{"train_loss": 5.736958980560303, "global_step": 0, "epoch": 0} {"train_loss": 5.71656608581543, "global_step": 1, "epoch": 0} {"train_loss": 5.7620744705200195, "global_step": 2, "epoch": 0} {"train_loss": 5.719610691070557, "global_step": 3, "epoch": 0} {"train_loss": 5.694396018981934, "global_step": 4, "epoch": 0} {"train_loss": 5.699533462524414, "global_step": 5, "epoch": 0} {"train_loss": 5.669809818267822, "global_step": 6, "epoch": 0} {"train_loss": 5.643962383270264, "global_step": 7, "epoch": 0} {"train_loss": 5.7003302574157715, "global_step": 8, "epoch": 0} {"train_loss": 5.5641326904296875, "global_step": 9, "epoch": 0} {"train_loss": 5.607228755950928, "global_step": 10, "epoch": 0} {"train_loss": 5.6228461265563965, "global_step": 11, "epoch": 0} {"train_loss": 5.639288425445557, "global_step": 12, "epoch": 0} {"train_loss": 5.604483604431152, "global_step": 13, "epoch": 0} {"train_loss": 5.510524272918701, "global_step": 14, "epoch": 0} {"train_loss": 5.576995372772217, "global_step": 15, "epoch": 0} {"train_loss": 5.587479591369629, "global_step": 16, "epoch": 0} {"train_loss": 5.460461616516113, "global_step": 17, "epoch": 0} {"train_loss": 5.5133795738220215, "global_step": 18, "epoch": 0} {"train_loss": 5.462527275085449, "global_step": 19, "epoch": 0} {"train_loss": 5.439237117767334, "global_step": 20, "epoch": 0} {"train_loss": 5.4164652824401855, "global_step": 21, "epoch": 0} {"train_loss": 5.447843074798584, "global_step": 22, "epoch": 0} {"train_loss": 5.384339332580566, "global_step": 23, "epoch": 0} {"train_loss": 5.321449279785156, "global_step": 24, "epoch": 0} {"train_loss": 5.326919078826904, "global_step": 25, "epoch": 0} {"train_loss": 5.247729778289795, "global_step": 26, "epoch": 0} {"train_loss": 5.212467193603516, "global_step": 27, "epoch": 0} {"train_loss": 5.1577467918396, "global_step": 28, "epoch": 0} {"train_loss": 5.040174961090088, "global_step": 29, "epoch": 0} {"train_loss": 5.060283184051514, "global_step": 30, "epoch": 0} {"train_loss": 4.978970527648926, "global_step": 31, "epoch": 0} {"train_loss": 4.907073974609375, "global_step": 32, "epoch": 0} {"train_loss": 4.800963878631592, "global_step": 33, "epoch": 0} {"train_loss": 4.710259914398193, "global_step": 34, "epoch": 0} {"train_loss": 4.620222568511963, "global_step": 35, "epoch": 0} {"train_loss": 4.4766764640808105, "global_step": 36, "epoch": 0} {"train_loss": 4.328598976135254, "global_step": 37, "epoch": 0} {"train_loss": 4.242432117462158, "global_step": 38, "epoch": 0} {"train_loss": 4.068613529205322, "global_step": 39, "epoch": 0} {"train_loss": 3.9017999172210693, "global_step": 40, "epoch": 0} {"train_loss": 3.7259833812713623, "global_step": 41, "epoch": 0} {"train_loss": 3.537712812423706, "global_step": 42, "epoch": 0} {"train_loss": 3.331028699874878, "global_step": 43, "epoch": 0} {"train_loss": 3.2378273010253906, "global_step": 44, "epoch": 0} {"train_loss": 2.9970669746398926, "global_step": 45, "epoch": 0} {"train_loss": 2.7047832012176514, "global_step": 46, "epoch": 0} {"train_loss": 2.9772427082061768, "global_step": 47, "epoch": 0} {"train_loss": 2.707545518875122, "global_step": 48, "epoch": 0} {"train_loss": 2.538024663925171, "global_step": 49, "epoch": 0} {"train_loss": 2.2010560035705566, "global_step": 50, "epoch": 0} {"train_loss": 2.212515354156494, "global_step": 51, "epoch": 0} {"train_loss": 2.1012966632843018, "global_step": 52, "epoch": 0} {"train_loss": 1.883592963218689, "global_step": 53, "epoch": 0} {"train_loss": 1.6456588506698608, "global_step": 54, "epoch": 0} {"train_loss": 1.6005362272262573, "global_step": 55, "epoch": 0} {"train_loss": 1.446663737297058, "global_step": 56, "epoch": 0} {"train_loss": 1.4314358234405518, "global_step": 57, "epoch": 0} {"train_loss": 1.2584418058395386, "global_step": 58, "epoch": 0} {"train_loss": 1.4174555540084839, "global_step": 59, "epoch": 0} {"train_loss": 1.2564549446105957, "global_step": 60, "epoch": 0} {"train_loss": 1.2233853340148926, "global_step": 61, "epoch": 0} {"train_loss": 1.001904010772705, "global_step": 62, "epoch": 0} {"train_loss": 1.1137773990631104, "global_step": 63, "epoch": 0} {"train_loss": 0.7914817333221436, "global_step": 64, "epoch": 0} {"train_loss": 0.6831570267677307, "global_step": 65, "epoch": 0} {"train_loss": 0.8035978674888611, "global_step": 66, "epoch": 0} {"train_loss": 0.6655568480491638, "global_step": 67, "epoch": 0} {"train_loss": 0.8647875189781189, "global_step": 68, "epoch": 0} {"train_loss": 0.5679526925086975, "global_step": 69, "epoch": 0} {"train_loss": 0.40569669008255005, "global_step": 70, "epoch": 0} {"train_loss": 0.6225261092185974, "global_step": 71, "epoch": 0} {"train_loss": 0.618179440498352, "global_step": 72, "epoch": 0} {"train_loss": 0.3161129951477051, "global_step": 73, "epoch": 0} {"train_loss": 0.31708571314811707, "global_step": 74, "epoch": 0} {"train_loss": 0.34814342856407166, "global_step": 75, "epoch": 0} {"train_loss": 0.3208047151565552, "global_step": 76, "epoch": 0} {"train_loss": 0.07712607830762863, "global_step": 77, "epoch": 0} {"train_loss": 0.10817413777112961, "global_step": 78, "epoch": 0} {"train_loss": -0.027730876579880714, "global_step": 79, "epoch": 0} {"train_loss": 0.024855250492691994, "global_step": 80, "epoch": 0} {"train_loss": -0.045291468501091, "global_step": 81, "epoch": 0} {"train_loss": 3.281361535371068, "global_step": 82, "epoch": 0, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 0.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.0, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.0, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.0, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 0.0, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.0, "train/mean_score": 0.0, "test/mean_score": 0.0, "val_loss": 26523278.0} {"train_loss": 0.16347356140613556, "global_step": 83, "epoch": 1} {"train_loss": -0.297528475522995, "global_step": 84, "epoch": 1} {"train_loss": -0.1840350180864334, "global_step": 85, "epoch": 1} {"train_loss": 0.046098534017801285, "global_step": 86, "epoch": 1} {"train_loss": -0.17644163966178894, "global_step": 87, "epoch": 1} {"train_loss": -0.13597983121871948, "global_step": 88, "epoch": 1} {"train_loss": -0.4989403784275055, "global_step": 89, "epoch": 1} {"train_loss": -0.5720109343528748, "global_step": 90, "epoch": 1} {"train_loss": -0.41890421509742737, "global_step": 91, "epoch": 1} {"train_loss": -0.6321880221366882, "global_step": 92, "epoch": 1} {"train_loss": -0.5728775262832642, "global_step": 93, "epoch": 1} {"train_loss": -0.5360209345817566, "global_step": 94, "epoch": 1} {"train_loss": -0.9560322761535645, "global_step": 95, "epoch": 1} {"train_loss": -0.8921911120414734, "global_step": 96, "epoch": 1} {"train_loss": -0.5665821433067322, "global_step": 97, "epoch": 1} {"train_loss": -0.5307345390319824, "global_step": 98, "epoch": 1} {"train_loss": -0.8891260027885437, "global_step": 99, "epoch": 1} {"train_loss": -0.8435810208320618, "global_step": 100, "epoch": 1} {"train_loss": -1.0840743780136108, "global_step": 101, "epoch": 1} {"train_loss": -1.1291500329971313, "global_step": 102, "epoch": 1} {"train_loss": -1.2392537593841553, "global_step": 103, "epoch": 1} {"train_loss": -1.0657018423080444, "global_step": 104, "epoch": 1} {"train_loss": -1.2963364124298096, "global_step": 105, "epoch": 1} {"train_loss": -1.3579699993133545, "global_step": 106, "epoch": 1} {"train_loss": -1.094484567642212, "global_step": 107, "epoch": 1} {"train_loss": -1.33470618724823, "global_step": 108, "epoch": 1} {"train_loss": -1.5575097799301147, "global_step": 109, "epoch": 1} {"train_loss": -1.2578890323638916, "global_step": 110, "epoch": 1} {"train_loss": -1.5155572891235352, "global_step": 111, "epoch": 1} {"train_loss": -1.2258317470550537, "global_step": 112, "epoch": 1} {"train_loss": -1.451870322227478, "global_step": 113, "epoch": 1} {"train_loss": -1.422573447227478, "global_step": 114, "epoch": 1} {"train_loss": -1.4615707397460938, "global_step": 115, "epoch": 1} {"train_loss": -1.480276107788086, "global_step": 116, "epoch": 1} {"train_loss": -1.7354274988174438, "global_step": 117, "epoch": 1} {"train_loss": -1.7096484899520874, "global_step": 118, "epoch": 1} {"train_loss": -1.6677433252334595, "global_step": 119, "epoch": 1} {"train_loss": -1.6609026193618774, "global_step": 120, "epoch": 1} {"train_loss": -1.9388684034347534, "global_step": 121, "epoch": 1} {"train_loss": -2.046160936355591, "global_step": 122, "epoch": 1} {"train_loss": -1.603786826133728, "global_step": 123, "epoch": 1} {"train_loss": -1.9972803592681885, "global_step": 124, "epoch": 1} {"train_loss": -1.7041454315185547, "global_step": 125, "epoch": 1} {"train_loss": -2.053601026535034, "global_step": 126, "epoch": 1} {"train_loss": -2.1093318462371826, "global_step": 127, "epoch": 1} {"train_loss": -1.8338373899459839, "global_step": 128, "epoch": 1} {"train_loss": -2.2195398807525635, "global_step": 129, "epoch": 1} {"train_loss": -2.245208263397217, "global_step": 130, "epoch": 1} {"train_loss": -2.295109987258911, "global_step": 131, "epoch": 1} {"train_loss": -2.2311599254608154, "global_step": 132, "epoch": 1} {"train_loss": -2.4173474311828613, "global_step": 133, "epoch": 1} {"train_loss": -2.2517566680908203, "global_step": 134, "epoch": 1} {"train_loss": -2.363579750061035, "global_step": 135, "epoch": 1} {"train_loss": -2.365036964416504, "global_step": 136, "epoch": 1} {"train_loss": -2.498894453048706, "global_step": 137, "epoch": 1} {"train_loss": -2.1998393535614014, "global_step": 138, "epoch": 1} {"train_loss": -2.647784948348999, "global_step": 139, "epoch": 1} {"train_loss": -2.34232759475708, "global_step": 140, "epoch": 1} {"train_loss": -2.4722137451171875, "global_step": 141, "epoch": 1} {"train_loss": -2.5402519702911377, "global_step": 142, "epoch": 1} {"train_loss": -2.6088221073150635, "global_step": 143, "epoch": 1} {"train_loss": -2.349841594696045, "global_step": 144, "epoch": 1} {"train_loss": -2.6443498134613037, "global_step": 145, "epoch": 1} {"train_loss": -2.624370574951172, "global_step": 146, "epoch": 1} {"train_loss": -3.124140501022339, "global_step": 147, "epoch": 1} {"train_loss": -2.7620818614959717, "global_step": 148, "epoch": 1} {"train_loss": -3.3775887489318848, "global_step": 149, "epoch": 1} {"train_loss": -3.0380351543426514, "global_step": 150, "epoch": 1} {"train_loss": -3.166180372238159, "global_step": 151, "epoch": 1} {"train_loss": -3.0682194232940674, "global_step": 152, "epoch": 1} {"train_loss": -2.9268834590911865, "global_step": 153, "epoch": 1} {"train_loss": -2.911458969116211, "global_step": 154, "epoch": 1} {"train_loss": -2.968770742416382, "global_step": 155, "epoch": 1} {"train_loss": -3.0927045345306396, "global_step": 156, "epoch": 1} {"train_loss": -3.5846047401428223, "global_step": 157, "epoch": 1} {"train_loss": -3.54681658744812, "global_step": 158, "epoch": 1} {"train_loss": -3.1031484603881836, "global_step": 159, "epoch": 1} {"train_loss": -2.9251930713653564, "global_step": 160, "epoch": 1} {"train_loss": -3.487920045852661, "global_step": 161, "epoch": 1} {"train_loss": -3.66276478767395, "global_step": 162, "epoch": 1} {"train_loss": -3.486783742904663, "global_step": 163, "epoch": 1} {"train_loss": -3.5024261474609375, "global_step": 164, "epoch": 1} {"train_loss": -1.8839824192046402, "global_step": 165, "epoch": 1, "val_loss": 20234292.0} {"train_loss": -3.488797903060913, "global_step": 166, "epoch": 2} {"train_loss": -3.559619188308716, "global_step": 167, "epoch": 2} {"train_loss": -3.4879531860351562, "global_step": 168, "epoch": 2} {"train_loss": -3.833918333053589, "global_step": 169, "epoch": 2} {"train_loss": -3.4765050411224365, "global_step": 170, "epoch": 2} {"train_loss": -3.45926833152771, "global_step": 171, "epoch": 2} {"train_loss": -3.7407166957855225, "global_step": 172, "epoch": 2} {"train_loss": -3.502763032913208, "global_step": 173, "epoch": 2} {"train_loss": -3.9596290588378906, "global_step": 174, "epoch": 2} {"train_loss": -4.062737464904785, "global_step": 175, "epoch": 2} {"train_loss": -3.543914556503296, "global_step": 176, "epoch": 2} {"train_loss": -4.320113182067871, "global_step": 177, "epoch": 2} {"train_loss": -3.8386707305908203, "global_step": 178, "epoch": 2} {"train_loss": -4.315290927886963, "global_step": 179, "epoch": 2} {"train_loss": -4.50949239730835, "global_step": 180, "epoch": 2} {"train_loss": -4.14003324508667, "global_step": 181, "epoch": 2} {"train_loss": -4.067769527435303, "global_step": 182, "epoch": 2} {"train_loss": -4.482964992523193, "global_step": 183, "epoch": 2} {"train_loss": -4.5073771476745605, "global_step": 184, "epoch": 2} {"train_loss": -4.141049385070801, "global_step": 185, "epoch": 2} {"train_loss": -4.664222240447998, "global_step": 186, "epoch": 2} {"train_loss": -4.981025218963623, "global_step": 187, "epoch": 2} {"train_loss": -4.038976192474365, "global_step": 188, "epoch": 2} {"train_loss": -4.670980930328369, "global_step": 189, "epoch": 2} {"train_loss": -4.599591255187988, "global_step": 190, "epoch": 2} {"train_loss": -4.294175624847412, "global_step": 191, "epoch": 2} {"train_loss": -4.74044942855835, "global_step": 192, "epoch": 2} {"train_loss": -4.673286437988281, "global_step": 193, "epoch": 2} {"train_loss": -4.816579818725586, "global_step": 194, "epoch": 2} {"train_loss": -4.866641998291016, "global_step": 195, "epoch": 2} {"train_loss": -4.9280686378479, "global_step": 196, "epoch": 2} {"train_loss": -5.092643737792969, "global_step": 197, "epoch": 2} {"train_loss": -4.7256083488464355, "global_step": 198, "epoch": 2} {"train_loss": -4.983392238616943, "global_step": 199, "epoch": 2} {"train_loss": -5.247251033782959, "global_step": 200, "epoch": 2} {"train_loss": -4.817037582397461, "global_step": 201, "epoch": 2} {"train_loss": -4.5449066162109375, "global_step": 202, "epoch": 2} {"train_loss": -4.946573257446289, "global_step": 203, "epoch": 2} {"train_loss": -4.991574287414551, "global_step": 204, "epoch": 2} {"train_loss": -4.592307090759277, "global_step": 205, "epoch": 2} {"train_loss": -4.359903335571289, "global_step": 206, "epoch": 2} {"train_loss": -4.983523845672607, "global_step": 207, "epoch": 2} {"train_loss": -5.53792142868042, "global_step": 208, "epoch": 2} {"train_loss": -5.136178493499756, "global_step": 209, "epoch": 2} {"train_loss": -5.248623847961426, "global_step": 210, "epoch": 2} {"train_loss": -5.603679180145264, "global_step": 211, "epoch": 2} {"train_loss": -5.248854160308838, "global_step": 212, "epoch": 2} {"train_loss": -5.202224254608154, "global_step": 213, "epoch": 2} {"train_loss": -4.633695125579834, "global_step": 214, "epoch": 2} {"train_loss": -5.334878444671631, "global_step": 215, "epoch": 2} {"train_loss": -5.454220771789551, "global_step": 216, "epoch": 2} {"train_loss": -5.187795162200928, "global_step": 217, "epoch": 2} {"train_loss": -5.686246395111084, "global_step": 218, "epoch": 2} {"train_loss": -5.362339019775391, "global_step": 219, "epoch": 2} {"train_loss": -5.492605209350586, "global_step": 220, "epoch": 2} {"train_loss": -5.258874416351318, "global_step": 221, "epoch": 2} {"train_loss": -5.238292694091797, "global_step": 222, "epoch": 2} {"train_loss": -5.2455339431762695, "global_step": 223, "epoch": 2} {"train_loss": -5.411601543426514, "global_step": 224, "epoch": 2} {"train_loss": -5.455422878265381, "global_step": 225, "epoch": 2} {"train_loss": -5.819943904876709, "global_step": 226, "epoch": 2} {"train_loss": -5.900252819061279, "global_step": 227, "epoch": 2} {"train_loss": -5.590345859527588, "global_step": 228, "epoch": 2} {"train_loss": -5.76223611831665, "global_step": 229, "epoch": 2} {"train_loss": -6.185096740722656, "global_step": 230, "epoch": 2} {"train_loss": -5.577355861663818, "global_step": 231, "epoch": 2} {"train_loss": -6.531198024749756, "global_step": 232, "epoch": 2} {"train_loss": -5.938549995422363, "global_step": 233, "epoch": 2} {"train_loss": -5.763294219970703, "global_step": 234, "epoch": 2} {"train_loss": -5.782286643981934, "global_step": 235, "epoch": 2} {"train_loss": -5.6617913246154785, "global_step": 236, "epoch": 2} {"train_loss": -6.444640636444092, "global_step": 237, "epoch": 2} {"train_loss": -5.559779167175293, "global_step": 238, "epoch": 2} {"train_loss": -6.069427967071533, "global_step": 239, "epoch": 2} {"train_loss": -6.437251567840576, "global_step": 240, "epoch": 2} {"train_loss": -5.953137397766113, "global_step": 241, "epoch": 2} {"train_loss": -5.760448932647705, "global_step": 242, "epoch": 2} {"train_loss": -6.214760780334473, "global_step": 243, "epoch": 2} {"train_loss": -5.635955333709717, "global_step": 244, "epoch": 2} {"train_loss": -6.1116743087768555, "global_step": 245, "epoch": 2} {"train_loss": -5.991672515869141, "global_step": 246, "epoch": 2} {"train_loss": -6.083964824676514, "global_step": 247, "epoch": 2} {"train_loss": -5.021459412862019, "global_step": 248, "epoch": 2, "val_loss": 16516012.0} {"train_loss": -6.450387001037598, "global_step": 249, "epoch": 3} {"train_loss": -6.277089595794678, "global_step": 250, "epoch": 3} {"train_loss": -5.99481725692749, "global_step": 251, "epoch": 3} {"train_loss": -6.2353973388671875, "global_step": 252, "epoch": 3} {"train_loss": -6.3404860496521, "global_step": 253, "epoch": 3} {"train_loss": -6.000674724578857, "global_step": 254, "epoch": 3} {"train_loss": -6.412147045135498, "global_step": 255, "epoch": 3} {"train_loss": -6.218980312347412, "global_step": 256, "epoch": 3} {"train_loss": -6.88318395614624, "global_step": 257, "epoch": 3} {"train_loss": -7.150398254394531, "global_step": 258, "epoch": 3} {"train_loss": -5.477867126464844, "global_step": 259, "epoch": 3} {"train_loss": -7.303230285644531, "global_step": 260, "epoch": 3} {"train_loss": -6.456686496734619, "global_step": 261, "epoch": 3} {"train_loss": -6.24389123916626, "global_step": 262, "epoch": 3} {"train_loss": -6.787257671356201, "global_step": 263, "epoch": 3} {"train_loss": -6.8305840492248535, "global_step": 264, "epoch": 3} {"train_loss": -6.274066925048828, "global_step": 265, "epoch": 3} {"train_loss": -7.241925239562988, "global_step": 266, "epoch": 3} {"train_loss": -6.093277931213379, "global_step": 267, "epoch": 3} {"train_loss": -7.278388500213623, "global_step": 268, "epoch": 3} {"train_loss": -7.352006435394287, "global_step": 269, "epoch": 3} {"train_loss": -6.840943336486816, "global_step": 270, "epoch": 3} {"train_loss": -7.0675506591796875, "global_step": 271, "epoch": 3} {"train_loss": -7.46907901763916, "global_step": 272, "epoch": 3} {"train_loss": -7.164992809295654, "global_step": 273, "epoch": 3} {"train_loss": -7.516148567199707, "global_step": 274, "epoch": 3} {"train_loss": -7.264733791351318, "global_step": 275, "epoch": 3} {"train_loss": -7.44576358795166, "global_step": 276, "epoch": 3} {"train_loss": -7.033890724182129, "global_step": 277, "epoch": 3} {"train_loss": -7.542733669281006, "global_step": 278, "epoch": 3} {"train_loss": -7.5959296226501465, "global_step": 279, "epoch": 3} {"train_loss": -7.33242654800415, "global_step": 280, "epoch": 3} {"train_loss": -7.328592777252197, "global_step": 281, "epoch": 3} {"train_loss": -8.007067680358887, "global_step": 282, "epoch": 3} {"train_loss": -7.874487400054932, "global_step": 283, "epoch": 3} {"train_loss": -7.695059299468994, "global_step": 284, "epoch": 3} {"train_loss": -7.881994724273682, "global_step": 285, "epoch": 3} {"train_loss": -7.76936674118042, "global_step": 286, "epoch": 3} {"train_loss": -8.094231605529785, "global_step": 287, "epoch": 3} {"train_loss": -8.239466667175293, "global_step": 288, "epoch": 3} {"train_loss": -7.547791481018066, "global_step": 289, "epoch": 3} {"train_loss": -7.391887187957764, "global_step": 290, "epoch": 3} {"train_loss": -8.44946575164795, "global_step": 291, "epoch": 3} {"train_loss": -8.859990119934082, "global_step": 292, "epoch": 3} {"train_loss": -8.878655433654785, "global_step": 293, "epoch": 3} {"train_loss": -8.525717735290527, "global_step": 294, "epoch": 3} {"train_loss": -7.86825704574585, "global_step": 295, "epoch": 3} {"train_loss": -8.340103149414062, "global_step": 296, "epoch": 3} {"train_loss": -8.799680709838867, "global_step": 297, "epoch": 3} {"train_loss": -8.274471282958984, "global_step": 298, "epoch": 3} {"train_loss": -8.730441093444824, "global_step": 299, "epoch": 3} {"train_loss": -8.590605735778809, "global_step": 300, "epoch": 3} {"train_loss": -8.47697925567627, "global_step": 301, "epoch": 3} {"train_loss": -8.975646018981934, "global_step": 302, "epoch": 3} {"train_loss": -8.759364128112793, "global_step": 303, "epoch": 3} {"train_loss": -8.931475639343262, "global_step": 304, "epoch": 3} {"train_loss": -9.429778099060059, "global_step": 305, "epoch": 3} {"train_loss": -8.759221076965332, "global_step": 306, "epoch": 3} {"train_loss": -8.912163734436035, "global_step": 307, "epoch": 3} {"train_loss": -9.018539428710938, "global_step": 308, "epoch": 3} {"train_loss": -8.74503231048584, "global_step": 309, "epoch": 3} {"train_loss": -9.197072982788086, "global_step": 310, "epoch": 3} {"train_loss": -9.960376739501953, "global_step": 311, "epoch": 3} {"train_loss": -9.20964527130127, "global_step": 312, "epoch": 3} {"train_loss": -9.318541526794434, "global_step": 313, "epoch": 3} {"train_loss": -9.530122756958008, "global_step": 314, "epoch": 3} {"train_loss": -9.47057056427002, "global_step": 315, "epoch": 3} {"train_loss": -9.481950759887695, "global_step": 316, "epoch": 3} {"train_loss": -9.626298904418945, "global_step": 317, "epoch": 3} {"train_loss": -9.567351341247559, "global_step": 318, "epoch": 3} {"train_loss": -9.797965049743652, "global_step": 319, "epoch": 3} {"train_loss": -10.176108360290527, "global_step": 320, "epoch": 3} {"train_loss": -10.256624221801758, "global_step": 321, "epoch": 3} {"train_loss": -9.614964485168457, "global_step": 322, "epoch": 3} {"train_loss": -9.566985130310059, "global_step": 323, "epoch": 3} {"train_loss": -9.98318099975586, "global_step": 324, "epoch": 3} {"train_loss": -10.641753196716309, "global_step": 325, "epoch": 3} {"train_loss": -10.21626091003418, "global_step": 326, "epoch": 3} {"train_loss": -9.639554023742676, "global_step": 327, "epoch": 3} {"train_loss": -9.908953666687012, "global_step": 328, "epoch": 3} {"train_loss": -9.982539176940918, "global_step": 329, "epoch": 3} {"train_loss": -10.080877304077148, "global_step": 330, "epoch": 3} {"train_loss": -8.117176096123385, "global_step": 331, "epoch": 3, "val_loss": 13851053.0} {"train_loss": -10.610185623168945, "global_step": 332, "epoch": 4} {"train_loss": -10.269757270812988, "global_step": 333, "epoch": 4} {"train_loss": -10.375900268554688, "global_step": 334, "epoch": 4} {"train_loss": -10.038566589355469, "global_step": 335, "epoch": 4} {"train_loss": -9.914397239685059, "global_step": 336, "epoch": 4} {"train_loss": -10.559306144714355, "global_step": 337, "epoch": 4} {"train_loss": -10.111808776855469, "global_step": 338, "epoch": 4} {"train_loss": -10.483390808105469, "global_step": 339, "epoch": 4} {"train_loss": -10.644271850585938, "global_step": 340, "epoch": 4} {"train_loss": -10.816923141479492, "global_step": 341, "epoch": 4} {"train_loss": -10.685256004333496, "global_step": 342, "epoch": 4} {"train_loss": -11.004294395446777, "global_step": 343, "epoch": 4} {"train_loss": -11.071969985961914, "global_step": 344, "epoch": 4} {"train_loss": -10.507372856140137, "global_step": 345, "epoch": 4} {"train_loss": -10.712322235107422, "global_step": 346, "epoch": 4} {"train_loss": -10.545235633850098, "global_step": 347, "epoch": 4} {"train_loss": -10.955191612243652, "global_step": 348, "epoch": 4} {"train_loss": -10.874275207519531, "global_step": 349, "epoch": 4} {"train_loss": -11.004145622253418, "global_step": 350, "epoch": 4} {"train_loss": -11.29580020904541, "global_step": 351, "epoch": 4} {"train_loss": -10.908365249633789, "global_step": 352, "epoch": 4} {"train_loss": -11.138312339782715, "global_step": 353, "epoch": 4} {"train_loss": -11.415701866149902, "global_step": 354, "epoch": 4} {"train_loss": -11.14867877960205, "global_step": 355, "epoch": 4} {"train_loss": -11.368329048156738, "global_step": 356, "epoch": 4} {"train_loss": -11.765477180480957, "global_step": 357, "epoch": 4} {"train_loss": -11.462080955505371, "global_step": 358, "epoch": 4} {"train_loss": -11.442657470703125, "global_step": 359, "epoch": 4} {"train_loss": -11.313654899597168, "global_step": 360, "epoch": 4} {"train_loss": -11.479535102844238, "global_step": 361, "epoch": 4} {"train_loss": -11.888827323913574, "global_step": 362, "epoch": 4} {"train_loss": -11.243709564208984, "global_step": 363, "epoch": 4} {"train_loss": -11.925033569335938, "global_step": 364, "epoch": 4} {"train_loss": -11.355137825012207, "global_step": 365, "epoch": 4} {"train_loss": -11.469833374023438, "global_step": 366, "epoch": 4} {"train_loss": -11.55595588684082, "global_step": 367, "epoch": 4} {"train_loss": -10.994231224060059, "global_step": 368, "epoch": 4} {"train_loss": -12.183821678161621, "global_step": 369, "epoch": 4} {"train_loss": -11.125432014465332, "global_step": 370, "epoch": 4} {"train_loss": -11.448661804199219, "global_step": 371, "epoch": 4} {"train_loss": -11.860570907592773, "global_step": 372, "epoch": 4} {"train_loss": -11.815791130065918, "global_step": 373, "epoch": 4} {"train_loss": -11.885024070739746, "global_step": 374, "epoch": 4} {"train_loss": -11.811442375183105, "global_step": 375, "epoch": 4} {"train_loss": -11.643888473510742, "global_step": 376, "epoch": 4} {"train_loss": -11.295547485351562, "global_step": 377, "epoch": 4} {"train_loss": -11.897119522094727, "global_step": 378, "epoch": 4} {"train_loss": -11.983955383300781, "global_step": 379, "epoch": 4} {"train_loss": -11.886923789978027, "global_step": 380, "epoch": 4} {"train_loss": -12.013920783996582, "global_step": 381, "epoch": 4} {"train_loss": -11.693963050842285, "global_step": 382, "epoch": 4} {"train_loss": -11.870162963867188, "global_step": 383, "epoch": 4} {"train_loss": -11.803317070007324, "global_step": 384, "epoch": 4} {"train_loss": -11.368534088134766, "global_step": 385, "epoch": 4} {"train_loss": -12.036813735961914, "global_step": 386, "epoch": 4} {"train_loss": -12.287202835083008, "global_step": 387, "epoch": 4} {"train_loss": -11.3599214553833, "global_step": 388, "epoch": 4} {"train_loss": -11.665827751159668, "global_step": 389, "epoch": 4} {"train_loss": -12.08215618133545, "global_step": 390, "epoch": 4} {"train_loss": -12.172327041625977, "global_step": 391, "epoch": 4} {"train_loss": -12.00053882598877, "global_step": 392, "epoch": 4} {"train_loss": -11.874357223510742, "global_step": 393, "epoch": 4} {"train_loss": -12.066764831542969, "global_step": 394, "epoch": 4} {"train_loss": -12.028389930725098, "global_step": 395, "epoch": 4} {"train_loss": -11.79220962524414, "global_step": 396, "epoch": 4} {"train_loss": -12.001906394958496, "global_step": 397, "epoch": 4} {"train_loss": -11.874902725219727, "global_step": 398, "epoch": 4} {"train_loss": -12.166945457458496, "global_step": 399, "epoch": 4} {"train_loss": -12.514033317565918, "global_step": 400, "epoch": 4} {"train_loss": -12.08518123626709, "global_step": 401, "epoch": 4} {"train_loss": -11.999436378479004, "global_step": 402, "epoch": 4} {"train_loss": -12.47201156616211, "global_step": 403, "epoch": 4} {"train_loss": -11.82763671875, "global_step": 404, "epoch": 4} {"train_loss": -12.370932579040527, "global_step": 405, "epoch": 4} {"train_loss": -11.984855651855469, "global_step": 406, "epoch": 4} {"train_loss": -12.148040771484375, "global_step": 407, "epoch": 4} {"train_loss": -12.149580955505371, "global_step": 408, "epoch": 4} {"train_loss": -12.067931175231934, "global_step": 409, "epoch": 4} {"train_loss": -12.212059020996094, "global_step": 410, "epoch": 4} {"train_loss": -12.228133201599121, "global_step": 411, "epoch": 4} {"train_loss": -12.461697578430176, "global_step": 412, "epoch": 4} {"train_loss": -12.583648681640625, "global_step": 413, "epoch": 4} {"train_loss": -11.517750406839761, "global_step": 414, "epoch": 4, "val_loss": 14230494.0} {"train_loss": -12.0811185836792, "global_step": 415, "epoch": 5} {"train_loss": -12.131091117858887, "global_step": 416, "epoch": 5} {"train_loss": -12.412823677062988, "global_step": 417, "epoch": 5} {"train_loss": -12.430700302124023, "global_step": 418, "epoch": 5} {"train_loss": -12.78021240234375, "global_step": 419, "epoch": 5} {"train_loss": -12.520418167114258, "global_step": 420, "epoch": 5} {"train_loss": -12.025530815124512, "global_step": 421, "epoch": 5} {"train_loss": -12.297385215759277, "global_step": 422, "epoch": 5} {"train_loss": -12.518332481384277, "global_step": 423, "epoch": 5} {"train_loss": -12.494522094726562, "global_step": 424, "epoch": 5} {"train_loss": -12.620501518249512, "global_step": 425, "epoch": 5} {"train_loss": -12.597477912902832, "global_step": 426, "epoch": 5} {"train_loss": -12.52283763885498, "global_step": 427, "epoch": 5} {"train_loss": -12.625365257263184, "global_step": 428, "epoch": 5} {"train_loss": -12.374464988708496, "global_step": 429, "epoch": 5} {"train_loss": -12.606767654418945, "global_step": 430, "epoch": 5} {"train_loss": -12.232266426086426, "global_step": 431, "epoch": 5} {"train_loss": -12.74555492401123, "global_step": 432, "epoch": 5} {"train_loss": -12.582079887390137, "global_step": 433, "epoch": 5} {"train_loss": -12.68399715423584, "global_step": 434, "epoch": 5} {"train_loss": -12.836023330688477, "global_step": 435, "epoch": 5} {"train_loss": -12.34002685546875, "global_step": 436, "epoch": 5} {"train_loss": -12.806190490722656, "global_step": 437, "epoch": 5} {"train_loss": -13.274014472961426, "global_step": 438, "epoch": 5} {"train_loss": -12.586215019226074, "global_step": 439, "epoch": 5} {"train_loss": -12.8953275680542, "global_step": 440, "epoch": 5} {"train_loss": -13.205474853515625, "global_step": 441, "epoch": 5} {"train_loss": -12.427281379699707, "global_step": 442, "epoch": 5} {"train_loss": -12.740406036376953, "global_step": 443, "epoch": 5} {"train_loss": -12.782191276550293, "global_step": 444, "epoch": 5} {"train_loss": -12.772021293640137, "global_step": 445, "epoch": 5} {"train_loss": -13.17016315460205, "global_step": 446, "epoch": 5} {"train_loss": -12.796653747558594, "global_step": 447, "epoch": 5} {"train_loss": -12.773550987243652, "global_step": 448, "epoch": 5} {"train_loss": -13.143078804016113, "global_step": 449, "epoch": 5} {"train_loss": -12.631806373596191, "global_step": 450, "epoch": 5} {"train_loss": -12.966934204101562, "global_step": 451, "epoch": 5} {"train_loss": -12.849591255187988, "global_step": 452, "epoch": 5} {"train_loss": -12.53525447845459, "global_step": 453, "epoch": 5} {"train_loss": -13.114665031433105, "global_step": 454, "epoch": 5} {"train_loss": -12.901633262634277, "global_step": 455, "epoch": 5} {"train_loss": -12.820785522460938, "global_step": 456, "epoch": 5} {"train_loss": -12.726466178894043, "global_step": 457, "epoch": 5} {"train_loss": -12.487120628356934, "global_step": 458, "epoch": 5} {"train_loss": -13.256128311157227, "global_step": 459, "epoch": 5} {"train_loss": -12.445269584655762, "global_step": 460, "epoch": 5} {"train_loss": -12.93479061126709, "global_step": 461, "epoch": 5} {"train_loss": -13.097338676452637, "global_step": 462, "epoch": 5} {"train_loss": -13.036486625671387, "global_step": 463, "epoch": 5} {"train_loss": -13.044184684753418, "global_step": 464, "epoch": 5} {"train_loss": -13.249335289001465, "global_step": 465, "epoch": 5} {"train_loss": -13.156195640563965, "global_step": 466, "epoch": 5} {"train_loss": -12.858325004577637, "global_step": 467, "epoch": 5} {"train_loss": -12.810633659362793, "global_step": 468, "epoch": 5} {"train_loss": -13.113051414489746, "global_step": 469, "epoch": 5} {"train_loss": -12.60124683380127, "global_step": 470, "epoch": 5} {"train_loss": -13.301230430603027, "global_step": 471, "epoch": 5} {"train_loss": -13.000338554382324, "global_step": 472, "epoch": 5} {"train_loss": -12.9629487991333, "global_step": 473, "epoch": 5} {"train_loss": -13.115002632141113, "global_step": 474, "epoch": 5} {"train_loss": -13.493097305297852, "global_step": 475, "epoch": 5} {"train_loss": -12.903413772583008, "global_step": 476, "epoch": 5} {"train_loss": -13.127171516418457, "global_step": 477, "epoch": 5} {"train_loss": -13.227084159851074, "global_step": 478, "epoch": 5} {"train_loss": -13.369067192077637, "global_step": 479, "epoch": 5} {"train_loss": -13.14066219329834, "global_step": 480, "epoch": 5} {"train_loss": -12.873797416687012, "global_step": 481, "epoch": 5} {"train_loss": -13.117575645446777, "global_step": 482, "epoch": 5} {"train_loss": -13.50097942352295, "global_step": 483, "epoch": 5} {"train_loss": -13.136201858520508, "global_step": 484, "epoch": 5} {"train_loss": -13.52527141571045, "global_step": 485, "epoch": 5} {"train_loss": -13.296754837036133, "global_step": 486, "epoch": 5} {"train_loss": -13.4009370803833, "global_step": 487, "epoch": 5} {"train_loss": -13.2767915725708, "global_step": 488, "epoch": 5} {"train_loss": -13.25139045715332, "global_step": 489, "epoch": 5} {"train_loss": -13.200297355651855, "global_step": 490, "epoch": 5} {"train_loss": -12.90421199798584, "global_step": 491, "epoch": 5} {"train_loss": -13.438821792602539, "global_step": 492, "epoch": 5} {"train_loss": -13.316021919250488, "global_step": 493, "epoch": 5} {"train_loss": -13.397189140319824, "global_step": 494, "epoch": 5} {"train_loss": -13.27957820892334, "global_step": 495, "epoch": 5} {"train_loss": -12.794966697692871, "global_step": 496, "epoch": 5} {"train_loss": -12.889147080570819, "global_step": 497, "epoch": 5, "val_loss": 10837706.0} {"train_loss": -12.900702476501465, "global_step": 498, "epoch": 6} {"train_loss": -13.069058418273926, "global_step": 499, "epoch": 6} {"train_loss": -13.307639122009277, "global_step": 500, "epoch": 6} {"train_loss": -13.624734878540039, "global_step": 501, "epoch": 6} {"train_loss": -14.083758354187012, "global_step": 502, "epoch": 6} {"train_loss": -13.392760276794434, "global_step": 503, "epoch": 6} {"train_loss": -13.421699523925781, "global_step": 504, "epoch": 6} {"train_loss": -13.896735191345215, "global_step": 505, "epoch": 6} {"train_loss": -13.455395698547363, "global_step": 506, "epoch": 6} {"train_loss": -13.142593383789062, "global_step": 507, "epoch": 6} {"train_loss": -13.223451614379883, "global_step": 508, "epoch": 6} {"train_loss": -13.2801513671875, "global_step": 509, "epoch": 6} {"train_loss": -13.414420127868652, "global_step": 510, "epoch": 6} {"train_loss": -13.234457969665527, "global_step": 511, "epoch": 6} {"train_loss": -13.26654052734375, "global_step": 512, "epoch": 6} {"train_loss": -13.52478313446045, "global_step": 513, "epoch": 6} {"train_loss": -13.171957969665527, "global_step": 514, "epoch": 6} {"train_loss": -13.842890739440918, "global_step": 515, "epoch": 6} {"train_loss": -13.147849082946777, "global_step": 516, "epoch": 6} {"train_loss": -13.197860717773438, "global_step": 517, "epoch": 6} {"train_loss": -13.068742752075195, "global_step": 518, "epoch": 6} {"train_loss": -13.395744323730469, "global_step": 519, "epoch": 6} {"train_loss": -13.158884048461914, "global_step": 520, "epoch": 6} {"train_loss": -13.598126411437988, "global_step": 521, "epoch": 6} {"train_loss": -13.266051292419434, "global_step": 522, "epoch": 6} {"train_loss": -13.097848892211914, "global_step": 523, "epoch": 6} {"train_loss": -13.331694602966309, "global_step": 524, "epoch": 6} {"train_loss": -13.529932022094727, "global_step": 525, "epoch": 6} {"train_loss": -13.810197830200195, "global_step": 526, "epoch": 6} {"train_loss": -13.488347053527832, "global_step": 527, "epoch": 6} {"train_loss": -13.550888061523438, "global_step": 528, "epoch": 6} {"train_loss": -13.36148738861084, "global_step": 529, "epoch": 6} {"train_loss": -13.413864135742188, "global_step": 530, "epoch": 6} {"train_loss": -13.363898277282715, "global_step": 531, "epoch": 6} {"train_loss": -13.542994499206543, "global_step": 532, "epoch": 6} {"train_loss": -13.0447998046875, "global_step": 533, "epoch": 6} {"train_loss": -13.238446235656738, "global_step": 534, "epoch": 6} {"train_loss": -13.323371887207031, "global_step": 535, "epoch": 6} {"train_loss": -13.548970222473145, "global_step": 536, "epoch": 6} {"train_loss": -13.521272659301758, "global_step": 537, "epoch": 6} {"train_loss": -13.495440483093262, "global_step": 538, "epoch": 6} {"train_loss": -13.309745788574219, "global_step": 539, "epoch": 6} {"train_loss": -13.55224609375, "global_step": 540, "epoch": 6} {"train_loss": -13.588065147399902, "global_step": 541, "epoch": 6} {"train_loss": -13.759332656860352, "global_step": 542, "epoch": 6} {"train_loss": -13.183067321777344, "global_step": 543, "epoch": 6} {"train_loss": -12.563925743103027, "global_step": 544, "epoch": 6} {"train_loss": -13.097439765930176, "global_step": 545, "epoch": 6} {"train_loss": -13.410552978515625, "global_step": 546, "epoch": 6} {"train_loss": -13.37682819366455, "global_step": 547, "epoch": 6} {"train_loss": -13.5721435546875, "global_step": 548, "epoch": 6} {"train_loss": -13.217554092407227, "global_step": 549, "epoch": 6} {"train_loss": -13.32282543182373, "global_step": 550, "epoch": 6} {"train_loss": -14.01507568359375, "global_step": 551, "epoch": 6} {"train_loss": -13.472220420837402, "global_step": 552, "epoch": 6} {"train_loss": -13.543174743652344, "global_step": 553, "epoch": 6} {"train_loss": -14.018739700317383, "global_step": 554, "epoch": 6} {"train_loss": -13.541186332702637, "global_step": 555, "epoch": 6} {"train_loss": -13.7991304397583, "global_step": 556, "epoch": 6} {"train_loss": -13.610635757446289, "global_step": 557, "epoch": 6} {"train_loss": -14.162692070007324, "global_step": 558, "epoch": 6} {"train_loss": -13.741253852844238, "global_step": 559, "epoch": 6} {"train_loss": -13.57230281829834, "global_step": 560, "epoch": 6} {"train_loss": -13.7360258102417, "global_step": 561, "epoch": 6} {"train_loss": -13.669776916503906, "global_step": 562, "epoch": 6} {"train_loss": -13.858154296875, "global_step": 563, "epoch": 6} {"train_loss": -13.634576797485352, "global_step": 564, "epoch": 6} {"train_loss": -13.742578506469727, "global_step": 565, "epoch": 6} {"train_loss": -13.23241901397705, "global_step": 566, "epoch": 6} {"train_loss": -14.073943138122559, "global_step": 567, "epoch": 6} {"train_loss": -13.720309257507324, "global_step": 568, "epoch": 6} {"train_loss": -13.75414752960205, "global_step": 569, "epoch": 6} {"train_loss": -13.552035331726074, "global_step": 570, "epoch": 6} {"train_loss": -13.74352741241455, "global_step": 571, "epoch": 6} {"train_loss": -13.698532104492188, "global_step": 572, "epoch": 6} {"train_loss": -13.955987930297852, "global_step": 573, "epoch": 6} {"train_loss": -13.301966667175293, "global_step": 574, "epoch": 6} {"train_loss": -13.633795738220215, "global_step": 575, "epoch": 6} {"train_loss": -13.775253295898438, "global_step": 576, "epoch": 6} {"train_loss": -13.744211196899414, "global_step": 577, "epoch": 6} {"train_loss": -13.750825881958008, "global_step": 578, "epoch": 6} {"train_loss": -13.633038520812988, "global_step": 579, "epoch": 6} {"train_loss": -13.474801810390979, "global_step": 580, "epoch": 6, "val_loss": 11364628.0} {"train_loss": -13.342737197875977, "global_step": 581, "epoch": 7} {"train_loss": -13.944543838500977, "global_step": 582, "epoch": 7} {"train_loss": -13.404767036437988, "global_step": 583, "epoch": 7} {"train_loss": -13.741485595703125, "global_step": 584, "epoch": 7} {"train_loss": -13.242715835571289, "global_step": 585, "epoch": 7} {"train_loss": -13.820355415344238, "global_step": 586, "epoch": 7} {"train_loss": -13.770329475402832, "global_step": 587, "epoch": 7} {"train_loss": -13.518292427062988, "global_step": 588, "epoch": 7} {"train_loss": -13.626306533813477, "global_step": 589, "epoch": 7} {"train_loss": -13.874342918395996, "global_step": 590, "epoch": 7} {"train_loss": -13.588104248046875, "global_step": 591, "epoch": 7} {"train_loss": -14.089194297790527, "global_step": 592, "epoch": 7} {"train_loss": -13.547021865844727, "global_step": 593, "epoch": 7} {"train_loss": -13.497355461120605, "global_step": 594, "epoch": 7} {"train_loss": -13.922205924987793, "global_step": 595, "epoch": 7} {"train_loss": -13.212356567382812, "global_step": 596, "epoch": 7} {"train_loss": -13.7981595993042, "global_step": 597, "epoch": 7} {"train_loss": -13.41336727142334, "global_step": 598, "epoch": 7} {"train_loss": -13.546259880065918, "global_step": 599, "epoch": 7} {"train_loss": -13.74186897277832, "global_step": 600, "epoch": 7} {"train_loss": -13.790417671203613, "global_step": 601, "epoch": 7} {"train_loss": -13.596376419067383, "global_step": 602, "epoch": 7} {"train_loss": -13.649520874023438, "global_step": 603, "epoch": 7} {"train_loss": -13.91922664642334, "global_step": 604, "epoch": 7} {"train_loss": -13.55322551727295, "global_step": 605, "epoch": 7} {"train_loss": -13.801520347595215, "global_step": 606, "epoch": 7} {"train_loss": -14.01712703704834, "global_step": 607, "epoch": 7} {"train_loss": -13.819476127624512, "global_step": 608, "epoch": 7} {"train_loss": -13.272333145141602, "global_step": 609, "epoch": 7} {"train_loss": -13.664265632629395, "global_step": 610, "epoch": 7} {"train_loss": -14.063014030456543, "global_step": 611, "epoch": 7} {"train_loss": -13.51383113861084, "global_step": 612, "epoch": 7} {"train_loss": -13.957423210144043, "global_step": 613, "epoch": 7} {"train_loss": -14.046801567077637, "global_step": 614, "epoch": 7} {"train_loss": -13.894553184509277, "global_step": 615, "epoch": 7} {"train_loss": -13.864778518676758, "global_step": 616, "epoch": 7} {"train_loss": -13.826690673828125, "global_step": 617, "epoch": 7} {"train_loss": -13.914108276367188, "global_step": 618, "epoch": 7} {"train_loss": -13.991671562194824, "global_step": 619, "epoch": 7} {"train_loss": -13.80634593963623, "global_step": 620, "epoch": 7} {"train_loss": -13.879040718078613, "global_step": 621, "epoch": 7} {"train_loss": -13.554181098937988, "global_step": 622, "epoch": 7} {"train_loss": -13.807687759399414, "global_step": 623, "epoch": 7} {"train_loss": -13.8419771194458, "global_step": 624, "epoch": 7} {"train_loss": -13.398462295532227, "global_step": 625, "epoch": 7} {"train_loss": -14.148836135864258, "global_step": 626, "epoch": 7} {"train_loss": -13.76646900177002, "global_step": 627, "epoch": 7} {"train_loss": -13.85709285736084, "global_step": 628, "epoch": 7} {"train_loss": -13.962554931640625, "global_step": 629, "epoch": 7} {"train_loss": -13.703991889953613, "global_step": 630, "epoch": 7} {"train_loss": -13.661234855651855, "global_step": 631, "epoch": 7} {"train_loss": -14.06082820892334, "global_step": 632, "epoch": 7} {"train_loss": -13.892669677734375, "global_step": 633, "epoch": 7} {"train_loss": -13.987067222595215, "global_step": 634, "epoch": 7} {"train_loss": -13.900494575500488, "global_step": 635, "epoch": 7} {"train_loss": -13.82395076751709, "global_step": 636, "epoch": 7} {"train_loss": -14.298235893249512, "global_step": 637, "epoch": 7} {"train_loss": -13.875317573547363, "global_step": 638, "epoch": 7} {"train_loss": -13.964312553405762, "global_step": 639, "epoch": 7} {"train_loss": -14.01129150390625, "global_step": 640, "epoch": 7} {"train_loss": -14.023759841918945, "global_step": 641, "epoch": 7} {"train_loss": -13.694750785827637, "global_step": 642, "epoch": 7} {"train_loss": -13.896466255187988, "global_step": 643, "epoch": 7} {"train_loss": -13.891322135925293, "global_step": 644, "epoch": 7} {"train_loss": -13.67551326751709, "global_step": 645, "epoch": 7} {"train_loss": -13.857355117797852, "global_step": 646, "epoch": 7} {"train_loss": -14.124099731445312, "global_step": 647, "epoch": 7} {"train_loss": -13.899426460266113, "global_step": 648, "epoch": 7} {"train_loss": -13.563261985778809, "global_step": 649, "epoch": 7} {"train_loss": -14.10192584991455, "global_step": 650, "epoch": 7} {"train_loss": -13.645003318786621, "global_step": 651, "epoch": 7} {"train_loss": -14.143686294555664, "global_step": 652, "epoch": 7} {"train_loss": -13.91345500946045, "global_step": 653, "epoch": 7} {"train_loss": -14.164898872375488, "global_step": 654, "epoch": 7} {"train_loss": -13.917718887329102, "global_step": 655, "epoch": 7} {"train_loss": -13.9186372756958, "global_step": 656, "epoch": 7} {"train_loss": -14.142621040344238, "global_step": 657, "epoch": 7} {"train_loss": -14.089080810546875, "global_step": 658, "epoch": 7} {"train_loss": -14.34473705291748, "global_step": 659, "epoch": 7} {"train_loss": -13.797162055969238, "global_step": 660, "epoch": 7} {"train_loss": -14.133819580078125, "global_step": 661, "epoch": 7} {"train_loss": -14.021588325500488, "global_step": 662, "epoch": 7} {"train_loss": -13.820226037358664, "global_step": 663, "epoch": 7, "val_loss": 10996907.0} {"train_loss": -13.22223949432373, "global_step": 664, "epoch": 8} {"train_loss": -13.423334121704102, "global_step": 665, "epoch": 8} {"train_loss": -14.337834358215332, "global_step": 666, "epoch": 8} {"train_loss": -13.927833557128906, "global_step": 667, "epoch": 8} {"train_loss": -13.666183471679688, "global_step": 668, "epoch": 8} {"train_loss": -14.139899253845215, "global_step": 669, "epoch": 8} {"train_loss": -13.548425674438477, "global_step": 670, "epoch": 8} {"train_loss": -13.851890563964844, "global_step": 671, "epoch": 8} {"train_loss": -14.331315994262695, "global_step": 672, "epoch": 8} {"train_loss": -13.513031005859375, "global_step": 673, "epoch": 8} {"train_loss": -13.831461906433105, "global_step": 674, "epoch": 8} {"train_loss": -13.687832832336426, "global_step": 675, "epoch": 8} {"train_loss": -13.900538444519043, "global_step": 676, "epoch": 8} {"train_loss": -13.739214897155762, "global_step": 677, "epoch": 8} {"train_loss": -13.80307674407959, "global_step": 678, "epoch": 8} {"train_loss": -14.264784812927246, "global_step": 679, "epoch": 8} {"train_loss": -13.766359329223633, "global_step": 680, "epoch": 8} {"train_loss": -14.313194274902344, "global_step": 681, "epoch": 8} {"train_loss": -13.847485542297363, "global_step": 682, "epoch": 8} {"train_loss": -14.286009788513184, "global_step": 683, "epoch": 8} {"train_loss": -14.045186042785645, "global_step": 684, "epoch": 8} {"train_loss": -13.899553298950195, "global_step": 685, "epoch": 8} {"train_loss": -14.09075927734375, "global_step": 686, "epoch": 8} {"train_loss": -14.363212585449219, "global_step": 687, "epoch": 8} {"train_loss": -14.2680082321167, "global_step": 688, "epoch": 8} {"train_loss": -14.020880699157715, "global_step": 689, "epoch": 8} {"train_loss": -14.237215995788574, "global_step": 690, "epoch": 8} {"train_loss": -14.016550064086914, "global_step": 691, "epoch": 8} {"train_loss": -14.204790115356445, "global_step": 692, "epoch": 8} {"train_loss": -13.932055473327637, "global_step": 693, "epoch": 8} {"train_loss": -14.15794563293457, "global_step": 694, "epoch": 8} {"train_loss": -14.134544372558594, "global_step": 695, "epoch": 8} {"train_loss": -14.07360553741455, "global_step": 696, "epoch": 8} {"train_loss": -14.231485366821289, "global_step": 697, "epoch": 8} {"train_loss": -14.180157661437988, "global_step": 698, "epoch": 8} {"train_loss": -13.978189468383789, "global_step": 699, "epoch": 8} {"train_loss": -14.292388916015625, "global_step": 700, "epoch": 8} {"train_loss": -14.405410766601562, "global_step": 701, "epoch": 8} {"train_loss": -14.344339370727539, "global_step": 702, "epoch": 8} {"train_loss": -13.449009895324707, "global_step": 703, "epoch": 8} {"train_loss": -14.723910331726074, "global_step": 704, "epoch": 8} {"train_loss": -14.0772066116333, "global_step": 705, "epoch": 8} {"train_loss": -14.198440551757812, "global_step": 706, "epoch": 8} {"train_loss": -14.091972351074219, "global_step": 707, "epoch": 8} {"train_loss": -13.868250846862793, "global_step": 708, "epoch": 8} {"train_loss": -14.715011596679688, "global_step": 709, "epoch": 8} {"train_loss": -14.089276313781738, "global_step": 710, "epoch": 8} {"train_loss": -14.25377368927002, "global_step": 711, "epoch": 8} {"train_loss": -14.121771812438965, "global_step": 712, "epoch": 8} {"train_loss": -13.836053848266602, "global_step": 713, "epoch": 8} {"train_loss": -14.244501113891602, "global_step": 714, "epoch": 8} {"train_loss": -14.302278518676758, "global_step": 715, "epoch": 8} {"train_loss": -14.134714126586914, "global_step": 716, "epoch": 8} {"train_loss": -14.106610298156738, "global_step": 717, "epoch": 8} {"train_loss": -14.201791763305664, "global_step": 718, "epoch": 8} {"train_loss": -14.275212287902832, "global_step": 719, "epoch": 8} {"train_loss": -13.990897178649902, "global_step": 720, "epoch": 8} {"train_loss": -14.207003593444824, "global_step": 721, "epoch": 8} {"train_loss": -14.506708145141602, "global_step": 722, "epoch": 8} {"train_loss": -14.156588554382324, "global_step": 723, "epoch": 8} {"train_loss": -14.026138305664062, "global_step": 724, "epoch": 8} {"train_loss": -13.949647903442383, "global_step": 725, "epoch": 8} {"train_loss": -14.40625, "global_step": 726, "epoch": 8} {"train_loss": -14.524054527282715, "global_step": 727, "epoch": 8} {"train_loss": -14.166996955871582, "global_step": 728, "epoch": 8} {"train_loss": -14.017146110534668, "global_step": 729, "epoch": 8} {"train_loss": -14.011981010437012, "global_step": 730, "epoch": 8} {"train_loss": -13.907111167907715, "global_step": 731, "epoch": 8} {"train_loss": -14.248181343078613, "global_step": 732, "epoch": 8} {"train_loss": -14.08390998840332, "global_step": 733, "epoch": 8} {"train_loss": -14.03303050994873, "global_step": 734, "epoch": 8} {"train_loss": -14.047629356384277, "global_step": 735, "epoch": 8} {"train_loss": -14.09107494354248, "global_step": 736, "epoch": 8} {"train_loss": -14.222250938415527, "global_step": 737, "epoch": 8} {"train_loss": -14.02709674835205, "global_step": 738, "epoch": 8} {"train_loss": -14.186566352844238, "global_step": 739, "epoch": 8} {"train_loss": -14.111979484558105, "global_step": 740, "epoch": 8} {"train_loss": -14.576704978942871, "global_step": 741, "epoch": 8} {"train_loss": -14.36718463897705, "global_step": 742, "epoch": 8} {"train_loss": -14.174356460571289, "global_step": 743, "epoch": 8} {"train_loss": -14.022295951843262, "global_step": 744, "epoch": 8} {"train_loss": -14.146199226379395, "global_step": 745, "epoch": 8} {"train_loss": -14.107473292982721, "global_step": 746, "epoch": 8, "val_loss": 10850613.0} {"train_loss": -13.942230224609375, "global_step": 747, "epoch": 9} {"train_loss": -14.283595085144043, "global_step": 748, "epoch": 9} {"train_loss": -14.282958030700684, "global_step": 749, "epoch": 9} {"train_loss": -13.847163200378418, "global_step": 750, "epoch": 9} {"train_loss": -13.820039749145508, "global_step": 751, "epoch": 9} {"train_loss": -14.06339168548584, "global_step": 752, "epoch": 9} {"train_loss": -14.563560485839844, "global_step": 753, "epoch": 9} {"train_loss": -14.20067024230957, "global_step": 754, "epoch": 9} {"train_loss": -13.988018989562988, "global_step": 755, "epoch": 9} {"train_loss": -14.091400146484375, "global_step": 756, "epoch": 9} {"train_loss": -14.45871639251709, "global_step": 757, "epoch": 9} {"train_loss": -14.144174575805664, "global_step": 758, "epoch": 9} {"train_loss": -14.160333633422852, "global_step": 759, "epoch": 9} {"train_loss": -13.768594741821289, "global_step": 760, "epoch": 9} {"train_loss": -14.254948616027832, "global_step": 761, "epoch": 9} {"train_loss": -14.089790344238281, "global_step": 762, "epoch": 9} {"train_loss": -14.209063529968262, "global_step": 763, "epoch": 9} {"train_loss": -14.405117988586426, "global_step": 764, "epoch": 9} {"train_loss": -14.64037799835205, "global_step": 765, "epoch": 9} {"train_loss": -14.042795181274414, "global_step": 766, "epoch": 9} {"train_loss": -14.331405639648438, "global_step": 767, "epoch": 9} {"train_loss": -14.283839225769043, "global_step": 768, "epoch": 9} {"train_loss": -14.187167167663574, "global_step": 769, "epoch": 9} {"train_loss": -14.062979698181152, "global_step": 770, "epoch": 9} {"train_loss": -14.452194213867188, "global_step": 771, "epoch": 9} {"train_loss": -14.111251831054688, "global_step": 772, "epoch": 9} {"train_loss": -14.335932731628418, "global_step": 773, "epoch": 9} {"train_loss": -14.305264472961426, "global_step": 774, "epoch": 9} {"train_loss": -14.159346580505371, "global_step": 775, "epoch": 9} {"train_loss": -14.478311538696289, "global_step": 776, "epoch": 9} {"train_loss": -14.670321464538574, "global_step": 777, "epoch": 9} {"train_loss": -14.132600784301758, "global_step": 778, "epoch": 9} {"train_loss": -14.381815910339355, "global_step": 779, "epoch": 9} {"train_loss": -13.691400527954102, "global_step": 780, "epoch": 9} {"train_loss": -13.98808765411377, "global_step": 781, "epoch": 9} {"train_loss": -14.578852653503418, "global_step": 782, "epoch": 9} {"train_loss": -14.324989318847656, "global_step": 783, "epoch": 9} {"train_loss": -14.402091026306152, "global_step": 784, "epoch": 9} {"train_loss": -14.044058799743652, "global_step": 785, "epoch": 9} {"train_loss": -14.846649169921875, "global_step": 786, "epoch": 9} {"train_loss": -14.488551139831543, "global_step": 787, "epoch": 9} {"train_loss": -14.272810935974121, "global_step": 788, "epoch": 9} {"train_loss": -14.664224624633789, "global_step": 789, "epoch": 9} {"train_loss": -13.88708209991455, "global_step": 790, "epoch": 9} {"train_loss": -14.413260459899902, "global_step": 791, "epoch": 9} {"train_loss": -14.487452507019043, "global_step": 792, "epoch": 9} {"train_loss": -15.02085018157959, "global_step": 793, "epoch": 9} {"train_loss": -14.510293960571289, "global_step": 794, "epoch": 9} {"train_loss": -14.468588829040527, "global_step": 795, "epoch": 9} {"train_loss": -14.390494346618652, "global_step": 796, "epoch": 9} {"train_loss": -14.266093254089355, "global_step": 797, "epoch": 9} {"train_loss": -14.335909843444824, "global_step": 798, "epoch": 9} {"train_loss": -14.366801261901855, "global_step": 799, "epoch": 9} {"train_loss": -14.8099365234375, "global_step": 800, "epoch": 9} {"train_loss": -14.326705932617188, "global_step": 801, "epoch": 9} {"train_loss": -14.20883846282959, "global_step": 802, "epoch": 9} {"train_loss": -14.41454792022705, "global_step": 803, "epoch": 9} {"train_loss": -14.538909912109375, "global_step": 804, "epoch": 9} {"train_loss": -14.195016860961914, "global_step": 805, "epoch": 9} {"train_loss": -14.112530708312988, "global_step": 806, "epoch": 9} {"train_loss": -14.057573318481445, "global_step": 807, "epoch": 9} {"train_loss": -14.560564994812012, "global_step": 808, "epoch": 9} {"train_loss": -14.705767631530762, "global_step": 809, "epoch": 9} {"train_loss": -14.478598594665527, "global_step": 810, "epoch": 9} {"train_loss": -14.1560640335083, "global_step": 811, "epoch": 9} {"train_loss": -14.237597465515137, "global_step": 812, "epoch": 9} {"train_loss": -14.123723030090332, "global_step": 813, "epoch": 9} {"train_loss": -14.00390625, "global_step": 814, "epoch": 9} {"train_loss": -13.846234321594238, "global_step": 815, "epoch": 9} {"train_loss": -14.20184326171875, "global_step": 816, "epoch": 9} {"train_loss": -14.74528980255127, "global_step": 817, "epoch": 9} {"train_loss": -14.198694229125977, "global_step": 818, "epoch": 9} {"train_loss": -14.037686347961426, "global_step": 819, "epoch": 9} {"train_loss": -14.627705574035645, "global_step": 820, "epoch": 9} {"train_loss": -14.446405410766602, "global_step": 821, "epoch": 9} {"train_loss": -14.657191276550293, "global_step": 822, "epoch": 9} {"train_loss": -14.223620414733887, "global_step": 823, "epoch": 9} {"train_loss": -14.687411308288574, "global_step": 824, "epoch": 9} {"train_loss": -14.477721214294434, "global_step": 825, "epoch": 9} {"train_loss": -14.482831001281738, "global_step": 826, "epoch": 9} {"train_loss": -13.775189399719238, "global_step": 827, "epoch": 9} {"train_loss": -14.659558296203613, "global_step": 828, "epoch": 9} {"train_loss": -14.30456788855863, "global_step": 829, "epoch": 9, "val_loss": 10709952.0} {"train_loss": -14.307463645935059, "global_step": 830, "epoch": 10} {"train_loss": -13.993487358093262, "global_step": 831, "epoch": 10} {"train_loss": -14.330162048339844, "global_step": 832, "epoch": 10} {"train_loss": -14.85693645477295, "global_step": 833, "epoch": 10} {"train_loss": -14.071937561035156, "global_step": 834, "epoch": 10} {"train_loss": -14.103144645690918, "global_step": 835, "epoch": 10} {"train_loss": -14.22590160369873, "global_step": 836, "epoch": 10} {"train_loss": -14.261474609375, "global_step": 837, "epoch": 10} {"train_loss": -14.728192329406738, "global_step": 838, "epoch": 10} {"train_loss": -14.626187324523926, "global_step": 839, "epoch": 10} {"train_loss": -14.223355293273926, "global_step": 840, "epoch": 10} {"train_loss": -14.398810386657715, "global_step": 841, "epoch": 10} {"train_loss": -14.585006713867188, "global_step": 842, "epoch": 10} {"train_loss": -14.679779052734375, "global_step": 843, "epoch": 10} {"train_loss": -14.293957710266113, "global_step": 844, "epoch": 10} {"train_loss": -14.404617309570312, "global_step": 845, "epoch": 10} {"train_loss": -14.6333646774292, "global_step": 846, "epoch": 10} {"train_loss": -14.683981895446777, "global_step": 847, "epoch": 10} {"train_loss": -14.7405424118042, "global_step": 848, "epoch": 10} {"train_loss": -14.700759887695312, "global_step": 849, "epoch": 10} {"train_loss": -14.55052661895752, "global_step": 850, "epoch": 10} {"train_loss": -14.239389419555664, "global_step": 851, "epoch": 10} {"train_loss": -14.622824668884277, "global_step": 852, "epoch": 10} {"train_loss": -14.508587837219238, "global_step": 853, "epoch": 10} {"train_loss": -14.18411922454834, "global_step": 854, "epoch": 10} {"train_loss": -14.805441856384277, "global_step": 855, "epoch": 10} {"train_loss": -14.77835750579834, "global_step": 856, "epoch": 10} {"train_loss": -14.476855278015137, "global_step": 857, "epoch": 10} {"train_loss": -14.938560485839844, "global_step": 858, "epoch": 10} {"train_loss": -14.071565628051758, "global_step": 859, "epoch": 10} {"train_loss": -14.691940307617188, "global_step": 860, "epoch": 10} {"train_loss": -14.419036865234375, "global_step": 861, "epoch": 10} {"train_loss": -14.556780815124512, "global_step": 862, "epoch": 10} {"train_loss": -14.528329849243164, "global_step": 863, "epoch": 10} {"train_loss": -14.498703002929688, "global_step": 864, "epoch": 10} {"train_loss": -14.433624267578125, "global_step": 865, "epoch": 10} {"train_loss": -14.444841384887695, "global_step": 866, "epoch": 10} {"train_loss": -14.514159202575684, "global_step": 867, "epoch": 10} {"train_loss": -14.316744804382324, "global_step": 868, "epoch": 10} {"train_loss": -14.637176513671875, "global_step": 869, "epoch": 10} {"train_loss": -13.851733207702637, "global_step": 870, "epoch": 10} {"train_loss": -14.73144817352295, "global_step": 871, "epoch": 10} {"train_loss": -14.84886646270752, "global_step": 872, "epoch": 10} {"train_loss": -14.036895751953125, "global_step": 873, "epoch": 10} {"train_loss": -15.494305610656738, "global_step": 874, "epoch": 10} {"train_loss": -14.545788764953613, "global_step": 875, "epoch": 10} {"train_loss": -14.774121284484863, "global_step": 876, "epoch": 10} {"train_loss": -14.503796577453613, "global_step": 877, "epoch": 10} {"train_loss": -14.453221321105957, "global_step": 878, "epoch": 10} {"train_loss": -14.645767211914062, "global_step": 879, "epoch": 10} {"train_loss": -14.435172080993652, "global_step": 880, "epoch": 10} {"train_loss": -14.739944458007812, "global_step": 881, "epoch": 10} {"train_loss": -14.180548667907715, "global_step": 882, "epoch": 10} {"train_loss": -15.127140998840332, "global_step": 883, "epoch": 10} {"train_loss": -14.525290489196777, "global_step": 884, "epoch": 10} {"train_loss": -13.878229141235352, "global_step": 885, "epoch": 10} {"train_loss": -14.748703002929688, "global_step": 886, "epoch": 10} {"train_loss": -14.292284965515137, "global_step": 887, "epoch": 10} {"train_loss": -14.578251838684082, "global_step": 888, "epoch": 10} {"train_loss": -14.441153526306152, "global_step": 889, "epoch": 10} {"train_loss": -15.044903755187988, "global_step": 890, "epoch": 10} {"train_loss": -14.6168851852417, "global_step": 891, "epoch": 10} {"train_loss": -14.920989990234375, "global_step": 892, "epoch": 10} {"train_loss": -14.3814697265625, "global_step": 893, "epoch": 10} {"train_loss": -14.010062217712402, "global_step": 894, "epoch": 10} {"train_loss": -14.272839546203613, "global_step": 895, "epoch": 10} {"train_loss": -14.451606750488281, "global_step": 896, "epoch": 10} {"train_loss": -14.583714485168457, "global_step": 897, "epoch": 10} {"train_loss": -14.545315742492676, "global_step": 898, "epoch": 10} {"train_loss": -14.21953296661377, "global_step": 899, "epoch": 10} {"train_loss": -14.194108963012695, "global_step": 900, "epoch": 10} {"train_loss": -14.429712295532227, "global_step": 901, "epoch": 10} {"train_loss": -14.473030090332031, "global_step": 902, "epoch": 10} {"train_loss": -14.386453628540039, "global_step": 903, "epoch": 10} {"train_loss": -14.570391654968262, "global_step": 904, "epoch": 10} {"train_loss": -14.392102241516113, "global_step": 905, "epoch": 10} {"train_loss": -14.1636962890625, "global_step": 906, "epoch": 10} {"train_loss": -14.640029907226562, "global_step": 907, "epoch": 10} {"train_loss": -14.896334648132324, "global_step": 908, "epoch": 10} {"train_loss": -14.267740249633789, "global_step": 909, "epoch": 10} {"train_loss": -14.74871826171875, "global_step": 910, "epoch": 10} {"train_loss": -15.021547317504883, "global_step": 911, "epoch": 10} {"train_loss": -14.502205779753536, "global_step": 912, "epoch": 10, "val_loss": 9874927.0} {"train_loss": -14.659113883972168, "global_step": 913, "epoch": 11} {"train_loss": -14.666356086730957, "global_step": 914, "epoch": 11} {"train_loss": -14.3639497756958, "global_step": 915, "epoch": 11} {"train_loss": -14.524802207946777, "global_step": 916, "epoch": 11} {"train_loss": -14.45892333984375, "global_step": 917, "epoch": 11} {"train_loss": -14.286356925964355, "global_step": 918, "epoch": 11} {"train_loss": -14.736688613891602, "global_step": 919, "epoch": 11} {"train_loss": -14.514846801757812, "global_step": 920, "epoch": 11} {"train_loss": -14.420135498046875, "global_step": 921, "epoch": 11} {"train_loss": -14.637102127075195, "global_step": 922, "epoch": 11} {"train_loss": -14.213516235351562, "global_step": 923, "epoch": 11} {"train_loss": -14.947196960449219, "global_step": 924, "epoch": 11} {"train_loss": -14.97447395324707, "global_step": 925, "epoch": 11} {"train_loss": -14.72913646697998, "global_step": 926, "epoch": 11} {"train_loss": -14.7299222946167, "global_step": 927, "epoch": 11} {"train_loss": -14.8897123336792, "global_step": 928, "epoch": 11} {"train_loss": -14.251968383789062, "global_step": 929, "epoch": 11} {"train_loss": -14.890631675720215, "global_step": 930, "epoch": 11} {"train_loss": -14.496978759765625, "global_step": 931, "epoch": 11} {"train_loss": -14.692519187927246, "global_step": 932, "epoch": 11} {"train_loss": -15.009592056274414, "global_step": 933, "epoch": 11} {"train_loss": -14.502169609069824, "global_step": 934, "epoch": 11} {"train_loss": -14.25749397277832, "global_step": 935, "epoch": 11} {"train_loss": -15.063974380493164, "global_step": 936, "epoch": 11} {"train_loss": -14.777256965637207, "global_step": 937, "epoch": 11} {"train_loss": -14.791396141052246, "global_step": 938, "epoch": 11} {"train_loss": -14.5200777053833, "global_step": 939, "epoch": 11} {"train_loss": -14.902922630310059, "global_step": 940, "epoch": 11} {"train_loss": -14.700398445129395, "global_step": 941, "epoch": 11} {"train_loss": -15.325759887695312, "global_step": 942, "epoch": 11} {"train_loss": -14.591479301452637, "global_step": 943, "epoch": 11} {"train_loss": -14.292617797851562, "global_step": 944, "epoch": 11} {"train_loss": -14.337233543395996, "global_step": 945, "epoch": 11} {"train_loss": -14.737318992614746, "global_step": 946, "epoch": 11} {"train_loss": -14.396512031555176, "global_step": 947, "epoch": 11} {"train_loss": -14.506024360656738, "global_step": 948, "epoch": 11} {"train_loss": -14.577086448669434, "global_step": 949, "epoch": 11} {"train_loss": -15.110015869140625, "global_step": 950, "epoch": 11} {"train_loss": -14.593127250671387, "global_step": 951, "epoch": 11} {"train_loss": -14.245953559875488, "global_step": 952, "epoch": 11} {"train_loss": -14.866050720214844, "global_step": 953, "epoch": 11} {"train_loss": -14.92166805267334, "global_step": 954, "epoch": 11} {"train_loss": -14.764373779296875, "global_step": 955, "epoch": 11} {"train_loss": -14.993067741394043, "global_step": 956, "epoch": 11} {"train_loss": -15.120678901672363, "global_step": 957, "epoch": 11} {"train_loss": -14.42846965789795, "global_step": 958, "epoch": 11} {"train_loss": -14.802348136901855, "global_step": 959, "epoch": 11} {"train_loss": -14.709147453308105, "global_step": 960, "epoch": 11} {"train_loss": -15.049298286437988, "global_step": 961, "epoch": 11} {"train_loss": -15.018710136413574, "global_step": 962, "epoch": 11} {"train_loss": -14.426953315734863, "global_step": 963, "epoch": 11} {"train_loss": -14.69512939453125, "global_step": 964, "epoch": 11} {"train_loss": -14.831860542297363, "global_step": 965, "epoch": 11} {"train_loss": -14.716989517211914, "global_step": 966, "epoch": 11} {"train_loss": -13.571948051452637, "global_step": 967, "epoch": 11} {"train_loss": -14.936915397644043, "global_step": 968, "epoch": 11} {"train_loss": -14.904312133789062, "global_step": 969, "epoch": 11} {"train_loss": -14.831517219543457, "global_step": 970, "epoch": 11} {"train_loss": -14.623910903930664, "global_step": 971, "epoch": 11} {"train_loss": -14.703018188476562, "global_step": 972, "epoch": 11} {"train_loss": -14.57837200164795, "global_step": 973, "epoch": 11} {"train_loss": -14.712862968444824, "global_step": 974, "epoch": 11} {"train_loss": -14.856460571289062, "global_step": 975, "epoch": 11} {"train_loss": -14.958670616149902, "global_step": 976, "epoch": 11} {"train_loss": -15.028755187988281, "global_step": 977, "epoch": 11} {"train_loss": -14.860709190368652, "global_step": 978, "epoch": 11} {"train_loss": -14.859916687011719, "global_step": 979, "epoch": 11} {"train_loss": -15.22296142578125, "global_step": 980, "epoch": 11} {"train_loss": -14.955947875976562, "global_step": 981, "epoch": 11} {"train_loss": -14.891084671020508, "global_step": 982, "epoch": 11} {"train_loss": -14.638521194458008, "global_step": 983, "epoch": 11} {"train_loss": -14.7925443649292, "global_step": 984, "epoch": 11} {"train_loss": -14.375226020812988, "global_step": 985, "epoch": 11} {"train_loss": -15.0117769241333, "global_step": 986, "epoch": 11} {"train_loss": -14.912506103515625, "global_step": 987, "epoch": 11} {"train_loss": -14.581889152526855, "global_step": 988, "epoch": 11} {"train_loss": -14.667620658874512, "global_step": 989, "epoch": 11} {"train_loss": -14.730351448059082, "global_step": 990, "epoch": 11} {"train_loss": -14.706146240234375, "global_step": 991, "epoch": 11} {"train_loss": -15.028616905212402, "global_step": 992, "epoch": 11} {"train_loss": -14.903510093688965, "global_step": 993, "epoch": 11} {"train_loss": -14.782754898071289, "global_step": 994, "epoch": 11} {"train_loss": -14.712347398321313, "global_step": 995, "epoch": 11, "val_loss": 9732485.0} {"train_loss": -14.579011917114258, "global_step": 996, "epoch": 12} {"train_loss": -14.27957820892334, "global_step": 997, "epoch": 12} {"train_loss": -14.800102233886719, "global_step": 998, "epoch": 12} {"train_loss": -14.263358116149902, "global_step": 999, "epoch": 12} {"train_loss": -14.661894798278809, "global_step": 1000, "epoch": 12} {"train_loss": -14.759366035461426, "global_step": 1001, "epoch": 12} {"train_loss": -14.75538158416748, "global_step": 1002, "epoch": 12} {"train_loss": -14.912409782409668, "global_step": 1003, "epoch": 12} {"train_loss": -14.969775199890137, "global_step": 1004, "epoch": 12} {"train_loss": -14.692178726196289, "global_step": 1005, "epoch": 12} {"train_loss": -14.64570140838623, "global_step": 1006, "epoch": 12} {"train_loss": -14.718901634216309, "global_step": 1007, "epoch": 12} {"train_loss": -14.998323440551758, "global_step": 1008, "epoch": 12} {"train_loss": -14.757662773132324, "global_step": 1009, "epoch": 12} {"train_loss": -14.350117683410645, "global_step": 1010, "epoch": 12} {"train_loss": -15.003252029418945, "global_step": 1011, "epoch": 12} {"train_loss": -14.540579795837402, "global_step": 1012, "epoch": 12} {"train_loss": -14.518094062805176, "global_step": 1013, "epoch": 12} {"train_loss": -15.133633613586426, "global_step": 1014, "epoch": 12} {"train_loss": -14.855401992797852, "global_step": 1015, "epoch": 12} {"train_loss": -15.23343563079834, "global_step": 1016, "epoch": 12} {"train_loss": -14.89573860168457, "global_step": 1017, "epoch": 12} {"train_loss": -14.957118034362793, "global_step": 1018, "epoch": 12} {"train_loss": -14.854225158691406, "global_step": 1019, "epoch": 12} {"train_loss": -14.985734939575195, "global_step": 1020, "epoch": 12} {"train_loss": -15.084887504577637, "global_step": 1021, "epoch": 12} {"train_loss": -14.566873550415039, "global_step": 1022, "epoch": 12} {"train_loss": -15.335932731628418, "global_step": 1023, "epoch": 12} {"train_loss": -14.849345207214355, "global_step": 1024, "epoch": 12} {"train_loss": -15.02397632598877, "global_step": 1025, "epoch": 12} {"train_loss": -15.025189399719238, "global_step": 1026, "epoch": 12} {"train_loss": -15.038558959960938, "global_step": 1027, "epoch": 12} {"train_loss": -14.776272773742676, "global_step": 1028, "epoch": 12} {"train_loss": -14.625935554504395, "global_step": 1029, "epoch": 12} {"train_loss": -15.123603820800781, "global_step": 1030, "epoch": 12} {"train_loss": -15.089555740356445, "global_step": 1031, "epoch": 12} {"train_loss": -15.2432861328125, "global_step": 1032, "epoch": 12} {"train_loss": -14.907307624816895, "global_step": 1033, "epoch": 12} {"train_loss": -14.695197105407715, "global_step": 1034, "epoch": 12} {"train_loss": -14.638928413391113, "global_step": 1035, "epoch": 12} {"train_loss": -14.63538646697998, "global_step": 1036, "epoch": 12} {"train_loss": -15.116930961608887, "global_step": 1037, "epoch": 12} {"train_loss": -14.91381549835205, "global_step": 1038, "epoch": 12} {"train_loss": -15.178466796875, "global_step": 1039, "epoch": 12} {"train_loss": -14.700340270996094, "global_step": 1040, "epoch": 12} {"train_loss": -14.571515083312988, "global_step": 1041, "epoch": 12} {"train_loss": -14.446710586547852, "global_step": 1042, "epoch": 12} {"train_loss": -14.795907974243164, "global_step": 1043, "epoch": 12} {"train_loss": -14.896598815917969, "global_step": 1044, "epoch": 12} {"train_loss": -14.723296165466309, "global_step": 1045, "epoch": 12} {"train_loss": -14.787530899047852, "global_step": 1046, "epoch": 12} {"train_loss": -14.961104393005371, "global_step": 1047, "epoch": 12} {"train_loss": -14.742843627929688, "global_step": 1048, "epoch": 12} {"train_loss": -15.07694149017334, "global_step": 1049, "epoch": 12} {"train_loss": -15.227729797363281, "global_step": 1050, "epoch": 12} {"train_loss": -14.7260160446167, "global_step": 1051, "epoch": 12} {"train_loss": -15.150901794433594, "global_step": 1052, "epoch": 12} {"train_loss": -14.523648262023926, "global_step": 1053, "epoch": 12} {"train_loss": -14.573417663574219, "global_step": 1054, "epoch": 12} {"train_loss": -14.471976280212402, "global_step": 1055, "epoch": 12} {"train_loss": -14.6498384475708, "global_step": 1056, "epoch": 12} {"train_loss": -14.887112617492676, "global_step": 1057, "epoch": 12} {"train_loss": -15.226963996887207, "global_step": 1058, "epoch": 12} {"train_loss": -14.816184043884277, "global_step": 1059, "epoch": 12} {"train_loss": -15.249588012695312, "global_step": 1060, "epoch": 12} {"train_loss": -15.486119270324707, "global_step": 1061, "epoch": 12} {"train_loss": -14.626593589782715, "global_step": 1062, "epoch": 12} {"train_loss": -15.008994102478027, "global_step": 1063, "epoch": 12} {"train_loss": -14.942941665649414, "global_step": 1064, "epoch": 12} {"train_loss": -15.13561725616455, "global_step": 1065, "epoch": 12} {"train_loss": -14.69688892364502, "global_step": 1066, "epoch": 12} {"train_loss": -14.916653633117676, "global_step": 1067, "epoch": 12} {"train_loss": -14.515494346618652, "global_step": 1068, "epoch": 12} {"train_loss": -14.683402061462402, "global_step": 1069, "epoch": 12} {"train_loss": -14.12816047668457, "global_step": 1070, "epoch": 12} {"train_loss": -15.087870597839355, "global_step": 1071, "epoch": 12} {"train_loss": -14.944086074829102, "global_step": 1072, "epoch": 12} {"train_loss": -14.430322647094727, "global_step": 1073, "epoch": 12} {"train_loss": -15.355669975280762, "global_step": 1074, "epoch": 12} {"train_loss": -15.2025785446167, "global_step": 1075, "epoch": 12} {"train_loss": -14.601724624633789, "global_step": 1076, "epoch": 12} {"train_loss": -14.560004234313965, "global_step": 1077, "epoch": 12} {"train_loss": -14.86554745593703, "global_step": 1078, "epoch": 12, "val_loss": 9376002.0} {"train_loss": -14.450461387634277, "global_step": 1079, "epoch": 13} {"train_loss": -15.147311210632324, "global_step": 1080, "epoch": 13} {"train_loss": -14.613136291503906, "global_step": 1081, "epoch": 13} {"train_loss": -14.658929824829102, "global_step": 1082, "epoch": 13} {"train_loss": -15.349087715148926, "global_step": 1083, "epoch": 13} {"train_loss": -15.18420696258545, "global_step": 1084, "epoch": 13} {"train_loss": -14.692835807800293, "global_step": 1085, "epoch": 13} {"train_loss": -14.629870414733887, "global_step": 1086, "epoch": 13} {"train_loss": -14.615832328796387, "global_step": 1087, "epoch": 13} {"train_loss": -15.131026268005371, "global_step": 1088, "epoch": 13} {"train_loss": -14.7290620803833, "global_step": 1089, "epoch": 13} {"train_loss": -15.0556001663208, "global_step": 1090, "epoch": 13} {"train_loss": -14.677230834960938, "global_step": 1091, "epoch": 13} {"train_loss": -15.37744140625, "global_step": 1092, "epoch": 13} {"train_loss": -14.646875381469727, "global_step": 1093, "epoch": 13} {"train_loss": -14.685089111328125, "global_step": 1094, "epoch": 13} {"train_loss": -14.962854385375977, "global_step": 1095, "epoch": 13} {"train_loss": -15.22416877746582, "global_step": 1096, "epoch": 13} {"train_loss": -14.8491849899292, "global_step": 1097, "epoch": 13} {"train_loss": -14.827609062194824, "global_step": 1098, "epoch": 13} {"train_loss": -14.914898872375488, "global_step": 1099, "epoch": 13} {"train_loss": -15.020052909851074, "global_step": 1100, "epoch": 13} {"train_loss": -15.500869750976562, "global_step": 1101, "epoch": 13} {"train_loss": -15.01785945892334, "global_step": 1102, "epoch": 13} {"train_loss": -15.06833553314209, "global_step": 1103, "epoch": 13} {"train_loss": -15.321036338806152, "global_step": 1104, "epoch": 13} {"train_loss": -14.76867389678955, "global_step": 1105, "epoch": 13} {"train_loss": -15.018381118774414, "global_step": 1106, "epoch": 13} {"train_loss": -14.304303169250488, "global_step": 1107, "epoch": 13} {"train_loss": -14.912490844726562, "global_step": 1108, "epoch": 13} {"train_loss": -15.36083698272705, "global_step": 1109, "epoch": 13} {"train_loss": -15.082155227661133, "global_step": 1110, "epoch": 13} {"train_loss": -14.901872634887695, "global_step": 1111, "epoch": 13} {"train_loss": -14.932672500610352, "global_step": 1112, "epoch": 13} {"train_loss": -15.316981315612793, "global_step": 1113, "epoch": 13} {"train_loss": -15.325594902038574, "global_step": 1114, "epoch": 13} {"train_loss": -14.775408744812012, "global_step": 1115, "epoch": 13} {"train_loss": -15.192916870117188, "global_step": 1116, "epoch": 13} {"train_loss": -14.879541397094727, "global_step": 1117, "epoch": 13} {"train_loss": -14.5700101852417, "global_step": 1118, "epoch": 13} {"train_loss": -15.008801460266113, "global_step": 1119, "epoch": 13} {"train_loss": -14.99761962890625, "global_step": 1120, "epoch": 13} {"train_loss": -14.92070198059082, "global_step": 1121, "epoch": 13} {"train_loss": -15.545923233032227, "global_step": 1122, "epoch": 13} {"train_loss": -15.329272270202637, "global_step": 1123, "epoch": 13} {"train_loss": -15.17730712890625, "global_step": 1124, "epoch": 13} {"train_loss": -14.875139236450195, "global_step": 1125, "epoch": 13} {"train_loss": -14.941858291625977, "global_step": 1126, "epoch": 13} {"train_loss": -15.100489616394043, "global_step": 1127, "epoch": 13} {"train_loss": -15.072891235351562, "global_step": 1128, "epoch": 13} {"train_loss": -14.941108703613281, "global_step": 1129, "epoch": 13} {"train_loss": -14.921160697937012, "global_step": 1130, "epoch": 13} {"train_loss": -15.242545127868652, "global_step": 1131, "epoch": 13} {"train_loss": -15.027254104614258, "global_step": 1132, "epoch": 13} {"train_loss": -15.339400291442871, "global_step": 1133, "epoch": 13} {"train_loss": -15.129034996032715, "global_step": 1134, "epoch": 13} {"train_loss": -14.8157320022583, "global_step": 1135, "epoch": 13} {"train_loss": -14.859155654907227, "global_step": 1136, "epoch": 13} {"train_loss": -15.275995254516602, "global_step": 1137, "epoch": 13} {"train_loss": -15.189203262329102, "global_step": 1138, "epoch": 13} {"train_loss": -15.062753677368164, "global_step": 1139, "epoch": 13} {"train_loss": -15.402722358703613, "global_step": 1140, "epoch": 13} {"train_loss": -14.687896728515625, "global_step": 1141, "epoch": 13} {"train_loss": -15.155621528625488, "global_step": 1142, "epoch": 13} {"train_loss": -15.012214660644531, "global_step": 1143, "epoch": 13} {"train_loss": -15.186152458190918, "global_step": 1144, "epoch": 13} {"train_loss": -15.227426528930664, "global_step": 1145, "epoch": 13} {"train_loss": -15.359061241149902, "global_step": 1146, "epoch": 13} {"train_loss": -15.257941246032715, "global_step": 1147, "epoch": 13} {"train_loss": -14.87022590637207, "global_step": 1148, "epoch": 13} {"train_loss": -14.8604097366333, "global_step": 1149, "epoch": 13} {"train_loss": -15.270407676696777, "global_step": 1150, "epoch": 13} {"train_loss": -14.953680992126465, "global_step": 1151, "epoch": 13} {"train_loss": -15.633540153503418, "global_step": 1152, "epoch": 13} {"train_loss": -15.174304008483887, "global_step": 1153, "epoch": 13} {"train_loss": -15.078471183776855, "global_step": 1154, "epoch": 13} {"train_loss": -15.235318183898926, "global_step": 1155, "epoch": 13} {"train_loss": -14.8363618850708, "global_step": 1156, "epoch": 13} {"train_loss": -15.8319091796875, "global_step": 1157, "epoch": 13} {"train_loss": -14.760421752929688, "global_step": 1158, "epoch": 13} {"train_loss": -15.336700439453125, "global_step": 1159, "epoch": 13} {"train_loss": -14.747024536132812, "global_step": 1160, "epoch": 13} {"train_loss": -15.03468241174537, "global_step": 1161, "epoch": 13, "val_loss": 9224254.0} {"train_loss": -15.308847427368164, "global_step": 1162, "epoch": 14} {"train_loss": -14.967126846313477, "global_step": 1163, "epoch": 14} {"train_loss": -15.1658296585083, "global_step": 1164, "epoch": 14} {"train_loss": -15.15142822265625, "global_step": 1165, "epoch": 14} {"train_loss": -14.652313232421875, "global_step": 1166, "epoch": 14} {"train_loss": -14.511731147766113, "global_step": 1167, "epoch": 14} {"train_loss": -14.933334350585938, "global_step": 1168, "epoch": 14} {"train_loss": -15.1569242477417, "global_step": 1169, "epoch": 14} {"train_loss": -15.027679443359375, "global_step": 1170, "epoch": 14} {"train_loss": -14.700915336608887, "global_step": 1171, "epoch": 14} {"train_loss": -15.426276206970215, "global_step": 1172, "epoch": 14} {"train_loss": -15.466635704040527, "global_step": 1173, "epoch": 14} {"train_loss": -15.106863975524902, "global_step": 1174, "epoch": 14} {"train_loss": -15.513836860656738, "global_step": 1175, "epoch": 14} {"train_loss": -15.295001029968262, "global_step": 1176, "epoch": 14} {"train_loss": -15.07529354095459, "global_step": 1177, "epoch": 14} {"train_loss": -15.536813735961914, "global_step": 1178, "epoch": 14} {"train_loss": -15.036099433898926, "global_step": 1179, "epoch": 14} {"train_loss": -15.120584487915039, "global_step": 1180, "epoch": 14} {"train_loss": -14.483179092407227, "global_step": 1181, "epoch": 14} {"train_loss": -15.11107063293457, "global_step": 1182, "epoch": 14} {"train_loss": -15.18411922454834, "global_step": 1183, "epoch": 14} {"train_loss": -15.002344131469727, "global_step": 1184, "epoch": 14} {"train_loss": -15.085357666015625, "global_step": 1185, "epoch": 14} {"train_loss": -14.804405212402344, "global_step": 1186, "epoch": 14} {"train_loss": -15.153863906860352, "global_step": 1187, "epoch": 14} {"train_loss": -14.699980735778809, "global_step": 1188, "epoch": 14} {"train_loss": -14.91968822479248, "global_step": 1189, "epoch": 14} {"train_loss": -15.129638671875, "global_step": 1190, "epoch": 14} {"train_loss": -15.820904731750488, "global_step": 1191, "epoch": 14} {"train_loss": -14.782587051391602, "global_step": 1192, "epoch": 14} {"train_loss": -15.754977226257324, "global_step": 1193, "epoch": 14} {"train_loss": -14.785913467407227, "global_step": 1194, "epoch": 14} {"train_loss": -15.324441909790039, "global_step": 1195, "epoch": 14} {"train_loss": -14.910244941711426, "global_step": 1196, "epoch": 14} {"train_loss": -15.040743827819824, "global_step": 1197, "epoch": 14} {"train_loss": -14.841635704040527, "global_step": 1198, "epoch": 14} {"train_loss": -14.535364151000977, "global_step": 1199, "epoch": 14} {"train_loss": -15.15479564666748, "global_step": 1200, "epoch": 14} {"train_loss": -14.8695707321167, "global_step": 1201, "epoch": 14} {"train_loss": -15.339212417602539, "global_step": 1202, "epoch": 14} {"train_loss": -15.303733825683594, "global_step": 1203, "epoch": 14} {"train_loss": -14.929890632629395, "global_step": 1204, "epoch": 14} {"train_loss": -15.02648639678955, "global_step": 1205, "epoch": 14} {"train_loss": -15.55535888671875, "global_step": 1206, "epoch": 14} {"train_loss": -15.685541152954102, "global_step": 1207, "epoch": 14} {"train_loss": -15.292864799499512, "global_step": 1208, "epoch": 14} {"train_loss": -15.313328742980957, "global_step": 1209, "epoch": 14} {"train_loss": -15.02838134765625, "global_step": 1210, "epoch": 14} {"train_loss": -14.778973579406738, "global_step": 1211, "epoch": 14} {"train_loss": -15.758310317993164, "global_step": 1212, "epoch": 14} {"train_loss": -15.0891695022583, "global_step": 1213, "epoch": 14} {"train_loss": -14.782670974731445, "global_step": 1214, "epoch": 14} {"train_loss": -15.058786392211914, "global_step": 1215, "epoch": 14} {"train_loss": -15.173515319824219, "global_step": 1216, "epoch": 14} {"train_loss": -15.121687889099121, "global_step": 1217, "epoch": 14} {"train_loss": -15.470817565917969, "global_step": 1218, "epoch": 14} {"train_loss": -15.423075675964355, "global_step": 1219, "epoch": 14} {"train_loss": -15.459060668945312, "global_step": 1220, "epoch": 14} {"train_loss": -15.178049087524414, "global_step": 1221, "epoch": 14} {"train_loss": -15.24688720703125, "global_step": 1222, "epoch": 14} {"train_loss": -15.476391792297363, "global_step": 1223, "epoch": 14} {"train_loss": -15.084856986999512, "global_step": 1224, "epoch": 14} {"train_loss": -15.158843040466309, "global_step": 1225, "epoch": 14} {"train_loss": -14.789807319641113, "global_step": 1226, "epoch": 14} {"train_loss": -15.137811660766602, "global_step": 1227, "epoch": 14} {"train_loss": -15.629180908203125, "global_step": 1228, "epoch": 14} {"train_loss": -14.862309455871582, "global_step": 1229, "epoch": 14} {"train_loss": -15.516242980957031, "global_step": 1230, "epoch": 14} {"train_loss": -15.288395881652832, "global_step": 1231, "epoch": 14} {"train_loss": -15.173059463500977, "global_step": 1232, "epoch": 14} {"train_loss": -15.239168167114258, "global_step": 1233, "epoch": 14} {"train_loss": -14.98388671875, "global_step": 1234, "epoch": 14} {"train_loss": -15.187753677368164, "global_step": 1235, "epoch": 14} {"train_loss": -14.930493354797363, "global_step": 1236, "epoch": 14} {"train_loss": -15.19589900970459, "global_step": 1237, "epoch": 14} {"train_loss": -15.218365669250488, "global_step": 1238, "epoch": 14} {"train_loss": -15.439849853515625, "global_step": 1239, "epoch": 14} {"train_loss": -15.412497520446777, "global_step": 1240, "epoch": 14} {"train_loss": -15.25256061553955, "global_step": 1241, "epoch": 14} {"train_loss": -15.208149909973145, "global_step": 1242, "epoch": 14} {"train_loss": -15.1226224899292, "global_step": 1243, "epoch": 14} {"train_loss": -15.14175974604595, "global_step": 1244, "epoch": 14, "val_loss": 9115954.0} {"train_loss": -14.785529136657715, "global_step": 1245, "epoch": 15} {"train_loss": -15.419939994812012, "global_step": 1246, "epoch": 15} {"train_loss": -15.235963821411133, "global_step": 1247, "epoch": 15} {"train_loss": -15.587002754211426, "global_step": 1248, "epoch": 15} {"train_loss": -14.851366996765137, "global_step": 1249, "epoch": 15} {"train_loss": -15.411224365234375, "global_step": 1250, "epoch": 15} {"train_loss": -15.47824764251709, "global_step": 1251, "epoch": 15} {"train_loss": -15.185528755187988, "global_step": 1252, "epoch": 15} {"train_loss": -15.549356460571289, "global_step": 1253, "epoch": 15} {"train_loss": -15.453343391418457, "global_step": 1254, "epoch": 15} {"train_loss": -15.251311302185059, "global_step": 1255, "epoch": 15} {"train_loss": -14.901972770690918, "global_step": 1256, "epoch": 15} {"train_loss": -15.180102348327637, "global_step": 1257, "epoch": 15} {"train_loss": -15.175108909606934, "global_step": 1258, "epoch": 15} {"train_loss": -15.185035705566406, "global_step": 1259, "epoch": 15} {"train_loss": -15.286338806152344, "global_step": 1260, "epoch": 15} {"train_loss": -15.475931167602539, "global_step": 1261, "epoch": 15} {"train_loss": -15.233810424804688, "global_step": 1262, "epoch": 15} {"train_loss": -15.428954124450684, "global_step": 1263, "epoch": 15} {"train_loss": -15.074020385742188, "global_step": 1264, "epoch": 15} {"train_loss": -15.541460990905762, "global_step": 1265, "epoch": 15} {"train_loss": -15.340703010559082, "global_step": 1266, "epoch": 15} {"train_loss": -15.294000625610352, "global_step": 1267, "epoch": 15} {"train_loss": -15.068498611450195, "global_step": 1268, "epoch": 15} {"train_loss": -15.606722831726074, "global_step": 1269, "epoch": 15} {"train_loss": -15.336020469665527, "global_step": 1270, "epoch": 15} {"train_loss": -15.519902229309082, "global_step": 1271, "epoch": 15} {"train_loss": -15.58197021484375, "global_step": 1272, "epoch": 15} {"train_loss": -15.388940811157227, "global_step": 1273, "epoch": 15} {"train_loss": -15.3590726852417, "global_step": 1274, "epoch": 15} {"train_loss": -15.500048637390137, "global_step": 1275, "epoch": 15} {"train_loss": -15.074464797973633, "global_step": 1276, "epoch": 15} {"train_loss": -15.40778636932373, "global_step": 1277, "epoch": 15} {"train_loss": -15.203722953796387, "global_step": 1278, "epoch": 15} {"train_loss": -15.590184211730957, "global_step": 1279, "epoch": 15} {"train_loss": -15.475737571716309, "global_step": 1280, "epoch": 15} {"train_loss": -15.124809265136719, "global_step": 1281, "epoch": 15} {"train_loss": -15.310641288757324, "global_step": 1282, "epoch": 15} {"train_loss": -15.148640632629395, "global_step": 1283, "epoch": 15} {"train_loss": -15.675264358520508, "global_step": 1284, "epoch": 15} {"train_loss": -15.126062393188477, "global_step": 1285, "epoch": 15} {"train_loss": -15.00662899017334, "global_step": 1286, "epoch": 15} {"train_loss": -15.230079650878906, "global_step": 1287, "epoch": 15} {"train_loss": -15.0313138961792, "global_step": 1288, "epoch": 15} {"train_loss": -14.935343742370605, "global_step": 1289, "epoch": 15} {"train_loss": -15.236017227172852, "global_step": 1290, "epoch": 15} {"train_loss": -15.194483757019043, "global_step": 1291, "epoch": 15} {"train_loss": -15.529913902282715, "global_step": 1292, "epoch": 15} {"train_loss": -15.149545669555664, "global_step": 1293, "epoch": 15} {"train_loss": -15.218283653259277, "global_step": 1294, "epoch": 15} {"train_loss": -15.097735404968262, "global_step": 1295, "epoch": 15} {"train_loss": -15.274194717407227, "global_step": 1296, "epoch": 15} {"train_loss": -15.123507499694824, "global_step": 1297, "epoch": 15} {"train_loss": -15.142788887023926, "global_step": 1298, "epoch": 15} {"train_loss": -14.838668823242188, "global_step": 1299, "epoch": 15} {"train_loss": -15.744613647460938, "global_step": 1300, "epoch": 15} {"train_loss": -14.851519584655762, "global_step": 1301, "epoch": 15} {"train_loss": -15.650398254394531, "global_step": 1302, "epoch": 15} {"train_loss": -15.22314453125, "global_step": 1303, "epoch": 15} {"train_loss": -15.111172676086426, "global_step": 1304, "epoch": 15} {"train_loss": -15.43729305267334, "global_step": 1305, "epoch": 15} {"train_loss": -15.627573013305664, "global_step": 1306, "epoch": 15} {"train_loss": -15.5076904296875, "global_step": 1307, "epoch": 15} {"train_loss": -15.202232360839844, "global_step": 1308, "epoch": 15} {"train_loss": -15.459311485290527, "global_step": 1309, "epoch": 15} {"train_loss": -15.219322204589844, "global_step": 1310, "epoch": 15} {"train_loss": -15.283717155456543, "global_step": 1311, "epoch": 15} {"train_loss": -15.239877700805664, "global_step": 1312, "epoch": 15} {"train_loss": -15.202349662780762, "global_step": 1313, "epoch": 15} {"train_loss": -15.182089805603027, "global_step": 1314, "epoch": 15} {"train_loss": -15.50943660736084, "global_step": 1315, "epoch": 15} {"train_loss": -14.714154243469238, "global_step": 1316, "epoch": 15} {"train_loss": -15.198060989379883, "global_step": 1317, "epoch": 15} {"train_loss": -15.077948570251465, "global_step": 1318, "epoch": 15} {"train_loss": -15.210661888122559, "global_step": 1319, "epoch": 15} {"train_loss": -15.274713516235352, "global_step": 1320, "epoch": 15} {"train_loss": -14.799426078796387, "global_step": 1321, "epoch": 15} {"train_loss": -15.561004638671875, "global_step": 1322, "epoch": 15} {"train_loss": -15.488740921020508, "global_step": 1323, "epoch": 15} {"train_loss": -15.254440307617188, "global_step": 1324, "epoch": 15} {"train_loss": -15.444632530212402, "global_step": 1325, "epoch": 15} {"train_loss": -15.1431884765625, "global_step": 1326, "epoch": 15} {"train_loss": -15.271526164319141, "global_step": 1327, "epoch": 15, "val_loss": 9038108.0} {"train_loss": -15.677932739257812, "global_step": 1328, "epoch": 16} {"train_loss": -14.91590404510498, "global_step": 1329, "epoch": 16} {"train_loss": -15.40518856048584, "global_step": 1330, "epoch": 16} {"train_loss": -15.067522048950195, "global_step": 1331, "epoch": 16} {"train_loss": -15.500235557556152, "global_step": 1332, "epoch": 16} {"train_loss": -15.216147422790527, "global_step": 1333, "epoch": 16} {"train_loss": -15.128893852233887, "global_step": 1334, "epoch": 16} {"train_loss": -15.311784744262695, "global_step": 1335, "epoch": 16} {"train_loss": -14.963678359985352, "global_step": 1336, "epoch": 16} {"train_loss": -14.95550537109375, "global_step": 1337, "epoch": 16} {"train_loss": -15.29150676727295, "global_step": 1338, "epoch": 16} {"train_loss": -14.837615966796875, "global_step": 1339, "epoch": 16} {"train_loss": -15.41791820526123, "global_step": 1340, "epoch": 16} {"train_loss": -15.22803020477295, "global_step": 1341, "epoch": 16} {"train_loss": -15.360003471374512, "global_step": 1342, "epoch": 16} {"train_loss": -15.210009574890137, "global_step": 1343, "epoch": 16} {"train_loss": -15.191195487976074, "global_step": 1344, "epoch": 16} {"train_loss": -15.214853286743164, "global_step": 1345, "epoch": 16} {"train_loss": -15.19398021697998, "global_step": 1346, "epoch": 16} {"train_loss": -15.150166511535645, "global_step": 1347, "epoch": 16} {"train_loss": -15.674160957336426, "global_step": 1348, "epoch": 16} {"train_loss": -15.047396659851074, "global_step": 1349, "epoch": 16} {"train_loss": -15.323511123657227, "global_step": 1350, "epoch": 16} {"train_loss": -15.447209358215332, "global_step": 1351, "epoch": 16} {"train_loss": -14.965814590454102, "global_step": 1352, "epoch": 16} {"train_loss": -15.434196472167969, "global_step": 1353, "epoch": 16} {"train_loss": -15.425729751586914, "global_step": 1354, "epoch": 16} {"train_loss": -15.489465713500977, "global_step": 1355, "epoch": 16} {"train_loss": -15.198043823242188, "global_step": 1356, "epoch": 16} {"train_loss": -15.002037048339844, "global_step": 1357, "epoch": 16} {"train_loss": -15.398323059082031, "global_step": 1358, "epoch": 16} {"train_loss": -15.72537899017334, "global_step": 1359, "epoch": 16} {"train_loss": -15.51525592803955, "global_step": 1360, "epoch": 16} {"train_loss": -15.489008903503418, "global_step": 1361, "epoch": 16} {"train_loss": -15.408668518066406, "global_step": 1362, "epoch": 16} {"train_loss": -15.395851135253906, "global_step": 1363, "epoch": 16} {"train_loss": -15.339731216430664, "global_step": 1364, "epoch": 16} {"train_loss": -15.636115074157715, "global_step": 1365, "epoch": 16} {"train_loss": -15.098919868469238, "global_step": 1366, "epoch": 16} {"train_loss": -15.401965141296387, "global_step": 1367, "epoch": 16} {"train_loss": -15.821261405944824, "global_step": 1368, "epoch": 16} {"train_loss": -15.363286018371582, "global_step": 1369, "epoch": 16} {"train_loss": -15.600035667419434, "global_step": 1370, "epoch": 16} {"train_loss": -15.679373741149902, "global_step": 1371, "epoch": 16} {"train_loss": -15.386914253234863, "global_step": 1372, "epoch": 16} {"train_loss": -15.501080513000488, "global_step": 1373, "epoch": 16} {"train_loss": -15.766159057617188, "global_step": 1374, "epoch": 16} {"train_loss": -15.2777738571167, "global_step": 1375, "epoch": 16} {"train_loss": -14.945548057556152, "global_step": 1376, "epoch": 16} {"train_loss": -15.565844535827637, "global_step": 1377, "epoch": 16} {"train_loss": -15.347480773925781, "global_step": 1378, "epoch": 16} {"train_loss": -15.411966323852539, "global_step": 1379, "epoch": 16} {"train_loss": -15.241436958312988, "global_step": 1380, "epoch": 16} {"train_loss": -15.638676643371582, "global_step": 1381, "epoch": 16} {"train_loss": -15.254206657409668, "global_step": 1382, "epoch": 16} {"train_loss": -15.693506240844727, "global_step": 1383, "epoch": 16} {"train_loss": -15.446356773376465, "global_step": 1384, "epoch": 16} {"train_loss": -15.964571952819824, "global_step": 1385, "epoch": 16} {"train_loss": -15.149373054504395, "global_step": 1386, "epoch": 16} {"train_loss": -15.6152925491333, "global_step": 1387, "epoch": 16} {"train_loss": -15.3878173828125, "global_step": 1388, "epoch": 16} {"train_loss": -15.325085639953613, "global_step": 1389, "epoch": 16} {"train_loss": -15.43901252746582, "global_step": 1390, "epoch": 16} {"train_loss": -15.361926078796387, "global_step": 1391, "epoch": 16} {"train_loss": -15.301872253417969, "global_step": 1392, "epoch": 16} {"train_loss": -15.144757270812988, "global_step": 1393, "epoch": 16} {"train_loss": -15.373125076293945, "global_step": 1394, "epoch": 16} {"train_loss": -15.421843528747559, "global_step": 1395, "epoch": 16} {"train_loss": -15.524558067321777, "global_step": 1396, "epoch": 16} {"train_loss": -15.705044746398926, "global_step": 1397, "epoch": 16} {"train_loss": -15.510119438171387, "global_step": 1398, "epoch": 16} {"train_loss": -15.114250183105469, "global_step": 1399, "epoch": 16} {"train_loss": -15.305310249328613, "global_step": 1400, "epoch": 16} {"train_loss": -15.3101167678833, "global_step": 1401, "epoch": 16} {"train_loss": -15.398383140563965, "global_step": 1402, "epoch": 16} {"train_loss": -15.177008628845215, "global_step": 1403, "epoch": 16} {"train_loss": -15.261377334594727, "global_step": 1404, "epoch": 16} {"train_loss": -15.50723934173584, "global_step": 1405, "epoch": 16} {"train_loss": -15.598077774047852, "global_step": 1406, "epoch": 16} {"train_loss": -15.349865913391113, "global_step": 1407, "epoch": 16} {"train_loss": -15.470873832702637, "global_step": 1408, "epoch": 16} {"train_loss": -15.068066596984863, "global_step": 1409, "epoch": 16} {"train_loss": -15.359962130167398, "global_step": 1410, "epoch": 16, "val_loss": 8729304.0} {"train_loss": -15.04478645324707, "global_step": 1411, "epoch": 17} {"train_loss": -15.210731506347656, "global_step": 1412, "epoch": 17} {"train_loss": -15.14617919921875, "global_step": 1413, "epoch": 17} {"train_loss": -15.409573554992676, "global_step": 1414, "epoch": 17} {"train_loss": -15.345102310180664, "global_step": 1415, "epoch": 17} {"train_loss": -15.2091703414917, "global_step": 1416, "epoch": 17} {"train_loss": -15.096254348754883, "global_step": 1417, "epoch": 17} {"train_loss": -15.626410484313965, "global_step": 1418, "epoch": 17} {"train_loss": -15.376733779907227, "global_step": 1419, "epoch": 17} {"train_loss": -15.193900108337402, "global_step": 1420, "epoch": 17} {"train_loss": -15.151613235473633, "global_step": 1421, "epoch": 17} {"train_loss": -15.197549819946289, "global_step": 1422, "epoch": 17} {"train_loss": -15.663435935974121, "global_step": 1423, "epoch": 17} {"train_loss": -15.459677696228027, "global_step": 1424, "epoch": 17} {"train_loss": -15.24413776397705, "global_step": 1425, "epoch": 17} {"train_loss": -15.303070068359375, "global_step": 1426, "epoch": 17} {"train_loss": -15.360095024108887, "global_step": 1427, "epoch": 17} {"train_loss": -15.6129732131958, "global_step": 1428, "epoch": 17} {"train_loss": -15.52111530303955, "global_step": 1429, "epoch": 17} {"train_loss": -15.754800796508789, "global_step": 1430, "epoch": 17} {"train_loss": -15.471435546875, "global_step": 1431, "epoch": 17} {"train_loss": -15.538626670837402, "global_step": 1432, "epoch": 17} {"train_loss": -15.275545120239258, "global_step": 1433, "epoch": 17} {"train_loss": -15.62688159942627, "global_step": 1434, "epoch": 17} {"train_loss": -15.371174812316895, "global_step": 1435, "epoch": 17} {"train_loss": -15.396466255187988, "global_step": 1436, "epoch": 17} {"train_loss": -15.217875480651855, "global_step": 1437, "epoch": 17} {"train_loss": -15.361602783203125, "global_step": 1438, "epoch": 17} {"train_loss": -15.698153495788574, "global_step": 1439, "epoch": 17} {"train_loss": -15.633990287780762, "global_step": 1440, "epoch": 17} {"train_loss": -15.125990867614746, "global_step": 1441, "epoch": 17} {"train_loss": -15.151407241821289, "global_step": 1442, "epoch": 17} {"train_loss": -15.25108528137207, "global_step": 1443, "epoch": 17} {"train_loss": -15.099392890930176, "global_step": 1444, "epoch": 17} {"train_loss": -15.597549438476562, "global_step": 1445, "epoch": 17} {"train_loss": -15.259071350097656, "global_step": 1446, "epoch": 17} {"train_loss": -15.652978897094727, "global_step": 1447, "epoch": 17} {"train_loss": -15.599960327148438, "global_step": 1448, "epoch": 17} {"train_loss": -15.748272895812988, "global_step": 1449, "epoch": 17} {"train_loss": -15.535669326782227, "global_step": 1450, "epoch": 17} {"train_loss": -15.350512504577637, "global_step": 1451, "epoch": 17} {"train_loss": -15.66055965423584, "global_step": 1452, "epoch": 17} {"train_loss": -15.557812690734863, "global_step": 1453, "epoch": 17} {"train_loss": -15.363753318786621, "global_step": 1454, "epoch": 17} {"train_loss": -15.110383987426758, "global_step": 1455, "epoch": 17} {"train_loss": -15.508682250976562, "global_step": 1456, "epoch": 17} {"train_loss": -15.270878791809082, "global_step": 1457, "epoch": 17} {"train_loss": -15.737727165222168, "global_step": 1458, "epoch": 17} {"train_loss": -15.492965698242188, "global_step": 1459, "epoch": 17} {"train_loss": -15.427833557128906, "global_step": 1460, "epoch": 17} {"train_loss": -15.382553100585938, "global_step": 1461, "epoch": 17} {"train_loss": -15.601953506469727, "global_step": 1462, "epoch": 17} {"train_loss": -15.549220085144043, "global_step": 1463, "epoch": 17} {"train_loss": -15.210268020629883, "global_step": 1464, "epoch": 17} {"train_loss": -15.348441123962402, "global_step": 1465, "epoch": 17} {"train_loss": -15.24277400970459, "global_step": 1466, "epoch": 17} {"train_loss": -15.575624465942383, "global_step": 1467, "epoch": 17} {"train_loss": -15.914955139160156, "global_step": 1468, "epoch": 17} {"train_loss": -15.412894248962402, "global_step": 1469, "epoch": 17} {"train_loss": -15.669000625610352, "global_step": 1470, "epoch": 17} {"train_loss": -15.677444458007812, "global_step": 1471, "epoch": 17} {"train_loss": -15.468655586242676, "global_step": 1472, "epoch": 17} {"train_loss": -15.751497268676758, "global_step": 1473, "epoch": 17} {"train_loss": -15.39255428314209, "global_step": 1474, "epoch": 17} {"train_loss": -15.297507286071777, "global_step": 1475, "epoch": 17} {"train_loss": -15.905142784118652, "global_step": 1476, "epoch": 17} {"train_loss": -15.992932319641113, "global_step": 1477, "epoch": 17} {"train_loss": -15.449371337890625, "global_step": 1478, "epoch": 17} {"train_loss": -15.132145881652832, "global_step": 1479, "epoch": 17} {"train_loss": -15.708734512329102, "global_step": 1480, "epoch": 17} {"train_loss": -15.767840385437012, "global_step": 1481, "epoch": 17} {"train_loss": -15.711337089538574, "global_step": 1482, "epoch": 17} {"train_loss": -15.781966209411621, "global_step": 1483, "epoch": 17} {"train_loss": -15.223868370056152, "global_step": 1484, "epoch": 17} {"train_loss": -15.952285766601562, "global_step": 1485, "epoch": 17} {"train_loss": -15.9692964553833, "global_step": 1486, "epoch": 17} {"train_loss": -15.281704902648926, "global_step": 1487, "epoch": 17} {"train_loss": -15.426825523376465, "global_step": 1488, "epoch": 17} {"train_loss": -15.23850154876709, "global_step": 1489, "epoch": 17} {"train_loss": -15.401476860046387, "global_step": 1490, "epoch": 17} {"train_loss": -15.499651908874512, "global_step": 1491, "epoch": 17} {"train_loss": -15.279324531555176, "global_step": 1492, "epoch": 17} {"train_loss": -15.454302477549357, "global_step": 1493, "epoch": 17, "val_loss": 8676233.0} {"train_loss": -15.398490905761719, "global_step": 1494, "epoch": 18} {"train_loss": -15.205459594726562, "global_step": 1495, "epoch": 18} {"train_loss": -15.473956108093262, "global_step": 1496, "epoch": 18} {"train_loss": -15.613909721374512, "global_step": 1497, "epoch": 18} {"train_loss": -15.577966690063477, "global_step": 1498, "epoch": 18} {"train_loss": -15.48209285736084, "global_step": 1499, "epoch": 18} {"train_loss": -15.302508354187012, "global_step": 1500, "epoch": 18} {"train_loss": -15.621752738952637, "global_step": 1501, "epoch": 18} {"train_loss": -15.441667556762695, "global_step": 1502, "epoch": 18} {"train_loss": -15.124397277832031, "global_step": 1503, "epoch": 18} {"train_loss": -15.694327354431152, "global_step": 1504, "epoch": 18} {"train_loss": -15.679303169250488, "global_step": 1505, "epoch": 18} {"train_loss": -15.579025268554688, "global_step": 1506, "epoch": 18} {"train_loss": -15.31652545928955, "global_step": 1507, "epoch": 18} {"train_loss": -15.355737686157227, "global_step": 1508, "epoch": 18} {"train_loss": -15.71710205078125, "global_step": 1509, "epoch": 18} {"train_loss": -15.694368362426758, "global_step": 1510, "epoch": 18} {"train_loss": -15.644968032836914, "global_step": 1511, "epoch": 18} {"train_loss": -15.289688110351562, "global_step": 1512, "epoch": 18} {"train_loss": -15.383874893188477, "global_step": 1513, "epoch": 18} {"train_loss": -15.38165283203125, "global_step": 1514, "epoch": 18} {"train_loss": -15.499414443969727, "global_step": 1515, "epoch": 18} {"train_loss": -15.22038459777832, "global_step": 1516, "epoch": 18} {"train_loss": -15.532782554626465, "global_step": 1517, "epoch": 18} {"train_loss": -15.231689453125, "global_step": 1518, "epoch": 18} {"train_loss": -15.470189094543457, "global_step": 1519, "epoch": 18} {"train_loss": -15.531880378723145, "global_step": 1520, "epoch": 18} {"train_loss": -15.083198547363281, "global_step": 1521, "epoch": 18} {"train_loss": -15.578737258911133, "global_step": 1522, "epoch": 18} {"train_loss": -15.622624397277832, "global_step": 1523, "epoch": 18} {"train_loss": -15.761514663696289, "global_step": 1524, "epoch": 18} {"train_loss": -15.565035820007324, "global_step": 1525, "epoch": 18} {"train_loss": -16.02941131591797, "global_step": 1526, "epoch": 18} {"train_loss": -15.197344779968262, "global_step": 1527, "epoch": 18} {"train_loss": -15.572527885437012, "global_step": 1528, "epoch": 18} {"train_loss": -15.618616104125977, "global_step": 1529, "epoch": 18} {"train_loss": -15.957640647888184, "global_step": 1530, "epoch": 18} {"train_loss": -15.644685745239258, "global_step": 1531, "epoch": 18} {"train_loss": -15.578558921813965, "global_step": 1532, "epoch": 18} {"train_loss": -15.797492027282715, "global_step": 1533, "epoch": 18} {"train_loss": -15.442370414733887, "global_step": 1534, "epoch": 18} {"train_loss": -16.185293197631836, "global_step": 1535, "epoch": 18} {"train_loss": -15.87781810760498, "global_step": 1536, "epoch": 18} {"train_loss": -15.778897285461426, "global_step": 1537, "epoch": 18} {"train_loss": -15.32489013671875, "global_step": 1538, "epoch": 18} {"train_loss": -15.35118293762207, "global_step": 1539, "epoch": 18} {"train_loss": -15.3485107421875, "global_step": 1540, "epoch": 18} {"train_loss": -15.491601943969727, "global_step": 1541, "epoch": 18} {"train_loss": -15.731292724609375, "global_step": 1542, "epoch": 18} {"train_loss": -15.78448486328125, "global_step": 1543, "epoch": 18} {"train_loss": -15.445141792297363, "global_step": 1544, "epoch": 18} {"train_loss": -15.743951797485352, "global_step": 1545, "epoch": 18} {"train_loss": -15.586560249328613, "global_step": 1546, "epoch": 18} {"train_loss": -15.663400650024414, "global_step": 1547, "epoch": 18} {"train_loss": -15.106803894042969, "global_step": 1548, "epoch": 18} {"train_loss": -15.585800170898438, "global_step": 1549, "epoch": 18} {"train_loss": -15.47752857208252, "global_step": 1550, "epoch": 18} {"train_loss": -15.76867389678955, "global_step": 1551, "epoch": 18} {"train_loss": -15.678671836853027, "global_step": 1552, "epoch": 18} {"train_loss": -15.603998184204102, "global_step": 1553, "epoch": 18} {"train_loss": -15.347549438476562, "global_step": 1554, "epoch": 18} {"train_loss": -16.045455932617188, "global_step": 1555, "epoch": 18} {"train_loss": -15.241572380065918, "global_step": 1556, "epoch": 18} {"train_loss": -15.071539878845215, "global_step": 1557, "epoch": 18} {"train_loss": -15.50577449798584, "global_step": 1558, "epoch": 18} {"train_loss": -15.854300498962402, "global_step": 1559, "epoch": 18} {"train_loss": -15.892013549804688, "global_step": 1560, "epoch": 18} {"train_loss": -15.801190376281738, "global_step": 1561, "epoch": 18} {"train_loss": -15.197772026062012, "global_step": 1562, "epoch": 18} {"train_loss": -15.438136100769043, "global_step": 1563, "epoch": 18} {"train_loss": -15.416025161743164, "global_step": 1564, "epoch": 18} {"train_loss": -15.31682014465332, "global_step": 1565, "epoch": 18} {"train_loss": -15.370460510253906, "global_step": 1566, "epoch": 18} {"train_loss": -15.491061210632324, "global_step": 1567, "epoch": 18} {"train_loss": -15.879500389099121, "global_step": 1568, "epoch": 18} {"train_loss": -15.645538330078125, "global_step": 1569, "epoch": 18} {"train_loss": -15.922751426696777, "global_step": 1570, "epoch": 18} {"train_loss": -15.388861656188965, "global_step": 1571, "epoch": 18} {"train_loss": -15.682258605957031, "global_step": 1572, "epoch": 18} {"train_loss": -15.535992622375488, "global_step": 1573, "epoch": 18} {"train_loss": -15.829306602478027, "global_step": 1574, "epoch": 18} {"train_loss": -15.128741264343262, "global_step": 1575, "epoch": 18} {"train_loss": -15.555360817047486, "global_step": 1576, "epoch": 18, "val_loss": 8790864.0} {"train_loss": -15.241194725036621, "global_step": 1577, "epoch": 19} {"train_loss": -15.822290420532227, "global_step": 1578, "epoch": 19} {"train_loss": -15.725346565246582, "global_step": 1579, "epoch": 19} {"train_loss": -15.436373710632324, "global_step": 1580, "epoch": 19} {"train_loss": -15.649786949157715, "global_step": 1581, "epoch": 19} {"train_loss": -15.637824058532715, "global_step": 1582, "epoch": 19} {"train_loss": -15.55302906036377, "global_step": 1583, "epoch": 19} {"train_loss": -15.580789566040039, "global_step": 1584, "epoch": 19} {"train_loss": -15.528903007507324, "global_step": 1585, "epoch": 19} {"train_loss": -15.50253963470459, "global_step": 1586, "epoch": 19} {"train_loss": -15.509124755859375, "global_step": 1587, "epoch": 19} {"train_loss": -15.240277290344238, "global_step": 1588, "epoch": 19} {"train_loss": -15.391006469726562, "global_step": 1589, "epoch": 19} {"train_loss": -15.424914360046387, "global_step": 1590, "epoch": 19} {"train_loss": -15.066986083984375, "global_step": 1591, "epoch": 19} {"train_loss": -15.91771125793457, "global_step": 1592, "epoch": 19} {"train_loss": -15.592065811157227, "global_step": 1593, "epoch": 19} {"train_loss": -15.889813423156738, "global_step": 1594, "epoch": 19} {"train_loss": -15.37454891204834, "global_step": 1595, "epoch": 19} {"train_loss": -15.837448120117188, "global_step": 1596, "epoch": 19} {"train_loss": -15.478446006774902, "global_step": 1597, "epoch": 19} {"train_loss": -15.513522148132324, "global_step": 1598, "epoch": 19} {"train_loss": -15.7373685836792, "global_step": 1599, "epoch": 19} {"train_loss": -15.470393180847168, "global_step": 1600, "epoch": 19} {"train_loss": -15.525924682617188, "global_step": 1601, "epoch": 19} {"train_loss": -15.489944458007812, "global_step": 1602, "epoch": 19} {"train_loss": -15.783503532409668, "global_step": 1603, "epoch": 19} {"train_loss": -15.521811485290527, "global_step": 1604, "epoch": 19} {"train_loss": -15.386781692504883, "global_step": 1605, "epoch": 19} {"train_loss": -15.511052131652832, "global_step": 1606, "epoch": 19} {"train_loss": -15.4203519821167, "global_step": 1607, "epoch": 19} {"train_loss": -15.734341621398926, "global_step": 1608, "epoch": 19} {"train_loss": -15.810763359069824, "global_step": 1609, "epoch": 19} {"train_loss": -15.474807739257812, "global_step": 1610, "epoch": 19} {"train_loss": -15.666226387023926, "global_step": 1611, "epoch": 19} {"train_loss": -15.524866104125977, "global_step": 1612, "epoch": 19} {"train_loss": -15.725836753845215, "global_step": 1613, "epoch": 19} {"train_loss": -15.813531875610352, "global_step": 1614, "epoch": 19} {"train_loss": -15.5450439453125, "global_step": 1615, "epoch": 19} {"train_loss": -15.556225776672363, "global_step": 1616, "epoch": 19} {"train_loss": -15.897656440734863, "global_step": 1617, "epoch": 19} {"train_loss": -15.479888916015625, "global_step": 1618, "epoch": 19} {"train_loss": -15.73276424407959, "global_step": 1619, "epoch": 19} {"train_loss": -15.377128601074219, "global_step": 1620, "epoch": 19} {"train_loss": -15.548869132995605, "global_step": 1621, "epoch": 19} {"train_loss": -15.431988716125488, "global_step": 1622, "epoch": 19} {"train_loss": -16.01051139831543, "global_step": 1623, "epoch": 19} {"train_loss": -15.536730766296387, "global_step": 1624, "epoch": 19} {"train_loss": -15.813281059265137, "global_step": 1625, "epoch": 19} {"train_loss": -15.348421096801758, "global_step": 1626, "epoch": 19} {"train_loss": -15.475630760192871, "global_step": 1627, "epoch": 19} {"train_loss": -15.966961860656738, "global_step": 1628, "epoch": 19} {"train_loss": -15.47393798828125, "global_step": 1629, "epoch": 19} {"train_loss": -15.878649711608887, "global_step": 1630, "epoch": 19} {"train_loss": -15.8673734664917, "global_step": 1631, "epoch": 19} {"train_loss": -15.441800117492676, "global_step": 1632, "epoch": 19} {"train_loss": -15.652384757995605, "global_step": 1633, "epoch": 19} {"train_loss": -15.618464469909668, "global_step": 1634, "epoch": 19} {"train_loss": -14.995017051696777, "global_step": 1635, "epoch": 19} {"train_loss": -15.723733901977539, "global_step": 1636, "epoch": 19} {"train_loss": -16.054330825805664, "global_step": 1637, "epoch": 19} {"train_loss": -15.525717735290527, "global_step": 1638, "epoch": 19} {"train_loss": -15.713465690612793, "global_step": 1639, "epoch": 19} {"train_loss": -15.346402168273926, "global_step": 1640, "epoch": 19} {"train_loss": -15.7568998336792, "global_step": 1641, "epoch": 19} {"train_loss": -15.325575828552246, "global_step": 1642, "epoch": 19} {"train_loss": -15.637145042419434, "global_step": 1643, "epoch": 19} {"train_loss": -15.595425605773926, "global_step": 1644, "epoch": 19} {"train_loss": -15.795092582702637, "global_step": 1645, "epoch": 19} {"train_loss": -16.11233901977539, "global_step": 1646, "epoch": 19} {"train_loss": -15.389081001281738, "global_step": 1647, "epoch": 19} {"train_loss": -15.691901206970215, "global_step": 1648, "epoch": 19} {"train_loss": -15.641085624694824, "global_step": 1649, "epoch": 19} {"train_loss": -15.274029731750488, "global_step": 1650, "epoch": 19} {"train_loss": -15.3728609085083, "global_step": 1651, "epoch": 19} {"train_loss": -15.789405822753906, "global_step": 1652, "epoch": 19} {"train_loss": -15.267730712890625, "global_step": 1653, "epoch": 19} {"train_loss": -15.743499755859375, "global_step": 1654, "epoch": 19} {"train_loss": -15.790336608886719, "global_step": 1655, "epoch": 19} {"train_loss": -15.600333213806152, "global_step": 1656, "epoch": 19} {"train_loss": -15.92479419708252, "global_step": 1657, "epoch": 19} {"train_loss": -16.010583877563477, "global_step": 1658, "epoch": 19} {"train_loss": -15.623180849006378, "global_step": 1659, "epoch": 19, "val_loss": 8436794.0} {"train_loss": -15.135249137878418, "global_step": 1660, "epoch": 20} {"train_loss": -15.189404487609863, "global_step": 1661, "epoch": 20} {"train_loss": -15.481477737426758, "global_step": 1662, "epoch": 20} {"train_loss": -15.770057678222656, "global_step": 1663, "epoch": 20} {"train_loss": -15.290144920349121, "global_step": 1664, "epoch": 20} {"train_loss": -15.228927612304688, "global_step": 1665, "epoch": 20} {"train_loss": -15.330939292907715, "global_step": 1666, "epoch": 20} {"train_loss": -15.299830436706543, "global_step": 1667, "epoch": 20} {"train_loss": -15.575957298278809, "global_step": 1668, "epoch": 20} {"train_loss": -15.38463020324707, "global_step": 1669, "epoch": 20} {"train_loss": -15.2037992477417, "global_step": 1670, "epoch": 20} {"train_loss": -15.750500679016113, "global_step": 1671, "epoch": 20} {"train_loss": -16.004758834838867, "global_step": 1672, "epoch": 20} {"train_loss": -15.347704887390137, "global_step": 1673, "epoch": 20} {"train_loss": -15.6744966506958, "global_step": 1674, "epoch": 20} {"train_loss": -15.628504753112793, "global_step": 1675, "epoch": 20} {"train_loss": -15.54979133605957, "global_step": 1676, "epoch": 20} {"train_loss": -15.553118705749512, "global_step": 1677, "epoch": 20} {"train_loss": -15.233283042907715, "global_step": 1678, "epoch": 20} {"train_loss": -15.744257926940918, "global_step": 1679, "epoch": 20} {"train_loss": -15.74828815460205, "global_step": 1680, "epoch": 20} {"train_loss": -15.491244316101074, "global_step": 1681, "epoch": 20} {"train_loss": -15.844171524047852, "global_step": 1682, "epoch": 20} {"train_loss": -15.390265464782715, "global_step": 1683, "epoch": 20} {"train_loss": -15.514838218688965, "global_step": 1684, "epoch": 20} {"train_loss": -15.890097618103027, "global_step": 1685, "epoch": 20} {"train_loss": -15.850082397460938, "global_step": 1686, "epoch": 20} {"train_loss": -15.615796089172363, "global_step": 1687, "epoch": 20} {"train_loss": -15.585339546203613, "global_step": 1688, "epoch": 20} {"train_loss": -15.610821723937988, "global_step": 1689, "epoch": 20} {"train_loss": -15.281352043151855, "global_step": 1690, "epoch": 20} {"train_loss": -16.01578712463379, "global_step": 1691, "epoch": 20} {"train_loss": -15.779306411743164, "global_step": 1692, "epoch": 20} {"train_loss": -15.74112606048584, "global_step": 1693, "epoch": 20} {"train_loss": -15.79656982421875, "global_step": 1694, "epoch": 20} {"train_loss": -15.833487510681152, "global_step": 1695, "epoch": 20} {"train_loss": -15.959612846374512, "global_step": 1696, "epoch": 20} {"train_loss": -15.659286499023438, "global_step": 1697, "epoch": 20} {"train_loss": -15.725064277648926, "global_step": 1698, "epoch": 20} {"train_loss": -15.191710472106934, "global_step": 1699, "epoch": 20} {"train_loss": -16.091806411743164, "global_step": 1700, "epoch": 20} {"train_loss": -15.652907371520996, "global_step": 1701, "epoch": 20} {"train_loss": -15.918792724609375, "global_step": 1702, "epoch": 20} {"train_loss": -15.859901428222656, "global_step": 1703, "epoch": 20} {"train_loss": -15.827725410461426, "global_step": 1704, "epoch": 20} {"train_loss": -15.445490837097168, "global_step": 1705, "epoch": 20} {"train_loss": -15.78369426727295, "global_step": 1706, "epoch": 20} {"train_loss": -15.526826858520508, "global_step": 1707, "epoch": 20} {"train_loss": -15.505023002624512, "global_step": 1708, "epoch": 20} {"train_loss": -15.619491577148438, "global_step": 1709, "epoch": 20} {"train_loss": -15.68943977355957, "global_step": 1710, "epoch": 20} {"train_loss": -16.087581634521484, "global_step": 1711, "epoch": 20} {"train_loss": -15.416857719421387, "global_step": 1712, "epoch": 20} {"train_loss": -15.702319145202637, "global_step": 1713, "epoch": 20} {"train_loss": -15.355325698852539, "global_step": 1714, "epoch": 20} {"train_loss": -15.50016975402832, "global_step": 1715, "epoch": 20} {"train_loss": -15.839431762695312, "global_step": 1716, "epoch": 20} {"train_loss": -15.70810604095459, "global_step": 1717, "epoch": 20} {"train_loss": -15.475674629211426, "global_step": 1718, "epoch": 20} {"train_loss": -15.437642097473145, "global_step": 1719, "epoch": 20} {"train_loss": -16.158897399902344, "global_step": 1720, "epoch": 20} {"train_loss": -15.86798095703125, "global_step": 1721, "epoch": 20} {"train_loss": -15.917343139648438, "global_step": 1722, "epoch": 20} {"train_loss": -15.7050199508667, "global_step": 1723, "epoch": 20} {"train_loss": -15.307408332824707, "global_step": 1724, "epoch": 20} {"train_loss": -16.006223678588867, "global_step": 1725, "epoch": 20} {"train_loss": -15.887812614440918, "global_step": 1726, "epoch": 20} {"train_loss": -15.77375316619873, "global_step": 1727, "epoch": 20} {"train_loss": -16.090747833251953, "global_step": 1728, "epoch": 20} {"train_loss": -15.602118492126465, "global_step": 1729, "epoch": 20} {"train_loss": -15.847384452819824, "global_step": 1730, "epoch": 20} {"train_loss": -15.809249877929688, "global_step": 1731, "epoch": 20} {"train_loss": -15.765179634094238, "global_step": 1732, "epoch": 20} {"train_loss": -16.098255157470703, "global_step": 1733, "epoch": 20} {"train_loss": -15.706610679626465, "global_step": 1734, "epoch": 20} {"train_loss": -16.135889053344727, "global_step": 1735, "epoch": 20} {"train_loss": -15.822641372680664, "global_step": 1736, "epoch": 20} {"train_loss": -15.34094524383545, "global_step": 1737, "epoch": 20} {"train_loss": -15.46739673614502, "global_step": 1738, "epoch": 20} {"train_loss": -15.679898262023926, "global_step": 1739, "epoch": 20} {"train_loss": -15.989455223083496, "global_step": 1740, "epoch": 20} {"train_loss": -15.40812873840332, "global_step": 1741, "epoch": 20} {"train_loss": -15.651131262262183, "global_step": 1742, "epoch": 20, "val_loss": 8290580.5} {"train_loss": -15.777816772460938, "global_step": 1743, "epoch": 21} {"train_loss": -15.661259651184082, "global_step": 1744, "epoch": 21} {"train_loss": -15.525970458984375, "global_step": 1745, "epoch": 21} {"train_loss": -15.496788024902344, "global_step": 1746, "epoch": 21} {"train_loss": -15.785890579223633, "global_step": 1747, "epoch": 21} {"train_loss": -15.836297988891602, "global_step": 1748, "epoch": 21} {"train_loss": -15.640955924987793, "global_step": 1749, "epoch": 21} {"train_loss": -15.789384841918945, "global_step": 1750, "epoch": 21} {"train_loss": -15.7184419631958, "global_step": 1751, "epoch": 21} {"train_loss": -15.634894371032715, "global_step": 1752, "epoch": 21} {"train_loss": -15.509485244750977, "global_step": 1753, "epoch": 21} {"train_loss": -15.667337417602539, "global_step": 1754, "epoch": 21} {"train_loss": -15.694162368774414, "global_step": 1755, "epoch": 21} {"train_loss": -15.743524551391602, "global_step": 1756, "epoch": 21} {"train_loss": -15.30853271484375, "global_step": 1757, "epoch": 21} {"train_loss": -15.445777893066406, "global_step": 1758, "epoch": 21} {"train_loss": -15.655441284179688, "global_step": 1759, "epoch": 21} {"train_loss": -15.392931938171387, "global_step": 1760, "epoch": 21} {"train_loss": -15.87219524383545, "global_step": 1761, "epoch": 21} {"train_loss": -15.909710884094238, "global_step": 1762, "epoch": 21} {"train_loss": -15.527521133422852, "global_step": 1763, "epoch": 21} {"train_loss": -15.658859252929688, "global_step": 1764, "epoch": 21} {"train_loss": -15.732699394226074, "global_step": 1765, "epoch": 21} {"train_loss": -15.76072883605957, "global_step": 1766, "epoch": 21} {"train_loss": -15.79477596282959, "global_step": 1767, "epoch": 21} {"train_loss": -16.02385139465332, "global_step": 1768, "epoch": 21} {"train_loss": -15.663284301757812, "global_step": 1769, "epoch": 21} {"train_loss": -15.621515274047852, "global_step": 1770, "epoch": 21} {"train_loss": -15.840533256530762, "global_step": 1771, "epoch": 21} {"train_loss": -15.226022720336914, "global_step": 1772, "epoch": 21} {"train_loss": -15.937997817993164, "global_step": 1773, "epoch": 21} {"train_loss": -15.529083251953125, "global_step": 1774, "epoch": 21} {"train_loss": -15.606099128723145, "global_step": 1775, "epoch": 21} {"train_loss": -15.872797012329102, "global_step": 1776, "epoch": 21} {"train_loss": -15.905667304992676, "global_step": 1777, "epoch": 21} {"train_loss": -15.968828201293945, "global_step": 1778, "epoch": 21} {"train_loss": -15.473258018493652, "global_step": 1779, "epoch": 21} {"train_loss": -15.793120384216309, "global_step": 1780, "epoch": 21} {"train_loss": -15.672999382019043, "global_step": 1781, "epoch": 21} {"train_loss": -15.451178550720215, "global_step": 1782, "epoch": 21} {"train_loss": -16.014150619506836, "global_step": 1783, "epoch": 21} {"train_loss": -15.838793754577637, "global_step": 1784, "epoch": 21} {"train_loss": -15.684653282165527, "global_step": 1785, "epoch": 21} {"train_loss": -16.24217414855957, "global_step": 1786, "epoch": 21} {"train_loss": -15.706491470336914, "global_step": 1787, "epoch": 21} {"train_loss": -15.925536155700684, "global_step": 1788, "epoch": 21} {"train_loss": -16.061786651611328, "global_step": 1789, "epoch": 21} {"train_loss": -16.02142333984375, "global_step": 1790, "epoch": 21} {"train_loss": -15.788986206054688, "global_step": 1791, "epoch": 21} {"train_loss": -15.925918579101562, "global_step": 1792, "epoch": 21} {"train_loss": -15.949957847595215, "global_step": 1793, "epoch": 21} {"train_loss": -15.89151668548584, "global_step": 1794, "epoch": 21} {"train_loss": -16.18070411682129, "global_step": 1795, "epoch": 21} {"train_loss": -15.126309394836426, "global_step": 1796, "epoch": 21} {"train_loss": -15.852096557617188, "global_step": 1797, "epoch": 21} {"train_loss": -16.02721405029297, "global_step": 1798, "epoch": 21} {"train_loss": -15.850438117980957, "global_step": 1799, "epoch": 21} {"train_loss": -15.943330764770508, "global_step": 1800, "epoch": 21} {"train_loss": -15.757287979125977, "global_step": 1801, "epoch": 21} {"train_loss": -15.444047927856445, "global_step": 1802, "epoch": 21} {"train_loss": -15.600836753845215, "global_step": 1803, "epoch": 21} {"train_loss": -15.705283164978027, "global_step": 1804, "epoch": 21} {"train_loss": -15.723367691040039, "global_step": 1805, "epoch": 21} {"train_loss": -15.478418350219727, "global_step": 1806, "epoch": 21} {"train_loss": -15.973380088806152, "global_step": 1807, "epoch": 21} {"train_loss": -15.995465278625488, "global_step": 1808, "epoch": 21} {"train_loss": -16.01777458190918, "global_step": 1809, "epoch": 21} {"train_loss": -16.005361557006836, "global_step": 1810, "epoch": 21} {"train_loss": -15.844046592712402, "global_step": 1811, "epoch": 21} {"train_loss": -15.819592475891113, "global_step": 1812, "epoch": 21} {"train_loss": -15.644217491149902, "global_step": 1813, "epoch": 21} {"train_loss": -15.364447593688965, "global_step": 1814, "epoch": 21} {"train_loss": -15.670051574707031, "global_step": 1815, "epoch": 21} {"train_loss": -15.53235149383545, "global_step": 1816, "epoch": 21} {"train_loss": -16.01099967956543, "global_step": 1817, "epoch": 21} {"train_loss": -15.66613483428955, "global_step": 1818, "epoch": 21} {"train_loss": -15.949307441711426, "global_step": 1819, "epoch": 21} {"train_loss": -15.501708030700684, "global_step": 1820, "epoch": 21} {"train_loss": -16.062923431396484, "global_step": 1821, "epoch": 21} {"train_loss": -15.50914478302002, "global_step": 1822, "epoch": 21} {"train_loss": -15.942026138305664, "global_step": 1823, "epoch": 21} {"train_loss": -15.518736839294434, "global_step": 1824, "epoch": 21} {"train_loss": -15.744229385651737, "global_step": 1825, "epoch": 21, "val_loss": 8125925.0} {"train_loss": -15.148874282836914, "global_step": 1826, "epoch": 22} {"train_loss": -16.04416275024414, "global_step": 1827, "epoch": 22} {"train_loss": -15.981654167175293, "global_step": 1828, "epoch": 22} {"train_loss": -15.768475532531738, "global_step": 1829, "epoch": 22} {"train_loss": -15.750704765319824, "global_step": 1830, "epoch": 22} {"train_loss": -15.345003128051758, "global_step": 1831, "epoch": 22} {"train_loss": -16.0238094329834, "global_step": 1832, "epoch": 22} {"train_loss": -15.904492378234863, "global_step": 1833, "epoch": 22} {"train_loss": -16.30306053161621, "global_step": 1834, "epoch": 22} {"train_loss": -16.012380599975586, "global_step": 1835, "epoch": 22} {"train_loss": -15.810661315917969, "global_step": 1836, "epoch": 22} {"train_loss": -16.018207550048828, "global_step": 1837, "epoch": 22} {"train_loss": -15.72099781036377, "global_step": 1838, "epoch": 22} {"train_loss": -15.836374282836914, "global_step": 1839, "epoch": 22} {"train_loss": -15.80548095703125, "global_step": 1840, "epoch": 22} {"train_loss": -15.56096363067627, "global_step": 1841, "epoch": 22} {"train_loss": -15.780611038208008, "global_step": 1842, "epoch": 22} {"train_loss": -14.938891410827637, "global_step": 1843, "epoch": 22} {"train_loss": -15.882043838500977, "global_step": 1844, "epoch": 22} {"train_loss": -15.587666511535645, "global_step": 1845, "epoch": 22} {"train_loss": -15.560961723327637, "global_step": 1846, "epoch": 22} {"train_loss": -15.29077434539795, "global_step": 1847, "epoch": 22} {"train_loss": -15.851602554321289, "global_step": 1848, "epoch": 22} {"train_loss": -15.681323051452637, "global_step": 1849, "epoch": 22} {"train_loss": -15.865099906921387, "global_step": 1850, "epoch": 22} {"train_loss": -15.796027183532715, "global_step": 1851, "epoch": 22} {"train_loss": -16.00453758239746, "global_step": 1852, "epoch": 22} {"train_loss": -15.504404067993164, "global_step": 1853, "epoch": 22} {"train_loss": -15.613580703735352, "global_step": 1854, "epoch": 22} {"train_loss": -15.613608360290527, "global_step": 1855, "epoch": 22} {"train_loss": -15.730262756347656, "global_step": 1856, "epoch": 22} {"train_loss": -16.010913848876953, "global_step": 1857, "epoch": 22} {"train_loss": -15.617667198181152, "global_step": 1858, "epoch": 22} {"train_loss": -15.966238975524902, "global_step": 1859, "epoch": 22} {"train_loss": -15.99628734588623, "global_step": 1860, "epoch": 22} {"train_loss": -15.844611167907715, "global_step": 1861, "epoch": 22} {"train_loss": -15.591211318969727, "global_step": 1862, "epoch": 22} {"train_loss": -15.867120742797852, "global_step": 1863, "epoch": 22} {"train_loss": -15.666098594665527, "global_step": 1864, "epoch": 22} {"train_loss": -16.185707092285156, "global_step": 1865, "epoch": 22} {"train_loss": -15.928458213806152, "global_step": 1866, "epoch": 22} {"train_loss": -15.374963760375977, "global_step": 1867, "epoch": 22} {"train_loss": -15.890945434570312, "global_step": 1868, "epoch": 22} {"train_loss": -15.477513313293457, "global_step": 1869, "epoch": 22} {"train_loss": -16.05416488647461, "global_step": 1870, "epoch": 22} {"train_loss": -15.855422973632812, "global_step": 1871, "epoch": 22} {"train_loss": -15.652668952941895, "global_step": 1872, "epoch": 22} {"train_loss": -15.80908203125, "global_step": 1873, "epoch": 22} {"train_loss": -15.777815818786621, "global_step": 1874, "epoch": 22} {"train_loss": -15.789239883422852, "global_step": 1875, "epoch": 22} {"train_loss": -15.946809768676758, "global_step": 1876, "epoch": 22} {"train_loss": -15.935495376586914, "global_step": 1877, "epoch": 22} {"train_loss": -15.579248428344727, "global_step": 1878, "epoch": 22} {"train_loss": -16.140893936157227, "global_step": 1879, "epoch": 22} {"train_loss": -15.936495780944824, "global_step": 1880, "epoch": 22} {"train_loss": -15.881834983825684, "global_step": 1881, "epoch": 22} {"train_loss": -15.738090515136719, "global_step": 1882, "epoch": 22} {"train_loss": -16.11122703552246, "global_step": 1883, "epoch": 22} {"train_loss": -15.768332481384277, "global_step": 1884, "epoch": 22} {"train_loss": -15.846747398376465, "global_step": 1885, "epoch": 22} {"train_loss": -15.822066307067871, "global_step": 1886, "epoch": 22} {"train_loss": -15.784625053405762, "global_step": 1887, "epoch": 22} {"train_loss": -16.070270538330078, "global_step": 1888, "epoch": 22} {"train_loss": -15.824450492858887, "global_step": 1889, "epoch": 22} {"train_loss": -16.121585845947266, "global_step": 1890, "epoch": 22} {"train_loss": -15.536709785461426, "global_step": 1891, "epoch": 22} {"train_loss": -15.903225898742676, "global_step": 1892, "epoch": 22} {"train_loss": -15.670554161071777, "global_step": 1893, "epoch": 22} {"train_loss": -15.925091743469238, "global_step": 1894, "epoch": 22} {"train_loss": -15.811172485351562, "global_step": 1895, "epoch": 22} {"train_loss": -15.853957176208496, "global_step": 1896, "epoch": 22} {"train_loss": -15.817855834960938, "global_step": 1897, "epoch": 22} {"train_loss": -15.884042739868164, "global_step": 1898, "epoch": 22} {"train_loss": -15.822664260864258, "global_step": 1899, "epoch": 22} {"train_loss": -15.836685180664062, "global_step": 1900, "epoch": 22} {"train_loss": -15.963220596313477, "global_step": 1901, "epoch": 22} {"train_loss": -15.883615493774414, "global_step": 1902, "epoch": 22} {"train_loss": -15.790928840637207, "global_step": 1903, "epoch": 22} {"train_loss": -16.15777015686035, "global_step": 1904, "epoch": 22} {"train_loss": -15.821512222290039, "global_step": 1905, "epoch": 22} {"train_loss": -15.769970893859863, "global_step": 1906, "epoch": 22} {"train_loss": -15.766357421875, "global_step": 1907, "epoch": 22} {"train_loss": -15.811405101454401, "global_step": 1908, "epoch": 22, "val_loss": 8000362.0} {"train_loss": -15.858833312988281, "global_step": 1909, "epoch": 23} {"train_loss": -16.034900665283203, "global_step": 1910, "epoch": 23} {"train_loss": -15.437491416931152, "global_step": 1911, "epoch": 23} {"train_loss": -15.805304527282715, "global_step": 1912, "epoch": 23} {"train_loss": -16.086139678955078, "global_step": 1913, "epoch": 23} {"train_loss": -15.872398376464844, "global_step": 1914, "epoch": 23} {"train_loss": -15.7651948928833, "global_step": 1915, "epoch": 23} {"train_loss": -15.689801216125488, "global_step": 1916, "epoch": 23} {"train_loss": -15.758414268493652, "global_step": 1917, "epoch": 23} {"train_loss": -15.606103897094727, "global_step": 1918, "epoch": 23} {"train_loss": -15.644125938415527, "global_step": 1919, "epoch": 23} {"train_loss": -15.81189250946045, "global_step": 1920, "epoch": 23} {"train_loss": -15.990121841430664, "global_step": 1921, "epoch": 23} {"train_loss": -15.47636604309082, "global_step": 1922, "epoch": 23} {"train_loss": -15.854208946228027, "global_step": 1923, "epoch": 23} {"train_loss": -15.622942924499512, "global_step": 1924, "epoch": 23} {"train_loss": -16.5074462890625, "global_step": 1925, "epoch": 23} {"train_loss": -15.583523750305176, "global_step": 1926, "epoch": 23} {"train_loss": -15.921905517578125, "global_step": 1927, "epoch": 23} {"train_loss": -16.18160057067871, "global_step": 1928, "epoch": 23} {"train_loss": -15.6113862991333, "global_step": 1929, "epoch": 23} {"train_loss": -15.910659790039062, "global_step": 1930, "epoch": 23} {"train_loss": -15.95465087890625, "global_step": 1931, "epoch": 23} {"train_loss": -15.699853897094727, "global_step": 1932, "epoch": 23} {"train_loss": -15.644006729125977, "global_step": 1933, "epoch": 23} {"train_loss": -15.644792556762695, "global_step": 1934, "epoch": 23} {"train_loss": -15.855348587036133, "global_step": 1935, "epoch": 23} {"train_loss": -15.508746147155762, "global_step": 1936, "epoch": 23} {"train_loss": -15.760481834411621, "global_step": 1937, "epoch": 23} {"train_loss": -15.709149360656738, "global_step": 1938, "epoch": 23} {"train_loss": -15.378802299499512, "global_step": 1939, "epoch": 23} {"train_loss": -15.485383987426758, "global_step": 1940, "epoch": 23} {"train_loss": -15.929120063781738, "global_step": 1941, "epoch": 23} {"train_loss": -15.911337852478027, "global_step": 1942, "epoch": 23} {"train_loss": -15.728201866149902, "global_step": 1943, "epoch": 23} {"train_loss": -16.426681518554688, "global_step": 1944, "epoch": 23} {"train_loss": -15.736846923828125, "global_step": 1945, "epoch": 23} {"train_loss": -16.150999069213867, "global_step": 1946, "epoch": 23} {"train_loss": -15.860997200012207, "global_step": 1947, "epoch": 23} {"train_loss": -15.984509468078613, "global_step": 1948, "epoch": 23} {"train_loss": -15.4181489944458, "global_step": 1949, "epoch": 23} {"train_loss": -15.952252388000488, "global_step": 1950, "epoch": 23} {"train_loss": -15.739108085632324, "global_step": 1951, "epoch": 23} {"train_loss": -15.819941520690918, "global_step": 1952, "epoch": 23} {"train_loss": -15.41778564453125, "global_step": 1953, "epoch": 23} {"train_loss": -15.847149848937988, "global_step": 1954, "epoch": 23} {"train_loss": -15.816781997680664, "global_step": 1955, "epoch": 23} {"train_loss": -16.020263671875, "global_step": 1956, "epoch": 23} {"train_loss": -16.0555477142334, "global_step": 1957, "epoch": 23} {"train_loss": -15.566702842712402, "global_step": 1958, "epoch": 23} {"train_loss": -15.993494033813477, "global_step": 1959, "epoch": 23} {"train_loss": -15.483477592468262, "global_step": 1960, "epoch": 23} {"train_loss": -15.858670234680176, "global_step": 1961, "epoch": 23} {"train_loss": -15.352633476257324, "global_step": 1962, "epoch": 23} {"train_loss": -15.76605224609375, "global_step": 1963, "epoch": 23} {"train_loss": -15.885283470153809, "global_step": 1964, "epoch": 23} {"train_loss": -15.946733474731445, "global_step": 1965, "epoch": 23} {"train_loss": -15.878287315368652, "global_step": 1966, "epoch": 23} {"train_loss": -15.78088092803955, "global_step": 1967, "epoch": 23} {"train_loss": -16.052814483642578, "global_step": 1968, "epoch": 23} {"train_loss": -15.726373672485352, "global_step": 1969, "epoch": 23} {"train_loss": -15.746722221374512, "global_step": 1970, "epoch": 23} {"train_loss": -15.638165473937988, "global_step": 1971, "epoch": 23} {"train_loss": -15.77048397064209, "global_step": 1972, "epoch": 23} {"train_loss": -15.492350578308105, "global_step": 1973, "epoch": 23} {"train_loss": -15.699029922485352, "global_step": 1974, "epoch": 23} {"train_loss": -16.052066802978516, "global_step": 1975, "epoch": 23} {"train_loss": -15.578167915344238, "global_step": 1976, "epoch": 23} {"train_loss": -15.786447525024414, "global_step": 1977, "epoch": 23} {"train_loss": -16.09578514099121, "global_step": 1978, "epoch": 23} {"train_loss": -16.01823616027832, "global_step": 1979, "epoch": 23} {"train_loss": -15.582797050476074, "global_step": 1980, "epoch": 23} {"train_loss": -15.970858573913574, "global_step": 1981, "epoch": 23} {"train_loss": -15.89987850189209, "global_step": 1982, "epoch": 23} {"train_loss": -15.795297622680664, "global_step": 1983, "epoch": 23} {"train_loss": -15.59769344329834, "global_step": 1984, "epoch": 23} {"train_loss": -16.047712326049805, "global_step": 1985, "epoch": 23} {"train_loss": -16.032499313354492, "global_step": 1986, "epoch": 23} {"train_loss": -15.925036430358887, "global_step": 1987, "epoch": 23} {"train_loss": -15.992929458618164, "global_step": 1988, "epoch": 23} {"train_loss": -16.356220245361328, "global_step": 1989, "epoch": 23} {"train_loss": -15.884918212890625, "global_step": 1990, "epoch": 23} {"train_loss": -15.814257541334772, "global_step": 1991, "epoch": 23, "val_loss": 8093486.0} {"train_loss": -15.728116035461426, "global_step": 1992, "epoch": 24} {"train_loss": -15.820563316345215, "global_step": 1993, "epoch": 24} {"train_loss": -15.887771606445312, "global_step": 1994, "epoch": 24} {"train_loss": -15.823864936828613, "global_step": 1995, "epoch": 24} {"train_loss": -16.083637237548828, "global_step": 1996, "epoch": 24} {"train_loss": -15.69487190246582, "global_step": 1997, "epoch": 24} {"train_loss": -15.581494331359863, "global_step": 1998, "epoch": 24} {"train_loss": -15.94016170501709, "global_step": 1999, "epoch": 24} {"train_loss": -15.651483535766602, "global_step": 2000, "epoch": 24} {"train_loss": -15.716005325317383, "global_step": 2001, "epoch": 24} {"train_loss": -16.314462661743164, "global_step": 2002, "epoch": 24} {"train_loss": -16.07413101196289, "global_step": 2003, "epoch": 24} {"train_loss": -15.854840278625488, "global_step": 2004, "epoch": 24} {"train_loss": -15.764662742614746, "global_step": 2005, "epoch": 24} {"train_loss": -15.86731243133545, "global_step": 2006, "epoch": 24} {"train_loss": -15.955151557922363, "global_step": 2007, "epoch": 24} {"train_loss": -15.752410888671875, "global_step": 2008, "epoch": 24} {"train_loss": -15.552664756774902, "global_step": 2009, "epoch": 24} {"train_loss": -16.115453720092773, "global_step": 2010, "epoch": 24} {"train_loss": -15.965008735656738, "global_step": 2011, "epoch": 24} {"train_loss": -15.646202087402344, "global_step": 2012, "epoch": 24} {"train_loss": -15.818979263305664, "global_step": 2013, "epoch": 24} {"train_loss": -15.845077514648438, "global_step": 2014, "epoch": 24} {"train_loss": -15.432734489440918, "global_step": 2015, "epoch": 24} {"train_loss": -15.791444778442383, "global_step": 2016, "epoch": 24} {"train_loss": -15.688931465148926, "global_step": 2017, "epoch": 24} {"train_loss": -16.13856315612793, "global_step": 2018, "epoch": 24} {"train_loss": -15.86816692352295, "global_step": 2019, "epoch": 24} {"train_loss": -15.803071975708008, "global_step": 2020, "epoch": 24} {"train_loss": -15.815431594848633, "global_step": 2021, "epoch": 24} {"train_loss": -15.81701374053955, "global_step": 2022, "epoch": 24} {"train_loss": -15.712725639343262, "global_step": 2023, "epoch": 24} {"train_loss": -15.90516185760498, "global_step": 2024, "epoch": 24} {"train_loss": -16.04804039001465, "global_step": 2025, "epoch": 24} {"train_loss": -15.364280700683594, "global_step": 2026, "epoch": 24} {"train_loss": -15.716361045837402, "global_step": 2027, "epoch": 24} {"train_loss": -15.972061157226562, "global_step": 2028, "epoch": 24} {"train_loss": -15.628680229187012, "global_step": 2029, "epoch": 24} {"train_loss": -15.937762260437012, "global_step": 2030, "epoch": 24} {"train_loss": -15.731833457946777, "global_step": 2031, "epoch": 24} {"train_loss": -15.751025199890137, "global_step": 2032, "epoch": 24} {"train_loss": -15.989114761352539, "global_step": 2033, "epoch": 24} {"train_loss": -15.717065811157227, "global_step": 2034, "epoch": 24} {"train_loss": -15.747000694274902, "global_step": 2035, "epoch": 24} {"train_loss": -15.620999336242676, "global_step": 2036, "epoch": 24} {"train_loss": -15.77546215057373, "global_step": 2037, "epoch": 24} {"train_loss": -15.909422874450684, "global_step": 2038, "epoch": 24} {"train_loss": -15.747845649719238, "global_step": 2039, "epoch": 24} {"train_loss": -15.848238945007324, "global_step": 2040, "epoch": 24} {"train_loss": -15.907748222351074, "global_step": 2041, "epoch": 24} {"train_loss": -15.814663887023926, "global_step": 2042, "epoch": 24} {"train_loss": -16.188785552978516, "global_step": 2043, "epoch": 24} {"train_loss": -16.024351119995117, "global_step": 2044, "epoch": 24} {"train_loss": -15.819757461547852, "global_step": 2045, "epoch": 24} {"train_loss": -16.400535583496094, "global_step": 2046, "epoch": 24} {"train_loss": -16.075368881225586, "global_step": 2047, "epoch": 24} {"train_loss": -15.8839750289917, "global_step": 2048, "epoch": 24} {"train_loss": -16.345319747924805, "global_step": 2049, "epoch": 24} {"train_loss": -15.892184257507324, "global_step": 2050, "epoch": 24} {"train_loss": -16.288549423217773, "global_step": 2051, "epoch": 24} {"train_loss": -15.908818244934082, "global_step": 2052, "epoch": 24} {"train_loss": -15.959274291992188, "global_step": 2053, "epoch": 24} {"train_loss": -16.15243911743164, "global_step": 2054, "epoch": 24} {"train_loss": -16.273849487304688, "global_step": 2055, "epoch": 24} {"train_loss": -16.020788192749023, "global_step": 2056, "epoch": 24} {"train_loss": -15.484301567077637, "global_step": 2057, "epoch": 24} {"train_loss": -15.79997444152832, "global_step": 2058, "epoch": 24} {"train_loss": -16.10694122314453, "global_step": 2059, "epoch": 24} {"train_loss": -16.004484176635742, "global_step": 2060, "epoch": 24} {"train_loss": -15.886771202087402, "global_step": 2061, "epoch": 24} {"train_loss": -15.903613090515137, "global_step": 2062, "epoch": 24} {"train_loss": -16.096452713012695, "global_step": 2063, "epoch": 24} {"train_loss": -16.073049545288086, "global_step": 2064, "epoch": 24} {"train_loss": -15.877707481384277, "global_step": 2065, "epoch": 24} {"train_loss": -15.694262504577637, "global_step": 2066, "epoch": 24} {"train_loss": -16.008426666259766, "global_step": 2067, "epoch": 24} {"train_loss": -16.198863983154297, "global_step": 2068, "epoch": 24} {"train_loss": -16.35416603088379, "global_step": 2069, "epoch": 24} {"train_loss": -16.185224533081055, "global_step": 2070, "epoch": 24} {"train_loss": -16.10100555419922, "global_step": 2071, "epoch": 24} {"train_loss": -16.03557777404785, "global_step": 2072, "epoch": 24} {"train_loss": -15.916953086853027, "global_step": 2073, "epoch": 24} {"train_loss": -15.894047645201166, "global_step": 2074, "epoch": 24, "val_loss": 7819275.0} {"train_loss": -16.36625099182129, "global_step": 2075, "epoch": 25} {"train_loss": -15.719461441040039, "global_step": 2076, "epoch": 25} {"train_loss": -15.989450454711914, "global_step": 2077, "epoch": 25} {"train_loss": -15.731955528259277, "global_step": 2078, "epoch": 25} {"train_loss": -15.333131790161133, "global_step": 2079, "epoch": 25} {"train_loss": -15.955790519714355, "global_step": 2080, "epoch": 25} {"train_loss": -15.721506118774414, "global_step": 2081, "epoch": 25} {"train_loss": -15.99585247039795, "global_step": 2082, "epoch": 25} {"train_loss": -15.804484367370605, "global_step": 2083, "epoch": 25} {"train_loss": -15.852765083312988, "global_step": 2084, "epoch": 25} {"train_loss": -16.28091812133789, "global_step": 2085, "epoch": 25} {"train_loss": -15.834063529968262, "global_step": 2086, "epoch": 25} {"train_loss": -16.11945152282715, "global_step": 2087, "epoch": 25} {"train_loss": -16.241241455078125, "global_step": 2088, "epoch": 25} {"train_loss": -16.13079261779785, "global_step": 2089, "epoch": 25} {"train_loss": -15.93761157989502, "global_step": 2090, "epoch": 25} {"train_loss": -16.11366844177246, "global_step": 2091, "epoch": 25} {"train_loss": -15.87231731414795, "global_step": 2092, "epoch": 25} {"train_loss": -15.876733779907227, "global_step": 2093, "epoch": 25} {"train_loss": -15.897193908691406, "global_step": 2094, "epoch": 25} {"train_loss": -15.801068305969238, "global_step": 2095, "epoch": 25} {"train_loss": -16.081195831298828, "global_step": 2096, "epoch": 25} {"train_loss": -16.228395462036133, "global_step": 2097, "epoch": 25} {"train_loss": -15.665936470031738, "global_step": 2098, "epoch": 25} {"train_loss": -15.977396965026855, "global_step": 2099, "epoch": 25} {"train_loss": -16.2122745513916, "global_step": 2100, "epoch": 25} {"train_loss": -15.907198905944824, "global_step": 2101, "epoch": 25} {"train_loss": -15.715062141418457, "global_step": 2102, "epoch": 25} {"train_loss": -15.957237243652344, "global_step": 2103, "epoch": 25} {"train_loss": -16.07508659362793, "global_step": 2104, "epoch": 25} {"train_loss": -15.800027847290039, "global_step": 2105, "epoch": 25} {"train_loss": -15.624533653259277, "global_step": 2106, "epoch": 25} {"train_loss": -15.795343399047852, "global_step": 2107, "epoch": 25} {"train_loss": -15.730979919433594, "global_step": 2108, "epoch": 25} {"train_loss": -15.9520902633667, "global_step": 2109, "epoch": 25} {"train_loss": -15.954913139343262, "global_step": 2110, "epoch": 25} {"train_loss": -16.333932876586914, "global_step": 2111, "epoch": 25} {"train_loss": -15.991029739379883, "global_step": 2112, "epoch": 25} {"train_loss": -16.13308334350586, "global_step": 2113, "epoch": 25} {"train_loss": -15.802653312683105, "global_step": 2114, "epoch": 25} {"train_loss": -16.031734466552734, "global_step": 2115, "epoch": 25} {"train_loss": -15.936538696289062, "global_step": 2116, "epoch": 25} {"train_loss": -15.957354545593262, "global_step": 2117, "epoch": 25} {"train_loss": -15.504633903503418, "global_step": 2118, "epoch": 25} {"train_loss": -16.206632614135742, "global_step": 2119, "epoch": 25} {"train_loss": -16.196298599243164, "global_step": 2120, "epoch": 25} {"train_loss": -15.801318168640137, "global_step": 2121, "epoch": 25} {"train_loss": -15.843817710876465, "global_step": 2122, "epoch": 25} {"train_loss": -15.944429397583008, "global_step": 2123, "epoch": 25} {"train_loss": -15.8405122756958, "global_step": 2124, "epoch": 25} {"train_loss": -15.987899780273438, "global_step": 2125, "epoch": 25} {"train_loss": -15.535811424255371, "global_step": 2126, "epoch": 25} {"train_loss": -15.958000183105469, "global_step": 2127, "epoch": 25} {"train_loss": -15.955473899841309, "global_step": 2128, "epoch": 25} {"train_loss": -15.763910293579102, "global_step": 2129, "epoch": 25} {"train_loss": -16.432523727416992, "global_step": 2130, "epoch": 25} {"train_loss": -15.983100891113281, "global_step": 2131, "epoch": 25} {"train_loss": -16.089414596557617, "global_step": 2132, "epoch": 25} {"train_loss": -15.753206253051758, "global_step": 2133, "epoch": 25} {"train_loss": -15.572070121765137, "global_step": 2134, "epoch": 25} {"train_loss": -16.26405143737793, "global_step": 2135, "epoch": 25} {"train_loss": -16.251625061035156, "global_step": 2136, "epoch": 25} {"train_loss": -16.169904708862305, "global_step": 2137, "epoch": 25} {"train_loss": -15.965927124023438, "global_step": 2138, "epoch": 25} {"train_loss": -15.467328071594238, "global_step": 2139, "epoch": 25} {"train_loss": -15.79113483428955, "global_step": 2140, "epoch": 25} {"train_loss": -15.735394477844238, "global_step": 2141, "epoch": 25} {"train_loss": -15.889262199401855, "global_step": 2142, "epoch": 25} {"train_loss": -15.922749519348145, "global_step": 2143, "epoch": 25} {"train_loss": -16.02666664123535, "global_step": 2144, "epoch": 25} {"train_loss": -16.39212989807129, "global_step": 2145, "epoch": 25} {"train_loss": -16.056379318237305, "global_step": 2146, "epoch": 25} {"train_loss": -15.642813682556152, "global_step": 2147, "epoch": 25} {"train_loss": -16.17498779296875, "global_step": 2148, "epoch": 25} {"train_loss": -15.63287353515625, "global_step": 2149, "epoch": 25} {"train_loss": -15.52780818939209, "global_step": 2150, "epoch": 25} {"train_loss": -16.2852725982666, "global_step": 2151, "epoch": 25} {"train_loss": -16.228315353393555, "global_step": 2152, "epoch": 25} {"train_loss": -15.797037124633789, "global_step": 2153, "epoch": 25} {"train_loss": -16.290729522705078, "global_step": 2154, "epoch": 25} {"train_loss": -15.877062797546387, "global_step": 2155, "epoch": 25} {"train_loss": -16.122560501098633, "global_step": 2156, "epoch": 25} {"train_loss": -15.919958413365375, "global_step": 2157, "epoch": 25, "val_loss": 7664328.5} {"train_loss": -16.04840850830078, "global_step": 2158, "epoch": 26} {"train_loss": -15.875981330871582, "global_step": 2159, "epoch": 26} {"train_loss": -16.021467208862305, "global_step": 2160, "epoch": 26} {"train_loss": -15.780829429626465, "global_step": 2161, "epoch": 26} {"train_loss": -15.841925621032715, "global_step": 2162, "epoch": 26} {"train_loss": -15.823147773742676, "global_step": 2163, "epoch": 26} {"train_loss": -16.065221786499023, "global_step": 2164, "epoch": 26} {"train_loss": -16.03275489807129, "global_step": 2165, "epoch": 26} {"train_loss": -15.717467308044434, "global_step": 2166, "epoch": 26} {"train_loss": -15.879632949829102, "global_step": 2167, "epoch": 26} {"train_loss": -15.724327087402344, "global_step": 2168, "epoch": 26} {"train_loss": -16.445348739624023, "global_step": 2169, "epoch": 26} {"train_loss": -15.868023872375488, "global_step": 2170, "epoch": 26} {"train_loss": -16.06345558166504, "global_step": 2171, "epoch": 26} {"train_loss": -16.137041091918945, "global_step": 2172, "epoch": 26} {"train_loss": -15.853545188903809, "global_step": 2173, "epoch": 26} {"train_loss": -15.843500137329102, "global_step": 2174, "epoch": 26} {"train_loss": -15.6481351852417, "global_step": 2175, "epoch": 26} {"train_loss": -15.80841064453125, "global_step": 2176, "epoch": 26} {"train_loss": -15.674676895141602, "global_step": 2177, "epoch": 26} {"train_loss": -16.027929306030273, "global_step": 2178, "epoch": 26} {"train_loss": -15.983591079711914, "global_step": 2179, "epoch": 26} {"train_loss": -16.177427291870117, "global_step": 2180, "epoch": 26} {"train_loss": -15.86798095703125, "global_step": 2181, "epoch": 26} {"train_loss": -16.20244598388672, "global_step": 2182, "epoch": 26} {"train_loss": -15.952250480651855, "global_step": 2183, "epoch": 26} {"train_loss": -15.584872245788574, "global_step": 2184, "epoch": 26} {"train_loss": -16.092742919921875, "global_step": 2185, "epoch": 26} {"train_loss": -15.982413291931152, "global_step": 2186, "epoch": 26} {"train_loss": -16.04703712463379, "global_step": 2187, "epoch": 26} {"train_loss": -16.011810302734375, "global_step": 2188, "epoch": 26} {"train_loss": -16.165822982788086, "global_step": 2189, "epoch": 26} {"train_loss": -16.415069580078125, "global_step": 2190, "epoch": 26} {"train_loss": -15.936924934387207, "global_step": 2191, "epoch": 26} {"train_loss": -16.040912628173828, "global_step": 2192, "epoch": 26} {"train_loss": -15.839545249938965, "global_step": 2193, "epoch": 26} {"train_loss": -15.986872673034668, "global_step": 2194, "epoch": 26} {"train_loss": -15.661334037780762, "global_step": 2195, "epoch": 26} {"train_loss": -15.982039451599121, "global_step": 2196, "epoch": 26} {"train_loss": -15.75818157196045, "global_step": 2197, "epoch": 26} {"train_loss": -15.649641990661621, "global_step": 2198, "epoch": 26} {"train_loss": -16.32106590270996, "global_step": 2199, "epoch": 26} {"train_loss": -15.977989196777344, "global_step": 2200, "epoch": 26} {"train_loss": -15.972314834594727, "global_step": 2201, "epoch": 26} {"train_loss": -15.884849548339844, "global_step": 2202, "epoch": 26} {"train_loss": -15.735243797302246, "global_step": 2203, "epoch": 26} {"train_loss": -15.723372459411621, "global_step": 2204, "epoch": 26} {"train_loss": -15.844757080078125, "global_step": 2205, "epoch": 26} {"train_loss": -15.927556037902832, "global_step": 2206, "epoch": 26} {"train_loss": -15.770428657531738, "global_step": 2207, "epoch": 26} {"train_loss": -16.11833953857422, "global_step": 2208, "epoch": 26} {"train_loss": -15.754007339477539, "global_step": 2209, "epoch": 26} {"train_loss": -15.966771125793457, "global_step": 2210, "epoch": 26} {"train_loss": -15.837600708007812, "global_step": 2211, "epoch": 26} {"train_loss": -15.895187377929688, "global_step": 2212, "epoch": 26} {"train_loss": -16.10756492614746, "global_step": 2213, "epoch": 26} {"train_loss": -16.1798152923584, "global_step": 2214, "epoch": 26} {"train_loss": -15.8911771774292, "global_step": 2215, "epoch": 26} {"train_loss": -16.148313522338867, "global_step": 2216, "epoch": 26} {"train_loss": -15.977261543273926, "global_step": 2217, "epoch": 26} {"train_loss": -15.963866233825684, "global_step": 2218, "epoch": 26} {"train_loss": -16.053842544555664, "global_step": 2219, "epoch": 26} {"train_loss": -15.954935073852539, "global_step": 2220, "epoch": 26} {"train_loss": -16.107267379760742, "global_step": 2221, "epoch": 26} {"train_loss": -16.199914932250977, "global_step": 2222, "epoch": 26} {"train_loss": -15.888545036315918, "global_step": 2223, "epoch": 26} {"train_loss": -15.838665962219238, "global_step": 2224, "epoch": 26} {"train_loss": -15.942378044128418, "global_step": 2225, "epoch": 26} {"train_loss": -16.065412521362305, "global_step": 2226, "epoch": 26} {"train_loss": -16.422666549682617, "global_step": 2227, "epoch": 26} {"train_loss": -16.271196365356445, "global_step": 2228, "epoch": 26} {"train_loss": -15.811271667480469, "global_step": 2229, "epoch": 26} {"train_loss": -15.869046211242676, "global_step": 2230, "epoch": 26} {"train_loss": -15.769546508789062, "global_step": 2231, "epoch": 26} {"train_loss": -15.738425254821777, "global_step": 2232, "epoch": 26} {"train_loss": -15.84508991241455, "global_step": 2233, "epoch": 26} {"train_loss": -15.836186408996582, "global_step": 2234, "epoch": 26} {"train_loss": -16.212543487548828, "global_step": 2235, "epoch": 26} {"train_loss": -15.851669311523438, "global_step": 2236, "epoch": 26} {"train_loss": -16.23154640197754, "global_step": 2237, "epoch": 26} {"train_loss": -15.972023010253906, "global_step": 2238, "epoch": 26} {"train_loss": -16.360570907592773, "global_step": 2239, "epoch": 26} {"train_loss": -15.959273223417352, "global_step": 2240, "epoch": 26, "val_loss": 7776909.5} {"train_loss": -15.749272346496582, "global_step": 2241, "epoch": 27} {"train_loss": -15.663060188293457, "global_step": 2242, "epoch": 27} {"train_loss": -16.12543296813965, "global_step": 2243, "epoch": 27} {"train_loss": -15.745787620544434, "global_step": 2244, "epoch": 27} {"train_loss": -16.2467098236084, "global_step": 2245, "epoch": 27} {"train_loss": -15.704208374023438, "global_step": 2246, "epoch": 27} {"train_loss": -15.829699516296387, "global_step": 2247, "epoch": 27} {"train_loss": -16.356901168823242, "global_step": 2248, "epoch": 27} {"train_loss": -15.373217582702637, "global_step": 2249, "epoch": 27} {"train_loss": -16.173006057739258, "global_step": 2250, "epoch": 27} {"train_loss": -16.214162826538086, "global_step": 2251, "epoch": 27} {"train_loss": -16.068679809570312, "global_step": 2252, "epoch": 27} {"train_loss": -16.06325340270996, "global_step": 2253, "epoch": 27} {"train_loss": -15.988577842712402, "global_step": 2254, "epoch": 27} {"train_loss": -16.266279220581055, "global_step": 2255, "epoch": 27} {"train_loss": -16.062091827392578, "global_step": 2256, "epoch": 27} {"train_loss": -15.53625202178955, "global_step": 2257, "epoch": 27} {"train_loss": -15.9612398147583, "global_step": 2258, "epoch": 27} {"train_loss": -15.956832885742188, "global_step": 2259, "epoch": 27} {"train_loss": -16.23294448852539, "global_step": 2260, "epoch": 27} {"train_loss": -16.008647918701172, "global_step": 2261, "epoch": 27} {"train_loss": -16.169469833374023, "global_step": 2262, "epoch": 27} {"train_loss": -16.026853561401367, "global_step": 2263, "epoch": 27} {"train_loss": -16.145172119140625, "global_step": 2264, "epoch": 27} {"train_loss": -16.002099990844727, "global_step": 2265, "epoch": 27} {"train_loss": -15.964761734008789, "global_step": 2266, "epoch": 27} {"train_loss": -16.15492057800293, "global_step": 2267, "epoch": 27} {"train_loss": -15.360033988952637, "global_step": 2268, "epoch": 27} {"train_loss": -15.810442924499512, "global_step": 2269, "epoch": 27} {"train_loss": -15.907768249511719, "global_step": 2270, "epoch": 27} {"train_loss": -16.056400299072266, "global_step": 2271, "epoch": 27} {"train_loss": -15.80718994140625, "global_step": 2272, "epoch": 27} {"train_loss": -16.019784927368164, "global_step": 2273, "epoch": 27} {"train_loss": -16.009435653686523, "global_step": 2274, "epoch": 27} {"train_loss": -16.084659576416016, "global_step": 2275, "epoch": 27} {"train_loss": -15.7869291305542, "global_step": 2276, "epoch": 27} {"train_loss": -16.099912643432617, "global_step": 2277, "epoch": 27} {"train_loss": -16.26947021484375, "global_step": 2278, "epoch": 27} {"train_loss": -16.487592697143555, "global_step": 2279, "epoch": 27} {"train_loss": -15.837478637695312, "global_step": 2280, "epoch": 27} {"train_loss": -16.139177322387695, "global_step": 2281, "epoch": 27} {"train_loss": -16.41612434387207, "global_step": 2282, "epoch": 27} {"train_loss": -16.274831771850586, "global_step": 2283, "epoch": 27} {"train_loss": -15.819951057434082, "global_step": 2284, "epoch": 27} {"train_loss": -16.291860580444336, "global_step": 2285, "epoch": 27} {"train_loss": -16.006011962890625, "global_step": 2286, "epoch": 27} {"train_loss": -15.77308177947998, "global_step": 2287, "epoch": 27} {"train_loss": -15.652687072753906, "global_step": 2288, "epoch": 27} {"train_loss": -15.93213939666748, "global_step": 2289, "epoch": 27} {"train_loss": -16.05657386779785, "global_step": 2290, "epoch": 27} {"train_loss": -16.370344161987305, "global_step": 2291, "epoch": 27} {"train_loss": -15.992566108703613, "global_step": 2292, "epoch": 27} {"train_loss": -16.190338134765625, "global_step": 2293, "epoch": 27} {"train_loss": -16.187114715576172, "global_step": 2294, "epoch": 27} {"train_loss": -15.848639488220215, "global_step": 2295, "epoch": 27} {"train_loss": -15.9827299118042, "global_step": 2296, "epoch": 27} {"train_loss": -15.965812683105469, "global_step": 2297, "epoch": 27} {"train_loss": -16.259653091430664, "global_step": 2298, "epoch": 27} {"train_loss": -15.860223770141602, "global_step": 2299, "epoch": 27} {"train_loss": -16.011411666870117, "global_step": 2300, "epoch": 27} {"train_loss": -15.999567985534668, "global_step": 2301, "epoch": 27} {"train_loss": -16.30331802368164, "global_step": 2302, "epoch": 27} {"train_loss": -16.01416015625, "global_step": 2303, "epoch": 27} {"train_loss": -16.201488494873047, "global_step": 2304, "epoch": 27} {"train_loss": -16.356245040893555, "global_step": 2305, "epoch": 27} {"train_loss": -16.110395431518555, "global_step": 2306, "epoch": 27} {"train_loss": -16.19862174987793, "global_step": 2307, "epoch": 27} {"train_loss": -16.195032119750977, "global_step": 2308, "epoch": 27} {"train_loss": -15.93834114074707, "global_step": 2309, "epoch": 27} {"train_loss": -15.736900329589844, "global_step": 2310, "epoch": 27} {"train_loss": -16.12177276611328, "global_step": 2311, "epoch": 27} {"train_loss": -15.905654907226562, "global_step": 2312, "epoch": 27} {"train_loss": -16.145984649658203, "global_step": 2313, "epoch": 27} {"train_loss": -16.065046310424805, "global_step": 2314, "epoch": 27} {"train_loss": -16.30248260498047, "global_step": 2315, "epoch": 27} {"train_loss": -16.49003791809082, "global_step": 2316, "epoch": 27} {"train_loss": -16.137563705444336, "global_step": 2317, "epoch": 27} {"train_loss": -16.1855411529541, "global_step": 2318, "epoch": 27} {"train_loss": -16.4349365234375, "global_step": 2319, "epoch": 27} {"train_loss": -15.5582275390625, "global_step": 2320, "epoch": 27} {"train_loss": -16.020404815673828, "global_step": 2321, "epoch": 27} {"train_loss": -16.25959014892578, "global_step": 2322, "epoch": 27} {"train_loss": -16.03134192041604, "global_step": 2323, "epoch": 27, "val_loss": 7700729.0} {"train_loss": -15.371968269348145, "global_step": 2324, "epoch": 28} {"train_loss": -15.47343635559082, "global_step": 2325, "epoch": 28} {"train_loss": -15.858848571777344, "global_step": 2326, "epoch": 28} {"train_loss": -15.527249336242676, "global_step": 2327, "epoch": 28} {"train_loss": -15.560681343078613, "global_step": 2328, "epoch": 28} {"train_loss": -15.872179985046387, "global_step": 2329, "epoch": 28} {"train_loss": -15.917291641235352, "global_step": 2330, "epoch": 28} {"train_loss": -15.69293212890625, "global_step": 2331, "epoch": 28} {"train_loss": -15.807904243469238, "global_step": 2332, "epoch": 28} {"train_loss": -15.884561538696289, "global_step": 2333, "epoch": 28} {"train_loss": -15.723037719726562, "global_step": 2334, "epoch": 28} {"train_loss": -15.53582763671875, "global_step": 2335, "epoch": 28} {"train_loss": -16.008174896240234, "global_step": 2336, "epoch": 28} {"train_loss": -16.411558151245117, "global_step": 2337, "epoch": 28} {"train_loss": -15.87442684173584, "global_step": 2338, "epoch": 28} {"train_loss": -15.822305679321289, "global_step": 2339, "epoch": 28} {"train_loss": -15.923382759094238, "global_step": 2340, "epoch": 28} {"train_loss": -16.140039443969727, "global_step": 2341, "epoch": 28} {"train_loss": -15.54948902130127, "global_step": 2342, "epoch": 28} {"train_loss": -16.205427169799805, "global_step": 2343, "epoch": 28} {"train_loss": -15.667673110961914, "global_step": 2344, "epoch": 28} {"train_loss": -16.004989624023438, "global_step": 2345, "epoch": 28} {"train_loss": -15.692463874816895, "global_step": 2346, "epoch": 28} {"train_loss": -16.079116821289062, "global_step": 2347, "epoch": 28} {"train_loss": -15.925726890563965, "global_step": 2348, "epoch": 28} {"train_loss": -15.964152336120605, "global_step": 2349, "epoch": 28} {"train_loss": -16.122028350830078, "global_step": 2350, "epoch": 28} {"train_loss": -15.84355354309082, "global_step": 2351, "epoch": 28} {"train_loss": -16.160526275634766, "global_step": 2352, "epoch": 28} {"train_loss": -16.04374122619629, "global_step": 2353, "epoch": 28} {"train_loss": -15.993102073669434, "global_step": 2354, "epoch": 28} {"train_loss": -16.239107131958008, "global_step": 2355, "epoch": 28} {"train_loss": -16.17722511291504, "global_step": 2356, "epoch": 28} {"train_loss": -15.829272270202637, "global_step": 2357, "epoch": 28} {"train_loss": -16.053293228149414, "global_step": 2358, "epoch": 28} {"train_loss": -16.119558334350586, "global_step": 2359, "epoch": 28} {"train_loss": -15.97369384765625, "global_step": 2360, "epoch": 28} {"train_loss": -16.21288299560547, "global_step": 2361, "epoch": 28} {"train_loss": -15.867423057556152, "global_step": 2362, "epoch": 28} {"train_loss": -15.582740783691406, "global_step": 2363, "epoch": 28} {"train_loss": -16.072385787963867, "global_step": 2364, "epoch": 28} {"train_loss": -16.16735076904297, "global_step": 2365, "epoch": 28} {"train_loss": -16.300682067871094, "global_step": 2366, "epoch": 28} {"train_loss": -16.32225227355957, "global_step": 2367, "epoch": 28} {"train_loss": -16.049802780151367, "global_step": 2368, "epoch": 28} {"train_loss": -16.43080711364746, "global_step": 2369, "epoch": 28} {"train_loss": -15.952629089355469, "global_step": 2370, "epoch": 28} {"train_loss": -16.137739181518555, "global_step": 2371, "epoch": 28} {"train_loss": -15.928817749023438, "global_step": 2372, "epoch": 28} {"train_loss": -15.842913627624512, "global_step": 2373, "epoch": 28} {"train_loss": -16.27556800842285, "global_step": 2374, "epoch": 28} {"train_loss": -15.857109069824219, "global_step": 2375, "epoch": 28} {"train_loss": -16.383981704711914, "global_step": 2376, "epoch": 28} {"train_loss": -16.281417846679688, "global_step": 2377, "epoch": 28} {"train_loss": -15.87560749053955, "global_step": 2378, "epoch": 28} {"train_loss": -16.63330078125, "global_step": 2379, "epoch": 28} {"train_loss": -16.343992233276367, "global_step": 2380, "epoch": 28} {"train_loss": -16.00128173828125, "global_step": 2381, "epoch": 28} {"train_loss": -16.696016311645508, "global_step": 2382, "epoch": 28} {"train_loss": -15.955451011657715, "global_step": 2383, "epoch": 28} {"train_loss": -16.174219131469727, "global_step": 2384, "epoch": 28} {"train_loss": -16.19573211669922, "global_step": 2385, "epoch": 28} {"train_loss": -15.71644115447998, "global_step": 2386, "epoch": 28} {"train_loss": -15.993674278259277, "global_step": 2387, "epoch": 28} {"train_loss": -16.102001190185547, "global_step": 2388, "epoch": 28} {"train_loss": -16.190704345703125, "global_step": 2389, "epoch": 28} {"train_loss": -15.893588066101074, "global_step": 2390, "epoch": 28} {"train_loss": -15.81931209564209, "global_step": 2391, "epoch": 28} {"train_loss": -15.789377212524414, "global_step": 2392, "epoch": 28} {"train_loss": -16.159048080444336, "global_step": 2393, "epoch": 28} {"train_loss": -16.136632919311523, "global_step": 2394, "epoch": 28} {"train_loss": -16.2197322845459, "global_step": 2395, "epoch": 28} {"train_loss": -16.316364288330078, "global_step": 2396, "epoch": 28} {"train_loss": -15.998896598815918, "global_step": 2397, "epoch": 28} {"train_loss": -15.75907039642334, "global_step": 2398, "epoch": 28} {"train_loss": -15.942526817321777, "global_step": 2399, "epoch": 28} {"train_loss": -15.8606595993042, "global_step": 2400, "epoch": 28} {"train_loss": -15.994760513305664, "global_step": 2401, "epoch": 28} {"train_loss": -16.20233154296875, "global_step": 2402, "epoch": 28} {"train_loss": -16.096439361572266, "global_step": 2403, "epoch": 28} {"train_loss": -16.214216232299805, "global_step": 2404, "epoch": 28} {"train_loss": -16.29910659790039, "global_step": 2405, "epoch": 28} {"train_loss": -16.007856725210168, "global_step": 2406, "epoch": 28, "val_loss": 7652925.0} {"train_loss": -16.229656219482422, "global_step": 2407, "epoch": 29} {"train_loss": -15.920730590820312, "global_step": 2408, "epoch": 29} {"train_loss": -16.131460189819336, "global_step": 2409, "epoch": 29} {"train_loss": -15.937506675720215, "global_step": 2410, "epoch": 29} {"train_loss": -16.03093910217285, "global_step": 2411, "epoch": 29} {"train_loss": -16.288175582885742, "global_step": 2412, "epoch": 29} {"train_loss": -15.626152038574219, "global_step": 2413, "epoch": 29} {"train_loss": -15.84742259979248, "global_step": 2414, "epoch": 29} {"train_loss": -16.235002517700195, "global_step": 2415, "epoch": 29} {"train_loss": -16.17538070678711, "global_step": 2416, "epoch": 29} {"train_loss": -15.70995807647705, "global_step": 2417, "epoch": 29} {"train_loss": -16.0865535736084, "global_step": 2418, "epoch": 29} {"train_loss": -16.166213989257812, "global_step": 2419, "epoch": 29} {"train_loss": -16.113561630249023, "global_step": 2420, "epoch": 29} {"train_loss": -16.1126651763916, "global_step": 2421, "epoch": 29} {"train_loss": -15.830949783325195, "global_step": 2422, "epoch": 29} {"train_loss": -15.815688133239746, "global_step": 2423, "epoch": 29} {"train_loss": -16.063213348388672, "global_step": 2424, "epoch": 29} {"train_loss": -16.48129653930664, "global_step": 2425, "epoch": 29} {"train_loss": -16.036619186401367, "global_step": 2426, "epoch": 29} {"train_loss": -15.958108901977539, "global_step": 2427, "epoch": 29} {"train_loss": -16.17549705505371, "global_step": 2428, "epoch": 29} {"train_loss": -16.080881118774414, "global_step": 2429, "epoch": 29} {"train_loss": -15.828353881835938, "global_step": 2430, "epoch": 29} {"train_loss": -15.770342826843262, "global_step": 2431, "epoch": 29} {"train_loss": -15.964784622192383, "global_step": 2432, "epoch": 29} {"train_loss": -16.06047248840332, "global_step": 2433, "epoch": 29} {"train_loss": -16.410690307617188, "global_step": 2434, "epoch": 29} {"train_loss": -16.31020164489746, "global_step": 2435, "epoch": 29} {"train_loss": -16.10368537902832, "global_step": 2436, "epoch": 29} {"train_loss": -16.341276168823242, "global_step": 2437, "epoch": 29} {"train_loss": -16.14920425415039, "global_step": 2438, "epoch": 29} {"train_loss": -15.597970962524414, "global_step": 2439, "epoch": 29} {"train_loss": -16.397964477539062, "global_step": 2440, "epoch": 29} {"train_loss": -15.658953666687012, "global_step": 2441, "epoch": 29} {"train_loss": -16.171916961669922, "global_step": 2442, "epoch": 29} {"train_loss": -15.967828750610352, "global_step": 2443, "epoch": 29} {"train_loss": -16.222959518432617, "global_step": 2444, "epoch": 29} {"train_loss": -15.983748435974121, "global_step": 2445, "epoch": 29} {"train_loss": -16.291566848754883, "global_step": 2446, "epoch": 29} {"train_loss": -16.481300354003906, "global_step": 2447, "epoch": 29} {"train_loss": -16.482988357543945, "global_step": 2448, "epoch": 29} {"train_loss": -16.380661010742188, "global_step": 2449, "epoch": 29} {"train_loss": -15.816084861755371, "global_step": 2450, "epoch": 29} {"train_loss": -15.997942924499512, "global_step": 2451, "epoch": 29} {"train_loss": -15.996789932250977, "global_step": 2452, "epoch": 29} {"train_loss": -16.27680206298828, "global_step": 2453, "epoch": 29} {"train_loss": -15.69519329071045, "global_step": 2454, "epoch": 29} {"train_loss": -15.963484764099121, "global_step": 2455, "epoch": 29} {"train_loss": -16.349424362182617, "global_step": 2456, "epoch": 29} {"train_loss": -16.212778091430664, "global_step": 2457, "epoch": 29} {"train_loss": -15.936578750610352, "global_step": 2458, "epoch": 29} {"train_loss": -16.304086685180664, "global_step": 2459, "epoch": 29} {"train_loss": -16.33053970336914, "global_step": 2460, "epoch": 29} {"train_loss": -16.02365493774414, "global_step": 2461, "epoch": 29} {"train_loss": -16.046306610107422, "global_step": 2462, "epoch": 29} {"train_loss": -16.400312423706055, "global_step": 2463, "epoch": 29} {"train_loss": -16.23273277282715, "global_step": 2464, "epoch": 29} {"train_loss": -16.421085357666016, "global_step": 2465, "epoch": 29} {"train_loss": -16.219249725341797, "global_step": 2466, "epoch": 29} {"train_loss": -16.18686294555664, "global_step": 2467, "epoch": 29} {"train_loss": -15.975539207458496, "global_step": 2468, "epoch": 29} {"train_loss": -16.00891876220703, "global_step": 2469, "epoch": 29} {"train_loss": -16.028934478759766, "global_step": 2470, "epoch": 29} {"train_loss": -16.253162384033203, "global_step": 2471, "epoch": 29} {"train_loss": -15.9647798538208, "global_step": 2472, "epoch": 29} {"train_loss": -16.39708137512207, "global_step": 2473, "epoch": 29} {"train_loss": -16.01873779296875, "global_step": 2474, "epoch": 29} {"train_loss": -15.690582275390625, "global_step": 2475, "epoch": 29} {"train_loss": -16.079954147338867, "global_step": 2476, "epoch": 29} {"train_loss": -16.137439727783203, "global_step": 2477, "epoch": 29} {"train_loss": -15.882098197937012, "global_step": 2478, "epoch": 29} {"train_loss": -16.217119216918945, "global_step": 2479, "epoch": 29} {"train_loss": -16.030344009399414, "global_step": 2480, "epoch": 29} {"train_loss": -16.22443389892578, "global_step": 2481, "epoch": 29} {"train_loss": -16.431900024414062, "global_step": 2482, "epoch": 29} {"train_loss": -16.153182983398438, "global_step": 2483, "epoch": 29} {"train_loss": -16.05288314819336, "global_step": 2484, "epoch": 29} {"train_loss": -16.200180053710938, "global_step": 2485, "epoch": 29} {"train_loss": -16.172121047973633, "global_step": 2486, "epoch": 29} {"train_loss": -16.039701461791992, "global_step": 2487, "epoch": 29} {"train_loss": -16.318958282470703, "global_step": 2488, "epoch": 29} {"train_loss": -16.11348579590579, "global_step": 2489, "epoch": 29, "val_loss": 7224555.0} {"train_loss": -15.644278526306152, "global_step": 2490, "epoch": 30} {"train_loss": -16.1085262298584, "global_step": 2491, "epoch": 30} {"train_loss": -16.19831085205078, "global_step": 2492, "epoch": 30} {"train_loss": -15.83996295928955, "global_step": 2493, "epoch": 30} {"train_loss": -16.4953670501709, "global_step": 2494, "epoch": 30} {"train_loss": -16.015430450439453, "global_step": 2495, "epoch": 30} {"train_loss": -15.911673545837402, "global_step": 2496, "epoch": 30} {"train_loss": -15.9127779006958, "global_step": 2497, "epoch": 30} {"train_loss": -16.179956436157227, "global_step": 2498, "epoch": 30} {"train_loss": -16.68987464904785, "global_step": 2499, "epoch": 30} {"train_loss": -16.387277603149414, "global_step": 2500, "epoch": 30} {"train_loss": -16.282211303710938, "global_step": 2501, "epoch": 30} {"train_loss": -15.874777793884277, "global_step": 2502, "epoch": 30} {"train_loss": -16.32191276550293, "global_step": 2503, "epoch": 30} {"train_loss": -16.435340881347656, "global_step": 2504, "epoch": 30} {"train_loss": -16.232606887817383, "global_step": 2505, "epoch": 30} {"train_loss": -16.03752899169922, "global_step": 2506, "epoch": 30} {"train_loss": -16.000688552856445, "global_step": 2507, "epoch": 30} {"train_loss": -15.698712348937988, "global_step": 2508, "epoch": 30} {"train_loss": -16.09784507751465, "global_step": 2509, "epoch": 30} {"train_loss": -16.262510299682617, "global_step": 2510, "epoch": 30} {"train_loss": -15.985989570617676, "global_step": 2511, "epoch": 30} {"train_loss": -16.364980697631836, "global_step": 2512, "epoch": 30} {"train_loss": -16.378995895385742, "global_step": 2513, "epoch": 30} {"train_loss": -16.284048080444336, "global_step": 2514, "epoch": 30} {"train_loss": -15.952966690063477, "global_step": 2515, "epoch": 30} {"train_loss": -16.465238571166992, "global_step": 2516, "epoch": 30} {"train_loss": -15.930459976196289, "global_step": 2517, "epoch": 30} {"train_loss": -16.08363914489746, "global_step": 2518, "epoch": 30} {"train_loss": -15.948880195617676, "global_step": 2519, "epoch": 30} {"train_loss": -16.091053009033203, "global_step": 2520, "epoch": 30} {"train_loss": -15.99109172821045, "global_step": 2521, "epoch": 30} {"train_loss": -16.4924373626709, "global_step": 2522, "epoch": 30} {"train_loss": -16.41389274597168, "global_step": 2523, "epoch": 30} {"train_loss": -16.418649673461914, "global_step": 2524, "epoch": 30} {"train_loss": -16.321760177612305, "global_step": 2525, "epoch": 30} {"train_loss": -16.053258895874023, "global_step": 2526, "epoch": 30} {"train_loss": -16.487642288208008, "global_step": 2527, "epoch": 30} {"train_loss": -16.044300079345703, "global_step": 2528, "epoch": 30} {"train_loss": -15.981169700622559, "global_step": 2529, "epoch": 30} {"train_loss": -15.851984024047852, "global_step": 2530, "epoch": 30} {"train_loss": -16.05292320251465, "global_step": 2531, "epoch": 30} {"train_loss": -16.01200294494629, "global_step": 2532, "epoch": 30} {"train_loss": -16.277124404907227, "global_step": 2533, "epoch": 30} {"train_loss": -16.336179733276367, "global_step": 2534, "epoch": 30} {"train_loss": -16.17885398864746, "global_step": 2535, "epoch": 30} {"train_loss": -16.280067443847656, "global_step": 2536, "epoch": 30} {"train_loss": -16.460840225219727, "global_step": 2537, "epoch": 30} {"train_loss": -16.509977340698242, "global_step": 2538, "epoch": 30} {"train_loss": -16.364364624023438, "global_step": 2539, "epoch": 30} {"train_loss": -15.654675483703613, "global_step": 2540, "epoch": 30} {"train_loss": -16.592832565307617, "global_step": 2541, "epoch": 30} {"train_loss": -16.271081924438477, "global_step": 2542, "epoch": 30} {"train_loss": -15.668863296508789, "global_step": 2543, "epoch": 30} {"train_loss": -16.564701080322266, "global_step": 2544, "epoch": 30} {"train_loss": -16.081052780151367, "global_step": 2545, "epoch": 30} {"train_loss": -16.051429748535156, "global_step": 2546, "epoch": 30} {"train_loss": -16.08498191833496, "global_step": 2547, "epoch": 30} {"train_loss": -16.04835319519043, "global_step": 2548, "epoch": 30} {"train_loss": -16.144628524780273, "global_step": 2549, "epoch": 30} {"train_loss": -16.13936424255371, "global_step": 2550, "epoch": 30} {"train_loss": -16.00889015197754, "global_step": 2551, "epoch": 30} {"train_loss": -16.464994430541992, "global_step": 2552, "epoch": 30} {"train_loss": -16.398548126220703, "global_step": 2553, "epoch": 30} {"train_loss": -16.31132698059082, "global_step": 2554, "epoch": 30} {"train_loss": -16.354145050048828, "global_step": 2555, "epoch": 30} {"train_loss": -15.851058006286621, "global_step": 2556, "epoch": 30} {"train_loss": -15.925349235534668, "global_step": 2557, "epoch": 30} {"train_loss": -16.3356990814209, "global_step": 2558, "epoch": 30} {"train_loss": -16.034439086914062, "global_step": 2559, "epoch": 30} {"train_loss": -16.055217742919922, "global_step": 2560, "epoch": 30} {"train_loss": -16.227235794067383, "global_step": 2561, "epoch": 30} {"train_loss": -16.00943374633789, "global_step": 2562, "epoch": 30} {"train_loss": -16.544164657592773, "global_step": 2563, "epoch": 30} {"train_loss": -16.139163970947266, "global_step": 2564, "epoch": 30} {"train_loss": -15.840387344360352, "global_step": 2565, "epoch": 30} {"train_loss": -16.09914207458496, "global_step": 2566, "epoch": 30} {"train_loss": -16.134729385375977, "global_step": 2567, "epoch": 30} {"train_loss": -16.26129722595215, "global_step": 2568, "epoch": 30} {"train_loss": -15.641554832458496, "global_step": 2569, "epoch": 30} {"train_loss": -15.91922664642334, "global_step": 2570, "epoch": 30} {"train_loss": -16.09537124633789, "global_step": 2571, "epoch": 30} {"train_loss": -16.16437157090888, "global_step": 2572, "epoch": 30, "val_loss": 7421374.0} {"train_loss": -15.78478717803955, "global_step": 2573, "epoch": 31} {"train_loss": -16.078107833862305, "global_step": 2574, "epoch": 31} {"train_loss": -16.201507568359375, "global_step": 2575, "epoch": 31} {"train_loss": -16.289161682128906, "global_step": 2576, "epoch": 31} {"train_loss": -15.815787315368652, "global_step": 2577, "epoch": 31} {"train_loss": -15.809100151062012, "global_step": 2578, "epoch": 31} {"train_loss": -15.80840015411377, "global_step": 2579, "epoch": 31} {"train_loss": -16.041748046875, "global_step": 2580, "epoch": 31} {"train_loss": -16.235448837280273, "global_step": 2581, "epoch": 31} {"train_loss": -16.050626754760742, "global_step": 2582, "epoch": 31} {"train_loss": -16.142894744873047, "global_step": 2583, "epoch": 31} {"train_loss": -16.309894561767578, "global_step": 2584, "epoch": 31} {"train_loss": -15.846809387207031, "global_step": 2585, "epoch": 31} {"train_loss": -15.960306167602539, "global_step": 2586, "epoch": 31} {"train_loss": -16.236677169799805, "global_step": 2587, "epoch": 31} {"train_loss": -16.603750228881836, "global_step": 2588, "epoch": 31} {"train_loss": -16.462812423706055, "global_step": 2589, "epoch": 31} {"train_loss": -15.650796890258789, "global_step": 2590, "epoch": 31} {"train_loss": -16.702199935913086, "global_step": 2591, "epoch": 31} {"train_loss": -16.05533218383789, "global_step": 2592, "epoch": 31} {"train_loss": -16.02956199645996, "global_step": 2593, "epoch": 31} {"train_loss": -16.442928314208984, "global_step": 2594, "epoch": 31} {"train_loss": -16.455881118774414, "global_step": 2595, "epoch": 31} {"train_loss": -16.25131607055664, "global_step": 2596, "epoch": 31} {"train_loss": -16.514028549194336, "global_step": 2597, "epoch": 31} {"train_loss": -16.037063598632812, "global_step": 2598, "epoch": 31} {"train_loss": -15.895865440368652, "global_step": 2599, "epoch": 31} {"train_loss": -15.93540096282959, "global_step": 2600, "epoch": 31} {"train_loss": -16.31740379333496, "global_step": 2601, "epoch": 31} {"train_loss": -16.045907974243164, "global_step": 2602, "epoch": 31} {"train_loss": -16.201435089111328, "global_step": 2603, "epoch": 31} {"train_loss": -16.039905548095703, "global_step": 2604, "epoch": 31} {"train_loss": -16.2696590423584, "global_step": 2605, "epoch": 31} {"train_loss": -15.972765922546387, "global_step": 2606, "epoch": 31} {"train_loss": -16.11616325378418, "global_step": 2607, "epoch": 31} {"train_loss": -16.07111930847168, "global_step": 2608, "epoch": 31} {"train_loss": -15.813166618347168, "global_step": 2609, "epoch": 31} {"train_loss": -16.143712997436523, "global_step": 2610, "epoch": 31} {"train_loss": -16.279129028320312, "global_step": 2611, "epoch": 31} {"train_loss": -16.454191207885742, "global_step": 2612, "epoch": 31} {"train_loss": -16.235620498657227, "global_step": 2613, "epoch": 31} {"train_loss": -16.35491180419922, "global_step": 2614, "epoch": 31} {"train_loss": -16.518417358398438, "global_step": 2615, "epoch": 31} {"train_loss": -16.2840576171875, "global_step": 2616, "epoch": 31} {"train_loss": -16.36433219909668, "global_step": 2617, "epoch": 31} {"train_loss": -16.415952682495117, "global_step": 2618, "epoch": 31} {"train_loss": -16.04738426208496, "global_step": 2619, "epoch": 31} {"train_loss": -15.954695701599121, "global_step": 2620, "epoch": 31} {"train_loss": -16.49736213684082, "global_step": 2621, "epoch": 31} {"train_loss": -15.972589492797852, "global_step": 2622, "epoch": 31} {"train_loss": -16.67201042175293, "global_step": 2623, "epoch": 31} {"train_loss": -15.814401626586914, "global_step": 2624, "epoch": 31} {"train_loss": -15.967071533203125, "global_step": 2625, "epoch": 31} {"train_loss": -16.21725845336914, "global_step": 2626, "epoch": 31} {"train_loss": -15.934416770935059, "global_step": 2627, "epoch": 31} {"train_loss": -16.480146408081055, "global_step": 2628, "epoch": 31} {"train_loss": -16.264236450195312, "global_step": 2629, "epoch": 31} {"train_loss": -16.556852340698242, "global_step": 2630, "epoch": 31} {"train_loss": -16.073572158813477, "global_step": 2631, "epoch": 31} {"train_loss": -16.536090850830078, "global_step": 2632, "epoch": 31} {"train_loss": -16.192289352416992, "global_step": 2633, "epoch": 31} {"train_loss": -16.458295822143555, "global_step": 2634, "epoch": 31} {"train_loss": -16.3348445892334, "global_step": 2635, "epoch": 31} {"train_loss": -16.19710350036621, "global_step": 2636, "epoch": 31} {"train_loss": -16.152219772338867, "global_step": 2637, "epoch": 31} {"train_loss": -15.786028861999512, "global_step": 2638, "epoch": 31} {"train_loss": -16.24317169189453, "global_step": 2639, "epoch": 31} {"train_loss": -16.285369873046875, "global_step": 2640, "epoch": 31} {"train_loss": -15.400827407836914, "global_step": 2641, "epoch": 31} {"train_loss": -16.158233642578125, "global_step": 2642, "epoch": 31} {"train_loss": -16.295846939086914, "global_step": 2643, "epoch": 31} {"train_loss": -16.39899253845215, "global_step": 2644, "epoch": 31} {"train_loss": -16.215219497680664, "global_step": 2645, "epoch": 31} {"train_loss": -16.1940860748291, "global_step": 2646, "epoch": 31} {"train_loss": -16.322509765625, "global_step": 2647, "epoch": 31} {"train_loss": -16.63020896911621, "global_step": 2648, "epoch": 31} {"train_loss": -15.990610122680664, "global_step": 2649, "epoch": 31} {"train_loss": -16.016263961791992, "global_step": 2650, "epoch": 31} {"train_loss": -16.326387405395508, "global_step": 2651, "epoch": 31} {"train_loss": -15.873373985290527, "global_step": 2652, "epoch": 31} {"train_loss": -15.956442832946777, "global_step": 2653, "epoch": 31} {"train_loss": -16.360687255859375, "global_step": 2654, "epoch": 31} {"train_loss": -16.16206140403288, "global_step": 2655, "epoch": 31, "val_loss": 7346244.0} {"train_loss": -16.18007469177246, "global_step": 2656, "epoch": 32} {"train_loss": -15.956149101257324, "global_step": 2657, "epoch": 32} {"train_loss": -16.034015655517578, "global_step": 2658, "epoch": 32} {"train_loss": -16.391088485717773, "global_step": 2659, "epoch": 32} {"train_loss": -16.1772518157959, "global_step": 2660, "epoch": 32} {"train_loss": -16.150487899780273, "global_step": 2661, "epoch": 32} {"train_loss": -16.25429344177246, "global_step": 2662, "epoch": 32} {"train_loss": -15.79526424407959, "global_step": 2663, "epoch": 32} {"train_loss": -16.402997970581055, "global_step": 2664, "epoch": 32} {"train_loss": -16.595088958740234, "global_step": 2665, "epoch": 32} {"train_loss": -16.332443237304688, "global_step": 2666, "epoch": 32} {"train_loss": -16.703702926635742, "global_step": 2667, "epoch": 32} {"train_loss": -15.99462890625, "global_step": 2668, "epoch": 32} {"train_loss": -16.275413513183594, "global_step": 2669, "epoch": 32} {"train_loss": -16.073896408081055, "global_step": 2670, "epoch": 32} {"train_loss": -15.935446739196777, "global_step": 2671, "epoch": 32} {"train_loss": -16.10776138305664, "global_step": 2672, "epoch": 32} {"train_loss": -15.8595552444458, "global_step": 2673, "epoch": 32} {"train_loss": -16.03155517578125, "global_step": 2674, "epoch": 32} {"train_loss": -16.414281845092773, "global_step": 2675, "epoch": 32} {"train_loss": -15.669781684875488, "global_step": 2676, "epoch": 32} {"train_loss": -16.13563346862793, "global_step": 2677, "epoch": 32} {"train_loss": -16.222557067871094, "global_step": 2678, "epoch": 32} {"train_loss": -16.245838165283203, "global_step": 2679, "epoch": 32} {"train_loss": -16.44474220275879, "global_step": 2680, "epoch": 32} {"train_loss": -16.269163131713867, "global_step": 2681, "epoch": 32} {"train_loss": -16.432382583618164, "global_step": 2682, "epoch": 32} {"train_loss": -16.01090431213379, "global_step": 2683, "epoch": 32} {"train_loss": -16.348684310913086, "global_step": 2684, "epoch": 32} {"train_loss": -16.534921646118164, "global_step": 2685, "epoch": 32} {"train_loss": -16.286039352416992, "global_step": 2686, "epoch": 32} {"train_loss": -16.356077194213867, "global_step": 2687, "epoch": 32} {"train_loss": -15.943285942077637, "global_step": 2688, "epoch": 32} {"train_loss": -15.88073444366455, "global_step": 2689, "epoch": 32} {"train_loss": -16.22869300842285, "global_step": 2690, "epoch": 32} {"train_loss": -16.047758102416992, "global_step": 2691, "epoch": 32} {"train_loss": -16.162582397460938, "global_step": 2692, "epoch": 32} {"train_loss": -15.981013298034668, "global_step": 2693, "epoch": 32} {"train_loss": -16.399166107177734, "global_step": 2694, "epoch": 32} {"train_loss": -16.032245635986328, "global_step": 2695, "epoch": 32} {"train_loss": -16.347700119018555, "global_step": 2696, "epoch": 32} {"train_loss": -16.241050720214844, "global_step": 2697, "epoch": 32} {"train_loss": -16.34078598022461, "global_step": 2698, "epoch": 32} {"train_loss": -16.268217086791992, "global_step": 2699, "epoch": 32} {"train_loss": -16.020450592041016, "global_step": 2700, "epoch": 32} {"train_loss": -16.25577163696289, "global_step": 2701, "epoch": 32} {"train_loss": -15.909151077270508, "global_step": 2702, "epoch": 32} {"train_loss": -16.459638595581055, "global_step": 2703, "epoch": 32} {"train_loss": -16.393041610717773, "global_step": 2704, "epoch": 32} {"train_loss": -16.455413818359375, "global_step": 2705, "epoch": 32} {"train_loss": -16.49810218811035, "global_step": 2706, "epoch": 32} {"train_loss": -15.82934284210205, "global_step": 2707, "epoch": 32} {"train_loss": -16.52425193786621, "global_step": 2708, "epoch": 32} {"train_loss": -16.28594970703125, "global_step": 2709, "epoch": 32} {"train_loss": -16.365549087524414, "global_step": 2710, "epoch": 32} {"train_loss": -15.840014457702637, "global_step": 2711, "epoch": 32} {"train_loss": -16.10205841064453, "global_step": 2712, "epoch": 32} {"train_loss": -16.028501510620117, "global_step": 2713, "epoch": 32} {"train_loss": -16.674152374267578, "global_step": 2714, "epoch": 32} {"train_loss": -16.65131950378418, "global_step": 2715, "epoch": 32} {"train_loss": -16.347383499145508, "global_step": 2716, "epoch": 32} {"train_loss": -16.09439468383789, "global_step": 2717, "epoch": 32} {"train_loss": -16.014951705932617, "global_step": 2718, "epoch": 32} {"train_loss": -16.370540618896484, "global_step": 2719, "epoch": 32} {"train_loss": -16.358692169189453, "global_step": 2720, "epoch": 32} {"train_loss": -16.269344329833984, "global_step": 2721, "epoch": 32} {"train_loss": -16.20940399169922, "global_step": 2722, "epoch": 32} {"train_loss": -16.280662536621094, "global_step": 2723, "epoch": 32} {"train_loss": -16.13164710998535, "global_step": 2724, "epoch": 32} {"train_loss": -16.155174255371094, "global_step": 2725, "epoch": 32} {"train_loss": -16.264907836914062, "global_step": 2726, "epoch": 32} {"train_loss": -16.42023468017578, "global_step": 2727, "epoch": 32} {"train_loss": -16.393049240112305, "global_step": 2728, "epoch": 32} {"train_loss": -16.778919219970703, "global_step": 2729, "epoch": 32} {"train_loss": -16.097562789916992, "global_step": 2730, "epoch": 32} {"train_loss": -16.209840774536133, "global_step": 2731, "epoch": 32} {"train_loss": -16.57145118713379, "global_step": 2732, "epoch": 32} {"train_loss": -15.940637588500977, "global_step": 2733, "epoch": 32} {"train_loss": -16.317035675048828, "global_step": 2734, "epoch": 32} {"train_loss": -16.233264923095703, "global_step": 2735, "epoch": 32} {"train_loss": -16.310115814208984, "global_step": 2736, "epoch": 32} {"train_loss": -15.867652893066406, "global_step": 2737, "epoch": 32} {"train_loss": -16.22500401232616, "global_step": 2738, "epoch": 32, "val_loss": 7478083.0} {"train_loss": -15.943170547485352, "global_step": 2739, "epoch": 33} {"train_loss": -16.109947204589844, "global_step": 2740, "epoch": 33} {"train_loss": -16.23497772216797, "global_step": 2741, "epoch": 33} {"train_loss": -15.804160118103027, "global_step": 2742, "epoch": 33} {"train_loss": -16.46296501159668, "global_step": 2743, "epoch": 33} {"train_loss": -15.720260620117188, "global_step": 2744, "epoch": 33} {"train_loss": -16.281408309936523, "global_step": 2745, "epoch": 33} {"train_loss": -16.466476440429688, "global_step": 2746, "epoch": 33} {"train_loss": -16.415775299072266, "global_step": 2747, "epoch": 33} {"train_loss": -15.96884822845459, "global_step": 2748, "epoch": 33} {"train_loss": -16.42591667175293, "global_step": 2749, "epoch": 33} {"train_loss": -16.31744956970215, "global_step": 2750, "epoch": 33} {"train_loss": -16.3603458404541, "global_step": 2751, "epoch": 33} {"train_loss": -16.587238311767578, "global_step": 2752, "epoch": 33} {"train_loss": -16.48698616027832, "global_step": 2753, "epoch": 33} {"train_loss": -15.739837646484375, "global_step": 2754, "epoch": 33} {"train_loss": -15.990954399108887, "global_step": 2755, "epoch": 33} {"train_loss": -16.16963768005371, "global_step": 2756, "epoch": 33} {"train_loss": -16.51966094970703, "global_step": 2757, "epoch": 33} {"train_loss": -15.739697456359863, "global_step": 2758, "epoch": 33} {"train_loss": -16.035375595092773, "global_step": 2759, "epoch": 33} {"train_loss": -16.28635025024414, "global_step": 2760, "epoch": 33} {"train_loss": -16.614505767822266, "global_step": 2761, "epoch": 33} {"train_loss": -16.41646957397461, "global_step": 2762, "epoch": 33} {"train_loss": -16.384395599365234, "global_step": 2763, "epoch": 33} {"train_loss": -16.29848289489746, "global_step": 2764, "epoch": 33} {"train_loss": -16.2790470123291, "global_step": 2765, "epoch": 33} {"train_loss": -16.356632232666016, "global_step": 2766, "epoch": 33} {"train_loss": -16.585166931152344, "global_step": 2767, "epoch": 33} {"train_loss": -16.272550582885742, "global_step": 2768, "epoch": 33} {"train_loss": -16.18699073791504, "global_step": 2769, "epoch": 33} {"train_loss": -16.250715255737305, "global_step": 2770, "epoch": 33} {"train_loss": -15.820784568786621, "global_step": 2771, "epoch": 33} {"train_loss": -16.160181045532227, "global_step": 2772, "epoch": 33} {"train_loss": -15.912521362304688, "global_step": 2773, "epoch": 33} {"train_loss": -16.49519920349121, "global_step": 2774, "epoch": 33} {"train_loss": -16.533843994140625, "global_step": 2775, "epoch": 33} {"train_loss": -16.339048385620117, "global_step": 2776, "epoch": 33} {"train_loss": -16.061752319335938, "global_step": 2777, "epoch": 33} {"train_loss": -16.41716957092285, "global_step": 2778, "epoch": 33} {"train_loss": -16.14151382446289, "global_step": 2779, "epoch": 33} {"train_loss": -16.32695960998535, "global_step": 2780, "epoch": 33} {"train_loss": -15.8486328125, "global_step": 2781, "epoch": 33} {"train_loss": -16.385581970214844, "global_step": 2782, "epoch": 33} {"train_loss": -16.03591537475586, "global_step": 2783, "epoch": 33} {"train_loss": -16.179975509643555, "global_step": 2784, "epoch": 33} {"train_loss": -15.920036315917969, "global_step": 2785, "epoch": 33} {"train_loss": -16.532241821289062, "global_step": 2786, "epoch": 33} {"train_loss": -16.482379913330078, "global_step": 2787, "epoch": 33} {"train_loss": -16.37660026550293, "global_step": 2788, "epoch": 33} {"train_loss": -16.219377517700195, "global_step": 2789, "epoch": 33} {"train_loss": -16.267366409301758, "global_step": 2790, "epoch": 33} {"train_loss": -16.072301864624023, "global_step": 2791, "epoch": 33} {"train_loss": -16.075775146484375, "global_step": 2792, "epoch": 33} {"train_loss": -16.071794509887695, "global_step": 2793, "epoch": 33} {"train_loss": -16.18510627746582, "global_step": 2794, "epoch": 33} {"train_loss": -16.22003936767578, "global_step": 2795, "epoch": 33} {"train_loss": -16.546585083007812, "global_step": 2796, "epoch": 33} {"train_loss": -16.352237701416016, "global_step": 2797, "epoch": 33} {"train_loss": -16.346527099609375, "global_step": 2798, "epoch": 33} {"train_loss": -16.638870239257812, "global_step": 2799, "epoch": 33} {"train_loss": -16.529399871826172, "global_step": 2800, "epoch": 33} {"train_loss": -16.151758193969727, "global_step": 2801, "epoch": 33} {"train_loss": -16.2585506439209, "global_step": 2802, "epoch": 33} {"train_loss": -16.36336326599121, "global_step": 2803, "epoch": 33} {"train_loss": -15.958539009094238, "global_step": 2804, "epoch": 33} {"train_loss": -16.391803741455078, "global_step": 2805, "epoch": 33} {"train_loss": -16.40471076965332, "global_step": 2806, "epoch": 33} {"train_loss": -16.44257164001465, "global_step": 2807, "epoch": 33} {"train_loss": -16.4462833404541, "global_step": 2808, "epoch": 33} {"train_loss": -16.081268310546875, "global_step": 2809, "epoch": 33} {"train_loss": -16.500537872314453, "global_step": 2810, "epoch": 33} {"train_loss": -16.511001586914062, "global_step": 2811, "epoch": 33} {"train_loss": -16.389524459838867, "global_step": 2812, "epoch": 33} {"train_loss": -16.4599552154541, "global_step": 2813, "epoch": 33} {"train_loss": -15.9994478225708, "global_step": 2814, "epoch": 33} {"train_loss": -15.697176933288574, "global_step": 2815, "epoch": 33} {"train_loss": -16.09592056274414, "global_step": 2816, "epoch": 33} {"train_loss": -16.263174057006836, "global_step": 2817, "epoch": 33} {"train_loss": -16.159061431884766, "global_step": 2818, "epoch": 33} {"train_loss": -16.469160079956055, "global_step": 2819, "epoch": 33} {"train_loss": -16.078983306884766, "global_step": 2820, "epoch": 33} {"train_loss": -16.247598900852434, "global_step": 2821, "epoch": 33, "val_loss": 7308602.0} {"train_loss": -16.289932250976562, "global_step": 2822, "epoch": 34} {"train_loss": -16.443246841430664, "global_step": 2823, "epoch": 34} {"train_loss": -16.329954147338867, "global_step": 2824, "epoch": 34} {"train_loss": -16.500646591186523, "global_step": 2825, "epoch": 34} {"train_loss": -15.960413932800293, "global_step": 2826, "epoch": 34} {"train_loss": -16.62383270263672, "global_step": 2827, "epoch": 34} {"train_loss": -16.004291534423828, "global_step": 2828, "epoch": 34} {"train_loss": -15.827964782714844, "global_step": 2829, "epoch": 34} {"train_loss": -16.355131149291992, "global_step": 2830, "epoch": 34} {"train_loss": -15.70493221282959, "global_step": 2831, "epoch": 34} {"train_loss": -15.9721040725708, "global_step": 2832, "epoch": 34} {"train_loss": -16.345535278320312, "global_step": 2833, "epoch": 34} {"train_loss": -16.742416381835938, "global_step": 2834, "epoch": 34} {"train_loss": -16.43799591064453, "global_step": 2835, "epoch": 34} {"train_loss": -16.266101837158203, "global_step": 2836, "epoch": 34} {"train_loss": -15.995251655578613, "global_step": 2837, "epoch": 34} {"train_loss": -16.2283878326416, "global_step": 2838, "epoch": 34} {"train_loss": -16.35177993774414, "global_step": 2839, "epoch": 34} {"train_loss": -16.37370491027832, "global_step": 2840, "epoch": 34} {"train_loss": -16.298988342285156, "global_step": 2841, "epoch": 34} {"train_loss": -16.419103622436523, "global_step": 2842, "epoch": 34} {"train_loss": -16.327688217163086, "global_step": 2843, "epoch": 34} {"train_loss": -16.37653923034668, "global_step": 2844, "epoch": 34} {"train_loss": -16.4623966217041, "global_step": 2845, "epoch": 34} {"train_loss": -16.372982025146484, "global_step": 2846, "epoch": 34} {"train_loss": -16.487594604492188, "global_step": 2847, "epoch": 34} {"train_loss": -15.676658630371094, "global_step": 2848, "epoch": 34} {"train_loss": -16.150320053100586, "global_step": 2849, "epoch": 34} {"train_loss": -16.637346267700195, "global_step": 2850, "epoch": 34} {"train_loss": -16.19435691833496, "global_step": 2851, "epoch": 34} {"train_loss": -16.453763961791992, "global_step": 2852, "epoch": 34} {"train_loss": -16.188114166259766, "global_step": 2853, "epoch": 34} {"train_loss": -16.355802536010742, "global_step": 2854, "epoch": 34} {"train_loss": -16.164552688598633, "global_step": 2855, "epoch": 34} {"train_loss": -16.106109619140625, "global_step": 2856, "epoch": 34} {"train_loss": -16.119970321655273, "global_step": 2857, "epoch": 34} {"train_loss": -16.043869018554688, "global_step": 2858, "epoch": 34} {"train_loss": -16.115110397338867, "global_step": 2859, "epoch": 34} {"train_loss": -16.045305252075195, "global_step": 2860, "epoch": 34} {"train_loss": -16.326202392578125, "global_step": 2861, "epoch": 34} {"train_loss": -16.425580978393555, "global_step": 2862, "epoch": 34} {"train_loss": -16.331298828125, "global_step": 2863, "epoch": 34} {"train_loss": -16.325204849243164, "global_step": 2864, "epoch": 34} {"train_loss": -16.32284164428711, "global_step": 2865, "epoch": 34} {"train_loss": -15.888153076171875, "global_step": 2866, "epoch": 34} {"train_loss": -16.47832679748535, "global_step": 2867, "epoch": 34} {"train_loss": -16.51542091369629, "global_step": 2868, "epoch": 34} {"train_loss": -16.636154174804688, "global_step": 2869, "epoch": 34} {"train_loss": -16.250091552734375, "global_step": 2870, "epoch": 34} {"train_loss": -16.586584091186523, "global_step": 2871, "epoch": 34} {"train_loss": -16.776443481445312, "global_step": 2872, "epoch": 34} {"train_loss": -16.479726791381836, "global_step": 2873, "epoch": 34} {"train_loss": -16.166481018066406, "global_step": 2874, "epoch": 34} {"train_loss": -16.5300235748291, "global_step": 2875, "epoch": 34} {"train_loss": -16.42181968688965, "global_step": 2876, "epoch": 34} {"train_loss": -16.468124389648438, "global_step": 2877, "epoch": 34} {"train_loss": -15.997881889343262, "global_step": 2878, "epoch": 34} {"train_loss": -16.1651611328125, "global_step": 2879, "epoch": 34} {"train_loss": -16.081153869628906, "global_step": 2880, "epoch": 34} {"train_loss": -16.17225456237793, "global_step": 2881, "epoch": 34} {"train_loss": -16.085859298706055, "global_step": 2882, "epoch": 34} {"train_loss": -16.251920700073242, "global_step": 2883, "epoch": 34} {"train_loss": -16.303970336914062, "global_step": 2884, "epoch": 34} {"train_loss": -16.474729537963867, "global_step": 2885, "epoch": 34} {"train_loss": -16.099517822265625, "global_step": 2886, "epoch": 34} {"train_loss": -16.1867733001709, "global_step": 2887, "epoch": 34} {"train_loss": -16.625654220581055, "global_step": 2888, "epoch": 34} {"train_loss": -16.18366050720215, "global_step": 2889, "epoch": 34} {"train_loss": -16.537933349609375, "global_step": 2890, "epoch": 34} {"train_loss": -16.169153213500977, "global_step": 2891, "epoch": 34} {"train_loss": -16.570892333984375, "global_step": 2892, "epoch": 34} {"train_loss": -16.207975387573242, "global_step": 2893, "epoch": 34} {"train_loss": -16.209716796875, "global_step": 2894, "epoch": 34} {"train_loss": -16.494306564331055, "global_step": 2895, "epoch": 34} {"train_loss": -16.479238510131836, "global_step": 2896, "epoch": 34} {"train_loss": -16.27605438232422, "global_step": 2897, "epoch": 34} {"train_loss": -16.005874633789062, "global_step": 2898, "epoch": 34} {"train_loss": -16.497648239135742, "global_step": 2899, "epoch": 34} {"train_loss": -16.339223861694336, "global_step": 2900, "epoch": 34} {"train_loss": -16.228551864624023, "global_step": 2901, "epoch": 34} {"train_loss": -16.178699493408203, "global_step": 2902, "epoch": 34} {"train_loss": -16.333541870117188, "global_step": 2903, "epoch": 34} {"train_loss": -16.2871847382511, "global_step": 2904, "epoch": 34, "val_loss": 7474972.0} {"train_loss": -15.550353050231934, "global_step": 2905, "epoch": 35} {"train_loss": -15.825393676757812, "global_step": 2906, "epoch": 35} {"train_loss": -16.18621826171875, "global_step": 2907, "epoch": 35} {"train_loss": -16.229394912719727, "global_step": 2908, "epoch": 35} {"train_loss": -15.58923053741455, "global_step": 2909, "epoch": 35} {"train_loss": -16.064817428588867, "global_step": 2910, "epoch": 35} {"train_loss": -16.33951187133789, "global_step": 2911, "epoch": 35} {"train_loss": -16.329727172851562, "global_step": 2912, "epoch": 35} {"train_loss": -15.955443382263184, "global_step": 2913, "epoch": 35} {"train_loss": -16.84427261352539, "global_step": 2914, "epoch": 35} {"train_loss": -15.896585464477539, "global_step": 2915, "epoch": 35} {"train_loss": -16.436325073242188, "global_step": 2916, "epoch": 35} {"train_loss": -16.574228286743164, "global_step": 2917, "epoch": 35} {"train_loss": -16.04227638244629, "global_step": 2918, "epoch": 35} {"train_loss": -16.540538787841797, "global_step": 2919, "epoch": 35} {"train_loss": -16.538349151611328, "global_step": 2920, "epoch": 35} {"train_loss": -16.078725814819336, "global_step": 2921, "epoch": 35} {"train_loss": -16.581113815307617, "global_step": 2922, "epoch": 35} {"train_loss": -15.901214599609375, "global_step": 2923, "epoch": 35} {"train_loss": -16.481338500976562, "global_step": 2924, "epoch": 35} {"train_loss": -16.232070922851562, "global_step": 2925, "epoch": 35} {"train_loss": -16.318140029907227, "global_step": 2926, "epoch": 35} {"train_loss": -16.087438583374023, "global_step": 2927, "epoch": 35} {"train_loss": -16.370994567871094, "global_step": 2928, "epoch": 35} {"train_loss": -16.35451316833496, "global_step": 2929, "epoch": 35} {"train_loss": -16.347986221313477, "global_step": 2930, "epoch": 35} {"train_loss": -16.35717010498047, "global_step": 2931, "epoch": 35} {"train_loss": -16.18739128112793, "global_step": 2932, "epoch": 35} {"train_loss": -16.41167640686035, "global_step": 2933, "epoch": 35} {"train_loss": -16.3140869140625, "global_step": 2934, "epoch": 35} {"train_loss": -16.24615478515625, "global_step": 2935, "epoch": 35} {"train_loss": -16.24550437927246, "global_step": 2936, "epoch": 35} {"train_loss": -16.409936904907227, "global_step": 2937, "epoch": 35} {"train_loss": -15.879074096679688, "global_step": 2938, "epoch": 35} {"train_loss": -16.44826316833496, "global_step": 2939, "epoch": 35} {"train_loss": -16.123794555664062, "global_step": 2940, "epoch": 35} {"train_loss": -15.602310180664062, "global_step": 2941, "epoch": 35} {"train_loss": -16.33522605895996, "global_step": 2942, "epoch": 35} {"train_loss": -16.252714157104492, "global_step": 2943, "epoch": 35} {"train_loss": -16.62643051147461, "global_step": 2944, "epoch": 35} {"train_loss": -16.61539649963379, "global_step": 2945, "epoch": 35} {"train_loss": -16.182819366455078, "global_step": 2946, "epoch": 35} {"train_loss": -16.33255958557129, "global_step": 2947, "epoch": 35} {"train_loss": -16.407684326171875, "global_step": 2948, "epoch": 35} {"train_loss": -16.401052474975586, "global_step": 2949, "epoch": 35} {"train_loss": -16.44508171081543, "global_step": 2950, "epoch": 35} {"train_loss": -16.460866928100586, "global_step": 2951, "epoch": 35} {"train_loss": -16.283689498901367, "global_step": 2952, "epoch": 35} {"train_loss": -16.205677032470703, "global_step": 2953, "epoch": 35} {"train_loss": -16.362506866455078, "global_step": 2954, "epoch": 35} {"train_loss": -16.273452758789062, "global_step": 2955, "epoch": 35} {"train_loss": -16.40582275390625, "global_step": 2956, "epoch": 35} {"train_loss": -15.977442741394043, "global_step": 2957, "epoch": 35} {"train_loss": -16.06532859802246, "global_step": 2958, "epoch": 35} {"train_loss": -16.548608779907227, "global_step": 2959, "epoch": 35} {"train_loss": -16.098554611206055, "global_step": 2960, "epoch": 35} {"train_loss": -16.464609146118164, "global_step": 2961, "epoch": 35} {"train_loss": -16.50274085998535, "global_step": 2962, "epoch": 35} {"train_loss": -16.388399124145508, "global_step": 2963, "epoch": 35} {"train_loss": -16.15056800842285, "global_step": 2964, "epoch": 35} {"train_loss": -16.52051544189453, "global_step": 2965, "epoch": 35} {"train_loss": -16.134159088134766, "global_step": 2966, "epoch": 35} {"train_loss": -16.4012451171875, "global_step": 2967, "epoch": 35} {"train_loss": -16.089073181152344, "global_step": 2968, "epoch": 35} {"train_loss": -15.906720161437988, "global_step": 2969, "epoch": 35} {"train_loss": -16.460378646850586, "global_step": 2970, "epoch": 35} {"train_loss": -16.194869995117188, "global_step": 2971, "epoch": 35} {"train_loss": -16.4011173248291, "global_step": 2972, "epoch": 35} {"train_loss": -16.16217803955078, "global_step": 2973, "epoch": 35} {"train_loss": -16.374755859375, "global_step": 2974, "epoch": 35} {"train_loss": -16.50905418395996, "global_step": 2975, "epoch": 35} {"train_loss": -16.49979591369629, "global_step": 2976, "epoch": 35} {"train_loss": -16.016159057617188, "global_step": 2977, "epoch": 35} {"train_loss": -16.738828659057617, "global_step": 2978, "epoch": 35} {"train_loss": -16.473514556884766, "global_step": 2979, "epoch": 35} {"train_loss": -16.143949508666992, "global_step": 2980, "epoch": 35} {"train_loss": -16.424997329711914, "global_step": 2981, "epoch": 35} {"train_loss": -16.69809913635254, "global_step": 2982, "epoch": 35} {"train_loss": -16.13796615600586, "global_step": 2983, "epoch": 35} {"train_loss": -16.466754913330078, "global_step": 2984, "epoch": 35} {"train_loss": -16.575441360473633, "global_step": 2985, "epoch": 35} {"train_loss": -16.616683959960938, "global_step": 2986, "epoch": 35} {"train_loss": -16.294146491820555, "global_step": 2987, "epoch": 35, "val_loss": 7055652.0} {"train_loss": -16.437606811523438, "global_step": 2988, "epoch": 36} {"train_loss": -16.423263549804688, "global_step": 2989, "epoch": 36} {"train_loss": -16.143205642700195, "global_step": 2990, "epoch": 36} {"train_loss": -16.1926326751709, "global_step": 2991, "epoch": 36} {"train_loss": -16.145952224731445, "global_step": 2992, "epoch": 36} {"train_loss": -16.12639045715332, "global_step": 2993, "epoch": 36} {"train_loss": -15.900758743286133, "global_step": 2994, "epoch": 36} {"train_loss": -16.214075088500977, "global_step": 2995, "epoch": 36} {"train_loss": -16.58396339416504, "global_step": 2996, "epoch": 36} {"train_loss": -16.805221557617188, "global_step": 2997, "epoch": 36} {"train_loss": -16.008991241455078, "global_step": 2998, "epoch": 36} {"train_loss": -16.100675582885742, "global_step": 2999, "epoch": 36} {"train_loss": -16.231643676757812, "global_step": 3000, "epoch": 36} {"train_loss": -15.997833251953125, "global_step": 3001, "epoch": 36} {"train_loss": -16.336774826049805, "global_step": 3002, "epoch": 36} {"train_loss": -16.547637939453125, "global_step": 3003, "epoch": 36} {"train_loss": -16.480411529541016, "global_step": 3004, "epoch": 36} {"train_loss": -16.544307708740234, "global_step": 3005, "epoch": 36} {"train_loss": -16.45888328552246, "global_step": 3006, "epoch": 36} {"train_loss": -16.604368209838867, "global_step": 3007, "epoch": 36} {"train_loss": -16.76291847229004, "global_step": 3008, "epoch": 36} {"train_loss": -16.4942684173584, "global_step": 3009, "epoch": 36} {"train_loss": -16.81570053100586, "global_step": 3010, "epoch": 36} {"train_loss": -16.234939575195312, "global_step": 3011, "epoch": 36} {"train_loss": -15.982953071594238, "global_step": 3012, "epoch": 36} {"train_loss": -16.430578231811523, "global_step": 3013, "epoch": 36} {"train_loss": -16.619693756103516, "global_step": 3014, "epoch": 36} {"train_loss": -16.076501846313477, "global_step": 3015, "epoch": 36} {"train_loss": -16.533035278320312, "global_step": 3016, "epoch": 36} {"train_loss": -16.616376876831055, "global_step": 3017, "epoch": 36} {"train_loss": -16.428043365478516, "global_step": 3018, "epoch": 36} {"train_loss": -16.784976959228516, "global_step": 3019, "epoch": 36} {"train_loss": -16.215227127075195, "global_step": 3020, "epoch": 36} {"train_loss": -16.62885856628418, "global_step": 3021, "epoch": 36} {"train_loss": -16.132095336914062, "global_step": 3022, "epoch": 36} {"train_loss": -16.456979751586914, "global_step": 3023, "epoch": 36} {"train_loss": -16.414518356323242, "global_step": 3024, "epoch": 36} {"train_loss": -16.283733367919922, "global_step": 3025, "epoch": 36} {"train_loss": -16.735803604125977, "global_step": 3026, "epoch": 36} {"train_loss": -16.08112907409668, "global_step": 3027, "epoch": 36} {"train_loss": -16.253646850585938, "global_step": 3028, "epoch": 36} {"train_loss": -16.188955307006836, "global_step": 3029, "epoch": 36} {"train_loss": -16.043624877929688, "global_step": 3030, "epoch": 36} {"train_loss": -16.42447280883789, "global_step": 3031, "epoch": 36} {"train_loss": -16.51321029663086, "global_step": 3032, "epoch": 36} {"train_loss": -16.250511169433594, "global_step": 3033, "epoch": 36} {"train_loss": -16.002578735351562, "global_step": 3034, "epoch": 36} {"train_loss": -16.539356231689453, "global_step": 3035, "epoch": 36} {"train_loss": -16.35129737854004, "global_step": 3036, "epoch": 36} {"train_loss": -16.292755126953125, "global_step": 3037, "epoch": 36} {"train_loss": -16.60774803161621, "global_step": 3038, "epoch": 36} {"train_loss": -16.189958572387695, "global_step": 3039, "epoch": 36} {"train_loss": -16.195253372192383, "global_step": 3040, "epoch": 36} {"train_loss": -16.34189224243164, "global_step": 3041, "epoch": 36} {"train_loss": -16.663171768188477, "global_step": 3042, "epoch": 36} {"train_loss": -16.36326026916504, "global_step": 3043, "epoch": 36} {"train_loss": -16.15595054626465, "global_step": 3044, "epoch": 36} {"train_loss": -16.197336196899414, "global_step": 3045, "epoch": 36} {"train_loss": -16.364362716674805, "global_step": 3046, "epoch": 36} {"train_loss": -16.337732315063477, "global_step": 3047, "epoch": 36} {"train_loss": -16.207839965820312, "global_step": 3048, "epoch": 36} {"train_loss": -16.491846084594727, "global_step": 3049, "epoch": 36} {"train_loss": -16.226957321166992, "global_step": 3050, "epoch": 36} {"train_loss": -16.223388671875, "global_step": 3051, "epoch": 36} {"train_loss": -16.238494873046875, "global_step": 3052, "epoch": 36} {"train_loss": -16.32345962524414, "global_step": 3053, "epoch": 36} {"train_loss": -16.335412979125977, "global_step": 3054, "epoch": 36} {"train_loss": -16.302291870117188, "global_step": 3055, "epoch": 36} {"train_loss": -17.068620681762695, "global_step": 3056, "epoch": 36} {"train_loss": -16.639759063720703, "global_step": 3057, "epoch": 36} {"train_loss": -15.958813667297363, "global_step": 3058, "epoch": 36} {"train_loss": -16.31131935119629, "global_step": 3059, "epoch": 36} {"train_loss": -16.3254451751709, "global_step": 3060, "epoch": 36} {"train_loss": -16.165029525756836, "global_step": 3061, "epoch": 36} {"train_loss": -16.296667098999023, "global_step": 3062, "epoch": 36} {"train_loss": -16.154165267944336, "global_step": 3063, "epoch": 36} {"train_loss": -16.483983993530273, "global_step": 3064, "epoch": 36} {"train_loss": -16.811664581298828, "global_step": 3065, "epoch": 36} {"train_loss": -16.477737426757812, "global_step": 3066, "epoch": 36} {"train_loss": -16.54865074157715, "global_step": 3067, "epoch": 36} {"train_loss": -16.413305282592773, "global_step": 3068, "epoch": 36} {"train_loss": -16.445743560791016, "global_step": 3069, "epoch": 36} {"train_loss": -16.35114568687347, "global_step": 3070, "epoch": 36, "val_loss": 7400971.0} {"train_loss": -15.88419246673584, "global_step": 3071, "epoch": 37} {"train_loss": -15.842315673828125, "global_step": 3072, "epoch": 37} {"train_loss": -16.33807945251465, "global_step": 3073, "epoch": 37} {"train_loss": -16.302621841430664, "global_step": 3074, "epoch": 37} {"train_loss": -16.12592124938965, "global_step": 3075, "epoch": 37} {"train_loss": -15.934134483337402, "global_step": 3076, "epoch": 37} {"train_loss": -16.03112030029297, "global_step": 3077, "epoch": 37} {"train_loss": -16.272863388061523, "global_step": 3078, "epoch": 37} {"train_loss": -16.490209579467773, "global_step": 3079, "epoch": 37} {"train_loss": -16.42604637145996, "global_step": 3080, "epoch": 37} {"train_loss": -16.032983779907227, "global_step": 3081, "epoch": 37} {"train_loss": -16.5589656829834, "global_step": 3082, "epoch": 37} {"train_loss": -16.363784790039062, "global_step": 3083, "epoch": 37} {"train_loss": -16.249608993530273, "global_step": 3084, "epoch": 37} {"train_loss": -16.229490280151367, "global_step": 3085, "epoch": 37} {"train_loss": -16.43877601623535, "global_step": 3086, "epoch": 37} {"train_loss": -16.610754013061523, "global_step": 3087, "epoch": 37} {"train_loss": -16.05864715576172, "global_step": 3088, "epoch": 37} {"train_loss": -16.219018936157227, "global_step": 3089, "epoch": 37} {"train_loss": -16.209287643432617, "global_step": 3090, "epoch": 37} {"train_loss": -16.5007266998291, "global_step": 3091, "epoch": 37} {"train_loss": -16.16094398498535, "global_step": 3092, "epoch": 37} {"train_loss": -16.274580001831055, "global_step": 3093, "epoch": 37} {"train_loss": -16.253881454467773, "global_step": 3094, "epoch": 37} {"train_loss": -16.658374786376953, "global_step": 3095, "epoch": 37} {"train_loss": -16.061979293823242, "global_step": 3096, "epoch": 37} {"train_loss": -16.55231475830078, "global_step": 3097, "epoch": 37} {"train_loss": -16.33487892150879, "global_step": 3098, "epoch": 37} {"train_loss": -16.344100952148438, "global_step": 3099, "epoch": 37} {"train_loss": -15.9508695602417, "global_step": 3100, "epoch": 37} {"train_loss": -16.11349868774414, "global_step": 3101, "epoch": 37} {"train_loss": -16.760671615600586, "global_step": 3102, "epoch": 37} {"train_loss": -16.558616638183594, "global_step": 3103, "epoch": 37} {"train_loss": -16.50531005859375, "global_step": 3104, "epoch": 37} {"train_loss": -16.65301513671875, "global_step": 3105, "epoch": 37} {"train_loss": -16.524295806884766, "global_step": 3106, "epoch": 37} {"train_loss": -16.99542808532715, "global_step": 3107, "epoch": 37} {"train_loss": -16.635000228881836, "global_step": 3108, "epoch": 37} {"train_loss": -16.409793853759766, "global_step": 3109, "epoch": 37} {"train_loss": -15.985983848571777, "global_step": 3110, "epoch": 37} {"train_loss": -16.225339889526367, "global_step": 3111, "epoch": 37} {"train_loss": -16.056617736816406, "global_step": 3112, "epoch": 37} {"train_loss": -16.23883819580078, "global_step": 3113, "epoch": 37} {"train_loss": -16.208097457885742, "global_step": 3114, "epoch": 37} {"train_loss": -16.56682777404785, "global_step": 3115, "epoch": 37} {"train_loss": -16.45866584777832, "global_step": 3116, "epoch": 37} {"train_loss": -16.371564865112305, "global_step": 3117, "epoch": 37} {"train_loss": -16.53580665588379, "global_step": 3118, "epoch": 37} {"train_loss": -15.759970664978027, "global_step": 3119, "epoch": 37} {"train_loss": -16.396942138671875, "global_step": 3120, "epoch": 37} {"train_loss": -16.17195701599121, "global_step": 3121, "epoch": 37} {"train_loss": -16.232751846313477, "global_step": 3122, "epoch": 37} {"train_loss": -16.375730514526367, "global_step": 3123, "epoch": 37} {"train_loss": -16.50885581970215, "global_step": 3124, "epoch": 37} {"train_loss": -16.533496856689453, "global_step": 3125, "epoch": 37} {"train_loss": -16.432071685791016, "global_step": 3126, "epoch": 37} {"train_loss": -16.530668258666992, "global_step": 3127, "epoch": 37} {"train_loss": -16.642507553100586, "global_step": 3128, "epoch": 37} {"train_loss": -16.5349178314209, "global_step": 3129, "epoch": 37} {"train_loss": -16.47528648376465, "global_step": 3130, "epoch": 37} {"train_loss": -16.801311492919922, "global_step": 3131, "epoch": 37} {"train_loss": -15.942553520202637, "global_step": 3132, "epoch": 37} {"train_loss": -16.150707244873047, "global_step": 3133, "epoch": 37} {"train_loss": -16.561208724975586, "global_step": 3134, "epoch": 37} {"train_loss": -16.302703857421875, "global_step": 3135, "epoch": 37} {"train_loss": -16.40238380432129, "global_step": 3136, "epoch": 37} {"train_loss": -16.18477439880371, "global_step": 3137, "epoch": 37} {"train_loss": -16.392086029052734, "global_step": 3138, "epoch": 37} {"train_loss": -16.337032318115234, "global_step": 3139, "epoch": 37} {"train_loss": -16.541303634643555, "global_step": 3140, "epoch": 37} {"train_loss": -16.575334548950195, "global_step": 3141, "epoch": 37} {"train_loss": -16.706308364868164, "global_step": 3142, "epoch": 37} {"train_loss": -16.178258895874023, "global_step": 3143, "epoch": 37} {"train_loss": -16.415334701538086, "global_step": 3144, "epoch": 37} {"train_loss": -16.468765258789062, "global_step": 3145, "epoch": 37} {"train_loss": -16.126157760620117, "global_step": 3146, "epoch": 37} {"train_loss": -16.711467742919922, "global_step": 3147, "epoch": 37} {"train_loss": -16.3029842376709, "global_step": 3148, "epoch": 37} {"train_loss": -16.261831283569336, "global_step": 3149, "epoch": 37} {"train_loss": -16.255369186401367, "global_step": 3150, "epoch": 37} {"train_loss": -16.212629318237305, "global_step": 3151, "epoch": 37} {"train_loss": -16.212160110473633, "global_step": 3152, "epoch": 37} {"train_loss": -16.352086561271943, "global_step": 3153, "epoch": 37, "val_loss": 7253567.0} {"train_loss": -16.58810806274414, "global_step": 3154, "epoch": 38} {"train_loss": -15.930996894836426, "global_step": 3155, "epoch": 38} {"train_loss": -16.626310348510742, "global_step": 3156, "epoch": 38} {"train_loss": -16.47933006286621, "global_step": 3157, "epoch": 38} {"train_loss": -16.09578514099121, "global_step": 3158, "epoch": 38} {"train_loss": -16.687030792236328, "global_step": 3159, "epoch": 38} {"train_loss": -16.49909019470215, "global_step": 3160, "epoch": 38} {"train_loss": -16.376638412475586, "global_step": 3161, "epoch": 38} {"train_loss": -16.553640365600586, "global_step": 3162, "epoch": 38} {"train_loss": -16.464221954345703, "global_step": 3163, "epoch": 38} {"train_loss": -16.616256713867188, "global_step": 3164, "epoch": 38} {"train_loss": -16.314420700073242, "global_step": 3165, "epoch": 38} {"train_loss": -16.541305541992188, "global_step": 3166, "epoch": 38} {"train_loss": -16.52874755859375, "global_step": 3167, "epoch": 38} {"train_loss": -16.56631851196289, "global_step": 3168, "epoch": 38} {"train_loss": -16.354856491088867, "global_step": 3169, "epoch": 38} {"train_loss": -16.0664119720459, "global_step": 3170, "epoch": 38} {"train_loss": -16.33611488342285, "global_step": 3171, "epoch": 38} {"train_loss": -16.153339385986328, "global_step": 3172, "epoch": 38} {"train_loss": -16.14948081970215, "global_step": 3173, "epoch": 38} {"train_loss": -16.0716552734375, "global_step": 3174, "epoch": 38} {"train_loss": -16.596332550048828, "global_step": 3175, "epoch": 38} {"train_loss": -16.373884201049805, "global_step": 3176, "epoch": 38} {"train_loss": -16.558528900146484, "global_step": 3177, "epoch": 38} {"train_loss": -16.40059471130371, "global_step": 3178, "epoch": 38} {"train_loss": -16.206083297729492, "global_step": 3179, "epoch": 38} {"train_loss": -16.519241333007812, "global_step": 3180, "epoch": 38} {"train_loss": -15.979669570922852, "global_step": 3181, "epoch": 38} {"train_loss": -16.622299194335938, "global_step": 3182, "epoch": 38} {"train_loss": -16.450830459594727, "global_step": 3183, "epoch": 38} {"train_loss": -16.00051498413086, "global_step": 3184, "epoch": 38} {"train_loss": -16.259584426879883, "global_step": 3185, "epoch": 38} {"train_loss": -16.278064727783203, "global_step": 3186, "epoch": 38} {"train_loss": -16.820348739624023, "global_step": 3187, "epoch": 38} {"train_loss": -16.69109535217285, "global_step": 3188, "epoch": 38} {"train_loss": -16.126323699951172, "global_step": 3189, "epoch": 38} {"train_loss": -16.556028366088867, "global_step": 3190, "epoch": 38} {"train_loss": -16.780363082885742, "global_step": 3191, "epoch": 38} {"train_loss": -16.2446346282959, "global_step": 3192, "epoch": 38} {"train_loss": -15.90936279296875, "global_step": 3193, "epoch": 38} {"train_loss": -16.49281883239746, "global_step": 3194, "epoch": 38} {"train_loss": -16.24822425842285, "global_step": 3195, "epoch": 38} {"train_loss": -16.72006607055664, "global_step": 3196, "epoch": 38} {"train_loss": -16.212242126464844, "global_step": 3197, "epoch": 38} {"train_loss": -16.071020126342773, "global_step": 3198, "epoch": 38} {"train_loss": -16.237581253051758, "global_step": 3199, "epoch": 38} {"train_loss": -16.343847274780273, "global_step": 3200, "epoch": 38} {"train_loss": -16.3773136138916, "global_step": 3201, "epoch": 38} {"train_loss": -16.341886520385742, "global_step": 3202, "epoch": 38} {"train_loss": -16.396635055541992, "global_step": 3203, "epoch": 38} {"train_loss": -16.33645248413086, "global_step": 3204, "epoch": 38} {"train_loss": -16.679691314697266, "global_step": 3205, "epoch": 38} {"train_loss": -16.66129493713379, "global_step": 3206, "epoch": 38} {"train_loss": -16.074377059936523, "global_step": 3207, "epoch": 38} {"train_loss": -15.993759155273438, "global_step": 3208, "epoch": 38} {"train_loss": -16.472688674926758, "global_step": 3209, "epoch": 38} {"train_loss": -16.624235153198242, "global_step": 3210, "epoch": 38} {"train_loss": -16.387659072875977, "global_step": 3211, "epoch": 38} {"train_loss": -16.540090560913086, "global_step": 3212, "epoch": 38} {"train_loss": -16.3883113861084, "global_step": 3213, "epoch": 38} {"train_loss": -16.46803092956543, "global_step": 3214, "epoch": 38} {"train_loss": -16.460542678833008, "global_step": 3215, "epoch": 38} {"train_loss": -16.459339141845703, "global_step": 3216, "epoch": 38} {"train_loss": -16.45383644104004, "global_step": 3217, "epoch": 38} {"train_loss": -16.438135147094727, "global_step": 3218, "epoch": 38} {"train_loss": -16.334197998046875, "global_step": 3219, "epoch": 38} {"train_loss": -16.555356979370117, "global_step": 3220, "epoch": 38} {"train_loss": -16.280141830444336, "global_step": 3221, "epoch": 38} {"train_loss": -16.49962043762207, "global_step": 3222, "epoch": 38} {"train_loss": -16.31846809387207, "global_step": 3223, "epoch": 38} {"train_loss": -16.659353256225586, "global_step": 3224, "epoch": 38} {"train_loss": -16.182172775268555, "global_step": 3225, "epoch": 38} {"train_loss": -16.592666625976562, "global_step": 3226, "epoch": 38} {"train_loss": -15.938504219055176, "global_step": 3227, "epoch": 38} {"train_loss": -16.389753341674805, "global_step": 3228, "epoch": 38} {"train_loss": -16.357484817504883, "global_step": 3229, "epoch": 38} {"train_loss": -16.37958335876465, "global_step": 3230, "epoch": 38} {"train_loss": -16.57728385925293, "global_step": 3231, "epoch": 38} {"train_loss": -16.39413833618164, "global_step": 3232, "epoch": 38} {"train_loss": -16.43334197998047, "global_step": 3233, "epoch": 38} {"train_loss": -16.656949996948242, "global_step": 3234, "epoch": 38} {"train_loss": -16.335660934448242, "global_step": 3235, "epoch": 38} {"train_loss": -16.37027025797281, "global_step": 3236, "epoch": 38, "val_loss": 7192798.0} {"train_loss": -16.178407669067383, "global_step": 3237, "epoch": 39} {"train_loss": -16.259321212768555, "global_step": 3238, "epoch": 39} {"train_loss": -15.872794151306152, "global_step": 3239, "epoch": 39} {"train_loss": -16.136581420898438, "global_step": 3240, "epoch": 39} {"train_loss": -16.554428100585938, "global_step": 3241, "epoch": 39} {"train_loss": -16.51651954650879, "global_step": 3242, "epoch": 39} {"train_loss": -16.094013214111328, "global_step": 3243, "epoch": 39} {"train_loss": -16.068037033081055, "global_step": 3244, "epoch": 39} {"train_loss": -16.462345123291016, "global_step": 3245, "epoch": 39} {"train_loss": -16.46834373474121, "global_step": 3246, "epoch": 39} {"train_loss": -16.383991241455078, "global_step": 3247, "epoch": 39} {"train_loss": -16.335254669189453, "global_step": 3248, "epoch": 39} {"train_loss": -16.80055809020996, "global_step": 3249, "epoch": 39} {"train_loss": -16.166818618774414, "global_step": 3250, "epoch": 39} {"train_loss": -16.34177589416504, "global_step": 3251, "epoch": 39} {"train_loss": -16.560544967651367, "global_step": 3252, "epoch": 39} {"train_loss": -16.216075897216797, "global_step": 3253, "epoch": 39} {"train_loss": -16.51136016845703, "global_step": 3254, "epoch": 39} {"train_loss": -16.124439239501953, "global_step": 3255, "epoch": 39} {"train_loss": -16.212736129760742, "global_step": 3256, "epoch": 39} {"train_loss": -16.477155685424805, "global_step": 3257, "epoch": 39} {"train_loss": -16.088586807250977, "global_step": 3258, "epoch": 39} {"train_loss": -16.311765670776367, "global_step": 3259, "epoch": 39} {"train_loss": -16.301612854003906, "global_step": 3260, "epoch": 39} {"train_loss": -15.877867698669434, "global_step": 3261, "epoch": 39} {"train_loss": -16.972631454467773, "global_step": 3262, "epoch": 39} {"train_loss": -16.34011459350586, "global_step": 3263, "epoch": 39} {"train_loss": -16.076993942260742, "global_step": 3264, "epoch": 39} {"train_loss": -16.297683715820312, "global_step": 3265, "epoch": 39} {"train_loss": -16.47074317932129, "global_step": 3266, "epoch": 39} {"train_loss": -16.07421112060547, "global_step": 3267, "epoch": 39} {"train_loss": -16.30030632019043, "global_step": 3268, "epoch": 39} {"train_loss": -16.391773223876953, "global_step": 3269, "epoch": 39} {"train_loss": -16.45210075378418, "global_step": 3270, "epoch": 39} {"train_loss": -16.464645385742188, "global_step": 3271, "epoch": 39} {"train_loss": -16.563026428222656, "global_step": 3272, "epoch": 39} {"train_loss": -16.50361442565918, "global_step": 3273, "epoch": 39} {"train_loss": -16.730148315429688, "global_step": 3274, "epoch": 39} {"train_loss": -16.79364013671875, "global_step": 3275, "epoch": 39} {"train_loss": -16.392093658447266, "global_step": 3276, "epoch": 39} {"train_loss": -16.142776489257812, "global_step": 3277, "epoch": 39} {"train_loss": -16.32517433166504, "global_step": 3278, "epoch": 39} {"train_loss": -16.463422775268555, "global_step": 3279, "epoch": 39} {"train_loss": -16.46126365661621, "global_step": 3280, "epoch": 39} {"train_loss": -16.49466896057129, "global_step": 3281, "epoch": 39} {"train_loss": -16.67362403869629, "global_step": 3282, "epoch": 39} {"train_loss": -16.396268844604492, "global_step": 3283, "epoch": 39} {"train_loss": -16.432849884033203, "global_step": 3284, "epoch": 39} {"train_loss": -16.511899948120117, "global_step": 3285, "epoch": 39} {"train_loss": -15.904887199401855, "global_step": 3286, "epoch": 39} {"train_loss": -16.06879234313965, "global_step": 3287, "epoch": 39} {"train_loss": -16.657751083374023, "global_step": 3288, "epoch": 39} {"train_loss": -16.40732765197754, "global_step": 3289, "epoch": 39} {"train_loss": -16.704914093017578, "global_step": 3290, "epoch": 39} {"train_loss": -16.52181053161621, "global_step": 3291, "epoch": 39} {"train_loss": -16.252185821533203, "global_step": 3292, "epoch": 39} {"train_loss": -16.039037704467773, "global_step": 3293, "epoch": 39} {"train_loss": -16.093185424804688, "global_step": 3294, "epoch": 39} {"train_loss": -16.860462188720703, "global_step": 3295, "epoch": 39} {"train_loss": -16.497055053710938, "global_step": 3296, "epoch": 39} {"train_loss": -16.587682723999023, "global_step": 3297, "epoch": 39} {"train_loss": -16.18483543395996, "global_step": 3298, "epoch": 39} {"train_loss": -15.891717910766602, "global_step": 3299, "epoch": 39} {"train_loss": -16.39706802368164, "global_step": 3300, "epoch": 39} {"train_loss": -16.407207489013672, "global_step": 3301, "epoch": 39} {"train_loss": -16.312387466430664, "global_step": 3302, "epoch": 39} {"train_loss": -16.668973922729492, "global_step": 3303, "epoch": 39} {"train_loss": -16.37477684020996, "global_step": 3304, "epoch": 39} {"train_loss": -16.775245666503906, "global_step": 3305, "epoch": 39} {"train_loss": -16.131093978881836, "global_step": 3306, "epoch": 39} {"train_loss": -16.702627182006836, "global_step": 3307, "epoch": 39} {"train_loss": -16.303518295288086, "global_step": 3308, "epoch": 39} {"train_loss": -16.653284072875977, "global_step": 3309, "epoch": 39} {"train_loss": -16.09157943725586, "global_step": 3310, "epoch": 39} {"train_loss": -16.530960083007812, "global_step": 3311, "epoch": 39} {"train_loss": -16.516706466674805, "global_step": 3312, "epoch": 39} {"train_loss": -16.724117279052734, "global_step": 3313, "epoch": 39} {"train_loss": -16.975797653198242, "global_step": 3314, "epoch": 39} {"train_loss": -16.2203311920166, "global_step": 3315, "epoch": 39} {"train_loss": -16.623870849609375, "global_step": 3316, "epoch": 39} {"train_loss": -16.411401748657227, "global_step": 3317, "epoch": 39} {"train_loss": -16.537668228149414, "global_step": 3318, "epoch": 39} {"train_loss": -16.385154712631042, "global_step": 3319, "epoch": 39, "val_loss": 7059949.0} {"train_loss": -16.36598777770996, "global_step": 3320, "epoch": 40} {"train_loss": -16.187742233276367, "global_step": 3321, "epoch": 40} {"train_loss": -16.88287353515625, "global_step": 3322, "epoch": 40} {"train_loss": -16.616954803466797, "global_step": 3323, "epoch": 40} {"train_loss": -16.20121192932129, "global_step": 3324, "epoch": 40} {"train_loss": -16.25605583190918, "global_step": 3325, "epoch": 40} {"train_loss": -16.020360946655273, "global_step": 3326, "epoch": 40} {"train_loss": -16.51682472229004, "global_step": 3327, "epoch": 40} {"train_loss": -16.39125633239746, "global_step": 3328, "epoch": 40} {"train_loss": -16.61492919921875, "global_step": 3329, "epoch": 40} {"train_loss": -16.276472091674805, "global_step": 3330, "epoch": 40} {"train_loss": -16.875473022460938, "global_step": 3331, "epoch": 40} {"train_loss": -16.7032413482666, "global_step": 3332, "epoch": 40} {"train_loss": -16.356504440307617, "global_step": 3333, "epoch": 40} {"train_loss": -16.63034439086914, "global_step": 3334, "epoch": 40} {"train_loss": -16.60772132873535, "global_step": 3335, "epoch": 40} {"train_loss": -16.383472442626953, "global_step": 3336, "epoch": 40} {"train_loss": -16.4610595703125, "global_step": 3337, "epoch": 40} {"train_loss": -16.535512924194336, "global_step": 3338, "epoch": 40} {"train_loss": -16.385120391845703, "global_step": 3339, "epoch": 40} {"train_loss": -16.404905319213867, "global_step": 3340, "epoch": 40} {"train_loss": -16.402015686035156, "global_step": 3341, "epoch": 40} {"train_loss": -16.230209350585938, "global_step": 3342, "epoch": 40} {"train_loss": -16.382152557373047, "global_step": 3343, "epoch": 40} {"train_loss": -16.373350143432617, "global_step": 3344, "epoch": 40} {"train_loss": -16.580509185791016, "global_step": 3345, "epoch": 40} {"train_loss": -16.53889274597168, "global_step": 3346, "epoch": 40} {"train_loss": -16.241321563720703, "global_step": 3347, "epoch": 40} {"train_loss": -16.972055435180664, "global_step": 3348, "epoch": 40} {"train_loss": -16.648462295532227, "global_step": 3349, "epoch": 40} {"train_loss": -16.553075790405273, "global_step": 3350, "epoch": 40} {"train_loss": -16.400510787963867, "global_step": 3351, "epoch": 40} {"train_loss": -16.345884323120117, "global_step": 3352, "epoch": 40} {"train_loss": -16.78660774230957, "global_step": 3353, "epoch": 40} {"train_loss": -15.991435050964355, "global_step": 3354, "epoch": 40} {"train_loss": -16.479970932006836, "global_step": 3355, "epoch": 40} {"train_loss": -16.598129272460938, "global_step": 3356, "epoch": 40} {"train_loss": -16.246000289916992, "global_step": 3357, "epoch": 40} {"train_loss": -16.593978881835938, "global_step": 3358, "epoch": 40} {"train_loss": -16.29136085510254, "global_step": 3359, "epoch": 40} {"train_loss": -16.47319984436035, "global_step": 3360, "epoch": 40} {"train_loss": -16.167301177978516, "global_step": 3361, "epoch": 40} {"train_loss": -16.834043502807617, "global_step": 3362, "epoch": 40} {"train_loss": -16.169357299804688, "global_step": 3363, "epoch": 40} {"train_loss": -16.49650001525879, "global_step": 3364, "epoch": 40} {"train_loss": -16.30535125732422, "global_step": 3365, "epoch": 40} {"train_loss": -16.09115219116211, "global_step": 3366, "epoch": 40} {"train_loss": -16.198408126831055, "global_step": 3367, "epoch": 40} {"train_loss": -16.528528213500977, "global_step": 3368, "epoch": 40} {"train_loss": -16.442106246948242, "global_step": 3369, "epoch": 40} {"train_loss": -16.873779296875, "global_step": 3370, "epoch": 40} {"train_loss": -16.485280990600586, "global_step": 3371, "epoch": 40} {"train_loss": -16.334152221679688, "global_step": 3372, "epoch": 40} {"train_loss": -16.67535972595215, "global_step": 3373, "epoch": 40} {"train_loss": -16.533143997192383, "global_step": 3374, "epoch": 40} {"train_loss": -16.829256057739258, "global_step": 3375, "epoch": 40} {"train_loss": -16.36081886291504, "global_step": 3376, "epoch": 40} {"train_loss": -16.454145431518555, "global_step": 3377, "epoch": 40} {"train_loss": -16.629432678222656, "global_step": 3378, "epoch": 40} {"train_loss": -15.995051383972168, "global_step": 3379, "epoch": 40} {"train_loss": -16.524526596069336, "global_step": 3380, "epoch": 40} {"train_loss": -16.353864669799805, "global_step": 3381, "epoch": 40} {"train_loss": -16.87102508544922, "global_step": 3382, "epoch": 40} {"train_loss": -16.559415817260742, "global_step": 3383, "epoch": 40} {"train_loss": -16.653127670288086, "global_step": 3384, "epoch": 40} {"train_loss": -16.556055068969727, "global_step": 3385, "epoch": 40} {"train_loss": -16.394052505493164, "global_step": 3386, "epoch": 40} {"train_loss": -16.481687545776367, "global_step": 3387, "epoch": 40} {"train_loss": -16.424158096313477, "global_step": 3388, "epoch": 40} {"train_loss": -16.56219482421875, "global_step": 3389, "epoch": 40} {"train_loss": -16.246490478515625, "global_step": 3390, "epoch": 40} {"train_loss": -16.4072208404541, "global_step": 3391, "epoch": 40} {"train_loss": -16.26932144165039, "global_step": 3392, "epoch": 40} {"train_loss": -16.294824600219727, "global_step": 3393, "epoch": 40} {"train_loss": -16.248945236206055, "global_step": 3394, "epoch": 40} {"train_loss": -16.482486724853516, "global_step": 3395, "epoch": 40} {"train_loss": -16.668054580688477, "global_step": 3396, "epoch": 40} {"train_loss": -16.255857467651367, "global_step": 3397, "epoch": 40} {"train_loss": -16.340320587158203, "global_step": 3398, "epoch": 40} {"train_loss": -16.79136085510254, "global_step": 3399, "epoch": 40} {"train_loss": -16.603435516357422, "global_step": 3400, "epoch": 40} {"train_loss": -16.312057495117188, "global_step": 3401, "epoch": 40} {"train_loss": -16.464395775852434, "global_step": 3402, "epoch": 40, "val_loss": 7103615.5} {"train_loss": -16.385438919067383, "global_step": 3403, "epoch": 41} {"train_loss": -16.448209762573242, "global_step": 3404, "epoch": 41} {"train_loss": -16.44028091430664, "global_step": 3405, "epoch": 41} {"train_loss": -16.7359561920166, "global_step": 3406, "epoch": 41} {"train_loss": -16.29876708984375, "global_step": 3407, "epoch": 41} {"train_loss": -16.32196044921875, "global_step": 3408, "epoch": 41} {"train_loss": -16.49711799621582, "global_step": 3409, "epoch": 41} {"train_loss": -16.32880973815918, "global_step": 3410, "epoch": 41} {"train_loss": -16.040678024291992, "global_step": 3411, "epoch": 41} {"train_loss": -16.11528205871582, "global_step": 3412, "epoch": 41} {"train_loss": -16.383901596069336, "global_step": 3413, "epoch": 41} {"train_loss": -16.380178451538086, "global_step": 3414, "epoch": 41} {"train_loss": -16.182783126831055, "global_step": 3415, "epoch": 41} {"train_loss": -16.71980094909668, "global_step": 3416, "epoch": 41} {"train_loss": -16.318777084350586, "global_step": 3417, "epoch": 41} {"train_loss": -16.565053939819336, "global_step": 3418, "epoch": 41} {"train_loss": -16.774917602539062, "global_step": 3419, "epoch": 41} {"train_loss": -16.260339736938477, "global_step": 3420, "epoch": 41} {"train_loss": -16.210689544677734, "global_step": 3421, "epoch": 41} {"train_loss": -16.0757999420166, "global_step": 3422, "epoch": 41} {"train_loss": -16.108102798461914, "global_step": 3423, "epoch": 41} {"train_loss": -16.239099502563477, "global_step": 3424, "epoch": 41} {"train_loss": -16.481674194335938, "global_step": 3425, "epoch": 41} {"train_loss": -16.271867752075195, "global_step": 3426, "epoch": 41} {"train_loss": -16.12641716003418, "global_step": 3427, "epoch": 41} {"train_loss": -16.677261352539062, "global_step": 3428, "epoch": 41} {"train_loss": -16.45954704284668, "global_step": 3429, "epoch": 41} {"train_loss": -16.546689987182617, "global_step": 3430, "epoch": 41} {"train_loss": -16.354215621948242, "global_step": 3431, "epoch": 41} {"train_loss": -16.473508834838867, "global_step": 3432, "epoch": 41} {"train_loss": -16.491226196289062, "global_step": 3433, "epoch": 41} {"train_loss": -16.94503402709961, "global_step": 3434, "epoch": 41} {"train_loss": -16.276142120361328, "global_step": 3435, "epoch": 41} {"train_loss": -16.04837417602539, "global_step": 3436, "epoch": 41} {"train_loss": -16.49725914001465, "global_step": 3437, "epoch": 41} {"train_loss": -16.390085220336914, "global_step": 3438, "epoch": 41} {"train_loss": -16.71700096130371, "global_step": 3439, "epoch": 41} {"train_loss": -16.2834529876709, "global_step": 3440, "epoch": 41} {"train_loss": -16.62279510498047, "global_step": 3441, "epoch": 41} {"train_loss": -16.69538688659668, "global_step": 3442, "epoch": 41} {"train_loss": -16.621450424194336, "global_step": 3443, "epoch": 41} {"train_loss": -16.041486740112305, "global_step": 3444, "epoch": 41} {"train_loss": -16.57045555114746, "global_step": 3445, "epoch": 41} {"train_loss": -16.722524642944336, "global_step": 3446, "epoch": 41} {"train_loss": -16.779333114624023, "global_step": 3447, "epoch": 41} {"train_loss": -16.4139347076416, "global_step": 3448, "epoch": 41} {"train_loss": -16.338973999023438, "global_step": 3449, "epoch": 41} {"train_loss": -16.503189086914062, "global_step": 3450, "epoch": 41} {"train_loss": -16.946176528930664, "global_step": 3451, "epoch": 41} {"train_loss": -16.711441040039062, "global_step": 3452, "epoch": 41} {"train_loss": -16.40004539489746, "global_step": 3453, "epoch": 41} {"train_loss": -16.40079689025879, "global_step": 3454, "epoch": 41} {"train_loss": -16.357791900634766, "global_step": 3455, "epoch": 41} {"train_loss": -16.880582809448242, "global_step": 3456, "epoch": 41} {"train_loss": -16.468887329101562, "global_step": 3457, "epoch": 41} {"train_loss": -16.337465286254883, "global_step": 3458, "epoch": 41} {"train_loss": -16.804410934448242, "global_step": 3459, "epoch": 41} {"train_loss": -16.318822860717773, "global_step": 3460, "epoch": 41} {"train_loss": -16.54322624206543, "global_step": 3461, "epoch": 41} {"train_loss": -16.158140182495117, "global_step": 3462, "epoch": 41} {"train_loss": -16.755910873413086, "global_step": 3463, "epoch": 41} {"train_loss": -16.885099411010742, "global_step": 3464, "epoch": 41} {"train_loss": -16.460844039916992, "global_step": 3465, "epoch": 41} {"train_loss": -16.54196548461914, "global_step": 3466, "epoch": 41} {"train_loss": -16.650983810424805, "global_step": 3467, "epoch": 41} {"train_loss": -16.4498348236084, "global_step": 3468, "epoch": 41} {"train_loss": -16.606531143188477, "global_step": 3469, "epoch": 41} {"train_loss": -16.71535301208496, "global_step": 3470, "epoch": 41} {"train_loss": -16.69188117980957, "global_step": 3471, "epoch": 41} {"train_loss": -16.494455337524414, "global_step": 3472, "epoch": 41} {"train_loss": -16.441648483276367, "global_step": 3473, "epoch": 41} {"train_loss": -16.51263427734375, "global_step": 3474, "epoch": 41} {"train_loss": -16.756656646728516, "global_step": 3475, "epoch": 41} {"train_loss": -16.629262924194336, "global_step": 3476, "epoch": 41} {"train_loss": -16.357919692993164, "global_step": 3477, "epoch": 41} {"train_loss": -16.841751098632812, "global_step": 3478, "epoch": 41} {"train_loss": -16.592344284057617, "global_step": 3479, "epoch": 41} {"train_loss": -16.858366012573242, "global_step": 3480, "epoch": 41} {"train_loss": -15.941339492797852, "global_step": 3481, "epoch": 41} {"train_loss": -16.64089012145996, "global_step": 3482, "epoch": 41} {"train_loss": -16.83321762084961, "global_step": 3483, "epoch": 41} {"train_loss": -16.3980770111084, "global_step": 3484, "epoch": 41} {"train_loss": -16.473927428923457, "global_step": 3485, "epoch": 41, "val_loss": 7233138.0} {"train_loss": -16.105710983276367, "global_step": 3486, "epoch": 42} {"train_loss": -16.551679611206055, "global_step": 3487, "epoch": 42} {"train_loss": -16.524564743041992, "global_step": 3488, "epoch": 42} {"train_loss": -16.43381690979004, "global_step": 3489, "epoch": 42} {"train_loss": -16.426794052124023, "global_step": 3490, "epoch": 42} {"train_loss": -16.321340560913086, "global_step": 3491, "epoch": 42} {"train_loss": -16.73423194885254, "global_step": 3492, "epoch": 42} {"train_loss": -16.336624145507812, "global_step": 3493, "epoch": 42} {"train_loss": -16.550018310546875, "global_step": 3494, "epoch": 42} {"train_loss": -16.172334671020508, "global_step": 3495, "epoch": 42} {"train_loss": -16.484786987304688, "global_step": 3496, "epoch": 42} {"train_loss": -16.491104125976562, "global_step": 3497, "epoch": 42} {"train_loss": -16.509429931640625, "global_step": 3498, "epoch": 42} {"train_loss": -16.723506927490234, "global_step": 3499, "epoch": 42} {"train_loss": -16.581457138061523, "global_step": 3500, "epoch": 42} {"train_loss": -16.468002319335938, "global_step": 3501, "epoch": 42} {"train_loss": -16.811634063720703, "global_step": 3502, "epoch": 42} {"train_loss": -16.948074340820312, "global_step": 3503, "epoch": 42} {"train_loss": -16.46335792541504, "global_step": 3504, "epoch": 42} {"train_loss": -16.4541015625, "global_step": 3505, "epoch": 42} {"train_loss": -16.582761764526367, "global_step": 3506, "epoch": 42} {"train_loss": -16.409637451171875, "global_step": 3507, "epoch": 42} {"train_loss": -16.68976593017578, "global_step": 3508, "epoch": 42} {"train_loss": -16.715450286865234, "global_step": 3509, "epoch": 42} {"train_loss": -16.41265296936035, "global_step": 3510, "epoch": 42} {"train_loss": -16.241806030273438, "global_step": 3511, "epoch": 42} {"train_loss": -16.426767349243164, "global_step": 3512, "epoch": 42} {"train_loss": -16.395538330078125, "global_step": 3513, "epoch": 42} {"train_loss": -16.355558395385742, "global_step": 3514, "epoch": 42} {"train_loss": -16.06144905090332, "global_step": 3515, "epoch": 42} {"train_loss": -16.233753204345703, "global_step": 3516, "epoch": 42} {"train_loss": -16.461971282958984, "global_step": 3517, "epoch": 42} {"train_loss": -16.08559226989746, "global_step": 3518, "epoch": 42} {"train_loss": -16.796926498413086, "global_step": 3519, "epoch": 42} {"train_loss": -16.396732330322266, "global_step": 3520, "epoch": 42} {"train_loss": -16.25839614868164, "global_step": 3521, "epoch": 42} {"train_loss": -17.02090072631836, "global_step": 3522, "epoch": 42} {"train_loss": -16.513151168823242, "global_step": 3523, "epoch": 42} {"train_loss": -16.430164337158203, "global_step": 3524, "epoch": 42} {"train_loss": -16.12275505065918, "global_step": 3525, "epoch": 42} {"train_loss": -16.515409469604492, "global_step": 3526, "epoch": 42} {"train_loss": -16.42104148864746, "global_step": 3527, "epoch": 42} {"train_loss": -16.846128463745117, "global_step": 3528, "epoch": 42} {"train_loss": -16.415021896362305, "global_step": 3529, "epoch": 42} {"train_loss": -16.404144287109375, "global_step": 3530, "epoch": 42} {"train_loss": -16.59161949157715, "global_step": 3531, "epoch": 42} {"train_loss": -16.66450309753418, "global_step": 3532, "epoch": 42} {"train_loss": -16.4526424407959, "global_step": 3533, "epoch": 42} {"train_loss": -16.850971221923828, "global_step": 3534, "epoch": 42} {"train_loss": -16.78065299987793, "global_step": 3535, "epoch": 42} {"train_loss": -16.31199836730957, "global_step": 3536, "epoch": 42} {"train_loss": -16.7276554107666, "global_step": 3537, "epoch": 42} {"train_loss": -16.552453994750977, "global_step": 3538, "epoch": 42} {"train_loss": -16.477062225341797, "global_step": 3539, "epoch": 42} {"train_loss": -16.705554962158203, "global_step": 3540, "epoch": 42} {"train_loss": -16.439163208007812, "global_step": 3541, "epoch": 42} {"train_loss": -16.603851318359375, "global_step": 3542, "epoch": 42} {"train_loss": -16.474212646484375, "global_step": 3543, "epoch": 42} {"train_loss": -16.510486602783203, "global_step": 3544, "epoch": 42} {"train_loss": -16.541704177856445, "global_step": 3545, "epoch": 42} {"train_loss": -16.537982940673828, "global_step": 3546, "epoch": 42} {"train_loss": -16.41037368774414, "global_step": 3547, "epoch": 42} {"train_loss": -16.090957641601562, "global_step": 3548, "epoch": 42} {"train_loss": -16.390106201171875, "global_step": 3549, "epoch": 42} {"train_loss": -16.71698570251465, "global_step": 3550, "epoch": 42} {"train_loss": -16.39496421813965, "global_step": 3551, "epoch": 42} {"train_loss": -16.579627990722656, "global_step": 3552, "epoch": 42} {"train_loss": -16.82451629638672, "global_step": 3553, "epoch": 42} {"train_loss": -15.806924819946289, "global_step": 3554, "epoch": 42} {"train_loss": -16.606292724609375, "global_step": 3555, "epoch": 42} {"train_loss": -16.506628036499023, "global_step": 3556, "epoch": 42} {"train_loss": -16.515695571899414, "global_step": 3557, "epoch": 42} {"train_loss": -16.787263870239258, "global_step": 3558, "epoch": 42} {"train_loss": -16.60279655456543, "global_step": 3559, "epoch": 42} {"train_loss": -17.091129302978516, "global_step": 3560, "epoch": 42} {"train_loss": -15.976633071899414, "global_step": 3561, "epoch": 42} {"train_loss": -16.63759422302246, "global_step": 3562, "epoch": 42} {"train_loss": -16.305557250976562, "global_step": 3563, "epoch": 42} {"train_loss": -16.476356506347656, "global_step": 3564, "epoch": 42} {"train_loss": -16.47101402282715, "global_step": 3565, "epoch": 42} {"train_loss": -16.627412796020508, "global_step": 3566, "epoch": 42} {"train_loss": -16.06612777709961, "global_step": 3567, "epoch": 42} {"train_loss": -16.49844668284956, "global_step": 3568, "epoch": 42, "val_loss": 7124595.5} {"train_loss": -16.38551902770996, "global_step": 3569, "epoch": 43} {"train_loss": -16.22848892211914, "global_step": 3570, "epoch": 43} {"train_loss": -16.564563751220703, "global_step": 3571, "epoch": 43} {"train_loss": -16.270156860351562, "global_step": 3572, "epoch": 43} {"train_loss": -16.519495010375977, "global_step": 3573, "epoch": 43} {"train_loss": -16.449644088745117, "global_step": 3574, "epoch": 43} {"train_loss": -16.58778953552246, "global_step": 3575, "epoch": 43} {"train_loss": -16.748563766479492, "global_step": 3576, "epoch": 43} {"train_loss": -16.000642776489258, "global_step": 3577, "epoch": 43} {"train_loss": -16.114303588867188, "global_step": 3578, "epoch": 43} {"train_loss": -16.20065689086914, "global_step": 3579, "epoch": 43} {"train_loss": -16.631376266479492, "global_step": 3580, "epoch": 43} {"train_loss": -16.538236618041992, "global_step": 3581, "epoch": 43} {"train_loss": -16.331207275390625, "global_step": 3582, "epoch": 43} {"train_loss": -16.616886138916016, "global_step": 3583, "epoch": 43} {"train_loss": -16.49039649963379, "global_step": 3584, "epoch": 43} {"train_loss": -16.720569610595703, "global_step": 3585, "epoch": 43} {"train_loss": -16.198265075683594, "global_step": 3586, "epoch": 43} {"train_loss": -16.350448608398438, "global_step": 3587, "epoch": 43} {"train_loss": -16.340551376342773, "global_step": 3588, "epoch": 43} {"train_loss": -16.161046981811523, "global_step": 3589, "epoch": 43} {"train_loss": -16.109968185424805, "global_step": 3590, "epoch": 43} {"train_loss": -16.462377548217773, "global_step": 3591, "epoch": 43} {"train_loss": -16.40110969543457, "global_step": 3592, "epoch": 43} {"train_loss": -16.29767417907715, "global_step": 3593, "epoch": 43} {"train_loss": -16.503549575805664, "global_step": 3594, "epoch": 43} {"train_loss": -16.748411178588867, "global_step": 3595, "epoch": 43} {"train_loss": -16.413223266601562, "global_step": 3596, "epoch": 43} {"train_loss": -16.397472381591797, "global_step": 3597, "epoch": 43} {"train_loss": -16.31011390686035, "global_step": 3598, "epoch": 43} {"train_loss": -16.319944381713867, "global_step": 3599, "epoch": 43} {"train_loss": -16.20181655883789, "global_step": 3600, "epoch": 43} {"train_loss": -16.551593780517578, "global_step": 3601, "epoch": 43} {"train_loss": -16.36861228942871, "global_step": 3602, "epoch": 43} {"train_loss": -16.542423248291016, "global_step": 3603, "epoch": 43} {"train_loss": -16.85886573791504, "global_step": 3604, "epoch": 43} {"train_loss": -16.0695858001709, "global_step": 3605, "epoch": 43} {"train_loss": -16.60135841369629, "global_step": 3606, "epoch": 43} {"train_loss": -16.627723693847656, "global_step": 3607, "epoch": 43} {"train_loss": -16.549036026000977, "global_step": 3608, "epoch": 43} {"train_loss": -16.55888557434082, "global_step": 3609, "epoch": 43} {"train_loss": -16.64780044555664, "global_step": 3610, "epoch": 43} {"train_loss": -16.394819259643555, "global_step": 3611, "epoch": 43} {"train_loss": -16.431127548217773, "global_step": 3612, "epoch": 43} {"train_loss": -16.547800064086914, "global_step": 3613, "epoch": 43} {"train_loss": -16.46063804626465, "global_step": 3614, "epoch": 43} {"train_loss": -16.34952735900879, "global_step": 3615, "epoch": 43} {"train_loss": -16.77155113220215, "global_step": 3616, "epoch": 43} {"train_loss": -16.63260269165039, "global_step": 3617, "epoch": 43} {"train_loss": -16.773155212402344, "global_step": 3618, "epoch": 43} {"train_loss": -16.59210777282715, "global_step": 3619, "epoch": 43} {"train_loss": -16.399986267089844, "global_step": 3620, "epoch": 43} {"train_loss": -16.363300323486328, "global_step": 3621, "epoch": 43} {"train_loss": -16.80265235900879, "global_step": 3622, "epoch": 43} {"train_loss": -16.44258689880371, "global_step": 3623, "epoch": 43} {"train_loss": -16.2496395111084, "global_step": 3624, "epoch": 43} {"train_loss": -16.66813850402832, "global_step": 3625, "epoch": 43} {"train_loss": -16.440080642700195, "global_step": 3626, "epoch": 43} {"train_loss": -16.34908103942871, "global_step": 3627, "epoch": 43} {"train_loss": -17.104124069213867, "global_step": 3628, "epoch": 43} {"train_loss": -16.85395050048828, "global_step": 3629, "epoch": 43} {"train_loss": -16.23630714416504, "global_step": 3630, "epoch": 43} {"train_loss": -16.376449584960938, "global_step": 3631, "epoch": 43} {"train_loss": -17.073043823242188, "global_step": 3632, "epoch": 43} {"train_loss": -16.526718139648438, "global_step": 3633, "epoch": 43} {"train_loss": -16.651172637939453, "global_step": 3634, "epoch": 43} {"train_loss": -16.57636070251465, "global_step": 3635, "epoch": 43} {"train_loss": -16.448776245117188, "global_step": 3636, "epoch": 43} {"train_loss": -16.642019271850586, "global_step": 3637, "epoch": 43} {"train_loss": -16.557052612304688, "global_step": 3638, "epoch": 43} {"train_loss": -16.76188087463379, "global_step": 3639, "epoch": 43} {"train_loss": -16.917896270751953, "global_step": 3640, "epoch": 43} {"train_loss": -16.603513717651367, "global_step": 3641, "epoch": 43} {"train_loss": -16.698026657104492, "global_step": 3642, "epoch": 43} {"train_loss": -16.60211181640625, "global_step": 3643, "epoch": 43} {"train_loss": -16.50917625427246, "global_step": 3644, "epoch": 43} {"train_loss": -16.991727828979492, "global_step": 3645, "epoch": 43} {"train_loss": -16.275676727294922, "global_step": 3646, "epoch": 43} {"train_loss": -16.68834686279297, "global_step": 3647, "epoch": 43} {"train_loss": -16.868850708007812, "global_step": 3648, "epoch": 43} {"train_loss": -17.123062133789062, "global_step": 3649, "epoch": 43} {"train_loss": -16.743183135986328, "global_step": 3650, "epoch": 43} {"train_loss": -16.507677376988422, "global_step": 3651, "epoch": 43, "val_loss": 7138807.0} {"train_loss": -16.177595138549805, "global_step": 3652, "epoch": 44} {"train_loss": -16.453279495239258, "global_step": 3653, "epoch": 44} {"train_loss": -16.004398345947266, "global_step": 3654, "epoch": 44} {"train_loss": -16.257549285888672, "global_step": 3655, "epoch": 44} {"train_loss": -16.70563316345215, "global_step": 3656, "epoch": 44} {"train_loss": -16.445852279663086, "global_step": 3657, "epoch": 44} {"train_loss": -16.718557357788086, "global_step": 3658, "epoch": 44} {"train_loss": -16.523096084594727, "global_step": 3659, "epoch": 44} {"train_loss": -16.664886474609375, "global_step": 3660, "epoch": 44} {"train_loss": -16.17373275756836, "global_step": 3661, "epoch": 44} {"train_loss": -16.76719856262207, "global_step": 3662, "epoch": 44} {"train_loss": -16.10202407836914, "global_step": 3663, "epoch": 44} {"train_loss": -16.244802474975586, "global_step": 3664, "epoch": 44} {"train_loss": -16.687129974365234, "global_step": 3665, "epoch": 44} {"train_loss": -16.31245994567871, "global_step": 3666, "epoch": 44} {"train_loss": -16.530508041381836, "global_step": 3667, "epoch": 44} {"train_loss": -16.536840438842773, "global_step": 3668, "epoch": 44} {"train_loss": -16.89931297302246, "global_step": 3669, "epoch": 44} {"train_loss": -16.51759147644043, "global_step": 3670, "epoch": 44} {"train_loss": -16.782224655151367, "global_step": 3671, "epoch": 44} {"train_loss": -16.401596069335938, "global_step": 3672, "epoch": 44} {"train_loss": -16.333646774291992, "global_step": 3673, "epoch": 44} {"train_loss": -16.804309844970703, "global_step": 3674, "epoch": 44} {"train_loss": -16.879907608032227, "global_step": 3675, "epoch": 44} {"train_loss": -16.481525421142578, "global_step": 3676, "epoch": 44} {"train_loss": -16.620622634887695, "global_step": 3677, "epoch": 44} {"train_loss": -16.600765228271484, "global_step": 3678, "epoch": 44} {"train_loss": -16.29671287536621, "global_step": 3679, "epoch": 44} {"train_loss": -16.788732528686523, "global_step": 3680, "epoch": 44} {"train_loss": -16.4149169921875, "global_step": 3681, "epoch": 44} {"train_loss": -16.293399810791016, "global_step": 3682, "epoch": 44} {"train_loss": -16.49185562133789, "global_step": 3683, "epoch": 44} {"train_loss": -16.324026107788086, "global_step": 3684, "epoch": 44} {"train_loss": -16.35207176208496, "global_step": 3685, "epoch": 44} {"train_loss": -16.569143295288086, "global_step": 3686, "epoch": 44} {"train_loss": -16.515348434448242, "global_step": 3687, "epoch": 44} {"train_loss": -16.3739070892334, "global_step": 3688, "epoch": 44} {"train_loss": -16.58487892150879, "global_step": 3689, "epoch": 44} {"train_loss": -16.398162841796875, "global_step": 3690, "epoch": 44} {"train_loss": -16.739965438842773, "global_step": 3691, "epoch": 44} {"train_loss": -16.71957778930664, "global_step": 3692, "epoch": 44} {"train_loss": -16.562509536743164, "global_step": 3693, "epoch": 44} {"train_loss": -16.84088134765625, "global_step": 3694, "epoch": 44} {"train_loss": -16.63214683532715, "global_step": 3695, "epoch": 44} {"train_loss": -17.018999099731445, "global_step": 3696, "epoch": 44} {"train_loss": -16.459171295166016, "global_step": 3697, "epoch": 44} {"train_loss": -16.63949966430664, "global_step": 3698, "epoch": 44} {"train_loss": -16.186948776245117, "global_step": 3699, "epoch": 44} {"train_loss": -16.675329208374023, "global_step": 3700, "epoch": 44} {"train_loss": -16.47829246520996, "global_step": 3701, "epoch": 44} {"train_loss": -16.461957931518555, "global_step": 3702, "epoch": 44} {"train_loss": -16.93684959411621, "global_step": 3703, "epoch": 44} {"train_loss": -16.2194881439209, "global_step": 3704, "epoch": 44} {"train_loss": -16.707284927368164, "global_step": 3705, "epoch": 44} {"train_loss": -16.190160751342773, "global_step": 3706, "epoch": 44} {"train_loss": -16.38558578491211, "global_step": 3707, "epoch": 44} {"train_loss": -16.6699161529541, "global_step": 3708, "epoch": 44} {"train_loss": -16.73227310180664, "global_step": 3709, "epoch": 44} {"train_loss": -16.480253219604492, "global_step": 3710, "epoch": 44} {"train_loss": -16.62067985534668, "global_step": 3711, "epoch": 44} {"train_loss": -16.98078727722168, "global_step": 3712, "epoch": 44} {"train_loss": -16.896760940551758, "global_step": 3713, "epoch": 44} {"train_loss": -16.497528076171875, "global_step": 3714, "epoch": 44} {"train_loss": -16.457639694213867, "global_step": 3715, "epoch": 44} {"train_loss": -16.58037757873535, "global_step": 3716, "epoch": 44} {"train_loss": -16.480005264282227, "global_step": 3717, "epoch": 44} {"train_loss": -16.70705223083496, "global_step": 3718, "epoch": 44} {"train_loss": -16.53944969177246, "global_step": 3719, "epoch": 44} {"train_loss": -16.662782669067383, "global_step": 3720, "epoch": 44} {"train_loss": -16.651987075805664, "global_step": 3721, "epoch": 44} {"train_loss": -16.42831802368164, "global_step": 3722, "epoch": 44} {"train_loss": -16.566085815429688, "global_step": 3723, "epoch": 44} {"train_loss": -16.761770248413086, "global_step": 3724, "epoch": 44} {"train_loss": -16.074926376342773, "global_step": 3725, "epoch": 44} {"train_loss": -16.678516387939453, "global_step": 3726, "epoch": 44} {"train_loss": -16.3420467376709, "global_step": 3727, "epoch": 44} {"train_loss": -16.259977340698242, "global_step": 3728, "epoch": 44} {"train_loss": -16.711591720581055, "global_step": 3729, "epoch": 44} {"train_loss": -16.468040466308594, "global_step": 3730, "epoch": 44} {"train_loss": -16.421369552612305, "global_step": 3731, "epoch": 44} {"train_loss": -16.771259307861328, "global_step": 3732, "epoch": 44} {"train_loss": -16.70050621032715, "global_step": 3733, "epoch": 44} {"train_loss": -16.536060517092785, "global_step": 3734, "epoch": 44, "val_loss": 6929137.0} {"train_loss": -16.67782974243164, "global_step": 3735, "epoch": 45} {"train_loss": -15.755705833435059, "global_step": 3736, "epoch": 45} {"train_loss": -16.386272430419922, "global_step": 3737, "epoch": 45} {"train_loss": -16.185035705566406, "global_step": 3738, "epoch": 45} {"train_loss": -16.750242233276367, "global_step": 3739, "epoch": 45} {"train_loss": -16.56292724609375, "global_step": 3740, "epoch": 45} {"train_loss": -16.02613639831543, "global_step": 3741, "epoch": 45} {"train_loss": -16.88430404663086, "global_step": 3742, "epoch": 45} {"train_loss": -16.640195846557617, "global_step": 3743, "epoch": 45} {"train_loss": -16.12890625, "global_step": 3744, "epoch": 45} {"train_loss": -16.183490753173828, "global_step": 3745, "epoch": 45} {"train_loss": -16.247346878051758, "global_step": 3746, "epoch": 45} {"train_loss": -16.418581008911133, "global_step": 3747, "epoch": 45} {"train_loss": -16.207700729370117, "global_step": 3748, "epoch": 45} {"train_loss": -16.579980850219727, "global_step": 3749, "epoch": 45} {"train_loss": -16.584741592407227, "global_step": 3750, "epoch": 45} {"train_loss": -16.07040786743164, "global_step": 3751, "epoch": 45} {"train_loss": -16.505542755126953, "global_step": 3752, "epoch": 45} {"train_loss": -16.4991397857666, "global_step": 3753, "epoch": 45} {"train_loss": -16.703500747680664, "global_step": 3754, "epoch": 45} {"train_loss": -16.21204376220703, "global_step": 3755, "epoch": 45} {"train_loss": -16.437353134155273, "global_step": 3756, "epoch": 45} {"train_loss": -16.429187774658203, "global_step": 3757, "epoch": 45} {"train_loss": -16.590436935424805, "global_step": 3758, "epoch": 45} {"train_loss": -16.666303634643555, "global_step": 3759, "epoch": 45} {"train_loss": -16.46626091003418, "global_step": 3760, "epoch": 45} {"train_loss": -16.43619155883789, "global_step": 3761, "epoch": 45} {"train_loss": -16.77349281311035, "global_step": 3762, "epoch": 45} {"train_loss": -16.742490768432617, "global_step": 3763, "epoch": 45} {"train_loss": -16.8313045501709, "global_step": 3764, "epoch": 45} {"train_loss": -16.880447387695312, "global_step": 3765, "epoch": 45} {"train_loss": -16.65114402770996, "global_step": 3766, "epoch": 45} {"train_loss": -16.471622467041016, "global_step": 3767, "epoch": 45} {"train_loss": -16.785078048706055, "global_step": 3768, "epoch": 45} {"train_loss": -16.424386978149414, "global_step": 3769, "epoch": 45} {"train_loss": -16.772329330444336, "global_step": 3770, "epoch": 45} {"train_loss": -16.778562545776367, "global_step": 3771, "epoch": 45} {"train_loss": -16.740360260009766, "global_step": 3772, "epoch": 45} {"train_loss": -16.372243881225586, "global_step": 3773, "epoch": 45} {"train_loss": -16.470277786254883, "global_step": 3774, "epoch": 45} {"train_loss": -16.46766471862793, "global_step": 3775, "epoch": 45} {"train_loss": -16.77262306213379, "global_step": 3776, "epoch": 45} {"train_loss": -16.599365234375, "global_step": 3777, "epoch": 45} {"train_loss": -16.68009376525879, "global_step": 3778, "epoch": 45} {"train_loss": -16.69673728942871, "global_step": 3779, "epoch": 45} {"train_loss": -16.52176284790039, "global_step": 3780, "epoch": 45} {"train_loss": -16.798789978027344, "global_step": 3781, "epoch": 45} {"train_loss": -16.3920955657959, "global_step": 3782, "epoch": 45} {"train_loss": -16.603574752807617, "global_step": 3783, "epoch": 45} {"train_loss": -16.62393569946289, "global_step": 3784, "epoch": 45} {"train_loss": -16.93768310546875, "global_step": 3785, "epoch": 45} {"train_loss": -16.61732292175293, "global_step": 3786, "epoch": 45} {"train_loss": -16.529800415039062, "global_step": 3787, "epoch": 45} {"train_loss": -16.88641929626465, "global_step": 3788, "epoch": 45} {"train_loss": -16.152137756347656, "global_step": 3789, "epoch": 45} {"train_loss": -16.425317764282227, "global_step": 3790, "epoch": 45} {"train_loss": -16.732587814331055, "global_step": 3791, "epoch": 45} {"train_loss": -16.859739303588867, "global_step": 3792, "epoch": 45} {"train_loss": -17.015178680419922, "global_step": 3793, "epoch": 45} {"train_loss": -16.580175399780273, "global_step": 3794, "epoch": 45} {"train_loss": -16.7998104095459, "global_step": 3795, "epoch": 45} {"train_loss": -16.753610610961914, "global_step": 3796, "epoch": 45} {"train_loss": -16.72865867614746, "global_step": 3797, "epoch": 45} {"train_loss": -16.6457462310791, "global_step": 3798, "epoch": 45} {"train_loss": -16.241769790649414, "global_step": 3799, "epoch": 45} {"train_loss": -16.70796012878418, "global_step": 3800, "epoch": 45} {"train_loss": -16.740026473999023, "global_step": 3801, "epoch": 45} {"train_loss": -16.76625633239746, "global_step": 3802, "epoch": 45} {"train_loss": -16.403470993041992, "global_step": 3803, "epoch": 45} {"train_loss": -16.436193466186523, "global_step": 3804, "epoch": 45} {"train_loss": -17.060209274291992, "global_step": 3805, "epoch": 45} {"train_loss": -16.744958877563477, "global_step": 3806, "epoch": 45} {"train_loss": -16.222412109375, "global_step": 3807, "epoch": 45} {"train_loss": -16.58393669128418, "global_step": 3808, "epoch": 45} {"train_loss": -16.814355850219727, "global_step": 3809, "epoch": 45} {"train_loss": -16.599929809570312, "global_step": 3810, "epoch": 45} {"train_loss": -16.488479614257812, "global_step": 3811, "epoch": 45} {"train_loss": -16.802927017211914, "global_step": 3812, "epoch": 45} {"train_loss": -16.723575592041016, "global_step": 3813, "epoch": 45} {"train_loss": -16.349424362182617, "global_step": 3814, "epoch": 45} {"train_loss": -16.56003189086914, "global_step": 3815, "epoch": 45} {"train_loss": -16.558752059936523, "global_step": 3816, "epoch": 45} {"train_loss": -16.56056308746338, "global_step": 3817, "epoch": 45, "val_loss": 6932148.5} {"train_loss": -16.659719467163086, "global_step": 3818, "epoch": 46} {"train_loss": -16.425748825073242, "global_step": 3819, "epoch": 46} {"train_loss": -16.488590240478516, "global_step": 3820, "epoch": 46} {"train_loss": -16.357240676879883, "global_step": 3821, "epoch": 46} {"train_loss": -16.4455623626709, "global_step": 3822, "epoch": 46} {"train_loss": -16.4117488861084, "global_step": 3823, "epoch": 46} {"train_loss": -16.59688377380371, "global_step": 3824, "epoch": 46} {"train_loss": -16.77159309387207, "global_step": 3825, "epoch": 46} {"train_loss": -16.128910064697266, "global_step": 3826, "epoch": 46} {"train_loss": -16.782873153686523, "global_step": 3827, "epoch": 46} {"train_loss": -16.448720932006836, "global_step": 3828, "epoch": 46} {"train_loss": -16.175031661987305, "global_step": 3829, "epoch": 46} {"train_loss": -16.539783477783203, "global_step": 3830, "epoch": 46} {"train_loss": -16.60970115661621, "global_step": 3831, "epoch": 46} {"train_loss": -16.270261764526367, "global_step": 3832, "epoch": 46} {"train_loss": -16.68135643005371, "global_step": 3833, "epoch": 46} {"train_loss": -16.412023544311523, "global_step": 3834, "epoch": 46} {"train_loss": -16.34871482849121, "global_step": 3835, "epoch": 46} {"train_loss": -16.211576461791992, "global_step": 3836, "epoch": 46} {"train_loss": -16.673120498657227, "global_step": 3837, "epoch": 46} {"train_loss": -16.363554000854492, "global_step": 3838, "epoch": 46} {"train_loss": -16.57853889465332, "global_step": 3839, "epoch": 46} {"train_loss": -16.282934188842773, "global_step": 3840, "epoch": 46} {"train_loss": -16.54012107849121, "global_step": 3841, "epoch": 46} {"train_loss": -16.551532745361328, "global_step": 3842, "epoch": 46} {"train_loss": -16.493120193481445, "global_step": 3843, "epoch": 46} {"train_loss": -16.70200538635254, "global_step": 3844, "epoch": 46} {"train_loss": -16.197324752807617, "global_step": 3845, "epoch": 46} {"train_loss": -16.396326065063477, "global_step": 3846, "epoch": 46} {"train_loss": -16.19891929626465, "global_step": 3847, "epoch": 46} {"train_loss": -16.596145629882812, "global_step": 3848, "epoch": 46} {"train_loss": -17.037548065185547, "global_step": 3849, "epoch": 46} {"train_loss": -16.5295467376709, "global_step": 3850, "epoch": 46} {"train_loss": -16.883052825927734, "global_step": 3851, "epoch": 46} {"train_loss": -16.736923217773438, "global_step": 3852, "epoch": 46} {"train_loss": -16.16562843322754, "global_step": 3853, "epoch": 46} {"train_loss": -16.758342742919922, "global_step": 3854, "epoch": 46} {"train_loss": -17.038360595703125, "global_step": 3855, "epoch": 46} {"train_loss": -16.939687728881836, "global_step": 3856, "epoch": 46} {"train_loss": -16.661849975585938, "global_step": 3857, "epoch": 46} {"train_loss": -16.90673828125, "global_step": 3858, "epoch": 46} {"train_loss": -16.429676055908203, "global_step": 3859, "epoch": 46} {"train_loss": -16.607513427734375, "global_step": 3860, "epoch": 46} {"train_loss": -16.808595657348633, "global_step": 3861, "epoch": 46} {"train_loss": -16.651456832885742, "global_step": 3862, "epoch": 46} {"train_loss": -16.802871704101562, "global_step": 3863, "epoch": 46} {"train_loss": -16.367151260375977, "global_step": 3864, "epoch": 46} {"train_loss": -16.781234741210938, "global_step": 3865, "epoch": 46} {"train_loss": -16.70153045654297, "global_step": 3866, "epoch": 46} {"train_loss": -16.468034744262695, "global_step": 3867, "epoch": 46} {"train_loss": -16.32695198059082, "global_step": 3868, "epoch": 46} {"train_loss": -16.615705490112305, "global_step": 3869, "epoch": 46} {"train_loss": -16.921634674072266, "global_step": 3870, "epoch": 46} {"train_loss": -16.813093185424805, "global_step": 3871, "epoch": 46} {"train_loss": -16.760412216186523, "global_step": 3872, "epoch": 46} {"train_loss": -16.5263729095459, "global_step": 3873, "epoch": 46} {"train_loss": -16.74629020690918, "global_step": 3874, "epoch": 46} {"train_loss": -16.628984451293945, "global_step": 3875, "epoch": 46} {"train_loss": -16.268692016601562, "global_step": 3876, "epoch": 46} {"train_loss": -16.652036666870117, "global_step": 3877, "epoch": 46} {"train_loss": -16.500577926635742, "global_step": 3878, "epoch": 46} {"train_loss": -16.51438331604004, "global_step": 3879, "epoch": 46} {"train_loss": -16.733192443847656, "global_step": 3880, "epoch": 46} {"train_loss": -16.136783599853516, "global_step": 3881, "epoch": 46} {"train_loss": -16.629486083984375, "global_step": 3882, "epoch": 46} {"train_loss": -16.866071701049805, "global_step": 3883, "epoch": 46} {"train_loss": -16.91707420349121, "global_step": 3884, "epoch": 46} {"train_loss": -16.904956817626953, "global_step": 3885, "epoch": 46} {"train_loss": -16.22197151184082, "global_step": 3886, "epoch": 46} {"train_loss": -16.323888778686523, "global_step": 3887, "epoch": 46} {"train_loss": -17.171573638916016, "global_step": 3888, "epoch": 46} {"train_loss": -16.574338912963867, "global_step": 3889, "epoch": 46} {"train_loss": -16.490758895874023, "global_step": 3890, "epoch": 46} {"train_loss": -16.101335525512695, "global_step": 3891, "epoch": 46} {"train_loss": -16.41124153137207, "global_step": 3892, "epoch": 46} {"train_loss": -16.888412475585938, "global_step": 3893, "epoch": 46} {"train_loss": -16.70804786682129, "global_step": 3894, "epoch": 46} {"train_loss": -16.76101303100586, "global_step": 3895, "epoch": 46} {"train_loss": -16.85272979736328, "global_step": 3896, "epoch": 46} {"train_loss": -16.47258758544922, "global_step": 3897, "epoch": 46} {"train_loss": -16.95725440979004, "global_step": 3898, "epoch": 46} {"train_loss": -16.502532958984375, "global_step": 3899, "epoch": 46} {"train_loss": -16.57378821775138, "global_step": 3900, "epoch": 46, "val_loss": 7079333.5} {"train_loss": -16.23038101196289, "global_step": 3901, "epoch": 47} {"train_loss": -16.24679183959961, "global_step": 3902, "epoch": 47} {"train_loss": -16.462726593017578, "global_step": 3903, "epoch": 47} {"train_loss": -16.785348892211914, "global_step": 3904, "epoch": 47} {"train_loss": -16.672040939331055, "global_step": 3905, "epoch": 47} {"train_loss": -16.782514572143555, "global_step": 3906, "epoch": 47} {"train_loss": -16.526288986206055, "global_step": 3907, "epoch": 47} {"train_loss": -16.726545333862305, "global_step": 3908, "epoch": 47} {"train_loss": -16.602508544921875, "global_step": 3909, "epoch": 47} {"train_loss": -16.739681243896484, "global_step": 3910, "epoch": 47} {"train_loss": -16.57898712158203, "global_step": 3911, "epoch": 47} {"train_loss": -16.888532638549805, "global_step": 3912, "epoch": 47} {"train_loss": -16.453214645385742, "global_step": 3913, "epoch": 47} {"train_loss": -16.720430374145508, "global_step": 3914, "epoch": 47} {"train_loss": -16.738525390625, "global_step": 3915, "epoch": 47} {"train_loss": -16.6806640625, "global_step": 3916, "epoch": 47} {"train_loss": -16.731294631958008, "global_step": 3917, "epoch": 47} {"train_loss": -16.47114372253418, "global_step": 3918, "epoch": 47} {"train_loss": -16.827960968017578, "global_step": 3919, "epoch": 47} {"train_loss": -16.41326904296875, "global_step": 3920, "epoch": 47} {"train_loss": -16.37249755859375, "global_step": 3921, "epoch": 47} {"train_loss": -16.705976486206055, "global_step": 3922, "epoch": 47} {"train_loss": -16.94219398498535, "global_step": 3923, "epoch": 47} {"train_loss": -16.464773178100586, "global_step": 3924, "epoch": 47} {"train_loss": -16.48578453063965, "global_step": 3925, "epoch": 47} {"train_loss": -16.333471298217773, "global_step": 3926, "epoch": 47} {"train_loss": -16.287694931030273, "global_step": 3927, "epoch": 47} {"train_loss": -16.838865280151367, "global_step": 3928, "epoch": 47} {"train_loss": -16.437101364135742, "global_step": 3929, "epoch": 47} {"train_loss": -16.65028953552246, "global_step": 3930, "epoch": 47} {"train_loss": -16.79275894165039, "global_step": 3931, "epoch": 47} {"train_loss": -16.77388572692871, "global_step": 3932, "epoch": 47} {"train_loss": -16.785253524780273, "global_step": 3933, "epoch": 47} {"train_loss": -16.705699920654297, "global_step": 3934, "epoch": 47} {"train_loss": -16.468677520751953, "global_step": 3935, "epoch": 47} {"train_loss": -16.882366180419922, "global_step": 3936, "epoch": 47} {"train_loss": -16.330463409423828, "global_step": 3937, "epoch": 47} {"train_loss": -16.443744659423828, "global_step": 3938, "epoch": 47} {"train_loss": -16.858991622924805, "global_step": 3939, "epoch": 47} {"train_loss": -16.87823486328125, "global_step": 3940, "epoch": 47} {"train_loss": -16.7916316986084, "global_step": 3941, "epoch": 47} {"train_loss": -17.1604061126709, "global_step": 3942, "epoch": 47} {"train_loss": -16.537540435791016, "global_step": 3943, "epoch": 47} {"train_loss": -16.84099006652832, "global_step": 3944, "epoch": 47} {"train_loss": -16.719247817993164, "global_step": 3945, "epoch": 47} {"train_loss": -16.573347091674805, "global_step": 3946, "epoch": 47} {"train_loss": -16.813737869262695, "global_step": 3947, "epoch": 47} {"train_loss": -16.60717010498047, "global_step": 3948, "epoch": 47} {"train_loss": -16.405841827392578, "global_step": 3949, "epoch": 47} {"train_loss": -16.929767608642578, "global_step": 3950, "epoch": 47} {"train_loss": -16.52064323425293, "global_step": 3951, "epoch": 47} {"train_loss": -16.381071090698242, "global_step": 3952, "epoch": 47} {"train_loss": -16.68439292907715, "global_step": 3953, "epoch": 47} {"train_loss": -16.456350326538086, "global_step": 3954, "epoch": 47} {"train_loss": -16.71442985534668, "global_step": 3955, "epoch": 47} {"train_loss": -16.67237091064453, "global_step": 3956, "epoch": 47} {"train_loss": -16.4044132232666, "global_step": 3957, "epoch": 47} {"train_loss": -16.762027740478516, "global_step": 3958, "epoch": 47} {"train_loss": -16.671981811523438, "global_step": 3959, "epoch": 47} {"train_loss": -16.567529678344727, "global_step": 3960, "epoch": 47} {"train_loss": -16.423219680786133, "global_step": 3961, "epoch": 47} {"train_loss": -16.895130157470703, "global_step": 3962, "epoch": 47} {"train_loss": -16.81399154663086, "global_step": 3963, "epoch": 47} {"train_loss": -16.313230514526367, "global_step": 3964, "epoch": 47} {"train_loss": -16.549802780151367, "global_step": 3965, "epoch": 47} {"train_loss": -16.175962448120117, "global_step": 3966, "epoch": 47} {"train_loss": -16.79505729675293, "global_step": 3967, "epoch": 47} {"train_loss": -16.76215171813965, "global_step": 3968, "epoch": 47} {"train_loss": -16.53554344177246, "global_step": 3969, "epoch": 47} {"train_loss": -16.405256271362305, "global_step": 3970, "epoch": 47} {"train_loss": -16.68985939025879, "global_step": 3971, "epoch": 47} {"train_loss": -16.56827163696289, "global_step": 3972, "epoch": 47} {"train_loss": -16.222578048706055, "global_step": 3973, "epoch": 47} {"train_loss": -16.614688873291016, "global_step": 3974, "epoch": 47} {"train_loss": -16.41705894470215, "global_step": 3975, "epoch": 47} {"train_loss": -16.478849411010742, "global_step": 3976, "epoch": 47} {"train_loss": -16.459880828857422, "global_step": 3977, "epoch": 47} {"train_loss": -16.433860778808594, "global_step": 3978, "epoch": 47} {"train_loss": -16.694782257080078, "global_step": 3979, "epoch": 47} {"train_loss": -16.914857864379883, "global_step": 3980, "epoch": 47} {"train_loss": -17.01283073425293, "global_step": 3981, "epoch": 47} {"train_loss": -16.574026107788086, "global_step": 3982, "epoch": 47} {"train_loss": -16.614789572106787, "global_step": 3983, "epoch": 47, "val_loss": 6997308.5} {"train_loss": -16.346397399902344, "global_step": 3984, "epoch": 48} {"train_loss": -16.904998779296875, "global_step": 3985, "epoch": 48} {"train_loss": -16.336423873901367, "global_step": 3986, "epoch": 48} {"train_loss": -16.581928253173828, "global_step": 3987, "epoch": 48} {"train_loss": -16.753528594970703, "global_step": 3988, "epoch": 48} {"train_loss": -16.703044891357422, "global_step": 3989, "epoch": 48} {"train_loss": -16.21708106994629, "global_step": 3990, "epoch": 48} {"train_loss": -16.211050033569336, "global_step": 3991, "epoch": 48} {"train_loss": -16.716711044311523, "global_step": 3992, "epoch": 48} {"train_loss": -16.339391708374023, "global_step": 3993, "epoch": 48} {"train_loss": -16.516122817993164, "global_step": 3994, "epoch": 48} {"train_loss": -16.790842056274414, "global_step": 3995, "epoch": 48} {"train_loss": -16.209260940551758, "global_step": 3996, "epoch": 48} {"train_loss": -16.90717887878418, "global_step": 3997, "epoch": 48} {"train_loss": -16.729228973388672, "global_step": 3998, "epoch": 48} {"train_loss": -16.770246505737305, "global_step": 3999, "epoch": 48} {"train_loss": -16.23233413696289, "global_step": 4000, "epoch": 48} {"train_loss": -16.83149528503418, "global_step": 4001, "epoch": 48} {"train_loss": -16.69452476501465, "global_step": 4002, "epoch": 48} {"train_loss": -16.74216651916504, "global_step": 4003, "epoch": 48} {"train_loss": -16.576696395874023, "global_step": 4004, "epoch": 48} {"train_loss": -16.82050132751465, "global_step": 4005, "epoch": 48} {"train_loss": -16.597267150878906, "global_step": 4006, "epoch": 48} {"train_loss": -16.757516860961914, "global_step": 4007, "epoch": 48} {"train_loss": -16.90592384338379, "global_step": 4008, "epoch": 48} {"train_loss": -16.51576042175293, "global_step": 4009, "epoch": 48} {"train_loss": -16.804594039916992, "global_step": 4010, "epoch": 48} {"train_loss": -17.19685173034668, "global_step": 4011, "epoch": 48} {"train_loss": -16.73067283630371, "global_step": 4012, "epoch": 48} {"train_loss": -16.728910446166992, "global_step": 4013, "epoch": 48} {"train_loss": -16.8632755279541, "global_step": 4014, "epoch": 48} {"train_loss": -16.562482833862305, "global_step": 4015, "epoch": 48} {"train_loss": -16.577238082885742, "global_step": 4016, "epoch": 48} {"train_loss": -16.738079071044922, "global_step": 4017, "epoch": 48} {"train_loss": -16.339330673217773, "global_step": 4018, "epoch": 48} {"train_loss": -16.620962142944336, "global_step": 4019, "epoch": 48} {"train_loss": -16.195430755615234, "global_step": 4020, "epoch": 48} {"train_loss": -16.59686851501465, "global_step": 4021, "epoch": 48} {"train_loss": -16.91167640686035, "global_step": 4022, "epoch": 48} {"train_loss": -16.75953483581543, "global_step": 4023, "epoch": 48} {"train_loss": -16.6328125, "global_step": 4024, "epoch": 48} {"train_loss": -16.701797485351562, "global_step": 4025, "epoch": 48} {"train_loss": -16.789859771728516, "global_step": 4026, "epoch": 48} {"train_loss": -16.502227783203125, "global_step": 4027, "epoch": 48} {"train_loss": -16.7025146484375, "global_step": 4028, "epoch": 48} {"train_loss": -16.667709350585938, "global_step": 4029, "epoch": 48} {"train_loss": -16.519813537597656, "global_step": 4030, "epoch": 48} {"train_loss": -17.08037757873535, "global_step": 4031, "epoch": 48} {"train_loss": -16.122005462646484, "global_step": 4032, "epoch": 48} {"train_loss": -16.835020065307617, "global_step": 4033, "epoch": 48} {"train_loss": -16.429096221923828, "global_step": 4034, "epoch": 48} {"train_loss": -17.026281356811523, "global_step": 4035, "epoch": 48} {"train_loss": -16.442115783691406, "global_step": 4036, "epoch": 48} {"train_loss": -16.575031280517578, "global_step": 4037, "epoch": 48} {"train_loss": -16.76320457458496, "global_step": 4038, "epoch": 48} {"train_loss": -16.569711685180664, "global_step": 4039, "epoch": 48} {"train_loss": -16.69989585876465, "global_step": 4040, "epoch": 48} {"train_loss": -16.657699584960938, "global_step": 4041, "epoch": 48} {"train_loss": -16.793060302734375, "global_step": 4042, "epoch": 48} {"train_loss": -16.376150131225586, "global_step": 4043, "epoch": 48} {"train_loss": -16.58039665222168, "global_step": 4044, "epoch": 48} {"train_loss": -16.6898250579834, "global_step": 4045, "epoch": 48} {"train_loss": -16.620437622070312, "global_step": 4046, "epoch": 48} {"train_loss": -16.779848098754883, "global_step": 4047, "epoch": 48} {"train_loss": -16.517568588256836, "global_step": 4048, "epoch": 48} {"train_loss": -16.763822555541992, "global_step": 4049, "epoch": 48} {"train_loss": -16.54300880432129, "global_step": 4050, "epoch": 48} {"train_loss": -16.19881820678711, "global_step": 4051, "epoch": 48} {"train_loss": -16.9967041015625, "global_step": 4052, "epoch": 48} {"train_loss": -16.4218692779541, "global_step": 4053, "epoch": 48} {"train_loss": -16.544391632080078, "global_step": 4054, "epoch": 48} {"train_loss": -16.782236099243164, "global_step": 4055, "epoch": 48} {"train_loss": -16.542280197143555, "global_step": 4056, "epoch": 48} {"train_loss": -16.672088623046875, "global_step": 4057, "epoch": 48} {"train_loss": -16.89230728149414, "global_step": 4058, "epoch": 48} {"train_loss": -16.788955688476562, "global_step": 4059, "epoch": 48} {"train_loss": -16.24942970275879, "global_step": 4060, "epoch": 48} {"train_loss": -16.52652359008789, "global_step": 4061, "epoch": 48} {"train_loss": -16.979795455932617, "global_step": 4062, "epoch": 48} {"train_loss": -16.108190536499023, "global_step": 4063, "epoch": 48} {"train_loss": -16.64565086364746, "global_step": 4064, "epoch": 48} {"train_loss": -16.491018295288086, "global_step": 4065, "epoch": 48} {"train_loss": -16.639274918889424, "global_step": 4066, "epoch": 48, "val_loss": 7057206.0} {"train_loss": -16.40622901916504, "global_step": 4067, "epoch": 49} {"train_loss": -16.521345138549805, "global_step": 4068, "epoch": 49} {"train_loss": -16.79581642150879, "global_step": 4069, "epoch": 49} {"train_loss": -16.365966796875, "global_step": 4070, "epoch": 49} {"train_loss": -16.387060165405273, "global_step": 4071, "epoch": 49} {"train_loss": -16.49519920349121, "global_step": 4072, "epoch": 49} {"train_loss": -16.55438804626465, "global_step": 4073, "epoch": 49} {"train_loss": -16.69338035583496, "global_step": 4074, "epoch": 49} {"train_loss": -16.948392868041992, "global_step": 4075, "epoch": 49} {"train_loss": -16.69190788269043, "global_step": 4076, "epoch": 49} {"train_loss": -16.442127227783203, "global_step": 4077, "epoch": 49} {"train_loss": -16.366397857666016, "global_step": 4078, "epoch": 49} {"train_loss": -16.817245483398438, "global_step": 4079, "epoch": 49} {"train_loss": -16.854549407958984, "global_step": 4080, "epoch": 49} {"train_loss": -16.481609344482422, "global_step": 4081, "epoch": 49} {"train_loss": -16.57453727722168, "global_step": 4082, "epoch": 49} {"train_loss": -16.57576560974121, "global_step": 4083, "epoch": 49} {"train_loss": -16.576162338256836, "global_step": 4084, "epoch": 49} {"train_loss": -16.76426124572754, "global_step": 4085, "epoch": 49} {"train_loss": -16.871929168701172, "global_step": 4086, "epoch": 49} {"train_loss": -16.63963508605957, "global_step": 4087, "epoch": 49} {"train_loss": -16.63008689880371, "global_step": 4088, "epoch": 49} {"train_loss": -16.82635498046875, "global_step": 4089, "epoch": 49} {"train_loss": -16.639951705932617, "global_step": 4090, "epoch": 49} {"train_loss": -16.78730583190918, "global_step": 4091, "epoch": 49} {"train_loss": -16.967573165893555, "global_step": 4092, "epoch": 49} {"train_loss": -16.68512535095215, "global_step": 4093, "epoch": 49} {"train_loss": -17.117328643798828, "global_step": 4094, "epoch": 49} {"train_loss": -16.937026977539062, "global_step": 4095, "epoch": 49} {"train_loss": -16.274152755737305, "global_step": 4096, "epoch": 49} {"train_loss": -16.677947998046875, "global_step": 4097, "epoch": 49} {"train_loss": -16.76962661743164, "global_step": 4098, "epoch": 49} {"train_loss": -16.77531623840332, "global_step": 4099, "epoch": 49} {"train_loss": -16.587621688842773, "global_step": 4100, "epoch": 49} {"train_loss": -16.71837615966797, "global_step": 4101, "epoch": 49} {"train_loss": -16.209501266479492, "global_step": 4102, "epoch": 49} {"train_loss": -16.5985050201416, "global_step": 4103, "epoch": 49} {"train_loss": -16.388076782226562, "global_step": 4104, "epoch": 49} {"train_loss": -16.935258865356445, "global_step": 4105, "epoch": 49} {"train_loss": -16.713537216186523, "global_step": 4106, "epoch": 49} {"train_loss": -16.60725975036621, "global_step": 4107, "epoch": 49} {"train_loss": -16.916885375976562, "global_step": 4108, "epoch": 49} {"train_loss": -16.447521209716797, "global_step": 4109, "epoch": 49} {"train_loss": -16.613378524780273, "global_step": 4110, "epoch": 49} {"train_loss": -16.293577194213867, "global_step": 4111, "epoch": 49} {"train_loss": -16.68602180480957, "global_step": 4112, "epoch": 49} {"train_loss": -16.483976364135742, "global_step": 4113, "epoch": 49} {"train_loss": -16.10943603515625, "global_step": 4114, "epoch": 49} {"train_loss": -16.78291130065918, "global_step": 4115, "epoch": 49} {"train_loss": -16.833784103393555, "global_step": 4116, "epoch": 49} {"train_loss": -16.387405395507812, "global_step": 4117, "epoch": 49} {"train_loss": -16.783706665039062, "global_step": 4118, "epoch": 49} {"train_loss": -16.676374435424805, "global_step": 4119, "epoch": 49} {"train_loss": -16.87087059020996, "global_step": 4120, "epoch": 49} {"train_loss": -16.972333908081055, "global_step": 4121, "epoch": 49} {"train_loss": -16.77857780456543, "global_step": 4122, "epoch": 49} {"train_loss": -17.00765037536621, "global_step": 4123, "epoch": 49} {"train_loss": -16.421144485473633, "global_step": 4124, "epoch": 49} {"train_loss": -16.719823837280273, "global_step": 4125, "epoch": 49} {"train_loss": -16.99748420715332, "global_step": 4126, "epoch": 49} {"train_loss": -16.505407333374023, "global_step": 4127, "epoch": 49} {"train_loss": -16.686094284057617, "global_step": 4128, "epoch": 49} {"train_loss": -17.08363151550293, "global_step": 4129, "epoch": 49} {"train_loss": -17.06509017944336, "global_step": 4130, "epoch": 49} {"train_loss": -16.046003341674805, "global_step": 4131, "epoch": 49} {"train_loss": -16.823911666870117, "global_step": 4132, "epoch": 49} {"train_loss": -16.50533103942871, "global_step": 4133, "epoch": 49} {"train_loss": -16.472482681274414, "global_step": 4134, "epoch": 49} {"train_loss": -16.72610855102539, "global_step": 4135, "epoch": 49} {"train_loss": -16.52008628845215, "global_step": 4136, "epoch": 49} {"train_loss": -16.55997657775879, "global_step": 4137, "epoch": 49} {"train_loss": -16.945402145385742, "global_step": 4138, "epoch": 49} {"train_loss": -16.637226104736328, "global_step": 4139, "epoch": 49} {"train_loss": -17.0013370513916, "global_step": 4140, "epoch": 49} {"train_loss": -17.056625366210938, "global_step": 4141, "epoch": 49} {"train_loss": -16.400251388549805, "global_step": 4142, "epoch": 49} {"train_loss": -17.047290802001953, "global_step": 4143, "epoch": 49} {"train_loss": -16.35776710510254, "global_step": 4144, "epoch": 49} {"train_loss": -16.419147491455078, "global_step": 4145, "epoch": 49} {"train_loss": -16.755645751953125, "global_step": 4146, "epoch": 49} {"train_loss": -16.30727195739746, "global_step": 4147, "epoch": 49} {"train_loss": -16.797805786132812, "global_step": 4148, "epoch": 49} {"train_loss": -16.64574204870017, "global_step": 4149, "epoch": 49, "val_loss": 7087303.5} {"train_loss": -16.336572647094727, "global_step": 4150, "epoch": 50} {"train_loss": -16.66197967529297, "global_step": 4151, "epoch": 50} {"train_loss": -16.66002655029297, "global_step": 4152, "epoch": 50} {"train_loss": -16.816076278686523, "global_step": 4153, "epoch": 50} {"train_loss": -16.596595764160156, "global_step": 4154, "epoch": 50} {"train_loss": -16.66595458984375, "global_step": 4155, "epoch": 50} {"train_loss": -16.62738037109375, "global_step": 4156, "epoch": 50} {"train_loss": -16.30238914489746, "global_step": 4157, "epoch": 50} {"train_loss": -16.431867599487305, "global_step": 4158, "epoch": 50} {"train_loss": -17.1517391204834, "global_step": 4159, "epoch": 50} {"train_loss": -16.983091354370117, "global_step": 4160, "epoch": 50} {"train_loss": -16.100210189819336, "global_step": 4161, "epoch": 50} {"train_loss": -16.502817153930664, "global_step": 4162, "epoch": 50} {"train_loss": -16.659334182739258, "global_step": 4163, "epoch": 50} {"train_loss": -16.96451759338379, "global_step": 4164, "epoch": 50} {"train_loss": -16.601119995117188, "global_step": 4165, "epoch": 50} {"train_loss": -16.665435791015625, "global_step": 4166, "epoch": 50} {"train_loss": -16.851160049438477, "global_step": 4167, "epoch": 50} {"train_loss": -16.54237937927246, "global_step": 4168, "epoch": 50} {"train_loss": -16.99762535095215, "global_step": 4169, "epoch": 50} {"train_loss": -16.26262855529785, "global_step": 4170, "epoch": 50} {"train_loss": -16.496610641479492, "global_step": 4171, "epoch": 50} {"train_loss": -16.898534774780273, "global_step": 4172, "epoch": 50} {"train_loss": -16.40448570251465, "global_step": 4173, "epoch": 50} {"train_loss": -16.999267578125, "global_step": 4174, "epoch": 50} {"train_loss": -16.58881950378418, "global_step": 4175, "epoch": 50} {"train_loss": -16.771207809448242, "global_step": 4176, "epoch": 50} {"train_loss": -16.546157836914062, "global_step": 4177, "epoch": 50} {"train_loss": -16.801265716552734, "global_step": 4178, "epoch": 50} {"train_loss": -16.490999221801758, "global_step": 4179, "epoch": 50} {"train_loss": -16.90410804748535, "global_step": 4180, "epoch": 50} {"train_loss": -16.383407592773438, "global_step": 4181, "epoch": 50} {"train_loss": -16.778894424438477, "global_step": 4182, "epoch": 50} {"train_loss": -16.654117584228516, "global_step": 4183, "epoch": 50} {"train_loss": -16.90451431274414, "global_step": 4184, "epoch": 50} {"train_loss": -16.685199737548828, "global_step": 4185, "epoch": 50} {"train_loss": -16.605777740478516, "global_step": 4186, "epoch": 50} {"train_loss": -16.84905242919922, "global_step": 4187, "epoch": 50} {"train_loss": -16.325475692749023, "global_step": 4188, "epoch": 50} {"train_loss": -16.46643829345703, "global_step": 4189, "epoch": 50} {"train_loss": -16.394155502319336, "global_step": 4190, "epoch": 50} {"train_loss": -16.630552291870117, "global_step": 4191, "epoch": 50} {"train_loss": -16.401063919067383, "global_step": 4192, "epoch": 50} {"train_loss": -16.308218002319336, "global_step": 4193, "epoch": 50} {"train_loss": -16.847736358642578, "global_step": 4194, "epoch": 50} {"train_loss": -16.86994171142578, "global_step": 4195, "epoch": 50} {"train_loss": -16.82781410217285, "global_step": 4196, "epoch": 50} {"train_loss": -16.877334594726562, "global_step": 4197, "epoch": 50} {"train_loss": -16.777257919311523, "global_step": 4198, "epoch": 50} {"train_loss": -16.910907745361328, "global_step": 4199, "epoch": 50} {"train_loss": -16.92098045349121, "global_step": 4200, "epoch": 50} {"train_loss": -16.582860946655273, "global_step": 4201, "epoch": 50} {"train_loss": -16.608440399169922, "global_step": 4202, "epoch": 50} {"train_loss": -16.48935890197754, "global_step": 4203, "epoch": 50} {"train_loss": -16.739187240600586, "global_step": 4204, "epoch": 50} {"train_loss": -16.831579208374023, "global_step": 4205, "epoch": 50} {"train_loss": -17.042444229125977, "global_step": 4206, "epoch": 50} {"train_loss": -16.680452346801758, "global_step": 4207, "epoch": 50} {"train_loss": -16.65852165222168, "global_step": 4208, "epoch": 50} {"train_loss": -17.087844848632812, "global_step": 4209, "epoch": 50} {"train_loss": -17.08936882019043, "global_step": 4210, "epoch": 50} {"train_loss": -16.83186149597168, "global_step": 4211, "epoch": 50} {"train_loss": -16.722475051879883, "global_step": 4212, "epoch": 50} {"train_loss": -16.859037399291992, "global_step": 4213, "epoch": 50} {"train_loss": -16.558977127075195, "global_step": 4214, "epoch": 50} {"train_loss": -16.707387924194336, "global_step": 4215, "epoch": 50} {"train_loss": -16.60218620300293, "global_step": 4216, "epoch": 50} {"train_loss": -16.799158096313477, "global_step": 4217, "epoch": 50} {"train_loss": -16.418386459350586, "global_step": 4218, "epoch": 50} {"train_loss": -17.21487808227539, "global_step": 4219, "epoch": 50} {"train_loss": -16.636388778686523, "global_step": 4220, "epoch": 50} {"train_loss": -16.603384017944336, "global_step": 4221, "epoch": 50} {"train_loss": -16.49248695373535, "global_step": 4222, "epoch": 50} {"train_loss": -16.324949264526367, "global_step": 4223, "epoch": 50} {"train_loss": -16.794450759887695, "global_step": 4224, "epoch": 50} {"train_loss": -16.807510375976562, "global_step": 4225, "epoch": 50} {"train_loss": -16.81037712097168, "global_step": 4226, "epoch": 50} {"train_loss": -16.69610595703125, "global_step": 4227, "epoch": 50} {"train_loss": -16.751811981201172, "global_step": 4228, "epoch": 50} {"train_loss": -16.912343978881836, "global_step": 4229, "epoch": 50} {"train_loss": -16.4514217376709, "global_step": 4230, "epoch": 50} {"train_loss": -16.721410751342773, "global_step": 4231, "epoch": 50} {"train_loss": -16.68774000420628, "global_step": 4232, "epoch": 50, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 0.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.0, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.0, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.0, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 0.0, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.0, "train/mean_score": 0.0, "test/mean_score": 0.0, "val_loss": 6941661.0} {"train_loss": -16.687515258789062, "global_step": 4233, "epoch": 51} {"train_loss": -16.36140251159668, "global_step": 4234, "epoch": 51} {"train_loss": -16.51016616821289, "global_step": 4235, "epoch": 51} {"train_loss": -16.399002075195312, "global_step": 4236, "epoch": 51} {"train_loss": -16.499135971069336, "global_step": 4237, "epoch": 51} {"train_loss": -16.55417823791504, "global_step": 4238, "epoch": 51} {"train_loss": -16.83237648010254, "global_step": 4239, "epoch": 51} {"train_loss": -16.941247940063477, "global_step": 4240, "epoch": 51} {"train_loss": -16.774824142456055, "global_step": 4241, "epoch": 51} {"train_loss": -16.813274383544922, "global_step": 4242, "epoch": 51} {"train_loss": -17.106666564941406, "global_step": 4243, "epoch": 51} {"train_loss": -16.729270935058594, "global_step": 4244, "epoch": 51} {"train_loss": -16.575965881347656, "global_step": 4245, "epoch": 51} {"train_loss": -16.39030647277832, "global_step": 4246, "epoch": 51} {"train_loss": -16.67158317565918, "global_step": 4247, "epoch": 51} {"train_loss": -16.757299423217773, "global_step": 4248, "epoch": 51} {"train_loss": -16.872787475585938, "global_step": 4249, "epoch": 51} {"train_loss": -16.69483757019043, "global_step": 4250, "epoch": 51} {"train_loss": -16.734874725341797, "global_step": 4251, "epoch": 51} {"train_loss": -16.607553482055664, "global_step": 4252, "epoch": 51} {"train_loss": -16.827686309814453, "global_step": 4253, "epoch": 51} {"train_loss": -16.729829788208008, "global_step": 4254, "epoch": 51} {"train_loss": -16.512380599975586, "global_step": 4255, "epoch": 51} {"train_loss": -16.76141357421875, "global_step": 4256, "epoch": 51} {"train_loss": -16.64849853515625, "global_step": 4257, "epoch": 51} {"train_loss": -16.42510986328125, "global_step": 4258, "epoch": 51} {"train_loss": -17.016616821289062, "global_step": 4259, "epoch": 51} {"train_loss": -16.850317001342773, "global_step": 4260, "epoch": 51} {"train_loss": -16.868330001831055, "global_step": 4261, "epoch": 51} {"train_loss": -16.74981689453125, "global_step": 4262, "epoch": 51} {"train_loss": -17.018451690673828, "global_step": 4263, "epoch": 51} {"train_loss": -16.6503963470459, "global_step": 4264, "epoch": 51} {"train_loss": -16.669143676757812, "global_step": 4265, "epoch": 51} {"train_loss": -16.653654098510742, "global_step": 4266, "epoch": 51} {"train_loss": -16.510303497314453, "global_step": 4267, "epoch": 51} {"train_loss": -16.826278686523438, "global_step": 4268, "epoch": 51} {"train_loss": -16.64200782775879, "global_step": 4269, "epoch": 51} {"train_loss": -16.815214157104492, "global_step": 4270, "epoch": 51} {"train_loss": -16.701751708984375, "global_step": 4271, "epoch": 51} {"train_loss": -17.02146339416504, "global_step": 4272, "epoch": 51} {"train_loss": -16.647764205932617, "global_step": 4273, "epoch": 51} {"train_loss": -16.489023208618164, "global_step": 4274, "epoch": 51} {"train_loss": -16.511539459228516, "global_step": 4275, "epoch": 51} {"train_loss": -16.77440643310547, "global_step": 4276, "epoch": 51} {"train_loss": -16.55059051513672, "global_step": 4277, "epoch": 51} {"train_loss": -16.807676315307617, "global_step": 4278, "epoch": 51} {"train_loss": -16.75356101989746, "global_step": 4279, "epoch": 51} {"train_loss": -16.57990074157715, "global_step": 4280, "epoch": 51} {"train_loss": -16.756803512573242, "global_step": 4281, "epoch": 51} {"train_loss": -16.910999298095703, "global_step": 4282, "epoch": 51} {"train_loss": -16.73102569580078, "global_step": 4283, "epoch": 51} {"train_loss": -16.310020446777344, "global_step": 4284, "epoch": 51} {"train_loss": -16.71150779724121, "global_step": 4285, "epoch": 51} {"train_loss": -16.008438110351562, "global_step": 4286, "epoch": 51} {"train_loss": -16.96157455444336, "global_step": 4287, "epoch": 51} {"train_loss": -16.402267456054688, "global_step": 4288, "epoch": 51} {"train_loss": -16.288244247436523, "global_step": 4289, "epoch": 51} {"train_loss": -16.553945541381836, "global_step": 4290, "epoch": 51} {"train_loss": -16.404376983642578, "global_step": 4291, "epoch": 51} {"train_loss": -16.837329864501953, "global_step": 4292, "epoch": 51} {"train_loss": -16.84978485107422, "global_step": 4293, "epoch": 51} {"train_loss": -17.008955001831055, "global_step": 4294, "epoch": 51} {"train_loss": -17.08359718322754, "global_step": 4295, "epoch": 51} {"train_loss": -17.15894889831543, "global_step": 4296, "epoch": 51} {"train_loss": -16.61395835876465, "global_step": 4297, "epoch": 51} {"train_loss": -16.604528427124023, "global_step": 4298, "epoch": 51} {"train_loss": -16.992252349853516, "global_step": 4299, "epoch": 51} {"train_loss": -16.701459884643555, "global_step": 4300, "epoch": 51} {"train_loss": -16.720035552978516, "global_step": 4301, "epoch": 51} {"train_loss": -16.561702728271484, "global_step": 4302, "epoch": 51} {"train_loss": -16.888029098510742, "global_step": 4303, "epoch": 51} {"train_loss": -16.73377799987793, "global_step": 4304, "epoch": 51} {"train_loss": -16.225130081176758, "global_step": 4305, "epoch": 51} {"train_loss": -16.557144165039062, "global_step": 4306, "epoch": 51} {"train_loss": -16.88202476501465, "global_step": 4307, "epoch": 51} {"train_loss": -16.834583282470703, "global_step": 4308, "epoch": 51} {"train_loss": -16.474538803100586, "global_step": 4309, "epoch": 51} {"train_loss": -16.94123649597168, "global_step": 4310, "epoch": 51} {"train_loss": -16.673763275146484, "global_step": 4311, "epoch": 51} {"train_loss": -16.711416244506836, "global_step": 4312, "epoch": 51} {"train_loss": -16.8256778717041, "global_step": 4313, "epoch": 51} {"train_loss": -16.7939510345459, "global_step": 4314, "epoch": 51} {"train_loss": -16.68866653901985, "global_step": 4315, "epoch": 51, "val_loss": 6955668.0} {"train_loss": -16.48682975769043, "global_step": 4316, "epoch": 52} {"train_loss": -16.73048973083496, "global_step": 4317, "epoch": 52} {"train_loss": -16.532384872436523, "global_step": 4318, "epoch": 52} {"train_loss": -16.90321159362793, "global_step": 4319, "epoch": 52} {"train_loss": -16.81560707092285, "global_step": 4320, "epoch": 52} {"train_loss": -16.598987579345703, "global_step": 4321, "epoch": 52} {"train_loss": -17.09541130065918, "global_step": 4322, "epoch": 52} {"train_loss": -17.021686553955078, "global_step": 4323, "epoch": 52} {"train_loss": -16.77389907836914, "global_step": 4324, "epoch": 52} {"train_loss": -16.15520668029785, "global_step": 4325, "epoch": 52} {"train_loss": -16.359638214111328, "global_step": 4326, "epoch": 52} {"train_loss": -16.636722564697266, "global_step": 4327, "epoch": 52} {"train_loss": -16.54139518737793, "global_step": 4328, "epoch": 52} {"train_loss": -16.557538986206055, "global_step": 4329, "epoch": 52} {"train_loss": -16.502084732055664, "global_step": 4330, "epoch": 52} {"train_loss": -16.845945358276367, "global_step": 4331, "epoch": 52} {"train_loss": -16.865625381469727, "global_step": 4332, "epoch": 52} {"train_loss": -16.29344367980957, "global_step": 4333, "epoch": 52} {"train_loss": -16.649227142333984, "global_step": 4334, "epoch": 52} {"train_loss": -16.394887924194336, "global_step": 4335, "epoch": 52} {"train_loss": -16.862167358398438, "global_step": 4336, "epoch": 52} {"train_loss": -16.73727798461914, "global_step": 4337, "epoch": 52} {"train_loss": -17.016422271728516, "global_step": 4338, "epoch": 52} {"train_loss": -16.780920028686523, "global_step": 4339, "epoch": 52} {"train_loss": -16.755041122436523, "global_step": 4340, "epoch": 52} {"train_loss": -16.75242042541504, "global_step": 4341, "epoch": 52} {"train_loss": -16.89641761779785, "global_step": 4342, "epoch": 52} {"train_loss": -17.07354736328125, "global_step": 4343, "epoch": 52} {"train_loss": -16.549930572509766, "global_step": 4344, "epoch": 52} {"train_loss": -16.341175079345703, "global_step": 4345, "epoch": 52} {"train_loss": -17.172895431518555, "global_step": 4346, "epoch": 52} {"train_loss": -16.94288444519043, "global_step": 4347, "epoch": 52} {"train_loss": -16.732534408569336, "global_step": 4348, "epoch": 52} {"train_loss": -16.794843673706055, "global_step": 4349, "epoch": 52} {"train_loss": -16.862218856811523, "global_step": 4350, "epoch": 52} {"train_loss": -16.502227783203125, "global_step": 4351, "epoch": 52} {"train_loss": -16.81660270690918, "global_step": 4352, "epoch": 52} {"train_loss": -16.592498779296875, "global_step": 4353, "epoch": 52} {"train_loss": -16.628576278686523, "global_step": 4354, "epoch": 52} {"train_loss": -16.55726432800293, "global_step": 4355, "epoch": 52} {"train_loss": -16.748308181762695, "global_step": 4356, "epoch": 52} {"train_loss": -16.20941162109375, "global_step": 4357, "epoch": 52} {"train_loss": -16.875934600830078, "global_step": 4358, "epoch": 52} {"train_loss": -17.017658233642578, "global_step": 4359, "epoch": 52} {"train_loss": -16.75929069519043, "global_step": 4360, "epoch": 52} {"train_loss": -16.76904296875, "global_step": 4361, "epoch": 52} {"train_loss": -16.87593650817871, "global_step": 4362, "epoch": 52} {"train_loss": -16.873727798461914, "global_step": 4363, "epoch": 52} {"train_loss": -16.77756690979004, "global_step": 4364, "epoch": 52} {"train_loss": -16.737110137939453, "global_step": 4365, "epoch": 52} {"train_loss": -16.41090202331543, "global_step": 4366, "epoch": 52} {"train_loss": -16.75322914123535, "global_step": 4367, "epoch": 52} {"train_loss": -16.58901023864746, "global_step": 4368, "epoch": 52} {"train_loss": -16.605426788330078, "global_step": 4369, "epoch": 52} {"train_loss": -16.712615966796875, "global_step": 4370, "epoch": 52} {"train_loss": -17.061948776245117, "global_step": 4371, "epoch": 52} {"train_loss": -16.147104263305664, "global_step": 4372, "epoch": 52} {"train_loss": -16.790042877197266, "global_step": 4373, "epoch": 52} {"train_loss": -16.839651107788086, "global_step": 4374, "epoch": 52} {"train_loss": -17.291168212890625, "global_step": 4375, "epoch": 52} {"train_loss": -16.779470443725586, "global_step": 4376, "epoch": 52} {"train_loss": -16.265506744384766, "global_step": 4377, "epoch": 52} {"train_loss": -16.848676681518555, "global_step": 4378, "epoch": 52} {"train_loss": -16.63330841064453, "global_step": 4379, "epoch": 52} {"train_loss": -16.479215621948242, "global_step": 4380, "epoch": 52} {"train_loss": -16.59310531616211, "global_step": 4381, "epoch": 52} {"train_loss": -16.98367691040039, "global_step": 4382, "epoch": 52} {"train_loss": -16.620603561401367, "global_step": 4383, "epoch": 52} {"train_loss": -16.86201286315918, "global_step": 4384, "epoch": 52} {"train_loss": -17.07009506225586, "global_step": 4385, "epoch": 52} {"train_loss": -16.893857955932617, "global_step": 4386, "epoch": 52} {"train_loss": -16.79781150817871, "global_step": 4387, "epoch": 52} {"train_loss": -16.586524963378906, "global_step": 4388, "epoch": 52} {"train_loss": -16.385034561157227, "global_step": 4389, "epoch": 52} {"train_loss": -16.81093406677246, "global_step": 4390, "epoch": 52} {"train_loss": -16.39790916442871, "global_step": 4391, "epoch": 52} {"train_loss": -16.990354537963867, "global_step": 4392, "epoch": 52} {"train_loss": -16.690860748291016, "global_step": 4393, "epoch": 52} {"train_loss": -16.884902954101562, "global_step": 4394, "epoch": 52} {"train_loss": -16.687829971313477, "global_step": 4395, "epoch": 52} {"train_loss": -16.962833404541016, "global_step": 4396, "epoch": 52} {"train_loss": -16.728891372680664, "global_step": 4397, "epoch": 52} {"train_loss": -16.708330039518426, "global_step": 4398, "epoch": 52, "val_loss": 6778327.5} {"train_loss": -16.623859405517578, "global_step": 4399, "epoch": 53} {"train_loss": -16.45783233642578, "global_step": 4400, "epoch": 53} {"train_loss": -16.603525161743164, "global_step": 4401, "epoch": 53} {"train_loss": -16.94213104248047, "global_step": 4402, "epoch": 53} {"train_loss": -16.330060958862305, "global_step": 4403, "epoch": 53} {"train_loss": -16.37056541442871, "global_step": 4404, "epoch": 53} {"train_loss": -16.664854049682617, "global_step": 4405, "epoch": 53} {"train_loss": -16.605167388916016, "global_step": 4406, "epoch": 53} {"train_loss": -16.60761260986328, "global_step": 4407, "epoch": 53} {"train_loss": -16.713682174682617, "global_step": 4408, "epoch": 53} {"train_loss": -16.37422752380371, "global_step": 4409, "epoch": 53} {"train_loss": -16.58687973022461, "global_step": 4410, "epoch": 53} {"train_loss": -16.540502548217773, "global_step": 4411, "epoch": 53} {"train_loss": -16.528823852539062, "global_step": 4412, "epoch": 53} {"train_loss": -16.460599899291992, "global_step": 4413, "epoch": 53} {"train_loss": -16.92584991455078, "global_step": 4414, "epoch": 53} {"train_loss": -16.64139747619629, "global_step": 4415, "epoch": 53} {"train_loss": -16.6718692779541, "global_step": 4416, "epoch": 53} {"train_loss": -16.344144821166992, "global_step": 4417, "epoch": 53} {"train_loss": -16.752578735351562, "global_step": 4418, "epoch": 53} {"train_loss": -16.559457778930664, "global_step": 4419, "epoch": 53} {"train_loss": -16.89447021484375, "global_step": 4420, "epoch": 53} {"train_loss": -16.885896682739258, "global_step": 4421, "epoch": 53} {"train_loss": -16.89664649963379, "global_step": 4422, "epoch": 53} {"train_loss": -16.894994735717773, "global_step": 4423, "epoch": 53} {"train_loss": -16.65591812133789, "global_step": 4424, "epoch": 53} {"train_loss": -17.103748321533203, "global_step": 4425, "epoch": 53} {"train_loss": -17.033843994140625, "global_step": 4426, "epoch": 53} {"train_loss": -16.45173454284668, "global_step": 4427, "epoch": 53} {"train_loss": -16.753376007080078, "global_step": 4428, "epoch": 53} {"train_loss": -16.621641159057617, "global_step": 4429, "epoch": 53} {"train_loss": -16.738595962524414, "global_step": 4430, "epoch": 53} {"train_loss": -16.784414291381836, "global_step": 4431, "epoch": 53} {"train_loss": -16.623554229736328, "global_step": 4432, "epoch": 53} {"train_loss": -16.7722225189209, "global_step": 4433, "epoch": 53} {"train_loss": -16.788389205932617, "global_step": 4434, "epoch": 53} {"train_loss": -16.34812355041504, "global_step": 4435, "epoch": 53} {"train_loss": -17.009557723999023, "global_step": 4436, "epoch": 53} {"train_loss": -16.704349517822266, "global_step": 4437, "epoch": 53} {"train_loss": -17.172088623046875, "global_step": 4438, "epoch": 53} {"train_loss": -16.752601623535156, "global_step": 4439, "epoch": 53} {"train_loss": -16.329662322998047, "global_step": 4440, "epoch": 53} {"train_loss": -16.92192268371582, "global_step": 4441, "epoch": 53} {"train_loss": -16.922164916992188, "global_step": 4442, "epoch": 53} {"train_loss": -16.620466232299805, "global_step": 4443, "epoch": 53} {"train_loss": -16.84381675720215, "global_step": 4444, "epoch": 53} {"train_loss": -16.827091217041016, "global_step": 4445, "epoch": 53} {"train_loss": -16.703269958496094, "global_step": 4446, "epoch": 53} {"train_loss": -16.72149085998535, "global_step": 4447, "epoch": 53} {"train_loss": -16.48855972290039, "global_step": 4448, "epoch": 53} {"train_loss": -16.712650299072266, "global_step": 4449, "epoch": 53} {"train_loss": -16.763364791870117, "global_step": 4450, "epoch": 53} {"train_loss": -16.557348251342773, "global_step": 4451, "epoch": 53} {"train_loss": -16.5821475982666, "global_step": 4452, "epoch": 53} {"train_loss": -16.288875579833984, "global_step": 4453, "epoch": 53} {"train_loss": -16.638879776000977, "global_step": 4454, "epoch": 53} {"train_loss": -16.926067352294922, "global_step": 4455, "epoch": 53} {"train_loss": -16.906911849975586, "global_step": 4456, "epoch": 53} {"train_loss": -17.050464630126953, "global_step": 4457, "epoch": 53} {"train_loss": -16.918310165405273, "global_step": 4458, "epoch": 53} {"train_loss": -17.004581451416016, "global_step": 4459, "epoch": 53} {"train_loss": -16.65015983581543, "global_step": 4460, "epoch": 53} {"train_loss": -16.83270835876465, "global_step": 4461, "epoch": 53} {"train_loss": -16.610471725463867, "global_step": 4462, "epoch": 53} {"train_loss": -16.543994903564453, "global_step": 4463, "epoch": 53} {"train_loss": -16.672422409057617, "global_step": 4464, "epoch": 53} {"train_loss": -17.270580291748047, "global_step": 4465, "epoch": 53} {"train_loss": -16.728927612304688, "global_step": 4466, "epoch": 53} {"train_loss": -16.99223518371582, "global_step": 4467, "epoch": 53} {"train_loss": -16.555524826049805, "global_step": 4468, "epoch": 53} {"train_loss": -16.705810546875, "global_step": 4469, "epoch": 53} {"train_loss": -17.042043685913086, "global_step": 4470, "epoch": 53} {"train_loss": -16.81861114501953, "global_step": 4471, "epoch": 53} {"train_loss": -16.75169563293457, "global_step": 4472, "epoch": 53} {"train_loss": -16.5932674407959, "global_step": 4473, "epoch": 53} {"train_loss": -16.859416961669922, "global_step": 4474, "epoch": 53} {"train_loss": -17.098962783813477, "global_step": 4475, "epoch": 53} {"train_loss": -16.850645065307617, "global_step": 4476, "epoch": 53} {"train_loss": -16.76984214782715, "global_step": 4477, "epoch": 53} {"train_loss": -16.717147827148438, "global_step": 4478, "epoch": 53} {"train_loss": -16.648008346557617, "global_step": 4479, "epoch": 53} {"train_loss": -17.128570556640625, "global_step": 4480, "epoch": 53} {"train_loss": -16.730908796011683, "global_step": 4481, "epoch": 53, "val_loss": 6884328.0} {"train_loss": -16.463804244995117, "global_step": 4482, "epoch": 54} {"train_loss": -16.486221313476562, "global_step": 4483, "epoch": 54} {"train_loss": -16.926761627197266, "global_step": 4484, "epoch": 54} {"train_loss": -16.553903579711914, "global_step": 4485, "epoch": 54} {"train_loss": -16.684417724609375, "global_step": 4486, "epoch": 54} {"train_loss": -16.449018478393555, "global_step": 4487, "epoch": 54} {"train_loss": -16.38117790222168, "global_step": 4488, "epoch": 54} {"train_loss": -16.854459762573242, "global_step": 4489, "epoch": 54} {"train_loss": -17.04183006286621, "global_step": 4490, "epoch": 54} {"train_loss": -16.642921447753906, "global_step": 4491, "epoch": 54} {"train_loss": -16.709178924560547, "global_step": 4492, "epoch": 54} {"train_loss": -16.587677001953125, "global_step": 4493, "epoch": 54} {"train_loss": -16.714492797851562, "global_step": 4494, "epoch": 54} {"train_loss": -16.80427360534668, "global_step": 4495, "epoch": 54} {"train_loss": -16.578535079956055, "global_step": 4496, "epoch": 54} {"train_loss": -16.872861862182617, "global_step": 4497, "epoch": 54} {"train_loss": -16.57935905456543, "global_step": 4498, "epoch": 54} {"train_loss": -16.78815269470215, "global_step": 4499, "epoch": 54} {"train_loss": -16.507705688476562, "global_step": 4500, "epoch": 54} {"train_loss": -16.408761978149414, "global_step": 4501, "epoch": 54} {"train_loss": -16.65998649597168, "global_step": 4502, "epoch": 54} {"train_loss": -16.800928115844727, "global_step": 4503, "epoch": 54} {"train_loss": -16.507474899291992, "global_step": 4504, "epoch": 54} {"train_loss": -16.908857345581055, "global_step": 4505, "epoch": 54} {"train_loss": -16.75149917602539, "global_step": 4506, "epoch": 54} {"train_loss": -17.16554069519043, "global_step": 4507, "epoch": 54} {"train_loss": -16.587533950805664, "global_step": 4508, "epoch": 54} {"train_loss": -16.839189529418945, "global_step": 4509, "epoch": 54} {"train_loss": -16.9035587310791, "global_step": 4510, "epoch": 54} {"train_loss": -17.090795516967773, "global_step": 4511, "epoch": 54} {"train_loss": -16.535398483276367, "global_step": 4512, "epoch": 54} {"train_loss": -16.49534034729004, "global_step": 4513, "epoch": 54} {"train_loss": -16.44782829284668, "global_step": 4514, "epoch": 54} {"train_loss": -16.618213653564453, "global_step": 4515, "epoch": 54} {"train_loss": -16.95929527282715, "global_step": 4516, "epoch": 54} {"train_loss": -16.878664016723633, "global_step": 4517, "epoch": 54} {"train_loss": -16.934539794921875, "global_step": 4518, "epoch": 54} {"train_loss": -16.679738998413086, "global_step": 4519, "epoch": 54} {"train_loss": -16.959585189819336, "global_step": 4520, "epoch": 54} {"train_loss": -16.9339542388916, "global_step": 4521, "epoch": 54} {"train_loss": -16.499799728393555, "global_step": 4522, "epoch": 54} {"train_loss": -16.92084312438965, "global_step": 4523, "epoch": 54} {"train_loss": -16.7509765625, "global_step": 4524, "epoch": 54} {"train_loss": -16.614980697631836, "global_step": 4525, "epoch": 54} {"train_loss": -16.82200813293457, "global_step": 4526, "epoch": 54} {"train_loss": -16.855798721313477, "global_step": 4527, "epoch": 54} {"train_loss": -16.671039581298828, "global_step": 4528, "epoch": 54} {"train_loss": -16.64040184020996, "global_step": 4529, "epoch": 54} {"train_loss": -16.413999557495117, "global_step": 4530, "epoch": 54} {"train_loss": -16.6447811126709, "global_step": 4531, "epoch": 54} {"train_loss": -17.154172897338867, "global_step": 4532, "epoch": 54} {"train_loss": -16.489721298217773, "global_step": 4533, "epoch": 54} {"train_loss": -16.977493286132812, "global_step": 4534, "epoch": 54} {"train_loss": -16.59052085876465, "global_step": 4535, "epoch": 54} {"train_loss": -16.50301170349121, "global_step": 4536, "epoch": 54} {"train_loss": -16.535680770874023, "global_step": 4537, "epoch": 54} {"train_loss": -17.193504333496094, "global_step": 4538, "epoch": 54} {"train_loss": -16.844093322753906, "global_step": 4539, "epoch": 54} {"train_loss": -16.823183059692383, "global_step": 4540, "epoch": 54} {"train_loss": -16.352834701538086, "global_step": 4541, "epoch": 54} {"train_loss": -16.983266830444336, "global_step": 4542, "epoch": 54} {"train_loss": -16.474851608276367, "global_step": 4543, "epoch": 54} {"train_loss": -16.63627815246582, "global_step": 4544, "epoch": 54} {"train_loss": -17.09511947631836, "global_step": 4545, "epoch": 54} {"train_loss": -16.526004791259766, "global_step": 4546, "epoch": 54} {"train_loss": -16.901525497436523, "global_step": 4547, "epoch": 54} {"train_loss": -16.900182723999023, "global_step": 4548, "epoch": 54} {"train_loss": -16.53657341003418, "global_step": 4549, "epoch": 54} {"train_loss": -16.90170669555664, "global_step": 4550, "epoch": 54} {"train_loss": -16.790857315063477, "global_step": 4551, "epoch": 54} {"train_loss": -16.403762817382812, "global_step": 4552, "epoch": 54} {"train_loss": -16.889163970947266, "global_step": 4553, "epoch": 54} {"train_loss": -17.296737670898438, "global_step": 4554, "epoch": 54} {"train_loss": -16.823354721069336, "global_step": 4555, "epoch": 54} {"train_loss": -16.788333892822266, "global_step": 4556, "epoch": 54} {"train_loss": -16.645780563354492, "global_step": 4557, "epoch": 54} {"train_loss": -16.96754264831543, "global_step": 4558, "epoch": 54} {"train_loss": -16.87027359008789, "global_step": 4559, "epoch": 54} {"train_loss": -16.743886947631836, "global_step": 4560, "epoch": 54} {"train_loss": -17.095895767211914, "global_step": 4561, "epoch": 54} {"train_loss": -16.88157081604004, "global_step": 4562, "epoch": 54} {"train_loss": -16.449140548706055, "global_step": 4563, "epoch": 54} {"train_loss": -16.717423668826918, "global_step": 4564, "epoch": 54, "val_loss": 6875827.0} {"train_loss": -16.877716064453125, "global_step": 4565, "epoch": 55} {"train_loss": -16.35848045349121, "global_step": 4566, "epoch": 55} {"train_loss": -16.526981353759766, "global_step": 4567, "epoch": 55} {"train_loss": -16.51988410949707, "global_step": 4568, "epoch": 55} {"train_loss": -16.884016036987305, "global_step": 4569, "epoch": 55} {"train_loss": -16.15801429748535, "global_step": 4570, "epoch": 55} {"train_loss": -16.40253257751465, "global_step": 4571, "epoch": 55} {"train_loss": -16.90584373474121, "global_step": 4572, "epoch": 55} {"train_loss": -16.643646240234375, "global_step": 4573, "epoch": 55} {"train_loss": -16.84747886657715, "global_step": 4574, "epoch": 55} {"train_loss": -16.779647827148438, "global_step": 4575, "epoch": 55} {"train_loss": -16.82191276550293, "global_step": 4576, "epoch": 55} {"train_loss": -16.45305824279785, "global_step": 4577, "epoch": 55} {"train_loss": -16.579986572265625, "global_step": 4578, "epoch": 55} {"train_loss": -16.97125244140625, "global_step": 4579, "epoch": 55} {"train_loss": -16.62468719482422, "global_step": 4580, "epoch": 55} {"train_loss": -16.79515266418457, "global_step": 4581, "epoch": 55} {"train_loss": -16.642650604248047, "global_step": 4582, "epoch": 55} {"train_loss": -16.518680572509766, "global_step": 4583, "epoch": 55} {"train_loss": -16.840362548828125, "global_step": 4584, "epoch": 55} {"train_loss": -16.829694747924805, "global_step": 4585, "epoch": 55} {"train_loss": -16.7056827545166, "global_step": 4586, "epoch": 55} {"train_loss": -17.0989990234375, "global_step": 4587, "epoch": 55} {"train_loss": -16.707860946655273, "global_step": 4588, "epoch": 55} {"train_loss": -16.9202938079834, "global_step": 4589, "epoch": 55} {"train_loss": -16.798425674438477, "global_step": 4590, "epoch": 55} {"train_loss": -16.986175537109375, "global_step": 4591, "epoch": 55} {"train_loss": -16.611108779907227, "global_step": 4592, "epoch": 55} {"train_loss": -17.07184410095215, "global_step": 4593, "epoch": 55} {"train_loss": -16.76496124267578, "global_step": 4594, "epoch": 55} {"train_loss": -16.77043342590332, "global_step": 4595, "epoch": 55} {"train_loss": -16.7794132232666, "global_step": 4596, "epoch": 55} {"train_loss": -16.497358322143555, "global_step": 4597, "epoch": 55} {"train_loss": -16.514301300048828, "global_step": 4598, "epoch": 55} {"train_loss": -16.70111656188965, "global_step": 4599, "epoch": 55} {"train_loss": -16.68389892578125, "global_step": 4600, "epoch": 55} {"train_loss": -17.03072738647461, "global_step": 4601, "epoch": 55} {"train_loss": -16.354904174804688, "global_step": 4602, "epoch": 55} {"train_loss": -16.959362030029297, "global_step": 4603, "epoch": 55} {"train_loss": -16.93455696105957, "global_step": 4604, "epoch": 55} {"train_loss": -16.36042022705078, "global_step": 4605, "epoch": 55} {"train_loss": -16.98438262939453, "global_step": 4606, "epoch": 55} {"train_loss": -17.272672653198242, "global_step": 4607, "epoch": 55} {"train_loss": -16.807748794555664, "global_step": 4608, "epoch": 55} {"train_loss": -16.630464553833008, "global_step": 4609, "epoch": 55} {"train_loss": -16.25338363647461, "global_step": 4610, "epoch": 55} {"train_loss": -16.663196563720703, "global_step": 4611, "epoch": 55} {"train_loss": -16.665658950805664, "global_step": 4612, "epoch": 55} {"train_loss": -16.647239685058594, "global_step": 4613, "epoch": 55} {"train_loss": -16.469791412353516, "global_step": 4614, "epoch": 55} {"train_loss": -16.755334854125977, "global_step": 4615, "epoch": 55} {"train_loss": -16.640823364257812, "global_step": 4616, "epoch": 55} {"train_loss": -17.15343475341797, "global_step": 4617, "epoch": 55} {"train_loss": -16.90937614440918, "global_step": 4618, "epoch": 55} {"train_loss": -16.62398338317871, "global_step": 4619, "epoch": 55} {"train_loss": -17.194080352783203, "global_step": 4620, "epoch": 55} {"train_loss": -16.743284225463867, "global_step": 4621, "epoch": 55} {"train_loss": -16.735742568969727, "global_step": 4622, "epoch": 55} {"train_loss": -16.82674217224121, "global_step": 4623, "epoch": 55} {"train_loss": -16.657817840576172, "global_step": 4624, "epoch": 55} {"train_loss": -16.84270668029785, "global_step": 4625, "epoch": 55} {"train_loss": -16.882780075073242, "global_step": 4626, "epoch": 55} {"train_loss": -17.0505428314209, "global_step": 4627, "epoch": 55} {"train_loss": -17.201902389526367, "global_step": 4628, "epoch": 55} {"train_loss": -17.064908981323242, "global_step": 4629, "epoch": 55} {"train_loss": -17.063627243041992, "global_step": 4630, "epoch": 55} {"train_loss": -16.563541412353516, "global_step": 4631, "epoch": 55} {"train_loss": -16.67949676513672, "global_step": 4632, "epoch": 55} {"train_loss": -16.794368743896484, "global_step": 4633, "epoch": 55} {"train_loss": -16.960372924804688, "global_step": 4634, "epoch": 55} {"train_loss": -16.810394287109375, "global_step": 4635, "epoch": 55} {"train_loss": -16.780752182006836, "global_step": 4636, "epoch": 55} {"train_loss": -17.00845718383789, "global_step": 4637, "epoch": 55} {"train_loss": -16.98647117614746, "global_step": 4638, "epoch": 55} {"train_loss": -17.006454467773438, "global_step": 4639, "epoch": 55} {"train_loss": -16.89816665649414, "global_step": 4640, "epoch": 55} {"train_loss": -16.943668365478516, "global_step": 4641, "epoch": 55} {"train_loss": -17.096019744873047, "global_step": 4642, "epoch": 55} {"train_loss": -16.32428550720215, "global_step": 4643, "epoch": 55} {"train_loss": -16.42268180847168, "global_step": 4644, "epoch": 55} {"train_loss": -16.895910263061523, "global_step": 4645, "epoch": 55} {"train_loss": -16.77240562438965, "global_step": 4646, "epoch": 55} {"train_loss": -16.769836035119482, "global_step": 4647, "epoch": 55, "val_loss": 6744460.0} {"train_loss": -16.65629005432129, "global_step": 4648, "epoch": 56} {"train_loss": -16.409204483032227, "global_step": 4649, "epoch": 56} {"train_loss": -16.661191940307617, "global_step": 4650, "epoch": 56} {"train_loss": -16.85029411315918, "global_step": 4651, "epoch": 56} {"train_loss": -16.908689498901367, "global_step": 4652, "epoch": 56} {"train_loss": -16.768335342407227, "global_step": 4653, "epoch": 56} {"train_loss": -17.10859489440918, "global_step": 4654, "epoch": 56} {"train_loss": -16.597517013549805, "global_step": 4655, "epoch": 56} {"train_loss": -16.6669979095459, "global_step": 4656, "epoch": 56} {"train_loss": -16.277679443359375, "global_step": 4657, "epoch": 56} {"train_loss": -16.453083038330078, "global_step": 4658, "epoch": 56} {"train_loss": -16.621252059936523, "global_step": 4659, "epoch": 56} {"train_loss": -16.793262481689453, "global_step": 4660, "epoch": 56} {"train_loss": -16.289846420288086, "global_step": 4661, "epoch": 56} {"train_loss": -16.72616958618164, "global_step": 4662, "epoch": 56} {"train_loss": -16.782506942749023, "global_step": 4663, "epoch": 56} {"train_loss": -16.692289352416992, "global_step": 4664, "epoch": 56} {"train_loss": -16.910764694213867, "global_step": 4665, "epoch": 56} {"train_loss": -16.8060245513916, "global_step": 4666, "epoch": 56} {"train_loss": -17.002470016479492, "global_step": 4667, "epoch": 56} {"train_loss": -16.756269454956055, "global_step": 4668, "epoch": 56} {"train_loss": -16.817943572998047, "global_step": 4669, "epoch": 56} {"train_loss": -16.9169864654541, "global_step": 4670, "epoch": 56} {"train_loss": -17.17184829711914, "global_step": 4671, "epoch": 56} {"train_loss": -16.626699447631836, "global_step": 4672, "epoch": 56} {"train_loss": -17.09639549255371, "global_step": 4673, "epoch": 56} {"train_loss": -16.72735023498535, "global_step": 4674, "epoch": 56} {"train_loss": -16.732650756835938, "global_step": 4675, "epoch": 56} {"train_loss": -17.19707679748535, "global_step": 4676, "epoch": 56} {"train_loss": -17.0144100189209, "global_step": 4677, "epoch": 56} {"train_loss": -17.33795738220215, "global_step": 4678, "epoch": 56} {"train_loss": -16.48647117614746, "global_step": 4679, "epoch": 56} {"train_loss": -17.041748046875, "global_step": 4680, "epoch": 56} {"train_loss": -16.933115005493164, "global_step": 4681, "epoch": 56} {"train_loss": -16.87764549255371, "global_step": 4682, "epoch": 56} {"train_loss": -17.084095001220703, "global_step": 4683, "epoch": 56} {"train_loss": -17.3532772064209, "global_step": 4684, "epoch": 56} {"train_loss": -17.01259422302246, "global_step": 4685, "epoch": 56} {"train_loss": -16.627473831176758, "global_step": 4686, "epoch": 56} {"train_loss": -16.89422035217285, "global_step": 4687, "epoch": 56} {"train_loss": -16.686683654785156, "global_step": 4688, "epoch": 56} {"train_loss": -16.854618072509766, "global_step": 4689, "epoch": 56} {"train_loss": -16.926593780517578, "global_step": 4690, "epoch": 56} {"train_loss": -17.011728286743164, "global_step": 4691, "epoch": 56} {"train_loss": -16.429336547851562, "global_step": 4692, "epoch": 56} {"train_loss": -17.050268173217773, "global_step": 4693, "epoch": 56} {"train_loss": -17.01662826538086, "global_step": 4694, "epoch": 56} {"train_loss": -16.61276626586914, "global_step": 4695, "epoch": 56} {"train_loss": -17.001821517944336, "global_step": 4696, "epoch": 56} {"train_loss": -17.08298683166504, "global_step": 4697, "epoch": 56} {"train_loss": -16.925931930541992, "global_step": 4698, "epoch": 56} {"train_loss": -17.209014892578125, "global_step": 4699, "epoch": 56} {"train_loss": -17.24650764465332, "global_step": 4700, "epoch": 56} {"train_loss": -16.982419967651367, "global_step": 4701, "epoch": 56} {"train_loss": -16.65875244140625, "global_step": 4702, "epoch": 56} {"train_loss": -17.192346572875977, "global_step": 4703, "epoch": 56} {"train_loss": -16.673227310180664, "global_step": 4704, "epoch": 56} {"train_loss": -16.93916893005371, "global_step": 4705, "epoch": 56} {"train_loss": -16.743391036987305, "global_step": 4706, "epoch": 56} {"train_loss": -16.579679489135742, "global_step": 4707, "epoch": 56} {"train_loss": -16.797801971435547, "global_step": 4708, "epoch": 56} {"train_loss": -16.95404052734375, "global_step": 4709, "epoch": 56} {"train_loss": -16.94114112854004, "global_step": 4710, "epoch": 56} {"train_loss": -16.344043731689453, "global_step": 4711, "epoch": 56} {"train_loss": -16.79439353942871, "global_step": 4712, "epoch": 56} {"train_loss": -16.884403228759766, "global_step": 4713, "epoch": 56} {"train_loss": -16.960500717163086, "global_step": 4714, "epoch": 56} {"train_loss": -16.89288902282715, "global_step": 4715, "epoch": 56} {"train_loss": -16.728803634643555, "global_step": 4716, "epoch": 56} {"train_loss": -16.327865600585938, "global_step": 4717, "epoch": 56} {"train_loss": -16.442182540893555, "global_step": 4718, "epoch": 56} {"train_loss": -17.095869064331055, "global_step": 4719, "epoch": 56} {"train_loss": -16.7703800201416, "global_step": 4720, "epoch": 56} {"train_loss": -17.024017333984375, "global_step": 4721, "epoch": 56} {"train_loss": -16.889904022216797, "global_step": 4722, "epoch": 56} {"train_loss": -16.920392990112305, "global_step": 4723, "epoch": 56} {"train_loss": -16.546689987182617, "global_step": 4724, "epoch": 56} {"train_loss": -16.831317901611328, "global_step": 4725, "epoch": 56} {"train_loss": -16.80238914489746, "global_step": 4726, "epoch": 56} {"train_loss": -16.542139053344727, "global_step": 4727, "epoch": 56} {"train_loss": -16.536056518554688, "global_step": 4728, "epoch": 56} {"train_loss": -16.956317901611328, "global_step": 4729, "epoch": 56} {"train_loss": -16.822403597544476, "global_step": 4730, "epoch": 56, "val_loss": 6816995.0} {"train_loss": -16.504657745361328, "global_step": 4731, "epoch": 57} {"train_loss": -16.467817306518555, "global_step": 4732, "epoch": 57} {"train_loss": -16.796377182006836, "global_step": 4733, "epoch": 57} {"train_loss": -16.630767822265625, "global_step": 4734, "epoch": 57} {"train_loss": -16.494953155517578, "global_step": 4735, "epoch": 57} {"train_loss": -16.520164489746094, "global_step": 4736, "epoch": 57} {"train_loss": -16.7711124420166, "global_step": 4737, "epoch": 57} {"train_loss": -16.884483337402344, "global_step": 4738, "epoch": 57} {"train_loss": -16.645681381225586, "global_step": 4739, "epoch": 57} {"train_loss": -16.980005264282227, "global_step": 4740, "epoch": 57} {"train_loss": -16.77239418029785, "global_step": 4741, "epoch": 57} {"train_loss": -16.958999633789062, "global_step": 4742, "epoch": 57} {"train_loss": -16.747909545898438, "global_step": 4743, "epoch": 57} {"train_loss": -16.46631622314453, "global_step": 4744, "epoch": 57} {"train_loss": -17.023529052734375, "global_step": 4745, "epoch": 57} {"train_loss": -16.74658203125, "global_step": 4746, "epoch": 57} {"train_loss": -16.621782302856445, "global_step": 4747, "epoch": 57} {"train_loss": -16.60943603515625, "global_step": 4748, "epoch": 57} {"train_loss": -17.117048263549805, "global_step": 4749, "epoch": 57} {"train_loss": -17.1658878326416, "global_step": 4750, "epoch": 57} {"train_loss": -16.7735652923584, "global_step": 4751, "epoch": 57} {"train_loss": -17.043336868286133, "global_step": 4752, "epoch": 57} {"train_loss": -16.722875595092773, "global_step": 4753, "epoch": 57} {"train_loss": -16.9559383392334, "global_step": 4754, "epoch": 57} {"train_loss": -16.825027465820312, "global_step": 4755, "epoch": 57} {"train_loss": -16.719696044921875, "global_step": 4756, "epoch": 57} {"train_loss": -16.457874298095703, "global_step": 4757, "epoch": 57} {"train_loss": -17.162769317626953, "global_step": 4758, "epoch": 57} {"train_loss": -17.245405197143555, "global_step": 4759, "epoch": 57} {"train_loss": -16.48282241821289, "global_step": 4760, "epoch": 57} {"train_loss": -17.086591720581055, "global_step": 4761, "epoch": 57} {"train_loss": -17.006284713745117, "global_step": 4762, "epoch": 57} {"train_loss": -16.540771484375, "global_step": 4763, "epoch": 57} {"train_loss": -16.836450576782227, "global_step": 4764, "epoch": 57} {"train_loss": -16.59952163696289, "global_step": 4765, "epoch": 57} {"train_loss": -16.676044464111328, "global_step": 4766, "epoch": 57} {"train_loss": -17.352375030517578, "global_step": 4767, "epoch": 57} {"train_loss": -17.117300033569336, "global_step": 4768, "epoch": 57} {"train_loss": -16.5195369720459, "global_step": 4769, "epoch": 57} {"train_loss": -16.995832443237305, "global_step": 4770, "epoch": 57} {"train_loss": -16.804086685180664, "global_step": 4771, "epoch": 57} {"train_loss": -16.873952865600586, "global_step": 4772, "epoch": 57} {"train_loss": -17.076053619384766, "global_step": 4773, "epoch": 57} {"train_loss": -16.636075973510742, "global_step": 4774, "epoch": 57} {"train_loss": -16.746129989624023, "global_step": 4775, "epoch": 57} {"train_loss": -16.427751541137695, "global_step": 4776, "epoch": 57} {"train_loss": -17.162506103515625, "global_step": 4777, "epoch": 57} {"train_loss": -16.855722427368164, "global_step": 4778, "epoch": 57} {"train_loss": -16.640094757080078, "global_step": 4779, "epoch": 57} {"train_loss": -17.208951950073242, "global_step": 4780, "epoch": 57} {"train_loss": -17.10431480407715, "global_step": 4781, "epoch": 57} {"train_loss": -16.549285888671875, "global_step": 4782, "epoch": 57} {"train_loss": -16.97475242614746, "global_step": 4783, "epoch": 57} {"train_loss": -16.527996063232422, "global_step": 4784, "epoch": 57} {"train_loss": -17.153549194335938, "global_step": 4785, "epoch": 57} {"train_loss": -16.753910064697266, "global_step": 4786, "epoch": 57} {"train_loss": -16.964645385742188, "global_step": 4787, "epoch": 57} {"train_loss": -16.905302047729492, "global_step": 4788, "epoch": 57} {"train_loss": -16.613996505737305, "global_step": 4789, "epoch": 57} {"train_loss": -17.101240158081055, "global_step": 4790, "epoch": 57} {"train_loss": -16.70163917541504, "global_step": 4791, "epoch": 57} {"train_loss": -16.916013717651367, "global_step": 4792, "epoch": 57} {"train_loss": -17.102909088134766, "global_step": 4793, "epoch": 57} {"train_loss": -16.56844711303711, "global_step": 4794, "epoch": 57} {"train_loss": -16.772489547729492, "global_step": 4795, "epoch": 57} {"train_loss": -16.707616806030273, "global_step": 4796, "epoch": 57} {"train_loss": -17.012691497802734, "global_step": 4797, "epoch": 57} {"train_loss": -16.735004425048828, "global_step": 4798, "epoch": 57} {"train_loss": -16.69443702697754, "global_step": 4799, "epoch": 57} {"train_loss": -17.115161895751953, "global_step": 4800, "epoch": 57} {"train_loss": -16.511751174926758, "global_step": 4801, "epoch": 57} {"train_loss": -16.97697639465332, "global_step": 4802, "epoch": 57} {"train_loss": -17.1539306640625, "global_step": 4803, "epoch": 57} {"train_loss": -16.732187271118164, "global_step": 4804, "epoch": 57} {"train_loss": -16.987689971923828, "global_step": 4805, "epoch": 57} {"train_loss": -16.84208869934082, "global_step": 4806, "epoch": 57} {"train_loss": -16.819074630737305, "global_step": 4807, "epoch": 57} {"train_loss": -16.72942543029785, "global_step": 4808, "epoch": 57} {"train_loss": -16.724340438842773, "global_step": 4809, "epoch": 57} {"train_loss": -16.6829891204834, "global_step": 4810, "epoch": 57} {"train_loss": -17.025226593017578, "global_step": 4811, "epoch": 57} {"train_loss": -16.8663330078125, "global_step": 4812, "epoch": 57} {"train_loss": -16.824529463986316, "global_step": 4813, "epoch": 57, "val_loss": 6915151.0} {"train_loss": -16.93050193786621, "global_step": 4814, "epoch": 58} {"train_loss": -16.784208297729492, "global_step": 4815, "epoch": 58} {"train_loss": -16.575302124023438, "global_step": 4816, "epoch": 58} {"train_loss": -16.434356689453125, "global_step": 4817, "epoch": 58} {"train_loss": -16.66416358947754, "global_step": 4818, "epoch": 58} {"train_loss": -16.86560821533203, "global_step": 4819, "epoch": 58} {"train_loss": -17.066213607788086, "global_step": 4820, "epoch": 58} {"train_loss": -16.489965438842773, "global_step": 4821, "epoch": 58} {"train_loss": -16.72000503540039, "global_step": 4822, "epoch": 58} {"train_loss": -16.09153175354004, "global_step": 4823, "epoch": 58} {"train_loss": -16.660898208618164, "global_step": 4824, "epoch": 58} {"train_loss": -17.061765670776367, "global_step": 4825, "epoch": 58} {"train_loss": -16.672021865844727, "global_step": 4826, "epoch": 58} {"train_loss": -17.02741813659668, "global_step": 4827, "epoch": 58} {"train_loss": -16.6671142578125, "global_step": 4828, "epoch": 58} {"train_loss": -16.532384872436523, "global_step": 4829, "epoch": 58} {"train_loss": -17.153181076049805, "global_step": 4830, "epoch": 58} {"train_loss": -16.548458099365234, "global_step": 4831, "epoch": 58} {"train_loss": -17.090864181518555, "global_step": 4832, "epoch": 58} {"train_loss": -16.772985458374023, "global_step": 4833, "epoch": 58} {"train_loss": -16.79536247253418, "global_step": 4834, "epoch": 58} {"train_loss": -16.767515182495117, "global_step": 4835, "epoch": 58} {"train_loss": -16.76899528503418, "global_step": 4836, "epoch": 58} {"train_loss": -16.44948959350586, "global_step": 4837, "epoch": 58} {"train_loss": -16.949249267578125, "global_step": 4838, "epoch": 58} {"train_loss": -16.671607971191406, "global_step": 4839, "epoch": 58} {"train_loss": -16.826936721801758, "global_step": 4840, "epoch": 58} {"train_loss": -16.579071044921875, "global_step": 4841, "epoch": 58} {"train_loss": -16.810861587524414, "global_step": 4842, "epoch": 58} {"train_loss": -16.752735137939453, "global_step": 4843, "epoch": 58} {"train_loss": -16.89887046813965, "global_step": 4844, "epoch": 58} {"train_loss": -16.77439308166504, "global_step": 4845, "epoch": 58} {"train_loss": -17.055078506469727, "global_step": 4846, "epoch": 58} {"train_loss": -17.109853744506836, "global_step": 4847, "epoch": 58} {"train_loss": -16.948163986206055, "global_step": 4848, "epoch": 58} {"train_loss": -16.744340896606445, "global_step": 4849, "epoch": 58} {"train_loss": -17.042739868164062, "global_step": 4850, "epoch": 58} {"train_loss": -16.7781982421875, "global_step": 4851, "epoch": 58} {"train_loss": -16.6491756439209, "global_step": 4852, "epoch": 58} {"train_loss": -17.137332916259766, "global_step": 4853, "epoch": 58} {"train_loss": -16.77888298034668, "global_step": 4854, "epoch": 58} {"train_loss": -16.991304397583008, "global_step": 4855, "epoch": 58} {"train_loss": -16.79640007019043, "global_step": 4856, "epoch": 58} {"train_loss": -17.017934799194336, "global_step": 4857, "epoch": 58} {"train_loss": -16.986051559448242, "global_step": 4858, "epoch": 58} {"train_loss": -17.353822708129883, "global_step": 4859, "epoch": 58} {"train_loss": -17.019250869750977, "global_step": 4860, "epoch": 58} {"train_loss": -16.71213722229004, "global_step": 4861, "epoch": 58} {"train_loss": -16.799739837646484, "global_step": 4862, "epoch": 58} {"train_loss": -16.955886840820312, "global_step": 4863, "epoch": 58} {"train_loss": -16.6860408782959, "global_step": 4864, "epoch": 58} {"train_loss": -16.635339736938477, "global_step": 4865, "epoch": 58} {"train_loss": -16.532636642456055, "global_step": 4866, "epoch": 58} {"train_loss": -17.147729873657227, "global_step": 4867, "epoch": 58} {"train_loss": -16.798147201538086, "global_step": 4868, "epoch": 58} {"train_loss": -16.80498504638672, "global_step": 4869, "epoch": 58} {"train_loss": -17.026559829711914, "global_step": 4870, "epoch": 58} {"train_loss": -17.0169677734375, "global_step": 4871, "epoch": 58} {"train_loss": -16.741626739501953, "global_step": 4872, "epoch": 58} {"train_loss": -16.859704971313477, "global_step": 4873, "epoch": 58} {"train_loss": -16.908124923706055, "global_step": 4874, "epoch": 58} {"train_loss": -16.6617431640625, "global_step": 4875, "epoch": 58} {"train_loss": -16.983591079711914, "global_step": 4876, "epoch": 58} {"train_loss": -16.657629013061523, "global_step": 4877, "epoch": 58} {"train_loss": -17.12989616394043, "global_step": 4878, "epoch": 58} {"train_loss": -16.49074363708496, "global_step": 4879, "epoch": 58} {"train_loss": -16.810588836669922, "global_step": 4880, "epoch": 58} {"train_loss": -17.30379867553711, "global_step": 4881, "epoch": 58} {"train_loss": -16.620019912719727, "global_step": 4882, "epoch": 58} {"train_loss": -16.98179054260254, "global_step": 4883, "epoch": 58} {"train_loss": -16.836332321166992, "global_step": 4884, "epoch": 58} {"train_loss": -16.886934280395508, "global_step": 4885, "epoch": 58} {"train_loss": -17.22260284423828, "global_step": 4886, "epoch": 58} {"train_loss": -16.84480857849121, "global_step": 4887, "epoch": 58} {"train_loss": -17.013532638549805, "global_step": 4888, "epoch": 58} {"train_loss": -16.88759994506836, "global_step": 4889, "epoch": 58} {"train_loss": -16.660383224487305, "global_step": 4890, "epoch": 58} {"train_loss": -17.01178550720215, "global_step": 4891, "epoch": 58} {"train_loss": -17.03815269470215, "global_step": 4892, "epoch": 58} {"train_loss": -17.179061889648438, "global_step": 4893, "epoch": 58} {"train_loss": -16.69571876525879, "global_step": 4894, "epoch": 58} {"train_loss": -16.762353897094727, "global_step": 4895, "epoch": 58} {"train_loss": -16.82393242939409, "global_step": 4896, "epoch": 58, "val_loss": 6777354.0} {"train_loss": -16.554107666015625, "global_step": 4897, "epoch": 59} {"train_loss": -16.646085739135742, "global_step": 4898, "epoch": 59} {"train_loss": -16.56640625, "global_step": 4899, "epoch": 59} {"train_loss": -16.761762619018555, "global_step": 4900, "epoch": 59} {"train_loss": -16.641447067260742, "global_step": 4901, "epoch": 59} {"train_loss": -16.712127685546875, "global_step": 4902, "epoch": 59} {"train_loss": -16.518840789794922, "global_step": 4903, "epoch": 59} {"train_loss": -16.523683547973633, "global_step": 4904, "epoch": 59} {"train_loss": -16.361684799194336, "global_step": 4905, "epoch": 59} {"train_loss": -16.838134765625, "global_step": 4906, "epoch": 59} {"train_loss": -16.46396255493164, "global_step": 4907, "epoch": 59} {"train_loss": -16.975385665893555, "global_step": 4908, "epoch": 59} {"train_loss": -16.773473739624023, "global_step": 4909, "epoch": 59} {"train_loss": -17.371604919433594, "global_step": 4910, "epoch": 59} {"train_loss": -16.86769676208496, "global_step": 4911, "epoch": 59} {"train_loss": -16.873945236206055, "global_step": 4912, "epoch": 59} {"train_loss": -16.90591812133789, "global_step": 4913, "epoch": 59} {"train_loss": -17.047330856323242, "global_step": 4914, "epoch": 59} {"train_loss": -16.618764877319336, "global_step": 4915, "epoch": 59} {"train_loss": -16.659622192382812, "global_step": 4916, "epoch": 59} {"train_loss": -16.756549835205078, "global_step": 4917, "epoch": 59} {"train_loss": -16.821020126342773, "global_step": 4918, "epoch": 59} {"train_loss": -16.84488868713379, "global_step": 4919, "epoch": 59} {"train_loss": -17.031400680541992, "global_step": 4920, "epoch": 59} {"train_loss": -17.11163902282715, "global_step": 4921, "epoch": 59} {"train_loss": -17.072113037109375, "global_step": 4922, "epoch": 59} {"train_loss": -17.05425453186035, "global_step": 4923, "epoch": 59} {"train_loss": -16.941640853881836, "global_step": 4924, "epoch": 59} {"train_loss": -16.711462020874023, "global_step": 4925, "epoch": 59} {"train_loss": -16.874271392822266, "global_step": 4926, "epoch": 59} {"train_loss": -16.81528091430664, "global_step": 4927, "epoch": 59} {"train_loss": -16.829904556274414, "global_step": 4928, "epoch": 59} {"train_loss": -17.01872444152832, "global_step": 4929, "epoch": 59} {"train_loss": -16.94978141784668, "global_step": 4930, "epoch": 59} {"train_loss": -16.869049072265625, "global_step": 4931, "epoch": 59} {"train_loss": -16.740427017211914, "global_step": 4932, "epoch": 59} {"train_loss": -16.598554611206055, "global_step": 4933, "epoch": 59} {"train_loss": -16.6763916015625, "global_step": 4934, "epoch": 59} {"train_loss": -16.491426467895508, "global_step": 4935, "epoch": 59} {"train_loss": -17.09526252746582, "global_step": 4936, "epoch": 59} {"train_loss": -17.210172653198242, "global_step": 4937, "epoch": 59} {"train_loss": -16.80373191833496, "global_step": 4938, "epoch": 59} {"train_loss": -17.085983276367188, "global_step": 4939, "epoch": 59} {"train_loss": -17.009498596191406, "global_step": 4940, "epoch": 59} {"train_loss": -16.4491024017334, "global_step": 4941, "epoch": 59} {"train_loss": -17.074970245361328, "global_step": 4942, "epoch": 59} {"train_loss": -17.006092071533203, "global_step": 4943, "epoch": 59} {"train_loss": -16.69528579711914, "global_step": 4944, "epoch": 59} {"train_loss": -17.014551162719727, "global_step": 4945, "epoch": 59} {"train_loss": -16.75539207458496, "global_step": 4946, "epoch": 59} {"train_loss": -16.836959838867188, "global_step": 4947, "epoch": 59} {"train_loss": -16.634536743164062, "global_step": 4948, "epoch": 59} {"train_loss": -16.967058181762695, "global_step": 4949, "epoch": 59} {"train_loss": -16.844711303710938, "global_step": 4950, "epoch": 59} {"train_loss": -16.81049919128418, "global_step": 4951, "epoch": 59} {"train_loss": -16.976057052612305, "global_step": 4952, "epoch": 59} {"train_loss": -16.81207847595215, "global_step": 4953, "epoch": 59} {"train_loss": -17.078632354736328, "global_step": 4954, "epoch": 59} {"train_loss": -17.40506935119629, "global_step": 4955, "epoch": 59} {"train_loss": -16.716276168823242, "global_step": 4956, "epoch": 59} {"train_loss": -16.50191307067871, "global_step": 4957, "epoch": 59} {"train_loss": -16.77214241027832, "global_step": 4958, "epoch": 59} {"train_loss": -17.2602596282959, "global_step": 4959, "epoch": 59} {"train_loss": -16.902605056762695, "global_step": 4960, "epoch": 59} {"train_loss": -16.956226348876953, "global_step": 4961, "epoch": 59} {"train_loss": -16.91070556640625, "global_step": 4962, "epoch": 59} {"train_loss": -17.1380672454834, "global_step": 4963, "epoch": 59} {"train_loss": -16.801862716674805, "global_step": 4964, "epoch": 59} {"train_loss": -16.99546241760254, "global_step": 4965, "epoch": 59} {"train_loss": -16.989652633666992, "global_step": 4966, "epoch": 59} {"train_loss": -16.954038619995117, "global_step": 4967, "epoch": 59} {"train_loss": -16.830671310424805, "global_step": 4968, "epoch": 59} {"train_loss": -16.856870651245117, "global_step": 4969, "epoch": 59} {"train_loss": -16.717788696289062, "global_step": 4970, "epoch": 59} {"train_loss": -16.763404846191406, "global_step": 4971, "epoch": 59} {"train_loss": -16.660402297973633, "global_step": 4972, "epoch": 59} {"train_loss": -17.24762535095215, "global_step": 4973, "epoch": 59} {"train_loss": -16.717700958251953, "global_step": 4974, "epoch": 59} {"train_loss": -16.626407623291016, "global_step": 4975, "epoch": 59} {"train_loss": -17.052894592285156, "global_step": 4976, "epoch": 59} {"train_loss": -16.778928756713867, "global_step": 4977, "epoch": 59} {"train_loss": -16.84041404724121, "global_step": 4978, "epoch": 59} {"train_loss": -16.847937043890894, "global_step": 4979, "epoch": 59, "val_loss": 6886415.0} {"train_loss": -16.41371726989746, "global_step": 4980, "epoch": 60} {"train_loss": -16.97663116455078, "global_step": 4981, "epoch": 60} {"train_loss": -16.9415225982666, "global_step": 4982, "epoch": 60} {"train_loss": -16.486722946166992, "global_step": 4983, "epoch": 60} {"train_loss": -17.096601486206055, "global_step": 4984, "epoch": 60} {"train_loss": -16.956266403198242, "global_step": 4985, "epoch": 60} {"train_loss": -16.630964279174805, "global_step": 4986, "epoch": 60} {"train_loss": -16.792362213134766, "global_step": 4987, "epoch": 60} {"train_loss": -16.60639762878418, "global_step": 4988, "epoch": 60} {"train_loss": -16.928512573242188, "global_step": 4989, "epoch": 60} {"train_loss": -17.04286003112793, "global_step": 4990, "epoch": 60} {"train_loss": -16.88959312438965, "global_step": 4991, "epoch": 60} {"train_loss": -16.869613647460938, "global_step": 4992, "epoch": 60} {"train_loss": -17.009578704833984, "global_step": 4993, "epoch": 60} {"train_loss": -16.588090896606445, "global_step": 4994, "epoch": 60} {"train_loss": -16.726560592651367, "global_step": 4995, "epoch": 60} {"train_loss": -16.709882736206055, "global_step": 4996, "epoch": 60} {"train_loss": -16.69097900390625, "global_step": 4997, "epoch": 60} {"train_loss": -16.660114288330078, "global_step": 4998, "epoch": 60} {"train_loss": -16.831663131713867, "global_step": 4999, "epoch": 60} {"train_loss": -17.052549362182617, "global_step": 5000, "epoch": 60} {"train_loss": -16.953153610229492, "global_step": 5001, "epoch": 60} {"train_loss": -16.81110191345215, "global_step": 5002, "epoch": 60} {"train_loss": -16.586477279663086, "global_step": 5003, "epoch": 60} {"train_loss": -17.024625778198242, "global_step": 5004, "epoch": 60} {"train_loss": -16.84372901916504, "global_step": 5005, "epoch": 60} {"train_loss": -17.060007095336914, "global_step": 5006, "epoch": 60} {"train_loss": -16.92997169494629, "global_step": 5007, "epoch": 60} {"train_loss": -16.93979835510254, "global_step": 5008, "epoch": 60} {"train_loss": -16.79374122619629, "global_step": 5009, "epoch": 60} {"train_loss": -17.043487548828125, "global_step": 5010, "epoch": 60} {"train_loss": -16.838247299194336, "global_step": 5011, "epoch": 60} {"train_loss": -17.028318405151367, "global_step": 5012, "epoch": 60} {"train_loss": -17.019060134887695, "global_step": 5013, "epoch": 60} {"train_loss": -17.20062828063965, "global_step": 5014, "epoch": 60} {"train_loss": -17.269086837768555, "global_step": 5015, "epoch": 60} {"train_loss": -17.03139305114746, "global_step": 5016, "epoch": 60} {"train_loss": -17.01476287841797, "global_step": 5017, "epoch": 60} {"train_loss": -16.444732666015625, "global_step": 5018, "epoch": 60} {"train_loss": -16.8083438873291, "global_step": 5019, "epoch": 60} {"train_loss": -17.211673736572266, "global_step": 5020, "epoch": 60} {"train_loss": -16.989269256591797, "global_step": 5021, "epoch": 60} {"train_loss": -16.893930435180664, "global_step": 5022, "epoch": 60} {"train_loss": -16.80360984802246, "global_step": 5023, "epoch": 60} {"train_loss": -16.87009048461914, "global_step": 5024, "epoch": 60} {"train_loss": -17.14398765563965, "global_step": 5025, "epoch": 60} {"train_loss": -16.900236129760742, "global_step": 5026, "epoch": 60} {"train_loss": -17.251544952392578, "global_step": 5027, "epoch": 60} {"train_loss": -17.173946380615234, "global_step": 5028, "epoch": 60} {"train_loss": -17.3160400390625, "global_step": 5029, "epoch": 60} {"train_loss": -17.136259078979492, "global_step": 5030, "epoch": 60} {"train_loss": -16.916860580444336, "global_step": 5031, "epoch": 60} {"train_loss": -16.834671020507812, "global_step": 5032, "epoch": 60} {"train_loss": -16.528125762939453, "global_step": 5033, "epoch": 60} {"train_loss": -16.88773536682129, "global_step": 5034, "epoch": 60} {"train_loss": -16.76930809020996, "global_step": 5035, "epoch": 60} {"train_loss": -17.265708923339844, "global_step": 5036, "epoch": 60} {"train_loss": -16.3292293548584, "global_step": 5037, "epoch": 60} {"train_loss": -16.632089614868164, "global_step": 5038, "epoch": 60} {"train_loss": -17.19328498840332, "global_step": 5039, "epoch": 60} {"train_loss": -17.01109504699707, "global_step": 5040, "epoch": 60} {"train_loss": -16.601850509643555, "global_step": 5041, "epoch": 60} {"train_loss": -17.098812103271484, "global_step": 5042, "epoch": 60} {"train_loss": -16.95054054260254, "global_step": 5043, "epoch": 60} {"train_loss": -16.70710563659668, "global_step": 5044, "epoch": 60} {"train_loss": -16.992145538330078, "global_step": 5045, "epoch": 60} {"train_loss": -16.63838005065918, "global_step": 5046, "epoch": 60} {"train_loss": -16.920196533203125, "global_step": 5047, "epoch": 60} {"train_loss": -17.031204223632812, "global_step": 5048, "epoch": 60} {"train_loss": -16.71022605895996, "global_step": 5049, "epoch": 60} {"train_loss": -16.7883243560791, "global_step": 5050, "epoch": 60} {"train_loss": -16.558942794799805, "global_step": 5051, "epoch": 60} {"train_loss": -16.795331954956055, "global_step": 5052, "epoch": 60} {"train_loss": -16.970088958740234, "global_step": 5053, "epoch": 60} {"train_loss": -16.50303077697754, "global_step": 5054, "epoch": 60} {"train_loss": -16.805133819580078, "global_step": 5055, "epoch": 60} {"train_loss": -17.050992965698242, "global_step": 5056, "epoch": 60} {"train_loss": -16.8511905670166, "global_step": 5057, "epoch": 60} {"train_loss": -16.957162857055664, "global_step": 5058, "epoch": 60} {"train_loss": -16.8701171875, "global_step": 5059, "epoch": 60} {"train_loss": -17.116365432739258, "global_step": 5060, "epoch": 60} {"train_loss": -17.05739402770996, "global_step": 5061, "epoch": 60} {"train_loss": -16.886451882052135, "global_step": 5062, "epoch": 60, "val_loss": 6827168.0} {"train_loss": -16.99734878540039, "global_step": 5063, "epoch": 61} {"train_loss": -16.705707550048828, "global_step": 5064, "epoch": 61} {"train_loss": -16.510366439819336, "global_step": 5065, "epoch": 61} {"train_loss": -16.547748565673828, "global_step": 5066, "epoch": 61} {"train_loss": -16.5304012298584, "global_step": 5067, "epoch": 61} {"train_loss": -16.438657760620117, "global_step": 5068, "epoch": 61} {"train_loss": -17.05731773376465, "global_step": 5069, "epoch": 61} {"train_loss": -17.074155807495117, "global_step": 5070, "epoch": 61} {"train_loss": -16.870161056518555, "global_step": 5071, "epoch": 61} {"train_loss": -16.6696720123291, "global_step": 5072, "epoch": 61} {"train_loss": -17.01823616027832, "global_step": 5073, "epoch": 61} {"train_loss": -17.126436233520508, "global_step": 5074, "epoch": 61} {"train_loss": -17.224088668823242, "global_step": 5075, "epoch": 61} {"train_loss": -16.54215431213379, "global_step": 5076, "epoch": 61} {"train_loss": -16.880958557128906, "global_step": 5077, "epoch": 61} {"train_loss": -17.110204696655273, "global_step": 5078, "epoch": 61} {"train_loss": -16.614255905151367, "global_step": 5079, "epoch": 61} {"train_loss": -17.42453384399414, "global_step": 5080, "epoch": 61} {"train_loss": -16.993146896362305, "global_step": 5081, "epoch": 61} {"train_loss": -17.069982528686523, "global_step": 5082, "epoch": 61} {"train_loss": -16.920269012451172, "global_step": 5083, "epoch": 61} {"train_loss": -16.455015182495117, "global_step": 5084, "epoch": 61} {"train_loss": -17.04685401916504, "global_step": 5085, "epoch": 61} {"train_loss": -16.940570831298828, "global_step": 5086, "epoch": 61} {"train_loss": -16.915990829467773, "global_step": 5087, "epoch": 61} {"train_loss": -16.792190551757812, "global_step": 5088, "epoch": 61} {"train_loss": -16.57110023498535, "global_step": 5089, "epoch": 61} {"train_loss": -16.876136779785156, "global_step": 5090, "epoch": 61} {"train_loss": -16.77902603149414, "global_step": 5091, "epoch": 61} {"train_loss": -17.048553466796875, "global_step": 5092, "epoch": 61} {"train_loss": -16.794631958007812, "global_step": 5093, "epoch": 61} {"train_loss": -16.96379280090332, "global_step": 5094, "epoch": 61} {"train_loss": -16.946701049804688, "global_step": 5095, "epoch": 61} {"train_loss": -17.06397819519043, "global_step": 5096, "epoch": 61} {"train_loss": -16.525068283081055, "global_step": 5097, "epoch": 61} {"train_loss": -16.73902702331543, "global_step": 5098, "epoch": 61} {"train_loss": -16.98128318786621, "global_step": 5099, "epoch": 61} {"train_loss": -16.81162452697754, "global_step": 5100, "epoch": 61} {"train_loss": -16.847553253173828, "global_step": 5101, "epoch": 61} {"train_loss": -16.42011070251465, "global_step": 5102, "epoch": 61} {"train_loss": -17.174100875854492, "global_step": 5103, "epoch": 61} {"train_loss": -16.923391342163086, "global_step": 5104, "epoch": 61} {"train_loss": -17.238428115844727, "global_step": 5105, "epoch": 61} {"train_loss": -17.014841079711914, "global_step": 5106, "epoch": 61} {"train_loss": -17.0612735748291, "global_step": 5107, "epoch": 61} {"train_loss": -16.859039306640625, "global_step": 5108, "epoch": 61} {"train_loss": -16.84157371520996, "global_step": 5109, "epoch": 61} {"train_loss": -17.094467163085938, "global_step": 5110, "epoch": 61} {"train_loss": -16.99056053161621, "global_step": 5111, "epoch": 61} {"train_loss": -16.961402893066406, "global_step": 5112, "epoch": 61} {"train_loss": -16.947725296020508, "global_step": 5113, "epoch": 61} {"train_loss": -16.783058166503906, "global_step": 5114, "epoch": 61} {"train_loss": -16.934843063354492, "global_step": 5115, "epoch": 61} {"train_loss": -16.658451080322266, "global_step": 5116, "epoch": 61} {"train_loss": -16.964141845703125, "global_step": 5117, "epoch": 61} {"train_loss": -17.165729522705078, "global_step": 5118, "epoch": 61} {"train_loss": -17.070446014404297, "global_step": 5119, "epoch": 61} {"train_loss": -17.0623836517334, "global_step": 5120, "epoch": 61} {"train_loss": -17.211637496948242, "global_step": 5121, "epoch": 61} {"train_loss": -17.170364379882812, "global_step": 5122, "epoch": 61} {"train_loss": -16.757081985473633, "global_step": 5123, "epoch": 61} {"train_loss": -17.110790252685547, "global_step": 5124, "epoch": 61} {"train_loss": -16.62239646911621, "global_step": 5125, "epoch": 61} {"train_loss": -16.704788208007812, "global_step": 5126, "epoch": 61} {"train_loss": -17.149648666381836, "global_step": 5127, "epoch": 61} {"train_loss": -16.955698013305664, "global_step": 5128, "epoch": 61} {"train_loss": -16.853418350219727, "global_step": 5129, "epoch": 61} {"train_loss": -17.02568817138672, "global_step": 5130, "epoch": 61} {"train_loss": -17.005006790161133, "global_step": 5131, "epoch": 61} {"train_loss": -16.600849151611328, "global_step": 5132, "epoch": 61} {"train_loss": -16.906940460205078, "global_step": 5133, "epoch": 61} {"train_loss": -16.906192779541016, "global_step": 5134, "epoch": 61} {"train_loss": -16.80401611328125, "global_step": 5135, "epoch": 61} {"train_loss": -16.529218673706055, "global_step": 5136, "epoch": 61} {"train_loss": -16.829574584960938, "global_step": 5137, "epoch": 61} {"train_loss": -16.75444984436035, "global_step": 5138, "epoch": 61} {"train_loss": -16.81275749206543, "global_step": 5139, "epoch": 61} {"train_loss": -16.731409072875977, "global_step": 5140, "epoch": 61} {"train_loss": -16.917295455932617, "global_step": 5141, "epoch": 61} {"train_loss": -16.68669891357422, "global_step": 5142, "epoch": 61} {"train_loss": -17.077754974365234, "global_step": 5143, "epoch": 61} {"train_loss": -17.694255828857422, "global_step": 5144, "epoch": 61} {"train_loss": -16.890664158097234, "global_step": 5145, "epoch": 61, "val_loss": 6701046.5} {"train_loss": -17.035444259643555, "global_step": 5146, "epoch": 62} {"train_loss": -16.4880313873291, "global_step": 5147, "epoch": 62} {"train_loss": -17.024276733398438, "global_step": 5148, "epoch": 62} {"train_loss": -16.78473472595215, "global_step": 5149, "epoch": 62} {"train_loss": -16.79782485961914, "global_step": 5150, "epoch": 62} {"train_loss": -16.56964683532715, "global_step": 5151, "epoch": 62} {"train_loss": -16.78792381286621, "global_step": 5152, "epoch": 62} {"train_loss": -16.811250686645508, "global_step": 5153, "epoch": 62} {"train_loss": -16.904216766357422, "global_step": 5154, "epoch": 62} {"train_loss": -17.199670791625977, "global_step": 5155, "epoch": 62} {"train_loss": -16.848798751831055, "global_step": 5156, "epoch": 62} {"train_loss": -16.88892936706543, "global_step": 5157, "epoch": 62} {"train_loss": -16.838903427124023, "global_step": 5158, "epoch": 62} {"train_loss": -16.728321075439453, "global_step": 5159, "epoch": 62} {"train_loss": -16.521108627319336, "global_step": 5160, "epoch": 62} {"train_loss": -16.763805389404297, "global_step": 5161, "epoch": 62} {"train_loss": -17.070837020874023, "global_step": 5162, "epoch": 62} {"train_loss": -16.63100242614746, "global_step": 5163, "epoch": 62} {"train_loss": -16.851024627685547, "global_step": 5164, "epoch": 62} {"train_loss": -16.683584213256836, "global_step": 5165, "epoch": 62} {"train_loss": -17.284061431884766, "global_step": 5166, "epoch": 62} {"train_loss": -16.699296951293945, "global_step": 5167, "epoch": 62} {"train_loss": -16.832462310791016, "global_step": 5168, "epoch": 62} {"train_loss": -16.866931915283203, "global_step": 5169, "epoch": 62} {"train_loss": -16.655410766601562, "global_step": 5170, "epoch": 62} {"train_loss": -16.779640197753906, "global_step": 5171, "epoch": 62} {"train_loss": -16.981901168823242, "global_step": 5172, "epoch": 62} {"train_loss": -16.842483520507812, "global_step": 5173, "epoch": 62} {"train_loss": -17.229629516601562, "global_step": 5174, "epoch": 62} {"train_loss": -17.24403953552246, "global_step": 5175, "epoch": 62} {"train_loss": -17.198915481567383, "global_step": 5176, "epoch": 62} {"train_loss": -16.682029724121094, "global_step": 5177, "epoch": 62} {"train_loss": -16.702484130859375, "global_step": 5178, "epoch": 62} {"train_loss": -17.391010284423828, "global_step": 5179, "epoch": 62} {"train_loss": -16.62233543395996, "global_step": 5180, "epoch": 62} {"train_loss": -16.757190704345703, "global_step": 5181, "epoch": 62} {"train_loss": -17.281299591064453, "global_step": 5182, "epoch": 62} {"train_loss": -16.984169006347656, "global_step": 5183, "epoch": 62} {"train_loss": -16.91563606262207, "global_step": 5184, "epoch": 62} {"train_loss": -16.610321044921875, "global_step": 5185, "epoch": 62} {"train_loss": -17.014623641967773, "global_step": 5186, "epoch": 62} {"train_loss": -17.114667892456055, "global_step": 5187, "epoch": 62} {"train_loss": -16.776151657104492, "global_step": 5188, "epoch": 62} {"train_loss": -17.308372497558594, "global_step": 5189, "epoch": 62} {"train_loss": -17.06026268005371, "global_step": 5190, "epoch": 62} {"train_loss": -17.137371063232422, "global_step": 5191, "epoch": 62} {"train_loss": -16.908309936523438, "global_step": 5192, "epoch": 62} {"train_loss": -16.751800537109375, "global_step": 5193, "epoch": 62} {"train_loss": -16.75286293029785, "global_step": 5194, "epoch": 62} {"train_loss": -17.0379638671875, "global_step": 5195, "epoch": 62} {"train_loss": -16.9456787109375, "global_step": 5196, "epoch": 62} {"train_loss": -17.462078094482422, "global_step": 5197, "epoch": 62} {"train_loss": -17.055383682250977, "global_step": 5198, "epoch": 62} {"train_loss": -16.87250328063965, "global_step": 5199, "epoch": 62} {"train_loss": -17.144258499145508, "global_step": 5200, "epoch": 62} {"train_loss": -16.850955963134766, "global_step": 5201, "epoch": 62} {"train_loss": -16.81421661376953, "global_step": 5202, "epoch": 62} {"train_loss": -17.195932388305664, "global_step": 5203, "epoch": 62} {"train_loss": -16.987173080444336, "global_step": 5204, "epoch": 62} {"train_loss": -17.154428482055664, "global_step": 5205, "epoch": 62} {"train_loss": -16.712995529174805, "global_step": 5206, "epoch": 62} {"train_loss": -16.617189407348633, "global_step": 5207, "epoch": 62} {"train_loss": -17.039260864257812, "global_step": 5208, "epoch": 62} {"train_loss": -17.316722869873047, "global_step": 5209, "epoch": 62} {"train_loss": -16.955673217773438, "global_step": 5210, "epoch": 62} {"train_loss": -16.862049102783203, "global_step": 5211, "epoch": 62} {"train_loss": -16.735355377197266, "global_step": 5212, "epoch": 62} {"train_loss": -16.863449096679688, "global_step": 5213, "epoch": 62} {"train_loss": -16.576642990112305, "global_step": 5214, "epoch": 62} {"train_loss": -17.113718032836914, "global_step": 5215, "epoch": 62} {"train_loss": -16.603872299194336, "global_step": 5216, "epoch": 62} {"train_loss": -17.28656578063965, "global_step": 5217, "epoch": 62} {"train_loss": -17.420032501220703, "global_step": 5218, "epoch": 62} {"train_loss": -16.840747833251953, "global_step": 5219, "epoch": 62} {"train_loss": -16.734182357788086, "global_step": 5220, "epoch": 62} {"train_loss": -17.00128746032715, "global_step": 5221, "epoch": 62} {"train_loss": -16.80392074584961, "global_step": 5222, "epoch": 62} {"train_loss": -17.170856475830078, "global_step": 5223, "epoch": 62} {"train_loss": -17.255043029785156, "global_step": 5224, "epoch": 62} {"train_loss": -17.202539443969727, "global_step": 5225, "epoch": 62} {"train_loss": -17.185575485229492, "global_step": 5226, "epoch": 62} {"train_loss": -17.075143814086914, "global_step": 5227, "epoch": 62} {"train_loss": -16.940538199551135, "global_step": 5228, "epoch": 62, "val_loss": 6700235.0} {"train_loss": -16.152286529541016, "global_step": 5229, "epoch": 63} {"train_loss": -16.94907569885254, "global_step": 5230, "epoch": 63} {"train_loss": -16.699848175048828, "global_step": 5231, "epoch": 63} {"train_loss": -17.045516967773438, "global_step": 5232, "epoch": 63} {"train_loss": -17.245107650756836, "global_step": 5233, "epoch": 63} {"train_loss": -16.965288162231445, "global_step": 5234, "epoch": 63} {"train_loss": -16.512691497802734, "global_step": 5235, "epoch": 63} {"train_loss": -16.768173217773438, "global_step": 5236, "epoch": 63} {"train_loss": -17.0273380279541, "global_step": 5237, "epoch": 63} {"train_loss": -16.853010177612305, "global_step": 5238, "epoch": 63} {"train_loss": -16.93889808654785, "global_step": 5239, "epoch": 63} {"train_loss": -16.93122673034668, "global_step": 5240, "epoch": 63} {"train_loss": -16.754423141479492, "global_step": 5241, "epoch": 63} {"train_loss": -17.054899215698242, "global_step": 5242, "epoch": 63} {"train_loss": -17.211816787719727, "global_step": 5243, "epoch": 63} {"train_loss": -16.850051879882812, "global_step": 5244, "epoch": 63} {"train_loss": -17.270278930664062, "global_step": 5245, "epoch": 63} {"train_loss": -16.449289321899414, "global_step": 5246, "epoch": 63} {"train_loss": -17.106843948364258, "global_step": 5247, "epoch": 63} {"train_loss": -16.697246551513672, "global_step": 5248, "epoch": 63} {"train_loss": -16.687698364257812, "global_step": 5249, "epoch": 63} {"train_loss": -16.968252182006836, "global_step": 5250, "epoch": 63} {"train_loss": -17.070833206176758, "global_step": 5251, "epoch": 63} {"train_loss": -16.736143112182617, "global_step": 5252, "epoch": 63} {"train_loss": -16.90669059753418, "global_step": 5253, "epoch": 63} {"train_loss": -16.86541748046875, "global_step": 5254, "epoch": 63} {"train_loss": -17.055282592773438, "global_step": 5255, "epoch": 63} {"train_loss": -17.010129928588867, "global_step": 5256, "epoch": 63} {"train_loss": -16.68732452392578, "global_step": 5257, "epoch": 63} {"train_loss": -16.938447952270508, "global_step": 5258, "epoch": 63} {"train_loss": -17.348941802978516, "global_step": 5259, "epoch": 63} {"train_loss": -17.13345718383789, "global_step": 5260, "epoch": 63} {"train_loss": -17.029338836669922, "global_step": 5261, "epoch": 63} {"train_loss": -16.879013061523438, "global_step": 5262, "epoch": 63} {"train_loss": -16.787246704101562, "global_step": 5263, "epoch": 63} {"train_loss": -16.875808715820312, "global_step": 5264, "epoch": 63} {"train_loss": -17.110015869140625, "global_step": 5265, "epoch": 63} {"train_loss": -17.24793243408203, "global_step": 5266, "epoch": 63} {"train_loss": -16.445255279541016, "global_step": 5267, "epoch": 63} {"train_loss": -16.95170021057129, "global_step": 5268, "epoch": 63} {"train_loss": -17.207944869995117, "global_step": 5269, "epoch": 63} {"train_loss": -16.820125579833984, "global_step": 5270, "epoch": 63} {"train_loss": -16.85592269897461, "global_step": 5271, "epoch": 63} {"train_loss": -17.095914840698242, "global_step": 5272, "epoch": 63} {"train_loss": -17.511619567871094, "global_step": 5273, "epoch": 63} {"train_loss": -16.942716598510742, "global_step": 5274, "epoch": 63} {"train_loss": -17.08530616760254, "global_step": 5275, "epoch": 63} {"train_loss": -17.27035903930664, "global_step": 5276, "epoch": 63} {"train_loss": -17.10597038269043, "global_step": 5277, "epoch": 63} {"train_loss": -17.105093002319336, "global_step": 5278, "epoch": 63} {"train_loss": -17.105051040649414, "global_step": 5279, "epoch": 63} {"train_loss": -17.001949310302734, "global_step": 5280, "epoch": 63} {"train_loss": -17.280057907104492, "global_step": 5281, "epoch": 63} {"train_loss": -16.861427307128906, "global_step": 5282, "epoch": 63} {"train_loss": -17.221118927001953, "global_step": 5283, "epoch": 63} {"train_loss": -16.743314743041992, "global_step": 5284, "epoch": 63} {"train_loss": -16.6892147064209, "global_step": 5285, "epoch": 63} {"train_loss": -17.2570743560791, "global_step": 5286, "epoch": 63} {"train_loss": -16.815353393554688, "global_step": 5287, "epoch": 63} {"train_loss": -16.758596420288086, "global_step": 5288, "epoch": 63} {"train_loss": -17.06197166442871, "global_step": 5289, "epoch": 63} {"train_loss": -17.415237426757812, "global_step": 5290, "epoch": 63} {"train_loss": -17.256427764892578, "global_step": 5291, "epoch": 63} {"train_loss": -17.40230369567871, "global_step": 5292, "epoch": 63} {"train_loss": -16.720895767211914, "global_step": 5293, "epoch": 63} {"train_loss": -16.68621826171875, "global_step": 5294, "epoch": 63} {"train_loss": -16.9156494140625, "global_step": 5295, "epoch": 63} {"train_loss": -16.94406509399414, "global_step": 5296, "epoch": 63} {"train_loss": -16.928678512573242, "global_step": 5297, "epoch": 63} {"train_loss": -16.78229522705078, "global_step": 5298, "epoch": 63} {"train_loss": -16.975114822387695, "global_step": 5299, "epoch": 63} {"train_loss": -17.07708740234375, "global_step": 5300, "epoch": 63} {"train_loss": -17.204936981201172, "global_step": 5301, "epoch": 63} {"train_loss": -16.858871459960938, "global_step": 5302, "epoch": 63} {"train_loss": -16.92091941833496, "global_step": 5303, "epoch": 63} {"train_loss": -17.0339298248291, "global_step": 5304, "epoch": 63} {"train_loss": -16.530363082885742, "global_step": 5305, "epoch": 63} {"train_loss": -17.192893981933594, "global_step": 5306, "epoch": 63} {"train_loss": -17.037382125854492, "global_step": 5307, "epoch": 63} {"train_loss": -16.7685604095459, "global_step": 5308, "epoch": 63} {"train_loss": -16.990558624267578, "global_step": 5309, "epoch": 63} {"train_loss": -16.912099838256836, "global_step": 5310, "epoch": 63} {"train_loss": -16.956770081117927, "global_step": 5311, "epoch": 63, "val_loss": 6600626.0} {"train_loss": -16.592344284057617, "global_step": 5312, "epoch": 64} {"train_loss": -15.819938659667969, "global_step": 5313, "epoch": 64} {"train_loss": -17.23029136657715, "global_step": 5314, "epoch": 64} {"train_loss": -16.684833526611328, "global_step": 5315, "epoch": 64} {"train_loss": -16.70002555847168, "global_step": 5316, "epoch": 64} {"train_loss": -16.907665252685547, "global_step": 5317, "epoch": 64} {"train_loss": -16.838998794555664, "global_step": 5318, "epoch": 64} {"train_loss": -16.58968162536621, "global_step": 5319, "epoch": 64} {"train_loss": -17.130460739135742, "global_step": 5320, "epoch": 64} {"train_loss": -16.95729637145996, "global_step": 5321, "epoch": 64} {"train_loss": -16.725196838378906, "global_step": 5322, "epoch": 64} {"train_loss": -16.81801414489746, "global_step": 5323, "epoch": 64} {"train_loss": -17.109956741333008, "global_step": 5324, "epoch": 64} {"train_loss": -17.052152633666992, "global_step": 5325, "epoch": 64} {"train_loss": -17.343046188354492, "global_step": 5326, "epoch": 64} {"train_loss": -17.04112434387207, "global_step": 5327, "epoch": 64} {"train_loss": -17.275468826293945, "global_step": 5328, "epoch": 64} {"train_loss": -17.206283569335938, "global_step": 5329, "epoch": 64} {"train_loss": -17.02362632751465, "global_step": 5330, "epoch": 64} {"train_loss": -16.764463424682617, "global_step": 5331, "epoch": 64} {"train_loss": -17.590377807617188, "global_step": 5332, "epoch": 64} {"train_loss": -16.86952018737793, "global_step": 5333, "epoch": 64} {"train_loss": -16.67599868774414, "global_step": 5334, "epoch": 64} {"train_loss": -16.917470932006836, "global_step": 5335, "epoch": 64} {"train_loss": -17.16106605529785, "global_step": 5336, "epoch": 64} {"train_loss": -16.762510299682617, "global_step": 5337, "epoch": 64} {"train_loss": -16.85109519958496, "global_step": 5338, "epoch": 64} {"train_loss": -17.185012817382812, "global_step": 5339, "epoch": 64} {"train_loss": -16.750761032104492, "global_step": 5340, "epoch": 64} {"train_loss": -17.070392608642578, "global_step": 5341, "epoch": 64} {"train_loss": -17.45759391784668, "global_step": 5342, "epoch": 64} {"train_loss": -16.605262756347656, "global_step": 5343, "epoch": 64} {"train_loss": -16.944425582885742, "global_step": 5344, "epoch": 64} {"train_loss": -17.28192710876465, "global_step": 5345, "epoch": 64} {"train_loss": -16.867944717407227, "global_step": 5346, "epoch": 64} {"train_loss": -16.855121612548828, "global_step": 5347, "epoch": 64} {"train_loss": -16.9200496673584, "global_step": 5348, "epoch": 64} {"train_loss": -16.61665916442871, "global_step": 5349, "epoch": 64} {"train_loss": -17.228830337524414, "global_step": 5350, "epoch": 64} {"train_loss": -17.04928207397461, "global_step": 5351, "epoch": 64} {"train_loss": -17.20825958251953, "global_step": 5352, "epoch": 64} {"train_loss": -16.905136108398438, "global_step": 5353, "epoch": 64} {"train_loss": -17.23732566833496, "global_step": 5354, "epoch": 64} {"train_loss": -16.97411346435547, "global_step": 5355, "epoch": 64} {"train_loss": -16.724721908569336, "global_step": 5356, "epoch": 64} {"train_loss": -16.4803524017334, "global_step": 5357, "epoch": 64} {"train_loss": -16.847562789916992, "global_step": 5358, "epoch": 64} {"train_loss": -16.86587905883789, "global_step": 5359, "epoch": 64} {"train_loss": -17.05242347717285, "global_step": 5360, "epoch": 64} {"train_loss": -17.254880905151367, "global_step": 5361, "epoch": 64} {"train_loss": -16.879390716552734, "global_step": 5362, "epoch": 64} {"train_loss": -16.494924545288086, "global_step": 5363, "epoch": 64} {"train_loss": -17.103389739990234, "global_step": 5364, "epoch": 64} {"train_loss": -16.815624237060547, "global_step": 5365, "epoch": 64} {"train_loss": -17.069049835205078, "global_step": 5366, "epoch": 64} {"train_loss": -17.087671279907227, "global_step": 5367, "epoch": 64} {"train_loss": -16.824352264404297, "global_step": 5368, "epoch": 64} {"train_loss": -16.767438888549805, "global_step": 5369, "epoch": 64} {"train_loss": -16.843280792236328, "global_step": 5370, "epoch": 64} {"train_loss": -17.05327606201172, "global_step": 5371, "epoch": 64} {"train_loss": -17.22334098815918, "global_step": 5372, "epoch": 64} {"train_loss": -17.0522518157959, "global_step": 5373, "epoch": 64} {"train_loss": -16.861967086791992, "global_step": 5374, "epoch": 64} {"train_loss": -16.705808639526367, "global_step": 5375, "epoch": 64} {"train_loss": -17.53972053527832, "global_step": 5376, "epoch": 64} {"train_loss": -17.3075008392334, "global_step": 5377, "epoch": 64} {"train_loss": -16.939308166503906, "global_step": 5378, "epoch": 64} {"train_loss": -16.73273468017578, "global_step": 5379, "epoch": 64} {"train_loss": -16.845163345336914, "global_step": 5380, "epoch": 64} {"train_loss": -17.1186580657959, "global_step": 5381, "epoch": 64} {"train_loss": -16.86200523376465, "global_step": 5382, "epoch": 64} {"train_loss": -16.920425415039062, "global_step": 5383, "epoch": 64} {"train_loss": -17.194595336914062, "global_step": 5384, "epoch": 64} {"train_loss": -17.06598472595215, "global_step": 5385, "epoch": 64} {"train_loss": -16.947193145751953, "global_step": 5386, "epoch": 64} {"train_loss": -17.327816009521484, "global_step": 5387, "epoch": 64} {"train_loss": -16.776365280151367, "global_step": 5388, "epoch": 64} {"train_loss": -17.414743423461914, "global_step": 5389, "epoch": 64} {"train_loss": -16.81199073791504, "global_step": 5390, "epoch": 64} {"train_loss": -16.85761070251465, "global_step": 5391, "epoch": 64} {"train_loss": -17.219070434570312, "global_step": 5392, "epoch": 64} {"train_loss": -17.08194923400879, "global_step": 5393, "epoch": 64} {"train_loss": -16.961791348744587, "global_step": 5394, "epoch": 64, "val_loss": 6538876.0} {"train_loss": -16.85861587524414, "global_step": 5395, "epoch": 65} {"train_loss": -16.981910705566406, "global_step": 5396, "epoch": 65} {"train_loss": -17.144411087036133, "global_step": 5397, "epoch": 65} {"train_loss": -16.91134262084961, "global_step": 5398, "epoch": 65} {"train_loss": -16.95354652404785, "global_step": 5399, "epoch": 65} {"train_loss": -16.795286178588867, "global_step": 5400, "epoch": 65} {"train_loss": -16.694488525390625, "global_step": 5401, "epoch": 65} {"train_loss": -16.99742889404297, "global_step": 5402, "epoch": 65} {"train_loss": -17.366687774658203, "global_step": 5403, "epoch": 65} {"train_loss": -17.380178451538086, "global_step": 5404, "epoch": 65} {"train_loss": -16.910255432128906, "global_step": 5405, "epoch": 65} {"train_loss": -17.059240341186523, "global_step": 5406, "epoch": 65} {"train_loss": -17.015371322631836, "global_step": 5407, "epoch": 65} {"train_loss": -16.91952896118164, "global_step": 5408, "epoch": 65} {"train_loss": -17.005464553833008, "global_step": 5409, "epoch": 65} {"train_loss": -16.98079490661621, "global_step": 5410, "epoch": 65} {"train_loss": -17.055103302001953, "global_step": 5411, "epoch": 65} {"train_loss": -16.815759658813477, "global_step": 5412, "epoch": 65} {"train_loss": -16.801847457885742, "global_step": 5413, "epoch": 65} {"train_loss": -16.826208114624023, "global_step": 5414, "epoch": 65} {"train_loss": -16.656023025512695, "global_step": 5415, "epoch": 65} {"train_loss": -16.734577178955078, "global_step": 5416, "epoch": 65} {"train_loss": -17.019346237182617, "global_step": 5417, "epoch": 65} {"train_loss": -16.990585327148438, "global_step": 5418, "epoch": 65} {"train_loss": -17.21482276916504, "global_step": 5419, "epoch": 65} {"train_loss": -16.740861892700195, "global_step": 5420, "epoch": 65} {"train_loss": -16.937870025634766, "global_step": 5421, "epoch": 65} {"train_loss": -16.901935577392578, "global_step": 5422, "epoch": 65} {"train_loss": -17.18907356262207, "global_step": 5423, "epoch": 65} {"train_loss": -16.845491409301758, "global_step": 5424, "epoch": 65} {"train_loss": -16.863859176635742, "global_step": 5425, "epoch": 65} {"train_loss": -17.023723602294922, "global_step": 5426, "epoch": 65} {"train_loss": -16.855070114135742, "global_step": 5427, "epoch": 65} {"train_loss": -17.049745559692383, "global_step": 5428, "epoch": 65} {"train_loss": -16.821382522583008, "global_step": 5429, "epoch": 65} {"train_loss": -16.68044090270996, "global_step": 5430, "epoch": 65} {"train_loss": -17.241897583007812, "global_step": 5431, "epoch": 65} {"train_loss": -16.926904678344727, "global_step": 5432, "epoch": 65} {"train_loss": -17.457748413085938, "global_step": 5433, "epoch": 65} {"train_loss": -17.17360496520996, "global_step": 5434, "epoch": 65} {"train_loss": -16.97870445251465, "global_step": 5435, "epoch": 65} {"train_loss": -17.076358795166016, "global_step": 5436, "epoch": 65} {"train_loss": -16.90163230895996, "global_step": 5437, "epoch": 65} {"train_loss": -16.9188175201416, "global_step": 5438, "epoch": 65} {"train_loss": -16.62648582458496, "global_step": 5439, "epoch": 65} {"train_loss": -17.006526947021484, "global_step": 5440, "epoch": 65} {"train_loss": -17.37691307067871, "global_step": 5441, "epoch": 65} {"train_loss": -16.644662857055664, "global_step": 5442, "epoch": 65} {"train_loss": -16.722021102905273, "global_step": 5443, "epoch": 65} {"train_loss": -16.80893325805664, "global_step": 5444, "epoch": 65} {"train_loss": -17.229633331298828, "global_step": 5445, "epoch": 65} {"train_loss": -16.44359588623047, "global_step": 5446, "epoch": 65} {"train_loss": -16.92514419555664, "global_step": 5447, "epoch": 65} {"train_loss": -17.18971061706543, "global_step": 5448, "epoch": 65} {"train_loss": -16.84910011291504, "global_step": 5449, "epoch": 65} {"train_loss": -17.00946617126465, "global_step": 5450, "epoch": 65} {"train_loss": -16.855958938598633, "global_step": 5451, "epoch": 65} {"train_loss": -16.8485107421875, "global_step": 5452, "epoch": 65} {"train_loss": -17.129270553588867, "global_step": 5453, "epoch": 65} {"train_loss": -17.00872230529785, "global_step": 5454, "epoch": 65} {"train_loss": -16.793054580688477, "global_step": 5455, "epoch": 65} {"train_loss": -16.968414306640625, "global_step": 5456, "epoch": 65} {"train_loss": -16.956541061401367, "global_step": 5457, "epoch": 65} {"train_loss": -16.901737213134766, "global_step": 5458, "epoch": 65} {"train_loss": -17.067153930664062, "global_step": 5459, "epoch": 65} {"train_loss": -17.199583053588867, "global_step": 5460, "epoch": 65} {"train_loss": -16.637868881225586, "global_step": 5461, "epoch": 65} {"train_loss": -16.917524337768555, "global_step": 5462, "epoch": 65} {"train_loss": -17.166528701782227, "global_step": 5463, "epoch": 65} {"train_loss": -17.089937210083008, "global_step": 5464, "epoch": 65} {"train_loss": -17.011520385742188, "global_step": 5465, "epoch": 65} {"train_loss": -17.138036727905273, "global_step": 5466, "epoch": 65} {"train_loss": -16.825550079345703, "global_step": 5467, "epoch": 65} {"train_loss": -17.032302856445312, "global_step": 5468, "epoch": 65} {"train_loss": -17.254770278930664, "global_step": 5469, "epoch": 65} {"train_loss": -17.10359001159668, "global_step": 5470, "epoch": 65} {"train_loss": -16.93790626525879, "global_step": 5471, "epoch": 65} {"train_loss": -17.51633644104004, "global_step": 5472, "epoch": 65} {"train_loss": -17.1023006439209, "global_step": 5473, "epoch": 65} {"train_loss": -17.281957626342773, "global_step": 5474, "epoch": 65} {"train_loss": -16.924612045288086, "global_step": 5475, "epoch": 65} {"train_loss": -17.386381149291992, "global_step": 5476, "epoch": 65} {"train_loss": -16.986308155289617, "global_step": 5477, "epoch": 65, "val_loss": 6621742.0} {"train_loss": -16.90951156616211, "global_step": 5478, "epoch": 66} {"train_loss": -16.4410457611084, "global_step": 5479, "epoch": 66} {"train_loss": -16.760374069213867, "global_step": 5480, "epoch": 66} {"train_loss": -16.703540802001953, "global_step": 5481, "epoch": 66} {"train_loss": -16.794109344482422, "global_step": 5482, "epoch": 66} {"train_loss": -16.452571868896484, "global_step": 5483, "epoch": 66} {"train_loss": -16.664236068725586, "global_step": 5484, "epoch": 66} {"train_loss": -16.941303253173828, "global_step": 5485, "epoch": 66} {"train_loss": -17.070514678955078, "global_step": 5486, "epoch": 66} {"train_loss": -16.852325439453125, "global_step": 5487, "epoch": 66} {"train_loss": -16.740121841430664, "global_step": 5488, "epoch": 66} {"train_loss": -16.905725479125977, "global_step": 5489, "epoch": 66} {"train_loss": -16.7856502532959, "global_step": 5490, "epoch": 66} {"train_loss": -16.552154541015625, "global_step": 5491, "epoch": 66} {"train_loss": -16.78375244140625, "global_step": 5492, "epoch": 66} {"train_loss": -16.85481071472168, "global_step": 5493, "epoch": 66} {"train_loss": -16.915393829345703, "global_step": 5494, "epoch": 66} {"train_loss": -16.96571922302246, "global_step": 5495, "epoch": 66} {"train_loss": -16.469099044799805, "global_step": 5496, "epoch": 66} {"train_loss": -17.0142879486084, "global_step": 5497, "epoch": 66} {"train_loss": -16.8591251373291, "global_step": 5498, "epoch": 66} {"train_loss": -17.008825302124023, "global_step": 5499, "epoch": 66} {"train_loss": -16.75136375427246, "global_step": 5500, "epoch": 66} {"train_loss": -16.914758682250977, "global_step": 5501, "epoch": 66} {"train_loss": -16.8076114654541, "global_step": 5502, "epoch": 66} {"train_loss": -16.801122665405273, "global_step": 5503, "epoch": 66} {"train_loss": -16.84174156188965, "global_step": 5504, "epoch": 66} {"train_loss": -16.542097091674805, "global_step": 5505, "epoch": 66} {"train_loss": -16.937509536743164, "global_step": 5506, "epoch": 66} {"train_loss": -16.601022720336914, "global_step": 5507, "epoch": 66} {"train_loss": -17.27570915222168, "global_step": 5508, "epoch": 66} {"train_loss": -16.51392936706543, "global_step": 5509, "epoch": 66} {"train_loss": -16.92892837524414, "global_step": 5510, "epoch": 66} {"train_loss": -16.426006317138672, "global_step": 5511, "epoch": 66} {"train_loss": -16.82474708557129, "global_step": 5512, "epoch": 66} {"train_loss": -16.737728118896484, "global_step": 5513, "epoch": 66} {"train_loss": -17.20906639099121, "global_step": 5514, "epoch": 66} {"train_loss": -16.814355850219727, "global_step": 5515, "epoch": 66} {"train_loss": -16.893386840820312, "global_step": 5516, "epoch": 66} {"train_loss": -16.966716766357422, "global_step": 5517, "epoch": 66} {"train_loss": -17.013484954833984, "global_step": 5518, "epoch": 66} {"train_loss": -16.49531364440918, "global_step": 5519, "epoch": 66} {"train_loss": -16.699487686157227, "global_step": 5520, "epoch": 66} {"train_loss": -16.600540161132812, "global_step": 5521, "epoch": 66} {"train_loss": -17.069896697998047, "global_step": 5522, "epoch": 66} {"train_loss": -16.659231185913086, "global_step": 5523, "epoch": 66} {"train_loss": -16.523462295532227, "global_step": 5524, "epoch": 66} {"train_loss": -16.744352340698242, "global_step": 5525, "epoch": 66} {"train_loss": -16.6075382232666, "global_step": 5526, "epoch": 66} {"train_loss": -16.591894149780273, "global_step": 5527, "epoch": 66} {"train_loss": -17.250036239624023, "global_step": 5528, "epoch": 66} {"train_loss": -17.046859741210938, "global_step": 5529, "epoch": 66} {"train_loss": -16.835744857788086, "global_step": 5530, "epoch": 66} {"train_loss": -17.1182918548584, "global_step": 5531, "epoch": 66} {"train_loss": -16.813289642333984, "global_step": 5532, "epoch": 66} {"train_loss": -16.90877342224121, "global_step": 5533, "epoch": 66} {"train_loss": -16.714017868041992, "global_step": 5534, "epoch": 66} {"train_loss": -16.788908004760742, "global_step": 5535, "epoch": 66} {"train_loss": -17.395009994506836, "global_step": 5536, "epoch": 66} {"train_loss": -17.132394790649414, "global_step": 5537, "epoch": 66} {"train_loss": -16.608936309814453, "global_step": 5538, "epoch": 66} {"train_loss": -16.907819747924805, "global_step": 5539, "epoch": 66} {"train_loss": -17.16489028930664, "global_step": 5540, "epoch": 66} {"train_loss": -16.65450668334961, "global_step": 5541, "epoch": 66} {"train_loss": -16.781736373901367, "global_step": 5542, "epoch": 66} {"train_loss": -16.73056983947754, "global_step": 5543, "epoch": 66} {"train_loss": -17.162551879882812, "global_step": 5544, "epoch": 66} {"train_loss": -16.590524673461914, "global_step": 5545, "epoch": 66} {"train_loss": -17.12660789489746, "global_step": 5546, "epoch": 66} {"train_loss": -16.894943237304688, "global_step": 5547, "epoch": 66} {"train_loss": -17.123279571533203, "global_step": 5548, "epoch": 66} {"train_loss": -16.85731315612793, "global_step": 5549, "epoch": 66} {"train_loss": -16.789039611816406, "global_step": 5550, "epoch": 66} {"train_loss": -16.84331703186035, "global_step": 5551, "epoch": 66} {"train_loss": -16.995946884155273, "global_step": 5552, "epoch": 66} {"train_loss": -16.780500411987305, "global_step": 5553, "epoch": 66} {"train_loss": -16.677640914916992, "global_step": 5554, "epoch": 66} {"train_loss": -16.75142478942871, "global_step": 5555, "epoch": 66} {"train_loss": -16.920364379882812, "global_step": 5556, "epoch": 66} {"train_loss": -17.016088485717773, "global_step": 5557, "epoch": 66} {"train_loss": -16.974430084228516, "global_step": 5558, "epoch": 66} {"train_loss": -16.7734375, "global_step": 5559, "epoch": 66} {"train_loss": -16.84475813716291, "global_step": 5560, "epoch": 66, "val_loss": 6541549.0} {"train_loss": -16.440832138061523, "global_step": 5561, "epoch": 67} {"train_loss": -16.654743194580078, "global_step": 5562, "epoch": 67} {"train_loss": -16.241586685180664, "global_step": 5563, "epoch": 67} {"train_loss": -16.56626319885254, "global_step": 5564, "epoch": 67} {"train_loss": -16.36141014099121, "global_step": 5565, "epoch": 67} {"train_loss": -16.316492080688477, "global_step": 5566, "epoch": 67} {"train_loss": -16.07245445251465, "global_step": 5567, "epoch": 67} {"train_loss": -16.792505264282227, "global_step": 5568, "epoch": 67} {"train_loss": -16.096275329589844, "global_step": 5569, "epoch": 67} {"train_loss": -16.08560562133789, "global_step": 5570, "epoch": 67} {"train_loss": -16.53492546081543, "global_step": 5571, "epoch": 67} {"train_loss": -16.815200805664062, "global_step": 5572, "epoch": 67} {"train_loss": -16.501523971557617, "global_step": 5573, "epoch": 67} {"train_loss": -16.617504119873047, "global_step": 5574, "epoch": 67} {"train_loss": -17.044635772705078, "global_step": 5575, "epoch": 67} {"train_loss": -16.781930923461914, "global_step": 5576, "epoch": 67} {"train_loss": -16.71953582763672, "global_step": 5577, "epoch": 67} {"train_loss": -16.47228240966797, "global_step": 5578, "epoch": 67} {"train_loss": -17.024511337280273, "global_step": 5579, "epoch": 67} {"train_loss": -16.702970504760742, "global_step": 5580, "epoch": 67} {"train_loss": -16.047574996948242, "global_step": 5581, "epoch": 67} {"train_loss": -16.67067527770996, "global_step": 5582, "epoch": 67} {"train_loss": -16.504505157470703, "global_step": 5583, "epoch": 67} {"train_loss": -16.441116333007812, "global_step": 5584, "epoch": 67} {"train_loss": -16.65894889831543, "global_step": 5585, "epoch": 67} {"train_loss": -17.064929962158203, "global_step": 5586, "epoch": 67} {"train_loss": -16.746143341064453, "global_step": 5587, "epoch": 67} {"train_loss": -16.598684310913086, "global_step": 5588, "epoch": 67} {"train_loss": -16.43538475036621, "global_step": 5589, "epoch": 67} {"train_loss": -16.894065856933594, "global_step": 5590, "epoch": 67} {"train_loss": -17.013261795043945, "global_step": 5591, "epoch": 67} {"train_loss": -16.522592544555664, "global_step": 5592, "epoch": 67} {"train_loss": -16.831857681274414, "global_step": 5593, "epoch": 67} {"train_loss": -16.55525779724121, "global_step": 5594, "epoch": 67} {"train_loss": -16.756616592407227, "global_step": 5595, "epoch": 67} {"train_loss": -16.53360366821289, "global_step": 5596, "epoch": 67} {"train_loss": -16.964414596557617, "global_step": 5597, "epoch": 67} {"train_loss": -16.644384384155273, "global_step": 5598, "epoch": 67} {"train_loss": -17.165849685668945, "global_step": 5599, "epoch": 67} {"train_loss": -16.6744441986084, "global_step": 5600, "epoch": 67} {"train_loss": -17.038522720336914, "global_step": 5601, "epoch": 67} {"train_loss": -16.717302322387695, "global_step": 5602, "epoch": 67} {"train_loss": -16.621353149414062, "global_step": 5603, "epoch": 67} {"train_loss": -16.69742202758789, "global_step": 5604, "epoch": 67} {"train_loss": -16.737354278564453, "global_step": 5605, "epoch": 67} {"train_loss": -17.1249942779541, "global_step": 5606, "epoch": 67} {"train_loss": -16.292125701904297, "global_step": 5607, "epoch": 67} {"train_loss": -16.85689353942871, "global_step": 5608, "epoch": 67} {"train_loss": -16.56915283203125, "global_step": 5609, "epoch": 67} {"train_loss": -16.83040428161621, "global_step": 5610, "epoch": 67} {"train_loss": -16.456531524658203, "global_step": 5611, "epoch": 67} {"train_loss": -17.039297103881836, "global_step": 5612, "epoch": 67} {"train_loss": -16.87025260925293, "global_step": 5613, "epoch": 67} {"train_loss": -16.509855270385742, "global_step": 5614, "epoch": 67} {"train_loss": -16.938085556030273, "global_step": 5615, "epoch": 67} {"train_loss": -17.155214309692383, "global_step": 5616, "epoch": 67} {"train_loss": -16.989444732666016, "global_step": 5617, "epoch": 67} {"train_loss": -17.032861709594727, "global_step": 5618, "epoch": 67} {"train_loss": -16.83715057373047, "global_step": 5619, "epoch": 67} {"train_loss": -16.913984298706055, "global_step": 5620, "epoch": 67} {"train_loss": -16.406259536743164, "global_step": 5621, "epoch": 67} {"train_loss": -16.944910049438477, "global_step": 5622, "epoch": 67} {"train_loss": -16.591157913208008, "global_step": 5623, "epoch": 67} {"train_loss": -17.0369930267334, "global_step": 5624, "epoch": 67} {"train_loss": -16.718442916870117, "global_step": 5625, "epoch": 67} {"train_loss": -17.321683883666992, "global_step": 5626, "epoch": 67} {"train_loss": -16.92873764038086, "global_step": 5627, "epoch": 67} {"train_loss": -16.713998794555664, "global_step": 5628, "epoch": 67} {"train_loss": -16.737186431884766, "global_step": 5629, "epoch": 67} {"train_loss": -16.69327735900879, "global_step": 5630, "epoch": 67} {"train_loss": -16.99967384338379, "global_step": 5631, "epoch": 67} {"train_loss": -16.61631202697754, "global_step": 5632, "epoch": 67} {"train_loss": -17.1165714263916, "global_step": 5633, "epoch": 67} {"train_loss": -16.753576278686523, "global_step": 5634, "epoch": 67} {"train_loss": -17.116130828857422, "global_step": 5635, "epoch": 67} {"train_loss": -16.7357177734375, "global_step": 5636, "epoch": 67} {"train_loss": -16.5848388671875, "global_step": 5637, "epoch": 67} {"train_loss": -16.765533447265625, "global_step": 5638, "epoch": 67} {"train_loss": -16.647933959960938, "global_step": 5639, "epoch": 67} {"train_loss": -16.696130752563477, "global_step": 5640, "epoch": 67} {"train_loss": -16.767709732055664, "global_step": 5641, "epoch": 67} {"train_loss": -16.894887924194336, "global_step": 5642, "epoch": 67} {"train_loss": -16.73299617077931, "global_step": 5643, "epoch": 67, "val_loss": 6713372.0} {"train_loss": -16.447433471679688, "global_step": 5644, "epoch": 68} {"train_loss": -16.711767196655273, "global_step": 5645, "epoch": 68} {"train_loss": -16.784833908081055, "global_step": 5646, "epoch": 68} {"train_loss": -16.617576599121094, "global_step": 5647, "epoch": 68} {"train_loss": -16.415735244750977, "global_step": 5648, "epoch": 68} {"train_loss": -16.91200065612793, "global_step": 5649, "epoch": 68} {"train_loss": -16.767797470092773, "global_step": 5650, "epoch": 68} {"train_loss": -16.981781005859375, "global_step": 5651, "epoch": 68} {"train_loss": -16.68983268737793, "global_step": 5652, "epoch": 68} {"train_loss": -17.06361961364746, "global_step": 5653, "epoch": 68} {"train_loss": -16.846160888671875, "global_step": 5654, "epoch": 68} {"train_loss": -16.8120174407959, "global_step": 5655, "epoch": 68} {"train_loss": -17.356781005859375, "global_step": 5656, "epoch": 68} {"train_loss": -16.77566909790039, "global_step": 5657, "epoch": 68} {"train_loss": -17.135318756103516, "global_step": 5658, "epoch": 68} {"train_loss": -16.92488670349121, "global_step": 5659, "epoch": 68} {"train_loss": -17.052518844604492, "global_step": 5660, "epoch": 68} {"train_loss": -17.096832275390625, "global_step": 5661, "epoch": 68} {"train_loss": -17.09178352355957, "global_step": 5662, "epoch": 68} {"train_loss": -16.825387954711914, "global_step": 5663, "epoch": 68} {"train_loss": -16.628019332885742, "global_step": 5664, "epoch": 68} {"train_loss": -16.794607162475586, "global_step": 5665, "epoch": 68} {"train_loss": -17.112770080566406, "global_step": 5666, "epoch": 68} {"train_loss": -16.44024658203125, "global_step": 5667, "epoch": 68} {"train_loss": -17.463239669799805, "global_step": 5668, "epoch": 68} {"train_loss": -17.090396881103516, "global_step": 5669, "epoch": 68} {"train_loss": -17.44886589050293, "global_step": 5670, "epoch": 68} {"train_loss": -16.78389549255371, "global_step": 5671, "epoch": 68} {"train_loss": -16.625200271606445, "global_step": 5672, "epoch": 68} {"train_loss": -17.057615280151367, "global_step": 5673, "epoch": 68} {"train_loss": -16.924943923950195, "global_step": 5674, "epoch": 68} {"train_loss": -16.347753524780273, "global_step": 5675, "epoch": 68} {"train_loss": -17.0274600982666, "global_step": 5676, "epoch": 68} {"train_loss": -17.196853637695312, "global_step": 5677, "epoch": 68} {"train_loss": -16.85144805908203, "global_step": 5678, "epoch": 68} {"train_loss": -16.702768325805664, "global_step": 5679, "epoch": 68} {"train_loss": -16.852127075195312, "global_step": 5680, "epoch": 68} {"train_loss": -16.91973114013672, "global_step": 5681, "epoch": 68} {"train_loss": -17.00040626525879, "global_step": 5682, "epoch": 68} {"train_loss": -16.913427352905273, "global_step": 5683, "epoch": 68} {"train_loss": -16.920995712280273, "global_step": 5684, "epoch": 68} {"train_loss": -16.854764938354492, "global_step": 5685, "epoch": 68} {"train_loss": -16.801794052124023, "global_step": 5686, "epoch": 68} {"train_loss": -16.733539581298828, "global_step": 5687, "epoch": 68} {"train_loss": -16.723140716552734, "global_step": 5688, "epoch": 68} {"train_loss": -16.8546199798584, "global_step": 5689, "epoch": 68} {"train_loss": -16.8088321685791, "global_step": 5690, "epoch": 68} {"train_loss": -16.86213493347168, "global_step": 5691, "epoch": 68} {"train_loss": -17.158525466918945, "global_step": 5692, "epoch": 68} {"train_loss": -16.980539321899414, "global_step": 5693, "epoch": 68} {"train_loss": -16.871139526367188, "global_step": 5694, "epoch": 68} {"train_loss": -16.733152389526367, "global_step": 5695, "epoch": 68} {"train_loss": -17.356027603149414, "global_step": 5696, "epoch": 68} {"train_loss": -17.111997604370117, "global_step": 5697, "epoch": 68} {"train_loss": -17.17763328552246, "global_step": 5698, "epoch": 68} {"train_loss": -16.72534942626953, "global_step": 5699, "epoch": 68} {"train_loss": -16.753671646118164, "global_step": 5700, "epoch": 68} {"train_loss": -16.986724853515625, "global_step": 5701, "epoch": 68} {"train_loss": -16.3656063079834, "global_step": 5702, "epoch": 68} {"train_loss": -17.142742156982422, "global_step": 5703, "epoch": 68} {"train_loss": -17.16656494140625, "global_step": 5704, "epoch": 68} {"train_loss": -17.108259201049805, "global_step": 5705, "epoch": 68} {"train_loss": -16.979936599731445, "global_step": 5706, "epoch": 68} {"train_loss": -17.241783142089844, "global_step": 5707, "epoch": 68} {"train_loss": -17.35965347290039, "global_step": 5708, "epoch": 68} {"train_loss": -17.096731185913086, "global_step": 5709, "epoch": 68} {"train_loss": -17.026100158691406, "global_step": 5710, "epoch": 68} {"train_loss": -17.111711502075195, "global_step": 5711, "epoch": 68} {"train_loss": -17.038156509399414, "global_step": 5712, "epoch": 68} {"train_loss": -16.908910751342773, "global_step": 5713, "epoch": 68} {"train_loss": -16.702054977416992, "global_step": 5714, "epoch": 68} {"train_loss": -16.802148818969727, "global_step": 5715, "epoch": 68} {"train_loss": -16.877704620361328, "global_step": 5716, "epoch": 68} {"train_loss": -16.875110626220703, "global_step": 5717, "epoch": 68} {"train_loss": -17.048871994018555, "global_step": 5718, "epoch": 68} {"train_loss": -17.34793472290039, "global_step": 5719, "epoch": 68} {"train_loss": -16.886701583862305, "global_step": 5720, "epoch": 68} {"train_loss": -17.1957950592041, "global_step": 5721, "epoch": 68} {"train_loss": -16.911794662475586, "global_step": 5722, "epoch": 68} {"train_loss": -16.93568992614746, "global_step": 5723, "epoch": 68} {"train_loss": -16.79863739013672, "global_step": 5724, "epoch": 68} {"train_loss": -17.253137588500977, "global_step": 5725, "epoch": 68} {"train_loss": -16.919340340487928, "global_step": 5726, "epoch": 68, "val_loss": 6607876.0} {"train_loss": -16.83540153503418, "global_step": 5727, "epoch": 69} {"train_loss": -16.780324935913086, "global_step": 5728, "epoch": 69} {"train_loss": -16.778841018676758, "global_step": 5729, "epoch": 69} {"train_loss": -16.772075653076172, "global_step": 5730, "epoch": 69} {"train_loss": -16.636676788330078, "global_step": 5731, "epoch": 69} {"train_loss": -16.807207107543945, "global_step": 5732, "epoch": 69} {"train_loss": -17.08745002746582, "global_step": 5733, "epoch": 69} {"train_loss": -16.757781982421875, "global_step": 5734, "epoch": 69} {"train_loss": -16.750202178955078, "global_step": 5735, "epoch": 69} {"train_loss": -17.204626083374023, "global_step": 5736, "epoch": 69} {"train_loss": -17.02296257019043, "global_step": 5737, "epoch": 69} {"train_loss": -17.283863067626953, "global_step": 5738, "epoch": 69} {"train_loss": -17.197477340698242, "global_step": 5739, "epoch": 69} {"train_loss": -17.0275936126709, "global_step": 5740, "epoch": 69} {"train_loss": -17.230274200439453, "global_step": 5741, "epoch": 69} {"train_loss": -17.16999626159668, "global_step": 5742, "epoch": 69} {"train_loss": -16.830808639526367, "global_step": 5743, "epoch": 69} {"train_loss": -17.215423583984375, "global_step": 5744, "epoch": 69} {"train_loss": -16.8960018157959, "global_step": 5745, "epoch": 69} {"train_loss": -17.23052406311035, "global_step": 5746, "epoch": 69} {"train_loss": -16.823904037475586, "global_step": 5747, "epoch": 69} {"train_loss": -17.397397994995117, "global_step": 5748, "epoch": 69} {"train_loss": -17.414325714111328, "global_step": 5749, "epoch": 69} {"train_loss": -16.964618682861328, "global_step": 5750, "epoch": 69} {"train_loss": -17.16666030883789, "global_step": 5751, "epoch": 69} {"train_loss": -16.571455001831055, "global_step": 5752, "epoch": 69} {"train_loss": -17.272502899169922, "global_step": 5753, "epoch": 69} {"train_loss": -17.377283096313477, "global_step": 5754, "epoch": 69} {"train_loss": -17.1889705657959, "global_step": 5755, "epoch": 69} {"train_loss": -16.78285789489746, "global_step": 5756, "epoch": 69} {"train_loss": -17.198415756225586, "global_step": 5757, "epoch": 69} {"train_loss": -17.239133834838867, "global_step": 5758, "epoch": 69} {"train_loss": -17.00538444519043, "global_step": 5759, "epoch": 69} {"train_loss": -16.614837646484375, "global_step": 5760, "epoch": 69} {"train_loss": -16.87067222595215, "global_step": 5761, "epoch": 69} {"train_loss": -17.081655502319336, "global_step": 5762, "epoch": 69} {"train_loss": -17.22006607055664, "global_step": 5763, "epoch": 69} {"train_loss": -17.205556869506836, "global_step": 5764, "epoch": 69} {"train_loss": -17.400772094726562, "global_step": 5765, "epoch": 69} {"train_loss": -17.178436279296875, "global_step": 5766, "epoch": 69} {"train_loss": -17.262983322143555, "global_step": 5767, "epoch": 69} {"train_loss": -16.910654067993164, "global_step": 5768, "epoch": 69} {"train_loss": -16.9368896484375, "global_step": 5769, "epoch": 69} {"train_loss": -17.122901916503906, "global_step": 5770, "epoch": 69} {"train_loss": -17.168310165405273, "global_step": 5771, "epoch": 69} {"train_loss": -16.9708251953125, "global_step": 5772, "epoch": 69} {"train_loss": -16.84876251220703, "global_step": 5773, "epoch": 69} {"train_loss": -16.95747947692871, "global_step": 5774, "epoch": 69} {"train_loss": -17.250852584838867, "global_step": 5775, "epoch": 69} {"train_loss": -17.2251033782959, "global_step": 5776, "epoch": 69} {"train_loss": -16.747461318969727, "global_step": 5777, "epoch": 69} {"train_loss": -17.10915184020996, "global_step": 5778, "epoch": 69} {"train_loss": -17.244062423706055, "global_step": 5779, "epoch": 69} {"train_loss": -17.0571231842041, "global_step": 5780, "epoch": 69} {"train_loss": -17.34847068786621, "global_step": 5781, "epoch": 69} {"train_loss": -17.402685165405273, "global_step": 5782, "epoch": 69} {"train_loss": -17.20817756652832, "global_step": 5783, "epoch": 69} {"train_loss": -16.87625503540039, "global_step": 5784, "epoch": 69} {"train_loss": -17.302085876464844, "global_step": 5785, "epoch": 69} {"train_loss": -16.992399215698242, "global_step": 5786, "epoch": 69} {"train_loss": -16.780637741088867, "global_step": 5787, "epoch": 69} {"train_loss": -17.02048683166504, "global_step": 5788, "epoch": 69} {"train_loss": -17.391860961914062, "global_step": 5789, "epoch": 69} {"train_loss": -17.2545108795166, "global_step": 5790, "epoch": 69} {"train_loss": -17.213438034057617, "global_step": 5791, "epoch": 69} {"train_loss": -17.039457321166992, "global_step": 5792, "epoch": 69} {"train_loss": -16.990201950073242, "global_step": 5793, "epoch": 69} {"train_loss": -16.985288619995117, "global_step": 5794, "epoch": 69} {"train_loss": -16.883108139038086, "global_step": 5795, "epoch": 69} {"train_loss": -17.317188262939453, "global_step": 5796, "epoch": 69} {"train_loss": -16.908231735229492, "global_step": 5797, "epoch": 69} {"train_loss": -17.013975143432617, "global_step": 5798, "epoch": 69} {"train_loss": -17.233295440673828, "global_step": 5799, "epoch": 69} {"train_loss": -17.243988037109375, "global_step": 5800, "epoch": 69} {"train_loss": -17.21703338623047, "global_step": 5801, "epoch": 69} {"train_loss": -16.834075927734375, "global_step": 5802, "epoch": 69} {"train_loss": -16.68861198425293, "global_step": 5803, "epoch": 69} {"train_loss": -17.23537826538086, "global_step": 5804, "epoch": 69} {"train_loss": -17.026126861572266, "global_step": 5805, "epoch": 69} {"train_loss": -17.05633544921875, "global_step": 5806, "epoch": 69} {"train_loss": -16.816274642944336, "global_step": 5807, "epoch": 69} {"train_loss": -17.343706130981445, "global_step": 5808, "epoch": 69} {"train_loss": -17.062346332044488, "global_step": 5809, "epoch": 69, "val_loss": 6486750.0} {"train_loss": -16.75745391845703, "global_step": 5810, "epoch": 70} {"train_loss": -16.526988983154297, "global_step": 5811, "epoch": 70} {"train_loss": -16.994834899902344, "global_step": 5812, "epoch": 70} {"train_loss": -16.88155174255371, "global_step": 5813, "epoch": 70} {"train_loss": -17.087800979614258, "global_step": 5814, "epoch": 70} {"train_loss": -16.612998962402344, "global_step": 5815, "epoch": 70} {"train_loss": -16.884109497070312, "global_step": 5816, "epoch": 70} {"train_loss": -17.49750328063965, "global_step": 5817, "epoch": 70} {"train_loss": -17.097318649291992, "global_step": 5818, "epoch": 70} {"train_loss": -16.94733238220215, "global_step": 5819, "epoch": 70} {"train_loss": -16.817365646362305, "global_step": 5820, "epoch": 70} {"train_loss": -17.109634399414062, "global_step": 5821, "epoch": 70} {"train_loss": -16.725101470947266, "global_step": 5822, "epoch": 70} {"train_loss": -17.177949905395508, "global_step": 5823, "epoch": 70} {"train_loss": -17.243091583251953, "global_step": 5824, "epoch": 70} {"train_loss": -17.3273983001709, "global_step": 5825, "epoch": 70} {"train_loss": -17.05023956298828, "global_step": 5826, "epoch": 70} {"train_loss": -16.776885986328125, "global_step": 5827, "epoch": 70} {"train_loss": -17.344547271728516, "global_step": 5828, "epoch": 70} {"train_loss": -17.12007713317871, "global_step": 5829, "epoch": 70} {"train_loss": -16.97501564025879, "global_step": 5830, "epoch": 70} {"train_loss": -17.205467224121094, "global_step": 5831, "epoch": 70} {"train_loss": -17.15296745300293, "global_step": 5832, "epoch": 70} {"train_loss": -17.174253463745117, "global_step": 5833, "epoch": 70} {"train_loss": -17.221481323242188, "global_step": 5834, "epoch": 70} {"train_loss": -17.28362464904785, "global_step": 5835, "epoch": 70} {"train_loss": -17.327205657958984, "global_step": 5836, "epoch": 70} {"train_loss": -17.316789627075195, "global_step": 5837, "epoch": 70} {"train_loss": -16.983003616333008, "global_step": 5838, "epoch": 70} {"train_loss": -17.09663963317871, "global_step": 5839, "epoch": 70} {"train_loss": -17.08405113220215, "global_step": 5840, "epoch": 70} {"train_loss": -17.366077423095703, "global_step": 5841, "epoch": 70} {"train_loss": -17.082965850830078, "global_step": 5842, "epoch": 70} {"train_loss": -17.06328582763672, "global_step": 5843, "epoch": 70} {"train_loss": -16.890981674194336, "global_step": 5844, "epoch": 70} {"train_loss": -16.802692413330078, "global_step": 5845, "epoch": 70} {"train_loss": -17.158599853515625, "global_step": 5846, "epoch": 70} {"train_loss": -17.135082244873047, "global_step": 5847, "epoch": 70} {"train_loss": -17.16318702697754, "global_step": 5848, "epoch": 70} {"train_loss": -16.83338737487793, "global_step": 5849, "epoch": 70} {"train_loss": -16.811201095581055, "global_step": 5850, "epoch": 70} {"train_loss": -17.23356056213379, "global_step": 5851, "epoch": 70} {"train_loss": -17.068479537963867, "global_step": 5852, "epoch": 70} {"train_loss": -17.30063247680664, "global_step": 5853, "epoch": 70} {"train_loss": -17.19281578063965, "global_step": 5854, "epoch": 70} {"train_loss": -17.284358978271484, "global_step": 5855, "epoch": 70} {"train_loss": -17.300241470336914, "global_step": 5856, "epoch": 70} {"train_loss": -17.31747817993164, "global_step": 5857, "epoch": 70} {"train_loss": -16.97079849243164, "global_step": 5858, "epoch": 70} {"train_loss": -17.040781021118164, "global_step": 5859, "epoch": 70} {"train_loss": -17.01656150817871, "global_step": 5860, "epoch": 70} {"train_loss": -17.4342041015625, "global_step": 5861, "epoch": 70} {"train_loss": -17.22601890563965, "global_step": 5862, "epoch": 70} {"train_loss": -17.199338912963867, "global_step": 5863, "epoch": 70} {"train_loss": -17.074506759643555, "global_step": 5864, "epoch": 70} {"train_loss": -17.23233985900879, "global_step": 5865, "epoch": 70} {"train_loss": -17.019765853881836, "global_step": 5866, "epoch": 70} {"train_loss": -17.386661529541016, "global_step": 5867, "epoch": 70} {"train_loss": -16.766904830932617, "global_step": 5868, "epoch": 70} {"train_loss": -16.633535385131836, "global_step": 5869, "epoch": 70} {"train_loss": -17.21636199951172, "global_step": 5870, "epoch": 70} {"train_loss": -17.252134323120117, "global_step": 5871, "epoch": 70} {"train_loss": -17.068592071533203, "global_step": 5872, "epoch": 70} {"train_loss": -17.475370407104492, "global_step": 5873, "epoch": 70} {"train_loss": -16.90279197692871, "global_step": 5874, "epoch": 70} {"train_loss": -16.979795455932617, "global_step": 5875, "epoch": 70} {"train_loss": -17.025426864624023, "global_step": 5876, "epoch": 70} {"train_loss": -17.405454635620117, "global_step": 5877, "epoch": 70} {"train_loss": -16.9936466217041, "global_step": 5878, "epoch": 70} {"train_loss": -17.12787437438965, "global_step": 5879, "epoch": 70} {"train_loss": -16.88731575012207, "global_step": 5880, "epoch": 70} {"train_loss": -17.400650024414062, "global_step": 5881, "epoch": 70} {"train_loss": -16.77664566040039, "global_step": 5882, "epoch": 70} {"train_loss": -17.168622970581055, "global_step": 5883, "epoch": 70} {"train_loss": -17.1312198638916, "global_step": 5884, "epoch": 70} {"train_loss": -17.330764770507812, "global_step": 5885, "epoch": 70} {"train_loss": -17.077722549438477, "global_step": 5886, "epoch": 70} {"train_loss": -17.021833419799805, "global_step": 5887, "epoch": 70} {"train_loss": -17.623844146728516, "global_step": 5888, "epoch": 70} {"train_loss": -17.466964721679688, "global_step": 5889, "epoch": 70} {"train_loss": -17.320844650268555, "global_step": 5890, "epoch": 70} {"train_loss": -17.12742042541504, "global_step": 5891, "epoch": 70} {"train_loss": -17.120307945343384, "global_step": 5892, "epoch": 70, "val_loss": 6488259.0} {"train_loss": -16.672576904296875, "global_step": 5893, "epoch": 71} {"train_loss": -16.572559356689453, "global_step": 5894, "epoch": 71} {"train_loss": -17.046905517578125, "global_step": 5895, "epoch": 71} {"train_loss": -17.065616607666016, "global_step": 5896, "epoch": 71} {"train_loss": -16.671796798706055, "global_step": 5897, "epoch": 71} {"train_loss": -16.79286003112793, "global_step": 5898, "epoch": 71} {"train_loss": -16.56376838684082, "global_step": 5899, "epoch": 71} {"train_loss": -16.577985763549805, "global_step": 5900, "epoch": 71} {"train_loss": -16.68890953063965, "global_step": 5901, "epoch": 71} {"train_loss": -17.11366081237793, "global_step": 5902, "epoch": 71} {"train_loss": -16.609766006469727, "global_step": 5903, "epoch": 71} {"train_loss": -17.17353630065918, "global_step": 5904, "epoch": 71} {"train_loss": -16.410932540893555, "global_step": 5905, "epoch": 71} {"train_loss": -17.312341690063477, "global_step": 5906, "epoch": 71} {"train_loss": -16.611326217651367, "global_step": 5907, "epoch": 71} {"train_loss": -17.0778865814209, "global_step": 5908, "epoch": 71} {"train_loss": -16.623077392578125, "global_step": 5909, "epoch": 71} {"train_loss": -17.13904571533203, "global_step": 5910, "epoch": 71} {"train_loss": -16.612991333007812, "global_step": 5911, "epoch": 71} {"train_loss": -16.7786922454834, "global_step": 5912, "epoch": 71} {"train_loss": -16.51318359375, "global_step": 5913, "epoch": 71} {"train_loss": -16.699819564819336, "global_step": 5914, "epoch": 71} {"train_loss": -16.91040802001953, "global_step": 5915, "epoch": 71} {"train_loss": -16.348066329956055, "global_step": 5916, "epoch": 71} {"train_loss": -16.807947158813477, "global_step": 5917, "epoch": 71} {"train_loss": -16.689451217651367, "global_step": 5918, "epoch": 71} {"train_loss": -17.167402267456055, "global_step": 5919, "epoch": 71} {"train_loss": -16.70368766784668, "global_step": 5920, "epoch": 71} {"train_loss": -16.529783248901367, "global_step": 5921, "epoch": 71} {"train_loss": -16.967960357666016, "global_step": 5922, "epoch": 71} {"train_loss": -17.197378158569336, "global_step": 5923, "epoch": 71} {"train_loss": -16.933639526367188, "global_step": 5924, "epoch": 71} {"train_loss": -16.8339900970459, "global_step": 5925, "epoch": 71} {"train_loss": -16.998228073120117, "global_step": 5926, "epoch": 71} {"train_loss": -17.151264190673828, "global_step": 5927, "epoch": 71} {"train_loss": -16.897140502929688, "global_step": 5928, "epoch": 71} {"train_loss": -16.97698402404785, "global_step": 5929, "epoch": 71} {"train_loss": -16.762611389160156, "global_step": 5930, "epoch": 71} {"train_loss": -16.913511276245117, "global_step": 5931, "epoch": 71} {"train_loss": -17.245925903320312, "global_step": 5932, "epoch": 71} {"train_loss": -16.909330368041992, "global_step": 5933, "epoch": 71} {"train_loss": -16.83327865600586, "global_step": 5934, "epoch": 71} {"train_loss": -16.586740493774414, "global_step": 5935, "epoch": 71} {"train_loss": -16.584075927734375, "global_step": 5936, "epoch": 71} {"train_loss": -16.82213592529297, "global_step": 5937, "epoch": 71} {"train_loss": -16.7558650970459, "global_step": 5938, "epoch": 71} {"train_loss": -17.10057830810547, "global_step": 5939, "epoch": 71} {"train_loss": -16.944107055664062, "global_step": 5940, "epoch": 71} {"train_loss": -17.095355987548828, "global_step": 5941, "epoch": 71} {"train_loss": -16.755752563476562, "global_step": 5942, "epoch": 71} {"train_loss": -16.936080932617188, "global_step": 5943, "epoch": 71} {"train_loss": -16.64432716369629, "global_step": 5944, "epoch": 71} {"train_loss": -16.905532836914062, "global_step": 5945, "epoch": 71} {"train_loss": -16.560237884521484, "global_step": 5946, "epoch": 71} {"train_loss": -16.71826934814453, "global_step": 5947, "epoch": 71} {"train_loss": -16.86013412475586, "global_step": 5948, "epoch": 71} {"train_loss": -17.04911231994629, "global_step": 5949, "epoch": 71} {"train_loss": -17.309677124023438, "global_step": 5950, "epoch": 71} {"train_loss": -16.81975555419922, "global_step": 5951, "epoch": 71} {"train_loss": -16.38667106628418, "global_step": 5952, "epoch": 71} {"train_loss": -16.45992660522461, "global_step": 5953, "epoch": 71} {"train_loss": -16.956769943237305, "global_step": 5954, "epoch": 71} {"train_loss": -16.75007438659668, "global_step": 5955, "epoch": 71} {"train_loss": -17.023456573486328, "global_step": 5956, "epoch": 71} {"train_loss": -16.958362579345703, "global_step": 5957, "epoch": 71} {"train_loss": -17.131179809570312, "global_step": 5958, "epoch": 71} {"train_loss": -17.1020450592041, "global_step": 5959, "epoch": 71} {"train_loss": -17.15528106689453, "global_step": 5960, "epoch": 71} {"train_loss": -17.161958694458008, "global_step": 5961, "epoch": 71} {"train_loss": -17.251733779907227, "global_step": 5962, "epoch": 71} {"train_loss": -16.88016128540039, "global_step": 5963, "epoch": 71} {"train_loss": -17.240036010742188, "global_step": 5964, "epoch": 71} {"train_loss": -16.938440322875977, "global_step": 5965, "epoch": 71} {"train_loss": -17.058639526367188, "global_step": 5966, "epoch": 71} {"train_loss": -16.75204849243164, "global_step": 5967, "epoch": 71} {"train_loss": -17.05446434020996, "global_step": 5968, "epoch": 71} {"train_loss": -16.665224075317383, "global_step": 5969, "epoch": 71} {"train_loss": -17.1799259185791, "global_step": 5970, "epoch": 71} {"train_loss": -17.042068481445312, "global_step": 5971, "epoch": 71} {"train_loss": -16.966405868530273, "global_step": 5972, "epoch": 71} {"train_loss": -16.68773651123047, "global_step": 5973, "epoch": 71} {"train_loss": -16.797164916992188, "global_step": 5974, "epoch": 71} {"train_loss": -16.86699791414192, "global_step": 5975, "epoch": 71, "val_loss": 6666205.0} {"train_loss": -16.647851943969727, "global_step": 5976, "epoch": 72} {"train_loss": -17.026329040527344, "global_step": 5977, "epoch": 72} {"train_loss": -16.885295867919922, "global_step": 5978, "epoch": 72} {"train_loss": -16.733083724975586, "global_step": 5979, "epoch": 72} {"train_loss": -16.955198287963867, "global_step": 5980, "epoch": 72} {"train_loss": -16.385343551635742, "global_step": 5981, "epoch": 72} {"train_loss": -16.962446212768555, "global_step": 5982, "epoch": 72} {"train_loss": -16.714468002319336, "global_step": 5983, "epoch": 72} {"train_loss": -16.53169822692871, "global_step": 5984, "epoch": 72} {"train_loss": -17.11457633972168, "global_step": 5985, "epoch": 72} {"train_loss": -16.765735626220703, "global_step": 5986, "epoch": 72} {"train_loss": -16.7731990814209, "global_step": 5987, "epoch": 72} {"train_loss": -17.032718658447266, "global_step": 5988, "epoch": 72} {"train_loss": -16.97413444519043, "global_step": 5989, "epoch": 72} {"train_loss": -16.927831649780273, "global_step": 5990, "epoch": 72} {"train_loss": -16.909452438354492, "global_step": 5991, "epoch": 72} {"train_loss": -16.79422378540039, "global_step": 5992, "epoch": 72} {"train_loss": -17.174575805664062, "global_step": 5993, "epoch": 72} {"train_loss": -17.32743263244629, "global_step": 5994, "epoch": 72} {"train_loss": -16.93100357055664, "global_step": 5995, "epoch": 72} {"train_loss": -17.339801788330078, "global_step": 5996, "epoch": 72} {"train_loss": -17.280136108398438, "global_step": 5997, "epoch": 72} {"train_loss": -17.124011993408203, "global_step": 5998, "epoch": 72} {"train_loss": -16.823081970214844, "global_step": 5999, "epoch": 72} {"train_loss": -17.046876907348633, "global_step": 6000, "epoch": 72} {"train_loss": -17.091215133666992, "global_step": 6001, "epoch": 72} {"train_loss": -17.020389556884766, "global_step": 6002, "epoch": 72} {"train_loss": -16.96463394165039, "global_step": 6003, "epoch": 72} {"train_loss": -16.907129287719727, "global_step": 6004, "epoch": 72} {"train_loss": -17.10811424255371, "global_step": 6005, "epoch": 72} {"train_loss": -17.051687240600586, "global_step": 6006, "epoch": 72} {"train_loss": -16.997339248657227, "global_step": 6007, "epoch": 72} {"train_loss": -16.934757232666016, "global_step": 6008, "epoch": 72} {"train_loss": -16.932912826538086, "global_step": 6009, "epoch": 72} {"train_loss": -16.832551956176758, "global_step": 6010, "epoch": 72} {"train_loss": -17.099658966064453, "global_step": 6011, "epoch": 72} {"train_loss": -16.857250213623047, "global_step": 6012, "epoch": 72} {"train_loss": -17.095075607299805, "global_step": 6013, "epoch": 72} {"train_loss": -16.89568519592285, "global_step": 6014, "epoch": 72} {"train_loss": -16.59503173828125, "global_step": 6015, "epoch": 72} {"train_loss": -16.413589477539062, "global_step": 6016, "epoch": 72} {"train_loss": -16.532447814941406, "global_step": 6017, "epoch": 72} {"train_loss": -17.16090965270996, "global_step": 6018, "epoch": 72} {"train_loss": -16.722023010253906, "global_step": 6019, "epoch": 72} {"train_loss": -17.086210250854492, "global_step": 6020, "epoch": 72} {"train_loss": -17.000158309936523, "global_step": 6021, "epoch": 72} {"train_loss": -16.837772369384766, "global_step": 6022, "epoch": 72} {"train_loss": -16.927753448486328, "global_step": 6023, "epoch": 72} {"train_loss": -16.40871238708496, "global_step": 6024, "epoch": 72} {"train_loss": -16.766096115112305, "global_step": 6025, "epoch": 72} {"train_loss": -16.920812606811523, "global_step": 6026, "epoch": 72} {"train_loss": -16.383838653564453, "global_step": 6027, "epoch": 72} {"train_loss": -17.062360763549805, "global_step": 6028, "epoch": 72} {"train_loss": -16.580337524414062, "global_step": 6029, "epoch": 72} {"train_loss": -16.436582565307617, "global_step": 6030, "epoch": 72} {"train_loss": -16.944442749023438, "global_step": 6031, "epoch": 72} {"train_loss": -16.804059982299805, "global_step": 6032, "epoch": 72} {"train_loss": -16.873065948486328, "global_step": 6033, "epoch": 72} {"train_loss": -16.94851303100586, "global_step": 6034, "epoch": 72} {"train_loss": -16.634830474853516, "global_step": 6035, "epoch": 72} {"train_loss": -17.14162254333496, "global_step": 6036, "epoch": 72} {"train_loss": -17.07071876525879, "global_step": 6037, "epoch": 72} {"train_loss": -17.144086837768555, "global_step": 6038, "epoch": 72} {"train_loss": -16.956409454345703, "global_step": 6039, "epoch": 72} {"train_loss": -17.228120803833008, "global_step": 6040, "epoch": 72} {"train_loss": -16.87310218811035, "global_step": 6041, "epoch": 72} {"train_loss": -16.92937660217285, "global_step": 6042, "epoch": 72} {"train_loss": -17.31429672241211, "global_step": 6043, "epoch": 72} {"train_loss": -17.056989669799805, "global_step": 6044, "epoch": 72} {"train_loss": -16.88250160217285, "global_step": 6045, "epoch": 72} {"train_loss": -17.19048309326172, "global_step": 6046, "epoch": 72} {"train_loss": -16.95995330810547, "global_step": 6047, "epoch": 72} {"train_loss": -17.043893814086914, "global_step": 6048, "epoch": 72} {"train_loss": -17.2630672454834, "global_step": 6049, "epoch": 72} {"train_loss": -16.951547622680664, "global_step": 6050, "epoch": 72} {"train_loss": -16.93264389038086, "global_step": 6051, "epoch": 72} {"train_loss": -16.817462921142578, "global_step": 6052, "epoch": 72} {"train_loss": -17.058467864990234, "global_step": 6053, "epoch": 72} {"train_loss": -16.52623176574707, "global_step": 6054, "epoch": 72} {"train_loss": -17.11830711364746, "global_step": 6055, "epoch": 72} {"train_loss": -17.052934646606445, "global_step": 6056, "epoch": 72} {"train_loss": -16.92276954650879, "global_step": 6057, "epoch": 72} {"train_loss": -16.90217405342194, "global_step": 6058, "epoch": 72, "val_loss": 6806420.0} {"train_loss": -16.652393341064453, "global_step": 6059, "epoch": 73} {"train_loss": -16.416940689086914, "global_step": 6060, "epoch": 73} {"train_loss": -16.404600143432617, "global_step": 6061, "epoch": 73} {"train_loss": -16.69355583190918, "global_step": 6062, "epoch": 73} {"train_loss": -16.761945724487305, "global_step": 6063, "epoch": 73} {"train_loss": -17.157438278198242, "global_step": 6064, "epoch": 73} {"train_loss": -16.28759765625, "global_step": 6065, "epoch": 73} {"train_loss": -16.5888729095459, "global_step": 6066, "epoch": 73} {"train_loss": -16.5612735748291, "global_step": 6067, "epoch": 73} {"train_loss": -16.707542419433594, "global_step": 6068, "epoch": 73} {"train_loss": -16.54378318786621, "global_step": 6069, "epoch": 73} {"train_loss": -16.409011840820312, "global_step": 6070, "epoch": 73} {"train_loss": -16.823057174682617, "global_step": 6071, "epoch": 73} {"train_loss": -17.379270553588867, "global_step": 6072, "epoch": 73} {"train_loss": -16.841474533081055, "global_step": 6073, "epoch": 73} {"train_loss": -16.784597396850586, "global_step": 6074, "epoch": 73} {"train_loss": -16.646848678588867, "global_step": 6075, "epoch": 73} {"train_loss": -16.839111328125, "global_step": 6076, "epoch": 73} {"train_loss": -17.112775802612305, "global_step": 6077, "epoch": 73} {"train_loss": -17.173587799072266, "global_step": 6078, "epoch": 73} {"train_loss": -17.015897750854492, "global_step": 6079, "epoch": 73} {"train_loss": -17.14393424987793, "global_step": 6080, "epoch": 73} {"train_loss": -16.78603172302246, "global_step": 6081, "epoch": 73} {"train_loss": -16.896116256713867, "global_step": 6082, "epoch": 73} {"train_loss": -17.1977596282959, "global_step": 6083, "epoch": 73} {"train_loss": -16.79410171508789, "global_step": 6084, "epoch": 73} {"train_loss": -16.81892204284668, "global_step": 6085, "epoch": 73} {"train_loss": -17.034826278686523, "global_step": 6086, "epoch": 73} {"train_loss": -16.849990844726562, "global_step": 6087, "epoch": 73} {"train_loss": -16.994430541992188, "global_step": 6088, "epoch": 73} {"train_loss": -17.25555992126465, "global_step": 6089, "epoch": 73} {"train_loss": -16.675153732299805, "global_step": 6090, "epoch": 73} {"train_loss": -16.891469955444336, "global_step": 6091, "epoch": 73} {"train_loss": -16.93807029724121, "global_step": 6092, "epoch": 73} {"train_loss": -17.01068687438965, "global_step": 6093, "epoch": 73} {"train_loss": -17.081741333007812, "global_step": 6094, "epoch": 73} {"train_loss": -17.206024169921875, "global_step": 6095, "epoch": 73} {"train_loss": -17.132160186767578, "global_step": 6096, "epoch": 73} {"train_loss": -16.91718864440918, "global_step": 6097, "epoch": 73} {"train_loss": -17.074487686157227, "global_step": 6098, "epoch": 73} {"train_loss": -17.22975730895996, "global_step": 6099, "epoch": 73} {"train_loss": -17.154556274414062, "global_step": 6100, "epoch": 73} {"train_loss": -17.109193801879883, "global_step": 6101, "epoch": 73} {"train_loss": -16.7041015625, "global_step": 6102, "epoch": 73} {"train_loss": -17.137130737304688, "global_step": 6103, "epoch": 73} {"train_loss": -16.56367301940918, "global_step": 6104, "epoch": 73} {"train_loss": -17.03499412536621, "global_step": 6105, "epoch": 73} {"train_loss": -17.0053768157959, "global_step": 6106, "epoch": 73} {"train_loss": -17.26069450378418, "global_step": 6107, "epoch": 73} {"train_loss": -16.829782485961914, "global_step": 6108, "epoch": 73} {"train_loss": -16.98455810546875, "global_step": 6109, "epoch": 73} {"train_loss": -16.95694351196289, "global_step": 6110, "epoch": 73} {"train_loss": -16.893659591674805, "global_step": 6111, "epoch": 73} {"train_loss": -17.006994247436523, "global_step": 6112, "epoch": 73} {"train_loss": -17.00697898864746, "global_step": 6113, "epoch": 73} {"train_loss": -17.294452667236328, "global_step": 6114, "epoch": 73} {"train_loss": -16.8407039642334, "global_step": 6115, "epoch": 73} {"train_loss": -16.98556137084961, "global_step": 6116, "epoch": 73} {"train_loss": -16.877216339111328, "global_step": 6117, "epoch": 73} {"train_loss": -17.196455001831055, "global_step": 6118, "epoch": 73} {"train_loss": -16.88010597229004, "global_step": 6119, "epoch": 73} {"train_loss": -16.957656860351562, "global_step": 6120, "epoch": 73} {"train_loss": -17.18748664855957, "global_step": 6121, "epoch": 73} {"train_loss": -16.954608917236328, "global_step": 6122, "epoch": 73} {"train_loss": -16.916433334350586, "global_step": 6123, "epoch": 73} {"train_loss": -17.264101028442383, "global_step": 6124, "epoch": 73} {"train_loss": -17.134300231933594, "global_step": 6125, "epoch": 73} {"train_loss": -17.4450626373291, "global_step": 6126, "epoch": 73} {"train_loss": -17.064762115478516, "global_step": 6127, "epoch": 73} {"train_loss": -17.29368019104004, "global_step": 6128, "epoch": 73} {"train_loss": -17.08054542541504, "global_step": 6129, "epoch": 73} {"train_loss": -16.227476119995117, "global_step": 6130, "epoch": 73} {"train_loss": -17.25611114501953, "global_step": 6131, "epoch": 73} {"train_loss": -16.781984329223633, "global_step": 6132, "epoch": 73} {"train_loss": -17.0782413482666, "global_step": 6133, "epoch": 73} {"train_loss": -17.099233627319336, "global_step": 6134, "epoch": 73} {"train_loss": -17.02191734313965, "global_step": 6135, "epoch": 73} {"train_loss": -17.0321102142334, "global_step": 6136, "epoch": 73} {"train_loss": -16.948917388916016, "global_step": 6137, "epoch": 73} {"train_loss": -16.944669723510742, "global_step": 6138, "epoch": 73} {"train_loss": -17.319229125976562, "global_step": 6139, "epoch": 73} {"train_loss": -17.028303146362305, "global_step": 6140, "epoch": 73} {"train_loss": -16.938183841935125, "global_step": 6141, "epoch": 73, "val_loss": 6763182.5} {"train_loss": -17.073591232299805, "global_step": 6142, "epoch": 74} {"train_loss": -16.70452880859375, "global_step": 6143, "epoch": 74} {"train_loss": -17.04659080505371, "global_step": 6144, "epoch": 74} {"train_loss": -16.871826171875, "global_step": 6145, "epoch": 74} {"train_loss": -16.701566696166992, "global_step": 6146, "epoch": 74} {"train_loss": -17.186344146728516, "global_step": 6147, "epoch": 74} {"train_loss": -16.521596908569336, "global_step": 6148, "epoch": 74} {"train_loss": -17.01618003845215, "global_step": 6149, "epoch": 74} {"train_loss": -16.6264591217041, "global_step": 6150, "epoch": 74} {"train_loss": -16.93073081970215, "global_step": 6151, "epoch": 74} {"train_loss": -17.191801071166992, "global_step": 6152, "epoch": 74} {"train_loss": -16.96625328063965, "global_step": 6153, "epoch": 74} {"train_loss": -16.778181076049805, "global_step": 6154, "epoch": 74} {"train_loss": -16.871389389038086, "global_step": 6155, "epoch": 74} {"train_loss": -16.7171573638916, "global_step": 6156, "epoch": 74} {"train_loss": -16.809904098510742, "global_step": 6157, "epoch": 74} {"train_loss": -17.248849868774414, "global_step": 6158, "epoch": 74} {"train_loss": -17.333251953125, "global_step": 6159, "epoch": 74} {"train_loss": -17.050493240356445, "global_step": 6160, "epoch": 74} {"train_loss": -17.29585838317871, "global_step": 6161, "epoch": 74} {"train_loss": -16.559091567993164, "global_step": 6162, "epoch": 74} {"train_loss": -17.126571655273438, "global_step": 6163, "epoch": 74} {"train_loss": -16.809406280517578, "global_step": 6164, "epoch": 74} {"train_loss": -16.92045783996582, "global_step": 6165, "epoch": 74} {"train_loss": -17.260475158691406, "global_step": 6166, "epoch": 74} {"train_loss": -17.00241470336914, "global_step": 6167, "epoch": 74} {"train_loss": -16.88141441345215, "global_step": 6168, "epoch": 74} {"train_loss": -17.1004695892334, "global_step": 6169, "epoch": 74} {"train_loss": -16.823644638061523, "global_step": 6170, "epoch": 74} {"train_loss": -17.131689071655273, "global_step": 6171, "epoch": 74} {"train_loss": -17.101224899291992, "global_step": 6172, "epoch": 74} {"train_loss": -16.94942283630371, "global_step": 6173, "epoch": 74} {"train_loss": -16.922428131103516, "global_step": 6174, "epoch": 74} {"train_loss": -17.139663696289062, "global_step": 6175, "epoch": 74} {"train_loss": -16.7867488861084, "global_step": 6176, "epoch": 74} {"train_loss": -16.945219039916992, "global_step": 6177, "epoch": 74} {"train_loss": -17.438318252563477, "global_step": 6178, "epoch": 74} {"train_loss": -16.979217529296875, "global_step": 6179, "epoch": 74} {"train_loss": -16.997882843017578, "global_step": 6180, "epoch": 74} {"train_loss": -16.721271514892578, "global_step": 6181, "epoch": 74} {"train_loss": -17.193124771118164, "global_step": 6182, "epoch": 74} {"train_loss": -16.683469772338867, "global_step": 6183, "epoch": 74} {"train_loss": -17.14601707458496, "global_step": 6184, "epoch": 74} {"train_loss": -17.037282943725586, "global_step": 6185, "epoch": 74} {"train_loss": -17.119901657104492, "global_step": 6186, "epoch": 74} {"train_loss": -16.918947219848633, "global_step": 6187, "epoch": 74} {"train_loss": -17.04371452331543, "global_step": 6188, "epoch": 74} {"train_loss": -17.06162452697754, "global_step": 6189, "epoch": 74} {"train_loss": -16.883502960205078, "global_step": 6190, "epoch": 74} {"train_loss": -16.884437561035156, "global_step": 6191, "epoch": 74} {"train_loss": -17.099552154541016, "global_step": 6192, "epoch": 74} {"train_loss": -17.540559768676758, "global_step": 6193, "epoch": 74} {"train_loss": -17.190311431884766, "global_step": 6194, "epoch": 74} {"train_loss": -17.05177116394043, "global_step": 6195, "epoch": 74} {"train_loss": -16.917001724243164, "global_step": 6196, "epoch": 74} {"train_loss": -16.794836044311523, "global_step": 6197, "epoch": 74} {"train_loss": -16.871999740600586, "global_step": 6198, "epoch": 74} {"train_loss": -16.97426414489746, "global_step": 6199, "epoch": 74} {"train_loss": -16.705080032348633, "global_step": 6200, "epoch": 74} {"train_loss": -16.938302993774414, "global_step": 6201, "epoch": 74} {"train_loss": -17.224374771118164, "global_step": 6202, "epoch": 74} {"train_loss": -16.961933135986328, "global_step": 6203, "epoch": 74} {"train_loss": -16.995874404907227, "global_step": 6204, "epoch": 74} {"train_loss": -17.355871200561523, "global_step": 6205, "epoch": 74} {"train_loss": -17.15245246887207, "global_step": 6206, "epoch": 74} {"train_loss": -17.245264053344727, "global_step": 6207, "epoch": 74} {"train_loss": -16.78026008605957, "global_step": 6208, "epoch": 74} {"train_loss": -17.306934356689453, "global_step": 6209, "epoch": 74} {"train_loss": -17.063289642333984, "global_step": 6210, "epoch": 74} {"train_loss": -17.19375228881836, "global_step": 6211, "epoch": 74} {"train_loss": -16.882524490356445, "global_step": 6212, "epoch": 74} {"train_loss": -17.170974731445312, "global_step": 6213, "epoch": 74} {"train_loss": -17.00503158569336, "global_step": 6214, "epoch": 74} {"train_loss": -16.9659366607666, "global_step": 6215, "epoch": 74} {"train_loss": -17.07378578186035, "global_step": 6216, "epoch": 74} {"train_loss": -17.105316162109375, "global_step": 6217, "epoch": 74} {"train_loss": -17.081571578979492, "global_step": 6218, "epoch": 74} {"train_loss": -17.001630783081055, "global_step": 6219, "epoch": 74} {"train_loss": -16.596250534057617, "global_step": 6220, "epoch": 74} {"train_loss": -16.985807418823242, "global_step": 6221, "epoch": 74} {"train_loss": -17.128698348999023, "global_step": 6222, "epoch": 74} {"train_loss": -16.89504623413086, "global_step": 6223, "epoch": 74} {"train_loss": -16.995696630822607, "global_step": 6224, "epoch": 74, "val_loss": 6572091.0} {"train_loss": -17.084026336669922, "global_step": 6225, "epoch": 75} {"train_loss": -16.74526023864746, "global_step": 6226, "epoch": 75} {"train_loss": -17.141096115112305, "global_step": 6227, "epoch": 75} {"train_loss": -17.047468185424805, "global_step": 6228, "epoch": 75} {"train_loss": -17.086523056030273, "global_step": 6229, "epoch": 75} {"train_loss": -16.84345817565918, "global_step": 6230, "epoch": 75} {"train_loss": -17.230661392211914, "global_step": 6231, "epoch": 75} {"train_loss": -17.0916805267334, "global_step": 6232, "epoch": 75} {"train_loss": -16.74649429321289, "global_step": 6233, "epoch": 75} {"train_loss": -16.607892990112305, "global_step": 6234, "epoch": 75} {"train_loss": -16.69858169555664, "global_step": 6235, "epoch": 75} {"train_loss": -16.897125244140625, "global_step": 6236, "epoch": 75} {"train_loss": -17.08157730102539, "global_step": 6237, "epoch": 75} {"train_loss": -16.616361618041992, "global_step": 6238, "epoch": 75} {"train_loss": -16.97402000427246, "global_step": 6239, "epoch": 75} {"train_loss": -17.046720504760742, "global_step": 6240, "epoch": 75} {"train_loss": -17.117725372314453, "global_step": 6241, "epoch": 75} {"train_loss": -17.109943389892578, "global_step": 6242, "epoch": 75} {"train_loss": -17.03306007385254, "global_step": 6243, "epoch": 75} {"train_loss": -16.957883834838867, "global_step": 6244, "epoch": 75} {"train_loss": -16.944517135620117, "global_step": 6245, "epoch": 75} {"train_loss": -16.52005958557129, "global_step": 6246, "epoch": 75} {"train_loss": -16.903701782226562, "global_step": 6247, "epoch": 75} {"train_loss": -17.183582305908203, "global_step": 6248, "epoch": 75} {"train_loss": -16.76114845275879, "global_step": 6249, "epoch": 75} {"train_loss": -17.17437171936035, "global_step": 6250, "epoch": 75} {"train_loss": -17.005216598510742, "global_step": 6251, "epoch": 75} {"train_loss": -17.4056339263916, "global_step": 6252, "epoch": 75} {"train_loss": -17.2657413482666, "global_step": 6253, "epoch": 75} {"train_loss": -17.01357078552246, "global_step": 6254, "epoch": 75} {"train_loss": -17.469865798950195, "global_step": 6255, "epoch": 75} {"train_loss": -17.43182945251465, "global_step": 6256, "epoch": 75} {"train_loss": -16.709306716918945, "global_step": 6257, "epoch": 75} {"train_loss": -17.287662506103516, "global_step": 6258, "epoch": 75} {"train_loss": -16.94434928894043, "global_step": 6259, "epoch": 75} {"train_loss": -17.0240421295166, "global_step": 6260, "epoch": 75} {"train_loss": -17.31214141845703, "global_step": 6261, "epoch": 75} {"train_loss": -17.236650466918945, "global_step": 6262, "epoch": 75} {"train_loss": -16.861270904541016, "global_step": 6263, "epoch": 75} {"train_loss": -16.829587936401367, "global_step": 6264, "epoch": 75} {"train_loss": -17.06525993347168, "global_step": 6265, "epoch": 75} {"train_loss": -17.121932983398438, "global_step": 6266, "epoch": 75} {"train_loss": -17.183496475219727, "global_step": 6267, "epoch": 75} {"train_loss": -16.92731285095215, "global_step": 6268, "epoch": 75} {"train_loss": -17.177608489990234, "global_step": 6269, "epoch": 75} {"train_loss": -17.07146644592285, "global_step": 6270, "epoch": 75} {"train_loss": -17.071985244750977, "global_step": 6271, "epoch": 75} {"train_loss": -16.90071678161621, "global_step": 6272, "epoch": 75} {"train_loss": -16.84677505493164, "global_step": 6273, "epoch": 75} {"train_loss": -17.177026748657227, "global_step": 6274, "epoch": 75} {"train_loss": -16.626096725463867, "global_step": 6275, "epoch": 75} {"train_loss": -16.80588150024414, "global_step": 6276, "epoch": 75} {"train_loss": -17.097623825073242, "global_step": 6277, "epoch": 75} {"train_loss": -17.158430099487305, "global_step": 6278, "epoch": 75} {"train_loss": -16.91370964050293, "global_step": 6279, "epoch": 75} {"train_loss": -17.035642623901367, "global_step": 6280, "epoch": 75} {"train_loss": -17.016035079956055, "global_step": 6281, "epoch": 75} {"train_loss": -17.182369232177734, "global_step": 6282, "epoch": 75} {"train_loss": -16.932554244995117, "global_step": 6283, "epoch": 75} {"train_loss": -16.729711532592773, "global_step": 6284, "epoch": 75} {"train_loss": -17.02686309814453, "global_step": 6285, "epoch": 75} {"train_loss": -16.533063888549805, "global_step": 6286, "epoch": 75} {"train_loss": -17.159025192260742, "global_step": 6287, "epoch": 75} {"train_loss": -17.48432159423828, "global_step": 6288, "epoch": 75} {"train_loss": -16.95902442932129, "global_step": 6289, "epoch": 75} {"train_loss": -17.4365291595459, "global_step": 6290, "epoch": 75} {"train_loss": -17.172958374023438, "global_step": 6291, "epoch": 75} {"train_loss": -17.16777992248535, "global_step": 6292, "epoch": 75} {"train_loss": -17.02930450439453, "global_step": 6293, "epoch": 75} {"train_loss": -17.438888549804688, "global_step": 6294, "epoch": 75} {"train_loss": -17.130165100097656, "global_step": 6295, "epoch": 75} {"train_loss": -17.10558319091797, "global_step": 6296, "epoch": 75} {"train_loss": -16.77862548828125, "global_step": 6297, "epoch": 75} {"train_loss": -16.692930221557617, "global_step": 6298, "epoch": 75} {"train_loss": -17.35567283630371, "global_step": 6299, "epoch": 75} {"train_loss": -17.10015296936035, "global_step": 6300, "epoch": 75} {"train_loss": -17.31220054626465, "global_step": 6301, "epoch": 75} {"train_loss": -17.40748405456543, "global_step": 6302, "epoch": 75} {"train_loss": -16.872848510742188, "global_step": 6303, "epoch": 75} {"train_loss": -17.14445686340332, "global_step": 6304, "epoch": 75} {"train_loss": -17.345155715942383, "global_step": 6305, "epoch": 75} {"train_loss": -16.839187622070312, "global_step": 6306, "epoch": 75} {"train_loss": -17.04753241481551, "global_step": 6307, "epoch": 75, "val_loss": 6847385.0} {"train_loss": -16.606870651245117, "global_step": 6308, "epoch": 76} {"train_loss": -16.946903228759766, "global_step": 6309, "epoch": 76} {"train_loss": -16.92603874206543, "global_step": 6310, "epoch": 76} {"train_loss": -16.89097023010254, "global_step": 6311, "epoch": 76} {"train_loss": -16.700014114379883, "global_step": 6312, "epoch": 76} {"train_loss": -17.35304832458496, "global_step": 6313, "epoch": 76} {"train_loss": -17.262296676635742, "global_step": 6314, "epoch": 76} {"train_loss": -16.53720474243164, "global_step": 6315, "epoch": 76} {"train_loss": -16.8394775390625, "global_step": 6316, "epoch": 76} {"train_loss": -17.312604904174805, "global_step": 6317, "epoch": 76} {"train_loss": -16.872541427612305, "global_step": 6318, "epoch": 76} {"train_loss": -17.042003631591797, "global_step": 6319, "epoch": 76} {"train_loss": -17.495956420898438, "global_step": 6320, "epoch": 76} {"train_loss": -17.193958282470703, "global_step": 6321, "epoch": 76} {"train_loss": -17.21675682067871, "global_step": 6322, "epoch": 76} {"train_loss": -17.48782730102539, "global_step": 6323, "epoch": 76} {"train_loss": -17.115400314331055, "global_step": 6324, "epoch": 76} {"train_loss": -16.982961654663086, "global_step": 6325, "epoch": 76} {"train_loss": -17.085954666137695, "global_step": 6326, "epoch": 76} {"train_loss": -16.89454460144043, "global_step": 6327, "epoch": 76} {"train_loss": -17.30341148376465, "global_step": 6328, "epoch": 76} {"train_loss": -16.81915855407715, "global_step": 6329, "epoch": 76} {"train_loss": -17.082115173339844, "global_step": 6330, "epoch": 76} {"train_loss": -16.92856216430664, "global_step": 6331, "epoch": 76} {"train_loss": -16.93943214416504, "global_step": 6332, "epoch": 76} {"train_loss": -17.39278221130371, "global_step": 6333, "epoch": 76} {"train_loss": -17.16697883605957, "global_step": 6334, "epoch": 76} {"train_loss": -17.282913208007812, "global_step": 6335, "epoch": 76} {"train_loss": -17.011232376098633, "global_step": 6336, "epoch": 76} {"train_loss": -17.19646644592285, "global_step": 6337, "epoch": 76} {"train_loss": -17.17030906677246, "global_step": 6338, "epoch": 76} {"train_loss": -16.711517333984375, "global_step": 6339, "epoch": 76} {"train_loss": -17.299570083618164, "global_step": 6340, "epoch": 76} {"train_loss": -17.250844955444336, "global_step": 6341, "epoch": 76} {"train_loss": -16.907873153686523, "global_step": 6342, "epoch": 76} {"train_loss": -17.097564697265625, "global_step": 6343, "epoch": 76} {"train_loss": -16.89281463623047, "global_step": 6344, "epoch": 76} {"train_loss": -16.649627685546875, "global_step": 6345, "epoch": 76} {"train_loss": -17.130773544311523, "global_step": 6346, "epoch": 76} {"train_loss": -17.385404586791992, "global_step": 6347, "epoch": 76} {"train_loss": -16.929601669311523, "global_step": 6348, "epoch": 76} {"train_loss": -17.11192512512207, "global_step": 6349, "epoch": 76} {"train_loss": -17.371030807495117, "global_step": 6350, "epoch": 76} {"train_loss": -17.18540382385254, "global_step": 6351, "epoch": 76} {"train_loss": -17.1959285736084, "global_step": 6352, "epoch": 76} {"train_loss": -17.11329460144043, "global_step": 6353, "epoch": 76} {"train_loss": -17.129695892333984, "global_step": 6354, "epoch": 76} {"train_loss": -17.13397789001465, "global_step": 6355, "epoch": 76} {"train_loss": -17.07529640197754, "global_step": 6356, "epoch": 76} {"train_loss": -16.740636825561523, "global_step": 6357, "epoch": 76} {"train_loss": -16.999988555908203, "global_step": 6358, "epoch": 76} {"train_loss": -17.211244583129883, "global_step": 6359, "epoch": 76} {"train_loss": -17.1102352142334, "global_step": 6360, "epoch": 76} {"train_loss": -17.549352645874023, "global_step": 6361, "epoch": 76} {"train_loss": -16.89375877380371, "global_step": 6362, "epoch": 76} {"train_loss": -16.823522567749023, "global_step": 6363, "epoch": 76} {"train_loss": -17.2266902923584, "global_step": 6364, "epoch": 76} {"train_loss": -17.28688621520996, "global_step": 6365, "epoch": 76} {"train_loss": -17.42589569091797, "global_step": 6366, "epoch": 76} {"train_loss": -17.006698608398438, "global_step": 6367, "epoch": 76} {"train_loss": -17.18977928161621, "global_step": 6368, "epoch": 76} {"train_loss": -16.646240234375, "global_step": 6369, "epoch": 76} {"train_loss": -17.375410079956055, "global_step": 6370, "epoch": 76} {"train_loss": -16.641441345214844, "global_step": 6371, "epoch": 76} {"train_loss": -16.95978355407715, "global_step": 6372, "epoch": 76} {"train_loss": -17.046674728393555, "global_step": 6373, "epoch": 76} {"train_loss": -17.21160888671875, "global_step": 6374, "epoch": 76} {"train_loss": -17.1186580657959, "global_step": 6375, "epoch": 76} {"train_loss": -17.118915557861328, "global_step": 6376, "epoch": 76} {"train_loss": -16.708683013916016, "global_step": 6377, "epoch": 76} {"train_loss": -17.04970359802246, "global_step": 6378, "epoch": 76} {"train_loss": -17.008907318115234, "global_step": 6379, "epoch": 76} {"train_loss": -17.147336959838867, "global_step": 6380, "epoch": 76} {"train_loss": -17.590103149414062, "global_step": 6381, "epoch": 76} {"train_loss": -16.727340698242188, "global_step": 6382, "epoch": 76} {"train_loss": -16.895845413208008, "global_step": 6383, "epoch": 76} {"train_loss": -17.218664169311523, "global_step": 6384, "epoch": 76} {"train_loss": -16.931753158569336, "global_step": 6385, "epoch": 76} {"train_loss": -16.74650001525879, "global_step": 6386, "epoch": 76} {"train_loss": -17.3978214263916, "global_step": 6387, "epoch": 76} {"train_loss": -16.97199821472168, "global_step": 6388, "epoch": 76} {"train_loss": -16.857511520385742, "global_step": 6389, "epoch": 76} {"train_loss": -17.038726703230157, "global_step": 6390, "epoch": 76, "val_loss": 6800600.0} {"train_loss": -16.64324378967285, "global_step": 6391, "epoch": 77} {"train_loss": -16.8741455078125, "global_step": 6392, "epoch": 77} {"train_loss": -17.09930419921875, "global_step": 6393, "epoch": 77} {"train_loss": -17.077301025390625, "global_step": 6394, "epoch": 77} {"train_loss": -16.709266662597656, "global_step": 6395, "epoch": 77} {"train_loss": -17.108997344970703, "global_step": 6396, "epoch": 77} {"train_loss": -17.04901695251465, "global_step": 6397, "epoch": 77} {"train_loss": -17.08351707458496, "global_step": 6398, "epoch": 77} {"train_loss": -17.081632614135742, "global_step": 6399, "epoch": 77} {"train_loss": -17.154468536376953, "global_step": 6400, "epoch": 77} {"train_loss": -16.65771484375, "global_step": 6401, "epoch": 77} {"train_loss": -16.84909439086914, "global_step": 6402, "epoch": 77} {"train_loss": -17.092344284057617, "global_step": 6403, "epoch": 77} {"train_loss": -16.755863189697266, "global_step": 6404, "epoch": 77} {"train_loss": -16.956192016601562, "global_step": 6405, "epoch": 77} {"train_loss": -17.269941329956055, "global_step": 6406, "epoch": 77} {"train_loss": -17.097036361694336, "global_step": 6407, "epoch": 77} {"train_loss": -17.121673583984375, "global_step": 6408, "epoch": 77} {"train_loss": -16.853967666625977, "global_step": 6409, "epoch": 77} {"train_loss": -17.381689071655273, "global_step": 6410, "epoch": 77} {"train_loss": -17.24460792541504, "global_step": 6411, "epoch": 77} {"train_loss": -17.10410499572754, "global_step": 6412, "epoch": 77} {"train_loss": -17.101774215698242, "global_step": 6413, "epoch": 77} {"train_loss": -16.7984676361084, "global_step": 6414, "epoch": 77} {"train_loss": -17.03316879272461, "global_step": 6415, "epoch": 77} {"train_loss": -17.199182510375977, "global_step": 6416, "epoch": 77} {"train_loss": -17.028579711914062, "global_step": 6417, "epoch": 77} {"train_loss": -17.607702255249023, "global_step": 6418, "epoch": 77} {"train_loss": -17.000730514526367, "global_step": 6419, "epoch": 77} {"train_loss": -16.81416893005371, "global_step": 6420, "epoch": 77} {"train_loss": -17.24146842956543, "global_step": 6421, "epoch": 77} {"train_loss": -16.991859436035156, "global_step": 6422, "epoch": 77} {"train_loss": -16.839038848876953, "global_step": 6423, "epoch": 77} {"train_loss": -16.616226196289062, "global_step": 6424, "epoch": 77} {"train_loss": -17.191171646118164, "global_step": 6425, "epoch": 77} {"train_loss": -17.074960708618164, "global_step": 6426, "epoch": 77} {"train_loss": -16.921049118041992, "global_step": 6427, "epoch": 77} {"train_loss": -16.97889518737793, "global_step": 6428, "epoch": 77} {"train_loss": -16.99287986755371, "global_step": 6429, "epoch": 77} {"train_loss": -17.386747360229492, "global_step": 6430, "epoch": 77} {"train_loss": -17.128143310546875, "global_step": 6431, "epoch": 77} {"train_loss": -16.909147262573242, "global_step": 6432, "epoch": 77} {"train_loss": -17.456857681274414, "global_step": 6433, "epoch": 77} {"train_loss": -17.3592586517334, "global_step": 6434, "epoch": 77} {"train_loss": -16.46088981628418, "global_step": 6435, "epoch": 77} {"train_loss": -17.247465133666992, "global_step": 6436, "epoch": 77} {"train_loss": -17.26674461364746, "global_step": 6437, "epoch": 77} {"train_loss": -17.26352310180664, "global_step": 6438, "epoch": 77} {"train_loss": -17.259546279907227, "global_step": 6439, "epoch": 77} {"train_loss": -17.303796768188477, "global_step": 6440, "epoch": 77} {"train_loss": -16.922285079956055, "global_step": 6441, "epoch": 77} {"train_loss": -17.141557693481445, "global_step": 6442, "epoch": 77} {"train_loss": -17.16037940979004, "global_step": 6443, "epoch": 77} {"train_loss": -17.31540870666504, "global_step": 6444, "epoch": 77} {"train_loss": -16.927770614624023, "global_step": 6445, "epoch": 77} {"train_loss": -17.428190231323242, "global_step": 6446, "epoch": 77} {"train_loss": -17.230695724487305, "global_step": 6447, "epoch": 77} {"train_loss": -17.161880493164062, "global_step": 6448, "epoch": 77} {"train_loss": -17.35617446899414, "global_step": 6449, "epoch": 77} {"train_loss": -17.075895309448242, "global_step": 6450, "epoch": 77} {"train_loss": -16.840986251831055, "global_step": 6451, "epoch": 77} {"train_loss": -16.739458084106445, "global_step": 6452, "epoch": 77} {"train_loss": -17.213653564453125, "global_step": 6453, "epoch": 77} {"train_loss": -17.4458065032959, "global_step": 6454, "epoch": 77} {"train_loss": -17.035690307617188, "global_step": 6455, "epoch": 77} {"train_loss": -17.31707191467285, "global_step": 6456, "epoch": 77} {"train_loss": -16.718217849731445, "global_step": 6457, "epoch": 77} {"train_loss": -16.867752075195312, "global_step": 6458, "epoch": 77} {"train_loss": -16.866901397705078, "global_step": 6459, "epoch": 77} {"train_loss": -16.911733627319336, "global_step": 6460, "epoch": 77} {"train_loss": -17.127771377563477, "global_step": 6461, "epoch": 77} {"train_loss": -17.220163345336914, "global_step": 6462, "epoch": 77} {"train_loss": -17.034442901611328, "global_step": 6463, "epoch": 77} {"train_loss": -16.917932510375977, "global_step": 6464, "epoch": 77} {"train_loss": -16.98274040222168, "global_step": 6465, "epoch": 77} {"train_loss": -17.19490623474121, "global_step": 6466, "epoch": 77} {"train_loss": -16.956411361694336, "global_step": 6467, "epoch": 77} {"train_loss": -17.135005950927734, "global_step": 6468, "epoch": 77} {"train_loss": -17.151830673217773, "global_step": 6469, "epoch": 77} {"train_loss": -17.017070770263672, "global_step": 6470, "epoch": 77} {"train_loss": -16.949953079223633, "global_step": 6471, "epoch": 77} {"train_loss": -17.3604679107666, "global_step": 6472, "epoch": 77} {"train_loss": -17.089008193418206, "global_step": 6473, "epoch": 77, "val_loss": 6600730.0} {"train_loss": -17.068265914916992, "global_step": 6474, "epoch": 78} {"train_loss": -17.376501083374023, "global_step": 6475, "epoch": 78} {"train_loss": -17.0379581451416, "global_step": 6476, "epoch": 78} {"train_loss": -17.212139129638672, "global_step": 6477, "epoch": 78} {"train_loss": -17.265878677368164, "global_step": 6478, "epoch": 78} {"train_loss": -17.13156509399414, "global_step": 6479, "epoch": 78} {"train_loss": -17.073322296142578, "global_step": 6480, "epoch": 78} {"train_loss": -17.751707077026367, "global_step": 6481, "epoch": 78} {"train_loss": -17.310806274414062, "global_step": 6482, "epoch": 78} {"train_loss": -17.078786849975586, "global_step": 6483, "epoch": 78} {"train_loss": -17.01202964782715, "global_step": 6484, "epoch": 78} {"train_loss": -16.92970848083496, "global_step": 6485, "epoch": 78} {"train_loss": -17.169591903686523, "global_step": 6486, "epoch": 78} {"train_loss": -17.059598922729492, "global_step": 6487, "epoch": 78} {"train_loss": -17.125736236572266, "global_step": 6488, "epoch": 78} {"train_loss": -17.279605865478516, "global_step": 6489, "epoch": 78} {"train_loss": -16.909015655517578, "global_step": 6490, "epoch": 78} {"train_loss": -16.786766052246094, "global_step": 6491, "epoch": 78} {"train_loss": -16.9710693359375, "global_step": 6492, "epoch": 78} {"train_loss": -17.203853607177734, "global_step": 6493, "epoch": 78} {"train_loss": -17.14313316345215, "global_step": 6494, "epoch": 78} {"train_loss": -16.934619903564453, "global_step": 6495, "epoch": 78} {"train_loss": -17.51805877685547, "global_step": 6496, "epoch": 78} {"train_loss": -16.917530059814453, "global_step": 6497, "epoch": 78} {"train_loss": -16.66068458557129, "global_step": 6498, "epoch": 78} {"train_loss": -17.10349464416504, "global_step": 6499, "epoch": 78} {"train_loss": -17.04877281188965, "global_step": 6500, "epoch": 78} {"train_loss": -17.401081085205078, "global_step": 6501, "epoch": 78} {"train_loss": -17.17041015625, "global_step": 6502, "epoch": 78} {"train_loss": -17.101764678955078, "global_step": 6503, "epoch": 78} {"train_loss": -16.940959930419922, "global_step": 6504, "epoch": 78} {"train_loss": -16.842313766479492, "global_step": 6505, "epoch": 78} {"train_loss": -17.18478775024414, "global_step": 6506, "epoch": 78} {"train_loss": -16.842992782592773, "global_step": 6507, "epoch": 78} {"train_loss": -16.974658966064453, "global_step": 6508, "epoch": 78} {"train_loss": -17.075164794921875, "global_step": 6509, "epoch": 78} {"train_loss": -17.3966121673584, "global_step": 6510, "epoch": 78} {"train_loss": -17.162220001220703, "global_step": 6511, "epoch": 78} {"train_loss": -16.85127830505371, "global_step": 6512, "epoch": 78} {"train_loss": -17.0122127532959, "global_step": 6513, "epoch": 78} {"train_loss": -16.955251693725586, "global_step": 6514, "epoch": 78} {"train_loss": -17.28144645690918, "global_step": 6515, "epoch": 78} {"train_loss": -17.131826400756836, "global_step": 6516, "epoch": 78} {"train_loss": -16.949926376342773, "global_step": 6517, "epoch": 78} {"train_loss": -17.614715576171875, "global_step": 6518, "epoch": 78} {"train_loss": -17.103620529174805, "global_step": 6519, "epoch": 78} {"train_loss": -16.959035873413086, "global_step": 6520, "epoch": 78} {"train_loss": -17.618284225463867, "global_step": 6521, "epoch": 78} {"train_loss": -16.719392776489258, "global_step": 6522, "epoch": 78} {"train_loss": -17.12229347229004, "global_step": 6523, "epoch": 78} {"train_loss": -17.42388916015625, "global_step": 6524, "epoch": 78} {"train_loss": -16.953168869018555, "global_step": 6525, "epoch": 78} {"train_loss": -17.216787338256836, "global_step": 6526, "epoch": 78} {"train_loss": -17.47504997253418, "global_step": 6527, "epoch": 78} {"train_loss": -17.160503387451172, "global_step": 6528, "epoch": 78} {"train_loss": -16.70876121520996, "global_step": 6529, "epoch": 78} {"train_loss": -17.143583297729492, "global_step": 6530, "epoch": 78} {"train_loss": -16.534637451171875, "global_step": 6531, "epoch": 78} {"train_loss": -16.938034057617188, "global_step": 6532, "epoch": 78} {"train_loss": -16.701316833496094, "global_step": 6533, "epoch": 78} {"train_loss": -17.00535011291504, "global_step": 6534, "epoch": 78} {"train_loss": -16.957006454467773, "global_step": 6535, "epoch": 78} {"train_loss": -16.61905860900879, "global_step": 6536, "epoch": 78} {"train_loss": -17.1505069732666, "global_step": 6537, "epoch": 78} {"train_loss": -17.259994506835938, "global_step": 6538, "epoch": 78} {"train_loss": -17.307723999023438, "global_step": 6539, "epoch": 78} {"train_loss": -17.37344741821289, "global_step": 6540, "epoch": 78} {"train_loss": -17.1513729095459, "global_step": 6541, "epoch": 78} {"train_loss": -17.33194923400879, "global_step": 6542, "epoch": 78} {"train_loss": -17.461578369140625, "global_step": 6543, "epoch": 78} {"train_loss": -17.1062068939209, "global_step": 6544, "epoch": 78} {"train_loss": -16.79672622680664, "global_step": 6545, "epoch": 78} {"train_loss": -17.300710678100586, "global_step": 6546, "epoch": 78} {"train_loss": -17.331270217895508, "global_step": 6547, "epoch": 78} {"train_loss": -17.313501358032227, "global_step": 6548, "epoch": 78} {"train_loss": -17.214298248291016, "global_step": 6549, "epoch": 78} {"train_loss": -17.113040924072266, "global_step": 6550, "epoch": 78} {"train_loss": -16.884973526000977, "global_step": 6551, "epoch": 78} {"train_loss": -16.683218002319336, "global_step": 6552, "epoch": 78} {"train_loss": -17.154356002807617, "global_step": 6553, "epoch": 78} {"train_loss": -17.308290481567383, "global_step": 6554, "epoch": 78} {"train_loss": -16.80684471130371, "global_step": 6555, "epoch": 78} {"train_loss": -17.12082449212132, "global_step": 6556, "epoch": 78, "val_loss": 6571949.0} {"train_loss": -17.21976661682129, "global_step": 6557, "epoch": 79} {"train_loss": -16.400835037231445, "global_step": 6558, "epoch": 79} {"train_loss": -16.795297622680664, "global_step": 6559, "epoch": 79} {"train_loss": -16.717851638793945, "global_step": 6560, "epoch": 79} {"train_loss": -17.430696487426758, "global_step": 6561, "epoch": 79} {"train_loss": -17.06495475769043, "global_step": 6562, "epoch": 79} {"train_loss": -17.09096336364746, "global_step": 6563, "epoch": 79} {"train_loss": -17.49680519104004, "global_step": 6564, "epoch": 79} {"train_loss": -17.138715744018555, "global_step": 6565, "epoch": 79} {"train_loss": -16.904279708862305, "global_step": 6566, "epoch": 79} {"train_loss": -17.536579132080078, "global_step": 6567, "epoch": 79} {"train_loss": -16.765119552612305, "global_step": 6568, "epoch": 79} {"train_loss": -17.162540435791016, "global_step": 6569, "epoch": 79} {"train_loss": -16.874176025390625, "global_step": 6570, "epoch": 79} {"train_loss": -17.03864860534668, "global_step": 6571, "epoch": 79} {"train_loss": -17.188547134399414, "global_step": 6572, "epoch": 79} {"train_loss": -16.96541404724121, "global_step": 6573, "epoch": 79} {"train_loss": -16.96158218383789, "global_step": 6574, "epoch": 79} {"train_loss": -17.110153198242188, "global_step": 6575, "epoch": 79} {"train_loss": -17.15535545349121, "global_step": 6576, "epoch": 79} {"train_loss": -17.067848205566406, "global_step": 6577, "epoch": 79} {"train_loss": -17.214187622070312, "global_step": 6578, "epoch": 79} {"train_loss": -17.30067253112793, "global_step": 6579, "epoch": 79} {"train_loss": -17.127805709838867, "global_step": 6580, "epoch": 79} {"train_loss": -17.49786949157715, "global_step": 6581, "epoch": 79} {"train_loss": -17.329914093017578, "global_step": 6582, "epoch": 79} {"train_loss": -17.46957778930664, "global_step": 6583, "epoch": 79} {"train_loss": -17.148534774780273, "global_step": 6584, "epoch": 79} {"train_loss": -17.25861930847168, "global_step": 6585, "epoch": 79} {"train_loss": -16.745458602905273, "global_step": 6586, "epoch": 79} {"train_loss": -17.670021057128906, "global_step": 6587, "epoch": 79} {"train_loss": -16.960739135742188, "global_step": 6588, "epoch": 79} {"train_loss": -17.56698989868164, "global_step": 6589, "epoch": 79} {"train_loss": -17.278730392456055, "global_step": 6590, "epoch": 79} {"train_loss": -17.1893310546875, "global_step": 6591, "epoch": 79} {"train_loss": -17.202682495117188, "global_step": 6592, "epoch": 79} {"train_loss": -16.973560333251953, "global_step": 6593, "epoch": 79} {"train_loss": -17.274381637573242, "global_step": 6594, "epoch": 79} {"train_loss": -16.924358367919922, "global_step": 6595, "epoch": 79} {"train_loss": -17.347335815429688, "global_step": 6596, "epoch": 79} {"train_loss": -17.19091796875, "global_step": 6597, "epoch": 79} {"train_loss": -17.418991088867188, "global_step": 6598, "epoch": 79} {"train_loss": -16.981821060180664, "global_step": 6599, "epoch": 79} {"train_loss": -17.065431594848633, "global_step": 6600, "epoch": 79} {"train_loss": -17.15987777709961, "global_step": 6601, "epoch": 79} {"train_loss": -17.038938522338867, "global_step": 6602, "epoch": 79} {"train_loss": -17.41572380065918, "global_step": 6603, "epoch": 79} {"train_loss": -16.9603328704834, "global_step": 6604, "epoch": 79} {"train_loss": -16.880300521850586, "global_step": 6605, "epoch": 79} {"train_loss": -17.5416316986084, "global_step": 6606, "epoch": 79} {"train_loss": -17.280263900756836, "global_step": 6607, "epoch": 79} {"train_loss": -17.35674476623535, "global_step": 6608, "epoch": 79} {"train_loss": -17.252120971679688, "global_step": 6609, "epoch": 79} {"train_loss": -17.248291015625, "global_step": 6610, "epoch": 79} {"train_loss": -17.03669548034668, "global_step": 6611, "epoch": 79} {"train_loss": -16.864898681640625, "global_step": 6612, "epoch": 79} {"train_loss": -17.37898826599121, "global_step": 6613, "epoch": 79} {"train_loss": -17.160947799682617, "global_step": 6614, "epoch": 79} {"train_loss": -17.15635108947754, "global_step": 6615, "epoch": 79} {"train_loss": -17.748281478881836, "global_step": 6616, "epoch": 79} {"train_loss": -17.233701705932617, "global_step": 6617, "epoch": 79} {"train_loss": -16.891633987426758, "global_step": 6618, "epoch": 79} {"train_loss": -17.05939292907715, "global_step": 6619, "epoch": 79} {"train_loss": -17.291236877441406, "global_step": 6620, "epoch": 79} {"train_loss": -17.1389217376709, "global_step": 6621, "epoch": 79} {"train_loss": -17.238819122314453, "global_step": 6622, "epoch": 79} {"train_loss": -17.146869659423828, "global_step": 6623, "epoch": 79} {"train_loss": -17.28829574584961, "global_step": 6624, "epoch": 79} {"train_loss": -17.113683700561523, "global_step": 6625, "epoch": 79} {"train_loss": -17.144519805908203, "global_step": 6626, "epoch": 79} {"train_loss": -17.353620529174805, "global_step": 6627, "epoch": 79} {"train_loss": -17.09256935119629, "global_step": 6628, "epoch": 79} {"train_loss": -16.7114315032959, "global_step": 6629, "epoch": 79} {"train_loss": -16.799612045288086, "global_step": 6630, "epoch": 79} {"train_loss": -17.003868103027344, "global_step": 6631, "epoch": 79} {"train_loss": -17.260324478149414, "global_step": 6632, "epoch": 79} {"train_loss": -16.831735610961914, "global_step": 6633, "epoch": 79} {"train_loss": -16.786163330078125, "global_step": 6634, "epoch": 79} {"train_loss": -16.9082088470459, "global_step": 6635, "epoch": 79} {"train_loss": -17.160856246948242, "global_step": 6636, "epoch": 79} {"train_loss": -17.06561851501465, "global_step": 6637, "epoch": 79} {"train_loss": -17.700679779052734, "global_step": 6638, "epoch": 79} {"train_loss": -17.133989173245716, "global_step": 6639, "epoch": 79, "val_loss": 6753931.0} {"train_loss": -16.929548263549805, "global_step": 6640, "epoch": 80} {"train_loss": -17.45528221130371, "global_step": 6641, "epoch": 80} {"train_loss": -16.69504165649414, "global_step": 6642, "epoch": 80} {"train_loss": -17.04628562927246, "global_step": 6643, "epoch": 80} {"train_loss": -16.801830291748047, "global_step": 6644, "epoch": 80} {"train_loss": -16.968326568603516, "global_step": 6645, "epoch": 80} {"train_loss": -17.023271560668945, "global_step": 6646, "epoch": 80} {"train_loss": -16.828725814819336, "global_step": 6647, "epoch": 80} {"train_loss": -17.20815086364746, "global_step": 6648, "epoch": 80} {"train_loss": -17.054853439331055, "global_step": 6649, "epoch": 80} {"train_loss": -17.145418167114258, "global_step": 6650, "epoch": 80} {"train_loss": -17.20294761657715, "global_step": 6651, "epoch": 80} {"train_loss": -17.068302154541016, "global_step": 6652, "epoch": 80} {"train_loss": -16.75691032409668, "global_step": 6653, "epoch": 80} {"train_loss": -17.056119918823242, "global_step": 6654, "epoch": 80} {"train_loss": -17.181720733642578, "global_step": 6655, "epoch": 80} {"train_loss": -17.119173049926758, "global_step": 6656, "epoch": 80} {"train_loss": -16.848896026611328, "global_step": 6657, "epoch": 80} {"train_loss": -16.873289108276367, "global_step": 6658, "epoch": 80} {"train_loss": -17.33635902404785, "global_step": 6659, "epoch": 80} {"train_loss": -17.131757736206055, "global_step": 6660, "epoch": 80} {"train_loss": -16.83279800415039, "global_step": 6661, "epoch": 80} {"train_loss": -17.21143913269043, "global_step": 6662, "epoch": 80} {"train_loss": -16.94905662536621, "global_step": 6663, "epoch": 80} {"train_loss": -16.54115104675293, "global_step": 6664, "epoch": 80} {"train_loss": -17.082000732421875, "global_step": 6665, "epoch": 80} {"train_loss": -17.131681442260742, "global_step": 6666, "epoch": 80} {"train_loss": -17.166013717651367, "global_step": 6667, "epoch": 80} {"train_loss": -17.34667205810547, "global_step": 6668, "epoch": 80} {"train_loss": -17.091840744018555, "global_step": 6669, "epoch": 80} {"train_loss": -17.219833374023438, "global_step": 6670, "epoch": 80} {"train_loss": -17.1545352935791, "global_step": 6671, "epoch": 80} {"train_loss": -16.636262893676758, "global_step": 6672, "epoch": 80} {"train_loss": -17.256912231445312, "global_step": 6673, "epoch": 80} {"train_loss": -17.33658218383789, "global_step": 6674, "epoch": 80} {"train_loss": -17.65947914123535, "global_step": 6675, "epoch": 80} {"train_loss": -16.986799240112305, "global_step": 6676, "epoch": 80} {"train_loss": -17.072036743164062, "global_step": 6677, "epoch": 80} {"train_loss": -17.5042724609375, "global_step": 6678, "epoch": 80} {"train_loss": -17.440996170043945, "global_step": 6679, "epoch": 80} {"train_loss": -17.506343841552734, "global_step": 6680, "epoch": 80} {"train_loss": -17.043781280517578, "global_step": 6681, "epoch": 80} {"train_loss": -17.110700607299805, "global_step": 6682, "epoch": 80} {"train_loss": -17.538496017456055, "global_step": 6683, "epoch": 80} {"train_loss": -16.940649032592773, "global_step": 6684, "epoch": 80} {"train_loss": -17.218976974487305, "global_step": 6685, "epoch": 80} {"train_loss": -17.37909698486328, "global_step": 6686, "epoch": 80} {"train_loss": -16.918949127197266, "global_step": 6687, "epoch": 80} {"train_loss": -17.302875518798828, "global_step": 6688, "epoch": 80} {"train_loss": -17.121068954467773, "global_step": 6689, "epoch": 80} {"train_loss": -17.158327102661133, "global_step": 6690, "epoch": 80} {"train_loss": -17.177976608276367, "global_step": 6691, "epoch": 80} {"train_loss": -17.21535301208496, "global_step": 6692, "epoch": 80} {"train_loss": -16.70069694519043, "global_step": 6693, "epoch": 80} {"train_loss": -17.238866806030273, "global_step": 6694, "epoch": 80} {"train_loss": -16.933839797973633, "global_step": 6695, "epoch": 80} {"train_loss": -17.374515533447266, "global_step": 6696, "epoch": 80} {"train_loss": -17.27967643737793, "global_step": 6697, "epoch": 80} {"train_loss": -17.04583168029785, "global_step": 6698, "epoch": 80} {"train_loss": -17.427974700927734, "global_step": 6699, "epoch": 80} {"train_loss": -16.86600685119629, "global_step": 6700, "epoch": 80} {"train_loss": -17.551006317138672, "global_step": 6701, "epoch": 80} {"train_loss": -17.01059341430664, "global_step": 6702, "epoch": 80} {"train_loss": -17.51849937438965, "global_step": 6703, "epoch": 80} {"train_loss": -17.111709594726562, "global_step": 6704, "epoch": 80} {"train_loss": -17.179712295532227, "global_step": 6705, "epoch": 80} {"train_loss": -17.366710662841797, "global_step": 6706, "epoch": 80} {"train_loss": -17.240680694580078, "global_step": 6707, "epoch": 80} {"train_loss": -17.1865177154541, "global_step": 6708, "epoch": 80} {"train_loss": -17.33542823791504, "global_step": 6709, "epoch": 80} {"train_loss": -17.138031005859375, "global_step": 6710, "epoch": 80} {"train_loss": -17.00934410095215, "global_step": 6711, "epoch": 80} {"train_loss": -17.192752838134766, "global_step": 6712, "epoch": 80} {"train_loss": -16.97760009765625, "global_step": 6713, "epoch": 80} {"train_loss": -17.486705780029297, "global_step": 6714, "epoch": 80} {"train_loss": -17.005250930786133, "global_step": 6715, "epoch": 80} {"train_loss": -17.20900535583496, "global_step": 6716, "epoch": 80} {"train_loss": -17.14344024658203, "global_step": 6717, "epoch": 80} {"train_loss": -17.1496639251709, "global_step": 6718, "epoch": 80} {"train_loss": -16.91027069091797, "global_step": 6719, "epoch": 80} {"train_loss": -17.393339157104492, "global_step": 6720, "epoch": 80} {"train_loss": -16.935972213745117, "global_step": 6721, "epoch": 80} {"train_loss": -17.14043256460902, "global_step": 6722, "epoch": 80, "val_loss": 6657960.0} {"train_loss": -17.011154174804688, "global_step": 6723, "epoch": 81} {"train_loss": -16.845142364501953, "global_step": 6724, "epoch": 81} {"train_loss": -17.255176544189453, "global_step": 6725, "epoch": 81} {"train_loss": -17.170011520385742, "global_step": 6726, "epoch": 81} {"train_loss": -17.15199851989746, "global_step": 6727, "epoch": 81} {"train_loss": -17.118213653564453, "global_step": 6728, "epoch": 81} {"train_loss": -17.36014175415039, "global_step": 6729, "epoch": 81} {"train_loss": -17.237119674682617, "global_step": 6730, "epoch": 81} {"train_loss": -16.76984214782715, "global_step": 6731, "epoch": 81} {"train_loss": -16.814220428466797, "global_step": 6732, "epoch": 81} {"train_loss": -16.980403900146484, "global_step": 6733, "epoch": 81} {"train_loss": -17.202972412109375, "global_step": 6734, "epoch": 81} {"train_loss": -16.83662223815918, "global_step": 6735, "epoch": 81} {"train_loss": -16.980405807495117, "global_step": 6736, "epoch": 81} {"train_loss": -16.860599517822266, "global_step": 6737, "epoch": 81} {"train_loss": -17.293441772460938, "global_step": 6738, "epoch": 81} {"train_loss": -17.176294326782227, "global_step": 6739, "epoch": 81} {"train_loss": -17.186279296875, "global_step": 6740, "epoch": 81} {"train_loss": -17.15403175354004, "global_step": 6741, "epoch": 81} {"train_loss": -17.120380401611328, "global_step": 6742, "epoch": 81} {"train_loss": -17.224393844604492, "global_step": 6743, "epoch": 81} {"train_loss": -16.993680953979492, "global_step": 6744, "epoch": 81} {"train_loss": -17.300411224365234, "global_step": 6745, "epoch": 81} {"train_loss": -17.284942626953125, "global_step": 6746, "epoch": 81} {"train_loss": -16.896162033081055, "global_step": 6747, "epoch": 81} {"train_loss": -17.226882934570312, "global_step": 6748, "epoch": 81} {"train_loss": -17.107866287231445, "global_step": 6749, "epoch": 81} {"train_loss": -17.118606567382812, "global_step": 6750, "epoch": 81} {"train_loss": -17.115087509155273, "global_step": 6751, "epoch": 81} {"train_loss": -16.912851333618164, "global_step": 6752, "epoch": 81} {"train_loss": -17.187875747680664, "global_step": 6753, "epoch": 81} {"train_loss": -17.08902931213379, "global_step": 6754, "epoch": 81} {"train_loss": -17.192977905273438, "global_step": 6755, "epoch": 81} {"train_loss": -17.323942184448242, "global_step": 6756, "epoch": 81} {"train_loss": -17.356393814086914, "global_step": 6757, "epoch": 81} {"train_loss": -17.218276977539062, "global_step": 6758, "epoch": 81} {"train_loss": -17.249547958374023, "global_step": 6759, "epoch": 81} {"train_loss": -17.33015251159668, "global_step": 6760, "epoch": 81} {"train_loss": -17.374479293823242, "global_step": 6761, "epoch": 81} {"train_loss": -17.137418746948242, "global_step": 6762, "epoch": 81} {"train_loss": -17.022869110107422, "global_step": 6763, "epoch": 81} {"train_loss": -17.285863876342773, "global_step": 6764, "epoch": 81} {"train_loss": -17.00397300720215, "global_step": 6765, "epoch": 81} {"train_loss": -16.74104118347168, "global_step": 6766, "epoch": 81} {"train_loss": -17.171995162963867, "global_step": 6767, "epoch": 81} {"train_loss": -17.479887008666992, "global_step": 6768, "epoch": 81} {"train_loss": -16.953004837036133, "global_step": 6769, "epoch": 81} {"train_loss": -17.339876174926758, "global_step": 6770, "epoch": 81} {"train_loss": -17.111831665039062, "global_step": 6771, "epoch": 81} {"train_loss": -17.004436492919922, "global_step": 6772, "epoch": 81} {"train_loss": -16.994470596313477, "global_step": 6773, "epoch": 81} {"train_loss": -17.102582931518555, "global_step": 6774, "epoch": 81} {"train_loss": -16.96518898010254, "global_step": 6775, "epoch": 81} {"train_loss": -17.388202667236328, "global_step": 6776, "epoch": 81} {"train_loss": -17.013505935668945, "global_step": 6777, "epoch": 81} {"train_loss": -16.94682502746582, "global_step": 6778, "epoch": 81} {"train_loss": -17.34490966796875, "global_step": 6779, "epoch": 81} {"train_loss": -16.983110427856445, "global_step": 6780, "epoch": 81} {"train_loss": -17.041181564331055, "global_step": 6781, "epoch": 81} {"train_loss": -17.080190658569336, "global_step": 6782, "epoch": 81} {"train_loss": -16.685678482055664, "global_step": 6783, "epoch": 81} {"train_loss": -17.381330490112305, "global_step": 6784, "epoch": 81} {"train_loss": -17.42753791809082, "global_step": 6785, "epoch": 81} {"train_loss": -17.104089736938477, "global_step": 6786, "epoch": 81} {"train_loss": -17.050092697143555, "global_step": 6787, "epoch": 81} {"train_loss": -17.137893676757812, "global_step": 6788, "epoch": 81} {"train_loss": -16.828699111938477, "global_step": 6789, "epoch": 81} {"train_loss": -17.01966667175293, "global_step": 6790, "epoch": 81} {"train_loss": -17.12510108947754, "global_step": 6791, "epoch": 81} {"train_loss": -17.203216552734375, "global_step": 6792, "epoch": 81} {"train_loss": -17.31324577331543, "global_step": 6793, "epoch": 81} {"train_loss": -17.455026626586914, "global_step": 6794, "epoch": 81} {"train_loss": -17.2656307220459, "global_step": 6795, "epoch": 81} {"train_loss": -17.091232299804688, "global_step": 6796, "epoch": 81} {"train_loss": -17.286813735961914, "global_step": 6797, "epoch": 81} {"train_loss": -17.46683120727539, "global_step": 6798, "epoch": 81} {"train_loss": -17.291059494018555, "global_step": 6799, "epoch": 81} {"train_loss": -17.137136459350586, "global_step": 6800, "epoch": 81} {"train_loss": -17.13886833190918, "global_step": 6801, "epoch": 81} {"train_loss": -17.14412498474121, "global_step": 6802, "epoch": 81} {"train_loss": -17.46002769470215, "global_step": 6803, "epoch": 81} {"train_loss": -17.390146255493164, "global_step": 6804, "epoch": 81} {"train_loss": -17.145872001188348, "global_step": 6805, "epoch": 81, "val_loss": 6418377.0} {"train_loss": -16.993616104125977, "global_step": 6806, "epoch": 82} {"train_loss": -17.431276321411133, "global_step": 6807, "epoch": 82} {"train_loss": -17.166980743408203, "global_step": 6808, "epoch": 82} {"train_loss": -17.415739059448242, "global_step": 6809, "epoch": 82} {"train_loss": -17.58193016052246, "global_step": 6810, "epoch": 82} {"train_loss": -17.482925415039062, "global_step": 6811, "epoch": 82} {"train_loss": -17.03276824951172, "global_step": 6812, "epoch": 82} {"train_loss": -16.65906524658203, "global_step": 6813, "epoch": 82} {"train_loss": -16.924564361572266, "global_step": 6814, "epoch": 82} {"train_loss": -17.02203941345215, "global_step": 6815, "epoch": 82} {"train_loss": -16.837934494018555, "global_step": 6816, "epoch": 82} {"train_loss": -16.98940086364746, "global_step": 6817, "epoch": 82} {"train_loss": -17.145009994506836, "global_step": 6818, "epoch": 82} {"train_loss": -17.072599411010742, "global_step": 6819, "epoch": 82} {"train_loss": -17.63772964477539, "global_step": 6820, "epoch": 82} {"train_loss": -17.051315307617188, "global_step": 6821, "epoch": 82} {"train_loss": -17.21844482421875, "global_step": 6822, "epoch": 82} {"train_loss": -17.430421829223633, "global_step": 6823, "epoch": 82} {"train_loss": -16.97761344909668, "global_step": 6824, "epoch": 82} {"train_loss": -17.326635360717773, "global_step": 6825, "epoch": 82} {"train_loss": -16.73967933654785, "global_step": 6826, "epoch": 82} {"train_loss": -16.970928192138672, "global_step": 6827, "epoch": 82} {"train_loss": -17.147113800048828, "global_step": 6828, "epoch": 82} {"train_loss": -16.99673843383789, "global_step": 6829, "epoch": 82} {"train_loss": -17.35125160217285, "global_step": 6830, "epoch": 82} {"train_loss": -17.40654945373535, "global_step": 6831, "epoch": 82} {"train_loss": -17.081850051879883, "global_step": 6832, "epoch": 82} {"train_loss": -17.14717674255371, "global_step": 6833, "epoch": 82} {"train_loss": -17.3120174407959, "global_step": 6834, "epoch": 82} {"train_loss": -17.456012725830078, "global_step": 6835, "epoch": 82} {"train_loss": -16.915679931640625, "global_step": 6836, "epoch": 82} {"train_loss": -17.18258285522461, "global_step": 6837, "epoch": 82} {"train_loss": -17.191543579101562, "global_step": 6838, "epoch": 82} {"train_loss": -17.623828887939453, "global_step": 6839, "epoch": 82} {"train_loss": -17.139921188354492, "global_step": 6840, "epoch": 82} {"train_loss": -17.522279739379883, "global_step": 6841, "epoch": 82} {"train_loss": -16.811542510986328, "global_step": 6842, "epoch": 82} {"train_loss": -17.658100128173828, "global_step": 6843, "epoch": 82} {"train_loss": -17.36480712890625, "global_step": 6844, "epoch": 82} {"train_loss": -17.221660614013672, "global_step": 6845, "epoch": 82} {"train_loss": -17.224008560180664, "global_step": 6846, "epoch": 82} {"train_loss": -16.94618797302246, "global_step": 6847, "epoch": 82} {"train_loss": -16.766881942749023, "global_step": 6848, "epoch": 82} {"train_loss": -17.08177375793457, "global_step": 6849, "epoch": 82} {"train_loss": -17.307132720947266, "global_step": 6850, "epoch": 82} {"train_loss": -17.04672622680664, "global_step": 6851, "epoch": 82} {"train_loss": -16.979450225830078, "global_step": 6852, "epoch": 82} {"train_loss": -17.466524124145508, "global_step": 6853, "epoch": 82} {"train_loss": -17.02973747253418, "global_step": 6854, "epoch": 82} {"train_loss": -17.059545516967773, "global_step": 6855, "epoch": 82} {"train_loss": -17.224803924560547, "global_step": 6856, "epoch": 82} {"train_loss": -17.025959014892578, "global_step": 6857, "epoch": 82} {"train_loss": -17.26457977294922, "global_step": 6858, "epoch": 82} {"train_loss": -17.249286651611328, "global_step": 6859, "epoch": 82} {"train_loss": -17.477752685546875, "global_step": 6860, "epoch": 82} {"train_loss": -17.02692222595215, "global_step": 6861, "epoch": 82} {"train_loss": -17.055723190307617, "global_step": 6862, "epoch": 82} {"train_loss": -17.144569396972656, "global_step": 6863, "epoch": 82} {"train_loss": -16.896026611328125, "global_step": 6864, "epoch": 82} {"train_loss": -17.36101722717285, "global_step": 6865, "epoch": 82} {"train_loss": -17.565702438354492, "global_step": 6866, "epoch": 82} {"train_loss": -17.19837760925293, "global_step": 6867, "epoch": 82} {"train_loss": -16.70798110961914, "global_step": 6868, "epoch": 82} {"train_loss": -17.218931198120117, "global_step": 6869, "epoch": 82} {"train_loss": -16.898639678955078, "global_step": 6870, "epoch": 82} {"train_loss": -17.35455322265625, "global_step": 6871, "epoch": 82} {"train_loss": -17.38349723815918, "global_step": 6872, "epoch": 82} {"train_loss": -16.93204116821289, "global_step": 6873, "epoch": 82} {"train_loss": -17.546274185180664, "global_step": 6874, "epoch": 82} {"train_loss": -17.368452072143555, "global_step": 6875, "epoch": 82} {"train_loss": -17.722232818603516, "global_step": 6876, "epoch": 82} {"train_loss": -17.086589813232422, "global_step": 6877, "epoch": 82} {"train_loss": -16.80927848815918, "global_step": 6878, "epoch": 82} {"train_loss": -17.355876922607422, "global_step": 6879, "epoch": 82} {"train_loss": -16.917945861816406, "global_step": 6880, "epoch": 82} {"train_loss": -17.02267837524414, "global_step": 6881, "epoch": 82} {"train_loss": -17.35019302368164, "global_step": 6882, "epoch": 82} {"train_loss": -16.73489761352539, "global_step": 6883, "epoch": 82} {"train_loss": -17.266630172729492, "global_step": 6884, "epoch": 82} {"train_loss": -17.71990394592285, "global_step": 6885, "epoch": 82} {"train_loss": -17.132909774780273, "global_step": 6886, "epoch": 82} {"train_loss": -17.413068771362305, "global_step": 6887, "epoch": 82} {"train_loss": -17.181405515555877, "global_step": 6888, "epoch": 82, "val_loss": 6529155.0} {"train_loss": -17.14839744567871, "global_step": 6889, "epoch": 83} {"train_loss": -16.306303024291992, "global_step": 6890, "epoch": 83} {"train_loss": -17.499940872192383, "global_step": 6891, "epoch": 83} {"train_loss": -17.10598373413086, "global_step": 6892, "epoch": 83} {"train_loss": -17.23373794555664, "global_step": 6893, "epoch": 83} {"train_loss": -17.055803298950195, "global_step": 6894, "epoch": 83} {"train_loss": -16.79644203186035, "global_step": 6895, "epoch": 83} {"train_loss": -17.667966842651367, "global_step": 6896, "epoch": 83} {"train_loss": -16.921159744262695, "global_step": 6897, "epoch": 83} {"train_loss": -16.930919647216797, "global_step": 6898, "epoch": 83} {"train_loss": -16.599119186401367, "global_step": 6899, "epoch": 83} {"train_loss": -17.200727462768555, "global_step": 6900, "epoch": 83} {"train_loss": -17.230031967163086, "global_step": 6901, "epoch": 83} {"train_loss": -17.22372817993164, "global_step": 6902, "epoch": 83} {"train_loss": -17.2800235748291, "global_step": 6903, "epoch": 83} {"train_loss": -17.330829620361328, "global_step": 6904, "epoch": 83} {"train_loss": -17.425947189331055, "global_step": 6905, "epoch": 83} {"train_loss": -17.085811614990234, "global_step": 6906, "epoch": 83} {"train_loss": -17.5363826751709, "global_step": 6907, "epoch": 83} {"train_loss": -17.251514434814453, "global_step": 6908, "epoch": 83} {"train_loss": -17.092069625854492, "global_step": 6909, "epoch": 83} {"train_loss": -16.922128677368164, "global_step": 6910, "epoch": 83} {"train_loss": -16.86936378479004, "global_step": 6911, "epoch": 83} {"train_loss": -16.859663009643555, "global_step": 6912, "epoch": 83} {"train_loss": -16.832265853881836, "global_step": 6913, "epoch": 83} {"train_loss": -17.399179458618164, "global_step": 6914, "epoch": 83} {"train_loss": -17.47669792175293, "global_step": 6915, "epoch": 83} {"train_loss": -17.43939781188965, "global_step": 6916, "epoch": 83} {"train_loss": -16.999826431274414, "global_step": 6917, "epoch": 83} {"train_loss": -17.5478572845459, "global_step": 6918, "epoch": 83} {"train_loss": -16.97621726989746, "global_step": 6919, "epoch": 83} {"train_loss": -16.988771438598633, "global_step": 6920, "epoch": 83} {"train_loss": -17.563812255859375, "global_step": 6921, "epoch": 83} {"train_loss": -16.86730194091797, "global_step": 6922, "epoch": 83} {"train_loss": -16.888721466064453, "global_step": 6923, "epoch": 83} {"train_loss": -17.333932876586914, "global_step": 6924, "epoch": 83} {"train_loss": -17.418081283569336, "global_step": 6925, "epoch": 83} {"train_loss": -17.17831802368164, "global_step": 6926, "epoch": 83} {"train_loss": -17.275466918945312, "global_step": 6927, "epoch": 83} {"train_loss": -17.300012588500977, "global_step": 6928, "epoch": 83} {"train_loss": -17.426054000854492, "global_step": 6929, "epoch": 83} {"train_loss": -17.366724014282227, "global_step": 6930, "epoch": 83} {"train_loss": -17.570898056030273, "global_step": 6931, "epoch": 83} {"train_loss": -17.26436424255371, "global_step": 6932, "epoch": 83} {"train_loss": -17.265241622924805, "global_step": 6933, "epoch": 83} {"train_loss": -17.182083129882812, "global_step": 6934, "epoch": 83} {"train_loss": -17.460947036743164, "global_step": 6935, "epoch": 83} {"train_loss": -17.166318893432617, "global_step": 6936, "epoch": 83} {"train_loss": -17.080533981323242, "global_step": 6937, "epoch": 83} {"train_loss": -16.92168617248535, "global_step": 6938, "epoch": 83} {"train_loss": -17.09958267211914, "global_step": 6939, "epoch": 83} {"train_loss": -17.500516891479492, "global_step": 6940, "epoch": 83} {"train_loss": -16.93524742126465, "global_step": 6941, "epoch": 83} {"train_loss": -17.19816017150879, "global_step": 6942, "epoch": 83} {"train_loss": -16.946691513061523, "global_step": 6943, "epoch": 83} {"train_loss": -16.879941940307617, "global_step": 6944, "epoch": 83} {"train_loss": -17.28515625, "global_step": 6945, "epoch": 83} {"train_loss": -17.314842224121094, "global_step": 6946, "epoch": 83} {"train_loss": -17.09956169128418, "global_step": 6947, "epoch": 83} {"train_loss": -16.772619247436523, "global_step": 6948, "epoch": 83} {"train_loss": -17.611127853393555, "global_step": 6949, "epoch": 83} {"train_loss": -17.26058578491211, "global_step": 6950, "epoch": 83} {"train_loss": -17.598302841186523, "global_step": 6951, "epoch": 83} {"train_loss": -16.884572982788086, "global_step": 6952, "epoch": 83} {"train_loss": -17.354326248168945, "global_step": 6953, "epoch": 83} {"train_loss": -17.477554321289062, "global_step": 6954, "epoch": 83} {"train_loss": -17.10695457458496, "global_step": 6955, "epoch": 83} {"train_loss": -17.264297485351562, "global_step": 6956, "epoch": 83} {"train_loss": -17.333219528198242, "global_step": 6957, "epoch": 83} {"train_loss": -17.20094871520996, "global_step": 6958, "epoch": 83} {"train_loss": -17.413131713867188, "global_step": 6959, "epoch": 83} {"train_loss": -17.29580307006836, "global_step": 6960, "epoch": 83} {"train_loss": -17.377695083618164, "global_step": 6961, "epoch": 83} {"train_loss": -17.164209365844727, "global_step": 6962, "epoch": 83} {"train_loss": -17.32233238220215, "global_step": 6963, "epoch": 83} {"train_loss": -17.84791374206543, "global_step": 6964, "epoch": 83} {"train_loss": -16.8310604095459, "global_step": 6965, "epoch": 83} {"train_loss": -17.36309814453125, "global_step": 6966, "epoch": 83} {"train_loss": -17.324419021606445, "global_step": 6967, "epoch": 83} {"train_loss": -17.374528884887695, "global_step": 6968, "epoch": 83} {"train_loss": -17.340587615966797, "global_step": 6969, "epoch": 83} {"train_loss": -16.406078338623047, "global_step": 6970, "epoch": 83} {"train_loss": -17.206103428300604, "global_step": 6971, "epoch": 83, "val_loss": 6548601.5} {"train_loss": -17.104238510131836, "global_step": 6972, "epoch": 84} {"train_loss": -17.270238876342773, "global_step": 6973, "epoch": 84} {"train_loss": -17.16581916809082, "global_step": 6974, "epoch": 84} {"train_loss": -17.41163444519043, "global_step": 6975, "epoch": 84} {"train_loss": -17.26185417175293, "global_step": 6976, "epoch": 84} {"train_loss": -17.345571517944336, "global_step": 6977, "epoch": 84} {"train_loss": -16.714200973510742, "global_step": 6978, "epoch": 84} {"train_loss": -16.87849235534668, "global_step": 6979, "epoch": 84} {"train_loss": -17.333703994750977, "global_step": 6980, "epoch": 84} {"train_loss": -17.094152450561523, "global_step": 6981, "epoch": 84} {"train_loss": -16.662294387817383, "global_step": 6982, "epoch": 84} {"train_loss": -17.074155807495117, "global_step": 6983, "epoch": 84} {"train_loss": -17.072721481323242, "global_step": 6984, "epoch": 84} {"train_loss": -17.38099479675293, "global_step": 6985, "epoch": 84} {"train_loss": -17.222776412963867, "global_step": 6986, "epoch": 84} {"train_loss": -17.214994430541992, "global_step": 6987, "epoch": 84} {"train_loss": -16.834882736206055, "global_step": 6988, "epoch": 84} {"train_loss": -17.32501983642578, "global_step": 6989, "epoch": 84} {"train_loss": -17.194177627563477, "global_step": 6990, "epoch": 84} {"train_loss": -17.001968383789062, "global_step": 6991, "epoch": 84} {"train_loss": -17.365909576416016, "global_step": 6992, "epoch": 84} {"train_loss": -17.118032455444336, "global_step": 6993, "epoch": 84} {"train_loss": -16.835033416748047, "global_step": 6994, "epoch": 84} {"train_loss": -17.141721725463867, "global_step": 6995, "epoch": 84} {"train_loss": -17.130029678344727, "global_step": 6996, "epoch": 84} {"train_loss": -16.975055694580078, "global_step": 6997, "epoch": 84} {"train_loss": -17.26239776611328, "global_step": 6998, "epoch": 84} {"train_loss": -16.883832931518555, "global_step": 6999, "epoch": 84} {"train_loss": -17.360637664794922, "global_step": 7000, "epoch": 84} {"train_loss": -17.025588989257812, "global_step": 7001, "epoch": 84} {"train_loss": -16.90752601623535, "global_step": 7002, "epoch": 84} {"train_loss": -17.22688102722168, "global_step": 7003, "epoch": 84} {"train_loss": -17.017702102661133, "global_step": 7004, "epoch": 84} {"train_loss": -17.37125587463379, "global_step": 7005, "epoch": 84} {"train_loss": -16.96881103515625, "global_step": 7006, "epoch": 84} {"train_loss": -17.119455337524414, "global_step": 7007, "epoch": 84} {"train_loss": -17.47859764099121, "global_step": 7008, "epoch": 84} {"train_loss": -17.59259033203125, "global_step": 7009, "epoch": 84} {"train_loss": -17.239938735961914, "global_step": 7010, "epoch": 84} {"train_loss": -17.428770065307617, "global_step": 7011, "epoch": 84} {"train_loss": -17.538925170898438, "global_step": 7012, "epoch": 84} {"train_loss": -17.14227867126465, "global_step": 7013, "epoch": 84} {"train_loss": -17.20355224609375, "global_step": 7014, "epoch": 84} {"train_loss": -17.12354850769043, "global_step": 7015, "epoch": 84} {"train_loss": -16.98574447631836, "global_step": 7016, "epoch": 84} {"train_loss": -17.2753963470459, "global_step": 7017, "epoch": 84} {"train_loss": -16.925405502319336, "global_step": 7018, "epoch": 84} {"train_loss": -17.27662467956543, "global_step": 7019, "epoch": 84} {"train_loss": -17.412494659423828, "global_step": 7020, "epoch": 84} {"train_loss": -17.23221778869629, "global_step": 7021, "epoch": 84} {"train_loss": -17.27117347717285, "global_step": 7022, "epoch": 84} {"train_loss": -17.479352951049805, "global_step": 7023, "epoch": 84} {"train_loss": -17.462997436523438, "global_step": 7024, "epoch": 84} {"train_loss": -17.049612045288086, "global_step": 7025, "epoch": 84} {"train_loss": -17.017457962036133, "global_step": 7026, "epoch": 84} {"train_loss": -17.197803497314453, "global_step": 7027, "epoch": 84} {"train_loss": -17.068029403686523, "global_step": 7028, "epoch": 84} {"train_loss": -17.161724090576172, "global_step": 7029, "epoch": 84} {"train_loss": -17.081714630126953, "global_step": 7030, "epoch": 84} {"train_loss": -17.161182403564453, "global_step": 7031, "epoch": 84} {"train_loss": -16.859973907470703, "global_step": 7032, "epoch": 84} {"train_loss": -17.727161407470703, "global_step": 7033, "epoch": 84} {"train_loss": -17.05744743347168, "global_step": 7034, "epoch": 84} {"train_loss": -17.463220596313477, "global_step": 7035, "epoch": 84} {"train_loss": -17.45206642150879, "global_step": 7036, "epoch": 84} {"train_loss": -17.237592697143555, "global_step": 7037, "epoch": 84} {"train_loss": -16.941146850585938, "global_step": 7038, "epoch": 84} {"train_loss": -17.08089828491211, "global_step": 7039, "epoch": 84} {"train_loss": -17.08505630493164, "global_step": 7040, "epoch": 84} {"train_loss": -17.197311401367188, "global_step": 7041, "epoch": 84} {"train_loss": -17.367450714111328, "global_step": 7042, "epoch": 84} {"train_loss": -17.20804214477539, "global_step": 7043, "epoch": 84} {"train_loss": -17.663055419921875, "global_step": 7044, "epoch": 84} {"train_loss": -17.308767318725586, "global_step": 7045, "epoch": 84} {"train_loss": -17.33680534362793, "global_step": 7046, "epoch": 84} {"train_loss": -17.19379234313965, "global_step": 7047, "epoch": 84} {"train_loss": -17.388301849365234, "global_step": 7048, "epoch": 84} {"train_loss": -17.29982566833496, "global_step": 7049, "epoch": 84} {"train_loss": -17.726322174072266, "global_step": 7050, "epoch": 84} {"train_loss": -17.762266159057617, "global_step": 7051, "epoch": 84} {"train_loss": -16.92925262451172, "global_step": 7052, "epoch": 84} {"train_loss": -17.265655517578125, "global_step": 7053, "epoch": 84} {"train_loss": -17.192656505538757, "global_step": 7054, "epoch": 84, "val_loss": 6463110.0} {"train_loss": -17.142383575439453, "global_step": 7055, "epoch": 85} {"train_loss": -17.32781410217285, "global_step": 7056, "epoch": 85} {"train_loss": -17.311147689819336, "global_step": 7057, "epoch": 85} {"train_loss": -17.076807022094727, "global_step": 7058, "epoch": 85} {"train_loss": -17.25177764892578, "global_step": 7059, "epoch": 85} {"train_loss": -17.220182418823242, "global_step": 7060, "epoch": 85} {"train_loss": -17.359865188598633, "global_step": 7061, "epoch": 85} {"train_loss": -16.820112228393555, "global_step": 7062, "epoch": 85} {"train_loss": -17.023784637451172, "global_step": 7063, "epoch": 85} {"train_loss": -17.24549674987793, "global_step": 7064, "epoch": 85} {"train_loss": -16.97125816345215, "global_step": 7065, "epoch": 85} {"train_loss": -16.943496704101562, "global_step": 7066, "epoch": 85} {"train_loss": -17.272043228149414, "global_step": 7067, "epoch": 85} {"train_loss": -17.106597900390625, "global_step": 7068, "epoch": 85} {"train_loss": -16.89204978942871, "global_step": 7069, "epoch": 85} {"train_loss": -17.397232055664062, "global_step": 7070, "epoch": 85} {"train_loss": -16.945144653320312, "global_step": 7071, "epoch": 85} {"train_loss": -17.181987762451172, "global_step": 7072, "epoch": 85} {"train_loss": -17.04387855529785, "global_step": 7073, "epoch": 85} {"train_loss": -17.453746795654297, "global_step": 7074, "epoch": 85} {"train_loss": -17.453739166259766, "global_step": 7075, "epoch": 85} {"train_loss": -16.8079833984375, "global_step": 7076, "epoch": 85} {"train_loss": -16.959211349487305, "global_step": 7077, "epoch": 85} {"train_loss": -17.37869644165039, "global_step": 7078, "epoch": 85} {"train_loss": -17.382596969604492, "global_step": 7079, "epoch": 85} {"train_loss": -17.120037078857422, "global_step": 7080, "epoch": 85} {"train_loss": -17.397985458374023, "global_step": 7081, "epoch": 85} {"train_loss": -17.27634620666504, "global_step": 7082, "epoch": 85} {"train_loss": -17.5771484375, "global_step": 7083, "epoch": 85} {"train_loss": -17.35762596130371, "global_step": 7084, "epoch": 85} {"train_loss": -17.20721435546875, "global_step": 7085, "epoch": 85} {"train_loss": -17.44637107849121, "global_step": 7086, "epoch": 85} {"train_loss": -17.839353561401367, "global_step": 7087, "epoch": 85} {"train_loss": -17.203765869140625, "global_step": 7088, "epoch": 85} {"train_loss": -17.108320236206055, "global_step": 7089, "epoch": 85} {"train_loss": -17.217153549194336, "global_step": 7090, "epoch": 85} {"train_loss": -17.4306697845459, "global_step": 7091, "epoch": 85} {"train_loss": -17.21341896057129, "global_step": 7092, "epoch": 85} {"train_loss": -17.094594955444336, "global_step": 7093, "epoch": 85} {"train_loss": -17.589262008666992, "global_step": 7094, "epoch": 85} {"train_loss": -17.272302627563477, "global_step": 7095, "epoch": 85} {"train_loss": -17.551427841186523, "global_step": 7096, "epoch": 85} {"train_loss": -17.237154006958008, "global_step": 7097, "epoch": 85} {"train_loss": -17.19815444946289, "global_step": 7098, "epoch": 85} {"train_loss": -17.300024032592773, "global_step": 7099, "epoch": 85} {"train_loss": -17.1773624420166, "global_step": 7100, "epoch": 85} {"train_loss": -17.36981964111328, "global_step": 7101, "epoch": 85} {"train_loss": -17.07079315185547, "global_step": 7102, "epoch": 85} {"train_loss": -17.51460838317871, "global_step": 7103, "epoch": 85} {"train_loss": -17.28518295288086, "global_step": 7104, "epoch": 85} {"train_loss": -17.006200790405273, "global_step": 7105, "epoch": 85} {"train_loss": -17.272363662719727, "global_step": 7106, "epoch": 85} {"train_loss": -17.31545066833496, "global_step": 7107, "epoch": 85} {"train_loss": -17.068086624145508, "global_step": 7108, "epoch": 85} {"train_loss": -17.13160514831543, "global_step": 7109, "epoch": 85} {"train_loss": -17.403852462768555, "global_step": 7110, "epoch": 85} {"train_loss": -17.250507354736328, "global_step": 7111, "epoch": 85} {"train_loss": -17.03217887878418, "global_step": 7112, "epoch": 85} {"train_loss": -17.086551666259766, "global_step": 7113, "epoch": 85} {"train_loss": -17.437368392944336, "global_step": 7114, "epoch": 85} {"train_loss": -17.13301658630371, "global_step": 7115, "epoch": 85} {"train_loss": -17.531888961791992, "global_step": 7116, "epoch": 85} {"train_loss": -16.863807678222656, "global_step": 7117, "epoch": 85} {"train_loss": -17.308034896850586, "global_step": 7118, "epoch": 85} {"train_loss": -17.16036033630371, "global_step": 7119, "epoch": 85} {"train_loss": -17.406553268432617, "global_step": 7120, "epoch": 85} {"train_loss": -17.293668746948242, "global_step": 7121, "epoch": 85} {"train_loss": -17.438133239746094, "global_step": 7122, "epoch": 85} {"train_loss": -17.145214080810547, "global_step": 7123, "epoch": 85} {"train_loss": -17.193622589111328, "global_step": 7124, "epoch": 85} {"train_loss": -17.153560638427734, "global_step": 7125, "epoch": 85} {"train_loss": -17.115802764892578, "global_step": 7126, "epoch": 85} {"train_loss": -17.252958297729492, "global_step": 7127, "epoch": 85} {"train_loss": -17.202312469482422, "global_step": 7128, "epoch": 85} {"train_loss": -17.285003662109375, "global_step": 7129, "epoch": 85} {"train_loss": -17.364540100097656, "global_step": 7130, "epoch": 85} {"train_loss": -17.26400375366211, "global_step": 7131, "epoch": 85} {"train_loss": -17.016538619995117, "global_step": 7132, "epoch": 85} {"train_loss": -17.28196907043457, "global_step": 7133, "epoch": 85} {"train_loss": -17.20644187927246, "global_step": 7134, "epoch": 85} {"train_loss": -17.101795196533203, "global_step": 7135, "epoch": 85} {"train_loss": -17.320621490478516, "global_step": 7136, "epoch": 85} {"train_loss": -17.252745685807195, "global_step": 7137, "epoch": 85, "val_loss": 6864198.0} {"train_loss": -17.242431640625, "global_step": 7138, "epoch": 86} {"train_loss": -17.30771827697754, "global_step": 7139, "epoch": 86} {"train_loss": -16.928312301635742, "global_step": 7140, "epoch": 86} {"train_loss": -17.07917594909668, "global_step": 7141, "epoch": 86} {"train_loss": -17.11470603942871, "global_step": 7142, "epoch": 86} {"train_loss": -17.122756958007812, "global_step": 7143, "epoch": 86} {"train_loss": -17.029951095581055, "global_step": 7144, "epoch": 86} {"train_loss": -17.226806640625, "global_step": 7145, "epoch": 86} {"train_loss": -16.769147872924805, "global_step": 7146, "epoch": 86} {"train_loss": -16.8736572265625, "global_step": 7147, "epoch": 86} {"train_loss": -17.105344772338867, "global_step": 7148, "epoch": 86} {"train_loss": -17.163124084472656, "global_step": 7149, "epoch": 86} {"train_loss": -17.462249755859375, "global_step": 7150, "epoch": 86} {"train_loss": -17.622949600219727, "global_step": 7151, "epoch": 86} {"train_loss": -17.114213943481445, "global_step": 7152, "epoch": 86} {"train_loss": -17.12078285217285, "global_step": 7153, "epoch": 86} {"train_loss": -17.51581382751465, "global_step": 7154, "epoch": 86} {"train_loss": -17.238346099853516, "global_step": 7155, "epoch": 86} {"train_loss": -17.16275405883789, "global_step": 7156, "epoch": 86} {"train_loss": -16.87896156311035, "global_step": 7157, "epoch": 86} {"train_loss": -17.392093658447266, "global_step": 7158, "epoch": 86} {"train_loss": -17.540813446044922, "global_step": 7159, "epoch": 86} {"train_loss": -17.47811508178711, "global_step": 7160, "epoch": 86} {"train_loss": -17.281156539916992, "global_step": 7161, "epoch": 86} {"train_loss": -16.950366973876953, "global_step": 7162, "epoch": 86} {"train_loss": -17.111982345581055, "global_step": 7163, "epoch": 86} {"train_loss": -17.0018310546875, "global_step": 7164, "epoch": 86} {"train_loss": -17.43088150024414, "global_step": 7165, "epoch": 86} {"train_loss": -16.870145797729492, "global_step": 7166, "epoch": 86} {"train_loss": -17.45171356201172, "global_step": 7167, "epoch": 86} {"train_loss": -17.08175277709961, "global_step": 7168, "epoch": 86} {"train_loss": -17.289865493774414, "global_step": 7169, "epoch": 86} {"train_loss": -17.54782485961914, "global_step": 7170, "epoch": 86} {"train_loss": -17.4167537689209, "global_step": 7171, "epoch": 86} {"train_loss": -17.3746395111084, "global_step": 7172, "epoch": 86} {"train_loss": -17.301939010620117, "global_step": 7173, "epoch": 86} {"train_loss": -17.4551944732666, "global_step": 7174, "epoch": 86} {"train_loss": -16.903547286987305, "global_step": 7175, "epoch": 86} {"train_loss": -17.028417587280273, "global_step": 7176, "epoch": 86} {"train_loss": -17.18362808227539, "global_step": 7177, "epoch": 86} {"train_loss": -16.976999282836914, "global_step": 7178, "epoch": 86} {"train_loss": -17.23002052307129, "global_step": 7179, "epoch": 86} {"train_loss": -17.17806053161621, "global_step": 7180, "epoch": 86} {"train_loss": -17.440275192260742, "global_step": 7181, "epoch": 86} {"train_loss": -17.388113021850586, "global_step": 7182, "epoch": 86} {"train_loss": -17.128610610961914, "global_step": 7183, "epoch": 86} {"train_loss": -17.492719650268555, "global_step": 7184, "epoch": 86} {"train_loss": -17.175800323486328, "global_step": 7185, "epoch": 86} {"train_loss": -17.244674682617188, "global_step": 7186, "epoch": 86} {"train_loss": -17.360204696655273, "global_step": 7187, "epoch": 86} {"train_loss": -17.724294662475586, "global_step": 7188, "epoch": 86} {"train_loss": -17.276973724365234, "global_step": 7189, "epoch": 86} {"train_loss": -17.047704696655273, "global_step": 7190, "epoch": 86} {"train_loss": -17.2175350189209, "global_step": 7191, "epoch": 86} {"train_loss": -16.766773223876953, "global_step": 7192, "epoch": 86} {"train_loss": -17.334217071533203, "global_step": 7193, "epoch": 86} {"train_loss": -17.22153091430664, "global_step": 7194, "epoch": 86} {"train_loss": -17.363231658935547, "global_step": 7195, "epoch": 86} {"train_loss": -17.398141860961914, "global_step": 7196, "epoch": 86} {"train_loss": -17.23308753967285, "global_step": 7197, "epoch": 86} {"train_loss": -17.298410415649414, "global_step": 7198, "epoch": 86} {"train_loss": -17.168434143066406, "global_step": 7199, "epoch": 86} {"train_loss": -17.195236206054688, "global_step": 7200, "epoch": 86} {"train_loss": -17.408340454101562, "global_step": 7201, "epoch": 86} {"train_loss": -17.532840728759766, "global_step": 7202, "epoch": 86} {"train_loss": -16.789289474487305, "global_step": 7203, "epoch": 86} {"train_loss": -17.371320724487305, "global_step": 7204, "epoch": 86} {"train_loss": -17.702085494995117, "global_step": 7205, "epoch": 86} {"train_loss": -17.262121200561523, "global_step": 7206, "epoch": 86} {"train_loss": -17.467538833618164, "global_step": 7207, "epoch": 86} {"train_loss": -16.879348754882812, "global_step": 7208, "epoch": 86} {"train_loss": -16.909807205200195, "global_step": 7209, "epoch": 86} {"train_loss": -17.343860626220703, "global_step": 7210, "epoch": 86} {"train_loss": -17.270933151245117, "global_step": 7211, "epoch": 86} {"train_loss": -17.249675750732422, "global_step": 7212, "epoch": 86} {"train_loss": -17.402620315551758, "global_step": 7213, "epoch": 86} {"train_loss": -17.376203536987305, "global_step": 7214, "epoch": 86} {"train_loss": -16.915746688842773, "global_step": 7215, "epoch": 86} {"train_loss": -17.029720306396484, "global_step": 7216, "epoch": 86} {"train_loss": -17.296167373657227, "global_step": 7217, "epoch": 86} {"train_loss": -17.216596603393555, "global_step": 7218, "epoch": 86} {"train_loss": -17.172800064086914, "global_step": 7219, "epoch": 86} {"train_loss": -17.23158464087061, "global_step": 7220, "epoch": 86, "val_loss": 6525383.0} {"train_loss": -16.65720558166504, "global_step": 7221, "epoch": 87} {"train_loss": -17.5707950592041, "global_step": 7222, "epoch": 87} {"train_loss": -16.91392707824707, "global_step": 7223, "epoch": 87} {"train_loss": -17.376808166503906, "global_step": 7224, "epoch": 87} {"train_loss": -16.720739364624023, "global_step": 7225, "epoch": 87} {"train_loss": -16.81662940979004, "global_step": 7226, "epoch": 87} {"train_loss": -17.570323944091797, "global_step": 7227, "epoch": 87} {"train_loss": -17.28754997253418, "global_step": 7228, "epoch": 87} {"train_loss": -17.31269645690918, "global_step": 7229, "epoch": 87} {"train_loss": -16.819456100463867, "global_step": 7230, "epoch": 87} {"train_loss": -17.09232521057129, "global_step": 7231, "epoch": 87} {"train_loss": -17.564544677734375, "global_step": 7232, "epoch": 87} {"train_loss": -16.872875213623047, "global_step": 7233, "epoch": 87} {"train_loss": -17.468250274658203, "global_step": 7234, "epoch": 87} {"train_loss": -17.26901626586914, "global_step": 7235, "epoch": 87} {"train_loss": -17.085351943969727, "global_step": 7236, "epoch": 87} {"train_loss": -17.31720733642578, "global_step": 7237, "epoch": 87} {"train_loss": -17.319284439086914, "global_step": 7238, "epoch": 87} {"train_loss": -17.0681209564209, "global_step": 7239, "epoch": 87} {"train_loss": -17.31703758239746, "global_step": 7240, "epoch": 87} {"train_loss": -17.40730857849121, "global_step": 7241, "epoch": 87} {"train_loss": -17.3543643951416, "global_step": 7242, "epoch": 87} {"train_loss": -16.98893928527832, "global_step": 7243, "epoch": 87} {"train_loss": -17.272621154785156, "global_step": 7244, "epoch": 87} {"train_loss": -17.470319747924805, "global_step": 7245, "epoch": 87} {"train_loss": -17.546173095703125, "global_step": 7246, "epoch": 87} {"train_loss": -17.616552352905273, "global_step": 7247, "epoch": 87} {"train_loss": -17.349079132080078, "global_step": 7248, "epoch": 87} {"train_loss": -17.10752296447754, "global_step": 7249, "epoch": 87} {"train_loss": -17.135112762451172, "global_step": 7250, "epoch": 87} {"train_loss": -17.410486221313477, "global_step": 7251, "epoch": 87} {"train_loss": -17.549829483032227, "global_step": 7252, "epoch": 87} {"train_loss": -17.46123695373535, "global_step": 7253, "epoch": 87} {"train_loss": -17.134260177612305, "global_step": 7254, "epoch": 87} {"train_loss": -16.97945213317871, "global_step": 7255, "epoch": 87} {"train_loss": -17.346927642822266, "global_step": 7256, "epoch": 87} {"train_loss": -17.15009117126465, "global_step": 7257, "epoch": 87} {"train_loss": -17.274076461791992, "global_step": 7258, "epoch": 87} {"train_loss": -17.365285873413086, "global_step": 7259, "epoch": 87} {"train_loss": -17.49756622314453, "global_step": 7260, "epoch": 87} {"train_loss": -17.640317916870117, "global_step": 7261, "epoch": 87} {"train_loss": -16.984155654907227, "global_step": 7262, "epoch": 87} {"train_loss": -17.5009708404541, "global_step": 7263, "epoch": 87} {"train_loss": -17.33804702758789, "global_step": 7264, "epoch": 87} {"train_loss": -17.533084869384766, "global_step": 7265, "epoch": 87} {"train_loss": -17.34819984436035, "global_step": 7266, "epoch": 87} {"train_loss": -16.97589683532715, "global_step": 7267, "epoch": 87} {"train_loss": -17.459060668945312, "global_step": 7268, "epoch": 87} {"train_loss": -17.741342544555664, "global_step": 7269, "epoch": 87} {"train_loss": -17.19251251220703, "global_step": 7270, "epoch": 87} {"train_loss": -17.172870635986328, "global_step": 7271, "epoch": 87} {"train_loss": -17.462356567382812, "global_step": 7272, "epoch": 87} {"train_loss": -17.48283576965332, "global_step": 7273, "epoch": 87} {"train_loss": -17.6259708404541, "global_step": 7274, "epoch": 87} {"train_loss": -17.419706344604492, "global_step": 7275, "epoch": 87} {"train_loss": -17.37578010559082, "global_step": 7276, "epoch": 87} {"train_loss": -17.130380630493164, "global_step": 7277, "epoch": 87} {"train_loss": -17.25352668762207, "global_step": 7278, "epoch": 87} {"train_loss": -17.07375144958496, "global_step": 7279, "epoch": 87} {"train_loss": -17.351791381835938, "global_step": 7280, "epoch": 87} {"train_loss": -17.07948112487793, "global_step": 7281, "epoch": 87} {"train_loss": -17.181976318359375, "global_step": 7282, "epoch": 87} {"train_loss": -17.30751609802246, "global_step": 7283, "epoch": 87} {"train_loss": -17.271926879882812, "global_step": 7284, "epoch": 87} {"train_loss": -17.561552047729492, "global_step": 7285, "epoch": 87} {"train_loss": -17.399215698242188, "global_step": 7286, "epoch": 87} {"train_loss": -17.068212509155273, "global_step": 7287, "epoch": 87} {"train_loss": -17.36130142211914, "global_step": 7288, "epoch": 87} {"train_loss": -17.630212783813477, "global_step": 7289, "epoch": 87} {"train_loss": -17.169458389282227, "global_step": 7290, "epoch": 87} {"train_loss": -17.527509689331055, "global_step": 7291, "epoch": 87} {"train_loss": -17.05661392211914, "global_step": 7292, "epoch": 87} {"train_loss": -17.12037467956543, "global_step": 7293, "epoch": 87} {"train_loss": -17.320165634155273, "global_step": 7294, "epoch": 87} {"train_loss": -17.05557632446289, "global_step": 7295, "epoch": 87} {"train_loss": -17.10321617126465, "global_step": 7296, "epoch": 87} {"train_loss": -17.045637130737305, "global_step": 7297, "epoch": 87} {"train_loss": -17.278244018554688, "global_step": 7298, "epoch": 87} {"train_loss": -17.38675880432129, "global_step": 7299, "epoch": 87} {"train_loss": -17.110736846923828, "global_step": 7300, "epoch": 87} {"train_loss": -17.22005844116211, "global_step": 7301, "epoch": 87} {"train_loss": -17.47433853149414, "global_step": 7302, "epoch": 87} {"train_loss": -17.25759236209364, "global_step": 7303, "epoch": 87, "val_loss": 6347111.0} {"train_loss": -17.306726455688477, "global_step": 7304, "epoch": 88} {"train_loss": -17.503826141357422, "global_step": 7305, "epoch": 88} {"train_loss": -16.936908721923828, "global_step": 7306, "epoch": 88} {"train_loss": -17.217016220092773, "global_step": 7307, "epoch": 88} {"train_loss": -16.937536239624023, "global_step": 7308, "epoch": 88} {"train_loss": -17.197174072265625, "global_step": 7309, "epoch": 88} {"train_loss": -16.784399032592773, "global_step": 7310, "epoch": 88} {"train_loss": -17.191020965576172, "global_step": 7311, "epoch": 88} {"train_loss": -17.387786865234375, "global_step": 7312, "epoch": 88} {"train_loss": -17.270063400268555, "global_step": 7313, "epoch": 88} {"train_loss": -17.3621883392334, "global_step": 7314, "epoch": 88} {"train_loss": -17.001447677612305, "global_step": 7315, "epoch": 88} {"train_loss": -17.401121139526367, "global_step": 7316, "epoch": 88} {"train_loss": -17.384798049926758, "global_step": 7317, "epoch": 88} {"train_loss": -17.236581802368164, "global_step": 7318, "epoch": 88} {"train_loss": -17.582944869995117, "global_step": 7319, "epoch": 88} {"train_loss": -17.562570571899414, "global_step": 7320, "epoch": 88} {"train_loss": -16.880098342895508, "global_step": 7321, "epoch": 88} {"train_loss": -17.344566345214844, "global_step": 7322, "epoch": 88} {"train_loss": -17.06791114807129, "global_step": 7323, "epoch": 88} {"train_loss": -17.559005737304688, "global_step": 7324, "epoch": 88} {"train_loss": -16.768512725830078, "global_step": 7325, "epoch": 88} {"train_loss": -17.37558364868164, "global_step": 7326, "epoch": 88} {"train_loss": -16.674123764038086, "global_step": 7327, "epoch": 88} {"train_loss": -17.319366455078125, "global_step": 7328, "epoch": 88} {"train_loss": -17.266372680664062, "global_step": 7329, "epoch": 88} {"train_loss": -17.513044357299805, "global_step": 7330, "epoch": 88} {"train_loss": -17.256393432617188, "global_step": 7331, "epoch": 88} {"train_loss": -16.853872299194336, "global_step": 7332, "epoch": 88} {"train_loss": -17.12660026550293, "global_step": 7333, "epoch": 88} {"train_loss": -17.283445358276367, "global_step": 7334, "epoch": 88} {"train_loss": -17.25351333618164, "global_step": 7335, "epoch": 88} {"train_loss": -17.380563735961914, "global_step": 7336, "epoch": 88} {"train_loss": -17.478315353393555, "global_step": 7337, "epoch": 88} {"train_loss": -17.31561851501465, "global_step": 7338, "epoch": 88} {"train_loss": -17.414140701293945, "global_step": 7339, "epoch": 88} {"train_loss": -17.45136070251465, "global_step": 7340, "epoch": 88} {"train_loss": -17.691181182861328, "global_step": 7341, "epoch": 88} {"train_loss": -17.21299171447754, "global_step": 7342, "epoch": 88} {"train_loss": -17.12015151977539, "global_step": 7343, "epoch": 88} {"train_loss": -17.289697647094727, "global_step": 7344, "epoch": 88} {"train_loss": -17.12764549255371, "global_step": 7345, "epoch": 88} {"train_loss": -17.355615615844727, "global_step": 7346, "epoch": 88} {"train_loss": -17.42534637451172, "global_step": 7347, "epoch": 88} {"train_loss": -17.407949447631836, "global_step": 7348, "epoch": 88} {"train_loss": -16.99484634399414, "global_step": 7349, "epoch": 88} {"train_loss": -17.423280715942383, "global_step": 7350, "epoch": 88} {"train_loss": -17.20086669921875, "global_step": 7351, "epoch": 88} {"train_loss": -17.368558883666992, "global_step": 7352, "epoch": 88} {"train_loss": -16.895456314086914, "global_step": 7353, "epoch": 88} {"train_loss": -17.23809051513672, "global_step": 7354, "epoch": 88} {"train_loss": -17.21585464477539, "global_step": 7355, "epoch": 88} {"train_loss": -17.36708641052246, "global_step": 7356, "epoch": 88} {"train_loss": -17.5596866607666, "global_step": 7357, "epoch": 88} {"train_loss": -17.535472869873047, "global_step": 7358, "epoch": 88} {"train_loss": -17.38020896911621, "global_step": 7359, "epoch": 88} {"train_loss": -17.636371612548828, "global_step": 7360, "epoch": 88} {"train_loss": -17.18121910095215, "global_step": 7361, "epoch": 88} {"train_loss": -17.487905502319336, "global_step": 7362, "epoch": 88} {"train_loss": -17.437091827392578, "global_step": 7363, "epoch": 88} {"train_loss": -16.957849502563477, "global_step": 7364, "epoch": 88} {"train_loss": -17.44154930114746, "global_step": 7365, "epoch": 88} {"train_loss": -17.402456283569336, "global_step": 7366, "epoch": 88} {"train_loss": -17.17903709411621, "global_step": 7367, "epoch": 88} {"train_loss": -17.28769302368164, "global_step": 7368, "epoch": 88} {"train_loss": -17.25999641418457, "global_step": 7369, "epoch": 88} {"train_loss": -17.405004501342773, "global_step": 7370, "epoch": 88} {"train_loss": -17.23651695251465, "global_step": 7371, "epoch": 88} {"train_loss": -17.14850425720215, "global_step": 7372, "epoch": 88} {"train_loss": -17.70302391052246, "global_step": 7373, "epoch": 88} {"train_loss": -17.565927505493164, "global_step": 7374, "epoch": 88} {"train_loss": -17.393875122070312, "global_step": 7375, "epoch": 88} {"train_loss": -17.096271514892578, "global_step": 7376, "epoch": 88} {"train_loss": -17.299976348876953, "global_step": 7377, "epoch": 88} {"train_loss": -17.40574073791504, "global_step": 7378, "epoch": 88} {"train_loss": -17.349416732788086, "global_step": 7379, "epoch": 88} {"train_loss": -17.282136917114258, "global_step": 7380, "epoch": 88} {"train_loss": -17.011032104492188, "global_step": 7381, "epoch": 88} {"train_loss": -16.822757720947266, "global_step": 7382, "epoch": 88} {"train_loss": -17.411874771118164, "global_step": 7383, "epoch": 88} {"train_loss": -17.072038650512695, "global_step": 7384, "epoch": 88} {"train_loss": -16.86988639831543, "global_step": 7385, "epoch": 88} {"train_loss": -17.277308084878577, "global_step": 7386, "epoch": 88, "val_loss": 6342447.0} {"train_loss": -17.090103149414062, "global_step": 7387, "epoch": 89} {"train_loss": -17.246780395507812, "global_step": 7388, "epoch": 89} {"train_loss": -16.977344512939453, "global_step": 7389, "epoch": 89} {"train_loss": -16.9240665435791, "global_step": 7390, "epoch": 89} {"train_loss": -17.054244995117188, "global_step": 7391, "epoch": 89} {"train_loss": -17.220993041992188, "global_step": 7392, "epoch": 89} {"train_loss": -16.686872482299805, "global_step": 7393, "epoch": 89} {"train_loss": -16.969911575317383, "global_step": 7394, "epoch": 89} {"train_loss": -17.091758728027344, "global_step": 7395, "epoch": 89} {"train_loss": -16.898452758789062, "global_step": 7396, "epoch": 89} {"train_loss": -17.27789306640625, "global_step": 7397, "epoch": 89} {"train_loss": -17.175344467163086, "global_step": 7398, "epoch": 89} {"train_loss": -17.3775691986084, "global_step": 7399, "epoch": 89} {"train_loss": -17.23651695251465, "global_step": 7400, "epoch": 89} {"train_loss": -16.793256759643555, "global_step": 7401, "epoch": 89} {"train_loss": -17.28864097595215, "global_step": 7402, "epoch": 89} {"train_loss": -17.393966674804688, "global_step": 7403, "epoch": 89} {"train_loss": -17.18532371520996, "global_step": 7404, "epoch": 89} {"train_loss": -16.9542293548584, "global_step": 7405, "epoch": 89} {"train_loss": -16.893239974975586, "global_step": 7406, "epoch": 89} {"train_loss": -17.62204933166504, "global_step": 7407, "epoch": 89} {"train_loss": -17.210689544677734, "global_step": 7408, "epoch": 89} {"train_loss": -17.333864212036133, "global_step": 7409, "epoch": 89} {"train_loss": -17.591571807861328, "global_step": 7410, "epoch": 89} {"train_loss": -17.50311851501465, "global_step": 7411, "epoch": 89} {"train_loss": -17.30519676208496, "global_step": 7412, "epoch": 89} {"train_loss": -17.133258819580078, "global_step": 7413, "epoch": 89} {"train_loss": -17.547100067138672, "global_step": 7414, "epoch": 89} {"train_loss": -17.440580368041992, "global_step": 7415, "epoch": 89} {"train_loss": -17.072290420532227, "global_step": 7416, "epoch": 89} {"train_loss": -17.21824073791504, "global_step": 7417, "epoch": 89} {"train_loss": -17.64994239807129, "global_step": 7418, "epoch": 89} {"train_loss": -17.47907829284668, "global_step": 7419, "epoch": 89} {"train_loss": -17.729785919189453, "global_step": 7420, "epoch": 89} {"train_loss": -17.327436447143555, "global_step": 7421, "epoch": 89} {"train_loss": -17.143268585205078, "global_step": 7422, "epoch": 89} {"train_loss": -16.916507720947266, "global_step": 7423, "epoch": 89} {"train_loss": -17.57269859313965, "global_step": 7424, "epoch": 89} {"train_loss": -17.24196434020996, "global_step": 7425, "epoch": 89} {"train_loss": -16.68234634399414, "global_step": 7426, "epoch": 89} {"train_loss": -17.33747673034668, "global_step": 7427, "epoch": 89} {"train_loss": -17.115402221679688, "global_step": 7428, "epoch": 89} {"train_loss": -16.931116104125977, "global_step": 7429, "epoch": 89} {"train_loss": -17.83749771118164, "global_step": 7430, "epoch": 89} {"train_loss": -17.162839889526367, "global_step": 7431, "epoch": 89} {"train_loss": -17.801193237304688, "global_step": 7432, "epoch": 89} {"train_loss": -17.101417541503906, "global_step": 7433, "epoch": 89} {"train_loss": -17.628976821899414, "global_step": 7434, "epoch": 89} {"train_loss": -17.660757064819336, "global_step": 7435, "epoch": 89} {"train_loss": -17.26796531677246, "global_step": 7436, "epoch": 89} {"train_loss": -16.985504150390625, "global_step": 7437, "epoch": 89} {"train_loss": -17.5358943939209, "global_step": 7438, "epoch": 89} {"train_loss": -16.930906295776367, "global_step": 7439, "epoch": 89} {"train_loss": -17.05323600769043, "global_step": 7440, "epoch": 89} {"train_loss": -17.641263961791992, "global_step": 7441, "epoch": 89} {"train_loss": -16.8266544342041, "global_step": 7442, "epoch": 89} {"train_loss": -17.735872268676758, "global_step": 7443, "epoch": 89} {"train_loss": -17.387292861938477, "global_step": 7444, "epoch": 89} {"train_loss": -17.262388229370117, "global_step": 7445, "epoch": 89} {"train_loss": -17.568613052368164, "global_step": 7446, "epoch": 89} {"train_loss": -17.324554443359375, "global_step": 7447, "epoch": 89} {"train_loss": -17.75764274597168, "global_step": 7448, "epoch": 89} {"train_loss": -17.080400466918945, "global_step": 7449, "epoch": 89} {"train_loss": -17.144447326660156, "global_step": 7450, "epoch": 89} {"train_loss": -17.358768463134766, "global_step": 7451, "epoch": 89} {"train_loss": -17.329370498657227, "global_step": 7452, "epoch": 89} {"train_loss": -17.00139808654785, "global_step": 7453, "epoch": 89} {"train_loss": -17.40690040588379, "global_step": 7454, "epoch": 89} {"train_loss": -17.295869827270508, "global_step": 7455, "epoch": 89} {"train_loss": -16.9150390625, "global_step": 7456, "epoch": 89} {"train_loss": -17.344831466674805, "global_step": 7457, "epoch": 89} {"train_loss": -17.118009567260742, "global_step": 7458, "epoch": 89} {"train_loss": -17.71271514892578, "global_step": 7459, "epoch": 89} {"train_loss": -17.260107040405273, "global_step": 7460, "epoch": 89} {"train_loss": -17.311277389526367, "global_step": 7461, "epoch": 89} {"train_loss": -17.484952926635742, "global_step": 7462, "epoch": 89} {"train_loss": -17.034122467041016, "global_step": 7463, "epoch": 89} {"train_loss": -17.425827026367188, "global_step": 7464, "epoch": 89} {"train_loss": -17.255834579467773, "global_step": 7465, "epoch": 89} {"train_loss": -17.185863494873047, "global_step": 7466, "epoch": 89} {"train_loss": -17.362836837768555, "global_step": 7467, "epoch": 89} {"train_loss": -17.523847579956055, "global_step": 7468, "epoch": 89} {"train_loss": -17.260373150009706, "global_step": 7469, "epoch": 89, "val_loss": 6285190.5} {"train_loss": -17.464290618896484, "global_step": 7470, "epoch": 90} {"train_loss": -17.002485275268555, "global_step": 7471, "epoch": 90} {"train_loss": -17.504379272460938, "global_step": 7472, "epoch": 90} {"train_loss": -17.374547958374023, "global_step": 7473, "epoch": 90} {"train_loss": -17.23619270324707, "global_step": 7474, "epoch": 90} {"train_loss": -17.17777442932129, "global_step": 7475, "epoch": 90} {"train_loss": -17.496692657470703, "global_step": 7476, "epoch": 90} {"train_loss": -17.4901065826416, "global_step": 7477, "epoch": 90} {"train_loss": -17.16646385192871, "global_step": 7478, "epoch": 90} {"train_loss": -17.454572677612305, "global_step": 7479, "epoch": 90} {"train_loss": -16.854345321655273, "global_step": 7480, "epoch": 90} {"train_loss": -16.68866539001465, "global_step": 7481, "epoch": 90} {"train_loss": -17.38430404663086, "global_step": 7482, "epoch": 90} {"train_loss": -17.414356231689453, "global_step": 7483, "epoch": 90} {"train_loss": -17.264921188354492, "global_step": 7484, "epoch": 90} {"train_loss": -17.284334182739258, "global_step": 7485, "epoch": 90} {"train_loss": -17.315475463867188, "global_step": 7486, "epoch": 90} {"train_loss": -17.08551788330078, "global_step": 7487, "epoch": 90} {"train_loss": -17.100629806518555, "global_step": 7488, "epoch": 90} {"train_loss": -17.413299560546875, "global_step": 7489, "epoch": 90} {"train_loss": -17.659427642822266, "global_step": 7490, "epoch": 90} {"train_loss": -17.140216827392578, "global_step": 7491, "epoch": 90} {"train_loss": -17.599607467651367, "global_step": 7492, "epoch": 90} {"train_loss": -17.41547203063965, "global_step": 7493, "epoch": 90} {"train_loss": -17.208467483520508, "global_step": 7494, "epoch": 90} {"train_loss": -17.711576461791992, "global_step": 7495, "epoch": 90} {"train_loss": -17.11677360534668, "global_step": 7496, "epoch": 90} {"train_loss": -17.66507339477539, "global_step": 7497, "epoch": 90} {"train_loss": -17.21807861328125, "global_step": 7498, "epoch": 90} {"train_loss": -17.473316192626953, "global_step": 7499, "epoch": 90} {"train_loss": -17.25275993347168, "global_step": 7500, "epoch": 90} {"train_loss": -17.244234085083008, "global_step": 7501, "epoch": 90} {"train_loss": -17.171995162963867, "global_step": 7502, "epoch": 90} {"train_loss": -17.163183212280273, "global_step": 7503, "epoch": 90} {"train_loss": -17.507648468017578, "global_step": 7504, "epoch": 90} {"train_loss": -17.518417358398438, "global_step": 7505, "epoch": 90} {"train_loss": -17.424116134643555, "global_step": 7506, "epoch": 90} {"train_loss": -17.272581100463867, "global_step": 7507, "epoch": 90} {"train_loss": -17.48334312438965, "global_step": 7508, "epoch": 90} {"train_loss": -17.156965255737305, "global_step": 7509, "epoch": 90} {"train_loss": -17.352773666381836, "global_step": 7510, "epoch": 90} {"train_loss": -17.159143447875977, "global_step": 7511, "epoch": 90} {"train_loss": -16.911487579345703, "global_step": 7512, "epoch": 90} {"train_loss": -17.32695960998535, "global_step": 7513, "epoch": 90} {"train_loss": -16.799108505249023, "global_step": 7514, "epoch": 90} {"train_loss": -16.95293426513672, "global_step": 7515, "epoch": 90} {"train_loss": -16.835800170898438, "global_step": 7516, "epoch": 90} {"train_loss": -17.119117736816406, "global_step": 7517, "epoch": 90} {"train_loss": -17.798933029174805, "global_step": 7518, "epoch": 90} {"train_loss": -17.572961807250977, "global_step": 7519, "epoch": 90} {"train_loss": -17.115530014038086, "global_step": 7520, "epoch": 90} {"train_loss": -17.221654891967773, "global_step": 7521, "epoch": 90} {"train_loss": -17.3964786529541, "global_step": 7522, "epoch": 90} {"train_loss": -16.895858764648438, "global_step": 7523, "epoch": 90} {"train_loss": -17.112653732299805, "global_step": 7524, "epoch": 90} {"train_loss": -17.41332244873047, "global_step": 7525, "epoch": 90} {"train_loss": -16.930753707885742, "global_step": 7526, "epoch": 90} {"train_loss": -17.001386642456055, "global_step": 7527, "epoch": 90} {"train_loss": -17.261871337890625, "global_step": 7528, "epoch": 90} {"train_loss": -17.367603302001953, "global_step": 7529, "epoch": 90} {"train_loss": -17.580154418945312, "global_step": 7530, "epoch": 90} {"train_loss": -17.605791091918945, "global_step": 7531, "epoch": 90} {"train_loss": -17.69907569885254, "global_step": 7532, "epoch": 90} {"train_loss": -17.050262451171875, "global_step": 7533, "epoch": 90} {"train_loss": -17.232128143310547, "global_step": 7534, "epoch": 90} {"train_loss": -17.577041625976562, "global_step": 7535, "epoch": 90} {"train_loss": -17.62879753112793, "global_step": 7536, "epoch": 90} {"train_loss": -17.7034969329834, "global_step": 7537, "epoch": 90} {"train_loss": -17.38156509399414, "global_step": 7538, "epoch": 90} {"train_loss": -17.168750762939453, "global_step": 7539, "epoch": 90} {"train_loss": -16.934476852416992, "global_step": 7540, "epoch": 90} {"train_loss": -17.183551788330078, "global_step": 7541, "epoch": 90} {"train_loss": -17.334033966064453, "global_step": 7542, "epoch": 90} {"train_loss": -17.23408317565918, "global_step": 7543, "epoch": 90} {"train_loss": -17.103178024291992, "global_step": 7544, "epoch": 90} {"train_loss": -17.381406784057617, "global_step": 7545, "epoch": 90} {"train_loss": -17.34182357788086, "global_step": 7546, "epoch": 90} {"train_loss": -17.1138973236084, "global_step": 7547, "epoch": 90} {"train_loss": -17.141258239746094, "global_step": 7548, "epoch": 90} {"train_loss": -17.051700592041016, "global_step": 7549, "epoch": 90} {"train_loss": -17.42209815979004, "global_step": 7550, "epoch": 90} {"train_loss": -17.287490844726562, "global_step": 7551, "epoch": 90} {"train_loss": -17.271195515092597, "global_step": 7552, "epoch": 90, "val_loss": 6412230.5} {"train_loss": -17.040369033813477, "global_step": 7553, "epoch": 91} {"train_loss": -17.17183494567871, "global_step": 7554, "epoch": 91} {"train_loss": -17.151212692260742, "global_step": 7555, "epoch": 91} {"train_loss": -17.1419734954834, "global_step": 7556, "epoch": 91} {"train_loss": -17.66292953491211, "global_step": 7557, "epoch": 91} {"train_loss": -17.093542098999023, "global_step": 7558, "epoch": 91} {"train_loss": -17.274587631225586, "global_step": 7559, "epoch": 91} {"train_loss": -17.08186149597168, "global_step": 7560, "epoch": 91} {"train_loss": -16.918195724487305, "global_step": 7561, "epoch": 91} {"train_loss": -17.142297744750977, "global_step": 7562, "epoch": 91} {"train_loss": -17.133834838867188, "global_step": 7563, "epoch": 91} {"train_loss": -17.018198013305664, "global_step": 7564, "epoch": 91} {"train_loss": -17.274921417236328, "global_step": 7565, "epoch": 91} {"train_loss": -16.90641212463379, "global_step": 7566, "epoch": 91} {"train_loss": -17.040842056274414, "global_step": 7567, "epoch": 91} {"train_loss": -17.665037155151367, "global_step": 7568, "epoch": 91} {"train_loss": -17.25019645690918, "global_step": 7569, "epoch": 91} {"train_loss": -17.13726234436035, "global_step": 7570, "epoch": 91} {"train_loss": -17.56207275390625, "global_step": 7571, "epoch": 91} {"train_loss": -17.530858993530273, "global_step": 7572, "epoch": 91} {"train_loss": -17.275596618652344, "global_step": 7573, "epoch": 91} {"train_loss": -17.4619197845459, "global_step": 7574, "epoch": 91} {"train_loss": -17.223312377929688, "global_step": 7575, "epoch": 91} {"train_loss": -17.567113876342773, "global_step": 7576, "epoch": 91} {"train_loss": -17.480871200561523, "global_step": 7577, "epoch": 91} {"train_loss": -17.15485191345215, "global_step": 7578, "epoch": 91} {"train_loss": -17.56230926513672, "global_step": 7579, "epoch": 91} {"train_loss": -17.230886459350586, "global_step": 7580, "epoch": 91} {"train_loss": -17.252546310424805, "global_step": 7581, "epoch": 91} {"train_loss": -17.619070053100586, "global_step": 7582, "epoch": 91} {"train_loss": -17.640457153320312, "global_step": 7583, "epoch": 91} {"train_loss": -17.535400390625, "global_step": 7584, "epoch": 91} {"train_loss": -17.122777938842773, "global_step": 7585, "epoch": 91} {"train_loss": -17.62424087524414, "global_step": 7586, "epoch": 91} {"train_loss": -17.287193298339844, "global_step": 7587, "epoch": 91} {"train_loss": -17.60394859313965, "global_step": 7588, "epoch": 91} {"train_loss": -17.659887313842773, "global_step": 7589, "epoch": 91} {"train_loss": -17.492834091186523, "global_step": 7590, "epoch": 91} {"train_loss": -17.34119987487793, "global_step": 7591, "epoch": 91} {"train_loss": -17.52724266052246, "global_step": 7592, "epoch": 91} {"train_loss": -17.0186767578125, "global_step": 7593, "epoch": 91} {"train_loss": -17.179113388061523, "global_step": 7594, "epoch": 91} {"train_loss": -17.345975875854492, "global_step": 7595, "epoch": 91} {"train_loss": -17.799978256225586, "global_step": 7596, "epoch": 91} {"train_loss": -17.543283462524414, "global_step": 7597, "epoch": 91} {"train_loss": -17.35700035095215, "global_step": 7598, "epoch": 91} {"train_loss": -17.393232345581055, "global_step": 7599, "epoch": 91} {"train_loss": -17.397964477539062, "global_step": 7600, "epoch": 91} {"train_loss": -17.717090606689453, "global_step": 7601, "epoch": 91} {"train_loss": -17.310590744018555, "global_step": 7602, "epoch": 91} {"train_loss": -17.172372817993164, "global_step": 7603, "epoch": 91} {"train_loss": -17.417064666748047, "global_step": 7604, "epoch": 91} {"train_loss": -17.381912231445312, "global_step": 7605, "epoch": 91} {"train_loss": -17.52913475036621, "global_step": 7606, "epoch": 91} {"train_loss": -17.188405990600586, "global_step": 7607, "epoch": 91} {"train_loss": -17.58737564086914, "global_step": 7608, "epoch": 91} {"train_loss": -17.43758201599121, "global_step": 7609, "epoch": 91} {"train_loss": -17.303390502929688, "global_step": 7610, "epoch": 91} {"train_loss": -16.940698623657227, "global_step": 7611, "epoch": 91} {"train_loss": -17.379283905029297, "global_step": 7612, "epoch": 91} {"train_loss": -17.568387985229492, "global_step": 7613, "epoch": 91} {"train_loss": -16.88351821899414, "global_step": 7614, "epoch": 91} {"train_loss": -17.1304988861084, "global_step": 7615, "epoch": 91} {"train_loss": -17.5089054107666, "global_step": 7616, "epoch": 91} {"train_loss": -17.350475311279297, "global_step": 7617, "epoch": 91} {"train_loss": -17.09490966796875, "global_step": 7618, "epoch": 91} {"train_loss": -17.516536712646484, "global_step": 7619, "epoch": 91} {"train_loss": -17.14263343811035, "global_step": 7620, "epoch": 91} {"train_loss": -17.701833724975586, "global_step": 7621, "epoch": 91} {"train_loss": -17.093908309936523, "global_step": 7622, "epoch": 91} {"train_loss": -17.262271881103516, "global_step": 7623, "epoch": 91} {"train_loss": -17.200870513916016, "global_step": 7624, "epoch": 91} {"train_loss": -16.48674964904785, "global_step": 7625, "epoch": 91} {"train_loss": -17.46154022216797, "global_step": 7626, "epoch": 91} {"train_loss": -17.340322494506836, "global_step": 7627, "epoch": 91} {"train_loss": -17.07857894897461, "global_step": 7628, "epoch": 91} {"train_loss": -17.103012084960938, "global_step": 7629, "epoch": 91} {"train_loss": -17.299381256103516, "global_step": 7630, "epoch": 91} {"train_loss": -17.3053035736084, "global_step": 7631, "epoch": 91} {"train_loss": -17.450632095336914, "global_step": 7632, "epoch": 91} {"train_loss": -17.260046005249023, "global_step": 7633, "epoch": 91} {"train_loss": -17.050703048706055, "global_step": 7634, "epoch": 91} {"train_loss": -17.320280948317194, "global_step": 7635, "epoch": 91, "val_loss": 6566257.0} {"train_loss": -16.829099655151367, "global_step": 7636, "epoch": 92} {"train_loss": -16.87261390686035, "global_step": 7637, "epoch": 92} {"train_loss": -17.10592269897461, "global_step": 7638, "epoch": 92} {"train_loss": -16.955049514770508, "global_step": 7639, "epoch": 92} {"train_loss": -17.12257957458496, "global_step": 7640, "epoch": 92} {"train_loss": -17.291824340820312, "global_step": 7641, "epoch": 92} {"train_loss": -17.10525894165039, "global_step": 7642, "epoch": 92} {"train_loss": -17.13789176940918, "global_step": 7643, "epoch": 92} {"train_loss": -16.844696044921875, "global_step": 7644, "epoch": 92} {"train_loss": -16.98853874206543, "global_step": 7645, "epoch": 92} {"train_loss": -16.962509155273438, "global_step": 7646, "epoch": 92} {"train_loss": -17.311986923217773, "global_step": 7647, "epoch": 92} {"train_loss": -17.425323486328125, "global_step": 7648, "epoch": 92} {"train_loss": -17.2236385345459, "global_step": 7649, "epoch": 92} {"train_loss": -17.162139892578125, "global_step": 7650, "epoch": 92} {"train_loss": -17.518827438354492, "global_step": 7651, "epoch": 92} {"train_loss": -17.124006271362305, "global_step": 7652, "epoch": 92} {"train_loss": -17.49490737915039, "global_step": 7653, "epoch": 92} {"train_loss": -17.645244598388672, "global_step": 7654, "epoch": 92} {"train_loss": -17.268972396850586, "global_step": 7655, "epoch": 92} {"train_loss": -17.397125244140625, "global_step": 7656, "epoch": 92} {"train_loss": -17.4935359954834, "global_step": 7657, "epoch": 92} {"train_loss": -17.27028465270996, "global_step": 7658, "epoch": 92} {"train_loss": -16.990854263305664, "global_step": 7659, "epoch": 92} {"train_loss": -17.1448974609375, "global_step": 7660, "epoch": 92} {"train_loss": -17.00446891784668, "global_step": 7661, "epoch": 92} {"train_loss": -17.43351173400879, "global_step": 7662, "epoch": 92} {"train_loss": -17.231155395507812, "global_step": 7663, "epoch": 92} {"train_loss": -17.150144577026367, "global_step": 7664, "epoch": 92} {"train_loss": -17.16351318359375, "global_step": 7665, "epoch": 92} {"train_loss": -17.142797470092773, "global_step": 7666, "epoch": 92} {"train_loss": -17.358060836791992, "global_step": 7667, "epoch": 92} {"train_loss": -17.30873680114746, "global_step": 7668, "epoch": 92} {"train_loss": -17.45152473449707, "global_step": 7669, "epoch": 92} {"train_loss": -17.515195846557617, "global_step": 7670, "epoch": 92} {"train_loss": -17.528236389160156, "global_step": 7671, "epoch": 92} {"train_loss": -17.588748931884766, "global_step": 7672, "epoch": 92} {"train_loss": -17.169641494750977, "global_step": 7673, "epoch": 92} {"train_loss": -17.53810691833496, "global_step": 7674, "epoch": 92} {"train_loss": -16.89366912841797, "global_step": 7675, "epoch": 92} {"train_loss": -17.310888290405273, "global_step": 7676, "epoch": 92} {"train_loss": -17.386554718017578, "global_step": 7677, "epoch": 92} {"train_loss": -17.161970138549805, "global_step": 7678, "epoch": 92} {"train_loss": -17.7154483795166, "global_step": 7679, "epoch": 92} {"train_loss": -17.502361297607422, "global_step": 7680, "epoch": 92} {"train_loss": -17.2379093170166, "global_step": 7681, "epoch": 92} {"train_loss": -17.554615020751953, "global_step": 7682, "epoch": 92} {"train_loss": -17.29050636291504, "global_step": 7683, "epoch": 92} {"train_loss": -17.427824020385742, "global_step": 7684, "epoch": 92} {"train_loss": -17.11146354675293, "global_step": 7685, "epoch": 92} {"train_loss": -17.197799682617188, "global_step": 7686, "epoch": 92} {"train_loss": -17.218143463134766, "global_step": 7687, "epoch": 92} {"train_loss": -17.484952926635742, "global_step": 7688, "epoch": 92} {"train_loss": -17.666858673095703, "global_step": 7689, "epoch": 92} {"train_loss": -17.40053939819336, "global_step": 7690, "epoch": 92} {"train_loss": -16.95271110534668, "global_step": 7691, "epoch": 92} {"train_loss": -17.273006439208984, "global_step": 7692, "epoch": 92} {"train_loss": -17.180295944213867, "global_step": 7693, "epoch": 92} {"train_loss": -17.486236572265625, "global_step": 7694, "epoch": 92} {"train_loss": -17.3470458984375, "global_step": 7695, "epoch": 92} {"train_loss": -17.486249923706055, "global_step": 7696, "epoch": 92} {"train_loss": -17.298757553100586, "global_step": 7697, "epoch": 92} {"train_loss": -17.099319458007812, "global_step": 7698, "epoch": 92} {"train_loss": -17.228368759155273, "global_step": 7699, "epoch": 92} {"train_loss": -17.133214950561523, "global_step": 7700, "epoch": 92} {"train_loss": -17.476905822753906, "global_step": 7701, "epoch": 92} {"train_loss": -17.574581146240234, "global_step": 7702, "epoch": 92} {"train_loss": -17.597646713256836, "global_step": 7703, "epoch": 92} {"train_loss": -17.421024322509766, "global_step": 7704, "epoch": 92} {"train_loss": -17.386035919189453, "global_step": 7705, "epoch": 92} {"train_loss": -17.22801971435547, "global_step": 7706, "epoch": 92} {"train_loss": -17.104984283447266, "global_step": 7707, "epoch": 92} {"train_loss": -17.330615997314453, "global_step": 7708, "epoch": 92} {"train_loss": -17.346420288085938, "global_step": 7709, "epoch": 92} {"train_loss": -17.131330490112305, "global_step": 7710, "epoch": 92} {"train_loss": -17.655149459838867, "global_step": 7711, "epoch": 92} {"train_loss": -17.535184860229492, "global_step": 7712, "epoch": 92} {"train_loss": -17.348386764526367, "global_step": 7713, "epoch": 92} {"train_loss": -17.242088317871094, "global_step": 7714, "epoch": 92} {"train_loss": -16.76021385192871, "global_step": 7715, "epoch": 92} {"train_loss": -17.170291900634766, "global_step": 7716, "epoch": 92} {"train_loss": -17.436878204345703, "global_step": 7717, "epoch": 92} {"train_loss": -17.261376047708904, "global_step": 7718, "epoch": 92, "val_loss": 6311059.0} {"train_loss": -17.107606887817383, "global_step": 7719, "epoch": 93} {"train_loss": -17.341703414916992, "global_step": 7720, "epoch": 93} {"train_loss": -17.26511001586914, "global_step": 7721, "epoch": 93} {"train_loss": -17.19772720336914, "global_step": 7722, "epoch": 93} {"train_loss": -17.290361404418945, "global_step": 7723, "epoch": 93} {"train_loss": -17.772863388061523, "global_step": 7724, "epoch": 93} {"train_loss": -17.406034469604492, "global_step": 7725, "epoch": 93} {"train_loss": -17.111398696899414, "global_step": 7726, "epoch": 93} {"train_loss": -17.244525909423828, "global_step": 7727, "epoch": 93} {"train_loss": -17.606176376342773, "global_step": 7728, "epoch": 93} {"train_loss": -17.298206329345703, "global_step": 7729, "epoch": 93} {"train_loss": -17.145004272460938, "global_step": 7730, "epoch": 93} {"train_loss": -17.261350631713867, "global_step": 7731, "epoch": 93} {"train_loss": -16.937551498413086, "global_step": 7732, "epoch": 93} {"train_loss": -17.659912109375, "global_step": 7733, "epoch": 93} {"train_loss": -17.20850944519043, "global_step": 7734, "epoch": 93} {"train_loss": -17.230146408081055, "global_step": 7735, "epoch": 93} {"train_loss": -17.25986099243164, "global_step": 7736, "epoch": 93} {"train_loss": -17.505212783813477, "global_step": 7737, "epoch": 93} {"train_loss": -17.01047706604004, "global_step": 7738, "epoch": 93} {"train_loss": -17.142812728881836, "global_step": 7739, "epoch": 93} {"train_loss": -17.152265548706055, "global_step": 7740, "epoch": 93} {"train_loss": -17.59683609008789, "global_step": 7741, "epoch": 93} {"train_loss": -17.573728561401367, "global_step": 7742, "epoch": 93} {"train_loss": -17.30321502685547, "global_step": 7743, "epoch": 93} {"train_loss": -17.73332977294922, "global_step": 7744, "epoch": 93} {"train_loss": -17.27264404296875, "global_step": 7745, "epoch": 93} {"train_loss": -17.360557556152344, "global_step": 7746, "epoch": 93} {"train_loss": -17.427913665771484, "global_step": 7747, "epoch": 93} {"train_loss": -17.278783798217773, "global_step": 7748, "epoch": 93} {"train_loss": -17.34430503845215, "global_step": 7749, "epoch": 93} {"train_loss": -17.455488204956055, "global_step": 7750, "epoch": 93} {"train_loss": -17.608896255493164, "global_step": 7751, "epoch": 93} {"train_loss": -16.995229721069336, "global_step": 7752, "epoch": 93} {"train_loss": -16.978240966796875, "global_step": 7753, "epoch": 93} {"train_loss": -17.53413200378418, "global_step": 7754, "epoch": 93} {"train_loss": -17.702617645263672, "global_step": 7755, "epoch": 93} {"train_loss": -17.33837890625, "global_step": 7756, "epoch": 93} {"train_loss": -17.256635665893555, "global_step": 7757, "epoch": 93} {"train_loss": -17.522071838378906, "global_step": 7758, "epoch": 93} {"train_loss": -17.469635009765625, "global_step": 7759, "epoch": 93} {"train_loss": -17.42450523376465, "global_step": 7760, "epoch": 93} {"train_loss": -17.447328567504883, "global_step": 7761, "epoch": 93} {"train_loss": -17.516054153442383, "global_step": 7762, "epoch": 93} {"train_loss": -17.777179718017578, "global_step": 7763, "epoch": 93} {"train_loss": -17.43612289428711, "global_step": 7764, "epoch": 93} {"train_loss": -16.972332000732422, "global_step": 7765, "epoch": 93} {"train_loss": -17.338943481445312, "global_step": 7766, "epoch": 93} {"train_loss": -17.329835891723633, "global_step": 7767, "epoch": 93} {"train_loss": -16.91523551940918, "global_step": 7768, "epoch": 93} {"train_loss": -16.859708786010742, "global_step": 7769, "epoch": 93} {"train_loss": -17.251754760742188, "global_step": 7770, "epoch": 93} {"train_loss": -16.91401481628418, "global_step": 7771, "epoch": 93} {"train_loss": -17.39169692993164, "global_step": 7772, "epoch": 93} {"train_loss": -17.449066162109375, "global_step": 7773, "epoch": 93} {"train_loss": -17.458738327026367, "global_step": 7774, "epoch": 93} {"train_loss": -17.430015563964844, "global_step": 7775, "epoch": 93} {"train_loss": -17.68520164489746, "global_step": 7776, "epoch": 93} {"train_loss": -17.35529136657715, "global_step": 7777, "epoch": 93} {"train_loss": -17.11594009399414, "global_step": 7778, "epoch": 93} {"train_loss": -17.517974853515625, "global_step": 7779, "epoch": 93} {"train_loss": -17.5186767578125, "global_step": 7780, "epoch": 93} {"train_loss": -17.365787506103516, "global_step": 7781, "epoch": 93} {"train_loss": -17.438541412353516, "global_step": 7782, "epoch": 93} {"train_loss": -17.39483070373535, "global_step": 7783, "epoch": 93} {"train_loss": -17.32740592956543, "global_step": 7784, "epoch": 93} {"train_loss": -16.66571617126465, "global_step": 7785, "epoch": 93} {"train_loss": -17.160995483398438, "global_step": 7786, "epoch": 93} {"train_loss": -17.455799102783203, "global_step": 7787, "epoch": 93} {"train_loss": -17.541717529296875, "global_step": 7788, "epoch": 93} {"train_loss": -17.345006942749023, "global_step": 7789, "epoch": 93} {"train_loss": -17.28215980529785, "global_step": 7790, "epoch": 93} {"train_loss": -17.39716148376465, "global_step": 7791, "epoch": 93} {"train_loss": -17.103939056396484, "global_step": 7792, "epoch": 93} {"train_loss": -17.3122615814209, "global_step": 7793, "epoch": 93} {"train_loss": -17.50722312927246, "global_step": 7794, "epoch": 93} {"train_loss": -17.3727970123291, "global_step": 7795, "epoch": 93} {"train_loss": -17.312997817993164, "global_step": 7796, "epoch": 93} {"train_loss": -17.65178680419922, "global_step": 7797, "epoch": 93} {"train_loss": -17.111303329467773, "global_step": 7798, "epoch": 93} {"train_loss": -17.12405776977539, "global_step": 7799, "epoch": 93} {"train_loss": -17.937686920166016, "global_step": 7800, "epoch": 93} {"train_loss": -17.346701380718184, "global_step": 7801, "epoch": 93, "val_loss": 6123651.0} {"train_loss": -17.42850112915039, "global_step": 7802, "epoch": 94} {"train_loss": -17.313810348510742, "global_step": 7803, "epoch": 94} {"train_loss": -17.498966217041016, "global_step": 7804, "epoch": 94} {"train_loss": -17.135154724121094, "global_step": 7805, "epoch": 94} {"train_loss": -17.4979305267334, "global_step": 7806, "epoch": 94} {"train_loss": -17.265371322631836, "global_step": 7807, "epoch": 94} {"train_loss": -17.01143455505371, "global_step": 7808, "epoch": 94} {"train_loss": -17.417417526245117, "global_step": 7809, "epoch": 94} {"train_loss": -17.56806755065918, "global_step": 7810, "epoch": 94} {"train_loss": -17.375486373901367, "global_step": 7811, "epoch": 94} {"train_loss": -17.503061294555664, "global_step": 7812, "epoch": 94} {"train_loss": -17.553409576416016, "global_step": 7813, "epoch": 94} {"train_loss": -17.22754669189453, "global_step": 7814, "epoch": 94} {"train_loss": -17.098447799682617, "global_step": 7815, "epoch": 94} {"train_loss": -17.39089012145996, "global_step": 7816, "epoch": 94} {"train_loss": -17.176700592041016, "global_step": 7817, "epoch": 94} {"train_loss": -17.134729385375977, "global_step": 7818, "epoch": 94} {"train_loss": -17.10634422302246, "global_step": 7819, "epoch": 94} {"train_loss": -17.562274932861328, "global_step": 7820, "epoch": 94} {"train_loss": -17.617128372192383, "global_step": 7821, "epoch": 94} {"train_loss": -17.492549896240234, "global_step": 7822, "epoch": 94} {"train_loss": -16.906291961669922, "global_step": 7823, "epoch": 94} {"train_loss": -17.75655174255371, "global_step": 7824, "epoch": 94} {"train_loss": -17.2412052154541, "global_step": 7825, "epoch": 94} {"train_loss": -17.17257308959961, "global_step": 7826, "epoch": 94} {"train_loss": -17.118501663208008, "global_step": 7827, "epoch": 94} {"train_loss": -17.344850540161133, "global_step": 7828, "epoch": 94} {"train_loss": -16.97357177734375, "global_step": 7829, "epoch": 94} {"train_loss": -17.597667694091797, "global_step": 7830, "epoch": 94} {"train_loss": -17.502317428588867, "global_step": 7831, "epoch": 94} {"train_loss": -17.059646606445312, "global_step": 7832, "epoch": 94} {"train_loss": -17.74055290222168, "global_step": 7833, "epoch": 94} {"train_loss": -17.577526092529297, "global_step": 7834, "epoch": 94} {"train_loss": -17.54039764404297, "global_step": 7835, "epoch": 94} {"train_loss": -17.384597778320312, "global_step": 7836, "epoch": 94} {"train_loss": -17.813495635986328, "global_step": 7837, "epoch": 94} {"train_loss": -17.258901596069336, "global_step": 7838, "epoch": 94} {"train_loss": -17.407373428344727, "global_step": 7839, "epoch": 94} {"train_loss": -17.209196090698242, "global_step": 7840, "epoch": 94} {"train_loss": -17.679418563842773, "global_step": 7841, "epoch": 94} {"train_loss": -17.207128524780273, "global_step": 7842, "epoch": 94} {"train_loss": -17.00613784790039, "global_step": 7843, "epoch": 94} {"train_loss": -17.373661041259766, "global_step": 7844, "epoch": 94} {"train_loss": -17.385841369628906, "global_step": 7845, "epoch": 94} {"train_loss": -17.228452682495117, "global_step": 7846, "epoch": 94} {"train_loss": -17.2962646484375, "global_step": 7847, "epoch": 94} {"train_loss": -17.60715675354004, "global_step": 7848, "epoch": 94} {"train_loss": -17.768009185791016, "global_step": 7849, "epoch": 94} {"train_loss": -17.31196403503418, "global_step": 7850, "epoch": 94} {"train_loss": -17.213132858276367, "global_step": 7851, "epoch": 94} {"train_loss": -17.598127365112305, "global_step": 7852, "epoch": 94} {"train_loss": -17.579931259155273, "global_step": 7853, "epoch": 94} {"train_loss": -17.083492279052734, "global_step": 7854, "epoch": 94} {"train_loss": -17.451171875, "global_step": 7855, "epoch": 94} {"train_loss": -17.471586227416992, "global_step": 7856, "epoch": 94} {"train_loss": -17.49941062927246, "global_step": 7857, "epoch": 94} {"train_loss": -17.66460609436035, "global_step": 7858, "epoch": 94} {"train_loss": -17.436872482299805, "global_step": 7859, "epoch": 94} {"train_loss": -17.213138580322266, "global_step": 7860, "epoch": 94} {"train_loss": -17.357603073120117, "global_step": 7861, "epoch": 94} {"train_loss": -17.58330726623535, "global_step": 7862, "epoch": 94} {"train_loss": -17.190338134765625, "global_step": 7863, "epoch": 94} {"train_loss": -17.177295684814453, "global_step": 7864, "epoch": 94} {"train_loss": -17.4268856048584, "global_step": 7865, "epoch": 94} {"train_loss": -17.56214141845703, "global_step": 7866, "epoch": 94} {"train_loss": -17.2701473236084, "global_step": 7867, "epoch": 94} {"train_loss": -16.885061264038086, "global_step": 7868, "epoch": 94} {"train_loss": -17.281753540039062, "global_step": 7869, "epoch": 94} {"train_loss": -17.25089454650879, "global_step": 7870, "epoch": 94} {"train_loss": -16.92351531982422, "global_step": 7871, "epoch": 94} {"train_loss": -17.037979125976562, "global_step": 7872, "epoch": 94} {"train_loss": -17.290857315063477, "global_step": 7873, "epoch": 94} {"train_loss": -17.671741485595703, "global_step": 7874, "epoch": 94} {"train_loss": -17.537412643432617, "global_step": 7875, "epoch": 94} {"train_loss": -17.455547332763672, "global_step": 7876, "epoch": 94} {"train_loss": -17.478750228881836, "global_step": 7877, "epoch": 94} {"train_loss": -17.135400772094727, "global_step": 7878, "epoch": 94} {"train_loss": -17.106149673461914, "global_step": 7879, "epoch": 94} {"train_loss": -17.200620651245117, "global_step": 7880, "epoch": 94} {"train_loss": -17.282094955444336, "global_step": 7881, "epoch": 94} {"train_loss": -17.648427963256836, "global_step": 7882, "epoch": 94} {"train_loss": -17.08220863342285, "global_step": 7883, "epoch": 94} {"train_loss": -17.36381687026426, "global_step": 7884, "epoch": 94, "val_loss": 6228151.0} {"train_loss": -17.16579246520996, "global_step": 7885, "epoch": 95} {"train_loss": -17.22376823425293, "global_step": 7886, "epoch": 95} {"train_loss": -17.15337371826172, "global_step": 7887, "epoch": 95} {"train_loss": -17.42145347595215, "global_step": 7888, "epoch": 95} {"train_loss": -17.565174102783203, "global_step": 7889, "epoch": 95} {"train_loss": -17.36556053161621, "global_step": 7890, "epoch": 95} {"train_loss": -17.102079391479492, "global_step": 7891, "epoch": 95} {"train_loss": -17.183422088623047, "global_step": 7892, "epoch": 95} {"train_loss": -17.274673461914062, "global_step": 7893, "epoch": 95} {"train_loss": -17.22674560546875, "global_step": 7894, "epoch": 95} {"train_loss": -17.572118759155273, "global_step": 7895, "epoch": 95} {"train_loss": -17.428726196289062, "global_step": 7896, "epoch": 95} {"train_loss": -17.637569427490234, "global_step": 7897, "epoch": 95} {"train_loss": -17.342329025268555, "global_step": 7898, "epoch": 95} {"train_loss": -17.56660270690918, "global_step": 7899, "epoch": 95} {"train_loss": -17.204021453857422, "global_step": 7900, "epoch": 95} {"train_loss": -17.460824966430664, "global_step": 7901, "epoch": 95} {"train_loss": -17.458621978759766, "global_step": 7902, "epoch": 95} {"train_loss": -17.4425106048584, "global_step": 7903, "epoch": 95} {"train_loss": -17.428922653198242, "global_step": 7904, "epoch": 95} {"train_loss": -17.408266067504883, "global_step": 7905, "epoch": 95} {"train_loss": -17.552047729492188, "global_step": 7906, "epoch": 95} {"train_loss": -17.3590030670166, "global_step": 7907, "epoch": 95} {"train_loss": -17.289047241210938, "global_step": 7908, "epoch": 95} {"train_loss": -17.118263244628906, "global_step": 7909, "epoch": 95} {"train_loss": -16.7652530670166, "global_step": 7910, "epoch": 95} {"train_loss": -17.682941436767578, "global_step": 7911, "epoch": 95} {"train_loss": -17.506650924682617, "global_step": 7912, "epoch": 95} {"train_loss": -17.28706932067871, "global_step": 7913, "epoch": 95} {"train_loss": -17.5689754486084, "global_step": 7914, "epoch": 95} {"train_loss": -17.525798797607422, "global_step": 7915, "epoch": 95} {"train_loss": -17.50758171081543, "global_step": 7916, "epoch": 95} {"train_loss": -17.57210922241211, "global_step": 7917, "epoch": 95} {"train_loss": -17.385400772094727, "global_step": 7918, "epoch": 95} {"train_loss": -17.598785400390625, "global_step": 7919, "epoch": 95} {"train_loss": -17.40714454650879, "global_step": 7920, "epoch": 95} {"train_loss": -17.03129005432129, "global_step": 7921, "epoch": 95} {"train_loss": -17.397876739501953, "global_step": 7922, "epoch": 95} {"train_loss": -17.583118438720703, "global_step": 7923, "epoch": 95} {"train_loss": -17.144563674926758, "global_step": 7924, "epoch": 95} {"train_loss": -17.38104820251465, "global_step": 7925, "epoch": 95} {"train_loss": -17.557191848754883, "global_step": 7926, "epoch": 95} {"train_loss": -17.362525939941406, "global_step": 7927, "epoch": 95} {"train_loss": -17.340267181396484, "global_step": 7928, "epoch": 95} {"train_loss": -17.662025451660156, "global_step": 7929, "epoch": 95} {"train_loss": -16.9710750579834, "global_step": 7930, "epoch": 95} {"train_loss": -17.168554306030273, "global_step": 7931, "epoch": 95} {"train_loss": -17.43063735961914, "global_step": 7932, "epoch": 95} {"train_loss": -17.4079532623291, "global_step": 7933, "epoch": 95} {"train_loss": -17.437145233154297, "global_step": 7934, "epoch": 95} {"train_loss": -17.375980377197266, "global_step": 7935, "epoch": 95} {"train_loss": -17.626575469970703, "global_step": 7936, "epoch": 95} {"train_loss": -17.126150131225586, "global_step": 7937, "epoch": 95} {"train_loss": -17.5610408782959, "global_step": 7938, "epoch": 95} {"train_loss": -17.38807487487793, "global_step": 7939, "epoch": 95} {"train_loss": -17.351043701171875, "global_step": 7940, "epoch": 95} {"train_loss": -17.146991729736328, "global_step": 7941, "epoch": 95} {"train_loss": -17.252599716186523, "global_step": 7942, "epoch": 95} {"train_loss": -17.18800163269043, "global_step": 7943, "epoch": 95} {"train_loss": -17.54613494873047, "global_step": 7944, "epoch": 95} {"train_loss": -16.939599990844727, "global_step": 7945, "epoch": 95} {"train_loss": -17.329143524169922, "global_step": 7946, "epoch": 95} {"train_loss": -17.563650131225586, "global_step": 7947, "epoch": 95} {"train_loss": -17.512836456298828, "global_step": 7948, "epoch": 95} {"train_loss": -17.501291275024414, "global_step": 7949, "epoch": 95} {"train_loss": -17.492727279663086, "global_step": 7950, "epoch": 95} {"train_loss": -17.607746124267578, "global_step": 7951, "epoch": 95} {"train_loss": -17.49989891052246, "global_step": 7952, "epoch": 95} {"train_loss": -17.667306900024414, "global_step": 7953, "epoch": 95} {"train_loss": -16.997909545898438, "global_step": 7954, "epoch": 95} {"train_loss": -17.648035049438477, "global_step": 7955, "epoch": 95} {"train_loss": -17.410465240478516, "global_step": 7956, "epoch": 95} {"train_loss": -18.089330673217773, "global_step": 7957, "epoch": 95} {"train_loss": -17.57181167602539, "global_step": 7958, "epoch": 95} {"train_loss": -17.55590057373047, "global_step": 7959, "epoch": 95} {"train_loss": -17.573041915893555, "global_step": 7960, "epoch": 95} {"train_loss": -17.099164962768555, "global_step": 7961, "epoch": 95} {"train_loss": -17.42927360534668, "global_step": 7962, "epoch": 95} {"train_loss": -17.341306686401367, "global_step": 7963, "epoch": 95} {"train_loss": -17.65445899963379, "global_step": 7964, "epoch": 95} {"train_loss": -17.523632049560547, "global_step": 7965, "epoch": 95} {"train_loss": -16.933515548706055, "global_step": 7966, "epoch": 95} {"train_loss": -17.391885412744728, "global_step": 7967, "epoch": 95, "val_loss": 6504503.0} {"train_loss": -17.040056228637695, "global_step": 7968, "epoch": 96} {"train_loss": -16.867692947387695, "global_step": 7969, "epoch": 96} {"train_loss": -16.75225830078125, "global_step": 7970, "epoch": 96} {"train_loss": -17.2825870513916, "global_step": 7971, "epoch": 96} {"train_loss": -16.978147506713867, "global_step": 7972, "epoch": 96} {"train_loss": -16.62367820739746, "global_step": 7973, "epoch": 96} {"train_loss": -16.873809814453125, "global_step": 7974, "epoch": 96} {"train_loss": -17.344013214111328, "global_step": 7975, "epoch": 96} {"train_loss": -17.04636001586914, "global_step": 7976, "epoch": 96} {"train_loss": -17.042203903198242, "global_step": 7977, "epoch": 96} {"train_loss": -16.927127838134766, "global_step": 7978, "epoch": 96} {"train_loss": -17.254697799682617, "global_step": 7979, "epoch": 96} {"train_loss": -17.477441787719727, "global_step": 7980, "epoch": 96} {"train_loss": -17.46929359436035, "global_step": 7981, "epoch": 96} {"train_loss": -17.24123191833496, "global_step": 7982, "epoch": 96} {"train_loss": -17.177326202392578, "global_step": 7983, "epoch": 96} {"train_loss": -17.167375564575195, "global_step": 7984, "epoch": 96} {"train_loss": -17.180639266967773, "global_step": 7985, "epoch": 96} {"train_loss": -17.425241470336914, "global_step": 7986, "epoch": 96} {"train_loss": -17.20224952697754, "global_step": 7987, "epoch": 96} {"train_loss": -17.313678741455078, "global_step": 7988, "epoch": 96} {"train_loss": -16.665813446044922, "global_step": 7989, "epoch": 96} {"train_loss": -17.403331756591797, "global_step": 7990, "epoch": 96} {"train_loss": -17.049348831176758, "global_step": 7991, "epoch": 96} {"train_loss": -17.583574295043945, "global_step": 7992, "epoch": 96} {"train_loss": -17.34442710876465, "global_step": 7993, "epoch": 96} {"train_loss": -17.46826934814453, "global_step": 7994, "epoch": 96} {"train_loss": -17.041593551635742, "global_step": 7995, "epoch": 96} {"train_loss": -17.54876708984375, "global_step": 7996, "epoch": 96} {"train_loss": -17.4190616607666, "global_step": 7997, "epoch": 96} {"train_loss": -17.500656127929688, "global_step": 7998, "epoch": 96} {"train_loss": -17.531980514526367, "global_step": 7999, "epoch": 96} {"train_loss": -17.707412719726562, "global_step": 8000, "epoch": 96} {"train_loss": -17.44513702392578, "global_step": 8001, "epoch": 96} {"train_loss": -17.40410041809082, "global_step": 8002, "epoch": 96} {"train_loss": -17.475412368774414, "global_step": 8003, "epoch": 96} {"train_loss": -17.661108016967773, "global_step": 8004, "epoch": 96} {"train_loss": -17.2672061920166, "global_step": 8005, "epoch": 96} {"train_loss": -17.622392654418945, "global_step": 8006, "epoch": 96} {"train_loss": -17.61679458618164, "global_step": 8007, "epoch": 96} {"train_loss": -17.594913482666016, "global_step": 8008, "epoch": 96} {"train_loss": -17.266427993774414, "global_step": 8009, "epoch": 96} {"train_loss": -17.4648380279541, "global_step": 8010, "epoch": 96} {"train_loss": -17.209070205688477, "global_step": 8011, "epoch": 96} {"train_loss": -17.10672950744629, "global_step": 8012, "epoch": 96} {"train_loss": -17.52180290222168, "global_step": 8013, "epoch": 96} {"train_loss": -16.88972282409668, "global_step": 8014, "epoch": 96} {"train_loss": -17.137983322143555, "global_step": 8015, "epoch": 96} {"train_loss": -17.571517944335938, "global_step": 8016, "epoch": 96} {"train_loss": -17.359268188476562, "global_step": 8017, "epoch": 96} {"train_loss": -17.402996063232422, "global_step": 8018, "epoch": 96} {"train_loss": -17.67448616027832, "global_step": 8019, "epoch": 96} {"train_loss": -17.537710189819336, "global_step": 8020, "epoch": 96} {"train_loss": -16.924365997314453, "global_step": 8021, "epoch": 96} {"train_loss": -17.68522834777832, "global_step": 8022, "epoch": 96} {"train_loss": -17.57305145263672, "global_step": 8023, "epoch": 96} {"train_loss": -17.515993118286133, "global_step": 8024, "epoch": 96} {"train_loss": -17.34047508239746, "global_step": 8025, "epoch": 96} {"train_loss": -17.115503311157227, "global_step": 8026, "epoch": 96} {"train_loss": -17.59791374206543, "global_step": 8027, "epoch": 96} {"train_loss": -17.62557029724121, "global_step": 8028, "epoch": 96} {"train_loss": -17.566896438598633, "global_step": 8029, "epoch": 96} {"train_loss": -17.670522689819336, "global_step": 8030, "epoch": 96} {"train_loss": -17.387332916259766, "global_step": 8031, "epoch": 96} {"train_loss": -17.174468994140625, "global_step": 8032, "epoch": 96} {"train_loss": -17.331403732299805, "global_step": 8033, "epoch": 96} {"train_loss": -17.55365562438965, "global_step": 8034, "epoch": 96} {"train_loss": -17.436845779418945, "global_step": 8035, "epoch": 96} {"train_loss": -17.4462947845459, "global_step": 8036, "epoch": 96} {"train_loss": -17.54575538635254, "global_step": 8037, "epoch": 96} {"train_loss": -17.43745994567871, "global_step": 8038, "epoch": 96} {"train_loss": -17.120771408081055, "global_step": 8039, "epoch": 96} {"train_loss": -17.55152702331543, "global_step": 8040, "epoch": 96} {"train_loss": -17.448793411254883, "global_step": 8041, "epoch": 96} {"train_loss": -17.09368896484375, "global_step": 8042, "epoch": 96} {"train_loss": -17.177457809448242, "global_step": 8043, "epoch": 96} {"train_loss": -17.755151748657227, "global_step": 8044, "epoch": 96} {"train_loss": -17.57857894897461, "global_step": 8045, "epoch": 96} {"train_loss": -17.21425437927246, "global_step": 8046, "epoch": 96} {"train_loss": -17.632902145385742, "global_step": 8047, "epoch": 96} {"train_loss": -17.290973663330078, "global_step": 8048, "epoch": 96} {"train_loss": -17.302165985107422, "global_step": 8049, "epoch": 96} {"train_loss": -17.33855325629912, "global_step": 8050, "epoch": 96, "val_loss": 6544815.5} {"train_loss": -17.04270362854004, "global_step": 8051, "epoch": 97} {"train_loss": -17.131633758544922, "global_step": 8052, "epoch": 97} {"train_loss": -17.17222023010254, "global_step": 8053, "epoch": 97} {"train_loss": -17.299211502075195, "global_step": 8054, "epoch": 97} {"train_loss": -17.54376792907715, "global_step": 8055, "epoch": 97} {"train_loss": -17.12838363647461, "global_step": 8056, "epoch": 97} {"train_loss": -17.0806884765625, "global_step": 8057, "epoch": 97} {"train_loss": -17.263450622558594, "global_step": 8058, "epoch": 97} {"train_loss": -17.53017807006836, "global_step": 8059, "epoch": 97} {"train_loss": -17.146268844604492, "global_step": 8060, "epoch": 97} {"train_loss": -17.5603084564209, "global_step": 8061, "epoch": 97} {"train_loss": -17.317541122436523, "global_step": 8062, "epoch": 97} {"train_loss": -17.35481834411621, "global_step": 8063, "epoch": 97} {"train_loss": -17.301712036132812, "global_step": 8064, "epoch": 97} {"train_loss": -17.43848991394043, "global_step": 8065, "epoch": 97} {"train_loss": -17.35712242126465, "global_step": 8066, "epoch": 97} {"train_loss": -17.47499656677246, "global_step": 8067, "epoch": 97} {"train_loss": -17.43399429321289, "global_step": 8068, "epoch": 97} {"train_loss": -17.38044548034668, "global_step": 8069, "epoch": 97} {"train_loss": -17.526025772094727, "global_step": 8070, "epoch": 97} {"train_loss": -17.169071197509766, "global_step": 8071, "epoch": 97} {"train_loss": -17.700231552124023, "global_step": 8072, "epoch": 97} {"train_loss": -17.359420776367188, "global_step": 8073, "epoch": 97} {"train_loss": -17.613929748535156, "global_step": 8074, "epoch": 97} {"train_loss": -17.3497257232666, "global_step": 8075, "epoch": 97} {"train_loss": -17.598297119140625, "global_step": 8076, "epoch": 97} {"train_loss": -17.647598266601562, "global_step": 8077, "epoch": 97} {"train_loss": -17.52768898010254, "global_step": 8078, "epoch": 97} {"train_loss": -17.241378784179688, "global_step": 8079, "epoch": 97} {"train_loss": -17.54306411743164, "global_step": 8080, "epoch": 97} {"train_loss": -17.42340850830078, "global_step": 8081, "epoch": 97} {"train_loss": -16.97099494934082, "global_step": 8082, "epoch": 97} {"train_loss": -17.376707077026367, "global_step": 8083, "epoch": 97} {"train_loss": -17.78315544128418, "global_step": 8084, "epoch": 97} {"train_loss": -16.68583869934082, "global_step": 8085, "epoch": 97} {"train_loss": -17.202566146850586, "global_step": 8086, "epoch": 97} {"train_loss": -17.09470558166504, "global_step": 8087, "epoch": 97} {"train_loss": -17.69875717163086, "global_step": 8088, "epoch": 97} {"train_loss": -17.152379989624023, "global_step": 8089, "epoch": 97} {"train_loss": -17.567615509033203, "global_step": 8090, "epoch": 97} {"train_loss": -17.47028923034668, "global_step": 8091, "epoch": 97} {"train_loss": -17.54300880432129, "global_step": 8092, "epoch": 97} {"train_loss": -16.868749618530273, "global_step": 8093, "epoch": 97} {"train_loss": -17.56203842163086, "global_step": 8094, "epoch": 97} {"train_loss": -17.422128677368164, "global_step": 8095, "epoch": 97} {"train_loss": -17.439455032348633, "global_step": 8096, "epoch": 97} {"train_loss": -17.354949951171875, "global_step": 8097, "epoch": 97} {"train_loss": -17.682126998901367, "global_step": 8098, "epoch": 97} {"train_loss": -17.781801223754883, "global_step": 8099, "epoch": 97} {"train_loss": -17.586042404174805, "global_step": 8100, "epoch": 97} {"train_loss": -16.490488052368164, "global_step": 8101, "epoch": 97} {"train_loss": -17.679912567138672, "global_step": 8102, "epoch": 97} {"train_loss": -17.520238876342773, "global_step": 8103, "epoch": 97} {"train_loss": -17.450424194335938, "global_step": 8104, "epoch": 97} {"train_loss": -17.41278648376465, "global_step": 8105, "epoch": 97} {"train_loss": -17.137487411499023, "global_step": 8106, "epoch": 97} {"train_loss": -17.392444610595703, "global_step": 8107, "epoch": 97} {"train_loss": -17.528844833374023, "global_step": 8108, "epoch": 97} {"train_loss": -17.721019744873047, "global_step": 8109, "epoch": 97} {"train_loss": -17.39459991455078, "global_step": 8110, "epoch": 97} {"train_loss": -17.54636573791504, "global_step": 8111, "epoch": 97} {"train_loss": -17.144216537475586, "global_step": 8112, "epoch": 97} {"train_loss": -17.0335693359375, "global_step": 8113, "epoch": 97} {"train_loss": -17.193729400634766, "global_step": 8114, "epoch": 97} {"train_loss": -17.472618103027344, "global_step": 8115, "epoch": 97} {"train_loss": -17.543310165405273, "global_step": 8116, "epoch": 97} {"train_loss": -17.46341896057129, "global_step": 8117, "epoch": 97} {"train_loss": -17.309921264648438, "global_step": 8118, "epoch": 97} {"train_loss": -17.43558692932129, "global_step": 8119, "epoch": 97} {"train_loss": -17.454904556274414, "global_step": 8120, "epoch": 97} {"train_loss": -16.91347312927246, "global_step": 8121, "epoch": 97} {"train_loss": -17.363357543945312, "global_step": 8122, "epoch": 97} {"train_loss": -17.63887596130371, "global_step": 8123, "epoch": 97} {"train_loss": -17.542789459228516, "global_step": 8124, "epoch": 97} {"train_loss": -17.552066802978516, "global_step": 8125, "epoch": 97} {"train_loss": -17.236352920532227, "global_step": 8126, "epoch": 97} {"train_loss": -17.408994674682617, "global_step": 8127, "epoch": 97} {"train_loss": -17.70465660095215, "global_step": 8128, "epoch": 97} {"train_loss": -17.311538696289062, "global_step": 8129, "epoch": 97} {"train_loss": -17.491865158081055, "global_step": 8130, "epoch": 97} {"train_loss": -17.19799041748047, "global_step": 8131, "epoch": 97} {"train_loss": -17.169597625732422, "global_step": 8132, "epoch": 97} {"train_loss": -17.384530722376812, "global_step": 8133, "epoch": 97, "val_loss": 6262598.5} {"train_loss": -16.92481231689453, "global_step": 8134, "epoch": 98} {"train_loss": -17.02927589416504, "global_step": 8135, "epoch": 98} {"train_loss": -17.15399169921875, "global_step": 8136, "epoch": 98} {"train_loss": -17.127151489257812, "global_step": 8137, "epoch": 98} {"train_loss": -17.391822814941406, "global_step": 8138, "epoch": 98} {"train_loss": -17.7083740234375, "global_step": 8139, "epoch": 98} {"train_loss": -17.45274543762207, "global_step": 8140, "epoch": 98} {"train_loss": -17.33151626586914, "global_step": 8141, "epoch": 98} {"train_loss": -17.450321197509766, "global_step": 8142, "epoch": 98} {"train_loss": -16.884418487548828, "global_step": 8143, "epoch": 98} {"train_loss": -17.822599411010742, "global_step": 8144, "epoch": 98} {"train_loss": -17.56117820739746, "global_step": 8145, "epoch": 98} {"train_loss": -17.355152130126953, "global_step": 8146, "epoch": 98} {"train_loss": -17.12745475769043, "global_step": 8147, "epoch": 98} {"train_loss": -17.465167999267578, "global_step": 8148, "epoch": 98} {"train_loss": -17.340566635131836, "global_step": 8149, "epoch": 98} {"train_loss": -17.418699264526367, "global_step": 8150, "epoch": 98} {"train_loss": -17.476499557495117, "global_step": 8151, "epoch": 98} {"train_loss": -17.531835556030273, "global_step": 8152, "epoch": 98} {"train_loss": -17.638980865478516, "global_step": 8153, "epoch": 98} {"train_loss": -17.37945556640625, "global_step": 8154, "epoch": 98} {"train_loss": -17.367950439453125, "global_step": 8155, "epoch": 98} {"train_loss": -17.672592163085938, "global_step": 8156, "epoch": 98} {"train_loss": -17.737586975097656, "global_step": 8157, "epoch": 98} {"train_loss": -17.359922409057617, "global_step": 8158, "epoch": 98} {"train_loss": -17.570369720458984, "global_step": 8159, "epoch": 98} {"train_loss": -17.73197364807129, "global_step": 8160, "epoch": 98} {"train_loss": -17.365530014038086, "global_step": 8161, "epoch": 98} {"train_loss": -17.691381454467773, "global_step": 8162, "epoch": 98} {"train_loss": -17.676870346069336, "global_step": 8163, "epoch": 98} {"train_loss": -17.345685958862305, "global_step": 8164, "epoch": 98} {"train_loss": -17.631328582763672, "global_step": 8165, "epoch": 98} {"train_loss": -17.30475425720215, "global_step": 8166, "epoch": 98} {"train_loss": -17.560739517211914, "global_step": 8167, "epoch": 98} {"train_loss": -17.25605583190918, "global_step": 8168, "epoch": 98} {"train_loss": -17.081396102905273, "global_step": 8169, "epoch": 98} {"train_loss": -17.273801803588867, "global_step": 8170, "epoch": 98} {"train_loss": -17.29709815979004, "global_step": 8171, "epoch": 98} {"train_loss": -17.18627166748047, "global_step": 8172, "epoch": 98} {"train_loss": -17.434839248657227, "global_step": 8173, "epoch": 98} {"train_loss": -17.195659637451172, "global_step": 8174, "epoch": 98} {"train_loss": -17.579238891601562, "global_step": 8175, "epoch": 98} {"train_loss": -17.528852462768555, "global_step": 8176, "epoch": 98} {"train_loss": -17.53401756286621, "global_step": 8177, "epoch": 98} {"train_loss": -17.080156326293945, "global_step": 8178, "epoch": 98} {"train_loss": -17.75528335571289, "global_step": 8179, "epoch": 98} {"train_loss": -17.621551513671875, "global_step": 8180, "epoch": 98} {"train_loss": -17.572067260742188, "global_step": 8181, "epoch": 98} {"train_loss": -17.490535736083984, "global_step": 8182, "epoch": 98} {"train_loss": -17.1748046875, "global_step": 8183, "epoch": 98} {"train_loss": -17.279769897460938, "global_step": 8184, "epoch": 98} {"train_loss": -17.43939208984375, "global_step": 8185, "epoch": 98} {"train_loss": -17.9528751373291, "global_step": 8186, "epoch": 98} {"train_loss": -17.041248321533203, "global_step": 8187, "epoch": 98} {"train_loss": -17.281177520751953, "global_step": 8188, "epoch": 98} {"train_loss": -17.296890258789062, "global_step": 8189, "epoch": 98} {"train_loss": -17.46879005432129, "global_step": 8190, "epoch": 98} {"train_loss": -17.706256866455078, "global_step": 8191, "epoch": 98} {"train_loss": -17.735654830932617, "global_step": 8192, "epoch": 98} {"train_loss": -17.58711051940918, "global_step": 8193, "epoch": 98} {"train_loss": -17.447519302368164, "global_step": 8194, "epoch": 98} {"train_loss": -17.522966384887695, "global_step": 8195, "epoch": 98} {"train_loss": -17.295530319213867, "global_step": 8196, "epoch": 98} {"train_loss": -17.341190338134766, "global_step": 8197, "epoch": 98} {"train_loss": -17.4390926361084, "global_step": 8198, "epoch": 98} {"train_loss": -17.205190658569336, "global_step": 8199, "epoch": 98} {"train_loss": -17.524564743041992, "global_step": 8200, "epoch": 98} {"train_loss": -17.14717674255371, "global_step": 8201, "epoch": 98} {"train_loss": -17.6494197845459, "global_step": 8202, "epoch": 98} {"train_loss": -17.505718231201172, "global_step": 8203, "epoch": 98} {"train_loss": -17.48370361328125, "global_step": 8204, "epoch": 98} {"train_loss": -17.26213836669922, "global_step": 8205, "epoch": 98} {"train_loss": -17.497665405273438, "global_step": 8206, "epoch": 98} {"train_loss": -17.53742790222168, "global_step": 8207, "epoch": 98} {"train_loss": -17.27833366394043, "global_step": 8208, "epoch": 98} {"train_loss": -17.224288940429688, "global_step": 8209, "epoch": 98} {"train_loss": -17.64977264404297, "global_step": 8210, "epoch": 98} {"train_loss": -17.463125228881836, "global_step": 8211, "epoch": 98} {"train_loss": -17.311391830444336, "global_step": 8212, "epoch": 98} {"train_loss": -17.498050689697266, "global_step": 8213, "epoch": 98} {"train_loss": -17.461349487304688, "global_step": 8214, "epoch": 98} {"train_loss": -17.552637100219727, "global_step": 8215, "epoch": 98} {"train_loss": -17.4167583649417, "global_step": 8216, "epoch": 98, "val_loss": 6325471.0} {"train_loss": -16.993999481201172, "global_step": 8217, "epoch": 99} {"train_loss": -16.60036277770996, "global_step": 8218, "epoch": 99} {"train_loss": -17.472726821899414, "global_step": 8219, "epoch": 99} {"train_loss": -17.516340255737305, "global_step": 8220, "epoch": 99} {"train_loss": -17.214399337768555, "global_step": 8221, "epoch": 99} {"train_loss": -17.286304473876953, "global_step": 8222, "epoch": 99} {"train_loss": -17.223493576049805, "global_step": 8223, "epoch": 99} {"train_loss": -17.004724502563477, "global_step": 8224, "epoch": 99} {"train_loss": -17.332544326782227, "global_step": 8225, "epoch": 99} {"train_loss": -17.550294876098633, "global_step": 8226, "epoch": 99} {"train_loss": -16.9489803314209, "global_step": 8227, "epoch": 99} {"train_loss": -17.492969512939453, "global_step": 8228, "epoch": 99} {"train_loss": -17.361724853515625, "global_step": 8229, "epoch": 99} {"train_loss": -17.517637252807617, "global_step": 8230, "epoch": 99} {"train_loss": -17.235578536987305, "global_step": 8231, "epoch": 99} {"train_loss": -17.109817504882812, "global_step": 8232, "epoch": 99} {"train_loss": -17.57048797607422, "global_step": 8233, "epoch": 99} {"train_loss": -17.498565673828125, "global_step": 8234, "epoch": 99} {"train_loss": -17.552457809448242, "global_step": 8235, "epoch": 99} {"train_loss": -17.29085350036621, "global_step": 8236, "epoch": 99} {"train_loss": -17.112756729125977, "global_step": 8237, "epoch": 99} {"train_loss": -17.65115737915039, "global_step": 8238, "epoch": 99} {"train_loss": -16.90251350402832, "global_step": 8239, "epoch": 99} {"train_loss": -17.405614852905273, "global_step": 8240, "epoch": 99} {"train_loss": -17.16675567626953, "global_step": 8241, "epoch": 99} {"train_loss": -17.43541145324707, "global_step": 8242, "epoch": 99} {"train_loss": -17.295766830444336, "global_step": 8243, "epoch": 99} {"train_loss": -17.306102752685547, "global_step": 8244, "epoch": 99} {"train_loss": -17.498432159423828, "global_step": 8245, "epoch": 99} {"train_loss": -17.208932876586914, "global_step": 8246, "epoch": 99} {"train_loss": -17.502201080322266, "global_step": 8247, "epoch": 99} {"train_loss": -17.53612518310547, "global_step": 8248, "epoch": 99} {"train_loss": -17.308685302734375, "global_step": 8249, "epoch": 99} {"train_loss": -17.042707443237305, "global_step": 8250, "epoch": 99} {"train_loss": -17.533273696899414, "global_step": 8251, "epoch": 99} {"train_loss": -17.13429069519043, "global_step": 8252, "epoch": 99} {"train_loss": -17.370969772338867, "global_step": 8253, "epoch": 99} {"train_loss": -17.566707611083984, "global_step": 8254, "epoch": 99} {"train_loss": -17.480113983154297, "global_step": 8255, "epoch": 99} {"train_loss": -17.27239418029785, "global_step": 8256, "epoch": 99} {"train_loss": -17.596588134765625, "global_step": 8257, "epoch": 99} {"train_loss": -17.188426971435547, "global_step": 8258, "epoch": 99} {"train_loss": -17.38413429260254, "global_step": 8259, "epoch": 99} {"train_loss": -17.286954879760742, "global_step": 8260, "epoch": 99} {"train_loss": -17.649524688720703, "global_step": 8261, "epoch": 99} {"train_loss": -17.506017684936523, "global_step": 8262, "epoch": 99} {"train_loss": -17.6942195892334, "global_step": 8263, "epoch": 99} {"train_loss": -17.243379592895508, "global_step": 8264, "epoch": 99} {"train_loss": -17.738866806030273, "global_step": 8265, "epoch": 99} {"train_loss": -17.2886962890625, "global_step": 8266, "epoch": 99} {"train_loss": -17.33831787109375, "global_step": 8267, "epoch": 99} {"train_loss": -17.620969772338867, "global_step": 8268, "epoch": 99} {"train_loss": -17.506088256835938, "global_step": 8269, "epoch": 99} {"train_loss": -17.313159942626953, "global_step": 8270, "epoch": 99} {"train_loss": -17.58906364440918, "global_step": 8271, "epoch": 99} {"train_loss": -17.554401397705078, "global_step": 8272, "epoch": 99} {"train_loss": -17.48225212097168, "global_step": 8273, "epoch": 99} {"train_loss": -17.15753936767578, "global_step": 8274, "epoch": 99} {"train_loss": -16.95175552368164, "global_step": 8275, "epoch": 99} {"train_loss": -17.93967056274414, "global_step": 8276, "epoch": 99} {"train_loss": -17.420961380004883, "global_step": 8277, "epoch": 99} {"train_loss": -17.09902000427246, "global_step": 8278, "epoch": 99} {"train_loss": -17.806066513061523, "global_step": 8279, "epoch": 99} {"train_loss": -17.334157943725586, "global_step": 8280, "epoch": 99} {"train_loss": -17.657712936401367, "global_step": 8281, "epoch": 99} {"train_loss": -17.810503005981445, "global_step": 8282, "epoch": 99} {"train_loss": -17.623022079467773, "global_step": 8283, "epoch": 99} {"train_loss": -17.537700653076172, "global_step": 8284, "epoch": 99} {"train_loss": -17.211715698242188, "global_step": 8285, "epoch": 99} {"train_loss": -17.65254783630371, "global_step": 8286, "epoch": 99} {"train_loss": -17.59860610961914, "global_step": 8287, "epoch": 99} {"train_loss": -17.60751724243164, "global_step": 8288, "epoch": 99} {"train_loss": -17.61884117126465, "global_step": 8289, "epoch": 99} {"train_loss": -17.60458755493164, "global_step": 8290, "epoch": 99} {"train_loss": -17.53465461730957, "global_step": 8291, "epoch": 99} {"train_loss": -17.72335433959961, "global_step": 8292, "epoch": 99} {"train_loss": -17.371021270751953, "global_step": 8293, "epoch": 99} {"train_loss": -17.14784049987793, "global_step": 8294, "epoch": 99} {"train_loss": -17.547651290893555, "global_step": 8295, "epoch": 99} {"train_loss": -17.561216354370117, "global_step": 8296, "epoch": 99} {"train_loss": -17.64432716369629, "global_step": 8297, "epoch": 99} {"train_loss": -17.186752319335938, "global_step": 8298, "epoch": 99} {"train_loss": -17.40146701307182, "global_step": 8299, "epoch": 99, "val_loss": 6229310.0} {"train_loss": -17.189905166625977, "global_step": 8300, "epoch": 100} {"train_loss": -17.245372772216797, "global_step": 8301, "epoch": 100} {"train_loss": -17.143146514892578, "global_step": 8302, "epoch": 100} {"train_loss": -17.317886352539062, "global_step": 8303, "epoch": 100} {"train_loss": -17.37311363220215, "global_step": 8304, "epoch": 100} {"train_loss": -17.546606063842773, "global_step": 8305, "epoch": 100} {"train_loss": -17.37960433959961, "global_step": 8306, "epoch": 100} {"train_loss": -17.659334182739258, "global_step": 8307, "epoch": 100} {"train_loss": -17.354145050048828, "global_step": 8308, "epoch": 100} {"train_loss": -17.31110382080078, "global_step": 8309, "epoch": 100} {"train_loss": -17.43012046813965, "global_step": 8310, "epoch": 100} {"train_loss": -17.437496185302734, "global_step": 8311, "epoch": 100} {"train_loss": -17.803218841552734, "global_step": 8312, "epoch": 100} {"train_loss": -17.18097496032715, "global_step": 8313, "epoch": 100} {"train_loss": -17.72083854675293, "global_step": 8314, "epoch": 100} {"train_loss": -17.440410614013672, "global_step": 8315, "epoch": 100} {"train_loss": -17.333927154541016, "global_step": 8316, "epoch": 100} {"train_loss": -17.486059188842773, "global_step": 8317, "epoch": 100} {"train_loss": -17.389476776123047, "global_step": 8318, "epoch": 100} {"train_loss": -17.69549560546875, "global_step": 8319, "epoch": 100} {"train_loss": -17.247806549072266, "global_step": 8320, "epoch": 100} {"train_loss": -17.45900535583496, "global_step": 8321, "epoch": 100} {"train_loss": -17.30136489868164, "global_step": 8322, "epoch": 100} {"train_loss": -17.278852462768555, "global_step": 8323, "epoch": 100} {"train_loss": -17.75812339782715, "global_step": 8324, "epoch": 100} {"train_loss": -17.651212692260742, "global_step": 8325, "epoch": 100} {"train_loss": -17.411500930786133, "global_step": 8326, "epoch": 100} {"train_loss": -17.32862663269043, "global_step": 8327, "epoch": 100} {"train_loss": -17.238548278808594, "global_step": 8328, "epoch": 100} {"train_loss": -17.552268981933594, "global_step": 8329, "epoch": 100} {"train_loss": -17.543771743774414, "global_step": 8330, "epoch": 100} {"train_loss": -17.641830444335938, "global_step": 8331, "epoch": 100} {"train_loss": -17.265722274780273, "global_step": 8332, "epoch": 100} {"train_loss": -17.597654342651367, "global_step": 8333, "epoch": 100} {"train_loss": -17.522388458251953, "global_step": 8334, "epoch": 100} {"train_loss": -17.366670608520508, "global_step": 8335, "epoch": 100} {"train_loss": -17.39082145690918, "global_step": 8336, "epoch": 100} {"train_loss": -17.51837158203125, "global_step": 8337, "epoch": 100} {"train_loss": -17.283361434936523, "global_step": 8338, "epoch": 100} {"train_loss": -16.996923446655273, "global_step": 8339, "epoch": 100} {"train_loss": -17.7526912689209, "global_step": 8340, "epoch": 100} {"train_loss": -17.59539222717285, "global_step": 8341, "epoch": 100} {"train_loss": -17.242258071899414, "global_step": 8342, "epoch": 100} {"train_loss": -17.590774536132812, "global_step": 8343, "epoch": 100} {"train_loss": -17.596906661987305, "global_step": 8344, "epoch": 100} {"train_loss": -17.46796226501465, "global_step": 8345, "epoch": 100} {"train_loss": -17.649677276611328, "global_step": 8346, "epoch": 100} {"train_loss": -17.48627281188965, "global_step": 8347, "epoch": 100} {"train_loss": -17.53916358947754, "global_step": 8348, "epoch": 100} {"train_loss": -17.571945190429688, "global_step": 8349, "epoch": 100} {"train_loss": -17.45694351196289, "global_step": 8350, "epoch": 100} {"train_loss": -17.438657760620117, "global_step": 8351, "epoch": 100} {"train_loss": -17.257190704345703, "global_step": 8352, "epoch": 100} {"train_loss": -17.339111328125, "global_step": 8353, "epoch": 100} {"train_loss": -17.52018165588379, "global_step": 8354, "epoch": 100} {"train_loss": -17.562637329101562, "global_step": 8355, "epoch": 100} {"train_loss": -17.516056060791016, "global_step": 8356, "epoch": 100} {"train_loss": -17.277179718017578, "global_step": 8357, "epoch": 100} {"train_loss": -17.468854904174805, "global_step": 8358, "epoch": 100} {"train_loss": -17.391199111938477, "global_step": 8359, "epoch": 100} {"train_loss": -17.446569442749023, "global_step": 8360, "epoch": 100} {"train_loss": -17.4235897064209, "global_step": 8361, "epoch": 100} {"train_loss": -16.848331451416016, "global_step": 8362, "epoch": 100} {"train_loss": -17.478485107421875, "global_step": 8363, "epoch": 100} {"train_loss": -17.351612091064453, "global_step": 8364, "epoch": 100} {"train_loss": -17.626142501831055, "global_step": 8365, "epoch": 100} {"train_loss": -17.462865829467773, "global_step": 8366, "epoch": 100} {"train_loss": -17.599931716918945, "global_step": 8367, "epoch": 100} {"train_loss": -16.87054443359375, "global_step": 8368, "epoch": 100} {"train_loss": -17.430509567260742, "global_step": 8369, "epoch": 100} {"train_loss": -17.503684997558594, "global_step": 8370, "epoch": 100} {"train_loss": -17.139080047607422, "global_step": 8371, "epoch": 100} {"train_loss": -17.776443481445312, "global_step": 8372, "epoch": 100} {"train_loss": -17.7518253326416, "global_step": 8373, "epoch": 100} {"train_loss": -17.51456642150879, "global_step": 8374, "epoch": 100} {"train_loss": -16.989839553833008, "global_step": 8375, "epoch": 100} {"train_loss": -16.973730087280273, "global_step": 8376, "epoch": 100} {"train_loss": -17.62067985534668, "global_step": 8377, "epoch": 100} {"train_loss": -17.500036239624023, "global_step": 8378, "epoch": 100} {"train_loss": -17.45599365234375, "global_step": 8379, "epoch": 100} {"train_loss": -17.254911422729492, "global_step": 8380, "epoch": 100} {"train_loss": -17.4090633392334, "global_step": 8381, "epoch": 100} {"train_loss": -17.434961824532014, "global_step": 8382, "epoch": 100, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 0.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.0, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.0, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.0, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 0.0, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.0, "train/mean_score": 0.0, "test/mean_score": 0.0, "val_loss": 6284586.0} {"train_loss": -17.361431121826172, "global_step": 8383, "epoch": 101} {"train_loss": -16.784515380859375, "global_step": 8384, "epoch": 101} {"train_loss": -17.517257690429688, "global_step": 8385, "epoch": 101} {"train_loss": -17.495559692382812, "global_step": 8386, "epoch": 101} {"train_loss": -17.022397994995117, "global_step": 8387, "epoch": 101} {"train_loss": -17.651355743408203, "global_step": 8388, "epoch": 101} {"train_loss": -17.333616256713867, "global_step": 8389, "epoch": 101} {"train_loss": -17.2605037689209, "global_step": 8390, "epoch": 101} {"train_loss": -17.329370498657227, "global_step": 8391, "epoch": 101} {"train_loss": -17.257043838500977, "global_step": 8392, "epoch": 101} {"train_loss": -17.292861938476562, "global_step": 8393, "epoch": 101} {"train_loss": -17.1778507232666, "global_step": 8394, "epoch": 101} {"train_loss": -17.212360382080078, "global_step": 8395, "epoch": 101} {"train_loss": -17.21099853515625, "global_step": 8396, "epoch": 101} {"train_loss": -17.600433349609375, "global_step": 8397, "epoch": 101} {"train_loss": -17.2645263671875, "global_step": 8398, "epoch": 101} {"train_loss": -17.22516441345215, "global_step": 8399, "epoch": 101} {"train_loss": -17.424245834350586, "global_step": 8400, "epoch": 101} {"train_loss": -17.353790283203125, "global_step": 8401, "epoch": 101} {"train_loss": -17.1677303314209, "global_step": 8402, "epoch": 101} {"train_loss": -17.33676528930664, "global_step": 8403, "epoch": 101} {"train_loss": -17.355701446533203, "global_step": 8404, "epoch": 101} {"train_loss": -17.31662368774414, "global_step": 8405, "epoch": 101} {"train_loss": -17.429349899291992, "global_step": 8406, "epoch": 101} {"train_loss": -17.282142639160156, "global_step": 8407, "epoch": 101} {"train_loss": -17.264150619506836, "global_step": 8408, "epoch": 101} {"train_loss": -17.636587142944336, "global_step": 8409, "epoch": 101} {"train_loss": -17.3789119720459, "global_step": 8410, "epoch": 101} {"train_loss": -17.002182006835938, "global_step": 8411, "epoch": 101} {"train_loss": -17.937641143798828, "global_step": 8412, "epoch": 101} {"train_loss": -17.583757400512695, "global_step": 8413, "epoch": 101} {"train_loss": -17.117231369018555, "global_step": 8414, "epoch": 101} {"train_loss": -18.038522720336914, "global_step": 8415, "epoch": 101} {"train_loss": -17.17255973815918, "global_step": 8416, "epoch": 101} {"train_loss": -17.738950729370117, "global_step": 8417, "epoch": 101} {"train_loss": -17.819570541381836, "global_step": 8418, "epoch": 101} {"train_loss": -17.49268913269043, "global_step": 8419, "epoch": 101} {"train_loss": -17.236562728881836, "global_step": 8420, "epoch": 101} {"train_loss": -17.55152702331543, "global_step": 8421, "epoch": 101} {"train_loss": -17.437610626220703, "global_step": 8422, "epoch": 101} {"train_loss": -17.39703941345215, "global_step": 8423, "epoch": 101} {"train_loss": -17.76166343688965, "global_step": 8424, "epoch": 101} {"train_loss": -17.603336334228516, "global_step": 8425, "epoch": 101} {"train_loss": -17.65620994567871, "global_step": 8426, "epoch": 101} {"train_loss": -17.8808536529541, "global_step": 8427, "epoch": 101} {"train_loss": -17.812393188476562, "global_step": 8428, "epoch": 101} {"train_loss": -17.212568283081055, "global_step": 8429, "epoch": 101} {"train_loss": -17.506467819213867, "global_step": 8430, "epoch": 101} {"train_loss": -17.595605850219727, "global_step": 8431, "epoch": 101} {"train_loss": -17.339574813842773, "global_step": 8432, "epoch": 101} {"train_loss": -17.297670364379883, "global_step": 8433, "epoch": 101} {"train_loss": -17.187334060668945, "global_step": 8434, "epoch": 101} {"train_loss": -17.47675132751465, "global_step": 8435, "epoch": 101} {"train_loss": -17.536043167114258, "global_step": 8436, "epoch": 101} {"train_loss": -17.607473373413086, "global_step": 8437, "epoch": 101} {"train_loss": -17.427793502807617, "global_step": 8438, "epoch": 101} {"train_loss": -17.29646873474121, "global_step": 8439, "epoch": 101} {"train_loss": -17.58320426940918, "global_step": 8440, "epoch": 101} {"train_loss": -17.73270034790039, "global_step": 8441, "epoch": 101} {"train_loss": -17.421518325805664, "global_step": 8442, "epoch": 101} {"train_loss": -17.38954734802246, "global_step": 8443, "epoch": 101} {"train_loss": -17.465883255004883, "global_step": 8444, "epoch": 101} {"train_loss": -17.363618850708008, "global_step": 8445, "epoch": 101} {"train_loss": -17.369632720947266, "global_step": 8446, "epoch": 101} {"train_loss": -17.748098373413086, "global_step": 8447, "epoch": 101} {"train_loss": -17.49504852294922, "global_step": 8448, "epoch": 101} {"train_loss": -17.53619956970215, "global_step": 8449, "epoch": 101} {"train_loss": -17.147855758666992, "global_step": 8450, "epoch": 101} {"train_loss": -17.460220336914062, "global_step": 8451, "epoch": 101} {"train_loss": -17.268896102905273, "global_step": 8452, "epoch": 101} {"train_loss": -17.686431884765625, "global_step": 8453, "epoch": 101} {"train_loss": -17.55953025817871, "global_step": 8454, "epoch": 101} {"train_loss": -17.606765747070312, "global_step": 8455, "epoch": 101} {"train_loss": -17.519468307495117, "global_step": 8456, "epoch": 101} {"train_loss": -17.155628204345703, "global_step": 8457, "epoch": 101} {"train_loss": -17.65057945251465, "global_step": 8458, "epoch": 101} {"train_loss": -17.436445236206055, "global_step": 8459, "epoch": 101} {"train_loss": -17.545141220092773, "global_step": 8460, "epoch": 101} {"train_loss": -17.174453735351562, "global_step": 8461, "epoch": 101} {"train_loss": -17.283857345581055, "global_step": 8462, "epoch": 101} {"train_loss": -17.43486213684082, "global_step": 8463, "epoch": 101} {"train_loss": -17.445449829101562, "global_step": 8464, "epoch": 101} {"train_loss": -17.445371168205536, "global_step": 8465, "epoch": 101, "val_loss": 6468897.5} {"train_loss": -17.058897018432617, "global_step": 8466, "epoch": 102} {"train_loss": -17.43855094909668, "global_step": 8467, "epoch": 102} {"train_loss": -17.331613540649414, "global_step": 8468, "epoch": 102} {"train_loss": -17.415693283081055, "global_step": 8469, "epoch": 102} {"train_loss": -16.942340850830078, "global_step": 8470, "epoch": 102} {"train_loss": -17.70491600036621, "global_step": 8471, "epoch": 102} {"train_loss": -17.087669372558594, "global_step": 8472, "epoch": 102} {"train_loss": -17.184703826904297, "global_step": 8473, "epoch": 102} {"train_loss": -17.053884506225586, "global_step": 8474, "epoch": 102} {"train_loss": -17.07986831665039, "global_step": 8475, "epoch": 102} {"train_loss": -17.260482788085938, "global_step": 8476, "epoch": 102} {"train_loss": -17.503971099853516, "global_step": 8477, "epoch": 102} {"train_loss": -17.458547592163086, "global_step": 8478, "epoch": 102} {"train_loss": -17.03321647644043, "global_step": 8479, "epoch": 102} {"train_loss": -17.318096160888672, "global_step": 8480, "epoch": 102} {"train_loss": -17.505277633666992, "global_step": 8481, "epoch": 102} {"train_loss": -17.071231842041016, "global_step": 8482, "epoch": 102} {"train_loss": -17.48417091369629, "global_step": 8483, "epoch": 102} {"train_loss": -17.64603614807129, "global_step": 8484, "epoch": 102} {"train_loss": -17.386722564697266, "global_step": 8485, "epoch": 102} {"train_loss": -17.190662384033203, "global_step": 8486, "epoch": 102} {"train_loss": -17.543546676635742, "global_step": 8487, "epoch": 102} {"train_loss": -17.19563865661621, "global_step": 8488, "epoch": 102} {"train_loss": -17.588138580322266, "global_step": 8489, "epoch": 102} {"train_loss": -17.35457992553711, "global_step": 8490, "epoch": 102} {"train_loss": -17.319438934326172, "global_step": 8491, "epoch": 102} {"train_loss": -17.60147476196289, "global_step": 8492, "epoch": 102} {"train_loss": -17.295969009399414, "global_step": 8493, "epoch": 102} {"train_loss": -17.4128360748291, "global_step": 8494, "epoch": 102} {"train_loss": -17.439966201782227, "global_step": 8495, "epoch": 102} {"train_loss": -17.2376708984375, "global_step": 8496, "epoch": 102} {"train_loss": -17.679906845092773, "global_step": 8497, "epoch": 102} {"train_loss": -17.156513214111328, "global_step": 8498, "epoch": 102} {"train_loss": -17.603116989135742, "global_step": 8499, "epoch": 102} {"train_loss": -17.141820907592773, "global_step": 8500, "epoch": 102} {"train_loss": -17.848413467407227, "global_step": 8501, "epoch": 102} {"train_loss": -17.39682388305664, "global_step": 8502, "epoch": 102} {"train_loss": -17.76891326904297, "global_step": 8503, "epoch": 102} {"train_loss": -17.144695281982422, "global_step": 8504, "epoch": 102} {"train_loss": -17.12831687927246, "global_step": 8505, "epoch": 102} {"train_loss": -17.263965606689453, "global_step": 8506, "epoch": 102} {"train_loss": -17.81896209716797, "global_step": 8507, "epoch": 102} {"train_loss": -17.224294662475586, "global_step": 8508, "epoch": 102} {"train_loss": -17.791318893432617, "global_step": 8509, "epoch": 102} {"train_loss": -17.547134399414062, "global_step": 8510, "epoch": 102} {"train_loss": -17.896963119506836, "global_step": 8511, "epoch": 102} {"train_loss": -17.503347396850586, "global_step": 8512, "epoch": 102} {"train_loss": -17.474056243896484, "global_step": 8513, "epoch": 102} {"train_loss": -17.464111328125, "global_step": 8514, "epoch": 102} {"train_loss": -17.54054832458496, "global_step": 8515, "epoch": 102} {"train_loss": -17.61403465270996, "global_step": 8516, "epoch": 102} {"train_loss": -17.47456169128418, "global_step": 8517, "epoch": 102} {"train_loss": -17.4864559173584, "global_step": 8518, "epoch": 102} {"train_loss": -17.99676513671875, "global_step": 8519, "epoch": 102} {"train_loss": -17.80818748474121, "global_step": 8520, "epoch": 102} {"train_loss": -17.787458419799805, "global_step": 8521, "epoch": 102} {"train_loss": -17.369150161743164, "global_step": 8522, "epoch": 102} {"train_loss": -17.321958541870117, "global_step": 8523, "epoch": 102} {"train_loss": -17.431180953979492, "global_step": 8524, "epoch": 102} {"train_loss": -17.55316162109375, "global_step": 8525, "epoch": 102} {"train_loss": -17.318199157714844, "global_step": 8526, "epoch": 102} {"train_loss": -17.337472915649414, "global_step": 8527, "epoch": 102} {"train_loss": -17.171966552734375, "global_step": 8528, "epoch": 102} {"train_loss": -17.274877548217773, "global_step": 8529, "epoch": 102} {"train_loss": -17.49407958984375, "global_step": 8530, "epoch": 102} {"train_loss": -17.539308547973633, "global_step": 8531, "epoch": 102} {"train_loss": -17.47418975830078, "global_step": 8532, "epoch": 102} {"train_loss": -17.549449920654297, "global_step": 8533, "epoch": 102} {"train_loss": -17.259166717529297, "global_step": 8534, "epoch": 102} {"train_loss": -17.49012565612793, "global_step": 8535, "epoch": 102} {"train_loss": -17.20392417907715, "global_step": 8536, "epoch": 102} {"train_loss": -17.5296688079834, "global_step": 8537, "epoch": 102} {"train_loss": -17.263141632080078, "global_step": 8538, "epoch": 102} {"train_loss": -17.348514556884766, "global_step": 8539, "epoch": 102} {"train_loss": -17.8143367767334, "global_step": 8540, "epoch": 102} {"train_loss": -17.679035186767578, "global_step": 8541, "epoch": 102} {"train_loss": -17.121732711791992, "global_step": 8542, "epoch": 102} {"train_loss": -17.686365127563477, "global_step": 8543, "epoch": 102} {"train_loss": -17.63169288635254, "global_step": 8544, "epoch": 102} {"train_loss": -17.33863067626953, "global_step": 8545, "epoch": 102} {"train_loss": -17.7003173828125, "global_step": 8546, "epoch": 102} {"train_loss": -17.33204460144043, "global_step": 8547, "epoch": 102} {"train_loss": -17.42515497322542, "global_step": 8548, "epoch": 102, "val_loss": 6221181.0} {"train_loss": -17.383520126342773, "global_step": 8549, "epoch": 103} {"train_loss": -17.2702579498291, "global_step": 8550, "epoch": 103} {"train_loss": -17.523279190063477, "global_step": 8551, "epoch": 103} {"train_loss": -17.5922908782959, "global_step": 8552, "epoch": 103} {"train_loss": -17.312673568725586, "global_step": 8553, "epoch": 103} {"train_loss": -17.47355079650879, "global_step": 8554, "epoch": 103} {"train_loss": -17.345258712768555, "global_step": 8555, "epoch": 103} {"train_loss": -17.670759201049805, "global_step": 8556, "epoch": 103} {"train_loss": -17.4876766204834, "global_step": 8557, "epoch": 103} {"train_loss": -17.410686492919922, "global_step": 8558, "epoch": 103} {"train_loss": -17.37367820739746, "global_step": 8559, "epoch": 103} {"train_loss": -16.988525390625, "global_step": 8560, "epoch": 103} {"train_loss": -17.40717887878418, "global_step": 8561, "epoch": 103} {"train_loss": -17.039005279541016, "global_step": 8562, "epoch": 103} {"train_loss": -17.564672470092773, "global_step": 8563, "epoch": 103} {"train_loss": -17.461408615112305, "global_step": 8564, "epoch": 103} {"train_loss": -17.44734764099121, "global_step": 8565, "epoch": 103} {"train_loss": -17.187070846557617, "global_step": 8566, "epoch": 103} {"train_loss": -17.693185806274414, "global_step": 8567, "epoch": 103} {"train_loss": -17.50924301147461, "global_step": 8568, "epoch": 103} {"train_loss": -17.631664276123047, "global_step": 8569, "epoch": 103} {"train_loss": -17.323719024658203, "global_step": 8570, "epoch": 103} {"train_loss": -17.597578048706055, "global_step": 8571, "epoch": 103} {"train_loss": -17.205991744995117, "global_step": 8572, "epoch": 103} {"train_loss": -17.139738082885742, "global_step": 8573, "epoch": 103} {"train_loss": -17.609973907470703, "global_step": 8574, "epoch": 103} {"train_loss": -17.817163467407227, "global_step": 8575, "epoch": 103} {"train_loss": -17.063077926635742, "global_step": 8576, "epoch": 103} {"train_loss": -17.23028564453125, "global_step": 8577, "epoch": 103} {"train_loss": -17.11138343811035, "global_step": 8578, "epoch": 103} {"train_loss": -17.863611221313477, "global_step": 8579, "epoch": 103} {"train_loss": -17.519567489624023, "global_step": 8580, "epoch": 103} {"train_loss": -17.40435218811035, "global_step": 8581, "epoch": 103} {"train_loss": -17.47149658203125, "global_step": 8582, "epoch": 103} {"train_loss": -17.379989624023438, "global_step": 8583, "epoch": 103} {"train_loss": -17.264114379882812, "global_step": 8584, "epoch": 103} {"train_loss": -17.299312591552734, "global_step": 8585, "epoch": 103} {"train_loss": -17.376501083374023, "global_step": 8586, "epoch": 103} {"train_loss": -17.564434051513672, "global_step": 8587, "epoch": 103} {"train_loss": -17.682830810546875, "global_step": 8588, "epoch": 103} {"train_loss": -17.527509689331055, "global_step": 8589, "epoch": 103} {"train_loss": -17.113187789916992, "global_step": 8590, "epoch": 103} {"train_loss": -16.952743530273438, "global_step": 8591, "epoch": 103} {"train_loss": -17.52044105529785, "global_step": 8592, "epoch": 103} {"train_loss": -17.694915771484375, "global_step": 8593, "epoch": 103} {"train_loss": -17.23801612854004, "global_step": 8594, "epoch": 103} {"train_loss": -17.38719940185547, "global_step": 8595, "epoch": 103} {"train_loss": -17.295316696166992, "global_step": 8596, "epoch": 103} {"train_loss": -17.390588760375977, "global_step": 8597, "epoch": 103} {"train_loss": -17.389371871948242, "global_step": 8598, "epoch": 103} {"train_loss": -17.41938591003418, "global_step": 8599, "epoch": 103} {"train_loss": -16.931400299072266, "global_step": 8600, "epoch": 103} {"train_loss": -17.41554069519043, "global_step": 8601, "epoch": 103} {"train_loss": -17.599973678588867, "global_step": 8602, "epoch": 103} {"train_loss": -17.43703269958496, "global_step": 8603, "epoch": 103} {"train_loss": -17.7187557220459, "global_step": 8604, "epoch": 103} {"train_loss": -17.734088897705078, "global_step": 8605, "epoch": 103} {"train_loss": -17.69025993347168, "global_step": 8606, "epoch": 103} {"train_loss": -17.770706176757812, "global_step": 8607, "epoch": 103} {"train_loss": -17.816564559936523, "global_step": 8608, "epoch": 103} {"train_loss": -17.683210372924805, "global_step": 8609, "epoch": 103} {"train_loss": -17.768335342407227, "global_step": 8610, "epoch": 103} {"train_loss": -17.808717727661133, "global_step": 8611, "epoch": 103} {"train_loss": -17.815811157226562, "global_step": 8612, "epoch": 103} {"train_loss": -17.646690368652344, "global_step": 8613, "epoch": 103} {"train_loss": -17.143259048461914, "global_step": 8614, "epoch": 103} {"train_loss": -17.56732749938965, "global_step": 8615, "epoch": 103} {"train_loss": -17.359861373901367, "global_step": 8616, "epoch": 103} {"train_loss": -17.510995864868164, "global_step": 8617, "epoch": 103} {"train_loss": -17.439794540405273, "global_step": 8618, "epoch": 103} {"train_loss": -17.588727951049805, "global_step": 8619, "epoch": 103} {"train_loss": -17.390243530273438, "global_step": 8620, "epoch": 103} {"train_loss": -16.706907272338867, "global_step": 8621, "epoch": 103} {"train_loss": -17.494905471801758, "global_step": 8622, "epoch": 103} {"train_loss": -17.40862464904785, "global_step": 8623, "epoch": 103} {"train_loss": -17.66827392578125, "global_step": 8624, "epoch": 103} {"train_loss": -17.49214744567871, "global_step": 8625, "epoch": 103} {"train_loss": -17.61020278930664, "global_step": 8626, "epoch": 103} {"train_loss": -17.518489837646484, "global_step": 8627, "epoch": 103} {"train_loss": -17.418399810791016, "global_step": 8628, "epoch": 103} {"train_loss": -17.667591094970703, "global_step": 8629, "epoch": 103} {"train_loss": -17.490415573120117, "global_step": 8630, "epoch": 103} {"train_loss": -17.47769792395902, "global_step": 8631, "epoch": 103, "val_loss": 6188851.0} {"train_loss": -17.40106773376465, "global_step": 8632, "epoch": 104} {"train_loss": -17.5396728515625, "global_step": 8633, "epoch": 104} {"train_loss": -17.43134880065918, "global_step": 8634, "epoch": 104} {"train_loss": -17.272783279418945, "global_step": 8635, "epoch": 104} {"train_loss": -17.434463500976562, "global_step": 8636, "epoch": 104} {"train_loss": -17.57929801940918, "global_step": 8637, "epoch": 104} {"train_loss": -17.6844539642334, "global_step": 8638, "epoch": 104} {"train_loss": -17.429412841796875, "global_step": 8639, "epoch": 104} {"train_loss": -16.628177642822266, "global_step": 8640, "epoch": 104} {"train_loss": -17.502025604248047, "global_step": 8641, "epoch": 104} {"train_loss": -17.286453247070312, "global_step": 8642, "epoch": 104} {"train_loss": -17.387678146362305, "global_step": 8643, "epoch": 104} {"train_loss": -17.391393661499023, "global_step": 8644, "epoch": 104} {"train_loss": -17.446866989135742, "global_step": 8645, "epoch": 104} {"train_loss": -17.223379135131836, "global_step": 8646, "epoch": 104} {"train_loss": -17.45314598083496, "global_step": 8647, "epoch": 104} {"train_loss": -17.874235153198242, "global_step": 8648, "epoch": 104} {"train_loss": -17.581058502197266, "global_step": 8649, "epoch": 104} {"train_loss": -17.07809829711914, "global_step": 8650, "epoch": 104} {"train_loss": -17.51303482055664, "global_step": 8651, "epoch": 104} {"train_loss": -17.675317764282227, "global_step": 8652, "epoch": 104} {"train_loss": -18.0741024017334, "global_step": 8653, "epoch": 104} {"train_loss": -17.315439224243164, "global_step": 8654, "epoch": 104} {"train_loss": -17.557485580444336, "global_step": 8655, "epoch": 104} {"train_loss": -17.932384490966797, "global_step": 8656, "epoch": 104} {"train_loss": -17.41670799255371, "global_step": 8657, "epoch": 104} {"train_loss": -17.979097366333008, "global_step": 8658, "epoch": 104} {"train_loss": -17.83315086364746, "global_step": 8659, "epoch": 104} {"train_loss": -17.675617218017578, "global_step": 8660, "epoch": 104} {"train_loss": -17.622970581054688, "global_step": 8661, "epoch": 104} {"train_loss": -17.3846492767334, "global_step": 8662, "epoch": 104} {"train_loss": -17.30600929260254, "global_step": 8663, "epoch": 104} {"train_loss": -17.633453369140625, "global_step": 8664, "epoch": 104} {"train_loss": -17.43781852722168, "global_step": 8665, "epoch": 104} {"train_loss": -17.77857780456543, "global_step": 8666, "epoch": 104} {"train_loss": -17.716114044189453, "global_step": 8667, "epoch": 104} {"train_loss": -17.33500099182129, "global_step": 8668, "epoch": 104} {"train_loss": -17.246536254882812, "global_step": 8669, "epoch": 104} {"train_loss": -17.456085205078125, "global_step": 8670, "epoch": 104} {"train_loss": -17.220468521118164, "global_step": 8671, "epoch": 104} {"train_loss": -17.578113555908203, "global_step": 8672, "epoch": 104} {"train_loss": -17.262292861938477, "global_step": 8673, "epoch": 104} {"train_loss": -17.440168380737305, "global_step": 8674, "epoch": 104} {"train_loss": -17.941150665283203, "global_step": 8675, "epoch": 104} {"train_loss": -17.21639633178711, "global_step": 8676, "epoch": 104} {"train_loss": -17.519800186157227, "global_step": 8677, "epoch": 104} {"train_loss": -17.156408309936523, "global_step": 8678, "epoch": 104} {"train_loss": -17.609344482421875, "global_step": 8679, "epoch": 104} {"train_loss": -17.67909049987793, "global_step": 8680, "epoch": 104} {"train_loss": -17.489118576049805, "global_step": 8681, "epoch": 104} {"train_loss": -17.42624282836914, "global_step": 8682, "epoch": 104} {"train_loss": -17.34478759765625, "global_step": 8683, "epoch": 104} {"train_loss": -17.73737144470215, "global_step": 8684, "epoch": 104} {"train_loss": -17.215465545654297, "global_step": 8685, "epoch": 104} {"train_loss": -17.121946334838867, "global_step": 8686, "epoch": 104} {"train_loss": -16.949316024780273, "global_step": 8687, "epoch": 104} {"train_loss": -17.425674438476562, "global_step": 8688, "epoch": 104} {"train_loss": -17.43047523498535, "global_step": 8689, "epoch": 104} {"train_loss": -17.636770248413086, "global_step": 8690, "epoch": 104} {"train_loss": -17.658323287963867, "global_step": 8691, "epoch": 104} {"train_loss": -17.445148468017578, "global_step": 8692, "epoch": 104} {"train_loss": -17.58321762084961, "global_step": 8693, "epoch": 104} {"train_loss": -17.414167404174805, "global_step": 8694, "epoch": 104} {"train_loss": -17.36089515686035, "global_step": 8695, "epoch": 104} {"train_loss": -17.476503372192383, "global_step": 8696, "epoch": 104} {"train_loss": -17.064496994018555, "global_step": 8697, "epoch": 104} {"train_loss": -17.591693878173828, "global_step": 8698, "epoch": 104} {"train_loss": -17.251440048217773, "global_step": 8699, "epoch": 104} {"train_loss": -17.500822067260742, "global_step": 8700, "epoch": 104} {"train_loss": -17.9149169921875, "global_step": 8701, "epoch": 104} {"train_loss": -17.84819221496582, "global_step": 8702, "epoch": 104} {"train_loss": -17.40821647644043, "global_step": 8703, "epoch": 104} {"train_loss": -17.54183006286621, "global_step": 8704, "epoch": 104} {"train_loss": -17.3284854888916, "global_step": 8705, "epoch": 104} {"train_loss": -17.51948356628418, "global_step": 8706, "epoch": 104} {"train_loss": -17.384206771850586, "global_step": 8707, "epoch": 104} {"train_loss": -17.814285278320312, "global_step": 8708, "epoch": 104} {"train_loss": -17.639738082885742, "global_step": 8709, "epoch": 104} {"train_loss": -17.563093185424805, "global_step": 8710, "epoch": 104} {"train_loss": -17.56215476989746, "global_step": 8711, "epoch": 104} {"train_loss": -17.671918869018555, "global_step": 8712, "epoch": 104} {"train_loss": -17.360525131225586, "global_step": 8713, "epoch": 104} {"train_loss": -17.493764601558087, "global_step": 8714, "epoch": 104, "val_loss": 6341163.5} {"train_loss": -17.08414649963379, "global_step": 8715, "epoch": 105} {"train_loss": -17.289724349975586, "global_step": 8716, "epoch": 105} {"train_loss": -17.39154052734375, "global_step": 8717, "epoch": 105} {"train_loss": -17.16303062438965, "global_step": 8718, "epoch": 105} {"train_loss": -17.5245418548584, "global_step": 8719, "epoch": 105} {"train_loss": -17.587045669555664, "global_step": 8720, "epoch": 105} {"train_loss": -17.18743896484375, "global_step": 8721, "epoch": 105} {"train_loss": -17.19647789001465, "global_step": 8722, "epoch": 105} {"train_loss": -17.7255916595459, "global_step": 8723, "epoch": 105} {"train_loss": -17.347192764282227, "global_step": 8724, "epoch": 105} {"train_loss": -17.310171127319336, "global_step": 8725, "epoch": 105} {"train_loss": -17.42805290222168, "global_step": 8726, "epoch": 105} {"train_loss": -17.042186737060547, "global_step": 8727, "epoch": 105} {"train_loss": -17.490398406982422, "global_step": 8728, "epoch": 105} {"train_loss": -17.483692169189453, "global_step": 8729, "epoch": 105} {"train_loss": -17.429059982299805, "global_step": 8730, "epoch": 105} {"train_loss": -17.67405891418457, "global_step": 8731, "epoch": 105} {"train_loss": -17.662168502807617, "global_step": 8732, "epoch": 105} {"train_loss": -17.586956024169922, "global_step": 8733, "epoch": 105} {"train_loss": -17.565868377685547, "global_step": 8734, "epoch": 105} {"train_loss": -17.673044204711914, "global_step": 8735, "epoch": 105} {"train_loss": -17.5550594329834, "global_step": 8736, "epoch": 105} {"train_loss": -17.395401000976562, "global_step": 8737, "epoch": 105} {"train_loss": -17.348745346069336, "global_step": 8738, "epoch": 105} {"train_loss": -17.18662452697754, "global_step": 8739, "epoch": 105} {"train_loss": -17.376623153686523, "global_step": 8740, "epoch": 105} {"train_loss": -17.53377342224121, "global_step": 8741, "epoch": 105} {"train_loss": -17.3055362701416, "global_step": 8742, "epoch": 105} {"train_loss": -17.4486026763916, "global_step": 8743, "epoch": 105} {"train_loss": -17.530221939086914, "global_step": 8744, "epoch": 105} {"train_loss": -17.547590255737305, "global_step": 8745, "epoch": 105} {"train_loss": -17.799728393554688, "global_step": 8746, "epoch": 105} {"train_loss": -17.780323028564453, "global_step": 8747, "epoch": 105} {"train_loss": -17.2439022064209, "global_step": 8748, "epoch": 105} {"train_loss": -17.730615615844727, "global_step": 8749, "epoch": 105} {"train_loss": -17.671964645385742, "global_step": 8750, "epoch": 105} {"train_loss": -17.52010154724121, "global_step": 8751, "epoch": 105} {"train_loss": -17.30182456970215, "global_step": 8752, "epoch": 105} {"train_loss": -17.44539451599121, "global_step": 8753, "epoch": 105} {"train_loss": -17.68641471862793, "global_step": 8754, "epoch": 105} {"train_loss": -17.44870948791504, "global_step": 8755, "epoch": 105} {"train_loss": -17.227031707763672, "global_step": 8756, "epoch": 105} {"train_loss": -17.642776489257812, "global_step": 8757, "epoch": 105} {"train_loss": -17.35770034790039, "global_step": 8758, "epoch": 105} {"train_loss": -17.765140533447266, "global_step": 8759, "epoch": 105} {"train_loss": -17.303251266479492, "global_step": 8760, "epoch": 105} {"train_loss": -17.69724464416504, "global_step": 8761, "epoch": 105} {"train_loss": -17.269371032714844, "global_step": 8762, "epoch": 105} {"train_loss": -17.780385971069336, "global_step": 8763, "epoch": 105} {"train_loss": -16.607620239257812, "global_step": 8764, "epoch": 105} {"train_loss": -17.701322555541992, "global_step": 8765, "epoch": 105} {"train_loss": -17.058042526245117, "global_step": 8766, "epoch": 105} {"train_loss": -17.374286651611328, "global_step": 8767, "epoch": 105} {"train_loss": -17.634347915649414, "global_step": 8768, "epoch": 105} {"train_loss": -17.641616821289062, "global_step": 8769, "epoch": 105} {"train_loss": -17.167945861816406, "global_step": 8770, "epoch": 105} {"train_loss": -17.283048629760742, "global_step": 8771, "epoch": 105} {"train_loss": -17.270933151245117, "global_step": 8772, "epoch": 105} {"train_loss": -17.343751907348633, "global_step": 8773, "epoch": 105} {"train_loss": -17.389297485351562, "global_step": 8774, "epoch": 105} {"train_loss": -17.315519332885742, "global_step": 8775, "epoch": 105} {"train_loss": -17.682758331298828, "global_step": 8776, "epoch": 105} {"train_loss": -17.443092346191406, "global_step": 8777, "epoch": 105} {"train_loss": -17.422100067138672, "global_step": 8778, "epoch": 105} {"train_loss": -17.03192138671875, "global_step": 8779, "epoch": 105} {"train_loss": -17.337879180908203, "global_step": 8780, "epoch": 105} {"train_loss": -17.297452926635742, "global_step": 8781, "epoch": 105} {"train_loss": -17.239818572998047, "global_step": 8782, "epoch": 105} {"train_loss": -17.590002059936523, "global_step": 8783, "epoch": 105} {"train_loss": -17.485443115234375, "global_step": 8784, "epoch": 105} {"train_loss": -17.540128707885742, "global_step": 8785, "epoch": 105} {"train_loss": -17.74610710144043, "global_step": 8786, "epoch": 105} {"train_loss": -17.982999801635742, "global_step": 8787, "epoch": 105} {"train_loss": -17.45037841796875, "global_step": 8788, "epoch": 105} {"train_loss": -17.525976181030273, "global_step": 8789, "epoch": 105} {"train_loss": -17.16263771057129, "global_step": 8790, "epoch": 105} {"train_loss": -17.655689239501953, "global_step": 8791, "epoch": 105} {"train_loss": -17.49519157409668, "global_step": 8792, "epoch": 105} {"train_loss": -17.63106918334961, "global_step": 8793, "epoch": 105} {"train_loss": -17.522605895996094, "global_step": 8794, "epoch": 105} {"train_loss": -17.184864044189453, "global_step": 8795, "epoch": 105} {"train_loss": -17.627056121826172, "global_step": 8796, "epoch": 105} {"train_loss": -17.45220368167004, "global_step": 8797, "epoch": 105, "val_loss": 6389768.0} {"train_loss": -17.555646896362305, "global_step": 8798, "epoch": 106} {"train_loss": -17.28498649597168, "global_step": 8799, "epoch": 106} {"train_loss": -17.775009155273438, "global_step": 8800, "epoch": 106} {"train_loss": -17.829809188842773, "global_step": 8801, "epoch": 106} {"train_loss": -17.01898193359375, "global_step": 8802, "epoch": 106} {"train_loss": -17.4151668548584, "global_step": 8803, "epoch": 106} {"train_loss": -17.339475631713867, "global_step": 8804, "epoch": 106} {"train_loss": -17.327733993530273, "global_step": 8805, "epoch": 106} {"train_loss": -17.42433738708496, "global_step": 8806, "epoch": 106} {"train_loss": -17.2155818939209, "global_step": 8807, "epoch": 106} {"train_loss": -17.672595977783203, "global_step": 8808, "epoch": 106} {"train_loss": -17.445236206054688, "global_step": 8809, "epoch": 106} {"train_loss": -17.423490524291992, "global_step": 8810, "epoch": 106} {"train_loss": -17.63492774963379, "global_step": 8811, "epoch": 106} {"train_loss": -17.630794525146484, "global_step": 8812, "epoch": 106} {"train_loss": -17.108102798461914, "global_step": 8813, "epoch": 106} {"train_loss": -17.37417984008789, "global_step": 8814, "epoch": 106} {"train_loss": -17.572336196899414, "global_step": 8815, "epoch": 106} {"train_loss": -17.98484230041504, "global_step": 8816, "epoch": 106} {"train_loss": -17.813919067382812, "global_step": 8817, "epoch": 106} {"train_loss": -17.511816024780273, "global_step": 8818, "epoch": 106} {"train_loss": -17.441547393798828, "global_step": 8819, "epoch": 106} {"train_loss": -17.14686393737793, "global_step": 8820, "epoch": 106} {"train_loss": -17.52141761779785, "global_step": 8821, "epoch": 106} {"train_loss": -17.68202781677246, "global_step": 8822, "epoch": 106} {"train_loss": -17.586200714111328, "global_step": 8823, "epoch": 106} {"train_loss": -17.60184097290039, "global_step": 8824, "epoch": 106} {"train_loss": -17.667951583862305, "global_step": 8825, "epoch": 106} {"train_loss": -17.18427848815918, "global_step": 8826, "epoch": 106} {"train_loss": -17.320791244506836, "global_step": 8827, "epoch": 106} {"train_loss": -17.071941375732422, "global_step": 8828, "epoch": 106} {"train_loss": -17.615524291992188, "global_step": 8829, "epoch": 106} {"train_loss": -17.470169067382812, "global_step": 8830, "epoch": 106} {"train_loss": -17.35824966430664, "global_step": 8831, "epoch": 106} {"train_loss": -18.11782455444336, "global_step": 8832, "epoch": 106} {"train_loss": -17.214191436767578, "global_step": 8833, "epoch": 106} {"train_loss": -17.427371978759766, "global_step": 8834, "epoch": 106} {"train_loss": -17.552108764648438, "global_step": 8835, "epoch": 106} {"train_loss": -17.540403366088867, "global_step": 8836, "epoch": 106} {"train_loss": -17.44539451599121, "global_step": 8837, "epoch": 106} {"train_loss": -17.347837448120117, "global_step": 8838, "epoch": 106} {"train_loss": -17.311439514160156, "global_step": 8839, "epoch": 106} {"train_loss": -17.78433609008789, "global_step": 8840, "epoch": 106} {"train_loss": -17.44501304626465, "global_step": 8841, "epoch": 106} {"train_loss": -17.56345558166504, "global_step": 8842, "epoch": 106} {"train_loss": -17.282529830932617, "global_step": 8843, "epoch": 106} {"train_loss": -17.248422622680664, "global_step": 8844, "epoch": 106} {"train_loss": -17.83599281311035, "global_step": 8845, "epoch": 106} {"train_loss": -17.25051498413086, "global_step": 8846, "epoch": 106} {"train_loss": -17.64423942565918, "global_step": 8847, "epoch": 106} {"train_loss": -17.459325790405273, "global_step": 8848, "epoch": 106} {"train_loss": -17.76932716369629, "global_step": 8849, "epoch": 106} {"train_loss": -17.535093307495117, "global_step": 8850, "epoch": 106} {"train_loss": -17.388532638549805, "global_step": 8851, "epoch": 106} {"train_loss": -17.345197677612305, "global_step": 8852, "epoch": 106} {"train_loss": -17.614713668823242, "global_step": 8853, "epoch": 106} {"train_loss": -17.641918182373047, "global_step": 8854, "epoch": 106} {"train_loss": -17.252042770385742, "global_step": 8855, "epoch": 106} {"train_loss": -17.594995498657227, "global_step": 8856, "epoch": 106} {"train_loss": -18.02808952331543, "global_step": 8857, "epoch": 106} {"train_loss": -17.275192260742188, "global_step": 8858, "epoch": 106} {"train_loss": -17.77986717224121, "global_step": 8859, "epoch": 106} {"train_loss": -17.025753021240234, "global_step": 8860, "epoch": 106} {"train_loss": -17.700891494750977, "global_step": 8861, "epoch": 106} {"train_loss": -17.502716064453125, "global_step": 8862, "epoch": 106} {"train_loss": -17.386030197143555, "global_step": 8863, "epoch": 106} {"train_loss": -18.101999282836914, "global_step": 8864, "epoch": 106} {"train_loss": -17.56727409362793, "global_step": 8865, "epoch": 106} {"train_loss": -17.476022720336914, "global_step": 8866, "epoch": 106} {"train_loss": -17.15380859375, "global_step": 8867, "epoch": 106} {"train_loss": -17.617992401123047, "global_step": 8868, "epoch": 106} {"train_loss": -17.623144149780273, "global_step": 8869, "epoch": 106} {"train_loss": -17.588300704956055, "global_step": 8870, "epoch": 106} {"train_loss": -17.408716201782227, "global_step": 8871, "epoch": 106} {"train_loss": -17.396902084350586, "global_step": 8872, "epoch": 106} {"train_loss": -17.636493682861328, "global_step": 8873, "epoch": 106} {"train_loss": -17.31722068786621, "global_step": 8874, "epoch": 106} {"train_loss": -17.424327850341797, "global_step": 8875, "epoch": 106} {"train_loss": -17.323049545288086, "global_step": 8876, "epoch": 106} {"train_loss": -17.568021774291992, "global_step": 8877, "epoch": 106} {"train_loss": -17.458410263061523, "global_step": 8878, "epoch": 106} {"train_loss": -17.453567504882812, "global_step": 8879, "epoch": 106} {"train_loss": -17.474778083433588, "global_step": 8880, "epoch": 106, "val_loss": 6291483.0} {"train_loss": -17.25217056274414, "global_step": 8881, "epoch": 107} {"train_loss": -16.813541412353516, "global_step": 8882, "epoch": 107} {"train_loss": -17.375308990478516, "global_step": 8883, "epoch": 107} {"train_loss": -17.67800521850586, "global_step": 8884, "epoch": 107} {"train_loss": -17.68638038635254, "global_step": 8885, "epoch": 107} {"train_loss": -17.486501693725586, "global_step": 8886, "epoch": 107} {"train_loss": -17.1953125, "global_step": 8887, "epoch": 107} {"train_loss": -17.471546173095703, "global_step": 8888, "epoch": 107} {"train_loss": -17.228788375854492, "global_step": 8889, "epoch": 107} {"train_loss": -17.318090438842773, "global_step": 8890, "epoch": 107} {"train_loss": -17.432464599609375, "global_step": 8891, "epoch": 107} {"train_loss": -17.55972671508789, "global_step": 8892, "epoch": 107} {"train_loss": -17.580533981323242, "global_step": 8893, "epoch": 107} {"train_loss": -16.878751754760742, "global_step": 8894, "epoch": 107} {"train_loss": -17.400136947631836, "global_step": 8895, "epoch": 107} {"train_loss": -17.093839645385742, "global_step": 8896, "epoch": 107} {"train_loss": -17.067859649658203, "global_step": 8897, "epoch": 107} {"train_loss": -17.8929500579834, "global_step": 8898, "epoch": 107} {"train_loss": -17.6474552154541, "global_step": 8899, "epoch": 107} {"train_loss": -17.780630111694336, "global_step": 8900, "epoch": 107} {"train_loss": -17.57489776611328, "global_step": 8901, "epoch": 107} {"train_loss": -17.424901962280273, "global_step": 8902, "epoch": 107} {"train_loss": -17.648462295532227, "global_step": 8903, "epoch": 107} {"train_loss": -17.733774185180664, "global_step": 8904, "epoch": 107} {"train_loss": -17.141035079956055, "global_step": 8905, "epoch": 107} {"train_loss": -17.455263137817383, "global_step": 8906, "epoch": 107} {"train_loss": -17.317306518554688, "global_step": 8907, "epoch": 107} {"train_loss": -17.290512084960938, "global_step": 8908, "epoch": 107} {"train_loss": -17.5161075592041, "global_step": 8909, "epoch": 107} {"train_loss": -17.62906837463379, "global_step": 8910, "epoch": 107} {"train_loss": -17.741079330444336, "global_step": 8911, "epoch": 107} {"train_loss": -17.529077529907227, "global_step": 8912, "epoch": 107} {"train_loss": -17.44132423400879, "global_step": 8913, "epoch": 107} {"train_loss": -17.485652923583984, "global_step": 8914, "epoch": 107} {"train_loss": -17.81559181213379, "global_step": 8915, "epoch": 107} {"train_loss": -17.435226440429688, "global_step": 8916, "epoch": 107} {"train_loss": -17.273193359375, "global_step": 8917, "epoch": 107} {"train_loss": -17.138559341430664, "global_step": 8918, "epoch": 107} {"train_loss": -17.24667739868164, "global_step": 8919, "epoch": 107} {"train_loss": -17.19976234436035, "global_step": 8920, "epoch": 107} {"train_loss": -17.6467342376709, "global_step": 8921, "epoch": 107} {"train_loss": -17.485092163085938, "global_step": 8922, "epoch": 107} {"train_loss": -17.523035049438477, "global_step": 8923, "epoch": 107} {"train_loss": -17.52716636657715, "global_step": 8924, "epoch": 107} {"train_loss": -18.17405128479004, "global_step": 8925, "epoch": 107} {"train_loss": -17.58989715576172, "global_step": 8926, "epoch": 107} {"train_loss": -17.637542724609375, "global_step": 8927, "epoch": 107} {"train_loss": -17.662216186523438, "global_step": 8928, "epoch": 107} {"train_loss": -17.434255599975586, "global_step": 8929, "epoch": 107} {"train_loss": -17.7386417388916, "global_step": 8930, "epoch": 107} {"train_loss": -17.22092628479004, "global_step": 8931, "epoch": 107} {"train_loss": -17.357120513916016, "global_step": 8932, "epoch": 107} {"train_loss": -17.411592483520508, "global_step": 8933, "epoch": 107} {"train_loss": -17.311742782592773, "global_step": 8934, "epoch": 107} {"train_loss": -17.69679069519043, "global_step": 8935, "epoch": 107} {"train_loss": -17.478185653686523, "global_step": 8936, "epoch": 107} {"train_loss": -17.623126983642578, "global_step": 8937, "epoch": 107} {"train_loss": -17.511417388916016, "global_step": 8938, "epoch": 107} {"train_loss": -17.654626846313477, "global_step": 8939, "epoch": 107} {"train_loss": -17.56892967224121, "global_step": 8940, "epoch": 107} {"train_loss": -17.41999053955078, "global_step": 8941, "epoch": 107} {"train_loss": -17.663162231445312, "global_step": 8942, "epoch": 107} {"train_loss": -17.49016761779785, "global_step": 8943, "epoch": 107} {"train_loss": -17.706384658813477, "global_step": 8944, "epoch": 107} {"train_loss": -17.991626739501953, "global_step": 8945, "epoch": 107} {"train_loss": -17.7280216217041, "global_step": 8946, "epoch": 107} {"train_loss": -17.45334815979004, "global_step": 8947, "epoch": 107} {"train_loss": -17.472126007080078, "global_step": 8948, "epoch": 107} {"train_loss": -17.59841537475586, "global_step": 8949, "epoch": 107} {"train_loss": -17.3140869140625, "global_step": 8950, "epoch": 107} {"train_loss": -17.09193229675293, "global_step": 8951, "epoch": 107} {"train_loss": -17.087644577026367, "global_step": 8952, "epoch": 107} {"train_loss": -17.678342819213867, "global_step": 8953, "epoch": 107} {"train_loss": -17.352005004882812, "global_step": 8954, "epoch": 107} {"train_loss": -17.63031005859375, "global_step": 8955, "epoch": 107} {"train_loss": -17.328964233398438, "global_step": 8956, "epoch": 107} {"train_loss": -17.51651382446289, "global_step": 8957, "epoch": 107} {"train_loss": -17.384052276611328, "global_step": 8958, "epoch": 107} {"train_loss": -17.326139450073242, "global_step": 8959, "epoch": 107} {"train_loss": -17.34619140625, "global_step": 8960, "epoch": 107} {"train_loss": -17.702199935913086, "global_step": 8961, "epoch": 107} {"train_loss": -17.464975357055664, "global_step": 8962, "epoch": 107} {"train_loss": -17.491497177675544, "global_step": 8963, "epoch": 107, "val_loss": 6158991.0} {"train_loss": -17.301755905151367, "global_step": 8964, "epoch": 108} {"train_loss": -17.69894790649414, "global_step": 8965, "epoch": 108} {"train_loss": -17.28898811340332, "global_step": 8966, "epoch": 108} {"train_loss": -17.355304718017578, "global_step": 8967, "epoch": 108} {"train_loss": -17.877120971679688, "global_step": 8968, "epoch": 108} {"train_loss": -17.457618713378906, "global_step": 8969, "epoch": 108} {"train_loss": -17.429746627807617, "global_step": 8970, "epoch": 108} {"train_loss": -16.973546981811523, "global_step": 8971, "epoch": 108} {"train_loss": -17.643545150756836, "global_step": 8972, "epoch": 108} {"train_loss": -17.440351486206055, "global_step": 8973, "epoch": 108} {"train_loss": -17.88453483581543, "global_step": 8974, "epoch": 108} {"train_loss": -17.546966552734375, "global_step": 8975, "epoch": 108} {"train_loss": -17.89585304260254, "global_step": 8976, "epoch": 108} {"train_loss": -17.44321632385254, "global_step": 8977, "epoch": 108} {"train_loss": -17.434463500976562, "global_step": 8978, "epoch": 108} {"train_loss": -17.605331420898438, "global_step": 8979, "epoch": 108} {"train_loss": -17.310949325561523, "global_step": 8980, "epoch": 108} {"train_loss": -17.49671745300293, "global_step": 8981, "epoch": 108} {"train_loss": -17.147001266479492, "global_step": 8982, "epoch": 108} {"train_loss": -17.709606170654297, "global_step": 8983, "epoch": 108} {"train_loss": -17.518741607666016, "global_step": 8984, "epoch": 108} {"train_loss": -17.577293395996094, "global_step": 8985, "epoch": 108} {"train_loss": -17.50313377380371, "global_step": 8986, "epoch": 108} {"train_loss": -17.49835968017578, "global_step": 8987, "epoch": 108} {"train_loss": -17.55858039855957, "global_step": 8988, "epoch": 108} {"train_loss": -17.849294662475586, "global_step": 8989, "epoch": 108} {"train_loss": -17.203567504882812, "global_step": 8990, "epoch": 108} {"train_loss": -17.612594604492188, "global_step": 8991, "epoch": 108} {"train_loss": -17.72757911682129, "global_step": 8992, "epoch": 108} {"train_loss": -17.42449378967285, "global_step": 8993, "epoch": 108} {"train_loss": -17.518558502197266, "global_step": 8994, "epoch": 108} {"train_loss": -17.543073654174805, "global_step": 8995, "epoch": 108} {"train_loss": -17.695520401000977, "global_step": 8996, "epoch": 108} {"train_loss": -17.768375396728516, "global_step": 8997, "epoch": 108} {"train_loss": -17.331436157226562, "global_step": 8998, "epoch": 108} {"train_loss": -16.903549194335938, "global_step": 8999, "epoch": 108} {"train_loss": -17.846681594848633, "global_step": 9000, "epoch": 108} {"train_loss": -17.47383689880371, "global_step": 9001, "epoch": 108} {"train_loss": -17.659069061279297, "global_step": 9002, "epoch": 108} {"train_loss": -17.644412994384766, "global_step": 9003, "epoch": 108} {"train_loss": -17.498586654663086, "global_step": 9004, "epoch": 108} {"train_loss": -17.51424217224121, "global_step": 9005, "epoch": 108} {"train_loss": -17.575315475463867, "global_step": 9006, "epoch": 108} {"train_loss": -17.7335262298584, "global_step": 9007, "epoch": 108} {"train_loss": -17.460229873657227, "global_step": 9008, "epoch": 108} {"train_loss": -17.39012908935547, "global_step": 9009, "epoch": 108} {"train_loss": -17.62093734741211, "global_step": 9010, "epoch": 108} {"train_loss": -17.11041831970215, "global_step": 9011, "epoch": 108} {"train_loss": -17.117910385131836, "global_step": 9012, "epoch": 108} {"train_loss": -17.563020706176758, "global_step": 9013, "epoch": 108} {"train_loss": -17.985897064208984, "global_step": 9014, "epoch": 108} {"train_loss": -17.055288314819336, "global_step": 9015, "epoch": 108} {"train_loss": -17.68116569519043, "global_step": 9016, "epoch": 108} {"train_loss": -17.1718807220459, "global_step": 9017, "epoch": 108} {"train_loss": -17.703824996948242, "global_step": 9018, "epoch": 108} {"train_loss": -17.729673385620117, "global_step": 9019, "epoch": 108} {"train_loss": -17.865629196166992, "global_step": 9020, "epoch": 108} {"train_loss": -17.641826629638672, "global_step": 9021, "epoch": 108} {"train_loss": -17.517578125, "global_step": 9022, "epoch": 108} {"train_loss": -17.851245880126953, "global_step": 9023, "epoch": 108} {"train_loss": -17.580114364624023, "global_step": 9024, "epoch": 108} {"train_loss": -17.33679962158203, "global_step": 9025, "epoch": 108} {"train_loss": -17.986543655395508, "global_step": 9026, "epoch": 108} {"train_loss": -17.929418563842773, "global_step": 9027, "epoch": 108} {"train_loss": -17.669767379760742, "global_step": 9028, "epoch": 108} {"train_loss": -17.654577255249023, "global_step": 9029, "epoch": 108} {"train_loss": -17.3867244720459, "global_step": 9030, "epoch": 108} {"train_loss": -17.48299789428711, "global_step": 9031, "epoch": 108} {"train_loss": -17.67045021057129, "global_step": 9032, "epoch": 108} {"train_loss": -17.28645896911621, "global_step": 9033, "epoch": 108} {"train_loss": -17.441728591918945, "global_step": 9034, "epoch": 108} {"train_loss": -17.60845947265625, "global_step": 9035, "epoch": 108} {"train_loss": -17.3780574798584, "global_step": 9036, "epoch": 108} {"train_loss": -17.321060180664062, "global_step": 9037, "epoch": 108} {"train_loss": -17.37129783630371, "global_step": 9038, "epoch": 108} {"train_loss": -17.807235717773438, "global_step": 9039, "epoch": 108} {"train_loss": -17.591672897338867, "global_step": 9040, "epoch": 108} {"train_loss": -17.09830093383789, "global_step": 9041, "epoch": 108} {"train_loss": -17.141427993774414, "global_step": 9042, "epoch": 108} {"train_loss": -17.559799194335938, "global_step": 9043, "epoch": 108} {"train_loss": -17.05891990661621, "global_step": 9044, "epoch": 108} {"train_loss": -17.57594871520996, "global_step": 9045, "epoch": 108} {"train_loss": -17.50882435993976, "global_step": 9046, "epoch": 108, "val_loss": 6116555.0} {"train_loss": -17.899778366088867, "global_step": 9047, "epoch": 109} {"train_loss": -17.426698684692383, "global_step": 9048, "epoch": 109} {"train_loss": -17.44866180419922, "global_step": 9049, "epoch": 109} {"train_loss": -16.970914840698242, "global_step": 9050, "epoch": 109} {"train_loss": -17.193967819213867, "global_step": 9051, "epoch": 109} {"train_loss": -17.633790969848633, "global_step": 9052, "epoch": 109} {"train_loss": -17.70798683166504, "global_step": 9053, "epoch": 109} {"train_loss": -17.464542388916016, "global_step": 9054, "epoch": 109} {"train_loss": -17.4415283203125, "global_step": 9055, "epoch": 109} {"train_loss": -17.717132568359375, "global_step": 9056, "epoch": 109} {"train_loss": -17.368345260620117, "global_step": 9057, "epoch": 109} {"train_loss": -17.246774673461914, "global_step": 9058, "epoch": 109} {"train_loss": -17.4100399017334, "global_step": 9059, "epoch": 109} {"train_loss": -17.676801681518555, "global_step": 9060, "epoch": 109} {"train_loss": -17.905426025390625, "global_step": 9061, "epoch": 109} {"train_loss": -17.20511245727539, "global_step": 9062, "epoch": 109} {"train_loss": -16.981748580932617, "global_step": 9063, "epoch": 109} {"train_loss": -17.54244041442871, "global_step": 9064, "epoch": 109} {"train_loss": -17.26338768005371, "global_step": 9065, "epoch": 109} {"train_loss": -17.440689086914062, "global_step": 9066, "epoch": 109} {"train_loss": -17.921812057495117, "global_step": 9067, "epoch": 109} {"train_loss": -17.52852439880371, "global_step": 9068, "epoch": 109} {"train_loss": -17.567138671875, "global_step": 9069, "epoch": 109} {"train_loss": -17.70207977294922, "global_step": 9070, "epoch": 109} {"train_loss": -17.280672073364258, "global_step": 9071, "epoch": 109} {"train_loss": -17.232057571411133, "global_step": 9072, "epoch": 109} {"train_loss": -17.293750762939453, "global_step": 9073, "epoch": 109} {"train_loss": -17.61404037475586, "global_step": 9074, "epoch": 109} {"train_loss": -17.57154655456543, "global_step": 9075, "epoch": 109} {"train_loss": -17.198928833007812, "global_step": 9076, "epoch": 109} {"train_loss": -17.289365768432617, "global_step": 9077, "epoch": 109} {"train_loss": -17.56830596923828, "global_step": 9078, "epoch": 109} {"train_loss": -17.722259521484375, "global_step": 9079, "epoch": 109} {"train_loss": -17.91304588317871, "global_step": 9080, "epoch": 109} {"train_loss": -17.783994674682617, "global_step": 9081, "epoch": 109} {"train_loss": -17.4276180267334, "global_step": 9082, "epoch": 109} {"train_loss": -17.475996017456055, "global_step": 9083, "epoch": 109} {"train_loss": -17.571264266967773, "global_step": 9084, "epoch": 109} {"train_loss": -17.67656707763672, "global_step": 9085, "epoch": 109} {"train_loss": -17.804929733276367, "global_step": 9086, "epoch": 109} {"train_loss": -17.458162307739258, "global_step": 9087, "epoch": 109} {"train_loss": -17.986392974853516, "global_step": 9088, "epoch": 109} {"train_loss": -17.44369888305664, "global_step": 9089, "epoch": 109} {"train_loss": -17.821340560913086, "global_step": 9090, "epoch": 109} {"train_loss": -17.280609130859375, "global_step": 9091, "epoch": 109} {"train_loss": -17.58570671081543, "global_step": 9092, "epoch": 109} {"train_loss": -17.666473388671875, "global_step": 9093, "epoch": 109} {"train_loss": -17.365537643432617, "global_step": 9094, "epoch": 109} {"train_loss": -17.468442916870117, "global_step": 9095, "epoch": 109} {"train_loss": -17.558408737182617, "global_step": 9096, "epoch": 109} {"train_loss": -17.802759170532227, "global_step": 9097, "epoch": 109} {"train_loss": -17.69650650024414, "global_step": 9098, "epoch": 109} {"train_loss": -17.4717960357666, "global_step": 9099, "epoch": 109} {"train_loss": -17.519834518432617, "global_step": 9100, "epoch": 109} {"train_loss": -17.987146377563477, "global_step": 9101, "epoch": 109} {"train_loss": -17.708553314208984, "global_step": 9102, "epoch": 109} {"train_loss": -17.37391471862793, "global_step": 9103, "epoch": 109} {"train_loss": -17.467334747314453, "global_step": 9104, "epoch": 109} {"train_loss": -18.01881217956543, "global_step": 9105, "epoch": 109} {"train_loss": -17.222217559814453, "global_step": 9106, "epoch": 109} {"train_loss": -17.62833595275879, "global_step": 9107, "epoch": 109} {"train_loss": -17.59075355529785, "global_step": 9108, "epoch": 109} {"train_loss": -17.300296783447266, "global_step": 9109, "epoch": 109} {"train_loss": -17.513654708862305, "global_step": 9110, "epoch": 109} {"train_loss": -17.333784103393555, "global_step": 9111, "epoch": 109} {"train_loss": -17.295589447021484, "global_step": 9112, "epoch": 109} {"train_loss": -17.791059494018555, "global_step": 9113, "epoch": 109} {"train_loss": -17.32010841369629, "global_step": 9114, "epoch": 109} {"train_loss": -17.382787704467773, "global_step": 9115, "epoch": 109} {"train_loss": -17.679746627807617, "global_step": 9116, "epoch": 109} {"train_loss": -17.267915725708008, "global_step": 9117, "epoch": 109} {"train_loss": -17.582067489624023, "global_step": 9118, "epoch": 109} {"train_loss": -17.626920700073242, "global_step": 9119, "epoch": 109} {"train_loss": -17.3675537109375, "global_step": 9120, "epoch": 109} {"train_loss": -17.330188751220703, "global_step": 9121, "epoch": 109} {"train_loss": -17.52859878540039, "global_step": 9122, "epoch": 109} {"train_loss": -17.362537384033203, "global_step": 9123, "epoch": 109} {"train_loss": -17.37269401550293, "global_step": 9124, "epoch": 109} {"train_loss": -17.764135360717773, "global_step": 9125, "epoch": 109} {"train_loss": -17.535470962524414, "global_step": 9126, "epoch": 109} {"train_loss": -18.00811195373535, "global_step": 9127, "epoch": 109} {"train_loss": -17.5987548828125, "global_step": 9128, "epoch": 109} {"train_loss": -17.514224086899354, "global_step": 9129, "epoch": 109, "val_loss": 6265654.0} {"train_loss": -17.519514083862305, "global_step": 9130, "epoch": 110} {"train_loss": -17.567886352539062, "global_step": 9131, "epoch": 110} {"train_loss": -17.309268951416016, "global_step": 9132, "epoch": 110} {"train_loss": -17.920576095581055, "global_step": 9133, "epoch": 110} {"train_loss": -17.15497398376465, "global_step": 9134, "epoch": 110} {"train_loss": -17.335830688476562, "global_step": 9135, "epoch": 110} {"train_loss": -17.247648239135742, "global_step": 9136, "epoch": 110} {"train_loss": -17.806900024414062, "global_step": 9137, "epoch": 110} {"train_loss": -17.95857810974121, "global_step": 9138, "epoch": 110} {"train_loss": -17.33343505859375, "global_step": 9139, "epoch": 110} {"train_loss": -17.52461051940918, "global_step": 9140, "epoch": 110} {"train_loss": -17.60621452331543, "global_step": 9141, "epoch": 110} {"train_loss": -17.43058204650879, "global_step": 9142, "epoch": 110} {"train_loss": -17.30063819885254, "global_step": 9143, "epoch": 110} {"train_loss": -17.428668975830078, "global_step": 9144, "epoch": 110} {"train_loss": -17.36903953552246, "global_step": 9145, "epoch": 110} {"train_loss": -17.768123626708984, "global_step": 9146, "epoch": 110} {"train_loss": -17.55851173400879, "global_step": 9147, "epoch": 110} {"train_loss": -17.46175193786621, "global_step": 9148, "epoch": 110} {"train_loss": -17.678728103637695, "global_step": 9149, "epoch": 110} {"train_loss": -17.445053100585938, "global_step": 9150, "epoch": 110} {"train_loss": -17.29578971862793, "global_step": 9151, "epoch": 110} {"train_loss": -17.60848045349121, "global_step": 9152, "epoch": 110} {"train_loss": -17.789749145507812, "global_step": 9153, "epoch": 110} {"train_loss": -17.5710506439209, "global_step": 9154, "epoch": 110} {"train_loss": -17.75634002685547, "global_step": 9155, "epoch": 110} {"train_loss": -17.680158615112305, "global_step": 9156, "epoch": 110} {"train_loss": -17.64820098876953, "global_step": 9157, "epoch": 110} {"train_loss": -17.57752799987793, "global_step": 9158, "epoch": 110} {"train_loss": -17.716794967651367, "global_step": 9159, "epoch": 110} {"train_loss": -17.861719131469727, "global_step": 9160, "epoch": 110} {"train_loss": -17.241430282592773, "global_step": 9161, "epoch": 110} {"train_loss": -17.29987907409668, "global_step": 9162, "epoch": 110} {"train_loss": -17.85910987854004, "global_step": 9163, "epoch": 110} {"train_loss": -17.346296310424805, "global_step": 9164, "epoch": 110} {"train_loss": -17.787355422973633, "global_step": 9165, "epoch": 110} {"train_loss": -17.232778549194336, "global_step": 9166, "epoch": 110} {"train_loss": -17.853506088256836, "global_step": 9167, "epoch": 110} {"train_loss": -17.940176010131836, "global_step": 9168, "epoch": 110} {"train_loss": -17.63856315612793, "global_step": 9169, "epoch": 110} {"train_loss": -17.385154724121094, "global_step": 9170, "epoch": 110} {"train_loss": -17.566659927368164, "global_step": 9171, "epoch": 110} {"train_loss": -17.506601333618164, "global_step": 9172, "epoch": 110} {"train_loss": -17.37824249267578, "global_step": 9173, "epoch": 110} {"train_loss": -17.70459747314453, "global_step": 9174, "epoch": 110} {"train_loss": -17.198415756225586, "global_step": 9175, "epoch": 110} {"train_loss": -17.235774993896484, "global_step": 9176, "epoch": 110} {"train_loss": -17.38484001159668, "global_step": 9177, "epoch": 110} {"train_loss": -17.617820739746094, "global_step": 9178, "epoch": 110} {"train_loss": -17.58847427368164, "global_step": 9179, "epoch": 110} {"train_loss": -17.35184097290039, "global_step": 9180, "epoch": 110} {"train_loss": -17.401960372924805, "global_step": 9181, "epoch": 110} {"train_loss": -17.46309471130371, "global_step": 9182, "epoch": 110} {"train_loss": -17.525075912475586, "global_step": 9183, "epoch": 110} {"train_loss": -17.002389907836914, "global_step": 9184, "epoch": 110} {"train_loss": -17.68229103088379, "global_step": 9185, "epoch": 110} {"train_loss": -17.179140090942383, "global_step": 9186, "epoch": 110} {"train_loss": -17.17201805114746, "global_step": 9187, "epoch": 110} {"train_loss": -17.495954513549805, "global_step": 9188, "epoch": 110} {"train_loss": -17.5362606048584, "global_step": 9189, "epoch": 110} {"train_loss": -17.64530372619629, "global_step": 9190, "epoch": 110} {"train_loss": -17.50775146484375, "global_step": 9191, "epoch": 110} {"train_loss": -17.5454158782959, "global_step": 9192, "epoch": 110} {"train_loss": -17.700658798217773, "global_step": 9193, "epoch": 110} {"train_loss": -17.582324981689453, "global_step": 9194, "epoch": 110} {"train_loss": -17.581724166870117, "global_step": 9195, "epoch": 110} {"train_loss": -17.62409782409668, "global_step": 9196, "epoch": 110} {"train_loss": -17.064210891723633, "global_step": 9197, "epoch": 110} {"train_loss": -17.740846633911133, "global_step": 9198, "epoch": 110} {"train_loss": -17.57085609436035, "global_step": 9199, "epoch": 110} {"train_loss": -18.036771774291992, "global_step": 9200, "epoch": 110} {"train_loss": -17.131052017211914, "global_step": 9201, "epoch": 110} {"train_loss": -17.54050064086914, "global_step": 9202, "epoch": 110} {"train_loss": -17.207359313964844, "global_step": 9203, "epoch": 110} {"train_loss": -17.77174186706543, "global_step": 9204, "epoch": 110} {"train_loss": -17.922077178955078, "global_step": 9205, "epoch": 110} {"train_loss": -17.87543296813965, "global_step": 9206, "epoch": 110} {"train_loss": -17.516220092773438, "global_step": 9207, "epoch": 110} {"train_loss": -17.685646057128906, "global_step": 9208, "epoch": 110} {"train_loss": -17.558801651000977, "global_step": 9209, "epoch": 110} {"train_loss": -17.392927169799805, "global_step": 9210, "epoch": 110} {"train_loss": -17.654361724853516, "global_step": 9211, "epoch": 110} {"train_loss": -17.53646469116211, "global_step": 9212, "epoch": 110, "val_loss": 6215156.0} {"train_loss": -17.138235092163086, "global_step": 9213, "epoch": 111} {"train_loss": -17.469003677368164, "global_step": 9214, "epoch": 111} {"train_loss": -17.06508445739746, "global_step": 9215, "epoch": 111} {"train_loss": -17.501707077026367, "global_step": 9216, "epoch": 111} {"train_loss": -17.532503128051758, "global_step": 9217, "epoch": 111} {"train_loss": -17.34395408630371, "global_step": 9218, "epoch": 111} {"train_loss": -17.64716148376465, "global_step": 9219, "epoch": 111} {"train_loss": -17.03053092956543, "global_step": 9220, "epoch": 111} {"train_loss": -17.230131149291992, "global_step": 9221, "epoch": 111} {"train_loss": -17.309371948242188, "global_step": 9222, "epoch": 111} {"train_loss": -17.612241744995117, "global_step": 9223, "epoch": 111} {"train_loss": -18.00469970703125, "global_step": 9224, "epoch": 111} {"train_loss": -17.24380874633789, "global_step": 9225, "epoch": 111} {"train_loss": -17.287076950073242, "global_step": 9226, "epoch": 111} {"train_loss": -17.48675537109375, "global_step": 9227, "epoch": 111} {"train_loss": -17.281415939331055, "global_step": 9228, "epoch": 111} {"train_loss": -17.406204223632812, "global_step": 9229, "epoch": 111} {"train_loss": -17.224863052368164, "global_step": 9230, "epoch": 111} {"train_loss": -17.808429718017578, "global_step": 9231, "epoch": 111} {"train_loss": -17.007030487060547, "global_step": 9232, "epoch": 111} {"train_loss": -17.400245666503906, "global_step": 9233, "epoch": 111} {"train_loss": -17.77253532409668, "global_step": 9234, "epoch": 111} {"train_loss": -17.05440902709961, "global_step": 9235, "epoch": 111} {"train_loss": -17.740751266479492, "global_step": 9236, "epoch": 111} {"train_loss": -17.59212303161621, "global_step": 9237, "epoch": 111} {"train_loss": -17.41645622253418, "global_step": 9238, "epoch": 111} {"train_loss": -17.38567352294922, "global_step": 9239, "epoch": 111} {"train_loss": -17.438310623168945, "global_step": 9240, "epoch": 111} {"train_loss": -17.344268798828125, "global_step": 9241, "epoch": 111} {"train_loss": -17.520618438720703, "global_step": 9242, "epoch": 111} {"train_loss": -17.58124542236328, "global_step": 9243, "epoch": 111} {"train_loss": -17.92268180847168, "global_step": 9244, "epoch": 111} {"train_loss": -17.47060203552246, "global_step": 9245, "epoch": 111} {"train_loss": -17.372894287109375, "global_step": 9246, "epoch": 111} {"train_loss": -17.253448486328125, "global_step": 9247, "epoch": 111} {"train_loss": -17.250675201416016, "global_step": 9248, "epoch": 111} {"train_loss": -17.695283889770508, "global_step": 9249, "epoch": 111} {"train_loss": -17.699087142944336, "global_step": 9250, "epoch": 111} {"train_loss": -17.96180534362793, "global_step": 9251, "epoch": 111} {"train_loss": -17.53009605407715, "global_step": 9252, "epoch": 111} {"train_loss": -17.652952194213867, "global_step": 9253, "epoch": 111} {"train_loss": -17.60190773010254, "global_step": 9254, "epoch": 111} {"train_loss": -18.002567291259766, "global_step": 9255, "epoch": 111} {"train_loss": -17.998144149780273, "global_step": 9256, "epoch": 111} {"train_loss": -17.81797981262207, "global_step": 9257, "epoch": 111} {"train_loss": -17.52230453491211, "global_step": 9258, "epoch": 111} {"train_loss": -17.117889404296875, "global_step": 9259, "epoch": 111} {"train_loss": -17.81159210205078, "global_step": 9260, "epoch": 111} {"train_loss": -17.68023109436035, "global_step": 9261, "epoch": 111} {"train_loss": -17.414148330688477, "global_step": 9262, "epoch": 111} {"train_loss": -17.605566024780273, "global_step": 9263, "epoch": 111} {"train_loss": -17.559030532836914, "global_step": 9264, "epoch": 111} {"train_loss": -17.72039031982422, "global_step": 9265, "epoch": 111} {"train_loss": -17.506427764892578, "global_step": 9266, "epoch": 111} {"train_loss": -17.693021774291992, "global_step": 9267, "epoch": 111} {"train_loss": -17.769498825073242, "global_step": 9268, "epoch": 111} {"train_loss": -17.663389205932617, "global_step": 9269, "epoch": 111} {"train_loss": -17.381351470947266, "global_step": 9270, "epoch": 111} {"train_loss": -17.851247787475586, "global_step": 9271, "epoch": 111} {"train_loss": -17.609281539916992, "global_step": 9272, "epoch": 111} {"train_loss": -17.471309661865234, "global_step": 9273, "epoch": 111} {"train_loss": -17.67655372619629, "global_step": 9274, "epoch": 111} {"train_loss": -17.262924194335938, "global_step": 9275, "epoch": 111} {"train_loss": -17.310325622558594, "global_step": 9276, "epoch": 111} {"train_loss": -17.65752601623535, "global_step": 9277, "epoch": 111} {"train_loss": -17.468887329101562, "global_step": 9278, "epoch": 111} {"train_loss": -17.433713912963867, "global_step": 9279, "epoch": 111} {"train_loss": -17.739145278930664, "global_step": 9280, "epoch": 111} {"train_loss": -17.748727798461914, "global_step": 9281, "epoch": 111} {"train_loss": -17.69137954711914, "global_step": 9282, "epoch": 111} {"train_loss": -17.735504150390625, "global_step": 9283, "epoch": 111} {"train_loss": -17.421850204467773, "global_step": 9284, "epoch": 111} {"train_loss": -17.411657333374023, "global_step": 9285, "epoch": 111} {"train_loss": -17.46611976623535, "global_step": 9286, "epoch": 111} {"train_loss": -17.980426788330078, "global_step": 9287, "epoch": 111} {"train_loss": -17.487714767456055, "global_step": 9288, "epoch": 111} {"train_loss": -17.688568115234375, "global_step": 9289, "epoch": 111} {"train_loss": -17.844619750976562, "global_step": 9290, "epoch": 111} {"train_loss": -17.299476623535156, "global_step": 9291, "epoch": 111} {"train_loss": -17.65888023376465, "global_step": 9292, "epoch": 111} {"train_loss": -17.664655685424805, "global_step": 9293, "epoch": 111} {"train_loss": -17.68861198425293, "global_step": 9294, "epoch": 111} {"train_loss": -17.516203684979175, "global_step": 9295, "epoch": 111, "val_loss": 6172574.0} {"train_loss": -17.27052116394043, "global_step": 9296, "epoch": 112} {"train_loss": -17.91872215270996, "global_step": 9297, "epoch": 112} {"train_loss": -17.254730224609375, "global_step": 9298, "epoch": 112} {"train_loss": -17.676586151123047, "global_step": 9299, "epoch": 112} {"train_loss": -17.607940673828125, "global_step": 9300, "epoch": 112} {"train_loss": -17.3794002532959, "global_step": 9301, "epoch": 112} {"train_loss": -17.385986328125, "global_step": 9302, "epoch": 112} {"train_loss": -16.9481143951416, "global_step": 9303, "epoch": 112} {"train_loss": -17.539127349853516, "global_step": 9304, "epoch": 112} {"train_loss": -17.44367790222168, "global_step": 9305, "epoch": 112} {"train_loss": -17.65594482421875, "global_step": 9306, "epoch": 112} {"train_loss": -17.605775833129883, "global_step": 9307, "epoch": 112} {"train_loss": -17.460241317749023, "global_step": 9308, "epoch": 112} {"train_loss": -17.620834350585938, "global_step": 9309, "epoch": 112} {"train_loss": -17.642906188964844, "global_step": 9310, "epoch": 112} {"train_loss": -17.36350440979004, "global_step": 9311, "epoch": 112} {"train_loss": -17.238475799560547, "global_step": 9312, "epoch": 112} {"train_loss": -17.494815826416016, "global_step": 9313, "epoch": 112} {"train_loss": -17.111757278442383, "global_step": 9314, "epoch": 112} {"train_loss": -17.83650779724121, "global_step": 9315, "epoch": 112} {"train_loss": -17.330854415893555, "global_step": 9316, "epoch": 112} {"train_loss": -17.463594436645508, "global_step": 9317, "epoch": 112} {"train_loss": -17.57575798034668, "global_step": 9318, "epoch": 112} {"train_loss": -17.952762603759766, "global_step": 9319, "epoch": 112} {"train_loss": -17.68031883239746, "global_step": 9320, "epoch": 112} {"train_loss": -17.631427764892578, "global_step": 9321, "epoch": 112} {"train_loss": -18.18356704711914, "global_step": 9322, "epoch": 112} {"train_loss": -17.2054386138916, "global_step": 9323, "epoch": 112} {"train_loss": -17.928510665893555, "global_step": 9324, "epoch": 112} {"train_loss": -17.73200035095215, "global_step": 9325, "epoch": 112} {"train_loss": -17.6781005859375, "global_step": 9326, "epoch": 112} {"train_loss": -17.632871627807617, "global_step": 9327, "epoch": 112} {"train_loss": -17.620141983032227, "global_step": 9328, "epoch": 112} {"train_loss": -17.612754821777344, "global_step": 9329, "epoch": 112} {"train_loss": -17.883291244506836, "global_step": 9330, "epoch": 112} {"train_loss": -17.702939987182617, "global_step": 9331, "epoch": 112} {"train_loss": -17.29549217224121, "global_step": 9332, "epoch": 112} {"train_loss": -17.92645835876465, "global_step": 9333, "epoch": 112} {"train_loss": -17.414562225341797, "global_step": 9334, "epoch": 112} {"train_loss": -17.377904891967773, "global_step": 9335, "epoch": 112} {"train_loss": -17.629549026489258, "global_step": 9336, "epoch": 112} {"train_loss": -17.750457763671875, "global_step": 9337, "epoch": 112} {"train_loss": -17.83601188659668, "global_step": 9338, "epoch": 112} {"train_loss": -17.826921463012695, "global_step": 9339, "epoch": 112} {"train_loss": -17.50490951538086, "global_step": 9340, "epoch": 112} {"train_loss": -18.009557723999023, "global_step": 9341, "epoch": 112} {"train_loss": -17.24567985534668, "global_step": 9342, "epoch": 112} {"train_loss": -17.68179702758789, "global_step": 9343, "epoch": 112} {"train_loss": -17.574296951293945, "global_step": 9344, "epoch": 112} {"train_loss": -17.450666427612305, "global_step": 9345, "epoch": 112} {"train_loss": -17.40193748474121, "global_step": 9346, "epoch": 112} {"train_loss": -17.393234252929688, "global_step": 9347, "epoch": 112} {"train_loss": -17.57027244567871, "global_step": 9348, "epoch": 112} {"train_loss": -17.99263572692871, "global_step": 9349, "epoch": 112} {"train_loss": -17.40781593322754, "global_step": 9350, "epoch": 112} {"train_loss": -17.839967727661133, "global_step": 9351, "epoch": 112} {"train_loss": -17.350479125976562, "global_step": 9352, "epoch": 112} {"train_loss": -17.334516525268555, "global_step": 9353, "epoch": 112} {"train_loss": -17.26088523864746, "global_step": 9354, "epoch": 112} {"train_loss": -17.433530807495117, "global_step": 9355, "epoch": 112} {"train_loss": -17.55718994140625, "global_step": 9356, "epoch": 112} {"train_loss": -17.415424346923828, "global_step": 9357, "epoch": 112} {"train_loss": -17.342390060424805, "global_step": 9358, "epoch": 112} {"train_loss": -17.20368003845215, "global_step": 9359, "epoch": 112} {"train_loss": -17.620582580566406, "global_step": 9360, "epoch": 112} {"train_loss": -17.4176082611084, "global_step": 9361, "epoch": 112} {"train_loss": -17.25821304321289, "global_step": 9362, "epoch": 112} {"train_loss": -18.10414695739746, "global_step": 9363, "epoch": 112} {"train_loss": -17.364408493041992, "global_step": 9364, "epoch": 112} {"train_loss": -17.281408309936523, "global_step": 9365, "epoch": 112} {"train_loss": -17.404783248901367, "global_step": 9366, "epoch": 112} {"train_loss": -17.650644302368164, "global_step": 9367, "epoch": 112} {"train_loss": -17.73470115661621, "global_step": 9368, "epoch": 112} {"train_loss": -17.340124130249023, "global_step": 9369, "epoch": 112} {"train_loss": -17.2997989654541, "global_step": 9370, "epoch": 112} {"train_loss": -17.136701583862305, "global_step": 9371, "epoch": 112} {"train_loss": -17.25587272644043, "global_step": 9372, "epoch": 112} {"train_loss": -17.950775146484375, "global_step": 9373, "epoch": 112} {"train_loss": -17.911985397338867, "global_step": 9374, "epoch": 112} {"train_loss": -17.742795944213867, "global_step": 9375, "epoch": 112} {"train_loss": -17.540931701660156, "global_step": 9376, "epoch": 112} {"train_loss": -17.524391174316406, "global_step": 9377, "epoch": 112} {"train_loss": -17.555290084287346, "global_step": 9378, "epoch": 112, "val_loss": 6377929.0} {"train_loss": -17.38916778564453, "global_step": 9379, "epoch": 113} {"train_loss": -17.632755279541016, "global_step": 9380, "epoch": 113} {"train_loss": -17.39473533630371, "global_step": 9381, "epoch": 113} {"train_loss": -17.288768768310547, "global_step": 9382, "epoch": 113} {"train_loss": -17.7883358001709, "global_step": 9383, "epoch": 113} {"train_loss": -17.81810188293457, "global_step": 9384, "epoch": 113} {"train_loss": -17.30719757080078, "global_step": 9385, "epoch": 113} {"train_loss": -17.434743881225586, "global_step": 9386, "epoch": 113} {"train_loss": -17.09145164489746, "global_step": 9387, "epoch": 113} {"train_loss": -17.026386260986328, "global_step": 9388, "epoch": 113} {"train_loss": -17.755971908569336, "global_step": 9389, "epoch": 113} {"train_loss": -17.431901931762695, "global_step": 9390, "epoch": 113} {"train_loss": -17.38772201538086, "global_step": 9391, "epoch": 113} {"train_loss": -17.325435638427734, "global_step": 9392, "epoch": 113} {"train_loss": -17.337873458862305, "global_step": 9393, "epoch": 113} {"train_loss": -17.410024642944336, "global_step": 9394, "epoch": 113} {"train_loss": -17.671056747436523, "global_step": 9395, "epoch": 113} {"train_loss": -17.3212833404541, "global_step": 9396, "epoch": 113} {"train_loss": -17.586257934570312, "global_step": 9397, "epoch": 113} {"train_loss": -17.06484031677246, "global_step": 9398, "epoch": 113} {"train_loss": -17.19611930847168, "global_step": 9399, "epoch": 113} {"train_loss": -17.510255813598633, "global_step": 9400, "epoch": 113} {"train_loss": -17.64326286315918, "global_step": 9401, "epoch": 113} {"train_loss": -17.601028442382812, "global_step": 9402, "epoch": 113} {"train_loss": -17.54426383972168, "global_step": 9403, "epoch": 113} {"train_loss": -17.3404541015625, "global_step": 9404, "epoch": 113} {"train_loss": -17.627416610717773, "global_step": 9405, "epoch": 113} {"train_loss": -17.456283569335938, "global_step": 9406, "epoch": 113} {"train_loss": -17.70620346069336, "global_step": 9407, "epoch": 113} {"train_loss": -17.79977798461914, "global_step": 9408, "epoch": 113} {"train_loss": -17.675830841064453, "global_step": 9409, "epoch": 113} {"train_loss": -17.18625259399414, "global_step": 9410, "epoch": 113} {"train_loss": -17.68283462524414, "global_step": 9411, "epoch": 113} {"train_loss": -17.4672794342041, "global_step": 9412, "epoch": 113} {"train_loss": -17.865209579467773, "global_step": 9413, "epoch": 113} {"train_loss": -17.506147384643555, "global_step": 9414, "epoch": 113} {"train_loss": -17.219297409057617, "global_step": 9415, "epoch": 113} {"train_loss": -17.529104232788086, "global_step": 9416, "epoch": 113} {"train_loss": -17.395336151123047, "global_step": 9417, "epoch": 113} {"train_loss": -17.68208122253418, "global_step": 9418, "epoch": 113} {"train_loss": -17.715986251831055, "global_step": 9419, "epoch": 113} {"train_loss": -17.460790634155273, "global_step": 9420, "epoch": 113} {"train_loss": -17.651634216308594, "global_step": 9421, "epoch": 113} {"train_loss": -17.84222984313965, "global_step": 9422, "epoch": 113} {"train_loss": -17.30319595336914, "global_step": 9423, "epoch": 113} {"train_loss": -17.654041290283203, "global_step": 9424, "epoch": 113} {"train_loss": -17.794797897338867, "global_step": 9425, "epoch": 113} {"train_loss": -17.688247680664062, "global_step": 9426, "epoch": 113} {"train_loss": -17.690370559692383, "global_step": 9427, "epoch": 113} {"train_loss": -17.58631706237793, "global_step": 9428, "epoch": 113} {"train_loss": -17.697559356689453, "global_step": 9429, "epoch": 113} {"train_loss": -17.34885597229004, "global_step": 9430, "epoch": 113} {"train_loss": -17.31546401977539, "global_step": 9431, "epoch": 113} {"train_loss": -17.804431915283203, "global_step": 9432, "epoch": 113} {"train_loss": -17.68288230895996, "global_step": 9433, "epoch": 113} {"train_loss": -17.872180938720703, "global_step": 9434, "epoch": 113} {"train_loss": -17.69588851928711, "global_step": 9435, "epoch": 113} {"train_loss": -17.599449157714844, "global_step": 9436, "epoch": 113} {"train_loss": -17.3583984375, "global_step": 9437, "epoch": 113} {"train_loss": -18.195276260375977, "global_step": 9438, "epoch": 113} {"train_loss": -17.9620304107666, "global_step": 9439, "epoch": 113} {"train_loss": -17.096525192260742, "global_step": 9440, "epoch": 113} {"train_loss": -17.755929946899414, "global_step": 9441, "epoch": 113} {"train_loss": -17.749530792236328, "global_step": 9442, "epoch": 113} {"train_loss": -17.639020919799805, "global_step": 9443, "epoch": 113} {"train_loss": -17.825435638427734, "global_step": 9444, "epoch": 113} {"train_loss": -17.663803100585938, "global_step": 9445, "epoch": 113} {"train_loss": -17.84878921508789, "global_step": 9446, "epoch": 113} {"train_loss": -17.255189895629883, "global_step": 9447, "epoch": 113} {"train_loss": -17.967330932617188, "global_step": 9448, "epoch": 113} {"train_loss": -17.426441192626953, "global_step": 9449, "epoch": 113} {"train_loss": -17.553152084350586, "global_step": 9450, "epoch": 113} {"train_loss": -17.612966537475586, "global_step": 9451, "epoch": 113} {"train_loss": -17.563329696655273, "global_step": 9452, "epoch": 113} {"train_loss": -17.66959571838379, "global_step": 9453, "epoch": 113} {"train_loss": -17.70151138305664, "global_step": 9454, "epoch": 113} {"train_loss": -17.573789596557617, "global_step": 9455, "epoch": 113} {"train_loss": -17.26289176940918, "global_step": 9456, "epoch": 113} {"train_loss": -17.596799850463867, "global_step": 9457, "epoch": 113} {"train_loss": -17.70551872253418, "global_step": 9458, "epoch": 113} {"train_loss": -17.241697311401367, "global_step": 9459, "epoch": 113} {"train_loss": -17.702909469604492, "global_step": 9460, "epoch": 113} {"train_loss": -17.555393471775286, "global_step": 9461, "epoch": 113, "val_loss": 6285300.0} {"train_loss": -17.242292404174805, "global_step": 9462, "epoch": 114} {"train_loss": -17.792526245117188, "global_step": 9463, "epoch": 114} {"train_loss": -17.177249908447266, "global_step": 9464, "epoch": 114} {"train_loss": -17.41338348388672, "global_step": 9465, "epoch": 114} {"train_loss": -17.285030364990234, "global_step": 9466, "epoch": 114} {"train_loss": -17.468456268310547, "global_step": 9467, "epoch": 114} {"train_loss": -18.07954216003418, "global_step": 9468, "epoch": 114} {"train_loss": -17.88225746154785, "global_step": 9469, "epoch": 114} {"train_loss": -17.37175178527832, "global_step": 9470, "epoch": 114} {"train_loss": -17.685110092163086, "global_step": 9471, "epoch": 114} {"train_loss": -17.87935447692871, "global_step": 9472, "epoch": 114} {"train_loss": -17.356428146362305, "global_step": 9473, "epoch": 114} {"train_loss": -17.46915626525879, "global_step": 9474, "epoch": 114} {"train_loss": -17.42135238647461, "global_step": 9475, "epoch": 114} {"train_loss": -17.283489227294922, "global_step": 9476, "epoch": 114} {"train_loss": -17.53873062133789, "global_step": 9477, "epoch": 114} {"train_loss": -17.721298217773438, "global_step": 9478, "epoch": 114} {"train_loss": -17.410795211791992, "global_step": 9479, "epoch": 114} {"train_loss": -17.50398063659668, "global_step": 9480, "epoch": 114} {"train_loss": -17.16986846923828, "global_step": 9481, "epoch": 114} {"train_loss": -17.131710052490234, "global_step": 9482, "epoch": 114} {"train_loss": -16.995214462280273, "global_step": 9483, "epoch": 114} {"train_loss": -17.664091110229492, "global_step": 9484, "epoch": 114} {"train_loss": -18.003154754638672, "global_step": 9485, "epoch": 114} {"train_loss": -17.872480392456055, "global_step": 9486, "epoch": 114} {"train_loss": -17.61252784729004, "global_step": 9487, "epoch": 114} {"train_loss": -17.583974838256836, "global_step": 9488, "epoch": 114} {"train_loss": -17.431772232055664, "global_step": 9489, "epoch": 114} {"train_loss": -17.44717025756836, "global_step": 9490, "epoch": 114} {"train_loss": -17.727006912231445, "global_step": 9491, "epoch": 114} {"train_loss": -18.13175392150879, "global_step": 9492, "epoch": 114} {"train_loss": -17.305917739868164, "global_step": 9493, "epoch": 114} {"train_loss": -17.3268985748291, "global_step": 9494, "epoch": 114} {"train_loss": -17.706878662109375, "global_step": 9495, "epoch": 114} {"train_loss": -17.94877052307129, "global_step": 9496, "epoch": 114} {"train_loss": -17.680583953857422, "global_step": 9497, "epoch": 114} {"train_loss": -17.450965881347656, "global_step": 9498, "epoch": 114} {"train_loss": -17.681316375732422, "global_step": 9499, "epoch": 114} {"train_loss": -17.500638961791992, "global_step": 9500, "epoch": 114} {"train_loss": -16.87295150756836, "global_step": 9501, "epoch": 114} {"train_loss": -17.778411865234375, "global_step": 9502, "epoch": 114} {"train_loss": -17.75177574157715, "global_step": 9503, "epoch": 114} {"train_loss": -17.428808212280273, "global_step": 9504, "epoch": 114} {"train_loss": -18.02654457092285, "global_step": 9505, "epoch": 114} {"train_loss": -17.215707778930664, "global_step": 9506, "epoch": 114} {"train_loss": -17.59478187561035, "global_step": 9507, "epoch": 114} {"train_loss": -17.71323585510254, "global_step": 9508, "epoch": 114} {"train_loss": -17.579574584960938, "global_step": 9509, "epoch": 114} {"train_loss": -17.719276428222656, "global_step": 9510, "epoch": 114} {"train_loss": -17.653715133666992, "global_step": 9511, "epoch": 114} {"train_loss": -17.72748374938965, "global_step": 9512, "epoch": 114} {"train_loss": -17.76904296875, "global_step": 9513, "epoch": 114} {"train_loss": -17.55463981628418, "global_step": 9514, "epoch": 114} {"train_loss": -17.305864334106445, "global_step": 9515, "epoch": 114} {"train_loss": -17.444108963012695, "global_step": 9516, "epoch": 114} {"train_loss": -17.79652976989746, "global_step": 9517, "epoch": 114} {"train_loss": -17.822195053100586, "global_step": 9518, "epoch": 114} {"train_loss": -17.420562744140625, "global_step": 9519, "epoch": 114} {"train_loss": -17.663227081298828, "global_step": 9520, "epoch": 114} {"train_loss": -17.665985107421875, "global_step": 9521, "epoch": 114} {"train_loss": -17.20358657836914, "global_step": 9522, "epoch": 114} {"train_loss": -17.541833877563477, "global_step": 9523, "epoch": 114} {"train_loss": -17.854490280151367, "global_step": 9524, "epoch": 114} {"train_loss": -17.2549991607666, "global_step": 9525, "epoch": 114} {"train_loss": -17.719079971313477, "global_step": 9526, "epoch": 114} {"train_loss": -17.5474796295166, "global_step": 9527, "epoch": 114} {"train_loss": -17.377843856811523, "global_step": 9528, "epoch": 114} {"train_loss": -17.52704429626465, "global_step": 9529, "epoch": 114} {"train_loss": -17.411710739135742, "global_step": 9530, "epoch": 114} {"train_loss": -17.683523178100586, "global_step": 9531, "epoch": 114} {"train_loss": -17.487340927124023, "global_step": 9532, "epoch": 114} {"train_loss": -17.475759506225586, "global_step": 9533, "epoch": 114} {"train_loss": -17.851652145385742, "global_step": 9534, "epoch": 114} {"train_loss": -17.688081741333008, "global_step": 9535, "epoch": 114} {"train_loss": -17.652456283569336, "global_step": 9536, "epoch": 114} {"train_loss": -17.722028732299805, "global_step": 9537, "epoch": 114} {"train_loss": -18.104625701904297, "global_step": 9538, "epoch": 114} {"train_loss": -17.30011558532715, "global_step": 9539, "epoch": 114} {"train_loss": -17.714649200439453, "global_step": 9540, "epoch": 114} {"train_loss": -17.307321548461914, "global_step": 9541, "epoch": 114} {"train_loss": -17.58845329284668, "global_step": 9542, "epoch": 114} {"train_loss": -17.736289978027344, "global_step": 9543, "epoch": 114} {"train_loss": -17.556167556578856, "global_step": 9544, "epoch": 114, "val_loss": 6333157.0} {"train_loss": -17.411828994750977, "global_step": 9545, "epoch": 115} {"train_loss": -17.203495025634766, "global_step": 9546, "epoch": 115} {"train_loss": -17.476896286010742, "global_step": 9547, "epoch": 115} {"train_loss": -17.50572967529297, "global_step": 9548, "epoch": 115} {"train_loss": -17.77150535583496, "global_step": 9549, "epoch": 115} {"train_loss": -17.477481842041016, "global_step": 9550, "epoch": 115} {"train_loss": -17.68827247619629, "global_step": 9551, "epoch": 115} {"train_loss": -17.178327560424805, "global_step": 9552, "epoch": 115} {"train_loss": -17.46471405029297, "global_step": 9553, "epoch": 115} {"train_loss": -17.391559600830078, "global_step": 9554, "epoch": 115} {"train_loss": -17.852619171142578, "global_step": 9555, "epoch": 115} {"train_loss": -17.4666805267334, "global_step": 9556, "epoch": 115} {"train_loss": -17.492395401000977, "global_step": 9557, "epoch": 115} {"train_loss": -17.6666316986084, "global_step": 9558, "epoch": 115} {"train_loss": -17.775171279907227, "global_step": 9559, "epoch": 115} {"train_loss": -17.258726119995117, "global_step": 9560, "epoch": 115} {"train_loss": -17.590627670288086, "global_step": 9561, "epoch": 115} {"train_loss": -17.363895416259766, "global_step": 9562, "epoch": 115} {"train_loss": -17.33219337463379, "global_step": 9563, "epoch": 115} {"train_loss": -17.262300491333008, "global_step": 9564, "epoch": 115} {"train_loss": -17.598417282104492, "global_step": 9565, "epoch": 115} {"train_loss": -17.5813045501709, "global_step": 9566, "epoch": 115} {"train_loss": -17.4984188079834, "global_step": 9567, "epoch": 115} {"train_loss": -17.778539657592773, "global_step": 9568, "epoch": 115} {"train_loss": -17.70039176940918, "global_step": 9569, "epoch": 115} {"train_loss": -17.218854904174805, "global_step": 9570, "epoch": 115} {"train_loss": -17.538022994995117, "global_step": 9571, "epoch": 115} {"train_loss": -17.51006507873535, "global_step": 9572, "epoch": 115} {"train_loss": -17.578001022338867, "global_step": 9573, "epoch": 115} {"train_loss": -18.022022247314453, "global_step": 9574, "epoch": 115} {"train_loss": -17.69666290283203, "global_step": 9575, "epoch": 115} {"train_loss": -17.50165367126465, "global_step": 9576, "epoch": 115} {"train_loss": -17.448585510253906, "global_step": 9577, "epoch": 115} {"train_loss": -17.47376251220703, "global_step": 9578, "epoch": 115} {"train_loss": -17.404041290283203, "global_step": 9579, "epoch": 115} {"train_loss": -17.463287353515625, "global_step": 9580, "epoch": 115} {"train_loss": -17.605817794799805, "global_step": 9581, "epoch": 115} {"train_loss": -18.101255416870117, "global_step": 9582, "epoch": 115} {"train_loss": -16.814712524414062, "global_step": 9583, "epoch": 115} {"train_loss": -17.579343795776367, "global_step": 9584, "epoch": 115} {"train_loss": -17.836523056030273, "global_step": 9585, "epoch": 115} {"train_loss": -17.165403366088867, "global_step": 9586, "epoch": 115} {"train_loss": -17.613143920898438, "global_step": 9587, "epoch": 115} {"train_loss": -17.49970054626465, "global_step": 9588, "epoch": 115} {"train_loss": -17.62467384338379, "global_step": 9589, "epoch": 115} {"train_loss": -17.21012306213379, "global_step": 9590, "epoch": 115} {"train_loss": -17.16727066040039, "global_step": 9591, "epoch": 115} {"train_loss": -17.760513305664062, "global_step": 9592, "epoch": 115} {"train_loss": -17.672910690307617, "global_step": 9593, "epoch": 115} {"train_loss": -17.54453468322754, "global_step": 9594, "epoch": 115} {"train_loss": -17.841440200805664, "global_step": 9595, "epoch": 115} {"train_loss": -17.861555099487305, "global_step": 9596, "epoch": 115} {"train_loss": -17.59706687927246, "global_step": 9597, "epoch": 115} {"train_loss": -17.906831741333008, "global_step": 9598, "epoch": 115} {"train_loss": -18.112045288085938, "global_step": 9599, "epoch": 115} {"train_loss": -17.043447494506836, "global_step": 9600, "epoch": 115} {"train_loss": -17.756420135498047, "global_step": 9601, "epoch": 115} {"train_loss": -17.872724533081055, "global_step": 9602, "epoch": 115} {"train_loss": -17.776430130004883, "global_step": 9603, "epoch": 115} {"train_loss": -17.6711368560791, "global_step": 9604, "epoch": 115} {"train_loss": -17.640233993530273, "global_step": 9605, "epoch": 115} {"train_loss": -17.541133880615234, "global_step": 9606, "epoch": 115} {"train_loss": -17.7872314453125, "global_step": 9607, "epoch": 115} {"train_loss": -17.502456665039062, "global_step": 9608, "epoch": 115} {"train_loss": -17.440387725830078, "global_step": 9609, "epoch": 115} {"train_loss": -17.64752769470215, "global_step": 9610, "epoch": 115} {"train_loss": -17.73613929748535, "global_step": 9611, "epoch": 115} {"train_loss": -17.686769485473633, "global_step": 9612, "epoch": 115} {"train_loss": -17.571792602539062, "global_step": 9613, "epoch": 115} {"train_loss": -17.552343368530273, "global_step": 9614, "epoch": 115} {"train_loss": -17.47654914855957, "global_step": 9615, "epoch": 115} {"train_loss": -17.625364303588867, "global_step": 9616, "epoch": 115} {"train_loss": -17.448963165283203, "global_step": 9617, "epoch": 115} {"train_loss": -17.4742488861084, "global_step": 9618, "epoch": 115} {"train_loss": -17.679285049438477, "global_step": 9619, "epoch": 115} {"train_loss": -17.980234146118164, "global_step": 9620, "epoch": 115} {"train_loss": -17.892118453979492, "global_step": 9621, "epoch": 115} {"train_loss": -17.590255737304688, "global_step": 9622, "epoch": 115} {"train_loss": -17.784744262695312, "global_step": 9623, "epoch": 115} {"train_loss": -17.407913208007812, "global_step": 9624, "epoch": 115} {"train_loss": -17.85316276550293, "global_step": 9625, "epoch": 115} {"train_loss": -17.61739158630371, "global_step": 9626, "epoch": 115} {"train_loss": -17.5618157214429, "global_step": 9627, "epoch": 115, "val_loss": 6078053.0} {"train_loss": -17.080730438232422, "global_step": 9628, "epoch": 116} {"train_loss": -17.2453556060791, "global_step": 9629, "epoch": 116} {"train_loss": -17.4200439453125, "global_step": 9630, "epoch": 116} {"train_loss": -17.516971588134766, "global_step": 9631, "epoch": 116} {"train_loss": -17.643136978149414, "global_step": 9632, "epoch": 116} {"train_loss": -17.77548599243164, "global_step": 9633, "epoch": 116} {"train_loss": -16.87929344177246, "global_step": 9634, "epoch": 116} {"train_loss": -17.312986373901367, "global_step": 9635, "epoch": 116} {"train_loss": -17.968063354492188, "global_step": 9636, "epoch": 116} {"train_loss": -16.966474533081055, "global_step": 9637, "epoch": 116} {"train_loss": -17.856124877929688, "global_step": 9638, "epoch": 116} {"train_loss": -17.343854904174805, "global_step": 9639, "epoch": 116} {"train_loss": -17.310253143310547, "global_step": 9640, "epoch": 116} {"train_loss": -17.338529586791992, "global_step": 9641, "epoch": 116} {"train_loss": -17.553848266601562, "global_step": 9642, "epoch": 116} {"train_loss": -17.704687118530273, "global_step": 9643, "epoch": 116} {"train_loss": -17.746068954467773, "global_step": 9644, "epoch": 116} {"train_loss": -17.48468017578125, "global_step": 9645, "epoch": 116} {"train_loss": -17.466527938842773, "global_step": 9646, "epoch": 116} {"train_loss": -17.5572566986084, "global_step": 9647, "epoch": 116} {"train_loss": -17.54323387145996, "global_step": 9648, "epoch": 116} {"train_loss": -17.44744300842285, "global_step": 9649, "epoch": 116} {"train_loss": -17.750947952270508, "global_step": 9650, "epoch": 116} {"train_loss": -17.628137588500977, "global_step": 9651, "epoch": 116} {"train_loss": -17.59676170349121, "global_step": 9652, "epoch": 116} {"train_loss": -17.808425903320312, "global_step": 9653, "epoch": 116} {"train_loss": -17.543920516967773, "global_step": 9654, "epoch": 116} {"train_loss": -17.458738327026367, "global_step": 9655, "epoch": 116} {"train_loss": -18.04276466369629, "global_step": 9656, "epoch": 116} {"train_loss": -17.4560546875, "global_step": 9657, "epoch": 116} {"train_loss": -17.61173439025879, "global_step": 9658, "epoch": 116} {"train_loss": -17.44515037536621, "global_step": 9659, "epoch": 116} {"train_loss": -17.70062828063965, "global_step": 9660, "epoch": 116} {"train_loss": -17.786176681518555, "global_step": 9661, "epoch": 116} {"train_loss": -17.5689697265625, "global_step": 9662, "epoch": 116} {"train_loss": -17.53607940673828, "global_step": 9663, "epoch": 116} {"train_loss": -17.45469093322754, "global_step": 9664, "epoch": 116} {"train_loss": -17.844322204589844, "global_step": 9665, "epoch": 116} {"train_loss": -17.333419799804688, "global_step": 9666, "epoch": 116} {"train_loss": -17.53948211669922, "global_step": 9667, "epoch": 116} {"train_loss": -17.133115768432617, "global_step": 9668, "epoch": 116} {"train_loss": -17.537565231323242, "global_step": 9669, "epoch": 116} {"train_loss": -17.425230026245117, "global_step": 9670, "epoch": 116} {"train_loss": -17.437150955200195, "global_step": 9671, "epoch": 116} {"train_loss": -17.68097496032715, "global_step": 9672, "epoch": 116} {"train_loss": -17.817394256591797, "global_step": 9673, "epoch": 116} {"train_loss": -17.839078903198242, "global_step": 9674, "epoch": 116} {"train_loss": -18.075714111328125, "global_step": 9675, "epoch": 116} {"train_loss": -17.50337028503418, "global_step": 9676, "epoch": 116} {"train_loss": -17.6782283782959, "global_step": 9677, "epoch": 116} {"train_loss": -17.38006591796875, "global_step": 9678, "epoch": 116} {"train_loss": -17.25410270690918, "global_step": 9679, "epoch": 116} {"train_loss": -17.647912979125977, "global_step": 9680, "epoch": 116} {"train_loss": -17.578105926513672, "global_step": 9681, "epoch": 116} {"train_loss": -17.53956413269043, "global_step": 9682, "epoch": 116} {"train_loss": -17.083139419555664, "global_step": 9683, "epoch": 116} {"train_loss": -17.522939682006836, "global_step": 9684, "epoch": 116} {"train_loss": -17.605358123779297, "global_step": 9685, "epoch": 116} {"train_loss": -17.194623947143555, "global_step": 9686, "epoch": 116} {"train_loss": -17.969594955444336, "global_step": 9687, "epoch": 116} {"train_loss": -17.55903434753418, "global_step": 9688, "epoch": 116} {"train_loss": -17.514984130859375, "global_step": 9689, "epoch": 116} {"train_loss": -17.78168296813965, "global_step": 9690, "epoch": 116} {"train_loss": -17.718393325805664, "global_step": 9691, "epoch": 116} {"train_loss": -17.27475929260254, "global_step": 9692, "epoch": 116} {"train_loss": -17.491811752319336, "global_step": 9693, "epoch": 116} {"train_loss": -17.593429565429688, "global_step": 9694, "epoch": 116} {"train_loss": -17.55984878540039, "global_step": 9695, "epoch": 116} {"train_loss": -17.64271354675293, "global_step": 9696, "epoch": 116} {"train_loss": -17.894866943359375, "global_step": 9697, "epoch": 116} {"train_loss": -17.675107955932617, "global_step": 9698, "epoch": 116} {"train_loss": -18.011428833007812, "global_step": 9699, "epoch": 116} {"train_loss": -17.250110626220703, "global_step": 9700, "epoch": 116} {"train_loss": -17.66091537475586, "global_step": 9701, "epoch": 116} {"train_loss": -17.588315963745117, "global_step": 9702, "epoch": 116} {"train_loss": -17.83871841430664, "global_step": 9703, "epoch": 116} {"train_loss": -17.84627342224121, "global_step": 9704, "epoch": 116} {"train_loss": -17.35729217529297, "global_step": 9705, "epoch": 116} {"train_loss": -17.429019927978516, "global_step": 9706, "epoch": 116} {"train_loss": -17.360198974609375, "global_step": 9707, "epoch": 116} {"train_loss": -17.565351486206055, "global_step": 9708, "epoch": 116} {"train_loss": -17.38400650024414, "global_step": 9709, "epoch": 116} {"train_loss": -17.54980050512107, "global_step": 9710, "epoch": 116, "val_loss": 6174224.5} {"train_loss": -17.688474655151367, "global_step": 9711, "epoch": 117} {"train_loss": -17.511892318725586, "global_step": 9712, "epoch": 117} {"train_loss": -17.057004928588867, "global_step": 9713, "epoch": 117} {"train_loss": -17.640289306640625, "global_step": 9714, "epoch": 117} {"train_loss": -17.50971794128418, "global_step": 9715, "epoch": 117} {"train_loss": -17.55666732788086, "global_step": 9716, "epoch": 117} {"train_loss": -17.094438552856445, "global_step": 9717, "epoch": 117} {"train_loss": -17.621700286865234, "global_step": 9718, "epoch": 117} {"train_loss": -17.810169219970703, "global_step": 9719, "epoch": 117} {"train_loss": -17.753660202026367, "global_step": 9720, "epoch": 117} {"train_loss": -17.50249671936035, "global_step": 9721, "epoch": 117} {"train_loss": -17.645296096801758, "global_step": 9722, "epoch": 117} {"train_loss": -17.602054595947266, "global_step": 9723, "epoch": 117} {"train_loss": -17.67030143737793, "global_step": 9724, "epoch": 117} {"train_loss": -17.823184967041016, "global_step": 9725, "epoch": 117} {"train_loss": -17.825641632080078, "global_step": 9726, "epoch": 117} {"train_loss": -17.748624801635742, "global_step": 9727, "epoch": 117} {"train_loss": -17.35986328125, "global_step": 9728, "epoch": 117} {"train_loss": -17.589941024780273, "global_step": 9729, "epoch": 117} {"train_loss": -17.493877410888672, "global_step": 9730, "epoch": 117} {"train_loss": -17.707441329956055, "global_step": 9731, "epoch": 117} {"train_loss": -17.7974853515625, "global_step": 9732, "epoch": 117} {"train_loss": -17.446006774902344, "global_step": 9733, "epoch": 117} {"train_loss": -17.32430648803711, "global_step": 9734, "epoch": 117} {"train_loss": -17.685382843017578, "global_step": 9735, "epoch": 117} {"train_loss": -18.062437057495117, "global_step": 9736, "epoch": 117} {"train_loss": -17.284992218017578, "global_step": 9737, "epoch": 117} {"train_loss": -17.612119674682617, "global_step": 9738, "epoch": 117} {"train_loss": -17.474702835083008, "global_step": 9739, "epoch": 117} {"train_loss": -17.387327194213867, "global_step": 9740, "epoch": 117} {"train_loss": -17.870126724243164, "global_step": 9741, "epoch": 117} {"train_loss": -17.338457107543945, "global_step": 9742, "epoch": 117} {"train_loss": -17.27561378479004, "global_step": 9743, "epoch": 117} {"train_loss": -17.575908660888672, "global_step": 9744, "epoch": 117} {"train_loss": -17.63349723815918, "global_step": 9745, "epoch": 117} {"train_loss": -17.60862159729004, "global_step": 9746, "epoch": 117} {"train_loss": -17.775251388549805, "global_step": 9747, "epoch": 117} {"train_loss": -17.490455627441406, "global_step": 9748, "epoch": 117} {"train_loss": -17.49403953552246, "global_step": 9749, "epoch": 117} {"train_loss": -17.744260787963867, "global_step": 9750, "epoch": 117} {"train_loss": -17.701488494873047, "global_step": 9751, "epoch": 117} {"train_loss": -17.893213272094727, "global_step": 9752, "epoch": 117} {"train_loss": -17.971235275268555, "global_step": 9753, "epoch": 117} {"train_loss": -17.463727951049805, "global_step": 9754, "epoch": 117} {"train_loss": -17.809675216674805, "global_step": 9755, "epoch": 117} {"train_loss": -17.855825424194336, "global_step": 9756, "epoch": 117} {"train_loss": -17.611635208129883, "global_step": 9757, "epoch": 117} {"train_loss": -17.52760124206543, "global_step": 9758, "epoch": 117} {"train_loss": -17.789159774780273, "global_step": 9759, "epoch": 117} {"train_loss": -17.647428512573242, "global_step": 9760, "epoch": 117} {"train_loss": -17.447834014892578, "global_step": 9761, "epoch": 117} {"train_loss": -17.568115234375, "global_step": 9762, "epoch": 117} {"train_loss": -17.38408851623535, "global_step": 9763, "epoch": 117} {"train_loss": -17.53631019592285, "global_step": 9764, "epoch": 117} {"train_loss": -17.8950252532959, "global_step": 9765, "epoch": 117} {"train_loss": -17.793073654174805, "global_step": 9766, "epoch": 117} {"train_loss": -18.011144638061523, "global_step": 9767, "epoch": 117} {"train_loss": -17.421676635742188, "global_step": 9768, "epoch": 117} {"train_loss": -17.652868270874023, "global_step": 9769, "epoch": 117} {"train_loss": -17.249135971069336, "global_step": 9770, "epoch": 117} {"train_loss": -17.76464080810547, "global_step": 9771, "epoch": 117} {"train_loss": -17.173315048217773, "global_step": 9772, "epoch": 117} {"train_loss": -17.29865837097168, "global_step": 9773, "epoch": 117} {"train_loss": -18.1981258392334, "global_step": 9774, "epoch": 117} {"train_loss": -17.728849411010742, "global_step": 9775, "epoch": 117} {"train_loss": -17.560134887695312, "global_step": 9776, "epoch": 117} {"train_loss": -17.749109268188477, "global_step": 9777, "epoch": 117} {"train_loss": -17.544614791870117, "global_step": 9778, "epoch": 117} {"train_loss": -17.534645080566406, "global_step": 9779, "epoch": 117} {"train_loss": -17.697956085205078, "global_step": 9780, "epoch": 117} {"train_loss": -17.221885681152344, "global_step": 9781, "epoch": 117} {"train_loss": -17.52531623840332, "global_step": 9782, "epoch": 117} {"train_loss": -17.580835342407227, "global_step": 9783, "epoch": 117} {"train_loss": -17.650564193725586, "global_step": 9784, "epoch": 117} {"train_loss": -17.38979148864746, "global_step": 9785, "epoch": 117} {"train_loss": -17.382831573486328, "global_step": 9786, "epoch": 117} {"train_loss": -17.608808517456055, "global_step": 9787, "epoch": 117} {"train_loss": -17.517881393432617, "global_step": 9788, "epoch": 117} {"train_loss": -17.615825653076172, "global_step": 9789, "epoch": 117} {"train_loss": -17.04539680480957, "global_step": 9790, "epoch": 117} {"train_loss": -17.54914665222168, "global_step": 9791, "epoch": 117} {"train_loss": -17.432926177978516, "global_step": 9792, "epoch": 117} {"train_loss": -17.591583274933228, "global_step": 9793, "epoch": 117, "val_loss": 6291967.0} {"train_loss": -17.21515464782715, "global_step": 9794, "epoch": 118} {"train_loss": -17.498943328857422, "global_step": 9795, "epoch": 118} {"train_loss": -17.785207748413086, "global_step": 9796, "epoch": 118} {"train_loss": -17.690500259399414, "global_step": 9797, "epoch": 118} {"train_loss": -17.533828735351562, "global_step": 9798, "epoch": 118} {"train_loss": -17.349008560180664, "global_step": 9799, "epoch": 118} {"train_loss": -17.62351417541504, "global_step": 9800, "epoch": 118} {"train_loss": -17.561359405517578, "global_step": 9801, "epoch": 118} {"train_loss": -17.637243270874023, "global_step": 9802, "epoch": 118} {"train_loss": -17.239477157592773, "global_step": 9803, "epoch": 118} {"train_loss": -17.88975715637207, "global_step": 9804, "epoch": 118} {"train_loss": -17.621824264526367, "global_step": 9805, "epoch": 118} {"train_loss": -17.05105209350586, "global_step": 9806, "epoch": 118} {"train_loss": -17.353239059448242, "global_step": 9807, "epoch": 118} {"train_loss": -17.552499771118164, "global_step": 9808, "epoch": 118} {"train_loss": -17.85664939880371, "global_step": 9809, "epoch": 118} {"train_loss": -17.91636085510254, "global_step": 9810, "epoch": 118} {"train_loss": -17.780860900878906, "global_step": 9811, "epoch": 118} {"train_loss": -17.973966598510742, "global_step": 9812, "epoch": 118} {"train_loss": -17.565690994262695, "global_step": 9813, "epoch": 118} {"train_loss": -17.982755661010742, "global_step": 9814, "epoch": 118} {"train_loss": -17.8096981048584, "global_step": 9815, "epoch": 118} {"train_loss": -17.7589111328125, "global_step": 9816, "epoch": 118} {"train_loss": -17.599395751953125, "global_step": 9817, "epoch": 118} {"train_loss": -17.572153091430664, "global_step": 9818, "epoch": 118} {"train_loss": -17.810117721557617, "global_step": 9819, "epoch": 118} {"train_loss": -17.45539665222168, "global_step": 9820, "epoch": 118} {"train_loss": -17.648664474487305, "global_step": 9821, "epoch": 118} {"train_loss": -17.4118595123291, "global_step": 9822, "epoch": 118} {"train_loss": -17.447952270507812, "global_step": 9823, "epoch": 118} {"train_loss": -17.48971176147461, "global_step": 9824, "epoch": 118} {"train_loss": -17.876399993896484, "global_step": 9825, "epoch": 118} {"train_loss": -17.7163143157959, "global_step": 9826, "epoch": 118} {"train_loss": -17.47903823852539, "global_step": 9827, "epoch": 118} {"train_loss": -17.55599021911621, "global_step": 9828, "epoch": 118} {"train_loss": -17.571887969970703, "global_step": 9829, "epoch": 118} {"train_loss": -17.61453628540039, "global_step": 9830, "epoch": 118} {"train_loss": -17.5163631439209, "global_step": 9831, "epoch": 118} {"train_loss": -17.430919647216797, "global_step": 9832, "epoch": 118} {"train_loss": -17.937519073486328, "global_step": 9833, "epoch": 118} {"train_loss": -17.50508689880371, "global_step": 9834, "epoch": 118} {"train_loss": -17.653417587280273, "global_step": 9835, "epoch": 118} {"train_loss": -17.621139526367188, "global_step": 9836, "epoch": 118} {"train_loss": -17.481372833251953, "global_step": 9837, "epoch": 118} {"train_loss": -17.945316314697266, "global_step": 9838, "epoch": 118} {"train_loss": -17.663869857788086, "global_step": 9839, "epoch": 118} {"train_loss": -18.03042221069336, "global_step": 9840, "epoch": 118} {"train_loss": -17.87997817993164, "global_step": 9841, "epoch": 118} {"train_loss": -17.371219635009766, "global_step": 9842, "epoch": 118} {"train_loss": -17.74931526184082, "global_step": 9843, "epoch": 118} {"train_loss": -17.476154327392578, "global_step": 9844, "epoch": 118} {"train_loss": -17.875768661499023, "global_step": 9845, "epoch": 118} {"train_loss": -17.50858497619629, "global_step": 9846, "epoch": 118} {"train_loss": -17.638614654541016, "global_step": 9847, "epoch": 118} {"train_loss": -17.54477310180664, "global_step": 9848, "epoch": 118} {"train_loss": -17.505020141601562, "global_step": 9849, "epoch": 118} {"train_loss": -17.454763412475586, "global_step": 9850, "epoch": 118} {"train_loss": -17.499345779418945, "global_step": 9851, "epoch": 118} {"train_loss": -17.484281539916992, "global_step": 9852, "epoch": 118} {"train_loss": -17.922639846801758, "global_step": 9853, "epoch": 118} {"train_loss": -16.80609130859375, "global_step": 9854, "epoch": 118} {"train_loss": -17.517370223999023, "global_step": 9855, "epoch": 118} {"train_loss": -17.814481735229492, "global_step": 9856, "epoch": 118} {"train_loss": -17.645679473876953, "global_step": 9857, "epoch": 118} {"train_loss": -17.506847381591797, "global_step": 9858, "epoch": 118} {"train_loss": -17.4749698638916, "global_step": 9859, "epoch": 118} {"train_loss": -17.488622665405273, "global_step": 9860, "epoch": 118} {"train_loss": -17.86319923400879, "global_step": 9861, "epoch": 118} {"train_loss": -17.39348793029785, "global_step": 9862, "epoch": 118} {"train_loss": -17.76618003845215, "global_step": 9863, "epoch": 118} {"train_loss": -17.179916381835938, "global_step": 9864, "epoch": 118} {"train_loss": -17.462993621826172, "global_step": 9865, "epoch": 118} {"train_loss": -17.7338924407959, "global_step": 9866, "epoch": 118} {"train_loss": -17.98954963684082, "global_step": 9867, "epoch": 118} {"train_loss": -17.378219604492188, "global_step": 9868, "epoch": 118} {"train_loss": -17.348608016967773, "global_step": 9869, "epoch": 118} {"train_loss": -17.499906539916992, "global_step": 9870, "epoch": 118} {"train_loss": -17.65189552307129, "global_step": 9871, "epoch": 118} {"train_loss": -17.479549407958984, "global_step": 9872, "epoch": 118} {"train_loss": -17.768680572509766, "global_step": 9873, "epoch": 118} {"train_loss": -17.17790985107422, "global_step": 9874, "epoch": 118} {"train_loss": -17.157758712768555, "global_step": 9875, "epoch": 118} {"train_loss": -17.604353226811053, "global_step": 9876, "epoch": 118, "val_loss": 6167885.0} {"train_loss": -17.284915924072266, "global_step": 9877, "epoch": 119} {"train_loss": -17.57927894592285, "global_step": 9878, "epoch": 119} {"train_loss": -17.146957397460938, "global_step": 9879, "epoch": 119} {"train_loss": -17.21856689453125, "global_step": 9880, "epoch": 119} {"train_loss": -17.78780174255371, "global_step": 9881, "epoch": 119} {"train_loss": -17.727262496948242, "global_step": 9882, "epoch": 119} {"train_loss": -17.679969787597656, "global_step": 9883, "epoch": 119} {"train_loss": -17.428213119506836, "global_step": 9884, "epoch": 119} {"train_loss": -17.2532958984375, "global_step": 9885, "epoch": 119} {"train_loss": -17.577373504638672, "global_step": 9886, "epoch": 119} {"train_loss": -17.393190383911133, "global_step": 9887, "epoch": 119} {"train_loss": -17.48792839050293, "global_step": 9888, "epoch": 119} {"train_loss": -17.476774215698242, "global_step": 9889, "epoch": 119} {"train_loss": -17.458194732666016, "global_step": 9890, "epoch": 119} {"train_loss": -17.568557739257812, "global_step": 9891, "epoch": 119} {"train_loss": -17.731855392456055, "global_step": 9892, "epoch": 119} {"train_loss": -17.373655319213867, "global_step": 9893, "epoch": 119} {"train_loss": -17.428741455078125, "global_step": 9894, "epoch": 119} {"train_loss": -17.58892822265625, "global_step": 9895, "epoch": 119} {"train_loss": -16.934114456176758, "global_step": 9896, "epoch": 119} {"train_loss": -17.597179412841797, "global_step": 9897, "epoch": 119} {"train_loss": -17.433897018432617, "global_step": 9898, "epoch": 119} {"train_loss": -17.732070922851562, "global_step": 9899, "epoch": 119} {"train_loss": -17.72024917602539, "global_step": 9900, "epoch": 119} {"train_loss": -17.777257919311523, "global_step": 9901, "epoch": 119} {"train_loss": -17.415740966796875, "global_step": 9902, "epoch": 119} {"train_loss": -17.539283752441406, "global_step": 9903, "epoch": 119} {"train_loss": -17.9343318939209, "global_step": 9904, "epoch": 119} {"train_loss": -17.946157455444336, "global_step": 9905, "epoch": 119} {"train_loss": -17.616958618164062, "global_step": 9906, "epoch": 119} {"train_loss": -17.7308292388916, "global_step": 9907, "epoch": 119} {"train_loss": -17.977453231811523, "global_step": 9908, "epoch": 119} {"train_loss": -18.24720573425293, "global_step": 9909, "epoch": 119} {"train_loss": -17.899274826049805, "global_step": 9910, "epoch": 119} {"train_loss": -17.40963363647461, "global_step": 9911, "epoch": 119} {"train_loss": -17.642677307128906, "global_step": 9912, "epoch": 119} {"train_loss": -17.486806869506836, "global_step": 9913, "epoch": 119} {"train_loss": -17.555578231811523, "global_step": 9914, "epoch": 119} {"train_loss": -17.749391555786133, "global_step": 9915, "epoch": 119} {"train_loss": -17.54542350769043, "global_step": 9916, "epoch": 119} {"train_loss": -17.506038665771484, "global_step": 9917, "epoch": 119} {"train_loss": -17.835817337036133, "global_step": 9918, "epoch": 119} {"train_loss": -17.86952781677246, "global_step": 9919, "epoch": 119} {"train_loss": -17.876802444458008, "global_step": 9920, "epoch": 119} {"train_loss": -17.615896224975586, "global_step": 9921, "epoch": 119} {"train_loss": -17.704763412475586, "global_step": 9922, "epoch": 119} {"train_loss": -18.138490676879883, "global_step": 9923, "epoch": 119} {"train_loss": -17.63703727722168, "global_step": 9924, "epoch": 119} {"train_loss": -17.286195755004883, "global_step": 9925, "epoch": 119} {"train_loss": -17.641611099243164, "global_step": 9926, "epoch": 119} {"train_loss": -17.651914596557617, "global_step": 9927, "epoch": 119} {"train_loss": -17.826154708862305, "global_step": 9928, "epoch": 119} {"train_loss": -17.874614715576172, "global_step": 9929, "epoch": 119} {"train_loss": -17.5792293548584, "global_step": 9930, "epoch": 119} {"train_loss": -17.755727767944336, "global_step": 9931, "epoch": 119} {"train_loss": -17.75324058532715, "global_step": 9932, "epoch": 119} {"train_loss": -17.36228370666504, "global_step": 9933, "epoch": 119} {"train_loss": -17.466426849365234, "global_step": 9934, "epoch": 119} {"train_loss": -17.77261734008789, "global_step": 9935, "epoch": 119} {"train_loss": -17.17049217224121, "global_step": 9936, "epoch": 119} {"train_loss": -17.770273208618164, "global_step": 9937, "epoch": 119} {"train_loss": -17.493879318237305, "global_step": 9938, "epoch": 119} {"train_loss": -17.835664749145508, "global_step": 9939, "epoch": 119} {"train_loss": -17.79292106628418, "global_step": 9940, "epoch": 119} {"train_loss": -17.715259552001953, "global_step": 9941, "epoch": 119} {"train_loss": -17.245458602905273, "global_step": 9942, "epoch": 119} {"train_loss": -17.679487228393555, "global_step": 9943, "epoch": 119} {"train_loss": -17.746912002563477, "global_step": 9944, "epoch": 119} {"train_loss": -17.474559783935547, "global_step": 9945, "epoch": 119} {"train_loss": -17.64981460571289, "global_step": 9946, "epoch": 119} {"train_loss": -17.584577560424805, "global_step": 9947, "epoch": 119} {"train_loss": -17.4008731842041, "global_step": 9948, "epoch": 119} {"train_loss": -17.611865997314453, "global_step": 9949, "epoch": 119} {"train_loss": -17.48227882385254, "global_step": 9950, "epoch": 119} {"train_loss": -17.63926124572754, "global_step": 9951, "epoch": 119} {"train_loss": -17.331205368041992, "global_step": 9952, "epoch": 119} {"train_loss": -17.72465705871582, "global_step": 9953, "epoch": 119} {"train_loss": -17.643898010253906, "global_step": 9954, "epoch": 119} {"train_loss": -17.62447166442871, "global_step": 9955, "epoch": 119} {"train_loss": -17.509740829467773, "global_step": 9956, "epoch": 119} {"train_loss": -17.872480392456055, "global_step": 9957, "epoch": 119} {"train_loss": -17.490509033203125, "global_step": 9958, "epoch": 119} {"train_loss": -17.59883676092309, "global_step": 9959, "epoch": 119, "val_loss": 6051247.0} {"train_loss": -17.105880737304688, "global_step": 9960, "epoch": 120} {"train_loss": -17.52700424194336, "global_step": 9961, "epoch": 120} {"train_loss": -17.58614158630371, "global_step": 9962, "epoch": 120} {"train_loss": -17.199527740478516, "global_step": 9963, "epoch": 120} {"train_loss": -17.469877243041992, "global_step": 9964, "epoch": 120} {"train_loss": -17.537281036376953, "global_step": 9965, "epoch": 120} {"train_loss": -17.446317672729492, "global_step": 9966, "epoch": 120} {"train_loss": -17.52838706970215, "global_step": 9967, "epoch": 120} {"train_loss": -17.659957885742188, "global_step": 9968, "epoch": 120} {"train_loss": -17.261228561401367, "global_step": 9969, "epoch": 120} {"train_loss": -17.759748458862305, "global_step": 9970, "epoch": 120} {"train_loss": -17.691104888916016, "global_step": 9971, "epoch": 120} {"train_loss": -17.690526962280273, "global_step": 9972, "epoch": 120} {"train_loss": -17.511539459228516, "global_step": 9973, "epoch": 120} {"train_loss": -17.583847045898438, "global_step": 9974, "epoch": 120} {"train_loss": -17.2376708984375, "global_step": 9975, "epoch": 120} {"train_loss": -17.43495750427246, "global_step": 9976, "epoch": 120} {"train_loss": -17.423175811767578, "global_step": 9977, "epoch": 120} {"train_loss": -17.52447509765625, "global_step": 9978, "epoch": 120} {"train_loss": -17.69327163696289, "global_step": 9979, "epoch": 120} {"train_loss": -17.806547164916992, "global_step": 9980, "epoch": 120} {"train_loss": -17.152179718017578, "global_step": 9981, "epoch": 120} {"train_loss": -17.769559860229492, "global_step": 9982, "epoch": 120} {"train_loss": -17.96525001525879, "global_step": 9983, "epoch": 120} {"train_loss": -17.61139488220215, "global_step": 9984, "epoch": 120} {"train_loss": -17.464208602905273, "global_step": 9985, "epoch": 120} {"train_loss": -18.012313842773438, "global_step": 9986, "epoch": 120} {"train_loss": -17.96625328063965, "global_step": 9987, "epoch": 120} {"train_loss": -17.3111629486084, "global_step": 9988, "epoch": 120} {"train_loss": -17.545734405517578, "global_step": 9989, "epoch": 120} {"train_loss": -16.91205406188965, "global_step": 9990, "epoch": 120} {"train_loss": -17.84543228149414, "global_step": 9991, "epoch": 120} {"train_loss": -17.466964721679688, "global_step": 9992, "epoch": 120} {"train_loss": -17.433927536010742, "global_step": 9993, "epoch": 120} {"train_loss": -17.64713478088379, "global_step": 9994, "epoch": 120} {"train_loss": -17.413850784301758, "global_step": 9995, "epoch": 120} {"train_loss": -17.662017822265625, "global_step": 9996, "epoch": 120} {"train_loss": -17.55908203125, "global_step": 9997, "epoch": 120} {"train_loss": -17.863683700561523, "global_step": 9998, "epoch": 120} {"train_loss": -17.61024284362793, "global_step": 9999, "epoch": 120} {"train_loss": -17.73029136657715, "global_step": 10000, "epoch": 120} {"train_loss": -17.6502685546875, "global_step": 10001, "epoch": 120} {"train_loss": -17.54695701599121, "global_step": 10002, "epoch": 120} {"train_loss": -17.942258834838867, "global_step": 10003, "epoch": 120} {"train_loss": -17.321542739868164, "global_step": 10004, "epoch": 120} {"train_loss": -17.594858169555664, "global_step": 10005, "epoch": 120} {"train_loss": -17.20387840270996, "global_step": 10006, "epoch": 120} {"train_loss": -17.57501792907715, "global_step": 10007, "epoch": 120} {"train_loss": -18.007904052734375, "global_step": 10008, "epoch": 120} {"train_loss": -17.98175621032715, "global_step": 10009, "epoch": 120} {"train_loss": -17.810964584350586, "global_step": 10010, "epoch": 120} {"train_loss": -17.534330368041992, "global_step": 10011, "epoch": 120} {"train_loss": -17.700162887573242, "global_step": 10012, "epoch": 120} {"train_loss": -17.830135345458984, "global_step": 10013, "epoch": 120} {"train_loss": -17.590900421142578, "global_step": 10014, "epoch": 120} {"train_loss": -17.520936965942383, "global_step": 10015, "epoch": 120} {"train_loss": -17.74155616760254, "global_step": 10016, "epoch": 120} {"train_loss": -17.59847068786621, "global_step": 10017, "epoch": 120} {"train_loss": -17.60289764404297, "global_step": 10018, "epoch": 120} {"train_loss": -17.696500778198242, "global_step": 10019, "epoch": 120} {"train_loss": -18.150230407714844, "global_step": 10020, "epoch": 120} {"train_loss": -17.51861572265625, "global_step": 10021, "epoch": 120} {"train_loss": -17.879043579101562, "global_step": 10022, "epoch": 120} {"train_loss": -17.813400268554688, "global_step": 10023, "epoch": 120} {"train_loss": -17.885305404663086, "global_step": 10024, "epoch": 120} {"train_loss": -18.04340171813965, "global_step": 10025, "epoch": 120} {"train_loss": -17.526906967163086, "global_step": 10026, "epoch": 120} {"train_loss": -17.879650115966797, "global_step": 10027, "epoch": 120} {"train_loss": -17.48969078063965, "global_step": 10028, "epoch": 120} {"train_loss": -17.35512351989746, "global_step": 10029, "epoch": 120} {"train_loss": -17.75052261352539, "global_step": 10030, "epoch": 120} {"train_loss": -17.412612915039062, "global_step": 10031, "epoch": 120} {"train_loss": -17.97735023498535, "global_step": 10032, "epoch": 120} {"train_loss": -17.556381225585938, "global_step": 10033, "epoch": 120} {"train_loss": -17.535850524902344, "global_step": 10034, "epoch": 120} {"train_loss": -17.420475006103516, "global_step": 10035, "epoch": 120} {"train_loss": -17.917394638061523, "global_step": 10036, "epoch": 120} {"train_loss": -17.069379806518555, "global_step": 10037, "epoch": 120} {"train_loss": -17.70197868347168, "global_step": 10038, "epoch": 120} {"train_loss": -17.54865074157715, "global_step": 10039, "epoch": 120} {"train_loss": -17.603071212768555, "global_step": 10040, "epoch": 120} {"train_loss": -17.656566619873047, "global_step": 10041, "epoch": 120} {"train_loss": -17.6076172978045, "global_step": 10042, "epoch": 120, "val_loss": 6171637.5} {"train_loss": -17.392501831054688, "global_step": 10043, "epoch": 121} {"train_loss": -17.61577796936035, "global_step": 10044, "epoch": 121} {"train_loss": -16.64654541015625, "global_step": 10045, "epoch": 121} {"train_loss": -17.83497428894043, "global_step": 10046, "epoch": 121} {"train_loss": -17.44869041442871, "global_step": 10047, "epoch": 121} {"train_loss": -17.636262893676758, "global_step": 10048, "epoch": 121} {"train_loss": -17.14414405822754, "global_step": 10049, "epoch": 121} {"train_loss": -17.436599731445312, "global_step": 10050, "epoch": 121} {"train_loss": -17.672962188720703, "global_step": 10051, "epoch": 121} {"train_loss": -17.39031982421875, "global_step": 10052, "epoch": 121} {"train_loss": -17.786161422729492, "global_step": 10053, "epoch": 121} {"train_loss": -17.306989669799805, "global_step": 10054, "epoch": 121} {"train_loss": -17.89382553100586, "global_step": 10055, "epoch": 121} {"train_loss": -17.42447853088379, "global_step": 10056, "epoch": 121} {"train_loss": -17.458759307861328, "global_step": 10057, "epoch": 121} {"train_loss": -17.665115356445312, "global_step": 10058, "epoch": 121} {"train_loss": -17.234472274780273, "global_step": 10059, "epoch": 121} {"train_loss": -17.44868278503418, "global_step": 10060, "epoch": 121} {"train_loss": -18.170886993408203, "global_step": 10061, "epoch": 121} {"train_loss": -17.618642807006836, "global_step": 10062, "epoch": 121} {"train_loss": -17.468421936035156, "global_step": 10063, "epoch": 121} {"train_loss": -17.407819747924805, "global_step": 10064, "epoch": 121} {"train_loss": -17.488645553588867, "global_step": 10065, "epoch": 121} {"train_loss": -17.59078025817871, "global_step": 10066, "epoch": 121} {"train_loss": -17.721515655517578, "global_step": 10067, "epoch": 121} {"train_loss": -17.677549362182617, "global_step": 10068, "epoch": 121} {"train_loss": -17.538488388061523, "global_step": 10069, "epoch": 121} {"train_loss": -17.77141761779785, "global_step": 10070, "epoch": 121} {"train_loss": -17.668405532836914, "global_step": 10071, "epoch": 121} {"train_loss": -18.088293075561523, "global_step": 10072, "epoch": 121} {"train_loss": -17.992948532104492, "global_step": 10073, "epoch": 121} {"train_loss": -17.709760665893555, "global_step": 10074, "epoch": 121} {"train_loss": -17.448808670043945, "global_step": 10075, "epoch": 121} {"train_loss": -17.45257568359375, "global_step": 10076, "epoch": 121} {"train_loss": -17.66431999206543, "global_step": 10077, "epoch": 121} {"train_loss": -17.55800437927246, "global_step": 10078, "epoch": 121} {"train_loss": -17.66053009033203, "global_step": 10079, "epoch": 121} {"train_loss": -17.7637939453125, "global_step": 10080, "epoch": 121} {"train_loss": -17.553897857666016, "global_step": 10081, "epoch": 121} {"train_loss": -17.644927978515625, "global_step": 10082, "epoch": 121} {"train_loss": -17.51333999633789, "global_step": 10083, "epoch": 121} {"train_loss": -17.661184310913086, "global_step": 10084, "epoch": 121} {"train_loss": -17.453943252563477, "global_step": 10085, "epoch": 121} {"train_loss": -17.522071838378906, "global_step": 10086, "epoch": 121} {"train_loss": -17.462568283081055, "global_step": 10087, "epoch": 121} {"train_loss": -17.59375, "global_step": 10088, "epoch": 121} {"train_loss": -17.315710067749023, "global_step": 10089, "epoch": 121} {"train_loss": -17.557153701782227, "global_step": 10090, "epoch": 121} {"train_loss": -17.5234317779541, "global_step": 10091, "epoch": 121} {"train_loss": -18.152667999267578, "global_step": 10092, "epoch": 121} {"train_loss": -17.636302947998047, "global_step": 10093, "epoch": 121} {"train_loss": -17.777587890625, "global_step": 10094, "epoch": 121} {"train_loss": -17.876888275146484, "global_step": 10095, "epoch": 121} {"train_loss": -17.62653923034668, "global_step": 10096, "epoch": 121} {"train_loss": -17.26152229309082, "global_step": 10097, "epoch": 121} {"train_loss": -17.428800582885742, "global_step": 10098, "epoch": 121} {"train_loss": -17.45234489440918, "global_step": 10099, "epoch": 121} {"train_loss": -17.90557098388672, "global_step": 10100, "epoch": 121} {"train_loss": -17.663557052612305, "global_step": 10101, "epoch": 121} {"train_loss": -17.926250457763672, "global_step": 10102, "epoch": 121} {"train_loss": -17.620655059814453, "global_step": 10103, "epoch": 121} {"train_loss": -17.650537490844727, "global_step": 10104, "epoch": 121} {"train_loss": -17.93764305114746, "global_step": 10105, "epoch": 121} {"train_loss": -17.651350021362305, "global_step": 10106, "epoch": 121} {"train_loss": -17.669424057006836, "global_step": 10107, "epoch": 121} {"train_loss": -17.651039123535156, "global_step": 10108, "epoch": 121} {"train_loss": -17.67925262451172, "global_step": 10109, "epoch": 121} {"train_loss": -17.985946655273438, "global_step": 10110, "epoch": 121} {"train_loss": -17.629838943481445, "global_step": 10111, "epoch": 121} {"train_loss": -17.479320526123047, "global_step": 10112, "epoch": 121} {"train_loss": -17.758655548095703, "global_step": 10113, "epoch": 121} {"train_loss": -17.709457397460938, "global_step": 10114, "epoch": 121} {"train_loss": -17.4760684967041, "global_step": 10115, "epoch": 121} {"train_loss": -17.33767318725586, "global_step": 10116, "epoch": 121} {"train_loss": -17.625164031982422, "global_step": 10117, "epoch": 121} {"train_loss": -17.584369659423828, "global_step": 10118, "epoch": 121} {"train_loss": -17.856807708740234, "global_step": 10119, "epoch": 121} {"train_loss": -17.73714256286621, "global_step": 10120, "epoch": 121} {"train_loss": -17.480403900146484, "global_step": 10121, "epoch": 121} {"train_loss": -17.874372482299805, "global_step": 10122, "epoch": 121} {"train_loss": -17.35175895690918, "global_step": 10123, "epoch": 121} {"train_loss": -17.954160690307617, "global_step": 10124, "epoch": 121} {"train_loss": -17.618569040872966, "global_step": 10125, "epoch": 121, "val_loss": 6029530.0} {"train_loss": -17.880664825439453, "global_step": 10126, "epoch": 122} {"train_loss": -18.039871215820312, "global_step": 10127, "epoch": 122} {"train_loss": -17.66611099243164, "global_step": 10128, "epoch": 122} {"train_loss": -17.917409896850586, "global_step": 10129, "epoch": 122} {"train_loss": -17.276086807250977, "global_step": 10130, "epoch": 122} {"train_loss": -17.98977279663086, "global_step": 10131, "epoch": 122} {"train_loss": -17.639081954956055, "global_step": 10132, "epoch": 122} {"train_loss": -17.67372703552246, "global_step": 10133, "epoch": 122} {"train_loss": -17.343671798706055, "global_step": 10134, "epoch": 122} {"train_loss": -17.86484718322754, "global_step": 10135, "epoch": 122} {"train_loss": -17.930253982543945, "global_step": 10136, "epoch": 122} {"train_loss": -17.820432662963867, "global_step": 10137, "epoch": 122} {"train_loss": -17.8102970123291, "global_step": 10138, "epoch": 122} {"train_loss": -17.872800827026367, "global_step": 10139, "epoch": 122} {"train_loss": -17.403091430664062, "global_step": 10140, "epoch": 122} {"train_loss": -17.482091903686523, "global_step": 10141, "epoch": 122} {"train_loss": -17.712100982666016, "global_step": 10142, "epoch": 122} {"train_loss": -17.661727905273438, "global_step": 10143, "epoch": 122} {"train_loss": -17.2818603515625, "global_step": 10144, "epoch": 122} {"train_loss": -17.617584228515625, "global_step": 10145, "epoch": 122} {"train_loss": -17.923730850219727, "global_step": 10146, "epoch": 122} {"train_loss": -17.437002182006836, "global_step": 10147, "epoch": 122} {"train_loss": -17.764846801757812, "global_step": 10148, "epoch": 122} {"train_loss": -17.142316818237305, "global_step": 10149, "epoch": 122} {"train_loss": -17.366262435913086, "global_step": 10150, "epoch": 122} {"train_loss": -17.882911682128906, "global_step": 10151, "epoch": 122} {"train_loss": -17.78850746154785, "global_step": 10152, "epoch": 122} {"train_loss": -17.45512580871582, "global_step": 10153, "epoch": 122} {"train_loss": -17.23347282409668, "global_step": 10154, "epoch": 122} {"train_loss": -17.361652374267578, "global_step": 10155, "epoch": 122} {"train_loss": -18.24295997619629, "global_step": 10156, "epoch": 122} {"train_loss": -17.860702514648438, "global_step": 10157, "epoch": 122} {"train_loss": -17.681964874267578, "global_step": 10158, "epoch": 122} {"train_loss": -17.43979835510254, "global_step": 10159, "epoch": 122} {"train_loss": -17.467432022094727, "global_step": 10160, "epoch": 122} {"train_loss": -17.770986557006836, "global_step": 10161, "epoch": 122} {"train_loss": -17.898338317871094, "global_step": 10162, "epoch": 122} {"train_loss": -17.155141830444336, "global_step": 10163, "epoch": 122} {"train_loss": -17.745025634765625, "global_step": 10164, "epoch": 122} {"train_loss": -17.50240135192871, "global_step": 10165, "epoch": 122} {"train_loss": -17.754852294921875, "global_step": 10166, "epoch": 122} {"train_loss": -17.671621322631836, "global_step": 10167, "epoch": 122} {"train_loss": -17.43633460998535, "global_step": 10168, "epoch": 122} {"train_loss": -17.68440055847168, "global_step": 10169, "epoch": 122} {"train_loss": -17.620603561401367, "global_step": 10170, "epoch": 122} {"train_loss": -17.504467010498047, "global_step": 10171, "epoch": 122} {"train_loss": -17.204050064086914, "global_step": 10172, "epoch": 122} {"train_loss": -17.48229217529297, "global_step": 10173, "epoch": 122} {"train_loss": -17.721086502075195, "global_step": 10174, "epoch": 122} {"train_loss": -17.86647605895996, "global_step": 10175, "epoch": 122} {"train_loss": -17.51947593688965, "global_step": 10176, "epoch": 122} {"train_loss": -17.795608520507812, "global_step": 10177, "epoch": 122} {"train_loss": -17.37139320373535, "global_step": 10178, "epoch": 122} {"train_loss": -17.69399070739746, "global_step": 10179, "epoch": 122} {"train_loss": -17.405122756958008, "global_step": 10180, "epoch": 122} {"train_loss": -17.605680465698242, "global_step": 10181, "epoch": 122} {"train_loss": -17.225784301757812, "global_step": 10182, "epoch": 122} {"train_loss": -17.947221755981445, "global_step": 10183, "epoch": 122} {"train_loss": -17.76753807067871, "global_step": 10184, "epoch": 122} {"train_loss": -17.615806579589844, "global_step": 10185, "epoch": 122} {"train_loss": -17.73782730102539, "global_step": 10186, "epoch": 122} {"train_loss": -17.98562240600586, "global_step": 10187, "epoch": 122} {"train_loss": -17.37009048461914, "global_step": 10188, "epoch": 122} {"train_loss": -17.642642974853516, "global_step": 10189, "epoch": 122} {"train_loss": -17.55898094177246, "global_step": 10190, "epoch": 122} {"train_loss": -17.680612564086914, "global_step": 10191, "epoch": 122} {"train_loss": -17.6297664642334, "global_step": 10192, "epoch": 122} {"train_loss": -18.09230613708496, "global_step": 10193, "epoch": 122} {"train_loss": -17.256641387939453, "global_step": 10194, "epoch": 122} {"train_loss": -17.662797927856445, "global_step": 10195, "epoch": 122} {"train_loss": -17.428564071655273, "global_step": 10196, "epoch": 122} {"train_loss": -17.92580223083496, "global_step": 10197, "epoch": 122} {"train_loss": -17.66334342956543, "global_step": 10198, "epoch": 122} {"train_loss": -17.690710067749023, "global_step": 10199, "epoch": 122} {"train_loss": -18.10027503967285, "global_step": 10200, "epoch": 122} {"train_loss": -17.948728561401367, "global_step": 10201, "epoch": 122} {"train_loss": -17.531574249267578, "global_step": 10202, "epoch": 122} {"train_loss": -17.79798126220703, "global_step": 10203, "epoch": 122} {"train_loss": -17.371232986450195, "global_step": 10204, "epoch": 122} {"train_loss": -17.556970596313477, "global_step": 10205, "epoch": 122} {"train_loss": -17.85725212097168, "global_step": 10206, "epoch": 122} {"train_loss": -17.652812957763672, "global_step": 10207, "epoch": 122} {"train_loss": -17.639352384820043, "global_step": 10208, "epoch": 122, "val_loss": 6166348.5} {"train_loss": -17.431262969970703, "global_step": 10209, "epoch": 123} {"train_loss": -17.662065505981445, "global_step": 10210, "epoch": 123} {"train_loss": -17.815963745117188, "global_step": 10211, "epoch": 123} {"train_loss": -18.021026611328125, "global_step": 10212, "epoch": 123} {"train_loss": -17.523157119750977, "global_step": 10213, "epoch": 123} {"train_loss": -17.332456588745117, "global_step": 10214, "epoch": 123} {"train_loss": -17.601520538330078, "global_step": 10215, "epoch": 123} {"train_loss": -17.7120361328125, "global_step": 10216, "epoch": 123} {"train_loss": -17.42197608947754, "global_step": 10217, "epoch": 123} {"train_loss": -17.411142349243164, "global_step": 10218, "epoch": 123} {"train_loss": -17.789371490478516, "global_step": 10219, "epoch": 123} {"train_loss": -17.81155776977539, "global_step": 10220, "epoch": 123} {"train_loss": -17.593992233276367, "global_step": 10221, "epoch": 123} {"train_loss": -17.558500289916992, "global_step": 10222, "epoch": 123} {"train_loss": -17.73258399963379, "global_step": 10223, "epoch": 123} {"train_loss": -17.523456573486328, "global_step": 10224, "epoch": 123} {"train_loss": -17.6096134185791, "global_step": 10225, "epoch": 123} {"train_loss": -17.844388961791992, "global_step": 10226, "epoch": 123} {"train_loss": -17.582395553588867, "global_step": 10227, "epoch": 123} {"train_loss": -17.591827392578125, "global_step": 10228, "epoch": 123} {"train_loss": -17.534719467163086, "global_step": 10229, "epoch": 123} {"train_loss": -17.899633407592773, "global_step": 10230, "epoch": 123} {"train_loss": -17.46685791015625, "global_step": 10231, "epoch": 123} {"train_loss": -17.78443145751953, "global_step": 10232, "epoch": 123} {"train_loss": -17.982999801635742, "global_step": 10233, "epoch": 123} {"train_loss": -17.63028335571289, "global_step": 10234, "epoch": 123} {"train_loss": -17.76979637145996, "global_step": 10235, "epoch": 123} {"train_loss": -17.61028289794922, "global_step": 10236, "epoch": 123} {"train_loss": -17.355741500854492, "global_step": 10237, "epoch": 123} {"train_loss": -17.264850616455078, "global_step": 10238, "epoch": 123} {"train_loss": -17.285043716430664, "global_step": 10239, "epoch": 123} {"train_loss": -17.630544662475586, "global_step": 10240, "epoch": 123} {"train_loss": -17.64361000061035, "global_step": 10241, "epoch": 123} {"train_loss": -17.82620620727539, "global_step": 10242, "epoch": 123} {"train_loss": -17.91998291015625, "global_step": 10243, "epoch": 123} {"train_loss": -17.218618392944336, "global_step": 10244, "epoch": 123} {"train_loss": -17.609716415405273, "global_step": 10245, "epoch": 123} {"train_loss": -17.484806060791016, "global_step": 10246, "epoch": 123} {"train_loss": -17.753820419311523, "global_step": 10247, "epoch": 123} {"train_loss": -17.609363555908203, "global_step": 10248, "epoch": 123} {"train_loss": -17.934709548950195, "global_step": 10249, "epoch": 123} {"train_loss": -17.6926326751709, "global_step": 10250, "epoch": 123} {"train_loss": -17.694229125976562, "global_step": 10251, "epoch": 123} {"train_loss": -18.02815055847168, "global_step": 10252, "epoch": 123} {"train_loss": -17.829622268676758, "global_step": 10253, "epoch": 123} {"train_loss": -17.93879508972168, "global_step": 10254, "epoch": 123} {"train_loss": -17.506980895996094, "global_step": 10255, "epoch": 123} {"train_loss": -17.6790828704834, "global_step": 10256, "epoch": 123} {"train_loss": -17.286901473999023, "global_step": 10257, "epoch": 123} {"train_loss": -17.790109634399414, "global_step": 10258, "epoch": 123} {"train_loss": -17.484210968017578, "global_step": 10259, "epoch": 123} {"train_loss": -18.12989616394043, "global_step": 10260, "epoch": 123} {"train_loss": -17.61049461364746, "global_step": 10261, "epoch": 123} {"train_loss": -17.43560791015625, "global_step": 10262, "epoch": 123} {"train_loss": -17.54630470275879, "global_step": 10263, "epoch": 123} {"train_loss": -17.67631721496582, "global_step": 10264, "epoch": 123} {"train_loss": -17.434415817260742, "global_step": 10265, "epoch": 123} {"train_loss": -18.004789352416992, "global_step": 10266, "epoch": 123} {"train_loss": -17.48424530029297, "global_step": 10267, "epoch": 123} {"train_loss": -17.91246223449707, "global_step": 10268, "epoch": 123} {"train_loss": -17.654455184936523, "global_step": 10269, "epoch": 123} {"train_loss": -17.497013092041016, "global_step": 10270, "epoch": 123} {"train_loss": -17.75848960876465, "global_step": 10271, "epoch": 123} {"train_loss": -17.004209518432617, "global_step": 10272, "epoch": 123} {"train_loss": -17.53020668029785, "global_step": 10273, "epoch": 123} {"train_loss": -17.54273796081543, "global_step": 10274, "epoch": 123} {"train_loss": -17.64977264404297, "global_step": 10275, "epoch": 123} {"train_loss": -17.49742317199707, "global_step": 10276, "epoch": 123} {"train_loss": -18.04031753540039, "global_step": 10277, "epoch": 123} {"train_loss": -18.065265655517578, "global_step": 10278, "epoch": 123} {"train_loss": -17.59810447692871, "global_step": 10279, "epoch": 123} {"train_loss": -17.644262313842773, "global_step": 10280, "epoch": 123} {"train_loss": -17.783597946166992, "global_step": 10281, "epoch": 123} {"train_loss": -17.635347366333008, "global_step": 10282, "epoch": 123} {"train_loss": -17.863237380981445, "global_step": 10283, "epoch": 123} {"train_loss": -17.89127540588379, "global_step": 10284, "epoch": 123} {"train_loss": -17.57857322692871, "global_step": 10285, "epoch": 123} {"train_loss": -17.598983764648438, "global_step": 10286, "epoch": 123} {"train_loss": -18.15520668029785, "global_step": 10287, "epoch": 123} {"train_loss": -17.258573532104492, "global_step": 10288, "epoch": 123} {"train_loss": -17.886188507080078, "global_step": 10289, "epoch": 123} {"train_loss": -17.666473388671875, "global_step": 10290, "epoch": 123} {"train_loss": -17.68007209502071, "global_step": 10291, "epoch": 123, "val_loss": 6237128.0} {"train_loss": -18.029653549194336, "global_step": 10292, "epoch": 124} {"train_loss": -17.840518951416016, "global_step": 10293, "epoch": 124} {"train_loss": -17.3333797454834, "global_step": 10294, "epoch": 124} {"train_loss": -17.739946365356445, "global_step": 10295, "epoch": 124} {"train_loss": -17.510887145996094, "global_step": 10296, "epoch": 124} {"train_loss": -17.5136775970459, "global_step": 10297, "epoch": 124} {"train_loss": -17.47605323791504, "global_step": 10298, "epoch": 124} {"train_loss": -17.507583618164062, "global_step": 10299, "epoch": 124} {"train_loss": -17.18135643005371, "global_step": 10300, "epoch": 124} {"train_loss": -17.700284957885742, "global_step": 10301, "epoch": 124} {"train_loss": -17.622777938842773, "global_step": 10302, "epoch": 124} {"train_loss": -18.000690460205078, "global_step": 10303, "epoch": 124} {"train_loss": -17.893396377563477, "global_step": 10304, "epoch": 124} {"train_loss": -17.42267417907715, "global_step": 10305, "epoch": 124} {"train_loss": -17.628528594970703, "global_step": 10306, "epoch": 124} {"train_loss": -17.328855514526367, "global_step": 10307, "epoch": 124} {"train_loss": -17.647226333618164, "global_step": 10308, "epoch": 124} {"train_loss": -17.778221130371094, "global_step": 10309, "epoch": 124} {"train_loss": -17.7221622467041, "global_step": 10310, "epoch": 124} {"train_loss": -17.94915008544922, "global_step": 10311, "epoch": 124} {"train_loss": -17.6319580078125, "global_step": 10312, "epoch": 124} {"train_loss": -17.736221313476562, "global_step": 10313, "epoch": 124} {"train_loss": -17.25782585144043, "global_step": 10314, "epoch": 124} {"train_loss": -17.493505477905273, "global_step": 10315, "epoch": 124} {"train_loss": -17.365467071533203, "global_step": 10316, "epoch": 124} {"train_loss": -17.525842666625977, "global_step": 10317, "epoch": 124} {"train_loss": -17.639320373535156, "global_step": 10318, "epoch": 124} {"train_loss": -17.676897048950195, "global_step": 10319, "epoch": 124} {"train_loss": -17.824573516845703, "global_step": 10320, "epoch": 124} {"train_loss": -17.771408081054688, "global_step": 10321, "epoch": 124} {"train_loss": -17.822874069213867, "global_step": 10322, "epoch": 124} {"train_loss": -17.796833038330078, "global_step": 10323, "epoch": 124} {"train_loss": -18.00947380065918, "global_step": 10324, "epoch": 124} {"train_loss": -17.80617332458496, "global_step": 10325, "epoch": 124} {"train_loss": -17.284109115600586, "global_step": 10326, "epoch": 124} {"train_loss": -17.71299934387207, "global_step": 10327, "epoch": 124} {"train_loss": -17.87946128845215, "global_step": 10328, "epoch": 124} {"train_loss": -17.73628807067871, "global_step": 10329, "epoch": 124} {"train_loss": -18.098005294799805, "global_step": 10330, "epoch": 124} {"train_loss": -17.423559188842773, "global_step": 10331, "epoch": 124} {"train_loss": -17.833288192749023, "global_step": 10332, "epoch": 124} {"train_loss": -18.16855239868164, "global_step": 10333, "epoch": 124} {"train_loss": -17.57485008239746, "global_step": 10334, "epoch": 124} {"train_loss": -17.743616104125977, "global_step": 10335, "epoch": 124} {"train_loss": -17.668506622314453, "global_step": 10336, "epoch": 124} {"train_loss": -17.779356002807617, "global_step": 10337, "epoch": 124} {"train_loss": -17.632524490356445, "global_step": 10338, "epoch": 124} {"train_loss": -17.322355270385742, "global_step": 10339, "epoch": 124} {"train_loss": -17.73072624206543, "global_step": 10340, "epoch": 124} {"train_loss": -17.771137237548828, "global_step": 10341, "epoch": 124} {"train_loss": -18.033740997314453, "global_step": 10342, "epoch": 124} {"train_loss": -17.344390869140625, "global_step": 10343, "epoch": 124} {"train_loss": -17.90462303161621, "global_step": 10344, "epoch": 124} {"train_loss": -17.886703491210938, "global_step": 10345, "epoch": 124} {"train_loss": -17.549259185791016, "global_step": 10346, "epoch": 124} {"train_loss": -17.3813419342041, "global_step": 10347, "epoch": 124} {"train_loss": -17.662221908569336, "global_step": 10348, "epoch": 124} {"train_loss": -17.708694458007812, "global_step": 10349, "epoch": 124} {"train_loss": -17.388029098510742, "global_step": 10350, "epoch": 124} {"train_loss": -17.350996017456055, "global_step": 10351, "epoch": 124} {"train_loss": -17.94110107421875, "global_step": 10352, "epoch": 124} {"train_loss": -17.835599899291992, "global_step": 10353, "epoch": 124} {"train_loss": -17.40319061279297, "global_step": 10354, "epoch": 124} {"train_loss": -17.761173248291016, "global_step": 10355, "epoch": 124} {"train_loss": -17.45570945739746, "global_step": 10356, "epoch": 124} {"train_loss": -17.677488327026367, "global_step": 10357, "epoch": 124} {"train_loss": -17.576892852783203, "global_step": 10358, "epoch": 124} {"train_loss": -17.495939254760742, "global_step": 10359, "epoch": 124} {"train_loss": -17.960712432861328, "global_step": 10360, "epoch": 124} {"train_loss": -17.957284927368164, "global_step": 10361, "epoch": 124} {"train_loss": -17.28135108947754, "global_step": 10362, "epoch": 124} {"train_loss": -17.402372360229492, "global_step": 10363, "epoch": 124} {"train_loss": -18.00698471069336, "global_step": 10364, "epoch": 124} {"train_loss": -17.615447998046875, "global_step": 10365, "epoch": 124} {"train_loss": -17.925992965698242, "global_step": 10366, "epoch": 124} {"train_loss": -17.54157066345215, "global_step": 10367, "epoch": 124} {"train_loss": -18.074567794799805, "global_step": 10368, "epoch": 124} {"train_loss": -17.799144744873047, "global_step": 10369, "epoch": 124} {"train_loss": -17.38484764099121, "global_step": 10370, "epoch": 124} {"train_loss": -17.669151306152344, "global_step": 10371, "epoch": 124} {"train_loss": -17.684736251831055, "global_step": 10372, "epoch": 124} {"train_loss": -17.679166793823242, "global_step": 10373, "epoch": 124} {"train_loss": -17.684028119925994, "global_step": 10374, "epoch": 124, "val_loss": 6143322.0} {"train_loss": -17.430768966674805, "global_step": 10375, "epoch": 125} {"train_loss": -17.258949279785156, "global_step": 10376, "epoch": 125} {"train_loss": -17.591337203979492, "global_step": 10377, "epoch": 125} {"train_loss": -17.509374618530273, "global_step": 10378, "epoch": 125} {"train_loss": -17.625608444213867, "global_step": 10379, "epoch": 125} {"train_loss": -17.55611228942871, "global_step": 10380, "epoch": 125} {"train_loss": -17.810195922851562, "global_step": 10381, "epoch": 125} {"train_loss": -17.85575294494629, "global_step": 10382, "epoch": 125} {"train_loss": -17.876752853393555, "global_step": 10383, "epoch": 125} {"train_loss": -17.389713287353516, "global_step": 10384, "epoch": 125} {"train_loss": -18.064477920532227, "global_step": 10385, "epoch": 125} {"train_loss": -18.002992630004883, "global_step": 10386, "epoch": 125} {"train_loss": -17.865337371826172, "global_step": 10387, "epoch": 125} {"train_loss": -17.46786880493164, "global_step": 10388, "epoch": 125} {"train_loss": -17.81801414489746, "global_step": 10389, "epoch": 125} {"train_loss": -17.5264892578125, "global_step": 10390, "epoch": 125} {"train_loss": -17.622007369995117, "global_step": 10391, "epoch": 125} {"train_loss": -17.601423263549805, "global_step": 10392, "epoch": 125} {"train_loss": -17.585262298583984, "global_step": 10393, "epoch": 125} {"train_loss": -17.55462074279785, "global_step": 10394, "epoch": 125} {"train_loss": -17.414209365844727, "global_step": 10395, "epoch": 125} {"train_loss": -17.670368194580078, "global_step": 10396, "epoch": 125} {"train_loss": -17.701459884643555, "global_step": 10397, "epoch": 125} {"train_loss": -17.231792449951172, "global_step": 10398, "epoch": 125} {"train_loss": -17.951507568359375, "global_step": 10399, "epoch": 125} {"train_loss": -17.903127670288086, "global_step": 10400, "epoch": 125} {"train_loss": -17.741214752197266, "global_step": 10401, "epoch": 125} {"train_loss": -17.91189956665039, "global_step": 10402, "epoch": 125} {"train_loss": -17.762414932250977, "global_step": 10403, "epoch": 125} {"train_loss": -17.704416275024414, "global_step": 10404, "epoch": 125} {"train_loss": -17.420562744140625, "global_step": 10405, "epoch": 125} {"train_loss": -17.884349822998047, "global_step": 10406, "epoch": 125} {"train_loss": -18.077104568481445, "global_step": 10407, "epoch": 125} {"train_loss": -17.810245513916016, "global_step": 10408, "epoch": 125} {"train_loss": -17.636865615844727, "global_step": 10409, "epoch": 125} {"train_loss": -17.744834899902344, "global_step": 10410, "epoch": 125} {"train_loss": -17.791582107543945, "global_step": 10411, "epoch": 125} {"train_loss": -17.683202743530273, "global_step": 10412, "epoch": 125} {"train_loss": -17.74180793762207, "global_step": 10413, "epoch": 125} {"train_loss": -17.909549713134766, "global_step": 10414, "epoch": 125} {"train_loss": -17.576919555664062, "global_step": 10415, "epoch": 125} {"train_loss": -17.709613800048828, "global_step": 10416, "epoch": 125} {"train_loss": -17.478240966796875, "global_step": 10417, "epoch": 125} {"train_loss": -17.6560115814209, "global_step": 10418, "epoch": 125} {"train_loss": -18.097000122070312, "global_step": 10419, "epoch": 125} {"train_loss": -17.635677337646484, "global_step": 10420, "epoch": 125} {"train_loss": -17.65351676940918, "global_step": 10421, "epoch": 125} {"train_loss": -17.63636589050293, "global_step": 10422, "epoch": 125} {"train_loss": -17.6412353515625, "global_step": 10423, "epoch": 125} {"train_loss": -17.811864852905273, "global_step": 10424, "epoch": 125} {"train_loss": -17.514392852783203, "global_step": 10425, "epoch": 125} {"train_loss": -17.778499603271484, "global_step": 10426, "epoch": 125} {"train_loss": -17.922597885131836, "global_step": 10427, "epoch": 125} {"train_loss": -17.882923126220703, "global_step": 10428, "epoch": 125} {"train_loss": -17.474374771118164, "global_step": 10429, "epoch": 125} {"train_loss": -18.098922729492188, "global_step": 10430, "epoch": 125} {"train_loss": -17.597070693969727, "global_step": 10431, "epoch": 125} {"train_loss": -17.739334106445312, "global_step": 10432, "epoch": 125} {"train_loss": -17.345827102661133, "global_step": 10433, "epoch": 125} {"train_loss": -17.813623428344727, "global_step": 10434, "epoch": 125} {"train_loss": -17.581083297729492, "global_step": 10435, "epoch": 125} {"train_loss": -17.457582473754883, "global_step": 10436, "epoch": 125} {"train_loss": -17.893573760986328, "global_step": 10437, "epoch": 125} {"train_loss": -17.848480224609375, "global_step": 10438, "epoch": 125} {"train_loss": -17.475048065185547, "global_step": 10439, "epoch": 125} {"train_loss": -17.77603530883789, "global_step": 10440, "epoch": 125} {"train_loss": -17.846593856811523, "global_step": 10441, "epoch": 125} {"train_loss": -17.373706817626953, "global_step": 10442, "epoch": 125} {"train_loss": -17.61037254333496, "global_step": 10443, "epoch": 125} {"train_loss": -17.638534545898438, "global_step": 10444, "epoch": 125} {"train_loss": -17.782567977905273, "global_step": 10445, "epoch": 125} {"train_loss": -17.607025146484375, "global_step": 10446, "epoch": 125} {"train_loss": -17.612245559692383, "global_step": 10447, "epoch": 125} {"train_loss": -17.369800567626953, "global_step": 10448, "epoch": 125} {"train_loss": -17.982221603393555, "global_step": 10449, "epoch": 125} {"train_loss": -18.080093383789062, "global_step": 10450, "epoch": 125} {"train_loss": -17.80220603942871, "global_step": 10451, "epoch": 125} {"train_loss": -17.63096809387207, "global_step": 10452, "epoch": 125} {"train_loss": -17.760086059570312, "global_step": 10453, "epoch": 125} {"train_loss": -17.53969955444336, "global_step": 10454, "epoch": 125} {"train_loss": -17.752470016479492, "global_step": 10455, "epoch": 125} {"train_loss": -17.75453758239746, "global_step": 10456, "epoch": 125} {"train_loss": -17.706156006778578, "global_step": 10457, "epoch": 125, "val_loss": 6826737.5} {"train_loss": -17.17397689819336, "global_step": 10458, "epoch": 126} {"train_loss": -17.43267059326172, "global_step": 10459, "epoch": 126} {"train_loss": -17.426977157592773, "global_step": 10460, "epoch": 126} {"train_loss": -17.75705337524414, "global_step": 10461, "epoch": 126} {"train_loss": -17.196887969970703, "global_step": 10462, "epoch": 126} {"train_loss": -17.535743713378906, "global_step": 10463, "epoch": 126} {"train_loss": -17.84139060974121, "global_step": 10464, "epoch": 126} {"train_loss": -17.46051597595215, "global_step": 10465, "epoch": 126} {"train_loss": -17.567026138305664, "global_step": 10466, "epoch": 126} {"train_loss": -17.353063583374023, "global_step": 10467, "epoch": 126} {"train_loss": -17.459653854370117, "global_step": 10468, "epoch": 126} {"train_loss": -17.416120529174805, "global_step": 10469, "epoch": 126} {"train_loss": -17.53273582458496, "global_step": 10470, "epoch": 126} {"train_loss": -17.40856170654297, "global_step": 10471, "epoch": 126} {"train_loss": -17.69921875, "global_step": 10472, "epoch": 126} {"train_loss": -17.1092472076416, "global_step": 10473, "epoch": 126} {"train_loss": -17.76373291015625, "global_step": 10474, "epoch": 126} {"train_loss": -17.623159408569336, "global_step": 10475, "epoch": 126} {"train_loss": -17.575729370117188, "global_step": 10476, "epoch": 126} {"train_loss": -17.654346466064453, "global_step": 10477, "epoch": 126} {"train_loss": -17.708606719970703, "global_step": 10478, "epoch": 126} {"train_loss": -17.66120147705078, "global_step": 10479, "epoch": 126} {"train_loss": -17.30389976501465, "global_step": 10480, "epoch": 126} {"train_loss": -17.634977340698242, "global_step": 10481, "epoch": 126} {"train_loss": -17.508275985717773, "global_step": 10482, "epoch": 126} {"train_loss": -17.424158096313477, "global_step": 10483, "epoch": 126} {"train_loss": -17.277700424194336, "global_step": 10484, "epoch": 126} {"train_loss": -17.601015090942383, "global_step": 10485, "epoch": 126} {"train_loss": -18.16120719909668, "global_step": 10486, "epoch": 126} {"train_loss": -17.607908248901367, "global_step": 10487, "epoch": 126} {"train_loss": -17.57159996032715, "global_step": 10488, "epoch": 126} {"train_loss": -17.74495506286621, "global_step": 10489, "epoch": 126} {"train_loss": -17.929475784301758, "global_step": 10490, "epoch": 126} {"train_loss": -17.905424118041992, "global_step": 10491, "epoch": 126} {"train_loss": -17.8640193939209, "global_step": 10492, "epoch": 126} {"train_loss": -17.88202476501465, "global_step": 10493, "epoch": 126} {"train_loss": -17.678762435913086, "global_step": 10494, "epoch": 126} {"train_loss": -17.902111053466797, "global_step": 10495, "epoch": 126} {"train_loss": -17.769824981689453, "global_step": 10496, "epoch": 126} {"train_loss": -17.91242027282715, "global_step": 10497, "epoch": 126} {"train_loss": -17.601816177368164, "global_step": 10498, "epoch": 126} {"train_loss": -17.38688087463379, "global_step": 10499, "epoch": 126} {"train_loss": -17.644800186157227, "global_step": 10500, "epoch": 126} {"train_loss": -17.903791427612305, "global_step": 10501, "epoch": 126} {"train_loss": -17.58548355102539, "global_step": 10502, "epoch": 126} {"train_loss": -17.952062606811523, "global_step": 10503, "epoch": 126} {"train_loss": -17.59637451171875, "global_step": 10504, "epoch": 126} {"train_loss": -17.405502319335938, "global_step": 10505, "epoch": 126} {"train_loss": -17.636417388916016, "global_step": 10506, "epoch": 126} {"train_loss": -17.851110458374023, "global_step": 10507, "epoch": 126} {"train_loss": -17.78458023071289, "global_step": 10508, "epoch": 126} {"train_loss": -17.634414672851562, "global_step": 10509, "epoch": 126} {"train_loss": -17.729331970214844, "global_step": 10510, "epoch": 126} {"train_loss": -17.61541175842285, "global_step": 10511, "epoch": 126} {"train_loss": -17.405868530273438, "global_step": 10512, "epoch": 126} {"train_loss": -17.79164695739746, "global_step": 10513, "epoch": 126} {"train_loss": -17.420761108398438, "global_step": 10514, "epoch": 126} {"train_loss": -17.5159854888916, "global_step": 10515, "epoch": 126} {"train_loss": -17.608692169189453, "global_step": 10516, "epoch": 126} {"train_loss": -17.4620418548584, "global_step": 10517, "epoch": 126} {"train_loss": -18.228422164916992, "global_step": 10518, "epoch": 126} {"train_loss": -17.662168502807617, "global_step": 10519, "epoch": 126} {"train_loss": -17.60613441467285, "global_step": 10520, "epoch": 126} {"train_loss": -17.678749084472656, "global_step": 10521, "epoch": 126} {"train_loss": -17.806678771972656, "global_step": 10522, "epoch": 126} {"train_loss": -17.684167861938477, "global_step": 10523, "epoch": 126} {"train_loss": -17.799551010131836, "global_step": 10524, "epoch": 126} {"train_loss": -17.718637466430664, "global_step": 10525, "epoch": 126} {"train_loss": -17.764610290527344, "global_step": 10526, "epoch": 126} {"train_loss": -17.580337524414062, "global_step": 10527, "epoch": 126} {"train_loss": -17.345876693725586, "global_step": 10528, "epoch": 126} {"train_loss": -17.626367568969727, "global_step": 10529, "epoch": 126} {"train_loss": -17.125303268432617, "global_step": 10530, "epoch": 126} {"train_loss": -17.506223678588867, "global_step": 10531, "epoch": 126} {"train_loss": -17.865022659301758, "global_step": 10532, "epoch": 126} {"train_loss": -17.726268768310547, "global_step": 10533, "epoch": 126} {"train_loss": -17.49526023864746, "global_step": 10534, "epoch": 126} {"train_loss": -17.297704696655273, "global_step": 10535, "epoch": 126} {"train_loss": -17.90068817138672, "global_step": 10536, "epoch": 126} {"train_loss": -17.787214279174805, "global_step": 10537, "epoch": 126} {"train_loss": -17.58001136779785, "global_step": 10538, "epoch": 126} {"train_loss": -17.655742645263672, "global_step": 10539, "epoch": 126} {"train_loss": -17.640432059046734, "global_step": 10540, "epoch": 126, "val_loss": 6176896.0} {"train_loss": -17.374404907226562, "global_step": 10541, "epoch": 127} {"train_loss": -17.755558013916016, "global_step": 10542, "epoch": 127} {"train_loss": -17.6474552154541, "global_step": 10543, "epoch": 127} {"train_loss": -17.880779266357422, "global_step": 10544, "epoch": 127} {"train_loss": -17.630441665649414, "global_step": 10545, "epoch": 127} {"train_loss": -17.383512496948242, "global_step": 10546, "epoch": 127} {"train_loss": -17.731788635253906, "global_step": 10547, "epoch": 127} {"train_loss": -17.658784866333008, "global_step": 10548, "epoch": 127} {"train_loss": -17.87282371520996, "global_step": 10549, "epoch": 127} {"train_loss": -17.8070011138916, "global_step": 10550, "epoch": 127} {"train_loss": -17.81019401550293, "global_step": 10551, "epoch": 127} {"train_loss": -17.975439071655273, "global_step": 10552, "epoch": 127} {"train_loss": -17.778121948242188, "global_step": 10553, "epoch": 127} {"train_loss": -17.454946517944336, "global_step": 10554, "epoch": 127} {"train_loss": -17.770191192626953, "global_step": 10555, "epoch": 127} {"train_loss": -17.721982955932617, "global_step": 10556, "epoch": 127} {"train_loss": -17.50948143005371, "global_step": 10557, "epoch": 127} {"train_loss": -17.857242584228516, "global_step": 10558, "epoch": 127} {"train_loss": -17.789663314819336, "global_step": 10559, "epoch": 127} {"train_loss": -17.752500534057617, "global_step": 10560, "epoch": 127} {"train_loss": -17.898897171020508, "global_step": 10561, "epoch": 127} {"train_loss": -17.668100357055664, "global_step": 10562, "epoch": 127} {"train_loss": -18.009458541870117, "global_step": 10563, "epoch": 127} {"train_loss": -17.546924591064453, "global_step": 10564, "epoch": 127} {"train_loss": -17.75298500061035, "global_step": 10565, "epoch": 127} {"train_loss": -17.731502532958984, "global_step": 10566, "epoch": 127} {"train_loss": -17.772855758666992, "global_step": 10567, "epoch": 127} {"train_loss": -17.44583511352539, "global_step": 10568, "epoch": 127} {"train_loss": -17.831872940063477, "global_step": 10569, "epoch": 127} {"train_loss": -17.78312110900879, "global_step": 10570, "epoch": 127} {"train_loss": -17.312036514282227, "global_step": 10571, "epoch": 127} {"train_loss": -17.33367156982422, "global_step": 10572, "epoch": 127} {"train_loss": -17.7253360748291, "global_step": 10573, "epoch": 127} {"train_loss": -17.596364974975586, "global_step": 10574, "epoch": 127} {"train_loss": -17.336933135986328, "global_step": 10575, "epoch": 127} {"train_loss": -17.817676544189453, "global_step": 10576, "epoch": 127} {"train_loss": -17.505783081054688, "global_step": 10577, "epoch": 127} {"train_loss": -17.622041702270508, "global_step": 10578, "epoch": 127} {"train_loss": -17.304929733276367, "global_step": 10579, "epoch": 127} {"train_loss": -17.274112701416016, "global_step": 10580, "epoch": 127} {"train_loss": -17.55977439880371, "global_step": 10581, "epoch": 127} {"train_loss": -17.821290969848633, "global_step": 10582, "epoch": 127} {"train_loss": -17.91761589050293, "global_step": 10583, "epoch": 127} {"train_loss": -17.65315818786621, "global_step": 10584, "epoch": 127} {"train_loss": -17.5848388671875, "global_step": 10585, "epoch": 127} {"train_loss": -17.653379440307617, "global_step": 10586, "epoch": 127} {"train_loss": -17.382856369018555, "global_step": 10587, "epoch": 127} {"train_loss": -17.608335494995117, "global_step": 10588, "epoch": 127} {"train_loss": -17.509048461914062, "global_step": 10589, "epoch": 127} {"train_loss": -17.40237045288086, "global_step": 10590, "epoch": 127} {"train_loss": -17.61521339416504, "global_step": 10591, "epoch": 127} {"train_loss": -17.408618927001953, "global_step": 10592, "epoch": 127} {"train_loss": -17.05739402770996, "global_step": 10593, "epoch": 127} {"train_loss": -17.88138771057129, "global_step": 10594, "epoch": 127} {"train_loss": -17.9472599029541, "global_step": 10595, "epoch": 127} {"train_loss": -17.500463485717773, "global_step": 10596, "epoch": 127} {"train_loss": -17.865453720092773, "global_step": 10597, "epoch": 127} {"train_loss": -17.603355407714844, "global_step": 10598, "epoch": 127} {"train_loss": -17.82162094116211, "global_step": 10599, "epoch": 127} {"train_loss": -17.918428421020508, "global_step": 10600, "epoch": 127} {"train_loss": -17.91412925720215, "global_step": 10601, "epoch": 127} {"train_loss": -17.497177124023438, "global_step": 10602, "epoch": 127} {"train_loss": -18.128759384155273, "global_step": 10603, "epoch": 127} {"train_loss": -17.372116088867188, "global_step": 10604, "epoch": 127} {"train_loss": -18.256546020507812, "global_step": 10605, "epoch": 127} {"train_loss": -17.688600540161133, "global_step": 10606, "epoch": 127} {"train_loss": -17.986042022705078, "global_step": 10607, "epoch": 127} {"train_loss": -17.418760299682617, "global_step": 10608, "epoch": 127} {"train_loss": -17.869169235229492, "global_step": 10609, "epoch": 127} {"train_loss": -17.294443130493164, "global_step": 10610, "epoch": 127} {"train_loss": -17.673633575439453, "global_step": 10611, "epoch": 127} {"train_loss": -17.844236373901367, "global_step": 10612, "epoch": 127} {"train_loss": -17.536205291748047, "global_step": 10613, "epoch": 127} {"train_loss": -17.931167602539062, "global_step": 10614, "epoch": 127} {"train_loss": -17.639781951904297, "global_step": 10615, "epoch": 127} {"train_loss": -17.803443908691406, "global_step": 10616, "epoch": 127} {"train_loss": -17.838254928588867, "global_step": 10617, "epoch": 127} {"train_loss": -17.940021514892578, "global_step": 10618, "epoch": 127} {"train_loss": -17.722455978393555, "global_step": 10619, "epoch": 127} {"train_loss": -18.144912719726562, "global_step": 10620, "epoch": 127} {"train_loss": -17.569318771362305, "global_step": 10621, "epoch": 127} {"train_loss": -17.769926071166992, "global_step": 10622, "epoch": 127} {"train_loss": -17.705201068556452, "global_step": 10623, "epoch": 127, "val_loss": 6166080.0} {"train_loss": -17.757917404174805, "global_step": 10624, "epoch": 128} {"train_loss": -17.807842254638672, "global_step": 10625, "epoch": 128} {"train_loss": -17.687524795532227, "global_step": 10626, "epoch": 128} {"train_loss": -18.198820114135742, "global_step": 10627, "epoch": 128} {"train_loss": -17.303531646728516, "global_step": 10628, "epoch": 128} {"train_loss": -17.365707397460938, "global_step": 10629, "epoch": 128} {"train_loss": -17.571125030517578, "global_step": 10630, "epoch": 128} {"train_loss": -17.789112091064453, "global_step": 10631, "epoch": 128} {"train_loss": -17.56247901916504, "global_step": 10632, "epoch": 128} {"train_loss": -17.312509536743164, "global_step": 10633, "epoch": 128} {"train_loss": -17.60555076599121, "global_step": 10634, "epoch": 128} {"train_loss": -17.453092575073242, "global_step": 10635, "epoch": 128} {"train_loss": -17.87422752380371, "global_step": 10636, "epoch": 128} {"train_loss": -17.665205001831055, "global_step": 10637, "epoch": 128} {"train_loss": -18.062036514282227, "global_step": 10638, "epoch": 128} {"train_loss": -17.60932731628418, "global_step": 10639, "epoch": 128} {"train_loss": -17.804950714111328, "global_step": 10640, "epoch": 128} {"train_loss": -17.430360794067383, "global_step": 10641, "epoch": 128} {"train_loss": -17.67305564880371, "global_step": 10642, "epoch": 128} {"train_loss": -17.897050857543945, "global_step": 10643, "epoch": 128} {"train_loss": -17.9720458984375, "global_step": 10644, "epoch": 128} {"train_loss": -18.166065216064453, "global_step": 10645, "epoch": 128} {"train_loss": -17.659212112426758, "global_step": 10646, "epoch": 128} {"train_loss": -17.512765884399414, "global_step": 10647, "epoch": 128} {"train_loss": -17.820575714111328, "global_step": 10648, "epoch": 128} {"train_loss": -17.648324966430664, "global_step": 10649, "epoch": 128} {"train_loss": -17.461267471313477, "global_step": 10650, "epoch": 128} {"train_loss": -17.673952102661133, "global_step": 10651, "epoch": 128} {"train_loss": -17.620086669921875, "global_step": 10652, "epoch": 128} {"train_loss": -18.004507064819336, "global_step": 10653, "epoch": 128} {"train_loss": -17.811246871948242, "global_step": 10654, "epoch": 128} {"train_loss": -17.620155334472656, "global_step": 10655, "epoch": 128} {"train_loss": -17.4953670501709, "global_step": 10656, "epoch": 128} {"train_loss": -17.666425704956055, "global_step": 10657, "epoch": 128} {"train_loss": -17.501819610595703, "global_step": 10658, "epoch": 128} {"train_loss": -17.020240783691406, "global_step": 10659, "epoch": 128} {"train_loss": -17.403295516967773, "global_step": 10660, "epoch": 128} {"train_loss": -17.450592041015625, "global_step": 10661, "epoch": 128} {"train_loss": -17.638092041015625, "global_step": 10662, "epoch": 128} {"train_loss": -17.25194549560547, "global_step": 10663, "epoch": 128} {"train_loss": -17.927383422851562, "global_step": 10664, "epoch": 128} {"train_loss": -17.775882720947266, "global_step": 10665, "epoch": 128} {"train_loss": -17.965076446533203, "global_step": 10666, "epoch": 128} {"train_loss": -17.992624282836914, "global_step": 10667, "epoch": 128} {"train_loss": -17.23784828186035, "global_step": 10668, "epoch": 128} {"train_loss": -17.451141357421875, "global_step": 10669, "epoch": 128} {"train_loss": -17.55201530456543, "global_step": 10670, "epoch": 128} {"train_loss": -17.374937057495117, "global_step": 10671, "epoch": 128} {"train_loss": -17.4083309173584, "global_step": 10672, "epoch": 128} {"train_loss": -17.643814086914062, "global_step": 10673, "epoch": 128} {"train_loss": -17.493738174438477, "global_step": 10674, "epoch": 128} {"train_loss": -17.852827072143555, "global_step": 10675, "epoch": 128} {"train_loss": -17.743085861206055, "global_step": 10676, "epoch": 128} {"train_loss": -17.774633407592773, "global_step": 10677, "epoch": 128} {"train_loss": -17.918981552124023, "global_step": 10678, "epoch": 128} {"train_loss": -18.204593658447266, "global_step": 10679, "epoch": 128} {"train_loss": -17.643753051757812, "global_step": 10680, "epoch": 128} {"train_loss": -17.868209838867188, "global_step": 10681, "epoch": 128} {"train_loss": -18.040014266967773, "global_step": 10682, "epoch": 128} {"train_loss": -17.512985229492188, "global_step": 10683, "epoch": 128} {"train_loss": -18.042133331298828, "global_step": 10684, "epoch": 128} {"train_loss": -17.544940948486328, "global_step": 10685, "epoch": 128} {"train_loss": -17.65582847595215, "global_step": 10686, "epoch": 128} {"train_loss": -17.902786254882812, "global_step": 10687, "epoch": 128} {"train_loss": -17.6396427154541, "global_step": 10688, "epoch": 128} {"train_loss": -17.581405639648438, "global_step": 10689, "epoch": 128} {"train_loss": -17.824892044067383, "global_step": 10690, "epoch": 128} {"train_loss": -17.52448272705078, "global_step": 10691, "epoch": 128} {"train_loss": -17.56195068359375, "global_step": 10692, "epoch": 128} {"train_loss": -18.0375919342041, "global_step": 10693, "epoch": 128} {"train_loss": -17.536344528198242, "global_step": 10694, "epoch": 128} {"train_loss": -17.293685913085938, "global_step": 10695, "epoch": 128} {"train_loss": -18.23638343811035, "global_step": 10696, "epoch": 128} {"train_loss": -17.59868812561035, "global_step": 10697, "epoch": 128} {"train_loss": -17.895429611206055, "global_step": 10698, "epoch": 128} {"train_loss": -18.008630752563477, "global_step": 10699, "epoch": 128} {"train_loss": -17.702442169189453, "global_step": 10700, "epoch": 128} {"train_loss": -17.95466423034668, "global_step": 10701, "epoch": 128} {"train_loss": -17.676761627197266, "global_step": 10702, "epoch": 128} {"train_loss": -17.450153350830078, "global_step": 10703, "epoch": 128} {"train_loss": -17.356103897094727, "global_step": 10704, "epoch": 128} {"train_loss": -17.708972930908203, "global_step": 10705, "epoch": 128} {"train_loss": -17.658184063003723, "global_step": 10706, "epoch": 128, "val_loss": 6364039.0} {"train_loss": -17.1220760345459, "global_step": 10707, "epoch": 129} {"train_loss": -17.6675968170166, "global_step": 10708, "epoch": 129} {"train_loss": -17.279294967651367, "global_step": 10709, "epoch": 129} {"train_loss": -17.225828170776367, "global_step": 10710, "epoch": 129} {"train_loss": -17.497425079345703, "global_step": 10711, "epoch": 129} {"train_loss": -17.416831970214844, "global_step": 10712, "epoch": 129} {"train_loss": -17.7825984954834, "global_step": 10713, "epoch": 129} {"train_loss": -17.8132266998291, "global_step": 10714, "epoch": 129} {"train_loss": -17.396390914916992, "global_step": 10715, "epoch": 129} {"train_loss": -17.111717224121094, "global_step": 10716, "epoch": 129} {"train_loss": -17.487186431884766, "global_step": 10717, "epoch": 129} {"train_loss": -17.563459396362305, "global_step": 10718, "epoch": 129} {"train_loss": -17.90553092956543, "global_step": 10719, "epoch": 129} {"train_loss": -18.065692901611328, "global_step": 10720, "epoch": 129} {"train_loss": -17.692941665649414, "global_step": 10721, "epoch": 129} {"train_loss": -17.898229598999023, "global_step": 10722, "epoch": 129} {"train_loss": -17.364519119262695, "global_step": 10723, "epoch": 129} {"train_loss": -17.81009292602539, "global_step": 10724, "epoch": 129} {"train_loss": -17.851028442382812, "global_step": 10725, "epoch": 129} {"train_loss": -17.57686424255371, "global_step": 10726, "epoch": 129} {"train_loss": -17.78846549987793, "global_step": 10727, "epoch": 129} {"train_loss": -18.00592803955078, "global_step": 10728, "epoch": 129} {"train_loss": -17.665939331054688, "global_step": 10729, "epoch": 129} {"train_loss": -17.894132614135742, "global_step": 10730, "epoch": 129} {"train_loss": -17.26285743713379, "global_step": 10731, "epoch": 129} {"train_loss": -17.46089744567871, "global_step": 10732, "epoch": 129} {"train_loss": -17.958948135375977, "global_step": 10733, "epoch": 129} {"train_loss": -17.141294479370117, "global_step": 10734, "epoch": 129} {"train_loss": -17.8145809173584, "global_step": 10735, "epoch": 129} {"train_loss": -17.958126068115234, "global_step": 10736, "epoch": 129} {"train_loss": -17.589048385620117, "global_step": 10737, "epoch": 129} {"train_loss": -18.16274642944336, "global_step": 10738, "epoch": 129} {"train_loss": -17.57939338684082, "global_step": 10739, "epoch": 129} {"train_loss": -17.952085494995117, "global_step": 10740, "epoch": 129} {"train_loss": -17.92713165283203, "global_step": 10741, "epoch": 129} {"train_loss": -17.389596939086914, "global_step": 10742, "epoch": 129} {"train_loss": -18.02925682067871, "global_step": 10743, "epoch": 129} {"train_loss": -18.035974502563477, "global_step": 10744, "epoch": 129} {"train_loss": -17.49232292175293, "global_step": 10745, "epoch": 129} {"train_loss": -18.03546142578125, "global_step": 10746, "epoch": 129} {"train_loss": -17.79277801513672, "global_step": 10747, "epoch": 129} {"train_loss": -17.531911849975586, "global_step": 10748, "epoch": 129} {"train_loss": -17.885530471801758, "global_step": 10749, "epoch": 129} {"train_loss": -17.21309471130371, "global_step": 10750, "epoch": 129} {"train_loss": -17.512218475341797, "global_step": 10751, "epoch": 129} {"train_loss": -17.694753646850586, "global_step": 10752, "epoch": 129} {"train_loss": -17.9594783782959, "global_step": 10753, "epoch": 129} {"train_loss": -17.493070602416992, "global_step": 10754, "epoch": 129} {"train_loss": -18.025951385498047, "global_step": 10755, "epoch": 129} {"train_loss": -17.585533142089844, "global_step": 10756, "epoch": 129} {"train_loss": -17.940031051635742, "global_step": 10757, "epoch": 129} {"train_loss": -17.764036178588867, "global_step": 10758, "epoch": 129} {"train_loss": -17.872831344604492, "global_step": 10759, "epoch": 129} {"train_loss": -17.175628662109375, "global_step": 10760, "epoch": 129} {"train_loss": -17.520933151245117, "global_step": 10761, "epoch": 129} {"train_loss": -17.94927978515625, "global_step": 10762, "epoch": 129} {"train_loss": -17.951650619506836, "global_step": 10763, "epoch": 129} {"train_loss": -17.529006958007812, "global_step": 10764, "epoch": 129} {"train_loss": -17.414968490600586, "global_step": 10765, "epoch": 129} {"train_loss": -17.7974796295166, "global_step": 10766, "epoch": 129} {"train_loss": -17.958772659301758, "global_step": 10767, "epoch": 129} {"train_loss": -17.592092514038086, "global_step": 10768, "epoch": 129} {"train_loss": -17.851322174072266, "global_step": 10769, "epoch": 129} {"train_loss": -17.881824493408203, "global_step": 10770, "epoch": 129} {"train_loss": -17.87898063659668, "global_step": 10771, "epoch": 129} {"train_loss": -17.976293563842773, "global_step": 10772, "epoch": 129} {"train_loss": -17.73225975036621, "global_step": 10773, "epoch": 129} {"train_loss": -17.698307037353516, "global_step": 10774, "epoch": 129} {"train_loss": -17.98347282409668, "global_step": 10775, "epoch": 129} {"train_loss": -17.84419059753418, "global_step": 10776, "epoch": 129} {"train_loss": -17.72391128540039, "global_step": 10777, "epoch": 129} {"train_loss": -17.67865753173828, "global_step": 10778, "epoch": 129} {"train_loss": -17.522611618041992, "global_step": 10779, "epoch": 129} {"train_loss": -17.862777709960938, "global_step": 10780, "epoch": 129} {"train_loss": -17.762428283691406, "global_step": 10781, "epoch": 129} {"train_loss": -17.554197311401367, "global_step": 10782, "epoch": 129} {"train_loss": -17.645706176757812, "global_step": 10783, "epoch": 129} {"train_loss": -18.379207611083984, "global_step": 10784, "epoch": 129} {"train_loss": -17.401132583618164, "global_step": 10785, "epoch": 129} {"train_loss": -17.878347396850586, "global_step": 10786, "epoch": 129} {"train_loss": -17.425643920898438, "global_step": 10787, "epoch": 129} {"train_loss": -17.52349281311035, "global_step": 10788, "epoch": 129} {"train_loss": -17.694262630968208, "global_step": 10789, "epoch": 129, "val_loss": 6253937.5} {"train_loss": -17.421743392944336, "global_step": 10790, "epoch": 130} {"train_loss": -17.810361862182617, "global_step": 10791, "epoch": 130} {"train_loss": -16.887022018432617, "global_step": 10792, "epoch": 130} {"train_loss": -17.32667350769043, "global_step": 10793, "epoch": 130} {"train_loss": -17.428218841552734, "global_step": 10794, "epoch": 130} {"train_loss": -17.80830955505371, "global_step": 10795, "epoch": 130} {"train_loss": -17.778091430664062, "global_step": 10796, "epoch": 130} {"train_loss": -17.457937240600586, "global_step": 10797, "epoch": 130} {"train_loss": -17.444604873657227, "global_step": 10798, "epoch": 130} {"train_loss": -17.912073135375977, "global_step": 10799, "epoch": 130} {"train_loss": -17.94776725769043, "global_step": 10800, "epoch": 130} {"train_loss": -17.82062339782715, "global_step": 10801, "epoch": 130} {"train_loss": -17.631357192993164, "global_step": 10802, "epoch": 130} {"train_loss": -17.633893966674805, "global_step": 10803, "epoch": 130} {"train_loss": -17.728429794311523, "global_step": 10804, "epoch": 130} {"train_loss": -17.932058334350586, "global_step": 10805, "epoch": 130} {"train_loss": -17.324874877929688, "global_step": 10806, "epoch": 130} {"train_loss": -17.425004959106445, "global_step": 10807, "epoch": 130} {"train_loss": -18.066076278686523, "global_step": 10808, "epoch": 130} {"train_loss": -17.785322189331055, "global_step": 10809, "epoch": 130} {"train_loss": -17.795385360717773, "global_step": 10810, "epoch": 130} {"train_loss": -17.835508346557617, "global_step": 10811, "epoch": 130} {"train_loss": -17.518814086914062, "global_step": 10812, "epoch": 130} {"train_loss": -17.464420318603516, "global_step": 10813, "epoch": 130} {"train_loss": -17.61676597595215, "global_step": 10814, "epoch": 130} {"train_loss": -17.831022262573242, "global_step": 10815, "epoch": 130} {"train_loss": -17.484439849853516, "global_step": 10816, "epoch": 130} {"train_loss": -17.81613540649414, "global_step": 10817, "epoch": 130} {"train_loss": -17.8491268157959, "global_step": 10818, "epoch": 130} {"train_loss": -18.219968795776367, "global_step": 10819, "epoch": 130} {"train_loss": -17.573698043823242, "global_step": 10820, "epoch": 130} {"train_loss": -17.50983238220215, "global_step": 10821, "epoch": 130} {"train_loss": -17.878591537475586, "global_step": 10822, "epoch": 130} {"train_loss": -17.61445426940918, "global_step": 10823, "epoch": 130} {"train_loss": -17.486310958862305, "global_step": 10824, "epoch": 130} {"train_loss": -17.9263916015625, "global_step": 10825, "epoch": 130} {"train_loss": -17.566232681274414, "global_step": 10826, "epoch": 130} {"train_loss": -17.665311813354492, "global_step": 10827, "epoch": 130} {"train_loss": -17.62022590637207, "global_step": 10828, "epoch": 130} {"train_loss": -17.605894088745117, "global_step": 10829, "epoch": 130} {"train_loss": -17.81772804260254, "global_step": 10830, "epoch": 130} {"train_loss": -17.59708023071289, "global_step": 10831, "epoch": 130} {"train_loss": -17.480043411254883, "global_step": 10832, "epoch": 130} {"train_loss": -17.46754264831543, "global_step": 10833, "epoch": 130} {"train_loss": -17.93535804748535, "global_step": 10834, "epoch": 130} {"train_loss": -17.846195220947266, "global_step": 10835, "epoch": 130} {"train_loss": -18.189008712768555, "global_step": 10836, "epoch": 130} {"train_loss": -17.478761672973633, "global_step": 10837, "epoch": 130} {"train_loss": -17.626192092895508, "global_step": 10838, "epoch": 130} {"train_loss": -17.7777042388916, "global_step": 10839, "epoch": 130} {"train_loss": -17.8466739654541, "global_step": 10840, "epoch": 130} {"train_loss": -17.738826751708984, "global_step": 10841, "epoch": 130} {"train_loss": -17.690738677978516, "global_step": 10842, "epoch": 130} {"train_loss": -17.73377799987793, "global_step": 10843, "epoch": 130} {"train_loss": -17.468246459960938, "global_step": 10844, "epoch": 130} {"train_loss": -17.77943229675293, "global_step": 10845, "epoch": 130} {"train_loss": -17.825504302978516, "global_step": 10846, "epoch": 130} {"train_loss": -18.12493324279785, "global_step": 10847, "epoch": 130} {"train_loss": -17.737838745117188, "global_step": 10848, "epoch": 130} {"train_loss": -18.149377822875977, "global_step": 10849, "epoch": 130} {"train_loss": -18.150653839111328, "global_step": 10850, "epoch": 130} {"train_loss": -17.80417251586914, "global_step": 10851, "epoch": 130} {"train_loss": -17.75701904296875, "global_step": 10852, "epoch": 130} {"train_loss": -17.794912338256836, "global_step": 10853, "epoch": 130} {"train_loss": -18.119407653808594, "global_step": 10854, "epoch": 130} {"train_loss": -18.065677642822266, "global_step": 10855, "epoch": 130} {"train_loss": -17.585468292236328, "global_step": 10856, "epoch": 130} {"train_loss": -17.622039794921875, "global_step": 10857, "epoch": 130} {"train_loss": -17.854408264160156, "global_step": 10858, "epoch": 130} {"train_loss": -17.92426872253418, "global_step": 10859, "epoch": 130} {"train_loss": -17.56239128112793, "global_step": 10860, "epoch": 130} {"train_loss": -18.09218406677246, "global_step": 10861, "epoch": 130} {"train_loss": -17.89362335205078, "global_step": 10862, "epoch": 130} {"train_loss": -17.776138305664062, "global_step": 10863, "epoch": 130} {"train_loss": -17.581253051757812, "global_step": 10864, "epoch": 130} {"train_loss": -17.566007614135742, "global_step": 10865, "epoch": 130} {"train_loss": -17.78717613220215, "global_step": 10866, "epoch": 130} {"train_loss": -17.910390853881836, "global_step": 10867, "epoch": 130} {"train_loss": -17.82684898376465, "global_step": 10868, "epoch": 130} {"train_loss": -17.511316299438477, "global_step": 10869, "epoch": 130} {"train_loss": -17.76027488708496, "global_step": 10870, "epoch": 130} {"train_loss": -17.715665817260742, "global_step": 10871, "epoch": 130} {"train_loss": -17.723829085568347, "global_step": 10872, "epoch": 130, "val_loss": 6238479.5} {"train_loss": -17.336444854736328, "global_step": 10873, "epoch": 131} {"train_loss": -17.725427627563477, "global_step": 10874, "epoch": 131} {"train_loss": -17.692419052124023, "global_step": 10875, "epoch": 131} {"train_loss": -17.737733840942383, "global_step": 10876, "epoch": 131} {"train_loss": -17.533655166625977, "global_step": 10877, "epoch": 131} {"train_loss": -17.7906436920166, "global_step": 10878, "epoch": 131} {"train_loss": -17.71097183227539, "global_step": 10879, "epoch": 131} {"train_loss": -17.56791114807129, "global_step": 10880, "epoch": 131} {"train_loss": -17.66279411315918, "global_step": 10881, "epoch": 131} {"train_loss": -17.111587524414062, "global_step": 10882, "epoch": 131} {"train_loss": -17.60763168334961, "global_step": 10883, "epoch": 131} {"train_loss": -17.965681076049805, "global_step": 10884, "epoch": 131} {"train_loss": -18.06388282775879, "global_step": 10885, "epoch": 131} {"train_loss": -17.371511459350586, "global_step": 10886, "epoch": 131} {"train_loss": -17.384145736694336, "global_step": 10887, "epoch": 131} {"train_loss": -17.556272506713867, "global_step": 10888, "epoch": 131} {"train_loss": -17.58698844909668, "global_step": 10889, "epoch": 131} {"train_loss": -17.66035270690918, "global_step": 10890, "epoch": 131} {"train_loss": -17.5134334564209, "global_step": 10891, "epoch": 131} {"train_loss": -17.430326461791992, "global_step": 10892, "epoch": 131} {"train_loss": -17.96559715270996, "global_step": 10893, "epoch": 131} {"train_loss": -17.192106246948242, "global_step": 10894, "epoch": 131} {"train_loss": -17.355924606323242, "global_step": 10895, "epoch": 131} {"train_loss": -17.599828720092773, "global_step": 10896, "epoch": 131} {"train_loss": -17.58306121826172, "global_step": 10897, "epoch": 131} {"train_loss": -17.673236846923828, "global_step": 10898, "epoch": 131} {"train_loss": -17.722806930541992, "global_step": 10899, "epoch": 131} {"train_loss": -17.562894821166992, "global_step": 10900, "epoch": 131} {"train_loss": -17.78944206237793, "global_step": 10901, "epoch": 131} {"train_loss": -17.461639404296875, "global_step": 10902, "epoch": 131} {"train_loss": -17.91995620727539, "global_step": 10903, "epoch": 131} {"train_loss": -18.21259880065918, "global_step": 10904, "epoch": 131} {"train_loss": -17.671175003051758, "global_step": 10905, "epoch": 131} {"train_loss": -18.002065658569336, "global_step": 10906, "epoch": 131} {"train_loss": -17.8503360748291, "global_step": 10907, "epoch": 131} {"train_loss": -17.486478805541992, "global_step": 10908, "epoch": 131} {"train_loss": -17.631446838378906, "global_step": 10909, "epoch": 131} {"train_loss": -17.700855255126953, "global_step": 10910, "epoch": 131} {"train_loss": -17.71046257019043, "global_step": 10911, "epoch": 131} {"train_loss": -17.49538230895996, "global_step": 10912, "epoch": 131} {"train_loss": -17.853256225585938, "global_step": 10913, "epoch": 131} {"train_loss": -17.20700454711914, "global_step": 10914, "epoch": 131} {"train_loss": -17.552444458007812, "global_step": 10915, "epoch": 131} {"train_loss": -17.48650550842285, "global_step": 10916, "epoch": 131} {"train_loss": -17.748571395874023, "global_step": 10917, "epoch": 131} {"train_loss": -17.94453239440918, "global_step": 10918, "epoch": 131} {"train_loss": -17.7032413482666, "global_step": 10919, "epoch": 131} {"train_loss": -17.6409969329834, "global_step": 10920, "epoch": 131} {"train_loss": -17.71062660217285, "global_step": 10921, "epoch": 131} {"train_loss": -17.622648239135742, "global_step": 10922, "epoch": 131} {"train_loss": -17.883697509765625, "global_step": 10923, "epoch": 131} {"train_loss": -17.532255172729492, "global_step": 10924, "epoch": 131} {"train_loss": -17.816312789916992, "global_step": 10925, "epoch": 131} {"train_loss": -17.670867919921875, "global_step": 10926, "epoch": 131} {"train_loss": -17.86745834350586, "global_step": 10927, "epoch": 131} {"train_loss": -17.76084327697754, "global_step": 10928, "epoch": 131} {"train_loss": -17.668941497802734, "global_step": 10929, "epoch": 131} {"train_loss": -17.96578598022461, "global_step": 10930, "epoch": 131} {"train_loss": -17.29401206970215, "global_step": 10931, "epoch": 131} {"train_loss": -17.83602523803711, "global_step": 10932, "epoch": 131} {"train_loss": -17.865081787109375, "global_step": 10933, "epoch": 131} {"train_loss": -17.749649047851562, "global_step": 10934, "epoch": 131} {"train_loss": -17.89649772644043, "global_step": 10935, "epoch": 131} {"train_loss": -17.504545211791992, "global_step": 10936, "epoch": 131} {"train_loss": -18.138280868530273, "global_step": 10937, "epoch": 131} {"train_loss": -17.776975631713867, "global_step": 10938, "epoch": 131} {"train_loss": -17.681699752807617, "global_step": 10939, "epoch": 131} {"train_loss": -17.579059600830078, "global_step": 10940, "epoch": 131} {"train_loss": -17.957775115966797, "global_step": 10941, "epoch": 131} {"train_loss": -17.23744773864746, "global_step": 10942, "epoch": 131} {"train_loss": -18.388402938842773, "global_step": 10943, "epoch": 131} {"train_loss": -17.845809936523438, "global_step": 10944, "epoch": 131} {"train_loss": -17.760339736938477, "global_step": 10945, "epoch": 131} {"train_loss": -17.825647354125977, "global_step": 10946, "epoch": 131} {"train_loss": -17.964811325073242, "global_step": 10947, "epoch": 131} {"train_loss": -17.665739059448242, "global_step": 10948, "epoch": 131} {"train_loss": -17.927824020385742, "global_step": 10949, "epoch": 131} {"train_loss": -18.164264678955078, "global_step": 10950, "epoch": 131} {"train_loss": -17.7677001953125, "global_step": 10951, "epoch": 131} {"train_loss": -17.5495548248291, "global_step": 10952, "epoch": 131} {"train_loss": -17.814287185668945, "global_step": 10953, "epoch": 131} {"train_loss": -17.604419708251953, "global_step": 10954, "epoch": 131} {"train_loss": -17.6967859383089, "global_step": 10955, "epoch": 131, "val_loss": 6188834.0} {"train_loss": -17.579761505126953, "global_step": 10956, "epoch": 132} {"train_loss": -18.021310806274414, "global_step": 10957, "epoch": 132} {"train_loss": -17.558074951171875, "global_step": 10958, "epoch": 132} {"train_loss": -18.237686157226562, "global_step": 10959, "epoch": 132} {"train_loss": -17.656251907348633, "global_step": 10960, "epoch": 132} {"train_loss": -17.619226455688477, "global_step": 10961, "epoch": 132} {"train_loss": -17.78379249572754, "global_step": 10962, "epoch": 132} {"train_loss": -17.789188385009766, "global_step": 10963, "epoch": 132} {"train_loss": -17.43401527404785, "global_step": 10964, "epoch": 132} {"train_loss": -17.9547061920166, "global_step": 10965, "epoch": 132} {"train_loss": -17.608694076538086, "global_step": 10966, "epoch": 132} {"train_loss": -18.00766944885254, "global_step": 10967, "epoch": 132} {"train_loss": -17.859251022338867, "global_step": 10968, "epoch": 132} {"train_loss": -17.75652503967285, "global_step": 10969, "epoch": 132} {"train_loss": -17.520450592041016, "global_step": 10970, "epoch": 132} {"train_loss": -17.899581909179688, "global_step": 10971, "epoch": 132} {"train_loss": -17.790876388549805, "global_step": 10972, "epoch": 132} {"train_loss": -17.50328254699707, "global_step": 10973, "epoch": 132} {"train_loss": -18.0793399810791, "global_step": 10974, "epoch": 132} {"train_loss": -18.02277946472168, "global_step": 10975, "epoch": 132} {"train_loss": -17.829635620117188, "global_step": 10976, "epoch": 132} {"train_loss": -17.768659591674805, "global_step": 10977, "epoch": 132} {"train_loss": -17.741832733154297, "global_step": 10978, "epoch": 132} {"train_loss": -17.986743927001953, "global_step": 10979, "epoch": 132} {"train_loss": -17.59200096130371, "global_step": 10980, "epoch": 132} {"train_loss": -17.538665771484375, "global_step": 10981, "epoch": 132} {"train_loss": -17.29168128967285, "global_step": 10982, "epoch": 132} {"train_loss": -17.948667526245117, "global_step": 10983, "epoch": 132} {"train_loss": -17.911739349365234, "global_step": 10984, "epoch": 132} {"train_loss": -17.486736297607422, "global_step": 10985, "epoch": 132} {"train_loss": -17.3300838470459, "global_step": 10986, "epoch": 132} {"train_loss": -17.88056755065918, "global_step": 10987, "epoch": 132} {"train_loss": -17.816654205322266, "global_step": 10988, "epoch": 132} {"train_loss": -18.0920352935791, "global_step": 10989, "epoch": 132} {"train_loss": -17.41718101501465, "global_step": 10990, "epoch": 132} {"train_loss": -17.92542266845703, "global_step": 10991, "epoch": 132} {"train_loss": -17.95952796936035, "global_step": 10992, "epoch": 132} {"train_loss": -17.690628051757812, "global_step": 10993, "epoch": 132} {"train_loss": -17.67068099975586, "global_step": 10994, "epoch": 132} {"train_loss": -17.801166534423828, "global_step": 10995, "epoch": 132} {"train_loss": -17.559173583984375, "global_step": 10996, "epoch": 132} {"train_loss": -18.00618553161621, "global_step": 10997, "epoch": 132} {"train_loss": -17.757099151611328, "global_step": 10998, "epoch": 132} {"train_loss": -18.12289810180664, "global_step": 10999, "epoch": 132} {"train_loss": -17.77167320251465, "global_step": 11000, "epoch": 132} {"train_loss": -17.402563095092773, "global_step": 11001, "epoch": 132} {"train_loss": -17.228681564331055, "global_step": 11002, "epoch": 132} {"train_loss": -17.711278915405273, "global_step": 11003, "epoch": 132} {"train_loss": -18.033267974853516, "global_step": 11004, "epoch": 132} {"train_loss": -17.654848098754883, "global_step": 11005, "epoch": 132} {"train_loss": -18.178709030151367, "global_step": 11006, "epoch": 132} {"train_loss": -17.723880767822266, "global_step": 11007, "epoch": 132} {"train_loss": -17.73992919921875, "global_step": 11008, "epoch": 132} {"train_loss": -17.523334503173828, "global_step": 11009, "epoch": 132} {"train_loss": -17.819799423217773, "global_step": 11010, "epoch": 132} {"train_loss": -17.617935180664062, "global_step": 11011, "epoch": 132} {"train_loss": -17.665634155273438, "global_step": 11012, "epoch": 132} {"train_loss": -17.29361343383789, "global_step": 11013, "epoch": 132} {"train_loss": -17.88480567932129, "global_step": 11014, "epoch": 132} {"train_loss": -17.696317672729492, "global_step": 11015, "epoch": 132} {"train_loss": -18.01210594177246, "global_step": 11016, "epoch": 132} {"train_loss": -18.08566665649414, "global_step": 11017, "epoch": 132} {"train_loss": -17.28635597229004, "global_step": 11018, "epoch": 132} {"train_loss": -17.818374633789062, "global_step": 11019, "epoch": 132} {"train_loss": -17.671049118041992, "global_step": 11020, "epoch": 132} {"train_loss": -17.811681747436523, "global_step": 11021, "epoch": 132} {"train_loss": -17.488008499145508, "global_step": 11022, "epoch": 132} {"train_loss": -18.333471298217773, "global_step": 11023, "epoch": 132} {"train_loss": -18.064224243164062, "global_step": 11024, "epoch": 132} {"train_loss": -17.652883529663086, "global_step": 11025, "epoch": 132} {"train_loss": -17.925905227661133, "global_step": 11026, "epoch": 132} {"train_loss": -17.51045799255371, "global_step": 11027, "epoch": 132} {"train_loss": -17.862136840820312, "global_step": 11028, "epoch": 132} {"train_loss": -17.656721115112305, "global_step": 11029, "epoch": 132} {"train_loss": -17.816646575927734, "global_step": 11030, "epoch": 132} {"train_loss": -17.858047485351562, "global_step": 11031, "epoch": 132} {"train_loss": -17.474227905273438, "global_step": 11032, "epoch": 132} {"train_loss": -17.503137588500977, "global_step": 11033, "epoch": 132} {"train_loss": -17.928970336914062, "global_step": 11034, "epoch": 132} {"train_loss": -17.56159019470215, "global_step": 11035, "epoch": 132} {"train_loss": -18.07862663269043, "global_step": 11036, "epoch": 132} {"train_loss": -17.82270050048828, "global_step": 11037, "epoch": 132} {"train_loss": -17.768479703420617, "global_step": 11038, "epoch": 132, "val_loss": 6197439.5} {"train_loss": -17.61280632019043, "global_step": 11039, "epoch": 133} {"train_loss": -18.10309600830078, "global_step": 11040, "epoch": 133} {"train_loss": -17.37479019165039, "global_step": 11041, "epoch": 133} {"train_loss": -18.037328720092773, "global_step": 11042, "epoch": 133} {"train_loss": -17.611557006835938, "global_step": 11043, "epoch": 133} {"train_loss": -17.560791015625, "global_step": 11044, "epoch": 133} {"train_loss": -17.40537452697754, "global_step": 11045, "epoch": 133} {"train_loss": -17.622711181640625, "global_step": 11046, "epoch": 133} {"train_loss": -17.539260864257812, "global_step": 11047, "epoch": 133} {"train_loss": -17.491106033325195, "global_step": 11048, "epoch": 133} {"train_loss": -17.727441787719727, "global_step": 11049, "epoch": 133} {"train_loss": -17.675155639648438, "global_step": 11050, "epoch": 133} {"train_loss": -18.119009017944336, "global_step": 11051, "epoch": 133} {"train_loss": -17.58998680114746, "global_step": 11052, "epoch": 133} {"train_loss": -17.507484436035156, "global_step": 11053, "epoch": 133} {"train_loss": -18.036481857299805, "global_step": 11054, "epoch": 133} {"train_loss": -17.745059967041016, "global_step": 11055, "epoch": 133} {"train_loss": -17.49083709716797, "global_step": 11056, "epoch": 133} {"train_loss": -17.794137954711914, "global_step": 11057, "epoch": 133} {"train_loss": -17.99028778076172, "global_step": 11058, "epoch": 133} {"train_loss": -17.975553512573242, "global_step": 11059, "epoch": 133} {"train_loss": -17.92049217224121, "global_step": 11060, "epoch": 133} {"train_loss": -17.587926864624023, "global_step": 11061, "epoch": 133} {"train_loss": -17.817901611328125, "global_step": 11062, "epoch": 133} {"train_loss": -17.557849884033203, "global_step": 11063, "epoch": 133} {"train_loss": -17.855703353881836, "global_step": 11064, "epoch": 133} {"train_loss": -18.00314712524414, "global_step": 11065, "epoch": 133} {"train_loss": -18.053091049194336, "global_step": 11066, "epoch": 133} {"train_loss": -17.37945556640625, "global_step": 11067, "epoch": 133} {"train_loss": -17.8990535736084, "global_step": 11068, "epoch": 133} {"train_loss": -17.827939987182617, "global_step": 11069, "epoch": 133} {"train_loss": -17.893491744995117, "global_step": 11070, "epoch": 133} {"train_loss": -17.470457077026367, "global_step": 11071, "epoch": 133} {"train_loss": -17.549158096313477, "global_step": 11072, "epoch": 133} {"train_loss": -18.13167953491211, "global_step": 11073, "epoch": 133} {"train_loss": -17.599172592163086, "global_step": 11074, "epoch": 133} {"train_loss": -18.021326065063477, "global_step": 11075, "epoch": 133} {"train_loss": -18.075681686401367, "global_step": 11076, "epoch": 133} {"train_loss": -17.697477340698242, "global_step": 11077, "epoch": 133} {"train_loss": -17.894062042236328, "global_step": 11078, "epoch": 133} {"train_loss": -17.218358993530273, "global_step": 11079, "epoch": 133} {"train_loss": -17.771629333496094, "global_step": 11080, "epoch": 133} {"train_loss": -17.64967155456543, "global_step": 11081, "epoch": 133} {"train_loss": -18.131628036499023, "global_step": 11082, "epoch": 133} {"train_loss": -18.2022705078125, "global_step": 11083, "epoch": 133} {"train_loss": -17.81441879272461, "global_step": 11084, "epoch": 133} {"train_loss": -17.95418357849121, "global_step": 11085, "epoch": 133} {"train_loss": -17.70808219909668, "global_step": 11086, "epoch": 133} {"train_loss": -18.17852210998535, "global_step": 11087, "epoch": 133} {"train_loss": -17.424497604370117, "global_step": 11088, "epoch": 133} {"train_loss": -18.0590763092041, "global_step": 11089, "epoch": 133} {"train_loss": -17.816869735717773, "global_step": 11090, "epoch": 133} {"train_loss": -18.1602840423584, "global_step": 11091, "epoch": 133} {"train_loss": -17.718320846557617, "global_step": 11092, "epoch": 133} {"train_loss": -18.223886489868164, "global_step": 11093, "epoch": 133} {"train_loss": -17.7396183013916, "global_step": 11094, "epoch": 133} {"train_loss": -17.85076904296875, "global_step": 11095, "epoch": 133} {"train_loss": -17.72542953491211, "global_step": 11096, "epoch": 133} {"train_loss": -17.772703170776367, "global_step": 11097, "epoch": 133} {"train_loss": -18.055444717407227, "global_step": 11098, "epoch": 133} {"train_loss": -18.201875686645508, "global_step": 11099, "epoch": 133} {"train_loss": -17.69904136657715, "global_step": 11100, "epoch": 133} {"train_loss": -17.650413513183594, "global_step": 11101, "epoch": 133} {"train_loss": -17.475379943847656, "global_step": 11102, "epoch": 133} {"train_loss": -17.39539909362793, "global_step": 11103, "epoch": 133} {"train_loss": -17.857431411743164, "global_step": 11104, "epoch": 133} {"train_loss": -17.556760787963867, "global_step": 11105, "epoch": 133} {"train_loss": -17.60223388671875, "global_step": 11106, "epoch": 133} {"train_loss": -17.773733139038086, "global_step": 11107, "epoch": 133} {"train_loss": -17.684532165527344, "global_step": 11108, "epoch": 133} {"train_loss": -17.601774215698242, "global_step": 11109, "epoch": 133} {"train_loss": -18.051586151123047, "global_step": 11110, "epoch": 133} {"train_loss": -17.257034301757812, "global_step": 11111, "epoch": 133} {"train_loss": -17.495399475097656, "global_step": 11112, "epoch": 133} {"train_loss": -18.12019920349121, "global_step": 11113, "epoch": 133} {"train_loss": -17.821577072143555, "global_step": 11114, "epoch": 133} {"train_loss": -17.5563907623291, "global_step": 11115, "epoch": 133} {"train_loss": -17.74637794494629, "global_step": 11116, "epoch": 133} {"train_loss": -17.543058395385742, "global_step": 11117, "epoch": 133} {"train_loss": -17.786420822143555, "global_step": 11118, "epoch": 133} {"train_loss": -17.6023006439209, "global_step": 11119, "epoch": 133} {"train_loss": -17.856735229492188, "global_step": 11120, "epoch": 133} {"train_loss": -17.77835917185588, "global_step": 11121, "epoch": 133, "val_loss": 6113703.0} {"train_loss": -17.6359920501709, "global_step": 11122, "epoch": 134} {"train_loss": -17.72467803955078, "global_step": 11123, "epoch": 134} {"train_loss": -17.8181095123291, "global_step": 11124, "epoch": 134} {"train_loss": -17.696569442749023, "global_step": 11125, "epoch": 134} {"train_loss": -17.739089965820312, "global_step": 11126, "epoch": 134} {"train_loss": -17.92354393005371, "global_step": 11127, "epoch": 134} {"train_loss": -17.473020553588867, "global_step": 11128, "epoch": 134} {"train_loss": -17.48672103881836, "global_step": 11129, "epoch": 134} {"train_loss": -17.270536422729492, "global_step": 11130, "epoch": 134} {"train_loss": -17.59050178527832, "global_step": 11131, "epoch": 134} {"train_loss": -17.627222061157227, "global_step": 11132, "epoch": 134} {"train_loss": -17.809749603271484, "global_step": 11133, "epoch": 134} {"train_loss": -17.868194580078125, "global_step": 11134, "epoch": 134} {"train_loss": -17.818592071533203, "global_step": 11135, "epoch": 134} {"train_loss": -17.76849365234375, "global_step": 11136, "epoch": 134} {"train_loss": -17.934640884399414, "global_step": 11137, "epoch": 134} {"train_loss": -17.784530639648438, "global_step": 11138, "epoch": 134} {"train_loss": -17.640857696533203, "global_step": 11139, "epoch": 134} {"train_loss": -17.64657211303711, "global_step": 11140, "epoch": 134} {"train_loss": -17.85432243347168, "global_step": 11141, "epoch": 134} {"train_loss": -17.748762130737305, "global_step": 11142, "epoch": 134} {"train_loss": -17.703275680541992, "global_step": 11143, "epoch": 134} {"train_loss": -18.042800903320312, "global_step": 11144, "epoch": 134} {"train_loss": -17.647714614868164, "global_step": 11145, "epoch": 134} {"train_loss": -18.03447723388672, "global_step": 11146, "epoch": 134} {"train_loss": -17.549589157104492, "global_step": 11147, "epoch": 134} {"train_loss": -17.800352096557617, "global_step": 11148, "epoch": 134} {"train_loss": -17.96442985534668, "global_step": 11149, "epoch": 134} {"train_loss": -17.96661376953125, "global_step": 11150, "epoch": 134} {"train_loss": -17.935277938842773, "global_step": 11151, "epoch": 134} {"train_loss": -17.778656005859375, "global_step": 11152, "epoch": 134} {"train_loss": -17.3975887298584, "global_step": 11153, "epoch": 134} {"train_loss": -17.409976959228516, "global_step": 11154, "epoch": 134} {"train_loss": -18.3792781829834, "global_step": 11155, "epoch": 134} {"train_loss": -17.98805046081543, "global_step": 11156, "epoch": 134} {"train_loss": -17.835359573364258, "global_step": 11157, "epoch": 134} {"train_loss": -17.211584091186523, "global_step": 11158, "epoch": 134} {"train_loss": -17.69623374938965, "global_step": 11159, "epoch": 134} {"train_loss": -18.02569580078125, "global_step": 11160, "epoch": 134} {"train_loss": -17.84383201599121, "global_step": 11161, "epoch": 134} {"train_loss": -18.00839614868164, "global_step": 11162, "epoch": 134} {"train_loss": -17.596546173095703, "global_step": 11163, "epoch": 134} {"train_loss": -17.812807083129883, "global_step": 11164, "epoch": 134} {"train_loss": -17.86402702331543, "global_step": 11165, "epoch": 134} {"train_loss": -17.717573165893555, "global_step": 11166, "epoch": 134} {"train_loss": -17.560110092163086, "global_step": 11167, "epoch": 134} {"train_loss": -18.0308837890625, "global_step": 11168, "epoch": 134} {"train_loss": -17.52158546447754, "global_step": 11169, "epoch": 134} {"train_loss": -18.0047664642334, "global_step": 11170, "epoch": 134} {"train_loss": -17.515897750854492, "global_step": 11171, "epoch": 134} {"train_loss": -18.105100631713867, "global_step": 11172, "epoch": 134} {"train_loss": -17.685087203979492, "global_step": 11173, "epoch": 134} {"train_loss": -17.58021354675293, "global_step": 11174, "epoch": 134} {"train_loss": -18.205121994018555, "global_step": 11175, "epoch": 134} {"train_loss": -17.737733840942383, "global_step": 11176, "epoch": 134} {"train_loss": -18.006765365600586, "global_step": 11177, "epoch": 134} {"train_loss": -17.40665054321289, "global_step": 11178, "epoch": 134} {"train_loss": -17.598934173583984, "global_step": 11179, "epoch": 134} {"train_loss": -17.753942489624023, "global_step": 11180, "epoch": 134} {"train_loss": -17.826269149780273, "global_step": 11181, "epoch": 134} {"train_loss": -17.91499137878418, "global_step": 11182, "epoch": 134} {"train_loss": -17.717239379882812, "global_step": 11183, "epoch": 134} {"train_loss": -18.07564353942871, "global_step": 11184, "epoch": 134} {"train_loss": -17.7633113861084, "global_step": 11185, "epoch": 134} {"train_loss": -17.829851150512695, "global_step": 11186, "epoch": 134} {"train_loss": -17.6854248046875, "global_step": 11187, "epoch": 134} {"train_loss": -17.7759952545166, "global_step": 11188, "epoch": 134} {"train_loss": -17.998987197875977, "global_step": 11189, "epoch": 134} {"train_loss": -17.866201400756836, "global_step": 11190, "epoch": 134} {"train_loss": -17.87409019470215, "global_step": 11191, "epoch": 134} {"train_loss": -17.86516761779785, "global_step": 11192, "epoch": 134} {"train_loss": -17.48921012878418, "global_step": 11193, "epoch": 134} {"train_loss": -17.61899185180664, "global_step": 11194, "epoch": 134} {"train_loss": -17.618436813354492, "global_step": 11195, "epoch": 134} {"train_loss": -17.693145751953125, "global_step": 11196, "epoch": 134} {"train_loss": -17.867258071899414, "global_step": 11197, "epoch": 134} {"train_loss": -17.869144439697266, "global_step": 11198, "epoch": 134} {"train_loss": -17.7227840423584, "global_step": 11199, "epoch": 134} {"train_loss": -17.99361228942871, "global_step": 11200, "epoch": 134} {"train_loss": -17.4818172454834, "global_step": 11201, "epoch": 134} {"train_loss": -17.95876121520996, "global_step": 11202, "epoch": 134} {"train_loss": -17.51897621154785, "global_step": 11203, "epoch": 134} {"train_loss": -17.773878740977093, "global_step": 11204, "epoch": 134, "val_loss": 6186254.0} {"train_loss": -17.29823112487793, "global_step": 11205, "epoch": 135} {"train_loss": -17.576074600219727, "global_step": 11206, "epoch": 135} {"train_loss": -17.404386520385742, "global_step": 11207, "epoch": 135} {"train_loss": -17.28213882446289, "global_step": 11208, "epoch": 135} {"train_loss": -17.59889793395996, "global_step": 11209, "epoch": 135} {"train_loss": -16.95560073852539, "global_step": 11210, "epoch": 135} {"train_loss": -17.479169845581055, "global_step": 11211, "epoch": 135} {"train_loss": -17.5228328704834, "global_step": 11212, "epoch": 135} {"train_loss": -17.39162254333496, "global_step": 11213, "epoch": 135} {"train_loss": -17.541297912597656, "global_step": 11214, "epoch": 135} {"train_loss": -17.693449020385742, "global_step": 11215, "epoch": 135} {"train_loss": -17.521982192993164, "global_step": 11216, "epoch": 135} {"train_loss": -17.594425201416016, "global_step": 11217, "epoch": 135} {"train_loss": -17.676197052001953, "global_step": 11218, "epoch": 135} {"train_loss": -17.410369873046875, "global_step": 11219, "epoch": 135} {"train_loss": -17.222753524780273, "global_step": 11220, "epoch": 135} {"train_loss": -17.612165451049805, "global_step": 11221, "epoch": 135} {"train_loss": -17.199533462524414, "global_step": 11222, "epoch": 135} {"train_loss": -17.52680015563965, "global_step": 11223, "epoch": 135} {"train_loss": -17.590381622314453, "global_step": 11224, "epoch": 135} {"train_loss": -17.868661880493164, "global_step": 11225, "epoch": 135} {"train_loss": -17.937366485595703, "global_step": 11226, "epoch": 135} {"train_loss": -17.642038345336914, "global_step": 11227, "epoch": 135} {"train_loss": -17.669858932495117, "global_step": 11228, "epoch": 135} {"train_loss": -17.980087280273438, "global_step": 11229, "epoch": 135} {"train_loss": -17.749536514282227, "global_step": 11230, "epoch": 135} {"train_loss": -17.932050704956055, "global_step": 11231, "epoch": 135} {"train_loss": -18.001766204833984, "global_step": 11232, "epoch": 135} {"train_loss": -17.9104061126709, "global_step": 11233, "epoch": 135} {"train_loss": -17.523847579956055, "global_step": 11234, "epoch": 135} {"train_loss": -17.84716796875, "global_step": 11235, "epoch": 135} {"train_loss": -17.924604415893555, "global_step": 11236, "epoch": 135} {"train_loss": -17.921232223510742, "global_step": 11237, "epoch": 135} {"train_loss": -18.02679443359375, "global_step": 11238, "epoch": 135} {"train_loss": -17.388959884643555, "global_step": 11239, "epoch": 135} {"train_loss": -17.99386978149414, "global_step": 11240, "epoch": 135} {"train_loss": -17.735910415649414, "global_step": 11241, "epoch": 135} {"train_loss": -17.636066436767578, "global_step": 11242, "epoch": 135} {"train_loss": -17.67574119567871, "global_step": 11243, "epoch": 135} {"train_loss": -17.71980094909668, "global_step": 11244, "epoch": 135} {"train_loss": -17.762727737426758, "global_step": 11245, "epoch": 135} {"train_loss": -17.976896286010742, "global_step": 11246, "epoch": 135} {"train_loss": -17.662656784057617, "global_step": 11247, "epoch": 135} {"train_loss": -17.83000946044922, "global_step": 11248, "epoch": 135} {"train_loss": -17.82967185974121, "global_step": 11249, "epoch": 135} {"train_loss": -18.007200241088867, "global_step": 11250, "epoch": 135} {"train_loss": -17.6055965423584, "global_step": 11251, "epoch": 135} {"train_loss": -17.505884170532227, "global_step": 11252, "epoch": 135} {"train_loss": -17.714818954467773, "global_step": 11253, "epoch": 135} {"train_loss": -17.32977867126465, "global_step": 11254, "epoch": 135} {"train_loss": -17.963748931884766, "global_step": 11255, "epoch": 135} {"train_loss": -17.740232467651367, "global_step": 11256, "epoch": 135} {"train_loss": -17.77960968017578, "global_step": 11257, "epoch": 135} {"train_loss": -17.79461669921875, "global_step": 11258, "epoch": 135} {"train_loss": -17.517253875732422, "global_step": 11259, "epoch": 135} {"train_loss": -18.080350875854492, "global_step": 11260, "epoch": 135} {"train_loss": -17.91327476501465, "global_step": 11261, "epoch": 135} {"train_loss": -17.65074348449707, "global_step": 11262, "epoch": 135} {"train_loss": -18.05927848815918, "global_step": 11263, "epoch": 135} {"train_loss": -17.76497459411621, "global_step": 11264, "epoch": 135} {"train_loss": -18.056903839111328, "global_step": 11265, "epoch": 135} {"train_loss": -17.747041702270508, "global_step": 11266, "epoch": 135} {"train_loss": -17.672618865966797, "global_step": 11267, "epoch": 135} {"train_loss": -18.15625, "global_step": 11268, "epoch": 135} {"train_loss": -17.87451171875, "global_step": 11269, "epoch": 135} {"train_loss": -17.540679931640625, "global_step": 11270, "epoch": 135} {"train_loss": -17.651044845581055, "global_step": 11271, "epoch": 135} {"train_loss": -17.437097549438477, "global_step": 11272, "epoch": 135} {"train_loss": -17.2865047454834, "global_step": 11273, "epoch": 135} {"train_loss": -18.031295776367188, "global_step": 11274, "epoch": 135} {"train_loss": -18.04568862915039, "global_step": 11275, "epoch": 135} {"train_loss": -17.880266189575195, "global_step": 11276, "epoch": 135} {"train_loss": -17.587162017822266, "global_step": 11277, "epoch": 135} {"train_loss": -17.14383888244629, "global_step": 11278, "epoch": 135} {"train_loss": -18.118715286254883, "global_step": 11279, "epoch": 135} {"train_loss": -18.084171295166016, "global_step": 11280, "epoch": 135} {"train_loss": -17.9892520904541, "global_step": 11281, "epoch": 135} {"train_loss": -17.898622512817383, "global_step": 11282, "epoch": 135} {"train_loss": -17.656909942626953, "global_step": 11283, "epoch": 135} {"train_loss": -17.70941734313965, "global_step": 11284, "epoch": 135} {"train_loss": -17.411001205444336, "global_step": 11285, "epoch": 135} {"train_loss": -17.564136505126953, "global_step": 11286, "epoch": 135} {"train_loss": -17.70290797589773, "global_step": 11287, "epoch": 135, "val_loss": 6052085.0} {"train_loss": -17.759092330932617, "global_step": 11288, "epoch": 136} {"train_loss": -17.50203514099121, "global_step": 11289, "epoch": 136} {"train_loss": -17.70673942565918, "global_step": 11290, "epoch": 136} {"train_loss": -17.565500259399414, "global_step": 11291, "epoch": 136} {"train_loss": -17.80781364440918, "global_step": 11292, "epoch": 136} {"train_loss": -18.036291122436523, "global_step": 11293, "epoch": 136} {"train_loss": -17.55988311767578, "global_step": 11294, "epoch": 136} {"train_loss": -17.882720947265625, "global_step": 11295, "epoch": 136} {"train_loss": -17.847272872924805, "global_step": 11296, "epoch": 136} {"train_loss": -17.803659439086914, "global_step": 11297, "epoch": 136} {"train_loss": -17.315265655517578, "global_step": 11298, "epoch": 136} {"train_loss": -17.446205139160156, "global_step": 11299, "epoch": 136} {"train_loss": -17.875316619873047, "global_step": 11300, "epoch": 136} {"train_loss": -17.465970993041992, "global_step": 11301, "epoch": 136} {"train_loss": -18.123321533203125, "global_step": 11302, "epoch": 136} {"train_loss": -17.84731101989746, "global_step": 11303, "epoch": 136} {"train_loss": -18.135610580444336, "global_step": 11304, "epoch": 136} {"train_loss": -17.818143844604492, "global_step": 11305, "epoch": 136} {"train_loss": -18.072154998779297, "global_step": 11306, "epoch": 136} {"train_loss": -18.030874252319336, "global_step": 11307, "epoch": 136} {"train_loss": -17.682552337646484, "global_step": 11308, "epoch": 136} {"train_loss": -17.84504508972168, "global_step": 11309, "epoch": 136} {"train_loss": -17.590978622436523, "global_step": 11310, "epoch": 136} {"train_loss": -17.886455535888672, "global_step": 11311, "epoch": 136} {"train_loss": -18.16213607788086, "global_step": 11312, "epoch": 136} {"train_loss": -17.481306076049805, "global_step": 11313, "epoch": 136} {"train_loss": -17.442523956298828, "global_step": 11314, "epoch": 136} {"train_loss": -17.487258911132812, "global_step": 11315, "epoch": 136} {"train_loss": -17.934326171875, "global_step": 11316, "epoch": 136} {"train_loss": -17.76190757751465, "global_step": 11317, "epoch": 136} {"train_loss": -17.94705581665039, "global_step": 11318, "epoch": 136} {"train_loss": -17.924890518188477, "global_step": 11319, "epoch": 136} {"train_loss": -17.989917755126953, "global_step": 11320, "epoch": 136} {"train_loss": -17.973812103271484, "global_step": 11321, "epoch": 136} {"train_loss": -17.535324096679688, "global_step": 11322, "epoch": 136} {"train_loss": -17.807342529296875, "global_step": 11323, "epoch": 136} {"train_loss": -17.573522567749023, "global_step": 11324, "epoch": 136} {"train_loss": -17.400724411010742, "global_step": 11325, "epoch": 136} {"train_loss": -17.90420913696289, "global_step": 11326, "epoch": 136} {"train_loss": -17.573476791381836, "global_step": 11327, "epoch": 136} {"train_loss": -17.9417724609375, "global_step": 11328, "epoch": 136} {"train_loss": -17.506498336791992, "global_step": 11329, "epoch": 136} {"train_loss": -17.508520126342773, "global_step": 11330, "epoch": 136} {"train_loss": -17.723352432250977, "global_step": 11331, "epoch": 136} {"train_loss": -17.796445846557617, "global_step": 11332, "epoch": 136} {"train_loss": -17.72774314880371, "global_step": 11333, "epoch": 136} {"train_loss": -17.335830688476562, "global_step": 11334, "epoch": 136} {"train_loss": -17.612594604492188, "global_step": 11335, "epoch": 136} {"train_loss": -17.928442001342773, "global_step": 11336, "epoch": 136} {"train_loss": -17.649063110351562, "global_step": 11337, "epoch": 136} {"train_loss": -17.866413116455078, "global_step": 11338, "epoch": 136} {"train_loss": -17.598047256469727, "global_step": 11339, "epoch": 136} {"train_loss": -17.904943466186523, "global_step": 11340, "epoch": 136} {"train_loss": -17.817235946655273, "global_step": 11341, "epoch": 136} {"train_loss": -17.791889190673828, "global_step": 11342, "epoch": 136} {"train_loss": -17.942792892456055, "global_step": 11343, "epoch": 136} {"train_loss": -17.732847213745117, "global_step": 11344, "epoch": 136} {"train_loss": -17.72847557067871, "global_step": 11345, "epoch": 136} {"train_loss": -17.941349029541016, "global_step": 11346, "epoch": 136} {"train_loss": -17.80666160583496, "global_step": 11347, "epoch": 136} {"train_loss": -17.66270637512207, "global_step": 11348, "epoch": 136} {"train_loss": -17.615324020385742, "global_step": 11349, "epoch": 136} {"train_loss": -17.99382972717285, "global_step": 11350, "epoch": 136} {"train_loss": -17.873876571655273, "global_step": 11351, "epoch": 136} {"train_loss": -17.87078857421875, "global_step": 11352, "epoch": 136} {"train_loss": -17.72954559326172, "global_step": 11353, "epoch": 136} {"train_loss": -18.030067443847656, "global_step": 11354, "epoch": 136} {"train_loss": -17.84065055847168, "global_step": 11355, "epoch": 136} {"train_loss": -17.78034019470215, "global_step": 11356, "epoch": 136} {"train_loss": -17.749006271362305, "global_step": 11357, "epoch": 136} {"train_loss": -17.733240127563477, "global_step": 11358, "epoch": 136} {"train_loss": -17.784473419189453, "global_step": 11359, "epoch": 136} {"train_loss": -17.790130615234375, "global_step": 11360, "epoch": 136} {"train_loss": -17.621536254882812, "global_step": 11361, "epoch": 136} {"train_loss": -18.1019344329834, "global_step": 11362, "epoch": 136} {"train_loss": -17.84391212463379, "global_step": 11363, "epoch": 136} {"train_loss": -18.03468132019043, "global_step": 11364, "epoch": 136} {"train_loss": -17.424346923828125, "global_step": 11365, "epoch": 136} {"train_loss": -18.044822692871094, "global_step": 11366, "epoch": 136} {"train_loss": -17.992116928100586, "global_step": 11367, "epoch": 136} {"train_loss": -17.672910690307617, "global_step": 11368, "epoch": 136} {"train_loss": -17.66873550415039, "global_step": 11369, "epoch": 136} {"train_loss": -17.764721008668463, "global_step": 11370, "epoch": 136, "val_loss": 6081524.0} {"train_loss": -17.379669189453125, "global_step": 11371, "epoch": 137} {"train_loss": -17.83348846435547, "global_step": 11372, "epoch": 137} {"train_loss": -17.59634017944336, "global_step": 11373, "epoch": 137} {"train_loss": -17.780071258544922, "global_step": 11374, "epoch": 137} {"train_loss": -17.898412704467773, "global_step": 11375, "epoch": 137} {"train_loss": -17.72112274169922, "global_step": 11376, "epoch": 137} {"train_loss": -17.831480026245117, "global_step": 11377, "epoch": 137} {"train_loss": -17.563541412353516, "global_step": 11378, "epoch": 137} {"train_loss": -17.880464553833008, "global_step": 11379, "epoch": 137} {"train_loss": -17.791086196899414, "global_step": 11380, "epoch": 137} {"train_loss": -17.696916580200195, "global_step": 11381, "epoch": 137} {"train_loss": -17.8851375579834, "global_step": 11382, "epoch": 137} {"train_loss": -17.706274032592773, "global_step": 11383, "epoch": 137} {"train_loss": -17.042205810546875, "global_step": 11384, "epoch": 137} {"train_loss": -17.533430099487305, "global_step": 11385, "epoch": 137} {"train_loss": -17.564401626586914, "global_step": 11386, "epoch": 137} {"train_loss": -18.253219604492188, "global_step": 11387, "epoch": 137} {"train_loss": -17.801651000976562, "global_step": 11388, "epoch": 137} {"train_loss": -17.995840072631836, "global_step": 11389, "epoch": 137} {"train_loss": -17.68312644958496, "global_step": 11390, "epoch": 137} {"train_loss": -17.794574737548828, "global_step": 11391, "epoch": 137} {"train_loss": -17.899494171142578, "global_step": 11392, "epoch": 137} {"train_loss": -17.786867141723633, "global_step": 11393, "epoch": 137} {"train_loss": -17.47035789489746, "global_step": 11394, "epoch": 137} {"train_loss": -17.77328109741211, "global_step": 11395, "epoch": 137} {"train_loss": -17.512924194335938, "global_step": 11396, "epoch": 137} {"train_loss": -18.001556396484375, "global_step": 11397, "epoch": 137} {"train_loss": -17.654109954833984, "global_step": 11398, "epoch": 137} {"train_loss": -17.870424270629883, "global_step": 11399, "epoch": 137} {"train_loss": -17.989044189453125, "global_step": 11400, "epoch": 137} {"train_loss": -17.783981323242188, "global_step": 11401, "epoch": 137} {"train_loss": -17.691404342651367, "global_step": 11402, "epoch": 137} {"train_loss": -18.081344604492188, "global_step": 11403, "epoch": 137} {"train_loss": -17.557607650756836, "global_step": 11404, "epoch": 137} {"train_loss": -17.875110626220703, "global_step": 11405, "epoch": 137} {"train_loss": -17.9521541595459, "global_step": 11406, "epoch": 137} {"train_loss": -17.555561065673828, "global_step": 11407, "epoch": 137} {"train_loss": -17.799114227294922, "global_step": 11408, "epoch": 137} {"train_loss": -17.833032608032227, "global_step": 11409, "epoch": 137} {"train_loss": -17.34067726135254, "global_step": 11410, "epoch": 137} {"train_loss": -17.866138458251953, "global_step": 11411, "epoch": 137} {"train_loss": -17.229419708251953, "global_step": 11412, "epoch": 137} {"train_loss": -17.5125789642334, "global_step": 11413, "epoch": 137} {"train_loss": -17.979341506958008, "global_step": 11414, "epoch": 137} {"train_loss": -17.81854248046875, "global_step": 11415, "epoch": 137} {"train_loss": -17.26152229309082, "global_step": 11416, "epoch": 137} {"train_loss": -17.73756217956543, "global_step": 11417, "epoch": 137} {"train_loss": -17.74569320678711, "global_step": 11418, "epoch": 137} {"train_loss": -17.718460083007812, "global_step": 11419, "epoch": 137} {"train_loss": -17.855607986450195, "global_step": 11420, "epoch": 137} {"train_loss": -17.764936447143555, "global_step": 11421, "epoch": 137} {"train_loss": -17.758655548095703, "global_step": 11422, "epoch": 137} {"train_loss": -17.247329711914062, "global_step": 11423, "epoch": 137} {"train_loss": -17.360015869140625, "global_step": 11424, "epoch": 137} {"train_loss": -17.988874435424805, "global_step": 11425, "epoch": 137} {"train_loss": -17.647422790527344, "global_step": 11426, "epoch": 137} {"train_loss": -17.99928092956543, "global_step": 11427, "epoch": 137} {"train_loss": -17.72193717956543, "global_step": 11428, "epoch": 137} {"train_loss": -17.90135383605957, "global_step": 11429, "epoch": 137} {"train_loss": -18.17409324645996, "global_step": 11430, "epoch": 137} {"train_loss": -18.140029907226562, "global_step": 11431, "epoch": 137} {"train_loss": -17.866113662719727, "global_step": 11432, "epoch": 137} {"train_loss": -17.817197799682617, "global_step": 11433, "epoch": 137} {"train_loss": -17.780241012573242, "global_step": 11434, "epoch": 137} {"train_loss": -17.98575210571289, "global_step": 11435, "epoch": 137} {"train_loss": -17.82529640197754, "global_step": 11436, "epoch": 137} {"train_loss": -17.9696102142334, "global_step": 11437, "epoch": 137} {"train_loss": -17.431772232055664, "global_step": 11438, "epoch": 137} {"train_loss": -17.989673614501953, "global_step": 11439, "epoch": 137} {"train_loss": -17.60774803161621, "global_step": 11440, "epoch": 137} {"train_loss": -17.887014389038086, "global_step": 11441, "epoch": 137} {"train_loss": -17.41839599609375, "global_step": 11442, "epoch": 137} {"train_loss": -17.779943466186523, "global_step": 11443, "epoch": 137} {"train_loss": -17.963651657104492, "global_step": 11444, "epoch": 137} {"train_loss": -17.9265079498291, "global_step": 11445, "epoch": 137} {"train_loss": -17.86634635925293, "global_step": 11446, "epoch": 137} {"train_loss": -18.08909797668457, "global_step": 11447, "epoch": 137} {"train_loss": -17.485774993896484, "global_step": 11448, "epoch": 137} {"train_loss": -17.63382911682129, "global_step": 11449, "epoch": 137} {"train_loss": -17.70305633544922, "global_step": 11450, "epoch": 137} {"train_loss": -18.090282440185547, "global_step": 11451, "epoch": 137} {"train_loss": -17.898696899414062, "global_step": 11452, "epoch": 137} {"train_loss": -17.761316138577747, "global_step": 11453, "epoch": 137, "val_loss": 6367265.0} {"train_loss": -17.13522720336914, "global_step": 11454, "epoch": 138} {"train_loss": -17.468936920166016, "global_step": 11455, "epoch": 138} {"train_loss": -17.958845138549805, "global_step": 11456, "epoch": 138} {"train_loss": -18.043176651000977, "global_step": 11457, "epoch": 138} {"train_loss": -17.107772827148438, "global_step": 11458, "epoch": 138} {"train_loss": -17.4560604095459, "global_step": 11459, "epoch": 138} {"train_loss": -17.248449325561523, "global_step": 11460, "epoch": 138} {"train_loss": -17.581159591674805, "global_step": 11461, "epoch": 138} {"train_loss": -17.805212020874023, "global_step": 11462, "epoch": 138} {"train_loss": -17.774686813354492, "global_step": 11463, "epoch": 138} {"train_loss": -17.737102508544922, "global_step": 11464, "epoch": 138} {"train_loss": -17.473346710205078, "global_step": 11465, "epoch": 138} {"train_loss": -17.927593231201172, "global_step": 11466, "epoch": 138} {"train_loss": -17.68750762939453, "global_step": 11467, "epoch": 138} {"train_loss": -17.754323959350586, "global_step": 11468, "epoch": 138} {"train_loss": -17.831262588500977, "global_step": 11469, "epoch": 138} {"train_loss": -17.779850006103516, "global_step": 11470, "epoch": 138} {"train_loss": -17.523313522338867, "global_step": 11471, "epoch": 138} {"train_loss": -17.844053268432617, "global_step": 11472, "epoch": 138} {"train_loss": -17.6871280670166, "global_step": 11473, "epoch": 138} {"train_loss": -18.044769287109375, "global_step": 11474, "epoch": 138} {"train_loss": -18.13381004333496, "global_step": 11475, "epoch": 138} {"train_loss": -18.206619262695312, "global_step": 11476, "epoch": 138} {"train_loss": -17.79727554321289, "global_step": 11477, "epoch": 138} {"train_loss": -17.825952529907227, "global_step": 11478, "epoch": 138} {"train_loss": -17.611074447631836, "global_step": 11479, "epoch": 138} {"train_loss": -17.739215850830078, "global_step": 11480, "epoch": 138} {"train_loss": -17.828935623168945, "global_step": 11481, "epoch": 138} {"train_loss": -17.868589401245117, "global_step": 11482, "epoch": 138} {"train_loss": -17.46175765991211, "global_step": 11483, "epoch": 138} {"train_loss": -17.890321731567383, "global_step": 11484, "epoch": 138} {"train_loss": -17.677534103393555, "global_step": 11485, "epoch": 138} {"train_loss": -17.958219528198242, "global_step": 11486, "epoch": 138} {"train_loss": -17.159324645996094, "global_step": 11487, "epoch": 138} {"train_loss": -17.394535064697266, "global_step": 11488, "epoch": 138} {"train_loss": -17.909469604492188, "global_step": 11489, "epoch": 138} {"train_loss": -17.67591667175293, "global_step": 11490, "epoch": 138} {"train_loss": -17.89935874938965, "global_step": 11491, "epoch": 138} {"train_loss": -17.955446243286133, "global_step": 11492, "epoch": 138} {"train_loss": -17.44068717956543, "global_step": 11493, "epoch": 138} {"train_loss": -17.841276168823242, "global_step": 11494, "epoch": 138} {"train_loss": -17.401601791381836, "global_step": 11495, "epoch": 138} {"train_loss": -17.599136352539062, "global_step": 11496, "epoch": 138} {"train_loss": -17.522375106811523, "global_step": 11497, "epoch": 138} {"train_loss": -17.911582946777344, "global_step": 11498, "epoch": 138} {"train_loss": -17.88955307006836, "global_step": 11499, "epoch": 138} {"train_loss": -18.237890243530273, "global_step": 11500, "epoch": 138} {"train_loss": -17.8705997467041, "global_step": 11501, "epoch": 138} {"train_loss": -17.744352340698242, "global_step": 11502, "epoch": 138} {"train_loss": -17.651172637939453, "global_step": 11503, "epoch": 138} {"train_loss": -18.010025024414062, "global_step": 11504, "epoch": 138} {"train_loss": -17.596664428710938, "global_step": 11505, "epoch": 138} {"train_loss": -17.92092514038086, "global_step": 11506, "epoch": 138} {"train_loss": -17.856552124023438, "global_step": 11507, "epoch": 138} {"train_loss": -17.680904388427734, "global_step": 11508, "epoch": 138} {"train_loss": -18.092199325561523, "global_step": 11509, "epoch": 138} {"train_loss": -17.920679092407227, "global_step": 11510, "epoch": 138} {"train_loss": -17.437284469604492, "global_step": 11511, "epoch": 138} {"train_loss": -17.886545181274414, "global_step": 11512, "epoch": 138} {"train_loss": -17.879505157470703, "global_step": 11513, "epoch": 138} {"train_loss": -17.745121002197266, "global_step": 11514, "epoch": 138} {"train_loss": -17.813119888305664, "global_step": 11515, "epoch": 138} {"train_loss": -17.751602172851562, "global_step": 11516, "epoch": 138} {"train_loss": -17.4458065032959, "global_step": 11517, "epoch": 138} {"train_loss": -17.774961471557617, "global_step": 11518, "epoch": 138} {"train_loss": -18.359268188476562, "global_step": 11519, "epoch": 138} {"train_loss": -17.784955978393555, "global_step": 11520, "epoch": 138} {"train_loss": -18.033517837524414, "global_step": 11521, "epoch": 138} {"train_loss": -17.662107467651367, "global_step": 11522, "epoch": 138} {"train_loss": -17.514713287353516, "global_step": 11523, "epoch": 138} {"train_loss": -17.787118911743164, "global_step": 11524, "epoch": 138} {"train_loss": -17.861730575561523, "global_step": 11525, "epoch": 138} {"train_loss": -17.9729061126709, "global_step": 11526, "epoch": 138} {"train_loss": -17.461627960205078, "global_step": 11527, "epoch": 138} {"train_loss": -17.75176429748535, "global_step": 11528, "epoch": 138} {"train_loss": -17.4652099609375, "global_step": 11529, "epoch": 138} {"train_loss": -17.94589614868164, "global_step": 11530, "epoch": 138} {"train_loss": -17.859270095825195, "global_step": 11531, "epoch": 138} {"train_loss": -17.803958892822266, "global_step": 11532, "epoch": 138} {"train_loss": -17.866596221923828, "global_step": 11533, "epoch": 138} {"train_loss": -17.59842872619629, "global_step": 11534, "epoch": 138} {"train_loss": -17.91451072692871, "global_step": 11535, "epoch": 138} {"train_loss": -17.74461955334767, "global_step": 11536, "epoch": 138, "val_loss": 5950297.5} {"train_loss": -17.235910415649414, "global_step": 11537, "epoch": 139} {"train_loss": -17.524789810180664, "global_step": 11538, "epoch": 139} {"train_loss": -17.861724853515625, "global_step": 11539, "epoch": 139} {"train_loss": -17.744688034057617, "global_step": 11540, "epoch": 139} {"train_loss": -18.326690673828125, "global_step": 11541, "epoch": 139} {"train_loss": -17.843719482421875, "global_step": 11542, "epoch": 139} {"train_loss": -17.72562599182129, "global_step": 11543, "epoch": 139} {"train_loss": -17.614242553710938, "global_step": 11544, "epoch": 139} {"train_loss": -17.552555084228516, "global_step": 11545, "epoch": 139} {"train_loss": -17.864084243774414, "global_step": 11546, "epoch": 139} {"train_loss": -17.53837776184082, "global_step": 11547, "epoch": 139} {"train_loss": -17.431884765625, "global_step": 11548, "epoch": 139} {"train_loss": -17.844806671142578, "global_step": 11549, "epoch": 139} {"train_loss": -17.98750877380371, "global_step": 11550, "epoch": 139} {"train_loss": -17.439687728881836, "global_step": 11551, "epoch": 139} {"train_loss": -17.780935287475586, "global_step": 11552, "epoch": 139} {"train_loss": -17.652666091918945, "global_step": 11553, "epoch": 139} {"train_loss": -17.692724227905273, "global_step": 11554, "epoch": 139} {"train_loss": -18.12392234802246, "global_step": 11555, "epoch": 139} {"train_loss": -17.616947174072266, "global_step": 11556, "epoch": 139} {"train_loss": -17.925052642822266, "global_step": 11557, "epoch": 139} {"train_loss": -17.64959144592285, "global_step": 11558, "epoch": 139} {"train_loss": -17.667102813720703, "global_step": 11559, "epoch": 139} {"train_loss": -18.02210807800293, "global_step": 11560, "epoch": 139} {"train_loss": -18.11543846130371, "global_step": 11561, "epoch": 139} {"train_loss": -17.77640151977539, "global_step": 11562, "epoch": 139} {"train_loss": -18.19954490661621, "global_step": 11563, "epoch": 139} {"train_loss": -17.740659713745117, "global_step": 11564, "epoch": 139} {"train_loss": -17.43751335144043, "global_step": 11565, "epoch": 139} {"train_loss": -17.534692764282227, "global_step": 11566, "epoch": 139} {"train_loss": -17.93849754333496, "global_step": 11567, "epoch": 139} {"train_loss": -17.93915557861328, "global_step": 11568, "epoch": 139} {"train_loss": -17.2456111907959, "global_step": 11569, "epoch": 139} {"train_loss": -18.022565841674805, "global_step": 11570, "epoch": 139} {"train_loss": -17.756999969482422, "global_step": 11571, "epoch": 139} {"train_loss": -18.273345947265625, "global_step": 11572, "epoch": 139} {"train_loss": -17.707061767578125, "global_step": 11573, "epoch": 139} {"train_loss": -17.522438049316406, "global_step": 11574, "epoch": 139} {"train_loss": -17.779020309448242, "global_step": 11575, "epoch": 139} {"train_loss": -17.785537719726562, "global_step": 11576, "epoch": 139} {"train_loss": -17.621795654296875, "global_step": 11577, "epoch": 139} {"train_loss": -17.787872314453125, "global_step": 11578, "epoch": 139} {"train_loss": -18.26401710510254, "global_step": 11579, "epoch": 139} {"train_loss": -17.747228622436523, "global_step": 11580, "epoch": 139} {"train_loss": -17.972732543945312, "global_step": 11581, "epoch": 139} {"train_loss": -18.21190071105957, "global_step": 11582, "epoch": 139} {"train_loss": -17.867246627807617, "global_step": 11583, "epoch": 139} {"train_loss": -17.94752311706543, "global_step": 11584, "epoch": 139} {"train_loss": -18.0096492767334, "global_step": 11585, "epoch": 139} {"train_loss": -18.057945251464844, "global_step": 11586, "epoch": 139} {"train_loss": -17.73256492614746, "global_step": 11587, "epoch": 139} {"train_loss": -17.616626739501953, "global_step": 11588, "epoch": 139} {"train_loss": -18.02744483947754, "global_step": 11589, "epoch": 139} {"train_loss": -17.59567642211914, "global_step": 11590, "epoch": 139} {"train_loss": -18.0296688079834, "global_step": 11591, "epoch": 139} {"train_loss": -17.83072280883789, "global_step": 11592, "epoch": 139} {"train_loss": -18.282812118530273, "global_step": 11593, "epoch": 139} {"train_loss": -17.865325927734375, "global_step": 11594, "epoch": 139} {"train_loss": -17.809865951538086, "global_step": 11595, "epoch": 139} {"train_loss": -17.6640625, "global_step": 11596, "epoch": 139} {"train_loss": -17.90537452697754, "global_step": 11597, "epoch": 139} {"train_loss": -17.824268341064453, "global_step": 11598, "epoch": 139} {"train_loss": -17.910846710205078, "global_step": 11599, "epoch": 139} {"train_loss": -17.555683135986328, "global_step": 11600, "epoch": 139} {"train_loss": -17.60226058959961, "global_step": 11601, "epoch": 139} {"train_loss": -17.797225952148438, "global_step": 11602, "epoch": 139} {"train_loss": -17.5379581451416, "global_step": 11603, "epoch": 139} {"train_loss": -17.855924606323242, "global_step": 11604, "epoch": 139} {"train_loss": -17.86337661743164, "global_step": 11605, "epoch": 139} {"train_loss": -17.859834671020508, "global_step": 11606, "epoch": 139} {"train_loss": -17.61101531982422, "global_step": 11607, "epoch": 139} {"train_loss": -17.780399322509766, "global_step": 11608, "epoch": 139} {"train_loss": -17.5499210357666, "global_step": 11609, "epoch": 139} {"train_loss": -17.803064346313477, "global_step": 11610, "epoch": 139} {"train_loss": -17.566621780395508, "global_step": 11611, "epoch": 139} {"train_loss": -17.652456283569336, "global_step": 11612, "epoch": 139} {"train_loss": -18.31340980529785, "global_step": 11613, "epoch": 139} {"train_loss": -17.65481948852539, "global_step": 11614, "epoch": 139} {"train_loss": -17.832387924194336, "global_step": 11615, "epoch": 139} {"train_loss": -17.84303092956543, "global_step": 11616, "epoch": 139} {"train_loss": -17.902524948120117, "global_step": 11617, "epoch": 139} {"train_loss": -17.391555786132812, "global_step": 11618, "epoch": 139} {"train_loss": -17.796039788119764, "global_step": 11619, "epoch": 139, "val_loss": 6068496.0} {"train_loss": -17.510957717895508, "global_step": 11620, "epoch": 140} {"train_loss": -18.07169532775879, "global_step": 11621, "epoch": 140} {"train_loss": -17.88442039489746, "global_step": 11622, "epoch": 140} {"train_loss": -17.493030548095703, "global_step": 11623, "epoch": 140} {"train_loss": -17.565380096435547, "global_step": 11624, "epoch": 140} {"train_loss": -17.876220703125, "global_step": 11625, "epoch": 140} {"train_loss": -17.448888778686523, "global_step": 11626, "epoch": 140} {"train_loss": -17.74945640563965, "global_step": 11627, "epoch": 140} {"train_loss": -17.657941818237305, "global_step": 11628, "epoch": 140} {"train_loss": -17.608816146850586, "global_step": 11629, "epoch": 140} {"train_loss": -17.893966674804688, "global_step": 11630, "epoch": 140} {"train_loss": -17.896268844604492, "global_step": 11631, "epoch": 140} {"train_loss": -17.648305892944336, "global_step": 11632, "epoch": 140} {"train_loss": -17.873931884765625, "global_step": 11633, "epoch": 140} {"train_loss": -17.3377628326416, "global_step": 11634, "epoch": 140} {"train_loss": -17.774290084838867, "global_step": 11635, "epoch": 140} {"train_loss": -17.934921264648438, "global_step": 11636, "epoch": 140} {"train_loss": -17.998794555664062, "global_step": 11637, "epoch": 140} {"train_loss": -17.458921432495117, "global_step": 11638, "epoch": 140} {"train_loss": -17.474763870239258, "global_step": 11639, "epoch": 140} {"train_loss": -17.617040634155273, "global_step": 11640, "epoch": 140} {"train_loss": -17.845849990844727, "global_step": 11641, "epoch": 140} {"train_loss": -17.4349365234375, "global_step": 11642, "epoch": 140} {"train_loss": -17.265562057495117, "global_step": 11643, "epoch": 140} {"train_loss": -17.498689651489258, "global_step": 11644, "epoch": 140} {"train_loss": -17.73421287536621, "global_step": 11645, "epoch": 140} {"train_loss": -17.994306564331055, "global_step": 11646, "epoch": 140} {"train_loss": -18.220245361328125, "global_step": 11647, "epoch": 140} {"train_loss": -17.626813888549805, "global_step": 11648, "epoch": 140} {"train_loss": -17.712413787841797, "global_step": 11649, "epoch": 140} {"train_loss": -17.793792724609375, "global_step": 11650, "epoch": 140} {"train_loss": -18.070947647094727, "global_step": 11651, "epoch": 140} {"train_loss": -17.738906860351562, "global_step": 11652, "epoch": 140} {"train_loss": -17.73297119140625, "global_step": 11653, "epoch": 140} {"train_loss": -17.7016658782959, "global_step": 11654, "epoch": 140} {"train_loss": -17.65151023864746, "global_step": 11655, "epoch": 140} {"train_loss": -17.75813102722168, "global_step": 11656, "epoch": 140} {"train_loss": -17.67534828186035, "global_step": 11657, "epoch": 140} {"train_loss": -17.93917465209961, "global_step": 11658, "epoch": 140} {"train_loss": -17.658830642700195, "global_step": 11659, "epoch": 140} {"train_loss": -17.69441795349121, "global_step": 11660, "epoch": 140} {"train_loss": -17.69693946838379, "global_step": 11661, "epoch": 140} {"train_loss": -17.42104148864746, "global_step": 11662, "epoch": 140} {"train_loss": -17.377817153930664, "global_step": 11663, "epoch": 140} {"train_loss": -17.884748458862305, "global_step": 11664, "epoch": 140} {"train_loss": -17.66813850402832, "global_step": 11665, "epoch": 140} {"train_loss": -18.096433639526367, "global_step": 11666, "epoch": 140} {"train_loss": -17.98333168029785, "global_step": 11667, "epoch": 140} {"train_loss": -18.135852813720703, "global_step": 11668, "epoch": 140} {"train_loss": -17.503551483154297, "global_step": 11669, "epoch": 140} {"train_loss": -17.98138999938965, "global_step": 11670, "epoch": 140} {"train_loss": -17.5490779876709, "global_step": 11671, "epoch": 140} {"train_loss": -18.21150016784668, "global_step": 11672, "epoch": 140} {"train_loss": -17.70492935180664, "global_step": 11673, "epoch": 140} {"train_loss": -17.978851318359375, "global_step": 11674, "epoch": 140} {"train_loss": -17.693857192993164, "global_step": 11675, "epoch": 140} {"train_loss": -17.88700294494629, "global_step": 11676, "epoch": 140} {"train_loss": -18.17596435546875, "global_step": 11677, "epoch": 140} {"train_loss": -17.901386260986328, "global_step": 11678, "epoch": 140} {"train_loss": -17.460233688354492, "global_step": 11679, "epoch": 140} {"train_loss": -18.127464294433594, "global_step": 11680, "epoch": 140} {"train_loss": -18.09149169921875, "global_step": 11681, "epoch": 140} {"train_loss": -17.853017807006836, "global_step": 11682, "epoch": 140} {"train_loss": -17.557220458984375, "global_step": 11683, "epoch": 140} {"train_loss": -18.010290145874023, "global_step": 11684, "epoch": 140} {"train_loss": -17.683979034423828, "global_step": 11685, "epoch": 140} {"train_loss": -17.647563934326172, "global_step": 11686, "epoch": 140} {"train_loss": -17.739517211914062, "global_step": 11687, "epoch": 140} {"train_loss": -18.14799690246582, "global_step": 11688, "epoch": 140} {"train_loss": -17.767385482788086, "global_step": 11689, "epoch": 140} {"train_loss": -17.7769718170166, "global_step": 11690, "epoch": 140} {"train_loss": -17.68992805480957, "global_step": 11691, "epoch": 140} {"train_loss": -18.08335304260254, "global_step": 11692, "epoch": 140} {"train_loss": -17.65044593811035, "global_step": 11693, "epoch": 140} {"train_loss": -17.85565185546875, "global_step": 11694, "epoch": 140} {"train_loss": -17.756914138793945, "global_step": 11695, "epoch": 140} {"train_loss": -18.03248405456543, "global_step": 11696, "epoch": 140} {"train_loss": -17.709726333618164, "global_step": 11697, "epoch": 140} {"train_loss": -17.793210983276367, "global_step": 11698, "epoch": 140} {"train_loss": -18.117130279541016, "global_step": 11699, "epoch": 140} {"train_loss": -17.926681518554688, "global_step": 11700, "epoch": 140} {"train_loss": -17.872053146362305, "global_step": 11701, "epoch": 140} {"train_loss": -17.78824629266578, "global_step": 11702, "epoch": 140, "val_loss": 6062206.0} {"train_loss": -17.17826271057129, "global_step": 11703, "epoch": 141} {"train_loss": -17.918437957763672, "global_step": 11704, "epoch": 141} {"train_loss": -17.869626998901367, "global_step": 11705, "epoch": 141} {"train_loss": -17.411970138549805, "global_step": 11706, "epoch": 141} {"train_loss": -17.60422134399414, "global_step": 11707, "epoch": 141} {"train_loss": -17.552392959594727, "global_step": 11708, "epoch": 141} {"train_loss": -17.456480026245117, "global_step": 11709, "epoch": 141} {"train_loss": -17.38747787475586, "global_step": 11710, "epoch": 141} {"train_loss": -17.632816314697266, "global_step": 11711, "epoch": 141} {"train_loss": -17.505054473876953, "global_step": 11712, "epoch": 141} {"train_loss": -17.94019317626953, "global_step": 11713, "epoch": 141} {"train_loss": -17.90457534790039, "global_step": 11714, "epoch": 141} {"train_loss": -18.004331588745117, "global_step": 11715, "epoch": 141} {"train_loss": -17.208507537841797, "global_step": 11716, "epoch": 141} {"train_loss": -17.294864654541016, "global_step": 11717, "epoch": 141} {"train_loss": -18.054372787475586, "global_step": 11718, "epoch": 141} {"train_loss": -17.932661056518555, "global_step": 11719, "epoch": 141} {"train_loss": -17.513019561767578, "global_step": 11720, "epoch": 141} {"train_loss": -17.582658767700195, "global_step": 11721, "epoch": 141} {"train_loss": -17.253009796142578, "global_step": 11722, "epoch": 141} {"train_loss": -17.463653564453125, "global_step": 11723, "epoch": 141} {"train_loss": -17.737960815429688, "global_step": 11724, "epoch": 141} {"train_loss": -17.663400650024414, "global_step": 11725, "epoch": 141} {"train_loss": -17.964399337768555, "global_step": 11726, "epoch": 141} {"train_loss": -17.447294235229492, "global_step": 11727, "epoch": 141} {"train_loss": -17.358707427978516, "global_step": 11728, "epoch": 141} {"train_loss": -18.010379791259766, "global_step": 11729, "epoch": 141} {"train_loss": -17.747875213623047, "global_step": 11730, "epoch": 141} {"train_loss": -17.91309928894043, "global_step": 11731, "epoch": 141} {"train_loss": -18.25990104675293, "global_step": 11732, "epoch": 141} {"train_loss": -17.50667953491211, "global_step": 11733, "epoch": 141} {"train_loss": -18.05695915222168, "global_step": 11734, "epoch": 141} {"train_loss": -17.394309997558594, "global_step": 11735, "epoch": 141} {"train_loss": -17.836820602416992, "global_step": 11736, "epoch": 141} {"train_loss": -17.669973373413086, "global_step": 11737, "epoch": 141} {"train_loss": -17.714447021484375, "global_step": 11738, "epoch": 141} {"train_loss": -18.03911781311035, "global_step": 11739, "epoch": 141} {"train_loss": -17.41981315612793, "global_step": 11740, "epoch": 141} {"train_loss": -17.743030548095703, "global_step": 11741, "epoch": 141} {"train_loss": -17.763214111328125, "global_step": 11742, "epoch": 141} {"train_loss": -17.664587020874023, "global_step": 11743, "epoch": 141} {"train_loss": -18.17352294921875, "global_step": 11744, "epoch": 141} {"train_loss": -18.072885513305664, "global_step": 11745, "epoch": 141} {"train_loss": -17.99496841430664, "global_step": 11746, "epoch": 141} {"train_loss": -17.724075317382812, "global_step": 11747, "epoch": 141} {"train_loss": -17.646745681762695, "global_step": 11748, "epoch": 141} {"train_loss": -17.59800910949707, "global_step": 11749, "epoch": 141} {"train_loss": -18.16159439086914, "global_step": 11750, "epoch": 141} {"train_loss": -17.74393653869629, "global_step": 11751, "epoch": 141} {"train_loss": -17.938953399658203, "global_step": 11752, "epoch": 141} {"train_loss": -17.495548248291016, "global_step": 11753, "epoch": 141} {"train_loss": -17.800926208496094, "global_step": 11754, "epoch": 141} {"train_loss": -17.806352615356445, "global_step": 11755, "epoch": 141} {"train_loss": -18.26181411743164, "global_step": 11756, "epoch": 141} {"train_loss": -17.722951889038086, "global_step": 11757, "epoch": 141} {"train_loss": -17.87906265258789, "global_step": 11758, "epoch": 141} {"train_loss": -17.776870727539062, "global_step": 11759, "epoch": 141} {"train_loss": -17.885953903198242, "global_step": 11760, "epoch": 141} {"train_loss": -17.852169036865234, "global_step": 11761, "epoch": 141} {"train_loss": -18.123706817626953, "global_step": 11762, "epoch": 141} {"train_loss": -17.9222469329834, "global_step": 11763, "epoch": 141} {"train_loss": -17.597497940063477, "global_step": 11764, "epoch": 141} {"train_loss": -17.562349319458008, "global_step": 11765, "epoch": 141} {"train_loss": -18.062856674194336, "global_step": 11766, "epoch": 141} {"train_loss": -17.688858032226562, "global_step": 11767, "epoch": 141} {"train_loss": -17.55965232849121, "global_step": 11768, "epoch": 141} {"train_loss": -17.537023544311523, "global_step": 11769, "epoch": 141} {"train_loss": -17.90298843383789, "global_step": 11770, "epoch": 141} {"train_loss": -17.573139190673828, "global_step": 11771, "epoch": 141} {"train_loss": -18.030973434448242, "global_step": 11772, "epoch": 141} {"train_loss": -17.84345054626465, "global_step": 11773, "epoch": 141} {"train_loss": -17.85871696472168, "global_step": 11774, "epoch": 141} {"train_loss": -17.55512046813965, "global_step": 11775, "epoch": 141} {"train_loss": -17.661455154418945, "global_step": 11776, "epoch": 141} {"train_loss": -17.9212589263916, "global_step": 11777, "epoch": 141} {"train_loss": -17.864727020263672, "global_step": 11778, "epoch": 141} {"train_loss": -17.829702377319336, "global_step": 11779, "epoch": 141} {"train_loss": -18.06772232055664, "global_step": 11780, "epoch": 141} {"train_loss": -17.546192169189453, "global_step": 11781, "epoch": 141} {"train_loss": -18.234689712524414, "global_step": 11782, "epoch": 141} {"train_loss": -17.982633590698242, "global_step": 11783, "epoch": 141} {"train_loss": -17.865827560424805, "global_step": 11784, "epoch": 141} {"train_loss": -17.756580490663826, "global_step": 11785, "epoch": 141, "val_loss": 6222441.0} {"train_loss": -17.174575805664062, "global_step": 11786, "epoch": 142} {"train_loss": -17.390743255615234, "global_step": 11787, "epoch": 142} {"train_loss": -17.7020206451416, "global_step": 11788, "epoch": 142} {"train_loss": -17.457929611206055, "global_step": 11789, "epoch": 142} {"train_loss": -17.56976890563965, "global_step": 11790, "epoch": 142} {"train_loss": -17.652236938476562, "global_step": 11791, "epoch": 142} {"train_loss": -17.68546485900879, "global_step": 11792, "epoch": 142} {"train_loss": -17.347211837768555, "global_step": 11793, "epoch": 142} {"train_loss": -17.836811065673828, "global_step": 11794, "epoch": 142} {"train_loss": -18.266071319580078, "global_step": 11795, "epoch": 142} {"train_loss": -17.582712173461914, "global_step": 11796, "epoch": 142} {"train_loss": -17.442401885986328, "global_step": 11797, "epoch": 142} {"train_loss": -17.68663215637207, "global_step": 11798, "epoch": 142} {"train_loss": -17.8757266998291, "global_step": 11799, "epoch": 142} {"train_loss": -17.985050201416016, "global_step": 11800, "epoch": 142} {"train_loss": -17.371747970581055, "global_step": 11801, "epoch": 142} {"train_loss": -18.04555320739746, "global_step": 11802, "epoch": 142} {"train_loss": -17.95894432067871, "global_step": 11803, "epoch": 142} {"train_loss": -17.61188316345215, "global_step": 11804, "epoch": 142} {"train_loss": -17.79972267150879, "global_step": 11805, "epoch": 142} {"train_loss": -18.00051498413086, "global_step": 11806, "epoch": 142} {"train_loss": -17.655445098876953, "global_step": 11807, "epoch": 142} {"train_loss": -17.38567543029785, "global_step": 11808, "epoch": 142} {"train_loss": -17.753644943237305, "global_step": 11809, "epoch": 142} {"train_loss": -17.794160842895508, "global_step": 11810, "epoch": 142} {"train_loss": -17.214628219604492, "global_step": 11811, "epoch": 142} {"train_loss": -18.093399047851562, "global_step": 11812, "epoch": 142} {"train_loss": -17.914417266845703, "global_step": 11813, "epoch": 142} {"train_loss": -17.474140167236328, "global_step": 11814, "epoch": 142} {"train_loss": -18.073392868041992, "global_step": 11815, "epoch": 142} {"train_loss": -17.84558868408203, "global_step": 11816, "epoch": 142} {"train_loss": -17.427125930786133, "global_step": 11817, "epoch": 142} {"train_loss": -17.949390411376953, "global_step": 11818, "epoch": 142} {"train_loss": -17.6093692779541, "global_step": 11819, "epoch": 142} {"train_loss": -18.060331344604492, "global_step": 11820, "epoch": 142} {"train_loss": -17.505096435546875, "global_step": 11821, "epoch": 142} {"train_loss": -18.32502555847168, "global_step": 11822, "epoch": 142} {"train_loss": -17.91281509399414, "global_step": 11823, "epoch": 142} {"train_loss": -17.942964553833008, "global_step": 11824, "epoch": 142} {"train_loss": -17.78046989440918, "global_step": 11825, "epoch": 142} {"train_loss": -17.724578857421875, "global_step": 11826, "epoch": 142} {"train_loss": -17.752893447875977, "global_step": 11827, "epoch": 142} {"train_loss": -17.524457931518555, "global_step": 11828, "epoch": 142} {"train_loss": -18.191478729248047, "global_step": 11829, "epoch": 142} {"train_loss": -18.06574821472168, "global_step": 11830, "epoch": 142} {"train_loss": -18.107887268066406, "global_step": 11831, "epoch": 142} {"train_loss": -17.782529830932617, "global_step": 11832, "epoch": 142} {"train_loss": -18.039052963256836, "global_step": 11833, "epoch": 142} {"train_loss": -17.9720458984375, "global_step": 11834, "epoch": 142} {"train_loss": -17.4658203125, "global_step": 11835, "epoch": 142} {"train_loss": -17.66693687438965, "global_step": 11836, "epoch": 142} {"train_loss": -17.504615783691406, "global_step": 11837, "epoch": 142} {"train_loss": -18.19904899597168, "global_step": 11838, "epoch": 142} {"train_loss": -17.74256706237793, "global_step": 11839, "epoch": 142} {"train_loss": -17.914968490600586, "global_step": 11840, "epoch": 142} {"train_loss": -17.8483943939209, "global_step": 11841, "epoch": 142} {"train_loss": -17.940998077392578, "global_step": 11842, "epoch": 142} {"train_loss": -17.47296142578125, "global_step": 11843, "epoch": 142} {"train_loss": -17.714462280273438, "global_step": 11844, "epoch": 142} {"train_loss": -17.768245697021484, "global_step": 11845, "epoch": 142} {"train_loss": -18.038541793823242, "global_step": 11846, "epoch": 142} {"train_loss": -17.85658073425293, "global_step": 11847, "epoch": 142} {"train_loss": -17.498214721679688, "global_step": 11848, "epoch": 142} {"train_loss": -17.513792037963867, "global_step": 11849, "epoch": 142} {"train_loss": -18.163698196411133, "global_step": 11850, "epoch": 142} {"train_loss": -17.954877853393555, "global_step": 11851, "epoch": 142} {"train_loss": -17.833099365234375, "global_step": 11852, "epoch": 142} {"train_loss": -17.652271270751953, "global_step": 11853, "epoch": 142} {"train_loss": -17.90094757080078, "global_step": 11854, "epoch": 142} {"train_loss": -17.70265769958496, "global_step": 11855, "epoch": 142} {"train_loss": -17.775495529174805, "global_step": 11856, "epoch": 142} {"train_loss": -17.739805221557617, "global_step": 11857, "epoch": 142} {"train_loss": -17.85197639465332, "global_step": 11858, "epoch": 142} {"train_loss": -17.866817474365234, "global_step": 11859, "epoch": 142} {"train_loss": -18.586811065673828, "global_step": 11860, "epoch": 142} {"train_loss": -17.965190887451172, "global_step": 11861, "epoch": 142} {"train_loss": -18.20686149597168, "global_step": 11862, "epoch": 142} {"train_loss": -17.5694637298584, "global_step": 11863, "epoch": 142} {"train_loss": -17.953882217407227, "global_step": 11864, "epoch": 142} {"train_loss": -18.015295028686523, "global_step": 11865, "epoch": 142} {"train_loss": -17.727006912231445, "global_step": 11866, "epoch": 142} {"train_loss": -17.798940658569336, "global_step": 11867, "epoch": 142} {"train_loss": -17.767666138798358, "global_step": 11868, "epoch": 142, "val_loss": 6390110.5} {"train_loss": -17.080686569213867, "global_step": 11869, "epoch": 143} {"train_loss": -17.979007720947266, "global_step": 11870, "epoch": 143} {"train_loss": -17.291400909423828, "global_step": 11871, "epoch": 143} {"train_loss": -17.19817543029785, "global_step": 11872, "epoch": 143} {"train_loss": -17.88816261291504, "global_step": 11873, "epoch": 143} {"train_loss": -17.680551528930664, "global_step": 11874, "epoch": 143} {"train_loss": -17.572965621948242, "global_step": 11875, "epoch": 143} {"train_loss": -17.97756004333496, "global_step": 11876, "epoch": 143} {"train_loss": -17.02894401550293, "global_step": 11877, "epoch": 143} {"train_loss": -17.646488189697266, "global_step": 11878, "epoch": 143} {"train_loss": -17.67374038696289, "global_step": 11879, "epoch": 143} {"train_loss": -17.46099853515625, "global_step": 11880, "epoch": 143} {"train_loss": -17.892776489257812, "global_step": 11881, "epoch": 143} {"train_loss": -17.802209854125977, "global_step": 11882, "epoch": 143} {"train_loss": -17.740863800048828, "global_step": 11883, "epoch": 143} {"train_loss": -17.72515869140625, "global_step": 11884, "epoch": 143} {"train_loss": -17.70842933654785, "global_step": 11885, "epoch": 143} {"train_loss": -17.416913986206055, "global_step": 11886, "epoch": 143} {"train_loss": -18.393285751342773, "global_step": 11887, "epoch": 143} {"train_loss": -18.00763511657715, "global_step": 11888, "epoch": 143} {"train_loss": -17.48272132873535, "global_step": 11889, "epoch": 143} {"train_loss": -17.656423568725586, "global_step": 11890, "epoch": 143} {"train_loss": -17.838058471679688, "global_step": 11891, "epoch": 143} {"train_loss": -17.586978912353516, "global_step": 11892, "epoch": 143} {"train_loss": -17.926021575927734, "global_step": 11893, "epoch": 143} {"train_loss": -17.71940803527832, "global_step": 11894, "epoch": 143} {"train_loss": -17.698514938354492, "global_step": 11895, "epoch": 143} {"train_loss": -17.602996826171875, "global_step": 11896, "epoch": 143} {"train_loss": -17.737226486206055, "global_step": 11897, "epoch": 143} {"train_loss": -17.99899673461914, "global_step": 11898, "epoch": 143} {"train_loss": -17.87127685546875, "global_step": 11899, "epoch": 143} {"train_loss": -17.841796875, "global_step": 11900, "epoch": 143} {"train_loss": -17.9056396484375, "global_step": 11901, "epoch": 143} {"train_loss": -17.4320068359375, "global_step": 11902, "epoch": 143} {"train_loss": -17.617549896240234, "global_step": 11903, "epoch": 143} {"train_loss": -17.930362701416016, "global_step": 11904, "epoch": 143} {"train_loss": -18.115249633789062, "global_step": 11905, "epoch": 143} {"train_loss": -17.763750076293945, "global_step": 11906, "epoch": 143} {"train_loss": -18.061620712280273, "global_step": 11907, "epoch": 143} {"train_loss": -18.11396598815918, "global_step": 11908, "epoch": 143} {"train_loss": -17.973608016967773, "global_step": 11909, "epoch": 143} {"train_loss": -17.856369018554688, "global_step": 11910, "epoch": 143} {"train_loss": -17.638967514038086, "global_step": 11911, "epoch": 143} {"train_loss": -18.083236694335938, "global_step": 11912, "epoch": 143} {"train_loss": -17.46695327758789, "global_step": 11913, "epoch": 143} {"train_loss": -18.044673919677734, "global_step": 11914, "epoch": 143} {"train_loss": -17.7637996673584, "global_step": 11915, "epoch": 143} {"train_loss": -17.504009246826172, "global_step": 11916, "epoch": 143} {"train_loss": -17.72089195251465, "global_step": 11917, "epoch": 143} {"train_loss": -18.001224517822266, "global_step": 11918, "epoch": 143} {"train_loss": -17.974781036376953, "global_step": 11919, "epoch": 143} {"train_loss": -17.58247184753418, "global_step": 11920, "epoch": 143} {"train_loss": -17.964801788330078, "global_step": 11921, "epoch": 143} {"train_loss": -17.816686630249023, "global_step": 11922, "epoch": 143} {"train_loss": -18.016326904296875, "global_step": 11923, "epoch": 143} {"train_loss": -17.548803329467773, "global_step": 11924, "epoch": 143} {"train_loss": -17.661808013916016, "global_step": 11925, "epoch": 143} {"train_loss": -17.133872985839844, "global_step": 11926, "epoch": 143} {"train_loss": -18.096384048461914, "global_step": 11927, "epoch": 143} {"train_loss": -17.81954002380371, "global_step": 11928, "epoch": 143} {"train_loss": -17.913732528686523, "global_step": 11929, "epoch": 143} {"train_loss": -18.428205490112305, "global_step": 11930, "epoch": 143} {"train_loss": -18.045053482055664, "global_step": 11931, "epoch": 143} {"train_loss": -17.90437889099121, "global_step": 11932, "epoch": 143} {"train_loss": -18.025854110717773, "global_step": 11933, "epoch": 143} {"train_loss": -17.820505142211914, "global_step": 11934, "epoch": 143} {"train_loss": -17.5938777923584, "global_step": 11935, "epoch": 143} {"train_loss": -18.152769088745117, "global_step": 11936, "epoch": 143} {"train_loss": -17.840944290161133, "global_step": 11937, "epoch": 143} {"train_loss": -18.130210876464844, "global_step": 11938, "epoch": 143} {"train_loss": -17.76142692565918, "global_step": 11939, "epoch": 143} {"train_loss": -17.90631866455078, "global_step": 11940, "epoch": 143} {"train_loss": -17.995412826538086, "global_step": 11941, "epoch": 143} {"train_loss": -18.08775520324707, "global_step": 11942, "epoch": 143} {"train_loss": -17.75680923461914, "global_step": 11943, "epoch": 143} {"train_loss": -17.93212127685547, "global_step": 11944, "epoch": 143} {"train_loss": -18.039682388305664, "global_step": 11945, "epoch": 143} {"train_loss": -18.223575592041016, "global_step": 11946, "epoch": 143} {"train_loss": -17.71195411682129, "global_step": 11947, "epoch": 143} {"train_loss": -17.595975875854492, "global_step": 11948, "epoch": 143} {"train_loss": -17.84271812438965, "global_step": 11949, "epoch": 143} {"train_loss": -17.934412002563477, "global_step": 11950, "epoch": 143} {"train_loss": -17.79914883533156, "global_step": 11951, "epoch": 143, "val_loss": 6297672.0} {"train_loss": -17.753522872924805, "global_step": 11952, "epoch": 144} {"train_loss": -17.83084487915039, "global_step": 11953, "epoch": 144} {"train_loss": -17.635848999023438, "global_step": 11954, "epoch": 144} {"train_loss": -17.914793014526367, "global_step": 11955, "epoch": 144} {"train_loss": -17.919227600097656, "global_step": 11956, "epoch": 144} {"train_loss": -17.772432327270508, "global_step": 11957, "epoch": 144} {"train_loss": -17.67987823486328, "global_step": 11958, "epoch": 144} {"train_loss": -17.52608299255371, "global_step": 11959, "epoch": 144} {"train_loss": -18.0582332611084, "global_step": 11960, "epoch": 144} {"train_loss": -17.945144653320312, "global_step": 11961, "epoch": 144} {"train_loss": -17.7435359954834, "global_step": 11962, "epoch": 144} {"train_loss": -17.860923767089844, "global_step": 11963, "epoch": 144} {"train_loss": -17.720905303955078, "global_step": 11964, "epoch": 144} {"train_loss": -17.995481491088867, "global_step": 11965, "epoch": 144} {"train_loss": -17.98586082458496, "global_step": 11966, "epoch": 144} {"train_loss": -17.774404525756836, "global_step": 11967, "epoch": 144} {"train_loss": -17.79198455810547, "global_step": 11968, "epoch": 144} {"train_loss": -18.208820343017578, "global_step": 11969, "epoch": 144} {"train_loss": -17.8143367767334, "global_step": 11970, "epoch": 144} {"train_loss": -17.677698135375977, "global_step": 11971, "epoch": 144} {"train_loss": -17.581146240234375, "global_step": 11972, "epoch": 144} {"train_loss": -17.601537704467773, "global_step": 11973, "epoch": 144} {"train_loss": -17.460309982299805, "global_step": 11974, "epoch": 144} {"train_loss": -18.094812393188477, "global_step": 11975, "epoch": 144} {"train_loss": -18.190683364868164, "global_step": 11976, "epoch": 144} {"train_loss": -17.631637573242188, "global_step": 11977, "epoch": 144} {"train_loss": -17.909364700317383, "global_step": 11978, "epoch": 144} {"train_loss": -17.833927154541016, "global_step": 11979, "epoch": 144} {"train_loss": -17.792682647705078, "global_step": 11980, "epoch": 144} {"train_loss": -18.23290252685547, "global_step": 11981, "epoch": 144} {"train_loss": -18.062210083007812, "global_step": 11982, "epoch": 144} {"train_loss": -17.816129684448242, "global_step": 11983, "epoch": 144} {"train_loss": -17.60211181640625, "global_step": 11984, "epoch": 144} {"train_loss": -18.042064666748047, "global_step": 11985, "epoch": 144} {"train_loss": -18.087554931640625, "global_step": 11986, "epoch": 144} {"train_loss": -18.133474349975586, "global_step": 11987, "epoch": 144} {"train_loss": -18.03118324279785, "global_step": 11988, "epoch": 144} {"train_loss": -17.610471725463867, "global_step": 11989, "epoch": 144} {"train_loss": -17.66739845275879, "global_step": 11990, "epoch": 144} {"train_loss": -18.15778923034668, "global_step": 11991, "epoch": 144} {"train_loss": -17.802915573120117, "global_step": 11992, "epoch": 144} {"train_loss": -17.775775909423828, "global_step": 11993, "epoch": 144} {"train_loss": -17.662208557128906, "global_step": 11994, "epoch": 144} {"train_loss": -17.9353084564209, "global_step": 11995, "epoch": 144} {"train_loss": -17.682636260986328, "global_step": 11996, "epoch": 144} {"train_loss": -17.98703384399414, "global_step": 11997, "epoch": 144} {"train_loss": -18.065982818603516, "global_step": 11998, "epoch": 144} {"train_loss": -18.091928482055664, "global_step": 11999, "epoch": 144} {"train_loss": -18.023775100708008, "global_step": 12000, "epoch": 144} {"train_loss": -17.634191513061523, "global_step": 12001, "epoch": 144} {"train_loss": -18.025066375732422, "global_step": 12002, "epoch": 144} {"train_loss": -17.798603057861328, "global_step": 12003, "epoch": 144} {"train_loss": -17.801345825195312, "global_step": 12004, "epoch": 144} {"train_loss": -17.8095645904541, "global_step": 12005, "epoch": 144} {"train_loss": -17.91126823425293, "global_step": 12006, "epoch": 144} {"train_loss": -17.76080894470215, "global_step": 12007, "epoch": 144} {"train_loss": -17.641239166259766, "global_step": 12008, "epoch": 144} {"train_loss": -17.963552474975586, "global_step": 12009, "epoch": 144} {"train_loss": -17.488658905029297, "global_step": 12010, "epoch": 144} {"train_loss": -18.06479835510254, "global_step": 12011, "epoch": 144} {"train_loss": -17.777021408081055, "global_step": 12012, "epoch": 144} {"train_loss": -17.61763572692871, "global_step": 12013, "epoch": 144} {"train_loss": -17.73003578186035, "global_step": 12014, "epoch": 144} {"train_loss": -17.726234436035156, "global_step": 12015, "epoch": 144} {"train_loss": -17.559133529663086, "global_step": 12016, "epoch": 144} {"train_loss": -17.714061737060547, "global_step": 12017, "epoch": 144} {"train_loss": -17.819416046142578, "global_step": 12018, "epoch": 144} {"train_loss": -18.06353187561035, "global_step": 12019, "epoch": 144} {"train_loss": -17.542821884155273, "global_step": 12020, "epoch": 144} {"train_loss": -17.79587173461914, "global_step": 12021, "epoch": 144} {"train_loss": -17.779417037963867, "global_step": 12022, "epoch": 144} {"train_loss": -17.808740615844727, "global_step": 12023, "epoch": 144} {"train_loss": -17.726049423217773, "global_step": 12024, "epoch": 144} {"train_loss": -17.766550064086914, "global_step": 12025, "epoch": 144} {"train_loss": -17.969743728637695, "global_step": 12026, "epoch": 144} {"train_loss": -17.63530158996582, "global_step": 12027, "epoch": 144} {"train_loss": -18.160673141479492, "global_step": 12028, "epoch": 144} {"train_loss": -17.8986873626709, "global_step": 12029, "epoch": 144} {"train_loss": -17.236865997314453, "global_step": 12030, "epoch": 144} {"train_loss": -17.84181022644043, "global_step": 12031, "epoch": 144} {"train_loss": -17.6685791015625, "global_step": 12032, "epoch": 144} {"train_loss": -17.33431053161621, "global_step": 12033, "epoch": 144} {"train_loss": -17.824266640536756, "global_step": 12034, "epoch": 144, "val_loss": 6310730.0} {"train_loss": -17.532411575317383, "global_step": 12035, "epoch": 145} {"train_loss": -17.263168334960938, "global_step": 12036, "epoch": 145} {"train_loss": -17.727970123291016, "global_step": 12037, "epoch": 145} {"train_loss": -17.228174209594727, "global_step": 12038, "epoch": 145} {"train_loss": -17.70840072631836, "global_step": 12039, "epoch": 145} {"train_loss": -17.637685775756836, "global_step": 12040, "epoch": 145} {"train_loss": -17.586048126220703, "global_step": 12041, "epoch": 145} {"train_loss": -17.25594139099121, "global_step": 12042, "epoch": 145} {"train_loss": -17.6697998046875, "global_step": 12043, "epoch": 145} {"train_loss": -17.59809684753418, "global_step": 12044, "epoch": 145} {"train_loss": -17.549758911132812, "global_step": 12045, "epoch": 145} {"train_loss": -18.03831672668457, "global_step": 12046, "epoch": 145} {"train_loss": -17.72144889831543, "global_step": 12047, "epoch": 145} {"train_loss": -17.35530662536621, "global_step": 12048, "epoch": 145} {"train_loss": -17.74217987060547, "global_step": 12049, "epoch": 145} {"train_loss": -17.665708541870117, "global_step": 12050, "epoch": 145} {"train_loss": -17.75104331970215, "global_step": 12051, "epoch": 145} {"train_loss": -17.796337127685547, "global_step": 12052, "epoch": 145} {"train_loss": -17.41438102722168, "global_step": 12053, "epoch": 145} {"train_loss": -17.933252334594727, "global_step": 12054, "epoch": 145} {"train_loss": -17.663082122802734, "global_step": 12055, "epoch": 145} {"train_loss": -17.30173110961914, "global_step": 12056, "epoch": 145} {"train_loss": -17.582233428955078, "global_step": 12057, "epoch": 145} {"train_loss": -17.829294204711914, "global_step": 12058, "epoch": 145} {"train_loss": -18.048282623291016, "global_step": 12059, "epoch": 145} {"train_loss": -17.374547958374023, "global_step": 12060, "epoch": 145} {"train_loss": -17.986541748046875, "global_step": 12061, "epoch": 145} {"train_loss": -17.823898315429688, "global_step": 12062, "epoch": 145} {"train_loss": -17.774600982666016, "global_step": 12063, "epoch": 145} {"train_loss": -17.820880889892578, "global_step": 12064, "epoch": 145} {"train_loss": -17.71200942993164, "global_step": 12065, "epoch": 145} {"train_loss": -17.97632598876953, "global_step": 12066, "epoch": 145} {"train_loss": -17.79850959777832, "global_step": 12067, "epoch": 145} {"train_loss": -18.06039810180664, "global_step": 12068, "epoch": 145} {"train_loss": -17.92311668395996, "global_step": 12069, "epoch": 145} {"train_loss": -17.784154891967773, "global_step": 12070, "epoch": 145} {"train_loss": -17.711774826049805, "global_step": 12071, "epoch": 145} {"train_loss": -17.92338752746582, "global_step": 12072, "epoch": 145} {"train_loss": -18.07107925415039, "global_step": 12073, "epoch": 145} {"train_loss": -17.62923240661621, "global_step": 12074, "epoch": 145} {"train_loss": -17.642292022705078, "global_step": 12075, "epoch": 145} {"train_loss": -17.880172729492188, "global_step": 12076, "epoch": 145} {"train_loss": -17.72159767150879, "global_step": 12077, "epoch": 145} {"train_loss": -18.021833419799805, "global_step": 12078, "epoch": 145} {"train_loss": -17.526687622070312, "global_step": 12079, "epoch": 145} {"train_loss": -18.032474517822266, "global_step": 12080, "epoch": 145} {"train_loss": -18.44788932800293, "global_step": 12081, "epoch": 145} {"train_loss": -17.476287841796875, "global_step": 12082, "epoch": 145} {"train_loss": -18.453046798706055, "global_step": 12083, "epoch": 145} {"train_loss": -17.840721130371094, "global_step": 12084, "epoch": 145} {"train_loss": -17.796472549438477, "global_step": 12085, "epoch": 145} {"train_loss": -17.8931941986084, "global_step": 12086, "epoch": 145} {"train_loss": -17.941577911376953, "global_step": 12087, "epoch": 145} {"train_loss": -17.967071533203125, "global_step": 12088, "epoch": 145} {"train_loss": -18.008888244628906, "global_step": 12089, "epoch": 145} {"train_loss": -18.243732452392578, "global_step": 12090, "epoch": 145} {"train_loss": -17.690946578979492, "global_step": 12091, "epoch": 145} {"train_loss": -17.812074661254883, "global_step": 12092, "epoch": 145} {"train_loss": -17.926280975341797, "global_step": 12093, "epoch": 145} {"train_loss": -18.132022857666016, "global_step": 12094, "epoch": 145} {"train_loss": -17.69145393371582, "global_step": 12095, "epoch": 145} {"train_loss": -18.49311637878418, "global_step": 12096, "epoch": 145} {"train_loss": -17.718137741088867, "global_step": 12097, "epoch": 145} {"train_loss": -17.907114028930664, "global_step": 12098, "epoch": 145} {"train_loss": -17.905622482299805, "global_step": 12099, "epoch": 145} {"train_loss": -17.668853759765625, "global_step": 12100, "epoch": 145} {"train_loss": -17.421812057495117, "global_step": 12101, "epoch": 145} {"train_loss": -17.89767837524414, "global_step": 12102, "epoch": 145} {"train_loss": -18.089475631713867, "global_step": 12103, "epoch": 145} {"train_loss": -17.800771713256836, "global_step": 12104, "epoch": 145} {"train_loss": -18.02853012084961, "global_step": 12105, "epoch": 145} {"train_loss": -17.543380737304688, "global_step": 12106, "epoch": 145} {"train_loss": -17.946714401245117, "global_step": 12107, "epoch": 145} {"train_loss": -17.60125732421875, "global_step": 12108, "epoch": 145} {"train_loss": -18.005308151245117, "global_step": 12109, "epoch": 145} {"train_loss": -17.832677841186523, "global_step": 12110, "epoch": 145} {"train_loss": -18.102706909179688, "global_step": 12111, "epoch": 145} {"train_loss": -17.646909713745117, "global_step": 12112, "epoch": 145} {"train_loss": -17.75156593322754, "global_step": 12113, "epoch": 145} {"train_loss": -17.953857421875, "global_step": 12114, "epoch": 145} {"train_loss": -17.94748878479004, "global_step": 12115, "epoch": 145} {"train_loss": -17.843856811523438, "global_step": 12116, "epoch": 145} {"train_loss": -17.806231257427168, "global_step": 12117, "epoch": 145, "val_loss": 6037252.5} {"train_loss": -17.764328002929688, "global_step": 12118, "epoch": 146} {"train_loss": -17.859228134155273, "global_step": 12119, "epoch": 146} {"train_loss": -17.722166061401367, "global_step": 12120, "epoch": 146} {"train_loss": -17.915266036987305, "global_step": 12121, "epoch": 146} {"train_loss": -18.374258041381836, "global_step": 12122, "epoch": 146} {"train_loss": -17.6859130859375, "global_step": 12123, "epoch": 146} {"train_loss": -17.98853874206543, "global_step": 12124, "epoch": 146} {"train_loss": -18.276792526245117, "global_step": 12125, "epoch": 146} {"train_loss": -17.736053466796875, "global_step": 12126, "epoch": 146} {"train_loss": -17.98915672302246, "global_step": 12127, "epoch": 146} {"train_loss": -17.627471923828125, "global_step": 12128, "epoch": 146} {"train_loss": -17.693647384643555, "global_step": 12129, "epoch": 146} {"train_loss": -17.539352416992188, "global_step": 12130, "epoch": 146} {"train_loss": -17.79695701599121, "global_step": 12131, "epoch": 146} {"train_loss": -17.764102935791016, "global_step": 12132, "epoch": 146} {"train_loss": -17.87278938293457, "global_step": 12133, "epoch": 146} {"train_loss": -17.905149459838867, "global_step": 12134, "epoch": 146} {"train_loss": -17.55792999267578, "global_step": 12135, "epoch": 146} {"train_loss": -17.498802185058594, "global_step": 12136, "epoch": 146} {"train_loss": -17.918426513671875, "global_step": 12137, "epoch": 146} {"train_loss": -18.317461013793945, "global_step": 12138, "epoch": 146} {"train_loss": -17.683942794799805, "global_step": 12139, "epoch": 146} {"train_loss": -17.410602569580078, "global_step": 12140, "epoch": 146} {"train_loss": -18.197233200073242, "global_step": 12141, "epoch": 146} {"train_loss": -17.98615837097168, "global_step": 12142, "epoch": 146} {"train_loss": -18.098581314086914, "global_step": 12143, "epoch": 146} {"train_loss": -17.908353805541992, "global_step": 12144, "epoch": 146} {"train_loss": -17.663394927978516, "global_step": 12145, "epoch": 146} {"train_loss": -17.828161239624023, "global_step": 12146, "epoch": 146} {"train_loss": -17.922103881835938, "global_step": 12147, "epoch": 146} {"train_loss": -18.03224754333496, "global_step": 12148, "epoch": 146} {"train_loss": -17.9299259185791, "global_step": 12149, "epoch": 146} {"train_loss": -17.627790451049805, "global_step": 12150, "epoch": 146} {"train_loss": -17.97774314880371, "global_step": 12151, "epoch": 146} {"train_loss": -17.588163375854492, "global_step": 12152, "epoch": 146} {"train_loss": -17.808246612548828, "global_step": 12153, "epoch": 146} {"train_loss": -17.9594783782959, "global_step": 12154, "epoch": 146} {"train_loss": -17.821779251098633, "global_step": 12155, "epoch": 146} {"train_loss": -18.135385513305664, "global_step": 12156, "epoch": 146} {"train_loss": -17.970340728759766, "global_step": 12157, "epoch": 146} {"train_loss": -17.763263702392578, "global_step": 12158, "epoch": 146} {"train_loss": -17.6825008392334, "global_step": 12159, "epoch": 146} {"train_loss": -18.229469299316406, "global_step": 12160, "epoch": 146} {"train_loss": -17.91411590576172, "global_step": 12161, "epoch": 146} {"train_loss": -18.189329147338867, "global_step": 12162, "epoch": 146} {"train_loss": -17.695730209350586, "global_step": 12163, "epoch": 146} {"train_loss": -18.125337600708008, "global_step": 12164, "epoch": 146} {"train_loss": -17.913537979125977, "global_step": 12165, "epoch": 146} {"train_loss": -17.671798706054688, "global_step": 12166, "epoch": 146} {"train_loss": -17.80147361755371, "global_step": 12167, "epoch": 146} {"train_loss": -17.430130004882812, "global_step": 12168, "epoch": 146} {"train_loss": -17.59482192993164, "global_step": 12169, "epoch": 146} {"train_loss": -17.812000274658203, "global_step": 12170, "epoch": 146} {"train_loss": -17.7794246673584, "global_step": 12171, "epoch": 146} {"train_loss": -17.313871383666992, "global_step": 12172, "epoch": 146} {"train_loss": -17.987592697143555, "global_step": 12173, "epoch": 146} {"train_loss": -18.11704444885254, "global_step": 12174, "epoch": 146} {"train_loss": -17.871856689453125, "global_step": 12175, "epoch": 146} {"train_loss": -17.860654830932617, "global_step": 12176, "epoch": 146} {"train_loss": -17.85150718688965, "global_step": 12177, "epoch": 146} {"train_loss": -17.76679039001465, "global_step": 12178, "epoch": 146} {"train_loss": -18.011220932006836, "global_step": 12179, "epoch": 146} {"train_loss": -17.991256713867188, "global_step": 12180, "epoch": 146} {"train_loss": -17.52119255065918, "global_step": 12181, "epoch": 146} {"train_loss": -17.820831298828125, "global_step": 12182, "epoch": 146} {"train_loss": -17.676128387451172, "global_step": 12183, "epoch": 146} {"train_loss": -17.889005661010742, "global_step": 12184, "epoch": 146} {"train_loss": -17.67952537536621, "global_step": 12185, "epoch": 146} {"train_loss": -17.82442283630371, "global_step": 12186, "epoch": 146} {"train_loss": -17.98659324645996, "global_step": 12187, "epoch": 146} {"train_loss": -18.06519889831543, "global_step": 12188, "epoch": 146} {"train_loss": -17.743778228759766, "global_step": 12189, "epoch": 146} {"train_loss": -17.71462631225586, "global_step": 12190, "epoch": 146} {"train_loss": -17.649307250976562, "global_step": 12191, "epoch": 146} {"train_loss": -18.269214630126953, "global_step": 12192, "epoch": 146} {"train_loss": -17.883642196655273, "global_step": 12193, "epoch": 146} {"train_loss": -18.03706169128418, "global_step": 12194, "epoch": 146} {"train_loss": -17.59182357788086, "global_step": 12195, "epoch": 146} {"train_loss": -17.550642013549805, "global_step": 12196, "epoch": 146} {"train_loss": -18.312997817993164, "global_step": 12197, "epoch": 146} {"train_loss": -17.840667724609375, "global_step": 12198, "epoch": 146} {"train_loss": -17.68641471862793, "global_step": 12199, "epoch": 146} {"train_loss": -17.848377802285803, "global_step": 12200, "epoch": 146, "val_loss": 6112869.5} {"train_loss": -17.850671768188477, "global_step": 12201, "epoch": 147} {"train_loss": -17.3960018157959, "global_step": 12202, "epoch": 147} {"train_loss": -17.68923568725586, "global_step": 12203, "epoch": 147} {"train_loss": -17.743314743041992, "global_step": 12204, "epoch": 147} {"train_loss": -17.868549346923828, "global_step": 12205, "epoch": 147} {"train_loss": -17.615768432617188, "global_step": 12206, "epoch": 147} {"train_loss": -17.596847534179688, "global_step": 12207, "epoch": 147} {"train_loss": -17.864294052124023, "global_step": 12208, "epoch": 147} {"train_loss": -18.01692008972168, "global_step": 12209, "epoch": 147} {"train_loss": -18.080535888671875, "global_step": 12210, "epoch": 147} {"train_loss": -17.808393478393555, "global_step": 12211, "epoch": 147} {"train_loss": -17.378341674804688, "global_step": 12212, "epoch": 147} {"train_loss": -17.96016502380371, "global_step": 12213, "epoch": 147} {"train_loss": -18.195966720581055, "global_step": 12214, "epoch": 147} {"train_loss": -17.768163681030273, "global_step": 12215, "epoch": 147} {"train_loss": -17.43798828125, "global_step": 12216, "epoch": 147} {"train_loss": -17.92388343811035, "global_step": 12217, "epoch": 147} {"train_loss": -17.895246505737305, "global_step": 12218, "epoch": 147} {"train_loss": -18.061925888061523, "global_step": 12219, "epoch": 147} {"train_loss": -17.72767448425293, "global_step": 12220, "epoch": 147} {"train_loss": -17.816701889038086, "global_step": 12221, "epoch": 147} {"train_loss": -18.115528106689453, "global_step": 12222, "epoch": 147} {"train_loss": -17.922367095947266, "global_step": 12223, "epoch": 147} {"train_loss": -18.02503204345703, "global_step": 12224, "epoch": 147} {"train_loss": -17.7103328704834, "global_step": 12225, "epoch": 147} {"train_loss": -17.726428985595703, "global_step": 12226, "epoch": 147} {"train_loss": -18.107105255126953, "global_step": 12227, "epoch": 147} {"train_loss": -17.837818145751953, "global_step": 12228, "epoch": 147} {"train_loss": -17.76102066040039, "global_step": 12229, "epoch": 147} {"train_loss": -18.189924240112305, "global_step": 12230, "epoch": 147} {"train_loss": -17.10359001159668, "global_step": 12231, "epoch": 147} {"train_loss": -17.938013076782227, "global_step": 12232, "epoch": 147} {"train_loss": -17.74472427368164, "global_step": 12233, "epoch": 147} {"train_loss": -17.84893798828125, "global_step": 12234, "epoch": 147} {"train_loss": -17.946500778198242, "global_step": 12235, "epoch": 147} {"train_loss": -17.49846839904785, "global_step": 12236, "epoch": 147} {"train_loss": -18.112537384033203, "global_step": 12237, "epoch": 147} {"train_loss": -17.58126449584961, "global_step": 12238, "epoch": 147} {"train_loss": -17.7534122467041, "global_step": 12239, "epoch": 147} {"train_loss": -18.000009536743164, "global_step": 12240, "epoch": 147} {"train_loss": -17.67799186706543, "global_step": 12241, "epoch": 147} {"train_loss": -18.390989303588867, "global_step": 12242, "epoch": 147} {"train_loss": -18.25485610961914, "global_step": 12243, "epoch": 147} {"train_loss": -18.106416702270508, "global_step": 12244, "epoch": 147} {"train_loss": -18.031156539916992, "global_step": 12245, "epoch": 147} {"train_loss": -17.974430084228516, "global_step": 12246, "epoch": 147} {"train_loss": -18.27301597595215, "global_step": 12247, "epoch": 147} {"train_loss": -17.5261287689209, "global_step": 12248, "epoch": 147} {"train_loss": -17.37929344177246, "global_step": 12249, "epoch": 147} {"train_loss": -18.13802146911621, "global_step": 12250, "epoch": 147} {"train_loss": -17.8869686126709, "global_step": 12251, "epoch": 147} {"train_loss": -17.422483444213867, "global_step": 12252, "epoch": 147} {"train_loss": -17.82358169555664, "global_step": 12253, "epoch": 147} {"train_loss": -17.86503028869629, "global_step": 12254, "epoch": 147} {"train_loss": -17.893430709838867, "global_step": 12255, "epoch": 147} {"train_loss": -17.94191551208496, "global_step": 12256, "epoch": 147} {"train_loss": -17.857135772705078, "global_step": 12257, "epoch": 147} {"train_loss": -17.882226943969727, "global_step": 12258, "epoch": 147} {"train_loss": -18.35213279724121, "global_step": 12259, "epoch": 147} {"train_loss": -17.58385467529297, "global_step": 12260, "epoch": 147} {"train_loss": -17.92141342163086, "global_step": 12261, "epoch": 147} {"train_loss": -17.65730857849121, "global_step": 12262, "epoch": 147} {"train_loss": -18.11250877380371, "global_step": 12263, "epoch": 147} {"train_loss": -18.242782592773438, "global_step": 12264, "epoch": 147} {"train_loss": -17.665000915527344, "global_step": 12265, "epoch": 147} {"train_loss": -17.853090286254883, "global_step": 12266, "epoch": 147} {"train_loss": -17.815994262695312, "global_step": 12267, "epoch": 147} {"train_loss": -18.087003707885742, "global_step": 12268, "epoch": 147} {"train_loss": -18.017316818237305, "global_step": 12269, "epoch": 147} {"train_loss": -17.755229949951172, "global_step": 12270, "epoch": 147} {"train_loss": -18.208005905151367, "global_step": 12271, "epoch": 147} {"train_loss": -17.716171264648438, "global_step": 12272, "epoch": 147} {"train_loss": -17.65188980102539, "global_step": 12273, "epoch": 147} {"train_loss": -17.706510543823242, "global_step": 12274, "epoch": 147} {"train_loss": -17.568931579589844, "global_step": 12275, "epoch": 147} {"train_loss": -17.983049392700195, "global_step": 12276, "epoch": 147} {"train_loss": -17.477766036987305, "global_step": 12277, "epoch": 147} {"train_loss": -18.17229652404785, "global_step": 12278, "epoch": 147} {"train_loss": -17.77376365661621, "global_step": 12279, "epoch": 147} {"train_loss": -18.041051864624023, "global_step": 12280, "epoch": 147} {"train_loss": -17.953529357910156, "global_step": 12281, "epoch": 147} {"train_loss": -17.77542495727539, "global_step": 12282, "epoch": 147} {"train_loss": -17.845218934208514, "global_step": 12283, "epoch": 147, "val_loss": 6029102.5} {"train_loss": -17.806440353393555, "global_step": 12284, "epoch": 148} {"train_loss": -17.73084831237793, "global_step": 12285, "epoch": 148} {"train_loss": -17.46178436279297, "global_step": 12286, "epoch": 148} {"train_loss": -17.68962860107422, "global_step": 12287, "epoch": 148} {"train_loss": -18.047325134277344, "global_step": 12288, "epoch": 148} {"train_loss": -17.839128494262695, "global_step": 12289, "epoch": 148} {"train_loss": -17.975046157836914, "global_step": 12290, "epoch": 148} {"train_loss": -17.56976890563965, "global_step": 12291, "epoch": 148} {"train_loss": -17.70334815979004, "global_step": 12292, "epoch": 148} {"train_loss": -17.75510597229004, "global_step": 12293, "epoch": 148} {"train_loss": -17.1851806640625, "global_step": 12294, "epoch": 148} {"train_loss": -17.77191925048828, "global_step": 12295, "epoch": 148} {"train_loss": -17.649045944213867, "global_step": 12296, "epoch": 148} {"train_loss": -17.936506271362305, "global_step": 12297, "epoch": 148} {"train_loss": -17.779165267944336, "global_step": 12298, "epoch": 148} {"train_loss": -17.856382369995117, "global_step": 12299, "epoch": 148} {"train_loss": -17.672563552856445, "global_step": 12300, "epoch": 148} {"train_loss": -18.0319881439209, "global_step": 12301, "epoch": 148} {"train_loss": -18.14082145690918, "global_step": 12302, "epoch": 148} {"train_loss": -17.9510498046875, "global_step": 12303, "epoch": 148} {"train_loss": -17.522708892822266, "global_step": 12304, "epoch": 148} {"train_loss": -17.850385665893555, "global_step": 12305, "epoch": 148} {"train_loss": -18.130884170532227, "global_step": 12306, "epoch": 148} {"train_loss": -17.70773696899414, "global_step": 12307, "epoch": 148} {"train_loss": -17.917173385620117, "global_step": 12308, "epoch": 148} {"train_loss": -18.094541549682617, "global_step": 12309, "epoch": 148} {"train_loss": -18.162771224975586, "global_step": 12310, "epoch": 148} {"train_loss": -17.730640411376953, "global_step": 12311, "epoch": 148} {"train_loss": -17.517061233520508, "global_step": 12312, "epoch": 148} {"train_loss": -17.813398361206055, "global_step": 12313, "epoch": 148} {"train_loss": -17.674335479736328, "global_step": 12314, "epoch": 148} {"train_loss": -17.773569107055664, "global_step": 12315, "epoch": 148} {"train_loss": -17.740488052368164, "global_step": 12316, "epoch": 148} {"train_loss": -17.62538719177246, "global_step": 12317, "epoch": 148} {"train_loss": -18.019790649414062, "global_step": 12318, "epoch": 148} {"train_loss": -17.718143463134766, "global_step": 12319, "epoch": 148} {"train_loss": -18.01604652404785, "global_step": 12320, "epoch": 148} {"train_loss": -18.12877082824707, "global_step": 12321, "epoch": 148} {"train_loss": -18.007444381713867, "global_step": 12322, "epoch": 148} {"train_loss": -18.198598861694336, "global_step": 12323, "epoch": 148} {"train_loss": -17.98246192932129, "global_step": 12324, "epoch": 148} {"train_loss": -17.783405303955078, "global_step": 12325, "epoch": 148} {"train_loss": -17.927682876586914, "global_step": 12326, "epoch": 148} {"train_loss": -17.62714195251465, "global_step": 12327, "epoch": 148} {"train_loss": -17.8633975982666, "global_step": 12328, "epoch": 148} {"train_loss": -18.24186897277832, "global_step": 12329, "epoch": 148} {"train_loss": -18.017864227294922, "global_step": 12330, "epoch": 148} {"train_loss": -17.932580947875977, "global_step": 12331, "epoch": 148} {"train_loss": -17.801855087280273, "global_step": 12332, "epoch": 148} {"train_loss": -17.822494506835938, "global_step": 12333, "epoch": 148} {"train_loss": -18.153226852416992, "global_step": 12334, "epoch": 148} {"train_loss": -17.735370635986328, "global_step": 12335, "epoch": 148} {"train_loss": -17.782995223999023, "global_step": 12336, "epoch": 148} {"train_loss": -17.66839599609375, "global_step": 12337, "epoch": 148} {"train_loss": -17.9691162109375, "global_step": 12338, "epoch": 148} {"train_loss": -18.088451385498047, "global_step": 12339, "epoch": 148} {"train_loss": -18.144607543945312, "global_step": 12340, "epoch": 148} {"train_loss": -17.928266525268555, "global_step": 12341, "epoch": 148} {"train_loss": -17.915929794311523, "global_step": 12342, "epoch": 148} {"train_loss": -18.010587692260742, "global_step": 12343, "epoch": 148} {"train_loss": -18.261117935180664, "global_step": 12344, "epoch": 148} {"train_loss": -17.765199661254883, "global_step": 12345, "epoch": 148} {"train_loss": -17.811006546020508, "global_step": 12346, "epoch": 148} {"train_loss": -18.206369400024414, "global_step": 12347, "epoch": 148} {"train_loss": -17.906591415405273, "global_step": 12348, "epoch": 148} {"train_loss": -18.16506576538086, "global_step": 12349, "epoch": 148} {"train_loss": -17.692291259765625, "global_step": 12350, "epoch": 148} {"train_loss": -17.54949188232422, "global_step": 12351, "epoch": 148} {"train_loss": -18.286333084106445, "global_step": 12352, "epoch": 148} {"train_loss": -18.23006248474121, "global_step": 12353, "epoch": 148} {"train_loss": -17.550695419311523, "global_step": 12354, "epoch": 148} {"train_loss": -17.801042556762695, "global_step": 12355, "epoch": 148} {"train_loss": -17.99410057067871, "global_step": 12356, "epoch": 148} {"train_loss": -17.974512100219727, "global_step": 12357, "epoch": 148} {"train_loss": -17.80780029296875, "global_step": 12358, "epoch": 148} {"train_loss": -17.676620483398438, "global_step": 12359, "epoch": 148} {"train_loss": -17.74796485900879, "global_step": 12360, "epoch": 148} {"train_loss": -17.81978416442871, "global_step": 12361, "epoch": 148} {"train_loss": -18.108198165893555, "global_step": 12362, "epoch": 148} {"train_loss": -18.064043045043945, "global_step": 12363, "epoch": 148} {"train_loss": -17.985797882080078, "global_step": 12364, "epoch": 148} {"train_loss": -17.81110954284668, "global_step": 12365, "epoch": 148} {"train_loss": -17.886226194450654, "global_step": 12366, "epoch": 148, "val_loss": 5944297.0} {"train_loss": -17.356550216674805, "global_step": 12367, "epoch": 149} {"train_loss": -17.683013916015625, "global_step": 12368, "epoch": 149} {"train_loss": -17.567415237426758, "global_step": 12369, "epoch": 149} {"train_loss": -17.4703426361084, "global_step": 12370, "epoch": 149} {"train_loss": -17.691312789916992, "global_step": 12371, "epoch": 149} {"train_loss": -17.82469367980957, "global_step": 12372, "epoch": 149} {"train_loss": -17.702816009521484, "global_step": 12373, "epoch": 149} {"train_loss": -17.702478408813477, "global_step": 12374, "epoch": 149} {"train_loss": -17.610244750976562, "global_step": 12375, "epoch": 149} {"train_loss": -18.255834579467773, "global_step": 12376, "epoch": 149} {"train_loss": -17.698532104492188, "global_step": 12377, "epoch": 149} {"train_loss": -17.887819290161133, "global_step": 12378, "epoch": 149} {"train_loss": -17.432912826538086, "global_step": 12379, "epoch": 149} {"train_loss": -17.778711318969727, "global_step": 12380, "epoch": 149} {"train_loss": -17.74415397644043, "global_step": 12381, "epoch": 149} {"train_loss": -17.67365837097168, "global_step": 12382, "epoch": 149} {"train_loss": -17.809553146362305, "global_step": 12383, "epoch": 149} {"train_loss": -18.105926513671875, "global_step": 12384, "epoch": 149} {"train_loss": -17.348840713500977, "global_step": 12385, "epoch": 149} {"train_loss": -17.577056884765625, "global_step": 12386, "epoch": 149} {"train_loss": -18.070159912109375, "global_step": 12387, "epoch": 149} {"train_loss": -17.40470314025879, "global_step": 12388, "epoch": 149} {"train_loss": -17.588699340820312, "global_step": 12389, "epoch": 149} {"train_loss": -17.8343505859375, "global_step": 12390, "epoch": 149} {"train_loss": -17.646142959594727, "global_step": 12391, "epoch": 149} {"train_loss": -17.692859649658203, "global_step": 12392, "epoch": 149} {"train_loss": -17.721670150756836, "global_step": 12393, "epoch": 149} {"train_loss": -17.715864181518555, "global_step": 12394, "epoch": 149} {"train_loss": -17.946714401245117, "global_step": 12395, "epoch": 149} {"train_loss": -17.885778427124023, "global_step": 12396, "epoch": 149} {"train_loss": -17.455806732177734, "global_step": 12397, "epoch": 149} {"train_loss": -18.022506713867188, "global_step": 12398, "epoch": 149} {"train_loss": -17.636489868164062, "global_step": 12399, "epoch": 149} {"train_loss": -17.9377498626709, "global_step": 12400, "epoch": 149} {"train_loss": -17.636091232299805, "global_step": 12401, "epoch": 149} {"train_loss": -18.24997901916504, "global_step": 12402, "epoch": 149} {"train_loss": -18.101749420166016, "global_step": 12403, "epoch": 149} {"train_loss": -18.097898483276367, "global_step": 12404, "epoch": 149} {"train_loss": -18.398557662963867, "global_step": 12405, "epoch": 149} {"train_loss": -17.764760971069336, "global_step": 12406, "epoch": 149} {"train_loss": -18.084335327148438, "global_step": 12407, "epoch": 149} {"train_loss": -18.34920310974121, "global_step": 12408, "epoch": 149} {"train_loss": -17.544586181640625, "global_step": 12409, "epoch": 149} {"train_loss": -18.032358169555664, "global_step": 12410, "epoch": 149} {"train_loss": -18.12418556213379, "global_step": 12411, "epoch": 149} {"train_loss": -17.998083114624023, "global_step": 12412, "epoch": 149} {"train_loss": -18.047163009643555, "global_step": 12413, "epoch": 149} {"train_loss": -17.829811096191406, "global_step": 12414, "epoch": 149} {"train_loss": -18.249828338623047, "global_step": 12415, "epoch": 149} {"train_loss": -18.11993980407715, "global_step": 12416, "epoch": 149} {"train_loss": -17.915239334106445, "global_step": 12417, "epoch": 149} {"train_loss": -17.914976119995117, "global_step": 12418, "epoch": 149} {"train_loss": -17.944843292236328, "global_step": 12419, "epoch": 149} {"train_loss": -17.744823455810547, "global_step": 12420, "epoch": 149} {"train_loss": -17.967187881469727, "global_step": 12421, "epoch": 149} {"train_loss": -17.63187599182129, "global_step": 12422, "epoch": 149} {"train_loss": -17.951120376586914, "global_step": 12423, "epoch": 149} {"train_loss": -17.586668014526367, "global_step": 12424, "epoch": 149} {"train_loss": -18.162933349609375, "global_step": 12425, "epoch": 149} {"train_loss": -18.17816734313965, "global_step": 12426, "epoch": 149} {"train_loss": -17.465646743774414, "global_step": 12427, "epoch": 149} {"train_loss": -17.767242431640625, "global_step": 12428, "epoch": 149} {"train_loss": -17.596942901611328, "global_step": 12429, "epoch": 149} {"train_loss": -17.81244468688965, "global_step": 12430, "epoch": 149} {"train_loss": -18.38758087158203, "global_step": 12431, "epoch": 149} {"train_loss": -17.782541275024414, "global_step": 12432, "epoch": 149} {"train_loss": -17.759328842163086, "global_step": 12433, "epoch": 149} {"train_loss": -17.772930145263672, "global_step": 12434, "epoch": 149} {"train_loss": -17.9837589263916, "global_step": 12435, "epoch": 149} {"train_loss": -17.8505802154541, "global_step": 12436, "epoch": 149} {"train_loss": -17.418643951416016, "global_step": 12437, "epoch": 149} {"train_loss": -17.59336280822754, "global_step": 12438, "epoch": 149} {"train_loss": -17.809038162231445, "global_step": 12439, "epoch": 149} {"train_loss": -18.2485408782959, "global_step": 12440, "epoch": 149} {"train_loss": -17.46009635925293, "global_step": 12441, "epoch": 149} {"train_loss": -17.8410587310791, "global_step": 12442, "epoch": 149} {"train_loss": -17.964706420898438, "global_step": 12443, "epoch": 149} {"train_loss": -17.731632232666016, "global_step": 12444, "epoch": 149} {"train_loss": -18.05145835876465, "global_step": 12445, "epoch": 149} {"train_loss": -17.97474479675293, "global_step": 12446, "epoch": 149} {"train_loss": -17.74234390258789, "global_step": 12447, "epoch": 149} {"train_loss": -18.163755416870117, "global_step": 12448, "epoch": 149} {"train_loss": -17.821588286434313, "global_step": 12449, "epoch": 149, "val_loss": 6108641.5} {"train_loss": -17.37034797668457, "global_step": 12450, "epoch": 150} {"train_loss": -17.28447151184082, "global_step": 12451, "epoch": 150} {"train_loss": -17.62247085571289, "global_step": 12452, "epoch": 150} {"train_loss": -17.530820846557617, "global_step": 12453, "epoch": 150} {"train_loss": -17.64748191833496, "global_step": 12454, "epoch": 150} {"train_loss": -17.506420135498047, "global_step": 12455, "epoch": 150} {"train_loss": -18.057737350463867, "global_step": 12456, "epoch": 150} {"train_loss": -17.55547523498535, "global_step": 12457, "epoch": 150} {"train_loss": -17.775808334350586, "global_step": 12458, "epoch": 150} {"train_loss": -17.636388778686523, "global_step": 12459, "epoch": 150} {"train_loss": -17.71979331970215, "global_step": 12460, "epoch": 150} {"train_loss": -17.82465171813965, "global_step": 12461, "epoch": 150} {"train_loss": -17.880529403686523, "global_step": 12462, "epoch": 150} {"train_loss": -17.65081214904785, "global_step": 12463, "epoch": 150} {"train_loss": -17.667184829711914, "global_step": 12464, "epoch": 150} {"train_loss": -17.66119384765625, "global_step": 12465, "epoch": 150} {"train_loss": -17.967390060424805, "global_step": 12466, "epoch": 150} {"train_loss": -18.10757827758789, "global_step": 12467, "epoch": 150} {"train_loss": -18.144737243652344, "global_step": 12468, "epoch": 150} {"train_loss": -17.79224967956543, "global_step": 12469, "epoch": 150} {"train_loss": -17.491107940673828, "global_step": 12470, "epoch": 150} {"train_loss": -17.87340545654297, "global_step": 12471, "epoch": 150} {"train_loss": -18.049949645996094, "global_step": 12472, "epoch": 150} {"train_loss": -17.3801326751709, "global_step": 12473, "epoch": 150} {"train_loss": -17.817537307739258, "global_step": 12474, "epoch": 150} {"train_loss": -18.066268920898438, "global_step": 12475, "epoch": 150} {"train_loss": -18.211977005004883, "global_step": 12476, "epoch": 150} {"train_loss": -17.98874855041504, "global_step": 12477, "epoch": 150} {"train_loss": -17.759658813476562, "global_step": 12478, "epoch": 150} {"train_loss": -17.707284927368164, "global_step": 12479, "epoch": 150} {"train_loss": -17.505939483642578, "global_step": 12480, "epoch": 150} {"train_loss": -17.761491775512695, "global_step": 12481, "epoch": 150} {"train_loss": -17.800893783569336, "global_step": 12482, "epoch": 150} {"train_loss": -18.165327072143555, "global_step": 12483, "epoch": 150} {"train_loss": -18.007612228393555, "global_step": 12484, "epoch": 150} {"train_loss": -17.568241119384766, "global_step": 12485, "epoch": 150} {"train_loss": -17.948408126831055, "global_step": 12486, "epoch": 150} {"train_loss": -18.22492790222168, "global_step": 12487, "epoch": 150} {"train_loss": -17.712757110595703, "global_step": 12488, "epoch": 150} {"train_loss": -18.2375545501709, "global_step": 12489, "epoch": 150} {"train_loss": -17.46112060546875, "global_step": 12490, "epoch": 150} {"train_loss": -17.963193893432617, "global_step": 12491, "epoch": 150} {"train_loss": -17.93500328063965, "global_step": 12492, "epoch": 150} {"train_loss": -17.854734420776367, "global_step": 12493, "epoch": 150} {"train_loss": -18.030548095703125, "global_step": 12494, "epoch": 150} {"train_loss": -18.082618713378906, "global_step": 12495, "epoch": 150} {"train_loss": -18.038679122924805, "global_step": 12496, "epoch": 150} {"train_loss": -17.494596481323242, "global_step": 12497, "epoch": 150} {"train_loss": -17.730051040649414, "global_step": 12498, "epoch": 150} {"train_loss": -17.740676879882812, "global_step": 12499, "epoch": 150} {"train_loss": -17.97652816772461, "global_step": 12500, "epoch": 150} {"train_loss": -17.490358352661133, "global_step": 12501, "epoch": 150} {"train_loss": -18.086034774780273, "global_step": 12502, "epoch": 150} {"train_loss": -18.11862564086914, "global_step": 12503, "epoch": 150} {"train_loss": -17.643898010253906, "global_step": 12504, "epoch": 150} {"train_loss": -18.03516960144043, "global_step": 12505, "epoch": 150} {"train_loss": -17.83154296875, "global_step": 12506, "epoch": 150} {"train_loss": -17.97785758972168, "global_step": 12507, "epoch": 150} {"train_loss": -18.106306076049805, "global_step": 12508, "epoch": 150} {"train_loss": -18.036758422851562, "global_step": 12509, "epoch": 150} {"train_loss": -18.076669692993164, "global_step": 12510, "epoch": 150} {"train_loss": -17.752126693725586, "global_step": 12511, "epoch": 150} {"train_loss": -17.911169052124023, "global_step": 12512, "epoch": 150} {"train_loss": -18.309829711914062, "global_step": 12513, "epoch": 150} {"train_loss": -18.04524803161621, "global_step": 12514, "epoch": 150} {"train_loss": -17.903600692749023, "global_step": 12515, "epoch": 150} {"train_loss": -17.929325103759766, "global_step": 12516, "epoch": 150} {"train_loss": -17.800451278686523, "global_step": 12517, "epoch": 150} {"train_loss": -17.588531494140625, "global_step": 12518, "epoch": 150} {"train_loss": -18.05742645263672, "global_step": 12519, "epoch": 150} {"train_loss": -18.114194869995117, "global_step": 12520, "epoch": 150} {"train_loss": -17.715482711791992, "global_step": 12521, "epoch": 150} {"train_loss": -18.182235717773438, "global_step": 12522, "epoch": 150} {"train_loss": -17.95891761779785, "global_step": 12523, "epoch": 150} {"train_loss": -17.56135368347168, "global_step": 12524, "epoch": 150} {"train_loss": -17.85615348815918, "global_step": 12525, "epoch": 150} {"train_loss": -18.27822494506836, "global_step": 12526, "epoch": 150} {"train_loss": -17.832656860351562, "global_step": 12527, "epoch": 150} {"train_loss": -17.601858139038086, "global_step": 12528, "epoch": 150} {"train_loss": -18.111190795898438, "global_step": 12529, "epoch": 150} {"train_loss": -17.857545852661133, "global_step": 12530, "epoch": 150} {"train_loss": -18.096054077148438, "global_step": 12531, "epoch": 150} {"train_loss": -17.855080064520777, "global_step": 12532, "epoch": 150, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 0.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 0.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.16666666666666666, "test/mean_score": 0.5454545454545454, "val_loss": 6082007.5} {"train_loss": -16.848730087280273, "global_step": 12533, "epoch": 151} {"train_loss": -17.53660774230957, "global_step": 12534, "epoch": 151} {"train_loss": -17.509275436401367, "global_step": 12535, "epoch": 151} {"train_loss": -17.822111129760742, "global_step": 12536, "epoch": 151} {"train_loss": -17.865741729736328, "global_step": 12537, "epoch": 151} {"train_loss": -17.36960792541504, "global_step": 12538, "epoch": 151} {"train_loss": -17.7333927154541, "global_step": 12539, "epoch": 151} {"train_loss": -17.78896141052246, "global_step": 12540, "epoch": 151} {"train_loss": -17.72177505493164, "global_step": 12541, "epoch": 151} {"train_loss": -18.00184440612793, "global_step": 12542, "epoch": 151} {"train_loss": -17.78584861755371, "global_step": 12543, "epoch": 151} {"train_loss": -17.79207420349121, "global_step": 12544, "epoch": 151} {"train_loss": -17.799020767211914, "global_step": 12545, "epoch": 151} {"train_loss": -18.115392684936523, "global_step": 12546, "epoch": 151} {"train_loss": -17.776987075805664, "global_step": 12547, "epoch": 151} {"train_loss": -17.777416229248047, "global_step": 12548, "epoch": 151} {"train_loss": -17.8969669342041, "global_step": 12549, "epoch": 151} {"train_loss": -17.371856689453125, "global_step": 12550, "epoch": 151} {"train_loss": -17.90812110900879, "global_step": 12551, "epoch": 151} {"train_loss": -17.851255416870117, "global_step": 12552, "epoch": 151} {"train_loss": -18.204275131225586, "global_step": 12553, "epoch": 151} {"train_loss": -17.74544334411621, "global_step": 12554, "epoch": 151} {"train_loss": -17.839996337890625, "global_step": 12555, "epoch": 151} {"train_loss": -17.72311019897461, "global_step": 12556, "epoch": 151} {"train_loss": -17.882368087768555, "global_step": 12557, "epoch": 151} {"train_loss": -17.859073638916016, "global_step": 12558, "epoch": 151} {"train_loss": -17.908161163330078, "global_step": 12559, "epoch": 151} {"train_loss": -18.030494689941406, "global_step": 12560, "epoch": 151} {"train_loss": -18.331146240234375, "global_step": 12561, "epoch": 151} {"train_loss": -18.138477325439453, "global_step": 12562, "epoch": 151} {"train_loss": -17.604780197143555, "global_step": 12563, "epoch": 151} {"train_loss": -18.173498153686523, "global_step": 12564, "epoch": 151} {"train_loss": -17.928266525268555, "global_step": 12565, "epoch": 151} {"train_loss": -18.116104125976562, "global_step": 12566, "epoch": 151} {"train_loss": -17.626890182495117, "global_step": 12567, "epoch": 151} {"train_loss": -18.281906127929688, "global_step": 12568, "epoch": 151} {"train_loss": -18.13258171081543, "global_step": 12569, "epoch": 151} {"train_loss": -17.84486961364746, "global_step": 12570, "epoch": 151} {"train_loss": -17.865421295166016, "global_step": 12571, "epoch": 151} {"train_loss": -17.664859771728516, "global_step": 12572, "epoch": 151} {"train_loss": -17.530506134033203, "global_step": 12573, "epoch": 151} {"train_loss": -18.08743667602539, "global_step": 12574, "epoch": 151} {"train_loss": -17.61911392211914, "global_step": 12575, "epoch": 151} {"train_loss": -17.69075584411621, "global_step": 12576, "epoch": 151} {"train_loss": -18.423330307006836, "global_step": 12577, "epoch": 151} {"train_loss": -17.73233413696289, "global_step": 12578, "epoch": 151} {"train_loss": -17.7177677154541, "global_step": 12579, "epoch": 151} {"train_loss": -17.68951988220215, "global_step": 12580, "epoch": 151} {"train_loss": -17.632917404174805, "global_step": 12581, "epoch": 151} {"train_loss": -17.86895179748535, "global_step": 12582, "epoch": 151} {"train_loss": -17.7840576171875, "global_step": 12583, "epoch": 151} {"train_loss": -17.591867446899414, "global_step": 12584, "epoch": 151} {"train_loss": -18.154199600219727, "global_step": 12585, "epoch": 151} {"train_loss": -18.166006088256836, "global_step": 12586, "epoch": 151} {"train_loss": -17.53497886657715, "global_step": 12587, "epoch": 151} {"train_loss": -18.134815216064453, "global_step": 12588, "epoch": 151} {"train_loss": -17.896846771240234, "global_step": 12589, "epoch": 151} {"train_loss": -18.32986831665039, "global_step": 12590, "epoch": 151} {"train_loss": -17.6767635345459, "global_step": 12591, "epoch": 151} {"train_loss": -18.039615631103516, "global_step": 12592, "epoch": 151} {"train_loss": -18.063518524169922, "global_step": 12593, "epoch": 151} {"train_loss": -17.450775146484375, "global_step": 12594, "epoch": 151} {"train_loss": -17.649158477783203, "global_step": 12595, "epoch": 151} {"train_loss": -17.468259811401367, "global_step": 12596, "epoch": 151} {"train_loss": -18.02341079711914, "global_step": 12597, "epoch": 151} {"train_loss": -17.717885971069336, "global_step": 12598, "epoch": 151} {"train_loss": -17.61893081665039, "global_step": 12599, "epoch": 151} {"train_loss": -18.203733444213867, "global_step": 12600, "epoch": 151} {"train_loss": -18.334260940551758, "global_step": 12601, "epoch": 151} {"train_loss": -17.898269653320312, "global_step": 12602, "epoch": 151} {"train_loss": -17.754018783569336, "global_step": 12603, "epoch": 151} {"train_loss": -17.872339248657227, "global_step": 12604, "epoch": 151} {"train_loss": -17.803878784179688, "global_step": 12605, "epoch": 151} {"train_loss": -18.05018424987793, "global_step": 12606, "epoch": 151} {"train_loss": -17.981931686401367, "global_step": 12607, "epoch": 151} {"train_loss": -17.441247940063477, "global_step": 12608, "epoch": 151} {"train_loss": -17.697147369384766, "global_step": 12609, "epoch": 151} {"train_loss": -17.81638526916504, "global_step": 12610, "epoch": 151} {"train_loss": -18.034719467163086, "global_step": 12611, "epoch": 151} {"train_loss": -17.345579147338867, "global_step": 12612, "epoch": 151} {"train_loss": -17.757461547851562, "global_step": 12613, "epoch": 151} {"train_loss": -17.391098022460938, "global_step": 12614, "epoch": 151} {"train_loss": -17.80727609381618, "global_step": 12615, "epoch": 151, "val_loss": 6028753.0} {"train_loss": -17.735187530517578, "global_step": 12616, "epoch": 152} {"train_loss": -17.785459518432617, "global_step": 12617, "epoch": 152} {"train_loss": -18.062530517578125, "global_step": 12618, "epoch": 152} {"train_loss": -17.937347412109375, "global_step": 12619, "epoch": 152} {"train_loss": -17.949237823486328, "global_step": 12620, "epoch": 152} {"train_loss": -17.86086082458496, "global_step": 12621, "epoch": 152} {"train_loss": -18.111379623413086, "global_step": 12622, "epoch": 152} {"train_loss": -18.0011043548584, "global_step": 12623, "epoch": 152} {"train_loss": -17.65227508544922, "global_step": 12624, "epoch": 152} {"train_loss": -18.11290740966797, "global_step": 12625, "epoch": 152} {"train_loss": -17.8593807220459, "global_step": 12626, "epoch": 152} {"train_loss": -17.895465850830078, "global_step": 12627, "epoch": 152} {"train_loss": -17.721853256225586, "global_step": 12628, "epoch": 152} {"train_loss": -17.826217651367188, "global_step": 12629, "epoch": 152} {"train_loss": -17.5418643951416, "global_step": 12630, "epoch": 152} {"train_loss": -18.05074119567871, "global_step": 12631, "epoch": 152} {"train_loss": -17.866729736328125, "global_step": 12632, "epoch": 152} {"train_loss": -17.751373291015625, "global_step": 12633, "epoch": 152} {"train_loss": -17.8084659576416, "global_step": 12634, "epoch": 152} {"train_loss": -18.016271591186523, "global_step": 12635, "epoch": 152} {"train_loss": -17.95161247253418, "global_step": 12636, "epoch": 152} {"train_loss": -18.092313766479492, "global_step": 12637, "epoch": 152} {"train_loss": -17.860496520996094, "global_step": 12638, "epoch": 152} {"train_loss": -17.745290756225586, "global_step": 12639, "epoch": 152} {"train_loss": -18.135726928710938, "global_step": 12640, "epoch": 152} {"train_loss": -18.26177406311035, "global_step": 12641, "epoch": 152} {"train_loss": -17.554182052612305, "global_step": 12642, "epoch": 152} {"train_loss": -17.846160888671875, "global_step": 12643, "epoch": 152} {"train_loss": -18.02197265625, "global_step": 12644, "epoch": 152} {"train_loss": -18.07816505432129, "global_step": 12645, "epoch": 152} {"train_loss": -17.605085372924805, "global_step": 12646, "epoch": 152} {"train_loss": -17.674314498901367, "global_step": 12647, "epoch": 152} {"train_loss": -18.139413833618164, "global_step": 12648, "epoch": 152} {"train_loss": -17.631122589111328, "global_step": 12649, "epoch": 152} {"train_loss": -17.83056640625, "global_step": 12650, "epoch": 152} {"train_loss": -17.669675827026367, "global_step": 12651, "epoch": 152} {"train_loss": -18.54194450378418, "global_step": 12652, "epoch": 152} {"train_loss": -17.777393341064453, "global_step": 12653, "epoch": 152} {"train_loss": -17.80048942565918, "global_step": 12654, "epoch": 152} {"train_loss": -17.953413009643555, "global_step": 12655, "epoch": 152} {"train_loss": -17.971715927124023, "global_step": 12656, "epoch": 152} {"train_loss": -17.45883560180664, "global_step": 12657, "epoch": 152} {"train_loss": -17.505313873291016, "global_step": 12658, "epoch": 152} {"train_loss": -17.852802276611328, "global_step": 12659, "epoch": 152} {"train_loss": -17.355257034301758, "global_step": 12660, "epoch": 152} {"train_loss": -18.173831939697266, "global_step": 12661, "epoch": 152} {"train_loss": -18.13932228088379, "global_step": 12662, "epoch": 152} {"train_loss": -18.032989501953125, "global_step": 12663, "epoch": 152} {"train_loss": -17.768661499023438, "global_step": 12664, "epoch": 152} {"train_loss": -17.95475959777832, "global_step": 12665, "epoch": 152} {"train_loss": -17.693098068237305, "global_step": 12666, "epoch": 152} {"train_loss": -18.025121688842773, "global_step": 12667, "epoch": 152} {"train_loss": -18.039243698120117, "global_step": 12668, "epoch": 152} {"train_loss": -17.683460235595703, "global_step": 12669, "epoch": 152} {"train_loss": -18.0794734954834, "global_step": 12670, "epoch": 152} {"train_loss": -17.792800903320312, "global_step": 12671, "epoch": 152} {"train_loss": -17.898042678833008, "global_step": 12672, "epoch": 152} {"train_loss": -18.322568893432617, "global_step": 12673, "epoch": 152} {"train_loss": -17.70427894592285, "global_step": 12674, "epoch": 152} {"train_loss": -17.85780906677246, "global_step": 12675, "epoch": 152} {"train_loss": -18.0344295501709, "global_step": 12676, "epoch": 152} {"train_loss": -17.967361450195312, "global_step": 12677, "epoch": 152} {"train_loss": -18.030475616455078, "global_step": 12678, "epoch": 152} {"train_loss": -17.898731231689453, "global_step": 12679, "epoch": 152} {"train_loss": -17.600143432617188, "global_step": 12680, "epoch": 152} {"train_loss": -17.772354125976562, "global_step": 12681, "epoch": 152} {"train_loss": -17.573606491088867, "global_step": 12682, "epoch": 152} {"train_loss": -17.841806411743164, "global_step": 12683, "epoch": 152} {"train_loss": -18.016233444213867, "global_step": 12684, "epoch": 152} {"train_loss": -17.650602340698242, "global_step": 12685, "epoch": 152} {"train_loss": -18.285764694213867, "global_step": 12686, "epoch": 152} {"train_loss": -18.093673706054688, "global_step": 12687, "epoch": 152} {"train_loss": -18.17445182800293, "global_step": 12688, "epoch": 152} {"train_loss": -17.614360809326172, "global_step": 12689, "epoch": 152} {"train_loss": -17.893342971801758, "global_step": 12690, "epoch": 152} {"train_loss": -18.050378799438477, "global_step": 12691, "epoch": 152} {"train_loss": -17.571136474609375, "global_step": 12692, "epoch": 152} {"train_loss": -17.844207763671875, "global_step": 12693, "epoch": 152} {"train_loss": -17.884031295776367, "global_step": 12694, "epoch": 152} {"train_loss": -17.61607551574707, "global_step": 12695, "epoch": 152} {"train_loss": -17.888507843017578, "global_step": 12696, "epoch": 152} {"train_loss": -17.76860237121582, "global_step": 12697, "epoch": 152} {"train_loss": -17.88261776659862, "global_step": 12698, "epoch": 152, "val_loss": 6030630.5} {"train_loss": -17.425092697143555, "global_step": 12699, "epoch": 153} {"train_loss": -17.795591354370117, "global_step": 12700, "epoch": 153} {"train_loss": -17.604995727539062, "global_step": 12701, "epoch": 153} {"train_loss": -17.16914939880371, "global_step": 12702, "epoch": 153} {"train_loss": -17.492597579956055, "global_step": 12703, "epoch": 153} {"train_loss": -17.75394058227539, "global_step": 12704, "epoch": 153} {"train_loss": -17.373991012573242, "global_step": 12705, "epoch": 153} {"train_loss": -17.98252296447754, "global_step": 12706, "epoch": 153} {"train_loss": -17.873279571533203, "global_step": 12707, "epoch": 153} {"train_loss": -18.04544448852539, "global_step": 12708, "epoch": 153} {"train_loss": -17.875579833984375, "global_step": 12709, "epoch": 153} {"train_loss": -18.220796585083008, "global_step": 12710, "epoch": 153} {"train_loss": -17.5280818939209, "global_step": 12711, "epoch": 153} {"train_loss": -17.974666595458984, "global_step": 12712, "epoch": 153} {"train_loss": -17.894025802612305, "global_step": 12713, "epoch": 153} {"train_loss": -17.837568283081055, "global_step": 12714, "epoch": 153} {"train_loss": -18.26829719543457, "global_step": 12715, "epoch": 153} {"train_loss": -17.669116973876953, "global_step": 12716, "epoch": 153} {"train_loss": -17.92545509338379, "global_step": 12717, "epoch": 153} {"train_loss": -17.670738220214844, "global_step": 12718, "epoch": 153} {"train_loss": -18.25473403930664, "global_step": 12719, "epoch": 153} {"train_loss": -18.061609268188477, "global_step": 12720, "epoch": 153} {"train_loss": -17.63667869567871, "global_step": 12721, "epoch": 153} {"train_loss": -18.134693145751953, "global_step": 12722, "epoch": 153} {"train_loss": -18.200613021850586, "global_step": 12723, "epoch": 153} {"train_loss": -17.7413330078125, "global_step": 12724, "epoch": 153} {"train_loss": -17.999727249145508, "global_step": 12725, "epoch": 153} {"train_loss": -17.786405563354492, "global_step": 12726, "epoch": 153} {"train_loss": -17.51375389099121, "global_step": 12727, "epoch": 153} {"train_loss": -18.11278533935547, "global_step": 12728, "epoch": 153} {"train_loss": -18.09626007080078, "global_step": 12729, "epoch": 153} {"train_loss": -17.90749168395996, "global_step": 12730, "epoch": 153} {"train_loss": -17.947994232177734, "global_step": 12731, "epoch": 153} {"train_loss": -17.44294548034668, "global_step": 12732, "epoch": 153} {"train_loss": -17.795373916625977, "global_step": 12733, "epoch": 153} {"train_loss": -17.912275314331055, "global_step": 12734, "epoch": 153} {"train_loss": -17.771581649780273, "global_step": 12735, "epoch": 153} {"train_loss": -17.710241317749023, "global_step": 12736, "epoch": 153} {"train_loss": -18.07770347595215, "global_step": 12737, "epoch": 153} {"train_loss": -17.671695709228516, "global_step": 12738, "epoch": 153} {"train_loss": -18.036972045898438, "global_step": 12739, "epoch": 153} {"train_loss": -18.168607711791992, "global_step": 12740, "epoch": 153} {"train_loss": -17.6456356048584, "global_step": 12741, "epoch": 153} {"train_loss": -17.73809051513672, "global_step": 12742, "epoch": 153} {"train_loss": -17.979185104370117, "global_step": 12743, "epoch": 153} {"train_loss": -17.30268669128418, "global_step": 12744, "epoch": 153} {"train_loss": -17.604448318481445, "global_step": 12745, "epoch": 153} {"train_loss": -17.970083236694336, "global_step": 12746, "epoch": 153} {"train_loss": -17.826339721679688, "global_step": 12747, "epoch": 153} {"train_loss": -17.881378173828125, "global_step": 12748, "epoch": 153} {"train_loss": -17.601367950439453, "global_step": 12749, "epoch": 153} {"train_loss": -18.156536102294922, "global_step": 12750, "epoch": 153} {"train_loss": -17.816694259643555, "global_step": 12751, "epoch": 153} {"train_loss": -17.89713478088379, "global_step": 12752, "epoch": 153} {"train_loss": -17.774444580078125, "global_step": 12753, "epoch": 153} {"train_loss": -17.956281661987305, "global_step": 12754, "epoch": 153} {"train_loss": -17.867185592651367, "global_step": 12755, "epoch": 153} {"train_loss": -18.00445556640625, "global_step": 12756, "epoch": 153} {"train_loss": -17.88388442993164, "global_step": 12757, "epoch": 153} {"train_loss": -18.0649471282959, "global_step": 12758, "epoch": 153} {"train_loss": -18.069705963134766, "global_step": 12759, "epoch": 153} {"train_loss": -18.22938346862793, "global_step": 12760, "epoch": 153} {"train_loss": -18.286558151245117, "global_step": 12761, "epoch": 153} {"train_loss": -17.9093074798584, "global_step": 12762, "epoch": 153} {"train_loss": -18.18265724182129, "global_step": 12763, "epoch": 153} {"train_loss": -17.768972396850586, "global_step": 12764, "epoch": 153} {"train_loss": -18.102399826049805, "global_step": 12765, "epoch": 153} {"train_loss": -17.53889274597168, "global_step": 12766, "epoch": 153} {"train_loss": -17.73697280883789, "global_step": 12767, "epoch": 153} {"train_loss": -17.711233139038086, "global_step": 12768, "epoch": 153} {"train_loss": -18.279321670532227, "global_step": 12769, "epoch": 153} {"train_loss": -17.599924087524414, "global_step": 12770, "epoch": 153} {"train_loss": -18.00673484802246, "global_step": 12771, "epoch": 153} {"train_loss": -17.71189308166504, "global_step": 12772, "epoch": 153} {"train_loss": -18.26283836364746, "global_step": 12773, "epoch": 153} {"train_loss": -18.06941795349121, "global_step": 12774, "epoch": 153} {"train_loss": -18.317630767822266, "global_step": 12775, "epoch": 153} {"train_loss": -17.79823112487793, "global_step": 12776, "epoch": 153} {"train_loss": -17.86761474609375, "global_step": 12777, "epoch": 153} {"train_loss": -17.897777557373047, "global_step": 12778, "epoch": 153} {"train_loss": -18.07399559020996, "global_step": 12779, "epoch": 153} {"train_loss": -17.601804733276367, "global_step": 12780, "epoch": 153} {"train_loss": -17.8719545617161, "global_step": 12781, "epoch": 153, "val_loss": 6103758.0} {"train_loss": -17.698270797729492, "global_step": 12782, "epoch": 154} {"train_loss": -17.717147827148438, "global_step": 12783, "epoch": 154} {"train_loss": -17.94236183166504, "global_step": 12784, "epoch": 154} {"train_loss": -17.826719284057617, "global_step": 12785, "epoch": 154} {"train_loss": -18.175064086914062, "global_step": 12786, "epoch": 154} {"train_loss": -17.39434814453125, "global_step": 12787, "epoch": 154} {"train_loss": -17.80476951599121, "global_step": 12788, "epoch": 154} {"train_loss": -18.017881393432617, "global_step": 12789, "epoch": 154} {"train_loss": -17.808237075805664, "global_step": 12790, "epoch": 154} {"train_loss": -17.707870483398438, "global_step": 12791, "epoch": 154} {"train_loss": -18.000707626342773, "global_step": 12792, "epoch": 154} {"train_loss": -17.768651962280273, "global_step": 12793, "epoch": 154} {"train_loss": -17.629240036010742, "global_step": 12794, "epoch": 154} {"train_loss": -17.83875274658203, "global_step": 12795, "epoch": 154} {"train_loss": -17.8428955078125, "global_step": 12796, "epoch": 154} {"train_loss": -18.020891189575195, "global_step": 12797, "epoch": 154} {"train_loss": -18.1179141998291, "global_step": 12798, "epoch": 154} {"train_loss": -17.91639518737793, "global_step": 12799, "epoch": 154} {"train_loss": -17.828983306884766, "global_step": 12800, "epoch": 154} {"train_loss": -18.332422256469727, "global_step": 12801, "epoch": 154} {"train_loss": -17.681907653808594, "global_step": 12802, "epoch": 154} {"train_loss": -17.827600479125977, "global_step": 12803, "epoch": 154} {"train_loss": -17.90363883972168, "global_step": 12804, "epoch": 154} {"train_loss": -18.04389190673828, "global_step": 12805, "epoch": 154} {"train_loss": -17.781024932861328, "global_step": 12806, "epoch": 154} {"train_loss": -17.56104850769043, "global_step": 12807, "epoch": 154} {"train_loss": -18.0272159576416, "global_step": 12808, "epoch": 154} {"train_loss": -18.137617111206055, "global_step": 12809, "epoch": 154} {"train_loss": -17.787757873535156, "global_step": 12810, "epoch": 154} {"train_loss": -17.875242233276367, "global_step": 12811, "epoch": 154} {"train_loss": -17.91566276550293, "global_step": 12812, "epoch": 154} {"train_loss": -18.080718994140625, "global_step": 12813, "epoch": 154} {"train_loss": -17.671472549438477, "global_step": 12814, "epoch": 154} {"train_loss": -17.935035705566406, "global_step": 12815, "epoch": 154} {"train_loss": -18.15273094177246, "global_step": 12816, "epoch": 154} {"train_loss": -18.08322525024414, "global_step": 12817, "epoch": 154} {"train_loss": -17.796207427978516, "global_step": 12818, "epoch": 154} {"train_loss": -18.039688110351562, "global_step": 12819, "epoch": 154} {"train_loss": -17.869352340698242, "global_step": 12820, "epoch": 154} {"train_loss": -17.91840934753418, "global_step": 12821, "epoch": 154} {"train_loss": -18.034456253051758, "global_step": 12822, "epoch": 154} {"train_loss": -18.067829132080078, "global_step": 12823, "epoch": 154} {"train_loss": -18.219322204589844, "global_step": 12824, "epoch": 154} {"train_loss": -17.770273208618164, "global_step": 12825, "epoch": 154} {"train_loss": -18.0482177734375, "global_step": 12826, "epoch": 154} {"train_loss": -18.04707145690918, "global_step": 12827, "epoch": 154} {"train_loss": -18.36586570739746, "global_step": 12828, "epoch": 154} {"train_loss": -18.028522491455078, "global_step": 12829, "epoch": 154} {"train_loss": -17.696624755859375, "global_step": 12830, "epoch": 154} {"train_loss": -17.745304107666016, "global_step": 12831, "epoch": 154} {"train_loss": -17.628835678100586, "global_step": 12832, "epoch": 154} {"train_loss": -17.808969497680664, "global_step": 12833, "epoch": 154} {"train_loss": -17.984678268432617, "global_step": 12834, "epoch": 154} {"train_loss": -17.89133644104004, "global_step": 12835, "epoch": 154} {"train_loss": -17.74530792236328, "global_step": 12836, "epoch": 154} {"train_loss": -17.972700119018555, "global_step": 12837, "epoch": 154} {"train_loss": -17.94878578186035, "global_step": 12838, "epoch": 154} {"train_loss": -17.96132469177246, "global_step": 12839, "epoch": 154} {"train_loss": -17.908203125, "global_step": 12840, "epoch": 154} {"train_loss": -17.987695693969727, "global_step": 12841, "epoch": 154} {"train_loss": -17.929197311401367, "global_step": 12842, "epoch": 154} {"train_loss": -17.49698257446289, "global_step": 12843, "epoch": 154} {"train_loss": -17.724964141845703, "global_step": 12844, "epoch": 154} {"train_loss": -17.624771118164062, "global_step": 12845, "epoch": 154} {"train_loss": -17.95212173461914, "global_step": 12846, "epoch": 154} {"train_loss": -17.969165802001953, "global_step": 12847, "epoch": 154} {"train_loss": -17.90988540649414, "global_step": 12848, "epoch": 154} {"train_loss": -17.850255966186523, "global_step": 12849, "epoch": 154} {"train_loss": -18.060985565185547, "global_step": 12850, "epoch": 154} {"train_loss": -17.99112892150879, "global_step": 12851, "epoch": 154} {"train_loss": -17.9620304107666, "global_step": 12852, "epoch": 154} {"train_loss": -18.2052001953125, "global_step": 12853, "epoch": 154} {"train_loss": -18.20589828491211, "global_step": 12854, "epoch": 154} {"train_loss": -17.706470489501953, "global_step": 12855, "epoch": 154} {"train_loss": -17.9276180267334, "global_step": 12856, "epoch": 154} {"train_loss": -18.38494873046875, "global_step": 12857, "epoch": 154} {"train_loss": -18.093021392822266, "global_step": 12858, "epoch": 154} {"train_loss": -17.92633056640625, "global_step": 12859, "epoch": 154} {"train_loss": -17.943321228027344, "global_step": 12860, "epoch": 154} {"train_loss": -17.932992935180664, "global_step": 12861, "epoch": 154} {"train_loss": -17.92044448852539, "global_step": 12862, "epoch": 154} {"train_loss": -18.2879581451416, "global_step": 12863, "epoch": 154} {"train_loss": -17.919904364160743, "global_step": 12864, "epoch": 154, "val_loss": 6159117.5} {"train_loss": -17.676393508911133, "global_step": 12865, "epoch": 155} {"train_loss": -17.932647705078125, "global_step": 12866, "epoch": 155} {"train_loss": -17.3869571685791, "global_step": 12867, "epoch": 155} {"train_loss": -17.740468978881836, "global_step": 12868, "epoch": 155} {"train_loss": -17.997474670410156, "global_step": 12869, "epoch": 155} {"train_loss": -17.745901107788086, "global_step": 12870, "epoch": 155} {"train_loss": -17.18172264099121, "global_step": 12871, "epoch": 155} {"train_loss": -17.42098045349121, "global_step": 12872, "epoch": 155} {"train_loss": -17.82539176940918, "global_step": 12873, "epoch": 155} {"train_loss": -18.03192710876465, "global_step": 12874, "epoch": 155} {"train_loss": -18.06708526611328, "global_step": 12875, "epoch": 155} {"train_loss": -17.768068313598633, "global_step": 12876, "epoch": 155} {"train_loss": -18.127830505371094, "global_step": 12877, "epoch": 155} {"train_loss": -18.061613082885742, "global_step": 12878, "epoch": 155} {"train_loss": -17.941593170166016, "global_step": 12879, "epoch": 155} {"train_loss": -18.060455322265625, "global_step": 12880, "epoch": 155} {"train_loss": -17.824201583862305, "global_step": 12881, "epoch": 155} {"train_loss": -17.53126335144043, "global_step": 12882, "epoch": 155} {"train_loss": -17.60211753845215, "global_step": 12883, "epoch": 155} {"train_loss": -18.177213668823242, "global_step": 12884, "epoch": 155} {"train_loss": -17.792877197265625, "global_step": 12885, "epoch": 155} {"train_loss": -17.800762176513672, "global_step": 12886, "epoch": 155} {"train_loss": -17.803125381469727, "global_step": 12887, "epoch": 155} {"train_loss": -18.210866928100586, "global_step": 12888, "epoch": 155} {"train_loss": -17.678884506225586, "global_step": 12889, "epoch": 155} {"train_loss": -17.778289794921875, "global_step": 12890, "epoch": 155} {"train_loss": -18.044830322265625, "global_step": 12891, "epoch": 155} {"train_loss": -17.950498580932617, "global_step": 12892, "epoch": 155} {"train_loss": -18.178129196166992, "global_step": 12893, "epoch": 155} {"train_loss": -18.189273834228516, "global_step": 12894, "epoch": 155} {"train_loss": -17.916671752929688, "global_step": 12895, "epoch": 155} {"train_loss": -17.854352951049805, "global_step": 12896, "epoch": 155} {"train_loss": -17.60253143310547, "global_step": 12897, "epoch": 155} {"train_loss": -18.290576934814453, "global_step": 12898, "epoch": 155} {"train_loss": -18.17084312438965, "global_step": 12899, "epoch": 155} {"train_loss": -18.12337303161621, "global_step": 12900, "epoch": 155} {"train_loss": -17.78105926513672, "global_step": 12901, "epoch": 155} {"train_loss": -17.683719635009766, "global_step": 12902, "epoch": 155} {"train_loss": -18.208337783813477, "global_step": 12903, "epoch": 155} {"train_loss": -18.007400512695312, "global_step": 12904, "epoch": 155} {"train_loss": -17.989517211914062, "global_step": 12905, "epoch": 155} {"train_loss": -17.526166915893555, "global_step": 12906, "epoch": 155} {"train_loss": -18.1414737701416, "global_step": 12907, "epoch": 155} {"train_loss": -17.70749855041504, "global_step": 12908, "epoch": 155} {"train_loss": -18.003572463989258, "global_step": 12909, "epoch": 155} {"train_loss": -18.032556533813477, "global_step": 12910, "epoch": 155} {"train_loss": -17.85138511657715, "global_step": 12911, "epoch": 155} {"train_loss": -18.157655715942383, "global_step": 12912, "epoch": 155} {"train_loss": -17.897289276123047, "global_step": 12913, "epoch": 155} {"train_loss": -17.780454635620117, "global_step": 12914, "epoch": 155} {"train_loss": -18.286706924438477, "global_step": 12915, "epoch": 155} {"train_loss": -18.129409790039062, "global_step": 12916, "epoch": 155} {"train_loss": -18.10577392578125, "global_step": 12917, "epoch": 155} {"train_loss": -17.53151512145996, "global_step": 12918, "epoch": 155} {"train_loss": -17.86345672607422, "global_step": 12919, "epoch": 155} {"train_loss": -17.776159286499023, "global_step": 12920, "epoch": 155} {"train_loss": -17.602331161499023, "global_step": 12921, "epoch": 155} {"train_loss": -17.69217872619629, "global_step": 12922, "epoch": 155} {"train_loss": -17.708473205566406, "global_step": 12923, "epoch": 155} {"train_loss": -18.186063766479492, "global_step": 12924, "epoch": 155} {"train_loss": -18.140262603759766, "global_step": 12925, "epoch": 155} {"train_loss": -17.44740104675293, "global_step": 12926, "epoch": 155} {"train_loss": -17.57843589782715, "global_step": 12927, "epoch": 155} {"train_loss": -18.45672035217285, "global_step": 12928, "epoch": 155} {"train_loss": -17.514636993408203, "global_step": 12929, "epoch": 155} {"train_loss": -18.265892028808594, "global_step": 12930, "epoch": 155} {"train_loss": -17.594758987426758, "global_step": 12931, "epoch": 155} {"train_loss": -18.02715492248535, "global_step": 12932, "epoch": 155} {"train_loss": -17.714468002319336, "global_step": 12933, "epoch": 155} {"train_loss": -17.988271713256836, "global_step": 12934, "epoch": 155} {"train_loss": -18.063093185424805, "global_step": 12935, "epoch": 155} {"train_loss": -17.754133224487305, "global_step": 12936, "epoch": 155} {"train_loss": -17.69427490234375, "global_step": 12937, "epoch": 155} {"train_loss": -17.663854598999023, "global_step": 12938, "epoch": 155} {"train_loss": -18.12201499938965, "global_step": 12939, "epoch": 155} {"train_loss": -17.848844528198242, "global_step": 12940, "epoch": 155} {"train_loss": -17.867931365966797, "global_step": 12941, "epoch": 155} {"train_loss": -17.594785690307617, "global_step": 12942, "epoch": 155} {"train_loss": -17.99057960510254, "global_step": 12943, "epoch": 155} {"train_loss": -17.577085494995117, "global_step": 12944, "epoch": 155} {"train_loss": -18.4666690826416, "global_step": 12945, "epoch": 155} {"train_loss": -17.91800880432129, "global_step": 12946, "epoch": 155} {"train_loss": -17.905943652233447, "global_step": 12947, "epoch": 155, "val_loss": 6122929.5} {"train_loss": -17.837865829467773, "global_step": 12948, "epoch": 156} {"train_loss": -17.79366111755371, "global_step": 12949, "epoch": 156} {"train_loss": -17.7806339263916, "global_step": 12950, "epoch": 156} {"train_loss": -17.632902145385742, "global_step": 12951, "epoch": 156} {"train_loss": -18.199356079101562, "global_step": 12952, "epoch": 156} {"train_loss": -17.200363159179688, "global_step": 12953, "epoch": 156} {"train_loss": -18.20507049560547, "global_step": 12954, "epoch": 156} {"train_loss": -17.759740829467773, "global_step": 12955, "epoch": 156} {"train_loss": -17.92399024963379, "global_step": 12956, "epoch": 156} {"train_loss": -17.9346981048584, "global_step": 12957, "epoch": 156} {"train_loss": -18.217628479003906, "global_step": 12958, "epoch": 156} {"train_loss": -17.845916748046875, "global_step": 12959, "epoch": 156} {"train_loss": -18.347944259643555, "global_step": 12960, "epoch": 156} {"train_loss": -17.599225997924805, "global_step": 12961, "epoch": 156} {"train_loss": -17.946435928344727, "global_step": 12962, "epoch": 156} {"train_loss": -17.840572357177734, "global_step": 12963, "epoch": 156} {"train_loss": -17.906482696533203, "global_step": 12964, "epoch": 156} {"train_loss": -17.849103927612305, "global_step": 12965, "epoch": 156} {"train_loss": -17.924955368041992, "global_step": 12966, "epoch": 156} {"train_loss": -17.573278427124023, "global_step": 12967, "epoch": 156} {"train_loss": -17.75830841064453, "global_step": 12968, "epoch": 156} {"train_loss": -17.61508560180664, "global_step": 12969, "epoch": 156} {"train_loss": -17.855899810791016, "global_step": 12970, "epoch": 156} {"train_loss": -17.819128036499023, "global_step": 12971, "epoch": 156} {"train_loss": -18.106603622436523, "global_step": 12972, "epoch": 156} {"train_loss": -17.57154655456543, "global_step": 12973, "epoch": 156} {"train_loss": -17.698911666870117, "global_step": 12974, "epoch": 156} {"train_loss": -17.451894760131836, "global_step": 12975, "epoch": 156} {"train_loss": -18.263126373291016, "global_step": 12976, "epoch": 156} {"train_loss": -17.68546485900879, "global_step": 12977, "epoch": 156} {"train_loss": -18.142972946166992, "global_step": 12978, "epoch": 156} {"train_loss": -17.625747680664062, "global_step": 12979, "epoch": 156} {"train_loss": -18.53359603881836, "global_step": 12980, "epoch": 156} {"train_loss": -17.91132926940918, "global_step": 12981, "epoch": 156} {"train_loss": -18.24457359313965, "global_step": 12982, "epoch": 156} {"train_loss": -18.059690475463867, "global_step": 12983, "epoch": 156} {"train_loss": -17.65648078918457, "global_step": 12984, "epoch": 156} {"train_loss": -17.898054122924805, "global_step": 12985, "epoch": 156} {"train_loss": -17.97562026977539, "global_step": 12986, "epoch": 156} {"train_loss": -17.789098739624023, "global_step": 12987, "epoch": 156} {"train_loss": -18.00295066833496, "global_step": 12988, "epoch": 156} {"train_loss": -17.763425827026367, "global_step": 12989, "epoch": 156} {"train_loss": -17.619836807250977, "global_step": 12990, "epoch": 156} {"train_loss": -17.93839454650879, "global_step": 12991, "epoch": 156} {"train_loss": -17.64735221862793, "global_step": 12992, "epoch": 156} {"train_loss": -17.94582748413086, "global_step": 12993, "epoch": 156} {"train_loss": -17.53934097290039, "global_step": 12994, "epoch": 156} {"train_loss": -18.07271385192871, "global_step": 12995, "epoch": 156} {"train_loss": -18.200780868530273, "global_step": 12996, "epoch": 156} {"train_loss": -17.974451065063477, "global_step": 12997, "epoch": 156} {"train_loss": -17.976835250854492, "global_step": 12998, "epoch": 156} {"train_loss": -17.97879409790039, "global_step": 12999, "epoch": 156} {"train_loss": -17.86423110961914, "global_step": 13000, "epoch": 156} {"train_loss": -18.25605010986328, "global_step": 13001, "epoch": 156} {"train_loss": -17.74022674560547, "global_step": 13002, "epoch": 156} {"train_loss": -18.13212013244629, "global_step": 13003, "epoch": 156} {"train_loss": -17.389516830444336, "global_step": 13004, "epoch": 156} {"train_loss": -17.666217803955078, "global_step": 13005, "epoch": 156} {"train_loss": -17.833024978637695, "global_step": 13006, "epoch": 156} {"train_loss": -18.170129776000977, "global_step": 13007, "epoch": 156} {"train_loss": -18.169692993164062, "global_step": 13008, "epoch": 156} {"train_loss": -17.976659774780273, "global_step": 13009, "epoch": 156} {"train_loss": -17.680601119995117, "global_step": 13010, "epoch": 156} {"train_loss": -17.986539840698242, "global_step": 13011, "epoch": 156} {"train_loss": -18.195066452026367, "global_step": 13012, "epoch": 156} {"train_loss": -17.93157386779785, "global_step": 13013, "epoch": 156} {"train_loss": -17.792028427124023, "global_step": 13014, "epoch": 156} {"train_loss": -17.446334838867188, "global_step": 13015, "epoch": 156} {"train_loss": -18.137876510620117, "global_step": 13016, "epoch": 156} {"train_loss": -17.922794342041016, "global_step": 13017, "epoch": 156} {"train_loss": -18.182090759277344, "global_step": 13018, "epoch": 156} {"train_loss": -17.749662399291992, "global_step": 13019, "epoch": 156} {"train_loss": -18.141098022460938, "global_step": 13020, "epoch": 156} {"train_loss": -17.879520416259766, "global_step": 13021, "epoch": 156} {"train_loss": -17.942115783691406, "global_step": 13022, "epoch": 156} {"train_loss": -18.067541122436523, "global_step": 13023, "epoch": 156} {"train_loss": -17.757980346679688, "global_step": 13024, "epoch": 156} {"train_loss": -17.862512588500977, "global_step": 13025, "epoch": 156} {"train_loss": -18.01961326599121, "global_step": 13026, "epoch": 156} {"train_loss": -18.218280792236328, "global_step": 13027, "epoch": 156} {"train_loss": -17.68758201599121, "global_step": 13028, "epoch": 156} {"train_loss": -17.737598419189453, "global_step": 13029, "epoch": 156} {"train_loss": -17.890345240213787, "global_step": 13030, "epoch": 156, "val_loss": 6187060.0} {"train_loss": -17.84317970275879, "global_step": 13031, "epoch": 157} {"train_loss": -17.81996726989746, "global_step": 13032, "epoch": 157} {"train_loss": -18.058757781982422, "global_step": 13033, "epoch": 157} {"train_loss": -17.654455184936523, "global_step": 13034, "epoch": 157} {"train_loss": -18.2871150970459, "global_step": 13035, "epoch": 157} {"train_loss": -17.904937744140625, "global_step": 13036, "epoch": 157} {"train_loss": -17.920324325561523, "global_step": 13037, "epoch": 157} {"train_loss": -18.20945930480957, "global_step": 13038, "epoch": 157} {"train_loss": -17.80238151550293, "global_step": 13039, "epoch": 157} {"train_loss": -18.040054321289062, "global_step": 13040, "epoch": 157} {"train_loss": -17.99765968322754, "global_step": 13041, "epoch": 157} {"train_loss": -17.796499252319336, "global_step": 13042, "epoch": 157} {"train_loss": -18.411893844604492, "global_step": 13043, "epoch": 157} {"train_loss": -17.98274803161621, "global_step": 13044, "epoch": 157} {"train_loss": -17.97148895263672, "global_step": 13045, "epoch": 157} {"train_loss": -18.111709594726562, "global_step": 13046, "epoch": 157} {"train_loss": -18.1529541015625, "global_step": 13047, "epoch": 157} {"train_loss": -18.264680862426758, "global_step": 13048, "epoch": 157} {"train_loss": -17.52672576904297, "global_step": 13049, "epoch": 157} {"train_loss": -17.63939094543457, "global_step": 13050, "epoch": 157} {"train_loss": -18.00432777404785, "global_step": 13051, "epoch": 157} {"train_loss": -18.083524703979492, "global_step": 13052, "epoch": 157} {"train_loss": -17.874042510986328, "global_step": 13053, "epoch": 157} {"train_loss": -18.02680206298828, "global_step": 13054, "epoch": 157} {"train_loss": -18.2359619140625, "global_step": 13055, "epoch": 157} {"train_loss": -17.813016891479492, "global_step": 13056, "epoch": 157} {"train_loss": -18.181251525878906, "global_step": 13057, "epoch": 157} {"train_loss": -17.81705093383789, "global_step": 13058, "epoch": 157} {"train_loss": -17.79644203186035, "global_step": 13059, "epoch": 157} {"train_loss": -17.920866012573242, "global_step": 13060, "epoch": 157} {"train_loss": -17.675792694091797, "global_step": 13061, "epoch": 157} {"train_loss": -18.106002807617188, "global_step": 13062, "epoch": 157} {"train_loss": -17.692867279052734, "global_step": 13063, "epoch": 157} {"train_loss": -17.82413101196289, "global_step": 13064, "epoch": 157} {"train_loss": -17.722152709960938, "global_step": 13065, "epoch": 157} {"train_loss": -18.09852409362793, "global_step": 13066, "epoch": 157} {"train_loss": -17.926481246948242, "global_step": 13067, "epoch": 157} {"train_loss": -17.860132217407227, "global_step": 13068, "epoch": 157} {"train_loss": -17.9495906829834, "global_step": 13069, "epoch": 157} {"train_loss": -18.24165916442871, "global_step": 13070, "epoch": 157} {"train_loss": -18.446531295776367, "global_step": 13071, "epoch": 157} {"train_loss": -17.807392120361328, "global_step": 13072, "epoch": 157} {"train_loss": -17.877592086791992, "global_step": 13073, "epoch": 157} {"train_loss": -18.097183227539062, "global_step": 13074, "epoch": 157} {"train_loss": -17.7609920501709, "global_step": 13075, "epoch": 157} {"train_loss": -17.63863182067871, "global_step": 13076, "epoch": 157} {"train_loss": -18.03314208984375, "global_step": 13077, "epoch": 157} {"train_loss": -18.029218673706055, "global_step": 13078, "epoch": 157} {"train_loss": -17.504606246948242, "global_step": 13079, "epoch": 157} {"train_loss": -18.49445152282715, "global_step": 13080, "epoch": 157} {"train_loss": -17.93497657775879, "global_step": 13081, "epoch": 157} {"train_loss": -17.884328842163086, "global_step": 13082, "epoch": 157} {"train_loss": -17.574750900268555, "global_step": 13083, "epoch": 157} {"train_loss": -17.86490821838379, "global_step": 13084, "epoch": 157} {"train_loss": -18.311399459838867, "global_step": 13085, "epoch": 157} {"train_loss": -18.328283309936523, "global_step": 13086, "epoch": 157} {"train_loss": -17.624021530151367, "global_step": 13087, "epoch": 157} {"train_loss": -17.91080665588379, "global_step": 13088, "epoch": 157} {"train_loss": -17.896554946899414, "global_step": 13089, "epoch": 157} {"train_loss": -17.74726676940918, "global_step": 13090, "epoch": 157} {"train_loss": -17.589111328125, "global_step": 13091, "epoch": 157} {"train_loss": -17.796537399291992, "global_step": 13092, "epoch": 157} {"train_loss": -18.069381713867188, "global_step": 13093, "epoch": 157} {"train_loss": -17.68838882446289, "global_step": 13094, "epoch": 157} {"train_loss": -17.95637321472168, "global_step": 13095, "epoch": 157} {"train_loss": -17.75038719177246, "global_step": 13096, "epoch": 157} {"train_loss": -18.07191276550293, "global_step": 13097, "epoch": 157} {"train_loss": -18.437952041625977, "global_step": 13098, "epoch": 157} {"train_loss": -17.556804656982422, "global_step": 13099, "epoch": 157} {"train_loss": -17.866762161254883, "global_step": 13100, "epoch": 157} {"train_loss": -17.4169921875, "global_step": 13101, "epoch": 157} {"train_loss": -18.06427001953125, "global_step": 13102, "epoch": 157} {"train_loss": -18.33705711364746, "global_step": 13103, "epoch": 157} {"train_loss": -18.022705078125, "global_step": 13104, "epoch": 157} {"train_loss": -18.097640991210938, "global_step": 13105, "epoch": 157} {"train_loss": -18.077802658081055, "global_step": 13106, "epoch": 157} {"train_loss": -18.02858543395996, "global_step": 13107, "epoch": 157} {"train_loss": -18.211565017700195, "global_step": 13108, "epoch": 157} {"train_loss": -17.742084503173828, "global_step": 13109, "epoch": 157} {"train_loss": -17.816659927368164, "global_step": 13110, "epoch": 157} {"train_loss": -18.068218231201172, "global_step": 13111, "epoch": 157} {"train_loss": -17.850112915039062, "global_step": 13112, "epoch": 157} {"train_loss": -17.928435291152404, "global_step": 13113, "epoch": 157, "val_loss": 6031102.0} {"train_loss": -17.841520309448242, "global_step": 13114, "epoch": 158} {"train_loss": -17.768156051635742, "global_step": 13115, "epoch": 158} {"train_loss": -17.684595108032227, "global_step": 13116, "epoch": 158} {"train_loss": -17.720727920532227, "global_step": 13117, "epoch": 158} {"train_loss": -17.121408462524414, "global_step": 13118, "epoch": 158} {"train_loss": -17.86952018737793, "global_step": 13119, "epoch": 158} {"train_loss": -17.756376266479492, "global_step": 13120, "epoch": 158} {"train_loss": -17.80916976928711, "global_step": 13121, "epoch": 158} {"train_loss": -17.584821701049805, "global_step": 13122, "epoch": 158} {"train_loss": -17.892343521118164, "global_step": 13123, "epoch": 158} {"train_loss": -17.683279037475586, "global_step": 13124, "epoch": 158} {"train_loss": -17.497812271118164, "global_step": 13125, "epoch": 158} {"train_loss": -17.933908462524414, "global_step": 13126, "epoch": 158} {"train_loss": -17.664432525634766, "global_step": 13127, "epoch": 158} {"train_loss": -17.92435073852539, "global_step": 13128, "epoch": 158} {"train_loss": -17.93057632446289, "global_step": 13129, "epoch": 158} {"train_loss": -18.275495529174805, "global_step": 13130, "epoch": 158} {"train_loss": -17.889352798461914, "global_step": 13131, "epoch": 158} {"train_loss": -17.99126625061035, "global_step": 13132, "epoch": 158} {"train_loss": -18.13652992248535, "global_step": 13133, "epoch": 158} {"train_loss": -17.914430618286133, "global_step": 13134, "epoch": 158} {"train_loss": -17.88956642150879, "global_step": 13135, "epoch": 158} {"train_loss": -17.834548950195312, "global_step": 13136, "epoch": 158} {"train_loss": -17.95953941345215, "global_step": 13137, "epoch": 158} {"train_loss": -17.981374740600586, "global_step": 13138, "epoch": 158} {"train_loss": -18.17466163635254, "global_step": 13139, "epoch": 158} {"train_loss": -17.804691314697266, "global_step": 13140, "epoch": 158} {"train_loss": -17.878183364868164, "global_step": 13141, "epoch": 158} {"train_loss": -17.775691986083984, "global_step": 13142, "epoch": 158} {"train_loss": -18.105371475219727, "global_step": 13143, "epoch": 158} {"train_loss": -18.29706382751465, "global_step": 13144, "epoch": 158} {"train_loss": -18.078580856323242, "global_step": 13145, "epoch": 158} {"train_loss": -18.140798568725586, "global_step": 13146, "epoch": 158} {"train_loss": -17.968149185180664, "global_step": 13147, "epoch": 158} {"train_loss": -18.14889907836914, "global_step": 13148, "epoch": 158} {"train_loss": -17.58409309387207, "global_step": 13149, "epoch": 158} {"train_loss": -18.010257720947266, "global_step": 13150, "epoch": 158} {"train_loss": -17.930143356323242, "global_step": 13151, "epoch": 158} {"train_loss": -17.85934829711914, "global_step": 13152, "epoch": 158} {"train_loss": -17.954240798950195, "global_step": 13153, "epoch": 158} {"train_loss": -17.763700485229492, "global_step": 13154, "epoch": 158} {"train_loss": -17.959569931030273, "global_step": 13155, "epoch": 158} {"train_loss": -17.818370819091797, "global_step": 13156, "epoch": 158} {"train_loss": -18.443151473999023, "global_step": 13157, "epoch": 158} {"train_loss": -17.90995979309082, "global_step": 13158, "epoch": 158} {"train_loss": -17.672306060791016, "global_step": 13159, "epoch": 158} {"train_loss": -17.759727478027344, "global_step": 13160, "epoch": 158} {"train_loss": -17.898101806640625, "global_step": 13161, "epoch": 158} {"train_loss": -17.972949981689453, "global_step": 13162, "epoch": 158} {"train_loss": -17.8447265625, "global_step": 13163, "epoch": 158} {"train_loss": -17.78555679321289, "global_step": 13164, "epoch": 158} {"train_loss": -18.096479415893555, "global_step": 13165, "epoch": 158} {"train_loss": -17.88155174255371, "global_step": 13166, "epoch": 158} {"train_loss": -18.097299575805664, "global_step": 13167, "epoch": 158} {"train_loss": -17.543729782104492, "global_step": 13168, "epoch": 158} {"train_loss": -17.957656860351562, "global_step": 13169, "epoch": 158} {"train_loss": -17.826505661010742, "global_step": 13170, "epoch": 158} {"train_loss": -17.92061424255371, "global_step": 13171, "epoch": 158} {"train_loss": -17.9820556640625, "global_step": 13172, "epoch": 158} {"train_loss": -17.997072219848633, "global_step": 13173, "epoch": 158} {"train_loss": -18.263229370117188, "global_step": 13174, "epoch": 158} {"train_loss": -18.24104881286621, "global_step": 13175, "epoch": 158} {"train_loss": -18.13384437561035, "global_step": 13176, "epoch": 158} {"train_loss": -18.11867332458496, "global_step": 13177, "epoch": 158} {"train_loss": -17.790077209472656, "global_step": 13178, "epoch": 158} {"train_loss": -17.954875946044922, "global_step": 13179, "epoch": 158} {"train_loss": -17.892526626586914, "global_step": 13180, "epoch": 158} {"train_loss": -18.151456832885742, "global_step": 13181, "epoch": 158} {"train_loss": -17.956932067871094, "global_step": 13182, "epoch": 158} {"train_loss": -17.979406356811523, "global_step": 13183, "epoch": 158} {"train_loss": -17.93549919128418, "global_step": 13184, "epoch": 158} {"train_loss": -17.974956512451172, "global_step": 13185, "epoch": 158} {"train_loss": -17.661575317382812, "global_step": 13186, "epoch": 158} {"train_loss": -17.6768856048584, "global_step": 13187, "epoch": 158} {"train_loss": -17.569608688354492, "global_step": 13188, "epoch": 158} {"train_loss": -18.26104164123535, "global_step": 13189, "epoch": 158} {"train_loss": -17.87671661376953, "global_step": 13190, "epoch": 158} {"train_loss": -18.314401626586914, "global_step": 13191, "epoch": 158} {"train_loss": -18.026700973510742, "global_step": 13192, "epoch": 158} {"train_loss": -18.068470001220703, "global_step": 13193, "epoch": 158} {"train_loss": -18.377851486206055, "global_step": 13194, "epoch": 158} {"train_loss": -18.038917541503906, "global_step": 13195, "epoch": 158} {"train_loss": -17.922265018325255, "global_step": 13196, "epoch": 158, "val_loss": 6200180.0} {"train_loss": -17.99140739440918, "global_step": 13197, "epoch": 159} {"train_loss": -17.842018127441406, "global_step": 13198, "epoch": 159} {"train_loss": -17.915632247924805, "global_step": 13199, "epoch": 159} {"train_loss": -18.0474796295166, "global_step": 13200, "epoch": 159} {"train_loss": -17.618261337280273, "global_step": 13201, "epoch": 159} {"train_loss": -17.699352264404297, "global_step": 13202, "epoch": 159} {"train_loss": -17.87776756286621, "global_step": 13203, "epoch": 159} {"train_loss": -17.68123435974121, "global_step": 13204, "epoch": 159} {"train_loss": -17.961380004882812, "global_step": 13205, "epoch": 159} {"train_loss": -17.8804988861084, "global_step": 13206, "epoch": 159} {"train_loss": -18.024717330932617, "global_step": 13207, "epoch": 159} {"train_loss": -18.003063201904297, "global_step": 13208, "epoch": 159} {"train_loss": -17.59901237487793, "global_step": 13209, "epoch": 159} {"train_loss": -17.686796188354492, "global_step": 13210, "epoch": 159} {"train_loss": -18.208288192749023, "global_step": 13211, "epoch": 159} {"train_loss": -18.142139434814453, "global_step": 13212, "epoch": 159} {"train_loss": -18.053930282592773, "global_step": 13213, "epoch": 159} {"train_loss": -18.0054874420166, "global_step": 13214, "epoch": 159} {"train_loss": -18.34455680847168, "global_step": 13215, "epoch": 159} {"train_loss": -17.744455337524414, "global_step": 13216, "epoch": 159} {"train_loss": -17.864887237548828, "global_step": 13217, "epoch": 159} {"train_loss": -18.243009567260742, "global_step": 13218, "epoch": 159} {"train_loss": -18.141403198242188, "global_step": 13219, "epoch": 159} {"train_loss": -17.42963981628418, "global_step": 13220, "epoch": 159} {"train_loss": -17.719654083251953, "global_step": 13221, "epoch": 159} {"train_loss": -18.146726608276367, "global_step": 13222, "epoch": 159} {"train_loss": -17.858423233032227, "global_step": 13223, "epoch": 159} {"train_loss": -17.81754493713379, "global_step": 13224, "epoch": 159} {"train_loss": -18.324430465698242, "global_step": 13225, "epoch": 159} {"train_loss": -17.81597328186035, "global_step": 13226, "epoch": 159} {"train_loss": -17.89903450012207, "global_step": 13227, "epoch": 159} {"train_loss": -17.945409774780273, "global_step": 13228, "epoch": 159} {"train_loss": -17.82459831237793, "global_step": 13229, "epoch": 159} {"train_loss": -18.11793327331543, "global_step": 13230, "epoch": 159} {"train_loss": -17.804601669311523, "global_step": 13231, "epoch": 159} {"train_loss": -17.810169219970703, "global_step": 13232, "epoch": 159} {"train_loss": -18.001422882080078, "global_step": 13233, "epoch": 159} {"train_loss": -18.09450340270996, "global_step": 13234, "epoch": 159} {"train_loss": -18.389577865600586, "global_step": 13235, "epoch": 159} {"train_loss": -17.82498550415039, "global_step": 13236, "epoch": 159} {"train_loss": -17.81842613220215, "global_step": 13237, "epoch": 159} {"train_loss": -17.89423179626465, "global_step": 13238, "epoch": 159} {"train_loss": -17.880859375, "global_step": 13239, "epoch": 159} {"train_loss": -18.092954635620117, "global_step": 13240, "epoch": 159} {"train_loss": -17.934595108032227, "global_step": 13241, "epoch": 159} {"train_loss": -18.22783660888672, "global_step": 13242, "epoch": 159} {"train_loss": -17.993125915527344, "global_step": 13243, "epoch": 159} {"train_loss": -18.02802085876465, "global_step": 13244, "epoch": 159} {"train_loss": -17.933340072631836, "global_step": 13245, "epoch": 159} {"train_loss": -18.29261589050293, "global_step": 13246, "epoch": 159} {"train_loss": -18.13232421875, "global_step": 13247, "epoch": 159} {"train_loss": -17.845504760742188, "global_step": 13248, "epoch": 159} {"train_loss": -17.98529815673828, "global_step": 13249, "epoch": 159} {"train_loss": -17.8449764251709, "global_step": 13250, "epoch": 159} {"train_loss": -17.7021484375, "global_step": 13251, "epoch": 159} {"train_loss": -18.199491500854492, "global_step": 13252, "epoch": 159} {"train_loss": -18.196317672729492, "global_step": 13253, "epoch": 159} {"train_loss": -17.97019386291504, "global_step": 13254, "epoch": 159} {"train_loss": -17.891803741455078, "global_step": 13255, "epoch": 159} {"train_loss": -18.423904418945312, "global_step": 13256, "epoch": 159} {"train_loss": -18.085050582885742, "global_step": 13257, "epoch": 159} {"train_loss": -17.964984893798828, "global_step": 13258, "epoch": 159} {"train_loss": -18.375497817993164, "global_step": 13259, "epoch": 159} {"train_loss": -17.99966049194336, "global_step": 13260, "epoch": 159} {"train_loss": -17.389015197753906, "global_step": 13261, "epoch": 159} {"train_loss": -18.4154052734375, "global_step": 13262, "epoch": 159} {"train_loss": -18.178089141845703, "global_step": 13263, "epoch": 159} {"train_loss": -17.865354537963867, "global_step": 13264, "epoch": 159} {"train_loss": -17.858745574951172, "global_step": 13265, "epoch": 159} {"train_loss": -17.870136260986328, "global_step": 13266, "epoch": 159} {"train_loss": -17.797353744506836, "global_step": 13267, "epoch": 159} {"train_loss": -17.66693687438965, "global_step": 13268, "epoch": 159} {"train_loss": -18.179895401000977, "global_step": 13269, "epoch": 159} {"train_loss": -17.783416748046875, "global_step": 13270, "epoch": 159} {"train_loss": -17.714731216430664, "global_step": 13271, "epoch": 159} {"train_loss": -17.693662643432617, "global_step": 13272, "epoch": 159} {"train_loss": -18.018741607666016, "global_step": 13273, "epoch": 159} {"train_loss": -17.842744827270508, "global_step": 13274, "epoch": 159} {"train_loss": -18.262557983398438, "global_step": 13275, "epoch": 159} {"train_loss": -17.55942726135254, "global_step": 13276, "epoch": 159} {"train_loss": -18.503278732299805, "global_step": 13277, "epoch": 159} {"train_loss": -17.735393524169922, "global_step": 13278, "epoch": 159} {"train_loss": -17.952691710138897, "global_step": 13279, "epoch": 159, "val_loss": 6134606.0} {"train_loss": -17.740331649780273, "global_step": 13280, "epoch": 160} {"train_loss": -17.95180892944336, "global_step": 13281, "epoch": 160} {"train_loss": -17.776052474975586, "global_step": 13282, "epoch": 160} {"train_loss": -17.859237670898438, "global_step": 13283, "epoch": 160} {"train_loss": -17.95039176940918, "global_step": 13284, "epoch": 160} {"train_loss": -17.772876739501953, "global_step": 13285, "epoch": 160} {"train_loss": -17.957773208618164, "global_step": 13286, "epoch": 160} {"train_loss": -17.54459571838379, "global_step": 13287, "epoch": 160} {"train_loss": -17.879833221435547, "global_step": 13288, "epoch": 160} {"train_loss": -18.531204223632812, "global_step": 13289, "epoch": 160} {"train_loss": -17.774160385131836, "global_step": 13290, "epoch": 160} {"train_loss": -17.244518280029297, "global_step": 13291, "epoch": 160} {"train_loss": -18.131593704223633, "global_step": 13292, "epoch": 160} {"train_loss": -17.9541015625, "global_step": 13293, "epoch": 160} {"train_loss": -17.943744659423828, "global_step": 13294, "epoch": 160} {"train_loss": -17.56707763671875, "global_step": 13295, "epoch": 160} {"train_loss": -18.041196823120117, "global_step": 13296, "epoch": 160} {"train_loss": -17.930456161499023, "global_step": 13297, "epoch": 160} {"train_loss": -17.87758445739746, "global_step": 13298, "epoch": 160} {"train_loss": -17.964990615844727, "global_step": 13299, "epoch": 160} {"train_loss": -17.552698135375977, "global_step": 13300, "epoch": 160} {"train_loss": -18.211904525756836, "global_step": 13301, "epoch": 160} {"train_loss": -17.980697631835938, "global_step": 13302, "epoch": 160} {"train_loss": -18.229297637939453, "global_step": 13303, "epoch": 160} {"train_loss": -18.203298568725586, "global_step": 13304, "epoch": 160} {"train_loss": -18.13382339477539, "global_step": 13305, "epoch": 160} {"train_loss": -17.590316772460938, "global_step": 13306, "epoch": 160} {"train_loss": -17.869455337524414, "global_step": 13307, "epoch": 160} {"train_loss": -18.17083168029785, "global_step": 13308, "epoch": 160} {"train_loss": -18.058286666870117, "global_step": 13309, "epoch": 160} {"train_loss": -18.148696899414062, "global_step": 13310, "epoch": 160} {"train_loss": -18.01393699645996, "global_step": 13311, "epoch": 160} {"train_loss": -18.18311882019043, "global_step": 13312, "epoch": 160} {"train_loss": -18.121957778930664, "global_step": 13313, "epoch": 160} {"train_loss": -18.10353660583496, "global_step": 13314, "epoch": 160} {"train_loss": -17.74525260925293, "global_step": 13315, "epoch": 160} {"train_loss": -17.787893295288086, "global_step": 13316, "epoch": 160} {"train_loss": -17.954301834106445, "global_step": 13317, "epoch": 160} {"train_loss": -17.666501998901367, "global_step": 13318, "epoch": 160} {"train_loss": -18.255064010620117, "global_step": 13319, "epoch": 160} {"train_loss": -17.92098617553711, "global_step": 13320, "epoch": 160} {"train_loss": -17.524934768676758, "global_step": 13321, "epoch": 160} {"train_loss": -18.402311325073242, "global_step": 13322, "epoch": 160} {"train_loss": -18.044301986694336, "global_step": 13323, "epoch": 160} {"train_loss": -18.133554458618164, "global_step": 13324, "epoch": 160} {"train_loss": -18.188810348510742, "global_step": 13325, "epoch": 160} {"train_loss": -18.027894973754883, "global_step": 13326, "epoch": 160} {"train_loss": -18.197010040283203, "global_step": 13327, "epoch": 160} {"train_loss": -17.950435638427734, "global_step": 13328, "epoch": 160} {"train_loss": -18.030868530273438, "global_step": 13329, "epoch": 160} {"train_loss": -18.094985961914062, "global_step": 13330, "epoch": 160} {"train_loss": -17.683433532714844, "global_step": 13331, "epoch": 160} {"train_loss": -18.15027618408203, "global_step": 13332, "epoch": 160} {"train_loss": -17.799386978149414, "global_step": 13333, "epoch": 160} {"train_loss": -17.924076080322266, "global_step": 13334, "epoch": 160} {"train_loss": -18.132383346557617, "global_step": 13335, "epoch": 160} {"train_loss": -18.18052101135254, "global_step": 13336, "epoch": 160} {"train_loss": -18.128555297851562, "global_step": 13337, "epoch": 160} {"train_loss": -17.902029037475586, "global_step": 13338, "epoch": 160} {"train_loss": -17.66315460205078, "global_step": 13339, "epoch": 160} {"train_loss": -17.963125228881836, "global_step": 13340, "epoch": 160} {"train_loss": -17.272363662719727, "global_step": 13341, "epoch": 160} {"train_loss": -17.734357833862305, "global_step": 13342, "epoch": 160} {"train_loss": -17.974130630493164, "global_step": 13343, "epoch": 160} {"train_loss": -18.01031494140625, "global_step": 13344, "epoch": 160} {"train_loss": -17.807178497314453, "global_step": 13345, "epoch": 160} {"train_loss": -18.21795082092285, "global_step": 13346, "epoch": 160} {"train_loss": -17.94046401977539, "global_step": 13347, "epoch": 160} {"train_loss": -17.788562774658203, "global_step": 13348, "epoch": 160} {"train_loss": -18.009668350219727, "global_step": 13349, "epoch": 160} {"train_loss": -17.906518936157227, "global_step": 13350, "epoch": 160} {"train_loss": -17.8137149810791, "global_step": 13351, "epoch": 160} {"train_loss": -18.128393173217773, "global_step": 13352, "epoch": 160} {"train_loss": -17.708215713500977, "global_step": 13353, "epoch": 160} {"train_loss": -18.320371627807617, "global_step": 13354, "epoch": 160} {"train_loss": -18.249923706054688, "global_step": 13355, "epoch": 160} {"train_loss": -18.32755470275879, "global_step": 13356, "epoch": 160} {"train_loss": -18.05643653869629, "global_step": 13357, "epoch": 160} {"train_loss": -17.9456787109375, "global_step": 13358, "epoch": 160} {"train_loss": -17.74912452697754, "global_step": 13359, "epoch": 160} {"train_loss": -17.861494064331055, "global_step": 13360, "epoch": 160} {"train_loss": -17.864377975463867, "global_step": 13361, "epoch": 160} {"train_loss": -17.955955919012965, "global_step": 13362, "epoch": 160, "val_loss": 6130065.0} {"train_loss": -17.55474853515625, "global_step": 13363, "epoch": 161} {"train_loss": -17.896696090698242, "global_step": 13364, "epoch": 161} {"train_loss": -17.99263572692871, "global_step": 13365, "epoch": 161} {"train_loss": -18.186349868774414, "global_step": 13366, "epoch": 161} {"train_loss": -18.177637100219727, "global_step": 13367, "epoch": 161} {"train_loss": -17.860668182373047, "global_step": 13368, "epoch": 161} {"train_loss": -17.83381462097168, "global_step": 13369, "epoch": 161} {"train_loss": -17.85159683227539, "global_step": 13370, "epoch": 161} {"train_loss": -17.9422664642334, "global_step": 13371, "epoch": 161} {"train_loss": -17.567541122436523, "global_step": 13372, "epoch": 161} {"train_loss": -17.856426239013672, "global_step": 13373, "epoch": 161} {"train_loss": -18.053298950195312, "global_step": 13374, "epoch": 161} {"train_loss": -17.958724975585938, "global_step": 13375, "epoch": 161} {"train_loss": -17.949743270874023, "global_step": 13376, "epoch": 161} {"train_loss": -17.611042022705078, "global_step": 13377, "epoch": 161} {"train_loss": -17.8858585357666, "global_step": 13378, "epoch": 161} {"train_loss": -18.194900512695312, "global_step": 13379, "epoch": 161} {"train_loss": -17.738388061523438, "global_step": 13380, "epoch": 161} {"train_loss": -18.023950576782227, "global_step": 13381, "epoch": 161} {"train_loss": -17.934207916259766, "global_step": 13382, "epoch": 161} {"train_loss": -17.69758415222168, "global_step": 13383, "epoch": 161} {"train_loss": -18.3348331451416, "global_step": 13384, "epoch": 161} {"train_loss": -17.885038375854492, "global_step": 13385, "epoch": 161} {"train_loss": -17.69057846069336, "global_step": 13386, "epoch": 161} {"train_loss": -17.728384017944336, "global_step": 13387, "epoch": 161} {"train_loss": -17.936201095581055, "global_step": 13388, "epoch": 161} {"train_loss": -17.706464767456055, "global_step": 13389, "epoch": 161} {"train_loss": -17.92275047302246, "global_step": 13390, "epoch": 161} {"train_loss": -18.305326461791992, "global_step": 13391, "epoch": 161} {"train_loss": -18.200342178344727, "global_step": 13392, "epoch": 161} {"train_loss": -17.65558433532715, "global_step": 13393, "epoch": 161} {"train_loss": -17.534669876098633, "global_step": 13394, "epoch": 161} {"train_loss": -18.29581069946289, "global_step": 13395, "epoch": 161} {"train_loss": -17.39518165588379, "global_step": 13396, "epoch": 161} {"train_loss": -17.820804595947266, "global_step": 13397, "epoch": 161} {"train_loss": -18.17350196838379, "global_step": 13398, "epoch": 161} {"train_loss": -17.95978546142578, "global_step": 13399, "epoch": 161} {"train_loss": -17.695575714111328, "global_step": 13400, "epoch": 161} {"train_loss": -17.443729400634766, "global_step": 13401, "epoch": 161} {"train_loss": -18.125539779663086, "global_step": 13402, "epoch": 161} {"train_loss": -17.876466751098633, "global_step": 13403, "epoch": 161} {"train_loss": -17.888439178466797, "global_step": 13404, "epoch": 161} {"train_loss": -18.177705764770508, "global_step": 13405, "epoch": 161} {"train_loss": -17.776235580444336, "global_step": 13406, "epoch": 161} {"train_loss": -18.22691535949707, "global_step": 13407, "epoch": 161} {"train_loss": -18.054443359375, "global_step": 13408, "epoch": 161} {"train_loss": -18.17209815979004, "global_step": 13409, "epoch": 161} {"train_loss": -18.082889556884766, "global_step": 13410, "epoch": 161} {"train_loss": -17.513423919677734, "global_step": 13411, "epoch": 161} {"train_loss": -18.017168045043945, "global_step": 13412, "epoch": 161} {"train_loss": -18.205780029296875, "global_step": 13413, "epoch": 161} {"train_loss": -17.67642593383789, "global_step": 13414, "epoch": 161} {"train_loss": -18.110410690307617, "global_step": 13415, "epoch": 161} {"train_loss": -18.061935424804688, "global_step": 13416, "epoch": 161} {"train_loss": -17.801298141479492, "global_step": 13417, "epoch": 161} {"train_loss": -17.85203742980957, "global_step": 13418, "epoch": 161} {"train_loss": -17.896718978881836, "global_step": 13419, "epoch": 161} {"train_loss": -18.020139694213867, "global_step": 13420, "epoch": 161} {"train_loss": -18.205671310424805, "global_step": 13421, "epoch": 161} {"train_loss": -18.0989990234375, "global_step": 13422, "epoch": 161} {"train_loss": -18.03450584411621, "global_step": 13423, "epoch": 161} {"train_loss": -17.658000946044922, "global_step": 13424, "epoch": 161} {"train_loss": -17.776315689086914, "global_step": 13425, "epoch": 161} {"train_loss": -18.245962142944336, "global_step": 13426, "epoch": 161} {"train_loss": -17.89471435546875, "global_step": 13427, "epoch": 161} {"train_loss": -17.864730834960938, "global_step": 13428, "epoch": 161} {"train_loss": -17.8568058013916, "global_step": 13429, "epoch": 161} {"train_loss": -17.813587188720703, "global_step": 13430, "epoch": 161} {"train_loss": -17.97962760925293, "global_step": 13431, "epoch": 161} {"train_loss": -18.134660720825195, "global_step": 13432, "epoch": 161} {"train_loss": -18.146474838256836, "global_step": 13433, "epoch": 161} {"train_loss": -18.012243270874023, "global_step": 13434, "epoch": 161} {"train_loss": -18.115629196166992, "global_step": 13435, "epoch": 161} {"train_loss": -17.796375274658203, "global_step": 13436, "epoch": 161} {"train_loss": -18.11258888244629, "global_step": 13437, "epoch": 161} {"train_loss": -18.52338981628418, "global_step": 13438, "epoch": 161} {"train_loss": -17.878219604492188, "global_step": 13439, "epoch": 161} {"train_loss": -18.398977279663086, "global_step": 13440, "epoch": 161} {"train_loss": -18.05348014831543, "global_step": 13441, "epoch": 161} {"train_loss": -17.8281307220459, "global_step": 13442, "epoch": 161} {"train_loss": -18.198503494262695, "global_step": 13443, "epoch": 161} {"train_loss": -17.893590927124023, "global_step": 13444, "epoch": 161} {"train_loss": -17.93297360891319, "global_step": 13445, "epoch": 161, "val_loss": 6202804.0} {"train_loss": -17.909183502197266, "global_step": 13446, "epoch": 162} {"train_loss": -17.372058868408203, "global_step": 13447, "epoch": 162} {"train_loss": -17.58232307434082, "global_step": 13448, "epoch": 162} {"train_loss": -17.604211807250977, "global_step": 13449, "epoch": 162} {"train_loss": -17.490203857421875, "global_step": 13450, "epoch": 162} {"train_loss": -17.756315231323242, "global_step": 13451, "epoch": 162} {"train_loss": -17.953554153442383, "global_step": 13452, "epoch": 162} {"train_loss": -17.906856536865234, "global_step": 13453, "epoch": 162} {"train_loss": -17.459680557250977, "global_step": 13454, "epoch": 162} {"train_loss": -17.972274780273438, "global_step": 13455, "epoch": 162} {"train_loss": -17.74226188659668, "global_step": 13456, "epoch": 162} {"train_loss": -18.09498405456543, "global_step": 13457, "epoch": 162} {"train_loss": -17.98120880126953, "global_step": 13458, "epoch": 162} {"train_loss": -17.921592712402344, "global_step": 13459, "epoch": 162} {"train_loss": -18.07633399963379, "global_step": 13460, "epoch": 162} {"train_loss": -17.541345596313477, "global_step": 13461, "epoch": 162} {"train_loss": -17.610702514648438, "global_step": 13462, "epoch": 162} {"train_loss": -17.623260498046875, "global_step": 13463, "epoch": 162} {"train_loss": -17.81329917907715, "global_step": 13464, "epoch": 162} {"train_loss": -18.042943954467773, "global_step": 13465, "epoch": 162} {"train_loss": -17.975021362304688, "global_step": 13466, "epoch": 162} {"train_loss": -17.896085739135742, "global_step": 13467, "epoch": 162} {"train_loss": -17.853002548217773, "global_step": 13468, "epoch": 162} {"train_loss": -17.750171661376953, "global_step": 13469, "epoch": 162} {"train_loss": -18.227943420410156, "global_step": 13470, "epoch": 162} {"train_loss": -18.064956665039062, "global_step": 13471, "epoch": 162} {"train_loss": -18.11696434020996, "global_step": 13472, "epoch": 162} {"train_loss": -17.952260971069336, "global_step": 13473, "epoch": 162} {"train_loss": -17.9913272857666, "global_step": 13474, "epoch": 162} {"train_loss": -18.247501373291016, "global_step": 13475, "epoch": 162} {"train_loss": -17.9249324798584, "global_step": 13476, "epoch": 162} {"train_loss": -18.15330696105957, "global_step": 13477, "epoch": 162} {"train_loss": -17.761865615844727, "global_step": 13478, "epoch": 162} {"train_loss": -18.17179298400879, "global_step": 13479, "epoch": 162} {"train_loss": -17.839736938476562, "global_step": 13480, "epoch": 162} {"train_loss": -18.207252502441406, "global_step": 13481, "epoch": 162} {"train_loss": -18.05964469909668, "global_step": 13482, "epoch": 162} {"train_loss": -18.087318420410156, "global_step": 13483, "epoch": 162} {"train_loss": -18.17179298400879, "global_step": 13484, "epoch": 162} {"train_loss": -17.97370719909668, "global_step": 13485, "epoch": 162} {"train_loss": -17.783178329467773, "global_step": 13486, "epoch": 162} {"train_loss": -17.849172592163086, "global_step": 13487, "epoch": 162} {"train_loss": -17.62563133239746, "global_step": 13488, "epoch": 162} {"train_loss": -17.883081436157227, "global_step": 13489, "epoch": 162} {"train_loss": -18.067785263061523, "global_step": 13490, "epoch": 162} {"train_loss": -18.09738540649414, "global_step": 13491, "epoch": 162} {"train_loss": -17.894447326660156, "global_step": 13492, "epoch": 162} {"train_loss": -18.161823272705078, "global_step": 13493, "epoch": 162} {"train_loss": -17.8808650970459, "global_step": 13494, "epoch": 162} {"train_loss": -18.363527297973633, "global_step": 13495, "epoch": 162} {"train_loss": -17.650981903076172, "global_step": 13496, "epoch": 162} {"train_loss": -17.994951248168945, "global_step": 13497, "epoch": 162} {"train_loss": -18.286407470703125, "global_step": 13498, "epoch": 162} {"train_loss": -18.255741119384766, "global_step": 13499, "epoch": 162} {"train_loss": -18.023488998413086, "global_step": 13500, "epoch": 162} {"train_loss": -17.924726486206055, "global_step": 13501, "epoch": 162} {"train_loss": -17.829442977905273, "global_step": 13502, "epoch": 162} {"train_loss": -18.017911911010742, "global_step": 13503, "epoch": 162} {"train_loss": -18.043996810913086, "global_step": 13504, "epoch": 162} {"train_loss": -17.92987060546875, "global_step": 13505, "epoch": 162} {"train_loss": -17.76586151123047, "global_step": 13506, "epoch": 162} {"train_loss": -17.812332153320312, "global_step": 13507, "epoch": 162} {"train_loss": -18.00261878967285, "global_step": 13508, "epoch": 162} {"train_loss": -18.251909255981445, "global_step": 13509, "epoch": 162} {"train_loss": -17.766021728515625, "global_step": 13510, "epoch": 162} {"train_loss": -18.059795379638672, "global_step": 13511, "epoch": 162} {"train_loss": -18.074872970581055, "global_step": 13512, "epoch": 162} {"train_loss": -17.91381072998047, "global_step": 13513, "epoch": 162} {"train_loss": -17.857421875, "global_step": 13514, "epoch": 162} {"train_loss": -17.667011260986328, "global_step": 13515, "epoch": 162} {"train_loss": -17.96760368347168, "global_step": 13516, "epoch": 162} {"train_loss": -17.858808517456055, "global_step": 13517, "epoch": 162} {"train_loss": -18.466312408447266, "global_step": 13518, "epoch": 162} {"train_loss": -18.21088218688965, "global_step": 13519, "epoch": 162} {"train_loss": -17.94771385192871, "global_step": 13520, "epoch": 162} {"train_loss": -18.09567642211914, "global_step": 13521, "epoch": 162} {"train_loss": -17.712066650390625, "global_step": 13522, "epoch": 162} {"train_loss": -18.05966567993164, "global_step": 13523, "epoch": 162} {"train_loss": -17.903676986694336, "global_step": 13524, "epoch": 162} {"train_loss": -17.90092658996582, "global_step": 13525, "epoch": 162} {"train_loss": -17.782203674316406, "global_step": 13526, "epoch": 162} {"train_loss": -17.808494567871094, "global_step": 13527, "epoch": 162} {"train_loss": -17.91988653160003, "global_step": 13528, "epoch": 162, "val_loss": 6176880.0} {"train_loss": -18.074369430541992, "global_step": 13529, "epoch": 163} {"train_loss": -17.78281593322754, "global_step": 13530, "epoch": 163} {"train_loss": -17.919530868530273, "global_step": 13531, "epoch": 163} {"train_loss": -17.528501510620117, "global_step": 13532, "epoch": 163} {"train_loss": -17.29562759399414, "global_step": 13533, "epoch": 163} {"train_loss": -17.548725128173828, "global_step": 13534, "epoch": 163} {"train_loss": -17.699331283569336, "global_step": 13535, "epoch": 163} {"train_loss": -17.8418025970459, "global_step": 13536, "epoch": 163} {"train_loss": -18.123044967651367, "global_step": 13537, "epoch": 163} {"train_loss": -17.750167846679688, "global_step": 13538, "epoch": 163} {"train_loss": -17.7479248046875, "global_step": 13539, "epoch": 163} {"train_loss": -18.201828002929688, "global_step": 13540, "epoch": 163} {"train_loss": -17.86830711364746, "global_step": 13541, "epoch": 163} {"train_loss": -17.978376388549805, "global_step": 13542, "epoch": 163} {"train_loss": -18.1108455657959, "global_step": 13543, "epoch": 163} {"train_loss": -17.708820343017578, "global_step": 13544, "epoch": 163} {"train_loss": -18.14089584350586, "global_step": 13545, "epoch": 163} {"train_loss": -18.104232788085938, "global_step": 13546, "epoch": 163} {"train_loss": -17.930824279785156, "global_step": 13547, "epoch": 163} {"train_loss": -18.264575958251953, "global_step": 13548, "epoch": 163} {"train_loss": -18.3363094329834, "global_step": 13549, "epoch": 163} {"train_loss": -18.013866424560547, "global_step": 13550, "epoch": 163} {"train_loss": -17.4858455657959, "global_step": 13551, "epoch": 163} {"train_loss": -18.2069034576416, "global_step": 13552, "epoch": 163} {"train_loss": -18.179637908935547, "global_step": 13553, "epoch": 163} {"train_loss": -18.11979103088379, "global_step": 13554, "epoch": 163} {"train_loss": -17.98678970336914, "global_step": 13555, "epoch": 163} {"train_loss": -18.271299362182617, "global_step": 13556, "epoch": 163} {"train_loss": -17.55351448059082, "global_step": 13557, "epoch": 163} {"train_loss": -18.20100212097168, "global_step": 13558, "epoch": 163} {"train_loss": -18.06112289428711, "global_step": 13559, "epoch": 163} {"train_loss": -17.7382869720459, "global_step": 13560, "epoch": 163} {"train_loss": -17.927730560302734, "global_step": 13561, "epoch": 163} {"train_loss": -17.978160858154297, "global_step": 13562, "epoch": 163} {"train_loss": -17.838821411132812, "global_step": 13563, "epoch": 163} {"train_loss": -18.127939224243164, "global_step": 13564, "epoch": 163} {"train_loss": -17.617887496948242, "global_step": 13565, "epoch": 163} {"train_loss": -17.66631317138672, "global_step": 13566, "epoch": 163} {"train_loss": -17.848857879638672, "global_step": 13567, "epoch": 163} {"train_loss": -17.691553115844727, "global_step": 13568, "epoch": 163} {"train_loss": -17.90236473083496, "global_step": 13569, "epoch": 163} {"train_loss": -18.246234893798828, "global_step": 13570, "epoch": 163} {"train_loss": -18.1008243560791, "global_step": 13571, "epoch": 163} {"train_loss": -18.033252716064453, "global_step": 13572, "epoch": 163} {"train_loss": -18.013296127319336, "global_step": 13573, "epoch": 163} {"train_loss": -17.89349937438965, "global_step": 13574, "epoch": 163} {"train_loss": -17.600278854370117, "global_step": 13575, "epoch": 163} {"train_loss": -18.18479347229004, "global_step": 13576, "epoch": 163} {"train_loss": -17.983205795288086, "global_step": 13577, "epoch": 163} {"train_loss": -17.814010620117188, "global_step": 13578, "epoch": 163} {"train_loss": -18.004186630249023, "global_step": 13579, "epoch": 163} {"train_loss": -17.957775115966797, "global_step": 13580, "epoch": 163} {"train_loss": -18.209613800048828, "global_step": 13581, "epoch": 163} {"train_loss": -17.92589569091797, "global_step": 13582, "epoch": 163} {"train_loss": -18.1556453704834, "global_step": 13583, "epoch": 163} {"train_loss": -18.130558013916016, "global_step": 13584, "epoch": 163} {"train_loss": -17.7006893157959, "global_step": 13585, "epoch": 163} {"train_loss": -17.978076934814453, "global_step": 13586, "epoch": 163} {"train_loss": -17.982580184936523, "global_step": 13587, "epoch": 163} {"train_loss": -17.932296752929688, "global_step": 13588, "epoch": 163} {"train_loss": -18.154766082763672, "global_step": 13589, "epoch": 163} {"train_loss": -17.803003311157227, "global_step": 13590, "epoch": 163} {"train_loss": -18.108991622924805, "global_step": 13591, "epoch": 163} {"train_loss": -17.53143310546875, "global_step": 13592, "epoch": 163} {"train_loss": -18.423505783081055, "global_step": 13593, "epoch": 163} {"train_loss": -18.49806785583496, "global_step": 13594, "epoch": 163} {"train_loss": -18.150753021240234, "global_step": 13595, "epoch": 163} {"train_loss": -18.065074920654297, "global_step": 13596, "epoch": 163} {"train_loss": -18.237674713134766, "global_step": 13597, "epoch": 163} {"train_loss": -17.886281967163086, "global_step": 13598, "epoch": 163} {"train_loss": -18.100072860717773, "global_step": 13599, "epoch": 163} {"train_loss": -17.993032455444336, "global_step": 13600, "epoch": 163} {"train_loss": -17.929128646850586, "global_step": 13601, "epoch": 163} {"train_loss": -17.63324546813965, "global_step": 13602, "epoch": 163} {"train_loss": -17.6965389251709, "global_step": 13603, "epoch": 163} {"train_loss": -17.84680938720703, "global_step": 13604, "epoch": 163} {"train_loss": -18.11428451538086, "global_step": 13605, "epoch": 163} {"train_loss": -17.894065856933594, "global_step": 13606, "epoch": 163} {"train_loss": -17.876949310302734, "global_step": 13607, "epoch": 163} {"train_loss": -18.040014266967773, "global_step": 13608, "epoch": 163} {"train_loss": -18.033954620361328, "global_step": 13609, "epoch": 163} {"train_loss": -18.431732177734375, "global_step": 13610, "epoch": 163} {"train_loss": -17.953513019056206, "global_step": 13611, "epoch": 163, "val_loss": 6053790.0} {"train_loss": -17.507099151611328, "global_step": 13612, "epoch": 164} {"train_loss": -17.541933059692383, "global_step": 13613, "epoch": 164} {"train_loss": -17.89015007019043, "global_step": 13614, "epoch": 164} {"train_loss": -17.497772216796875, "global_step": 13615, "epoch": 164} {"train_loss": -17.710969924926758, "global_step": 13616, "epoch": 164} {"train_loss": -18.076047897338867, "global_step": 13617, "epoch": 164} {"train_loss": -17.7403507232666, "global_step": 13618, "epoch": 164} {"train_loss": -17.799413681030273, "global_step": 13619, "epoch": 164} {"train_loss": -17.594018936157227, "global_step": 13620, "epoch": 164} {"train_loss": -17.63931655883789, "global_step": 13621, "epoch": 164} {"train_loss": -17.77103042602539, "global_step": 13622, "epoch": 164} {"train_loss": -18.010717391967773, "global_step": 13623, "epoch": 164} {"train_loss": -17.47821044921875, "global_step": 13624, "epoch": 164} {"train_loss": -17.845561981201172, "global_step": 13625, "epoch": 164} {"train_loss": -17.539154052734375, "global_step": 13626, "epoch": 164} {"train_loss": -18.060571670532227, "global_step": 13627, "epoch": 164} {"train_loss": -17.80454444885254, "global_step": 13628, "epoch": 164} {"train_loss": -17.831438064575195, "global_step": 13629, "epoch": 164} {"train_loss": -17.704580307006836, "global_step": 13630, "epoch": 164} {"train_loss": -17.90559196472168, "global_step": 13631, "epoch": 164} {"train_loss": -17.802114486694336, "global_step": 13632, "epoch": 164} {"train_loss": -17.85070037841797, "global_step": 13633, "epoch": 164} {"train_loss": -18.182435989379883, "global_step": 13634, "epoch": 164} {"train_loss": -18.256938934326172, "global_step": 13635, "epoch": 164} {"train_loss": -17.872751235961914, "global_step": 13636, "epoch": 164} {"train_loss": -17.799442291259766, "global_step": 13637, "epoch": 164} {"train_loss": -17.877220153808594, "global_step": 13638, "epoch": 164} {"train_loss": -18.078487396240234, "global_step": 13639, "epoch": 164} {"train_loss": -18.3245906829834, "global_step": 13640, "epoch": 164} {"train_loss": -18.19025993347168, "global_step": 13641, "epoch": 164} {"train_loss": -18.386072158813477, "global_step": 13642, "epoch": 164} {"train_loss": -17.835691452026367, "global_step": 13643, "epoch": 164} {"train_loss": -17.99318504333496, "global_step": 13644, "epoch": 164} {"train_loss": -18.220876693725586, "global_step": 13645, "epoch": 164} {"train_loss": -18.04375648498535, "global_step": 13646, "epoch": 164} {"train_loss": -18.14621353149414, "global_step": 13647, "epoch": 164} {"train_loss": -17.62982749938965, "global_step": 13648, "epoch": 164} {"train_loss": -17.955692291259766, "global_step": 13649, "epoch": 164} {"train_loss": -18.003599166870117, "global_step": 13650, "epoch": 164} {"train_loss": -18.00577163696289, "global_step": 13651, "epoch": 164} {"train_loss": -17.939725875854492, "global_step": 13652, "epoch": 164} {"train_loss": -18.017993927001953, "global_step": 13653, "epoch": 164} {"train_loss": -18.043914794921875, "global_step": 13654, "epoch": 164} {"train_loss": -17.963993072509766, "global_step": 13655, "epoch": 164} {"train_loss": -18.01734733581543, "global_step": 13656, "epoch": 164} {"train_loss": -17.829906463623047, "global_step": 13657, "epoch": 164} {"train_loss": -18.058734893798828, "global_step": 13658, "epoch": 164} {"train_loss": -17.82573890686035, "global_step": 13659, "epoch": 164} {"train_loss": -18.043577194213867, "global_step": 13660, "epoch": 164} {"train_loss": -17.886564254760742, "global_step": 13661, "epoch": 164} {"train_loss": -18.189838409423828, "global_step": 13662, "epoch": 164} {"train_loss": -17.729848861694336, "global_step": 13663, "epoch": 164} {"train_loss": -17.952350616455078, "global_step": 13664, "epoch": 164} {"train_loss": -18.056360244750977, "global_step": 13665, "epoch": 164} {"train_loss": -17.94239616394043, "global_step": 13666, "epoch": 164} {"train_loss": -17.981918334960938, "global_step": 13667, "epoch": 164} {"train_loss": -17.91798210144043, "global_step": 13668, "epoch": 164} {"train_loss": -17.555028915405273, "global_step": 13669, "epoch": 164} {"train_loss": -18.058317184448242, "global_step": 13670, "epoch": 164} {"train_loss": -17.51282501220703, "global_step": 13671, "epoch": 164} {"train_loss": -18.018041610717773, "global_step": 13672, "epoch": 164} {"train_loss": -17.984338760375977, "global_step": 13673, "epoch": 164} {"train_loss": -17.704858779907227, "global_step": 13674, "epoch": 164} {"train_loss": -18.03656005859375, "global_step": 13675, "epoch": 164} {"train_loss": -18.028345108032227, "global_step": 13676, "epoch": 164} {"train_loss": -17.77925682067871, "global_step": 13677, "epoch": 164} {"train_loss": -17.94939613342285, "global_step": 13678, "epoch": 164} {"train_loss": -18.296619415283203, "global_step": 13679, "epoch": 164} {"train_loss": -18.362455368041992, "global_step": 13680, "epoch": 164} {"train_loss": -18.125789642333984, "global_step": 13681, "epoch": 164} {"train_loss": -18.149124145507812, "global_step": 13682, "epoch": 164} {"train_loss": -17.6662654876709, "global_step": 13683, "epoch": 164} {"train_loss": -17.2655086517334, "global_step": 13684, "epoch": 164} {"train_loss": -17.872821807861328, "global_step": 13685, "epoch": 164} {"train_loss": -18.34507179260254, "global_step": 13686, "epoch": 164} {"train_loss": -18.04298973083496, "global_step": 13687, "epoch": 164} {"train_loss": -17.840951919555664, "global_step": 13688, "epoch": 164} {"train_loss": -18.198514938354492, "global_step": 13689, "epoch": 164} {"train_loss": -17.96984100341797, "global_step": 13690, "epoch": 164} {"train_loss": -17.87461280822754, "global_step": 13691, "epoch": 164} {"train_loss": -18.261627197265625, "global_step": 13692, "epoch": 164} {"train_loss": -18.077529907226562, "global_step": 13693, "epoch": 164} {"train_loss": -17.925001351230115, "global_step": 13694, "epoch": 164, "val_loss": 6037683.5} {"train_loss": -17.61167335510254, "global_step": 13695, "epoch": 165} {"train_loss": -17.797147750854492, "global_step": 13696, "epoch": 165} {"train_loss": -18.20696449279785, "global_step": 13697, "epoch": 165} {"train_loss": -17.48096466064453, "global_step": 13698, "epoch": 165} {"train_loss": -18.41748809814453, "global_step": 13699, "epoch": 165} {"train_loss": -18.068714141845703, "global_step": 13700, "epoch": 165} {"train_loss": -17.724111557006836, "global_step": 13701, "epoch": 165} {"train_loss": -17.972976684570312, "global_step": 13702, "epoch": 165} {"train_loss": -17.887187957763672, "global_step": 13703, "epoch": 165} {"train_loss": -17.840063095092773, "global_step": 13704, "epoch": 165} {"train_loss": -17.9119815826416, "global_step": 13705, "epoch": 165} {"train_loss": -17.524375915527344, "global_step": 13706, "epoch": 165} {"train_loss": -18.11372947692871, "global_step": 13707, "epoch": 165} {"train_loss": -18.067258834838867, "global_step": 13708, "epoch": 165} {"train_loss": -18.2415771484375, "global_step": 13709, "epoch": 165} {"train_loss": -17.887039184570312, "global_step": 13710, "epoch": 165} {"train_loss": -17.753705978393555, "global_step": 13711, "epoch": 165} {"train_loss": -17.805471420288086, "global_step": 13712, "epoch": 165} {"train_loss": -18.1085205078125, "global_step": 13713, "epoch": 165} {"train_loss": -18.034631729125977, "global_step": 13714, "epoch": 165} {"train_loss": -17.82798957824707, "global_step": 13715, "epoch": 165} {"train_loss": -17.78238296508789, "global_step": 13716, "epoch": 165} {"train_loss": -18.300960540771484, "global_step": 13717, "epoch": 165} {"train_loss": -18.145187377929688, "global_step": 13718, "epoch": 165} {"train_loss": -17.691129684448242, "global_step": 13719, "epoch": 165} {"train_loss": -17.904447555541992, "global_step": 13720, "epoch": 165} {"train_loss": -17.871328353881836, "global_step": 13721, "epoch": 165} {"train_loss": -18.230152130126953, "global_step": 13722, "epoch": 165} {"train_loss": -18.170024871826172, "global_step": 13723, "epoch": 165} {"train_loss": -18.0778751373291, "global_step": 13724, "epoch": 165} {"train_loss": -18.31536293029785, "global_step": 13725, "epoch": 165} {"train_loss": -17.98110580444336, "global_step": 13726, "epoch": 165} {"train_loss": -18.187335968017578, "global_step": 13727, "epoch": 165} {"train_loss": -17.61078453063965, "global_step": 13728, "epoch": 165} {"train_loss": -18.09612274169922, "global_step": 13729, "epoch": 165} {"train_loss": -17.762893676757812, "global_step": 13730, "epoch": 165} {"train_loss": -18.077808380126953, "global_step": 13731, "epoch": 165} {"train_loss": -17.986433029174805, "global_step": 13732, "epoch": 165} {"train_loss": -18.09205436706543, "global_step": 13733, "epoch": 165} {"train_loss": -18.094642639160156, "global_step": 13734, "epoch": 165} {"train_loss": -18.076467514038086, "global_step": 13735, "epoch": 165} {"train_loss": -18.1983585357666, "global_step": 13736, "epoch": 165} {"train_loss": -17.694950103759766, "global_step": 13737, "epoch": 165} {"train_loss": -18.11585807800293, "global_step": 13738, "epoch": 165} {"train_loss": -17.718006134033203, "global_step": 13739, "epoch": 165} {"train_loss": -18.268461227416992, "global_step": 13740, "epoch": 165} {"train_loss": -18.26386260986328, "global_step": 13741, "epoch": 165} {"train_loss": -17.655832290649414, "global_step": 13742, "epoch": 165} {"train_loss": -18.03474235534668, "global_step": 13743, "epoch": 165} {"train_loss": -17.942270278930664, "global_step": 13744, "epoch": 165} {"train_loss": -18.016122817993164, "global_step": 13745, "epoch": 165} {"train_loss": -17.82490348815918, "global_step": 13746, "epoch": 165} {"train_loss": -18.270156860351562, "global_step": 13747, "epoch": 165} {"train_loss": -17.830158233642578, "global_step": 13748, "epoch": 165} {"train_loss": -18.61849021911621, "global_step": 13749, "epoch": 165} {"train_loss": -17.934986114501953, "global_step": 13750, "epoch": 165} {"train_loss": -17.926223754882812, "global_step": 13751, "epoch": 165} {"train_loss": -17.811359405517578, "global_step": 13752, "epoch": 165} {"train_loss": -17.68363380432129, "global_step": 13753, "epoch": 165} {"train_loss": -18.21108055114746, "global_step": 13754, "epoch": 165} {"train_loss": -18.3017578125, "global_step": 13755, "epoch": 165} {"train_loss": -18.052427291870117, "global_step": 13756, "epoch": 165} {"train_loss": -17.697965621948242, "global_step": 13757, "epoch": 165} {"train_loss": -18.173555374145508, "global_step": 13758, "epoch": 165} {"train_loss": -17.800931930541992, "global_step": 13759, "epoch": 165} {"train_loss": -18.137353897094727, "global_step": 13760, "epoch": 165} {"train_loss": -17.885440826416016, "global_step": 13761, "epoch": 165} {"train_loss": -17.681337356567383, "global_step": 13762, "epoch": 165} {"train_loss": -17.715009689331055, "global_step": 13763, "epoch": 165} {"train_loss": -17.962818145751953, "global_step": 13764, "epoch": 165} {"train_loss": -18.064069747924805, "global_step": 13765, "epoch": 165} {"train_loss": -17.8176212310791, "global_step": 13766, "epoch": 165} {"train_loss": -18.305137634277344, "global_step": 13767, "epoch": 165} {"train_loss": -18.106992721557617, "global_step": 13768, "epoch": 165} {"train_loss": -17.909868240356445, "global_step": 13769, "epoch": 165} {"train_loss": -18.29596519470215, "global_step": 13770, "epoch": 165} {"train_loss": -17.98594093322754, "global_step": 13771, "epoch": 165} {"train_loss": -18.341766357421875, "global_step": 13772, "epoch": 165} {"train_loss": -17.747587203979492, "global_step": 13773, "epoch": 165} {"train_loss": -17.615995407104492, "global_step": 13774, "epoch": 165} {"train_loss": -17.865951538085938, "global_step": 13775, "epoch": 165} {"train_loss": -18.187429428100586, "global_step": 13776, "epoch": 165} {"train_loss": -17.980042101388953, "global_step": 13777, "epoch": 165, "val_loss": 6106907.5} {"train_loss": -18.55890464782715, "global_step": 13778, "epoch": 166} {"train_loss": -17.735883712768555, "global_step": 13779, "epoch": 166} {"train_loss": -18.183801651000977, "global_step": 13780, "epoch": 166} {"train_loss": -17.72747039794922, "global_step": 13781, "epoch": 166} {"train_loss": -17.804136276245117, "global_step": 13782, "epoch": 166} {"train_loss": -17.715110778808594, "global_step": 13783, "epoch": 166} {"train_loss": -18.01778221130371, "global_step": 13784, "epoch": 166} {"train_loss": -18.050512313842773, "global_step": 13785, "epoch": 166} {"train_loss": -17.74579620361328, "global_step": 13786, "epoch": 166} {"train_loss": -18.14484214782715, "global_step": 13787, "epoch": 166} {"train_loss": -17.9572696685791, "global_step": 13788, "epoch": 166} {"train_loss": -17.930593490600586, "global_step": 13789, "epoch": 166} {"train_loss": -17.925168991088867, "global_step": 13790, "epoch": 166} {"train_loss": -17.753660202026367, "global_step": 13791, "epoch": 166} {"train_loss": -17.152725219726562, "global_step": 13792, "epoch": 166} {"train_loss": -18.013145446777344, "global_step": 13793, "epoch": 166} {"train_loss": -18.165647506713867, "global_step": 13794, "epoch": 166} {"train_loss": -18.123334884643555, "global_step": 13795, "epoch": 166} {"train_loss": -17.86482810974121, "global_step": 13796, "epoch": 166} {"train_loss": -18.05660057067871, "global_step": 13797, "epoch": 166} {"train_loss": -17.725980758666992, "global_step": 13798, "epoch": 166} {"train_loss": -17.906044006347656, "global_step": 13799, "epoch": 166} {"train_loss": -18.07973289489746, "global_step": 13800, "epoch": 166} {"train_loss": -17.938955307006836, "global_step": 13801, "epoch": 166} {"train_loss": -17.89601707458496, "global_step": 13802, "epoch": 166} {"train_loss": -17.969318389892578, "global_step": 13803, "epoch": 166} {"train_loss": -17.86248207092285, "global_step": 13804, "epoch": 166} {"train_loss": -17.914752960205078, "global_step": 13805, "epoch": 166} {"train_loss": -17.90266227722168, "global_step": 13806, "epoch": 166} {"train_loss": -17.95081329345703, "global_step": 13807, "epoch": 166} {"train_loss": -17.63052749633789, "global_step": 13808, "epoch": 166} {"train_loss": -17.818580627441406, "global_step": 13809, "epoch": 166} {"train_loss": -18.497329711914062, "global_step": 13810, "epoch": 166} {"train_loss": -18.054824829101562, "global_step": 13811, "epoch": 166} {"train_loss": -18.20334815979004, "global_step": 13812, "epoch": 166} {"train_loss": -18.17925262451172, "global_step": 13813, "epoch": 166} {"train_loss": -17.864229202270508, "global_step": 13814, "epoch": 166} {"train_loss": -18.1495418548584, "global_step": 13815, "epoch": 166} {"train_loss": -17.64680290222168, "global_step": 13816, "epoch": 166} {"train_loss": -18.187458038330078, "global_step": 13817, "epoch": 166} {"train_loss": -18.090177536010742, "global_step": 13818, "epoch": 166} {"train_loss": -17.78905487060547, "global_step": 13819, "epoch": 166} {"train_loss": -17.6953067779541, "global_step": 13820, "epoch": 166} {"train_loss": -17.90950584411621, "global_step": 13821, "epoch": 166} {"train_loss": -17.911649703979492, "global_step": 13822, "epoch": 166} {"train_loss": -17.721969604492188, "global_step": 13823, "epoch": 166} {"train_loss": -18.333715438842773, "global_step": 13824, "epoch": 166} {"train_loss": -18.022048950195312, "global_step": 13825, "epoch": 166} {"train_loss": -18.110334396362305, "global_step": 13826, "epoch": 166} {"train_loss": -17.702661514282227, "global_step": 13827, "epoch": 166} {"train_loss": -18.301198959350586, "global_step": 13828, "epoch": 166} {"train_loss": -18.076696395874023, "global_step": 13829, "epoch": 166} {"train_loss": -18.026662826538086, "global_step": 13830, "epoch": 166} {"train_loss": -17.916561126708984, "global_step": 13831, "epoch": 166} {"train_loss": -18.16152000427246, "global_step": 13832, "epoch": 166} {"train_loss": -18.00057029724121, "global_step": 13833, "epoch": 166} {"train_loss": -17.746204376220703, "global_step": 13834, "epoch": 166} {"train_loss": -17.77935791015625, "global_step": 13835, "epoch": 166} {"train_loss": -18.17743492126465, "global_step": 13836, "epoch": 166} {"train_loss": -17.742450714111328, "global_step": 13837, "epoch": 166} {"train_loss": -18.2391414642334, "global_step": 13838, "epoch": 166} {"train_loss": -18.015554428100586, "global_step": 13839, "epoch": 166} {"train_loss": -17.862661361694336, "global_step": 13840, "epoch": 166} {"train_loss": -18.367361068725586, "global_step": 13841, "epoch": 166} {"train_loss": -17.94756507873535, "global_step": 13842, "epoch": 166} {"train_loss": -18.435409545898438, "global_step": 13843, "epoch": 166} {"train_loss": -17.6402530670166, "global_step": 13844, "epoch": 166} {"train_loss": -18.308202743530273, "global_step": 13845, "epoch": 166} {"train_loss": -17.8908748626709, "global_step": 13846, "epoch": 166} {"train_loss": -18.161470413208008, "global_step": 13847, "epoch": 166} {"train_loss": -18.218687057495117, "global_step": 13848, "epoch": 166} {"train_loss": -18.06910514831543, "global_step": 13849, "epoch": 166} {"train_loss": -18.253616333007812, "global_step": 13850, "epoch": 166} {"train_loss": -18.113388061523438, "global_step": 13851, "epoch": 166} {"train_loss": -17.74067497253418, "global_step": 13852, "epoch": 166} {"train_loss": -18.09737205505371, "global_step": 13853, "epoch": 166} {"train_loss": -18.24605941772461, "global_step": 13854, "epoch": 166} {"train_loss": -18.306072235107422, "global_step": 13855, "epoch": 166} {"train_loss": -18.25431251525879, "global_step": 13856, "epoch": 166} {"train_loss": -18.140138626098633, "global_step": 13857, "epoch": 166} {"train_loss": -18.122766494750977, "global_step": 13858, "epoch": 166} {"train_loss": -18.098297119140625, "global_step": 13859, "epoch": 166} {"train_loss": -18.01606210455837, "global_step": 13860, "epoch": 166, "val_loss": 6101480.0} {"train_loss": -17.79084014892578, "global_step": 13861, "epoch": 167} {"train_loss": -17.86342430114746, "global_step": 13862, "epoch": 167} {"train_loss": -18.05538558959961, "global_step": 13863, "epoch": 167} {"train_loss": -17.850406646728516, "global_step": 13864, "epoch": 167} {"train_loss": -18.067636489868164, "global_step": 13865, "epoch": 167} {"train_loss": -17.810047149658203, "global_step": 13866, "epoch": 167} {"train_loss": -17.86821937561035, "global_step": 13867, "epoch": 167} {"train_loss": -18.00647735595703, "global_step": 13868, "epoch": 167} {"train_loss": -17.94841957092285, "global_step": 13869, "epoch": 167} {"train_loss": -17.986988067626953, "global_step": 13870, "epoch": 167} {"train_loss": -18.009363174438477, "global_step": 13871, "epoch": 167} {"train_loss": -18.084754943847656, "global_step": 13872, "epoch": 167} {"train_loss": -18.053516387939453, "global_step": 13873, "epoch": 167} {"train_loss": -17.620285034179688, "global_step": 13874, "epoch": 167} {"train_loss": -17.686294555664062, "global_step": 13875, "epoch": 167} {"train_loss": -17.9393310546875, "global_step": 13876, "epoch": 167} {"train_loss": -17.757051467895508, "global_step": 13877, "epoch": 167} {"train_loss": -18.042110443115234, "global_step": 13878, "epoch": 167} {"train_loss": -18.056554794311523, "global_step": 13879, "epoch": 167} {"train_loss": -17.725866317749023, "global_step": 13880, "epoch": 167} {"train_loss": -17.984342575073242, "global_step": 13881, "epoch": 167} {"train_loss": -18.116147994995117, "global_step": 13882, "epoch": 167} {"train_loss": -17.72273063659668, "global_step": 13883, "epoch": 167} {"train_loss": -17.984201431274414, "global_step": 13884, "epoch": 167} {"train_loss": -18.236547470092773, "global_step": 13885, "epoch": 167} {"train_loss": -17.80794906616211, "global_step": 13886, "epoch": 167} {"train_loss": -18.338674545288086, "global_step": 13887, "epoch": 167} {"train_loss": -17.87700080871582, "global_step": 13888, "epoch": 167} {"train_loss": -18.4182071685791, "global_step": 13889, "epoch": 167} {"train_loss": -18.081186294555664, "global_step": 13890, "epoch": 167} {"train_loss": -17.68560218811035, "global_step": 13891, "epoch": 167} {"train_loss": -18.240964889526367, "global_step": 13892, "epoch": 167} {"train_loss": -17.529966354370117, "global_step": 13893, "epoch": 167} {"train_loss": -18.057851791381836, "global_step": 13894, "epoch": 167} {"train_loss": -18.043216705322266, "global_step": 13895, "epoch": 167} {"train_loss": -18.251052856445312, "global_step": 13896, "epoch": 167} {"train_loss": -18.101072311401367, "global_step": 13897, "epoch": 167} {"train_loss": -18.168445587158203, "global_step": 13898, "epoch": 167} {"train_loss": -17.548419952392578, "global_step": 13899, "epoch": 167} {"train_loss": -18.16641616821289, "global_step": 13900, "epoch": 167} {"train_loss": -18.172840118408203, "global_step": 13901, "epoch": 167} {"train_loss": -18.156991958618164, "global_step": 13902, "epoch": 167} {"train_loss": -18.437973022460938, "global_step": 13903, "epoch": 167} {"train_loss": -18.08088493347168, "global_step": 13904, "epoch": 167} {"train_loss": -18.260587692260742, "global_step": 13905, "epoch": 167} {"train_loss": -18.18668556213379, "global_step": 13906, "epoch": 167} {"train_loss": -18.193403244018555, "global_step": 13907, "epoch": 167} {"train_loss": -17.928268432617188, "global_step": 13908, "epoch": 167} {"train_loss": -18.156349182128906, "global_step": 13909, "epoch": 167} {"train_loss": -17.581348419189453, "global_step": 13910, "epoch": 167} {"train_loss": -17.70570945739746, "global_step": 13911, "epoch": 167} {"train_loss": -18.497394561767578, "global_step": 13912, "epoch": 167} {"train_loss": -17.822458267211914, "global_step": 13913, "epoch": 167} {"train_loss": -17.609130859375, "global_step": 13914, "epoch": 167} {"train_loss": -18.245288848876953, "global_step": 13915, "epoch": 167} {"train_loss": -17.522165298461914, "global_step": 13916, "epoch": 167} {"train_loss": -17.90828514099121, "global_step": 13917, "epoch": 167} {"train_loss": -17.71820068359375, "global_step": 13918, "epoch": 167} {"train_loss": -17.76924705505371, "global_step": 13919, "epoch": 167} {"train_loss": -17.69598960876465, "global_step": 13920, "epoch": 167} {"train_loss": -18.167875289916992, "global_step": 13921, "epoch": 167} {"train_loss": -17.815771102905273, "global_step": 13922, "epoch": 167} {"train_loss": -18.294143676757812, "global_step": 13923, "epoch": 167} {"train_loss": -17.720378875732422, "global_step": 13924, "epoch": 167} {"train_loss": -18.211538314819336, "global_step": 13925, "epoch": 167} {"train_loss": -17.931781768798828, "global_step": 13926, "epoch": 167} {"train_loss": -17.91702651977539, "global_step": 13927, "epoch": 167} {"train_loss": -17.832937240600586, "global_step": 13928, "epoch": 167} {"train_loss": -18.10288429260254, "global_step": 13929, "epoch": 167} {"train_loss": -17.91499900817871, "global_step": 13930, "epoch": 167} {"train_loss": -18.247648239135742, "global_step": 13931, "epoch": 167} {"train_loss": -18.154279708862305, "global_step": 13932, "epoch": 167} {"train_loss": -17.87493896484375, "global_step": 13933, "epoch": 167} {"train_loss": -18.039093017578125, "global_step": 13934, "epoch": 167} {"train_loss": -18.013269424438477, "global_step": 13935, "epoch": 167} {"train_loss": -18.142824172973633, "global_step": 13936, "epoch": 167} {"train_loss": -18.355257034301758, "global_step": 13937, "epoch": 167} {"train_loss": -18.056320190429688, "global_step": 13938, "epoch": 167} {"train_loss": -18.04836082458496, "global_step": 13939, "epoch": 167} {"train_loss": -18.095279693603516, "global_step": 13940, "epoch": 167} {"train_loss": -18.02073860168457, "global_step": 13941, "epoch": 167} {"train_loss": -18.075138092041016, "global_step": 13942, "epoch": 167} {"train_loss": -18.00858796360981, "global_step": 13943, "epoch": 167, "val_loss": 6034063.0} {"train_loss": -17.809200286865234, "global_step": 13944, "epoch": 168} {"train_loss": -17.976726531982422, "global_step": 13945, "epoch": 168} {"train_loss": -17.804929733276367, "global_step": 13946, "epoch": 168} {"train_loss": -17.278226852416992, "global_step": 13947, "epoch": 168} {"train_loss": -18.345552444458008, "global_step": 13948, "epoch": 168} {"train_loss": -17.807586669921875, "global_step": 13949, "epoch": 168} {"train_loss": -18.479293823242188, "global_step": 13950, "epoch": 168} {"train_loss": -17.867658615112305, "global_step": 13951, "epoch": 168} {"train_loss": -18.3321590423584, "global_step": 13952, "epoch": 168} {"train_loss": -17.83534812927246, "global_step": 13953, "epoch": 168} {"train_loss": -17.95992088317871, "global_step": 13954, "epoch": 168} {"train_loss": -17.80214500427246, "global_step": 13955, "epoch": 168} {"train_loss": -18.453996658325195, "global_step": 13956, "epoch": 168} {"train_loss": -18.202369689941406, "global_step": 13957, "epoch": 168} {"train_loss": -17.99519157409668, "global_step": 13958, "epoch": 168} {"train_loss": -17.762441635131836, "global_step": 13959, "epoch": 168} {"train_loss": -17.884538650512695, "global_step": 13960, "epoch": 168} {"train_loss": -17.868799209594727, "global_step": 13961, "epoch": 168} {"train_loss": -17.8786678314209, "global_step": 13962, "epoch": 168} {"train_loss": -17.886272430419922, "global_step": 13963, "epoch": 168} {"train_loss": -18.04581642150879, "global_step": 13964, "epoch": 168} {"train_loss": -17.941314697265625, "global_step": 13965, "epoch": 168} {"train_loss": -17.831815719604492, "global_step": 13966, "epoch": 168} {"train_loss": -18.14517593383789, "global_step": 13967, "epoch": 168} {"train_loss": -17.43814468383789, "global_step": 13968, "epoch": 168} {"train_loss": -18.211034774780273, "global_step": 13969, "epoch": 168} {"train_loss": -17.9105281829834, "global_step": 13970, "epoch": 168} {"train_loss": -18.39166831970215, "global_step": 13971, "epoch": 168} {"train_loss": -18.15096664428711, "global_step": 13972, "epoch": 168} {"train_loss": -18.09640884399414, "global_step": 13973, "epoch": 168} {"train_loss": -18.142215728759766, "global_step": 13974, "epoch": 168} {"train_loss": -17.907926559448242, "global_step": 13975, "epoch": 168} {"train_loss": -17.820585250854492, "global_step": 13976, "epoch": 168} {"train_loss": -17.895917892456055, "global_step": 13977, "epoch": 168} {"train_loss": -18.235214233398438, "global_step": 13978, "epoch": 168} {"train_loss": -18.212202072143555, "global_step": 13979, "epoch": 168} {"train_loss": -18.221027374267578, "global_step": 13980, "epoch": 168} {"train_loss": -17.804555892944336, "global_step": 13981, "epoch": 168} {"train_loss": -18.036508560180664, "global_step": 13982, "epoch": 168} {"train_loss": -17.857879638671875, "global_step": 13983, "epoch": 168} {"train_loss": -18.197309494018555, "global_step": 13984, "epoch": 168} {"train_loss": -18.21286392211914, "global_step": 13985, "epoch": 168} {"train_loss": -18.177278518676758, "global_step": 13986, "epoch": 168} {"train_loss": -17.576797485351562, "global_step": 13987, "epoch": 168} {"train_loss": -17.67952537536621, "global_step": 13988, "epoch": 168} {"train_loss": -17.971288681030273, "global_step": 13989, "epoch": 168} {"train_loss": -17.88657569885254, "global_step": 13990, "epoch": 168} {"train_loss": -17.7844181060791, "global_step": 13991, "epoch": 168} {"train_loss": -18.021270751953125, "global_step": 13992, "epoch": 168} {"train_loss": -17.930747985839844, "global_step": 13993, "epoch": 168} {"train_loss": -17.82511329650879, "global_step": 13994, "epoch": 168} {"train_loss": -18.04881477355957, "global_step": 13995, "epoch": 168} {"train_loss": -17.89699363708496, "global_step": 13996, "epoch": 168} {"train_loss": -18.11375617980957, "global_step": 13997, "epoch": 168} {"train_loss": -17.720956802368164, "global_step": 13998, "epoch": 168} {"train_loss": -18.01188850402832, "global_step": 13999, "epoch": 168} {"train_loss": -18.20648765563965, "global_step": 14000, "epoch": 168} {"train_loss": -18.089946746826172, "global_step": 14001, "epoch": 168} {"train_loss": -17.91849136352539, "global_step": 14002, "epoch": 168} {"train_loss": -17.780460357666016, "global_step": 14003, "epoch": 168} {"train_loss": -17.95456886291504, "global_step": 14004, "epoch": 168} {"train_loss": -17.91609764099121, "global_step": 14005, "epoch": 168} {"train_loss": -18.359027862548828, "global_step": 14006, "epoch": 168} {"train_loss": -17.944238662719727, "global_step": 14007, "epoch": 168} {"train_loss": -18.23606300354004, "global_step": 14008, "epoch": 168} {"train_loss": -18.018957138061523, "global_step": 14009, "epoch": 168} {"train_loss": -18.146886825561523, "global_step": 14010, "epoch": 168} {"train_loss": -18.24518394470215, "global_step": 14011, "epoch": 168} {"train_loss": -17.713502883911133, "global_step": 14012, "epoch": 168} {"train_loss": -17.875885009765625, "global_step": 14013, "epoch": 168} {"train_loss": -18.147363662719727, "global_step": 14014, "epoch": 168} {"train_loss": -18.45846939086914, "global_step": 14015, "epoch": 168} {"train_loss": -18.32753562927246, "global_step": 14016, "epoch": 168} {"train_loss": -17.712730407714844, "global_step": 14017, "epoch": 168} {"train_loss": -18.053531646728516, "global_step": 14018, "epoch": 168} {"train_loss": -17.891254425048828, "global_step": 14019, "epoch": 168} {"train_loss": -18.51239585876465, "global_step": 14020, "epoch": 168} {"train_loss": -17.89273452758789, "global_step": 14021, "epoch": 168} {"train_loss": -17.848119735717773, "global_step": 14022, "epoch": 168} {"train_loss": -18.1925106048584, "global_step": 14023, "epoch": 168} {"train_loss": -17.96843147277832, "global_step": 14024, "epoch": 168} {"train_loss": -17.9599666595459, "global_step": 14025, "epoch": 168} {"train_loss": -17.992118237966515, "global_step": 14026, "epoch": 168, "val_loss": 6032597.5} {"train_loss": -17.613821029663086, "global_step": 14027, "epoch": 169} {"train_loss": -18.074831008911133, "global_step": 14028, "epoch": 169} {"train_loss": -17.834753036499023, "global_step": 14029, "epoch": 169} {"train_loss": -17.439245223999023, "global_step": 14030, "epoch": 169} {"train_loss": -17.717668533325195, "global_step": 14031, "epoch": 169} {"train_loss": -17.734277725219727, "global_step": 14032, "epoch": 169} {"train_loss": -17.4487361907959, "global_step": 14033, "epoch": 169} {"train_loss": -17.930051803588867, "global_step": 14034, "epoch": 169} {"train_loss": -17.862918853759766, "global_step": 14035, "epoch": 169} {"train_loss": -17.892704010009766, "global_step": 14036, "epoch": 169} {"train_loss": -18.06525421142578, "global_step": 14037, "epoch": 169} {"train_loss": -17.566089630126953, "global_step": 14038, "epoch": 169} {"train_loss": -18.433231353759766, "global_step": 14039, "epoch": 169} {"train_loss": -17.777666091918945, "global_step": 14040, "epoch": 169} {"train_loss": -18.188735961914062, "global_step": 14041, "epoch": 169} {"train_loss": -17.791231155395508, "global_step": 14042, "epoch": 169} {"train_loss": -17.98075294494629, "global_step": 14043, "epoch": 169} {"train_loss": -18.230802536010742, "global_step": 14044, "epoch": 169} {"train_loss": -18.15447235107422, "global_step": 14045, "epoch": 169} {"train_loss": -17.82303810119629, "global_step": 14046, "epoch": 169} {"train_loss": -18.104597091674805, "global_step": 14047, "epoch": 169} {"train_loss": -18.39739418029785, "global_step": 14048, "epoch": 169} {"train_loss": -18.416168212890625, "global_step": 14049, "epoch": 169} {"train_loss": -18.09181022644043, "global_step": 14050, "epoch": 169} {"train_loss": -18.217458724975586, "global_step": 14051, "epoch": 169} {"train_loss": -17.923458099365234, "global_step": 14052, "epoch": 169} {"train_loss": -18.191946029663086, "global_step": 14053, "epoch": 169} {"train_loss": -17.759092330932617, "global_step": 14054, "epoch": 169} {"train_loss": -18.245956420898438, "global_step": 14055, "epoch": 169} {"train_loss": -18.199174880981445, "global_step": 14056, "epoch": 169} {"train_loss": -17.69301986694336, "global_step": 14057, "epoch": 169} {"train_loss": -18.208913803100586, "global_step": 14058, "epoch": 169} {"train_loss": -18.063566207885742, "global_step": 14059, "epoch": 169} {"train_loss": -18.10500717163086, "global_step": 14060, "epoch": 169} {"train_loss": -18.2209529876709, "global_step": 14061, "epoch": 169} {"train_loss": -17.943822860717773, "global_step": 14062, "epoch": 169} {"train_loss": -18.203588485717773, "global_step": 14063, "epoch": 169} {"train_loss": -18.096891403198242, "global_step": 14064, "epoch": 169} {"train_loss": -18.226667404174805, "global_step": 14065, "epoch": 169} {"train_loss": -18.104162216186523, "global_step": 14066, "epoch": 169} {"train_loss": -18.316099166870117, "global_step": 14067, "epoch": 169} {"train_loss": -17.74220848083496, "global_step": 14068, "epoch": 169} {"train_loss": -17.935714721679688, "global_step": 14069, "epoch": 169} {"train_loss": -18.166257858276367, "global_step": 14070, "epoch": 169} {"train_loss": -17.853788375854492, "global_step": 14071, "epoch": 169} {"train_loss": -18.071735382080078, "global_step": 14072, "epoch": 169} {"train_loss": -18.06239891052246, "global_step": 14073, "epoch": 169} {"train_loss": -17.980579376220703, "global_step": 14074, "epoch": 169} {"train_loss": -18.1728515625, "global_step": 14075, "epoch": 169} {"train_loss": -18.161510467529297, "global_step": 14076, "epoch": 169} {"train_loss": -18.57632827758789, "global_step": 14077, "epoch": 169} {"train_loss": -18.19334602355957, "global_step": 14078, "epoch": 169} {"train_loss": -17.784059524536133, "global_step": 14079, "epoch": 169} {"train_loss": -18.180870056152344, "global_step": 14080, "epoch": 169} {"train_loss": -17.917312622070312, "global_step": 14081, "epoch": 169} {"train_loss": -18.09266471862793, "global_step": 14082, "epoch": 169} {"train_loss": -18.026342391967773, "global_step": 14083, "epoch": 169} {"train_loss": -18.120803833007812, "global_step": 14084, "epoch": 169} {"train_loss": -17.852142333984375, "global_step": 14085, "epoch": 169} {"train_loss": -17.987598419189453, "global_step": 14086, "epoch": 169} {"train_loss": -18.12247657775879, "global_step": 14087, "epoch": 169} {"train_loss": -17.87525177001953, "global_step": 14088, "epoch": 169} {"train_loss": -18.103471755981445, "global_step": 14089, "epoch": 169} {"train_loss": -18.322242736816406, "global_step": 14090, "epoch": 169} {"train_loss": -17.860776901245117, "global_step": 14091, "epoch": 169} {"train_loss": -17.48265838623047, "global_step": 14092, "epoch": 169} {"train_loss": -17.650150299072266, "global_step": 14093, "epoch": 169} {"train_loss": -17.8922119140625, "global_step": 14094, "epoch": 169} {"train_loss": -18.264516830444336, "global_step": 14095, "epoch": 169} {"train_loss": -18.131473541259766, "global_step": 14096, "epoch": 169} {"train_loss": -18.05124282836914, "global_step": 14097, "epoch": 169} {"train_loss": -17.637161254882812, "global_step": 14098, "epoch": 169} {"train_loss": -18.009428024291992, "global_step": 14099, "epoch": 169} {"train_loss": -17.554901123046875, "global_step": 14100, "epoch": 169} {"train_loss": -17.656734466552734, "global_step": 14101, "epoch": 169} {"train_loss": -18.351484298706055, "global_step": 14102, "epoch": 169} {"train_loss": -18.20356559753418, "global_step": 14103, "epoch": 169} {"train_loss": -18.076345443725586, "global_step": 14104, "epoch": 169} {"train_loss": -18.41766357421875, "global_step": 14105, "epoch": 169} {"train_loss": -17.852420806884766, "global_step": 14106, "epoch": 169} {"train_loss": -17.90192985534668, "global_step": 14107, "epoch": 169} {"train_loss": -18.056554794311523, "global_step": 14108, "epoch": 169} {"train_loss": -18.00240925708449, "global_step": 14109, "epoch": 169, "val_loss": 6170175.5} {"train_loss": -17.4903564453125, "global_step": 14110, "epoch": 170} {"train_loss": -17.142065048217773, "global_step": 14111, "epoch": 170} {"train_loss": -17.736858367919922, "global_step": 14112, "epoch": 170} {"train_loss": -18.104455947875977, "global_step": 14113, "epoch": 170} {"train_loss": -17.760251998901367, "global_step": 14114, "epoch": 170} {"train_loss": -17.686725616455078, "global_step": 14115, "epoch": 170} {"train_loss": -18.250144958496094, "global_step": 14116, "epoch": 170} {"train_loss": -17.481319427490234, "global_step": 14117, "epoch": 170} {"train_loss": -18.038232803344727, "global_step": 14118, "epoch": 170} {"train_loss": -17.71535301208496, "global_step": 14119, "epoch": 170} {"train_loss": -18.00417137145996, "global_step": 14120, "epoch": 170} {"train_loss": -17.95513343811035, "global_step": 14121, "epoch": 170} {"train_loss": -18.073978424072266, "global_step": 14122, "epoch": 170} {"train_loss": -18.188753128051758, "global_step": 14123, "epoch": 170} {"train_loss": -17.831754684448242, "global_step": 14124, "epoch": 170} {"train_loss": -18.088163375854492, "global_step": 14125, "epoch": 170} {"train_loss": -18.228374481201172, "global_step": 14126, "epoch": 170} {"train_loss": -18.07038688659668, "global_step": 14127, "epoch": 170} {"train_loss": -17.972665786743164, "global_step": 14128, "epoch": 170} {"train_loss": -18.092864990234375, "global_step": 14129, "epoch": 170} {"train_loss": -18.185684204101562, "global_step": 14130, "epoch": 170} {"train_loss": -18.06654167175293, "global_step": 14131, "epoch": 170} {"train_loss": -17.855899810791016, "global_step": 14132, "epoch": 170} {"train_loss": -17.996856689453125, "global_step": 14133, "epoch": 170} {"train_loss": -17.86427116394043, "global_step": 14134, "epoch": 170} {"train_loss": -17.75229263305664, "global_step": 14135, "epoch": 170} {"train_loss": -17.840408325195312, "global_step": 14136, "epoch": 170} {"train_loss": -18.393951416015625, "global_step": 14137, "epoch": 170} {"train_loss": -18.189727783203125, "global_step": 14138, "epoch": 170} {"train_loss": -18.169055938720703, "global_step": 14139, "epoch": 170} {"train_loss": -17.755537033081055, "global_step": 14140, "epoch": 170} {"train_loss": -17.878110885620117, "global_step": 14141, "epoch": 170} {"train_loss": -18.441659927368164, "global_step": 14142, "epoch": 170} {"train_loss": -17.78479766845703, "global_step": 14143, "epoch": 170} {"train_loss": -17.903390884399414, "global_step": 14144, "epoch": 170} {"train_loss": -18.32105255126953, "global_step": 14145, "epoch": 170} {"train_loss": -18.20907974243164, "global_step": 14146, "epoch": 170} {"train_loss": -18.08420181274414, "global_step": 14147, "epoch": 170} {"train_loss": -18.19015121459961, "global_step": 14148, "epoch": 170} {"train_loss": -17.912933349609375, "global_step": 14149, "epoch": 170} {"train_loss": -17.835880279541016, "global_step": 14150, "epoch": 170} {"train_loss": -18.09157371520996, "global_step": 14151, "epoch": 170} {"train_loss": -17.80885887145996, "global_step": 14152, "epoch": 170} {"train_loss": -18.37451171875, "global_step": 14153, "epoch": 170} {"train_loss": -18.336545944213867, "global_step": 14154, "epoch": 170} {"train_loss": -18.187442779541016, "global_step": 14155, "epoch": 170} {"train_loss": -17.739887237548828, "global_step": 14156, "epoch": 170} {"train_loss": -17.472455978393555, "global_step": 14157, "epoch": 170} {"train_loss": -17.890317916870117, "global_step": 14158, "epoch": 170} {"train_loss": -17.8584041595459, "global_step": 14159, "epoch": 170} {"train_loss": -18.097373962402344, "global_step": 14160, "epoch": 170} {"train_loss": -17.837007522583008, "global_step": 14161, "epoch": 170} {"train_loss": -18.293184280395508, "global_step": 14162, "epoch": 170} {"train_loss": -17.84938621520996, "global_step": 14163, "epoch": 170} {"train_loss": -18.334096908569336, "global_step": 14164, "epoch": 170} {"train_loss": -18.170839309692383, "global_step": 14165, "epoch": 170} {"train_loss": -17.998870849609375, "global_step": 14166, "epoch": 170} {"train_loss": -18.108095169067383, "global_step": 14167, "epoch": 170} {"train_loss": -17.755674362182617, "global_step": 14168, "epoch": 170} {"train_loss": -17.858642578125, "global_step": 14169, "epoch": 170} {"train_loss": -18.01735496520996, "global_step": 14170, "epoch": 170} {"train_loss": -18.05154800415039, "global_step": 14171, "epoch": 170} {"train_loss": -18.3562068939209, "global_step": 14172, "epoch": 170} {"train_loss": -18.1173095703125, "global_step": 14173, "epoch": 170} {"train_loss": -17.64060401916504, "global_step": 14174, "epoch": 170} {"train_loss": -18.24095344543457, "global_step": 14175, "epoch": 170} {"train_loss": -17.723037719726562, "global_step": 14176, "epoch": 170} {"train_loss": -17.595983505249023, "global_step": 14177, "epoch": 170} {"train_loss": -18.139211654663086, "global_step": 14178, "epoch": 170} {"train_loss": -18.327848434448242, "global_step": 14179, "epoch": 170} {"train_loss": -17.952219009399414, "global_step": 14180, "epoch": 170} {"train_loss": -17.827056884765625, "global_step": 14181, "epoch": 170} {"train_loss": -18.178693771362305, "global_step": 14182, "epoch": 170} {"train_loss": -18.3080997467041, "global_step": 14183, "epoch": 170} {"train_loss": -18.08245849609375, "global_step": 14184, "epoch": 170} {"train_loss": -18.38759422302246, "global_step": 14185, "epoch": 170} {"train_loss": -18.074186325073242, "global_step": 14186, "epoch": 170} {"train_loss": -18.01744842529297, "global_step": 14187, "epoch": 170} {"train_loss": -18.259811401367188, "global_step": 14188, "epoch": 170} {"train_loss": -18.137723922729492, "global_step": 14189, "epoch": 170} {"train_loss": -17.966901779174805, "global_step": 14190, "epoch": 170} {"train_loss": -18.21712303161621, "global_step": 14191, "epoch": 170} {"train_loss": -18.003586619733326, "global_step": 14192, "epoch": 170, "val_loss": 6075513.0} {"train_loss": -17.771129608154297, "global_step": 14193, "epoch": 171} {"train_loss": -18.28530502319336, "global_step": 14194, "epoch": 171} {"train_loss": -18.193286895751953, "global_step": 14195, "epoch": 171} {"train_loss": -17.825084686279297, "global_step": 14196, "epoch": 171} {"train_loss": -18.14109992980957, "global_step": 14197, "epoch": 171} {"train_loss": -18.07496452331543, "global_step": 14198, "epoch": 171} {"train_loss": -18.18073844909668, "global_step": 14199, "epoch": 171} {"train_loss": -17.735776901245117, "global_step": 14200, "epoch": 171} {"train_loss": -18.08102798461914, "global_step": 14201, "epoch": 171} {"train_loss": -18.099903106689453, "global_step": 14202, "epoch": 171} {"train_loss": -18.212570190429688, "global_step": 14203, "epoch": 171} {"train_loss": -18.170175552368164, "global_step": 14204, "epoch": 171} {"train_loss": -18.373693466186523, "global_step": 14205, "epoch": 171} {"train_loss": -18.18195152282715, "global_step": 14206, "epoch": 171} {"train_loss": -17.646442413330078, "global_step": 14207, "epoch": 171} {"train_loss": -17.83283233642578, "global_step": 14208, "epoch": 171} {"train_loss": -17.77094841003418, "global_step": 14209, "epoch": 171} {"train_loss": -17.959671020507812, "global_step": 14210, "epoch": 171} {"train_loss": -17.996463775634766, "global_step": 14211, "epoch": 171} {"train_loss": -17.953388214111328, "global_step": 14212, "epoch": 171} {"train_loss": -18.15821075439453, "global_step": 14213, "epoch": 171} {"train_loss": -17.777341842651367, "global_step": 14214, "epoch": 171} {"train_loss": -18.022663116455078, "global_step": 14215, "epoch": 171} {"train_loss": -18.0148868560791, "global_step": 14216, "epoch": 171} {"train_loss": -17.98917007446289, "global_step": 14217, "epoch": 171} {"train_loss": -17.66128921508789, "global_step": 14218, "epoch": 171} {"train_loss": -17.935718536376953, "global_step": 14219, "epoch": 171} {"train_loss": -17.96966552734375, "global_step": 14220, "epoch": 171} {"train_loss": -17.89969253540039, "global_step": 14221, "epoch": 171} {"train_loss": -17.874784469604492, "global_step": 14222, "epoch": 171} {"train_loss": -18.232053756713867, "global_step": 14223, "epoch": 171} {"train_loss": -17.838916778564453, "global_step": 14224, "epoch": 171} {"train_loss": -18.270505905151367, "global_step": 14225, "epoch": 171} {"train_loss": -18.342823028564453, "global_step": 14226, "epoch": 171} {"train_loss": -17.950551986694336, "global_step": 14227, "epoch": 171} {"train_loss": -17.685274124145508, "global_step": 14228, "epoch": 171} {"train_loss": -17.568565368652344, "global_step": 14229, "epoch": 171} {"train_loss": -17.896408081054688, "global_step": 14230, "epoch": 171} {"train_loss": -17.979320526123047, "global_step": 14231, "epoch": 171} {"train_loss": -17.97768783569336, "global_step": 14232, "epoch": 171} {"train_loss": -18.144147872924805, "global_step": 14233, "epoch": 171} {"train_loss": -18.031524658203125, "global_step": 14234, "epoch": 171} {"train_loss": -17.884830474853516, "global_step": 14235, "epoch": 171} {"train_loss": -18.003311157226562, "global_step": 14236, "epoch": 171} {"train_loss": -17.915014266967773, "global_step": 14237, "epoch": 171} {"train_loss": -17.813339233398438, "global_step": 14238, "epoch": 171} {"train_loss": -18.056894302368164, "global_step": 14239, "epoch": 171} {"train_loss": -18.261119842529297, "global_step": 14240, "epoch": 171} {"train_loss": -18.03126335144043, "global_step": 14241, "epoch": 171} {"train_loss": -18.164594650268555, "global_step": 14242, "epoch": 171} {"train_loss": -18.054685592651367, "global_step": 14243, "epoch": 171} {"train_loss": -17.654800415039062, "global_step": 14244, "epoch": 171} {"train_loss": -18.0448055267334, "global_step": 14245, "epoch": 171} {"train_loss": -18.139928817749023, "global_step": 14246, "epoch": 171} {"train_loss": -18.3952693939209, "global_step": 14247, "epoch": 171} {"train_loss": -17.87312889099121, "global_step": 14248, "epoch": 171} {"train_loss": -18.2189884185791, "global_step": 14249, "epoch": 171} {"train_loss": -18.096349716186523, "global_step": 14250, "epoch": 171} {"train_loss": -18.00295066833496, "global_step": 14251, "epoch": 171} {"train_loss": -18.155654907226562, "global_step": 14252, "epoch": 171} {"train_loss": -18.16497230529785, "global_step": 14253, "epoch": 171} {"train_loss": -17.657642364501953, "global_step": 14254, "epoch": 171} {"train_loss": -18.12965965270996, "global_step": 14255, "epoch": 171} {"train_loss": -17.9919376373291, "global_step": 14256, "epoch": 171} {"train_loss": -18.13865089416504, "global_step": 14257, "epoch": 171} {"train_loss": -18.5822811126709, "global_step": 14258, "epoch": 171} {"train_loss": -18.19803237915039, "global_step": 14259, "epoch": 171} {"train_loss": -18.032373428344727, "global_step": 14260, "epoch": 171} {"train_loss": -17.86797523498535, "global_step": 14261, "epoch": 171} {"train_loss": -18.102725982666016, "global_step": 14262, "epoch": 171} {"train_loss": -17.675086975097656, "global_step": 14263, "epoch": 171} {"train_loss": -18.19808006286621, "global_step": 14264, "epoch": 171} {"train_loss": -18.032644271850586, "global_step": 14265, "epoch": 171} {"train_loss": -17.95442771911621, "global_step": 14266, "epoch": 171} {"train_loss": -17.732397079467773, "global_step": 14267, "epoch": 171} {"train_loss": -18.093603134155273, "global_step": 14268, "epoch": 171} {"train_loss": -17.970273971557617, "global_step": 14269, "epoch": 171} {"train_loss": -18.48951530456543, "global_step": 14270, "epoch": 171} {"train_loss": -17.655961990356445, "global_step": 14271, "epoch": 171} {"train_loss": -17.518550872802734, "global_step": 14272, "epoch": 171} {"train_loss": -17.961225509643555, "global_step": 14273, "epoch": 171} {"train_loss": -17.652708053588867, "global_step": 14274, "epoch": 171} {"train_loss": -18.014045347650367, "global_step": 14275, "epoch": 171, "val_loss": 6121919.5} {"train_loss": -17.71375846862793, "global_step": 14276, "epoch": 172} {"train_loss": -17.665292739868164, "global_step": 14277, "epoch": 172} {"train_loss": -18.288022994995117, "global_step": 14278, "epoch": 172} {"train_loss": -17.522668838500977, "global_step": 14279, "epoch": 172} {"train_loss": -18.210899353027344, "global_step": 14280, "epoch": 172} {"train_loss": -17.474735260009766, "global_step": 14281, "epoch": 172} {"train_loss": -17.662233352661133, "global_step": 14282, "epoch": 172} {"train_loss": -18.12122917175293, "global_step": 14283, "epoch": 172} {"train_loss": -17.70130729675293, "global_step": 14284, "epoch": 172} {"train_loss": -17.850522994995117, "global_step": 14285, "epoch": 172} {"train_loss": -17.676904678344727, "global_step": 14286, "epoch": 172} {"train_loss": -17.869869232177734, "global_step": 14287, "epoch": 172} {"train_loss": -17.832252502441406, "global_step": 14288, "epoch": 172} {"train_loss": -18.145395278930664, "global_step": 14289, "epoch": 172} {"train_loss": -17.95709800720215, "global_step": 14290, "epoch": 172} {"train_loss": -17.535030364990234, "global_step": 14291, "epoch": 172} {"train_loss": -18.568906784057617, "global_step": 14292, "epoch": 172} {"train_loss": -17.78553581237793, "global_step": 14293, "epoch": 172} {"train_loss": -18.242122650146484, "global_step": 14294, "epoch": 172} {"train_loss": -17.806812286376953, "global_step": 14295, "epoch": 172} {"train_loss": -17.789548873901367, "global_step": 14296, "epoch": 172} {"train_loss": -17.6488094329834, "global_step": 14297, "epoch": 172} {"train_loss": -18.146957397460938, "global_step": 14298, "epoch": 172} {"train_loss": -18.107994079589844, "global_step": 14299, "epoch": 172} {"train_loss": -17.991180419921875, "global_step": 14300, "epoch": 172} {"train_loss": -18.3071346282959, "global_step": 14301, "epoch": 172} {"train_loss": -18.323780059814453, "global_step": 14302, "epoch": 172} {"train_loss": -18.054685592651367, "global_step": 14303, "epoch": 172} {"train_loss": -18.231708526611328, "global_step": 14304, "epoch": 172} {"train_loss": -17.70265007019043, "global_step": 14305, "epoch": 172} {"train_loss": -18.089618682861328, "global_step": 14306, "epoch": 172} {"train_loss": -17.79433250427246, "global_step": 14307, "epoch": 172} {"train_loss": -17.766183853149414, "global_step": 14308, "epoch": 172} {"train_loss": -18.331449508666992, "global_step": 14309, "epoch": 172} {"train_loss": -17.98675537109375, "global_step": 14310, "epoch": 172} {"train_loss": -17.71837043762207, "global_step": 14311, "epoch": 172} {"train_loss": -18.316022872924805, "global_step": 14312, "epoch": 172} {"train_loss": -18.587583541870117, "global_step": 14313, "epoch": 172} {"train_loss": -18.10201072692871, "global_step": 14314, "epoch": 172} {"train_loss": -18.094867706298828, "global_step": 14315, "epoch": 172} {"train_loss": -17.973676681518555, "global_step": 14316, "epoch": 172} {"train_loss": -17.652090072631836, "global_step": 14317, "epoch": 172} {"train_loss": -18.007150650024414, "global_step": 14318, "epoch": 172} {"train_loss": -17.960620880126953, "global_step": 14319, "epoch": 172} {"train_loss": -18.053266525268555, "global_step": 14320, "epoch": 172} {"train_loss": -18.072677612304688, "global_step": 14321, "epoch": 172} {"train_loss": -17.97410011291504, "global_step": 14322, "epoch": 172} {"train_loss": -18.160303115844727, "global_step": 14323, "epoch": 172} {"train_loss": -17.80734634399414, "global_step": 14324, "epoch": 172} {"train_loss": -18.11884880065918, "global_step": 14325, "epoch": 172} {"train_loss": -17.95745277404785, "global_step": 14326, "epoch": 172} {"train_loss": -17.76007652282715, "global_step": 14327, "epoch": 172} {"train_loss": -17.995359420776367, "global_step": 14328, "epoch": 172} {"train_loss": -18.08013343811035, "global_step": 14329, "epoch": 172} {"train_loss": -17.999094009399414, "global_step": 14330, "epoch": 172} {"train_loss": -17.816009521484375, "global_step": 14331, "epoch": 172} {"train_loss": -18.2216739654541, "global_step": 14332, "epoch": 172} {"train_loss": -18.1979923248291, "global_step": 14333, "epoch": 172} {"train_loss": -17.73651123046875, "global_step": 14334, "epoch": 172} {"train_loss": -17.941627502441406, "global_step": 14335, "epoch": 172} {"train_loss": -18.3023738861084, "global_step": 14336, "epoch": 172} {"train_loss": -17.738386154174805, "global_step": 14337, "epoch": 172} {"train_loss": -18.001108169555664, "global_step": 14338, "epoch": 172} {"train_loss": -17.9718074798584, "global_step": 14339, "epoch": 172} {"train_loss": -17.912662506103516, "global_step": 14340, "epoch": 172} {"train_loss": -17.959867477416992, "global_step": 14341, "epoch": 172} {"train_loss": -17.74659538269043, "global_step": 14342, "epoch": 172} {"train_loss": -18.046051025390625, "global_step": 14343, "epoch": 172} {"train_loss": -17.795394897460938, "global_step": 14344, "epoch": 172} {"train_loss": -18.28960418701172, "global_step": 14345, "epoch": 172} {"train_loss": -18.107975006103516, "global_step": 14346, "epoch": 172} {"train_loss": -18.124114990234375, "global_step": 14347, "epoch": 172} {"train_loss": -18.257322311401367, "global_step": 14348, "epoch": 172} {"train_loss": -18.059186935424805, "global_step": 14349, "epoch": 172} {"train_loss": -18.37995719909668, "global_step": 14350, "epoch": 172} {"train_loss": -17.884801864624023, "global_step": 14351, "epoch": 172} {"train_loss": -18.296817779541016, "global_step": 14352, "epoch": 172} {"train_loss": -17.82741928100586, "global_step": 14353, "epoch": 172} {"train_loss": -18.51993179321289, "global_step": 14354, "epoch": 172} {"train_loss": -18.29928970336914, "global_step": 14355, "epoch": 172} {"train_loss": -17.97771644592285, "global_step": 14356, "epoch": 172} {"train_loss": -17.88083839416504, "global_step": 14357, "epoch": 172} {"train_loss": -18.01513322577419, "global_step": 14358, "epoch": 172, "val_loss": 6097486.0} {"train_loss": -17.53902244567871, "global_step": 14359, "epoch": 173} {"train_loss": -18.019500732421875, "global_step": 14360, "epoch": 173} {"train_loss": -17.705900192260742, "global_step": 14361, "epoch": 173} {"train_loss": -17.850980758666992, "global_step": 14362, "epoch": 173} {"train_loss": -17.727672576904297, "global_step": 14363, "epoch": 173} {"train_loss": -18.411203384399414, "global_step": 14364, "epoch": 173} {"train_loss": -17.9104061126709, "global_step": 14365, "epoch": 173} {"train_loss": -18.020246505737305, "global_step": 14366, "epoch": 173} {"train_loss": -17.804349899291992, "global_step": 14367, "epoch": 173} {"train_loss": -17.846914291381836, "global_step": 14368, "epoch": 173} {"train_loss": -17.911212921142578, "global_step": 14369, "epoch": 173} {"train_loss": -17.641128540039062, "global_step": 14370, "epoch": 173} {"train_loss": -17.949691772460938, "global_step": 14371, "epoch": 173} {"train_loss": -17.500242233276367, "global_step": 14372, "epoch": 173} {"train_loss": -18.011747360229492, "global_step": 14373, "epoch": 173} {"train_loss": -17.59956169128418, "global_step": 14374, "epoch": 173} {"train_loss": -17.904390335083008, "global_step": 14375, "epoch": 173} {"train_loss": -18.228242874145508, "global_step": 14376, "epoch": 173} {"train_loss": -17.646703720092773, "global_step": 14377, "epoch": 173} {"train_loss": -17.88718032836914, "global_step": 14378, "epoch": 173} {"train_loss": -18.211505889892578, "global_step": 14379, "epoch": 173} {"train_loss": -17.961103439331055, "global_step": 14380, "epoch": 173} {"train_loss": -17.667774200439453, "global_step": 14381, "epoch": 173} {"train_loss": -17.815227508544922, "global_step": 14382, "epoch": 173} {"train_loss": -17.49654197692871, "global_step": 14383, "epoch": 173} {"train_loss": -18.16927719116211, "global_step": 14384, "epoch": 173} {"train_loss": -18.21921730041504, "global_step": 14385, "epoch": 173} {"train_loss": -17.881052017211914, "global_step": 14386, "epoch": 173} {"train_loss": -17.722320556640625, "global_step": 14387, "epoch": 173} {"train_loss": -18.352323532104492, "global_step": 14388, "epoch": 173} {"train_loss": -18.31260108947754, "global_step": 14389, "epoch": 173} {"train_loss": -18.09581184387207, "global_step": 14390, "epoch": 173} {"train_loss": -18.357248306274414, "global_step": 14391, "epoch": 173} {"train_loss": -18.100732803344727, "global_step": 14392, "epoch": 173} {"train_loss": -17.866687774658203, "global_step": 14393, "epoch": 173} {"train_loss": -18.072954177856445, "global_step": 14394, "epoch": 173} {"train_loss": -18.063119888305664, "global_step": 14395, "epoch": 173} {"train_loss": -18.278583526611328, "global_step": 14396, "epoch": 173} {"train_loss": -18.284093856811523, "global_step": 14397, "epoch": 173} {"train_loss": -18.101715087890625, "global_step": 14398, "epoch": 173} {"train_loss": -18.254568099975586, "global_step": 14399, "epoch": 173} {"train_loss": -18.230365753173828, "global_step": 14400, "epoch": 173} {"train_loss": -17.849903106689453, "global_step": 14401, "epoch": 173} {"train_loss": -17.893808364868164, "global_step": 14402, "epoch": 173} {"train_loss": -17.89791488647461, "global_step": 14403, "epoch": 173} {"train_loss": -17.849952697753906, "global_step": 14404, "epoch": 173} {"train_loss": -18.092023849487305, "global_step": 14405, "epoch": 173} {"train_loss": -18.262670516967773, "global_step": 14406, "epoch": 173} {"train_loss": -18.195178985595703, "global_step": 14407, "epoch": 173} {"train_loss": -18.163909912109375, "global_step": 14408, "epoch": 173} {"train_loss": -18.065433502197266, "global_step": 14409, "epoch": 173} {"train_loss": -18.08794593811035, "global_step": 14410, "epoch": 173} {"train_loss": -17.93037223815918, "global_step": 14411, "epoch": 173} {"train_loss": -18.220443725585938, "global_step": 14412, "epoch": 173} {"train_loss": -17.753150939941406, "global_step": 14413, "epoch": 173} {"train_loss": -18.01950454711914, "global_step": 14414, "epoch": 173} {"train_loss": -18.327795028686523, "global_step": 14415, "epoch": 173} {"train_loss": -17.60683250427246, "global_step": 14416, "epoch": 173} {"train_loss": -17.814434051513672, "global_step": 14417, "epoch": 173} {"train_loss": -18.561614990234375, "global_step": 14418, "epoch": 173} {"train_loss": -18.252172470092773, "global_step": 14419, "epoch": 173} {"train_loss": -18.00164222717285, "global_step": 14420, "epoch": 173} {"train_loss": -18.456796646118164, "global_step": 14421, "epoch": 173} {"train_loss": -18.037691116333008, "global_step": 14422, "epoch": 173} {"train_loss": -18.514842987060547, "global_step": 14423, "epoch": 173} {"train_loss": -17.92926788330078, "global_step": 14424, "epoch": 173} {"train_loss": -18.202077865600586, "global_step": 14425, "epoch": 173} {"train_loss": -18.062009811401367, "global_step": 14426, "epoch": 173} {"train_loss": -18.20347023010254, "global_step": 14427, "epoch": 173} {"train_loss": -18.12058448791504, "global_step": 14428, "epoch": 173} {"train_loss": -18.127042770385742, "global_step": 14429, "epoch": 173} {"train_loss": -17.916547775268555, "global_step": 14430, "epoch": 173} {"train_loss": -18.20259666442871, "global_step": 14431, "epoch": 173} {"train_loss": -18.121076583862305, "global_step": 14432, "epoch": 173} {"train_loss": -18.070293426513672, "global_step": 14433, "epoch": 173} {"train_loss": -18.046314239501953, "global_step": 14434, "epoch": 173} {"train_loss": -18.116180419921875, "global_step": 14435, "epoch": 173} {"train_loss": -18.365875244140625, "global_step": 14436, "epoch": 173} {"train_loss": -17.80833625793457, "global_step": 14437, "epoch": 173} {"train_loss": -18.24200439453125, "global_step": 14438, "epoch": 173} {"train_loss": -18.147668838500977, "global_step": 14439, "epoch": 173} {"train_loss": -17.99982261657715, "global_step": 14440, "epoch": 173} {"train_loss": -18.03274772827884, "global_step": 14441, "epoch": 173, "val_loss": 6071821.0} {"train_loss": -18.07855796813965, "global_step": 14442, "epoch": 174} {"train_loss": -17.68190574645996, "global_step": 14443, "epoch": 174} {"train_loss": -18.015453338623047, "global_step": 14444, "epoch": 174} {"train_loss": -17.750486373901367, "global_step": 14445, "epoch": 174} {"train_loss": -18.137434005737305, "global_step": 14446, "epoch": 174} {"train_loss": -17.65644645690918, "global_step": 14447, "epoch": 174} {"train_loss": -18.022872924804688, "global_step": 14448, "epoch": 174} {"train_loss": -18.167766571044922, "global_step": 14449, "epoch": 174} {"train_loss": -18.198511123657227, "global_step": 14450, "epoch": 174} {"train_loss": -18.18863296508789, "global_step": 14451, "epoch": 174} {"train_loss": -18.04908561706543, "global_step": 14452, "epoch": 174} {"train_loss": -17.75602912902832, "global_step": 14453, "epoch": 174} {"train_loss": -17.966705322265625, "global_step": 14454, "epoch": 174} {"train_loss": -18.270917892456055, "global_step": 14455, "epoch": 174} {"train_loss": -18.170019149780273, "global_step": 14456, "epoch": 174} {"train_loss": -17.997453689575195, "global_step": 14457, "epoch": 174} {"train_loss": -18.19815444946289, "global_step": 14458, "epoch": 174} {"train_loss": -17.933589935302734, "global_step": 14459, "epoch": 174} {"train_loss": -17.77552604675293, "global_step": 14460, "epoch": 174} {"train_loss": -18.120832443237305, "global_step": 14461, "epoch": 174} {"train_loss": -17.919092178344727, "global_step": 14462, "epoch": 174} {"train_loss": -18.2348575592041, "global_step": 14463, "epoch": 174} {"train_loss": -18.335308074951172, "global_step": 14464, "epoch": 174} {"train_loss": -18.2579402923584, "global_step": 14465, "epoch": 174} {"train_loss": -17.896421432495117, "global_step": 14466, "epoch": 174} {"train_loss": -18.217655181884766, "global_step": 14467, "epoch": 174} {"train_loss": -18.267902374267578, "global_step": 14468, "epoch": 174} {"train_loss": -18.081247329711914, "global_step": 14469, "epoch": 174} {"train_loss": -17.96651268005371, "global_step": 14470, "epoch": 174} {"train_loss": -18.048734664916992, "global_step": 14471, "epoch": 174} {"train_loss": -17.95863151550293, "global_step": 14472, "epoch": 174} {"train_loss": -17.81867790222168, "global_step": 14473, "epoch": 174} {"train_loss": -17.575136184692383, "global_step": 14474, "epoch": 174} {"train_loss": -17.84157371520996, "global_step": 14475, "epoch": 174} {"train_loss": -18.192676544189453, "global_step": 14476, "epoch": 174} {"train_loss": -17.651151657104492, "global_step": 14477, "epoch": 174} {"train_loss": -18.075952529907227, "global_step": 14478, "epoch": 174} {"train_loss": -18.318105697631836, "global_step": 14479, "epoch": 174} {"train_loss": -17.834463119506836, "global_step": 14480, "epoch": 174} {"train_loss": -18.263463973999023, "global_step": 14481, "epoch": 174} {"train_loss": -18.09857940673828, "global_step": 14482, "epoch": 174} {"train_loss": -17.900848388671875, "global_step": 14483, "epoch": 174} {"train_loss": -17.742460250854492, "global_step": 14484, "epoch": 174} {"train_loss": -18.159284591674805, "global_step": 14485, "epoch": 174} {"train_loss": -18.187549591064453, "global_step": 14486, "epoch": 174} {"train_loss": -18.29163360595703, "global_step": 14487, "epoch": 174} {"train_loss": -18.224376678466797, "global_step": 14488, "epoch": 174} {"train_loss": -17.833524703979492, "global_step": 14489, "epoch": 174} {"train_loss": -17.673059463500977, "global_step": 14490, "epoch": 174} {"train_loss": -17.766231536865234, "global_step": 14491, "epoch": 174} {"train_loss": -17.942371368408203, "global_step": 14492, "epoch": 174} {"train_loss": -17.81057357788086, "global_step": 14493, "epoch": 174} {"train_loss": -18.173233032226562, "global_step": 14494, "epoch": 174} {"train_loss": -17.950498580932617, "global_step": 14495, "epoch": 174} {"train_loss": -17.980260848999023, "global_step": 14496, "epoch": 174} {"train_loss": -18.471786499023438, "global_step": 14497, "epoch": 174} {"train_loss": -17.861059188842773, "global_step": 14498, "epoch": 174} {"train_loss": -18.352340698242188, "global_step": 14499, "epoch": 174} {"train_loss": -18.09235191345215, "global_step": 14500, "epoch": 174} {"train_loss": -18.074934005737305, "global_step": 14501, "epoch": 174} {"train_loss": -17.94795799255371, "global_step": 14502, "epoch": 174} {"train_loss": -18.079153060913086, "global_step": 14503, "epoch": 174} {"train_loss": -17.789377212524414, "global_step": 14504, "epoch": 174} {"train_loss": -17.73959732055664, "global_step": 14505, "epoch": 174} {"train_loss": -18.39562225341797, "global_step": 14506, "epoch": 174} {"train_loss": -18.051433563232422, "global_step": 14507, "epoch": 174} {"train_loss": -18.42740821838379, "global_step": 14508, "epoch": 174} {"train_loss": -18.00417137145996, "global_step": 14509, "epoch": 174} {"train_loss": -18.041635513305664, "global_step": 14510, "epoch": 174} {"train_loss": -18.210721969604492, "global_step": 14511, "epoch": 174} {"train_loss": -17.482425689697266, "global_step": 14512, "epoch": 174} {"train_loss": -18.014873504638672, "global_step": 14513, "epoch": 174} {"train_loss": -18.128463745117188, "global_step": 14514, "epoch": 174} {"train_loss": -17.90397071838379, "global_step": 14515, "epoch": 174} {"train_loss": -18.09331703186035, "global_step": 14516, "epoch": 174} {"train_loss": -18.152870178222656, "global_step": 14517, "epoch": 174} {"train_loss": -18.15553855895996, "global_step": 14518, "epoch": 174} {"train_loss": -18.152694702148438, "global_step": 14519, "epoch": 174} {"train_loss": -17.59903335571289, "global_step": 14520, "epoch": 174} {"train_loss": -17.766408920288086, "global_step": 14521, "epoch": 174} {"train_loss": -18.289596557617188, "global_step": 14522, "epoch": 174} {"train_loss": -18.160308837890625, "global_step": 14523, "epoch": 174} {"train_loss": -18.027885873633696, "global_step": 14524, "epoch": 174, "val_loss": 6080380.0} {"train_loss": -17.744243621826172, "global_step": 14525, "epoch": 175} {"train_loss": -17.970104217529297, "global_step": 14526, "epoch": 175} {"train_loss": -18.0559139251709, "global_step": 14527, "epoch": 175} {"train_loss": -18.0632266998291, "global_step": 14528, "epoch": 175} {"train_loss": -17.86382293701172, "global_step": 14529, "epoch": 175} {"train_loss": -17.36408805847168, "global_step": 14530, "epoch": 175} {"train_loss": -17.98164176940918, "global_step": 14531, "epoch": 175} {"train_loss": -17.753992080688477, "global_step": 14532, "epoch": 175} {"train_loss": -18.171009063720703, "global_step": 14533, "epoch": 175} {"train_loss": -18.02402114868164, "global_step": 14534, "epoch": 175} {"train_loss": -18.008216857910156, "global_step": 14535, "epoch": 175} {"train_loss": -17.82416343688965, "global_step": 14536, "epoch": 175} {"train_loss": -18.21126365661621, "global_step": 14537, "epoch": 175} {"train_loss": -17.964384078979492, "global_step": 14538, "epoch": 175} {"train_loss": -18.272001266479492, "global_step": 14539, "epoch": 175} {"train_loss": -18.039871215820312, "global_step": 14540, "epoch": 175} {"train_loss": -17.881345748901367, "global_step": 14541, "epoch": 175} {"train_loss": -18.176025390625, "global_step": 14542, "epoch": 175} {"train_loss": -18.48046875, "global_step": 14543, "epoch": 175} {"train_loss": -17.68045425415039, "global_step": 14544, "epoch": 175} {"train_loss": -18.211374282836914, "global_step": 14545, "epoch": 175} {"train_loss": -17.860471725463867, "global_step": 14546, "epoch": 175} {"train_loss": -17.768644332885742, "global_step": 14547, "epoch": 175} {"train_loss": -17.693531036376953, "global_step": 14548, "epoch": 175} {"train_loss": -18.369186401367188, "global_step": 14549, "epoch": 175} {"train_loss": -18.387187957763672, "global_step": 14550, "epoch": 175} {"train_loss": -17.94925308227539, "global_step": 14551, "epoch": 175} {"train_loss": -17.94660758972168, "global_step": 14552, "epoch": 175} {"train_loss": -18.18940544128418, "global_step": 14553, "epoch": 175} {"train_loss": -17.820886611938477, "global_step": 14554, "epoch": 175} {"train_loss": -17.942678451538086, "global_step": 14555, "epoch": 175} {"train_loss": -18.195287704467773, "global_step": 14556, "epoch": 175} {"train_loss": -17.87163543701172, "global_step": 14557, "epoch": 175} {"train_loss": -17.86130714416504, "global_step": 14558, "epoch": 175} {"train_loss": -17.934064865112305, "global_step": 14559, "epoch": 175} {"train_loss": -18.31907081604004, "global_step": 14560, "epoch": 175} {"train_loss": -18.348724365234375, "global_step": 14561, "epoch": 175} {"train_loss": -18.211658477783203, "global_step": 14562, "epoch": 175} {"train_loss": -18.35449981689453, "global_step": 14563, "epoch": 175} {"train_loss": -18.01064109802246, "global_step": 14564, "epoch": 175} {"train_loss": -18.186613082885742, "global_step": 14565, "epoch": 175} {"train_loss": -18.208301544189453, "global_step": 14566, "epoch": 175} {"train_loss": -18.33181381225586, "global_step": 14567, "epoch": 175} {"train_loss": -18.46131134033203, "global_step": 14568, "epoch": 175} {"train_loss": -17.885526657104492, "global_step": 14569, "epoch": 175} {"train_loss": -18.430927276611328, "global_step": 14570, "epoch": 175} {"train_loss": -18.006696701049805, "global_step": 14571, "epoch": 175} {"train_loss": -18.056806564331055, "global_step": 14572, "epoch": 175} {"train_loss": -18.115886688232422, "global_step": 14573, "epoch": 175} {"train_loss": -17.641372680664062, "global_step": 14574, "epoch": 175} {"train_loss": -18.142715454101562, "global_step": 14575, "epoch": 175} {"train_loss": -17.93235969543457, "global_step": 14576, "epoch": 175} {"train_loss": -18.202428817749023, "global_step": 14577, "epoch": 175} {"train_loss": -18.18239402770996, "global_step": 14578, "epoch": 175} {"train_loss": -18.016881942749023, "global_step": 14579, "epoch": 175} {"train_loss": -18.016782760620117, "global_step": 14580, "epoch": 175} {"train_loss": -18.387117385864258, "global_step": 14581, "epoch": 175} {"train_loss": -18.091352462768555, "global_step": 14582, "epoch": 175} {"train_loss": -18.065139770507812, "global_step": 14583, "epoch": 175} {"train_loss": -17.986087799072266, "global_step": 14584, "epoch": 175} {"train_loss": -18.29878807067871, "global_step": 14585, "epoch": 175} {"train_loss": -17.72921371459961, "global_step": 14586, "epoch": 175} {"train_loss": -18.392288208007812, "global_step": 14587, "epoch": 175} {"train_loss": -17.98847770690918, "global_step": 14588, "epoch": 175} {"train_loss": -18.079763412475586, "global_step": 14589, "epoch": 175} {"train_loss": -17.98244857788086, "global_step": 14590, "epoch": 175} {"train_loss": -17.679609298706055, "global_step": 14591, "epoch": 175} {"train_loss": -18.09551239013672, "global_step": 14592, "epoch": 175} {"train_loss": -18.155553817749023, "global_step": 14593, "epoch": 175} {"train_loss": -18.55240249633789, "global_step": 14594, "epoch": 175} {"train_loss": -18.300434112548828, "global_step": 14595, "epoch": 175} {"train_loss": -18.379243850708008, "global_step": 14596, "epoch": 175} {"train_loss": -18.27872085571289, "global_step": 14597, "epoch": 175} {"train_loss": -17.890064239501953, "global_step": 14598, "epoch": 175} {"train_loss": -17.875930786132812, "global_step": 14599, "epoch": 175} {"train_loss": -17.71242904663086, "global_step": 14600, "epoch": 175} {"train_loss": -18.089584350585938, "global_step": 14601, "epoch": 175} {"train_loss": -17.89361572265625, "global_step": 14602, "epoch": 175} {"train_loss": -17.892822265625, "global_step": 14603, "epoch": 175} {"train_loss": -17.81416893005371, "global_step": 14604, "epoch": 175} {"train_loss": -17.844480514526367, "global_step": 14605, "epoch": 175} {"train_loss": -18.138198852539062, "global_step": 14606, "epoch": 175} {"train_loss": -18.055554815085536, "global_step": 14607, "epoch": 175, "val_loss": 6119851.0} {"train_loss": -17.89555549621582, "global_step": 14608, "epoch": 176} {"train_loss": -18.20044708251953, "global_step": 14609, "epoch": 176} {"train_loss": -18.05292510986328, "global_step": 14610, "epoch": 176} {"train_loss": -18.02898406982422, "global_step": 14611, "epoch": 176} {"train_loss": -18.104631423950195, "global_step": 14612, "epoch": 176} {"train_loss": -17.971195220947266, "global_step": 14613, "epoch": 176} {"train_loss": -17.847997665405273, "global_step": 14614, "epoch": 176} {"train_loss": -17.96201515197754, "global_step": 14615, "epoch": 176} {"train_loss": -18.116474151611328, "global_step": 14616, "epoch": 176} {"train_loss": -17.729490280151367, "global_step": 14617, "epoch": 176} {"train_loss": -18.09956169128418, "global_step": 14618, "epoch": 176} {"train_loss": -18.279834747314453, "global_step": 14619, "epoch": 176} {"train_loss": -18.071086883544922, "global_step": 14620, "epoch": 176} {"train_loss": -18.039854049682617, "global_step": 14621, "epoch": 176} {"train_loss": -18.23990821838379, "global_step": 14622, "epoch": 176} {"train_loss": -18.23414421081543, "global_step": 14623, "epoch": 176} {"train_loss": -18.364614486694336, "global_step": 14624, "epoch": 176} {"train_loss": -18.47292709350586, "global_step": 14625, "epoch": 176} {"train_loss": -18.12173843383789, "global_step": 14626, "epoch": 176} {"train_loss": -17.861967086791992, "global_step": 14627, "epoch": 176} {"train_loss": -18.1409912109375, "global_step": 14628, "epoch": 176} {"train_loss": -18.29000473022461, "global_step": 14629, "epoch": 176} {"train_loss": -17.92169189453125, "global_step": 14630, "epoch": 176} {"train_loss": -18.036039352416992, "global_step": 14631, "epoch": 176} {"train_loss": -18.255170822143555, "global_step": 14632, "epoch": 176} {"train_loss": -17.672182083129883, "global_step": 14633, "epoch": 176} {"train_loss": -18.483877182006836, "global_step": 14634, "epoch": 176} {"train_loss": -18.17683982849121, "global_step": 14635, "epoch": 176} {"train_loss": -17.913633346557617, "global_step": 14636, "epoch": 176} {"train_loss": -18.248350143432617, "global_step": 14637, "epoch": 176} {"train_loss": -18.084688186645508, "global_step": 14638, "epoch": 176} {"train_loss": -18.017637252807617, "global_step": 14639, "epoch": 176} {"train_loss": -17.9144287109375, "global_step": 14640, "epoch": 176} {"train_loss": -17.787860870361328, "global_step": 14641, "epoch": 176} {"train_loss": -17.716413497924805, "global_step": 14642, "epoch": 176} {"train_loss": -17.757963180541992, "global_step": 14643, "epoch": 176} {"train_loss": -18.252227783203125, "global_step": 14644, "epoch": 176} {"train_loss": -18.16751480102539, "global_step": 14645, "epoch": 176} {"train_loss": -17.9149227142334, "global_step": 14646, "epoch": 176} {"train_loss": -17.88153076171875, "global_step": 14647, "epoch": 176} {"train_loss": -17.78648567199707, "global_step": 14648, "epoch": 176} {"train_loss": -18.351303100585938, "global_step": 14649, "epoch": 176} {"train_loss": -18.204208374023438, "global_step": 14650, "epoch": 176} {"train_loss": -18.1444091796875, "global_step": 14651, "epoch": 176} {"train_loss": -18.075103759765625, "global_step": 14652, "epoch": 176} {"train_loss": -18.057350158691406, "global_step": 14653, "epoch": 176} {"train_loss": -18.122936248779297, "global_step": 14654, "epoch": 176} {"train_loss": -18.329431533813477, "global_step": 14655, "epoch": 176} {"train_loss": -18.01057243347168, "global_step": 14656, "epoch": 176} {"train_loss": -17.791175842285156, "global_step": 14657, "epoch": 176} {"train_loss": -18.334732055664062, "global_step": 14658, "epoch": 176} {"train_loss": -18.09556770324707, "global_step": 14659, "epoch": 176} {"train_loss": -18.16153335571289, "global_step": 14660, "epoch": 176} {"train_loss": -18.099945068359375, "global_step": 14661, "epoch": 176} {"train_loss": -17.83897590637207, "global_step": 14662, "epoch": 176} {"train_loss": -18.097412109375, "global_step": 14663, "epoch": 176} {"train_loss": -18.154541015625, "global_step": 14664, "epoch": 176} {"train_loss": -18.280685424804688, "global_step": 14665, "epoch": 176} {"train_loss": -17.868505477905273, "global_step": 14666, "epoch": 176} {"train_loss": -17.46254539489746, "global_step": 14667, "epoch": 176} {"train_loss": -18.011445999145508, "global_step": 14668, "epoch": 176} {"train_loss": -17.7694091796875, "global_step": 14669, "epoch": 176} {"train_loss": -17.984394073486328, "global_step": 14670, "epoch": 176} {"train_loss": -18.114421844482422, "global_step": 14671, "epoch": 176} {"train_loss": -18.439863204956055, "global_step": 14672, "epoch": 176} {"train_loss": -17.590681076049805, "global_step": 14673, "epoch": 176} {"train_loss": -18.156330108642578, "global_step": 14674, "epoch": 176} {"train_loss": -17.974206924438477, "global_step": 14675, "epoch": 176} {"train_loss": -17.884702682495117, "global_step": 14676, "epoch": 176} {"train_loss": -18.060293197631836, "global_step": 14677, "epoch": 176} {"train_loss": -18.08405303955078, "global_step": 14678, "epoch": 176} {"train_loss": -17.518463134765625, "global_step": 14679, "epoch": 176} {"train_loss": -18.318845748901367, "global_step": 14680, "epoch": 176} {"train_loss": -17.883207321166992, "global_step": 14681, "epoch": 176} {"train_loss": -18.098064422607422, "global_step": 14682, "epoch": 176} {"train_loss": -18.299442291259766, "global_step": 14683, "epoch": 176} {"train_loss": -18.369953155517578, "global_step": 14684, "epoch": 176} {"train_loss": -18.236419677734375, "global_step": 14685, "epoch": 176} {"train_loss": -18.07695770263672, "global_step": 14686, "epoch": 176} {"train_loss": -17.511219024658203, "global_step": 14687, "epoch": 176} {"train_loss": -17.970067977905273, "global_step": 14688, "epoch": 176} {"train_loss": -17.716793060302734, "global_step": 14689, "epoch": 176} {"train_loss": -18.065155948501037, "global_step": 14690, "epoch": 176, "val_loss": 6221412.0} {"train_loss": -18.040969848632812, "global_step": 14691, "epoch": 177} {"train_loss": -17.767154693603516, "global_step": 14692, "epoch": 177} {"train_loss": -17.992414474487305, "global_step": 14693, "epoch": 177} {"train_loss": -18.039270401000977, "global_step": 14694, "epoch": 177} {"train_loss": -18.12834930419922, "global_step": 14695, "epoch": 177} {"train_loss": -17.959253311157227, "global_step": 14696, "epoch": 177} {"train_loss": -17.67600440979004, "global_step": 14697, "epoch": 177} {"train_loss": -17.737821578979492, "global_step": 14698, "epoch": 177} {"train_loss": -17.62318992614746, "global_step": 14699, "epoch": 177} {"train_loss": -18.280914306640625, "global_step": 14700, "epoch": 177} {"train_loss": -17.910741806030273, "global_step": 14701, "epoch": 177} {"train_loss": -18.309349060058594, "global_step": 14702, "epoch": 177} {"train_loss": -17.327804565429688, "global_step": 14703, "epoch": 177} {"train_loss": -17.87946128845215, "global_step": 14704, "epoch": 177} {"train_loss": -18.423826217651367, "global_step": 14705, "epoch": 177} {"train_loss": -17.775524139404297, "global_step": 14706, "epoch": 177} {"train_loss": -17.901485443115234, "global_step": 14707, "epoch": 177} {"train_loss": -17.864233016967773, "global_step": 14708, "epoch": 177} {"train_loss": -18.212238311767578, "global_step": 14709, "epoch": 177} {"train_loss": -17.84183692932129, "global_step": 14710, "epoch": 177} {"train_loss": -17.967641830444336, "global_step": 14711, "epoch": 177} {"train_loss": -18.00275993347168, "global_step": 14712, "epoch": 177} {"train_loss": -17.905900955200195, "global_step": 14713, "epoch": 177} {"train_loss": -18.17744255065918, "global_step": 14714, "epoch": 177} {"train_loss": -17.955490112304688, "global_step": 14715, "epoch": 177} {"train_loss": -18.057157516479492, "global_step": 14716, "epoch": 177} {"train_loss": -17.884532928466797, "global_step": 14717, "epoch": 177} {"train_loss": -18.28356170654297, "global_step": 14718, "epoch": 177} {"train_loss": -18.022258758544922, "global_step": 14719, "epoch": 177} {"train_loss": -18.10546875, "global_step": 14720, "epoch": 177} {"train_loss": -17.931921005249023, "global_step": 14721, "epoch": 177} {"train_loss": -18.012969970703125, "global_step": 14722, "epoch": 177} {"train_loss": -18.057220458984375, "global_step": 14723, "epoch": 177} {"train_loss": -18.232084274291992, "global_step": 14724, "epoch": 177} {"train_loss": -18.43575096130371, "global_step": 14725, "epoch": 177} {"train_loss": -18.24517822265625, "global_step": 14726, "epoch": 177} {"train_loss": -18.396860122680664, "global_step": 14727, "epoch": 177} {"train_loss": -18.099748611450195, "global_step": 14728, "epoch": 177} {"train_loss": -18.17291259765625, "global_step": 14729, "epoch": 177} {"train_loss": -17.53878402709961, "global_step": 14730, "epoch": 177} {"train_loss": -18.009872436523438, "global_step": 14731, "epoch": 177} {"train_loss": -18.179433822631836, "global_step": 14732, "epoch": 177} {"train_loss": -18.10127067565918, "global_step": 14733, "epoch": 177} {"train_loss": -18.211017608642578, "global_step": 14734, "epoch": 177} {"train_loss": -18.052536010742188, "global_step": 14735, "epoch": 177} {"train_loss": -17.864418029785156, "global_step": 14736, "epoch": 177} {"train_loss": -17.759845733642578, "global_step": 14737, "epoch": 177} {"train_loss": -18.303909301757812, "global_step": 14738, "epoch": 177} {"train_loss": -18.396902084350586, "global_step": 14739, "epoch": 177} {"train_loss": -18.320514678955078, "global_step": 14740, "epoch": 177} {"train_loss": -18.12026023864746, "global_step": 14741, "epoch": 177} {"train_loss": -18.33722496032715, "global_step": 14742, "epoch": 177} {"train_loss": -18.348583221435547, "global_step": 14743, "epoch": 177} {"train_loss": -18.027612686157227, "global_step": 14744, "epoch": 177} {"train_loss": -17.8730525970459, "global_step": 14745, "epoch": 177} {"train_loss": -17.831562042236328, "global_step": 14746, "epoch": 177} {"train_loss": -17.954647064208984, "global_step": 14747, "epoch": 177} {"train_loss": -18.225383758544922, "global_step": 14748, "epoch": 177} {"train_loss": -17.722593307495117, "global_step": 14749, "epoch": 177} {"train_loss": -18.136539459228516, "global_step": 14750, "epoch": 177} {"train_loss": -17.862319946289062, "global_step": 14751, "epoch": 177} {"train_loss": -18.3491153717041, "global_step": 14752, "epoch": 177} {"train_loss": -17.79592514038086, "global_step": 14753, "epoch": 177} {"train_loss": -18.079605102539062, "global_step": 14754, "epoch": 177} {"train_loss": -18.465742111206055, "global_step": 14755, "epoch": 177} {"train_loss": -18.4392032623291, "global_step": 14756, "epoch": 177} {"train_loss": -18.015180587768555, "global_step": 14757, "epoch": 177} {"train_loss": -18.005956649780273, "global_step": 14758, "epoch": 177} {"train_loss": -18.13804054260254, "global_step": 14759, "epoch": 177} {"train_loss": -17.891996383666992, "global_step": 14760, "epoch": 177} {"train_loss": -18.167373657226562, "global_step": 14761, "epoch": 177} {"train_loss": -17.902935028076172, "global_step": 14762, "epoch": 177} {"train_loss": -17.8413143157959, "global_step": 14763, "epoch": 177} {"train_loss": -18.0280704498291, "global_step": 14764, "epoch": 177} {"train_loss": -17.59044075012207, "global_step": 14765, "epoch": 177} {"train_loss": -18.146434783935547, "global_step": 14766, "epoch": 177} {"train_loss": -18.008981704711914, "global_step": 14767, "epoch": 177} {"train_loss": -18.100269317626953, "global_step": 14768, "epoch": 177} {"train_loss": -17.78077507019043, "global_step": 14769, "epoch": 177} {"train_loss": -18.472064971923828, "global_step": 14770, "epoch": 177} {"train_loss": -18.17085838317871, "global_step": 14771, "epoch": 177} {"train_loss": -17.77159309387207, "global_step": 14772, "epoch": 177} {"train_loss": -18.032682189022204, "global_step": 14773, "epoch": 177, "val_loss": 6141961.5} {"train_loss": -17.548376083374023, "global_step": 14774, "epoch": 178} {"train_loss": -17.876697540283203, "global_step": 14775, "epoch": 178} {"train_loss": -17.840394973754883, "global_step": 14776, "epoch": 178} {"train_loss": -17.874311447143555, "global_step": 14777, "epoch": 178} {"train_loss": -17.983932495117188, "global_step": 14778, "epoch": 178} {"train_loss": -17.96966552734375, "global_step": 14779, "epoch": 178} {"train_loss": -17.900691986083984, "global_step": 14780, "epoch": 178} {"train_loss": -17.96500587463379, "global_step": 14781, "epoch": 178} {"train_loss": -18.24092674255371, "global_step": 14782, "epoch": 178} {"train_loss": -17.907896041870117, "global_step": 14783, "epoch": 178} {"train_loss": -17.62582778930664, "global_step": 14784, "epoch": 178} {"train_loss": -17.765390396118164, "global_step": 14785, "epoch": 178} {"train_loss": -17.92835807800293, "global_step": 14786, "epoch": 178} {"train_loss": -18.04937171936035, "global_step": 14787, "epoch": 178} {"train_loss": -17.849533081054688, "global_step": 14788, "epoch": 178} {"train_loss": -18.186134338378906, "global_step": 14789, "epoch": 178} {"train_loss": -18.04026985168457, "global_step": 14790, "epoch": 178} {"train_loss": -18.17693519592285, "global_step": 14791, "epoch": 178} {"train_loss": -17.809768676757812, "global_step": 14792, "epoch": 178} {"train_loss": -18.349191665649414, "global_step": 14793, "epoch": 178} {"train_loss": -17.96237564086914, "global_step": 14794, "epoch": 178} {"train_loss": -18.123191833496094, "global_step": 14795, "epoch": 178} {"train_loss": -17.670372009277344, "global_step": 14796, "epoch": 178} {"train_loss": -18.2699031829834, "global_step": 14797, "epoch": 178} {"train_loss": -18.01092529296875, "global_step": 14798, "epoch": 178} {"train_loss": -18.498220443725586, "global_step": 14799, "epoch": 178} {"train_loss": -17.812503814697266, "global_step": 14800, "epoch": 178} {"train_loss": -18.32320213317871, "global_step": 14801, "epoch": 178} {"train_loss": -18.28023338317871, "global_step": 14802, "epoch": 178} {"train_loss": -18.098163604736328, "global_step": 14803, "epoch": 178} {"train_loss": -17.98691177368164, "global_step": 14804, "epoch": 178} {"train_loss": -18.439599990844727, "global_step": 14805, "epoch": 178} {"train_loss": -18.03378677368164, "global_step": 14806, "epoch": 178} {"train_loss": -17.93878173828125, "global_step": 14807, "epoch": 178} {"train_loss": -18.343276977539062, "global_step": 14808, "epoch": 178} {"train_loss": -17.572568893432617, "global_step": 14809, "epoch": 178} {"train_loss": -18.126907348632812, "global_step": 14810, "epoch": 178} {"train_loss": -18.126291275024414, "global_step": 14811, "epoch": 178} {"train_loss": -18.16608238220215, "global_step": 14812, "epoch": 178} {"train_loss": -18.190040588378906, "global_step": 14813, "epoch": 178} {"train_loss": -18.15888786315918, "global_step": 14814, "epoch": 178} {"train_loss": -18.34749412536621, "global_step": 14815, "epoch": 178} {"train_loss": -18.313947677612305, "global_step": 14816, "epoch": 178} {"train_loss": -18.072660446166992, "global_step": 14817, "epoch": 178} {"train_loss": -18.045312881469727, "global_step": 14818, "epoch": 178} {"train_loss": -18.083698272705078, "global_step": 14819, "epoch": 178} {"train_loss": -18.3245792388916, "global_step": 14820, "epoch": 178} {"train_loss": -18.03217887878418, "global_step": 14821, "epoch": 178} {"train_loss": -18.201330184936523, "global_step": 14822, "epoch": 178} {"train_loss": -17.86479949951172, "global_step": 14823, "epoch": 178} {"train_loss": -18.09958267211914, "global_step": 14824, "epoch": 178} {"train_loss": -18.269906997680664, "global_step": 14825, "epoch": 178} {"train_loss": -17.924304962158203, "global_step": 14826, "epoch": 178} {"train_loss": -17.927560806274414, "global_step": 14827, "epoch": 178} {"train_loss": -17.591856002807617, "global_step": 14828, "epoch": 178} {"train_loss": -18.053668975830078, "global_step": 14829, "epoch": 178} {"train_loss": -17.881025314331055, "global_step": 14830, "epoch": 178} {"train_loss": -17.841665267944336, "global_step": 14831, "epoch": 178} {"train_loss": -18.122163772583008, "global_step": 14832, "epoch": 178} {"train_loss": -17.780515670776367, "global_step": 14833, "epoch": 178} {"train_loss": -17.961666107177734, "global_step": 14834, "epoch": 178} {"train_loss": -17.82112693786621, "global_step": 14835, "epoch": 178} {"train_loss": -18.007061004638672, "global_step": 14836, "epoch": 178} {"train_loss": -18.412853240966797, "global_step": 14837, "epoch": 178} {"train_loss": -18.186819076538086, "global_step": 14838, "epoch": 178} {"train_loss": -18.247333526611328, "global_step": 14839, "epoch": 178} {"train_loss": -17.960575103759766, "global_step": 14840, "epoch": 178} {"train_loss": -18.069198608398438, "global_step": 14841, "epoch": 178} {"train_loss": -17.85369300842285, "global_step": 14842, "epoch": 178} {"train_loss": -17.99948501586914, "global_step": 14843, "epoch": 178} {"train_loss": -18.306819915771484, "global_step": 14844, "epoch": 178} {"train_loss": -17.91857147216797, "global_step": 14845, "epoch": 178} {"train_loss": -17.851701736450195, "global_step": 14846, "epoch": 178} {"train_loss": -18.438833236694336, "global_step": 14847, "epoch": 178} {"train_loss": -18.340906143188477, "global_step": 14848, "epoch": 178} {"train_loss": -17.72276496887207, "global_step": 14849, "epoch": 178} {"train_loss": -18.073575973510742, "global_step": 14850, "epoch": 178} {"train_loss": -17.591461181640625, "global_step": 14851, "epoch": 178} {"train_loss": -18.17458152770996, "global_step": 14852, "epoch": 178} {"train_loss": -18.229965209960938, "global_step": 14853, "epoch": 178} {"train_loss": -18.249248504638672, "global_step": 14854, "epoch": 178} {"train_loss": -18.134872436523438, "global_step": 14855, "epoch": 178} {"train_loss": -18.043535784066442, "global_step": 14856, "epoch": 178, "val_loss": 6130687.0} {"train_loss": -18.08778190612793, "global_step": 14857, "epoch": 179} {"train_loss": -17.834949493408203, "global_step": 14858, "epoch": 179} {"train_loss": -17.672657012939453, "global_step": 14859, "epoch": 179} {"train_loss": -18.262775421142578, "global_step": 14860, "epoch": 179} {"train_loss": -18.137338638305664, "global_step": 14861, "epoch": 179} {"train_loss": -18.07082176208496, "global_step": 14862, "epoch": 179} {"train_loss": -18.201461791992188, "global_step": 14863, "epoch": 179} {"train_loss": -17.807119369506836, "global_step": 14864, "epoch": 179} {"train_loss": -17.976205825805664, "global_step": 14865, "epoch": 179} {"train_loss": -17.976016998291016, "global_step": 14866, "epoch": 179} {"train_loss": -17.91126823425293, "global_step": 14867, "epoch": 179} {"train_loss": -18.062898635864258, "global_step": 14868, "epoch": 179} {"train_loss": -17.955873489379883, "global_step": 14869, "epoch": 179} {"train_loss": -18.337902069091797, "global_step": 14870, "epoch": 179} {"train_loss": -18.062530517578125, "global_step": 14871, "epoch": 179} {"train_loss": -17.858306884765625, "global_step": 14872, "epoch": 179} {"train_loss": -18.01544189453125, "global_step": 14873, "epoch": 179} {"train_loss": -18.004384994506836, "global_step": 14874, "epoch": 179} {"train_loss": -18.022443771362305, "global_step": 14875, "epoch": 179} {"train_loss": -18.2277889251709, "global_step": 14876, "epoch": 179} {"train_loss": -17.767385482788086, "global_step": 14877, "epoch": 179} {"train_loss": -18.40260887145996, "global_step": 14878, "epoch": 179} {"train_loss": -18.326770782470703, "global_step": 14879, "epoch": 179} {"train_loss": -17.97351837158203, "global_step": 14880, "epoch": 179} {"train_loss": -18.05646324157715, "global_step": 14881, "epoch": 179} {"train_loss": -18.06163787841797, "global_step": 14882, "epoch": 179} {"train_loss": -17.963531494140625, "global_step": 14883, "epoch": 179} {"train_loss": -17.872419357299805, "global_step": 14884, "epoch": 179} {"train_loss": -18.24942970275879, "global_step": 14885, "epoch": 179} {"train_loss": -17.9952392578125, "global_step": 14886, "epoch": 179} {"train_loss": -18.05378532409668, "global_step": 14887, "epoch": 179} {"train_loss": -18.27088737487793, "global_step": 14888, "epoch": 179} {"train_loss": -17.867918014526367, "global_step": 14889, "epoch": 179} {"train_loss": -18.038864135742188, "global_step": 14890, "epoch": 179} {"train_loss": -18.31245231628418, "global_step": 14891, "epoch": 179} {"train_loss": -18.298120498657227, "global_step": 14892, "epoch": 179} {"train_loss": -17.76326560974121, "global_step": 14893, "epoch": 179} {"train_loss": -17.682767868041992, "global_step": 14894, "epoch": 179} {"train_loss": -18.260698318481445, "global_step": 14895, "epoch": 179} {"train_loss": -17.826791763305664, "global_step": 14896, "epoch": 179} {"train_loss": -17.87738037109375, "global_step": 14897, "epoch": 179} {"train_loss": -18.149250030517578, "global_step": 14898, "epoch": 179} {"train_loss": -18.252649307250977, "global_step": 14899, "epoch": 179} {"train_loss": -18.37538719177246, "global_step": 14900, "epoch": 179} {"train_loss": -17.958471298217773, "global_step": 14901, "epoch": 179} {"train_loss": -18.14457130432129, "global_step": 14902, "epoch": 179} {"train_loss": -18.400127410888672, "global_step": 14903, "epoch": 179} {"train_loss": -17.893329620361328, "global_step": 14904, "epoch": 179} {"train_loss": -17.648664474487305, "global_step": 14905, "epoch": 179} {"train_loss": -18.047649383544922, "global_step": 14906, "epoch": 179} {"train_loss": -18.117780685424805, "global_step": 14907, "epoch": 179} {"train_loss": -18.117467880249023, "global_step": 14908, "epoch": 179} {"train_loss": -18.21657943725586, "global_step": 14909, "epoch": 179} {"train_loss": -18.41352653503418, "global_step": 14910, "epoch": 179} {"train_loss": -17.91497802734375, "global_step": 14911, "epoch": 179} {"train_loss": -17.625089645385742, "global_step": 14912, "epoch": 179} {"train_loss": -18.37723731994629, "global_step": 14913, "epoch": 179} {"train_loss": -18.106081008911133, "global_step": 14914, "epoch": 179} {"train_loss": -17.86811637878418, "global_step": 14915, "epoch": 179} {"train_loss": -17.75507926940918, "global_step": 14916, "epoch": 179} {"train_loss": -17.95187759399414, "global_step": 14917, "epoch": 179} {"train_loss": -18.190702438354492, "global_step": 14918, "epoch": 179} {"train_loss": -18.104045867919922, "global_step": 14919, "epoch": 179} {"train_loss": -18.2708797454834, "global_step": 14920, "epoch": 179} {"train_loss": -18.130292892456055, "global_step": 14921, "epoch": 179} {"train_loss": -18.097318649291992, "global_step": 14922, "epoch": 179} {"train_loss": -17.94502067565918, "global_step": 14923, "epoch": 179} {"train_loss": -18.294282913208008, "global_step": 14924, "epoch": 179} {"train_loss": -18.20669174194336, "global_step": 14925, "epoch": 179} {"train_loss": -18.19319725036621, "global_step": 14926, "epoch": 179} {"train_loss": -18.039926528930664, "global_step": 14927, "epoch": 179} {"train_loss": -18.30246353149414, "global_step": 14928, "epoch": 179} {"train_loss": -18.053117752075195, "global_step": 14929, "epoch": 179} {"train_loss": -17.699426651000977, "global_step": 14930, "epoch": 179} {"train_loss": -18.1828556060791, "global_step": 14931, "epoch": 179} {"train_loss": -18.276865005493164, "global_step": 14932, "epoch": 179} {"train_loss": -18.220291137695312, "global_step": 14933, "epoch": 179} {"train_loss": -18.062332153320312, "global_step": 14934, "epoch": 179} {"train_loss": -18.06485939025879, "global_step": 14935, "epoch": 179} {"train_loss": -18.070556640625, "global_step": 14936, "epoch": 179} {"train_loss": -18.38043212890625, "global_step": 14937, "epoch": 179} {"train_loss": -18.049720764160156, "global_step": 14938, "epoch": 179} {"train_loss": -18.06177313931017, "global_step": 14939, "epoch": 179, "val_loss": 6005022.5} {"train_loss": -17.85282325744629, "global_step": 14940, "epoch": 180} {"train_loss": -18.277963638305664, "global_step": 14941, "epoch": 180} {"train_loss": -17.86304473876953, "global_step": 14942, "epoch": 180} {"train_loss": -17.695480346679688, "global_step": 14943, "epoch": 180} {"train_loss": -18.134113311767578, "global_step": 14944, "epoch": 180} {"train_loss": -17.82021141052246, "global_step": 14945, "epoch": 180} {"train_loss": -17.947345733642578, "global_step": 14946, "epoch": 180} {"train_loss": -18.25357437133789, "global_step": 14947, "epoch": 180} {"train_loss": -18.011428833007812, "global_step": 14948, "epoch": 180} {"train_loss": -17.946744918823242, "global_step": 14949, "epoch": 180} {"train_loss": -18.15223503112793, "global_step": 14950, "epoch": 180} {"train_loss": -18.17691421508789, "global_step": 14951, "epoch": 180} {"train_loss": -17.832632064819336, "global_step": 14952, "epoch": 180} {"train_loss": -18.040115356445312, "global_step": 14953, "epoch": 180} {"train_loss": -18.18436622619629, "global_step": 14954, "epoch": 180} {"train_loss": -17.931415557861328, "global_step": 14955, "epoch": 180} {"train_loss": -18.028398513793945, "global_step": 14956, "epoch": 180} {"train_loss": -17.944082260131836, "global_step": 14957, "epoch": 180} {"train_loss": -17.659284591674805, "global_step": 14958, "epoch": 180} {"train_loss": -18.170654296875, "global_step": 14959, "epoch": 180} {"train_loss": -17.70729637145996, "global_step": 14960, "epoch": 180} {"train_loss": -18.141555786132812, "global_step": 14961, "epoch": 180} {"train_loss": -18.359695434570312, "global_step": 14962, "epoch": 180} {"train_loss": -17.82987403869629, "global_step": 14963, "epoch": 180} {"train_loss": -18.099332809448242, "global_step": 14964, "epoch": 180} {"train_loss": -18.049072265625, "global_step": 14965, "epoch": 180} {"train_loss": -18.278186798095703, "global_step": 14966, "epoch": 180} {"train_loss": -18.033315658569336, "global_step": 14967, "epoch": 180} {"train_loss": -18.304357528686523, "global_step": 14968, "epoch": 180} {"train_loss": -17.936203002929688, "global_step": 14969, "epoch": 180} {"train_loss": -17.946170806884766, "global_step": 14970, "epoch": 180} {"train_loss": -18.075056076049805, "global_step": 14971, "epoch": 180} {"train_loss": -17.64661979675293, "global_step": 14972, "epoch": 180} {"train_loss": -18.194303512573242, "global_step": 14973, "epoch": 180} {"train_loss": -17.994993209838867, "global_step": 14974, "epoch": 180} {"train_loss": -18.56729507446289, "global_step": 14975, "epoch": 180} {"train_loss": -18.20369529724121, "global_step": 14976, "epoch": 180} {"train_loss": -17.902690887451172, "global_step": 14977, "epoch": 180} {"train_loss": -18.009061813354492, "global_step": 14978, "epoch": 180} {"train_loss": -18.080469131469727, "global_step": 14979, "epoch": 180} {"train_loss": -18.173892974853516, "global_step": 14980, "epoch": 180} {"train_loss": -18.202280044555664, "global_step": 14981, "epoch": 180} {"train_loss": -18.546329498291016, "global_step": 14982, "epoch": 180} {"train_loss": -18.05888557434082, "global_step": 14983, "epoch": 180} {"train_loss": -18.442279815673828, "global_step": 14984, "epoch": 180} {"train_loss": -17.89799690246582, "global_step": 14985, "epoch": 180} {"train_loss": -18.12887954711914, "global_step": 14986, "epoch": 180} {"train_loss": -17.929746627807617, "global_step": 14987, "epoch": 180} {"train_loss": -18.08548355102539, "global_step": 14988, "epoch": 180} {"train_loss": -18.053504943847656, "global_step": 14989, "epoch": 180} {"train_loss": -18.493457794189453, "global_step": 14990, "epoch": 180} {"train_loss": -18.33584976196289, "global_step": 14991, "epoch": 180} {"train_loss": -18.38174819946289, "global_step": 14992, "epoch": 180} {"train_loss": -18.081220626831055, "global_step": 14993, "epoch": 180} {"train_loss": -18.03767204284668, "global_step": 14994, "epoch": 180} {"train_loss": -17.97413444519043, "global_step": 14995, "epoch": 180} {"train_loss": -17.869853973388672, "global_step": 14996, "epoch": 180} {"train_loss": -17.81011962890625, "global_step": 14997, "epoch": 180} {"train_loss": -18.04840660095215, "global_step": 14998, "epoch": 180} {"train_loss": -17.845775604248047, "global_step": 14999, "epoch": 180} {"train_loss": -18.585163116455078, "global_step": 15000, "epoch": 180} {"train_loss": -17.62148094177246, "global_step": 15001, "epoch": 180} {"train_loss": -18.619298934936523, "global_step": 15002, "epoch": 180} {"train_loss": -17.678136825561523, "global_step": 15003, "epoch": 180} {"train_loss": -18.06761932373047, "global_step": 15004, "epoch": 180} {"train_loss": -18.190176010131836, "global_step": 15005, "epoch": 180} {"train_loss": -17.476980209350586, "global_step": 15006, "epoch": 180} {"train_loss": -18.141437530517578, "global_step": 15007, "epoch": 180} {"train_loss": -18.31328773498535, "global_step": 15008, "epoch": 180} {"train_loss": -18.09114646911621, "global_step": 15009, "epoch": 180} {"train_loss": -18.333648681640625, "global_step": 15010, "epoch": 180} {"train_loss": -17.98793601989746, "global_step": 15011, "epoch": 180} {"train_loss": -18.140609741210938, "global_step": 15012, "epoch": 180} {"train_loss": -17.919328689575195, "global_step": 15013, "epoch": 180} {"train_loss": -17.90592384338379, "global_step": 15014, "epoch": 180} {"train_loss": -18.023778915405273, "global_step": 15015, "epoch": 180} {"train_loss": -18.031911849975586, "global_step": 15016, "epoch": 180} {"train_loss": -18.403213500976562, "global_step": 15017, "epoch": 180} {"train_loss": -17.951311111450195, "global_step": 15018, "epoch": 180} {"train_loss": -18.153244018554688, "global_step": 15019, "epoch": 180} {"train_loss": -18.41305923461914, "global_step": 15020, "epoch": 180} {"train_loss": -17.839021682739258, "global_step": 15021, "epoch": 180} {"train_loss": -18.072271094264753, "global_step": 15022, "epoch": 180, "val_loss": 6379806.0} {"train_loss": -17.946603775024414, "global_step": 15023, "epoch": 181} {"train_loss": -17.705503463745117, "global_step": 15024, "epoch": 181} {"train_loss": -18.139116287231445, "global_step": 15025, "epoch": 181} {"train_loss": -18.042531967163086, "global_step": 15026, "epoch": 181} {"train_loss": -18.068775177001953, "global_step": 15027, "epoch": 181} {"train_loss": -17.90700340270996, "global_step": 15028, "epoch": 181} {"train_loss": -18.020658493041992, "global_step": 15029, "epoch": 181} {"train_loss": -18.074199676513672, "global_step": 15030, "epoch": 181} {"train_loss": -17.878578186035156, "global_step": 15031, "epoch": 181} {"train_loss": -17.789306640625, "global_step": 15032, "epoch": 181} {"train_loss": -18.042510986328125, "global_step": 15033, "epoch": 181} {"train_loss": -17.95574188232422, "global_step": 15034, "epoch": 181} {"train_loss": -18.144203186035156, "global_step": 15035, "epoch": 181} {"train_loss": -18.161975860595703, "global_step": 15036, "epoch": 181} {"train_loss": -17.831302642822266, "global_step": 15037, "epoch": 181} {"train_loss": -18.58953285217285, "global_step": 15038, "epoch": 181} {"train_loss": -17.8701171875, "global_step": 15039, "epoch": 181} {"train_loss": -18.13589096069336, "global_step": 15040, "epoch": 181} {"train_loss": -18.057172775268555, "global_step": 15041, "epoch": 181} {"train_loss": -18.112207412719727, "global_step": 15042, "epoch": 181} {"train_loss": -17.96091079711914, "global_step": 15043, "epoch": 181} {"train_loss": -17.68531608581543, "global_step": 15044, "epoch": 181} {"train_loss": -18.24505615234375, "global_step": 15045, "epoch": 181} {"train_loss": -18.24549674987793, "global_step": 15046, "epoch": 181} {"train_loss": -18.300132751464844, "global_step": 15047, "epoch": 181} {"train_loss": -18.42860221862793, "global_step": 15048, "epoch": 181} {"train_loss": -18.165781021118164, "global_step": 15049, "epoch": 181} {"train_loss": -18.128416061401367, "global_step": 15050, "epoch": 181} {"train_loss": -17.92549705505371, "global_step": 15051, "epoch": 181} {"train_loss": -18.49810218811035, "global_step": 15052, "epoch": 181} {"train_loss": -18.293493270874023, "global_step": 15053, "epoch": 181} {"train_loss": -18.203954696655273, "global_step": 15054, "epoch": 181} {"train_loss": -18.101682662963867, "global_step": 15055, "epoch": 181} {"train_loss": -17.732053756713867, "global_step": 15056, "epoch": 181} {"train_loss": -18.349536895751953, "global_step": 15057, "epoch": 181} {"train_loss": -18.02191734313965, "global_step": 15058, "epoch": 181} {"train_loss": -17.81644630432129, "global_step": 15059, "epoch": 181} {"train_loss": -17.87531852722168, "global_step": 15060, "epoch": 181} {"train_loss": -18.076263427734375, "global_step": 15061, "epoch": 181} {"train_loss": -17.903461456298828, "global_step": 15062, "epoch": 181} {"train_loss": -17.77433204650879, "global_step": 15063, "epoch": 181} {"train_loss": -18.394962310791016, "global_step": 15064, "epoch": 181} {"train_loss": -18.099624633789062, "global_step": 15065, "epoch": 181} {"train_loss": -17.742307662963867, "global_step": 15066, "epoch": 181} {"train_loss": -17.95192527770996, "global_step": 15067, "epoch": 181} {"train_loss": -18.127017974853516, "global_step": 15068, "epoch": 181} {"train_loss": -18.0296688079834, "global_step": 15069, "epoch": 181} {"train_loss": -18.377389907836914, "global_step": 15070, "epoch": 181} {"train_loss": -18.29157829284668, "global_step": 15071, "epoch": 181} {"train_loss": -17.88197135925293, "global_step": 15072, "epoch": 181} {"train_loss": -17.77846908569336, "global_step": 15073, "epoch": 181} {"train_loss": -18.533681869506836, "global_step": 15074, "epoch": 181} {"train_loss": -18.181798934936523, "global_step": 15075, "epoch": 181} {"train_loss": -17.66350746154785, "global_step": 15076, "epoch": 181} {"train_loss": -17.775156021118164, "global_step": 15077, "epoch": 181} {"train_loss": -18.086759567260742, "global_step": 15078, "epoch": 181} {"train_loss": -17.661039352416992, "global_step": 15079, "epoch": 181} {"train_loss": -18.218631744384766, "global_step": 15080, "epoch": 181} {"train_loss": -18.184520721435547, "global_step": 15081, "epoch": 181} {"train_loss": -18.287378311157227, "global_step": 15082, "epoch": 181} {"train_loss": -18.148038864135742, "global_step": 15083, "epoch": 181} {"train_loss": -18.157337188720703, "global_step": 15084, "epoch": 181} {"train_loss": -18.143447875976562, "global_step": 15085, "epoch": 181} {"train_loss": -17.993417739868164, "global_step": 15086, "epoch": 181} {"train_loss": -18.061704635620117, "global_step": 15087, "epoch": 181} {"train_loss": -17.720407485961914, "global_step": 15088, "epoch": 181} {"train_loss": -18.24002456665039, "global_step": 15089, "epoch": 181} {"train_loss": -18.219694137573242, "global_step": 15090, "epoch": 181} {"train_loss": -18.2558650970459, "global_step": 15091, "epoch": 181} {"train_loss": -17.656240463256836, "global_step": 15092, "epoch": 181} {"train_loss": -17.993118286132812, "global_step": 15093, "epoch": 181} {"train_loss": -18.0470027923584, "global_step": 15094, "epoch": 181} {"train_loss": -17.998287200927734, "global_step": 15095, "epoch": 181} {"train_loss": -18.276609420776367, "global_step": 15096, "epoch": 181} {"train_loss": -18.01828956604004, "global_step": 15097, "epoch": 181} {"train_loss": -18.156925201416016, "global_step": 15098, "epoch": 181} {"train_loss": -18.14360809326172, "global_step": 15099, "epoch": 181} {"train_loss": -17.950714111328125, "global_step": 15100, "epoch": 181} {"train_loss": -17.99735450744629, "global_step": 15101, "epoch": 181} {"train_loss": -18.200220108032227, "global_step": 15102, "epoch": 181} {"train_loss": -18.36567497253418, "global_step": 15103, "epoch": 181} {"train_loss": -17.834270477294922, "global_step": 15104, "epoch": 181} {"train_loss": -18.056336161601973, "global_step": 15105, "epoch": 181, "val_loss": 6088931.0} {"train_loss": -17.852527618408203, "global_step": 15106, "epoch": 182} {"train_loss": -18.078027725219727, "global_step": 15107, "epoch": 182} {"train_loss": -17.781177520751953, "global_step": 15108, "epoch": 182} {"train_loss": -18.447956085205078, "global_step": 15109, "epoch": 182} {"train_loss": -17.957075119018555, "global_step": 15110, "epoch": 182} {"train_loss": -17.836252212524414, "global_step": 15111, "epoch": 182} {"train_loss": -18.1474666595459, "global_step": 15112, "epoch": 182} {"train_loss": -17.706594467163086, "global_step": 15113, "epoch": 182} {"train_loss": -17.298145294189453, "global_step": 15114, "epoch": 182} {"train_loss": -17.832456588745117, "global_step": 15115, "epoch": 182} {"train_loss": -17.771547317504883, "global_step": 15116, "epoch": 182} {"train_loss": -17.7342529296875, "global_step": 15117, "epoch": 182} {"train_loss": -18.162641525268555, "global_step": 15118, "epoch": 182} {"train_loss": -17.69916343688965, "global_step": 15119, "epoch": 182} {"train_loss": -17.826234817504883, "global_step": 15120, "epoch": 182} {"train_loss": -17.794763565063477, "global_step": 15121, "epoch": 182} {"train_loss": -17.819250106811523, "global_step": 15122, "epoch": 182} {"train_loss": -17.735885620117188, "global_step": 15123, "epoch": 182} {"train_loss": -18.077411651611328, "global_step": 15124, "epoch": 182} {"train_loss": -18.027847290039062, "global_step": 15125, "epoch": 182} {"train_loss": -18.09736442565918, "global_step": 15126, "epoch": 182} {"train_loss": -17.76059913635254, "global_step": 15127, "epoch": 182} {"train_loss": -18.082639694213867, "global_step": 15128, "epoch": 182} {"train_loss": -18.385046005249023, "global_step": 15129, "epoch": 182} {"train_loss": -17.954788208007812, "global_step": 15130, "epoch": 182} {"train_loss": -18.248735427856445, "global_step": 15131, "epoch": 182} {"train_loss": -18.009952545166016, "global_step": 15132, "epoch": 182} {"train_loss": -18.346603393554688, "global_step": 15133, "epoch": 182} {"train_loss": -18.08917236328125, "global_step": 15134, "epoch": 182} {"train_loss": -18.020227432250977, "global_step": 15135, "epoch": 182} {"train_loss": -18.089588165283203, "global_step": 15136, "epoch": 182} {"train_loss": -18.25614356994629, "global_step": 15137, "epoch": 182} {"train_loss": -18.091257095336914, "global_step": 15138, "epoch": 182} {"train_loss": -18.150253295898438, "global_step": 15139, "epoch": 182} {"train_loss": -18.18772315979004, "global_step": 15140, "epoch": 182} {"train_loss": -18.18647575378418, "global_step": 15141, "epoch": 182} {"train_loss": -18.175947189331055, "global_step": 15142, "epoch": 182} {"train_loss": -18.61714744567871, "global_step": 15143, "epoch": 182} {"train_loss": -18.17998504638672, "global_step": 15144, "epoch": 182} {"train_loss": -18.161365509033203, "global_step": 15145, "epoch": 182} {"train_loss": -18.146072387695312, "global_step": 15146, "epoch": 182} {"train_loss": -18.30030632019043, "global_step": 15147, "epoch": 182} {"train_loss": -18.032209396362305, "global_step": 15148, "epoch": 182} {"train_loss": -18.43352699279785, "global_step": 15149, "epoch": 182} {"train_loss": -18.166793823242188, "global_step": 15150, "epoch": 182} {"train_loss": -18.03969383239746, "global_step": 15151, "epoch": 182} {"train_loss": -18.127140045166016, "global_step": 15152, "epoch": 182} {"train_loss": -18.22127342224121, "global_step": 15153, "epoch": 182} {"train_loss": -18.14899253845215, "global_step": 15154, "epoch": 182} {"train_loss": -17.883216857910156, "global_step": 15155, "epoch": 182} {"train_loss": -17.971454620361328, "global_step": 15156, "epoch": 182} {"train_loss": -18.318893432617188, "global_step": 15157, "epoch": 182} {"train_loss": -18.00254249572754, "global_step": 15158, "epoch": 182} {"train_loss": -18.05975341796875, "global_step": 15159, "epoch": 182} {"train_loss": -17.633975982666016, "global_step": 15160, "epoch": 182} {"train_loss": -17.898170471191406, "global_step": 15161, "epoch": 182} {"train_loss": -18.377609252929688, "global_step": 15162, "epoch": 182} {"train_loss": -18.39097785949707, "global_step": 15163, "epoch": 182} {"train_loss": -17.986631393432617, "global_step": 15164, "epoch": 182} {"train_loss": -17.835519790649414, "global_step": 15165, "epoch": 182} {"train_loss": -18.069015502929688, "global_step": 15166, "epoch": 182} {"train_loss": -17.796552658081055, "global_step": 15167, "epoch": 182} {"train_loss": -17.902952194213867, "global_step": 15168, "epoch": 182} {"train_loss": -18.05177116394043, "global_step": 15169, "epoch": 182} {"train_loss": -18.277847290039062, "global_step": 15170, "epoch": 182} {"train_loss": -18.146976470947266, "global_step": 15171, "epoch": 182} {"train_loss": -17.780532836914062, "global_step": 15172, "epoch": 182} {"train_loss": -18.25634765625, "global_step": 15173, "epoch": 182} {"train_loss": -18.39007568359375, "global_step": 15174, "epoch": 182} {"train_loss": -18.156211853027344, "global_step": 15175, "epoch": 182} {"train_loss": -18.233247756958008, "global_step": 15176, "epoch": 182} {"train_loss": -17.85334014892578, "global_step": 15177, "epoch": 182} {"train_loss": -18.038232803344727, "global_step": 15178, "epoch": 182} {"train_loss": -18.046133041381836, "global_step": 15179, "epoch": 182} {"train_loss": -17.893590927124023, "global_step": 15180, "epoch": 182} {"train_loss": -18.00446891784668, "global_step": 15181, "epoch": 182} {"train_loss": -18.41151237487793, "global_step": 15182, "epoch": 182} {"train_loss": -18.21320152282715, "global_step": 15183, "epoch": 182} {"train_loss": -18.49013328552246, "global_step": 15184, "epoch": 182} {"train_loss": -18.324277877807617, "global_step": 15185, "epoch": 182} {"train_loss": -18.228208541870117, "global_step": 15186, "epoch": 182} {"train_loss": -18.008222579956055, "global_step": 15187, "epoch": 182} {"train_loss": -18.055938743683228, "global_step": 15188, "epoch": 182, "val_loss": 6099207.5} {"train_loss": -18.04999542236328, "global_step": 15189, "epoch": 183} {"train_loss": -17.993000030517578, "global_step": 15190, "epoch": 183} {"train_loss": -17.988754272460938, "global_step": 15191, "epoch": 183} {"train_loss": -18.079177856445312, "global_step": 15192, "epoch": 183} {"train_loss": -18.30714225769043, "global_step": 15193, "epoch": 183} {"train_loss": -18.243314743041992, "global_step": 15194, "epoch": 183} {"train_loss": -18.406911849975586, "global_step": 15195, "epoch": 183} {"train_loss": -18.28994369506836, "global_step": 15196, "epoch": 183} {"train_loss": -18.204137802124023, "global_step": 15197, "epoch": 183} {"train_loss": -18.60343360900879, "global_step": 15198, "epoch": 183} {"train_loss": -17.995908737182617, "global_step": 15199, "epoch": 183} {"train_loss": -18.441864013671875, "global_step": 15200, "epoch": 183} {"train_loss": -18.037643432617188, "global_step": 15201, "epoch": 183} {"train_loss": -18.374929428100586, "global_step": 15202, "epoch": 183} {"train_loss": -17.766950607299805, "global_step": 15203, "epoch": 183} {"train_loss": -18.067182540893555, "global_step": 15204, "epoch": 183} {"train_loss": -18.30560874938965, "global_step": 15205, "epoch": 183} {"train_loss": -18.100683212280273, "global_step": 15206, "epoch": 183} {"train_loss": -18.323644638061523, "global_step": 15207, "epoch": 183} {"train_loss": -18.519689559936523, "global_step": 15208, "epoch": 183} {"train_loss": -17.86471939086914, "global_step": 15209, "epoch": 183} {"train_loss": -17.951597213745117, "global_step": 15210, "epoch": 183} {"train_loss": -17.908401489257812, "global_step": 15211, "epoch": 183} {"train_loss": -17.911527633666992, "global_step": 15212, "epoch": 183} {"train_loss": -18.118223190307617, "global_step": 15213, "epoch": 183} {"train_loss": -17.9884033203125, "global_step": 15214, "epoch": 183} {"train_loss": -17.967069625854492, "global_step": 15215, "epoch": 183} {"train_loss": -18.127304077148438, "global_step": 15216, "epoch": 183} {"train_loss": -18.032047271728516, "global_step": 15217, "epoch": 183} {"train_loss": -17.647817611694336, "global_step": 15218, "epoch": 183} {"train_loss": -18.334033966064453, "global_step": 15219, "epoch": 183} {"train_loss": -18.25701332092285, "global_step": 15220, "epoch": 183} {"train_loss": -18.28200340270996, "global_step": 15221, "epoch": 183} {"train_loss": -17.999256134033203, "global_step": 15222, "epoch": 183} {"train_loss": -17.93763542175293, "global_step": 15223, "epoch": 183} {"train_loss": -17.87322425842285, "global_step": 15224, "epoch": 183} {"train_loss": -18.10011100769043, "global_step": 15225, "epoch": 183} {"train_loss": -17.85970115661621, "global_step": 15226, "epoch": 183} {"train_loss": -18.2226619720459, "global_step": 15227, "epoch": 183} {"train_loss": -18.23318099975586, "global_step": 15228, "epoch": 183} {"train_loss": -17.759984970092773, "global_step": 15229, "epoch": 183} {"train_loss": -18.041336059570312, "global_step": 15230, "epoch": 183} {"train_loss": -17.968524932861328, "global_step": 15231, "epoch": 183} {"train_loss": -17.693859100341797, "global_step": 15232, "epoch": 183} {"train_loss": -17.897811889648438, "global_step": 15233, "epoch": 183} {"train_loss": -17.954364776611328, "global_step": 15234, "epoch": 183} {"train_loss": -18.001739501953125, "global_step": 15235, "epoch": 183} {"train_loss": -17.908641815185547, "global_step": 15236, "epoch": 183} {"train_loss": -17.941509246826172, "global_step": 15237, "epoch": 183} {"train_loss": -18.01578140258789, "global_step": 15238, "epoch": 183} {"train_loss": -17.80959129333496, "global_step": 15239, "epoch": 183} {"train_loss": -18.314550399780273, "global_step": 15240, "epoch": 183} {"train_loss": -17.910017013549805, "global_step": 15241, "epoch": 183} {"train_loss": -18.242177963256836, "global_step": 15242, "epoch": 183} {"train_loss": -17.7275447845459, "global_step": 15243, "epoch": 183} {"train_loss": -18.13373565673828, "global_step": 15244, "epoch": 183} {"train_loss": -18.212385177612305, "global_step": 15245, "epoch": 183} {"train_loss": -18.36616325378418, "global_step": 15246, "epoch": 183} {"train_loss": -17.8468017578125, "global_step": 15247, "epoch": 183} {"train_loss": -17.795507431030273, "global_step": 15248, "epoch": 183} {"train_loss": -18.43123435974121, "global_step": 15249, "epoch": 183} {"train_loss": -18.016462326049805, "global_step": 15250, "epoch": 183} {"train_loss": -18.201297760009766, "global_step": 15251, "epoch": 183} {"train_loss": -18.196460723876953, "global_step": 15252, "epoch": 183} {"train_loss": -18.49281883239746, "global_step": 15253, "epoch": 183} {"train_loss": -18.176685333251953, "global_step": 15254, "epoch": 183} {"train_loss": -18.098453521728516, "global_step": 15255, "epoch": 183} {"train_loss": -18.13089370727539, "global_step": 15256, "epoch": 183} {"train_loss": -18.44710350036621, "global_step": 15257, "epoch": 183} {"train_loss": -17.951459884643555, "global_step": 15258, "epoch": 183} {"train_loss": -18.261276245117188, "global_step": 15259, "epoch": 183} {"train_loss": -18.007492065429688, "global_step": 15260, "epoch": 183} {"train_loss": -18.317108154296875, "global_step": 15261, "epoch": 183} {"train_loss": -18.08567237854004, "global_step": 15262, "epoch": 183} {"train_loss": -18.058692932128906, "global_step": 15263, "epoch": 183} {"train_loss": -18.23858642578125, "global_step": 15264, "epoch": 183} {"train_loss": -17.857587814331055, "global_step": 15265, "epoch": 183} {"train_loss": -18.2622013092041, "global_step": 15266, "epoch": 183} {"train_loss": -18.29536247253418, "global_step": 15267, "epoch": 183} {"train_loss": -17.64033317565918, "global_step": 15268, "epoch": 183} {"train_loss": -17.92677116394043, "global_step": 15269, "epoch": 183} {"train_loss": -17.86322021484375, "global_step": 15270, "epoch": 183} {"train_loss": -18.082371930041944, "global_step": 15271, "epoch": 183, "val_loss": 6116197.5} {"train_loss": -17.787734985351562, "global_step": 15272, "epoch": 184} {"train_loss": -17.682010650634766, "global_step": 15273, "epoch": 184} {"train_loss": -18.11867904663086, "global_step": 15274, "epoch": 184} {"train_loss": -18.2353515625, "global_step": 15275, "epoch": 184} {"train_loss": -17.903106689453125, "global_step": 15276, "epoch": 184} {"train_loss": -17.966270446777344, "global_step": 15277, "epoch": 184} {"train_loss": -17.932098388671875, "global_step": 15278, "epoch": 184} {"train_loss": -18.113168716430664, "global_step": 15279, "epoch": 184} {"train_loss": -18.0268497467041, "global_step": 15280, "epoch": 184} {"train_loss": -18.084148406982422, "global_step": 15281, "epoch": 184} {"train_loss": -17.80159568786621, "global_step": 15282, "epoch": 184} {"train_loss": -17.760116577148438, "global_step": 15283, "epoch": 184} {"train_loss": -18.327558517456055, "global_step": 15284, "epoch": 184} {"train_loss": -17.895034790039062, "global_step": 15285, "epoch": 184} {"train_loss": -18.319223403930664, "global_step": 15286, "epoch": 184} {"train_loss": -17.744741439819336, "global_step": 15287, "epoch": 184} {"train_loss": -18.29817008972168, "global_step": 15288, "epoch": 184} {"train_loss": -18.0269775390625, "global_step": 15289, "epoch": 184} {"train_loss": -18.235593795776367, "global_step": 15290, "epoch": 184} {"train_loss": -17.73103904724121, "global_step": 15291, "epoch": 184} {"train_loss": -18.099271774291992, "global_step": 15292, "epoch": 184} {"train_loss": -17.900699615478516, "global_step": 15293, "epoch": 184} {"train_loss": -18.17500114440918, "global_step": 15294, "epoch": 184} {"train_loss": -18.064680099487305, "global_step": 15295, "epoch": 184} {"train_loss": -18.12110137939453, "global_step": 15296, "epoch": 184} {"train_loss": -18.032297134399414, "global_step": 15297, "epoch": 184} {"train_loss": -18.159399032592773, "global_step": 15298, "epoch": 184} {"train_loss": -18.548805236816406, "global_step": 15299, "epoch": 184} {"train_loss": -18.173908233642578, "global_step": 15300, "epoch": 184} {"train_loss": -17.90260887145996, "global_step": 15301, "epoch": 184} {"train_loss": -18.394073486328125, "global_step": 15302, "epoch": 184} {"train_loss": -18.18071174621582, "global_step": 15303, "epoch": 184} {"train_loss": -17.805734634399414, "global_step": 15304, "epoch": 184} {"train_loss": -18.52197265625, "global_step": 15305, "epoch": 184} {"train_loss": -18.03213882446289, "global_step": 15306, "epoch": 184} {"train_loss": -18.14503288269043, "global_step": 15307, "epoch": 184} {"train_loss": -18.44008445739746, "global_step": 15308, "epoch": 184} {"train_loss": -17.848331451416016, "global_step": 15309, "epoch": 184} {"train_loss": -17.632238388061523, "global_step": 15310, "epoch": 184} {"train_loss": -17.94024658203125, "global_step": 15311, "epoch": 184} {"train_loss": -17.644630432128906, "global_step": 15312, "epoch": 184} {"train_loss": -18.103166580200195, "global_step": 15313, "epoch": 184} {"train_loss": -18.18317985534668, "global_step": 15314, "epoch": 184} {"train_loss": -18.264204025268555, "global_step": 15315, "epoch": 184} {"train_loss": -18.141956329345703, "global_step": 15316, "epoch": 184} {"train_loss": -18.325769424438477, "global_step": 15317, "epoch": 184} {"train_loss": -17.78011131286621, "global_step": 15318, "epoch": 184} {"train_loss": -18.042198181152344, "global_step": 15319, "epoch": 184} {"train_loss": -18.12563133239746, "global_step": 15320, "epoch": 184} {"train_loss": -17.85573959350586, "global_step": 15321, "epoch": 184} {"train_loss": -18.244714736938477, "global_step": 15322, "epoch": 184} {"train_loss": -18.0245304107666, "global_step": 15323, "epoch": 184} {"train_loss": -18.357885360717773, "global_step": 15324, "epoch": 184} {"train_loss": -17.792470932006836, "global_step": 15325, "epoch": 184} {"train_loss": -17.872344970703125, "global_step": 15326, "epoch": 184} {"train_loss": -18.143566131591797, "global_step": 15327, "epoch": 184} {"train_loss": -18.293062210083008, "global_step": 15328, "epoch": 184} {"train_loss": -18.075960159301758, "global_step": 15329, "epoch": 184} {"train_loss": -18.583614349365234, "global_step": 15330, "epoch": 184} {"train_loss": -18.16387939453125, "global_step": 15331, "epoch": 184} {"train_loss": -17.980031967163086, "global_step": 15332, "epoch": 184} {"train_loss": -18.251022338867188, "global_step": 15333, "epoch": 184} {"train_loss": -17.882606506347656, "global_step": 15334, "epoch": 184} {"train_loss": -18.1571102142334, "global_step": 15335, "epoch": 184} {"train_loss": -18.223148345947266, "global_step": 15336, "epoch": 184} {"train_loss": -17.934349060058594, "global_step": 15337, "epoch": 184} {"train_loss": -18.30743408203125, "global_step": 15338, "epoch": 184} {"train_loss": -18.120325088500977, "global_step": 15339, "epoch": 184} {"train_loss": -17.721847534179688, "global_step": 15340, "epoch": 184} {"train_loss": -18.359586715698242, "global_step": 15341, "epoch": 184} {"train_loss": -18.436426162719727, "global_step": 15342, "epoch": 184} {"train_loss": -17.92286491394043, "global_step": 15343, "epoch": 184} {"train_loss": -18.266162872314453, "global_step": 15344, "epoch": 184} {"train_loss": -18.078153610229492, "global_step": 15345, "epoch": 184} {"train_loss": -17.968521118164062, "global_step": 15346, "epoch": 184} {"train_loss": -18.292844772338867, "global_step": 15347, "epoch": 184} {"train_loss": -17.9222354888916, "global_step": 15348, "epoch": 184} {"train_loss": -18.30182456970215, "global_step": 15349, "epoch": 184} {"train_loss": -18.354169845581055, "global_step": 15350, "epoch": 184} {"train_loss": -18.254491806030273, "global_step": 15351, "epoch": 184} {"train_loss": -17.865270614624023, "global_step": 15352, "epoch": 184} {"train_loss": -18.27633285522461, "global_step": 15353, "epoch": 184} {"train_loss": -18.105646501104516, "global_step": 15354, "epoch": 184, "val_loss": 6085752.0} {"train_loss": -17.862457275390625, "global_step": 15355, "epoch": 185} {"train_loss": -18.273303985595703, "global_step": 15356, "epoch": 185} {"train_loss": -17.61276626586914, "global_step": 15357, "epoch": 185} {"train_loss": -17.687488555908203, "global_step": 15358, "epoch": 185} {"train_loss": -17.570646286010742, "global_step": 15359, "epoch": 185} {"train_loss": -18.0062198638916, "global_step": 15360, "epoch": 185} {"train_loss": -17.862579345703125, "global_step": 15361, "epoch": 185} {"train_loss": -18.29176902770996, "global_step": 15362, "epoch": 185} {"train_loss": -17.77308464050293, "global_step": 15363, "epoch": 185} {"train_loss": -18.248554229736328, "global_step": 15364, "epoch": 185} {"train_loss": -18.3172550201416, "global_step": 15365, "epoch": 185} {"train_loss": -18.030534744262695, "global_step": 15366, "epoch": 185} {"train_loss": -18.068510055541992, "global_step": 15367, "epoch": 185} {"train_loss": -18.368562698364258, "global_step": 15368, "epoch": 185} {"train_loss": -18.46979331970215, "global_step": 15369, "epoch": 185} {"train_loss": -17.985300064086914, "global_step": 15370, "epoch": 185} {"train_loss": -17.90158462524414, "global_step": 15371, "epoch": 185} {"train_loss": -18.11628532409668, "global_step": 15372, "epoch": 185} {"train_loss": -18.170154571533203, "global_step": 15373, "epoch": 185} {"train_loss": -18.210311889648438, "global_step": 15374, "epoch": 185} {"train_loss": -17.875003814697266, "global_step": 15375, "epoch": 185} {"train_loss": -17.986356735229492, "global_step": 15376, "epoch": 185} {"train_loss": -18.10869789123535, "global_step": 15377, "epoch": 185} {"train_loss": -18.074005126953125, "global_step": 15378, "epoch": 185} {"train_loss": -18.061553955078125, "global_step": 15379, "epoch": 185} {"train_loss": -17.896425247192383, "global_step": 15380, "epoch": 185} {"train_loss": -18.326385498046875, "global_step": 15381, "epoch": 185} {"train_loss": -17.981277465820312, "global_step": 15382, "epoch": 185} {"train_loss": -18.03067970275879, "global_step": 15383, "epoch": 185} {"train_loss": -18.02069091796875, "global_step": 15384, "epoch": 185} {"train_loss": -17.940433502197266, "global_step": 15385, "epoch": 185} {"train_loss": -18.061185836791992, "global_step": 15386, "epoch": 185} {"train_loss": -18.10436248779297, "global_step": 15387, "epoch": 185} {"train_loss": -18.36747169494629, "global_step": 15388, "epoch": 185} {"train_loss": -18.304906845092773, "global_step": 15389, "epoch": 185} {"train_loss": -17.941207885742188, "global_step": 15390, "epoch": 185} {"train_loss": -18.170989990234375, "global_step": 15391, "epoch": 185} {"train_loss": -18.29167938232422, "global_step": 15392, "epoch": 185} {"train_loss": -18.141565322875977, "global_step": 15393, "epoch": 185} {"train_loss": -18.045032501220703, "global_step": 15394, "epoch": 185} {"train_loss": -18.140670776367188, "global_step": 15395, "epoch": 185} {"train_loss": -18.34797477722168, "global_step": 15396, "epoch": 185} {"train_loss": -17.767847061157227, "global_step": 15397, "epoch": 185} {"train_loss": -18.043943405151367, "global_step": 15398, "epoch": 185} {"train_loss": -17.922565460205078, "global_step": 15399, "epoch": 185} {"train_loss": -18.17852783203125, "global_step": 15400, "epoch": 185} {"train_loss": -18.25519371032715, "global_step": 15401, "epoch": 185} {"train_loss": -18.27490234375, "global_step": 15402, "epoch": 185} {"train_loss": -18.30078125, "global_step": 15403, "epoch": 185} {"train_loss": -18.127243041992188, "global_step": 15404, "epoch": 185} {"train_loss": -18.071462631225586, "global_step": 15405, "epoch": 185} {"train_loss": -18.020349502563477, "global_step": 15406, "epoch": 185} {"train_loss": -17.892623901367188, "global_step": 15407, "epoch": 185} {"train_loss": -17.82010841369629, "global_step": 15408, "epoch": 185} {"train_loss": -18.360849380493164, "global_step": 15409, "epoch": 185} {"train_loss": -18.179616928100586, "global_step": 15410, "epoch": 185} {"train_loss": -18.25591468811035, "global_step": 15411, "epoch": 185} {"train_loss": -18.360410690307617, "global_step": 15412, "epoch": 185} {"train_loss": -18.122465133666992, "global_step": 15413, "epoch": 185} {"train_loss": -18.24639892578125, "global_step": 15414, "epoch": 185} {"train_loss": -18.491212844848633, "global_step": 15415, "epoch": 185} {"train_loss": -18.045917510986328, "global_step": 15416, "epoch": 185} {"train_loss": -18.128324508666992, "global_step": 15417, "epoch": 185} {"train_loss": -18.08511734008789, "global_step": 15418, "epoch": 185} {"train_loss": -17.90015983581543, "global_step": 15419, "epoch": 185} {"train_loss": -18.217376708984375, "global_step": 15420, "epoch": 185} {"train_loss": -17.941781997680664, "global_step": 15421, "epoch": 185} {"train_loss": -18.432117462158203, "global_step": 15422, "epoch": 185} {"train_loss": -18.34870719909668, "global_step": 15423, "epoch": 185} {"train_loss": -18.22844886779785, "global_step": 15424, "epoch": 185} {"train_loss": -18.47067642211914, "global_step": 15425, "epoch": 185} {"train_loss": -17.46553611755371, "global_step": 15426, "epoch": 185} {"train_loss": -18.12347984313965, "global_step": 15427, "epoch": 185} {"train_loss": -18.184675216674805, "global_step": 15428, "epoch": 185} {"train_loss": -18.171356201171875, "global_step": 15429, "epoch": 185} {"train_loss": -17.90449333190918, "global_step": 15430, "epoch": 185} {"train_loss": -18.029653549194336, "global_step": 15431, "epoch": 185} {"train_loss": -18.260841369628906, "global_step": 15432, "epoch": 185} {"train_loss": -18.09775161743164, "global_step": 15433, "epoch": 185} {"train_loss": -17.613174438476562, "global_step": 15434, "epoch": 185} {"train_loss": -18.096027374267578, "global_step": 15435, "epoch": 185} {"train_loss": -17.934988021850586, "global_step": 15436, "epoch": 185} {"train_loss": -18.072630434151154, "global_step": 15437, "epoch": 185, "val_loss": 6406101.0} {"train_loss": -17.77889060974121, "global_step": 15438, "epoch": 186} {"train_loss": -17.92316246032715, "global_step": 15439, "epoch": 186} {"train_loss": -17.619770050048828, "global_step": 15440, "epoch": 186} {"train_loss": -17.918790817260742, "global_step": 15441, "epoch": 186} {"train_loss": -17.736774444580078, "global_step": 15442, "epoch": 186} {"train_loss": -18.502975463867188, "global_step": 15443, "epoch": 186} {"train_loss": -17.70293617248535, "global_step": 15444, "epoch": 186} {"train_loss": -17.935922622680664, "global_step": 15445, "epoch": 186} {"train_loss": -17.630556106567383, "global_step": 15446, "epoch": 186} {"train_loss": -18.16741943359375, "global_step": 15447, "epoch": 186} {"train_loss": -17.935855865478516, "global_step": 15448, "epoch": 186} {"train_loss": -17.792932510375977, "global_step": 15449, "epoch": 186} {"train_loss": -17.96449089050293, "global_step": 15450, "epoch": 186} {"train_loss": -18.14703941345215, "global_step": 15451, "epoch": 186} {"train_loss": -17.911882400512695, "global_step": 15452, "epoch": 186} {"train_loss": -17.933393478393555, "global_step": 15453, "epoch": 186} {"train_loss": -17.93634796142578, "global_step": 15454, "epoch": 186} {"train_loss": -18.037433624267578, "global_step": 15455, "epoch": 186} {"train_loss": -17.495080947875977, "global_step": 15456, "epoch": 186} {"train_loss": -18.152692794799805, "global_step": 15457, "epoch": 186} {"train_loss": -17.921802520751953, "global_step": 15458, "epoch": 186} {"train_loss": -18.18573570251465, "global_step": 15459, "epoch": 186} {"train_loss": -18.209516525268555, "global_step": 15460, "epoch": 186} {"train_loss": -17.656173706054688, "global_step": 15461, "epoch": 186} {"train_loss": -17.656280517578125, "global_step": 15462, "epoch": 186} {"train_loss": -17.72344398498535, "global_step": 15463, "epoch": 186} {"train_loss": -17.971458435058594, "global_step": 15464, "epoch": 186} {"train_loss": -18.201902389526367, "global_step": 15465, "epoch": 186} {"train_loss": -17.902328491210938, "global_step": 15466, "epoch": 186} {"train_loss": -17.808942794799805, "global_step": 15467, "epoch": 186} {"train_loss": -18.401580810546875, "global_step": 15468, "epoch": 186} {"train_loss": -18.27194595336914, "global_step": 15469, "epoch": 186} {"train_loss": -17.844053268432617, "global_step": 15470, "epoch": 186} {"train_loss": -18.262081146240234, "global_step": 15471, "epoch": 186} {"train_loss": -18.20607566833496, "global_step": 15472, "epoch": 186} {"train_loss": -18.570451736450195, "global_step": 15473, "epoch": 186} {"train_loss": -18.057371139526367, "global_step": 15474, "epoch": 186} {"train_loss": -18.13128662109375, "global_step": 15475, "epoch": 186} {"train_loss": -17.847883224487305, "global_step": 15476, "epoch": 186} {"train_loss": -18.37949562072754, "global_step": 15477, "epoch": 186} {"train_loss": -18.590194702148438, "global_step": 15478, "epoch": 186} {"train_loss": -18.511699676513672, "global_step": 15479, "epoch": 186} {"train_loss": -17.872289657592773, "global_step": 15480, "epoch": 186} {"train_loss": -18.206602096557617, "global_step": 15481, "epoch": 186} {"train_loss": -18.552518844604492, "global_step": 15482, "epoch": 186} {"train_loss": -17.89286231994629, "global_step": 15483, "epoch": 186} {"train_loss": -18.464859008789062, "global_step": 15484, "epoch": 186} {"train_loss": -17.810028076171875, "global_step": 15485, "epoch": 186} {"train_loss": -18.02130699157715, "global_step": 15486, "epoch": 186} {"train_loss": -18.215103149414062, "global_step": 15487, "epoch": 186} {"train_loss": -18.396854400634766, "global_step": 15488, "epoch": 186} {"train_loss": -17.9501895904541, "global_step": 15489, "epoch": 186} {"train_loss": -18.28430938720703, "global_step": 15490, "epoch": 186} {"train_loss": -18.218917846679688, "global_step": 15491, "epoch": 186} {"train_loss": -18.101299285888672, "global_step": 15492, "epoch": 186} {"train_loss": -18.27627944946289, "global_step": 15493, "epoch": 186} {"train_loss": -18.330533981323242, "global_step": 15494, "epoch": 186} {"train_loss": -18.087512969970703, "global_step": 15495, "epoch": 186} {"train_loss": -18.144620895385742, "global_step": 15496, "epoch": 186} {"train_loss": -18.213348388671875, "global_step": 15497, "epoch": 186} {"train_loss": -18.398523330688477, "global_step": 15498, "epoch": 186} {"train_loss": -17.990604400634766, "global_step": 15499, "epoch": 186} {"train_loss": -18.174766540527344, "global_step": 15500, "epoch": 186} {"train_loss": -17.73390007019043, "global_step": 15501, "epoch": 186} {"train_loss": -18.12556266784668, "global_step": 15502, "epoch": 186} {"train_loss": -18.628028869628906, "global_step": 15503, "epoch": 186} {"train_loss": -18.163330078125, "global_step": 15504, "epoch": 186} {"train_loss": -17.91410255432129, "global_step": 15505, "epoch": 186} {"train_loss": -18.04425048828125, "global_step": 15506, "epoch": 186} {"train_loss": -18.03494644165039, "global_step": 15507, "epoch": 186} {"train_loss": -18.363922119140625, "global_step": 15508, "epoch": 186} {"train_loss": -18.05109977722168, "global_step": 15509, "epoch": 186} {"train_loss": -18.33445167541504, "global_step": 15510, "epoch": 186} {"train_loss": -18.10748863220215, "global_step": 15511, "epoch": 186} {"train_loss": -18.054061889648438, "global_step": 15512, "epoch": 186} {"train_loss": -18.093048095703125, "global_step": 15513, "epoch": 186} {"train_loss": -18.178701400756836, "global_step": 15514, "epoch": 186} {"train_loss": -18.405309677124023, "global_step": 15515, "epoch": 186} {"train_loss": -18.311084747314453, "global_step": 15516, "epoch": 186} {"train_loss": -18.316360473632812, "global_step": 15517, "epoch": 186} {"train_loss": -18.144590377807617, "global_step": 15518, "epoch": 186} {"train_loss": -17.942230224609375, "global_step": 15519, "epoch": 186} {"train_loss": -18.10047526531909, "global_step": 15520, "epoch": 186, "val_loss": 6154507.0} {"train_loss": -17.86587142944336, "global_step": 15521, "epoch": 187} {"train_loss": -17.68763542175293, "global_step": 15522, "epoch": 187} {"train_loss": -18.203699111938477, "global_step": 15523, "epoch": 187} {"train_loss": -18.256208419799805, "global_step": 15524, "epoch": 187} {"train_loss": -17.86427116394043, "global_step": 15525, "epoch": 187} {"train_loss": -18.011510848999023, "global_step": 15526, "epoch": 187} {"train_loss": -17.82941246032715, "global_step": 15527, "epoch": 187} {"train_loss": -18.01568031311035, "global_step": 15528, "epoch": 187} {"train_loss": -18.3121337890625, "global_step": 15529, "epoch": 187} {"train_loss": -18.03659439086914, "global_step": 15530, "epoch": 187} {"train_loss": -18.034162521362305, "global_step": 15531, "epoch": 187} {"train_loss": -18.17127799987793, "global_step": 15532, "epoch": 187} {"train_loss": -18.16013526916504, "global_step": 15533, "epoch": 187} {"train_loss": -17.849693298339844, "global_step": 15534, "epoch": 187} {"train_loss": -17.847841262817383, "global_step": 15535, "epoch": 187} {"train_loss": -18.204557418823242, "global_step": 15536, "epoch": 187} {"train_loss": -18.001277923583984, "global_step": 15537, "epoch": 187} {"train_loss": -18.348846435546875, "global_step": 15538, "epoch": 187} {"train_loss": -18.133983612060547, "global_step": 15539, "epoch": 187} {"train_loss": -18.148733139038086, "global_step": 15540, "epoch": 187} {"train_loss": -17.940229415893555, "global_step": 15541, "epoch": 187} {"train_loss": -18.466447830200195, "global_step": 15542, "epoch": 187} {"train_loss": -18.406579971313477, "global_step": 15543, "epoch": 187} {"train_loss": -17.667428970336914, "global_step": 15544, "epoch": 187} {"train_loss": -17.925222396850586, "global_step": 15545, "epoch": 187} {"train_loss": -18.3280086517334, "global_step": 15546, "epoch": 187} {"train_loss": -18.012189865112305, "global_step": 15547, "epoch": 187} {"train_loss": -17.973674774169922, "global_step": 15548, "epoch": 187} {"train_loss": -18.228267669677734, "global_step": 15549, "epoch": 187} {"train_loss": -18.145654678344727, "global_step": 15550, "epoch": 187} {"train_loss": -17.90140151977539, "global_step": 15551, "epoch": 187} {"train_loss": -18.190587997436523, "global_step": 15552, "epoch": 187} {"train_loss": -18.166608810424805, "global_step": 15553, "epoch": 187} {"train_loss": -18.680789947509766, "global_step": 15554, "epoch": 187} {"train_loss": -17.87955665588379, "global_step": 15555, "epoch": 187} {"train_loss": -18.31024742126465, "global_step": 15556, "epoch": 187} {"train_loss": -18.32261085510254, "global_step": 15557, "epoch": 187} {"train_loss": -17.990375518798828, "global_step": 15558, "epoch": 187} {"train_loss": -18.290019989013672, "global_step": 15559, "epoch": 187} {"train_loss": -17.810224533081055, "global_step": 15560, "epoch": 187} {"train_loss": -17.699695587158203, "global_step": 15561, "epoch": 187} {"train_loss": -18.1302490234375, "global_step": 15562, "epoch": 187} {"train_loss": -18.423450469970703, "global_step": 15563, "epoch": 187} {"train_loss": -18.258075714111328, "global_step": 15564, "epoch": 187} {"train_loss": -18.028676986694336, "global_step": 15565, "epoch": 187} {"train_loss": -17.953659057617188, "global_step": 15566, "epoch": 187} {"train_loss": -17.66175651550293, "global_step": 15567, "epoch": 187} {"train_loss": -18.592670440673828, "global_step": 15568, "epoch": 187} {"train_loss": -17.786191940307617, "global_step": 15569, "epoch": 187} {"train_loss": -17.965938568115234, "global_step": 15570, "epoch": 187} {"train_loss": -18.046287536621094, "global_step": 15571, "epoch": 187} {"train_loss": -18.205036163330078, "global_step": 15572, "epoch": 187} {"train_loss": -18.137739181518555, "global_step": 15573, "epoch": 187} {"train_loss": -18.17450523376465, "global_step": 15574, "epoch": 187} {"train_loss": -18.259065628051758, "global_step": 15575, "epoch": 187} {"train_loss": -18.395421981811523, "global_step": 15576, "epoch": 187} {"train_loss": -18.5913143157959, "global_step": 15577, "epoch": 187} {"train_loss": -17.711509704589844, "global_step": 15578, "epoch": 187} {"train_loss": -18.344058990478516, "global_step": 15579, "epoch": 187} {"train_loss": -18.105510711669922, "global_step": 15580, "epoch": 187} {"train_loss": -18.362934112548828, "global_step": 15581, "epoch": 187} {"train_loss": -18.29955291748047, "global_step": 15582, "epoch": 187} {"train_loss": -18.186796188354492, "global_step": 15583, "epoch": 187} {"train_loss": -17.856098175048828, "global_step": 15584, "epoch": 187} {"train_loss": -18.30992889404297, "global_step": 15585, "epoch": 187} {"train_loss": -18.333969116210938, "global_step": 15586, "epoch": 187} {"train_loss": -18.053016662597656, "global_step": 15587, "epoch": 187} {"train_loss": -17.83185577392578, "global_step": 15588, "epoch": 187} {"train_loss": -18.33804702758789, "global_step": 15589, "epoch": 187} {"train_loss": -18.03822135925293, "global_step": 15590, "epoch": 187} {"train_loss": -18.089868545532227, "global_step": 15591, "epoch": 187} {"train_loss": -17.95572853088379, "global_step": 15592, "epoch": 187} {"train_loss": -18.256624221801758, "global_step": 15593, "epoch": 187} {"train_loss": -18.3514404296875, "global_step": 15594, "epoch": 187} {"train_loss": -18.473535537719727, "global_step": 15595, "epoch": 187} {"train_loss": -18.179790496826172, "global_step": 15596, "epoch": 187} {"train_loss": -18.333415985107422, "global_step": 15597, "epoch": 187} {"train_loss": -17.7665958404541, "global_step": 15598, "epoch": 187} {"train_loss": -17.965234756469727, "global_step": 15599, "epoch": 187} {"train_loss": -18.425500869750977, "global_step": 15600, "epoch": 187} {"train_loss": -18.171831130981445, "global_step": 15601, "epoch": 187} {"train_loss": -18.17856788635254, "global_step": 15602, "epoch": 187} {"train_loss": -18.099996612732667, "global_step": 15603, "epoch": 187, "val_loss": 6142403.5} {"train_loss": -18.33871078491211, "global_step": 15604, "epoch": 188} {"train_loss": -18.294897079467773, "global_step": 15605, "epoch": 188} {"train_loss": -18.180295944213867, "global_step": 15606, "epoch": 188} {"train_loss": -17.939863204956055, "global_step": 15607, "epoch": 188} {"train_loss": -18.254840850830078, "global_step": 15608, "epoch": 188} {"train_loss": -17.856266021728516, "global_step": 15609, "epoch": 188} {"train_loss": -17.96890640258789, "global_step": 15610, "epoch": 188} {"train_loss": -17.866165161132812, "global_step": 15611, "epoch": 188} {"train_loss": -17.770343780517578, "global_step": 15612, "epoch": 188} {"train_loss": -17.776050567626953, "global_step": 15613, "epoch": 188} {"train_loss": -18.182525634765625, "global_step": 15614, "epoch": 188} {"train_loss": -17.67524528503418, "global_step": 15615, "epoch": 188} {"train_loss": -17.578947067260742, "global_step": 15616, "epoch": 188} {"train_loss": -17.71799659729004, "global_step": 15617, "epoch": 188} {"train_loss": -18.090856552124023, "global_step": 15618, "epoch": 188} {"train_loss": -17.974210739135742, "global_step": 15619, "epoch": 188} {"train_loss": -18.0986270904541, "global_step": 15620, "epoch": 188} {"train_loss": -18.004806518554688, "global_step": 15621, "epoch": 188} {"train_loss": -17.759292602539062, "global_step": 15622, "epoch": 188} {"train_loss": -17.930723190307617, "global_step": 15623, "epoch": 188} {"train_loss": -18.45357894897461, "global_step": 15624, "epoch": 188} {"train_loss": -18.016799926757812, "global_step": 15625, "epoch": 188} {"train_loss": -18.2954044342041, "global_step": 15626, "epoch": 188} {"train_loss": -18.36123275756836, "global_step": 15627, "epoch": 188} {"train_loss": -17.941822052001953, "global_step": 15628, "epoch": 188} {"train_loss": -18.07408905029297, "global_step": 15629, "epoch": 188} {"train_loss": -18.155454635620117, "global_step": 15630, "epoch": 188} {"train_loss": -18.364978790283203, "global_step": 15631, "epoch": 188} {"train_loss": -18.135910034179688, "global_step": 15632, "epoch": 188} {"train_loss": -18.35871696472168, "global_step": 15633, "epoch": 188} {"train_loss": -18.37141990661621, "global_step": 15634, "epoch": 188} {"train_loss": -18.468017578125, "global_step": 15635, "epoch": 188} {"train_loss": -17.897174835205078, "global_step": 15636, "epoch": 188} {"train_loss": -18.145994186401367, "global_step": 15637, "epoch": 188} {"train_loss": -18.091882705688477, "global_step": 15638, "epoch": 188} {"train_loss": -18.25632095336914, "global_step": 15639, "epoch": 188} {"train_loss": -18.308364868164062, "global_step": 15640, "epoch": 188} {"train_loss": -18.008270263671875, "global_step": 15641, "epoch": 188} {"train_loss": -17.911746978759766, "global_step": 15642, "epoch": 188} {"train_loss": -17.974258422851562, "global_step": 15643, "epoch": 188} {"train_loss": -18.525312423706055, "global_step": 15644, "epoch": 188} {"train_loss": -18.503591537475586, "global_step": 15645, "epoch": 188} {"train_loss": -18.110837936401367, "global_step": 15646, "epoch": 188} {"train_loss": -17.927274703979492, "global_step": 15647, "epoch": 188} {"train_loss": -18.054555892944336, "global_step": 15648, "epoch": 188} {"train_loss": -17.786123275756836, "global_step": 15649, "epoch": 188} {"train_loss": -18.166593551635742, "global_step": 15650, "epoch": 188} {"train_loss": -18.139188766479492, "global_step": 15651, "epoch": 188} {"train_loss": -18.45328712463379, "global_step": 15652, "epoch": 188} {"train_loss": -18.267316818237305, "global_step": 15653, "epoch": 188} {"train_loss": -18.039031982421875, "global_step": 15654, "epoch": 188} {"train_loss": -18.01898765563965, "global_step": 15655, "epoch": 188} {"train_loss": -17.897092819213867, "global_step": 15656, "epoch": 188} {"train_loss": -18.25994300842285, "global_step": 15657, "epoch": 188} {"train_loss": -18.114259719848633, "global_step": 15658, "epoch": 188} {"train_loss": -18.04412078857422, "global_step": 15659, "epoch": 188} {"train_loss": -18.15556526184082, "global_step": 15660, "epoch": 188} {"train_loss": -18.368072509765625, "global_step": 15661, "epoch": 188} {"train_loss": -17.650999069213867, "global_step": 15662, "epoch": 188} {"train_loss": -18.155717849731445, "global_step": 15663, "epoch": 188} {"train_loss": -18.199525833129883, "global_step": 15664, "epoch": 188} {"train_loss": -17.900358200073242, "global_step": 15665, "epoch": 188} {"train_loss": -17.836732864379883, "global_step": 15666, "epoch": 188} {"train_loss": -17.941883087158203, "global_step": 15667, "epoch": 188} {"train_loss": -18.139347076416016, "global_step": 15668, "epoch": 188} {"train_loss": -18.4622802734375, "global_step": 15669, "epoch": 188} {"train_loss": -18.418704986572266, "global_step": 15670, "epoch": 188} {"train_loss": -18.17891502380371, "global_step": 15671, "epoch": 188} {"train_loss": -17.949697494506836, "global_step": 15672, "epoch": 188} {"train_loss": -18.03361701965332, "global_step": 15673, "epoch": 188} {"train_loss": -18.176145553588867, "global_step": 15674, "epoch": 188} {"train_loss": -18.296411514282227, "global_step": 15675, "epoch": 188} {"train_loss": -18.129592895507812, "global_step": 15676, "epoch": 188} {"train_loss": -17.8985652923584, "global_step": 15677, "epoch": 188} {"train_loss": -18.57529640197754, "global_step": 15678, "epoch": 188} {"train_loss": -18.270431518554688, "global_step": 15679, "epoch": 188} {"train_loss": -17.960020065307617, "global_step": 15680, "epoch": 188} {"train_loss": -18.210865020751953, "global_step": 15681, "epoch": 188} {"train_loss": -17.753612518310547, "global_step": 15682, "epoch": 188} {"train_loss": -18.058820724487305, "global_step": 15683, "epoch": 188} {"train_loss": -18.12017250061035, "global_step": 15684, "epoch": 188} {"train_loss": -17.74776840209961, "global_step": 15685, "epoch": 188} {"train_loss": -18.09172667078225, "global_step": 15686, "epoch": 188, "val_loss": 5926161.0} {"train_loss": -18.289936065673828, "global_step": 15687, "epoch": 189} {"train_loss": -18.15259552001953, "global_step": 15688, "epoch": 189} {"train_loss": -18.12322425842285, "global_step": 15689, "epoch": 189} {"train_loss": -18.000654220581055, "global_step": 15690, "epoch": 189} {"train_loss": -18.09183692932129, "global_step": 15691, "epoch": 189} {"train_loss": -17.996810913085938, "global_step": 15692, "epoch": 189} {"train_loss": -18.582923889160156, "global_step": 15693, "epoch": 189} {"train_loss": -17.883544921875, "global_step": 15694, "epoch": 189} {"train_loss": -18.192424774169922, "global_step": 15695, "epoch": 189} {"train_loss": -17.952022552490234, "global_step": 15696, "epoch": 189} {"train_loss": -17.984024047851562, "global_step": 15697, "epoch": 189} {"train_loss": -18.154376983642578, "global_step": 15698, "epoch": 189} {"train_loss": -17.755966186523438, "global_step": 15699, "epoch": 189} {"train_loss": -18.061573028564453, "global_step": 15700, "epoch": 189} {"train_loss": -17.939085006713867, "global_step": 15701, "epoch": 189} {"train_loss": -18.25472068786621, "global_step": 15702, "epoch": 189} {"train_loss": -17.87734031677246, "global_step": 15703, "epoch": 189} {"train_loss": -18.06162452697754, "global_step": 15704, "epoch": 189} {"train_loss": -18.19480323791504, "global_step": 15705, "epoch": 189} {"train_loss": -18.195322036743164, "global_step": 15706, "epoch": 189} {"train_loss": -17.99428939819336, "global_step": 15707, "epoch": 189} {"train_loss": -18.017391204833984, "global_step": 15708, "epoch": 189} {"train_loss": -17.930118560791016, "global_step": 15709, "epoch": 189} {"train_loss": -18.050281524658203, "global_step": 15710, "epoch": 189} {"train_loss": -18.544145584106445, "global_step": 15711, "epoch": 189} {"train_loss": -18.180973052978516, "global_step": 15712, "epoch": 189} {"train_loss": -18.215768814086914, "global_step": 15713, "epoch": 189} {"train_loss": -18.50732421875, "global_step": 15714, "epoch": 189} {"train_loss": -17.804641723632812, "global_step": 15715, "epoch": 189} {"train_loss": -18.118507385253906, "global_step": 15716, "epoch": 189} {"train_loss": -18.03265380859375, "global_step": 15717, "epoch": 189} {"train_loss": -18.33296775817871, "global_step": 15718, "epoch": 189} {"train_loss": -18.37775993347168, "global_step": 15719, "epoch": 189} {"train_loss": -18.384048461914062, "global_step": 15720, "epoch": 189} {"train_loss": -18.3049373626709, "global_step": 15721, "epoch": 189} {"train_loss": -17.98373031616211, "global_step": 15722, "epoch": 189} {"train_loss": -18.063385009765625, "global_step": 15723, "epoch": 189} {"train_loss": -18.315204620361328, "global_step": 15724, "epoch": 189} {"train_loss": -18.5140380859375, "global_step": 15725, "epoch": 189} {"train_loss": -18.409469604492188, "global_step": 15726, "epoch": 189} {"train_loss": -18.180044174194336, "global_step": 15727, "epoch": 189} {"train_loss": -18.492645263671875, "global_step": 15728, "epoch": 189} {"train_loss": -18.061389923095703, "global_step": 15729, "epoch": 189} {"train_loss": -18.00010871887207, "global_step": 15730, "epoch": 189} {"train_loss": -18.231725692749023, "global_step": 15731, "epoch": 189} {"train_loss": -18.108278274536133, "global_step": 15732, "epoch": 189} {"train_loss": -18.489086151123047, "global_step": 15733, "epoch": 189} {"train_loss": -18.27625846862793, "global_step": 15734, "epoch": 189} {"train_loss": -18.173189163208008, "global_step": 15735, "epoch": 189} {"train_loss": -18.196096420288086, "global_step": 15736, "epoch": 189} {"train_loss": -18.3183650970459, "global_step": 15737, "epoch": 189} {"train_loss": -18.459287643432617, "global_step": 15738, "epoch": 189} {"train_loss": -18.01503562927246, "global_step": 15739, "epoch": 189} {"train_loss": -18.19501304626465, "global_step": 15740, "epoch": 189} {"train_loss": -18.618587493896484, "global_step": 15741, "epoch": 189} {"train_loss": -18.238554000854492, "global_step": 15742, "epoch": 189} {"train_loss": -18.00856590270996, "global_step": 15743, "epoch": 189} {"train_loss": -18.071924209594727, "global_step": 15744, "epoch": 189} {"train_loss": -18.324756622314453, "global_step": 15745, "epoch": 189} {"train_loss": -17.700857162475586, "global_step": 15746, "epoch": 189} {"train_loss": -18.090810775756836, "global_step": 15747, "epoch": 189} {"train_loss": -18.132925033569336, "global_step": 15748, "epoch": 189} {"train_loss": -18.047616958618164, "global_step": 15749, "epoch": 189} {"train_loss": -17.808664321899414, "global_step": 15750, "epoch": 189} {"train_loss": -18.12200927734375, "global_step": 15751, "epoch": 189} {"train_loss": -18.146520614624023, "global_step": 15752, "epoch": 189} {"train_loss": -18.1240177154541, "global_step": 15753, "epoch": 189} {"train_loss": -17.989294052124023, "global_step": 15754, "epoch": 189} {"train_loss": -18.12381362915039, "global_step": 15755, "epoch": 189} {"train_loss": -18.234426498413086, "global_step": 15756, "epoch": 189} {"train_loss": -17.869915008544922, "global_step": 15757, "epoch": 189} {"train_loss": -17.814523696899414, "global_step": 15758, "epoch": 189} {"train_loss": -17.964231491088867, "global_step": 15759, "epoch": 189} {"train_loss": -18.18928337097168, "global_step": 15760, "epoch": 189} {"train_loss": -18.087684631347656, "global_step": 15761, "epoch": 189} {"train_loss": -18.417129516601562, "global_step": 15762, "epoch": 189} {"train_loss": -18.03118896484375, "global_step": 15763, "epoch": 189} {"train_loss": -17.835912704467773, "global_step": 15764, "epoch": 189} {"train_loss": -17.822174072265625, "global_step": 15765, "epoch": 189} {"train_loss": -18.455915451049805, "global_step": 15766, "epoch": 189} {"train_loss": -18.148372650146484, "global_step": 15767, "epoch": 189} {"train_loss": -18.069149017333984, "global_step": 15768, "epoch": 189} {"train_loss": -18.1581968054714, "global_step": 15769, "epoch": 189, "val_loss": 5919873.5} {"train_loss": -18.300209045410156, "global_step": 15770, "epoch": 190} {"train_loss": -18.51632308959961, "global_step": 15771, "epoch": 190} {"train_loss": -18.138748168945312, "global_step": 15772, "epoch": 190} {"train_loss": -18.38019371032715, "global_step": 15773, "epoch": 190} {"train_loss": -18.054662704467773, "global_step": 15774, "epoch": 190} {"train_loss": -18.00132179260254, "global_step": 15775, "epoch": 190} {"train_loss": -18.1867733001709, "global_step": 15776, "epoch": 190} {"train_loss": -17.814184188842773, "global_step": 15777, "epoch": 190} {"train_loss": -17.964454650878906, "global_step": 15778, "epoch": 190} {"train_loss": -18.137407302856445, "global_step": 15779, "epoch": 190} {"train_loss": -18.570058822631836, "global_step": 15780, "epoch": 190} {"train_loss": -18.330490112304688, "global_step": 15781, "epoch": 190} {"train_loss": -17.87696647644043, "global_step": 15782, "epoch": 190} {"train_loss": -18.2838191986084, "global_step": 15783, "epoch": 190} {"train_loss": -18.2362117767334, "global_step": 15784, "epoch": 190} {"train_loss": -18.399152755737305, "global_step": 15785, "epoch": 190} {"train_loss": -17.889923095703125, "global_step": 15786, "epoch": 190} {"train_loss": -18.55000877380371, "global_step": 15787, "epoch": 190} {"train_loss": -18.046659469604492, "global_step": 15788, "epoch": 190} {"train_loss": -18.154176712036133, "global_step": 15789, "epoch": 190} {"train_loss": -17.786163330078125, "global_step": 15790, "epoch": 190} {"train_loss": -18.242063522338867, "global_step": 15791, "epoch": 190} {"train_loss": -17.990018844604492, "global_step": 15792, "epoch": 190} {"train_loss": -18.130537033081055, "global_step": 15793, "epoch": 190} {"train_loss": -17.37082862854004, "global_step": 15794, "epoch": 190} {"train_loss": -17.892288208007812, "global_step": 15795, "epoch": 190} {"train_loss": -18.207365036010742, "global_step": 15796, "epoch": 190} {"train_loss": -18.095579147338867, "global_step": 15797, "epoch": 190} {"train_loss": -17.65410614013672, "global_step": 15798, "epoch": 190} {"train_loss": -18.174779891967773, "global_step": 15799, "epoch": 190} {"train_loss": -17.76650047302246, "global_step": 15800, "epoch": 190} {"train_loss": -18.013334274291992, "global_step": 15801, "epoch": 190} {"train_loss": -17.90413475036621, "global_step": 15802, "epoch": 190} {"train_loss": -18.652732849121094, "global_step": 15803, "epoch": 190} {"train_loss": -18.333999633789062, "global_step": 15804, "epoch": 190} {"train_loss": -18.217676162719727, "global_step": 15805, "epoch": 190} {"train_loss": -17.75471305847168, "global_step": 15806, "epoch": 190} {"train_loss": -18.220142364501953, "global_step": 15807, "epoch": 190} {"train_loss": -17.882139205932617, "global_step": 15808, "epoch": 190} {"train_loss": -17.86514663696289, "global_step": 15809, "epoch": 190} {"train_loss": -18.152149200439453, "global_step": 15810, "epoch": 190} {"train_loss": -18.057126998901367, "global_step": 15811, "epoch": 190} {"train_loss": -18.223922729492188, "global_step": 15812, "epoch": 190} {"train_loss": -18.111848831176758, "global_step": 15813, "epoch": 190} {"train_loss": -18.056171417236328, "global_step": 15814, "epoch": 190} {"train_loss": -17.974889755249023, "global_step": 15815, "epoch": 190} {"train_loss": -17.587377548217773, "global_step": 15816, "epoch": 190} {"train_loss": -17.97182273864746, "global_step": 15817, "epoch": 190} {"train_loss": -18.024587631225586, "global_step": 15818, "epoch": 190} {"train_loss": -18.173419952392578, "global_step": 15819, "epoch": 190} {"train_loss": -18.036041259765625, "global_step": 15820, "epoch": 190} {"train_loss": -17.941434860229492, "global_step": 15821, "epoch": 190} {"train_loss": -18.264413833618164, "global_step": 15822, "epoch": 190} {"train_loss": -17.969392776489258, "global_step": 15823, "epoch": 190} {"train_loss": -17.83969497680664, "global_step": 15824, "epoch": 190} {"train_loss": -18.000261306762695, "global_step": 15825, "epoch": 190} {"train_loss": -18.539384841918945, "global_step": 15826, "epoch": 190} {"train_loss": -18.031858444213867, "global_step": 15827, "epoch": 190} {"train_loss": -18.247072219848633, "global_step": 15828, "epoch": 190} {"train_loss": -17.933631896972656, "global_step": 15829, "epoch": 190} {"train_loss": -18.363018035888672, "global_step": 15830, "epoch": 190} {"train_loss": -18.123977661132812, "global_step": 15831, "epoch": 190} {"train_loss": -18.04945945739746, "global_step": 15832, "epoch": 190} {"train_loss": -18.195093154907227, "global_step": 15833, "epoch": 190} {"train_loss": -18.244613647460938, "global_step": 15834, "epoch": 190} {"train_loss": -18.337087631225586, "global_step": 15835, "epoch": 190} {"train_loss": -18.278453826904297, "global_step": 15836, "epoch": 190} {"train_loss": -18.23213768005371, "global_step": 15837, "epoch": 190} {"train_loss": -18.319477081298828, "global_step": 15838, "epoch": 190} {"train_loss": -18.001691818237305, "global_step": 15839, "epoch": 190} {"train_loss": -18.462909698486328, "global_step": 15840, "epoch": 190} {"train_loss": -17.86127281188965, "global_step": 15841, "epoch": 190} {"train_loss": -18.190820693969727, "global_step": 15842, "epoch": 190} {"train_loss": -18.110614776611328, "global_step": 15843, "epoch": 190} {"train_loss": -18.2770938873291, "global_step": 15844, "epoch": 190} {"train_loss": -18.05441665649414, "global_step": 15845, "epoch": 190} {"train_loss": -18.156476974487305, "global_step": 15846, "epoch": 190} {"train_loss": -17.91050148010254, "global_step": 15847, "epoch": 190} {"train_loss": -18.342206954956055, "global_step": 15848, "epoch": 190} {"train_loss": -18.398101806640625, "global_step": 15849, "epoch": 190} {"train_loss": -18.11598777770996, "global_step": 15850, "epoch": 190} {"train_loss": -18.0595703125, "global_step": 15851, "epoch": 190} {"train_loss": -18.109717725271203, "global_step": 15852, "epoch": 190, "val_loss": 6100029.5} {"train_loss": -17.793498992919922, "global_step": 15853, "epoch": 191} {"train_loss": -17.811397552490234, "global_step": 15854, "epoch": 191} {"train_loss": -17.88665199279785, "global_step": 15855, "epoch": 191} {"train_loss": -17.808237075805664, "global_step": 15856, "epoch": 191} {"train_loss": -17.832853317260742, "global_step": 15857, "epoch": 191} {"train_loss": -17.92122459411621, "global_step": 15858, "epoch": 191} {"train_loss": -17.84868049621582, "global_step": 15859, "epoch": 191} {"train_loss": -18.136112213134766, "global_step": 15860, "epoch": 191} {"train_loss": -17.699920654296875, "global_step": 15861, "epoch": 191} {"train_loss": -17.635488510131836, "global_step": 15862, "epoch": 191} {"train_loss": -18.12116050720215, "global_step": 15863, "epoch": 191} {"train_loss": -17.86407470703125, "global_step": 15864, "epoch": 191} {"train_loss": -17.93875503540039, "global_step": 15865, "epoch": 191} {"train_loss": -17.999738693237305, "global_step": 15866, "epoch": 191} {"train_loss": -18.395557403564453, "global_step": 15867, "epoch": 191} {"train_loss": -17.94300651550293, "global_step": 15868, "epoch": 191} {"train_loss": -17.88429069519043, "global_step": 15869, "epoch": 191} {"train_loss": -18.441192626953125, "global_step": 15870, "epoch": 191} {"train_loss": -18.180057525634766, "global_step": 15871, "epoch": 191} {"train_loss": -17.950559616088867, "global_step": 15872, "epoch": 191} {"train_loss": -18.309486389160156, "global_step": 15873, "epoch": 191} {"train_loss": -18.056957244873047, "global_step": 15874, "epoch": 191} {"train_loss": -18.29508399963379, "global_step": 15875, "epoch": 191} {"train_loss": -18.32973861694336, "global_step": 15876, "epoch": 191} {"train_loss": -18.02429962158203, "global_step": 15877, "epoch": 191} {"train_loss": -17.99265480041504, "global_step": 15878, "epoch": 191} {"train_loss": -18.05422592163086, "global_step": 15879, "epoch": 191} {"train_loss": -18.363554000854492, "global_step": 15880, "epoch": 191} {"train_loss": -18.162900924682617, "global_step": 15881, "epoch": 191} {"train_loss": -18.43621253967285, "global_step": 15882, "epoch": 191} {"train_loss": -18.11162757873535, "global_step": 15883, "epoch": 191} {"train_loss": -18.07185935974121, "global_step": 15884, "epoch": 191} {"train_loss": -18.132404327392578, "global_step": 15885, "epoch": 191} {"train_loss": -18.21857261657715, "global_step": 15886, "epoch": 191} {"train_loss": -18.2719783782959, "global_step": 15887, "epoch": 191} {"train_loss": -18.159778594970703, "global_step": 15888, "epoch": 191} {"train_loss": -18.5521297454834, "global_step": 15889, "epoch": 191} {"train_loss": -18.328540802001953, "global_step": 15890, "epoch": 191} {"train_loss": -18.16031837463379, "global_step": 15891, "epoch": 191} {"train_loss": -17.931955337524414, "global_step": 15892, "epoch": 191} {"train_loss": -18.367115020751953, "global_step": 15893, "epoch": 191} {"train_loss": -18.23339080810547, "global_step": 15894, "epoch": 191} {"train_loss": -18.395355224609375, "global_step": 15895, "epoch": 191} {"train_loss": -18.032957077026367, "global_step": 15896, "epoch": 191} {"train_loss": -18.146207809448242, "global_step": 15897, "epoch": 191} {"train_loss": -18.1181640625, "global_step": 15898, "epoch": 191} {"train_loss": -17.81684112548828, "global_step": 15899, "epoch": 191} {"train_loss": -18.187490463256836, "global_step": 15900, "epoch": 191} {"train_loss": -18.187118530273438, "global_step": 15901, "epoch": 191} {"train_loss": -18.022422790527344, "global_step": 15902, "epoch": 191} {"train_loss": -18.253982543945312, "global_step": 15903, "epoch": 191} {"train_loss": -18.120227813720703, "global_step": 15904, "epoch": 191} {"train_loss": -18.21927833557129, "global_step": 15905, "epoch": 191} {"train_loss": -18.285301208496094, "global_step": 15906, "epoch": 191} {"train_loss": -18.114072799682617, "global_step": 15907, "epoch": 191} {"train_loss": -17.98029899597168, "global_step": 15908, "epoch": 191} {"train_loss": -17.993736267089844, "global_step": 15909, "epoch": 191} {"train_loss": -17.936038970947266, "global_step": 15910, "epoch": 191} {"train_loss": -18.082380294799805, "global_step": 15911, "epoch": 191} {"train_loss": -18.391178131103516, "global_step": 15912, "epoch": 191} {"train_loss": -18.126052856445312, "global_step": 15913, "epoch": 191} {"train_loss": -17.438247680664062, "global_step": 15914, "epoch": 191} {"train_loss": -17.99749755859375, "global_step": 15915, "epoch": 191} {"train_loss": -18.11798667907715, "global_step": 15916, "epoch": 191} {"train_loss": -18.516727447509766, "global_step": 15917, "epoch": 191} {"train_loss": -18.070947647094727, "global_step": 15918, "epoch": 191} {"train_loss": -18.312236785888672, "global_step": 15919, "epoch": 191} {"train_loss": -17.907621383666992, "global_step": 15920, "epoch": 191} {"train_loss": -18.48267936706543, "global_step": 15921, "epoch": 191} {"train_loss": -18.354787826538086, "global_step": 15922, "epoch": 191} {"train_loss": -18.38698387145996, "global_step": 15923, "epoch": 191} {"train_loss": -18.129201889038086, "global_step": 15924, "epoch": 191} {"train_loss": -18.41317367553711, "global_step": 15925, "epoch": 191} {"train_loss": -18.274555206298828, "global_step": 15926, "epoch": 191} {"train_loss": -17.819156646728516, "global_step": 15927, "epoch": 191} {"train_loss": -18.387971878051758, "global_step": 15928, "epoch": 191} {"train_loss": -18.00028419494629, "global_step": 15929, "epoch": 191} {"train_loss": -18.20515251159668, "global_step": 15930, "epoch": 191} {"train_loss": -17.9667911529541, "global_step": 15931, "epoch": 191} {"train_loss": -17.86268424987793, "global_step": 15932, "epoch": 191} {"train_loss": -18.429357528686523, "global_step": 15933, "epoch": 191} {"train_loss": -18.204357147216797, "global_step": 15934, "epoch": 191} {"train_loss": -18.117022181131755, "global_step": 15935, "epoch": 191, "val_loss": 6006249.0} {"train_loss": -18.41627311706543, "global_step": 15936, "epoch": 192} {"train_loss": -18.34329605102539, "global_step": 15937, "epoch": 192} {"train_loss": -18.23532485961914, "global_step": 15938, "epoch": 192} {"train_loss": -18.099742889404297, "global_step": 15939, "epoch": 192} {"train_loss": -18.34956169128418, "global_step": 15940, "epoch": 192} {"train_loss": -18.0340633392334, "global_step": 15941, "epoch": 192} {"train_loss": -18.32587242126465, "global_step": 15942, "epoch": 192} {"train_loss": -18.342639923095703, "global_step": 15943, "epoch": 192} {"train_loss": -18.502500534057617, "global_step": 15944, "epoch": 192} {"train_loss": -17.84916877746582, "global_step": 15945, "epoch": 192} {"train_loss": -17.93311882019043, "global_step": 15946, "epoch": 192} {"train_loss": -17.658233642578125, "global_step": 15947, "epoch": 192} {"train_loss": -18.056968688964844, "global_step": 15948, "epoch": 192} {"train_loss": -18.45135498046875, "global_step": 15949, "epoch": 192} {"train_loss": -18.237810134887695, "global_step": 15950, "epoch": 192} {"train_loss": -18.48902702331543, "global_step": 15951, "epoch": 192} {"train_loss": -18.159183502197266, "global_step": 15952, "epoch": 192} {"train_loss": -18.08308982849121, "global_step": 15953, "epoch": 192} {"train_loss": -18.562009811401367, "global_step": 15954, "epoch": 192} {"train_loss": -18.0969181060791, "global_step": 15955, "epoch": 192} {"train_loss": -18.25316047668457, "global_step": 15956, "epoch": 192} {"train_loss": -18.125553131103516, "global_step": 15957, "epoch": 192} {"train_loss": -18.10828971862793, "global_step": 15958, "epoch": 192} {"train_loss": -18.0549373626709, "global_step": 15959, "epoch": 192} {"train_loss": -18.31165313720703, "global_step": 15960, "epoch": 192} {"train_loss": -18.23235511779785, "global_step": 15961, "epoch": 192} {"train_loss": -18.210302352905273, "global_step": 15962, "epoch": 192} {"train_loss": -18.106609344482422, "global_step": 15963, "epoch": 192} {"train_loss": -18.055707931518555, "global_step": 15964, "epoch": 192} {"train_loss": -17.879552841186523, "global_step": 15965, "epoch": 192} {"train_loss": -18.03120231628418, "global_step": 15966, "epoch": 192} {"train_loss": -18.212297439575195, "global_step": 15967, "epoch": 192} {"train_loss": -18.094390869140625, "global_step": 15968, "epoch": 192} {"train_loss": -18.11469841003418, "global_step": 15969, "epoch": 192} {"train_loss": -17.696239471435547, "global_step": 15970, "epoch": 192} {"train_loss": -17.929393768310547, "global_step": 15971, "epoch": 192} {"train_loss": -18.223892211914062, "global_step": 15972, "epoch": 192} {"train_loss": -17.7935791015625, "global_step": 15973, "epoch": 192} {"train_loss": -18.280969619750977, "global_step": 15974, "epoch": 192} {"train_loss": -18.42641258239746, "global_step": 15975, "epoch": 192} {"train_loss": -18.23822021484375, "global_step": 15976, "epoch": 192} {"train_loss": -18.39275360107422, "global_step": 15977, "epoch": 192} {"train_loss": -17.89066505432129, "global_step": 15978, "epoch": 192} {"train_loss": -17.93730354309082, "global_step": 15979, "epoch": 192} {"train_loss": -18.020544052124023, "global_step": 15980, "epoch": 192} {"train_loss": -18.1282901763916, "global_step": 15981, "epoch": 192} {"train_loss": -18.189411163330078, "global_step": 15982, "epoch": 192} {"train_loss": -18.671213150024414, "global_step": 15983, "epoch": 192} {"train_loss": -18.1657657623291, "global_step": 15984, "epoch": 192} {"train_loss": -17.866168975830078, "global_step": 15985, "epoch": 192} {"train_loss": -18.284074783325195, "global_step": 15986, "epoch": 192} {"train_loss": -18.267057418823242, "global_step": 15987, "epoch": 192} {"train_loss": -17.976627349853516, "global_step": 15988, "epoch": 192} {"train_loss": -17.896337509155273, "global_step": 15989, "epoch": 192} {"train_loss": -17.95208740234375, "global_step": 15990, "epoch": 192} {"train_loss": -17.907495498657227, "global_step": 15991, "epoch": 192} {"train_loss": -18.025211334228516, "global_step": 15992, "epoch": 192} {"train_loss": -18.364072799682617, "global_step": 15993, "epoch": 192} {"train_loss": -18.588651657104492, "global_step": 15994, "epoch": 192} {"train_loss": -18.16639518737793, "global_step": 15995, "epoch": 192} {"train_loss": -18.00179100036621, "global_step": 15996, "epoch": 192} {"train_loss": -18.15614128112793, "global_step": 15997, "epoch": 192} {"train_loss": -18.13001251220703, "global_step": 15998, "epoch": 192} {"train_loss": -17.77707290649414, "global_step": 15999, "epoch": 192} {"train_loss": -18.679542541503906, "global_step": 16000, "epoch": 192} {"train_loss": -18.280044555664062, "global_step": 16001, "epoch": 192} {"train_loss": -17.982080459594727, "global_step": 16002, "epoch": 192} {"train_loss": -17.614681243896484, "global_step": 16003, "epoch": 192} {"train_loss": -17.948135375976562, "global_step": 16004, "epoch": 192} {"train_loss": -18.02434730529785, "global_step": 16005, "epoch": 192} {"train_loss": -18.376840591430664, "global_step": 16006, "epoch": 192} {"train_loss": -18.249624252319336, "global_step": 16007, "epoch": 192} {"train_loss": -18.353504180908203, "global_step": 16008, "epoch": 192} {"train_loss": -18.204435348510742, "global_step": 16009, "epoch": 192} {"train_loss": -18.24623680114746, "global_step": 16010, "epoch": 192} {"train_loss": -18.397132873535156, "global_step": 16011, "epoch": 192} {"train_loss": -17.878433227539062, "global_step": 16012, "epoch": 192} {"train_loss": -18.403902053833008, "global_step": 16013, "epoch": 192} {"train_loss": -18.29986000061035, "global_step": 16014, "epoch": 192} {"train_loss": -18.107107162475586, "global_step": 16015, "epoch": 192} {"train_loss": -18.075958251953125, "global_step": 16016, "epoch": 192} {"train_loss": -18.41781997680664, "global_step": 16017, "epoch": 192} {"train_loss": -18.139657744442125, "global_step": 16018, "epoch": 192, "val_loss": 6057379.0} {"train_loss": -18.207508087158203, "global_step": 16019, "epoch": 193} {"train_loss": -18.077287673950195, "global_step": 16020, "epoch": 193} {"train_loss": -17.754959106445312, "global_step": 16021, "epoch": 193} {"train_loss": -18.05812644958496, "global_step": 16022, "epoch": 193} {"train_loss": -18.167631149291992, "global_step": 16023, "epoch": 193} {"train_loss": -17.874731063842773, "global_step": 16024, "epoch": 193} {"train_loss": -17.987409591674805, "global_step": 16025, "epoch": 193} {"train_loss": -18.156436920166016, "global_step": 16026, "epoch": 193} {"train_loss": -17.895357131958008, "global_step": 16027, "epoch": 193} {"train_loss": -17.922603607177734, "global_step": 16028, "epoch": 193} {"train_loss": -17.786691665649414, "global_step": 16029, "epoch": 193} {"train_loss": -18.2973690032959, "global_step": 16030, "epoch": 193} {"train_loss": -18.059345245361328, "global_step": 16031, "epoch": 193} {"train_loss": -18.326292037963867, "global_step": 16032, "epoch": 193} {"train_loss": -17.956546783447266, "global_step": 16033, "epoch": 193} {"train_loss": -18.398212432861328, "global_step": 16034, "epoch": 193} {"train_loss": -18.163711547851562, "global_step": 16035, "epoch": 193} {"train_loss": -17.978891372680664, "global_step": 16036, "epoch": 193} {"train_loss": -18.09690284729004, "global_step": 16037, "epoch": 193} {"train_loss": -17.905080795288086, "global_step": 16038, "epoch": 193} {"train_loss": -18.030048370361328, "global_step": 16039, "epoch": 193} {"train_loss": -17.9897518157959, "global_step": 16040, "epoch": 193} {"train_loss": -18.080535888671875, "global_step": 16041, "epoch": 193} {"train_loss": -18.37732696533203, "global_step": 16042, "epoch": 193} {"train_loss": -18.7371883392334, "global_step": 16043, "epoch": 193} {"train_loss": -18.089221954345703, "global_step": 16044, "epoch": 193} {"train_loss": -17.807153701782227, "global_step": 16045, "epoch": 193} {"train_loss": -17.895265579223633, "global_step": 16046, "epoch": 193} {"train_loss": -18.26637077331543, "global_step": 16047, "epoch": 193} {"train_loss": -18.213991165161133, "global_step": 16048, "epoch": 193} {"train_loss": -18.610591888427734, "global_step": 16049, "epoch": 193} {"train_loss": -18.4753360748291, "global_step": 16050, "epoch": 193} {"train_loss": -18.162057876586914, "global_step": 16051, "epoch": 193} {"train_loss": -18.51140785217285, "global_step": 16052, "epoch": 193} {"train_loss": -18.037017822265625, "global_step": 16053, "epoch": 193} {"train_loss": -17.70379066467285, "global_step": 16054, "epoch": 193} {"train_loss": -18.04888343811035, "global_step": 16055, "epoch": 193} {"train_loss": -18.6080379486084, "global_step": 16056, "epoch": 193} {"train_loss": -18.073511123657227, "global_step": 16057, "epoch": 193} {"train_loss": -18.101221084594727, "global_step": 16058, "epoch": 193} {"train_loss": -18.294391632080078, "global_step": 16059, "epoch": 193} {"train_loss": -17.94751739501953, "global_step": 16060, "epoch": 193} {"train_loss": -18.13890838623047, "global_step": 16061, "epoch": 193} {"train_loss": -17.824758529663086, "global_step": 16062, "epoch": 193} {"train_loss": -18.54681396484375, "global_step": 16063, "epoch": 193} {"train_loss": -18.495567321777344, "global_step": 16064, "epoch": 193} {"train_loss": -17.936038970947266, "global_step": 16065, "epoch": 193} {"train_loss": -18.39859962463379, "global_step": 16066, "epoch": 193} {"train_loss": -18.056928634643555, "global_step": 16067, "epoch": 193} {"train_loss": -18.120182037353516, "global_step": 16068, "epoch": 193} {"train_loss": -18.06898307800293, "global_step": 16069, "epoch": 193} {"train_loss": -18.281879425048828, "global_step": 16070, "epoch": 193} {"train_loss": -18.17024803161621, "global_step": 16071, "epoch": 193} {"train_loss": -17.947959899902344, "global_step": 16072, "epoch": 193} {"train_loss": -17.743810653686523, "global_step": 16073, "epoch": 193} {"train_loss": -18.237268447875977, "global_step": 16074, "epoch": 193} {"train_loss": -18.100112915039062, "global_step": 16075, "epoch": 193} {"train_loss": -18.4919490814209, "global_step": 16076, "epoch": 193} {"train_loss": -18.374576568603516, "global_step": 16077, "epoch": 193} {"train_loss": -17.837751388549805, "global_step": 16078, "epoch": 193} {"train_loss": -18.05275535583496, "global_step": 16079, "epoch": 193} {"train_loss": -18.526260375976562, "global_step": 16080, "epoch": 193} {"train_loss": -18.166540145874023, "global_step": 16081, "epoch": 193} {"train_loss": -18.224563598632812, "global_step": 16082, "epoch": 193} {"train_loss": -18.082324981689453, "global_step": 16083, "epoch": 193} {"train_loss": -18.083288192749023, "global_step": 16084, "epoch": 193} {"train_loss": -18.216835021972656, "global_step": 16085, "epoch": 193} {"train_loss": -18.156591415405273, "global_step": 16086, "epoch": 193} {"train_loss": -18.19818687438965, "global_step": 16087, "epoch": 193} {"train_loss": -18.01447868347168, "global_step": 16088, "epoch": 193} {"train_loss": -17.954076766967773, "global_step": 16089, "epoch": 193} {"train_loss": -17.95296859741211, "global_step": 16090, "epoch": 193} {"train_loss": -18.292510986328125, "global_step": 16091, "epoch": 193} {"train_loss": -18.476728439331055, "global_step": 16092, "epoch": 193} {"train_loss": -18.06797981262207, "global_step": 16093, "epoch": 193} {"train_loss": -17.887847900390625, "global_step": 16094, "epoch": 193} {"train_loss": -17.88636589050293, "global_step": 16095, "epoch": 193} {"train_loss": -17.954195022583008, "global_step": 16096, "epoch": 193} {"train_loss": -18.156173706054688, "global_step": 16097, "epoch": 193} {"train_loss": -18.59087562561035, "global_step": 16098, "epoch": 193} {"train_loss": -18.077566146850586, "global_step": 16099, "epoch": 193} {"train_loss": -17.85215950012207, "global_step": 16100, "epoch": 193} {"train_loss": -18.130724343908838, "global_step": 16101, "epoch": 193, "val_loss": 5973296.0} {"train_loss": -17.602846145629883, "global_step": 16102, "epoch": 194} {"train_loss": -17.346546173095703, "global_step": 16103, "epoch": 194} {"train_loss": -17.921916961669922, "global_step": 16104, "epoch": 194} {"train_loss": -17.688873291015625, "global_step": 16105, "epoch": 194} {"train_loss": -18.10276222229004, "global_step": 16106, "epoch": 194} {"train_loss": -18.362144470214844, "global_step": 16107, "epoch": 194} {"train_loss": -18.00421142578125, "global_step": 16108, "epoch": 194} {"train_loss": -17.937108993530273, "global_step": 16109, "epoch": 194} {"train_loss": -18.117929458618164, "global_step": 16110, "epoch": 194} {"train_loss": -18.199071884155273, "global_step": 16111, "epoch": 194} {"train_loss": -17.963285446166992, "global_step": 16112, "epoch": 194} {"train_loss": -17.934743881225586, "global_step": 16113, "epoch": 194} {"train_loss": -18.060354232788086, "global_step": 16114, "epoch": 194} {"train_loss": -17.917387008666992, "global_step": 16115, "epoch": 194} {"train_loss": -17.987634658813477, "global_step": 16116, "epoch": 194} {"train_loss": -18.126508712768555, "global_step": 16117, "epoch": 194} {"train_loss": -17.95253562927246, "global_step": 16118, "epoch": 194} {"train_loss": -18.01951026916504, "global_step": 16119, "epoch": 194} {"train_loss": -18.221616744995117, "global_step": 16120, "epoch": 194} {"train_loss": -17.87916374206543, "global_step": 16121, "epoch": 194} {"train_loss": -18.449344635009766, "global_step": 16122, "epoch": 194} {"train_loss": -18.473020553588867, "global_step": 16123, "epoch": 194} {"train_loss": -17.808597564697266, "global_step": 16124, "epoch": 194} {"train_loss": -18.049901962280273, "global_step": 16125, "epoch": 194} {"train_loss": -17.804140090942383, "global_step": 16126, "epoch": 194} {"train_loss": -18.45136833190918, "global_step": 16127, "epoch": 194} {"train_loss": -18.01264762878418, "global_step": 16128, "epoch": 194} {"train_loss": -17.687541961669922, "global_step": 16129, "epoch": 194} {"train_loss": -18.184064865112305, "global_step": 16130, "epoch": 194} {"train_loss": -18.19293785095215, "global_step": 16131, "epoch": 194} {"train_loss": -18.123371124267578, "global_step": 16132, "epoch": 194} {"train_loss": -18.02370834350586, "global_step": 16133, "epoch": 194} {"train_loss": -18.2230224609375, "global_step": 16134, "epoch": 194} {"train_loss": -18.318744659423828, "global_step": 16135, "epoch": 194} {"train_loss": -18.3907413482666, "global_step": 16136, "epoch": 194} {"train_loss": -17.930387496948242, "global_step": 16137, "epoch": 194} {"train_loss": -18.439590454101562, "global_step": 16138, "epoch": 194} {"train_loss": -17.879932403564453, "global_step": 16139, "epoch": 194} {"train_loss": -18.297435760498047, "global_step": 16140, "epoch": 194} {"train_loss": -18.31104850769043, "global_step": 16141, "epoch": 194} {"train_loss": -17.850833892822266, "global_step": 16142, "epoch": 194} {"train_loss": -18.071149826049805, "global_step": 16143, "epoch": 194} {"train_loss": -18.239744186401367, "global_step": 16144, "epoch": 194} {"train_loss": -18.067264556884766, "global_step": 16145, "epoch": 194} {"train_loss": -18.368406295776367, "global_step": 16146, "epoch": 194} {"train_loss": -18.02011489868164, "global_step": 16147, "epoch": 194} {"train_loss": -18.263565063476562, "global_step": 16148, "epoch": 194} {"train_loss": -18.199359893798828, "global_step": 16149, "epoch": 194} {"train_loss": -17.680654525756836, "global_step": 16150, "epoch": 194} {"train_loss": -18.14569091796875, "global_step": 16151, "epoch": 194} {"train_loss": -18.18968391418457, "global_step": 16152, "epoch": 194} {"train_loss": -18.37838363647461, "global_step": 16153, "epoch": 194} {"train_loss": -18.21898078918457, "global_step": 16154, "epoch": 194} {"train_loss": -18.23598289489746, "global_step": 16155, "epoch": 194} {"train_loss": -18.33139991760254, "global_step": 16156, "epoch": 194} {"train_loss": -18.23323631286621, "global_step": 16157, "epoch": 194} {"train_loss": -18.31961441040039, "global_step": 16158, "epoch": 194} {"train_loss": -18.133275985717773, "global_step": 16159, "epoch": 194} {"train_loss": -18.173185348510742, "global_step": 16160, "epoch": 194} {"train_loss": -18.07857322692871, "global_step": 16161, "epoch": 194} {"train_loss": -18.20159339904785, "global_step": 16162, "epoch": 194} {"train_loss": -18.00368309020996, "global_step": 16163, "epoch": 194} {"train_loss": -18.26527214050293, "global_step": 16164, "epoch": 194} {"train_loss": -18.537567138671875, "global_step": 16165, "epoch": 194} {"train_loss": -18.379873275756836, "global_step": 16166, "epoch": 194} {"train_loss": -18.23779296875, "global_step": 16167, "epoch": 194} {"train_loss": -18.24140739440918, "global_step": 16168, "epoch": 194} {"train_loss": -17.853870391845703, "global_step": 16169, "epoch": 194} {"train_loss": -18.363243103027344, "global_step": 16170, "epoch": 194} {"train_loss": -18.35506248474121, "global_step": 16171, "epoch": 194} {"train_loss": -18.149118423461914, "global_step": 16172, "epoch": 194} {"train_loss": -18.017520904541016, "global_step": 16173, "epoch": 194} {"train_loss": -18.076345443725586, "global_step": 16174, "epoch": 194} {"train_loss": -17.960174560546875, "global_step": 16175, "epoch": 194} {"train_loss": -18.517576217651367, "global_step": 16176, "epoch": 194} {"train_loss": -17.987424850463867, "global_step": 16177, "epoch": 194} {"train_loss": -18.365692138671875, "global_step": 16178, "epoch": 194} {"train_loss": -18.09041976928711, "global_step": 16179, "epoch": 194} {"train_loss": -18.538589477539062, "global_step": 16180, "epoch": 194} {"train_loss": -18.032590866088867, "global_step": 16181, "epoch": 194} {"train_loss": -18.096837997436523, "global_step": 16182, "epoch": 194} {"train_loss": -18.08272361755371, "global_step": 16183, "epoch": 194} {"train_loss": -18.12237783225186, "global_step": 16184, "epoch": 194, "val_loss": 6108904.5} {"train_loss": -18.160480499267578, "global_step": 16185, "epoch": 195} {"train_loss": -18.18489646911621, "global_step": 16186, "epoch": 195} {"train_loss": -17.867033004760742, "global_step": 16187, "epoch": 195} {"train_loss": -18.40468406677246, "global_step": 16188, "epoch": 195} {"train_loss": -17.822317123413086, "global_step": 16189, "epoch": 195} {"train_loss": -18.024065017700195, "global_step": 16190, "epoch": 195} {"train_loss": -17.893674850463867, "global_step": 16191, "epoch": 195} {"train_loss": -17.955562591552734, "global_step": 16192, "epoch": 195} {"train_loss": -18.125350952148438, "global_step": 16193, "epoch": 195} {"train_loss": -17.99747657775879, "global_step": 16194, "epoch": 195} {"train_loss": -18.12403106689453, "global_step": 16195, "epoch": 195} {"train_loss": -18.059541702270508, "global_step": 16196, "epoch": 195} {"train_loss": -17.994962692260742, "global_step": 16197, "epoch": 195} {"train_loss": -18.345321655273438, "global_step": 16198, "epoch": 195} {"train_loss": -17.926137924194336, "global_step": 16199, "epoch": 195} {"train_loss": -17.815366744995117, "global_step": 16200, "epoch": 195} {"train_loss": -17.892507553100586, "global_step": 16201, "epoch": 195} {"train_loss": -18.002836227416992, "global_step": 16202, "epoch": 195} {"train_loss": -18.312894821166992, "global_step": 16203, "epoch": 195} {"train_loss": -18.396263122558594, "global_step": 16204, "epoch": 195} {"train_loss": -18.43477439880371, "global_step": 16205, "epoch": 195} {"train_loss": -18.192190170288086, "global_step": 16206, "epoch": 195} {"train_loss": -18.090309143066406, "global_step": 16207, "epoch": 195} {"train_loss": -18.091794967651367, "global_step": 16208, "epoch": 195} {"train_loss": -18.572864532470703, "global_step": 16209, "epoch": 195} {"train_loss": -18.452741622924805, "global_step": 16210, "epoch": 195} {"train_loss": -18.3154239654541, "global_step": 16211, "epoch": 195} {"train_loss": -18.420814514160156, "global_step": 16212, "epoch": 195} {"train_loss": -18.034290313720703, "global_step": 16213, "epoch": 195} {"train_loss": -18.19855308532715, "global_step": 16214, "epoch": 195} {"train_loss": -18.73713493347168, "global_step": 16215, "epoch": 195} {"train_loss": -18.29816246032715, "global_step": 16216, "epoch": 195} {"train_loss": -18.115203857421875, "global_step": 16217, "epoch": 195} {"train_loss": -17.503469467163086, "global_step": 16218, "epoch": 195} {"train_loss": -18.265060424804688, "global_step": 16219, "epoch": 195} {"train_loss": -17.926578521728516, "global_step": 16220, "epoch": 195} {"train_loss": -18.120107650756836, "global_step": 16221, "epoch": 195} {"train_loss": -18.70042610168457, "global_step": 16222, "epoch": 195} {"train_loss": -17.858835220336914, "global_step": 16223, "epoch": 195} {"train_loss": -18.160486221313477, "global_step": 16224, "epoch": 195} {"train_loss": -17.86917495727539, "global_step": 16225, "epoch": 195} {"train_loss": -18.402708053588867, "global_step": 16226, "epoch": 195} {"train_loss": -18.195384979248047, "global_step": 16227, "epoch": 195} {"train_loss": -18.416851043701172, "global_step": 16228, "epoch": 195} {"train_loss": -17.9299373626709, "global_step": 16229, "epoch": 195} {"train_loss": -18.14958953857422, "global_step": 16230, "epoch": 195} {"train_loss": -18.544321060180664, "global_step": 16231, "epoch": 195} {"train_loss": -18.038833618164062, "global_step": 16232, "epoch": 195} {"train_loss": -18.099163055419922, "global_step": 16233, "epoch": 195} {"train_loss": -18.187280654907227, "global_step": 16234, "epoch": 195} {"train_loss": -18.22846031188965, "global_step": 16235, "epoch": 195} {"train_loss": -18.45228385925293, "global_step": 16236, "epoch": 195} {"train_loss": -18.18623924255371, "global_step": 16237, "epoch": 195} {"train_loss": -18.119461059570312, "global_step": 16238, "epoch": 195} {"train_loss": -18.355541229248047, "global_step": 16239, "epoch": 195} {"train_loss": -17.909067153930664, "global_step": 16240, "epoch": 195} {"train_loss": -17.862478256225586, "global_step": 16241, "epoch": 195} {"train_loss": -18.227827072143555, "global_step": 16242, "epoch": 195} {"train_loss": -18.1254940032959, "global_step": 16243, "epoch": 195} {"train_loss": -18.34638023376465, "global_step": 16244, "epoch": 195} {"train_loss": -17.38910675048828, "global_step": 16245, "epoch": 195} {"train_loss": -17.946887969970703, "global_step": 16246, "epoch": 195} {"train_loss": -18.19751739501953, "global_step": 16247, "epoch": 195} {"train_loss": -18.439130783081055, "global_step": 16248, "epoch": 195} {"train_loss": -18.226226806640625, "global_step": 16249, "epoch": 195} {"train_loss": -18.184480667114258, "global_step": 16250, "epoch": 195} {"train_loss": -17.736154556274414, "global_step": 16251, "epoch": 195} {"train_loss": -18.455490112304688, "global_step": 16252, "epoch": 195} {"train_loss": -17.960664749145508, "global_step": 16253, "epoch": 195} {"train_loss": -18.226926803588867, "global_step": 16254, "epoch": 195} {"train_loss": -17.919034957885742, "global_step": 16255, "epoch": 195} {"train_loss": -18.487653732299805, "global_step": 16256, "epoch": 195} {"train_loss": -18.134798049926758, "global_step": 16257, "epoch": 195} {"train_loss": -18.113630294799805, "global_step": 16258, "epoch": 195} {"train_loss": -18.066679000854492, "global_step": 16259, "epoch": 195} {"train_loss": -18.08187484741211, "global_step": 16260, "epoch": 195} {"train_loss": -18.04217529296875, "global_step": 16261, "epoch": 195} {"train_loss": -18.12346839904785, "global_step": 16262, "epoch": 195} {"train_loss": -18.27216911315918, "global_step": 16263, "epoch": 195} {"train_loss": -18.29355239868164, "global_step": 16264, "epoch": 195} {"train_loss": -18.237512588500977, "global_step": 16265, "epoch": 195} {"train_loss": -18.22738265991211, "global_step": 16266, "epoch": 195} {"train_loss": -18.134408445243377, "global_step": 16267, "epoch": 195, "val_loss": 5970005.0} {"train_loss": -17.684865951538086, "global_step": 16268, "epoch": 196} {"train_loss": -18.364294052124023, "global_step": 16269, "epoch": 196} {"train_loss": -17.76786994934082, "global_step": 16270, "epoch": 196} {"train_loss": -17.92441177368164, "global_step": 16271, "epoch": 196} {"train_loss": -18.293943405151367, "global_step": 16272, "epoch": 196} {"train_loss": -17.815351486206055, "global_step": 16273, "epoch": 196} {"train_loss": -18.632638931274414, "global_step": 16274, "epoch": 196} {"train_loss": -18.089128494262695, "global_step": 16275, "epoch": 196} {"train_loss": -18.540969848632812, "global_step": 16276, "epoch": 196} {"train_loss": -18.009878158569336, "global_step": 16277, "epoch": 196} {"train_loss": -18.098730087280273, "global_step": 16278, "epoch": 196} {"train_loss": -17.49605369567871, "global_step": 16279, "epoch": 196} {"train_loss": -18.06673240661621, "global_step": 16280, "epoch": 196} {"train_loss": -18.04545021057129, "global_step": 16281, "epoch": 196} {"train_loss": -17.969785690307617, "global_step": 16282, "epoch": 196} {"train_loss": -18.364030838012695, "global_step": 16283, "epoch": 196} {"train_loss": -18.3348445892334, "global_step": 16284, "epoch": 196} {"train_loss": -17.910123825073242, "global_step": 16285, "epoch": 196} {"train_loss": -18.05386734008789, "global_step": 16286, "epoch": 196} {"train_loss": -17.767820358276367, "global_step": 16287, "epoch": 196} {"train_loss": -18.119056701660156, "global_step": 16288, "epoch": 196} {"train_loss": -17.93214225769043, "global_step": 16289, "epoch": 196} {"train_loss": -17.994543075561523, "global_step": 16290, "epoch": 196} {"train_loss": -18.18610954284668, "global_step": 16291, "epoch": 196} {"train_loss": -18.077747344970703, "global_step": 16292, "epoch": 196} {"train_loss": -18.668182373046875, "global_step": 16293, "epoch": 196} {"train_loss": -18.26355743408203, "global_step": 16294, "epoch": 196} {"train_loss": -18.148590087890625, "global_step": 16295, "epoch": 196} {"train_loss": -18.08030891418457, "global_step": 16296, "epoch": 196} {"train_loss": -18.576677322387695, "global_step": 16297, "epoch": 196} {"train_loss": -17.899337768554688, "global_step": 16298, "epoch": 196} {"train_loss": -18.154272079467773, "global_step": 16299, "epoch": 196} {"train_loss": -18.051389694213867, "global_step": 16300, "epoch": 196} {"train_loss": -18.28961753845215, "global_step": 16301, "epoch": 196} {"train_loss": -18.032766342163086, "global_step": 16302, "epoch": 196} {"train_loss": -18.434762954711914, "global_step": 16303, "epoch": 196} {"train_loss": -18.442907333374023, "global_step": 16304, "epoch": 196} {"train_loss": -18.6280574798584, "global_step": 16305, "epoch": 196} {"train_loss": -18.302366256713867, "global_step": 16306, "epoch": 196} {"train_loss": -18.128101348876953, "global_step": 16307, "epoch": 196} {"train_loss": -18.242420196533203, "global_step": 16308, "epoch": 196} {"train_loss": -18.218887329101562, "global_step": 16309, "epoch": 196} {"train_loss": -18.562482833862305, "global_step": 16310, "epoch": 196} {"train_loss": -18.071002960205078, "global_step": 16311, "epoch": 196} {"train_loss": -17.97132682800293, "global_step": 16312, "epoch": 196} {"train_loss": -18.504913330078125, "global_step": 16313, "epoch": 196} {"train_loss": -18.49725914001465, "global_step": 16314, "epoch": 196} {"train_loss": -18.33138084411621, "global_step": 16315, "epoch": 196} {"train_loss": -18.252981185913086, "global_step": 16316, "epoch": 196} {"train_loss": -18.27976417541504, "global_step": 16317, "epoch": 196} {"train_loss": -18.040250778198242, "global_step": 16318, "epoch": 196} {"train_loss": -17.985252380371094, "global_step": 16319, "epoch": 196} {"train_loss": -18.054641723632812, "global_step": 16320, "epoch": 196} {"train_loss": -18.26272964477539, "global_step": 16321, "epoch": 196} {"train_loss": -17.681079864501953, "global_step": 16322, "epoch": 196} {"train_loss": -18.185287475585938, "global_step": 16323, "epoch": 196} {"train_loss": -18.138917922973633, "global_step": 16324, "epoch": 196} {"train_loss": -18.356876373291016, "global_step": 16325, "epoch": 196} {"train_loss": -18.38520622253418, "global_step": 16326, "epoch": 196} {"train_loss": -17.77301597595215, "global_step": 16327, "epoch": 196} {"train_loss": -18.24344253540039, "global_step": 16328, "epoch": 196} {"train_loss": -18.23270034790039, "global_step": 16329, "epoch": 196} {"train_loss": -18.294340133666992, "global_step": 16330, "epoch": 196} {"train_loss": -18.110023498535156, "global_step": 16331, "epoch": 196} {"train_loss": -18.131147384643555, "global_step": 16332, "epoch": 196} {"train_loss": -18.09341812133789, "global_step": 16333, "epoch": 196} {"train_loss": -18.338144302368164, "global_step": 16334, "epoch": 196} {"train_loss": -18.455171585083008, "global_step": 16335, "epoch": 196} {"train_loss": -18.318937301635742, "global_step": 16336, "epoch": 196} {"train_loss": -17.936264038085938, "global_step": 16337, "epoch": 196} {"train_loss": -17.950902938842773, "global_step": 16338, "epoch": 196} {"train_loss": -18.167869567871094, "global_step": 16339, "epoch": 196} {"train_loss": -18.5151309967041, "global_step": 16340, "epoch": 196} {"train_loss": -18.11881446838379, "global_step": 16341, "epoch": 196} {"train_loss": -18.64866065979004, "global_step": 16342, "epoch": 196} {"train_loss": -18.2994384765625, "global_step": 16343, "epoch": 196} {"train_loss": -18.637929916381836, "global_step": 16344, "epoch": 196} {"train_loss": -18.174890518188477, "global_step": 16345, "epoch": 196} {"train_loss": -18.202817916870117, "global_step": 16346, "epoch": 196} {"train_loss": -17.62212562561035, "global_step": 16347, "epoch": 196} {"train_loss": -18.456478118896484, "global_step": 16348, "epoch": 196} {"train_loss": -18.140541076660156, "global_step": 16349, "epoch": 196} {"train_loss": -18.175679195358093, "global_step": 16350, "epoch": 196, "val_loss": 6027077.0} {"train_loss": -17.82561683654785, "global_step": 16351, "epoch": 197} {"train_loss": -17.878076553344727, "global_step": 16352, "epoch": 197} {"train_loss": -17.8895263671875, "global_step": 16353, "epoch": 197} {"train_loss": -18.164037704467773, "global_step": 16354, "epoch": 197} {"train_loss": -18.421323776245117, "global_step": 16355, "epoch": 197} {"train_loss": -17.948429107666016, "global_step": 16356, "epoch": 197} {"train_loss": -17.8118896484375, "global_step": 16357, "epoch": 197} {"train_loss": -18.000171661376953, "global_step": 16358, "epoch": 197} {"train_loss": -18.16631317138672, "global_step": 16359, "epoch": 197} {"train_loss": -17.86443519592285, "global_step": 16360, "epoch": 197} {"train_loss": -17.676969528198242, "global_step": 16361, "epoch": 197} {"train_loss": -18.640844345092773, "global_step": 16362, "epoch": 197} {"train_loss": -17.71314811706543, "global_step": 16363, "epoch": 197} {"train_loss": -18.53084373474121, "global_step": 16364, "epoch": 197} {"train_loss": -17.988004684448242, "global_step": 16365, "epoch": 197} {"train_loss": -18.03499412536621, "global_step": 16366, "epoch": 197} {"train_loss": -18.26065444946289, "global_step": 16367, "epoch": 197} {"train_loss": -17.859777450561523, "global_step": 16368, "epoch": 197} {"train_loss": -18.30698013305664, "global_step": 16369, "epoch": 197} {"train_loss": -18.169034957885742, "global_step": 16370, "epoch": 197} {"train_loss": -18.15000343322754, "global_step": 16371, "epoch": 197} {"train_loss": -18.2605037689209, "global_step": 16372, "epoch": 197} {"train_loss": -18.493453979492188, "global_step": 16373, "epoch": 197} {"train_loss": -18.209056854248047, "global_step": 16374, "epoch": 197} {"train_loss": -18.197065353393555, "global_step": 16375, "epoch": 197} {"train_loss": -18.01301383972168, "global_step": 16376, "epoch": 197} {"train_loss": -18.49445915222168, "global_step": 16377, "epoch": 197} {"train_loss": -18.336048126220703, "global_step": 16378, "epoch": 197} {"train_loss": -17.91059684753418, "global_step": 16379, "epoch": 197} {"train_loss": -18.17133140563965, "global_step": 16380, "epoch": 197} {"train_loss": -18.26753044128418, "global_step": 16381, "epoch": 197} {"train_loss": -18.01546287536621, "global_step": 16382, "epoch": 197} {"train_loss": -18.36249351501465, "global_step": 16383, "epoch": 197} {"train_loss": -18.017087936401367, "global_step": 16384, "epoch": 197} {"train_loss": -17.88599395751953, "global_step": 16385, "epoch": 197} {"train_loss": -18.215055465698242, "global_step": 16386, "epoch": 197} {"train_loss": -17.748952865600586, "global_step": 16387, "epoch": 197} {"train_loss": -17.822416305541992, "global_step": 16388, "epoch": 197} {"train_loss": -18.000385284423828, "global_step": 16389, "epoch": 197} {"train_loss": -18.27849578857422, "global_step": 16390, "epoch": 197} {"train_loss": -18.31504249572754, "global_step": 16391, "epoch": 197} {"train_loss": -18.596420288085938, "global_step": 16392, "epoch": 197} {"train_loss": -18.3445987701416, "global_step": 16393, "epoch": 197} {"train_loss": -17.98823356628418, "global_step": 16394, "epoch": 197} {"train_loss": -17.976240158081055, "global_step": 16395, "epoch": 197} {"train_loss": -18.50745964050293, "global_step": 16396, "epoch": 197} {"train_loss": -18.459375381469727, "global_step": 16397, "epoch": 197} {"train_loss": -18.30042839050293, "global_step": 16398, "epoch": 197} {"train_loss": -17.974748611450195, "global_step": 16399, "epoch": 197} {"train_loss": -17.944250106811523, "global_step": 16400, "epoch": 197} {"train_loss": -18.057294845581055, "global_step": 16401, "epoch": 197} {"train_loss": -17.86655616760254, "global_step": 16402, "epoch": 197} {"train_loss": -18.47090721130371, "global_step": 16403, "epoch": 197} {"train_loss": -18.17568016052246, "global_step": 16404, "epoch": 197} {"train_loss": -18.087888717651367, "global_step": 16405, "epoch": 197} {"train_loss": -18.34423828125, "global_step": 16406, "epoch": 197} {"train_loss": -18.7522029876709, "global_step": 16407, "epoch": 197} {"train_loss": -18.125219345092773, "global_step": 16408, "epoch": 197} {"train_loss": -18.428800582885742, "global_step": 16409, "epoch": 197} {"train_loss": -18.0429744720459, "global_step": 16410, "epoch": 197} {"train_loss": -18.28785514831543, "global_step": 16411, "epoch": 197} {"train_loss": -18.243757247924805, "global_step": 16412, "epoch": 197} {"train_loss": -18.046518325805664, "global_step": 16413, "epoch": 197} {"train_loss": -18.01854705810547, "global_step": 16414, "epoch": 197} {"train_loss": -18.67298698425293, "global_step": 16415, "epoch": 197} {"train_loss": -18.584003448486328, "global_step": 16416, "epoch": 197} {"train_loss": -17.831113815307617, "global_step": 16417, "epoch": 197} {"train_loss": -18.36862564086914, "global_step": 16418, "epoch": 197} {"train_loss": -18.070951461791992, "global_step": 16419, "epoch": 197} {"train_loss": -18.07683753967285, "global_step": 16420, "epoch": 197} {"train_loss": -18.223495483398438, "global_step": 16421, "epoch": 197} {"train_loss": -17.905668258666992, "global_step": 16422, "epoch": 197} {"train_loss": -18.31079864501953, "global_step": 16423, "epoch": 197} {"train_loss": -18.079252243041992, "global_step": 16424, "epoch": 197} {"train_loss": -18.464340209960938, "global_step": 16425, "epoch": 197} {"train_loss": -18.131494522094727, "global_step": 16426, "epoch": 197} {"train_loss": -18.218490600585938, "global_step": 16427, "epoch": 197} {"train_loss": -18.34779930114746, "global_step": 16428, "epoch": 197} {"train_loss": -17.990589141845703, "global_step": 16429, "epoch": 197} {"train_loss": -17.965600967407227, "global_step": 16430, "epoch": 197} {"train_loss": -18.404438018798828, "global_step": 16431, "epoch": 197} {"train_loss": -18.2078800201416, "global_step": 16432, "epoch": 197} {"train_loss": -18.165260820503693, "global_step": 16433, "epoch": 197, "val_loss": 6025511.0} {"train_loss": -18.154067993164062, "global_step": 16434, "epoch": 198} {"train_loss": -17.931562423706055, "global_step": 16435, "epoch": 198} {"train_loss": -17.742136001586914, "global_step": 16436, "epoch": 198} {"train_loss": -18.13942527770996, "global_step": 16437, "epoch": 198} {"train_loss": -17.931360244750977, "global_step": 16438, "epoch": 198} {"train_loss": -17.853437423706055, "global_step": 16439, "epoch": 198} {"train_loss": -18.28928565979004, "global_step": 16440, "epoch": 198} {"train_loss": -17.92325782775879, "global_step": 16441, "epoch": 198} {"train_loss": -17.742189407348633, "global_step": 16442, "epoch": 198} {"train_loss": -18.35049819946289, "global_step": 16443, "epoch": 198} {"train_loss": -17.905418395996094, "global_step": 16444, "epoch": 198} {"train_loss": -17.83570671081543, "global_step": 16445, "epoch": 198} {"train_loss": -18.12388038635254, "global_step": 16446, "epoch": 198} {"train_loss": -17.884153366088867, "global_step": 16447, "epoch": 198} {"train_loss": -18.19728660583496, "global_step": 16448, "epoch": 198} {"train_loss": -17.553220748901367, "global_step": 16449, "epoch": 198} {"train_loss": -18.445261001586914, "global_step": 16450, "epoch": 198} {"train_loss": -17.837182998657227, "global_step": 16451, "epoch": 198} {"train_loss": -18.393686294555664, "global_step": 16452, "epoch": 198} {"train_loss": -18.08995246887207, "global_step": 16453, "epoch": 198} {"train_loss": -18.035633087158203, "global_step": 16454, "epoch": 198} {"train_loss": -18.287311553955078, "global_step": 16455, "epoch": 198} {"train_loss": -17.729150772094727, "global_step": 16456, "epoch": 198} {"train_loss": -18.030033111572266, "global_step": 16457, "epoch": 198} {"train_loss": -18.05629539489746, "global_step": 16458, "epoch": 198} {"train_loss": -17.979415893554688, "global_step": 16459, "epoch": 198} {"train_loss": -17.93429946899414, "global_step": 16460, "epoch": 198} {"train_loss": -18.119388580322266, "global_step": 16461, "epoch": 198} {"train_loss": -18.234973907470703, "global_step": 16462, "epoch": 198} {"train_loss": -18.339170455932617, "global_step": 16463, "epoch": 198} {"train_loss": -18.354475021362305, "global_step": 16464, "epoch": 198} {"train_loss": -18.064834594726562, "global_step": 16465, "epoch": 198} {"train_loss": -18.3523006439209, "global_step": 16466, "epoch": 198} {"train_loss": -18.133087158203125, "global_step": 16467, "epoch": 198} {"train_loss": -18.177505493164062, "global_step": 16468, "epoch": 198} {"train_loss": -18.157447814941406, "global_step": 16469, "epoch": 198} {"train_loss": -18.202028274536133, "global_step": 16470, "epoch": 198} {"train_loss": -18.039447784423828, "global_step": 16471, "epoch": 198} {"train_loss": -17.869869232177734, "global_step": 16472, "epoch": 198} {"train_loss": -18.28290367126465, "global_step": 16473, "epoch": 198} {"train_loss": -18.49300193786621, "global_step": 16474, "epoch": 198} {"train_loss": -18.072553634643555, "global_step": 16475, "epoch": 198} {"train_loss": -18.171119689941406, "global_step": 16476, "epoch": 198} {"train_loss": -18.280261993408203, "global_step": 16477, "epoch": 198} {"train_loss": -18.24503517150879, "global_step": 16478, "epoch": 198} {"train_loss": -18.293039321899414, "global_step": 16479, "epoch": 198} {"train_loss": -18.17293930053711, "global_step": 16480, "epoch": 198} {"train_loss": -18.441076278686523, "global_step": 16481, "epoch": 198} {"train_loss": -17.726119995117188, "global_step": 16482, "epoch": 198} {"train_loss": -18.360992431640625, "global_step": 16483, "epoch": 198} {"train_loss": -18.10626220703125, "global_step": 16484, "epoch": 198} {"train_loss": -18.297164916992188, "global_step": 16485, "epoch": 198} {"train_loss": -17.907548904418945, "global_step": 16486, "epoch": 198} {"train_loss": -18.048059463500977, "global_step": 16487, "epoch": 198} {"train_loss": -18.491323471069336, "global_step": 16488, "epoch": 198} {"train_loss": -18.50796127319336, "global_step": 16489, "epoch": 198} {"train_loss": -18.16742515563965, "global_step": 16490, "epoch": 198} {"train_loss": -18.094125747680664, "global_step": 16491, "epoch": 198} {"train_loss": -18.334524154663086, "global_step": 16492, "epoch": 198} {"train_loss": -18.350543975830078, "global_step": 16493, "epoch": 198} {"train_loss": -18.110090255737305, "global_step": 16494, "epoch": 198} {"train_loss": -18.539453506469727, "global_step": 16495, "epoch": 198} {"train_loss": -18.116470336914062, "global_step": 16496, "epoch": 198} {"train_loss": -17.912750244140625, "global_step": 16497, "epoch": 198} {"train_loss": -18.427875518798828, "global_step": 16498, "epoch": 198} {"train_loss": -17.82838249206543, "global_step": 16499, "epoch": 198} {"train_loss": -18.310291290283203, "global_step": 16500, "epoch": 198} {"train_loss": -18.124134063720703, "global_step": 16501, "epoch": 198} {"train_loss": -17.72654914855957, "global_step": 16502, "epoch": 198} {"train_loss": -18.130033493041992, "global_step": 16503, "epoch": 198} {"train_loss": -18.30561065673828, "global_step": 16504, "epoch": 198} {"train_loss": -18.260143280029297, "global_step": 16505, "epoch": 198} {"train_loss": -18.07245445251465, "global_step": 16506, "epoch": 198} {"train_loss": -18.309314727783203, "global_step": 16507, "epoch": 198} {"train_loss": -18.042678833007812, "global_step": 16508, "epoch": 198} {"train_loss": -18.111900329589844, "global_step": 16509, "epoch": 198} {"train_loss": -18.362411499023438, "global_step": 16510, "epoch": 198} {"train_loss": -18.14073944091797, "global_step": 16511, "epoch": 198} {"train_loss": -18.339067459106445, "global_step": 16512, "epoch": 198} {"train_loss": -18.169456481933594, "global_step": 16513, "epoch": 198} {"train_loss": -18.035831451416016, "global_step": 16514, "epoch": 198} {"train_loss": -18.233020782470703, "global_step": 16515, "epoch": 198} {"train_loss": -18.102095626922974, "global_step": 16516, "epoch": 198, "val_loss": 6038649.0} {"train_loss": -18.199970245361328, "global_step": 16517, "epoch": 199} {"train_loss": -17.69097900390625, "global_step": 16518, "epoch": 199} {"train_loss": -18.16364860534668, "global_step": 16519, "epoch": 199} {"train_loss": -17.79385757446289, "global_step": 16520, "epoch": 199} {"train_loss": -18.113615036010742, "global_step": 16521, "epoch": 199} {"train_loss": -18.11570167541504, "global_step": 16522, "epoch": 199} {"train_loss": -18.005327224731445, "global_step": 16523, "epoch": 199} {"train_loss": -18.367069244384766, "global_step": 16524, "epoch": 199} {"train_loss": -17.82937240600586, "global_step": 16525, "epoch": 199} {"train_loss": -18.107358932495117, "global_step": 16526, "epoch": 199} {"train_loss": -18.172832489013672, "global_step": 16527, "epoch": 199} {"train_loss": -18.084571838378906, "global_step": 16528, "epoch": 199} {"train_loss": -18.027372360229492, "global_step": 16529, "epoch": 199} {"train_loss": -17.673290252685547, "global_step": 16530, "epoch": 199} {"train_loss": -18.1738224029541, "global_step": 16531, "epoch": 199} {"train_loss": -18.140745162963867, "global_step": 16532, "epoch": 199} {"train_loss": -18.057662963867188, "global_step": 16533, "epoch": 199} {"train_loss": -18.019697189331055, "global_step": 16534, "epoch": 199} {"train_loss": -18.508773803710938, "global_step": 16535, "epoch": 199} {"train_loss": -18.512556076049805, "global_step": 16536, "epoch": 199} {"train_loss": -17.952177047729492, "global_step": 16537, "epoch": 199} {"train_loss": -18.431333541870117, "global_step": 16538, "epoch": 199} {"train_loss": -18.153152465820312, "global_step": 16539, "epoch": 199} {"train_loss": -18.117624282836914, "global_step": 16540, "epoch": 199} {"train_loss": -18.155744552612305, "global_step": 16541, "epoch": 199} {"train_loss": -18.182098388671875, "global_step": 16542, "epoch": 199} {"train_loss": -18.10235595703125, "global_step": 16543, "epoch": 199} {"train_loss": -18.132869720458984, "global_step": 16544, "epoch": 199} {"train_loss": -18.308950424194336, "global_step": 16545, "epoch": 199} {"train_loss": -18.405914306640625, "global_step": 16546, "epoch": 199} {"train_loss": -18.22865867614746, "global_step": 16547, "epoch": 199} {"train_loss": -18.27239990234375, "global_step": 16548, "epoch": 199} {"train_loss": -17.950382232666016, "global_step": 16549, "epoch": 199} {"train_loss": -18.493854522705078, "global_step": 16550, "epoch": 199} {"train_loss": -18.320898056030273, "global_step": 16551, "epoch": 199} {"train_loss": -18.230993270874023, "global_step": 16552, "epoch": 199} {"train_loss": -18.334863662719727, "global_step": 16553, "epoch": 199} {"train_loss": -18.42549705505371, "global_step": 16554, "epoch": 199} {"train_loss": -18.504667282104492, "global_step": 16555, "epoch": 199} {"train_loss": -18.17683982849121, "global_step": 16556, "epoch": 199} {"train_loss": -18.321657180786133, "global_step": 16557, "epoch": 199} {"train_loss": -18.294513702392578, "global_step": 16558, "epoch": 199} {"train_loss": -18.17115592956543, "global_step": 16559, "epoch": 199} {"train_loss": -18.068288803100586, "global_step": 16560, "epoch": 199} {"train_loss": -18.041105270385742, "global_step": 16561, "epoch": 199} {"train_loss": -18.391632080078125, "global_step": 16562, "epoch": 199} {"train_loss": -18.282140731811523, "global_step": 16563, "epoch": 199} {"train_loss": -18.215639114379883, "global_step": 16564, "epoch": 199} {"train_loss": -17.972705841064453, "global_step": 16565, "epoch": 199} {"train_loss": -18.0803165435791, "global_step": 16566, "epoch": 199} {"train_loss": -18.116151809692383, "global_step": 16567, "epoch": 199} {"train_loss": -18.343557357788086, "global_step": 16568, "epoch": 199} {"train_loss": -18.384206771850586, "global_step": 16569, "epoch": 199} {"train_loss": -17.959882736206055, "global_step": 16570, "epoch": 199} {"train_loss": -18.16390609741211, "global_step": 16571, "epoch": 199} {"train_loss": -18.07447624206543, "global_step": 16572, "epoch": 199} {"train_loss": -18.164443969726562, "global_step": 16573, "epoch": 199} {"train_loss": -18.42397117614746, "global_step": 16574, "epoch": 199} {"train_loss": -18.49690055847168, "global_step": 16575, "epoch": 199} {"train_loss": -18.34473991394043, "global_step": 16576, "epoch": 199} {"train_loss": -17.879247665405273, "global_step": 16577, "epoch": 199} {"train_loss": -18.510704040527344, "global_step": 16578, "epoch": 199} {"train_loss": -17.899362564086914, "global_step": 16579, "epoch": 199} {"train_loss": -18.190458297729492, "global_step": 16580, "epoch": 199} {"train_loss": -18.127737045288086, "global_step": 16581, "epoch": 199} {"train_loss": -18.099149703979492, "global_step": 16582, "epoch": 199} {"train_loss": -18.180498123168945, "global_step": 16583, "epoch": 199} {"train_loss": -18.083837509155273, "global_step": 16584, "epoch": 199} {"train_loss": -18.155071258544922, "global_step": 16585, "epoch": 199} {"train_loss": -18.05621337890625, "global_step": 16586, "epoch": 199} {"train_loss": -18.10873031616211, "global_step": 16587, "epoch": 199} {"train_loss": -17.93335723876953, "global_step": 16588, "epoch": 199} {"train_loss": -18.28679656982422, "global_step": 16589, "epoch": 199} {"train_loss": -18.270278930664062, "global_step": 16590, "epoch": 199} {"train_loss": -18.29300880432129, "global_step": 16591, "epoch": 199} {"train_loss": -18.193944931030273, "global_step": 16592, "epoch": 199} {"train_loss": -18.15181541442871, "global_step": 16593, "epoch": 199} {"train_loss": -18.38190269470215, "global_step": 16594, "epoch": 199} {"train_loss": -18.138214111328125, "global_step": 16595, "epoch": 199} {"train_loss": -18.371938705444336, "global_step": 16596, "epoch": 199} {"train_loss": -18.450658798217773, "global_step": 16597, "epoch": 199} {"train_loss": -17.73059844970703, "global_step": 16598, "epoch": 199} {"train_loss": -18.17901324076825, "global_step": 16599, "epoch": 199, "val_loss": 6039014.0} {"train_loss": -18.225465774536133, "global_step": 16600, "epoch": 200} {"train_loss": -18.357898712158203, "global_step": 16601, "epoch": 200} {"train_loss": -17.9368896484375, "global_step": 16602, "epoch": 200} {"train_loss": -17.865018844604492, "global_step": 16603, "epoch": 200} {"train_loss": -18.27193832397461, "global_step": 16604, "epoch": 200} {"train_loss": -18.258974075317383, "global_step": 16605, "epoch": 200} {"train_loss": -18.013444900512695, "global_step": 16606, "epoch": 200} {"train_loss": -18.222257614135742, "global_step": 16607, "epoch": 200} {"train_loss": -18.036052703857422, "global_step": 16608, "epoch": 200} {"train_loss": -18.488718032836914, "global_step": 16609, "epoch": 200} {"train_loss": -18.27813148498535, "global_step": 16610, "epoch": 200} {"train_loss": -17.8145809173584, "global_step": 16611, "epoch": 200} {"train_loss": -18.451845169067383, "global_step": 16612, "epoch": 200} {"train_loss": -18.3940486907959, "global_step": 16613, "epoch": 200} {"train_loss": -18.240398406982422, "global_step": 16614, "epoch": 200} {"train_loss": -18.10772705078125, "global_step": 16615, "epoch": 200} {"train_loss": -18.41853904724121, "global_step": 16616, "epoch": 200} {"train_loss": -18.389341354370117, "global_step": 16617, "epoch": 200} {"train_loss": -18.10988998413086, "global_step": 16618, "epoch": 200} {"train_loss": -18.198808670043945, "global_step": 16619, "epoch": 200} {"train_loss": -18.23006248474121, "global_step": 16620, "epoch": 200} {"train_loss": -18.397092819213867, "global_step": 16621, "epoch": 200} {"train_loss": -18.358057022094727, "global_step": 16622, "epoch": 200} {"train_loss": -18.326841354370117, "global_step": 16623, "epoch": 200} {"train_loss": -18.085756301879883, "global_step": 16624, "epoch": 200} {"train_loss": -17.997509002685547, "global_step": 16625, "epoch": 200} {"train_loss": -18.318370819091797, "global_step": 16626, "epoch": 200} {"train_loss": -18.019577026367188, "global_step": 16627, "epoch": 200} {"train_loss": -18.658212661743164, "global_step": 16628, "epoch": 200} {"train_loss": -18.06954002380371, "global_step": 16629, "epoch": 200} {"train_loss": -17.970144271850586, "global_step": 16630, "epoch": 200} {"train_loss": -18.3978271484375, "global_step": 16631, "epoch": 200} {"train_loss": -18.101613998413086, "global_step": 16632, "epoch": 200} {"train_loss": -18.086660385131836, "global_step": 16633, "epoch": 200} {"train_loss": -17.846906661987305, "global_step": 16634, "epoch": 200} {"train_loss": -17.8084659576416, "global_step": 16635, "epoch": 200} {"train_loss": -18.323232650756836, "global_step": 16636, "epoch": 200} {"train_loss": -18.177091598510742, "global_step": 16637, "epoch": 200} {"train_loss": -17.846193313598633, "global_step": 16638, "epoch": 200} {"train_loss": -18.14795684814453, "global_step": 16639, "epoch": 200} {"train_loss": -18.339975357055664, "global_step": 16640, "epoch": 200} {"train_loss": -18.00141716003418, "global_step": 16641, "epoch": 200} {"train_loss": -17.7154541015625, "global_step": 16642, "epoch": 200} {"train_loss": -18.409345626831055, "global_step": 16643, "epoch": 200} {"train_loss": -18.153654098510742, "global_step": 16644, "epoch": 200} {"train_loss": -17.944889068603516, "global_step": 16645, "epoch": 200} {"train_loss": -17.99152183532715, "global_step": 16646, "epoch": 200} {"train_loss": -18.561416625976562, "global_step": 16647, "epoch": 200} {"train_loss": -18.4765625, "global_step": 16648, "epoch": 200} {"train_loss": -18.43317985534668, "global_step": 16649, "epoch": 200} {"train_loss": -18.0965633392334, "global_step": 16650, "epoch": 200} {"train_loss": -18.00273895263672, "global_step": 16651, "epoch": 200} {"train_loss": -18.535110473632812, "global_step": 16652, "epoch": 200} {"train_loss": -17.9332218170166, "global_step": 16653, "epoch": 200} {"train_loss": -18.5245361328125, "global_step": 16654, "epoch": 200} {"train_loss": -18.188642501831055, "global_step": 16655, "epoch": 200} {"train_loss": -18.262760162353516, "global_step": 16656, "epoch": 200} {"train_loss": -18.267606735229492, "global_step": 16657, "epoch": 200} {"train_loss": -18.130971908569336, "global_step": 16658, "epoch": 200} {"train_loss": -18.337963104248047, "global_step": 16659, "epoch": 200} {"train_loss": -18.158451080322266, "global_step": 16660, "epoch": 200} {"train_loss": -18.2718563079834, "global_step": 16661, "epoch": 200} {"train_loss": -18.246376037597656, "global_step": 16662, "epoch": 200} {"train_loss": -18.33021354675293, "global_step": 16663, "epoch": 200} {"train_loss": -18.117794036865234, "global_step": 16664, "epoch": 200} {"train_loss": -18.430917739868164, "global_step": 16665, "epoch": 200} {"train_loss": -18.200050354003906, "global_step": 16666, "epoch": 200} {"train_loss": -18.120267868041992, "global_step": 16667, "epoch": 200} {"train_loss": -18.51235008239746, "global_step": 16668, "epoch": 200} {"train_loss": -18.134689331054688, "global_step": 16669, "epoch": 200} {"train_loss": -18.5322208404541, "global_step": 16670, "epoch": 200} {"train_loss": -18.122356414794922, "global_step": 16671, "epoch": 200} {"train_loss": -18.546676635742188, "global_step": 16672, "epoch": 200} {"train_loss": -18.370769500732422, "global_step": 16673, "epoch": 200} {"train_loss": -18.37985610961914, "global_step": 16674, "epoch": 200} {"train_loss": -18.11774253845215, "global_step": 16675, "epoch": 200} {"train_loss": -18.171945571899414, "global_step": 16676, "epoch": 200} {"train_loss": -18.1568660736084, "global_step": 16677, "epoch": 200} {"train_loss": -18.066064834594727, "global_step": 16678, "epoch": 200} {"train_loss": -18.30631446838379, "global_step": 16679, "epoch": 200} {"train_loss": -18.001441955566406, "global_step": 16680, "epoch": 200} {"train_loss": -18.03767967224121, "global_step": 16681, "epoch": 200} {"train_loss": -18.183016076145403, "global_step": 16682, "epoch": 200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 0.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 0.0, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 0.0, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.5, "test/mean_score": 0.2727272727272727, "val_loss": 6325432.5} {"train_loss": -18.11858367919922, "global_step": 16683, "epoch": 201} {"train_loss": -18.095184326171875, "global_step": 16684, "epoch": 201} {"train_loss": -17.793502807617188, "global_step": 16685, "epoch": 201} {"train_loss": -18.035608291625977, "global_step": 16686, "epoch": 201} {"train_loss": -18.220869064331055, "global_step": 16687, "epoch": 201} {"train_loss": -17.806842803955078, "global_step": 16688, "epoch": 201} {"train_loss": -18.07440948486328, "global_step": 16689, "epoch": 201} {"train_loss": -18.15302085876465, "global_step": 16690, "epoch": 201} {"train_loss": -18.384017944335938, "global_step": 16691, "epoch": 201} {"train_loss": -18.171945571899414, "global_step": 16692, "epoch": 201} {"train_loss": -17.606460571289062, "global_step": 16693, "epoch": 201} {"train_loss": -18.05984878540039, "global_step": 16694, "epoch": 201} {"train_loss": -18.170217514038086, "global_step": 16695, "epoch": 201} {"train_loss": -18.012914657592773, "global_step": 16696, "epoch": 201} {"train_loss": -18.08987045288086, "global_step": 16697, "epoch": 201} {"train_loss": -17.988683700561523, "global_step": 16698, "epoch": 201} {"train_loss": -17.79067039489746, "global_step": 16699, "epoch": 201} {"train_loss": -17.88739585876465, "global_step": 16700, "epoch": 201} {"train_loss": -18.13658332824707, "global_step": 16701, "epoch": 201} {"train_loss": -17.827226638793945, "global_step": 16702, "epoch": 201} {"train_loss": -17.97138786315918, "global_step": 16703, "epoch": 201} {"train_loss": -18.321062088012695, "global_step": 16704, "epoch": 201} {"train_loss": -18.0462646484375, "global_step": 16705, "epoch": 201} {"train_loss": -17.896390914916992, "global_step": 16706, "epoch": 201} {"train_loss": -17.959930419921875, "global_step": 16707, "epoch": 201} {"train_loss": -18.201963424682617, "global_step": 16708, "epoch": 201} {"train_loss": -17.87099266052246, "global_step": 16709, "epoch": 201} {"train_loss": -17.820898056030273, "global_step": 16710, "epoch": 201} {"train_loss": -18.317302703857422, "global_step": 16711, "epoch": 201} {"train_loss": -18.198633193969727, "global_step": 16712, "epoch": 201} {"train_loss": -18.09627342224121, "global_step": 16713, "epoch": 201} {"train_loss": -18.072973251342773, "global_step": 16714, "epoch": 201} {"train_loss": -18.23752784729004, "global_step": 16715, "epoch": 201} {"train_loss": -18.377912521362305, "global_step": 16716, "epoch": 201} {"train_loss": -18.26447105407715, "global_step": 16717, "epoch": 201} {"train_loss": -18.038135528564453, "global_step": 16718, "epoch": 201} {"train_loss": -18.06890869140625, "global_step": 16719, "epoch": 201} {"train_loss": -18.543886184692383, "global_step": 16720, "epoch": 201} {"train_loss": -18.28986930847168, "global_step": 16721, "epoch": 201} {"train_loss": -18.429677963256836, "global_step": 16722, "epoch": 201} {"train_loss": -18.435436248779297, "global_step": 16723, "epoch": 201} {"train_loss": -18.363746643066406, "global_step": 16724, "epoch": 201} {"train_loss": -18.3902645111084, "global_step": 16725, "epoch": 201} {"train_loss": -17.914413452148438, "global_step": 16726, "epoch": 201} {"train_loss": -18.344377517700195, "global_step": 16727, "epoch": 201} {"train_loss": -18.315404891967773, "global_step": 16728, "epoch": 201} {"train_loss": -18.11998176574707, "global_step": 16729, "epoch": 201} {"train_loss": -18.32630729675293, "global_step": 16730, "epoch": 201} {"train_loss": -18.08909034729004, "global_step": 16731, "epoch": 201} {"train_loss": -17.961585998535156, "global_step": 16732, "epoch": 201} {"train_loss": -18.43185806274414, "global_step": 16733, "epoch": 201} {"train_loss": -18.078781127929688, "global_step": 16734, "epoch": 201} {"train_loss": -18.39179229736328, "global_step": 16735, "epoch": 201} {"train_loss": -18.12213706970215, "global_step": 16736, "epoch": 201} {"train_loss": -17.98871421813965, "global_step": 16737, "epoch": 201} {"train_loss": -18.0212345123291, "global_step": 16738, "epoch": 201} {"train_loss": -18.263246536254883, "global_step": 16739, "epoch": 201} {"train_loss": -18.040361404418945, "global_step": 16740, "epoch": 201} {"train_loss": -18.252052307128906, "global_step": 16741, "epoch": 201} {"train_loss": -17.990875244140625, "global_step": 16742, "epoch": 201} {"train_loss": -18.019201278686523, "global_step": 16743, "epoch": 201} {"train_loss": -18.194740295410156, "global_step": 16744, "epoch": 201} {"train_loss": -18.311437606811523, "global_step": 16745, "epoch": 201} {"train_loss": -18.096054077148438, "global_step": 16746, "epoch": 201} {"train_loss": -18.306310653686523, "global_step": 16747, "epoch": 201} {"train_loss": -18.494487762451172, "global_step": 16748, "epoch": 201} {"train_loss": -17.949432373046875, "global_step": 16749, "epoch": 201} {"train_loss": -18.170623779296875, "global_step": 16750, "epoch": 201} {"train_loss": -18.247371673583984, "global_step": 16751, "epoch": 201} {"train_loss": -18.242725372314453, "global_step": 16752, "epoch": 201} {"train_loss": -18.07090187072754, "global_step": 16753, "epoch": 201} {"train_loss": -18.4873104095459, "global_step": 16754, "epoch": 201} {"train_loss": -18.323665618896484, "global_step": 16755, "epoch": 201} {"train_loss": -18.322654724121094, "global_step": 16756, "epoch": 201} {"train_loss": -18.16933250427246, "global_step": 16757, "epoch": 201} {"train_loss": -18.15096092224121, "global_step": 16758, "epoch": 201} {"train_loss": -18.380813598632812, "global_step": 16759, "epoch": 201} {"train_loss": -17.858854293823242, "global_step": 16760, "epoch": 201} {"train_loss": -18.28917694091797, "global_step": 16761, "epoch": 201} {"train_loss": -18.29805564880371, "global_step": 16762, "epoch": 201} {"train_loss": -18.20754051208496, "global_step": 16763, "epoch": 201} {"train_loss": -18.04574966430664, "global_step": 16764, "epoch": 201} {"train_loss": -18.153648905007238, "global_step": 16765, "epoch": 201, "val_loss": 6116926.0} {"train_loss": -18.25323486328125, "global_step": 16766, "epoch": 202} {"train_loss": -18.140913009643555, "global_step": 16767, "epoch": 202} {"train_loss": -18.23297119140625, "global_step": 16768, "epoch": 202} {"train_loss": -18.016422271728516, "global_step": 16769, "epoch": 202} {"train_loss": -17.906293869018555, "global_step": 16770, "epoch": 202} {"train_loss": -18.287261962890625, "global_step": 16771, "epoch": 202} {"train_loss": -18.037342071533203, "global_step": 16772, "epoch": 202} {"train_loss": -18.102563858032227, "global_step": 16773, "epoch": 202} {"train_loss": -18.04288101196289, "global_step": 16774, "epoch": 202} {"train_loss": -18.054527282714844, "global_step": 16775, "epoch": 202} {"train_loss": -18.282102584838867, "global_step": 16776, "epoch": 202} {"train_loss": -18.372133255004883, "global_step": 16777, "epoch": 202} {"train_loss": -18.54084587097168, "global_step": 16778, "epoch": 202} {"train_loss": -18.13515281677246, "global_step": 16779, "epoch": 202} {"train_loss": -17.98740577697754, "global_step": 16780, "epoch": 202} {"train_loss": -18.462461471557617, "global_step": 16781, "epoch": 202} {"train_loss": -17.999731063842773, "global_step": 16782, "epoch": 202} {"train_loss": -18.371835708618164, "global_step": 16783, "epoch": 202} {"train_loss": -18.44202995300293, "global_step": 16784, "epoch": 202} {"train_loss": -18.312503814697266, "global_step": 16785, "epoch": 202} {"train_loss": -18.15545654296875, "global_step": 16786, "epoch": 202} {"train_loss": -17.953704833984375, "global_step": 16787, "epoch": 202} {"train_loss": -17.958860397338867, "global_step": 16788, "epoch": 202} {"train_loss": -18.076990127563477, "global_step": 16789, "epoch": 202} {"train_loss": -18.118606567382812, "global_step": 16790, "epoch": 202} {"train_loss": -18.133102416992188, "global_step": 16791, "epoch": 202} {"train_loss": -18.133848190307617, "global_step": 16792, "epoch": 202} {"train_loss": -18.286457061767578, "global_step": 16793, "epoch": 202} {"train_loss": -18.309022903442383, "global_step": 16794, "epoch": 202} {"train_loss": -18.290647506713867, "global_step": 16795, "epoch": 202} {"train_loss": -18.15789794921875, "global_step": 16796, "epoch": 202} {"train_loss": -18.480178833007812, "global_step": 16797, "epoch": 202} {"train_loss": -17.974172592163086, "global_step": 16798, "epoch": 202} {"train_loss": -18.215085983276367, "global_step": 16799, "epoch": 202} {"train_loss": -18.389135360717773, "global_step": 16800, "epoch": 202} {"train_loss": -18.46933364868164, "global_step": 16801, "epoch": 202} {"train_loss": -18.03962516784668, "global_step": 16802, "epoch": 202} {"train_loss": -18.430164337158203, "global_step": 16803, "epoch": 202} {"train_loss": -17.995838165283203, "global_step": 16804, "epoch": 202} {"train_loss": -18.04469108581543, "global_step": 16805, "epoch": 202} {"train_loss": -18.43379020690918, "global_step": 16806, "epoch": 202} {"train_loss": -18.109050750732422, "global_step": 16807, "epoch": 202} {"train_loss": -17.891542434692383, "global_step": 16808, "epoch": 202} {"train_loss": -18.163053512573242, "global_step": 16809, "epoch": 202} {"train_loss": -17.633255004882812, "global_step": 16810, "epoch": 202} {"train_loss": -18.33681869506836, "global_step": 16811, "epoch": 202} {"train_loss": -17.91423225402832, "global_step": 16812, "epoch": 202} {"train_loss": -17.826679229736328, "global_step": 16813, "epoch": 202} {"train_loss": -18.021055221557617, "global_step": 16814, "epoch": 202} {"train_loss": -18.678747177124023, "global_step": 16815, "epoch": 202} {"train_loss": -18.39534568786621, "global_step": 16816, "epoch": 202} {"train_loss": -18.25969696044922, "global_step": 16817, "epoch": 202} {"train_loss": -18.164100646972656, "global_step": 16818, "epoch": 202} {"train_loss": -18.118497848510742, "global_step": 16819, "epoch": 202} {"train_loss": -18.079050064086914, "global_step": 16820, "epoch": 202} {"train_loss": -18.031028747558594, "global_step": 16821, "epoch": 202} {"train_loss": -18.33255386352539, "global_step": 16822, "epoch": 202} {"train_loss": -18.279748916625977, "global_step": 16823, "epoch": 202} {"train_loss": -18.010786056518555, "global_step": 16824, "epoch": 202} {"train_loss": -18.094318389892578, "global_step": 16825, "epoch": 202} {"train_loss": -18.58793067932129, "global_step": 16826, "epoch": 202} {"train_loss": -18.312744140625, "global_step": 16827, "epoch": 202} {"train_loss": -17.912071228027344, "global_step": 16828, "epoch": 202} {"train_loss": -18.60244369506836, "global_step": 16829, "epoch": 202} {"train_loss": -18.248239517211914, "global_step": 16830, "epoch": 202} {"train_loss": -17.99018669128418, "global_step": 16831, "epoch": 202} {"train_loss": -17.80597686767578, "global_step": 16832, "epoch": 202} {"train_loss": -18.3883056640625, "global_step": 16833, "epoch": 202} {"train_loss": -18.554983139038086, "global_step": 16834, "epoch": 202} {"train_loss": -18.204206466674805, "global_step": 16835, "epoch": 202} {"train_loss": -18.26873207092285, "global_step": 16836, "epoch": 202} {"train_loss": -18.43086051940918, "global_step": 16837, "epoch": 202} {"train_loss": -18.109039306640625, "global_step": 16838, "epoch": 202} {"train_loss": -18.51804542541504, "global_step": 16839, "epoch": 202} {"train_loss": -18.07382583618164, "global_step": 16840, "epoch": 202} {"train_loss": -18.705289840698242, "global_step": 16841, "epoch": 202} {"train_loss": -18.12721824645996, "global_step": 16842, "epoch": 202} {"train_loss": -18.56494903564453, "global_step": 16843, "epoch": 202} {"train_loss": -18.1940860748291, "global_step": 16844, "epoch": 202} {"train_loss": -17.925283432006836, "global_step": 16845, "epoch": 202} {"train_loss": -18.363025665283203, "global_step": 16846, "epoch": 202} {"train_loss": -18.48059844970703, "global_step": 16847, "epoch": 202} {"train_loss": -18.208465920873437, "global_step": 16848, "epoch": 202, "val_loss": 5994589.5} {"train_loss": -18.053775787353516, "global_step": 16849, "epoch": 203} {"train_loss": -18.086271286010742, "global_step": 16850, "epoch": 203} {"train_loss": -17.92314910888672, "global_step": 16851, "epoch": 203} {"train_loss": -17.845840454101562, "global_step": 16852, "epoch": 203} {"train_loss": -18.306989669799805, "global_step": 16853, "epoch": 203} {"train_loss": -17.927778244018555, "global_step": 16854, "epoch": 203} {"train_loss": -18.041906356811523, "global_step": 16855, "epoch": 203} {"train_loss": -18.017244338989258, "global_step": 16856, "epoch": 203} {"train_loss": -18.47128677368164, "global_step": 16857, "epoch": 203} {"train_loss": -18.015392303466797, "global_step": 16858, "epoch": 203} {"train_loss": -18.610301971435547, "global_step": 16859, "epoch": 203} {"train_loss": -17.988656997680664, "global_step": 16860, "epoch": 203} {"train_loss": -18.22332763671875, "global_step": 16861, "epoch": 203} {"train_loss": -18.308544158935547, "global_step": 16862, "epoch": 203} {"train_loss": -18.162858963012695, "global_step": 16863, "epoch": 203} {"train_loss": -17.7415771484375, "global_step": 16864, "epoch": 203} {"train_loss": -18.0947322845459, "global_step": 16865, "epoch": 203} {"train_loss": -18.28573226928711, "global_step": 16866, "epoch": 203} {"train_loss": -18.407934188842773, "global_step": 16867, "epoch": 203} {"train_loss": -18.07849884033203, "global_step": 16868, "epoch": 203} {"train_loss": -18.367212295532227, "global_step": 16869, "epoch": 203} {"train_loss": -17.962461471557617, "global_step": 16870, "epoch": 203} {"train_loss": -18.361486434936523, "global_step": 16871, "epoch": 203} {"train_loss": -18.021997451782227, "global_step": 16872, "epoch": 203} {"train_loss": -18.151880264282227, "global_step": 16873, "epoch": 203} {"train_loss": -18.412954330444336, "global_step": 16874, "epoch": 203} {"train_loss": -18.201187133789062, "global_step": 16875, "epoch": 203} {"train_loss": -18.278005599975586, "global_step": 16876, "epoch": 203} {"train_loss": -18.439828872680664, "global_step": 16877, "epoch": 203} {"train_loss": -18.594579696655273, "global_step": 16878, "epoch": 203} {"train_loss": -18.326753616333008, "global_step": 16879, "epoch": 203} {"train_loss": -18.69525718688965, "global_step": 16880, "epoch": 203} {"train_loss": -18.522552490234375, "global_step": 16881, "epoch": 203} {"train_loss": -17.783464431762695, "global_step": 16882, "epoch": 203} {"train_loss": -18.21506690979004, "global_step": 16883, "epoch": 203} {"train_loss": -17.878461837768555, "global_step": 16884, "epoch": 203} {"train_loss": -18.36425018310547, "global_step": 16885, "epoch": 203} {"train_loss": -18.055456161499023, "global_step": 16886, "epoch": 203} {"train_loss": -18.18942642211914, "global_step": 16887, "epoch": 203} {"train_loss": -18.295852661132812, "global_step": 16888, "epoch": 203} {"train_loss": -18.079639434814453, "global_step": 16889, "epoch": 203} {"train_loss": -17.858129501342773, "global_step": 16890, "epoch": 203} {"train_loss": -18.329315185546875, "global_step": 16891, "epoch": 203} {"train_loss": -18.12357521057129, "global_step": 16892, "epoch": 203} {"train_loss": -18.287979125976562, "global_step": 16893, "epoch": 203} {"train_loss": -18.388158798217773, "global_step": 16894, "epoch": 203} {"train_loss": -18.397796630859375, "global_step": 16895, "epoch": 203} {"train_loss": -17.839323043823242, "global_step": 16896, "epoch": 203} {"train_loss": -18.2578125, "global_step": 16897, "epoch": 203} {"train_loss": -18.04132652282715, "global_step": 16898, "epoch": 203} {"train_loss": -18.123210906982422, "global_step": 16899, "epoch": 203} {"train_loss": -18.26116371154785, "global_step": 16900, "epoch": 203} {"train_loss": -17.96126365661621, "global_step": 16901, "epoch": 203} {"train_loss": -18.448043823242188, "global_step": 16902, "epoch": 203} {"train_loss": -18.346410751342773, "global_step": 16903, "epoch": 203} {"train_loss": -17.967655181884766, "global_step": 16904, "epoch": 203} {"train_loss": -18.411863327026367, "global_step": 16905, "epoch": 203} {"train_loss": -18.717695236206055, "global_step": 16906, "epoch": 203} {"train_loss": -18.54079818725586, "global_step": 16907, "epoch": 203} {"train_loss": -18.1980037689209, "global_step": 16908, "epoch": 203} {"train_loss": -18.22254753112793, "global_step": 16909, "epoch": 203} {"train_loss": -18.761518478393555, "global_step": 16910, "epoch": 203} {"train_loss": -18.328123092651367, "global_step": 16911, "epoch": 203} {"train_loss": -18.329626083374023, "global_step": 16912, "epoch": 203} {"train_loss": -18.091066360473633, "global_step": 16913, "epoch": 203} {"train_loss": -18.125091552734375, "global_step": 16914, "epoch": 203} {"train_loss": -18.023300170898438, "global_step": 16915, "epoch": 203} {"train_loss": -18.06614112854004, "global_step": 16916, "epoch": 203} {"train_loss": -17.952672958374023, "global_step": 16917, "epoch": 203} {"train_loss": -18.3563232421875, "global_step": 16918, "epoch": 203} {"train_loss": -18.35342025756836, "global_step": 16919, "epoch": 203} {"train_loss": -18.19952392578125, "global_step": 16920, "epoch": 203} {"train_loss": -17.96895408630371, "global_step": 16921, "epoch": 203} {"train_loss": -18.470396041870117, "global_step": 16922, "epoch": 203} {"train_loss": -18.036418914794922, "global_step": 16923, "epoch": 203} {"train_loss": -18.185949325561523, "global_step": 16924, "epoch": 203} {"train_loss": -18.653348922729492, "global_step": 16925, "epoch": 203} {"train_loss": -18.13738250732422, "global_step": 16926, "epoch": 203} {"train_loss": -17.455198287963867, "global_step": 16927, "epoch": 203} {"train_loss": -18.456449508666992, "global_step": 16928, "epoch": 203} {"train_loss": -18.573312759399414, "global_step": 16929, "epoch": 203} {"train_loss": -17.85760498046875, "global_step": 16930, "epoch": 203} {"train_loss": -18.209591532328044, "global_step": 16931, "epoch": 203, "val_loss": 6291723.0} {"train_loss": -17.71061134338379, "global_step": 16932, "epoch": 204} {"train_loss": -17.960790634155273, "global_step": 16933, "epoch": 204} {"train_loss": -18.625120162963867, "global_step": 16934, "epoch": 204} {"train_loss": -18.256967544555664, "global_step": 16935, "epoch": 204} {"train_loss": -18.33505630493164, "global_step": 16936, "epoch": 204} {"train_loss": -18.252172470092773, "global_step": 16937, "epoch": 204} {"train_loss": -18.359037399291992, "global_step": 16938, "epoch": 204} {"train_loss": -18.46198844909668, "global_step": 16939, "epoch": 204} {"train_loss": -17.86663246154785, "global_step": 16940, "epoch": 204} {"train_loss": -18.81105613708496, "global_step": 16941, "epoch": 204} {"train_loss": -18.35663414001465, "global_step": 16942, "epoch": 204} {"train_loss": -18.304534912109375, "global_step": 16943, "epoch": 204} {"train_loss": -18.218027114868164, "global_step": 16944, "epoch": 204} {"train_loss": -18.23874855041504, "global_step": 16945, "epoch": 204} {"train_loss": -17.79806137084961, "global_step": 16946, "epoch": 204} {"train_loss": -18.200916290283203, "global_step": 16947, "epoch": 204} {"train_loss": -18.180011749267578, "global_step": 16948, "epoch": 204} {"train_loss": -17.818885803222656, "global_step": 16949, "epoch": 204} {"train_loss": -18.260501861572266, "global_step": 16950, "epoch": 204} {"train_loss": -18.24881935119629, "global_step": 16951, "epoch": 204} {"train_loss": -18.163522720336914, "global_step": 16952, "epoch": 204} {"train_loss": -18.471561431884766, "global_step": 16953, "epoch": 204} {"train_loss": -18.10358428955078, "global_step": 16954, "epoch": 204} {"train_loss": -18.436447143554688, "global_step": 16955, "epoch": 204} {"train_loss": -18.152090072631836, "global_step": 16956, "epoch": 204} {"train_loss": -18.15870475769043, "global_step": 16957, "epoch": 204} {"train_loss": -18.495344161987305, "global_step": 16958, "epoch": 204} {"train_loss": -17.975852966308594, "global_step": 16959, "epoch": 204} {"train_loss": -17.813505172729492, "global_step": 16960, "epoch": 204} {"train_loss": -17.71116065979004, "global_step": 16961, "epoch": 204} {"train_loss": -18.512195587158203, "global_step": 16962, "epoch": 204} {"train_loss": -18.174665451049805, "global_step": 16963, "epoch": 204} {"train_loss": -17.851123809814453, "global_step": 16964, "epoch": 204} {"train_loss": -18.368572235107422, "global_step": 16965, "epoch": 204} {"train_loss": -18.55338478088379, "global_step": 16966, "epoch": 204} {"train_loss": -18.181976318359375, "global_step": 16967, "epoch": 204} {"train_loss": -17.929096221923828, "global_step": 16968, "epoch": 204} {"train_loss": -18.334325790405273, "global_step": 16969, "epoch": 204} {"train_loss": -18.0843448638916, "global_step": 16970, "epoch": 204} {"train_loss": -18.440702438354492, "global_step": 16971, "epoch": 204} {"train_loss": -18.112300872802734, "global_step": 16972, "epoch": 204} {"train_loss": -17.905406951904297, "global_step": 16973, "epoch": 204} {"train_loss": -18.319293975830078, "global_step": 16974, "epoch": 204} {"train_loss": -17.613861083984375, "global_step": 16975, "epoch": 204} {"train_loss": -18.309127807617188, "global_step": 16976, "epoch": 204} {"train_loss": -18.554214477539062, "global_step": 16977, "epoch": 204} {"train_loss": -18.118009567260742, "global_step": 16978, "epoch": 204} {"train_loss": -18.33130645751953, "global_step": 16979, "epoch": 204} {"train_loss": -18.388975143432617, "global_step": 16980, "epoch": 204} {"train_loss": -18.01532554626465, "global_step": 16981, "epoch": 204} {"train_loss": -17.964338302612305, "global_step": 16982, "epoch": 204} {"train_loss": -17.8456974029541, "global_step": 16983, "epoch": 204} {"train_loss": -18.25128936767578, "global_step": 16984, "epoch": 204} {"train_loss": -18.21010398864746, "global_step": 16985, "epoch": 204} {"train_loss": -18.347631454467773, "global_step": 16986, "epoch": 204} {"train_loss": -18.11037254333496, "global_step": 16987, "epoch": 204} {"train_loss": -18.104209899902344, "global_step": 16988, "epoch": 204} {"train_loss": -18.247446060180664, "global_step": 16989, "epoch": 204} {"train_loss": -18.152257919311523, "global_step": 16990, "epoch": 204} {"train_loss": -18.451980590820312, "global_step": 16991, "epoch": 204} {"train_loss": -18.19545555114746, "global_step": 16992, "epoch": 204} {"train_loss": -17.910879135131836, "global_step": 16993, "epoch": 204} {"train_loss": -18.68694496154785, "global_step": 16994, "epoch": 204} {"train_loss": -18.013816833496094, "global_step": 16995, "epoch": 204} {"train_loss": -18.379840850830078, "global_step": 16996, "epoch": 204} {"train_loss": -17.778305053710938, "global_step": 16997, "epoch": 204} {"train_loss": -18.328031539916992, "global_step": 16998, "epoch": 204} {"train_loss": -18.59848403930664, "global_step": 16999, "epoch": 204} {"train_loss": -17.991727828979492, "global_step": 17000, "epoch": 204} {"train_loss": -18.502164840698242, "global_step": 17001, "epoch": 204} {"train_loss": -18.278268814086914, "global_step": 17002, "epoch": 204} {"train_loss": -18.312841415405273, "global_step": 17003, "epoch": 204} {"train_loss": -18.274948120117188, "global_step": 17004, "epoch": 204} {"train_loss": -18.323331832885742, "global_step": 17005, "epoch": 204} {"train_loss": -18.257741928100586, "global_step": 17006, "epoch": 204} {"train_loss": -18.0891056060791, "global_step": 17007, "epoch": 204} {"train_loss": -18.444257736206055, "global_step": 17008, "epoch": 204} {"train_loss": -18.36737632751465, "global_step": 17009, "epoch": 204} {"train_loss": -18.388586044311523, "global_step": 17010, "epoch": 204} {"train_loss": -18.37294578552246, "global_step": 17011, "epoch": 204} {"train_loss": -18.603513717651367, "global_step": 17012, "epoch": 204} {"train_loss": -18.018735885620117, "global_step": 17013, "epoch": 204} {"train_loss": -18.236907890044062, "global_step": 17014, "epoch": 204, "val_loss": 6000914.0} {"train_loss": -18.206274032592773, "global_step": 17015, "epoch": 205} {"train_loss": -17.915695190429688, "global_step": 17016, "epoch": 205} {"train_loss": -17.478273391723633, "global_step": 17017, "epoch": 205} {"train_loss": -18.154287338256836, "global_step": 17018, "epoch": 205} {"train_loss": -18.592144012451172, "global_step": 17019, "epoch": 205} {"train_loss": -18.3895320892334, "global_step": 17020, "epoch": 205} {"train_loss": -17.953100204467773, "global_step": 17021, "epoch": 205} {"train_loss": -17.975496292114258, "global_step": 17022, "epoch": 205} {"train_loss": -18.116193771362305, "global_step": 17023, "epoch": 205} {"train_loss": -17.864337921142578, "global_step": 17024, "epoch": 205} {"train_loss": -18.067285537719727, "global_step": 17025, "epoch": 205} {"train_loss": -18.75223731994629, "global_step": 17026, "epoch": 205} {"train_loss": -18.390865325927734, "global_step": 17027, "epoch": 205} {"train_loss": -18.57484245300293, "global_step": 17028, "epoch": 205} {"train_loss": -18.3172550201416, "global_step": 17029, "epoch": 205} {"train_loss": -18.440277099609375, "global_step": 17030, "epoch": 205} {"train_loss": -17.990055084228516, "global_step": 17031, "epoch": 205} {"train_loss": -18.32184410095215, "global_step": 17032, "epoch": 205} {"train_loss": -18.457595825195312, "global_step": 17033, "epoch": 205} {"train_loss": -18.355945587158203, "global_step": 17034, "epoch": 205} {"train_loss": -17.983997344970703, "global_step": 17035, "epoch": 205} {"train_loss": -18.119295120239258, "global_step": 17036, "epoch": 205} {"train_loss": -18.36476707458496, "global_step": 17037, "epoch": 205} {"train_loss": -18.483016967773438, "global_step": 17038, "epoch": 205} {"train_loss": -18.07362937927246, "global_step": 17039, "epoch": 205} {"train_loss": -18.431310653686523, "global_step": 17040, "epoch": 205} {"train_loss": -18.00087547302246, "global_step": 17041, "epoch": 205} {"train_loss": -17.91652488708496, "global_step": 17042, "epoch": 205} {"train_loss": -18.296358108520508, "global_step": 17043, "epoch": 205} {"train_loss": -18.618566513061523, "global_step": 17044, "epoch": 205} {"train_loss": -18.31300163269043, "global_step": 17045, "epoch": 205} {"train_loss": -18.0466365814209, "global_step": 17046, "epoch": 205} {"train_loss": -18.144704818725586, "global_step": 17047, "epoch": 205} {"train_loss": -18.284059524536133, "global_step": 17048, "epoch": 205} {"train_loss": -18.276838302612305, "global_step": 17049, "epoch": 205} {"train_loss": -18.196094512939453, "global_step": 17050, "epoch": 205} {"train_loss": -17.73805046081543, "global_step": 17051, "epoch": 205} {"train_loss": -18.372220993041992, "global_step": 17052, "epoch": 205} {"train_loss": -18.404422760009766, "global_step": 17053, "epoch": 205} {"train_loss": -18.18194580078125, "global_step": 17054, "epoch": 205} {"train_loss": -18.214258193969727, "global_step": 17055, "epoch": 205} {"train_loss": -18.24066734313965, "global_step": 17056, "epoch": 205} {"train_loss": -18.432655334472656, "global_step": 17057, "epoch": 205} {"train_loss": -18.26906394958496, "global_step": 17058, "epoch": 205} {"train_loss": -18.031658172607422, "global_step": 17059, "epoch": 205} {"train_loss": -18.074779510498047, "global_step": 17060, "epoch": 205} {"train_loss": -18.121810913085938, "global_step": 17061, "epoch": 205} {"train_loss": -18.366334915161133, "global_step": 17062, "epoch": 205} {"train_loss": -17.768766403198242, "global_step": 17063, "epoch": 205} {"train_loss": -18.39531898498535, "global_step": 17064, "epoch": 205} {"train_loss": -18.113697052001953, "global_step": 17065, "epoch": 205} {"train_loss": -18.329635620117188, "global_step": 17066, "epoch": 205} {"train_loss": -17.8792781829834, "global_step": 17067, "epoch": 205} {"train_loss": -18.279071807861328, "global_step": 17068, "epoch": 205} {"train_loss": -18.26478385925293, "global_step": 17069, "epoch": 205} {"train_loss": -18.198671340942383, "global_step": 17070, "epoch": 205} {"train_loss": -18.092260360717773, "global_step": 17071, "epoch": 205} {"train_loss": -18.460847854614258, "global_step": 17072, "epoch": 205} {"train_loss": -18.258359909057617, "global_step": 17073, "epoch": 205} {"train_loss": -18.379636764526367, "global_step": 17074, "epoch": 205} {"train_loss": -18.320297241210938, "global_step": 17075, "epoch": 205} {"train_loss": -17.936994552612305, "global_step": 17076, "epoch": 205} {"train_loss": -18.242733001708984, "global_step": 17077, "epoch": 205} {"train_loss": -18.21443748474121, "global_step": 17078, "epoch": 205} {"train_loss": -18.221797943115234, "global_step": 17079, "epoch": 205} {"train_loss": -17.951492309570312, "global_step": 17080, "epoch": 205} {"train_loss": -18.556997299194336, "global_step": 17081, "epoch": 205} {"train_loss": -18.309207916259766, "global_step": 17082, "epoch": 205} {"train_loss": -18.519529342651367, "global_step": 17083, "epoch": 205} {"train_loss": -18.195032119750977, "global_step": 17084, "epoch": 205} {"train_loss": -18.31787109375, "global_step": 17085, "epoch": 205} {"train_loss": -18.156583786010742, "global_step": 17086, "epoch": 205} {"train_loss": -17.64993667602539, "global_step": 17087, "epoch": 205} {"train_loss": -18.350875854492188, "global_step": 17088, "epoch": 205} {"train_loss": -17.99518585205078, "global_step": 17089, "epoch": 205} {"train_loss": -18.418231964111328, "global_step": 17090, "epoch": 205} {"train_loss": -18.21149253845215, "global_step": 17091, "epoch": 205} {"train_loss": -17.686290740966797, "global_step": 17092, "epoch": 205} {"train_loss": -18.27487564086914, "global_step": 17093, "epoch": 205} {"train_loss": -18.49318504333496, "global_step": 17094, "epoch": 205} {"train_loss": -18.111289978027344, "global_step": 17095, "epoch": 205} {"train_loss": -18.805612564086914, "global_step": 17096, "epoch": 205} {"train_loss": -18.212766509458245, "global_step": 17097, "epoch": 205, "val_loss": 6174329.0} {"train_loss": -18.1300048828125, "global_step": 17098, "epoch": 206} {"train_loss": -18.11359977722168, "global_step": 17099, "epoch": 206} {"train_loss": -17.561416625976562, "global_step": 17100, "epoch": 206} {"train_loss": -17.87520408630371, "global_step": 17101, "epoch": 206} {"train_loss": -18.306385040283203, "global_step": 17102, "epoch": 206} {"train_loss": -17.92167091369629, "global_step": 17103, "epoch": 206} {"train_loss": -18.172500610351562, "global_step": 17104, "epoch": 206} {"train_loss": -18.200641632080078, "global_step": 17105, "epoch": 206} {"train_loss": -17.8192081451416, "global_step": 17106, "epoch": 206} {"train_loss": -17.488056182861328, "global_step": 17107, "epoch": 206} {"train_loss": -17.723249435424805, "global_step": 17108, "epoch": 206} {"train_loss": -18.01731300354004, "global_step": 17109, "epoch": 206} {"train_loss": -18.110841751098633, "global_step": 17110, "epoch": 206} {"train_loss": -17.975156784057617, "global_step": 17111, "epoch": 206} {"train_loss": -18.199399948120117, "global_step": 17112, "epoch": 206} {"train_loss": -18.039724349975586, "global_step": 17113, "epoch": 206} {"train_loss": -17.92105484008789, "global_step": 17114, "epoch": 206} {"train_loss": -17.98634147644043, "global_step": 17115, "epoch": 206} {"train_loss": -18.471256256103516, "global_step": 17116, "epoch": 206} {"train_loss": -18.473983764648438, "global_step": 17117, "epoch": 206} {"train_loss": -18.240299224853516, "global_step": 17118, "epoch": 206} {"train_loss": -18.409162521362305, "global_step": 17119, "epoch": 206} {"train_loss": -18.291227340698242, "global_step": 17120, "epoch": 206} {"train_loss": -18.250043869018555, "global_step": 17121, "epoch": 206} {"train_loss": -17.858224868774414, "global_step": 17122, "epoch": 206} {"train_loss": -17.92620277404785, "global_step": 17123, "epoch": 206} {"train_loss": -18.542781829833984, "global_step": 17124, "epoch": 206} {"train_loss": -18.462682723999023, "global_step": 17125, "epoch": 206} {"train_loss": -18.378570556640625, "global_step": 17126, "epoch": 206} {"train_loss": -18.40059471130371, "global_step": 17127, "epoch": 206} {"train_loss": -18.542585372924805, "global_step": 17128, "epoch": 206} {"train_loss": -18.075624465942383, "global_step": 17129, "epoch": 206} {"train_loss": -18.272724151611328, "global_step": 17130, "epoch": 206} {"train_loss": -18.158620834350586, "global_step": 17131, "epoch": 206} {"train_loss": -18.316665649414062, "global_step": 17132, "epoch": 206} {"train_loss": -18.31117057800293, "global_step": 17133, "epoch": 206} {"train_loss": -18.35112953186035, "global_step": 17134, "epoch": 206} {"train_loss": -18.08876609802246, "global_step": 17135, "epoch": 206} {"train_loss": -18.417877197265625, "global_step": 17136, "epoch": 206} {"train_loss": -18.524587631225586, "global_step": 17137, "epoch": 206} {"train_loss": -18.538238525390625, "global_step": 17138, "epoch": 206} {"train_loss": -18.18898582458496, "global_step": 17139, "epoch": 206} {"train_loss": -18.23763656616211, "global_step": 17140, "epoch": 206} {"train_loss": -17.94159507751465, "global_step": 17141, "epoch": 206} {"train_loss": -18.423959732055664, "global_step": 17142, "epoch": 206} {"train_loss": -18.294021606445312, "global_step": 17143, "epoch": 206} {"train_loss": -17.87477684020996, "global_step": 17144, "epoch": 206} {"train_loss": -18.654184341430664, "global_step": 17145, "epoch": 206} {"train_loss": -18.364526748657227, "global_step": 17146, "epoch": 206} {"train_loss": -18.152875900268555, "global_step": 17147, "epoch": 206} {"train_loss": -18.129711151123047, "global_step": 17148, "epoch": 206} {"train_loss": -17.97393798828125, "global_step": 17149, "epoch": 206} {"train_loss": -17.843122482299805, "global_step": 17150, "epoch": 206} {"train_loss": -18.352859497070312, "global_step": 17151, "epoch": 206} {"train_loss": -18.44957733154297, "global_step": 17152, "epoch": 206} {"train_loss": -18.37200927734375, "global_step": 17153, "epoch": 206} {"train_loss": -18.64798355102539, "global_step": 17154, "epoch": 206} {"train_loss": -18.149700164794922, "global_step": 17155, "epoch": 206} {"train_loss": -18.128854751586914, "global_step": 17156, "epoch": 206} {"train_loss": -18.306476593017578, "global_step": 17157, "epoch": 206} {"train_loss": -18.014089584350586, "global_step": 17158, "epoch": 206} {"train_loss": -18.01190757751465, "global_step": 17159, "epoch": 206} {"train_loss": -18.050230026245117, "global_step": 17160, "epoch": 206} {"train_loss": -17.86652183532715, "global_step": 17161, "epoch": 206} {"train_loss": -18.308197021484375, "global_step": 17162, "epoch": 206} {"train_loss": -17.969221115112305, "global_step": 17163, "epoch": 206} {"train_loss": -18.174169540405273, "global_step": 17164, "epoch": 206} {"train_loss": -18.221200942993164, "global_step": 17165, "epoch": 206} {"train_loss": -18.403553009033203, "global_step": 17166, "epoch": 206} {"train_loss": -17.966176986694336, "global_step": 17167, "epoch": 206} {"train_loss": -18.131006240844727, "global_step": 17168, "epoch": 206} {"train_loss": -18.155197143554688, "global_step": 17169, "epoch": 206} {"train_loss": -18.412261962890625, "global_step": 17170, "epoch": 206} {"train_loss": -18.420339584350586, "global_step": 17171, "epoch": 206} {"train_loss": -17.87288475036621, "global_step": 17172, "epoch": 206} {"train_loss": -18.119577407836914, "global_step": 17173, "epoch": 206} {"train_loss": -18.62354850769043, "global_step": 17174, "epoch": 206} {"train_loss": -18.203792572021484, "global_step": 17175, "epoch": 206} {"train_loss": -18.369314193725586, "global_step": 17176, "epoch": 206} {"train_loss": -18.06733512878418, "global_step": 17177, "epoch": 206} {"train_loss": -18.306171417236328, "global_step": 17178, "epoch": 206} {"train_loss": -18.332326889038086, "global_step": 17179, "epoch": 206} {"train_loss": -18.182948813380964, "global_step": 17180, "epoch": 206, "val_loss": 5992804.0} {"train_loss": -17.904653549194336, "global_step": 17181, "epoch": 207} {"train_loss": -17.98487663269043, "global_step": 17182, "epoch": 207} {"train_loss": -17.775909423828125, "global_step": 17183, "epoch": 207} {"train_loss": -18.37908363342285, "global_step": 17184, "epoch": 207} {"train_loss": -18.184003829956055, "global_step": 17185, "epoch": 207} {"train_loss": -18.227041244506836, "global_step": 17186, "epoch": 207} {"train_loss": -17.759552001953125, "global_step": 17187, "epoch": 207} {"train_loss": -18.077295303344727, "global_step": 17188, "epoch": 207} {"train_loss": -17.9852352142334, "global_step": 17189, "epoch": 207} {"train_loss": -17.85244369506836, "global_step": 17190, "epoch": 207} {"train_loss": -17.609256744384766, "global_step": 17191, "epoch": 207} {"train_loss": -18.333372116088867, "global_step": 17192, "epoch": 207} {"train_loss": -18.489395141601562, "global_step": 17193, "epoch": 207} {"train_loss": -18.260791778564453, "global_step": 17194, "epoch": 207} {"train_loss": -18.205049514770508, "global_step": 17195, "epoch": 207} {"train_loss": -18.020408630371094, "global_step": 17196, "epoch": 207} {"train_loss": -18.0109920501709, "global_step": 17197, "epoch": 207} {"train_loss": -17.889150619506836, "global_step": 17198, "epoch": 207} {"train_loss": -17.75420570373535, "global_step": 17199, "epoch": 207} {"train_loss": -18.44162368774414, "global_step": 17200, "epoch": 207} {"train_loss": -17.7091064453125, "global_step": 17201, "epoch": 207} {"train_loss": -18.341785430908203, "global_step": 17202, "epoch": 207} {"train_loss": -17.846546173095703, "global_step": 17203, "epoch": 207} {"train_loss": -18.06436538696289, "global_step": 17204, "epoch": 207} {"train_loss": -17.895395278930664, "global_step": 17205, "epoch": 207} {"train_loss": -17.93204689025879, "global_step": 17206, "epoch": 207} {"train_loss": -18.077838897705078, "global_step": 17207, "epoch": 207} {"train_loss": -18.367990493774414, "global_step": 17208, "epoch": 207} {"train_loss": -17.87442970275879, "global_step": 17209, "epoch": 207} {"train_loss": -17.906347274780273, "global_step": 17210, "epoch": 207} {"train_loss": -18.21398162841797, "global_step": 17211, "epoch": 207} {"train_loss": -17.87093734741211, "global_step": 17212, "epoch": 207} {"train_loss": -18.089162826538086, "global_step": 17213, "epoch": 207} {"train_loss": -18.069316864013672, "global_step": 17214, "epoch": 207} {"train_loss": -17.740835189819336, "global_step": 17215, "epoch": 207} {"train_loss": -18.11346435546875, "global_step": 17216, "epoch": 207} {"train_loss": -18.245153427124023, "global_step": 17217, "epoch": 207} {"train_loss": -17.987226486206055, "global_step": 17218, "epoch": 207} {"train_loss": -18.18450355529785, "global_step": 17219, "epoch": 207} {"train_loss": -18.476415634155273, "global_step": 17220, "epoch": 207} {"train_loss": -18.019094467163086, "global_step": 17221, "epoch": 207} {"train_loss": -18.113840103149414, "global_step": 17222, "epoch": 207} {"train_loss": -18.241830825805664, "global_step": 17223, "epoch": 207} {"train_loss": -18.274639129638672, "global_step": 17224, "epoch": 207} {"train_loss": -18.136884689331055, "global_step": 17225, "epoch": 207} {"train_loss": -18.413801193237305, "global_step": 17226, "epoch": 207} {"train_loss": -18.305856704711914, "global_step": 17227, "epoch": 207} {"train_loss": -17.958740234375, "global_step": 17228, "epoch": 207} {"train_loss": -18.19550895690918, "global_step": 17229, "epoch": 207} {"train_loss": -18.09223175048828, "global_step": 17230, "epoch": 207} {"train_loss": -17.8561954498291, "global_step": 17231, "epoch": 207} {"train_loss": -17.921920776367188, "global_step": 17232, "epoch": 207} {"train_loss": -17.94198989868164, "global_step": 17233, "epoch": 207} {"train_loss": -18.056617736816406, "global_step": 17234, "epoch": 207} {"train_loss": -17.987613677978516, "global_step": 17235, "epoch": 207} {"train_loss": -18.090576171875, "global_step": 17236, "epoch": 207} {"train_loss": -18.079587936401367, "global_step": 17237, "epoch": 207} {"train_loss": -18.132198333740234, "global_step": 17238, "epoch": 207} {"train_loss": -18.106096267700195, "global_step": 17239, "epoch": 207} {"train_loss": -18.20316505432129, "global_step": 17240, "epoch": 207} {"train_loss": -17.852548599243164, "global_step": 17241, "epoch": 207} {"train_loss": -18.66008949279785, "global_step": 17242, "epoch": 207} {"train_loss": -18.186471939086914, "global_step": 17243, "epoch": 207} {"train_loss": -17.921489715576172, "global_step": 17244, "epoch": 207} {"train_loss": -18.078174591064453, "global_step": 17245, "epoch": 207} {"train_loss": -17.607229232788086, "global_step": 17246, "epoch": 207} {"train_loss": -18.138690948486328, "global_step": 17247, "epoch": 207} {"train_loss": -18.294677734375, "global_step": 17248, "epoch": 207} {"train_loss": -18.556684494018555, "global_step": 17249, "epoch": 207} {"train_loss": -18.368661880493164, "global_step": 17250, "epoch": 207} {"train_loss": -18.211172103881836, "global_step": 17251, "epoch": 207} {"train_loss": -18.03558349609375, "global_step": 17252, "epoch": 207} {"train_loss": -18.318769454956055, "global_step": 17253, "epoch": 207} {"train_loss": -18.27895736694336, "global_step": 17254, "epoch": 207} {"train_loss": -18.204410552978516, "global_step": 17255, "epoch": 207} {"train_loss": -17.883163452148438, "global_step": 17256, "epoch": 207} {"train_loss": -17.938562393188477, "global_step": 17257, "epoch": 207} {"train_loss": -18.42693519592285, "global_step": 17258, "epoch": 207} {"train_loss": -18.395383834838867, "global_step": 17259, "epoch": 207} {"train_loss": -17.9538631439209, "global_step": 17260, "epoch": 207} {"train_loss": -17.977441787719727, "global_step": 17261, "epoch": 207} {"train_loss": -17.916271209716797, "global_step": 17262, "epoch": 207} {"train_loss": -18.091003349028437, "global_step": 17263, "epoch": 207, "val_loss": 6509725.0} {"train_loss": -17.213443756103516, "global_step": 17264, "epoch": 208} {"train_loss": -17.366304397583008, "global_step": 17265, "epoch": 208} {"train_loss": -17.699268341064453, "global_step": 17266, "epoch": 208} {"train_loss": -17.98711585998535, "global_step": 17267, "epoch": 208} {"train_loss": -17.823177337646484, "global_step": 17268, "epoch": 208} {"train_loss": -17.986988067626953, "global_step": 17269, "epoch": 208} {"train_loss": -17.7437801361084, "global_step": 17270, "epoch": 208} {"train_loss": -17.993131637573242, "global_step": 17271, "epoch": 208} {"train_loss": -17.48061180114746, "global_step": 17272, "epoch": 208} {"train_loss": -18.15011978149414, "global_step": 17273, "epoch": 208} {"train_loss": -17.95427894592285, "global_step": 17274, "epoch": 208} {"train_loss": -17.724563598632812, "global_step": 17275, "epoch": 208} {"train_loss": -18.157007217407227, "global_step": 17276, "epoch": 208} {"train_loss": -17.886383056640625, "global_step": 17277, "epoch": 208} {"train_loss": -17.97684097290039, "global_step": 17278, "epoch": 208} {"train_loss": -18.184799194335938, "global_step": 17279, "epoch": 208} {"train_loss": -17.656164169311523, "global_step": 17280, "epoch": 208} {"train_loss": -18.1086483001709, "global_step": 17281, "epoch": 208} {"train_loss": -17.829395294189453, "global_step": 17282, "epoch": 208} {"train_loss": -18.369308471679688, "global_step": 17283, "epoch": 208} {"train_loss": -18.042400360107422, "global_step": 17284, "epoch": 208} {"train_loss": -18.0426025390625, "global_step": 17285, "epoch": 208} {"train_loss": -18.349376678466797, "global_step": 17286, "epoch": 208} {"train_loss": -18.136106491088867, "global_step": 17287, "epoch": 208} {"train_loss": -18.505414962768555, "global_step": 17288, "epoch": 208} {"train_loss": -17.964811325073242, "global_step": 17289, "epoch": 208} {"train_loss": -18.074125289916992, "global_step": 17290, "epoch": 208} {"train_loss": -18.490896224975586, "global_step": 17291, "epoch": 208} {"train_loss": -18.122116088867188, "global_step": 17292, "epoch": 208} {"train_loss": -17.870838165283203, "global_step": 17293, "epoch": 208} {"train_loss": -18.16664695739746, "global_step": 17294, "epoch": 208} {"train_loss": -18.197818756103516, "global_step": 17295, "epoch": 208} {"train_loss": -17.985328674316406, "global_step": 17296, "epoch": 208} {"train_loss": -18.198856353759766, "global_step": 17297, "epoch": 208} {"train_loss": -18.123987197875977, "global_step": 17298, "epoch": 208} {"train_loss": -18.567869186401367, "global_step": 17299, "epoch": 208} {"train_loss": -18.273786544799805, "global_step": 17300, "epoch": 208} {"train_loss": -17.703327178955078, "global_step": 17301, "epoch": 208} {"train_loss": -18.125003814697266, "global_step": 17302, "epoch": 208} {"train_loss": -18.42580223083496, "global_step": 17303, "epoch": 208} {"train_loss": -18.044506072998047, "global_step": 17304, "epoch": 208} {"train_loss": -18.06727409362793, "global_step": 17305, "epoch": 208} {"train_loss": -18.42376136779785, "global_step": 17306, "epoch": 208} {"train_loss": -18.022937774658203, "global_step": 17307, "epoch": 208} {"train_loss": -18.367231369018555, "global_step": 17308, "epoch": 208} {"train_loss": -17.883821487426758, "global_step": 17309, "epoch": 208} {"train_loss": -18.231775283813477, "global_step": 17310, "epoch": 208} {"train_loss": -18.049869537353516, "global_step": 17311, "epoch": 208} {"train_loss": -17.519821166992188, "global_step": 17312, "epoch": 208} {"train_loss": -18.322721481323242, "global_step": 17313, "epoch": 208} {"train_loss": -18.293790817260742, "global_step": 17314, "epoch": 208} {"train_loss": -17.97776222229004, "global_step": 17315, "epoch": 208} {"train_loss": -18.19887924194336, "global_step": 17316, "epoch": 208} {"train_loss": -18.13495445251465, "global_step": 17317, "epoch": 208} {"train_loss": -18.25896644592285, "global_step": 17318, "epoch": 208} {"train_loss": -18.537527084350586, "global_step": 17319, "epoch": 208} {"train_loss": -18.455381393432617, "global_step": 17320, "epoch": 208} {"train_loss": -18.49323844909668, "global_step": 17321, "epoch": 208} {"train_loss": -18.433931350708008, "global_step": 17322, "epoch": 208} {"train_loss": -18.02528953552246, "global_step": 17323, "epoch": 208} {"train_loss": -18.076068878173828, "global_step": 17324, "epoch": 208} {"train_loss": -18.26715087890625, "global_step": 17325, "epoch": 208} {"train_loss": -18.038930892944336, "global_step": 17326, "epoch": 208} {"train_loss": -18.027103424072266, "global_step": 17327, "epoch": 208} {"train_loss": -18.302698135375977, "global_step": 17328, "epoch": 208} {"train_loss": -18.07019805908203, "global_step": 17329, "epoch": 208} {"train_loss": -18.146650314331055, "global_step": 17330, "epoch": 208} {"train_loss": -18.434471130371094, "global_step": 17331, "epoch": 208} {"train_loss": -18.070743560791016, "global_step": 17332, "epoch": 208} {"train_loss": -18.30340576171875, "global_step": 17333, "epoch": 208} {"train_loss": -17.840612411499023, "global_step": 17334, "epoch": 208} {"train_loss": -18.594099044799805, "global_step": 17335, "epoch": 208} {"train_loss": -18.58400535583496, "global_step": 17336, "epoch": 208} {"train_loss": -18.444122314453125, "global_step": 17337, "epoch": 208} {"train_loss": -18.40254020690918, "global_step": 17338, "epoch": 208} {"train_loss": -17.77559471130371, "global_step": 17339, "epoch": 208} {"train_loss": -18.26849365234375, "global_step": 17340, "epoch": 208} {"train_loss": -18.274621963500977, "global_step": 17341, "epoch": 208} {"train_loss": -17.973655700683594, "global_step": 17342, "epoch": 208} {"train_loss": -18.31906509399414, "global_step": 17343, "epoch": 208} {"train_loss": -18.27252769470215, "global_step": 17344, "epoch": 208} {"train_loss": -18.232173919677734, "global_step": 17345, "epoch": 208} {"train_loss": -18.127238537891802, "global_step": 17346, "epoch": 208, "val_loss": 5867597.0} {"train_loss": -18.206968307495117, "global_step": 17347, "epoch": 209} {"train_loss": -18.14873504638672, "global_step": 17348, "epoch": 209} {"train_loss": -18.051742553710938, "global_step": 17349, "epoch": 209} {"train_loss": -18.205408096313477, "global_step": 17350, "epoch": 209} {"train_loss": -18.39301300048828, "global_step": 17351, "epoch": 209} {"train_loss": -18.36652183532715, "global_step": 17352, "epoch": 209} {"train_loss": -17.88643455505371, "global_step": 17353, "epoch": 209} {"train_loss": -18.445810317993164, "global_step": 17354, "epoch": 209} {"train_loss": -18.27998924255371, "global_step": 17355, "epoch": 209} {"train_loss": -18.33082389831543, "global_step": 17356, "epoch": 209} {"train_loss": -18.282194137573242, "global_step": 17357, "epoch": 209} {"train_loss": -18.337125778198242, "global_step": 17358, "epoch": 209} {"train_loss": -18.179386138916016, "global_step": 17359, "epoch": 209} {"train_loss": -18.093019485473633, "global_step": 17360, "epoch": 209} {"train_loss": -18.679025650024414, "global_step": 17361, "epoch": 209} {"train_loss": -18.804773330688477, "global_step": 17362, "epoch": 209} {"train_loss": -18.528234481811523, "global_step": 17363, "epoch": 209} {"train_loss": -18.50174903869629, "global_step": 17364, "epoch": 209} {"train_loss": -18.199844360351562, "global_step": 17365, "epoch": 209} {"train_loss": -17.88857078552246, "global_step": 17366, "epoch": 209} {"train_loss": -18.18254852294922, "global_step": 17367, "epoch": 209} {"train_loss": -18.187667846679688, "global_step": 17368, "epoch": 209} {"train_loss": -18.36030387878418, "global_step": 17369, "epoch": 209} {"train_loss": -18.220924377441406, "global_step": 17370, "epoch": 209} {"train_loss": -18.05595588684082, "global_step": 17371, "epoch": 209} {"train_loss": -18.167564392089844, "global_step": 17372, "epoch": 209} {"train_loss": -18.430089950561523, "global_step": 17373, "epoch": 209} {"train_loss": -18.05182647705078, "global_step": 17374, "epoch": 209} {"train_loss": -18.37507438659668, "global_step": 17375, "epoch": 209} {"train_loss": -18.57269287109375, "global_step": 17376, "epoch": 209} {"train_loss": -18.2884578704834, "global_step": 17377, "epoch": 209} {"train_loss": -17.855148315429688, "global_step": 17378, "epoch": 209} {"train_loss": -18.568016052246094, "global_step": 17379, "epoch": 209} {"train_loss": -18.477405548095703, "global_step": 17380, "epoch": 209} {"train_loss": -18.16650390625, "global_step": 17381, "epoch": 209} {"train_loss": -18.510095596313477, "global_step": 17382, "epoch": 209} {"train_loss": -17.705121994018555, "global_step": 17383, "epoch": 209} {"train_loss": -18.818639755249023, "global_step": 17384, "epoch": 209} {"train_loss": -18.230335235595703, "global_step": 17385, "epoch": 209} {"train_loss": -18.335330963134766, "global_step": 17386, "epoch": 209} {"train_loss": -18.297353744506836, "global_step": 17387, "epoch": 209} {"train_loss": -18.297101974487305, "global_step": 17388, "epoch": 209} {"train_loss": -18.11805534362793, "global_step": 17389, "epoch": 209} {"train_loss": -18.164566040039062, "global_step": 17390, "epoch": 209} {"train_loss": -18.47484016418457, "global_step": 17391, "epoch": 209} {"train_loss": -18.275272369384766, "global_step": 17392, "epoch": 209} {"train_loss": -18.471302032470703, "global_step": 17393, "epoch": 209} {"train_loss": -18.385427474975586, "global_step": 17394, "epoch": 209} {"train_loss": -18.210556030273438, "global_step": 17395, "epoch": 209} {"train_loss": -18.22381591796875, "global_step": 17396, "epoch": 209} {"train_loss": -17.89666748046875, "global_step": 17397, "epoch": 209} {"train_loss": -18.061298370361328, "global_step": 17398, "epoch": 209} {"train_loss": -18.071929931640625, "global_step": 17399, "epoch": 209} {"train_loss": -18.281309127807617, "global_step": 17400, "epoch": 209} {"train_loss": -18.400650024414062, "global_step": 17401, "epoch": 209} {"train_loss": -18.000917434692383, "global_step": 17402, "epoch": 209} {"train_loss": -18.43564796447754, "global_step": 17403, "epoch": 209} {"train_loss": -18.308670043945312, "global_step": 17404, "epoch": 209} {"train_loss": -17.865177154541016, "global_step": 17405, "epoch": 209} {"train_loss": -18.181310653686523, "global_step": 17406, "epoch": 209} {"train_loss": -18.064626693725586, "global_step": 17407, "epoch": 209} {"train_loss": -18.195981979370117, "global_step": 17408, "epoch": 209} {"train_loss": -18.440811157226562, "global_step": 17409, "epoch": 209} {"train_loss": -18.642160415649414, "global_step": 17410, "epoch": 209} {"train_loss": -18.430830001831055, "global_step": 17411, "epoch": 209} {"train_loss": -18.246828079223633, "global_step": 17412, "epoch": 209} {"train_loss": -18.284852981567383, "global_step": 17413, "epoch": 209} {"train_loss": -18.02919578552246, "global_step": 17414, "epoch": 209} {"train_loss": -18.290307998657227, "global_step": 17415, "epoch": 209} {"train_loss": -18.278818130493164, "global_step": 17416, "epoch": 209} {"train_loss": -18.350692749023438, "global_step": 17417, "epoch": 209} {"train_loss": -18.2838191986084, "global_step": 17418, "epoch": 209} {"train_loss": -18.24947738647461, "global_step": 17419, "epoch": 209} {"train_loss": -18.187646865844727, "global_step": 17420, "epoch": 209} {"train_loss": -18.390583038330078, "global_step": 17421, "epoch": 209} {"train_loss": -18.273340225219727, "global_step": 17422, "epoch": 209} {"train_loss": -18.322765350341797, "global_step": 17423, "epoch": 209} {"train_loss": -18.091768264770508, "global_step": 17424, "epoch": 209} {"train_loss": -18.00620460510254, "global_step": 17425, "epoch": 209} {"train_loss": -17.924705505371094, "global_step": 17426, "epoch": 209} {"train_loss": -18.447540283203125, "global_step": 17427, "epoch": 209} {"train_loss": -18.1285457611084, "global_step": 17428, "epoch": 209} {"train_loss": -18.264851627579656, "global_step": 17429, "epoch": 209, "val_loss": 5757905.5} {"train_loss": -17.9748477935791, "global_step": 17430, "epoch": 210} {"train_loss": -18.0067195892334, "global_step": 17431, "epoch": 210} {"train_loss": -17.82605743408203, "global_step": 17432, "epoch": 210} {"train_loss": -17.97562026977539, "global_step": 17433, "epoch": 210} {"train_loss": -18.165403366088867, "global_step": 17434, "epoch": 210} {"train_loss": -17.74668312072754, "global_step": 17435, "epoch": 210} {"train_loss": -17.999576568603516, "global_step": 17436, "epoch": 210} {"train_loss": -18.3172664642334, "global_step": 17437, "epoch": 210} {"train_loss": -18.28605079650879, "global_step": 17438, "epoch": 210} {"train_loss": -18.25453758239746, "global_step": 17439, "epoch": 210} {"train_loss": -18.145278930664062, "global_step": 17440, "epoch": 210} {"train_loss": -17.8179988861084, "global_step": 17441, "epoch": 210} {"train_loss": -18.33056640625, "global_step": 17442, "epoch": 210} {"train_loss": -18.391958236694336, "global_step": 17443, "epoch": 210} {"train_loss": -18.340375900268555, "global_step": 17444, "epoch": 210} {"train_loss": -18.23996925354004, "global_step": 17445, "epoch": 210} {"train_loss": -18.23284912109375, "global_step": 17446, "epoch": 210} {"train_loss": -17.96061134338379, "global_step": 17447, "epoch": 210} {"train_loss": -18.03778648376465, "global_step": 17448, "epoch": 210} {"train_loss": -18.25680923461914, "global_step": 17449, "epoch": 210} {"train_loss": -18.346046447753906, "global_step": 17450, "epoch": 210} {"train_loss": -17.982078552246094, "global_step": 17451, "epoch": 210} {"train_loss": -18.14460563659668, "global_step": 17452, "epoch": 210} {"train_loss": -18.474992752075195, "global_step": 17453, "epoch": 210} {"train_loss": -18.46034049987793, "global_step": 17454, "epoch": 210} {"train_loss": -18.328664779663086, "global_step": 17455, "epoch": 210} {"train_loss": -18.216472625732422, "global_step": 17456, "epoch": 210} {"train_loss": -18.567739486694336, "global_step": 17457, "epoch": 210} {"train_loss": -18.70368766784668, "global_step": 17458, "epoch": 210} {"train_loss": -18.159423828125, "global_step": 17459, "epoch": 210} {"train_loss": -18.175987243652344, "global_step": 17460, "epoch": 210} {"train_loss": -18.31304931640625, "global_step": 17461, "epoch": 210} {"train_loss": -17.843448638916016, "global_step": 17462, "epoch": 210} {"train_loss": -18.209562301635742, "global_step": 17463, "epoch": 210} {"train_loss": -18.41495704650879, "global_step": 17464, "epoch": 210} {"train_loss": -18.620376586914062, "global_step": 17465, "epoch": 210} {"train_loss": -18.218015670776367, "global_step": 17466, "epoch": 210} {"train_loss": -17.955549240112305, "global_step": 17467, "epoch": 210} {"train_loss": -18.106250762939453, "global_step": 17468, "epoch": 210} {"train_loss": -18.6279239654541, "global_step": 17469, "epoch": 210} {"train_loss": -18.22977066040039, "global_step": 17470, "epoch": 210} {"train_loss": -17.690019607543945, "global_step": 17471, "epoch": 210} {"train_loss": -18.26654052734375, "global_step": 17472, "epoch": 210} {"train_loss": -18.050153732299805, "global_step": 17473, "epoch": 210} {"train_loss": -18.158817291259766, "global_step": 17474, "epoch": 210} {"train_loss": -18.244722366333008, "global_step": 17475, "epoch": 210} {"train_loss": -18.289600372314453, "global_step": 17476, "epoch": 210} {"train_loss": -18.220714569091797, "global_step": 17477, "epoch": 210} {"train_loss": -18.07284927368164, "global_step": 17478, "epoch": 210} {"train_loss": -18.444854736328125, "global_step": 17479, "epoch": 210} {"train_loss": -18.109352111816406, "global_step": 17480, "epoch": 210} {"train_loss": -18.64869499206543, "global_step": 17481, "epoch": 210} {"train_loss": -18.151941299438477, "global_step": 17482, "epoch": 210} {"train_loss": -18.15669059753418, "global_step": 17483, "epoch": 210} {"train_loss": -18.336450576782227, "global_step": 17484, "epoch": 210} {"train_loss": -18.248258590698242, "global_step": 17485, "epoch": 210} {"train_loss": -18.419052124023438, "global_step": 17486, "epoch": 210} {"train_loss": -18.37114906311035, "global_step": 17487, "epoch": 210} {"train_loss": -18.231369018554688, "global_step": 17488, "epoch": 210} {"train_loss": -18.46199607849121, "global_step": 17489, "epoch": 210} {"train_loss": -18.49403190612793, "global_step": 17490, "epoch": 210} {"train_loss": -18.6216983795166, "global_step": 17491, "epoch": 210} {"train_loss": -18.001142501831055, "global_step": 17492, "epoch": 210} {"train_loss": -18.296186447143555, "global_step": 17493, "epoch": 210} {"train_loss": -18.508087158203125, "global_step": 17494, "epoch": 210} {"train_loss": -18.77737808227539, "global_step": 17495, "epoch": 210} {"train_loss": -18.336593627929688, "global_step": 17496, "epoch": 210} {"train_loss": -18.323993682861328, "global_step": 17497, "epoch": 210} {"train_loss": -18.417051315307617, "global_step": 17498, "epoch": 210} {"train_loss": -18.24773597717285, "global_step": 17499, "epoch": 210} {"train_loss": -18.344511032104492, "global_step": 17500, "epoch": 210} {"train_loss": -18.224210739135742, "global_step": 17501, "epoch": 210} {"train_loss": -18.277359008789062, "global_step": 17502, "epoch": 210} {"train_loss": -18.39914894104004, "global_step": 17503, "epoch": 210} {"train_loss": -18.612289428710938, "global_step": 17504, "epoch": 210} {"train_loss": -18.293155670166016, "global_step": 17505, "epoch": 210} {"train_loss": -18.121347427368164, "global_step": 17506, "epoch": 210} {"train_loss": -18.136816024780273, "global_step": 17507, "epoch": 210} {"train_loss": -18.05209732055664, "global_step": 17508, "epoch": 210} {"train_loss": -18.00710105895996, "global_step": 17509, "epoch": 210} {"train_loss": -18.31789207458496, "global_step": 17510, "epoch": 210} {"train_loss": -18.24205780029297, "global_step": 17511, "epoch": 210} {"train_loss": -18.240303453192652, "global_step": 17512, "epoch": 210, "val_loss": 5977348.5} {"train_loss": -18.080623626708984, "global_step": 17513, "epoch": 211} {"train_loss": -18.35370445251465, "global_step": 17514, "epoch": 211} {"train_loss": -18.051950454711914, "global_step": 17515, "epoch": 211} {"train_loss": -18.290668487548828, "global_step": 17516, "epoch": 211} {"train_loss": -18.362356185913086, "global_step": 17517, "epoch": 211} {"train_loss": -18.1335506439209, "global_step": 17518, "epoch": 211} {"train_loss": -18.3251895904541, "global_step": 17519, "epoch": 211} {"train_loss": -18.213045120239258, "global_step": 17520, "epoch": 211} {"train_loss": -18.437061309814453, "global_step": 17521, "epoch": 211} {"train_loss": -18.276031494140625, "global_step": 17522, "epoch": 211} {"train_loss": -18.088224411010742, "global_step": 17523, "epoch": 211} {"train_loss": -18.48897933959961, "global_step": 17524, "epoch": 211} {"train_loss": -18.41082763671875, "global_step": 17525, "epoch": 211} {"train_loss": -18.2384090423584, "global_step": 17526, "epoch": 211} {"train_loss": -17.838022232055664, "global_step": 17527, "epoch": 211} {"train_loss": -18.224388122558594, "global_step": 17528, "epoch": 211} {"train_loss": -18.244382858276367, "global_step": 17529, "epoch": 211} {"train_loss": -18.401933670043945, "global_step": 17530, "epoch": 211} {"train_loss": -18.40323829650879, "global_step": 17531, "epoch": 211} {"train_loss": -17.816173553466797, "global_step": 17532, "epoch": 211} {"train_loss": -18.084489822387695, "global_step": 17533, "epoch": 211} {"train_loss": -18.092330932617188, "global_step": 17534, "epoch": 211} {"train_loss": -18.00782012939453, "global_step": 17535, "epoch": 211} {"train_loss": -18.448505401611328, "global_step": 17536, "epoch": 211} {"train_loss": -17.925613403320312, "global_step": 17537, "epoch": 211} {"train_loss": -18.318801879882812, "global_step": 17538, "epoch": 211} {"train_loss": -18.169414520263672, "global_step": 17539, "epoch": 211} {"train_loss": -18.361433029174805, "global_step": 17540, "epoch": 211} {"train_loss": -18.143356323242188, "global_step": 17541, "epoch": 211} {"train_loss": -18.415029525756836, "global_step": 17542, "epoch": 211} {"train_loss": -18.398609161376953, "global_step": 17543, "epoch": 211} {"train_loss": -18.333473205566406, "global_step": 17544, "epoch": 211} {"train_loss": -17.93370819091797, "global_step": 17545, "epoch": 211} {"train_loss": -18.336118698120117, "global_step": 17546, "epoch": 211} {"train_loss": -18.517807006835938, "global_step": 17547, "epoch": 211} {"train_loss": -18.365978240966797, "global_step": 17548, "epoch": 211} {"train_loss": -17.94160270690918, "global_step": 17549, "epoch": 211} {"train_loss": -18.20294761657715, "global_step": 17550, "epoch": 211} {"train_loss": -18.207698822021484, "global_step": 17551, "epoch": 211} {"train_loss": -18.404163360595703, "global_step": 17552, "epoch": 211} {"train_loss": -18.058948516845703, "global_step": 17553, "epoch": 211} {"train_loss": -18.336694717407227, "global_step": 17554, "epoch": 211} {"train_loss": -18.311033248901367, "global_step": 17555, "epoch": 211} {"train_loss": -18.48859214782715, "global_step": 17556, "epoch": 211} {"train_loss": -18.3147029876709, "global_step": 17557, "epoch": 211} {"train_loss": -18.77647590637207, "global_step": 17558, "epoch": 211} {"train_loss": -18.311622619628906, "global_step": 17559, "epoch": 211} {"train_loss": -17.94016456604004, "global_step": 17560, "epoch": 211} {"train_loss": -18.210697174072266, "global_step": 17561, "epoch": 211} {"train_loss": -18.31559181213379, "global_step": 17562, "epoch": 211} {"train_loss": -18.069467544555664, "global_step": 17563, "epoch": 211} {"train_loss": -18.01955223083496, "global_step": 17564, "epoch": 211} {"train_loss": -18.641016006469727, "global_step": 17565, "epoch": 211} {"train_loss": -18.510528564453125, "global_step": 17566, "epoch": 211} {"train_loss": -18.741437911987305, "global_step": 17567, "epoch": 211} {"train_loss": -18.76888084411621, "global_step": 17568, "epoch": 211} {"train_loss": -18.49802589416504, "global_step": 17569, "epoch": 211} {"train_loss": -18.260162353515625, "global_step": 17570, "epoch": 211} {"train_loss": -18.173473358154297, "global_step": 17571, "epoch": 211} {"train_loss": -18.49225616455078, "global_step": 17572, "epoch": 211} {"train_loss": -18.097335815429688, "global_step": 17573, "epoch": 211} {"train_loss": -18.278947830200195, "global_step": 17574, "epoch": 211} {"train_loss": -18.494077682495117, "global_step": 17575, "epoch": 211} {"train_loss": -18.291427612304688, "global_step": 17576, "epoch": 211} {"train_loss": -18.14939308166504, "global_step": 17577, "epoch": 211} {"train_loss": -18.391515731811523, "global_step": 17578, "epoch": 211} {"train_loss": -18.30950927734375, "global_step": 17579, "epoch": 211} {"train_loss": -18.330249786376953, "global_step": 17580, "epoch": 211} {"train_loss": -18.549097061157227, "global_step": 17581, "epoch": 211} {"train_loss": -18.783742904663086, "global_step": 17582, "epoch": 211} {"train_loss": -18.46536636352539, "global_step": 17583, "epoch": 211} {"train_loss": -18.32879066467285, "global_step": 17584, "epoch": 211} {"train_loss": -18.143390655517578, "global_step": 17585, "epoch": 211} {"train_loss": -18.333009719848633, "global_step": 17586, "epoch": 211} {"train_loss": -18.29414176940918, "global_step": 17587, "epoch": 211} {"train_loss": -17.84562110900879, "global_step": 17588, "epoch": 211} {"train_loss": -18.21822166442871, "global_step": 17589, "epoch": 211} {"train_loss": -18.17255401611328, "global_step": 17590, "epoch": 211} {"train_loss": -18.316007614135742, "global_step": 17591, "epoch": 211} {"train_loss": -18.24967384338379, "global_step": 17592, "epoch": 211} {"train_loss": -18.3366641998291, "global_step": 17593, "epoch": 211} {"train_loss": -18.022348403930664, "global_step": 17594, "epoch": 211} {"train_loss": -18.296235509665614, "global_step": 17595, "epoch": 211, "val_loss": 5798520.0} {"train_loss": -18.11116600036621, "global_step": 17596, "epoch": 212} {"train_loss": -18.424264907836914, "global_step": 17597, "epoch": 212} {"train_loss": -18.110015869140625, "global_step": 17598, "epoch": 212} {"train_loss": -18.399595260620117, "global_step": 17599, "epoch": 212} {"train_loss": -18.322912216186523, "global_step": 17600, "epoch": 212} {"train_loss": -18.14032554626465, "global_step": 17601, "epoch": 212} {"train_loss": -18.5751953125, "global_step": 17602, "epoch": 212} {"train_loss": -18.052221298217773, "global_step": 17603, "epoch": 212} {"train_loss": -17.874027252197266, "global_step": 17604, "epoch": 212} {"train_loss": -18.09600830078125, "global_step": 17605, "epoch": 212} {"train_loss": -18.35390281677246, "global_step": 17606, "epoch": 212} {"train_loss": -18.517440795898438, "global_step": 17607, "epoch": 212} {"train_loss": -18.435617446899414, "global_step": 17608, "epoch": 212} {"train_loss": -18.138296127319336, "global_step": 17609, "epoch": 212} {"train_loss": -18.33196258544922, "global_step": 17610, "epoch": 212} {"train_loss": -17.49384307861328, "global_step": 17611, "epoch": 212} {"train_loss": -18.027267456054688, "global_step": 17612, "epoch": 212} {"train_loss": -18.471233367919922, "global_step": 17613, "epoch": 212} {"train_loss": -17.818323135375977, "global_step": 17614, "epoch": 212} {"train_loss": -18.587026596069336, "global_step": 17615, "epoch": 212} {"train_loss": -18.197723388671875, "global_step": 17616, "epoch": 212} {"train_loss": -18.024850845336914, "global_step": 17617, "epoch": 212} {"train_loss": -18.26970863342285, "global_step": 17618, "epoch": 212} {"train_loss": -18.33293342590332, "global_step": 17619, "epoch": 212} {"train_loss": -18.246322631835938, "global_step": 17620, "epoch": 212} {"train_loss": -18.001663208007812, "global_step": 17621, "epoch": 212} {"train_loss": -18.29319190979004, "global_step": 17622, "epoch": 212} {"train_loss": -18.54070472717285, "global_step": 17623, "epoch": 212} {"train_loss": -18.46909523010254, "global_step": 17624, "epoch": 212} {"train_loss": -18.73103141784668, "global_step": 17625, "epoch": 212} {"train_loss": -18.154470443725586, "global_step": 17626, "epoch": 212} {"train_loss": -18.218734741210938, "global_step": 17627, "epoch": 212} {"train_loss": -18.274030685424805, "global_step": 17628, "epoch": 212} {"train_loss": -18.339357376098633, "global_step": 17629, "epoch": 212} {"train_loss": -18.319162368774414, "global_step": 17630, "epoch": 212} {"train_loss": -18.177734375, "global_step": 17631, "epoch": 212} {"train_loss": -17.644163131713867, "global_step": 17632, "epoch": 212} {"train_loss": -18.551557540893555, "global_step": 17633, "epoch": 212} {"train_loss": -18.863056182861328, "global_step": 17634, "epoch": 212} {"train_loss": -18.8311767578125, "global_step": 17635, "epoch": 212} {"train_loss": -18.014171600341797, "global_step": 17636, "epoch": 212} {"train_loss": -18.506610870361328, "global_step": 17637, "epoch": 212} {"train_loss": -18.05088233947754, "global_step": 17638, "epoch": 212} {"train_loss": -18.15705108642578, "global_step": 17639, "epoch": 212} {"train_loss": -18.458133697509766, "global_step": 17640, "epoch": 212} {"train_loss": -18.4799861907959, "global_step": 17641, "epoch": 212} {"train_loss": -18.47317123413086, "global_step": 17642, "epoch": 212} {"train_loss": -18.064289093017578, "global_step": 17643, "epoch": 212} {"train_loss": -18.40554428100586, "global_step": 17644, "epoch": 212} {"train_loss": -18.67537498474121, "global_step": 17645, "epoch": 212} {"train_loss": -18.307859420776367, "global_step": 17646, "epoch": 212} {"train_loss": -18.191953659057617, "global_step": 17647, "epoch": 212} {"train_loss": -18.370229721069336, "global_step": 17648, "epoch": 212} {"train_loss": -18.20669937133789, "global_step": 17649, "epoch": 212} {"train_loss": -18.544687271118164, "global_step": 17650, "epoch": 212} {"train_loss": -18.194721221923828, "global_step": 17651, "epoch": 212} {"train_loss": -18.44295310974121, "global_step": 17652, "epoch": 212} {"train_loss": -18.61297607421875, "global_step": 17653, "epoch": 212} {"train_loss": -18.5900821685791, "global_step": 17654, "epoch": 212} {"train_loss": -18.395475387573242, "global_step": 17655, "epoch": 212} {"train_loss": -18.298032760620117, "global_step": 17656, "epoch": 212} {"train_loss": -18.352231979370117, "global_step": 17657, "epoch": 212} {"train_loss": -17.67537498474121, "global_step": 17658, "epoch": 212} {"train_loss": -18.496610641479492, "global_step": 17659, "epoch": 212} {"train_loss": -18.618236541748047, "global_step": 17660, "epoch": 212} {"train_loss": -18.215625762939453, "global_step": 17661, "epoch": 212} {"train_loss": -17.881093978881836, "global_step": 17662, "epoch": 212} {"train_loss": -18.2179012298584, "global_step": 17663, "epoch": 212} {"train_loss": -18.29759407043457, "global_step": 17664, "epoch": 212} {"train_loss": -18.043983459472656, "global_step": 17665, "epoch": 212} {"train_loss": -18.447568893432617, "global_step": 17666, "epoch": 212} {"train_loss": -18.320526123046875, "global_step": 17667, "epoch": 212} {"train_loss": -18.226837158203125, "global_step": 17668, "epoch": 212} {"train_loss": -18.27467918395996, "global_step": 17669, "epoch": 212} {"train_loss": -18.205076217651367, "global_step": 17670, "epoch": 212} {"train_loss": -18.618257522583008, "global_step": 17671, "epoch": 212} {"train_loss": -17.897205352783203, "global_step": 17672, "epoch": 212} {"train_loss": -18.309110641479492, "global_step": 17673, "epoch": 212} {"train_loss": -18.178754806518555, "global_step": 17674, "epoch": 212} {"train_loss": -18.015439987182617, "global_step": 17675, "epoch": 212} {"train_loss": -18.349233627319336, "global_step": 17676, "epoch": 212} {"train_loss": -18.406843185424805, "global_step": 17677, "epoch": 212} {"train_loss": -18.290164028305604, "global_step": 17678, "epoch": 212, "val_loss": 5802562.5} {"train_loss": -18.213178634643555, "global_step": 17679, "epoch": 213} {"train_loss": -18.12837791442871, "global_step": 17680, "epoch": 213} {"train_loss": -18.475339889526367, "global_step": 17681, "epoch": 213} {"train_loss": -18.0470027923584, "global_step": 17682, "epoch": 213} {"train_loss": -18.205110549926758, "global_step": 17683, "epoch": 213} {"train_loss": -18.033735275268555, "global_step": 17684, "epoch": 213} {"train_loss": -18.220449447631836, "global_step": 17685, "epoch": 213} {"train_loss": -18.25311279296875, "global_step": 17686, "epoch": 213} {"train_loss": -18.294248580932617, "global_step": 17687, "epoch": 213} {"train_loss": -18.529144287109375, "global_step": 17688, "epoch": 213} {"train_loss": -18.317895889282227, "global_step": 17689, "epoch": 213} {"train_loss": -18.357641220092773, "global_step": 17690, "epoch": 213} {"train_loss": -18.314245223999023, "global_step": 17691, "epoch": 213} {"train_loss": -18.464420318603516, "global_step": 17692, "epoch": 213} {"train_loss": -18.42426109313965, "global_step": 17693, "epoch": 213} {"train_loss": -18.34220314025879, "global_step": 17694, "epoch": 213} {"train_loss": -18.18117332458496, "global_step": 17695, "epoch": 213} {"train_loss": -18.397085189819336, "global_step": 17696, "epoch": 213} {"train_loss": -18.681180953979492, "global_step": 17697, "epoch": 213} {"train_loss": -18.135902404785156, "global_step": 17698, "epoch": 213} {"train_loss": -18.39130210876465, "global_step": 17699, "epoch": 213} {"train_loss": -18.54096031188965, "global_step": 17700, "epoch": 213} {"train_loss": -17.959781646728516, "global_step": 17701, "epoch": 213} {"train_loss": -18.20194435119629, "global_step": 17702, "epoch": 213} {"train_loss": -18.172117233276367, "global_step": 17703, "epoch": 213} {"train_loss": -18.42151641845703, "global_step": 17704, "epoch": 213} {"train_loss": -18.235197067260742, "global_step": 17705, "epoch": 213} {"train_loss": -18.16845703125, "global_step": 17706, "epoch": 213} {"train_loss": -18.44732666015625, "global_step": 17707, "epoch": 213} {"train_loss": -18.359743118286133, "global_step": 17708, "epoch": 213} {"train_loss": -17.9503116607666, "global_step": 17709, "epoch": 213} {"train_loss": -18.023740768432617, "global_step": 17710, "epoch": 213} {"train_loss": -18.378475189208984, "global_step": 17711, "epoch": 213} {"train_loss": -18.1014461517334, "global_step": 17712, "epoch": 213} {"train_loss": -18.498519897460938, "global_step": 17713, "epoch": 213} {"train_loss": -18.2744197845459, "global_step": 17714, "epoch": 213} {"train_loss": -18.026227951049805, "global_step": 17715, "epoch": 213} {"train_loss": -18.3319034576416, "global_step": 17716, "epoch": 213} {"train_loss": -18.598608016967773, "global_step": 17717, "epoch": 213} {"train_loss": -18.131330490112305, "global_step": 17718, "epoch": 213} {"train_loss": -18.26104164123535, "global_step": 17719, "epoch": 213} {"train_loss": -18.201658248901367, "global_step": 17720, "epoch": 213} {"train_loss": -18.445804595947266, "global_step": 17721, "epoch": 213} {"train_loss": -18.255430221557617, "global_step": 17722, "epoch": 213} {"train_loss": -18.264509201049805, "global_step": 17723, "epoch": 213} {"train_loss": -18.761838912963867, "global_step": 17724, "epoch": 213} {"train_loss": -17.93334197998047, "global_step": 17725, "epoch": 213} {"train_loss": -18.24176597595215, "global_step": 17726, "epoch": 213} {"train_loss": -17.992382049560547, "global_step": 17727, "epoch": 213} {"train_loss": -18.3592472076416, "global_step": 17728, "epoch": 213} {"train_loss": -17.90887451171875, "global_step": 17729, "epoch": 213} {"train_loss": -18.31353759765625, "global_step": 17730, "epoch": 213} {"train_loss": -18.27496337890625, "global_step": 17731, "epoch": 213} {"train_loss": -18.184181213378906, "global_step": 17732, "epoch": 213} {"train_loss": -18.27644920349121, "global_step": 17733, "epoch": 213} {"train_loss": -18.155250549316406, "global_step": 17734, "epoch": 213} {"train_loss": -18.3892879486084, "global_step": 17735, "epoch": 213} {"train_loss": -18.33301544189453, "global_step": 17736, "epoch": 213} {"train_loss": -18.372587203979492, "global_step": 17737, "epoch": 213} {"train_loss": -18.311193466186523, "global_step": 17738, "epoch": 213} {"train_loss": -18.121036529541016, "global_step": 17739, "epoch": 213} {"train_loss": -18.15760612487793, "global_step": 17740, "epoch": 213} {"train_loss": -18.454193115234375, "global_step": 17741, "epoch": 213} {"train_loss": -18.5167236328125, "global_step": 17742, "epoch": 213} {"train_loss": -18.490610122680664, "global_step": 17743, "epoch": 213} {"train_loss": -18.06858253479004, "global_step": 17744, "epoch": 213} {"train_loss": -18.47237777709961, "global_step": 17745, "epoch": 213} {"train_loss": -18.430879592895508, "global_step": 17746, "epoch": 213} {"train_loss": -18.542184829711914, "global_step": 17747, "epoch": 213} {"train_loss": -18.355613708496094, "global_step": 17748, "epoch": 213} {"train_loss": -18.435237884521484, "global_step": 17749, "epoch": 213} {"train_loss": -18.65993309020996, "global_step": 17750, "epoch": 213} {"train_loss": -18.607084274291992, "global_step": 17751, "epoch": 213} {"train_loss": -17.893749237060547, "global_step": 17752, "epoch": 213} {"train_loss": -18.19237518310547, "global_step": 17753, "epoch": 213} {"train_loss": -18.382953643798828, "global_step": 17754, "epoch": 213} {"train_loss": -18.775634765625, "global_step": 17755, "epoch": 213} {"train_loss": -18.509246826171875, "global_step": 17756, "epoch": 213} {"train_loss": -18.124126434326172, "global_step": 17757, "epoch": 213} {"train_loss": -18.076457977294922, "global_step": 17758, "epoch": 213} {"train_loss": -18.47650718688965, "global_step": 17759, "epoch": 213} {"train_loss": -18.231481552124023, "global_step": 17760, "epoch": 213} {"train_loss": -18.292891008308136, "global_step": 17761, "epoch": 213, "val_loss": 5896533.5} {"train_loss": -18.568363189697266, "global_step": 17762, "epoch": 214} {"train_loss": -18.254798889160156, "global_step": 17763, "epoch": 214} {"train_loss": -18.269742965698242, "global_step": 17764, "epoch": 214} {"train_loss": -18.173053741455078, "global_step": 17765, "epoch": 214} {"train_loss": -18.241849899291992, "global_step": 17766, "epoch": 214} {"train_loss": -18.470247268676758, "global_step": 17767, "epoch": 214} {"train_loss": -18.399938583374023, "global_step": 17768, "epoch": 214} {"train_loss": -17.917665481567383, "global_step": 17769, "epoch": 214} {"train_loss": -18.065963745117188, "global_step": 17770, "epoch": 214} {"train_loss": -18.55998420715332, "global_step": 17771, "epoch": 214} {"train_loss": -18.346473693847656, "global_step": 17772, "epoch": 214} {"train_loss": -18.26949119567871, "global_step": 17773, "epoch": 214} {"train_loss": -18.578527450561523, "global_step": 17774, "epoch": 214} {"train_loss": -18.36207389831543, "global_step": 17775, "epoch": 214} {"train_loss": -18.141016006469727, "global_step": 17776, "epoch": 214} {"train_loss": -18.378324508666992, "global_step": 17777, "epoch": 214} {"train_loss": -18.00240135192871, "global_step": 17778, "epoch": 214} {"train_loss": -18.393524169921875, "global_step": 17779, "epoch": 214} {"train_loss": -18.34537696838379, "global_step": 17780, "epoch": 214} {"train_loss": -18.311161041259766, "global_step": 17781, "epoch": 214} {"train_loss": -18.451801300048828, "global_step": 17782, "epoch": 214} {"train_loss": -18.506879806518555, "global_step": 17783, "epoch": 214} {"train_loss": -18.186899185180664, "global_step": 17784, "epoch": 214} {"train_loss": -18.420392990112305, "global_step": 17785, "epoch": 214} {"train_loss": -17.820972442626953, "global_step": 17786, "epoch": 214} {"train_loss": -18.3038387298584, "global_step": 17787, "epoch": 214} {"train_loss": -18.306921005249023, "global_step": 17788, "epoch": 214} {"train_loss": -18.257009506225586, "global_step": 17789, "epoch": 214} {"train_loss": -18.2849178314209, "global_step": 17790, "epoch": 214} {"train_loss": -17.82756996154785, "global_step": 17791, "epoch": 214} {"train_loss": -18.124164581298828, "global_step": 17792, "epoch": 214} {"train_loss": -18.483240127563477, "global_step": 17793, "epoch": 214} {"train_loss": -18.262115478515625, "global_step": 17794, "epoch": 214} {"train_loss": -18.202587127685547, "global_step": 17795, "epoch": 214} {"train_loss": -18.101957321166992, "global_step": 17796, "epoch": 214} {"train_loss": -18.464385986328125, "global_step": 17797, "epoch": 214} {"train_loss": -18.342679977416992, "global_step": 17798, "epoch": 214} {"train_loss": -18.209121704101562, "global_step": 17799, "epoch": 214} {"train_loss": -18.690797805786133, "global_step": 17800, "epoch": 214} {"train_loss": -18.248214721679688, "global_step": 17801, "epoch": 214} {"train_loss": -18.39055824279785, "global_step": 17802, "epoch": 214} {"train_loss": -18.251201629638672, "global_step": 17803, "epoch": 214} {"train_loss": -18.64344596862793, "global_step": 17804, "epoch": 214} {"train_loss": -18.33608055114746, "global_step": 17805, "epoch": 214} {"train_loss": -18.322154998779297, "global_step": 17806, "epoch": 214} {"train_loss": -18.3602237701416, "global_step": 17807, "epoch": 214} {"train_loss": -18.209976196289062, "global_step": 17808, "epoch": 214} {"train_loss": -18.139616012573242, "global_step": 17809, "epoch": 214} {"train_loss": -18.052749633789062, "global_step": 17810, "epoch": 214} {"train_loss": -18.707847595214844, "global_step": 17811, "epoch": 214} {"train_loss": -18.16232681274414, "global_step": 17812, "epoch": 214} {"train_loss": -18.432483673095703, "global_step": 17813, "epoch": 214} {"train_loss": -18.120420455932617, "global_step": 17814, "epoch": 214} {"train_loss": -18.387662887573242, "global_step": 17815, "epoch": 214} {"train_loss": -18.356159210205078, "global_step": 17816, "epoch": 214} {"train_loss": -18.346786499023438, "global_step": 17817, "epoch": 214} {"train_loss": -18.399023056030273, "global_step": 17818, "epoch": 214} {"train_loss": -18.378015518188477, "global_step": 17819, "epoch": 214} {"train_loss": -18.202869415283203, "global_step": 17820, "epoch": 214} {"train_loss": -18.856199264526367, "global_step": 17821, "epoch": 214} {"train_loss": -18.370880126953125, "global_step": 17822, "epoch": 214} {"train_loss": -18.448270797729492, "global_step": 17823, "epoch": 214} {"train_loss": -18.313440322875977, "global_step": 17824, "epoch": 214} {"train_loss": -18.765478134155273, "global_step": 17825, "epoch": 214} {"train_loss": -18.190229415893555, "global_step": 17826, "epoch": 214} {"train_loss": -18.25617027282715, "global_step": 17827, "epoch": 214} {"train_loss": -18.511865615844727, "global_step": 17828, "epoch": 214} {"train_loss": -18.39393424987793, "global_step": 17829, "epoch": 214} {"train_loss": -18.402769088745117, "global_step": 17830, "epoch": 214} {"train_loss": -18.184158325195312, "global_step": 17831, "epoch": 214} {"train_loss": -18.673776626586914, "global_step": 17832, "epoch": 214} {"train_loss": -18.59078025817871, "global_step": 17833, "epoch": 214} {"train_loss": -18.483078002929688, "global_step": 17834, "epoch": 214} {"train_loss": -18.06441307067871, "global_step": 17835, "epoch": 214} {"train_loss": -18.065519332885742, "global_step": 17836, "epoch": 214} {"train_loss": -17.93825912475586, "global_step": 17837, "epoch": 214} {"train_loss": -17.860828399658203, "global_step": 17838, "epoch": 214} {"train_loss": -18.530200958251953, "global_step": 17839, "epoch": 214} {"train_loss": -18.422534942626953, "global_step": 17840, "epoch": 214} {"train_loss": -18.016860961914062, "global_step": 17841, "epoch": 214} {"train_loss": -18.181032180786133, "global_step": 17842, "epoch": 214} {"train_loss": -18.1606388092041, "global_step": 17843, "epoch": 214} {"train_loss": -18.32622408579631, "global_step": 17844, "epoch": 214, "val_loss": 5702824.0} {"train_loss": -18.05040740966797, "global_step": 17845, "epoch": 215} {"train_loss": -18.722736358642578, "global_step": 17846, "epoch": 215} {"train_loss": -18.276874542236328, "global_step": 17847, "epoch": 215} {"train_loss": -18.49140739440918, "global_step": 17848, "epoch": 215} {"train_loss": -18.28817367553711, "global_step": 17849, "epoch": 215} {"train_loss": -18.279254913330078, "global_step": 17850, "epoch": 215} {"train_loss": -18.464954376220703, "global_step": 17851, "epoch": 215} {"train_loss": -18.362276077270508, "global_step": 17852, "epoch": 215} {"train_loss": -18.372051239013672, "global_step": 17853, "epoch": 215} {"train_loss": -18.147905349731445, "global_step": 17854, "epoch": 215} {"train_loss": -17.93998146057129, "global_step": 17855, "epoch": 215} {"train_loss": -18.56685447692871, "global_step": 17856, "epoch": 215} {"train_loss": -18.263742446899414, "global_step": 17857, "epoch": 215} {"train_loss": -18.00746726989746, "global_step": 17858, "epoch": 215} {"train_loss": -18.117280960083008, "global_step": 17859, "epoch": 215} {"train_loss": -18.185482025146484, "global_step": 17860, "epoch": 215} {"train_loss": -18.416128158569336, "global_step": 17861, "epoch": 215} {"train_loss": -18.095443725585938, "global_step": 17862, "epoch": 215} {"train_loss": -18.59600257873535, "global_step": 17863, "epoch": 215} {"train_loss": -18.0831298828125, "global_step": 17864, "epoch": 215} {"train_loss": -18.83492088317871, "global_step": 17865, "epoch": 215} {"train_loss": -18.07740592956543, "global_step": 17866, "epoch": 215} {"train_loss": -18.39911460876465, "global_step": 17867, "epoch": 215} {"train_loss": -18.433996200561523, "global_step": 17868, "epoch": 215} {"train_loss": -18.234724044799805, "global_step": 17869, "epoch": 215} {"train_loss": -18.040857315063477, "global_step": 17870, "epoch": 215} {"train_loss": -18.290647506713867, "global_step": 17871, "epoch": 215} {"train_loss": -18.302946090698242, "global_step": 17872, "epoch": 215} {"train_loss": -18.17500114440918, "global_step": 17873, "epoch": 215} {"train_loss": -18.530500411987305, "global_step": 17874, "epoch": 215} {"train_loss": -18.357358932495117, "global_step": 17875, "epoch": 215} {"train_loss": -18.07213592529297, "global_step": 17876, "epoch": 215} {"train_loss": -18.134366989135742, "global_step": 17877, "epoch": 215} {"train_loss": -18.157827377319336, "global_step": 17878, "epoch": 215} {"train_loss": -18.37742805480957, "global_step": 17879, "epoch": 215} {"train_loss": -18.262226104736328, "global_step": 17880, "epoch": 215} {"train_loss": -18.64444923400879, "global_step": 17881, "epoch": 215} {"train_loss": -17.99774169921875, "global_step": 17882, "epoch": 215} {"train_loss": -18.125749588012695, "global_step": 17883, "epoch": 215} {"train_loss": -18.313161849975586, "global_step": 17884, "epoch": 215} {"train_loss": -18.281612396240234, "global_step": 17885, "epoch": 215} {"train_loss": -18.334135055541992, "global_step": 17886, "epoch": 215} {"train_loss": -18.552928924560547, "global_step": 17887, "epoch": 215} {"train_loss": -18.21394920349121, "global_step": 17888, "epoch": 215} {"train_loss": -18.342355728149414, "global_step": 17889, "epoch": 215} {"train_loss": -18.6628360748291, "global_step": 17890, "epoch": 215} {"train_loss": -18.23895263671875, "global_step": 17891, "epoch": 215} {"train_loss": -18.259323120117188, "global_step": 17892, "epoch": 215} {"train_loss": -18.25599479675293, "global_step": 17893, "epoch": 215} {"train_loss": -18.128875732421875, "global_step": 17894, "epoch": 215} {"train_loss": -18.264448165893555, "global_step": 17895, "epoch": 215} {"train_loss": -18.373313903808594, "global_step": 17896, "epoch": 215} {"train_loss": -18.17730140686035, "global_step": 17897, "epoch": 215} {"train_loss": -18.33414077758789, "global_step": 17898, "epoch": 215} {"train_loss": -18.587478637695312, "global_step": 17899, "epoch": 215} {"train_loss": -18.39227294921875, "global_step": 17900, "epoch": 215} {"train_loss": -18.473867416381836, "global_step": 17901, "epoch": 215} {"train_loss": -18.23872184753418, "global_step": 17902, "epoch": 215} {"train_loss": -18.423545837402344, "global_step": 17903, "epoch": 215} {"train_loss": -18.368324279785156, "global_step": 17904, "epoch": 215} {"train_loss": -18.087858200073242, "global_step": 17905, "epoch": 215} {"train_loss": -18.49601173400879, "global_step": 17906, "epoch": 215} {"train_loss": -18.156158447265625, "global_step": 17907, "epoch": 215} {"train_loss": -18.184804916381836, "global_step": 17908, "epoch": 215} {"train_loss": -18.531023025512695, "global_step": 17909, "epoch": 215} {"train_loss": -18.34625816345215, "global_step": 17910, "epoch": 215} {"train_loss": -18.550922393798828, "global_step": 17911, "epoch": 215} {"train_loss": -18.060277938842773, "global_step": 17912, "epoch": 215} {"train_loss": -18.312936782836914, "global_step": 17913, "epoch": 215} {"train_loss": -18.221651077270508, "global_step": 17914, "epoch": 215} {"train_loss": -18.11676025390625, "global_step": 17915, "epoch": 215} {"train_loss": -18.696044921875, "global_step": 17916, "epoch": 215} {"train_loss": -18.08479881286621, "global_step": 17917, "epoch": 215} {"train_loss": -18.130443572998047, "global_step": 17918, "epoch": 215} {"train_loss": -18.25582504272461, "global_step": 17919, "epoch": 215} {"train_loss": -18.168302536010742, "global_step": 17920, "epoch": 215} {"train_loss": -18.567670822143555, "global_step": 17921, "epoch": 215} {"train_loss": -18.664731979370117, "global_step": 17922, "epoch": 215} {"train_loss": -18.11031150817871, "global_step": 17923, "epoch": 215} {"train_loss": -18.097272872924805, "global_step": 17924, "epoch": 215} {"train_loss": -18.4310359954834, "global_step": 17925, "epoch": 215} {"train_loss": -18.192066192626953, "global_step": 17926, "epoch": 215} {"train_loss": -18.31357852522149, "global_step": 17927, "epoch": 215, "val_loss": 5780224.5} {"train_loss": -18.071346282958984, "global_step": 17928, "epoch": 216} {"train_loss": -17.95808219909668, "global_step": 17929, "epoch": 216} {"train_loss": -18.032550811767578, "global_step": 17930, "epoch": 216} {"train_loss": -18.567312240600586, "global_step": 17931, "epoch": 216} {"train_loss": -18.32240104675293, "global_step": 17932, "epoch": 216} {"train_loss": -18.04500389099121, "global_step": 17933, "epoch": 216} {"train_loss": -18.335119247436523, "global_step": 17934, "epoch": 216} {"train_loss": -18.29526710510254, "global_step": 17935, "epoch": 216} {"train_loss": -18.142398834228516, "global_step": 17936, "epoch": 216} {"train_loss": -18.497390747070312, "global_step": 17937, "epoch": 216} {"train_loss": -18.286163330078125, "global_step": 17938, "epoch": 216} {"train_loss": -18.385848999023438, "global_step": 17939, "epoch": 216} {"train_loss": -18.265043258666992, "global_step": 17940, "epoch": 216} {"train_loss": -18.850528717041016, "global_step": 17941, "epoch": 216} {"train_loss": -18.04096031188965, "global_step": 17942, "epoch": 216} {"train_loss": -18.633644104003906, "global_step": 17943, "epoch": 216} {"train_loss": -18.486351013183594, "global_step": 17944, "epoch": 216} {"train_loss": -18.223848342895508, "global_step": 17945, "epoch": 216} {"train_loss": -18.18647003173828, "global_step": 17946, "epoch": 216} {"train_loss": -18.407026290893555, "global_step": 17947, "epoch": 216} {"train_loss": -18.67124366760254, "global_step": 17948, "epoch": 216} {"train_loss": -18.64173698425293, "global_step": 17949, "epoch": 216} {"train_loss": -18.471988677978516, "global_step": 17950, "epoch": 216} {"train_loss": -18.285831451416016, "global_step": 17951, "epoch": 216} {"train_loss": -18.269535064697266, "global_step": 17952, "epoch": 216} {"train_loss": -18.2781982421875, "global_step": 17953, "epoch": 216} {"train_loss": -18.026546478271484, "global_step": 17954, "epoch": 216} {"train_loss": -18.44632911682129, "global_step": 17955, "epoch": 216} {"train_loss": -18.055952072143555, "global_step": 17956, "epoch": 216} {"train_loss": -18.25107765197754, "global_step": 17957, "epoch": 216} {"train_loss": -18.026073455810547, "global_step": 17958, "epoch": 216} {"train_loss": -18.167890548706055, "global_step": 17959, "epoch": 216} {"train_loss": -18.114599227905273, "global_step": 17960, "epoch": 216} {"train_loss": -18.60443687438965, "global_step": 17961, "epoch": 216} {"train_loss": -17.89216423034668, "global_step": 17962, "epoch": 216} {"train_loss": -17.98062515258789, "global_step": 17963, "epoch": 216} {"train_loss": -18.351831436157227, "global_step": 17964, "epoch": 216} {"train_loss": -18.13018226623535, "global_step": 17965, "epoch": 216} {"train_loss": -18.457914352416992, "global_step": 17966, "epoch": 216} {"train_loss": -18.353126525878906, "global_step": 17967, "epoch": 216} {"train_loss": -18.144697189331055, "global_step": 17968, "epoch": 216} {"train_loss": -18.476669311523438, "global_step": 17969, "epoch": 216} {"train_loss": -18.125577926635742, "global_step": 17970, "epoch": 216} {"train_loss": -18.158639907836914, "global_step": 17971, "epoch": 216} {"train_loss": -18.320079803466797, "global_step": 17972, "epoch": 216} {"train_loss": -18.09463882446289, "global_step": 17973, "epoch": 216} {"train_loss": -18.387266159057617, "global_step": 17974, "epoch": 216} {"train_loss": -18.197065353393555, "global_step": 17975, "epoch": 216} {"train_loss": -18.427785873413086, "global_step": 17976, "epoch": 216} {"train_loss": -18.316553115844727, "global_step": 17977, "epoch": 216} {"train_loss": -18.505084991455078, "global_step": 17978, "epoch": 216} {"train_loss": -18.400671005249023, "global_step": 17979, "epoch": 216} {"train_loss": -18.466827392578125, "global_step": 17980, "epoch": 216} {"train_loss": -18.500574111938477, "global_step": 17981, "epoch": 216} {"train_loss": -18.335447311401367, "global_step": 17982, "epoch": 216} {"train_loss": -18.539640426635742, "global_step": 17983, "epoch": 216} {"train_loss": -18.32869529724121, "global_step": 17984, "epoch": 216} {"train_loss": -18.043739318847656, "global_step": 17985, "epoch": 216} {"train_loss": -18.5251407623291, "global_step": 17986, "epoch": 216} {"train_loss": -18.092254638671875, "global_step": 17987, "epoch": 216} {"train_loss": -17.95652198791504, "global_step": 17988, "epoch": 216} {"train_loss": -18.484628677368164, "global_step": 17989, "epoch": 216} {"train_loss": -18.32600212097168, "global_step": 17990, "epoch": 216} {"train_loss": -18.258466720581055, "global_step": 17991, "epoch": 216} {"train_loss": -18.41708755493164, "global_step": 17992, "epoch": 216} {"train_loss": -18.2965030670166, "global_step": 17993, "epoch": 216} {"train_loss": -18.090850830078125, "global_step": 17994, "epoch": 216} {"train_loss": -18.327590942382812, "global_step": 17995, "epoch": 216} {"train_loss": -18.682859420776367, "global_step": 17996, "epoch": 216} {"train_loss": -18.603548049926758, "global_step": 17997, "epoch": 216} {"train_loss": -18.472490310668945, "global_step": 17998, "epoch": 216} {"train_loss": -18.242849349975586, "global_step": 17999, "epoch": 216} {"train_loss": -18.146879196166992, "global_step": 18000, "epoch": 216} {"train_loss": -18.354604721069336, "global_step": 18001, "epoch": 216} {"train_loss": -18.44081687927246, "global_step": 18002, "epoch": 216} {"train_loss": -18.14591407775879, "global_step": 18003, "epoch": 216} {"train_loss": -18.44767189025879, "global_step": 18004, "epoch": 216} {"train_loss": -18.62318992614746, "global_step": 18005, "epoch": 216} {"train_loss": -18.26970863342285, "global_step": 18006, "epoch": 216} {"train_loss": -18.06435203552246, "global_step": 18007, "epoch": 216} {"train_loss": -18.09646987915039, "global_step": 18008, "epoch": 216} {"train_loss": -18.54227638244629, "global_step": 18009, "epoch": 216} {"train_loss": -18.31165168946048, "global_step": 18010, "epoch": 216, "val_loss": 5977351.5} {"train_loss": -17.769084930419922, "global_step": 18011, "epoch": 217} {"train_loss": -18.65791893005371, "global_step": 18012, "epoch": 217} {"train_loss": -18.044233322143555, "global_step": 18013, "epoch": 217} {"train_loss": -18.156375885009766, "global_step": 18014, "epoch": 217} {"train_loss": -18.126737594604492, "global_step": 18015, "epoch": 217} {"train_loss": -18.003002166748047, "global_step": 18016, "epoch": 217} {"train_loss": -18.038816452026367, "global_step": 18017, "epoch": 217} {"train_loss": -18.68393898010254, "global_step": 18018, "epoch": 217} {"train_loss": -17.93036460876465, "global_step": 18019, "epoch": 217} {"train_loss": -17.861846923828125, "global_step": 18020, "epoch": 217} {"train_loss": -18.044179916381836, "global_step": 18021, "epoch": 217} {"train_loss": -18.707265853881836, "global_step": 18022, "epoch": 217} {"train_loss": -17.864971160888672, "global_step": 18023, "epoch": 217} {"train_loss": -17.899587631225586, "global_step": 18024, "epoch": 217} {"train_loss": -17.969358444213867, "global_step": 18025, "epoch": 217} {"train_loss": -17.978761672973633, "global_step": 18026, "epoch": 217} {"train_loss": -18.159250259399414, "global_step": 18027, "epoch": 217} {"train_loss": -18.454299926757812, "global_step": 18028, "epoch": 217} {"train_loss": -18.345584869384766, "global_step": 18029, "epoch": 217} {"train_loss": -18.205522537231445, "global_step": 18030, "epoch": 217} {"train_loss": -18.525636672973633, "global_step": 18031, "epoch": 217} {"train_loss": -18.067201614379883, "global_step": 18032, "epoch": 217} {"train_loss": -18.175024032592773, "global_step": 18033, "epoch": 217} {"train_loss": -18.222274780273438, "global_step": 18034, "epoch": 217} {"train_loss": -18.351184844970703, "global_step": 18035, "epoch": 217} {"train_loss": -18.240293502807617, "global_step": 18036, "epoch": 217} {"train_loss": -18.33367156982422, "global_step": 18037, "epoch": 217} {"train_loss": -18.4896297454834, "global_step": 18038, "epoch": 217} {"train_loss": -18.126066207885742, "global_step": 18039, "epoch": 217} {"train_loss": -18.26066017150879, "global_step": 18040, "epoch": 217} {"train_loss": -18.417394638061523, "global_step": 18041, "epoch": 217} {"train_loss": -18.376890182495117, "global_step": 18042, "epoch": 217} {"train_loss": -18.323705673217773, "global_step": 18043, "epoch": 217} {"train_loss": -18.50619888305664, "global_step": 18044, "epoch": 217} {"train_loss": -18.413305282592773, "global_step": 18045, "epoch": 217} {"train_loss": -18.338680267333984, "global_step": 18046, "epoch": 217} {"train_loss": -18.378143310546875, "global_step": 18047, "epoch": 217} {"train_loss": -18.31377601623535, "global_step": 18048, "epoch": 217} {"train_loss": -18.100431442260742, "global_step": 18049, "epoch": 217} {"train_loss": -18.22316551208496, "global_step": 18050, "epoch": 217} {"train_loss": -17.95197868347168, "global_step": 18051, "epoch": 217} {"train_loss": -18.4457950592041, "global_step": 18052, "epoch": 217} {"train_loss": -18.40775489807129, "global_step": 18053, "epoch": 217} {"train_loss": -18.58005142211914, "global_step": 18054, "epoch": 217} {"train_loss": -18.264789581298828, "global_step": 18055, "epoch": 217} {"train_loss": -18.563398361206055, "global_step": 18056, "epoch": 217} {"train_loss": -18.37152099609375, "global_step": 18057, "epoch": 217} {"train_loss": -17.956411361694336, "global_step": 18058, "epoch": 217} {"train_loss": -18.420652389526367, "global_step": 18059, "epoch": 217} {"train_loss": -18.712575912475586, "global_step": 18060, "epoch": 217} {"train_loss": -18.462745666503906, "global_step": 18061, "epoch": 217} {"train_loss": -18.291807174682617, "global_step": 18062, "epoch": 217} {"train_loss": -18.319015502929688, "global_step": 18063, "epoch": 217} {"train_loss": -18.104978561401367, "global_step": 18064, "epoch": 217} {"train_loss": -18.413957595825195, "global_step": 18065, "epoch": 217} {"train_loss": -18.521535873413086, "global_step": 18066, "epoch": 217} {"train_loss": -18.396549224853516, "global_step": 18067, "epoch": 217} {"train_loss": -18.348379135131836, "global_step": 18068, "epoch": 217} {"train_loss": -18.21935272216797, "global_step": 18069, "epoch": 217} {"train_loss": -18.51889419555664, "global_step": 18070, "epoch": 217} {"train_loss": -18.380786895751953, "global_step": 18071, "epoch": 217} {"train_loss": -18.155485153198242, "global_step": 18072, "epoch": 217} {"train_loss": -18.558012008666992, "global_step": 18073, "epoch": 217} {"train_loss": -18.604856491088867, "global_step": 18074, "epoch": 217} {"train_loss": -18.196455001831055, "global_step": 18075, "epoch": 217} {"train_loss": -18.504369735717773, "global_step": 18076, "epoch": 217} {"train_loss": -18.480039596557617, "global_step": 18077, "epoch": 217} {"train_loss": -18.250364303588867, "global_step": 18078, "epoch": 217} {"train_loss": -18.323392868041992, "global_step": 18079, "epoch": 217} {"train_loss": -18.449308395385742, "global_step": 18080, "epoch": 217} {"train_loss": -18.224225997924805, "global_step": 18081, "epoch": 217} {"train_loss": -18.343931198120117, "global_step": 18082, "epoch": 217} {"train_loss": -18.377023696899414, "global_step": 18083, "epoch": 217} {"train_loss": -18.43924903869629, "global_step": 18084, "epoch": 217} {"train_loss": -18.42632293701172, "global_step": 18085, "epoch": 217} {"train_loss": -18.22968101501465, "global_step": 18086, "epoch": 217} {"train_loss": -18.250511169433594, "global_step": 18087, "epoch": 217} {"train_loss": -18.63787269592285, "global_step": 18088, "epoch": 217} {"train_loss": -17.901857376098633, "global_step": 18089, "epoch": 217} {"train_loss": -18.26214599609375, "global_step": 18090, "epoch": 217} {"train_loss": -18.170825958251953, "global_step": 18091, "epoch": 217} {"train_loss": -17.967315673828125, "global_step": 18092, "epoch": 217} {"train_loss": -18.272663369236223, "global_step": 18093, "epoch": 217, "val_loss": 5838638.5} {"train_loss": -18.22834587097168, "global_step": 18094, "epoch": 218} {"train_loss": -18.000965118408203, "global_step": 18095, "epoch": 218} {"train_loss": -18.231998443603516, "global_step": 18096, "epoch": 218} {"train_loss": -18.26173210144043, "global_step": 18097, "epoch": 218} {"train_loss": -17.785314559936523, "global_step": 18098, "epoch": 218} {"train_loss": -18.394134521484375, "global_step": 18099, "epoch": 218} {"train_loss": -18.065786361694336, "global_step": 18100, "epoch": 218} {"train_loss": -17.940874099731445, "global_step": 18101, "epoch": 218} {"train_loss": -18.235553741455078, "global_step": 18102, "epoch": 218} {"train_loss": -18.772024154663086, "global_step": 18103, "epoch": 218} {"train_loss": -17.993803024291992, "global_step": 18104, "epoch": 218} {"train_loss": -18.227046966552734, "global_step": 18105, "epoch": 218} {"train_loss": -18.265222549438477, "global_step": 18106, "epoch": 218} {"train_loss": -18.4737491607666, "global_step": 18107, "epoch": 218} {"train_loss": -18.53751564025879, "global_step": 18108, "epoch": 218} {"train_loss": -18.330341339111328, "global_step": 18109, "epoch": 218} {"train_loss": -18.336828231811523, "global_step": 18110, "epoch": 218} {"train_loss": -18.23127555847168, "global_step": 18111, "epoch": 218} {"train_loss": -18.172189712524414, "global_step": 18112, "epoch": 218} {"train_loss": -18.3575382232666, "global_step": 18113, "epoch": 218} {"train_loss": -18.37621307373047, "global_step": 18114, "epoch": 218} {"train_loss": -18.12596893310547, "global_step": 18115, "epoch": 218} {"train_loss": -18.214136123657227, "global_step": 18116, "epoch": 218} {"train_loss": -18.56032371520996, "global_step": 18117, "epoch": 218} {"train_loss": -17.99714469909668, "global_step": 18118, "epoch": 218} {"train_loss": -18.140615463256836, "global_step": 18119, "epoch": 218} {"train_loss": -18.058435440063477, "global_step": 18120, "epoch": 218} {"train_loss": -18.07070541381836, "global_step": 18121, "epoch": 218} {"train_loss": -18.14043426513672, "global_step": 18122, "epoch": 218} {"train_loss": -18.264633178710938, "global_step": 18123, "epoch": 218} {"train_loss": -18.412988662719727, "global_step": 18124, "epoch": 218} {"train_loss": -18.303091049194336, "global_step": 18125, "epoch": 218} {"train_loss": -18.071910858154297, "global_step": 18126, "epoch": 218} {"train_loss": -18.243879318237305, "global_step": 18127, "epoch": 218} {"train_loss": -17.99325180053711, "global_step": 18128, "epoch": 218} {"train_loss": -18.215238571166992, "global_step": 18129, "epoch": 218} {"train_loss": -18.376895904541016, "global_step": 18130, "epoch": 218} {"train_loss": -18.41242790222168, "global_step": 18131, "epoch": 218} {"train_loss": -18.24176597595215, "global_step": 18132, "epoch": 218} {"train_loss": -18.18250274658203, "global_step": 18133, "epoch": 218} {"train_loss": -18.530881881713867, "global_step": 18134, "epoch": 218} {"train_loss": -18.34842872619629, "global_step": 18135, "epoch": 218} {"train_loss": -18.042247772216797, "global_step": 18136, "epoch": 218} {"train_loss": -18.23175048828125, "global_step": 18137, "epoch": 218} {"train_loss": -18.33194351196289, "global_step": 18138, "epoch": 218} {"train_loss": -18.630910873413086, "global_step": 18139, "epoch": 218} {"train_loss": -18.452394485473633, "global_step": 18140, "epoch": 218} {"train_loss": -18.346906661987305, "global_step": 18141, "epoch": 218} {"train_loss": -18.64389991760254, "global_step": 18142, "epoch": 218} {"train_loss": -18.26978874206543, "global_step": 18143, "epoch": 218} {"train_loss": -18.18204689025879, "global_step": 18144, "epoch": 218} {"train_loss": -18.797119140625, "global_step": 18145, "epoch": 218} {"train_loss": -18.612287521362305, "global_step": 18146, "epoch": 218} {"train_loss": -18.530670166015625, "global_step": 18147, "epoch": 218} {"train_loss": -18.560911178588867, "global_step": 18148, "epoch": 218} {"train_loss": -18.6870059967041, "global_step": 18149, "epoch": 218} {"train_loss": -18.338685989379883, "global_step": 18150, "epoch": 218} {"train_loss": -18.272497177124023, "global_step": 18151, "epoch": 218} {"train_loss": -18.319950103759766, "global_step": 18152, "epoch": 218} {"train_loss": -18.471073150634766, "global_step": 18153, "epoch": 218} {"train_loss": -17.879316329956055, "global_step": 18154, "epoch": 218} {"train_loss": -18.350683212280273, "global_step": 18155, "epoch": 218} {"train_loss": -18.486848831176758, "global_step": 18156, "epoch": 218} {"train_loss": -18.45530128479004, "global_step": 18157, "epoch": 218} {"train_loss": -18.213048934936523, "global_step": 18158, "epoch": 218} {"train_loss": -18.545455932617188, "global_step": 18159, "epoch": 218} {"train_loss": -18.007871627807617, "global_step": 18160, "epoch": 218} {"train_loss": -18.48191261291504, "global_step": 18161, "epoch": 218} {"train_loss": -18.404516220092773, "global_step": 18162, "epoch": 218} {"train_loss": -18.499286651611328, "global_step": 18163, "epoch": 218} {"train_loss": -18.49236488342285, "global_step": 18164, "epoch": 218} {"train_loss": -18.23054313659668, "global_step": 18165, "epoch": 218} {"train_loss": -18.303476333618164, "global_step": 18166, "epoch": 218} {"train_loss": -18.23766326904297, "global_step": 18167, "epoch": 218} {"train_loss": -18.44465446472168, "global_step": 18168, "epoch": 218} {"train_loss": -18.495071411132812, "global_step": 18169, "epoch": 218} {"train_loss": -18.16017723083496, "global_step": 18170, "epoch": 218} {"train_loss": -18.304065704345703, "global_step": 18171, "epoch": 218} {"train_loss": -18.444442749023438, "global_step": 18172, "epoch": 218} {"train_loss": -17.984291076660156, "global_step": 18173, "epoch": 218} {"train_loss": -18.556365966796875, "global_step": 18174, "epoch": 218} {"train_loss": -18.542112350463867, "global_step": 18175, "epoch": 218} {"train_loss": -18.308355836983186, "global_step": 18176, "epoch": 218, "val_loss": 5854189.0} {"train_loss": -18.22545623779297, "global_step": 18177, "epoch": 219} {"train_loss": -17.653806686401367, "global_step": 18178, "epoch": 219} {"train_loss": -17.98850440979004, "global_step": 18179, "epoch": 219} {"train_loss": -17.95319938659668, "global_step": 18180, "epoch": 219} {"train_loss": -17.929920196533203, "global_step": 18181, "epoch": 219} {"train_loss": -18.304746627807617, "global_step": 18182, "epoch": 219} {"train_loss": -17.89485740661621, "global_step": 18183, "epoch": 219} {"train_loss": -17.990385055541992, "global_step": 18184, "epoch": 219} {"train_loss": -18.007978439331055, "global_step": 18185, "epoch": 219} {"train_loss": -17.796079635620117, "global_step": 18186, "epoch": 219} {"train_loss": -18.163415908813477, "global_step": 18187, "epoch": 219} {"train_loss": -18.615800857543945, "global_step": 18188, "epoch": 219} {"train_loss": -18.109188079833984, "global_step": 18189, "epoch": 219} {"train_loss": -18.206037521362305, "global_step": 18190, "epoch": 219} {"train_loss": -18.455188751220703, "global_step": 18191, "epoch": 219} {"train_loss": -18.34621238708496, "global_step": 18192, "epoch": 219} {"train_loss": -18.335861206054688, "global_step": 18193, "epoch": 219} {"train_loss": -18.494245529174805, "global_step": 18194, "epoch": 219} {"train_loss": -18.56679344177246, "global_step": 18195, "epoch": 219} {"train_loss": -18.484312057495117, "global_step": 18196, "epoch": 219} {"train_loss": -18.44892692565918, "global_step": 18197, "epoch": 219} {"train_loss": -18.591278076171875, "global_step": 18198, "epoch": 219} {"train_loss": -18.517276763916016, "global_step": 18199, "epoch": 219} {"train_loss": -18.17068862915039, "global_step": 18200, "epoch": 219} {"train_loss": -17.975446701049805, "global_step": 18201, "epoch": 219} {"train_loss": -18.272541046142578, "global_step": 18202, "epoch": 219} {"train_loss": -17.786903381347656, "global_step": 18203, "epoch": 219} {"train_loss": -18.16362953186035, "global_step": 18204, "epoch": 219} {"train_loss": -17.911954879760742, "global_step": 18205, "epoch": 219} {"train_loss": -18.438308715820312, "global_step": 18206, "epoch": 219} {"train_loss": -18.770151138305664, "global_step": 18207, "epoch": 219} {"train_loss": -18.21260643005371, "global_step": 18208, "epoch": 219} {"train_loss": -18.156007766723633, "global_step": 18209, "epoch": 219} {"train_loss": -18.261320114135742, "global_step": 18210, "epoch": 219} {"train_loss": -18.26774787902832, "global_step": 18211, "epoch": 219} {"train_loss": -18.009305953979492, "global_step": 18212, "epoch": 219} {"train_loss": -18.24482536315918, "global_step": 18213, "epoch": 219} {"train_loss": -18.50416374206543, "global_step": 18214, "epoch": 219} {"train_loss": -17.99789810180664, "global_step": 18215, "epoch": 219} {"train_loss": -18.000123977661133, "global_step": 18216, "epoch": 219} {"train_loss": -18.398086547851562, "global_step": 18217, "epoch": 219} {"train_loss": -18.126371383666992, "global_step": 18218, "epoch": 219} {"train_loss": -18.289642333984375, "global_step": 18219, "epoch": 219} {"train_loss": -18.519556045532227, "global_step": 18220, "epoch": 219} {"train_loss": -18.299833297729492, "global_step": 18221, "epoch": 219} {"train_loss": -18.05675506591797, "global_step": 18222, "epoch": 219} {"train_loss": -18.268861770629883, "global_step": 18223, "epoch": 219} {"train_loss": -18.130508422851562, "global_step": 18224, "epoch": 219} {"train_loss": -18.288742065429688, "global_step": 18225, "epoch": 219} {"train_loss": -18.2947998046875, "global_step": 18226, "epoch": 219} {"train_loss": -18.184951782226562, "global_step": 18227, "epoch": 219} {"train_loss": -18.47454833984375, "global_step": 18228, "epoch": 219} {"train_loss": -18.490997314453125, "global_step": 18229, "epoch": 219} {"train_loss": -18.304662704467773, "global_step": 18230, "epoch": 219} {"train_loss": -18.16254234313965, "global_step": 18231, "epoch": 219} {"train_loss": -18.074804306030273, "global_step": 18232, "epoch": 219} {"train_loss": -18.51179313659668, "global_step": 18233, "epoch": 219} {"train_loss": -18.32971954345703, "global_step": 18234, "epoch": 219} {"train_loss": -18.58366584777832, "global_step": 18235, "epoch": 219} {"train_loss": -18.702306747436523, "global_step": 18236, "epoch": 219} {"train_loss": -18.496686935424805, "global_step": 18237, "epoch": 219} {"train_loss": -18.28390884399414, "global_step": 18238, "epoch": 219} {"train_loss": -18.56068229675293, "global_step": 18239, "epoch": 219} {"train_loss": -18.359121322631836, "global_step": 18240, "epoch": 219} {"train_loss": -18.044239044189453, "global_step": 18241, "epoch": 219} {"train_loss": -18.21438980102539, "global_step": 18242, "epoch": 219} {"train_loss": -18.188024520874023, "global_step": 18243, "epoch": 219} {"train_loss": -18.164289474487305, "global_step": 18244, "epoch": 219} {"train_loss": -18.664382934570312, "global_step": 18245, "epoch": 219} {"train_loss": -18.358869552612305, "global_step": 18246, "epoch": 219} {"train_loss": -18.508703231811523, "global_step": 18247, "epoch": 219} {"train_loss": -18.31617546081543, "global_step": 18248, "epoch": 219} {"train_loss": -18.06846046447754, "global_step": 18249, "epoch": 219} {"train_loss": -18.352590560913086, "global_step": 18250, "epoch": 219} {"train_loss": -18.824003219604492, "global_step": 18251, "epoch": 219} {"train_loss": -18.44093894958496, "global_step": 18252, "epoch": 219} {"train_loss": -18.35053253173828, "global_step": 18253, "epoch": 219} {"train_loss": -18.401906967163086, "global_step": 18254, "epoch": 219} {"train_loss": -18.4969425201416, "global_step": 18255, "epoch": 219} {"train_loss": -18.43355369567871, "global_step": 18256, "epoch": 219} {"train_loss": -18.762451171875, "global_step": 18257, "epoch": 219} {"train_loss": -18.288299560546875, "global_step": 18258, "epoch": 219} {"train_loss": -18.273397514619024, "global_step": 18259, "epoch": 219, "val_loss": 5830107.5} {"train_loss": -17.99949836730957, "global_step": 18260, "epoch": 220} {"train_loss": -17.839487075805664, "global_step": 18261, "epoch": 220} {"train_loss": -18.0539493560791, "global_step": 18262, "epoch": 220} {"train_loss": -17.90338134765625, "global_step": 18263, "epoch": 220} {"train_loss": -17.89247703552246, "global_step": 18264, "epoch": 220} {"train_loss": -17.659406661987305, "global_step": 18265, "epoch": 220} {"train_loss": -17.93517303466797, "global_step": 18266, "epoch": 220} {"train_loss": -18.1738338470459, "global_step": 18267, "epoch": 220} {"train_loss": -17.921051025390625, "global_step": 18268, "epoch": 220} {"train_loss": -18.517784118652344, "global_step": 18269, "epoch": 220} {"train_loss": -18.106603622436523, "global_step": 18270, "epoch": 220} {"train_loss": -18.089069366455078, "global_step": 18271, "epoch": 220} {"train_loss": -17.90778923034668, "global_step": 18272, "epoch": 220} {"train_loss": -18.13815689086914, "global_step": 18273, "epoch": 220} {"train_loss": -18.498676300048828, "global_step": 18274, "epoch": 220} {"train_loss": -17.945178985595703, "global_step": 18275, "epoch": 220} {"train_loss": -18.108776092529297, "global_step": 18276, "epoch": 220} {"train_loss": -18.156143188476562, "global_step": 18277, "epoch": 220} {"train_loss": -18.0373477935791, "global_step": 18278, "epoch": 220} {"train_loss": -18.2633113861084, "global_step": 18279, "epoch": 220} {"train_loss": -18.629201889038086, "global_step": 18280, "epoch": 220} {"train_loss": -17.95591926574707, "global_step": 18281, "epoch": 220} {"train_loss": -18.368871688842773, "global_step": 18282, "epoch": 220} {"train_loss": -18.2971134185791, "global_step": 18283, "epoch": 220} {"train_loss": -18.06195640563965, "global_step": 18284, "epoch": 220} {"train_loss": -18.523452758789062, "global_step": 18285, "epoch": 220} {"train_loss": -18.68047332763672, "global_step": 18286, "epoch": 220} {"train_loss": -18.358745574951172, "global_step": 18287, "epoch": 220} {"train_loss": -18.42005729675293, "global_step": 18288, "epoch": 220} {"train_loss": -18.654693603515625, "global_step": 18289, "epoch": 220} {"train_loss": -18.32611656188965, "global_step": 18290, "epoch": 220} {"train_loss": -18.429288864135742, "global_step": 18291, "epoch": 220} {"train_loss": -18.44947052001953, "global_step": 18292, "epoch": 220} {"train_loss": -18.537784576416016, "global_step": 18293, "epoch": 220} {"train_loss": -18.433252334594727, "global_step": 18294, "epoch": 220} {"train_loss": -18.608964920043945, "global_step": 18295, "epoch": 220} {"train_loss": -18.37773323059082, "global_step": 18296, "epoch": 220} {"train_loss": -18.14223289489746, "global_step": 18297, "epoch": 220} {"train_loss": -18.18509292602539, "global_step": 18298, "epoch": 220} {"train_loss": -18.346330642700195, "global_step": 18299, "epoch": 220} {"train_loss": -18.495473861694336, "global_step": 18300, "epoch": 220} {"train_loss": -17.867551803588867, "global_step": 18301, "epoch": 220} {"train_loss": -18.554729461669922, "global_step": 18302, "epoch": 220} {"train_loss": -18.501407623291016, "global_step": 18303, "epoch": 220} {"train_loss": -18.400514602661133, "global_step": 18304, "epoch": 220} {"train_loss": -18.473709106445312, "global_step": 18305, "epoch": 220} {"train_loss": -18.257568359375, "global_step": 18306, "epoch": 220} {"train_loss": -18.23701286315918, "global_step": 18307, "epoch": 220} {"train_loss": -18.520261764526367, "global_step": 18308, "epoch": 220} {"train_loss": -18.41147804260254, "global_step": 18309, "epoch": 220} {"train_loss": -18.420101165771484, "global_step": 18310, "epoch": 220} {"train_loss": -18.68988037109375, "global_step": 18311, "epoch": 220} {"train_loss": -18.06519889831543, "global_step": 18312, "epoch": 220} {"train_loss": -18.50563621520996, "global_step": 18313, "epoch": 220} {"train_loss": -18.291976928710938, "global_step": 18314, "epoch": 220} {"train_loss": -18.409597396850586, "global_step": 18315, "epoch": 220} {"train_loss": -18.187320709228516, "global_step": 18316, "epoch": 220} {"train_loss": -18.36353874206543, "global_step": 18317, "epoch": 220} {"train_loss": -18.17478370666504, "global_step": 18318, "epoch": 220} {"train_loss": -18.424549102783203, "global_step": 18319, "epoch": 220} {"train_loss": -18.407821655273438, "global_step": 18320, "epoch": 220} {"train_loss": -18.705869674682617, "global_step": 18321, "epoch": 220} {"train_loss": -18.495534896850586, "global_step": 18322, "epoch": 220} {"train_loss": -18.56348991394043, "global_step": 18323, "epoch": 220} {"train_loss": -18.210554122924805, "global_step": 18324, "epoch": 220} {"train_loss": -18.482481002807617, "global_step": 18325, "epoch": 220} {"train_loss": -18.382898330688477, "global_step": 18326, "epoch": 220} {"train_loss": -18.496122360229492, "global_step": 18327, "epoch": 220} {"train_loss": -18.364974975585938, "global_step": 18328, "epoch": 220} {"train_loss": -18.154022216796875, "global_step": 18329, "epoch": 220} {"train_loss": -18.319259643554688, "global_step": 18330, "epoch": 220} {"train_loss": -18.18299102783203, "global_step": 18331, "epoch": 220} {"train_loss": -18.58094596862793, "global_step": 18332, "epoch": 220} {"train_loss": -18.270261764526367, "global_step": 18333, "epoch": 220} {"train_loss": -18.20769691467285, "global_step": 18334, "epoch": 220} {"train_loss": -18.20054054260254, "global_step": 18335, "epoch": 220} {"train_loss": -18.782312393188477, "global_step": 18336, "epoch": 220} {"train_loss": -18.212909698486328, "global_step": 18337, "epoch": 220} {"train_loss": -18.182220458984375, "global_step": 18338, "epoch": 220} {"train_loss": -17.876066207885742, "global_step": 18339, "epoch": 220} {"train_loss": -18.198312759399414, "global_step": 18340, "epoch": 220} {"train_loss": -17.840839385986328, "global_step": 18341, "epoch": 220} {"train_loss": -18.28294076115252, "global_step": 18342, "epoch": 220, "val_loss": 5961084.0} {"train_loss": -18.280487060546875, "global_step": 18343, "epoch": 221} {"train_loss": -18.30647850036621, "global_step": 18344, "epoch": 221} {"train_loss": -18.624820709228516, "global_step": 18345, "epoch": 221} {"train_loss": -18.25470542907715, "global_step": 18346, "epoch": 221} {"train_loss": -18.6861515045166, "global_step": 18347, "epoch": 221} {"train_loss": -18.137670516967773, "global_step": 18348, "epoch": 221} {"train_loss": -18.073476791381836, "global_step": 18349, "epoch": 221} {"train_loss": -18.609533309936523, "global_step": 18350, "epoch": 221} {"train_loss": -18.280256271362305, "global_step": 18351, "epoch": 221} {"train_loss": -18.05177116394043, "global_step": 18352, "epoch": 221} {"train_loss": -18.108482360839844, "global_step": 18353, "epoch": 221} {"train_loss": -18.2948055267334, "global_step": 18354, "epoch": 221} {"train_loss": -18.39613151550293, "global_step": 18355, "epoch": 221} {"train_loss": -18.550846099853516, "global_step": 18356, "epoch": 221} {"train_loss": -18.07291603088379, "global_step": 18357, "epoch": 221} {"train_loss": -18.561628341674805, "global_step": 18358, "epoch": 221} {"train_loss": -18.22904396057129, "global_step": 18359, "epoch": 221} {"train_loss": -17.934860229492188, "global_step": 18360, "epoch": 221} {"train_loss": -18.348037719726562, "global_step": 18361, "epoch": 221} {"train_loss": -18.45281219482422, "global_step": 18362, "epoch": 221} {"train_loss": -18.271635055541992, "global_step": 18363, "epoch": 221} {"train_loss": -17.933277130126953, "global_step": 18364, "epoch": 221} {"train_loss": -18.717594146728516, "global_step": 18365, "epoch": 221} {"train_loss": -18.584644317626953, "global_step": 18366, "epoch": 221} {"train_loss": -18.529346466064453, "global_step": 18367, "epoch": 221} {"train_loss": -18.2757511138916, "global_step": 18368, "epoch": 221} {"train_loss": -18.434797286987305, "global_step": 18369, "epoch": 221} {"train_loss": -18.316055297851562, "global_step": 18370, "epoch": 221} {"train_loss": -18.728654861450195, "global_step": 18371, "epoch": 221} {"train_loss": -18.435535430908203, "global_step": 18372, "epoch": 221} {"train_loss": -18.229047775268555, "global_step": 18373, "epoch": 221} {"train_loss": -18.084716796875, "global_step": 18374, "epoch": 221} {"train_loss": -18.643423080444336, "global_step": 18375, "epoch": 221} {"train_loss": -18.39454460144043, "global_step": 18376, "epoch": 221} {"train_loss": -18.45595932006836, "global_step": 18377, "epoch": 221} {"train_loss": -18.473596572875977, "global_step": 18378, "epoch": 221} {"train_loss": -18.093332290649414, "global_step": 18379, "epoch": 221} {"train_loss": -18.25404167175293, "global_step": 18380, "epoch": 221} {"train_loss": -18.760650634765625, "global_step": 18381, "epoch": 221} {"train_loss": -18.158044815063477, "global_step": 18382, "epoch": 221} {"train_loss": -18.359846115112305, "global_step": 18383, "epoch": 221} {"train_loss": -18.197362899780273, "global_step": 18384, "epoch": 221} {"train_loss": -18.371234893798828, "global_step": 18385, "epoch": 221} {"train_loss": -18.37857437133789, "global_step": 18386, "epoch": 221} {"train_loss": -18.312063217163086, "global_step": 18387, "epoch": 221} {"train_loss": -18.460426330566406, "global_step": 18388, "epoch": 221} {"train_loss": -18.48494529724121, "global_step": 18389, "epoch": 221} {"train_loss": -18.209732055664062, "global_step": 18390, "epoch": 221} {"train_loss": -18.150203704833984, "global_step": 18391, "epoch": 221} {"train_loss": -18.355571746826172, "global_step": 18392, "epoch": 221} {"train_loss": -18.4610538482666, "global_step": 18393, "epoch": 221} {"train_loss": -17.997291564941406, "global_step": 18394, "epoch": 221} {"train_loss": -17.94731330871582, "global_step": 18395, "epoch": 221} {"train_loss": -18.245893478393555, "global_step": 18396, "epoch": 221} {"train_loss": -18.10029411315918, "global_step": 18397, "epoch": 221} {"train_loss": -18.51935386657715, "global_step": 18398, "epoch": 221} {"train_loss": -18.31684684753418, "global_step": 18399, "epoch": 221} {"train_loss": -18.2332820892334, "global_step": 18400, "epoch": 221} {"train_loss": -18.587106704711914, "global_step": 18401, "epoch": 221} {"train_loss": -18.42345428466797, "global_step": 18402, "epoch": 221} {"train_loss": -18.4738826751709, "global_step": 18403, "epoch": 221} {"train_loss": -18.619083404541016, "global_step": 18404, "epoch": 221} {"train_loss": -18.400833129882812, "global_step": 18405, "epoch": 221} {"train_loss": -18.219837188720703, "global_step": 18406, "epoch": 221} {"train_loss": -18.32413101196289, "global_step": 18407, "epoch": 221} {"train_loss": -18.096860885620117, "global_step": 18408, "epoch": 221} {"train_loss": -18.57969093322754, "global_step": 18409, "epoch": 221} {"train_loss": -18.562149047851562, "global_step": 18410, "epoch": 221} {"train_loss": -18.4051570892334, "global_step": 18411, "epoch": 221} {"train_loss": -18.327871322631836, "global_step": 18412, "epoch": 221} {"train_loss": -18.26985740661621, "global_step": 18413, "epoch": 221} {"train_loss": -19.02496910095215, "global_step": 18414, "epoch": 221} {"train_loss": -18.390235900878906, "global_step": 18415, "epoch": 221} {"train_loss": -18.51616859436035, "global_step": 18416, "epoch": 221} {"train_loss": -17.998291015625, "global_step": 18417, "epoch": 221} {"train_loss": -18.227907180786133, "global_step": 18418, "epoch": 221} {"train_loss": -18.426536560058594, "global_step": 18419, "epoch": 221} {"train_loss": -17.993640899658203, "global_step": 18420, "epoch": 221} {"train_loss": -18.197330474853516, "global_step": 18421, "epoch": 221} {"train_loss": -18.626535415649414, "global_step": 18422, "epoch": 221} {"train_loss": -18.282724380493164, "global_step": 18423, "epoch": 221} {"train_loss": -18.06805419921875, "global_step": 18424, "epoch": 221} {"train_loss": -18.34821227659662, "global_step": 18425, "epoch": 221, "val_loss": 5749030.0} {"train_loss": -17.5985164642334, "global_step": 18426, "epoch": 222} {"train_loss": -18.024948120117188, "global_step": 18427, "epoch": 222} {"train_loss": -17.994443893432617, "global_step": 18428, "epoch": 222} {"train_loss": -18.043766021728516, "global_step": 18429, "epoch": 222} {"train_loss": -18.256793975830078, "global_step": 18430, "epoch": 222} {"train_loss": -18.253875732421875, "global_step": 18431, "epoch": 222} {"train_loss": -17.863386154174805, "global_step": 18432, "epoch": 222} {"train_loss": -17.976835250854492, "global_step": 18433, "epoch": 222} {"train_loss": -18.037128448486328, "global_step": 18434, "epoch": 222} {"train_loss": -18.216400146484375, "global_step": 18435, "epoch": 222} {"train_loss": -18.1208438873291, "global_step": 18436, "epoch": 222} {"train_loss": -18.017593383789062, "global_step": 18437, "epoch": 222} {"train_loss": -17.9979248046875, "global_step": 18438, "epoch": 222} {"train_loss": -18.388626098632812, "global_step": 18439, "epoch": 222} {"train_loss": -18.401750564575195, "global_step": 18440, "epoch": 222} {"train_loss": -18.478769302368164, "global_step": 18441, "epoch": 222} {"train_loss": -18.365018844604492, "global_step": 18442, "epoch": 222} {"train_loss": -18.564359664916992, "global_step": 18443, "epoch": 222} {"train_loss": -18.18118667602539, "global_step": 18444, "epoch": 222} {"train_loss": -18.582918167114258, "global_step": 18445, "epoch": 222} {"train_loss": -18.31344223022461, "global_step": 18446, "epoch": 222} {"train_loss": -18.42776107788086, "global_step": 18447, "epoch": 222} {"train_loss": -18.10207176208496, "global_step": 18448, "epoch": 222} {"train_loss": -18.374509811401367, "global_step": 18449, "epoch": 222} {"train_loss": -18.194438934326172, "global_step": 18450, "epoch": 222} {"train_loss": -18.145484924316406, "global_step": 18451, "epoch": 222} {"train_loss": -18.156597137451172, "global_step": 18452, "epoch": 222} {"train_loss": -18.281137466430664, "global_step": 18453, "epoch": 222} {"train_loss": -18.44837188720703, "global_step": 18454, "epoch": 222} {"train_loss": -18.412168502807617, "global_step": 18455, "epoch": 222} {"train_loss": -18.55598258972168, "global_step": 18456, "epoch": 222} {"train_loss": -18.391687393188477, "global_step": 18457, "epoch": 222} {"train_loss": -18.40300941467285, "global_step": 18458, "epoch": 222} {"train_loss": -18.29885482788086, "global_step": 18459, "epoch": 222} {"train_loss": -18.332626342773438, "global_step": 18460, "epoch": 222} {"train_loss": -18.326353073120117, "global_step": 18461, "epoch": 222} {"train_loss": -18.67523765563965, "global_step": 18462, "epoch": 222} {"train_loss": -18.06635093688965, "global_step": 18463, "epoch": 222} {"train_loss": -18.175657272338867, "global_step": 18464, "epoch": 222} {"train_loss": -18.499120712280273, "global_step": 18465, "epoch": 222} {"train_loss": -18.01968765258789, "global_step": 18466, "epoch": 222} {"train_loss": -18.202829360961914, "global_step": 18467, "epoch": 222} {"train_loss": -18.531789779663086, "global_step": 18468, "epoch": 222} {"train_loss": -18.477096557617188, "global_step": 18469, "epoch": 222} {"train_loss": -18.28289031982422, "global_step": 18470, "epoch": 222} {"train_loss": -18.45597267150879, "global_step": 18471, "epoch": 222} {"train_loss": -18.432687759399414, "global_step": 18472, "epoch": 222} {"train_loss": -18.511343002319336, "global_step": 18473, "epoch": 222} {"train_loss": -18.421798706054688, "global_step": 18474, "epoch": 222} {"train_loss": -18.397903442382812, "global_step": 18475, "epoch": 222} {"train_loss": -18.187463760375977, "global_step": 18476, "epoch": 222} {"train_loss": -18.591514587402344, "global_step": 18477, "epoch": 222} {"train_loss": -17.972179412841797, "global_step": 18478, "epoch": 222} {"train_loss": -18.43267059326172, "global_step": 18479, "epoch": 222} {"train_loss": -18.39544105529785, "global_step": 18480, "epoch": 222} {"train_loss": -18.37348175048828, "global_step": 18481, "epoch": 222} {"train_loss": -18.33123207092285, "global_step": 18482, "epoch": 222} {"train_loss": -18.12664794921875, "global_step": 18483, "epoch": 222} {"train_loss": -18.044797897338867, "global_step": 18484, "epoch": 222} {"train_loss": -18.066593170166016, "global_step": 18485, "epoch": 222} {"train_loss": -18.586471557617188, "global_step": 18486, "epoch": 222} {"train_loss": -18.4975528717041, "global_step": 18487, "epoch": 222} {"train_loss": -18.4460506439209, "global_step": 18488, "epoch": 222} {"train_loss": -18.505054473876953, "global_step": 18489, "epoch": 222} {"train_loss": -18.412092208862305, "global_step": 18490, "epoch": 222} {"train_loss": -18.03664779663086, "global_step": 18491, "epoch": 222} {"train_loss": -18.370885848999023, "global_step": 18492, "epoch": 222} {"train_loss": -18.262866973876953, "global_step": 18493, "epoch": 222} {"train_loss": -18.296354293823242, "global_step": 18494, "epoch": 222} {"train_loss": -18.265024185180664, "global_step": 18495, "epoch": 222} {"train_loss": -18.329858779907227, "global_step": 18496, "epoch": 222} {"train_loss": -18.50787925720215, "global_step": 18497, "epoch": 222} {"train_loss": -18.555879592895508, "global_step": 18498, "epoch": 222} {"train_loss": -18.352432250976562, "global_step": 18499, "epoch": 222} {"train_loss": -18.169635772705078, "global_step": 18500, "epoch": 222} {"train_loss": -18.11097526550293, "global_step": 18501, "epoch": 222} {"train_loss": -18.230192184448242, "global_step": 18502, "epoch": 222} {"train_loss": -18.22987174987793, "global_step": 18503, "epoch": 222} {"train_loss": -18.373376846313477, "global_step": 18504, "epoch": 222} {"train_loss": -18.34063720703125, "global_step": 18505, "epoch": 222} {"train_loss": -18.079456329345703, "global_step": 18506, "epoch": 222} {"train_loss": -18.750919342041016, "global_step": 18507, "epoch": 222} {"train_loss": -18.292989822755377, "global_step": 18508, "epoch": 222, "val_loss": 5876862.5} {"train_loss": -18.195215225219727, "global_step": 18509, "epoch": 223} {"train_loss": -18.111597061157227, "global_step": 18510, "epoch": 223} {"train_loss": -18.240188598632812, "global_step": 18511, "epoch": 223} {"train_loss": -18.255712509155273, "global_step": 18512, "epoch": 223} {"train_loss": -18.52842140197754, "global_step": 18513, "epoch": 223} {"train_loss": -18.11945915222168, "global_step": 18514, "epoch": 223} {"train_loss": -18.093276977539062, "global_step": 18515, "epoch": 223} {"train_loss": -18.026845932006836, "global_step": 18516, "epoch": 223} {"train_loss": -18.31928825378418, "global_step": 18517, "epoch": 223} {"train_loss": -18.171310424804688, "global_step": 18518, "epoch": 223} {"train_loss": -18.5491943359375, "global_step": 18519, "epoch": 223} {"train_loss": -18.31906509399414, "global_step": 18520, "epoch": 223} {"train_loss": -18.38759422302246, "global_step": 18521, "epoch": 223} {"train_loss": -18.746753692626953, "global_step": 18522, "epoch": 223} {"train_loss": -18.447309494018555, "global_step": 18523, "epoch": 223} {"train_loss": -18.35212516784668, "global_step": 18524, "epoch": 223} {"train_loss": -18.25287628173828, "global_step": 18525, "epoch": 223} {"train_loss": -17.964553833007812, "global_step": 18526, "epoch": 223} {"train_loss": -17.991098403930664, "global_step": 18527, "epoch": 223} {"train_loss": -18.52568244934082, "global_step": 18528, "epoch": 223} {"train_loss": -18.42086410522461, "global_step": 18529, "epoch": 223} {"train_loss": -18.01093864440918, "global_step": 18530, "epoch": 223} {"train_loss": -18.36614418029785, "global_step": 18531, "epoch": 223} {"train_loss": -18.162220001220703, "global_step": 18532, "epoch": 223} {"train_loss": -17.869657516479492, "global_step": 18533, "epoch": 223} {"train_loss": -18.060382843017578, "global_step": 18534, "epoch": 223} {"train_loss": -18.477771759033203, "global_step": 18535, "epoch": 223} {"train_loss": -18.320066452026367, "global_step": 18536, "epoch": 223} {"train_loss": -18.1585693359375, "global_step": 18537, "epoch": 223} {"train_loss": -18.112030029296875, "global_step": 18538, "epoch": 223} {"train_loss": -18.34419822692871, "global_step": 18539, "epoch": 223} {"train_loss": -17.62588119506836, "global_step": 18540, "epoch": 223} {"train_loss": -18.076004028320312, "global_step": 18541, "epoch": 223} {"train_loss": -18.47774314880371, "global_step": 18542, "epoch": 223} {"train_loss": -18.00421714782715, "global_step": 18543, "epoch": 223} {"train_loss": -18.56788444519043, "global_step": 18544, "epoch": 223} {"train_loss": -18.45229148864746, "global_step": 18545, "epoch": 223} {"train_loss": -18.6593074798584, "global_step": 18546, "epoch": 223} {"train_loss": -18.503625869750977, "global_step": 18547, "epoch": 223} {"train_loss": -18.286418914794922, "global_step": 18548, "epoch": 223} {"train_loss": -18.243423461914062, "global_step": 18549, "epoch": 223} {"train_loss": -18.2672176361084, "global_step": 18550, "epoch": 223} {"train_loss": -18.02728843688965, "global_step": 18551, "epoch": 223} {"train_loss": -18.678430557250977, "global_step": 18552, "epoch": 223} {"train_loss": -18.452543258666992, "global_step": 18553, "epoch": 223} {"train_loss": -18.68834114074707, "global_step": 18554, "epoch": 223} {"train_loss": -18.174680709838867, "global_step": 18555, "epoch": 223} {"train_loss": -18.595304489135742, "global_step": 18556, "epoch": 223} {"train_loss": -18.670284271240234, "global_step": 18557, "epoch": 223} {"train_loss": -18.4303035736084, "global_step": 18558, "epoch": 223} {"train_loss": -18.397153854370117, "global_step": 18559, "epoch": 223} {"train_loss": -18.324792861938477, "global_step": 18560, "epoch": 223} {"train_loss": -18.412546157836914, "global_step": 18561, "epoch": 223} {"train_loss": -18.436132431030273, "global_step": 18562, "epoch": 223} {"train_loss": -18.916210174560547, "global_step": 18563, "epoch": 223} {"train_loss": -18.614044189453125, "global_step": 18564, "epoch": 223} {"train_loss": -18.318395614624023, "global_step": 18565, "epoch": 223} {"train_loss": -18.353673934936523, "global_step": 18566, "epoch": 223} {"train_loss": -18.549238204956055, "global_step": 18567, "epoch": 223} {"train_loss": -18.6054744720459, "global_step": 18568, "epoch": 223} {"train_loss": -18.2664852142334, "global_step": 18569, "epoch": 223} {"train_loss": -17.740720748901367, "global_step": 18570, "epoch": 223} {"train_loss": -18.521631240844727, "global_step": 18571, "epoch": 223} {"train_loss": -18.468759536743164, "global_step": 18572, "epoch": 223} {"train_loss": -18.213245391845703, "global_step": 18573, "epoch": 223} {"train_loss": -18.56598472595215, "global_step": 18574, "epoch": 223} {"train_loss": -18.787769317626953, "global_step": 18575, "epoch": 223} {"train_loss": -18.384618759155273, "global_step": 18576, "epoch": 223} {"train_loss": -18.640966415405273, "global_step": 18577, "epoch": 223} {"train_loss": -18.57952308654785, "global_step": 18578, "epoch": 223} {"train_loss": -18.042339324951172, "global_step": 18579, "epoch": 223} {"train_loss": -18.60762596130371, "global_step": 18580, "epoch": 223} {"train_loss": -18.357559204101562, "global_step": 18581, "epoch": 223} {"train_loss": -18.39569664001465, "global_step": 18582, "epoch": 223} {"train_loss": -18.425949096679688, "global_step": 18583, "epoch": 223} {"train_loss": -18.487279891967773, "global_step": 18584, "epoch": 223} {"train_loss": -18.389719009399414, "global_step": 18585, "epoch": 223} {"train_loss": -18.517919540405273, "global_step": 18586, "epoch": 223} {"train_loss": -18.51622772216797, "global_step": 18587, "epoch": 223} {"train_loss": -18.417165756225586, "global_step": 18588, "epoch": 223} {"train_loss": -18.110498428344727, "global_step": 18589, "epoch": 223} {"train_loss": -18.458711624145508, "global_step": 18590, "epoch": 223} {"train_loss": -18.34847424978233, "global_step": 18591, "epoch": 223, "val_loss": 5844493.0} {"train_loss": -18.173933029174805, "global_step": 18592, "epoch": 224} {"train_loss": -18.522321701049805, "global_step": 18593, "epoch": 224} {"train_loss": -18.33418846130371, "global_step": 18594, "epoch": 224} {"train_loss": -18.6071720123291, "global_step": 18595, "epoch": 224} {"train_loss": -18.587549209594727, "global_step": 18596, "epoch": 224} {"train_loss": -18.185522079467773, "global_step": 18597, "epoch": 224} {"train_loss": -17.420452117919922, "global_step": 18598, "epoch": 224} {"train_loss": -18.418914794921875, "global_step": 18599, "epoch": 224} {"train_loss": -18.09564781188965, "global_step": 18600, "epoch": 224} {"train_loss": -18.19788360595703, "global_step": 18601, "epoch": 224} {"train_loss": -18.38469886779785, "global_step": 18602, "epoch": 224} {"train_loss": -18.07486343383789, "global_step": 18603, "epoch": 224} {"train_loss": -18.297622680664062, "global_step": 18604, "epoch": 224} {"train_loss": -18.084707260131836, "global_step": 18605, "epoch": 224} {"train_loss": -18.402917861938477, "global_step": 18606, "epoch": 224} {"train_loss": -18.184072494506836, "global_step": 18607, "epoch": 224} {"train_loss": -18.165180206298828, "global_step": 18608, "epoch": 224} {"train_loss": -18.430309295654297, "global_step": 18609, "epoch": 224} {"train_loss": -18.469589233398438, "global_step": 18610, "epoch": 224} {"train_loss": -18.25030517578125, "global_step": 18611, "epoch": 224} {"train_loss": -18.065980911254883, "global_step": 18612, "epoch": 224} {"train_loss": -18.27747917175293, "global_step": 18613, "epoch": 224} {"train_loss": -18.47771644592285, "global_step": 18614, "epoch": 224} {"train_loss": -18.628036499023438, "global_step": 18615, "epoch": 224} {"train_loss": -18.300689697265625, "global_step": 18616, "epoch": 224} {"train_loss": -18.59162712097168, "global_step": 18617, "epoch": 224} {"train_loss": -18.46845054626465, "global_step": 18618, "epoch": 224} {"train_loss": -18.479631423950195, "global_step": 18619, "epoch": 224} {"train_loss": -18.513391494750977, "global_step": 18620, "epoch": 224} {"train_loss": -18.168603897094727, "global_step": 18621, "epoch": 224} {"train_loss": -18.42176628112793, "global_step": 18622, "epoch": 224} {"train_loss": -18.352270126342773, "global_step": 18623, "epoch": 224} {"train_loss": -18.4594783782959, "global_step": 18624, "epoch": 224} {"train_loss": -18.298086166381836, "global_step": 18625, "epoch": 224} {"train_loss": -18.61100196838379, "global_step": 18626, "epoch": 224} {"train_loss": -18.169553756713867, "global_step": 18627, "epoch": 224} {"train_loss": -18.28618812561035, "global_step": 18628, "epoch": 224} {"train_loss": -18.24823760986328, "global_step": 18629, "epoch": 224} {"train_loss": -18.093250274658203, "global_step": 18630, "epoch": 224} {"train_loss": -18.408096313476562, "global_step": 18631, "epoch": 224} {"train_loss": -18.365676879882812, "global_step": 18632, "epoch": 224} {"train_loss": -18.16817283630371, "global_step": 18633, "epoch": 224} {"train_loss": -18.444549560546875, "global_step": 18634, "epoch": 224} {"train_loss": -18.302892684936523, "global_step": 18635, "epoch": 224} {"train_loss": -18.017669677734375, "global_step": 18636, "epoch": 224} {"train_loss": -18.42118263244629, "global_step": 18637, "epoch": 224} {"train_loss": -18.544496536254883, "global_step": 18638, "epoch": 224} {"train_loss": -18.503877639770508, "global_step": 18639, "epoch": 224} {"train_loss": -18.066131591796875, "global_step": 18640, "epoch": 224} {"train_loss": -18.594236373901367, "global_step": 18641, "epoch": 224} {"train_loss": -18.277179718017578, "global_step": 18642, "epoch": 224} {"train_loss": -18.319053649902344, "global_step": 18643, "epoch": 224} {"train_loss": -18.11354637145996, "global_step": 18644, "epoch": 224} {"train_loss": -17.873037338256836, "global_step": 18645, "epoch": 224} {"train_loss": -18.095487594604492, "global_step": 18646, "epoch": 224} {"train_loss": -18.341552734375, "global_step": 18647, "epoch": 224} {"train_loss": -18.71616554260254, "global_step": 18648, "epoch": 224} {"train_loss": -18.344280242919922, "global_step": 18649, "epoch": 224} {"train_loss": -17.998241424560547, "global_step": 18650, "epoch": 224} {"train_loss": -18.5235652923584, "global_step": 18651, "epoch": 224} {"train_loss": -18.2785701751709, "global_step": 18652, "epoch": 224} {"train_loss": -18.33736228942871, "global_step": 18653, "epoch": 224} {"train_loss": -18.150470733642578, "global_step": 18654, "epoch": 224} {"train_loss": -18.453554153442383, "global_step": 18655, "epoch": 224} {"train_loss": -18.52983856201172, "global_step": 18656, "epoch": 224} {"train_loss": -18.499624252319336, "global_step": 18657, "epoch": 224} {"train_loss": -18.268558502197266, "global_step": 18658, "epoch": 224} {"train_loss": -18.442895889282227, "global_step": 18659, "epoch": 224} {"train_loss": -18.529132843017578, "global_step": 18660, "epoch": 224} {"train_loss": -18.46755027770996, "global_step": 18661, "epoch": 224} {"train_loss": -18.38441276550293, "global_step": 18662, "epoch": 224} {"train_loss": -18.394287109375, "global_step": 18663, "epoch": 224} {"train_loss": -18.6129150390625, "global_step": 18664, "epoch": 224} {"train_loss": -18.66217613220215, "global_step": 18665, "epoch": 224} {"train_loss": -18.47055435180664, "global_step": 18666, "epoch": 224} {"train_loss": -18.63130760192871, "global_step": 18667, "epoch": 224} {"train_loss": -18.26268768310547, "global_step": 18668, "epoch": 224} {"train_loss": -18.20537757873535, "global_step": 18669, "epoch": 224} {"train_loss": -18.102481842041016, "global_step": 18670, "epoch": 224} {"train_loss": -18.633411407470703, "global_step": 18671, "epoch": 224} {"train_loss": -18.382022857666016, "global_step": 18672, "epoch": 224} {"train_loss": -18.111616134643555, "global_step": 18673, "epoch": 224} {"train_loss": -18.335561108876423, "global_step": 18674, "epoch": 224, "val_loss": 5841267.0} {"train_loss": -18.134002685546875, "global_step": 18675, "epoch": 225} {"train_loss": -17.79115867614746, "global_step": 18676, "epoch": 225} {"train_loss": -17.828357696533203, "global_step": 18677, "epoch": 225} {"train_loss": -18.12276268005371, "global_step": 18678, "epoch": 225} {"train_loss": -17.961376190185547, "global_step": 18679, "epoch": 225} {"train_loss": -18.2443904876709, "global_step": 18680, "epoch": 225} {"train_loss": -17.918386459350586, "global_step": 18681, "epoch": 225} {"train_loss": -18.174985885620117, "global_step": 18682, "epoch": 225} {"train_loss": -18.5854549407959, "global_step": 18683, "epoch": 225} {"train_loss": -18.32307243347168, "global_step": 18684, "epoch": 225} {"train_loss": -18.2004337310791, "global_step": 18685, "epoch": 225} {"train_loss": -18.0523624420166, "global_step": 18686, "epoch": 225} {"train_loss": -17.781911849975586, "global_step": 18687, "epoch": 225} {"train_loss": -18.095779418945312, "global_step": 18688, "epoch": 225} {"train_loss": -18.12324333190918, "global_step": 18689, "epoch": 225} {"train_loss": -18.533510208129883, "global_step": 18690, "epoch": 225} {"train_loss": -18.418554306030273, "global_step": 18691, "epoch": 225} {"train_loss": -18.271865844726562, "global_step": 18692, "epoch": 225} {"train_loss": -18.170684814453125, "global_step": 18693, "epoch": 225} {"train_loss": -18.041027069091797, "global_step": 18694, "epoch": 225} {"train_loss": -18.545867919921875, "global_step": 18695, "epoch": 225} {"train_loss": -18.071775436401367, "global_step": 18696, "epoch": 225} {"train_loss": -18.317228317260742, "global_step": 18697, "epoch": 225} {"train_loss": -17.954465866088867, "global_step": 18698, "epoch": 225} {"train_loss": -17.939138412475586, "global_step": 18699, "epoch": 225} {"train_loss": -18.08152961730957, "global_step": 18700, "epoch": 225} {"train_loss": -17.896814346313477, "global_step": 18701, "epoch": 225} {"train_loss": -18.067581176757812, "global_step": 18702, "epoch": 225} {"train_loss": -18.4226016998291, "global_step": 18703, "epoch": 225} {"train_loss": -18.206464767456055, "global_step": 18704, "epoch": 225} {"train_loss": -18.29656982421875, "global_step": 18705, "epoch": 225} {"train_loss": -18.276477813720703, "global_step": 18706, "epoch": 225} {"train_loss": -18.26393699645996, "global_step": 18707, "epoch": 225} {"train_loss": -17.99960708618164, "global_step": 18708, "epoch": 225} {"train_loss": -18.071523666381836, "global_step": 18709, "epoch": 225} {"train_loss": -18.282855987548828, "global_step": 18710, "epoch": 225} {"train_loss": -18.117509841918945, "global_step": 18711, "epoch": 225} {"train_loss": -18.071561813354492, "global_step": 18712, "epoch": 225} {"train_loss": -18.233932495117188, "global_step": 18713, "epoch": 225} {"train_loss": -18.164384841918945, "global_step": 18714, "epoch": 225} {"train_loss": -18.099472045898438, "global_step": 18715, "epoch": 225} {"train_loss": -18.279260635375977, "global_step": 18716, "epoch": 225} {"train_loss": -18.102258682250977, "global_step": 18717, "epoch": 225} {"train_loss": -18.659582138061523, "global_step": 18718, "epoch": 225} {"train_loss": -18.195301055908203, "global_step": 18719, "epoch": 225} {"train_loss": -18.771493911743164, "global_step": 18720, "epoch": 225} {"train_loss": -18.10401725769043, "global_step": 18721, "epoch": 225} {"train_loss": -18.05236053466797, "global_step": 18722, "epoch": 225} {"train_loss": -18.476682662963867, "global_step": 18723, "epoch": 225} {"train_loss": -18.47243309020996, "global_step": 18724, "epoch": 225} {"train_loss": -18.020994186401367, "global_step": 18725, "epoch": 225} {"train_loss": -18.54852867126465, "global_step": 18726, "epoch": 225} {"train_loss": -18.070388793945312, "global_step": 18727, "epoch": 225} {"train_loss": -18.226139068603516, "global_step": 18728, "epoch": 225} {"train_loss": -18.37758445739746, "global_step": 18729, "epoch": 225} {"train_loss": -18.567394256591797, "global_step": 18730, "epoch": 225} {"train_loss": -18.250518798828125, "global_step": 18731, "epoch": 225} {"train_loss": -17.947538375854492, "global_step": 18732, "epoch": 225} {"train_loss": -17.993854522705078, "global_step": 18733, "epoch": 225} {"train_loss": -17.994075775146484, "global_step": 18734, "epoch": 225} {"train_loss": -18.11697769165039, "global_step": 18735, "epoch": 225} {"train_loss": -18.166288375854492, "global_step": 18736, "epoch": 225} {"train_loss": -18.131608963012695, "global_step": 18737, "epoch": 225} {"train_loss": -18.201438903808594, "global_step": 18738, "epoch": 225} {"train_loss": -18.155038833618164, "global_step": 18739, "epoch": 225} {"train_loss": -18.201480865478516, "global_step": 18740, "epoch": 225} {"train_loss": -18.5426025390625, "global_step": 18741, "epoch": 225} {"train_loss": -18.257123947143555, "global_step": 18742, "epoch": 225} {"train_loss": -18.024999618530273, "global_step": 18743, "epoch": 225} {"train_loss": -18.321115493774414, "global_step": 18744, "epoch": 225} {"train_loss": -18.29515266418457, "global_step": 18745, "epoch": 225} {"train_loss": -18.15492057800293, "global_step": 18746, "epoch": 225} {"train_loss": -18.036962509155273, "global_step": 18747, "epoch": 225} {"train_loss": -17.712905883789062, "global_step": 18748, "epoch": 225} {"train_loss": -18.24555778503418, "global_step": 18749, "epoch": 225} {"train_loss": -18.277423858642578, "global_step": 18750, "epoch": 225} {"train_loss": -18.524831771850586, "global_step": 18751, "epoch": 225} {"train_loss": -18.238388061523438, "global_step": 18752, "epoch": 225} {"train_loss": -18.03668975830078, "global_step": 18753, "epoch": 225} {"train_loss": -18.1846866607666, "global_step": 18754, "epoch": 225} {"train_loss": -17.988239288330078, "global_step": 18755, "epoch": 225} {"train_loss": -18.448307037353516, "global_step": 18756, "epoch": 225} {"train_loss": -18.192330670644, "global_step": 18757, "epoch": 225, "val_loss": 6011629.0} {"train_loss": -18.315196990966797, "global_step": 18758, "epoch": 226} {"train_loss": -18.22205924987793, "global_step": 18759, "epoch": 226} {"train_loss": -18.363096237182617, "global_step": 18760, "epoch": 226} {"train_loss": -18.197500228881836, "global_step": 18761, "epoch": 226} {"train_loss": -18.19257926940918, "global_step": 18762, "epoch": 226} {"train_loss": -18.26420021057129, "global_step": 18763, "epoch": 226} {"train_loss": -17.76125144958496, "global_step": 18764, "epoch": 226} {"train_loss": -17.99581527709961, "global_step": 18765, "epoch": 226} {"train_loss": -18.22125244140625, "global_step": 18766, "epoch": 226} {"train_loss": -18.557764053344727, "global_step": 18767, "epoch": 226} {"train_loss": -17.923887252807617, "global_step": 18768, "epoch": 226} {"train_loss": -18.04741668701172, "global_step": 18769, "epoch": 226} {"train_loss": -17.796857833862305, "global_step": 18770, "epoch": 226} {"train_loss": -17.853822708129883, "global_step": 18771, "epoch": 226} {"train_loss": -18.123836517333984, "global_step": 18772, "epoch": 226} {"train_loss": -18.166189193725586, "global_step": 18773, "epoch": 226} {"train_loss": -18.485214233398438, "global_step": 18774, "epoch": 226} {"train_loss": -18.262372970581055, "global_step": 18775, "epoch": 226} {"train_loss": -18.209287643432617, "global_step": 18776, "epoch": 226} {"train_loss": -18.1085262298584, "global_step": 18777, "epoch": 226} {"train_loss": -18.667573928833008, "global_step": 18778, "epoch": 226} {"train_loss": -18.326587677001953, "global_step": 18779, "epoch": 226} {"train_loss": -18.007875442504883, "global_step": 18780, "epoch": 226} {"train_loss": -18.601383209228516, "global_step": 18781, "epoch": 226} {"train_loss": -18.6324520111084, "global_step": 18782, "epoch": 226} {"train_loss": -18.25942039489746, "global_step": 18783, "epoch": 226} {"train_loss": -18.45618438720703, "global_step": 18784, "epoch": 226} {"train_loss": -18.44437599182129, "global_step": 18785, "epoch": 226} {"train_loss": -18.511991500854492, "global_step": 18786, "epoch": 226} {"train_loss": -18.676223754882812, "global_step": 18787, "epoch": 226} {"train_loss": -18.02522850036621, "global_step": 18788, "epoch": 226} {"train_loss": -18.497516632080078, "global_step": 18789, "epoch": 226} {"train_loss": -18.264551162719727, "global_step": 18790, "epoch": 226} {"train_loss": -18.28125, "global_step": 18791, "epoch": 226} {"train_loss": -17.944461822509766, "global_step": 18792, "epoch": 226} {"train_loss": -18.30073356628418, "global_step": 18793, "epoch": 226} {"train_loss": -17.9560604095459, "global_step": 18794, "epoch": 226} {"train_loss": -18.1046199798584, "global_step": 18795, "epoch": 226} {"train_loss": -18.303726196289062, "global_step": 18796, "epoch": 226} {"train_loss": -17.91866111755371, "global_step": 18797, "epoch": 226} {"train_loss": -18.13416862487793, "global_step": 18798, "epoch": 226} {"train_loss": -18.595876693725586, "global_step": 18799, "epoch": 226} {"train_loss": -18.21907615661621, "global_step": 18800, "epoch": 226} {"train_loss": -18.314146041870117, "global_step": 18801, "epoch": 226} {"train_loss": -17.95084571838379, "global_step": 18802, "epoch": 226} {"train_loss": -18.27080726623535, "global_step": 18803, "epoch": 226} {"train_loss": -18.257596969604492, "global_step": 18804, "epoch": 226} {"train_loss": -18.178817749023438, "global_step": 18805, "epoch": 226} {"train_loss": -17.85621452331543, "global_step": 18806, "epoch": 226} {"train_loss": -18.41651725769043, "global_step": 18807, "epoch": 226} {"train_loss": -17.990243911743164, "global_step": 18808, "epoch": 226} {"train_loss": -18.426000595092773, "global_step": 18809, "epoch": 226} {"train_loss": -18.32016372680664, "global_step": 18810, "epoch": 226} {"train_loss": -18.014984130859375, "global_step": 18811, "epoch": 226} {"train_loss": -17.847341537475586, "global_step": 18812, "epoch": 226} {"train_loss": -18.298627853393555, "global_step": 18813, "epoch": 226} {"train_loss": -18.335763931274414, "global_step": 18814, "epoch": 226} {"train_loss": -18.203641891479492, "global_step": 18815, "epoch": 226} {"train_loss": -17.987226486206055, "global_step": 18816, "epoch": 226} {"train_loss": -18.334299087524414, "global_step": 18817, "epoch": 226} {"train_loss": -18.458600997924805, "global_step": 18818, "epoch": 226} {"train_loss": -17.949567794799805, "global_step": 18819, "epoch": 226} {"train_loss": -18.167993545532227, "global_step": 18820, "epoch": 226} {"train_loss": -18.227222442626953, "global_step": 18821, "epoch": 226} {"train_loss": -18.134836196899414, "global_step": 18822, "epoch": 226} {"train_loss": -18.297924041748047, "global_step": 18823, "epoch": 226} {"train_loss": -18.512601852416992, "global_step": 18824, "epoch": 226} {"train_loss": -18.04927635192871, "global_step": 18825, "epoch": 226} {"train_loss": -18.430055618286133, "global_step": 18826, "epoch": 226} {"train_loss": -18.14179039001465, "global_step": 18827, "epoch": 226} {"train_loss": -17.799182891845703, "global_step": 18828, "epoch": 226} {"train_loss": -18.40303611755371, "global_step": 18829, "epoch": 226} {"train_loss": -18.267845153808594, "global_step": 18830, "epoch": 226} {"train_loss": -18.20155906677246, "global_step": 18831, "epoch": 226} {"train_loss": -18.26131248474121, "global_step": 18832, "epoch": 226} {"train_loss": -18.034332275390625, "global_step": 18833, "epoch": 226} {"train_loss": -18.443470001220703, "global_step": 18834, "epoch": 226} {"train_loss": -18.308740615844727, "global_step": 18835, "epoch": 226} {"train_loss": -18.144269943237305, "global_step": 18836, "epoch": 226} {"train_loss": -18.31717300415039, "global_step": 18837, "epoch": 226} {"train_loss": -18.21269416809082, "global_step": 18838, "epoch": 226} {"train_loss": -17.713293075561523, "global_step": 18839, "epoch": 226} {"train_loss": -18.23403365353504, "global_step": 18840, "epoch": 226, "val_loss": 6278106.0} {"train_loss": -17.68832778930664, "global_step": 18841, "epoch": 227} {"train_loss": -18.323427200317383, "global_step": 18842, "epoch": 227} {"train_loss": -17.893978118896484, "global_step": 18843, "epoch": 227} {"train_loss": -17.747526168823242, "global_step": 18844, "epoch": 227} {"train_loss": -18.16069793701172, "global_step": 18845, "epoch": 227} {"train_loss": -17.87734031677246, "global_step": 18846, "epoch": 227} {"train_loss": -18.393457412719727, "global_step": 18847, "epoch": 227} {"train_loss": -17.86615562438965, "global_step": 18848, "epoch": 227} {"train_loss": -18.076574325561523, "global_step": 18849, "epoch": 227} {"train_loss": -18.20759391784668, "global_step": 18850, "epoch": 227} {"train_loss": -18.16231346130371, "global_step": 18851, "epoch": 227} {"train_loss": -18.517921447753906, "global_step": 18852, "epoch": 227} {"train_loss": -17.84372329711914, "global_step": 18853, "epoch": 227} {"train_loss": -18.273860931396484, "global_step": 18854, "epoch": 227} {"train_loss": -18.546911239624023, "global_step": 18855, "epoch": 227} {"train_loss": -18.230316162109375, "global_step": 18856, "epoch": 227} {"train_loss": -18.033361434936523, "global_step": 18857, "epoch": 227} {"train_loss": -17.842456817626953, "global_step": 18858, "epoch": 227} {"train_loss": -18.166608810424805, "global_step": 18859, "epoch": 227} {"train_loss": -18.304723739624023, "global_step": 18860, "epoch": 227} {"train_loss": -18.015104293823242, "global_step": 18861, "epoch": 227} {"train_loss": -18.544437408447266, "global_step": 18862, "epoch": 227} {"train_loss": -17.94193458557129, "global_step": 18863, "epoch": 227} {"train_loss": -18.491178512573242, "global_step": 18864, "epoch": 227} {"train_loss": -18.82917022705078, "global_step": 18865, "epoch": 227} {"train_loss": -18.427566528320312, "global_step": 18866, "epoch": 227} {"train_loss": -18.396827697753906, "global_step": 18867, "epoch": 227} {"train_loss": -18.484909057617188, "global_step": 18868, "epoch": 227} {"train_loss": -18.266769409179688, "global_step": 18869, "epoch": 227} {"train_loss": -18.4056396484375, "global_step": 18870, "epoch": 227} {"train_loss": -18.34747886657715, "global_step": 18871, "epoch": 227} {"train_loss": -18.072994232177734, "global_step": 18872, "epoch": 227} {"train_loss": -18.17337417602539, "global_step": 18873, "epoch": 227} {"train_loss": -18.426610946655273, "global_step": 18874, "epoch": 227} {"train_loss": -17.923200607299805, "global_step": 18875, "epoch": 227} {"train_loss": -18.401527404785156, "global_step": 18876, "epoch": 227} {"train_loss": -18.012718200683594, "global_step": 18877, "epoch": 227} {"train_loss": -18.401620864868164, "global_step": 18878, "epoch": 227} {"train_loss": -18.590490341186523, "global_step": 18879, "epoch": 227} {"train_loss": -18.272233963012695, "global_step": 18880, "epoch": 227} {"train_loss": -17.981687545776367, "global_step": 18881, "epoch": 227} {"train_loss": -18.056270599365234, "global_step": 18882, "epoch": 227} {"train_loss": -18.090831756591797, "global_step": 18883, "epoch": 227} {"train_loss": -18.351158142089844, "global_step": 18884, "epoch": 227} {"train_loss": -18.273700714111328, "global_step": 18885, "epoch": 227} {"train_loss": -18.01432228088379, "global_step": 18886, "epoch": 227} {"train_loss": -18.577978134155273, "global_step": 18887, "epoch": 227} {"train_loss": -18.349674224853516, "global_step": 18888, "epoch": 227} {"train_loss": -18.349145889282227, "global_step": 18889, "epoch": 227} {"train_loss": -18.299625396728516, "global_step": 18890, "epoch": 227} {"train_loss": -18.00933837890625, "global_step": 18891, "epoch": 227} {"train_loss": -18.315961837768555, "global_step": 18892, "epoch": 227} {"train_loss": -18.51399803161621, "global_step": 18893, "epoch": 227} {"train_loss": -18.41359519958496, "global_step": 18894, "epoch": 227} {"train_loss": -18.215641021728516, "global_step": 18895, "epoch": 227} {"train_loss": -18.300901412963867, "global_step": 18896, "epoch": 227} {"train_loss": -18.12577247619629, "global_step": 18897, "epoch": 227} {"train_loss": -18.283994674682617, "global_step": 18898, "epoch": 227} {"train_loss": -18.358579635620117, "global_step": 18899, "epoch": 227} {"train_loss": -18.445423126220703, "global_step": 18900, "epoch": 227} {"train_loss": -18.091875076293945, "global_step": 18901, "epoch": 227} {"train_loss": -18.3212947845459, "global_step": 18902, "epoch": 227} {"train_loss": -18.79010581970215, "global_step": 18903, "epoch": 227} {"train_loss": -18.116376876831055, "global_step": 18904, "epoch": 227} {"train_loss": -18.5009765625, "global_step": 18905, "epoch": 227} {"train_loss": -18.2276611328125, "global_step": 18906, "epoch": 227} {"train_loss": -18.33466148376465, "global_step": 18907, "epoch": 227} {"train_loss": -18.25600242614746, "global_step": 18908, "epoch": 227} {"train_loss": -18.010242462158203, "global_step": 18909, "epoch": 227} {"train_loss": -18.246938705444336, "global_step": 18910, "epoch": 227} {"train_loss": -18.173933029174805, "global_step": 18911, "epoch": 227} {"train_loss": -17.954008102416992, "global_step": 18912, "epoch": 227} {"train_loss": -18.28372573852539, "global_step": 18913, "epoch": 227} {"train_loss": -18.724395751953125, "global_step": 18914, "epoch": 227} {"train_loss": -18.17738914489746, "global_step": 18915, "epoch": 227} {"train_loss": -18.3196964263916, "global_step": 18916, "epoch": 227} {"train_loss": -18.030324935913086, "global_step": 18917, "epoch": 227} {"train_loss": -18.260711669921875, "global_step": 18918, "epoch": 227} {"train_loss": -18.428327560424805, "global_step": 18919, "epoch": 227} {"train_loss": -18.678213119506836, "global_step": 18920, "epoch": 227} {"train_loss": -18.354637145996094, "global_step": 18921, "epoch": 227} {"train_loss": -18.607114791870117, "global_step": 18922, "epoch": 227} {"train_loss": -18.273959837764142, "global_step": 18923, "epoch": 227, "val_loss": 5965847.0} {"train_loss": -17.69481086730957, "global_step": 18924, "epoch": 228} {"train_loss": -17.55359649658203, "global_step": 18925, "epoch": 228} {"train_loss": -18.09962272644043, "global_step": 18926, "epoch": 228} {"train_loss": -17.615392684936523, "global_step": 18927, "epoch": 228} {"train_loss": -17.91576385498047, "global_step": 18928, "epoch": 228} {"train_loss": -18.150794982910156, "global_step": 18929, "epoch": 228} {"train_loss": -17.987173080444336, "global_step": 18930, "epoch": 228} {"train_loss": -18.294397354125977, "global_step": 18931, "epoch": 228} {"train_loss": -17.983016967773438, "global_step": 18932, "epoch": 228} {"train_loss": -18.015413284301758, "global_step": 18933, "epoch": 228} {"train_loss": -18.163183212280273, "global_step": 18934, "epoch": 228} {"train_loss": -18.451017379760742, "global_step": 18935, "epoch": 228} {"train_loss": -18.151750564575195, "global_step": 18936, "epoch": 228} {"train_loss": -18.0975284576416, "global_step": 18937, "epoch": 228} {"train_loss": -18.205442428588867, "global_step": 18938, "epoch": 228} {"train_loss": -18.3753662109375, "global_step": 18939, "epoch": 228} {"train_loss": -18.356760025024414, "global_step": 18940, "epoch": 228} {"train_loss": -18.02171516418457, "global_step": 18941, "epoch": 228} {"train_loss": -17.683271408081055, "global_step": 18942, "epoch": 228} {"train_loss": -17.968780517578125, "global_step": 18943, "epoch": 228} {"train_loss": -18.28316307067871, "global_step": 18944, "epoch": 228} {"train_loss": -17.931421279907227, "global_step": 18945, "epoch": 228} {"train_loss": -17.970548629760742, "global_step": 18946, "epoch": 228} {"train_loss": -18.027931213378906, "global_step": 18947, "epoch": 228} {"train_loss": -18.567304611206055, "global_step": 18948, "epoch": 228} {"train_loss": -18.52889060974121, "global_step": 18949, "epoch": 228} {"train_loss": -18.091703414916992, "global_step": 18950, "epoch": 228} {"train_loss": -18.40657615661621, "global_step": 18951, "epoch": 228} {"train_loss": -18.661556243896484, "global_step": 18952, "epoch": 228} {"train_loss": -18.43202781677246, "global_step": 18953, "epoch": 228} {"train_loss": -18.097442626953125, "global_step": 18954, "epoch": 228} {"train_loss": -18.47254180908203, "global_step": 18955, "epoch": 228} {"train_loss": -18.518545150756836, "global_step": 18956, "epoch": 228} {"train_loss": -18.567861557006836, "global_step": 18957, "epoch": 228} {"train_loss": -17.713220596313477, "global_step": 18958, "epoch": 228} {"train_loss": -18.22123908996582, "global_step": 18959, "epoch": 228} {"train_loss": -18.19662857055664, "global_step": 18960, "epoch": 228} {"train_loss": -18.414764404296875, "global_step": 18961, "epoch": 228} {"train_loss": -18.441753387451172, "global_step": 18962, "epoch": 228} {"train_loss": -18.06560707092285, "global_step": 18963, "epoch": 228} {"train_loss": -18.36720848083496, "global_step": 18964, "epoch": 228} {"train_loss": -17.857606887817383, "global_step": 18965, "epoch": 228} {"train_loss": -18.500356674194336, "global_step": 18966, "epoch": 228} {"train_loss": -18.41019058227539, "global_step": 18967, "epoch": 228} {"train_loss": -17.878496170043945, "global_step": 18968, "epoch": 228} {"train_loss": -18.433195114135742, "global_step": 18969, "epoch": 228} {"train_loss": -18.345813751220703, "global_step": 18970, "epoch": 228} {"train_loss": -17.6403751373291, "global_step": 18971, "epoch": 228} {"train_loss": -18.217269897460938, "global_step": 18972, "epoch": 228} {"train_loss": -18.4680118560791, "global_step": 18973, "epoch": 228} {"train_loss": -18.098995208740234, "global_step": 18974, "epoch": 228} {"train_loss": -18.591373443603516, "global_step": 18975, "epoch": 228} {"train_loss": -18.278778076171875, "global_step": 18976, "epoch": 228} {"train_loss": -18.18630027770996, "global_step": 18977, "epoch": 228} {"train_loss": -18.49086570739746, "global_step": 18978, "epoch": 228} {"train_loss": -18.39215660095215, "global_step": 18979, "epoch": 228} {"train_loss": -18.38370704650879, "global_step": 18980, "epoch": 228} {"train_loss": -18.4338436126709, "global_step": 18981, "epoch": 228} {"train_loss": -18.091562271118164, "global_step": 18982, "epoch": 228} {"train_loss": -18.217716217041016, "global_step": 18983, "epoch": 228} {"train_loss": -18.210567474365234, "global_step": 18984, "epoch": 228} {"train_loss": -18.427001953125, "global_step": 18985, "epoch": 228} {"train_loss": -18.625905990600586, "global_step": 18986, "epoch": 228} {"train_loss": -18.07219886779785, "global_step": 18987, "epoch": 228} {"train_loss": -18.32836151123047, "global_step": 18988, "epoch": 228} {"train_loss": -18.52596092224121, "global_step": 18989, "epoch": 228} {"train_loss": -18.37469482421875, "global_step": 18990, "epoch": 228} {"train_loss": -18.104907989501953, "global_step": 18991, "epoch": 228} {"train_loss": -18.303428649902344, "global_step": 18992, "epoch": 228} {"train_loss": -18.075546264648438, "global_step": 18993, "epoch": 228} {"train_loss": -18.193450927734375, "global_step": 18994, "epoch": 228} {"train_loss": -18.627811431884766, "global_step": 18995, "epoch": 228} {"train_loss": -18.446378707885742, "global_step": 18996, "epoch": 228} {"train_loss": -18.78754997253418, "global_step": 18997, "epoch": 228} {"train_loss": -18.39412498474121, "global_step": 18998, "epoch": 228} {"train_loss": -18.411518096923828, "global_step": 18999, "epoch": 228} {"train_loss": -18.50345802307129, "global_step": 19000, "epoch": 228} {"train_loss": -18.267826080322266, "global_step": 19001, "epoch": 228} {"train_loss": -17.94495964050293, "global_step": 19002, "epoch": 228} {"train_loss": -18.39222526550293, "global_step": 19003, "epoch": 228} {"train_loss": -18.395893096923828, "global_step": 19004, "epoch": 228} {"train_loss": -18.235610961914062, "global_step": 19005, "epoch": 228} {"train_loss": -18.229936760592174, "global_step": 19006, "epoch": 228, "val_loss": 5810094.0} {"train_loss": -17.91472816467285, "global_step": 19007, "epoch": 229} {"train_loss": -18.371978759765625, "global_step": 19008, "epoch": 229} {"train_loss": -18.182554244995117, "global_step": 19009, "epoch": 229} {"train_loss": -18.286415100097656, "global_step": 19010, "epoch": 229} {"train_loss": -18.353012084960938, "global_step": 19011, "epoch": 229} {"train_loss": -17.8915958404541, "global_step": 19012, "epoch": 229} {"train_loss": -18.027132034301758, "global_step": 19013, "epoch": 229} {"train_loss": -18.491146087646484, "global_step": 19014, "epoch": 229} {"train_loss": -18.369781494140625, "global_step": 19015, "epoch": 229} {"train_loss": -18.008390426635742, "global_step": 19016, "epoch": 229} {"train_loss": -18.114286422729492, "global_step": 19017, "epoch": 229} {"train_loss": -18.10445785522461, "global_step": 19018, "epoch": 229} {"train_loss": -18.48518180847168, "global_step": 19019, "epoch": 229} {"train_loss": -18.202194213867188, "global_step": 19020, "epoch": 229} {"train_loss": -18.15302276611328, "global_step": 19021, "epoch": 229} {"train_loss": -18.113615036010742, "global_step": 19022, "epoch": 229} {"train_loss": -18.493377685546875, "global_step": 19023, "epoch": 229} {"train_loss": -18.221405029296875, "global_step": 19024, "epoch": 229} {"train_loss": -18.827550888061523, "global_step": 19025, "epoch": 229} {"train_loss": -18.181747436523438, "global_step": 19026, "epoch": 229} {"train_loss": -18.186172485351562, "global_step": 19027, "epoch": 229} {"train_loss": -18.509815216064453, "global_step": 19028, "epoch": 229} {"train_loss": -18.03740119934082, "global_step": 19029, "epoch": 229} {"train_loss": -17.934507369995117, "global_step": 19030, "epoch": 229} {"train_loss": -18.068950653076172, "global_step": 19031, "epoch": 229} {"train_loss": -18.748289108276367, "global_step": 19032, "epoch": 229} {"train_loss": -18.18897247314453, "global_step": 19033, "epoch": 229} {"train_loss": -18.348073959350586, "global_step": 19034, "epoch": 229} {"train_loss": -18.175800323486328, "global_step": 19035, "epoch": 229} {"train_loss": -18.2622127532959, "global_step": 19036, "epoch": 229} {"train_loss": -17.893003463745117, "global_step": 19037, "epoch": 229} {"train_loss": -18.37138557434082, "global_step": 19038, "epoch": 229} {"train_loss": -18.3642578125, "global_step": 19039, "epoch": 229} {"train_loss": -18.51129150390625, "global_step": 19040, "epoch": 229} {"train_loss": -18.6460018157959, "global_step": 19041, "epoch": 229} {"train_loss": -18.394750595092773, "global_step": 19042, "epoch": 229} {"train_loss": -17.88775062561035, "global_step": 19043, "epoch": 229} {"train_loss": -18.433895111083984, "global_step": 19044, "epoch": 229} {"train_loss": -18.786657333374023, "global_step": 19045, "epoch": 229} {"train_loss": -18.136106491088867, "global_step": 19046, "epoch": 229} {"train_loss": -18.18929100036621, "global_step": 19047, "epoch": 229} {"train_loss": -18.361860275268555, "global_step": 19048, "epoch": 229} {"train_loss": -18.24416160583496, "global_step": 19049, "epoch": 229} {"train_loss": -18.29408073425293, "global_step": 19050, "epoch": 229} {"train_loss": -18.75872802734375, "global_step": 19051, "epoch": 229} {"train_loss": -18.356414794921875, "global_step": 19052, "epoch": 229} {"train_loss": -18.319265365600586, "global_step": 19053, "epoch": 229} {"train_loss": -18.16253089904785, "global_step": 19054, "epoch": 229} {"train_loss": -18.089481353759766, "global_step": 19055, "epoch": 229} {"train_loss": -18.15830421447754, "global_step": 19056, "epoch": 229} {"train_loss": -18.576431274414062, "global_step": 19057, "epoch": 229} {"train_loss": -18.345373153686523, "global_step": 19058, "epoch": 229} {"train_loss": -18.219541549682617, "global_step": 19059, "epoch": 229} {"train_loss": -18.46356964111328, "global_step": 19060, "epoch": 229} {"train_loss": -18.479032516479492, "global_step": 19061, "epoch": 229} {"train_loss": -18.335981369018555, "global_step": 19062, "epoch": 229} {"train_loss": -18.21870994567871, "global_step": 19063, "epoch": 229} {"train_loss": -18.359113693237305, "global_step": 19064, "epoch": 229} {"train_loss": -18.34410285949707, "global_step": 19065, "epoch": 229} {"train_loss": -18.441835403442383, "global_step": 19066, "epoch": 229} {"train_loss": -17.91193199157715, "global_step": 19067, "epoch": 229} {"train_loss": -18.02459716796875, "global_step": 19068, "epoch": 229} {"train_loss": -18.10359764099121, "global_step": 19069, "epoch": 229} {"train_loss": -17.972583770751953, "global_step": 19070, "epoch": 229} {"train_loss": -18.38447380065918, "global_step": 19071, "epoch": 229} {"train_loss": -18.529539108276367, "global_step": 19072, "epoch": 229} {"train_loss": -18.099031448364258, "global_step": 19073, "epoch": 229} {"train_loss": -18.64211082458496, "global_step": 19074, "epoch": 229} {"train_loss": -18.243061065673828, "global_step": 19075, "epoch": 229} {"train_loss": -18.401811599731445, "global_step": 19076, "epoch": 229} {"train_loss": -18.19060707092285, "global_step": 19077, "epoch": 229} {"train_loss": -18.55055809020996, "global_step": 19078, "epoch": 229} {"train_loss": -18.178678512573242, "global_step": 19079, "epoch": 229} {"train_loss": -18.371482849121094, "global_step": 19080, "epoch": 229} {"train_loss": -18.07419204711914, "global_step": 19081, "epoch": 229} {"train_loss": -18.19273567199707, "global_step": 19082, "epoch": 229} {"train_loss": -18.23756217956543, "global_step": 19083, "epoch": 229} {"train_loss": -18.41935920715332, "global_step": 19084, "epoch": 229} {"train_loss": -18.383764266967773, "global_step": 19085, "epoch": 229} {"train_loss": -18.414575576782227, "global_step": 19086, "epoch": 229} {"train_loss": -18.164630889892578, "global_step": 19087, "epoch": 229} {"train_loss": -18.165494918823242, "global_step": 19088, "epoch": 229} {"train_loss": -18.29993519151067, "global_step": 19089, "epoch": 229, "val_loss": 6055163.0} {"train_loss": -18.070053100585938, "global_step": 19090, "epoch": 230} {"train_loss": -18.457141876220703, "global_step": 19091, "epoch": 230} {"train_loss": -18.237293243408203, "global_step": 19092, "epoch": 230} {"train_loss": -18.34170913696289, "global_step": 19093, "epoch": 230} {"train_loss": -17.772525787353516, "global_step": 19094, "epoch": 230} {"train_loss": -18.271268844604492, "global_step": 19095, "epoch": 230} {"train_loss": -18.222558975219727, "global_step": 19096, "epoch": 230} {"train_loss": -18.21339988708496, "global_step": 19097, "epoch": 230} {"train_loss": -18.359756469726562, "global_step": 19098, "epoch": 230} {"train_loss": -18.335491180419922, "global_step": 19099, "epoch": 230} {"train_loss": -18.176162719726562, "global_step": 19100, "epoch": 230} {"train_loss": -18.3022518157959, "global_step": 19101, "epoch": 230} {"train_loss": -18.044527053833008, "global_step": 19102, "epoch": 230} {"train_loss": -18.49735450744629, "global_step": 19103, "epoch": 230} {"train_loss": -18.161020278930664, "global_step": 19104, "epoch": 230} {"train_loss": -18.39784812927246, "global_step": 19105, "epoch": 230} {"train_loss": -18.172719955444336, "global_step": 19106, "epoch": 230} {"train_loss": -18.390913009643555, "global_step": 19107, "epoch": 230} {"train_loss": -18.144601821899414, "global_step": 19108, "epoch": 230} {"train_loss": -18.250404357910156, "global_step": 19109, "epoch": 230} {"train_loss": -18.16732406616211, "global_step": 19110, "epoch": 230} {"train_loss": -18.280193328857422, "global_step": 19111, "epoch": 230} {"train_loss": -18.048200607299805, "global_step": 19112, "epoch": 230} {"train_loss": -18.278091430664062, "global_step": 19113, "epoch": 230} {"train_loss": -18.707046508789062, "global_step": 19114, "epoch": 230} {"train_loss": -18.658784866333008, "global_step": 19115, "epoch": 230} {"train_loss": -18.180660247802734, "global_step": 19116, "epoch": 230} {"train_loss": -18.320444107055664, "global_step": 19117, "epoch": 230} {"train_loss": -18.421049118041992, "global_step": 19118, "epoch": 230} {"train_loss": -18.05582618713379, "global_step": 19119, "epoch": 230} {"train_loss": -18.548486709594727, "global_step": 19120, "epoch": 230} {"train_loss": -18.346303939819336, "global_step": 19121, "epoch": 230} {"train_loss": -18.20416259765625, "global_step": 19122, "epoch": 230} {"train_loss": -18.156084060668945, "global_step": 19123, "epoch": 230} {"train_loss": -18.137189865112305, "global_step": 19124, "epoch": 230} {"train_loss": -18.47525978088379, "global_step": 19125, "epoch": 230} {"train_loss": -18.115665435791016, "global_step": 19126, "epoch": 230} {"train_loss": -18.231794357299805, "global_step": 19127, "epoch": 230} {"train_loss": -18.572660446166992, "global_step": 19128, "epoch": 230} {"train_loss": -18.303205490112305, "global_step": 19129, "epoch": 230} {"train_loss": -17.96177101135254, "global_step": 19130, "epoch": 230} {"train_loss": -18.334901809692383, "global_step": 19131, "epoch": 230} {"train_loss": -18.34890365600586, "global_step": 19132, "epoch": 230} {"train_loss": -17.959697723388672, "global_step": 19133, "epoch": 230} {"train_loss": -18.3845157623291, "global_step": 19134, "epoch": 230} {"train_loss": -18.242767333984375, "global_step": 19135, "epoch": 230} {"train_loss": -17.90381622314453, "global_step": 19136, "epoch": 230} {"train_loss": -18.30132293701172, "global_step": 19137, "epoch": 230} {"train_loss": -18.289039611816406, "global_step": 19138, "epoch": 230} {"train_loss": -18.257747650146484, "global_step": 19139, "epoch": 230} {"train_loss": -18.265958786010742, "global_step": 19140, "epoch": 230} {"train_loss": -18.56636619567871, "global_step": 19141, "epoch": 230} {"train_loss": -18.138736724853516, "global_step": 19142, "epoch": 230} {"train_loss": -18.47799301147461, "global_step": 19143, "epoch": 230} {"train_loss": -18.457422256469727, "global_step": 19144, "epoch": 230} {"train_loss": -18.348363876342773, "global_step": 19145, "epoch": 230} {"train_loss": -18.089845657348633, "global_step": 19146, "epoch": 230} {"train_loss": -18.154342651367188, "global_step": 19147, "epoch": 230} {"train_loss": -18.177730560302734, "global_step": 19148, "epoch": 230} {"train_loss": -18.58885383605957, "global_step": 19149, "epoch": 230} {"train_loss": -18.33955955505371, "global_step": 19150, "epoch": 230} {"train_loss": -18.483779907226562, "global_step": 19151, "epoch": 230} {"train_loss": -18.374624252319336, "global_step": 19152, "epoch": 230} {"train_loss": -18.32976722717285, "global_step": 19153, "epoch": 230} {"train_loss": -18.14557647705078, "global_step": 19154, "epoch": 230} {"train_loss": -18.31023597717285, "global_step": 19155, "epoch": 230} {"train_loss": -18.428342819213867, "global_step": 19156, "epoch": 230} {"train_loss": -18.15298843383789, "global_step": 19157, "epoch": 230} {"train_loss": -18.13142967224121, "global_step": 19158, "epoch": 230} {"train_loss": -18.27461051940918, "global_step": 19159, "epoch": 230} {"train_loss": -18.44725227355957, "global_step": 19160, "epoch": 230} {"train_loss": -18.14460563659668, "global_step": 19161, "epoch": 230} {"train_loss": -18.206228256225586, "global_step": 19162, "epoch": 230} {"train_loss": -18.146408081054688, "global_step": 19163, "epoch": 230} {"train_loss": -18.46478271484375, "global_step": 19164, "epoch": 230} {"train_loss": -18.496932983398438, "global_step": 19165, "epoch": 230} {"train_loss": -18.597776412963867, "global_step": 19166, "epoch": 230} {"train_loss": -17.856168746948242, "global_step": 19167, "epoch": 230} {"train_loss": -18.2624568939209, "global_step": 19168, "epoch": 230} {"train_loss": -18.199569702148438, "global_step": 19169, "epoch": 230} {"train_loss": -18.163373947143555, "global_step": 19170, "epoch": 230} {"train_loss": -18.351871490478516, "global_step": 19171, "epoch": 230} {"train_loss": -18.257913267756084, "global_step": 19172, "epoch": 230, "val_loss": 5981271.5} {"train_loss": -18.48053741455078, "global_step": 19173, "epoch": 231} {"train_loss": -18.295949935913086, "global_step": 19174, "epoch": 231} {"train_loss": -18.197580337524414, "global_step": 19175, "epoch": 231} {"train_loss": -18.167142868041992, "global_step": 19176, "epoch": 231} {"train_loss": -18.22745132446289, "global_step": 19177, "epoch": 231} {"train_loss": -18.211002349853516, "global_step": 19178, "epoch": 231} {"train_loss": -18.1352596282959, "global_step": 19179, "epoch": 231} {"train_loss": -18.21242332458496, "global_step": 19180, "epoch": 231} {"train_loss": -18.24509620666504, "global_step": 19181, "epoch": 231} {"train_loss": -18.47816276550293, "global_step": 19182, "epoch": 231} {"train_loss": -18.4681339263916, "global_step": 19183, "epoch": 231} {"train_loss": -18.488889694213867, "global_step": 19184, "epoch": 231} {"train_loss": -18.17620277404785, "global_step": 19185, "epoch": 231} {"train_loss": -18.561260223388672, "global_step": 19186, "epoch": 231} {"train_loss": -18.334775924682617, "global_step": 19187, "epoch": 231} {"train_loss": -18.70842933654785, "global_step": 19188, "epoch": 231} {"train_loss": -18.29276466369629, "global_step": 19189, "epoch": 231} {"train_loss": -18.02162742614746, "global_step": 19190, "epoch": 231} {"train_loss": -18.592321395874023, "global_step": 19191, "epoch": 231} {"train_loss": -18.153522491455078, "global_step": 19192, "epoch": 231} {"train_loss": -18.235876083374023, "global_step": 19193, "epoch": 231} {"train_loss": -18.666717529296875, "global_step": 19194, "epoch": 231} {"train_loss": -18.09824562072754, "global_step": 19195, "epoch": 231} {"train_loss": -18.715024948120117, "global_step": 19196, "epoch": 231} {"train_loss": -18.428150177001953, "global_step": 19197, "epoch": 231} {"train_loss": -18.049909591674805, "global_step": 19198, "epoch": 231} {"train_loss": -18.451370239257812, "global_step": 19199, "epoch": 231} {"train_loss": -17.991453170776367, "global_step": 19200, "epoch": 231} {"train_loss": -18.25054359436035, "global_step": 19201, "epoch": 231} {"train_loss": -18.420398712158203, "global_step": 19202, "epoch": 231} {"train_loss": -18.250478744506836, "global_step": 19203, "epoch": 231} {"train_loss": -18.42670249938965, "global_step": 19204, "epoch": 231} {"train_loss": -18.415485382080078, "global_step": 19205, "epoch": 231} {"train_loss": -18.290706634521484, "global_step": 19206, "epoch": 231} {"train_loss": -18.113584518432617, "global_step": 19207, "epoch": 231} {"train_loss": -18.100727081298828, "global_step": 19208, "epoch": 231} {"train_loss": -18.566768646240234, "global_step": 19209, "epoch": 231} {"train_loss": -18.30718994140625, "global_step": 19210, "epoch": 231} {"train_loss": -18.269195556640625, "global_step": 19211, "epoch": 231} {"train_loss": -17.98220443725586, "global_step": 19212, "epoch": 231} {"train_loss": -18.276527404785156, "global_step": 19213, "epoch": 231} {"train_loss": -18.1131649017334, "global_step": 19214, "epoch": 231} {"train_loss": -18.556955337524414, "global_step": 19215, "epoch": 231} {"train_loss": -18.61497688293457, "global_step": 19216, "epoch": 231} {"train_loss": -18.748559951782227, "global_step": 19217, "epoch": 231} {"train_loss": -18.350107192993164, "global_step": 19218, "epoch": 231} {"train_loss": -18.123483657836914, "global_step": 19219, "epoch": 231} {"train_loss": -18.3255615234375, "global_step": 19220, "epoch": 231} {"train_loss": -18.276641845703125, "global_step": 19221, "epoch": 231} {"train_loss": -18.65435218811035, "global_step": 19222, "epoch": 231} {"train_loss": -17.94417381286621, "global_step": 19223, "epoch": 231} {"train_loss": -18.255674362182617, "global_step": 19224, "epoch": 231} {"train_loss": -18.605228424072266, "global_step": 19225, "epoch": 231} {"train_loss": -18.311681747436523, "global_step": 19226, "epoch": 231} {"train_loss": -18.506303787231445, "global_step": 19227, "epoch": 231} {"train_loss": -18.302677154541016, "global_step": 19228, "epoch": 231} {"train_loss": -18.26688575744629, "global_step": 19229, "epoch": 231} {"train_loss": -18.76128578186035, "global_step": 19230, "epoch": 231} {"train_loss": -18.321603775024414, "global_step": 19231, "epoch": 231} {"train_loss": -18.29666519165039, "global_step": 19232, "epoch": 231} {"train_loss": -18.480369567871094, "global_step": 19233, "epoch": 231} {"train_loss": -18.24074363708496, "global_step": 19234, "epoch": 231} {"train_loss": -18.581090927124023, "global_step": 19235, "epoch": 231} {"train_loss": -18.068716049194336, "global_step": 19236, "epoch": 231} {"train_loss": -18.50581932067871, "global_step": 19237, "epoch": 231} {"train_loss": -17.89223289489746, "global_step": 19238, "epoch": 231} {"train_loss": -18.694311141967773, "global_step": 19239, "epoch": 231} {"train_loss": -18.359220504760742, "global_step": 19240, "epoch": 231} {"train_loss": -18.185400009155273, "global_step": 19241, "epoch": 231} {"train_loss": -18.058835983276367, "global_step": 19242, "epoch": 231} {"train_loss": -18.22864532470703, "global_step": 19243, "epoch": 231} {"train_loss": -18.018619537353516, "global_step": 19244, "epoch": 231} {"train_loss": -18.027738571166992, "global_step": 19245, "epoch": 231} {"train_loss": -17.935461044311523, "global_step": 19246, "epoch": 231} {"train_loss": -18.238113403320312, "global_step": 19247, "epoch": 231} {"train_loss": -18.17391586303711, "global_step": 19248, "epoch": 231} {"train_loss": -18.449777603149414, "global_step": 19249, "epoch": 231} {"train_loss": -18.47593879699707, "global_step": 19250, "epoch": 231} {"train_loss": -18.020706176757812, "global_step": 19251, "epoch": 231} {"train_loss": -18.229318618774414, "global_step": 19252, "epoch": 231} {"train_loss": -18.20551109313965, "global_step": 19253, "epoch": 231} {"train_loss": -18.030786514282227, "global_step": 19254, "epoch": 231} {"train_loss": -18.308246290827373, "global_step": 19255, "epoch": 231, "val_loss": 6020121.0} {"train_loss": -17.883153915405273, "global_step": 19256, "epoch": 232} {"train_loss": -17.674474716186523, "global_step": 19257, "epoch": 232} {"train_loss": -18.09613609313965, "global_step": 19258, "epoch": 232} {"train_loss": -17.938343048095703, "global_step": 19259, "epoch": 232} {"train_loss": -18.406564712524414, "global_step": 19260, "epoch": 232} {"train_loss": -18.476577758789062, "global_step": 19261, "epoch": 232} {"train_loss": -18.290939331054688, "global_step": 19262, "epoch": 232} {"train_loss": -18.10743522644043, "global_step": 19263, "epoch": 232} {"train_loss": -18.058828353881836, "global_step": 19264, "epoch": 232} {"train_loss": -18.415708541870117, "global_step": 19265, "epoch": 232} {"train_loss": -18.234426498413086, "global_step": 19266, "epoch": 232} {"train_loss": -18.198217391967773, "global_step": 19267, "epoch": 232} {"train_loss": -17.7689208984375, "global_step": 19268, "epoch": 232} {"train_loss": -18.1070613861084, "global_step": 19269, "epoch": 232} {"train_loss": -18.51991844177246, "global_step": 19270, "epoch": 232} {"train_loss": -18.041425704956055, "global_step": 19271, "epoch": 232} {"train_loss": -18.85649299621582, "global_step": 19272, "epoch": 232} {"train_loss": -18.366464614868164, "global_step": 19273, "epoch": 232} {"train_loss": -18.159637451171875, "global_step": 19274, "epoch": 232} {"train_loss": -18.153980255126953, "global_step": 19275, "epoch": 232} {"train_loss": -18.231449127197266, "global_step": 19276, "epoch": 232} {"train_loss": -18.061080932617188, "global_step": 19277, "epoch": 232} {"train_loss": -18.229589462280273, "global_step": 19278, "epoch": 232} {"train_loss": -18.321094512939453, "global_step": 19279, "epoch": 232} {"train_loss": -18.381635665893555, "global_step": 19280, "epoch": 232} {"train_loss": -18.368064880371094, "global_step": 19281, "epoch": 232} {"train_loss": -18.128318786621094, "global_step": 19282, "epoch": 232} {"train_loss": -18.389768600463867, "global_step": 19283, "epoch": 232} {"train_loss": -18.41407012939453, "global_step": 19284, "epoch": 232} {"train_loss": -18.644411087036133, "global_step": 19285, "epoch": 232} {"train_loss": -18.516525268554688, "global_step": 19286, "epoch": 232} {"train_loss": -18.30307960510254, "global_step": 19287, "epoch": 232} {"train_loss": -18.461164474487305, "global_step": 19288, "epoch": 232} {"train_loss": -18.25334930419922, "global_step": 19289, "epoch": 232} {"train_loss": -18.553485870361328, "global_step": 19290, "epoch": 232} {"train_loss": -17.993667602539062, "global_step": 19291, "epoch": 232} {"train_loss": -18.772907257080078, "global_step": 19292, "epoch": 232} {"train_loss": -18.424640655517578, "global_step": 19293, "epoch": 232} {"train_loss": -17.75478172302246, "global_step": 19294, "epoch": 232} {"train_loss": -18.38568687438965, "global_step": 19295, "epoch": 232} {"train_loss": -18.265426635742188, "global_step": 19296, "epoch": 232} {"train_loss": -18.52155113220215, "global_step": 19297, "epoch": 232} {"train_loss": -18.23749351501465, "global_step": 19298, "epoch": 232} {"train_loss": -18.334941864013672, "global_step": 19299, "epoch": 232} {"train_loss": -18.405893325805664, "global_step": 19300, "epoch": 232} {"train_loss": -18.45035171508789, "global_step": 19301, "epoch": 232} {"train_loss": -18.08583641052246, "global_step": 19302, "epoch": 232} {"train_loss": -18.317689895629883, "global_step": 19303, "epoch": 232} {"train_loss": -18.051206588745117, "global_step": 19304, "epoch": 232} {"train_loss": -18.062164306640625, "global_step": 19305, "epoch": 232} {"train_loss": -18.625329971313477, "global_step": 19306, "epoch": 232} {"train_loss": -18.206912994384766, "global_step": 19307, "epoch": 232} {"train_loss": -18.220584869384766, "global_step": 19308, "epoch": 232} {"train_loss": -18.241559982299805, "global_step": 19309, "epoch": 232} {"train_loss": -18.451581954956055, "global_step": 19310, "epoch": 232} {"train_loss": -18.72565269470215, "global_step": 19311, "epoch": 232} {"train_loss": -18.430112838745117, "global_step": 19312, "epoch": 232} {"train_loss": -18.352846145629883, "global_step": 19313, "epoch": 232} {"train_loss": -18.574512481689453, "global_step": 19314, "epoch": 232} {"train_loss": -18.465301513671875, "global_step": 19315, "epoch": 232} {"train_loss": -18.544857025146484, "global_step": 19316, "epoch": 232} {"train_loss": -18.556913375854492, "global_step": 19317, "epoch": 232} {"train_loss": -18.502559661865234, "global_step": 19318, "epoch": 232} {"train_loss": -18.352806091308594, "global_step": 19319, "epoch": 232} {"train_loss": -18.203350067138672, "global_step": 19320, "epoch": 232} {"train_loss": -18.394062042236328, "global_step": 19321, "epoch": 232} {"train_loss": -18.0351619720459, "global_step": 19322, "epoch": 232} {"train_loss": -18.23324966430664, "global_step": 19323, "epoch": 232} {"train_loss": -18.11837387084961, "global_step": 19324, "epoch": 232} {"train_loss": -18.432540893554688, "global_step": 19325, "epoch": 232} {"train_loss": -18.332706451416016, "global_step": 19326, "epoch": 232} {"train_loss": -18.469873428344727, "global_step": 19327, "epoch": 232} {"train_loss": -18.22175407409668, "global_step": 19328, "epoch": 232} {"train_loss": -18.310344696044922, "global_step": 19329, "epoch": 232} {"train_loss": -18.632366180419922, "global_step": 19330, "epoch": 232} {"train_loss": -17.947141647338867, "global_step": 19331, "epoch": 232} {"train_loss": -18.32232093811035, "global_step": 19332, "epoch": 232} {"train_loss": -18.320035934448242, "global_step": 19333, "epoch": 232} {"train_loss": -18.594839096069336, "global_step": 19334, "epoch": 232} {"train_loss": -18.19782066345215, "global_step": 19335, "epoch": 232} {"train_loss": -18.317060470581055, "global_step": 19336, "epoch": 232} {"train_loss": -18.42371940612793, "global_step": 19337, "epoch": 232} {"train_loss": -18.311524770346033, "global_step": 19338, "epoch": 232, "val_loss": 5870888.0} {"train_loss": -17.751617431640625, "global_step": 19339, "epoch": 233} {"train_loss": -18.173398971557617, "global_step": 19340, "epoch": 233} {"train_loss": -18.401506423950195, "global_step": 19341, "epoch": 233} {"train_loss": -18.0519962310791, "global_step": 19342, "epoch": 233} {"train_loss": -18.373567581176758, "global_step": 19343, "epoch": 233} {"train_loss": -17.905790328979492, "global_step": 19344, "epoch": 233} {"train_loss": -18.205245971679688, "global_step": 19345, "epoch": 233} {"train_loss": -18.224306106567383, "global_step": 19346, "epoch": 233} {"train_loss": -18.220853805541992, "global_step": 19347, "epoch": 233} {"train_loss": -18.108173370361328, "global_step": 19348, "epoch": 233} {"train_loss": -18.21905517578125, "global_step": 19349, "epoch": 233} {"train_loss": -18.16670036315918, "global_step": 19350, "epoch": 233} {"train_loss": -18.479938507080078, "global_step": 19351, "epoch": 233} {"train_loss": -18.092777252197266, "global_step": 19352, "epoch": 233} {"train_loss": -18.278980255126953, "global_step": 19353, "epoch": 233} {"train_loss": -18.39276123046875, "global_step": 19354, "epoch": 233} {"train_loss": -18.2476749420166, "global_step": 19355, "epoch": 233} {"train_loss": -18.0430965423584, "global_step": 19356, "epoch": 233} {"train_loss": -18.449670791625977, "global_step": 19357, "epoch": 233} {"train_loss": -18.30011558532715, "global_step": 19358, "epoch": 233} {"train_loss": -18.315649032592773, "global_step": 19359, "epoch": 233} {"train_loss": -18.308195114135742, "global_step": 19360, "epoch": 233} {"train_loss": -18.14398765563965, "global_step": 19361, "epoch": 233} {"train_loss": -18.049222946166992, "global_step": 19362, "epoch": 233} {"train_loss": -17.951099395751953, "global_step": 19363, "epoch": 233} {"train_loss": -17.8123722076416, "global_step": 19364, "epoch": 233} {"train_loss": -18.129629135131836, "global_step": 19365, "epoch": 233} {"train_loss": -18.056591033935547, "global_step": 19366, "epoch": 233} {"train_loss": -18.14641761779785, "global_step": 19367, "epoch": 233} {"train_loss": -18.27663230895996, "global_step": 19368, "epoch": 233} {"train_loss": -18.104496002197266, "global_step": 19369, "epoch": 233} {"train_loss": -18.380325317382812, "global_step": 19370, "epoch": 233} {"train_loss": -18.68582534790039, "global_step": 19371, "epoch": 233} {"train_loss": -18.084224700927734, "global_step": 19372, "epoch": 233} {"train_loss": -18.05787467956543, "global_step": 19373, "epoch": 233} {"train_loss": -18.39035987854004, "global_step": 19374, "epoch": 233} {"train_loss": -18.50963020324707, "global_step": 19375, "epoch": 233} {"train_loss": -18.446470260620117, "global_step": 19376, "epoch": 233} {"train_loss": -18.503738403320312, "global_step": 19377, "epoch": 233} {"train_loss": -18.020172119140625, "global_step": 19378, "epoch": 233} {"train_loss": -18.2093563079834, "global_step": 19379, "epoch": 233} {"train_loss": -18.501056671142578, "global_step": 19380, "epoch": 233} {"train_loss": -17.89521598815918, "global_step": 19381, "epoch": 233} {"train_loss": -18.684297561645508, "global_step": 19382, "epoch": 233} {"train_loss": -18.19944190979004, "global_step": 19383, "epoch": 233} {"train_loss": -18.189105987548828, "global_step": 19384, "epoch": 233} {"train_loss": -18.46483039855957, "global_step": 19385, "epoch": 233} {"train_loss": -18.215124130249023, "global_step": 19386, "epoch": 233} {"train_loss": -18.690732955932617, "global_step": 19387, "epoch": 233} {"train_loss": -18.3632869720459, "global_step": 19388, "epoch": 233} {"train_loss": -18.93776512145996, "global_step": 19389, "epoch": 233} {"train_loss": -18.130006790161133, "global_step": 19390, "epoch": 233} {"train_loss": -18.456302642822266, "global_step": 19391, "epoch": 233} {"train_loss": -18.305633544921875, "global_step": 19392, "epoch": 233} {"train_loss": -18.21719741821289, "global_step": 19393, "epoch": 233} {"train_loss": -17.99264144897461, "global_step": 19394, "epoch": 233} {"train_loss": -18.20955467224121, "global_step": 19395, "epoch": 233} {"train_loss": -18.44455909729004, "global_step": 19396, "epoch": 233} {"train_loss": -18.04793357849121, "global_step": 19397, "epoch": 233} {"train_loss": -17.967487335205078, "global_step": 19398, "epoch": 233} {"train_loss": -18.282194137573242, "global_step": 19399, "epoch": 233} {"train_loss": -18.377445220947266, "global_step": 19400, "epoch": 233} {"train_loss": -18.112062454223633, "global_step": 19401, "epoch": 233} {"train_loss": -18.12551498413086, "global_step": 19402, "epoch": 233} {"train_loss": -18.278472900390625, "global_step": 19403, "epoch": 233} {"train_loss": -18.327985763549805, "global_step": 19404, "epoch": 233} {"train_loss": -18.15409278869629, "global_step": 19405, "epoch": 233} {"train_loss": -18.93893814086914, "global_step": 19406, "epoch": 233} {"train_loss": -18.584203720092773, "global_step": 19407, "epoch": 233} {"train_loss": -18.33184814453125, "global_step": 19408, "epoch": 233} {"train_loss": -18.163894653320312, "global_step": 19409, "epoch": 233} {"train_loss": -18.210479736328125, "global_step": 19410, "epoch": 233} {"train_loss": -18.51148796081543, "global_step": 19411, "epoch": 233} {"train_loss": -18.23322105407715, "global_step": 19412, "epoch": 233} {"train_loss": -18.30719566345215, "global_step": 19413, "epoch": 233} {"train_loss": -18.634817123413086, "global_step": 19414, "epoch": 233} {"train_loss": -18.58878517150879, "global_step": 19415, "epoch": 233} {"train_loss": -18.208023071289062, "global_step": 19416, "epoch": 233} {"train_loss": -18.428030014038086, "global_step": 19417, "epoch": 233} {"train_loss": -18.122940063476562, "global_step": 19418, "epoch": 233} {"train_loss": -18.69722557067871, "global_step": 19419, "epoch": 233} {"train_loss": -18.550039291381836, "global_step": 19420, "epoch": 233} {"train_loss": -18.287750749702912, "global_step": 19421, "epoch": 233, "val_loss": 6010817.5} {"train_loss": -17.542219161987305, "global_step": 19422, "epoch": 234} {"train_loss": -17.929370880126953, "global_step": 19423, "epoch": 234} {"train_loss": -17.646087646484375, "global_step": 19424, "epoch": 234} {"train_loss": -18.433801651000977, "global_step": 19425, "epoch": 234} {"train_loss": -17.932188034057617, "global_step": 19426, "epoch": 234} {"train_loss": -18.39728355407715, "global_step": 19427, "epoch": 234} {"train_loss": -17.75481414794922, "global_step": 19428, "epoch": 234} {"train_loss": -18.35964584350586, "global_step": 19429, "epoch": 234} {"train_loss": -18.152029037475586, "global_step": 19430, "epoch": 234} {"train_loss": -18.167104721069336, "global_step": 19431, "epoch": 234} {"train_loss": -17.81378746032715, "global_step": 19432, "epoch": 234} {"train_loss": -18.480587005615234, "global_step": 19433, "epoch": 234} {"train_loss": -18.25506019592285, "global_step": 19434, "epoch": 234} {"train_loss": -17.875110626220703, "global_step": 19435, "epoch": 234} {"train_loss": -18.32025909423828, "global_step": 19436, "epoch": 234} {"train_loss": -18.367420196533203, "global_step": 19437, "epoch": 234} {"train_loss": -17.91268539428711, "global_step": 19438, "epoch": 234} {"train_loss": -18.23046875, "global_step": 19439, "epoch": 234} {"train_loss": -18.19720458984375, "global_step": 19440, "epoch": 234} {"train_loss": -18.16571617126465, "global_step": 19441, "epoch": 234} {"train_loss": -18.512859344482422, "global_step": 19442, "epoch": 234} {"train_loss": -18.160877227783203, "global_step": 19443, "epoch": 234} {"train_loss": -18.113370895385742, "global_step": 19444, "epoch": 234} {"train_loss": -18.246845245361328, "global_step": 19445, "epoch": 234} {"train_loss": -18.450536727905273, "global_step": 19446, "epoch": 234} {"train_loss": -18.071712493896484, "global_step": 19447, "epoch": 234} {"train_loss": -18.426443099975586, "global_step": 19448, "epoch": 234} {"train_loss": -18.303068161010742, "global_step": 19449, "epoch": 234} {"train_loss": -18.490676879882812, "global_step": 19450, "epoch": 234} {"train_loss": -18.718128204345703, "global_step": 19451, "epoch": 234} {"train_loss": -18.249835968017578, "global_step": 19452, "epoch": 234} {"train_loss": -18.599231719970703, "global_step": 19453, "epoch": 234} {"train_loss": -18.243335723876953, "global_step": 19454, "epoch": 234} {"train_loss": -18.130048751831055, "global_step": 19455, "epoch": 234} {"train_loss": -17.7379093170166, "global_step": 19456, "epoch": 234} {"train_loss": -18.3094539642334, "global_step": 19457, "epoch": 234} {"train_loss": -18.40411949157715, "global_step": 19458, "epoch": 234} {"train_loss": -18.3758602142334, "global_step": 19459, "epoch": 234} {"train_loss": -18.43470573425293, "global_step": 19460, "epoch": 234} {"train_loss": -18.28791618347168, "global_step": 19461, "epoch": 234} {"train_loss": -18.31863784790039, "global_step": 19462, "epoch": 234} {"train_loss": -18.36183738708496, "global_step": 19463, "epoch": 234} {"train_loss": -18.325559616088867, "global_step": 19464, "epoch": 234} {"train_loss": -18.26073455810547, "global_step": 19465, "epoch": 234} {"train_loss": -18.353530883789062, "global_step": 19466, "epoch": 234} {"train_loss": -18.145431518554688, "global_step": 19467, "epoch": 234} {"train_loss": -18.394100189208984, "global_step": 19468, "epoch": 234} {"train_loss": -18.217803955078125, "global_step": 19469, "epoch": 234} {"train_loss": -18.482786178588867, "global_step": 19470, "epoch": 234} {"train_loss": -18.426618576049805, "global_step": 19471, "epoch": 234} {"train_loss": -18.174766540527344, "global_step": 19472, "epoch": 234} {"train_loss": -18.440265655517578, "global_step": 19473, "epoch": 234} {"train_loss": -18.18092155456543, "global_step": 19474, "epoch": 234} {"train_loss": -18.465429306030273, "global_step": 19475, "epoch": 234} {"train_loss": -18.234230041503906, "global_step": 19476, "epoch": 234} {"train_loss": -18.294437408447266, "global_step": 19477, "epoch": 234} {"train_loss": -18.41837501525879, "global_step": 19478, "epoch": 234} {"train_loss": -18.205839157104492, "global_step": 19479, "epoch": 234} {"train_loss": -18.06379508972168, "global_step": 19480, "epoch": 234} {"train_loss": -18.479883193969727, "global_step": 19481, "epoch": 234} {"train_loss": -18.452022552490234, "global_step": 19482, "epoch": 234} {"train_loss": -18.21278953552246, "global_step": 19483, "epoch": 234} {"train_loss": -18.043943405151367, "global_step": 19484, "epoch": 234} {"train_loss": -18.481420516967773, "global_step": 19485, "epoch": 234} {"train_loss": -18.454639434814453, "global_step": 19486, "epoch": 234} {"train_loss": -18.480436325073242, "global_step": 19487, "epoch": 234} {"train_loss": -18.235599517822266, "global_step": 19488, "epoch": 234} {"train_loss": -18.412708282470703, "global_step": 19489, "epoch": 234} {"train_loss": -18.28736686706543, "global_step": 19490, "epoch": 234} {"train_loss": -18.24139976501465, "global_step": 19491, "epoch": 234} {"train_loss": -18.30735969543457, "global_step": 19492, "epoch": 234} {"train_loss": -18.60980987548828, "global_step": 19493, "epoch": 234} {"train_loss": -18.30988121032715, "global_step": 19494, "epoch": 234} {"train_loss": -18.35630226135254, "global_step": 19495, "epoch": 234} {"train_loss": -18.08255386352539, "global_step": 19496, "epoch": 234} {"train_loss": -18.0726375579834, "global_step": 19497, "epoch": 234} {"train_loss": -18.268054962158203, "global_step": 19498, "epoch": 234} {"train_loss": -18.359529495239258, "global_step": 19499, "epoch": 234} {"train_loss": -18.26960563659668, "global_step": 19500, "epoch": 234} {"train_loss": -18.53318214416504, "global_step": 19501, "epoch": 234} {"train_loss": -18.262922286987305, "global_step": 19502, "epoch": 234} {"train_loss": -18.178529739379883, "global_step": 19503, "epoch": 234} {"train_loss": -18.272933431418544, "global_step": 19504, "epoch": 234, "val_loss": 6025353.0} {"train_loss": -17.97444725036621, "global_step": 19505, "epoch": 235} {"train_loss": -18.46523094177246, "global_step": 19506, "epoch": 235} {"train_loss": -17.949167251586914, "global_step": 19507, "epoch": 235} {"train_loss": -17.84339714050293, "global_step": 19508, "epoch": 235} {"train_loss": -18.33124351501465, "global_step": 19509, "epoch": 235} {"train_loss": -18.544654846191406, "global_step": 19510, "epoch": 235} {"train_loss": -18.3729305267334, "global_step": 19511, "epoch": 235} {"train_loss": -18.527318954467773, "global_step": 19512, "epoch": 235} {"train_loss": -18.130590438842773, "global_step": 19513, "epoch": 235} {"train_loss": -18.31646156311035, "global_step": 19514, "epoch": 235} {"train_loss": -18.39114761352539, "global_step": 19515, "epoch": 235} {"train_loss": -18.045713424682617, "global_step": 19516, "epoch": 235} {"train_loss": -18.38642120361328, "global_step": 19517, "epoch": 235} {"train_loss": -18.297361373901367, "global_step": 19518, "epoch": 235} {"train_loss": -18.055992126464844, "global_step": 19519, "epoch": 235} {"train_loss": -18.062971115112305, "global_step": 19520, "epoch": 235} {"train_loss": -18.286212921142578, "global_step": 19521, "epoch": 235} {"train_loss": -18.47761344909668, "global_step": 19522, "epoch": 235} {"train_loss": -18.251291275024414, "global_step": 19523, "epoch": 235} {"train_loss": -18.118616104125977, "global_step": 19524, "epoch": 235} {"train_loss": -18.149084091186523, "global_step": 19525, "epoch": 235} {"train_loss": -18.585041046142578, "global_step": 19526, "epoch": 235} {"train_loss": -18.3504695892334, "global_step": 19527, "epoch": 235} {"train_loss": -18.198659896850586, "global_step": 19528, "epoch": 235} {"train_loss": -18.575124740600586, "global_step": 19529, "epoch": 235} {"train_loss": -18.58193588256836, "global_step": 19530, "epoch": 235} {"train_loss": -18.056903839111328, "global_step": 19531, "epoch": 235} {"train_loss": -18.789899826049805, "global_step": 19532, "epoch": 235} {"train_loss": -18.42184829711914, "global_step": 19533, "epoch": 235} {"train_loss": -18.16823387145996, "global_step": 19534, "epoch": 235} {"train_loss": -18.412614822387695, "global_step": 19535, "epoch": 235} {"train_loss": -18.531494140625, "global_step": 19536, "epoch": 235} {"train_loss": -18.272741317749023, "global_step": 19537, "epoch": 235} {"train_loss": -18.276620864868164, "global_step": 19538, "epoch": 235} {"train_loss": -18.079971313476562, "global_step": 19539, "epoch": 235} {"train_loss": -18.276193618774414, "global_step": 19540, "epoch": 235} {"train_loss": -18.105010986328125, "global_step": 19541, "epoch": 235} {"train_loss": -18.282394409179688, "global_step": 19542, "epoch": 235} {"train_loss": -18.319091796875, "global_step": 19543, "epoch": 235} {"train_loss": -17.71077537536621, "global_step": 19544, "epoch": 235} {"train_loss": -17.80750846862793, "global_step": 19545, "epoch": 235} {"train_loss": -18.63714027404785, "global_step": 19546, "epoch": 235} {"train_loss": -18.256147384643555, "global_step": 19547, "epoch": 235} {"train_loss": -18.560754776000977, "global_step": 19548, "epoch": 235} {"train_loss": -18.006324768066406, "global_step": 19549, "epoch": 235} {"train_loss": -18.11724281311035, "global_step": 19550, "epoch": 235} {"train_loss": -18.262577056884766, "global_step": 19551, "epoch": 235} {"train_loss": -18.428129196166992, "global_step": 19552, "epoch": 235} {"train_loss": -18.349491119384766, "global_step": 19553, "epoch": 235} {"train_loss": -18.506996154785156, "global_step": 19554, "epoch": 235} {"train_loss": -18.23409080505371, "global_step": 19555, "epoch": 235} {"train_loss": -18.50870132446289, "global_step": 19556, "epoch": 235} {"train_loss": -18.545284271240234, "global_step": 19557, "epoch": 235} {"train_loss": -18.722766876220703, "global_step": 19558, "epoch": 235} {"train_loss": -18.388206481933594, "global_step": 19559, "epoch": 235} {"train_loss": -18.565683364868164, "global_step": 19560, "epoch": 235} {"train_loss": -18.190404891967773, "global_step": 19561, "epoch": 235} {"train_loss": -18.16458511352539, "global_step": 19562, "epoch": 235} {"train_loss": -18.380216598510742, "global_step": 19563, "epoch": 235} {"train_loss": -18.196531295776367, "global_step": 19564, "epoch": 235} {"train_loss": -18.232288360595703, "global_step": 19565, "epoch": 235} {"train_loss": -18.74167823791504, "global_step": 19566, "epoch": 235} {"train_loss": -18.55109977722168, "global_step": 19567, "epoch": 235} {"train_loss": -17.98784828186035, "global_step": 19568, "epoch": 235} {"train_loss": -18.143091201782227, "global_step": 19569, "epoch": 235} {"train_loss": -18.259580612182617, "global_step": 19570, "epoch": 235} {"train_loss": -18.271087646484375, "global_step": 19571, "epoch": 235} {"train_loss": -18.547672271728516, "global_step": 19572, "epoch": 235} {"train_loss": -18.256183624267578, "global_step": 19573, "epoch": 235} {"train_loss": -18.15378189086914, "global_step": 19574, "epoch": 235} {"train_loss": -18.54847526550293, "global_step": 19575, "epoch": 235} {"train_loss": -18.098081588745117, "global_step": 19576, "epoch": 235} {"train_loss": -18.112380981445312, "global_step": 19577, "epoch": 235} {"train_loss": -18.519826889038086, "global_step": 19578, "epoch": 235} {"train_loss": -18.243162155151367, "global_step": 19579, "epoch": 235} {"train_loss": -18.444400787353516, "global_step": 19580, "epoch": 235} {"train_loss": -18.276878356933594, "global_step": 19581, "epoch": 235} {"train_loss": -18.21681785583496, "global_step": 19582, "epoch": 235} {"train_loss": -18.441137313842773, "global_step": 19583, "epoch": 235} {"train_loss": -18.045204162597656, "global_step": 19584, "epoch": 235} {"train_loss": -18.21201515197754, "global_step": 19585, "epoch": 235} {"train_loss": -18.49603843688965, "global_step": 19586, "epoch": 235} {"train_loss": -18.289761485823664, "global_step": 19587, "epoch": 235, "val_loss": 5868165.0} {"train_loss": -18.406450271606445, "global_step": 19588, "epoch": 236} {"train_loss": -18.098180770874023, "global_step": 19589, "epoch": 236} {"train_loss": -18.365942001342773, "global_step": 19590, "epoch": 236} {"train_loss": -17.981569290161133, "global_step": 19591, "epoch": 236} {"train_loss": -18.030609130859375, "global_step": 19592, "epoch": 236} {"train_loss": -18.154104232788086, "global_step": 19593, "epoch": 236} {"train_loss": -18.53162956237793, "global_step": 19594, "epoch": 236} {"train_loss": -17.90675163269043, "global_step": 19595, "epoch": 236} {"train_loss": -18.279237747192383, "global_step": 19596, "epoch": 236} {"train_loss": -18.625375747680664, "global_step": 19597, "epoch": 236} {"train_loss": -17.937177658081055, "global_step": 19598, "epoch": 236} {"train_loss": -18.46358299255371, "global_step": 19599, "epoch": 236} {"train_loss": -18.251455307006836, "global_step": 19600, "epoch": 236} {"train_loss": -18.20795249938965, "global_step": 19601, "epoch": 236} {"train_loss": -18.598154067993164, "global_step": 19602, "epoch": 236} {"train_loss": -18.53952407836914, "global_step": 19603, "epoch": 236} {"train_loss": -18.691020965576172, "global_step": 19604, "epoch": 236} {"train_loss": -18.374364852905273, "global_step": 19605, "epoch": 236} {"train_loss": -18.535879135131836, "global_step": 19606, "epoch": 236} {"train_loss": -17.907400131225586, "global_step": 19607, "epoch": 236} {"train_loss": -18.691198348999023, "global_step": 19608, "epoch": 236} {"train_loss": -18.31342124938965, "global_step": 19609, "epoch": 236} {"train_loss": -18.193254470825195, "global_step": 19610, "epoch": 236} {"train_loss": -18.208251953125, "global_step": 19611, "epoch": 236} {"train_loss": -18.334701538085938, "global_step": 19612, "epoch": 236} {"train_loss": -18.484113693237305, "global_step": 19613, "epoch": 236} {"train_loss": -18.56996726989746, "global_step": 19614, "epoch": 236} {"train_loss": -18.258808135986328, "global_step": 19615, "epoch": 236} {"train_loss": -18.151580810546875, "global_step": 19616, "epoch": 236} {"train_loss": -18.2251033782959, "global_step": 19617, "epoch": 236} {"train_loss": -18.380640029907227, "global_step": 19618, "epoch": 236} {"train_loss": -18.210067749023438, "global_step": 19619, "epoch": 236} {"train_loss": -17.80950927734375, "global_step": 19620, "epoch": 236} {"train_loss": -18.1298885345459, "global_step": 19621, "epoch": 236} {"train_loss": -18.4121036529541, "global_step": 19622, "epoch": 236} {"train_loss": -18.207149505615234, "global_step": 19623, "epoch": 236} {"train_loss": -18.2945556640625, "global_step": 19624, "epoch": 236} {"train_loss": -18.386932373046875, "global_step": 19625, "epoch": 236} {"train_loss": -18.5636043548584, "global_step": 19626, "epoch": 236} {"train_loss": -18.318960189819336, "global_step": 19627, "epoch": 236} {"train_loss": -18.368831634521484, "global_step": 19628, "epoch": 236} {"train_loss": -18.301504135131836, "global_step": 19629, "epoch": 236} {"train_loss": -18.310224533081055, "global_step": 19630, "epoch": 236} {"train_loss": -18.0860595703125, "global_step": 19631, "epoch": 236} {"train_loss": -18.794309616088867, "global_step": 19632, "epoch": 236} {"train_loss": -18.527313232421875, "global_step": 19633, "epoch": 236} {"train_loss": -18.18586540222168, "global_step": 19634, "epoch": 236} {"train_loss": -18.344451904296875, "global_step": 19635, "epoch": 236} {"train_loss": -18.279939651489258, "global_step": 19636, "epoch": 236} {"train_loss": -18.369003295898438, "global_step": 19637, "epoch": 236} {"train_loss": -18.221525192260742, "global_step": 19638, "epoch": 236} {"train_loss": -18.071033477783203, "global_step": 19639, "epoch": 236} {"train_loss": -18.368162155151367, "global_step": 19640, "epoch": 236} {"train_loss": -18.455778121948242, "global_step": 19641, "epoch": 236} {"train_loss": -18.3392276763916, "global_step": 19642, "epoch": 236} {"train_loss": -18.01299476623535, "global_step": 19643, "epoch": 236} {"train_loss": -18.404325485229492, "global_step": 19644, "epoch": 236} {"train_loss": -18.199857711791992, "global_step": 19645, "epoch": 236} {"train_loss": -18.11641502380371, "global_step": 19646, "epoch": 236} {"train_loss": -18.330570220947266, "global_step": 19647, "epoch": 236} {"train_loss": -18.422916412353516, "global_step": 19648, "epoch": 236} {"train_loss": -18.446035385131836, "global_step": 19649, "epoch": 236} {"train_loss": -18.19036102294922, "global_step": 19650, "epoch": 236} {"train_loss": -18.629032135009766, "global_step": 19651, "epoch": 236} {"train_loss": -18.120025634765625, "global_step": 19652, "epoch": 236} {"train_loss": -18.188608169555664, "global_step": 19653, "epoch": 236} {"train_loss": -18.059057235717773, "global_step": 19654, "epoch": 236} {"train_loss": -18.32501792907715, "global_step": 19655, "epoch": 236} {"train_loss": -18.43503189086914, "global_step": 19656, "epoch": 236} {"train_loss": -18.537431716918945, "global_step": 19657, "epoch": 236} {"train_loss": -18.31022834777832, "global_step": 19658, "epoch": 236} {"train_loss": -18.15611457824707, "global_step": 19659, "epoch": 236} {"train_loss": -18.5544490814209, "global_step": 19660, "epoch": 236} {"train_loss": -18.20992088317871, "global_step": 19661, "epoch": 236} {"train_loss": -18.41376304626465, "global_step": 19662, "epoch": 236} {"train_loss": -18.44542121887207, "global_step": 19663, "epoch": 236} {"train_loss": -18.53856086730957, "global_step": 19664, "epoch": 236} {"train_loss": -18.391483306884766, "global_step": 19665, "epoch": 236} {"train_loss": -18.091014862060547, "global_step": 19666, "epoch": 236} {"train_loss": -18.348066329956055, "global_step": 19667, "epoch": 236} {"train_loss": -17.905757904052734, "global_step": 19668, "epoch": 236} {"train_loss": -18.411603927612305, "global_step": 19669, "epoch": 236} {"train_loss": -18.314725783934076, "global_step": 19670, "epoch": 236, "val_loss": 5900230.0} {"train_loss": -17.917800903320312, "global_step": 19671, "epoch": 237} {"train_loss": -18.221342086791992, "global_step": 19672, "epoch": 237} {"train_loss": -18.30369758605957, "global_step": 19673, "epoch": 237} {"train_loss": -17.97784423828125, "global_step": 19674, "epoch": 237} {"train_loss": -18.20609474182129, "global_step": 19675, "epoch": 237} {"train_loss": -18.193357467651367, "global_step": 19676, "epoch": 237} {"train_loss": -17.69019889831543, "global_step": 19677, "epoch": 237} {"train_loss": -18.509450912475586, "global_step": 19678, "epoch": 237} {"train_loss": -18.7901554107666, "global_step": 19679, "epoch": 237} {"train_loss": -18.319000244140625, "global_step": 19680, "epoch": 237} {"train_loss": -18.24833106994629, "global_step": 19681, "epoch": 237} {"train_loss": -18.366634368896484, "global_step": 19682, "epoch": 237} {"train_loss": -18.37238883972168, "global_step": 19683, "epoch": 237} {"train_loss": -18.29935646057129, "global_step": 19684, "epoch": 237} {"train_loss": -18.492576599121094, "global_step": 19685, "epoch": 237} {"train_loss": -18.006757736206055, "global_step": 19686, "epoch": 237} {"train_loss": -18.351226806640625, "global_step": 19687, "epoch": 237} {"train_loss": -18.462188720703125, "global_step": 19688, "epoch": 237} {"train_loss": -18.251291275024414, "global_step": 19689, "epoch": 237} {"train_loss": -18.430295944213867, "global_step": 19690, "epoch": 237} {"train_loss": -18.358545303344727, "global_step": 19691, "epoch": 237} {"train_loss": -18.0388126373291, "global_step": 19692, "epoch": 237} {"train_loss": -18.395660400390625, "global_step": 19693, "epoch": 237} {"train_loss": -18.188695907592773, "global_step": 19694, "epoch": 237} {"train_loss": -18.30181121826172, "global_step": 19695, "epoch": 237} {"train_loss": -18.221725463867188, "global_step": 19696, "epoch": 237} {"train_loss": -18.16314697265625, "global_step": 19697, "epoch": 237} {"train_loss": -18.16356658935547, "global_step": 19698, "epoch": 237} {"train_loss": -18.946882247924805, "global_step": 19699, "epoch": 237} {"train_loss": -18.184297561645508, "global_step": 19700, "epoch": 237} {"train_loss": -18.412975311279297, "global_step": 19701, "epoch": 237} {"train_loss": -18.49751091003418, "global_step": 19702, "epoch": 237} {"train_loss": -18.493453979492188, "global_step": 19703, "epoch": 237} {"train_loss": -18.24655532836914, "global_step": 19704, "epoch": 237} {"train_loss": -18.166553497314453, "global_step": 19705, "epoch": 237} {"train_loss": -18.272523880004883, "global_step": 19706, "epoch": 237} {"train_loss": -18.071622848510742, "global_step": 19707, "epoch": 237} {"train_loss": -18.395978927612305, "global_step": 19708, "epoch": 237} {"train_loss": -18.476072311401367, "global_step": 19709, "epoch": 237} {"train_loss": -17.874950408935547, "global_step": 19710, "epoch": 237} {"train_loss": -18.65634536743164, "global_step": 19711, "epoch": 237} {"train_loss": -18.278709411621094, "global_step": 19712, "epoch": 237} {"train_loss": -18.303918838500977, "global_step": 19713, "epoch": 237} {"train_loss": -18.27534294128418, "global_step": 19714, "epoch": 237} {"train_loss": -18.20209312438965, "global_step": 19715, "epoch": 237} {"train_loss": -18.672449111938477, "global_step": 19716, "epoch": 237} {"train_loss": -17.89069366455078, "global_step": 19717, "epoch": 237} {"train_loss": -18.422977447509766, "global_step": 19718, "epoch": 237} {"train_loss": -18.199216842651367, "global_step": 19719, "epoch": 237} {"train_loss": -18.08202362060547, "global_step": 19720, "epoch": 237} {"train_loss": -18.231592178344727, "global_step": 19721, "epoch": 237} {"train_loss": -18.4594783782959, "global_step": 19722, "epoch": 237} {"train_loss": -18.39874267578125, "global_step": 19723, "epoch": 237} {"train_loss": -18.395780563354492, "global_step": 19724, "epoch": 237} {"train_loss": -18.46669578552246, "global_step": 19725, "epoch": 237} {"train_loss": -18.51900291442871, "global_step": 19726, "epoch": 237} {"train_loss": -18.166217803955078, "global_step": 19727, "epoch": 237} {"train_loss": -18.101709365844727, "global_step": 19728, "epoch": 237} {"train_loss": -18.63013458251953, "global_step": 19729, "epoch": 237} {"train_loss": -18.113630294799805, "global_step": 19730, "epoch": 237} {"train_loss": -18.32389259338379, "global_step": 19731, "epoch": 237} {"train_loss": -18.389280319213867, "global_step": 19732, "epoch": 237} {"train_loss": -18.074949264526367, "global_step": 19733, "epoch": 237} {"train_loss": -18.566696166992188, "global_step": 19734, "epoch": 237} {"train_loss": -18.261953353881836, "global_step": 19735, "epoch": 237} {"train_loss": -18.173498153686523, "global_step": 19736, "epoch": 237} {"train_loss": -18.196353912353516, "global_step": 19737, "epoch": 237} {"train_loss": -18.740140914916992, "global_step": 19738, "epoch": 237} {"train_loss": -18.3109130859375, "global_step": 19739, "epoch": 237} {"train_loss": -18.58428382873535, "global_step": 19740, "epoch": 237} {"train_loss": -18.391183853149414, "global_step": 19741, "epoch": 237} {"train_loss": -18.481836318969727, "global_step": 19742, "epoch": 237} {"train_loss": -18.489898681640625, "global_step": 19743, "epoch": 237} {"train_loss": -18.241331100463867, "global_step": 19744, "epoch": 237} {"train_loss": -18.163427352905273, "global_step": 19745, "epoch": 237} {"train_loss": -18.45941734313965, "global_step": 19746, "epoch": 237} {"train_loss": -18.608036041259766, "global_step": 19747, "epoch": 237} {"train_loss": -18.219003677368164, "global_step": 19748, "epoch": 237} {"train_loss": -18.184274673461914, "global_step": 19749, "epoch": 237} {"train_loss": -18.172971725463867, "global_step": 19750, "epoch": 237} {"train_loss": -18.5611629486084, "global_step": 19751, "epoch": 237} {"train_loss": -17.753931045532227, "global_step": 19752, "epoch": 237} {"train_loss": -18.301869334944758, "global_step": 19753, "epoch": 237, "val_loss": 5950304.0} {"train_loss": -18.32192039489746, "global_step": 19754, "epoch": 238} {"train_loss": -18.3546199798584, "global_step": 19755, "epoch": 238} {"train_loss": -18.08643913269043, "global_step": 19756, "epoch": 238} {"train_loss": -18.531326293945312, "global_step": 19757, "epoch": 238} {"train_loss": -18.50309181213379, "global_step": 19758, "epoch": 238} {"train_loss": -18.18882179260254, "global_step": 19759, "epoch": 238} {"train_loss": -18.147794723510742, "global_step": 19760, "epoch": 238} {"train_loss": -18.80725860595703, "global_step": 19761, "epoch": 238} {"train_loss": -18.065519332885742, "global_step": 19762, "epoch": 238} {"train_loss": -18.16290283203125, "global_step": 19763, "epoch": 238} {"train_loss": -18.364456176757812, "global_step": 19764, "epoch": 238} {"train_loss": -18.34305191040039, "global_step": 19765, "epoch": 238} {"train_loss": -18.64273452758789, "global_step": 19766, "epoch": 238} {"train_loss": -18.380083084106445, "global_step": 19767, "epoch": 238} {"train_loss": -18.03406524658203, "global_step": 19768, "epoch": 238} {"train_loss": -18.332233428955078, "global_step": 19769, "epoch": 238} {"train_loss": -18.356491088867188, "global_step": 19770, "epoch": 238} {"train_loss": -18.537376403808594, "global_step": 19771, "epoch": 238} {"train_loss": -18.820371627807617, "global_step": 19772, "epoch": 238} {"train_loss": -17.988035202026367, "global_step": 19773, "epoch": 238} {"train_loss": -18.65342140197754, "global_step": 19774, "epoch": 238} {"train_loss": -18.44960594177246, "global_step": 19775, "epoch": 238} {"train_loss": -18.364179611206055, "global_step": 19776, "epoch": 238} {"train_loss": -18.568845748901367, "global_step": 19777, "epoch": 238} {"train_loss": -18.541950225830078, "global_step": 19778, "epoch": 238} {"train_loss": -18.15780258178711, "global_step": 19779, "epoch": 238} {"train_loss": -18.50823974609375, "global_step": 19780, "epoch": 238} {"train_loss": -18.411924362182617, "global_step": 19781, "epoch": 238} {"train_loss": -18.45815658569336, "global_step": 19782, "epoch": 238} {"train_loss": -18.17068099975586, "global_step": 19783, "epoch": 238} {"train_loss": -18.3317813873291, "global_step": 19784, "epoch": 238} {"train_loss": -18.696884155273438, "global_step": 19785, "epoch": 238} {"train_loss": -18.033710479736328, "global_step": 19786, "epoch": 238} {"train_loss": -18.300607681274414, "global_step": 19787, "epoch": 238} {"train_loss": -18.249465942382812, "global_step": 19788, "epoch": 238} {"train_loss": -17.927875518798828, "global_step": 19789, "epoch": 238} {"train_loss": -18.128469467163086, "global_step": 19790, "epoch": 238} {"train_loss": -18.3131160736084, "global_step": 19791, "epoch": 238} {"train_loss": -18.380895614624023, "global_step": 19792, "epoch": 238} {"train_loss": -18.2968807220459, "global_step": 19793, "epoch": 238} {"train_loss": -18.053966522216797, "global_step": 19794, "epoch": 238} {"train_loss": -18.16615104675293, "global_step": 19795, "epoch": 238} {"train_loss": -18.436813354492188, "global_step": 19796, "epoch": 238} {"train_loss": -18.014379501342773, "global_step": 19797, "epoch": 238} {"train_loss": -18.2734432220459, "global_step": 19798, "epoch": 238} {"train_loss": -18.09299659729004, "global_step": 19799, "epoch": 238} {"train_loss": -18.390825271606445, "global_step": 19800, "epoch": 238} {"train_loss": -18.183055877685547, "global_step": 19801, "epoch": 238} {"train_loss": -18.372028350830078, "global_step": 19802, "epoch": 238} {"train_loss": -18.38959503173828, "global_step": 19803, "epoch": 238} {"train_loss": -18.536746978759766, "global_step": 19804, "epoch": 238} {"train_loss": -18.35150909423828, "global_step": 19805, "epoch": 238} {"train_loss": -18.16739273071289, "global_step": 19806, "epoch": 238} {"train_loss": -18.680620193481445, "global_step": 19807, "epoch": 238} {"train_loss": -18.15102195739746, "global_step": 19808, "epoch": 238} {"train_loss": -18.197118759155273, "global_step": 19809, "epoch": 238} {"train_loss": -18.319982528686523, "global_step": 19810, "epoch": 238} {"train_loss": -18.546844482421875, "global_step": 19811, "epoch": 238} {"train_loss": -18.176645278930664, "global_step": 19812, "epoch": 238} {"train_loss": -18.338659286499023, "global_step": 19813, "epoch": 238} {"train_loss": -18.007837295532227, "global_step": 19814, "epoch": 238} {"train_loss": -18.10529899597168, "global_step": 19815, "epoch": 238} {"train_loss": -18.354822158813477, "global_step": 19816, "epoch": 238} {"train_loss": -18.165668487548828, "global_step": 19817, "epoch": 238} {"train_loss": -18.6210994720459, "global_step": 19818, "epoch": 238} {"train_loss": -18.150691986083984, "global_step": 19819, "epoch": 238} {"train_loss": -18.333520889282227, "global_step": 19820, "epoch": 238} {"train_loss": -18.70515251159668, "global_step": 19821, "epoch": 238} {"train_loss": -18.280160903930664, "global_step": 19822, "epoch": 238} {"train_loss": -18.58705711364746, "global_step": 19823, "epoch": 238} {"train_loss": -18.18785858154297, "global_step": 19824, "epoch": 238} {"train_loss": -18.40338706970215, "global_step": 19825, "epoch": 238} {"train_loss": -18.32916831970215, "global_step": 19826, "epoch": 238} {"train_loss": -18.39742088317871, "global_step": 19827, "epoch": 238} {"train_loss": -18.283193588256836, "global_step": 19828, "epoch": 238} {"train_loss": -18.223026275634766, "global_step": 19829, "epoch": 238} {"train_loss": -18.590139389038086, "global_step": 19830, "epoch": 238} {"train_loss": -18.22469711303711, "global_step": 19831, "epoch": 238} {"train_loss": -18.27149200439453, "global_step": 19832, "epoch": 238} {"train_loss": -18.299970626831055, "global_step": 19833, "epoch": 238} {"train_loss": -18.339555740356445, "global_step": 19834, "epoch": 238} {"train_loss": -18.50873374938965, "global_step": 19835, "epoch": 238} {"train_loss": -18.33924514127065, "global_step": 19836, "epoch": 238, "val_loss": 5908853.0} {"train_loss": -17.648283004760742, "global_step": 19837, "epoch": 239} {"train_loss": -17.89540672302246, "global_step": 19838, "epoch": 239} {"train_loss": -18.235122680664062, "global_step": 19839, "epoch": 239} {"train_loss": -17.897197723388672, "global_step": 19840, "epoch": 239} {"train_loss": -18.314132690429688, "global_step": 19841, "epoch": 239} {"train_loss": -17.910051345825195, "global_step": 19842, "epoch": 239} {"train_loss": -18.261526107788086, "global_step": 19843, "epoch": 239} {"train_loss": -18.304107666015625, "global_step": 19844, "epoch": 239} {"train_loss": -18.209524154663086, "global_step": 19845, "epoch": 239} {"train_loss": -18.167818069458008, "global_step": 19846, "epoch": 239} {"train_loss": -18.365646362304688, "global_step": 19847, "epoch": 239} {"train_loss": -18.123544692993164, "global_step": 19848, "epoch": 239} {"train_loss": -17.843481063842773, "global_step": 19849, "epoch": 239} {"train_loss": -18.590587615966797, "global_step": 19850, "epoch": 239} {"train_loss": -17.943910598754883, "global_step": 19851, "epoch": 239} {"train_loss": -18.199228286743164, "global_step": 19852, "epoch": 239} {"train_loss": -18.20160484313965, "global_step": 19853, "epoch": 239} {"train_loss": -18.23240852355957, "global_step": 19854, "epoch": 239} {"train_loss": -18.495878219604492, "global_step": 19855, "epoch": 239} {"train_loss": -17.733341217041016, "global_step": 19856, "epoch": 239} {"train_loss": -18.64986228942871, "global_step": 19857, "epoch": 239} {"train_loss": -17.818614959716797, "global_step": 19858, "epoch": 239} {"train_loss": -18.398595809936523, "global_step": 19859, "epoch": 239} {"train_loss": -18.077590942382812, "global_step": 19860, "epoch": 239} {"train_loss": -17.89067840576172, "global_step": 19861, "epoch": 239} {"train_loss": -18.23140525817871, "global_step": 19862, "epoch": 239} {"train_loss": -18.294193267822266, "global_step": 19863, "epoch": 239} {"train_loss": -18.582910537719727, "global_step": 19864, "epoch": 239} {"train_loss": -18.383453369140625, "global_step": 19865, "epoch": 239} {"train_loss": -18.196870803833008, "global_step": 19866, "epoch": 239} {"train_loss": -18.16804313659668, "global_step": 19867, "epoch": 239} {"train_loss": -17.969797134399414, "global_step": 19868, "epoch": 239} {"train_loss": -18.3814754486084, "global_step": 19869, "epoch": 239} {"train_loss": -18.052236557006836, "global_step": 19870, "epoch": 239} {"train_loss": -18.320005416870117, "global_step": 19871, "epoch": 239} {"train_loss": -18.66535758972168, "global_step": 19872, "epoch": 239} {"train_loss": -18.355077743530273, "global_step": 19873, "epoch": 239} {"train_loss": -18.394224166870117, "global_step": 19874, "epoch": 239} {"train_loss": -18.339170455932617, "global_step": 19875, "epoch": 239} {"train_loss": -18.4792423248291, "global_step": 19876, "epoch": 239} {"train_loss": -18.43677520751953, "global_step": 19877, "epoch": 239} {"train_loss": -18.41543960571289, "global_step": 19878, "epoch": 239} {"train_loss": -18.508079528808594, "global_step": 19879, "epoch": 239} {"train_loss": -18.34175682067871, "global_step": 19880, "epoch": 239} {"train_loss": -18.20953941345215, "global_step": 19881, "epoch": 239} {"train_loss": -18.361331939697266, "global_step": 19882, "epoch": 239} {"train_loss": -18.640424728393555, "global_step": 19883, "epoch": 239} {"train_loss": -18.1334285736084, "global_step": 19884, "epoch": 239} {"train_loss": -18.454225540161133, "global_step": 19885, "epoch": 239} {"train_loss": -18.495086669921875, "global_step": 19886, "epoch": 239} {"train_loss": -18.472238540649414, "global_step": 19887, "epoch": 239} {"train_loss": -18.48422622680664, "global_step": 19888, "epoch": 239} {"train_loss": -18.168476104736328, "global_step": 19889, "epoch": 239} {"train_loss": -18.37405014038086, "global_step": 19890, "epoch": 239} {"train_loss": -18.30524444580078, "global_step": 19891, "epoch": 239} {"train_loss": -18.617765426635742, "global_step": 19892, "epoch": 239} {"train_loss": -18.134492874145508, "global_step": 19893, "epoch": 239} {"train_loss": -18.30133056640625, "global_step": 19894, "epoch": 239} {"train_loss": -18.4616641998291, "global_step": 19895, "epoch": 239} {"train_loss": -18.37343406677246, "global_step": 19896, "epoch": 239} {"train_loss": -18.244359970092773, "global_step": 19897, "epoch": 239} {"train_loss": -18.33633804321289, "global_step": 19898, "epoch": 239} {"train_loss": -18.465116500854492, "global_step": 19899, "epoch": 239} {"train_loss": -18.046016693115234, "global_step": 19900, "epoch": 239} {"train_loss": -18.695926666259766, "global_step": 19901, "epoch": 239} {"train_loss": -18.26362419128418, "global_step": 19902, "epoch": 239} {"train_loss": -18.273393630981445, "global_step": 19903, "epoch": 239} {"train_loss": -18.3082332611084, "global_step": 19904, "epoch": 239} {"train_loss": -18.03997802734375, "global_step": 19905, "epoch": 239} {"train_loss": -18.277814865112305, "global_step": 19906, "epoch": 239} {"train_loss": -18.089508056640625, "global_step": 19907, "epoch": 239} {"train_loss": -18.32828140258789, "global_step": 19908, "epoch": 239} {"train_loss": -18.38801383972168, "global_step": 19909, "epoch": 239} {"train_loss": -18.177793502807617, "global_step": 19910, "epoch": 239} {"train_loss": -18.34394645690918, "global_step": 19911, "epoch": 239} {"train_loss": -18.75467872619629, "global_step": 19912, "epoch": 239} {"train_loss": -18.327749252319336, "global_step": 19913, "epoch": 239} {"train_loss": -18.494495391845703, "global_step": 19914, "epoch": 239} {"train_loss": -18.44403076171875, "global_step": 19915, "epoch": 239} {"train_loss": -18.207773208618164, "global_step": 19916, "epoch": 239} {"train_loss": -18.635459899902344, "global_step": 19917, "epoch": 239} {"train_loss": -18.301610946655273, "global_step": 19918, "epoch": 239} {"train_loss": -18.288104804165393, "global_step": 19919, "epoch": 239, "val_loss": 6038273.5} {"train_loss": -18.42549705505371, "global_step": 19920, "epoch": 240} {"train_loss": -17.911479949951172, "global_step": 19921, "epoch": 240} {"train_loss": -17.763744354248047, "global_step": 19922, "epoch": 240} {"train_loss": -18.162527084350586, "global_step": 19923, "epoch": 240} {"train_loss": -18.412961959838867, "global_step": 19924, "epoch": 240} {"train_loss": -18.21605682373047, "global_step": 19925, "epoch": 240} {"train_loss": -18.333484649658203, "global_step": 19926, "epoch": 240} {"train_loss": -18.142271041870117, "global_step": 19927, "epoch": 240} {"train_loss": -18.053436279296875, "global_step": 19928, "epoch": 240} {"train_loss": -17.87030029296875, "global_step": 19929, "epoch": 240} {"train_loss": -18.460798263549805, "global_step": 19930, "epoch": 240} {"train_loss": -18.59501075744629, "global_step": 19931, "epoch": 240} {"train_loss": -18.133283615112305, "global_step": 19932, "epoch": 240} {"train_loss": -18.394577026367188, "global_step": 19933, "epoch": 240} {"train_loss": -18.100631713867188, "global_step": 19934, "epoch": 240} {"train_loss": -18.43573760986328, "global_step": 19935, "epoch": 240} {"train_loss": -18.41714859008789, "global_step": 19936, "epoch": 240} {"train_loss": -18.211233139038086, "global_step": 19937, "epoch": 240} {"train_loss": -18.47502899169922, "global_step": 19938, "epoch": 240} {"train_loss": -18.32598876953125, "global_step": 19939, "epoch": 240} {"train_loss": -18.147430419921875, "global_step": 19940, "epoch": 240} {"train_loss": -18.66684913635254, "global_step": 19941, "epoch": 240} {"train_loss": -18.43861961364746, "global_step": 19942, "epoch": 240} {"train_loss": -18.636693954467773, "global_step": 19943, "epoch": 240} {"train_loss": -18.445783615112305, "global_step": 19944, "epoch": 240} {"train_loss": -18.248428344726562, "global_step": 19945, "epoch": 240} {"train_loss": -18.548629760742188, "global_step": 19946, "epoch": 240} {"train_loss": -18.38458251953125, "global_step": 19947, "epoch": 240} {"train_loss": -18.15888786315918, "global_step": 19948, "epoch": 240} {"train_loss": -18.337003707885742, "global_step": 19949, "epoch": 240} {"train_loss": -18.229230880737305, "global_step": 19950, "epoch": 240} {"train_loss": -18.149635314941406, "global_step": 19951, "epoch": 240} {"train_loss": -17.95469093322754, "global_step": 19952, "epoch": 240} {"train_loss": -18.65876579284668, "global_step": 19953, "epoch": 240} {"train_loss": -18.453922271728516, "global_step": 19954, "epoch": 240} {"train_loss": -18.3017578125, "global_step": 19955, "epoch": 240} {"train_loss": -18.22760772705078, "global_step": 19956, "epoch": 240} {"train_loss": -18.596885681152344, "global_step": 19957, "epoch": 240} {"train_loss": -18.237470626831055, "global_step": 19958, "epoch": 240} {"train_loss": -18.813404083251953, "global_step": 19959, "epoch": 240} {"train_loss": -18.413297653198242, "global_step": 19960, "epoch": 240} {"train_loss": -18.242464065551758, "global_step": 19961, "epoch": 240} {"train_loss": -18.103689193725586, "global_step": 19962, "epoch": 240} {"train_loss": -18.44598960876465, "global_step": 19963, "epoch": 240} {"train_loss": -18.801694869995117, "global_step": 19964, "epoch": 240} {"train_loss": -18.338857650756836, "global_step": 19965, "epoch": 240} {"train_loss": -18.14385414123535, "global_step": 19966, "epoch": 240} {"train_loss": -18.243375778198242, "global_step": 19967, "epoch": 240} {"train_loss": -18.335580825805664, "global_step": 19968, "epoch": 240} {"train_loss": -18.316974639892578, "global_step": 19969, "epoch": 240} {"train_loss": -18.528844833374023, "global_step": 19970, "epoch": 240} {"train_loss": -18.205265045166016, "global_step": 19971, "epoch": 240} {"train_loss": -18.668302536010742, "global_step": 19972, "epoch": 240} {"train_loss": -18.54884910583496, "global_step": 19973, "epoch": 240} {"train_loss": -18.780784606933594, "global_step": 19974, "epoch": 240} {"train_loss": -18.628759384155273, "global_step": 19975, "epoch": 240} {"train_loss": -18.290624618530273, "global_step": 19976, "epoch": 240} {"train_loss": -18.192218780517578, "global_step": 19977, "epoch": 240} {"train_loss": -18.368431091308594, "global_step": 19978, "epoch": 240} {"train_loss": -18.15702247619629, "global_step": 19979, "epoch": 240} {"train_loss": -18.725078582763672, "global_step": 19980, "epoch": 240} {"train_loss": -18.293760299682617, "global_step": 19981, "epoch": 240} {"train_loss": -18.50669288635254, "global_step": 19982, "epoch": 240} {"train_loss": -18.88704490661621, "global_step": 19983, "epoch": 240} {"train_loss": -18.343950271606445, "global_step": 19984, "epoch": 240} {"train_loss": -18.0722599029541, "global_step": 19985, "epoch": 240} {"train_loss": -18.703840255737305, "global_step": 19986, "epoch": 240} {"train_loss": -18.14777183532715, "global_step": 19987, "epoch": 240} {"train_loss": -18.246408462524414, "global_step": 19988, "epoch": 240} {"train_loss": -18.72397232055664, "global_step": 19989, "epoch": 240} {"train_loss": -18.839136123657227, "global_step": 19990, "epoch": 240} {"train_loss": -18.21858787536621, "global_step": 19991, "epoch": 240} {"train_loss": -18.439071655273438, "global_step": 19992, "epoch": 240} {"train_loss": -18.212194442749023, "global_step": 19993, "epoch": 240} {"train_loss": -18.186626434326172, "global_step": 19994, "epoch": 240} {"train_loss": -18.2016658782959, "global_step": 19995, "epoch": 240} {"train_loss": -18.589391708374023, "global_step": 19996, "epoch": 240} {"train_loss": -17.727996826171875, "global_step": 19997, "epoch": 240} {"train_loss": -18.358774185180664, "global_step": 19998, "epoch": 240} {"train_loss": -18.56178855895996, "global_step": 19999, "epoch": 240} {"train_loss": -18.36812973022461, "global_step": 20000, "epoch": 240} {"train_loss": -18.331796646118164, "global_step": 20001, "epoch": 240} {"train_loss": -18.352976235998682, "global_step": 20002, "epoch": 240, "val_loss": 6006009.0} {"train_loss": -18.578109741210938, "global_step": 20003, "epoch": 241} {"train_loss": -18.408084869384766, "global_step": 20004, "epoch": 241} {"train_loss": -18.51844596862793, "global_step": 20005, "epoch": 241} {"train_loss": -18.46674156188965, "global_step": 20006, "epoch": 241} {"train_loss": -18.261211395263672, "global_step": 20007, "epoch": 241} {"train_loss": -18.25799560546875, "global_step": 20008, "epoch": 241} {"train_loss": -18.505212783813477, "global_step": 20009, "epoch": 241} {"train_loss": -18.513994216918945, "global_step": 20010, "epoch": 241} {"train_loss": -18.28983497619629, "global_step": 20011, "epoch": 241} {"train_loss": -18.479801177978516, "global_step": 20012, "epoch": 241} {"train_loss": -18.791091918945312, "global_step": 20013, "epoch": 241} {"train_loss": -18.50609588623047, "global_step": 20014, "epoch": 241} {"train_loss": -18.25221061706543, "global_step": 20015, "epoch": 241} {"train_loss": -18.31597137451172, "global_step": 20016, "epoch": 241} {"train_loss": -18.074485778808594, "global_step": 20017, "epoch": 241} {"train_loss": -18.442764282226562, "global_step": 20018, "epoch": 241} {"train_loss": -18.286832809448242, "global_step": 20019, "epoch": 241} {"train_loss": -18.45973014831543, "global_step": 20020, "epoch": 241} {"train_loss": -18.50226402282715, "global_step": 20021, "epoch": 241} {"train_loss": -18.446319580078125, "global_step": 20022, "epoch": 241} {"train_loss": -18.64158058166504, "global_step": 20023, "epoch": 241} {"train_loss": -18.69746208190918, "global_step": 20024, "epoch": 241} {"train_loss": -18.600740432739258, "global_step": 20025, "epoch": 241} {"train_loss": -18.29549217224121, "global_step": 20026, "epoch": 241} {"train_loss": -18.72743034362793, "global_step": 20027, "epoch": 241} {"train_loss": -18.15766716003418, "global_step": 20028, "epoch": 241} {"train_loss": -18.21632194519043, "global_step": 20029, "epoch": 241} {"train_loss": -18.351720809936523, "global_step": 20030, "epoch": 241} {"train_loss": -18.37343406677246, "global_step": 20031, "epoch": 241} {"train_loss": -18.44093894958496, "global_step": 20032, "epoch": 241} {"train_loss": -18.56157875061035, "global_step": 20033, "epoch": 241} {"train_loss": -18.476884841918945, "global_step": 20034, "epoch": 241} {"train_loss": -17.972209930419922, "global_step": 20035, "epoch": 241} {"train_loss": -18.41520118713379, "global_step": 20036, "epoch": 241} {"train_loss": -18.16094398498535, "global_step": 20037, "epoch": 241} {"train_loss": -18.11225128173828, "global_step": 20038, "epoch": 241} {"train_loss": -18.260629653930664, "global_step": 20039, "epoch": 241} {"train_loss": -18.127290725708008, "global_step": 20040, "epoch": 241} {"train_loss": -18.344858169555664, "global_step": 20041, "epoch": 241} {"train_loss": -18.35897445678711, "global_step": 20042, "epoch": 241} {"train_loss": -18.184993743896484, "global_step": 20043, "epoch": 241} {"train_loss": -18.54648780822754, "global_step": 20044, "epoch": 241} {"train_loss": -18.81121826171875, "global_step": 20045, "epoch": 241} {"train_loss": -18.446714401245117, "global_step": 20046, "epoch": 241} {"train_loss": -18.404434204101562, "global_step": 20047, "epoch": 241} {"train_loss": -17.935306549072266, "global_step": 20048, "epoch": 241} {"train_loss": -18.015613555908203, "global_step": 20049, "epoch": 241} {"train_loss": -17.894750595092773, "global_step": 20050, "epoch": 241} {"train_loss": -18.69977378845215, "global_step": 20051, "epoch": 241} {"train_loss": -17.93646812438965, "global_step": 20052, "epoch": 241} {"train_loss": -18.25434112548828, "global_step": 20053, "epoch": 241} {"train_loss": -18.773080825805664, "global_step": 20054, "epoch": 241} {"train_loss": -18.29413414001465, "global_step": 20055, "epoch": 241} {"train_loss": -18.733434677124023, "global_step": 20056, "epoch": 241} {"train_loss": -18.551542282104492, "global_step": 20057, "epoch": 241} {"train_loss": -18.13587760925293, "global_step": 20058, "epoch": 241} {"train_loss": -18.240528106689453, "global_step": 20059, "epoch": 241} {"train_loss": -18.103519439697266, "global_step": 20060, "epoch": 241} {"train_loss": -18.15230369567871, "global_step": 20061, "epoch": 241} {"train_loss": -18.30008888244629, "global_step": 20062, "epoch": 241} {"train_loss": -18.2427921295166, "global_step": 20063, "epoch": 241} {"train_loss": -18.383508682250977, "global_step": 20064, "epoch": 241} {"train_loss": -18.247230529785156, "global_step": 20065, "epoch": 241} {"train_loss": -18.367115020751953, "global_step": 20066, "epoch": 241} {"train_loss": -18.403635025024414, "global_step": 20067, "epoch": 241} {"train_loss": -18.559707641601562, "global_step": 20068, "epoch": 241} {"train_loss": -18.648517608642578, "global_step": 20069, "epoch": 241} {"train_loss": -18.305089950561523, "global_step": 20070, "epoch": 241} {"train_loss": -18.124286651611328, "global_step": 20071, "epoch": 241} {"train_loss": -18.09382438659668, "global_step": 20072, "epoch": 241} {"train_loss": -18.09910011291504, "global_step": 20073, "epoch": 241} {"train_loss": -18.527509689331055, "global_step": 20074, "epoch": 241} {"train_loss": -18.334951400756836, "global_step": 20075, "epoch": 241} {"train_loss": -18.439123153686523, "global_step": 20076, "epoch": 241} {"train_loss": -18.23623275756836, "global_step": 20077, "epoch": 241} {"train_loss": -18.381072998046875, "global_step": 20078, "epoch": 241} {"train_loss": -18.351301193237305, "global_step": 20079, "epoch": 241} {"train_loss": -18.376760482788086, "global_step": 20080, "epoch": 241} {"train_loss": -18.602487564086914, "global_step": 20081, "epoch": 241} {"train_loss": -18.279186248779297, "global_step": 20082, "epoch": 241} {"train_loss": -18.189077377319336, "global_step": 20083, "epoch": 241} {"train_loss": -18.225767135620117, "global_step": 20084, "epoch": 241} {"train_loss": -18.358029836631683, "global_step": 20085, "epoch": 241, "val_loss": 5931654.0} {"train_loss": -17.99847984313965, "global_step": 20086, "epoch": 242} {"train_loss": -18.426908493041992, "global_step": 20087, "epoch": 242} {"train_loss": -18.283323287963867, "global_step": 20088, "epoch": 242} {"train_loss": -18.59700584411621, "global_step": 20089, "epoch": 242} {"train_loss": -18.050657272338867, "global_step": 20090, "epoch": 242} {"train_loss": -18.628942489624023, "global_step": 20091, "epoch": 242} {"train_loss": -18.558914184570312, "global_step": 20092, "epoch": 242} {"train_loss": -18.30713653564453, "global_step": 20093, "epoch": 242} {"train_loss": -18.006132125854492, "global_step": 20094, "epoch": 242} {"train_loss": -18.763105392456055, "global_step": 20095, "epoch": 242} {"train_loss": -18.324647903442383, "global_step": 20096, "epoch": 242} {"train_loss": -18.52610206604004, "global_step": 20097, "epoch": 242} {"train_loss": -18.48982048034668, "global_step": 20098, "epoch": 242} {"train_loss": -18.585418701171875, "global_step": 20099, "epoch": 242} {"train_loss": -18.177845001220703, "global_step": 20100, "epoch": 242} {"train_loss": -18.49690818786621, "global_step": 20101, "epoch": 242} {"train_loss": -18.165708541870117, "global_step": 20102, "epoch": 242} {"train_loss": -18.78759765625, "global_step": 20103, "epoch": 242} {"train_loss": -18.37090492248535, "global_step": 20104, "epoch": 242} {"train_loss": -18.266382217407227, "global_step": 20105, "epoch": 242} {"train_loss": -18.26565933227539, "global_step": 20106, "epoch": 242} {"train_loss": -18.47964859008789, "global_step": 20107, "epoch": 242} {"train_loss": -18.304983139038086, "global_step": 20108, "epoch": 242} {"train_loss": -18.42972755432129, "global_step": 20109, "epoch": 242} {"train_loss": -18.500341415405273, "global_step": 20110, "epoch": 242} {"train_loss": -18.375078201293945, "global_step": 20111, "epoch": 242} {"train_loss": -18.291353225708008, "global_step": 20112, "epoch": 242} {"train_loss": -18.168922424316406, "global_step": 20113, "epoch": 242} {"train_loss": -18.387475967407227, "global_step": 20114, "epoch": 242} {"train_loss": -18.573068618774414, "global_step": 20115, "epoch": 242} {"train_loss": -18.557424545288086, "global_step": 20116, "epoch": 242} {"train_loss": -18.734973907470703, "global_step": 20117, "epoch": 242} {"train_loss": -18.427734375, "global_step": 20118, "epoch": 242} {"train_loss": -18.023147583007812, "global_step": 20119, "epoch": 242} {"train_loss": -18.369916915893555, "global_step": 20120, "epoch": 242} {"train_loss": -18.04487419128418, "global_step": 20121, "epoch": 242} {"train_loss": -18.61123275756836, "global_step": 20122, "epoch": 242} {"train_loss": -18.501447677612305, "global_step": 20123, "epoch": 242} {"train_loss": -17.93973159790039, "global_step": 20124, "epoch": 242} {"train_loss": -18.62604331970215, "global_step": 20125, "epoch": 242} {"train_loss": -18.30754852294922, "global_step": 20126, "epoch": 242} {"train_loss": -18.397674560546875, "global_step": 20127, "epoch": 242} {"train_loss": -18.185392379760742, "global_step": 20128, "epoch": 242} {"train_loss": -18.30086326599121, "global_step": 20129, "epoch": 242} {"train_loss": -18.338376998901367, "global_step": 20130, "epoch": 242} {"train_loss": -18.430103302001953, "global_step": 20131, "epoch": 242} {"train_loss": -17.888212203979492, "global_step": 20132, "epoch": 242} {"train_loss": -18.385679244995117, "global_step": 20133, "epoch": 242} {"train_loss": -18.196313858032227, "global_step": 20134, "epoch": 242} {"train_loss": -18.291738510131836, "global_step": 20135, "epoch": 242} {"train_loss": -18.280324935913086, "global_step": 20136, "epoch": 242} {"train_loss": -18.045520782470703, "global_step": 20137, "epoch": 242} {"train_loss": -18.160442352294922, "global_step": 20138, "epoch": 242} {"train_loss": -18.310871124267578, "global_step": 20139, "epoch": 242} {"train_loss": -18.280893325805664, "global_step": 20140, "epoch": 242} {"train_loss": -18.389240264892578, "global_step": 20141, "epoch": 242} {"train_loss": -18.072097778320312, "global_step": 20142, "epoch": 242} {"train_loss": -18.412755966186523, "global_step": 20143, "epoch": 242} {"train_loss": -18.485227584838867, "global_step": 20144, "epoch": 242} {"train_loss": -18.389692306518555, "global_step": 20145, "epoch": 242} {"train_loss": -18.152650833129883, "global_step": 20146, "epoch": 242} {"train_loss": -18.52794075012207, "global_step": 20147, "epoch": 242} {"train_loss": -18.38715934753418, "global_step": 20148, "epoch": 242} {"train_loss": -18.247283935546875, "global_step": 20149, "epoch": 242} {"train_loss": -18.50614356994629, "global_step": 20150, "epoch": 242} {"train_loss": -18.154544830322266, "global_step": 20151, "epoch": 242} {"train_loss": -18.038721084594727, "global_step": 20152, "epoch": 242} {"train_loss": -18.061992645263672, "global_step": 20153, "epoch": 242} {"train_loss": -18.398273468017578, "global_step": 20154, "epoch": 242} {"train_loss": -18.36110496520996, "global_step": 20155, "epoch": 242} {"train_loss": -18.52503776550293, "global_step": 20156, "epoch": 242} {"train_loss": -18.65682029724121, "global_step": 20157, "epoch": 242} {"train_loss": -18.68438720703125, "global_step": 20158, "epoch": 242} {"train_loss": -18.285608291625977, "global_step": 20159, "epoch": 242} {"train_loss": -18.432191848754883, "global_step": 20160, "epoch": 242} {"train_loss": -18.761463165283203, "global_step": 20161, "epoch": 242} {"train_loss": -18.44685935974121, "global_step": 20162, "epoch": 242} {"train_loss": -18.136661529541016, "global_step": 20163, "epoch": 242} {"train_loss": -18.456022262573242, "global_step": 20164, "epoch": 242} {"train_loss": -18.05870246887207, "global_step": 20165, "epoch": 242} {"train_loss": -18.057161331176758, "global_step": 20166, "epoch": 242} {"train_loss": -18.275415420532227, "global_step": 20167, "epoch": 242} {"train_loss": -18.34088422016925, "global_step": 20168, "epoch": 242, "val_loss": 6011983.0} {"train_loss": -17.901161193847656, "global_step": 20169, "epoch": 243} {"train_loss": -18.13283920288086, "global_step": 20170, "epoch": 243} {"train_loss": -18.10185432434082, "global_step": 20171, "epoch": 243} {"train_loss": -17.78293800354004, "global_step": 20172, "epoch": 243} {"train_loss": -18.815828323364258, "global_step": 20173, "epoch": 243} {"train_loss": -18.316242218017578, "global_step": 20174, "epoch": 243} {"train_loss": -17.781307220458984, "global_step": 20175, "epoch": 243} {"train_loss": -18.746662139892578, "global_step": 20176, "epoch": 243} {"train_loss": -18.526912689208984, "global_step": 20177, "epoch": 243} {"train_loss": -18.09852409362793, "global_step": 20178, "epoch": 243} {"train_loss": -18.380037307739258, "global_step": 20179, "epoch": 243} {"train_loss": -18.248544692993164, "global_step": 20180, "epoch": 243} {"train_loss": -18.025693893432617, "global_step": 20181, "epoch": 243} {"train_loss": -18.389892578125, "global_step": 20182, "epoch": 243} {"train_loss": -18.19873046875, "global_step": 20183, "epoch": 243} {"train_loss": -18.19854736328125, "global_step": 20184, "epoch": 243} {"train_loss": -18.60120964050293, "global_step": 20185, "epoch": 243} {"train_loss": -18.296815872192383, "global_step": 20186, "epoch": 243} {"train_loss": -18.672727584838867, "global_step": 20187, "epoch": 243} {"train_loss": -18.296239852905273, "global_step": 20188, "epoch": 243} {"train_loss": -18.21002769470215, "global_step": 20189, "epoch": 243} {"train_loss": -18.567495346069336, "global_step": 20190, "epoch": 243} {"train_loss": -18.602834701538086, "global_step": 20191, "epoch": 243} {"train_loss": -18.12143898010254, "global_step": 20192, "epoch": 243} {"train_loss": -18.66645622253418, "global_step": 20193, "epoch": 243} {"train_loss": -18.130844116210938, "global_step": 20194, "epoch": 243} {"train_loss": -18.57261085510254, "global_step": 20195, "epoch": 243} {"train_loss": -18.31085968017578, "global_step": 20196, "epoch": 243} {"train_loss": -18.03395652770996, "global_step": 20197, "epoch": 243} {"train_loss": -18.426420211791992, "global_step": 20198, "epoch": 243} {"train_loss": -18.41123390197754, "global_step": 20199, "epoch": 243} {"train_loss": -18.463117599487305, "global_step": 20200, "epoch": 243} {"train_loss": -18.6170711517334, "global_step": 20201, "epoch": 243} {"train_loss": -18.139577865600586, "global_step": 20202, "epoch": 243} {"train_loss": -17.84735679626465, "global_step": 20203, "epoch": 243} {"train_loss": -18.109891891479492, "global_step": 20204, "epoch": 243} {"train_loss": -18.61615562438965, "global_step": 20205, "epoch": 243} {"train_loss": -17.98244857788086, "global_step": 20206, "epoch": 243} {"train_loss": -18.584476470947266, "global_step": 20207, "epoch": 243} {"train_loss": -18.516387939453125, "global_step": 20208, "epoch": 243} {"train_loss": -18.59969139099121, "global_step": 20209, "epoch": 243} {"train_loss": -18.33610725402832, "global_step": 20210, "epoch": 243} {"train_loss": -17.801862716674805, "global_step": 20211, "epoch": 243} {"train_loss": -18.453134536743164, "global_step": 20212, "epoch": 243} {"train_loss": -18.095829010009766, "global_step": 20213, "epoch": 243} {"train_loss": -18.38584327697754, "global_step": 20214, "epoch": 243} {"train_loss": -18.16349220275879, "global_step": 20215, "epoch": 243} {"train_loss": -18.586772918701172, "global_step": 20216, "epoch": 243} {"train_loss": -18.31625747680664, "global_step": 20217, "epoch": 243} {"train_loss": -18.46468162536621, "global_step": 20218, "epoch": 243} {"train_loss": -18.52541160583496, "global_step": 20219, "epoch": 243} {"train_loss": -18.469497680664062, "global_step": 20220, "epoch": 243} {"train_loss": -18.76759147644043, "global_step": 20221, "epoch": 243} {"train_loss": -18.281299591064453, "global_step": 20222, "epoch": 243} {"train_loss": -18.55175018310547, "global_step": 20223, "epoch": 243} {"train_loss": -18.40107536315918, "global_step": 20224, "epoch": 243} {"train_loss": -18.2674617767334, "global_step": 20225, "epoch": 243} {"train_loss": -17.9189453125, "global_step": 20226, "epoch": 243} {"train_loss": -18.235210418701172, "global_step": 20227, "epoch": 243} {"train_loss": -18.527616500854492, "global_step": 20228, "epoch": 243} {"train_loss": -18.4271297454834, "global_step": 20229, "epoch": 243} {"train_loss": -18.256845474243164, "global_step": 20230, "epoch": 243} {"train_loss": -18.39031219482422, "global_step": 20231, "epoch": 243} {"train_loss": -18.309127807617188, "global_step": 20232, "epoch": 243} {"train_loss": -18.317123413085938, "global_step": 20233, "epoch": 243} {"train_loss": -17.933334350585938, "global_step": 20234, "epoch": 243} {"train_loss": -18.33290672302246, "global_step": 20235, "epoch": 243} {"train_loss": -18.46392250061035, "global_step": 20236, "epoch": 243} {"train_loss": -18.496511459350586, "global_step": 20237, "epoch": 243} {"train_loss": -18.37140464782715, "global_step": 20238, "epoch": 243} {"train_loss": -18.601333618164062, "global_step": 20239, "epoch": 243} {"train_loss": -18.62774085998535, "global_step": 20240, "epoch": 243} {"train_loss": -18.729549407958984, "global_step": 20241, "epoch": 243} {"train_loss": -18.608488082885742, "global_step": 20242, "epoch": 243} {"train_loss": -18.552488327026367, "global_step": 20243, "epoch": 243} {"train_loss": -18.446239471435547, "global_step": 20244, "epoch": 243} {"train_loss": -18.425453186035156, "global_step": 20245, "epoch": 243} {"train_loss": -18.32697868347168, "global_step": 20246, "epoch": 243} {"train_loss": -18.41472053527832, "global_step": 20247, "epoch": 243} {"train_loss": -18.5357723236084, "global_step": 20248, "epoch": 243} {"train_loss": -18.129358291625977, "global_step": 20249, "epoch": 243} {"train_loss": -18.732664108276367, "global_step": 20250, "epoch": 243} {"train_loss": -18.333548672227973, "global_step": 20251, "epoch": 243, "val_loss": 5956702.5} {"train_loss": -18.258869171142578, "global_step": 20252, "epoch": 244} {"train_loss": -17.905685424804688, "global_step": 20253, "epoch": 244} {"train_loss": -18.201215744018555, "global_step": 20254, "epoch": 244} {"train_loss": -18.25062370300293, "global_step": 20255, "epoch": 244} {"train_loss": -18.37708854675293, "global_step": 20256, "epoch": 244} {"train_loss": -18.155954360961914, "global_step": 20257, "epoch": 244} {"train_loss": -18.373050689697266, "global_step": 20258, "epoch": 244} {"train_loss": -18.326169967651367, "global_step": 20259, "epoch": 244} {"train_loss": -18.36900520324707, "global_step": 20260, "epoch": 244} {"train_loss": -18.57309341430664, "global_step": 20261, "epoch": 244} {"train_loss": -18.51481819152832, "global_step": 20262, "epoch": 244} {"train_loss": -18.580951690673828, "global_step": 20263, "epoch": 244} {"train_loss": -18.12881851196289, "global_step": 20264, "epoch": 244} {"train_loss": -18.433835983276367, "global_step": 20265, "epoch": 244} {"train_loss": -18.524568557739258, "global_step": 20266, "epoch": 244} {"train_loss": -18.222139358520508, "global_step": 20267, "epoch": 244} {"train_loss": -18.03645896911621, "global_step": 20268, "epoch": 244} {"train_loss": -18.736413955688477, "global_step": 20269, "epoch": 244} {"train_loss": -18.496549606323242, "global_step": 20270, "epoch": 244} {"train_loss": -18.36020851135254, "global_step": 20271, "epoch": 244} {"train_loss": -18.12803840637207, "global_step": 20272, "epoch": 244} {"train_loss": -18.28285789489746, "global_step": 20273, "epoch": 244} {"train_loss": -18.53580093383789, "global_step": 20274, "epoch": 244} {"train_loss": -18.047048568725586, "global_step": 20275, "epoch": 244} {"train_loss": -18.282865524291992, "global_step": 20276, "epoch": 244} {"train_loss": -18.17816162109375, "global_step": 20277, "epoch": 244} {"train_loss": -18.442846298217773, "global_step": 20278, "epoch": 244} {"train_loss": -18.305646896362305, "global_step": 20279, "epoch": 244} {"train_loss": -18.5393009185791, "global_step": 20280, "epoch": 244} {"train_loss": -18.261159896850586, "global_step": 20281, "epoch": 244} {"train_loss": -18.591806411743164, "global_step": 20282, "epoch": 244} {"train_loss": -18.29628562927246, "global_step": 20283, "epoch": 244} {"train_loss": -18.45682144165039, "global_step": 20284, "epoch": 244} {"train_loss": -18.467267990112305, "global_step": 20285, "epoch": 244} {"train_loss": -18.453954696655273, "global_step": 20286, "epoch": 244} {"train_loss": -18.16351890563965, "global_step": 20287, "epoch": 244} {"train_loss": -18.313739776611328, "global_step": 20288, "epoch": 244} {"train_loss": -18.270580291748047, "global_step": 20289, "epoch": 244} {"train_loss": -18.353981018066406, "global_step": 20290, "epoch": 244} {"train_loss": -18.649999618530273, "global_step": 20291, "epoch": 244} {"train_loss": -18.340717315673828, "global_step": 20292, "epoch": 244} {"train_loss": -18.31934928894043, "global_step": 20293, "epoch": 244} {"train_loss": -18.64077377319336, "global_step": 20294, "epoch": 244} {"train_loss": -18.20170021057129, "global_step": 20295, "epoch": 244} {"train_loss": -18.32413101196289, "global_step": 20296, "epoch": 244} {"train_loss": -17.920625686645508, "global_step": 20297, "epoch": 244} {"train_loss": -18.536991119384766, "global_step": 20298, "epoch": 244} {"train_loss": -18.48988914489746, "global_step": 20299, "epoch": 244} {"train_loss": -18.398242950439453, "global_step": 20300, "epoch": 244} {"train_loss": -18.484161376953125, "global_step": 20301, "epoch": 244} {"train_loss": -18.552045822143555, "global_step": 20302, "epoch": 244} {"train_loss": -18.366567611694336, "global_step": 20303, "epoch": 244} {"train_loss": -18.56395721435547, "global_step": 20304, "epoch": 244} {"train_loss": -18.835586547851562, "global_step": 20305, "epoch": 244} {"train_loss": -18.279748916625977, "global_step": 20306, "epoch": 244} {"train_loss": -18.566680908203125, "global_step": 20307, "epoch": 244} {"train_loss": -18.25686264038086, "global_step": 20308, "epoch": 244} {"train_loss": -18.433862686157227, "global_step": 20309, "epoch": 244} {"train_loss": -18.380157470703125, "global_step": 20310, "epoch": 244} {"train_loss": -18.33147430419922, "global_step": 20311, "epoch": 244} {"train_loss": -18.460813522338867, "global_step": 20312, "epoch": 244} {"train_loss": -18.4032039642334, "global_step": 20313, "epoch": 244} {"train_loss": -18.374027252197266, "global_step": 20314, "epoch": 244} {"train_loss": -18.34962272644043, "global_step": 20315, "epoch": 244} {"train_loss": -18.382661819458008, "global_step": 20316, "epoch": 244} {"train_loss": -18.3868350982666, "global_step": 20317, "epoch": 244} {"train_loss": -18.429269790649414, "global_step": 20318, "epoch": 244} {"train_loss": -18.492828369140625, "global_step": 20319, "epoch": 244} {"train_loss": -18.648109436035156, "global_step": 20320, "epoch": 244} {"train_loss": -18.721708297729492, "global_step": 20321, "epoch": 244} {"train_loss": -18.047800064086914, "global_step": 20322, "epoch": 244} {"train_loss": -18.495689392089844, "global_step": 20323, "epoch": 244} {"train_loss": -18.32420539855957, "global_step": 20324, "epoch": 244} {"train_loss": -18.25911521911621, "global_step": 20325, "epoch": 244} {"train_loss": -18.3696346282959, "global_step": 20326, "epoch": 244} {"train_loss": -18.64150047302246, "global_step": 20327, "epoch": 244} {"train_loss": -18.389432907104492, "global_step": 20328, "epoch": 244} {"train_loss": -18.46824073791504, "global_step": 20329, "epoch": 244} {"train_loss": -18.194168090820312, "global_step": 20330, "epoch": 244} {"train_loss": -18.42603874206543, "global_step": 20331, "epoch": 244} {"train_loss": -18.274032592773438, "global_step": 20332, "epoch": 244} {"train_loss": -18.48164176940918, "global_step": 20333, "epoch": 244} {"train_loss": -18.392448861914946, "global_step": 20334, "epoch": 244, "val_loss": 6132379.5} {"train_loss": -18.45436668395996, "global_step": 20335, "epoch": 245} {"train_loss": -18.110803604125977, "global_step": 20336, "epoch": 245} {"train_loss": -18.23949432373047, "global_step": 20337, "epoch": 245} {"train_loss": -18.434452056884766, "global_step": 20338, "epoch": 245} {"train_loss": -18.182510375976562, "global_step": 20339, "epoch": 245} {"train_loss": -18.457317352294922, "global_step": 20340, "epoch": 245} {"train_loss": -18.405229568481445, "global_step": 20341, "epoch": 245} {"train_loss": -18.341970443725586, "global_step": 20342, "epoch": 245} {"train_loss": -18.27696418762207, "global_step": 20343, "epoch": 245} {"train_loss": -18.09821128845215, "global_step": 20344, "epoch": 245} {"train_loss": -18.188642501831055, "global_step": 20345, "epoch": 245} {"train_loss": -18.131122589111328, "global_step": 20346, "epoch": 245} {"train_loss": -18.294824600219727, "global_step": 20347, "epoch": 245} {"train_loss": -18.51834487915039, "global_step": 20348, "epoch": 245} {"train_loss": -17.937042236328125, "global_step": 20349, "epoch": 245} {"train_loss": -18.344253540039062, "global_step": 20350, "epoch": 245} {"train_loss": -18.15749740600586, "global_step": 20351, "epoch": 245} {"train_loss": -18.44736671447754, "global_step": 20352, "epoch": 245} {"train_loss": -18.552932739257812, "global_step": 20353, "epoch": 245} {"train_loss": -18.383337020874023, "global_step": 20354, "epoch": 245} {"train_loss": -18.14171600341797, "global_step": 20355, "epoch": 245} {"train_loss": -18.368743896484375, "global_step": 20356, "epoch": 245} {"train_loss": -18.317399978637695, "global_step": 20357, "epoch": 245} {"train_loss": -18.345388412475586, "global_step": 20358, "epoch": 245} {"train_loss": -18.426130294799805, "global_step": 20359, "epoch": 245} {"train_loss": -18.3040828704834, "global_step": 20360, "epoch": 245} {"train_loss": -18.299482345581055, "global_step": 20361, "epoch": 245} {"train_loss": -18.439208984375, "global_step": 20362, "epoch": 245} {"train_loss": -18.333724975585938, "global_step": 20363, "epoch": 245} {"train_loss": -18.659299850463867, "global_step": 20364, "epoch": 245} {"train_loss": -17.999584197998047, "global_step": 20365, "epoch": 245} {"train_loss": -18.780982971191406, "global_step": 20366, "epoch": 245} {"train_loss": -18.231008529663086, "global_step": 20367, "epoch": 245} {"train_loss": -18.0950870513916, "global_step": 20368, "epoch": 245} {"train_loss": -18.572978973388672, "global_step": 20369, "epoch": 245} {"train_loss": -18.268735885620117, "global_step": 20370, "epoch": 245} {"train_loss": -18.898426055908203, "global_step": 20371, "epoch": 245} {"train_loss": -18.179792404174805, "global_step": 20372, "epoch": 245} {"train_loss": -18.653127670288086, "global_step": 20373, "epoch": 245} {"train_loss": -18.459671020507812, "global_step": 20374, "epoch": 245} {"train_loss": -18.391145706176758, "global_step": 20375, "epoch": 245} {"train_loss": -18.056854248046875, "global_step": 20376, "epoch": 245} {"train_loss": -18.496137619018555, "global_step": 20377, "epoch": 245} {"train_loss": -18.585023880004883, "global_step": 20378, "epoch": 245} {"train_loss": -18.4200382232666, "global_step": 20379, "epoch": 245} {"train_loss": -18.272216796875, "global_step": 20380, "epoch": 245} {"train_loss": -18.524059295654297, "global_step": 20381, "epoch": 245} {"train_loss": -18.240482330322266, "global_step": 20382, "epoch": 245} {"train_loss": -18.514419555664062, "global_step": 20383, "epoch": 245} {"train_loss": -18.50760269165039, "global_step": 20384, "epoch": 245} {"train_loss": -18.390045166015625, "global_step": 20385, "epoch": 245} {"train_loss": -18.70267105102539, "global_step": 20386, "epoch": 245} {"train_loss": -18.51252555847168, "global_step": 20387, "epoch": 245} {"train_loss": -18.430362701416016, "global_step": 20388, "epoch": 245} {"train_loss": -18.566043853759766, "global_step": 20389, "epoch": 245} {"train_loss": -18.681522369384766, "global_step": 20390, "epoch": 245} {"train_loss": -18.139585494995117, "global_step": 20391, "epoch": 245} {"train_loss": -18.353181838989258, "global_step": 20392, "epoch": 245} {"train_loss": -18.422351837158203, "global_step": 20393, "epoch": 245} {"train_loss": -18.256345748901367, "global_step": 20394, "epoch": 245} {"train_loss": -18.391399383544922, "global_step": 20395, "epoch": 245} {"train_loss": -18.757335662841797, "global_step": 20396, "epoch": 245} {"train_loss": -18.244115829467773, "global_step": 20397, "epoch": 245} {"train_loss": -18.48943519592285, "global_step": 20398, "epoch": 245} {"train_loss": -18.193429946899414, "global_step": 20399, "epoch": 245} {"train_loss": -18.64519691467285, "global_step": 20400, "epoch": 245} {"train_loss": -18.35182762145996, "global_step": 20401, "epoch": 245} {"train_loss": -18.303625106811523, "global_step": 20402, "epoch": 245} {"train_loss": -18.88124656677246, "global_step": 20403, "epoch": 245} {"train_loss": -17.836233139038086, "global_step": 20404, "epoch": 245} {"train_loss": -18.18305015563965, "global_step": 20405, "epoch": 245} {"train_loss": -18.353256225585938, "global_step": 20406, "epoch": 245} {"train_loss": -18.47723388671875, "global_step": 20407, "epoch": 245} {"train_loss": -18.1826171875, "global_step": 20408, "epoch": 245} {"train_loss": -18.601415634155273, "global_step": 20409, "epoch": 245} {"train_loss": -17.9887752532959, "global_step": 20410, "epoch": 245} {"train_loss": -18.146873474121094, "global_step": 20411, "epoch": 245} {"train_loss": -18.392362594604492, "global_step": 20412, "epoch": 245} {"train_loss": -18.469552993774414, "global_step": 20413, "epoch": 245} {"train_loss": -18.257020950317383, "global_step": 20414, "epoch": 245} {"train_loss": -18.70414924621582, "global_step": 20415, "epoch": 245} {"train_loss": -18.56941795349121, "global_step": 20416, "epoch": 245} {"train_loss": -18.377529948590748, "global_step": 20417, "epoch": 245, "val_loss": 6155642.5} {"train_loss": -18.04823875427246, "global_step": 20418, "epoch": 246} {"train_loss": -17.85292625427246, "global_step": 20419, "epoch": 246} {"train_loss": -18.3342342376709, "global_step": 20420, "epoch": 246} {"train_loss": -17.93344497680664, "global_step": 20421, "epoch": 246} {"train_loss": -18.064306259155273, "global_step": 20422, "epoch": 246} {"train_loss": -17.9899845123291, "global_step": 20423, "epoch": 246} {"train_loss": -18.193742752075195, "global_step": 20424, "epoch": 246} {"train_loss": -18.42719078063965, "global_step": 20425, "epoch": 246} {"train_loss": -18.088558197021484, "global_step": 20426, "epoch": 246} {"train_loss": -18.094318389892578, "global_step": 20427, "epoch": 246} {"train_loss": -17.968538284301758, "global_step": 20428, "epoch": 246} {"train_loss": -18.621551513671875, "global_step": 20429, "epoch": 246} {"train_loss": -17.956632614135742, "global_step": 20430, "epoch": 246} {"train_loss": -18.091928482055664, "global_step": 20431, "epoch": 246} {"train_loss": -18.46759796142578, "global_step": 20432, "epoch": 246} {"train_loss": -18.273605346679688, "global_step": 20433, "epoch": 246} {"train_loss": -18.07485008239746, "global_step": 20434, "epoch": 246} {"train_loss": -18.426809310913086, "global_step": 20435, "epoch": 246} {"train_loss": -18.133451461791992, "global_step": 20436, "epoch": 246} {"train_loss": -18.39984703063965, "global_step": 20437, "epoch": 246} {"train_loss": -18.519437789916992, "global_step": 20438, "epoch": 246} {"train_loss": -18.490427017211914, "global_step": 20439, "epoch": 246} {"train_loss": -18.34450912475586, "global_step": 20440, "epoch": 246} {"train_loss": -18.367406845092773, "global_step": 20441, "epoch": 246} {"train_loss": -18.304075241088867, "global_step": 20442, "epoch": 246} {"train_loss": -18.229572296142578, "global_step": 20443, "epoch": 246} {"train_loss": -18.667264938354492, "global_step": 20444, "epoch": 246} {"train_loss": -18.23026466369629, "global_step": 20445, "epoch": 246} {"train_loss": -18.369535446166992, "global_step": 20446, "epoch": 246} {"train_loss": -17.949831008911133, "global_step": 20447, "epoch": 246} {"train_loss": -18.43318748474121, "global_step": 20448, "epoch": 246} {"train_loss": -18.79587173461914, "global_step": 20449, "epoch": 246} {"train_loss": -18.241525650024414, "global_step": 20450, "epoch": 246} {"train_loss": -18.661497116088867, "global_step": 20451, "epoch": 246} {"train_loss": -18.538360595703125, "global_step": 20452, "epoch": 246} {"train_loss": -18.610475540161133, "global_step": 20453, "epoch": 246} {"train_loss": -18.114938735961914, "global_step": 20454, "epoch": 246} {"train_loss": -18.518224716186523, "global_step": 20455, "epoch": 246} {"train_loss": -18.21184730529785, "global_step": 20456, "epoch": 246} {"train_loss": -18.149324417114258, "global_step": 20457, "epoch": 246} {"train_loss": -18.481924057006836, "global_step": 20458, "epoch": 246} {"train_loss": -18.231847763061523, "global_step": 20459, "epoch": 246} {"train_loss": -18.257444381713867, "global_step": 20460, "epoch": 246} {"train_loss": -18.329999923706055, "global_step": 20461, "epoch": 246} {"train_loss": -18.224685668945312, "global_step": 20462, "epoch": 246} {"train_loss": -18.209383010864258, "global_step": 20463, "epoch": 246} {"train_loss": -18.354215621948242, "global_step": 20464, "epoch": 246} {"train_loss": -18.13478660583496, "global_step": 20465, "epoch": 246} {"train_loss": -18.7081241607666, "global_step": 20466, "epoch": 246} {"train_loss": -18.45009422302246, "global_step": 20467, "epoch": 246} {"train_loss": -18.77399253845215, "global_step": 20468, "epoch": 246} {"train_loss": -18.489036560058594, "global_step": 20469, "epoch": 246} {"train_loss": -18.602008819580078, "global_step": 20470, "epoch": 246} {"train_loss": -18.504499435424805, "global_step": 20471, "epoch": 246} {"train_loss": -18.765897750854492, "global_step": 20472, "epoch": 246} {"train_loss": -18.497901916503906, "global_step": 20473, "epoch": 246} {"train_loss": -18.081693649291992, "global_step": 20474, "epoch": 246} {"train_loss": -18.525428771972656, "global_step": 20475, "epoch": 246} {"train_loss": -18.715139389038086, "global_step": 20476, "epoch": 246} {"train_loss": -18.203540802001953, "global_step": 20477, "epoch": 246} {"train_loss": -18.29645347595215, "global_step": 20478, "epoch": 246} {"train_loss": -18.31635093688965, "global_step": 20479, "epoch": 246} {"train_loss": -18.54121971130371, "global_step": 20480, "epoch": 246} {"train_loss": -18.345169067382812, "global_step": 20481, "epoch": 246} {"train_loss": -18.653928756713867, "global_step": 20482, "epoch": 246} {"train_loss": -18.564699172973633, "global_step": 20483, "epoch": 246} {"train_loss": -18.118635177612305, "global_step": 20484, "epoch": 246} {"train_loss": -18.242481231689453, "global_step": 20485, "epoch": 246} {"train_loss": -18.606733322143555, "global_step": 20486, "epoch": 246} {"train_loss": -18.434362411499023, "global_step": 20487, "epoch": 246} {"train_loss": -18.171415328979492, "global_step": 20488, "epoch": 246} {"train_loss": -18.208566665649414, "global_step": 20489, "epoch": 246} {"train_loss": -18.744552612304688, "global_step": 20490, "epoch": 246} {"train_loss": -18.660810470581055, "global_step": 20491, "epoch": 246} {"train_loss": -18.360828399658203, "global_step": 20492, "epoch": 246} {"train_loss": -18.240690231323242, "global_step": 20493, "epoch": 246} {"train_loss": -18.497005462646484, "global_step": 20494, "epoch": 246} {"train_loss": -18.489503860473633, "global_step": 20495, "epoch": 246} {"train_loss": -18.582326889038086, "global_step": 20496, "epoch": 246} {"train_loss": -18.405384063720703, "global_step": 20497, "epoch": 246} {"train_loss": -18.525156021118164, "global_step": 20498, "epoch": 246} {"train_loss": -18.36519432067871, "global_step": 20499, "epoch": 246} {"train_loss": -18.3705578999347, "global_step": 20500, "epoch": 246, "val_loss": 5948474.5} {"train_loss": -18.184146881103516, "global_step": 20501, "epoch": 247} {"train_loss": -18.6674861907959, "global_step": 20502, "epoch": 247} {"train_loss": -18.280160903930664, "global_step": 20503, "epoch": 247} {"train_loss": -18.489988327026367, "global_step": 20504, "epoch": 247} {"train_loss": -18.49916648864746, "global_step": 20505, "epoch": 247} {"train_loss": -18.2734432220459, "global_step": 20506, "epoch": 247} {"train_loss": -18.602994918823242, "global_step": 20507, "epoch": 247} {"train_loss": -18.247804641723633, "global_step": 20508, "epoch": 247} {"train_loss": -18.213571548461914, "global_step": 20509, "epoch": 247} {"train_loss": -18.43035888671875, "global_step": 20510, "epoch": 247} {"train_loss": -18.432437896728516, "global_step": 20511, "epoch": 247} {"train_loss": -18.57741355895996, "global_step": 20512, "epoch": 247} {"train_loss": -18.36800193786621, "global_step": 20513, "epoch": 247} {"train_loss": -18.280242919921875, "global_step": 20514, "epoch": 247} {"train_loss": -18.20918846130371, "global_step": 20515, "epoch": 247} {"train_loss": -18.400915145874023, "global_step": 20516, "epoch": 247} {"train_loss": -18.37588882446289, "global_step": 20517, "epoch": 247} {"train_loss": -18.125898361206055, "global_step": 20518, "epoch": 247} {"train_loss": -18.629465103149414, "global_step": 20519, "epoch": 247} {"train_loss": -18.34282684326172, "global_step": 20520, "epoch": 247} {"train_loss": -18.291934967041016, "global_step": 20521, "epoch": 247} {"train_loss": -18.31319236755371, "global_step": 20522, "epoch": 247} {"train_loss": -18.332229614257812, "global_step": 20523, "epoch": 247} {"train_loss": -18.382844924926758, "global_step": 20524, "epoch": 247} {"train_loss": -18.76930809020996, "global_step": 20525, "epoch": 247} {"train_loss": -18.273080825805664, "global_step": 20526, "epoch": 247} {"train_loss": -18.759763717651367, "global_step": 20527, "epoch": 247} {"train_loss": -18.718053817749023, "global_step": 20528, "epoch": 247} {"train_loss": -18.637495040893555, "global_step": 20529, "epoch": 247} {"train_loss": -18.036176681518555, "global_step": 20530, "epoch": 247} {"train_loss": -18.416675567626953, "global_step": 20531, "epoch": 247} {"train_loss": -18.49893569946289, "global_step": 20532, "epoch": 247} {"train_loss": -18.314558029174805, "global_step": 20533, "epoch": 247} {"train_loss": -18.658645629882812, "global_step": 20534, "epoch": 247} {"train_loss": -18.03952980041504, "global_step": 20535, "epoch": 247} {"train_loss": -18.190250396728516, "global_step": 20536, "epoch": 247} {"train_loss": -19.072153091430664, "global_step": 20537, "epoch": 247} {"train_loss": -18.250614166259766, "global_step": 20538, "epoch": 247} {"train_loss": -18.240970611572266, "global_step": 20539, "epoch": 247} {"train_loss": -18.64462661743164, "global_step": 20540, "epoch": 247} {"train_loss": -18.238706588745117, "global_step": 20541, "epoch": 247} {"train_loss": -18.167158126831055, "global_step": 20542, "epoch": 247} {"train_loss": -18.502721786499023, "global_step": 20543, "epoch": 247} {"train_loss": -18.60597038269043, "global_step": 20544, "epoch": 247} {"train_loss": -18.158998489379883, "global_step": 20545, "epoch": 247} {"train_loss": -18.93659782409668, "global_step": 20546, "epoch": 247} {"train_loss": -18.428415298461914, "global_step": 20547, "epoch": 247} {"train_loss": -18.23640251159668, "global_step": 20548, "epoch": 247} {"train_loss": -18.412328720092773, "global_step": 20549, "epoch": 247} {"train_loss": -18.54689598083496, "global_step": 20550, "epoch": 247} {"train_loss": -18.6287899017334, "global_step": 20551, "epoch": 247} {"train_loss": -18.31440544128418, "global_step": 20552, "epoch": 247} {"train_loss": -18.527013778686523, "global_step": 20553, "epoch": 247} {"train_loss": -18.54207992553711, "global_step": 20554, "epoch": 247} {"train_loss": -18.69197654724121, "global_step": 20555, "epoch": 247} {"train_loss": -18.669921875, "global_step": 20556, "epoch": 247} {"train_loss": -18.16930389404297, "global_step": 20557, "epoch": 247} {"train_loss": -18.345823287963867, "global_step": 20558, "epoch": 247} {"train_loss": -18.10158348083496, "global_step": 20559, "epoch": 247} {"train_loss": -18.345951080322266, "global_step": 20560, "epoch": 247} {"train_loss": -18.580663681030273, "global_step": 20561, "epoch": 247} {"train_loss": -18.61325454711914, "global_step": 20562, "epoch": 247} {"train_loss": -18.3658390045166, "global_step": 20563, "epoch": 247} {"train_loss": -18.337200164794922, "global_step": 20564, "epoch": 247} {"train_loss": -18.09546661376953, "global_step": 20565, "epoch": 247} {"train_loss": -18.584768295288086, "global_step": 20566, "epoch": 247} {"train_loss": -18.422931671142578, "global_step": 20567, "epoch": 247} {"train_loss": -18.346525192260742, "global_step": 20568, "epoch": 247} {"train_loss": -18.386066436767578, "global_step": 20569, "epoch": 247} {"train_loss": -18.508865356445312, "global_step": 20570, "epoch": 247} {"train_loss": -18.60297966003418, "global_step": 20571, "epoch": 247} {"train_loss": -18.264846801757812, "global_step": 20572, "epoch": 247} {"train_loss": -18.315753936767578, "global_step": 20573, "epoch": 247} {"train_loss": -18.163471221923828, "global_step": 20574, "epoch": 247} {"train_loss": -18.18018913269043, "global_step": 20575, "epoch": 247} {"train_loss": -18.607038497924805, "global_step": 20576, "epoch": 247} {"train_loss": -18.13924217224121, "global_step": 20577, "epoch": 247} {"train_loss": -18.655805587768555, "global_step": 20578, "epoch": 247} {"train_loss": -18.163692474365234, "global_step": 20579, "epoch": 247} {"train_loss": -18.673419952392578, "global_step": 20580, "epoch": 247} {"train_loss": -18.68147087097168, "global_step": 20581, "epoch": 247} {"train_loss": -18.149946212768555, "global_step": 20582, "epoch": 247} {"train_loss": -18.407088521015215, "global_step": 20583, "epoch": 247, "val_loss": 5842892.0} {"train_loss": -18.35614013671875, "global_step": 20584, "epoch": 248} {"train_loss": -17.82066535949707, "global_step": 20585, "epoch": 248} {"train_loss": -18.478147506713867, "global_step": 20586, "epoch": 248} {"train_loss": -18.34381103515625, "global_step": 20587, "epoch": 248} {"train_loss": -18.407804489135742, "global_step": 20588, "epoch": 248} {"train_loss": -18.52471351623535, "global_step": 20589, "epoch": 248} {"train_loss": -18.434114456176758, "global_step": 20590, "epoch": 248} {"train_loss": -17.878158569335938, "global_step": 20591, "epoch": 248} {"train_loss": -18.3197078704834, "global_step": 20592, "epoch": 248} {"train_loss": -18.299367904663086, "global_step": 20593, "epoch": 248} {"train_loss": -18.241979598999023, "global_step": 20594, "epoch": 248} {"train_loss": -18.426836013793945, "global_step": 20595, "epoch": 248} {"train_loss": -18.68718147277832, "global_step": 20596, "epoch": 248} {"train_loss": -18.40261459350586, "global_step": 20597, "epoch": 248} {"train_loss": -18.134992599487305, "global_step": 20598, "epoch": 248} {"train_loss": -18.47719383239746, "global_step": 20599, "epoch": 248} {"train_loss": -18.506305694580078, "global_step": 20600, "epoch": 248} {"train_loss": -18.31900978088379, "global_step": 20601, "epoch": 248} {"train_loss": -18.23804473876953, "global_step": 20602, "epoch": 248} {"train_loss": -18.662450790405273, "global_step": 20603, "epoch": 248} {"train_loss": -18.487401962280273, "global_step": 20604, "epoch": 248} {"train_loss": -18.301786422729492, "global_step": 20605, "epoch": 248} {"train_loss": -18.56393814086914, "global_step": 20606, "epoch": 248} {"train_loss": -17.901840209960938, "global_step": 20607, "epoch": 248} {"train_loss": -18.199548721313477, "global_step": 20608, "epoch": 248} {"train_loss": -18.671491622924805, "global_step": 20609, "epoch": 248} {"train_loss": -18.299230575561523, "global_step": 20610, "epoch": 248} {"train_loss": -18.280935287475586, "global_step": 20611, "epoch": 248} {"train_loss": -18.236326217651367, "global_step": 20612, "epoch": 248} {"train_loss": -18.406753540039062, "global_step": 20613, "epoch": 248} {"train_loss": -18.570804595947266, "global_step": 20614, "epoch": 248} {"train_loss": -18.560302734375, "global_step": 20615, "epoch": 248} {"train_loss": -18.141141891479492, "global_step": 20616, "epoch": 248} {"train_loss": -18.29327392578125, "global_step": 20617, "epoch": 248} {"train_loss": -18.27088737487793, "global_step": 20618, "epoch": 248} {"train_loss": -18.261253356933594, "global_step": 20619, "epoch": 248} {"train_loss": -18.333023071289062, "global_step": 20620, "epoch": 248} {"train_loss": -18.485210418701172, "global_step": 20621, "epoch": 248} {"train_loss": -18.66328239440918, "global_step": 20622, "epoch": 248} {"train_loss": -18.388864517211914, "global_step": 20623, "epoch": 248} {"train_loss": -18.457256317138672, "global_step": 20624, "epoch": 248} {"train_loss": -18.418729782104492, "global_step": 20625, "epoch": 248} {"train_loss": -18.516620635986328, "global_step": 20626, "epoch": 248} {"train_loss": -18.355031967163086, "global_step": 20627, "epoch": 248} {"train_loss": -18.75997543334961, "global_step": 20628, "epoch": 248} {"train_loss": -18.32662010192871, "global_step": 20629, "epoch": 248} {"train_loss": -18.268701553344727, "global_step": 20630, "epoch": 248} {"train_loss": -18.490896224975586, "global_step": 20631, "epoch": 248} {"train_loss": -18.537967681884766, "global_step": 20632, "epoch": 248} {"train_loss": -18.616926193237305, "global_step": 20633, "epoch": 248} {"train_loss": -18.75196647644043, "global_step": 20634, "epoch": 248} {"train_loss": -18.438894271850586, "global_step": 20635, "epoch": 248} {"train_loss": -18.579166412353516, "global_step": 20636, "epoch": 248} {"train_loss": -18.825777053833008, "global_step": 20637, "epoch": 248} {"train_loss": -18.610107421875, "global_step": 20638, "epoch": 248} {"train_loss": -18.524322509765625, "global_step": 20639, "epoch": 248} {"train_loss": -18.41678237915039, "global_step": 20640, "epoch": 248} {"train_loss": -18.338571548461914, "global_step": 20641, "epoch": 248} {"train_loss": -18.823822021484375, "global_step": 20642, "epoch": 248} {"train_loss": -18.46299171447754, "global_step": 20643, "epoch": 248} {"train_loss": -18.27459716796875, "global_step": 20644, "epoch": 248} {"train_loss": -18.469091415405273, "global_step": 20645, "epoch": 248} {"train_loss": -18.287616729736328, "global_step": 20646, "epoch": 248} {"train_loss": -18.13856315612793, "global_step": 20647, "epoch": 248} {"train_loss": -18.164478302001953, "global_step": 20648, "epoch": 248} {"train_loss": -18.863327026367188, "global_step": 20649, "epoch": 248} {"train_loss": -18.03105926513672, "global_step": 20650, "epoch": 248} {"train_loss": -18.453508377075195, "global_step": 20651, "epoch": 248} {"train_loss": -18.507490158081055, "global_step": 20652, "epoch": 248} {"train_loss": -18.349843978881836, "global_step": 20653, "epoch": 248} {"train_loss": -18.57758903503418, "global_step": 20654, "epoch": 248} {"train_loss": -18.091140747070312, "global_step": 20655, "epoch": 248} {"train_loss": -18.546316146850586, "global_step": 20656, "epoch": 248} {"train_loss": -18.684083938598633, "global_step": 20657, "epoch": 248} {"train_loss": -18.117341995239258, "global_step": 20658, "epoch": 248} {"train_loss": -18.30768585205078, "global_step": 20659, "epoch": 248} {"train_loss": -18.80191993713379, "global_step": 20660, "epoch": 248} {"train_loss": -18.40297508239746, "global_step": 20661, "epoch": 248} {"train_loss": -18.278852462768555, "global_step": 20662, "epoch": 248} {"train_loss": -18.25467872619629, "global_step": 20663, "epoch": 248} {"train_loss": -18.42108917236328, "global_step": 20664, "epoch": 248} {"train_loss": -18.33905601501465, "global_step": 20665, "epoch": 248} {"train_loss": -18.402248244687737, "global_step": 20666, "epoch": 248, "val_loss": 5833144.0} {"train_loss": -18.151350021362305, "global_step": 20667, "epoch": 249} {"train_loss": -18.122577667236328, "global_step": 20668, "epoch": 249} {"train_loss": -18.333417892456055, "global_step": 20669, "epoch": 249} {"train_loss": -18.14432144165039, "global_step": 20670, "epoch": 249} {"train_loss": -18.25494956970215, "global_step": 20671, "epoch": 249} {"train_loss": -18.410703659057617, "global_step": 20672, "epoch": 249} {"train_loss": -18.571828842163086, "global_step": 20673, "epoch": 249} {"train_loss": -18.5165958404541, "global_step": 20674, "epoch": 249} {"train_loss": -18.28216552734375, "global_step": 20675, "epoch": 249} {"train_loss": -18.423757553100586, "global_step": 20676, "epoch": 249} {"train_loss": -18.368274688720703, "global_step": 20677, "epoch": 249} {"train_loss": -17.954519271850586, "global_step": 20678, "epoch": 249} {"train_loss": -18.31899070739746, "global_step": 20679, "epoch": 249} {"train_loss": -18.235822677612305, "global_step": 20680, "epoch": 249} {"train_loss": -18.30381202697754, "global_step": 20681, "epoch": 249} {"train_loss": -18.378564834594727, "global_step": 20682, "epoch": 249} {"train_loss": -18.415395736694336, "global_step": 20683, "epoch": 249} {"train_loss": -18.108552932739258, "global_step": 20684, "epoch": 249} {"train_loss": -18.571149826049805, "global_step": 20685, "epoch": 249} {"train_loss": -18.27564811706543, "global_step": 20686, "epoch": 249} {"train_loss": -18.76251220703125, "global_step": 20687, "epoch": 249} {"train_loss": -18.358007431030273, "global_step": 20688, "epoch": 249} {"train_loss": -18.273649215698242, "global_step": 20689, "epoch": 249} {"train_loss": -18.799285888671875, "global_step": 20690, "epoch": 249} {"train_loss": -18.446500778198242, "global_step": 20691, "epoch": 249} {"train_loss": -18.31110191345215, "global_step": 20692, "epoch": 249} {"train_loss": -18.20949363708496, "global_step": 20693, "epoch": 249} {"train_loss": -17.8360538482666, "global_step": 20694, "epoch": 249} {"train_loss": -18.383031845092773, "global_step": 20695, "epoch": 249} {"train_loss": -18.107391357421875, "global_step": 20696, "epoch": 249} {"train_loss": -18.847963333129883, "global_step": 20697, "epoch": 249} {"train_loss": -18.069778442382812, "global_step": 20698, "epoch": 249} {"train_loss": -18.682153701782227, "global_step": 20699, "epoch": 249} {"train_loss": -18.69475746154785, "global_step": 20700, "epoch": 249} {"train_loss": -18.383991241455078, "global_step": 20701, "epoch": 249} {"train_loss": -18.767963409423828, "global_step": 20702, "epoch": 249} {"train_loss": -18.21565055847168, "global_step": 20703, "epoch": 249} {"train_loss": -18.567289352416992, "global_step": 20704, "epoch": 249} {"train_loss": -18.510601043701172, "global_step": 20705, "epoch": 249} {"train_loss": -18.289499282836914, "global_step": 20706, "epoch": 249} {"train_loss": -18.449132919311523, "global_step": 20707, "epoch": 249} {"train_loss": -18.602890014648438, "global_step": 20708, "epoch": 249} {"train_loss": -18.33540916442871, "global_step": 20709, "epoch": 249} {"train_loss": -18.270566940307617, "global_step": 20710, "epoch": 249} {"train_loss": -18.459381103515625, "global_step": 20711, "epoch": 249} {"train_loss": -18.26622772216797, "global_step": 20712, "epoch": 249} {"train_loss": -18.352401733398438, "global_step": 20713, "epoch": 249} {"train_loss": -18.04273223876953, "global_step": 20714, "epoch": 249} {"train_loss": -18.13665199279785, "global_step": 20715, "epoch": 249} {"train_loss": -18.538732528686523, "global_step": 20716, "epoch": 249} {"train_loss": -18.1850528717041, "global_step": 20717, "epoch": 249} {"train_loss": -18.026784896850586, "global_step": 20718, "epoch": 249} {"train_loss": -18.629173278808594, "global_step": 20719, "epoch": 249} {"train_loss": -18.64815902709961, "global_step": 20720, "epoch": 249} {"train_loss": -18.630186080932617, "global_step": 20721, "epoch": 249} {"train_loss": -18.17268180847168, "global_step": 20722, "epoch": 249} {"train_loss": -18.376224517822266, "global_step": 20723, "epoch": 249} {"train_loss": -18.69058609008789, "global_step": 20724, "epoch": 249} {"train_loss": -18.178190231323242, "global_step": 20725, "epoch": 249} {"train_loss": -18.248397827148438, "global_step": 20726, "epoch": 249} {"train_loss": -18.434816360473633, "global_step": 20727, "epoch": 249} {"train_loss": -18.67573356628418, "global_step": 20728, "epoch": 249} {"train_loss": -18.48664093017578, "global_step": 20729, "epoch": 249} {"train_loss": -18.689172744750977, "global_step": 20730, "epoch": 249} {"train_loss": -18.5212345123291, "global_step": 20731, "epoch": 249} {"train_loss": -18.6151123046875, "global_step": 20732, "epoch": 249} {"train_loss": -18.633453369140625, "global_step": 20733, "epoch": 249} {"train_loss": -18.880788803100586, "global_step": 20734, "epoch": 249} {"train_loss": -18.173254013061523, "global_step": 20735, "epoch": 249} {"train_loss": -18.665481567382812, "global_step": 20736, "epoch": 249} {"train_loss": -18.38030433654785, "global_step": 20737, "epoch": 249} {"train_loss": -18.494911193847656, "global_step": 20738, "epoch": 249} {"train_loss": -18.724782943725586, "global_step": 20739, "epoch": 249} {"train_loss": -18.710718154907227, "global_step": 20740, "epoch": 249} {"train_loss": -18.4146728515625, "global_step": 20741, "epoch": 249} {"train_loss": -18.334487915039062, "global_step": 20742, "epoch": 249} {"train_loss": -18.397014617919922, "global_step": 20743, "epoch": 249} {"train_loss": -18.531946182250977, "global_step": 20744, "epoch": 249} {"train_loss": -18.16751480102539, "global_step": 20745, "epoch": 249} {"train_loss": -18.379474639892578, "global_step": 20746, "epoch": 249} {"train_loss": -18.134057998657227, "global_step": 20747, "epoch": 249} {"train_loss": -18.227548599243164, "global_step": 20748, "epoch": 249} {"train_loss": -18.369433207684253, "global_step": 20749, "epoch": 249, "val_loss": 5949394.0} {"train_loss": -18.02915382385254, "global_step": 20750, "epoch": 250} {"train_loss": -18.15389060974121, "global_step": 20751, "epoch": 250} {"train_loss": -18.075986862182617, "global_step": 20752, "epoch": 250} {"train_loss": -18.601806640625, "global_step": 20753, "epoch": 250} {"train_loss": -18.413436889648438, "global_step": 20754, "epoch": 250} {"train_loss": -18.459640502929688, "global_step": 20755, "epoch": 250} {"train_loss": -18.42820167541504, "global_step": 20756, "epoch": 250} {"train_loss": -18.222593307495117, "global_step": 20757, "epoch": 250} {"train_loss": -18.460052490234375, "global_step": 20758, "epoch": 250} {"train_loss": -18.046825408935547, "global_step": 20759, "epoch": 250} {"train_loss": -18.372045516967773, "global_step": 20760, "epoch": 250} {"train_loss": -17.70903968811035, "global_step": 20761, "epoch": 250} {"train_loss": -18.412822723388672, "global_step": 20762, "epoch": 250} {"train_loss": -18.87653923034668, "global_step": 20763, "epoch": 250} {"train_loss": -18.569538116455078, "global_step": 20764, "epoch": 250} {"train_loss": -18.576719284057617, "global_step": 20765, "epoch": 250} {"train_loss": -18.276582717895508, "global_step": 20766, "epoch": 250} {"train_loss": -18.235429763793945, "global_step": 20767, "epoch": 250} {"train_loss": -18.219383239746094, "global_step": 20768, "epoch": 250} {"train_loss": -18.15606117248535, "global_step": 20769, "epoch": 250} {"train_loss": -18.23885726928711, "global_step": 20770, "epoch": 250} {"train_loss": -18.39188003540039, "global_step": 20771, "epoch": 250} {"train_loss": -18.377887725830078, "global_step": 20772, "epoch": 250} {"train_loss": -18.640409469604492, "global_step": 20773, "epoch": 250} {"train_loss": -18.42763328552246, "global_step": 20774, "epoch": 250} {"train_loss": -18.40692138671875, "global_step": 20775, "epoch": 250} {"train_loss": -18.102264404296875, "global_step": 20776, "epoch": 250} {"train_loss": -18.395273208618164, "global_step": 20777, "epoch": 250} {"train_loss": -18.672348022460938, "global_step": 20778, "epoch": 250} {"train_loss": -18.351232528686523, "global_step": 20779, "epoch": 250} {"train_loss": -18.406757354736328, "global_step": 20780, "epoch": 250} {"train_loss": -18.412702560424805, "global_step": 20781, "epoch": 250} {"train_loss": -18.404733657836914, "global_step": 20782, "epoch": 250} {"train_loss": -18.166364669799805, "global_step": 20783, "epoch": 250} {"train_loss": -18.735082626342773, "global_step": 20784, "epoch": 250} {"train_loss": -18.569456100463867, "global_step": 20785, "epoch": 250} {"train_loss": -18.296232223510742, "global_step": 20786, "epoch": 250} {"train_loss": -18.59598159790039, "global_step": 20787, "epoch": 250} {"train_loss": -18.32219696044922, "global_step": 20788, "epoch": 250} {"train_loss": -18.719831466674805, "global_step": 20789, "epoch": 250} {"train_loss": -18.144712448120117, "global_step": 20790, "epoch": 250} {"train_loss": -18.373279571533203, "global_step": 20791, "epoch": 250} {"train_loss": -18.391836166381836, "global_step": 20792, "epoch": 250} {"train_loss": -18.321962356567383, "global_step": 20793, "epoch": 250} {"train_loss": -18.596385955810547, "global_step": 20794, "epoch": 250} {"train_loss": -18.283836364746094, "global_step": 20795, "epoch": 250} {"train_loss": -18.17359733581543, "global_step": 20796, "epoch": 250} {"train_loss": -18.50734519958496, "global_step": 20797, "epoch": 250} {"train_loss": -18.432653427124023, "global_step": 20798, "epoch": 250} {"train_loss": -18.63996696472168, "global_step": 20799, "epoch": 250} {"train_loss": -17.947895050048828, "global_step": 20800, "epoch": 250} {"train_loss": -18.505855560302734, "global_step": 20801, "epoch": 250} {"train_loss": -18.356555938720703, "global_step": 20802, "epoch": 250} {"train_loss": -18.57784652709961, "global_step": 20803, "epoch": 250} {"train_loss": -18.178781509399414, "global_step": 20804, "epoch": 250} {"train_loss": -18.70073890686035, "global_step": 20805, "epoch": 250} {"train_loss": -18.15389633178711, "global_step": 20806, "epoch": 250} {"train_loss": -18.56785011291504, "global_step": 20807, "epoch": 250} {"train_loss": -17.97891616821289, "global_step": 20808, "epoch": 250} {"train_loss": -18.496658325195312, "global_step": 20809, "epoch": 250} {"train_loss": -18.759241104125977, "global_step": 20810, "epoch": 250} {"train_loss": -18.5062198638916, "global_step": 20811, "epoch": 250} {"train_loss": -18.553802490234375, "global_step": 20812, "epoch": 250} {"train_loss": -18.2943058013916, "global_step": 20813, "epoch": 250} {"train_loss": -18.436721801757812, "global_step": 20814, "epoch": 250} {"train_loss": -18.33982276916504, "global_step": 20815, "epoch": 250} {"train_loss": -18.389890670776367, "global_step": 20816, "epoch": 250} {"train_loss": -18.55597496032715, "global_step": 20817, "epoch": 250} {"train_loss": -18.31661033630371, "global_step": 20818, "epoch": 250} {"train_loss": -18.32960319519043, "global_step": 20819, "epoch": 250} {"train_loss": -18.148775100708008, "global_step": 20820, "epoch": 250} {"train_loss": -18.555631637573242, "global_step": 20821, "epoch": 250} {"train_loss": -18.430591583251953, "global_step": 20822, "epoch": 250} {"train_loss": -18.796640396118164, "global_step": 20823, "epoch": 250} {"train_loss": -18.208356857299805, "global_step": 20824, "epoch": 250} {"train_loss": -18.546823501586914, "global_step": 20825, "epoch": 250} {"train_loss": -18.555707931518555, "global_step": 20826, "epoch": 250} {"train_loss": -18.3732852935791, "global_step": 20827, "epoch": 250} {"train_loss": -18.021848678588867, "global_step": 20828, "epoch": 250} {"train_loss": -18.639089584350586, "global_step": 20829, "epoch": 250} {"train_loss": -18.433162689208984, "global_step": 20830, "epoch": 250} {"train_loss": -18.486608505249023, "global_step": 20831, "epoch": 250} {"train_loss": -18.405098421027862, "global_step": 20832, "epoch": 250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 0.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.7272727272727273, "val_loss": 5993427.0} {"train_loss": -18.351613998413086, "global_step": 20833, "epoch": 251} {"train_loss": -18.129812240600586, "global_step": 20834, "epoch": 251} {"train_loss": -18.19663429260254, "global_step": 20835, "epoch": 251} {"train_loss": -18.148767471313477, "global_step": 20836, "epoch": 251} {"train_loss": -18.767616271972656, "global_step": 20837, "epoch": 251} {"train_loss": -18.419687271118164, "global_step": 20838, "epoch": 251} {"train_loss": -17.989694595336914, "global_step": 20839, "epoch": 251} {"train_loss": -18.364105224609375, "global_step": 20840, "epoch": 251} {"train_loss": -18.03687858581543, "global_step": 20841, "epoch": 251} {"train_loss": -18.670398712158203, "global_step": 20842, "epoch": 251} {"train_loss": -18.027774810791016, "global_step": 20843, "epoch": 251} {"train_loss": -18.440793991088867, "global_step": 20844, "epoch": 251} {"train_loss": -18.20755386352539, "global_step": 20845, "epoch": 251} {"train_loss": -18.81308937072754, "global_step": 20846, "epoch": 251} {"train_loss": -18.135515213012695, "global_step": 20847, "epoch": 251} {"train_loss": -18.05904197692871, "global_step": 20848, "epoch": 251} {"train_loss": -18.3680477142334, "global_step": 20849, "epoch": 251} {"train_loss": -18.35188865661621, "global_step": 20850, "epoch": 251} {"train_loss": -18.34604835510254, "global_step": 20851, "epoch": 251} {"train_loss": -18.501667022705078, "global_step": 20852, "epoch": 251} {"train_loss": -18.51422119140625, "global_step": 20853, "epoch": 251} {"train_loss": -17.859851837158203, "global_step": 20854, "epoch": 251} {"train_loss": -18.707778930664062, "global_step": 20855, "epoch": 251} {"train_loss": -18.16598129272461, "global_step": 20856, "epoch": 251} {"train_loss": -18.2095947265625, "global_step": 20857, "epoch": 251} {"train_loss": -18.033832550048828, "global_step": 20858, "epoch": 251} {"train_loss": -18.27955436706543, "global_step": 20859, "epoch": 251} {"train_loss": -18.246816635131836, "global_step": 20860, "epoch": 251} {"train_loss": -18.656719207763672, "global_step": 20861, "epoch": 251} {"train_loss": -18.042654037475586, "global_step": 20862, "epoch": 251} {"train_loss": -18.365739822387695, "global_step": 20863, "epoch": 251} {"train_loss": -18.225317001342773, "global_step": 20864, "epoch": 251} {"train_loss": -18.494985580444336, "global_step": 20865, "epoch": 251} {"train_loss": -18.30033302307129, "global_step": 20866, "epoch": 251} {"train_loss": -18.623340606689453, "global_step": 20867, "epoch": 251} {"train_loss": -18.017974853515625, "global_step": 20868, "epoch": 251} {"train_loss": -18.315473556518555, "global_step": 20869, "epoch": 251} {"train_loss": -18.044599533081055, "global_step": 20870, "epoch": 251} {"train_loss": -18.858549118041992, "global_step": 20871, "epoch": 251} {"train_loss": -17.92378807067871, "global_step": 20872, "epoch": 251} {"train_loss": -18.754837036132812, "global_step": 20873, "epoch": 251} {"train_loss": -18.317216873168945, "global_step": 20874, "epoch": 251} {"train_loss": -18.548044204711914, "global_step": 20875, "epoch": 251} {"train_loss": -18.466466903686523, "global_step": 20876, "epoch": 251} {"train_loss": -18.525850296020508, "global_step": 20877, "epoch": 251} {"train_loss": -18.37424659729004, "global_step": 20878, "epoch": 251} {"train_loss": -18.456392288208008, "global_step": 20879, "epoch": 251} {"train_loss": -18.287004470825195, "global_step": 20880, "epoch": 251} {"train_loss": -18.278858184814453, "global_step": 20881, "epoch": 251} {"train_loss": -17.98587417602539, "global_step": 20882, "epoch": 251} {"train_loss": -18.41697883605957, "global_step": 20883, "epoch": 251} {"train_loss": -18.759130477905273, "global_step": 20884, "epoch": 251} {"train_loss": -18.609291076660156, "global_step": 20885, "epoch": 251} {"train_loss": -18.57465934753418, "global_step": 20886, "epoch": 251} {"train_loss": -18.679763793945312, "global_step": 20887, "epoch": 251} {"train_loss": -18.735294342041016, "global_step": 20888, "epoch": 251} {"train_loss": -18.418668746948242, "global_step": 20889, "epoch": 251} {"train_loss": -18.792551040649414, "global_step": 20890, "epoch": 251} {"train_loss": -18.139617919921875, "global_step": 20891, "epoch": 251} {"train_loss": -18.48240089416504, "global_step": 20892, "epoch": 251} {"train_loss": -18.19554328918457, "global_step": 20893, "epoch": 251} {"train_loss": -18.39005470275879, "global_step": 20894, "epoch": 251} {"train_loss": -18.6663818359375, "global_step": 20895, "epoch": 251} {"train_loss": -18.710172653198242, "global_step": 20896, "epoch": 251} {"train_loss": -18.454330444335938, "global_step": 20897, "epoch": 251} {"train_loss": -18.4686336517334, "global_step": 20898, "epoch": 251} {"train_loss": -18.19710922241211, "global_step": 20899, "epoch": 251} {"train_loss": -18.700645446777344, "global_step": 20900, "epoch": 251} {"train_loss": -18.46350860595703, "global_step": 20901, "epoch": 251} {"train_loss": -18.582801818847656, "global_step": 20902, "epoch": 251} {"train_loss": -18.288509368896484, "global_step": 20903, "epoch": 251} {"train_loss": -18.444618225097656, "global_step": 20904, "epoch": 251} {"train_loss": -18.530630111694336, "global_step": 20905, "epoch": 251} {"train_loss": -18.551868438720703, "global_step": 20906, "epoch": 251} {"train_loss": -18.366079330444336, "global_step": 20907, "epoch": 251} {"train_loss": -18.626209259033203, "global_step": 20908, "epoch": 251} {"train_loss": -18.34274673461914, "global_step": 20909, "epoch": 251} {"train_loss": -18.46786880493164, "global_step": 20910, "epoch": 251} {"train_loss": -18.90032958984375, "global_step": 20911, "epoch": 251} {"train_loss": -18.296775817871094, "global_step": 20912, "epoch": 251} {"train_loss": -18.933164596557617, "global_step": 20913, "epoch": 251} {"train_loss": -18.35707664489746, "global_step": 20914, "epoch": 251} {"train_loss": -18.37605244280344, "global_step": 20915, "epoch": 251, "val_loss": 5943252.0} {"train_loss": -18.422775268554688, "global_step": 20916, "epoch": 252} {"train_loss": -18.16058349609375, "global_step": 20917, "epoch": 252} {"train_loss": -18.328744888305664, "global_step": 20918, "epoch": 252} {"train_loss": -18.314062118530273, "global_step": 20919, "epoch": 252} {"train_loss": -18.29780387878418, "global_step": 20920, "epoch": 252} {"train_loss": -18.27663230895996, "global_step": 20921, "epoch": 252} {"train_loss": -18.27425193786621, "global_step": 20922, "epoch": 252} {"train_loss": -18.10811424255371, "global_step": 20923, "epoch": 252} {"train_loss": -18.08938217163086, "global_step": 20924, "epoch": 252} {"train_loss": -18.290069580078125, "global_step": 20925, "epoch": 252} {"train_loss": -18.359914779663086, "global_step": 20926, "epoch": 252} {"train_loss": -18.319931030273438, "global_step": 20927, "epoch": 252} {"train_loss": -18.450166702270508, "global_step": 20928, "epoch": 252} {"train_loss": -18.347591400146484, "global_step": 20929, "epoch": 252} {"train_loss": -18.803136825561523, "global_step": 20930, "epoch": 252} {"train_loss": -18.712915420532227, "global_step": 20931, "epoch": 252} {"train_loss": -18.17693328857422, "global_step": 20932, "epoch": 252} {"train_loss": -18.48271369934082, "global_step": 20933, "epoch": 252} {"train_loss": -18.405488967895508, "global_step": 20934, "epoch": 252} {"train_loss": -18.66037940979004, "global_step": 20935, "epoch": 252} {"train_loss": -18.66697120666504, "global_step": 20936, "epoch": 252} {"train_loss": -18.39179801940918, "global_step": 20937, "epoch": 252} {"train_loss": -18.495038986206055, "global_step": 20938, "epoch": 252} {"train_loss": -18.146793365478516, "global_step": 20939, "epoch": 252} {"train_loss": -18.601177215576172, "global_step": 20940, "epoch": 252} {"train_loss": -18.344465255737305, "global_step": 20941, "epoch": 252} {"train_loss": -18.248563766479492, "global_step": 20942, "epoch": 252} {"train_loss": -18.170042037963867, "global_step": 20943, "epoch": 252} {"train_loss": -18.724315643310547, "global_step": 20944, "epoch": 252} {"train_loss": -18.328229904174805, "global_step": 20945, "epoch": 252} {"train_loss": -18.56184196472168, "global_step": 20946, "epoch": 252} {"train_loss": -18.488300323486328, "global_step": 20947, "epoch": 252} {"train_loss": -18.16851806640625, "global_step": 20948, "epoch": 252} {"train_loss": -18.042993545532227, "global_step": 20949, "epoch": 252} {"train_loss": -18.542369842529297, "global_step": 20950, "epoch": 252} {"train_loss": -18.771163940429688, "global_step": 20951, "epoch": 252} {"train_loss": -18.530271530151367, "global_step": 20952, "epoch": 252} {"train_loss": -18.327884674072266, "global_step": 20953, "epoch": 252} {"train_loss": -18.561315536499023, "global_step": 20954, "epoch": 252} {"train_loss": -19.077817916870117, "global_step": 20955, "epoch": 252} {"train_loss": -18.294309616088867, "global_step": 20956, "epoch": 252} {"train_loss": -18.262388229370117, "global_step": 20957, "epoch": 252} {"train_loss": -18.35573387145996, "global_step": 20958, "epoch": 252} {"train_loss": -17.97077178955078, "global_step": 20959, "epoch": 252} {"train_loss": -18.206674575805664, "global_step": 20960, "epoch": 252} {"train_loss": -18.345808029174805, "global_step": 20961, "epoch": 252} {"train_loss": -18.329971313476562, "global_step": 20962, "epoch": 252} {"train_loss": -18.571256637573242, "global_step": 20963, "epoch": 252} {"train_loss": -18.644847869873047, "global_step": 20964, "epoch": 252} {"train_loss": -18.129886627197266, "global_step": 20965, "epoch": 252} {"train_loss": -18.276391983032227, "global_step": 20966, "epoch": 252} {"train_loss": -18.812049865722656, "global_step": 20967, "epoch": 252} {"train_loss": -18.693349838256836, "global_step": 20968, "epoch": 252} {"train_loss": -18.567920684814453, "global_step": 20969, "epoch": 252} {"train_loss": -18.820465087890625, "global_step": 20970, "epoch": 252} {"train_loss": -18.64627456665039, "global_step": 20971, "epoch": 252} {"train_loss": -18.600936889648438, "global_step": 20972, "epoch": 252} {"train_loss": -18.518884658813477, "global_step": 20973, "epoch": 252} {"train_loss": -18.43889045715332, "global_step": 20974, "epoch": 252} {"train_loss": -18.59223747253418, "global_step": 20975, "epoch": 252} {"train_loss": -18.44057273864746, "global_step": 20976, "epoch": 252} {"train_loss": -18.77044105529785, "global_step": 20977, "epoch": 252} {"train_loss": -18.83966636657715, "global_step": 20978, "epoch": 252} {"train_loss": -18.529048919677734, "global_step": 20979, "epoch": 252} {"train_loss": -18.37006187438965, "global_step": 20980, "epoch": 252} {"train_loss": -18.498315811157227, "global_step": 20981, "epoch": 252} {"train_loss": -18.299680709838867, "global_step": 20982, "epoch": 252} {"train_loss": -18.481353759765625, "global_step": 20983, "epoch": 252} {"train_loss": -18.508695602416992, "global_step": 20984, "epoch": 252} {"train_loss": -18.407032012939453, "global_step": 20985, "epoch": 252} {"train_loss": -18.556344985961914, "global_step": 20986, "epoch": 252} {"train_loss": -18.272390365600586, "global_step": 20987, "epoch": 252} {"train_loss": -18.292821884155273, "global_step": 20988, "epoch": 252} {"train_loss": -18.49464988708496, "global_step": 20989, "epoch": 252} {"train_loss": -18.67872428894043, "global_step": 20990, "epoch": 252} {"train_loss": -18.556289672851562, "global_step": 20991, "epoch": 252} {"train_loss": -18.4588623046875, "global_step": 20992, "epoch": 252} {"train_loss": -18.867918014526367, "global_step": 20993, "epoch": 252} {"train_loss": -18.19936752319336, "global_step": 20994, "epoch": 252} {"train_loss": -18.567153930664062, "global_step": 20995, "epoch": 252} {"train_loss": -18.567428588867188, "global_step": 20996, "epoch": 252} {"train_loss": -18.332529067993164, "global_step": 20997, "epoch": 252} {"train_loss": -18.428282795182195, "global_step": 20998, "epoch": 252, "val_loss": 5899997.0} {"train_loss": -17.985458374023438, "global_step": 20999, "epoch": 253} {"train_loss": -18.368606567382812, "global_step": 21000, "epoch": 253} {"train_loss": -17.982624053955078, "global_step": 21001, "epoch": 253} {"train_loss": -18.315536499023438, "global_step": 21002, "epoch": 253} {"train_loss": -18.161048889160156, "global_step": 21003, "epoch": 253} {"train_loss": -18.367826461791992, "global_step": 21004, "epoch": 253} {"train_loss": -18.228525161743164, "global_step": 21005, "epoch": 253} {"train_loss": -18.172752380371094, "global_step": 21006, "epoch": 253} {"train_loss": -18.45309829711914, "global_step": 21007, "epoch": 253} {"train_loss": -18.750619888305664, "global_step": 21008, "epoch": 253} {"train_loss": -18.128751754760742, "global_step": 21009, "epoch": 253} {"train_loss": -18.976715087890625, "global_step": 21010, "epoch": 253} {"train_loss": -17.989059448242188, "global_step": 21011, "epoch": 253} {"train_loss": -18.376705169677734, "global_step": 21012, "epoch": 253} {"train_loss": -18.172468185424805, "global_step": 21013, "epoch": 253} {"train_loss": -18.847455978393555, "global_step": 21014, "epoch": 253} {"train_loss": -18.175100326538086, "global_step": 21015, "epoch": 253} {"train_loss": -18.42806053161621, "global_step": 21016, "epoch": 253} {"train_loss": -18.441797256469727, "global_step": 21017, "epoch": 253} {"train_loss": -18.4102840423584, "global_step": 21018, "epoch": 253} {"train_loss": -18.204492568969727, "global_step": 21019, "epoch": 253} {"train_loss": -18.439306259155273, "global_step": 21020, "epoch": 253} {"train_loss": -18.525924682617188, "global_step": 21021, "epoch": 253} {"train_loss": -18.45159339904785, "global_step": 21022, "epoch": 253} {"train_loss": -18.598194122314453, "global_step": 21023, "epoch": 253} {"train_loss": -18.217151641845703, "global_step": 21024, "epoch": 253} {"train_loss": -18.039642333984375, "global_step": 21025, "epoch": 253} {"train_loss": -18.56130027770996, "global_step": 21026, "epoch": 253} {"train_loss": -18.35041618347168, "global_step": 21027, "epoch": 253} {"train_loss": -18.336889266967773, "global_step": 21028, "epoch": 253} {"train_loss": -18.590560913085938, "global_step": 21029, "epoch": 253} {"train_loss": -18.359819412231445, "global_step": 21030, "epoch": 253} {"train_loss": -18.636144638061523, "global_step": 21031, "epoch": 253} {"train_loss": -17.94917106628418, "global_step": 21032, "epoch": 253} {"train_loss": -18.244497299194336, "global_step": 21033, "epoch": 253} {"train_loss": -18.59783363342285, "global_step": 21034, "epoch": 253} {"train_loss": -18.54509162902832, "global_step": 21035, "epoch": 253} {"train_loss": -17.870670318603516, "global_step": 21036, "epoch": 253} {"train_loss": -18.57108497619629, "global_step": 21037, "epoch": 253} {"train_loss": -18.374542236328125, "global_step": 21038, "epoch": 253} {"train_loss": -18.38326072692871, "global_step": 21039, "epoch": 253} {"train_loss": -18.445825576782227, "global_step": 21040, "epoch": 253} {"train_loss": -18.35653305053711, "global_step": 21041, "epoch": 253} {"train_loss": -18.354848861694336, "global_step": 21042, "epoch": 253} {"train_loss": -18.748594284057617, "global_step": 21043, "epoch": 253} {"train_loss": -18.39536476135254, "global_step": 21044, "epoch": 253} {"train_loss": -18.07036781311035, "global_step": 21045, "epoch": 253} {"train_loss": -18.368528366088867, "global_step": 21046, "epoch": 253} {"train_loss": -18.75571060180664, "global_step": 21047, "epoch": 253} {"train_loss": -18.725732803344727, "global_step": 21048, "epoch": 253} {"train_loss": -18.300495147705078, "global_step": 21049, "epoch": 253} {"train_loss": -18.225698471069336, "global_step": 21050, "epoch": 253} {"train_loss": -18.347370147705078, "global_step": 21051, "epoch": 253} {"train_loss": -18.592138290405273, "global_step": 21052, "epoch": 253} {"train_loss": -18.176362991333008, "global_step": 21053, "epoch": 253} {"train_loss": -18.740833282470703, "global_step": 21054, "epoch": 253} {"train_loss": -18.293859481811523, "global_step": 21055, "epoch": 253} {"train_loss": -18.435161590576172, "global_step": 21056, "epoch": 253} {"train_loss": -18.286102294921875, "global_step": 21057, "epoch": 253} {"train_loss": -18.20218849182129, "global_step": 21058, "epoch": 253} {"train_loss": -18.388216018676758, "global_step": 21059, "epoch": 253} {"train_loss": -18.972097396850586, "global_step": 21060, "epoch": 253} {"train_loss": -18.28656005859375, "global_step": 21061, "epoch": 253} {"train_loss": -18.55820083618164, "global_step": 21062, "epoch": 253} {"train_loss": -18.36610984802246, "global_step": 21063, "epoch": 253} {"train_loss": -18.624792098999023, "global_step": 21064, "epoch": 253} {"train_loss": -17.972461700439453, "global_step": 21065, "epoch": 253} {"train_loss": -18.671911239624023, "global_step": 21066, "epoch": 253} {"train_loss": -18.40772247314453, "global_step": 21067, "epoch": 253} {"train_loss": -18.361881256103516, "global_step": 21068, "epoch": 253} {"train_loss": -18.63239097595215, "global_step": 21069, "epoch": 253} {"train_loss": -18.534061431884766, "global_step": 21070, "epoch": 253} {"train_loss": -18.177465438842773, "global_step": 21071, "epoch": 253} {"train_loss": -18.35206413269043, "global_step": 21072, "epoch": 253} {"train_loss": -18.667226791381836, "global_step": 21073, "epoch": 253} {"train_loss": -18.09006118774414, "global_step": 21074, "epoch": 253} {"train_loss": -18.435827255249023, "global_step": 21075, "epoch": 253} {"train_loss": -18.674467086791992, "global_step": 21076, "epoch": 253} {"train_loss": -18.4891300201416, "global_step": 21077, "epoch": 253} {"train_loss": -18.240022659301758, "global_step": 21078, "epoch": 253} {"train_loss": -18.102643966674805, "global_step": 21079, "epoch": 253} {"train_loss": -18.35979461669922, "global_step": 21080, "epoch": 253} {"train_loss": -18.385371150740657, "global_step": 21081, "epoch": 253, "val_loss": 5931734.0} {"train_loss": -18.461231231689453, "global_step": 21082, "epoch": 254} {"train_loss": -18.52652359008789, "global_step": 21083, "epoch": 254} {"train_loss": -18.372169494628906, "global_step": 21084, "epoch": 254} {"train_loss": -18.531240463256836, "global_step": 21085, "epoch": 254} {"train_loss": -18.500547409057617, "global_step": 21086, "epoch": 254} {"train_loss": -18.261398315429688, "global_step": 21087, "epoch": 254} {"train_loss": -18.73992347717285, "global_step": 21088, "epoch": 254} {"train_loss": -18.26927947998047, "global_step": 21089, "epoch": 254} {"train_loss": -18.710046768188477, "global_step": 21090, "epoch": 254} {"train_loss": -18.502662658691406, "global_step": 21091, "epoch": 254} {"train_loss": -18.30767822265625, "global_step": 21092, "epoch": 254} {"train_loss": -18.391218185424805, "global_step": 21093, "epoch": 254} {"train_loss": -18.569049835205078, "global_step": 21094, "epoch": 254} {"train_loss": -17.954641342163086, "global_step": 21095, "epoch": 254} {"train_loss": -18.12392234802246, "global_step": 21096, "epoch": 254} {"train_loss": -18.47041130065918, "global_step": 21097, "epoch": 254} {"train_loss": -18.326765060424805, "global_step": 21098, "epoch": 254} {"train_loss": -18.5403995513916, "global_step": 21099, "epoch": 254} {"train_loss": -18.41727638244629, "global_step": 21100, "epoch": 254} {"train_loss": -18.274917602539062, "global_step": 21101, "epoch": 254} {"train_loss": -18.691564559936523, "global_step": 21102, "epoch": 254} {"train_loss": -18.194490432739258, "global_step": 21103, "epoch": 254} {"train_loss": -18.072315216064453, "global_step": 21104, "epoch": 254} {"train_loss": -18.350584030151367, "global_step": 21105, "epoch": 254} {"train_loss": -18.595733642578125, "global_step": 21106, "epoch": 254} {"train_loss": -18.31365966796875, "global_step": 21107, "epoch": 254} {"train_loss": -18.533966064453125, "global_step": 21108, "epoch": 254} {"train_loss": -18.39923667907715, "global_step": 21109, "epoch": 254} {"train_loss": -18.582448959350586, "global_step": 21110, "epoch": 254} {"train_loss": -18.226938247680664, "global_step": 21111, "epoch": 254} {"train_loss": -18.46241569519043, "global_step": 21112, "epoch": 254} {"train_loss": -18.381742477416992, "global_step": 21113, "epoch": 254} {"train_loss": -18.175390243530273, "global_step": 21114, "epoch": 254} {"train_loss": -18.549606323242188, "global_step": 21115, "epoch": 254} {"train_loss": -18.146392822265625, "global_step": 21116, "epoch": 254} {"train_loss": -18.25406837463379, "global_step": 21117, "epoch": 254} {"train_loss": -18.644826889038086, "global_step": 21118, "epoch": 254} {"train_loss": -18.49808692932129, "global_step": 21119, "epoch": 254} {"train_loss": -18.4746150970459, "global_step": 21120, "epoch": 254} {"train_loss": -18.25324249267578, "global_step": 21121, "epoch": 254} {"train_loss": -18.648025512695312, "global_step": 21122, "epoch": 254} {"train_loss": -18.52924919128418, "global_step": 21123, "epoch": 254} {"train_loss": -18.465024948120117, "global_step": 21124, "epoch": 254} {"train_loss": -18.495849609375, "global_step": 21125, "epoch": 254} {"train_loss": -18.487812042236328, "global_step": 21126, "epoch": 254} {"train_loss": -18.565122604370117, "global_step": 21127, "epoch": 254} {"train_loss": -18.275548934936523, "global_step": 21128, "epoch": 254} {"train_loss": -18.522520065307617, "global_step": 21129, "epoch": 254} {"train_loss": -18.312734603881836, "global_step": 21130, "epoch": 254} {"train_loss": -18.325721740722656, "global_step": 21131, "epoch": 254} {"train_loss": -18.422313690185547, "global_step": 21132, "epoch": 254} {"train_loss": -18.58519172668457, "global_step": 21133, "epoch": 254} {"train_loss": -18.74598503112793, "global_step": 21134, "epoch": 254} {"train_loss": -18.659494400024414, "global_step": 21135, "epoch": 254} {"train_loss": -18.47112464904785, "global_step": 21136, "epoch": 254} {"train_loss": -18.46246910095215, "global_step": 21137, "epoch": 254} {"train_loss": -18.59781837463379, "global_step": 21138, "epoch": 254} {"train_loss": -18.60433006286621, "global_step": 21139, "epoch": 254} {"train_loss": -18.51423454284668, "global_step": 21140, "epoch": 254} {"train_loss": -18.62937355041504, "global_step": 21141, "epoch": 254} {"train_loss": -18.332754135131836, "global_step": 21142, "epoch": 254} {"train_loss": -18.722980499267578, "global_step": 21143, "epoch": 254} {"train_loss": -18.5673770904541, "global_step": 21144, "epoch": 254} {"train_loss": -18.471782684326172, "global_step": 21145, "epoch": 254} {"train_loss": -18.50336265563965, "global_step": 21146, "epoch": 254} {"train_loss": -18.47071647644043, "global_step": 21147, "epoch": 254} {"train_loss": -18.481372833251953, "global_step": 21148, "epoch": 254} {"train_loss": -18.13970947265625, "global_step": 21149, "epoch": 254} {"train_loss": -18.562482833862305, "global_step": 21150, "epoch": 254} {"train_loss": -18.15264892578125, "global_step": 21151, "epoch": 254} {"train_loss": -18.472463607788086, "global_step": 21152, "epoch": 254} {"train_loss": -18.39864158630371, "global_step": 21153, "epoch": 254} {"train_loss": -18.324186325073242, "global_step": 21154, "epoch": 254} {"train_loss": -18.797285079956055, "global_step": 21155, "epoch": 254} {"train_loss": -18.42807960510254, "global_step": 21156, "epoch": 254} {"train_loss": -18.324127197265625, "global_step": 21157, "epoch": 254} {"train_loss": -18.348846435546875, "global_step": 21158, "epoch": 254} {"train_loss": -17.734439849853516, "global_step": 21159, "epoch": 254} {"train_loss": -18.46674919128418, "global_step": 21160, "epoch": 254} {"train_loss": -18.35402488708496, "global_step": 21161, "epoch": 254} {"train_loss": -18.588340759277344, "global_step": 21162, "epoch": 254} {"train_loss": -18.276206970214844, "global_step": 21163, "epoch": 254} {"train_loss": -18.411932726940478, "global_step": 21164, "epoch": 254, "val_loss": 6063407.5} {"train_loss": -18.15043067932129, "global_step": 21165, "epoch": 255} {"train_loss": -18.456436157226562, "global_step": 21166, "epoch": 255} {"train_loss": -18.278783798217773, "global_step": 21167, "epoch": 255} {"train_loss": -17.903173446655273, "global_step": 21168, "epoch": 255} {"train_loss": -18.44827651977539, "global_step": 21169, "epoch": 255} {"train_loss": -17.944791793823242, "global_step": 21170, "epoch": 255} {"train_loss": -17.926834106445312, "global_step": 21171, "epoch": 255} {"train_loss": -18.319669723510742, "global_step": 21172, "epoch": 255} {"train_loss": -18.064016342163086, "global_step": 21173, "epoch": 255} {"train_loss": -18.108478546142578, "global_step": 21174, "epoch": 255} {"train_loss": -18.40247917175293, "global_step": 21175, "epoch": 255} {"train_loss": -17.84251594543457, "global_step": 21176, "epoch": 255} {"train_loss": -18.300756454467773, "global_step": 21177, "epoch": 255} {"train_loss": -18.338584899902344, "global_step": 21178, "epoch": 255} {"train_loss": -18.040395736694336, "global_step": 21179, "epoch": 255} {"train_loss": -18.196889877319336, "global_step": 21180, "epoch": 255} {"train_loss": -18.74127769470215, "global_step": 21181, "epoch": 255} {"train_loss": -18.39653778076172, "global_step": 21182, "epoch": 255} {"train_loss": -18.49421501159668, "global_step": 21183, "epoch": 255} {"train_loss": -18.324695587158203, "global_step": 21184, "epoch": 255} {"train_loss": -18.11115837097168, "global_step": 21185, "epoch": 255} {"train_loss": -17.998212814331055, "global_step": 21186, "epoch": 255} {"train_loss": -18.5562744140625, "global_step": 21187, "epoch": 255} {"train_loss": -18.337385177612305, "global_step": 21188, "epoch": 255} {"train_loss": -18.392248153686523, "global_step": 21189, "epoch": 255} {"train_loss": -18.494205474853516, "global_step": 21190, "epoch": 255} {"train_loss": -18.96059226989746, "global_step": 21191, "epoch": 255} {"train_loss": -18.226926803588867, "global_step": 21192, "epoch": 255} {"train_loss": -18.701505661010742, "global_step": 21193, "epoch": 255} {"train_loss": -18.32953453063965, "global_step": 21194, "epoch": 255} {"train_loss": -18.3496150970459, "global_step": 21195, "epoch": 255} {"train_loss": -18.484861373901367, "global_step": 21196, "epoch": 255} {"train_loss": -18.4061222076416, "global_step": 21197, "epoch": 255} {"train_loss": -18.665180206298828, "global_step": 21198, "epoch": 255} {"train_loss": -18.216796875, "global_step": 21199, "epoch": 255} {"train_loss": -18.338592529296875, "global_step": 21200, "epoch": 255} {"train_loss": -18.09347915649414, "global_step": 21201, "epoch": 255} {"train_loss": -18.58595848083496, "global_step": 21202, "epoch": 255} {"train_loss": -18.71895408630371, "global_step": 21203, "epoch": 255} {"train_loss": -18.275007247924805, "global_step": 21204, "epoch": 255} {"train_loss": -18.46134376525879, "global_step": 21205, "epoch": 255} {"train_loss": -18.49176597595215, "global_step": 21206, "epoch": 255} {"train_loss": -18.349990844726562, "global_step": 21207, "epoch": 255} {"train_loss": -18.678998947143555, "global_step": 21208, "epoch": 255} {"train_loss": -18.258941650390625, "global_step": 21209, "epoch": 255} {"train_loss": -18.436500549316406, "global_step": 21210, "epoch": 255} {"train_loss": -18.498525619506836, "global_step": 21211, "epoch": 255} {"train_loss": -18.60816764831543, "global_step": 21212, "epoch": 255} {"train_loss": -19.00327491760254, "global_step": 21213, "epoch": 255} {"train_loss": -18.587997436523438, "global_step": 21214, "epoch": 255} {"train_loss": -18.32294273376465, "global_step": 21215, "epoch": 255} {"train_loss": -18.46600914001465, "global_step": 21216, "epoch": 255} {"train_loss": -18.409744262695312, "global_step": 21217, "epoch": 255} {"train_loss": -18.419158935546875, "global_step": 21218, "epoch": 255} {"train_loss": -18.46681785583496, "global_step": 21219, "epoch": 255} {"train_loss": -18.495763778686523, "global_step": 21220, "epoch": 255} {"train_loss": -18.650171279907227, "global_step": 21221, "epoch": 255} {"train_loss": -18.74055290222168, "global_step": 21222, "epoch": 255} {"train_loss": -18.608671188354492, "global_step": 21223, "epoch": 255} {"train_loss": -18.753889083862305, "global_step": 21224, "epoch": 255} {"train_loss": -18.650203704833984, "global_step": 21225, "epoch": 255} {"train_loss": -18.72971534729004, "global_step": 21226, "epoch": 255} {"train_loss": -18.74873924255371, "global_step": 21227, "epoch": 255} {"train_loss": -18.896045684814453, "global_step": 21228, "epoch": 255} {"train_loss": -18.526540756225586, "global_step": 21229, "epoch": 255} {"train_loss": -18.323001861572266, "global_step": 21230, "epoch": 255} {"train_loss": -18.2850341796875, "global_step": 21231, "epoch": 255} {"train_loss": -18.3183650970459, "global_step": 21232, "epoch": 255} {"train_loss": -18.608728408813477, "global_step": 21233, "epoch": 255} {"train_loss": -18.50113296508789, "global_step": 21234, "epoch": 255} {"train_loss": -18.491910934448242, "global_step": 21235, "epoch": 255} {"train_loss": -18.863393783569336, "global_step": 21236, "epoch": 255} {"train_loss": -18.908767700195312, "global_step": 21237, "epoch": 255} {"train_loss": -18.57295036315918, "global_step": 21238, "epoch": 255} {"train_loss": -18.13760757446289, "global_step": 21239, "epoch": 255} {"train_loss": -18.084264755249023, "global_step": 21240, "epoch": 255} {"train_loss": -18.78390884399414, "global_step": 21241, "epoch": 255} {"train_loss": -18.406349182128906, "global_step": 21242, "epoch": 255} {"train_loss": -18.1994686126709, "global_step": 21243, "epoch": 255} {"train_loss": -17.73486328125, "global_step": 21244, "epoch": 255} {"train_loss": -18.410436630249023, "global_step": 21245, "epoch": 255} {"train_loss": -18.411731719970703, "global_step": 21246, "epoch": 255} {"train_loss": -18.40030477133142, "global_step": 21247, "epoch": 255, "val_loss": 5927775.0} {"train_loss": -18.173492431640625, "global_step": 21248, "epoch": 256} {"train_loss": -18.384925842285156, "global_step": 21249, "epoch": 256} {"train_loss": -18.75739288330078, "global_step": 21250, "epoch": 256} {"train_loss": -18.4970760345459, "global_step": 21251, "epoch": 256} {"train_loss": -18.575084686279297, "global_step": 21252, "epoch": 256} {"train_loss": -18.511266708374023, "global_step": 21253, "epoch": 256} {"train_loss": -18.560739517211914, "global_step": 21254, "epoch": 256} {"train_loss": -18.216659545898438, "global_step": 21255, "epoch": 256} {"train_loss": -18.739376068115234, "global_step": 21256, "epoch": 256} {"train_loss": -18.49344825744629, "global_step": 21257, "epoch": 256} {"train_loss": -18.294038772583008, "global_step": 21258, "epoch": 256} {"train_loss": -18.4425048828125, "global_step": 21259, "epoch": 256} {"train_loss": -18.50330924987793, "global_step": 21260, "epoch": 256} {"train_loss": -18.307647705078125, "global_step": 21261, "epoch": 256} {"train_loss": -18.417667388916016, "global_step": 21262, "epoch": 256} {"train_loss": -18.46262550354004, "global_step": 21263, "epoch": 256} {"train_loss": -18.582590103149414, "global_step": 21264, "epoch": 256} {"train_loss": -18.440776824951172, "global_step": 21265, "epoch": 256} {"train_loss": -18.59797477722168, "global_step": 21266, "epoch": 256} {"train_loss": -18.420272827148438, "global_step": 21267, "epoch": 256} {"train_loss": -18.544382095336914, "global_step": 21268, "epoch": 256} {"train_loss": -18.405216217041016, "global_step": 21269, "epoch": 256} {"train_loss": -18.161100387573242, "global_step": 21270, "epoch": 256} {"train_loss": -18.300302505493164, "global_step": 21271, "epoch": 256} {"train_loss": -18.48638343811035, "global_step": 21272, "epoch": 256} {"train_loss": -18.418838500976562, "global_step": 21273, "epoch": 256} {"train_loss": -18.543195724487305, "global_step": 21274, "epoch": 256} {"train_loss": -18.204193115234375, "global_step": 21275, "epoch": 256} {"train_loss": -18.193113327026367, "global_step": 21276, "epoch": 256} {"train_loss": -18.075584411621094, "global_step": 21277, "epoch": 256} {"train_loss": -18.175872802734375, "global_step": 21278, "epoch": 256} {"train_loss": -18.823837280273438, "global_step": 21279, "epoch": 256} {"train_loss": -18.308435440063477, "global_step": 21280, "epoch": 256} {"train_loss": -18.6347599029541, "global_step": 21281, "epoch": 256} {"train_loss": -18.450088500976562, "global_step": 21282, "epoch": 256} {"train_loss": -18.415855407714844, "global_step": 21283, "epoch": 256} {"train_loss": -18.61032485961914, "global_step": 21284, "epoch": 256} {"train_loss": -18.352705001831055, "global_step": 21285, "epoch": 256} {"train_loss": -18.551603317260742, "global_step": 21286, "epoch": 256} {"train_loss": -18.334129333496094, "global_step": 21287, "epoch": 256} {"train_loss": -18.609434127807617, "global_step": 21288, "epoch": 256} {"train_loss": -18.42610740661621, "global_step": 21289, "epoch": 256} {"train_loss": -18.33127784729004, "global_step": 21290, "epoch": 256} {"train_loss": -18.353713989257812, "global_step": 21291, "epoch": 256} {"train_loss": -18.76212501525879, "global_step": 21292, "epoch": 256} {"train_loss": -18.291608810424805, "global_step": 21293, "epoch": 256} {"train_loss": -18.500436782836914, "global_step": 21294, "epoch": 256} {"train_loss": -18.205869674682617, "global_step": 21295, "epoch": 256} {"train_loss": -18.625097274780273, "global_step": 21296, "epoch": 256} {"train_loss": -18.537343978881836, "global_step": 21297, "epoch": 256} {"train_loss": -18.67984962463379, "global_step": 21298, "epoch": 256} {"train_loss": -18.480016708374023, "global_step": 21299, "epoch": 256} {"train_loss": -18.519901275634766, "global_step": 21300, "epoch": 256} {"train_loss": -18.55023765563965, "global_step": 21301, "epoch": 256} {"train_loss": -18.571435928344727, "global_step": 21302, "epoch": 256} {"train_loss": -18.453811645507812, "global_step": 21303, "epoch": 256} {"train_loss": -18.506629943847656, "global_step": 21304, "epoch": 256} {"train_loss": -18.526968002319336, "global_step": 21305, "epoch": 256} {"train_loss": -18.293729782104492, "global_step": 21306, "epoch": 256} {"train_loss": -18.59834861755371, "global_step": 21307, "epoch": 256} {"train_loss": -18.554325103759766, "global_step": 21308, "epoch": 256} {"train_loss": -18.47249412536621, "global_step": 21309, "epoch": 256} {"train_loss": -18.457738876342773, "global_step": 21310, "epoch": 256} {"train_loss": -18.519468307495117, "global_step": 21311, "epoch": 256} {"train_loss": -18.120864868164062, "global_step": 21312, "epoch": 256} {"train_loss": -18.38460350036621, "global_step": 21313, "epoch": 256} {"train_loss": -18.3529109954834, "global_step": 21314, "epoch": 256} {"train_loss": -18.007343292236328, "global_step": 21315, "epoch": 256} {"train_loss": -18.732656478881836, "global_step": 21316, "epoch": 256} {"train_loss": -18.63155174255371, "global_step": 21317, "epoch": 256} {"train_loss": -18.452896118164062, "global_step": 21318, "epoch": 256} {"train_loss": -18.638275146484375, "global_step": 21319, "epoch": 256} {"train_loss": -18.328733444213867, "global_step": 21320, "epoch": 256} {"train_loss": -18.670082092285156, "global_step": 21321, "epoch": 256} {"train_loss": -18.01185417175293, "global_step": 21322, "epoch": 256} {"train_loss": -18.694948196411133, "global_step": 21323, "epoch": 256} {"train_loss": -18.485998153686523, "global_step": 21324, "epoch": 256} {"train_loss": -18.606908798217773, "global_step": 21325, "epoch": 256} {"train_loss": -18.318334579467773, "global_step": 21326, "epoch": 256} {"train_loss": -18.42719078063965, "global_step": 21327, "epoch": 256} {"train_loss": -18.566499710083008, "global_step": 21328, "epoch": 256} {"train_loss": -18.65803337097168, "global_step": 21329, "epoch": 256} {"train_loss": -18.454659335584527, "global_step": 21330, "epoch": 256, "val_loss": 5964370.0} {"train_loss": -18.36880874633789, "global_step": 21331, "epoch": 257} {"train_loss": -18.24664878845215, "global_step": 21332, "epoch": 257} {"train_loss": -17.969945907592773, "global_step": 21333, "epoch": 257} {"train_loss": -18.59765625, "global_step": 21334, "epoch": 257} {"train_loss": -18.30683135986328, "global_step": 21335, "epoch": 257} {"train_loss": -18.018070220947266, "global_step": 21336, "epoch": 257} {"train_loss": -18.26004409790039, "global_step": 21337, "epoch": 257} {"train_loss": -18.19122886657715, "global_step": 21338, "epoch": 257} {"train_loss": -18.3941593170166, "global_step": 21339, "epoch": 257} {"train_loss": -18.474422454833984, "global_step": 21340, "epoch": 257} {"train_loss": -18.403915405273438, "global_step": 21341, "epoch": 257} {"train_loss": -18.704069137573242, "global_step": 21342, "epoch": 257} {"train_loss": -18.306182861328125, "global_step": 21343, "epoch": 257} {"train_loss": -18.57647705078125, "global_step": 21344, "epoch": 257} {"train_loss": -18.640527725219727, "global_step": 21345, "epoch": 257} {"train_loss": -18.306615829467773, "global_step": 21346, "epoch": 257} {"train_loss": -18.36164665222168, "global_step": 21347, "epoch": 257} {"train_loss": -18.465150833129883, "global_step": 21348, "epoch": 257} {"train_loss": -18.159366607666016, "global_step": 21349, "epoch": 257} {"train_loss": -18.060062408447266, "global_step": 21350, "epoch": 257} {"train_loss": -18.289691925048828, "global_step": 21351, "epoch": 257} {"train_loss": -18.292078018188477, "global_step": 21352, "epoch": 257} {"train_loss": -18.36089515686035, "global_step": 21353, "epoch": 257} {"train_loss": -18.395938873291016, "global_step": 21354, "epoch": 257} {"train_loss": -18.754302978515625, "global_step": 21355, "epoch": 257} {"train_loss": -18.44767189025879, "global_step": 21356, "epoch": 257} {"train_loss": -18.574344635009766, "global_step": 21357, "epoch": 257} {"train_loss": -18.804441452026367, "global_step": 21358, "epoch": 257} {"train_loss": -18.491941452026367, "global_step": 21359, "epoch": 257} {"train_loss": -18.525768280029297, "global_step": 21360, "epoch": 257} {"train_loss": -17.98349380493164, "global_step": 21361, "epoch": 257} {"train_loss": -18.2165470123291, "global_step": 21362, "epoch": 257} {"train_loss": -18.555051803588867, "global_step": 21363, "epoch": 257} {"train_loss": -18.373634338378906, "global_step": 21364, "epoch": 257} {"train_loss": -18.51346206665039, "global_step": 21365, "epoch": 257} {"train_loss": -18.19272804260254, "global_step": 21366, "epoch": 257} {"train_loss": -18.394067764282227, "global_step": 21367, "epoch": 257} {"train_loss": -18.09966468811035, "global_step": 21368, "epoch": 257} {"train_loss": -18.320907592773438, "global_step": 21369, "epoch": 257} {"train_loss": -18.58424186706543, "global_step": 21370, "epoch": 257} {"train_loss": -18.65433120727539, "global_step": 21371, "epoch": 257} {"train_loss": -18.57904624938965, "global_step": 21372, "epoch": 257} {"train_loss": -18.26799964904785, "global_step": 21373, "epoch": 257} {"train_loss": -18.602468490600586, "global_step": 21374, "epoch": 257} {"train_loss": -18.404129028320312, "global_step": 21375, "epoch": 257} {"train_loss": -18.338483810424805, "global_step": 21376, "epoch": 257} {"train_loss": -18.423980712890625, "global_step": 21377, "epoch": 257} {"train_loss": -18.61891746520996, "global_step": 21378, "epoch": 257} {"train_loss": -18.2805233001709, "global_step": 21379, "epoch": 257} {"train_loss": -18.359289169311523, "global_step": 21380, "epoch": 257} {"train_loss": -18.987613677978516, "global_step": 21381, "epoch": 257} {"train_loss": -18.290849685668945, "global_step": 21382, "epoch": 257} {"train_loss": -18.335651397705078, "global_step": 21383, "epoch": 257} {"train_loss": -18.603046417236328, "global_step": 21384, "epoch": 257} {"train_loss": -18.463542938232422, "global_step": 21385, "epoch": 257} {"train_loss": -18.668527603149414, "global_step": 21386, "epoch": 257} {"train_loss": -18.538175582885742, "global_step": 21387, "epoch": 257} {"train_loss": -18.833890914916992, "global_step": 21388, "epoch": 257} {"train_loss": -18.935012817382812, "global_step": 21389, "epoch": 257} {"train_loss": -18.514602661132812, "global_step": 21390, "epoch": 257} {"train_loss": -18.444150924682617, "global_step": 21391, "epoch": 257} {"train_loss": -18.19009017944336, "global_step": 21392, "epoch": 257} {"train_loss": -18.69880485534668, "global_step": 21393, "epoch": 257} {"train_loss": -18.438262939453125, "global_step": 21394, "epoch": 257} {"train_loss": -18.3894100189209, "global_step": 21395, "epoch": 257} {"train_loss": -18.743600845336914, "global_step": 21396, "epoch": 257} {"train_loss": -18.4780216217041, "global_step": 21397, "epoch": 257} {"train_loss": -18.459232330322266, "global_step": 21398, "epoch": 257} {"train_loss": -18.598814010620117, "global_step": 21399, "epoch": 257} {"train_loss": -18.815326690673828, "global_step": 21400, "epoch": 257} {"train_loss": -18.868452072143555, "global_step": 21401, "epoch": 257} {"train_loss": -18.35603141784668, "global_step": 21402, "epoch": 257} {"train_loss": -18.637800216674805, "global_step": 21403, "epoch": 257} {"train_loss": -18.052518844604492, "global_step": 21404, "epoch": 257} {"train_loss": -18.38482666015625, "global_step": 21405, "epoch": 257} {"train_loss": -18.462923049926758, "global_step": 21406, "epoch": 257} {"train_loss": -18.21636962890625, "global_step": 21407, "epoch": 257} {"train_loss": -18.6711368560791, "global_step": 21408, "epoch": 257} {"train_loss": -18.69768714904785, "global_step": 21409, "epoch": 257} {"train_loss": -18.27726936340332, "global_step": 21410, "epoch": 257} {"train_loss": -18.49248695373535, "global_step": 21411, "epoch": 257} {"train_loss": -18.13983917236328, "global_step": 21412, "epoch": 257} {"train_loss": -18.450932537216737, "global_step": 21413, "epoch": 257, "val_loss": 6090162.0} {"train_loss": -18.53177261352539, "global_step": 21414, "epoch": 258} {"train_loss": -18.302968978881836, "global_step": 21415, "epoch": 258} {"train_loss": -18.18821907043457, "global_step": 21416, "epoch": 258} {"train_loss": -18.193307876586914, "global_step": 21417, "epoch": 258} {"train_loss": -18.355741500854492, "global_step": 21418, "epoch": 258} {"train_loss": -18.114500045776367, "global_step": 21419, "epoch": 258} {"train_loss": -18.368574142456055, "global_step": 21420, "epoch": 258} {"train_loss": -18.492345809936523, "global_step": 21421, "epoch": 258} {"train_loss": -18.256855010986328, "global_step": 21422, "epoch": 258} {"train_loss": -18.421850204467773, "global_step": 21423, "epoch": 258} {"train_loss": -18.496685028076172, "global_step": 21424, "epoch": 258} {"train_loss": -18.3204288482666, "global_step": 21425, "epoch": 258} {"train_loss": -18.142330169677734, "global_step": 21426, "epoch": 258} {"train_loss": -18.34828758239746, "global_step": 21427, "epoch": 258} {"train_loss": -18.24151611328125, "global_step": 21428, "epoch": 258} {"train_loss": -18.54644203186035, "global_step": 21429, "epoch": 258} {"train_loss": -18.500242233276367, "global_step": 21430, "epoch": 258} {"train_loss": -18.059038162231445, "global_step": 21431, "epoch": 258} {"train_loss": -18.469755172729492, "global_step": 21432, "epoch": 258} {"train_loss": -18.5501766204834, "global_step": 21433, "epoch": 258} {"train_loss": -18.635854721069336, "global_step": 21434, "epoch": 258} {"train_loss": -18.097951889038086, "global_step": 21435, "epoch": 258} {"train_loss": -18.529287338256836, "global_step": 21436, "epoch": 258} {"train_loss": -18.646875381469727, "global_step": 21437, "epoch": 258} {"train_loss": -18.416778564453125, "global_step": 21438, "epoch": 258} {"train_loss": -18.822500228881836, "global_step": 21439, "epoch": 258} {"train_loss": -18.5281925201416, "global_step": 21440, "epoch": 258} {"train_loss": -18.547481536865234, "global_step": 21441, "epoch": 258} {"train_loss": -18.35540771484375, "global_step": 21442, "epoch": 258} {"train_loss": -18.384668350219727, "global_step": 21443, "epoch": 258} {"train_loss": -18.765859603881836, "global_step": 21444, "epoch": 258} {"train_loss": -18.426359176635742, "global_step": 21445, "epoch": 258} {"train_loss": -18.292661666870117, "global_step": 21446, "epoch": 258} {"train_loss": -18.469823837280273, "global_step": 21447, "epoch": 258} {"train_loss": -18.166522979736328, "global_step": 21448, "epoch": 258} {"train_loss": -18.27906608581543, "global_step": 21449, "epoch": 258} {"train_loss": -18.5035343170166, "global_step": 21450, "epoch": 258} {"train_loss": -18.69576072692871, "global_step": 21451, "epoch": 258} {"train_loss": -18.589712142944336, "global_step": 21452, "epoch": 258} {"train_loss": -18.64588737487793, "global_step": 21453, "epoch": 258} {"train_loss": -18.249601364135742, "global_step": 21454, "epoch": 258} {"train_loss": -18.902677536010742, "global_step": 21455, "epoch": 258} {"train_loss": -18.402576446533203, "global_step": 21456, "epoch": 258} {"train_loss": -18.64401626586914, "global_step": 21457, "epoch": 258} {"train_loss": -18.579591751098633, "global_step": 21458, "epoch": 258} {"train_loss": -18.30628776550293, "global_step": 21459, "epoch": 258} {"train_loss": -18.20649528503418, "global_step": 21460, "epoch": 258} {"train_loss": -18.484622955322266, "global_step": 21461, "epoch": 258} {"train_loss": -18.453182220458984, "global_step": 21462, "epoch": 258} {"train_loss": -18.53293800354004, "global_step": 21463, "epoch": 258} {"train_loss": -18.36852264404297, "global_step": 21464, "epoch": 258} {"train_loss": -18.60902214050293, "global_step": 21465, "epoch": 258} {"train_loss": -18.654367446899414, "global_step": 21466, "epoch": 258} {"train_loss": -18.428735733032227, "global_step": 21467, "epoch": 258} {"train_loss": -18.666418075561523, "global_step": 21468, "epoch": 258} {"train_loss": -18.391225814819336, "global_step": 21469, "epoch": 258} {"train_loss": -18.27626609802246, "global_step": 21470, "epoch": 258} {"train_loss": -18.51323890686035, "global_step": 21471, "epoch": 258} {"train_loss": -18.459753036499023, "global_step": 21472, "epoch": 258} {"train_loss": -18.492170333862305, "global_step": 21473, "epoch": 258} {"train_loss": -18.805280685424805, "global_step": 21474, "epoch": 258} {"train_loss": -18.56422233581543, "global_step": 21475, "epoch": 258} {"train_loss": -18.223966598510742, "global_step": 21476, "epoch": 258} {"train_loss": -18.54395866394043, "global_step": 21477, "epoch": 258} {"train_loss": -18.7049503326416, "global_step": 21478, "epoch": 258} {"train_loss": -19.09783935546875, "global_step": 21479, "epoch": 258} {"train_loss": -18.427892684936523, "global_step": 21480, "epoch": 258} {"train_loss": -18.730113983154297, "global_step": 21481, "epoch": 258} {"train_loss": -18.44582176208496, "global_step": 21482, "epoch": 258} {"train_loss": -18.305904388427734, "global_step": 21483, "epoch": 258} {"train_loss": -18.199522018432617, "global_step": 21484, "epoch": 258} {"train_loss": -18.541278839111328, "global_step": 21485, "epoch": 258} {"train_loss": -18.64954948425293, "global_step": 21486, "epoch": 258} {"train_loss": -18.07853126525879, "global_step": 21487, "epoch": 258} {"train_loss": -18.560710906982422, "global_step": 21488, "epoch": 258} {"train_loss": -18.437664031982422, "global_step": 21489, "epoch": 258} {"train_loss": -18.877450942993164, "global_step": 21490, "epoch": 258} {"train_loss": -18.60127830505371, "global_step": 21491, "epoch": 258} {"train_loss": -18.74288558959961, "global_step": 21492, "epoch": 258} {"train_loss": -18.360517501831055, "global_step": 21493, "epoch": 258} {"train_loss": -18.44050407409668, "global_step": 21494, "epoch": 258} {"train_loss": -18.889434814453125, "global_step": 21495, "epoch": 258} {"train_loss": -18.46443822010454, "global_step": 21496, "epoch": 258, "val_loss": 5892350.5} {"train_loss": -18.469741821289062, "global_step": 21497, "epoch": 259} {"train_loss": -18.389909744262695, "global_step": 21498, "epoch": 259} {"train_loss": -18.111963272094727, "global_step": 21499, "epoch": 259} {"train_loss": -18.72342872619629, "global_step": 21500, "epoch": 259} {"train_loss": -18.80499267578125, "global_step": 21501, "epoch": 259} {"train_loss": -18.31477165222168, "global_step": 21502, "epoch": 259} {"train_loss": -18.538990020751953, "global_step": 21503, "epoch": 259} {"train_loss": -18.549230575561523, "global_step": 21504, "epoch": 259} {"train_loss": -18.0865478515625, "global_step": 21505, "epoch": 259} {"train_loss": -18.5914306640625, "global_step": 21506, "epoch": 259} {"train_loss": -18.401941299438477, "global_step": 21507, "epoch": 259} {"train_loss": -18.80915641784668, "global_step": 21508, "epoch": 259} {"train_loss": -18.615447998046875, "global_step": 21509, "epoch": 259} {"train_loss": -18.697128295898438, "global_step": 21510, "epoch": 259} {"train_loss": -18.450239181518555, "global_step": 21511, "epoch": 259} {"train_loss": -18.277021408081055, "global_step": 21512, "epoch": 259} {"train_loss": -18.275875091552734, "global_step": 21513, "epoch": 259} {"train_loss": -18.7753963470459, "global_step": 21514, "epoch": 259} {"train_loss": -18.517513275146484, "global_step": 21515, "epoch": 259} {"train_loss": -18.620227813720703, "global_step": 21516, "epoch": 259} {"train_loss": -18.364622116088867, "global_step": 21517, "epoch": 259} {"train_loss": -18.20990753173828, "global_step": 21518, "epoch": 259} {"train_loss": -18.445037841796875, "global_step": 21519, "epoch": 259} {"train_loss": -18.534969329833984, "global_step": 21520, "epoch": 259} {"train_loss": -18.324466705322266, "global_step": 21521, "epoch": 259} {"train_loss": -18.542566299438477, "global_step": 21522, "epoch": 259} {"train_loss": -18.747146606445312, "global_step": 21523, "epoch": 259} {"train_loss": -18.751558303833008, "global_step": 21524, "epoch": 259} {"train_loss": -18.811655044555664, "global_step": 21525, "epoch": 259} {"train_loss": -18.332778930664062, "global_step": 21526, "epoch": 259} {"train_loss": -18.353918075561523, "global_step": 21527, "epoch": 259} {"train_loss": -18.586759567260742, "global_step": 21528, "epoch": 259} {"train_loss": -18.295576095581055, "global_step": 21529, "epoch": 259} {"train_loss": -18.22776985168457, "global_step": 21530, "epoch": 259} {"train_loss": -18.63102149963379, "global_step": 21531, "epoch": 259} {"train_loss": -18.379981994628906, "global_step": 21532, "epoch": 259} {"train_loss": -18.539840698242188, "global_step": 21533, "epoch": 259} {"train_loss": -18.44446563720703, "global_step": 21534, "epoch": 259} {"train_loss": -18.028608322143555, "global_step": 21535, "epoch": 259} {"train_loss": -18.613492965698242, "global_step": 21536, "epoch": 259} {"train_loss": -18.38750457763672, "global_step": 21537, "epoch": 259} {"train_loss": -18.534900665283203, "global_step": 21538, "epoch": 259} {"train_loss": -18.240636825561523, "global_step": 21539, "epoch": 259} {"train_loss": -18.665382385253906, "global_step": 21540, "epoch": 259} {"train_loss": -18.616085052490234, "global_step": 21541, "epoch": 259} {"train_loss": -18.299072265625, "global_step": 21542, "epoch": 259} {"train_loss": -18.519102096557617, "global_step": 21543, "epoch": 259} {"train_loss": -18.169097900390625, "global_step": 21544, "epoch": 259} {"train_loss": -18.37899398803711, "global_step": 21545, "epoch": 259} {"train_loss": -18.44154167175293, "global_step": 21546, "epoch": 259} {"train_loss": -18.57814598083496, "global_step": 21547, "epoch": 259} {"train_loss": -18.622303009033203, "global_step": 21548, "epoch": 259} {"train_loss": -18.756877899169922, "global_step": 21549, "epoch": 259} {"train_loss": -18.25202751159668, "global_step": 21550, "epoch": 259} {"train_loss": -18.61655044555664, "global_step": 21551, "epoch": 259} {"train_loss": -18.11141586303711, "global_step": 21552, "epoch": 259} {"train_loss": -18.621566772460938, "global_step": 21553, "epoch": 259} {"train_loss": -18.482229232788086, "global_step": 21554, "epoch": 259} {"train_loss": -18.562482833862305, "global_step": 21555, "epoch": 259} {"train_loss": -18.530420303344727, "global_step": 21556, "epoch": 259} {"train_loss": -18.540990829467773, "global_step": 21557, "epoch": 259} {"train_loss": -18.748273849487305, "global_step": 21558, "epoch": 259} {"train_loss": -18.15431022644043, "global_step": 21559, "epoch": 259} {"train_loss": -18.669336318969727, "global_step": 21560, "epoch": 259} {"train_loss": -18.430740356445312, "global_step": 21561, "epoch": 259} {"train_loss": -18.49285125732422, "global_step": 21562, "epoch": 259} {"train_loss": -18.641103744506836, "global_step": 21563, "epoch": 259} {"train_loss": -18.317035675048828, "global_step": 21564, "epoch": 259} {"train_loss": -18.374513626098633, "global_step": 21565, "epoch": 259} {"train_loss": -18.179851531982422, "global_step": 21566, "epoch": 259} {"train_loss": -18.264728546142578, "global_step": 21567, "epoch": 259} {"train_loss": -18.152629852294922, "global_step": 21568, "epoch": 259} {"train_loss": -18.76071548461914, "global_step": 21569, "epoch": 259} {"train_loss": -18.252044677734375, "global_step": 21570, "epoch": 259} {"train_loss": -18.300220489501953, "global_step": 21571, "epoch": 259} {"train_loss": -18.58715057373047, "global_step": 21572, "epoch": 259} {"train_loss": -18.569761276245117, "global_step": 21573, "epoch": 259} {"train_loss": -18.3289737701416, "global_step": 21574, "epoch": 259} {"train_loss": -18.562578201293945, "global_step": 21575, "epoch": 259} {"train_loss": -18.3355770111084, "global_step": 21576, "epoch": 259} {"train_loss": -18.51170539855957, "global_step": 21577, "epoch": 259} {"train_loss": -18.59029197692871, "global_step": 21578, "epoch": 259} {"train_loss": -18.463604639811688, "global_step": 21579, "epoch": 259, "val_loss": 6101364.0} {"train_loss": -17.998388290405273, "global_step": 21580, "epoch": 260} {"train_loss": -18.4320011138916, "global_step": 21581, "epoch": 260} {"train_loss": -18.249433517456055, "global_step": 21582, "epoch": 260} {"train_loss": -18.549333572387695, "global_step": 21583, "epoch": 260} {"train_loss": -18.021554946899414, "global_step": 21584, "epoch": 260} {"train_loss": -18.388418197631836, "global_step": 21585, "epoch": 260} {"train_loss": -18.502897262573242, "global_step": 21586, "epoch": 260} {"train_loss": -18.719751358032227, "global_step": 21587, "epoch": 260} {"train_loss": -18.446128845214844, "global_step": 21588, "epoch": 260} {"train_loss": -18.29829978942871, "global_step": 21589, "epoch": 260} {"train_loss": -18.32682228088379, "global_step": 21590, "epoch": 260} {"train_loss": -18.543621063232422, "global_step": 21591, "epoch": 260} {"train_loss": -18.249229431152344, "global_step": 21592, "epoch": 260} {"train_loss": -18.478084564208984, "global_step": 21593, "epoch": 260} {"train_loss": -18.59303092956543, "global_step": 21594, "epoch": 260} {"train_loss": -18.233367919921875, "global_step": 21595, "epoch": 260} {"train_loss": -18.6712589263916, "global_step": 21596, "epoch": 260} {"train_loss": -17.999296188354492, "global_step": 21597, "epoch": 260} {"train_loss": -18.481414794921875, "global_step": 21598, "epoch": 260} {"train_loss": -18.626914978027344, "global_step": 21599, "epoch": 260} {"train_loss": -18.63517189025879, "global_step": 21600, "epoch": 260} {"train_loss": -18.548208236694336, "global_step": 21601, "epoch": 260} {"train_loss": -18.273855209350586, "global_step": 21602, "epoch": 260} {"train_loss": -18.73036003112793, "global_step": 21603, "epoch": 260} {"train_loss": -18.48689079284668, "global_step": 21604, "epoch": 260} {"train_loss": -18.575714111328125, "global_step": 21605, "epoch": 260} {"train_loss": -18.515323638916016, "global_step": 21606, "epoch": 260} {"train_loss": -18.427188873291016, "global_step": 21607, "epoch": 260} {"train_loss": -18.471567153930664, "global_step": 21608, "epoch": 260} {"train_loss": -18.379629135131836, "global_step": 21609, "epoch": 260} {"train_loss": -18.777299880981445, "global_step": 21610, "epoch": 260} {"train_loss": -18.345373153686523, "global_step": 21611, "epoch": 260} {"train_loss": -18.607519149780273, "global_step": 21612, "epoch": 260} {"train_loss": -18.81220054626465, "global_step": 21613, "epoch": 260} {"train_loss": -18.528038024902344, "global_step": 21614, "epoch": 260} {"train_loss": -18.22476577758789, "global_step": 21615, "epoch": 260} {"train_loss": -18.487951278686523, "global_step": 21616, "epoch": 260} {"train_loss": -18.55316162109375, "global_step": 21617, "epoch": 260} {"train_loss": -18.42647361755371, "global_step": 21618, "epoch": 260} {"train_loss": -18.40316390991211, "global_step": 21619, "epoch": 260} {"train_loss": -18.66290855407715, "global_step": 21620, "epoch": 260} {"train_loss": -18.46052360534668, "global_step": 21621, "epoch": 260} {"train_loss": -18.355573654174805, "global_step": 21622, "epoch": 260} {"train_loss": -18.25050926208496, "global_step": 21623, "epoch": 260} {"train_loss": -18.606672286987305, "global_step": 21624, "epoch": 260} {"train_loss": -18.447805404663086, "global_step": 21625, "epoch": 260} {"train_loss": -18.56966781616211, "global_step": 21626, "epoch": 260} {"train_loss": -18.31020164489746, "global_step": 21627, "epoch": 260} {"train_loss": -18.28126335144043, "global_step": 21628, "epoch": 260} {"train_loss": -18.304664611816406, "global_step": 21629, "epoch": 260} {"train_loss": -18.4305477142334, "global_step": 21630, "epoch": 260} {"train_loss": -18.51885986328125, "global_step": 21631, "epoch": 260} {"train_loss": -18.70625877380371, "global_step": 21632, "epoch": 260} {"train_loss": -18.643503189086914, "global_step": 21633, "epoch": 260} {"train_loss": -18.543813705444336, "global_step": 21634, "epoch": 260} {"train_loss": -18.649442672729492, "global_step": 21635, "epoch": 260} {"train_loss": -18.180116653442383, "global_step": 21636, "epoch": 260} {"train_loss": -18.196645736694336, "global_step": 21637, "epoch": 260} {"train_loss": -18.348886489868164, "global_step": 21638, "epoch": 260} {"train_loss": -18.552135467529297, "global_step": 21639, "epoch": 260} {"train_loss": -18.71088218688965, "global_step": 21640, "epoch": 260} {"train_loss": -18.288997650146484, "global_step": 21641, "epoch": 260} {"train_loss": -18.49118995666504, "global_step": 21642, "epoch": 260} {"train_loss": -18.769824981689453, "global_step": 21643, "epoch": 260} {"train_loss": -18.421144485473633, "global_step": 21644, "epoch": 260} {"train_loss": -18.8056697845459, "global_step": 21645, "epoch": 260} {"train_loss": -18.51333236694336, "global_step": 21646, "epoch": 260} {"train_loss": -18.28985595703125, "global_step": 21647, "epoch": 260} {"train_loss": -18.147382736206055, "global_step": 21648, "epoch": 260} {"train_loss": -18.227218627929688, "global_step": 21649, "epoch": 260} {"train_loss": -18.774185180664062, "global_step": 21650, "epoch": 260} {"train_loss": -18.384565353393555, "global_step": 21651, "epoch": 260} {"train_loss": -18.34388542175293, "global_step": 21652, "epoch": 260} {"train_loss": -18.384206771850586, "global_step": 21653, "epoch": 260} {"train_loss": -18.46538734436035, "global_step": 21654, "epoch": 260} {"train_loss": -18.33551597595215, "global_step": 21655, "epoch": 260} {"train_loss": -18.745893478393555, "global_step": 21656, "epoch": 260} {"train_loss": -18.250242233276367, "global_step": 21657, "epoch": 260} {"train_loss": -18.496591567993164, "global_step": 21658, "epoch": 260} {"train_loss": -18.820249557495117, "global_step": 21659, "epoch": 260} {"train_loss": -18.412870407104492, "global_step": 21660, "epoch": 260} {"train_loss": -18.337234497070312, "global_step": 21661, "epoch": 260} {"train_loss": -18.453088599515247, "global_step": 21662, "epoch": 260, "val_loss": 5874381.0} {"train_loss": -17.98598289489746, "global_step": 21663, "epoch": 261} {"train_loss": -17.9226016998291, "global_step": 21664, "epoch": 261} {"train_loss": -18.36374282836914, "global_step": 21665, "epoch": 261} {"train_loss": -18.443500518798828, "global_step": 21666, "epoch": 261} {"train_loss": -18.469491958618164, "global_step": 21667, "epoch": 261} {"train_loss": -18.09177017211914, "global_step": 21668, "epoch": 261} {"train_loss": -18.10329246520996, "global_step": 21669, "epoch": 261} {"train_loss": -18.177785873413086, "global_step": 21670, "epoch": 261} {"train_loss": -18.277942657470703, "global_step": 21671, "epoch": 261} {"train_loss": -18.782596588134766, "global_step": 21672, "epoch": 261} {"train_loss": -18.487104415893555, "global_step": 21673, "epoch": 261} {"train_loss": -18.48469352722168, "global_step": 21674, "epoch": 261} {"train_loss": -18.383222579956055, "global_step": 21675, "epoch": 261} {"train_loss": -17.99156951904297, "global_step": 21676, "epoch": 261} {"train_loss": -18.398319244384766, "global_step": 21677, "epoch": 261} {"train_loss": -18.215234756469727, "global_step": 21678, "epoch": 261} {"train_loss": -18.55992317199707, "global_step": 21679, "epoch": 261} {"train_loss": -18.53864097595215, "global_step": 21680, "epoch": 261} {"train_loss": -18.183242797851562, "global_step": 21681, "epoch": 261} {"train_loss": -18.618860244750977, "global_step": 21682, "epoch": 261} {"train_loss": -18.46552276611328, "global_step": 21683, "epoch": 261} {"train_loss": -18.64350128173828, "global_step": 21684, "epoch": 261} {"train_loss": -18.324934005737305, "global_step": 21685, "epoch": 261} {"train_loss": -18.306264877319336, "global_step": 21686, "epoch": 261} {"train_loss": -18.618261337280273, "global_step": 21687, "epoch": 261} {"train_loss": -18.271162033081055, "global_step": 21688, "epoch": 261} {"train_loss": -18.665176391601562, "global_step": 21689, "epoch": 261} {"train_loss": -18.47208595275879, "global_step": 21690, "epoch": 261} {"train_loss": -18.840919494628906, "global_step": 21691, "epoch": 261} {"train_loss": -18.7402400970459, "global_step": 21692, "epoch": 261} {"train_loss": -18.59528923034668, "global_step": 21693, "epoch": 261} {"train_loss": -18.788883209228516, "global_step": 21694, "epoch": 261} {"train_loss": -18.629810333251953, "global_step": 21695, "epoch": 261} {"train_loss": -18.561511993408203, "global_step": 21696, "epoch": 261} {"train_loss": -18.40006446838379, "global_step": 21697, "epoch": 261} {"train_loss": -18.297306060791016, "global_step": 21698, "epoch": 261} {"train_loss": -18.502796173095703, "global_step": 21699, "epoch": 261} {"train_loss": -18.401914596557617, "global_step": 21700, "epoch": 261} {"train_loss": -18.373966217041016, "global_step": 21701, "epoch": 261} {"train_loss": -18.406408309936523, "global_step": 21702, "epoch": 261} {"train_loss": -18.678232192993164, "global_step": 21703, "epoch": 261} {"train_loss": -18.453548431396484, "global_step": 21704, "epoch": 261} {"train_loss": -18.273269653320312, "global_step": 21705, "epoch": 261} {"train_loss": -18.62895965576172, "global_step": 21706, "epoch": 261} {"train_loss": -18.470783233642578, "global_step": 21707, "epoch": 261} {"train_loss": -18.333452224731445, "global_step": 21708, "epoch": 261} {"train_loss": -18.155073165893555, "global_step": 21709, "epoch": 261} {"train_loss": -18.626556396484375, "global_step": 21710, "epoch": 261} {"train_loss": -18.661046981811523, "global_step": 21711, "epoch": 261} {"train_loss": -18.28181266784668, "global_step": 21712, "epoch": 261} {"train_loss": -18.223581314086914, "global_step": 21713, "epoch": 261} {"train_loss": -18.630924224853516, "global_step": 21714, "epoch": 261} {"train_loss": -18.618074417114258, "global_step": 21715, "epoch": 261} {"train_loss": -18.679550170898438, "global_step": 21716, "epoch": 261} {"train_loss": -18.57406234741211, "global_step": 21717, "epoch": 261} {"train_loss": -18.708805084228516, "global_step": 21718, "epoch": 261} {"train_loss": -18.445253372192383, "global_step": 21719, "epoch": 261} {"train_loss": -18.405853271484375, "global_step": 21720, "epoch": 261} {"train_loss": -18.760578155517578, "global_step": 21721, "epoch": 261} {"train_loss": -18.387300491333008, "global_step": 21722, "epoch": 261} {"train_loss": -18.39206314086914, "global_step": 21723, "epoch": 261} {"train_loss": -18.547882080078125, "global_step": 21724, "epoch": 261} {"train_loss": -18.58502960205078, "global_step": 21725, "epoch": 261} {"train_loss": -18.34359359741211, "global_step": 21726, "epoch": 261} {"train_loss": -18.286314010620117, "global_step": 21727, "epoch": 261} {"train_loss": -18.412343978881836, "global_step": 21728, "epoch": 261} {"train_loss": -17.82997703552246, "global_step": 21729, "epoch": 261} {"train_loss": -18.637893676757812, "global_step": 21730, "epoch": 261} {"train_loss": -18.50532341003418, "global_step": 21731, "epoch": 261} {"train_loss": -18.652767181396484, "global_step": 21732, "epoch": 261} {"train_loss": -18.475631713867188, "global_step": 21733, "epoch": 261} {"train_loss": -18.33036231994629, "global_step": 21734, "epoch": 261} {"train_loss": -18.28911590576172, "global_step": 21735, "epoch": 261} {"train_loss": -18.61825942993164, "global_step": 21736, "epoch": 261} {"train_loss": -18.32724952697754, "global_step": 21737, "epoch": 261} {"train_loss": -18.28426170349121, "global_step": 21738, "epoch": 261} {"train_loss": -18.57545280456543, "global_step": 21739, "epoch": 261} {"train_loss": -18.261560440063477, "global_step": 21740, "epoch": 261} {"train_loss": -18.54737663269043, "global_step": 21741, "epoch": 261} {"train_loss": -18.632291793823242, "global_step": 21742, "epoch": 261} {"train_loss": -18.69891357421875, "global_step": 21743, "epoch": 261} {"train_loss": -18.121662139892578, "global_step": 21744, "epoch": 261} {"train_loss": -18.449480194643318, "global_step": 21745, "epoch": 261, "val_loss": 5923392.5} {"train_loss": -18.51282501220703, "global_step": 21746, "epoch": 262} {"train_loss": -18.507816314697266, "global_step": 21747, "epoch": 262} {"train_loss": -19.06546974182129, "global_step": 21748, "epoch": 262} {"train_loss": -18.23099136352539, "global_step": 21749, "epoch": 262} {"train_loss": -18.531843185424805, "global_step": 21750, "epoch": 262} {"train_loss": -18.680200576782227, "global_step": 21751, "epoch": 262} {"train_loss": -18.643033981323242, "global_step": 21752, "epoch": 262} {"train_loss": -19.111539840698242, "global_step": 21753, "epoch": 262} {"train_loss": -18.456411361694336, "global_step": 21754, "epoch": 262} {"train_loss": -18.292499542236328, "global_step": 21755, "epoch": 262} {"train_loss": -18.61372184753418, "global_step": 21756, "epoch": 262} {"train_loss": -18.656686782836914, "global_step": 21757, "epoch": 262} {"train_loss": -18.621854782104492, "global_step": 21758, "epoch": 262} {"train_loss": -18.155014038085938, "global_step": 21759, "epoch": 262} {"train_loss": -18.27915382385254, "global_step": 21760, "epoch": 262} {"train_loss": -18.4903621673584, "global_step": 21761, "epoch": 262} {"train_loss": -18.7114315032959, "global_step": 21762, "epoch": 262} {"train_loss": -18.54239273071289, "global_step": 21763, "epoch": 262} {"train_loss": -18.48478126525879, "global_step": 21764, "epoch": 262} {"train_loss": -18.51557731628418, "global_step": 21765, "epoch": 262} {"train_loss": -18.062097549438477, "global_step": 21766, "epoch": 262} {"train_loss": -18.695775985717773, "global_step": 21767, "epoch": 262} {"train_loss": -18.217300415039062, "global_step": 21768, "epoch": 262} {"train_loss": -18.278623580932617, "global_step": 21769, "epoch": 262} {"train_loss": -18.26105308532715, "global_step": 21770, "epoch": 262} {"train_loss": -18.423612594604492, "global_step": 21771, "epoch": 262} {"train_loss": -18.497920989990234, "global_step": 21772, "epoch": 262} {"train_loss": -18.61376953125, "global_step": 21773, "epoch": 262} {"train_loss": -18.792692184448242, "global_step": 21774, "epoch": 262} {"train_loss": -18.05500602722168, "global_step": 21775, "epoch": 262} {"train_loss": -18.155820846557617, "global_step": 21776, "epoch": 262} {"train_loss": -18.641935348510742, "global_step": 21777, "epoch": 262} {"train_loss": -18.16394805908203, "global_step": 21778, "epoch": 262} {"train_loss": -18.417814254760742, "global_step": 21779, "epoch": 262} {"train_loss": -18.411212921142578, "global_step": 21780, "epoch": 262} {"train_loss": -18.50995445251465, "global_step": 21781, "epoch": 262} {"train_loss": -18.47959327697754, "global_step": 21782, "epoch": 262} {"train_loss": -18.550329208374023, "global_step": 21783, "epoch": 262} {"train_loss": -18.768285751342773, "global_step": 21784, "epoch": 262} {"train_loss": -18.54096031188965, "global_step": 21785, "epoch": 262} {"train_loss": -18.500600814819336, "global_step": 21786, "epoch": 262} {"train_loss": -18.490772247314453, "global_step": 21787, "epoch": 262} {"train_loss": -18.708526611328125, "global_step": 21788, "epoch": 262} {"train_loss": -18.559431076049805, "global_step": 21789, "epoch": 262} {"train_loss": -18.491165161132812, "global_step": 21790, "epoch": 262} {"train_loss": -18.361616134643555, "global_step": 21791, "epoch": 262} {"train_loss": -18.501508712768555, "global_step": 21792, "epoch": 262} {"train_loss": -18.259130477905273, "global_step": 21793, "epoch": 262} {"train_loss": -18.482797622680664, "global_step": 21794, "epoch": 262} {"train_loss": -18.666664123535156, "global_step": 21795, "epoch": 262} {"train_loss": -18.57557487487793, "global_step": 21796, "epoch": 262} {"train_loss": -18.132497787475586, "global_step": 21797, "epoch": 262} {"train_loss": -18.401708602905273, "global_step": 21798, "epoch": 262} {"train_loss": -18.858522415161133, "global_step": 21799, "epoch": 262} {"train_loss": -18.512296676635742, "global_step": 21800, "epoch": 262} {"train_loss": -18.402414321899414, "global_step": 21801, "epoch": 262} {"train_loss": -18.10359764099121, "global_step": 21802, "epoch": 262} {"train_loss": -18.911611557006836, "global_step": 21803, "epoch": 262} {"train_loss": -18.37639808654785, "global_step": 21804, "epoch": 262} {"train_loss": -18.419157028198242, "global_step": 21805, "epoch": 262} {"train_loss": -18.348905563354492, "global_step": 21806, "epoch": 262} {"train_loss": -18.196548461914062, "global_step": 21807, "epoch": 262} {"train_loss": -18.273136138916016, "global_step": 21808, "epoch": 262} {"train_loss": -18.72188949584961, "global_step": 21809, "epoch": 262} {"train_loss": -18.423938751220703, "global_step": 21810, "epoch": 262} {"train_loss": -18.445552825927734, "global_step": 21811, "epoch": 262} {"train_loss": -18.5568790435791, "global_step": 21812, "epoch": 262} {"train_loss": -18.48247718811035, "global_step": 21813, "epoch": 262} {"train_loss": -18.476621627807617, "global_step": 21814, "epoch": 262} {"train_loss": -18.23137855529785, "global_step": 21815, "epoch": 262} {"train_loss": -18.437742233276367, "global_step": 21816, "epoch": 262} {"train_loss": -18.153701782226562, "global_step": 21817, "epoch": 262} {"train_loss": -18.385099411010742, "global_step": 21818, "epoch": 262} {"train_loss": -18.409683227539062, "global_step": 21819, "epoch": 262} {"train_loss": -18.52224349975586, "global_step": 21820, "epoch": 262} {"train_loss": -18.420316696166992, "global_step": 21821, "epoch": 262} {"train_loss": -18.39588737487793, "global_step": 21822, "epoch": 262} {"train_loss": -18.5393009185791, "global_step": 21823, "epoch": 262} {"train_loss": -18.3458309173584, "global_step": 21824, "epoch": 262} {"train_loss": -18.294057846069336, "global_step": 21825, "epoch": 262} {"train_loss": -18.743505477905273, "global_step": 21826, "epoch": 262} {"train_loss": -18.226032257080078, "global_step": 21827, "epoch": 262} {"train_loss": -18.459577215723243, "global_step": 21828, "epoch": 262, "val_loss": 5964178.0} {"train_loss": -17.817445755004883, "global_step": 21829, "epoch": 263} {"train_loss": -18.286611557006836, "global_step": 21830, "epoch": 263} {"train_loss": -17.84183120727539, "global_step": 21831, "epoch": 263} {"train_loss": -18.29768180847168, "global_step": 21832, "epoch": 263} {"train_loss": -18.093303680419922, "global_step": 21833, "epoch": 263} {"train_loss": -18.24410629272461, "global_step": 21834, "epoch": 263} {"train_loss": -18.60879898071289, "global_step": 21835, "epoch": 263} {"train_loss": -18.457021713256836, "global_step": 21836, "epoch": 263} {"train_loss": -17.82463836669922, "global_step": 21837, "epoch": 263} {"train_loss": -18.361326217651367, "global_step": 21838, "epoch": 263} {"train_loss": -17.945539474487305, "global_step": 21839, "epoch": 263} {"train_loss": -18.44131851196289, "global_step": 21840, "epoch": 263} {"train_loss": -18.032794952392578, "global_step": 21841, "epoch": 263} {"train_loss": -18.293058395385742, "global_step": 21842, "epoch": 263} {"train_loss": -18.142410278320312, "global_step": 21843, "epoch": 263} {"train_loss": -18.511037826538086, "global_step": 21844, "epoch": 263} {"train_loss": -18.333091735839844, "global_step": 21845, "epoch": 263} {"train_loss": -18.52338218688965, "global_step": 21846, "epoch": 263} {"train_loss": -18.213733673095703, "global_step": 21847, "epoch": 263} {"train_loss": -18.538433074951172, "global_step": 21848, "epoch": 263} {"train_loss": -18.300418853759766, "global_step": 21849, "epoch": 263} {"train_loss": -18.760520935058594, "global_step": 21850, "epoch": 263} {"train_loss": -18.29007911682129, "global_step": 21851, "epoch": 263} {"train_loss": -18.602216720581055, "global_step": 21852, "epoch": 263} {"train_loss": -18.16472816467285, "global_step": 21853, "epoch": 263} {"train_loss": -18.260374069213867, "global_step": 21854, "epoch": 263} {"train_loss": -18.249290466308594, "global_step": 21855, "epoch": 263} {"train_loss": -18.945091247558594, "global_step": 21856, "epoch": 263} {"train_loss": -18.455732345581055, "global_step": 21857, "epoch": 263} {"train_loss": -18.174123764038086, "global_step": 21858, "epoch": 263} {"train_loss": -18.440155029296875, "global_step": 21859, "epoch": 263} {"train_loss": -18.446212768554688, "global_step": 21860, "epoch": 263} {"train_loss": -18.188589096069336, "global_step": 21861, "epoch": 263} {"train_loss": -18.588293075561523, "global_step": 21862, "epoch": 263} {"train_loss": -18.150327682495117, "global_step": 21863, "epoch": 263} {"train_loss": -18.635955810546875, "global_step": 21864, "epoch": 263} {"train_loss": -18.527420043945312, "global_step": 21865, "epoch": 263} {"train_loss": -18.549694061279297, "global_step": 21866, "epoch": 263} {"train_loss": -18.379104614257812, "global_step": 21867, "epoch": 263} {"train_loss": -18.273242950439453, "global_step": 21868, "epoch": 263} {"train_loss": -18.48048973083496, "global_step": 21869, "epoch": 263} {"train_loss": -18.27024269104004, "global_step": 21870, "epoch": 263} {"train_loss": -18.629730224609375, "global_step": 21871, "epoch": 263} {"train_loss": -18.41370964050293, "global_step": 21872, "epoch": 263} {"train_loss": -18.551523208618164, "global_step": 21873, "epoch": 263} {"train_loss": -18.667203903198242, "global_step": 21874, "epoch": 263} {"train_loss": -18.613401412963867, "global_step": 21875, "epoch": 263} {"train_loss": -18.811277389526367, "global_step": 21876, "epoch": 263} {"train_loss": -18.161474227905273, "global_step": 21877, "epoch": 263} {"train_loss": -18.441259384155273, "global_step": 21878, "epoch": 263} {"train_loss": -18.400577545166016, "global_step": 21879, "epoch": 263} {"train_loss": -18.748815536499023, "global_step": 21880, "epoch": 263} {"train_loss": -18.044235229492188, "global_step": 21881, "epoch": 263} {"train_loss": -18.175344467163086, "global_step": 21882, "epoch": 263} {"train_loss": -18.36005210876465, "global_step": 21883, "epoch": 263} {"train_loss": -18.727436065673828, "global_step": 21884, "epoch": 263} {"train_loss": -18.147968292236328, "global_step": 21885, "epoch": 263} {"train_loss": -18.30299186706543, "global_step": 21886, "epoch": 263} {"train_loss": -18.44972801208496, "global_step": 21887, "epoch": 263} {"train_loss": -18.80726432800293, "global_step": 21888, "epoch": 263} {"train_loss": -18.61771583557129, "global_step": 21889, "epoch": 263} {"train_loss": -18.267858505249023, "global_step": 21890, "epoch": 263} {"train_loss": -18.66637420654297, "global_step": 21891, "epoch": 263} {"train_loss": -18.370527267456055, "global_step": 21892, "epoch": 263} {"train_loss": -18.4041805267334, "global_step": 21893, "epoch": 263} {"train_loss": -18.548419952392578, "global_step": 21894, "epoch": 263} {"train_loss": -18.493932723999023, "global_step": 21895, "epoch": 263} {"train_loss": -18.660093307495117, "global_step": 21896, "epoch": 263} {"train_loss": -18.610010147094727, "global_step": 21897, "epoch": 263} {"train_loss": -18.619783401489258, "global_step": 21898, "epoch": 263} {"train_loss": -18.186628341674805, "global_step": 21899, "epoch": 263} {"train_loss": -18.345062255859375, "global_step": 21900, "epoch": 263} {"train_loss": -18.667818069458008, "global_step": 21901, "epoch": 263} {"train_loss": -18.44221305847168, "global_step": 21902, "epoch": 263} {"train_loss": -18.863134384155273, "global_step": 21903, "epoch": 263} {"train_loss": -18.593597412109375, "global_step": 21904, "epoch": 263} {"train_loss": -18.70941925048828, "global_step": 21905, "epoch": 263} {"train_loss": -18.52286720275879, "global_step": 21906, "epoch": 263} {"train_loss": -18.68892478942871, "global_step": 21907, "epoch": 263} {"train_loss": -18.243431091308594, "global_step": 21908, "epoch": 263} {"train_loss": -18.417638778686523, "global_step": 21909, "epoch": 263} {"train_loss": -18.88125991821289, "global_step": 21910, "epoch": 263} {"train_loss": -18.42522779717503, "global_step": 21911, "epoch": 263, "val_loss": 6085384.0} {"train_loss": -17.529855728149414, "global_step": 21912, "epoch": 264} {"train_loss": -18.380033493041992, "global_step": 21913, "epoch": 264} {"train_loss": -17.910856246948242, "global_step": 21914, "epoch": 264} {"train_loss": -18.268957138061523, "global_step": 21915, "epoch": 264} {"train_loss": -18.470155715942383, "global_step": 21916, "epoch": 264} {"train_loss": -18.24341583251953, "global_step": 21917, "epoch": 264} {"train_loss": -18.48976707458496, "global_step": 21918, "epoch": 264} {"train_loss": -18.205690383911133, "global_step": 21919, "epoch": 264} {"train_loss": -18.547605514526367, "global_step": 21920, "epoch": 264} {"train_loss": -18.03851890563965, "global_step": 21921, "epoch": 264} {"train_loss": -18.343603134155273, "global_step": 21922, "epoch": 264} {"train_loss": -17.92164421081543, "global_step": 21923, "epoch": 264} {"train_loss": -18.55769157409668, "global_step": 21924, "epoch": 264} {"train_loss": -18.710372924804688, "global_step": 21925, "epoch": 264} {"train_loss": -18.189359664916992, "global_step": 21926, "epoch": 264} {"train_loss": -18.823713302612305, "global_step": 21927, "epoch": 264} {"train_loss": -18.21197509765625, "global_step": 21928, "epoch": 264} {"train_loss": -18.667316436767578, "global_step": 21929, "epoch": 264} {"train_loss": -18.533201217651367, "global_step": 21930, "epoch": 264} {"train_loss": -18.17839241027832, "global_step": 21931, "epoch": 264} {"train_loss": -18.295473098754883, "global_step": 21932, "epoch": 264} {"train_loss": -18.333694458007812, "global_step": 21933, "epoch": 264} {"train_loss": -18.37895965576172, "global_step": 21934, "epoch": 264} {"train_loss": -18.671743392944336, "global_step": 21935, "epoch": 264} {"train_loss": -18.654661178588867, "global_step": 21936, "epoch": 264} {"train_loss": -18.444095611572266, "global_step": 21937, "epoch": 264} {"train_loss": -18.055213928222656, "global_step": 21938, "epoch": 264} {"train_loss": -18.61728286743164, "global_step": 21939, "epoch": 264} {"train_loss": -18.70891761779785, "global_step": 21940, "epoch": 264} {"train_loss": -18.565711975097656, "global_step": 21941, "epoch": 264} {"train_loss": -18.608427047729492, "global_step": 21942, "epoch": 264} {"train_loss": -18.57920265197754, "global_step": 21943, "epoch": 264} {"train_loss": -18.443883895874023, "global_step": 21944, "epoch": 264} {"train_loss": -18.629669189453125, "global_step": 21945, "epoch": 264} {"train_loss": -18.536108016967773, "global_step": 21946, "epoch": 264} {"train_loss": -18.093130111694336, "global_step": 21947, "epoch": 264} {"train_loss": -18.723621368408203, "global_step": 21948, "epoch": 264} {"train_loss": -19.056026458740234, "global_step": 21949, "epoch": 264} {"train_loss": -18.482954025268555, "global_step": 21950, "epoch": 264} {"train_loss": -18.45994758605957, "global_step": 21951, "epoch": 264} {"train_loss": -18.488941192626953, "global_step": 21952, "epoch": 264} {"train_loss": -18.202871322631836, "global_step": 21953, "epoch": 264} {"train_loss": -18.45606231689453, "global_step": 21954, "epoch": 264} {"train_loss": -18.235265731811523, "global_step": 21955, "epoch": 264} {"train_loss": -18.743288040161133, "global_step": 21956, "epoch": 264} {"train_loss": -18.611133575439453, "global_step": 21957, "epoch": 264} {"train_loss": -18.434762954711914, "global_step": 21958, "epoch": 264} {"train_loss": -18.418636322021484, "global_step": 21959, "epoch": 264} {"train_loss": -18.36395835876465, "global_step": 21960, "epoch": 264} {"train_loss": -18.526700973510742, "global_step": 21961, "epoch": 264} {"train_loss": -18.439939498901367, "global_step": 21962, "epoch": 264} {"train_loss": -18.613683700561523, "global_step": 21963, "epoch": 264} {"train_loss": -18.372163772583008, "global_step": 21964, "epoch": 264} {"train_loss": -18.560026168823242, "global_step": 21965, "epoch": 264} {"train_loss": -18.180931091308594, "global_step": 21966, "epoch": 264} {"train_loss": -18.81697654724121, "global_step": 21967, "epoch": 264} {"train_loss": -18.58180046081543, "global_step": 21968, "epoch": 264} {"train_loss": -18.396833419799805, "global_step": 21969, "epoch": 264} {"train_loss": -18.194578170776367, "global_step": 21970, "epoch": 264} {"train_loss": -18.80914878845215, "global_step": 21971, "epoch": 264} {"train_loss": -18.17432975769043, "global_step": 21972, "epoch": 264} {"train_loss": -19.14823341369629, "global_step": 21973, "epoch": 264} {"train_loss": -18.684782028198242, "global_step": 21974, "epoch": 264} {"train_loss": -18.58241081237793, "global_step": 21975, "epoch": 264} {"train_loss": -18.573076248168945, "global_step": 21976, "epoch": 264} {"train_loss": -18.353044509887695, "global_step": 21977, "epoch": 264} {"train_loss": -18.469547271728516, "global_step": 21978, "epoch": 264} {"train_loss": -18.456647872924805, "global_step": 21979, "epoch": 264} {"train_loss": -18.490737915039062, "global_step": 21980, "epoch": 264} {"train_loss": -18.291391372680664, "global_step": 21981, "epoch": 264} {"train_loss": -18.384220123291016, "global_step": 21982, "epoch": 264} {"train_loss": -18.50187110900879, "global_step": 21983, "epoch": 264} {"train_loss": -18.396825790405273, "global_step": 21984, "epoch": 264} {"train_loss": -18.595373153686523, "global_step": 21985, "epoch": 264} {"train_loss": -18.750259399414062, "global_step": 21986, "epoch": 264} {"train_loss": -18.47212791442871, "global_step": 21987, "epoch": 264} {"train_loss": -18.595064163208008, "global_step": 21988, "epoch": 264} {"train_loss": -18.60858917236328, "global_step": 21989, "epoch": 264} {"train_loss": -18.578535079956055, "global_step": 21990, "epoch": 264} {"train_loss": -18.551116943359375, "global_step": 21991, "epoch": 264} {"train_loss": -18.26563262939453, "global_step": 21992, "epoch": 264} {"train_loss": -18.221460342407227, "global_step": 21993, "epoch": 264} {"train_loss": -18.45922095517078, "global_step": 21994, "epoch": 264, "val_loss": 6000329.5} {"train_loss": -17.92751121520996, "global_step": 21995, "epoch": 265} {"train_loss": -18.657602310180664, "global_step": 21996, "epoch": 265} {"train_loss": -18.206113815307617, "global_step": 21997, "epoch": 265} {"train_loss": -18.131959915161133, "global_step": 21998, "epoch": 265} {"train_loss": -18.28365135192871, "global_step": 21999, "epoch": 265} {"train_loss": -18.12387466430664, "global_step": 22000, "epoch": 265} {"train_loss": -18.401334762573242, "global_step": 22001, "epoch": 265} {"train_loss": -18.55597496032715, "global_step": 22002, "epoch": 265} {"train_loss": -18.721471786499023, "global_step": 22003, "epoch": 265} {"train_loss": -18.76337242126465, "global_step": 22004, "epoch": 265} {"train_loss": -18.348283767700195, "global_step": 22005, "epoch": 265} {"train_loss": -18.34891128540039, "global_step": 22006, "epoch": 265} {"train_loss": -18.204118728637695, "global_step": 22007, "epoch": 265} {"train_loss": -18.162120819091797, "global_step": 22008, "epoch": 265} {"train_loss": -18.36526870727539, "global_step": 22009, "epoch": 265} {"train_loss": -18.65079689025879, "global_step": 22010, "epoch": 265} {"train_loss": -18.54507064819336, "global_step": 22011, "epoch": 265} {"train_loss": -18.241619110107422, "global_step": 22012, "epoch": 265} {"train_loss": -18.75168800354004, "global_step": 22013, "epoch": 265} {"train_loss": -18.488494873046875, "global_step": 22014, "epoch": 265} {"train_loss": -18.849689483642578, "global_step": 22015, "epoch": 265} {"train_loss": -17.961381912231445, "global_step": 22016, "epoch": 265} {"train_loss": -18.406728744506836, "global_step": 22017, "epoch": 265} {"train_loss": -18.770328521728516, "global_step": 22018, "epoch": 265} {"train_loss": -18.510589599609375, "global_step": 22019, "epoch": 265} {"train_loss": -18.603073120117188, "global_step": 22020, "epoch": 265} {"train_loss": -18.54024314880371, "global_step": 22021, "epoch": 265} {"train_loss": -18.108057022094727, "global_step": 22022, "epoch": 265} {"train_loss": -18.352336883544922, "global_step": 22023, "epoch": 265} {"train_loss": -18.319631576538086, "global_step": 22024, "epoch": 265} {"train_loss": -18.345714569091797, "global_step": 22025, "epoch": 265} {"train_loss": -18.27956771850586, "global_step": 22026, "epoch": 265} {"train_loss": -18.464893341064453, "global_step": 22027, "epoch": 265} {"train_loss": -18.738012313842773, "global_step": 22028, "epoch": 265} {"train_loss": -18.26544761657715, "global_step": 22029, "epoch": 265} {"train_loss": -18.62394905090332, "global_step": 22030, "epoch": 265} {"train_loss": -18.585865020751953, "global_step": 22031, "epoch": 265} {"train_loss": -18.74713134765625, "global_step": 22032, "epoch": 265} {"train_loss": -18.72430992126465, "global_step": 22033, "epoch": 265} {"train_loss": -18.702585220336914, "global_step": 22034, "epoch": 265} {"train_loss": -18.297086715698242, "global_step": 22035, "epoch": 265} {"train_loss": -18.67792320251465, "global_step": 22036, "epoch": 265} {"train_loss": -18.723600387573242, "global_step": 22037, "epoch": 265} {"train_loss": -18.437870025634766, "global_step": 22038, "epoch": 265} {"train_loss": -18.537921905517578, "global_step": 22039, "epoch": 265} {"train_loss": -18.38495445251465, "global_step": 22040, "epoch": 265} {"train_loss": -18.5394287109375, "global_step": 22041, "epoch": 265} {"train_loss": -18.443876266479492, "global_step": 22042, "epoch": 265} {"train_loss": -18.178457260131836, "global_step": 22043, "epoch": 265} {"train_loss": -18.170215606689453, "global_step": 22044, "epoch": 265} {"train_loss": -18.90776252746582, "global_step": 22045, "epoch": 265} {"train_loss": -18.31268882751465, "global_step": 22046, "epoch": 265} {"train_loss": -18.74814224243164, "global_step": 22047, "epoch": 265} {"train_loss": -18.330638885498047, "global_step": 22048, "epoch": 265} {"train_loss": -18.707000732421875, "global_step": 22049, "epoch": 265} {"train_loss": -18.431360244750977, "global_step": 22050, "epoch": 265} {"train_loss": -18.64696502685547, "global_step": 22051, "epoch": 265} {"train_loss": -18.55240249633789, "global_step": 22052, "epoch": 265} {"train_loss": -18.670673370361328, "global_step": 22053, "epoch": 265} {"train_loss": -18.697635650634766, "global_step": 22054, "epoch": 265} {"train_loss": -18.562070846557617, "global_step": 22055, "epoch": 265} {"train_loss": -18.425256729125977, "global_step": 22056, "epoch": 265} {"train_loss": -18.455896377563477, "global_step": 22057, "epoch": 265} {"train_loss": -18.4688663482666, "global_step": 22058, "epoch": 265} {"train_loss": -18.844173431396484, "global_step": 22059, "epoch": 265} {"train_loss": -18.40555763244629, "global_step": 22060, "epoch": 265} {"train_loss": -18.597017288208008, "global_step": 22061, "epoch": 265} {"train_loss": -18.529830932617188, "global_step": 22062, "epoch": 265} {"train_loss": -18.377735137939453, "global_step": 22063, "epoch": 265} {"train_loss": -18.59877586364746, "global_step": 22064, "epoch": 265} {"train_loss": -18.28952407836914, "global_step": 22065, "epoch": 265} {"train_loss": -18.420669555664062, "global_step": 22066, "epoch": 265} {"train_loss": -17.88567352294922, "global_step": 22067, "epoch": 265} {"train_loss": -18.441953659057617, "global_step": 22068, "epoch": 265} {"train_loss": -18.573108673095703, "global_step": 22069, "epoch": 265} {"train_loss": -18.39737892150879, "global_step": 22070, "epoch": 265} {"train_loss": -18.43880271911621, "global_step": 22071, "epoch": 265} {"train_loss": -18.66761589050293, "global_step": 22072, "epoch": 265} {"train_loss": -18.746570587158203, "global_step": 22073, "epoch": 265} {"train_loss": -18.278207778930664, "global_step": 22074, "epoch": 265} {"train_loss": -18.657995223999023, "global_step": 22075, "epoch": 265} {"train_loss": -18.505544662475586, "global_step": 22076, "epoch": 265} {"train_loss": -18.497191854270106, "global_step": 22077, "epoch": 265, "val_loss": 5906384.0} {"train_loss": -18.36363410949707, "global_step": 22078, "epoch": 266} {"train_loss": -17.975522994995117, "global_step": 22079, "epoch": 266} {"train_loss": -18.133872985839844, "global_step": 22080, "epoch": 266} {"train_loss": -18.07771873474121, "global_step": 22081, "epoch": 266} {"train_loss": -18.30531883239746, "global_step": 22082, "epoch": 266} {"train_loss": -18.069934844970703, "global_step": 22083, "epoch": 266} {"train_loss": -18.187040328979492, "global_step": 22084, "epoch": 266} {"train_loss": -18.286649703979492, "global_step": 22085, "epoch": 266} {"train_loss": -18.441761016845703, "global_step": 22086, "epoch": 266} {"train_loss": -18.611783981323242, "global_step": 22087, "epoch": 266} {"train_loss": -18.55645179748535, "global_step": 22088, "epoch": 266} {"train_loss": -18.426931381225586, "global_step": 22089, "epoch": 266} {"train_loss": -18.417491912841797, "global_step": 22090, "epoch": 266} {"train_loss": -18.216588973999023, "global_step": 22091, "epoch": 266} {"train_loss": -18.161314010620117, "global_step": 22092, "epoch": 266} {"train_loss": -18.63148307800293, "global_step": 22093, "epoch": 266} {"train_loss": -18.237104415893555, "global_step": 22094, "epoch": 266} {"train_loss": -18.127532958984375, "global_step": 22095, "epoch": 266} {"train_loss": -18.459875106811523, "global_step": 22096, "epoch": 266} {"train_loss": -18.684812545776367, "global_step": 22097, "epoch": 266} {"train_loss": -18.74408721923828, "global_step": 22098, "epoch": 266} {"train_loss": -18.479496002197266, "global_step": 22099, "epoch": 266} {"train_loss": -17.8022403717041, "global_step": 22100, "epoch": 266} {"train_loss": -18.928510665893555, "global_step": 22101, "epoch": 266} {"train_loss": -18.47764015197754, "global_step": 22102, "epoch": 266} {"train_loss": -18.03419303894043, "global_step": 22103, "epoch": 266} {"train_loss": -18.74654769897461, "global_step": 22104, "epoch": 266} {"train_loss": -18.43381118774414, "global_step": 22105, "epoch": 266} {"train_loss": -18.545286178588867, "global_step": 22106, "epoch": 266} {"train_loss": -18.75786590576172, "global_step": 22107, "epoch": 266} {"train_loss": -18.40518569946289, "global_step": 22108, "epoch": 266} {"train_loss": -18.5669002532959, "global_step": 22109, "epoch": 266} {"train_loss": -18.638822555541992, "global_step": 22110, "epoch": 266} {"train_loss": -18.17268180847168, "global_step": 22111, "epoch": 266} {"train_loss": -18.738162994384766, "global_step": 22112, "epoch": 266} {"train_loss": -18.506145477294922, "global_step": 22113, "epoch": 266} {"train_loss": -18.08552360534668, "global_step": 22114, "epoch": 266} {"train_loss": -18.628971099853516, "global_step": 22115, "epoch": 266} {"train_loss": -18.37565040588379, "global_step": 22116, "epoch": 266} {"train_loss": -18.53985595703125, "global_step": 22117, "epoch": 266} {"train_loss": -18.524688720703125, "global_step": 22118, "epoch": 266} {"train_loss": -18.599323272705078, "global_step": 22119, "epoch": 266} {"train_loss": -18.3569278717041, "global_step": 22120, "epoch": 266} {"train_loss": -18.712364196777344, "global_step": 22121, "epoch": 266} {"train_loss": -18.571306228637695, "global_step": 22122, "epoch": 266} {"train_loss": -18.464553833007812, "global_step": 22123, "epoch": 266} {"train_loss": -18.501232147216797, "global_step": 22124, "epoch": 266} {"train_loss": -18.30915641784668, "global_step": 22125, "epoch": 266} {"train_loss": -18.932079315185547, "global_step": 22126, "epoch": 266} {"train_loss": -18.787660598754883, "global_step": 22127, "epoch": 266} {"train_loss": -18.601076126098633, "global_step": 22128, "epoch": 266} {"train_loss": -18.40436363220215, "global_step": 22129, "epoch": 266} {"train_loss": -18.91547203063965, "global_step": 22130, "epoch": 266} {"train_loss": -18.709638595581055, "global_step": 22131, "epoch": 266} {"train_loss": -18.51750946044922, "global_step": 22132, "epoch": 266} {"train_loss": -18.400678634643555, "global_step": 22133, "epoch": 266} {"train_loss": -18.8194637298584, "global_step": 22134, "epoch": 266} {"train_loss": -18.522871017456055, "global_step": 22135, "epoch": 266} {"train_loss": -18.332075119018555, "global_step": 22136, "epoch": 266} {"train_loss": -18.685592651367188, "global_step": 22137, "epoch": 266} {"train_loss": -18.606027603149414, "global_step": 22138, "epoch": 266} {"train_loss": -18.586889266967773, "global_step": 22139, "epoch": 266} {"train_loss": -18.602018356323242, "global_step": 22140, "epoch": 266} {"train_loss": -18.626413345336914, "global_step": 22141, "epoch": 266} {"train_loss": -18.44550323486328, "global_step": 22142, "epoch": 266} {"train_loss": -18.484853744506836, "global_step": 22143, "epoch": 266} {"train_loss": -18.746763229370117, "global_step": 22144, "epoch": 266} {"train_loss": -18.25623893737793, "global_step": 22145, "epoch": 266} {"train_loss": -18.623319625854492, "global_step": 22146, "epoch": 266} {"train_loss": -18.777273178100586, "global_step": 22147, "epoch": 266} {"train_loss": -18.481969833374023, "global_step": 22148, "epoch": 266} {"train_loss": -18.660953521728516, "global_step": 22149, "epoch": 266} {"train_loss": -18.291893005371094, "global_step": 22150, "epoch": 266} {"train_loss": -18.908409118652344, "global_step": 22151, "epoch": 266} {"train_loss": -18.665470123291016, "global_step": 22152, "epoch": 266} {"train_loss": -18.57822036743164, "global_step": 22153, "epoch": 266} {"train_loss": -18.663436889648438, "global_step": 22154, "epoch": 266} {"train_loss": -18.8667049407959, "global_step": 22155, "epoch": 266} {"train_loss": -19.07894515991211, "global_step": 22156, "epoch": 266} {"train_loss": -18.753297805786133, "global_step": 22157, "epoch": 266} {"train_loss": -18.896421432495117, "global_step": 22158, "epoch": 266} {"train_loss": -18.663129806518555, "global_step": 22159, "epoch": 266} {"train_loss": -18.510195421885296, "global_step": 22160, "epoch": 266, "val_loss": 5925147.0} {"train_loss": -18.52154541015625, "global_step": 22161, "epoch": 267} {"train_loss": -18.098987579345703, "global_step": 22162, "epoch": 267} {"train_loss": -18.528974533081055, "global_step": 22163, "epoch": 267} {"train_loss": -18.576688766479492, "global_step": 22164, "epoch": 267} {"train_loss": -18.31918716430664, "global_step": 22165, "epoch": 267} {"train_loss": -18.310073852539062, "global_step": 22166, "epoch": 267} {"train_loss": -18.413137435913086, "global_step": 22167, "epoch": 267} {"train_loss": -18.24488639831543, "global_step": 22168, "epoch": 267} {"train_loss": -18.65264320373535, "global_step": 22169, "epoch": 267} {"train_loss": -18.086116790771484, "global_step": 22170, "epoch": 267} {"train_loss": -18.244016647338867, "global_step": 22171, "epoch": 267} {"train_loss": -18.815704345703125, "global_step": 22172, "epoch": 267} {"train_loss": -18.51456069946289, "global_step": 22173, "epoch": 267} {"train_loss": -18.4515438079834, "global_step": 22174, "epoch": 267} {"train_loss": -18.405149459838867, "global_step": 22175, "epoch": 267} {"train_loss": -18.331148147583008, "global_step": 22176, "epoch": 267} {"train_loss": -18.572101593017578, "global_step": 22177, "epoch": 267} {"train_loss": -18.58296775817871, "global_step": 22178, "epoch": 267} {"train_loss": -18.609407424926758, "global_step": 22179, "epoch": 267} {"train_loss": -18.5711727142334, "global_step": 22180, "epoch": 267} {"train_loss": -18.874038696289062, "global_step": 22181, "epoch": 267} {"train_loss": -18.83294105529785, "global_step": 22182, "epoch": 267} {"train_loss": -18.45808219909668, "global_step": 22183, "epoch": 267} {"train_loss": -18.359451293945312, "global_step": 22184, "epoch": 267} {"train_loss": -18.58892822265625, "global_step": 22185, "epoch": 267} {"train_loss": -18.484643936157227, "global_step": 22186, "epoch": 267} {"train_loss": -18.323667526245117, "global_step": 22187, "epoch": 267} {"train_loss": -18.168760299682617, "global_step": 22188, "epoch": 267} {"train_loss": -18.657697677612305, "global_step": 22189, "epoch": 267} {"train_loss": -18.744009017944336, "global_step": 22190, "epoch": 267} {"train_loss": -18.444990158081055, "global_step": 22191, "epoch": 267} {"train_loss": -18.603723526000977, "global_step": 22192, "epoch": 267} {"train_loss": -18.800086975097656, "global_step": 22193, "epoch": 267} {"train_loss": -18.962539672851562, "global_step": 22194, "epoch": 267} {"train_loss": -18.747339248657227, "global_step": 22195, "epoch": 267} {"train_loss": -18.522504806518555, "global_step": 22196, "epoch": 267} {"train_loss": -18.528427124023438, "global_step": 22197, "epoch": 267} {"train_loss": -18.256942749023438, "global_step": 22198, "epoch": 267} {"train_loss": -18.465696334838867, "global_step": 22199, "epoch": 267} {"train_loss": -19.050098419189453, "global_step": 22200, "epoch": 267} {"train_loss": -18.389245986938477, "global_step": 22201, "epoch": 267} {"train_loss": -18.658960342407227, "global_step": 22202, "epoch": 267} {"train_loss": -18.415159225463867, "global_step": 22203, "epoch": 267} {"train_loss": -18.605335235595703, "global_step": 22204, "epoch": 267} {"train_loss": -18.387386322021484, "global_step": 22205, "epoch": 267} {"train_loss": -18.580141067504883, "global_step": 22206, "epoch": 267} {"train_loss": -18.038633346557617, "global_step": 22207, "epoch": 267} {"train_loss": -18.551259994506836, "global_step": 22208, "epoch": 267} {"train_loss": -18.373550415039062, "global_step": 22209, "epoch": 267} {"train_loss": -18.598072052001953, "global_step": 22210, "epoch": 267} {"train_loss": -18.58412742614746, "global_step": 22211, "epoch": 267} {"train_loss": -18.731557846069336, "global_step": 22212, "epoch": 267} {"train_loss": -18.64380645751953, "global_step": 22213, "epoch": 267} {"train_loss": -18.22175407409668, "global_step": 22214, "epoch": 267} {"train_loss": -18.53445816040039, "global_step": 22215, "epoch": 267} {"train_loss": -18.610916137695312, "global_step": 22216, "epoch": 267} {"train_loss": -18.642454147338867, "global_step": 22217, "epoch": 267} {"train_loss": -18.372976303100586, "global_step": 22218, "epoch": 267} {"train_loss": -19.1943416595459, "global_step": 22219, "epoch": 267} {"train_loss": -18.1297550201416, "global_step": 22220, "epoch": 267} {"train_loss": -18.67594337463379, "global_step": 22221, "epoch": 267} {"train_loss": -18.04130744934082, "global_step": 22222, "epoch": 267} {"train_loss": -18.589223861694336, "global_step": 22223, "epoch": 267} {"train_loss": -18.61075210571289, "global_step": 22224, "epoch": 267} {"train_loss": -18.512868881225586, "global_step": 22225, "epoch": 267} {"train_loss": -18.719690322875977, "global_step": 22226, "epoch": 267} {"train_loss": -18.384689331054688, "global_step": 22227, "epoch": 267} {"train_loss": -18.5745849609375, "global_step": 22228, "epoch": 267} {"train_loss": -18.247787475585938, "global_step": 22229, "epoch": 267} {"train_loss": -18.732894897460938, "global_step": 22230, "epoch": 267} {"train_loss": -18.358470916748047, "global_step": 22231, "epoch": 267} {"train_loss": -18.641515731811523, "global_step": 22232, "epoch": 267} {"train_loss": -18.549667358398438, "global_step": 22233, "epoch": 267} {"train_loss": -18.59222984313965, "global_step": 22234, "epoch": 267} {"train_loss": -18.797870635986328, "global_step": 22235, "epoch": 267} {"train_loss": -18.411457061767578, "global_step": 22236, "epoch": 267} {"train_loss": -18.73756980895996, "global_step": 22237, "epoch": 267} {"train_loss": -18.999526977539062, "global_step": 22238, "epoch": 267} {"train_loss": -18.342275619506836, "global_step": 22239, "epoch": 267} {"train_loss": -18.47321891784668, "global_step": 22240, "epoch": 267} {"train_loss": -18.305761337280273, "global_step": 22241, "epoch": 267} {"train_loss": -18.289390563964844, "global_step": 22242, "epoch": 267} {"train_loss": -18.517415356923298, "global_step": 22243, "epoch": 267, "val_loss": 5913405.5} {"train_loss": -18.577991485595703, "global_step": 22244, "epoch": 268} {"train_loss": -17.97541618347168, "global_step": 22245, "epoch": 268} {"train_loss": -18.59845542907715, "global_step": 22246, "epoch": 268} {"train_loss": -18.328805923461914, "global_step": 22247, "epoch": 268} {"train_loss": -18.496967315673828, "global_step": 22248, "epoch": 268} {"train_loss": -18.433319091796875, "global_step": 22249, "epoch": 268} {"train_loss": -18.063024520874023, "global_step": 22250, "epoch": 268} {"train_loss": -18.56935691833496, "global_step": 22251, "epoch": 268} {"train_loss": -18.401453018188477, "global_step": 22252, "epoch": 268} {"train_loss": -18.688512802124023, "global_step": 22253, "epoch": 268} {"train_loss": -18.4245662689209, "global_step": 22254, "epoch": 268} {"train_loss": -18.573110580444336, "global_step": 22255, "epoch": 268} {"train_loss": -18.6456356048584, "global_step": 22256, "epoch": 268} {"train_loss": -18.453754425048828, "global_step": 22257, "epoch": 268} {"train_loss": -18.260509490966797, "global_step": 22258, "epoch": 268} {"train_loss": -18.582508087158203, "global_step": 22259, "epoch": 268} {"train_loss": -18.140905380249023, "global_step": 22260, "epoch": 268} {"train_loss": -18.470516204833984, "global_step": 22261, "epoch": 268} {"train_loss": -18.507986068725586, "global_step": 22262, "epoch": 268} {"train_loss": -18.415739059448242, "global_step": 22263, "epoch": 268} {"train_loss": -18.6181640625, "global_step": 22264, "epoch": 268} {"train_loss": -18.754535675048828, "global_step": 22265, "epoch": 268} {"train_loss": -18.845947265625, "global_step": 22266, "epoch": 268} {"train_loss": -18.691633224487305, "global_step": 22267, "epoch": 268} {"train_loss": -18.37619972229004, "global_step": 22268, "epoch": 268} {"train_loss": -18.558393478393555, "global_step": 22269, "epoch": 268} {"train_loss": -18.427928924560547, "global_step": 22270, "epoch": 268} {"train_loss": -18.643835067749023, "global_step": 22271, "epoch": 268} {"train_loss": -18.371931076049805, "global_step": 22272, "epoch": 268} {"train_loss": -18.83670425415039, "global_step": 22273, "epoch": 268} {"train_loss": -18.466535568237305, "global_step": 22274, "epoch": 268} {"train_loss": -18.506446838378906, "global_step": 22275, "epoch": 268} {"train_loss": -18.356489181518555, "global_step": 22276, "epoch": 268} {"train_loss": -18.752872467041016, "global_step": 22277, "epoch": 268} {"train_loss": -18.369220733642578, "global_step": 22278, "epoch": 268} {"train_loss": -18.822799682617188, "global_step": 22279, "epoch": 268} {"train_loss": -18.329694747924805, "global_step": 22280, "epoch": 268} {"train_loss": -18.369930267333984, "global_step": 22281, "epoch": 268} {"train_loss": -18.6278018951416, "global_step": 22282, "epoch": 268} {"train_loss": -18.705760955810547, "global_step": 22283, "epoch": 268} {"train_loss": -18.602397918701172, "global_step": 22284, "epoch": 268} {"train_loss": -18.401870727539062, "global_step": 22285, "epoch": 268} {"train_loss": -18.303064346313477, "global_step": 22286, "epoch": 268} {"train_loss": -18.3756103515625, "global_step": 22287, "epoch": 268} {"train_loss": -18.411907196044922, "global_step": 22288, "epoch": 268} {"train_loss": -18.446760177612305, "global_step": 22289, "epoch": 268} {"train_loss": -18.6212158203125, "global_step": 22290, "epoch": 268} {"train_loss": -18.295469284057617, "global_step": 22291, "epoch": 268} {"train_loss": -18.23419189453125, "global_step": 22292, "epoch": 268} {"train_loss": -18.452123641967773, "global_step": 22293, "epoch": 268} {"train_loss": -18.509489059448242, "global_step": 22294, "epoch": 268} {"train_loss": -18.731401443481445, "global_step": 22295, "epoch": 268} {"train_loss": -18.2590274810791, "global_step": 22296, "epoch": 268} {"train_loss": -18.90920066833496, "global_step": 22297, "epoch": 268} {"train_loss": -18.669519424438477, "global_step": 22298, "epoch": 268} {"train_loss": -18.619226455688477, "global_step": 22299, "epoch": 268} {"train_loss": -18.464576721191406, "global_step": 22300, "epoch": 268} {"train_loss": -18.551414489746094, "global_step": 22301, "epoch": 268} {"train_loss": -18.68210220336914, "global_step": 22302, "epoch": 268} {"train_loss": -18.55043601989746, "global_step": 22303, "epoch": 268} {"train_loss": -18.321556091308594, "global_step": 22304, "epoch": 268} {"train_loss": -18.843271255493164, "global_step": 22305, "epoch": 268} {"train_loss": -18.10555076599121, "global_step": 22306, "epoch": 268} {"train_loss": -18.649667739868164, "global_step": 22307, "epoch": 268} {"train_loss": -18.64076042175293, "global_step": 22308, "epoch": 268} {"train_loss": -18.452899932861328, "global_step": 22309, "epoch": 268} {"train_loss": -18.33113670349121, "global_step": 22310, "epoch": 268} {"train_loss": -18.51275634765625, "global_step": 22311, "epoch": 268} {"train_loss": -18.607587814331055, "global_step": 22312, "epoch": 268} {"train_loss": -18.68995475769043, "global_step": 22313, "epoch": 268} {"train_loss": -18.305622100830078, "global_step": 22314, "epoch": 268} {"train_loss": -18.249595642089844, "global_step": 22315, "epoch": 268} {"train_loss": -18.68228530883789, "global_step": 22316, "epoch": 268} {"train_loss": -18.461360931396484, "global_step": 22317, "epoch": 268} {"train_loss": -18.317419052124023, "global_step": 22318, "epoch": 268} {"train_loss": -18.706045150756836, "global_step": 22319, "epoch": 268} {"train_loss": -18.556140899658203, "global_step": 22320, "epoch": 268} {"train_loss": -18.37514305114746, "global_step": 22321, "epoch": 268} {"train_loss": -18.409353256225586, "global_step": 22322, "epoch": 268} {"train_loss": -18.343189239501953, "global_step": 22323, "epoch": 268} {"train_loss": -18.548038482666016, "global_step": 22324, "epoch": 268} {"train_loss": -18.70382308959961, "global_step": 22325, "epoch": 268} {"train_loss": -18.499983063663343, "global_step": 22326, "epoch": 268, "val_loss": 6000562.5} {"train_loss": -18.218698501586914, "global_step": 22327, "epoch": 269} {"train_loss": -18.164783477783203, "global_step": 22328, "epoch": 269} {"train_loss": -17.82389259338379, "global_step": 22329, "epoch": 269} {"train_loss": -18.282581329345703, "global_step": 22330, "epoch": 269} {"train_loss": -18.86500358581543, "global_step": 22331, "epoch": 269} {"train_loss": -18.411989212036133, "global_step": 22332, "epoch": 269} {"train_loss": -18.3096866607666, "global_step": 22333, "epoch": 269} {"train_loss": -18.158613204956055, "global_step": 22334, "epoch": 269} {"train_loss": -18.34096336364746, "global_step": 22335, "epoch": 269} {"train_loss": -18.316287994384766, "global_step": 22336, "epoch": 269} {"train_loss": -18.37282371520996, "global_step": 22337, "epoch": 269} {"train_loss": -18.454320907592773, "global_step": 22338, "epoch": 269} {"train_loss": -18.17289161682129, "global_step": 22339, "epoch": 269} {"train_loss": -18.476484298706055, "global_step": 22340, "epoch": 269} {"train_loss": -18.31361198425293, "global_step": 22341, "epoch": 269} {"train_loss": -18.387544631958008, "global_step": 22342, "epoch": 269} {"train_loss": -18.036436080932617, "global_step": 22343, "epoch": 269} {"train_loss": -18.2177791595459, "global_step": 22344, "epoch": 269} {"train_loss": -18.335155487060547, "global_step": 22345, "epoch": 269} {"train_loss": -18.575084686279297, "global_step": 22346, "epoch": 269} {"train_loss": -18.33677101135254, "global_step": 22347, "epoch": 269} {"train_loss": -18.95743179321289, "global_step": 22348, "epoch": 269} {"train_loss": -18.63075065612793, "global_step": 22349, "epoch": 269} {"train_loss": -18.494125366210938, "global_step": 22350, "epoch": 269} {"train_loss": -18.488420486450195, "global_step": 22351, "epoch": 269} {"train_loss": -18.653244018554688, "global_step": 22352, "epoch": 269} {"train_loss": -19.01283073425293, "global_step": 22353, "epoch": 269} {"train_loss": -18.660253524780273, "global_step": 22354, "epoch": 269} {"train_loss": -19.015226364135742, "global_step": 22355, "epoch": 269} {"train_loss": -18.950780868530273, "global_step": 22356, "epoch": 269} {"train_loss": -18.3643856048584, "global_step": 22357, "epoch": 269} {"train_loss": -18.424789428710938, "global_step": 22358, "epoch": 269} {"train_loss": -18.332233428955078, "global_step": 22359, "epoch": 269} {"train_loss": -18.47059440612793, "global_step": 22360, "epoch": 269} {"train_loss": -18.588603973388672, "global_step": 22361, "epoch": 269} {"train_loss": -18.545866012573242, "global_step": 22362, "epoch": 269} {"train_loss": -18.803653717041016, "global_step": 22363, "epoch": 269} {"train_loss": -18.719343185424805, "global_step": 22364, "epoch": 269} {"train_loss": -18.383586883544922, "global_step": 22365, "epoch": 269} {"train_loss": -18.41154670715332, "global_step": 22366, "epoch": 269} {"train_loss": -18.348072052001953, "global_step": 22367, "epoch": 269} {"train_loss": -18.286884307861328, "global_step": 22368, "epoch": 269} {"train_loss": -18.61748695373535, "global_step": 22369, "epoch": 269} {"train_loss": -18.664386749267578, "global_step": 22370, "epoch": 269} {"train_loss": -18.74017906188965, "global_step": 22371, "epoch": 269} {"train_loss": -18.358469009399414, "global_step": 22372, "epoch": 269} {"train_loss": -18.651371002197266, "global_step": 22373, "epoch": 269} {"train_loss": -18.386877059936523, "global_step": 22374, "epoch": 269} {"train_loss": -18.689945220947266, "global_step": 22375, "epoch": 269} {"train_loss": -18.539520263671875, "global_step": 22376, "epoch": 269} {"train_loss": -18.666555404663086, "global_step": 22377, "epoch": 269} {"train_loss": -18.3785457611084, "global_step": 22378, "epoch": 269} {"train_loss": -18.446914672851562, "global_step": 22379, "epoch": 269} {"train_loss": -18.50179100036621, "global_step": 22380, "epoch": 269} {"train_loss": -18.127309799194336, "global_step": 22381, "epoch": 269} {"train_loss": -18.76094627380371, "global_step": 22382, "epoch": 269} {"train_loss": -18.38457489013672, "global_step": 22383, "epoch": 269} {"train_loss": -18.650495529174805, "global_step": 22384, "epoch": 269} {"train_loss": -18.593963623046875, "global_step": 22385, "epoch": 269} {"train_loss": -18.646381378173828, "global_step": 22386, "epoch": 269} {"train_loss": -18.134923934936523, "global_step": 22387, "epoch": 269} {"train_loss": -18.543569564819336, "global_step": 22388, "epoch": 269} {"train_loss": -18.848447799682617, "global_step": 22389, "epoch": 269} {"train_loss": -18.5373477935791, "global_step": 22390, "epoch": 269} {"train_loss": -18.605634689331055, "global_step": 22391, "epoch": 269} {"train_loss": -18.26801109313965, "global_step": 22392, "epoch": 269} {"train_loss": -18.587453842163086, "global_step": 22393, "epoch": 269} {"train_loss": -18.56049919128418, "global_step": 22394, "epoch": 269} {"train_loss": -18.376920700073242, "global_step": 22395, "epoch": 269} {"train_loss": -18.625263214111328, "global_step": 22396, "epoch": 269} {"train_loss": -18.427967071533203, "global_step": 22397, "epoch": 269} {"train_loss": -18.777257919311523, "global_step": 22398, "epoch": 269} {"train_loss": -18.772998809814453, "global_step": 22399, "epoch": 269} {"train_loss": -18.650327682495117, "global_step": 22400, "epoch": 269} {"train_loss": -18.14595603942871, "global_step": 22401, "epoch": 269} {"train_loss": -18.48676109313965, "global_step": 22402, "epoch": 269} {"train_loss": -18.384445190429688, "global_step": 22403, "epoch": 269} {"train_loss": -18.498271942138672, "global_step": 22404, "epoch": 269} {"train_loss": -18.617006301879883, "global_step": 22405, "epoch": 269} {"train_loss": -18.383319854736328, "global_step": 22406, "epoch": 269} {"train_loss": -18.621309280395508, "global_step": 22407, "epoch": 269} {"train_loss": -18.15754508972168, "global_step": 22408, "epoch": 269} {"train_loss": -18.49299276880471, "global_step": 22409, "epoch": 269, "val_loss": 6052284.0} {"train_loss": -17.80586814880371, "global_step": 22410, "epoch": 270} {"train_loss": -18.147180557250977, "global_step": 22411, "epoch": 270} {"train_loss": -18.07358741760254, "global_step": 22412, "epoch": 270} {"train_loss": -17.868772506713867, "global_step": 22413, "epoch": 270} {"train_loss": -18.271224975585938, "global_step": 22414, "epoch": 270} {"train_loss": -18.302099227905273, "global_step": 22415, "epoch": 270} {"train_loss": -18.119159698486328, "global_step": 22416, "epoch": 270} {"train_loss": -18.71457862854004, "global_step": 22417, "epoch": 270} {"train_loss": -18.203649520874023, "global_step": 22418, "epoch": 270} {"train_loss": -18.456707000732422, "global_step": 22419, "epoch": 270} {"train_loss": -18.239953994750977, "global_step": 22420, "epoch": 270} {"train_loss": -18.42343521118164, "global_step": 22421, "epoch": 270} {"train_loss": -18.049850463867188, "global_step": 22422, "epoch": 270} {"train_loss": -18.5240421295166, "global_step": 22423, "epoch": 270} {"train_loss": -18.599618911743164, "global_step": 22424, "epoch": 270} {"train_loss": -18.62049674987793, "global_step": 22425, "epoch": 270} {"train_loss": -18.479198455810547, "global_step": 22426, "epoch": 270} {"train_loss": -18.303442001342773, "global_step": 22427, "epoch": 270} {"train_loss": -18.729387283325195, "global_step": 22428, "epoch": 270} {"train_loss": -18.713666915893555, "global_step": 22429, "epoch": 270} {"train_loss": -18.7049503326416, "global_step": 22430, "epoch": 270} {"train_loss": -18.713871002197266, "global_step": 22431, "epoch": 270} {"train_loss": -18.688100814819336, "global_step": 22432, "epoch": 270} {"train_loss": -18.342529296875, "global_step": 22433, "epoch": 270} {"train_loss": -18.759796142578125, "global_step": 22434, "epoch": 270} {"train_loss": -18.1323299407959, "global_step": 22435, "epoch": 270} {"train_loss": -18.937408447265625, "global_step": 22436, "epoch": 270} {"train_loss": -18.829957962036133, "global_step": 22437, "epoch": 270} {"train_loss": -18.677701950073242, "global_step": 22438, "epoch": 270} {"train_loss": -18.534656524658203, "global_step": 22439, "epoch": 270} {"train_loss": -18.428373336791992, "global_step": 22440, "epoch": 270} {"train_loss": -18.214757919311523, "global_step": 22441, "epoch": 270} {"train_loss": -18.21162223815918, "global_step": 22442, "epoch": 270} {"train_loss": -18.838232040405273, "global_step": 22443, "epoch": 270} {"train_loss": -18.352676391601562, "global_step": 22444, "epoch": 270} {"train_loss": -18.8038330078125, "global_step": 22445, "epoch": 270} {"train_loss": -18.62912940979004, "global_step": 22446, "epoch": 270} {"train_loss": -18.333471298217773, "global_step": 22447, "epoch": 270} {"train_loss": -18.671010971069336, "global_step": 22448, "epoch": 270} {"train_loss": -18.317054748535156, "global_step": 22449, "epoch": 270} {"train_loss": -18.59916114807129, "global_step": 22450, "epoch": 270} {"train_loss": -18.679410934448242, "global_step": 22451, "epoch": 270} {"train_loss": -18.74001121520996, "global_step": 22452, "epoch": 270} {"train_loss": -18.422033309936523, "global_step": 22453, "epoch": 270} {"train_loss": -18.450881958007812, "global_step": 22454, "epoch": 270} {"train_loss": -18.484241485595703, "global_step": 22455, "epoch": 270} {"train_loss": -18.825206756591797, "global_step": 22456, "epoch": 270} {"train_loss": -18.531309127807617, "global_step": 22457, "epoch": 270} {"train_loss": -18.337621688842773, "global_step": 22458, "epoch": 270} {"train_loss": -18.525007247924805, "global_step": 22459, "epoch": 270} {"train_loss": -18.630779266357422, "global_step": 22460, "epoch": 270} {"train_loss": -18.65890884399414, "global_step": 22461, "epoch": 270} {"train_loss": -18.74355125427246, "global_step": 22462, "epoch": 270} {"train_loss": -18.80449867248535, "global_step": 22463, "epoch": 270} {"train_loss": -18.47742462158203, "global_step": 22464, "epoch": 270} {"train_loss": -18.495389938354492, "global_step": 22465, "epoch": 270} {"train_loss": -18.557363510131836, "global_step": 22466, "epoch": 270} {"train_loss": -18.6965274810791, "global_step": 22467, "epoch": 270} {"train_loss": -18.857755661010742, "global_step": 22468, "epoch": 270} {"train_loss": -18.310943603515625, "global_step": 22469, "epoch": 270} {"train_loss": -18.378345489501953, "global_step": 22470, "epoch": 270} {"train_loss": -18.348093032836914, "global_step": 22471, "epoch": 270} {"train_loss": -18.378198623657227, "global_step": 22472, "epoch": 270} {"train_loss": -18.573930740356445, "global_step": 22473, "epoch": 270} {"train_loss": -18.698301315307617, "global_step": 22474, "epoch": 270} {"train_loss": -18.504621505737305, "global_step": 22475, "epoch": 270} {"train_loss": -18.351776123046875, "global_step": 22476, "epoch": 270} {"train_loss": -18.681385040283203, "global_step": 22477, "epoch": 270} {"train_loss": -18.597463607788086, "global_step": 22478, "epoch": 270} {"train_loss": -18.427675247192383, "global_step": 22479, "epoch": 270} {"train_loss": -18.640377044677734, "global_step": 22480, "epoch": 270} {"train_loss": -18.538864135742188, "global_step": 22481, "epoch": 270} {"train_loss": -18.73737907409668, "global_step": 22482, "epoch": 270} {"train_loss": -18.50160789489746, "global_step": 22483, "epoch": 270} {"train_loss": -18.638046264648438, "global_step": 22484, "epoch": 270} {"train_loss": -18.604772567749023, "global_step": 22485, "epoch": 270} {"train_loss": -18.761335372924805, "global_step": 22486, "epoch": 270} {"train_loss": -18.22728157043457, "global_step": 22487, "epoch": 270} {"train_loss": -18.370752334594727, "global_step": 22488, "epoch": 270} {"train_loss": -18.409467697143555, "global_step": 22489, "epoch": 270} {"train_loss": -18.110971450805664, "global_step": 22490, "epoch": 270} {"train_loss": -18.125669479370117, "global_step": 22491, "epoch": 270} {"train_loss": -18.486097289855223, "global_step": 22492, "epoch": 270, "val_loss": 5928242.0} {"train_loss": -18.42535400390625, "global_step": 22493, "epoch": 271} {"train_loss": -18.339889526367188, "global_step": 22494, "epoch": 271} {"train_loss": -17.950410842895508, "global_step": 22495, "epoch": 271} {"train_loss": -18.401945114135742, "global_step": 22496, "epoch": 271} {"train_loss": -18.07522201538086, "global_step": 22497, "epoch": 271} {"train_loss": -18.43734359741211, "global_step": 22498, "epoch": 271} {"train_loss": -18.07083511352539, "global_step": 22499, "epoch": 271} {"train_loss": -18.515213012695312, "global_step": 22500, "epoch": 271} {"train_loss": -18.297300338745117, "global_step": 22501, "epoch": 271} {"train_loss": -18.496816635131836, "global_step": 22502, "epoch": 271} {"train_loss": -18.030912399291992, "global_step": 22503, "epoch": 271} {"train_loss": -18.632713317871094, "global_step": 22504, "epoch": 271} {"train_loss": -18.41792106628418, "global_step": 22505, "epoch": 271} {"train_loss": -18.32390594482422, "global_step": 22506, "epoch": 271} {"train_loss": -18.377103805541992, "global_step": 22507, "epoch": 271} {"train_loss": -18.340295791625977, "global_step": 22508, "epoch": 271} {"train_loss": -18.13374900817871, "global_step": 22509, "epoch": 271} {"train_loss": -18.470849990844727, "global_step": 22510, "epoch": 271} {"train_loss": -18.617238998413086, "global_step": 22511, "epoch": 271} {"train_loss": -18.604127883911133, "global_step": 22512, "epoch": 271} {"train_loss": -18.248327255249023, "global_step": 22513, "epoch": 271} {"train_loss": -18.543787002563477, "global_step": 22514, "epoch": 271} {"train_loss": -18.351560592651367, "global_step": 22515, "epoch": 271} {"train_loss": -18.310306549072266, "global_step": 22516, "epoch": 271} {"train_loss": -18.28395652770996, "global_step": 22517, "epoch": 271} {"train_loss": -18.45172691345215, "global_step": 22518, "epoch": 271} {"train_loss": -18.422832489013672, "global_step": 22519, "epoch": 271} {"train_loss": -18.30437660217285, "global_step": 22520, "epoch": 271} {"train_loss": -18.795822143554688, "global_step": 22521, "epoch": 271} {"train_loss": -18.397994995117188, "global_step": 22522, "epoch": 271} {"train_loss": -18.39874267578125, "global_step": 22523, "epoch": 271} {"train_loss": -18.58319664001465, "global_step": 22524, "epoch": 271} {"train_loss": -18.323095321655273, "global_step": 22525, "epoch": 271} {"train_loss": -18.429262161254883, "global_step": 22526, "epoch": 271} {"train_loss": -18.32404136657715, "global_step": 22527, "epoch": 271} {"train_loss": -18.971532821655273, "global_step": 22528, "epoch": 271} {"train_loss": -18.60848617553711, "global_step": 22529, "epoch": 271} {"train_loss": -18.818132400512695, "global_step": 22530, "epoch": 271} {"train_loss": -18.533069610595703, "global_step": 22531, "epoch": 271} {"train_loss": -18.86651039123535, "global_step": 22532, "epoch": 271} {"train_loss": -18.35553741455078, "global_step": 22533, "epoch": 271} {"train_loss": -18.14448356628418, "global_step": 22534, "epoch": 271} {"train_loss": -18.51922607421875, "global_step": 22535, "epoch": 271} {"train_loss": -18.73929214477539, "global_step": 22536, "epoch": 271} {"train_loss": -18.551652908325195, "global_step": 22537, "epoch": 271} {"train_loss": -18.569448471069336, "global_step": 22538, "epoch": 271} {"train_loss": -18.700956344604492, "global_step": 22539, "epoch": 271} {"train_loss": -18.816204071044922, "global_step": 22540, "epoch": 271} {"train_loss": -18.650543212890625, "global_step": 22541, "epoch": 271} {"train_loss": -18.735187530517578, "global_step": 22542, "epoch": 271} {"train_loss": -18.507143020629883, "global_step": 22543, "epoch": 271} {"train_loss": -18.525182723999023, "global_step": 22544, "epoch": 271} {"train_loss": -18.99435806274414, "global_step": 22545, "epoch": 271} {"train_loss": -18.498584747314453, "global_step": 22546, "epoch": 271} {"train_loss": -18.485675811767578, "global_step": 22547, "epoch": 271} {"train_loss": -18.334184646606445, "global_step": 22548, "epoch": 271} {"train_loss": -18.19887351989746, "global_step": 22549, "epoch": 271} {"train_loss": -18.26283073425293, "global_step": 22550, "epoch": 271} {"train_loss": -18.854745864868164, "global_step": 22551, "epoch": 271} {"train_loss": -18.61347007751465, "global_step": 22552, "epoch": 271} {"train_loss": -18.30462074279785, "global_step": 22553, "epoch": 271} {"train_loss": -18.612150192260742, "global_step": 22554, "epoch": 271} {"train_loss": -18.152090072631836, "global_step": 22555, "epoch": 271} {"train_loss": -18.796295166015625, "global_step": 22556, "epoch": 271} {"train_loss": -18.352760314941406, "global_step": 22557, "epoch": 271} {"train_loss": -18.674503326416016, "global_step": 22558, "epoch": 271} {"train_loss": -18.71517562866211, "global_step": 22559, "epoch": 271} {"train_loss": -18.513071060180664, "global_step": 22560, "epoch": 271} {"train_loss": -18.683664321899414, "global_step": 22561, "epoch": 271} {"train_loss": -18.709104537963867, "global_step": 22562, "epoch": 271} {"train_loss": -18.45454978942871, "global_step": 22563, "epoch": 271} {"train_loss": -18.588687896728516, "global_step": 22564, "epoch": 271} {"train_loss": -18.61250114440918, "global_step": 22565, "epoch": 271} {"train_loss": -18.39472007751465, "global_step": 22566, "epoch": 271} {"train_loss": -18.65292739868164, "global_step": 22567, "epoch": 271} {"train_loss": -18.65026092529297, "global_step": 22568, "epoch": 271} {"train_loss": -18.6837100982666, "global_step": 22569, "epoch": 271} {"train_loss": -18.350143432617188, "global_step": 22570, "epoch": 271} {"train_loss": -18.61646842956543, "global_step": 22571, "epoch": 271} {"train_loss": -18.829044342041016, "global_step": 22572, "epoch": 271} {"train_loss": -18.549962997436523, "global_step": 22573, "epoch": 271} {"train_loss": -18.195669174194336, "global_step": 22574, "epoch": 271} {"train_loss": -18.48819080031062, "global_step": 22575, "epoch": 271, "val_loss": 5933759.0} {"train_loss": -18.008508682250977, "global_step": 22576, "epoch": 272} {"train_loss": -18.40932273864746, "global_step": 22577, "epoch": 272} {"train_loss": -18.290990829467773, "global_step": 22578, "epoch": 272} {"train_loss": -18.408517837524414, "global_step": 22579, "epoch": 272} {"train_loss": -18.228229522705078, "global_step": 22580, "epoch": 272} {"train_loss": -18.627573013305664, "global_step": 22581, "epoch": 272} {"train_loss": -18.54950714111328, "global_step": 22582, "epoch": 272} {"train_loss": -18.257492065429688, "global_step": 22583, "epoch": 272} {"train_loss": -18.70310401916504, "global_step": 22584, "epoch": 272} {"train_loss": -18.616453170776367, "global_step": 22585, "epoch": 272} {"train_loss": -18.06703758239746, "global_step": 22586, "epoch": 272} {"train_loss": -18.2081356048584, "global_step": 22587, "epoch": 272} {"train_loss": -17.959144592285156, "global_step": 22588, "epoch": 272} {"train_loss": -18.80677604675293, "global_step": 22589, "epoch": 272} {"train_loss": -18.513385772705078, "global_step": 22590, "epoch": 272} {"train_loss": -18.530054092407227, "global_step": 22591, "epoch": 272} {"train_loss": -18.623720169067383, "global_step": 22592, "epoch": 272} {"train_loss": -18.55843162536621, "global_step": 22593, "epoch": 272} {"train_loss": -18.594894409179688, "global_step": 22594, "epoch": 272} {"train_loss": -18.655202865600586, "global_step": 22595, "epoch": 272} {"train_loss": -18.490398406982422, "global_step": 22596, "epoch": 272} {"train_loss": -18.50091552734375, "global_step": 22597, "epoch": 272} {"train_loss": -18.587736129760742, "global_step": 22598, "epoch": 272} {"train_loss": -18.351261138916016, "global_step": 22599, "epoch": 272} {"train_loss": -18.75965690612793, "global_step": 22600, "epoch": 272} {"train_loss": -18.266983032226562, "global_step": 22601, "epoch": 272} {"train_loss": -18.915420532226562, "global_step": 22602, "epoch": 272} {"train_loss": -18.17177963256836, "global_step": 22603, "epoch": 272} {"train_loss": -18.54365348815918, "global_step": 22604, "epoch": 272} {"train_loss": -18.239709854125977, "global_step": 22605, "epoch": 272} {"train_loss": -18.36649513244629, "global_step": 22606, "epoch": 272} {"train_loss": -18.103954315185547, "global_step": 22607, "epoch": 272} {"train_loss": -18.546436309814453, "global_step": 22608, "epoch": 272} {"train_loss": -18.28012466430664, "global_step": 22609, "epoch": 272} {"train_loss": -18.712203979492188, "global_step": 22610, "epoch": 272} {"train_loss": -18.40384292602539, "global_step": 22611, "epoch": 272} {"train_loss": -18.381616592407227, "global_step": 22612, "epoch": 272} {"train_loss": -18.461759567260742, "global_step": 22613, "epoch": 272} {"train_loss": -18.526456832885742, "global_step": 22614, "epoch": 272} {"train_loss": -18.188007354736328, "global_step": 22615, "epoch": 272} {"train_loss": -18.36311149597168, "global_step": 22616, "epoch": 272} {"train_loss": -18.59000015258789, "global_step": 22617, "epoch": 272} {"train_loss": -18.54924774169922, "global_step": 22618, "epoch": 272} {"train_loss": -18.510456085205078, "global_step": 22619, "epoch": 272} {"train_loss": -18.42082405090332, "global_step": 22620, "epoch": 272} {"train_loss": -18.05060386657715, "global_step": 22621, "epoch": 272} {"train_loss": -18.64573097229004, "global_step": 22622, "epoch": 272} {"train_loss": -18.217544555664062, "global_step": 22623, "epoch": 272} {"train_loss": -18.466785430908203, "global_step": 22624, "epoch": 272} {"train_loss": -17.99305534362793, "global_step": 22625, "epoch": 272} {"train_loss": -18.4459228515625, "global_step": 22626, "epoch": 272} {"train_loss": -18.241825103759766, "global_step": 22627, "epoch": 272} {"train_loss": -18.30164337158203, "global_step": 22628, "epoch": 272} {"train_loss": -18.697397232055664, "global_step": 22629, "epoch": 272} {"train_loss": -18.499792098999023, "global_step": 22630, "epoch": 272} {"train_loss": -18.36978530883789, "global_step": 22631, "epoch": 272} {"train_loss": -18.594953536987305, "global_step": 22632, "epoch": 272} {"train_loss": -18.540489196777344, "global_step": 22633, "epoch": 272} {"train_loss": -18.479629516601562, "global_step": 22634, "epoch": 272} {"train_loss": -18.253528594970703, "global_step": 22635, "epoch": 272} {"train_loss": -18.43406105041504, "global_step": 22636, "epoch": 272} {"train_loss": -18.278783798217773, "global_step": 22637, "epoch": 272} {"train_loss": -18.584579467773438, "global_step": 22638, "epoch": 272} {"train_loss": -18.500207901000977, "global_step": 22639, "epoch": 272} {"train_loss": -18.47403335571289, "global_step": 22640, "epoch": 272} {"train_loss": -18.319107055664062, "global_step": 22641, "epoch": 272} {"train_loss": -18.14496612548828, "global_step": 22642, "epoch": 272} {"train_loss": -18.874616622924805, "global_step": 22643, "epoch": 272} {"train_loss": -18.453821182250977, "global_step": 22644, "epoch": 272} {"train_loss": -18.70514488220215, "global_step": 22645, "epoch": 272} {"train_loss": -18.346906661987305, "global_step": 22646, "epoch": 272} {"train_loss": -18.557096481323242, "global_step": 22647, "epoch": 272} {"train_loss": -19.016416549682617, "global_step": 22648, "epoch": 272} {"train_loss": -18.683948516845703, "global_step": 22649, "epoch": 272} {"train_loss": -18.31211280822754, "global_step": 22650, "epoch": 272} {"train_loss": -18.392980575561523, "global_step": 22651, "epoch": 272} {"train_loss": -18.274763107299805, "global_step": 22652, "epoch": 272} {"train_loss": -18.731342315673828, "global_step": 22653, "epoch": 272} {"train_loss": -18.661060333251953, "global_step": 22654, "epoch": 272} {"train_loss": -19.28373908996582, "global_step": 22655, "epoch": 272} {"train_loss": -18.537593841552734, "global_step": 22656, "epoch": 272} {"train_loss": -18.77498435974121, "global_step": 22657, "epoch": 272} {"train_loss": -18.44490669434329, "global_step": 22658, "epoch": 272, "val_loss": 5812182.0} {"train_loss": -18.422128677368164, "global_step": 22659, "epoch": 273} {"train_loss": -18.173931121826172, "global_step": 22660, "epoch": 273} {"train_loss": -18.308908462524414, "global_step": 22661, "epoch": 273} {"train_loss": -18.204397201538086, "global_step": 22662, "epoch": 273} {"train_loss": -18.282724380493164, "global_step": 22663, "epoch": 273} {"train_loss": -18.64544677734375, "global_step": 22664, "epoch": 273} {"train_loss": -18.23040199279785, "global_step": 22665, "epoch": 273} {"train_loss": -18.33238410949707, "global_step": 22666, "epoch": 273} {"train_loss": -18.367345809936523, "global_step": 22667, "epoch": 273} {"train_loss": -18.40470314025879, "global_step": 22668, "epoch": 273} {"train_loss": -18.622671127319336, "global_step": 22669, "epoch": 273} {"train_loss": -18.290197372436523, "global_step": 22670, "epoch": 273} {"train_loss": -18.798795700073242, "global_step": 22671, "epoch": 273} {"train_loss": -18.37799072265625, "global_step": 22672, "epoch": 273} {"train_loss": -18.828428268432617, "global_step": 22673, "epoch": 273} {"train_loss": -18.532869338989258, "global_step": 22674, "epoch": 273} {"train_loss": -18.780590057373047, "global_step": 22675, "epoch": 273} {"train_loss": -18.899099349975586, "global_step": 22676, "epoch": 273} {"train_loss": -18.706892013549805, "global_step": 22677, "epoch": 273} {"train_loss": -18.437910079956055, "global_step": 22678, "epoch": 273} {"train_loss": -18.672117233276367, "global_step": 22679, "epoch": 273} {"train_loss": -18.24115753173828, "global_step": 22680, "epoch": 273} {"train_loss": -18.378576278686523, "global_step": 22681, "epoch": 273} {"train_loss": -18.518848419189453, "global_step": 22682, "epoch": 273} {"train_loss": -18.532329559326172, "global_step": 22683, "epoch": 273} {"train_loss": -18.606647491455078, "global_step": 22684, "epoch": 273} {"train_loss": -18.924177169799805, "global_step": 22685, "epoch": 273} {"train_loss": -18.556900024414062, "global_step": 22686, "epoch": 273} {"train_loss": -18.576892852783203, "global_step": 22687, "epoch": 273} {"train_loss": -18.362064361572266, "global_step": 22688, "epoch": 273} {"train_loss": -18.45063591003418, "global_step": 22689, "epoch": 273} {"train_loss": -18.755857467651367, "global_step": 22690, "epoch": 273} {"train_loss": -18.471223831176758, "global_step": 22691, "epoch": 273} {"train_loss": -18.58053970336914, "global_step": 22692, "epoch": 273} {"train_loss": -18.558883666992188, "global_step": 22693, "epoch": 273} {"train_loss": -18.673185348510742, "global_step": 22694, "epoch": 273} {"train_loss": -18.456636428833008, "global_step": 22695, "epoch": 273} {"train_loss": -18.195621490478516, "global_step": 22696, "epoch": 273} {"train_loss": -18.34576988220215, "global_step": 22697, "epoch": 273} {"train_loss": -18.42222023010254, "global_step": 22698, "epoch": 273} {"train_loss": -18.96451759338379, "global_step": 22699, "epoch": 273} {"train_loss": -18.484485626220703, "global_step": 22700, "epoch": 273} {"train_loss": -18.241256713867188, "global_step": 22701, "epoch": 273} {"train_loss": -18.62034034729004, "global_step": 22702, "epoch": 273} {"train_loss": -18.303010940551758, "global_step": 22703, "epoch": 273} {"train_loss": -18.613523483276367, "global_step": 22704, "epoch": 273} {"train_loss": -18.285898208618164, "global_step": 22705, "epoch": 273} {"train_loss": -18.298694610595703, "global_step": 22706, "epoch": 273} {"train_loss": -18.946144104003906, "global_step": 22707, "epoch": 273} {"train_loss": -18.716867446899414, "global_step": 22708, "epoch": 273} {"train_loss": -18.649246215820312, "global_step": 22709, "epoch": 273} {"train_loss": -18.46272087097168, "global_step": 22710, "epoch": 273} {"train_loss": -18.903621673583984, "global_step": 22711, "epoch": 273} {"train_loss": -18.415143966674805, "global_step": 22712, "epoch": 273} {"train_loss": -18.30549430847168, "global_step": 22713, "epoch": 273} {"train_loss": -18.619001388549805, "global_step": 22714, "epoch": 273} {"train_loss": -18.741748809814453, "global_step": 22715, "epoch": 273} {"train_loss": -18.43765640258789, "global_step": 22716, "epoch": 273} {"train_loss": -18.7482967376709, "global_step": 22717, "epoch": 273} {"train_loss": -18.603017807006836, "global_step": 22718, "epoch": 273} {"train_loss": -18.818315505981445, "global_step": 22719, "epoch": 273} {"train_loss": -18.51250648498535, "global_step": 22720, "epoch": 273} {"train_loss": -18.806671142578125, "global_step": 22721, "epoch": 273} {"train_loss": -18.72281265258789, "global_step": 22722, "epoch": 273} {"train_loss": -18.000341415405273, "global_step": 22723, "epoch": 273} {"train_loss": -19.071495056152344, "global_step": 22724, "epoch": 273} {"train_loss": -19.04568862915039, "global_step": 22725, "epoch": 273} {"train_loss": -18.349363327026367, "global_step": 22726, "epoch": 273} {"train_loss": -18.22039222717285, "global_step": 22727, "epoch": 273} {"train_loss": -18.433393478393555, "global_step": 22728, "epoch": 273} {"train_loss": -18.541706085205078, "global_step": 22729, "epoch": 273} {"train_loss": -17.985172271728516, "global_step": 22730, "epoch": 273} {"train_loss": -18.580106735229492, "global_step": 22731, "epoch": 273} {"train_loss": -18.660032272338867, "global_step": 22732, "epoch": 273} {"train_loss": -18.76559066772461, "global_step": 22733, "epoch": 273} {"train_loss": -18.46766471862793, "global_step": 22734, "epoch": 273} {"train_loss": -18.56422996520996, "global_step": 22735, "epoch": 273} {"train_loss": -18.702043533325195, "global_step": 22736, "epoch": 273} {"train_loss": -18.331193923950195, "global_step": 22737, "epoch": 273} {"train_loss": -18.130605697631836, "global_step": 22738, "epoch": 273} {"train_loss": -18.579557418823242, "global_step": 22739, "epoch": 273} {"train_loss": -18.325315475463867, "global_step": 22740, "epoch": 273} {"train_loss": -18.545456093477917, "global_step": 22741, "epoch": 273, "val_loss": 6049755.0} {"train_loss": -18.147947311401367, "global_step": 22742, "epoch": 274} {"train_loss": -18.027433395385742, "global_step": 22743, "epoch": 274} {"train_loss": -18.227798461914062, "global_step": 22744, "epoch": 274} {"train_loss": -18.608001708984375, "global_step": 22745, "epoch": 274} {"train_loss": -18.054128646850586, "global_step": 22746, "epoch": 274} {"train_loss": -18.053796768188477, "global_step": 22747, "epoch": 274} {"train_loss": -18.19303321838379, "global_step": 22748, "epoch": 274} {"train_loss": -18.630374908447266, "global_step": 22749, "epoch": 274} {"train_loss": -18.353897094726562, "global_step": 22750, "epoch": 274} {"train_loss": -18.34341812133789, "global_step": 22751, "epoch": 274} {"train_loss": -18.32398796081543, "global_step": 22752, "epoch": 274} {"train_loss": -18.52971839904785, "global_step": 22753, "epoch": 274} {"train_loss": -18.1003475189209, "global_step": 22754, "epoch": 274} {"train_loss": -18.33523941040039, "global_step": 22755, "epoch": 274} {"train_loss": -18.411651611328125, "global_step": 22756, "epoch": 274} {"train_loss": -18.401071548461914, "global_step": 22757, "epoch": 274} {"train_loss": -18.627811431884766, "global_step": 22758, "epoch": 274} {"train_loss": -18.383466720581055, "global_step": 22759, "epoch": 274} {"train_loss": -18.09720802307129, "global_step": 22760, "epoch": 274} {"train_loss": -18.43536949157715, "global_step": 22761, "epoch": 274} {"train_loss": -18.224634170532227, "global_step": 22762, "epoch": 274} {"train_loss": -18.315658569335938, "global_step": 22763, "epoch": 274} {"train_loss": -18.75642967224121, "global_step": 22764, "epoch": 274} {"train_loss": -18.76679039001465, "global_step": 22765, "epoch": 274} {"train_loss": -18.533361434936523, "global_step": 22766, "epoch": 274} {"train_loss": -19.070444107055664, "global_step": 22767, "epoch": 274} {"train_loss": -18.27545928955078, "global_step": 22768, "epoch": 274} {"train_loss": -18.70384407043457, "global_step": 22769, "epoch": 274} {"train_loss": -18.6008243560791, "global_step": 22770, "epoch": 274} {"train_loss": -18.75417137145996, "global_step": 22771, "epoch": 274} {"train_loss": -18.621463775634766, "global_step": 22772, "epoch": 274} {"train_loss": -18.66019058227539, "global_step": 22773, "epoch": 274} {"train_loss": -18.9271183013916, "global_step": 22774, "epoch": 274} {"train_loss": -18.878469467163086, "global_step": 22775, "epoch": 274} {"train_loss": -19.154315948486328, "global_step": 22776, "epoch": 274} {"train_loss": -18.385305404663086, "global_step": 22777, "epoch": 274} {"train_loss": -18.313507080078125, "global_step": 22778, "epoch": 274} {"train_loss": -18.31648826599121, "global_step": 22779, "epoch": 274} {"train_loss": -18.76751136779785, "global_step": 22780, "epoch": 274} {"train_loss": -18.862445831298828, "global_step": 22781, "epoch": 274} {"train_loss": -18.16644859313965, "global_step": 22782, "epoch": 274} {"train_loss": -18.676944732666016, "global_step": 22783, "epoch": 274} {"train_loss": -18.703540802001953, "global_step": 22784, "epoch": 274} {"train_loss": -18.47536849975586, "global_step": 22785, "epoch": 274} {"train_loss": -18.39748191833496, "global_step": 22786, "epoch": 274} {"train_loss": -18.69220542907715, "global_step": 22787, "epoch": 274} {"train_loss": -18.64520263671875, "global_step": 22788, "epoch": 274} {"train_loss": -18.532289505004883, "global_step": 22789, "epoch": 274} {"train_loss": -18.465757369995117, "global_step": 22790, "epoch": 274} {"train_loss": -18.62255859375, "global_step": 22791, "epoch": 274} {"train_loss": -18.43086051940918, "global_step": 22792, "epoch": 274} {"train_loss": -18.50632667541504, "global_step": 22793, "epoch": 274} {"train_loss": -18.587881088256836, "global_step": 22794, "epoch": 274} {"train_loss": -18.419416427612305, "global_step": 22795, "epoch": 274} {"train_loss": -18.713180541992188, "global_step": 22796, "epoch": 274} {"train_loss": -18.413864135742188, "global_step": 22797, "epoch": 274} {"train_loss": -18.708087921142578, "global_step": 22798, "epoch": 274} {"train_loss": -18.672208786010742, "global_step": 22799, "epoch": 274} {"train_loss": -18.692129135131836, "global_step": 22800, "epoch": 274} {"train_loss": -18.492477416992188, "global_step": 22801, "epoch": 274} {"train_loss": -18.567201614379883, "global_step": 22802, "epoch": 274} {"train_loss": -18.481027603149414, "global_step": 22803, "epoch": 274} {"train_loss": -18.763639450073242, "global_step": 22804, "epoch": 274} {"train_loss": -18.682172775268555, "global_step": 22805, "epoch": 274} {"train_loss": -18.750415802001953, "global_step": 22806, "epoch": 274} {"train_loss": -19.00071907043457, "global_step": 22807, "epoch": 274} {"train_loss": -18.545698165893555, "global_step": 22808, "epoch": 274} {"train_loss": -18.604833602905273, "global_step": 22809, "epoch": 274} {"train_loss": -18.681293487548828, "global_step": 22810, "epoch": 274} {"train_loss": -18.541793823242188, "global_step": 22811, "epoch": 274} {"train_loss": -18.66139030456543, "global_step": 22812, "epoch": 274} {"train_loss": -18.48616600036621, "global_step": 22813, "epoch": 274} {"train_loss": -18.67072105407715, "global_step": 22814, "epoch": 274} {"train_loss": -18.508224487304688, "global_step": 22815, "epoch": 274} {"train_loss": -18.84432029724121, "global_step": 22816, "epoch": 274} {"train_loss": -18.40047264099121, "global_step": 22817, "epoch": 274} {"train_loss": -18.53901481628418, "global_step": 22818, "epoch": 274} {"train_loss": -18.29058074951172, "global_step": 22819, "epoch": 274} {"train_loss": -18.675230026245117, "global_step": 22820, "epoch": 274} {"train_loss": -18.661033630371094, "global_step": 22821, "epoch": 274} {"train_loss": -18.465078353881836, "global_step": 22822, "epoch": 274} {"train_loss": -18.633331298828125, "global_step": 22823, "epoch": 274} {"train_loss": -18.543358584484423, "global_step": 22824, "epoch": 274, "val_loss": 6034058.0} {"train_loss": -18.13552474975586, "global_step": 22825, "epoch": 275} {"train_loss": -18.367752075195312, "global_step": 22826, "epoch": 275} {"train_loss": -18.561176300048828, "global_step": 22827, "epoch": 275} {"train_loss": -18.57801628112793, "global_step": 22828, "epoch": 275} {"train_loss": -18.382108688354492, "global_step": 22829, "epoch": 275} {"train_loss": -18.522342681884766, "global_step": 22830, "epoch": 275} {"train_loss": -18.649057388305664, "global_step": 22831, "epoch": 275} {"train_loss": -18.879972457885742, "global_step": 22832, "epoch": 275} {"train_loss": -18.59779930114746, "global_step": 22833, "epoch": 275} {"train_loss": -18.618066787719727, "global_step": 22834, "epoch": 275} {"train_loss": -18.316879272460938, "global_step": 22835, "epoch": 275} {"train_loss": -18.66005516052246, "global_step": 22836, "epoch": 275} {"train_loss": -18.53696060180664, "global_step": 22837, "epoch": 275} {"train_loss": -18.331985473632812, "global_step": 22838, "epoch": 275} {"train_loss": -18.046955108642578, "global_step": 22839, "epoch": 275} {"train_loss": -18.62376594543457, "global_step": 22840, "epoch": 275} {"train_loss": -18.02723503112793, "global_step": 22841, "epoch": 275} {"train_loss": -18.2508544921875, "global_step": 22842, "epoch": 275} {"train_loss": -18.511083602905273, "global_step": 22843, "epoch": 275} {"train_loss": -18.402240753173828, "global_step": 22844, "epoch": 275} {"train_loss": -18.3560733795166, "global_step": 22845, "epoch": 275} {"train_loss": -18.612625122070312, "global_step": 22846, "epoch": 275} {"train_loss": -18.485614776611328, "global_step": 22847, "epoch": 275} {"train_loss": -18.43012046813965, "global_step": 22848, "epoch": 275} {"train_loss": -18.487953186035156, "global_step": 22849, "epoch": 275} {"train_loss": -18.623563766479492, "global_step": 22850, "epoch": 275} {"train_loss": -18.42730712890625, "global_step": 22851, "epoch": 275} {"train_loss": -18.551408767700195, "global_step": 22852, "epoch": 275} {"train_loss": -18.469741821289062, "global_step": 22853, "epoch": 275} {"train_loss": -18.6341609954834, "global_step": 22854, "epoch": 275} {"train_loss": -18.5117244720459, "global_step": 22855, "epoch": 275} {"train_loss": -18.603378295898438, "global_step": 22856, "epoch": 275} {"train_loss": -18.511362075805664, "global_step": 22857, "epoch": 275} {"train_loss": -18.347681045532227, "global_step": 22858, "epoch": 275} {"train_loss": -18.329931259155273, "global_step": 22859, "epoch": 275} {"train_loss": -18.692808151245117, "global_step": 22860, "epoch": 275} {"train_loss": -18.640583038330078, "global_step": 22861, "epoch": 275} {"train_loss": -18.26271629333496, "global_step": 22862, "epoch": 275} {"train_loss": -18.383737564086914, "global_step": 22863, "epoch": 275} {"train_loss": -18.399063110351562, "global_step": 22864, "epoch": 275} {"train_loss": -18.32539939880371, "global_step": 22865, "epoch": 275} {"train_loss": -18.62493896484375, "global_step": 22866, "epoch": 275} {"train_loss": -18.618539810180664, "global_step": 22867, "epoch": 275} {"train_loss": -18.37367820739746, "global_step": 22868, "epoch": 275} {"train_loss": -18.53415870666504, "global_step": 22869, "epoch": 275} {"train_loss": -18.777816772460938, "global_step": 22870, "epoch": 275} {"train_loss": -18.695703506469727, "global_step": 22871, "epoch": 275} {"train_loss": -18.891733169555664, "global_step": 22872, "epoch": 275} {"train_loss": -18.466571807861328, "global_step": 22873, "epoch": 275} {"train_loss": -18.578269958496094, "global_step": 22874, "epoch": 275} {"train_loss": -18.582935333251953, "global_step": 22875, "epoch": 275} {"train_loss": -18.8575496673584, "global_step": 22876, "epoch": 275} {"train_loss": -18.750141143798828, "global_step": 22877, "epoch": 275} {"train_loss": -18.6767578125, "global_step": 22878, "epoch": 275} {"train_loss": -18.926061630249023, "global_step": 22879, "epoch": 275} {"train_loss": -18.574865341186523, "global_step": 22880, "epoch": 275} {"train_loss": -18.59766960144043, "global_step": 22881, "epoch": 275} {"train_loss": -18.356826782226562, "global_step": 22882, "epoch": 275} {"train_loss": -18.916259765625, "global_step": 22883, "epoch": 275} {"train_loss": -18.47068214416504, "global_step": 22884, "epoch": 275} {"train_loss": -18.556344985961914, "global_step": 22885, "epoch": 275} {"train_loss": -18.84404754638672, "global_step": 22886, "epoch": 275} {"train_loss": -18.149124145507812, "global_step": 22887, "epoch": 275} {"train_loss": -18.442968368530273, "global_step": 22888, "epoch": 275} {"train_loss": -18.963449478149414, "global_step": 22889, "epoch": 275} {"train_loss": -18.55560302734375, "global_step": 22890, "epoch": 275} {"train_loss": -18.677631378173828, "global_step": 22891, "epoch": 275} {"train_loss": -18.340396881103516, "global_step": 22892, "epoch": 275} {"train_loss": -18.793275833129883, "global_step": 22893, "epoch": 275} {"train_loss": -18.544921875, "global_step": 22894, "epoch": 275} {"train_loss": -18.808624267578125, "global_step": 22895, "epoch": 275} {"train_loss": -18.43328285217285, "global_step": 22896, "epoch": 275} {"train_loss": -18.233442306518555, "global_step": 22897, "epoch": 275} {"train_loss": -18.40850830078125, "global_step": 22898, "epoch": 275} {"train_loss": -18.672868728637695, "global_step": 22899, "epoch": 275} {"train_loss": -18.58595085144043, "global_step": 22900, "epoch": 275} {"train_loss": -18.286314010620117, "global_step": 22901, "epoch": 275} {"train_loss": -18.896533966064453, "global_step": 22902, "epoch": 275} {"train_loss": -18.712482452392578, "global_step": 22903, "epoch": 275} {"train_loss": -18.341093063354492, "global_step": 22904, "epoch": 275} {"train_loss": -18.45407485961914, "global_step": 22905, "epoch": 275} {"train_loss": -18.378978729248047, "global_step": 22906, "epoch": 275} {"train_loss": -18.53029207436435, "global_step": 22907, "epoch": 275, "val_loss": 5925052.0} {"train_loss": -18.333616256713867, "global_step": 22908, "epoch": 276} {"train_loss": -18.41721534729004, "global_step": 22909, "epoch": 276} {"train_loss": -18.541545867919922, "global_step": 22910, "epoch": 276} {"train_loss": -18.390554428100586, "global_step": 22911, "epoch": 276} {"train_loss": -18.51194190979004, "global_step": 22912, "epoch": 276} {"train_loss": -18.55940818786621, "global_step": 22913, "epoch": 276} {"train_loss": -17.822595596313477, "global_step": 22914, "epoch": 276} {"train_loss": -18.54608154296875, "global_step": 22915, "epoch": 276} {"train_loss": -18.298736572265625, "global_step": 22916, "epoch": 276} {"train_loss": -18.57638931274414, "global_step": 22917, "epoch": 276} {"train_loss": -18.553775787353516, "global_step": 22918, "epoch": 276} {"train_loss": -18.65595054626465, "global_step": 22919, "epoch": 276} {"train_loss": -18.3348331451416, "global_step": 22920, "epoch": 276} {"train_loss": -18.596830368041992, "global_step": 22921, "epoch": 276} {"train_loss": -18.384130477905273, "global_step": 22922, "epoch": 276} {"train_loss": -18.776914596557617, "global_step": 22923, "epoch": 276} {"train_loss": -18.55252456665039, "global_step": 22924, "epoch": 276} {"train_loss": -18.238210678100586, "global_step": 22925, "epoch": 276} {"train_loss": -18.773622512817383, "global_step": 22926, "epoch": 276} {"train_loss": -18.739364624023438, "global_step": 22927, "epoch": 276} {"train_loss": -18.561193466186523, "global_step": 22928, "epoch": 276} {"train_loss": -18.422008514404297, "global_step": 22929, "epoch": 276} {"train_loss": -18.5928897857666, "global_step": 22930, "epoch": 276} {"train_loss": -18.875141143798828, "global_step": 22931, "epoch": 276} {"train_loss": -18.690610885620117, "global_step": 22932, "epoch": 276} {"train_loss": -19.053386688232422, "global_step": 22933, "epoch": 276} {"train_loss": -18.55002784729004, "global_step": 22934, "epoch": 276} {"train_loss": -18.50685691833496, "global_step": 22935, "epoch": 276} {"train_loss": -18.4898738861084, "global_step": 22936, "epoch": 276} {"train_loss": -18.44034194946289, "global_step": 22937, "epoch": 276} {"train_loss": -18.525558471679688, "global_step": 22938, "epoch": 276} {"train_loss": -18.193876266479492, "global_step": 22939, "epoch": 276} {"train_loss": -18.52303123474121, "global_step": 22940, "epoch": 276} {"train_loss": -18.35227394104004, "global_step": 22941, "epoch": 276} {"train_loss": -18.790746688842773, "global_step": 22942, "epoch": 276} {"train_loss": -18.486907958984375, "global_step": 22943, "epoch": 276} {"train_loss": -18.72432518005371, "global_step": 22944, "epoch": 276} {"train_loss": -18.763595581054688, "global_step": 22945, "epoch": 276} {"train_loss": -18.687061309814453, "global_step": 22946, "epoch": 276} {"train_loss": -18.441347122192383, "global_step": 22947, "epoch": 276} {"train_loss": -19.058103561401367, "global_step": 22948, "epoch": 276} {"train_loss": -18.205732345581055, "global_step": 22949, "epoch": 276} {"train_loss": -18.31366729736328, "global_step": 22950, "epoch": 276} {"train_loss": -18.550281524658203, "global_step": 22951, "epoch": 276} {"train_loss": -18.958528518676758, "global_step": 22952, "epoch": 276} {"train_loss": -18.550565719604492, "global_step": 22953, "epoch": 276} {"train_loss": -18.24610710144043, "global_step": 22954, "epoch": 276} {"train_loss": -18.668447494506836, "global_step": 22955, "epoch": 276} {"train_loss": -18.432275772094727, "global_step": 22956, "epoch": 276} {"train_loss": -18.61865234375, "global_step": 22957, "epoch": 276} {"train_loss": -18.86158561706543, "global_step": 22958, "epoch": 276} {"train_loss": -18.66351890563965, "global_step": 22959, "epoch": 276} {"train_loss": -18.990346908569336, "global_step": 22960, "epoch": 276} {"train_loss": -18.50536346435547, "global_step": 22961, "epoch": 276} {"train_loss": -18.38899803161621, "global_step": 22962, "epoch": 276} {"train_loss": -18.136734008789062, "global_step": 22963, "epoch": 276} {"train_loss": -18.391769409179688, "global_step": 22964, "epoch": 276} {"train_loss": -18.51377296447754, "global_step": 22965, "epoch": 276} {"train_loss": -18.596864700317383, "global_step": 22966, "epoch": 276} {"train_loss": -18.590986251831055, "global_step": 22967, "epoch": 276} {"train_loss": -18.667631149291992, "global_step": 22968, "epoch": 276} {"train_loss": -18.452112197875977, "global_step": 22969, "epoch": 276} {"train_loss": -18.560821533203125, "global_step": 22970, "epoch": 276} {"train_loss": -18.304447174072266, "global_step": 22971, "epoch": 276} {"train_loss": -18.813724517822266, "global_step": 22972, "epoch": 276} {"train_loss": -18.1431884765625, "global_step": 22973, "epoch": 276} {"train_loss": -18.411958694458008, "global_step": 22974, "epoch": 276} {"train_loss": -18.58194351196289, "global_step": 22975, "epoch": 276} {"train_loss": -18.642576217651367, "global_step": 22976, "epoch": 276} {"train_loss": -18.857587814331055, "global_step": 22977, "epoch": 276} {"train_loss": -18.461069107055664, "global_step": 22978, "epoch": 276} {"train_loss": -18.412328720092773, "global_step": 22979, "epoch": 276} {"train_loss": -18.604597091674805, "global_step": 22980, "epoch": 276} {"train_loss": -18.36693572998047, "global_step": 22981, "epoch": 276} {"train_loss": -18.71510124206543, "global_step": 22982, "epoch": 276} {"train_loss": -18.34438705444336, "global_step": 22983, "epoch": 276} {"train_loss": -18.551172256469727, "global_step": 22984, "epoch": 276} {"train_loss": -18.37853240966797, "global_step": 22985, "epoch": 276} {"train_loss": -18.84718132019043, "global_step": 22986, "epoch": 276} {"train_loss": -18.58353042602539, "global_step": 22987, "epoch": 276} {"train_loss": -18.526756286621094, "global_step": 22988, "epoch": 276} {"train_loss": -18.380197525024414, "global_step": 22989, "epoch": 276} {"train_loss": -18.53480830824519, "global_step": 22990, "epoch": 276, "val_loss": 5985301.0} {"train_loss": -18.765457153320312, "global_step": 22991, "epoch": 277} {"train_loss": -18.850156784057617, "global_step": 22992, "epoch": 277} {"train_loss": -18.68161964416504, "global_step": 22993, "epoch": 277} {"train_loss": -18.48366355895996, "global_step": 22994, "epoch": 277} {"train_loss": -18.46247673034668, "global_step": 22995, "epoch": 277} {"train_loss": -18.577444076538086, "global_step": 22996, "epoch": 277} {"train_loss": -18.8034610748291, "global_step": 22997, "epoch": 277} {"train_loss": -18.746238708496094, "global_step": 22998, "epoch": 277} {"train_loss": -18.368972778320312, "global_step": 22999, "epoch": 277} {"train_loss": -18.372318267822266, "global_step": 23000, "epoch": 277} {"train_loss": -18.497892379760742, "global_step": 23001, "epoch": 277} {"train_loss": -18.881330490112305, "global_step": 23002, "epoch": 277} {"train_loss": -18.78021240234375, "global_step": 23003, "epoch": 277} {"train_loss": -18.490917205810547, "global_step": 23004, "epoch": 277} {"train_loss": -18.5627384185791, "global_step": 23005, "epoch": 277} {"train_loss": -18.43916893005371, "global_step": 23006, "epoch": 277} {"train_loss": -18.657184600830078, "global_step": 23007, "epoch": 277} {"train_loss": -18.38688850402832, "global_step": 23008, "epoch": 277} {"train_loss": -18.60063934326172, "global_step": 23009, "epoch": 277} {"train_loss": -18.45802879333496, "global_step": 23010, "epoch": 277} {"train_loss": -18.537256240844727, "global_step": 23011, "epoch": 277} {"train_loss": -18.571033477783203, "global_step": 23012, "epoch": 277} {"train_loss": -18.176252365112305, "global_step": 23013, "epoch": 277} {"train_loss": -18.18708610534668, "global_step": 23014, "epoch": 277} {"train_loss": -18.633676528930664, "global_step": 23015, "epoch": 277} {"train_loss": -18.595809936523438, "global_step": 23016, "epoch": 277} {"train_loss": -18.619657516479492, "global_step": 23017, "epoch": 277} {"train_loss": -18.333959579467773, "global_step": 23018, "epoch": 277} {"train_loss": -18.75288963317871, "global_step": 23019, "epoch": 277} {"train_loss": -18.305164337158203, "global_step": 23020, "epoch": 277} {"train_loss": -18.418968200683594, "global_step": 23021, "epoch": 277} {"train_loss": -18.49777603149414, "global_step": 23022, "epoch": 277} {"train_loss": -18.83053970336914, "global_step": 23023, "epoch": 277} {"train_loss": -18.811054229736328, "global_step": 23024, "epoch": 277} {"train_loss": -18.52096939086914, "global_step": 23025, "epoch": 277} {"train_loss": -18.376007080078125, "global_step": 23026, "epoch": 277} {"train_loss": -18.62542152404785, "global_step": 23027, "epoch": 277} {"train_loss": -18.239805221557617, "global_step": 23028, "epoch": 277} {"train_loss": -18.465932846069336, "global_step": 23029, "epoch": 277} {"train_loss": -18.474241256713867, "global_step": 23030, "epoch": 277} {"train_loss": -18.372543334960938, "global_step": 23031, "epoch": 277} {"train_loss": -18.973081588745117, "global_step": 23032, "epoch": 277} {"train_loss": -18.199411392211914, "global_step": 23033, "epoch": 277} {"train_loss": -18.59883689880371, "global_step": 23034, "epoch": 277} {"train_loss": -18.5534725189209, "global_step": 23035, "epoch": 277} {"train_loss": -18.395448684692383, "global_step": 23036, "epoch": 277} {"train_loss": -18.6478271484375, "global_step": 23037, "epoch": 277} {"train_loss": -18.481569290161133, "global_step": 23038, "epoch": 277} {"train_loss": -18.836414337158203, "global_step": 23039, "epoch": 277} {"train_loss": -18.480987548828125, "global_step": 23040, "epoch": 277} {"train_loss": -18.469436645507812, "global_step": 23041, "epoch": 277} {"train_loss": -18.622745513916016, "global_step": 23042, "epoch": 277} {"train_loss": -18.357358932495117, "global_step": 23043, "epoch": 277} {"train_loss": -19.220834732055664, "global_step": 23044, "epoch": 277} {"train_loss": -18.572021484375, "global_step": 23045, "epoch": 277} {"train_loss": -18.46299171447754, "global_step": 23046, "epoch": 277} {"train_loss": -18.538864135742188, "global_step": 23047, "epoch": 277} {"train_loss": -18.3160457611084, "global_step": 23048, "epoch": 277} {"train_loss": -18.653745651245117, "global_step": 23049, "epoch": 277} {"train_loss": -18.7595157623291, "global_step": 23050, "epoch": 277} {"train_loss": -18.605127334594727, "global_step": 23051, "epoch": 277} {"train_loss": -18.8785457611084, "global_step": 23052, "epoch": 277} {"train_loss": -18.656417846679688, "global_step": 23053, "epoch": 277} {"train_loss": -18.43368911743164, "global_step": 23054, "epoch": 277} {"train_loss": -18.55923843383789, "global_step": 23055, "epoch": 277} {"train_loss": -18.669462203979492, "global_step": 23056, "epoch": 277} {"train_loss": -18.418476104736328, "global_step": 23057, "epoch": 277} {"train_loss": -18.289907455444336, "global_step": 23058, "epoch": 277} {"train_loss": -18.5303955078125, "global_step": 23059, "epoch": 277} {"train_loss": -18.49104118347168, "global_step": 23060, "epoch": 277} {"train_loss": -18.43181800842285, "global_step": 23061, "epoch": 277} {"train_loss": -18.195837020874023, "global_step": 23062, "epoch": 277} {"train_loss": -18.86282730102539, "global_step": 23063, "epoch": 277} {"train_loss": -18.520851135253906, "global_step": 23064, "epoch": 277} {"train_loss": -18.332483291625977, "global_step": 23065, "epoch": 277} {"train_loss": -18.299409866333008, "global_step": 23066, "epoch": 277} {"train_loss": -18.36937141418457, "global_step": 23067, "epoch": 277} {"train_loss": -18.69917106628418, "global_step": 23068, "epoch": 277} {"train_loss": -18.709007263183594, "global_step": 23069, "epoch": 277} {"train_loss": -18.468708038330078, "global_step": 23070, "epoch": 277} {"train_loss": -18.7825984954834, "global_step": 23071, "epoch": 277} {"train_loss": -18.783323287963867, "global_step": 23072, "epoch": 277} {"train_loss": -18.56421845217785, "global_step": 23073, "epoch": 277, "val_loss": 6073892.0} {"train_loss": -17.920557022094727, "global_step": 23074, "epoch": 278} {"train_loss": -18.390771865844727, "global_step": 23075, "epoch": 278} {"train_loss": -17.95118522644043, "global_step": 23076, "epoch": 278} {"train_loss": -18.55267333984375, "global_step": 23077, "epoch": 278} {"train_loss": -18.275888442993164, "global_step": 23078, "epoch": 278} {"train_loss": -18.160018920898438, "global_step": 23079, "epoch": 278} {"train_loss": -18.497629165649414, "global_step": 23080, "epoch": 278} {"train_loss": -18.2664852142334, "global_step": 23081, "epoch": 278} {"train_loss": -18.200307846069336, "global_step": 23082, "epoch": 278} {"train_loss": -18.349958419799805, "global_step": 23083, "epoch": 278} {"train_loss": -18.611103057861328, "global_step": 23084, "epoch": 278} {"train_loss": -18.485105514526367, "global_step": 23085, "epoch": 278} {"train_loss": -18.54378890991211, "global_step": 23086, "epoch": 278} {"train_loss": -18.6467342376709, "global_step": 23087, "epoch": 278} {"train_loss": -18.289966583251953, "global_step": 23088, "epoch": 278} {"train_loss": -18.92273712158203, "global_step": 23089, "epoch": 278} {"train_loss": -18.49601173400879, "global_step": 23090, "epoch": 278} {"train_loss": -18.585466384887695, "global_step": 23091, "epoch": 278} {"train_loss": -18.64976692199707, "global_step": 23092, "epoch": 278} {"train_loss": -18.7211971282959, "global_step": 23093, "epoch": 278} {"train_loss": -18.583120346069336, "global_step": 23094, "epoch": 278} {"train_loss": -18.60940933227539, "global_step": 23095, "epoch": 278} {"train_loss": -18.82098960876465, "global_step": 23096, "epoch": 278} {"train_loss": -18.848892211914062, "global_step": 23097, "epoch": 278} {"train_loss": -18.396650314331055, "global_step": 23098, "epoch": 278} {"train_loss": -18.389102935791016, "global_step": 23099, "epoch": 278} {"train_loss": -18.447818756103516, "global_step": 23100, "epoch": 278} {"train_loss": -18.338111877441406, "global_step": 23101, "epoch": 278} {"train_loss": -18.48884391784668, "global_step": 23102, "epoch": 278} {"train_loss": -18.232290267944336, "global_step": 23103, "epoch": 278} {"train_loss": -18.70802879333496, "global_step": 23104, "epoch": 278} {"train_loss": -18.270368576049805, "global_step": 23105, "epoch": 278} {"train_loss": -18.55225372314453, "global_step": 23106, "epoch": 278} {"train_loss": -18.514997482299805, "global_step": 23107, "epoch": 278} {"train_loss": -18.70052146911621, "global_step": 23108, "epoch": 278} {"train_loss": -18.604583740234375, "global_step": 23109, "epoch": 278} {"train_loss": -18.22146987915039, "global_step": 23110, "epoch": 278} {"train_loss": -18.7554988861084, "global_step": 23111, "epoch": 278} {"train_loss": -18.785329818725586, "global_step": 23112, "epoch": 278} {"train_loss": -18.415796279907227, "global_step": 23113, "epoch": 278} {"train_loss": -18.526151657104492, "global_step": 23114, "epoch": 278} {"train_loss": -18.775426864624023, "global_step": 23115, "epoch": 278} {"train_loss": -18.60959815979004, "global_step": 23116, "epoch": 278} {"train_loss": -18.597896575927734, "global_step": 23117, "epoch": 278} {"train_loss": -18.426254272460938, "global_step": 23118, "epoch": 278} {"train_loss": -18.31072235107422, "global_step": 23119, "epoch": 278} {"train_loss": -18.80167007446289, "global_step": 23120, "epoch": 278} {"train_loss": -18.625686645507812, "global_step": 23121, "epoch": 278} {"train_loss": -18.340076446533203, "global_step": 23122, "epoch": 278} {"train_loss": -18.511587142944336, "global_step": 23123, "epoch": 278} {"train_loss": -18.5858097076416, "global_step": 23124, "epoch": 278} {"train_loss": -18.645008087158203, "global_step": 23125, "epoch": 278} {"train_loss": -18.508939743041992, "global_step": 23126, "epoch": 278} {"train_loss": -18.403812408447266, "global_step": 23127, "epoch": 278} {"train_loss": -18.477933883666992, "global_step": 23128, "epoch": 278} {"train_loss": -18.6317195892334, "global_step": 23129, "epoch": 278} {"train_loss": -18.63501739501953, "global_step": 23130, "epoch": 278} {"train_loss": -18.494184494018555, "global_step": 23131, "epoch": 278} {"train_loss": -18.79486656188965, "global_step": 23132, "epoch": 278} {"train_loss": -18.82122230529785, "global_step": 23133, "epoch": 278} {"train_loss": -18.655929565429688, "global_step": 23134, "epoch": 278} {"train_loss": -18.792882919311523, "global_step": 23135, "epoch": 278} {"train_loss": -18.630126953125, "global_step": 23136, "epoch": 278} {"train_loss": -18.707120895385742, "global_step": 23137, "epoch": 278} {"train_loss": -18.41454315185547, "global_step": 23138, "epoch": 278} {"train_loss": -18.674245834350586, "global_step": 23139, "epoch": 278} {"train_loss": -18.10780143737793, "global_step": 23140, "epoch": 278} {"train_loss": -18.777664184570312, "global_step": 23141, "epoch": 278} {"train_loss": -18.578022003173828, "global_step": 23142, "epoch": 278} {"train_loss": -18.86327362060547, "global_step": 23143, "epoch": 278} {"train_loss": -18.741859436035156, "global_step": 23144, "epoch": 278} {"train_loss": -19.087228775024414, "global_step": 23145, "epoch": 278} {"train_loss": -18.418685913085938, "global_step": 23146, "epoch": 278} {"train_loss": -18.715246200561523, "global_step": 23147, "epoch": 278} {"train_loss": -18.378625869750977, "global_step": 23148, "epoch": 278} {"train_loss": -18.475793838500977, "global_step": 23149, "epoch": 278} {"train_loss": -18.472122192382812, "global_step": 23150, "epoch": 278} {"train_loss": -18.54379653930664, "global_step": 23151, "epoch": 278} {"train_loss": -18.567276000976562, "global_step": 23152, "epoch": 278} {"train_loss": -18.931297302246094, "global_step": 23153, "epoch": 278} {"train_loss": -18.287906646728516, "global_step": 23154, "epoch": 278} {"train_loss": -18.726560592651367, "global_step": 23155, "epoch": 278} {"train_loss": -18.55028890127159, "global_step": 23156, "epoch": 278, "val_loss": 5935090.5} {"train_loss": -18.594892501831055, "global_step": 23157, "epoch": 279} {"train_loss": -18.346853256225586, "global_step": 23158, "epoch": 279} {"train_loss": -18.649547576904297, "global_step": 23159, "epoch": 279} {"train_loss": -18.47378158569336, "global_step": 23160, "epoch": 279} {"train_loss": -18.33544158935547, "global_step": 23161, "epoch": 279} {"train_loss": -18.473344802856445, "global_step": 23162, "epoch": 279} {"train_loss": -18.652578353881836, "global_step": 23163, "epoch": 279} {"train_loss": -18.41360855102539, "global_step": 23164, "epoch": 279} {"train_loss": -18.72151756286621, "global_step": 23165, "epoch": 279} {"train_loss": -18.459287643432617, "global_step": 23166, "epoch": 279} {"train_loss": -18.7186222076416, "global_step": 23167, "epoch": 279} {"train_loss": -18.385730743408203, "global_step": 23168, "epoch": 279} {"train_loss": -18.605703353881836, "global_step": 23169, "epoch": 279} {"train_loss": -18.49563980102539, "global_step": 23170, "epoch": 279} {"train_loss": -18.48931884765625, "global_step": 23171, "epoch": 279} {"train_loss": -18.54266929626465, "global_step": 23172, "epoch": 279} {"train_loss": -18.34075927734375, "global_step": 23173, "epoch": 279} {"train_loss": -18.251867294311523, "global_step": 23174, "epoch": 279} {"train_loss": -18.21677589416504, "global_step": 23175, "epoch": 279} {"train_loss": -18.618518829345703, "global_step": 23176, "epoch": 279} {"train_loss": -18.50856590270996, "global_step": 23177, "epoch": 279} {"train_loss": -18.398937225341797, "global_step": 23178, "epoch": 279} {"train_loss": -18.85975456237793, "global_step": 23179, "epoch": 279} {"train_loss": -18.505460739135742, "global_step": 23180, "epoch": 279} {"train_loss": -18.756153106689453, "global_step": 23181, "epoch": 279} {"train_loss": -18.598554611206055, "global_step": 23182, "epoch": 279} {"train_loss": -18.759090423583984, "global_step": 23183, "epoch": 279} {"train_loss": -18.741147994995117, "global_step": 23184, "epoch": 279} {"train_loss": -18.45387077331543, "global_step": 23185, "epoch": 279} {"train_loss": -18.476421356201172, "global_step": 23186, "epoch": 279} {"train_loss": -18.20400047302246, "global_step": 23187, "epoch": 279} {"train_loss": -18.48815155029297, "global_step": 23188, "epoch": 279} {"train_loss": -18.741579055786133, "global_step": 23189, "epoch": 279} {"train_loss": -18.88262367248535, "global_step": 23190, "epoch": 279} {"train_loss": -18.674589157104492, "global_step": 23191, "epoch": 279} {"train_loss": -18.934711456298828, "global_step": 23192, "epoch": 279} {"train_loss": -18.37544059753418, "global_step": 23193, "epoch": 279} {"train_loss": -18.559858322143555, "global_step": 23194, "epoch": 279} {"train_loss": -18.646493911743164, "global_step": 23195, "epoch": 279} {"train_loss": -18.24312400817871, "global_step": 23196, "epoch": 279} {"train_loss": -18.66188621520996, "global_step": 23197, "epoch": 279} {"train_loss": -18.793729782104492, "global_step": 23198, "epoch": 279} {"train_loss": -18.609216690063477, "global_step": 23199, "epoch": 279} {"train_loss": -18.50204086303711, "global_step": 23200, "epoch": 279} {"train_loss": -18.987899780273438, "global_step": 23201, "epoch": 279} {"train_loss": -18.39681053161621, "global_step": 23202, "epoch": 279} {"train_loss": -18.053939819335938, "global_step": 23203, "epoch": 279} {"train_loss": -18.471521377563477, "global_step": 23204, "epoch": 279} {"train_loss": -18.72234535217285, "global_step": 23205, "epoch": 279} {"train_loss": -18.198495864868164, "global_step": 23206, "epoch": 279} {"train_loss": -18.3212947845459, "global_step": 23207, "epoch": 279} {"train_loss": -18.78961944580078, "global_step": 23208, "epoch": 279} {"train_loss": -18.566638946533203, "global_step": 23209, "epoch": 279} {"train_loss": -18.40879249572754, "global_step": 23210, "epoch": 279} {"train_loss": -18.753992080688477, "global_step": 23211, "epoch": 279} {"train_loss": -18.654010772705078, "global_step": 23212, "epoch": 279} {"train_loss": -18.946441650390625, "global_step": 23213, "epoch": 279} {"train_loss": -18.629745483398438, "global_step": 23214, "epoch": 279} {"train_loss": -18.559818267822266, "global_step": 23215, "epoch": 279} {"train_loss": -18.85663414001465, "global_step": 23216, "epoch": 279} {"train_loss": -18.358718872070312, "global_step": 23217, "epoch": 279} {"train_loss": -18.375722885131836, "global_step": 23218, "epoch": 279} {"train_loss": -18.763961791992188, "global_step": 23219, "epoch": 279} {"train_loss": -18.873254776000977, "global_step": 23220, "epoch": 279} {"train_loss": -18.33165168762207, "global_step": 23221, "epoch": 279} {"train_loss": -18.1995792388916, "global_step": 23222, "epoch": 279} {"train_loss": -18.72565269470215, "global_step": 23223, "epoch": 279} {"train_loss": -18.770992279052734, "global_step": 23224, "epoch": 279} {"train_loss": -18.95051383972168, "global_step": 23225, "epoch": 279} {"train_loss": -18.428617477416992, "global_step": 23226, "epoch": 279} {"train_loss": -18.352155685424805, "global_step": 23227, "epoch": 279} {"train_loss": -18.31427574157715, "global_step": 23228, "epoch": 279} {"train_loss": -18.82020378112793, "global_step": 23229, "epoch": 279} {"train_loss": -18.681638717651367, "global_step": 23230, "epoch": 279} {"train_loss": -18.272335052490234, "global_step": 23231, "epoch": 279} {"train_loss": -18.720911026000977, "global_step": 23232, "epoch": 279} {"train_loss": -18.748504638671875, "global_step": 23233, "epoch": 279} {"train_loss": -18.426067352294922, "global_step": 23234, "epoch": 279} {"train_loss": -18.434921264648438, "global_step": 23235, "epoch": 279} {"train_loss": -18.425968170166016, "global_step": 23236, "epoch": 279} {"train_loss": -18.386999130249023, "global_step": 23237, "epoch": 279} {"train_loss": -18.513391494750977, "global_step": 23238, "epoch": 279} {"train_loss": -18.56051316318742, "global_step": 23239, "epoch": 279, "val_loss": 5862216.5} {"train_loss": -18.125951766967773, "global_step": 23240, "epoch": 280} {"train_loss": -17.99928855895996, "global_step": 23241, "epoch": 280} {"train_loss": -18.547121047973633, "global_step": 23242, "epoch": 280} {"train_loss": -18.445648193359375, "global_step": 23243, "epoch": 280} {"train_loss": -18.424028396606445, "global_step": 23244, "epoch": 280} {"train_loss": -18.269651412963867, "global_step": 23245, "epoch": 280} {"train_loss": -18.445579528808594, "global_step": 23246, "epoch": 280} {"train_loss": -18.367324829101562, "global_step": 23247, "epoch": 280} {"train_loss": -18.217512130737305, "global_step": 23248, "epoch": 280} {"train_loss": -18.347780227661133, "global_step": 23249, "epoch": 280} {"train_loss": -18.667444229125977, "global_step": 23250, "epoch": 280} {"train_loss": -18.442365646362305, "global_step": 23251, "epoch": 280} {"train_loss": -18.38465118408203, "global_step": 23252, "epoch": 280} {"train_loss": -18.336469650268555, "global_step": 23253, "epoch": 280} {"train_loss": -18.536483764648438, "global_step": 23254, "epoch": 280} {"train_loss": -18.43329429626465, "global_step": 23255, "epoch": 280} {"train_loss": -18.452688217163086, "global_step": 23256, "epoch": 280} {"train_loss": -18.401962280273438, "global_step": 23257, "epoch": 280} {"train_loss": -18.508874893188477, "global_step": 23258, "epoch": 280} {"train_loss": -18.83057975769043, "global_step": 23259, "epoch": 280} {"train_loss": -18.604459762573242, "global_step": 23260, "epoch": 280} {"train_loss": -18.864410400390625, "global_step": 23261, "epoch": 280} {"train_loss": -18.84102439880371, "global_step": 23262, "epoch": 280} {"train_loss": -18.590641021728516, "global_step": 23263, "epoch": 280} {"train_loss": -18.275745391845703, "global_step": 23264, "epoch": 280} {"train_loss": -17.966665267944336, "global_step": 23265, "epoch": 280} {"train_loss": -18.720355987548828, "global_step": 23266, "epoch": 280} {"train_loss": -18.419422149658203, "global_step": 23267, "epoch": 280} {"train_loss": -18.68768882751465, "global_step": 23268, "epoch": 280} {"train_loss": -18.374670028686523, "global_step": 23269, "epoch": 280} {"train_loss": -18.555110931396484, "global_step": 23270, "epoch": 280} {"train_loss": -18.16379165649414, "global_step": 23271, "epoch": 280} {"train_loss": -18.474058151245117, "global_step": 23272, "epoch": 280} {"train_loss": -18.4714412689209, "global_step": 23273, "epoch": 280} {"train_loss": -18.696502685546875, "global_step": 23274, "epoch": 280} {"train_loss": -18.46862030029297, "global_step": 23275, "epoch": 280} {"train_loss": -18.58310317993164, "global_step": 23276, "epoch": 280} {"train_loss": -18.51093101501465, "global_step": 23277, "epoch": 280} {"train_loss": -18.692228317260742, "global_step": 23278, "epoch": 280} {"train_loss": -18.442955017089844, "global_step": 23279, "epoch": 280} {"train_loss": -18.664159774780273, "global_step": 23280, "epoch": 280} {"train_loss": -18.748756408691406, "global_step": 23281, "epoch": 280} {"train_loss": -18.520673751831055, "global_step": 23282, "epoch": 280} {"train_loss": -18.715744018554688, "global_step": 23283, "epoch": 280} {"train_loss": -18.779754638671875, "global_step": 23284, "epoch": 280} {"train_loss": -18.191869735717773, "global_step": 23285, "epoch": 280} {"train_loss": -18.31995964050293, "global_step": 23286, "epoch": 280} {"train_loss": -18.767101287841797, "global_step": 23287, "epoch": 280} {"train_loss": -18.31491470336914, "global_step": 23288, "epoch": 280} {"train_loss": -18.72699546813965, "global_step": 23289, "epoch": 280} {"train_loss": -18.778583526611328, "global_step": 23290, "epoch": 280} {"train_loss": -18.889236450195312, "global_step": 23291, "epoch": 280} {"train_loss": -18.567230224609375, "global_step": 23292, "epoch": 280} {"train_loss": -18.870800018310547, "global_step": 23293, "epoch": 280} {"train_loss": -18.602928161621094, "global_step": 23294, "epoch": 280} {"train_loss": -18.210397720336914, "global_step": 23295, "epoch": 280} {"train_loss": -18.680383682250977, "global_step": 23296, "epoch": 280} {"train_loss": -18.268157958984375, "global_step": 23297, "epoch": 280} {"train_loss": -18.55510711669922, "global_step": 23298, "epoch": 280} {"train_loss": -18.50916862487793, "global_step": 23299, "epoch": 280} {"train_loss": -18.687082290649414, "global_step": 23300, "epoch": 280} {"train_loss": -18.72596549987793, "global_step": 23301, "epoch": 280} {"train_loss": -18.765663146972656, "global_step": 23302, "epoch": 280} {"train_loss": -18.865741729736328, "global_step": 23303, "epoch": 280} {"train_loss": -18.629486083984375, "global_step": 23304, "epoch": 280} {"train_loss": -18.71284294128418, "global_step": 23305, "epoch": 280} {"train_loss": -18.49492073059082, "global_step": 23306, "epoch": 280} {"train_loss": -18.85622215270996, "global_step": 23307, "epoch": 280} {"train_loss": -18.473722457885742, "global_step": 23308, "epoch": 280} {"train_loss": -18.452978134155273, "global_step": 23309, "epoch": 280} {"train_loss": -18.827899932861328, "global_step": 23310, "epoch": 280} {"train_loss": -18.61847686767578, "global_step": 23311, "epoch": 280} {"train_loss": -18.899381637573242, "global_step": 23312, "epoch": 280} {"train_loss": -18.829723358154297, "global_step": 23313, "epoch": 280} {"train_loss": -18.470874786376953, "global_step": 23314, "epoch": 280} {"train_loss": -18.5120906829834, "global_step": 23315, "epoch": 280} {"train_loss": -18.455486297607422, "global_step": 23316, "epoch": 280} {"train_loss": -18.688631057739258, "global_step": 23317, "epoch": 280} {"train_loss": -18.491695404052734, "global_step": 23318, "epoch": 280} {"train_loss": -18.61785888671875, "global_step": 23319, "epoch": 280} {"train_loss": -18.910362243652344, "global_step": 23320, "epoch": 280} {"train_loss": -18.640811920166016, "global_step": 23321, "epoch": 280} {"train_loss": -18.544083353984785, "global_step": 23322, "epoch": 280, "val_loss": 5901527.5} {"train_loss": -18.39815330505371, "global_step": 23323, "epoch": 281} {"train_loss": -18.518091201782227, "global_step": 23324, "epoch": 281} {"train_loss": -18.127578735351562, "global_step": 23325, "epoch": 281} {"train_loss": -18.431241989135742, "global_step": 23326, "epoch": 281} {"train_loss": -18.3721981048584, "global_step": 23327, "epoch": 281} {"train_loss": -18.68058204650879, "global_step": 23328, "epoch": 281} {"train_loss": -18.804443359375, "global_step": 23329, "epoch": 281} {"train_loss": -18.74622917175293, "global_step": 23330, "epoch": 281} {"train_loss": -18.46943473815918, "global_step": 23331, "epoch": 281} {"train_loss": -18.60834312438965, "global_step": 23332, "epoch": 281} {"train_loss": -18.531179428100586, "global_step": 23333, "epoch": 281} {"train_loss": -18.16230583190918, "global_step": 23334, "epoch": 281} {"train_loss": -18.018712997436523, "global_step": 23335, "epoch": 281} {"train_loss": -18.202131271362305, "global_step": 23336, "epoch": 281} {"train_loss": -18.729591369628906, "global_step": 23337, "epoch": 281} {"train_loss": -18.970327377319336, "global_step": 23338, "epoch": 281} {"train_loss": -18.593677520751953, "global_step": 23339, "epoch": 281} {"train_loss": -19.064634323120117, "global_step": 23340, "epoch": 281} {"train_loss": -18.298480987548828, "global_step": 23341, "epoch": 281} {"train_loss": -18.7857723236084, "global_step": 23342, "epoch": 281} {"train_loss": -18.582786560058594, "global_step": 23343, "epoch": 281} {"train_loss": -18.318748474121094, "global_step": 23344, "epoch": 281} {"train_loss": -18.753515243530273, "global_step": 23345, "epoch": 281} {"train_loss": -18.78118324279785, "global_step": 23346, "epoch": 281} {"train_loss": -18.36391258239746, "global_step": 23347, "epoch": 281} {"train_loss": -18.749160766601562, "global_step": 23348, "epoch": 281} {"train_loss": -18.213327407836914, "global_step": 23349, "epoch": 281} {"train_loss": -18.930042266845703, "global_step": 23350, "epoch": 281} {"train_loss": -18.375829696655273, "global_step": 23351, "epoch": 281} {"train_loss": -18.216636657714844, "global_step": 23352, "epoch": 281} {"train_loss": -18.737577438354492, "global_step": 23353, "epoch": 281} {"train_loss": -18.305341720581055, "global_step": 23354, "epoch": 281} {"train_loss": -18.7379150390625, "global_step": 23355, "epoch": 281} {"train_loss": -18.527442932128906, "global_step": 23356, "epoch": 281} {"train_loss": -18.929920196533203, "global_step": 23357, "epoch": 281} {"train_loss": -18.63361167907715, "global_step": 23358, "epoch": 281} {"train_loss": -18.644359588623047, "global_step": 23359, "epoch": 281} {"train_loss": -18.715425491333008, "global_step": 23360, "epoch": 281} {"train_loss": -18.71149444580078, "global_step": 23361, "epoch": 281} {"train_loss": -18.845712661743164, "global_step": 23362, "epoch": 281} {"train_loss": -18.959318161010742, "global_step": 23363, "epoch": 281} {"train_loss": -18.844005584716797, "global_step": 23364, "epoch": 281} {"train_loss": -17.912620544433594, "global_step": 23365, "epoch": 281} {"train_loss": -18.517345428466797, "global_step": 23366, "epoch": 281} {"train_loss": -18.754087448120117, "global_step": 23367, "epoch": 281} {"train_loss": -18.512126922607422, "global_step": 23368, "epoch": 281} {"train_loss": -18.334270477294922, "global_step": 23369, "epoch": 281} {"train_loss": -18.455387115478516, "global_step": 23370, "epoch": 281} {"train_loss": -18.93054962158203, "global_step": 23371, "epoch": 281} {"train_loss": -18.631460189819336, "global_step": 23372, "epoch": 281} {"train_loss": -18.367507934570312, "global_step": 23373, "epoch": 281} {"train_loss": -18.550065994262695, "global_step": 23374, "epoch": 281} {"train_loss": -18.154958724975586, "global_step": 23375, "epoch": 281} {"train_loss": -18.380645751953125, "global_step": 23376, "epoch": 281} {"train_loss": -18.652774810791016, "global_step": 23377, "epoch": 281} {"train_loss": -18.388805389404297, "global_step": 23378, "epoch": 281} {"train_loss": -19.01202964782715, "global_step": 23379, "epoch": 281} {"train_loss": -18.632658004760742, "global_step": 23380, "epoch": 281} {"train_loss": -18.767932891845703, "global_step": 23381, "epoch": 281} {"train_loss": -18.669408798217773, "global_step": 23382, "epoch": 281} {"train_loss": -19.015174865722656, "global_step": 23383, "epoch": 281} {"train_loss": -18.668258666992188, "global_step": 23384, "epoch": 281} {"train_loss": -18.487638473510742, "global_step": 23385, "epoch": 281} {"train_loss": -18.78367042541504, "global_step": 23386, "epoch": 281} {"train_loss": -18.93490219116211, "global_step": 23387, "epoch": 281} {"train_loss": -18.70527458190918, "global_step": 23388, "epoch": 281} {"train_loss": -18.446136474609375, "global_step": 23389, "epoch": 281} {"train_loss": -18.972156524658203, "global_step": 23390, "epoch": 281} {"train_loss": -18.306299209594727, "global_step": 23391, "epoch": 281} {"train_loss": -18.656452178955078, "global_step": 23392, "epoch": 281} {"train_loss": -18.770177841186523, "global_step": 23393, "epoch": 281} {"train_loss": -18.208295822143555, "global_step": 23394, "epoch": 281} {"train_loss": -18.792654037475586, "global_step": 23395, "epoch": 281} {"train_loss": -18.52308464050293, "global_step": 23396, "epoch": 281} {"train_loss": -18.075769424438477, "global_step": 23397, "epoch": 281} {"train_loss": -18.35345458984375, "global_step": 23398, "epoch": 281} {"train_loss": -18.63020896911621, "global_step": 23399, "epoch": 281} {"train_loss": -18.382156372070312, "global_step": 23400, "epoch": 281} {"train_loss": -18.52346420288086, "global_step": 23401, "epoch": 281} {"train_loss": -18.44769859313965, "global_step": 23402, "epoch": 281} {"train_loss": -18.702096939086914, "global_step": 23403, "epoch": 281} {"train_loss": -18.176612854003906, "global_step": 23404, "epoch": 281} {"train_loss": -18.54449074526867, "global_step": 23405, "epoch": 281, "val_loss": 6032661.5} {"train_loss": -18.011274337768555, "global_step": 23406, "epoch": 282} {"train_loss": -18.06324577331543, "global_step": 23407, "epoch": 282} {"train_loss": -18.27700424194336, "global_step": 23408, "epoch": 282} {"train_loss": -18.31755256652832, "global_step": 23409, "epoch": 282} {"train_loss": -18.20961570739746, "global_step": 23410, "epoch": 282} {"train_loss": -18.352548599243164, "global_step": 23411, "epoch": 282} {"train_loss": -18.3624324798584, "global_step": 23412, "epoch": 282} {"train_loss": -18.1283016204834, "global_step": 23413, "epoch": 282} {"train_loss": -18.26224708557129, "global_step": 23414, "epoch": 282} {"train_loss": -18.435047149658203, "global_step": 23415, "epoch": 282} {"train_loss": -18.26116371154785, "global_step": 23416, "epoch": 282} {"train_loss": -18.56548309326172, "global_step": 23417, "epoch": 282} {"train_loss": -18.464811325073242, "global_step": 23418, "epoch": 282} {"train_loss": -18.59364891052246, "global_step": 23419, "epoch": 282} {"train_loss": -18.11806297302246, "global_step": 23420, "epoch": 282} {"train_loss": -18.449613571166992, "global_step": 23421, "epoch": 282} {"train_loss": -18.40374755859375, "global_step": 23422, "epoch": 282} {"train_loss": -18.27515983581543, "global_step": 23423, "epoch": 282} {"train_loss": -18.39190673828125, "global_step": 23424, "epoch": 282} {"train_loss": -18.37114906311035, "global_step": 23425, "epoch": 282} {"train_loss": -18.664125442504883, "global_step": 23426, "epoch": 282} {"train_loss": -18.363813400268555, "global_step": 23427, "epoch": 282} {"train_loss": -18.489011764526367, "global_step": 23428, "epoch": 282} {"train_loss": -18.696273803710938, "global_step": 23429, "epoch": 282} {"train_loss": -18.592357635498047, "global_step": 23430, "epoch": 282} {"train_loss": -18.73316764831543, "global_step": 23431, "epoch": 282} {"train_loss": -18.69527244567871, "global_step": 23432, "epoch": 282} {"train_loss": -18.4837589263916, "global_step": 23433, "epoch": 282} {"train_loss": -18.733186721801758, "global_step": 23434, "epoch": 282} {"train_loss": -18.747501373291016, "global_step": 23435, "epoch": 282} {"train_loss": -18.844560623168945, "global_step": 23436, "epoch": 282} {"train_loss": -18.326963424682617, "global_step": 23437, "epoch": 282} {"train_loss": -18.80834197998047, "global_step": 23438, "epoch": 282} {"train_loss": -18.65570640563965, "global_step": 23439, "epoch": 282} {"train_loss": -18.64985466003418, "global_step": 23440, "epoch": 282} {"train_loss": -18.51094627380371, "global_step": 23441, "epoch": 282} {"train_loss": -18.475202560424805, "global_step": 23442, "epoch": 282} {"train_loss": -18.43834114074707, "global_step": 23443, "epoch": 282} {"train_loss": -18.384180068969727, "global_step": 23444, "epoch": 282} {"train_loss": -18.69086265563965, "global_step": 23445, "epoch": 282} {"train_loss": -18.671064376831055, "global_step": 23446, "epoch": 282} {"train_loss": -18.554752349853516, "global_step": 23447, "epoch": 282} {"train_loss": -18.74751091003418, "global_step": 23448, "epoch": 282} {"train_loss": -18.646530151367188, "global_step": 23449, "epoch": 282} {"train_loss": -18.896942138671875, "global_step": 23450, "epoch": 282} {"train_loss": -18.309101104736328, "global_step": 23451, "epoch": 282} {"train_loss": -18.54705810546875, "global_step": 23452, "epoch": 282} {"train_loss": -18.34760093688965, "global_step": 23453, "epoch": 282} {"train_loss": -18.830488204956055, "global_step": 23454, "epoch": 282} {"train_loss": -18.571739196777344, "global_step": 23455, "epoch": 282} {"train_loss": -18.515975952148438, "global_step": 23456, "epoch": 282} {"train_loss": -18.787893295288086, "global_step": 23457, "epoch": 282} {"train_loss": -18.423324584960938, "global_step": 23458, "epoch": 282} {"train_loss": -19.21689224243164, "global_step": 23459, "epoch": 282} {"train_loss": -18.22504997253418, "global_step": 23460, "epoch": 282} {"train_loss": -18.2055721282959, "global_step": 23461, "epoch": 282} {"train_loss": -19.10487174987793, "global_step": 23462, "epoch": 282} {"train_loss": -18.540517807006836, "global_step": 23463, "epoch": 282} {"train_loss": -18.7893009185791, "global_step": 23464, "epoch": 282} {"train_loss": -18.962013244628906, "global_step": 23465, "epoch": 282} {"train_loss": -18.510913848876953, "global_step": 23466, "epoch": 282} {"train_loss": -18.770767211914062, "global_step": 23467, "epoch": 282} {"train_loss": -18.404539108276367, "global_step": 23468, "epoch": 282} {"train_loss": -18.272705078125, "global_step": 23469, "epoch": 282} {"train_loss": -18.525955200195312, "global_step": 23470, "epoch": 282} {"train_loss": -18.490442276000977, "global_step": 23471, "epoch": 282} {"train_loss": -18.177114486694336, "global_step": 23472, "epoch": 282} {"train_loss": -18.48739242553711, "global_step": 23473, "epoch": 282} {"train_loss": -18.32521629333496, "global_step": 23474, "epoch": 282} {"train_loss": -18.6826171875, "global_step": 23475, "epoch": 282} {"train_loss": -18.47801399230957, "global_step": 23476, "epoch": 282} {"train_loss": -18.456090927124023, "global_step": 23477, "epoch": 282} {"train_loss": -18.786487579345703, "global_step": 23478, "epoch": 282} {"train_loss": -18.461118698120117, "global_step": 23479, "epoch": 282} {"train_loss": -18.32241439819336, "global_step": 23480, "epoch": 282} {"train_loss": -18.533294677734375, "global_step": 23481, "epoch": 282} {"train_loss": -18.32590675354004, "global_step": 23482, "epoch": 282} {"train_loss": -18.704578399658203, "global_step": 23483, "epoch": 282} {"train_loss": -18.493392944335938, "global_step": 23484, "epoch": 282} {"train_loss": -18.472625732421875, "global_step": 23485, "epoch": 282} {"train_loss": -18.704538345336914, "global_step": 23486, "epoch": 282} {"train_loss": -18.552011489868164, "global_step": 23487, "epoch": 282} {"train_loss": -18.51980696528791, "global_step": 23488, "epoch": 282, "val_loss": 5948648.0} {"train_loss": -18.109601974487305, "global_step": 23489, "epoch": 283} {"train_loss": -18.70296287536621, "global_step": 23490, "epoch": 283} {"train_loss": -18.721786499023438, "global_step": 23491, "epoch": 283} {"train_loss": -18.233718872070312, "global_step": 23492, "epoch": 283} {"train_loss": -18.669279098510742, "global_step": 23493, "epoch": 283} {"train_loss": -18.719112396240234, "global_step": 23494, "epoch": 283} {"train_loss": -18.583192825317383, "global_step": 23495, "epoch": 283} {"train_loss": -18.360315322875977, "global_step": 23496, "epoch": 283} {"train_loss": -18.339536666870117, "global_step": 23497, "epoch": 283} {"train_loss": -18.398239135742188, "global_step": 23498, "epoch": 283} {"train_loss": -18.4081974029541, "global_step": 23499, "epoch": 283} {"train_loss": -18.679166793823242, "global_step": 23500, "epoch": 283} {"train_loss": -18.43602752685547, "global_step": 23501, "epoch": 283} {"train_loss": -18.29633140563965, "global_step": 23502, "epoch": 283} {"train_loss": -18.556188583374023, "global_step": 23503, "epoch": 283} {"train_loss": -18.67154312133789, "global_step": 23504, "epoch": 283} {"train_loss": -17.901397705078125, "global_step": 23505, "epoch": 283} {"train_loss": -18.64417839050293, "global_step": 23506, "epoch": 283} {"train_loss": -18.47273063659668, "global_step": 23507, "epoch": 283} {"train_loss": -18.374588012695312, "global_step": 23508, "epoch": 283} {"train_loss": -18.1085147857666, "global_step": 23509, "epoch": 283} {"train_loss": -18.800291061401367, "global_step": 23510, "epoch": 283} {"train_loss": -18.804948806762695, "global_step": 23511, "epoch": 283} {"train_loss": -18.56868553161621, "global_step": 23512, "epoch": 283} {"train_loss": -18.459827423095703, "global_step": 23513, "epoch": 283} {"train_loss": -18.719913482666016, "global_step": 23514, "epoch": 283} {"train_loss": -18.62910270690918, "global_step": 23515, "epoch": 283} {"train_loss": -18.60634994506836, "global_step": 23516, "epoch": 283} {"train_loss": -18.42078971862793, "global_step": 23517, "epoch": 283} {"train_loss": -18.049453735351562, "global_step": 23518, "epoch": 283} {"train_loss": -18.852720260620117, "global_step": 23519, "epoch": 283} {"train_loss": -18.807392120361328, "global_step": 23520, "epoch": 283} {"train_loss": -18.35039710998535, "global_step": 23521, "epoch": 283} {"train_loss": -18.64232635498047, "global_step": 23522, "epoch": 283} {"train_loss": -18.37138557434082, "global_step": 23523, "epoch": 283} {"train_loss": -18.461591720581055, "global_step": 23524, "epoch": 283} {"train_loss": -18.83737564086914, "global_step": 23525, "epoch": 283} {"train_loss": -18.4585018157959, "global_step": 23526, "epoch": 283} {"train_loss": -18.586196899414062, "global_step": 23527, "epoch": 283} {"train_loss": -18.561084747314453, "global_step": 23528, "epoch": 283} {"train_loss": -18.878952026367188, "global_step": 23529, "epoch": 283} {"train_loss": -18.66327667236328, "global_step": 23530, "epoch": 283} {"train_loss": -18.549278259277344, "global_step": 23531, "epoch": 283} {"train_loss": -18.7657527923584, "global_step": 23532, "epoch": 283} {"train_loss": -18.57183265686035, "global_step": 23533, "epoch": 283} {"train_loss": -18.946317672729492, "global_step": 23534, "epoch": 283} {"train_loss": -18.665090560913086, "global_step": 23535, "epoch": 283} {"train_loss": -18.427743911743164, "global_step": 23536, "epoch": 283} {"train_loss": -18.701330184936523, "global_step": 23537, "epoch": 283} {"train_loss": -18.512104034423828, "global_step": 23538, "epoch": 283} {"train_loss": -18.989126205444336, "global_step": 23539, "epoch": 283} {"train_loss": -18.664865493774414, "global_step": 23540, "epoch": 283} {"train_loss": -18.486948013305664, "global_step": 23541, "epoch": 283} {"train_loss": -18.780643463134766, "global_step": 23542, "epoch": 283} {"train_loss": -18.777250289916992, "global_step": 23543, "epoch": 283} {"train_loss": -18.514083862304688, "global_step": 23544, "epoch": 283} {"train_loss": -18.370996475219727, "global_step": 23545, "epoch": 283} {"train_loss": -18.96685218811035, "global_step": 23546, "epoch": 283} {"train_loss": -18.63811683654785, "global_step": 23547, "epoch": 283} {"train_loss": -18.40266990661621, "global_step": 23548, "epoch": 283} {"train_loss": -18.959257125854492, "global_step": 23549, "epoch": 283} {"train_loss": -18.45511245727539, "global_step": 23550, "epoch": 283} {"train_loss": -18.714303970336914, "global_step": 23551, "epoch": 283} {"train_loss": -18.458267211914062, "global_step": 23552, "epoch": 283} {"train_loss": -18.345062255859375, "global_step": 23553, "epoch": 283} {"train_loss": -18.707321166992188, "global_step": 23554, "epoch": 283} {"train_loss": -18.53169059753418, "global_step": 23555, "epoch": 283} {"train_loss": -18.581388473510742, "global_step": 23556, "epoch": 283} {"train_loss": -18.76726722717285, "global_step": 23557, "epoch": 283} {"train_loss": -18.495771408081055, "global_step": 23558, "epoch": 283} {"train_loss": -18.756576538085938, "global_step": 23559, "epoch": 283} {"train_loss": -18.66245460510254, "global_step": 23560, "epoch": 283} {"train_loss": -18.53376007080078, "global_step": 23561, "epoch": 283} {"train_loss": -18.426137924194336, "global_step": 23562, "epoch": 283} {"train_loss": -18.286550521850586, "global_step": 23563, "epoch": 283} {"train_loss": -18.974655151367188, "global_step": 23564, "epoch": 283} {"train_loss": -18.440540313720703, "global_step": 23565, "epoch": 283} {"train_loss": -18.871570587158203, "global_step": 23566, "epoch": 283} {"train_loss": -18.585941314697266, "global_step": 23567, "epoch": 283} {"train_loss": -18.82628059387207, "global_step": 23568, "epoch": 283} {"train_loss": -18.662595748901367, "global_step": 23569, "epoch": 283} {"train_loss": -18.7149658203125, "global_step": 23570, "epoch": 283} {"train_loss": -18.59084301684276, "global_step": 23571, "epoch": 283, "val_loss": 5906767.0} {"train_loss": -18.519474029541016, "global_step": 23572, "epoch": 284} {"train_loss": -18.413694381713867, "global_step": 23573, "epoch": 284} {"train_loss": -18.627456665039062, "global_step": 23574, "epoch": 284} {"train_loss": -19.00507164001465, "global_step": 23575, "epoch": 284} {"train_loss": -18.75149154663086, "global_step": 23576, "epoch": 284} {"train_loss": -18.09903907775879, "global_step": 23577, "epoch": 284} {"train_loss": -18.731321334838867, "global_step": 23578, "epoch": 284} {"train_loss": -18.434968948364258, "global_step": 23579, "epoch": 284} {"train_loss": -18.942296981811523, "global_step": 23580, "epoch": 284} {"train_loss": -18.562448501586914, "global_step": 23581, "epoch": 284} {"train_loss": -18.622777938842773, "global_step": 23582, "epoch": 284} {"train_loss": -18.154783248901367, "global_step": 23583, "epoch": 284} {"train_loss": -18.615339279174805, "global_step": 23584, "epoch": 284} {"train_loss": -18.407316207885742, "global_step": 23585, "epoch": 284} {"train_loss": -18.348087310791016, "global_step": 23586, "epoch": 284} {"train_loss": -18.29194450378418, "global_step": 23587, "epoch": 284} {"train_loss": -18.62188720703125, "global_step": 23588, "epoch": 284} {"train_loss": -18.378101348876953, "global_step": 23589, "epoch": 284} {"train_loss": -18.42994499206543, "global_step": 23590, "epoch": 284} {"train_loss": -18.86163330078125, "global_step": 23591, "epoch": 284} {"train_loss": -18.946096420288086, "global_step": 23592, "epoch": 284} {"train_loss": -18.45736312866211, "global_step": 23593, "epoch": 284} {"train_loss": -18.61621856689453, "global_step": 23594, "epoch": 284} {"train_loss": -18.51874351501465, "global_step": 23595, "epoch": 284} {"train_loss": -18.385196685791016, "global_step": 23596, "epoch": 284} {"train_loss": -18.31466293334961, "global_step": 23597, "epoch": 284} {"train_loss": -18.615686416625977, "global_step": 23598, "epoch": 284} {"train_loss": -18.200885772705078, "global_step": 23599, "epoch": 284} {"train_loss": -18.90703582763672, "global_step": 23600, "epoch": 284} {"train_loss": -18.790048599243164, "global_step": 23601, "epoch": 284} {"train_loss": -18.98046112060547, "global_step": 23602, "epoch": 284} {"train_loss": -18.432636260986328, "global_step": 23603, "epoch": 284} {"train_loss": -18.493860244750977, "global_step": 23604, "epoch": 284} {"train_loss": -18.6075496673584, "global_step": 23605, "epoch": 284} {"train_loss": -19.017213821411133, "global_step": 23606, "epoch": 284} {"train_loss": -18.629751205444336, "global_step": 23607, "epoch": 284} {"train_loss": -18.749900817871094, "global_step": 23608, "epoch": 284} {"train_loss": -18.44815444946289, "global_step": 23609, "epoch": 284} {"train_loss": -18.559818267822266, "global_step": 23610, "epoch": 284} {"train_loss": -18.125076293945312, "global_step": 23611, "epoch": 284} {"train_loss": -18.552709579467773, "global_step": 23612, "epoch": 284} {"train_loss": -18.549009323120117, "global_step": 23613, "epoch": 284} {"train_loss": -18.589704513549805, "global_step": 23614, "epoch": 284} {"train_loss": -18.644487380981445, "global_step": 23615, "epoch": 284} {"train_loss": -18.455236434936523, "global_step": 23616, "epoch": 284} {"train_loss": -18.347564697265625, "global_step": 23617, "epoch": 284} {"train_loss": -18.693212509155273, "global_step": 23618, "epoch": 284} {"train_loss": -18.52652359008789, "global_step": 23619, "epoch": 284} {"train_loss": -18.469812393188477, "global_step": 23620, "epoch": 284} {"train_loss": -18.581405639648438, "global_step": 23621, "epoch": 284} {"train_loss": -18.705322265625, "global_step": 23622, "epoch": 284} {"train_loss": -18.17989158630371, "global_step": 23623, "epoch": 284} {"train_loss": -18.70424461364746, "global_step": 23624, "epoch": 284} {"train_loss": -18.750585556030273, "global_step": 23625, "epoch": 284} {"train_loss": -18.52918815612793, "global_step": 23626, "epoch": 284} {"train_loss": -18.528573989868164, "global_step": 23627, "epoch": 284} {"train_loss": -18.66799545288086, "global_step": 23628, "epoch": 284} {"train_loss": -18.617727279663086, "global_step": 23629, "epoch": 284} {"train_loss": -18.601600646972656, "global_step": 23630, "epoch": 284} {"train_loss": -18.417739868164062, "global_step": 23631, "epoch": 284} {"train_loss": -18.540363311767578, "global_step": 23632, "epoch": 284} {"train_loss": -19.004608154296875, "global_step": 23633, "epoch": 284} {"train_loss": -18.61945915222168, "global_step": 23634, "epoch": 284} {"train_loss": -18.35944175720215, "global_step": 23635, "epoch": 284} {"train_loss": -18.84064292907715, "global_step": 23636, "epoch": 284} {"train_loss": -18.448156356811523, "global_step": 23637, "epoch": 284} {"train_loss": -18.4257869720459, "global_step": 23638, "epoch": 284} {"train_loss": -18.889726638793945, "global_step": 23639, "epoch": 284} {"train_loss": -18.46900749206543, "global_step": 23640, "epoch": 284} {"train_loss": -18.38508415222168, "global_step": 23641, "epoch": 284} {"train_loss": -19.01643180847168, "global_step": 23642, "epoch": 284} {"train_loss": -18.66433334350586, "global_step": 23643, "epoch": 284} {"train_loss": -18.6920223236084, "global_step": 23644, "epoch": 284} {"train_loss": -18.273353576660156, "global_step": 23645, "epoch": 284} {"train_loss": -18.6168155670166, "global_step": 23646, "epoch": 284} {"train_loss": -18.575801849365234, "global_step": 23647, "epoch": 284} {"train_loss": -18.595617294311523, "global_step": 23648, "epoch": 284} {"train_loss": -18.206104278564453, "global_step": 23649, "epoch": 284} {"train_loss": -18.843557357788086, "global_step": 23650, "epoch": 284} {"train_loss": -18.679340362548828, "global_step": 23651, "epoch": 284} {"train_loss": -18.529325485229492, "global_step": 23652, "epoch": 284} {"train_loss": -19.02754783630371, "global_step": 23653, "epoch": 284} {"train_loss": -18.562697100352093, "global_step": 23654, "epoch": 284, "val_loss": 6007010.0} {"train_loss": -18.353628158569336, "global_step": 23655, "epoch": 285} {"train_loss": -18.547269821166992, "global_step": 23656, "epoch": 285} {"train_loss": -18.45301628112793, "global_step": 23657, "epoch": 285} {"train_loss": -18.75983238220215, "global_step": 23658, "epoch": 285} {"train_loss": -18.511072158813477, "global_step": 23659, "epoch": 285} {"train_loss": -18.185047149658203, "global_step": 23660, "epoch": 285} {"train_loss": -18.41304588317871, "global_step": 23661, "epoch": 285} {"train_loss": -18.706939697265625, "global_step": 23662, "epoch": 285} {"train_loss": -18.728178024291992, "global_step": 23663, "epoch": 285} {"train_loss": -18.765853881835938, "global_step": 23664, "epoch": 285} {"train_loss": -18.559629440307617, "global_step": 23665, "epoch": 285} {"train_loss": -18.572296142578125, "global_step": 23666, "epoch": 285} {"train_loss": -18.427698135375977, "global_step": 23667, "epoch": 285} {"train_loss": -18.11086654663086, "global_step": 23668, "epoch": 285} {"train_loss": -18.349380493164062, "global_step": 23669, "epoch": 285} {"train_loss": -18.401535034179688, "global_step": 23670, "epoch": 285} {"train_loss": -18.696369171142578, "global_step": 23671, "epoch": 285} {"train_loss": -18.68721580505371, "global_step": 23672, "epoch": 285} {"train_loss": -18.847883224487305, "global_step": 23673, "epoch": 285} {"train_loss": -18.354780197143555, "global_step": 23674, "epoch": 285} {"train_loss": -18.23146629333496, "global_step": 23675, "epoch": 285} {"train_loss": -18.776447296142578, "global_step": 23676, "epoch": 285} {"train_loss": -18.78629493713379, "global_step": 23677, "epoch": 285} {"train_loss": -18.4908447265625, "global_step": 23678, "epoch": 285} {"train_loss": -18.782899856567383, "global_step": 23679, "epoch": 285} {"train_loss": -18.499385833740234, "global_step": 23680, "epoch": 285} {"train_loss": -18.964887619018555, "global_step": 23681, "epoch": 285} {"train_loss": -18.616548538208008, "global_step": 23682, "epoch": 285} {"train_loss": -18.903749465942383, "global_step": 23683, "epoch": 285} {"train_loss": -18.68651580810547, "global_step": 23684, "epoch": 285} {"train_loss": -18.531023025512695, "global_step": 23685, "epoch": 285} {"train_loss": -18.362573623657227, "global_step": 23686, "epoch": 285} {"train_loss": -18.780073165893555, "global_step": 23687, "epoch": 285} {"train_loss": -18.504459381103516, "global_step": 23688, "epoch": 285} {"train_loss": -18.832387924194336, "global_step": 23689, "epoch": 285} {"train_loss": -18.424835205078125, "global_step": 23690, "epoch": 285} {"train_loss": -18.93110466003418, "global_step": 23691, "epoch": 285} {"train_loss": -18.341339111328125, "global_step": 23692, "epoch": 285} {"train_loss": -18.73790740966797, "global_step": 23693, "epoch": 285} {"train_loss": -18.581134796142578, "global_step": 23694, "epoch": 285} {"train_loss": -18.732622146606445, "global_step": 23695, "epoch": 285} {"train_loss": -18.38970184326172, "global_step": 23696, "epoch": 285} {"train_loss": -18.62390899658203, "global_step": 23697, "epoch": 285} {"train_loss": -18.836700439453125, "global_step": 23698, "epoch": 285} {"train_loss": -18.62904167175293, "global_step": 23699, "epoch": 285} {"train_loss": -18.65242576599121, "global_step": 23700, "epoch": 285} {"train_loss": -18.704587936401367, "global_step": 23701, "epoch": 285} {"train_loss": -18.32480812072754, "global_step": 23702, "epoch": 285} {"train_loss": -18.658506393432617, "global_step": 23703, "epoch": 285} {"train_loss": -18.69028091430664, "global_step": 23704, "epoch": 285} {"train_loss": -18.76032066345215, "global_step": 23705, "epoch": 285} {"train_loss": -18.45685386657715, "global_step": 23706, "epoch": 285} {"train_loss": -18.309066772460938, "global_step": 23707, "epoch": 285} {"train_loss": -18.687833786010742, "global_step": 23708, "epoch": 285} {"train_loss": -18.508756637573242, "global_step": 23709, "epoch": 285} {"train_loss": -18.37896728515625, "global_step": 23710, "epoch": 285} {"train_loss": -18.628503799438477, "global_step": 23711, "epoch": 285} {"train_loss": -18.673757553100586, "global_step": 23712, "epoch": 285} {"train_loss": -18.428871154785156, "global_step": 23713, "epoch": 285} {"train_loss": -18.68280029296875, "global_step": 23714, "epoch": 285} {"train_loss": -18.121217727661133, "global_step": 23715, "epoch": 285} {"train_loss": -18.801366806030273, "global_step": 23716, "epoch": 285} {"train_loss": -18.779300689697266, "global_step": 23717, "epoch": 285} {"train_loss": -18.813236236572266, "global_step": 23718, "epoch": 285} {"train_loss": -18.428800582885742, "global_step": 23719, "epoch": 285} {"train_loss": -18.54611587524414, "global_step": 23720, "epoch": 285} {"train_loss": -18.706838607788086, "global_step": 23721, "epoch": 285} {"train_loss": -18.727323532104492, "global_step": 23722, "epoch": 285} {"train_loss": -18.802656173706055, "global_step": 23723, "epoch": 285} {"train_loss": -18.637617111206055, "global_step": 23724, "epoch": 285} {"train_loss": -18.849363327026367, "global_step": 23725, "epoch": 285} {"train_loss": -18.905029296875, "global_step": 23726, "epoch": 285} {"train_loss": -18.450342178344727, "global_step": 23727, "epoch": 285} {"train_loss": -18.493642807006836, "global_step": 23728, "epoch": 285} {"train_loss": -18.678659439086914, "global_step": 23729, "epoch": 285} {"train_loss": -18.60307502746582, "global_step": 23730, "epoch": 285} {"train_loss": -18.53975486755371, "global_step": 23731, "epoch": 285} {"train_loss": -19.10572624206543, "global_step": 23732, "epoch": 285} {"train_loss": -18.539941787719727, "global_step": 23733, "epoch": 285} {"train_loss": -18.65705680847168, "global_step": 23734, "epoch": 285} {"train_loss": -18.48383140563965, "global_step": 23735, "epoch": 285} {"train_loss": -18.65472412109375, "global_step": 23736, "epoch": 285} {"train_loss": -18.612923196999425, "global_step": 23737, "epoch": 285, "val_loss": 5953197.0} {"train_loss": -18.35552406311035, "global_step": 23738, "epoch": 286} {"train_loss": -18.575170516967773, "global_step": 23739, "epoch": 286} {"train_loss": -18.170286178588867, "global_step": 23740, "epoch": 286} {"train_loss": -18.408981323242188, "global_step": 23741, "epoch": 286} {"train_loss": -18.80951499938965, "global_step": 23742, "epoch": 286} {"train_loss": -18.322607040405273, "global_step": 23743, "epoch": 286} {"train_loss": -18.232236862182617, "global_step": 23744, "epoch": 286} {"train_loss": -18.367233276367188, "global_step": 23745, "epoch": 286} {"train_loss": -18.79498291015625, "global_step": 23746, "epoch": 286} {"train_loss": -18.466955184936523, "global_step": 23747, "epoch": 286} {"train_loss": -18.56978416442871, "global_step": 23748, "epoch": 286} {"train_loss": -18.453519821166992, "global_step": 23749, "epoch": 286} {"train_loss": -18.72013282775879, "global_step": 23750, "epoch": 286} {"train_loss": -18.539052963256836, "global_step": 23751, "epoch": 286} {"train_loss": -18.455028533935547, "global_step": 23752, "epoch": 286} {"train_loss": -18.78541374206543, "global_step": 23753, "epoch": 286} {"train_loss": -18.662900924682617, "global_step": 23754, "epoch": 286} {"train_loss": -18.609161376953125, "global_step": 23755, "epoch": 286} {"train_loss": -18.940412521362305, "global_step": 23756, "epoch": 286} {"train_loss": -18.441478729248047, "global_step": 23757, "epoch": 286} {"train_loss": -18.82588005065918, "global_step": 23758, "epoch": 286} {"train_loss": -18.949508666992188, "global_step": 23759, "epoch": 286} {"train_loss": -18.371427536010742, "global_step": 23760, "epoch": 286} {"train_loss": -18.768632888793945, "global_step": 23761, "epoch": 286} {"train_loss": -18.549192428588867, "global_step": 23762, "epoch": 286} {"train_loss": -18.725248336791992, "global_step": 23763, "epoch": 286} {"train_loss": -18.82456398010254, "global_step": 23764, "epoch": 286} {"train_loss": -18.69321060180664, "global_step": 23765, "epoch": 286} {"train_loss": -18.736743927001953, "global_step": 23766, "epoch": 286} {"train_loss": -18.558834075927734, "global_step": 23767, "epoch": 286} {"train_loss": -18.064767837524414, "global_step": 23768, "epoch": 286} {"train_loss": -18.443204879760742, "global_step": 23769, "epoch": 286} {"train_loss": -18.859905242919922, "global_step": 23770, "epoch": 286} {"train_loss": -18.319787979125977, "global_step": 23771, "epoch": 286} {"train_loss": -18.649877548217773, "global_step": 23772, "epoch": 286} {"train_loss": -18.57735252380371, "global_step": 23773, "epoch": 286} {"train_loss": -18.666929244995117, "global_step": 23774, "epoch": 286} {"train_loss": -18.55381202697754, "global_step": 23775, "epoch": 286} {"train_loss": -17.878494262695312, "global_step": 23776, "epoch": 286} {"train_loss": -18.656362533569336, "global_step": 23777, "epoch": 286} {"train_loss": -18.513280868530273, "global_step": 23778, "epoch": 286} {"train_loss": -18.407955169677734, "global_step": 23779, "epoch": 286} {"train_loss": -18.301687240600586, "global_step": 23780, "epoch": 286} {"train_loss": -18.86727523803711, "global_step": 23781, "epoch": 286} {"train_loss": -18.729354858398438, "global_step": 23782, "epoch": 286} {"train_loss": -18.579133987426758, "global_step": 23783, "epoch": 286} {"train_loss": -18.553226470947266, "global_step": 23784, "epoch": 286} {"train_loss": -18.559280395507812, "global_step": 23785, "epoch": 286} {"train_loss": -18.96500015258789, "global_step": 23786, "epoch": 286} {"train_loss": -18.506834030151367, "global_step": 23787, "epoch": 286} {"train_loss": -18.942642211914062, "global_step": 23788, "epoch": 286} {"train_loss": -18.800138473510742, "global_step": 23789, "epoch": 286} {"train_loss": -18.419116973876953, "global_step": 23790, "epoch": 286} {"train_loss": -18.73486328125, "global_step": 23791, "epoch": 286} {"train_loss": -18.683778762817383, "global_step": 23792, "epoch": 286} {"train_loss": -18.531782150268555, "global_step": 23793, "epoch": 286} {"train_loss": -18.7540225982666, "global_step": 23794, "epoch": 286} {"train_loss": -18.78406524658203, "global_step": 23795, "epoch": 286} {"train_loss": -18.907705307006836, "global_step": 23796, "epoch": 286} {"train_loss": -18.358190536499023, "global_step": 23797, "epoch": 286} {"train_loss": -18.628543853759766, "global_step": 23798, "epoch": 286} {"train_loss": -18.895523071289062, "global_step": 23799, "epoch": 286} {"train_loss": -18.443984985351562, "global_step": 23800, "epoch": 286} {"train_loss": -18.617252349853516, "global_step": 23801, "epoch": 286} {"train_loss": -18.782880783081055, "global_step": 23802, "epoch": 286} {"train_loss": -18.472007751464844, "global_step": 23803, "epoch": 286} {"train_loss": -18.4217586517334, "global_step": 23804, "epoch": 286} {"train_loss": -18.36712646484375, "global_step": 23805, "epoch": 286} {"train_loss": -18.757925033569336, "global_step": 23806, "epoch": 286} {"train_loss": -18.63437843322754, "global_step": 23807, "epoch": 286} {"train_loss": -18.707372665405273, "global_step": 23808, "epoch": 286} {"train_loss": -18.55426025390625, "global_step": 23809, "epoch": 286} {"train_loss": -18.726043701171875, "global_step": 23810, "epoch": 286} {"train_loss": -18.17487907409668, "global_step": 23811, "epoch": 286} {"train_loss": -18.705886840820312, "global_step": 23812, "epoch": 286} {"train_loss": -18.75351333618164, "global_step": 23813, "epoch": 286} {"train_loss": -18.254261016845703, "global_step": 23814, "epoch": 286} {"train_loss": -18.263341903686523, "global_step": 23815, "epoch": 286} {"train_loss": -18.79142189025879, "global_step": 23816, "epoch": 286} {"train_loss": -18.868207931518555, "global_step": 23817, "epoch": 286} {"train_loss": -18.75440788269043, "global_step": 23818, "epoch": 286} {"train_loss": -18.622346878051758, "global_step": 23819, "epoch": 286} {"train_loss": -18.570614274725855, "global_step": 23820, "epoch": 286, "val_loss": 5913212.5} {"train_loss": -18.33576011657715, "global_step": 23821, "epoch": 287} {"train_loss": -18.684581756591797, "global_step": 23822, "epoch": 287} {"train_loss": -17.996854782104492, "global_step": 23823, "epoch": 287} {"train_loss": -18.4988956451416, "global_step": 23824, "epoch": 287} {"train_loss": -18.11592674255371, "global_step": 23825, "epoch": 287} {"train_loss": -18.45060157775879, "global_step": 23826, "epoch": 287} {"train_loss": -18.56007957458496, "global_step": 23827, "epoch": 287} {"train_loss": -18.297109603881836, "global_step": 23828, "epoch": 287} {"train_loss": -18.790782928466797, "global_step": 23829, "epoch": 287} {"train_loss": -18.700345993041992, "global_step": 23830, "epoch": 287} {"train_loss": -18.822078704833984, "global_step": 23831, "epoch": 287} {"train_loss": -18.353185653686523, "global_step": 23832, "epoch": 287} {"train_loss": -18.45880699157715, "global_step": 23833, "epoch": 287} {"train_loss": -18.725555419921875, "global_step": 23834, "epoch": 287} {"train_loss": -18.683670043945312, "global_step": 23835, "epoch": 287} {"train_loss": -18.658506393432617, "global_step": 23836, "epoch": 287} {"train_loss": -18.768903732299805, "global_step": 23837, "epoch": 287} {"train_loss": -18.709375381469727, "global_step": 23838, "epoch": 287} {"train_loss": -18.53133201599121, "global_step": 23839, "epoch": 287} {"train_loss": -18.92982292175293, "global_step": 23840, "epoch": 287} {"train_loss": -18.6159725189209, "global_step": 23841, "epoch": 287} {"train_loss": -18.4480037689209, "global_step": 23842, "epoch": 287} {"train_loss": -18.781103134155273, "global_step": 23843, "epoch": 287} {"train_loss": -18.881752014160156, "global_step": 23844, "epoch": 287} {"train_loss": -18.490514755249023, "global_step": 23845, "epoch": 287} {"train_loss": -18.661975860595703, "global_step": 23846, "epoch": 287} {"train_loss": -18.7751522064209, "global_step": 23847, "epoch": 287} {"train_loss": -18.294626235961914, "global_step": 23848, "epoch": 287} {"train_loss": -18.524063110351562, "global_step": 23849, "epoch": 287} {"train_loss": -18.958593368530273, "global_step": 23850, "epoch": 287} {"train_loss": -18.637292861938477, "global_step": 23851, "epoch": 287} {"train_loss": -18.305967330932617, "global_step": 23852, "epoch": 287} {"train_loss": -19.11115837097168, "global_step": 23853, "epoch": 287} {"train_loss": -18.54486656188965, "global_step": 23854, "epoch": 287} {"train_loss": -18.96297264099121, "global_step": 23855, "epoch": 287} {"train_loss": -18.545330047607422, "global_step": 23856, "epoch": 287} {"train_loss": -18.597593307495117, "global_step": 23857, "epoch": 287} {"train_loss": -18.30202293395996, "global_step": 23858, "epoch": 287} {"train_loss": -18.728055953979492, "global_step": 23859, "epoch": 287} {"train_loss": -18.44257164001465, "global_step": 23860, "epoch": 287} {"train_loss": -18.62177848815918, "global_step": 23861, "epoch": 287} {"train_loss": -18.728561401367188, "global_step": 23862, "epoch": 287} {"train_loss": -18.475873947143555, "global_step": 23863, "epoch": 287} {"train_loss": -18.391101837158203, "global_step": 23864, "epoch": 287} {"train_loss": -18.551727294921875, "global_step": 23865, "epoch": 287} {"train_loss": -18.88575553894043, "global_step": 23866, "epoch": 287} {"train_loss": -18.621877670288086, "global_step": 23867, "epoch": 287} {"train_loss": -18.54947853088379, "global_step": 23868, "epoch": 287} {"train_loss": -18.519920349121094, "global_step": 23869, "epoch": 287} {"train_loss": -18.81451416015625, "global_step": 23870, "epoch": 287} {"train_loss": -18.47958755493164, "global_step": 23871, "epoch": 287} {"train_loss": -18.66778564453125, "global_step": 23872, "epoch": 287} {"train_loss": -18.247312545776367, "global_step": 23873, "epoch": 287} {"train_loss": -18.399606704711914, "global_step": 23874, "epoch": 287} {"train_loss": -18.492202758789062, "global_step": 23875, "epoch": 287} {"train_loss": -18.492406845092773, "global_step": 23876, "epoch": 287} {"train_loss": -18.65126609802246, "global_step": 23877, "epoch": 287} {"train_loss": -18.433185577392578, "global_step": 23878, "epoch": 287} {"train_loss": -18.85445213317871, "global_step": 23879, "epoch": 287} {"train_loss": -18.68604850769043, "global_step": 23880, "epoch": 287} {"train_loss": -18.687397003173828, "global_step": 23881, "epoch": 287} {"train_loss": -18.34072494506836, "global_step": 23882, "epoch": 287} {"train_loss": -19.03826332092285, "global_step": 23883, "epoch": 287} {"train_loss": -18.674697875976562, "global_step": 23884, "epoch": 287} {"train_loss": -18.65762710571289, "global_step": 23885, "epoch": 287} {"train_loss": -18.476070404052734, "global_step": 23886, "epoch": 287} {"train_loss": -18.8061466217041, "global_step": 23887, "epoch": 287} {"train_loss": -18.736576080322266, "global_step": 23888, "epoch": 287} {"train_loss": -18.902158737182617, "global_step": 23889, "epoch": 287} {"train_loss": -18.806467056274414, "global_step": 23890, "epoch": 287} {"train_loss": -18.402006149291992, "global_step": 23891, "epoch": 287} {"train_loss": -18.55607032775879, "global_step": 23892, "epoch": 287} {"train_loss": -18.42702293395996, "global_step": 23893, "epoch": 287} {"train_loss": -18.556941986083984, "global_step": 23894, "epoch": 287} {"train_loss": -18.413881301879883, "global_step": 23895, "epoch": 287} {"train_loss": -18.129653930664062, "global_step": 23896, "epoch": 287} {"train_loss": -18.430744171142578, "global_step": 23897, "epoch": 287} {"train_loss": -18.487987518310547, "global_step": 23898, "epoch": 287} {"train_loss": -18.659162521362305, "global_step": 23899, "epoch": 287} {"train_loss": -18.44035530090332, "global_step": 23900, "epoch": 287} {"train_loss": -18.486459732055664, "global_step": 23901, "epoch": 287} {"train_loss": -18.544275283813477, "global_step": 23902, "epoch": 287} {"train_loss": -18.587776321962654, "global_step": 23903, "epoch": 287, "val_loss": 6065673.0} {"train_loss": -17.74907112121582, "global_step": 23904, "epoch": 288} {"train_loss": -18.078842163085938, "global_step": 23905, "epoch": 288} {"train_loss": -17.94196128845215, "global_step": 23906, "epoch": 288} {"train_loss": -17.994260787963867, "global_step": 23907, "epoch": 288} {"train_loss": -18.166046142578125, "global_step": 23908, "epoch": 288} {"train_loss": -18.05198097229004, "global_step": 23909, "epoch": 288} {"train_loss": -18.358028411865234, "global_step": 23910, "epoch": 288} {"train_loss": -18.52381706237793, "global_step": 23911, "epoch": 288} {"train_loss": -18.217626571655273, "global_step": 23912, "epoch": 288} {"train_loss": -18.507247924804688, "global_step": 23913, "epoch": 288} {"train_loss": -18.2305850982666, "global_step": 23914, "epoch": 288} {"train_loss": -17.87432098388672, "global_step": 23915, "epoch": 288} {"train_loss": -18.760730743408203, "global_step": 23916, "epoch": 288} {"train_loss": -18.096782684326172, "global_step": 23917, "epoch": 288} {"train_loss": -18.179182052612305, "global_step": 23918, "epoch": 288} {"train_loss": -18.46788215637207, "global_step": 23919, "epoch": 288} {"train_loss": -18.267847061157227, "global_step": 23920, "epoch": 288} {"train_loss": -18.373401641845703, "global_step": 23921, "epoch": 288} {"train_loss": -18.599937438964844, "global_step": 23922, "epoch": 288} {"train_loss": -18.7795467376709, "global_step": 23923, "epoch": 288} {"train_loss": -18.81501579284668, "global_step": 23924, "epoch": 288} {"train_loss": -18.582122802734375, "global_step": 23925, "epoch": 288} {"train_loss": -18.4981689453125, "global_step": 23926, "epoch": 288} {"train_loss": -18.608360290527344, "global_step": 23927, "epoch": 288} {"train_loss": -18.587194442749023, "global_step": 23928, "epoch": 288} {"train_loss": -18.803787231445312, "global_step": 23929, "epoch": 288} {"train_loss": -18.561561584472656, "global_step": 23930, "epoch": 288} {"train_loss": -18.726057052612305, "global_step": 23931, "epoch": 288} {"train_loss": -18.50258445739746, "global_step": 23932, "epoch": 288} {"train_loss": -18.4917049407959, "global_step": 23933, "epoch": 288} {"train_loss": -18.362958908081055, "global_step": 23934, "epoch": 288} {"train_loss": -18.446664810180664, "global_step": 23935, "epoch": 288} {"train_loss": -18.603240966796875, "global_step": 23936, "epoch": 288} {"train_loss": -18.442121505737305, "global_step": 23937, "epoch": 288} {"train_loss": -18.639734268188477, "global_step": 23938, "epoch": 288} {"train_loss": -18.576932907104492, "global_step": 23939, "epoch": 288} {"train_loss": -18.608566284179688, "global_step": 23940, "epoch": 288} {"train_loss": -18.448453903198242, "global_step": 23941, "epoch": 288} {"train_loss": -18.374141693115234, "global_step": 23942, "epoch": 288} {"train_loss": -18.6497802734375, "global_step": 23943, "epoch": 288} {"train_loss": -18.449024200439453, "global_step": 23944, "epoch": 288} {"train_loss": -18.594501495361328, "global_step": 23945, "epoch": 288} {"train_loss": -18.403390884399414, "global_step": 23946, "epoch": 288} {"train_loss": -18.63727569580078, "global_step": 23947, "epoch": 288} {"train_loss": -18.669681549072266, "global_step": 23948, "epoch": 288} {"train_loss": -18.695404052734375, "global_step": 23949, "epoch": 288} {"train_loss": -18.621196746826172, "global_step": 23950, "epoch": 288} {"train_loss": -18.33216667175293, "global_step": 23951, "epoch": 288} {"train_loss": -18.522048950195312, "global_step": 23952, "epoch": 288} {"train_loss": -18.51486587524414, "global_step": 23953, "epoch": 288} {"train_loss": -18.784435272216797, "global_step": 23954, "epoch": 288} {"train_loss": -18.592100143432617, "global_step": 23955, "epoch": 288} {"train_loss": -18.870731353759766, "global_step": 23956, "epoch": 288} {"train_loss": -18.282590866088867, "global_step": 23957, "epoch": 288} {"train_loss": -18.684978485107422, "global_step": 23958, "epoch": 288} {"train_loss": -18.608680725097656, "global_step": 23959, "epoch": 288} {"train_loss": -18.56203269958496, "global_step": 23960, "epoch": 288} {"train_loss": -18.706029891967773, "global_step": 23961, "epoch": 288} {"train_loss": -18.726938247680664, "global_step": 23962, "epoch": 288} {"train_loss": -18.636594772338867, "global_step": 23963, "epoch": 288} {"train_loss": -18.70538330078125, "global_step": 23964, "epoch": 288} {"train_loss": -18.573820114135742, "global_step": 23965, "epoch": 288} {"train_loss": -18.985519409179688, "global_step": 23966, "epoch": 288} {"train_loss": -19.026174545288086, "global_step": 23967, "epoch": 288} {"train_loss": -18.47918701171875, "global_step": 23968, "epoch": 288} {"train_loss": -19.082571029663086, "global_step": 23969, "epoch": 288} {"train_loss": -18.317564010620117, "global_step": 23970, "epoch": 288} {"train_loss": -18.830345153808594, "global_step": 23971, "epoch": 288} {"train_loss": -18.5496826171875, "global_step": 23972, "epoch": 288} {"train_loss": -18.721891403198242, "global_step": 23973, "epoch": 288} {"train_loss": -19.028409957885742, "global_step": 23974, "epoch": 288} {"train_loss": -18.923803329467773, "global_step": 23975, "epoch": 288} {"train_loss": -18.893413543701172, "global_step": 23976, "epoch": 288} {"train_loss": -18.812580108642578, "global_step": 23977, "epoch": 288} {"train_loss": -18.909881591796875, "global_step": 23978, "epoch": 288} {"train_loss": -18.939218521118164, "global_step": 23979, "epoch": 288} {"train_loss": -18.764795303344727, "global_step": 23980, "epoch": 288} {"train_loss": -18.729276657104492, "global_step": 23981, "epoch": 288} {"train_loss": -18.368436813354492, "global_step": 23982, "epoch": 288} {"train_loss": -18.222883224487305, "global_step": 23983, "epoch": 288} {"train_loss": -18.506206512451172, "global_step": 23984, "epoch": 288} {"train_loss": -18.455684661865234, "global_step": 23985, "epoch": 288} {"train_loss": -18.571660329060382, "global_step": 23986, "epoch": 288, "val_loss": 6045341.0} {"train_loss": -18.416820526123047, "global_step": 23987, "epoch": 289} {"train_loss": -18.822101593017578, "global_step": 23988, "epoch": 289} {"train_loss": -18.732107162475586, "global_step": 23989, "epoch": 289} {"train_loss": -18.23708724975586, "global_step": 23990, "epoch": 289} {"train_loss": -19.003150939941406, "global_step": 23991, "epoch": 289} {"train_loss": -18.70046043395996, "global_step": 23992, "epoch": 289} {"train_loss": -18.786821365356445, "global_step": 23993, "epoch": 289} {"train_loss": -18.4780330657959, "global_step": 23994, "epoch": 289} {"train_loss": -18.473669052124023, "global_step": 23995, "epoch": 289} {"train_loss": -18.451452255249023, "global_step": 23996, "epoch": 289} {"train_loss": -18.367395401000977, "global_step": 23997, "epoch": 289} {"train_loss": -18.182355880737305, "global_step": 23998, "epoch": 289} {"train_loss": -18.638029098510742, "global_step": 23999, "epoch": 289} {"train_loss": -18.504318237304688, "global_step": 24000, "epoch": 289} {"train_loss": -18.412227630615234, "global_step": 24001, "epoch": 289} {"train_loss": -18.466711044311523, "global_step": 24002, "epoch": 289} {"train_loss": -18.403715133666992, "global_step": 24003, "epoch": 289} {"train_loss": -18.784225463867188, "global_step": 24004, "epoch": 289} {"train_loss": -18.71443748474121, "global_step": 24005, "epoch": 289} {"train_loss": -18.701303482055664, "global_step": 24006, "epoch": 289} {"train_loss": -18.761035919189453, "global_step": 24007, "epoch": 289} {"train_loss": -18.378036499023438, "global_step": 24008, "epoch": 289} {"train_loss": -18.80133056640625, "global_step": 24009, "epoch": 289} {"train_loss": -18.135610580444336, "global_step": 24010, "epoch": 289} {"train_loss": -18.42682456970215, "global_step": 24011, "epoch": 289} {"train_loss": -18.512128829956055, "global_step": 24012, "epoch": 289} {"train_loss": -18.909011840820312, "global_step": 24013, "epoch": 289} {"train_loss": -18.762441635131836, "global_step": 24014, "epoch": 289} {"train_loss": -18.39698600769043, "global_step": 24015, "epoch": 289} {"train_loss": -18.585844039916992, "global_step": 24016, "epoch": 289} {"train_loss": -18.614013671875, "global_step": 24017, "epoch": 289} {"train_loss": -18.81363296508789, "global_step": 24018, "epoch": 289} {"train_loss": -18.634462356567383, "global_step": 24019, "epoch": 289} {"train_loss": -18.40595054626465, "global_step": 24020, "epoch": 289} {"train_loss": -18.365556716918945, "global_step": 24021, "epoch": 289} {"train_loss": -18.631742477416992, "global_step": 24022, "epoch": 289} {"train_loss": -18.651992797851562, "global_step": 24023, "epoch": 289} {"train_loss": -18.474714279174805, "global_step": 24024, "epoch": 289} {"train_loss": -18.650440216064453, "global_step": 24025, "epoch": 289} {"train_loss": -18.4423828125, "global_step": 24026, "epoch": 289} {"train_loss": -18.64410400390625, "global_step": 24027, "epoch": 289} {"train_loss": -18.635906219482422, "global_step": 24028, "epoch": 289} {"train_loss": -18.44843101501465, "global_step": 24029, "epoch": 289} {"train_loss": -18.686906814575195, "global_step": 24030, "epoch": 289} {"train_loss": -18.505374908447266, "global_step": 24031, "epoch": 289} {"train_loss": -19.03144645690918, "global_step": 24032, "epoch": 289} {"train_loss": -18.753995895385742, "global_step": 24033, "epoch": 289} {"train_loss": -18.48476791381836, "global_step": 24034, "epoch": 289} {"train_loss": -18.38728904724121, "global_step": 24035, "epoch": 289} {"train_loss": -18.3269100189209, "global_step": 24036, "epoch": 289} {"train_loss": -18.94758415222168, "global_step": 24037, "epoch": 289} {"train_loss": -18.759523391723633, "global_step": 24038, "epoch": 289} {"train_loss": -18.718523025512695, "global_step": 24039, "epoch": 289} {"train_loss": -18.698896408081055, "global_step": 24040, "epoch": 289} {"train_loss": -18.72940444946289, "global_step": 24041, "epoch": 289} {"train_loss": -18.450443267822266, "global_step": 24042, "epoch": 289} {"train_loss": -18.948820114135742, "global_step": 24043, "epoch": 289} {"train_loss": -18.249597549438477, "global_step": 24044, "epoch": 289} {"train_loss": -18.40331268310547, "global_step": 24045, "epoch": 289} {"train_loss": -18.51718521118164, "global_step": 24046, "epoch": 289} {"train_loss": -18.891225814819336, "global_step": 24047, "epoch": 289} {"train_loss": -18.7962703704834, "global_step": 24048, "epoch": 289} {"train_loss": -18.829233169555664, "global_step": 24049, "epoch": 289} {"train_loss": -18.7137393951416, "global_step": 24050, "epoch": 289} {"train_loss": -18.6330623626709, "global_step": 24051, "epoch": 289} {"train_loss": -18.609426498413086, "global_step": 24052, "epoch": 289} {"train_loss": -18.62842559814453, "global_step": 24053, "epoch": 289} {"train_loss": -18.659366607666016, "global_step": 24054, "epoch": 289} {"train_loss": -18.670743942260742, "global_step": 24055, "epoch": 289} {"train_loss": -18.93305778503418, "global_step": 24056, "epoch": 289} {"train_loss": -18.83394432067871, "global_step": 24057, "epoch": 289} {"train_loss": -18.861513137817383, "global_step": 24058, "epoch": 289} {"train_loss": -18.836936950683594, "global_step": 24059, "epoch": 289} {"train_loss": -18.807096481323242, "global_step": 24060, "epoch": 289} {"train_loss": -18.46880340576172, "global_step": 24061, "epoch": 289} {"train_loss": -18.582935333251953, "global_step": 24062, "epoch": 289} {"train_loss": -18.721410751342773, "global_step": 24063, "epoch": 289} {"train_loss": -18.5030574798584, "global_step": 24064, "epoch": 289} {"train_loss": -18.658649444580078, "global_step": 24065, "epoch": 289} {"train_loss": -18.712968826293945, "global_step": 24066, "epoch": 289} {"train_loss": -18.899566650390625, "global_step": 24067, "epoch": 289} {"train_loss": -18.555898666381836, "global_step": 24068, "epoch": 289} {"train_loss": -18.610360708581396, "global_step": 24069, "epoch": 289, "val_loss": 5951842.5} {"train_loss": -18.347543716430664, "global_step": 24070, "epoch": 290} {"train_loss": -18.669769287109375, "global_step": 24071, "epoch": 290} {"train_loss": -18.313812255859375, "global_step": 24072, "epoch": 290} {"train_loss": -18.52705955505371, "global_step": 24073, "epoch": 290} {"train_loss": -17.71875, "global_step": 24074, "epoch": 290} {"train_loss": -18.308603286743164, "global_step": 24075, "epoch": 290} {"train_loss": -18.54774284362793, "global_step": 24076, "epoch": 290} {"train_loss": -18.77523422241211, "global_step": 24077, "epoch": 290} {"train_loss": -18.132917404174805, "global_step": 24078, "epoch": 290} {"train_loss": -18.483219146728516, "global_step": 24079, "epoch": 290} {"train_loss": -18.380613327026367, "global_step": 24080, "epoch": 290} {"train_loss": -18.269800186157227, "global_step": 24081, "epoch": 290} {"train_loss": -18.55788230895996, "global_step": 24082, "epoch": 290} {"train_loss": -18.44870376586914, "global_step": 24083, "epoch": 290} {"train_loss": -18.486371994018555, "global_step": 24084, "epoch": 290} {"train_loss": -18.692523956298828, "global_step": 24085, "epoch": 290} {"train_loss": -18.777204513549805, "global_step": 24086, "epoch": 290} {"train_loss": -18.68465232849121, "global_step": 24087, "epoch": 290} {"train_loss": -18.521474838256836, "global_step": 24088, "epoch": 290} {"train_loss": -18.724491119384766, "global_step": 24089, "epoch": 290} {"train_loss": -18.825428009033203, "global_step": 24090, "epoch": 290} {"train_loss": -18.215576171875, "global_step": 24091, "epoch": 290} {"train_loss": -18.392704010009766, "global_step": 24092, "epoch": 290} {"train_loss": -18.5228271484375, "global_step": 24093, "epoch": 290} {"train_loss": -18.664472579956055, "global_step": 24094, "epoch": 290} {"train_loss": -18.528657913208008, "global_step": 24095, "epoch": 290} {"train_loss": -18.364892959594727, "global_step": 24096, "epoch": 290} {"train_loss": -18.68423843383789, "global_step": 24097, "epoch": 290} {"train_loss": -18.391721725463867, "global_step": 24098, "epoch": 290} {"train_loss": -18.914016723632812, "global_step": 24099, "epoch": 290} {"train_loss": -18.646533966064453, "global_step": 24100, "epoch": 290} {"train_loss": -19.197057723999023, "global_step": 24101, "epoch": 290} {"train_loss": -18.807518005371094, "global_step": 24102, "epoch": 290} {"train_loss": -18.372848510742188, "global_step": 24103, "epoch": 290} {"train_loss": -18.915149688720703, "global_step": 24104, "epoch": 290} {"train_loss": -18.67836570739746, "global_step": 24105, "epoch": 290} {"train_loss": -18.51458740234375, "global_step": 24106, "epoch": 290} {"train_loss": -18.441162109375, "global_step": 24107, "epoch": 290} {"train_loss": -19.027936935424805, "global_step": 24108, "epoch": 290} {"train_loss": -18.234634399414062, "global_step": 24109, "epoch": 290} {"train_loss": -18.730405807495117, "global_step": 24110, "epoch": 290} {"train_loss": -18.58416748046875, "global_step": 24111, "epoch": 290} {"train_loss": -18.540021896362305, "global_step": 24112, "epoch": 290} {"train_loss": -19.160676956176758, "global_step": 24113, "epoch": 290} {"train_loss": -18.75400161743164, "global_step": 24114, "epoch": 290} {"train_loss": -18.641775131225586, "global_step": 24115, "epoch": 290} {"train_loss": -18.353546142578125, "global_step": 24116, "epoch": 290} {"train_loss": -18.642379760742188, "global_step": 24117, "epoch": 290} {"train_loss": -18.747289657592773, "global_step": 24118, "epoch": 290} {"train_loss": -18.793655395507812, "global_step": 24119, "epoch": 290} {"train_loss": -18.47416877746582, "global_step": 24120, "epoch": 290} {"train_loss": -18.539020538330078, "global_step": 24121, "epoch": 290} {"train_loss": -18.759389877319336, "global_step": 24122, "epoch": 290} {"train_loss": -18.88935089111328, "global_step": 24123, "epoch": 290} {"train_loss": -18.490934371948242, "global_step": 24124, "epoch": 290} {"train_loss": -18.71973419189453, "global_step": 24125, "epoch": 290} {"train_loss": -18.709375381469727, "global_step": 24126, "epoch": 290} {"train_loss": -18.22452163696289, "global_step": 24127, "epoch": 290} {"train_loss": -18.810604095458984, "global_step": 24128, "epoch": 290} {"train_loss": -18.55107307434082, "global_step": 24129, "epoch": 290} {"train_loss": -18.496231079101562, "global_step": 24130, "epoch": 290} {"train_loss": -18.73099708557129, "global_step": 24131, "epoch": 290} {"train_loss": -18.663742065429688, "global_step": 24132, "epoch": 290} {"train_loss": -18.906265258789062, "global_step": 24133, "epoch": 290} {"train_loss": -18.73703956604004, "global_step": 24134, "epoch": 290} {"train_loss": -18.7076416015625, "global_step": 24135, "epoch": 290} {"train_loss": -18.442752838134766, "global_step": 24136, "epoch": 290} {"train_loss": -18.72430992126465, "global_step": 24137, "epoch": 290} {"train_loss": -18.675283432006836, "global_step": 24138, "epoch": 290} {"train_loss": -18.662572860717773, "global_step": 24139, "epoch": 290} {"train_loss": -18.73573875427246, "global_step": 24140, "epoch": 290} {"train_loss": -18.432851791381836, "global_step": 24141, "epoch": 290} {"train_loss": -18.73914909362793, "global_step": 24142, "epoch": 290} {"train_loss": -18.821569442749023, "global_step": 24143, "epoch": 290} {"train_loss": -18.782352447509766, "global_step": 24144, "epoch": 290} {"train_loss": -18.520828247070312, "global_step": 24145, "epoch": 290} {"train_loss": -18.750951766967773, "global_step": 24146, "epoch": 290} {"train_loss": -18.519943237304688, "global_step": 24147, "epoch": 290} {"train_loss": -18.49352264404297, "global_step": 24148, "epoch": 290} {"train_loss": -18.737834930419922, "global_step": 24149, "epoch": 290} {"train_loss": -18.3625431060791, "global_step": 24150, "epoch": 290} {"train_loss": -18.663822174072266, "global_step": 24151, "epoch": 290} {"train_loss": -18.62411869003112, "global_step": 24152, "epoch": 290, "val_loss": 5947207.0} {"train_loss": -18.227436065673828, "global_step": 24153, "epoch": 291} {"train_loss": -18.29770278930664, "global_step": 24154, "epoch": 291} {"train_loss": -18.44938087463379, "global_step": 24155, "epoch": 291} {"train_loss": -17.95521354675293, "global_step": 24156, "epoch": 291} {"train_loss": -18.68714714050293, "global_step": 24157, "epoch": 291} {"train_loss": -18.660037994384766, "global_step": 24158, "epoch": 291} {"train_loss": -18.550857543945312, "global_step": 24159, "epoch": 291} {"train_loss": -18.692218780517578, "global_step": 24160, "epoch": 291} {"train_loss": -18.84442710876465, "global_step": 24161, "epoch": 291} {"train_loss": -18.66242790222168, "global_step": 24162, "epoch": 291} {"train_loss": -18.704483032226562, "global_step": 24163, "epoch": 291} {"train_loss": -18.343873977661133, "global_step": 24164, "epoch": 291} {"train_loss": -18.592845916748047, "global_step": 24165, "epoch": 291} {"train_loss": -18.570566177368164, "global_step": 24166, "epoch": 291} {"train_loss": -18.456377029418945, "global_step": 24167, "epoch": 291} {"train_loss": -18.8416748046875, "global_step": 24168, "epoch": 291} {"train_loss": -18.53487777709961, "global_step": 24169, "epoch": 291} {"train_loss": -18.663822174072266, "global_step": 24170, "epoch": 291} {"train_loss": -18.517776489257812, "global_step": 24171, "epoch": 291} {"train_loss": -18.567758560180664, "global_step": 24172, "epoch": 291} {"train_loss": -18.779579162597656, "global_step": 24173, "epoch": 291} {"train_loss": -18.959909439086914, "global_step": 24174, "epoch": 291} {"train_loss": -18.30984878540039, "global_step": 24175, "epoch": 291} {"train_loss": -19.141563415527344, "global_step": 24176, "epoch": 291} {"train_loss": -18.20113182067871, "global_step": 24177, "epoch": 291} {"train_loss": -18.74812889099121, "global_step": 24178, "epoch": 291} {"train_loss": -18.601837158203125, "global_step": 24179, "epoch": 291} {"train_loss": -18.569534301757812, "global_step": 24180, "epoch": 291} {"train_loss": -19.07276725769043, "global_step": 24181, "epoch": 291} {"train_loss": -18.647846221923828, "global_step": 24182, "epoch": 291} {"train_loss": -18.440919876098633, "global_step": 24183, "epoch": 291} {"train_loss": -18.746578216552734, "global_step": 24184, "epoch": 291} {"train_loss": -18.160995483398438, "global_step": 24185, "epoch": 291} {"train_loss": -18.56460952758789, "global_step": 24186, "epoch": 291} {"train_loss": -18.273235321044922, "global_step": 24187, "epoch": 291} {"train_loss": -18.732709884643555, "global_step": 24188, "epoch": 291} {"train_loss": -18.607519149780273, "global_step": 24189, "epoch": 291} {"train_loss": -18.90242576599121, "global_step": 24190, "epoch": 291} {"train_loss": -18.645254135131836, "global_step": 24191, "epoch": 291} {"train_loss": -18.575315475463867, "global_step": 24192, "epoch": 291} {"train_loss": -18.6700382232666, "global_step": 24193, "epoch": 291} {"train_loss": -18.548038482666016, "global_step": 24194, "epoch": 291} {"train_loss": -18.681142807006836, "global_step": 24195, "epoch": 291} {"train_loss": -18.623783111572266, "global_step": 24196, "epoch": 291} {"train_loss": -18.494131088256836, "global_step": 24197, "epoch": 291} {"train_loss": -18.764074325561523, "global_step": 24198, "epoch": 291} {"train_loss": -19.032888412475586, "global_step": 24199, "epoch": 291} {"train_loss": -18.66336441040039, "global_step": 24200, "epoch": 291} {"train_loss": -18.734411239624023, "global_step": 24201, "epoch": 291} {"train_loss": -18.858280181884766, "global_step": 24202, "epoch": 291} {"train_loss": -18.646894454956055, "global_step": 24203, "epoch": 291} {"train_loss": -18.636371612548828, "global_step": 24204, "epoch": 291} {"train_loss": -18.80084228515625, "global_step": 24205, "epoch": 291} {"train_loss": -18.353822708129883, "global_step": 24206, "epoch": 291} {"train_loss": -18.73296546936035, "global_step": 24207, "epoch": 291} {"train_loss": -18.79914665222168, "global_step": 24208, "epoch": 291} {"train_loss": -18.34296417236328, "global_step": 24209, "epoch": 291} {"train_loss": -18.91839599609375, "global_step": 24210, "epoch": 291} {"train_loss": -18.730802536010742, "global_step": 24211, "epoch": 291} {"train_loss": -18.759925842285156, "global_step": 24212, "epoch": 291} {"train_loss": -18.693817138671875, "global_step": 24213, "epoch": 291} {"train_loss": -18.530689239501953, "global_step": 24214, "epoch": 291} {"train_loss": -19.062734603881836, "global_step": 24215, "epoch": 291} {"train_loss": -18.787216186523438, "global_step": 24216, "epoch": 291} {"train_loss": -18.943418502807617, "global_step": 24217, "epoch": 291} {"train_loss": -18.48341941833496, "global_step": 24218, "epoch": 291} {"train_loss": -18.670766830444336, "global_step": 24219, "epoch": 291} {"train_loss": -18.521047592163086, "global_step": 24220, "epoch": 291} {"train_loss": -18.352323532104492, "global_step": 24221, "epoch": 291} {"train_loss": -18.77857780456543, "global_step": 24222, "epoch": 291} {"train_loss": -18.726947784423828, "global_step": 24223, "epoch": 291} {"train_loss": -18.401962280273438, "global_step": 24224, "epoch": 291} {"train_loss": -18.579130172729492, "global_step": 24225, "epoch": 291} {"train_loss": -18.397388458251953, "global_step": 24226, "epoch": 291} {"train_loss": -18.783309936523438, "global_step": 24227, "epoch": 291} {"train_loss": -18.678497314453125, "global_step": 24228, "epoch": 291} {"train_loss": -18.951419830322266, "global_step": 24229, "epoch": 291} {"train_loss": -18.491056442260742, "global_step": 24230, "epoch": 291} {"train_loss": -18.841039657592773, "global_step": 24231, "epoch": 291} {"train_loss": -18.59982681274414, "global_step": 24232, "epoch": 291} {"train_loss": -18.439855575561523, "global_step": 24233, "epoch": 291} {"train_loss": -18.70559310913086, "global_step": 24234, "epoch": 291} {"train_loss": -18.637852358530804, "global_step": 24235, "epoch": 291, "val_loss": 5980245.5} {"train_loss": -18.50516128540039, "global_step": 24236, "epoch": 292} {"train_loss": -18.400556564331055, "global_step": 24237, "epoch": 292} {"train_loss": -18.128957748413086, "global_step": 24238, "epoch": 292} {"train_loss": -18.656217575073242, "global_step": 24239, "epoch": 292} {"train_loss": -18.447040557861328, "global_step": 24240, "epoch": 292} {"train_loss": -18.461578369140625, "global_step": 24241, "epoch": 292} {"train_loss": -18.184253692626953, "global_step": 24242, "epoch": 292} {"train_loss": -18.81694793701172, "global_step": 24243, "epoch": 292} {"train_loss": -18.441646575927734, "global_step": 24244, "epoch": 292} {"train_loss": -18.41144371032715, "global_step": 24245, "epoch": 292} {"train_loss": -18.822370529174805, "global_step": 24246, "epoch": 292} {"train_loss": -18.74970817565918, "global_step": 24247, "epoch": 292} {"train_loss": -18.615293502807617, "global_step": 24248, "epoch": 292} {"train_loss": -18.617408752441406, "global_step": 24249, "epoch": 292} {"train_loss": -18.682218551635742, "global_step": 24250, "epoch": 292} {"train_loss": -18.39963150024414, "global_step": 24251, "epoch": 292} {"train_loss": -18.56378746032715, "global_step": 24252, "epoch": 292} {"train_loss": -18.6490535736084, "global_step": 24253, "epoch": 292} {"train_loss": -18.674985885620117, "global_step": 24254, "epoch": 292} {"train_loss": -18.73138427734375, "global_step": 24255, "epoch": 292} {"train_loss": -18.757415771484375, "global_step": 24256, "epoch": 292} {"train_loss": -18.69329261779785, "global_step": 24257, "epoch": 292} {"train_loss": -18.149646759033203, "global_step": 24258, "epoch": 292} {"train_loss": -18.5997257232666, "global_step": 24259, "epoch": 292} {"train_loss": -18.41061782836914, "global_step": 24260, "epoch": 292} {"train_loss": -18.60382080078125, "global_step": 24261, "epoch": 292} {"train_loss": -18.578638076782227, "global_step": 24262, "epoch": 292} {"train_loss": -18.63496971130371, "global_step": 24263, "epoch": 292} {"train_loss": -18.697494506835938, "global_step": 24264, "epoch": 292} {"train_loss": -18.716161727905273, "global_step": 24265, "epoch": 292} {"train_loss": -18.616086959838867, "global_step": 24266, "epoch": 292} {"train_loss": -18.997365951538086, "global_step": 24267, "epoch": 292} {"train_loss": -18.400659561157227, "global_step": 24268, "epoch": 292} {"train_loss": -18.13975715637207, "global_step": 24269, "epoch": 292} {"train_loss": -18.4341983795166, "global_step": 24270, "epoch": 292} {"train_loss": -18.20577049255371, "global_step": 24271, "epoch": 292} {"train_loss": -18.874296188354492, "global_step": 24272, "epoch": 292} {"train_loss": -18.44796371459961, "global_step": 24273, "epoch": 292} {"train_loss": -18.721040725708008, "global_step": 24274, "epoch": 292} {"train_loss": -18.916906356811523, "global_step": 24275, "epoch": 292} {"train_loss": -18.651762008666992, "global_step": 24276, "epoch": 292} {"train_loss": -18.490209579467773, "global_step": 24277, "epoch": 292} {"train_loss": -18.754854202270508, "global_step": 24278, "epoch": 292} {"train_loss": -19.01919937133789, "global_step": 24279, "epoch": 292} {"train_loss": -18.668041229248047, "global_step": 24280, "epoch": 292} {"train_loss": -18.618444442749023, "global_step": 24281, "epoch": 292} {"train_loss": -18.342111587524414, "global_step": 24282, "epoch": 292} {"train_loss": -18.909130096435547, "global_step": 24283, "epoch": 292} {"train_loss": -18.41619110107422, "global_step": 24284, "epoch": 292} {"train_loss": -18.294769287109375, "global_step": 24285, "epoch": 292} {"train_loss": -18.8714656829834, "global_step": 24286, "epoch": 292} {"train_loss": -18.887861251831055, "global_step": 24287, "epoch": 292} {"train_loss": -18.487049102783203, "global_step": 24288, "epoch": 292} {"train_loss": -18.53853416442871, "global_step": 24289, "epoch": 292} {"train_loss": -18.750423431396484, "global_step": 24290, "epoch": 292} {"train_loss": -18.994741439819336, "global_step": 24291, "epoch": 292} {"train_loss": -18.322696685791016, "global_step": 24292, "epoch": 292} {"train_loss": -18.967561721801758, "global_step": 24293, "epoch": 292} {"train_loss": -18.222211837768555, "global_step": 24294, "epoch": 292} {"train_loss": -18.69536590576172, "global_step": 24295, "epoch": 292} {"train_loss": -18.51242446899414, "global_step": 24296, "epoch": 292} {"train_loss": -18.65943717956543, "global_step": 24297, "epoch": 292} {"train_loss": -18.988082885742188, "global_step": 24298, "epoch": 292} {"train_loss": -18.826406478881836, "global_step": 24299, "epoch": 292} {"train_loss": -18.266510009765625, "global_step": 24300, "epoch": 292} {"train_loss": -18.73284912109375, "global_step": 24301, "epoch": 292} {"train_loss": -18.469772338867188, "global_step": 24302, "epoch": 292} {"train_loss": -18.625150680541992, "global_step": 24303, "epoch": 292} {"train_loss": -18.26106834411621, "global_step": 24304, "epoch": 292} {"train_loss": -19.0687313079834, "global_step": 24305, "epoch": 292} {"train_loss": -18.88079071044922, "global_step": 24306, "epoch": 292} {"train_loss": -18.517959594726562, "global_step": 24307, "epoch": 292} {"train_loss": -18.855749130249023, "global_step": 24308, "epoch": 292} {"train_loss": -18.471799850463867, "global_step": 24309, "epoch": 292} {"train_loss": -18.610734939575195, "global_step": 24310, "epoch": 292} {"train_loss": -18.113895416259766, "global_step": 24311, "epoch": 292} {"train_loss": -18.671598434448242, "global_step": 24312, "epoch": 292} {"train_loss": -18.562963485717773, "global_step": 24313, "epoch": 292} {"train_loss": -18.76113510131836, "global_step": 24314, "epoch": 292} {"train_loss": -18.660940170288086, "global_step": 24315, "epoch": 292} {"train_loss": -18.451797485351562, "global_step": 24316, "epoch": 292} {"train_loss": -18.573150634765625, "global_step": 24317, "epoch": 292} {"train_loss": -18.5760887789439, "global_step": 24318, "epoch": 292, "val_loss": 6040168.5} {"train_loss": -18.771085739135742, "global_step": 24319, "epoch": 293} {"train_loss": -18.503978729248047, "global_step": 24320, "epoch": 293} {"train_loss": -18.55820655822754, "global_step": 24321, "epoch": 293} {"train_loss": -18.87729263305664, "global_step": 24322, "epoch": 293} {"train_loss": -18.718294143676758, "global_step": 24323, "epoch": 293} {"train_loss": -18.663122177124023, "global_step": 24324, "epoch": 293} {"train_loss": -18.594465255737305, "global_step": 24325, "epoch": 293} {"train_loss": -18.75806999206543, "global_step": 24326, "epoch": 293} {"train_loss": -18.476490020751953, "global_step": 24327, "epoch": 293} {"train_loss": -18.590017318725586, "global_step": 24328, "epoch": 293} {"train_loss": -18.61513328552246, "global_step": 24329, "epoch": 293} {"train_loss": -18.287988662719727, "global_step": 24330, "epoch": 293} {"train_loss": -18.33732032775879, "global_step": 24331, "epoch": 293} {"train_loss": -18.392385482788086, "global_step": 24332, "epoch": 293} {"train_loss": -18.772750854492188, "global_step": 24333, "epoch": 293} {"train_loss": -18.59291648864746, "global_step": 24334, "epoch": 293} {"train_loss": -18.781957626342773, "global_step": 24335, "epoch": 293} {"train_loss": -18.767656326293945, "global_step": 24336, "epoch": 293} {"train_loss": -18.5986328125, "global_step": 24337, "epoch": 293} {"train_loss": -18.744369506835938, "global_step": 24338, "epoch": 293} {"train_loss": -18.728567123413086, "global_step": 24339, "epoch": 293} {"train_loss": -18.854358673095703, "global_step": 24340, "epoch": 293} {"train_loss": -18.65765380859375, "global_step": 24341, "epoch": 293} {"train_loss": -18.790817260742188, "global_step": 24342, "epoch": 293} {"train_loss": -18.73249626159668, "global_step": 24343, "epoch": 293} {"train_loss": -18.841819763183594, "global_step": 24344, "epoch": 293} {"train_loss": -18.882375717163086, "global_step": 24345, "epoch": 293} {"train_loss": -18.78974723815918, "global_step": 24346, "epoch": 293} {"train_loss": -18.737735748291016, "global_step": 24347, "epoch": 293} {"train_loss": -18.80214500427246, "global_step": 24348, "epoch": 293} {"train_loss": -18.738086700439453, "global_step": 24349, "epoch": 293} {"train_loss": -18.957351684570312, "global_step": 24350, "epoch": 293} {"train_loss": -18.5041446685791, "global_step": 24351, "epoch": 293} {"train_loss": -18.58443260192871, "global_step": 24352, "epoch": 293} {"train_loss": -18.728702545166016, "global_step": 24353, "epoch": 293} {"train_loss": -19.027114868164062, "global_step": 24354, "epoch": 293} {"train_loss": -18.40433120727539, "global_step": 24355, "epoch": 293} {"train_loss": -18.268375396728516, "global_step": 24356, "epoch": 293} {"train_loss": -18.507917404174805, "global_step": 24357, "epoch": 293} {"train_loss": -18.078290939331055, "global_step": 24358, "epoch": 293} {"train_loss": -18.586627960205078, "global_step": 24359, "epoch": 293} {"train_loss": -18.556119918823242, "global_step": 24360, "epoch": 293} {"train_loss": -18.536184310913086, "global_step": 24361, "epoch": 293} {"train_loss": -18.79184341430664, "global_step": 24362, "epoch": 293} {"train_loss": -18.63714027404785, "global_step": 24363, "epoch": 293} {"train_loss": -18.970304489135742, "global_step": 24364, "epoch": 293} {"train_loss": -18.56565284729004, "global_step": 24365, "epoch": 293} {"train_loss": -18.640478134155273, "global_step": 24366, "epoch": 293} {"train_loss": -18.232341766357422, "global_step": 24367, "epoch": 293} {"train_loss": -18.68439483642578, "global_step": 24368, "epoch": 293} {"train_loss": -18.683887481689453, "global_step": 24369, "epoch": 293} {"train_loss": -18.728103637695312, "global_step": 24370, "epoch": 293} {"train_loss": -18.85590171813965, "global_step": 24371, "epoch": 293} {"train_loss": -18.8435115814209, "global_step": 24372, "epoch": 293} {"train_loss": -18.95066261291504, "global_step": 24373, "epoch": 293} {"train_loss": -18.688121795654297, "global_step": 24374, "epoch": 293} {"train_loss": -18.66713523864746, "global_step": 24375, "epoch": 293} {"train_loss": -18.85280418395996, "global_step": 24376, "epoch": 293} {"train_loss": -18.619009017944336, "global_step": 24377, "epoch": 293} {"train_loss": -18.517343521118164, "global_step": 24378, "epoch": 293} {"train_loss": -18.447952270507812, "global_step": 24379, "epoch": 293} {"train_loss": -18.886564254760742, "global_step": 24380, "epoch": 293} {"train_loss": -18.648252487182617, "global_step": 24381, "epoch": 293} {"train_loss": -18.504987716674805, "global_step": 24382, "epoch": 293} {"train_loss": -18.69174575805664, "global_step": 24383, "epoch": 293} {"train_loss": -18.568634033203125, "global_step": 24384, "epoch": 293} {"train_loss": -18.494647979736328, "global_step": 24385, "epoch": 293} {"train_loss": -18.441957473754883, "global_step": 24386, "epoch": 293} {"train_loss": -18.92006492614746, "global_step": 24387, "epoch": 293} {"train_loss": -18.983928680419922, "global_step": 24388, "epoch": 293} {"train_loss": -18.63813591003418, "global_step": 24389, "epoch": 293} {"train_loss": -18.363689422607422, "global_step": 24390, "epoch": 293} {"train_loss": -18.096479415893555, "global_step": 24391, "epoch": 293} {"train_loss": -18.280624389648438, "global_step": 24392, "epoch": 293} {"train_loss": -18.54891014099121, "global_step": 24393, "epoch": 293} {"train_loss": -18.865455627441406, "global_step": 24394, "epoch": 293} {"train_loss": -18.5943660736084, "global_step": 24395, "epoch": 293} {"train_loss": -18.766523361206055, "global_step": 24396, "epoch": 293} {"train_loss": -18.61684226989746, "global_step": 24397, "epoch": 293} {"train_loss": -18.530385971069336, "global_step": 24398, "epoch": 293} {"train_loss": -18.81290626525879, "global_step": 24399, "epoch": 293} {"train_loss": -18.355695724487305, "global_step": 24400, "epoch": 293} {"train_loss": -18.670750261789344, "global_step": 24401, "epoch": 293, "val_loss": 5943458.5} {"train_loss": -18.388063430786133, "global_step": 24402, "epoch": 294} {"train_loss": -18.66246795654297, "global_step": 24403, "epoch": 294} {"train_loss": -18.741079330444336, "global_step": 24404, "epoch": 294} {"train_loss": -18.62113380432129, "global_step": 24405, "epoch": 294} {"train_loss": -18.82614517211914, "global_step": 24406, "epoch": 294} {"train_loss": -18.502384185791016, "global_step": 24407, "epoch": 294} {"train_loss": -18.080392837524414, "global_step": 24408, "epoch": 294} {"train_loss": -18.419389724731445, "global_step": 24409, "epoch": 294} {"train_loss": -18.49688148498535, "global_step": 24410, "epoch": 294} {"train_loss": -18.76712989807129, "global_step": 24411, "epoch": 294} {"train_loss": -18.76166534423828, "global_step": 24412, "epoch": 294} {"train_loss": -18.677030563354492, "global_step": 24413, "epoch": 294} {"train_loss": -18.554580688476562, "global_step": 24414, "epoch": 294} {"train_loss": -18.803375244140625, "global_step": 24415, "epoch": 294} {"train_loss": -18.675846099853516, "global_step": 24416, "epoch": 294} {"train_loss": -18.728910446166992, "global_step": 24417, "epoch": 294} {"train_loss": -18.57876968383789, "global_step": 24418, "epoch": 294} {"train_loss": -18.8640193939209, "global_step": 24419, "epoch": 294} {"train_loss": -18.98280143737793, "global_step": 24420, "epoch": 294} {"train_loss": -18.69540023803711, "global_step": 24421, "epoch": 294} {"train_loss": -18.663867950439453, "global_step": 24422, "epoch": 294} {"train_loss": -18.310640335083008, "global_step": 24423, "epoch": 294} {"train_loss": -19.107040405273438, "global_step": 24424, "epoch": 294} {"train_loss": -18.829879760742188, "global_step": 24425, "epoch": 294} {"train_loss": -18.674962997436523, "global_step": 24426, "epoch": 294} {"train_loss": -18.612577438354492, "global_step": 24427, "epoch": 294} {"train_loss": -18.884641647338867, "global_step": 24428, "epoch": 294} {"train_loss": -18.456634521484375, "global_step": 24429, "epoch": 294} {"train_loss": -18.224308013916016, "global_step": 24430, "epoch": 294} {"train_loss": -18.657062530517578, "global_step": 24431, "epoch": 294} {"train_loss": -18.35103988647461, "global_step": 24432, "epoch": 294} {"train_loss": -18.550668716430664, "global_step": 24433, "epoch": 294} {"train_loss": -19.011220932006836, "global_step": 24434, "epoch": 294} {"train_loss": -18.862211227416992, "global_step": 24435, "epoch": 294} {"train_loss": -18.779708862304688, "global_step": 24436, "epoch": 294} {"train_loss": -18.3598690032959, "global_step": 24437, "epoch": 294} {"train_loss": -18.843503952026367, "global_step": 24438, "epoch": 294} {"train_loss": -18.477956771850586, "global_step": 24439, "epoch": 294} {"train_loss": -18.41383171081543, "global_step": 24440, "epoch": 294} {"train_loss": -18.629270553588867, "global_step": 24441, "epoch": 294} {"train_loss": -18.652738571166992, "global_step": 24442, "epoch": 294} {"train_loss": -18.2853946685791, "global_step": 24443, "epoch": 294} {"train_loss": -19.062118530273438, "global_step": 24444, "epoch": 294} {"train_loss": -19.04140281677246, "global_step": 24445, "epoch": 294} {"train_loss": -18.854843139648438, "global_step": 24446, "epoch": 294} {"train_loss": -18.678424835205078, "global_step": 24447, "epoch": 294} {"train_loss": -18.257436752319336, "global_step": 24448, "epoch": 294} {"train_loss": -18.6262264251709, "global_step": 24449, "epoch": 294} {"train_loss": -18.530750274658203, "global_step": 24450, "epoch": 294} {"train_loss": -18.526330947875977, "global_step": 24451, "epoch": 294} {"train_loss": -18.971715927124023, "global_step": 24452, "epoch": 294} {"train_loss": -18.927526473999023, "global_step": 24453, "epoch": 294} {"train_loss": -18.84147071838379, "global_step": 24454, "epoch": 294} {"train_loss": -18.62672233581543, "global_step": 24455, "epoch": 294} {"train_loss": -18.26445960998535, "global_step": 24456, "epoch": 294} {"train_loss": -18.372861862182617, "global_step": 24457, "epoch": 294} {"train_loss": -18.510435104370117, "global_step": 24458, "epoch": 294} {"train_loss": -18.786985397338867, "global_step": 24459, "epoch": 294} {"train_loss": -18.7121639251709, "global_step": 24460, "epoch": 294} {"train_loss": -18.858617782592773, "global_step": 24461, "epoch": 294} {"train_loss": -18.79694938659668, "global_step": 24462, "epoch": 294} {"train_loss": -18.76523208618164, "global_step": 24463, "epoch": 294} {"train_loss": -18.261545181274414, "global_step": 24464, "epoch": 294} {"train_loss": -18.92058753967285, "global_step": 24465, "epoch": 294} {"train_loss": -18.76173973083496, "global_step": 24466, "epoch": 294} {"train_loss": -18.914352416992188, "global_step": 24467, "epoch": 294} {"train_loss": -18.942398071289062, "global_step": 24468, "epoch": 294} {"train_loss": -18.86493492126465, "global_step": 24469, "epoch": 294} {"train_loss": -18.36261558532715, "global_step": 24470, "epoch": 294} {"train_loss": -18.696308135986328, "global_step": 24471, "epoch": 294} {"train_loss": -18.08780288696289, "global_step": 24472, "epoch": 294} {"train_loss": -18.563825607299805, "global_step": 24473, "epoch": 294} {"train_loss": -18.383451461791992, "global_step": 24474, "epoch": 294} {"train_loss": -18.16139793395996, "global_step": 24475, "epoch": 294} {"train_loss": -18.820096969604492, "global_step": 24476, "epoch": 294} {"train_loss": -18.551450729370117, "global_step": 24477, "epoch": 294} {"train_loss": -18.492759704589844, "global_step": 24478, "epoch": 294} {"train_loss": -18.185937881469727, "global_step": 24479, "epoch": 294} {"train_loss": -18.509443283081055, "global_step": 24480, "epoch": 294} {"train_loss": -18.5331974029541, "global_step": 24481, "epoch": 294} {"train_loss": -18.354806900024414, "global_step": 24482, "epoch": 294} {"train_loss": -18.328176498413086, "global_step": 24483, "epoch": 294} {"train_loss": -18.60790742161762, "global_step": 24484, "epoch": 294, "val_loss": 5986907.5} {"train_loss": -18.391345977783203, "global_step": 24485, "epoch": 295} {"train_loss": -18.70132827758789, "global_step": 24486, "epoch": 295} {"train_loss": -18.717411041259766, "global_step": 24487, "epoch": 295} {"train_loss": -18.51742935180664, "global_step": 24488, "epoch": 295} {"train_loss": -18.472370147705078, "global_step": 24489, "epoch": 295} {"train_loss": -18.52497673034668, "global_step": 24490, "epoch": 295} {"train_loss": -18.454227447509766, "global_step": 24491, "epoch": 295} {"train_loss": -18.80787467956543, "global_step": 24492, "epoch": 295} {"train_loss": -18.565275192260742, "global_step": 24493, "epoch": 295} {"train_loss": -18.49507713317871, "global_step": 24494, "epoch": 295} {"train_loss": -18.597370147705078, "global_step": 24495, "epoch": 295} {"train_loss": -18.408679962158203, "global_step": 24496, "epoch": 295} {"train_loss": -18.957889556884766, "global_step": 24497, "epoch": 295} {"train_loss": -18.838632583618164, "global_step": 24498, "epoch": 295} {"train_loss": -18.558883666992188, "global_step": 24499, "epoch": 295} {"train_loss": -18.561199188232422, "global_step": 24500, "epoch": 295} {"train_loss": -18.57233238220215, "global_step": 24501, "epoch": 295} {"train_loss": -18.46864891052246, "global_step": 24502, "epoch": 295} {"train_loss": -18.5518741607666, "global_step": 24503, "epoch": 295} {"train_loss": -18.526819229125977, "global_step": 24504, "epoch": 295} {"train_loss": -18.71743392944336, "global_step": 24505, "epoch": 295} {"train_loss": -18.911212921142578, "global_step": 24506, "epoch": 295} {"train_loss": -18.917285919189453, "global_step": 24507, "epoch": 295} {"train_loss": -18.592533111572266, "global_step": 24508, "epoch": 295} {"train_loss": -18.821805953979492, "global_step": 24509, "epoch": 295} {"train_loss": -18.825992584228516, "global_step": 24510, "epoch": 295} {"train_loss": -18.63981056213379, "global_step": 24511, "epoch": 295} {"train_loss": -18.657896041870117, "global_step": 24512, "epoch": 295} {"train_loss": -18.568904876708984, "global_step": 24513, "epoch": 295} {"train_loss": -18.621280670166016, "global_step": 24514, "epoch": 295} {"train_loss": -18.538894653320312, "global_step": 24515, "epoch": 295} {"train_loss": -18.8253173828125, "global_step": 24516, "epoch": 295} {"train_loss": -18.522279739379883, "global_step": 24517, "epoch": 295} {"train_loss": -18.791879653930664, "global_step": 24518, "epoch": 295} {"train_loss": -18.932682037353516, "global_step": 24519, "epoch": 295} {"train_loss": -18.565948486328125, "global_step": 24520, "epoch": 295} {"train_loss": -18.739805221557617, "global_step": 24521, "epoch": 295} {"train_loss": -18.42679786682129, "global_step": 24522, "epoch": 295} {"train_loss": -18.69327735900879, "global_step": 24523, "epoch": 295} {"train_loss": -18.762662887573242, "global_step": 24524, "epoch": 295} {"train_loss": -18.823694229125977, "global_step": 24525, "epoch": 295} {"train_loss": -18.621183395385742, "global_step": 24526, "epoch": 295} {"train_loss": -18.757841110229492, "global_step": 24527, "epoch": 295} {"train_loss": -18.642410278320312, "global_step": 24528, "epoch": 295} {"train_loss": -18.800411224365234, "global_step": 24529, "epoch": 295} {"train_loss": -18.74333381652832, "global_step": 24530, "epoch": 295} {"train_loss": -18.44791603088379, "global_step": 24531, "epoch": 295} {"train_loss": -18.667591094970703, "global_step": 24532, "epoch": 295} {"train_loss": -18.410627365112305, "global_step": 24533, "epoch": 295} {"train_loss": -18.62627410888672, "global_step": 24534, "epoch": 295} {"train_loss": -18.46000099182129, "global_step": 24535, "epoch": 295} {"train_loss": -19.102005004882812, "global_step": 24536, "epoch": 295} {"train_loss": -18.70691680908203, "global_step": 24537, "epoch": 295} {"train_loss": -18.54196548461914, "global_step": 24538, "epoch": 295} {"train_loss": -18.711416244506836, "global_step": 24539, "epoch": 295} {"train_loss": -18.444780349731445, "global_step": 24540, "epoch": 295} {"train_loss": -18.447372436523438, "global_step": 24541, "epoch": 295} {"train_loss": -19.143535614013672, "global_step": 24542, "epoch": 295} {"train_loss": -18.747684478759766, "global_step": 24543, "epoch": 295} {"train_loss": -18.734922409057617, "global_step": 24544, "epoch": 295} {"train_loss": -18.26449966430664, "global_step": 24545, "epoch": 295} {"train_loss": -18.478565216064453, "global_step": 24546, "epoch": 295} {"train_loss": -18.847349166870117, "global_step": 24547, "epoch": 295} {"train_loss": -18.66957664489746, "global_step": 24548, "epoch": 295} {"train_loss": -18.84193992614746, "global_step": 24549, "epoch": 295} {"train_loss": -18.412214279174805, "global_step": 24550, "epoch": 295} {"train_loss": -18.557775497436523, "global_step": 24551, "epoch": 295} {"train_loss": -18.760929107666016, "global_step": 24552, "epoch": 295} {"train_loss": -18.920896530151367, "global_step": 24553, "epoch": 295} {"train_loss": -18.84084129333496, "global_step": 24554, "epoch": 295} {"train_loss": -18.458433151245117, "global_step": 24555, "epoch": 295} {"train_loss": -18.295312881469727, "global_step": 24556, "epoch": 295} {"train_loss": -18.698514938354492, "global_step": 24557, "epoch": 295} {"train_loss": -18.882572174072266, "global_step": 24558, "epoch": 295} {"train_loss": -18.83330726623535, "global_step": 24559, "epoch": 295} {"train_loss": -18.566869735717773, "global_step": 24560, "epoch": 295} {"train_loss": -18.70381736755371, "global_step": 24561, "epoch": 295} {"train_loss": -18.687789916992188, "global_step": 24562, "epoch": 295} {"train_loss": -18.636688232421875, "global_step": 24563, "epoch": 295} {"train_loss": -18.68616485595703, "global_step": 24564, "epoch": 295} {"train_loss": -18.686511993408203, "global_step": 24565, "epoch": 295} {"train_loss": -18.611791610717773, "global_step": 24566, "epoch": 295} {"train_loss": -18.65057464967291, "global_step": 24567, "epoch": 295, "val_loss": 5948876.5} {"train_loss": -18.5314998626709, "global_step": 24568, "epoch": 296} {"train_loss": -18.509077072143555, "global_step": 24569, "epoch": 296} {"train_loss": -18.905324935913086, "global_step": 24570, "epoch": 296} {"train_loss": -18.583616256713867, "global_step": 24571, "epoch": 296} {"train_loss": -18.500286102294922, "global_step": 24572, "epoch": 296} {"train_loss": -18.284915924072266, "global_step": 24573, "epoch": 296} {"train_loss": -18.60345458984375, "global_step": 24574, "epoch": 296} {"train_loss": -18.51812744140625, "global_step": 24575, "epoch": 296} {"train_loss": -18.3904972076416, "global_step": 24576, "epoch": 296} {"train_loss": -18.41607666015625, "global_step": 24577, "epoch": 296} {"train_loss": -18.603185653686523, "global_step": 24578, "epoch": 296} {"train_loss": -18.33147621154785, "global_step": 24579, "epoch": 296} {"train_loss": -18.46538543701172, "global_step": 24580, "epoch": 296} {"train_loss": -18.721370697021484, "global_step": 24581, "epoch": 296} {"train_loss": -18.633575439453125, "global_step": 24582, "epoch": 296} {"train_loss": -18.82811737060547, "global_step": 24583, "epoch": 296} {"train_loss": -18.338571548461914, "global_step": 24584, "epoch": 296} {"train_loss": -18.72319984436035, "global_step": 24585, "epoch": 296} {"train_loss": -18.492462158203125, "global_step": 24586, "epoch": 296} {"train_loss": -18.5529727935791, "global_step": 24587, "epoch": 296} {"train_loss": -18.531280517578125, "global_step": 24588, "epoch": 296} {"train_loss": -18.74407386779785, "global_step": 24589, "epoch": 296} {"train_loss": -18.340242385864258, "global_step": 24590, "epoch": 296} {"train_loss": -19.005422592163086, "global_step": 24591, "epoch": 296} {"train_loss": -18.437116622924805, "global_step": 24592, "epoch": 296} {"train_loss": -18.725072860717773, "global_step": 24593, "epoch": 296} {"train_loss": -18.816221237182617, "global_step": 24594, "epoch": 296} {"train_loss": -18.503446578979492, "global_step": 24595, "epoch": 296} {"train_loss": -18.76140022277832, "global_step": 24596, "epoch": 296} {"train_loss": -18.714807510375977, "global_step": 24597, "epoch": 296} {"train_loss": -18.46886444091797, "global_step": 24598, "epoch": 296} {"train_loss": -18.51555633544922, "global_step": 24599, "epoch": 296} {"train_loss": -18.549840927124023, "global_step": 24600, "epoch": 296} {"train_loss": -18.74612808227539, "global_step": 24601, "epoch": 296} {"train_loss": -18.540475845336914, "global_step": 24602, "epoch": 296} {"train_loss": -18.667682647705078, "global_step": 24603, "epoch": 296} {"train_loss": -18.89362907409668, "global_step": 24604, "epoch": 296} {"train_loss": -18.70306968688965, "global_step": 24605, "epoch": 296} {"train_loss": -19.207294464111328, "global_step": 24606, "epoch": 296} {"train_loss": -18.59562110900879, "global_step": 24607, "epoch": 296} {"train_loss": -18.677820205688477, "global_step": 24608, "epoch": 296} {"train_loss": -18.999067306518555, "global_step": 24609, "epoch": 296} {"train_loss": -18.264598846435547, "global_step": 24610, "epoch": 296} {"train_loss": -18.797101974487305, "global_step": 24611, "epoch": 296} {"train_loss": -18.635862350463867, "global_step": 24612, "epoch": 296} {"train_loss": -18.31732177734375, "global_step": 24613, "epoch": 296} {"train_loss": -18.79292869567871, "global_step": 24614, "epoch": 296} {"train_loss": -18.76108741760254, "global_step": 24615, "epoch": 296} {"train_loss": -18.609899520874023, "global_step": 24616, "epoch": 296} {"train_loss": -18.829792022705078, "global_step": 24617, "epoch": 296} {"train_loss": -18.47903823852539, "global_step": 24618, "epoch": 296} {"train_loss": -18.932554244995117, "global_step": 24619, "epoch": 296} {"train_loss": -18.474477767944336, "global_step": 24620, "epoch": 296} {"train_loss": -18.659276962280273, "global_step": 24621, "epoch": 296} {"train_loss": -18.712085723876953, "global_step": 24622, "epoch": 296} {"train_loss": -18.653583526611328, "global_step": 24623, "epoch": 296} {"train_loss": -18.585369110107422, "global_step": 24624, "epoch": 296} {"train_loss": -18.806615829467773, "global_step": 24625, "epoch": 296} {"train_loss": -18.826162338256836, "global_step": 24626, "epoch": 296} {"train_loss": -18.617816925048828, "global_step": 24627, "epoch": 296} {"train_loss": -18.629562377929688, "global_step": 24628, "epoch": 296} {"train_loss": -18.79633140563965, "global_step": 24629, "epoch": 296} {"train_loss": -18.722274780273438, "global_step": 24630, "epoch": 296} {"train_loss": -18.853233337402344, "global_step": 24631, "epoch": 296} {"train_loss": -18.661245346069336, "global_step": 24632, "epoch": 296} {"train_loss": -18.453798294067383, "global_step": 24633, "epoch": 296} {"train_loss": -18.52446174621582, "global_step": 24634, "epoch": 296} {"train_loss": -18.778736114501953, "global_step": 24635, "epoch": 296} {"train_loss": -18.840158462524414, "global_step": 24636, "epoch": 296} {"train_loss": -18.28559684753418, "global_step": 24637, "epoch": 296} {"train_loss": -18.927350997924805, "global_step": 24638, "epoch": 296} {"train_loss": -19.05596923828125, "global_step": 24639, "epoch": 296} {"train_loss": -18.844858169555664, "global_step": 24640, "epoch": 296} {"train_loss": -18.491727828979492, "global_step": 24641, "epoch": 296} {"train_loss": -18.749073028564453, "global_step": 24642, "epoch": 296} {"train_loss": -18.983068466186523, "global_step": 24643, "epoch": 296} {"train_loss": -18.859487533569336, "global_step": 24644, "epoch": 296} {"train_loss": -18.356016159057617, "global_step": 24645, "epoch": 296} {"train_loss": -18.564456939697266, "global_step": 24646, "epoch": 296} {"train_loss": -19.04197883605957, "global_step": 24647, "epoch": 296} {"train_loss": -18.585622787475586, "global_step": 24648, "epoch": 296} {"train_loss": -18.70722007751465, "global_step": 24649, "epoch": 296} {"train_loss": -18.653541610901613, "global_step": 24650, "epoch": 296, "val_loss": 5947837.5} {"train_loss": -18.501218795776367, "global_step": 24651, "epoch": 297} {"train_loss": -18.567096710205078, "global_step": 24652, "epoch": 297} {"train_loss": -18.573806762695312, "global_step": 24653, "epoch": 297} {"train_loss": -18.44916343688965, "global_step": 24654, "epoch": 297} {"train_loss": -18.707950592041016, "global_step": 24655, "epoch": 297} {"train_loss": -18.653274536132812, "global_step": 24656, "epoch": 297} {"train_loss": -18.24916648864746, "global_step": 24657, "epoch": 297} {"train_loss": -18.83290672302246, "global_step": 24658, "epoch": 297} {"train_loss": -18.492298126220703, "global_step": 24659, "epoch": 297} {"train_loss": -18.54788589477539, "global_step": 24660, "epoch": 297} {"train_loss": -18.61264991760254, "global_step": 24661, "epoch": 297} {"train_loss": -18.62404441833496, "global_step": 24662, "epoch": 297} {"train_loss": -18.973896026611328, "global_step": 24663, "epoch": 297} {"train_loss": -18.203052520751953, "global_step": 24664, "epoch": 297} {"train_loss": -18.709976196289062, "global_step": 24665, "epoch": 297} {"train_loss": -18.580734252929688, "global_step": 24666, "epoch": 297} {"train_loss": -18.40822410583496, "global_step": 24667, "epoch": 297} {"train_loss": -18.53729820251465, "global_step": 24668, "epoch": 297} {"train_loss": -18.578886032104492, "global_step": 24669, "epoch": 297} {"train_loss": -18.65471839904785, "global_step": 24670, "epoch": 297} {"train_loss": -18.655414581298828, "global_step": 24671, "epoch": 297} {"train_loss": -18.24030113220215, "global_step": 24672, "epoch": 297} {"train_loss": -18.685117721557617, "global_step": 24673, "epoch": 297} {"train_loss": -18.41400146484375, "global_step": 24674, "epoch": 297} {"train_loss": -18.465925216674805, "global_step": 24675, "epoch": 297} {"train_loss": -18.84299659729004, "global_step": 24676, "epoch": 297} {"train_loss": -19.112897872924805, "global_step": 24677, "epoch": 297} {"train_loss": -18.968341827392578, "global_step": 24678, "epoch": 297} {"train_loss": -18.43951988220215, "global_step": 24679, "epoch": 297} {"train_loss": -18.67078971862793, "global_step": 24680, "epoch": 297} {"train_loss": -18.862165451049805, "global_step": 24681, "epoch": 297} {"train_loss": -18.814359664916992, "global_step": 24682, "epoch": 297} {"train_loss": -18.52101707458496, "global_step": 24683, "epoch": 297} {"train_loss": -18.891010284423828, "global_step": 24684, "epoch": 297} {"train_loss": -18.84092140197754, "global_step": 24685, "epoch": 297} {"train_loss": -18.493741989135742, "global_step": 24686, "epoch": 297} {"train_loss": -18.543004989624023, "global_step": 24687, "epoch": 297} {"train_loss": -18.70441246032715, "global_step": 24688, "epoch": 297} {"train_loss": -18.72199821472168, "global_step": 24689, "epoch": 297} {"train_loss": -18.44243812561035, "global_step": 24690, "epoch": 297} {"train_loss": -18.70263671875, "global_step": 24691, "epoch": 297} {"train_loss": -18.712820053100586, "global_step": 24692, "epoch": 297} {"train_loss": -18.625696182250977, "global_step": 24693, "epoch": 297} {"train_loss": -18.572683334350586, "global_step": 24694, "epoch": 297} {"train_loss": -18.244577407836914, "global_step": 24695, "epoch": 297} {"train_loss": -18.583942413330078, "global_step": 24696, "epoch": 297} {"train_loss": -18.791748046875, "global_step": 24697, "epoch": 297} {"train_loss": -18.748640060424805, "global_step": 24698, "epoch": 297} {"train_loss": -18.698171615600586, "global_step": 24699, "epoch": 297} {"train_loss": -18.860355377197266, "global_step": 24700, "epoch": 297} {"train_loss": -18.74541664123535, "global_step": 24701, "epoch": 297} {"train_loss": -18.90667152404785, "global_step": 24702, "epoch": 297} {"train_loss": -18.672367095947266, "global_step": 24703, "epoch": 297} {"train_loss": -18.561054229736328, "global_step": 24704, "epoch": 297} {"train_loss": -18.080556869506836, "global_step": 24705, "epoch": 297} {"train_loss": -18.755496978759766, "global_step": 24706, "epoch": 297} {"train_loss": -18.8347225189209, "global_step": 24707, "epoch": 297} {"train_loss": -18.8601131439209, "global_step": 24708, "epoch": 297} {"train_loss": -18.59761619567871, "global_step": 24709, "epoch": 297} {"train_loss": -18.653669357299805, "global_step": 24710, "epoch": 297} {"train_loss": -18.13578987121582, "global_step": 24711, "epoch": 297} {"train_loss": -18.612369537353516, "global_step": 24712, "epoch": 297} {"train_loss": -18.539871215820312, "global_step": 24713, "epoch": 297} {"train_loss": -18.716663360595703, "global_step": 24714, "epoch": 297} {"train_loss": -18.55758285522461, "global_step": 24715, "epoch": 297} {"train_loss": -18.713573455810547, "global_step": 24716, "epoch": 297} {"train_loss": -18.754728317260742, "global_step": 24717, "epoch": 297} {"train_loss": -19.132780075073242, "global_step": 24718, "epoch": 297} {"train_loss": -18.772432327270508, "global_step": 24719, "epoch": 297} {"train_loss": -18.660175323486328, "global_step": 24720, "epoch": 297} {"train_loss": -18.577072143554688, "global_step": 24721, "epoch": 297} {"train_loss": -18.786636352539062, "global_step": 24722, "epoch": 297} {"train_loss": -18.831884384155273, "global_step": 24723, "epoch": 297} {"train_loss": -18.615970611572266, "global_step": 24724, "epoch": 297} {"train_loss": -18.82546043395996, "global_step": 24725, "epoch": 297} {"train_loss": -18.68513298034668, "global_step": 24726, "epoch": 297} {"train_loss": -18.52303695678711, "global_step": 24727, "epoch": 297} {"train_loss": -18.227603912353516, "global_step": 24728, "epoch": 297} {"train_loss": -18.63761329650879, "global_step": 24729, "epoch": 297} {"train_loss": -18.748023986816406, "global_step": 24730, "epoch": 297} {"train_loss": -18.927215576171875, "global_step": 24731, "epoch": 297} {"train_loss": -18.916885375976562, "global_step": 24732, "epoch": 297} {"train_loss": -18.66075428422675, "global_step": 24733, "epoch": 297, "val_loss": 6037393.5} {"train_loss": -18.628040313720703, "global_step": 24734, "epoch": 298} {"train_loss": -18.626264572143555, "global_step": 24735, "epoch": 298} {"train_loss": -18.379934310913086, "global_step": 24736, "epoch": 298} {"train_loss": -18.501937866210938, "global_step": 24737, "epoch": 298} {"train_loss": -18.88550567626953, "global_step": 24738, "epoch": 298} {"train_loss": -18.379852294921875, "global_step": 24739, "epoch": 298} {"train_loss": -18.510496139526367, "global_step": 24740, "epoch": 298} {"train_loss": -18.470840454101562, "global_step": 24741, "epoch": 298} {"train_loss": -18.948673248291016, "global_step": 24742, "epoch": 298} {"train_loss": -18.367963790893555, "global_step": 24743, "epoch": 298} {"train_loss": -18.905475616455078, "global_step": 24744, "epoch": 298} {"train_loss": -18.219404220581055, "global_step": 24745, "epoch": 298} {"train_loss": -18.568204879760742, "global_step": 24746, "epoch": 298} {"train_loss": -18.685302734375, "global_step": 24747, "epoch": 298} {"train_loss": -18.43568229675293, "global_step": 24748, "epoch": 298} {"train_loss": -18.325546264648438, "global_step": 24749, "epoch": 298} {"train_loss": -18.760940551757812, "global_step": 24750, "epoch": 298} {"train_loss": -18.45928382873535, "global_step": 24751, "epoch": 298} {"train_loss": -18.530988693237305, "global_step": 24752, "epoch": 298} {"train_loss": -18.262361526489258, "global_step": 24753, "epoch": 298} {"train_loss": -18.4621524810791, "global_step": 24754, "epoch": 298} {"train_loss": -18.680654525756836, "global_step": 24755, "epoch": 298} {"train_loss": -18.592939376831055, "global_step": 24756, "epoch": 298} {"train_loss": -18.782644271850586, "global_step": 24757, "epoch": 298} {"train_loss": -18.816434860229492, "global_step": 24758, "epoch": 298} {"train_loss": -18.924850463867188, "global_step": 24759, "epoch": 298} {"train_loss": -18.67147445678711, "global_step": 24760, "epoch": 298} {"train_loss": -18.357271194458008, "global_step": 24761, "epoch": 298} {"train_loss": -18.88484001159668, "global_step": 24762, "epoch": 298} {"train_loss": -18.82704734802246, "global_step": 24763, "epoch": 298} {"train_loss": -18.883960723876953, "global_step": 24764, "epoch": 298} {"train_loss": -18.83148193359375, "global_step": 24765, "epoch": 298} {"train_loss": -18.743885040283203, "global_step": 24766, "epoch": 298} {"train_loss": -18.701324462890625, "global_step": 24767, "epoch": 298} {"train_loss": -18.855451583862305, "global_step": 24768, "epoch": 298} {"train_loss": -18.703588485717773, "global_step": 24769, "epoch": 298} {"train_loss": -18.3785400390625, "global_step": 24770, "epoch": 298} {"train_loss": -18.506296157836914, "global_step": 24771, "epoch": 298} {"train_loss": -18.530195236206055, "global_step": 24772, "epoch": 298} {"train_loss": -18.507556915283203, "global_step": 24773, "epoch": 298} {"train_loss": -18.836055755615234, "global_step": 24774, "epoch": 298} {"train_loss": -19.16189956665039, "global_step": 24775, "epoch": 298} {"train_loss": -18.604333877563477, "global_step": 24776, "epoch": 298} {"train_loss": -18.6400146484375, "global_step": 24777, "epoch": 298} {"train_loss": -18.66412925720215, "global_step": 24778, "epoch": 298} {"train_loss": -18.317655563354492, "global_step": 24779, "epoch": 298} {"train_loss": -18.89249610900879, "global_step": 24780, "epoch": 298} {"train_loss": -18.742095947265625, "global_step": 24781, "epoch": 298} {"train_loss": -19.030569076538086, "global_step": 24782, "epoch": 298} {"train_loss": -18.630455017089844, "global_step": 24783, "epoch": 298} {"train_loss": -18.653915405273438, "global_step": 24784, "epoch": 298} {"train_loss": -18.779382705688477, "global_step": 24785, "epoch": 298} {"train_loss": -18.600141525268555, "global_step": 24786, "epoch": 298} {"train_loss": -18.47351837158203, "global_step": 24787, "epoch": 298} {"train_loss": -18.51891326904297, "global_step": 24788, "epoch": 298} {"train_loss": -18.52778434753418, "global_step": 24789, "epoch": 298} {"train_loss": -18.963083267211914, "global_step": 24790, "epoch": 298} {"train_loss": -18.5886287689209, "global_step": 24791, "epoch": 298} {"train_loss": -18.756694793701172, "global_step": 24792, "epoch": 298} {"train_loss": -18.815444946289062, "global_step": 24793, "epoch": 298} {"train_loss": -19.132587432861328, "global_step": 24794, "epoch": 298} {"train_loss": -18.25312614440918, "global_step": 24795, "epoch": 298} {"train_loss": -18.672306060791016, "global_step": 24796, "epoch": 298} {"train_loss": -18.37784767150879, "global_step": 24797, "epoch": 298} {"train_loss": -19.03678321838379, "global_step": 24798, "epoch": 298} {"train_loss": -18.652677536010742, "global_step": 24799, "epoch": 298} {"train_loss": -18.45888328552246, "global_step": 24800, "epoch": 298} {"train_loss": -18.857839584350586, "global_step": 24801, "epoch": 298} {"train_loss": -18.65110206604004, "global_step": 24802, "epoch": 298} {"train_loss": -18.603527069091797, "global_step": 24803, "epoch": 298} {"train_loss": -18.526758193969727, "global_step": 24804, "epoch": 298} {"train_loss": -18.757944107055664, "global_step": 24805, "epoch": 298} {"train_loss": -19.04817771911621, "global_step": 24806, "epoch": 298} {"train_loss": -18.38506507873535, "global_step": 24807, "epoch": 298} {"train_loss": -18.842329025268555, "global_step": 24808, "epoch": 298} {"train_loss": -18.11647605895996, "global_step": 24809, "epoch": 298} {"train_loss": -18.88275718688965, "global_step": 24810, "epoch": 298} {"train_loss": -18.679819107055664, "global_step": 24811, "epoch": 298} {"train_loss": -18.643901824951172, "global_step": 24812, "epoch": 298} {"train_loss": -18.64862632751465, "global_step": 24813, "epoch": 298} {"train_loss": -18.463895797729492, "global_step": 24814, "epoch": 298} {"train_loss": -18.866840362548828, "global_step": 24815, "epoch": 298} {"train_loss": -18.650756812957397, "global_step": 24816, "epoch": 298, "val_loss": 6009914.0} {"train_loss": -18.371000289916992, "global_step": 24817, "epoch": 299} {"train_loss": -18.297901153564453, "global_step": 24818, "epoch": 299} {"train_loss": -17.638599395751953, "global_step": 24819, "epoch": 299} {"train_loss": -18.200963973999023, "global_step": 24820, "epoch": 299} {"train_loss": -17.950916290283203, "global_step": 24821, "epoch": 299} {"train_loss": -18.162389755249023, "global_step": 24822, "epoch": 299} {"train_loss": -18.484365463256836, "global_step": 24823, "epoch": 299} {"train_loss": -18.64732551574707, "global_step": 24824, "epoch": 299} {"train_loss": -18.228069305419922, "global_step": 24825, "epoch": 299} {"train_loss": -18.70446014404297, "global_step": 24826, "epoch": 299} {"train_loss": -18.027843475341797, "global_step": 24827, "epoch": 299} {"train_loss": -18.824922561645508, "global_step": 24828, "epoch": 299} {"train_loss": -18.344404220581055, "global_step": 24829, "epoch": 299} {"train_loss": -18.163183212280273, "global_step": 24830, "epoch": 299} {"train_loss": -18.389028549194336, "global_step": 24831, "epoch": 299} {"train_loss": -18.683761596679688, "global_step": 24832, "epoch": 299} {"train_loss": -18.32684898376465, "global_step": 24833, "epoch": 299} {"train_loss": -18.55571174621582, "global_step": 24834, "epoch": 299} {"train_loss": -18.456811904907227, "global_step": 24835, "epoch": 299} {"train_loss": -18.815998077392578, "global_step": 24836, "epoch": 299} {"train_loss": -18.447385787963867, "global_step": 24837, "epoch": 299} {"train_loss": -18.731592178344727, "global_step": 24838, "epoch": 299} {"train_loss": -18.773792266845703, "global_step": 24839, "epoch": 299} {"train_loss": -18.82552146911621, "global_step": 24840, "epoch": 299} {"train_loss": -18.711469650268555, "global_step": 24841, "epoch": 299} {"train_loss": -18.805784225463867, "global_step": 24842, "epoch": 299} {"train_loss": -18.996967315673828, "global_step": 24843, "epoch": 299} {"train_loss": -18.5667724609375, "global_step": 24844, "epoch": 299} {"train_loss": -18.584556579589844, "global_step": 24845, "epoch": 299} {"train_loss": -18.7840633392334, "global_step": 24846, "epoch": 299} {"train_loss": -18.322830200195312, "global_step": 24847, "epoch": 299} {"train_loss": -18.854389190673828, "global_step": 24848, "epoch": 299} {"train_loss": -18.848487854003906, "global_step": 24849, "epoch": 299} {"train_loss": -18.7367000579834, "global_step": 24850, "epoch": 299} {"train_loss": -18.690479278564453, "global_step": 24851, "epoch": 299} {"train_loss": -18.376462936401367, "global_step": 24852, "epoch": 299} {"train_loss": -18.269834518432617, "global_step": 24853, "epoch": 299} {"train_loss": -18.220233917236328, "global_step": 24854, "epoch": 299} {"train_loss": -18.682350158691406, "global_step": 24855, "epoch": 299} {"train_loss": -18.510019302368164, "global_step": 24856, "epoch": 299} {"train_loss": -18.745161056518555, "global_step": 24857, "epoch": 299} {"train_loss": -18.72295570373535, "global_step": 24858, "epoch": 299} {"train_loss": -18.707664489746094, "global_step": 24859, "epoch": 299} {"train_loss": -18.76057243347168, "global_step": 24860, "epoch": 299} {"train_loss": -18.528242111206055, "global_step": 24861, "epoch": 299} {"train_loss": -18.51375389099121, "global_step": 24862, "epoch": 299} {"train_loss": -18.698095321655273, "global_step": 24863, "epoch": 299} {"train_loss": -18.69171714782715, "global_step": 24864, "epoch": 299} {"train_loss": -18.693323135375977, "global_step": 24865, "epoch": 299} {"train_loss": -18.737751007080078, "global_step": 24866, "epoch": 299} {"train_loss": -18.674509048461914, "global_step": 24867, "epoch": 299} {"train_loss": -18.849849700927734, "global_step": 24868, "epoch": 299} {"train_loss": -18.688465118408203, "global_step": 24869, "epoch": 299} {"train_loss": -18.82956886291504, "global_step": 24870, "epoch": 299} {"train_loss": -18.726701736450195, "global_step": 24871, "epoch": 299} {"train_loss": -18.45657730102539, "global_step": 24872, "epoch": 299} {"train_loss": -18.685165405273438, "global_step": 24873, "epoch": 299} {"train_loss": -18.325979232788086, "global_step": 24874, "epoch": 299} {"train_loss": -18.476491928100586, "global_step": 24875, "epoch": 299} {"train_loss": -18.339597702026367, "global_step": 24876, "epoch": 299} {"train_loss": -18.36172866821289, "global_step": 24877, "epoch": 299} {"train_loss": -18.81328773498535, "global_step": 24878, "epoch": 299} {"train_loss": -18.537572860717773, "global_step": 24879, "epoch": 299} {"train_loss": -18.845417022705078, "global_step": 24880, "epoch": 299} {"train_loss": -18.572206497192383, "global_step": 24881, "epoch": 299} {"train_loss": -18.308027267456055, "global_step": 24882, "epoch": 299} {"train_loss": -18.496395111083984, "global_step": 24883, "epoch": 299} {"train_loss": -18.79949378967285, "global_step": 24884, "epoch": 299} {"train_loss": -18.95198631286621, "global_step": 24885, "epoch": 299} {"train_loss": -18.551794052124023, "global_step": 24886, "epoch": 299} {"train_loss": -18.80586814880371, "global_step": 24887, "epoch": 299} {"train_loss": -18.927274703979492, "global_step": 24888, "epoch": 299} {"train_loss": -18.569908142089844, "global_step": 24889, "epoch": 299} {"train_loss": -19.0902156829834, "global_step": 24890, "epoch": 299} {"train_loss": -18.74540901184082, "global_step": 24891, "epoch": 299} {"train_loss": -18.657323837280273, "global_step": 24892, "epoch": 299} {"train_loss": -18.594749450683594, "global_step": 24893, "epoch": 299} {"train_loss": -18.8051815032959, "global_step": 24894, "epoch": 299} {"train_loss": -18.850723266601562, "global_step": 24895, "epoch": 299} {"train_loss": -18.69368553161621, "global_step": 24896, "epoch": 299} {"train_loss": -18.637191772460938, "global_step": 24897, "epoch": 299} {"train_loss": -18.956113815307617, "global_step": 24898, "epoch": 299} {"train_loss": -18.575342063444207, "global_step": 24899, "epoch": 299, "val_loss": 5990681.0} {"train_loss": -18.098371505737305, "global_step": 24900, "epoch": 300} {"train_loss": -18.342350006103516, "global_step": 24901, "epoch": 300} {"train_loss": -17.970491409301758, "global_step": 24902, "epoch": 300} {"train_loss": -18.151891708374023, "global_step": 24903, "epoch": 300} {"train_loss": -18.07686424255371, "global_step": 24904, "epoch": 300} {"train_loss": -18.54241180419922, "global_step": 24905, "epoch": 300} {"train_loss": -18.032148361206055, "global_step": 24906, "epoch": 300} {"train_loss": -18.526580810546875, "global_step": 24907, "epoch": 300} {"train_loss": -18.07535171508789, "global_step": 24908, "epoch": 300} {"train_loss": -18.234172821044922, "global_step": 24909, "epoch": 300} {"train_loss": -18.065961837768555, "global_step": 24910, "epoch": 300} {"train_loss": -18.470233917236328, "global_step": 24911, "epoch": 300} {"train_loss": -18.092870712280273, "global_step": 24912, "epoch": 300} {"train_loss": -18.38795280456543, "global_step": 24913, "epoch": 300} {"train_loss": -18.4437255859375, "global_step": 24914, "epoch": 300} {"train_loss": -18.411413192749023, "global_step": 24915, "epoch": 300} {"train_loss": -18.73784637451172, "global_step": 24916, "epoch": 300} {"train_loss": -18.603849411010742, "global_step": 24917, "epoch": 300} {"train_loss": -18.640655517578125, "global_step": 24918, "epoch": 300} {"train_loss": -18.679174423217773, "global_step": 24919, "epoch": 300} {"train_loss": -18.8695125579834, "global_step": 24920, "epoch": 300} {"train_loss": -18.759313583374023, "global_step": 24921, "epoch": 300} {"train_loss": -18.60236167907715, "global_step": 24922, "epoch": 300} {"train_loss": -18.723026275634766, "global_step": 24923, "epoch": 300} {"train_loss": -18.288511276245117, "global_step": 24924, "epoch": 300} {"train_loss": -18.805057525634766, "global_step": 24925, "epoch": 300} {"train_loss": -18.63671112060547, "global_step": 24926, "epoch": 300} {"train_loss": -18.68393325805664, "global_step": 24927, "epoch": 300} {"train_loss": -18.30389404296875, "global_step": 24928, "epoch": 300} {"train_loss": -18.634033203125, "global_step": 24929, "epoch": 300} {"train_loss": -18.976505279541016, "global_step": 24930, "epoch": 300} {"train_loss": -19.03662109375, "global_step": 24931, "epoch": 300} {"train_loss": -18.77567481994629, "global_step": 24932, "epoch": 300} {"train_loss": -18.889997482299805, "global_step": 24933, "epoch": 300} {"train_loss": -18.879480361938477, "global_step": 24934, "epoch": 300} {"train_loss": -18.70537757873535, "global_step": 24935, "epoch": 300} {"train_loss": -18.81061363220215, "global_step": 24936, "epoch": 300} {"train_loss": -18.521194458007812, "global_step": 24937, "epoch": 300} {"train_loss": -18.85211753845215, "global_step": 24938, "epoch": 300} {"train_loss": -18.611494064331055, "global_step": 24939, "epoch": 300} {"train_loss": -18.60054588317871, "global_step": 24940, "epoch": 300} {"train_loss": -18.72421646118164, "global_step": 24941, "epoch": 300} {"train_loss": -18.894855499267578, "global_step": 24942, "epoch": 300} {"train_loss": -18.664709091186523, "global_step": 24943, "epoch": 300} {"train_loss": -18.828332901000977, "global_step": 24944, "epoch": 300} {"train_loss": -18.381818771362305, "global_step": 24945, "epoch": 300} {"train_loss": -18.834299087524414, "global_step": 24946, "epoch": 300} {"train_loss": -18.915599822998047, "global_step": 24947, "epoch": 300} {"train_loss": -18.836811065673828, "global_step": 24948, "epoch": 300} {"train_loss": -18.924163818359375, "global_step": 24949, "epoch": 300} {"train_loss": -18.539194107055664, "global_step": 24950, "epoch": 300} {"train_loss": -18.864208221435547, "global_step": 24951, "epoch": 300} {"train_loss": -18.808765411376953, "global_step": 24952, "epoch": 300} {"train_loss": -18.553749084472656, "global_step": 24953, "epoch": 300} {"train_loss": -18.694013595581055, "global_step": 24954, "epoch": 300} {"train_loss": -18.821969985961914, "global_step": 24955, "epoch": 300} {"train_loss": -18.8762264251709, "global_step": 24956, "epoch": 300} {"train_loss": -18.590457916259766, "global_step": 24957, "epoch": 300} {"train_loss": -18.834020614624023, "global_step": 24958, "epoch": 300} {"train_loss": -18.296615600585938, "global_step": 24959, "epoch": 300} {"train_loss": -18.239065170288086, "global_step": 24960, "epoch": 300} {"train_loss": -18.192367553710938, "global_step": 24961, "epoch": 300} {"train_loss": -18.772846221923828, "global_step": 24962, "epoch": 300} {"train_loss": -18.611181259155273, "global_step": 24963, "epoch": 300} {"train_loss": -18.744924545288086, "global_step": 24964, "epoch": 300} {"train_loss": -18.457473754882812, "global_step": 24965, "epoch": 300} {"train_loss": -18.57410430908203, "global_step": 24966, "epoch": 300} {"train_loss": -18.68935203552246, "global_step": 24967, "epoch": 300} {"train_loss": -19.1249942779541, "global_step": 24968, "epoch": 300} {"train_loss": -18.972166061401367, "global_step": 24969, "epoch": 300} {"train_loss": -18.52019691467285, "global_step": 24970, "epoch": 300} {"train_loss": -18.7119197845459, "global_step": 24971, "epoch": 300} {"train_loss": -18.398740768432617, "global_step": 24972, "epoch": 300} {"train_loss": -18.610870361328125, "global_step": 24973, "epoch": 300} {"train_loss": -18.248998641967773, "global_step": 24974, "epoch": 300} {"train_loss": -18.592819213867188, "global_step": 24975, "epoch": 300} {"train_loss": -18.516372680664062, "global_step": 24976, "epoch": 300} {"train_loss": -19.104467391967773, "global_step": 24977, "epoch": 300} {"train_loss": -18.26007652282715, "global_step": 24978, "epoch": 300} {"train_loss": -18.577802658081055, "global_step": 24979, "epoch": 300} {"train_loss": -19.06873893737793, "global_step": 24980, "epoch": 300} {"train_loss": -19.023550033569336, "global_step": 24981, "epoch": 300} {"train_loss": -18.607949613088586, "global_step": 24982, "epoch": 300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 0.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.6818181818181818, "val_loss": 5936332.0} {"train_loss": -18.285242080688477, "global_step": 24983, "epoch": 301} {"train_loss": -18.394224166870117, "global_step": 24984, "epoch": 301} {"train_loss": -18.499521255493164, "global_step": 24985, "epoch": 301} {"train_loss": -18.38594627380371, "global_step": 24986, "epoch": 301} {"train_loss": -18.300046920776367, "global_step": 24987, "epoch": 301} {"train_loss": -18.50443458557129, "global_step": 24988, "epoch": 301} {"train_loss": -18.697004318237305, "global_step": 24989, "epoch": 301} {"train_loss": -18.505050659179688, "global_step": 24990, "epoch": 301} {"train_loss": -18.65675163269043, "global_step": 24991, "epoch": 301} {"train_loss": -18.318525314331055, "global_step": 24992, "epoch": 301} {"train_loss": -18.83269500732422, "global_step": 24993, "epoch": 301} {"train_loss": -17.989852905273438, "global_step": 24994, "epoch": 301} {"train_loss": -18.620269775390625, "global_step": 24995, "epoch": 301} {"train_loss": -18.91399383544922, "global_step": 24996, "epoch": 301} {"train_loss": -18.56610107421875, "global_step": 24997, "epoch": 301} {"train_loss": -18.824962615966797, "global_step": 24998, "epoch": 301} {"train_loss": -18.372072219848633, "global_step": 24999, "epoch": 301} {"train_loss": -18.719301223754883, "global_step": 25000, "epoch": 301} {"train_loss": -18.135313034057617, "global_step": 25001, "epoch": 301} {"train_loss": -18.49917984008789, "global_step": 25002, "epoch": 301} {"train_loss": -18.640100479125977, "global_step": 25003, "epoch": 301} {"train_loss": -18.371170043945312, "global_step": 25004, "epoch": 301} {"train_loss": -18.619165420532227, "global_step": 25005, "epoch": 301} {"train_loss": -18.267147064208984, "global_step": 25006, "epoch": 301} {"train_loss": -18.791135787963867, "global_step": 25007, "epoch": 301} {"train_loss": -18.931930541992188, "global_step": 25008, "epoch": 301} {"train_loss": -18.791452407836914, "global_step": 25009, "epoch": 301} {"train_loss": -18.795820236206055, "global_step": 25010, "epoch": 301} {"train_loss": -18.830753326416016, "global_step": 25011, "epoch": 301} {"train_loss": -18.84280776977539, "global_step": 25012, "epoch": 301} {"train_loss": -19.128713607788086, "global_step": 25013, "epoch": 301} {"train_loss": -19.008047103881836, "global_step": 25014, "epoch": 301} {"train_loss": -18.820449829101562, "global_step": 25015, "epoch": 301} {"train_loss": -18.27851676940918, "global_step": 25016, "epoch": 301} {"train_loss": -18.71161460876465, "global_step": 25017, "epoch": 301} {"train_loss": -18.650043487548828, "global_step": 25018, "epoch": 301} {"train_loss": -19.187244415283203, "global_step": 25019, "epoch": 301} {"train_loss": -18.563257217407227, "global_step": 25020, "epoch": 301} {"train_loss": -18.87929344177246, "global_step": 25021, "epoch": 301} {"train_loss": -18.496688842773438, "global_step": 25022, "epoch": 301} {"train_loss": -18.92041015625, "global_step": 25023, "epoch": 301} {"train_loss": -18.50629997253418, "global_step": 25024, "epoch": 301} {"train_loss": -18.428585052490234, "global_step": 25025, "epoch": 301} {"train_loss": -18.7825984954834, "global_step": 25026, "epoch": 301} {"train_loss": -18.673879623413086, "global_step": 25027, "epoch": 301} {"train_loss": -18.719894409179688, "global_step": 25028, "epoch": 301} {"train_loss": -18.719511032104492, "global_step": 25029, "epoch": 301} {"train_loss": -18.110403060913086, "global_step": 25030, "epoch": 301} {"train_loss": -18.955373764038086, "global_step": 25031, "epoch": 301} {"train_loss": -18.55123519897461, "global_step": 25032, "epoch": 301} {"train_loss": -18.270593643188477, "global_step": 25033, "epoch": 301} {"train_loss": -18.493499755859375, "global_step": 25034, "epoch": 301} {"train_loss": -18.641843795776367, "global_step": 25035, "epoch": 301} {"train_loss": -19.222604751586914, "global_step": 25036, "epoch": 301} {"train_loss": -18.430896759033203, "global_step": 25037, "epoch": 301} {"train_loss": -18.74139976501465, "global_step": 25038, "epoch": 301} {"train_loss": -19.275959014892578, "global_step": 25039, "epoch": 301} {"train_loss": -18.629180908203125, "global_step": 25040, "epoch": 301} {"train_loss": -18.597440719604492, "global_step": 25041, "epoch": 301} {"train_loss": -18.74706268310547, "global_step": 25042, "epoch": 301} {"train_loss": -18.902175903320312, "global_step": 25043, "epoch": 301} {"train_loss": -18.62188720703125, "global_step": 25044, "epoch": 301} {"train_loss": -18.868749618530273, "global_step": 25045, "epoch": 301} {"train_loss": -18.620019912719727, "global_step": 25046, "epoch": 301} {"train_loss": -18.141571044921875, "global_step": 25047, "epoch": 301} {"train_loss": -18.545820236206055, "global_step": 25048, "epoch": 301} {"train_loss": -18.38300895690918, "global_step": 25049, "epoch": 301} {"train_loss": -18.655038833618164, "global_step": 25050, "epoch": 301} {"train_loss": -18.45098304748535, "global_step": 25051, "epoch": 301} {"train_loss": -18.810388565063477, "global_step": 25052, "epoch": 301} {"train_loss": -18.689050674438477, "global_step": 25053, "epoch": 301} {"train_loss": -18.447839736938477, "global_step": 25054, "epoch": 301} {"train_loss": -18.375213623046875, "global_step": 25055, "epoch": 301} {"train_loss": -18.717609405517578, "global_step": 25056, "epoch": 301} {"train_loss": -18.35918617248535, "global_step": 25057, "epoch": 301} {"train_loss": -18.44248390197754, "global_step": 25058, "epoch": 301} {"train_loss": -18.37212562561035, "global_step": 25059, "epoch": 301} {"train_loss": -18.303083419799805, "global_step": 25060, "epoch": 301} {"train_loss": -18.474102020263672, "global_step": 25061, "epoch": 301} {"train_loss": -18.76619529724121, "global_step": 25062, "epoch": 301} {"train_loss": -18.998998641967773, "global_step": 25063, "epoch": 301} {"train_loss": -18.450254440307617, "global_step": 25064, "epoch": 301} {"train_loss": -18.613888430308148, "global_step": 25065, "epoch": 301, "val_loss": 5938041.0} {"train_loss": -17.820146560668945, "global_step": 25066, "epoch": 302} {"train_loss": -18.07988166809082, "global_step": 25067, "epoch": 302} {"train_loss": -18.72539710998535, "global_step": 25068, "epoch": 302} {"train_loss": -18.076406478881836, "global_step": 25069, "epoch": 302} {"train_loss": -18.106693267822266, "global_step": 25070, "epoch": 302} {"train_loss": -18.260007858276367, "global_step": 25071, "epoch": 302} {"train_loss": -18.30800437927246, "global_step": 25072, "epoch": 302} {"train_loss": -18.517568588256836, "global_step": 25073, "epoch": 302} {"train_loss": -18.4830265045166, "global_step": 25074, "epoch": 302} {"train_loss": -18.305845260620117, "global_step": 25075, "epoch": 302} {"train_loss": -18.362234115600586, "global_step": 25076, "epoch": 302} {"train_loss": -18.878992080688477, "global_step": 25077, "epoch": 302} {"train_loss": -18.819072723388672, "global_step": 25078, "epoch": 302} {"train_loss": -18.63947105407715, "global_step": 25079, "epoch": 302} {"train_loss": -18.803369522094727, "global_step": 25080, "epoch": 302} {"train_loss": -18.45057487487793, "global_step": 25081, "epoch": 302} {"train_loss": -18.55810546875, "global_step": 25082, "epoch": 302} {"train_loss": -18.495574951171875, "global_step": 25083, "epoch": 302} {"train_loss": -18.432966232299805, "global_step": 25084, "epoch": 302} {"train_loss": -18.51384162902832, "global_step": 25085, "epoch": 302} {"train_loss": -18.548084259033203, "global_step": 25086, "epoch": 302} {"train_loss": -18.862293243408203, "global_step": 25087, "epoch": 302} {"train_loss": -18.753158569335938, "global_step": 25088, "epoch": 302} {"train_loss": -18.89258575439453, "global_step": 25089, "epoch": 302} {"train_loss": -18.50469970703125, "global_step": 25090, "epoch": 302} {"train_loss": -18.5615234375, "global_step": 25091, "epoch": 302} {"train_loss": -18.613035202026367, "global_step": 25092, "epoch": 302} {"train_loss": -18.640655517578125, "global_step": 25093, "epoch": 302} {"train_loss": -18.47896385192871, "global_step": 25094, "epoch": 302} {"train_loss": -19.100908279418945, "global_step": 25095, "epoch": 302} {"train_loss": -18.502756118774414, "global_step": 25096, "epoch": 302} {"train_loss": -18.61725425720215, "global_step": 25097, "epoch": 302} {"train_loss": -18.70712661743164, "global_step": 25098, "epoch": 302} {"train_loss": -18.845706939697266, "global_step": 25099, "epoch": 302} {"train_loss": -18.595857620239258, "global_step": 25100, "epoch": 302} {"train_loss": -18.705310821533203, "global_step": 25101, "epoch": 302} {"train_loss": -18.71934700012207, "global_step": 25102, "epoch": 302} {"train_loss": -18.74130630493164, "global_step": 25103, "epoch": 302} {"train_loss": -18.420368194580078, "global_step": 25104, "epoch": 302} {"train_loss": -18.71535301208496, "global_step": 25105, "epoch": 302} {"train_loss": -18.708925247192383, "global_step": 25106, "epoch": 302} {"train_loss": -18.27494239807129, "global_step": 25107, "epoch": 302} {"train_loss": -18.752899169921875, "global_step": 25108, "epoch": 302} {"train_loss": -18.532949447631836, "global_step": 25109, "epoch": 302} {"train_loss": -19.036725997924805, "global_step": 25110, "epoch": 302} {"train_loss": -18.596586227416992, "global_step": 25111, "epoch": 302} {"train_loss": -18.671314239501953, "global_step": 25112, "epoch": 302} {"train_loss": -18.78550148010254, "global_step": 25113, "epoch": 302} {"train_loss": -18.981531143188477, "global_step": 25114, "epoch": 302} {"train_loss": -18.536788940429688, "global_step": 25115, "epoch": 302} {"train_loss": -18.555721282958984, "global_step": 25116, "epoch": 302} {"train_loss": -19.157459259033203, "global_step": 25117, "epoch": 302} {"train_loss": -18.20479393005371, "global_step": 25118, "epoch": 302} {"train_loss": -18.69233512878418, "global_step": 25119, "epoch": 302} {"train_loss": -18.835294723510742, "global_step": 25120, "epoch": 302} {"train_loss": -18.955251693725586, "global_step": 25121, "epoch": 302} {"train_loss": -18.394519805908203, "global_step": 25122, "epoch": 302} {"train_loss": -18.93958854675293, "global_step": 25123, "epoch": 302} {"train_loss": -18.609699249267578, "global_step": 25124, "epoch": 302} {"train_loss": -18.714277267456055, "global_step": 25125, "epoch": 302} {"train_loss": -18.400224685668945, "global_step": 25126, "epoch": 302} {"train_loss": -18.47486686706543, "global_step": 25127, "epoch": 302} {"train_loss": -18.880844116210938, "global_step": 25128, "epoch": 302} {"train_loss": -18.662158966064453, "global_step": 25129, "epoch": 302} {"train_loss": -18.79514503479004, "global_step": 25130, "epoch": 302} {"train_loss": -18.715856552124023, "global_step": 25131, "epoch": 302} {"train_loss": -18.602304458618164, "global_step": 25132, "epoch": 302} {"train_loss": -18.724149703979492, "global_step": 25133, "epoch": 302} {"train_loss": -19.00763702392578, "global_step": 25134, "epoch": 302} {"train_loss": -18.98870277404785, "global_step": 25135, "epoch": 302} {"train_loss": -18.507164001464844, "global_step": 25136, "epoch": 302} {"train_loss": -18.572978973388672, "global_step": 25137, "epoch": 302} {"train_loss": -18.489561080932617, "global_step": 25138, "epoch": 302} {"train_loss": -18.893970489501953, "global_step": 25139, "epoch": 302} {"train_loss": -18.8236141204834, "global_step": 25140, "epoch": 302} {"train_loss": -18.495948791503906, "global_step": 25141, "epoch": 302} {"train_loss": -18.630706787109375, "global_step": 25142, "epoch": 302} {"train_loss": -18.689878463745117, "global_step": 25143, "epoch": 302} {"train_loss": -18.60618019104004, "global_step": 25144, "epoch": 302} {"train_loss": -18.874446868896484, "global_step": 25145, "epoch": 302} {"train_loss": -18.693510055541992, "global_step": 25146, "epoch": 302} {"train_loss": -18.75520896911621, "global_step": 25147, "epoch": 302} {"train_loss": -18.61263874927199, "global_step": 25148, "epoch": 302, "val_loss": 5973885.0} {"train_loss": -18.393030166625977, "global_step": 25149, "epoch": 303} {"train_loss": -18.759366989135742, "global_step": 25150, "epoch": 303} {"train_loss": -18.686838150024414, "global_step": 25151, "epoch": 303} {"train_loss": -18.480030059814453, "global_step": 25152, "epoch": 303} {"train_loss": -19.22366714477539, "global_step": 25153, "epoch": 303} {"train_loss": -18.51520347595215, "global_step": 25154, "epoch": 303} {"train_loss": -18.384187698364258, "global_step": 25155, "epoch": 303} {"train_loss": -18.96826171875, "global_step": 25156, "epoch": 303} {"train_loss": -18.71894073486328, "global_step": 25157, "epoch": 303} {"train_loss": -18.495656967163086, "global_step": 25158, "epoch": 303} {"train_loss": -18.881778717041016, "global_step": 25159, "epoch": 303} {"train_loss": -18.82464599609375, "global_step": 25160, "epoch": 303} {"train_loss": -18.641616821289062, "global_step": 25161, "epoch": 303} {"train_loss": -19.12443733215332, "global_step": 25162, "epoch": 303} {"train_loss": -19.006689071655273, "global_step": 25163, "epoch": 303} {"train_loss": -18.61347007751465, "global_step": 25164, "epoch": 303} {"train_loss": -18.54261589050293, "global_step": 25165, "epoch": 303} {"train_loss": -18.362796783447266, "global_step": 25166, "epoch": 303} {"train_loss": -18.70165252685547, "global_step": 25167, "epoch": 303} {"train_loss": -18.44989585876465, "global_step": 25168, "epoch": 303} {"train_loss": -18.25286293029785, "global_step": 25169, "epoch": 303} {"train_loss": -18.544841766357422, "global_step": 25170, "epoch": 303} {"train_loss": -18.920108795166016, "global_step": 25171, "epoch": 303} {"train_loss": -18.41227149963379, "global_step": 25172, "epoch": 303} {"train_loss": -18.6257266998291, "global_step": 25173, "epoch": 303} {"train_loss": -18.946321487426758, "global_step": 25174, "epoch": 303} {"train_loss": -18.44232940673828, "global_step": 25175, "epoch": 303} {"train_loss": -18.478290557861328, "global_step": 25176, "epoch": 303} {"train_loss": -18.556921005249023, "global_step": 25177, "epoch": 303} {"train_loss": -18.72186851501465, "global_step": 25178, "epoch": 303} {"train_loss": -18.48853874206543, "global_step": 25179, "epoch": 303} {"train_loss": -18.81894874572754, "global_step": 25180, "epoch": 303} {"train_loss": -18.764677047729492, "global_step": 25181, "epoch": 303} {"train_loss": -18.93230438232422, "global_step": 25182, "epoch": 303} {"train_loss": -18.69014549255371, "global_step": 25183, "epoch": 303} {"train_loss": -18.55841636657715, "global_step": 25184, "epoch": 303} {"train_loss": -18.907032012939453, "global_step": 25185, "epoch": 303} {"train_loss": -18.661279678344727, "global_step": 25186, "epoch": 303} {"train_loss": -18.403181076049805, "global_step": 25187, "epoch": 303} {"train_loss": -18.585351943969727, "global_step": 25188, "epoch": 303} {"train_loss": -18.90186882019043, "global_step": 25189, "epoch": 303} {"train_loss": -18.697134017944336, "global_step": 25190, "epoch": 303} {"train_loss": -18.96050453186035, "global_step": 25191, "epoch": 303} {"train_loss": -19.01826286315918, "global_step": 25192, "epoch": 303} {"train_loss": -18.54426383972168, "global_step": 25193, "epoch": 303} {"train_loss": -18.743877410888672, "global_step": 25194, "epoch": 303} {"train_loss": -18.865201950073242, "global_step": 25195, "epoch": 303} {"train_loss": -18.72017478942871, "global_step": 25196, "epoch": 303} {"train_loss": -18.917394638061523, "global_step": 25197, "epoch": 303} {"train_loss": -18.474895477294922, "global_step": 25198, "epoch": 303} {"train_loss": -19.08038330078125, "global_step": 25199, "epoch": 303} {"train_loss": -18.637611389160156, "global_step": 25200, "epoch": 303} {"train_loss": -18.7637996673584, "global_step": 25201, "epoch": 303} {"train_loss": -18.24607276916504, "global_step": 25202, "epoch": 303} {"train_loss": -18.700597763061523, "global_step": 25203, "epoch": 303} {"train_loss": -18.30772590637207, "global_step": 25204, "epoch": 303} {"train_loss": -18.608131408691406, "global_step": 25205, "epoch": 303} {"train_loss": -18.347362518310547, "global_step": 25206, "epoch": 303} {"train_loss": -18.458654403686523, "global_step": 25207, "epoch": 303} {"train_loss": -18.502620697021484, "global_step": 25208, "epoch": 303} {"train_loss": -18.966733932495117, "global_step": 25209, "epoch": 303} {"train_loss": -18.62322425842285, "global_step": 25210, "epoch": 303} {"train_loss": -18.672508239746094, "global_step": 25211, "epoch": 303} {"train_loss": -18.805461883544922, "global_step": 25212, "epoch": 303} {"train_loss": -18.501420974731445, "global_step": 25213, "epoch": 303} {"train_loss": -18.95452308654785, "global_step": 25214, "epoch": 303} {"train_loss": -18.517370223999023, "global_step": 25215, "epoch": 303} {"train_loss": -18.93117332458496, "global_step": 25216, "epoch": 303} {"train_loss": -18.846900939941406, "global_step": 25217, "epoch": 303} {"train_loss": -18.44483757019043, "global_step": 25218, "epoch": 303} {"train_loss": -18.752933502197266, "global_step": 25219, "epoch": 303} {"train_loss": -18.597822189331055, "global_step": 25220, "epoch": 303} {"train_loss": -18.822797775268555, "global_step": 25221, "epoch": 303} {"train_loss": -18.30167007446289, "global_step": 25222, "epoch": 303} {"train_loss": -18.342145919799805, "global_step": 25223, "epoch": 303} {"train_loss": -18.775314331054688, "global_step": 25224, "epoch": 303} {"train_loss": -18.85655403137207, "global_step": 25225, "epoch": 303} {"train_loss": -18.891103744506836, "global_step": 25226, "epoch": 303} {"train_loss": -18.674312591552734, "global_step": 25227, "epoch": 303} {"train_loss": -18.95249366760254, "global_step": 25228, "epoch": 303} {"train_loss": -18.91409683227539, "global_step": 25229, "epoch": 303} {"train_loss": -18.74201774597168, "global_step": 25230, "epoch": 303} {"train_loss": -18.663035496171698, "global_step": 25231, "epoch": 303, "val_loss": 5904260.0} {"train_loss": -18.2359676361084, "global_step": 25232, "epoch": 304} {"train_loss": -18.736021041870117, "global_step": 25233, "epoch": 304} {"train_loss": -18.66390609741211, "global_step": 25234, "epoch": 304} {"train_loss": -18.339019775390625, "global_step": 25235, "epoch": 304} {"train_loss": -18.700918197631836, "global_step": 25236, "epoch": 304} {"train_loss": -18.43706703186035, "global_step": 25237, "epoch": 304} {"train_loss": -18.609420776367188, "global_step": 25238, "epoch": 304} {"train_loss": -18.54408836364746, "global_step": 25239, "epoch": 304} {"train_loss": -18.657604217529297, "global_step": 25240, "epoch": 304} {"train_loss": -18.455398559570312, "global_step": 25241, "epoch": 304} {"train_loss": -18.905284881591797, "global_step": 25242, "epoch": 304} {"train_loss": -18.68354606628418, "global_step": 25243, "epoch": 304} {"train_loss": -18.827709197998047, "global_step": 25244, "epoch": 304} {"train_loss": -18.491445541381836, "global_step": 25245, "epoch": 304} {"train_loss": -18.752182006835938, "global_step": 25246, "epoch": 304} {"train_loss": -19.070093154907227, "global_step": 25247, "epoch": 304} {"train_loss": -18.978612899780273, "global_step": 25248, "epoch": 304} {"train_loss": -18.535764694213867, "global_step": 25249, "epoch": 304} {"train_loss": -18.54115104675293, "global_step": 25250, "epoch": 304} {"train_loss": -18.782556533813477, "global_step": 25251, "epoch": 304} {"train_loss": -18.481489181518555, "global_step": 25252, "epoch": 304} {"train_loss": -18.94882583618164, "global_step": 25253, "epoch": 304} {"train_loss": -18.572708129882812, "global_step": 25254, "epoch": 304} {"train_loss": -18.664915084838867, "global_step": 25255, "epoch": 304} {"train_loss": -18.839292526245117, "global_step": 25256, "epoch": 304} {"train_loss": -18.91641616821289, "global_step": 25257, "epoch": 304} {"train_loss": -18.685007095336914, "global_step": 25258, "epoch": 304} {"train_loss": -18.652957916259766, "global_step": 25259, "epoch": 304} {"train_loss": -19.23357582092285, "global_step": 25260, "epoch": 304} {"train_loss": -18.686779022216797, "global_step": 25261, "epoch": 304} {"train_loss": -18.596677780151367, "global_step": 25262, "epoch": 304} {"train_loss": -18.73855209350586, "global_step": 25263, "epoch": 304} {"train_loss": -18.896894454956055, "global_step": 25264, "epoch": 304} {"train_loss": -19.042097091674805, "global_step": 25265, "epoch": 304} {"train_loss": -18.87129020690918, "global_step": 25266, "epoch": 304} {"train_loss": -18.552576065063477, "global_step": 25267, "epoch": 304} {"train_loss": -18.89651107788086, "global_step": 25268, "epoch": 304} {"train_loss": -18.743240356445312, "global_step": 25269, "epoch": 304} {"train_loss": -18.939603805541992, "global_step": 25270, "epoch": 304} {"train_loss": -18.647794723510742, "global_step": 25271, "epoch": 304} {"train_loss": -18.346349716186523, "global_step": 25272, "epoch": 304} {"train_loss": -18.3541316986084, "global_step": 25273, "epoch": 304} {"train_loss": -18.547513961791992, "global_step": 25274, "epoch": 304} {"train_loss": -18.550594329833984, "global_step": 25275, "epoch": 304} {"train_loss": -18.56709861755371, "global_step": 25276, "epoch": 304} {"train_loss": -18.755435943603516, "global_step": 25277, "epoch": 304} {"train_loss": -18.95100212097168, "global_step": 25278, "epoch": 304} {"train_loss": -18.591611862182617, "global_step": 25279, "epoch": 304} {"train_loss": -18.787988662719727, "global_step": 25280, "epoch": 304} {"train_loss": -18.521696090698242, "global_step": 25281, "epoch": 304} {"train_loss": -18.674880981445312, "global_step": 25282, "epoch": 304} {"train_loss": -18.635835647583008, "global_step": 25283, "epoch": 304} {"train_loss": -18.25319480895996, "global_step": 25284, "epoch": 304} {"train_loss": -18.5725040435791, "global_step": 25285, "epoch": 304} {"train_loss": -18.637475967407227, "global_step": 25286, "epoch": 304} {"train_loss": -18.764785766601562, "global_step": 25287, "epoch": 304} {"train_loss": -18.635732650756836, "global_step": 25288, "epoch": 304} {"train_loss": -18.675973892211914, "global_step": 25289, "epoch": 304} {"train_loss": -18.495136260986328, "global_step": 25290, "epoch": 304} {"train_loss": -18.775482177734375, "global_step": 25291, "epoch": 304} {"train_loss": -18.513866424560547, "global_step": 25292, "epoch": 304} {"train_loss": -18.503137588500977, "global_step": 25293, "epoch": 304} {"train_loss": -18.71578598022461, "global_step": 25294, "epoch": 304} {"train_loss": -18.76694107055664, "global_step": 25295, "epoch": 304} {"train_loss": -18.6340389251709, "global_step": 25296, "epoch": 304} {"train_loss": -18.812362670898438, "global_step": 25297, "epoch": 304} {"train_loss": -18.57807731628418, "global_step": 25298, "epoch": 304} {"train_loss": -18.871322631835938, "global_step": 25299, "epoch": 304} {"train_loss": -18.34262466430664, "global_step": 25300, "epoch": 304} {"train_loss": -18.814104080200195, "global_step": 25301, "epoch": 304} {"train_loss": -18.40294647216797, "global_step": 25302, "epoch": 304} {"train_loss": -18.328689575195312, "global_step": 25303, "epoch": 304} {"train_loss": -18.538284301757812, "global_step": 25304, "epoch": 304} {"train_loss": -18.532453536987305, "global_step": 25305, "epoch": 304} {"train_loss": -18.34488296508789, "global_step": 25306, "epoch": 304} {"train_loss": -18.23512077331543, "global_step": 25307, "epoch": 304} {"train_loss": -18.459524154663086, "global_step": 25308, "epoch": 304} {"train_loss": -18.557645797729492, "global_step": 25309, "epoch": 304} {"train_loss": -18.650129318237305, "global_step": 25310, "epoch": 304} {"train_loss": -18.50276756286621, "global_step": 25311, "epoch": 304} {"train_loss": -18.610727310180664, "global_step": 25312, "epoch": 304} {"train_loss": -18.82896614074707, "global_step": 25313, "epoch": 304} {"train_loss": -18.654704427144612, "global_step": 25314, "epoch": 304, "val_loss": 6016550.5} {"train_loss": -18.371429443359375, "global_step": 25315, "epoch": 305} {"train_loss": -18.497879028320312, "global_step": 25316, "epoch": 305} {"train_loss": -18.38593101501465, "global_step": 25317, "epoch": 305} {"train_loss": -18.6404972076416, "global_step": 25318, "epoch": 305} {"train_loss": -18.590768814086914, "global_step": 25319, "epoch": 305} {"train_loss": -18.88243293762207, "global_step": 25320, "epoch": 305} {"train_loss": -18.542205810546875, "global_step": 25321, "epoch": 305} {"train_loss": -18.493762969970703, "global_step": 25322, "epoch": 305} {"train_loss": -17.967588424682617, "global_step": 25323, "epoch": 305} {"train_loss": -18.01422691345215, "global_step": 25324, "epoch": 305} {"train_loss": -18.448476791381836, "global_step": 25325, "epoch": 305} {"train_loss": -18.538557052612305, "global_step": 25326, "epoch": 305} {"train_loss": -18.39128303527832, "global_step": 25327, "epoch": 305} {"train_loss": -18.950613021850586, "global_step": 25328, "epoch": 305} {"train_loss": -18.473400115966797, "global_step": 25329, "epoch": 305} {"train_loss": -18.625686645507812, "global_step": 25330, "epoch": 305} {"train_loss": -18.79188346862793, "global_step": 25331, "epoch": 305} {"train_loss": -18.58852195739746, "global_step": 25332, "epoch": 305} {"train_loss": -18.576740264892578, "global_step": 25333, "epoch": 305} {"train_loss": -18.833236694335938, "global_step": 25334, "epoch": 305} {"train_loss": -18.506620407104492, "global_step": 25335, "epoch": 305} {"train_loss": -18.90155029296875, "global_step": 25336, "epoch": 305} {"train_loss": -18.845197677612305, "global_step": 25337, "epoch": 305} {"train_loss": -18.490610122680664, "global_step": 25338, "epoch": 305} {"train_loss": -18.65996551513672, "global_step": 25339, "epoch": 305} {"train_loss": -18.788414001464844, "global_step": 25340, "epoch": 305} {"train_loss": -18.636394500732422, "global_step": 25341, "epoch": 305} {"train_loss": -18.97406578063965, "global_step": 25342, "epoch": 305} {"train_loss": -18.440662384033203, "global_step": 25343, "epoch": 305} {"train_loss": -18.84711265563965, "global_step": 25344, "epoch": 305} {"train_loss": -18.593647003173828, "global_step": 25345, "epoch": 305} {"train_loss": -18.887454986572266, "global_step": 25346, "epoch": 305} {"train_loss": -18.2900447845459, "global_step": 25347, "epoch": 305} {"train_loss": -18.816909790039062, "global_step": 25348, "epoch": 305} {"train_loss": -18.701398849487305, "global_step": 25349, "epoch": 305} {"train_loss": -18.79059600830078, "global_step": 25350, "epoch": 305} {"train_loss": -18.684999465942383, "global_step": 25351, "epoch": 305} {"train_loss": -18.582921981811523, "global_step": 25352, "epoch": 305} {"train_loss": -19.107524871826172, "global_step": 25353, "epoch": 305} {"train_loss": -18.690519332885742, "global_step": 25354, "epoch": 305} {"train_loss": -18.4921932220459, "global_step": 25355, "epoch": 305} {"train_loss": -18.845773696899414, "global_step": 25356, "epoch": 305} {"train_loss": -18.919370651245117, "global_step": 25357, "epoch": 305} {"train_loss": -18.911624908447266, "global_step": 25358, "epoch": 305} {"train_loss": -18.99094009399414, "global_step": 25359, "epoch": 305} {"train_loss": -18.551794052124023, "global_step": 25360, "epoch": 305} {"train_loss": -18.740522384643555, "global_step": 25361, "epoch": 305} {"train_loss": -18.820215225219727, "global_step": 25362, "epoch": 305} {"train_loss": -18.968017578125, "global_step": 25363, "epoch": 305} {"train_loss": -18.489408493041992, "global_step": 25364, "epoch": 305} {"train_loss": -18.85793113708496, "global_step": 25365, "epoch": 305} {"train_loss": -18.86737060546875, "global_step": 25366, "epoch": 305} {"train_loss": -18.396596908569336, "global_step": 25367, "epoch": 305} {"train_loss": -18.453895568847656, "global_step": 25368, "epoch": 305} {"train_loss": -18.677326202392578, "global_step": 25369, "epoch": 305} {"train_loss": -19.03407859802246, "global_step": 25370, "epoch": 305} {"train_loss": -18.751296997070312, "global_step": 25371, "epoch": 305} {"train_loss": -18.255582809448242, "global_step": 25372, "epoch": 305} {"train_loss": -18.45090103149414, "global_step": 25373, "epoch": 305} {"train_loss": -18.836200714111328, "global_step": 25374, "epoch": 305} {"train_loss": -18.778278350830078, "global_step": 25375, "epoch": 305} {"train_loss": -18.62931251525879, "global_step": 25376, "epoch": 305} {"train_loss": -19.060972213745117, "global_step": 25377, "epoch": 305} {"train_loss": -18.823932647705078, "global_step": 25378, "epoch": 305} {"train_loss": -18.4593563079834, "global_step": 25379, "epoch": 305} {"train_loss": -18.72629737854004, "global_step": 25380, "epoch": 305} {"train_loss": -18.656930923461914, "global_step": 25381, "epoch": 305} {"train_loss": -18.7169246673584, "global_step": 25382, "epoch": 305} {"train_loss": -18.7694149017334, "global_step": 25383, "epoch": 305} {"train_loss": -18.331079483032227, "global_step": 25384, "epoch": 305} {"train_loss": -18.475080490112305, "global_step": 25385, "epoch": 305} {"train_loss": -18.625429153442383, "global_step": 25386, "epoch": 305} {"train_loss": -18.8593807220459, "global_step": 25387, "epoch": 305} {"train_loss": -18.611310958862305, "global_step": 25388, "epoch": 305} {"train_loss": -18.983375549316406, "global_step": 25389, "epoch": 305} {"train_loss": -18.782854080200195, "global_step": 25390, "epoch": 305} {"train_loss": -18.658674240112305, "global_step": 25391, "epoch": 305} {"train_loss": -18.740690231323242, "global_step": 25392, "epoch": 305} {"train_loss": -18.630084991455078, "global_step": 25393, "epoch": 305} {"train_loss": -18.681303024291992, "global_step": 25394, "epoch": 305} {"train_loss": -18.466482162475586, "global_step": 25395, "epoch": 305} {"train_loss": -18.446796417236328, "global_step": 25396, "epoch": 305} {"train_loss": -18.655961829495716, "global_step": 25397, "epoch": 305, "val_loss": 5904491.0} {"train_loss": -18.750022888183594, "global_step": 25398, "epoch": 306} {"train_loss": -18.726205825805664, "global_step": 25399, "epoch": 306} {"train_loss": -18.666719436645508, "global_step": 25400, "epoch": 306} {"train_loss": -18.547338485717773, "global_step": 25401, "epoch": 306} {"train_loss": -18.250730514526367, "global_step": 25402, "epoch": 306} {"train_loss": -18.281957626342773, "global_step": 25403, "epoch": 306} {"train_loss": -18.410696029663086, "global_step": 25404, "epoch": 306} {"train_loss": -18.942523956298828, "global_step": 25405, "epoch": 306} {"train_loss": -18.340513229370117, "global_step": 25406, "epoch": 306} {"train_loss": -18.45957374572754, "global_step": 25407, "epoch": 306} {"train_loss": -18.669078826904297, "global_step": 25408, "epoch": 306} {"train_loss": -18.626474380493164, "global_step": 25409, "epoch": 306} {"train_loss": -18.985952377319336, "global_step": 25410, "epoch": 306} {"train_loss": -18.827463150024414, "global_step": 25411, "epoch": 306} {"train_loss": -18.684261322021484, "global_step": 25412, "epoch": 306} {"train_loss": -18.813785552978516, "global_step": 25413, "epoch": 306} {"train_loss": -18.84365463256836, "global_step": 25414, "epoch": 306} {"train_loss": -18.681161880493164, "global_step": 25415, "epoch": 306} {"train_loss": -18.662281036376953, "global_step": 25416, "epoch": 306} {"train_loss": -18.510374069213867, "global_step": 25417, "epoch": 306} {"train_loss": -18.697790145874023, "global_step": 25418, "epoch": 306} {"train_loss": -18.944522857666016, "global_step": 25419, "epoch": 306} {"train_loss": -18.543081283569336, "global_step": 25420, "epoch": 306} {"train_loss": -18.626066207885742, "global_step": 25421, "epoch": 306} {"train_loss": -19.07240104675293, "global_step": 25422, "epoch": 306} {"train_loss": -19.004579544067383, "global_step": 25423, "epoch": 306} {"train_loss": -18.652639389038086, "global_step": 25424, "epoch": 306} {"train_loss": -18.5968074798584, "global_step": 25425, "epoch": 306} {"train_loss": -18.694080352783203, "global_step": 25426, "epoch": 306} {"train_loss": -18.673877716064453, "global_step": 25427, "epoch": 306} {"train_loss": -18.8156795501709, "global_step": 25428, "epoch": 306} {"train_loss": -18.827970504760742, "global_step": 25429, "epoch": 306} {"train_loss": -18.691055297851562, "global_step": 25430, "epoch": 306} {"train_loss": -18.48257827758789, "global_step": 25431, "epoch": 306} {"train_loss": -18.76896095275879, "global_step": 25432, "epoch": 306} {"train_loss": -18.8210506439209, "global_step": 25433, "epoch": 306} {"train_loss": -18.319360733032227, "global_step": 25434, "epoch": 306} {"train_loss": -18.75760841369629, "global_step": 25435, "epoch": 306} {"train_loss": -18.77541160583496, "global_step": 25436, "epoch": 306} {"train_loss": -18.871231079101562, "global_step": 25437, "epoch": 306} {"train_loss": -18.926517486572266, "global_step": 25438, "epoch": 306} {"train_loss": -19.009910583496094, "global_step": 25439, "epoch": 306} {"train_loss": -18.566917419433594, "global_step": 25440, "epoch": 306} {"train_loss": -18.52289390563965, "global_step": 25441, "epoch": 306} {"train_loss": -18.76203727722168, "global_step": 25442, "epoch": 306} {"train_loss": -18.70340919494629, "global_step": 25443, "epoch": 306} {"train_loss": -18.606800079345703, "global_step": 25444, "epoch": 306} {"train_loss": -18.888273239135742, "global_step": 25445, "epoch": 306} {"train_loss": -18.247488021850586, "global_step": 25446, "epoch": 306} {"train_loss": -18.783384323120117, "global_step": 25447, "epoch": 306} {"train_loss": -18.33587074279785, "global_step": 25448, "epoch": 306} {"train_loss": -18.599058151245117, "global_step": 25449, "epoch": 306} {"train_loss": -18.712345123291016, "global_step": 25450, "epoch": 306} {"train_loss": -18.692411422729492, "global_step": 25451, "epoch": 306} {"train_loss": -18.570703506469727, "global_step": 25452, "epoch": 306} {"train_loss": -18.81886100769043, "global_step": 25453, "epoch": 306} {"train_loss": -18.566009521484375, "global_step": 25454, "epoch": 306} {"train_loss": -18.785757064819336, "global_step": 25455, "epoch": 306} {"train_loss": -18.901151657104492, "global_step": 25456, "epoch": 306} {"train_loss": -18.82032012939453, "global_step": 25457, "epoch": 306} {"train_loss": -19.01459503173828, "global_step": 25458, "epoch": 306} {"train_loss": -18.925765991210938, "global_step": 25459, "epoch": 306} {"train_loss": -18.70259666442871, "global_step": 25460, "epoch": 306} {"train_loss": -18.203121185302734, "global_step": 25461, "epoch": 306} {"train_loss": -18.486547470092773, "global_step": 25462, "epoch": 306} {"train_loss": -18.795907974243164, "global_step": 25463, "epoch": 306} {"train_loss": -18.98911476135254, "global_step": 25464, "epoch": 306} {"train_loss": -18.677640914916992, "global_step": 25465, "epoch": 306} {"train_loss": -19.059858322143555, "global_step": 25466, "epoch": 306} {"train_loss": -18.601043701171875, "global_step": 25467, "epoch": 306} {"train_loss": -18.606643676757812, "global_step": 25468, "epoch": 306} {"train_loss": -18.468915939331055, "global_step": 25469, "epoch": 306} {"train_loss": -18.778610229492188, "global_step": 25470, "epoch": 306} {"train_loss": -18.522947311401367, "global_step": 25471, "epoch": 306} {"train_loss": -18.917078018188477, "global_step": 25472, "epoch": 306} {"train_loss": -18.639286041259766, "global_step": 25473, "epoch": 306} {"train_loss": -18.856782913208008, "global_step": 25474, "epoch": 306} {"train_loss": -18.535242080688477, "global_step": 25475, "epoch": 306} {"train_loss": -18.900114059448242, "global_step": 25476, "epoch": 306} {"train_loss": -18.620376586914062, "global_step": 25477, "epoch": 306} {"train_loss": -18.897336959838867, "global_step": 25478, "epoch": 306} {"train_loss": -18.96851921081543, "global_step": 25479, "epoch": 306} {"train_loss": -18.67180275055299, "global_step": 25480, "epoch": 306, "val_loss": 6010478.5} {"train_loss": -18.78827476501465, "global_step": 25481, "epoch": 307} {"train_loss": -18.590417861938477, "global_step": 25482, "epoch": 307} {"train_loss": -18.53348159790039, "global_step": 25483, "epoch": 307} {"train_loss": -18.61073875427246, "global_step": 25484, "epoch": 307} {"train_loss": -18.525304794311523, "global_step": 25485, "epoch": 307} {"train_loss": -18.236677169799805, "global_step": 25486, "epoch": 307} {"train_loss": -18.822162628173828, "global_step": 25487, "epoch": 307} {"train_loss": -18.877838134765625, "global_step": 25488, "epoch": 307} {"train_loss": -18.323020935058594, "global_step": 25489, "epoch": 307} {"train_loss": -18.796499252319336, "global_step": 25490, "epoch": 307} {"train_loss": -18.38773536682129, "global_step": 25491, "epoch": 307} {"train_loss": -18.361865997314453, "global_step": 25492, "epoch": 307} {"train_loss": -18.82419776916504, "global_step": 25493, "epoch": 307} {"train_loss": -18.26136589050293, "global_step": 25494, "epoch": 307} {"train_loss": -18.60738754272461, "global_step": 25495, "epoch": 307} {"train_loss": -18.695819854736328, "global_step": 25496, "epoch": 307} {"train_loss": -18.630802154541016, "global_step": 25497, "epoch": 307} {"train_loss": -18.587596893310547, "global_step": 25498, "epoch": 307} {"train_loss": -18.685461044311523, "global_step": 25499, "epoch": 307} {"train_loss": -18.64864158630371, "global_step": 25500, "epoch": 307} {"train_loss": -18.864261627197266, "global_step": 25501, "epoch": 307} {"train_loss": -18.717952728271484, "global_step": 25502, "epoch": 307} {"train_loss": -19.01409339904785, "global_step": 25503, "epoch": 307} {"train_loss": -18.18360710144043, "global_step": 25504, "epoch": 307} {"train_loss": -18.71051597595215, "global_step": 25505, "epoch": 307} {"train_loss": -18.601301193237305, "global_step": 25506, "epoch": 307} {"train_loss": -18.63817024230957, "global_step": 25507, "epoch": 307} {"train_loss": -18.5726261138916, "global_step": 25508, "epoch": 307} {"train_loss": -18.439701080322266, "global_step": 25509, "epoch": 307} {"train_loss": -19.00520133972168, "global_step": 25510, "epoch": 307} {"train_loss": -18.98911476135254, "global_step": 25511, "epoch": 307} {"train_loss": -19.13046646118164, "global_step": 25512, "epoch": 307} {"train_loss": -18.845645904541016, "global_step": 25513, "epoch": 307} {"train_loss": -18.704248428344727, "global_step": 25514, "epoch": 307} {"train_loss": -18.51167106628418, "global_step": 25515, "epoch": 307} {"train_loss": -18.784711837768555, "global_step": 25516, "epoch": 307} {"train_loss": -18.513309478759766, "global_step": 25517, "epoch": 307} {"train_loss": -18.810977935791016, "global_step": 25518, "epoch": 307} {"train_loss": -19.23590087890625, "global_step": 25519, "epoch": 307} {"train_loss": -18.979551315307617, "global_step": 25520, "epoch": 307} {"train_loss": -18.62923240661621, "global_step": 25521, "epoch": 307} {"train_loss": -18.956899642944336, "global_step": 25522, "epoch": 307} {"train_loss": -18.489519119262695, "global_step": 25523, "epoch": 307} {"train_loss": -18.757558822631836, "global_step": 25524, "epoch": 307} {"train_loss": -19.089902877807617, "global_step": 25525, "epoch": 307} {"train_loss": -18.65609359741211, "global_step": 25526, "epoch": 307} {"train_loss": -18.860631942749023, "global_step": 25527, "epoch": 307} {"train_loss": -19.081480026245117, "global_step": 25528, "epoch": 307} {"train_loss": -18.69573402404785, "global_step": 25529, "epoch": 307} {"train_loss": -18.79066276550293, "global_step": 25530, "epoch": 307} {"train_loss": -18.511260986328125, "global_step": 25531, "epoch": 307} {"train_loss": -18.763992309570312, "global_step": 25532, "epoch": 307} {"train_loss": -18.630420684814453, "global_step": 25533, "epoch": 307} {"train_loss": -18.497722625732422, "global_step": 25534, "epoch": 307} {"train_loss": -18.393522262573242, "global_step": 25535, "epoch": 307} {"train_loss": -18.639150619506836, "global_step": 25536, "epoch": 307} {"train_loss": -18.733572006225586, "global_step": 25537, "epoch": 307} {"train_loss": -18.608694076538086, "global_step": 25538, "epoch": 307} {"train_loss": -18.557159423828125, "global_step": 25539, "epoch": 307} {"train_loss": -18.463796615600586, "global_step": 25540, "epoch": 307} {"train_loss": -18.88372802734375, "global_step": 25541, "epoch": 307} {"train_loss": -18.65199089050293, "global_step": 25542, "epoch": 307} {"train_loss": -18.95719337463379, "global_step": 25543, "epoch": 307} {"train_loss": -18.765668869018555, "global_step": 25544, "epoch": 307} {"train_loss": -18.948301315307617, "global_step": 25545, "epoch": 307} {"train_loss": -18.49624252319336, "global_step": 25546, "epoch": 307} {"train_loss": -18.524892807006836, "global_step": 25547, "epoch": 307} {"train_loss": -18.757734298706055, "global_step": 25548, "epoch": 307} {"train_loss": -18.706897735595703, "global_step": 25549, "epoch": 307} {"train_loss": -18.627735137939453, "global_step": 25550, "epoch": 307} {"train_loss": -18.77434539794922, "global_step": 25551, "epoch": 307} {"train_loss": -18.83615493774414, "global_step": 25552, "epoch": 307} {"train_loss": -18.856563568115234, "global_step": 25553, "epoch": 307} {"train_loss": -18.570316314697266, "global_step": 25554, "epoch": 307} {"train_loss": -18.59457778930664, "global_step": 25555, "epoch": 307} {"train_loss": -18.499509811401367, "global_step": 25556, "epoch": 307} {"train_loss": -18.728729248046875, "global_step": 25557, "epoch": 307} {"train_loss": -19.06117820739746, "global_step": 25558, "epoch": 307} {"train_loss": -18.304166793823242, "global_step": 25559, "epoch": 307} {"train_loss": -18.5944766998291, "global_step": 25560, "epoch": 307} {"train_loss": -18.860185623168945, "global_step": 25561, "epoch": 307} {"train_loss": -18.71026039123535, "global_step": 25562, "epoch": 307} {"train_loss": -18.68343649714826, "global_step": 25563, "epoch": 307, "val_loss": 5976040.0} {"train_loss": -18.722658157348633, "global_step": 25564, "epoch": 308} {"train_loss": -18.755268096923828, "global_step": 25565, "epoch": 308} {"train_loss": -18.632537841796875, "global_step": 25566, "epoch": 308} {"train_loss": -18.571348190307617, "global_step": 25567, "epoch": 308} {"train_loss": -18.590612411499023, "global_step": 25568, "epoch": 308} {"train_loss": -18.82379150390625, "global_step": 25569, "epoch": 308} {"train_loss": -18.356252670288086, "global_step": 25570, "epoch": 308} {"train_loss": -18.999967575073242, "global_step": 25571, "epoch": 308} {"train_loss": -18.752771377563477, "global_step": 25572, "epoch": 308} {"train_loss": -19.1082763671875, "global_step": 25573, "epoch": 308} {"train_loss": -18.604324340820312, "global_step": 25574, "epoch": 308} {"train_loss": -18.733640670776367, "global_step": 25575, "epoch": 308} {"train_loss": -18.69942855834961, "global_step": 25576, "epoch": 308} {"train_loss": -18.604368209838867, "global_step": 25577, "epoch": 308} {"train_loss": -18.77665138244629, "global_step": 25578, "epoch": 308} {"train_loss": -18.371601104736328, "global_step": 25579, "epoch": 308} {"train_loss": -18.365785598754883, "global_step": 25580, "epoch": 308} {"train_loss": -18.573665618896484, "global_step": 25581, "epoch": 308} {"train_loss": -18.639102935791016, "global_step": 25582, "epoch": 308} {"train_loss": -18.609712600708008, "global_step": 25583, "epoch": 308} {"train_loss": -18.353315353393555, "global_step": 25584, "epoch": 308} {"train_loss": -18.65006446838379, "global_step": 25585, "epoch": 308} {"train_loss": -18.629478454589844, "global_step": 25586, "epoch": 308} {"train_loss": -18.929105758666992, "global_step": 25587, "epoch": 308} {"train_loss": -18.672229766845703, "global_step": 25588, "epoch": 308} {"train_loss": -18.75887680053711, "global_step": 25589, "epoch": 308} {"train_loss": -18.91217613220215, "global_step": 25590, "epoch": 308} {"train_loss": -19.215538024902344, "global_step": 25591, "epoch": 308} {"train_loss": -18.59687614440918, "global_step": 25592, "epoch": 308} {"train_loss": -18.245529174804688, "global_step": 25593, "epoch": 308} {"train_loss": -18.428424835205078, "global_step": 25594, "epoch": 308} {"train_loss": -18.821996688842773, "global_step": 25595, "epoch": 308} {"train_loss": -19.43116569519043, "global_step": 25596, "epoch": 308} {"train_loss": -18.96581268310547, "global_step": 25597, "epoch": 308} {"train_loss": -18.841812133789062, "global_step": 25598, "epoch": 308} {"train_loss": -18.989377975463867, "global_step": 25599, "epoch": 308} {"train_loss": -19.071802139282227, "global_step": 25600, "epoch": 308} {"train_loss": -18.74728775024414, "global_step": 25601, "epoch": 308} {"train_loss": -18.90299415588379, "global_step": 25602, "epoch": 308} {"train_loss": -18.336172103881836, "global_step": 25603, "epoch": 308} {"train_loss": -18.914628982543945, "global_step": 25604, "epoch": 308} {"train_loss": -18.410551071166992, "global_step": 25605, "epoch": 308} {"train_loss": -18.711029052734375, "global_step": 25606, "epoch": 308} {"train_loss": -18.899656295776367, "global_step": 25607, "epoch": 308} {"train_loss": -18.696666717529297, "global_step": 25608, "epoch": 308} {"train_loss": -18.739063262939453, "global_step": 25609, "epoch": 308} {"train_loss": -18.963062286376953, "global_step": 25610, "epoch": 308} {"train_loss": -18.48598861694336, "global_step": 25611, "epoch": 308} {"train_loss": -18.910324096679688, "global_step": 25612, "epoch": 308} {"train_loss": -18.710371017456055, "global_step": 25613, "epoch": 308} {"train_loss": -18.717899322509766, "global_step": 25614, "epoch": 308} {"train_loss": -18.64934730529785, "global_step": 25615, "epoch": 308} {"train_loss": -18.48813819885254, "global_step": 25616, "epoch": 308} {"train_loss": -18.59214210510254, "global_step": 25617, "epoch": 308} {"train_loss": -18.86701202392578, "global_step": 25618, "epoch": 308} {"train_loss": -18.707212448120117, "global_step": 25619, "epoch": 308} {"train_loss": -18.577688217163086, "global_step": 25620, "epoch": 308} {"train_loss": -18.651697158813477, "global_step": 25621, "epoch": 308} {"train_loss": -18.54570960998535, "global_step": 25622, "epoch": 308} {"train_loss": -18.920427322387695, "global_step": 25623, "epoch": 308} {"train_loss": -18.57414436340332, "global_step": 25624, "epoch": 308} {"train_loss": -19.172677993774414, "global_step": 25625, "epoch": 308} {"train_loss": -18.789676666259766, "global_step": 25626, "epoch": 308} {"train_loss": -18.71708869934082, "global_step": 25627, "epoch": 308} {"train_loss": -18.615163803100586, "global_step": 25628, "epoch": 308} {"train_loss": -18.772367477416992, "global_step": 25629, "epoch": 308} {"train_loss": -18.3254451751709, "global_step": 25630, "epoch": 308} {"train_loss": -18.46592903137207, "global_step": 25631, "epoch": 308} {"train_loss": -18.713266372680664, "global_step": 25632, "epoch": 308} {"train_loss": -18.417314529418945, "global_step": 25633, "epoch": 308} {"train_loss": -18.184478759765625, "global_step": 25634, "epoch": 308} {"train_loss": -18.467214584350586, "global_step": 25635, "epoch": 308} {"train_loss": -18.995967864990234, "global_step": 25636, "epoch": 308} {"train_loss": -18.87790298461914, "global_step": 25637, "epoch": 308} {"train_loss": -18.445693969726562, "global_step": 25638, "epoch": 308} {"train_loss": -18.66850471496582, "global_step": 25639, "epoch": 308} {"train_loss": -18.38846778869629, "global_step": 25640, "epoch": 308} {"train_loss": -18.69624900817871, "global_step": 25641, "epoch": 308} {"train_loss": -18.909168243408203, "global_step": 25642, "epoch": 308} {"train_loss": -18.896682739257812, "global_step": 25643, "epoch": 308} {"train_loss": -18.95990562438965, "global_step": 25644, "epoch": 308} {"train_loss": -18.92453384399414, "global_step": 25645, "epoch": 308} {"train_loss": -18.725141088646577, "global_step": 25646, "epoch": 308, "val_loss": 5919607.5} {"train_loss": -18.603179931640625, "global_step": 25647, "epoch": 309} {"train_loss": -18.210447311401367, "global_step": 25648, "epoch": 309} {"train_loss": -18.97709083557129, "global_step": 25649, "epoch": 309} {"train_loss": -18.642684936523438, "global_step": 25650, "epoch": 309} {"train_loss": -18.498207092285156, "global_step": 25651, "epoch": 309} {"train_loss": -18.694442749023438, "global_step": 25652, "epoch": 309} {"train_loss": -18.754362106323242, "global_step": 25653, "epoch": 309} {"train_loss": -18.32710075378418, "global_step": 25654, "epoch": 309} {"train_loss": -18.70343017578125, "global_step": 25655, "epoch": 309} {"train_loss": -18.598247528076172, "global_step": 25656, "epoch": 309} {"train_loss": -18.52652359008789, "global_step": 25657, "epoch": 309} {"train_loss": -18.763647079467773, "global_step": 25658, "epoch": 309} {"train_loss": -18.388168334960938, "global_step": 25659, "epoch": 309} {"train_loss": -18.604169845581055, "global_step": 25660, "epoch": 309} {"train_loss": -18.687198638916016, "global_step": 25661, "epoch": 309} {"train_loss": -18.90887451171875, "global_step": 25662, "epoch": 309} {"train_loss": -18.509775161743164, "global_step": 25663, "epoch": 309} {"train_loss": -18.603361129760742, "global_step": 25664, "epoch": 309} {"train_loss": -18.647789001464844, "global_step": 25665, "epoch": 309} {"train_loss": -18.917858123779297, "global_step": 25666, "epoch": 309} {"train_loss": -19.022354125976562, "global_step": 25667, "epoch": 309} {"train_loss": -18.71280860900879, "global_step": 25668, "epoch": 309} {"train_loss": -18.99704933166504, "global_step": 25669, "epoch": 309} {"train_loss": -18.446578979492188, "global_step": 25670, "epoch": 309} {"train_loss": -18.588449478149414, "global_step": 25671, "epoch": 309} {"train_loss": -19.1027889251709, "global_step": 25672, "epoch": 309} {"train_loss": -19.058176040649414, "global_step": 25673, "epoch": 309} {"train_loss": -19.027088165283203, "global_step": 25674, "epoch": 309} {"train_loss": -18.483440399169922, "global_step": 25675, "epoch": 309} {"train_loss": -18.75809669494629, "global_step": 25676, "epoch": 309} {"train_loss": -18.707304000854492, "global_step": 25677, "epoch": 309} {"train_loss": -18.313161849975586, "global_step": 25678, "epoch": 309} {"train_loss": -18.363008499145508, "global_step": 25679, "epoch": 309} {"train_loss": -18.554244995117188, "global_step": 25680, "epoch": 309} {"train_loss": -18.74156379699707, "global_step": 25681, "epoch": 309} {"train_loss": -18.574615478515625, "global_step": 25682, "epoch": 309} {"train_loss": -18.90504264831543, "global_step": 25683, "epoch": 309} {"train_loss": -18.600364685058594, "global_step": 25684, "epoch": 309} {"train_loss": -18.941627502441406, "global_step": 25685, "epoch": 309} {"train_loss": -18.797576904296875, "global_step": 25686, "epoch": 309} {"train_loss": -19.09683609008789, "global_step": 25687, "epoch": 309} {"train_loss": -18.87714195251465, "global_step": 25688, "epoch": 309} {"train_loss": -18.83052635192871, "global_step": 25689, "epoch": 309} {"train_loss": -18.614288330078125, "global_step": 25690, "epoch": 309} {"train_loss": -18.939775466918945, "global_step": 25691, "epoch": 309} {"train_loss": -18.4483585357666, "global_step": 25692, "epoch": 309} {"train_loss": -18.619070053100586, "global_step": 25693, "epoch": 309} {"train_loss": -18.36433982849121, "global_step": 25694, "epoch": 309} {"train_loss": -18.91620445251465, "global_step": 25695, "epoch": 309} {"train_loss": -18.603912353515625, "global_step": 25696, "epoch": 309} {"train_loss": -18.596830368041992, "global_step": 25697, "epoch": 309} {"train_loss": -18.694644927978516, "global_step": 25698, "epoch": 309} {"train_loss": -18.991037368774414, "global_step": 25699, "epoch": 309} {"train_loss": -18.322072982788086, "global_step": 25700, "epoch": 309} {"train_loss": -18.98518180847168, "global_step": 25701, "epoch": 309} {"train_loss": -18.402841567993164, "global_step": 25702, "epoch": 309} {"train_loss": -18.81294059753418, "global_step": 25703, "epoch": 309} {"train_loss": -18.26186180114746, "global_step": 25704, "epoch": 309} {"train_loss": -18.89150047302246, "global_step": 25705, "epoch": 309} {"train_loss": -18.5236873626709, "global_step": 25706, "epoch": 309} {"train_loss": -19.15459632873535, "global_step": 25707, "epoch": 309} {"train_loss": -18.70021629333496, "global_step": 25708, "epoch": 309} {"train_loss": -18.57088279724121, "global_step": 25709, "epoch": 309} {"train_loss": -18.54550552368164, "global_step": 25710, "epoch": 309} {"train_loss": -18.457447052001953, "global_step": 25711, "epoch": 309} {"train_loss": -18.674104690551758, "global_step": 25712, "epoch": 309} {"train_loss": -18.197301864624023, "global_step": 25713, "epoch": 309} {"train_loss": -19.012428283691406, "global_step": 25714, "epoch": 309} {"train_loss": -19.019437789916992, "global_step": 25715, "epoch": 309} {"train_loss": -18.650312423706055, "global_step": 25716, "epoch": 309} {"train_loss": -18.80245018005371, "global_step": 25717, "epoch": 309} {"train_loss": -18.809513092041016, "global_step": 25718, "epoch": 309} {"train_loss": -18.60636329650879, "global_step": 25719, "epoch": 309} {"train_loss": -19.023027420043945, "global_step": 25720, "epoch": 309} {"train_loss": -18.720090866088867, "global_step": 25721, "epoch": 309} {"train_loss": -18.817724227905273, "global_step": 25722, "epoch": 309} {"train_loss": -18.804197311401367, "global_step": 25723, "epoch": 309} {"train_loss": -18.6778507232666, "global_step": 25724, "epoch": 309} {"train_loss": -18.696203231811523, "global_step": 25725, "epoch": 309} {"train_loss": -18.797407150268555, "global_step": 25726, "epoch": 309} {"train_loss": -18.18861198425293, "global_step": 25727, "epoch": 309} {"train_loss": -18.566625595092773, "global_step": 25728, "epoch": 309} {"train_loss": -18.68573273808123, "global_step": 25729, "epoch": 309, "val_loss": 5937231.0} {"train_loss": -18.619844436645508, "global_step": 25730, "epoch": 310} {"train_loss": -18.35333824157715, "global_step": 25731, "epoch": 310} {"train_loss": -18.83048439025879, "global_step": 25732, "epoch": 310} {"train_loss": -18.604063034057617, "global_step": 25733, "epoch": 310} {"train_loss": -18.604644775390625, "global_step": 25734, "epoch": 310} {"train_loss": -18.612266540527344, "global_step": 25735, "epoch": 310} {"train_loss": -18.80428123474121, "global_step": 25736, "epoch": 310} {"train_loss": -18.454158782958984, "global_step": 25737, "epoch": 310} {"train_loss": -18.78969383239746, "global_step": 25738, "epoch": 310} {"train_loss": -19.01225471496582, "global_step": 25739, "epoch": 310} {"train_loss": -18.827035903930664, "global_step": 25740, "epoch": 310} {"train_loss": -18.74442481994629, "global_step": 25741, "epoch": 310} {"train_loss": -18.391433715820312, "global_step": 25742, "epoch": 310} {"train_loss": -18.28866195678711, "global_step": 25743, "epoch": 310} {"train_loss": -18.431909561157227, "global_step": 25744, "epoch": 310} {"train_loss": -18.93666648864746, "global_step": 25745, "epoch": 310} {"train_loss": -18.84229850769043, "global_step": 25746, "epoch": 310} {"train_loss": -18.59418296813965, "global_step": 25747, "epoch": 310} {"train_loss": -18.589670181274414, "global_step": 25748, "epoch": 310} {"train_loss": -18.46603012084961, "global_step": 25749, "epoch": 310} {"train_loss": -18.945110321044922, "global_step": 25750, "epoch": 310} {"train_loss": -18.808942794799805, "global_step": 25751, "epoch": 310} {"train_loss": -18.85853385925293, "global_step": 25752, "epoch": 310} {"train_loss": -18.739715576171875, "global_step": 25753, "epoch": 310} {"train_loss": -18.504133224487305, "global_step": 25754, "epoch": 310} {"train_loss": -18.656126022338867, "global_step": 25755, "epoch": 310} {"train_loss": -18.57731056213379, "global_step": 25756, "epoch": 310} {"train_loss": -18.87322998046875, "global_step": 25757, "epoch": 310} {"train_loss": -18.514951705932617, "global_step": 25758, "epoch": 310} {"train_loss": -18.555023193359375, "global_step": 25759, "epoch": 310} {"train_loss": -18.859848022460938, "global_step": 25760, "epoch": 310} {"train_loss": -18.639616012573242, "global_step": 25761, "epoch": 310} {"train_loss": -18.484960556030273, "global_step": 25762, "epoch": 310} {"train_loss": -18.6712589263916, "global_step": 25763, "epoch": 310} {"train_loss": -18.57142448425293, "global_step": 25764, "epoch": 310} {"train_loss": -19.061237335205078, "global_step": 25765, "epoch": 310} {"train_loss": -18.825550079345703, "global_step": 25766, "epoch": 310} {"train_loss": -18.748077392578125, "global_step": 25767, "epoch": 310} {"train_loss": -18.615690231323242, "global_step": 25768, "epoch": 310} {"train_loss": -18.694278717041016, "global_step": 25769, "epoch": 310} {"train_loss": -18.450166702270508, "global_step": 25770, "epoch": 310} {"train_loss": -18.477664947509766, "global_step": 25771, "epoch": 310} {"train_loss": -19.030302047729492, "global_step": 25772, "epoch": 310} {"train_loss": -18.64543342590332, "global_step": 25773, "epoch": 310} {"train_loss": -18.8901424407959, "global_step": 25774, "epoch": 310} {"train_loss": -18.489538192749023, "global_step": 25775, "epoch": 310} {"train_loss": -18.757856369018555, "global_step": 25776, "epoch": 310} {"train_loss": -18.724281311035156, "global_step": 25777, "epoch": 310} {"train_loss": -18.51625633239746, "global_step": 25778, "epoch": 310} {"train_loss": -19.082595825195312, "global_step": 25779, "epoch": 310} {"train_loss": -18.328166961669922, "global_step": 25780, "epoch": 310} {"train_loss": -18.649288177490234, "global_step": 25781, "epoch": 310} {"train_loss": -18.57733726501465, "global_step": 25782, "epoch": 310} {"train_loss": -18.462120056152344, "global_step": 25783, "epoch": 310} {"train_loss": -18.936241149902344, "global_step": 25784, "epoch": 310} {"train_loss": -18.720258712768555, "global_step": 25785, "epoch": 310} {"train_loss": -18.82563591003418, "global_step": 25786, "epoch": 310} {"train_loss": -18.791364669799805, "global_step": 25787, "epoch": 310} {"train_loss": -18.79017448425293, "global_step": 25788, "epoch": 310} {"train_loss": -18.73340606689453, "global_step": 25789, "epoch": 310} {"train_loss": -18.469776153564453, "global_step": 25790, "epoch": 310} {"train_loss": -18.52569007873535, "global_step": 25791, "epoch": 310} {"train_loss": -18.58949089050293, "global_step": 25792, "epoch": 310} {"train_loss": -19.042694091796875, "global_step": 25793, "epoch": 310} {"train_loss": -18.95358657836914, "global_step": 25794, "epoch": 310} {"train_loss": -18.597780227661133, "global_step": 25795, "epoch": 310} {"train_loss": -18.827865600585938, "global_step": 25796, "epoch": 310} {"train_loss": -18.596038818359375, "global_step": 25797, "epoch": 310} {"train_loss": -18.9664363861084, "global_step": 25798, "epoch": 310} {"train_loss": -18.347299575805664, "global_step": 25799, "epoch": 310} {"train_loss": -18.501941680908203, "global_step": 25800, "epoch": 310} {"train_loss": -18.64139175415039, "global_step": 25801, "epoch": 310} {"train_loss": -19.075439453125, "global_step": 25802, "epoch": 310} {"train_loss": -19.20400047302246, "global_step": 25803, "epoch": 310} {"train_loss": -18.760316848754883, "global_step": 25804, "epoch": 310} {"train_loss": -18.43191146850586, "global_step": 25805, "epoch": 310} {"train_loss": -18.84055519104004, "global_step": 25806, "epoch": 310} {"train_loss": -19.127853393554688, "global_step": 25807, "epoch": 310} {"train_loss": -18.331031799316406, "global_step": 25808, "epoch": 310} {"train_loss": -19.125295639038086, "global_step": 25809, "epoch": 310} {"train_loss": -18.84907341003418, "global_step": 25810, "epoch": 310} {"train_loss": -18.773456573486328, "global_step": 25811, "epoch": 310} {"train_loss": -18.71607883867011, "global_step": 25812, "epoch": 310, "val_loss": 5970803.0} {"train_loss": -18.668203353881836, "global_step": 25813, "epoch": 311} {"train_loss": -18.76450538635254, "global_step": 25814, "epoch": 311} {"train_loss": -19.08522605895996, "global_step": 25815, "epoch": 311} {"train_loss": -18.436525344848633, "global_step": 25816, "epoch": 311} {"train_loss": -18.685436248779297, "global_step": 25817, "epoch": 311} {"train_loss": -18.62495231628418, "global_step": 25818, "epoch": 311} {"train_loss": -18.48242950439453, "global_step": 25819, "epoch": 311} {"train_loss": -18.51138687133789, "global_step": 25820, "epoch": 311} {"train_loss": -19.17058753967285, "global_step": 25821, "epoch": 311} {"train_loss": -18.73824691772461, "global_step": 25822, "epoch": 311} {"train_loss": -18.587976455688477, "global_step": 25823, "epoch": 311} {"train_loss": -18.265073776245117, "global_step": 25824, "epoch": 311} {"train_loss": -19.166330337524414, "global_step": 25825, "epoch": 311} {"train_loss": -18.829492568969727, "global_step": 25826, "epoch": 311} {"train_loss": -18.765501022338867, "global_step": 25827, "epoch": 311} {"train_loss": -18.629682540893555, "global_step": 25828, "epoch": 311} {"train_loss": -18.697813034057617, "global_step": 25829, "epoch": 311} {"train_loss": -18.65985679626465, "global_step": 25830, "epoch": 311} {"train_loss": -18.740184783935547, "global_step": 25831, "epoch": 311} {"train_loss": -18.7659912109375, "global_step": 25832, "epoch": 311} {"train_loss": -18.70271110534668, "global_step": 25833, "epoch": 311} {"train_loss": -18.464492797851562, "global_step": 25834, "epoch": 311} {"train_loss": -18.609169006347656, "global_step": 25835, "epoch": 311} {"train_loss": -18.649127960205078, "global_step": 25836, "epoch": 311} {"train_loss": -18.824800491333008, "global_step": 25837, "epoch": 311} {"train_loss": -18.962087631225586, "global_step": 25838, "epoch": 311} {"train_loss": -18.741846084594727, "global_step": 25839, "epoch": 311} {"train_loss": -18.239871978759766, "global_step": 25840, "epoch": 311} {"train_loss": -18.424692153930664, "global_step": 25841, "epoch": 311} {"train_loss": -18.873214721679688, "global_step": 25842, "epoch": 311} {"train_loss": -18.31855583190918, "global_step": 25843, "epoch": 311} {"train_loss": -18.84865379333496, "global_step": 25844, "epoch": 311} {"train_loss": -18.22512435913086, "global_step": 25845, "epoch": 311} {"train_loss": -18.96904945373535, "global_step": 25846, "epoch": 311} {"train_loss": -18.479665756225586, "global_step": 25847, "epoch": 311} {"train_loss": -18.458362579345703, "global_step": 25848, "epoch": 311} {"train_loss": -19.137454986572266, "global_step": 25849, "epoch": 311} {"train_loss": -18.34864044189453, "global_step": 25850, "epoch": 311} {"train_loss": -18.8402099609375, "global_step": 25851, "epoch": 311} {"train_loss": -18.606975555419922, "global_step": 25852, "epoch": 311} {"train_loss": -18.726543426513672, "global_step": 25853, "epoch": 311} {"train_loss": -18.72064781188965, "global_step": 25854, "epoch": 311} {"train_loss": -18.655073165893555, "global_step": 25855, "epoch": 311} {"train_loss": -18.751813888549805, "global_step": 25856, "epoch": 311} {"train_loss": -18.55501365661621, "global_step": 25857, "epoch": 311} {"train_loss": -18.480390548706055, "global_step": 25858, "epoch": 311} {"train_loss": -18.61167335510254, "global_step": 25859, "epoch": 311} {"train_loss": -18.906036376953125, "global_step": 25860, "epoch": 311} {"train_loss": -18.952316284179688, "global_step": 25861, "epoch": 311} {"train_loss": -18.58304214477539, "global_step": 25862, "epoch": 311} {"train_loss": -18.308786392211914, "global_step": 25863, "epoch": 311} {"train_loss": -18.84559440612793, "global_step": 25864, "epoch": 311} {"train_loss": -18.553730010986328, "global_step": 25865, "epoch": 311} {"train_loss": -18.589242935180664, "global_step": 25866, "epoch": 311} {"train_loss": -19.02493667602539, "global_step": 25867, "epoch": 311} {"train_loss": -18.578840255737305, "global_step": 25868, "epoch": 311} {"train_loss": -18.8479061126709, "global_step": 25869, "epoch": 311} {"train_loss": -18.29757308959961, "global_step": 25870, "epoch": 311} {"train_loss": -18.76265525817871, "global_step": 25871, "epoch": 311} {"train_loss": -18.955320358276367, "global_step": 25872, "epoch": 311} {"train_loss": -18.475032806396484, "global_step": 25873, "epoch": 311} {"train_loss": -18.837833404541016, "global_step": 25874, "epoch": 311} {"train_loss": -18.690237045288086, "global_step": 25875, "epoch": 311} {"train_loss": -18.6458740234375, "global_step": 25876, "epoch": 311} {"train_loss": -18.358905792236328, "global_step": 25877, "epoch": 311} {"train_loss": -18.76186752319336, "global_step": 25878, "epoch": 311} {"train_loss": -19.018583297729492, "global_step": 25879, "epoch": 311} {"train_loss": -18.737428665161133, "global_step": 25880, "epoch": 311} {"train_loss": -18.76388931274414, "global_step": 25881, "epoch": 311} {"train_loss": -18.930448532104492, "global_step": 25882, "epoch": 311} {"train_loss": -18.422657012939453, "global_step": 25883, "epoch": 311} {"train_loss": -18.93288230895996, "global_step": 25884, "epoch": 311} {"train_loss": -18.681049346923828, "global_step": 25885, "epoch": 311} {"train_loss": -19.030935287475586, "global_step": 25886, "epoch": 311} {"train_loss": -19.058307647705078, "global_step": 25887, "epoch": 311} {"train_loss": -18.721511840820312, "global_step": 25888, "epoch": 311} {"train_loss": -18.62458610534668, "global_step": 25889, "epoch": 311} {"train_loss": -19.019140243530273, "global_step": 25890, "epoch": 311} {"train_loss": -18.51114273071289, "global_step": 25891, "epoch": 311} {"train_loss": -18.750181198120117, "global_step": 25892, "epoch": 311} {"train_loss": -18.759065628051758, "global_step": 25893, "epoch": 311} {"train_loss": -18.852306365966797, "global_step": 25894, "epoch": 311} {"train_loss": -18.715602621974714, "global_step": 25895, "epoch": 311, "val_loss": 5893813.0} {"train_loss": -18.60458755493164, "global_step": 25896, "epoch": 312} {"train_loss": -18.52854347229004, "global_step": 25897, "epoch": 312} {"train_loss": -18.847118377685547, "global_step": 25898, "epoch": 312} {"train_loss": -18.797273635864258, "global_step": 25899, "epoch": 312} {"train_loss": -18.75361442565918, "global_step": 25900, "epoch": 312} {"train_loss": -18.62806510925293, "global_step": 25901, "epoch": 312} {"train_loss": -18.875045776367188, "global_step": 25902, "epoch": 312} {"train_loss": -18.766515731811523, "global_step": 25903, "epoch": 312} {"train_loss": -18.428464889526367, "global_step": 25904, "epoch": 312} {"train_loss": -18.82551383972168, "global_step": 25905, "epoch": 312} {"train_loss": -18.777307510375977, "global_step": 25906, "epoch": 312} {"train_loss": -18.523012161254883, "global_step": 25907, "epoch": 312} {"train_loss": -18.829309463500977, "global_step": 25908, "epoch": 312} {"train_loss": -18.394887924194336, "global_step": 25909, "epoch": 312} {"train_loss": -18.935028076171875, "global_step": 25910, "epoch": 312} {"train_loss": -18.535419464111328, "global_step": 25911, "epoch": 312} {"train_loss": -19.005413055419922, "global_step": 25912, "epoch": 312} {"train_loss": -18.559240341186523, "global_step": 25913, "epoch": 312} {"train_loss": -18.625686645507812, "global_step": 25914, "epoch": 312} {"train_loss": -18.516265869140625, "global_step": 25915, "epoch": 312} {"train_loss": -18.44574546813965, "global_step": 25916, "epoch": 312} {"train_loss": -18.945751190185547, "global_step": 25917, "epoch": 312} {"train_loss": -18.68277931213379, "global_step": 25918, "epoch": 312} {"train_loss": -18.970199584960938, "global_step": 25919, "epoch": 312} {"train_loss": -19.06156349182129, "global_step": 25920, "epoch": 312} {"train_loss": -18.62017822265625, "global_step": 25921, "epoch": 312} {"train_loss": -18.484603881835938, "global_step": 25922, "epoch": 312} {"train_loss": -18.887781143188477, "global_step": 25923, "epoch": 312} {"train_loss": -18.642671585083008, "global_step": 25924, "epoch": 312} {"train_loss": -18.70054817199707, "global_step": 25925, "epoch": 312} {"train_loss": -18.473241806030273, "global_step": 25926, "epoch": 312} {"train_loss": -18.344219207763672, "global_step": 25927, "epoch": 312} {"train_loss": -19.160194396972656, "global_step": 25928, "epoch": 312} {"train_loss": -18.563610076904297, "global_step": 25929, "epoch": 312} {"train_loss": -19.01825523376465, "global_step": 25930, "epoch": 312} {"train_loss": -18.63849449157715, "global_step": 25931, "epoch": 312} {"train_loss": -18.73420524597168, "global_step": 25932, "epoch": 312} {"train_loss": -18.79081916809082, "global_step": 25933, "epoch": 312} {"train_loss": -18.95271110534668, "global_step": 25934, "epoch": 312} {"train_loss": -18.84928321838379, "global_step": 25935, "epoch": 312} {"train_loss": -19.04188346862793, "global_step": 25936, "epoch": 312} {"train_loss": -18.875240325927734, "global_step": 25937, "epoch": 312} {"train_loss": -18.666584014892578, "global_step": 25938, "epoch": 312} {"train_loss": -18.53309440612793, "global_step": 25939, "epoch": 312} {"train_loss": -18.629735946655273, "global_step": 25940, "epoch": 312} {"train_loss": -18.52463150024414, "global_step": 25941, "epoch": 312} {"train_loss": -18.639406204223633, "global_step": 25942, "epoch": 312} {"train_loss": -18.77876091003418, "global_step": 25943, "epoch": 312} {"train_loss": -18.604080200195312, "global_step": 25944, "epoch": 312} {"train_loss": -18.415922164916992, "global_step": 25945, "epoch": 312} {"train_loss": -18.88094139099121, "global_step": 25946, "epoch": 312} {"train_loss": -18.554113388061523, "global_step": 25947, "epoch": 312} {"train_loss": -18.665494918823242, "global_step": 25948, "epoch": 312} {"train_loss": -18.564950942993164, "global_step": 25949, "epoch": 312} {"train_loss": -18.90851402282715, "global_step": 25950, "epoch": 312} {"train_loss": -18.54181480407715, "global_step": 25951, "epoch": 312} {"train_loss": -18.800765991210938, "global_step": 25952, "epoch": 312} {"train_loss": -18.917936325073242, "global_step": 25953, "epoch": 312} {"train_loss": -18.6689453125, "global_step": 25954, "epoch": 312} {"train_loss": -18.73137855529785, "global_step": 25955, "epoch": 312} {"train_loss": -18.759681701660156, "global_step": 25956, "epoch": 312} {"train_loss": -18.545059204101562, "global_step": 25957, "epoch": 312} {"train_loss": -18.710386276245117, "global_step": 25958, "epoch": 312} {"train_loss": -18.864479064941406, "global_step": 25959, "epoch": 312} {"train_loss": -18.789255142211914, "global_step": 25960, "epoch": 312} {"train_loss": -18.773983001708984, "global_step": 25961, "epoch": 312} {"train_loss": -18.515417098999023, "global_step": 25962, "epoch": 312} {"train_loss": -18.695220947265625, "global_step": 25963, "epoch": 312} {"train_loss": -18.88559913635254, "global_step": 25964, "epoch": 312} {"train_loss": -18.737016677856445, "global_step": 25965, "epoch": 312} {"train_loss": -18.66861915588379, "global_step": 25966, "epoch": 312} {"train_loss": -18.816349029541016, "global_step": 25967, "epoch": 312} {"train_loss": -18.91514015197754, "global_step": 25968, "epoch": 312} {"train_loss": -18.771814346313477, "global_step": 25969, "epoch": 312} {"train_loss": -18.895540237426758, "global_step": 25970, "epoch": 312} {"train_loss": -19.182453155517578, "global_step": 25971, "epoch": 312} {"train_loss": -18.80988883972168, "global_step": 25972, "epoch": 312} {"train_loss": -18.82452392578125, "global_step": 25973, "epoch": 312} {"train_loss": -18.622655868530273, "global_step": 25974, "epoch": 312} {"train_loss": -18.77081871032715, "global_step": 25975, "epoch": 312} {"train_loss": -19.149343490600586, "global_step": 25976, "epoch": 312} {"train_loss": -18.887195587158203, "global_step": 25977, "epoch": 312} {"train_loss": -18.740408380347564, "global_step": 25978, "epoch": 312, "val_loss": 6116896.0} {"train_loss": -18.779361724853516, "global_step": 25979, "epoch": 313} {"train_loss": -19.069883346557617, "global_step": 25980, "epoch": 313} {"train_loss": -18.381484985351562, "global_step": 25981, "epoch": 313} {"train_loss": -19.063352584838867, "global_step": 25982, "epoch": 313} {"train_loss": -18.705446243286133, "global_step": 25983, "epoch": 313} {"train_loss": -18.503515243530273, "global_step": 25984, "epoch": 313} {"train_loss": -18.832881927490234, "global_step": 25985, "epoch": 313} {"train_loss": -18.903371810913086, "global_step": 25986, "epoch": 313} {"train_loss": -18.466588973999023, "global_step": 25987, "epoch": 313} {"train_loss": -18.622617721557617, "global_step": 25988, "epoch": 313} {"train_loss": -18.841983795166016, "global_step": 25989, "epoch": 313} {"train_loss": -18.463565826416016, "global_step": 25990, "epoch": 313} {"train_loss": -18.915098190307617, "global_step": 25991, "epoch": 313} {"train_loss": -19.02490234375, "global_step": 25992, "epoch": 313} {"train_loss": -18.42661476135254, "global_step": 25993, "epoch": 313} {"train_loss": -18.724018096923828, "global_step": 25994, "epoch": 313} {"train_loss": -18.862062454223633, "global_step": 25995, "epoch": 313} {"train_loss": -18.672588348388672, "global_step": 25996, "epoch": 313} {"train_loss": -18.812454223632812, "global_step": 25997, "epoch": 313} {"train_loss": -18.516233444213867, "global_step": 25998, "epoch": 313} {"train_loss": -18.51976776123047, "global_step": 25999, "epoch": 313} {"train_loss": -18.950960159301758, "global_step": 26000, "epoch": 313} {"train_loss": -18.55903434753418, "global_step": 26001, "epoch": 313} {"train_loss": -18.8582820892334, "global_step": 26002, "epoch": 313} {"train_loss": -18.711380004882812, "global_step": 26003, "epoch": 313} {"train_loss": -18.75179100036621, "global_step": 26004, "epoch": 313} {"train_loss": -18.588659286499023, "global_step": 26005, "epoch": 313} {"train_loss": -18.371793746948242, "global_step": 26006, "epoch": 313} {"train_loss": -18.59588050842285, "global_step": 26007, "epoch": 313} {"train_loss": -18.711938858032227, "global_step": 26008, "epoch": 313} {"train_loss": -18.611881256103516, "global_step": 26009, "epoch": 313} {"train_loss": -18.47564125061035, "global_step": 26010, "epoch": 313} {"train_loss": -18.48101806640625, "global_step": 26011, "epoch": 313} {"train_loss": -18.39246940612793, "global_step": 26012, "epoch": 313} {"train_loss": -18.363859176635742, "global_step": 26013, "epoch": 313} {"train_loss": -18.94722557067871, "global_step": 26014, "epoch": 313} {"train_loss": -18.829303741455078, "global_step": 26015, "epoch": 313} {"train_loss": -18.756433486938477, "global_step": 26016, "epoch": 313} {"train_loss": -19.163049697875977, "global_step": 26017, "epoch": 313} {"train_loss": -18.77521324157715, "global_step": 26018, "epoch": 313} {"train_loss": -19.118484497070312, "global_step": 26019, "epoch": 313} {"train_loss": -18.504919052124023, "global_step": 26020, "epoch": 313} {"train_loss": -19.051694869995117, "global_step": 26021, "epoch": 313} {"train_loss": -18.719837188720703, "global_step": 26022, "epoch": 313} {"train_loss": -18.38542366027832, "global_step": 26023, "epoch": 313} {"train_loss": -18.683767318725586, "global_step": 26024, "epoch": 313} {"train_loss": -19.054813385009766, "global_step": 26025, "epoch": 313} {"train_loss": -18.690750122070312, "global_step": 26026, "epoch": 313} {"train_loss": -18.52949333190918, "global_step": 26027, "epoch": 313} {"train_loss": -18.92530632019043, "global_step": 26028, "epoch": 313} {"train_loss": -18.868927001953125, "global_step": 26029, "epoch": 313} {"train_loss": -18.526090621948242, "global_step": 26030, "epoch": 313} {"train_loss": -18.769630432128906, "global_step": 26031, "epoch": 313} {"train_loss": -18.899940490722656, "global_step": 26032, "epoch": 313} {"train_loss": -18.546232223510742, "global_step": 26033, "epoch": 313} {"train_loss": -18.45158576965332, "global_step": 26034, "epoch": 313} {"train_loss": -18.816476821899414, "global_step": 26035, "epoch": 313} {"train_loss": -18.65921974182129, "global_step": 26036, "epoch": 313} {"train_loss": -18.717891693115234, "global_step": 26037, "epoch": 313} {"train_loss": -18.530088424682617, "global_step": 26038, "epoch": 313} {"train_loss": -18.862804412841797, "global_step": 26039, "epoch": 313} {"train_loss": -18.308929443359375, "global_step": 26040, "epoch": 313} {"train_loss": -19.103654861450195, "global_step": 26041, "epoch": 313} {"train_loss": -18.70802879333496, "global_step": 26042, "epoch": 313} {"train_loss": -18.860502243041992, "global_step": 26043, "epoch": 313} {"train_loss": -19.390867233276367, "global_step": 26044, "epoch": 313} {"train_loss": -18.99118423461914, "global_step": 26045, "epoch": 313} {"train_loss": -18.701980590820312, "global_step": 26046, "epoch": 313} {"train_loss": -18.829885482788086, "global_step": 26047, "epoch": 313} {"train_loss": -18.667545318603516, "global_step": 26048, "epoch": 313} {"train_loss": -18.603954315185547, "global_step": 26049, "epoch": 313} {"train_loss": -18.646747589111328, "global_step": 26050, "epoch": 313} {"train_loss": -18.346662521362305, "global_step": 26051, "epoch": 313} {"train_loss": -18.579492568969727, "global_step": 26052, "epoch": 313} {"train_loss": -18.587329864501953, "global_step": 26053, "epoch": 313} {"train_loss": -18.833425521850586, "global_step": 26054, "epoch": 313} {"train_loss": -18.784133911132812, "global_step": 26055, "epoch": 313} {"train_loss": -18.94480323791504, "global_step": 26056, "epoch": 313} {"train_loss": -18.564361572265625, "global_step": 26057, "epoch": 313} {"train_loss": -18.7923641204834, "global_step": 26058, "epoch": 313} {"train_loss": -18.5646915435791, "global_step": 26059, "epoch": 313} {"train_loss": -18.507831573486328, "global_step": 26060, "epoch": 313} {"train_loss": -18.704399752329632, "global_step": 26061, "epoch": 313, "val_loss": 6076092.0} {"train_loss": -17.763690948486328, "global_step": 26062, "epoch": 314} {"train_loss": -18.185453414916992, "global_step": 26063, "epoch": 314} {"train_loss": -18.75336456298828, "global_step": 26064, "epoch": 314} {"train_loss": -18.2929630279541, "global_step": 26065, "epoch": 314} {"train_loss": -18.287355422973633, "global_step": 26066, "epoch": 314} {"train_loss": -18.528213500976562, "global_step": 26067, "epoch": 314} {"train_loss": -18.72408103942871, "global_step": 26068, "epoch": 314} {"train_loss": -18.294334411621094, "global_step": 26069, "epoch": 314} {"train_loss": -18.715002059936523, "global_step": 26070, "epoch": 314} {"train_loss": -18.417387008666992, "global_step": 26071, "epoch": 314} {"train_loss": -18.622024536132812, "global_step": 26072, "epoch": 314} {"train_loss": -18.580480575561523, "global_step": 26073, "epoch": 314} {"train_loss": -18.734106063842773, "global_step": 26074, "epoch": 314} {"train_loss": -18.961462020874023, "global_step": 26075, "epoch": 314} {"train_loss": -18.941024780273438, "global_step": 26076, "epoch": 314} {"train_loss": -18.861465454101562, "global_step": 26077, "epoch": 314} {"train_loss": -18.412084579467773, "global_step": 26078, "epoch": 314} {"train_loss": -18.77862548828125, "global_step": 26079, "epoch": 314} {"train_loss": -19.120325088500977, "global_step": 26080, "epoch": 314} {"train_loss": -18.802631378173828, "global_step": 26081, "epoch": 314} {"train_loss": -18.655935287475586, "global_step": 26082, "epoch": 314} {"train_loss": -18.661331176757812, "global_step": 26083, "epoch": 314} {"train_loss": -18.847091674804688, "global_step": 26084, "epoch": 314} {"train_loss": -18.98464584350586, "global_step": 26085, "epoch": 314} {"train_loss": -18.212127685546875, "global_step": 26086, "epoch": 314} {"train_loss": -18.571020126342773, "global_step": 26087, "epoch": 314} {"train_loss": -18.875574111938477, "global_step": 26088, "epoch": 314} {"train_loss": -18.962411880493164, "global_step": 26089, "epoch": 314} {"train_loss": -18.275976181030273, "global_step": 26090, "epoch": 314} {"train_loss": -18.92535972595215, "global_step": 26091, "epoch": 314} {"train_loss": -18.72808265686035, "global_step": 26092, "epoch": 314} {"train_loss": -18.486352920532227, "global_step": 26093, "epoch": 314} {"train_loss": -18.745792388916016, "global_step": 26094, "epoch": 314} {"train_loss": -18.837989807128906, "global_step": 26095, "epoch": 314} {"train_loss": -18.507352828979492, "global_step": 26096, "epoch": 314} {"train_loss": -18.903419494628906, "global_step": 26097, "epoch": 314} {"train_loss": -18.374509811401367, "global_step": 26098, "epoch": 314} {"train_loss": -18.463056564331055, "global_step": 26099, "epoch": 314} {"train_loss": -18.822582244873047, "global_step": 26100, "epoch": 314} {"train_loss": -19.093244552612305, "global_step": 26101, "epoch": 314} {"train_loss": -19.078689575195312, "global_step": 26102, "epoch": 314} {"train_loss": -18.93607521057129, "global_step": 26103, "epoch": 314} {"train_loss": -18.5208683013916, "global_step": 26104, "epoch": 314} {"train_loss": -18.812347412109375, "global_step": 26105, "epoch": 314} {"train_loss": -18.73809242248535, "global_step": 26106, "epoch": 314} {"train_loss": -18.884845733642578, "global_step": 26107, "epoch": 314} {"train_loss": -18.949398040771484, "global_step": 26108, "epoch": 314} {"train_loss": -18.82685089111328, "global_step": 26109, "epoch": 314} {"train_loss": -18.79389190673828, "global_step": 26110, "epoch": 314} {"train_loss": -18.616575241088867, "global_step": 26111, "epoch": 314} {"train_loss": -19.14674186706543, "global_step": 26112, "epoch": 314} {"train_loss": -18.778135299682617, "global_step": 26113, "epoch": 314} {"train_loss": -19.052534103393555, "global_step": 26114, "epoch": 314} {"train_loss": -18.715124130249023, "global_step": 26115, "epoch": 314} {"train_loss": -18.46620750427246, "global_step": 26116, "epoch": 314} {"train_loss": -18.907751083374023, "global_step": 26117, "epoch": 314} {"train_loss": -18.230148315429688, "global_step": 26118, "epoch": 314} {"train_loss": -18.791784286499023, "global_step": 26119, "epoch": 314} {"train_loss": -18.8525447845459, "global_step": 26120, "epoch": 314} {"train_loss": -18.641841888427734, "global_step": 26121, "epoch": 314} {"train_loss": -18.771102905273438, "global_step": 26122, "epoch": 314} {"train_loss": -18.607324600219727, "global_step": 26123, "epoch": 314} {"train_loss": -19.040842056274414, "global_step": 26124, "epoch": 314} {"train_loss": -18.566099166870117, "global_step": 26125, "epoch": 314} {"train_loss": -18.512205123901367, "global_step": 26126, "epoch": 314} {"train_loss": -19.009201049804688, "global_step": 26127, "epoch": 314} {"train_loss": -18.503517150878906, "global_step": 26128, "epoch": 314} {"train_loss": -18.722684860229492, "global_step": 26129, "epoch": 314} {"train_loss": -18.742107391357422, "global_step": 26130, "epoch": 314} {"train_loss": -19.018274307250977, "global_step": 26131, "epoch": 314} {"train_loss": -18.772598266601562, "global_step": 26132, "epoch": 314} {"train_loss": -18.856658935546875, "global_step": 26133, "epoch": 314} {"train_loss": -18.894201278686523, "global_step": 26134, "epoch": 314} {"train_loss": -18.78290557861328, "global_step": 26135, "epoch": 314} {"train_loss": -18.84271812438965, "global_step": 26136, "epoch": 314} {"train_loss": -18.53961944580078, "global_step": 26137, "epoch": 314} {"train_loss": -18.636022567749023, "global_step": 26138, "epoch": 314} {"train_loss": -18.57529067993164, "global_step": 26139, "epoch": 314} {"train_loss": -18.994373321533203, "global_step": 26140, "epoch": 314} {"train_loss": -18.648984909057617, "global_step": 26141, "epoch": 314} {"train_loss": -19.116703033447266, "global_step": 26142, "epoch": 314} {"train_loss": -18.674833297729492, "global_step": 26143, "epoch": 314} {"train_loss": -18.721922656139697, "global_step": 26144, "epoch": 314, "val_loss": 5908010.0} {"train_loss": -18.766571044921875, "global_step": 26145, "epoch": 315} {"train_loss": -18.649778366088867, "global_step": 26146, "epoch": 315} {"train_loss": -18.977170944213867, "global_step": 26147, "epoch": 315} {"train_loss": -18.372406005859375, "global_step": 26148, "epoch": 315} {"train_loss": -18.85898208618164, "global_step": 26149, "epoch": 315} {"train_loss": -18.743322372436523, "global_step": 26150, "epoch": 315} {"train_loss": -18.827123641967773, "global_step": 26151, "epoch": 315} {"train_loss": -18.762222290039062, "global_step": 26152, "epoch": 315} {"train_loss": -19.026123046875, "global_step": 26153, "epoch": 315} {"train_loss": -18.661054611206055, "global_step": 26154, "epoch": 315} {"train_loss": -18.8898868560791, "global_step": 26155, "epoch": 315} {"train_loss": -18.355024337768555, "global_step": 26156, "epoch": 315} {"train_loss": -19.023923873901367, "global_step": 26157, "epoch": 315} {"train_loss": -18.727773666381836, "global_step": 26158, "epoch": 315} {"train_loss": -18.838247299194336, "global_step": 26159, "epoch": 315} {"train_loss": -18.54425048828125, "global_step": 26160, "epoch": 315} {"train_loss": -18.901782989501953, "global_step": 26161, "epoch": 315} {"train_loss": -18.4278564453125, "global_step": 26162, "epoch": 315} {"train_loss": -18.6766414642334, "global_step": 26163, "epoch": 315} {"train_loss": -18.90616798400879, "global_step": 26164, "epoch": 315} {"train_loss": -18.721532821655273, "global_step": 26165, "epoch": 315} {"train_loss": -18.794401168823242, "global_step": 26166, "epoch": 315} {"train_loss": -18.78761863708496, "global_step": 26167, "epoch": 315} {"train_loss": -18.80387306213379, "global_step": 26168, "epoch": 315} {"train_loss": -18.56266212463379, "global_step": 26169, "epoch": 315} {"train_loss": -18.84781837463379, "global_step": 26170, "epoch": 315} {"train_loss": -18.582000732421875, "global_step": 26171, "epoch": 315} {"train_loss": -18.591421127319336, "global_step": 26172, "epoch": 315} {"train_loss": -19.308547973632812, "global_step": 26173, "epoch": 315} {"train_loss": -18.729928970336914, "global_step": 26174, "epoch": 315} {"train_loss": -18.79823875427246, "global_step": 26175, "epoch": 315} {"train_loss": -18.79224395751953, "global_step": 26176, "epoch": 315} {"train_loss": -18.86041831970215, "global_step": 26177, "epoch": 315} {"train_loss": -18.4990291595459, "global_step": 26178, "epoch": 315} {"train_loss": -18.783658981323242, "global_step": 26179, "epoch": 315} {"train_loss": -19.14638328552246, "global_step": 26180, "epoch": 315} {"train_loss": -18.70212745666504, "global_step": 26181, "epoch": 315} {"train_loss": -18.940128326416016, "global_step": 26182, "epoch": 315} {"train_loss": -18.751920700073242, "global_step": 26183, "epoch": 315} {"train_loss": -18.57276725769043, "global_step": 26184, "epoch": 315} {"train_loss": -18.893110275268555, "global_step": 26185, "epoch": 315} {"train_loss": -18.62322235107422, "global_step": 26186, "epoch": 315} {"train_loss": -18.599903106689453, "global_step": 26187, "epoch": 315} {"train_loss": -18.380844116210938, "global_step": 26188, "epoch": 315} {"train_loss": -18.485885620117188, "global_step": 26189, "epoch": 315} {"train_loss": -18.653657913208008, "global_step": 26190, "epoch": 315} {"train_loss": -18.445619583129883, "global_step": 26191, "epoch": 315} {"train_loss": -18.45387077331543, "global_step": 26192, "epoch": 315} {"train_loss": -19.06829261779785, "global_step": 26193, "epoch": 315} {"train_loss": -18.678897857666016, "global_step": 26194, "epoch": 315} {"train_loss": -18.62062644958496, "global_step": 26195, "epoch": 315} {"train_loss": -18.3673095703125, "global_step": 26196, "epoch": 315} {"train_loss": -19.023700714111328, "global_step": 26197, "epoch": 315} {"train_loss": -18.962080001831055, "global_step": 26198, "epoch": 315} {"train_loss": -18.573577880859375, "global_step": 26199, "epoch": 315} {"train_loss": -18.808856964111328, "global_step": 26200, "epoch": 315} {"train_loss": -18.05257225036621, "global_step": 26201, "epoch": 315} {"train_loss": -19.026227951049805, "global_step": 26202, "epoch": 315} {"train_loss": -18.84024429321289, "global_step": 26203, "epoch": 315} {"train_loss": -19.19369888305664, "global_step": 26204, "epoch": 315} {"train_loss": -18.931791305541992, "global_step": 26205, "epoch": 315} {"train_loss": -18.8019962310791, "global_step": 26206, "epoch": 315} {"train_loss": -18.718839645385742, "global_step": 26207, "epoch": 315} {"train_loss": -18.415964126586914, "global_step": 26208, "epoch": 315} {"train_loss": -18.55449867248535, "global_step": 26209, "epoch": 315} {"train_loss": -18.771516799926758, "global_step": 26210, "epoch": 315} {"train_loss": -18.919727325439453, "global_step": 26211, "epoch": 315} {"train_loss": -18.697683334350586, "global_step": 26212, "epoch": 315} {"train_loss": -18.823415756225586, "global_step": 26213, "epoch": 315} {"train_loss": -18.710927963256836, "global_step": 26214, "epoch": 315} {"train_loss": -18.94611167907715, "global_step": 26215, "epoch": 315} {"train_loss": -18.41215705871582, "global_step": 26216, "epoch": 315} {"train_loss": -19.0958194732666, "global_step": 26217, "epoch": 315} {"train_loss": -18.563629150390625, "global_step": 26218, "epoch": 315} {"train_loss": -18.605710983276367, "global_step": 26219, "epoch": 315} {"train_loss": -18.77073860168457, "global_step": 26220, "epoch": 315} {"train_loss": -19.114667892456055, "global_step": 26221, "epoch": 315} {"train_loss": -18.930295944213867, "global_step": 26222, "epoch": 315} {"train_loss": -18.681049346923828, "global_step": 26223, "epoch": 315} {"train_loss": -18.552473068237305, "global_step": 26224, "epoch": 315} {"train_loss": -18.37828826904297, "global_step": 26225, "epoch": 315} {"train_loss": -18.854644775390625, "global_step": 26226, "epoch": 315} {"train_loss": -18.71721826116723, "global_step": 26227, "epoch": 315, "val_loss": 6064361.0} {"train_loss": -18.765207290649414, "global_step": 26228, "epoch": 316} {"train_loss": -18.6221981048584, "global_step": 26229, "epoch": 316} {"train_loss": -18.87574577331543, "global_step": 26230, "epoch": 316} {"train_loss": -18.572940826416016, "global_step": 26231, "epoch": 316} {"train_loss": -18.751981735229492, "global_step": 26232, "epoch": 316} {"train_loss": -18.50572395324707, "global_step": 26233, "epoch": 316} {"train_loss": -18.82974624633789, "global_step": 26234, "epoch": 316} {"train_loss": -18.47067642211914, "global_step": 26235, "epoch": 316} {"train_loss": -18.692392349243164, "global_step": 26236, "epoch": 316} {"train_loss": -18.713172912597656, "global_step": 26237, "epoch": 316} {"train_loss": -18.107654571533203, "global_step": 26238, "epoch": 316} {"train_loss": -18.819074630737305, "global_step": 26239, "epoch": 316} {"train_loss": -18.671281814575195, "global_step": 26240, "epoch": 316} {"train_loss": -18.70063591003418, "global_step": 26241, "epoch": 316} {"train_loss": -18.771224975585938, "global_step": 26242, "epoch": 316} {"train_loss": -18.633716583251953, "global_step": 26243, "epoch": 316} {"train_loss": -19.080875396728516, "global_step": 26244, "epoch": 316} {"train_loss": -18.653522491455078, "global_step": 26245, "epoch": 316} {"train_loss": -18.92352294921875, "global_step": 26246, "epoch": 316} {"train_loss": -19.043956756591797, "global_step": 26247, "epoch": 316} {"train_loss": -18.655044555664062, "global_step": 26248, "epoch": 316} {"train_loss": -18.456043243408203, "global_step": 26249, "epoch": 316} {"train_loss": -18.625802993774414, "global_step": 26250, "epoch": 316} {"train_loss": -18.594802856445312, "global_step": 26251, "epoch": 316} {"train_loss": -18.715009689331055, "global_step": 26252, "epoch": 316} {"train_loss": -18.29538917541504, "global_step": 26253, "epoch": 316} {"train_loss": -18.896650314331055, "global_step": 26254, "epoch": 316} {"train_loss": -18.506567001342773, "global_step": 26255, "epoch": 316} {"train_loss": -18.84745216369629, "global_step": 26256, "epoch": 316} {"train_loss": -18.985925674438477, "global_step": 26257, "epoch": 316} {"train_loss": -18.604446411132812, "global_step": 26258, "epoch": 316} {"train_loss": -18.45298194885254, "global_step": 26259, "epoch": 316} {"train_loss": -18.554244995117188, "global_step": 26260, "epoch": 316} {"train_loss": -18.43351173400879, "global_step": 26261, "epoch": 316} {"train_loss": -18.97761344909668, "global_step": 26262, "epoch": 316} {"train_loss": -18.4946231842041, "global_step": 26263, "epoch": 316} {"train_loss": -19.17087173461914, "global_step": 26264, "epoch": 316} {"train_loss": -18.685644149780273, "global_step": 26265, "epoch": 316} {"train_loss": -18.73200035095215, "global_step": 26266, "epoch": 316} {"train_loss": -18.841588973999023, "global_step": 26267, "epoch": 316} {"train_loss": -18.795988082885742, "global_step": 26268, "epoch": 316} {"train_loss": -18.779226303100586, "global_step": 26269, "epoch": 316} {"train_loss": -18.767242431640625, "global_step": 26270, "epoch": 316} {"train_loss": -18.715375900268555, "global_step": 26271, "epoch": 316} {"train_loss": -18.69658088684082, "global_step": 26272, "epoch": 316} {"train_loss": -18.530054092407227, "global_step": 26273, "epoch": 316} {"train_loss": -18.830341339111328, "global_step": 26274, "epoch": 316} {"train_loss": -18.22018051147461, "global_step": 26275, "epoch": 316} {"train_loss": -18.65705680847168, "global_step": 26276, "epoch": 316} {"train_loss": -18.785215377807617, "global_step": 26277, "epoch": 316} {"train_loss": -18.747724533081055, "global_step": 26278, "epoch": 316} {"train_loss": -18.896047592163086, "global_step": 26279, "epoch": 316} {"train_loss": -18.787567138671875, "global_step": 26280, "epoch": 316} {"train_loss": -18.838041305541992, "global_step": 26281, "epoch": 316} {"train_loss": -18.84847068786621, "global_step": 26282, "epoch": 316} {"train_loss": -18.86005401611328, "global_step": 26283, "epoch": 316} {"train_loss": -18.86392593383789, "global_step": 26284, "epoch": 316} {"train_loss": -18.745656967163086, "global_step": 26285, "epoch": 316} {"train_loss": -18.917011260986328, "global_step": 26286, "epoch": 316} {"train_loss": -18.96527099609375, "global_step": 26287, "epoch": 316} {"train_loss": -19.102964401245117, "global_step": 26288, "epoch": 316} {"train_loss": -18.876794815063477, "global_step": 26289, "epoch": 316} {"train_loss": -18.804443359375, "global_step": 26290, "epoch": 316} {"train_loss": -18.4782772064209, "global_step": 26291, "epoch": 316} {"train_loss": -18.79823112487793, "global_step": 26292, "epoch": 316} {"train_loss": -18.753995895385742, "global_step": 26293, "epoch": 316} {"train_loss": -19.174707412719727, "global_step": 26294, "epoch": 316} {"train_loss": -18.645496368408203, "global_step": 26295, "epoch": 316} {"train_loss": -18.702207565307617, "global_step": 26296, "epoch": 316} {"train_loss": -18.982954025268555, "global_step": 26297, "epoch": 316} {"train_loss": -18.869840621948242, "global_step": 26298, "epoch": 316} {"train_loss": -18.85432243347168, "global_step": 26299, "epoch": 316} {"train_loss": -18.596426010131836, "global_step": 26300, "epoch": 316} {"train_loss": -18.380781173706055, "global_step": 26301, "epoch": 316} {"train_loss": -18.66874122619629, "global_step": 26302, "epoch": 316} {"train_loss": -18.732412338256836, "global_step": 26303, "epoch": 316} {"train_loss": -18.482118606567383, "global_step": 26304, "epoch": 316} {"train_loss": -18.378965377807617, "global_step": 26305, "epoch": 316} {"train_loss": -18.601858139038086, "global_step": 26306, "epoch": 316} {"train_loss": -18.732406616210938, "global_step": 26307, "epoch": 316} {"train_loss": -18.82216453552246, "global_step": 26308, "epoch": 316} {"train_loss": -18.724346160888672, "global_step": 26309, "epoch": 316} {"train_loss": -18.717416648405145, "global_step": 26310, "epoch": 316, "val_loss": 6172080.0} {"train_loss": -17.910715103149414, "global_step": 26311, "epoch": 317} {"train_loss": -18.439477920532227, "global_step": 26312, "epoch": 317} {"train_loss": -18.67294692993164, "global_step": 26313, "epoch": 317} {"train_loss": -18.132253646850586, "global_step": 26314, "epoch": 317} {"train_loss": -18.417692184448242, "global_step": 26315, "epoch": 317} {"train_loss": -18.413772583007812, "global_step": 26316, "epoch": 317} {"train_loss": -18.284196853637695, "global_step": 26317, "epoch": 317} {"train_loss": -18.826927185058594, "global_step": 26318, "epoch": 317} {"train_loss": -18.38422966003418, "global_step": 26319, "epoch": 317} {"train_loss": -18.57228660583496, "global_step": 26320, "epoch": 317} {"train_loss": -18.69841766357422, "global_step": 26321, "epoch": 317} {"train_loss": -18.602331161499023, "global_step": 26322, "epoch": 317} {"train_loss": -18.549291610717773, "global_step": 26323, "epoch": 317} {"train_loss": -18.939285278320312, "global_step": 26324, "epoch": 317} {"train_loss": -18.67095947265625, "global_step": 26325, "epoch": 317} {"train_loss": -19.09593391418457, "global_step": 26326, "epoch": 317} {"train_loss": -18.398191452026367, "global_step": 26327, "epoch": 317} {"train_loss": -18.826156616210938, "global_step": 26328, "epoch": 317} {"train_loss": -18.1125545501709, "global_step": 26329, "epoch": 317} {"train_loss": -18.59463119506836, "global_step": 26330, "epoch": 317} {"train_loss": -18.65151023864746, "global_step": 26331, "epoch": 317} {"train_loss": -19.07805824279785, "global_step": 26332, "epoch": 317} {"train_loss": -18.874141693115234, "global_step": 26333, "epoch": 317} {"train_loss": -19.008424758911133, "global_step": 26334, "epoch": 317} {"train_loss": -18.751590728759766, "global_step": 26335, "epoch": 317} {"train_loss": -18.818504333496094, "global_step": 26336, "epoch": 317} {"train_loss": -18.826202392578125, "global_step": 26337, "epoch": 317} {"train_loss": -18.646268844604492, "global_step": 26338, "epoch": 317} {"train_loss": -18.675649642944336, "global_step": 26339, "epoch": 317} {"train_loss": -18.621442794799805, "global_step": 26340, "epoch": 317} {"train_loss": -18.61672019958496, "global_step": 26341, "epoch": 317} {"train_loss": -18.90626335144043, "global_step": 26342, "epoch": 317} {"train_loss": -18.62685203552246, "global_step": 26343, "epoch": 317} {"train_loss": -18.9565486907959, "global_step": 26344, "epoch": 317} {"train_loss": -18.489988327026367, "global_step": 26345, "epoch": 317} {"train_loss": -18.847309112548828, "global_step": 26346, "epoch": 317} {"train_loss": -18.743202209472656, "global_step": 26347, "epoch": 317} {"train_loss": -19.001096725463867, "global_step": 26348, "epoch": 317} {"train_loss": -18.365947723388672, "global_step": 26349, "epoch": 317} {"train_loss": -18.774335861206055, "global_step": 26350, "epoch": 317} {"train_loss": -18.7456111907959, "global_step": 26351, "epoch": 317} {"train_loss": -18.965293884277344, "global_step": 26352, "epoch": 317} {"train_loss": -19.134519577026367, "global_step": 26353, "epoch": 317} {"train_loss": -18.781652450561523, "global_step": 26354, "epoch": 317} {"train_loss": -18.956653594970703, "global_step": 26355, "epoch": 317} {"train_loss": -18.689924240112305, "global_step": 26356, "epoch": 317} {"train_loss": -18.83978271484375, "global_step": 26357, "epoch": 317} {"train_loss": -18.562271118164062, "global_step": 26358, "epoch": 317} {"train_loss": -18.662273406982422, "global_step": 26359, "epoch": 317} {"train_loss": -18.563379287719727, "global_step": 26360, "epoch": 317} {"train_loss": -18.6101131439209, "global_step": 26361, "epoch": 317} {"train_loss": -18.52910614013672, "global_step": 26362, "epoch": 317} {"train_loss": -19.129165649414062, "global_step": 26363, "epoch": 317} {"train_loss": -18.70482635498047, "global_step": 26364, "epoch": 317} {"train_loss": -19.065786361694336, "global_step": 26365, "epoch": 317} {"train_loss": -18.912281036376953, "global_step": 26366, "epoch": 317} {"train_loss": -18.400997161865234, "global_step": 26367, "epoch": 317} {"train_loss": -19.082822799682617, "global_step": 26368, "epoch": 317} {"train_loss": -18.64568519592285, "global_step": 26369, "epoch": 317} {"train_loss": -19.011550903320312, "global_step": 26370, "epoch": 317} {"train_loss": -18.633573532104492, "global_step": 26371, "epoch": 317} {"train_loss": -19.14156150817871, "global_step": 26372, "epoch": 317} {"train_loss": -18.728391647338867, "global_step": 26373, "epoch": 317} {"train_loss": -18.52899169921875, "global_step": 26374, "epoch": 317} {"train_loss": -18.715662002563477, "global_step": 26375, "epoch": 317} {"train_loss": -19.042694091796875, "global_step": 26376, "epoch": 317} {"train_loss": -18.654733657836914, "global_step": 26377, "epoch": 317} {"train_loss": -18.87035369873047, "global_step": 26378, "epoch": 317} {"train_loss": -18.58521270751953, "global_step": 26379, "epoch": 317} {"train_loss": -18.237966537475586, "global_step": 26380, "epoch": 317} {"train_loss": -18.712238311767578, "global_step": 26381, "epoch": 317} {"train_loss": -18.82454490661621, "global_step": 26382, "epoch": 317} {"train_loss": -18.652475357055664, "global_step": 26383, "epoch": 317} {"train_loss": -18.567861557006836, "global_step": 26384, "epoch": 317} {"train_loss": -18.954620361328125, "global_step": 26385, "epoch": 317} {"train_loss": -18.74026870727539, "global_step": 26386, "epoch": 317} {"train_loss": -18.835926055908203, "global_step": 26387, "epoch": 317} {"train_loss": -18.86079216003418, "global_step": 26388, "epoch": 317} {"train_loss": -18.592206954956055, "global_step": 26389, "epoch": 317} {"train_loss": -18.429996490478516, "global_step": 26390, "epoch": 317} {"train_loss": -19.073768615722656, "global_step": 26391, "epoch": 317} {"train_loss": -19.063247680664062, "global_step": 26392, "epoch": 317} {"train_loss": -18.71461197267096, "global_step": 26393, "epoch": 317, "val_loss": 6028608.5} {"train_loss": -18.607145309448242, "global_step": 26394, "epoch": 318} {"train_loss": -18.66064453125, "global_step": 26395, "epoch": 318} {"train_loss": -18.427963256835938, "global_step": 26396, "epoch": 318} {"train_loss": -19.001720428466797, "global_step": 26397, "epoch": 318} {"train_loss": -18.559804916381836, "global_step": 26398, "epoch": 318} {"train_loss": -18.816757202148438, "global_step": 26399, "epoch": 318} {"train_loss": -19.06985855102539, "global_step": 26400, "epoch": 318} {"train_loss": -18.461896896362305, "global_step": 26401, "epoch": 318} {"train_loss": -18.673791885375977, "global_step": 26402, "epoch": 318} {"train_loss": -18.679325103759766, "global_step": 26403, "epoch": 318} {"train_loss": -18.678974151611328, "global_step": 26404, "epoch": 318} {"train_loss": -18.547475814819336, "global_step": 26405, "epoch": 318} {"train_loss": -18.99543571472168, "global_step": 26406, "epoch": 318} {"train_loss": -18.931365966796875, "global_step": 26407, "epoch": 318} {"train_loss": -19.05891227722168, "global_step": 26408, "epoch": 318} {"train_loss": -18.760650634765625, "global_step": 26409, "epoch": 318} {"train_loss": -18.633962631225586, "global_step": 26410, "epoch": 318} {"train_loss": -18.938688278198242, "global_step": 26411, "epoch": 318} {"train_loss": -18.620620727539062, "global_step": 26412, "epoch": 318} {"train_loss": -18.682783126831055, "global_step": 26413, "epoch": 318} {"train_loss": -18.708911895751953, "global_step": 26414, "epoch": 318} {"train_loss": -18.690448760986328, "global_step": 26415, "epoch": 318} {"train_loss": -18.846538543701172, "global_step": 26416, "epoch": 318} {"train_loss": -18.685239791870117, "global_step": 26417, "epoch": 318} {"train_loss": -18.703397750854492, "global_step": 26418, "epoch": 318} {"train_loss": -18.686704635620117, "global_step": 26419, "epoch": 318} {"train_loss": -18.77174949645996, "global_step": 26420, "epoch": 318} {"train_loss": -18.952497482299805, "global_step": 26421, "epoch": 318} {"train_loss": -19.030426025390625, "global_step": 26422, "epoch": 318} {"train_loss": -18.807783126831055, "global_step": 26423, "epoch": 318} {"train_loss": -18.785606384277344, "global_step": 26424, "epoch": 318} {"train_loss": -18.84036636352539, "global_step": 26425, "epoch": 318} {"train_loss": -18.482784271240234, "global_step": 26426, "epoch": 318} {"train_loss": -18.754560470581055, "global_step": 26427, "epoch": 318} {"train_loss": -18.85188102722168, "global_step": 26428, "epoch": 318} {"train_loss": -18.599111557006836, "global_step": 26429, "epoch": 318} {"train_loss": -18.82114601135254, "global_step": 26430, "epoch": 318} {"train_loss": -18.673952102661133, "global_step": 26431, "epoch": 318} {"train_loss": -18.516109466552734, "global_step": 26432, "epoch": 318} {"train_loss": -18.61530876159668, "global_step": 26433, "epoch": 318} {"train_loss": -18.709020614624023, "global_step": 26434, "epoch": 318} {"train_loss": -18.69222068786621, "global_step": 26435, "epoch": 318} {"train_loss": -18.807523727416992, "global_step": 26436, "epoch": 318} {"train_loss": -18.7801513671875, "global_step": 26437, "epoch": 318} {"train_loss": -18.99918556213379, "global_step": 26438, "epoch": 318} {"train_loss": -18.80325698852539, "global_step": 26439, "epoch": 318} {"train_loss": -18.945261001586914, "global_step": 26440, "epoch": 318} {"train_loss": -18.501562118530273, "global_step": 26441, "epoch": 318} {"train_loss": -18.67669105529785, "global_step": 26442, "epoch": 318} {"train_loss": -18.767181396484375, "global_step": 26443, "epoch": 318} {"train_loss": -18.980390548706055, "global_step": 26444, "epoch": 318} {"train_loss": -18.726865768432617, "global_step": 26445, "epoch": 318} {"train_loss": -18.840412139892578, "global_step": 26446, "epoch": 318} {"train_loss": -18.897104263305664, "global_step": 26447, "epoch": 318} {"train_loss": -19.023664474487305, "global_step": 26448, "epoch": 318} {"train_loss": -18.606704711914062, "global_step": 26449, "epoch": 318} {"train_loss": -18.757017135620117, "global_step": 26450, "epoch": 318} {"train_loss": -18.80843162536621, "global_step": 26451, "epoch": 318} {"train_loss": -18.350439071655273, "global_step": 26452, "epoch": 318} {"train_loss": -18.803281784057617, "global_step": 26453, "epoch": 318} {"train_loss": -18.347434997558594, "global_step": 26454, "epoch": 318} {"train_loss": -19.310657501220703, "global_step": 26455, "epoch": 318} {"train_loss": -18.938398361206055, "global_step": 26456, "epoch": 318} {"train_loss": -18.62836265563965, "global_step": 26457, "epoch": 318} {"train_loss": -18.875577926635742, "global_step": 26458, "epoch": 318} {"train_loss": -18.629859924316406, "global_step": 26459, "epoch": 318} {"train_loss": -18.779802322387695, "global_step": 26460, "epoch": 318} {"train_loss": -19.03452491760254, "global_step": 26461, "epoch": 318} {"train_loss": -18.529462814331055, "global_step": 26462, "epoch": 318} {"train_loss": -18.452425003051758, "global_step": 26463, "epoch": 318} {"train_loss": -19.035846710205078, "global_step": 26464, "epoch": 318} {"train_loss": -18.870298385620117, "global_step": 26465, "epoch": 318} {"train_loss": -19.009496688842773, "global_step": 26466, "epoch": 318} {"train_loss": -18.88983726501465, "global_step": 26467, "epoch": 318} {"train_loss": -18.854793548583984, "global_step": 26468, "epoch": 318} {"train_loss": -18.580215454101562, "global_step": 26469, "epoch": 318} {"train_loss": -18.655921936035156, "global_step": 26470, "epoch": 318} {"train_loss": -18.669254302978516, "global_step": 26471, "epoch": 318} {"train_loss": -18.73233413696289, "global_step": 26472, "epoch": 318} {"train_loss": -18.500892639160156, "global_step": 26473, "epoch": 318} {"train_loss": -18.46998405456543, "global_step": 26474, "epoch": 318} {"train_loss": -18.657007217407227, "global_step": 26475, "epoch": 318} {"train_loss": -18.743002811110163, "global_step": 26476, "epoch": 318, "val_loss": 5989109.5} {"train_loss": -18.15369987487793, "global_step": 26477, "epoch": 319} {"train_loss": -18.22129249572754, "global_step": 26478, "epoch": 319} {"train_loss": -18.017913818359375, "global_step": 26479, "epoch": 319} {"train_loss": -18.660860061645508, "global_step": 26480, "epoch": 319} {"train_loss": -18.164234161376953, "global_step": 26481, "epoch": 319} {"train_loss": -18.566198348999023, "global_step": 26482, "epoch": 319} {"train_loss": -18.07678985595703, "global_step": 26483, "epoch": 319} {"train_loss": -18.420644760131836, "global_step": 26484, "epoch": 319} {"train_loss": -18.690370559692383, "global_step": 26485, "epoch": 319} {"train_loss": -18.501977920532227, "global_step": 26486, "epoch": 319} {"train_loss": -18.410964965820312, "global_step": 26487, "epoch": 319} {"train_loss": -18.39887046813965, "global_step": 26488, "epoch": 319} {"train_loss": -18.588346481323242, "global_step": 26489, "epoch": 319} {"train_loss": -18.525249481201172, "global_step": 26490, "epoch": 319} {"train_loss": -18.723520278930664, "global_step": 26491, "epoch": 319} {"train_loss": -18.5595760345459, "global_step": 26492, "epoch": 319} {"train_loss": -18.61614418029785, "global_step": 26493, "epoch": 319} {"train_loss": -19.032272338867188, "global_step": 26494, "epoch": 319} {"train_loss": -18.6235294342041, "global_step": 26495, "epoch": 319} {"train_loss": -18.93292808532715, "global_step": 26496, "epoch": 319} {"train_loss": -18.276426315307617, "global_step": 26497, "epoch": 319} {"train_loss": -18.595712661743164, "global_step": 26498, "epoch": 319} {"train_loss": -18.523452758789062, "global_step": 26499, "epoch": 319} {"train_loss": -18.704198837280273, "global_step": 26500, "epoch": 319} {"train_loss": -18.98299217224121, "global_step": 26501, "epoch": 319} {"train_loss": -18.987995147705078, "global_step": 26502, "epoch": 319} {"train_loss": -18.840051651000977, "global_step": 26503, "epoch": 319} {"train_loss": -18.712736129760742, "global_step": 26504, "epoch": 319} {"train_loss": -18.95631217956543, "global_step": 26505, "epoch": 319} {"train_loss": -18.93122673034668, "global_step": 26506, "epoch": 319} {"train_loss": -18.91902732849121, "global_step": 26507, "epoch": 319} {"train_loss": -18.662586212158203, "global_step": 26508, "epoch": 319} {"train_loss": -18.631473541259766, "global_step": 26509, "epoch": 319} {"train_loss": -18.881942749023438, "global_step": 26510, "epoch": 319} {"train_loss": -18.759389877319336, "global_step": 26511, "epoch": 319} {"train_loss": -19.096139907836914, "global_step": 26512, "epoch": 319} {"train_loss": -18.769519805908203, "global_step": 26513, "epoch": 319} {"train_loss": -18.450891494750977, "global_step": 26514, "epoch": 319} {"train_loss": -18.711984634399414, "global_step": 26515, "epoch": 319} {"train_loss": -19.125486373901367, "global_step": 26516, "epoch": 319} {"train_loss": -18.492172241210938, "global_step": 26517, "epoch": 319} {"train_loss": -18.784011840820312, "global_step": 26518, "epoch": 319} {"train_loss": -18.676984786987305, "global_step": 26519, "epoch": 319} {"train_loss": -19.106069564819336, "global_step": 26520, "epoch": 319} {"train_loss": -18.947006225585938, "global_step": 26521, "epoch": 319} {"train_loss": -18.815397262573242, "global_step": 26522, "epoch": 319} {"train_loss": -18.427480697631836, "global_step": 26523, "epoch": 319} {"train_loss": -18.55219078063965, "global_step": 26524, "epoch": 319} {"train_loss": -18.500823974609375, "global_step": 26525, "epoch": 319} {"train_loss": -19.076955795288086, "global_step": 26526, "epoch": 319} {"train_loss": -18.849102020263672, "global_step": 26527, "epoch": 319} {"train_loss": -18.863677978515625, "global_step": 26528, "epoch": 319} {"train_loss": -18.693326950073242, "global_step": 26529, "epoch": 319} {"train_loss": -19.096277236938477, "global_step": 26530, "epoch": 319} {"train_loss": -18.55757713317871, "global_step": 26531, "epoch": 319} {"train_loss": -18.762094497680664, "global_step": 26532, "epoch": 319} {"train_loss": -18.771102905273438, "global_step": 26533, "epoch": 319} {"train_loss": -18.788843154907227, "global_step": 26534, "epoch": 319} {"train_loss": -18.748512268066406, "global_step": 26535, "epoch": 319} {"train_loss": -18.72075843811035, "global_step": 26536, "epoch": 319} {"train_loss": -18.52304458618164, "global_step": 26537, "epoch": 319} {"train_loss": -19.186620712280273, "global_step": 26538, "epoch": 319} {"train_loss": -18.867374420166016, "global_step": 26539, "epoch": 319} {"train_loss": -18.457050323486328, "global_step": 26540, "epoch": 319} {"train_loss": -18.957361221313477, "global_step": 26541, "epoch": 319} {"train_loss": -18.813186645507812, "global_step": 26542, "epoch": 319} {"train_loss": -18.605411529541016, "global_step": 26543, "epoch": 319} {"train_loss": -18.456682205200195, "global_step": 26544, "epoch": 319} {"train_loss": -18.580358505249023, "global_step": 26545, "epoch": 319} {"train_loss": -18.69297218322754, "global_step": 26546, "epoch": 319} {"train_loss": -19.066930770874023, "global_step": 26547, "epoch": 319} {"train_loss": -18.639944076538086, "global_step": 26548, "epoch": 319} {"train_loss": -18.681753158569336, "global_step": 26549, "epoch": 319} {"train_loss": -18.72344398498535, "global_step": 26550, "epoch": 319} {"train_loss": -18.743680953979492, "global_step": 26551, "epoch": 319} {"train_loss": -19.135635375976562, "global_step": 26552, "epoch": 319} {"train_loss": -18.781869888305664, "global_step": 26553, "epoch": 319} {"train_loss": -18.721965789794922, "global_step": 26554, "epoch": 319} {"train_loss": -18.734167098999023, "global_step": 26555, "epoch": 319} {"train_loss": -18.810359954833984, "global_step": 26556, "epoch": 319} {"train_loss": -18.70719337463379, "global_step": 26557, "epoch": 319} {"train_loss": -19.035642623901367, "global_step": 26558, "epoch": 319} {"train_loss": -18.72469162079225, "global_step": 26559, "epoch": 319, "val_loss": 5973166.0} {"train_loss": -18.735950469970703, "global_step": 26560, "epoch": 320} {"train_loss": -18.910932540893555, "global_step": 26561, "epoch": 320} {"train_loss": -18.730504989624023, "global_step": 26562, "epoch": 320} {"train_loss": -18.595582962036133, "global_step": 26563, "epoch": 320} {"train_loss": -18.1986083984375, "global_step": 26564, "epoch": 320} {"train_loss": -18.754281997680664, "global_step": 26565, "epoch": 320} {"train_loss": -18.874732971191406, "global_step": 26566, "epoch": 320} {"train_loss": -18.50081443786621, "global_step": 26567, "epoch": 320} {"train_loss": -18.80156707763672, "global_step": 26568, "epoch": 320} {"train_loss": -18.857816696166992, "global_step": 26569, "epoch": 320} {"train_loss": -18.658193588256836, "global_step": 26570, "epoch": 320} {"train_loss": -18.38934326171875, "global_step": 26571, "epoch": 320} {"train_loss": -18.70475196838379, "global_step": 26572, "epoch": 320} {"train_loss": -18.840484619140625, "global_step": 26573, "epoch": 320} {"train_loss": -18.831571578979492, "global_step": 26574, "epoch": 320} {"train_loss": -19.064586639404297, "global_step": 26575, "epoch": 320} {"train_loss": -18.952606201171875, "global_step": 26576, "epoch": 320} {"train_loss": -18.8369197845459, "global_step": 26577, "epoch": 320} {"train_loss": -18.82862663269043, "global_step": 26578, "epoch": 320} {"train_loss": -18.856130599975586, "global_step": 26579, "epoch": 320} {"train_loss": -18.911605834960938, "global_step": 26580, "epoch": 320} {"train_loss": -19.007156372070312, "global_step": 26581, "epoch": 320} {"train_loss": -18.6606502532959, "global_step": 26582, "epoch": 320} {"train_loss": -18.89141845703125, "global_step": 26583, "epoch": 320} {"train_loss": -18.84904670715332, "global_step": 26584, "epoch": 320} {"train_loss": -18.816486358642578, "global_step": 26585, "epoch": 320} {"train_loss": -18.900541305541992, "global_step": 26586, "epoch": 320} {"train_loss": -18.65692710876465, "global_step": 26587, "epoch": 320} {"train_loss": -18.977458953857422, "global_step": 26588, "epoch": 320} {"train_loss": -18.742034912109375, "global_step": 26589, "epoch": 320} {"train_loss": -18.29557991027832, "global_step": 26590, "epoch": 320} {"train_loss": -18.60145378112793, "global_step": 26591, "epoch": 320} {"train_loss": -18.52242660522461, "global_step": 26592, "epoch": 320} {"train_loss": -18.569503784179688, "global_step": 26593, "epoch": 320} {"train_loss": -18.90864372253418, "global_step": 26594, "epoch": 320} {"train_loss": -18.68726921081543, "global_step": 26595, "epoch": 320} {"train_loss": -19.065134048461914, "global_step": 26596, "epoch": 320} {"train_loss": -18.762176513671875, "global_step": 26597, "epoch": 320} {"train_loss": -18.60838508605957, "global_step": 26598, "epoch": 320} {"train_loss": -18.46162223815918, "global_step": 26599, "epoch": 320} {"train_loss": -18.665639877319336, "global_step": 26600, "epoch": 320} {"train_loss": -19.088056564331055, "global_step": 26601, "epoch": 320} {"train_loss": -18.899145126342773, "global_step": 26602, "epoch": 320} {"train_loss": -18.888845443725586, "global_step": 26603, "epoch": 320} {"train_loss": -18.712736129760742, "global_step": 26604, "epoch": 320} {"train_loss": -18.464292526245117, "global_step": 26605, "epoch": 320} {"train_loss": -18.964893341064453, "global_step": 26606, "epoch": 320} {"train_loss": -18.56365394592285, "global_step": 26607, "epoch": 320} {"train_loss": -18.758562088012695, "global_step": 26608, "epoch": 320} {"train_loss": -18.639434814453125, "global_step": 26609, "epoch": 320} {"train_loss": -18.87656593322754, "global_step": 26610, "epoch": 320} {"train_loss": -18.746051788330078, "global_step": 26611, "epoch": 320} {"train_loss": -18.61066246032715, "global_step": 26612, "epoch": 320} {"train_loss": -18.684606552124023, "global_step": 26613, "epoch": 320} {"train_loss": -18.877071380615234, "global_step": 26614, "epoch": 320} {"train_loss": -18.670560836791992, "global_step": 26615, "epoch": 320} {"train_loss": -18.741743087768555, "global_step": 26616, "epoch": 320} {"train_loss": -18.808008193969727, "global_step": 26617, "epoch": 320} {"train_loss": -19.2962646484375, "global_step": 26618, "epoch": 320} {"train_loss": -18.416507720947266, "global_step": 26619, "epoch": 320} {"train_loss": -18.53644371032715, "global_step": 26620, "epoch": 320} {"train_loss": -18.881437301635742, "global_step": 26621, "epoch": 320} {"train_loss": -18.7737979888916, "global_step": 26622, "epoch": 320} {"train_loss": -19.05952262878418, "global_step": 26623, "epoch": 320} {"train_loss": -19.1226863861084, "global_step": 26624, "epoch": 320} {"train_loss": -18.8641300201416, "global_step": 26625, "epoch": 320} {"train_loss": -19.098175048828125, "global_step": 26626, "epoch": 320} {"train_loss": -18.93662452697754, "global_step": 26627, "epoch": 320} {"train_loss": -18.910419464111328, "global_step": 26628, "epoch": 320} {"train_loss": -18.940601348876953, "global_step": 26629, "epoch": 320} {"train_loss": -18.938108444213867, "global_step": 26630, "epoch": 320} {"train_loss": -18.959535598754883, "global_step": 26631, "epoch": 320} {"train_loss": -18.795734405517578, "global_step": 26632, "epoch": 320} {"train_loss": -18.925735473632812, "global_step": 26633, "epoch": 320} {"train_loss": -18.733448028564453, "global_step": 26634, "epoch": 320} {"train_loss": -18.739675521850586, "global_step": 26635, "epoch": 320} {"train_loss": -18.52206039428711, "global_step": 26636, "epoch": 320} {"train_loss": -18.550596237182617, "global_step": 26637, "epoch": 320} {"train_loss": -18.647541046142578, "global_step": 26638, "epoch": 320} {"train_loss": -18.956003189086914, "global_step": 26639, "epoch": 320} {"train_loss": -18.795917510986328, "global_step": 26640, "epoch": 320} {"train_loss": -18.4202823638916, "global_step": 26641, "epoch": 320} {"train_loss": -18.77184472601098, "global_step": 26642, "epoch": 320, "val_loss": 5897986.0} {"train_loss": -18.450977325439453, "global_step": 26643, "epoch": 321} {"train_loss": -18.37946128845215, "global_step": 26644, "epoch": 321} {"train_loss": -18.80804443359375, "global_step": 26645, "epoch": 321} {"train_loss": -18.511884689331055, "global_step": 26646, "epoch": 321} {"train_loss": -18.494821548461914, "global_step": 26647, "epoch": 321} {"train_loss": -18.254440307617188, "global_step": 26648, "epoch": 321} {"train_loss": -18.699951171875, "global_step": 26649, "epoch": 321} {"train_loss": -18.20380973815918, "global_step": 26650, "epoch": 321} {"train_loss": -18.76907730102539, "global_step": 26651, "epoch": 321} {"train_loss": -18.79437828063965, "global_step": 26652, "epoch": 321} {"train_loss": -18.958858489990234, "global_step": 26653, "epoch": 321} {"train_loss": -18.737415313720703, "global_step": 26654, "epoch": 321} {"train_loss": -18.444013595581055, "global_step": 26655, "epoch": 321} {"train_loss": -18.91983985900879, "global_step": 26656, "epoch": 321} {"train_loss": -18.57356071472168, "global_step": 26657, "epoch": 321} {"train_loss": -18.791187286376953, "global_step": 26658, "epoch": 321} {"train_loss": -18.548999786376953, "global_step": 26659, "epoch": 321} {"train_loss": -18.9487361907959, "global_step": 26660, "epoch": 321} {"train_loss": -18.693689346313477, "global_step": 26661, "epoch": 321} {"train_loss": -18.67484474182129, "global_step": 26662, "epoch": 321} {"train_loss": -18.82132911682129, "global_step": 26663, "epoch": 321} {"train_loss": -18.345474243164062, "global_step": 26664, "epoch": 321} {"train_loss": -18.998003005981445, "global_step": 26665, "epoch": 321} {"train_loss": -18.64893913269043, "global_step": 26666, "epoch": 321} {"train_loss": -19.111541748046875, "global_step": 26667, "epoch": 321} {"train_loss": -19.039758682250977, "global_step": 26668, "epoch": 321} {"train_loss": -18.650182723999023, "global_step": 26669, "epoch": 321} {"train_loss": -18.931930541992188, "global_step": 26670, "epoch": 321} {"train_loss": -18.812152862548828, "global_step": 26671, "epoch": 321} {"train_loss": -18.54695701599121, "global_step": 26672, "epoch": 321} {"train_loss": -18.8027286529541, "global_step": 26673, "epoch": 321} {"train_loss": -18.75184440612793, "global_step": 26674, "epoch": 321} {"train_loss": -18.925790786743164, "global_step": 26675, "epoch": 321} {"train_loss": -19.062299728393555, "global_step": 26676, "epoch": 321} {"train_loss": -18.9782657623291, "global_step": 26677, "epoch": 321} {"train_loss": -18.710037231445312, "global_step": 26678, "epoch": 321} {"train_loss": -18.79463005065918, "global_step": 26679, "epoch": 321} {"train_loss": -18.609479904174805, "global_step": 26680, "epoch": 321} {"train_loss": -18.75929832458496, "global_step": 26681, "epoch": 321} {"train_loss": -18.80019187927246, "global_step": 26682, "epoch": 321} {"train_loss": -18.757856369018555, "global_step": 26683, "epoch": 321} {"train_loss": -18.603759765625, "global_step": 26684, "epoch": 321} {"train_loss": -18.755582809448242, "global_step": 26685, "epoch": 321} {"train_loss": -19.1296329498291, "global_step": 26686, "epoch": 321} {"train_loss": -18.672897338867188, "global_step": 26687, "epoch": 321} {"train_loss": -18.916675567626953, "global_step": 26688, "epoch": 321} {"train_loss": -18.63364601135254, "global_step": 26689, "epoch": 321} {"train_loss": -18.685758590698242, "global_step": 26690, "epoch": 321} {"train_loss": -18.933820724487305, "global_step": 26691, "epoch": 321} {"train_loss": -18.801515579223633, "global_step": 26692, "epoch": 321} {"train_loss": -18.695363998413086, "global_step": 26693, "epoch": 321} {"train_loss": -18.4465389251709, "global_step": 26694, "epoch": 321} {"train_loss": -18.982656478881836, "global_step": 26695, "epoch": 321} {"train_loss": -18.87154197692871, "global_step": 26696, "epoch": 321} {"train_loss": -18.48603630065918, "global_step": 26697, "epoch": 321} {"train_loss": -18.65968894958496, "global_step": 26698, "epoch": 321} {"train_loss": -18.715959548950195, "global_step": 26699, "epoch": 321} {"train_loss": -18.860265731811523, "global_step": 26700, "epoch": 321} {"train_loss": -18.949045181274414, "global_step": 26701, "epoch": 321} {"train_loss": -18.638986587524414, "global_step": 26702, "epoch": 321} {"train_loss": -19.19205665588379, "global_step": 26703, "epoch": 321} {"train_loss": -18.740909576416016, "global_step": 26704, "epoch": 321} {"train_loss": -18.933727264404297, "global_step": 26705, "epoch": 321} {"train_loss": -18.859357833862305, "global_step": 26706, "epoch": 321} {"train_loss": -19.04513931274414, "global_step": 26707, "epoch": 321} {"train_loss": -18.67120361328125, "global_step": 26708, "epoch": 321} {"train_loss": -18.517091751098633, "global_step": 26709, "epoch": 321} {"train_loss": -18.874521255493164, "global_step": 26710, "epoch": 321} {"train_loss": -18.709747314453125, "global_step": 26711, "epoch": 321} {"train_loss": -18.92060661315918, "global_step": 26712, "epoch": 321} {"train_loss": -18.894773483276367, "global_step": 26713, "epoch": 321} {"train_loss": -18.596885681152344, "global_step": 26714, "epoch": 321} {"train_loss": -18.535551071166992, "global_step": 26715, "epoch": 321} {"train_loss": -18.491201400756836, "global_step": 26716, "epoch": 321} {"train_loss": -18.72452163696289, "global_step": 26717, "epoch": 321} {"train_loss": -18.84332847595215, "global_step": 26718, "epoch": 321} {"train_loss": -18.754423141479492, "global_step": 26719, "epoch": 321} {"train_loss": -18.891523361206055, "global_step": 26720, "epoch": 321} {"train_loss": -18.74648666381836, "global_step": 26721, "epoch": 321} {"train_loss": -18.706912994384766, "global_step": 26722, "epoch": 321} {"train_loss": -18.63208770751953, "global_step": 26723, "epoch": 321} {"train_loss": -18.690771102905273, "global_step": 26724, "epoch": 321} {"train_loss": -18.72692085174193, "global_step": 26725, "epoch": 321, "val_loss": 5956394.0} {"train_loss": -18.93079376220703, "global_step": 26726, "epoch": 322} {"train_loss": -18.496601104736328, "global_step": 26727, "epoch": 322} {"train_loss": -18.56490135192871, "global_step": 26728, "epoch": 322} {"train_loss": -19.16927146911621, "global_step": 26729, "epoch": 322} {"train_loss": -18.371627807617188, "global_step": 26730, "epoch": 322} {"train_loss": -18.66353416442871, "global_step": 26731, "epoch": 322} {"train_loss": -18.758596420288086, "global_step": 26732, "epoch": 322} {"train_loss": -18.9061336517334, "global_step": 26733, "epoch": 322} {"train_loss": -18.775434494018555, "global_step": 26734, "epoch": 322} {"train_loss": -18.452472686767578, "global_step": 26735, "epoch": 322} {"train_loss": -18.607501983642578, "global_step": 26736, "epoch": 322} {"train_loss": -18.62079429626465, "global_step": 26737, "epoch": 322} {"train_loss": -19.018936157226562, "global_step": 26738, "epoch": 322} {"train_loss": -18.71772575378418, "global_step": 26739, "epoch": 322} {"train_loss": -18.740346908569336, "global_step": 26740, "epoch": 322} {"train_loss": -19.0426082611084, "global_step": 26741, "epoch": 322} {"train_loss": -18.609159469604492, "global_step": 26742, "epoch": 322} {"train_loss": -19.09503746032715, "global_step": 26743, "epoch": 322} {"train_loss": -18.5778865814209, "global_step": 26744, "epoch": 322} {"train_loss": -18.73065185546875, "global_step": 26745, "epoch": 322} {"train_loss": -18.835424423217773, "global_step": 26746, "epoch": 322} {"train_loss": -18.515714645385742, "global_step": 26747, "epoch": 322} {"train_loss": -18.730623245239258, "global_step": 26748, "epoch": 322} {"train_loss": -19.20112419128418, "global_step": 26749, "epoch": 322} {"train_loss": -18.634811401367188, "global_step": 26750, "epoch": 322} {"train_loss": -19.120441436767578, "global_step": 26751, "epoch": 322} {"train_loss": -18.91015625, "global_step": 26752, "epoch": 322} {"train_loss": -19.18635368347168, "global_step": 26753, "epoch": 322} {"train_loss": -18.680110931396484, "global_step": 26754, "epoch": 322} {"train_loss": -19.318395614624023, "global_step": 26755, "epoch": 322} {"train_loss": -18.78763771057129, "global_step": 26756, "epoch": 322} {"train_loss": -18.9425106048584, "global_step": 26757, "epoch": 322} {"train_loss": -18.856204986572266, "global_step": 26758, "epoch": 322} {"train_loss": -18.943119049072266, "global_step": 26759, "epoch": 322} {"train_loss": -18.507421493530273, "global_step": 26760, "epoch": 322} {"train_loss": -18.73069953918457, "global_step": 26761, "epoch": 322} {"train_loss": -18.801557540893555, "global_step": 26762, "epoch": 322} {"train_loss": -18.91470718383789, "global_step": 26763, "epoch": 322} {"train_loss": -18.797731399536133, "global_step": 26764, "epoch": 322} {"train_loss": -18.961261749267578, "global_step": 26765, "epoch": 322} {"train_loss": -18.448657989501953, "global_step": 26766, "epoch": 322} {"train_loss": -18.882587432861328, "global_step": 26767, "epoch": 322} {"train_loss": -18.928817749023438, "global_step": 26768, "epoch": 322} {"train_loss": -18.78892707824707, "global_step": 26769, "epoch": 322} {"train_loss": -18.714191436767578, "global_step": 26770, "epoch": 322} {"train_loss": -18.536436080932617, "global_step": 26771, "epoch": 322} {"train_loss": -18.857206344604492, "global_step": 26772, "epoch": 322} {"train_loss": -18.527212142944336, "global_step": 26773, "epoch": 322} {"train_loss": -18.761178970336914, "global_step": 26774, "epoch": 322} {"train_loss": -19.144479751586914, "global_step": 26775, "epoch": 322} {"train_loss": -18.979490280151367, "global_step": 26776, "epoch": 322} {"train_loss": -19.04840660095215, "global_step": 26777, "epoch": 322} {"train_loss": -18.73255729675293, "global_step": 26778, "epoch": 322} {"train_loss": -18.79657554626465, "global_step": 26779, "epoch": 322} {"train_loss": -18.503847122192383, "global_step": 26780, "epoch": 322} {"train_loss": -18.597396850585938, "global_step": 26781, "epoch": 322} {"train_loss": -18.949857711791992, "global_step": 26782, "epoch": 322} {"train_loss": -18.844472885131836, "global_step": 26783, "epoch": 322} {"train_loss": -18.725454330444336, "global_step": 26784, "epoch": 322} {"train_loss": -18.825485229492188, "global_step": 26785, "epoch": 322} {"train_loss": -18.675931930541992, "global_step": 26786, "epoch": 322} {"train_loss": -19.179080963134766, "global_step": 26787, "epoch": 322} {"train_loss": -19.096569061279297, "global_step": 26788, "epoch": 322} {"train_loss": -18.864980697631836, "global_step": 26789, "epoch": 322} {"train_loss": -18.98033905029297, "global_step": 26790, "epoch": 322} {"train_loss": -18.864572525024414, "global_step": 26791, "epoch": 322} {"train_loss": -19.008474349975586, "global_step": 26792, "epoch": 322} {"train_loss": -18.8550968170166, "global_step": 26793, "epoch": 322} {"train_loss": -18.539682388305664, "global_step": 26794, "epoch": 322} {"train_loss": -18.53255271911621, "global_step": 26795, "epoch": 322} {"train_loss": -18.719987869262695, "global_step": 26796, "epoch": 322} {"train_loss": -18.644241333007812, "global_step": 26797, "epoch": 322} {"train_loss": -18.751941680908203, "global_step": 26798, "epoch": 322} {"train_loss": -18.656217575073242, "global_step": 26799, "epoch": 322} {"train_loss": -18.831037521362305, "global_step": 26800, "epoch": 322} {"train_loss": -18.72306251525879, "global_step": 26801, "epoch": 322} {"train_loss": -18.7274169921875, "global_step": 26802, "epoch": 322} {"train_loss": -18.45575523376465, "global_step": 26803, "epoch": 322} {"train_loss": -18.68608856201172, "global_step": 26804, "epoch": 322} {"train_loss": -18.6580810546875, "global_step": 26805, "epoch": 322} {"train_loss": -18.933565139770508, "global_step": 26806, "epoch": 322} {"train_loss": -19.03824806213379, "global_step": 26807, "epoch": 322} {"train_loss": -18.79867643333343, "global_step": 26808, "epoch": 322, "val_loss": 5850712.0} {"train_loss": -18.63779640197754, "global_step": 26809, "epoch": 323} {"train_loss": -18.58469009399414, "global_step": 26810, "epoch": 323} {"train_loss": -18.866552352905273, "global_step": 26811, "epoch": 323} {"train_loss": -18.586050033569336, "global_step": 26812, "epoch": 323} {"train_loss": -18.645933151245117, "global_step": 26813, "epoch": 323} {"train_loss": -18.657623291015625, "global_step": 26814, "epoch": 323} {"train_loss": -18.57844352722168, "global_step": 26815, "epoch": 323} {"train_loss": -18.36116600036621, "global_step": 26816, "epoch": 323} {"train_loss": -18.468006134033203, "global_step": 26817, "epoch": 323} {"train_loss": -18.37992286682129, "global_step": 26818, "epoch": 323} {"train_loss": -18.7225341796875, "global_step": 26819, "epoch": 323} {"train_loss": -18.654762268066406, "global_step": 26820, "epoch": 323} {"train_loss": -19.234827041625977, "global_step": 26821, "epoch": 323} {"train_loss": -19.052072525024414, "global_step": 26822, "epoch": 323} {"train_loss": -18.792606353759766, "global_step": 26823, "epoch": 323} {"train_loss": -18.74942398071289, "global_step": 26824, "epoch": 323} {"train_loss": -18.621183395385742, "global_step": 26825, "epoch": 323} {"train_loss": -18.864274978637695, "global_step": 26826, "epoch": 323} {"train_loss": -18.72335433959961, "global_step": 26827, "epoch": 323} {"train_loss": -18.88766860961914, "global_step": 26828, "epoch": 323} {"train_loss": -19.010061264038086, "global_step": 26829, "epoch": 323} {"train_loss": -18.772363662719727, "global_step": 26830, "epoch": 323} {"train_loss": -19.01889991760254, "global_step": 26831, "epoch": 323} {"train_loss": -18.8426513671875, "global_step": 26832, "epoch": 323} {"train_loss": -19.095325469970703, "global_step": 26833, "epoch": 323} {"train_loss": -18.8403263092041, "global_step": 26834, "epoch": 323} {"train_loss": -18.850500106811523, "global_step": 26835, "epoch": 323} {"train_loss": -18.573762893676758, "global_step": 26836, "epoch": 323} {"train_loss": -18.776874542236328, "global_step": 26837, "epoch": 323} {"train_loss": -18.788589477539062, "global_step": 26838, "epoch": 323} {"train_loss": -18.50766372680664, "global_step": 26839, "epoch": 323} {"train_loss": -19.092432022094727, "global_step": 26840, "epoch": 323} {"train_loss": -18.736989974975586, "global_step": 26841, "epoch": 323} {"train_loss": -18.43174171447754, "global_step": 26842, "epoch": 323} {"train_loss": -18.45958137512207, "global_step": 26843, "epoch": 323} {"train_loss": -18.755590438842773, "global_step": 26844, "epoch": 323} {"train_loss": -18.799100875854492, "global_step": 26845, "epoch": 323} {"train_loss": -18.527206420898438, "global_step": 26846, "epoch": 323} {"train_loss": -18.606168746948242, "global_step": 26847, "epoch": 323} {"train_loss": -18.593830108642578, "global_step": 26848, "epoch": 323} {"train_loss": -18.920909881591797, "global_step": 26849, "epoch": 323} {"train_loss": -18.917922973632812, "global_step": 26850, "epoch": 323} {"train_loss": -18.706544876098633, "global_step": 26851, "epoch": 323} {"train_loss": -18.862886428833008, "global_step": 26852, "epoch": 323} {"train_loss": -19.102514266967773, "global_step": 26853, "epoch": 323} {"train_loss": -18.78362274169922, "global_step": 26854, "epoch": 323} {"train_loss": -18.686491012573242, "global_step": 26855, "epoch": 323} {"train_loss": -18.69059944152832, "global_step": 26856, "epoch": 323} {"train_loss": -18.511489868164062, "global_step": 26857, "epoch": 323} {"train_loss": -18.703920364379883, "global_step": 26858, "epoch": 323} {"train_loss": -18.948606491088867, "global_step": 26859, "epoch": 323} {"train_loss": -18.78602409362793, "global_step": 26860, "epoch": 323} {"train_loss": -18.977964401245117, "global_step": 26861, "epoch": 323} {"train_loss": -18.873821258544922, "global_step": 26862, "epoch": 323} {"train_loss": -18.655820846557617, "global_step": 26863, "epoch": 323} {"train_loss": -18.819433212280273, "global_step": 26864, "epoch": 323} {"train_loss": -18.7565975189209, "global_step": 26865, "epoch": 323} {"train_loss": -18.758207321166992, "global_step": 26866, "epoch": 323} {"train_loss": -18.63138771057129, "global_step": 26867, "epoch": 323} {"train_loss": -18.497539520263672, "global_step": 26868, "epoch": 323} {"train_loss": -18.672117233276367, "global_step": 26869, "epoch": 323} {"train_loss": -18.643529891967773, "global_step": 26870, "epoch": 323} {"train_loss": -18.603239059448242, "global_step": 26871, "epoch": 323} {"train_loss": -18.870849609375, "global_step": 26872, "epoch": 323} {"train_loss": -18.561628341674805, "global_step": 26873, "epoch": 323} {"train_loss": -18.92925453186035, "global_step": 26874, "epoch": 323} {"train_loss": -18.829051971435547, "global_step": 26875, "epoch": 323} {"train_loss": -18.85886573791504, "global_step": 26876, "epoch": 323} {"train_loss": -18.455188751220703, "global_step": 26877, "epoch": 323} {"train_loss": -18.976144790649414, "global_step": 26878, "epoch": 323} {"train_loss": -18.705249786376953, "global_step": 26879, "epoch": 323} {"train_loss": -18.959014892578125, "global_step": 26880, "epoch": 323} {"train_loss": -18.50419044494629, "global_step": 26881, "epoch": 323} {"train_loss": -18.945423126220703, "global_step": 26882, "epoch": 323} {"train_loss": -18.293241500854492, "global_step": 26883, "epoch": 323} {"train_loss": -19.17782974243164, "global_step": 26884, "epoch": 323} {"train_loss": -18.725011825561523, "global_step": 26885, "epoch": 323} {"train_loss": -18.591520309448242, "global_step": 26886, "epoch": 323} {"train_loss": -18.863452911376953, "global_step": 26887, "epoch": 323} {"train_loss": -18.882360458374023, "global_step": 26888, "epoch": 323} {"train_loss": -18.75149917602539, "global_step": 26889, "epoch": 323} {"train_loss": -18.487390518188477, "global_step": 26890, "epoch": 323} {"train_loss": -18.750853940665003, "global_step": 26891, "epoch": 323, "val_loss": 5965357.0} {"train_loss": -18.727264404296875, "global_step": 26892, "epoch": 324} {"train_loss": -18.36452293395996, "global_step": 26893, "epoch": 324} {"train_loss": -18.582944869995117, "global_step": 26894, "epoch": 324} {"train_loss": -18.48944664001465, "global_step": 26895, "epoch": 324} {"train_loss": -18.841197967529297, "global_step": 26896, "epoch": 324} {"train_loss": -18.586668014526367, "global_step": 26897, "epoch": 324} {"train_loss": -18.858118057250977, "global_step": 26898, "epoch": 324} {"train_loss": -18.53031349182129, "global_step": 26899, "epoch": 324} {"train_loss": -18.601999282836914, "global_step": 26900, "epoch": 324} {"train_loss": -18.77242660522461, "global_step": 26901, "epoch": 324} {"train_loss": -18.88494873046875, "global_step": 26902, "epoch": 324} {"train_loss": -18.86684226989746, "global_step": 26903, "epoch": 324} {"train_loss": -18.412546157836914, "global_step": 26904, "epoch": 324} {"train_loss": -18.908552169799805, "global_step": 26905, "epoch": 324} {"train_loss": -18.779991149902344, "global_step": 26906, "epoch": 324} {"train_loss": -18.409975051879883, "global_step": 26907, "epoch": 324} {"train_loss": -18.41864013671875, "global_step": 26908, "epoch": 324} {"train_loss": -18.515338897705078, "global_step": 26909, "epoch": 324} {"train_loss": -18.804067611694336, "global_step": 26910, "epoch": 324} {"train_loss": -18.92472267150879, "global_step": 26911, "epoch": 324} {"train_loss": -18.55478286743164, "global_step": 26912, "epoch": 324} {"train_loss": -18.683713912963867, "global_step": 26913, "epoch": 324} {"train_loss": -18.62934684753418, "global_step": 26914, "epoch": 324} {"train_loss": -18.984418869018555, "global_step": 26915, "epoch": 324} {"train_loss": -18.796653747558594, "global_step": 26916, "epoch": 324} {"train_loss": -18.638662338256836, "global_step": 26917, "epoch": 324} {"train_loss": -18.979368209838867, "global_step": 26918, "epoch": 324} {"train_loss": -18.769041061401367, "global_step": 26919, "epoch": 324} {"train_loss": -19.147130966186523, "global_step": 26920, "epoch": 324} {"train_loss": -19.00861167907715, "global_step": 26921, "epoch": 324} {"train_loss": -18.659793853759766, "global_step": 26922, "epoch": 324} {"train_loss": -18.628433227539062, "global_step": 26923, "epoch": 324} {"train_loss": -18.657550811767578, "global_step": 26924, "epoch": 324} {"train_loss": -18.84134292602539, "global_step": 26925, "epoch": 324} {"train_loss": -18.2876033782959, "global_step": 26926, "epoch": 324} {"train_loss": -19.20983123779297, "global_step": 26927, "epoch": 324} {"train_loss": -18.55722999572754, "global_step": 26928, "epoch": 324} {"train_loss": -18.73384666442871, "global_step": 26929, "epoch": 324} {"train_loss": -18.749797821044922, "global_step": 26930, "epoch": 324} {"train_loss": -18.81049919128418, "global_step": 26931, "epoch": 324} {"train_loss": -18.688108444213867, "global_step": 26932, "epoch": 324} {"train_loss": -18.86005210876465, "global_step": 26933, "epoch": 324} {"train_loss": -18.69923210144043, "global_step": 26934, "epoch": 324} {"train_loss": -18.7217960357666, "global_step": 26935, "epoch": 324} {"train_loss": -18.68010902404785, "global_step": 26936, "epoch": 324} {"train_loss": -19.189435958862305, "global_step": 26937, "epoch": 324} {"train_loss": -18.474775314331055, "global_step": 26938, "epoch": 324} {"train_loss": -19.044485092163086, "global_step": 26939, "epoch": 324} {"train_loss": -18.804523468017578, "global_step": 26940, "epoch": 324} {"train_loss": -18.7550106048584, "global_step": 26941, "epoch": 324} {"train_loss": -19.069963455200195, "global_step": 26942, "epoch": 324} {"train_loss": -18.98513412475586, "global_step": 26943, "epoch": 324} {"train_loss": -18.85799217224121, "global_step": 26944, "epoch": 324} {"train_loss": -18.938810348510742, "global_step": 26945, "epoch": 324} {"train_loss": -18.90346336364746, "global_step": 26946, "epoch": 324} {"train_loss": -18.96793556213379, "global_step": 26947, "epoch": 324} {"train_loss": -18.953521728515625, "global_step": 26948, "epoch": 324} {"train_loss": -19.064367294311523, "global_step": 26949, "epoch": 324} {"train_loss": -18.65326499938965, "global_step": 26950, "epoch": 324} {"train_loss": -18.80908966064453, "global_step": 26951, "epoch": 324} {"train_loss": -19.02609634399414, "global_step": 26952, "epoch": 324} {"train_loss": -18.60574722290039, "global_step": 26953, "epoch": 324} {"train_loss": -18.89708709716797, "global_step": 26954, "epoch": 324} {"train_loss": -18.80691909790039, "global_step": 26955, "epoch": 324} {"train_loss": -19.000293731689453, "global_step": 26956, "epoch": 324} {"train_loss": -18.9991512298584, "global_step": 26957, "epoch": 324} {"train_loss": -18.453123092651367, "global_step": 26958, "epoch": 324} {"train_loss": -18.23343849182129, "global_step": 26959, "epoch": 324} {"train_loss": -18.60141944885254, "global_step": 26960, "epoch": 324} {"train_loss": -18.962514877319336, "global_step": 26961, "epoch": 324} {"train_loss": -18.59967613220215, "global_step": 26962, "epoch": 324} {"train_loss": -18.82953453063965, "global_step": 26963, "epoch": 324} {"train_loss": -18.777786254882812, "global_step": 26964, "epoch": 324} {"train_loss": -18.391281127929688, "global_step": 26965, "epoch": 324} {"train_loss": -18.785186767578125, "global_step": 26966, "epoch": 324} {"train_loss": -18.764568328857422, "global_step": 26967, "epoch": 324} {"train_loss": -18.54105567932129, "global_step": 26968, "epoch": 324} {"train_loss": -18.661178588867188, "global_step": 26969, "epoch": 324} {"train_loss": -19.004596710205078, "global_step": 26970, "epoch": 324} {"train_loss": -18.55278968811035, "global_step": 26971, "epoch": 324} {"train_loss": -18.60538673400879, "global_step": 26972, "epoch": 324} {"train_loss": -18.729846954345703, "global_step": 26973, "epoch": 324} {"train_loss": -18.75851729978998, "global_step": 26974, "epoch": 324, "val_loss": 5967817.5} {"train_loss": -18.722515106201172, "global_step": 26975, "epoch": 325} {"train_loss": -18.167034149169922, "global_step": 26976, "epoch": 325} {"train_loss": -18.131311416625977, "global_step": 26977, "epoch": 325} {"train_loss": -18.18629264831543, "global_step": 26978, "epoch": 325} {"train_loss": -18.56648063659668, "global_step": 26979, "epoch": 325} {"train_loss": -18.45496940612793, "global_step": 26980, "epoch": 325} {"train_loss": -18.99009895324707, "global_step": 26981, "epoch": 325} {"train_loss": -18.669204711914062, "global_step": 26982, "epoch": 325} {"train_loss": -18.610708236694336, "global_step": 26983, "epoch": 325} {"train_loss": -18.538381576538086, "global_step": 26984, "epoch": 325} {"train_loss": -18.606054306030273, "global_step": 26985, "epoch": 325} {"train_loss": -18.19849395751953, "global_step": 26986, "epoch": 325} {"train_loss": -18.236066818237305, "global_step": 26987, "epoch": 325} {"train_loss": -18.8550968170166, "global_step": 26988, "epoch": 325} {"train_loss": -18.536701202392578, "global_step": 26989, "epoch": 325} {"train_loss": -18.82164764404297, "global_step": 26990, "epoch": 325} {"train_loss": -18.634784698486328, "global_step": 26991, "epoch": 325} {"train_loss": -18.598447799682617, "global_step": 26992, "epoch": 325} {"train_loss": -18.791217803955078, "global_step": 26993, "epoch": 325} {"train_loss": -19.09955596923828, "global_step": 26994, "epoch": 325} {"train_loss": -18.442092895507812, "global_step": 26995, "epoch": 325} {"train_loss": -18.52882194519043, "global_step": 26996, "epoch": 325} {"train_loss": -19.0003662109375, "global_step": 26997, "epoch": 325} {"train_loss": -18.83113670349121, "global_step": 26998, "epoch": 325} {"train_loss": -18.923688888549805, "global_step": 26999, "epoch": 325} {"train_loss": -18.87075424194336, "global_step": 27000, "epoch": 325} {"train_loss": -18.951282501220703, "global_step": 27001, "epoch": 325} {"train_loss": -18.797422409057617, "global_step": 27002, "epoch": 325} {"train_loss": -18.81538200378418, "global_step": 27003, "epoch": 325} {"train_loss": -18.610126495361328, "global_step": 27004, "epoch": 325} {"train_loss": -18.675073623657227, "global_step": 27005, "epoch": 325} {"train_loss": -19.13422966003418, "global_step": 27006, "epoch": 325} {"train_loss": -18.43025779724121, "global_step": 27007, "epoch": 325} {"train_loss": -18.52326774597168, "global_step": 27008, "epoch": 325} {"train_loss": -18.83053970336914, "global_step": 27009, "epoch": 325} {"train_loss": -18.562135696411133, "global_step": 27010, "epoch": 325} {"train_loss": -18.692459106445312, "global_step": 27011, "epoch": 325} {"train_loss": -18.969755172729492, "global_step": 27012, "epoch": 325} {"train_loss": -18.8775577545166, "global_step": 27013, "epoch": 325} {"train_loss": -19.00074577331543, "global_step": 27014, "epoch": 325} {"train_loss": -18.496728897094727, "global_step": 27015, "epoch": 325} {"train_loss": -18.901273727416992, "global_step": 27016, "epoch": 325} {"train_loss": -18.87369155883789, "global_step": 27017, "epoch": 325} {"train_loss": -18.788679122924805, "global_step": 27018, "epoch": 325} {"train_loss": -18.742101669311523, "global_step": 27019, "epoch": 325} {"train_loss": -18.930789947509766, "global_step": 27020, "epoch": 325} {"train_loss": -18.717329025268555, "global_step": 27021, "epoch": 325} {"train_loss": -18.94784164428711, "global_step": 27022, "epoch": 325} {"train_loss": -19.051538467407227, "global_step": 27023, "epoch": 325} {"train_loss": -18.76344871520996, "global_step": 27024, "epoch": 325} {"train_loss": -18.711017608642578, "global_step": 27025, "epoch": 325} {"train_loss": -19.03959083557129, "global_step": 27026, "epoch": 325} {"train_loss": -18.4337215423584, "global_step": 27027, "epoch": 325} {"train_loss": -18.353429794311523, "global_step": 27028, "epoch": 325} {"train_loss": -18.488243103027344, "global_step": 27029, "epoch": 325} {"train_loss": -18.667463302612305, "global_step": 27030, "epoch": 325} {"train_loss": -18.737293243408203, "global_step": 27031, "epoch": 325} {"train_loss": -18.749103546142578, "global_step": 27032, "epoch": 325} {"train_loss": -18.689834594726562, "global_step": 27033, "epoch": 325} {"train_loss": -18.765111923217773, "global_step": 27034, "epoch": 325} {"train_loss": -19.12786293029785, "global_step": 27035, "epoch": 325} {"train_loss": -18.434432983398438, "global_step": 27036, "epoch": 325} {"train_loss": -19.018054962158203, "global_step": 27037, "epoch": 325} {"train_loss": -18.75520133972168, "global_step": 27038, "epoch": 325} {"train_loss": -18.691627502441406, "global_step": 27039, "epoch": 325} {"train_loss": -19.05548858642578, "global_step": 27040, "epoch": 325} {"train_loss": -18.289413452148438, "global_step": 27041, "epoch": 325} {"train_loss": -18.897480010986328, "global_step": 27042, "epoch": 325} {"train_loss": -18.395801544189453, "global_step": 27043, "epoch": 325} {"train_loss": -18.79189109802246, "global_step": 27044, "epoch": 325} {"train_loss": -18.667932510375977, "global_step": 27045, "epoch": 325} {"train_loss": -19.277454376220703, "global_step": 27046, "epoch": 325} {"train_loss": -19.220800399780273, "global_step": 27047, "epoch": 325} {"train_loss": -18.787235260009766, "global_step": 27048, "epoch": 325} {"train_loss": -18.67121696472168, "global_step": 27049, "epoch": 325} {"train_loss": -18.859567642211914, "global_step": 27050, "epoch": 325} {"train_loss": -18.384000778198242, "global_step": 27051, "epoch": 325} {"train_loss": -18.914941787719727, "global_step": 27052, "epoch": 325} {"train_loss": -18.718530654907227, "global_step": 27053, "epoch": 325} {"train_loss": -18.624338150024414, "global_step": 27054, "epoch": 325} {"train_loss": -18.6252498626709, "global_step": 27055, "epoch": 325} {"train_loss": -19.0239315032959, "global_step": 27056, "epoch": 325} {"train_loss": -18.741028797195618, "global_step": 27057, "epoch": 325, "val_loss": 5987303.0} {"train_loss": -18.203418731689453, "global_step": 27058, "epoch": 326} {"train_loss": -18.5426025390625, "global_step": 27059, "epoch": 326} {"train_loss": -18.61481285095215, "global_step": 27060, "epoch": 326} {"train_loss": -18.79684066772461, "global_step": 27061, "epoch": 326} {"train_loss": -18.739404678344727, "global_step": 27062, "epoch": 326} {"train_loss": -18.83047103881836, "global_step": 27063, "epoch": 326} {"train_loss": -18.696191787719727, "global_step": 27064, "epoch": 326} {"train_loss": -18.47348403930664, "global_step": 27065, "epoch": 326} {"train_loss": -18.94349479675293, "global_step": 27066, "epoch": 326} {"train_loss": -18.458951950073242, "global_step": 27067, "epoch": 326} {"train_loss": -18.68534278869629, "global_step": 27068, "epoch": 326} {"train_loss": -18.8437442779541, "global_step": 27069, "epoch": 326} {"train_loss": -18.77131462097168, "global_step": 27070, "epoch": 326} {"train_loss": -18.801090240478516, "global_step": 27071, "epoch": 326} {"train_loss": -18.765975952148438, "global_step": 27072, "epoch": 326} {"train_loss": -18.847393035888672, "global_step": 27073, "epoch": 326} {"train_loss": -19.0271053314209, "global_step": 27074, "epoch": 326} {"train_loss": -18.782638549804688, "global_step": 27075, "epoch": 326} {"train_loss": -18.494049072265625, "global_step": 27076, "epoch": 326} {"train_loss": -18.66794776916504, "global_step": 27077, "epoch": 326} {"train_loss": -19.073400497436523, "global_step": 27078, "epoch": 326} {"train_loss": -19.007217407226562, "global_step": 27079, "epoch": 326} {"train_loss": -19.274030685424805, "global_step": 27080, "epoch": 326} {"train_loss": -18.543638229370117, "global_step": 27081, "epoch": 326} {"train_loss": -18.7568416595459, "global_step": 27082, "epoch": 326} {"train_loss": -18.824338912963867, "global_step": 27083, "epoch": 326} {"train_loss": -18.5330867767334, "global_step": 27084, "epoch": 326} {"train_loss": -18.98294448852539, "global_step": 27085, "epoch": 326} {"train_loss": -18.91788101196289, "global_step": 27086, "epoch": 326} {"train_loss": -18.81211280822754, "global_step": 27087, "epoch": 326} {"train_loss": -18.20528221130371, "global_step": 27088, "epoch": 326} {"train_loss": -18.750308990478516, "global_step": 27089, "epoch": 326} {"train_loss": -18.40455436706543, "global_step": 27090, "epoch": 326} {"train_loss": -18.8259334564209, "global_step": 27091, "epoch": 326} {"train_loss": -19.03167724609375, "global_step": 27092, "epoch": 326} {"train_loss": -18.87184715270996, "global_step": 27093, "epoch": 326} {"train_loss": -18.557004928588867, "global_step": 27094, "epoch": 326} {"train_loss": -18.78963279724121, "global_step": 27095, "epoch": 326} {"train_loss": -19.161428451538086, "global_step": 27096, "epoch": 326} {"train_loss": -18.858610153198242, "global_step": 27097, "epoch": 326} {"train_loss": -18.63248062133789, "global_step": 27098, "epoch": 326} {"train_loss": -18.70513153076172, "global_step": 27099, "epoch": 326} {"train_loss": -18.773365020751953, "global_step": 27100, "epoch": 326} {"train_loss": -18.822099685668945, "global_step": 27101, "epoch": 326} {"train_loss": -18.9064884185791, "global_step": 27102, "epoch": 326} {"train_loss": -18.439218521118164, "global_step": 27103, "epoch": 326} {"train_loss": -18.655704498291016, "global_step": 27104, "epoch": 326} {"train_loss": -18.763086318969727, "global_step": 27105, "epoch": 326} {"train_loss": -18.51376724243164, "global_step": 27106, "epoch": 326} {"train_loss": -18.768585205078125, "global_step": 27107, "epoch": 326} {"train_loss": -19.262897491455078, "global_step": 27108, "epoch": 326} {"train_loss": -18.787519454956055, "global_step": 27109, "epoch": 326} {"train_loss": -18.81898307800293, "global_step": 27110, "epoch": 326} {"train_loss": -18.909740447998047, "global_step": 27111, "epoch": 326} {"train_loss": -18.54903221130371, "global_step": 27112, "epoch": 326} {"train_loss": -18.808910369873047, "global_step": 27113, "epoch": 326} {"train_loss": -18.548803329467773, "global_step": 27114, "epoch": 326} {"train_loss": -18.76018714904785, "global_step": 27115, "epoch": 326} {"train_loss": -18.89216423034668, "global_step": 27116, "epoch": 326} {"train_loss": -18.54352569580078, "global_step": 27117, "epoch": 326} {"train_loss": -18.880897521972656, "global_step": 27118, "epoch": 326} {"train_loss": -18.741220474243164, "global_step": 27119, "epoch": 326} {"train_loss": -19.135889053344727, "global_step": 27120, "epoch": 326} {"train_loss": -18.597700119018555, "global_step": 27121, "epoch": 326} {"train_loss": -18.75941276550293, "global_step": 27122, "epoch": 326} {"train_loss": -19.035303115844727, "global_step": 27123, "epoch": 326} {"train_loss": -18.967844009399414, "global_step": 27124, "epoch": 326} {"train_loss": -18.516868591308594, "global_step": 27125, "epoch": 326} {"train_loss": -18.924823760986328, "global_step": 27126, "epoch": 326} {"train_loss": -18.69997215270996, "global_step": 27127, "epoch": 326} {"train_loss": -19.02581787109375, "global_step": 27128, "epoch": 326} {"train_loss": -19.21462059020996, "global_step": 27129, "epoch": 326} {"train_loss": -18.888349533081055, "global_step": 27130, "epoch": 326} {"train_loss": -18.357807159423828, "global_step": 27131, "epoch": 326} {"train_loss": -18.834335327148438, "global_step": 27132, "epoch": 326} {"train_loss": -18.869577407836914, "global_step": 27133, "epoch": 326} {"train_loss": -18.797910690307617, "global_step": 27134, "epoch": 326} {"train_loss": -19.09309959411621, "global_step": 27135, "epoch": 326} {"train_loss": -18.733755111694336, "global_step": 27136, "epoch": 326} {"train_loss": -18.835298538208008, "global_step": 27137, "epoch": 326} {"train_loss": -19.07010841369629, "global_step": 27138, "epoch": 326} {"train_loss": -18.679691314697266, "global_step": 27139, "epoch": 326} {"train_loss": -18.77662555280938, "global_step": 27140, "epoch": 326, "val_loss": 6051601.0} {"train_loss": -18.648313522338867, "global_step": 27141, "epoch": 327} {"train_loss": -18.785409927368164, "global_step": 27142, "epoch": 327} {"train_loss": -19.07034683227539, "global_step": 27143, "epoch": 327} {"train_loss": -18.841184616088867, "global_step": 27144, "epoch": 327} {"train_loss": -18.92976188659668, "global_step": 27145, "epoch": 327} {"train_loss": -18.703393936157227, "global_step": 27146, "epoch": 327} {"train_loss": -18.715208053588867, "global_step": 27147, "epoch": 327} {"train_loss": -18.92852783203125, "global_step": 27148, "epoch": 327} {"train_loss": -18.618932723999023, "global_step": 27149, "epoch": 327} {"train_loss": -19.051006317138672, "global_step": 27150, "epoch": 327} {"train_loss": -18.731191635131836, "global_step": 27151, "epoch": 327} {"train_loss": -18.96684455871582, "global_step": 27152, "epoch": 327} {"train_loss": -18.86244010925293, "global_step": 27153, "epoch": 327} {"train_loss": -18.547353744506836, "global_step": 27154, "epoch": 327} {"train_loss": -18.557903289794922, "global_step": 27155, "epoch": 327} {"train_loss": -18.807159423828125, "global_step": 27156, "epoch": 327} {"train_loss": -19.08729362487793, "global_step": 27157, "epoch": 327} {"train_loss": -18.805025100708008, "global_step": 27158, "epoch": 327} {"train_loss": -18.8795108795166, "global_step": 27159, "epoch": 327} {"train_loss": -18.925434112548828, "global_step": 27160, "epoch": 327} {"train_loss": -18.363555908203125, "global_step": 27161, "epoch": 327} {"train_loss": -18.728200912475586, "global_step": 27162, "epoch": 327} {"train_loss": -18.7355899810791, "global_step": 27163, "epoch": 327} {"train_loss": -18.552770614624023, "global_step": 27164, "epoch": 327} {"train_loss": -18.766752243041992, "global_step": 27165, "epoch": 327} {"train_loss": -19.070192337036133, "global_step": 27166, "epoch": 327} {"train_loss": -19.123205184936523, "global_step": 27167, "epoch": 327} {"train_loss": -18.79479217529297, "global_step": 27168, "epoch": 327} {"train_loss": -19.00384521484375, "global_step": 27169, "epoch": 327} {"train_loss": -18.613489151000977, "global_step": 27170, "epoch": 327} {"train_loss": -18.969152450561523, "global_step": 27171, "epoch": 327} {"train_loss": -18.80234146118164, "global_step": 27172, "epoch": 327} {"train_loss": -18.80821418762207, "global_step": 27173, "epoch": 327} {"train_loss": -18.59674072265625, "global_step": 27174, "epoch": 327} {"train_loss": -18.56052589416504, "global_step": 27175, "epoch": 327} {"train_loss": -18.967639923095703, "global_step": 27176, "epoch": 327} {"train_loss": -18.572635650634766, "global_step": 27177, "epoch": 327} {"train_loss": -18.76254653930664, "global_step": 27178, "epoch": 327} {"train_loss": -18.845962524414062, "global_step": 27179, "epoch": 327} {"train_loss": -18.74456787109375, "global_step": 27180, "epoch": 327} {"train_loss": -18.346769332885742, "global_step": 27181, "epoch": 327} {"train_loss": -19.029577255249023, "global_step": 27182, "epoch": 327} {"train_loss": -18.52219581604004, "global_step": 27183, "epoch": 327} {"train_loss": -19.105276107788086, "global_step": 27184, "epoch": 327} {"train_loss": -19.0087890625, "global_step": 27185, "epoch": 327} {"train_loss": -18.867069244384766, "global_step": 27186, "epoch": 327} {"train_loss": -18.694381713867188, "global_step": 27187, "epoch": 327} {"train_loss": -18.59889793395996, "global_step": 27188, "epoch": 327} {"train_loss": -18.714162826538086, "global_step": 27189, "epoch": 327} {"train_loss": -18.98293685913086, "global_step": 27190, "epoch": 327} {"train_loss": -18.885351181030273, "global_step": 27191, "epoch": 327} {"train_loss": -18.823150634765625, "global_step": 27192, "epoch": 327} {"train_loss": -18.682554244995117, "global_step": 27193, "epoch": 327} {"train_loss": -18.92327880859375, "global_step": 27194, "epoch": 327} {"train_loss": -18.619421005249023, "global_step": 27195, "epoch": 327} {"train_loss": -18.629291534423828, "global_step": 27196, "epoch": 327} {"train_loss": -18.806968688964844, "global_step": 27197, "epoch": 327} {"train_loss": -18.958433151245117, "global_step": 27198, "epoch": 327} {"train_loss": -18.94521713256836, "global_step": 27199, "epoch": 327} {"train_loss": -18.48467254638672, "global_step": 27200, "epoch": 327} {"train_loss": -18.981285095214844, "global_step": 27201, "epoch": 327} {"train_loss": -19.13130760192871, "global_step": 27202, "epoch": 327} {"train_loss": -18.728086471557617, "global_step": 27203, "epoch": 327} {"train_loss": -18.69990348815918, "global_step": 27204, "epoch": 327} {"train_loss": -19.15687370300293, "global_step": 27205, "epoch": 327} {"train_loss": -19.12713050842285, "global_step": 27206, "epoch": 327} {"train_loss": -18.916221618652344, "global_step": 27207, "epoch": 327} {"train_loss": -19.148664474487305, "global_step": 27208, "epoch": 327} {"train_loss": -18.96521759033203, "global_step": 27209, "epoch": 327} {"train_loss": -18.80535316467285, "global_step": 27210, "epoch": 327} {"train_loss": -19.037887573242188, "global_step": 27211, "epoch": 327} {"train_loss": -18.83473777770996, "global_step": 27212, "epoch": 327} {"train_loss": -18.617721557617188, "global_step": 27213, "epoch": 327} {"train_loss": -18.508502960205078, "global_step": 27214, "epoch": 327} {"train_loss": -18.639333724975586, "global_step": 27215, "epoch": 327} {"train_loss": -18.434938430786133, "global_step": 27216, "epoch": 327} {"train_loss": -18.817840576171875, "global_step": 27217, "epoch": 327} {"train_loss": -18.43521499633789, "global_step": 27218, "epoch": 327} {"train_loss": -18.772581100463867, "global_step": 27219, "epoch": 327} {"train_loss": -18.474393844604492, "global_step": 27220, "epoch": 327} {"train_loss": -18.728918075561523, "global_step": 27221, "epoch": 327} {"train_loss": -18.78981590270996, "global_step": 27222, "epoch": 327} {"train_loss": -18.78759032559682, "global_step": 27223, "epoch": 327, "val_loss": 5945123.5} {"train_loss": -19.15403938293457, "global_step": 27224, "epoch": 328} {"train_loss": -18.69672393798828, "global_step": 27225, "epoch": 328} {"train_loss": -18.592151641845703, "global_step": 27226, "epoch": 328} {"train_loss": -18.431425094604492, "global_step": 27227, "epoch": 328} {"train_loss": -18.569198608398438, "global_step": 27228, "epoch": 328} {"train_loss": -18.867525100708008, "global_step": 27229, "epoch": 328} {"train_loss": -18.902969360351562, "global_step": 27230, "epoch": 328} {"train_loss": -18.81194496154785, "global_step": 27231, "epoch": 328} {"train_loss": -18.87812614440918, "global_step": 27232, "epoch": 328} {"train_loss": -18.820755004882812, "global_step": 27233, "epoch": 328} {"train_loss": -18.766000747680664, "global_step": 27234, "epoch": 328} {"train_loss": -18.87835121154785, "global_step": 27235, "epoch": 328} {"train_loss": -18.602880477905273, "global_step": 27236, "epoch": 328} {"train_loss": -18.441007614135742, "global_step": 27237, "epoch": 328} {"train_loss": -18.717382431030273, "global_step": 27238, "epoch": 328} {"train_loss": -18.903669357299805, "global_step": 27239, "epoch": 328} {"train_loss": -19.0070743560791, "global_step": 27240, "epoch": 328} {"train_loss": -19.210193634033203, "global_step": 27241, "epoch": 328} {"train_loss": -18.390869140625, "global_step": 27242, "epoch": 328} {"train_loss": -18.78806495666504, "global_step": 27243, "epoch": 328} {"train_loss": -18.69402503967285, "global_step": 27244, "epoch": 328} {"train_loss": -18.774913787841797, "global_step": 27245, "epoch": 328} {"train_loss": -18.584064483642578, "global_step": 27246, "epoch": 328} {"train_loss": -18.72467041015625, "global_step": 27247, "epoch": 328} {"train_loss": -18.571226119995117, "global_step": 27248, "epoch": 328} {"train_loss": -18.390836715698242, "global_step": 27249, "epoch": 328} {"train_loss": -18.55924415588379, "global_step": 27250, "epoch": 328} {"train_loss": -18.527191162109375, "global_step": 27251, "epoch": 328} {"train_loss": -19.038156509399414, "global_step": 27252, "epoch": 328} {"train_loss": -19.0084285736084, "global_step": 27253, "epoch": 328} {"train_loss": -18.728897094726562, "global_step": 27254, "epoch": 328} {"train_loss": -18.9793758392334, "global_step": 27255, "epoch": 328} {"train_loss": -18.986066818237305, "global_step": 27256, "epoch": 328} {"train_loss": -18.910629272460938, "global_step": 27257, "epoch": 328} {"train_loss": -18.931591033935547, "global_step": 27258, "epoch": 328} {"train_loss": -19.05483055114746, "global_step": 27259, "epoch": 328} {"train_loss": -19.2374267578125, "global_step": 27260, "epoch": 328} {"train_loss": -18.471784591674805, "global_step": 27261, "epoch": 328} {"train_loss": -18.79818344116211, "global_step": 27262, "epoch": 328} {"train_loss": -18.80987548828125, "global_step": 27263, "epoch": 328} {"train_loss": -18.75460433959961, "global_step": 27264, "epoch": 328} {"train_loss": -19.0675048828125, "global_step": 27265, "epoch": 328} {"train_loss": -18.815479278564453, "global_step": 27266, "epoch": 328} {"train_loss": -18.534046173095703, "global_step": 27267, "epoch": 328} {"train_loss": -19.24759292602539, "global_step": 27268, "epoch": 328} {"train_loss": -19.285856246948242, "global_step": 27269, "epoch": 328} {"train_loss": -18.547473907470703, "global_step": 27270, "epoch": 328} {"train_loss": -18.753280639648438, "global_step": 27271, "epoch": 328} {"train_loss": -18.44352149963379, "global_step": 27272, "epoch": 328} {"train_loss": -18.873456954956055, "global_step": 27273, "epoch": 328} {"train_loss": -19.086042404174805, "global_step": 27274, "epoch": 328} {"train_loss": -18.857810974121094, "global_step": 27275, "epoch": 328} {"train_loss": -18.532148361206055, "global_step": 27276, "epoch": 328} {"train_loss": -18.46084976196289, "global_step": 27277, "epoch": 328} {"train_loss": -18.775238037109375, "global_step": 27278, "epoch": 328} {"train_loss": -18.97199058532715, "global_step": 27279, "epoch": 328} {"train_loss": -18.91957664489746, "global_step": 27280, "epoch": 328} {"train_loss": -19.00917625427246, "global_step": 27281, "epoch": 328} {"train_loss": -18.688413619995117, "global_step": 27282, "epoch": 328} {"train_loss": -18.61122703552246, "global_step": 27283, "epoch": 328} {"train_loss": -18.20139503479004, "global_step": 27284, "epoch": 328} {"train_loss": -18.66118812561035, "global_step": 27285, "epoch": 328} {"train_loss": -18.725658416748047, "global_step": 27286, "epoch": 328} {"train_loss": -19.151525497436523, "global_step": 27287, "epoch": 328} {"train_loss": -18.55009651184082, "global_step": 27288, "epoch": 328} {"train_loss": -18.4216251373291, "global_step": 27289, "epoch": 328} {"train_loss": -19.10590934753418, "global_step": 27290, "epoch": 328} {"train_loss": -18.625919342041016, "global_step": 27291, "epoch": 328} {"train_loss": -18.894941329956055, "global_step": 27292, "epoch": 328} {"train_loss": -18.940032958984375, "global_step": 27293, "epoch": 328} {"train_loss": -18.527175903320312, "global_step": 27294, "epoch": 328} {"train_loss": -18.797117233276367, "global_step": 27295, "epoch": 328} {"train_loss": -18.918973922729492, "global_step": 27296, "epoch": 328} {"train_loss": -18.835140228271484, "global_step": 27297, "epoch": 328} {"train_loss": -18.616613388061523, "global_step": 27298, "epoch": 328} {"train_loss": -18.767942428588867, "global_step": 27299, "epoch": 328} {"train_loss": -18.65791893005371, "global_step": 27300, "epoch": 328} {"train_loss": -18.689472198486328, "global_step": 27301, "epoch": 328} {"train_loss": -18.89548683166504, "global_step": 27302, "epoch": 328} {"train_loss": -18.839204788208008, "global_step": 27303, "epoch": 328} {"train_loss": -18.949066162109375, "global_step": 27304, "epoch": 328} {"train_loss": -18.752792358398438, "global_step": 27305, "epoch": 328} {"train_loss": -18.77687330131071, "global_step": 27306, "epoch": 328, "val_loss": 6029178.5} {"train_loss": -18.30809211730957, "global_step": 27307, "epoch": 329} {"train_loss": -18.534849166870117, "global_step": 27308, "epoch": 329} {"train_loss": -18.774612426757812, "global_step": 27309, "epoch": 329} {"train_loss": -18.754785537719727, "global_step": 27310, "epoch": 329} {"train_loss": -18.526395797729492, "global_step": 27311, "epoch": 329} {"train_loss": -19.042016983032227, "global_step": 27312, "epoch": 329} {"train_loss": -18.73249053955078, "global_step": 27313, "epoch": 329} {"train_loss": -18.987735748291016, "global_step": 27314, "epoch": 329} {"train_loss": -18.66741180419922, "global_step": 27315, "epoch": 329} {"train_loss": -18.663715362548828, "global_step": 27316, "epoch": 329} {"train_loss": -18.834558486938477, "global_step": 27317, "epoch": 329} {"train_loss": -19.105607986450195, "global_step": 27318, "epoch": 329} {"train_loss": -19.00263023376465, "global_step": 27319, "epoch": 329} {"train_loss": -18.998992919921875, "global_step": 27320, "epoch": 329} {"train_loss": -18.894010543823242, "global_step": 27321, "epoch": 329} {"train_loss": -18.705488204956055, "global_step": 27322, "epoch": 329} {"train_loss": -18.651111602783203, "global_step": 27323, "epoch": 329} {"train_loss": -18.193836212158203, "global_step": 27324, "epoch": 329} {"train_loss": -18.820737838745117, "global_step": 27325, "epoch": 329} {"train_loss": -19.18411636352539, "global_step": 27326, "epoch": 329} {"train_loss": -18.707077026367188, "global_step": 27327, "epoch": 329} {"train_loss": -18.50156021118164, "global_step": 27328, "epoch": 329} {"train_loss": -18.648324966430664, "global_step": 27329, "epoch": 329} {"train_loss": -19.144895553588867, "global_step": 27330, "epoch": 329} {"train_loss": -19.15247344970703, "global_step": 27331, "epoch": 329} {"train_loss": -19.14046859741211, "global_step": 27332, "epoch": 329} {"train_loss": -18.505014419555664, "global_step": 27333, "epoch": 329} {"train_loss": -18.757505416870117, "global_step": 27334, "epoch": 329} {"train_loss": -18.9509220123291, "global_step": 27335, "epoch": 329} {"train_loss": -18.385589599609375, "global_step": 27336, "epoch": 329} {"train_loss": -18.93354034423828, "global_step": 27337, "epoch": 329} {"train_loss": -18.58247947692871, "global_step": 27338, "epoch": 329} {"train_loss": -18.747671127319336, "global_step": 27339, "epoch": 329} {"train_loss": -18.999662399291992, "global_step": 27340, "epoch": 329} {"train_loss": -18.4790096282959, "global_step": 27341, "epoch": 329} {"train_loss": -19.07014274597168, "global_step": 27342, "epoch": 329} {"train_loss": -19.23664093017578, "global_step": 27343, "epoch": 329} {"train_loss": -18.722976684570312, "global_step": 27344, "epoch": 329} {"train_loss": -18.549142837524414, "global_step": 27345, "epoch": 329} {"train_loss": -18.8341121673584, "global_step": 27346, "epoch": 329} {"train_loss": -19.0994930267334, "global_step": 27347, "epoch": 329} {"train_loss": -18.829723358154297, "global_step": 27348, "epoch": 329} {"train_loss": -18.523296356201172, "global_step": 27349, "epoch": 329} {"train_loss": -18.876873016357422, "global_step": 27350, "epoch": 329} {"train_loss": -18.489032745361328, "global_step": 27351, "epoch": 329} {"train_loss": -18.780515670776367, "global_step": 27352, "epoch": 329} {"train_loss": -18.62263298034668, "global_step": 27353, "epoch": 329} {"train_loss": -18.803359985351562, "global_step": 27354, "epoch": 329} {"train_loss": -18.85273551940918, "global_step": 27355, "epoch": 329} {"train_loss": -18.69999885559082, "global_step": 27356, "epoch": 329} {"train_loss": -19.192171096801758, "global_step": 27357, "epoch": 329} {"train_loss": -18.690866470336914, "global_step": 27358, "epoch": 329} {"train_loss": -18.920785903930664, "global_step": 27359, "epoch": 329} {"train_loss": -18.71587371826172, "global_step": 27360, "epoch": 329} {"train_loss": -19.001157760620117, "global_step": 27361, "epoch": 329} {"train_loss": -18.66030502319336, "global_step": 27362, "epoch": 329} {"train_loss": -18.773374557495117, "global_step": 27363, "epoch": 329} {"train_loss": -18.874597549438477, "global_step": 27364, "epoch": 329} {"train_loss": -18.568655014038086, "global_step": 27365, "epoch": 329} {"train_loss": -18.777435302734375, "global_step": 27366, "epoch": 329} {"train_loss": -18.660446166992188, "global_step": 27367, "epoch": 329} {"train_loss": -19.039321899414062, "global_step": 27368, "epoch": 329} {"train_loss": -18.73799705505371, "global_step": 27369, "epoch": 329} {"train_loss": -18.859399795532227, "global_step": 27370, "epoch": 329} {"train_loss": -18.58949851989746, "global_step": 27371, "epoch": 329} {"train_loss": -18.9454288482666, "global_step": 27372, "epoch": 329} {"train_loss": -19.14703369140625, "global_step": 27373, "epoch": 329} {"train_loss": -18.713285446166992, "global_step": 27374, "epoch": 329} {"train_loss": -19.004404067993164, "global_step": 27375, "epoch": 329} {"train_loss": -18.620031356811523, "global_step": 27376, "epoch": 329} {"train_loss": -18.859296798706055, "global_step": 27377, "epoch": 329} {"train_loss": -18.865034103393555, "global_step": 27378, "epoch": 329} {"train_loss": -19.070425033569336, "global_step": 27379, "epoch": 329} {"train_loss": -18.809953689575195, "global_step": 27380, "epoch": 329} {"train_loss": -19.0079345703125, "global_step": 27381, "epoch": 329} {"train_loss": -18.82517433166504, "global_step": 27382, "epoch": 329} {"train_loss": -18.588115692138672, "global_step": 27383, "epoch": 329} {"train_loss": -18.89654541015625, "global_step": 27384, "epoch": 329} {"train_loss": -18.41693687438965, "global_step": 27385, "epoch": 329} {"train_loss": -18.862483978271484, "global_step": 27386, "epoch": 329} {"train_loss": -18.76580810546875, "global_step": 27387, "epoch": 329} {"train_loss": -18.633203506469727, "global_step": 27388, "epoch": 329} {"train_loss": -18.802413917449584, "global_step": 27389, "epoch": 329, "val_loss": 6095951.0} {"train_loss": -18.26068115234375, "global_step": 27390, "epoch": 330} {"train_loss": -19.05029296875, "global_step": 27391, "epoch": 330} {"train_loss": -18.600126266479492, "global_step": 27392, "epoch": 330} {"train_loss": -18.327316284179688, "global_step": 27393, "epoch": 330} {"train_loss": -18.415159225463867, "global_step": 27394, "epoch": 330} {"train_loss": -18.616878509521484, "global_step": 27395, "epoch": 330} {"train_loss": -18.483112335205078, "global_step": 27396, "epoch": 330} {"train_loss": -19.3095760345459, "global_step": 27397, "epoch": 330} {"train_loss": -18.52463722229004, "global_step": 27398, "epoch": 330} {"train_loss": -18.641996383666992, "global_step": 27399, "epoch": 330} {"train_loss": -18.66095542907715, "global_step": 27400, "epoch": 330} {"train_loss": -18.52611541748047, "global_step": 27401, "epoch": 330} {"train_loss": -18.3748836517334, "global_step": 27402, "epoch": 330} {"train_loss": -19.232229232788086, "global_step": 27403, "epoch": 330} {"train_loss": -18.445724487304688, "global_step": 27404, "epoch": 330} {"train_loss": -19.288211822509766, "global_step": 27405, "epoch": 330} {"train_loss": -18.678020477294922, "global_step": 27406, "epoch": 330} {"train_loss": -18.899152755737305, "global_step": 27407, "epoch": 330} {"train_loss": -19.117839813232422, "global_step": 27408, "epoch": 330} {"train_loss": -18.23681640625, "global_step": 27409, "epoch": 330} {"train_loss": -18.618579864501953, "global_step": 27410, "epoch": 330} {"train_loss": -18.940290451049805, "global_step": 27411, "epoch": 330} {"train_loss": -18.65132713317871, "global_step": 27412, "epoch": 330} {"train_loss": -18.411849975585938, "global_step": 27413, "epoch": 330} {"train_loss": -18.978469848632812, "global_step": 27414, "epoch": 330} {"train_loss": -18.637184143066406, "global_step": 27415, "epoch": 330} {"train_loss": -19.024585723876953, "global_step": 27416, "epoch": 330} {"train_loss": -18.575777053833008, "global_step": 27417, "epoch": 330} {"train_loss": -18.645977020263672, "global_step": 27418, "epoch": 330} {"train_loss": -18.60198402404785, "global_step": 27419, "epoch": 330} {"train_loss": -18.70233917236328, "global_step": 27420, "epoch": 330} {"train_loss": -18.950437545776367, "global_step": 27421, "epoch": 330} {"train_loss": -18.75284194946289, "global_step": 27422, "epoch": 330} {"train_loss": -18.549549102783203, "global_step": 27423, "epoch": 330} {"train_loss": -19.06688690185547, "global_step": 27424, "epoch": 330} {"train_loss": -18.815690994262695, "global_step": 27425, "epoch": 330} {"train_loss": -18.72406005859375, "global_step": 27426, "epoch": 330} {"train_loss": -18.923940658569336, "global_step": 27427, "epoch": 330} {"train_loss": -18.94337272644043, "global_step": 27428, "epoch": 330} {"train_loss": -18.737083435058594, "global_step": 27429, "epoch": 330} {"train_loss": -19.137741088867188, "global_step": 27430, "epoch": 330} {"train_loss": -18.75215721130371, "global_step": 27431, "epoch": 330} {"train_loss": -18.869647979736328, "global_step": 27432, "epoch": 330} {"train_loss": -18.406558990478516, "global_step": 27433, "epoch": 330} {"train_loss": -18.985580444335938, "global_step": 27434, "epoch": 330} {"train_loss": -18.65252685546875, "global_step": 27435, "epoch": 330} {"train_loss": -18.8111572265625, "global_step": 27436, "epoch": 330} {"train_loss": -18.767854690551758, "global_step": 27437, "epoch": 330} {"train_loss": -18.670133590698242, "global_step": 27438, "epoch": 330} {"train_loss": -18.84012794494629, "global_step": 27439, "epoch": 330} {"train_loss": -18.49901008605957, "global_step": 27440, "epoch": 330} {"train_loss": -18.647167205810547, "global_step": 27441, "epoch": 330} {"train_loss": -18.667011260986328, "global_step": 27442, "epoch": 330} {"train_loss": -18.547582626342773, "global_step": 27443, "epoch": 330} {"train_loss": -18.595605850219727, "global_step": 27444, "epoch": 330} {"train_loss": -18.564359664916992, "global_step": 27445, "epoch": 330} {"train_loss": -18.12369728088379, "global_step": 27446, "epoch": 330} {"train_loss": -18.707096099853516, "global_step": 27447, "epoch": 330} {"train_loss": -18.60684585571289, "global_step": 27448, "epoch": 330} {"train_loss": -18.73261833190918, "global_step": 27449, "epoch": 330} {"train_loss": -18.9442195892334, "global_step": 27450, "epoch": 330} {"train_loss": -18.898099899291992, "global_step": 27451, "epoch": 330} {"train_loss": -18.705076217651367, "global_step": 27452, "epoch": 330} {"train_loss": -19.111486434936523, "global_step": 27453, "epoch": 330} {"train_loss": -19.193410873413086, "global_step": 27454, "epoch": 330} {"train_loss": -18.990497589111328, "global_step": 27455, "epoch": 330} {"train_loss": -18.8256778717041, "global_step": 27456, "epoch": 330} {"train_loss": -18.57089614868164, "global_step": 27457, "epoch": 330} {"train_loss": -18.95053482055664, "global_step": 27458, "epoch": 330} {"train_loss": -18.78846549987793, "global_step": 27459, "epoch": 330} {"train_loss": -18.450016021728516, "global_step": 27460, "epoch": 330} {"train_loss": -18.836536407470703, "global_step": 27461, "epoch": 330} {"train_loss": -19.157135009765625, "global_step": 27462, "epoch": 330} {"train_loss": -18.478424072265625, "global_step": 27463, "epoch": 330} {"train_loss": -18.902103424072266, "global_step": 27464, "epoch": 330} {"train_loss": -18.881179809570312, "global_step": 27465, "epoch": 330} {"train_loss": -18.916959762573242, "global_step": 27466, "epoch": 330} {"train_loss": -18.871957778930664, "global_step": 27467, "epoch": 330} {"train_loss": -18.727153778076172, "global_step": 27468, "epoch": 330} {"train_loss": -18.89547348022461, "global_step": 27469, "epoch": 330} {"train_loss": -18.622434616088867, "global_step": 27470, "epoch": 330} {"train_loss": -19.18709373474121, "global_step": 27471, "epoch": 330} {"train_loss": -18.73485840946795, "global_step": 27472, "epoch": 330, "val_loss": 5998681.5} {"train_loss": -18.748321533203125, "global_step": 27473, "epoch": 331} {"train_loss": -18.668272018432617, "global_step": 27474, "epoch": 331} {"train_loss": -18.795578002929688, "global_step": 27475, "epoch": 331} {"train_loss": -18.712833404541016, "global_step": 27476, "epoch": 331} {"train_loss": -18.529254913330078, "global_step": 27477, "epoch": 331} {"train_loss": -18.730920791625977, "global_step": 27478, "epoch": 331} {"train_loss": -18.980518341064453, "global_step": 27479, "epoch": 331} {"train_loss": -18.729652404785156, "global_step": 27480, "epoch": 331} {"train_loss": -18.83125114440918, "global_step": 27481, "epoch": 331} {"train_loss": -18.744348526000977, "global_step": 27482, "epoch": 331} {"train_loss": -18.48038673400879, "global_step": 27483, "epoch": 331} {"train_loss": -18.83587646484375, "global_step": 27484, "epoch": 331} {"train_loss": -18.53053855895996, "global_step": 27485, "epoch": 331} {"train_loss": -19.001432418823242, "global_step": 27486, "epoch": 331} {"train_loss": -18.778339385986328, "global_step": 27487, "epoch": 331} {"train_loss": -19.1016902923584, "global_step": 27488, "epoch": 331} {"train_loss": -19.315771102905273, "global_step": 27489, "epoch": 331} {"train_loss": -18.48442840576172, "global_step": 27490, "epoch": 331} {"train_loss": -19.026071548461914, "global_step": 27491, "epoch": 331} {"train_loss": -18.464759826660156, "global_step": 27492, "epoch": 331} {"train_loss": -18.669981002807617, "global_step": 27493, "epoch": 331} {"train_loss": -18.741430282592773, "global_step": 27494, "epoch": 331} {"train_loss": -18.699237823486328, "global_step": 27495, "epoch": 331} {"train_loss": -18.67670249938965, "global_step": 27496, "epoch": 331} {"train_loss": -18.71318817138672, "global_step": 27497, "epoch": 331} {"train_loss": -18.783044815063477, "global_step": 27498, "epoch": 331} {"train_loss": -18.46549415588379, "global_step": 27499, "epoch": 331} {"train_loss": -18.445903778076172, "global_step": 27500, "epoch": 331} {"train_loss": -18.82990264892578, "global_step": 27501, "epoch": 331} {"train_loss": -18.705129623413086, "global_step": 27502, "epoch": 331} {"train_loss": -18.685306549072266, "global_step": 27503, "epoch": 331} {"train_loss": -18.997838973999023, "global_step": 27504, "epoch": 331} {"train_loss": -18.91815757751465, "global_step": 27505, "epoch": 331} {"train_loss": -18.862869262695312, "global_step": 27506, "epoch": 331} {"train_loss": -18.752058029174805, "global_step": 27507, "epoch": 331} {"train_loss": -18.72231101989746, "global_step": 27508, "epoch": 331} {"train_loss": -18.748239517211914, "global_step": 27509, "epoch": 331} {"train_loss": -18.762258529663086, "global_step": 27510, "epoch": 331} {"train_loss": -18.517480850219727, "global_step": 27511, "epoch": 331} {"train_loss": -19.00156021118164, "global_step": 27512, "epoch": 331} {"train_loss": -18.843149185180664, "global_step": 27513, "epoch": 331} {"train_loss": -18.67352867126465, "global_step": 27514, "epoch": 331} {"train_loss": -18.740890502929688, "global_step": 27515, "epoch": 331} {"train_loss": -18.6278018951416, "global_step": 27516, "epoch": 331} {"train_loss": -18.787580490112305, "global_step": 27517, "epoch": 331} {"train_loss": -18.536544799804688, "global_step": 27518, "epoch": 331} {"train_loss": -19.100019454956055, "global_step": 27519, "epoch": 331} {"train_loss": -18.432775497436523, "global_step": 27520, "epoch": 331} {"train_loss": -18.449676513671875, "global_step": 27521, "epoch": 331} {"train_loss": -19.1427059173584, "global_step": 27522, "epoch": 331} {"train_loss": -18.990039825439453, "global_step": 27523, "epoch": 331} {"train_loss": -18.692785263061523, "global_step": 27524, "epoch": 331} {"train_loss": -18.631715774536133, "global_step": 27525, "epoch": 331} {"train_loss": -18.841794967651367, "global_step": 27526, "epoch": 331} {"train_loss": -18.68436622619629, "global_step": 27527, "epoch": 331} {"train_loss": -18.93670082092285, "global_step": 27528, "epoch": 331} {"train_loss": -18.862680435180664, "global_step": 27529, "epoch": 331} {"train_loss": -18.365949630737305, "global_step": 27530, "epoch": 331} {"train_loss": -18.974872589111328, "global_step": 27531, "epoch": 331} {"train_loss": -18.68988609313965, "global_step": 27532, "epoch": 331} {"train_loss": -18.889698028564453, "global_step": 27533, "epoch": 331} {"train_loss": -18.616147994995117, "global_step": 27534, "epoch": 331} {"train_loss": -18.95520782470703, "global_step": 27535, "epoch": 331} {"train_loss": -18.789281845092773, "global_step": 27536, "epoch": 331} {"train_loss": -18.53095817565918, "global_step": 27537, "epoch": 331} {"train_loss": -18.794225692749023, "global_step": 27538, "epoch": 331} {"train_loss": -18.798629760742188, "global_step": 27539, "epoch": 331} {"train_loss": -18.684669494628906, "global_step": 27540, "epoch": 331} {"train_loss": -18.684106826782227, "global_step": 27541, "epoch": 331} {"train_loss": -18.717504501342773, "global_step": 27542, "epoch": 331} {"train_loss": -19.140684127807617, "global_step": 27543, "epoch": 331} {"train_loss": -18.73290252685547, "global_step": 27544, "epoch": 331} {"train_loss": -18.899856567382812, "global_step": 27545, "epoch": 331} {"train_loss": -19.163312911987305, "global_step": 27546, "epoch": 331} {"train_loss": -18.865859985351562, "global_step": 27547, "epoch": 331} {"train_loss": -18.770965576171875, "global_step": 27548, "epoch": 331} {"train_loss": -18.806303024291992, "global_step": 27549, "epoch": 331} {"train_loss": -19.00141143798828, "global_step": 27550, "epoch": 331} {"train_loss": -19.205902099609375, "global_step": 27551, "epoch": 331} {"train_loss": -19.227643966674805, "global_step": 27552, "epoch": 331} {"train_loss": -18.87928009033203, "global_step": 27553, "epoch": 331} {"train_loss": -18.51325798034668, "global_step": 27554, "epoch": 331} {"train_loss": -18.76665250939059, "global_step": 27555, "epoch": 331, "val_loss": 5808564.5} {"train_loss": -18.696359634399414, "global_step": 27556, "epoch": 332} {"train_loss": -18.626096725463867, "global_step": 27557, "epoch": 332} {"train_loss": -18.387453079223633, "global_step": 27558, "epoch": 332} {"train_loss": -18.319290161132812, "global_step": 27559, "epoch": 332} {"train_loss": -18.575973510742188, "global_step": 27560, "epoch": 332} {"train_loss": -18.6484317779541, "global_step": 27561, "epoch": 332} {"train_loss": -18.7161808013916, "global_step": 27562, "epoch": 332} {"train_loss": -18.885295867919922, "global_step": 27563, "epoch": 332} {"train_loss": -18.448740005493164, "global_step": 27564, "epoch": 332} {"train_loss": -18.568784713745117, "global_step": 27565, "epoch": 332} {"train_loss": -18.5222110748291, "global_step": 27566, "epoch": 332} {"train_loss": -18.79683494567871, "global_step": 27567, "epoch": 332} {"train_loss": -19.008142471313477, "global_step": 27568, "epoch": 332} {"train_loss": -18.86428451538086, "global_step": 27569, "epoch": 332} {"train_loss": -18.630277633666992, "global_step": 27570, "epoch": 332} {"train_loss": -18.659250259399414, "global_step": 27571, "epoch": 332} {"train_loss": -18.56507682800293, "global_step": 27572, "epoch": 332} {"train_loss": -19.053503036499023, "global_step": 27573, "epoch": 332} {"train_loss": -18.522523880004883, "global_step": 27574, "epoch": 332} {"train_loss": -19.086225509643555, "global_step": 27575, "epoch": 332} {"train_loss": -18.515226364135742, "global_step": 27576, "epoch": 332} {"train_loss": -18.604581832885742, "global_step": 27577, "epoch": 332} {"train_loss": -18.751089096069336, "global_step": 27578, "epoch": 332} {"train_loss": -19.11354637145996, "global_step": 27579, "epoch": 332} {"train_loss": -19.181339263916016, "global_step": 27580, "epoch": 332} {"train_loss": -18.532556533813477, "global_step": 27581, "epoch": 332} {"train_loss": -18.572546005249023, "global_step": 27582, "epoch": 332} {"train_loss": -18.552780151367188, "global_step": 27583, "epoch": 332} {"train_loss": -19.006799697875977, "global_step": 27584, "epoch": 332} {"train_loss": -18.88002586364746, "global_step": 27585, "epoch": 332} {"train_loss": -18.846084594726562, "global_step": 27586, "epoch": 332} {"train_loss": -19.41632652282715, "global_step": 27587, "epoch": 332} {"train_loss": -19.128259658813477, "global_step": 27588, "epoch": 332} {"train_loss": -18.96510124206543, "global_step": 27589, "epoch": 332} {"train_loss": -18.752668380737305, "global_step": 27590, "epoch": 332} {"train_loss": -18.541685104370117, "global_step": 27591, "epoch": 332} {"train_loss": -19.17909812927246, "global_step": 27592, "epoch": 332} {"train_loss": -18.690900802612305, "global_step": 27593, "epoch": 332} {"train_loss": -18.845020294189453, "global_step": 27594, "epoch": 332} {"train_loss": -18.61720848083496, "global_step": 27595, "epoch": 332} {"train_loss": -18.920211791992188, "global_step": 27596, "epoch": 332} {"train_loss": -18.941802978515625, "global_step": 27597, "epoch": 332} {"train_loss": -18.717845916748047, "global_step": 27598, "epoch": 332} {"train_loss": -18.75385856628418, "global_step": 27599, "epoch": 332} {"train_loss": -18.881494522094727, "global_step": 27600, "epoch": 332} {"train_loss": -18.77642250061035, "global_step": 27601, "epoch": 332} {"train_loss": -19.059606552124023, "global_step": 27602, "epoch": 332} {"train_loss": -18.756210327148438, "global_step": 27603, "epoch": 332} {"train_loss": -18.549320220947266, "global_step": 27604, "epoch": 332} {"train_loss": -19.014911651611328, "global_step": 27605, "epoch": 332} {"train_loss": -18.81260108947754, "global_step": 27606, "epoch": 332} {"train_loss": -18.56184959411621, "global_step": 27607, "epoch": 332} {"train_loss": -18.816877365112305, "global_step": 27608, "epoch": 332} {"train_loss": -18.664554595947266, "global_step": 27609, "epoch": 332} {"train_loss": -18.878482818603516, "global_step": 27610, "epoch": 332} {"train_loss": -19.08503532409668, "global_step": 27611, "epoch": 332} {"train_loss": -19.192951202392578, "global_step": 27612, "epoch": 332} {"train_loss": -18.882614135742188, "global_step": 27613, "epoch": 332} {"train_loss": -18.633163452148438, "global_step": 27614, "epoch": 332} {"train_loss": -18.912704467773438, "global_step": 27615, "epoch": 332} {"train_loss": -18.766403198242188, "global_step": 27616, "epoch": 332} {"train_loss": -18.692874908447266, "global_step": 27617, "epoch": 332} {"train_loss": -19.093666076660156, "global_step": 27618, "epoch": 332} {"train_loss": -18.767749786376953, "global_step": 27619, "epoch": 332} {"train_loss": -18.815217971801758, "global_step": 27620, "epoch": 332} {"train_loss": -18.83036994934082, "global_step": 27621, "epoch": 332} {"train_loss": -19.138202667236328, "global_step": 27622, "epoch": 332} {"train_loss": -18.71319580078125, "global_step": 27623, "epoch": 332} {"train_loss": -18.703271865844727, "global_step": 27624, "epoch": 332} {"train_loss": -18.86050796508789, "global_step": 27625, "epoch": 332} {"train_loss": -19.010732650756836, "global_step": 27626, "epoch": 332} {"train_loss": -19.02364730834961, "global_step": 27627, "epoch": 332} {"train_loss": -19.015371322631836, "global_step": 27628, "epoch": 332} {"train_loss": -18.562482833862305, "global_step": 27629, "epoch": 332} {"train_loss": -18.71980094909668, "global_step": 27630, "epoch": 332} {"train_loss": -19.128793716430664, "global_step": 27631, "epoch": 332} {"train_loss": -18.60931968688965, "global_step": 27632, "epoch": 332} {"train_loss": -18.56642723083496, "global_step": 27633, "epoch": 332} {"train_loss": -18.897106170654297, "global_step": 27634, "epoch": 332} {"train_loss": -18.69968605041504, "global_step": 27635, "epoch": 332} {"train_loss": -19.006895065307617, "global_step": 27636, "epoch": 332} {"train_loss": -19.316858291625977, "global_step": 27637, "epoch": 332} {"train_loss": -18.79648500465485, "global_step": 27638, "epoch": 332, "val_loss": 5919283.0} {"train_loss": -18.933998107910156, "global_step": 27639, "epoch": 333} {"train_loss": -18.764129638671875, "global_step": 27640, "epoch": 333} {"train_loss": -18.71044921875, "global_step": 27641, "epoch": 333} {"train_loss": -18.288616180419922, "global_step": 27642, "epoch": 333} {"train_loss": -18.635068893432617, "global_step": 27643, "epoch": 333} {"train_loss": -18.996110916137695, "global_step": 27644, "epoch": 333} {"train_loss": -19.098905563354492, "global_step": 27645, "epoch": 333} {"train_loss": -18.766508102416992, "global_step": 27646, "epoch": 333} {"train_loss": -18.507566452026367, "global_step": 27647, "epoch": 333} {"train_loss": -18.3542423248291, "global_step": 27648, "epoch": 333} {"train_loss": -18.6506290435791, "global_step": 27649, "epoch": 333} {"train_loss": -18.81648063659668, "global_step": 27650, "epoch": 333} {"train_loss": -18.578338623046875, "global_step": 27651, "epoch": 333} {"train_loss": -18.828174591064453, "global_step": 27652, "epoch": 333} {"train_loss": -19.3759765625, "global_step": 27653, "epoch": 333} {"train_loss": -18.874095916748047, "global_step": 27654, "epoch": 333} {"train_loss": -18.79991912841797, "global_step": 27655, "epoch": 333} {"train_loss": -19.004634857177734, "global_step": 27656, "epoch": 333} {"train_loss": -18.818960189819336, "global_step": 27657, "epoch": 333} {"train_loss": -18.409976959228516, "global_step": 27658, "epoch": 333} {"train_loss": -18.915346145629883, "global_step": 27659, "epoch": 333} {"train_loss": -19.144479751586914, "global_step": 27660, "epoch": 333} {"train_loss": -18.973886489868164, "global_step": 27661, "epoch": 333} {"train_loss": -18.6748104095459, "global_step": 27662, "epoch": 333} {"train_loss": -18.729122161865234, "global_step": 27663, "epoch": 333} {"train_loss": -18.63649559020996, "global_step": 27664, "epoch": 333} {"train_loss": -18.970762252807617, "global_step": 27665, "epoch": 333} {"train_loss": -18.570955276489258, "global_step": 27666, "epoch": 333} {"train_loss": -18.796411514282227, "global_step": 27667, "epoch": 333} {"train_loss": -18.872472763061523, "global_step": 27668, "epoch": 333} {"train_loss": -19.029516220092773, "global_step": 27669, "epoch": 333} {"train_loss": -18.636051177978516, "global_step": 27670, "epoch": 333} {"train_loss": -18.57245635986328, "global_step": 27671, "epoch": 333} {"train_loss": -19.161779403686523, "global_step": 27672, "epoch": 333} {"train_loss": -18.75931739807129, "global_step": 27673, "epoch": 333} {"train_loss": -18.9571533203125, "global_step": 27674, "epoch": 333} {"train_loss": -18.92432975769043, "global_step": 27675, "epoch": 333} {"train_loss": -19.23965072631836, "global_step": 27676, "epoch": 333} {"train_loss": -18.88977813720703, "global_step": 27677, "epoch": 333} {"train_loss": -19.19342613220215, "global_step": 27678, "epoch": 333} {"train_loss": -18.86750602722168, "global_step": 27679, "epoch": 333} {"train_loss": -18.666959762573242, "global_step": 27680, "epoch": 333} {"train_loss": -18.9849910736084, "global_step": 27681, "epoch": 333} {"train_loss": -18.703210830688477, "global_step": 27682, "epoch": 333} {"train_loss": -18.55389976501465, "global_step": 27683, "epoch": 333} {"train_loss": -18.846086502075195, "global_step": 27684, "epoch": 333} {"train_loss": -18.764310836791992, "global_step": 27685, "epoch": 333} {"train_loss": -18.56153678894043, "global_step": 27686, "epoch": 333} {"train_loss": -18.819515228271484, "global_step": 27687, "epoch": 333} {"train_loss": -18.877460479736328, "global_step": 27688, "epoch": 333} {"train_loss": -18.6835880279541, "global_step": 27689, "epoch": 333} {"train_loss": -18.27430534362793, "global_step": 27690, "epoch": 333} {"train_loss": -18.796842575073242, "global_step": 27691, "epoch": 333} {"train_loss": -19.299236297607422, "global_step": 27692, "epoch": 333} {"train_loss": -18.63399314880371, "global_step": 27693, "epoch": 333} {"train_loss": -18.573606491088867, "global_step": 27694, "epoch": 333} {"train_loss": -18.553604125976562, "global_step": 27695, "epoch": 333} {"train_loss": -18.570310592651367, "global_step": 27696, "epoch": 333} {"train_loss": -18.970346450805664, "global_step": 27697, "epoch": 333} {"train_loss": -18.935012817382812, "global_step": 27698, "epoch": 333} {"train_loss": -18.867094039916992, "global_step": 27699, "epoch": 333} {"train_loss": -18.53218650817871, "global_step": 27700, "epoch": 333} {"train_loss": -18.948522567749023, "global_step": 27701, "epoch": 333} {"train_loss": -18.690521240234375, "global_step": 27702, "epoch": 333} {"train_loss": -18.672597885131836, "global_step": 27703, "epoch": 333} {"train_loss": -19.293052673339844, "global_step": 27704, "epoch": 333} {"train_loss": -18.545576095581055, "global_step": 27705, "epoch": 333} {"train_loss": -18.997817993164062, "global_step": 27706, "epoch": 333} {"train_loss": -18.73613929748535, "global_step": 27707, "epoch": 333} {"train_loss": -18.86042594909668, "global_step": 27708, "epoch": 333} {"train_loss": -18.796974182128906, "global_step": 27709, "epoch": 333} {"train_loss": -18.992841720581055, "global_step": 27710, "epoch": 333} {"train_loss": -18.665546417236328, "global_step": 27711, "epoch": 333} {"train_loss": -18.611713409423828, "global_step": 27712, "epoch": 333} {"train_loss": -19.00293731689453, "global_step": 27713, "epoch": 333} {"train_loss": -18.95688819885254, "global_step": 27714, "epoch": 333} {"train_loss": -19.330677032470703, "global_step": 27715, "epoch": 333} {"train_loss": -18.774959564208984, "global_step": 27716, "epoch": 333} {"train_loss": -19.103946685791016, "global_step": 27717, "epoch": 333} {"train_loss": -18.513105392456055, "global_step": 27718, "epoch": 333} {"train_loss": -18.950977325439453, "global_step": 27719, "epoch": 333} {"train_loss": -18.8621883392334, "global_step": 27720, "epoch": 333} {"train_loss": -18.795609692493116, "global_step": 27721, "epoch": 333, "val_loss": 6093556.5} {"train_loss": -18.397232055664062, "global_step": 27722, "epoch": 334} {"train_loss": -18.67857551574707, "global_step": 27723, "epoch": 334} {"train_loss": -18.665739059448242, "global_step": 27724, "epoch": 334} {"train_loss": -18.805072784423828, "global_step": 27725, "epoch": 334} {"train_loss": -18.740901947021484, "global_step": 27726, "epoch": 334} {"train_loss": -18.420026779174805, "global_step": 27727, "epoch": 334} {"train_loss": -18.438032150268555, "global_step": 27728, "epoch": 334} {"train_loss": -19.036579132080078, "global_step": 27729, "epoch": 334} {"train_loss": -18.737258911132812, "global_step": 27730, "epoch": 334} {"train_loss": -18.635038375854492, "global_step": 27731, "epoch": 334} {"train_loss": -18.408416748046875, "global_step": 27732, "epoch": 334} {"train_loss": -18.974699020385742, "global_step": 27733, "epoch": 334} {"train_loss": -18.5012149810791, "global_step": 27734, "epoch": 334} {"train_loss": -19.09587860107422, "global_step": 27735, "epoch": 334} {"train_loss": -19.102155685424805, "global_step": 27736, "epoch": 334} {"train_loss": -18.877498626708984, "global_step": 27737, "epoch": 334} {"train_loss": -18.685745239257812, "global_step": 27738, "epoch": 334} {"train_loss": -18.936521530151367, "global_step": 27739, "epoch": 334} {"train_loss": -18.70356559753418, "global_step": 27740, "epoch": 334} {"train_loss": -18.677783966064453, "global_step": 27741, "epoch": 334} {"train_loss": -19.171388626098633, "global_step": 27742, "epoch": 334} {"train_loss": -18.787256240844727, "global_step": 27743, "epoch": 334} {"train_loss": -18.898521423339844, "global_step": 27744, "epoch": 334} {"train_loss": -18.68937873840332, "global_step": 27745, "epoch": 334} {"train_loss": -18.861303329467773, "global_step": 27746, "epoch": 334} {"train_loss": -18.23044204711914, "global_step": 27747, "epoch": 334} {"train_loss": -18.57927894592285, "global_step": 27748, "epoch": 334} {"train_loss": -18.65709114074707, "global_step": 27749, "epoch": 334} {"train_loss": -18.767683029174805, "global_step": 27750, "epoch": 334} {"train_loss": -18.732879638671875, "global_step": 27751, "epoch": 334} {"train_loss": -18.407438278198242, "global_step": 27752, "epoch": 334} {"train_loss": -19.394134521484375, "global_step": 27753, "epoch": 334} {"train_loss": -18.83515739440918, "global_step": 27754, "epoch": 334} {"train_loss": -19.314044952392578, "global_step": 27755, "epoch": 334} {"train_loss": -18.74003791809082, "global_step": 27756, "epoch": 334} {"train_loss": -18.651758193969727, "global_step": 27757, "epoch": 334} {"train_loss": -18.734716415405273, "global_step": 27758, "epoch": 334} {"train_loss": -18.707189559936523, "global_step": 27759, "epoch": 334} {"train_loss": -18.640398025512695, "global_step": 27760, "epoch": 334} {"train_loss": -18.796743392944336, "global_step": 27761, "epoch": 334} {"train_loss": -18.57924461364746, "global_step": 27762, "epoch": 334} {"train_loss": -18.79096221923828, "global_step": 27763, "epoch": 334} {"train_loss": -18.8619327545166, "global_step": 27764, "epoch": 334} {"train_loss": -18.632322311401367, "global_step": 27765, "epoch": 334} {"train_loss": -18.889270782470703, "global_step": 27766, "epoch": 334} {"train_loss": -18.921783447265625, "global_step": 27767, "epoch": 334} {"train_loss": -18.81414794921875, "global_step": 27768, "epoch": 334} {"train_loss": -18.730464935302734, "global_step": 27769, "epoch": 334} {"train_loss": -19.094797134399414, "global_step": 27770, "epoch": 334} {"train_loss": -18.869747161865234, "global_step": 27771, "epoch": 334} {"train_loss": -19.009937286376953, "global_step": 27772, "epoch": 334} {"train_loss": -19.021474838256836, "global_step": 27773, "epoch": 334} {"train_loss": -18.94340705871582, "global_step": 27774, "epoch": 334} {"train_loss": -18.83559226989746, "global_step": 27775, "epoch": 334} {"train_loss": -18.918302536010742, "global_step": 27776, "epoch": 334} {"train_loss": -18.901968002319336, "global_step": 27777, "epoch": 334} {"train_loss": -18.61152458190918, "global_step": 27778, "epoch": 334} {"train_loss": -18.956817626953125, "global_step": 27779, "epoch": 334} {"train_loss": -18.654592514038086, "global_step": 27780, "epoch": 334} {"train_loss": -19.032556533813477, "global_step": 27781, "epoch": 334} {"train_loss": -18.965438842773438, "global_step": 27782, "epoch": 334} {"train_loss": -18.916934967041016, "global_step": 27783, "epoch": 334} {"train_loss": -18.574787139892578, "global_step": 27784, "epoch": 334} {"train_loss": -19.22391700744629, "global_step": 27785, "epoch": 334} {"train_loss": -18.934463500976562, "global_step": 27786, "epoch": 334} {"train_loss": -18.957300186157227, "global_step": 27787, "epoch": 334} {"train_loss": -19.02479362487793, "global_step": 27788, "epoch": 334} {"train_loss": -18.890981674194336, "global_step": 27789, "epoch": 334} {"train_loss": -18.839736938476562, "global_step": 27790, "epoch": 334} {"train_loss": -19.099536895751953, "global_step": 27791, "epoch": 334} {"train_loss": -19.031238555908203, "global_step": 27792, "epoch": 334} {"train_loss": -18.38322639465332, "global_step": 27793, "epoch": 334} {"train_loss": -18.508512496948242, "global_step": 27794, "epoch": 334} {"train_loss": -18.95001792907715, "global_step": 27795, "epoch": 334} {"train_loss": -18.504791259765625, "global_step": 27796, "epoch": 334} {"train_loss": -18.81624984741211, "global_step": 27797, "epoch": 334} {"train_loss": -18.881677627563477, "global_step": 27798, "epoch": 334} {"train_loss": -18.786832809448242, "global_step": 27799, "epoch": 334} {"train_loss": -19.039487838745117, "global_step": 27800, "epoch": 334} {"train_loss": -18.895166397094727, "global_step": 27801, "epoch": 334} {"train_loss": -18.9807186126709, "global_step": 27802, "epoch": 334} {"train_loss": -18.790891647338867, "global_step": 27803, "epoch": 334} {"train_loss": -18.831696429884577, "global_step": 27804, "epoch": 334, "val_loss": 6064927.0} {"train_loss": -18.204465866088867, "global_step": 27805, "epoch": 335} {"train_loss": -18.7984619140625, "global_step": 27806, "epoch": 335} {"train_loss": -18.38222885131836, "global_step": 27807, "epoch": 335} {"train_loss": -18.47841453552246, "global_step": 27808, "epoch": 335} {"train_loss": -18.572124481201172, "global_step": 27809, "epoch": 335} {"train_loss": -18.883657455444336, "global_step": 27810, "epoch": 335} {"train_loss": -18.35857582092285, "global_step": 27811, "epoch": 335} {"train_loss": -18.818185806274414, "global_step": 27812, "epoch": 335} {"train_loss": -18.87567138671875, "global_step": 27813, "epoch": 335} {"train_loss": -18.5299072265625, "global_step": 27814, "epoch": 335} {"train_loss": -18.715179443359375, "global_step": 27815, "epoch": 335} {"train_loss": -18.54139518737793, "global_step": 27816, "epoch": 335} {"train_loss": -18.990203857421875, "global_step": 27817, "epoch": 335} {"train_loss": -18.544431686401367, "global_step": 27818, "epoch": 335} {"train_loss": -18.658994674682617, "global_step": 27819, "epoch": 335} {"train_loss": -18.828641891479492, "global_step": 27820, "epoch": 335} {"train_loss": -18.776859283447266, "global_step": 27821, "epoch": 335} {"train_loss": -18.690202713012695, "global_step": 27822, "epoch": 335} {"train_loss": -18.80478286743164, "global_step": 27823, "epoch": 335} {"train_loss": -18.908361434936523, "global_step": 27824, "epoch": 335} {"train_loss": -18.820486068725586, "global_step": 27825, "epoch": 335} {"train_loss": -18.801034927368164, "global_step": 27826, "epoch": 335} {"train_loss": -18.93592643737793, "global_step": 27827, "epoch": 335} {"train_loss": -18.67510986328125, "global_step": 27828, "epoch": 335} {"train_loss": -18.68602180480957, "global_step": 27829, "epoch": 335} {"train_loss": -18.883726119995117, "global_step": 27830, "epoch": 335} {"train_loss": -18.59558868408203, "global_step": 27831, "epoch": 335} {"train_loss": -19.286945343017578, "global_step": 27832, "epoch": 335} {"train_loss": -19.483800888061523, "global_step": 27833, "epoch": 335} {"train_loss": -19.2222957611084, "global_step": 27834, "epoch": 335} {"train_loss": -18.507793426513672, "global_step": 27835, "epoch": 335} {"train_loss": -18.970487594604492, "global_step": 27836, "epoch": 335} {"train_loss": -18.858381271362305, "global_step": 27837, "epoch": 335} {"train_loss": -18.8157901763916, "global_step": 27838, "epoch": 335} {"train_loss": -18.721073150634766, "global_step": 27839, "epoch": 335} {"train_loss": -18.87790298461914, "global_step": 27840, "epoch": 335} {"train_loss": -18.801456451416016, "global_step": 27841, "epoch": 335} {"train_loss": -19.112548828125, "global_step": 27842, "epoch": 335} {"train_loss": -18.851282119750977, "global_step": 27843, "epoch": 335} {"train_loss": -18.80291748046875, "global_step": 27844, "epoch": 335} {"train_loss": -18.9632511138916, "global_step": 27845, "epoch": 335} {"train_loss": -19.047868728637695, "global_step": 27846, "epoch": 335} {"train_loss": -19.140138626098633, "global_step": 27847, "epoch": 335} {"train_loss": -18.319337844848633, "global_step": 27848, "epoch": 335} {"train_loss": -19.041099548339844, "global_step": 27849, "epoch": 335} {"train_loss": -19.140207290649414, "global_step": 27850, "epoch": 335} {"train_loss": -19.01932716369629, "global_step": 27851, "epoch": 335} {"train_loss": -18.869613647460938, "global_step": 27852, "epoch": 335} {"train_loss": -18.857269287109375, "global_step": 27853, "epoch": 335} {"train_loss": -19.157373428344727, "global_step": 27854, "epoch": 335} {"train_loss": -18.97210121154785, "global_step": 27855, "epoch": 335} {"train_loss": -18.71246910095215, "global_step": 27856, "epoch": 335} {"train_loss": -18.95491600036621, "global_step": 27857, "epoch": 335} {"train_loss": -18.80893898010254, "global_step": 27858, "epoch": 335} {"train_loss": -18.60953140258789, "global_step": 27859, "epoch": 335} {"train_loss": -18.89476776123047, "global_step": 27860, "epoch": 335} {"train_loss": -18.852447509765625, "global_step": 27861, "epoch": 335} {"train_loss": -19.207077026367188, "global_step": 27862, "epoch": 335} {"train_loss": -18.56772232055664, "global_step": 27863, "epoch": 335} {"train_loss": -19.51593780517578, "global_step": 27864, "epoch": 335} {"train_loss": -18.338104248046875, "global_step": 27865, "epoch": 335} {"train_loss": -18.83052635192871, "global_step": 27866, "epoch": 335} {"train_loss": -18.921409606933594, "global_step": 27867, "epoch": 335} {"train_loss": -18.734888076782227, "global_step": 27868, "epoch": 335} {"train_loss": -18.627338409423828, "global_step": 27869, "epoch": 335} {"train_loss": -18.764850616455078, "global_step": 27870, "epoch": 335} {"train_loss": -18.862140655517578, "global_step": 27871, "epoch": 335} {"train_loss": -18.915189743041992, "global_step": 27872, "epoch": 335} {"train_loss": -18.763086318969727, "global_step": 27873, "epoch": 335} {"train_loss": -18.771724700927734, "global_step": 27874, "epoch": 335} {"train_loss": -18.83932113647461, "global_step": 27875, "epoch": 335} {"train_loss": -18.798063278198242, "global_step": 27876, "epoch": 335} {"train_loss": -18.707691192626953, "global_step": 27877, "epoch": 335} {"train_loss": -18.99994659423828, "global_step": 27878, "epoch": 335} {"train_loss": -18.55763816833496, "global_step": 27879, "epoch": 335} {"train_loss": -18.510055541992188, "global_step": 27880, "epoch": 335} {"train_loss": -18.66276741027832, "global_step": 27881, "epoch": 335} {"train_loss": -18.69917106628418, "global_step": 27882, "epoch": 335} {"train_loss": -18.80945587158203, "global_step": 27883, "epoch": 335} {"train_loss": -18.58646011352539, "global_step": 27884, "epoch": 335} {"train_loss": -19.125356674194336, "global_step": 27885, "epoch": 335} {"train_loss": -18.54986000061035, "global_step": 27886, "epoch": 335} {"train_loss": -18.812768706356188, "global_step": 27887, "epoch": 335, "val_loss": 6068802.0} {"train_loss": -18.916479110717773, "global_step": 27888, "epoch": 336} {"train_loss": -18.971317291259766, "global_step": 27889, "epoch": 336} {"train_loss": -18.480100631713867, "global_step": 27890, "epoch": 336} {"train_loss": -18.690237045288086, "global_step": 27891, "epoch": 336} {"train_loss": -18.99828338623047, "global_step": 27892, "epoch": 336} {"train_loss": -18.544775009155273, "global_step": 27893, "epoch": 336} {"train_loss": -18.878620147705078, "global_step": 27894, "epoch": 336} {"train_loss": -18.837453842163086, "global_step": 27895, "epoch": 336} {"train_loss": -18.79165267944336, "global_step": 27896, "epoch": 336} {"train_loss": -18.592288970947266, "global_step": 27897, "epoch": 336} {"train_loss": -18.777822494506836, "global_step": 27898, "epoch": 336} {"train_loss": -18.695281982421875, "global_step": 27899, "epoch": 336} {"train_loss": -18.913970947265625, "global_step": 27900, "epoch": 336} {"train_loss": -18.843753814697266, "global_step": 27901, "epoch": 336} {"train_loss": -18.822866439819336, "global_step": 27902, "epoch": 336} {"train_loss": -18.952178955078125, "global_step": 27903, "epoch": 336} {"train_loss": -18.939517974853516, "global_step": 27904, "epoch": 336} {"train_loss": -18.561065673828125, "global_step": 27905, "epoch": 336} {"train_loss": -18.94866943359375, "global_step": 27906, "epoch": 336} {"train_loss": -19.098859786987305, "global_step": 27907, "epoch": 336} {"train_loss": -19.1771297454834, "global_step": 27908, "epoch": 336} {"train_loss": -19.06920051574707, "global_step": 27909, "epoch": 336} {"train_loss": -18.8218936920166, "global_step": 27910, "epoch": 336} {"train_loss": -18.69002342224121, "global_step": 27911, "epoch": 336} {"train_loss": -18.96060562133789, "global_step": 27912, "epoch": 336} {"train_loss": -18.724201202392578, "global_step": 27913, "epoch": 336} {"train_loss": -19.001585006713867, "global_step": 27914, "epoch": 336} {"train_loss": -18.99458885192871, "global_step": 27915, "epoch": 336} {"train_loss": -18.83530044555664, "global_step": 27916, "epoch": 336} {"train_loss": -18.95859146118164, "global_step": 27917, "epoch": 336} {"train_loss": -18.87970542907715, "global_step": 27918, "epoch": 336} {"train_loss": -18.722055435180664, "global_step": 27919, "epoch": 336} {"train_loss": -18.89571762084961, "global_step": 27920, "epoch": 336} {"train_loss": -18.504047393798828, "global_step": 27921, "epoch": 336} {"train_loss": -18.832059860229492, "global_step": 27922, "epoch": 336} {"train_loss": -19.20716094970703, "global_step": 27923, "epoch": 336} {"train_loss": -19.074277877807617, "global_step": 27924, "epoch": 336} {"train_loss": -19.043624877929688, "global_step": 27925, "epoch": 336} {"train_loss": -18.834163665771484, "global_step": 27926, "epoch": 336} {"train_loss": -19.000911712646484, "global_step": 27927, "epoch": 336} {"train_loss": -19.251657485961914, "global_step": 27928, "epoch": 336} {"train_loss": -18.700714111328125, "global_step": 27929, "epoch": 336} {"train_loss": -18.578285217285156, "global_step": 27930, "epoch": 336} {"train_loss": -18.661691665649414, "global_step": 27931, "epoch": 336} {"train_loss": -18.8922061920166, "global_step": 27932, "epoch": 336} {"train_loss": -18.936525344848633, "global_step": 27933, "epoch": 336} {"train_loss": -19.105152130126953, "global_step": 27934, "epoch": 336} {"train_loss": -18.696256637573242, "global_step": 27935, "epoch": 336} {"train_loss": -19.078784942626953, "global_step": 27936, "epoch": 336} {"train_loss": -18.939559936523438, "global_step": 27937, "epoch": 336} {"train_loss": -19.278879165649414, "global_step": 27938, "epoch": 336} {"train_loss": -19.07136344909668, "global_step": 27939, "epoch": 336} {"train_loss": -18.70245361328125, "global_step": 27940, "epoch": 336} {"train_loss": -19.08619499206543, "global_step": 27941, "epoch": 336} {"train_loss": -18.423643112182617, "global_step": 27942, "epoch": 336} {"train_loss": -18.47334098815918, "global_step": 27943, "epoch": 336} {"train_loss": -18.599506378173828, "global_step": 27944, "epoch": 336} {"train_loss": -18.752832412719727, "global_step": 27945, "epoch": 336} {"train_loss": -19.003631591796875, "global_step": 27946, "epoch": 336} {"train_loss": -18.996679306030273, "global_step": 27947, "epoch": 336} {"train_loss": -18.620161056518555, "global_step": 27948, "epoch": 336} {"train_loss": -18.941492080688477, "global_step": 27949, "epoch": 336} {"train_loss": -18.925931930541992, "global_step": 27950, "epoch": 336} {"train_loss": -18.880624771118164, "global_step": 27951, "epoch": 336} {"train_loss": -19.10231590270996, "global_step": 27952, "epoch": 336} {"train_loss": -18.4732666015625, "global_step": 27953, "epoch": 336} {"train_loss": -18.435277938842773, "global_step": 27954, "epoch": 336} {"train_loss": -18.63282585144043, "global_step": 27955, "epoch": 336} {"train_loss": -18.91276741027832, "global_step": 27956, "epoch": 336} {"train_loss": -18.70606803894043, "global_step": 27957, "epoch": 336} {"train_loss": -19.18061637878418, "global_step": 27958, "epoch": 336} {"train_loss": -19.16314697265625, "global_step": 27959, "epoch": 336} {"train_loss": -18.706464767456055, "global_step": 27960, "epoch": 336} {"train_loss": -18.886001586914062, "global_step": 27961, "epoch": 336} {"train_loss": -18.608610153198242, "global_step": 27962, "epoch": 336} {"train_loss": -18.507986068725586, "global_step": 27963, "epoch": 336} {"train_loss": -18.822702407836914, "global_step": 27964, "epoch": 336} {"train_loss": -18.616151809692383, "global_step": 27965, "epoch": 336} {"train_loss": -18.872655868530273, "global_step": 27966, "epoch": 336} {"train_loss": -18.9000186920166, "global_step": 27967, "epoch": 336} {"train_loss": -18.75498390197754, "global_step": 27968, "epoch": 336} {"train_loss": -19.076810836791992, "global_step": 27969, "epoch": 336} {"train_loss": -18.854877127222267, "global_step": 27970, "epoch": 336, "val_loss": 6105669.0} {"train_loss": -18.28175163269043, "global_step": 27971, "epoch": 337} {"train_loss": -18.817459106445312, "global_step": 27972, "epoch": 337} {"train_loss": -18.680965423583984, "global_step": 27973, "epoch": 337} {"train_loss": -18.650623321533203, "global_step": 27974, "epoch": 337} {"train_loss": -18.767675399780273, "global_step": 27975, "epoch": 337} {"train_loss": -18.566059112548828, "global_step": 27976, "epoch": 337} {"train_loss": -18.562881469726562, "global_step": 27977, "epoch": 337} {"train_loss": -18.9306583404541, "global_step": 27978, "epoch": 337} {"train_loss": -18.65034294128418, "global_step": 27979, "epoch": 337} {"train_loss": -18.947162628173828, "global_step": 27980, "epoch": 337} {"train_loss": -18.739736557006836, "global_step": 27981, "epoch": 337} {"train_loss": -18.78993797302246, "global_step": 27982, "epoch": 337} {"train_loss": -18.791593551635742, "global_step": 27983, "epoch": 337} {"train_loss": -19.038543701171875, "global_step": 27984, "epoch": 337} {"train_loss": -18.63716697692871, "global_step": 27985, "epoch": 337} {"train_loss": -18.38747215270996, "global_step": 27986, "epoch": 337} {"train_loss": -18.587894439697266, "global_step": 27987, "epoch": 337} {"train_loss": -18.735523223876953, "global_step": 27988, "epoch": 337} {"train_loss": -18.891477584838867, "global_step": 27989, "epoch": 337} {"train_loss": -19.045185089111328, "global_step": 27990, "epoch": 337} {"train_loss": -18.601966857910156, "global_step": 27991, "epoch": 337} {"train_loss": -18.71696662902832, "global_step": 27992, "epoch": 337} {"train_loss": -18.854251861572266, "global_step": 27993, "epoch": 337} {"train_loss": -18.481796264648438, "global_step": 27994, "epoch": 337} {"train_loss": -19.139928817749023, "global_step": 27995, "epoch": 337} {"train_loss": -19.25481605529785, "global_step": 27996, "epoch": 337} {"train_loss": -18.90446662902832, "global_step": 27997, "epoch": 337} {"train_loss": -18.9714412689209, "global_step": 27998, "epoch": 337} {"train_loss": -19.16505241394043, "global_step": 27999, "epoch": 337} {"train_loss": -18.71738624572754, "global_step": 28000, "epoch": 337} {"train_loss": -18.932024002075195, "global_step": 28001, "epoch": 337} {"train_loss": -18.78423309326172, "global_step": 28002, "epoch": 337} {"train_loss": -19.34291648864746, "global_step": 28003, "epoch": 337} {"train_loss": -18.89800262451172, "global_step": 28004, "epoch": 337} {"train_loss": -18.969228744506836, "global_step": 28005, "epoch": 337} {"train_loss": -18.85077476501465, "global_step": 28006, "epoch": 337} {"train_loss": -18.368688583374023, "global_step": 28007, "epoch": 337} {"train_loss": -18.825716018676758, "global_step": 28008, "epoch": 337} {"train_loss": -18.666807174682617, "global_step": 28009, "epoch": 337} {"train_loss": -18.7669677734375, "global_step": 28010, "epoch": 337} {"train_loss": -18.822751998901367, "global_step": 28011, "epoch": 337} {"train_loss": -18.691221237182617, "global_step": 28012, "epoch": 337} {"train_loss": -18.672029495239258, "global_step": 28013, "epoch": 337} {"train_loss": -19.035680770874023, "global_step": 28014, "epoch": 337} {"train_loss": -18.82962417602539, "global_step": 28015, "epoch": 337} {"train_loss": -18.63686180114746, "global_step": 28016, "epoch": 337} {"train_loss": -19.234861373901367, "global_step": 28017, "epoch": 337} {"train_loss": -18.555795669555664, "global_step": 28018, "epoch": 337} {"train_loss": -18.829925537109375, "global_step": 28019, "epoch": 337} {"train_loss": -19.039960861206055, "global_step": 28020, "epoch": 337} {"train_loss": -18.867000579833984, "global_step": 28021, "epoch": 337} {"train_loss": -18.928525924682617, "global_step": 28022, "epoch": 337} {"train_loss": -19.059083938598633, "global_step": 28023, "epoch": 337} {"train_loss": -18.702091217041016, "global_step": 28024, "epoch": 337} {"train_loss": -18.92643928527832, "global_step": 28025, "epoch": 337} {"train_loss": -18.850513458251953, "global_step": 28026, "epoch": 337} {"train_loss": -19.1009578704834, "global_step": 28027, "epoch": 337} {"train_loss": -19.154048919677734, "global_step": 28028, "epoch": 337} {"train_loss": -18.947851181030273, "global_step": 28029, "epoch": 337} {"train_loss": -18.761186599731445, "global_step": 28030, "epoch": 337} {"train_loss": -18.783781051635742, "global_step": 28031, "epoch": 337} {"train_loss": -18.78399658203125, "global_step": 28032, "epoch": 337} {"train_loss": -19.01498794555664, "global_step": 28033, "epoch": 337} {"train_loss": -18.914669036865234, "global_step": 28034, "epoch": 337} {"train_loss": -18.838390350341797, "global_step": 28035, "epoch": 337} {"train_loss": -19.080795288085938, "global_step": 28036, "epoch": 337} {"train_loss": -18.8205623626709, "global_step": 28037, "epoch": 337} {"train_loss": -18.97233009338379, "global_step": 28038, "epoch": 337} {"train_loss": -19.060670852661133, "global_step": 28039, "epoch": 337} {"train_loss": -19.09566307067871, "global_step": 28040, "epoch": 337} {"train_loss": -18.847631454467773, "global_step": 28041, "epoch": 337} {"train_loss": -19.010889053344727, "global_step": 28042, "epoch": 337} {"train_loss": -19.09978485107422, "global_step": 28043, "epoch": 337} {"train_loss": -18.985685348510742, "global_step": 28044, "epoch": 337} {"train_loss": -18.6265869140625, "global_step": 28045, "epoch": 337} {"train_loss": -18.9732666015625, "global_step": 28046, "epoch": 337} {"train_loss": -18.87785530090332, "global_step": 28047, "epoch": 337} {"train_loss": -18.47743797302246, "global_step": 28048, "epoch": 337} {"train_loss": -18.63478660583496, "global_step": 28049, "epoch": 337} {"train_loss": -18.782127380371094, "global_step": 28050, "epoch": 337} {"train_loss": -19.089340209960938, "global_step": 28051, "epoch": 337} {"train_loss": -18.86199378967285, "global_step": 28052, "epoch": 337} {"train_loss": -18.855141076696924, "global_step": 28053, "epoch": 337, "val_loss": 6016554.0} {"train_loss": -18.004531860351562, "global_step": 28054, "epoch": 338} {"train_loss": -18.294239044189453, "global_step": 28055, "epoch": 338} {"train_loss": -18.676626205444336, "global_step": 28056, "epoch": 338} {"train_loss": -18.387914657592773, "global_step": 28057, "epoch": 338} {"train_loss": -18.804235458374023, "global_step": 28058, "epoch": 338} {"train_loss": -18.375795364379883, "global_step": 28059, "epoch": 338} {"train_loss": -18.610107421875, "global_step": 28060, "epoch": 338} {"train_loss": -18.39858055114746, "global_step": 28061, "epoch": 338} {"train_loss": -18.741064071655273, "global_step": 28062, "epoch": 338} {"train_loss": -18.712026596069336, "global_step": 28063, "epoch": 338} {"train_loss": -18.789752960205078, "global_step": 28064, "epoch": 338} {"train_loss": -18.93317413330078, "global_step": 28065, "epoch": 338} {"train_loss": -18.6861572265625, "global_step": 28066, "epoch": 338} {"train_loss": -18.55877685546875, "global_step": 28067, "epoch": 338} {"train_loss": -18.362293243408203, "global_step": 28068, "epoch": 338} {"train_loss": -18.85110855102539, "global_step": 28069, "epoch": 338} {"train_loss": -18.5425968170166, "global_step": 28070, "epoch": 338} {"train_loss": -18.714954376220703, "global_step": 28071, "epoch": 338} {"train_loss": -18.483966827392578, "global_step": 28072, "epoch": 338} {"train_loss": -18.94847297668457, "global_step": 28073, "epoch": 338} {"train_loss": -18.885517120361328, "global_step": 28074, "epoch": 338} {"train_loss": -19.211149215698242, "global_step": 28075, "epoch": 338} {"train_loss": -18.8797607421875, "global_step": 28076, "epoch": 338} {"train_loss": -18.918487548828125, "global_step": 28077, "epoch": 338} {"train_loss": -18.92292594909668, "global_step": 28078, "epoch": 338} {"train_loss": -18.459806442260742, "global_step": 28079, "epoch": 338} {"train_loss": -18.657146453857422, "global_step": 28080, "epoch": 338} {"train_loss": -19.093076705932617, "global_step": 28081, "epoch": 338} {"train_loss": -18.815603256225586, "global_step": 28082, "epoch": 338} {"train_loss": -18.539356231689453, "global_step": 28083, "epoch": 338} {"train_loss": -18.79949951171875, "global_step": 28084, "epoch": 338} {"train_loss": -18.738754272460938, "global_step": 28085, "epoch": 338} {"train_loss": -18.832059860229492, "global_step": 28086, "epoch": 338} {"train_loss": -18.829204559326172, "global_step": 28087, "epoch": 338} {"train_loss": -19.204559326171875, "global_step": 28088, "epoch": 338} {"train_loss": -19.03740882873535, "global_step": 28089, "epoch": 338} {"train_loss": -19.309167861938477, "global_step": 28090, "epoch": 338} {"train_loss": -18.711050033569336, "global_step": 28091, "epoch": 338} {"train_loss": -18.72980308532715, "global_step": 28092, "epoch": 338} {"train_loss": -19.10593605041504, "global_step": 28093, "epoch": 338} {"train_loss": -18.806123733520508, "global_step": 28094, "epoch": 338} {"train_loss": -19.011281967163086, "global_step": 28095, "epoch": 338} {"train_loss": -18.624704360961914, "global_step": 28096, "epoch": 338} {"train_loss": -18.708572387695312, "global_step": 28097, "epoch": 338} {"train_loss": -18.881549835205078, "global_step": 28098, "epoch": 338} {"train_loss": -18.99335289001465, "global_step": 28099, "epoch": 338} {"train_loss": -18.987838745117188, "global_step": 28100, "epoch": 338} {"train_loss": -18.61203384399414, "global_step": 28101, "epoch": 338} {"train_loss": -18.759138107299805, "global_step": 28102, "epoch": 338} {"train_loss": -18.904783248901367, "global_step": 28103, "epoch": 338} {"train_loss": -19.1192569732666, "global_step": 28104, "epoch": 338} {"train_loss": -18.79722023010254, "global_step": 28105, "epoch": 338} {"train_loss": -18.86048698425293, "global_step": 28106, "epoch": 338} {"train_loss": -18.975587844848633, "global_step": 28107, "epoch": 338} {"train_loss": -18.715526580810547, "global_step": 28108, "epoch": 338} {"train_loss": -19.066747665405273, "global_step": 28109, "epoch": 338} {"train_loss": -18.93753433227539, "global_step": 28110, "epoch": 338} {"train_loss": -18.875104904174805, "global_step": 28111, "epoch": 338} {"train_loss": -18.912887573242188, "global_step": 28112, "epoch": 338} {"train_loss": -18.7299747467041, "global_step": 28113, "epoch": 338} {"train_loss": -18.75067710876465, "global_step": 28114, "epoch": 338} {"train_loss": -18.781450271606445, "global_step": 28115, "epoch": 338} {"train_loss": -18.808748245239258, "global_step": 28116, "epoch": 338} {"train_loss": -18.67378044128418, "global_step": 28117, "epoch": 338} {"train_loss": -18.87434959411621, "global_step": 28118, "epoch": 338} {"train_loss": -18.893428802490234, "global_step": 28119, "epoch": 338} {"train_loss": -18.424434661865234, "global_step": 28120, "epoch": 338} {"train_loss": -18.6832218170166, "global_step": 28121, "epoch": 338} {"train_loss": -18.981739044189453, "global_step": 28122, "epoch": 338} {"train_loss": -18.929906845092773, "global_step": 28123, "epoch": 338} {"train_loss": -18.7905330657959, "global_step": 28124, "epoch": 338} {"train_loss": -18.971418380737305, "global_step": 28125, "epoch": 338} {"train_loss": -18.7420597076416, "global_step": 28126, "epoch": 338} {"train_loss": -18.829673767089844, "global_step": 28127, "epoch": 338} {"train_loss": -18.793413162231445, "global_step": 28128, "epoch": 338} {"train_loss": -18.979175567626953, "global_step": 28129, "epoch": 338} {"train_loss": -18.752370834350586, "global_step": 28130, "epoch": 338} {"train_loss": -18.814321517944336, "global_step": 28131, "epoch": 338} {"train_loss": -18.932598114013672, "global_step": 28132, "epoch": 338} {"train_loss": -18.923412322998047, "global_step": 28133, "epoch": 338} {"train_loss": -18.647871017456055, "global_step": 28134, "epoch": 338} {"train_loss": -18.67268943786621, "global_step": 28135, "epoch": 338} {"train_loss": -18.799721959125566, "global_step": 28136, "epoch": 338, "val_loss": 5998131.0} {"train_loss": -18.644655227661133, "global_step": 28137, "epoch": 339} {"train_loss": -18.62078857421875, "global_step": 28138, "epoch": 339} {"train_loss": -18.876623153686523, "global_step": 28139, "epoch": 339} {"train_loss": -18.69845199584961, "global_step": 28140, "epoch": 339} {"train_loss": -18.768966674804688, "global_step": 28141, "epoch": 339} {"train_loss": -18.71503448486328, "global_step": 28142, "epoch": 339} {"train_loss": -18.775482177734375, "global_step": 28143, "epoch": 339} {"train_loss": -19.032516479492188, "global_step": 28144, "epoch": 339} {"train_loss": -18.934232711791992, "global_step": 28145, "epoch": 339} {"train_loss": -18.593299865722656, "global_step": 28146, "epoch": 339} {"train_loss": -18.838611602783203, "global_step": 28147, "epoch": 339} {"train_loss": -19.046539306640625, "global_step": 28148, "epoch": 339} {"train_loss": -18.908409118652344, "global_step": 28149, "epoch": 339} {"train_loss": -18.347753524780273, "global_step": 28150, "epoch": 339} {"train_loss": -18.45462417602539, "global_step": 28151, "epoch": 339} {"train_loss": -18.383493423461914, "global_step": 28152, "epoch": 339} {"train_loss": -18.840940475463867, "global_step": 28153, "epoch": 339} {"train_loss": -18.88096046447754, "global_step": 28154, "epoch": 339} {"train_loss": -18.806303024291992, "global_step": 28155, "epoch": 339} {"train_loss": -18.479761123657227, "global_step": 28156, "epoch": 339} {"train_loss": -18.798437118530273, "global_step": 28157, "epoch": 339} {"train_loss": -18.732404708862305, "global_step": 28158, "epoch": 339} {"train_loss": -19.113784790039062, "global_step": 28159, "epoch": 339} {"train_loss": -18.75716781616211, "global_step": 28160, "epoch": 339} {"train_loss": -18.590036392211914, "global_step": 28161, "epoch": 339} {"train_loss": -18.71864891052246, "global_step": 28162, "epoch": 339} {"train_loss": -18.955677032470703, "global_step": 28163, "epoch": 339} {"train_loss": -19.1403865814209, "global_step": 28164, "epoch": 339} {"train_loss": -18.99395179748535, "global_step": 28165, "epoch": 339} {"train_loss": -18.939367294311523, "global_step": 28166, "epoch": 339} {"train_loss": -18.751264572143555, "global_step": 28167, "epoch": 339} {"train_loss": -18.67671012878418, "global_step": 28168, "epoch": 339} {"train_loss": -18.7500057220459, "global_step": 28169, "epoch": 339} {"train_loss": -18.64668083190918, "global_step": 28170, "epoch": 339} {"train_loss": -18.963991165161133, "global_step": 28171, "epoch": 339} {"train_loss": -18.61893653869629, "global_step": 28172, "epoch": 339} {"train_loss": -18.272369384765625, "global_step": 28173, "epoch": 339} {"train_loss": -18.545034408569336, "global_step": 28174, "epoch": 339} {"train_loss": -18.959980010986328, "global_step": 28175, "epoch": 339} {"train_loss": -18.802597045898438, "global_step": 28176, "epoch": 339} {"train_loss": -18.923086166381836, "global_step": 28177, "epoch": 339} {"train_loss": -18.645265579223633, "global_step": 28178, "epoch": 339} {"train_loss": -18.43110466003418, "global_step": 28179, "epoch": 339} {"train_loss": -18.844039916992188, "global_step": 28180, "epoch": 339} {"train_loss": -18.99903678894043, "global_step": 28181, "epoch": 339} {"train_loss": -19.023208618164062, "global_step": 28182, "epoch": 339} {"train_loss": -19.11517906188965, "global_step": 28183, "epoch": 339} {"train_loss": -18.854185104370117, "global_step": 28184, "epoch": 339} {"train_loss": -18.93503189086914, "global_step": 28185, "epoch": 339} {"train_loss": -19.17970085144043, "global_step": 28186, "epoch": 339} {"train_loss": -18.978958129882812, "global_step": 28187, "epoch": 339} {"train_loss": -18.371732711791992, "global_step": 28188, "epoch": 339} {"train_loss": -18.94646453857422, "global_step": 28189, "epoch": 339} {"train_loss": -18.743452072143555, "global_step": 28190, "epoch": 339} {"train_loss": -18.531091690063477, "global_step": 28191, "epoch": 339} {"train_loss": -19.015586853027344, "global_step": 28192, "epoch": 339} {"train_loss": -18.791067123413086, "global_step": 28193, "epoch": 339} {"train_loss": -19.142393112182617, "global_step": 28194, "epoch": 339} {"train_loss": -18.93830680847168, "global_step": 28195, "epoch": 339} {"train_loss": -19.088886260986328, "global_step": 28196, "epoch": 339} {"train_loss": -18.771982192993164, "global_step": 28197, "epoch": 339} {"train_loss": -18.83656120300293, "global_step": 28198, "epoch": 339} {"train_loss": -18.849109649658203, "global_step": 28199, "epoch": 339} {"train_loss": -19.043594360351562, "global_step": 28200, "epoch": 339} {"train_loss": -18.65254783630371, "global_step": 28201, "epoch": 339} {"train_loss": -18.678260803222656, "global_step": 28202, "epoch": 339} {"train_loss": -18.762104034423828, "global_step": 28203, "epoch": 339} {"train_loss": -18.856231689453125, "global_step": 28204, "epoch": 339} {"train_loss": -19.020450592041016, "global_step": 28205, "epoch": 339} {"train_loss": -18.910446166992188, "global_step": 28206, "epoch": 339} {"train_loss": -18.850799560546875, "global_step": 28207, "epoch": 339} {"train_loss": -18.781904220581055, "global_step": 28208, "epoch": 339} {"train_loss": -18.883811950683594, "global_step": 28209, "epoch": 339} {"train_loss": -18.840200424194336, "global_step": 28210, "epoch": 339} {"train_loss": -18.814376831054688, "global_step": 28211, "epoch": 339} {"train_loss": -18.443832397460938, "global_step": 28212, "epoch": 339} {"train_loss": -19.14805030822754, "global_step": 28213, "epoch": 339} {"train_loss": -19.110580444335938, "global_step": 28214, "epoch": 339} {"train_loss": -18.559898376464844, "global_step": 28215, "epoch": 339} {"train_loss": -19.18939781188965, "global_step": 28216, "epoch": 339} {"train_loss": -19.30523681640625, "global_step": 28217, "epoch": 339} {"train_loss": -18.67076873779297, "global_step": 28218, "epoch": 339} {"train_loss": -18.83953914872135, "global_step": 28219, "epoch": 339, "val_loss": 5940722.5} {"train_loss": -18.58302879333496, "global_step": 28220, "epoch": 340} {"train_loss": -19.01898193359375, "global_step": 28221, "epoch": 340} {"train_loss": -18.73560905456543, "global_step": 28222, "epoch": 340} {"train_loss": -18.872943878173828, "global_step": 28223, "epoch": 340} {"train_loss": -18.980314254760742, "global_step": 28224, "epoch": 340} {"train_loss": -18.68968391418457, "global_step": 28225, "epoch": 340} {"train_loss": -18.749279022216797, "global_step": 28226, "epoch": 340} {"train_loss": -18.96170997619629, "global_step": 28227, "epoch": 340} {"train_loss": -18.833724975585938, "global_step": 28228, "epoch": 340} {"train_loss": -18.679113388061523, "global_step": 28229, "epoch": 340} {"train_loss": -18.942710876464844, "global_step": 28230, "epoch": 340} {"train_loss": -18.567642211914062, "global_step": 28231, "epoch": 340} {"train_loss": -18.632492065429688, "global_step": 28232, "epoch": 340} {"train_loss": -18.672231674194336, "global_step": 28233, "epoch": 340} {"train_loss": -19.180755615234375, "global_step": 28234, "epoch": 340} {"train_loss": -18.8742733001709, "global_step": 28235, "epoch": 340} {"train_loss": -18.7396297454834, "global_step": 28236, "epoch": 340} {"train_loss": -18.588171005249023, "global_step": 28237, "epoch": 340} {"train_loss": -19.037931442260742, "global_step": 28238, "epoch": 340} {"train_loss": -18.896484375, "global_step": 28239, "epoch": 340} {"train_loss": -19.219125747680664, "global_step": 28240, "epoch": 340} {"train_loss": -18.733678817749023, "global_step": 28241, "epoch": 340} {"train_loss": -18.78126335144043, "global_step": 28242, "epoch": 340} {"train_loss": -18.78363609313965, "global_step": 28243, "epoch": 340} {"train_loss": -18.62554168701172, "global_step": 28244, "epoch": 340} {"train_loss": -19.062278747558594, "global_step": 28245, "epoch": 340} {"train_loss": -18.256465911865234, "global_step": 28246, "epoch": 340} {"train_loss": -18.945478439331055, "global_step": 28247, "epoch": 340} {"train_loss": -18.93604278564453, "global_step": 28248, "epoch": 340} {"train_loss": -19.31082534790039, "global_step": 28249, "epoch": 340} {"train_loss": -18.611146926879883, "global_step": 28250, "epoch": 340} {"train_loss": -19.024402618408203, "global_step": 28251, "epoch": 340} {"train_loss": -18.764719009399414, "global_step": 28252, "epoch": 340} {"train_loss": -19.120695114135742, "global_step": 28253, "epoch": 340} {"train_loss": -18.68417739868164, "global_step": 28254, "epoch": 340} {"train_loss": -18.95265769958496, "global_step": 28255, "epoch": 340} {"train_loss": -19.080793380737305, "global_step": 28256, "epoch": 340} {"train_loss": -18.698223114013672, "global_step": 28257, "epoch": 340} {"train_loss": -18.591312408447266, "global_step": 28258, "epoch": 340} {"train_loss": -18.50576400756836, "global_step": 28259, "epoch": 340} {"train_loss": -18.708133697509766, "global_step": 28260, "epoch": 340} {"train_loss": -19.063810348510742, "global_step": 28261, "epoch": 340} {"train_loss": -18.84235191345215, "global_step": 28262, "epoch": 340} {"train_loss": -18.753173828125, "global_step": 28263, "epoch": 340} {"train_loss": -18.70292091369629, "global_step": 28264, "epoch": 340} {"train_loss": -18.70369529724121, "global_step": 28265, "epoch": 340} {"train_loss": -18.762659072875977, "global_step": 28266, "epoch": 340} {"train_loss": -18.957672119140625, "global_step": 28267, "epoch": 340} {"train_loss": -18.9494571685791, "global_step": 28268, "epoch": 340} {"train_loss": -19.07203483581543, "global_step": 28269, "epoch": 340} {"train_loss": -18.787160873413086, "global_step": 28270, "epoch": 340} {"train_loss": -18.953794479370117, "global_step": 28271, "epoch": 340} {"train_loss": -18.7292537689209, "global_step": 28272, "epoch": 340} {"train_loss": -18.894195556640625, "global_step": 28273, "epoch": 340} {"train_loss": -18.920331954956055, "global_step": 28274, "epoch": 340} {"train_loss": -18.99699592590332, "global_step": 28275, "epoch": 340} {"train_loss": -18.945945739746094, "global_step": 28276, "epoch": 340} {"train_loss": -18.78744888305664, "global_step": 28277, "epoch": 340} {"train_loss": -19.005329132080078, "global_step": 28278, "epoch": 340} {"train_loss": -18.75981330871582, "global_step": 28279, "epoch": 340} {"train_loss": -18.487751007080078, "global_step": 28280, "epoch": 340} {"train_loss": -19.002655029296875, "global_step": 28281, "epoch": 340} {"train_loss": -18.554174423217773, "global_step": 28282, "epoch": 340} {"train_loss": -18.86553192138672, "global_step": 28283, "epoch": 340} {"train_loss": -18.61710548400879, "global_step": 28284, "epoch": 340} {"train_loss": -18.704147338867188, "global_step": 28285, "epoch": 340} {"train_loss": -18.976789474487305, "global_step": 28286, "epoch": 340} {"train_loss": -19.07771873474121, "global_step": 28287, "epoch": 340} {"train_loss": -18.58941078186035, "global_step": 28288, "epoch": 340} {"train_loss": -19.07154655456543, "global_step": 28289, "epoch": 340} {"train_loss": -19.174100875854492, "global_step": 28290, "epoch": 340} {"train_loss": -19.140583038330078, "global_step": 28291, "epoch": 340} {"train_loss": -18.597246170043945, "global_step": 28292, "epoch": 340} {"train_loss": -18.819486618041992, "global_step": 28293, "epoch": 340} {"train_loss": -18.67900848388672, "global_step": 28294, "epoch": 340} {"train_loss": -18.97027587890625, "global_step": 28295, "epoch": 340} {"train_loss": -19.069272994995117, "global_step": 28296, "epoch": 340} {"train_loss": -18.658069610595703, "global_step": 28297, "epoch": 340} {"train_loss": -18.958547592163086, "global_step": 28298, "epoch": 340} {"train_loss": -18.74749183654785, "global_step": 28299, "epoch": 340} {"train_loss": -19.184412002563477, "global_step": 28300, "epoch": 340} {"train_loss": -19.27581214904785, "global_step": 28301, "epoch": 340} {"train_loss": -18.86238596812788, "global_step": 28302, "epoch": 340, "val_loss": 6085748.0} {"train_loss": -18.845260620117188, "global_step": 28303, "epoch": 341} {"train_loss": -18.672199249267578, "global_step": 28304, "epoch": 341} {"train_loss": -18.492826461791992, "global_step": 28305, "epoch": 341} {"train_loss": -18.548542022705078, "global_step": 28306, "epoch": 341} {"train_loss": -18.929046630859375, "global_step": 28307, "epoch": 341} {"train_loss": -18.68385887145996, "global_step": 28308, "epoch": 341} {"train_loss": -18.941490173339844, "global_step": 28309, "epoch": 341} {"train_loss": -18.819250106811523, "global_step": 28310, "epoch": 341} {"train_loss": -19.01121711730957, "global_step": 28311, "epoch": 341} {"train_loss": -18.77859878540039, "global_step": 28312, "epoch": 341} {"train_loss": -19.169158935546875, "global_step": 28313, "epoch": 341} {"train_loss": -18.863142013549805, "global_step": 28314, "epoch": 341} {"train_loss": -19.15079116821289, "global_step": 28315, "epoch": 341} {"train_loss": -18.519420623779297, "global_step": 28316, "epoch": 341} {"train_loss": -19.00190544128418, "global_step": 28317, "epoch": 341} {"train_loss": -18.91579246520996, "global_step": 28318, "epoch": 341} {"train_loss": -19.142343521118164, "global_step": 28319, "epoch": 341} {"train_loss": -19.004587173461914, "global_step": 28320, "epoch": 341} {"train_loss": -18.79352378845215, "global_step": 28321, "epoch": 341} {"train_loss": -19.324901580810547, "global_step": 28322, "epoch": 341} {"train_loss": -19.17225456237793, "global_step": 28323, "epoch": 341} {"train_loss": -18.848783493041992, "global_step": 28324, "epoch": 341} {"train_loss": -19.013164520263672, "global_step": 28325, "epoch": 341} {"train_loss": -18.820661544799805, "global_step": 28326, "epoch": 341} {"train_loss": -18.724639892578125, "global_step": 28327, "epoch": 341} {"train_loss": -18.736351013183594, "global_step": 28328, "epoch": 341} {"train_loss": -18.59048080444336, "global_step": 28329, "epoch": 341} {"train_loss": -18.639925003051758, "global_step": 28330, "epoch": 341} {"train_loss": -18.836833953857422, "global_step": 28331, "epoch": 341} {"train_loss": -18.600027084350586, "global_step": 28332, "epoch": 341} {"train_loss": -18.562376022338867, "global_step": 28333, "epoch": 341} {"train_loss": -18.565567016601562, "global_step": 28334, "epoch": 341} {"train_loss": -19.087329864501953, "global_step": 28335, "epoch": 341} {"train_loss": -19.225996017456055, "global_step": 28336, "epoch": 341} {"train_loss": -18.832239151000977, "global_step": 28337, "epoch": 341} {"train_loss": -19.00052833557129, "global_step": 28338, "epoch": 341} {"train_loss": -18.71599769592285, "global_step": 28339, "epoch": 341} {"train_loss": -18.75379753112793, "global_step": 28340, "epoch": 341} {"train_loss": -19.11174201965332, "global_step": 28341, "epoch": 341} {"train_loss": -18.738035202026367, "global_step": 28342, "epoch": 341} {"train_loss": -18.894577026367188, "global_step": 28343, "epoch": 341} {"train_loss": -18.95863151550293, "global_step": 28344, "epoch": 341} {"train_loss": -18.84208106994629, "global_step": 28345, "epoch": 341} {"train_loss": -18.84417724609375, "global_step": 28346, "epoch": 341} {"train_loss": -18.82883071899414, "global_step": 28347, "epoch": 341} {"train_loss": -19.17453384399414, "global_step": 28348, "epoch": 341} {"train_loss": -19.095722198486328, "global_step": 28349, "epoch": 341} {"train_loss": -18.383853912353516, "global_step": 28350, "epoch": 341} {"train_loss": -18.855222702026367, "global_step": 28351, "epoch": 341} {"train_loss": -18.726322174072266, "global_step": 28352, "epoch": 341} {"train_loss": -19.006078720092773, "global_step": 28353, "epoch": 341} {"train_loss": -19.171146392822266, "global_step": 28354, "epoch": 341} {"train_loss": -19.095966339111328, "global_step": 28355, "epoch": 341} {"train_loss": -18.681257247924805, "global_step": 28356, "epoch": 341} {"train_loss": -18.756793975830078, "global_step": 28357, "epoch": 341} {"train_loss": -19.260480880737305, "global_step": 28358, "epoch": 341} {"train_loss": -19.163488388061523, "global_step": 28359, "epoch": 341} {"train_loss": -18.74153709411621, "global_step": 28360, "epoch": 341} {"train_loss": -19.260848999023438, "global_step": 28361, "epoch": 341} {"train_loss": -18.773786544799805, "global_step": 28362, "epoch": 341} {"train_loss": -18.362823486328125, "global_step": 28363, "epoch": 341} {"train_loss": -18.610868453979492, "global_step": 28364, "epoch": 341} {"train_loss": -18.682483673095703, "global_step": 28365, "epoch": 341} {"train_loss": -18.74519157409668, "global_step": 28366, "epoch": 341} {"train_loss": -18.69150733947754, "global_step": 28367, "epoch": 341} {"train_loss": -19.131458282470703, "global_step": 28368, "epoch": 341} {"train_loss": -19.18238639831543, "global_step": 28369, "epoch": 341} {"train_loss": -18.77925682067871, "global_step": 28370, "epoch": 341} {"train_loss": -18.97467613220215, "global_step": 28371, "epoch": 341} {"train_loss": -18.63555908203125, "global_step": 28372, "epoch": 341} {"train_loss": -18.639583587646484, "global_step": 28373, "epoch": 341} {"train_loss": -18.956037521362305, "global_step": 28374, "epoch": 341} {"train_loss": -18.860280990600586, "global_step": 28375, "epoch": 341} {"train_loss": -18.713674545288086, "global_step": 28376, "epoch": 341} {"train_loss": -18.822093963623047, "global_step": 28377, "epoch": 341} {"train_loss": -18.843542098999023, "global_step": 28378, "epoch": 341} {"train_loss": -18.875160217285156, "global_step": 28379, "epoch": 341} {"train_loss": -18.961511611938477, "global_step": 28380, "epoch": 341} {"train_loss": -19.016450881958008, "global_step": 28381, "epoch": 341} {"train_loss": -18.89686393737793, "global_step": 28382, "epoch": 341} {"train_loss": -18.87107276916504, "global_step": 28383, "epoch": 341} {"train_loss": -18.79746437072754, "global_step": 28384, "epoch": 341} {"train_loss": -18.884363174438477, "global_step": 28385, "epoch": 341, "val_loss": 6013655.0} {"train_loss": -18.65335464477539, "global_step": 28386, "epoch": 342} {"train_loss": -18.572546005249023, "global_step": 28387, "epoch": 342} {"train_loss": -19.117734909057617, "global_step": 28388, "epoch": 342} {"train_loss": -18.79900550842285, "global_step": 28389, "epoch": 342} {"train_loss": -18.840246200561523, "global_step": 28390, "epoch": 342} {"train_loss": -18.70393943786621, "global_step": 28391, "epoch": 342} {"train_loss": -19.011871337890625, "global_step": 28392, "epoch": 342} {"train_loss": -18.945341110229492, "global_step": 28393, "epoch": 342} {"train_loss": -19.22270393371582, "global_step": 28394, "epoch": 342} {"train_loss": -18.74135398864746, "global_step": 28395, "epoch": 342} {"train_loss": -18.801925659179688, "global_step": 28396, "epoch": 342} {"train_loss": -18.781997680664062, "global_step": 28397, "epoch": 342} {"train_loss": -18.89713478088379, "global_step": 28398, "epoch": 342} {"train_loss": -18.859403610229492, "global_step": 28399, "epoch": 342} {"train_loss": -18.70789909362793, "global_step": 28400, "epoch": 342} {"train_loss": -18.70651626586914, "global_step": 28401, "epoch": 342} {"train_loss": -18.97633171081543, "global_step": 28402, "epoch": 342} {"train_loss": -18.704240798950195, "global_step": 28403, "epoch": 342} {"train_loss": -19.022607803344727, "global_step": 28404, "epoch": 342} {"train_loss": -18.925037384033203, "global_step": 28405, "epoch": 342} {"train_loss": -18.89460563659668, "global_step": 28406, "epoch": 342} {"train_loss": -18.56412696838379, "global_step": 28407, "epoch": 342} {"train_loss": -19.18366813659668, "global_step": 28408, "epoch": 342} {"train_loss": -18.980558395385742, "global_step": 28409, "epoch": 342} {"train_loss": -19.006954193115234, "global_step": 28410, "epoch": 342} {"train_loss": -19.026281356811523, "global_step": 28411, "epoch": 342} {"train_loss": -19.274328231811523, "global_step": 28412, "epoch": 342} {"train_loss": -18.53972816467285, "global_step": 28413, "epoch": 342} {"train_loss": -18.83147621154785, "global_step": 28414, "epoch": 342} {"train_loss": -19.029296875, "global_step": 28415, "epoch": 342} {"train_loss": -18.498884201049805, "global_step": 28416, "epoch": 342} {"train_loss": -18.621639251708984, "global_step": 28417, "epoch": 342} {"train_loss": -18.83271598815918, "global_step": 28418, "epoch": 342} {"train_loss": -18.684778213500977, "global_step": 28419, "epoch": 342} {"train_loss": -18.88381004333496, "global_step": 28420, "epoch": 342} {"train_loss": -18.96590232849121, "global_step": 28421, "epoch": 342} {"train_loss": -18.712087631225586, "global_step": 28422, "epoch": 342} {"train_loss": -18.591386795043945, "global_step": 28423, "epoch": 342} {"train_loss": -18.92171287536621, "global_step": 28424, "epoch": 342} {"train_loss": -18.868885040283203, "global_step": 28425, "epoch": 342} {"train_loss": -18.853479385375977, "global_step": 28426, "epoch": 342} {"train_loss": -18.850675582885742, "global_step": 28427, "epoch": 342} {"train_loss": -19.179670333862305, "global_step": 28428, "epoch": 342} {"train_loss": -18.86384391784668, "global_step": 28429, "epoch": 342} {"train_loss": -19.03916358947754, "global_step": 28430, "epoch": 342} {"train_loss": -19.33854103088379, "global_step": 28431, "epoch": 342} {"train_loss": -18.8977108001709, "global_step": 28432, "epoch": 342} {"train_loss": -18.96650505065918, "global_step": 28433, "epoch": 342} {"train_loss": -19.378681182861328, "global_step": 28434, "epoch": 342} {"train_loss": -18.550554275512695, "global_step": 28435, "epoch": 342} {"train_loss": -18.809574127197266, "global_step": 28436, "epoch": 342} {"train_loss": -18.75335121154785, "global_step": 28437, "epoch": 342} {"train_loss": -18.854408264160156, "global_step": 28438, "epoch": 342} {"train_loss": -18.822879791259766, "global_step": 28439, "epoch": 342} {"train_loss": -18.971832275390625, "global_step": 28440, "epoch": 342} {"train_loss": -19.143882751464844, "global_step": 28441, "epoch": 342} {"train_loss": -19.243745803833008, "global_step": 28442, "epoch": 342} {"train_loss": -19.04345703125, "global_step": 28443, "epoch": 342} {"train_loss": -19.039005279541016, "global_step": 28444, "epoch": 342} {"train_loss": -19.313865661621094, "global_step": 28445, "epoch": 342} {"train_loss": -18.755205154418945, "global_step": 28446, "epoch": 342} {"train_loss": -19.016836166381836, "global_step": 28447, "epoch": 342} {"train_loss": -18.65367889404297, "global_step": 28448, "epoch": 342} {"train_loss": -18.372928619384766, "global_step": 28449, "epoch": 342} {"train_loss": -18.902713775634766, "global_step": 28450, "epoch": 342} {"train_loss": -18.878965377807617, "global_step": 28451, "epoch": 342} {"train_loss": -18.849472045898438, "global_step": 28452, "epoch": 342} {"train_loss": -18.726974487304688, "global_step": 28453, "epoch": 342} {"train_loss": -18.99875831604004, "global_step": 28454, "epoch": 342} {"train_loss": -18.78886604309082, "global_step": 28455, "epoch": 342} {"train_loss": -19.020357131958008, "global_step": 28456, "epoch": 342} {"train_loss": -18.495445251464844, "global_step": 28457, "epoch": 342} {"train_loss": -18.709135055541992, "global_step": 28458, "epoch": 342} {"train_loss": -19.093080520629883, "global_step": 28459, "epoch": 342} {"train_loss": -18.82291030883789, "global_step": 28460, "epoch": 342} {"train_loss": -19.147268295288086, "global_step": 28461, "epoch": 342} {"train_loss": -18.74439811706543, "global_step": 28462, "epoch": 342} {"train_loss": -18.890607833862305, "global_step": 28463, "epoch": 342} {"train_loss": -18.676822662353516, "global_step": 28464, "epoch": 342} {"train_loss": -18.810333251953125, "global_step": 28465, "epoch": 342} {"train_loss": -18.694469451904297, "global_step": 28466, "epoch": 342} {"train_loss": -18.456693649291992, "global_step": 28467, "epoch": 342} {"train_loss": -18.866205537175556, "global_step": 28468, "epoch": 342, "val_loss": 6280376.0} {"train_loss": -18.439477920532227, "global_step": 28469, "epoch": 343} {"train_loss": -18.316255569458008, "global_step": 28470, "epoch": 343} {"train_loss": -18.413793563842773, "global_step": 28471, "epoch": 343} {"train_loss": -18.710678100585938, "global_step": 28472, "epoch": 343} {"train_loss": -18.53908920288086, "global_step": 28473, "epoch": 343} {"train_loss": -18.50592613220215, "global_step": 28474, "epoch": 343} {"train_loss": -18.516489028930664, "global_step": 28475, "epoch": 343} {"train_loss": -18.467758178710938, "global_step": 28476, "epoch": 343} {"train_loss": -18.208906173706055, "global_step": 28477, "epoch": 343} {"train_loss": -18.526081085205078, "global_step": 28478, "epoch": 343} {"train_loss": -18.4235782623291, "global_step": 28479, "epoch": 343} {"train_loss": -18.434804916381836, "global_step": 28480, "epoch": 343} {"train_loss": -18.963504791259766, "global_step": 28481, "epoch": 343} {"train_loss": -19.216175079345703, "global_step": 28482, "epoch": 343} {"train_loss": -18.846357345581055, "global_step": 28483, "epoch": 343} {"train_loss": -18.650171279907227, "global_step": 28484, "epoch": 343} {"train_loss": -18.339054107666016, "global_step": 28485, "epoch": 343} {"train_loss": -19.100431442260742, "global_step": 28486, "epoch": 343} {"train_loss": -18.801471710205078, "global_step": 28487, "epoch": 343} {"train_loss": -18.542387008666992, "global_step": 28488, "epoch": 343} {"train_loss": -18.52107810974121, "global_step": 28489, "epoch": 343} {"train_loss": -18.57204246520996, "global_step": 28490, "epoch": 343} {"train_loss": -18.789453506469727, "global_step": 28491, "epoch": 343} {"train_loss": -18.8212947845459, "global_step": 28492, "epoch": 343} {"train_loss": -18.5958194732666, "global_step": 28493, "epoch": 343} {"train_loss": -18.887760162353516, "global_step": 28494, "epoch": 343} {"train_loss": -18.764102935791016, "global_step": 28495, "epoch": 343} {"train_loss": -19.014883041381836, "global_step": 28496, "epoch": 343} {"train_loss": -18.426549911499023, "global_step": 28497, "epoch": 343} {"train_loss": -18.915878295898438, "global_step": 28498, "epoch": 343} {"train_loss": -18.853296279907227, "global_step": 28499, "epoch": 343} {"train_loss": -18.7530574798584, "global_step": 28500, "epoch": 343} {"train_loss": -18.534231185913086, "global_step": 28501, "epoch": 343} {"train_loss": -18.778940200805664, "global_step": 28502, "epoch": 343} {"train_loss": -18.549152374267578, "global_step": 28503, "epoch": 343} {"train_loss": -19.07000732421875, "global_step": 28504, "epoch": 343} {"train_loss": -18.396833419799805, "global_step": 28505, "epoch": 343} {"train_loss": -18.74606704711914, "global_step": 28506, "epoch": 343} {"train_loss": -18.673105239868164, "global_step": 28507, "epoch": 343} {"train_loss": -19.25042152404785, "global_step": 28508, "epoch": 343} {"train_loss": -19.03663444519043, "global_step": 28509, "epoch": 343} {"train_loss": -18.66586685180664, "global_step": 28510, "epoch": 343} {"train_loss": -19.087173461914062, "global_step": 28511, "epoch": 343} {"train_loss": -19.193649291992188, "global_step": 28512, "epoch": 343} {"train_loss": -18.597270965576172, "global_step": 28513, "epoch": 343} {"train_loss": -18.852558135986328, "global_step": 28514, "epoch": 343} {"train_loss": -18.8941707611084, "global_step": 28515, "epoch": 343} {"train_loss": -18.78677749633789, "global_step": 28516, "epoch": 343} {"train_loss": -19.0124454498291, "global_step": 28517, "epoch": 343} {"train_loss": -19.210363388061523, "global_step": 28518, "epoch": 343} {"train_loss": -19.160442352294922, "global_step": 28519, "epoch": 343} {"train_loss": -19.0534725189209, "global_step": 28520, "epoch": 343} {"train_loss": -18.558074951171875, "global_step": 28521, "epoch": 343} {"train_loss": -18.889936447143555, "global_step": 28522, "epoch": 343} {"train_loss": -18.86583709716797, "global_step": 28523, "epoch": 343} {"train_loss": -18.678916931152344, "global_step": 28524, "epoch": 343} {"train_loss": -18.731412887573242, "global_step": 28525, "epoch": 343} {"train_loss": -19.582626342773438, "global_step": 28526, "epoch": 343} {"train_loss": -18.947233200073242, "global_step": 28527, "epoch": 343} {"train_loss": -18.75461196899414, "global_step": 28528, "epoch": 343} {"train_loss": -18.95186424255371, "global_step": 28529, "epoch": 343} {"train_loss": -18.696491241455078, "global_step": 28530, "epoch": 343} {"train_loss": -18.962451934814453, "global_step": 28531, "epoch": 343} {"train_loss": -18.68494415283203, "global_step": 28532, "epoch": 343} {"train_loss": -18.740942001342773, "global_step": 28533, "epoch": 343} {"train_loss": -18.741863250732422, "global_step": 28534, "epoch": 343} {"train_loss": -18.573246002197266, "global_step": 28535, "epoch": 343} {"train_loss": -18.696691513061523, "global_step": 28536, "epoch": 343} {"train_loss": -19.12982749938965, "global_step": 28537, "epoch": 343} {"train_loss": -18.945663452148438, "global_step": 28538, "epoch": 343} {"train_loss": -18.987571716308594, "global_step": 28539, "epoch": 343} {"train_loss": -19.063064575195312, "global_step": 28540, "epoch": 343} {"train_loss": -18.96719741821289, "global_step": 28541, "epoch": 343} {"train_loss": -19.00855827331543, "global_step": 28542, "epoch": 343} {"train_loss": -18.854223251342773, "global_step": 28543, "epoch": 343} {"train_loss": -19.122936248779297, "global_step": 28544, "epoch": 343} {"train_loss": -18.74301528930664, "global_step": 28545, "epoch": 343} {"train_loss": -18.756982803344727, "global_step": 28546, "epoch": 343} {"train_loss": -18.639780044555664, "global_step": 28547, "epoch": 343} {"train_loss": -18.533008575439453, "global_step": 28548, "epoch": 343} {"train_loss": -19.003948211669922, "global_step": 28549, "epoch": 343} {"train_loss": -19.35541534423828, "global_step": 28550, "epoch": 343} {"train_loss": -18.79569281152932, "global_step": 28551, "epoch": 343, "val_loss": 6004387.0} {"train_loss": -18.583669662475586, "global_step": 28552, "epoch": 344} {"train_loss": -18.571928024291992, "global_step": 28553, "epoch": 344} {"train_loss": -18.51715850830078, "global_step": 28554, "epoch": 344} {"train_loss": -18.930877685546875, "global_step": 28555, "epoch": 344} {"train_loss": -19.168928146362305, "global_step": 28556, "epoch": 344} {"train_loss": -18.918319702148438, "global_step": 28557, "epoch": 344} {"train_loss": -18.424915313720703, "global_step": 28558, "epoch": 344} {"train_loss": -18.741474151611328, "global_step": 28559, "epoch": 344} {"train_loss": -18.954172134399414, "global_step": 28560, "epoch": 344} {"train_loss": -18.772563934326172, "global_step": 28561, "epoch": 344} {"train_loss": -18.812793731689453, "global_step": 28562, "epoch": 344} {"train_loss": -18.797212600708008, "global_step": 28563, "epoch": 344} {"train_loss": -18.91061019897461, "global_step": 28564, "epoch": 344} {"train_loss": -18.57962989807129, "global_step": 28565, "epoch": 344} {"train_loss": -18.94829750061035, "global_step": 28566, "epoch": 344} {"train_loss": -18.719837188720703, "global_step": 28567, "epoch": 344} {"train_loss": -18.8828182220459, "global_step": 28568, "epoch": 344} {"train_loss": -18.877063751220703, "global_step": 28569, "epoch": 344} {"train_loss": -18.79252052307129, "global_step": 28570, "epoch": 344} {"train_loss": -18.796504974365234, "global_step": 28571, "epoch": 344} {"train_loss": -18.683135986328125, "global_step": 28572, "epoch": 344} {"train_loss": -19.214027404785156, "global_step": 28573, "epoch": 344} {"train_loss": -18.71091651916504, "global_step": 28574, "epoch": 344} {"train_loss": -18.844898223876953, "global_step": 28575, "epoch": 344} {"train_loss": -18.685606002807617, "global_step": 28576, "epoch": 344} {"train_loss": -18.914535522460938, "global_step": 28577, "epoch": 344} {"train_loss": -18.71584701538086, "global_step": 28578, "epoch": 344} {"train_loss": -18.977262496948242, "global_step": 28579, "epoch": 344} {"train_loss": -18.864013671875, "global_step": 28580, "epoch": 344} {"train_loss": -19.106159210205078, "global_step": 28581, "epoch": 344} {"train_loss": -18.94773292541504, "global_step": 28582, "epoch": 344} {"train_loss": -18.938058853149414, "global_step": 28583, "epoch": 344} {"train_loss": -18.903303146362305, "global_step": 28584, "epoch": 344} {"train_loss": -18.56512451171875, "global_step": 28585, "epoch": 344} {"train_loss": -18.75014305114746, "global_step": 28586, "epoch": 344} {"train_loss": -19.283170700073242, "global_step": 28587, "epoch": 344} {"train_loss": -18.824222564697266, "global_step": 28588, "epoch": 344} {"train_loss": -18.878665924072266, "global_step": 28589, "epoch": 344} {"train_loss": -18.92926025390625, "global_step": 28590, "epoch": 344} {"train_loss": -18.761423110961914, "global_step": 28591, "epoch": 344} {"train_loss": -19.038915634155273, "global_step": 28592, "epoch": 344} {"train_loss": -18.947690963745117, "global_step": 28593, "epoch": 344} {"train_loss": -18.89124870300293, "global_step": 28594, "epoch": 344} {"train_loss": -18.989187240600586, "global_step": 28595, "epoch": 344} {"train_loss": -19.083784103393555, "global_step": 28596, "epoch": 344} {"train_loss": -19.045827865600586, "global_step": 28597, "epoch": 344} {"train_loss": -18.697111129760742, "global_step": 28598, "epoch": 344} {"train_loss": -18.762685775756836, "global_step": 28599, "epoch": 344} {"train_loss": -18.85470199584961, "global_step": 28600, "epoch": 344} {"train_loss": -18.628576278686523, "global_step": 28601, "epoch": 344} {"train_loss": -18.869272232055664, "global_step": 28602, "epoch": 344} {"train_loss": -18.63831901550293, "global_step": 28603, "epoch": 344} {"train_loss": -19.0617733001709, "global_step": 28604, "epoch": 344} {"train_loss": -18.75360679626465, "global_step": 28605, "epoch": 344} {"train_loss": -18.51736068725586, "global_step": 28606, "epoch": 344} {"train_loss": -18.886777877807617, "global_step": 28607, "epoch": 344} {"train_loss": -19.10344886779785, "global_step": 28608, "epoch": 344} {"train_loss": -18.825992584228516, "global_step": 28609, "epoch": 344} {"train_loss": -18.81080436706543, "global_step": 28610, "epoch": 344} {"train_loss": -18.653926849365234, "global_step": 28611, "epoch": 344} {"train_loss": -19.024213790893555, "global_step": 28612, "epoch": 344} {"train_loss": -19.06110954284668, "global_step": 28613, "epoch": 344} {"train_loss": -19.18115234375, "global_step": 28614, "epoch": 344} {"train_loss": -18.64516258239746, "global_step": 28615, "epoch": 344} {"train_loss": -18.882953643798828, "global_step": 28616, "epoch": 344} {"train_loss": -19.034147262573242, "global_step": 28617, "epoch": 344} {"train_loss": -18.735435485839844, "global_step": 28618, "epoch": 344} {"train_loss": -18.796554565429688, "global_step": 28619, "epoch": 344} {"train_loss": -18.726778030395508, "global_step": 28620, "epoch": 344} {"train_loss": -19.027631759643555, "global_step": 28621, "epoch": 344} {"train_loss": -18.622663497924805, "global_step": 28622, "epoch": 344} {"train_loss": -19.026731491088867, "global_step": 28623, "epoch": 344} {"train_loss": -18.81614112854004, "global_step": 28624, "epoch": 344} {"train_loss": -19.12796401977539, "global_step": 28625, "epoch": 344} {"train_loss": -18.6573429107666, "global_step": 28626, "epoch": 344} {"train_loss": -18.546663284301758, "global_step": 28627, "epoch": 344} {"train_loss": -19.15215492248535, "global_step": 28628, "epoch": 344} {"train_loss": -18.86553955078125, "global_step": 28629, "epoch": 344} {"train_loss": -18.804628372192383, "global_step": 28630, "epoch": 344} {"train_loss": -18.835174560546875, "global_step": 28631, "epoch": 344} {"train_loss": -19.115171432495117, "global_step": 28632, "epoch": 344} {"train_loss": -18.82723045349121, "global_step": 28633, "epoch": 344} {"train_loss": -18.841978348881366, "global_step": 28634, "epoch": 344, "val_loss": 6010789.0} {"train_loss": -18.985544204711914, "global_step": 28635, "epoch": 345} {"train_loss": -18.561315536499023, "global_step": 28636, "epoch": 345} {"train_loss": -18.616756439208984, "global_step": 28637, "epoch": 345} {"train_loss": -18.867202758789062, "global_step": 28638, "epoch": 345} {"train_loss": -18.904279708862305, "global_step": 28639, "epoch": 345} {"train_loss": -18.75345230102539, "global_step": 28640, "epoch": 345} {"train_loss": -18.89837074279785, "global_step": 28641, "epoch": 345} {"train_loss": -18.5588436126709, "global_step": 28642, "epoch": 345} {"train_loss": -18.928272247314453, "global_step": 28643, "epoch": 345} {"train_loss": -18.67559242248535, "global_step": 28644, "epoch": 345} {"train_loss": -18.608657836914062, "global_step": 28645, "epoch": 345} {"train_loss": -18.412607192993164, "global_step": 28646, "epoch": 345} {"train_loss": -18.921499252319336, "global_step": 28647, "epoch": 345} {"train_loss": -19.059688568115234, "global_step": 28648, "epoch": 345} {"train_loss": -18.896326065063477, "global_step": 28649, "epoch": 345} {"train_loss": -18.97170639038086, "global_step": 28650, "epoch": 345} {"train_loss": -18.748327255249023, "global_step": 28651, "epoch": 345} {"train_loss": -18.41021728515625, "global_step": 28652, "epoch": 345} {"train_loss": -18.534687042236328, "global_step": 28653, "epoch": 345} {"train_loss": -19.25091552734375, "global_step": 28654, "epoch": 345} {"train_loss": -18.72426414489746, "global_step": 28655, "epoch": 345} {"train_loss": -18.69712257385254, "global_step": 28656, "epoch": 345} {"train_loss": -18.75676918029785, "global_step": 28657, "epoch": 345} {"train_loss": -18.963891983032227, "global_step": 28658, "epoch": 345} {"train_loss": -18.731311798095703, "global_step": 28659, "epoch": 345} {"train_loss": -18.852872848510742, "global_step": 28660, "epoch": 345} {"train_loss": -18.955419540405273, "global_step": 28661, "epoch": 345} {"train_loss": -18.77019691467285, "global_step": 28662, "epoch": 345} {"train_loss": -18.705188751220703, "global_step": 28663, "epoch": 345} {"train_loss": -18.95511817932129, "global_step": 28664, "epoch": 345} {"train_loss": -18.90944480895996, "global_step": 28665, "epoch": 345} {"train_loss": -18.833494186401367, "global_step": 28666, "epoch": 345} {"train_loss": -18.719919204711914, "global_step": 28667, "epoch": 345} {"train_loss": -18.486318588256836, "global_step": 28668, "epoch": 345} {"train_loss": -19.016000747680664, "global_step": 28669, "epoch": 345} {"train_loss": -18.467899322509766, "global_step": 28670, "epoch": 345} {"train_loss": -18.658103942871094, "global_step": 28671, "epoch": 345} {"train_loss": -18.80776023864746, "global_step": 28672, "epoch": 345} {"train_loss": -19.06448745727539, "global_step": 28673, "epoch": 345} {"train_loss": -19.191007614135742, "global_step": 28674, "epoch": 345} {"train_loss": -19.0743465423584, "global_step": 28675, "epoch": 345} {"train_loss": -19.006526947021484, "global_step": 28676, "epoch": 345} {"train_loss": -18.67072105407715, "global_step": 28677, "epoch": 345} {"train_loss": -18.619205474853516, "global_step": 28678, "epoch": 345} {"train_loss": -19.054914474487305, "global_step": 28679, "epoch": 345} {"train_loss": -19.061290740966797, "global_step": 28680, "epoch": 345} {"train_loss": -18.916030883789062, "global_step": 28681, "epoch": 345} {"train_loss": -18.938047409057617, "global_step": 28682, "epoch": 345} {"train_loss": -18.823331832885742, "global_step": 28683, "epoch": 345} {"train_loss": -18.889793395996094, "global_step": 28684, "epoch": 345} {"train_loss": -18.701221466064453, "global_step": 28685, "epoch": 345} {"train_loss": -19.02512550354004, "global_step": 28686, "epoch": 345} {"train_loss": -19.0700740814209, "global_step": 28687, "epoch": 345} {"train_loss": -18.993637084960938, "global_step": 28688, "epoch": 345} {"train_loss": -18.913442611694336, "global_step": 28689, "epoch": 345} {"train_loss": -18.349609375, "global_step": 28690, "epoch": 345} {"train_loss": -18.73069190979004, "global_step": 28691, "epoch": 345} {"train_loss": -18.813474655151367, "global_step": 28692, "epoch": 345} {"train_loss": -18.97307014465332, "global_step": 28693, "epoch": 345} {"train_loss": -18.919260025024414, "global_step": 28694, "epoch": 345} {"train_loss": -18.92821502685547, "global_step": 28695, "epoch": 345} {"train_loss": -18.903602600097656, "global_step": 28696, "epoch": 345} {"train_loss": -19.039350509643555, "global_step": 28697, "epoch": 345} {"train_loss": -19.05403709411621, "global_step": 28698, "epoch": 345} {"train_loss": -18.674379348754883, "global_step": 28699, "epoch": 345} {"train_loss": -18.919485092163086, "global_step": 28700, "epoch": 345} {"train_loss": -18.823638916015625, "global_step": 28701, "epoch": 345} {"train_loss": -19.174039840698242, "global_step": 28702, "epoch": 345} {"train_loss": -18.891597747802734, "global_step": 28703, "epoch": 345} {"train_loss": -18.723026275634766, "global_step": 28704, "epoch": 345} {"train_loss": -18.868112564086914, "global_step": 28705, "epoch": 345} {"train_loss": -18.45454216003418, "global_step": 28706, "epoch": 345} {"train_loss": -18.702131271362305, "global_step": 28707, "epoch": 345} {"train_loss": -18.862598419189453, "global_step": 28708, "epoch": 345} {"train_loss": -18.84423828125, "global_step": 28709, "epoch": 345} {"train_loss": -18.926624298095703, "global_step": 28710, "epoch": 345} {"train_loss": -19.293596267700195, "global_step": 28711, "epoch": 345} {"train_loss": -19.015932083129883, "global_step": 28712, "epoch": 345} {"train_loss": -18.647245407104492, "global_step": 28713, "epoch": 345} {"train_loss": -19.124448776245117, "global_step": 28714, "epoch": 345} {"train_loss": -18.96237564086914, "global_step": 28715, "epoch": 345} {"train_loss": -18.705060958862305, "global_step": 28716, "epoch": 345} {"train_loss": -18.856466431215583, "global_step": 28717, "epoch": 345, "val_loss": 5861233.0} {"train_loss": -18.587188720703125, "global_step": 28718, "epoch": 346} {"train_loss": -18.519287109375, "global_step": 28719, "epoch": 346} {"train_loss": -18.537216186523438, "global_step": 28720, "epoch": 346} {"train_loss": -18.417911529541016, "global_step": 28721, "epoch": 346} {"train_loss": -18.78708267211914, "global_step": 28722, "epoch": 346} {"train_loss": -18.650524139404297, "global_step": 28723, "epoch": 346} {"train_loss": -18.488603591918945, "global_step": 28724, "epoch": 346} {"train_loss": -18.66645622253418, "global_step": 28725, "epoch": 346} {"train_loss": -18.570383071899414, "global_step": 28726, "epoch": 346} {"train_loss": -18.69270896911621, "global_step": 28727, "epoch": 346} {"train_loss": -19.203418731689453, "global_step": 28728, "epoch": 346} {"train_loss": -18.639896392822266, "global_step": 28729, "epoch": 346} {"train_loss": -18.684555053710938, "global_step": 28730, "epoch": 346} {"train_loss": -19.128023147583008, "global_step": 28731, "epoch": 346} {"train_loss": -19.050167083740234, "global_step": 28732, "epoch": 346} {"train_loss": -18.575353622436523, "global_step": 28733, "epoch": 346} {"train_loss": -18.981769561767578, "global_step": 28734, "epoch": 346} {"train_loss": -18.786985397338867, "global_step": 28735, "epoch": 346} {"train_loss": -18.72126579284668, "global_step": 28736, "epoch": 346} {"train_loss": -19.037485122680664, "global_step": 28737, "epoch": 346} {"train_loss": -18.90887451171875, "global_step": 28738, "epoch": 346} {"train_loss": -19.170785903930664, "global_step": 28739, "epoch": 346} {"train_loss": -18.820255279541016, "global_step": 28740, "epoch": 346} {"train_loss": -18.615060806274414, "global_step": 28741, "epoch": 346} {"train_loss": -18.986684799194336, "global_step": 28742, "epoch": 346} {"train_loss": -19.225893020629883, "global_step": 28743, "epoch": 346} {"train_loss": -18.700841903686523, "global_step": 28744, "epoch": 346} {"train_loss": -19.13312339782715, "global_step": 28745, "epoch": 346} {"train_loss": -19.118497848510742, "global_step": 28746, "epoch": 346} {"train_loss": -18.83646583557129, "global_step": 28747, "epoch": 346} {"train_loss": -18.786903381347656, "global_step": 28748, "epoch": 346} {"train_loss": -19.175722122192383, "global_step": 28749, "epoch": 346} {"train_loss": -18.461181640625, "global_step": 28750, "epoch": 346} {"train_loss": -18.60450553894043, "global_step": 28751, "epoch": 346} {"train_loss": -18.9838924407959, "global_step": 28752, "epoch": 346} {"train_loss": -18.897151947021484, "global_step": 28753, "epoch": 346} {"train_loss": -18.670703887939453, "global_step": 28754, "epoch": 346} {"train_loss": -19.118534088134766, "global_step": 28755, "epoch": 346} {"train_loss": -18.750118255615234, "global_step": 28756, "epoch": 346} {"train_loss": -18.762609481811523, "global_step": 28757, "epoch": 346} {"train_loss": -19.075281143188477, "global_step": 28758, "epoch": 346} {"train_loss": -18.928621292114258, "global_step": 28759, "epoch": 346} {"train_loss": -19.156225204467773, "global_step": 28760, "epoch": 346} {"train_loss": -18.786436080932617, "global_step": 28761, "epoch": 346} {"train_loss": -18.801727294921875, "global_step": 28762, "epoch": 346} {"train_loss": -18.832143783569336, "global_step": 28763, "epoch": 346} {"train_loss": -18.749433517456055, "global_step": 28764, "epoch": 346} {"train_loss": -19.280960083007812, "global_step": 28765, "epoch": 346} {"train_loss": -18.77557945251465, "global_step": 28766, "epoch": 346} {"train_loss": -18.80793571472168, "global_step": 28767, "epoch": 346} {"train_loss": -18.799474716186523, "global_step": 28768, "epoch": 346} {"train_loss": -19.116928100585938, "global_step": 28769, "epoch": 346} {"train_loss": -18.877622604370117, "global_step": 28770, "epoch": 346} {"train_loss": -18.697751998901367, "global_step": 28771, "epoch": 346} {"train_loss": -18.98737907409668, "global_step": 28772, "epoch": 346} {"train_loss": -18.527137756347656, "global_step": 28773, "epoch": 346} {"train_loss": -19.021591186523438, "global_step": 28774, "epoch": 346} {"train_loss": -18.828393936157227, "global_step": 28775, "epoch": 346} {"train_loss": -18.47455406188965, "global_step": 28776, "epoch": 346} {"train_loss": -18.592586517333984, "global_step": 28777, "epoch": 346} {"train_loss": -18.85273551940918, "global_step": 28778, "epoch": 346} {"train_loss": -18.616849899291992, "global_step": 28779, "epoch": 346} {"train_loss": -18.747648239135742, "global_step": 28780, "epoch": 346} {"train_loss": -19.049551010131836, "global_step": 28781, "epoch": 346} {"train_loss": -18.884784698486328, "global_step": 28782, "epoch": 346} {"train_loss": -18.82171058654785, "global_step": 28783, "epoch": 346} {"train_loss": -18.81831169128418, "global_step": 28784, "epoch": 346} {"train_loss": -18.381757736206055, "global_step": 28785, "epoch": 346} {"train_loss": -18.8449649810791, "global_step": 28786, "epoch": 346} {"train_loss": -18.650739669799805, "global_step": 28787, "epoch": 346} {"train_loss": -19.152603149414062, "global_step": 28788, "epoch": 346} {"train_loss": -19.015043258666992, "global_step": 28789, "epoch": 346} {"train_loss": -18.94391441345215, "global_step": 28790, "epoch": 346} {"train_loss": -19.55417251586914, "global_step": 28791, "epoch": 346} {"train_loss": -19.2867488861084, "global_step": 28792, "epoch": 346} {"train_loss": -19.037092208862305, "global_step": 28793, "epoch": 346} {"train_loss": -18.826147079467773, "global_step": 28794, "epoch": 346} {"train_loss": -19.10808753967285, "global_step": 28795, "epoch": 346} {"train_loss": -19.010427474975586, "global_step": 28796, "epoch": 346} {"train_loss": -19.093820571899414, "global_step": 28797, "epoch": 346} {"train_loss": -19.125574111938477, "global_step": 28798, "epoch": 346} {"train_loss": -18.528553009033203, "global_step": 28799, "epoch": 346} {"train_loss": -18.85070187212473, "global_step": 28800, "epoch": 346, "val_loss": 6103717.5} {"train_loss": -18.14862060546875, "global_step": 28801, "epoch": 347} {"train_loss": -18.481903076171875, "global_step": 28802, "epoch": 347} {"train_loss": -18.727792739868164, "global_step": 28803, "epoch": 347} {"train_loss": -18.53644371032715, "global_step": 28804, "epoch": 347} {"train_loss": -18.346281051635742, "global_step": 28805, "epoch": 347} {"train_loss": -18.661453247070312, "global_step": 28806, "epoch": 347} {"train_loss": -18.560789108276367, "global_step": 28807, "epoch": 347} {"train_loss": -18.757583618164062, "global_step": 28808, "epoch": 347} {"train_loss": -18.772397994995117, "global_step": 28809, "epoch": 347} {"train_loss": -18.819910049438477, "global_step": 28810, "epoch": 347} {"train_loss": -18.416519165039062, "global_step": 28811, "epoch": 347} {"train_loss": -18.71959114074707, "global_step": 28812, "epoch": 347} {"train_loss": -18.468202590942383, "global_step": 28813, "epoch": 347} {"train_loss": -18.610170364379883, "global_step": 28814, "epoch": 347} {"train_loss": -18.687902450561523, "global_step": 28815, "epoch": 347} {"train_loss": -18.89670753479004, "global_step": 28816, "epoch": 347} {"train_loss": -18.680410385131836, "global_step": 28817, "epoch": 347} {"train_loss": -18.54048728942871, "global_step": 28818, "epoch": 347} {"train_loss": -18.460851669311523, "global_step": 28819, "epoch": 347} {"train_loss": -18.87910270690918, "global_step": 28820, "epoch": 347} {"train_loss": -18.494436264038086, "global_step": 28821, "epoch": 347} {"train_loss": -18.66583824157715, "global_step": 28822, "epoch": 347} {"train_loss": -18.862396240234375, "global_step": 28823, "epoch": 347} {"train_loss": -18.94464683532715, "global_step": 28824, "epoch": 347} {"train_loss": -19.217466354370117, "global_step": 28825, "epoch": 347} {"train_loss": -18.705602645874023, "global_step": 28826, "epoch": 347} {"train_loss": -18.670875549316406, "global_step": 28827, "epoch": 347} {"train_loss": -19.29233169555664, "global_step": 28828, "epoch": 347} {"train_loss": -18.796598434448242, "global_step": 28829, "epoch": 347} {"train_loss": -18.99017906188965, "global_step": 28830, "epoch": 347} {"train_loss": -18.796363830566406, "global_step": 28831, "epoch": 347} {"train_loss": -19.014883041381836, "global_step": 28832, "epoch": 347} {"train_loss": -18.72474479675293, "global_step": 28833, "epoch": 347} {"train_loss": -19.250593185424805, "global_step": 28834, "epoch": 347} {"train_loss": -18.692190170288086, "global_step": 28835, "epoch": 347} {"train_loss": -18.821762084960938, "global_step": 28836, "epoch": 347} {"train_loss": -19.059656143188477, "global_step": 28837, "epoch": 347} {"train_loss": -18.719989776611328, "global_step": 28838, "epoch": 347} {"train_loss": -19.086294174194336, "global_step": 28839, "epoch": 347} {"train_loss": -18.8416690826416, "global_step": 28840, "epoch": 347} {"train_loss": -19.00737953186035, "global_step": 28841, "epoch": 347} {"train_loss": -18.7843074798584, "global_step": 28842, "epoch": 347} {"train_loss": -18.55645751953125, "global_step": 28843, "epoch": 347} {"train_loss": -19.058195114135742, "global_step": 28844, "epoch": 347} {"train_loss": -18.965076446533203, "global_step": 28845, "epoch": 347} {"train_loss": -18.90040397644043, "global_step": 28846, "epoch": 347} {"train_loss": -19.057296752929688, "global_step": 28847, "epoch": 347} {"train_loss": -18.97488784790039, "global_step": 28848, "epoch": 347} {"train_loss": -19.050901412963867, "global_step": 28849, "epoch": 347} {"train_loss": -19.042144775390625, "global_step": 28850, "epoch": 347} {"train_loss": -18.819849014282227, "global_step": 28851, "epoch": 347} {"train_loss": -19.09202766418457, "global_step": 28852, "epoch": 347} {"train_loss": -18.585681915283203, "global_step": 28853, "epoch": 347} {"train_loss": -19.083044052124023, "global_step": 28854, "epoch": 347} {"train_loss": -18.774072647094727, "global_step": 28855, "epoch": 347} {"train_loss": -18.727781295776367, "global_step": 28856, "epoch": 347} {"train_loss": -19.135068893432617, "global_step": 28857, "epoch": 347} {"train_loss": -19.142990112304688, "global_step": 28858, "epoch": 347} {"train_loss": -19.028079986572266, "global_step": 28859, "epoch": 347} {"train_loss": -18.988990783691406, "global_step": 28860, "epoch": 347} {"train_loss": -18.872236251831055, "global_step": 28861, "epoch": 347} {"train_loss": -18.767230987548828, "global_step": 28862, "epoch": 347} {"train_loss": -19.08841323852539, "global_step": 28863, "epoch": 347} {"train_loss": -18.695968627929688, "global_step": 28864, "epoch": 347} {"train_loss": -18.970630645751953, "global_step": 28865, "epoch": 347} {"train_loss": -18.4774112701416, "global_step": 28866, "epoch": 347} {"train_loss": -18.052841186523438, "global_step": 28867, "epoch": 347} {"train_loss": -19.078100204467773, "global_step": 28868, "epoch": 347} {"train_loss": -19.03838348388672, "global_step": 28869, "epoch": 347} {"train_loss": -19.005308151245117, "global_step": 28870, "epoch": 347} {"train_loss": -18.86172103881836, "global_step": 28871, "epoch": 347} {"train_loss": -18.771486282348633, "global_step": 28872, "epoch": 347} {"train_loss": -19.054853439331055, "global_step": 28873, "epoch": 347} {"train_loss": -18.730222702026367, "global_step": 28874, "epoch": 347} {"train_loss": -18.546085357666016, "global_step": 28875, "epoch": 347} {"train_loss": -18.983245849609375, "global_step": 28876, "epoch": 347} {"train_loss": -18.97865104675293, "global_step": 28877, "epoch": 347} {"train_loss": -18.717853546142578, "global_step": 28878, "epoch": 347} {"train_loss": -18.71504020690918, "global_step": 28879, "epoch": 347} {"train_loss": -18.6806640625, "global_step": 28880, "epoch": 347} {"train_loss": -18.735198974609375, "global_step": 28881, "epoch": 347} {"train_loss": -18.462818145751953, "global_step": 28882, "epoch": 347} {"train_loss": -18.81691006580031, "global_step": 28883, "epoch": 347, "val_loss": 5988946.0} {"train_loss": -18.70513343811035, "global_step": 28884, "epoch": 348} {"train_loss": -19.041208267211914, "global_step": 28885, "epoch": 348} {"train_loss": -18.98136329650879, "global_step": 28886, "epoch": 348} {"train_loss": -18.77918243408203, "global_step": 28887, "epoch": 348} {"train_loss": -18.7867488861084, "global_step": 28888, "epoch": 348} {"train_loss": -18.708093643188477, "global_step": 28889, "epoch": 348} {"train_loss": -19.098569869995117, "global_step": 28890, "epoch": 348} {"train_loss": -19.00050163269043, "global_step": 28891, "epoch": 348} {"train_loss": -18.943735122680664, "global_step": 28892, "epoch": 348} {"train_loss": -18.149770736694336, "global_step": 28893, "epoch": 348} {"train_loss": -18.82435417175293, "global_step": 28894, "epoch": 348} {"train_loss": -19.161436080932617, "global_step": 28895, "epoch": 348} {"train_loss": -18.511274337768555, "global_step": 28896, "epoch": 348} {"train_loss": -18.74093246459961, "global_step": 28897, "epoch": 348} {"train_loss": -18.7096004486084, "global_step": 28898, "epoch": 348} {"train_loss": -18.926313400268555, "global_step": 28899, "epoch": 348} {"train_loss": -19.009449005126953, "global_step": 28900, "epoch": 348} {"train_loss": -18.98174476623535, "global_step": 28901, "epoch": 348} {"train_loss": -19.04545021057129, "global_step": 28902, "epoch": 348} {"train_loss": -19.147138595581055, "global_step": 28903, "epoch": 348} {"train_loss": -18.54891014099121, "global_step": 28904, "epoch": 348} {"train_loss": -18.915273666381836, "global_step": 28905, "epoch": 348} {"train_loss": -18.6740779876709, "global_step": 28906, "epoch": 348} {"train_loss": -18.63077163696289, "global_step": 28907, "epoch": 348} {"train_loss": -18.936023712158203, "global_step": 28908, "epoch": 348} {"train_loss": -19.000425338745117, "global_step": 28909, "epoch": 348} {"train_loss": -18.50257110595703, "global_step": 28910, "epoch": 348} {"train_loss": -18.685245513916016, "global_step": 28911, "epoch": 348} {"train_loss": -18.731523513793945, "global_step": 28912, "epoch": 348} {"train_loss": -19.119922637939453, "global_step": 28913, "epoch": 348} {"train_loss": -19.192434310913086, "global_step": 28914, "epoch": 348} {"train_loss": -18.977914810180664, "global_step": 28915, "epoch": 348} {"train_loss": -18.99189567565918, "global_step": 28916, "epoch": 348} {"train_loss": -19.153316497802734, "global_step": 28917, "epoch": 348} {"train_loss": -19.322778701782227, "global_step": 28918, "epoch": 348} {"train_loss": -19.380163192749023, "global_step": 28919, "epoch": 348} {"train_loss": -19.14564323425293, "global_step": 28920, "epoch": 348} {"train_loss": -19.303028106689453, "global_step": 28921, "epoch": 348} {"train_loss": -18.936464309692383, "global_step": 28922, "epoch": 348} {"train_loss": -18.768280029296875, "global_step": 28923, "epoch": 348} {"train_loss": -18.8795166015625, "global_step": 28924, "epoch": 348} {"train_loss": -18.852903366088867, "global_step": 28925, "epoch": 348} {"train_loss": -18.820724487304688, "global_step": 28926, "epoch": 348} {"train_loss": -18.733192443847656, "global_step": 28927, "epoch": 348} {"train_loss": -18.8455867767334, "global_step": 28928, "epoch": 348} {"train_loss": -19.1154727935791, "global_step": 28929, "epoch": 348} {"train_loss": -18.4578914642334, "global_step": 28930, "epoch": 348} {"train_loss": -18.931365966796875, "global_step": 28931, "epoch": 348} {"train_loss": -19.260177612304688, "global_step": 28932, "epoch": 348} {"train_loss": -19.14536476135254, "global_step": 28933, "epoch": 348} {"train_loss": -19.37733268737793, "global_step": 28934, "epoch": 348} {"train_loss": -18.911001205444336, "global_step": 28935, "epoch": 348} {"train_loss": -18.931110382080078, "global_step": 28936, "epoch": 348} {"train_loss": -18.87013053894043, "global_step": 28937, "epoch": 348} {"train_loss": -19.086353302001953, "global_step": 28938, "epoch": 348} {"train_loss": -19.32588005065918, "global_step": 28939, "epoch": 348} {"train_loss": -19.08380889892578, "global_step": 28940, "epoch": 348} {"train_loss": -18.967336654663086, "global_step": 28941, "epoch": 348} {"train_loss": -18.732194900512695, "global_step": 28942, "epoch": 348} {"train_loss": -18.75480079650879, "global_step": 28943, "epoch": 348} {"train_loss": -18.77137565612793, "global_step": 28944, "epoch": 348} {"train_loss": -18.866130828857422, "global_step": 28945, "epoch": 348} {"train_loss": -19.358701705932617, "global_step": 28946, "epoch": 348} {"train_loss": -18.96923828125, "global_step": 28947, "epoch": 348} {"train_loss": -18.810178756713867, "global_step": 28948, "epoch": 348} {"train_loss": -19.17111587524414, "global_step": 28949, "epoch": 348} {"train_loss": -18.71310043334961, "global_step": 28950, "epoch": 348} {"train_loss": -18.915307998657227, "global_step": 28951, "epoch": 348} {"train_loss": -18.75868034362793, "global_step": 28952, "epoch": 348} {"train_loss": -18.74074363708496, "global_step": 28953, "epoch": 348} {"train_loss": -18.63944435119629, "global_step": 28954, "epoch": 348} {"train_loss": -18.87155532836914, "global_step": 28955, "epoch": 348} {"train_loss": -18.694351196289062, "global_step": 28956, "epoch": 348} {"train_loss": -18.715377807617188, "global_step": 28957, "epoch": 348} {"train_loss": -18.399656295776367, "global_step": 28958, "epoch": 348} {"train_loss": -18.806257247924805, "global_step": 28959, "epoch": 348} {"train_loss": -18.39048194885254, "global_step": 28960, "epoch": 348} {"train_loss": -18.67298126220703, "global_step": 28961, "epoch": 348} {"train_loss": -18.953590393066406, "global_step": 28962, "epoch": 348} {"train_loss": -18.71847152709961, "global_step": 28963, "epoch": 348} {"train_loss": -19.09187126159668, "global_step": 28964, "epoch": 348} {"train_loss": -18.948373794555664, "global_step": 28965, "epoch": 348} {"train_loss": -18.902020419936584, "global_step": 28966, "epoch": 348, "val_loss": 5969677.5} {"train_loss": -18.61744499206543, "global_step": 28967, "epoch": 349} {"train_loss": -18.724660873413086, "global_step": 28968, "epoch": 349} {"train_loss": -18.620275497436523, "global_step": 28969, "epoch": 349} {"train_loss": -18.95754051208496, "global_step": 28970, "epoch": 349} {"train_loss": -19.124074935913086, "global_step": 28971, "epoch": 349} {"train_loss": -18.76821517944336, "global_step": 28972, "epoch": 349} {"train_loss": -18.463245391845703, "global_step": 28973, "epoch": 349} {"train_loss": -18.73708152770996, "global_step": 28974, "epoch": 349} {"train_loss": -18.98697280883789, "global_step": 28975, "epoch": 349} {"train_loss": -18.653417587280273, "global_step": 28976, "epoch": 349} {"train_loss": -18.680545806884766, "global_step": 28977, "epoch": 349} {"train_loss": -18.604721069335938, "global_step": 28978, "epoch": 349} {"train_loss": -18.732025146484375, "global_step": 28979, "epoch": 349} {"train_loss": -18.853532791137695, "global_step": 28980, "epoch": 349} {"train_loss": -18.766950607299805, "global_step": 28981, "epoch": 349} {"train_loss": -18.83795738220215, "global_step": 28982, "epoch": 349} {"train_loss": -18.91937828063965, "global_step": 28983, "epoch": 349} {"train_loss": -18.760513305664062, "global_step": 28984, "epoch": 349} {"train_loss": -19.025527954101562, "global_step": 28985, "epoch": 349} {"train_loss": -18.94349479675293, "global_step": 28986, "epoch": 349} {"train_loss": -19.03757095336914, "global_step": 28987, "epoch": 349} {"train_loss": -18.594554901123047, "global_step": 28988, "epoch": 349} {"train_loss": -18.859785079956055, "global_step": 28989, "epoch": 349} {"train_loss": -18.796186447143555, "global_step": 28990, "epoch": 349} {"train_loss": -18.64523696899414, "global_step": 28991, "epoch": 349} {"train_loss": -19.097944259643555, "global_step": 28992, "epoch": 349} {"train_loss": -18.507566452026367, "global_step": 28993, "epoch": 349} {"train_loss": -18.52939224243164, "global_step": 28994, "epoch": 349} {"train_loss": -19.328201293945312, "global_step": 28995, "epoch": 349} {"train_loss": -18.9833927154541, "global_step": 28996, "epoch": 349} {"train_loss": -19.149219512939453, "global_step": 28997, "epoch": 349} {"train_loss": -18.681364059448242, "global_step": 28998, "epoch": 349} {"train_loss": -19.066299438476562, "global_step": 28999, "epoch": 349} {"train_loss": -19.261823654174805, "global_step": 29000, "epoch": 349} {"train_loss": -19.06218147277832, "global_step": 29001, "epoch": 349} {"train_loss": -18.849313735961914, "global_step": 29002, "epoch": 349} {"train_loss": -18.85550880432129, "global_step": 29003, "epoch": 349} {"train_loss": -19.311098098754883, "global_step": 29004, "epoch": 349} {"train_loss": -19.197843551635742, "global_step": 29005, "epoch": 349} {"train_loss": -18.809833526611328, "global_step": 29006, "epoch": 349} {"train_loss": -18.862892150878906, "global_step": 29007, "epoch": 349} {"train_loss": -18.987173080444336, "global_step": 29008, "epoch": 349} {"train_loss": -18.769535064697266, "global_step": 29009, "epoch": 349} {"train_loss": -19.118289947509766, "global_step": 29010, "epoch": 349} {"train_loss": -18.62689781188965, "global_step": 29011, "epoch": 349} {"train_loss": -18.720022201538086, "global_step": 29012, "epoch": 349} {"train_loss": -18.89728355407715, "global_step": 29013, "epoch": 349} {"train_loss": -18.80093002319336, "global_step": 29014, "epoch": 349} {"train_loss": -18.58475112915039, "global_step": 29015, "epoch": 349} {"train_loss": -19.139863967895508, "global_step": 29016, "epoch": 349} {"train_loss": -19.037805557250977, "global_step": 29017, "epoch": 349} {"train_loss": -19.235380172729492, "global_step": 29018, "epoch": 349} {"train_loss": -18.901805877685547, "global_step": 29019, "epoch": 349} {"train_loss": -19.078556060791016, "global_step": 29020, "epoch": 349} {"train_loss": -19.19173812866211, "global_step": 29021, "epoch": 349} {"train_loss": -19.20680046081543, "global_step": 29022, "epoch": 349} {"train_loss": -19.0767879486084, "global_step": 29023, "epoch": 349} {"train_loss": -19.374094009399414, "global_step": 29024, "epoch": 349} {"train_loss": -19.244836807250977, "global_step": 29025, "epoch": 349} {"train_loss": -18.97475242614746, "global_step": 29026, "epoch": 349} {"train_loss": -18.823169708251953, "global_step": 29027, "epoch": 349} {"train_loss": -18.63576316833496, "global_step": 29028, "epoch": 349} {"train_loss": -18.76595115661621, "global_step": 29029, "epoch": 349} {"train_loss": -18.694562911987305, "global_step": 29030, "epoch": 349} {"train_loss": -18.798933029174805, "global_step": 29031, "epoch": 349} {"train_loss": -18.779050827026367, "global_step": 29032, "epoch": 349} {"train_loss": -19.06524658203125, "global_step": 29033, "epoch": 349} {"train_loss": -19.025426864624023, "global_step": 29034, "epoch": 349} {"train_loss": -18.674060821533203, "global_step": 29035, "epoch": 349} {"train_loss": -19.204940795898438, "global_step": 29036, "epoch": 349} {"train_loss": -18.948637008666992, "global_step": 29037, "epoch": 349} {"train_loss": -19.031314849853516, "global_step": 29038, "epoch": 349} {"train_loss": -18.888572692871094, "global_step": 29039, "epoch": 349} {"train_loss": -18.967296600341797, "global_step": 29040, "epoch": 349} {"train_loss": -19.04835319519043, "global_step": 29041, "epoch": 349} {"train_loss": -18.748620986938477, "global_step": 29042, "epoch": 349} {"train_loss": -18.893115997314453, "global_step": 29043, "epoch": 349} {"train_loss": -18.84978485107422, "global_step": 29044, "epoch": 349} {"train_loss": -18.755338668823242, "global_step": 29045, "epoch": 349} {"train_loss": -19.12173843383789, "global_step": 29046, "epoch": 349} {"train_loss": -18.770709991455078, "global_step": 29047, "epoch": 349} {"train_loss": -18.718908309936523, "global_step": 29048, "epoch": 349} {"train_loss": -18.882761736950243, "global_step": 29049, "epoch": 349, "val_loss": 5920908.0} {"train_loss": -19.1059627532959, "global_step": 29050, "epoch": 350} {"train_loss": -18.44483757019043, "global_step": 29051, "epoch": 350} {"train_loss": -19.009469985961914, "global_step": 29052, "epoch": 350} {"train_loss": -18.50465965270996, "global_step": 29053, "epoch": 350} {"train_loss": -19.0305233001709, "global_step": 29054, "epoch": 350} {"train_loss": -18.689443588256836, "global_step": 29055, "epoch": 350} {"train_loss": -18.563344955444336, "global_step": 29056, "epoch": 350} {"train_loss": -18.474323272705078, "global_step": 29057, "epoch": 350} {"train_loss": -18.845184326171875, "global_step": 29058, "epoch": 350} {"train_loss": -18.734983444213867, "global_step": 29059, "epoch": 350} {"train_loss": -19.041955947875977, "global_step": 29060, "epoch": 350} {"train_loss": -19.12554359436035, "global_step": 29061, "epoch": 350} {"train_loss": -19.156641006469727, "global_step": 29062, "epoch": 350} {"train_loss": -18.95759391784668, "global_step": 29063, "epoch": 350} {"train_loss": -18.59153175354004, "global_step": 29064, "epoch": 350} {"train_loss": -19.232397079467773, "global_step": 29065, "epoch": 350} {"train_loss": -18.57280921936035, "global_step": 29066, "epoch": 350} {"train_loss": -18.373964309692383, "global_step": 29067, "epoch": 350} {"train_loss": -18.974010467529297, "global_step": 29068, "epoch": 350} {"train_loss": -18.785219192504883, "global_step": 29069, "epoch": 350} {"train_loss": -19.125511169433594, "global_step": 29070, "epoch": 350} {"train_loss": -18.975278854370117, "global_step": 29071, "epoch": 350} {"train_loss": -19.10052490234375, "global_step": 29072, "epoch": 350} {"train_loss": -18.660343170166016, "global_step": 29073, "epoch": 350} {"train_loss": -18.866718292236328, "global_step": 29074, "epoch": 350} {"train_loss": -18.84158706665039, "global_step": 29075, "epoch": 350} {"train_loss": -18.90813636779785, "global_step": 29076, "epoch": 350} {"train_loss": -19.378965377807617, "global_step": 29077, "epoch": 350} {"train_loss": -18.70374870300293, "global_step": 29078, "epoch": 350} {"train_loss": -18.92302894592285, "global_step": 29079, "epoch": 350} {"train_loss": -18.97623634338379, "global_step": 29080, "epoch": 350} {"train_loss": -18.730051040649414, "global_step": 29081, "epoch": 350} {"train_loss": -18.861661911010742, "global_step": 29082, "epoch": 350} {"train_loss": -18.9185791015625, "global_step": 29083, "epoch": 350} {"train_loss": -19.35886573791504, "global_step": 29084, "epoch": 350} {"train_loss": -19.0273494720459, "global_step": 29085, "epoch": 350} {"train_loss": -19.137317657470703, "global_step": 29086, "epoch": 350} {"train_loss": -18.877857208251953, "global_step": 29087, "epoch": 350} {"train_loss": -18.731969833374023, "global_step": 29088, "epoch": 350} {"train_loss": -18.690792083740234, "global_step": 29089, "epoch": 350} {"train_loss": -19.12839698791504, "global_step": 29090, "epoch": 350} {"train_loss": -19.172374725341797, "global_step": 29091, "epoch": 350} {"train_loss": -18.926294326782227, "global_step": 29092, "epoch": 350} {"train_loss": -18.842227935791016, "global_step": 29093, "epoch": 350} {"train_loss": -19.09882926940918, "global_step": 29094, "epoch": 350} {"train_loss": -18.880903244018555, "global_step": 29095, "epoch": 350} {"train_loss": -19.104848861694336, "global_step": 29096, "epoch": 350} {"train_loss": -19.126501083374023, "global_step": 29097, "epoch": 350} {"train_loss": -19.0709171295166, "global_step": 29098, "epoch": 350} {"train_loss": -18.577054977416992, "global_step": 29099, "epoch": 350} {"train_loss": -18.965246200561523, "global_step": 29100, "epoch": 350} {"train_loss": -18.926794052124023, "global_step": 29101, "epoch": 350} {"train_loss": -18.92304039001465, "global_step": 29102, "epoch": 350} {"train_loss": -19.267581939697266, "global_step": 29103, "epoch": 350} {"train_loss": -19.150266647338867, "global_step": 29104, "epoch": 350} {"train_loss": -18.690542221069336, "global_step": 29105, "epoch": 350} {"train_loss": -19.03461265563965, "global_step": 29106, "epoch": 350} {"train_loss": -18.66458511352539, "global_step": 29107, "epoch": 350} {"train_loss": -18.677196502685547, "global_step": 29108, "epoch": 350} {"train_loss": -18.94636344909668, "global_step": 29109, "epoch": 350} {"train_loss": -18.62891387939453, "global_step": 29110, "epoch": 350} {"train_loss": -18.94070053100586, "global_step": 29111, "epoch": 350} {"train_loss": -18.628774642944336, "global_step": 29112, "epoch": 350} {"train_loss": -19.046451568603516, "global_step": 29113, "epoch": 350} {"train_loss": -19.023576736450195, "global_step": 29114, "epoch": 350} {"train_loss": -18.599857330322266, "global_step": 29115, "epoch": 350} {"train_loss": -18.924264907836914, "global_step": 29116, "epoch": 350} {"train_loss": -18.620677947998047, "global_step": 29117, "epoch": 350} {"train_loss": -18.941349029541016, "global_step": 29118, "epoch": 350} {"train_loss": -19.024763107299805, "global_step": 29119, "epoch": 350} {"train_loss": -18.874914169311523, "global_step": 29120, "epoch": 350} {"train_loss": -19.349685668945312, "global_step": 29121, "epoch": 350} {"train_loss": -18.66658592224121, "global_step": 29122, "epoch": 350} {"train_loss": -18.62725257873535, "global_step": 29123, "epoch": 350} {"train_loss": -18.98675537109375, "global_step": 29124, "epoch": 350} {"train_loss": -18.536773681640625, "global_step": 29125, "epoch": 350} {"train_loss": -18.743244171142578, "global_step": 29126, "epoch": 350} {"train_loss": -18.59095001220703, "global_step": 29127, "epoch": 350} {"train_loss": -18.804351806640625, "global_step": 29128, "epoch": 350} {"train_loss": -19.386459350585938, "global_step": 29129, "epoch": 350} {"train_loss": -18.971681594848633, "global_step": 29130, "epoch": 350} {"train_loss": -19.257474899291992, "global_step": 29131, "epoch": 350} {"train_loss": -18.8892707594906, "global_step": 29132, "epoch": 350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9545454545454546, "val_loss": 6054764.0} {"train_loss": -19.10989761352539, "global_step": 29133, "epoch": 351} {"train_loss": -18.903196334838867, "global_step": 29134, "epoch": 351} {"train_loss": -18.558753967285156, "global_step": 29135, "epoch": 351} {"train_loss": -18.644983291625977, "global_step": 29136, "epoch": 351} {"train_loss": -18.98175621032715, "global_step": 29137, "epoch": 351} {"train_loss": -18.5787353515625, "global_step": 29138, "epoch": 351} {"train_loss": -18.52109718322754, "global_step": 29139, "epoch": 351} {"train_loss": -18.704336166381836, "global_step": 29140, "epoch": 351} {"train_loss": -18.867347717285156, "global_step": 29141, "epoch": 351} {"train_loss": -18.50531578063965, "global_step": 29142, "epoch": 351} {"train_loss": -18.593637466430664, "global_step": 29143, "epoch": 351} {"train_loss": -18.7714900970459, "global_step": 29144, "epoch": 351} {"train_loss": -18.997791290283203, "global_step": 29145, "epoch": 351} {"train_loss": -18.982309341430664, "global_step": 29146, "epoch": 351} {"train_loss": -18.883649826049805, "global_step": 29147, "epoch": 351} {"train_loss": -18.906845092773438, "global_step": 29148, "epoch": 351} {"train_loss": -18.683727264404297, "global_step": 29149, "epoch": 351} {"train_loss": -18.717323303222656, "global_step": 29150, "epoch": 351} {"train_loss": -18.950578689575195, "global_step": 29151, "epoch": 351} {"train_loss": -18.730091094970703, "global_step": 29152, "epoch": 351} {"train_loss": -19.211973190307617, "global_step": 29153, "epoch": 351} {"train_loss": -18.958608627319336, "global_step": 29154, "epoch": 351} {"train_loss": -19.008024215698242, "global_step": 29155, "epoch": 351} {"train_loss": -18.860172271728516, "global_step": 29156, "epoch": 351} {"train_loss": -19.110197067260742, "global_step": 29157, "epoch": 351} {"train_loss": -18.69410514831543, "global_step": 29158, "epoch": 351} {"train_loss": -18.840951919555664, "global_step": 29159, "epoch": 351} {"train_loss": -19.00660514831543, "global_step": 29160, "epoch": 351} {"train_loss": -18.89747428894043, "global_step": 29161, "epoch": 351} {"train_loss": -18.69441032409668, "global_step": 29162, "epoch": 351} {"train_loss": -19.1656551361084, "global_step": 29163, "epoch": 351} {"train_loss": -19.074962615966797, "global_step": 29164, "epoch": 351} {"train_loss": -18.893301010131836, "global_step": 29165, "epoch": 351} {"train_loss": -19.133493423461914, "global_step": 29166, "epoch": 351} {"train_loss": -18.9984188079834, "global_step": 29167, "epoch": 351} {"train_loss": -19.102994918823242, "global_step": 29168, "epoch": 351} {"train_loss": -18.879138946533203, "global_step": 29169, "epoch": 351} {"train_loss": -18.534698486328125, "global_step": 29170, "epoch": 351} {"train_loss": -18.840925216674805, "global_step": 29171, "epoch": 351} {"train_loss": -19.287302017211914, "global_step": 29172, "epoch": 351} {"train_loss": -19.03792381286621, "global_step": 29173, "epoch": 351} {"train_loss": -18.9014892578125, "global_step": 29174, "epoch": 351} {"train_loss": -18.620935440063477, "global_step": 29175, "epoch": 351} {"train_loss": -19.110309600830078, "global_step": 29176, "epoch": 351} {"train_loss": -19.008867263793945, "global_step": 29177, "epoch": 351} {"train_loss": -18.601364135742188, "global_step": 29178, "epoch": 351} {"train_loss": -18.878416061401367, "global_step": 29179, "epoch": 351} {"train_loss": -18.67815399169922, "global_step": 29180, "epoch": 351} {"train_loss": -18.77118492126465, "global_step": 29181, "epoch": 351} {"train_loss": -18.78541374206543, "global_step": 29182, "epoch": 351} {"train_loss": -18.707935333251953, "global_step": 29183, "epoch": 351} {"train_loss": -18.721708297729492, "global_step": 29184, "epoch": 351} {"train_loss": -18.90921974182129, "global_step": 29185, "epoch": 351} {"train_loss": -18.4460391998291, "global_step": 29186, "epoch": 351} {"train_loss": -19.229799270629883, "global_step": 29187, "epoch": 351} {"train_loss": -18.881149291992188, "global_step": 29188, "epoch": 351} {"train_loss": -18.79693603515625, "global_step": 29189, "epoch": 351} {"train_loss": -18.659046173095703, "global_step": 29190, "epoch": 351} {"train_loss": -19.078372955322266, "global_step": 29191, "epoch": 351} {"train_loss": -19.023168563842773, "global_step": 29192, "epoch": 351} {"train_loss": -19.22649574279785, "global_step": 29193, "epoch": 351} {"train_loss": -18.780485153198242, "global_step": 29194, "epoch": 351} {"train_loss": -18.453214645385742, "global_step": 29195, "epoch": 351} {"train_loss": -18.811649322509766, "global_step": 29196, "epoch": 351} {"train_loss": -18.871313095092773, "global_step": 29197, "epoch": 351} {"train_loss": -18.85460662841797, "global_step": 29198, "epoch": 351} {"train_loss": -18.945974349975586, "global_step": 29199, "epoch": 351} {"train_loss": -18.595197677612305, "global_step": 29200, "epoch": 351} {"train_loss": -19.036378860473633, "global_step": 29201, "epoch": 351} {"train_loss": -19.025545120239258, "global_step": 29202, "epoch": 351} {"train_loss": -18.701208114624023, "global_step": 29203, "epoch": 351} {"train_loss": -18.531408309936523, "global_step": 29204, "epoch": 351} {"train_loss": -18.703664779663086, "global_step": 29205, "epoch": 351} {"train_loss": -18.522403717041016, "global_step": 29206, "epoch": 351} {"train_loss": -19.449859619140625, "global_step": 29207, "epoch": 351} {"train_loss": -18.833091735839844, "global_step": 29208, "epoch": 351} {"train_loss": -18.86920738220215, "global_step": 29209, "epoch": 351} {"train_loss": -18.79363441467285, "global_step": 29210, "epoch": 351} {"train_loss": -18.634679794311523, "global_step": 29211, "epoch": 351} {"train_loss": -18.879241943359375, "global_step": 29212, "epoch": 351} {"train_loss": -18.74043083190918, "global_step": 29213, "epoch": 351} {"train_loss": -19.27271842956543, "global_step": 29214, "epoch": 351} {"train_loss": -18.86439353299428, "global_step": 29215, "epoch": 351, "val_loss": 6162248.5} {"train_loss": -18.82961082458496, "global_step": 29216, "epoch": 352} {"train_loss": -18.592374801635742, "global_step": 29217, "epoch": 352} {"train_loss": -18.670164108276367, "global_step": 29218, "epoch": 352} {"train_loss": -18.615182876586914, "global_step": 29219, "epoch": 352} {"train_loss": -18.83319664001465, "global_step": 29220, "epoch": 352} {"train_loss": -18.889890670776367, "global_step": 29221, "epoch": 352} {"train_loss": -18.786819458007812, "global_step": 29222, "epoch": 352} {"train_loss": -19.02083396911621, "global_step": 29223, "epoch": 352} {"train_loss": -19.291852951049805, "global_step": 29224, "epoch": 352} {"train_loss": -18.884790420532227, "global_step": 29225, "epoch": 352} {"train_loss": -19.149486541748047, "global_step": 29226, "epoch": 352} {"train_loss": -18.736906051635742, "global_step": 29227, "epoch": 352} {"train_loss": -19.11935043334961, "global_step": 29228, "epoch": 352} {"train_loss": -18.849180221557617, "global_step": 29229, "epoch": 352} {"train_loss": -18.580463409423828, "global_step": 29230, "epoch": 352} {"train_loss": -18.94398307800293, "global_step": 29231, "epoch": 352} {"train_loss": -18.4553279876709, "global_step": 29232, "epoch": 352} {"train_loss": -18.73031997680664, "global_step": 29233, "epoch": 352} {"train_loss": -19.332807540893555, "global_step": 29234, "epoch": 352} {"train_loss": -19.061965942382812, "global_step": 29235, "epoch": 352} {"train_loss": -19.098417282104492, "global_step": 29236, "epoch": 352} {"train_loss": -18.804611206054688, "global_step": 29237, "epoch": 352} {"train_loss": -18.955530166625977, "global_step": 29238, "epoch": 352} {"train_loss": -19.342044830322266, "global_step": 29239, "epoch": 352} {"train_loss": -19.076839447021484, "global_step": 29240, "epoch": 352} {"train_loss": -18.977333068847656, "global_step": 29241, "epoch": 352} {"train_loss": -18.791301727294922, "global_step": 29242, "epoch": 352} {"train_loss": -19.002090454101562, "global_step": 29243, "epoch": 352} {"train_loss": -18.938465118408203, "global_step": 29244, "epoch": 352} {"train_loss": -18.8167781829834, "global_step": 29245, "epoch": 352} {"train_loss": -18.926244735717773, "global_step": 29246, "epoch": 352} {"train_loss": -19.34442710876465, "global_step": 29247, "epoch": 352} {"train_loss": -19.304758071899414, "global_step": 29248, "epoch": 352} {"train_loss": -18.83609390258789, "global_step": 29249, "epoch": 352} {"train_loss": -18.96710777282715, "global_step": 29250, "epoch": 352} {"train_loss": -18.676067352294922, "global_step": 29251, "epoch": 352} {"train_loss": -19.270734786987305, "global_step": 29252, "epoch": 352} {"train_loss": -19.003503799438477, "global_step": 29253, "epoch": 352} {"train_loss": -18.704282760620117, "global_step": 29254, "epoch": 352} {"train_loss": -18.97321891784668, "global_step": 29255, "epoch": 352} {"train_loss": -18.984777450561523, "global_step": 29256, "epoch": 352} {"train_loss": -19.095333099365234, "global_step": 29257, "epoch": 352} {"train_loss": -18.72780990600586, "global_step": 29258, "epoch": 352} {"train_loss": -18.897865295410156, "global_step": 29259, "epoch": 352} {"train_loss": -19.113162994384766, "global_step": 29260, "epoch": 352} {"train_loss": -18.62921714782715, "global_step": 29261, "epoch": 352} {"train_loss": -19.047880172729492, "global_step": 29262, "epoch": 352} {"train_loss": -18.825483322143555, "global_step": 29263, "epoch": 352} {"train_loss": -18.89679527282715, "global_step": 29264, "epoch": 352} {"train_loss": -18.987958908081055, "global_step": 29265, "epoch": 352} {"train_loss": -19.0194091796875, "global_step": 29266, "epoch": 352} {"train_loss": -18.951385498046875, "global_step": 29267, "epoch": 352} {"train_loss": -18.923688888549805, "global_step": 29268, "epoch": 352} {"train_loss": -18.93113899230957, "global_step": 29269, "epoch": 352} {"train_loss": -18.776046752929688, "global_step": 29270, "epoch": 352} {"train_loss": -19.00782012939453, "global_step": 29271, "epoch": 352} {"train_loss": -18.754926681518555, "global_step": 29272, "epoch": 352} {"train_loss": -19.163572311401367, "global_step": 29273, "epoch": 352} {"train_loss": -19.023969650268555, "global_step": 29274, "epoch": 352} {"train_loss": -18.896535873413086, "global_step": 29275, "epoch": 352} {"train_loss": -18.752084732055664, "global_step": 29276, "epoch": 352} {"train_loss": -18.801054000854492, "global_step": 29277, "epoch": 352} {"train_loss": -18.57441520690918, "global_step": 29278, "epoch": 352} {"train_loss": -18.828489303588867, "global_step": 29279, "epoch": 352} {"train_loss": -18.68682289123535, "global_step": 29280, "epoch": 352} {"train_loss": -19.014019012451172, "global_step": 29281, "epoch": 352} {"train_loss": -19.005342483520508, "global_step": 29282, "epoch": 352} {"train_loss": -18.824277877807617, "global_step": 29283, "epoch": 352} {"train_loss": -18.95236587524414, "global_step": 29284, "epoch": 352} {"train_loss": -18.81761932373047, "global_step": 29285, "epoch": 352} {"train_loss": -19.07107925415039, "global_step": 29286, "epoch": 352} {"train_loss": -19.030155181884766, "global_step": 29287, "epoch": 352} {"train_loss": -18.934812545776367, "global_step": 29288, "epoch": 352} {"train_loss": -19.17853546142578, "global_step": 29289, "epoch": 352} {"train_loss": -18.99286460876465, "global_step": 29290, "epoch": 352} {"train_loss": -19.12369728088379, "global_step": 29291, "epoch": 352} {"train_loss": -18.908254623413086, "global_step": 29292, "epoch": 352} {"train_loss": -18.900827407836914, "global_step": 29293, "epoch": 352} {"train_loss": -18.809606552124023, "global_step": 29294, "epoch": 352} {"train_loss": -18.81587028503418, "global_step": 29295, "epoch": 352} {"train_loss": -19.031997680664062, "global_step": 29296, "epoch": 352} {"train_loss": -18.888700485229492, "global_step": 29297, "epoch": 352} {"train_loss": -18.932373552437287, "global_step": 29298, "epoch": 352, "val_loss": 5999380.0} {"train_loss": -18.49226951599121, "global_step": 29299, "epoch": 353} {"train_loss": -18.222007751464844, "global_step": 29300, "epoch": 353} {"train_loss": -18.707265853881836, "global_step": 29301, "epoch": 353} {"train_loss": -18.56949806213379, "global_step": 29302, "epoch": 353} {"train_loss": -18.993762969970703, "global_step": 29303, "epoch": 353} {"train_loss": -18.468244552612305, "global_step": 29304, "epoch": 353} {"train_loss": -18.746002197265625, "global_step": 29305, "epoch": 353} {"train_loss": -18.73719596862793, "global_step": 29306, "epoch": 353} {"train_loss": -18.817411422729492, "global_step": 29307, "epoch": 353} {"train_loss": -18.5313777923584, "global_step": 29308, "epoch": 353} {"train_loss": -18.471906661987305, "global_step": 29309, "epoch": 353} {"train_loss": -18.787824630737305, "global_step": 29310, "epoch": 353} {"train_loss": -18.449710845947266, "global_step": 29311, "epoch": 353} {"train_loss": -18.783329010009766, "global_step": 29312, "epoch": 353} {"train_loss": -18.603031158447266, "global_step": 29313, "epoch": 353} {"train_loss": -18.38011932373047, "global_step": 29314, "epoch": 353} {"train_loss": -18.527084350585938, "global_step": 29315, "epoch": 353} {"train_loss": -19.00971031188965, "global_step": 29316, "epoch": 353} {"train_loss": -18.682844161987305, "global_step": 29317, "epoch": 353} {"train_loss": -18.974700927734375, "global_step": 29318, "epoch": 353} {"train_loss": -19.258325576782227, "global_step": 29319, "epoch": 353} {"train_loss": -18.609243392944336, "global_step": 29320, "epoch": 353} {"train_loss": -19.16354751586914, "global_step": 29321, "epoch": 353} {"train_loss": -18.80173110961914, "global_step": 29322, "epoch": 353} {"train_loss": -19.13800621032715, "global_step": 29323, "epoch": 353} {"train_loss": -18.632841110229492, "global_step": 29324, "epoch": 353} {"train_loss": -18.776315689086914, "global_step": 29325, "epoch": 353} {"train_loss": -18.613534927368164, "global_step": 29326, "epoch": 353} {"train_loss": -19.073535919189453, "global_step": 29327, "epoch": 353} {"train_loss": -19.04618263244629, "global_step": 29328, "epoch": 353} {"train_loss": -18.9000186920166, "global_step": 29329, "epoch": 353} {"train_loss": -18.910612106323242, "global_step": 29330, "epoch": 353} {"train_loss": -18.78169059753418, "global_step": 29331, "epoch": 353} {"train_loss": -18.880041122436523, "global_step": 29332, "epoch": 353} {"train_loss": -19.10918617248535, "global_step": 29333, "epoch": 353} {"train_loss": -18.836286544799805, "global_step": 29334, "epoch": 353} {"train_loss": -18.977262496948242, "global_step": 29335, "epoch": 353} {"train_loss": -18.82710075378418, "global_step": 29336, "epoch": 353} {"train_loss": -18.89572525024414, "global_step": 29337, "epoch": 353} {"train_loss": -18.63349723815918, "global_step": 29338, "epoch": 353} {"train_loss": -19.606006622314453, "global_step": 29339, "epoch": 353} {"train_loss": -18.989303588867188, "global_step": 29340, "epoch": 353} {"train_loss": -19.104185104370117, "global_step": 29341, "epoch": 353} {"train_loss": -18.785171508789062, "global_step": 29342, "epoch": 353} {"train_loss": -18.97088623046875, "global_step": 29343, "epoch": 353} {"train_loss": -18.83529281616211, "global_step": 29344, "epoch": 353} {"train_loss": -19.308637619018555, "global_step": 29345, "epoch": 353} {"train_loss": -19.027982711791992, "global_step": 29346, "epoch": 353} {"train_loss": -18.80439567565918, "global_step": 29347, "epoch": 353} {"train_loss": -18.805389404296875, "global_step": 29348, "epoch": 353} {"train_loss": -19.170124053955078, "global_step": 29349, "epoch": 353} {"train_loss": -18.878389358520508, "global_step": 29350, "epoch": 353} {"train_loss": -19.15647315979004, "global_step": 29351, "epoch": 353} {"train_loss": -18.93289566040039, "global_step": 29352, "epoch": 353} {"train_loss": -18.749881744384766, "global_step": 29353, "epoch": 353} {"train_loss": -18.38665771484375, "global_step": 29354, "epoch": 353} {"train_loss": -19.243881225585938, "global_step": 29355, "epoch": 353} {"train_loss": -19.00996971130371, "global_step": 29356, "epoch": 353} {"train_loss": -18.69327163696289, "global_step": 29357, "epoch": 353} {"train_loss": -18.999113082885742, "global_step": 29358, "epoch": 353} {"train_loss": -19.145198822021484, "global_step": 29359, "epoch": 353} {"train_loss": -18.359128952026367, "global_step": 29360, "epoch": 353} {"train_loss": -18.849689483642578, "global_step": 29361, "epoch": 353} {"train_loss": -19.110715866088867, "global_step": 29362, "epoch": 353} {"train_loss": -18.80977439880371, "global_step": 29363, "epoch": 353} {"train_loss": -18.696630477905273, "global_step": 29364, "epoch": 353} {"train_loss": -18.93607521057129, "global_step": 29365, "epoch": 353} {"train_loss": -18.623876571655273, "global_step": 29366, "epoch": 353} {"train_loss": -18.920560836791992, "global_step": 29367, "epoch": 353} {"train_loss": -18.71162223815918, "global_step": 29368, "epoch": 353} {"train_loss": -18.475473403930664, "global_step": 29369, "epoch": 353} {"train_loss": -18.978382110595703, "global_step": 29370, "epoch": 353} {"train_loss": -18.593229293823242, "global_step": 29371, "epoch": 353} {"train_loss": -19.09908103942871, "global_step": 29372, "epoch": 353} {"train_loss": -18.66132164001465, "global_step": 29373, "epoch": 353} {"train_loss": -19.056921005249023, "global_step": 29374, "epoch": 353} {"train_loss": -18.674100875854492, "global_step": 29375, "epoch": 353} {"train_loss": -18.984277725219727, "global_step": 29376, "epoch": 353} {"train_loss": -19.200557708740234, "global_step": 29377, "epoch": 353} {"train_loss": -19.001367568969727, "global_step": 29378, "epoch": 353} {"train_loss": -19.086042404174805, "global_step": 29379, "epoch": 353} {"train_loss": -19.101186752319336, "global_step": 29380, "epoch": 353} {"train_loss": -18.84282776246588, "global_step": 29381, "epoch": 353, "val_loss": 5917744.0} {"train_loss": -18.521406173706055, "global_step": 29382, "epoch": 354} {"train_loss": -18.66029167175293, "global_step": 29383, "epoch": 354} {"train_loss": -18.683319091796875, "global_step": 29384, "epoch": 354} {"train_loss": -18.660682678222656, "global_step": 29385, "epoch": 354} {"train_loss": -18.68412208557129, "global_step": 29386, "epoch": 354} {"train_loss": -19.097745895385742, "global_step": 29387, "epoch": 354} {"train_loss": -18.71307945251465, "global_step": 29388, "epoch": 354} {"train_loss": -18.833343505859375, "global_step": 29389, "epoch": 354} {"train_loss": -19.111865997314453, "global_step": 29390, "epoch": 354} {"train_loss": -19.02516746520996, "global_step": 29391, "epoch": 354} {"train_loss": -18.7238826751709, "global_step": 29392, "epoch": 354} {"train_loss": -19.077497482299805, "global_step": 29393, "epoch": 354} {"train_loss": -18.830257415771484, "global_step": 29394, "epoch": 354} {"train_loss": -18.829702377319336, "global_step": 29395, "epoch": 354} {"train_loss": -19.240589141845703, "global_step": 29396, "epoch": 354} {"train_loss": -18.371519088745117, "global_step": 29397, "epoch": 354} {"train_loss": -18.750680923461914, "global_step": 29398, "epoch": 354} {"train_loss": -19.000253677368164, "global_step": 29399, "epoch": 354} {"train_loss": -18.556442260742188, "global_step": 29400, "epoch": 354} {"train_loss": -18.951171875, "global_step": 29401, "epoch": 354} {"train_loss": -18.787067413330078, "global_step": 29402, "epoch": 354} {"train_loss": -18.796293258666992, "global_step": 29403, "epoch": 354} {"train_loss": -18.84739112854004, "global_step": 29404, "epoch": 354} {"train_loss": -18.50312614440918, "global_step": 29405, "epoch": 354} {"train_loss": -19.055173873901367, "global_step": 29406, "epoch": 354} {"train_loss": -18.831649780273438, "global_step": 29407, "epoch": 354} {"train_loss": -19.171436309814453, "global_step": 29408, "epoch": 354} {"train_loss": -18.721012115478516, "global_step": 29409, "epoch": 354} {"train_loss": -19.076688766479492, "global_step": 29410, "epoch": 354} {"train_loss": -18.844175338745117, "global_step": 29411, "epoch": 354} {"train_loss": -18.66420555114746, "global_step": 29412, "epoch": 354} {"train_loss": -19.164932250976562, "global_step": 29413, "epoch": 354} {"train_loss": -18.80525779724121, "global_step": 29414, "epoch": 354} {"train_loss": -18.964826583862305, "global_step": 29415, "epoch": 354} {"train_loss": -18.8746337890625, "global_step": 29416, "epoch": 354} {"train_loss": -18.87126922607422, "global_step": 29417, "epoch": 354} {"train_loss": -19.044092178344727, "global_step": 29418, "epoch": 354} {"train_loss": -19.1387996673584, "global_step": 29419, "epoch": 354} {"train_loss": -18.870271682739258, "global_step": 29420, "epoch": 354} {"train_loss": -19.122282028198242, "global_step": 29421, "epoch": 354} {"train_loss": -19.0167179107666, "global_step": 29422, "epoch": 354} {"train_loss": -19.239944458007812, "global_step": 29423, "epoch": 354} {"train_loss": -18.765390396118164, "global_step": 29424, "epoch": 354} {"train_loss": -18.807235717773438, "global_step": 29425, "epoch": 354} {"train_loss": -18.798599243164062, "global_step": 29426, "epoch": 354} {"train_loss": -18.744304656982422, "global_step": 29427, "epoch": 354} {"train_loss": -18.980491638183594, "global_step": 29428, "epoch": 354} {"train_loss": -18.734498977661133, "global_step": 29429, "epoch": 354} {"train_loss": -19.168405532836914, "global_step": 29430, "epoch": 354} {"train_loss": -19.111896514892578, "global_step": 29431, "epoch": 354} {"train_loss": -18.76313591003418, "global_step": 29432, "epoch": 354} {"train_loss": -18.68787384033203, "global_step": 29433, "epoch": 354} {"train_loss": -18.744115829467773, "global_step": 29434, "epoch": 354} {"train_loss": -19.1699161529541, "global_step": 29435, "epoch": 354} {"train_loss": -19.167444229125977, "global_step": 29436, "epoch": 354} {"train_loss": -19.015737533569336, "global_step": 29437, "epoch": 354} {"train_loss": -19.12155532836914, "global_step": 29438, "epoch": 354} {"train_loss": -18.840316772460938, "global_step": 29439, "epoch": 354} {"train_loss": -18.872114181518555, "global_step": 29440, "epoch": 354} {"train_loss": -18.87525749206543, "global_step": 29441, "epoch": 354} {"train_loss": -18.62204360961914, "global_step": 29442, "epoch": 354} {"train_loss": -19.086536407470703, "global_step": 29443, "epoch": 354} {"train_loss": -18.909040451049805, "global_step": 29444, "epoch": 354} {"train_loss": -19.112634658813477, "global_step": 29445, "epoch": 354} {"train_loss": -19.309232711791992, "global_step": 29446, "epoch": 354} {"train_loss": -19.196552276611328, "global_step": 29447, "epoch": 354} {"train_loss": -18.382465362548828, "global_step": 29448, "epoch": 354} {"train_loss": -18.512405395507812, "global_step": 29449, "epoch": 354} {"train_loss": -19.076852798461914, "global_step": 29450, "epoch": 354} {"train_loss": -19.036754608154297, "global_step": 29451, "epoch": 354} {"train_loss": -18.785512924194336, "global_step": 29452, "epoch": 354} {"train_loss": -18.79205322265625, "global_step": 29453, "epoch": 354} {"train_loss": -18.85951805114746, "global_step": 29454, "epoch": 354} {"train_loss": -19.101078033447266, "global_step": 29455, "epoch": 354} {"train_loss": -18.782672882080078, "global_step": 29456, "epoch": 354} {"train_loss": -18.82403564453125, "global_step": 29457, "epoch": 354} {"train_loss": -18.69202423095703, "global_step": 29458, "epoch": 354} {"train_loss": -18.65605354309082, "global_step": 29459, "epoch": 354} {"train_loss": -19.05671501159668, "global_step": 29460, "epoch": 354} {"train_loss": -19.32784080505371, "global_step": 29461, "epoch": 354} {"train_loss": -18.801422119140625, "global_step": 29462, "epoch": 354} {"train_loss": -19.34256935119629, "global_step": 29463, "epoch": 354} {"train_loss": -18.886909048241304, "global_step": 29464, "epoch": 354, "val_loss": 5952588.0} {"train_loss": -18.104969024658203, "global_step": 29465, "epoch": 355} {"train_loss": -18.251251220703125, "global_step": 29466, "epoch": 355} {"train_loss": -18.937744140625, "global_step": 29467, "epoch": 355} {"train_loss": -18.109210968017578, "global_step": 29468, "epoch": 355} {"train_loss": -18.780607223510742, "global_step": 29469, "epoch": 355} {"train_loss": -18.281143188476562, "global_step": 29470, "epoch": 355} {"train_loss": -18.774648666381836, "global_step": 29471, "epoch": 355} {"train_loss": -18.983240127563477, "global_step": 29472, "epoch": 355} {"train_loss": -18.648361206054688, "global_step": 29473, "epoch": 355} {"train_loss": -18.727432250976562, "global_step": 29474, "epoch": 355} {"train_loss": -18.883371353149414, "global_step": 29475, "epoch": 355} {"train_loss": -18.745637893676758, "global_step": 29476, "epoch": 355} {"train_loss": -18.421146392822266, "global_step": 29477, "epoch": 355} {"train_loss": -19.203022003173828, "global_step": 29478, "epoch": 355} {"train_loss": -19.07258415222168, "global_step": 29479, "epoch": 355} {"train_loss": -18.622684478759766, "global_step": 29480, "epoch": 355} {"train_loss": -19.0986385345459, "global_step": 29481, "epoch": 355} {"train_loss": -18.606679916381836, "global_step": 29482, "epoch": 355} {"train_loss": -19.071937561035156, "global_step": 29483, "epoch": 355} {"train_loss": -19.1385555267334, "global_step": 29484, "epoch": 355} {"train_loss": -18.88239860534668, "global_step": 29485, "epoch": 355} {"train_loss": -18.685089111328125, "global_step": 29486, "epoch": 355} {"train_loss": -19.163984298706055, "global_step": 29487, "epoch": 355} {"train_loss": -18.941516876220703, "global_step": 29488, "epoch": 355} {"train_loss": -19.155500411987305, "global_step": 29489, "epoch": 355} {"train_loss": -18.742828369140625, "global_step": 29490, "epoch": 355} {"train_loss": -18.465429306030273, "global_step": 29491, "epoch": 355} {"train_loss": -18.572879791259766, "global_step": 29492, "epoch": 355} {"train_loss": -18.888845443725586, "global_step": 29493, "epoch": 355} {"train_loss": -19.141773223876953, "global_step": 29494, "epoch": 355} {"train_loss": -18.95991325378418, "global_step": 29495, "epoch": 355} {"train_loss": -19.20497703552246, "global_step": 29496, "epoch": 355} {"train_loss": -18.915794372558594, "global_step": 29497, "epoch": 355} {"train_loss": -18.87135124206543, "global_step": 29498, "epoch": 355} {"train_loss": -18.82313346862793, "global_step": 29499, "epoch": 355} {"train_loss": -18.701215744018555, "global_step": 29500, "epoch": 355} {"train_loss": -19.09527587890625, "global_step": 29501, "epoch": 355} {"train_loss": -19.045637130737305, "global_step": 29502, "epoch": 355} {"train_loss": -18.989770889282227, "global_step": 29503, "epoch": 355} {"train_loss": -19.144880294799805, "global_step": 29504, "epoch": 355} {"train_loss": -19.023204803466797, "global_step": 29505, "epoch": 355} {"train_loss": -18.975515365600586, "global_step": 29506, "epoch": 355} {"train_loss": -19.114255905151367, "global_step": 29507, "epoch": 355} {"train_loss": -19.168109893798828, "global_step": 29508, "epoch": 355} {"train_loss": -18.83535385131836, "global_step": 29509, "epoch": 355} {"train_loss": -18.81778907775879, "global_step": 29510, "epoch": 355} {"train_loss": -18.916433334350586, "global_step": 29511, "epoch": 355} {"train_loss": -18.88187026977539, "global_step": 29512, "epoch": 355} {"train_loss": -18.6070613861084, "global_step": 29513, "epoch": 355} {"train_loss": -18.554956436157227, "global_step": 29514, "epoch": 355} {"train_loss": -18.85358238220215, "global_step": 29515, "epoch": 355} {"train_loss": -19.133899688720703, "global_step": 29516, "epoch": 355} {"train_loss": -18.526758193969727, "global_step": 29517, "epoch": 355} {"train_loss": -19.209156036376953, "global_step": 29518, "epoch": 355} {"train_loss": -19.423818588256836, "global_step": 29519, "epoch": 355} {"train_loss": -18.59906578063965, "global_step": 29520, "epoch": 355} {"train_loss": -19.04201889038086, "global_step": 29521, "epoch": 355} {"train_loss": -19.32086753845215, "global_step": 29522, "epoch": 355} {"train_loss": -18.654321670532227, "global_step": 29523, "epoch": 355} {"train_loss": -19.186132431030273, "global_step": 29524, "epoch": 355} {"train_loss": -19.1908016204834, "global_step": 29525, "epoch": 355} {"train_loss": -18.891611099243164, "global_step": 29526, "epoch": 355} {"train_loss": -18.891172409057617, "global_step": 29527, "epoch": 355} {"train_loss": -18.35953140258789, "global_step": 29528, "epoch": 355} {"train_loss": -18.752676010131836, "global_step": 29529, "epoch": 355} {"train_loss": -18.962186813354492, "global_step": 29530, "epoch": 355} {"train_loss": -18.74563980102539, "global_step": 29531, "epoch": 355} {"train_loss": -18.762638092041016, "global_step": 29532, "epoch": 355} {"train_loss": -19.053054809570312, "global_step": 29533, "epoch": 355} {"train_loss": -19.17930030822754, "global_step": 29534, "epoch": 355} {"train_loss": -18.837604522705078, "global_step": 29535, "epoch": 355} {"train_loss": -18.715801239013672, "global_step": 29536, "epoch": 355} {"train_loss": -18.898883819580078, "global_step": 29537, "epoch": 355} {"train_loss": -18.9825439453125, "global_step": 29538, "epoch": 355} {"train_loss": -18.537216186523438, "global_step": 29539, "epoch": 355} {"train_loss": -18.73524284362793, "global_step": 29540, "epoch": 355} {"train_loss": -19.10696792602539, "global_step": 29541, "epoch": 355} {"train_loss": -19.29449462890625, "global_step": 29542, "epoch": 355} {"train_loss": -19.100887298583984, "global_step": 29543, "epoch": 355} {"train_loss": -18.895254135131836, "global_step": 29544, "epoch": 355} {"train_loss": -19.029129028320312, "global_step": 29545, "epoch": 355} {"train_loss": -18.873414993286133, "global_step": 29546, "epoch": 355} {"train_loss": -18.87276943620429, "global_step": 29547, "epoch": 355, "val_loss": 5995734.0} {"train_loss": -18.354923248291016, "global_step": 29548, "epoch": 356} {"train_loss": -18.475460052490234, "global_step": 29549, "epoch": 356} {"train_loss": -19.299055099487305, "global_step": 29550, "epoch": 356} {"train_loss": -18.3084716796875, "global_step": 29551, "epoch": 356} {"train_loss": -18.67438316345215, "global_step": 29552, "epoch": 356} {"train_loss": -18.46681022644043, "global_step": 29553, "epoch": 356} {"train_loss": -18.923254013061523, "global_step": 29554, "epoch": 356} {"train_loss": -18.436914443969727, "global_step": 29555, "epoch": 356} {"train_loss": -18.62116050720215, "global_step": 29556, "epoch": 356} {"train_loss": -18.855710983276367, "global_step": 29557, "epoch": 356} {"train_loss": -18.372865676879883, "global_step": 29558, "epoch": 356} {"train_loss": -18.59832191467285, "global_step": 29559, "epoch": 356} {"train_loss": -19.294347763061523, "global_step": 29560, "epoch": 356} {"train_loss": -18.752721786499023, "global_step": 29561, "epoch": 356} {"train_loss": -18.635772705078125, "global_step": 29562, "epoch": 356} {"train_loss": -19.060928344726562, "global_step": 29563, "epoch": 356} {"train_loss": -18.94643783569336, "global_step": 29564, "epoch": 356} {"train_loss": -18.890531539916992, "global_step": 29565, "epoch": 356} {"train_loss": -18.522891998291016, "global_step": 29566, "epoch": 356} {"train_loss": -18.691904067993164, "global_step": 29567, "epoch": 356} {"train_loss": -19.123762130737305, "global_step": 29568, "epoch": 356} {"train_loss": -18.65979766845703, "global_step": 29569, "epoch": 356} {"train_loss": -18.590919494628906, "global_step": 29570, "epoch": 356} {"train_loss": -19.03019142150879, "global_step": 29571, "epoch": 356} {"train_loss": -18.980710983276367, "global_step": 29572, "epoch": 356} {"train_loss": -19.03155517578125, "global_step": 29573, "epoch": 356} {"train_loss": -18.996004104614258, "global_step": 29574, "epoch": 356} {"train_loss": -18.78297996520996, "global_step": 29575, "epoch": 356} {"train_loss": -18.704622268676758, "global_step": 29576, "epoch": 356} {"train_loss": -18.828887939453125, "global_step": 29577, "epoch": 356} {"train_loss": -18.838943481445312, "global_step": 29578, "epoch": 356} {"train_loss": -18.617950439453125, "global_step": 29579, "epoch": 356} {"train_loss": -18.667997360229492, "global_step": 29580, "epoch": 356} {"train_loss": -19.22303581237793, "global_step": 29581, "epoch": 356} {"train_loss": -19.146923065185547, "global_step": 29582, "epoch": 356} {"train_loss": -18.854246139526367, "global_step": 29583, "epoch": 356} {"train_loss": -18.683988571166992, "global_step": 29584, "epoch": 356} {"train_loss": -19.458972930908203, "global_step": 29585, "epoch": 356} {"train_loss": -18.891063690185547, "global_step": 29586, "epoch": 356} {"train_loss": -18.900558471679688, "global_step": 29587, "epoch": 356} {"train_loss": -18.856983184814453, "global_step": 29588, "epoch": 356} {"train_loss": -18.683069229125977, "global_step": 29589, "epoch": 356} {"train_loss": -19.084413528442383, "global_step": 29590, "epoch": 356} {"train_loss": -19.03959083557129, "global_step": 29591, "epoch": 356} {"train_loss": -19.120948791503906, "global_step": 29592, "epoch": 356} {"train_loss": -19.13129997253418, "global_step": 29593, "epoch": 356} {"train_loss": -18.911449432373047, "global_step": 29594, "epoch": 356} {"train_loss": -18.60288429260254, "global_step": 29595, "epoch": 356} {"train_loss": -19.085189819335938, "global_step": 29596, "epoch": 356} {"train_loss": -18.978195190429688, "global_step": 29597, "epoch": 356} {"train_loss": -19.359481811523438, "global_step": 29598, "epoch": 356} {"train_loss": -19.271772384643555, "global_step": 29599, "epoch": 356} {"train_loss": -19.104860305786133, "global_step": 29600, "epoch": 356} {"train_loss": -19.516386032104492, "global_step": 29601, "epoch": 356} {"train_loss": -18.71724510192871, "global_step": 29602, "epoch": 356} {"train_loss": -19.138166427612305, "global_step": 29603, "epoch": 356} {"train_loss": -19.261743545532227, "global_step": 29604, "epoch": 356} {"train_loss": -18.955677032470703, "global_step": 29605, "epoch": 356} {"train_loss": -18.827985763549805, "global_step": 29606, "epoch": 356} {"train_loss": -19.45880699157715, "global_step": 29607, "epoch": 356} {"train_loss": -19.23470687866211, "global_step": 29608, "epoch": 356} {"train_loss": -19.058542251586914, "global_step": 29609, "epoch": 356} {"train_loss": -18.65476417541504, "global_step": 29610, "epoch": 356} {"train_loss": -18.872268676757812, "global_step": 29611, "epoch": 356} {"train_loss": -19.004257202148438, "global_step": 29612, "epoch": 356} {"train_loss": -19.217777252197266, "global_step": 29613, "epoch": 356} {"train_loss": -18.50575065612793, "global_step": 29614, "epoch": 356} {"train_loss": -18.57734489440918, "global_step": 29615, "epoch": 356} {"train_loss": -18.79743194580078, "global_step": 29616, "epoch": 356} {"train_loss": -18.520366668701172, "global_step": 29617, "epoch": 356} {"train_loss": -18.8184871673584, "global_step": 29618, "epoch": 356} {"train_loss": -18.54587745666504, "global_step": 29619, "epoch": 356} {"train_loss": -18.799909591674805, "global_step": 29620, "epoch": 356} {"train_loss": -18.436344146728516, "global_step": 29621, "epoch": 356} {"train_loss": -19.413496017456055, "global_step": 29622, "epoch": 356} {"train_loss": -18.59869384765625, "global_step": 29623, "epoch": 356} {"train_loss": -18.710790634155273, "global_step": 29624, "epoch": 356} {"train_loss": -18.561416625976562, "global_step": 29625, "epoch": 356} {"train_loss": -18.705230712890625, "global_step": 29626, "epoch": 356} {"train_loss": -19.280118942260742, "global_step": 29627, "epoch": 356} {"train_loss": -19.334781646728516, "global_step": 29628, "epoch": 356} {"train_loss": -18.680700302124023, "global_step": 29629, "epoch": 356} {"train_loss": -18.871053879519543, "global_step": 29630, "epoch": 356, "val_loss": 5994345.0} {"train_loss": -18.622344970703125, "global_step": 29631, "epoch": 357} {"train_loss": -18.681493759155273, "global_step": 29632, "epoch": 357} {"train_loss": -19.349193572998047, "global_step": 29633, "epoch": 357} {"train_loss": -18.94392204284668, "global_step": 29634, "epoch": 357} {"train_loss": -19.118730545043945, "global_step": 29635, "epoch": 357} {"train_loss": -18.986793518066406, "global_step": 29636, "epoch": 357} {"train_loss": -18.501867294311523, "global_step": 29637, "epoch": 357} {"train_loss": -19.191139221191406, "global_step": 29638, "epoch": 357} {"train_loss": -19.13732147216797, "global_step": 29639, "epoch": 357} {"train_loss": -18.921995162963867, "global_step": 29640, "epoch": 357} {"train_loss": -18.986661911010742, "global_step": 29641, "epoch": 357} {"train_loss": -18.9752197265625, "global_step": 29642, "epoch": 357} {"train_loss": -19.120731353759766, "global_step": 29643, "epoch": 357} {"train_loss": -19.30689811706543, "global_step": 29644, "epoch": 357} {"train_loss": -18.720808029174805, "global_step": 29645, "epoch": 357} {"train_loss": -18.63627052307129, "global_step": 29646, "epoch": 357} {"train_loss": -19.02265167236328, "global_step": 29647, "epoch": 357} {"train_loss": -18.868091583251953, "global_step": 29648, "epoch": 357} {"train_loss": -18.966808319091797, "global_step": 29649, "epoch": 357} {"train_loss": -18.48935317993164, "global_step": 29650, "epoch": 357} {"train_loss": -18.914846420288086, "global_step": 29651, "epoch": 357} {"train_loss": -19.05792999267578, "global_step": 29652, "epoch": 357} {"train_loss": -18.480066299438477, "global_step": 29653, "epoch": 357} {"train_loss": -18.683439254760742, "global_step": 29654, "epoch": 357} {"train_loss": -18.72212028503418, "global_step": 29655, "epoch": 357} {"train_loss": -19.005910873413086, "global_step": 29656, "epoch": 357} {"train_loss": -18.799488067626953, "global_step": 29657, "epoch": 357} {"train_loss": -18.915843963623047, "global_step": 29658, "epoch": 357} {"train_loss": -18.748456954956055, "global_step": 29659, "epoch": 357} {"train_loss": -19.035400390625, "global_step": 29660, "epoch": 357} {"train_loss": -19.16578483581543, "global_step": 29661, "epoch": 357} {"train_loss": -18.687158584594727, "global_step": 29662, "epoch": 357} {"train_loss": -18.650144577026367, "global_step": 29663, "epoch": 357} {"train_loss": -18.4680118560791, "global_step": 29664, "epoch": 357} {"train_loss": -18.567941665649414, "global_step": 29665, "epoch": 357} {"train_loss": -18.878812789916992, "global_step": 29666, "epoch": 357} {"train_loss": -19.25960350036621, "global_step": 29667, "epoch": 357} {"train_loss": -18.568801879882812, "global_step": 29668, "epoch": 357} {"train_loss": -18.45634651184082, "global_step": 29669, "epoch": 357} {"train_loss": -19.343908309936523, "global_step": 29670, "epoch": 357} {"train_loss": -18.999975204467773, "global_step": 29671, "epoch": 357} {"train_loss": -19.01375389099121, "global_step": 29672, "epoch": 357} {"train_loss": -19.046903610229492, "global_step": 29673, "epoch": 357} {"train_loss": -18.573074340820312, "global_step": 29674, "epoch": 357} {"train_loss": -18.80276107788086, "global_step": 29675, "epoch": 357} {"train_loss": -18.712818145751953, "global_step": 29676, "epoch": 357} {"train_loss": -18.924957275390625, "global_step": 29677, "epoch": 357} {"train_loss": -19.209104537963867, "global_step": 29678, "epoch": 357} {"train_loss": -19.265316009521484, "global_step": 29679, "epoch": 357} {"train_loss": -19.01411247253418, "global_step": 29680, "epoch": 357} {"train_loss": -19.606821060180664, "global_step": 29681, "epoch": 357} {"train_loss": -18.954282760620117, "global_step": 29682, "epoch": 357} {"train_loss": -18.920215606689453, "global_step": 29683, "epoch": 357} {"train_loss": -19.380064010620117, "global_step": 29684, "epoch": 357} {"train_loss": -18.824914932250977, "global_step": 29685, "epoch": 357} {"train_loss": -19.02437400817871, "global_step": 29686, "epoch": 357} {"train_loss": -19.02644157409668, "global_step": 29687, "epoch": 357} {"train_loss": -18.397584915161133, "global_step": 29688, "epoch": 357} {"train_loss": -18.983678817749023, "global_step": 29689, "epoch": 357} {"train_loss": -18.617887496948242, "global_step": 29690, "epoch": 357} {"train_loss": -18.921480178833008, "global_step": 29691, "epoch": 357} {"train_loss": -18.726343154907227, "global_step": 29692, "epoch": 357} {"train_loss": -18.674062728881836, "global_step": 29693, "epoch": 357} {"train_loss": -18.667524337768555, "global_step": 29694, "epoch": 357} {"train_loss": -18.71811866760254, "global_step": 29695, "epoch": 357} {"train_loss": -19.128355026245117, "global_step": 29696, "epoch": 357} {"train_loss": -19.34467887878418, "global_step": 29697, "epoch": 357} {"train_loss": -18.630014419555664, "global_step": 29698, "epoch": 357} {"train_loss": -19.193845748901367, "global_step": 29699, "epoch": 357} {"train_loss": -19.44599723815918, "global_step": 29700, "epoch": 357} {"train_loss": -19.24080467224121, "global_step": 29701, "epoch": 357} {"train_loss": -19.09620475769043, "global_step": 29702, "epoch": 357} {"train_loss": -19.073684692382812, "global_step": 29703, "epoch": 357} {"train_loss": -18.959867477416992, "global_step": 29704, "epoch": 357} {"train_loss": -18.784902572631836, "global_step": 29705, "epoch": 357} {"train_loss": -18.783185958862305, "global_step": 29706, "epoch": 357} {"train_loss": -19.417898178100586, "global_step": 29707, "epoch": 357} {"train_loss": -18.810312271118164, "global_step": 29708, "epoch": 357} {"train_loss": -19.095504760742188, "global_step": 29709, "epoch": 357} {"train_loss": -18.728485107421875, "global_step": 29710, "epoch": 357} {"train_loss": -19.002399444580078, "global_step": 29711, "epoch": 357} {"train_loss": -18.909412384033203, "global_step": 29712, "epoch": 357} {"train_loss": -18.932848643107587, "global_step": 29713, "epoch": 357, "val_loss": 5975323.5} {"train_loss": -18.814123153686523, "global_step": 29714, "epoch": 358} {"train_loss": -18.752775192260742, "global_step": 29715, "epoch": 358} {"train_loss": -18.77874183654785, "global_step": 29716, "epoch": 358} {"train_loss": -18.88129997253418, "global_step": 29717, "epoch": 358} {"train_loss": -19.305585861206055, "global_step": 29718, "epoch": 358} {"train_loss": -19.255069732666016, "global_step": 29719, "epoch": 358} {"train_loss": -18.579687118530273, "global_step": 29720, "epoch": 358} {"train_loss": -19.071226119995117, "global_step": 29721, "epoch": 358} {"train_loss": -19.259618759155273, "global_step": 29722, "epoch": 358} {"train_loss": -18.665983200073242, "global_step": 29723, "epoch": 358} {"train_loss": -18.60678482055664, "global_step": 29724, "epoch": 358} {"train_loss": -18.85939598083496, "global_step": 29725, "epoch": 358} {"train_loss": -18.704883575439453, "global_step": 29726, "epoch": 358} {"train_loss": -18.851858139038086, "global_step": 29727, "epoch": 358} {"train_loss": -19.1866397857666, "global_step": 29728, "epoch": 358} {"train_loss": -18.824016571044922, "global_step": 29729, "epoch": 358} {"train_loss": -18.9204044342041, "global_step": 29730, "epoch": 358} {"train_loss": -19.26984214782715, "global_step": 29731, "epoch": 358} {"train_loss": -18.718530654907227, "global_step": 29732, "epoch": 358} {"train_loss": -19.0390567779541, "global_step": 29733, "epoch": 358} {"train_loss": -19.076261520385742, "global_step": 29734, "epoch": 358} {"train_loss": -18.881000518798828, "global_step": 29735, "epoch": 358} {"train_loss": -19.024789810180664, "global_step": 29736, "epoch": 358} {"train_loss": -19.117691040039062, "global_step": 29737, "epoch": 358} {"train_loss": -19.168996810913086, "global_step": 29738, "epoch": 358} {"train_loss": -19.03986930847168, "global_step": 29739, "epoch": 358} {"train_loss": -18.91324806213379, "global_step": 29740, "epoch": 358} {"train_loss": -18.96589469909668, "global_step": 29741, "epoch": 358} {"train_loss": -19.075937271118164, "global_step": 29742, "epoch": 358} {"train_loss": -19.099889755249023, "global_step": 29743, "epoch": 358} {"train_loss": -19.095800399780273, "global_step": 29744, "epoch": 358} {"train_loss": -19.165624618530273, "global_step": 29745, "epoch": 358} {"train_loss": -19.124435424804688, "global_step": 29746, "epoch": 358} {"train_loss": -19.06625747680664, "global_step": 29747, "epoch": 358} {"train_loss": -19.2097110748291, "global_step": 29748, "epoch": 358} {"train_loss": -18.814184188842773, "global_step": 29749, "epoch": 358} {"train_loss": -18.861310958862305, "global_step": 29750, "epoch": 358} {"train_loss": -18.75316619873047, "global_step": 29751, "epoch": 358} {"train_loss": -18.913482666015625, "global_step": 29752, "epoch": 358} {"train_loss": -18.76724624633789, "global_step": 29753, "epoch": 358} {"train_loss": -18.553930282592773, "global_step": 29754, "epoch": 358} {"train_loss": -18.804704666137695, "global_step": 29755, "epoch": 358} {"train_loss": -18.96622657775879, "global_step": 29756, "epoch": 358} {"train_loss": -19.043691635131836, "global_step": 29757, "epoch": 358} {"train_loss": -18.77046012878418, "global_step": 29758, "epoch": 358} {"train_loss": -18.740888595581055, "global_step": 29759, "epoch": 358} {"train_loss": -18.808942794799805, "global_step": 29760, "epoch": 358} {"train_loss": -18.774213790893555, "global_step": 29761, "epoch": 358} {"train_loss": -18.81060791015625, "global_step": 29762, "epoch": 358} {"train_loss": -18.802846908569336, "global_step": 29763, "epoch": 358} {"train_loss": -18.95564079284668, "global_step": 29764, "epoch": 358} {"train_loss": -18.58394432067871, "global_step": 29765, "epoch": 358} {"train_loss": -18.933364868164062, "global_step": 29766, "epoch": 358} {"train_loss": -19.054691314697266, "global_step": 29767, "epoch": 358} {"train_loss": -18.852750778198242, "global_step": 29768, "epoch": 358} {"train_loss": -18.69312286376953, "global_step": 29769, "epoch": 358} {"train_loss": -19.10719871520996, "global_step": 29770, "epoch": 358} {"train_loss": -19.05220603942871, "global_step": 29771, "epoch": 358} {"train_loss": -18.90181541442871, "global_step": 29772, "epoch": 358} {"train_loss": -18.654556274414062, "global_step": 29773, "epoch": 358} {"train_loss": -19.139873504638672, "global_step": 29774, "epoch": 358} {"train_loss": -18.61600112915039, "global_step": 29775, "epoch": 358} {"train_loss": -18.70807456970215, "global_step": 29776, "epoch": 358} {"train_loss": -18.97187042236328, "global_step": 29777, "epoch": 358} {"train_loss": -18.812284469604492, "global_step": 29778, "epoch": 358} {"train_loss": -18.791715621948242, "global_step": 29779, "epoch": 358} {"train_loss": -19.30169105529785, "global_step": 29780, "epoch": 358} {"train_loss": -19.2032413482666, "global_step": 29781, "epoch": 358} {"train_loss": -19.145809173583984, "global_step": 29782, "epoch": 358} {"train_loss": -18.863271713256836, "global_step": 29783, "epoch": 358} {"train_loss": -18.851139068603516, "global_step": 29784, "epoch": 358} {"train_loss": -18.9266300201416, "global_step": 29785, "epoch": 358} {"train_loss": -18.83519172668457, "global_step": 29786, "epoch": 358} {"train_loss": -18.910568237304688, "global_step": 29787, "epoch": 358} {"train_loss": -19.109935760498047, "global_step": 29788, "epoch": 358} {"train_loss": -19.102569580078125, "global_step": 29789, "epoch": 358} {"train_loss": -19.185489654541016, "global_step": 29790, "epoch": 358} {"train_loss": -18.726627349853516, "global_step": 29791, "epoch": 358} {"train_loss": -18.963531494140625, "global_step": 29792, "epoch": 358} {"train_loss": -18.493881225585938, "global_step": 29793, "epoch": 358} {"train_loss": -18.855138778686523, "global_step": 29794, "epoch": 358} {"train_loss": -18.41615867614746, "global_step": 29795, "epoch": 358} {"train_loss": -18.914779042623127, "global_step": 29796, "epoch": 358, "val_loss": 5968230.0} {"train_loss": -18.365018844604492, "global_step": 29797, "epoch": 359} {"train_loss": -18.8104190826416, "global_step": 29798, "epoch": 359} {"train_loss": -18.693212509155273, "global_step": 29799, "epoch": 359} {"train_loss": -19.049762725830078, "global_step": 29800, "epoch": 359} {"train_loss": -19.488767623901367, "global_step": 29801, "epoch": 359} {"train_loss": -18.935510635375977, "global_step": 29802, "epoch": 359} {"train_loss": -19.027650833129883, "global_step": 29803, "epoch": 359} {"train_loss": -18.602481842041016, "global_step": 29804, "epoch": 359} {"train_loss": -19.06816291809082, "global_step": 29805, "epoch": 359} {"train_loss": -19.391529083251953, "global_step": 29806, "epoch": 359} {"train_loss": -18.712940216064453, "global_step": 29807, "epoch": 359} {"train_loss": -19.171232223510742, "global_step": 29808, "epoch": 359} {"train_loss": -18.757465362548828, "global_step": 29809, "epoch": 359} {"train_loss": -18.965778350830078, "global_step": 29810, "epoch": 359} {"train_loss": -19.392446517944336, "global_step": 29811, "epoch": 359} {"train_loss": -18.957012176513672, "global_step": 29812, "epoch": 359} {"train_loss": -19.005319595336914, "global_step": 29813, "epoch": 359} {"train_loss": -18.929000854492188, "global_step": 29814, "epoch": 359} {"train_loss": -19.170244216918945, "global_step": 29815, "epoch": 359} {"train_loss": -18.596948623657227, "global_step": 29816, "epoch": 359} {"train_loss": -18.762714385986328, "global_step": 29817, "epoch": 359} {"train_loss": -19.17267417907715, "global_step": 29818, "epoch": 359} {"train_loss": -18.707107543945312, "global_step": 29819, "epoch": 359} {"train_loss": -19.14101219177246, "global_step": 29820, "epoch": 359} {"train_loss": -19.00101661682129, "global_step": 29821, "epoch": 359} {"train_loss": -18.961339950561523, "global_step": 29822, "epoch": 359} {"train_loss": -18.608999252319336, "global_step": 29823, "epoch": 359} {"train_loss": -18.66969871520996, "global_step": 29824, "epoch": 359} {"train_loss": -19.16585350036621, "global_step": 29825, "epoch": 359} {"train_loss": -18.495542526245117, "global_step": 29826, "epoch": 359} {"train_loss": -18.582530975341797, "global_step": 29827, "epoch": 359} {"train_loss": -19.045103073120117, "global_step": 29828, "epoch": 359} {"train_loss": -18.5662899017334, "global_step": 29829, "epoch": 359} {"train_loss": -19.151493072509766, "global_step": 29830, "epoch": 359} {"train_loss": -18.958627700805664, "global_step": 29831, "epoch": 359} {"train_loss": -19.071094512939453, "global_step": 29832, "epoch": 359} {"train_loss": -18.767196655273438, "global_step": 29833, "epoch": 359} {"train_loss": -19.07098388671875, "global_step": 29834, "epoch": 359} {"train_loss": -18.671518325805664, "global_step": 29835, "epoch": 359} {"train_loss": -18.793745040893555, "global_step": 29836, "epoch": 359} {"train_loss": -18.8593807220459, "global_step": 29837, "epoch": 359} {"train_loss": -18.98206901550293, "global_step": 29838, "epoch": 359} {"train_loss": -18.687904357910156, "global_step": 29839, "epoch": 359} {"train_loss": -18.607898712158203, "global_step": 29840, "epoch": 359} {"train_loss": -18.567861557006836, "global_step": 29841, "epoch": 359} {"train_loss": -19.097599029541016, "global_step": 29842, "epoch": 359} {"train_loss": -19.28693962097168, "global_step": 29843, "epoch": 359} {"train_loss": -18.94501304626465, "global_step": 29844, "epoch": 359} {"train_loss": -19.139862060546875, "global_step": 29845, "epoch": 359} {"train_loss": -18.626480102539062, "global_step": 29846, "epoch": 359} {"train_loss": -18.619558334350586, "global_step": 29847, "epoch": 359} {"train_loss": -18.780853271484375, "global_step": 29848, "epoch": 359} {"train_loss": -18.473285675048828, "global_step": 29849, "epoch": 359} {"train_loss": -18.923276901245117, "global_step": 29850, "epoch": 359} {"train_loss": -18.92982292175293, "global_step": 29851, "epoch": 359} {"train_loss": -19.064062118530273, "global_step": 29852, "epoch": 359} {"train_loss": -19.385677337646484, "global_step": 29853, "epoch": 359} {"train_loss": -19.128555297851562, "global_step": 29854, "epoch": 359} {"train_loss": -18.96148681640625, "global_step": 29855, "epoch": 359} {"train_loss": -18.640817642211914, "global_step": 29856, "epoch": 359} {"train_loss": -19.075590133666992, "global_step": 29857, "epoch": 359} {"train_loss": -19.158639907836914, "global_step": 29858, "epoch": 359} {"train_loss": -18.620288848876953, "global_step": 29859, "epoch": 359} {"train_loss": -18.706836700439453, "global_step": 29860, "epoch": 359} {"train_loss": -19.35504722595215, "global_step": 29861, "epoch": 359} {"train_loss": -19.090871810913086, "global_step": 29862, "epoch": 359} {"train_loss": -19.027524948120117, "global_step": 29863, "epoch": 359} {"train_loss": -18.579294204711914, "global_step": 29864, "epoch": 359} {"train_loss": -18.836427688598633, "global_step": 29865, "epoch": 359} {"train_loss": -18.80343246459961, "global_step": 29866, "epoch": 359} {"train_loss": -18.741159439086914, "global_step": 29867, "epoch": 359} {"train_loss": -18.64387321472168, "global_step": 29868, "epoch": 359} {"train_loss": -19.069976806640625, "global_step": 29869, "epoch": 359} {"train_loss": -19.114215850830078, "global_step": 29870, "epoch": 359} {"train_loss": -18.82283592224121, "global_step": 29871, "epoch": 359} {"train_loss": -18.954809188842773, "global_step": 29872, "epoch": 359} {"train_loss": -18.505468368530273, "global_step": 29873, "epoch": 359} {"train_loss": -18.84456443786621, "global_step": 29874, "epoch": 359} {"train_loss": -18.743925094604492, "global_step": 29875, "epoch": 359} {"train_loss": -19.309263229370117, "global_step": 29876, "epoch": 359} {"train_loss": -18.78167152404785, "global_step": 29877, "epoch": 359} {"train_loss": -18.861867904663086, "global_step": 29878, "epoch": 359} {"train_loss": -18.892046939895813, "global_step": 29879, "epoch": 359, "val_loss": 5995342.0} {"train_loss": -18.720813751220703, "global_step": 29880, "epoch": 360} {"train_loss": -18.50481605529785, "global_step": 29881, "epoch": 360} {"train_loss": -19.002988815307617, "global_step": 29882, "epoch": 360} {"train_loss": -18.576353073120117, "global_step": 29883, "epoch": 360} {"train_loss": -19.180322647094727, "global_step": 29884, "epoch": 360} {"train_loss": -18.595975875854492, "global_step": 29885, "epoch": 360} {"train_loss": -19.0786190032959, "global_step": 29886, "epoch": 360} {"train_loss": -18.629526138305664, "global_step": 29887, "epoch": 360} {"train_loss": -18.53897476196289, "global_step": 29888, "epoch": 360} {"train_loss": -19.22136116027832, "global_step": 29889, "epoch": 360} {"train_loss": -18.513940811157227, "global_step": 29890, "epoch": 360} {"train_loss": -18.706525802612305, "global_step": 29891, "epoch": 360} {"train_loss": -18.77030372619629, "global_step": 29892, "epoch": 360} {"train_loss": -18.59638023376465, "global_step": 29893, "epoch": 360} {"train_loss": -18.759525299072266, "global_step": 29894, "epoch": 360} {"train_loss": -18.819883346557617, "global_step": 29895, "epoch": 360} {"train_loss": -19.140806198120117, "global_step": 29896, "epoch": 360} {"train_loss": -18.84111976623535, "global_step": 29897, "epoch": 360} {"train_loss": -19.339345932006836, "global_step": 29898, "epoch": 360} {"train_loss": -19.058977127075195, "global_step": 29899, "epoch": 360} {"train_loss": -19.1155948638916, "global_step": 29900, "epoch": 360} {"train_loss": -19.153690338134766, "global_step": 29901, "epoch": 360} {"train_loss": -18.7937068939209, "global_step": 29902, "epoch": 360} {"train_loss": -19.0003662109375, "global_step": 29903, "epoch": 360} {"train_loss": -19.01578712463379, "global_step": 29904, "epoch": 360} {"train_loss": -18.96320152282715, "global_step": 29905, "epoch": 360} {"train_loss": -18.826465606689453, "global_step": 29906, "epoch": 360} {"train_loss": -19.075448989868164, "global_step": 29907, "epoch": 360} {"train_loss": -18.942426681518555, "global_step": 29908, "epoch": 360} {"train_loss": -18.888328552246094, "global_step": 29909, "epoch": 360} {"train_loss": -18.944639205932617, "global_step": 29910, "epoch": 360} {"train_loss": -19.347179412841797, "global_step": 29911, "epoch": 360} {"train_loss": -18.888029098510742, "global_step": 29912, "epoch": 360} {"train_loss": -19.0150089263916, "global_step": 29913, "epoch": 360} {"train_loss": -18.999143600463867, "global_step": 29914, "epoch": 360} {"train_loss": -18.90718650817871, "global_step": 29915, "epoch": 360} {"train_loss": -19.085432052612305, "global_step": 29916, "epoch": 360} {"train_loss": -18.792903900146484, "global_step": 29917, "epoch": 360} {"train_loss": -19.10638999938965, "global_step": 29918, "epoch": 360} {"train_loss": -18.797082901000977, "global_step": 29919, "epoch": 360} {"train_loss": -19.01605796813965, "global_step": 29920, "epoch": 360} {"train_loss": -18.856908798217773, "global_step": 29921, "epoch": 360} {"train_loss": -18.791906356811523, "global_step": 29922, "epoch": 360} {"train_loss": -19.469287872314453, "global_step": 29923, "epoch": 360} {"train_loss": -19.078168869018555, "global_step": 29924, "epoch": 360} {"train_loss": -18.49713134765625, "global_step": 29925, "epoch": 360} {"train_loss": -19.13239097595215, "global_step": 29926, "epoch": 360} {"train_loss": -18.827199935913086, "global_step": 29927, "epoch": 360} {"train_loss": -19.15217399597168, "global_step": 29928, "epoch": 360} {"train_loss": -18.944847106933594, "global_step": 29929, "epoch": 360} {"train_loss": -18.797637939453125, "global_step": 29930, "epoch": 360} {"train_loss": -18.583730697631836, "global_step": 29931, "epoch": 360} {"train_loss": -18.867446899414062, "global_step": 29932, "epoch": 360} {"train_loss": -18.901453018188477, "global_step": 29933, "epoch": 360} {"train_loss": -19.333494186401367, "global_step": 29934, "epoch": 360} {"train_loss": -18.931652069091797, "global_step": 29935, "epoch": 360} {"train_loss": -18.97355842590332, "global_step": 29936, "epoch": 360} {"train_loss": -19.125137329101562, "global_step": 29937, "epoch": 360} {"train_loss": -18.975238800048828, "global_step": 29938, "epoch": 360} {"train_loss": -18.744369506835938, "global_step": 29939, "epoch": 360} {"train_loss": -18.913711547851562, "global_step": 29940, "epoch": 360} {"train_loss": -18.91981315612793, "global_step": 29941, "epoch": 360} {"train_loss": -19.010732650756836, "global_step": 29942, "epoch": 360} {"train_loss": -19.209409713745117, "global_step": 29943, "epoch": 360} {"train_loss": -18.970346450805664, "global_step": 29944, "epoch": 360} {"train_loss": -19.171934127807617, "global_step": 29945, "epoch": 360} {"train_loss": -18.82736587524414, "global_step": 29946, "epoch": 360} {"train_loss": -18.591115951538086, "global_step": 29947, "epoch": 360} {"train_loss": -19.016077041625977, "global_step": 29948, "epoch": 360} {"train_loss": -18.725128173828125, "global_step": 29949, "epoch": 360} {"train_loss": -18.609983444213867, "global_step": 29950, "epoch": 360} {"train_loss": -19.241804122924805, "global_step": 29951, "epoch": 360} {"train_loss": -19.03523826599121, "global_step": 29952, "epoch": 360} {"train_loss": -18.58515739440918, "global_step": 29953, "epoch": 360} {"train_loss": -18.92934226989746, "global_step": 29954, "epoch": 360} {"train_loss": -18.90723991394043, "global_step": 29955, "epoch": 360} {"train_loss": -18.71132469177246, "global_step": 29956, "epoch": 360} {"train_loss": -18.839527130126953, "global_step": 29957, "epoch": 360} {"train_loss": -18.65374755859375, "global_step": 29958, "epoch": 360} {"train_loss": -18.55695915222168, "global_step": 29959, "epoch": 360} {"train_loss": -18.824148178100586, "global_step": 29960, "epoch": 360} {"train_loss": -18.938268661499023, "global_step": 29961, "epoch": 360} {"train_loss": -18.91454145132777, "global_step": 29962, "epoch": 360, "val_loss": 5883839.5} {"train_loss": -18.6003360748291, "global_step": 29963, "epoch": 361} {"train_loss": -18.800661087036133, "global_step": 29964, "epoch": 361} {"train_loss": -19.00745964050293, "global_step": 29965, "epoch": 361} {"train_loss": -18.78223419189453, "global_step": 29966, "epoch": 361} {"train_loss": -19.042644500732422, "global_step": 29967, "epoch": 361} {"train_loss": -18.840375900268555, "global_step": 29968, "epoch": 361} {"train_loss": -19.222219467163086, "global_step": 29969, "epoch": 361} {"train_loss": -19.021116256713867, "global_step": 29970, "epoch": 361} {"train_loss": -18.504467010498047, "global_step": 29971, "epoch": 361} {"train_loss": -18.892078399658203, "global_step": 29972, "epoch": 361} {"train_loss": -18.950546264648438, "global_step": 29973, "epoch": 361} {"train_loss": -19.080400466918945, "global_step": 29974, "epoch": 361} {"train_loss": -18.806961059570312, "global_step": 29975, "epoch": 361} {"train_loss": -18.80232048034668, "global_step": 29976, "epoch": 361} {"train_loss": -18.878768920898438, "global_step": 29977, "epoch": 361} {"train_loss": -18.869674682617188, "global_step": 29978, "epoch": 361} {"train_loss": -19.02309799194336, "global_step": 29979, "epoch": 361} {"train_loss": -19.047508239746094, "global_step": 29980, "epoch": 361} {"train_loss": -18.936811447143555, "global_step": 29981, "epoch": 361} {"train_loss": -18.730270385742188, "global_step": 29982, "epoch": 361} {"train_loss": -19.150449752807617, "global_step": 29983, "epoch": 361} {"train_loss": -18.95659637451172, "global_step": 29984, "epoch": 361} {"train_loss": -18.90473747253418, "global_step": 29985, "epoch": 361} {"train_loss": -19.07686424255371, "global_step": 29986, "epoch": 361} {"train_loss": -19.256078720092773, "global_step": 29987, "epoch": 361} {"train_loss": -19.026660919189453, "global_step": 29988, "epoch": 361} {"train_loss": -19.39029312133789, "global_step": 29989, "epoch": 361} {"train_loss": -18.895360946655273, "global_step": 29990, "epoch": 361} {"train_loss": -19.123613357543945, "global_step": 29991, "epoch": 361} {"train_loss": -19.193723678588867, "global_step": 29992, "epoch": 361} {"train_loss": -18.782920837402344, "global_step": 29993, "epoch": 361} {"train_loss": -19.024702072143555, "global_step": 29994, "epoch": 361} {"train_loss": -18.765239715576172, "global_step": 29995, "epoch": 361} {"train_loss": -18.787044525146484, "global_step": 29996, "epoch": 361} {"train_loss": -18.873849868774414, "global_step": 29997, "epoch": 361} {"train_loss": -19.034826278686523, "global_step": 29998, "epoch": 361} {"train_loss": -18.391202926635742, "global_step": 29999, "epoch": 361} {"train_loss": -18.90404510498047, "global_step": 30000, "epoch": 361} {"train_loss": -18.9162540435791, "global_step": 30001, "epoch": 361} {"train_loss": -19.3906192779541, "global_step": 30002, "epoch": 361} {"train_loss": -19.260488510131836, "global_step": 30003, "epoch": 361} {"train_loss": -18.719650268554688, "global_step": 30004, "epoch": 361} {"train_loss": -18.74833106994629, "global_step": 30005, "epoch": 361} {"train_loss": -19.19083595275879, "global_step": 30006, "epoch": 361} {"train_loss": -18.640161514282227, "global_step": 30007, "epoch": 361} {"train_loss": -19.306503295898438, "global_step": 30008, "epoch": 361} {"train_loss": -18.898977279663086, "global_step": 30009, "epoch": 361} {"train_loss": -18.903547286987305, "global_step": 30010, "epoch": 361} {"train_loss": -18.58273696899414, "global_step": 30011, "epoch": 361} {"train_loss": -19.108304977416992, "global_step": 30012, "epoch": 361} {"train_loss": -18.561908721923828, "global_step": 30013, "epoch": 361} {"train_loss": -18.52119255065918, "global_step": 30014, "epoch": 361} {"train_loss": -19.133480072021484, "global_step": 30015, "epoch": 361} {"train_loss": -19.133197784423828, "global_step": 30016, "epoch": 361} {"train_loss": -19.190338134765625, "global_step": 30017, "epoch": 361} {"train_loss": -19.294719696044922, "global_step": 30018, "epoch": 361} {"train_loss": -18.960880279541016, "global_step": 30019, "epoch": 361} {"train_loss": -18.840763092041016, "global_step": 30020, "epoch": 361} {"train_loss": -18.97486114501953, "global_step": 30021, "epoch": 361} {"train_loss": -18.76496696472168, "global_step": 30022, "epoch": 361} {"train_loss": -19.1265926361084, "global_step": 30023, "epoch": 361} {"train_loss": -18.946157455444336, "global_step": 30024, "epoch": 361} {"train_loss": -19.085529327392578, "global_step": 30025, "epoch": 361} {"train_loss": -18.616731643676758, "global_step": 30026, "epoch": 361} {"train_loss": -19.005189895629883, "global_step": 30027, "epoch": 361} {"train_loss": -19.106786727905273, "global_step": 30028, "epoch": 361} {"train_loss": -19.274023056030273, "global_step": 30029, "epoch": 361} {"train_loss": -19.079679489135742, "global_step": 30030, "epoch": 361} {"train_loss": -18.863292694091797, "global_step": 30031, "epoch": 361} {"train_loss": -18.846384048461914, "global_step": 30032, "epoch": 361} {"train_loss": -18.69953727722168, "global_step": 30033, "epoch": 361} {"train_loss": -19.391742706298828, "global_step": 30034, "epoch": 361} {"train_loss": -18.639135360717773, "global_step": 30035, "epoch": 361} {"train_loss": -18.71320152282715, "global_step": 30036, "epoch": 361} {"train_loss": -18.60797119140625, "global_step": 30037, "epoch": 361} {"train_loss": -18.89484977722168, "global_step": 30038, "epoch": 361} {"train_loss": -19.250776290893555, "global_step": 30039, "epoch": 361} {"train_loss": -19.0835018157959, "global_step": 30040, "epoch": 361} {"train_loss": -19.394739151000977, "global_step": 30041, "epoch": 361} {"train_loss": -19.01068687438965, "global_step": 30042, "epoch": 361} {"train_loss": -18.909870147705078, "global_step": 30043, "epoch": 361} {"train_loss": -18.519580841064453, "global_step": 30044, "epoch": 361} {"train_loss": -18.935738368206714, "global_step": 30045, "epoch": 361, "val_loss": 6041861.5} {"train_loss": -18.74690818786621, "global_step": 30046, "epoch": 362} {"train_loss": -18.539182662963867, "global_step": 30047, "epoch": 362} {"train_loss": -18.875829696655273, "global_step": 30048, "epoch": 362} {"train_loss": -18.992908477783203, "global_step": 30049, "epoch": 362} {"train_loss": -18.656024932861328, "global_step": 30050, "epoch": 362} {"train_loss": -18.65106773376465, "global_step": 30051, "epoch": 362} {"train_loss": -19.24725341796875, "global_step": 30052, "epoch": 362} {"train_loss": -18.85172462463379, "global_step": 30053, "epoch": 362} {"train_loss": -19.022077560424805, "global_step": 30054, "epoch": 362} {"train_loss": -18.963714599609375, "global_step": 30055, "epoch": 362} {"train_loss": -19.06709861755371, "global_step": 30056, "epoch": 362} {"train_loss": -18.62355613708496, "global_step": 30057, "epoch": 362} {"train_loss": -18.986942291259766, "global_step": 30058, "epoch": 362} {"train_loss": -18.973243713378906, "global_step": 30059, "epoch": 362} {"train_loss": -18.53185272216797, "global_step": 30060, "epoch": 362} {"train_loss": -18.579504013061523, "global_step": 30061, "epoch": 362} {"train_loss": -19.04460334777832, "global_step": 30062, "epoch": 362} {"train_loss": -18.442373275756836, "global_step": 30063, "epoch": 362} {"train_loss": -18.92548179626465, "global_step": 30064, "epoch": 362} {"train_loss": -18.63504409790039, "global_step": 30065, "epoch": 362} {"train_loss": -19.078903198242188, "global_step": 30066, "epoch": 362} {"train_loss": -19.112770080566406, "global_step": 30067, "epoch": 362} {"train_loss": -18.930845260620117, "global_step": 30068, "epoch": 362} {"train_loss": -19.130788803100586, "global_step": 30069, "epoch": 362} {"train_loss": -18.93195915222168, "global_step": 30070, "epoch": 362} {"train_loss": -18.99845314025879, "global_step": 30071, "epoch": 362} {"train_loss": -19.000717163085938, "global_step": 30072, "epoch": 362} {"train_loss": -19.04115104675293, "global_step": 30073, "epoch": 362} {"train_loss": -18.755117416381836, "global_step": 30074, "epoch": 362} {"train_loss": -18.7404727935791, "global_step": 30075, "epoch": 362} {"train_loss": -19.239089965820312, "global_step": 30076, "epoch": 362} {"train_loss": -18.88347625732422, "global_step": 30077, "epoch": 362} {"train_loss": -18.799015045166016, "global_step": 30078, "epoch": 362} {"train_loss": -18.886091232299805, "global_step": 30079, "epoch": 362} {"train_loss": -18.966278076171875, "global_step": 30080, "epoch": 362} {"train_loss": -18.790973663330078, "global_step": 30081, "epoch": 362} {"train_loss": -19.42633056640625, "global_step": 30082, "epoch": 362} {"train_loss": -18.534692764282227, "global_step": 30083, "epoch": 362} {"train_loss": -19.141271591186523, "global_step": 30084, "epoch": 362} {"train_loss": -18.96834373474121, "global_step": 30085, "epoch": 362} {"train_loss": -18.715513229370117, "global_step": 30086, "epoch": 362} {"train_loss": -19.316814422607422, "global_step": 30087, "epoch": 362} {"train_loss": -18.945880889892578, "global_step": 30088, "epoch": 362} {"train_loss": -19.07950782775879, "global_step": 30089, "epoch": 362} {"train_loss": -19.167551040649414, "global_step": 30090, "epoch": 362} {"train_loss": -18.69806480407715, "global_step": 30091, "epoch": 362} {"train_loss": -19.10689353942871, "global_step": 30092, "epoch": 362} {"train_loss": -18.78815269470215, "global_step": 30093, "epoch": 362} {"train_loss": -18.709745407104492, "global_step": 30094, "epoch": 362} {"train_loss": -19.290807723999023, "global_step": 30095, "epoch": 362} {"train_loss": -19.058271408081055, "global_step": 30096, "epoch": 362} {"train_loss": -19.05060577392578, "global_step": 30097, "epoch": 362} {"train_loss": -19.064403533935547, "global_step": 30098, "epoch": 362} {"train_loss": -19.159948348999023, "global_step": 30099, "epoch": 362} {"train_loss": -19.30620765686035, "global_step": 30100, "epoch": 362} {"train_loss": -19.12495231628418, "global_step": 30101, "epoch": 362} {"train_loss": -19.388784408569336, "global_step": 30102, "epoch": 362} {"train_loss": -18.64664649963379, "global_step": 30103, "epoch": 362} {"train_loss": -19.0440616607666, "global_step": 30104, "epoch": 362} {"train_loss": -19.081342697143555, "global_step": 30105, "epoch": 362} {"train_loss": -18.963735580444336, "global_step": 30106, "epoch": 362} {"train_loss": -19.095077514648438, "global_step": 30107, "epoch": 362} {"train_loss": -18.923120498657227, "global_step": 30108, "epoch": 362} {"train_loss": -18.877527236938477, "global_step": 30109, "epoch": 362} {"train_loss": -18.803909301757812, "global_step": 30110, "epoch": 362} {"train_loss": -18.9486141204834, "global_step": 30111, "epoch": 362} {"train_loss": -18.899221420288086, "global_step": 30112, "epoch": 362} {"train_loss": -19.022113800048828, "global_step": 30113, "epoch": 362} {"train_loss": -18.772171020507812, "global_step": 30114, "epoch": 362} {"train_loss": -18.682886123657227, "global_step": 30115, "epoch": 362} {"train_loss": -18.675601959228516, "global_step": 30116, "epoch": 362} {"train_loss": -18.749780654907227, "global_step": 30117, "epoch": 362} {"train_loss": -19.0151424407959, "global_step": 30118, "epoch": 362} {"train_loss": -18.8669490814209, "global_step": 30119, "epoch": 362} {"train_loss": -18.83216667175293, "global_step": 30120, "epoch": 362} {"train_loss": -19.057798385620117, "global_step": 30121, "epoch": 362} {"train_loss": -18.86655616760254, "global_step": 30122, "epoch": 362} {"train_loss": -19.26104164123535, "global_step": 30123, "epoch": 362} {"train_loss": -19.14581871032715, "global_step": 30124, "epoch": 362} {"train_loss": -19.31621742248535, "global_step": 30125, "epoch": 362} {"train_loss": -18.814687728881836, "global_step": 30126, "epoch": 362} {"train_loss": -18.87430763244629, "global_step": 30127, "epoch": 362} {"train_loss": -18.946914397090314, "global_step": 30128, "epoch": 362, "val_loss": 6067946.0} {"train_loss": -18.44066619873047, "global_step": 30129, "epoch": 363} {"train_loss": -18.346586227416992, "global_step": 30130, "epoch": 363} {"train_loss": -18.867578506469727, "global_step": 30131, "epoch": 363} {"train_loss": -19.04660415649414, "global_step": 30132, "epoch": 363} {"train_loss": -18.716093063354492, "global_step": 30133, "epoch": 363} {"train_loss": -18.732467651367188, "global_step": 30134, "epoch": 363} {"train_loss": -19.022626876831055, "global_step": 30135, "epoch": 363} {"train_loss": -18.918500900268555, "global_step": 30136, "epoch": 363} {"train_loss": -18.64472007751465, "global_step": 30137, "epoch": 363} {"train_loss": -18.78670310974121, "global_step": 30138, "epoch": 363} {"train_loss": -18.647977828979492, "global_step": 30139, "epoch": 363} {"train_loss": -18.7882137298584, "global_step": 30140, "epoch": 363} {"train_loss": -18.904138565063477, "global_step": 30141, "epoch": 363} {"train_loss": -19.066303253173828, "global_step": 30142, "epoch": 363} {"train_loss": -18.991575241088867, "global_step": 30143, "epoch": 363} {"train_loss": -18.750234603881836, "global_step": 30144, "epoch": 363} {"train_loss": -18.695947647094727, "global_step": 30145, "epoch": 363} {"train_loss": -19.11405372619629, "global_step": 30146, "epoch": 363} {"train_loss": -19.131765365600586, "global_step": 30147, "epoch": 363} {"train_loss": -18.842443466186523, "global_step": 30148, "epoch": 363} {"train_loss": -18.624433517456055, "global_step": 30149, "epoch": 363} {"train_loss": -19.097614288330078, "global_step": 30150, "epoch": 363} {"train_loss": -18.735387802124023, "global_step": 30151, "epoch": 363} {"train_loss": -18.55353355407715, "global_step": 30152, "epoch": 363} {"train_loss": -18.792984008789062, "global_step": 30153, "epoch": 363} {"train_loss": -18.63254737854004, "global_step": 30154, "epoch": 363} {"train_loss": -19.01970863342285, "global_step": 30155, "epoch": 363} {"train_loss": -19.127267837524414, "global_step": 30156, "epoch": 363} {"train_loss": -18.972021102905273, "global_step": 30157, "epoch": 363} {"train_loss": -18.71890640258789, "global_step": 30158, "epoch": 363} {"train_loss": -18.790369033813477, "global_step": 30159, "epoch": 363} {"train_loss": -19.39450454711914, "global_step": 30160, "epoch": 363} {"train_loss": -19.12046241760254, "global_step": 30161, "epoch": 363} {"train_loss": -18.9294490814209, "global_step": 30162, "epoch": 363} {"train_loss": -18.82785987854004, "global_step": 30163, "epoch": 363} {"train_loss": -18.662067413330078, "global_step": 30164, "epoch": 363} {"train_loss": -18.71551513671875, "global_step": 30165, "epoch": 363} {"train_loss": -18.900671005249023, "global_step": 30166, "epoch": 363} {"train_loss": -18.76333236694336, "global_step": 30167, "epoch": 363} {"train_loss": -18.994232177734375, "global_step": 30168, "epoch": 363} {"train_loss": -18.749414443969727, "global_step": 30169, "epoch": 363} {"train_loss": -19.073436737060547, "global_step": 30170, "epoch": 363} {"train_loss": -18.91297721862793, "global_step": 30171, "epoch": 363} {"train_loss": -18.99629020690918, "global_step": 30172, "epoch": 363} {"train_loss": -19.00608253479004, "global_step": 30173, "epoch": 363} {"train_loss": -19.019155502319336, "global_step": 30174, "epoch": 363} {"train_loss": -19.212020874023438, "global_step": 30175, "epoch": 363} {"train_loss": -18.622434616088867, "global_step": 30176, "epoch": 363} {"train_loss": -18.964496612548828, "global_step": 30177, "epoch": 363} {"train_loss": -18.791000366210938, "global_step": 30178, "epoch": 363} {"train_loss": -19.304521560668945, "global_step": 30179, "epoch": 363} {"train_loss": -19.02669906616211, "global_step": 30180, "epoch": 363} {"train_loss": -19.081403732299805, "global_step": 30181, "epoch": 363} {"train_loss": -18.940000534057617, "global_step": 30182, "epoch": 363} {"train_loss": -18.871824264526367, "global_step": 30183, "epoch": 363} {"train_loss": -18.83684730529785, "global_step": 30184, "epoch": 363} {"train_loss": -18.733835220336914, "global_step": 30185, "epoch": 363} {"train_loss": -18.712282180786133, "global_step": 30186, "epoch": 363} {"train_loss": -19.080778121948242, "global_step": 30187, "epoch": 363} {"train_loss": -18.80096435546875, "global_step": 30188, "epoch": 363} {"train_loss": -19.0186824798584, "global_step": 30189, "epoch": 363} {"train_loss": -19.120359420776367, "global_step": 30190, "epoch": 363} {"train_loss": -18.523700714111328, "global_step": 30191, "epoch": 363} {"train_loss": -19.015548706054688, "global_step": 30192, "epoch": 363} {"train_loss": -18.847116470336914, "global_step": 30193, "epoch": 363} {"train_loss": -18.787490844726562, "global_step": 30194, "epoch": 363} {"train_loss": -18.914295196533203, "global_step": 30195, "epoch": 363} {"train_loss": -19.11601448059082, "global_step": 30196, "epoch": 363} {"train_loss": -19.220993041992188, "global_step": 30197, "epoch": 363} {"train_loss": -19.06110382080078, "global_step": 30198, "epoch": 363} {"train_loss": -19.040220260620117, "global_step": 30199, "epoch": 363} {"train_loss": -18.705665588378906, "global_step": 30200, "epoch": 363} {"train_loss": -19.36503028869629, "global_step": 30201, "epoch": 363} {"train_loss": -19.1323299407959, "global_step": 30202, "epoch": 363} {"train_loss": -18.750839233398438, "global_step": 30203, "epoch": 363} {"train_loss": -18.94610023498535, "global_step": 30204, "epoch": 363} {"train_loss": -19.291316986083984, "global_step": 30205, "epoch": 363} {"train_loss": -18.726530075073242, "global_step": 30206, "epoch": 363} {"train_loss": -19.12970733642578, "global_step": 30207, "epoch": 363} {"train_loss": -19.02687644958496, "global_step": 30208, "epoch": 363} {"train_loss": -19.199800491333008, "global_step": 30209, "epoch": 363} {"train_loss": -18.946805953979492, "global_step": 30210, "epoch": 363} {"train_loss": -18.90671456578266, "global_step": 30211, "epoch": 363, "val_loss": 6048360.5} {"train_loss": -18.377262115478516, "global_step": 30212, "epoch": 364} {"train_loss": -18.431997299194336, "global_step": 30213, "epoch": 364} {"train_loss": -18.68868064880371, "global_step": 30214, "epoch": 364} {"train_loss": -19.17658805847168, "global_step": 30215, "epoch": 364} {"train_loss": -18.513986587524414, "global_step": 30216, "epoch": 364} {"train_loss": -18.680652618408203, "global_step": 30217, "epoch": 364} {"train_loss": -19.10630226135254, "global_step": 30218, "epoch": 364} {"train_loss": -18.627111434936523, "global_step": 30219, "epoch": 364} {"train_loss": -18.830623626708984, "global_step": 30220, "epoch": 364} {"train_loss": -18.813968658447266, "global_step": 30221, "epoch": 364} {"train_loss": -18.547164916992188, "global_step": 30222, "epoch": 364} {"train_loss": -18.77345085144043, "global_step": 30223, "epoch": 364} {"train_loss": -18.874948501586914, "global_step": 30224, "epoch": 364} {"train_loss": -18.798831939697266, "global_step": 30225, "epoch": 364} {"train_loss": -18.498262405395508, "global_step": 30226, "epoch": 364} {"train_loss": -18.60866355895996, "global_step": 30227, "epoch": 364} {"train_loss": -19.115264892578125, "global_step": 30228, "epoch": 364} {"train_loss": -18.74452018737793, "global_step": 30229, "epoch": 364} {"train_loss": -19.05885124206543, "global_step": 30230, "epoch": 364} {"train_loss": -18.646984100341797, "global_step": 30231, "epoch": 364} {"train_loss": -18.778520584106445, "global_step": 30232, "epoch": 364} {"train_loss": -18.958213806152344, "global_step": 30233, "epoch": 364} {"train_loss": -18.832897186279297, "global_step": 30234, "epoch": 364} {"train_loss": -18.59522819519043, "global_step": 30235, "epoch": 364} {"train_loss": -19.11301040649414, "global_step": 30236, "epoch": 364} {"train_loss": -18.898780822753906, "global_step": 30237, "epoch": 364} {"train_loss": -19.009803771972656, "global_step": 30238, "epoch": 364} {"train_loss": -18.558130264282227, "global_step": 30239, "epoch": 364} {"train_loss": -19.046716690063477, "global_step": 30240, "epoch": 364} {"train_loss": -18.970102310180664, "global_step": 30241, "epoch": 364} {"train_loss": -18.928333282470703, "global_step": 30242, "epoch": 364} {"train_loss": -19.004671096801758, "global_step": 30243, "epoch": 364} {"train_loss": -19.205411911010742, "global_step": 30244, "epoch": 364} {"train_loss": -18.99847984313965, "global_step": 30245, "epoch": 364} {"train_loss": -18.992576599121094, "global_step": 30246, "epoch": 364} {"train_loss": -18.88390350341797, "global_step": 30247, "epoch": 364} {"train_loss": -18.490814208984375, "global_step": 30248, "epoch": 364} {"train_loss": -19.03822898864746, "global_step": 30249, "epoch": 364} {"train_loss": -19.048786163330078, "global_step": 30250, "epoch": 364} {"train_loss": -18.990835189819336, "global_step": 30251, "epoch": 364} {"train_loss": -18.43338394165039, "global_step": 30252, "epoch": 364} {"train_loss": -18.97368812561035, "global_step": 30253, "epoch": 364} {"train_loss": -18.8221378326416, "global_step": 30254, "epoch": 364} {"train_loss": -18.9959659576416, "global_step": 30255, "epoch": 364} {"train_loss": -18.880937576293945, "global_step": 30256, "epoch": 364} {"train_loss": -19.04914093017578, "global_step": 30257, "epoch": 364} {"train_loss": -18.812761306762695, "global_step": 30258, "epoch": 364} {"train_loss": -19.1765079498291, "global_step": 30259, "epoch": 364} {"train_loss": -19.028854370117188, "global_step": 30260, "epoch": 364} {"train_loss": -19.15785026550293, "global_step": 30261, "epoch": 364} {"train_loss": -18.96483039855957, "global_step": 30262, "epoch": 364} {"train_loss": -19.22059440612793, "global_step": 30263, "epoch": 364} {"train_loss": -18.989990234375, "global_step": 30264, "epoch": 364} {"train_loss": -18.962961196899414, "global_step": 30265, "epoch": 364} {"train_loss": -18.805070877075195, "global_step": 30266, "epoch": 364} {"train_loss": -18.81452751159668, "global_step": 30267, "epoch": 364} {"train_loss": -19.161407470703125, "global_step": 30268, "epoch": 364} {"train_loss": -18.965042114257812, "global_step": 30269, "epoch": 364} {"train_loss": -18.83817481994629, "global_step": 30270, "epoch": 364} {"train_loss": -18.507715225219727, "global_step": 30271, "epoch": 364} {"train_loss": -19.309003829956055, "global_step": 30272, "epoch": 364} {"train_loss": -18.949094772338867, "global_step": 30273, "epoch": 364} {"train_loss": -19.159021377563477, "global_step": 30274, "epoch": 364} {"train_loss": -18.969772338867188, "global_step": 30275, "epoch": 364} {"train_loss": -18.87352752685547, "global_step": 30276, "epoch": 364} {"train_loss": -19.271011352539062, "global_step": 30277, "epoch": 364} {"train_loss": -18.8370418548584, "global_step": 30278, "epoch": 364} {"train_loss": -18.851552963256836, "global_step": 30279, "epoch": 364} {"train_loss": -18.886066436767578, "global_step": 30280, "epoch": 364} {"train_loss": -18.737289428710938, "global_step": 30281, "epoch": 364} {"train_loss": -18.7019100189209, "global_step": 30282, "epoch": 364} {"train_loss": -18.946575164794922, "global_step": 30283, "epoch": 364} {"train_loss": -19.27194595336914, "global_step": 30284, "epoch": 364} {"train_loss": -19.293909072875977, "global_step": 30285, "epoch": 364} {"train_loss": -18.998220443725586, "global_step": 30286, "epoch": 364} {"train_loss": -19.06840705871582, "global_step": 30287, "epoch": 364} {"train_loss": -18.678054809570312, "global_step": 30288, "epoch": 364} {"train_loss": -18.971837997436523, "global_step": 30289, "epoch": 364} {"train_loss": -19.27139663696289, "global_step": 30290, "epoch": 364} {"train_loss": -18.356204986572266, "global_step": 30291, "epoch": 364} {"train_loss": -18.978076934814453, "global_step": 30292, "epoch": 364} {"train_loss": -19.12933349609375, "global_step": 30293, "epoch": 364} {"train_loss": -18.89539265919881, "global_step": 30294, "epoch": 364, "val_loss": 5967052.0} {"train_loss": -18.924917221069336, "global_step": 30295, "epoch": 365} {"train_loss": -18.8321590423584, "global_step": 30296, "epoch": 365} {"train_loss": -19.290786743164062, "global_step": 30297, "epoch": 365} {"train_loss": -19.195844650268555, "global_step": 30298, "epoch": 365} {"train_loss": -19.299118041992188, "global_step": 30299, "epoch": 365} {"train_loss": -19.004608154296875, "global_step": 30300, "epoch": 365} {"train_loss": -18.98855972290039, "global_step": 30301, "epoch": 365} {"train_loss": -19.09369659423828, "global_step": 30302, "epoch": 365} {"train_loss": -19.303123474121094, "global_step": 30303, "epoch": 365} {"train_loss": -19.125898361206055, "global_step": 30304, "epoch": 365} {"train_loss": -19.30865478515625, "global_step": 30305, "epoch": 365} {"train_loss": -18.64007568359375, "global_step": 30306, "epoch": 365} {"train_loss": -18.999963760375977, "global_step": 30307, "epoch": 365} {"train_loss": -18.431676864624023, "global_step": 30308, "epoch": 365} {"train_loss": -18.765504837036133, "global_step": 30309, "epoch": 365} {"train_loss": -19.111066818237305, "global_step": 30310, "epoch": 365} {"train_loss": -18.92299461364746, "global_step": 30311, "epoch": 365} {"train_loss": -19.18036460876465, "global_step": 30312, "epoch": 365} {"train_loss": -19.24140739440918, "global_step": 30313, "epoch": 365} {"train_loss": -18.926679611206055, "global_step": 30314, "epoch": 365} {"train_loss": -19.21700096130371, "global_step": 30315, "epoch": 365} {"train_loss": -19.09148406982422, "global_step": 30316, "epoch": 365} {"train_loss": -18.93490982055664, "global_step": 30317, "epoch": 365} {"train_loss": -19.039321899414062, "global_step": 30318, "epoch": 365} {"train_loss": -19.2706241607666, "global_step": 30319, "epoch": 365} {"train_loss": -18.816896438598633, "global_step": 30320, "epoch": 365} {"train_loss": -18.847740173339844, "global_step": 30321, "epoch": 365} {"train_loss": -19.17879867553711, "global_step": 30322, "epoch": 365} {"train_loss": -19.25242805480957, "global_step": 30323, "epoch": 365} {"train_loss": -19.324939727783203, "global_step": 30324, "epoch": 365} {"train_loss": -18.846799850463867, "global_step": 30325, "epoch": 365} {"train_loss": -18.60776710510254, "global_step": 30326, "epoch": 365} {"train_loss": -18.747417449951172, "global_step": 30327, "epoch": 365} {"train_loss": -18.789926528930664, "global_step": 30328, "epoch": 365} {"train_loss": -18.892507553100586, "global_step": 30329, "epoch": 365} {"train_loss": -18.981306076049805, "global_step": 30330, "epoch": 365} {"train_loss": -19.031721115112305, "global_step": 30331, "epoch": 365} {"train_loss": -18.71318817138672, "global_step": 30332, "epoch": 365} {"train_loss": -18.50417137145996, "global_step": 30333, "epoch": 365} {"train_loss": -18.86496925354004, "global_step": 30334, "epoch": 365} {"train_loss": -19.00197982788086, "global_step": 30335, "epoch": 365} {"train_loss": -18.974838256835938, "global_step": 30336, "epoch": 365} {"train_loss": -18.877607345581055, "global_step": 30337, "epoch": 365} {"train_loss": -18.87077522277832, "global_step": 30338, "epoch": 365} {"train_loss": -19.07972526550293, "global_step": 30339, "epoch": 365} {"train_loss": -18.985431671142578, "global_step": 30340, "epoch": 365} {"train_loss": -19.092811584472656, "global_step": 30341, "epoch": 365} {"train_loss": -18.997587203979492, "global_step": 30342, "epoch": 365} {"train_loss": -18.792768478393555, "global_step": 30343, "epoch": 365} {"train_loss": -18.758319854736328, "global_step": 30344, "epoch": 365} {"train_loss": -18.564720153808594, "global_step": 30345, "epoch": 365} {"train_loss": -18.956144332885742, "global_step": 30346, "epoch": 365} {"train_loss": -19.166946411132812, "global_step": 30347, "epoch": 365} {"train_loss": -19.050111770629883, "global_step": 30348, "epoch": 365} {"train_loss": -19.384048461914062, "global_step": 30349, "epoch": 365} {"train_loss": -18.740251541137695, "global_step": 30350, "epoch": 365} {"train_loss": -18.780826568603516, "global_step": 30351, "epoch": 365} {"train_loss": -18.95049476623535, "global_step": 30352, "epoch": 365} {"train_loss": -18.722745895385742, "global_step": 30353, "epoch": 365} {"train_loss": -18.924238204956055, "global_step": 30354, "epoch": 365} {"train_loss": -19.056446075439453, "global_step": 30355, "epoch": 365} {"train_loss": -18.854034423828125, "global_step": 30356, "epoch": 365} {"train_loss": -19.088077545166016, "global_step": 30357, "epoch": 365} {"train_loss": -18.725221633911133, "global_step": 30358, "epoch": 365} {"train_loss": -19.1502685546875, "global_step": 30359, "epoch": 365} {"train_loss": -18.89214515686035, "global_step": 30360, "epoch": 365} {"train_loss": -18.979345321655273, "global_step": 30361, "epoch": 365} {"train_loss": -18.862390518188477, "global_step": 30362, "epoch": 365} {"train_loss": -18.969627380371094, "global_step": 30363, "epoch": 365} {"train_loss": -19.187381744384766, "global_step": 30364, "epoch": 365} {"train_loss": -19.15992546081543, "global_step": 30365, "epoch": 365} {"train_loss": -19.46839141845703, "global_step": 30366, "epoch": 365} {"train_loss": -18.758771896362305, "global_step": 30367, "epoch": 365} {"train_loss": -18.736251831054688, "global_step": 30368, "epoch": 365} {"train_loss": -18.87775993347168, "global_step": 30369, "epoch": 365} {"train_loss": -18.546201705932617, "global_step": 30370, "epoch": 365} {"train_loss": -18.80274200439453, "global_step": 30371, "epoch": 365} {"train_loss": -18.943082809448242, "global_step": 30372, "epoch": 365} {"train_loss": -18.99942398071289, "global_step": 30373, "epoch": 365} {"train_loss": -18.974281311035156, "global_step": 30374, "epoch": 365} {"train_loss": -18.920595169067383, "global_step": 30375, "epoch": 365} {"train_loss": -18.790624618530273, "global_step": 30376, "epoch": 365} {"train_loss": -18.94479928533715, "global_step": 30377, "epoch": 365, "val_loss": 5977785.5} {"train_loss": -18.515153884887695, "global_step": 30378, "epoch": 366} {"train_loss": -18.6246395111084, "global_step": 30379, "epoch": 366} {"train_loss": -18.753202438354492, "global_step": 30380, "epoch": 366} {"train_loss": -18.82027816772461, "global_step": 30381, "epoch": 366} {"train_loss": -18.552650451660156, "global_step": 30382, "epoch": 366} {"train_loss": -18.90218734741211, "global_step": 30383, "epoch": 366} {"train_loss": -18.88157081604004, "global_step": 30384, "epoch": 366} {"train_loss": -18.64092254638672, "global_step": 30385, "epoch": 366} {"train_loss": -18.733699798583984, "global_step": 30386, "epoch": 366} {"train_loss": -19.011606216430664, "global_step": 30387, "epoch": 366} {"train_loss": -18.90894317626953, "global_step": 30388, "epoch": 366} {"train_loss": -18.768569946289062, "global_step": 30389, "epoch": 366} {"train_loss": -18.625638961791992, "global_step": 30390, "epoch": 366} {"train_loss": -19.019094467163086, "global_step": 30391, "epoch": 366} {"train_loss": -18.801088333129883, "global_step": 30392, "epoch": 366} {"train_loss": -19.214859008789062, "global_step": 30393, "epoch": 366} {"train_loss": -19.08916664123535, "global_step": 30394, "epoch": 366} {"train_loss": -18.833585739135742, "global_step": 30395, "epoch": 366} {"train_loss": -18.772581100463867, "global_step": 30396, "epoch": 366} {"train_loss": -19.20534896850586, "global_step": 30397, "epoch": 366} {"train_loss": -19.051395416259766, "global_step": 30398, "epoch": 366} {"train_loss": -18.659000396728516, "global_step": 30399, "epoch": 366} {"train_loss": -18.83805274963379, "global_step": 30400, "epoch": 366} {"train_loss": -18.921001434326172, "global_step": 30401, "epoch": 366} {"train_loss": -18.789949417114258, "global_step": 30402, "epoch": 366} {"train_loss": -19.196813583374023, "global_step": 30403, "epoch": 366} {"train_loss": -19.003955841064453, "global_step": 30404, "epoch": 366} {"train_loss": -18.901199340820312, "global_step": 30405, "epoch": 366} {"train_loss": -19.24482536315918, "global_step": 30406, "epoch": 366} {"train_loss": -19.22623062133789, "global_step": 30407, "epoch": 366} {"train_loss": -19.02292251586914, "global_step": 30408, "epoch": 366} {"train_loss": -18.70355224609375, "global_step": 30409, "epoch": 366} {"train_loss": -18.96122169494629, "global_step": 30410, "epoch": 366} {"train_loss": -19.108203887939453, "global_step": 30411, "epoch": 366} {"train_loss": -19.28147315979004, "global_step": 30412, "epoch": 366} {"train_loss": -18.652908325195312, "global_step": 30413, "epoch": 366} {"train_loss": -18.787153244018555, "global_step": 30414, "epoch": 366} {"train_loss": -19.047836303710938, "global_step": 30415, "epoch": 366} {"train_loss": -18.79622459411621, "global_step": 30416, "epoch": 366} {"train_loss": -18.61518669128418, "global_step": 30417, "epoch": 366} {"train_loss": -18.957599639892578, "global_step": 30418, "epoch": 366} {"train_loss": -19.143321990966797, "global_step": 30419, "epoch": 366} {"train_loss": -19.401138305664062, "global_step": 30420, "epoch": 366} {"train_loss": -19.043062210083008, "global_step": 30421, "epoch": 366} {"train_loss": -18.8291015625, "global_step": 30422, "epoch": 366} {"train_loss": -18.69863510131836, "global_step": 30423, "epoch": 366} {"train_loss": -18.68172264099121, "global_step": 30424, "epoch": 366} {"train_loss": -18.91023063659668, "global_step": 30425, "epoch": 366} {"train_loss": -18.660234451293945, "global_step": 30426, "epoch": 366} {"train_loss": -18.51017189025879, "global_step": 30427, "epoch": 366} {"train_loss": -18.922117233276367, "global_step": 30428, "epoch": 366} {"train_loss": -18.58160972595215, "global_step": 30429, "epoch": 366} {"train_loss": -18.900278091430664, "global_step": 30430, "epoch": 366} {"train_loss": -19.037649154663086, "global_step": 30431, "epoch": 366} {"train_loss": -19.196962356567383, "global_step": 30432, "epoch": 366} {"train_loss": -19.225704193115234, "global_step": 30433, "epoch": 366} {"train_loss": -18.689176559448242, "global_step": 30434, "epoch": 366} {"train_loss": -18.586843490600586, "global_step": 30435, "epoch": 366} {"train_loss": -19.097721099853516, "global_step": 30436, "epoch": 366} {"train_loss": -18.88134765625, "global_step": 30437, "epoch": 366} {"train_loss": -18.643680572509766, "global_step": 30438, "epoch": 366} {"train_loss": -18.571762084960938, "global_step": 30439, "epoch": 366} {"train_loss": -19.026304244995117, "global_step": 30440, "epoch": 366} {"train_loss": -19.197397232055664, "global_step": 30441, "epoch": 366} {"train_loss": -18.838891983032227, "global_step": 30442, "epoch": 366} {"train_loss": -18.362777709960938, "global_step": 30443, "epoch": 366} {"train_loss": -18.631702423095703, "global_step": 30444, "epoch": 366} {"train_loss": -18.71986961364746, "global_step": 30445, "epoch": 366} {"train_loss": -19.202451705932617, "global_step": 30446, "epoch": 366} {"train_loss": -19.15036392211914, "global_step": 30447, "epoch": 366} {"train_loss": -18.79232406616211, "global_step": 30448, "epoch": 366} {"train_loss": -19.057157516479492, "global_step": 30449, "epoch": 366} {"train_loss": -18.854724884033203, "global_step": 30450, "epoch": 366} {"train_loss": -18.676132202148438, "global_step": 30451, "epoch": 366} {"train_loss": -19.29833984375, "global_step": 30452, "epoch": 366} {"train_loss": -18.91351318359375, "global_step": 30453, "epoch": 366} {"train_loss": -18.90384292602539, "global_step": 30454, "epoch": 366} {"train_loss": -19.23781394958496, "global_step": 30455, "epoch": 366} {"train_loss": -18.967397689819336, "global_step": 30456, "epoch": 366} {"train_loss": -19.083349227905273, "global_step": 30457, "epoch": 366} {"train_loss": -18.959136962890625, "global_step": 30458, "epoch": 366} {"train_loss": -18.98487091064453, "global_step": 30459, "epoch": 366} {"train_loss": -18.893408534038496, "global_step": 30460, "epoch": 366, "val_loss": 6056634.0} {"train_loss": -18.7340145111084, "global_step": 30461, "epoch": 367} {"train_loss": -18.466978073120117, "global_step": 30462, "epoch": 367} {"train_loss": -18.586875915527344, "global_step": 30463, "epoch": 367} {"train_loss": -18.911718368530273, "global_step": 30464, "epoch": 367} {"train_loss": -18.867399215698242, "global_step": 30465, "epoch": 367} {"train_loss": -18.567005157470703, "global_step": 30466, "epoch": 367} {"train_loss": -18.535730361938477, "global_step": 30467, "epoch": 367} {"train_loss": -18.658308029174805, "global_step": 30468, "epoch": 367} {"train_loss": -19.356237411499023, "global_step": 30469, "epoch": 367} {"train_loss": -18.42762565612793, "global_step": 30470, "epoch": 367} {"train_loss": -18.76845359802246, "global_step": 30471, "epoch": 367} {"train_loss": -19.082324981689453, "global_step": 30472, "epoch": 367} {"train_loss": -18.83770751953125, "global_step": 30473, "epoch": 367} {"train_loss": -18.907350540161133, "global_step": 30474, "epoch": 367} {"train_loss": -18.255781173706055, "global_step": 30475, "epoch": 367} {"train_loss": -18.454919815063477, "global_step": 30476, "epoch": 367} {"train_loss": -18.782848358154297, "global_step": 30477, "epoch": 367} {"train_loss": -18.691640853881836, "global_step": 30478, "epoch": 367} {"train_loss": -18.865209579467773, "global_step": 30479, "epoch": 367} {"train_loss": -18.788515090942383, "global_step": 30480, "epoch": 367} {"train_loss": -19.09091567993164, "global_step": 30481, "epoch": 367} {"train_loss": -18.817485809326172, "global_step": 30482, "epoch": 367} {"train_loss": -19.128498077392578, "global_step": 30483, "epoch": 367} {"train_loss": -18.8952579498291, "global_step": 30484, "epoch": 367} {"train_loss": -18.791105270385742, "global_step": 30485, "epoch": 367} {"train_loss": -18.92139434814453, "global_step": 30486, "epoch": 367} {"train_loss": -19.284137725830078, "global_step": 30487, "epoch": 367} {"train_loss": -18.99137306213379, "global_step": 30488, "epoch": 367} {"train_loss": -18.721576690673828, "global_step": 30489, "epoch": 367} {"train_loss": -18.809385299682617, "global_step": 30490, "epoch": 367} {"train_loss": -18.84168815612793, "global_step": 30491, "epoch": 367} {"train_loss": -18.99956512451172, "global_step": 30492, "epoch": 367} {"train_loss": -18.843793869018555, "global_step": 30493, "epoch": 367} {"train_loss": -19.129465103149414, "global_step": 30494, "epoch": 367} {"train_loss": -18.992523193359375, "global_step": 30495, "epoch": 367} {"train_loss": -18.70833396911621, "global_step": 30496, "epoch": 367} {"train_loss": -18.838415145874023, "global_step": 30497, "epoch": 367} {"train_loss": -19.322864532470703, "global_step": 30498, "epoch": 367} {"train_loss": -19.318641662597656, "global_step": 30499, "epoch": 367} {"train_loss": -18.98457908630371, "global_step": 30500, "epoch": 367} {"train_loss": -19.073667526245117, "global_step": 30501, "epoch": 367} {"train_loss": -18.87628746032715, "global_step": 30502, "epoch": 367} {"train_loss": -19.167448043823242, "global_step": 30503, "epoch": 367} {"train_loss": -18.967458724975586, "global_step": 30504, "epoch": 367} {"train_loss": -19.263151168823242, "global_step": 30505, "epoch": 367} {"train_loss": -18.738021850585938, "global_step": 30506, "epoch": 367} {"train_loss": -18.8976993560791, "global_step": 30507, "epoch": 367} {"train_loss": -19.279741287231445, "global_step": 30508, "epoch": 367} {"train_loss": -18.805204391479492, "global_step": 30509, "epoch": 367} {"train_loss": -19.03693199157715, "global_step": 30510, "epoch": 367} {"train_loss": -19.136022567749023, "global_step": 30511, "epoch": 367} {"train_loss": -19.127347946166992, "global_step": 30512, "epoch": 367} {"train_loss": -18.826276779174805, "global_step": 30513, "epoch": 367} {"train_loss": -18.87370491027832, "global_step": 30514, "epoch": 367} {"train_loss": -19.2769718170166, "global_step": 30515, "epoch": 367} {"train_loss": -18.72524070739746, "global_step": 30516, "epoch": 367} {"train_loss": -19.202228546142578, "global_step": 30517, "epoch": 367} {"train_loss": -18.784406661987305, "global_step": 30518, "epoch": 367} {"train_loss": -19.23797607421875, "global_step": 30519, "epoch": 367} {"train_loss": -18.759729385375977, "global_step": 30520, "epoch": 367} {"train_loss": -19.35691261291504, "global_step": 30521, "epoch": 367} {"train_loss": -18.956863403320312, "global_step": 30522, "epoch": 367} {"train_loss": -19.175031661987305, "global_step": 30523, "epoch": 367} {"train_loss": -19.00397491455078, "global_step": 30524, "epoch": 367} {"train_loss": -18.978899002075195, "global_step": 30525, "epoch": 367} {"train_loss": -19.27498435974121, "global_step": 30526, "epoch": 367} {"train_loss": -18.781557083129883, "global_step": 30527, "epoch": 367} {"train_loss": -19.32038688659668, "global_step": 30528, "epoch": 367} {"train_loss": -19.077707290649414, "global_step": 30529, "epoch": 367} {"train_loss": -19.076749801635742, "global_step": 30530, "epoch": 367} {"train_loss": -19.151750564575195, "global_step": 30531, "epoch": 367} {"train_loss": -18.872602462768555, "global_step": 30532, "epoch": 367} {"train_loss": -18.966032028198242, "global_step": 30533, "epoch": 367} {"train_loss": -19.287004470825195, "global_step": 30534, "epoch": 367} {"train_loss": -19.3210506439209, "global_step": 30535, "epoch": 367} {"train_loss": -19.370752334594727, "global_step": 30536, "epoch": 367} {"train_loss": -19.04143714904785, "global_step": 30537, "epoch": 367} {"train_loss": -19.09585952758789, "global_step": 30538, "epoch": 367} {"train_loss": -18.51472282409668, "global_step": 30539, "epoch": 367} {"train_loss": -18.718399047851562, "global_step": 30540, "epoch": 367} {"train_loss": -19.175771713256836, "global_step": 30541, "epoch": 367} {"train_loss": -19.004323959350586, "global_step": 30542, "epoch": 367} {"train_loss": -18.942608017519294, "global_step": 30543, "epoch": 367, "val_loss": 6002889.5} {"train_loss": -18.195526123046875, "global_step": 30544, "epoch": 368} {"train_loss": -18.41657066345215, "global_step": 30545, "epoch": 368} {"train_loss": -18.85774803161621, "global_step": 30546, "epoch": 368} {"train_loss": -18.946989059448242, "global_step": 30547, "epoch": 368} {"train_loss": -18.352102279663086, "global_step": 30548, "epoch": 368} {"train_loss": -18.86568260192871, "global_step": 30549, "epoch": 368} {"train_loss": -18.84707260131836, "global_step": 30550, "epoch": 368} {"train_loss": -18.762121200561523, "global_step": 30551, "epoch": 368} {"train_loss": -18.493038177490234, "global_step": 30552, "epoch": 368} {"train_loss": -18.203245162963867, "global_step": 30553, "epoch": 368} {"train_loss": -18.959516525268555, "global_step": 30554, "epoch": 368} {"train_loss": -19.04636573791504, "global_step": 30555, "epoch": 368} {"train_loss": -18.72766876220703, "global_step": 30556, "epoch": 368} {"train_loss": -18.96038055419922, "global_step": 30557, "epoch": 368} {"train_loss": -18.797653198242188, "global_step": 30558, "epoch": 368} {"train_loss": -18.984500885009766, "global_step": 30559, "epoch": 368} {"train_loss": -19.454885482788086, "global_step": 30560, "epoch": 368} {"train_loss": -18.988418579101562, "global_step": 30561, "epoch": 368} {"train_loss": -18.63215446472168, "global_step": 30562, "epoch": 368} {"train_loss": -19.215177536010742, "global_step": 30563, "epoch": 368} {"train_loss": -18.90520668029785, "global_step": 30564, "epoch": 368} {"train_loss": -18.866455078125, "global_step": 30565, "epoch": 368} {"train_loss": -18.992115020751953, "global_step": 30566, "epoch": 368} {"train_loss": -18.850967407226562, "global_step": 30567, "epoch": 368} {"train_loss": -19.0562801361084, "global_step": 30568, "epoch": 368} {"train_loss": -18.520578384399414, "global_step": 30569, "epoch": 368} {"train_loss": -19.237302780151367, "global_step": 30570, "epoch": 368} {"train_loss": -19.05071449279785, "global_step": 30571, "epoch": 368} {"train_loss": -18.976598739624023, "global_step": 30572, "epoch": 368} {"train_loss": -18.956247329711914, "global_step": 30573, "epoch": 368} {"train_loss": -19.279720306396484, "global_step": 30574, "epoch": 368} {"train_loss": -19.036041259765625, "global_step": 30575, "epoch": 368} {"train_loss": -18.723758697509766, "global_step": 30576, "epoch": 368} {"train_loss": -18.725069046020508, "global_step": 30577, "epoch": 368} {"train_loss": -18.78895378112793, "global_step": 30578, "epoch": 368} {"train_loss": -18.812898635864258, "global_step": 30579, "epoch": 368} {"train_loss": -19.354602813720703, "global_step": 30580, "epoch": 368} {"train_loss": -19.02255630493164, "global_step": 30581, "epoch": 368} {"train_loss": -18.99610710144043, "global_step": 30582, "epoch": 368} {"train_loss": -18.874862670898438, "global_step": 30583, "epoch": 368} {"train_loss": -18.60956382751465, "global_step": 30584, "epoch": 368} {"train_loss": -19.48641014099121, "global_step": 30585, "epoch": 368} {"train_loss": -18.73200035095215, "global_step": 30586, "epoch": 368} {"train_loss": -19.240385055541992, "global_step": 30587, "epoch": 368} {"train_loss": -18.844017028808594, "global_step": 30588, "epoch": 368} {"train_loss": -19.200572967529297, "global_step": 30589, "epoch": 368} {"train_loss": -18.95718002319336, "global_step": 30590, "epoch": 368} {"train_loss": -18.913043975830078, "global_step": 30591, "epoch": 368} {"train_loss": -18.773103713989258, "global_step": 30592, "epoch": 368} {"train_loss": -19.089618682861328, "global_step": 30593, "epoch": 368} {"train_loss": -19.443479537963867, "global_step": 30594, "epoch": 368} {"train_loss": -19.072736740112305, "global_step": 30595, "epoch": 368} {"train_loss": -19.058582305908203, "global_step": 30596, "epoch": 368} {"train_loss": -19.146028518676758, "global_step": 30597, "epoch": 368} {"train_loss": -18.739301681518555, "global_step": 30598, "epoch": 368} {"train_loss": -18.799407958984375, "global_step": 30599, "epoch": 368} {"train_loss": -19.162466049194336, "global_step": 30600, "epoch": 368} {"train_loss": -19.140493392944336, "global_step": 30601, "epoch": 368} {"train_loss": -19.025121688842773, "global_step": 30602, "epoch": 368} {"train_loss": -18.90716552734375, "global_step": 30603, "epoch": 368} {"train_loss": -18.886030197143555, "global_step": 30604, "epoch": 368} {"train_loss": -19.262800216674805, "global_step": 30605, "epoch": 368} {"train_loss": -19.135364532470703, "global_step": 30606, "epoch": 368} {"train_loss": -18.96305274963379, "global_step": 30607, "epoch": 368} {"train_loss": -19.24567985534668, "global_step": 30608, "epoch": 368} {"train_loss": -18.630765914916992, "global_step": 30609, "epoch": 368} {"train_loss": -19.0756778717041, "global_step": 30610, "epoch": 368} {"train_loss": -19.225486755371094, "global_step": 30611, "epoch": 368} {"train_loss": -19.08168601989746, "global_step": 30612, "epoch": 368} {"train_loss": -18.61795425415039, "global_step": 30613, "epoch": 368} {"train_loss": -18.981229782104492, "global_step": 30614, "epoch": 368} {"train_loss": -18.853469848632812, "global_step": 30615, "epoch": 368} {"train_loss": -19.072492599487305, "global_step": 30616, "epoch": 368} {"train_loss": -19.032150268554688, "global_step": 30617, "epoch": 368} {"train_loss": -19.078121185302734, "global_step": 30618, "epoch": 368} {"train_loss": -18.6811466217041, "global_step": 30619, "epoch": 368} {"train_loss": -19.081716537475586, "global_step": 30620, "epoch": 368} {"train_loss": -19.05426597595215, "global_step": 30621, "epoch": 368} {"train_loss": -18.812841415405273, "global_step": 30622, "epoch": 368} {"train_loss": -19.01325798034668, "global_step": 30623, "epoch": 368} {"train_loss": -19.078502655029297, "global_step": 30624, "epoch": 368} {"train_loss": -19.087553024291992, "global_step": 30625, "epoch": 368} {"train_loss": -18.934018629143036, "global_step": 30626, "epoch": 368, "val_loss": 6073908.0} {"train_loss": -18.441015243530273, "global_step": 30627, "epoch": 369} {"train_loss": -18.73110008239746, "global_step": 30628, "epoch": 369} {"train_loss": -18.86177635192871, "global_step": 30629, "epoch": 369} {"train_loss": -18.65032386779785, "global_step": 30630, "epoch": 369} {"train_loss": -19.009855270385742, "global_step": 30631, "epoch": 369} {"train_loss": -18.99812889099121, "global_step": 30632, "epoch": 369} {"train_loss": -18.94459342956543, "global_step": 30633, "epoch": 369} {"train_loss": -19.073026657104492, "global_step": 30634, "epoch": 369} {"train_loss": -18.759803771972656, "global_step": 30635, "epoch": 369} {"train_loss": -18.901025772094727, "global_step": 30636, "epoch": 369} {"train_loss": -19.000473022460938, "global_step": 30637, "epoch": 369} {"train_loss": -19.078855514526367, "global_step": 30638, "epoch": 369} {"train_loss": -18.741193771362305, "global_step": 30639, "epoch": 369} {"train_loss": -18.896427154541016, "global_step": 30640, "epoch": 369} {"train_loss": -18.959508895874023, "global_step": 30641, "epoch": 369} {"train_loss": -18.91519546508789, "global_step": 30642, "epoch": 369} {"train_loss": -18.785869598388672, "global_step": 30643, "epoch": 369} {"train_loss": -18.9975643157959, "global_step": 30644, "epoch": 369} {"train_loss": -18.921064376831055, "global_step": 30645, "epoch": 369} {"train_loss": -19.194210052490234, "global_step": 30646, "epoch": 369} {"train_loss": -18.51089859008789, "global_step": 30647, "epoch": 369} {"train_loss": -19.013296127319336, "global_step": 30648, "epoch": 369} {"train_loss": -19.087665557861328, "global_step": 30649, "epoch": 369} {"train_loss": -18.711627960205078, "global_step": 30650, "epoch": 369} {"train_loss": -19.2150936126709, "global_step": 30651, "epoch": 369} {"train_loss": -18.873186111450195, "global_step": 30652, "epoch": 369} {"train_loss": -19.381790161132812, "global_step": 30653, "epoch": 369} {"train_loss": -18.443662643432617, "global_step": 30654, "epoch": 369} {"train_loss": -19.173171997070312, "global_step": 30655, "epoch": 369} {"train_loss": -19.03456687927246, "global_step": 30656, "epoch": 369} {"train_loss": -18.954334259033203, "global_step": 30657, "epoch": 369} {"train_loss": -19.05708885192871, "global_step": 30658, "epoch": 369} {"train_loss": -19.380277633666992, "global_step": 30659, "epoch": 369} {"train_loss": -18.61208724975586, "global_step": 30660, "epoch": 369} {"train_loss": -18.865324020385742, "global_step": 30661, "epoch": 369} {"train_loss": -19.142982482910156, "global_step": 30662, "epoch": 369} {"train_loss": -19.052230834960938, "global_step": 30663, "epoch": 369} {"train_loss": -19.39439582824707, "global_step": 30664, "epoch": 369} {"train_loss": -19.11423683166504, "global_step": 30665, "epoch": 369} {"train_loss": -19.10967445373535, "global_step": 30666, "epoch": 369} {"train_loss": -19.049468994140625, "global_step": 30667, "epoch": 369} {"train_loss": -18.806873321533203, "global_step": 30668, "epoch": 369} {"train_loss": -18.88846206665039, "global_step": 30669, "epoch": 369} {"train_loss": -18.76100730895996, "global_step": 30670, "epoch": 369} {"train_loss": -18.648921966552734, "global_step": 30671, "epoch": 369} {"train_loss": -18.795751571655273, "global_step": 30672, "epoch": 369} {"train_loss": -19.334856033325195, "global_step": 30673, "epoch": 369} {"train_loss": -18.858633041381836, "global_step": 30674, "epoch": 369} {"train_loss": -18.896886825561523, "global_step": 30675, "epoch": 369} {"train_loss": -19.169416427612305, "global_step": 30676, "epoch": 369} {"train_loss": -18.985166549682617, "global_step": 30677, "epoch": 369} {"train_loss": -19.087783813476562, "global_step": 30678, "epoch": 369} {"train_loss": -18.795413970947266, "global_step": 30679, "epoch": 369} {"train_loss": -19.040197372436523, "global_step": 30680, "epoch": 369} {"train_loss": -19.19880485534668, "global_step": 30681, "epoch": 369} {"train_loss": -19.195241928100586, "global_step": 30682, "epoch": 369} {"train_loss": -18.88909339904785, "global_step": 30683, "epoch": 369} {"train_loss": -19.247961044311523, "global_step": 30684, "epoch": 369} {"train_loss": -19.08553123474121, "global_step": 30685, "epoch": 369} {"train_loss": -18.85384178161621, "global_step": 30686, "epoch": 369} {"train_loss": -18.616966247558594, "global_step": 30687, "epoch": 369} {"train_loss": -18.685537338256836, "global_step": 30688, "epoch": 369} {"train_loss": -19.2797908782959, "global_step": 30689, "epoch": 369} {"train_loss": -19.237577438354492, "global_step": 30690, "epoch": 369} {"train_loss": -18.85430145263672, "global_step": 30691, "epoch": 369} {"train_loss": -19.1826229095459, "global_step": 30692, "epoch": 369} {"train_loss": -19.069379806518555, "global_step": 30693, "epoch": 369} {"train_loss": -18.6700439453125, "global_step": 30694, "epoch": 369} {"train_loss": -19.50164794921875, "global_step": 30695, "epoch": 369} {"train_loss": -18.962661743164062, "global_step": 30696, "epoch": 369} {"train_loss": -18.887601852416992, "global_step": 30697, "epoch": 369} {"train_loss": -18.75412940979004, "global_step": 30698, "epoch": 369} {"train_loss": -19.211883544921875, "global_step": 30699, "epoch": 369} {"train_loss": -19.125797271728516, "global_step": 30700, "epoch": 369} {"train_loss": -18.975330352783203, "global_step": 30701, "epoch": 369} {"train_loss": -18.930360794067383, "global_step": 30702, "epoch": 369} {"train_loss": -19.17384910583496, "global_step": 30703, "epoch": 369} {"train_loss": -19.27288818359375, "global_step": 30704, "epoch": 369} {"train_loss": -18.67278480529785, "global_step": 30705, "epoch": 369} {"train_loss": -19.129825592041016, "global_step": 30706, "epoch": 369} {"train_loss": -19.069351196289062, "global_step": 30707, "epoch": 369} {"train_loss": -19.46820831298828, "global_step": 30708, "epoch": 369} {"train_loss": -18.980508137898273, "global_step": 30709, "epoch": 369, "val_loss": 5968353.0} {"train_loss": -18.745389938354492, "global_step": 30710, "epoch": 370} {"train_loss": -18.926538467407227, "global_step": 30711, "epoch": 370} {"train_loss": -18.8748779296875, "global_step": 30712, "epoch": 370} {"train_loss": -18.66816520690918, "global_step": 30713, "epoch": 370} {"train_loss": -19.133665084838867, "global_step": 30714, "epoch": 370} {"train_loss": -18.881742477416992, "global_step": 30715, "epoch": 370} {"train_loss": -18.949365615844727, "global_step": 30716, "epoch": 370} {"train_loss": -18.923749923706055, "global_step": 30717, "epoch": 370} {"train_loss": -18.847320556640625, "global_step": 30718, "epoch": 370} {"train_loss": -18.9988956451416, "global_step": 30719, "epoch": 370} {"train_loss": -19.126962661743164, "global_step": 30720, "epoch": 370} {"train_loss": -19.164093017578125, "global_step": 30721, "epoch": 370} {"train_loss": -18.663084030151367, "global_step": 30722, "epoch": 370} {"train_loss": -18.7451114654541, "global_step": 30723, "epoch": 370} {"train_loss": -19.10915184020996, "global_step": 30724, "epoch": 370} {"train_loss": -18.618520736694336, "global_step": 30725, "epoch": 370} {"train_loss": -18.756269454956055, "global_step": 30726, "epoch": 370} {"train_loss": -18.721891403198242, "global_step": 30727, "epoch": 370} {"train_loss": -19.236576080322266, "global_step": 30728, "epoch": 370} {"train_loss": -19.14930534362793, "global_step": 30729, "epoch": 370} {"train_loss": -19.014005661010742, "global_step": 30730, "epoch": 370} {"train_loss": -18.8703556060791, "global_step": 30731, "epoch": 370} {"train_loss": -19.09648895263672, "global_step": 30732, "epoch": 370} {"train_loss": -18.65678596496582, "global_step": 30733, "epoch": 370} {"train_loss": -18.786930084228516, "global_step": 30734, "epoch": 370} {"train_loss": -19.07253074645996, "global_step": 30735, "epoch": 370} {"train_loss": -18.889862060546875, "global_step": 30736, "epoch": 370} {"train_loss": -19.09461784362793, "global_step": 30737, "epoch": 370} {"train_loss": -19.087186813354492, "global_step": 30738, "epoch": 370} {"train_loss": -18.8041934967041, "global_step": 30739, "epoch": 370} {"train_loss": -19.079710006713867, "global_step": 30740, "epoch": 370} {"train_loss": -19.031091690063477, "global_step": 30741, "epoch": 370} {"train_loss": -18.659555435180664, "global_step": 30742, "epoch": 370} {"train_loss": -19.071989059448242, "global_step": 30743, "epoch": 370} {"train_loss": -19.071157455444336, "global_step": 30744, "epoch": 370} {"train_loss": -18.758556365966797, "global_step": 30745, "epoch": 370} {"train_loss": -19.101743698120117, "global_step": 30746, "epoch": 370} {"train_loss": -18.430418014526367, "global_step": 30747, "epoch": 370} {"train_loss": -19.136655807495117, "global_step": 30748, "epoch": 370} {"train_loss": -19.179906845092773, "global_step": 30749, "epoch": 370} {"train_loss": -18.566579818725586, "global_step": 30750, "epoch": 370} {"train_loss": -18.90129280090332, "global_step": 30751, "epoch": 370} {"train_loss": -18.768930435180664, "global_step": 30752, "epoch": 370} {"train_loss": -18.994543075561523, "global_step": 30753, "epoch": 370} {"train_loss": -18.89583969116211, "global_step": 30754, "epoch": 370} {"train_loss": -19.358707427978516, "global_step": 30755, "epoch": 370} {"train_loss": -18.742197036743164, "global_step": 30756, "epoch": 370} {"train_loss": -19.2258243560791, "global_step": 30757, "epoch": 370} {"train_loss": -19.04438591003418, "global_step": 30758, "epoch": 370} {"train_loss": -19.177085876464844, "global_step": 30759, "epoch": 370} {"train_loss": -19.304927825927734, "global_step": 30760, "epoch": 370} {"train_loss": -19.048612594604492, "global_step": 30761, "epoch": 370} {"train_loss": -18.85312843322754, "global_step": 30762, "epoch": 370} {"train_loss": -18.83748435974121, "global_step": 30763, "epoch": 370} {"train_loss": -18.7525577545166, "global_step": 30764, "epoch": 370} {"train_loss": -19.114429473876953, "global_step": 30765, "epoch": 370} {"train_loss": -19.0640869140625, "global_step": 30766, "epoch": 370} {"train_loss": -19.00105094909668, "global_step": 30767, "epoch": 370} {"train_loss": -19.11299705505371, "global_step": 30768, "epoch": 370} {"train_loss": -19.177719116210938, "global_step": 30769, "epoch": 370} {"train_loss": -18.984663009643555, "global_step": 30770, "epoch": 370} {"train_loss": -19.010900497436523, "global_step": 30771, "epoch": 370} {"train_loss": -18.762042999267578, "global_step": 30772, "epoch": 370} {"train_loss": -18.942087173461914, "global_step": 30773, "epoch": 370} {"train_loss": -19.043447494506836, "global_step": 30774, "epoch": 370} {"train_loss": -18.7452449798584, "global_step": 30775, "epoch": 370} {"train_loss": -18.689916610717773, "global_step": 30776, "epoch": 370} {"train_loss": -19.107824325561523, "global_step": 30777, "epoch": 370} {"train_loss": -18.903493881225586, "global_step": 30778, "epoch": 370} {"train_loss": -19.01641845703125, "global_step": 30779, "epoch": 370} {"train_loss": -19.071012496948242, "global_step": 30780, "epoch": 370} {"train_loss": -19.05898094177246, "global_step": 30781, "epoch": 370} {"train_loss": -19.27372169494629, "global_step": 30782, "epoch": 370} {"train_loss": -18.88118553161621, "global_step": 30783, "epoch": 370} {"train_loss": -18.6187686920166, "global_step": 30784, "epoch": 370} {"train_loss": -18.85968017578125, "global_step": 30785, "epoch": 370} {"train_loss": -18.923465728759766, "global_step": 30786, "epoch": 370} {"train_loss": -19.194122314453125, "global_step": 30787, "epoch": 370} {"train_loss": -19.008020401000977, "global_step": 30788, "epoch": 370} {"train_loss": -18.516437530517578, "global_step": 30789, "epoch": 370} {"train_loss": -18.831022262573242, "global_step": 30790, "epoch": 370} {"train_loss": -18.72223472595215, "global_step": 30791, "epoch": 370} {"train_loss": -18.95896472701107, "global_step": 30792, "epoch": 370, "val_loss": 5979720.0} {"train_loss": -18.745071411132812, "global_step": 30793, "epoch": 371} {"train_loss": -18.76590347290039, "global_step": 30794, "epoch": 371} {"train_loss": -18.30314064025879, "global_step": 30795, "epoch": 371} {"train_loss": -18.951419830322266, "global_step": 30796, "epoch": 371} {"train_loss": -18.866504669189453, "global_step": 30797, "epoch": 371} {"train_loss": -18.678287506103516, "global_step": 30798, "epoch": 371} {"train_loss": -18.654054641723633, "global_step": 30799, "epoch": 371} {"train_loss": -18.755239486694336, "global_step": 30800, "epoch": 371} {"train_loss": -18.961206436157227, "global_step": 30801, "epoch": 371} {"train_loss": -18.758573532104492, "global_step": 30802, "epoch": 371} {"train_loss": -18.786407470703125, "global_step": 30803, "epoch": 371} {"train_loss": -19.249975204467773, "global_step": 30804, "epoch": 371} {"train_loss": -19.277772903442383, "global_step": 30805, "epoch": 371} {"train_loss": -18.892688751220703, "global_step": 30806, "epoch": 371} {"train_loss": -18.647016525268555, "global_step": 30807, "epoch": 371} {"train_loss": -18.864505767822266, "global_step": 30808, "epoch": 371} {"train_loss": -19.147375106811523, "global_step": 30809, "epoch": 371} {"train_loss": -18.831954956054688, "global_step": 30810, "epoch": 371} {"train_loss": -19.184486389160156, "global_step": 30811, "epoch": 371} {"train_loss": -18.980175018310547, "global_step": 30812, "epoch": 371} {"train_loss": -18.76283073425293, "global_step": 30813, "epoch": 371} {"train_loss": -19.521230697631836, "global_step": 30814, "epoch": 371} {"train_loss": -18.753232955932617, "global_step": 30815, "epoch": 371} {"train_loss": -19.12673568725586, "global_step": 30816, "epoch": 371} {"train_loss": -18.565101623535156, "global_step": 30817, "epoch": 371} {"train_loss": -19.44618797302246, "global_step": 30818, "epoch": 371} {"train_loss": -19.162914276123047, "global_step": 30819, "epoch": 371} {"train_loss": -19.201330184936523, "global_step": 30820, "epoch": 371} {"train_loss": -19.380311965942383, "global_step": 30821, "epoch": 371} {"train_loss": -18.761655807495117, "global_step": 30822, "epoch": 371} {"train_loss": -18.955589294433594, "global_step": 30823, "epoch": 371} {"train_loss": -18.950605392456055, "global_step": 30824, "epoch": 371} {"train_loss": -19.2965145111084, "global_step": 30825, "epoch": 371} {"train_loss": -18.919322967529297, "global_step": 30826, "epoch": 371} {"train_loss": -19.129413604736328, "global_step": 30827, "epoch": 371} {"train_loss": -18.8652286529541, "global_step": 30828, "epoch": 371} {"train_loss": -19.062835693359375, "global_step": 30829, "epoch": 371} {"train_loss": -19.182723999023438, "global_step": 30830, "epoch": 371} {"train_loss": -19.26654624938965, "global_step": 30831, "epoch": 371} {"train_loss": -19.204858779907227, "global_step": 30832, "epoch": 371} {"train_loss": -19.05501365661621, "global_step": 30833, "epoch": 371} {"train_loss": -18.793502807617188, "global_step": 30834, "epoch": 371} {"train_loss": -18.80596923828125, "global_step": 30835, "epoch": 371} {"train_loss": -19.406415939331055, "global_step": 30836, "epoch": 371} {"train_loss": -18.786840438842773, "global_step": 30837, "epoch": 371} {"train_loss": -18.978849411010742, "global_step": 30838, "epoch": 371} {"train_loss": -18.90667724609375, "global_step": 30839, "epoch": 371} {"train_loss": -19.145429611206055, "global_step": 30840, "epoch": 371} {"train_loss": -18.851560592651367, "global_step": 30841, "epoch": 371} {"train_loss": -19.594507217407227, "global_step": 30842, "epoch": 371} {"train_loss": -18.903738021850586, "global_step": 30843, "epoch": 371} {"train_loss": -19.271902084350586, "global_step": 30844, "epoch": 371} {"train_loss": -18.952285766601562, "global_step": 30845, "epoch": 371} {"train_loss": -18.98077392578125, "global_step": 30846, "epoch": 371} {"train_loss": -18.872896194458008, "global_step": 30847, "epoch": 371} {"train_loss": -18.664695739746094, "global_step": 30848, "epoch": 371} {"train_loss": -19.04293441772461, "global_step": 30849, "epoch": 371} {"train_loss": -18.89054298400879, "global_step": 30850, "epoch": 371} {"train_loss": -18.876893997192383, "global_step": 30851, "epoch": 371} {"train_loss": -18.79005241394043, "global_step": 30852, "epoch": 371} {"train_loss": -19.0455322265625, "global_step": 30853, "epoch": 371} {"train_loss": -19.511207580566406, "global_step": 30854, "epoch": 371} {"train_loss": -18.70411491394043, "global_step": 30855, "epoch": 371} {"train_loss": -19.11433219909668, "global_step": 30856, "epoch": 371} {"train_loss": -18.909543991088867, "global_step": 30857, "epoch": 371} {"train_loss": -18.820802688598633, "global_step": 30858, "epoch": 371} {"train_loss": -18.60322380065918, "global_step": 30859, "epoch": 371} {"train_loss": -18.982221603393555, "global_step": 30860, "epoch": 371} {"train_loss": -19.361467361450195, "global_step": 30861, "epoch": 371} {"train_loss": -19.200082778930664, "global_step": 30862, "epoch": 371} {"train_loss": -19.375707626342773, "global_step": 30863, "epoch": 371} {"train_loss": -18.981184005737305, "global_step": 30864, "epoch": 371} {"train_loss": -18.906681060791016, "global_step": 30865, "epoch": 371} {"train_loss": -18.81296157836914, "global_step": 30866, "epoch": 371} {"train_loss": -18.862226486206055, "global_step": 30867, "epoch": 371} {"train_loss": -18.982202529907227, "global_step": 30868, "epoch": 371} {"train_loss": -19.065479278564453, "global_step": 30869, "epoch": 371} {"train_loss": -19.413002014160156, "global_step": 30870, "epoch": 371} {"train_loss": -19.28591537475586, "global_step": 30871, "epoch": 371} {"train_loss": -18.940895080566406, "global_step": 30872, "epoch": 371} {"train_loss": -18.970335006713867, "global_step": 30873, "epoch": 371} {"train_loss": -19.074308395385742, "global_step": 30874, "epoch": 371} {"train_loss": -18.993576854108326, "global_step": 30875, "epoch": 371, "val_loss": 5915916.5} {"train_loss": -18.57354736328125, "global_step": 30876, "epoch": 372} {"train_loss": -18.905288696289062, "global_step": 30877, "epoch": 372} {"train_loss": -18.7557430267334, "global_step": 30878, "epoch": 372} {"train_loss": -18.791189193725586, "global_step": 30879, "epoch": 372} {"train_loss": -18.791410446166992, "global_step": 30880, "epoch": 372} {"train_loss": -19.08312225341797, "global_step": 30881, "epoch": 372} {"train_loss": -19.08011817932129, "global_step": 30882, "epoch": 372} {"train_loss": -18.501440048217773, "global_step": 30883, "epoch": 372} {"train_loss": -18.545156478881836, "global_step": 30884, "epoch": 372} {"train_loss": -18.99220848083496, "global_step": 30885, "epoch": 372} {"train_loss": -18.787931442260742, "global_step": 30886, "epoch": 372} {"train_loss": -18.591821670532227, "global_step": 30887, "epoch": 372} {"train_loss": -18.729528427124023, "global_step": 30888, "epoch": 372} {"train_loss": -18.952434539794922, "global_step": 30889, "epoch": 372} {"train_loss": -18.762868881225586, "global_step": 30890, "epoch": 372} {"train_loss": -18.669923782348633, "global_step": 30891, "epoch": 372} {"train_loss": -18.428808212280273, "global_step": 30892, "epoch": 372} {"train_loss": -18.533824920654297, "global_step": 30893, "epoch": 372} {"train_loss": -19.17905616760254, "global_step": 30894, "epoch": 372} {"train_loss": -18.975515365600586, "global_step": 30895, "epoch": 372} {"train_loss": -18.8031063079834, "global_step": 30896, "epoch": 372} {"train_loss": -19.148488998413086, "global_step": 30897, "epoch": 372} {"train_loss": -18.72479248046875, "global_step": 30898, "epoch": 372} {"train_loss": -18.9829044342041, "global_step": 30899, "epoch": 372} {"train_loss": -18.74616050720215, "global_step": 30900, "epoch": 372} {"train_loss": -18.95339012145996, "global_step": 30901, "epoch": 372} {"train_loss": -18.874027252197266, "global_step": 30902, "epoch": 372} {"train_loss": -18.477102279663086, "global_step": 30903, "epoch": 372} {"train_loss": -19.173734664916992, "global_step": 30904, "epoch": 372} {"train_loss": -18.342187881469727, "global_step": 30905, "epoch": 372} {"train_loss": -18.84600257873535, "global_step": 30906, "epoch": 372} {"train_loss": -18.78786849975586, "global_step": 30907, "epoch": 372} {"train_loss": -19.20705223083496, "global_step": 30908, "epoch": 372} {"train_loss": -18.98508644104004, "global_step": 30909, "epoch": 372} {"train_loss": -19.55539321899414, "global_step": 30910, "epoch": 372} {"train_loss": -18.991865158081055, "global_step": 30911, "epoch": 372} {"train_loss": -19.34666633605957, "global_step": 30912, "epoch": 372} {"train_loss": -19.245561599731445, "global_step": 30913, "epoch": 372} {"train_loss": -19.05317497253418, "global_step": 30914, "epoch": 372} {"train_loss": -19.112524032592773, "global_step": 30915, "epoch": 372} {"train_loss": -18.98423194885254, "global_step": 30916, "epoch": 372} {"train_loss": -18.824735641479492, "global_step": 30917, "epoch": 372} {"train_loss": -19.1086368560791, "global_step": 30918, "epoch": 372} {"train_loss": -18.97957420349121, "global_step": 30919, "epoch": 372} {"train_loss": -18.867639541625977, "global_step": 30920, "epoch": 372} {"train_loss": -19.12074089050293, "global_step": 30921, "epoch": 372} {"train_loss": -19.313507080078125, "global_step": 30922, "epoch": 372} {"train_loss": -18.782541275024414, "global_step": 30923, "epoch": 372} {"train_loss": -19.078067779541016, "global_step": 30924, "epoch": 372} {"train_loss": -19.247343063354492, "global_step": 30925, "epoch": 372} {"train_loss": -19.202608108520508, "global_step": 30926, "epoch": 372} {"train_loss": -19.179834365844727, "global_step": 30927, "epoch": 372} {"train_loss": -19.203895568847656, "global_step": 30928, "epoch": 372} {"train_loss": -18.73873519897461, "global_step": 30929, "epoch": 372} {"train_loss": -18.657583236694336, "global_step": 30930, "epoch": 372} {"train_loss": -19.068368911743164, "global_step": 30931, "epoch": 372} {"train_loss": -18.935890197753906, "global_step": 30932, "epoch": 372} {"train_loss": -18.981836318969727, "global_step": 30933, "epoch": 372} {"train_loss": -18.946977615356445, "global_step": 30934, "epoch": 372} {"train_loss": -18.98984146118164, "global_step": 30935, "epoch": 372} {"train_loss": -19.044431686401367, "global_step": 30936, "epoch": 372} {"train_loss": -18.879486083984375, "global_step": 30937, "epoch": 372} {"train_loss": -18.88714599609375, "global_step": 30938, "epoch": 372} {"train_loss": -19.17134666442871, "global_step": 30939, "epoch": 372} {"train_loss": -19.006895065307617, "global_step": 30940, "epoch": 372} {"train_loss": -18.86091423034668, "global_step": 30941, "epoch": 372} {"train_loss": -19.16176414489746, "global_step": 30942, "epoch": 372} {"train_loss": -18.914941787719727, "global_step": 30943, "epoch": 372} {"train_loss": -19.260326385498047, "global_step": 30944, "epoch": 372} {"train_loss": -18.828792572021484, "global_step": 30945, "epoch": 372} {"train_loss": -18.972579956054688, "global_step": 30946, "epoch": 372} {"train_loss": -19.13545799255371, "global_step": 30947, "epoch": 372} {"train_loss": -19.262226104736328, "global_step": 30948, "epoch": 372} {"train_loss": -18.441898345947266, "global_step": 30949, "epoch": 372} {"train_loss": -18.628049850463867, "global_step": 30950, "epoch": 372} {"train_loss": -18.925052642822266, "global_step": 30951, "epoch": 372} {"train_loss": -18.935455322265625, "global_step": 30952, "epoch": 372} {"train_loss": -19.091928482055664, "global_step": 30953, "epoch": 372} {"train_loss": -18.894826889038086, "global_step": 30954, "epoch": 372} {"train_loss": -18.99042510986328, "global_step": 30955, "epoch": 372} {"train_loss": -18.92786979675293, "global_step": 30956, "epoch": 372} {"train_loss": -19.439661026000977, "global_step": 30957, "epoch": 372} {"train_loss": -18.92244545810194, "global_step": 30958, "epoch": 372, "val_loss": 5938241.0} {"train_loss": -18.768341064453125, "global_step": 30959, "epoch": 373} {"train_loss": -19.299972534179688, "global_step": 30960, "epoch": 373} {"train_loss": -18.687070846557617, "global_step": 30961, "epoch": 373} {"train_loss": -19.023279190063477, "global_step": 30962, "epoch": 373} {"train_loss": -18.34531593322754, "global_step": 30963, "epoch": 373} {"train_loss": -19.046279907226562, "global_step": 30964, "epoch": 373} {"train_loss": -18.504934310913086, "global_step": 30965, "epoch": 373} {"train_loss": -18.889371871948242, "global_step": 30966, "epoch": 373} {"train_loss": -18.485143661499023, "global_step": 30967, "epoch": 373} {"train_loss": -19.192747116088867, "global_step": 30968, "epoch": 373} {"train_loss": -18.97667694091797, "global_step": 30969, "epoch": 373} {"train_loss": -18.703588485717773, "global_step": 30970, "epoch": 373} {"train_loss": -18.840656280517578, "global_step": 30971, "epoch": 373} {"train_loss": -18.74762535095215, "global_step": 30972, "epoch": 373} {"train_loss": -19.290151596069336, "global_step": 30973, "epoch": 373} {"train_loss": -19.140918731689453, "global_step": 30974, "epoch": 373} {"train_loss": -18.702293395996094, "global_step": 30975, "epoch": 373} {"train_loss": -19.065122604370117, "global_step": 30976, "epoch": 373} {"train_loss": -18.923980712890625, "global_step": 30977, "epoch": 373} {"train_loss": -18.910852432250977, "global_step": 30978, "epoch": 373} {"train_loss": -18.976240158081055, "global_step": 30979, "epoch": 373} {"train_loss": -18.45932960510254, "global_step": 30980, "epoch": 373} {"train_loss": -19.050373077392578, "global_step": 30981, "epoch": 373} {"train_loss": -19.127840042114258, "global_step": 30982, "epoch": 373} {"train_loss": -19.12630271911621, "global_step": 30983, "epoch": 373} {"train_loss": -19.259735107421875, "global_step": 30984, "epoch": 373} {"train_loss": -19.223112106323242, "global_step": 30985, "epoch": 373} {"train_loss": -18.434162139892578, "global_step": 30986, "epoch": 373} {"train_loss": -19.252748489379883, "global_step": 30987, "epoch": 373} {"train_loss": -19.21168327331543, "global_step": 30988, "epoch": 373} {"train_loss": -18.668254852294922, "global_step": 30989, "epoch": 373} {"train_loss": -18.956823348999023, "global_step": 30990, "epoch": 373} {"train_loss": -19.079259872436523, "global_step": 30991, "epoch": 373} {"train_loss": -18.922107696533203, "global_step": 30992, "epoch": 373} {"train_loss": -19.096248626708984, "global_step": 30993, "epoch": 373} {"train_loss": -19.048704147338867, "global_step": 30994, "epoch": 373} {"train_loss": -19.259008407592773, "global_step": 30995, "epoch": 373} {"train_loss": -18.778276443481445, "global_step": 30996, "epoch": 373} {"train_loss": -19.001407623291016, "global_step": 30997, "epoch": 373} {"train_loss": -19.19809913635254, "global_step": 30998, "epoch": 373} {"train_loss": -19.05206871032715, "global_step": 30999, "epoch": 373} {"train_loss": -19.28005599975586, "global_step": 31000, "epoch": 373} {"train_loss": -18.800222396850586, "global_step": 31001, "epoch": 373} {"train_loss": -18.96170997619629, "global_step": 31002, "epoch": 373} {"train_loss": -19.286035537719727, "global_step": 31003, "epoch": 373} {"train_loss": -19.102405548095703, "global_step": 31004, "epoch": 373} {"train_loss": -19.187746047973633, "global_step": 31005, "epoch": 373} {"train_loss": -19.414335250854492, "global_step": 31006, "epoch": 373} {"train_loss": -19.136934280395508, "global_step": 31007, "epoch": 373} {"train_loss": -18.828710556030273, "global_step": 31008, "epoch": 373} {"train_loss": -18.938310623168945, "global_step": 31009, "epoch": 373} {"train_loss": -18.660961151123047, "global_step": 31010, "epoch": 373} {"train_loss": -19.192434310913086, "global_step": 31011, "epoch": 373} {"train_loss": -18.718469619750977, "global_step": 31012, "epoch": 373} {"train_loss": -18.641263961791992, "global_step": 31013, "epoch": 373} {"train_loss": -19.237655639648438, "global_step": 31014, "epoch": 373} {"train_loss": -19.07073402404785, "global_step": 31015, "epoch": 373} {"train_loss": -19.13315773010254, "global_step": 31016, "epoch": 373} {"train_loss": -18.928335189819336, "global_step": 31017, "epoch": 373} {"train_loss": -18.558210372924805, "global_step": 31018, "epoch": 373} {"train_loss": -19.171913146972656, "global_step": 31019, "epoch": 373} {"train_loss": -18.901418685913086, "global_step": 31020, "epoch": 373} {"train_loss": -19.061023712158203, "global_step": 31021, "epoch": 373} {"train_loss": -18.980945587158203, "global_step": 31022, "epoch": 373} {"train_loss": -19.111600875854492, "global_step": 31023, "epoch": 373} {"train_loss": -19.36130142211914, "global_step": 31024, "epoch": 373} {"train_loss": -18.917463302612305, "global_step": 31025, "epoch": 373} {"train_loss": -19.295028686523438, "global_step": 31026, "epoch": 373} {"train_loss": -19.279340744018555, "global_step": 31027, "epoch": 373} {"train_loss": -19.098407745361328, "global_step": 31028, "epoch": 373} {"train_loss": -18.97383689880371, "global_step": 31029, "epoch": 373} {"train_loss": -19.16059684753418, "global_step": 31030, "epoch": 373} {"train_loss": -19.03912925720215, "global_step": 31031, "epoch": 373} {"train_loss": -18.96833610534668, "global_step": 31032, "epoch": 373} {"train_loss": -19.345178604125977, "global_step": 31033, "epoch": 373} {"train_loss": -19.16290283203125, "global_step": 31034, "epoch": 373} {"train_loss": -18.842288970947266, "global_step": 31035, "epoch": 373} {"train_loss": -18.969913482666016, "global_step": 31036, "epoch": 373} {"train_loss": -19.185829162597656, "global_step": 31037, "epoch": 373} {"train_loss": -19.217390060424805, "global_step": 31038, "epoch": 373} {"train_loss": -18.73609733581543, "global_step": 31039, "epoch": 373} {"train_loss": -18.960886001586914, "global_step": 31040, "epoch": 373} {"train_loss": -18.981415231543853, "global_step": 31041, "epoch": 373, "val_loss": 5969695.0} {"train_loss": -18.87415885925293, "global_step": 31042, "epoch": 374} {"train_loss": -18.39711570739746, "global_step": 31043, "epoch": 374} {"train_loss": -18.6884708404541, "global_step": 31044, "epoch": 374} {"train_loss": -18.799741744995117, "global_step": 31045, "epoch": 374} {"train_loss": -19.07870864868164, "global_step": 31046, "epoch": 374} {"train_loss": -18.797616958618164, "global_step": 31047, "epoch": 374} {"train_loss": -18.864093780517578, "global_step": 31048, "epoch": 374} {"train_loss": -18.29523468017578, "global_step": 31049, "epoch": 374} {"train_loss": -19.069595336914062, "global_step": 31050, "epoch": 374} {"train_loss": -18.884004592895508, "global_step": 31051, "epoch": 374} {"train_loss": -19.200986862182617, "global_step": 31052, "epoch": 374} {"train_loss": -18.830392837524414, "global_step": 31053, "epoch": 374} {"train_loss": -19.30116081237793, "global_step": 31054, "epoch": 374} {"train_loss": -19.329458236694336, "global_step": 31055, "epoch": 374} {"train_loss": -19.169248580932617, "global_step": 31056, "epoch": 374} {"train_loss": -18.67633628845215, "global_step": 31057, "epoch": 374} {"train_loss": -18.866968154907227, "global_step": 31058, "epoch": 374} {"train_loss": -19.039306640625, "global_step": 31059, "epoch": 374} {"train_loss": -18.97356605529785, "global_step": 31060, "epoch": 374} {"train_loss": -19.040538787841797, "global_step": 31061, "epoch": 374} {"train_loss": -18.54325294494629, "global_step": 31062, "epoch": 374} {"train_loss": -19.0262508392334, "global_step": 31063, "epoch": 374} {"train_loss": -19.00714874267578, "global_step": 31064, "epoch": 374} {"train_loss": -18.588306427001953, "global_step": 31065, "epoch": 374} {"train_loss": -18.346647262573242, "global_step": 31066, "epoch": 374} {"train_loss": -19.0134220123291, "global_step": 31067, "epoch": 374} {"train_loss": -18.78618621826172, "global_step": 31068, "epoch": 374} {"train_loss": -19.109127044677734, "global_step": 31069, "epoch": 374} {"train_loss": -18.61258316040039, "global_step": 31070, "epoch": 374} {"train_loss": -18.568477630615234, "global_step": 31071, "epoch": 374} {"train_loss": -18.926095962524414, "global_step": 31072, "epoch": 374} {"train_loss": -18.630369186401367, "global_step": 31073, "epoch": 374} {"train_loss": -19.16836929321289, "global_step": 31074, "epoch": 374} {"train_loss": -18.664722442626953, "global_step": 31075, "epoch": 374} {"train_loss": -18.950952529907227, "global_step": 31076, "epoch": 374} {"train_loss": -19.301122665405273, "global_step": 31077, "epoch": 374} {"train_loss": -18.931203842163086, "global_step": 31078, "epoch": 374} {"train_loss": -18.80767059326172, "global_step": 31079, "epoch": 374} {"train_loss": -18.754728317260742, "global_step": 31080, "epoch": 374} {"train_loss": -18.958494186401367, "global_step": 31081, "epoch": 374} {"train_loss": -18.97675132751465, "global_step": 31082, "epoch": 374} {"train_loss": -18.74142837524414, "global_step": 31083, "epoch": 374} {"train_loss": -18.900632858276367, "global_step": 31084, "epoch": 374} {"train_loss": -18.647016525268555, "global_step": 31085, "epoch": 374} {"train_loss": -18.674148559570312, "global_step": 31086, "epoch": 374} {"train_loss": -19.31534767150879, "global_step": 31087, "epoch": 374} {"train_loss": -18.94637107849121, "global_step": 31088, "epoch": 374} {"train_loss": -19.328571319580078, "global_step": 31089, "epoch": 374} {"train_loss": -19.050006866455078, "global_step": 31090, "epoch": 374} {"train_loss": -19.07199478149414, "global_step": 31091, "epoch": 374} {"train_loss": -18.94293212890625, "global_step": 31092, "epoch": 374} {"train_loss": -18.850263595581055, "global_step": 31093, "epoch": 374} {"train_loss": -18.972837448120117, "global_step": 31094, "epoch": 374} {"train_loss": -19.0701904296875, "global_step": 31095, "epoch": 374} {"train_loss": -18.871591567993164, "global_step": 31096, "epoch": 374} {"train_loss": -18.957090377807617, "global_step": 31097, "epoch": 374} {"train_loss": -18.994565963745117, "global_step": 31098, "epoch": 374} {"train_loss": -19.009122848510742, "global_step": 31099, "epoch": 374} {"train_loss": -19.05173683166504, "global_step": 31100, "epoch": 374} {"train_loss": -18.922025680541992, "global_step": 31101, "epoch": 374} {"train_loss": -19.02665901184082, "global_step": 31102, "epoch": 374} {"train_loss": -18.93281364440918, "global_step": 31103, "epoch": 374} {"train_loss": -18.762784957885742, "global_step": 31104, "epoch": 374} {"train_loss": -18.79401969909668, "global_step": 31105, "epoch": 374} {"train_loss": -18.953405380249023, "global_step": 31106, "epoch": 374} {"train_loss": -18.612756729125977, "global_step": 31107, "epoch": 374} {"train_loss": -19.20082664489746, "global_step": 31108, "epoch": 374} {"train_loss": -19.140735626220703, "global_step": 31109, "epoch": 374} {"train_loss": -19.116559982299805, "global_step": 31110, "epoch": 374} {"train_loss": -18.967788696289062, "global_step": 31111, "epoch": 374} {"train_loss": -19.115446090698242, "global_step": 31112, "epoch": 374} {"train_loss": -18.96332359313965, "global_step": 31113, "epoch": 374} {"train_loss": -19.213520050048828, "global_step": 31114, "epoch": 374} {"train_loss": -19.265806198120117, "global_step": 31115, "epoch": 374} {"train_loss": -19.036046981811523, "global_step": 31116, "epoch": 374} {"train_loss": -19.05181884765625, "global_step": 31117, "epoch": 374} {"train_loss": -19.243701934814453, "global_step": 31118, "epoch": 374} {"train_loss": -19.39681053161621, "global_step": 31119, "epoch": 374} {"train_loss": -19.077030181884766, "global_step": 31120, "epoch": 374} {"train_loss": -19.380441665649414, "global_step": 31121, "epoch": 374} {"train_loss": -19.202194213867188, "global_step": 31122, "epoch": 374} {"train_loss": -19.29441261291504, "global_step": 31123, "epoch": 374} {"train_loss": -18.960119431277356, "global_step": 31124, "epoch": 374, "val_loss": 5926593.0} {"train_loss": -18.676090240478516, "global_step": 31125, "epoch": 375} {"train_loss": -19.234224319458008, "global_step": 31126, "epoch": 375} {"train_loss": -18.98639488220215, "global_step": 31127, "epoch": 375} {"train_loss": -18.683862686157227, "global_step": 31128, "epoch": 375} {"train_loss": -19.142837524414062, "global_step": 31129, "epoch": 375} {"train_loss": -19.365060806274414, "global_step": 31130, "epoch": 375} {"train_loss": -19.213502883911133, "global_step": 31131, "epoch": 375} {"train_loss": -18.6180477142334, "global_step": 31132, "epoch": 375} {"train_loss": -19.182823181152344, "global_step": 31133, "epoch": 375} {"train_loss": -19.201513290405273, "global_step": 31134, "epoch": 375} {"train_loss": -18.843881607055664, "global_step": 31135, "epoch": 375} {"train_loss": -19.140106201171875, "global_step": 31136, "epoch": 375} {"train_loss": -19.175098419189453, "global_step": 31137, "epoch": 375} {"train_loss": -19.012632369995117, "global_step": 31138, "epoch": 375} {"train_loss": -18.69465446472168, "global_step": 31139, "epoch": 375} {"train_loss": -19.07171630859375, "global_step": 31140, "epoch": 375} {"train_loss": -18.80713653564453, "global_step": 31141, "epoch": 375} {"train_loss": -19.163537979125977, "global_step": 31142, "epoch": 375} {"train_loss": -18.808990478515625, "global_step": 31143, "epoch": 375} {"train_loss": -19.013517379760742, "global_step": 31144, "epoch": 375} {"train_loss": -19.183990478515625, "global_step": 31145, "epoch": 375} {"train_loss": -18.762550354003906, "global_step": 31146, "epoch": 375} {"train_loss": -19.260601043701172, "global_step": 31147, "epoch": 375} {"train_loss": -18.918004989624023, "global_step": 31148, "epoch": 375} {"train_loss": -18.917665481567383, "global_step": 31149, "epoch": 375} {"train_loss": -18.776134490966797, "global_step": 31150, "epoch": 375} {"train_loss": -18.46009063720703, "global_step": 31151, "epoch": 375} {"train_loss": -18.95172691345215, "global_step": 31152, "epoch": 375} {"train_loss": -18.939123153686523, "global_step": 31153, "epoch": 375} {"train_loss": -18.76105308532715, "global_step": 31154, "epoch": 375} {"train_loss": -19.067989349365234, "global_step": 31155, "epoch": 375} {"train_loss": -19.06504249572754, "global_step": 31156, "epoch": 375} {"train_loss": -18.9632511138916, "global_step": 31157, "epoch": 375} {"train_loss": -19.14985466003418, "global_step": 31158, "epoch": 375} {"train_loss": -18.8116397857666, "global_step": 31159, "epoch": 375} {"train_loss": -19.0207462310791, "global_step": 31160, "epoch": 375} {"train_loss": -18.944049835205078, "global_step": 31161, "epoch": 375} {"train_loss": -18.901473999023438, "global_step": 31162, "epoch": 375} {"train_loss": -18.651817321777344, "global_step": 31163, "epoch": 375} {"train_loss": -18.902326583862305, "global_step": 31164, "epoch": 375} {"train_loss": -19.353836059570312, "global_step": 31165, "epoch": 375} {"train_loss": -19.096721649169922, "global_step": 31166, "epoch": 375} {"train_loss": -19.15749168395996, "global_step": 31167, "epoch": 375} {"train_loss": -18.971921920776367, "global_step": 31168, "epoch": 375} {"train_loss": -18.84153175354004, "global_step": 31169, "epoch": 375} {"train_loss": -19.17302894592285, "global_step": 31170, "epoch": 375} {"train_loss": -19.064794540405273, "global_step": 31171, "epoch": 375} {"train_loss": -19.19565773010254, "global_step": 31172, "epoch": 375} {"train_loss": -18.815509796142578, "global_step": 31173, "epoch": 375} {"train_loss": -19.11329460144043, "global_step": 31174, "epoch": 375} {"train_loss": -18.870519638061523, "global_step": 31175, "epoch": 375} {"train_loss": -19.024396896362305, "global_step": 31176, "epoch": 375} {"train_loss": -19.190465927124023, "global_step": 31177, "epoch": 375} {"train_loss": -19.215360641479492, "global_step": 31178, "epoch": 375} {"train_loss": -18.921266555786133, "global_step": 31179, "epoch": 375} {"train_loss": -19.495237350463867, "global_step": 31180, "epoch": 375} {"train_loss": -19.379405975341797, "global_step": 31181, "epoch": 375} {"train_loss": -19.10813331604004, "global_step": 31182, "epoch": 375} {"train_loss": -18.61256217956543, "global_step": 31183, "epoch": 375} {"train_loss": -19.065433502197266, "global_step": 31184, "epoch": 375} {"train_loss": -18.68487548828125, "global_step": 31185, "epoch": 375} {"train_loss": -18.881088256835938, "global_step": 31186, "epoch": 375} {"train_loss": -19.011632919311523, "global_step": 31187, "epoch": 375} {"train_loss": -19.13087272644043, "global_step": 31188, "epoch": 375} {"train_loss": -19.08586883544922, "global_step": 31189, "epoch": 375} {"train_loss": -19.055082321166992, "global_step": 31190, "epoch": 375} {"train_loss": -19.305105209350586, "global_step": 31191, "epoch": 375} {"train_loss": -19.191816329956055, "global_step": 31192, "epoch": 375} {"train_loss": -18.892078399658203, "global_step": 31193, "epoch": 375} {"train_loss": -19.200227737426758, "global_step": 31194, "epoch": 375} {"train_loss": -18.906360626220703, "global_step": 31195, "epoch": 375} {"train_loss": -19.036874771118164, "global_step": 31196, "epoch": 375} {"train_loss": -19.060617446899414, "global_step": 31197, "epoch": 375} {"train_loss": -18.960235595703125, "global_step": 31198, "epoch": 375} {"train_loss": -18.96904945373535, "global_step": 31199, "epoch": 375} {"train_loss": -18.828794479370117, "global_step": 31200, "epoch": 375} {"train_loss": -19.082138061523438, "global_step": 31201, "epoch": 375} {"train_loss": -18.92024040222168, "global_step": 31202, "epoch": 375} {"train_loss": -19.191930770874023, "global_step": 31203, "epoch": 375} {"train_loss": -19.08247947692871, "global_step": 31204, "epoch": 375} {"train_loss": -19.119144439697266, "global_step": 31205, "epoch": 375} {"train_loss": -19.09673309326172, "global_step": 31206, "epoch": 375} {"train_loss": -19.023108516830995, "global_step": 31207, "epoch": 375, "val_loss": 5985186.0} {"train_loss": -18.919851303100586, "global_step": 31208, "epoch": 376} {"train_loss": -18.814640045166016, "global_step": 31209, "epoch": 376} {"train_loss": -19.116331100463867, "global_step": 31210, "epoch": 376} {"train_loss": -18.753042221069336, "global_step": 31211, "epoch": 376} {"train_loss": -19.073890686035156, "global_step": 31212, "epoch": 376} {"train_loss": -18.663389205932617, "global_step": 31213, "epoch": 376} {"train_loss": -19.2260799407959, "global_step": 31214, "epoch": 376} {"train_loss": -19.133955001831055, "global_step": 31215, "epoch": 376} {"train_loss": -19.146881103515625, "global_step": 31216, "epoch": 376} {"train_loss": -18.807456970214844, "global_step": 31217, "epoch": 376} {"train_loss": -19.209638595581055, "global_step": 31218, "epoch": 376} {"train_loss": -18.960783004760742, "global_step": 31219, "epoch": 376} {"train_loss": -18.828115463256836, "global_step": 31220, "epoch": 376} {"train_loss": -18.68414878845215, "global_step": 31221, "epoch": 376} {"train_loss": -19.170429229736328, "global_step": 31222, "epoch": 376} {"train_loss": -19.206327438354492, "global_step": 31223, "epoch": 376} {"train_loss": -19.092931747436523, "global_step": 31224, "epoch": 376} {"train_loss": -18.862150192260742, "global_step": 31225, "epoch": 376} {"train_loss": -18.758573532104492, "global_step": 31226, "epoch": 376} {"train_loss": -19.13252830505371, "global_step": 31227, "epoch": 376} {"train_loss": -18.853927612304688, "global_step": 31228, "epoch": 376} {"train_loss": -18.804670333862305, "global_step": 31229, "epoch": 376} {"train_loss": -19.019336700439453, "global_step": 31230, "epoch": 376} {"train_loss": -18.557567596435547, "global_step": 31231, "epoch": 376} {"train_loss": -18.958934783935547, "global_step": 31232, "epoch": 376} {"train_loss": -18.92310333251953, "global_step": 31233, "epoch": 376} {"train_loss": -18.888648986816406, "global_step": 31234, "epoch": 376} {"train_loss": -19.0356388092041, "global_step": 31235, "epoch": 376} {"train_loss": -18.91005516052246, "global_step": 31236, "epoch": 376} {"train_loss": -18.741544723510742, "global_step": 31237, "epoch": 376} {"train_loss": -18.670948028564453, "global_step": 31238, "epoch": 376} {"train_loss": -18.788726806640625, "global_step": 31239, "epoch": 376} {"train_loss": -19.107574462890625, "global_step": 31240, "epoch": 376} {"train_loss": -18.83513832092285, "global_step": 31241, "epoch": 376} {"train_loss": -18.95856285095215, "global_step": 31242, "epoch": 376} {"train_loss": -18.882776260375977, "global_step": 31243, "epoch": 376} {"train_loss": -18.964168548583984, "global_step": 31244, "epoch": 376} {"train_loss": -19.1077823638916, "global_step": 31245, "epoch": 376} {"train_loss": -18.979141235351562, "global_step": 31246, "epoch": 376} {"train_loss": -19.051794052124023, "global_step": 31247, "epoch": 376} {"train_loss": -19.130769729614258, "global_step": 31248, "epoch": 376} {"train_loss": -18.98798942565918, "global_step": 31249, "epoch": 376} {"train_loss": -19.093294143676758, "global_step": 31250, "epoch": 376} {"train_loss": -19.23055648803711, "global_step": 31251, "epoch": 376} {"train_loss": -18.943021774291992, "global_step": 31252, "epoch": 376} {"train_loss": -19.00617790222168, "global_step": 31253, "epoch": 376} {"train_loss": -19.37506675720215, "global_step": 31254, "epoch": 376} {"train_loss": -19.1809024810791, "global_step": 31255, "epoch": 376} {"train_loss": -18.75040626525879, "global_step": 31256, "epoch": 376} {"train_loss": -18.938779830932617, "global_step": 31257, "epoch": 376} {"train_loss": -19.051774978637695, "global_step": 31258, "epoch": 376} {"train_loss": -18.995412826538086, "global_step": 31259, "epoch": 376} {"train_loss": -18.843612670898438, "global_step": 31260, "epoch": 376} {"train_loss": -19.117679595947266, "global_step": 31261, "epoch": 376} {"train_loss": -19.119781494140625, "global_step": 31262, "epoch": 376} {"train_loss": -18.83711051940918, "global_step": 31263, "epoch": 376} {"train_loss": -19.31246566772461, "global_step": 31264, "epoch": 376} {"train_loss": -18.839004516601562, "global_step": 31265, "epoch": 376} {"train_loss": -19.523469924926758, "global_step": 31266, "epoch": 376} {"train_loss": -18.880414962768555, "global_step": 31267, "epoch": 376} {"train_loss": -18.742706298828125, "global_step": 31268, "epoch": 376} {"train_loss": -19.209951400756836, "global_step": 31269, "epoch": 376} {"train_loss": -18.835628509521484, "global_step": 31270, "epoch": 376} {"train_loss": -18.790241241455078, "global_step": 31271, "epoch": 376} {"train_loss": -19.425474166870117, "global_step": 31272, "epoch": 376} {"train_loss": -19.210559844970703, "global_step": 31273, "epoch": 376} {"train_loss": -19.33106231689453, "global_step": 31274, "epoch": 376} {"train_loss": -19.034637451171875, "global_step": 31275, "epoch": 376} {"train_loss": -19.292110443115234, "global_step": 31276, "epoch": 376} {"train_loss": -18.901071548461914, "global_step": 31277, "epoch": 376} {"train_loss": -19.08084487915039, "global_step": 31278, "epoch": 376} {"train_loss": -18.873064041137695, "global_step": 31279, "epoch": 376} {"train_loss": -18.9965763092041, "global_step": 31280, "epoch": 376} {"train_loss": -19.03846549987793, "global_step": 31281, "epoch": 376} {"train_loss": -19.10518455505371, "global_step": 31282, "epoch": 376} {"train_loss": -18.73626708984375, "global_step": 31283, "epoch": 376} {"train_loss": -18.8201961517334, "global_step": 31284, "epoch": 376} {"train_loss": -18.861295700073242, "global_step": 31285, "epoch": 376} {"train_loss": -19.01975440979004, "global_step": 31286, "epoch": 376} {"train_loss": -19.1330509185791, "global_step": 31287, "epoch": 376} {"train_loss": -19.227996826171875, "global_step": 31288, "epoch": 376} {"train_loss": -19.29412269592285, "global_step": 31289, "epoch": 376} {"train_loss": -18.99935708563012, "global_step": 31290, "epoch": 376, "val_loss": 6083249.0} {"train_loss": -18.917089462280273, "global_step": 31291, "epoch": 377} {"train_loss": -19.013608932495117, "global_step": 31292, "epoch": 377} {"train_loss": -19.261659622192383, "global_step": 31293, "epoch": 377} {"train_loss": -18.900354385375977, "global_step": 31294, "epoch": 377} {"train_loss": -18.60470962524414, "global_step": 31295, "epoch": 377} {"train_loss": -18.97585105895996, "global_step": 31296, "epoch": 377} {"train_loss": -19.460386276245117, "global_step": 31297, "epoch": 377} {"train_loss": -19.006511688232422, "global_step": 31298, "epoch": 377} {"train_loss": -18.91767120361328, "global_step": 31299, "epoch": 377} {"train_loss": -18.868927001953125, "global_step": 31300, "epoch": 377} {"train_loss": -19.325902938842773, "global_step": 31301, "epoch": 377} {"train_loss": -18.77129554748535, "global_step": 31302, "epoch": 377} {"train_loss": -18.9210205078125, "global_step": 31303, "epoch": 377} {"train_loss": -19.236169815063477, "global_step": 31304, "epoch": 377} {"train_loss": -18.981603622436523, "global_step": 31305, "epoch": 377} {"train_loss": -18.908695220947266, "global_step": 31306, "epoch": 377} {"train_loss": -19.31005859375, "global_step": 31307, "epoch": 377} {"train_loss": -18.90764808654785, "global_step": 31308, "epoch": 377} {"train_loss": -18.94379997253418, "global_step": 31309, "epoch": 377} {"train_loss": -18.529571533203125, "global_step": 31310, "epoch": 377} {"train_loss": -19.228796005249023, "global_step": 31311, "epoch": 377} {"train_loss": -18.935754776000977, "global_step": 31312, "epoch": 377} {"train_loss": -18.65534019470215, "global_step": 31313, "epoch": 377} {"train_loss": -19.146167755126953, "global_step": 31314, "epoch": 377} {"train_loss": -19.025434494018555, "global_step": 31315, "epoch": 377} {"train_loss": -18.43141746520996, "global_step": 31316, "epoch": 377} {"train_loss": -18.73853874206543, "global_step": 31317, "epoch": 377} {"train_loss": -19.016435623168945, "global_step": 31318, "epoch": 377} {"train_loss": -19.16703224182129, "global_step": 31319, "epoch": 377} {"train_loss": -18.717416763305664, "global_step": 31320, "epoch": 377} {"train_loss": -19.037145614624023, "global_step": 31321, "epoch": 377} {"train_loss": -18.56889533996582, "global_step": 31322, "epoch": 377} {"train_loss": -18.963790893554688, "global_step": 31323, "epoch": 377} {"train_loss": -18.867416381835938, "global_step": 31324, "epoch": 377} {"train_loss": -19.345277786254883, "global_step": 31325, "epoch": 377} {"train_loss": -19.13791275024414, "global_step": 31326, "epoch": 377} {"train_loss": -18.938720703125, "global_step": 31327, "epoch": 377} {"train_loss": -19.005889892578125, "global_step": 31328, "epoch": 377} {"train_loss": -19.073087692260742, "global_step": 31329, "epoch": 377} {"train_loss": -18.90217399597168, "global_step": 31330, "epoch": 377} {"train_loss": -18.6098690032959, "global_step": 31331, "epoch": 377} {"train_loss": -19.393159866333008, "global_step": 31332, "epoch": 377} {"train_loss": -18.924959182739258, "global_step": 31333, "epoch": 377} {"train_loss": -19.03162956237793, "global_step": 31334, "epoch": 377} {"train_loss": -19.008588790893555, "global_step": 31335, "epoch": 377} {"train_loss": -18.82095718383789, "global_step": 31336, "epoch": 377} {"train_loss": -18.76459312438965, "global_step": 31337, "epoch": 377} {"train_loss": -19.350433349609375, "global_step": 31338, "epoch": 377} {"train_loss": -19.034570693969727, "global_step": 31339, "epoch": 377} {"train_loss": -18.669218063354492, "global_step": 31340, "epoch": 377} {"train_loss": -19.084943771362305, "global_step": 31341, "epoch": 377} {"train_loss": -18.90752410888672, "global_step": 31342, "epoch": 377} {"train_loss": -19.0384578704834, "global_step": 31343, "epoch": 377} {"train_loss": -19.067777633666992, "global_step": 31344, "epoch": 377} {"train_loss": -19.138994216918945, "global_step": 31345, "epoch": 377} {"train_loss": -19.21804428100586, "global_step": 31346, "epoch": 377} {"train_loss": -18.556142807006836, "global_step": 31347, "epoch": 377} {"train_loss": -19.094125747680664, "global_step": 31348, "epoch": 377} {"train_loss": -19.25507926940918, "global_step": 31349, "epoch": 377} {"train_loss": -18.829038619995117, "global_step": 31350, "epoch": 377} {"train_loss": -19.138769149780273, "global_step": 31351, "epoch": 377} {"train_loss": -19.15399169921875, "global_step": 31352, "epoch": 377} {"train_loss": -18.963773727416992, "global_step": 31353, "epoch": 377} {"train_loss": -19.11203956604004, "global_step": 31354, "epoch": 377} {"train_loss": -18.618436813354492, "global_step": 31355, "epoch": 377} {"train_loss": -19.1514892578125, "global_step": 31356, "epoch": 377} {"train_loss": -18.717634201049805, "global_step": 31357, "epoch": 377} {"train_loss": -19.40349006652832, "global_step": 31358, "epoch": 377} {"train_loss": -19.054649353027344, "global_step": 31359, "epoch": 377} {"train_loss": -19.074230194091797, "global_step": 31360, "epoch": 377} {"train_loss": -19.10004234313965, "global_step": 31361, "epoch": 377} {"train_loss": -19.447805404663086, "global_step": 31362, "epoch": 377} {"train_loss": -19.1901798248291, "global_step": 31363, "epoch": 377} {"train_loss": -18.369121551513672, "global_step": 31364, "epoch": 377} {"train_loss": -19.198392868041992, "global_step": 31365, "epoch": 377} {"train_loss": -19.010251998901367, "global_step": 31366, "epoch": 377} {"train_loss": -18.864614486694336, "global_step": 31367, "epoch": 377} {"train_loss": -19.198713302612305, "global_step": 31368, "epoch": 377} {"train_loss": -18.838712692260742, "global_step": 31369, "epoch": 377} {"train_loss": -19.254791259765625, "global_step": 31370, "epoch": 377} {"train_loss": -19.260879516601562, "global_step": 31371, "epoch": 377} {"train_loss": -19.254261016845703, "global_step": 31372, "epoch": 377} {"train_loss": -18.996521065034063, "global_step": 31373, "epoch": 377, "val_loss": 6145344.0} {"train_loss": -18.59222984313965, "global_step": 31374, "epoch": 378} {"train_loss": -19.130159378051758, "global_step": 31375, "epoch": 378} {"train_loss": -18.823083877563477, "global_step": 31376, "epoch": 378} {"train_loss": -18.51091957092285, "global_step": 31377, "epoch": 378} {"train_loss": -18.625375747680664, "global_step": 31378, "epoch": 378} {"train_loss": -18.789321899414062, "global_step": 31379, "epoch": 378} {"train_loss": -19.35638427734375, "global_step": 31380, "epoch": 378} {"train_loss": -18.76326560974121, "global_step": 31381, "epoch": 378} {"train_loss": -18.85843276977539, "global_step": 31382, "epoch": 378} {"train_loss": -19.0194149017334, "global_step": 31383, "epoch": 378} {"train_loss": -19.046972274780273, "global_step": 31384, "epoch": 378} {"train_loss": -19.021467208862305, "global_step": 31385, "epoch": 378} {"train_loss": -18.838083267211914, "global_step": 31386, "epoch": 378} {"train_loss": -18.854183197021484, "global_step": 31387, "epoch": 378} {"train_loss": -19.000152587890625, "global_step": 31388, "epoch": 378} {"train_loss": -18.962749481201172, "global_step": 31389, "epoch": 378} {"train_loss": -19.18739128112793, "global_step": 31390, "epoch": 378} {"train_loss": -19.63201141357422, "global_step": 31391, "epoch": 378} {"train_loss": -19.326147079467773, "global_step": 31392, "epoch": 378} {"train_loss": -18.966445922851562, "global_step": 31393, "epoch": 378} {"train_loss": -19.43630599975586, "global_step": 31394, "epoch": 378} {"train_loss": -18.861764907836914, "global_step": 31395, "epoch": 378} {"train_loss": -18.529197692871094, "global_step": 31396, "epoch": 378} {"train_loss": -19.012624740600586, "global_step": 31397, "epoch": 378} {"train_loss": -19.160240173339844, "global_step": 31398, "epoch": 378} {"train_loss": -19.008567810058594, "global_step": 31399, "epoch": 378} {"train_loss": -18.937610626220703, "global_step": 31400, "epoch": 378} {"train_loss": -18.868934631347656, "global_step": 31401, "epoch": 378} {"train_loss": -19.027738571166992, "global_step": 31402, "epoch": 378} {"train_loss": -19.330289840698242, "global_step": 31403, "epoch": 378} {"train_loss": -19.08878517150879, "global_step": 31404, "epoch": 378} {"train_loss": -18.735504150390625, "global_step": 31405, "epoch": 378} {"train_loss": -19.079267501831055, "global_step": 31406, "epoch": 378} {"train_loss": -19.228940963745117, "global_step": 31407, "epoch": 378} {"train_loss": -18.92203712463379, "global_step": 31408, "epoch": 378} {"train_loss": -19.183691024780273, "global_step": 31409, "epoch": 378} {"train_loss": -19.104156494140625, "global_step": 31410, "epoch": 378} {"train_loss": -19.1887264251709, "global_step": 31411, "epoch": 378} {"train_loss": -19.207590103149414, "global_step": 31412, "epoch": 378} {"train_loss": -18.813919067382812, "global_step": 31413, "epoch": 378} {"train_loss": -19.33649253845215, "global_step": 31414, "epoch": 378} {"train_loss": -18.735212326049805, "global_step": 31415, "epoch": 378} {"train_loss": -18.87116813659668, "global_step": 31416, "epoch": 378} {"train_loss": -19.041980743408203, "global_step": 31417, "epoch": 378} {"train_loss": -19.116872787475586, "global_step": 31418, "epoch": 378} {"train_loss": -18.813756942749023, "global_step": 31419, "epoch": 378} {"train_loss": -18.8674373626709, "global_step": 31420, "epoch": 378} {"train_loss": -18.743337631225586, "global_step": 31421, "epoch": 378} {"train_loss": -18.799226760864258, "global_step": 31422, "epoch": 378} {"train_loss": -18.802274703979492, "global_step": 31423, "epoch": 378} {"train_loss": -19.0720157623291, "global_step": 31424, "epoch": 378} {"train_loss": -18.977380752563477, "global_step": 31425, "epoch": 378} {"train_loss": -18.892105102539062, "global_step": 31426, "epoch": 378} {"train_loss": -18.816513061523438, "global_step": 31427, "epoch": 378} {"train_loss": -18.918075561523438, "global_step": 31428, "epoch": 378} {"train_loss": -18.776546478271484, "global_step": 31429, "epoch": 378} {"train_loss": -19.343984603881836, "global_step": 31430, "epoch": 378} {"train_loss": -19.00980567932129, "global_step": 31431, "epoch": 378} {"train_loss": -19.011600494384766, "global_step": 31432, "epoch": 378} {"train_loss": -19.016948699951172, "global_step": 31433, "epoch": 378} {"train_loss": -18.984329223632812, "global_step": 31434, "epoch": 378} {"train_loss": -19.18183708190918, "global_step": 31435, "epoch": 378} {"train_loss": -19.150094985961914, "global_step": 31436, "epoch": 378} {"train_loss": -18.614858627319336, "global_step": 31437, "epoch": 378} {"train_loss": -18.917387008666992, "global_step": 31438, "epoch": 378} {"train_loss": -19.263214111328125, "global_step": 31439, "epoch": 378} {"train_loss": -19.287353515625, "global_step": 31440, "epoch": 378} {"train_loss": -19.219711303710938, "global_step": 31441, "epoch": 378} {"train_loss": -19.109323501586914, "global_step": 31442, "epoch": 378} {"train_loss": -19.242502212524414, "global_step": 31443, "epoch": 378} {"train_loss": -18.8778076171875, "global_step": 31444, "epoch": 378} {"train_loss": -19.07994270324707, "global_step": 31445, "epoch": 378} {"train_loss": -19.39004898071289, "global_step": 31446, "epoch": 378} {"train_loss": -18.955427169799805, "global_step": 31447, "epoch": 378} {"train_loss": -19.18182945251465, "global_step": 31448, "epoch": 378} {"train_loss": -18.87729835510254, "global_step": 31449, "epoch": 378} {"train_loss": -19.18385887145996, "global_step": 31450, "epoch": 378} {"train_loss": -18.924726486206055, "global_step": 31451, "epoch": 378} {"train_loss": -18.937774658203125, "global_step": 31452, "epoch": 378} {"train_loss": -19.25663185119629, "global_step": 31453, "epoch": 378} {"train_loss": -19.018795013427734, "global_step": 31454, "epoch": 378} {"train_loss": -18.965023040771484, "global_step": 31455, "epoch": 378} {"train_loss": -19.01193320033062, "global_step": 31456, "epoch": 378, "val_loss": 6025934.5} {"train_loss": -18.580453872680664, "global_step": 31457, "epoch": 379} {"train_loss": -19.054651260375977, "global_step": 31458, "epoch": 379} {"train_loss": -18.927167892456055, "global_step": 31459, "epoch": 379} {"train_loss": -18.870452880859375, "global_step": 31460, "epoch": 379} {"train_loss": -18.63274383544922, "global_step": 31461, "epoch": 379} {"train_loss": -18.6171932220459, "global_step": 31462, "epoch": 379} {"train_loss": -19.12649154663086, "global_step": 31463, "epoch": 379} {"train_loss": -18.72822380065918, "global_step": 31464, "epoch": 379} {"train_loss": -19.438682556152344, "global_step": 31465, "epoch": 379} {"train_loss": -18.92510986328125, "global_step": 31466, "epoch": 379} {"train_loss": -19.043869018554688, "global_step": 31467, "epoch": 379} {"train_loss": -19.35717010498047, "global_step": 31468, "epoch": 379} {"train_loss": -18.97427749633789, "global_step": 31469, "epoch": 379} {"train_loss": -18.886760711669922, "global_step": 31470, "epoch": 379} {"train_loss": -18.986310958862305, "global_step": 31471, "epoch": 379} {"train_loss": -19.22158432006836, "global_step": 31472, "epoch": 379} {"train_loss": -18.94483757019043, "global_step": 31473, "epoch": 379} {"train_loss": -18.768081665039062, "global_step": 31474, "epoch": 379} {"train_loss": -19.258056640625, "global_step": 31475, "epoch": 379} {"train_loss": -18.850482940673828, "global_step": 31476, "epoch": 379} {"train_loss": -18.77387046813965, "global_step": 31477, "epoch": 379} {"train_loss": -18.945064544677734, "global_step": 31478, "epoch": 379} {"train_loss": -18.986682891845703, "global_step": 31479, "epoch": 379} {"train_loss": -19.056943893432617, "global_step": 31480, "epoch": 379} {"train_loss": -18.797330856323242, "global_step": 31481, "epoch": 379} {"train_loss": -18.819889068603516, "global_step": 31482, "epoch": 379} {"train_loss": -19.00489044189453, "global_step": 31483, "epoch": 379} {"train_loss": -19.02619743347168, "global_step": 31484, "epoch": 379} {"train_loss": -18.626953125, "global_step": 31485, "epoch": 379} {"train_loss": -19.24896812438965, "global_step": 31486, "epoch": 379} {"train_loss": -19.137601852416992, "global_step": 31487, "epoch": 379} {"train_loss": -18.860254287719727, "global_step": 31488, "epoch": 379} {"train_loss": -19.0423526763916, "global_step": 31489, "epoch": 379} {"train_loss": -19.00102996826172, "global_step": 31490, "epoch": 379} {"train_loss": -19.310453414916992, "global_step": 31491, "epoch": 379} {"train_loss": -19.167098999023438, "global_step": 31492, "epoch": 379} {"train_loss": -19.09742546081543, "global_step": 31493, "epoch": 379} {"train_loss": -18.887853622436523, "global_step": 31494, "epoch": 379} {"train_loss": -19.17845916748047, "global_step": 31495, "epoch": 379} {"train_loss": -19.086912155151367, "global_step": 31496, "epoch": 379} {"train_loss": -18.940282821655273, "global_step": 31497, "epoch": 379} {"train_loss": -19.277875900268555, "global_step": 31498, "epoch": 379} {"train_loss": -19.349720001220703, "global_step": 31499, "epoch": 379} {"train_loss": -19.5748291015625, "global_step": 31500, "epoch": 379} {"train_loss": -19.038022994995117, "global_step": 31501, "epoch": 379} {"train_loss": -18.969013214111328, "global_step": 31502, "epoch": 379} {"train_loss": -18.98032569885254, "global_step": 31503, "epoch": 379} {"train_loss": -19.120351791381836, "global_step": 31504, "epoch": 379} {"train_loss": -18.798919677734375, "global_step": 31505, "epoch": 379} {"train_loss": -18.900793075561523, "global_step": 31506, "epoch": 379} {"train_loss": -18.908206939697266, "global_step": 31507, "epoch": 379} {"train_loss": -18.62092399597168, "global_step": 31508, "epoch": 379} {"train_loss": -19.375768661499023, "global_step": 31509, "epoch": 379} {"train_loss": -18.57615852355957, "global_step": 31510, "epoch": 379} {"train_loss": -18.926773071289062, "global_step": 31511, "epoch": 379} {"train_loss": -18.985315322875977, "global_step": 31512, "epoch": 379} {"train_loss": -18.79389762878418, "global_step": 31513, "epoch": 379} {"train_loss": -18.929372787475586, "global_step": 31514, "epoch": 379} {"train_loss": -18.753095626831055, "global_step": 31515, "epoch": 379} {"train_loss": -19.149415969848633, "global_step": 31516, "epoch": 379} {"train_loss": -19.099613189697266, "global_step": 31517, "epoch": 379} {"train_loss": -19.097360610961914, "global_step": 31518, "epoch": 379} {"train_loss": -19.145429611206055, "global_step": 31519, "epoch": 379} {"train_loss": -18.911121368408203, "global_step": 31520, "epoch": 379} {"train_loss": -18.873876571655273, "global_step": 31521, "epoch": 379} {"train_loss": -19.08930015563965, "global_step": 31522, "epoch": 379} {"train_loss": -19.073522567749023, "global_step": 31523, "epoch": 379} {"train_loss": -19.148181915283203, "global_step": 31524, "epoch": 379} {"train_loss": -18.95191764831543, "global_step": 31525, "epoch": 379} {"train_loss": -18.605295181274414, "global_step": 31526, "epoch": 379} {"train_loss": -19.1014461517334, "global_step": 31527, "epoch": 379} {"train_loss": -19.15597915649414, "global_step": 31528, "epoch": 379} {"train_loss": -19.169513702392578, "global_step": 31529, "epoch": 379} {"train_loss": -18.94194984436035, "global_step": 31530, "epoch": 379} {"train_loss": -19.181629180908203, "global_step": 31531, "epoch": 379} {"train_loss": -19.089101791381836, "global_step": 31532, "epoch": 379} {"train_loss": -19.2421932220459, "global_step": 31533, "epoch": 379} {"train_loss": -19.307174682617188, "global_step": 31534, "epoch": 379} {"train_loss": -19.011350631713867, "global_step": 31535, "epoch": 379} {"train_loss": -18.62976837158203, "global_step": 31536, "epoch": 379} {"train_loss": -19.16155433654785, "global_step": 31537, "epoch": 379} {"train_loss": -19.012737274169922, "global_step": 31538, "epoch": 379} {"train_loss": -18.999285180884673, "global_step": 31539, "epoch": 379, "val_loss": 6070152.5} {"train_loss": -18.561567306518555, "global_step": 31540, "epoch": 380} {"train_loss": -19.308914184570312, "global_step": 31541, "epoch": 380} {"train_loss": -18.555545806884766, "global_step": 31542, "epoch": 380} {"train_loss": -18.90363311767578, "global_step": 31543, "epoch": 380} {"train_loss": -18.530195236206055, "global_step": 31544, "epoch": 380} {"train_loss": -18.56696891784668, "global_step": 31545, "epoch": 380} {"train_loss": -19.16049575805664, "global_step": 31546, "epoch": 380} {"train_loss": -18.739572525024414, "global_step": 31547, "epoch": 380} {"train_loss": -19.183917999267578, "global_step": 31548, "epoch": 380} {"train_loss": -18.793771743774414, "global_step": 31549, "epoch": 380} {"train_loss": -18.648895263671875, "global_step": 31550, "epoch": 380} {"train_loss": -18.721572875976562, "global_step": 31551, "epoch": 380} {"train_loss": -19.120079040527344, "global_step": 31552, "epoch": 380} {"train_loss": -18.719282150268555, "global_step": 31553, "epoch": 380} {"train_loss": -19.183847427368164, "global_step": 31554, "epoch": 380} {"train_loss": -19.645980834960938, "global_step": 31555, "epoch": 380} {"train_loss": -18.909177780151367, "global_step": 31556, "epoch": 380} {"train_loss": -19.0120849609375, "global_step": 31557, "epoch": 380} {"train_loss": -18.642597198486328, "global_step": 31558, "epoch": 380} {"train_loss": -18.897342681884766, "global_step": 31559, "epoch": 380} {"train_loss": -19.337553024291992, "global_step": 31560, "epoch": 380} {"train_loss": -19.01643943786621, "global_step": 31561, "epoch": 380} {"train_loss": -19.1623477935791, "global_step": 31562, "epoch": 380} {"train_loss": -18.876333236694336, "global_step": 31563, "epoch": 380} {"train_loss": -18.96841812133789, "global_step": 31564, "epoch": 380} {"train_loss": -19.059326171875, "global_step": 31565, "epoch": 380} {"train_loss": -19.124990463256836, "global_step": 31566, "epoch": 380} {"train_loss": -18.974637985229492, "global_step": 31567, "epoch": 380} {"train_loss": -18.82463264465332, "global_step": 31568, "epoch": 380} {"train_loss": -19.239538192749023, "global_step": 31569, "epoch": 380} {"train_loss": -19.32965660095215, "global_step": 31570, "epoch": 380} {"train_loss": -19.169017791748047, "global_step": 31571, "epoch": 380} {"train_loss": -18.914857864379883, "global_step": 31572, "epoch": 380} {"train_loss": -18.753131866455078, "global_step": 31573, "epoch": 380} {"train_loss": -18.545862197875977, "global_step": 31574, "epoch": 380} {"train_loss": -19.30564308166504, "global_step": 31575, "epoch": 380} {"train_loss": -18.873062133789062, "global_step": 31576, "epoch": 380} {"train_loss": -19.379003524780273, "global_step": 31577, "epoch": 380} {"train_loss": -19.432050704956055, "global_step": 31578, "epoch": 380} {"train_loss": -18.942304611206055, "global_step": 31579, "epoch": 380} {"train_loss": -19.148582458496094, "global_step": 31580, "epoch": 380} {"train_loss": -18.90260124206543, "global_step": 31581, "epoch": 380} {"train_loss": -18.901201248168945, "global_step": 31582, "epoch": 380} {"train_loss": -19.19666862487793, "global_step": 31583, "epoch": 380} {"train_loss": -19.12071990966797, "global_step": 31584, "epoch": 380} {"train_loss": -19.161121368408203, "global_step": 31585, "epoch": 380} {"train_loss": -18.9456844329834, "global_step": 31586, "epoch": 380} {"train_loss": -19.464672088623047, "global_step": 31587, "epoch": 380} {"train_loss": -18.81456756591797, "global_step": 31588, "epoch": 380} {"train_loss": -19.100133895874023, "global_step": 31589, "epoch": 380} {"train_loss": -18.82697105407715, "global_step": 31590, "epoch": 380} {"train_loss": -18.971445083618164, "global_step": 31591, "epoch": 380} {"train_loss": -18.885181427001953, "global_step": 31592, "epoch": 380} {"train_loss": -18.952091217041016, "global_step": 31593, "epoch": 380} {"train_loss": -19.143503189086914, "global_step": 31594, "epoch": 380} {"train_loss": -19.362960815429688, "global_step": 31595, "epoch": 380} {"train_loss": -18.984222412109375, "global_step": 31596, "epoch": 380} {"train_loss": -19.426738739013672, "global_step": 31597, "epoch": 380} {"train_loss": -18.690776824951172, "global_step": 31598, "epoch": 380} {"train_loss": -19.226831436157227, "global_step": 31599, "epoch": 380} {"train_loss": -19.13006591796875, "global_step": 31600, "epoch": 380} {"train_loss": -19.00449562072754, "global_step": 31601, "epoch": 380} {"train_loss": -18.804553985595703, "global_step": 31602, "epoch": 380} {"train_loss": -19.231796264648438, "global_step": 31603, "epoch": 380} {"train_loss": -19.099851608276367, "global_step": 31604, "epoch": 380} {"train_loss": -18.84612464904785, "global_step": 31605, "epoch": 380} {"train_loss": -18.727628707885742, "global_step": 31606, "epoch": 380} {"train_loss": -19.084442138671875, "global_step": 31607, "epoch": 380} {"train_loss": -19.105731964111328, "global_step": 31608, "epoch": 380} {"train_loss": -18.70469093322754, "global_step": 31609, "epoch": 380} {"train_loss": -19.091190338134766, "global_step": 31610, "epoch": 380} {"train_loss": -19.332077026367188, "global_step": 31611, "epoch": 380} {"train_loss": -18.686824798583984, "global_step": 31612, "epoch": 380} {"train_loss": -18.89954948425293, "global_step": 31613, "epoch": 380} {"train_loss": -18.844390869140625, "global_step": 31614, "epoch": 380} {"train_loss": -19.161447525024414, "global_step": 31615, "epoch": 380} {"train_loss": -18.596752166748047, "global_step": 31616, "epoch": 380} {"train_loss": -19.03061866760254, "global_step": 31617, "epoch": 380} {"train_loss": -18.852462768554688, "global_step": 31618, "epoch": 380} {"train_loss": -19.429821014404297, "global_step": 31619, "epoch": 380} {"train_loss": -19.2026424407959, "global_step": 31620, "epoch": 380} {"train_loss": -18.911298751831055, "global_step": 31621, "epoch": 380} {"train_loss": -19.010895970356035, "global_step": 31622, "epoch": 380, "val_loss": 5944467.0} {"train_loss": -18.82695198059082, "global_step": 31623, "epoch": 381} {"train_loss": -18.89781379699707, "global_step": 31624, "epoch": 381} {"train_loss": -18.51931381225586, "global_step": 31625, "epoch": 381} {"train_loss": -18.88603973388672, "global_step": 31626, "epoch": 381} {"train_loss": -18.964628219604492, "global_step": 31627, "epoch": 381} {"train_loss": -18.884008407592773, "global_step": 31628, "epoch": 381} {"train_loss": -18.689035415649414, "global_step": 31629, "epoch": 381} {"train_loss": -18.740537643432617, "global_step": 31630, "epoch": 381} {"train_loss": -18.377355575561523, "global_step": 31631, "epoch": 381} {"train_loss": -19.299375534057617, "global_step": 31632, "epoch": 381} {"train_loss": -18.965688705444336, "global_step": 31633, "epoch": 381} {"train_loss": -19.284889221191406, "global_step": 31634, "epoch": 381} {"train_loss": -18.979324340820312, "global_step": 31635, "epoch": 381} {"train_loss": -18.957584381103516, "global_step": 31636, "epoch": 381} {"train_loss": -18.825061798095703, "global_step": 31637, "epoch": 381} {"train_loss": -18.732280731201172, "global_step": 31638, "epoch": 381} {"train_loss": -19.11958885192871, "global_step": 31639, "epoch": 381} {"train_loss": -18.957365036010742, "global_step": 31640, "epoch": 381} {"train_loss": -19.215551376342773, "global_step": 31641, "epoch": 381} {"train_loss": -18.890810012817383, "global_step": 31642, "epoch": 381} {"train_loss": -19.007505416870117, "global_step": 31643, "epoch": 381} {"train_loss": -18.702789306640625, "global_step": 31644, "epoch": 381} {"train_loss": -19.424280166625977, "global_step": 31645, "epoch": 381} {"train_loss": -19.387252807617188, "global_step": 31646, "epoch": 381} {"train_loss": -19.162214279174805, "global_step": 31647, "epoch": 381} {"train_loss": -18.665678024291992, "global_step": 31648, "epoch": 381} {"train_loss": -19.214414596557617, "global_step": 31649, "epoch": 381} {"train_loss": -18.95509910583496, "global_step": 31650, "epoch": 381} {"train_loss": -19.1915225982666, "global_step": 31651, "epoch": 381} {"train_loss": -18.68965721130371, "global_step": 31652, "epoch": 381} {"train_loss": -18.918306350708008, "global_step": 31653, "epoch": 381} {"train_loss": -18.47618293762207, "global_step": 31654, "epoch": 381} {"train_loss": -19.10795021057129, "global_step": 31655, "epoch": 381} {"train_loss": -18.795156478881836, "global_step": 31656, "epoch": 381} {"train_loss": -19.430435180664062, "global_step": 31657, "epoch": 381} {"train_loss": -19.36176872253418, "global_step": 31658, "epoch": 381} {"train_loss": -19.023908615112305, "global_step": 31659, "epoch": 381} {"train_loss": -18.879858016967773, "global_step": 31660, "epoch": 381} {"train_loss": -19.24244499206543, "global_step": 31661, "epoch": 381} {"train_loss": -18.77969741821289, "global_step": 31662, "epoch": 381} {"train_loss": -19.073993682861328, "global_step": 31663, "epoch": 381} {"train_loss": -19.191076278686523, "global_step": 31664, "epoch": 381} {"train_loss": -19.009136199951172, "global_step": 31665, "epoch": 381} {"train_loss": -18.60124397277832, "global_step": 31666, "epoch": 381} {"train_loss": -19.16120719909668, "global_step": 31667, "epoch": 381} {"train_loss": -19.216495513916016, "global_step": 31668, "epoch": 381} {"train_loss": -18.952667236328125, "global_step": 31669, "epoch": 381} {"train_loss": -19.177461624145508, "global_step": 31670, "epoch": 381} {"train_loss": -19.08998680114746, "global_step": 31671, "epoch": 381} {"train_loss": -18.930891036987305, "global_step": 31672, "epoch": 381} {"train_loss": -18.930801391601562, "global_step": 31673, "epoch": 381} {"train_loss": -18.774145126342773, "global_step": 31674, "epoch": 381} {"train_loss": -18.815908432006836, "global_step": 31675, "epoch": 381} {"train_loss": -19.19977378845215, "global_step": 31676, "epoch": 381} {"train_loss": -19.5031795501709, "global_step": 31677, "epoch": 381} {"train_loss": -19.137006759643555, "global_step": 31678, "epoch": 381} {"train_loss": -18.86481285095215, "global_step": 31679, "epoch": 381} {"train_loss": -18.875028610229492, "global_step": 31680, "epoch": 381} {"train_loss": -19.190114974975586, "global_step": 31681, "epoch": 381} {"train_loss": -19.368085861206055, "global_step": 31682, "epoch": 381} {"train_loss": -18.937776565551758, "global_step": 31683, "epoch": 381} {"train_loss": -18.803388595581055, "global_step": 31684, "epoch": 381} {"train_loss": -19.34391975402832, "global_step": 31685, "epoch": 381} {"train_loss": -19.302513122558594, "global_step": 31686, "epoch": 381} {"train_loss": -18.69449806213379, "global_step": 31687, "epoch": 381} {"train_loss": -18.9898681640625, "global_step": 31688, "epoch": 381} {"train_loss": -19.01009178161621, "global_step": 31689, "epoch": 381} {"train_loss": -18.96864128112793, "global_step": 31690, "epoch": 381} {"train_loss": -19.14499282836914, "global_step": 31691, "epoch": 381} {"train_loss": -19.120946884155273, "global_step": 31692, "epoch": 381} {"train_loss": -18.999040603637695, "global_step": 31693, "epoch": 381} {"train_loss": -19.267972946166992, "global_step": 31694, "epoch": 381} {"train_loss": -19.14632225036621, "global_step": 31695, "epoch": 381} {"train_loss": -19.34299087524414, "global_step": 31696, "epoch": 381} {"train_loss": -18.932418823242188, "global_step": 31697, "epoch": 381} {"train_loss": -18.84596061706543, "global_step": 31698, "epoch": 381} {"train_loss": -19.110315322875977, "global_step": 31699, "epoch": 381} {"train_loss": -19.254901885986328, "global_step": 31700, "epoch": 381} {"train_loss": -18.86069679260254, "global_step": 31701, "epoch": 381} {"train_loss": -19.01850700378418, "global_step": 31702, "epoch": 381} {"train_loss": -18.93674659729004, "global_step": 31703, "epoch": 381} {"train_loss": -18.629453659057617, "global_step": 31704, "epoch": 381} {"train_loss": -18.984619692147497, "global_step": 31705, "epoch": 381, "val_loss": 5992958.5} {"train_loss": -18.302526473999023, "global_step": 31706, "epoch": 382} {"train_loss": -18.709169387817383, "global_step": 31707, "epoch": 382} {"train_loss": -18.79178237915039, "global_step": 31708, "epoch": 382} {"train_loss": -18.753463745117188, "global_step": 31709, "epoch": 382} {"train_loss": -18.864904403686523, "global_step": 31710, "epoch": 382} {"train_loss": -19.013221740722656, "global_step": 31711, "epoch": 382} {"train_loss": -18.9951114654541, "global_step": 31712, "epoch": 382} {"train_loss": -18.752769470214844, "global_step": 31713, "epoch": 382} {"train_loss": -18.699440002441406, "global_step": 31714, "epoch": 382} {"train_loss": -18.66570281982422, "global_step": 31715, "epoch": 382} {"train_loss": -19.106185913085938, "global_step": 31716, "epoch": 382} {"train_loss": -18.615903854370117, "global_step": 31717, "epoch": 382} {"train_loss": -19.08686065673828, "global_step": 31718, "epoch": 382} {"train_loss": -18.869428634643555, "global_step": 31719, "epoch": 382} {"train_loss": -18.919260025024414, "global_step": 31720, "epoch": 382} {"train_loss": -18.9317626953125, "global_step": 31721, "epoch": 382} {"train_loss": -18.711191177368164, "global_step": 31722, "epoch": 382} {"train_loss": -19.26096534729004, "global_step": 31723, "epoch": 382} {"train_loss": -18.917875289916992, "global_step": 31724, "epoch": 382} {"train_loss": -19.36537742614746, "global_step": 31725, "epoch": 382} {"train_loss": -19.110464096069336, "global_step": 31726, "epoch": 382} {"train_loss": -19.32869529724121, "global_step": 31727, "epoch": 382} {"train_loss": -18.97490882873535, "global_step": 31728, "epoch": 382} {"train_loss": -18.748428344726562, "global_step": 31729, "epoch": 382} {"train_loss": -18.73286247253418, "global_step": 31730, "epoch": 382} {"train_loss": -19.141393661499023, "global_step": 31731, "epoch": 382} {"train_loss": -18.709503173828125, "global_step": 31732, "epoch": 382} {"train_loss": -19.12465476989746, "global_step": 31733, "epoch": 382} {"train_loss": -19.255210876464844, "global_step": 31734, "epoch": 382} {"train_loss": -18.592031478881836, "global_step": 31735, "epoch": 382} {"train_loss": -18.948286056518555, "global_step": 31736, "epoch": 382} {"train_loss": -19.0465087890625, "global_step": 31737, "epoch": 382} {"train_loss": -19.03693962097168, "global_step": 31738, "epoch": 382} {"train_loss": -18.703643798828125, "global_step": 31739, "epoch": 382} {"train_loss": -19.334989547729492, "global_step": 31740, "epoch": 382} {"train_loss": -19.031524658203125, "global_step": 31741, "epoch": 382} {"train_loss": -19.007883071899414, "global_step": 31742, "epoch": 382} {"train_loss": -18.993085861206055, "global_step": 31743, "epoch": 382} {"train_loss": -18.977025985717773, "global_step": 31744, "epoch": 382} {"train_loss": -18.869800567626953, "global_step": 31745, "epoch": 382} {"train_loss": -18.56995391845703, "global_step": 31746, "epoch": 382} {"train_loss": -18.76746940612793, "global_step": 31747, "epoch": 382} {"train_loss": -19.344717025756836, "global_step": 31748, "epoch": 382} {"train_loss": -18.916990280151367, "global_step": 31749, "epoch": 382} {"train_loss": -19.019437789916992, "global_step": 31750, "epoch": 382} {"train_loss": -18.940107345581055, "global_step": 31751, "epoch": 382} {"train_loss": -19.27696990966797, "global_step": 31752, "epoch": 382} {"train_loss": -19.341506958007812, "global_step": 31753, "epoch": 382} {"train_loss": -19.31972312927246, "global_step": 31754, "epoch": 382} {"train_loss": -19.093040466308594, "global_step": 31755, "epoch": 382} {"train_loss": -18.826868057250977, "global_step": 31756, "epoch": 382} {"train_loss": -19.014368057250977, "global_step": 31757, "epoch": 382} {"train_loss": -19.153398513793945, "global_step": 31758, "epoch": 382} {"train_loss": -19.200416564941406, "global_step": 31759, "epoch": 382} {"train_loss": -18.54781150817871, "global_step": 31760, "epoch": 382} {"train_loss": -18.864696502685547, "global_step": 31761, "epoch": 382} {"train_loss": -19.372468948364258, "global_step": 31762, "epoch": 382} {"train_loss": -19.27167320251465, "global_step": 31763, "epoch": 382} {"train_loss": -19.13753318786621, "global_step": 31764, "epoch": 382} {"train_loss": -18.942768096923828, "global_step": 31765, "epoch": 382} {"train_loss": -19.186168670654297, "global_step": 31766, "epoch": 382} {"train_loss": -18.994394302368164, "global_step": 31767, "epoch": 382} {"train_loss": -19.04347038269043, "global_step": 31768, "epoch": 382} {"train_loss": -18.880537033081055, "global_step": 31769, "epoch": 382} {"train_loss": -18.870397567749023, "global_step": 31770, "epoch": 382} {"train_loss": -18.603534698486328, "global_step": 31771, "epoch": 382} {"train_loss": -19.16036033630371, "global_step": 31772, "epoch": 382} {"train_loss": -19.0636043548584, "global_step": 31773, "epoch": 382} {"train_loss": -18.882389068603516, "global_step": 31774, "epoch": 382} {"train_loss": -18.909719467163086, "global_step": 31775, "epoch": 382} {"train_loss": -19.312040328979492, "global_step": 31776, "epoch": 382} {"train_loss": -19.046630859375, "global_step": 31777, "epoch": 382} {"train_loss": -19.027029037475586, "global_step": 31778, "epoch": 382} {"train_loss": -19.070697784423828, "global_step": 31779, "epoch": 382} {"train_loss": -19.074054718017578, "global_step": 31780, "epoch": 382} {"train_loss": -19.276403427124023, "global_step": 31781, "epoch": 382} {"train_loss": -19.13588523864746, "global_step": 31782, "epoch": 382} {"train_loss": -18.671024322509766, "global_step": 31783, "epoch": 382} {"train_loss": -18.663625717163086, "global_step": 31784, "epoch": 382} {"train_loss": -19.18793296813965, "global_step": 31785, "epoch": 382} {"train_loss": -18.823965072631836, "global_step": 31786, "epoch": 382} {"train_loss": -19.07797622680664, "global_step": 31787, "epoch": 382} {"train_loss": -18.97648262115846, "global_step": 31788, "epoch": 382, "val_loss": 6161028.0} {"train_loss": -18.854875564575195, "global_step": 31789, "epoch": 383} {"train_loss": -19.07567596435547, "global_step": 31790, "epoch": 383} {"train_loss": -18.635618209838867, "global_step": 31791, "epoch": 383} {"train_loss": -18.88238525390625, "global_step": 31792, "epoch": 383} {"train_loss": -19.1090145111084, "global_step": 31793, "epoch": 383} {"train_loss": -18.80069923400879, "global_step": 31794, "epoch": 383} {"train_loss": -19.125715255737305, "global_step": 31795, "epoch": 383} {"train_loss": -19.015668869018555, "global_step": 31796, "epoch": 383} {"train_loss": -18.922576904296875, "global_step": 31797, "epoch": 383} {"train_loss": -19.111719131469727, "global_step": 31798, "epoch": 383} {"train_loss": -19.168781280517578, "global_step": 31799, "epoch": 383} {"train_loss": -18.896148681640625, "global_step": 31800, "epoch": 383} {"train_loss": -18.79059410095215, "global_step": 31801, "epoch": 383} {"train_loss": -19.325973510742188, "global_step": 31802, "epoch": 383} {"train_loss": -18.757741928100586, "global_step": 31803, "epoch": 383} {"train_loss": -19.308202743530273, "global_step": 31804, "epoch": 383} {"train_loss": -18.938383102416992, "global_step": 31805, "epoch": 383} {"train_loss": -18.634063720703125, "global_step": 31806, "epoch": 383} {"train_loss": -18.89938735961914, "global_step": 31807, "epoch": 383} {"train_loss": -19.040576934814453, "global_step": 31808, "epoch": 383} {"train_loss": -18.95216941833496, "global_step": 31809, "epoch": 383} {"train_loss": -18.88898468017578, "global_step": 31810, "epoch": 383} {"train_loss": -18.642292022705078, "global_step": 31811, "epoch": 383} {"train_loss": -19.286611557006836, "global_step": 31812, "epoch": 383} {"train_loss": -19.406137466430664, "global_step": 31813, "epoch": 383} {"train_loss": -18.960906982421875, "global_step": 31814, "epoch": 383} {"train_loss": -18.887121200561523, "global_step": 31815, "epoch": 383} {"train_loss": -19.346134185791016, "global_step": 31816, "epoch": 383} {"train_loss": -18.874374389648438, "global_step": 31817, "epoch": 383} {"train_loss": -18.61847496032715, "global_step": 31818, "epoch": 383} {"train_loss": -18.8925838470459, "global_step": 31819, "epoch": 383} {"train_loss": -19.427101135253906, "global_step": 31820, "epoch": 383} {"train_loss": -18.908456802368164, "global_step": 31821, "epoch": 383} {"train_loss": -19.290395736694336, "global_step": 31822, "epoch": 383} {"train_loss": -19.304651260375977, "global_step": 31823, "epoch": 383} {"train_loss": -19.036407470703125, "global_step": 31824, "epoch": 383} {"train_loss": -19.298583984375, "global_step": 31825, "epoch": 383} {"train_loss": -18.728445053100586, "global_step": 31826, "epoch": 383} {"train_loss": -19.293394088745117, "global_step": 31827, "epoch": 383} {"train_loss": -19.187341690063477, "global_step": 31828, "epoch": 383} {"train_loss": -19.440332412719727, "global_step": 31829, "epoch": 383} {"train_loss": -19.15419578552246, "global_step": 31830, "epoch": 383} {"train_loss": -19.542774200439453, "global_step": 31831, "epoch": 383} {"train_loss": -18.642797470092773, "global_step": 31832, "epoch": 383} {"train_loss": -18.891357421875, "global_step": 31833, "epoch": 383} {"train_loss": -19.131895065307617, "global_step": 31834, "epoch": 383} {"train_loss": -19.24407386779785, "global_step": 31835, "epoch": 383} {"train_loss": -18.723163604736328, "global_step": 31836, "epoch": 383} {"train_loss": -19.014333724975586, "global_step": 31837, "epoch": 383} {"train_loss": -19.2681884765625, "global_step": 31838, "epoch": 383} {"train_loss": -18.661447525024414, "global_step": 31839, "epoch": 383} {"train_loss": -18.7557430267334, "global_step": 31840, "epoch": 383} {"train_loss": -19.11678123474121, "global_step": 31841, "epoch": 383} {"train_loss": -18.981061935424805, "global_step": 31842, "epoch": 383} {"train_loss": -18.73738670349121, "global_step": 31843, "epoch": 383} {"train_loss": -19.103715896606445, "global_step": 31844, "epoch": 383} {"train_loss": -18.88498878479004, "global_step": 31845, "epoch": 383} {"train_loss": -18.644498825073242, "global_step": 31846, "epoch": 383} {"train_loss": -19.05662727355957, "global_step": 31847, "epoch": 383} {"train_loss": -19.27715492248535, "global_step": 31848, "epoch": 383} {"train_loss": -19.164648056030273, "global_step": 31849, "epoch": 383} {"train_loss": -18.983304977416992, "global_step": 31850, "epoch": 383} {"train_loss": -19.020706176757812, "global_step": 31851, "epoch": 383} {"train_loss": -19.070816040039062, "global_step": 31852, "epoch": 383} {"train_loss": -18.892444610595703, "global_step": 31853, "epoch": 383} {"train_loss": -19.02423667907715, "global_step": 31854, "epoch": 383} {"train_loss": -19.235788345336914, "global_step": 31855, "epoch": 383} {"train_loss": -19.151371002197266, "global_step": 31856, "epoch": 383} {"train_loss": -18.697431564331055, "global_step": 31857, "epoch": 383} {"train_loss": -18.585071563720703, "global_step": 31858, "epoch": 383} {"train_loss": -19.366544723510742, "global_step": 31859, "epoch": 383} {"train_loss": -19.0859432220459, "global_step": 31860, "epoch": 383} {"train_loss": -19.045766830444336, "global_step": 31861, "epoch": 383} {"train_loss": -18.901090621948242, "global_step": 31862, "epoch": 383} {"train_loss": -19.376861572265625, "global_step": 31863, "epoch": 383} {"train_loss": -19.12286949157715, "global_step": 31864, "epoch": 383} {"train_loss": -19.03254508972168, "global_step": 31865, "epoch": 383} {"train_loss": -18.893329620361328, "global_step": 31866, "epoch": 383} {"train_loss": -19.128280639648438, "global_step": 31867, "epoch": 383} {"train_loss": -19.209400177001953, "global_step": 31868, "epoch": 383} {"train_loss": -18.994726181030273, "global_step": 31869, "epoch": 383} {"train_loss": -18.907758712768555, "global_step": 31870, "epoch": 383} {"train_loss": -19.030248412166735, "global_step": 31871, "epoch": 383, "val_loss": 6034498.5} {"train_loss": -18.652524948120117, "global_step": 31872, "epoch": 384} {"train_loss": -18.849929809570312, "global_step": 31873, "epoch": 384} {"train_loss": -19.26266098022461, "global_step": 31874, "epoch": 384} {"train_loss": -19.00010108947754, "global_step": 31875, "epoch": 384} {"train_loss": -18.892911911010742, "global_step": 31876, "epoch": 384} {"train_loss": -18.856443405151367, "global_step": 31877, "epoch": 384} {"train_loss": -18.723722457885742, "global_step": 31878, "epoch": 384} {"train_loss": -18.89408302307129, "global_step": 31879, "epoch": 384} {"train_loss": -19.212182998657227, "global_step": 31880, "epoch": 384} {"train_loss": -19.079254150390625, "global_step": 31881, "epoch": 384} {"train_loss": -18.522735595703125, "global_step": 31882, "epoch": 384} {"train_loss": -19.15082359313965, "global_step": 31883, "epoch": 384} {"train_loss": -19.14600944519043, "global_step": 31884, "epoch": 384} {"train_loss": -19.167875289916992, "global_step": 31885, "epoch": 384} {"train_loss": -18.591848373413086, "global_step": 31886, "epoch": 384} {"train_loss": -18.711090087890625, "global_step": 31887, "epoch": 384} {"train_loss": -18.991872787475586, "global_step": 31888, "epoch": 384} {"train_loss": -19.06304931640625, "global_step": 31889, "epoch": 384} {"train_loss": -19.2504940032959, "global_step": 31890, "epoch": 384} {"train_loss": -18.908145904541016, "global_step": 31891, "epoch": 384} {"train_loss": -19.048425674438477, "global_step": 31892, "epoch": 384} {"train_loss": -18.776025772094727, "global_step": 31893, "epoch": 384} {"train_loss": -18.864883422851562, "global_step": 31894, "epoch": 384} {"train_loss": -19.02149772644043, "global_step": 31895, "epoch": 384} {"train_loss": -19.07604217529297, "global_step": 31896, "epoch": 384} {"train_loss": -18.85642433166504, "global_step": 31897, "epoch": 384} {"train_loss": -18.86821937561035, "global_step": 31898, "epoch": 384} {"train_loss": -19.066587448120117, "global_step": 31899, "epoch": 384} {"train_loss": -18.83353042602539, "global_step": 31900, "epoch": 384} {"train_loss": -19.235219955444336, "global_step": 31901, "epoch": 384} {"train_loss": -19.232685089111328, "global_step": 31902, "epoch": 384} {"train_loss": -19.383146286010742, "global_step": 31903, "epoch": 384} {"train_loss": -18.990449905395508, "global_step": 31904, "epoch": 384} {"train_loss": -19.019878387451172, "global_step": 31905, "epoch": 384} {"train_loss": -18.806730270385742, "global_step": 31906, "epoch": 384} {"train_loss": -19.09419059753418, "global_step": 31907, "epoch": 384} {"train_loss": -19.10982322692871, "global_step": 31908, "epoch": 384} {"train_loss": -18.95988655090332, "global_step": 31909, "epoch": 384} {"train_loss": -19.205848693847656, "global_step": 31910, "epoch": 384} {"train_loss": -19.261510848999023, "global_step": 31911, "epoch": 384} {"train_loss": -18.96221923828125, "global_step": 31912, "epoch": 384} {"train_loss": -18.924936294555664, "global_step": 31913, "epoch": 384} {"train_loss": -18.814777374267578, "global_step": 31914, "epoch": 384} {"train_loss": -19.23943519592285, "global_step": 31915, "epoch": 384} {"train_loss": -19.02166175842285, "global_step": 31916, "epoch": 384} {"train_loss": -19.205230712890625, "global_step": 31917, "epoch": 384} {"train_loss": -18.812255859375, "global_step": 31918, "epoch": 384} {"train_loss": -18.973011016845703, "global_step": 31919, "epoch": 384} {"train_loss": -19.3037052154541, "global_step": 31920, "epoch": 384} {"train_loss": -19.38275718688965, "global_step": 31921, "epoch": 384} {"train_loss": -19.1870174407959, "global_step": 31922, "epoch": 384} {"train_loss": -19.053136825561523, "global_step": 31923, "epoch": 384} {"train_loss": -18.79616355895996, "global_step": 31924, "epoch": 384} {"train_loss": -18.85037612915039, "global_step": 31925, "epoch": 384} {"train_loss": -18.959243774414062, "global_step": 31926, "epoch": 384} {"train_loss": -19.308521270751953, "global_step": 31927, "epoch": 384} {"train_loss": -19.1866512298584, "global_step": 31928, "epoch": 384} {"train_loss": -19.08831214904785, "global_step": 31929, "epoch": 384} {"train_loss": -19.140430450439453, "global_step": 31930, "epoch": 384} {"train_loss": -18.982486724853516, "global_step": 31931, "epoch": 384} {"train_loss": -19.157669067382812, "global_step": 31932, "epoch": 384} {"train_loss": -18.9810733795166, "global_step": 31933, "epoch": 384} {"train_loss": -19.15000343322754, "global_step": 31934, "epoch": 384} {"train_loss": -18.98055076599121, "global_step": 31935, "epoch": 384} {"train_loss": -19.170927047729492, "global_step": 31936, "epoch": 384} {"train_loss": -18.83060073852539, "global_step": 31937, "epoch": 384} {"train_loss": -18.949384689331055, "global_step": 31938, "epoch": 384} {"train_loss": -19.072147369384766, "global_step": 31939, "epoch": 384} {"train_loss": -18.96539306640625, "global_step": 31940, "epoch": 384} {"train_loss": -18.712085723876953, "global_step": 31941, "epoch": 384} {"train_loss": -18.87381362915039, "global_step": 31942, "epoch": 384} {"train_loss": -18.92039680480957, "global_step": 31943, "epoch": 384} {"train_loss": -19.34354591369629, "global_step": 31944, "epoch": 384} {"train_loss": -19.006086349487305, "global_step": 31945, "epoch": 384} {"train_loss": -19.180622100830078, "global_step": 31946, "epoch": 384} {"train_loss": -19.06229591369629, "global_step": 31947, "epoch": 384} {"train_loss": -19.080175399780273, "global_step": 31948, "epoch": 384} {"train_loss": -18.65719985961914, "global_step": 31949, "epoch": 384} {"train_loss": -19.15457534790039, "global_step": 31950, "epoch": 384} {"train_loss": -19.2135066986084, "global_step": 31951, "epoch": 384} {"train_loss": -18.94449806213379, "global_step": 31952, "epoch": 384} {"train_loss": -19.0341739654541, "global_step": 31953, "epoch": 384} {"train_loss": -19.027097564145745, "global_step": 31954, "epoch": 384, "val_loss": 6125563.0} {"train_loss": -18.633209228515625, "global_step": 31955, "epoch": 385} {"train_loss": -19.04156494140625, "global_step": 31956, "epoch": 385} {"train_loss": -19.26828956604004, "global_step": 31957, "epoch": 385} {"train_loss": -18.864734649658203, "global_step": 31958, "epoch": 385} {"train_loss": -18.743549346923828, "global_step": 31959, "epoch": 385} {"train_loss": -18.988346099853516, "global_step": 31960, "epoch": 385} {"train_loss": -19.1536865234375, "global_step": 31961, "epoch": 385} {"train_loss": -18.890289306640625, "global_step": 31962, "epoch": 385} {"train_loss": -18.792564392089844, "global_step": 31963, "epoch": 385} {"train_loss": -19.309146881103516, "global_step": 31964, "epoch": 385} {"train_loss": -18.721567153930664, "global_step": 31965, "epoch": 385} {"train_loss": -18.72828483581543, "global_step": 31966, "epoch": 385} {"train_loss": -19.282339096069336, "global_step": 31967, "epoch": 385} {"train_loss": -18.64344596862793, "global_step": 31968, "epoch": 385} {"train_loss": -18.961082458496094, "global_step": 31969, "epoch": 385} {"train_loss": -18.88350486755371, "global_step": 31970, "epoch": 385} {"train_loss": -19.191055297851562, "global_step": 31971, "epoch": 385} {"train_loss": -19.205175399780273, "global_step": 31972, "epoch": 385} {"train_loss": -18.882776260375977, "global_step": 31973, "epoch": 385} {"train_loss": -18.821269989013672, "global_step": 31974, "epoch": 385} {"train_loss": -19.05778694152832, "global_step": 31975, "epoch": 385} {"train_loss": -18.806116104125977, "global_step": 31976, "epoch": 385} {"train_loss": -18.623205184936523, "global_step": 31977, "epoch": 385} {"train_loss": -18.79188346862793, "global_step": 31978, "epoch": 385} {"train_loss": -19.113975524902344, "global_step": 31979, "epoch": 385} {"train_loss": -19.137805938720703, "global_step": 31980, "epoch": 385} {"train_loss": -19.066360473632812, "global_step": 31981, "epoch": 385} {"train_loss": -18.874971389770508, "global_step": 31982, "epoch": 385} {"train_loss": -18.7733154296875, "global_step": 31983, "epoch": 385} {"train_loss": -19.169103622436523, "global_step": 31984, "epoch": 385} {"train_loss": -19.107534408569336, "global_step": 31985, "epoch": 385} {"train_loss": -19.122344970703125, "global_step": 31986, "epoch": 385} {"train_loss": -19.36226463317871, "global_step": 31987, "epoch": 385} {"train_loss": -18.941892623901367, "global_step": 31988, "epoch": 385} {"train_loss": -19.173307418823242, "global_step": 31989, "epoch": 385} {"train_loss": -18.976852416992188, "global_step": 31990, "epoch": 385} {"train_loss": -18.891700744628906, "global_step": 31991, "epoch": 385} {"train_loss": -19.160402297973633, "global_step": 31992, "epoch": 385} {"train_loss": -19.358747482299805, "global_step": 31993, "epoch": 385} {"train_loss": -19.15973472595215, "global_step": 31994, "epoch": 385} {"train_loss": -19.184274673461914, "global_step": 31995, "epoch": 385} {"train_loss": -18.741775512695312, "global_step": 31996, "epoch": 385} {"train_loss": -19.1273136138916, "global_step": 31997, "epoch": 385} {"train_loss": -19.101505279541016, "global_step": 31998, "epoch": 385} {"train_loss": -18.892452239990234, "global_step": 31999, "epoch": 385} {"train_loss": -19.295673370361328, "global_step": 32000, "epoch": 385} {"train_loss": -18.656606674194336, "global_step": 32001, "epoch": 385} {"train_loss": -19.098735809326172, "global_step": 32002, "epoch": 385} {"train_loss": -19.029081344604492, "global_step": 32003, "epoch": 385} {"train_loss": -18.99672508239746, "global_step": 32004, "epoch": 385} {"train_loss": -19.132421493530273, "global_step": 32005, "epoch": 385} {"train_loss": -19.0707950592041, "global_step": 32006, "epoch": 385} {"train_loss": -18.94441032409668, "global_step": 32007, "epoch": 385} {"train_loss": -19.105789184570312, "global_step": 32008, "epoch": 385} {"train_loss": -19.04123306274414, "global_step": 32009, "epoch": 385} {"train_loss": -19.3426456451416, "global_step": 32010, "epoch": 385} {"train_loss": -18.791751861572266, "global_step": 32011, "epoch": 385} {"train_loss": -19.178598403930664, "global_step": 32012, "epoch": 385} {"train_loss": -18.870786666870117, "global_step": 32013, "epoch": 385} {"train_loss": -19.406118392944336, "global_step": 32014, "epoch": 385} {"train_loss": -18.901681900024414, "global_step": 32015, "epoch": 385} {"train_loss": -19.050718307495117, "global_step": 32016, "epoch": 385} {"train_loss": -19.099714279174805, "global_step": 32017, "epoch": 385} {"train_loss": -19.051645278930664, "global_step": 32018, "epoch": 385} {"train_loss": -19.199405670166016, "global_step": 32019, "epoch": 385} {"train_loss": -19.140539169311523, "global_step": 32020, "epoch": 385} {"train_loss": -18.95164680480957, "global_step": 32021, "epoch": 385} {"train_loss": -19.14476203918457, "global_step": 32022, "epoch": 385} {"train_loss": -19.263486862182617, "global_step": 32023, "epoch": 385} {"train_loss": -19.18166160583496, "global_step": 32024, "epoch": 385} {"train_loss": -19.232038497924805, "global_step": 32025, "epoch": 385} {"train_loss": -19.254140853881836, "global_step": 32026, "epoch": 385} {"train_loss": -19.27994155883789, "global_step": 32027, "epoch": 385} {"train_loss": -19.318952560424805, "global_step": 32028, "epoch": 385} {"train_loss": -19.320098876953125, "global_step": 32029, "epoch": 385} {"train_loss": -18.85023307800293, "global_step": 32030, "epoch": 385} {"train_loss": -18.832733154296875, "global_step": 32031, "epoch": 385} {"train_loss": -18.96075439453125, "global_step": 32032, "epoch": 385} {"train_loss": -19.227981567382812, "global_step": 32033, "epoch": 385} {"train_loss": -18.95288848876953, "global_step": 32034, "epoch": 385} {"train_loss": -18.86690330505371, "global_step": 32035, "epoch": 385} {"train_loss": -19.20062255859375, "global_step": 32036, "epoch": 385} {"train_loss": -19.03010582062135, "global_step": 32037, "epoch": 385, "val_loss": 6009516.0} {"train_loss": -18.69609260559082, "global_step": 32038, "epoch": 386} {"train_loss": -18.43582534790039, "global_step": 32039, "epoch": 386} {"train_loss": -19.05100440979004, "global_step": 32040, "epoch": 386} {"train_loss": -19.00179100036621, "global_step": 32041, "epoch": 386} {"train_loss": -19.084196090698242, "global_step": 32042, "epoch": 386} {"train_loss": -19.10357666015625, "global_step": 32043, "epoch": 386} {"train_loss": -19.099306106567383, "global_step": 32044, "epoch": 386} {"train_loss": -18.565067291259766, "global_step": 32045, "epoch": 386} {"train_loss": -18.88759422302246, "global_step": 32046, "epoch": 386} {"train_loss": -18.863245010375977, "global_step": 32047, "epoch": 386} {"train_loss": -18.575790405273438, "global_step": 32048, "epoch": 386} {"train_loss": -18.96058464050293, "global_step": 32049, "epoch": 386} {"train_loss": -19.219200134277344, "global_step": 32050, "epoch": 386} {"train_loss": -18.806615829467773, "global_step": 32051, "epoch": 386} {"train_loss": -18.965484619140625, "global_step": 32052, "epoch": 386} {"train_loss": -18.921838760375977, "global_step": 32053, "epoch": 386} {"train_loss": -18.890634536743164, "global_step": 32054, "epoch": 386} {"train_loss": -18.857242584228516, "global_step": 32055, "epoch": 386} {"train_loss": -18.853818893432617, "global_step": 32056, "epoch": 386} {"train_loss": -18.65432357788086, "global_step": 32057, "epoch": 386} {"train_loss": -18.986286163330078, "global_step": 32058, "epoch": 386} {"train_loss": -18.770151138305664, "global_step": 32059, "epoch": 386} {"train_loss": -18.887754440307617, "global_step": 32060, "epoch": 386} {"train_loss": -18.55744743347168, "global_step": 32061, "epoch": 386} {"train_loss": -18.711027145385742, "global_step": 32062, "epoch": 386} {"train_loss": -19.093852996826172, "global_step": 32063, "epoch": 386} {"train_loss": -18.956281661987305, "global_step": 32064, "epoch": 386} {"train_loss": -18.89711570739746, "global_step": 32065, "epoch": 386} {"train_loss": -18.827756881713867, "global_step": 32066, "epoch": 386} {"train_loss": -19.000051498413086, "global_step": 32067, "epoch": 386} {"train_loss": -18.89896011352539, "global_step": 32068, "epoch": 386} {"train_loss": -18.892322540283203, "global_step": 32069, "epoch": 386} {"train_loss": -19.219436645507812, "global_step": 32070, "epoch": 386} {"train_loss": -18.778512954711914, "global_step": 32071, "epoch": 386} {"train_loss": -19.0523738861084, "global_step": 32072, "epoch": 386} {"train_loss": -19.050737380981445, "global_step": 32073, "epoch": 386} {"train_loss": -19.313718795776367, "global_step": 32074, "epoch": 386} {"train_loss": -19.25870704650879, "global_step": 32075, "epoch": 386} {"train_loss": -19.49960708618164, "global_step": 32076, "epoch": 386} {"train_loss": -18.517423629760742, "global_step": 32077, "epoch": 386} {"train_loss": -18.870803833007812, "global_step": 32078, "epoch": 386} {"train_loss": -19.0651912689209, "global_step": 32079, "epoch": 386} {"train_loss": -19.127944946289062, "global_step": 32080, "epoch": 386} {"train_loss": -19.025358200073242, "global_step": 32081, "epoch": 386} {"train_loss": -19.458053588867188, "global_step": 32082, "epoch": 386} {"train_loss": -19.046125411987305, "global_step": 32083, "epoch": 386} {"train_loss": -19.126117706298828, "global_step": 32084, "epoch": 386} {"train_loss": -18.94858741760254, "global_step": 32085, "epoch": 386} {"train_loss": -18.974870681762695, "global_step": 32086, "epoch": 386} {"train_loss": -18.89361572265625, "global_step": 32087, "epoch": 386} {"train_loss": -19.119211196899414, "global_step": 32088, "epoch": 386} {"train_loss": -18.834033966064453, "global_step": 32089, "epoch": 386} {"train_loss": -19.18681526184082, "global_step": 32090, "epoch": 386} {"train_loss": -19.31258201599121, "global_step": 32091, "epoch": 386} {"train_loss": -19.083927154541016, "global_step": 32092, "epoch": 386} {"train_loss": -19.440881729125977, "global_step": 32093, "epoch": 386} {"train_loss": -18.84358024597168, "global_step": 32094, "epoch": 386} {"train_loss": -19.13579559326172, "global_step": 32095, "epoch": 386} {"train_loss": -18.68759536743164, "global_step": 32096, "epoch": 386} {"train_loss": -19.02602195739746, "global_step": 32097, "epoch": 386} {"train_loss": -19.057601928710938, "global_step": 32098, "epoch": 386} {"train_loss": -19.160686492919922, "global_step": 32099, "epoch": 386} {"train_loss": -19.169584274291992, "global_step": 32100, "epoch": 386} {"train_loss": -19.272464752197266, "global_step": 32101, "epoch": 386} {"train_loss": -18.820581436157227, "global_step": 32102, "epoch": 386} {"train_loss": -18.903766632080078, "global_step": 32103, "epoch": 386} {"train_loss": -18.84969139099121, "global_step": 32104, "epoch": 386} {"train_loss": -19.095975875854492, "global_step": 32105, "epoch": 386} {"train_loss": -18.96687126159668, "global_step": 32106, "epoch": 386} {"train_loss": -19.392160415649414, "global_step": 32107, "epoch": 386} {"train_loss": -19.088109970092773, "global_step": 32108, "epoch": 386} {"train_loss": -19.392194747924805, "global_step": 32109, "epoch": 386} {"train_loss": -19.129789352416992, "global_step": 32110, "epoch": 386} {"train_loss": -18.876068115234375, "global_step": 32111, "epoch": 386} {"train_loss": -19.45287322998047, "global_step": 32112, "epoch": 386} {"train_loss": -18.772153854370117, "global_step": 32113, "epoch": 386} {"train_loss": -19.214765548706055, "global_step": 32114, "epoch": 386} {"train_loss": -19.210418701171875, "global_step": 32115, "epoch": 386} {"train_loss": -18.952138900756836, "global_step": 32116, "epoch": 386} {"train_loss": -19.172536849975586, "global_step": 32117, "epoch": 386} {"train_loss": -19.112730026245117, "global_step": 32118, "epoch": 386} {"train_loss": -19.216745376586914, "global_step": 32119, "epoch": 386} {"train_loss": -19.00780528424734, "global_step": 32120, "epoch": 386, "val_loss": 6177068.0} {"train_loss": -18.55415153503418, "global_step": 32121, "epoch": 387} {"train_loss": -19.128517150878906, "global_step": 32122, "epoch": 387} {"train_loss": -18.812149047851562, "global_step": 32123, "epoch": 387} {"train_loss": -19.046300888061523, "global_step": 32124, "epoch": 387} {"train_loss": -18.479001998901367, "global_step": 32125, "epoch": 387} {"train_loss": -18.748289108276367, "global_step": 32126, "epoch": 387} {"train_loss": -18.687179565429688, "global_step": 32127, "epoch": 387} {"train_loss": -18.856054306030273, "global_step": 32128, "epoch": 387} {"train_loss": -18.87532615661621, "global_step": 32129, "epoch": 387} {"train_loss": -18.517141342163086, "global_step": 32130, "epoch": 387} {"train_loss": -18.948429107666016, "global_step": 32131, "epoch": 387} {"train_loss": -18.778629302978516, "global_step": 32132, "epoch": 387} {"train_loss": -19.02383804321289, "global_step": 32133, "epoch": 387} {"train_loss": -19.010801315307617, "global_step": 32134, "epoch": 387} {"train_loss": -18.90115737915039, "global_step": 32135, "epoch": 387} {"train_loss": -18.983083724975586, "global_step": 32136, "epoch": 387} {"train_loss": -19.140148162841797, "global_step": 32137, "epoch": 387} {"train_loss": -19.031478881835938, "global_step": 32138, "epoch": 387} {"train_loss": -18.70220375061035, "global_step": 32139, "epoch": 387} {"train_loss": -18.9228515625, "global_step": 32140, "epoch": 387} {"train_loss": -19.204410552978516, "global_step": 32141, "epoch": 387} {"train_loss": -19.294788360595703, "global_step": 32142, "epoch": 387} {"train_loss": -19.236846923828125, "global_step": 32143, "epoch": 387} {"train_loss": -18.773681640625, "global_step": 32144, "epoch": 387} {"train_loss": -19.16849708557129, "global_step": 32145, "epoch": 387} {"train_loss": -18.900360107421875, "global_step": 32146, "epoch": 387} {"train_loss": -18.96925163269043, "global_step": 32147, "epoch": 387} {"train_loss": -18.784330368041992, "global_step": 32148, "epoch": 387} {"train_loss": -19.16414451599121, "global_step": 32149, "epoch": 387} {"train_loss": -19.341257095336914, "global_step": 32150, "epoch": 387} {"train_loss": -19.047025680541992, "global_step": 32151, "epoch": 387} {"train_loss": -18.803224563598633, "global_step": 32152, "epoch": 387} {"train_loss": -18.7790470123291, "global_step": 32153, "epoch": 387} {"train_loss": -18.93512535095215, "global_step": 32154, "epoch": 387} {"train_loss": -18.80482292175293, "global_step": 32155, "epoch": 387} {"train_loss": -19.079151153564453, "global_step": 32156, "epoch": 387} {"train_loss": -19.031736373901367, "global_step": 32157, "epoch": 387} {"train_loss": -18.64259147644043, "global_step": 32158, "epoch": 387} {"train_loss": -19.117334365844727, "global_step": 32159, "epoch": 387} {"train_loss": -19.42039680480957, "global_step": 32160, "epoch": 387} {"train_loss": -19.247724533081055, "global_step": 32161, "epoch": 387} {"train_loss": -19.00739097595215, "global_step": 32162, "epoch": 387} {"train_loss": -18.834028244018555, "global_step": 32163, "epoch": 387} {"train_loss": -19.6082706451416, "global_step": 32164, "epoch": 387} {"train_loss": -18.961301803588867, "global_step": 32165, "epoch": 387} {"train_loss": -19.04132652282715, "global_step": 32166, "epoch": 387} {"train_loss": -19.1009464263916, "global_step": 32167, "epoch": 387} {"train_loss": -19.049057006835938, "global_step": 32168, "epoch": 387} {"train_loss": -19.16387939453125, "global_step": 32169, "epoch": 387} {"train_loss": -19.157140731811523, "global_step": 32170, "epoch": 387} {"train_loss": -18.886600494384766, "global_step": 32171, "epoch": 387} {"train_loss": -19.610328674316406, "global_step": 32172, "epoch": 387} {"train_loss": -19.191118240356445, "global_step": 32173, "epoch": 387} {"train_loss": -19.26626205444336, "global_step": 32174, "epoch": 387} {"train_loss": -19.040891647338867, "global_step": 32175, "epoch": 387} {"train_loss": -18.92354965209961, "global_step": 32176, "epoch": 387} {"train_loss": -18.96634864807129, "global_step": 32177, "epoch": 387} {"train_loss": -19.082096099853516, "global_step": 32178, "epoch": 387} {"train_loss": -19.464208602905273, "global_step": 32179, "epoch": 387} {"train_loss": -19.11263084411621, "global_step": 32180, "epoch": 387} {"train_loss": -19.2393798828125, "global_step": 32181, "epoch": 387} {"train_loss": -19.076187133789062, "global_step": 32182, "epoch": 387} {"train_loss": -18.880319595336914, "global_step": 32183, "epoch": 387} {"train_loss": -19.046070098876953, "global_step": 32184, "epoch": 387} {"train_loss": -18.745105743408203, "global_step": 32185, "epoch": 387} {"train_loss": -19.167661666870117, "global_step": 32186, "epoch": 387} {"train_loss": -18.919965744018555, "global_step": 32187, "epoch": 387} {"train_loss": -19.19753074645996, "global_step": 32188, "epoch": 387} {"train_loss": -19.191871643066406, "global_step": 32189, "epoch": 387} {"train_loss": -18.726993560791016, "global_step": 32190, "epoch": 387} {"train_loss": -18.896486282348633, "global_step": 32191, "epoch": 387} {"train_loss": -19.48575782775879, "global_step": 32192, "epoch": 387} {"train_loss": -19.114282608032227, "global_step": 32193, "epoch": 387} {"train_loss": -18.999731063842773, "global_step": 32194, "epoch": 387} {"train_loss": -19.200511932373047, "global_step": 32195, "epoch": 387} {"train_loss": -19.383033752441406, "global_step": 32196, "epoch": 387} {"train_loss": -19.19914436340332, "global_step": 32197, "epoch": 387} {"train_loss": -19.220340728759766, "global_step": 32198, "epoch": 387} {"train_loss": -19.616802215576172, "global_step": 32199, "epoch": 387} {"train_loss": -19.111495971679688, "global_step": 32200, "epoch": 387} {"train_loss": -18.967634201049805, "global_step": 32201, "epoch": 387} {"train_loss": -19.43951988220215, "global_step": 32202, "epoch": 387} {"train_loss": -19.01100174777479, "global_step": 32203, "epoch": 387, "val_loss": 6085395.5} {"train_loss": -18.545684814453125, "global_step": 32204, "epoch": 388} {"train_loss": -18.967138290405273, "global_step": 32205, "epoch": 388} {"train_loss": -18.777629852294922, "global_step": 32206, "epoch": 388} {"train_loss": -18.6163387298584, "global_step": 32207, "epoch": 388} {"train_loss": -18.92292594909668, "global_step": 32208, "epoch": 388} {"train_loss": -18.949440002441406, "global_step": 32209, "epoch": 388} {"train_loss": -19.019712448120117, "global_step": 32210, "epoch": 388} {"train_loss": -19.039682388305664, "global_step": 32211, "epoch": 388} {"train_loss": -18.608016967773438, "global_step": 32212, "epoch": 388} {"train_loss": -18.953397750854492, "global_step": 32213, "epoch": 388} {"train_loss": -18.97184181213379, "global_step": 32214, "epoch": 388} {"train_loss": -18.77330207824707, "global_step": 32215, "epoch": 388} {"train_loss": -19.048728942871094, "global_step": 32216, "epoch": 388} {"train_loss": -19.160499572753906, "global_step": 32217, "epoch": 388} {"train_loss": -19.206239700317383, "global_step": 32218, "epoch": 388} {"train_loss": -18.832763671875, "global_step": 32219, "epoch": 388} {"train_loss": -18.818159103393555, "global_step": 32220, "epoch": 388} {"train_loss": -19.301593780517578, "global_step": 32221, "epoch": 388} {"train_loss": -19.01828956604004, "global_step": 32222, "epoch": 388} {"train_loss": -18.697134017944336, "global_step": 32223, "epoch": 388} {"train_loss": -19.361202239990234, "global_step": 32224, "epoch": 388} {"train_loss": -19.097713470458984, "global_step": 32225, "epoch": 388} {"train_loss": -19.03911781311035, "global_step": 32226, "epoch": 388} {"train_loss": -19.0253963470459, "global_step": 32227, "epoch": 388} {"train_loss": -19.208984375, "global_step": 32228, "epoch": 388} {"train_loss": -19.2584285736084, "global_step": 32229, "epoch": 388} {"train_loss": -18.901735305786133, "global_step": 32230, "epoch": 388} {"train_loss": -19.080062866210938, "global_step": 32231, "epoch": 388} {"train_loss": -19.03631591796875, "global_step": 32232, "epoch": 388} {"train_loss": -18.89668846130371, "global_step": 32233, "epoch": 388} {"train_loss": -18.99153709411621, "global_step": 32234, "epoch": 388} {"train_loss": -18.90020751953125, "global_step": 32235, "epoch": 388} {"train_loss": -18.987586975097656, "global_step": 32236, "epoch": 388} {"train_loss": -18.809669494628906, "global_step": 32237, "epoch": 388} {"train_loss": -18.970048904418945, "global_step": 32238, "epoch": 388} {"train_loss": -19.02151870727539, "global_step": 32239, "epoch": 388} {"train_loss": -19.164501190185547, "global_step": 32240, "epoch": 388} {"train_loss": -18.8128662109375, "global_step": 32241, "epoch": 388} {"train_loss": -18.79701805114746, "global_step": 32242, "epoch": 388} {"train_loss": -19.465261459350586, "global_step": 32243, "epoch": 388} {"train_loss": -18.961750030517578, "global_step": 32244, "epoch": 388} {"train_loss": -19.00859832763672, "global_step": 32245, "epoch": 388} {"train_loss": -18.805591583251953, "global_step": 32246, "epoch": 388} {"train_loss": -19.314807891845703, "global_step": 32247, "epoch": 388} {"train_loss": -19.019792556762695, "global_step": 32248, "epoch": 388} {"train_loss": -18.71610450744629, "global_step": 32249, "epoch": 388} {"train_loss": -18.661222457885742, "global_step": 32250, "epoch": 388} {"train_loss": -19.196990966796875, "global_step": 32251, "epoch": 388} {"train_loss": -19.4412784576416, "global_step": 32252, "epoch": 388} {"train_loss": -19.560163497924805, "global_step": 32253, "epoch": 388} {"train_loss": -19.256805419921875, "global_step": 32254, "epoch": 388} {"train_loss": -18.788970947265625, "global_step": 32255, "epoch": 388} {"train_loss": -19.034826278686523, "global_step": 32256, "epoch": 388} {"train_loss": -19.099042892456055, "global_step": 32257, "epoch": 388} {"train_loss": -19.04465675354004, "global_step": 32258, "epoch": 388} {"train_loss": -19.250995635986328, "global_step": 32259, "epoch": 388} {"train_loss": -18.998376846313477, "global_step": 32260, "epoch": 388} {"train_loss": -19.023096084594727, "global_step": 32261, "epoch": 388} {"train_loss": -19.037704467773438, "global_step": 32262, "epoch": 388} {"train_loss": -19.251571655273438, "global_step": 32263, "epoch": 388} {"train_loss": -19.165983200073242, "global_step": 32264, "epoch": 388} {"train_loss": -19.00282859802246, "global_step": 32265, "epoch": 388} {"train_loss": -19.208059310913086, "global_step": 32266, "epoch": 388} {"train_loss": -18.467281341552734, "global_step": 32267, "epoch": 388} {"train_loss": -18.98154067993164, "global_step": 32268, "epoch": 388} {"train_loss": -19.287694931030273, "global_step": 32269, "epoch": 388} {"train_loss": -19.37769317626953, "global_step": 32270, "epoch": 388} {"train_loss": -19.158084869384766, "global_step": 32271, "epoch": 388} {"train_loss": -18.91650390625, "global_step": 32272, "epoch": 388} {"train_loss": -19.170196533203125, "global_step": 32273, "epoch": 388} {"train_loss": -19.111886978149414, "global_step": 32274, "epoch": 388} {"train_loss": -19.441272735595703, "global_step": 32275, "epoch": 388} {"train_loss": -19.52622413635254, "global_step": 32276, "epoch": 388} {"train_loss": -19.161787033081055, "global_step": 32277, "epoch": 388} {"train_loss": -19.0878849029541, "global_step": 32278, "epoch": 388} {"train_loss": -19.099781036376953, "global_step": 32279, "epoch": 388} {"train_loss": -18.954906463623047, "global_step": 32280, "epoch": 388} {"train_loss": -19.09477424621582, "global_step": 32281, "epoch": 388} {"train_loss": -18.937997817993164, "global_step": 32282, "epoch": 388} {"train_loss": -18.978307723999023, "global_step": 32283, "epoch": 388} {"train_loss": -19.161142349243164, "global_step": 32284, "epoch": 388} {"train_loss": -19.085586547851562, "global_step": 32285, "epoch": 388} {"train_loss": -19.045277859791216, "global_step": 32286, "epoch": 388, "val_loss": 6044896.0} {"train_loss": -18.549318313598633, "global_step": 32287, "epoch": 389} {"train_loss": -18.907400131225586, "global_step": 32288, "epoch": 389} {"train_loss": -18.52388572692871, "global_step": 32289, "epoch": 389} {"train_loss": -19.019376754760742, "global_step": 32290, "epoch": 389} {"train_loss": -18.493886947631836, "global_step": 32291, "epoch": 389} {"train_loss": -18.466707229614258, "global_step": 32292, "epoch": 389} {"train_loss": -18.777677536010742, "global_step": 32293, "epoch": 389} {"train_loss": -18.664169311523438, "global_step": 32294, "epoch": 389} {"train_loss": -18.988759994506836, "global_step": 32295, "epoch": 389} {"train_loss": -18.9370059967041, "global_step": 32296, "epoch": 389} {"train_loss": -18.745092391967773, "global_step": 32297, "epoch": 389} {"train_loss": -18.463422775268555, "global_step": 32298, "epoch": 389} {"train_loss": -18.659198760986328, "global_step": 32299, "epoch": 389} {"train_loss": -19.21864891052246, "global_step": 32300, "epoch": 389} {"train_loss": -19.34354019165039, "global_step": 32301, "epoch": 389} {"train_loss": -19.065916061401367, "global_step": 32302, "epoch": 389} {"train_loss": -19.046812057495117, "global_step": 32303, "epoch": 389} {"train_loss": -18.50164794921875, "global_step": 32304, "epoch": 389} {"train_loss": -18.8040714263916, "global_step": 32305, "epoch": 389} {"train_loss": -19.20456886291504, "global_step": 32306, "epoch": 389} {"train_loss": -18.786344528198242, "global_step": 32307, "epoch": 389} {"train_loss": -19.15310287475586, "global_step": 32308, "epoch": 389} {"train_loss": -18.918424606323242, "global_step": 32309, "epoch": 389} {"train_loss": -19.330121994018555, "global_step": 32310, "epoch": 389} {"train_loss": -19.243480682373047, "global_step": 32311, "epoch": 389} {"train_loss": -19.029190063476562, "global_step": 32312, "epoch": 389} {"train_loss": -19.011707305908203, "global_step": 32313, "epoch": 389} {"train_loss": -19.256690979003906, "global_step": 32314, "epoch": 389} {"train_loss": -18.822904586791992, "global_step": 32315, "epoch": 389} {"train_loss": -18.792062759399414, "global_step": 32316, "epoch": 389} {"train_loss": -19.129234313964844, "global_step": 32317, "epoch": 389} {"train_loss": -19.1384220123291, "global_step": 32318, "epoch": 389} {"train_loss": -18.88785743713379, "global_step": 32319, "epoch": 389} {"train_loss": -19.432584762573242, "global_step": 32320, "epoch": 389} {"train_loss": -19.248929977416992, "global_step": 32321, "epoch": 389} {"train_loss": -19.189029693603516, "global_step": 32322, "epoch": 389} {"train_loss": -19.174299240112305, "global_step": 32323, "epoch": 389} {"train_loss": -19.057540893554688, "global_step": 32324, "epoch": 389} {"train_loss": -19.343360900878906, "global_step": 32325, "epoch": 389} {"train_loss": -19.25712013244629, "global_step": 32326, "epoch": 389} {"train_loss": -19.311811447143555, "global_step": 32327, "epoch": 389} {"train_loss": -19.097248077392578, "global_step": 32328, "epoch": 389} {"train_loss": -18.98239517211914, "global_step": 32329, "epoch": 389} {"train_loss": -18.928115844726562, "global_step": 32330, "epoch": 389} {"train_loss": -18.795278549194336, "global_step": 32331, "epoch": 389} {"train_loss": -19.497671127319336, "global_step": 32332, "epoch": 389} {"train_loss": -19.32505989074707, "global_step": 32333, "epoch": 389} {"train_loss": -19.026920318603516, "global_step": 32334, "epoch": 389} {"train_loss": -19.03983497619629, "global_step": 32335, "epoch": 389} {"train_loss": -19.13446617126465, "global_step": 32336, "epoch": 389} {"train_loss": -18.896005630493164, "global_step": 32337, "epoch": 389} {"train_loss": -19.1047420501709, "global_step": 32338, "epoch": 389} {"train_loss": -18.748456954956055, "global_step": 32339, "epoch": 389} {"train_loss": -19.354185104370117, "global_step": 32340, "epoch": 389} {"train_loss": -18.95831871032715, "global_step": 32341, "epoch": 389} {"train_loss": -19.419126510620117, "global_step": 32342, "epoch": 389} {"train_loss": -18.84346580505371, "global_step": 32343, "epoch": 389} {"train_loss": -18.78058624267578, "global_step": 32344, "epoch": 389} {"train_loss": -18.56525230407715, "global_step": 32345, "epoch": 389} {"train_loss": -19.158916473388672, "global_step": 32346, "epoch": 389} {"train_loss": -19.04715919494629, "global_step": 32347, "epoch": 389} {"train_loss": -18.77716636657715, "global_step": 32348, "epoch": 389} {"train_loss": -18.742177963256836, "global_step": 32349, "epoch": 389} {"train_loss": -18.940603256225586, "global_step": 32350, "epoch": 389} {"train_loss": -19.13081932067871, "global_step": 32351, "epoch": 389} {"train_loss": -19.331850051879883, "global_step": 32352, "epoch": 389} {"train_loss": -19.05071449279785, "global_step": 32353, "epoch": 389} {"train_loss": -19.416887283325195, "global_step": 32354, "epoch": 389} {"train_loss": -18.680585861206055, "global_step": 32355, "epoch": 389} {"train_loss": -19.38310432434082, "global_step": 32356, "epoch": 389} {"train_loss": -19.02107810974121, "global_step": 32357, "epoch": 389} {"train_loss": -19.443559646606445, "global_step": 32358, "epoch": 389} {"train_loss": -19.29255485534668, "global_step": 32359, "epoch": 389} {"train_loss": -19.179004669189453, "global_step": 32360, "epoch": 389} {"train_loss": -18.981809616088867, "global_step": 32361, "epoch": 389} {"train_loss": -19.27152442932129, "global_step": 32362, "epoch": 389} {"train_loss": -18.97715187072754, "global_step": 32363, "epoch": 389} {"train_loss": -19.063751220703125, "global_step": 32364, "epoch": 389} {"train_loss": -19.527503967285156, "global_step": 32365, "epoch": 389} {"train_loss": -19.207632064819336, "global_step": 32366, "epoch": 389} {"train_loss": -18.79410171508789, "global_step": 32367, "epoch": 389} {"train_loss": -19.084733963012695, "global_step": 32368, "epoch": 389} {"train_loss": -19.02674737034074, "global_step": 32369, "epoch": 389, "val_loss": 5949817.5} {"train_loss": -18.759140014648438, "global_step": 32370, "epoch": 390} {"train_loss": -19.155855178833008, "global_step": 32371, "epoch": 390} {"train_loss": -19.102567672729492, "global_step": 32372, "epoch": 390} {"train_loss": -18.657852172851562, "global_step": 32373, "epoch": 390} {"train_loss": -18.96537208557129, "global_step": 32374, "epoch": 390} {"train_loss": -18.887786865234375, "global_step": 32375, "epoch": 390} {"train_loss": -18.9986515045166, "global_step": 32376, "epoch": 390} {"train_loss": -19.13899040222168, "global_step": 32377, "epoch": 390} {"train_loss": -18.742904663085938, "global_step": 32378, "epoch": 390} {"train_loss": -18.964168548583984, "global_step": 32379, "epoch": 390} {"train_loss": -18.908849716186523, "global_step": 32380, "epoch": 390} {"train_loss": -19.320966720581055, "global_step": 32381, "epoch": 390} {"train_loss": -19.114566802978516, "global_step": 32382, "epoch": 390} {"train_loss": -18.80916976928711, "global_step": 32383, "epoch": 390} {"train_loss": -19.055395126342773, "global_step": 32384, "epoch": 390} {"train_loss": -18.85568618774414, "global_step": 32385, "epoch": 390} {"train_loss": -18.934350967407227, "global_step": 32386, "epoch": 390} {"train_loss": -18.9896297454834, "global_step": 32387, "epoch": 390} {"train_loss": -19.112340927124023, "global_step": 32388, "epoch": 390} {"train_loss": -18.95436668395996, "global_step": 32389, "epoch": 390} {"train_loss": -18.9631404876709, "global_step": 32390, "epoch": 390} {"train_loss": -19.26566505432129, "global_step": 32391, "epoch": 390} {"train_loss": -19.263427734375, "global_step": 32392, "epoch": 390} {"train_loss": -18.9095401763916, "global_step": 32393, "epoch": 390} {"train_loss": -19.127708435058594, "global_step": 32394, "epoch": 390} {"train_loss": -19.48334312438965, "global_step": 32395, "epoch": 390} {"train_loss": -18.949758529663086, "global_step": 32396, "epoch": 390} {"train_loss": -19.226123809814453, "global_step": 32397, "epoch": 390} {"train_loss": -19.05474853515625, "global_step": 32398, "epoch": 390} {"train_loss": -19.112348556518555, "global_step": 32399, "epoch": 390} {"train_loss": -19.105239868164062, "global_step": 32400, "epoch": 390} {"train_loss": -19.236099243164062, "global_step": 32401, "epoch": 390} {"train_loss": -18.743900299072266, "global_step": 32402, "epoch": 390} {"train_loss": -19.406152725219727, "global_step": 32403, "epoch": 390} {"train_loss": -19.24354362487793, "global_step": 32404, "epoch": 390} {"train_loss": -19.234697341918945, "global_step": 32405, "epoch": 390} {"train_loss": -19.273344039916992, "global_step": 32406, "epoch": 390} {"train_loss": -18.90360450744629, "global_step": 32407, "epoch": 390} {"train_loss": -19.218591690063477, "global_step": 32408, "epoch": 390} {"train_loss": -19.114355087280273, "global_step": 32409, "epoch": 390} {"train_loss": -18.94765853881836, "global_step": 32410, "epoch": 390} {"train_loss": -19.026674270629883, "global_step": 32411, "epoch": 390} {"train_loss": -19.256200790405273, "global_step": 32412, "epoch": 390} {"train_loss": -19.345430374145508, "global_step": 32413, "epoch": 390} {"train_loss": -19.004871368408203, "global_step": 32414, "epoch": 390} {"train_loss": -18.9505672454834, "global_step": 32415, "epoch": 390} {"train_loss": -19.299043655395508, "global_step": 32416, "epoch": 390} {"train_loss": -19.30474281311035, "global_step": 32417, "epoch": 390} {"train_loss": -19.072050094604492, "global_step": 32418, "epoch": 390} {"train_loss": -18.775949478149414, "global_step": 32419, "epoch": 390} {"train_loss": -18.92926025390625, "global_step": 32420, "epoch": 390} {"train_loss": -19.15200424194336, "global_step": 32421, "epoch": 390} {"train_loss": -18.893163681030273, "global_step": 32422, "epoch": 390} {"train_loss": -18.715879440307617, "global_step": 32423, "epoch": 390} {"train_loss": -18.983957290649414, "global_step": 32424, "epoch": 390} {"train_loss": -19.078943252563477, "global_step": 32425, "epoch": 390} {"train_loss": -18.580366134643555, "global_step": 32426, "epoch": 390} {"train_loss": -18.81591033935547, "global_step": 32427, "epoch": 390} {"train_loss": -18.950693130493164, "global_step": 32428, "epoch": 390} {"train_loss": -18.969175338745117, "global_step": 32429, "epoch": 390} {"train_loss": -18.967926025390625, "global_step": 32430, "epoch": 390} {"train_loss": -19.051992416381836, "global_step": 32431, "epoch": 390} {"train_loss": -19.060461044311523, "global_step": 32432, "epoch": 390} {"train_loss": -18.833662033081055, "global_step": 32433, "epoch": 390} {"train_loss": -19.02433204650879, "global_step": 32434, "epoch": 390} {"train_loss": -19.25379753112793, "global_step": 32435, "epoch": 390} {"train_loss": -19.273212432861328, "global_step": 32436, "epoch": 390} {"train_loss": -18.805404663085938, "global_step": 32437, "epoch": 390} {"train_loss": -18.814977645874023, "global_step": 32438, "epoch": 390} {"train_loss": -19.400632858276367, "global_step": 32439, "epoch": 390} {"train_loss": -18.821273803710938, "global_step": 32440, "epoch": 390} {"train_loss": -19.012083053588867, "global_step": 32441, "epoch": 390} {"train_loss": -19.29244613647461, "global_step": 32442, "epoch": 390} {"train_loss": -18.94829559326172, "global_step": 32443, "epoch": 390} {"train_loss": -19.254446029663086, "global_step": 32444, "epoch": 390} {"train_loss": -19.495073318481445, "global_step": 32445, "epoch": 390} {"train_loss": -19.035673141479492, "global_step": 32446, "epoch": 390} {"train_loss": -19.031553268432617, "global_step": 32447, "epoch": 390} {"train_loss": -18.7403621673584, "global_step": 32448, "epoch": 390} {"train_loss": -19.39316749572754, "global_step": 32449, "epoch": 390} {"train_loss": -19.22383689880371, "global_step": 32450, "epoch": 390} {"train_loss": -19.286596298217773, "global_step": 32451, "epoch": 390} {"train_loss": -19.054400869162684, "global_step": 32452, "epoch": 390, "val_loss": 5963262.5} {"train_loss": -19.01503562927246, "global_step": 32453, "epoch": 391} {"train_loss": -19.01813316345215, "global_step": 32454, "epoch": 391} {"train_loss": -18.954364776611328, "global_step": 32455, "epoch": 391} {"train_loss": -18.978229522705078, "global_step": 32456, "epoch": 391} {"train_loss": -18.582963943481445, "global_step": 32457, "epoch": 391} {"train_loss": -18.913036346435547, "global_step": 32458, "epoch": 391} {"train_loss": -19.223432540893555, "global_step": 32459, "epoch": 391} {"train_loss": -18.76421546936035, "global_step": 32460, "epoch": 391} {"train_loss": -19.0295352935791, "global_step": 32461, "epoch": 391} {"train_loss": -18.72911262512207, "global_step": 32462, "epoch": 391} {"train_loss": -19.31853675842285, "global_step": 32463, "epoch": 391} {"train_loss": -18.87174415588379, "global_step": 32464, "epoch": 391} {"train_loss": -19.526512145996094, "global_step": 32465, "epoch": 391} {"train_loss": -18.873327255249023, "global_step": 32466, "epoch": 391} {"train_loss": -18.81708335876465, "global_step": 32467, "epoch": 391} {"train_loss": -19.382617950439453, "global_step": 32468, "epoch": 391} {"train_loss": -18.890737533569336, "global_step": 32469, "epoch": 391} {"train_loss": -19.0800724029541, "global_step": 32470, "epoch": 391} {"train_loss": -19.435319900512695, "global_step": 32471, "epoch": 391} {"train_loss": -18.830503463745117, "global_step": 32472, "epoch": 391} {"train_loss": -18.95653533935547, "global_step": 32473, "epoch": 391} {"train_loss": -19.0245418548584, "global_step": 32474, "epoch": 391} {"train_loss": -19.166501998901367, "global_step": 32475, "epoch": 391} {"train_loss": -19.100360870361328, "global_step": 32476, "epoch": 391} {"train_loss": -19.094470977783203, "global_step": 32477, "epoch": 391} {"train_loss": -19.314069747924805, "global_step": 32478, "epoch": 391} {"train_loss": -18.807558059692383, "global_step": 32479, "epoch": 391} {"train_loss": -18.910816192626953, "global_step": 32480, "epoch": 391} {"train_loss": -19.405973434448242, "global_step": 32481, "epoch": 391} {"train_loss": -19.23023223876953, "global_step": 32482, "epoch": 391} {"train_loss": -19.136137008666992, "global_step": 32483, "epoch": 391} {"train_loss": -19.249073028564453, "global_step": 32484, "epoch": 391} {"train_loss": -19.168140411376953, "global_step": 32485, "epoch": 391} {"train_loss": -19.261917114257812, "global_step": 32486, "epoch": 391} {"train_loss": -19.162397384643555, "global_step": 32487, "epoch": 391} {"train_loss": -18.930776596069336, "global_step": 32488, "epoch": 391} {"train_loss": -19.128999710083008, "global_step": 32489, "epoch": 391} {"train_loss": -19.056068420410156, "global_step": 32490, "epoch": 391} {"train_loss": -18.791677474975586, "global_step": 32491, "epoch": 391} {"train_loss": -18.634992599487305, "global_step": 32492, "epoch": 391} {"train_loss": -18.86365509033203, "global_step": 32493, "epoch": 391} {"train_loss": -19.125551223754883, "global_step": 32494, "epoch": 391} {"train_loss": -19.2517032623291, "global_step": 32495, "epoch": 391} {"train_loss": -19.122501373291016, "global_step": 32496, "epoch": 391} {"train_loss": -19.165096282958984, "global_step": 32497, "epoch": 391} {"train_loss": -19.22747802734375, "global_step": 32498, "epoch": 391} {"train_loss": -19.023174285888672, "global_step": 32499, "epoch": 391} {"train_loss": -18.697418212890625, "global_step": 32500, "epoch": 391} {"train_loss": -18.891624450683594, "global_step": 32501, "epoch": 391} {"train_loss": -19.056962966918945, "global_step": 32502, "epoch": 391} {"train_loss": -19.146209716796875, "global_step": 32503, "epoch": 391} {"train_loss": -19.563913345336914, "global_step": 32504, "epoch": 391} {"train_loss": -19.149789810180664, "global_step": 32505, "epoch": 391} {"train_loss": -19.24717140197754, "global_step": 32506, "epoch": 391} {"train_loss": -18.929718017578125, "global_step": 32507, "epoch": 391} {"train_loss": -18.928699493408203, "global_step": 32508, "epoch": 391} {"train_loss": -19.447532653808594, "global_step": 32509, "epoch": 391} {"train_loss": -19.25815200805664, "global_step": 32510, "epoch": 391} {"train_loss": -19.24078369140625, "global_step": 32511, "epoch": 391} {"train_loss": -18.868343353271484, "global_step": 32512, "epoch": 391} {"train_loss": -18.742116928100586, "global_step": 32513, "epoch": 391} {"train_loss": -18.976499557495117, "global_step": 32514, "epoch": 391} {"train_loss": -18.8807315826416, "global_step": 32515, "epoch": 391} {"train_loss": -19.029996871948242, "global_step": 32516, "epoch": 391} {"train_loss": -19.21497344970703, "global_step": 32517, "epoch": 391} {"train_loss": -19.050405502319336, "global_step": 32518, "epoch": 391} {"train_loss": -19.278379440307617, "global_step": 32519, "epoch": 391} {"train_loss": -19.21363639831543, "global_step": 32520, "epoch": 391} {"train_loss": -19.073774337768555, "global_step": 32521, "epoch": 391} {"train_loss": -18.95267105102539, "global_step": 32522, "epoch": 391} {"train_loss": -18.990009307861328, "global_step": 32523, "epoch": 391} {"train_loss": -18.96836280822754, "global_step": 32524, "epoch": 391} {"train_loss": -18.884855270385742, "global_step": 32525, "epoch": 391} {"train_loss": -19.306249618530273, "global_step": 32526, "epoch": 391} {"train_loss": -18.983427047729492, "global_step": 32527, "epoch": 391} {"train_loss": -18.99818992614746, "global_step": 32528, "epoch": 391} {"train_loss": -18.991653442382812, "global_step": 32529, "epoch": 391} {"train_loss": -18.832746505737305, "global_step": 32530, "epoch": 391} {"train_loss": -19.087421417236328, "global_step": 32531, "epoch": 391} {"train_loss": -19.194507598876953, "global_step": 32532, "epoch": 391} {"train_loss": -19.01122283935547, "global_step": 32533, "epoch": 391} {"train_loss": -18.630630493164062, "global_step": 32534, "epoch": 391} {"train_loss": -19.054334962224384, "global_step": 32535, "epoch": 391, "val_loss": 6052577.5} {"train_loss": -18.752599716186523, "global_step": 32536, "epoch": 392} {"train_loss": -18.859466552734375, "global_step": 32537, "epoch": 392} {"train_loss": -18.819669723510742, "global_step": 32538, "epoch": 392} {"train_loss": -18.426856994628906, "global_step": 32539, "epoch": 392} {"train_loss": -18.822423934936523, "global_step": 32540, "epoch": 392} {"train_loss": -18.16847038269043, "global_step": 32541, "epoch": 392} {"train_loss": -18.69351577758789, "global_step": 32542, "epoch": 392} {"train_loss": -18.854379653930664, "global_step": 32543, "epoch": 392} {"train_loss": -19.204450607299805, "global_step": 32544, "epoch": 392} {"train_loss": -18.950912475585938, "global_step": 32545, "epoch": 392} {"train_loss": -19.046903610229492, "global_step": 32546, "epoch": 392} {"train_loss": -18.78194808959961, "global_step": 32547, "epoch": 392} {"train_loss": -19.2537899017334, "global_step": 32548, "epoch": 392} {"train_loss": -19.043249130249023, "global_step": 32549, "epoch": 392} {"train_loss": -19.212631225585938, "global_step": 32550, "epoch": 392} {"train_loss": -18.898845672607422, "global_step": 32551, "epoch": 392} {"train_loss": -18.997943878173828, "global_step": 32552, "epoch": 392} {"train_loss": -18.881391525268555, "global_step": 32553, "epoch": 392} {"train_loss": -19.05084228515625, "global_step": 32554, "epoch": 392} {"train_loss": -19.234893798828125, "global_step": 32555, "epoch": 392} {"train_loss": -19.102371215820312, "global_step": 32556, "epoch": 392} {"train_loss": -19.365924835205078, "global_step": 32557, "epoch": 392} {"train_loss": -18.946380615234375, "global_step": 32558, "epoch": 392} {"train_loss": -19.347869873046875, "global_step": 32559, "epoch": 392} {"train_loss": -19.1789608001709, "global_step": 32560, "epoch": 392} {"train_loss": -19.170957565307617, "global_step": 32561, "epoch": 392} {"train_loss": -19.14081382751465, "global_step": 32562, "epoch": 392} {"train_loss": -18.944246292114258, "global_step": 32563, "epoch": 392} {"train_loss": -19.296743392944336, "global_step": 32564, "epoch": 392} {"train_loss": -19.205129623413086, "global_step": 32565, "epoch": 392} {"train_loss": -19.06939697265625, "global_step": 32566, "epoch": 392} {"train_loss": -19.396682739257812, "global_step": 32567, "epoch": 392} {"train_loss": -19.134857177734375, "global_step": 32568, "epoch": 392} {"train_loss": -19.456026077270508, "global_step": 32569, "epoch": 392} {"train_loss": -19.095365524291992, "global_step": 32570, "epoch": 392} {"train_loss": -18.920928955078125, "global_step": 32571, "epoch": 392} {"train_loss": -19.286808013916016, "global_step": 32572, "epoch": 392} {"train_loss": -19.10597801208496, "global_step": 32573, "epoch": 392} {"train_loss": -19.205280303955078, "global_step": 32574, "epoch": 392} {"train_loss": -18.70551872253418, "global_step": 32575, "epoch": 392} {"train_loss": -18.760746002197266, "global_step": 32576, "epoch": 392} {"train_loss": -19.39731216430664, "global_step": 32577, "epoch": 392} {"train_loss": -19.113876342773438, "global_step": 32578, "epoch": 392} {"train_loss": -19.099607467651367, "global_step": 32579, "epoch": 392} {"train_loss": -18.85972023010254, "global_step": 32580, "epoch": 392} {"train_loss": -19.109678268432617, "global_step": 32581, "epoch": 392} {"train_loss": -19.168197631835938, "global_step": 32582, "epoch": 392} {"train_loss": -18.9073486328125, "global_step": 32583, "epoch": 392} {"train_loss": -19.249797821044922, "global_step": 32584, "epoch": 392} {"train_loss": -19.187345504760742, "global_step": 32585, "epoch": 392} {"train_loss": -19.125844955444336, "global_step": 32586, "epoch": 392} {"train_loss": -19.09923553466797, "global_step": 32587, "epoch": 392} {"train_loss": -18.914649963378906, "global_step": 32588, "epoch": 392} {"train_loss": -19.006820678710938, "global_step": 32589, "epoch": 392} {"train_loss": -18.94867515563965, "global_step": 32590, "epoch": 392} {"train_loss": -19.011276245117188, "global_step": 32591, "epoch": 392} {"train_loss": -19.052576065063477, "global_step": 32592, "epoch": 392} {"train_loss": -18.634946823120117, "global_step": 32593, "epoch": 392} {"train_loss": -18.787328720092773, "global_step": 32594, "epoch": 392} {"train_loss": -18.88679313659668, "global_step": 32595, "epoch": 392} {"train_loss": -19.061420440673828, "global_step": 32596, "epoch": 392} {"train_loss": -19.065582275390625, "global_step": 32597, "epoch": 392} {"train_loss": -19.13844108581543, "global_step": 32598, "epoch": 392} {"train_loss": -18.862401962280273, "global_step": 32599, "epoch": 392} {"train_loss": -19.257593154907227, "global_step": 32600, "epoch": 392} {"train_loss": -18.342065811157227, "global_step": 32601, "epoch": 392} {"train_loss": -18.786725997924805, "global_step": 32602, "epoch": 392} {"train_loss": -19.09900665283203, "global_step": 32603, "epoch": 392} {"train_loss": -19.168106079101562, "global_step": 32604, "epoch": 392} {"train_loss": -19.255300521850586, "global_step": 32605, "epoch": 392} {"train_loss": -19.184009552001953, "global_step": 32606, "epoch": 392} {"train_loss": -19.300500869750977, "global_step": 32607, "epoch": 392} {"train_loss": -19.001554489135742, "global_step": 32608, "epoch": 392} {"train_loss": -18.953691482543945, "global_step": 32609, "epoch": 392} {"train_loss": -18.999053955078125, "global_step": 32610, "epoch": 392} {"train_loss": -18.866527557373047, "global_step": 32611, "epoch": 392} {"train_loss": -19.48845672607422, "global_step": 32612, "epoch": 392} {"train_loss": -19.04495620727539, "global_step": 32613, "epoch": 392} {"train_loss": -18.8297061920166, "global_step": 32614, "epoch": 392} {"train_loss": -18.713287353515625, "global_step": 32615, "epoch": 392} {"train_loss": -18.921072006225586, "global_step": 32616, "epoch": 392} {"train_loss": -18.94233512878418, "global_step": 32617, "epoch": 392} {"train_loss": -19.01276505711567, "global_step": 32618, "epoch": 392, "val_loss": 6117774.5} {"train_loss": -18.103620529174805, "global_step": 32619, "epoch": 393} {"train_loss": -18.776599884033203, "global_step": 32620, "epoch": 393} {"train_loss": -18.691476821899414, "global_step": 32621, "epoch": 393} {"train_loss": -18.41499900817871, "global_step": 32622, "epoch": 393} {"train_loss": -19.00226402282715, "global_step": 32623, "epoch": 393} {"train_loss": -18.620527267456055, "global_step": 32624, "epoch": 393} {"train_loss": -19.056121826171875, "global_step": 32625, "epoch": 393} {"train_loss": -19.24020767211914, "global_step": 32626, "epoch": 393} {"train_loss": -18.981664657592773, "global_step": 32627, "epoch": 393} {"train_loss": -18.75484275817871, "global_step": 32628, "epoch": 393} {"train_loss": -19.016172409057617, "global_step": 32629, "epoch": 393} {"train_loss": -18.900596618652344, "global_step": 32630, "epoch": 393} {"train_loss": -18.970869064331055, "global_step": 32631, "epoch": 393} {"train_loss": -19.158390045166016, "global_step": 32632, "epoch": 393} {"train_loss": -18.857105255126953, "global_step": 32633, "epoch": 393} {"train_loss": -19.109495162963867, "global_step": 32634, "epoch": 393} {"train_loss": -19.146854400634766, "global_step": 32635, "epoch": 393} {"train_loss": -19.104827880859375, "global_step": 32636, "epoch": 393} {"train_loss": -19.124103546142578, "global_step": 32637, "epoch": 393} {"train_loss": -18.756404876708984, "global_step": 32638, "epoch": 393} {"train_loss": -19.176288604736328, "global_step": 32639, "epoch": 393} {"train_loss": -19.3006649017334, "global_step": 32640, "epoch": 393} {"train_loss": -18.5917911529541, "global_step": 32641, "epoch": 393} {"train_loss": -18.705366134643555, "global_step": 32642, "epoch": 393} {"train_loss": -19.140583038330078, "global_step": 32643, "epoch": 393} {"train_loss": -19.17203712463379, "global_step": 32644, "epoch": 393} {"train_loss": -18.947973251342773, "global_step": 32645, "epoch": 393} {"train_loss": -19.034387588500977, "global_step": 32646, "epoch": 393} {"train_loss": -18.977140426635742, "global_step": 32647, "epoch": 393} {"train_loss": -18.82254981994629, "global_step": 32648, "epoch": 393} {"train_loss": -18.693754196166992, "global_step": 32649, "epoch": 393} {"train_loss": -18.962284088134766, "global_step": 32650, "epoch": 393} {"train_loss": -18.802114486694336, "global_step": 32651, "epoch": 393} {"train_loss": -19.029638290405273, "global_step": 32652, "epoch": 393} {"train_loss": -19.028039932250977, "global_step": 32653, "epoch": 393} {"train_loss": -18.878427505493164, "global_step": 32654, "epoch": 393} {"train_loss": -19.268369674682617, "global_step": 32655, "epoch": 393} {"train_loss": -19.133207321166992, "global_step": 32656, "epoch": 393} {"train_loss": -19.35154151916504, "global_step": 32657, "epoch": 393} {"train_loss": -19.26576042175293, "global_step": 32658, "epoch": 393} {"train_loss": -19.171506881713867, "global_step": 32659, "epoch": 393} {"train_loss": -19.389333724975586, "global_step": 32660, "epoch": 393} {"train_loss": -18.80134391784668, "global_step": 32661, "epoch": 393} {"train_loss": -19.297510147094727, "global_step": 32662, "epoch": 393} {"train_loss": -19.138002395629883, "global_step": 32663, "epoch": 393} {"train_loss": -18.968706130981445, "global_step": 32664, "epoch": 393} {"train_loss": -19.081787109375, "global_step": 32665, "epoch": 393} {"train_loss": -19.54547691345215, "global_step": 32666, "epoch": 393} {"train_loss": -19.040313720703125, "global_step": 32667, "epoch": 393} {"train_loss": -19.337371826171875, "global_step": 32668, "epoch": 393} {"train_loss": -18.711563110351562, "global_step": 32669, "epoch": 393} {"train_loss": -19.149694442749023, "global_step": 32670, "epoch": 393} {"train_loss": -19.10950469970703, "global_step": 32671, "epoch": 393} {"train_loss": -19.2115421295166, "global_step": 32672, "epoch": 393} {"train_loss": -19.064420700073242, "global_step": 32673, "epoch": 393} {"train_loss": -18.713199615478516, "global_step": 32674, "epoch": 393} {"train_loss": -19.070322036743164, "global_step": 32675, "epoch": 393} {"train_loss": -18.953887939453125, "global_step": 32676, "epoch": 393} {"train_loss": -19.014427185058594, "global_step": 32677, "epoch": 393} {"train_loss": -19.37424659729004, "global_step": 32678, "epoch": 393} {"train_loss": -18.75791358947754, "global_step": 32679, "epoch": 393} {"train_loss": -18.908580780029297, "global_step": 32680, "epoch": 393} {"train_loss": -19.202285766601562, "global_step": 32681, "epoch": 393} {"train_loss": -19.194019317626953, "global_step": 32682, "epoch": 393} {"train_loss": -19.137104034423828, "global_step": 32683, "epoch": 393} {"train_loss": -19.331960678100586, "global_step": 32684, "epoch": 393} {"train_loss": -18.937795639038086, "global_step": 32685, "epoch": 393} {"train_loss": -19.137006759643555, "global_step": 32686, "epoch": 393} {"train_loss": -19.008281707763672, "global_step": 32687, "epoch": 393} {"train_loss": -19.305484771728516, "global_step": 32688, "epoch": 393} {"train_loss": -19.248159408569336, "global_step": 32689, "epoch": 393} {"train_loss": -18.801034927368164, "global_step": 32690, "epoch": 393} {"train_loss": -19.029603958129883, "global_step": 32691, "epoch": 393} {"train_loss": -19.071767807006836, "global_step": 32692, "epoch": 393} {"train_loss": -18.99493408203125, "global_step": 32693, "epoch": 393} {"train_loss": -19.14564323425293, "global_step": 32694, "epoch": 393} {"train_loss": -18.9212646484375, "global_step": 32695, "epoch": 393} {"train_loss": -18.799299240112305, "global_step": 32696, "epoch": 393} {"train_loss": -18.934886932373047, "global_step": 32697, "epoch": 393} {"train_loss": -19.07146644592285, "global_step": 32698, "epoch": 393} {"train_loss": -18.947328567504883, "global_step": 32699, "epoch": 393} {"train_loss": -19.013822555541992, "global_step": 32700, "epoch": 393} {"train_loss": -19.010513765266143, "global_step": 32701, "epoch": 393, "val_loss": 6031617.5} {"train_loss": -18.999326705932617, "global_step": 32702, "epoch": 394} {"train_loss": -18.958303451538086, "global_step": 32703, "epoch": 394} {"train_loss": -18.85235023498535, "global_step": 32704, "epoch": 394} {"train_loss": -19.07114028930664, "global_step": 32705, "epoch": 394} {"train_loss": -18.84791374206543, "global_step": 32706, "epoch": 394} {"train_loss": -19.237045288085938, "global_step": 32707, "epoch": 394} {"train_loss": -18.762266159057617, "global_step": 32708, "epoch": 394} {"train_loss": -19.290199279785156, "global_step": 32709, "epoch": 394} {"train_loss": -18.992380142211914, "global_step": 32710, "epoch": 394} {"train_loss": -18.854398727416992, "global_step": 32711, "epoch": 394} {"train_loss": -19.307825088500977, "global_step": 32712, "epoch": 394} {"train_loss": -18.67543601989746, "global_step": 32713, "epoch": 394} {"train_loss": -18.947450637817383, "global_step": 32714, "epoch": 394} {"train_loss": -18.723373413085938, "global_step": 32715, "epoch": 394} {"train_loss": -19.060455322265625, "global_step": 32716, "epoch": 394} {"train_loss": -18.718618392944336, "global_step": 32717, "epoch": 394} {"train_loss": -19.0966854095459, "global_step": 32718, "epoch": 394} {"train_loss": -19.08976936340332, "global_step": 32719, "epoch": 394} {"train_loss": -18.79295539855957, "global_step": 32720, "epoch": 394} {"train_loss": -18.567535400390625, "global_step": 32721, "epoch": 394} {"train_loss": -19.159198760986328, "global_step": 32722, "epoch": 394} {"train_loss": -18.97024154663086, "global_step": 32723, "epoch": 394} {"train_loss": -19.14466094970703, "global_step": 32724, "epoch": 394} {"train_loss": -18.78937530517578, "global_step": 32725, "epoch": 394} {"train_loss": -18.967891693115234, "global_step": 32726, "epoch": 394} {"train_loss": -19.13460350036621, "global_step": 32727, "epoch": 394} {"train_loss": -18.8283748626709, "global_step": 32728, "epoch": 394} {"train_loss": -19.12579917907715, "global_step": 32729, "epoch": 394} {"train_loss": -19.095748901367188, "global_step": 32730, "epoch": 394} {"train_loss": -18.831846237182617, "global_step": 32731, "epoch": 394} {"train_loss": -19.082944869995117, "global_step": 32732, "epoch": 394} {"train_loss": -18.645095825195312, "global_step": 32733, "epoch": 394} {"train_loss": -19.242395401000977, "global_step": 32734, "epoch": 394} {"train_loss": -19.302825927734375, "global_step": 32735, "epoch": 394} {"train_loss": -18.868736267089844, "global_step": 32736, "epoch": 394} {"train_loss": -19.131765365600586, "global_step": 32737, "epoch": 394} {"train_loss": -18.404672622680664, "global_step": 32738, "epoch": 394} {"train_loss": -19.17991065979004, "global_step": 32739, "epoch": 394} {"train_loss": -19.623342514038086, "global_step": 32740, "epoch": 394} {"train_loss": -19.177459716796875, "global_step": 32741, "epoch": 394} {"train_loss": -19.18408203125, "global_step": 32742, "epoch": 394} {"train_loss": -19.20306396484375, "global_step": 32743, "epoch": 394} {"train_loss": -18.950668334960938, "global_step": 32744, "epoch": 394} {"train_loss": -19.1895694732666, "global_step": 32745, "epoch": 394} {"train_loss": -19.149669647216797, "global_step": 32746, "epoch": 394} {"train_loss": -19.130590438842773, "global_step": 32747, "epoch": 394} {"train_loss": -19.41665267944336, "global_step": 32748, "epoch": 394} {"train_loss": -19.093738555908203, "global_step": 32749, "epoch": 394} {"train_loss": -18.910266876220703, "global_step": 32750, "epoch": 394} {"train_loss": -19.489622116088867, "global_step": 32751, "epoch": 394} {"train_loss": -19.3785457611084, "global_step": 32752, "epoch": 394} {"train_loss": -19.233291625976562, "global_step": 32753, "epoch": 394} {"train_loss": -19.134288787841797, "global_step": 32754, "epoch": 394} {"train_loss": -19.063016891479492, "global_step": 32755, "epoch": 394} {"train_loss": -18.981632232666016, "global_step": 32756, "epoch": 394} {"train_loss": -18.997634887695312, "global_step": 32757, "epoch": 394} {"train_loss": -19.099393844604492, "global_step": 32758, "epoch": 394} {"train_loss": -19.29867935180664, "global_step": 32759, "epoch": 394} {"train_loss": -19.0487060546875, "global_step": 32760, "epoch": 394} {"train_loss": -19.485868453979492, "global_step": 32761, "epoch": 394} {"train_loss": -19.229909896850586, "global_step": 32762, "epoch": 394} {"train_loss": -19.203815460205078, "global_step": 32763, "epoch": 394} {"train_loss": -19.16875648498535, "global_step": 32764, "epoch": 394} {"train_loss": -19.34467887878418, "global_step": 32765, "epoch": 394} {"train_loss": -19.3471736907959, "global_step": 32766, "epoch": 394} {"train_loss": -19.117406845092773, "global_step": 32767, "epoch": 394} {"train_loss": -19.052358627319336, "global_step": 32768, "epoch": 394} {"train_loss": -19.140018463134766, "global_step": 32769, "epoch": 394} {"train_loss": -19.185819625854492, "global_step": 32770, "epoch": 394} {"train_loss": -19.566221237182617, "global_step": 32771, "epoch": 394} {"train_loss": -19.117908477783203, "global_step": 32772, "epoch": 394} {"train_loss": -19.3749942779541, "global_step": 32773, "epoch": 394} {"train_loss": -19.02581214904785, "global_step": 32774, "epoch": 394} {"train_loss": -19.055604934692383, "global_step": 32775, "epoch": 394} {"train_loss": -19.237407684326172, "global_step": 32776, "epoch": 394} {"train_loss": -18.87159538269043, "global_step": 32777, "epoch": 394} {"train_loss": -18.866668701171875, "global_step": 32778, "epoch": 394} {"train_loss": -19.37545394897461, "global_step": 32779, "epoch": 394} {"train_loss": -18.975799560546875, "global_step": 32780, "epoch": 394} {"train_loss": -18.708526611328125, "global_step": 32781, "epoch": 394} {"train_loss": -19.241140365600586, "global_step": 32782, "epoch": 394} {"train_loss": -19.35411834716797, "global_step": 32783, "epoch": 394} {"train_loss": -19.07508962700166, "global_step": 32784, "epoch": 394, "val_loss": 6153165.0} {"train_loss": -18.5241756439209, "global_step": 32785, "epoch": 395} {"train_loss": -18.546716690063477, "global_step": 32786, "epoch": 395} {"train_loss": -18.73101234436035, "global_step": 32787, "epoch": 395} {"train_loss": -18.956396102905273, "global_step": 32788, "epoch": 395} {"train_loss": -18.63252830505371, "global_step": 32789, "epoch": 395} {"train_loss": -18.636144638061523, "global_step": 32790, "epoch": 395} {"train_loss": -18.67874526977539, "global_step": 32791, "epoch": 395} {"train_loss": -18.39081382751465, "global_step": 32792, "epoch": 395} {"train_loss": -18.953567504882812, "global_step": 32793, "epoch": 395} {"train_loss": -18.58502769470215, "global_step": 32794, "epoch": 395} {"train_loss": -19.39625358581543, "global_step": 32795, "epoch": 395} {"train_loss": -19.32991600036621, "global_step": 32796, "epoch": 395} {"train_loss": -19.05360221862793, "global_step": 32797, "epoch": 395} {"train_loss": -19.249391555786133, "global_step": 32798, "epoch": 395} {"train_loss": -19.202484130859375, "global_step": 32799, "epoch": 395} {"train_loss": -19.0718936920166, "global_step": 32800, "epoch": 395} {"train_loss": -18.615381240844727, "global_step": 32801, "epoch": 395} {"train_loss": -18.75923728942871, "global_step": 32802, "epoch": 395} {"train_loss": -19.22467803955078, "global_step": 32803, "epoch": 395} {"train_loss": -18.99144744873047, "global_step": 32804, "epoch": 395} {"train_loss": -18.57322120666504, "global_step": 32805, "epoch": 395} {"train_loss": -18.660863876342773, "global_step": 32806, "epoch": 395} {"train_loss": -18.86100196838379, "global_step": 32807, "epoch": 395} {"train_loss": -19.01214027404785, "global_step": 32808, "epoch": 395} {"train_loss": -19.22183609008789, "global_step": 32809, "epoch": 395} {"train_loss": -19.493818283081055, "global_step": 32810, "epoch": 395} {"train_loss": -19.140344619750977, "global_step": 32811, "epoch": 395} {"train_loss": -19.00934410095215, "global_step": 32812, "epoch": 395} {"train_loss": -18.793424606323242, "global_step": 32813, "epoch": 395} {"train_loss": -18.93149185180664, "global_step": 32814, "epoch": 395} {"train_loss": -19.45926284790039, "global_step": 32815, "epoch": 395} {"train_loss": -19.013778686523438, "global_step": 32816, "epoch": 395} {"train_loss": -19.003320693969727, "global_step": 32817, "epoch": 395} {"train_loss": -19.10810661315918, "global_step": 32818, "epoch": 395} {"train_loss": -19.227275848388672, "global_step": 32819, "epoch": 395} {"train_loss": -19.034198760986328, "global_step": 32820, "epoch": 395} {"train_loss": -19.381847381591797, "global_step": 32821, "epoch": 395} {"train_loss": -18.522621154785156, "global_step": 32822, "epoch": 395} {"train_loss": -19.023273468017578, "global_step": 32823, "epoch": 395} {"train_loss": -19.11032485961914, "global_step": 32824, "epoch": 395} {"train_loss": -18.961111068725586, "global_step": 32825, "epoch": 395} {"train_loss": -18.874826431274414, "global_step": 32826, "epoch": 395} {"train_loss": -19.171850204467773, "global_step": 32827, "epoch": 395} {"train_loss": -19.039039611816406, "global_step": 32828, "epoch": 395} {"train_loss": -18.96402359008789, "global_step": 32829, "epoch": 395} {"train_loss": -18.92877769470215, "global_step": 32830, "epoch": 395} {"train_loss": -19.26706314086914, "global_step": 32831, "epoch": 395} {"train_loss": -18.97389793395996, "global_step": 32832, "epoch": 395} {"train_loss": -19.02850914001465, "global_step": 32833, "epoch": 395} {"train_loss": -19.206283569335938, "global_step": 32834, "epoch": 395} {"train_loss": -19.19331169128418, "global_step": 32835, "epoch": 395} {"train_loss": -19.179550170898438, "global_step": 32836, "epoch": 395} {"train_loss": -18.703453063964844, "global_step": 32837, "epoch": 395} {"train_loss": -18.49614715576172, "global_step": 32838, "epoch": 395} {"train_loss": -18.464441299438477, "global_step": 32839, "epoch": 395} {"train_loss": -19.034290313720703, "global_step": 32840, "epoch": 395} {"train_loss": -19.210439682006836, "global_step": 32841, "epoch": 395} {"train_loss": -19.062150955200195, "global_step": 32842, "epoch": 395} {"train_loss": -19.050867080688477, "global_step": 32843, "epoch": 395} {"train_loss": -19.267154693603516, "global_step": 32844, "epoch": 395} {"train_loss": -18.90217399597168, "global_step": 32845, "epoch": 395} {"train_loss": -19.295339584350586, "global_step": 32846, "epoch": 395} {"train_loss": -18.8539981842041, "global_step": 32847, "epoch": 395} {"train_loss": -18.861631393432617, "global_step": 32848, "epoch": 395} {"train_loss": -19.108667373657227, "global_step": 32849, "epoch": 395} {"train_loss": -19.05283546447754, "global_step": 32850, "epoch": 395} {"train_loss": -19.012094497680664, "global_step": 32851, "epoch": 395} {"train_loss": -18.85993766784668, "global_step": 32852, "epoch": 395} {"train_loss": -18.904319763183594, "global_step": 32853, "epoch": 395} {"train_loss": -19.408340454101562, "global_step": 32854, "epoch": 395} {"train_loss": -19.21860694885254, "global_step": 32855, "epoch": 395} {"train_loss": -19.48029899597168, "global_step": 32856, "epoch": 395} {"train_loss": -18.989221572875977, "global_step": 32857, "epoch": 395} {"train_loss": -19.213830947875977, "global_step": 32858, "epoch": 395} {"train_loss": -19.087554931640625, "global_step": 32859, "epoch": 395} {"train_loss": -19.321142196655273, "global_step": 32860, "epoch": 395} {"train_loss": -19.580360412597656, "global_step": 32861, "epoch": 395} {"train_loss": -19.428939819335938, "global_step": 32862, "epoch": 395} {"train_loss": -18.933443069458008, "global_step": 32863, "epoch": 395} {"train_loss": -19.12986946105957, "global_step": 32864, "epoch": 395} {"train_loss": -19.1098690032959, "global_step": 32865, "epoch": 395} {"train_loss": -19.429859161376953, "global_step": 32866, "epoch": 395} {"train_loss": -19.028003187064666, "global_step": 32867, "epoch": 395, "val_loss": 6059967.0} {"train_loss": -19.333932876586914, "global_step": 32868, "epoch": 396} {"train_loss": -18.938535690307617, "global_step": 32869, "epoch": 396} {"train_loss": -19.030210494995117, "global_step": 32870, "epoch": 396} {"train_loss": -19.00911521911621, "global_step": 32871, "epoch": 396} {"train_loss": -19.268217086791992, "global_step": 32872, "epoch": 396} {"train_loss": -19.164518356323242, "global_step": 32873, "epoch": 396} {"train_loss": -19.11686897277832, "global_step": 32874, "epoch": 396} {"train_loss": -19.33524513244629, "global_step": 32875, "epoch": 396} {"train_loss": -19.17045021057129, "global_step": 32876, "epoch": 396} {"train_loss": -18.9092960357666, "global_step": 32877, "epoch": 396} {"train_loss": -18.920774459838867, "global_step": 32878, "epoch": 396} {"train_loss": -18.926433563232422, "global_step": 32879, "epoch": 396} {"train_loss": -19.049028396606445, "global_step": 32880, "epoch": 396} {"train_loss": -18.752904891967773, "global_step": 32881, "epoch": 396} {"train_loss": -18.889387130737305, "global_step": 32882, "epoch": 396} {"train_loss": -19.100879669189453, "global_step": 32883, "epoch": 396} {"train_loss": -19.33303451538086, "global_step": 32884, "epoch": 396} {"train_loss": -19.17951774597168, "global_step": 32885, "epoch": 396} {"train_loss": -18.86707878112793, "global_step": 32886, "epoch": 396} {"train_loss": -19.33932876586914, "global_step": 32887, "epoch": 396} {"train_loss": -19.057619094848633, "global_step": 32888, "epoch": 396} {"train_loss": -19.244300842285156, "global_step": 32889, "epoch": 396} {"train_loss": -18.851512908935547, "global_step": 32890, "epoch": 396} {"train_loss": -18.853839874267578, "global_step": 32891, "epoch": 396} {"train_loss": -18.783254623413086, "global_step": 32892, "epoch": 396} {"train_loss": -18.845312118530273, "global_step": 32893, "epoch": 396} {"train_loss": -18.830286026000977, "global_step": 32894, "epoch": 396} {"train_loss": -19.514888763427734, "global_step": 32895, "epoch": 396} {"train_loss": -19.190031051635742, "global_step": 32896, "epoch": 396} {"train_loss": -19.3916015625, "global_step": 32897, "epoch": 396} {"train_loss": -19.330551147460938, "global_step": 32898, "epoch": 396} {"train_loss": -19.665328979492188, "global_step": 32899, "epoch": 396} {"train_loss": -19.35802459716797, "global_step": 32900, "epoch": 396} {"train_loss": -19.402036666870117, "global_step": 32901, "epoch": 396} {"train_loss": -19.33381462097168, "global_step": 32902, "epoch": 396} {"train_loss": -19.108505249023438, "global_step": 32903, "epoch": 396} {"train_loss": -19.133136749267578, "global_step": 32904, "epoch": 396} {"train_loss": -18.940305709838867, "global_step": 32905, "epoch": 396} {"train_loss": -19.07991600036621, "global_step": 32906, "epoch": 396} {"train_loss": -18.931867599487305, "global_step": 32907, "epoch": 396} {"train_loss": -18.867000579833984, "global_step": 32908, "epoch": 396} {"train_loss": -19.455617904663086, "global_step": 32909, "epoch": 396} {"train_loss": -19.049297332763672, "global_step": 32910, "epoch": 396} {"train_loss": -18.689414978027344, "global_step": 32911, "epoch": 396} {"train_loss": -18.80022430419922, "global_step": 32912, "epoch": 396} {"train_loss": -19.281713485717773, "global_step": 32913, "epoch": 396} {"train_loss": -19.046621322631836, "global_step": 32914, "epoch": 396} {"train_loss": -19.15468406677246, "global_step": 32915, "epoch": 396} {"train_loss": -18.784133911132812, "global_step": 32916, "epoch": 396} {"train_loss": -19.392940521240234, "global_step": 32917, "epoch": 396} {"train_loss": -18.892337799072266, "global_step": 32918, "epoch": 396} {"train_loss": -18.83211898803711, "global_step": 32919, "epoch": 396} {"train_loss": -19.125802993774414, "global_step": 32920, "epoch": 396} {"train_loss": -19.001121520996094, "global_step": 32921, "epoch": 396} {"train_loss": -19.263797760009766, "global_step": 32922, "epoch": 396} {"train_loss": -18.800039291381836, "global_step": 32923, "epoch": 396} {"train_loss": -19.061033248901367, "global_step": 32924, "epoch": 396} {"train_loss": -18.8792667388916, "global_step": 32925, "epoch": 396} {"train_loss": -19.039709091186523, "global_step": 32926, "epoch": 396} {"train_loss": -19.180240631103516, "global_step": 32927, "epoch": 396} {"train_loss": -19.030317306518555, "global_step": 32928, "epoch": 396} {"train_loss": -19.323617935180664, "global_step": 32929, "epoch": 396} {"train_loss": -18.88097381591797, "global_step": 32930, "epoch": 396} {"train_loss": -18.90478515625, "global_step": 32931, "epoch": 396} {"train_loss": -19.001569747924805, "global_step": 32932, "epoch": 396} {"train_loss": -19.34151840209961, "global_step": 32933, "epoch": 396} {"train_loss": -18.97843360900879, "global_step": 32934, "epoch": 396} {"train_loss": -19.318056106567383, "global_step": 32935, "epoch": 396} {"train_loss": -19.1185359954834, "global_step": 32936, "epoch": 396} {"train_loss": -19.143178939819336, "global_step": 32937, "epoch": 396} {"train_loss": -18.945560455322266, "global_step": 32938, "epoch": 396} {"train_loss": -19.041460037231445, "global_step": 32939, "epoch": 396} {"train_loss": -18.866195678710938, "global_step": 32940, "epoch": 396} {"train_loss": -19.179628372192383, "global_step": 32941, "epoch": 396} {"train_loss": -19.192548751831055, "global_step": 32942, "epoch": 396} {"train_loss": -18.9943790435791, "global_step": 32943, "epoch": 396} {"train_loss": -18.768756866455078, "global_step": 32944, "epoch": 396} {"train_loss": -18.87676239013672, "global_step": 32945, "epoch": 396} {"train_loss": -18.81529426574707, "global_step": 32946, "epoch": 396} {"train_loss": -19.111377716064453, "global_step": 32947, "epoch": 396} {"train_loss": -19.13763999938965, "global_step": 32948, "epoch": 396} {"train_loss": -19.249515533447266, "global_step": 32949, "epoch": 396} {"train_loss": -19.078026001711926, "global_step": 32950, "epoch": 396, "val_loss": 6136932.5} {"train_loss": -19.174043655395508, "global_step": 32951, "epoch": 397} {"train_loss": -19.063772201538086, "global_step": 32952, "epoch": 397} {"train_loss": -19.14420509338379, "global_step": 32953, "epoch": 397} {"train_loss": -19.23433494567871, "global_step": 32954, "epoch": 397} {"train_loss": -19.157018661499023, "global_step": 32955, "epoch": 397} {"train_loss": -19.276309967041016, "global_step": 32956, "epoch": 397} {"train_loss": -19.09023666381836, "global_step": 32957, "epoch": 397} {"train_loss": -18.89631462097168, "global_step": 32958, "epoch": 397} {"train_loss": -19.124534606933594, "global_step": 32959, "epoch": 397} {"train_loss": -18.9315185546875, "global_step": 32960, "epoch": 397} {"train_loss": -19.2518310546875, "global_step": 32961, "epoch": 397} {"train_loss": -19.19205665588379, "global_step": 32962, "epoch": 397} {"train_loss": -19.05721664428711, "global_step": 32963, "epoch": 397} {"train_loss": -18.62134552001953, "global_step": 32964, "epoch": 397} {"train_loss": -18.969045639038086, "global_step": 32965, "epoch": 397} {"train_loss": -18.83732032775879, "global_step": 32966, "epoch": 397} {"train_loss": -18.86836814880371, "global_step": 32967, "epoch": 397} {"train_loss": -19.580183029174805, "global_step": 32968, "epoch": 397} {"train_loss": -19.468183517456055, "global_step": 32969, "epoch": 397} {"train_loss": -19.067594528198242, "global_step": 32970, "epoch": 397} {"train_loss": -19.18049430847168, "global_step": 32971, "epoch": 397} {"train_loss": -18.87396812438965, "global_step": 32972, "epoch": 397} {"train_loss": -19.389249801635742, "global_step": 32973, "epoch": 397} {"train_loss": -18.88050651550293, "global_step": 32974, "epoch": 397} {"train_loss": -19.04683494567871, "global_step": 32975, "epoch": 397} {"train_loss": -18.987979888916016, "global_step": 32976, "epoch": 397} {"train_loss": -18.907798767089844, "global_step": 32977, "epoch": 397} {"train_loss": -19.477893829345703, "global_step": 32978, "epoch": 397} {"train_loss": -19.092912673950195, "global_step": 32979, "epoch": 397} {"train_loss": -19.2916259765625, "global_step": 32980, "epoch": 397} {"train_loss": -18.732879638671875, "global_step": 32981, "epoch": 397} {"train_loss": -18.82411766052246, "global_step": 32982, "epoch": 397} {"train_loss": -19.38216781616211, "global_step": 32983, "epoch": 397} {"train_loss": -19.295654296875, "global_step": 32984, "epoch": 397} {"train_loss": -18.87001609802246, "global_step": 32985, "epoch": 397} {"train_loss": -19.271757125854492, "global_step": 32986, "epoch": 397} {"train_loss": -19.23808479309082, "global_step": 32987, "epoch": 397} {"train_loss": -19.071304321289062, "global_step": 32988, "epoch": 397} {"train_loss": -19.13456916809082, "global_step": 32989, "epoch": 397} {"train_loss": -19.01240348815918, "global_step": 32990, "epoch": 397} {"train_loss": -19.194345474243164, "global_step": 32991, "epoch": 397} {"train_loss": -19.13567543029785, "global_step": 32992, "epoch": 397} {"train_loss": -19.054672241210938, "global_step": 32993, "epoch": 397} {"train_loss": -19.14090347290039, "global_step": 32994, "epoch": 397} {"train_loss": -19.138538360595703, "global_step": 32995, "epoch": 397} {"train_loss": -18.817235946655273, "global_step": 32996, "epoch": 397} {"train_loss": -18.78622055053711, "global_step": 32997, "epoch": 397} {"train_loss": -19.0474910736084, "global_step": 32998, "epoch": 397} {"train_loss": -19.12563133239746, "global_step": 32999, "epoch": 397} {"train_loss": -19.0749568939209, "global_step": 33000, "epoch": 397} {"train_loss": -19.27037239074707, "global_step": 33001, "epoch": 397} {"train_loss": -19.408655166625977, "global_step": 33002, "epoch": 397} {"train_loss": -19.32080841064453, "global_step": 33003, "epoch": 397} {"train_loss": -19.0131778717041, "global_step": 33004, "epoch": 397} {"train_loss": -18.892436981201172, "global_step": 33005, "epoch": 397} {"train_loss": -18.799579620361328, "global_step": 33006, "epoch": 397} {"train_loss": -18.908676147460938, "global_step": 33007, "epoch": 397} {"train_loss": -19.054563522338867, "global_step": 33008, "epoch": 397} {"train_loss": -18.618698120117188, "global_step": 33009, "epoch": 397} {"train_loss": -19.02884292602539, "global_step": 33010, "epoch": 397} {"train_loss": -19.12291717529297, "global_step": 33011, "epoch": 397} {"train_loss": -19.463043212890625, "global_step": 33012, "epoch": 397} {"train_loss": -19.3901309967041, "global_step": 33013, "epoch": 397} {"train_loss": -18.713254928588867, "global_step": 33014, "epoch": 397} {"train_loss": -19.058349609375, "global_step": 33015, "epoch": 397} {"train_loss": -18.85616111755371, "global_step": 33016, "epoch": 397} {"train_loss": -19.302963256835938, "global_step": 33017, "epoch": 397} {"train_loss": -19.063398361206055, "global_step": 33018, "epoch": 397} {"train_loss": -19.126638412475586, "global_step": 33019, "epoch": 397} {"train_loss": -19.312559127807617, "global_step": 33020, "epoch": 397} {"train_loss": -18.979412078857422, "global_step": 33021, "epoch": 397} {"train_loss": -18.835037231445312, "global_step": 33022, "epoch": 397} {"train_loss": -19.05843734741211, "global_step": 33023, "epoch": 397} {"train_loss": -19.295825958251953, "global_step": 33024, "epoch": 397} {"train_loss": -18.988065719604492, "global_step": 33025, "epoch": 397} {"train_loss": -19.048608779907227, "global_step": 33026, "epoch": 397} {"train_loss": -18.805288314819336, "global_step": 33027, "epoch": 397} {"train_loss": -19.102327346801758, "global_step": 33028, "epoch": 397} {"train_loss": -18.823394775390625, "global_step": 33029, "epoch": 397} {"train_loss": -19.010400772094727, "global_step": 33030, "epoch": 397} {"train_loss": -19.029285430908203, "global_step": 33031, "epoch": 397} {"train_loss": -19.121347427368164, "global_step": 33032, "epoch": 397} {"train_loss": -19.066717630409332, "global_step": 33033, "epoch": 397, "val_loss": 6001390.5} {"train_loss": -18.659015655517578, "global_step": 33034, "epoch": 398} {"train_loss": -18.814294815063477, "global_step": 33035, "epoch": 398} {"train_loss": -19.011083602905273, "global_step": 33036, "epoch": 398} {"train_loss": -18.741031646728516, "global_step": 33037, "epoch": 398} {"train_loss": -18.762086868286133, "global_step": 33038, "epoch": 398} {"train_loss": -18.8061580657959, "global_step": 33039, "epoch": 398} {"train_loss": -18.676225662231445, "global_step": 33040, "epoch": 398} {"train_loss": -18.950231552124023, "global_step": 33041, "epoch": 398} {"train_loss": -18.689781188964844, "global_step": 33042, "epoch": 398} {"train_loss": -18.815135955810547, "global_step": 33043, "epoch": 398} {"train_loss": -18.564655303955078, "global_step": 33044, "epoch": 398} {"train_loss": -18.89405632019043, "global_step": 33045, "epoch": 398} {"train_loss": -18.876554489135742, "global_step": 33046, "epoch": 398} {"train_loss": -18.837827682495117, "global_step": 33047, "epoch": 398} {"train_loss": -19.175168991088867, "global_step": 33048, "epoch": 398} {"train_loss": -18.804731369018555, "global_step": 33049, "epoch": 398} {"train_loss": -19.009687423706055, "global_step": 33050, "epoch": 398} {"train_loss": -19.200353622436523, "global_step": 33051, "epoch": 398} {"train_loss": -19.078306198120117, "global_step": 33052, "epoch": 398} {"train_loss": -19.09334373474121, "global_step": 33053, "epoch": 398} {"train_loss": -19.24801254272461, "global_step": 33054, "epoch": 398} {"train_loss": -19.24825096130371, "global_step": 33055, "epoch": 398} {"train_loss": -19.237672805786133, "global_step": 33056, "epoch": 398} {"train_loss": -19.05847930908203, "global_step": 33057, "epoch": 398} {"train_loss": -18.895111083984375, "global_step": 33058, "epoch": 398} {"train_loss": -18.97882652282715, "global_step": 33059, "epoch": 398} {"train_loss": -19.075889587402344, "global_step": 33060, "epoch": 398} {"train_loss": -19.072528839111328, "global_step": 33061, "epoch": 398} {"train_loss": -18.734556198120117, "global_step": 33062, "epoch": 398} {"train_loss": -18.823745727539062, "global_step": 33063, "epoch": 398} {"train_loss": -19.178287506103516, "global_step": 33064, "epoch": 398} {"train_loss": -19.292612075805664, "global_step": 33065, "epoch": 398} {"train_loss": -19.276113510131836, "global_step": 33066, "epoch": 398} {"train_loss": -18.969507217407227, "global_step": 33067, "epoch": 398} {"train_loss": -18.941680908203125, "global_step": 33068, "epoch": 398} {"train_loss": -19.14707374572754, "global_step": 33069, "epoch": 398} {"train_loss": -19.25396156311035, "global_step": 33070, "epoch": 398} {"train_loss": -18.93574333190918, "global_step": 33071, "epoch": 398} {"train_loss": -19.287038803100586, "global_step": 33072, "epoch": 398} {"train_loss": -19.023983001708984, "global_step": 33073, "epoch": 398} {"train_loss": -19.31732177734375, "global_step": 33074, "epoch": 398} {"train_loss": -18.977773666381836, "global_step": 33075, "epoch": 398} {"train_loss": -19.120128631591797, "global_step": 33076, "epoch": 398} {"train_loss": -18.753332138061523, "global_step": 33077, "epoch": 398} {"train_loss": -18.927595138549805, "global_step": 33078, "epoch": 398} {"train_loss": -18.96172332763672, "global_step": 33079, "epoch": 398} {"train_loss": -19.212926864624023, "global_step": 33080, "epoch": 398} {"train_loss": -18.91216468811035, "global_step": 33081, "epoch": 398} {"train_loss": -18.94402313232422, "global_step": 33082, "epoch": 398} {"train_loss": -19.25417137145996, "global_step": 33083, "epoch": 398} {"train_loss": -19.31241226196289, "global_step": 33084, "epoch": 398} {"train_loss": -19.093996047973633, "global_step": 33085, "epoch": 398} {"train_loss": -19.14944076538086, "global_step": 33086, "epoch": 398} {"train_loss": -19.112253189086914, "global_step": 33087, "epoch": 398} {"train_loss": -19.190000534057617, "global_step": 33088, "epoch": 398} {"train_loss": -19.182580947875977, "global_step": 33089, "epoch": 398} {"train_loss": -19.26344871520996, "global_step": 33090, "epoch": 398} {"train_loss": -19.03242301940918, "global_step": 33091, "epoch": 398} {"train_loss": -19.001623153686523, "global_step": 33092, "epoch": 398} {"train_loss": -18.954294204711914, "global_step": 33093, "epoch": 398} {"train_loss": -18.846942901611328, "global_step": 33094, "epoch": 398} {"train_loss": -18.962339401245117, "global_step": 33095, "epoch": 398} {"train_loss": -19.15791893005371, "global_step": 33096, "epoch": 398} {"train_loss": -18.82073402404785, "global_step": 33097, "epoch": 398} {"train_loss": -18.95806121826172, "global_step": 33098, "epoch": 398} {"train_loss": -18.884708404541016, "global_step": 33099, "epoch": 398} {"train_loss": -18.82318687438965, "global_step": 33100, "epoch": 398} {"train_loss": -18.949493408203125, "global_step": 33101, "epoch": 398} {"train_loss": -19.151315689086914, "global_step": 33102, "epoch": 398} {"train_loss": -18.975570678710938, "global_step": 33103, "epoch": 398} {"train_loss": -19.28098487854004, "global_step": 33104, "epoch": 398} {"train_loss": -19.12661361694336, "global_step": 33105, "epoch": 398} {"train_loss": -18.975582122802734, "global_step": 33106, "epoch": 398} {"train_loss": -18.947601318359375, "global_step": 33107, "epoch": 398} {"train_loss": -19.38957977294922, "global_step": 33108, "epoch": 398} {"train_loss": -19.09391975402832, "global_step": 33109, "epoch": 398} {"train_loss": -19.283170700073242, "global_step": 33110, "epoch": 398} {"train_loss": -19.093223571777344, "global_step": 33111, "epoch": 398} {"train_loss": -19.00124168395996, "global_step": 33112, "epoch": 398} {"train_loss": -19.071182250976562, "global_step": 33113, "epoch": 398} {"train_loss": -18.7137451171875, "global_step": 33114, "epoch": 398} {"train_loss": -19.491790771484375, "global_step": 33115, "epoch": 398} {"train_loss": -19.01986841408603, "global_step": 33116, "epoch": 398, "val_loss": 5827507.0} {"train_loss": -18.575729370117188, "global_step": 33117, "epoch": 399} {"train_loss": -18.763158798217773, "global_step": 33118, "epoch": 399} {"train_loss": -18.62386131286621, "global_step": 33119, "epoch": 399} {"train_loss": -19.21540641784668, "global_step": 33120, "epoch": 399} {"train_loss": -18.816389083862305, "global_step": 33121, "epoch": 399} {"train_loss": -18.910419464111328, "global_step": 33122, "epoch": 399} {"train_loss": -18.690570831298828, "global_step": 33123, "epoch": 399} {"train_loss": -19.140567779541016, "global_step": 33124, "epoch": 399} {"train_loss": -18.41585350036621, "global_step": 33125, "epoch": 399} {"train_loss": -18.909523010253906, "global_step": 33126, "epoch": 399} {"train_loss": -18.786699295043945, "global_step": 33127, "epoch": 399} {"train_loss": -19.082508087158203, "global_step": 33128, "epoch": 399} {"train_loss": -19.114587783813477, "global_step": 33129, "epoch": 399} {"train_loss": -19.2564754486084, "global_step": 33130, "epoch": 399} {"train_loss": -18.964157104492188, "global_step": 33131, "epoch": 399} {"train_loss": -18.90837287902832, "global_step": 33132, "epoch": 399} {"train_loss": -18.61115837097168, "global_step": 33133, "epoch": 399} {"train_loss": -19.05491828918457, "global_step": 33134, "epoch": 399} {"train_loss": -18.8729190826416, "global_step": 33135, "epoch": 399} {"train_loss": -19.166688919067383, "global_step": 33136, "epoch": 399} {"train_loss": -19.331972122192383, "global_step": 33137, "epoch": 399} {"train_loss": -19.160749435424805, "global_step": 33138, "epoch": 399} {"train_loss": -19.25811195373535, "global_step": 33139, "epoch": 399} {"train_loss": -18.77790069580078, "global_step": 33140, "epoch": 399} {"train_loss": -18.95991325378418, "global_step": 33141, "epoch": 399} {"train_loss": -19.073781967163086, "global_step": 33142, "epoch": 399} {"train_loss": -18.747587203979492, "global_step": 33143, "epoch": 399} {"train_loss": -19.260234832763672, "global_step": 33144, "epoch": 399} {"train_loss": -19.340576171875, "global_step": 33145, "epoch": 399} {"train_loss": -19.381793975830078, "global_step": 33146, "epoch": 399} {"train_loss": -19.40973472595215, "global_step": 33147, "epoch": 399} {"train_loss": -18.96577262878418, "global_step": 33148, "epoch": 399} {"train_loss": -19.22191047668457, "global_step": 33149, "epoch": 399} {"train_loss": -19.062171936035156, "global_step": 33150, "epoch": 399} {"train_loss": -19.032119750976562, "global_step": 33151, "epoch": 399} {"train_loss": -19.246749877929688, "global_step": 33152, "epoch": 399} {"train_loss": -18.965099334716797, "global_step": 33153, "epoch": 399} {"train_loss": -19.51068687438965, "global_step": 33154, "epoch": 399} {"train_loss": -18.998693466186523, "global_step": 33155, "epoch": 399} {"train_loss": -18.965303421020508, "global_step": 33156, "epoch": 399} {"train_loss": -19.17660903930664, "global_step": 33157, "epoch": 399} {"train_loss": -19.28900718688965, "global_step": 33158, "epoch": 399} {"train_loss": -18.815446853637695, "global_step": 33159, "epoch": 399} {"train_loss": -19.045766830444336, "global_step": 33160, "epoch": 399} {"train_loss": -18.968976974487305, "global_step": 33161, "epoch": 399} {"train_loss": -19.2645263671875, "global_step": 33162, "epoch": 399} {"train_loss": -19.030559539794922, "global_step": 33163, "epoch": 399} {"train_loss": -19.122285842895508, "global_step": 33164, "epoch": 399} {"train_loss": -18.655288696289062, "global_step": 33165, "epoch": 399} {"train_loss": -19.384891510009766, "global_step": 33166, "epoch": 399} {"train_loss": -19.21857261657715, "global_step": 33167, "epoch": 399} {"train_loss": -18.956998825073242, "global_step": 33168, "epoch": 399} {"train_loss": -18.74421501159668, "global_step": 33169, "epoch": 399} {"train_loss": -19.293790817260742, "global_step": 33170, "epoch": 399} {"train_loss": -18.768341064453125, "global_step": 33171, "epoch": 399} {"train_loss": -18.685888290405273, "global_step": 33172, "epoch": 399} {"train_loss": -19.115148544311523, "global_step": 33173, "epoch": 399} {"train_loss": -19.06422996520996, "global_step": 33174, "epoch": 399} {"train_loss": -18.928747177124023, "global_step": 33175, "epoch": 399} {"train_loss": -19.392406463623047, "global_step": 33176, "epoch": 399} {"train_loss": -18.868436813354492, "global_step": 33177, "epoch": 399} {"train_loss": -19.11533546447754, "global_step": 33178, "epoch": 399} {"train_loss": -19.071866989135742, "global_step": 33179, "epoch": 399} {"train_loss": -19.208974838256836, "global_step": 33180, "epoch": 399} {"train_loss": -19.105775833129883, "global_step": 33181, "epoch": 399} {"train_loss": -18.786901473999023, "global_step": 33182, "epoch": 399} {"train_loss": -19.21477699279785, "global_step": 33183, "epoch": 399} {"train_loss": -19.417999267578125, "global_step": 33184, "epoch": 399} {"train_loss": -18.91351890563965, "global_step": 33185, "epoch": 399} {"train_loss": -18.938879013061523, "global_step": 33186, "epoch": 399} {"train_loss": -19.248197555541992, "global_step": 33187, "epoch": 399} {"train_loss": -19.2031192779541, "global_step": 33188, "epoch": 399} {"train_loss": -19.17388343811035, "global_step": 33189, "epoch": 399} {"train_loss": -19.0748291015625, "global_step": 33190, "epoch": 399} {"train_loss": -18.745779037475586, "global_step": 33191, "epoch": 399} {"train_loss": -18.886260986328125, "global_step": 33192, "epoch": 399} {"train_loss": -19.264211654663086, "global_step": 33193, "epoch": 399} {"train_loss": -18.872888565063477, "global_step": 33194, "epoch": 399} {"train_loss": -19.17195701599121, "global_step": 33195, "epoch": 399} {"train_loss": -19.15191078186035, "global_step": 33196, "epoch": 399} {"train_loss": -19.110273361206055, "global_step": 33197, "epoch": 399} {"train_loss": -19.36948585510254, "global_step": 33198, "epoch": 399} {"train_loss": -19.05197568686612, "global_step": 33199, "epoch": 399, "val_loss": 6030154.0} {"train_loss": -18.817087173461914, "global_step": 33200, "epoch": 400} {"train_loss": -19.067432403564453, "global_step": 33201, "epoch": 400} {"train_loss": -18.815963745117188, "global_step": 33202, "epoch": 400} {"train_loss": -19.054479598999023, "global_step": 33203, "epoch": 400} {"train_loss": -18.9238338470459, "global_step": 33204, "epoch": 400} {"train_loss": -18.703521728515625, "global_step": 33205, "epoch": 400} {"train_loss": -18.83527946472168, "global_step": 33206, "epoch": 400} {"train_loss": -18.809377670288086, "global_step": 33207, "epoch": 400} {"train_loss": -19.081838607788086, "global_step": 33208, "epoch": 400} {"train_loss": -18.780004501342773, "global_step": 33209, "epoch": 400} {"train_loss": -18.885238647460938, "global_step": 33210, "epoch": 400} {"train_loss": -18.832841873168945, "global_step": 33211, "epoch": 400} {"train_loss": -18.922088623046875, "global_step": 33212, "epoch": 400} {"train_loss": -19.0638427734375, "global_step": 33213, "epoch": 400} {"train_loss": -19.165075302124023, "global_step": 33214, "epoch": 400} {"train_loss": -18.90494728088379, "global_step": 33215, "epoch": 400} {"train_loss": -18.702789306640625, "global_step": 33216, "epoch": 400} {"train_loss": -19.25599479675293, "global_step": 33217, "epoch": 400} {"train_loss": -18.813194274902344, "global_step": 33218, "epoch": 400} {"train_loss": -18.816085815429688, "global_step": 33219, "epoch": 400} {"train_loss": -19.006296157836914, "global_step": 33220, "epoch": 400} {"train_loss": -18.922300338745117, "global_step": 33221, "epoch": 400} {"train_loss": -19.209564208984375, "global_step": 33222, "epoch": 400} {"train_loss": -19.079397201538086, "global_step": 33223, "epoch": 400} {"train_loss": -18.99256706237793, "global_step": 33224, "epoch": 400} {"train_loss": -19.088083267211914, "global_step": 33225, "epoch": 400} {"train_loss": -18.84223747253418, "global_step": 33226, "epoch": 400} {"train_loss": -18.99735450744629, "global_step": 33227, "epoch": 400} {"train_loss": -19.20615005493164, "global_step": 33228, "epoch": 400} {"train_loss": -19.035207748413086, "global_step": 33229, "epoch": 400} {"train_loss": -19.051895141601562, "global_step": 33230, "epoch": 400} {"train_loss": -18.77939796447754, "global_step": 33231, "epoch": 400} {"train_loss": -19.043107986450195, "global_step": 33232, "epoch": 400} {"train_loss": -19.067583084106445, "global_step": 33233, "epoch": 400} {"train_loss": -19.320819854736328, "global_step": 33234, "epoch": 400} {"train_loss": -19.156225204467773, "global_step": 33235, "epoch": 400} {"train_loss": -19.1440486907959, "global_step": 33236, "epoch": 400} {"train_loss": -18.642080307006836, "global_step": 33237, "epoch": 400} {"train_loss": -19.117345809936523, "global_step": 33238, "epoch": 400} {"train_loss": -19.210906982421875, "global_step": 33239, "epoch": 400} {"train_loss": -18.99246597290039, "global_step": 33240, "epoch": 400} {"train_loss": -19.406660079956055, "global_step": 33241, "epoch": 400} {"train_loss": -19.35186004638672, "global_step": 33242, "epoch": 400} {"train_loss": -19.046003341674805, "global_step": 33243, "epoch": 400} {"train_loss": -19.18178367614746, "global_step": 33244, "epoch": 400} {"train_loss": -19.13339614868164, "global_step": 33245, "epoch": 400} {"train_loss": -19.29207420349121, "global_step": 33246, "epoch": 400} {"train_loss": -19.474075317382812, "global_step": 33247, "epoch": 400} {"train_loss": -19.080678939819336, "global_step": 33248, "epoch": 400} {"train_loss": -19.088430404663086, "global_step": 33249, "epoch": 400} {"train_loss": -18.952350616455078, "global_step": 33250, "epoch": 400} {"train_loss": -19.118331909179688, "global_step": 33251, "epoch": 400} {"train_loss": -19.25844383239746, "global_step": 33252, "epoch": 400} {"train_loss": -19.003244400024414, "global_step": 33253, "epoch": 400} {"train_loss": -19.14400863647461, "global_step": 33254, "epoch": 400} {"train_loss": -18.951623916625977, "global_step": 33255, "epoch": 400} {"train_loss": -18.789854049682617, "global_step": 33256, "epoch": 400} {"train_loss": -19.136159896850586, "global_step": 33257, "epoch": 400} {"train_loss": -19.12413787841797, "global_step": 33258, "epoch": 400} {"train_loss": -19.240375518798828, "global_step": 33259, "epoch": 400} {"train_loss": -19.375364303588867, "global_step": 33260, "epoch": 400} {"train_loss": -19.24158477783203, "global_step": 33261, "epoch": 400} {"train_loss": -19.301618576049805, "global_step": 33262, "epoch": 400} {"train_loss": -19.339923858642578, "global_step": 33263, "epoch": 400} {"train_loss": -18.886892318725586, "global_step": 33264, "epoch": 400} {"train_loss": -18.75234031677246, "global_step": 33265, "epoch": 400} {"train_loss": -18.905597686767578, "global_step": 33266, "epoch": 400} {"train_loss": -19.32684326171875, "global_step": 33267, "epoch": 400} {"train_loss": -19.47653579711914, "global_step": 33268, "epoch": 400} {"train_loss": -19.285690307617188, "global_step": 33269, "epoch": 400} {"train_loss": -19.101415634155273, "global_step": 33270, "epoch": 400} {"train_loss": -19.126220703125, "global_step": 33271, "epoch": 400} {"train_loss": -19.0789852142334, "global_step": 33272, "epoch": 400} {"train_loss": -19.3236083984375, "global_step": 33273, "epoch": 400} {"train_loss": -19.267744064331055, "global_step": 33274, "epoch": 400} {"train_loss": -19.081052780151367, "global_step": 33275, "epoch": 400} {"train_loss": -18.976810455322266, "global_step": 33276, "epoch": 400} {"train_loss": -19.21932601928711, "global_step": 33277, "epoch": 400} {"train_loss": -19.180335998535156, "global_step": 33278, "epoch": 400} {"train_loss": -19.18657875061035, "global_step": 33279, "epoch": 400} {"train_loss": -18.8753719329834, "global_step": 33280, "epoch": 400} {"train_loss": -18.973432540893555, "global_step": 33281, "epoch": 400} {"train_loss": -19.07821204863399, "global_step": 33282, "epoch": 400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.8636363636363636, "val_loss": 6000206.5} {"train_loss": -19.025535583496094, "global_step": 33283, "epoch": 401} {"train_loss": -19.418060302734375, "global_step": 33284, "epoch": 401} {"train_loss": -19.25790786743164, "global_step": 33285, "epoch": 401} {"train_loss": -19.009517669677734, "global_step": 33286, "epoch": 401} {"train_loss": -19.1080265045166, "global_step": 33287, "epoch": 401} {"train_loss": -19.392681121826172, "global_step": 33288, "epoch": 401} {"train_loss": -19.05191421508789, "global_step": 33289, "epoch": 401} {"train_loss": -18.599773406982422, "global_step": 33290, "epoch": 401} {"train_loss": -19.012786865234375, "global_step": 33291, "epoch": 401} {"train_loss": -18.70155906677246, "global_step": 33292, "epoch": 401} {"train_loss": -18.898717880249023, "global_step": 33293, "epoch": 401} {"train_loss": -18.87244987487793, "global_step": 33294, "epoch": 401} {"train_loss": -19.118345260620117, "global_step": 33295, "epoch": 401} {"train_loss": -19.10005760192871, "global_step": 33296, "epoch": 401} {"train_loss": -19.23179054260254, "global_step": 33297, "epoch": 401} {"train_loss": -18.945863723754883, "global_step": 33298, "epoch": 401} {"train_loss": -19.04005241394043, "global_step": 33299, "epoch": 401} {"train_loss": -19.12384796142578, "global_step": 33300, "epoch": 401} {"train_loss": -19.054372787475586, "global_step": 33301, "epoch": 401} {"train_loss": -19.21491050720215, "global_step": 33302, "epoch": 401} {"train_loss": -18.816680908203125, "global_step": 33303, "epoch": 401} {"train_loss": -19.2159366607666, "global_step": 33304, "epoch": 401} {"train_loss": -19.441213607788086, "global_step": 33305, "epoch": 401} {"train_loss": -19.442855834960938, "global_step": 33306, "epoch": 401} {"train_loss": -18.993276596069336, "global_step": 33307, "epoch": 401} {"train_loss": -19.09210777282715, "global_step": 33308, "epoch": 401} {"train_loss": -19.108381271362305, "global_step": 33309, "epoch": 401} {"train_loss": -18.669025421142578, "global_step": 33310, "epoch": 401} {"train_loss": -19.208005905151367, "global_step": 33311, "epoch": 401} {"train_loss": -18.989612579345703, "global_step": 33312, "epoch": 401} {"train_loss": -19.444263458251953, "global_step": 33313, "epoch": 401} {"train_loss": -19.352027893066406, "global_step": 33314, "epoch": 401} {"train_loss": -19.13226890563965, "global_step": 33315, "epoch": 401} {"train_loss": -19.129892349243164, "global_step": 33316, "epoch": 401} {"train_loss": -19.22315788269043, "global_step": 33317, "epoch": 401} {"train_loss": -19.242483139038086, "global_step": 33318, "epoch": 401} {"train_loss": -18.9913272857666, "global_step": 33319, "epoch": 401} {"train_loss": -18.505956649780273, "global_step": 33320, "epoch": 401} {"train_loss": -18.68497085571289, "global_step": 33321, "epoch": 401} {"train_loss": -19.090246200561523, "global_step": 33322, "epoch": 401} {"train_loss": -18.87021255493164, "global_step": 33323, "epoch": 401} {"train_loss": -18.883508682250977, "global_step": 33324, "epoch": 401} {"train_loss": -18.79426383972168, "global_step": 33325, "epoch": 401} {"train_loss": -18.882234573364258, "global_step": 33326, "epoch": 401} {"train_loss": -18.856348037719727, "global_step": 33327, "epoch": 401} {"train_loss": -19.594722747802734, "global_step": 33328, "epoch": 401} {"train_loss": -19.14554786682129, "global_step": 33329, "epoch": 401} {"train_loss": -19.124267578125, "global_step": 33330, "epoch": 401} {"train_loss": -19.197433471679688, "global_step": 33331, "epoch": 401} {"train_loss": -19.411039352416992, "global_step": 33332, "epoch": 401} {"train_loss": -18.837108612060547, "global_step": 33333, "epoch": 401} {"train_loss": -19.11293601989746, "global_step": 33334, "epoch": 401} {"train_loss": -18.920087814331055, "global_step": 33335, "epoch": 401} {"train_loss": -18.962779998779297, "global_step": 33336, "epoch": 401} {"train_loss": -19.484384536743164, "global_step": 33337, "epoch": 401} {"train_loss": -19.060476303100586, "global_step": 33338, "epoch": 401} {"train_loss": -18.61478042602539, "global_step": 33339, "epoch": 401} {"train_loss": -18.851301193237305, "global_step": 33340, "epoch": 401} {"train_loss": -18.903614044189453, "global_step": 33341, "epoch": 401} {"train_loss": -19.16524314880371, "global_step": 33342, "epoch": 401} {"train_loss": -19.335044860839844, "global_step": 33343, "epoch": 401} {"train_loss": -19.39569854736328, "global_step": 33344, "epoch": 401} {"train_loss": -19.109872817993164, "global_step": 33345, "epoch": 401} {"train_loss": -19.083602905273438, "global_step": 33346, "epoch": 401} {"train_loss": -18.742048263549805, "global_step": 33347, "epoch": 401} {"train_loss": -19.153793334960938, "global_step": 33348, "epoch": 401} {"train_loss": -19.104358673095703, "global_step": 33349, "epoch": 401} {"train_loss": -19.39206314086914, "global_step": 33350, "epoch": 401} {"train_loss": -18.927078247070312, "global_step": 33351, "epoch": 401} {"train_loss": -19.16457748413086, "global_step": 33352, "epoch": 401} {"train_loss": -19.195884704589844, "global_step": 33353, "epoch": 401} {"train_loss": -19.159244537353516, "global_step": 33354, "epoch": 401} {"train_loss": -19.267196655273438, "global_step": 33355, "epoch": 401} {"train_loss": -19.224889755249023, "global_step": 33356, "epoch": 401} {"train_loss": -19.32431983947754, "global_step": 33357, "epoch": 401} {"train_loss": -19.016550064086914, "global_step": 33358, "epoch": 401} {"train_loss": -19.21242332458496, "global_step": 33359, "epoch": 401} {"train_loss": -19.2904109954834, "global_step": 33360, "epoch": 401} {"train_loss": -19.170522689819336, "global_step": 33361, "epoch": 401} {"train_loss": -19.27423095703125, "global_step": 33362, "epoch": 401} {"train_loss": -19.2334041595459, "global_step": 33363, "epoch": 401} {"train_loss": -19.079797744750977, "global_step": 33364, "epoch": 401} {"train_loss": -19.087980224425536, "global_step": 33365, "epoch": 401, "val_loss": 6000368.0} {"train_loss": -18.966405868530273, "global_step": 33366, "epoch": 402} {"train_loss": -19.15083885192871, "global_step": 33367, "epoch": 402} {"train_loss": -18.96949577331543, "global_step": 33368, "epoch": 402} {"train_loss": -19.199323654174805, "global_step": 33369, "epoch": 402} {"train_loss": -19.05870819091797, "global_step": 33370, "epoch": 402} {"train_loss": -18.7852840423584, "global_step": 33371, "epoch": 402} {"train_loss": -19.052106857299805, "global_step": 33372, "epoch": 402} {"train_loss": -19.069486618041992, "global_step": 33373, "epoch": 402} {"train_loss": -19.2171688079834, "global_step": 33374, "epoch": 402} {"train_loss": -19.2619571685791, "global_step": 33375, "epoch": 402} {"train_loss": -19.250085830688477, "global_step": 33376, "epoch": 402} {"train_loss": -18.677213668823242, "global_step": 33377, "epoch": 402} {"train_loss": -19.471508026123047, "global_step": 33378, "epoch": 402} {"train_loss": -18.98569679260254, "global_step": 33379, "epoch": 402} {"train_loss": -19.17440414428711, "global_step": 33380, "epoch": 402} {"train_loss": -18.981348037719727, "global_step": 33381, "epoch": 402} {"train_loss": -19.286954879760742, "global_step": 33382, "epoch": 402} {"train_loss": -18.741806030273438, "global_step": 33383, "epoch": 402} {"train_loss": -19.059926986694336, "global_step": 33384, "epoch": 402} {"train_loss": -19.336889266967773, "global_step": 33385, "epoch": 402} {"train_loss": -18.97735595703125, "global_step": 33386, "epoch": 402} {"train_loss": -19.010347366333008, "global_step": 33387, "epoch": 402} {"train_loss": -19.290374755859375, "global_step": 33388, "epoch": 402} {"train_loss": -19.077238082885742, "global_step": 33389, "epoch": 402} {"train_loss": -19.104795455932617, "global_step": 33390, "epoch": 402} {"train_loss": -18.934093475341797, "global_step": 33391, "epoch": 402} {"train_loss": -18.904157638549805, "global_step": 33392, "epoch": 402} {"train_loss": -18.781879425048828, "global_step": 33393, "epoch": 402} {"train_loss": -18.864578247070312, "global_step": 33394, "epoch": 402} {"train_loss": -19.116743087768555, "global_step": 33395, "epoch": 402} {"train_loss": -18.960660934448242, "global_step": 33396, "epoch": 402} {"train_loss": -18.731016159057617, "global_step": 33397, "epoch": 402} {"train_loss": -18.881183624267578, "global_step": 33398, "epoch": 402} {"train_loss": -19.228702545166016, "global_step": 33399, "epoch": 402} {"train_loss": -19.187042236328125, "global_step": 33400, "epoch": 402} {"train_loss": -19.055591583251953, "global_step": 33401, "epoch": 402} {"train_loss": -19.26651954650879, "global_step": 33402, "epoch": 402} {"train_loss": -19.20108985900879, "global_step": 33403, "epoch": 402} {"train_loss": -18.917940139770508, "global_step": 33404, "epoch": 402} {"train_loss": -18.979970932006836, "global_step": 33405, "epoch": 402} {"train_loss": -18.72510528564453, "global_step": 33406, "epoch": 402} {"train_loss": -19.07411003112793, "global_step": 33407, "epoch": 402} {"train_loss": -19.405414581298828, "global_step": 33408, "epoch": 402} {"train_loss": -19.080602645874023, "global_step": 33409, "epoch": 402} {"train_loss": -19.36716079711914, "global_step": 33410, "epoch": 402} {"train_loss": -18.941492080688477, "global_step": 33411, "epoch": 402} {"train_loss": -19.192407608032227, "global_step": 33412, "epoch": 402} {"train_loss": -19.097883224487305, "global_step": 33413, "epoch": 402} {"train_loss": -19.274429321289062, "global_step": 33414, "epoch": 402} {"train_loss": -19.556901931762695, "global_step": 33415, "epoch": 402} {"train_loss": -19.123510360717773, "global_step": 33416, "epoch": 402} {"train_loss": -19.206872940063477, "global_step": 33417, "epoch": 402} {"train_loss": -19.49928855895996, "global_step": 33418, "epoch": 402} {"train_loss": -19.08434295654297, "global_step": 33419, "epoch": 402} {"train_loss": -18.977031707763672, "global_step": 33420, "epoch": 402} {"train_loss": -19.50231170654297, "global_step": 33421, "epoch": 402} {"train_loss": -19.046924591064453, "global_step": 33422, "epoch": 402} {"train_loss": -19.220928192138672, "global_step": 33423, "epoch": 402} {"train_loss": -19.423219680786133, "global_step": 33424, "epoch": 402} {"train_loss": -19.37314796447754, "global_step": 33425, "epoch": 402} {"train_loss": -19.1596622467041, "global_step": 33426, "epoch": 402} {"train_loss": -19.030654907226562, "global_step": 33427, "epoch": 402} {"train_loss": -19.184728622436523, "global_step": 33428, "epoch": 402} {"train_loss": -19.256637573242188, "global_step": 33429, "epoch": 402} {"train_loss": -19.176895141601562, "global_step": 33430, "epoch": 402} {"train_loss": -19.175256729125977, "global_step": 33431, "epoch": 402} {"train_loss": -19.293346405029297, "global_step": 33432, "epoch": 402} {"train_loss": -19.15962028503418, "global_step": 33433, "epoch": 402} {"train_loss": -18.959156036376953, "global_step": 33434, "epoch": 402} {"train_loss": -19.2857666015625, "global_step": 33435, "epoch": 402} {"train_loss": -18.795835494995117, "global_step": 33436, "epoch": 402} {"train_loss": -19.136987686157227, "global_step": 33437, "epoch": 402} {"train_loss": -19.557769775390625, "global_step": 33438, "epoch": 402} {"train_loss": -19.04983901977539, "global_step": 33439, "epoch": 402} {"train_loss": -19.111570358276367, "global_step": 33440, "epoch": 402} {"train_loss": -18.680116653442383, "global_step": 33441, "epoch": 402} {"train_loss": -18.895862579345703, "global_step": 33442, "epoch": 402} {"train_loss": -19.16425323486328, "global_step": 33443, "epoch": 402} {"train_loss": -19.429929733276367, "global_step": 33444, "epoch": 402} {"train_loss": -19.33760643005371, "global_step": 33445, "epoch": 402} {"train_loss": -18.797475814819336, "global_step": 33446, "epoch": 402} {"train_loss": -19.065731048583984, "global_step": 33447, "epoch": 402} {"train_loss": -19.10463850182223, "global_step": 33448, "epoch": 402, "val_loss": 6040730.5} {"train_loss": -18.94452476501465, "global_step": 33449, "epoch": 403} {"train_loss": -18.88445281982422, "global_step": 33450, "epoch": 403} {"train_loss": -18.743762969970703, "global_step": 33451, "epoch": 403} {"train_loss": -18.870676040649414, "global_step": 33452, "epoch": 403} {"train_loss": -19.473499298095703, "global_step": 33453, "epoch": 403} {"train_loss": -19.02286720275879, "global_step": 33454, "epoch": 403} {"train_loss": -18.947723388671875, "global_step": 33455, "epoch": 403} {"train_loss": -19.414270401000977, "global_step": 33456, "epoch": 403} {"train_loss": -18.92831802368164, "global_step": 33457, "epoch": 403} {"train_loss": -19.128753662109375, "global_step": 33458, "epoch": 403} {"train_loss": -18.685243606567383, "global_step": 33459, "epoch": 403} {"train_loss": -19.249828338623047, "global_step": 33460, "epoch": 403} {"train_loss": -18.713382720947266, "global_step": 33461, "epoch": 403} {"train_loss": -19.19816017150879, "global_step": 33462, "epoch": 403} {"train_loss": -19.40602684020996, "global_step": 33463, "epoch": 403} {"train_loss": -18.804540634155273, "global_step": 33464, "epoch": 403} {"train_loss": -19.080026626586914, "global_step": 33465, "epoch": 403} {"train_loss": -19.264474868774414, "global_step": 33466, "epoch": 403} {"train_loss": -19.439104080200195, "global_step": 33467, "epoch": 403} {"train_loss": -19.060596466064453, "global_step": 33468, "epoch": 403} {"train_loss": -19.032691955566406, "global_step": 33469, "epoch": 403} {"train_loss": -19.113113403320312, "global_step": 33470, "epoch": 403} {"train_loss": -19.40606689453125, "global_step": 33471, "epoch": 403} {"train_loss": -19.228225708007812, "global_step": 33472, "epoch": 403} {"train_loss": -18.9314022064209, "global_step": 33473, "epoch": 403} {"train_loss": -19.568538665771484, "global_step": 33474, "epoch": 403} {"train_loss": -19.244333267211914, "global_step": 33475, "epoch": 403} {"train_loss": -18.718366622924805, "global_step": 33476, "epoch": 403} {"train_loss": -18.84321403503418, "global_step": 33477, "epoch": 403} {"train_loss": -18.914623260498047, "global_step": 33478, "epoch": 403} {"train_loss": -18.929363250732422, "global_step": 33479, "epoch": 403} {"train_loss": -19.220396041870117, "global_step": 33480, "epoch": 403} {"train_loss": -19.421903610229492, "global_step": 33481, "epoch": 403} {"train_loss": -18.980026245117188, "global_step": 33482, "epoch": 403} {"train_loss": -18.95594596862793, "global_step": 33483, "epoch": 403} {"train_loss": -19.10040283203125, "global_step": 33484, "epoch": 403} {"train_loss": -19.008743286132812, "global_step": 33485, "epoch": 403} {"train_loss": -19.07596778869629, "global_step": 33486, "epoch": 403} {"train_loss": -19.313899993896484, "global_step": 33487, "epoch": 403} {"train_loss": -19.126672744750977, "global_step": 33488, "epoch": 403} {"train_loss": -19.2886962890625, "global_step": 33489, "epoch": 403} {"train_loss": -19.260746002197266, "global_step": 33490, "epoch": 403} {"train_loss": -19.252716064453125, "global_step": 33491, "epoch": 403} {"train_loss": -19.298736572265625, "global_step": 33492, "epoch": 403} {"train_loss": -19.2258358001709, "global_step": 33493, "epoch": 403} {"train_loss": -19.349096298217773, "global_step": 33494, "epoch": 403} {"train_loss": -19.388608932495117, "global_step": 33495, "epoch": 403} {"train_loss": -19.585630416870117, "global_step": 33496, "epoch": 403} {"train_loss": -19.20989990234375, "global_step": 33497, "epoch": 403} {"train_loss": -18.9864501953125, "global_step": 33498, "epoch": 403} {"train_loss": -19.510602951049805, "global_step": 33499, "epoch": 403} {"train_loss": -19.36208152770996, "global_step": 33500, "epoch": 403} {"train_loss": -19.38861656188965, "global_step": 33501, "epoch": 403} {"train_loss": -18.98630142211914, "global_step": 33502, "epoch": 403} {"train_loss": -19.260608673095703, "global_step": 33503, "epoch": 403} {"train_loss": -19.17096710205078, "global_step": 33504, "epoch": 403} {"train_loss": -19.468202590942383, "global_step": 33505, "epoch": 403} {"train_loss": -18.74021339416504, "global_step": 33506, "epoch": 403} {"train_loss": -19.213159561157227, "global_step": 33507, "epoch": 403} {"train_loss": -19.036943435668945, "global_step": 33508, "epoch": 403} {"train_loss": -19.56247329711914, "global_step": 33509, "epoch": 403} {"train_loss": -18.96091651916504, "global_step": 33510, "epoch": 403} {"train_loss": -18.96433448791504, "global_step": 33511, "epoch": 403} {"train_loss": -18.97114372253418, "global_step": 33512, "epoch": 403} {"train_loss": -18.62428855895996, "global_step": 33513, "epoch": 403} {"train_loss": -18.874755859375, "global_step": 33514, "epoch": 403} {"train_loss": -19.084333419799805, "global_step": 33515, "epoch": 403} {"train_loss": -19.203582763671875, "global_step": 33516, "epoch": 403} {"train_loss": -19.114439010620117, "global_step": 33517, "epoch": 403} {"train_loss": -18.93924331665039, "global_step": 33518, "epoch": 403} {"train_loss": -19.24411964416504, "global_step": 33519, "epoch": 403} {"train_loss": -18.952688217163086, "global_step": 33520, "epoch": 403} {"train_loss": -19.167194366455078, "global_step": 33521, "epoch": 403} {"train_loss": -18.999481201171875, "global_step": 33522, "epoch": 403} {"train_loss": -18.964099884033203, "global_step": 33523, "epoch": 403} {"train_loss": -19.057880401611328, "global_step": 33524, "epoch": 403} {"train_loss": -19.30280876159668, "global_step": 33525, "epoch": 403} {"train_loss": -18.8983154296875, "global_step": 33526, "epoch": 403} {"train_loss": -19.60202980041504, "global_step": 33527, "epoch": 403} {"train_loss": -18.931625366210938, "global_step": 33528, "epoch": 403} {"train_loss": -19.211917877197266, "global_step": 33529, "epoch": 403} {"train_loss": -19.070371627807617, "global_step": 33530, "epoch": 403} {"train_loss": -19.108495160757776, "global_step": 33531, "epoch": 403, "val_loss": 5999680.5} {"train_loss": -19.221860885620117, "global_step": 33532, "epoch": 404} {"train_loss": -18.516708374023438, "global_step": 33533, "epoch": 404} {"train_loss": -19.339853286743164, "global_step": 33534, "epoch": 404} {"train_loss": -18.955713272094727, "global_step": 33535, "epoch": 404} {"train_loss": -18.860288619995117, "global_step": 33536, "epoch": 404} {"train_loss": -18.86384391784668, "global_step": 33537, "epoch": 404} {"train_loss": -19.009885787963867, "global_step": 33538, "epoch": 404} {"train_loss": -18.52066993713379, "global_step": 33539, "epoch": 404} {"train_loss": -18.885534286499023, "global_step": 33540, "epoch": 404} {"train_loss": -19.238128662109375, "global_step": 33541, "epoch": 404} {"train_loss": -18.9234561920166, "global_step": 33542, "epoch": 404} {"train_loss": -19.39396858215332, "global_step": 33543, "epoch": 404} {"train_loss": -18.84895133972168, "global_step": 33544, "epoch": 404} {"train_loss": -19.096439361572266, "global_step": 33545, "epoch": 404} {"train_loss": -18.996610641479492, "global_step": 33546, "epoch": 404} {"train_loss": -19.37059211730957, "global_step": 33547, "epoch": 404} {"train_loss": -19.06918716430664, "global_step": 33548, "epoch": 404} {"train_loss": -19.15484619140625, "global_step": 33549, "epoch": 404} {"train_loss": -19.15157127380371, "global_step": 33550, "epoch": 404} {"train_loss": -18.977323532104492, "global_step": 33551, "epoch": 404} {"train_loss": -18.964248657226562, "global_step": 33552, "epoch": 404} {"train_loss": -18.899267196655273, "global_step": 33553, "epoch": 404} {"train_loss": -18.83344841003418, "global_step": 33554, "epoch": 404} {"train_loss": -19.165536880493164, "global_step": 33555, "epoch": 404} {"train_loss": -18.84742546081543, "global_step": 33556, "epoch": 404} {"train_loss": -19.33580207824707, "global_step": 33557, "epoch": 404} {"train_loss": -19.1741886138916, "global_step": 33558, "epoch": 404} {"train_loss": -19.327009201049805, "global_step": 33559, "epoch": 404} {"train_loss": -19.390546798706055, "global_step": 33560, "epoch": 404} {"train_loss": -19.08063316345215, "global_step": 33561, "epoch": 404} {"train_loss": -19.11775016784668, "global_step": 33562, "epoch": 404} {"train_loss": -18.969266891479492, "global_step": 33563, "epoch": 404} {"train_loss": -19.043806076049805, "global_step": 33564, "epoch": 404} {"train_loss": -19.042490005493164, "global_step": 33565, "epoch": 404} {"train_loss": -19.155902862548828, "global_step": 33566, "epoch": 404} {"train_loss": -19.266416549682617, "global_step": 33567, "epoch": 404} {"train_loss": -19.327817916870117, "global_step": 33568, "epoch": 404} {"train_loss": -19.489501953125, "global_step": 33569, "epoch": 404} {"train_loss": -18.9921932220459, "global_step": 33570, "epoch": 404} {"train_loss": -19.430301666259766, "global_step": 33571, "epoch": 404} {"train_loss": -19.231653213500977, "global_step": 33572, "epoch": 404} {"train_loss": -19.18940544128418, "global_step": 33573, "epoch": 404} {"train_loss": -18.940086364746094, "global_step": 33574, "epoch": 404} {"train_loss": -19.25649070739746, "global_step": 33575, "epoch": 404} {"train_loss": -19.00554847717285, "global_step": 33576, "epoch": 404} {"train_loss": -19.391637802124023, "global_step": 33577, "epoch": 404} {"train_loss": -19.04743194580078, "global_step": 33578, "epoch": 404} {"train_loss": -19.006744384765625, "global_step": 33579, "epoch": 404} {"train_loss": -19.23581886291504, "global_step": 33580, "epoch": 404} {"train_loss": -19.367517471313477, "global_step": 33581, "epoch": 404} {"train_loss": -19.13760757446289, "global_step": 33582, "epoch": 404} {"train_loss": -19.24061393737793, "global_step": 33583, "epoch": 404} {"train_loss": -19.16757583618164, "global_step": 33584, "epoch": 404} {"train_loss": -19.300016403198242, "global_step": 33585, "epoch": 404} {"train_loss": -19.102439880371094, "global_step": 33586, "epoch": 404} {"train_loss": -19.122772216796875, "global_step": 33587, "epoch": 404} {"train_loss": -19.506610870361328, "global_step": 33588, "epoch": 404} {"train_loss": -19.06406021118164, "global_step": 33589, "epoch": 404} {"train_loss": -19.099706649780273, "global_step": 33590, "epoch": 404} {"train_loss": -19.555145263671875, "global_step": 33591, "epoch": 404} {"train_loss": -18.88939666748047, "global_step": 33592, "epoch": 404} {"train_loss": -18.855161666870117, "global_step": 33593, "epoch": 404} {"train_loss": -19.539350509643555, "global_step": 33594, "epoch": 404} {"train_loss": -19.10796356201172, "global_step": 33595, "epoch": 404} {"train_loss": -19.162418365478516, "global_step": 33596, "epoch": 404} {"train_loss": -18.82161521911621, "global_step": 33597, "epoch": 404} {"train_loss": -19.202571868896484, "global_step": 33598, "epoch": 404} {"train_loss": -19.078472137451172, "global_step": 33599, "epoch": 404} {"train_loss": -19.120086669921875, "global_step": 33600, "epoch": 404} {"train_loss": -19.271699905395508, "global_step": 33601, "epoch": 404} {"train_loss": -18.93284034729004, "global_step": 33602, "epoch": 404} {"train_loss": -19.305377960205078, "global_step": 33603, "epoch": 404} {"train_loss": -19.348722457885742, "global_step": 33604, "epoch": 404} {"train_loss": -18.97431755065918, "global_step": 33605, "epoch": 404} {"train_loss": -19.29152488708496, "global_step": 33606, "epoch": 404} {"train_loss": -19.010557174682617, "global_step": 33607, "epoch": 404} {"train_loss": -19.356969833374023, "global_step": 33608, "epoch": 404} {"train_loss": -19.03822135925293, "global_step": 33609, "epoch": 404} {"train_loss": -19.26962661743164, "global_step": 33610, "epoch": 404} {"train_loss": -19.289487838745117, "global_step": 33611, "epoch": 404} {"train_loss": -19.222864151000977, "global_step": 33612, "epoch": 404} {"train_loss": -19.67245101928711, "global_step": 33613, "epoch": 404} {"train_loss": -19.139871045767542, "global_step": 33614, "epoch": 404, "val_loss": 5922075.0} {"train_loss": -19.071914672851562, "global_step": 33615, "epoch": 405} {"train_loss": -19.314043045043945, "global_step": 33616, "epoch": 405} {"train_loss": -19.04513931274414, "global_step": 33617, "epoch": 405} {"train_loss": -19.639606475830078, "global_step": 33618, "epoch": 405} {"train_loss": -18.90492820739746, "global_step": 33619, "epoch": 405} {"train_loss": -18.82234001159668, "global_step": 33620, "epoch": 405} {"train_loss": -18.9697322845459, "global_step": 33621, "epoch": 405} {"train_loss": -18.9841251373291, "global_step": 33622, "epoch": 405} {"train_loss": -19.090465545654297, "global_step": 33623, "epoch": 405} {"train_loss": -19.20485496520996, "global_step": 33624, "epoch": 405} {"train_loss": -19.039947509765625, "global_step": 33625, "epoch": 405} {"train_loss": -18.933917999267578, "global_step": 33626, "epoch": 405} {"train_loss": -19.28937339782715, "global_step": 33627, "epoch": 405} {"train_loss": -19.233808517456055, "global_step": 33628, "epoch": 405} {"train_loss": -18.855350494384766, "global_step": 33629, "epoch": 405} {"train_loss": -19.285470962524414, "global_step": 33630, "epoch": 405} {"train_loss": -19.040929794311523, "global_step": 33631, "epoch": 405} {"train_loss": -19.226898193359375, "global_step": 33632, "epoch": 405} {"train_loss": -19.434720993041992, "global_step": 33633, "epoch": 405} {"train_loss": -19.125263214111328, "global_step": 33634, "epoch": 405} {"train_loss": -19.000707626342773, "global_step": 33635, "epoch": 405} {"train_loss": -18.79941177368164, "global_step": 33636, "epoch": 405} {"train_loss": -19.426794052124023, "global_step": 33637, "epoch": 405} {"train_loss": -18.75820541381836, "global_step": 33638, "epoch": 405} {"train_loss": -19.305118560791016, "global_step": 33639, "epoch": 405} {"train_loss": -19.16993522644043, "global_step": 33640, "epoch": 405} {"train_loss": -18.8642520904541, "global_step": 33641, "epoch": 405} {"train_loss": -19.398950576782227, "global_step": 33642, "epoch": 405} {"train_loss": -19.451587677001953, "global_step": 33643, "epoch": 405} {"train_loss": -19.05621910095215, "global_step": 33644, "epoch": 405} {"train_loss": -19.293241500854492, "global_step": 33645, "epoch": 405} {"train_loss": -19.473308563232422, "global_step": 33646, "epoch": 405} {"train_loss": -18.88453483581543, "global_step": 33647, "epoch": 405} {"train_loss": -19.610733032226562, "global_step": 33648, "epoch": 405} {"train_loss": -18.806869506835938, "global_step": 33649, "epoch": 405} {"train_loss": -19.07910919189453, "global_step": 33650, "epoch": 405} {"train_loss": -18.846210479736328, "global_step": 33651, "epoch": 405} {"train_loss": -18.84827423095703, "global_step": 33652, "epoch": 405} {"train_loss": -19.1198673248291, "global_step": 33653, "epoch": 405} {"train_loss": -18.974040985107422, "global_step": 33654, "epoch": 405} {"train_loss": -19.054672241210938, "global_step": 33655, "epoch": 405} {"train_loss": -19.232410430908203, "global_step": 33656, "epoch": 405} {"train_loss": -19.096418380737305, "global_step": 33657, "epoch": 405} {"train_loss": -19.145231246948242, "global_step": 33658, "epoch": 405} {"train_loss": -18.948455810546875, "global_step": 33659, "epoch": 405} {"train_loss": -19.13376808166504, "global_step": 33660, "epoch": 405} {"train_loss": -18.866687774658203, "global_step": 33661, "epoch": 405} {"train_loss": -19.31236457824707, "global_step": 33662, "epoch": 405} {"train_loss": -19.484716415405273, "global_step": 33663, "epoch": 405} {"train_loss": -19.030353546142578, "global_step": 33664, "epoch": 405} {"train_loss": -18.97568130493164, "global_step": 33665, "epoch": 405} {"train_loss": -19.170656204223633, "global_step": 33666, "epoch": 405} {"train_loss": -18.927566528320312, "global_step": 33667, "epoch": 405} {"train_loss": -19.134796142578125, "global_step": 33668, "epoch": 405} {"train_loss": -18.800077438354492, "global_step": 33669, "epoch": 405} {"train_loss": -19.05014991760254, "global_step": 33670, "epoch": 405} {"train_loss": -19.028566360473633, "global_step": 33671, "epoch": 405} {"train_loss": -19.077606201171875, "global_step": 33672, "epoch": 405} {"train_loss": -19.09856605529785, "global_step": 33673, "epoch": 405} {"train_loss": -19.300451278686523, "global_step": 33674, "epoch": 405} {"train_loss": -19.017770767211914, "global_step": 33675, "epoch": 405} {"train_loss": -18.946687698364258, "global_step": 33676, "epoch": 405} {"train_loss": -18.89496421813965, "global_step": 33677, "epoch": 405} {"train_loss": -19.33819007873535, "global_step": 33678, "epoch": 405} {"train_loss": -19.19015884399414, "global_step": 33679, "epoch": 405} {"train_loss": -18.796064376831055, "global_step": 33680, "epoch": 405} {"train_loss": -19.237279891967773, "global_step": 33681, "epoch": 405} {"train_loss": -19.086454391479492, "global_step": 33682, "epoch": 405} {"train_loss": -19.200307846069336, "global_step": 33683, "epoch": 405} {"train_loss": -18.796581268310547, "global_step": 33684, "epoch": 405} {"train_loss": -19.13810157775879, "global_step": 33685, "epoch": 405} {"train_loss": -19.337661743164062, "global_step": 33686, "epoch": 405} {"train_loss": -18.977149963378906, "global_step": 33687, "epoch": 405} {"train_loss": -19.387216567993164, "global_step": 33688, "epoch": 405} {"train_loss": -19.15519142150879, "global_step": 33689, "epoch": 405} {"train_loss": -19.369361877441406, "global_step": 33690, "epoch": 405} {"train_loss": -19.576705932617188, "global_step": 33691, "epoch": 405} {"train_loss": -18.830556869506836, "global_step": 33692, "epoch": 405} {"train_loss": -19.15985107421875, "global_step": 33693, "epoch": 405} {"train_loss": -19.269676208496094, "global_step": 33694, "epoch": 405} {"train_loss": -19.12575912475586, "global_step": 33695, "epoch": 405} {"train_loss": -19.32102394104004, "global_step": 33696, "epoch": 405} {"train_loss": -19.124528034623847, "global_step": 33697, "epoch": 405, "val_loss": 5924245.0} {"train_loss": -18.867664337158203, "global_step": 33698, "epoch": 406} {"train_loss": -19.01129913330078, "global_step": 33699, "epoch": 406} {"train_loss": -18.93306541442871, "global_step": 33700, "epoch": 406} {"train_loss": -19.473691940307617, "global_step": 33701, "epoch": 406} {"train_loss": -18.882221221923828, "global_step": 33702, "epoch": 406} {"train_loss": -18.95462417602539, "global_step": 33703, "epoch": 406} {"train_loss": -19.142486572265625, "global_step": 33704, "epoch": 406} {"train_loss": -19.140220642089844, "global_step": 33705, "epoch": 406} {"train_loss": -18.69170570373535, "global_step": 33706, "epoch": 406} {"train_loss": -19.158689498901367, "global_step": 33707, "epoch": 406} {"train_loss": -18.97694206237793, "global_step": 33708, "epoch": 406} {"train_loss": -19.346078872680664, "global_step": 33709, "epoch": 406} {"train_loss": -18.828956604003906, "global_step": 33710, "epoch": 406} {"train_loss": -18.71438217163086, "global_step": 33711, "epoch": 406} {"train_loss": -18.675247192382812, "global_step": 33712, "epoch": 406} {"train_loss": -19.070758819580078, "global_step": 33713, "epoch": 406} {"train_loss": -19.00943946838379, "global_step": 33714, "epoch": 406} {"train_loss": -18.940160751342773, "global_step": 33715, "epoch": 406} {"train_loss": -18.973169326782227, "global_step": 33716, "epoch": 406} {"train_loss": -18.88949966430664, "global_step": 33717, "epoch": 406} {"train_loss": -19.02901268005371, "global_step": 33718, "epoch": 406} {"train_loss": -18.87373924255371, "global_step": 33719, "epoch": 406} {"train_loss": -19.16324234008789, "global_step": 33720, "epoch": 406} {"train_loss": -19.04498291015625, "global_step": 33721, "epoch": 406} {"train_loss": -18.92172622680664, "global_step": 33722, "epoch": 406} {"train_loss": -18.938953399658203, "global_step": 33723, "epoch": 406} {"train_loss": -19.14569091796875, "global_step": 33724, "epoch": 406} {"train_loss": -18.78607177734375, "global_step": 33725, "epoch": 406} {"train_loss": -19.043010711669922, "global_step": 33726, "epoch": 406} {"train_loss": -19.14823341369629, "global_step": 33727, "epoch": 406} {"train_loss": -19.29730224609375, "global_step": 33728, "epoch": 406} {"train_loss": -19.159276962280273, "global_step": 33729, "epoch": 406} {"train_loss": -18.946012496948242, "global_step": 33730, "epoch": 406} {"train_loss": -19.369855880737305, "global_step": 33731, "epoch": 406} {"train_loss": -19.15821647644043, "global_step": 33732, "epoch": 406} {"train_loss": -19.262569427490234, "global_step": 33733, "epoch": 406} {"train_loss": -19.199100494384766, "global_step": 33734, "epoch": 406} {"train_loss": -19.423330307006836, "global_step": 33735, "epoch": 406} {"train_loss": -19.046545028686523, "global_step": 33736, "epoch": 406} {"train_loss": -19.12613296508789, "global_step": 33737, "epoch": 406} {"train_loss": -19.004562377929688, "global_step": 33738, "epoch": 406} {"train_loss": -19.045629501342773, "global_step": 33739, "epoch": 406} {"train_loss": -19.166711807250977, "global_step": 33740, "epoch": 406} {"train_loss": -19.4210147857666, "global_step": 33741, "epoch": 406} {"train_loss": -19.057641983032227, "global_step": 33742, "epoch": 406} {"train_loss": -19.21291160583496, "global_step": 33743, "epoch": 406} {"train_loss": -19.47311782836914, "global_step": 33744, "epoch": 406} {"train_loss": -19.07071304321289, "global_step": 33745, "epoch": 406} {"train_loss": -19.47056007385254, "global_step": 33746, "epoch": 406} {"train_loss": -19.341928482055664, "global_step": 33747, "epoch": 406} {"train_loss": -19.190139770507812, "global_step": 33748, "epoch": 406} {"train_loss": -18.768224716186523, "global_step": 33749, "epoch": 406} {"train_loss": -19.185842514038086, "global_step": 33750, "epoch": 406} {"train_loss": -19.283689498901367, "global_step": 33751, "epoch": 406} {"train_loss": -18.920528411865234, "global_step": 33752, "epoch": 406} {"train_loss": -19.44417381286621, "global_step": 33753, "epoch": 406} {"train_loss": -18.743093490600586, "global_step": 33754, "epoch": 406} {"train_loss": -19.187192916870117, "global_step": 33755, "epoch": 406} {"train_loss": -18.9226131439209, "global_step": 33756, "epoch": 406} {"train_loss": -18.89192008972168, "global_step": 33757, "epoch": 406} {"train_loss": -19.162782669067383, "global_step": 33758, "epoch": 406} {"train_loss": -18.945615768432617, "global_step": 33759, "epoch": 406} {"train_loss": -19.563539505004883, "global_step": 33760, "epoch": 406} {"train_loss": -19.200742721557617, "global_step": 33761, "epoch": 406} {"train_loss": -19.124311447143555, "global_step": 33762, "epoch": 406} {"train_loss": -19.205820083618164, "global_step": 33763, "epoch": 406} {"train_loss": -19.09535026550293, "global_step": 33764, "epoch": 406} {"train_loss": -18.9545841217041, "global_step": 33765, "epoch": 406} {"train_loss": -19.137861251831055, "global_step": 33766, "epoch": 406} {"train_loss": -19.094890594482422, "global_step": 33767, "epoch": 406} {"train_loss": -19.252471923828125, "global_step": 33768, "epoch": 406} {"train_loss": -19.381778717041016, "global_step": 33769, "epoch": 406} {"train_loss": -19.316864013671875, "global_step": 33770, "epoch": 406} {"train_loss": -19.365150451660156, "global_step": 33771, "epoch": 406} {"train_loss": -19.41316795349121, "global_step": 33772, "epoch": 406} {"train_loss": -19.066959381103516, "global_step": 33773, "epoch": 406} {"train_loss": -19.453662872314453, "global_step": 33774, "epoch": 406} {"train_loss": -19.16189956665039, "global_step": 33775, "epoch": 406} {"train_loss": -19.356544494628906, "global_step": 33776, "epoch": 406} {"train_loss": -19.21841049194336, "global_step": 33777, "epoch": 406} {"train_loss": -19.064664840698242, "global_step": 33778, "epoch": 406} {"train_loss": -19.024635314941406, "global_step": 33779, "epoch": 406} {"train_loss": -19.122220027877624, "global_step": 33780, "epoch": 406, "val_loss": 6068939.0} {"train_loss": -18.56362533569336, "global_step": 33781, "epoch": 407} {"train_loss": -18.84761619567871, "global_step": 33782, "epoch": 407} {"train_loss": -18.904630661010742, "global_step": 33783, "epoch": 407} {"train_loss": -19.205930709838867, "global_step": 33784, "epoch": 407} {"train_loss": -18.794677734375, "global_step": 33785, "epoch": 407} {"train_loss": -19.149065017700195, "global_step": 33786, "epoch": 407} {"train_loss": -19.265350341796875, "global_step": 33787, "epoch": 407} {"train_loss": -19.53563690185547, "global_step": 33788, "epoch": 407} {"train_loss": -18.71742820739746, "global_step": 33789, "epoch": 407} {"train_loss": -18.919540405273438, "global_step": 33790, "epoch": 407} {"train_loss": -18.879213333129883, "global_step": 33791, "epoch": 407} {"train_loss": -19.069705963134766, "global_step": 33792, "epoch": 407} {"train_loss": -18.897489547729492, "global_step": 33793, "epoch": 407} {"train_loss": -18.936086654663086, "global_step": 33794, "epoch": 407} {"train_loss": -19.29625129699707, "global_step": 33795, "epoch": 407} {"train_loss": -18.823152542114258, "global_step": 33796, "epoch": 407} {"train_loss": -19.369707107543945, "global_step": 33797, "epoch": 407} {"train_loss": -18.82769775390625, "global_step": 33798, "epoch": 407} {"train_loss": -19.025571823120117, "global_step": 33799, "epoch": 407} {"train_loss": -18.919157028198242, "global_step": 33800, "epoch": 407} {"train_loss": -19.09720230102539, "global_step": 33801, "epoch": 407} {"train_loss": -19.08982276916504, "global_step": 33802, "epoch": 407} {"train_loss": -19.779027938842773, "global_step": 33803, "epoch": 407} {"train_loss": -19.158018112182617, "global_step": 33804, "epoch": 407} {"train_loss": -18.99958610534668, "global_step": 33805, "epoch": 407} {"train_loss": -19.205289840698242, "global_step": 33806, "epoch": 407} {"train_loss": -19.133100509643555, "global_step": 33807, "epoch": 407} {"train_loss": -19.039813995361328, "global_step": 33808, "epoch": 407} {"train_loss": -19.473642349243164, "global_step": 33809, "epoch": 407} {"train_loss": -19.1780948638916, "global_step": 33810, "epoch": 407} {"train_loss": -18.855024337768555, "global_step": 33811, "epoch": 407} {"train_loss": -19.187768936157227, "global_step": 33812, "epoch": 407} {"train_loss": -19.209300994873047, "global_step": 33813, "epoch": 407} {"train_loss": -19.04397201538086, "global_step": 33814, "epoch": 407} {"train_loss": -19.31440544128418, "global_step": 33815, "epoch": 407} {"train_loss": -18.99906349182129, "global_step": 33816, "epoch": 407} {"train_loss": -19.377614974975586, "global_step": 33817, "epoch": 407} {"train_loss": -18.788671493530273, "global_step": 33818, "epoch": 407} {"train_loss": -19.369121551513672, "global_step": 33819, "epoch": 407} {"train_loss": -19.451602935791016, "global_step": 33820, "epoch": 407} {"train_loss": -19.136289596557617, "global_step": 33821, "epoch": 407} {"train_loss": -19.27954864501953, "global_step": 33822, "epoch": 407} {"train_loss": -19.45686149597168, "global_step": 33823, "epoch": 407} {"train_loss": -18.97990608215332, "global_step": 33824, "epoch": 407} {"train_loss": -19.451257705688477, "global_step": 33825, "epoch": 407} {"train_loss": -19.05954933166504, "global_step": 33826, "epoch": 407} {"train_loss": -19.369245529174805, "global_step": 33827, "epoch": 407} {"train_loss": -19.174100875854492, "global_step": 33828, "epoch": 407} {"train_loss": -19.15095329284668, "global_step": 33829, "epoch": 407} {"train_loss": -19.4306640625, "global_step": 33830, "epoch": 407} {"train_loss": -19.17506217956543, "global_step": 33831, "epoch": 407} {"train_loss": -19.492704391479492, "global_step": 33832, "epoch": 407} {"train_loss": -18.967710494995117, "global_step": 33833, "epoch": 407} {"train_loss": -19.483415603637695, "global_step": 33834, "epoch": 407} {"train_loss": -18.873340606689453, "global_step": 33835, "epoch": 407} {"train_loss": -19.117597579956055, "global_step": 33836, "epoch": 407} {"train_loss": -18.925527572631836, "global_step": 33837, "epoch": 407} {"train_loss": -19.142004013061523, "global_step": 33838, "epoch": 407} {"train_loss": -19.029193878173828, "global_step": 33839, "epoch": 407} {"train_loss": -19.327436447143555, "global_step": 33840, "epoch": 407} {"train_loss": -19.161943435668945, "global_step": 33841, "epoch": 407} {"train_loss": -19.296859741210938, "global_step": 33842, "epoch": 407} {"train_loss": -19.28676414489746, "global_step": 33843, "epoch": 407} {"train_loss": -19.030561447143555, "global_step": 33844, "epoch": 407} {"train_loss": -19.182096481323242, "global_step": 33845, "epoch": 407} {"train_loss": -19.275623321533203, "global_step": 33846, "epoch": 407} {"train_loss": -19.28572654724121, "global_step": 33847, "epoch": 407} {"train_loss": -18.92190170288086, "global_step": 33848, "epoch": 407} {"train_loss": -19.239591598510742, "global_step": 33849, "epoch": 407} {"train_loss": -18.773971557617188, "global_step": 33850, "epoch": 407} {"train_loss": -18.755477905273438, "global_step": 33851, "epoch": 407} {"train_loss": -18.930564880371094, "global_step": 33852, "epoch": 407} {"train_loss": -19.117942810058594, "global_step": 33853, "epoch": 407} {"train_loss": -18.940357208251953, "global_step": 33854, "epoch": 407} {"train_loss": -18.820951461791992, "global_step": 33855, "epoch": 407} {"train_loss": -19.2818603515625, "global_step": 33856, "epoch": 407} {"train_loss": -19.2386474609375, "global_step": 33857, "epoch": 407} {"train_loss": -18.92165184020996, "global_step": 33858, "epoch": 407} {"train_loss": -19.027854919433594, "global_step": 33859, "epoch": 407} {"train_loss": -19.563369750976562, "global_step": 33860, "epoch": 407} {"train_loss": -19.25275230407715, "global_step": 33861, "epoch": 407} {"train_loss": -18.840036392211914, "global_step": 33862, "epoch": 407} {"train_loss": -19.118568236569324, "global_step": 33863, "epoch": 407, "val_loss": 5970466.0} {"train_loss": -18.66969871520996, "global_step": 33864, "epoch": 408} {"train_loss": -18.51883316040039, "global_step": 33865, "epoch": 408} {"train_loss": -18.86865234375, "global_step": 33866, "epoch": 408} {"train_loss": -18.66765785217285, "global_step": 33867, "epoch": 408} {"train_loss": -19.170812606811523, "global_step": 33868, "epoch": 408} {"train_loss": -18.834741592407227, "global_step": 33869, "epoch": 408} {"train_loss": -18.59663200378418, "global_step": 33870, "epoch": 408} {"train_loss": -19.229490280151367, "global_step": 33871, "epoch": 408} {"train_loss": -18.819162368774414, "global_step": 33872, "epoch": 408} {"train_loss": -18.614795684814453, "global_step": 33873, "epoch": 408} {"train_loss": -18.812803268432617, "global_step": 33874, "epoch": 408} {"train_loss": -19.052021026611328, "global_step": 33875, "epoch": 408} {"train_loss": -19.103992462158203, "global_step": 33876, "epoch": 408} {"train_loss": -19.27022361755371, "global_step": 33877, "epoch": 408} {"train_loss": -19.0931339263916, "global_step": 33878, "epoch": 408} {"train_loss": -19.165203094482422, "global_step": 33879, "epoch": 408} {"train_loss": -18.72361946105957, "global_step": 33880, "epoch": 408} {"train_loss": -19.0272274017334, "global_step": 33881, "epoch": 408} {"train_loss": -19.242206573486328, "global_step": 33882, "epoch": 408} {"train_loss": -19.187482833862305, "global_step": 33883, "epoch": 408} {"train_loss": -19.085071563720703, "global_step": 33884, "epoch": 408} {"train_loss": -18.84632110595703, "global_step": 33885, "epoch": 408} {"train_loss": -19.17835807800293, "global_step": 33886, "epoch": 408} {"train_loss": -19.150291442871094, "global_step": 33887, "epoch": 408} {"train_loss": -19.01111602783203, "global_step": 33888, "epoch": 408} {"train_loss": -18.839962005615234, "global_step": 33889, "epoch": 408} {"train_loss": -19.00577735900879, "global_step": 33890, "epoch": 408} {"train_loss": -19.076379776000977, "global_step": 33891, "epoch": 408} {"train_loss": -18.873153686523438, "global_step": 33892, "epoch": 408} {"train_loss": -19.132413864135742, "global_step": 33893, "epoch": 408} {"train_loss": -19.318607330322266, "global_step": 33894, "epoch": 408} {"train_loss": -19.372854232788086, "global_step": 33895, "epoch": 408} {"train_loss": -19.255189895629883, "global_step": 33896, "epoch": 408} {"train_loss": -19.137845993041992, "global_step": 33897, "epoch": 408} {"train_loss": -19.348724365234375, "global_step": 33898, "epoch": 408} {"train_loss": -19.3198299407959, "global_step": 33899, "epoch": 408} {"train_loss": -19.133596420288086, "global_step": 33900, "epoch": 408} {"train_loss": -19.439226150512695, "global_step": 33901, "epoch": 408} {"train_loss": -19.09621238708496, "global_step": 33902, "epoch": 408} {"train_loss": -19.35985565185547, "global_step": 33903, "epoch": 408} {"train_loss": -18.737272262573242, "global_step": 33904, "epoch": 408} {"train_loss": -18.989852905273438, "global_step": 33905, "epoch": 408} {"train_loss": -18.87727928161621, "global_step": 33906, "epoch": 408} {"train_loss": -19.111862182617188, "global_step": 33907, "epoch": 408} {"train_loss": -19.076553344726562, "global_step": 33908, "epoch": 408} {"train_loss": -19.161909103393555, "global_step": 33909, "epoch": 408} {"train_loss": -19.272192001342773, "global_step": 33910, "epoch": 408} {"train_loss": -18.959339141845703, "global_step": 33911, "epoch": 408} {"train_loss": -19.153078079223633, "global_step": 33912, "epoch": 408} {"train_loss": -19.349489212036133, "global_step": 33913, "epoch": 408} {"train_loss": -19.312667846679688, "global_step": 33914, "epoch": 408} {"train_loss": -18.932783126831055, "global_step": 33915, "epoch": 408} {"train_loss": -19.200668334960938, "global_step": 33916, "epoch": 408} {"train_loss": -19.1543025970459, "global_step": 33917, "epoch": 408} {"train_loss": -19.13218879699707, "global_step": 33918, "epoch": 408} {"train_loss": -19.470834732055664, "global_step": 33919, "epoch": 408} {"train_loss": -19.415555953979492, "global_step": 33920, "epoch": 408} {"train_loss": -18.855981826782227, "global_step": 33921, "epoch": 408} {"train_loss": -19.446645736694336, "global_step": 33922, "epoch": 408} {"train_loss": -19.241865158081055, "global_step": 33923, "epoch": 408} {"train_loss": -19.448827743530273, "global_step": 33924, "epoch": 408} {"train_loss": -18.939502716064453, "global_step": 33925, "epoch": 408} {"train_loss": -19.355539321899414, "global_step": 33926, "epoch": 408} {"train_loss": -18.97128677368164, "global_step": 33927, "epoch": 408} {"train_loss": -18.972089767456055, "global_step": 33928, "epoch": 408} {"train_loss": -19.1473388671875, "global_step": 33929, "epoch": 408} {"train_loss": -19.48638153076172, "global_step": 33930, "epoch": 408} {"train_loss": -18.931644439697266, "global_step": 33931, "epoch": 408} {"train_loss": -19.21895408630371, "global_step": 33932, "epoch": 408} {"train_loss": -19.036909103393555, "global_step": 33933, "epoch": 408} {"train_loss": -19.639097213745117, "global_step": 33934, "epoch": 408} {"train_loss": -19.164880752563477, "global_step": 33935, "epoch": 408} {"train_loss": -19.246706008911133, "global_step": 33936, "epoch": 408} {"train_loss": -19.476165771484375, "global_step": 33937, "epoch": 408} {"train_loss": -18.930253982543945, "global_step": 33938, "epoch": 408} {"train_loss": -18.82472038269043, "global_step": 33939, "epoch": 408} {"train_loss": -19.165517807006836, "global_step": 33940, "epoch": 408} {"train_loss": -19.542333602905273, "global_step": 33941, "epoch": 408} {"train_loss": -19.084138870239258, "global_step": 33942, "epoch": 408} {"train_loss": -18.8082332611084, "global_step": 33943, "epoch": 408} {"train_loss": -18.962947845458984, "global_step": 33944, "epoch": 408} {"train_loss": -18.96063232421875, "global_step": 33945, "epoch": 408} {"train_loss": -19.121624291661274, "global_step": 33946, "epoch": 408, "val_loss": 6071922.5} {"train_loss": -18.65766716003418, "global_step": 33947, "epoch": 409} {"train_loss": -19.058469772338867, "global_step": 33948, "epoch": 409} {"train_loss": -18.700550079345703, "global_step": 33949, "epoch": 409} {"train_loss": -18.638851165771484, "global_step": 33950, "epoch": 409} {"train_loss": -19.01654815673828, "global_step": 33951, "epoch": 409} {"train_loss": -19.096067428588867, "global_step": 33952, "epoch": 409} {"train_loss": -19.138288497924805, "global_step": 33953, "epoch": 409} {"train_loss": -19.025249481201172, "global_step": 33954, "epoch": 409} {"train_loss": -18.927560806274414, "global_step": 33955, "epoch": 409} {"train_loss": -18.591407775878906, "global_step": 33956, "epoch": 409} {"train_loss": -18.983489990234375, "global_step": 33957, "epoch": 409} {"train_loss": -19.075178146362305, "global_step": 33958, "epoch": 409} {"train_loss": -19.08680534362793, "global_step": 33959, "epoch": 409} {"train_loss": -19.314605712890625, "global_step": 33960, "epoch": 409} {"train_loss": -18.869752883911133, "global_step": 33961, "epoch": 409} {"train_loss": -19.357900619506836, "global_step": 33962, "epoch": 409} {"train_loss": -19.187902450561523, "global_step": 33963, "epoch": 409} {"train_loss": -18.951040267944336, "global_step": 33964, "epoch": 409} {"train_loss": -19.2100772857666, "global_step": 33965, "epoch": 409} {"train_loss": -19.075428009033203, "global_step": 33966, "epoch": 409} {"train_loss": -19.03948402404785, "global_step": 33967, "epoch": 409} {"train_loss": -19.055593490600586, "global_step": 33968, "epoch": 409} {"train_loss": -19.069026947021484, "global_step": 33969, "epoch": 409} {"train_loss": -19.01447868347168, "global_step": 33970, "epoch": 409} {"train_loss": -19.197629928588867, "global_step": 33971, "epoch": 409} {"train_loss": -19.266977310180664, "global_step": 33972, "epoch": 409} {"train_loss": -19.583646774291992, "global_step": 33973, "epoch": 409} {"train_loss": -18.963768005371094, "global_step": 33974, "epoch": 409} {"train_loss": -18.782690048217773, "global_step": 33975, "epoch": 409} {"train_loss": -19.06954574584961, "global_step": 33976, "epoch": 409} {"train_loss": -19.349193572998047, "global_step": 33977, "epoch": 409} {"train_loss": -19.221153259277344, "global_step": 33978, "epoch": 409} {"train_loss": -19.078231811523438, "global_step": 33979, "epoch": 409} {"train_loss": -18.98561668395996, "global_step": 33980, "epoch": 409} {"train_loss": -19.35610008239746, "global_step": 33981, "epoch": 409} {"train_loss": -19.031465530395508, "global_step": 33982, "epoch": 409} {"train_loss": -19.044654846191406, "global_step": 33983, "epoch": 409} {"train_loss": -19.00090980529785, "global_step": 33984, "epoch": 409} {"train_loss": -19.239526748657227, "global_step": 33985, "epoch": 409} {"train_loss": -18.99764060974121, "global_step": 33986, "epoch": 409} {"train_loss": -19.18196678161621, "global_step": 33987, "epoch": 409} {"train_loss": -19.727062225341797, "global_step": 33988, "epoch": 409} {"train_loss": -18.978164672851562, "global_step": 33989, "epoch": 409} {"train_loss": -19.212209701538086, "global_step": 33990, "epoch": 409} {"train_loss": -19.029523849487305, "global_step": 33991, "epoch": 409} {"train_loss": -19.347524642944336, "global_step": 33992, "epoch": 409} {"train_loss": -19.103696823120117, "global_step": 33993, "epoch": 409} {"train_loss": -19.24525260925293, "global_step": 33994, "epoch": 409} {"train_loss": -19.685504913330078, "global_step": 33995, "epoch": 409} {"train_loss": -18.96388053894043, "global_step": 33996, "epoch": 409} {"train_loss": -19.021272659301758, "global_step": 33997, "epoch": 409} {"train_loss": -18.850772857666016, "global_step": 33998, "epoch": 409} {"train_loss": -18.362180709838867, "global_step": 33999, "epoch": 409} {"train_loss": -19.399259567260742, "global_step": 34000, "epoch": 409} {"train_loss": -19.424270629882812, "global_step": 34001, "epoch": 409} {"train_loss": -19.005298614501953, "global_step": 34002, "epoch": 409} {"train_loss": -19.016752243041992, "global_step": 34003, "epoch": 409} {"train_loss": -19.005859375, "global_step": 34004, "epoch": 409} {"train_loss": -19.343366622924805, "global_step": 34005, "epoch": 409} {"train_loss": -19.537033081054688, "global_step": 34006, "epoch": 409} {"train_loss": -19.258569717407227, "global_step": 34007, "epoch": 409} {"train_loss": -18.94451332092285, "global_step": 34008, "epoch": 409} {"train_loss": -19.086570739746094, "global_step": 34009, "epoch": 409} {"train_loss": -19.241559982299805, "global_step": 34010, "epoch": 409} {"train_loss": -18.972789764404297, "global_step": 34011, "epoch": 409} {"train_loss": -19.22284507751465, "global_step": 34012, "epoch": 409} {"train_loss": -19.16193199157715, "global_step": 34013, "epoch": 409} {"train_loss": -19.478370666503906, "global_step": 34014, "epoch": 409} {"train_loss": -19.494810104370117, "global_step": 34015, "epoch": 409} {"train_loss": -19.010103225708008, "global_step": 34016, "epoch": 409} {"train_loss": -19.188474655151367, "global_step": 34017, "epoch": 409} {"train_loss": -18.967479705810547, "global_step": 34018, "epoch": 409} {"train_loss": -19.116661071777344, "global_step": 34019, "epoch": 409} {"train_loss": -19.032833099365234, "global_step": 34020, "epoch": 409} {"train_loss": -19.07485008239746, "global_step": 34021, "epoch": 409} {"train_loss": -19.0537109375, "global_step": 34022, "epoch": 409} {"train_loss": -19.362735748291016, "global_step": 34023, "epoch": 409} {"train_loss": -19.373998641967773, "global_step": 34024, "epoch": 409} {"train_loss": -18.689361572265625, "global_step": 34025, "epoch": 409} {"train_loss": -18.86008644104004, "global_step": 34026, "epoch": 409} {"train_loss": -19.1083927154541, "global_step": 34027, "epoch": 409} {"train_loss": -19.373991012573242, "global_step": 34028, "epoch": 409} {"train_loss": -19.11118033995111, "global_step": 34029, "epoch": 409, "val_loss": 6077088.0} {"train_loss": -19.07490348815918, "global_step": 34030, "epoch": 410} {"train_loss": -19.108705520629883, "global_step": 34031, "epoch": 410} {"train_loss": -18.829458236694336, "global_step": 34032, "epoch": 410} {"train_loss": -19.088720321655273, "global_step": 34033, "epoch": 410} {"train_loss": -19.24946403503418, "global_step": 34034, "epoch": 410} {"train_loss": -19.040021896362305, "global_step": 34035, "epoch": 410} {"train_loss": -19.100156784057617, "global_step": 34036, "epoch": 410} {"train_loss": -18.778310775756836, "global_step": 34037, "epoch": 410} {"train_loss": -19.220083236694336, "global_step": 34038, "epoch": 410} {"train_loss": -19.12990379333496, "global_step": 34039, "epoch": 410} {"train_loss": -19.143774032592773, "global_step": 34040, "epoch": 410} {"train_loss": -19.111797332763672, "global_step": 34041, "epoch": 410} {"train_loss": -19.094600677490234, "global_step": 34042, "epoch": 410} {"train_loss": -19.023420333862305, "global_step": 34043, "epoch": 410} {"train_loss": -18.756811141967773, "global_step": 34044, "epoch": 410} {"train_loss": -18.994495391845703, "global_step": 34045, "epoch": 410} {"train_loss": -19.09932518005371, "global_step": 34046, "epoch": 410} {"train_loss": -19.160520553588867, "global_step": 34047, "epoch": 410} {"train_loss": -18.913799285888672, "global_step": 34048, "epoch": 410} {"train_loss": -19.01495933532715, "global_step": 34049, "epoch": 410} {"train_loss": -19.101119995117188, "global_step": 34050, "epoch": 410} {"train_loss": -18.684682846069336, "global_step": 34051, "epoch": 410} {"train_loss": -19.205223083496094, "global_step": 34052, "epoch": 410} {"train_loss": -18.874629974365234, "global_step": 34053, "epoch": 410} {"train_loss": -19.25005531311035, "global_step": 34054, "epoch": 410} {"train_loss": -19.46943473815918, "global_step": 34055, "epoch": 410} {"train_loss": -19.286428451538086, "global_step": 34056, "epoch": 410} {"train_loss": -19.155710220336914, "global_step": 34057, "epoch": 410} {"train_loss": -19.2393856048584, "global_step": 34058, "epoch": 410} {"train_loss": -19.141796112060547, "global_step": 34059, "epoch": 410} {"train_loss": -19.197004318237305, "global_step": 34060, "epoch": 410} {"train_loss": -18.910003662109375, "global_step": 34061, "epoch": 410} {"train_loss": -19.249372482299805, "global_step": 34062, "epoch": 410} {"train_loss": -19.357799530029297, "global_step": 34063, "epoch": 410} {"train_loss": -18.911968231201172, "global_step": 34064, "epoch": 410} {"train_loss": -19.00421905517578, "global_step": 34065, "epoch": 410} {"train_loss": -19.49368667602539, "global_step": 34066, "epoch": 410} {"train_loss": -19.21537208557129, "global_step": 34067, "epoch": 410} {"train_loss": -19.661298751831055, "global_step": 34068, "epoch": 410} {"train_loss": -19.332433700561523, "global_step": 34069, "epoch": 410} {"train_loss": -19.14574432373047, "global_step": 34070, "epoch": 410} {"train_loss": -19.022689819335938, "global_step": 34071, "epoch": 410} {"train_loss": -18.84417152404785, "global_step": 34072, "epoch": 410} {"train_loss": -19.341678619384766, "global_step": 34073, "epoch": 410} {"train_loss": -19.45099449157715, "global_step": 34074, "epoch": 410} {"train_loss": -19.242467880249023, "global_step": 34075, "epoch": 410} {"train_loss": -19.198883056640625, "global_step": 34076, "epoch": 410} {"train_loss": -19.331045150756836, "global_step": 34077, "epoch": 410} {"train_loss": -18.93984031677246, "global_step": 34078, "epoch": 410} {"train_loss": -18.7418155670166, "global_step": 34079, "epoch": 410} {"train_loss": -19.539255142211914, "global_step": 34080, "epoch": 410} {"train_loss": -19.590410232543945, "global_step": 34081, "epoch": 410} {"train_loss": -19.057193756103516, "global_step": 34082, "epoch": 410} {"train_loss": -19.36211585998535, "global_step": 34083, "epoch": 410} {"train_loss": -19.160879135131836, "global_step": 34084, "epoch": 410} {"train_loss": -19.181339263916016, "global_step": 34085, "epoch": 410} {"train_loss": -19.338851928710938, "global_step": 34086, "epoch": 410} {"train_loss": -19.33979034423828, "global_step": 34087, "epoch": 410} {"train_loss": -19.28447723388672, "global_step": 34088, "epoch": 410} {"train_loss": -19.281736373901367, "global_step": 34089, "epoch": 410} {"train_loss": -19.100324630737305, "global_step": 34090, "epoch": 410} {"train_loss": -18.788480758666992, "global_step": 34091, "epoch": 410} {"train_loss": -19.08609390258789, "global_step": 34092, "epoch": 410} {"train_loss": -18.988285064697266, "global_step": 34093, "epoch": 410} {"train_loss": -19.267332077026367, "global_step": 34094, "epoch": 410} {"train_loss": -19.176218032836914, "global_step": 34095, "epoch": 410} {"train_loss": -19.027891159057617, "global_step": 34096, "epoch": 410} {"train_loss": -18.94533348083496, "global_step": 34097, "epoch": 410} {"train_loss": -18.98184585571289, "global_step": 34098, "epoch": 410} {"train_loss": -18.958805084228516, "global_step": 34099, "epoch": 410} {"train_loss": -19.077367782592773, "global_step": 34100, "epoch": 410} {"train_loss": -19.45711326599121, "global_step": 34101, "epoch": 410} {"train_loss": -19.17253303527832, "global_step": 34102, "epoch": 410} {"train_loss": -19.286800384521484, "global_step": 34103, "epoch": 410} {"train_loss": -18.926555633544922, "global_step": 34104, "epoch": 410} {"train_loss": -19.492921829223633, "global_step": 34105, "epoch": 410} {"train_loss": -19.194974899291992, "global_step": 34106, "epoch": 410} {"train_loss": -18.911508560180664, "global_step": 34107, "epoch": 410} {"train_loss": -18.903837203979492, "global_step": 34108, "epoch": 410} {"train_loss": -19.325458526611328, "global_step": 34109, "epoch": 410} {"train_loss": -19.07149314880371, "global_step": 34110, "epoch": 410} {"train_loss": -19.4406795501709, "global_step": 34111, "epoch": 410} {"train_loss": -19.152261825929205, "global_step": 34112, "epoch": 410, "val_loss": 5942917.5} {"train_loss": -19.2607479095459, "global_step": 34113, "epoch": 411} {"train_loss": -18.669677734375, "global_step": 34114, "epoch": 411} {"train_loss": -18.9005069732666, "global_step": 34115, "epoch": 411} {"train_loss": -19.12413215637207, "global_step": 34116, "epoch": 411} {"train_loss": -19.30653953552246, "global_step": 34117, "epoch": 411} {"train_loss": -19.26424217224121, "global_step": 34118, "epoch": 411} {"train_loss": -18.917081832885742, "global_step": 34119, "epoch": 411} {"train_loss": -19.071277618408203, "global_step": 34120, "epoch": 411} {"train_loss": -19.39900779724121, "global_step": 34121, "epoch": 411} {"train_loss": -19.042560577392578, "global_step": 34122, "epoch": 411} {"train_loss": -18.929962158203125, "global_step": 34123, "epoch": 411} {"train_loss": -18.982431411743164, "global_step": 34124, "epoch": 411} {"train_loss": -19.064680099487305, "global_step": 34125, "epoch": 411} {"train_loss": -19.006267547607422, "global_step": 34126, "epoch": 411} {"train_loss": -19.106040954589844, "global_step": 34127, "epoch": 411} {"train_loss": -18.93807029724121, "global_step": 34128, "epoch": 411} {"train_loss": -19.229345321655273, "global_step": 34129, "epoch": 411} {"train_loss": -19.486473083496094, "global_step": 34130, "epoch": 411} {"train_loss": -19.06305503845215, "global_step": 34131, "epoch": 411} {"train_loss": -18.82852554321289, "global_step": 34132, "epoch": 411} {"train_loss": -18.85273551940918, "global_step": 34133, "epoch": 411} {"train_loss": -19.03778076171875, "global_step": 34134, "epoch": 411} {"train_loss": -19.383466720581055, "global_step": 34135, "epoch": 411} {"train_loss": -19.564619064331055, "global_step": 34136, "epoch": 411} {"train_loss": -18.895538330078125, "global_step": 34137, "epoch": 411} {"train_loss": -18.827960968017578, "global_step": 34138, "epoch": 411} {"train_loss": -19.299392700195312, "global_step": 34139, "epoch": 411} {"train_loss": -19.35438346862793, "global_step": 34140, "epoch": 411} {"train_loss": -19.458982467651367, "global_step": 34141, "epoch": 411} {"train_loss": -19.220001220703125, "global_step": 34142, "epoch": 411} {"train_loss": -19.06446075439453, "global_step": 34143, "epoch": 411} {"train_loss": -19.380727767944336, "global_step": 34144, "epoch": 411} {"train_loss": -18.793453216552734, "global_step": 34145, "epoch": 411} {"train_loss": -19.127073287963867, "global_step": 34146, "epoch": 411} {"train_loss": -19.239397048950195, "global_step": 34147, "epoch": 411} {"train_loss": -19.298892974853516, "global_step": 34148, "epoch": 411} {"train_loss": -19.79330825805664, "global_step": 34149, "epoch": 411} {"train_loss": -19.063323974609375, "global_step": 34150, "epoch": 411} {"train_loss": -18.97359275817871, "global_step": 34151, "epoch": 411} {"train_loss": -19.457731246948242, "global_step": 34152, "epoch": 411} {"train_loss": -19.06817626953125, "global_step": 34153, "epoch": 411} {"train_loss": -19.41936683654785, "global_step": 34154, "epoch": 411} {"train_loss": -19.031850814819336, "global_step": 34155, "epoch": 411} {"train_loss": -19.14322280883789, "global_step": 34156, "epoch": 411} {"train_loss": -19.585697174072266, "global_step": 34157, "epoch": 411} {"train_loss": -19.087207794189453, "global_step": 34158, "epoch": 411} {"train_loss": -19.147916793823242, "global_step": 34159, "epoch": 411} {"train_loss": -18.927030563354492, "global_step": 34160, "epoch": 411} {"train_loss": -19.075542449951172, "global_step": 34161, "epoch": 411} {"train_loss": -19.111122131347656, "global_step": 34162, "epoch": 411} {"train_loss": -19.161117553710938, "global_step": 34163, "epoch": 411} {"train_loss": -19.003677368164062, "global_step": 34164, "epoch": 411} {"train_loss": -18.72113609313965, "global_step": 34165, "epoch": 411} {"train_loss": -19.139564514160156, "global_step": 34166, "epoch": 411} {"train_loss": -19.62986183166504, "global_step": 34167, "epoch": 411} {"train_loss": -19.2205753326416, "global_step": 34168, "epoch": 411} {"train_loss": -19.37820816040039, "global_step": 34169, "epoch": 411} {"train_loss": -19.46473503112793, "global_step": 34170, "epoch": 411} {"train_loss": -19.082996368408203, "global_step": 34171, "epoch": 411} {"train_loss": -18.857240676879883, "global_step": 34172, "epoch": 411} {"train_loss": -19.399702072143555, "global_step": 34173, "epoch": 411} {"train_loss": -19.463897705078125, "global_step": 34174, "epoch": 411} {"train_loss": -19.376359939575195, "global_step": 34175, "epoch": 411} {"train_loss": -18.918127059936523, "global_step": 34176, "epoch": 411} {"train_loss": -19.080116271972656, "global_step": 34177, "epoch": 411} {"train_loss": -18.70210075378418, "global_step": 34178, "epoch": 411} {"train_loss": -19.220518112182617, "global_step": 34179, "epoch": 411} {"train_loss": -19.34026336669922, "global_step": 34180, "epoch": 411} {"train_loss": -19.695066452026367, "global_step": 34181, "epoch": 411} {"train_loss": -19.314062118530273, "global_step": 34182, "epoch": 411} {"train_loss": -19.425424575805664, "global_step": 34183, "epoch": 411} {"train_loss": -19.05352783203125, "global_step": 34184, "epoch": 411} {"train_loss": -19.08793830871582, "global_step": 34185, "epoch": 411} {"train_loss": -19.090147018432617, "global_step": 34186, "epoch": 411} {"train_loss": -19.38302993774414, "global_step": 34187, "epoch": 411} {"train_loss": -18.977842330932617, "global_step": 34188, "epoch": 411} {"train_loss": -19.439023971557617, "global_step": 34189, "epoch": 411} {"train_loss": -19.170331954956055, "global_step": 34190, "epoch": 411} {"train_loss": -18.98874855041504, "global_step": 34191, "epoch": 411} {"train_loss": -19.29524040222168, "global_step": 34192, "epoch": 411} {"train_loss": -19.163257598876953, "global_step": 34193, "epoch": 411} {"train_loss": -18.881685256958008, "global_step": 34194, "epoch": 411} {"train_loss": -19.15818088025932, "global_step": 34195, "epoch": 411, "val_loss": 5954270.5} {"train_loss": -18.59716796875, "global_step": 34196, "epoch": 412} {"train_loss": -19.02293586730957, "global_step": 34197, "epoch": 412} {"train_loss": -18.690954208374023, "global_step": 34198, "epoch": 412} {"train_loss": -19.037839889526367, "global_step": 34199, "epoch": 412} {"train_loss": -18.91340446472168, "global_step": 34200, "epoch": 412} {"train_loss": -18.596418380737305, "global_step": 34201, "epoch": 412} {"train_loss": -19.27992820739746, "global_step": 34202, "epoch": 412} {"train_loss": -18.99533462524414, "global_step": 34203, "epoch": 412} {"train_loss": -19.483423233032227, "global_step": 34204, "epoch": 412} {"train_loss": -19.068105697631836, "global_step": 34205, "epoch": 412} {"train_loss": -19.123998641967773, "global_step": 34206, "epoch": 412} {"train_loss": -19.495473861694336, "global_step": 34207, "epoch": 412} {"train_loss": -19.116641998291016, "global_step": 34208, "epoch": 412} {"train_loss": -19.336050033569336, "global_step": 34209, "epoch": 412} {"train_loss": -19.15460205078125, "global_step": 34210, "epoch": 412} {"train_loss": -19.46480369567871, "global_step": 34211, "epoch": 412} {"train_loss": -19.000898361206055, "global_step": 34212, "epoch": 412} {"train_loss": -18.685165405273438, "global_step": 34213, "epoch": 412} {"train_loss": -19.42721939086914, "global_step": 34214, "epoch": 412} {"train_loss": -19.0485897064209, "global_step": 34215, "epoch": 412} {"train_loss": -19.128372192382812, "global_step": 34216, "epoch": 412} {"train_loss": -19.24007225036621, "global_step": 34217, "epoch": 412} {"train_loss": -19.118200302124023, "global_step": 34218, "epoch": 412} {"train_loss": -19.652807235717773, "global_step": 34219, "epoch": 412} {"train_loss": -19.38104820251465, "global_step": 34220, "epoch": 412} {"train_loss": -19.085416793823242, "global_step": 34221, "epoch": 412} {"train_loss": -19.149627685546875, "global_step": 34222, "epoch": 412} {"train_loss": -18.98402976989746, "global_step": 34223, "epoch": 412} {"train_loss": -19.27503776550293, "global_step": 34224, "epoch": 412} {"train_loss": -18.9792537689209, "global_step": 34225, "epoch": 412} {"train_loss": -19.313512802124023, "global_step": 34226, "epoch": 412} {"train_loss": -19.225086212158203, "global_step": 34227, "epoch": 412} {"train_loss": -18.960561752319336, "global_step": 34228, "epoch": 412} {"train_loss": -19.1643123626709, "global_step": 34229, "epoch": 412} {"train_loss": -19.24213218688965, "global_step": 34230, "epoch": 412} {"train_loss": -19.166784286499023, "global_step": 34231, "epoch": 412} {"train_loss": -19.288175582885742, "global_step": 34232, "epoch": 412} {"train_loss": -18.73677635192871, "global_step": 34233, "epoch": 412} {"train_loss": -19.377229690551758, "global_step": 34234, "epoch": 412} {"train_loss": -19.109708786010742, "global_step": 34235, "epoch": 412} {"train_loss": -19.422727584838867, "global_step": 34236, "epoch": 412} {"train_loss": -18.62051010131836, "global_step": 34237, "epoch": 412} {"train_loss": -18.932546615600586, "global_step": 34238, "epoch": 412} {"train_loss": -19.43452262878418, "global_step": 34239, "epoch": 412} {"train_loss": -19.177165985107422, "global_step": 34240, "epoch": 412} {"train_loss": -19.516376495361328, "global_step": 34241, "epoch": 412} {"train_loss": -19.359167098999023, "global_step": 34242, "epoch": 412} {"train_loss": -19.43475341796875, "global_step": 34243, "epoch": 412} {"train_loss": -19.26743507385254, "global_step": 34244, "epoch": 412} {"train_loss": -18.987924575805664, "global_step": 34245, "epoch": 412} {"train_loss": -19.493629455566406, "global_step": 34246, "epoch": 412} {"train_loss": -19.007627487182617, "global_step": 34247, "epoch": 412} {"train_loss": -18.701997756958008, "global_step": 34248, "epoch": 412} {"train_loss": -19.841039657592773, "global_step": 34249, "epoch": 412} {"train_loss": -19.269460678100586, "global_step": 34250, "epoch": 412} {"train_loss": -19.092660903930664, "global_step": 34251, "epoch": 412} {"train_loss": -19.556747436523438, "global_step": 34252, "epoch": 412} {"train_loss": -19.099620819091797, "global_step": 34253, "epoch": 412} {"train_loss": -18.998443603515625, "global_step": 34254, "epoch": 412} {"train_loss": -19.447803497314453, "global_step": 34255, "epoch": 412} {"train_loss": -19.021228790283203, "global_step": 34256, "epoch": 412} {"train_loss": -19.204740524291992, "global_step": 34257, "epoch": 412} {"train_loss": -19.285839080810547, "global_step": 34258, "epoch": 412} {"train_loss": -18.88936424255371, "global_step": 34259, "epoch": 412} {"train_loss": -19.23160171508789, "global_step": 34260, "epoch": 412} {"train_loss": -18.855955123901367, "global_step": 34261, "epoch": 412} {"train_loss": -19.141605377197266, "global_step": 34262, "epoch": 412} {"train_loss": -18.847854614257812, "global_step": 34263, "epoch": 412} {"train_loss": -19.394006729125977, "global_step": 34264, "epoch": 412} {"train_loss": -19.13473892211914, "global_step": 34265, "epoch": 412} {"train_loss": -19.07071304321289, "global_step": 34266, "epoch": 412} {"train_loss": -18.85508155822754, "global_step": 34267, "epoch": 412} {"train_loss": -18.772186279296875, "global_step": 34268, "epoch": 412} {"train_loss": -19.060422897338867, "global_step": 34269, "epoch": 412} {"train_loss": -18.9932918548584, "global_step": 34270, "epoch": 412} {"train_loss": -19.183589935302734, "global_step": 34271, "epoch": 412} {"train_loss": -19.223134994506836, "global_step": 34272, "epoch": 412} {"train_loss": -19.114992141723633, "global_step": 34273, "epoch": 412} {"train_loss": -19.275007247924805, "global_step": 34274, "epoch": 412} {"train_loss": -18.93889808654785, "global_step": 34275, "epoch": 412} {"train_loss": -19.169322967529297, "global_step": 34276, "epoch": 412} {"train_loss": -19.30057716369629, "global_step": 34277, "epoch": 412} {"train_loss": -19.14863767968603, "global_step": 34278, "epoch": 412, "val_loss": 6084177.0} {"train_loss": -18.403066635131836, "global_step": 34279, "epoch": 413} {"train_loss": -19.08880615234375, "global_step": 34280, "epoch": 413} {"train_loss": -18.618154525756836, "global_step": 34281, "epoch": 413} {"train_loss": -18.7535457611084, "global_step": 34282, "epoch": 413} {"train_loss": -18.71235466003418, "global_step": 34283, "epoch": 413} {"train_loss": -18.82985496520996, "global_step": 34284, "epoch": 413} {"train_loss": -19.26572036743164, "global_step": 34285, "epoch": 413} {"train_loss": -19.144407272338867, "global_step": 34286, "epoch": 413} {"train_loss": -18.871246337890625, "global_step": 34287, "epoch": 413} {"train_loss": -19.474897384643555, "global_step": 34288, "epoch": 413} {"train_loss": -18.74335289001465, "global_step": 34289, "epoch": 413} {"train_loss": -18.977157592773438, "global_step": 34290, "epoch": 413} {"train_loss": -19.130924224853516, "global_step": 34291, "epoch": 413} {"train_loss": -18.982412338256836, "global_step": 34292, "epoch": 413} {"train_loss": -19.048612594604492, "global_step": 34293, "epoch": 413} {"train_loss": -18.88713836669922, "global_step": 34294, "epoch": 413} {"train_loss": -18.69174575805664, "global_step": 34295, "epoch": 413} {"train_loss": -19.039344787597656, "global_step": 34296, "epoch": 413} {"train_loss": -19.34938621520996, "global_step": 34297, "epoch": 413} {"train_loss": -18.945619583129883, "global_step": 34298, "epoch": 413} {"train_loss": -19.501455307006836, "global_step": 34299, "epoch": 413} {"train_loss": -18.928144454956055, "global_step": 34300, "epoch": 413} {"train_loss": -19.328067779541016, "global_step": 34301, "epoch": 413} {"train_loss": -19.08134651184082, "global_step": 34302, "epoch": 413} {"train_loss": -18.999282836914062, "global_step": 34303, "epoch": 413} {"train_loss": -19.33392906188965, "global_step": 34304, "epoch": 413} {"train_loss": -19.337554931640625, "global_step": 34305, "epoch": 413} {"train_loss": -18.928525924682617, "global_step": 34306, "epoch": 413} {"train_loss": -19.579191207885742, "global_step": 34307, "epoch": 413} {"train_loss": -19.145957946777344, "global_step": 34308, "epoch": 413} {"train_loss": -18.69207000732422, "global_step": 34309, "epoch": 413} {"train_loss": -19.028959274291992, "global_step": 34310, "epoch": 413} {"train_loss": -19.16742515563965, "global_step": 34311, "epoch": 413} {"train_loss": -19.181550979614258, "global_step": 34312, "epoch": 413} {"train_loss": -19.127971649169922, "global_step": 34313, "epoch": 413} {"train_loss": -19.35334014892578, "global_step": 34314, "epoch": 413} {"train_loss": -18.963647842407227, "global_step": 34315, "epoch": 413} {"train_loss": -18.960325241088867, "global_step": 34316, "epoch": 413} {"train_loss": -18.883756637573242, "global_step": 34317, "epoch": 413} {"train_loss": -19.746519088745117, "global_step": 34318, "epoch": 413} {"train_loss": -19.30042839050293, "global_step": 34319, "epoch": 413} {"train_loss": -19.304529190063477, "global_step": 34320, "epoch": 413} {"train_loss": -19.05224609375, "global_step": 34321, "epoch": 413} {"train_loss": -19.3194637298584, "global_step": 34322, "epoch": 413} {"train_loss": -19.136863708496094, "global_step": 34323, "epoch": 413} {"train_loss": -19.557621002197266, "global_step": 34324, "epoch": 413} {"train_loss": -18.9720401763916, "global_step": 34325, "epoch": 413} {"train_loss": -19.644567489624023, "global_step": 34326, "epoch": 413} {"train_loss": -18.951385498046875, "global_step": 34327, "epoch": 413} {"train_loss": -19.20844841003418, "global_step": 34328, "epoch": 413} {"train_loss": -18.986989974975586, "global_step": 34329, "epoch": 413} {"train_loss": -19.210674285888672, "global_step": 34330, "epoch": 413} {"train_loss": -19.367305755615234, "global_step": 34331, "epoch": 413} {"train_loss": -19.108449935913086, "global_step": 34332, "epoch": 413} {"train_loss": -19.288267135620117, "global_step": 34333, "epoch": 413} {"train_loss": -19.40399169921875, "global_step": 34334, "epoch": 413} {"train_loss": -19.062528610229492, "global_step": 34335, "epoch": 413} {"train_loss": -19.226165771484375, "global_step": 34336, "epoch": 413} {"train_loss": -19.48270034790039, "global_step": 34337, "epoch": 413} {"train_loss": -19.532445907592773, "global_step": 34338, "epoch": 413} {"train_loss": -19.046884536743164, "global_step": 34339, "epoch": 413} {"train_loss": -19.232404708862305, "global_step": 34340, "epoch": 413} {"train_loss": -19.067626953125, "global_step": 34341, "epoch": 413} {"train_loss": -19.00104331970215, "global_step": 34342, "epoch": 413} {"train_loss": -19.316442489624023, "global_step": 34343, "epoch": 413} {"train_loss": -18.819488525390625, "global_step": 34344, "epoch": 413} {"train_loss": -19.351783752441406, "global_step": 34345, "epoch": 413} {"train_loss": -19.05617332458496, "global_step": 34346, "epoch": 413} {"train_loss": -19.23722267150879, "global_step": 34347, "epoch": 413} {"train_loss": -18.82649040222168, "global_step": 34348, "epoch": 413} {"train_loss": -19.366241455078125, "global_step": 34349, "epoch": 413} {"train_loss": -18.826534271240234, "global_step": 34350, "epoch": 413} {"train_loss": -19.21016502380371, "global_step": 34351, "epoch": 413} {"train_loss": -19.430212020874023, "global_step": 34352, "epoch": 413} {"train_loss": -19.011320114135742, "global_step": 34353, "epoch": 413} {"train_loss": -19.09992218017578, "global_step": 34354, "epoch": 413} {"train_loss": -19.27895164489746, "global_step": 34355, "epoch": 413} {"train_loss": -19.391340255737305, "global_step": 34356, "epoch": 413} {"train_loss": -19.0146541595459, "global_step": 34357, "epoch": 413} {"train_loss": -18.763490676879883, "global_step": 34358, "epoch": 413} {"train_loss": -18.905986785888672, "global_step": 34359, "epoch": 413} {"train_loss": -18.975576400756836, "global_step": 34360, "epoch": 413} {"train_loss": -19.101271227181677, "global_step": 34361, "epoch": 413, "val_loss": 6072153.0} {"train_loss": -19.233808517456055, "global_step": 34362, "epoch": 414} {"train_loss": -19.081523895263672, "global_step": 34363, "epoch": 414} {"train_loss": -19.147724151611328, "global_step": 34364, "epoch": 414} {"train_loss": -19.101511001586914, "global_step": 34365, "epoch": 414} {"train_loss": -18.5834903717041, "global_step": 34366, "epoch": 414} {"train_loss": -19.082773208618164, "global_step": 34367, "epoch": 414} {"train_loss": -19.043949127197266, "global_step": 34368, "epoch": 414} {"train_loss": -18.824045181274414, "global_step": 34369, "epoch": 414} {"train_loss": -19.193069458007812, "global_step": 34370, "epoch": 414} {"train_loss": -19.075639724731445, "global_step": 34371, "epoch": 414} {"train_loss": -19.28122901916504, "global_step": 34372, "epoch": 414} {"train_loss": -19.02772331237793, "global_step": 34373, "epoch": 414} {"train_loss": -19.217039108276367, "global_step": 34374, "epoch": 414} {"train_loss": -19.08993148803711, "global_step": 34375, "epoch": 414} {"train_loss": -19.09859275817871, "global_step": 34376, "epoch": 414} {"train_loss": -19.247190475463867, "global_step": 34377, "epoch": 414} {"train_loss": -19.241647720336914, "global_step": 34378, "epoch": 414} {"train_loss": -18.994821548461914, "global_step": 34379, "epoch": 414} {"train_loss": -18.894365310668945, "global_step": 34380, "epoch": 414} {"train_loss": -19.042160034179688, "global_step": 34381, "epoch": 414} {"train_loss": -19.09173011779785, "global_step": 34382, "epoch": 414} {"train_loss": -19.3821964263916, "global_step": 34383, "epoch": 414} {"train_loss": -19.11625099182129, "global_step": 34384, "epoch": 414} {"train_loss": -19.27327537536621, "global_step": 34385, "epoch": 414} {"train_loss": -18.912353515625, "global_step": 34386, "epoch": 414} {"train_loss": -19.144588470458984, "global_step": 34387, "epoch": 414} {"train_loss": -19.37152671813965, "global_step": 34388, "epoch": 414} {"train_loss": -19.38136863708496, "global_step": 34389, "epoch": 414} {"train_loss": -18.74286651611328, "global_step": 34390, "epoch": 414} {"train_loss": -18.86591148376465, "global_step": 34391, "epoch": 414} {"train_loss": -19.26068115234375, "global_step": 34392, "epoch": 414} {"train_loss": -19.10479736328125, "global_step": 34393, "epoch": 414} {"train_loss": -19.560327529907227, "global_step": 34394, "epoch": 414} {"train_loss": -19.558246612548828, "global_step": 34395, "epoch": 414} {"train_loss": -19.3226375579834, "global_step": 34396, "epoch": 414} {"train_loss": -19.195068359375, "global_step": 34397, "epoch": 414} {"train_loss": -19.234289169311523, "global_step": 34398, "epoch": 414} {"train_loss": -19.0689754486084, "global_step": 34399, "epoch": 414} {"train_loss": -19.058629989624023, "global_step": 34400, "epoch": 414} {"train_loss": -19.093679428100586, "global_step": 34401, "epoch": 414} {"train_loss": -19.053075790405273, "global_step": 34402, "epoch": 414} {"train_loss": -19.123416900634766, "global_step": 34403, "epoch": 414} {"train_loss": -19.120840072631836, "global_step": 34404, "epoch": 414} {"train_loss": -19.2724666595459, "global_step": 34405, "epoch": 414} {"train_loss": -19.216882705688477, "global_step": 34406, "epoch": 414} {"train_loss": -19.32805061340332, "global_step": 34407, "epoch": 414} {"train_loss": -19.47418212890625, "global_step": 34408, "epoch": 414} {"train_loss": -19.151769638061523, "global_step": 34409, "epoch": 414} {"train_loss": -19.10187339782715, "global_step": 34410, "epoch": 414} {"train_loss": -19.08307456970215, "global_step": 34411, "epoch": 414} {"train_loss": -18.710453033447266, "global_step": 34412, "epoch": 414} {"train_loss": -19.0911922454834, "global_step": 34413, "epoch": 414} {"train_loss": -18.773040771484375, "global_step": 34414, "epoch": 414} {"train_loss": -18.982486724853516, "global_step": 34415, "epoch": 414} {"train_loss": -19.26873779296875, "global_step": 34416, "epoch": 414} {"train_loss": -19.070119857788086, "global_step": 34417, "epoch": 414} {"train_loss": -19.066268920898438, "global_step": 34418, "epoch": 414} {"train_loss": -19.409212112426758, "global_step": 34419, "epoch": 414} {"train_loss": -19.01218032836914, "global_step": 34420, "epoch": 414} {"train_loss": -19.337255477905273, "global_step": 34421, "epoch": 414} {"train_loss": -19.087852478027344, "global_step": 34422, "epoch": 414} {"train_loss": -19.242664337158203, "global_step": 34423, "epoch": 414} {"train_loss": -19.47842788696289, "global_step": 34424, "epoch": 414} {"train_loss": -18.879148483276367, "global_step": 34425, "epoch": 414} {"train_loss": -18.984031677246094, "global_step": 34426, "epoch": 414} {"train_loss": -18.790966033935547, "global_step": 34427, "epoch": 414} {"train_loss": -19.010398864746094, "global_step": 34428, "epoch": 414} {"train_loss": -18.95307731628418, "global_step": 34429, "epoch": 414} {"train_loss": -18.98589515686035, "global_step": 34430, "epoch": 414} {"train_loss": -19.379230499267578, "global_step": 34431, "epoch": 414} {"train_loss": -18.965559005737305, "global_step": 34432, "epoch": 414} {"train_loss": -19.27703857421875, "global_step": 34433, "epoch": 414} {"train_loss": -19.137229919433594, "global_step": 34434, "epoch": 414} {"train_loss": -19.096759796142578, "global_step": 34435, "epoch": 414} {"train_loss": -19.52016258239746, "global_step": 34436, "epoch": 414} {"train_loss": -19.1680965423584, "global_step": 34437, "epoch": 414} {"train_loss": -19.352798461914062, "global_step": 34438, "epoch": 414} {"train_loss": -19.09185791015625, "global_step": 34439, "epoch": 414} {"train_loss": -19.15496826171875, "global_step": 34440, "epoch": 414} {"train_loss": -18.92927360534668, "global_step": 34441, "epoch": 414} {"train_loss": -19.238195419311523, "global_step": 34442, "epoch": 414} {"train_loss": -18.96318817138672, "global_step": 34443, "epoch": 414} {"train_loss": -19.15043915897967, "global_step": 34444, "epoch": 414, "val_loss": 6011881.0} {"train_loss": -18.397077560424805, "global_step": 34445, "epoch": 415} {"train_loss": -18.660266876220703, "global_step": 34446, "epoch": 415} {"train_loss": -18.721982955932617, "global_step": 34447, "epoch": 415} {"train_loss": -18.76851463317871, "global_step": 34448, "epoch": 415} {"train_loss": -19.259510040283203, "global_step": 34449, "epoch": 415} {"train_loss": -18.872711181640625, "global_step": 34450, "epoch": 415} {"train_loss": -19.187009811401367, "global_step": 34451, "epoch": 415} {"train_loss": -18.95375633239746, "global_step": 34452, "epoch": 415} {"train_loss": -18.93317985534668, "global_step": 34453, "epoch": 415} {"train_loss": -19.094173431396484, "global_step": 34454, "epoch": 415} {"train_loss": -19.082740783691406, "global_step": 34455, "epoch": 415} {"train_loss": -18.991037368774414, "global_step": 34456, "epoch": 415} {"train_loss": -19.074323654174805, "global_step": 34457, "epoch": 415} {"train_loss": -18.825288772583008, "global_step": 34458, "epoch": 415} {"train_loss": -19.329776763916016, "global_step": 34459, "epoch": 415} {"train_loss": -19.137868881225586, "global_step": 34460, "epoch": 415} {"train_loss": -19.61985969543457, "global_step": 34461, "epoch": 415} {"train_loss": -18.79851722717285, "global_step": 34462, "epoch": 415} {"train_loss": -19.072507858276367, "global_step": 34463, "epoch": 415} {"train_loss": -19.17787742614746, "global_step": 34464, "epoch": 415} {"train_loss": -18.958383560180664, "global_step": 34465, "epoch": 415} {"train_loss": -19.201568603515625, "global_step": 34466, "epoch": 415} {"train_loss": -19.214879989624023, "global_step": 34467, "epoch": 415} {"train_loss": -19.12018394470215, "global_step": 34468, "epoch": 415} {"train_loss": -19.392227172851562, "global_step": 34469, "epoch": 415} {"train_loss": -18.921525955200195, "global_step": 34470, "epoch": 415} {"train_loss": -19.25807762145996, "global_step": 34471, "epoch": 415} {"train_loss": -19.63930320739746, "global_step": 34472, "epoch": 415} {"train_loss": -19.4077205657959, "global_step": 34473, "epoch": 415} {"train_loss": -19.159658432006836, "global_step": 34474, "epoch": 415} {"train_loss": -19.12437629699707, "global_step": 34475, "epoch": 415} {"train_loss": -19.205322265625, "global_step": 34476, "epoch": 415} {"train_loss": -18.962926864624023, "global_step": 34477, "epoch": 415} {"train_loss": -18.723020553588867, "global_step": 34478, "epoch": 415} {"train_loss": -19.269254684448242, "global_step": 34479, "epoch": 415} {"train_loss": -19.0407657623291, "global_step": 34480, "epoch": 415} {"train_loss": -18.904651641845703, "global_step": 34481, "epoch": 415} {"train_loss": -18.83010482788086, "global_step": 34482, "epoch": 415} {"train_loss": -19.069900512695312, "global_step": 34483, "epoch": 415} {"train_loss": -19.033924102783203, "global_step": 34484, "epoch": 415} {"train_loss": -19.686670303344727, "global_step": 34485, "epoch": 415} {"train_loss": -18.83707618713379, "global_step": 34486, "epoch": 415} {"train_loss": -19.27472686767578, "global_step": 34487, "epoch": 415} {"train_loss": -19.230619430541992, "global_step": 34488, "epoch": 415} {"train_loss": -19.383337020874023, "global_step": 34489, "epoch": 415} {"train_loss": -19.18721580505371, "global_step": 34490, "epoch": 415} {"train_loss": -19.36530876159668, "global_step": 34491, "epoch": 415} {"train_loss": -19.002004623413086, "global_step": 34492, "epoch": 415} {"train_loss": -19.065643310546875, "global_step": 34493, "epoch": 415} {"train_loss": -19.083667755126953, "global_step": 34494, "epoch": 415} {"train_loss": -19.364547729492188, "global_step": 34495, "epoch": 415} {"train_loss": -19.212072372436523, "global_step": 34496, "epoch": 415} {"train_loss": -19.493661880493164, "global_step": 34497, "epoch": 415} {"train_loss": -18.83710479736328, "global_step": 34498, "epoch": 415} {"train_loss": -19.197080612182617, "global_step": 34499, "epoch": 415} {"train_loss": -19.27229881286621, "global_step": 34500, "epoch": 415} {"train_loss": -19.222644805908203, "global_step": 34501, "epoch": 415} {"train_loss": -19.321115493774414, "global_step": 34502, "epoch": 415} {"train_loss": -19.270849227905273, "global_step": 34503, "epoch": 415} {"train_loss": -18.959571838378906, "global_step": 34504, "epoch": 415} {"train_loss": -19.4785099029541, "global_step": 34505, "epoch": 415} {"train_loss": -19.17912483215332, "global_step": 34506, "epoch": 415} {"train_loss": -19.259916305541992, "global_step": 34507, "epoch": 415} {"train_loss": -19.409849166870117, "global_step": 34508, "epoch": 415} {"train_loss": -19.20194435119629, "global_step": 34509, "epoch": 415} {"train_loss": -19.556720733642578, "global_step": 34510, "epoch": 415} {"train_loss": -19.24252700805664, "global_step": 34511, "epoch": 415} {"train_loss": -18.86447525024414, "global_step": 34512, "epoch": 415} {"train_loss": -18.907129287719727, "global_step": 34513, "epoch": 415} {"train_loss": -19.22439956665039, "global_step": 34514, "epoch": 415} {"train_loss": -19.144296646118164, "global_step": 34515, "epoch": 415} {"train_loss": -19.404211044311523, "global_step": 34516, "epoch": 415} {"train_loss": -19.601490020751953, "global_step": 34517, "epoch": 415} {"train_loss": -18.906965255737305, "global_step": 34518, "epoch": 415} {"train_loss": -19.2292423248291, "global_step": 34519, "epoch": 415} {"train_loss": -19.164030075073242, "global_step": 34520, "epoch": 415} {"train_loss": -19.486356735229492, "global_step": 34521, "epoch": 415} {"train_loss": -19.38818359375, "global_step": 34522, "epoch": 415} {"train_loss": -19.382455825805664, "global_step": 34523, "epoch": 415} {"train_loss": -19.423419952392578, "global_step": 34524, "epoch": 415} {"train_loss": -19.03572654724121, "global_step": 34525, "epoch": 415} {"train_loss": -19.23278045654297, "global_step": 34526, "epoch": 415} {"train_loss": -19.162864248436616, "global_step": 34527, "epoch": 415, "val_loss": 6117826.0} {"train_loss": -19.006362915039062, "global_step": 34528, "epoch": 416} {"train_loss": -19.05008888244629, "global_step": 34529, "epoch": 416} {"train_loss": -19.0488338470459, "global_step": 34530, "epoch": 416} {"train_loss": -19.3552303314209, "global_step": 34531, "epoch": 416} {"train_loss": -18.69927406311035, "global_step": 34532, "epoch": 416} {"train_loss": -19.272104263305664, "global_step": 34533, "epoch": 416} {"train_loss": -18.923429489135742, "global_step": 34534, "epoch": 416} {"train_loss": -19.155628204345703, "global_step": 34535, "epoch": 416} {"train_loss": -19.191076278686523, "global_step": 34536, "epoch": 416} {"train_loss": -19.056964874267578, "global_step": 34537, "epoch": 416} {"train_loss": -18.93363380432129, "global_step": 34538, "epoch": 416} {"train_loss": -19.13966941833496, "global_step": 34539, "epoch": 416} {"train_loss": -18.70408058166504, "global_step": 34540, "epoch": 416} {"train_loss": -18.97982406616211, "global_step": 34541, "epoch": 416} {"train_loss": -19.29671287536621, "global_step": 34542, "epoch": 416} {"train_loss": -19.037670135498047, "global_step": 34543, "epoch": 416} {"train_loss": -18.933979034423828, "global_step": 34544, "epoch": 416} {"train_loss": -19.119518280029297, "global_step": 34545, "epoch": 416} {"train_loss": -18.896665573120117, "global_step": 34546, "epoch": 416} {"train_loss": -18.994060516357422, "global_step": 34547, "epoch": 416} {"train_loss": -19.08941078186035, "global_step": 34548, "epoch": 416} {"train_loss": -19.059324264526367, "global_step": 34549, "epoch": 416} {"train_loss": -19.132097244262695, "global_step": 34550, "epoch": 416} {"train_loss": -19.166301727294922, "global_step": 34551, "epoch": 416} {"train_loss": -19.08612632751465, "global_step": 34552, "epoch": 416} {"train_loss": -19.38458251953125, "global_step": 34553, "epoch": 416} {"train_loss": -18.963232040405273, "global_step": 34554, "epoch": 416} {"train_loss": -18.84387969970703, "global_step": 34555, "epoch": 416} {"train_loss": -19.280933380126953, "global_step": 34556, "epoch": 416} {"train_loss": -19.379655838012695, "global_step": 34557, "epoch": 416} {"train_loss": -19.211719512939453, "global_step": 34558, "epoch": 416} {"train_loss": -19.57803726196289, "global_step": 34559, "epoch": 416} {"train_loss": -19.216588973999023, "global_step": 34560, "epoch": 416} {"train_loss": -18.913908004760742, "global_step": 34561, "epoch": 416} {"train_loss": -19.102933883666992, "global_step": 34562, "epoch": 416} {"train_loss": -19.54569435119629, "global_step": 34563, "epoch": 416} {"train_loss": -18.892499923706055, "global_step": 34564, "epoch": 416} {"train_loss": -19.224365234375, "global_step": 34565, "epoch": 416} {"train_loss": -19.22488021850586, "global_step": 34566, "epoch": 416} {"train_loss": -18.7805233001709, "global_step": 34567, "epoch": 416} {"train_loss": -19.32168197631836, "global_step": 34568, "epoch": 416} {"train_loss": -18.774097442626953, "global_step": 34569, "epoch": 416} {"train_loss": -18.97537612915039, "global_step": 34570, "epoch": 416} {"train_loss": -19.243070602416992, "global_step": 34571, "epoch": 416} {"train_loss": -19.303895950317383, "global_step": 34572, "epoch": 416} {"train_loss": -18.99898338317871, "global_step": 34573, "epoch": 416} {"train_loss": -19.16999626159668, "global_step": 34574, "epoch": 416} {"train_loss": -19.301578521728516, "global_step": 34575, "epoch": 416} {"train_loss": -19.097301483154297, "global_step": 34576, "epoch": 416} {"train_loss": -19.50264549255371, "global_step": 34577, "epoch": 416} {"train_loss": -19.322500228881836, "global_step": 34578, "epoch": 416} {"train_loss": -19.461685180664062, "global_step": 34579, "epoch": 416} {"train_loss": -19.33228874206543, "global_step": 34580, "epoch": 416} {"train_loss": -19.377588272094727, "global_step": 34581, "epoch": 416} {"train_loss": -19.003448486328125, "global_step": 34582, "epoch": 416} {"train_loss": -19.213359832763672, "global_step": 34583, "epoch": 416} {"train_loss": -18.91242790222168, "global_step": 34584, "epoch": 416} {"train_loss": -19.448116302490234, "global_step": 34585, "epoch": 416} {"train_loss": -19.414825439453125, "global_step": 34586, "epoch": 416} {"train_loss": -19.17082405090332, "global_step": 34587, "epoch": 416} {"train_loss": -19.518739700317383, "global_step": 34588, "epoch": 416} {"train_loss": -19.282285690307617, "global_step": 34589, "epoch": 416} {"train_loss": -19.352949142456055, "global_step": 34590, "epoch": 416} {"train_loss": -18.967350006103516, "global_step": 34591, "epoch": 416} {"train_loss": -19.28470802307129, "global_step": 34592, "epoch": 416} {"train_loss": -19.028079986572266, "global_step": 34593, "epoch": 416} {"train_loss": -19.338056564331055, "global_step": 34594, "epoch": 416} {"train_loss": -19.268890380859375, "global_step": 34595, "epoch": 416} {"train_loss": -19.187177658081055, "global_step": 34596, "epoch": 416} {"train_loss": -18.833581924438477, "global_step": 34597, "epoch": 416} {"train_loss": -19.10695457458496, "global_step": 34598, "epoch": 416} {"train_loss": -19.142812728881836, "global_step": 34599, "epoch": 416} {"train_loss": -19.336688995361328, "global_step": 34600, "epoch": 416} {"train_loss": -19.308115005493164, "global_step": 34601, "epoch": 416} {"train_loss": -19.4254093170166, "global_step": 34602, "epoch": 416} {"train_loss": -18.963956832885742, "global_step": 34603, "epoch": 416} {"train_loss": -19.139001846313477, "global_step": 34604, "epoch": 416} {"train_loss": -18.982898712158203, "global_step": 34605, "epoch": 416} {"train_loss": -19.232614517211914, "global_step": 34606, "epoch": 416} {"train_loss": -18.850683212280273, "global_step": 34607, "epoch": 416} {"train_loss": -19.33810806274414, "global_step": 34608, "epoch": 416} {"train_loss": -19.38187026977539, "global_step": 34609, "epoch": 416} {"train_loss": -19.166059907660426, "global_step": 34610, "epoch": 416, "val_loss": 5986190.5} {"train_loss": -19.015113830566406, "global_step": 34611, "epoch": 417} {"train_loss": -19.201934814453125, "global_step": 34612, "epoch": 417} {"train_loss": -18.87448501586914, "global_step": 34613, "epoch": 417} {"train_loss": -18.94471549987793, "global_step": 34614, "epoch": 417} {"train_loss": -18.807880401611328, "global_step": 34615, "epoch": 417} {"train_loss": -19.236265182495117, "global_step": 34616, "epoch": 417} {"train_loss": -19.010780334472656, "global_step": 34617, "epoch": 417} {"train_loss": -18.995710372924805, "global_step": 34618, "epoch": 417} {"train_loss": -19.244613647460938, "global_step": 34619, "epoch": 417} {"train_loss": -18.8957576751709, "global_step": 34620, "epoch": 417} {"train_loss": -18.92197608947754, "global_step": 34621, "epoch": 417} {"train_loss": -19.410873413085938, "global_step": 34622, "epoch": 417} {"train_loss": -19.20685386657715, "global_step": 34623, "epoch": 417} {"train_loss": -19.37306022644043, "global_step": 34624, "epoch": 417} {"train_loss": -19.216421127319336, "global_step": 34625, "epoch": 417} {"train_loss": -19.203842163085938, "global_step": 34626, "epoch": 417} {"train_loss": -19.27491569519043, "global_step": 34627, "epoch": 417} {"train_loss": -19.289005279541016, "global_step": 34628, "epoch": 417} {"train_loss": -19.4110107421875, "global_step": 34629, "epoch": 417} {"train_loss": -19.094877243041992, "global_step": 34630, "epoch": 417} {"train_loss": -18.931310653686523, "global_step": 34631, "epoch": 417} {"train_loss": -18.89997100830078, "global_step": 34632, "epoch": 417} {"train_loss": -19.11020278930664, "global_step": 34633, "epoch": 417} {"train_loss": -18.884798049926758, "global_step": 34634, "epoch": 417} {"train_loss": -19.20149803161621, "global_step": 34635, "epoch": 417} {"train_loss": -19.100385665893555, "global_step": 34636, "epoch": 417} {"train_loss": -19.214431762695312, "global_step": 34637, "epoch": 417} {"train_loss": -18.97993278503418, "global_step": 34638, "epoch": 417} {"train_loss": -19.304542541503906, "global_step": 34639, "epoch": 417} {"train_loss": -19.047590255737305, "global_step": 34640, "epoch": 417} {"train_loss": -19.235795974731445, "global_step": 34641, "epoch": 417} {"train_loss": -19.418283462524414, "global_step": 34642, "epoch": 417} {"train_loss": -18.936384201049805, "global_step": 34643, "epoch": 417} {"train_loss": -19.4224796295166, "global_step": 34644, "epoch": 417} {"train_loss": -19.343902587890625, "global_step": 34645, "epoch": 417} {"train_loss": -19.27541160583496, "global_step": 34646, "epoch": 417} {"train_loss": -19.22760581970215, "global_step": 34647, "epoch": 417} {"train_loss": -19.141807556152344, "global_step": 34648, "epoch": 417} {"train_loss": -19.045164108276367, "global_step": 34649, "epoch": 417} {"train_loss": -19.129362106323242, "global_step": 34650, "epoch": 417} {"train_loss": -19.126117706298828, "global_step": 34651, "epoch": 417} {"train_loss": -19.179189682006836, "global_step": 34652, "epoch": 417} {"train_loss": -19.16438865661621, "global_step": 34653, "epoch": 417} {"train_loss": -19.433582305908203, "global_step": 34654, "epoch": 417} {"train_loss": -19.306814193725586, "global_step": 34655, "epoch": 417} {"train_loss": -19.170042037963867, "global_step": 34656, "epoch": 417} {"train_loss": -19.227807998657227, "global_step": 34657, "epoch": 417} {"train_loss": -19.431779861450195, "global_step": 34658, "epoch": 417} {"train_loss": -19.260740280151367, "global_step": 34659, "epoch": 417} {"train_loss": -19.711048126220703, "global_step": 34660, "epoch": 417} {"train_loss": -19.414701461791992, "global_step": 34661, "epoch": 417} {"train_loss": -18.80640983581543, "global_step": 34662, "epoch": 417} {"train_loss": -19.149703979492188, "global_step": 34663, "epoch": 417} {"train_loss": -18.985002517700195, "global_step": 34664, "epoch": 417} {"train_loss": -19.256427764892578, "global_step": 34665, "epoch": 417} {"train_loss": -19.130905151367188, "global_step": 34666, "epoch": 417} {"train_loss": -19.563547134399414, "global_step": 34667, "epoch": 417} {"train_loss": -18.979761123657227, "global_step": 34668, "epoch": 417} {"train_loss": -19.05597496032715, "global_step": 34669, "epoch": 417} {"train_loss": -19.238794326782227, "global_step": 34670, "epoch": 417} {"train_loss": -18.857641220092773, "global_step": 34671, "epoch": 417} {"train_loss": -19.160804748535156, "global_step": 34672, "epoch": 417} {"train_loss": -19.169971466064453, "global_step": 34673, "epoch": 417} {"train_loss": -19.41237449645996, "global_step": 34674, "epoch": 417} {"train_loss": -19.120317459106445, "global_step": 34675, "epoch": 417} {"train_loss": -19.15928840637207, "global_step": 34676, "epoch": 417} {"train_loss": -19.519989013671875, "global_step": 34677, "epoch": 417} {"train_loss": -19.12589454650879, "global_step": 34678, "epoch": 417} {"train_loss": -19.309309005737305, "global_step": 34679, "epoch": 417} {"train_loss": -19.2270565032959, "global_step": 34680, "epoch": 417} {"train_loss": -19.171350479125977, "global_step": 34681, "epoch": 417} {"train_loss": -19.05504608154297, "global_step": 34682, "epoch": 417} {"train_loss": -19.28425407409668, "global_step": 34683, "epoch": 417} {"train_loss": -19.21327781677246, "global_step": 34684, "epoch": 417} {"train_loss": -19.231216430664062, "global_step": 34685, "epoch": 417} {"train_loss": -19.301258087158203, "global_step": 34686, "epoch": 417} {"train_loss": -19.105854034423828, "global_step": 34687, "epoch": 417} {"train_loss": -18.733991622924805, "global_step": 34688, "epoch": 417} {"train_loss": -18.963897705078125, "global_step": 34689, "epoch": 417} {"train_loss": -19.554079055786133, "global_step": 34690, "epoch": 417} {"train_loss": -18.758148193359375, "global_step": 34691, "epoch": 417} {"train_loss": -19.111778259277344, "global_step": 34692, "epoch": 417} {"train_loss": -19.15645826868264, "global_step": 34693, "epoch": 417, "val_loss": 6018249.0} {"train_loss": -18.458703994750977, "global_step": 34694, "epoch": 418} {"train_loss": -19.286386489868164, "global_step": 34695, "epoch": 418} {"train_loss": -18.660751342773438, "global_step": 34696, "epoch": 418} {"train_loss": -18.768510818481445, "global_step": 34697, "epoch": 418} {"train_loss": -18.971513748168945, "global_step": 34698, "epoch": 418} {"train_loss": -18.908536911010742, "global_step": 34699, "epoch": 418} {"train_loss": -19.130863189697266, "global_step": 34700, "epoch": 418} {"train_loss": -18.821794509887695, "global_step": 34701, "epoch": 418} {"train_loss": -18.814441680908203, "global_step": 34702, "epoch": 418} {"train_loss": -19.1746768951416, "global_step": 34703, "epoch": 418} {"train_loss": -18.915510177612305, "global_step": 34704, "epoch": 418} {"train_loss": -18.632078170776367, "global_step": 34705, "epoch": 418} {"train_loss": -18.916118621826172, "global_step": 34706, "epoch": 418} {"train_loss": -19.364364624023438, "global_step": 34707, "epoch": 418} {"train_loss": -19.067163467407227, "global_step": 34708, "epoch": 418} {"train_loss": -18.936519622802734, "global_step": 34709, "epoch": 418} {"train_loss": -19.072040557861328, "global_step": 34710, "epoch": 418} {"train_loss": -19.144493103027344, "global_step": 34711, "epoch": 418} {"train_loss": -19.10852813720703, "global_step": 34712, "epoch": 418} {"train_loss": -19.116687774658203, "global_step": 34713, "epoch": 418} {"train_loss": -18.906452178955078, "global_step": 34714, "epoch": 418} {"train_loss": -19.253721237182617, "global_step": 34715, "epoch": 418} {"train_loss": -19.089353561401367, "global_step": 34716, "epoch": 418} {"train_loss": -19.110687255859375, "global_step": 34717, "epoch": 418} {"train_loss": -19.170835494995117, "global_step": 34718, "epoch": 418} {"train_loss": -19.499082565307617, "global_step": 34719, "epoch": 418} {"train_loss": -18.948225021362305, "global_step": 34720, "epoch": 418} {"train_loss": -19.05647087097168, "global_step": 34721, "epoch": 418} {"train_loss": -19.157100677490234, "global_step": 34722, "epoch": 418} {"train_loss": -19.22003746032715, "global_step": 34723, "epoch": 418} {"train_loss": -19.359434127807617, "global_step": 34724, "epoch": 418} {"train_loss": -19.16974449157715, "global_step": 34725, "epoch": 418} {"train_loss": -19.339014053344727, "global_step": 34726, "epoch": 418} {"train_loss": -19.426517486572266, "global_step": 34727, "epoch": 418} {"train_loss": -18.874984741210938, "global_step": 34728, "epoch": 418} {"train_loss": -19.227733612060547, "global_step": 34729, "epoch": 418} {"train_loss": -19.141054153442383, "global_step": 34730, "epoch": 418} {"train_loss": -18.722753524780273, "global_step": 34731, "epoch": 418} {"train_loss": -19.539459228515625, "global_step": 34732, "epoch": 418} {"train_loss": -19.532520294189453, "global_step": 34733, "epoch": 418} {"train_loss": -19.320737838745117, "global_step": 34734, "epoch": 418} {"train_loss": -19.024465560913086, "global_step": 34735, "epoch": 418} {"train_loss": -19.310522079467773, "global_step": 34736, "epoch": 418} {"train_loss": -18.999164581298828, "global_step": 34737, "epoch": 418} {"train_loss": -19.002527236938477, "global_step": 34738, "epoch": 418} {"train_loss": -19.066831588745117, "global_step": 34739, "epoch": 418} {"train_loss": -19.276521682739258, "global_step": 34740, "epoch": 418} {"train_loss": -19.26838493347168, "global_step": 34741, "epoch": 418} {"train_loss": -19.322046279907227, "global_step": 34742, "epoch": 418} {"train_loss": -19.080198287963867, "global_step": 34743, "epoch": 418} {"train_loss": -18.786026000976562, "global_step": 34744, "epoch": 418} {"train_loss": -19.284006118774414, "global_step": 34745, "epoch": 418} {"train_loss": -19.372955322265625, "global_step": 34746, "epoch": 418} {"train_loss": -19.33513069152832, "global_step": 34747, "epoch": 418} {"train_loss": -18.864368438720703, "global_step": 34748, "epoch": 418} {"train_loss": -19.19365882873535, "global_step": 34749, "epoch": 418} {"train_loss": -18.876995086669922, "global_step": 34750, "epoch": 418} {"train_loss": -19.458494186401367, "global_step": 34751, "epoch": 418} {"train_loss": -19.092952728271484, "global_step": 34752, "epoch": 418} {"train_loss": -19.8779239654541, "global_step": 34753, "epoch": 418} {"train_loss": -18.929908752441406, "global_step": 34754, "epoch": 418} {"train_loss": -18.675886154174805, "global_step": 34755, "epoch": 418} {"train_loss": -19.42348289489746, "global_step": 34756, "epoch": 418} {"train_loss": -19.10079574584961, "global_step": 34757, "epoch": 418} {"train_loss": -19.376310348510742, "global_step": 34758, "epoch": 418} {"train_loss": -18.730588912963867, "global_step": 34759, "epoch": 418} {"train_loss": -18.882658004760742, "global_step": 34760, "epoch": 418} {"train_loss": -19.46803855895996, "global_step": 34761, "epoch": 418} {"train_loss": -19.167163848876953, "global_step": 34762, "epoch": 418} {"train_loss": -18.956674575805664, "global_step": 34763, "epoch": 418} {"train_loss": -19.18704605102539, "global_step": 34764, "epoch": 418} {"train_loss": -18.98014259338379, "global_step": 34765, "epoch": 418} {"train_loss": -19.04025650024414, "global_step": 34766, "epoch": 418} {"train_loss": -19.26854133605957, "global_step": 34767, "epoch": 418} {"train_loss": -19.54852867126465, "global_step": 34768, "epoch": 418} {"train_loss": -19.213520050048828, "global_step": 34769, "epoch": 418} {"train_loss": -19.406370162963867, "global_step": 34770, "epoch": 418} {"train_loss": -19.097335815429688, "global_step": 34771, "epoch": 418} {"train_loss": -19.335432052612305, "global_step": 34772, "epoch": 418} {"train_loss": -19.58672523498535, "global_step": 34773, "epoch": 418} {"train_loss": -19.432275772094727, "global_step": 34774, "epoch": 418} {"train_loss": -19.378925323486328, "global_step": 34775, "epoch": 418} {"train_loss": -19.130335152867328, "global_step": 34776, "epoch": 418, "val_loss": 6009852.0} {"train_loss": -19.160045623779297, "global_step": 34777, "epoch": 419} {"train_loss": -19.001361846923828, "global_step": 34778, "epoch": 419} {"train_loss": -18.544282913208008, "global_step": 34779, "epoch": 419} {"train_loss": -19.221731185913086, "global_step": 34780, "epoch": 419} {"train_loss": -19.338285446166992, "global_step": 34781, "epoch": 419} {"train_loss": -19.255096435546875, "global_step": 34782, "epoch": 419} {"train_loss": -18.7689151763916, "global_step": 34783, "epoch": 419} {"train_loss": -19.42250633239746, "global_step": 34784, "epoch": 419} {"train_loss": -19.00496482849121, "global_step": 34785, "epoch": 419} {"train_loss": -18.97553062438965, "global_step": 34786, "epoch": 419} {"train_loss": -19.040210723876953, "global_step": 34787, "epoch": 419} {"train_loss": -18.866418838500977, "global_step": 34788, "epoch": 419} {"train_loss": -19.01626968383789, "global_step": 34789, "epoch": 419} {"train_loss": -19.259809494018555, "global_step": 34790, "epoch": 419} {"train_loss": -19.243494033813477, "global_step": 34791, "epoch": 419} {"train_loss": -19.080480575561523, "global_step": 34792, "epoch": 419} {"train_loss": -19.00255584716797, "global_step": 34793, "epoch": 419} {"train_loss": -19.074674606323242, "global_step": 34794, "epoch": 419} {"train_loss": -19.060197830200195, "global_step": 34795, "epoch": 419} {"train_loss": -19.336807250976562, "global_step": 34796, "epoch": 419} {"train_loss": -19.507564544677734, "global_step": 34797, "epoch": 419} {"train_loss": -19.148786544799805, "global_step": 34798, "epoch": 419} {"train_loss": -19.270112991333008, "global_step": 34799, "epoch": 419} {"train_loss": -18.920879364013672, "global_step": 34800, "epoch": 419} {"train_loss": -19.33706283569336, "global_step": 34801, "epoch": 419} {"train_loss": -19.032392501831055, "global_step": 34802, "epoch": 419} {"train_loss": -19.624414443969727, "global_step": 34803, "epoch": 419} {"train_loss": -19.289670944213867, "global_step": 34804, "epoch": 419} {"train_loss": -19.3322696685791, "global_step": 34805, "epoch": 419} {"train_loss": -18.78278160095215, "global_step": 34806, "epoch": 419} {"train_loss": -19.315093994140625, "global_step": 34807, "epoch": 419} {"train_loss": -19.0123348236084, "global_step": 34808, "epoch": 419} {"train_loss": -19.32085609436035, "global_step": 34809, "epoch": 419} {"train_loss": -18.848588943481445, "global_step": 34810, "epoch": 419} {"train_loss": -19.292829513549805, "global_step": 34811, "epoch": 419} {"train_loss": -18.83030891418457, "global_step": 34812, "epoch": 419} {"train_loss": -19.291149139404297, "global_step": 34813, "epoch": 419} {"train_loss": -19.389699935913086, "global_step": 34814, "epoch": 419} {"train_loss": -19.529037475585938, "global_step": 34815, "epoch": 419} {"train_loss": -18.91250228881836, "global_step": 34816, "epoch": 419} {"train_loss": -19.12946891784668, "global_step": 34817, "epoch": 419} {"train_loss": -19.561813354492188, "global_step": 34818, "epoch": 419} {"train_loss": -19.36881446838379, "global_step": 34819, "epoch": 419} {"train_loss": -19.318456649780273, "global_step": 34820, "epoch": 419} {"train_loss": -19.14918327331543, "global_step": 34821, "epoch": 419} {"train_loss": -19.542011260986328, "global_step": 34822, "epoch": 419} {"train_loss": -19.242090225219727, "global_step": 34823, "epoch": 419} {"train_loss": -19.265338897705078, "global_step": 34824, "epoch": 419} {"train_loss": -19.26801300048828, "global_step": 34825, "epoch": 419} {"train_loss": -19.224828720092773, "global_step": 34826, "epoch": 419} {"train_loss": -19.064054489135742, "global_step": 34827, "epoch": 419} {"train_loss": -19.207136154174805, "global_step": 34828, "epoch": 419} {"train_loss": -19.563749313354492, "global_step": 34829, "epoch": 419} {"train_loss": -18.848587036132812, "global_step": 34830, "epoch": 419} {"train_loss": -19.04212760925293, "global_step": 34831, "epoch": 419} {"train_loss": -19.174312591552734, "global_step": 34832, "epoch": 419} {"train_loss": -19.54828453063965, "global_step": 34833, "epoch": 419} {"train_loss": -19.164752960205078, "global_step": 34834, "epoch": 419} {"train_loss": -18.642032623291016, "global_step": 34835, "epoch": 419} {"train_loss": -18.923505783081055, "global_step": 34836, "epoch": 419} {"train_loss": -19.13503646850586, "global_step": 34837, "epoch": 419} {"train_loss": -19.459121704101562, "global_step": 34838, "epoch": 419} {"train_loss": -19.11125373840332, "global_step": 34839, "epoch": 419} {"train_loss": -18.813339233398438, "global_step": 34840, "epoch": 419} {"train_loss": -19.2930850982666, "global_step": 34841, "epoch": 419} {"train_loss": -19.294889450073242, "global_step": 34842, "epoch": 419} {"train_loss": -19.11056900024414, "global_step": 34843, "epoch": 419} {"train_loss": -19.089763641357422, "global_step": 34844, "epoch": 419} {"train_loss": -18.98969268798828, "global_step": 34845, "epoch": 419} {"train_loss": -19.144052505493164, "global_step": 34846, "epoch": 419} {"train_loss": -19.06083869934082, "global_step": 34847, "epoch": 419} {"train_loss": -19.143394470214844, "global_step": 34848, "epoch": 419} {"train_loss": -19.06219482421875, "global_step": 34849, "epoch": 419} {"train_loss": -19.01978874206543, "global_step": 34850, "epoch": 419} {"train_loss": -18.4025821685791, "global_step": 34851, "epoch": 419} {"train_loss": -19.38360023498535, "global_step": 34852, "epoch": 419} {"train_loss": -18.757740020751953, "global_step": 34853, "epoch": 419} {"train_loss": -19.01633644104004, "global_step": 34854, "epoch": 419} {"train_loss": -19.41670799255371, "global_step": 34855, "epoch": 419} {"train_loss": -19.117475509643555, "global_step": 34856, "epoch": 419} {"train_loss": -19.309423446655273, "global_step": 34857, "epoch": 419} {"train_loss": -19.389249801635742, "global_step": 34858, "epoch": 419} {"train_loss": -19.15373719456684, "global_step": 34859, "epoch": 419, "val_loss": 5938414.5} {"train_loss": -19.0296573638916, "global_step": 34860, "epoch": 420} {"train_loss": -19.048328399658203, "global_step": 34861, "epoch": 420} {"train_loss": -18.708152770996094, "global_step": 34862, "epoch": 420} {"train_loss": -18.79718017578125, "global_step": 34863, "epoch": 420} {"train_loss": -19.12019157409668, "global_step": 34864, "epoch": 420} {"train_loss": -19.122915267944336, "global_step": 34865, "epoch": 420} {"train_loss": -19.369245529174805, "global_step": 34866, "epoch": 420} {"train_loss": -19.1339168548584, "global_step": 34867, "epoch": 420} {"train_loss": -19.135772705078125, "global_step": 34868, "epoch": 420} {"train_loss": -19.001285552978516, "global_step": 34869, "epoch": 420} {"train_loss": -19.585071563720703, "global_step": 34870, "epoch": 420} {"train_loss": -18.9798526763916, "global_step": 34871, "epoch": 420} {"train_loss": -19.09315299987793, "global_step": 34872, "epoch": 420} {"train_loss": -19.092361450195312, "global_step": 34873, "epoch": 420} {"train_loss": -19.13814353942871, "global_step": 34874, "epoch": 420} {"train_loss": -19.31022071838379, "global_step": 34875, "epoch": 420} {"train_loss": -18.994413375854492, "global_step": 34876, "epoch": 420} {"train_loss": -19.125194549560547, "global_step": 34877, "epoch": 420} {"train_loss": -19.101123809814453, "global_step": 34878, "epoch": 420} {"train_loss": -19.184593200683594, "global_step": 34879, "epoch": 420} {"train_loss": -19.710926055908203, "global_step": 34880, "epoch": 420} {"train_loss": -19.004331588745117, "global_step": 34881, "epoch": 420} {"train_loss": -19.261938095092773, "global_step": 34882, "epoch": 420} {"train_loss": -19.0444278717041, "global_step": 34883, "epoch": 420} {"train_loss": -19.022022247314453, "global_step": 34884, "epoch": 420} {"train_loss": -19.130380630493164, "global_step": 34885, "epoch": 420} {"train_loss": -19.162967681884766, "global_step": 34886, "epoch": 420} {"train_loss": -19.155933380126953, "global_step": 34887, "epoch": 420} {"train_loss": -19.08396339416504, "global_step": 34888, "epoch": 420} {"train_loss": -19.28790855407715, "global_step": 34889, "epoch": 420} {"train_loss": -19.278308868408203, "global_step": 34890, "epoch": 420} {"train_loss": -19.180784225463867, "global_step": 34891, "epoch": 420} {"train_loss": -19.30379295349121, "global_step": 34892, "epoch": 420} {"train_loss": -19.654296875, "global_step": 34893, "epoch": 420} {"train_loss": -19.019390106201172, "global_step": 34894, "epoch": 420} {"train_loss": -19.172143936157227, "global_step": 34895, "epoch": 420} {"train_loss": -19.660409927368164, "global_step": 34896, "epoch": 420} {"train_loss": -19.282482147216797, "global_step": 34897, "epoch": 420} {"train_loss": -19.20707130432129, "global_step": 34898, "epoch": 420} {"train_loss": -19.256229400634766, "global_step": 34899, "epoch": 420} {"train_loss": -19.34598731994629, "global_step": 34900, "epoch": 420} {"train_loss": -19.55396842956543, "global_step": 34901, "epoch": 420} {"train_loss": -19.376209259033203, "global_step": 34902, "epoch": 420} {"train_loss": -19.303909301757812, "global_step": 34903, "epoch": 420} {"train_loss": -19.23138427734375, "global_step": 34904, "epoch": 420} {"train_loss": -19.025177001953125, "global_step": 34905, "epoch": 420} {"train_loss": -19.28277015686035, "global_step": 34906, "epoch": 420} {"train_loss": -19.089702606201172, "global_step": 34907, "epoch": 420} {"train_loss": -19.259342193603516, "global_step": 34908, "epoch": 420} {"train_loss": -19.506155014038086, "global_step": 34909, "epoch": 420} {"train_loss": -18.8105525970459, "global_step": 34910, "epoch": 420} {"train_loss": -19.295286178588867, "global_step": 34911, "epoch": 420} {"train_loss": -19.033498764038086, "global_step": 34912, "epoch": 420} {"train_loss": -19.265710830688477, "global_step": 34913, "epoch": 420} {"train_loss": -19.03449249267578, "global_step": 34914, "epoch": 420} {"train_loss": -19.27645492553711, "global_step": 34915, "epoch": 420} {"train_loss": -19.136167526245117, "global_step": 34916, "epoch": 420} {"train_loss": -18.95046615600586, "global_step": 34917, "epoch": 420} {"train_loss": -19.491535186767578, "global_step": 34918, "epoch": 420} {"train_loss": -19.357236862182617, "global_step": 34919, "epoch": 420} {"train_loss": -19.068462371826172, "global_step": 34920, "epoch": 420} {"train_loss": -19.37379264831543, "global_step": 34921, "epoch": 420} {"train_loss": -18.92974281311035, "global_step": 34922, "epoch": 420} {"train_loss": -19.170316696166992, "global_step": 34923, "epoch": 420} {"train_loss": -19.022689819335938, "global_step": 34924, "epoch": 420} {"train_loss": -19.357519149780273, "global_step": 34925, "epoch": 420} {"train_loss": -19.0085391998291, "global_step": 34926, "epoch": 420} {"train_loss": -19.334753036499023, "global_step": 34927, "epoch": 420} {"train_loss": -19.26729393005371, "global_step": 34928, "epoch": 420} {"train_loss": -19.11531639099121, "global_step": 34929, "epoch": 420} {"train_loss": -19.2521915435791, "global_step": 34930, "epoch": 420} {"train_loss": -18.91290855407715, "global_step": 34931, "epoch": 420} {"train_loss": -19.260988235473633, "global_step": 34932, "epoch": 420} {"train_loss": -19.373952865600586, "global_step": 34933, "epoch": 420} {"train_loss": -19.145912170410156, "global_step": 34934, "epoch": 420} {"train_loss": -19.1032657623291, "global_step": 34935, "epoch": 420} {"train_loss": -19.37948989868164, "global_step": 34936, "epoch": 420} {"train_loss": -19.301666259765625, "global_step": 34937, "epoch": 420} {"train_loss": -19.28641128540039, "global_step": 34938, "epoch": 420} {"train_loss": -19.467130661010742, "global_step": 34939, "epoch": 420} {"train_loss": -19.535491943359375, "global_step": 34940, "epoch": 420} {"train_loss": -19.016870498657227, "global_step": 34941, "epoch": 420} {"train_loss": -19.195272790380272, "global_step": 34942, "epoch": 420, "val_loss": 6013659.5} {"train_loss": -18.791975021362305, "global_step": 34943, "epoch": 421} {"train_loss": -18.814685821533203, "global_step": 34944, "epoch": 421} {"train_loss": -19.234777450561523, "global_step": 34945, "epoch": 421} {"train_loss": -18.85262107849121, "global_step": 34946, "epoch": 421} {"train_loss": -19.220312118530273, "global_step": 34947, "epoch": 421} {"train_loss": -19.14919090270996, "global_step": 34948, "epoch": 421} {"train_loss": -19.002408981323242, "global_step": 34949, "epoch": 421} {"train_loss": -19.380285263061523, "global_step": 34950, "epoch": 421} {"train_loss": -19.321704864501953, "global_step": 34951, "epoch": 421} {"train_loss": -19.480894088745117, "global_step": 34952, "epoch": 421} {"train_loss": -19.073850631713867, "global_step": 34953, "epoch": 421} {"train_loss": -19.01922607421875, "global_step": 34954, "epoch": 421} {"train_loss": -18.841909408569336, "global_step": 34955, "epoch": 421} {"train_loss": -18.966753005981445, "global_step": 34956, "epoch": 421} {"train_loss": -19.193635940551758, "global_step": 34957, "epoch": 421} {"train_loss": -18.845979690551758, "global_step": 34958, "epoch": 421} {"train_loss": -19.37567138671875, "global_step": 34959, "epoch": 421} {"train_loss": -19.381122589111328, "global_step": 34960, "epoch": 421} {"train_loss": -18.886869430541992, "global_step": 34961, "epoch": 421} {"train_loss": -19.243104934692383, "global_step": 34962, "epoch": 421} {"train_loss": -19.107318878173828, "global_step": 34963, "epoch": 421} {"train_loss": -19.50421142578125, "global_step": 34964, "epoch": 421} {"train_loss": -19.222692489624023, "global_step": 34965, "epoch": 421} {"train_loss": -19.12972640991211, "global_step": 34966, "epoch": 421} {"train_loss": -19.27876091003418, "global_step": 34967, "epoch": 421} {"train_loss": -19.2030086517334, "global_step": 34968, "epoch": 421} {"train_loss": -18.87251091003418, "global_step": 34969, "epoch": 421} {"train_loss": -19.104717254638672, "global_step": 34970, "epoch": 421} {"train_loss": -19.1444034576416, "global_step": 34971, "epoch": 421} {"train_loss": -19.42983055114746, "global_step": 34972, "epoch": 421} {"train_loss": -19.19791030883789, "global_step": 34973, "epoch": 421} {"train_loss": -19.161916732788086, "global_step": 34974, "epoch": 421} {"train_loss": -19.1606388092041, "global_step": 34975, "epoch": 421} {"train_loss": -19.422943115234375, "global_step": 34976, "epoch": 421} {"train_loss": -19.53431510925293, "global_step": 34977, "epoch": 421} {"train_loss": -19.13207244873047, "global_step": 34978, "epoch": 421} {"train_loss": -19.41684913635254, "global_step": 34979, "epoch": 421} {"train_loss": -19.44330596923828, "global_step": 34980, "epoch": 421} {"train_loss": -19.638193130493164, "global_step": 34981, "epoch": 421} {"train_loss": -19.160303115844727, "global_step": 34982, "epoch": 421} {"train_loss": -19.34052085876465, "global_step": 34983, "epoch": 421} {"train_loss": -19.222692489624023, "global_step": 34984, "epoch": 421} {"train_loss": -19.100561141967773, "global_step": 34985, "epoch": 421} {"train_loss": -18.959251403808594, "global_step": 34986, "epoch": 421} {"train_loss": -19.6688232421875, "global_step": 34987, "epoch": 421} {"train_loss": -18.799901962280273, "global_step": 34988, "epoch": 421} {"train_loss": -18.910959243774414, "global_step": 34989, "epoch": 421} {"train_loss": -19.2032413482666, "global_step": 34990, "epoch": 421} {"train_loss": -19.057819366455078, "global_step": 34991, "epoch": 421} {"train_loss": -19.567228317260742, "global_step": 34992, "epoch": 421} {"train_loss": -19.1348876953125, "global_step": 34993, "epoch": 421} {"train_loss": -19.266311645507812, "global_step": 34994, "epoch": 421} {"train_loss": -19.08455467224121, "global_step": 34995, "epoch": 421} {"train_loss": -19.281248092651367, "global_step": 34996, "epoch": 421} {"train_loss": -19.271656036376953, "global_step": 34997, "epoch": 421} {"train_loss": -19.401329040527344, "global_step": 34998, "epoch": 421} {"train_loss": -19.040760040283203, "global_step": 34999, "epoch": 421} {"train_loss": -19.202489852905273, "global_step": 35000, "epoch": 421} {"train_loss": -19.388446807861328, "global_step": 35001, "epoch": 421} {"train_loss": -18.891080856323242, "global_step": 35002, "epoch": 421} {"train_loss": -19.041593551635742, "global_step": 35003, "epoch": 421} {"train_loss": -19.46331214904785, "global_step": 35004, "epoch": 421} {"train_loss": -18.938030242919922, "global_step": 35005, "epoch": 421} {"train_loss": -19.252790451049805, "global_step": 35006, "epoch": 421} {"train_loss": -19.662094116210938, "global_step": 35007, "epoch": 421} {"train_loss": -19.2647762298584, "global_step": 35008, "epoch": 421} {"train_loss": -18.892000198364258, "global_step": 35009, "epoch": 421} {"train_loss": -19.184995651245117, "global_step": 35010, "epoch": 421} {"train_loss": -18.940649032592773, "global_step": 35011, "epoch": 421} {"train_loss": -19.14848518371582, "global_step": 35012, "epoch": 421} {"train_loss": -19.808263778686523, "global_step": 35013, "epoch": 421} {"train_loss": -19.40667724609375, "global_step": 35014, "epoch": 421} {"train_loss": -19.222936630249023, "global_step": 35015, "epoch": 421} {"train_loss": -19.448314666748047, "global_step": 35016, "epoch": 421} {"train_loss": -19.133068084716797, "global_step": 35017, "epoch": 421} {"train_loss": -19.223722457885742, "global_step": 35018, "epoch": 421} {"train_loss": -18.987350463867188, "global_step": 35019, "epoch": 421} {"train_loss": -19.390331268310547, "global_step": 35020, "epoch": 421} {"train_loss": -19.294416427612305, "global_step": 35021, "epoch": 421} {"train_loss": -19.300601959228516, "global_step": 35022, "epoch": 421} {"train_loss": -19.563337326049805, "global_step": 35023, "epoch": 421} {"train_loss": -19.1331787109375, "global_step": 35024, "epoch": 421} {"train_loss": -19.20893331320889, "global_step": 35025, "epoch": 421, "val_loss": 6038106.0} {"train_loss": -18.489105224609375, "global_step": 35026, "epoch": 422} {"train_loss": -19.0893611907959, "global_step": 35027, "epoch": 422} {"train_loss": -19.104230880737305, "global_step": 35028, "epoch": 422} {"train_loss": -18.963016510009766, "global_step": 35029, "epoch": 422} {"train_loss": -18.669795989990234, "global_step": 35030, "epoch": 422} {"train_loss": -18.88749885559082, "global_step": 35031, "epoch": 422} {"train_loss": -19.0542049407959, "global_step": 35032, "epoch": 422} {"train_loss": -19.133590698242188, "global_step": 35033, "epoch": 422} {"train_loss": -19.149127960205078, "global_step": 35034, "epoch": 422} {"train_loss": -19.2664852142334, "global_step": 35035, "epoch": 422} {"train_loss": -19.104780197143555, "global_step": 35036, "epoch": 422} {"train_loss": -19.20288848876953, "global_step": 35037, "epoch": 422} {"train_loss": -19.129613876342773, "global_step": 35038, "epoch": 422} {"train_loss": -18.998014450073242, "global_step": 35039, "epoch": 422} {"train_loss": -19.32440757751465, "global_step": 35040, "epoch": 422} {"train_loss": -19.20061492919922, "global_step": 35041, "epoch": 422} {"train_loss": -19.156930923461914, "global_step": 35042, "epoch": 422} {"train_loss": -19.027780532836914, "global_step": 35043, "epoch": 422} {"train_loss": -19.073843002319336, "global_step": 35044, "epoch": 422} {"train_loss": -18.967540740966797, "global_step": 35045, "epoch": 422} {"train_loss": -19.42329216003418, "global_step": 35046, "epoch": 422} {"train_loss": -19.610309600830078, "global_step": 35047, "epoch": 422} {"train_loss": -19.208738327026367, "global_step": 35048, "epoch": 422} {"train_loss": -19.25478172302246, "global_step": 35049, "epoch": 422} {"train_loss": -19.120718002319336, "global_step": 35050, "epoch": 422} {"train_loss": -19.23240852355957, "global_step": 35051, "epoch": 422} {"train_loss": -18.732608795166016, "global_step": 35052, "epoch": 422} {"train_loss": -19.32597541809082, "global_step": 35053, "epoch": 422} {"train_loss": -19.0271053314209, "global_step": 35054, "epoch": 422} {"train_loss": -19.078855514526367, "global_step": 35055, "epoch": 422} {"train_loss": -19.443601608276367, "global_step": 35056, "epoch": 422} {"train_loss": -19.157089233398438, "global_step": 35057, "epoch": 422} {"train_loss": -18.895431518554688, "global_step": 35058, "epoch": 422} {"train_loss": -19.112319946289062, "global_step": 35059, "epoch": 422} {"train_loss": -19.347288131713867, "global_step": 35060, "epoch": 422} {"train_loss": -19.413105010986328, "global_step": 35061, "epoch": 422} {"train_loss": -19.539697647094727, "global_step": 35062, "epoch": 422} {"train_loss": -19.100339889526367, "global_step": 35063, "epoch": 422} {"train_loss": -19.38422203063965, "global_step": 35064, "epoch": 422} {"train_loss": -19.283048629760742, "global_step": 35065, "epoch": 422} {"train_loss": -19.343542098999023, "global_step": 35066, "epoch": 422} {"train_loss": -19.185083389282227, "global_step": 35067, "epoch": 422} {"train_loss": -18.939870834350586, "global_step": 35068, "epoch": 422} {"train_loss": -19.284337997436523, "global_step": 35069, "epoch": 422} {"train_loss": -18.912572860717773, "global_step": 35070, "epoch": 422} {"train_loss": -19.165863037109375, "global_step": 35071, "epoch": 422} {"train_loss": -19.47706413269043, "global_step": 35072, "epoch": 422} {"train_loss": -19.091625213623047, "global_step": 35073, "epoch": 422} {"train_loss": -19.703962326049805, "global_step": 35074, "epoch": 422} {"train_loss": -19.191625595092773, "global_step": 35075, "epoch": 422} {"train_loss": -19.2789249420166, "global_step": 35076, "epoch": 422} {"train_loss": -19.067626953125, "global_step": 35077, "epoch": 422} {"train_loss": -18.88051414489746, "global_step": 35078, "epoch": 422} {"train_loss": -19.398962020874023, "global_step": 35079, "epoch": 422} {"train_loss": -18.924665451049805, "global_step": 35080, "epoch": 422} {"train_loss": -19.2164363861084, "global_step": 35081, "epoch": 422} {"train_loss": -18.942798614501953, "global_step": 35082, "epoch": 422} {"train_loss": -19.2482852935791, "global_step": 35083, "epoch": 422} {"train_loss": -19.33235740661621, "global_step": 35084, "epoch": 422} {"train_loss": -19.052282333374023, "global_step": 35085, "epoch": 422} {"train_loss": -19.448867797851562, "global_step": 35086, "epoch": 422} {"train_loss": -18.963903427124023, "global_step": 35087, "epoch": 422} {"train_loss": -18.95712661743164, "global_step": 35088, "epoch": 422} {"train_loss": -19.58133316040039, "global_step": 35089, "epoch": 422} {"train_loss": -18.933324813842773, "global_step": 35090, "epoch": 422} {"train_loss": -19.0264835357666, "global_step": 35091, "epoch": 422} {"train_loss": -19.272159576416016, "global_step": 35092, "epoch": 422} {"train_loss": -19.106040954589844, "global_step": 35093, "epoch": 422} {"train_loss": -19.255962371826172, "global_step": 35094, "epoch": 422} {"train_loss": -19.292377471923828, "global_step": 35095, "epoch": 422} {"train_loss": -19.175832748413086, "global_step": 35096, "epoch": 422} {"train_loss": -19.051639556884766, "global_step": 35097, "epoch": 422} {"train_loss": -19.040451049804688, "global_step": 35098, "epoch": 422} {"train_loss": -19.332700729370117, "global_step": 35099, "epoch": 422} {"train_loss": -19.00715446472168, "global_step": 35100, "epoch": 422} {"train_loss": -19.085538864135742, "global_step": 35101, "epoch": 422} {"train_loss": -19.319955825805664, "global_step": 35102, "epoch": 422} {"train_loss": -19.494430541992188, "global_step": 35103, "epoch": 422} {"train_loss": -19.245180130004883, "global_step": 35104, "epoch": 422} {"train_loss": -19.089078903198242, "global_step": 35105, "epoch": 422} {"train_loss": -19.090993881225586, "global_step": 35106, "epoch": 422} {"train_loss": -19.1240177154541, "global_step": 35107, "epoch": 422} {"train_loss": -19.15329032346427, "global_step": 35108, "epoch": 422, "val_loss": 5872797.0} {"train_loss": -18.943384170532227, "global_step": 35109, "epoch": 423} {"train_loss": -18.507680892944336, "global_step": 35110, "epoch": 423} {"train_loss": -18.72566795349121, "global_step": 35111, "epoch": 423} {"train_loss": -19.362356185913086, "global_step": 35112, "epoch": 423} {"train_loss": -19.242124557495117, "global_step": 35113, "epoch": 423} {"train_loss": -18.835073471069336, "global_step": 35114, "epoch": 423} {"train_loss": -18.956729888916016, "global_step": 35115, "epoch": 423} {"train_loss": -18.77083969116211, "global_step": 35116, "epoch": 423} {"train_loss": -19.242902755737305, "global_step": 35117, "epoch": 423} {"train_loss": -19.131179809570312, "global_step": 35118, "epoch": 423} {"train_loss": -18.871742248535156, "global_step": 35119, "epoch": 423} {"train_loss": -18.774890899658203, "global_step": 35120, "epoch": 423} {"train_loss": -19.32294273376465, "global_step": 35121, "epoch": 423} {"train_loss": -19.138456344604492, "global_step": 35122, "epoch": 423} {"train_loss": -19.346967697143555, "global_step": 35123, "epoch": 423} {"train_loss": -18.974733352661133, "global_step": 35124, "epoch": 423} {"train_loss": -19.223051071166992, "global_step": 35125, "epoch": 423} {"train_loss": -19.1090030670166, "global_step": 35126, "epoch": 423} {"train_loss": -19.1428165435791, "global_step": 35127, "epoch": 423} {"train_loss": -19.20479393005371, "global_step": 35128, "epoch": 423} {"train_loss": -19.203886032104492, "global_step": 35129, "epoch": 423} {"train_loss": -19.428531646728516, "global_step": 35130, "epoch": 423} {"train_loss": -19.12384605407715, "global_step": 35131, "epoch": 423} {"train_loss": -18.99103546142578, "global_step": 35132, "epoch": 423} {"train_loss": -19.245254516601562, "global_step": 35133, "epoch": 423} {"train_loss": -19.158674240112305, "global_step": 35134, "epoch": 423} {"train_loss": -18.87311363220215, "global_step": 35135, "epoch": 423} {"train_loss": -19.100101470947266, "global_step": 35136, "epoch": 423} {"train_loss": -19.17099952697754, "global_step": 35137, "epoch": 423} {"train_loss": -18.934890747070312, "global_step": 35138, "epoch": 423} {"train_loss": -19.195331573486328, "global_step": 35139, "epoch": 423} {"train_loss": -19.62907600402832, "global_step": 35140, "epoch": 423} {"train_loss": -19.336759567260742, "global_step": 35141, "epoch": 423} {"train_loss": -19.27925682067871, "global_step": 35142, "epoch": 423} {"train_loss": -19.331693649291992, "global_step": 35143, "epoch": 423} {"train_loss": -19.17506980895996, "global_step": 35144, "epoch": 423} {"train_loss": -19.15620231628418, "global_step": 35145, "epoch": 423} {"train_loss": -19.326488494873047, "global_step": 35146, "epoch": 423} {"train_loss": -19.496295928955078, "global_step": 35147, "epoch": 423} {"train_loss": -19.150405883789062, "global_step": 35148, "epoch": 423} {"train_loss": -19.306928634643555, "global_step": 35149, "epoch": 423} {"train_loss": -19.330154418945312, "global_step": 35150, "epoch": 423} {"train_loss": -19.52569580078125, "global_step": 35151, "epoch": 423} {"train_loss": -19.02338409423828, "global_step": 35152, "epoch": 423} {"train_loss": -18.967548370361328, "global_step": 35153, "epoch": 423} {"train_loss": -19.37095069885254, "global_step": 35154, "epoch": 423} {"train_loss": -19.009977340698242, "global_step": 35155, "epoch": 423} {"train_loss": -19.30641746520996, "global_step": 35156, "epoch": 423} {"train_loss": -19.521060943603516, "global_step": 35157, "epoch": 423} {"train_loss": -19.202072143554688, "global_step": 35158, "epoch": 423} {"train_loss": -19.151111602783203, "global_step": 35159, "epoch": 423} {"train_loss": -19.47071647644043, "global_step": 35160, "epoch": 423} {"train_loss": -19.078855514526367, "global_step": 35161, "epoch": 423} {"train_loss": -19.517547607421875, "global_step": 35162, "epoch": 423} {"train_loss": -19.40293312072754, "global_step": 35163, "epoch": 423} {"train_loss": -19.159854888916016, "global_step": 35164, "epoch": 423} {"train_loss": -19.296960830688477, "global_step": 35165, "epoch": 423} {"train_loss": -19.224308013916016, "global_step": 35166, "epoch": 423} {"train_loss": -19.361820220947266, "global_step": 35167, "epoch": 423} {"train_loss": -19.24072265625, "global_step": 35168, "epoch": 423} {"train_loss": -19.36701011657715, "global_step": 35169, "epoch": 423} {"train_loss": -19.442005157470703, "global_step": 35170, "epoch": 423} {"train_loss": -19.24808692932129, "global_step": 35171, "epoch": 423} {"train_loss": -19.017526626586914, "global_step": 35172, "epoch": 423} {"train_loss": -19.207754135131836, "global_step": 35173, "epoch": 423} {"train_loss": -19.105152130126953, "global_step": 35174, "epoch": 423} {"train_loss": -18.72443962097168, "global_step": 35175, "epoch": 423} {"train_loss": -19.395185470581055, "global_step": 35176, "epoch": 423} {"train_loss": -19.132862091064453, "global_step": 35177, "epoch": 423} {"train_loss": -18.97651481628418, "global_step": 35178, "epoch": 423} {"train_loss": -18.798479080200195, "global_step": 35179, "epoch": 423} {"train_loss": -19.34954833984375, "global_step": 35180, "epoch": 423} {"train_loss": -19.34970474243164, "global_step": 35181, "epoch": 423} {"train_loss": -18.68939208984375, "global_step": 35182, "epoch": 423} {"train_loss": -19.045034408569336, "global_step": 35183, "epoch": 423} {"train_loss": -19.122329711914062, "global_step": 35184, "epoch": 423} {"train_loss": -19.232282638549805, "global_step": 35185, "epoch": 423} {"train_loss": -19.20285987854004, "global_step": 35186, "epoch": 423} {"train_loss": -19.216339111328125, "global_step": 35187, "epoch": 423} {"train_loss": -18.987401962280273, "global_step": 35188, "epoch": 423} {"train_loss": -18.987943649291992, "global_step": 35189, "epoch": 423} {"train_loss": -18.772897720336914, "global_step": 35190, "epoch": 423} {"train_loss": -19.173011481043805, "global_step": 35191, "epoch": 423, "val_loss": 6058602.0} {"train_loss": -18.926267623901367, "global_step": 35192, "epoch": 424} {"train_loss": -19.15423583984375, "global_step": 35193, "epoch": 424} {"train_loss": -18.728384017944336, "global_step": 35194, "epoch": 424} {"train_loss": -19.227176666259766, "global_step": 35195, "epoch": 424} {"train_loss": -19.33304214477539, "global_step": 35196, "epoch": 424} {"train_loss": -19.29638671875, "global_step": 35197, "epoch": 424} {"train_loss": -19.099790573120117, "global_step": 35198, "epoch": 424} {"train_loss": -19.03460693359375, "global_step": 35199, "epoch": 424} {"train_loss": -19.14381217956543, "global_step": 35200, "epoch": 424} {"train_loss": -19.162382125854492, "global_step": 35201, "epoch": 424} {"train_loss": -18.976642608642578, "global_step": 35202, "epoch": 424} {"train_loss": -18.842487335205078, "global_step": 35203, "epoch": 424} {"train_loss": -19.476045608520508, "global_step": 35204, "epoch": 424} {"train_loss": -18.71860694885254, "global_step": 35205, "epoch": 424} {"train_loss": -19.068538665771484, "global_step": 35206, "epoch": 424} {"train_loss": -19.15474510192871, "global_step": 35207, "epoch": 424} {"train_loss": -19.087936401367188, "global_step": 35208, "epoch": 424} {"train_loss": -19.235380172729492, "global_step": 35209, "epoch": 424} {"train_loss": -19.178537368774414, "global_step": 35210, "epoch": 424} {"train_loss": -19.4262752532959, "global_step": 35211, "epoch": 424} {"train_loss": -19.27167320251465, "global_step": 35212, "epoch": 424} {"train_loss": -18.993061065673828, "global_step": 35213, "epoch": 424} {"train_loss": -19.04265594482422, "global_step": 35214, "epoch": 424} {"train_loss": -19.287960052490234, "global_step": 35215, "epoch": 424} {"train_loss": -19.279556274414062, "global_step": 35216, "epoch": 424} {"train_loss": -19.1480712890625, "global_step": 35217, "epoch": 424} {"train_loss": -19.52162742614746, "global_step": 35218, "epoch": 424} {"train_loss": -19.464445114135742, "global_step": 35219, "epoch": 424} {"train_loss": -19.395156860351562, "global_step": 35220, "epoch": 424} {"train_loss": -19.19257354736328, "global_step": 35221, "epoch": 424} {"train_loss": -19.421125411987305, "global_step": 35222, "epoch": 424} {"train_loss": -19.297870635986328, "global_step": 35223, "epoch": 424} {"train_loss": -19.423444747924805, "global_step": 35224, "epoch": 424} {"train_loss": -19.333585739135742, "global_step": 35225, "epoch": 424} {"train_loss": -19.078229904174805, "global_step": 35226, "epoch": 424} {"train_loss": -19.429096221923828, "global_step": 35227, "epoch": 424} {"train_loss": -19.225467681884766, "global_step": 35228, "epoch": 424} {"train_loss": -18.984773635864258, "global_step": 35229, "epoch": 424} {"train_loss": -19.292808532714844, "global_step": 35230, "epoch": 424} {"train_loss": -19.316282272338867, "global_step": 35231, "epoch": 424} {"train_loss": -18.99944496154785, "global_step": 35232, "epoch": 424} {"train_loss": -19.043485641479492, "global_step": 35233, "epoch": 424} {"train_loss": -19.457950592041016, "global_step": 35234, "epoch": 424} {"train_loss": -19.035892486572266, "global_step": 35235, "epoch": 424} {"train_loss": -19.267715454101562, "global_step": 35236, "epoch": 424} {"train_loss": -18.8906192779541, "global_step": 35237, "epoch": 424} {"train_loss": -19.287425994873047, "global_step": 35238, "epoch": 424} {"train_loss": -19.08582305908203, "global_step": 35239, "epoch": 424} {"train_loss": -19.28681182861328, "global_step": 35240, "epoch": 424} {"train_loss": -19.33051300048828, "global_step": 35241, "epoch": 424} {"train_loss": -19.143430709838867, "global_step": 35242, "epoch": 424} {"train_loss": -19.241857528686523, "global_step": 35243, "epoch": 424} {"train_loss": -19.1785945892334, "global_step": 35244, "epoch": 424} {"train_loss": -19.34334945678711, "global_step": 35245, "epoch": 424} {"train_loss": -19.42087745666504, "global_step": 35246, "epoch": 424} {"train_loss": -19.110321044921875, "global_step": 35247, "epoch": 424} {"train_loss": -19.308589935302734, "global_step": 35248, "epoch": 424} {"train_loss": -19.27065086364746, "global_step": 35249, "epoch": 424} {"train_loss": -19.571828842163086, "global_step": 35250, "epoch": 424} {"train_loss": -19.186477661132812, "global_step": 35251, "epoch": 424} {"train_loss": -19.209020614624023, "global_step": 35252, "epoch": 424} {"train_loss": -19.238615036010742, "global_step": 35253, "epoch": 424} {"train_loss": -19.09523582458496, "global_step": 35254, "epoch": 424} {"train_loss": -19.292356491088867, "global_step": 35255, "epoch": 424} {"train_loss": -19.157751083374023, "global_step": 35256, "epoch": 424} {"train_loss": -18.994382858276367, "global_step": 35257, "epoch": 424} {"train_loss": -19.435585021972656, "global_step": 35258, "epoch": 424} {"train_loss": -19.099828720092773, "global_step": 35259, "epoch": 424} {"train_loss": -19.195682525634766, "global_step": 35260, "epoch": 424} {"train_loss": -18.685956954956055, "global_step": 35261, "epoch": 424} {"train_loss": -19.1606388092041, "global_step": 35262, "epoch": 424} {"train_loss": -19.094968795776367, "global_step": 35263, "epoch": 424} {"train_loss": -19.000186920166016, "global_step": 35264, "epoch": 424} {"train_loss": -19.149688720703125, "global_step": 35265, "epoch": 424} {"train_loss": -18.939237594604492, "global_step": 35266, "epoch": 424} {"train_loss": -18.94019889831543, "global_step": 35267, "epoch": 424} {"train_loss": -18.978788375854492, "global_step": 35268, "epoch": 424} {"train_loss": -19.148746490478516, "global_step": 35269, "epoch": 424} {"train_loss": -18.832040786743164, "global_step": 35270, "epoch": 424} {"train_loss": -18.84473991394043, "global_step": 35271, "epoch": 424} {"train_loss": -19.019643783569336, "global_step": 35272, "epoch": 424} {"train_loss": -19.174671173095703, "global_step": 35273, "epoch": 424} {"train_loss": -19.17765304841191, "global_step": 35274, "epoch": 424, "val_loss": 6052528.0} {"train_loss": -18.793134689331055, "global_step": 35275, "epoch": 425} {"train_loss": -19.361494064331055, "global_step": 35276, "epoch": 425} {"train_loss": -19.167068481445312, "global_step": 35277, "epoch": 425} {"train_loss": -19.454668045043945, "global_step": 35278, "epoch": 425} {"train_loss": -18.9012451171875, "global_step": 35279, "epoch": 425} {"train_loss": -19.04465103149414, "global_step": 35280, "epoch": 425} {"train_loss": -19.518735885620117, "global_step": 35281, "epoch": 425} {"train_loss": -19.349714279174805, "global_step": 35282, "epoch": 425} {"train_loss": -19.026403427124023, "global_step": 35283, "epoch": 425} {"train_loss": -18.90835952758789, "global_step": 35284, "epoch": 425} {"train_loss": -19.0305118560791, "global_step": 35285, "epoch": 425} {"train_loss": -19.23483657836914, "global_step": 35286, "epoch": 425} {"train_loss": -19.209842681884766, "global_step": 35287, "epoch": 425} {"train_loss": -19.156991958618164, "global_step": 35288, "epoch": 425} {"train_loss": -19.14057731628418, "global_step": 35289, "epoch": 425} {"train_loss": -19.117109298706055, "global_step": 35290, "epoch": 425} {"train_loss": -19.02619171142578, "global_step": 35291, "epoch": 425} {"train_loss": -19.012882232666016, "global_step": 35292, "epoch": 425} {"train_loss": -19.12045669555664, "global_step": 35293, "epoch": 425} {"train_loss": -18.83481216430664, "global_step": 35294, "epoch": 425} {"train_loss": -19.348854064941406, "global_step": 35295, "epoch": 425} {"train_loss": -18.87086296081543, "global_step": 35296, "epoch": 425} {"train_loss": -19.022756576538086, "global_step": 35297, "epoch": 425} {"train_loss": -19.17323112487793, "global_step": 35298, "epoch": 425} {"train_loss": -18.9841251373291, "global_step": 35299, "epoch": 425} {"train_loss": -19.012706756591797, "global_step": 35300, "epoch": 425} {"train_loss": -19.257158279418945, "global_step": 35301, "epoch": 425} {"train_loss": -18.71449851989746, "global_step": 35302, "epoch": 425} {"train_loss": -19.45901870727539, "global_step": 35303, "epoch": 425} {"train_loss": -19.03389549255371, "global_step": 35304, "epoch": 425} {"train_loss": -19.36463737487793, "global_step": 35305, "epoch": 425} {"train_loss": -19.298906326293945, "global_step": 35306, "epoch": 425} {"train_loss": -19.06110954284668, "global_step": 35307, "epoch": 425} {"train_loss": -19.194211959838867, "global_step": 35308, "epoch": 425} {"train_loss": -19.31517791748047, "global_step": 35309, "epoch": 425} {"train_loss": -19.00848388671875, "global_step": 35310, "epoch": 425} {"train_loss": -19.270795822143555, "global_step": 35311, "epoch": 425} {"train_loss": -19.022066116333008, "global_step": 35312, "epoch": 425} {"train_loss": -19.346261978149414, "global_step": 35313, "epoch": 425} {"train_loss": -19.290658950805664, "global_step": 35314, "epoch": 425} {"train_loss": -19.3917236328125, "global_step": 35315, "epoch": 425} {"train_loss": -19.098224639892578, "global_step": 35316, "epoch": 425} {"train_loss": -19.26328468322754, "global_step": 35317, "epoch": 425} {"train_loss": -19.23555564880371, "global_step": 35318, "epoch": 425} {"train_loss": -19.321800231933594, "global_step": 35319, "epoch": 425} {"train_loss": -18.998693466186523, "global_step": 35320, "epoch": 425} {"train_loss": -19.513042449951172, "global_step": 35321, "epoch": 425} {"train_loss": -19.10932731628418, "global_step": 35322, "epoch": 425} {"train_loss": -19.36090087890625, "global_step": 35323, "epoch": 425} {"train_loss": -19.47414779663086, "global_step": 35324, "epoch": 425} {"train_loss": -19.500301361083984, "global_step": 35325, "epoch": 425} {"train_loss": -19.588951110839844, "global_step": 35326, "epoch": 425} {"train_loss": -19.091398239135742, "global_step": 35327, "epoch": 425} {"train_loss": -19.413043975830078, "global_step": 35328, "epoch": 425} {"train_loss": -19.35978126525879, "global_step": 35329, "epoch": 425} {"train_loss": -19.078662872314453, "global_step": 35330, "epoch": 425} {"train_loss": -19.1429500579834, "global_step": 35331, "epoch": 425} {"train_loss": -19.386476516723633, "global_step": 35332, "epoch": 425} {"train_loss": -19.244976043701172, "global_step": 35333, "epoch": 425} {"train_loss": -19.32607078552246, "global_step": 35334, "epoch": 425} {"train_loss": -18.815916061401367, "global_step": 35335, "epoch": 425} {"train_loss": -19.21380043029785, "global_step": 35336, "epoch": 425} {"train_loss": -19.511526107788086, "global_step": 35337, "epoch": 425} {"train_loss": -19.064197540283203, "global_step": 35338, "epoch": 425} {"train_loss": -19.430234909057617, "global_step": 35339, "epoch": 425} {"train_loss": -19.14198875427246, "global_step": 35340, "epoch": 425} {"train_loss": -19.53834342956543, "global_step": 35341, "epoch": 425} {"train_loss": -19.286027908325195, "global_step": 35342, "epoch": 425} {"train_loss": -18.959455490112305, "global_step": 35343, "epoch": 425} {"train_loss": -19.114093780517578, "global_step": 35344, "epoch": 425} {"train_loss": -19.472061157226562, "global_step": 35345, "epoch": 425} {"train_loss": -19.300779342651367, "global_step": 35346, "epoch": 425} {"train_loss": -18.92301368713379, "global_step": 35347, "epoch": 425} {"train_loss": -19.627744674682617, "global_step": 35348, "epoch": 425} {"train_loss": -19.28937339782715, "global_step": 35349, "epoch": 425} {"train_loss": -19.296567916870117, "global_step": 35350, "epoch": 425} {"train_loss": -18.972253799438477, "global_step": 35351, "epoch": 425} {"train_loss": -19.40196418762207, "global_step": 35352, "epoch": 425} {"train_loss": -19.25360107421875, "global_step": 35353, "epoch": 425} {"train_loss": -19.39875602722168, "global_step": 35354, "epoch": 425} {"train_loss": -19.09638214111328, "global_step": 35355, "epoch": 425} {"train_loss": -18.763946533203125, "global_step": 35356, "epoch": 425} {"train_loss": -19.176534721650274, "global_step": 35357, "epoch": 425, "val_loss": 6060594.0} {"train_loss": -19.20722007751465, "global_step": 35358, "epoch": 426} {"train_loss": -18.984127044677734, "global_step": 35359, "epoch": 426} {"train_loss": -19.031034469604492, "global_step": 35360, "epoch": 426} {"train_loss": -19.009023666381836, "global_step": 35361, "epoch": 426} {"train_loss": -19.282291412353516, "global_step": 35362, "epoch": 426} {"train_loss": -18.99283218383789, "global_step": 35363, "epoch": 426} {"train_loss": -18.94635581970215, "global_step": 35364, "epoch": 426} {"train_loss": -19.6325626373291, "global_step": 35365, "epoch": 426} {"train_loss": -19.027891159057617, "global_step": 35366, "epoch": 426} {"train_loss": -19.014493942260742, "global_step": 35367, "epoch": 426} {"train_loss": -19.060787200927734, "global_step": 35368, "epoch": 426} {"train_loss": -18.83028221130371, "global_step": 35369, "epoch": 426} {"train_loss": -18.814937591552734, "global_step": 35370, "epoch": 426} {"train_loss": -19.1989688873291, "global_step": 35371, "epoch": 426} {"train_loss": -19.419044494628906, "global_step": 35372, "epoch": 426} {"train_loss": -18.982316970825195, "global_step": 35373, "epoch": 426} {"train_loss": -19.06368637084961, "global_step": 35374, "epoch": 426} {"train_loss": -19.557205200195312, "global_step": 35375, "epoch": 426} {"train_loss": -18.94267463684082, "global_step": 35376, "epoch": 426} {"train_loss": -19.30131721496582, "global_step": 35377, "epoch": 426} {"train_loss": -19.656232833862305, "global_step": 35378, "epoch": 426} {"train_loss": -19.23069190979004, "global_step": 35379, "epoch": 426} {"train_loss": -19.224966049194336, "global_step": 35380, "epoch": 426} {"train_loss": -19.554685592651367, "global_step": 35381, "epoch": 426} {"train_loss": -18.86954116821289, "global_step": 35382, "epoch": 426} {"train_loss": -19.060230255126953, "global_step": 35383, "epoch": 426} {"train_loss": -19.22159767150879, "global_step": 35384, "epoch": 426} {"train_loss": -18.81235122680664, "global_step": 35385, "epoch": 426} {"train_loss": -19.127216339111328, "global_step": 35386, "epoch": 426} {"train_loss": -19.145362854003906, "global_step": 35387, "epoch": 426} {"train_loss": -19.509511947631836, "global_step": 35388, "epoch": 426} {"train_loss": -19.248695373535156, "global_step": 35389, "epoch": 426} {"train_loss": -19.48636817932129, "global_step": 35390, "epoch": 426} {"train_loss": -19.34334373474121, "global_step": 35391, "epoch": 426} {"train_loss": -18.924962997436523, "global_step": 35392, "epoch": 426} {"train_loss": -19.15052604675293, "global_step": 35393, "epoch": 426} {"train_loss": -19.27191734313965, "global_step": 35394, "epoch": 426} {"train_loss": -19.224855422973633, "global_step": 35395, "epoch": 426} {"train_loss": -19.068313598632812, "global_step": 35396, "epoch": 426} {"train_loss": -19.313901901245117, "global_step": 35397, "epoch": 426} {"train_loss": -19.112667083740234, "global_step": 35398, "epoch": 426} {"train_loss": -19.528892517089844, "global_step": 35399, "epoch": 426} {"train_loss": -19.04230308532715, "global_step": 35400, "epoch": 426} {"train_loss": -19.209665298461914, "global_step": 35401, "epoch": 426} {"train_loss": -19.217880249023438, "global_step": 35402, "epoch": 426} {"train_loss": -19.09885025024414, "global_step": 35403, "epoch": 426} {"train_loss": -19.1626033782959, "global_step": 35404, "epoch": 426} {"train_loss": -18.975679397583008, "global_step": 35405, "epoch": 426} {"train_loss": -19.091230392456055, "global_step": 35406, "epoch": 426} {"train_loss": -19.383350372314453, "global_step": 35407, "epoch": 426} {"train_loss": -19.1629581451416, "global_step": 35408, "epoch": 426} {"train_loss": -19.238924026489258, "global_step": 35409, "epoch": 426} {"train_loss": -19.337575912475586, "global_step": 35410, "epoch": 426} {"train_loss": -19.283056259155273, "global_step": 35411, "epoch": 426} {"train_loss": -19.158323287963867, "global_step": 35412, "epoch": 426} {"train_loss": -19.512371063232422, "global_step": 35413, "epoch": 426} {"train_loss": -19.393314361572266, "global_step": 35414, "epoch": 426} {"train_loss": -19.0280818939209, "global_step": 35415, "epoch": 426} {"train_loss": -19.495025634765625, "global_step": 35416, "epoch": 426} {"train_loss": -19.14310646057129, "global_step": 35417, "epoch": 426} {"train_loss": -19.16349220275879, "global_step": 35418, "epoch": 426} {"train_loss": -19.397045135498047, "global_step": 35419, "epoch": 426} {"train_loss": -19.246274948120117, "global_step": 35420, "epoch": 426} {"train_loss": -18.969894409179688, "global_step": 35421, "epoch": 426} {"train_loss": -19.244205474853516, "global_step": 35422, "epoch": 426} {"train_loss": -19.276254653930664, "global_step": 35423, "epoch": 426} {"train_loss": -19.20407485961914, "global_step": 35424, "epoch": 426} {"train_loss": -19.012802124023438, "global_step": 35425, "epoch": 426} {"train_loss": -19.348087310791016, "global_step": 35426, "epoch": 426} {"train_loss": -19.1438045501709, "global_step": 35427, "epoch": 426} {"train_loss": -19.357776641845703, "global_step": 35428, "epoch": 426} {"train_loss": -19.251806259155273, "global_step": 35429, "epoch": 426} {"train_loss": -19.27924156188965, "global_step": 35430, "epoch": 426} {"train_loss": -19.054393768310547, "global_step": 35431, "epoch": 426} {"train_loss": -19.156818389892578, "global_step": 35432, "epoch": 426} {"train_loss": -18.810400009155273, "global_step": 35433, "epoch": 426} {"train_loss": -19.279741287231445, "global_step": 35434, "epoch": 426} {"train_loss": -18.91291618347168, "global_step": 35435, "epoch": 426} {"train_loss": -19.095754623413086, "global_step": 35436, "epoch": 426} {"train_loss": -19.14131736755371, "global_step": 35437, "epoch": 426} {"train_loss": -19.23480796813965, "global_step": 35438, "epoch": 426} {"train_loss": -19.462926864624023, "global_step": 35439, "epoch": 426} {"train_loss": -19.17512797160321, "global_step": 35440, "epoch": 426, "val_loss": 5959837.0} {"train_loss": -19.052932739257812, "global_step": 35441, "epoch": 427} {"train_loss": -19.368579864501953, "global_step": 35442, "epoch": 427} {"train_loss": -19.192493438720703, "global_step": 35443, "epoch": 427} {"train_loss": -18.921308517456055, "global_step": 35444, "epoch": 427} {"train_loss": -19.40875244140625, "global_step": 35445, "epoch": 427} {"train_loss": -19.013851165771484, "global_step": 35446, "epoch": 427} {"train_loss": -19.061986923217773, "global_step": 35447, "epoch": 427} {"train_loss": -19.109939575195312, "global_step": 35448, "epoch": 427} {"train_loss": -19.055997848510742, "global_step": 35449, "epoch": 427} {"train_loss": -19.49264144897461, "global_step": 35450, "epoch": 427} {"train_loss": -18.961740493774414, "global_step": 35451, "epoch": 427} {"train_loss": -19.16933250427246, "global_step": 35452, "epoch": 427} {"train_loss": -19.16962242126465, "global_step": 35453, "epoch": 427} {"train_loss": -19.26929473876953, "global_step": 35454, "epoch": 427} {"train_loss": -19.106491088867188, "global_step": 35455, "epoch": 427} {"train_loss": -18.82012367248535, "global_step": 35456, "epoch": 427} {"train_loss": -19.400680541992188, "global_step": 35457, "epoch": 427} {"train_loss": -19.204669952392578, "global_step": 35458, "epoch": 427} {"train_loss": -19.243589401245117, "global_step": 35459, "epoch": 427} {"train_loss": -19.08096694946289, "global_step": 35460, "epoch": 427} {"train_loss": -19.138551712036133, "global_step": 35461, "epoch": 427} {"train_loss": -19.589645385742188, "global_step": 35462, "epoch": 427} {"train_loss": -18.920909881591797, "global_step": 35463, "epoch": 427} {"train_loss": -19.3624267578125, "global_step": 35464, "epoch": 427} {"train_loss": -19.229795455932617, "global_step": 35465, "epoch": 427} {"train_loss": -19.1774845123291, "global_step": 35466, "epoch": 427} {"train_loss": -19.067609786987305, "global_step": 35467, "epoch": 427} {"train_loss": -18.961872100830078, "global_step": 35468, "epoch": 427} {"train_loss": -18.882448196411133, "global_step": 35469, "epoch": 427} {"train_loss": -19.257986068725586, "global_step": 35470, "epoch": 427} {"train_loss": -19.239944458007812, "global_step": 35471, "epoch": 427} {"train_loss": -19.083494186401367, "global_step": 35472, "epoch": 427} {"train_loss": -19.48340606689453, "global_step": 35473, "epoch": 427} {"train_loss": -19.576791763305664, "global_step": 35474, "epoch": 427} {"train_loss": -19.212635040283203, "global_step": 35475, "epoch": 427} {"train_loss": -18.783475875854492, "global_step": 35476, "epoch": 427} {"train_loss": -19.504899978637695, "global_step": 35477, "epoch": 427} {"train_loss": -18.91182518005371, "global_step": 35478, "epoch": 427} {"train_loss": -19.306049346923828, "global_step": 35479, "epoch": 427} {"train_loss": -19.020599365234375, "global_step": 35480, "epoch": 427} {"train_loss": -19.357208251953125, "global_step": 35481, "epoch": 427} {"train_loss": -19.108816146850586, "global_step": 35482, "epoch": 427} {"train_loss": -19.430097579956055, "global_step": 35483, "epoch": 427} {"train_loss": -19.15089225769043, "global_step": 35484, "epoch": 427} {"train_loss": -18.83612632751465, "global_step": 35485, "epoch": 427} {"train_loss": -19.57059097290039, "global_step": 35486, "epoch": 427} {"train_loss": -19.02122688293457, "global_step": 35487, "epoch": 427} {"train_loss": -19.31965446472168, "global_step": 35488, "epoch": 427} {"train_loss": -18.804784774780273, "global_step": 35489, "epoch": 427} {"train_loss": -19.100324630737305, "global_step": 35490, "epoch": 427} {"train_loss": -19.327991485595703, "global_step": 35491, "epoch": 427} {"train_loss": -19.295137405395508, "global_step": 35492, "epoch": 427} {"train_loss": -19.19051170349121, "global_step": 35493, "epoch": 427} {"train_loss": -19.52803611755371, "global_step": 35494, "epoch": 427} {"train_loss": -19.234689712524414, "global_step": 35495, "epoch": 427} {"train_loss": -19.402130126953125, "global_step": 35496, "epoch": 427} {"train_loss": -19.142616271972656, "global_step": 35497, "epoch": 427} {"train_loss": -19.493345260620117, "global_step": 35498, "epoch": 427} {"train_loss": -18.87306785583496, "global_step": 35499, "epoch": 427} {"train_loss": -18.720853805541992, "global_step": 35500, "epoch": 427} {"train_loss": -19.219717025756836, "global_step": 35501, "epoch": 427} {"train_loss": -18.880373001098633, "global_step": 35502, "epoch": 427} {"train_loss": -18.549131393432617, "global_step": 35503, "epoch": 427} {"train_loss": -19.375938415527344, "global_step": 35504, "epoch": 427} {"train_loss": -19.27296257019043, "global_step": 35505, "epoch": 427} {"train_loss": -19.40715980529785, "global_step": 35506, "epoch": 427} {"train_loss": -19.0529842376709, "global_step": 35507, "epoch": 427} {"train_loss": -19.31373405456543, "global_step": 35508, "epoch": 427} {"train_loss": -19.485013961791992, "global_step": 35509, "epoch": 427} {"train_loss": -19.378437042236328, "global_step": 35510, "epoch": 427} {"train_loss": -19.197906494140625, "global_step": 35511, "epoch": 427} {"train_loss": -19.176923751831055, "global_step": 35512, "epoch": 427} {"train_loss": -19.357736587524414, "global_step": 35513, "epoch": 427} {"train_loss": -19.198699951171875, "global_step": 35514, "epoch": 427} {"train_loss": -19.38604736328125, "global_step": 35515, "epoch": 427} {"train_loss": -19.302845001220703, "global_step": 35516, "epoch": 427} {"train_loss": -19.08902359008789, "global_step": 35517, "epoch": 427} {"train_loss": -19.159564971923828, "global_step": 35518, "epoch": 427} {"train_loss": -19.489194869995117, "global_step": 35519, "epoch": 427} {"train_loss": -19.374446868896484, "global_step": 35520, "epoch": 427} {"train_loss": -18.916431427001953, "global_step": 35521, "epoch": 427} {"train_loss": -19.161710739135742, "global_step": 35522, "epoch": 427} {"train_loss": -19.169107942696076, "global_step": 35523, "epoch": 427, "val_loss": 6132742.0} {"train_loss": -18.570682525634766, "global_step": 35524, "epoch": 428} {"train_loss": -19.11305809020996, "global_step": 35525, "epoch": 428} {"train_loss": -19.04776954650879, "global_step": 35526, "epoch": 428} {"train_loss": -19.032384872436523, "global_step": 35527, "epoch": 428} {"train_loss": -19.245798110961914, "global_step": 35528, "epoch": 428} {"train_loss": -19.2827205657959, "global_step": 35529, "epoch": 428} {"train_loss": -19.31788444519043, "global_step": 35530, "epoch": 428} {"train_loss": -18.72821617126465, "global_step": 35531, "epoch": 428} {"train_loss": -19.157501220703125, "global_step": 35532, "epoch": 428} {"train_loss": -19.07809829711914, "global_step": 35533, "epoch": 428} {"train_loss": -19.20859718322754, "global_step": 35534, "epoch": 428} {"train_loss": -19.1435604095459, "global_step": 35535, "epoch": 428} {"train_loss": -18.875356674194336, "global_step": 35536, "epoch": 428} {"train_loss": -19.089990615844727, "global_step": 35537, "epoch": 428} {"train_loss": -18.845373153686523, "global_step": 35538, "epoch": 428} {"train_loss": -19.01035499572754, "global_step": 35539, "epoch": 428} {"train_loss": -18.909879684448242, "global_step": 35540, "epoch": 428} {"train_loss": -19.22014617919922, "global_step": 35541, "epoch": 428} {"train_loss": -19.056427001953125, "global_step": 35542, "epoch": 428} {"train_loss": -19.103607177734375, "global_step": 35543, "epoch": 428} {"train_loss": -19.185895919799805, "global_step": 35544, "epoch": 428} {"train_loss": -19.37112808227539, "global_step": 35545, "epoch": 428} {"train_loss": -19.071197509765625, "global_step": 35546, "epoch": 428} {"train_loss": -19.158145904541016, "global_step": 35547, "epoch": 428} {"train_loss": -19.302919387817383, "global_step": 35548, "epoch": 428} {"train_loss": -19.215810775756836, "global_step": 35549, "epoch": 428} {"train_loss": -19.175138473510742, "global_step": 35550, "epoch": 428} {"train_loss": -18.945037841796875, "global_step": 35551, "epoch": 428} {"train_loss": -18.96242332458496, "global_step": 35552, "epoch": 428} {"train_loss": -19.12866973876953, "global_step": 35553, "epoch": 428} {"train_loss": -19.35658836364746, "global_step": 35554, "epoch": 428} {"train_loss": -19.405431747436523, "global_step": 35555, "epoch": 428} {"train_loss": -18.723072052001953, "global_step": 35556, "epoch": 428} {"train_loss": -18.96504783630371, "global_step": 35557, "epoch": 428} {"train_loss": -19.19978904724121, "global_step": 35558, "epoch": 428} {"train_loss": -19.028100967407227, "global_step": 35559, "epoch": 428} {"train_loss": -19.08159637451172, "global_step": 35560, "epoch": 428} {"train_loss": -19.172775268554688, "global_step": 35561, "epoch": 428} {"train_loss": -19.243627548217773, "global_step": 35562, "epoch": 428} {"train_loss": -19.151182174682617, "global_step": 35563, "epoch": 428} {"train_loss": -19.12311363220215, "global_step": 35564, "epoch": 428} {"train_loss": -18.90451431274414, "global_step": 35565, "epoch": 428} {"train_loss": -19.346059799194336, "global_step": 35566, "epoch": 428} {"train_loss": -19.201845169067383, "global_step": 35567, "epoch": 428} {"train_loss": -19.325342178344727, "global_step": 35568, "epoch": 428} {"train_loss": -19.171802520751953, "global_step": 35569, "epoch": 428} {"train_loss": -19.11911964416504, "global_step": 35570, "epoch": 428} {"train_loss": -18.88287353515625, "global_step": 35571, "epoch": 428} {"train_loss": -19.312055587768555, "global_step": 35572, "epoch": 428} {"train_loss": -19.204391479492188, "global_step": 35573, "epoch": 428} {"train_loss": -19.39069938659668, "global_step": 35574, "epoch": 428} {"train_loss": -19.188587188720703, "global_step": 35575, "epoch": 428} {"train_loss": -19.214908599853516, "global_step": 35576, "epoch": 428} {"train_loss": -19.373111724853516, "global_step": 35577, "epoch": 428} {"train_loss": -18.985363006591797, "global_step": 35578, "epoch": 428} {"train_loss": -18.870697021484375, "global_step": 35579, "epoch": 428} {"train_loss": -19.587369918823242, "global_step": 35580, "epoch": 428} {"train_loss": -19.135229110717773, "global_step": 35581, "epoch": 428} {"train_loss": -19.2014217376709, "global_step": 35582, "epoch": 428} {"train_loss": -19.27423667907715, "global_step": 35583, "epoch": 428} {"train_loss": -19.398040771484375, "global_step": 35584, "epoch": 428} {"train_loss": -18.81584358215332, "global_step": 35585, "epoch": 428} {"train_loss": -19.174043655395508, "global_step": 35586, "epoch": 428} {"train_loss": -19.161964416503906, "global_step": 35587, "epoch": 428} {"train_loss": -19.411930084228516, "global_step": 35588, "epoch": 428} {"train_loss": -19.067243576049805, "global_step": 35589, "epoch": 428} {"train_loss": -19.190317153930664, "global_step": 35590, "epoch": 428} {"train_loss": -19.3840274810791, "global_step": 35591, "epoch": 428} {"train_loss": -18.95337677001953, "global_step": 35592, "epoch": 428} {"train_loss": -19.4783992767334, "global_step": 35593, "epoch": 428} {"train_loss": -19.110807418823242, "global_step": 35594, "epoch": 428} {"train_loss": -19.083087921142578, "global_step": 35595, "epoch": 428} {"train_loss": -18.92400550842285, "global_step": 35596, "epoch": 428} {"train_loss": -18.92279624938965, "global_step": 35597, "epoch": 428} {"train_loss": -19.394994735717773, "global_step": 35598, "epoch": 428} {"train_loss": -19.09420394897461, "global_step": 35599, "epoch": 428} {"train_loss": -19.363340377807617, "global_step": 35600, "epoch": 428} {"train_loss": -19.428043365478516, "global_step": 35601, "epoch": 428} {"train_loss": -19.248071670532227, "global_step": 35602, "epoch": 428} {"train_loss": -19.597240447998047, "global_step": 35603, "epoch": 428} {"train_loss": -19.299745559692383, "global_step": 35604, "epoch": 428} {"train_loss": -19.548717498779297, "global_step": 35605, "epoch": 428} {"train_loss": -19.170560147388873, "global_step": 35606, "epoch": 428, "val_loss": 6137524.0} {"train_loss": -18.77161979675293, "global_step": 35607, "epoch": 429} {"train_loss": -19.275869369506836, "global_step": 35608, "epoch": 429} {"train_loss": -18.686569213867188, "global_step": 35609, "epoch": 429} {"train_loss": -19.20315933227539, "global_step": 35610, "epoch": 429} {"train_loss": -18.856046676635742, "global_step": 35611, "epoch": 429} {"train_loss": -19.05780029296875, "global_step": 35612, "epoch": 429} {"train_loss": -18.812881469726562, "global_step": 35613, "epoch": 429} {"train_loss": -18.941333770751953, "global_step": 35614, "epoch": 429} {"train_loss": -19.303640365600586, "global_step": 35615, "epoch": 429} {"train_loss": -19.280593872070312, "global_step": 35616, "epoch": 429} {"train_loss": -18.807138442993164, "global_step": 35617, "epoch": 429} {"train_loss": -19.535755157470703, "global_step": 35618, "epoch": 429} {"train_loss": -19.339744567871094, "global_step": 35619, "epoch": 429} {"train_loss": -19.270315170288086, "global_step": 35620, "epoch": 429} {"train_loss": -19.24738311767578, "global_step": 35621, "epoch": 429} {"train_loss": -18.415613174438477, "global_step": 35622, "epoch": 429} {"train_loss": -19.145835876464844, "global_step": 35623, "epoch": 429} {"train_loss": -19.4620418548584, "global_step": 35624, "epoch": 429} {"train_loss": -19.201221466064453, "global_step": 35625, "epoch": 429} {"train_loss": -19.43014907836914, "global_step": 35626, "epoch": 429} {"train_loss": -19.16259002685547, "global_step": 35627, "epoch": 429} {"train_loss": -19.146915435791016, "global_step": 35628, "epoch": 429} {"train_loss": -19.79193878173828, "global_step": 35629, "epoch": 429} {"train_loss": -18.753671646118164, "global_step": 35630, "epoch": 429} {"train_loss": -19.36701774597168, "global_step": 35631, "epoch": 429} {"train_loss": -19.029348373413086, "global_step": 35632, "epoch": 429} {"train_loss": -19.103775024414062, "global_step": 35633, "epoch": 429} {"train_loss": -19.313705444335938, "global_step": 35634, "epoch": 429} {"train_loss": -19.328554153442383, "global_step": 35635, "epoch": 429} {"train_loss": -18.923620223999023, "global_step": 35636, "epoch": 429} {"train_loss": -19.158889770507812, "global_step": 35637, "epoch": 429} {"train_loss": -19.608076095581055, "global_step": 35638, "epoch": 429} {"train_loss": -19.14438819885254, "global_step": 35639, "epoch": 429} {"train_loss": -19.115093231201172, "global_step": 35640, "epoch": 429} {"train_loss": -19.243925094604492, "global_step": 35641, "epoch": 429} {"train_loss": -19.330411911010742, "global_step": 35642, "epoch": 429} {"train_loss": -19.267805099487305, "global_step": 35643, "epoch": 429} {"train_loss": -19.193410873413086, "global_step": 35644, "epoch": 429} {"train_loss": -19.08083724975586, "global_step": 35645, "epoch": 429} {"train_loss": -19.105205535888672, "global_step": 35646, "epoch": 429} {"train_loss": -19.08448600769043, "global_step": 35647, "epoch": 429} {"train_loss": -19.19161033630371, "global_step": 35648, "epoch": 429} {"train_loss": -19.358701705932617, "global_step": 35649, "epoch": 429} {"train_loss": -19.157398223876953, "global_step": 35650, "epoch": 429} {"train_loss": -19.506391525268555, "global_step": 35651, "epoch": 429} {"train_loss": -19.247970581054688, "global_step": 35652, "epoch": 429} {"train_loss": -19.295997619628906, "global_step": 35653, "epoch": 429} {"train_loss": -19.60698890686035, "global_step": 35654, "epoch": 429} {"train_loss": -19.06281852722168, "global_step": 35655, "epoch": 429} {"train_loss": -19.231515884399414, "global_step": 35656, "epoch": 429} {"train_loss": -19.459579467773438, "global_step": 35657, "epoch": 429} {"train_loss": -19.183883666992188, "global_step": 35658, "epoch": 429} {"train_loss": -19.208786010742188, "global_step": 35659, "epoch": 429} {"train_loss": -19.14083480834961, "global_step": 35660, "epoch": 429} {"train_loss": -18.976781845092773, "global_step": 35661, "epoch": 429} {"train_loss": -19.01570701599121, "global_step": 35662, "epoch": 429} {"train_loss": -19.588361740112305, "global_step": 35663, "epoch": 429} {"train_loss": -18.977140426635742, "global_step": 35664, "epoch": 429} {"train_loss": -19.146976470947266, "global_step": 35665, "epoch": 429} {"train_loss": -18.928205490112305, "global_step": 35666, "epoch": 429} {"train_loss": -19.39707374572754, "global_step": 35667, "epoch": 429} {"train_loss": -19.246498107910156, "global_step": 35668, "epoch": 429} {"train_loss": -19.363319396972656, "global_step": 35669, "epoch": 429} {"train_loss": -19.231666564941406, "global_step": 35670, "epoch": 429} {"train_loss": -19.33894920349121, "global_step": 35671, "epoch": 429} {"train_loss": -19.39957618713379, "global_step": 35672, "epoch": 429} {"train_loss": -19.311126708984375, "global_step": 35673, "epoch": 429} {"train_loss": -19.07913589477539, "global_step": 35674, "epoch": 429} {"train_loss": -18.783479690551758, "global_step": 35675, "epoch": 429} {"train_loss": -18.876819610595703, "global_step": 35676, "epoch": 429} {"train_loss": -19.21925926208496, "global_step": 35677, "epoch": 429} {"train_loss": -19.349313735961914, "global_step": 35678, "epoch": 429} {"train_loss": -19.37067222595215, "global_step": 35679, "epoch": 429} {"train_loss": -18.928043365478516, "global_step": 35680, "epoch": 429} {"train_loss": -19.476856231689453, "global_step": 35681, "epoch": 429} {"train_loss": -19.068254470825195, "global_step": 35682, "epoch": 429} {"train_loss": -19.14501953125, "global_step": 35683, "epoch": 429} {"train_loss": -19.41325569152832, "global_step": 35684, "epoch": 429} {"train_loss": -19.19810676574707, "global_step": 35685, "epoch": 429} {"train_loss": -19.21381950378418, "global_step": 35686, "epoch": 429} {"train_loss": -19.316030502319336, "global_step": 35687, "epoch": 429} {"train_loss": -19.248441696166992, "global_step": 35688, "epoch": 429} {"train_loss": -19.187259811952888, "global_step": 35689, "epoch": 429, "val_loss": 5958046.0} {"train_loss": -18.72117042541504, "global_step": 35690, "epoch": 430} {"train_loss": -19.009349822998047, "global_step": 35691, "epoch": 430} {"train_loss": -19.122272491455078, "global_step": 35692, "epoch": 430} {"train_loss": -19.348031997680664, "global_step": 35693, "epoch": 430} {"train_loss": -19.0681209564209, "global_step": 35694, "epoch": 430} {"train_loss": -19.30615997314453, "global_step": 35695, "epoch": 430} {"train_loss": -19.382246017456055, "global_step": 35696, "epoch": 430} {"train_loss": -19.12534523010254, "global_step": 35697, "epoch": 430} {"train_loss": -19.46162223815918, "global_step": 35698, "epoch": 430} {"train_loss": -19.3591365814209, "global_step": 35699, "epoch": 430} {"train_loss": -19.1278133392334, "global_step": 35700, "epoch": 430} {"train_loss": -19.570035934448242, "global_step": 35701, "epoch": 430} {"train_loss": -19.688047409057617, "global_step": 35702, "epoch": 430} {"train_loss": -18.81103515625, "global_step": 35703, "epoch": 430} {"train_loss": -19.36400604248047, "global_step": 35704, "epoch": 430} {"train_loss": -18.935749053955078, "global_step": 35705, "epoch": 430} {"train_loss": -19.212926864624023, "global_step": 35706, "epoch": 430} {"train_loss": -19.289091110229492, "global_step": 35707, "epoch": 430} {"train_loss": -19.684619903564453, "global_step": 35708, "epoch": 430} {"train_loss": -19.178314208984375, "global_step": 35709, "epoch": 430} {"train_loss": -19.284982681274414, "global_step": 35710, "epoch": 430} {"train_loss": -19.551847457885742, "global_step": 35711, "epoch": 430} {"train_loss": -19.107770919799805, "global_step": 35712, "epoch": 430} {"train_loss": -19.274364471435547, "global_step": 35713, "epoch": 430} {"train_loss": -19.16547393798828, "global_step": 35714, "epoch": 430} {"train_loss": -19.020662307739258, "global_step": 35715, "epoch": 430} {"train_loss": -19.37098503112793, "global_step": 35716, "epoch": 430} {"train_loss": -19.395601272583008, "global_step": 35717, "epoch": 430} {"train_loss": -19.480606079101562, "global_step": 35718, "epoch": 430} {"train_loss": -19.139799118041992, "global_step": 35719, "epoch": 430} {"train_loss": -18.968364715576172, "global_step": 35720, "epoch": 430} {"train_loss": -19.187393188476562, "global_step": 35721, "epoch": 430} {"train_loss": -19.239831924438477, "global_step": 35722, "epoch": 430} {"train_loss": -19.140274047851562, "global_step": 35723, "epoch": 430} {"train_loss": -18.704435348510742, "global_step": 35724, "epoch": 430} {"train_loss": -19.525854110717773, "global_step": 35725, "epoch": 430} {"train_loss": -19.121633529663086, "global_step": 35726, "epoch": 430} {"train_loss": -19.069496154785156, "global_step": 35727, "epoch": 430} {"train_loss": -18.887990951538086, "global_step": 35728, "epoch": 430} {"train_loss": -19.268049240112305, "global_step": 35729, "epoch": 430} {"train_loss": -19.040512084960938, "global_step": 35730, "epoch": 430} {"train_loss": -19.055654525756836, "global_step": 35731, "epoch": 430} {"train_loss": -19.254127502441406, "global_step": 35732, "epoch": 430} {"train_loss": -19.19343376159668, "global_step": 35733, "epoch": 430} {"train_loss": -19.491865158081055, "global_step": 35734, "epoch": 430} {"train_loss": -18.952714920043945, "global_step": 35735, "epoch": 430} {"train_loss": -19.08034324645996, "global_step": 35736, "epoch": 430} {"train_loss": -19.45291519165039, "global_step": 35737, "epoch": 430} {"train_loss": -19.63410186767578, "global_step": 35738, "epoch": 430} {"train_loss": -19.21602439880371, "global_step": 35739, "epoch": 430} {"train_loss": -19.100955963134766, "global_step": 35740, "epoch": 430} {"train_loss": -19.30714225769043, "global_step": 35741, "epoch": 430} {"train_loss": -19.150854110717773, "global_step": 35742, "epoch": 430} {"train_loss": -19.198049545288086, "global_step": 35743, "epoch": 430} {"train_loss": -19.126298904418945, "global_step": 35744, "epoch": 430} {"train_loss": -19.26924705505371, "global_step": 35745, "epoch": 430} {"train_loss": -18.756925582885742, "global_step": 35746, "epoch": 430} {"train_loss": -19.335317611694336, "global_step": 35747, "epoch": 430} {"train_loss": -19.223161697387695, "global_step": 35748, "epoch": 430} {"train_loss": -19.123109817504883, "global_step": 35749, "epoch": 430} {"train_loss": -19.405994415283203, "global_step": 35750, "epoch": 430} {"train_loss": -19.275522232055664, "global_step": 35751, "epoch": 430} {"train_loss": -19.272863388061523, "global_step": 35752, "epoch": 430} {"train_loss": -19.35028648376465, "global_step": 35753, "epoch": 430} {"train_loss": -19.305686950683594, "global_step": 35754, "epoch": 430} {"train_loss": -18.962717056274414, "global_step": 35755, "epoch": 430} {"train_loss": -19.463979721069336, "global_step": 35756, "epoch": 430} {"train_loss": -18.876386642456055, "global_step": 35757, "epoch": 430} {"train_loss": -19.223997116088867, "global_step": 35758, "epoch": 430} {"train_loss": -19.506513595581055, "global_step": 35759, "epoch": 430} {"train_loss": -19.33588981628418, "global_step": 35760, "epoch": 430} {"train_loss": -19.3546085357666, "global_step": 35761, "epoch": 430} {"train_loss": -19.263233184814453, "global_step": 35762, "epoch": 430} {"train_loss": -19.497833251953125, "global_step": 35763, "epoch": 430} {"train_loss": -19.42462158203125, "global_step": 35764, "epoch": 430} {"train_loss": -19.254735946655273, "global_step": 35765, "epoch": 430} {"train_loss": -19.141525268554688, "global_step": 35766, "epoch": 430} {"train_loss": -18.86732292175293, "global_step": 35767, "epoch": 430} {"train_loss": -19.221454620361328, "global_step": 35768, "epoch": 430} {"train_loss": -19.284446716308594, "global_step": 35769, "epoch": 430} {"train_loss": -19.55230140686035, "global_step": 35770, "epoch": 430} {"train_loss": -19.109176635742188, "global_step": 35771, "epoch": 430} {"train_loss": -19.227818178843304, "global_step": 35772, "epoch": 430, "val_loss": 6135672.0} {"train_loss": -18.566070556640625, "global_step": 35773, "epoch": 431} {"train_loss": -18.885202407836914, "global_step": 35774, "epoch": 431} {"train_loss": -19.04437828063965, "global_step": 35775, "epoch": 431} {"train_loss": -19.111875534057617, "global_step": 35776, "epoch": 431} {"train_loss": -19.252849578857422, "global_step": 35777, "epoch": 431} {"train_loss": -18.901859283447266, "global_step": 35778, "epoch": 431} {"train_loss": -19.220317840576172, "global_step": 35779, "epoch": 431} {"train_loss": -19.128509521484375, "global_step": 35780, "epoch": 431} {"train_loss": -19.35607147216797, "global_step": 35781, "epoch": 431} {"train_loss": -18.860733032226562, "global_step": 35782, "epoch": 431} {"train_loss": -18.961233139038086, "global_step": 35783, "epoch": 431} {"train_loss": -18.96211814880371, "global_step": 35784, "epoch": 431} {"train_loss": -19.318220138549805, "global_step": 35785, "epoch": 431} {"train_loss": -19.04298210144043, "global_step": 35786, "epoch": 431} {"train_loss": -19.09500503540039, "global_step": 35787, "epoch": 431} {"train_loss": -18.97218132019043, "global_step": 35788, "epoch": 431} {"train_loss": -19.190580368041992, "global_step": 35789, "epoch": 431} {"train_loss": -19.382396697998047, "global_step": 35790, "epoch": 431} {"train_loss": -18.8997859954834, "global_step": 35791, "epoch": 431} {"train_loss": -19.273822784423828, "global_step": 35792, "epoch": 431} {"train_loss": -19.28474235534668, "global_step": 35793, "epoch": 431} {"train_loss": -18.764129638671875, "global_step": 35794, "epoch": 431} {"train_loss": -19.20868492126465, "global_step": 35795, "epoch": 431} {"train_loss": -19.378454208374023, "global_step": 35796, "epoch": 431} {"train_loss": -19.18843650817871, "global_step": 35797, "epoch": 431} {"train_loss": -19.062959671020508, "global_step": 35798, "epoch": 431} {"train_loss": -19.335426330566406, "global_step": 35799, "epoch": 431} {"train_loss": -19.530210494995117, "global_step": 35800, "epoch": 431} {"train_loss": -19.161895751953125, "global_step": 35801, "epoch": 431} {"train_loss": -19.13612174987793, "global_step": 35802, "epoch": 431} {"train_loss": -18.96089744567871, "global_step": 35803, "epoch": 431} {"train_loss": -19.494592666625977, "global_step": 35804, "epoch": 431} {"train_loss": -19.495298385620117, "global_step": 35805, "epoch": 431} {"train_loss": -18.85322380065918, "global_step": 35806, "epoch": 431} {"train_loss": -19.37811851501465, "global_step": 35807, "epoch": 431} {"train_loss": -19.170385360717773, "global_step": 35808, "epoch": 431} {"train_loss": -19.28037452697754, "global_step": 35809, "epoch": 431} {"train_loss": -19.51759910583496, "global_step": 35810, "epoch": 431} {"train_loss": -19.3615665435791, "global_step": 35811, "epoch": 431} {"train_loss": -19.349740982055664, "global_step": 35812, "epoch": 431} {"train_loss": -19.39100456237793, "global_step": 35813, "epoch": 431} {"train_loss": -19.237890243530273, "global_step": 35814, "epoch": 431} {"train_loss": -19.13783836364746, "global_step": 35815, "epoch": 431} {"train_loss": -18.97586441040039, "global_step": 35816, "epoch": 431} {"train_loss": -19.122451782226562, "global_step": 35817, "epoch": 431} {"train_loss": -18.966960906982422, "global_step": 35818, "epoch": 431} {"train_loss": -19.21137809753418, "global_step": 35819, "epoch": 431} {"train_loss": -19.22047233581543, "global_step": 35820, "epoch": 431} {"train_loss": -19.33153533935547, "global_step": 35821, "epoch": 431} {"train_loss": -19.46236228942871, "global_step": 35822, "epoch": 431} {"train_loss": -19.224750518798828, "global_step": 35823, "epoch": 431} {"train_loss": -19.132659912109375, "global_step": 35824, "epoch": 431} {"train_loss": -19.481565475463867, "global_step": 35825, "epoch": 431} {"train_loss": -18.947805404663086, "global_step": 35826, "epoch": 431} {"train_loss": -19.264583587646484, "global_step": 35827, "epoch": 431} {"train_loss": -19.474842071533203, "global_step": 35828, "epoch": 431} {"train_loss": -19.21392250061035, "global_step": 35829, "epoch": 431} {"train_loss": -18.90521812438965, "global_step": 35830, "epoch": 431} {"train_loss": -19.245458602905273, "global_step": 35831, "epoch": 431} {"train_loss": -19.430967330932617, "global_step": 35832, "epoch": 431} {"train_loss": -19.68198013305664, "global_step": 35833, "epoch": 431} {"train_loss": -19.289865493774414, "global_step": 35834, "epoch": 431} {"train_loss": -19.318756103515625, "global_step": 35835, "epoch": 431} {"train_loss": -19.293685913085938, "global_step": 35836, "epoch": 431} {"train_loss": -19.439512252807617, "global_step": 35837, "epoch": 431} {"train_loss": -18.854942321777344, "global_step": 35838, "epoch": 431} {"train_loss": -19.30109214782715, "global_step": 35839, "epoch": 431} {"train_loss": -19.423677444458008, "global_step": 35840, "epoch": 431} {"train_loss": -19.094953536987305, "global_step": 35841, "epoch": 431} {"train_loss": -19.2023983001709, "global_step": 35842, "epoch": 431} {"train_loss": -19.41031837463379, "global_step": 35843, "epoch": 431} {"train_loss": -19.19594383239746, "global_step": 35844, "epoch": 431} {"train_loss": -19.360774993896484, "global_step": 35845, "epoch": 431} {"train_loss": -19.221914291381836, "global_step": 35846, "epoch": 431} {"train_loss": -19.01319694519043, "global_step": 35847, "epoch": 431} {"train_loss": -19.42356300354004, "global_step": 35848, "epoch": 431} {"train_loss": -19.2762451171875, "global_step": 35849, "epoch": 431} {"train_loss": -19.319686889648438, "global_step": 35850, "epoch": 431} {"train_loss": -19.412168502807617, "global_step": 35851, "epoch": 431} {"train_loss": -18.961318969726562, "global_step": 35852, "epoch": 431} {"train_loss": -19.21099853515625, "global_step": 35853, "epoch": 431} {"train_loss": -19.44024085998535, "global_step": 35854, "epoch": 431} {"train_loss": -19.210788680846434, "global_step": 35855, "epoch": 431, "val_loss": 5927362.5} {"train_loss": -18.757795333862305, "global_step": 35856, "epoch": 432} {"train_loss": -19.108579635620117, "global_step": 35857, "epoch": 432} {"train_loss": -19.290016174316406, "global_step": 35858, "epoch": 432} {"train_loss": -19.294605255126953, "global_step": 35859, "epoch": 432} {"train_loss": -18.774667739868164, "global_step": 35860, "epoch": 432} {"train_loss": -19.426280975341797, "global_step": 35861, "epoch": 432} {"train_loss": -18.891437530517578, "global_step": 35862, "epoch": 432} {"train_loss": -19.096458435058594, "global_step": 35863, "epoch": 432} {"train_loss": -18.993696212768555, "global_step": 35864, "epoch": 432} {"train_loss": -19.149991989135742, "global_step": 35865, "epoch": 432} {"train_loss": -18.869218826293945, "global_step": 35866, "epoch": 432} {"train_loss": -19.414077758789062, "global_step": 35867, "epoch": 432} {"train_loss": -19.235271453857422, "global_step": 35868, "epoch": 432} {"train_loss": -19.56935691833496, "global_step": 35869, "epoch": 432} {"train_loss": -19.342458724975586, "global_step": 35870, "epoch": 432} {"train_loss": -19.048110961914062, "global_step": 35871, "epoch": 432} {"train_loss": -19.683507919311523, "global_step": 35872, "epoch": 432} {"train_loss": -19.25142478942871, "global_step": 35873, "epoch": 432} {"train_loss": -19.482086181640625, "global_step": 35874, "epoch": 432} {"train_loss": -19.080398559570312, "global_step": 35875, "epoch": 432} {"train_loss": -19.582006454467773, "global_step": 35876, "epoch": 432} {"train_loss": -18.891695022583008, "global_step": 35877, "epoch": 432} {"train_loss": -19.25284194946289, "global_step": 35878, "epoch": 432} {"train_loss": -19.404743194580078, "global_step": 35879, "epoch": 432} {"train_loss": -19.009424209594727, "global_step": 35880, "epoch": 432} {"train_loss": -18.760772705078125, "global_step": 35881, "epoch": 432} {"train_loss": -18.839557647705078, "global_step": 35882, "epoch": 432} {"train_loss": -18.941246032714844, "global_step": 35883, "epoch": 432} {"train_loss": -19.371963500976562, "global_step": 35884, "epoch": 432} {"train_loss": -19.359060287475586, "global_step": 35885, "epoch": 432} {"train_loss": -19.056283950805664, "global_step": 35886, "epoch": 432} {"train_loss": -19.45140838623047, "global_step": 35887, "epoch": 432} {"train_loss": -19.49764633178711, "global_step": 35888, "epoch": 432} {"train_loss": -19.184663772583008, "global_step": 35889, "epoch": 432} {"train_loss": -19.4604549407959, "global_step": 35890, "epoch": 432} {"train_loss": -19.04986572265625, "global_step": 35891, "epoch": 432} {"train_loss": -19.241666793823242, "global_step": 35892, "epoch": 432} {"train_loss": -19.620100021362305, "global_step": 35893, "epoch": 432} {"train_loss": -19.16409683227539, "global_step": 35894, "epoch": 432} {"train_loss": -19.25152015686035, "global_step": 35895, "epoch": 432} {"train_loss": -19.33793067932129, "global_step": 35896, "epoch": 432} {"train_loss": -19.31299591064453, "global_step": 35897, "epoch": 432} {"train_loss": -19.146902084350586, "global_step": 35898, "epoch": 432} {"train_loss": -19.156644821166992, "global_step": 35899, "epoch": 432} {"train_loss": -19.22420310974121, "global_step": 35900, "epoch": 432} {"train_loss": -19.470661163330078, "global_step": 35901, "epoch": 432} {"train_loss": -19.54591941833496, "global_step": 35902, "epoch": 432} {"train_loss": -19.040679931640625, "global_step": 35903, "epoch": 432} {"train_loss": -19.31373405456543, "global_step": 35904, "epoch": 432} {"train_loss": -19.175962448120117, "global_step": 35905, "epoch": 432} {"train_loss": -19.19942283630371, "global_step": 35906, "epoch": 432} {"train_loss": -19.256479263305664, "global_step": 35907, "epoch": 432} {"train_loss": -19.099573135375977, "global_step": 35908, "epoch": 432} {"train_loss": -19.748376846313477, "global_step": 35909, "epoch": 432} {"train_loss": -18.93189811706543, "global_step": 35910, "epoch": 432} {"train_loss": -19.37650489807129, "global_step": 35911, "epoch": 432} {"train_loss": -19.186155319213867, "global_step": 35912, "epoch": 432} {"train_loss": -19.215444564819336, "global_step": 35913, "epoch": 432} {"train_loss": -19.15285301208496, "global_step": 35914, "epoch": 432} {"train_loss": -19.118494033813477, "global_step": 35915, "epoch": 432} {"train_loss": -18.90395736694336, "global_step": 35916, "epoch": 432} {"train_loss": -19.235082626342773, "global_step": 35917, "epoch": 432} {"train_loss": -19.394620895385742, "global_step": 35918, "epoch": 432} {"train_loss": -19.60674476623535, "global_step": 35919, "epoch": 432} {"train_loss": -18.906009674072266, "global_step": 35920, "epoch": 432} {"train_loss": -19.639188766479492, "global_step": 35921, "epoch": 432} {"train_loss": -19.05084800720215, "global_step": 35922, "epoch": 432} {"train_loss": -18.926000595092773, "global_step": 35923, "epoch": 432} {"train_loss": -19.301076889038086, "global_step": 35924, "epoch": 432} {"train_loss": -18.757461547851562, "global_step": 35925, "epoch": 432} {"train_loss": -19.372873306274414, "global_step": 35926, "epoch": 432} {"train_loss": -18.979936599731445, "global_step": 35927, "epoch": 432} {"train_loss": -19.279499053955078, "global_step": 35928, "epoch": 432} {"train_loss": -18.96786117553711, "global_step": 35929, "epoch": 432} {"train_loss": -19.220163345336914, "global_step": 35930, "epoch": 432} {"train_loss": -19.142013549804688, "global_step": 35931, "epoch": 432} {"train_loss": -19.299726486206055, "global_step": 35932, "epoch": 432} {"train_loss": -19.383407592773438, "global_step": 35933, "epoch": 432} {"train_loss": -19.673078536987305, "global_step": 35934, "epoch": 432} {"train_loss": -19.55801773071289, "global_step": 35935, "epoch": 432} {"train_loss": -19.238550186157227, "global_step": 35936, "epoch": 432} {"train_loss": -19.294851303100586, "global_step": 35937, "epoch": 432} {"train_loss": -19.206252615135835, "global_step": 35938, "epoch": 432, "val_loss": 6011151.0} {"train_loss": -18.758527755737305, "global_step": 35939, "epoch": 433} {"train_loss": -19.011213302612305, "global_step": 35940, "epoch": 433} {"train_loss": -19.01642417907715, "global_step": 35941, "epoch": 433} {"train_loss": -18.96491813659668, "global_step": 35942, "epoch": 433} {"train_loss": -19.261289596557617, "global_step": 35943, "epoch": 433} {"train_loss": -19.18943214416504, "global_step": 35944, "epoch": 433} {"train_loss": -19.18050193786621, "global_step": 35945, "epoch": 433} {"train_loss": -19.071393966674805, "global_step": 35946, "epoch": 433} {"train_loss": -18.85555648803711, "global_step": 35947, "epoch": 433} {"train_loss": -19.06229591369629, "global_step": 35948, "epoch": 433} {"train_loss": -19.150053024291992, "global_step": 35949, "epoch": 433} {"train_loss": -19.2341365814209, "global_step": 35950, "epoch": 433} {"train_loss": -19.390647888183594, "global_step": 35951, "epoch": 433} {"train_loss": -18.975719451904297, "global_step": 35952, "epoch": 433} {"train_loss": -19.283870697021484, "global_step": 35953, "epoch": 433} {"train_loss": -19.0681209564209, "global_step": 35954, "epoch": 433} {"train_loss": -19.300302505493164, "global_step": 35955, "epoch": 433} {"train_loss": -19.217636108398438, "global_step": 35956, "epoch": 433} {"train_loss": -19.071531295776367, "global_step": 35957, "epoch": 433} {"train_loss": -19.001419067382812, "global_step": 35958, "epoch": 433} {"train_loss": -19.308517456054688, "global_step": 35959, "epoch": 433} {"train_loss": -19.032325744628906, "global_step": 35960, "epoch": 433} {"train_loss": -19.015565872192383, "global_step": 35961, "epoch": 433} {"train_loss": -19.194005966186523, "global_step": 35962, "epoch": 433} {"train_loss": -19.00885009765625, "global_step": 35963, "epoch": 433} {"train_loss": -19.450424194335938, "global_step": 35964, "epoch": 433} {"train_loss": -19.33807945251465, "global_step": 35965, "epoch": 433} {"train_loss": -19.155391693115234, "global_step": 35966, "epoch": 433} {"train_loss": -19.17308235168457, "global_step": 35967, "epoch": 433} {"train_loss": -19.324777603149414, "global_step": 35968, "epoch": 433} {"train_loss": -19.194015502929688, "global_step": 35969, "epoch": 433} {"train_loss": -19.480504989624023, "global_step": 35970, "epoch": 433} {"train_loss": -19.469255447387695, "global_step": 35971, "epoch": 433} {"train_loss": -19.409635543823242, "global_step": 35972, "epoch": 433} {"train_loss": -19.424182891845703, "global_step": 35973, "epoch": 433} {"train_loss": -19.041152954101562, "global_step": 35974, "epoch": 433} {"train_loss": -19.66217613220215, "global_step": 35975, "epoch": 433} {"train_loss": -19.119308471679688, "global_step": 35976, "epoch": 433} {"train_loss": -19.350522994995117, "global_step": 35977, "epoch": 433} {"train_loss": -19.0279541015625, "global_step": 35978, "epoch": 433} {"train_loss": -19.11067008972168, "global_step": 35979, "epoch": 433} {"train_loss": -19.139965057373047, "global_step": 35980, "epoch": 433} {"train_loss": -18.88568687438965, "global_step": 35981, "epoch": 433} {"train_loss": -18.674509048461914, "global_step": 35982, "epoch": 433} {"train_loss": -18.840415954589844, "global_step": 35983, "epoch": 433} {"train_loss": -19.131343841552734, "global_step": 35984, "epoch": 433} {"train_loss": -19.25661277770996, "global_step": 35985, "epoch": 433} {"train_loss": -19.29012107849121, "global_step": 35986, "epoch": 433} {"train_loss": -19.110044479370117, "global_step": 35987, "epoch": 433} {"train_loss": -19.501142501831055, "global_step": 35988, "epoch": 433} {"train_loss": -19.271625518798828, "global_step": 35989, "epoch": 433} {"train_loss": -19.42161750793457, "global_step": 35990, "epoch": 433} {"train_loss": -19.20734214782715, "global_step": 35991, "epoch": 433} {"train_loss": -19.150733947753906, "global_step": 35992, "epoch": 433} {"train_loss": -19.350631713867188, "global_step": 35993, "epoch": 433} {"train_loss": -19.42441177368164, "global_step": 35994, "epoch": 433} {"train_loss": -19.17742347717285, "global_step": 35995, "epoch": 433} {"train_loss": -19.288909912109375, "global_step": 35996, "epoch": 433} {"train_loss": -19.1158447265625, "global_step": 35997, "epoch": 433} {"train_loss": -19.606679916381836, "global_step": 35998, "epoch": 433} {"train_loss": -19.455881118774414, "global_step": 35999, "epoch": 433} {"train_loss": -18.695219039916992, "global_step": 36000, "epoch": 433} {"train_loss": -19.358068466186523, "global_step": 36001, "epoch": 433} {"train_loss": -19.118648529052734, "global_step": 36002, "epoch": 433} {"train_loss": -19.327123641967773, "global_step": 36003, "epoch": 433} {"train_loss": -19.25237464904785, "global_step": 36004, "epoch": 433} {"train_loss": -19.244977951049805, "global_step": 36005, "epoch": 433} {"train_loss": -19.37918472290039, "global_step": 36006, "epoch": 433} {"train_loss": -19.10329246520996, "global_step": 36007, "epoch": 433} {"train_loss": -19.284086227416992, "global_step": 36008, "epoch": 433} {"train_loss": -19.274076461791992, "global_step": 36009, "epoch": 433} {"train_loss": -19.153831481933594, "global_step": 36010, "epoch": 433} {"train_loss": -18.93984603881836, "global_step": 36011, "epoch": 433} {"train_loss": -19.768444061279297, "global_step": 36012, "epoch": 433} {"train_loss": -19.28481674194336, "global_step": 36013, "epoch": 433} {"train_loss": -18.894441604614258, "global_step": 36014, "epoch": 433} {"train_loss": -19.375732421875, "global_step": 36015, "epoch": 433} {"train_loss": -19.174184799194336, "global_step": 36016, "epoch": 433} {"train_loss": -19.382394790649414, "global_step": 36017, "epoch": 433} {"train_loss": -19.28998374938965, "global_step": 36018, "epoch": 433} {"train_loss": -19.159290313720703, "global_step": 36019, "epoch": 433} {"train_loss": -19.296751022338867, "global_step": 36020, "epoch": 433} {"train_loss": -19.212907170674885, "global_step": 36021, "epoch": 433, "val_loss": 5979122.0} {"train_loss": -19.645551681518555, "global_step": 36022, "epoch": 434} {"train_loss": -19.619245529174805, "global_step": 36023, "epoch": 434} {"train_loss": -18.695154190063477, "global_step": 36024, "epoch": 434} {"train_loss": -19.416933059692383, "global_step": 36025, "epoch": 434} {"train_loss": -19.334577560424805, "global_step": 36026, "epoch": 434} {"train_loss": -19.269086837768555, "global_step": 36027, "epoch": 434} {"train_loss": -19.275419235229492, "global_step": 36028, "epoch": 434} {"train_loss": -18.922826766967773, "global_step": 36029, "epoch": 434} {"train_loss": -19.156845092773438, "global_step": 36030, "epoch": 434} {"train_loss": -19.59805679321289, "global_step": 36031, "epoch": 434} {"train_loss": -19.229324340820312, "global_step": 36032, "epoch": 434} {"train_loss": -19.140409469604492, "global_step": 36033, "epoch": 434} {"train_loss": -19.35017967224121, "global_step": 36034, "epoch": 434} {"train_loss": -19.27601432800293, "global_step": 36035, "epoch": 434} {"train_loss": -19.244237899780273, "global_step": 36036, "epoch": 434} {"train_loss": -19.251672744750977, "global_step": 36037, "epoch": 434} {"train_loss": -18.964736938476562, "global_step": 36038, "epoch": 434} {"train_loss": -19.67496109008789, "global_step": 36039, "epoch": 434} {"train_loss": -19.301733016967773, "global_step": 36040, "epoch": 434} {"train_loss": -19.39638328552246, "global_step": 36041, "epoch": 434} {"train_loss": -18.97614097595215, "global_step": 36042, "epoch": 434} {"train_loss": -18.97458267211914, "global_step": 36043, "epoch": 434} {"train_loss": -19.290281295776367, "global_step": 36044, "epoch": 434} {"train_loss": -19.402490615844727, "global_step": 36045, "epoch": 434} {"train_loss": -19.537622451782227, "global_step": 36046, "epoch": 434} {"train_loss": -19.320545196533203, "global_step": 36047, "epoch": 434} {"train_loss": -19.354827880859375, "global_step": 36048, "epoch": 434} {"train_loss": -19.045303344726562, "global_step": 36049, "epoch": 434} {"train_loss": -19.430017471313477, "global_step": 36050, "epoch": 434} {"train_loss": -19.719167709350586, "global_step": 36051, "epoch": 434} {"train_loss": -19.73605728149414, "global_step": 36052, "epoch": 434} {"train_loss": -19.43568229675293, "global_step": 36053, "epoch": 434} {"train_loss": -19.052284240722656, "global_step": 36054, "epoch": 434} {"train_loss": -19.33789825439453, "global_step": 36055, "epoch": 434} {"train_loss": -18.93859100341797, "global_step": 36056, "epoch": 434} {"train_loss": -19.582828521728516, "global_step": 36057, "epoch": 434} {"train_loss": -19.514822006225586, "global_step": 36058, "epoch": 434} {"train_loss": -19.211027145385742, "global_step": 36059, "epoch": 434} {"train_loss": -19.17989158630371, "global_step": 36060, "epoch": 434} {"train_loss": -19.769336700439453, "global_step": 36061, "epoch": 434} {"train_loss": -19.61903190612793, "global_step": 36062, "epoch": 434} {"train_loss": -19.25264549255371, "global_step": 36063, "epoch": 434} {"train_loss": -19.189123153686523, "global_step": 36064, "epoch": 434} {"train_loss": -18.871923446655273, "global_step": 36065, "epoch": 434} {"train_loss": -18.837812423706055, "global_step": 36066, "epoch": 434} {"train_loss": -19.162229537963867, "global_step": 36067, "epoch": 434} {"train_loss": -18.935195922851562, "global_step": 36068, "epoch": 434} {"train_loss": -18.993497848510742, "global_step": 36069, "epoch": 434} {"train_loss": -19.182462692260742, "global_step": 36070, "epoch": 434} {"train_loss": -19.271806716918945, "global_step": 36071, "epoch": 434} {"train_loss": -19.237770080566406, "global_step": 36072, "epoch": 434} {"train_loss": -18.958179473876953, "global_step": 36073, "epoch": 434} {"train_loss": -19.15835952758789, "global_step": 36074, "epoch": 434} {"train_loss": -19.18693733215332, "global_step": 36075, "epoch": 434} {"train_loss": -19.0764217376709, "global_step": 36076, "epoch": 434} {"train_loss": -18.952360153198242, "global_step": 36077, "epoch": 434} {"train_loss": -19.386001586914062, "global_step": 36078, "epoch": 434} {"train_loss": -19.20418357849121, "global_step": 36079, "epoch": 434} {"train_loss": -19.121606826782227, "global_step": 36080, "epoch": 434} {"train_loss": -18.503925323486328, "global_step": 36081, "epoch": 434} {"train_loss": -19.037118911743164, "global_step": 36082, "epoch": 434} {"train_loss": -19.245441436767578, "global_step": 36083, "epoch": 434} {"train_loss": -18.934083938598633, "global_step": 36084, "epoch": 434} {"train_loss": -18.942174911499023, "global_step": 36085, "epoch": 434} {"train_loss": -19.490570068359375, "global_step": 36086, "epoch": 434} {"train_loss": -19.526844024658203, "global_step": 36087, "epoch": 434} {"train_loss": -19.190528869628906, "global_step": 36088, "epoch": 434} {"train_loss": -19.63058853149414, "global_step": 36089, "epoch": 434} {"train_loss": -19.44769859313965, "global_step": 36090, "epoch": 434} {"train_loss": -19.366342544555664, "global_step": 36091, "epoch": 434} {"train_loss": -19.327144622802734, "global_step": 36092, "epoch": 434} {"train_loss": -19.125654220581055, "global_step": 36093, "epoch": 434} {"train_loss": -19.492414474487305, "global_step": 36094, "epoch": 434} {"train_loss": -19.1804256439209, "global_step": 36095, "epoch": 434} {"train_loss": -19.211008071899414, "global_step": 36096, "epoch": 434} {"train_loss": -18.970563888549805, "global_step": 36097, "epoch": 434} {"train_loss": -19.047046661376953, "global_step": 36098, "epoch": 434} {"train_loss": -19.19671630859375, "global_step": 36099, "epoch": 434} {"train_loss": -19.355878829956055, "global_step": 36100, "epoch": 434} {"train_loss": -19.22062110900879, "global_step": 36101, "epoch": 434} {"train_loss": -19.288679122924805, "global_step": 36102, "epoch": 434} {"train_loss": -19.127365112304688, "global_step": 36103, "epoch": 434} {"train_loss": -19.23706817626953, "global_step": 36104, "epoch": 434, "val_loss": 6031292.0} {"train_loss": -18.835065841674805, "global_step": 36105, "epoch": 435} {"train_loss": -18.70488929748535, "global_step": 36106, "epoch": 435} {"train_loss": -19.15104103088379, "global_step": 36107, "epoch": 435} {"train_loss": -18.545913696289062, "global_step": 36108, "epoch": 435} {"train_loss": -18.54075050354004, "global_step": 36109, "epoch": 435} {"train_loss": -19.235891342163086, "global_step": 36110, "epoch": 435} {"train_loss": -18.914457321166992, "global_step": 36111, "epoch": 435} {"train_loss": -18.68365478515625, "global_step": 36112, "epoch": 435} {"train_loss": -19.188522338867188, "global_step": 36113, "epoch": 435} {"train_loss": -19.293615341186523, "global_step": 36114, "epoch": 435} {"train_loss": -19.180517196655273, "global_step": 36115, "epoch": 435} {"train_loss": -18.987442016601562, "global_step": 36116, "epoch": 435} {"train_loss": -18.773847579956055, "global_step": 36117, "epoch": 435} {"train_loss": -19.209030151367188, "global_step": 36118, "epoch": 435} {"train_loss": -19.170654296875, "global_step": 36119, "epoch": 435} {"train_loss": -18.82857322692871, "global_step": 36120, "epoch": 435} {"train_loss": -19.362680435180664, "global_step": 36121, "epoch": 435} {"train_loss": -18.806665420532227, "global_step": 36122, "epoch": 435} {"train_loss": -19.20954704284668, "global_step": 36123, "epoch": 435} {"train_loss": -19.164020538330078, "global_step": 36124, "epoch": 435} {"train_loss": -18.95626449584961, "global_step": 36125, "epoch": 435} {"train_loss": -19.237747192382812, "global_step": 36126, "epoch": 435} {"train_loss": -19.316984176635742, "global_step": 36127, "epoch": 435} {"train_loss": -18.8721981048584, "global_step": 36128, "epoch": 435} {"train_loss": -19.50324058532715, "global_step": 36129, "epoch": 435} {"train_loss": -18.95850944519043, "global_step": 36130, "epoch": 435} {"train_loss": -19.123321533203125, "global_step": 36131, "epoch": 435} {"train_loss": -19.3220272064209, "global_step": 36132, "epoch": 435} {"train_loss": -19.43967628479004, "global_step": 36133, "epoch": 435} {"train_loss": -19.21866226196289, "global_step": 36134, "epoch": 435} {"train_loss": -18.814311981201172, "global_step": 36135, "epoch": 435} {"train_loss": -19.486303329467773, "global_step": 36136, "epoch": 435} {"train_loss": -19.147144317626953, "global_step": 36137, "epoch": 435} {"train_loss": -19.249006271362305, "global_step": 36138, "epoch": 435} {"train_loss": -19.191150665283203, "global_step": 36139, "epoch": 435} {"train_loss": -19.592727661132812, "global_step": 36140, "epoch": 435} {"train_loss": -19.35591697692871, "global_step": 36141, "epoch": 435} {"train_loss": -19.132360458374023, "global_step": 36142, "epoch": 435} {"train_loss": -19.21687889099121, "global_step": 36143, "epoch": 435} {"train_loss": -19.34524154663086, "global_step": 36144, "epoch": 435} {"train_loss": -19.185245513916016, "global_step": 36145, "epoch": 435} {"train_loss": -19.17624282836914, "global_step": 36146, "epoch": 435} {"train_loss": -19.716928482055664, "global_step": 36147, "epoch": 435} {"train_loss": -19.006305694580078, "global_step": 36148, "epoch": 435} {"train_loss": -19.47711753845215, "global_step": 36149, "epoch": 435} {"train_loss": -19.063522338867188, "global_step": 36150, "epoch": 435} {"train_loss": -19.300125122070312, "global_step": 36151, "epoch": 435} {"train_loss": -19.22481346130371, "global_step": 36152, "epoch": 435} {"train_loss": -19.1627140045166, "global_step": 36153, "epoch": 435} {"train_loss": -19.37872314453125, "global_step": 36154, "epoch": 435} {"train_loss": -19.139976501464844, "global_step": 36155, "epoch": 435} {"train_loss": -19.258167266845703, "global_step": 36156, "epoch": 435} {"train_loss": -19.408254623413086, "global_step": 36157, "epoch": 435} {"train_loss": -19.11313247680664, "global_step": 36158, "epoch": 435} {"train_loss": -19.485563278198242, "global_step": 36159, "epoch": 435} {"train_loss": -19.48720359802246, "global_step": 36160, "epoch": 435} {"train_loss": -19.644798278808594, "global_step": 36161, "epoch": 435} {"train_loss": -19.454044342041016, "global_step": 36162, "epoch": 435} {"train_loss": -19.275047302246094, "global_step": 36163, "epoch": 435} {"train_loss": -19.357389450073242, "global_step": 36164, "epoch": 435} {"train_loss": -19.301197052001953, "global_step": 36165, "epoch": 435} {"train_loss": -19.00665855407715, "global_step": 36166, "epoch": 435} {"train_loss": -19.16297721862793, "global_step": 36167, "epoch": 435} {"train_loss": -19.506006240844727, "global_step": 36168, "epoch": 435} {"train_loss": -19.072423934936523, "global_step": 36169, "epoch": 435} {"train_loss": -19.41327476501465, "global_step": 36170, "epoch": 435} {"train_loss": -19.610082626342773, "global_step": 36171, "epoch": 435} {"train_loss": -19.0731143951416, "global_step": 36172, "epoch": 435} {"train_loss": -19.27033805847168, "global_step": 36173, "epoch": 435} {"train_loss": -19.518142700195312, "global_step": 36174, "epoch": 435} {"train_loss": -19.094839096069336, "global_step": 36175, "epoch": 435} {"train_loss": -19.090713500976562, "global_step": 36176, "epoch": 435} {"train_loss": -18.91047477722168, "global_step": 36177, "epoch": 435} {"train_loss": -19.461862564086914, "global_step": 36178, "epoch": 435} {"train_loss": -19.39124870300293, "global_step": 36179, "epoch": 435} {"train_loss": -19.227645874023438, "global_step": 36180, "epoch": 435} {"train_loss": -18.9519100189209, "global_step": 36181, "epoch": 435} {"train_loss": -19.456159591674805, "global_step": 36182, "epoch": 435} {"train_loss": -18.848237991333008, "global_step": 36183, "epoch": 435} {"train_loss": -19.3647403717041, "global_step": 36184, "epoch": 435} {"train_loss": -18.97161865234375, "global_step": 36185, "epoch": 435} {"train_loss": -19.156835556030273, "global_step": 36186, "epoch": 435} {"train_loss": -19.17895094170628, "global_step": 36187, "epoch": 435, "val_loss": 6187053.0} {"train_loss": -18.41399574279785, "global_step": 36188, "epoch": 436} {"train_loss": -18.936206817626953, "global_step": 36189, "epoch": 436} {"train_loss": -18.638559341430664, "global_step": 36190, "epoch": 436} {"train_loss": -19.209272384643555, "global_step": 36191, "epoch": 436} {"train_loss": -19.447803497314453, "global_step": 36192, "epoch": 436} {"train_loss": -18.929851531982422, "global_step": 36193, "epoch": 436} {"train_loss": -19.114398956298828, "global_step": 36194, "epoch": 436} {"train_loss": -19.045392990112305, "global_step": 36195, "epoch": 436} {"train_loss": -19.004499435424805, "global_step": 36196, "epoch": 436} {"train_loss": -19.254674911499023, "global_step": 36197, "epoch": 436} {"train_loss": -19.296171188354492, "global_step": 36198, "epoch": 436} {"train_loss": -18.952852249145508, "global_step": 36199, "epoch": 436} {"train_loss": -18.97698402404785, "global_step": 36200, "epoch": 436} {"train_loss": -19.16939353942871, "global_step": 36201, "epoch": 436} {"train_loss": -18.94489097595215, "global_step": 36202, "epoch": 436} {"train_loss": -19.149982452392578, "global_step": 36203, "epoch": 436} {"train_loss": -19.25447654724121, "global_step": 36204, "epoch": 436} {"train_loss": -18.89255142211914, "global_step": 36205, "epoch": 436} {"train_loss": -18.982824325561523, "global_step": 36206, "epoch": 436} {"train_loss": -19.644123077392578, "global_step": 36207, "epoch": 436} {"train_loss": -19.507028579711914, "global_step": 36208, "epoch": 436} {"train_loss": -19.138574600219727, "global_step": 36209, "epoch": 436} {"train_loss": -19.30196189880371, "global_step": 36210, "epoch": 436} {"train_loss": -19.010282516479492, "global_step": 36211, "epoch": 436} {"train_loss": -19.20892333984375, "global_step": 36212, "epoch": 436} {"train_loss": -19.020923614501953, "global_step": 36213, "epoch": 436} {"train_loss": -19.20914649963379, "global_step": 36214, "epoch": 436} {"train_loss": -19.16217803955078, "global_step": 36215, "epoch": 436} {"train_loss": -19.377811431884766, "global_step": 36216, "epoch": 436} {"train_loss": -19.213138580322266, "global_step": 36217, "epoch": 436} {"train_loss": -19.24261474609375, "global_step": 36218, "epoch": 436} {"train_loss": -19.17751121520996, "global_step": 36219, "epoch": 436} {"train_loss": -19.423404693603516, "global_step": 36220, "epoch": 436} {"train_loss": -19.162399291992188, "global_step": 36221, "epoch": 436} {"train_loss": -19.2137508392334, "global_step": 36222, "epoch": 436} {"train_loss": -19.178110122680664, "global_step": 36223, "epoch": 436} {"train_loss": -19.262990951538086, "global_step": 36224, "epoch": 436} {"train_loss": -19.281389236450195, "global_step": 36225, "epoch": 436} {"train_loss": -19.05118751525879, "global_step": 36226, "epoch": 436} {"train_loss": -19.52808380126953, "global_step": 36227, "epoch": 436} {"train_loss": -19.293550491333008, "global_step": 36228, "epoch": 436} {"train_loss": -18.80470848083496, "global_step": 36229, "epoch": 436} {"train_loss": -19.44754409790039, "global_step": 36230, "epoch": 436} {"train_loss": -19.04130744934082, "global_step": 36231, "epoch": 436} {"train_loss": -19.504858016967773, "global_step": 36232, "epoch": 436} {"train_loss": -19.349838256835938, "global_step": 36233, "epoch": 436} {"train_loss": -18.96131706237793, "global_step": 36234, "epoch": 436} {"train_loss": -19.479394912719727, "global_step": 36235, "epoch": 436} {"train_loss": -19.416481018066406, "global_step": 36236, "epoch": 436} {"train_loss": -19.14772605895996, "global_step": 36237, "epoch": 436} {"train_loss": -19.401227951049805, "global_step": 36238, "epoch": 436} {"train_loss": -19.05850601196289, "global_step": 36239, "epoch": 436} {"train_loss": -19.707910537719727, "global_step": 36240, "epoch": 436} {"train_loss": -19.252729415893555, "global_step": 36241, "epoch": 436} {"train_loss": -19.3415470123291, "global_step": 36242, "epoch": 436} {"train_loss": -19.3122615814209, "global_step": 36243, "epoch": 436} {"train_loss": -19.449758529663086, "global_step": 36244, "epoch": 436} {"train_loss": -19.21119499206543, "global_step": 36245, "epoch": 436} {"train_loss": -19.20911979675293, "global_step": 36246, "epoch": 436} {"train_loss": -19.431812286376953, "global_step": 36247, "epoch": 436} {"train_loss": -19.242998123168945, "global_step": 36248, "epoch": 436} {"train_loss": -19.024267196655273, "global_step": 36249, "epoch": 436} {"train_loss": -19.49123191833496, "global_step": 36250, "epoch": 436} {"train_loss": -19.10298728942871, "global_step": 36251, "epoch": 436} {"train_loss": -19.27488136291504, "global_step": 36252, "epoch": 436} {"train_loss": -19.502004623413086, "global_step": 36253, "epoch": 436} {"train_loss": -19.125547409057617, "global_step": 36254, "epoch": 436} {"train_loss": -19.062360763549805, "global_step": 36255, "epoch": 436} {"train_loss": -18.840295791625977, "global_step": 36256, "epoch": 436} {"train_loss": -19.359786987304688, "global_step": 36257, "epoch": 436} {"train_loss": -19.254261016845703, "global_step": 36258, "epoch": 436} {"train_loss": -19.15435218811035, "global_step": 36259, "epoch": 436} {"train_loss": -19.30140495300293, "global_step": 36260, "epoch": 436} {"train_loss": -19.051801681518555, "global_step": 36261, "epoch": 436} {"train_loss": -19.63361167907715, "global_step": 36262, "epoch": 436} {"train_loss": -19.46187400817871, "global_step": 36263, "epoch": 436} {"train_loss": -19.217666625976562, "global_step": 36264, "epoch": 436} {"train_loss": -19.323904037475586, "global_step": 36265, "epoch": 436} {"train_loss": -18.956836700439453, "global_step": 36266, "epoch": 436} {"train_loss": -19.47877311706543, "global_step": 36267, "epoch": 436} {"train_loss": -19.1722354888916, "global_step": 36268, "epoch": 436} {"train_loss": -19.480628967285156, "global_step": 36269, "epoch": 436} {"train_loss": -19.21992616768343, "global_step": 36270, "epoch": 436, "val_loss": 5892672.5} {"train_loss": -18.88498878479004, "global_step": 36271, "epoch": 437} {"train_loss": -18.743663787841797, "global_step": 36272, "epoch": 437} {"train_loss": -19.248929977416992, "global_step": 36273, "epoch": 437} {"train_loss": -18.981372833251953, "global_step": 36274, "epoch": 437} {"train_loss": -19.035533905029297, "global_step": 36275, "epoch": 437} {"train_loss": -19.17812156677246, "global_step": 36276, "epoch": 437} {"train_loss": -19.36749267578125, "global_step": 36277, "epoch": 437} {"train_loss": -18.999486923217773, "global_step": 36278, "epoch": 437} {"train_loss": -19.050134658813477, "global_step": 36279, "epoch": 437} {"train_loss": -19.168317794799805, "global_step": 36280, "epoch": 437} {"train_loss": -19.14420509338379, "global_step": 36281, "epoch": 437} {"train_loss": -19.431045532226562, "global_step": 36282, "epoch": 437} {"train_loss": -19.26825714111328, "global_step": 36283, "epoch": 437} {"train_loss": -18.976926803588867, "global_step": 36284, "epoch": 437} {"train_loss": -19.102304458618164, "global_step": 36285, "epoch": 437} {"train_loss": -18.90113639831543, "global_step": 36286, "epoch": 437} {"train_loss": -18.934457778930664, "global_step": 36287, "epoch": 437} {"train_loss": -19.616451263427734, "global_step": 36288, "epoch": 437} {"train_loss": -19.42580223083496, "global_step": 36289, "epoch": 437} {"train_loss": -19.35883903503418, "global_step": 36290, "epoch": 437} {"train_loss": -19.455068588256836, "global_step": 36291, "epoch": 437} {"train_loss": -18.91717529296875, "global_step": 36292, "epoch": 437} {"train_loss": -19.43437957763672, "global_step": 36293, "epoch": 437} {"train_loss": -19.045230865478516, "global_step": 36294, "epoch": 437} {"train_loss": -19.1060848236084, "global_step": 36295, "epoch": 437} {"train_loss": -19.442907333374023, "global_step": 36296, "epoch": 437} {"train_loss": -19.372690200805664, "global_step": 36297, "epoch": 437} {"train_loss": -19.36763572692871, "global_step": 36298, "epoch": 437} {"train_loss": -19.07355308532715, "global_step": 36299, "epoch": 437} {"train_loss": -19.147520065307617, "global_step": 36300, "epoch": 437} {"train_loss": -19.412153244018555, "global_step": 36301, "epoch": 437} {"train_loss": -19.710474014282227, "global_step": 36302, "epoch": 437} {"train_loss": -19.13899040222168, "global_step": 36303, "epoch": 437} {"train_loss": -19.14235496520996, "global_step": 36304, "epoch": 437} {"train_loss": -19.52846336364746, "global_step": 36305, "epoch": 437} {"train_loss": -19.20927619934082, "global_step": 36306, "epoch": 437} {"train_loss": -19.575458526611328, "global_step": 36307, "epoch": 437} {"train_loss": -19.39105796813965, "global_step": 36308, "epoch": 437} {"train_loss": -19.378454208374023, "global_step": 36309, "epoch": 437} {"train_loss": -18.600650787353516, "global_step": 36310, "epoch": 437} {"train_loss": -19.156631469726562, "global_step": 36311, "epoch": 437} {"train_loss": -19.231016159057617, "global_step": 36312, "epoch": 437} {"train_loss": -19.16859245300293, "global_step": 36313, "epoch": 437} {"train_loss": -19.20225715637207, "global_step": 36314, "epoch": 437} {"train_loss": -19.329626083374023, "global_step": 36315, "epoch": 437} {"train_loss": -19.144094467163086, "global_step": 36316, "epoch": 437} {"train_loss": -19.39655303955078, "global_step": 36317, "epoch": 437} {"train_loss": -19.15691566467285, "global_step": 36318, "epoch": 437} {"train_loss": -19.610376358032227, "global_step": 36319, "epoch": 437} {"train_loss": -19.373197555541992, "global_step": 36320, "epoch": 437} {"train_loss": -19.07094383239746, "global_step": 36321, "epoch": 437} {"train_loss": -19.451875686645508, "global_step": 36322, "epoch": 437} {"train_loss": -18.892133712768555, "global_step": 36323, "epoch": 437} {"train_loss": -19.218814849853516, "global_step": 36324, "epoch": 437} {"train_loss": -19.4719295501709, "global_step": 36325, "epoch": 437} {"train_loss": -19.080076217651367, "global_step": 36326, "epoch": 437} {"train_loss": -19.25800895690918, "global_step": 36327, "epoch": 437} {"train_loss": -19.43619728088379, "global_step": 36328, "epoch": 437} {"train_loss": -19.08624839782715, "global_step": 36329, "epoch": 437} {"train_loss": -19.281192779541016, "global_step": 36330, "epoch": 437} {"train_loss": -19.195531845092773, "global_step": 36331, "epoch": 437} {"train_loss": -19.340564727783203, "global_step": 36332, "epoch": 437} {"train_loss": -19.61151123046875, "global_step": 36333, "epoch": 437} {"train_loss": -19.373815536499023, "global_step": 36334, "epoch": 437} {"train_loss": -19.084861755371094, "global_step": 36335, "epoch": 437} {"train_loss": -19.298389434814453, "global_step": 36336, "epoch": 437} {"train_loss": -19.185636520385742, "global_step": 36337, "epoch": 437} {"train_loss": -19.009750366210938, "global_step": 36338, "epoch": 437} {"train_loss": -19.207670211791992, "global_step": 36339, "epoch": 437} {"train_loss": -18.96503448486328, "global_step": 36340, "epoch": 437} {"train_loss": -19.28281593322754, "global_step": 36341, "epoch": 437} {"train_loss": -19.22779083251953, "global_step": 36342, "epoch": 437} {"train_loss": -19.145580291748047, "global_step": 36343, "epoch": 437} {"train_loss": -19.289846420288086, "global_step": 36344, "epoch": 437} {"train_loss": -18.911386489868164, "global_step": 36345, "epoch": 437} {"train_loss": -19.473241806030273, "global_step": 36346, "epoch": 437} {"train_loss": -19.081253051757812, "global_step": 36347, "epoch": 437} {"train_loss": -19.418163299560547, "global_step": 36348, "epoch": 437} {"train_loss": -19.061782836914062, "global_step": 36349, "epoch": 437} {"train_loss": -19.233304977416992, "global_step": 36350, "epoch": 437} {"train_loss": -19.556018829345703, "global_step": 36351, "epoch": 437} {"train_loss": -19.112173080444336, "global_step": 36352, "epoch": 437} {"train_loss": -19.2232173092394, "global_step": 36353, "epoch": 437, "val_loss": 5940638.5} {"train_loss": -18.574064254760742, "global_step": 36354, "epoch": 438} {"train_loss": -19.070415496826172, "global_step": 36355, "epoch": 438} {"train_loss": -19.025178909301758, "global_step": 36356, "epoch": 438} {"train_loss": -18.556943893432617, "global_step": 36357, "epoch": 438} {"train_loss": -19.04679298400879, "global_step": 36358, "epoch": 438} {"train_loss": -18.800024032592773, "global_step": 36359, "epoch": 438} {"train_loss": -18.654470443725586, "global_step": 36360, "epoch": 438} {"train_loss": -18.892019271850586, "global_step": 36361, "epoch": 438} {"train_loss": -19.13982582092285, "global_step": 36362, "epoch": 438} {"train_loss": -18.664148330688477, "global_step": 36363, "epoch": 438} {"train_loss": -18.657133102416992, "global_step": 36364, "epoch": 438} {"train_loss": -19.1915283203125, "global_step": 36365, "epoch": 438} {"train_loss": -19.389787673950195, "global_step": 36366, "epoch": 438} {"train_loss": -19.331222534179688, "global_step": 36367, "epoch": 438} {"train_loss": -18.855865478515625, "global_step": 36368, "epoch": 438} {"train_loss": -19.13743019104004, "global_step": 36369, "epoch": 438} {"train_loss": -19.05745506286621, "global_step": 36370, "epoch": 438} {"train_loss": -19.10929298400879, "global_step": 36371, "epoch": 438} {"train_loss": -19.060638427734375, "global_step": 36372, "epoch": 438} {"train_loss": -19.25244903564453, "global_step": 36373, "epoch": 438} {"train_loss": -19.086645126342773, "global_step": 36374, "epoch": 438} {"train_loss": -19.326086044311523, "global_step": 36375, "epoch": 438} {"train_loss": -19.46367835998535, "global_step": 36376, "epoch": 438} {"train_loss": -19.227941513061523, "global_step": 36377, "epoch": 438} {"train_loss": -19.511173248291016, "global_step": 36378, "epoch": 438} {"train_loss": -19.19961929321289, "global_step": 36379, "epoch": 438} {"train_loss": -19.215591430664062, "global_step": 36380, "epoch": 438} {"train_loss": -19.13079833984375, "global_step": 36381, "epoch": 438} {"train_loss": -18.754915237426758, "global_step": 36382, "epoch": 438} {"train_loss": -19.258657455444336, "global_step": 36383, "epoch": 438} {"train_loss": -19.391626358032227, "global_step": 36384, "epoch": 438} {"train_loss": -19.45273780822754, "global_step": 36385, "epoch": 438} {"train_loss": -19.200714111328125, "global_step": 36386, "epoch": 438} {"train_loss": -19.170772552490234, "global_step": 36387, "epoch": 438} {"train_loss": -19.259063720703125, "global_step": 36388, "epoch": 438} {"train_loss": -19.326475143432617, "global_step": 36389, "epoch": 438} {"train_loss": -19.25472068786621, "global_step": 36390, "epoch": 438} {"train_loss": -19.258319854736328, "global_step": 36391, "epoch": 438} {"train_loss": -19.221952438354492, "global_step": 36392, "epoch": 438} {"train_loss": -18.97650718688965, "global_step": 36393, "epoch": 438} {"train_loss": -19.21401023864746, "global_step": 36394, "epoch": 438} {"train_loss": -19.59345054626465, "global_step": 36395, "epoch": 438} {"train_loss": -19.028610229492188, "global_step": 36396, "epoch": 438} {"train_loss": -19.24273681640625, "global_step": 36397, "epoch": 438} {"train_loss": -19.2570858001709, "global_step": 36398, "epoch": 438} {"train_loss": -19.219873428344727, "global_step": 36399, "epoch": 438} {"train_loss": -19.159597396850586, "global_step": 36400, "epoch": 438} {"train_loss": -19.661344528198242, "global_step": 36401, "epoch": 438} {"train_loss": -18.70491600036621, "global_step": 36402, "epoch": 438} {"train_loss": -19.096649169921875, "global_step": 36403, "epoch": 438} {"train_loss": -19.03148651123047, "global_step": 36404, "epoch": 438} {"train_loss": -19.539777755737305, "global_step": 36405, "epoch": 438} {"train_loss": -19.281726837158203, "global_step": 36406, "epoch": 438} {"train_loss": -19.234434127807617, "global_step": 36407, "epoch": 438} {"train_loss": -19.27060890197754, "global_step": 36408, "epoch": 438} {"train_loss": -19.218921661376953, "global_step": 36409, "epoch": 438} {"train_loss": -19.311193466186523, "global_step": 36410, "epoch": 438} {"train_loss": -19.341087341308594, "global_step": 36411, "epoch": 438} {"train_loss": -19.250341415405273, "global_step": 36412, "epoch": 438} {"train_loss": -18.96040916442871, "global_step": 36413, "epoch": 438} {"train_loss": -19.423221588134766, "global_step": 36414, "epoch": 438} {"train_loss": -19.339826583862305, "global_step": 36415, "epoch": 438} {"train_loss": -19.143720626831055, "global_step": 36416, "epoch": 438} {"train_loss": -19.35487937927246, "global_step": 36417, "epoch": 438} {"train_loss": -19.03675651550293, "global_step": 36418, "epoch": 438} {"train_loss": -19.472265243530273, "global_step": 36419, "epoch": 438} {"train_loss": -19.301721572875977, "global_step": 36420, "epoch": 438} {"train_loss": -19.141756057739258, "global_step": 36421, "epoch": 438} {"train_loss": -19.414724349975586, "global_step": 36422, "epoch": 438} {"train_loss": -19.30722999572754, "global_step": 36423, "epoch": 438} {"train_loss": -19.057260513305664, "global_step": 36424, "epoch": 438} {"train_loss": -19.255285263061523, "global_step": 36425, "epoch": 438} {"train_loss": -19.377466201782227, "global_step": 36426, "epoch": 438} {"train_loss": -19.21200180053711, "global_step": 36427, "epoch": 438} {"train_loss": -19.433490753173828, "global_step": 36428, "epoch": 438} {"train_loss": -19.118276596069336, "global_step": 36429, "epoch": 438} {"train_loss": -19.665983200073242, "global_step": 36430, "epoch": 438} {"train_loss": -19.650182723999023, "global_step": 36431, "epoch": 438} {"train_loss": -19.0627498626709, "global_step": 36432, "epoch": 438} {"train_loss": -19.222524642944336, "global_step": 36433, "epoch": 438} {"train_loss": -19.343994140625, "global_step": 36434, "epoch": 438} {"train_loss": -19.534677505493164, "global_step": 36435, "epoch": 438} {"train_loss": -19.186730763998376, "global_step": 36436, "epoch": 438, "val_loss": 6019241.0} {"train_loss": -18.96487808227539, "global_step": 36437, "epoch": 439} {"train_loss": -19.193471908569336, "global_step": 36438, "epoch": 439} {"train_loss": -19.406021118164062, "global_step": 36439, "epoch": 439} {"train_loss": -19.412927627563477, "global_step": 36440, "epoch": 439} {"train_loss": -18.924903869628906, "global_step": 36441, "epoch": 439} {"train_loss": -19.171422958374023, "global_step": 36442, "epoch": 439} {"train_loss": -19.44388771057129, "global_step": 36443, "epoch": 439} {"train_loss": -19.329557418823242, "global_step": 36444, "epoch": 439} {"train_loss": -19.222814559936523, "global_step": 36445, "epoch": 439} {"train_loss": -19.191251754760742, "global_step": 36446, "epoch": 439} {"train_loss": -19.236392974853516, "global_step": 36447, "epoch": 439} {"train_loss": -18.858327865600586, "global_step": 36448, "epoch": 439} {"train_loss": -18.845874786376953, "global_step": 36449, "epoch": 439} {"train_loss": -19.002662658691406, "global_step": 36450, "epoch": 439} {"train_loss": -19.129486083984375, "global_step": 36451, "epoch": 439} {"train_loss": -19.49817657470703, "global_step": 36452, "epoch": 439} {"train_loss": -19.39642906188965, "global_step": 36453, "epoch": 439} {"train_loss": -19.2120361328125, "global_step": 36454, "epoch": 439} {"train_loss": -19.108386993408203, "global_step": 36455, "epoch": 439} {"train_loss": -19.145917892456055, "global_step": 36456, "epoch": 439} {"train_loss": -19.520498275756836, "global_step": 36457, "epoch": 439} {"train_loss": -19.568029403686523, "global_step": 36458, "epoch": 439} {"train_loss": -19.17818832397461, "global_step": 36459, "epoch": 439} {"train_loss": -19.09673500061035, "global_step": 36460, "epoch": 439} {"train_loss": -19.4265193939209, "global_step": 36461, "epoch": 439} {"train_loss": -19.77974510192871, "global_step": 36462, "epoch": 439} {"train_loss": -19.314695358276367, "global_step": 36463, "epoch": 439} {"train_loss": -19.1208553314209, "global_step": 36464, "epoch": 439} {"train_loss": -19.16886329650879, "global_step": 36465, "epoch": 439} {"train_loss": -19.451141357421875, "global_step": 36466, "epoch": 439} {"train_loss": -19.683639526367188, "global_step": 36467, "epoch": 439} {"train_loss": -18.99291229248047, "global_step": 36468, "epoch": 439} {"train_loss": -19.858531951904297, "global_step": 36469, "epoch": 439} {"train_loss": -19.095352172851562, "global_step": 36470, "epoch": 439} {"train_loss": -19.349374771118164, "global_step": 36471, "epoch": 439} {"train_loss": -19.555423736572266, "global_step": 36472, "epoch": 439} {"train_loss": -19.236133575439453, "global_step": 36473, "epoch": 439} {"train_loss": -19.546545028686523, "global_step": 36474, "epoch": 439} {"train_loss": -19.177780151367188, "global_step": 36475, "epoch": 439} {"train_loss": -19.439640045166016, "global_step": 36476, "epoch": 439} {"train_loss": -19.242481231689453, "global_step": 36477, "epoch": 439} {"train_loss": -19.63465690612793, "global_step": 36478, "epoch": 439} {"train_loss": -19.112699508666992, "global_step": 36479, "epoch": 439} {"train_loss": -19.321664810180664, "global_step": 36480, "epoch": 439} {"train_loss": -19.237573623657227, "global_step": 36481, "epoch": 439} {"train_loss": -19.096134185791016, "global_step": 36482, "epoch": 439} {"train_loss": -19.57041358947754, "global_step": 36483, "epoch": 439} {"train_loss": -19.20606231689453, "global_step": 36484, "epoch": 439} {"train_loss": -19.10350227355957, "global_step": 36485, "epoch": 439} {"train_loss": -19.32784080505371, "global_step": 36486, "epoch": 439} {"train_loss": -19.047805786132812, "global_step": 36487, "epoch": 439} {"train_loss": -19.276853561401367, "global_step": 36488, "epoch": 439} {"train_loss": -19.37428092956543, "global_step": 36489, "epoch": 439} {"train_loss": -19.58953857421875, "global_step": 36490, "epoch": 439} {"train_loss": -19.03716278076172, "global_step": 36491, "epoch": 439} {"train_loss": -19.531787872314453, "global_step": 36492, "epoch": 439} {"train_loss": -19.553075790405273, "global_step": 36493, "epoch": 439} {"train_loss": -19.32673454284668, "global_step": 36494, "epoch": 439} {"train_loss": -19.351125717163086, "global_step": 36495, "epoch": 439} {"train_loss": -19.551788330078125, "global_step": 36496, "epoch": 439} {"train_loss": -18.90105628967285, "global_step": 36497, "epoch": 439} {"train_loss": -19.250890731811523, "global_step": 36498, "epoch": 439} {"train_loss": -19.165739059448242, "global_step": 36499, "epoch": 439} {"train_loss": -19.13652229309082, "global_step": 36500, "epoch": 439} {"train_loss": -19.089054107666016, "global_step": 36501, "epoch": 439} {"train_loss": -18.8909854888916, "global_step": 36502, "epoch": 439} {"train_loss": -19.44731903076172, "global_step": 36503, "epoch": 439} {"train_loss": -18.991992950439453, "global_step": 36504, "epoch": 439} {"train_loss": -18.968019485473633, "global_step": 36505, "epoch": 439} {"train_loss": -18.873567581176758, "global_step": 36506, "epoch": 439} {"train_loss": -19.411619186401367, "global_step": 36507, "epoch": 439} {"train_loss": -18.821739196777344, "global_step": 36508, "epoch": 439} {"train_loss": -19.191442489624023, "global_step": 36509, "epoch": 439} {"train_loss": -19.02357292175293, "global_step": 36510, "epoch": 439} {"train_loss": -19.256925582885742, "global_step": 36511, "epoch": 439} {"train_loss": -19.18061637878418, "global_step": 36512, "epoch": 439} {"train_loss": -19.216989517211914, "global_step": 36513, "epoch": 439} {"train_loss": -19.800504684448242, "global_step": 36514, "epoch": 439} {"train_loss": -19.315641403198242, "global_step": 36515, "epoch": 439} {"train_loss": -19.38907241821289, "global_step": 36516, "epoch": 439} {"train_loss": -19.1545352935791, "global_step": 36517, "epoch": 439} {"train_loss": -19.54908561706543, "global_step": 36518, "epoch": 439} {"train_loss": -19.27788578171328, "global_step": 36519, "epoch": 439, "val_loss": 5964495.5} {"train_loss": -18.94257164001465, "global_step": 36520, "epoch": 440} {"train_loss": -18.790830612182617, "global_step": 36521, "epoch": 440} {"train_loss": -18.826717376708984, "global_step": 36522, "epoch": 440} {"train_loss": -19.370363235473633, "global_step": 36523, "epoch": 440} {"train_loss": -19.28201675415039, "global_step": 36524, "epoch": 440} {"train_loss": -18.983821868896484, "global_step": 36525, "epoch": 440} {"train_loss": -19.092041015625, "global_step": 36526, "epoch": 440} {"train_loss": -19.069971084594727, "global_step": 36527, "epoch": 440} {"train_loss": -19.2546443939209, "global_step": 36528, "epoch": 440} {"train_loss": -19.00386619567871, "global_step": 36529, "epoch": 440} {"train_loss": -19.100914001464844, "global_step": 36530, "epoch": 440} {"train_loss": -19.21015739440918, "global_step": 36531, "epoch": 440} {"train_loss": -19.140884399414062, "global_step": 36532, "epoch": 440} {"train_loss": -19.28461456298828, "global_step": 36533, "epoch": 440} {"train_loss": -18.969999313354492, "global_step": 36534, "epoch": 440} {"train_loss": -19.46978759765625, "global_step": 36535, "epoch": 440} {"train_loss": -19.229461669921875, "global_step": 36536, "epoch": 440} {"train_loss": -19.367305755615234, "global_step": 36537, "epoch": 440} {"train_loss": -19.30755043029785, "global_step": 36538, "epoch": 440} {"train_loss": -19.140207290649414, "global_step": 36539, "epoch": 440} {"train_loss": -19.217294692993164, "global_step": 36540, "epoch": 440} {"train_loss": -19.25420570373535, "global_step": 36541, "epoch": 440} {"train_loss": -19.396352767944336, "global_step": 36542, "epoch": 440} {"train_loss": -19.344797134399414, "global_step": 36543, "epoch": 440} {"train_loss": -19.216415405273438, "global_step": 36544, "epoch": 440} {"train_loss": -19.16164207458496, "global_step": 36545, "epoch": 440} {"train_loss": -18.998777389526367, "global_step": 36546, "epoch": 440} {"train_loss": -19.39108657836914, "global_step": 36547, "epoch": 440} {"train_loss": -19.467105865478516, "global_step": 36548, "epoch": 440} {"train_loss": -19.15017318725586, "global_step": 36549, "epoch": 440} {"train_loss": -19.365530014038086, "global_step": 36550, "epoch": 440} {"train_loss": -19.547409057617188, "global_step": 36551, "epoch": 440} {"train_loss": -19.336244583129883, "global_step": 36552, "epoch": 440} {"train_loss": -19.000869750976562, "global_step": 36553, "epoch": 440} {"train_loss": -19.102819442749023, "global_step": 36554, "epoch": 440} {"train_loss": -19.394609451293945, "global_step": 36555, "epoch": 440} {"train_loss": -19.273685455322266, "global_step": 36556, "epoch": 440} {"train_loss": -19.436065673828125, "global_step": 36557, "epoch": 440} {"train_loss": -19.396024703979492, "global_step": 36558, "epoch": 440} {"train_loss": -19.27820587158203, "global_step": 36559, "epoch": 440} {"train_loss": -19.353273391723633, "global_step": 36560, "epoch": 440} {"train_loss": -19.433088302612305, "global_step": 36561, "epoch": 440} {"train_loss": -19.136417388916016, "global_step": 36562, "epoch": 440} {"train_loss": -19.643577575683594, "global_step": 36563, "epoch": 440} {"train_loss": -19.42475700378418, "global_step": 36564, "epoch": 440} {"train_loss": -19.53678321838379, "global_step": 36565, "epoch": 440} {"train_loss": -19.2175350189209, "global_step": 36566, "epoch": 440} {"train_loss": -19.201053619384766, "global_step": 36567, "epoch": 440} {"train_loss": -19.321847915649414, "global_step": 36568, "epoch": 440} {"train_loss": -19.405254364013672, "global_step": 36569, "epoch": 440} {"train_loss": -19.175989151000977, "global_step": 36570, "epoch": 440} {"train_loss": -19.480134963989258, "global_step": 36571, "epoch": 440} {"train_loss": -19.27296257019043, "global_step": 36572, "epoch": 440} {"train_loss": -19.24283790588379, "global_step": 36573, "epoch": 440} {"train_loss": -19.603702545166016, "global_step": 36574, "epoch": 440} {"train_loss": -19.551240921020508, "global_step": 36575, "epoch": 440} {"train_loss": -19.045034408569336, "global_step": 36576, "epoch": 440} {"train_loss": -19.330154418945312, "global_step": 36577, "epoch": 440} {"train_loss": -19.534391403198242, "global_step": 36578, "epoch": 440} {"train_loss": -19.378355026245117, "global_step": 36579, "epoch": 440} {"train_loss": -19.268022537231445, "global_step": 36580, "epoch": 440} {"train_loss": -19.453628540039062, "global_step": 36581, "epoch": 440} {"train_loss": -18.942264556884766, "global_step": 36582, "epoch": 440} {"train_loss": -19.527902603149414, "global_step": 36583, "epoch": 440} {"train_loss": -19.43032455444336, "global_step": 36584, "epoch": 440} {"train_loss": -19.136560440063477, "global_step": 36585, "epoch": 440} {"train_loss": -19.239227294921875, "global_step": 36586, "epoch": 440} {"train_loss": -19.448455810546875, "global_step": 36587, "epoch": 440} {"train_loss": -19.29558563232422, "global_step": 36588, "epoch": 440} {"train_loss": -19.25331687927246, "global_step": 36589, "epoch": 440} {"train_loss": -19.439712524414062, "global_step": 36590, "epoch": 440} {"train_loss": -18.974040985107422, "global_step": 36591, "epoch": 440} {"train_loss": -19.269886016845703, "global_step": 36592, "epoch": 440} {"train_loss": -19.483572006225586, "global_step": 36593, "epoch": 440} {"train_loss": -19.29767608642578, "global_step": 36594, "epoch": 440} {"train_loss": -19.05703353881836, "global_step": 36595, "epoch": 440} {"train_loss": -19.19919776916504, "global_step": 36596, "epoch": 440} {"train_loss": -19.018735885620117, "global_step": 36597, "epoch": 440} {"train_loss": -19.12775993347168, "global_step": 36598, "epoch": 440} {"train_loss": -19.274646759033203, "global_step": 36599, "epoch": 440} {"train_loss": -19.12828254699707, "global_step": 36600, "epoch": 440} {"train_loss": -19.715003967285156, "global_step": 36601, "epoch": 440} {"train_loss": -19.26969091576266, "global_step": 36602, "epoch": 440, "val_loss": 5955540.0} {"train_loss": -19.22188377380371, "global_step": 36603, "epoch": 441} {"train_loss": -18.917951583862305, "global_step": 36604, "epoch": 441} {"train_loss": -18.911352157592773, "global_step": 36605, "epoch": 441} {"train_loss": -19.278995513916016, "global_step": 36606, "epoch": 441} {"train_loss": -19.082931518554688, "global_step": 36607, "epoch": 441} {"train_loss": -19.332447052001953, "global_step": 36608, "epoch": 441} {"train_loss": -19.5963077545166, "global_step": 36609, "epoch": 441} {"train_loss": -19.1173095703125, "global_step": 36610, "epoch": 441} {"train_loss": -19.039623260498047, "global_step": 36611, "epoch": 441} {"train_loss": -19.27257537841797, "global_step": 36612, "epoch": 441} {"train_loss": -19.006052017211914, "global_step": 36613, "epoch": 441} {"train_loss": -19.31682777404785, "global_step": 36614, "epoch": 441} {"train_loss": -19.22015953063965, "global_step": 36615, "epoch": 441} {"train_loss": -19.611494064331055, "global_step": 36616, "epoch": 441} {"train_loss": -19.503952026367188, "global_step": 36617, "epoch": 441} {"train_loss": -19.1014461517334, "global_step": 36618, "epoch": 441} {"train_loss": -19.014041900634766, "global_step": 36619, "epoch": 441} {"train_loss": -19.18985939025879, "global_step": 36620, "epoch": 441} {"train_loss": -19.414541244506836, "global_step": 36621, "epoch": 441} {"train_loss": -19.343198776245117, "global_step": 36622, "epoch": 441} {"train_loss": -19.437911987304688, "global_step": 36623, "epoch": 441} {"train_loss": -19.026512145996094, "global_step": 36624, "epoch": 441} {"train_loss": -18.948850631713867, "global_step": 36625, "epoch": 441} {"train_loss": -19.021146774291992, "global_step": 36626, "epoch": 441} {"train_loss": -18.922943115234375, "global_step": 36627, "epoch": 441} {"train_loss": -19.223325729370117, "global_step": 36628, "epoch": 441} {"train_loss": -19.453481674194336, "global_step": 36629, "epoch": 441} {"train_loss": -19.249685287475586, "global_step": 36630, "epoch": 441} {"train_loss": -19.468032836914062, "global_step": 36631, "epoch": 441} {"train_loss": -18.943130493164062, "global_step": 36632, "epoch": 441} {"train_loss": -19.412826538085938, "global_step": 36633, "epoch": 441} {"train_loss": -19.11050796508789, "global_step": 36634, "epoch": 441} {"train_loss": -19.440353393554688, "global_step": 36635, "epoch": 441} {"train_loss": -19.677648544311523, "global_step": 36636, "epoch": 441} {"train_loss": -19.442670822143555, "global_step": 36637, "epoch": 441} {"train_loss": -19.557701110839844, "global_step": 36638, "epoch": 441} {"train_loss": -18.999197006225586, "global_step": 36639, "epoch": 441} {"train_loss": -18.923429489135742, "global_step": 36640, "epoch": 441} {"train_loss": -18.80379867553711, "global_step": 36641, "epoch": 441} {"train_loss": -19.37233543395996, "global_step": 36642, "epoch": 441} {"train_loss": -19.163969039916992, "global_step": 36643, "epoch": 441} {"train_loss": -19.279142379760742, "global_step": 36644, "epoch": 441} {"train_loss": -19.382930755615234, "global_step": 36645, "epoch": 441} {"train_loss": -19.041555404663086, "global_step": 36646, "epoch": 441} {"train_loss": -18.894506454467773, "global_step": 36647, "epoch": 441} {"train_loss": -19.091632843017578, "global_step": 36648, "epoch": 441} {"train_loss": -19.32015037536621, "global_step": 36649, "epoch": 441} {"train_loss": -18.942522048950195, "global_step": 36650, "epoch": 441} {"train_loss": -19.80905532836914, "global_step": 36651, "epoch": 441} {"train_loss": -18.87583351135254, "global_step": 36652, "epoch": 441} {"train_loss": -19.38058090209961, "global_step": 36653, "epoch": 441} {"train_loss": -19.3512020111084, "global_step": 36654, "epoch": 441} {"train_loss": -19.435407638549805, "global_step": 36655, "epoch": 441} {"train_loss": -19.376943588256836, "global_step": 36656, "epoch": 441} {"train_loss": -19.078079223632812, "global_step": 36657, "epoch": 441} {"train_loss": -19.496973037719727, "global_step": 36658, "epoch": 441} {"train_loss": -19.528348922729492, "global_step": 36659, "epoch": 441} {"train_loss": -19.22089958190918, "global_step": 36660, "epoch": 441} {"train_loss": -19.284006118774414, "global_step": 36661, "epoch": 441} {"train_loss": -19.593826293945312, "global_step": 36662, "epoch": 441} {"train_loss": -19.944536209106445, "global_step": 36663, "epoch": 441} {"train_loss": -19.69782829284668, "global_step": 36664, "epoch": 441} {"train_loss": -18.936473846435547, "global_step": 36665, "epoch": 441} {"train_loss": -19.04414176940918, "global_step": 36666, "epoch": 441} {"train_loss": -19.627439498901367, "global_step": 36667, "epoch": 441} {"train_loss": -19.332813262939453, "global_step": 36668, "epoch": 441} {"train_loss": -19.392715454101562, "global_step": 36669, "epoch": 441} {"train_loss": -19.204999923706055, "global_step": 36670, "epoch": 441} {"train_loss": -18.991544723510742, "global_step": 36671, "epoch": 441} {"train_loss": -19.633285522460938, "global_step": 36672, "epoch": 441} {"train_loss": -19.316593170166016, "global_step": 36673, "epoch": 441} {"train_loss": -19.390426635742188, "global_step": 36674, "epoch": 441} {"train_loss": -19.266931533813477, "global_step": 36675, "epoch": 441} {"train_loss": -19.281585693359375, "global_step": 36676, "epoch": 441} {"train_loss": -19.15743064880371, "global_step": 36677, "epoch": 441} {"train_loss": -19.281248092651367, "global_step": 36678, "epoch": 441} {"train_loss": -19.210329055786133, "global_step": 36679, "epoch": 441} {"train_loss": -19.435781478881836, "global_step": 36680, "epoch": 441} {"train_loss": -19.506406784057617, "global_step": 36681, "epoch": 441} {"train_loss": -19.610525131225586, "global_step": 36682, "epoch": 441} {"train_loss": -19.04829978942871, "global_step": 36683, "epoch": 441} {"train_loss": -19.416105270385742, "global_step": 36684, "epoch": 441} {"train_loss": -19.281189447425934, "global_step": 36685, "epoch": 441, "val_loss": 5959304.0} {"train_loss": -19.164377212524414, "global_step": 36686, "epoch": 442} {"train_loss": -19.23805046081543, "global_step": 36687, "epoch": 442} {"train_loss": -19.486326217651367, "global_step": 36688, "epoch": 442} {"train_loss": -19.16658592224121, "global_step": 36689, "epoch": 442} {"train_loss": -18.83965492248535, "global_step": 36690, "epoch": 442} {"train_loss": -19.098180770874023, "global_step": 36691, "epoch": 442} {"train_loss": -18.96881675720215, "global_step": 36692, "epoch": 442} {"train_loss": -18.787736892700195, "global_step": 36693, "epoch": 442} {"train_loss": -18.977401733398438, "global_step": 36694, "epoch": 442} {"train_loss": -19.17621421813965, "global_step": 36695, "epoch": 442} {"train_loss": -19.24038314819336, "global_step": 36696, "epoch": 442} {"train_loss": -19.536270141601562, "global_step": 36697, "epoch": 442} {"train_loss": -19.283681869506836, "global_step": 36698, "epoch": 442} {"train_loss": -19.38496971130371, "global_step": 36699, "epoch": 442} {"train_loss": -19.300003051757812, "global_step": 36700, "epoch": 442} {"train_loss": -19.322877883911133, "global_step": 36701, "epoch": 442} {"train_loss": -19.510833740234375, "global_step": 36702, "epoch": 442} {"train_loss": -19.525348663330078, "global_step": 36703, "epoch": 442} {"train_loss": -19.417057037353516, "global_step": 36704, "epoch": 442} {"train_loss": -18.869342803955078, "global_step": 36705, "epoch": 442} {"train_loss": -19.12202262878418, "global_step": 36706, "epoch": 442} {"train_loss": -18.917665481567383, "global_step": 36707, "epoch": 442} {"train_loss": -19.257211685180664, "global_step": 36708, "epoch": 442} {"train_loss": -19.26803207397461, "global_step": 36709, "epoch": 442} {"train_loss": -19.541301727294922, "global_step": 36710, "epoch": 442} {"train_loss": -19.26840591430664, "global_step": 36711, "epoch": 442} {"train_loss": -19.104755401611328, "global_step": 36712, "epoch": 442} {"train_loss": -19.103900909423828, "global_step": 36713, "epoch": 442} {"train_loss": -19.164508819580078, "global_step": 36714, "epoch": 442} {"train_loss": -19.38608169555664, "global_step": 36715, "epoch": 442} {"train_loss": -19.196325302124023, "global_step": 36716, "epoch": 442} {"train_loss": -19.36607551574707, "global_step": 36717, "epoch": 442} {"train_loss": -19.097097396850586, "global_step": 36718, "epoch": 442} {"train_loss": -19.31549644470215, "global_step": 36719, "epoch": 442} {"train_loss": -19.14974594116211, "global_step": 36720, "epoch": 442} {"train_loss": -19.318147659301758, "global_step": 36721, "epoch": 442} {"train_loss": -19.378015518188477, "global_step": 36722, "epoch": 442} {"train_loss": -18.87476348876953, "global_step": 36723, "epoch": 442} {"train_loss": -19.039146423339844, "global_step": 36724, "epoch": 442} {"train_loss": -19.38249397277832, "global_step": 36725, "epoch": 442} {"train_loss": -19.561796188354492, "global_step": 36726, "epoch": 442} {"train_loss": -19.206832885742188, "global_step": 36727, "epoch": 442} {"train_loss": -18.85633087158203, "global_step": 36728, "epoch": 442} {"train_loss": -19.19818687438965, "global_step": 36729, "epoch": 442} {"train_loss": -19.33525848388672, "global_step": 36730, "epoch": 442} {"train_loss": -19.303686141967773, "global_step": 36731, "epoch": 442} {"train_loss": -19.275739669799805, "global_step": 36732, "epoch": 442} {"train_loss": -19.199594497680664, "global_step": 36733, "epoch": 442} {"train_loss": -19.439666748046875, "global_step": 36734, "epoch": 442} {"train_loss": -18.647560119628906, "global_step": 36735, "epoch": 442} {"train_loss": -19.279245376586914, "global_step": 36736, "epoch": 442} {"train_loss": -19.35281753540039, "global_step": 36737, "epoch": 442} {"train_loss": -19.0314884185791, "global_step": 36738, "epoch": 442} {"train_loss": -19.29286003112793, "global_step": 36739, "epoch": 442} {"train_loss": -19.22743797302246, "global_step": 36740, "epoch": 442} {"train_loss": -19.522247314453125, "global_step": 36741, "epoch": 442} {"train_loss": -18.784921646118164, "global_step": 36742, "epoch": 442} {"train_loss": -19.19825553894043, "global_step": 36743, "epoch": 442} {"train_loss": -19.401765823364258, "global_step": 36744, "epoch": 442} {"train_loss": -19.122297286987305, "global_step": 36745, "epoch": 442} {"train_loss": -19.400897979736328, "global_step": 36746, "epoch": 442} {"train_loss": -19.380441665649414, "global_step": 36747, "epoch": 442} {"train_loss": -19.0889835357666, "global_step": 36748, "epoch": 442} {"train_loss": -19.10323715209961, "global_step": 36749, "epoch": 442} {"train_loss": -19.365934371948242, "global_step": 36750, "epoch": 442} {"train_loss": -18.782350540161133, "global_step": 36751, "epoch": 442} {"train_loss": -19.313871383666992, "global_step": 36752, "epoch": 442} {"train_loss": -19.218994140625, "global_step": 36753, "epoch": 442} {"train_loss": -19.791316986083984, "global_step": 36754, "epoch": 442} {"train_loss": -19.166828155517578, "global_step": 36755, "epoch": 442} {"train_loss": -19.345548629760742, "global_step": 36756, "epoch": 442} {"train_loss": -19.374011993408203, "global_step": 36757, "epoch": 442} {"train_loss": -19.254711151123047, "global_step": 36758, "epoch": 442} {"train_loss": -19.338504791259766, "global_step": 36759, "epoch": 442} {"train_loss": -19.323999404907227, "global_step": 36760, "epoch": 442} {"train_loss": -19.678979873657227, "global_step": 36761, "epoch": 442} {"train_loss": -18.96921730041504, "global_step": 36762, "epoch": 442} {"train_loss": -19.37946891784668, "global_step": 36763, "epoch": 442} {"train_loss": -19.514606475830078, "global_step": 36764, "epoch": 442} {"train_loss": -19.29837417602539, "global_step": 36765, "epoch": 442} {"train_loss": -19.265546798706055, "global_step": 36766, "epoch": 442} {"train_loss": -19.45759391784668, "global_step": 36767, "epoch": 442} {"train_loss": -19.258194659129682, "global_step": 36768, "epoch": 442, "val_loss": 5893938.5} {"train_loss": -18.805587768554688, "global_step": 36769, "epoch": 443} {"train_loss": -18.921676635742188, "global_step": 36770, "epoch": 443} {"train_loss": -19.6497802734375, "global_step": 36771, "epoch": 443} {"train_loss": -19.17958641052246, "global_step": 36772, "epoch": 443} {"train_loss": -19.575944900512695, "global_step": 36773, "epoch": 443} {"train_loss": -19.252294540405273, "global_step": 36774, "epoch": 443} {"train_loss": -19.051912307739258, "global_step": 36775, "epoch": 443} {"train_loss": -19.255521774291992, "global_step": 36776, "epoch": 443} {"train_loss": -19.24295997619629, "global_step": 36777, "epoch": 443} {"train_loss": -19.143646240234375, "global_step": 36778, "epoch": 443} {"train_loss": -19.692659378051758, "global_step": 36779, "epoch": 443} {"train_loss": -19.06257438659668, "global_step": 36780, "epoch": 443} {"train_loss": -19.270055770874023, "global_step": 36781, "epoch": 443} {"train_loss": -19.368913650512695, "global_step": 36782, "epoch": 443} {"train_loss": -18.9459285736084, "global_step": 36783, "epoch": 443} {"train_loss": -19.04534339904785, "global_step": 36784, "epoch": 443} {"train_loss": -19.384231567382812, "global_step": 36785, "epoch": 443} {"train_loss": -19.33115577697754, "global_step": 36786, "epoch": 443} {"train_loss": -19.18117332458496, "global_step": 36787, "epoch": 443} {"train_loss": -19.258241653442383, "global_step": 36788, "epoch": 443} {"train_loss": -19.762989044189453, "global_step": 36789, "epoch": 443} {"train_loss": -19.158742904663086, "global_step": 36790, "epoch": 443} {"train_loss": -19.47472381591797, "global_step": 36791, "epoch": 443} {"train_loss": -18.97134017944336, "global_step": 36792, "epoch": 443} {"train_loss": -19.15615463256836, "global_step": 36793, "epoch": 443} {"train_loss": -19.27495765686035, "global_step": 36794, "epoch": 443} {"train_loss": -18.89884376525879, "global_step": 36795, "epoch": 443} {"train_loss": -19.232723236083984, "global_step": 36796, "epoch": 443} {"train_loss": -19.282333374023438, "global_step": 36797, "epoch": 443} {"train_loss": -19.535675048828125, "global_step": 36798, "epoch": 443} {"train_loss": -19.358976364135742, "global_step": 36799, "epoch": 443} {"train_loss": -19.295433044433594, "global_step": 36800, "epoch": 443} {"train_loss": -19.517959594726562, "global_step": 36801, "epoch": 443} {"train_loss": -19.675079345703125, "global_step": 36802, "epoch": 443} {"train_loss": -19.571075439453125, "global_step": 36803, "epoch": 443} {"train_loss": -19.033170700073242, "global_step": 36804, "epoch": 443} {"train_loss": -19.125289916992188, "global_step": 36805, "epoch": 443} {"train_loss": -19.38759422302246, "global_step": 36806, "epoch": 443} {"train_loss": -18.939367294311523, "global_step": 36807, "epoch": 443} {"train_loss": -19.678974151611328, "global_step": 36808, "epoch": 443} {"train_loss": -19.682477951049805, "global_step": 36809, "epoch": 443} {"train_loss": -18.99239158630371, "global_step": 36810, "epoch": 443} {"train_loss": -19.452096939086914, "global_step": 36811, "epoch": 443} {"train_loss": -19.543411254882812, "global_step": 36812, "epoch": 443} {"train_loss": -19.30633544921875, "global_step": 36813, "epoch": 443} {"train_loss": -19.579395294189453, "global_step": 36814, "epoch": 443} {"train_loss": -19.374225616455078, "global_step": 36815, "epoch": 443} {"train_loss": -19.321630477905273, "global_step": 36816, "epoch": 443} {"train_loss": -19.642086029052734, "global_step": 36817, "epoch": 443} {"train_loss": -19.091073989868164, "global_step": 36818, "epoch": 443} {"train_loss": -19.32415771484375, "global_step": 36819, "epoch": 443} {"train_loss": -19.280384063720703, "global_step": 36820, "epoch": 443} {"train_loss": -19.067005157470703, "global_step": 36821, "epoch": 443} {"train_loss": -19.084421157836914, "global_step": 36822, "epoch": 443} {"train_loss": -19.255430221557617, "global_step": 36823, "epoch": 443} {"train_loss": -19.194135665893555, "global_step": 36824, "epoch": 443} {"train_loss": -19.306110382080078, "global_step": 36825, "epoch": 443} {"train_loss": -19.054935455322266, "global_step": 36826, "epoch": 443} {"train_loss": -19.339414596557617, "global_step": 36827, "epoch": 443} {"train_loss": -19.517148971557617, "global_step": 36828, "epoch": 443} {"train_loss": -19.160625457763672, "global_step": 36829, "epoch": 443} {"train_loss": -19.395771026611328, "global_step": 36830, "epoch": 443} {"train_loss": -19.62921714782715, "global_step": 36831, "epoch": 443} {"train_loss": -19.072351455688477, "global_step": 36832, "epoch": 443} {"train_loss": -19.12943458557129, "global_step": 36833, "epoch": 443} {"train_loss": -19.511686325073242, "global_step": 36834, "epoch": 443} {"train_loss": -18.6386775970459, "global_step": 36835, "epoch": 443} {"train_loss": -18.90750503540039, "global_step": 36836, "epoch": 443} {"train_loss": -19.05164909362793, "global_step": 36837, "epoch": 443} {"train_loss": -19.531307220458984, "global_step": 36838, "epoch": 443} {"train_loss": -19.271560668945312, "global_step": 36839, "epoch": 443} {"train_loss": -19.173952102661133, "global_step": 36840, "epoch": 443} {"train_loss": -19.500843048095703, "global_step": 36841, "epoch": 443} {"train_loss": -19.488393783569336, "global_step": 36842, "epoch": 443} {"train_loss": -19.45166015625, "global_step": 36843, "epoch": 443} {"train_loss": -19.078367233276367, "global_step": 36844, "epoch": 443} {"train_loss": -18.915699005126953, "global_step": 36845, "epoch": 443} {"train_loss": -19.21181869506836, "global_step": 36846, "epoch": 443} {"train_loss": -19.736896514892578, "global_step": 36847, "epoch": 443} {"train_loss": -19.290695190429688, "global_step": 36848, "epoch": 443} {"train_loss": -19.1503963470459, "global_step": 36849, "epoch": 443} {"train_loss": -19.511098861694336, "global_step": 36850, "epoch": 443} {"train_loss": -19.26101974119623, "global_step": 36851, "epoch": 443, "val_loss": 5993096.5} {"train_loss": -19.110198974609375, "global_step": 36852, "epoch": 444} {"train_loss": -18.86982536315918, "global_step": 36853, "epoch": 444} {"train_loss": -18.974273681640625, "global_step": 36854, "epoch": 444} {"train_loss": -18.8937931060791, "global_step": 36855, "epoch": 444} {"train_loss": -19.04310417175293, "global_step": 36856, "epoch": 444} {"train_loss": -19.526161193847656, "global_step": 36857, "epoch": 444} {"train_loss": -19.047168731689453, "global_step": 36858, "epoch": 444} {"train_loss": -19.463741302490234, "global_step": 36859, "epoch": 444} {"train_loss": -18.8271541595459, "global_step": 36860, "epoch": 444} {"train_loss": -19.39710807800293, "global_step": 36861, "epoch": 444} {"train_loss": -19.225616455078125, "global_step": 36862, "epoch": 444} {"train_loss": -19.248098373413086, "global_step": 36863, "epoch": 444} {"train_loss": -19.24024200439453, "global_step": 36864, "epoch": 444} {"train_loss": -19.16581153869629, "global_step": 36865, "epoch": 444} {"train_loss": -19.348800659179688, "global_step": 36866, "epoch": 444} {"train_loss": -19.4168643951416, "global_step": 36867, "epoch": 444} {"train_loss": -19.248647689819336, "global_step": 36868, "epoch": 444} {"train_loss": -19.228199005126953, "global_step": 36869, "epoch": 444} {"train_loss": -18.995946884155273, "global_step": 36870, "epoch": 444} {"train_loss": -19.272809982299805, "global_step": 36871, "epoch": 444} {"train_loss": -19.38761329650879, "global_step": 36872, "epoch": 444} {"train_loss": -19.384016036987305, "global_step": 36873, "epoch": 444} {"train_loss": -19.784446716308594, "global_step": 36874, "epoch": 444} {"train_loss": -19.66899299621582, "global_step": 36875, "epoch": 444} {"train_loss": -19.207799911499023, "global_step": 36876, "epoch": 444} {"train_loss": -19.05130958557129, "global_step": 36877, "epoch": 444} {"train_loss": -19.400760650634766, "global_step": 36878, "epoch": 444} {"train_loss": -19.22615623474121, "global_step": 36879, "epoch": 444} {"train_loss": -19.401212692260742, "global_step": 36880, "epoch": 444} {"train_loss": -19.45313835144043, "global_step": 36881, "epoch": 444} {"train_loss": -19.40278434753418, "global_step": 36882, "epoch": 444} {"train_loss": -19.269704818725586, "global_step": 36883, "epoch": 444} {"train_loss": -19.5179443359375, "global_step": 36884, "epoch": 444} {"train_loss": -19.455739974975586, "global_step": 36885, "epoch": 444} {"train_loss": -19.23870849609375, "global_step": 36886, "epoch": 444} {"train_loss": -19.308513641357422, "global_step": 36887, "epoch": 444} {"train_loss": -19.24690055847168, "global_step": 36888, "epoch": 444} {"train_loss": -19.22671127319336, "global_step": 36889, "epoch": 444} {"train_loss": -19.728174209594727, "global_step": 36890, "epoch": 444} {"train_loss": -19.23170280456543, "global_step": 36891, "epoch": 444} {"train_loss": -19.02141761779785, "global_step": 36892, "epoch": 444} {"train_loss": -19.388416290283203, "global_step": 36893, "epoch": 444} {"train_loss": -19.502342224121094, "global_step": 36894, "epoch": 444} {"train_loss": -19.658580780029297, "global_step": 36895, "epoch": 444} {"train_loss": -19.57163429260254, "global_step": 36896, "epoch": 444} {"train_loss": -19.107988357543945, "global_step": 36897, "epoch": 444} {"train_loss": -19.017383575439453, "global_step": 36898, "epoch": 444} {"train_loss": -19.301374435424805, "global_step": 36899, "epoch": 444} {"train_loss": -18.909486770629883, "global_step": 36900, "epoch": 444} {"train_loss": -19.26789665222168, "global_step": 36901, "epoch": 444} {"train_loss": -19.350122451782227, "global_step": 36902, "epoch": 444} {"train_loss": -19.324491500854492, "global_step": 36903, "epoch": 444} {"train_loss": -19.20989418029785, "global_step": 36904, "epoch": 444} {"train_loss": -19.476858139038086, "global_step": 36905, "epoch": 444} {"train_loss": -19.410295486450195, "global_step": 36906, "epoch": 444} {"train_loss": -19.468109130859375, "global_step": 36907, "epoch": 444} {"train_loss": -18.8759822845459, "global_step": 36908, "epoch": 444} {"train_loss": -19.704113006591797, "global_step": 36909, "epoch": 444} {"train_loss": -19.271535873413086, "global_step": 36910, "epoch": 444} {"train_loss": -19.340761184692383, "global_step": 36911, "epoch": 444} {"train_loss": -19.359806060791016, "global_step": 36912, "epoch": 444} {"train_loss": -19.194644927978516, "global_step": 36913, "epoch": 444} {"train_loss": -19.33454704284668, "global_step": 36914, "epoch": 444} {"train_loss": -19.181245803833008, "global_step": 36915, "epoch": 444} {"train_loss": -19.23974609375, "global_step": 36916, "epoch": 444} {"train_loss": -19.182676315307617, "global_step": 36917, "epoch": 444} {"train_loss": -19.56806755065918, "global_step": 36918, "epoch": 444} {"train_loss": -19.209909439086914, "global_step": 36919, "epoch": 444} {"train_loss": -19.258094787597656, "global_step": 36920, "epoch": 444} {"train_loss": -19.371021270751953, "global_step": 36921, "epoch": 444} {"train_loss": -19.347532272338867, "global_step": 36922, "epoch": 444} {"train_loss": -19.142210006713867, "global_step": 36923, "epoch": 444} {"train_loss": -19.419696807861328, "global_step": 36924, "epoch": 444} {"train_loss": -19.308156967163086, "global_step": 36925, "epoch": 444} {"train_loss": -19.443218231201172, "global_step": 36926, "epoch": 444} {"train_loss": -19.273649215698242, "global_step": 36927, "epoch": 444} {"train_loss": -19.511751174926758, "global_step": 36928, "epoch": 444} {"train_loss": -19.098119735717773, "global_step": 36929, "epoch": 444} {"train_loss": -19.390039443969727, "global_step": 36930, "epoch": 444} {"train_loss": -19.174686431884766, "global_step": 36931, "epoch": 444} {"train_loss": -19.04443359375, "global_step": 36932, "epoch": 444} {"train_loss": -19.204790115356445, "global_step": 36933, "epoch": 444} {"train_loss": -19.287323733410204, "global_step": 36934, "epoch": 444, "val_loss": 6018778.0} {"train_loss": -19.589462280273438, "global_step": 36935, "epoch": 445} {"train_loss": -19.182485580444336, "global_step": 36936, "epoch": 445} {"train_loss": -19.105093002319336, "global_step": 36937, "epoch": 445} {"train_loss": -19.096485137939453, "global_step": 36938, "epoch": 445} {"train_loss": -19.492202758789062, "global_step": 36939, "epoch": 445} {"train_loss": -19.372713088989258, "global_step": 36940, "epoch": 445} {"train_loss": -19.06879997253418, "global_step": 36941, "epoch": 445} {"train_loss": -19.373210906982422, "global_step": 36942, "epoch": 445} {"train_loss": -19.332462310791016, "global_step": 36943, "epoch": 445} {"train_loss": -19.271501541137695, "global_step": 36944, "epoch": 445} {"train_loss": -19.08165168762207, "global_step": 36945, "epoch": 445} {"train_loss": -18.920005798339844, "global_step": 36946, "epoch": 445} {"train_loss": -19.115966796875, "global_step": 36947, "epoch": 445} {"train_loss": -19.536781311035156, "global_step": 36948, "epoch": 445} {"train_loss": -19.278762817382812, "global_step": 36949, "epoch": 445} {"train_loss": -19.351486206054688, "global_step": 36950, "epoch": 445} {"train_loss": -19.506332397460938, "global_step": 36951, "epoch": 445} {"train_loss": -19.10198211669922, "global_step": 36952, "epoch": 445} {"train_loss": -19.369001388549805, "global_step": 36953, "epoch": 445} {"train_loss": -18.87717056274414, "global_step": 36954, "epoch": 445} {"train_loss": -19.65141487121582, "global_step": 36955, "epoch": 445} {"train_loss": -19.249866485595703, "global_step": 36956, "epoch": 445} {"train_loss": -19.292970657348633, "global_step": 36957, "epoch": 445} {"train_loss": -19.23810386657715, "global_step": 36958, "epoch": 445} {"train_loss": -19.123960494995117, "global_step": 36959, "epoch": 445} {"train_loss": -19.499282836914062, "global_step": 36960, "epoch": 445} {"train_loss": -19.279769897460938, "global_step": 36961, "epoch": 445} {"train_loss": -19.07355308532715, "global_step": 36962, "epoch": 445} {"train_loss": -18.945301055908203, "global_step": 36963, "epoch": 445} {"train_loss": -19.49141502380371, "global_step": 36964, "epoch": 445} {"train_loss": -19.833513259887695, "global_step": 36965, "epoch": 445} {"train_loss": -19.369550704956055, "global_step": 36966, "epoch": 445} {"train_loss": -19.40165901184082, "global_step": 36967, "epoch": 445} {"train_loss": -19.254499435424805, "global_step": 36968, "epoch": 445} {"train_loss": -19.202571868896484, "global_step": 36969, "epoch": 445} {"train_loss": -19.25238609313965, "global_step": 36970, "epoch": 445} {"train_loss": -19.303375244140625, "global_step": 36971, "epoch": 445} {"train_loss": -19.269147872924805, "global_step": 36972, "epoch": 445} {"train_loss": -19.167987823486328, "global_step": 36973, "epoch": 445} {"train_loss": -19.11195945739746, "global_step": 36974, "epoch": 445} {"train_loss": -19.261560440063477, "global_step": 36975, "epoch": 445} {"train_loss": -19.238893508911133, "global_step": 36976, "epoch": 445} {"train_loss": -19.128812789916992, "global_step": 36977, "epoch": 445} {"train_loss": -19.23342514038086, "global_step": 36978, "epoch": 445} {"train_loss": -19.27039909362793, "global_step": 36979, "epoch": 445} {"train_loss": -19.40776252746582, "global_step": 36980, "epoch": 445} {"train_loss": -19.52754783630371, "global_step": 36981, "epoch": 445} {"train_loss": -18.958749771118164, "global_step": 36982, "epoch": 445} {"train_loss": -19.24839973449707, "global_step": 36983, "epoch": 445} {"train_loss": -18.938413619995117, "global_step": 36984, "epoch": 445} {"train_loss": -19.688400268554688, "global_step": 36985, "epoch": 445} {"train_loss": -19.09374237060547, "global_step": 36986, "epoch": 445} {"train_loss": -19.216745376586914, "global_step": 36987, "epoch": 445} {"train_loss": -19.48062515258789, "global_step": 36988, "epoch": 445} {"train_loss": -19.596139907836914, "global_step": 36989, "epoch": 445} {"train_loss": -19.17707633972168, "global_step": 36990, "epoch": 445} {"train_loss": -19.587677001953125, "global_step": 36991, "epoch": 445} {"train_loss": -19.337543487548828, "global_step": 36992, "epoch": 445} {"train_loss": -19.213354110717773, "global_step": 36993, "epoch": 445} {"train_loss": -19.090900421142578, "global_step": 36994, "epoch": 445} {"train_loss": -19.218719482421875, "global_step": 36995, "epoch": 445} {"train_loss": -19.027198791503906, "global_step": 36996, "epoch": 445} {"train_loss": -19.239900588989258, "global_step": 36997, "epoch": 445} {"train_loss": -19.39926528930664, "global_step": 36998, "epoch": 445} {"train_loss": -19.508275985717773, "global_step": 36999, "epoch": 445} {"train_loss": -19.52534294128418, "global_step": 37000, "epoch": 445} {"train_loss": -19.41652488708496, "global_step": 37001, "epoch": 445} {"train_loss": -19.4862003326416, "global_step": 37002, "epoch": 445} {"train_loss": -19.510608673095703, "global_step": 37003, "epoch": 445} {"train_loss": -19.6649227142334, "global_step": 37004, "epoch": 445} {"train_loss": -19.0625057220459, "global_step": 37005, "epoch": 445} {"train_loss": -19.168012619018555, "global_step": 37006, "epoch": 445} {"train_loss": -19.55863380432129, "global_step": 37007, "epoch": 445} {"train_loss": -19.49534797668457, "global_step": 37008, "epoch": 445} {"train_loss": -18.972806930541992, "global_step": 37009, "epoch": 445} {"train_loss": -19.490873336791992, "global_step": 37010, "epoch": 445} {"train_loss": -19.379310607910156, "global_step": 37011, "epoch": 445} {"train_loss": -19.468215942382812, "global_step": 37012, "epoch": 445} {"train_loss": -18.490896224975586, "global_step": 37013, "epoch": 445} {"train_loss": -19.342161178588867, "global_step": 37014, "epoch": 445} {"train_loss": -19.51203727722168, "global_step": 37015, "epoch": 445} {"train_loss": -19.2983341217041, "global_step": 37016, "epoch": 445} {"train_loss": -19.291811632822796, "global_step": 37017, "epoch": 445, "val_loss": 6112346.5} {"train_loss": -19.534460067749023, "global_step": 37018, "epoch": 446} {"train_loss": -19.520038604736328, "global_step": 37019, "epoch": 446} {"train_loss": -18.879493713378906, "global_step": 37020, "epoch": 446} {"train_loss": -18.849220275878906, "global_step": 37021, "epoch": 446} {"train_loss": -19.50990867614746, "global_step": 37022, "epoch": 446} {"train_loss": -18.97028160095215, "global_step": 37023, "epoch": 446} {"train_loss": -19.32637596130371, "global_step": 37024, "epoch": 446} {"train_loss": -19.50960350036621, "global_step": 37025, "epoch": 446} {"train_loss": -19.402835845947266, "global_step": 37026, "epoch": 446} {"train_loss": -19.286680221557617, "global_step": 37027, "epoch": 446} {"train_loss": -19.560789108276367, "global_step": 37028, "epoch": 446} {"train_loss": -19.407424926757812, "global_step": 37029, "epoch": 446} {"train_loss": -19.07326316833496, "global_step": 37030, "epoch": 446} {"train_loss": -19.703041076660156, "global_step": 37031, "epoch": 446} {"train_loss": -19.39967918395996, "global_step": 37032, "epoch": 446} {"train_loss": -18.961383819580078, "global_step": 37033, "epoch": 446} {"train_loss": -19.298856735229492, "global_step": 37034, "epoch": 446} {"train_loss": -19.26968002319336, "global_step": 37035, "epoch": 446} {"train_loss": -19.52219581604004, "global_step": 37036, "epoch": 446} {"train_loss": -19.343612670898438, "global_step": 37037, "epoch": 446} {"train_loss": -19.08001136779785, "global_step": 37038, "epoch": 446} {"train_loss": -19.0709285736084, "global_step": 37039, "epoch": 446} {"train_loss": -19.0446834564209, "global_step": 37040, "epoch": 446} {"train_loss": -19.147428512573242, "global_step": 37041, "epoch": 446} {"train_loss": -19.174436569213867, "global_step": 37042, "epoch": 446} {"train_loss": -19.290164947509766, "global_step": 37043, "epoch": 446} {"train_loss": -19.040433883666992, "global_step": 37044, "epoch": 446} {"train_loss": -19.253637313842773, "global_step": 37045, "epoch": 446} {"train_loss": -19.772159576416016, "global_step": 37046, "epoch": 446} {"train_loss": -19.348773956298828, "global_step": 37047, "epoch": 446} {"train_loss": -19.10223960876465, "global_step": 37048, "epoch": 446} {"train_loss": -19.020822525024414, "global_step": 37049, "epoch": 446} {"train_loss": -19.515525817871094, "global_step": 37050, "epoch": 446} {"train_loss": -19.297870635986328, "global_step": 37051, "epoch": 446} {"train_loss": -19.043848037719727, "global_step": 37052, "epoch": 446} {"train_loss": -19.435653686523438, "global_step": 37053, "epoch": 446} {"train_loss": -19.426054000854492, "global_step": 37054, "epoch": 446} {"train_loss": -18.998291015625, "global_step": 37055, "epoch": 446} {"train_loss": -19.118961334228516, "global_step": 37056, "epoch": 446} {"train_loss": -18.821334838867188, "global_step": 37057, "epoch": 446} {"train_loss": -19.54717445373535, "global_step": 37058, "epoch": 446} {"train_loss": -19.23533058166504, "global_step": 37059, "epoch": 446} {"train_loss": -19.65309715270996, "global_step": 37060, "epoch": 446} {"train_loss": -19.5281982421875, "global_step": 37061, "epoch": 446} {"train_loss": -19.216726303100586, "global_step": 37062, "epoch": 446} {"train_loss": -19.384567260742188, "global_step": 37063, "epoch": 446} {"train_loss": -19.176435470581055, "global_step": 37064, "epoch": 446} {"train_loss": -19.73324203491211, "global_step": 37065, "epoch": 446} {"train_loss": -19.135358810424805, "global_step": 37066, "epoch": 446} {"train_loss": -19.519941329956055, "global_step": 37067, "epoch": 446} {"train_loss": -19.088762283325195, "global_step": 37068, "epoch": 446} {"train_loss": -19.568620681762695, "global_step": 37069, "epoch": 446} {"train_loss": -19.417478561401367, "global_step": 37070, "epoch": 446} {"train_loss": -19.26955223083496, "global_step": 37071, "epoch": 446} {"train_loss": -19.414108276367188, "global_step": 37072, "epoch": 446} {"train_loss": -19.29486083984375, "global_step": 37073, "epoch": 446} {"train_loss": -19.603849411010742, "global_step": 37074, "epoch": 446} {"train_loss": -19.03754997253418, "global_step": 37075, "epoch": 446} {"train_loss": -19.058988571166992, "global_step": 37076, "epoch": 446} {"train_loss": -19.188507080078125, "global_step": 37077, "epoch": 446} {"train_loss": -19.245376586914062, "global_step": 37078, "epoch": 446} {"train_loss": -19.117746353149414, "global_step": 37079, "epoch": 446} {"train_loss": -19.517711639404297, "global_step": 37080, "epoch": 446} {"train_loss": -19.242660522460938, "global_step": 37081, "epoch": 446} {"train_loss": -19.553430557250977, "global_step": 37082, "epoch": 446} {"train_loss": -19.28424072265625, "global_step": 37083, "epoch": 446} {"train_loss": -19.764389038085938, "global_step": 37084, "epoch": 446} {"train_loss": -19.38681411743164, "global_step": 37085, "epoch": 446} {"train_loss": -19.465620040893555, "global_step": 37086, "epoch": 446} {"train_loss": -19.08356285095215, "global_step": 37087, "epoch": 446} {"train_loss": -19.497861862182617, "global_step": 37088, "epoch": 446} {"train_loss": -19.417112350463867, "global_step": 37089, "epoch": 446} {"train_loss": -19.033239364624023, "global_step": 37090, "epoch": 446} {"train_loss": -19.408166885375977, "global_step": 37091, "epoch": 446} {"train_loss": -19.081003189086914, "global_step": 37092, "epoch": 446} {"train_loss": -19.21849822998047, "global_step": 37093, "epoch": 446} {"train_loss": -18.958974838256836, "global_step": 37094, "epoch": 446} {"train_loss": -19.296518325805664, "global_step": 37095, "epoch": 446} {"train_loss": -19.187734603881836, "global_step": 37096, "epoch": 446} {"train_loss": -19.3030948638916, "global_step": 37097, "epoch": 446} {"train_loss": -19.053062438964844, "global_step": 37098, "epoch": 446} {"train_loss": -19.423782348632812, "global_step": 37099, "epoch": 446} {"train_loss": -19.29555605693036, "global_step": 37100, "epoch": 446, "val_loss": 6041135.5} {"train_loss": -19.1002140045166, "global_step": 37101, "epoch": 447} {"train_loss": -19.531646728515625, "global_step": 37102, "epoch": 447} {"train_loss": -19.114696502685547, "global_step": 37103, "epoch": 447} {"train_loss": -18.923885345458984, "global_step": 37104, "epoch": 447} {"train_loss": -19.096817016601562, "global_step": 37105, "epoch": 447} {"train_loss": -18.990938186645508, "global_step": 37106, "epoch": 447} {"train_loss": -18.964475631713867, "global_step": 37107, "epoch": 447} {"train_loss": -18.849048614501953, "global_step": 37108, "epoch": 447} {"train_loss": -19.14594841003418, "global_step": 37109, "epoch": 447} {"train_loss": -18.952199935913086, "global_step": 37110, "epoch": 447} {"train_loss": -19.06072425842285, "global_step": 37111, "epoch": 447} {"train_loss": -18.86009407043457, "global_step": 37112, "epoch": 447} {"train_loss": -19.56595802307129, "global_step": 37113, "epoch": 447} {"train_loss": -18.903091430664062, "global_step": 37114, "epoch": 447} {"train_loss": -19.086170196533203, "global_step": 37115, "epoch": 447} {"train_loss": -19.210004806518555, "global_step": 37116, "epoch": 447} {"train_loss": -19.512630462646484, "global_step": 37117, "epoch": 447} {"train_loss": -19.611677169799805, "global_step": 37118, "epoch": 447} {"train_loss": -19.422285079956055, "global_step": 37119, "epoch": 447} {"train_loss": -19.54390525817871, "global_step": 37120, "epoch": 447} {"train_loss": -19.14839744567871, "global_step": 37121, "epoch": 447} {"train_loss": -19.37821388244629, "global_step": 37122, "epoch": 447} {"train_loss": -19.395551681518555, "global_step": 37123, "epoch": 447} {"train_loss": -19.23116111755371, "global_step": 37124, "epoch": 447} {"train_loss": -19.3106689453125, "global_step": 37125, "epoch": 447} {"train_loss": -19.21742057800293, "global_step": 37126, "epoch": 447} {"train_loss": -19.556625366210938, "global_step": 37127, "epoch": 447} {"train_loss": -19.31805992126465, "global_step": 37128, "epoch": 447} {"train_loss": -19.384824752807617, "global_step": 37129, "epoch": 447} {"train_loss": -18.847400665283203, "global_step": 37130, "epoch": 447} {"train_loss": -19.348600387573242, "global_step": 37131, "epoch": 447} {"train_loss": -19.4633731842041, "global_step": 37132, "epoch": 447} {"train_loss": -19.46296501159668, "global_step": 37133, "epoch": 447} {"train_loss": -19.30315589904785, "global_step": 37134, "epoch": 447} {"train_loss": -19.43889045715332, "global_step": 37135, "epoch": 447} {"train_loss": -19.13594627380371, "global_step": 37136, "epoch": 447} {"train_loss": -19.393630981445312, "global_step": 37137, "epoch": 447} {"train_loss": -19.260087966918945, "global_step": 37138, "epoch": 447} {"train_loss": -19.17300796508789, "global_step": 37139, "epoch": 447} {"train_loss": -19.3238582611084, "global_step": 37140, "epoch": 447} {"train_loss": -18.94426155090332, "global_step": 37141, "epoch": 447} {"train_loss": -19.105649948120117, "global_step": 37142, "epoch": 447} {"train_loss": -19.452255249023438, "global_step": 37143, "epoch": 447} {"train_loss": -19.43364906311035, "global_step": 37144, "epoch": 447} {"train_loss": -19.378171920776367, "global_step": 37145, "epoch": 447} {"train_loss": -19.28328514099121, "global_step": 37146, "epoch": 447} {"train_loss": -19.417438507080078, "global_step": 37147, "epoch": 447} {"train_loss": -19.43528938293457, "global_step": 37148, "epoch": 447} {"train_loss": -19.56443214416504, "global_step": 37149, "epoch": 447} {"train_loss": -19.57576560974121, "global_step": 37150, "epoch": 447} {"train_loss": -19.1846981048584, "global_step": 37151, "epoch": 447} {"train_loss": -19.554996490478516, "global_step": 37152, "epoch": 447} {"train_loss": -19.40699577331543, "global_step": 37153, "epoch": 447} {"train_loss": -19.30660057067871, "global_step": 37154, "epoch": 447} {"train_loss": -19.660831451416016, "global_step": 37155, "epoch": 447} {"train_loss": -19.477128982543945, "global_step": 37156, "epoch": 447} {"train_loss": -19.270282745361328, "global_step": 37157, "epoch": 447} {"train_loss": -19.23583984375, "global_step": 37158, "epoch": 447} {"train_loss": -19.019691467285156, "global_step": 37159, "epoch": 447} {"train_loss": -19.25319480895996, "global_step": 37160, "epoch": 447} {"train_loss": -19.338685989379883, "global_step": 37161, "epoch": 447} {"train_loss": -19.19417381286621, "global_step": 37162, "epoch": 447} {"train_loss": -19.1917781829834, "global_step": 37163, "epoch": 447} {"train_loss": -19.07346534729004, "global_step": 37164, "epoch": 447} {"train_loss": -19.395797729492188, "global_step": 37165, "epoch": 447} {"train_loss": -19.198524475097656, "global_step": 37166, "epoch": 447} {"train_loss": -19.350393295288086, "global_step": 37167, "epoch": 447} {"train_loss": -19.4504451751709, "global_step": 37168, "epoch": 447} {"train_loss": -19.48187828063965, "global_step": 37169, "epoch": 447} {"train_loss": -19.2398738861084, "global_step": 37170, "epoch": 447} {"train_loss": -19.40642738342285, "global_step": 37171, "epoch": 447} {"train_loss": -19.379148483276367, "global_step": 37172, "epoch": 447} {"train_loss": -19.325475692749023, "global_step": 37173, "epoch": 447} {"train_loss": -19.330610275268555, "global_step": 37174, "epoch": 447} {"train_loss": -19.232486724853516, "global_step": 37175, "epoch": 447} {"train_loss": -19.416913986206055, "global_step": 37176, "epoch": 447} {"train_loss": -19.42729377746582, "global_step": 37177, "epoch": 447} {"train_loss": -19.23386001586914, "global_step": 37178, "epoch": 447} {"train_loss": -19.48134994506836, "global_step": 37179, "epoch": 447} {"train_loss": -19.213552474975586, "global_step": 37180, "epoch": 447} {"train_loss": -19.231204986572266, "global_step": 37181, "epoch": 447} {"train_loss": -19.33283233642578, "global_step": 37182, "epoch": 447} {"train_loss": -19.283096658178124, "global_step": 37183, "epoch": 447, "val_loss": 5937751.0} {"train_loss": -19.02815818786621, "global_step": 37184, "epoch": 448} {"train_loss": -19.12180519104004, "global_step": 37185, "epoch": 448} {"train_loss": -19.001218795776367, "global_step": 37186, "epoch": 448} {"train_loss": -18.825788497924805, "global_step": 37187, "epoch": 448} {"train_loss": -19.126708984375, "global_step": 37188, "epoch": 448} {"train_loss": -19.516550064086914, "global_step": 37189, "epoch": 448} {"train_loss": -19.276330947875977, "global_step": 37190, "epoch": 448} {"train_loss": -19.26325225830078, "global_step": 37191, "epoch": 448} {"train_loss": -19.168643951416016, "global_step": 37192, "epoch": 448} {"train_loss": -19.393766403198242, "global_step": 37193, "epoch": 448} {"train_loss": -19.485410690307617, "global_step": 37194, "epoch": 448} {"train_loss": -19.410369873046875, "global_step": 37195, "epoch": 448} {"train_loss": -19.0885066986084, "global_step": 37196, "epoch": 448} {"train_loss": -19.29163932800293, "global_step": 37197, "epoch": 448} {"train_loss": -19.194089889526367, "global_step": 37198, "epoch": 448} {"train_loss": -19.474714279174805, "global_step": 37199, "epoch": 448} {"train_loss": -18.95452880859375, "global_step": 37200, "epoch": 448} {"train_loss": -19.104188919067383, "global_step": 37201, "epoch": 448} {"train_loss": -19.477079391479492, "global_step": 37202, "epoch": 448} {"train_loss": -19.506635665893555, "global_step": 37203, "epoch": 448} {"train_loss": -19.75675392150879, "global_step": 37204, "epoch": 448} {"train_loss": -19.307090759277344, "global_step": 37205, "epoch": 448} {"train_loss": -19.383705139160156, "global_step": 37206, "epoch": 448} {"train_loss": -19.470121383666992, "global_step": 37207, "epoch": 448} {"train_loss": -19.259159088134766, "global_step": 37208, "epoch": 448} {"train_loss": -19.471302032470703, "global_step": 37209, "epoch": 448} {"train_loss": -19.09006118774414, "global_step": 37210, "epoch": 448} {"train_loss": -19.3033447265625, "global_step": 37211, "epoch": 448} {"train_loss": -19.41156578063965, "global_step": 37212, "epoch": 448} {"train_loss": -19.32550621032715, "global_step": 37213, "epoch": 448} {"train_loss": -19.225461959838867, "global_step": 37214, "epoch": 448} {"train_loss": -19.211393356323242, "global_step": 37215, "epoch": 448} {"train_loss": -19.390653610229492, "global_step": 37216, "epoch": 448} {"train_loss": -19.58513641357422, "global_step": 37217, "epoch": 448} {"train_loss": -19.05057144165039, "global_step": 37218, "epoch": 448} {"train_loss": -19.289365768432617, "global_step": 37219, "epoch": 448} {"train_loss": -19.578115463256836, "global_step": 37220, "epoch": 448} {"train_loss": -19.309057235717773, "global_step": 37221, "epoch": 448} {"train_loss": -19.422138214111328, "global_step": 37222, "epoch": 448} {"train_loss": -19.485591888427734, "global_step": 37223, "epoch": 448} {"train_loss": -19.26352882385254, "global_step": 37224, "epoch": 448} {"train_loss": -19.071836471557617, "global_step": 37225, "epoch": 448} {"train_loss": -19.524869918823242, "global_step": 37226, "epoch": 448} {"train_loss": -19.239540100097656, "global_step": 37227, "epoch": 448} {"train_loss": -19.195926666259766, "global_step": 37228, "epoch": 448} {"train_loss": -19.4532527923584, "global_step": 37229, "epoch": 448} {"train_loss": -19.29053497314453, "global_step": 37230, "epoch": 448} {"train_loss": -19.194181442260742, "global_step": 37231, "epoch": 448} {"train_loss": -19.406490325927734, "global_step": 37232, "epoch": 448} {"train_loss": -19.42124366760254, "global_step": 37233, "epoch": 448} {"train_loss": -19.612934112548828, "global_step": 37234, "epoch": 448} {"train_loss": -19.040985107421875, "global_step": 37235, "epoch": 448} {"train_loss": -19.186634063720703, "global_step": 37236, "epoch": 448} {"train_loss": -19.5734920501709, "global_step": 37237, "epoch": 448} {"train_loss": -19.51955795288086, "global_step": 37238, "epoch": 448} {"train_loss": -19.319839477539062, "global_step": 37239, "epoch": 448} {"train_loss": -19.228788375854492, "global_step": 37240, "epoch": 448} {"train_loss": -19.398414611816406, "global_step": 37241, "epoch": 448} {"train_loss": -19.364511489868164, "global_step": 37242, "epoch": 448} {"train_loss": -19.514501571655273, "global_step": 37243, "epoch": 448} {"train_loss": -18.962421417236328, "global_step": 37244, "epoch": 448} {"train_loss": -19.441991806030273, "global_step": 37245, "epoch": 448} {"train_loss": -19.55936050415039, "global_step": 37246, "epoch": 448} {"train_loss": -19.210412979125977, "global_step": 37247, "epoch": 448} {"train_loss": -19.252958297729492, "global_step": 37248, "epoch": 448} {"train_loss": -19.071975708007812, "global_step": 37249, "epoch": 448} {"train_loss": -19.512304306030273, "global_step": 37250, "epoch": 448} {"train_loss": -19.586904525756836, "global_step": 37251, "epoch": 448} {"train_loss": -19.334714889526367, "global_step": 37252, "epoch": 448} {"train_loss": -18.890657424926758, "global_step": 37253, "epoch": 448} {"train_loss": -19.358476638793945, "global_step": 37254, "epoch": 448} {"train_loss": -19.39896011352539, "global_step": 37255, "epoch": 448} {"train_loss": -19.178573608398438, "global_step": 37256, "epoch": 448} {"train_loss": -19.45052146911621, "global_step": 37257, "epoch": 448} {"train_loss": -19.10146141052246, "global_step": 37258, "epoch": 448} {"train_loss": -19.60091209411621, "global_step": 37259, "epoch": 448} {"train_loss": -19.652267456054688, "global_step": 37260, "epoch": 448} {"train_loss": -19.304336547851562, "global_step": 37261, "epoch": 448} {"train_loss": -19.05459976196289, "global_step": 37262, "epoch": 448} {"train_loss": -18.92070198059082, "global_step": 37263, "epoch": 448} {"train_loss": -19.36935806274414, "global_step": 37264, "epoch": 448} {"train_loss": -19.232511520385742, "global_step": 37265, "epoch": 448} {"train_loss": -19.288527063576574, "global_step": 37266, "epoch": 448, "val_loss": 5933569.0} {"train_loss": -18.948566436767578, "global_step": 37267, "epoch": 449} {"train_loss": -19.112987518310547, "global_step": 37268, "epoch": 449} {"train_loss": -19.275785446166992, "global_step": 37269, "epoch": 449} {"train_loss": -19.363548278808594, "global_step": 37270, "epoch": 449} {"train_loss": -19.23177146911621, "global_step": 37271, "epoch": 449} {"train_loss": -19.07208251953125, "global_step": 37272, "epoch": 449} {"train_loss": -19.129175186157227, "global_step": 37273, "epoch": 449} {"train_loss": -18.987539291381836, "global_step": 37274, "epoch": 449} {"train_loss": -19.719404220581055, "global_step": 37275, "epoch": 449} {"train_loss": -19.17889976501465, "global_step": 37276, "epoch": 449} {"train_loss": -19.413801193237305, "global_step": 37277, "epoch": 449} {"train_loss": -19.63935661315918, "global_step": 37278, "epoch": 449} {"train_loss": -19.173538208007812, "global_step": 37279, "epoch": 449} {"train_loss": -19.25349235534668, "global_step": 37280, "epoch": 449} {"train_loss": -19.57185935974121, "global_step": 37281, "epoch": 449} {"train_loss": -19.0922794342041, "global_step": 37282, "epoch": 449} {"train_loss": -19.382404327392578, "global_step": 37283, "epoch": 449} {"train_loss": -19.226835250854492, "global_step": 37284, "epoch": 449} {"train_loss": -19.08650779724121, "global_step": 37285, "epoch": 449} {"train_loss": -19.18391990661621, "global_step": 37286, "epoch": 449} {"train_loss": -19.172351837158203, "global_step": 37287, "epoch": 449} {"train_loss": -19.00702476501465, "global_step": 37288, "epoch": 449} {"train_loss": -19.355161666870117, "global_step": 37289, "epoch": 449} {"train_loss": -19.125959396362305, "global_step": 37290, "epoch": 449} {"train_loss": -19.063934326171875, "global_step": 37291, "epoch": 449} {"train_loss": -19.179250717163086, "global_step": 37292, "epoch": 449} {"train_loss": -19.1561336517334, "global_step": 37293, "epoch": 449} {"train_loss": -19.190122604370117, "global_step": 37294, "epoch": 449} {"train_loss": -19.247671127319336, "global_step": 37295, "epoch": 449} {"train_loss": -18.890216827392578, "global_step": 37296, "epoch": 449} {"train_loss": -18.840341567993164, "global_step": 37297, "epoch": 449} {"train_loss": -19.250347137451172, "global_step": 37298, "epoch": 449} {"train_loss": -19.594274520874023, "global_step": 37299, "epoch": 449} {"train_loss": -19.281631469726562, "global_step": 37300, "epoch": 449} {"train_loss": -19.27097511291504, "global_step": 37301, "epoch": 449} {"train_loss": -19.16495132446289, "global_step": 37302, "epoch": 449} {"train_loss": -19.36903190612793, "global_step": 37303, "epoch": 449} {"train_loss": -19.48520278930664, "global_step": 37304, "epoch": 449} {"train_loss": -19.067893981933594, "global_step": 37305, "epoch": 449} {"train_loss": -19.4158935546875, "global_step": 37306, "epoch": 449} {"train_loss": -19.663822174072266, "global_step": 37307, "epoch": 449} {"train_loss": -19.435901641845703, "global_step": 37308, "epoch": 449} {"train_loss": -19.254926681518555, "global_step": 37309, "epoch": 449} {"train_loss": -19.1114559173584, "global_step": 37310, "epoch": 449} {"train_loss": -19.4694881439209, "global_step": 37311, "epoch": 449} {"train_loss": -19.2478084564209, "global_step": 37312, "epoch": 449} {"train_loss": -19.21118927001953, "global_step": 37313, "epoch": 449} {"train_loss": -19.419891357421875, "global_step": 37314, "epoch": 449} {"train_loss": -19.822757720947266, "global_step": 37315, "epoch": 449} {"train_loss": -19.33144187927246, "global_step": 37316, "epoch": 449} {"train_loss": -19.207351684570312, "global_step": 37317, "epoch": 449} {"train_loss": -18.736526489257812, "global_step": 37318, "epoch": 449} {"train_loss": -19.215238571166992, "global_step": 37319, "epoch": 449} {"train_loss": -18.776382446289062, "global_step": 37320, "epoch": 449} {"train_loss": -19.441162109375, "global_step": 37321, "epoch": 449} {"train_loss": -19.40608787536621, "global_step": 37322, "epoch": 449} {"train_loss": -19.599288940429688, "global_step": 37323, "epoch": 449} {"train_loss": -19.843374252319336, "global_step": 37324, "epoch": 449} {"train_loss": -19.406402587890625, "global_step": 37325, "epoch": 449} {"train_loss": -19.236692428588867, "global_step": 37326, "epoch": 449} {"train_loss": -19.47110366821289, "global_step": 37327, "epoch": 449} {"train_loss": -19.09290885925293, "global_step": 37328, "epoch": 449} {"train_loss": -19.420490264892578, "global_step": 37329, "epoch": 449} {"train_loss": -19.651784896850586, "global_step": 37330, "epoch": 449} {"train_loss": -19.21651840209961, "global_step": 37331, "epoch": 449} {"train_loss": -19.456392288208008, "global_step": 37332, "epoch": 449} {"train_loss": -19.376911163330078, "global_step": 37333, "epoch": 449} {"train_loss": -19.590377807617188, "global_step": 37334, "epoch": 449} {"train_loss": -19.20001792907715, "global_step": 37335, "epoch": 449} {"train_loss": -19.12120246887207, "global_step": 37336, "epoch": 449} {"train_loss": -19.231433868408203, "global_step": 37337, "epoch": 449} {"train_loss": -19.332096099853516, "global_step": 37338, "epoch": 449} {"train_loss": -19.159231185913086, "global_step": 37339, "epoch": 449} {"train_loss": -19.601654052734375, "global_step": 37340, "epoch": 449} {"train_loss": -19.0953311920166, "global_step": 37341, "epoch": 449} {"train_loss": -19.508943557739258, "global_step": 37342, "epoch": 449} {"train_loss": -19.40675163269043, "global_step": 37343, "epoch": 449} {"train_loss": -19.330982208251953, "global_step": 37344, "epoch": 449} {"train_loss": -19.2552490234375, "global_step": 37345, "epoch": 449} {"train_loss": -18.724790573120117, "global_step": 37346, "epoch": 449} {"train_loss": -19.387399673461914, "global_step": 37347, "epoch": 449} {"train_loss": -19.265995025634766, "global_step": 37348, "epoch": 449} {"train_loss": -19.287095495017176, "global_step": 37349, "epoch": 449, "val_loss": 5917373.0} {"train_loss": -18.85972023010254, "global_step": 37350, "epoch": 450} {"train_loss": -19.156034469604492, "global_step": 37351, "epoch": 450} {"train_loss": -19.008930206298828, "global_step": 37352, "epoch": 450} {"train_loss": -19.07053565979004, "global_step": 37353, "epoch": 450} {"train_loss": -19.179508209228516, "global_step": 37354, "epoch": 450} {"train_loss": -18.67450523376465, "global_step": 37355, "epoch": 450} {"train_loss": -19.378116607666016, "global_step": 37356, "epoch": 450} {"train_loss": -19.091896057128906, "global_step": 37357, "epoch": 450} {"train_loss": -19.03101921081543, "global_step": 37358, "epoch": 450} {"train_loss": -19.057641983032227, "global_step": 37359, "epoch": 450} {"train_loss": -19.432296752929688, "global_step": 37360, "epoch": 450} {"train_loss": -19.240415573120117, "global_step": 37361, "epoch": 450} {"train_loss": -19.39981460571289, "global_step": 37362, "epoch": 450} {"train_loss": -19.259103775024414, "global_step": 37363, "epoch": 450} {"train_loss": -18.773900985717773, "global_step": 37364, "epoch": 450} {"train_loss": -19.00032615661621, "global_step": 37365, "epoch": 450} {"train_loss": -19.20114517211914, "global_step": 37366, "epoch": 450} {"train_loss": -19.20261573791504, "global_step": 37367, "epoch": 450} {"train_loss": -19.383085250854492, "global_step": 37368, "epoch": 450} {"train_loss": -19.39105796813965, "global_step": 37369, "epoch": 450} {"train_loss": -19.328197479248047, "global_step": 37370, "epoch": 450} {"train_loss": -19.270917892456055, "global_step": 37371, "epoch": 450} {"train_loss": -19.265634536743164, "global_step": 37372, "epoch": 450} {"train_loss": -19.14832878112793, "global_step": 37373, "epoch": 450} {"train_loss": -19.262365341186523, "global_step": 37374, "epoch": 450} {"train_loss": -19.35138511657715, "global_step": 37375, "epoch": 450} {"train_loss": -18.8866024017334, "global_step": 37376, "epoch": 450} {"train_loss": -19.353483200073242, "global_step": 37377, "epoch": 450} {"train_loss": -19.154666900634766, "global_step": 37378, "epoch": 450} {"train_loss": -19.441892623901367, "global_step": 37379, "epoch": 450} {"train_loss": -19.368379592895508, "global_step": 37380, "epoch": 450} {"train_loss": -19.397937774658203, "global_step": 37381, "epoch": 450} {"train_loss": -19.073373794555664, "global_step": 37382, "epoch": 450} {"train_loss": -19.51432228088379, "global_step": 37383, "epoch": 450} {"train_loss": -19.666425704956055, "global_step": 37384, "epoch": 450} {"train_loss": -19.38374137878418, "global_step": 37385, "epoch": 450} {"train_loss": -18.983097076416016, "global_step": 37386, "epoch": 450} {"train_loss": -19.702314376831055, "global_step": 37387, "epoch": 450} {"train_loss": -19.243175506591797, "global_step": 37388, "epoch": 450} {"train_loss": -19.347097396850586, "global_step": 37389, "epoch": 450} {"train_loss": -18.918407440185547, "global_step": 37390, "epoch": 450} {"train_loss": -19.60463523864746, "global_step": 37391, "epoch": 450} {"train_loss": -19.34928321838379, "global_step": 37392, "epoch": 450} {"train_loss": -19.39423179626465, "global_step": 37393, "epoch": 450} {"train_loss": -19.53436851501465, "global_step": 37394, "epoch": 450} {"train_loss": -19.308103561401367, "global_step": 37395, "epoch": 450} {"train_loss": -19.178739547729492, "global_step": 37396, "epoch": 450} {"train_loss": -19.609113693237305, "global_step": 37397, "epoch": 450} {"train_loss": -19.503021240234375, "global_step": 37398, "epoch": 450} {"train_loss": -19.62424087524414, "global_step": 37399, "epoch": 450} {"train_loss": -19.14737319946289, "global_step": 37400, "epoch": 450} {"train_loss": -19.398639678955078, "global_step": 37401, "epoch": 450} {"train_loss": -19.522741317749023, "global_step": 37402, "epoch": 450} {"train_loss": -19.492603302001953, "global_step": 37403, "epoch": 450} {"train_loss": -19.596609115600586, "global_step": 37404, "epoch": 450} {"train_loss": -19.159521102905273, "global_step": 37405, "epoch": 450} {"train_loss": -19.262088775634766, "global_step": 37406, "epoch": 450} {"train_loss": -18.873838424682617, "global_step": 37407, "epoch": 450} {"train_loss": -19.333984375, "global_step": 37408, "epoch": 450} {"train_loss": -19.13104820251465, "global_step": 37409, "epoch": 450} {"train_loss": -19.25410270690918, "global_step": 37410, "epoch": 450} {"train_loss": -19.282426834106445, "global_step": 37411, "epoch": 450} {"train_loss": -19.304218292236328, "global_step": 37412, "epoch": 450} {"train_loss": -19.497344970703125, "global_step": 37413, "epoch": 450} {"train_loss": -19.26676368713379, "global_step": 37414, "epoch": 450} {"train_loss": -19.154050827026367, "global_step": 37415, "epoch": 450} {"train_loss": -19.10276222229004, "global_step": 37416, "epoch": 450} {"train_loss": -19.521652221679688, "global_step": 37417, "epoch": 450} {"train_loss": -19.362356185913086, "global_step": 37418, "epoch": 450} {"train_loss": -19.001270294189453, "global_step": 37419, "epoch": 450} {"train_loss": -19.27533531188965, "global_step": 37420, "epoch": 450} {"train_loss": -19.455345153808594, "global_step": 37421, "epoch": 450} {"train_loss": -19.537569046020508, "global_step": 37422, "epoch": 450} {"train_loss": -19.578256607055664, "global_step": 37423, "epoch": 450} {"train_loss": -19.269723892211914, "global_step": 37424, "epoch": 450} {"train_loss": -18.92218589782715, "global_step": 37425, "epoch": 450} {"train_loss": -19.600095748901367, "global_step": 37426, "epoch": 450} {"train_loss": -19.345489501953125, "global_step": 37427, "epoch": 450} {"train_loss": -19.352436065673828, "global_step": 37428, "epoch": 450} {"train_loss": -19.17701530456543, "global_step": 37429, "epoch": 450} {"train_loss": -19.260360717773438, "global_step": 37430, "epoch": 450} {"train_loss": -19.057117462158203, "global_step": 37431, "epoch": 450} {"train_loss": -19.262804399053735, "global_step": 37432, "epoch": 450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 0.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.7272727272727273, "val_loss": 6181297.0} {"train_loss": -19.410566329956055, "global_step": 37433, "epoch": 451} {"train_loss": -19.35816192626953, "global_step": 37434, "epoch": 451} {"train_loss": -19.201520919799805, "global_step": 37435, "epoch": 451} {"train_loss": -19.2802734375, "global_step": 37436, "epoch": 451} {"train_loss": -19.267169952392578, "global_step": 37437, "epoch": 451} {"train_loss": -19.17659568786621, "global_step": 37438, "epoch": 451} {"train_loss": -19.03618049621582, "global_step": 37439, "epoch": 451} {"train_loss": -19.039392471313477, "global_step": 37440, "epoch": 451} {"train_loss": -19.398475646972656, "global_step": 37441, "epoch": 451} {"train_loss": -19.41242027282715, "global_step": 37442, "epoch": 451} {"train_loss": -19.2241153717041, "global_step": 37443, "epoch": 451} {"train_loss": -19.2182674407959, "global_step": 37444, "epoch": 451} {"train_loss": -19.475378036499023, "global_step": 37445, "epoch": 451} {"train_loss": -19.043668746948242, "global_step": 37446, "epoch": 451} {"train_loss": -19.381366729736328, "global_step": 37447, "epoch": 451} {"train_loss": -19.32547378540039, "global_step": 37448, "epoch": 451} {"train_loss": -19.367855072021484, "global_step": 37449, "epoch": 451} {"train_loss": -19.57292938232422, "global_step": 37450, "epoch": 451} {"train_loss": -19.405765533447266, "global_step": 37451, "epoch": 451} {"train_loss": -18.916364669799805, "global_step": 37452, "epoch": 451} {"train_loss": -18.950193405151367, "global_step": 37453, "epoch": 451} {"train_loss": -19.897634506225586, "global_step": 37454, "epoch": 451} {"train_loss": -19.00539207458496, "global_step": 37455, "epoch": 451} {"train_loss": -19.414505004882812, "global_step": 37456, "epoch": 451} {"train_loss": -19.348840713500977, "global_step": 37457, "epoch": 451} {"train_loss": -19.626541137695312, "global_step": 37458, "epoch": 451} {"train_loss": -19.03880500793457, "global_step": 37459, "epoch": 451} {"train_loss": -19.382463455200195, "global_step": 37460, "epoch": 451} {"train_loss": -19.5446720123291, "global_step": 37461, "epoch": 451} {"train_loss": -19.63498306274414, "global_step": 37462, "epoch": 451} {"train_loss": -19.29498863220215, "global_step": 37463, "epoch": 451} {"train_loss": -19.086811065673828, "global_step": 37464, "epoch": 451} {"train_loss": -19.710142135620117, "global_step": 37465, "epoch": 451} {"train_loss": -19.15937614440918, "global_step": 37466, "epoch": 451} {"train_loss": -18.929061889648438, "global_step": 37467, "epoch": 451} {"train_loss": -19.3729305267334, "global_step": 37468, "epoch": 451} {"train_loss": -19.634244918823242, "global_step": 37469, "epoch": 451} {"train_loss": -19.366737365722656, "global_step": 37470, "epoch": 451} {"train_loss": -18.946319580078125, "global_step": 37471, "epoch": 451} {"train_loss": -19.57404899597168, "global_step": 37472, "epoch": 451} {"train_loss": -19.590801239013672, "global_step": 37473, "epoch": 451} {"train_loss": -19.325292587280273, "global_step": 37474, "epoch": 451} {"train_loss": -18.967912673950195, "global_step": 37475, "epoch": 451} {"train_loss": -19.436582565307617, "global_step": 37476, "epoch": 451} {"train_loss": -19.387065887451172, "global_step": 37477, "epoch": 451} {"train_loss": -19.552627563476562, "global_step": 37478, "epoch": 451} {"train_loss": -19.163440704345703, "global_step": 37479, "epoch": 451} {"train_loss": -18.802146911621094, "global_step": 37480, "epoch": 451} {"train_loss": -19.47339630126953, "global_step": 37481, "epoch": 451} {"train_loss": -18.984888076782227, "global_step": 37482, "epoch": 451} {"train_loss": -19.340421676635742, "global_step": 37483, "epoch": 451} {"train_loss": -19.600942611694336, "global_step": 37484, "epoch": 451} {"train_loss": -19.271011352539062, "global_step": 37485, "epoch": 451} {"train_loss": -19.013402938842773, "global_step": 37486, "epoch": 451} {"train_loss": -19.10457420349121, "global_step": 37487, "epoch": 451} {"train_loss": -19.213144302368164, "global_step": 37488, "epoch": 451} {"train_loss": -19.492380142211914, "global_step": 37489, "epoch": 451} {"train_loss": -19.423215866088867, "global_step": 37490, "epoch": 451} {"train_loss": -19.69247055053711, "global_step": 37491, "epoch": 451} {"train_loss": -19.206085205078125, "global_step": 37492, "epoch": 451} {"train_loss": -19.00751304626465, "global_step": 37493, "epoch": 451} {"train_loss": -19.392541885375977, "global_step": 37494, "epoch": 451} {"train_loss": -19.218719482421875, "global_step": 37495, "epoch": 451} {"train_loss": -19.132007598876953, "global_step": 37496, "epoch": 451} {"train_loss": -19.20576286315918, "global_step": 37497, "epoch": 451} {"train_loss": -19.391563415527344, "global_step": 37498, "epoch": 451} {"train_loss": -19.19157600402832, "global_step": 37499, "epoch": 451} {"train_loss": -19.117889404296875, "global_step": 37500, "epoch": 451} {"train_loss": -19.341461181640625, "global_step": 37501, "epoch": 451} {"train_loss": -19.262907028198242, "global_step": 37502, "epoch": 451} {"train_loss": -19.53125, "global_step": 37503, "epoch": 451} {"train_loss": -19.516170501708984, "global_step": 37504, "epoch": 451} {"train_loss": -19.537046432495117, "global_step": 37505, "epoch": 451} {"train_loss": -19.17145347595215, "global_step": 37506, "epoch": 451} {"train_loss": -18.965503692626953, "global_step": 37507, "epoch": 451} {"train_loss": -19.308950424194336, "global_step": 37508, "epoch": 451} {"train_loss": -19.076541900634766, "global_step": 37509, "epoch": 451} {"train_loss": -19.30865478515625, "global_step": 37510, "epoch": 451} {"train_loss": -19.168319702148438, "global_step": 37511, "epoch": 451} {"train_loss": -19.345298767089844, "global_step": 37512, "epoch": 451} {"train_loss": -19.12630844116211, "global_step": 37513, "epoch": 451} {"train_loss": -19.442480087280273, "global_step": 37514, "epoch": 451} {"train_loss": -19.294319129851928, "global_step": 37515, "epoch": 451, "val_loss": 5873111.0} {"train_loss": -18.74057388305664, "global_step": 37516, "epoch": 452} {"train_loss": -18.87745475769043, "global_step": 37517, "epoch": 452} {"train_loss": -19.26008415222168, "global_step": 37518, "epoch": 452} {"train_loss": -18.871557235717773, "global_step": 37519, "epoch": 452} {"train_loss": -19.253141403198242, "global_step": 37520, "epoch": 452} {"train_loss": -18.582412719726562, "global_step": 37521, "epoch": 452} {"train_loss": -19.173704147338867, "global_step": 37522, "epoch": 452} {"train_loss": -19.10432243347168, "global_step": 37523, "epoch": 452} {"train_loss": -19.435344696044922, "global_step": 37524, "epoch": 452} {"train_loss": -19.00124168395996, "global_step": 37525, "epoch": 452} {"train_loss": -18.879270553588867, "global_step": 37526, "epoch": 452} {"train_loss": -19.35567283630371, "global_step": 37527, "epoch": 452} {"train_loss": -19.104736328125, "global_step": 37528, "epoch": 452} {"train_loss": -19.07294273376465, "global_step": 37529, "epoch": 452} {"train_loss": -19.27543067932129, "global_step": 37530, "epoch": 452} {"train_loss": -19.317811965942383, "global_step": 37531, "epoch": 452} {"train_loss": -19.112226486206055, "global_step": 37532, "epoch": 452} {"train_loss": -19.36532974243164, "global_step": 37533, "epoch": 452} {"train_loss": -18.7830753326416, "global_step": 37534, "epoch": 452} {"train_loss": -19.385746002197266, "global_step": 37535, "epoch": 452} {"train_loss": -19.2308406829834, "global_step": 37536, "epoch": 452} {"train_loss": -19.154218673706055, "global_step": 37537, "epoch": 452} {"train_loss": -19.590946197509766, "global_step": 37538, "epoch": 452} {"train_loss": -19.28070831298828, "global_step": 37539, "epoch": 452} {"train_loss": -19.226654052734375, "global_step": 37540, "epoch": 452} {"train_loss": -19.471860885620117, "global_step": 37541, "epoch": 452} {"train_loss": -19.470876693725586, "global_step": 37542, "epoch": 452} {"train_loss": -19.45831871032715, "global_step": 37543, "epoch": 452} {"train_loss": -19.269582748413086, "global_step": 37544, "epoch": 452} {"train_loss": -19.153915405273438, "global_step": 37545, "epoch": 452} {"train_loss": -19.131031036376953, "global_step": 37546, "epoch": 452} {"train_loss": -19.16765594482422, "global_step": 37547, "epoch": 452} {"train_loss": -19.11775016784668, "global_step": 37548, "epoch": 452} {"train_loss": -19.16412353515625, "global_step": 37549, "epoch": 452} {"train_loss": -19.325902938842773, "global_step": 37550, "epoch": 452} {"train_loss": -19.204938888549805, "global_step": 37551, "epoch": 452} {"train_loss": -19.23464012145996, "global_step": 37552, "epoch": 452} {"train_loss": -19.38270378112793, "global_step": 37553, "epoch": 452} {"train_loss": -19.00197982788086, "global_step": 37554, "epoch": 452} {"train_loss": -19.382810592651367, "global_step": 37555, "epoch": 452} {"train_loss": -19.38542366027832, "global_step": 37556, "epoch": 452} {"train_loss": -19.465299606323242, "global_step": 37557, "epoch": 452} {"train_loss": -19.32567596435547, "global_step": 37558, "epoch": 452} {"train_loss": -19.404598236083984, "global_step": 37559, "epoch": 452} {"train_loss": -19.39154815673828, "global_step": 37560, "epoch": 452} {"train_loss": -19.494916915893555, "global_step": 37561, "epoch": 452} {"train_loss": -19.804378509521484, "global_step": 37562, "epoch": 452} {"train_loss": -19.15583610534668, "global_step": 37563, "epoch": 452} {"train_loss": -19.627099990844727, "global_step": 37564, "epoch": 452} {"train_loss": -19.38190269470215, "global_step": 37565, "epoch": 452} {"train_loss": -19.656627655029297, "global_step": 37566, "epoch": 452} {"train_loss": -19.069976806640625, "global_step": 37567, "epoch": 452} {"train_loss": -19.112085342407227, "global_step": 37568, "epoch": 452} {"train_loss": -18.913434982299805, "global_step": 37569, "epoch": 452} {"train_loss": -19.430316925048828, "global_step": 37570, "epoch": 452} {"train_loss": -19.30286407470703, "global_step": 37571, "epoch": 452} {"train_loss": -19.627676010131836, "global_step": 37572, "epoch": 452} {"train_loss": -19.07795524597168, "global_step": 37573, "epoch": 452} {"train_loss": -19.409385681152344, "global_step": 37574, "epoch": 452} {"train_loss": -19.062545776367188, "global_step": 37575, "epoch": 452} {"train_loss": -19.465280532836914, "global_step": 37576, "epoch": 452} {"train_loss": -19.097431182861328, "global_step": 37577, "epoch": 452} {"train_loss": -19.330638885498047, "global_step": 37578, "epoch": 452} {"train_loss": -19.366323471069336, "global_step": 37579, "epoch": 452} {"train_loss": -19.27629852294922, "global_step": 37580, "epoch": 452} {"train_loss": -19.428266525268555, "global_step": 37581, "epoch": 452} {"train_loss": -18.842214584350586, "global_step": 37582, "epoch": 452} {"train_loss": -19.564687728881836, "global_step": 37583, "epoch": 452} {"train_loss": -19.51675033569336, "global_step": 37584, "epoch": 452} {"train_loss": -18.99399185180664, "global_step": 37585, "epoch": 452} {"train_loss": -19.404781341552734, "global_step": 37586, "epoch": 452} {"train_loss": -19.038320541381836, "global_step": 37587, "epoch": 452} {"train_loss": -19.115339279174805, "global_step": 37588, "epoch": 452} {"train_loss": -19.439992904663086, "global_step": 37589, "epoch": 452} {"train_loss": -19.52741050720215, "global_step": 37590, "epoch": 452} {"train_loss": -19.353322982788086, "global_step": 37591, "epoch": 452} {"train_loss": -19.544429779052734, "global_step": 37592, "epoch": 452} {"train_loss": -18.946012496948242, "global_step": 37593, "epoch": 452} {"train_loss": -19.51833152770996, "global_step": 37594, "epoch": 452} {"train_loss": -18.9526424407959, "global_step": 37595, "epoch": 452} {"train_loss": -19.172555923461914, "global_step": 37596, "epoch": 452} {"train_loss": -19.145177841186523, "global_step": 37597, "epoch": 452} {"train_loss": -19.24253571751606, "global_step": 37598, "epoch": 452, "val_loss": 5872220.0} {"train_loss": -18.795339584350586, "global_step": 37599, "epoch": 453} {"train_loss": -18.905841827392578, "global_step": 37600, "epoch": 453} {"train_loss": -19.185317993164062, "global_step": 37601, "epoch": 453} {"train_loss": -18.771291732788086, "global_step": 37602, "epoch": 453} {"train_loss": -18.98955726623535, "global_step": 37603, "epoch": 453} {"train_loss": -19.40277671813965, "global_step": 37604, "epoch": 453} {"train_loss": -19.0062255859375, "global_step": 37605, "epoch": 453} {"train_loss": -18.843467712402344, "global_step": 37606, "epoch": 453} {"train_loss": -19.138874053955078, "global_step": 37607, "epoch": 453} {"train_loss": -19.2537784576416, "global_step": 37608, "epoch": 453} {"train_loss": -19.299875259399414, "global_step": 37609, "epoch": 453} {"train_loss": -19.186355590820312, "global_step": 37610, "epoch": 453} {"train_loss": -19.00136375427246, "global_step": 37611, "epoch": 453} {"train_loss": -19.372196197509766, "global_step": 37612, "epoch": 453} {"train_loss": -19.51612663269043, "global_step": 37613, "epoch": 453} {"train_loss": -19.298931121826172, "global_step": 37614, "epoch": 453} {"train_loss": -19.322738647460938, "global_step": 37615, "epoch": 453} {"train_loss": -19.216733932495117, "global_step": 37616, "epoch": 453} {"train_loss": -19.060089111328125, "global_step": 37617, "epoch": 453} {"train_loss": -19.495702743530273, "global_step": 37618, "epoch": 453} {"train_loss": -19.5775146484375, "global_step": 37619, "epoch": 453} {"train_loss": -19.398670196533203, "global_step": 37620, "epoch": 453} {"train_loss": -19.210479736328125, "global_step": 37621, "epoch": 453} {"train_loss": -19.489500045776367, "global_step": 37622, "epoch": 453} {"train_loss": -19.563823699951172, "global_step": 37623, "epoch": 453} {"train_loss": -19.618494033813477, "global_step": 37624, "epoch": 453} {"train_loss": -19.333478927612305, "global_step": 37625, "epoch": 453} {"train_loss": -18.953786849975586, "global_step": 37626, "epoch": 453} {"train_loss": -19.696060180664062, "global_step": 37627, "epoch": 453} {"train_loss": -19.736967086791992, "global_step": 37628, "epoch": 453} {"train_loss": -19.284849166870117, "global_step": 37629, "epoch": 453} {"train_loss": -19.58395004272461, "global_step": 37630, "epoch": 453} {"train_loss": -19.153907775878906, "global_step": 37631, "epoch": 453} {"train_loss": -19.347177505493164, "global_step": 37632, "epoch": 453} {"train_loss": -19.41481590270996, "global_step": 37633, "epoch": 453} {"train_loss": -19.395097732543945, "global_step": 37634, "epoch": 453} {"train_loss": -19.48720359802246, "global_step": 37635, "epoch": 453} {"train_loss": -19.273374557495117, "global_step": 37636, "epoch": 453} {"train_loss": -19.624021530151367, "global_step": 37637, "epoch": 453} {"train_loss": -19.121015548706055, "global_step": 37638, "epoch": 453} {"train_loss": -19.32698631286621, "global_step": 37639, "epoch": 453} {"train_loss": -19.619821548461914, "global_step": 37640, "epoch": 453} {"train_loss": -19.325223922729492, "global_step": 37641, "epoch": 453} {"train_loss": -19.47482681274414, "global_step": 37642, "epoch": 453} {"train_loss": -19.216903686523438, "global_step": 37643, "epoch": 453} {"train_loss": -19.12919044494629, "global_step": 37644, "epoch": 453} {"train_loss": -19.429397583007812, "global_step": 37645, "epoch": 453} {"train_loss": -18.93341064453125, "global_step": 37646, "epoch": 453} {"train_loss": -19.34528160095215, "global_step": 37647, "epoch": 453} {"train_loss": -19.0804386138916, "global_step": 37648, "epoch": 453} {"train_loss": -19.3963623046875, "global_step": 37649, "epoch": 453} {"train_loss": -19.107290267944336, "global_step": 37650, "epoch": 453} {"train_loss": -19.082975387573242, "global_step": 37651, "epoch": 453} {"train_loss": -19.545804977416992, "global_step": 37652, "epoch": 453} {"train_loss": -19.214405059814453, "global_step": 37653, "epoch": 453} {"train_loss": -19.371030807495117, "global_step": 37654, "epoch": 453} {"train_loss": -19.50263023376465, "global_step": 37655, "epoch": 453} {"train_loss": -19.152700424194336, "global_step": 37656, "epoch": 453} {"train_loss": -20.05491065979004, "global_step": 37657, "epoch": 453} {"train_loss": -19.55672264099121, "global_step": 37658, "epoch": 453} {"train_loss": -19.387365341186523, "global_step": 37659, "epoch": 453} {"train_loss": -19.385072708129883, "global_step": 37660, "epoch": 453} {"train_loss": -19.694881439208984, "global_step": 37661, "epoch": 453} {"train_loss": -19.315114974975586, "global_step": 37662, "epoch": 453} {"train_loss": -19.308958053588867, "global_step": 37663, "epoch": 453} {"train_loss": -19.163902282714844, "global_step": 37664, "epoch": 453} {"train_loss": -19.234485626220703, "global_step": 37665, "epoch": 453} {"train_loss": -19.516132354736328, "global_step": 37666, "epoch": 453} {"train_loss": -19.034313201904297, "global_step": 37667, "epoch": 453} {"train_loss": -19.446073532104492, "global_step": 37668, "epoch": 453} {"train_loss": -19.339862823486328, "global_step": 37669, "epoch": 453} {"train_loss": -19.19698715209961, "global_step": 37670, "epoch": 453} {"train_loss": -19.508529663085938, "global_step": 37671, "epoch": 453} {"train_loss": -19.320693969726562, "global_step": 37672, "epoch": 453} {"train_loss": -19.54764175415039, "global_step": 37673, "epoch": 453} {"train_loss": -19.577688217163086, "global_step": 37674, "epoch": 453} {"train_loss": -18.804224014282227, "global_step": 37675, "epoch": 453} {"train_loss": -19.42121696472168, "global_step": 37676, "epoch": 453} {"train_loss": -19.734874725341797, "global_step": 37677, "epoch": 453} {"train_loss": -19.36412239074707, "global_step": 37678, "epoch": 453} {"train_loss": -19.71311378479004, "global_step": 37679, "epoch": 453} {"train_loss": -19.161596298217773, "global_step": 37680, "epoch": 453} {"train_loss": -19.30774314145008, "global_step": 37681, "epoch": 453, "val_loss": 6024042.0} {"train_loss": -19.08391571044922, "global_step": 37682, "epoch": 454} {"train_loss": -19.46866226196289, "global_step": 37683, "epoch": 454} {"train_loss": -19.202167510986328, "global_step": 37684, "epoch": 454} {"train_loss": -18.97418785095215, "global_step": 37685, "epoch": 454} {"train_loss": -19.233640670776367, "global_step": 37686, "epoch": 454} {"train_loss": -19.317319869995117, "global_step": 37687, "epoch": 454} {"train_loss": -18.892419815063477, "global_step": 37688, "epoch": 454} {"train_loss": -18.88542366027832, "global_step": 37689, "epoch": 454} {"train_loss": -19.245702743530273, "global_step": 37690, "epoch": 454} {"train_loss": -19.205936431884766, "global_step": 37691, "epoch": 454} {"train_loss": -19.272396087646484, "global_step": 37692, "epoch": 454} {"train_loss": -19.06973648071289, "global_step": 37693, "epoch": 454} {"train_loss": -19.52884864807129, "global_step": 37694, "epoch": 454} {"train_loss": -19.44886016845703, "global_step": 37695, "epoch": 454} {"train_loss": -19.094141006469727, "global_step": 37696, "epoch": 454} {"train_loss": -19.09682273864746, "global_step": 37697, "epoch": 454} {"train_loss": -19.21278953552246, "global_step": 37698, "epoch": 454} {"train_loss": -19.546602249145508, "global_step": 37699, "epoch": 454} {"train_loss": -19.641677856445312, "global_step": 37700, "epoch": 454} {"train_loss": -18.75483512878418, "global_step": 37701, "epoch": 454} {"train_loss": -19.354642868041992, "global_step": 37702, "epoch": 454} {"train_loss": -19.49127197265625, "global_step": 37703, "epoch": 454} {"train_loss": -19.05607795715332, "global_step": 37704, "epoch": 454} {"train_loss": -19.374265670776367, "global_step": 37705, "epoch": 454} {"train_loss": -19.44075584411621, "global_step": 37706, "epoch": 454} {"train_loss": -19.416215896606445, "global_step": 37707, "epoch": 454} {"train_loss": -18.983001708984375, "global_step": 37708, "epoch": 454} {"train_loss": -19.384662628173828, "global_step": 37709, "epoch": 454} {"train_loss": -19.291471481323242, "global_step": 37710, "epoch": 454} {"train_loss": -19.49159049987793, "global_step": 37711, "epoch": 454} {"train_loss": -19.80953598022461, "global_step": 37712, "epoch": 454} {"train_loss": -19.309158325195312, "global_step": 37713, "epoch": 454} {"train_loss": -19.372196197509766, "global_step": 37714, "epoch": 454} {"train_loss": -19.908315658569336, "global_step": 37715, "epoch": 454} {"train_loss": -19.376188278198242, "global_step": 37716, "epoch": 454} {"train_loss": -19.32231903076172, "global_step": 37717, "epoch": 454} {"train_loss": -19.3100528717041, "global_step": 37718, "epoch": 454} {"train_loss": -19.117359161376953, "global_step": 37719, "epoch": 454} {"train_loss": -19.145645141601562, "global_step": 37720, "epoch": 454} {"train_loss": -19.520292282104492, "global_step": 37721, "epoch": 454} {"train_loss": -19.32109260559082, "global_step": 37722, "epoch": 454} {"train_loss": -19.3017520904541, "global_step": 37723, "epoch": 454} {"train_loss": -19.336524963378906, "global_step": 37724, "epoch": 454} {"train_loss": -19.49674415588379, "global_step": 37725, "epoch": 454} {"train_loss": -19.303070068359375, "global_step": 37726, "epoch": 454} {"train_loss": -19.573575973510742, "global_step": 37727, "epoch": 454} {"train_loss": -19.29096031188965, "global_step": 37728, "epoch": 454} {"train_loss": -19.329633712768555, "global_step": 37729, "epoch": 454} {"train_loss": -19.365644454956055, "global_step": 37730, "epoch": 454} {"train_loss": -19.50899887084961, "global_step": 37731, "epoch": 454} {"train_loss": -19.51930046081543, "global_step": 37732, "epoch": 454} {"train_loss": -19.29754638671875, "global_step": 37733, "epoch": 454} {"train_loss": -19.383512496948242, "global_step": 37734, "epoch": 454} {"train_loss": -19.576555252075195, "global_step": 37735, "epoch": 454} {"train_loss": -19.664810180664062, "global_step": 37736, "epoch": 454} {"train_loss": -18.9897518157959, "global_step": 37737, "epoch": 454} {"train_loss": -19.2945556640625, "global_step": 37738, "epoch": 454} {"train_loss": -19.373153686523438, "global_step": 37739, "epoch": 454} {"train_loss": -19.32028579711914, "global_step": 37740, "epoch": 454} {"train_loss": -19.382944107055664, "global_step": 37741, "epoch": 454} {"train_loss": -19.608339309692383, "global_step": 37742, "epoch": 454} {"train_loss": -19.05188751220703, "global_step": 37743, "epoch": 454} {"train_loss": -19.367847442626953, "global_step": 37744, "epoch": 454} {"train_loss": -19.669010162353516, "global_step": 37745, "epoch": 454} {"train_loss": -19.64106559753418, "global_step": 37746, "epoch": 454} {"train_loss": -19.49241828918457, "global_step": 37747, "epoch": 454} {"train_loss": -19.360488891601562, "global_step": 37748, "epoch": 454} {"train_loss": -19.443017959594727, "global_step": 37749, "epoch": 454} {"train_loss": -19.16054344177246, "global_step": 37750, "epoch": 454} {"train_loss": -19.475101470947266, "global_step": 37751, "epoch": 454} {"train_loss": -18.864688873291016, "global_step": 37752, "epoch": 454} {"train_loss": -19.357166290283203, "global_step": 37753, "epoch": 454} {"train_loss": -19.33714485168457, "global_step": 37754, "epoch": 454} {"train_loss": -19.1497802734375, "global_step": 37755, "epoch": 454} {"train_loss": -19.022493362426758, "global_step": 37756, "epoch": 454} {"train_loss": -19.60788345336914, "global_step": 37757, "epoch": 454} {"train_loss": -19.335935592651367, "global_step": 37758, "epoch": 454} {"train_loss": -19.307554244995117, "global_step": 37759, "epoch": 454} {"train_loss": -19.662473678588867, "global_step": 37760, "epoch": 454} {"train_loss": -19.41206932067871, "global_step": 37761, "epoch": 454} {"train_loss": -19.100812911987305, "global_step": 37762, "epoch": 454} {"train_loss": -19.1544246673584, "global_step": 37763, "epoch": 454} {"train_loss": -19.322249148265424, "global_step": 37764, "epoch": 454, "val_loss": 5995982.0} {"train_loss": -18.632307052612305, "global_step": 37765, "epoch": 455} {"train_loss": -18.87710952758789, "global_step": 37766, "epoch": 455} {"train_loss": -18.896394729614258, "global_step": 37767, "epoch": 455} {"train_loss": -18.9080867767334, "global_step": 37768, "epoch": 455} {"train_loss": -18.606266021728516, "global_step": 37769, "epoch": 455} {"train_loss": -18.89686393737793, "global_step": 37770, "epoch": 455} {"train_loss": -18.85601806640625, "global_step": 37771, "epoch": 455} {"train_loss": -19.111156463623047, "global_step": 37772, "epoch": 455} {"train_loss": -19.28046989440918, "global_step": 37773, "epoch": 455} {"train_loss": -19.225759506225586, "global_step": 37774, "epoch": 455} {"train_loss": -19.2855281829834, "global_step": 37775, "epoch": 455} {"train_loss": -19.11432456970215, "global_step": 37776, "epoch": 455} {"train_loss": -19.335708618164062, "global_step": 37777, "epoch": 455} {"train_loss": -19.302093505859375, "global_step": 37778, "epoch": 455} {"train_loss": -19.090972900390625, "global_step": 37779, "epoch": 455} {"train_loss": -19.1380672454834, "global_step": 37780, "epoch": 455} {"train_loss": -19.39304542541504, "global_step": 37781, "epoch": 455} {"train_loss": -19.11257553100586, "global_step": 37782, "epoch": 455} {"train_loss": -19.325397491455078, "global_step": 37783, "epoch": 455} {"train_loss": -19.31564712524414, "global_step": 37784, "epoch": 455} {"train_loss": -19.26497459411621, "global_step": 37785, "epoch": 455} {"train_loss": -18.7752742767334, "global_step": 37786, "epoch": 455} {"train_loss": -19.203163146972656, "global_step": 37787, "epoch": 455} {"train_loss": -19.40053367614746, "global_step": 37788, "epoch": 455} {"train_loss": -19.25307273864746, "global_step": 37789, "epoch": 455} {"train_loss": -19.507726669311523, "global_step": 37790, "epoch": 455} {"train_loss": -19.57685089111328, "global_step": 37791, "epoch": 455} {"train_loss": -19.081958770751953, "global_step": 37792, "epoch": 455} {"train_loss": -19.42962074279785, "global_step": 37793, "epoch": 455} {"train_loss": -19.2406063079834, "global_step": 37794, "epoch": 455} {"train_loss": -19.157621383666992, "global_step": 37795, "epoch": 455} {"train_loss": -19.480066299438477, "global_step": 37796, "epoch": 455} {"train_loss": -18.84866714477539, "global_step": 37797, "epoch": 455} {"train_loss": -19.197851181030273, "global_step": 37798, "epoch": 455} {"train_loss": -19.278247833251953, "global_step": 37799, "epoch": 455} {"train_loss": -19.402738571166992, "global_step": 37800, "epoch": 455} {"train_loss": -19.349197387695312, "global_step": 37801, "epoch": 455} {"train_loss": -19.633140563964844, "global_step": 37802, "epoch": 455} {"train_loss": -19.57512855529785, "global_step": 37803, "epoch": 455} {"train_loss": -19.68041229248047, "global_step": 37804, "epoch": 455} {"train_loss": -19.184255599975586, "global_step": 37805, "epoch": 455} {"train_loss": -19.506240844726562, "global_step": 37806, "epoch": 455} {"train_loss": -19.437414169311523, "global_step": 37807, "epoch": 455} {"train_loss": -19.317319869995117, "global_step": 37808, "epoch": 455} {"train_loss": -19.5576229095459, "global_step": 37809, "epoch": 455} {"train_loss": -19.13334083557129, "global_step": 37810, "epoch": 455} {"train_loss": -19.066431045532227, "global_step": 37811, "epoch": 455} {"train_loss": -19.3521785736084, "global_step": 37812, "epoch": 455} {"train_loss": -19.231801986694336, "global_step": 37813, "epoch": 455} {"train_loss": -19.569416046142578, "global_step": 37814, "epoch": 455} {"train_loss": -19.199237823486328, "global_step": 37815, "epoch": 455} {"train_loss": -19.54032325744629, "global_step": 37816, "epoch": 455} {"train_loss": -19.788982391357422, "global_step": 37817, "epoch": 455} {"train_loss": -19.088682174682617, "global_step": 37818, "epoch": 455} {"train_loss": -19.043447494506836, "global_step": 37819, "epoch": 455} {"train_loss": -19.392045974731445, "global_step": 37820, "epoch": 455} {"train_loss": -19.469144821166992, "global_step": 37821, "epoch": 455} {"train_loss": -19.448705673217773, "global_step": 37822, "epoch": 455} {"train_loss": -19.392425537109375, "global_step": 37823, "epoch": 455} {"train_loss": -19.33954620361328, "global_step": 37824, "epoch": 455} {"train_loss": -19.452970504760742, "global_step": 37825, "epoch": 455} {"train_loss": -19.80139923095703, "global_step": 37826, "epoch": 455} {"train_loss": -19.281269073486328, "global_step": 37827, "epoch": 455} {"train_loss": -19.372793197631836, "global_step": 37828, "epoch": 455} {"train_loss": -19.135229110717773, "global_step": 37829, "epoch": 455} {"train_loss": -19.601713180541992, "global_step": 37830, "epoch": 455} {"train_loss": -19.72417449951172, "global_step": 37831, "epoch": 455} {"train_loss": -19.586484909057617, "global_step": 37832, "epoch": 455} {"train_loss": -19.274625778198242, "global_step": 37833, "epoch": 455} {"train_loss": -19.660690307617188, "global_step": 37834, "epoch": 455} {"train_loss": -19.281843185424805, "global_step": 37835, "epoch": 455} {"train_loss": -18.931676864624023, "global_step": 37836, "epoch": 455} {"train_loss": -19.16704750061035, "global_step": 37837, "epoch": 455} {"train_loss": -19.513975143432617, "global_step": 37838, "epoch": 455} {"train_loss": -19.800382614135742, "global_step": 37839, "epoch": 455} {"train_loss": -19.821565628051758, "global_step": 37840, "epoch": 455} {"train_loss": -19.2990779876709, "global_step": 37841, "epoch": 455} {"train_loss": -19.290878295898438, "global_step": 37842, "epoch": 455} {"train_loss": -19.214677810668945, "global_step": 37843, "epoch": 455} {"train_loss": -19.397920608520508, "global_step": 37844, "epoch": 455} {"train_loss": -19.543554306030273, "global_step": 37845, "epoch": 455} {"train_loss": -19.205524444580078, "global_step": 37846, "epoch": 455} {"train_loss": -19.27332443788827, "global_step": 37847, "epoch": 455, "val_loss": 5986382.0} {"train_loss": -19.131025314331055, "global_step": 37848, "epoch": 456} {"train_loss": -19.198339462280273, "global_step": 37849, "epoch": 456} {"train_loss": -19.44346809387207, "global_step": 37850, "epoch": 456} {"train_loss": -19.438196182250977, "global_step": 37851, "epoch": 456} {"train_loss": -18.961414337158203, "global_step": 37852, "epoch": 456} {"train_loss": -19.155366897583008, "global_step": 37853, "epoch": 456} {"train_loss": -19.281389236450195, "global_step": 37854, "epoch": 456} {"train_loss": -19.670251846313477, "global_step": 37855, "epoch": 456} {"train_loss": -19.18449592590332, "global_step": 37856, "epoch": 456} {"train_loss": -19.32272720336914, "global_step": 37857, "epoch": 456} {"train_loss": -19.388172149658203, "global_step": 37858, "epoch": 456} {"train_loss": -19.239431381225586, "global_step": 37859, "epoch": 456} {"train_loss": -19.187580108642578, "global_step": 37860, "epoch": 456} {"train_loss": -19.176923751831055, "global_step": 37861, "epoch": 456} {"train_loss": -19.393779754638672, "global_step": 37862, "epoch": 456} {"train_loss": -19.26275634765625, "global_step": 37863, "epoch": 456} {"train_loss": -19.37721824645996, "global_step": 37864, "epoch": 456} {"train_loss": -19.054515838623047, "global_step": 37865, "epoch": 456} {"train_loss": -19.65509033203125, "global_step": 37866, "epoch": 456} {"train_loss": -19.118093490600586, "global_step": 37867, "epoch": 456} {"train_loss": -19.77915382385254, "global_step": 37868, "epoch": 456} {"train_loss": -19.266218185424805, "global_step": 37869, "epoch": 456} {"train_loss": -19.416725158691406, "global_step": 37870, "epoch": 456} {"train_loss": -19.71733283996582, "global_step": 37871, "epoch": 456} {"train_loss": -19.32204818725586, "global_step": 37872, "epoch": 456} {"train_loss": -19.052173614501953, "global_step": 37873, "epoch": 456} {"train_loss": -18.9804630279541, "global_step": 37874, "epoch": 456} {"train_loss": -19.51779556274414, "global_step": 37875, "epoch": 456} {"train_loss": -19.36251449584961, "global_step": 37876, "epoch": 456} {"train_loss": -18.845251083374023, "global_step": 37877, "epoch": 456} {"train_loss": -19.36221694946289, "global_step": 37878, "epoch": 456} {"train_loss": -19.055419921875, "global_step": 37879, "epoch": 456} {"train_loss": -19.450159072875977, "global_step": 37880, "epoch": 456} {"train_loss": -19.4049129486084, "global_step": 37881, "epoch": 456} {"train_loss": -19.555578231811523, "global_step": 37882, "epoch": 456} {"train_loss": -19.58686637878418, "global_step": 37883, "epoch": 456} {"train_loss": -19.15334129333496, "global_step": 37884, "epoch": 456} {"train_loss": -19.43146324157715, "global_step": 37885, "epoch": 456} {"train_loss": -19.266889572143555, "global_step": 37886, "epoch": 456} {"train_loss": -19.21779441833496, "global_step": 37887, "epoch": 456} {"train_loss": -19.422348022460938, "global_step": 37888, "epoch": 456} {"train_loss": -19.303983688354492, "global_step": 37889, "epoch": 456} {"train_loss": -19.405784606933594, "global_step": 37890, "epoch": 456} {"train_loss": -19.137847900390625, "global_step": 37891, "epoch": 456} {"train_loss": -19.50986671447754, "global_step": 37892, "epoch": 456} {"train_loss": -19.211423873901367, "global_step": 37893, "epoch": 456} {"train_loss": -19.687143325805664, "global_step": 37894, "epoch": 456} {"train_loss": -19.11127471923828, "global_step": 37895, "epoch": 456} {"train_loss": -19.584741592407227, "global_step": 37896, "epoch": 456} {"train_loss": -19.243383407592773, "global_step": 37897, "epoch": 456} {"train_loss": -19.431005477905273, "global_step": 37898, "epoch": 456} {"train_loss": -19.522613525390625, "global_step": 37899, "epoch": 456} {"train_loss": -19.078733444213867, "global_step": 37900, "epoch": 456} {"train_loss": -19.34754753112793, "global_step": 37901, "epoch": 456} {"train_loss": -19.66660499572754, "global_step": 37902, "epoch": 456} {"train_loss": -19.328935623168945, "global_step": 37903, "epoch": 456} {"train_loss": -18.972684860229492, "global_step": 37904, "epoch": 456} {"train_loss": -19.472021102905273, "global_step": 37905, "epoch": 456} {"train_loss": -19.356586456298828, "global_step": 37906, "epoch": 456} {"train_loss": -19.416807174682617, "global_step": 37907, "epoch": 456} {"train_loss": -19.57683563232422, "global_step": 37908, "epoch": 456} {"train_loss": -19.231698989868164, "global_step": 37909, "epoch": 456} {"train_loss": -19.606616973876953, "global_step": 37910, "epoch": 456} {"train_loss": -19.268842697143555, "global_step": 37911, "epoch": 456} {"train_loss": -19.78062629699707, "global_step": 37912, "epoch": 456} {"train_loss": -19.131628036499023, "global_step": 37913, "epoch": 456} {"train_loss": -19.50467872619629, "global_step": 37914, "epoch": 456} {"train_loss": -19.267980575561523, "global_step": 37915, "epoch": 456} {"train_loss": -19.349416732788086, "global_step": 37916, "epoch": 456} {"train_loss": -19.514163970947266, "global_step": 37917, "epoch": 456} {"train_loss": -19.392446517944336, "global_step": 37918, "epoch": 456} {"train_loss": -18.93340301513672, "global_step": 37919, "epoch": 456} {"train_loss": -19.37332534790039, "global_step": 37920, "epoch": 456} {"train_loss": -19.58684730529785, "global_step": 37921, "epoch": 456} {"train_loss": -19.643686294555664, "global_step": 37922, "epoch": 456} {"train_loss": -19.505502700805664, "global_step": 37923, "epoch": 456} {"train_loss": -19.072528839111328, "global_step": 37924, "epoch": 456} {"train_loss": -19.506223678588867, "global_step": 37925, "epoch": 456} {"train_loss": -19.4663143157959, "global_step": 37926, "epoch": 456} {"train_loss": -19.459638595581055, "global_step": 37927, "epoch": 456} {"train_loss": -19.421003341674805, "global_step": 37928, "epoch": 456} {"train_loss": -19.709625244140625, "global_step": 37929, "epoch": 456} {"train_loss": -19.358811275068536, "global_step": 37930, "epoch": 456, "val_loss": 6160928.5} {"train_loss": -19.646743774414062, "global_step": 37931, "epoch": 457} {"train_loss": -19.22564125061035, "global_step": 37932, "epoch": 457} {"train_loss": -19.05454444885254, "global_step": 37933, "epoch": 457} {"train_loss": -19.065139770507812, "global_step": 37934, "epoch": 457} {"train_loss": -19.007225036621094, "global_step": 37935, "epoch": 457} {"train_loss": -19.024290084838867, "global_step": 37936, "epoch": 457} {"train_loss": -19.515047073364258, "global_step": 37937, "epoch": 457} {"train_loss": -19.069955825805664, "global_step": 37938, "epoch": 457} {"train_loss": -19.059585571289062, "global_step": 37939, "epoch": 457} {"train_loss": -19.520307540893555, "global_step": 37940, "epoch": 457} {"train_loss": -19.10169792175293, "global_step": 37941, "epoch": 457} {"train_loss": -19.253955841064453, "global_step": 37942, "epoch": 457} {"train_loss": -19.24479866027832, "global_step": 37943, "epoch": 457} {"train_loss": -19.218297958374023, "global_step": 37944, "epoch": 457} {"train_loss": -19.648929595947266, "global_step": 37945, "epoch": 457} {"train_loss": -19.423765182495117, "global_step": 37946, "epoch": 457} {"train_loss": -19.26632308959961, "global_step": 37947, "epoch": 457} {"train_loss": -19.104787826538086, "global_step": 37948, "epoch": 457} {"train_loss": -19.066375732421875, "global_step": 37949, "epoch": 457} {"train_loss": -19.3785400390625, "global_step": 37950, "epoch": 457} {"train_loss": -19.560148239135742, "global_step": 37951, "epoch": 457} {"train_loss": -19.19242286682129, "global_step": 37952, "epoch": 457} {"train_loss": -18.946252822875977, "global_step": 37953, "epoch": 457} {"train_loss": -19.159305572509766, "global_step": 37954, "epoch": 457} {"train_loss": -19.47878074645996, "global_step": 37955, "epoch": 457} {"train_loss": -19.534563064575195, "global_step": 37956, "epoch": 457} {"train_loss": -19.281082153320312, "global_step": 37957, "epoch": 457} {"train_loss": -19.200300216674805, "global_step": 37958, "epoch": 457} {"train_loss": -19.612445831298828, "global_step": 37959, "epoch": 457} {"train_loss": -19.672895431518555, "global_step": 37960, "epoch": 457} {"train_loss": -19.31987762451172, "global_step": 37961, "epoch": 457} {"train_loss": -19.689041137695312, "global_step": 37962, "epoch": 457} {"train_loss": -19.24978256225586, "global_step": 37963, "epoch": 457} {"train_loss": -19.327322006225586, "global_step": 37964, "epoch": 457} {"train_loss": -19.334455490112305, "global_step": 37965, "epoch": 457} {"train_loss": -19.55381202697754, "global_step": 37966, "epoch": 457} {"train_loss": -19.191730499267578, "global_step": 37967, "epoch": 457} {"train_loss": -19.473947525024414, "global_step": 37968, "epoch": 457} {"train_loss": -19.428359985351562, "global_step": 37969, "epoch": 457} {"train_loss": -19.205699920654297, "global_step": 37970, "epoch": 457} {"train_loss": -19.278812408447266, "global_step": 37971, "epoch": 457} {"train_loss": -19.51225471496582, "global_step": 37972, "epoch": 457} {"train_loss": -19.196975708007812, "global_step": 37973, "epoch": 457} {"train_loss": -19.30574607849121, "global_step": 37974, "epoch": 457} {"train_loss": -19.19746971130371, "global_step": 37975, "epoch": 457} {"train_loss": -19.231033325195312, "global_step": 37976, "epoch": 457} {"train_loss": -19.01687240600586, "global_step": 37977, "epoch": 457} {"train_loss": -19.243391036987305, "global_step": 37978, "epoch": 457} {"train_loss": -19.479581832885742, "global_step": 37979, "epoch": 457} {"train_loss": -19.0933895111084, "global_step": 37980, "epoch": 457} {"train_loss": -19.55133628845215, "global_step": 37981, "epoch": 457} {"train_loss": -19.6279354095459, "global_step": 37982, "epoch": 457} {"train_loss": -19.147356033325195, "global_step": 37983, "epoch": 457} {"train_loss": -19.3525390625, "global_step": 37984, "epoch": 457} {"train_loss": -19.22059440612793, "global_step": 37985, "epoch": 457} {"train_loss": -19.377195358276367, "global_step": 37986, "epoch": 457} {"train_loss": -19.203933715820312, "global_step": 37987, "epoch": 457} {"train_loss": -19.448331832885742, "global_step": 37988, "epoch": 457} {"train_loss": -19.486082077026367, "global_step": 37989, "epoch": 457} {"train_loss": -19.362035751342773, "global_step": 37990, "epoch": 457} {"train_loss": -19.675579071044922, "global_step": 37991, "epoch": 457} {"train_loss": -19.740949630737305, "global_step": 37992, "epoch": 457} {"train_loss": -19.515277862548828, "global_step": 37993, "epoch": 457} {"train_loss": -19.337669372558594, "global_step": 37994, "epoch": 457} {"train_loss": -19.56435203552246, "global_step": 37995, "epoch": 457} {"train_loss": -19.50312614440918, "global_step": 37996, "epoch": 457} {"train_loss": -18.9356632232666, "global_step": 37997, "epoch": 457} {"train_loss": -19.60150909423828, "global_step": 37998, "epoch": 457} {"train_loss": -19.353668212890625, "global_step": 37999, "epoch": 457} {"train_loss": -19.433530807495117, "global_step": 38000, "epoch": 457} {"train_loss": -19.165103912353516, "global_step": 38001, "epoch": 457} {"train_loss": -19.443716049194336, "global_step": 38002, "epoch": 457} {"train_loss": -19.162384033203125, "global_step": 38003, "epoch": 457} {"train_loss": -19.2976131439209, "global_step": 38004, "epoch": 457} {"train_loss": -19.668060302734375, "global_step": 38005, "epoch": 457} {"train_loss": -19.42494010925293, "global_step": 38006, "epoch": 457} {"train_loss": -18.951824188232422, "global_step": 38007, "epoch": 457} {"train_loss": -19.509262084960938, "global_step": 38008, "epoch": 457} {"train_loss": -19.2767391204834, "global_step": 38009, "epoch": 457} {"train_loss": -19.52540397644043, "global_step": 38010, "epoch": 457} {"train_loss": -19.42082977294922, "global_step": 38011, "epoch": 457} {"train_loss": -19.252756118774414, "global_step": 38012, "epoch": 457} {"train_loss": -19.354055105921734, "global_step": 38013, "epoch": 457, "val_loss": 5983027.0} {"train_loss": -18.724254608154297, "global_step": 38014, "epoch": 458} {"train_loss": -19.004926681518555, "global_step": 38015, "epoch": 458} {"train_loss": -19.177000045776367, "global_step": 38016, "epoch": 458} {"train_loss": -19.004684448242188, "global_step": 38017, "epoch": 458} {"train_loss": -19.475751876831055, "global_step": 38018, "epoch": 458} {"train_loss": -18.94459342956543, "global_step": 38019, "epoch": 458} {"train_loss": -19.720670700073242, "global_step": 38020, "epoch": 458} {"train_loss": -18.724639892578125, "global_step": 38021, "epoch": 458} {"train_loss": -19.159543991088867, "global_step": 38022, "epoch": 458} {"train_loss": -19.433053970336914, "global_step": 38023, "epoch": 458} {"train_loss": -19.248931884765625, "global_step": 38024, "epoch": 458} {"train_loss": -19.342008590698242, "global_step": 38025, "epoch": 458} {"train_loss": -19.166772842407227, "global_step": 38026, "epoch": 458} {"train_loss": -19.552940368652344, "global_step": 38027, "epoch": 458} {"train_loss": -19.263694763183594, "global_step": 38028, "epoch": 458} {"train_loss": -19.147323608398438, "global_step": 38029, "epoch": 458} {"train_loss": -19.37160301208496, "global_step": 38030, "epoch": 458} {"train_loss": -18.978736877441406, "global_step": 38031, "epoch": 458} {"train_loss": -19.238645553588867, "global_step": 38032, "epoch": 458} {"train_loss": -19.555606842041016, "global_step": 38033, "epoch": 458} {"train_loss": -19.225675582885742, "global_step": 38034, "epoch": 458} {"train_loss": -19.11576271057129, "global_step": 38035, "epoch": 458} {"train_loss": -19.342300415039062, "global_step": 38036, "epoch": 458} {"train_loss": -19.385189056396484, "global_step": 38037, "epoch": 458} {"train_loss": -19.399337768554688, "global_step": 38038, "epoch": 458} {"train_loss": -19.312753677368164, "global_step": 38039, "epoch": 458} {"train_loss": -18.7515869140625, "global_step": 38040, "epoch": 458} {"train_loss": -19.36688804626465, "global_step": 38041, "epoch": 458} {"train_loss": -19.12380027770996, "global_step": 38042, "epoch": 458} {"train_loss": -19.734619140625, "global_step": 38043, "epoch": 458} {"train_loss": -19.422592163085938, "global_step": 38044, "epoch": 458} {"train_loss": -19.39393424987793, "global_step": 38045, "epoch": 458} {"train_loss": -19.34279441833496, "global_step": 38046, "epoch": 458} {"train_loss": -19.578168869018555, "global_step": 38047, "epoch": 458} {"train_loss": -19.459644317626953, "global_step": 38048, "epoch": 458} {"train_loss": -19.388442993164062, "global_step": 38049, "epoch": 458} {"train_loss": -19.396329879760742, "global_step": 38050, "epoch": 458} {"train_loss": -19.040502548217773, "global_step": 38051, "epoch": 458} {"train_loss": -19.233692169189453, "global_step": 38052, "epoch": 458} {"train_loss": -19.423465728759766, "global_step": 38053, "epoch": 458} {"train_loss": -19.448110580444336, "global_step": 38054, "epoch": 458} {"train_loss": -19.510202407836914, "global_step": 38055, "epoch": 458} {"train_loss": -19.658689498901367, "global_step": 38056, "epoch": 458} {"train_loss": -19.335712432861328, "global_step": 38057, "epoch": 458} {"train_loss": -19.5255069732666, "global_step": 38058, "epoch": 458} {"train_loss": -19.68423843383789, "global_step": 38059, "epoch": 458} {"train_loss": -19.118925094604492, "global_step": 38060, "epoch": 458} {"train_loss": -19.593442916870117, "global_step": 38061, "epoch": 458} {"train_loss": -19.356454849243164, "global_step": 38062, "epoch": 458} {"train_loss": -18.95976448059082, "global_step": 38063, "epoch": 458} {"train_loss": -19.475025177001953, "global_step": 38064, "epoch": 458} {"train_loss": -19.426570892333984, "global_step": 38065, "epoch": 458} {"train_loss": -19.648752212524414, "global_step": 38066, "epoch": 458} {"train_loss": -19.553083419799805, "global_step": 38067, "epoch": 458} {"train_loss": -19.48100471496582, "global_step": 38068, "epoch": 458} {"train_loss": -19.636062622070312, "global_step": 38069, "epoch": 458} {"train_loss": -18.797443389892578, "global_step": 38070, "epoch": 458} {"train_loss": -19.548433303833008, "global_step": 38071, "epoch": 458} {"train_loss": -19.490556716918945, "global_step": 38072, "epoch": 458} {"train_loss": -19.3688907623291, "global_step": 38073, "epoch": 458} {"train_loss": -19.03313446044922, "global_step": 38074, "epoch": 458} {"train_loss": -19.384933471679688, "global_step": 38075, "epoch": 458} {"train_loss": -18.818443298339844, "global_step": 38076, "epoch": 458} {"train_loss": -19.302776336669922, "global_step": 38077, "epoch": 458} {"train_loss": -19.27113151550293, "global_step": 38078, "epoch": 458} {"train_loss": -19.11276626586914, "global_step": 38079, "epoch": 458} {"train_loss": -19.456832885742188, "global_step": 38080, "epoch": 458} {"train_loss": -19.600025177001953, "global_step": 38081, "epoch": 458} {"train_loss": -19.48272132873535, "global_step": 38082, "epoch": 458} {"train_loss": -19.206235885620117, "global_step": 38083, "epoch": 458} {"train_loss": -19.25538444519043, "global_step": 38084, "epoch": 458} {"train_loss": -18.840909957885742, "global_step": 38085, "epoch": 458} {"train_loss": -19.004520416259766, "global_step": 38086, "epoch": 458} {"train_loss": -19.490966796875, "global_step": 38087, "epoch": 458} {"train_loss": -19.664478302001953, "global_step": 38088, "epoch": 458} {"train_loss": -19.20003890991211, "global_step": 38089, "epoch": 458} {"train_loss": -18.926990509033203, "global_step": 38090, "epoch": 458} {"train_loss": -19.246938705444336, "global_step": 38091, "epoch": 458} {"train_loss": -19.570995330810547, "global_step": 38092, "epoch": 458} {"train_loss": -19.273591995239258, "global_step": 38093, "epoch": 458} {"train_loss": -19.092443466186523, "global_step": 38094, "epoch": 458} {"train_loss": -19.399309158325195, "global_step": 38095, "epoch": 458} {"train_loss": -19.292132389114563, "global_step": 38096, "epoch": 458, "val_loss": 6082548.0} {"train_loss": -18.79846954345703, "global_step": 38097, "epoch": 459} {"train_loss": -18.660282135009766, "global_step": 38098, "epoch": 459} {"train_loss": -19.02105140686035, "global_step": 38099, "epoch": 459} {"train_loss": -18.910184860229492, "global_step": 38100, "epoch": 459} {"train_loss": -18.98885154724121, "global_step": 38101, "epoch": 459} {"train_loss": -19.339345932006836, "global_step": 38102, "epoch": 459} {"train_loss": -19.2352352142334, "global_step": 38103, "epoch": 459} {"train_loss": -19.37776756286621, "global_step": 38104, "epoch": 459} {"train_loss": -19.763933181762695, "global_step": 38105, "epoch": 459} {"train_loss": -19.061527252197266, "global_step": 38106, "epoch": 459} {"train_loss": -19.314756393432617, "global_step": 38107, "epoch": 459} {"train_loss": -19.52370262145996, "global_step": 38108, "epoch": 459} {"train_loss": -19.189990997314453, "global_step": 38109, "epoch": 459} {"train_loss": -19.43454360961914, "global_step": 38110, "epoch": 459} {"train_loss": -19.348920822143555, "global_step": 38111, "epoch": 459} {"train_loss": -19.497297286987305, "global_step": 38112, "epoch": 459} {"train_loss": -19.3992977142334, "global_step": 38113, "epoch": 459} {"train_loss": -19.460729598999023, "global_step": 38114, "epoch": 459} {"train_loss": -19.37806510925293, "global_step": 38115, "epoch": 459} {"train_loss": -19.39085578918457, "global_step": 38116, "epoch": 459} {"train_loss": -19.16633415222168, "global_step": 38117, "epoch": 459} {"train_loss": -19.40983009338379, "global_step": 38118, "epoch": 459} {"train_loss": -19.204172134399414, "global_step": 38119, "epoch": 459} {"train_loss": -19.09853172302246, "global_step": 38120, "epoch": 459} {"train_loss": -19.668590545654297, "global_step": 38121, "epoch": 459} {"train_loss": -19.45172119140625, "global_step": 38122, "epoch": 459} {"train_loss": -19.425466537475586, "global_step": 38123, "epoch": 459} {"train_loss": -19.567686080932617, "global_step": 38124, "epoch": 459} {"train_loss": -19.634458541870117, "global_step": 38125, "epoch": 459} {"train_loss": -19.31923484802246, "global_step": 38126, "epoch": 459} {"train_loss": -19.487741470336914, "global_step": 38127, "epoch": 459} {"train_loss": -19.5500431060791, "global_step": 38128, "epoch": 459} {"train_loss": -19.178359985351562, "global_step": 38129, "epoch": 459} {"train_loss": -19.186126708984375, "global_step": 38130, "epoch": 459} {"train_loss": -19.17479133605957, "global_step": 38131, "epoch": 459} {"train_loss": -19.097049713134766, "global_step": 38132, "epoch": 459} {"train_loss": -19.332786560058594, "global_step": 38133, "epoch": 459} {"train_loss": -19.074058532714844, "global_step": 38134, "epoch": 459} {"train_loss": -19.24787139892578, "global_step": 38135, "epoch": 459} {"train_loss": -19.18325424194336, "global_step": 38136, "epoch": 459} {"train_loss": -19.914968490600586, "global_step": 38137, "epoch": 459} {"train_loss": -19.29833984375, "global_step": 38138, "epoch": 459} {"train_loss": -19.060644149780273, "global_step": 38139, "epoch": 459} {"train_loss": -19.38814926147461, "global_step": 38140, "epoch": 459} {"train_loss": -19.424686431884766, "global_step": 38141, "epoch": 459} {"train_loss": -19.229230880737305, "global_step": 38142, "epoch": 459} {"train_loss": -19.212995529174805, "global_step": 38143, "epoch": 459} {"train_loss": -19.407516479492188, "global_step": 38144, "epoch": 459} {"train_loss": -19.170583724975586, "global_step": 38145, "epoch": 459} {"train_loss": -19.857500076293945, "global_step": 38146, "epoch": 459} {"train_loss": -19.3165340423584, "global_step": 38147, "epoch": 459} {"train_loss": -19.41904640197754, "global_step": 38148, "epoch": 459} {"train_loss": -19.585180282592773, "global_step": 38149, "epoch": 459} {"train_loss": -19.457380294799805, "global_step": 38150, "epoch": 459} {"train_loss": -19.608489990234375, "global_step": 38151, "epoch": 459} {"train_loss": -19.36623191833496, "global_step": 38152, "epoch": 459} {"train_loss": -19.470056533813477, "global_step": 38153, "epoch": 459} {"train_loss": -19.3232479095459, "global_step": 38154, "epoch": 459} {"train_loss": -19.5677490234375, "global_step": 38155, "epoch": 459} {"train_loss": -19.262178421020508, "global_step": 38156, "epoch": 459} {"train_loss": -19.53773307800293, "global_step": 38157, "epoch": 459} {"train_loss": -19.147140502929688, "global_step": 38158, "epoch": 459} {"train_loss": -19.28435707092285, "global_step": 38159, "epoch": 459} {"train_loss": -19.52783203125, "global_step": 38160, "epoch": 459} {"train_loss": -19.265003204345703, "global_step": 38161, "epoch": 459} {"train_loss": -19.166410446166992, "global_step": 38162, "epoch": 459} {"train_loss": -19.361064910888672, "global_step": 38163, "epoch": 459} {"train_loss": -19.189054489135742, "global_step": 38164, "epoch": 459} {"train_loss": -19.444963455200195, "global_step": 38165, "epoch": 459} {"train_loss": -19.769485473632812, "global_step": 38166, "epoch": 459} {"train_loss": -18.98714828491211, "global_step": 38167, "epoch": 459} {"train_loss": -19.2397518157959, "global_step": 38168, "epoch": 459} {"train_loss": -19.4049129486084, "global_step": 38169, "epoch": 459} {"train_loss": -19.147977828979492, "global_step": 38170, "epoch": 459} {"train_loss": -19.4569091796875, "global_step": 38171, "epoch": 459} {"train_loss": -19.319778442382812, "global_step": 38172, "epoch": 459} {"train_loss": -19.35748863220215, "global_step": 38173, "epoch": 459} {"train_loss": -19.03716278076172, "global_step": 38174, "epoch": 459} {"train_loss": -19.241735458374023, "global_step": 38175, "epoch": 459} {"train_loss": -19.193960189819336, "global_step": 38176, "epoch": 459} {"train_loss": -19.285871505737305, "global_step": 38177, "epoch": 459} {"train_loss": -19.5874080657959, "global_step": 38178, "epoch": 459} {"train_loss": -19.338926016566266, "global_step": 38179, "epoch": 459, "val_loss": 5938128.0} {"train_loss": -18.504478454589844, "global_step": 38180, "epoch": 460} {"train_loss": -19.25957679748535, "global_step": 38181, "epoch": 460} {"train_loss": -19.12548828125, "global_step": 38182, "epoch": 460} {"train_loss": -19.53304100036621, "global_step": 38183, "epoch": 460} {"train_loss": -19.245515823364258, "global_step": 38184, "epoch": 460} {"train_loss": -19.063688278198242, "global_step": 38185, "epoch": 460} {"train_loss": -19.50299644470215, "global_step": 38186, "epoch": 460} {"train_loss": -19.25988006591797, "global_step": 38187, "epoch": 460} {"train_loss": -19.175540924072266, "global_step": 38188, "epoch": 460} {"train_loss": -19.380958557128906, "global_step": 38189, "epoch": 460} {"train_loss": -19.3730525970459, "global_step": 38190, "epoch": 460} {"train_loss": -19.277179718017578, "global_step": 38191, "epoch": 460} {"train_loss": -19.070417404174805, "global_step": 38192, "epoch": 460} {"train_loss": -19.314176559448242, "global_step": 38193, "epoch": 460} {"train_loss": -19.339359283447266, "global_step": 38194, "epoch": 460} {"train_loss": -18.860794067382812, "global_step": 38195, "epoch": 460} {"train_loss": -19.334911346435547, "global_step": 38196, "epoch": 460} {"train_loss": -19.244121551513672, "global_step": 38197, "epoch": 460} {"train_loss": -19.45876693725586, "global_step": 38198, "epoch": 460} {"train_loss": -19.63494110107422, "global_step": 38199, "epoch": 460} {"train_loss": -19.529333114624023, "global_step": 38200, "epoch": 460} {"train_loss": -19.384069442749023, "global_step": 38201, "epoch": 460} {"train_loss": -19.50113868713379, "global_step": 38202, "epoch": 460} {"train_loss": -19.53387451171875, "global_step": 38203, "epoch": 460} {"train_loss": -19.713056564331055, "global_step": 38204, "epoch": 460} {"train_loss": -19.25741958618164, "global_step": 38205, "epoch": 460} {"train_loss": -19.206388473510742, "global_step": 38206, "epoch": 460} {"train_loss": -19.169448852539062, "global_step": 38207, "epoch": 460} {"train_loss": -19.575254440307617, "global_step": 38208, "epoch": 460} {"train_loss": -19.27163314819336, "global_step": 38209, "epoch": 460} {"train_loss": -18.84316635131836, "global_step": 38210, "epoch": 460} {"train_loss": -19.34528350830078, "global_step": 38211, "epoch": 460} {"train_loss": -19.211477279663086, "global_step": 38212, "epoch": 460} {"train_loss": -19.234914779663086, "global_step": 38213, "epoch": 460} {"train_loss": -19.373254776000977, "global_step": 38214, "epoch": 460} {"train_loss": -19.28018569946289, "global_step": 38215, "epoch": 460} {"train_loss": -19.62040901184082, "global_step": 38216, "epoch": 460} {"train_loss": -19.318876266479492, "global_step": 38217, "epoch": 460} {"train_loss": -19.247594833374023, "global_step": 38218, "epoch": 460} {"train_loss": -19.230100631713867, "global_step": 38219, "epoch": 460} {"train_loss": -19.131494522094727, "global_step": 38220, "epoch": 460} {"train_loss": -19.629796981811523, "global_step": 38221, "epoch": 460} {"train_loss": -19.066892623901367, "global_step": 38222, "epoch": 460} {"train_loss": -19.29742431640625, "global_step": 38223, "epoch": 460} {"train_loss": -19.106863021850586, "global_step": 38224, "epoch": 460} {"train_loss": -19.37600326538086, "global_step": 38225, "epoch": 460} {"train_loss": -19.599294662475586, "global_step": 38226, "epoch": 460} {"train_loss": -19.75847816467285, "global_step": 38227, "epoch": 460} {"train_loss": -19.578649520874023, "global_step": 38228, "epoch": 460} {"train_loss": -19.4746150970459, "global_step": 38229, "epoch": 460} {"train_loss": -19.499326705932617, "global_step": 38230, "epoch": 460} {"train_loss": -19.22045135498047, "global_step": 38231, "epoch": 460} {"train_loss": -19.597681045532227, "global_step": 38232, "epoch": 460} {"train_loss": -19.2125186920166, "global_step": 38233, "epoch": 460} {"train_loss": -19.640647888183594, "global_step": 38234, "epoch": 460} {"train_loss": -19.218297958374023, "global_step": 38235, "epoch": 460} {"train_loss": -19.445966720581055, "global_step": 38236, "epoch": 460} {"train_loss": -19.30817985534668, "global_step": 38237, "epoch": 460} {"train_loss": -19.382823944091797, "global_step": 38238, "epoch": 460} {"train_loss": -19.297758102416992, "global_step": 38239, "epoch": 460} {"train_loss": -19.413301467895508, "global_step": 38240, "epoch": 460} {"train_loss": -19.694704055786133, "global_step": 38241, "epoch": 460} {"train_loss": -19.697019577026367, "global_step": 38242, "epoch": 460} {"train_loss": -19.454496383666992, "global_step": 38243, "epoch": 460} {"train_loss": -19.25167465209961, "global_step": 38244, "epoch": 460} {"train_loss": -19.339366912841797, "global_step": 38245, "epoch": 460} {"train_loss": -19.12771987915039, "global_step": 38246, "epoch": 460} {"train_loss": -19.59095573425293, "global_step": 38247, "epoch": 460} {"train_loss": -19.332788467407227, "global_step": 38248, "epoch": 460} {"train_loss": -19.438032150268555, "global_step": 38249, "epoch": 460} {"train_loss": -19.09163475036621, "global_step": 38250, "epoch": 460} {"train_loss": -19.380582809448242, "global_step": 38251, "epoch": 460} {"train_loss": -19.588104248046875, "global_step": 38252, "epoch": 460} {"train_loss": -19.628812789916992, "global_step": 38253, "epoch": 460} {"train_loss": -19.197568893432617, "global_step": 38254, "epoch": 460} {"train_loss": -19.692514419555664, "global_step": 38255, "epoch": 460} {"train_loss": -19.186986923217773, "global_step": 38256, "epoch": 460} {"train_loss": -19.326932907104492, "global_step": 38257, "epoch": 460} {"train_loss": -19.22093391418457, "global_step": 38258, "epoch": 460} {"train_loss": -19.3625545501709, "global_step": 38259, "epoch": 460} {"train_loss": -19.36712074279785, "global_step": 38260, "epoch": 460} {"train_loss": -19.435466766357422, "global_step": 38261, "epoch": 460} {"train_loss": -19.357186466814525, "global_step": 38262, "epoch": 460, "val_loss": 5931019.0} {"train_loss": -18.82366943359375, "global_step": 38263, "epoch": 461} {"train_loss": -19.499235153198242, "global_step": 38264, "epoch": 461} {"train_loss": -19.28203773498535, "global_step": 38265, "epoch": 461} {"train_loss": -19.122053146362305, "global_step": 38266, "epoch": 461} {"train_loss": -19.20747184753418, "global_step": 38267, "epoch": 461} {"train_loss": -19.140857696533203, "global_step": 38268, "epoch": 461} {"train_loss": -18.457395553588867, "global_step": 38269, "epoch": 461} {"train_loss": -19.023303985595703, "global_step": 38270, "epoch": 461} {"train_loss": -19.348459243774414, "global_step": 38271, "epoch": 461} {"train_loss": -18.825061798095703, "global_step": 38272, "epoch": 461} {"train_loss": -19.219043731689453, "global_step": 38273, "epoch": 461} {"train_loss": -19.39644432067871, "global_step": 38274, "epoch": 461} {"train_loss": -18.9589900970459, "global_step": 38275, "epoch": 461} {"train_loss": -19.6037654876709, "global_step": 38276, "epoch": 461} {"train_loss": -19.096426010131836, "global_step": 38277, "epoch": 461} {"train_loss": -19.192228317260742, "global_step": 38278, "epoch": 461} {"train_loss": -19.416025161743164, "global_step": 38279, "epoch": 461} {"train_loss": -19.194677352905273, "global_step": 38280, "epoch": 461} {"train_loss": -19.559051513671875, "global_step": 38281, "epoch": 461} {"train_loss": -19.35624885559082, "global_step": 38282, "epoch": 461} {"train_loss": -19.622772216796875, "global_step": 38283, "epoch": 461} {"train_loss": -19.059423446655273, "global_step": 38284, "epoch": 461} {"train_loss": -19.392566680908203, "global_step": 38285, "epoch": 461} {"train_loss": -19.414793014526367, "global_step": 38286, "epoch": 461} {"train_loss": -19.183677673339844, "global_step": 38287, "epoch": 461} {"train_loss": -19.258649826049805, "global_step": 38288, "epoch": 461} {"train_loss": -19.36829948425293, "global_step": 38289, "epoch": 461} {"train_loss": -19.357942581176758, "global_step": 38290, "epoch": 461} {"train_loss": -19.36146354675293, "global_step": 38291, "epoch": 461} {"train_loss": -19.847341537475586, "global_step": 38292, "epoch": 461} {"train_loss": -19.443180084228516, "global_step": 38293, "epoch": 461} {"train_loss": -19.66136932373047, "global_step": 38294, "epoch": 461} {"train_loss": -19.219472885131836, "global_step": 38295, "epoch": 461} {"train_loss": -19.02814292907715, "global_step": 38296, "epoch": 461} {"train_loss": -19.498315811157227, "global_step": 38297, "epoch": 461} {"train_loss": -19.318492889404297, "global_step": 38298, "epoch": 461} {"train_loss": -19.08654022216797, "global_step": 38299, "epoch": 461} {"train_loss": -19.353118896484375, "global_step": 38300, "epoch": 461} {"train_loss": -19.053335189819336, "global_step": 38301, "epoch": 461} {"train_loss": -19.435182571411133, "global_step": 38302, "epoch": 461} {"train_loss": -19.525373458862305, "global_step": 38303, "epoch": 461} {"train_loss": -19.145599365234375, "global_step": 38304, "epoch": 461} {"train_loss": -19.522050857543945, "global_step": 38305, "epoch": 461} {"train_loss": -19.753084182739258, "global_step": 38306, "epoch": 461} {"train_loss": -19.09013557434082, "global_step": 38307, "epoch": 461} {"train_loss": -19.30049705505371, "global_step": 38308, "epoch": 461} {"train_loss": -19.1479434967041, "global_step": 38309, "epoch": 461} {"train_loss": -19.385263442993164, "global_step": 38310, "epoch": 461} {"train_loss": -19.26262664794922, "global_step": 38311, "epoch": 461} {"train_loss": -19.373092651367188, "global_step": 38312, "epoch": 461} {"train_loss": -19.139129638671875, "global_step": 38313, "epoch": 461} {"train_loss": -18.955053329467773, "global_step": 38314, "epoch": 461} {"train_loss": -19.489194869995117, "global_step": 38315, "epoch": 461} {"train_loss": -18.88867950439453, "global_step": 38316, "epoch": 461} {"train_loss": -19.446945190429688, "global_step": 38317, "epoch": 461} {"train_loss": -19.22697639465332, "global_step": 38318, "epoch": 461} {"train_loss": -19.357223510742188, "global_step": 38319, "epoch": 461} {"train_loss": -19.157835006713867, "global_step": 38320, "epoch": 461} {"train_loss": -18.98990249633789, "global_step": 38321, "epoch": 461} {"train_loss": -19.022661209106445, "global_step": 38322, "epoch": 461} {"train_loss": -19.062175750732422, "global_step": 38323, "epoch": 461} {"train_loss": -19.140043258666992, "global_step": 38324, "epoch": 461} {"train_loss": -19.742399215698242, "global_step": 38325, "epoch": 461} {"train_loss": -19.491641998291016, "global_step": 38326, "epoch": 461} {"train_loss": -19.320444107055664, "global_step": 38327, "epoch": 461} {"train_loss": -19.3198299407959, "global_step": 38328, "epoch": 461} {"train_loss": -19.571760177612305, "global_step": 38329, "epoch": 461} {"train_loss": -19.602935791015625, "global_step": 38330, "epoch": 461} {"train_loss": -19.233983993530273, "global_step": 38331, "epoch": 461} {"train_loss": -19.72419548034668, "global_step": 38332, "epoch": 461} {"train_loss": -18.960952758789062, "global_step": 38333, "epoch": 461} {"train_loss": -19.54826545715332, "global_step": 38334, "epoch": 461} {"train_loss": -19.536951065063477, "global_step": 38335, "epoch": 461} {"train_loss": -19.609481811523438, "global_step": 38336, "epoch": 461} {"train_loss": -19.547117233276367, "global_step": 38337, "epoch": 461} {"train_loss": -19.51764488220215, "global_step": 38338, "epoch": 461} {"train_loss": -19.299360275268555, "global_step": 38339, "epoch": 461} {"train_loss": -19.66779136657715, "global_step": 38340, "epoch": 461} {"train_loss": -19.55606460571289, "global_step": 38341, "epoch": 461} {"train_loss": -19.4040584564209, "global_step": 38342, "epoch": 461} {"train_loss": -19.124454498291016, "global_step": 38343, "epoch": 461} {"train_loss": -19.22332191467285, "global_step": 38344, "epoch": 461} {"train_loss": -19.30627733253571, "global_step": 38345, "epoch": 461, "val_loss": 6014900.0} {"train_loss": -18.929128646850586, "global_step": 38346, "epoch": 462} {"train_loss": -18.863554000854492, "global_step": 38347, "epoch": 462} {"train_loss": -19.07044792175293, "global_step": 38348, "epoch": 462} {"train_loss": -18.930255889892578, "global_step": 38349, "epoch": 462} {"train_loss": -19.38673210144043, "global_step": 38350, "epoch": 462} {"train_loss": -19.0407657623291, "global_step": 38351, "epoch": 462} {"train_loss": -19.093130111694336, "global_step": 38352, "epoch": 462} {"train_loss": -19.23932456970215, "global_step": 38353, "epoch": 462} {"train_loss": -19.233402252197266, "global_step": 38354, "epoch": 462} {"train_loss": -19.09807014465332, "global_step": 38355, "epoch": 462} {"train_loss": -19.508813858032227, "global_step": 38356, "epoch": 462} {"train_loss": -19.259536743164062, "global_step": 38357, "epoch": 462} {"train_loss": -19.48993492126465, "global_step": 38358, "epoch": 462} {"train_loss": -19.312164306640625, "global_step": 38359, "epoch": 462} {"train_loss": -19.130695343017578, "global_step": 38360, "epoch": 462} {"train_loss": -19.271347045898438, "global_step": 38361, "epoch": 462} {"train_loss": -19.262042999267578, "global_step": 38362, "epoch": 462} {"train_loss": -19.443981170654297, "global_step": 38363, "epoch": 462} {"train_loss": -19.588653564453125, "global_step": 38364, "epoch": 462} {"train_loss": -19.27049446105957, "global_step": 38365, "epoch": 462} {"train_loss": -18.932191848754883, "global_step": 38366, "epoch": 462} {"train_loss": -19.214847564697266, "global_step": 38367, "epoch": 462} {"train_loss": -19.06633949279785, "global_step": 38368, "epoch": 462} {"train_loss": -19.51570701599121, "global_step": 38369, "epoch": 462} {"train_loss": -19.454151153564453, "global_step": 38370, "epoch": 462} {"train_loss": -19.319128036499023, "global_step": 38371, "epoch": 462} {"train_loss": -19.08315086364746, "global_step": 38372, "epoch": 462} {"train_loss": -19.328659057617188, "global_step": 38373, "epoch": 462} {"train_loss": -19.28611946105957, "global_step": 38374, "epoch": 462} {"train_loss": -19.537683486938477, "global_step": 38375, "epoch": 462} {"train_loss": -19.10494041442871, "global_step": 38376, "epoch": 462} {"train_loss": -19.38596534729004, "global_step": 38377, "epoch": 462} {"train_loss": -19.36812400817871, "global_step": 38378, "epoch": 462} {"train_loss": -19.377391815185547, "global_step": 38379, "epoch": 462} {"train_loss": -19.51666831970215, "global_step": 38380, "epoch": 462} {"train_loss": -19.347064971923828, "global_step": 38381, "epoch": 462} {"train_loss": -19.486600875854492, "global_step": 38382, "epoch": 462} {"train_loss": -19.398225784301758, "global_step": 38383, "epoch": 462} {"train_loss": -19.642141342163086, "global_step": 38384, "epoch": 462} {"train_loss": -19.247085571289062, "global_step": 38385, "epoch": 462} {"train_loss": -19.71409034729004, "global_step": 38386, "epoch": 462} {"train_loss": -19.563953399658203, "global_step": 38387, "epoch": 462} {"train_loss": -19.371068954467773, "global_step": 38388, "epoch": 462} {"train_loss": -19.26590347290039, "global_step": 38389, "epoch": 462} {"train_loss": -19.791635513305664, "global_step": 38390, "epoch": 462} {"train_loss": -19.439165115356445, "global_step": 38391, "epoch": 462} {"train_loss": -19.2008113861084, "global_step": 38392, "epoch": 462} {"train_loss": -19.366178512573242, "global_step": 38393, "epoch": 462} {"train_loss": -19.17214012145996, "global_step": 38394, "epoch": 462} {"train_loss": -19.073699951171875, "global_step": 38395, "epoch": 462} {"train_loss": -19.409971237182617, "global_step": 38396, "epoch": 462} {"train_loss": -19.350671768188477, "global_step": 38397, "epoch": 462} {"train_loss": -19.97907066345215, "global_step": 38398, "epoch": 462} {"train_loss": -19.224668502807617, "global_step": 38399, "epoch": 462} {"train_loss": -19.80634117126465, "global_step": 38400, "epoch": 462} {"train_loss": -18.874156951904297, "global_step": 38401, "epoch": 462} {"train_loss": -19.310380935668945, "global_step": 38402, "epoch": 462} {"train_loss": -19.362760543823242, "global_step": 38403, "epoch": 462} {"train_loss": -19.17951774597168, "global_step": 38404, "epoch": 462} {"train_loss": -19.75547218322754, "global_step": 38405, "epoch": 462} {"train_loss": -19.023426055908203, "global_step": 38406, "epoch": 462} {"train_loss": -19.297290802001953, "global_step": 38407, "epoch": 462} {"train_loss": -19.453046798706055, "global_step": 38408, "epoch": 462} {"train_loss": -19.455175399780273, "global_step": 38409, "epoch": 462} {"train_loss": -19.253385543823242, "global_step": 38410, "epoch": 462} {"train_loss": -19.349462509155273, "global_step": 38411, "epoch": 462} {"train_loss": -19.077320098876953, "global_step": 38412, "epoch": 462} {"train_loss": -19.498287200927734, "global_step": 38413, "epoch": 462} {"train_loss": -19.767831802368164, "global_step": 38414, "epoch": 462} {"train_loss": -19.427549362182617, "global_step": 38415, "epoch": 462} {"train_loss": -19.40578269958496, "global_step": 38416, "epoch": 462} {"train_loss": -19.650632858276367, "global_step": 38417, "epoch": 462} {"train_loss": -19.17793083190918, "global_step": 38418, "epoch": 462} {"train_loss": -19.729856491088867, "global_step": 38419, "epoch": 462} {"train_loss": -19.377965927124023, "global_step": 38420, "epoch": 462} {"train_loss": -19.46326446533203, "global_step": 38421, "epoch": 462} {"train_loss": -19.22499656677246, "global_step": 38422, "epoch": 462} {"train_loss": -19.50315284729004, "global_step": 38423, "epoch": 462} {"train_loss": -19.045217514038086, "global_step": 38424, "epoch": 462} {"train_loss": -19.405887603759766, "global_step": 38425, "epoch": 462} {"train_loss": -19.412025451660156, "global_step": 38426, "epoch": 462} {"train_loss": -19.60007095336914, "global_step": 38427, "epoch": 462} {"train_loss": -19.338718506227057, "global_step": 38428, "epoch": 462, "val_loss": 5921426.5} {"train_loss": -19.21085548400879, "global_step": 38429, "epoch": 463} {"train_loss": -18.95795249938965, "global_step": 38430, "epoch": 463} {"train_loss": -19.295761108398438, "global_step": 38431, "epoch": 463} {"train_loss": -18.653732299804688, "global_step": 38432, "epoch": 463} {"train_loss": -19.052839279174805, "global_step": 38433, "epoch": 463} {"train_loss": -19.05028533935547, "global_step": 38434, "epoch": 463} {"train_loss": -19.366209030151367, "global_step": 38435, "epoch": 463} {"train_loss": -19.4251651763916, "global_step": 38436, "epoch": 463} {"train_loss": -19.109071731567383, "global_step": 38437, "epoch": 463} {"train_loss": -18.60015296936035, "global_step": 38438, "epoch": 463} {"train_loss": -19.3746280670166, "global_step": 38439, "epoch": 463} {"train_loss": -19.2741756439209, "global_step": 38440, "epoch": 463} {"train_loss": -19.467300415039062, "global_step": 38441, "epoch": 463} {"train_loss": -19.360576629638672, "global_step": 38442, "epoch": 463} {"train_loss": -19.126035690307617, "global_step": 38443, "epoch": 463} {"train_loss": -19.547056198120117, "global_step": 38444, "epoch": 463} {"train_loss": -19.44759178161621, "global_step": 38445, "epoch": 463} {"train_loss": -19.26003646850586, "global_step": 38446, "epoch": 463} {"train_loss": -19.31377410888672, "global_step": 38447, "epoch": 463} {"train_loss": -19.418067932128906, "global_step": 38448, "epoch": 463} {"train_loss": -19.276004791259766, "global_step": 38449, "epoch": 463} {"train_loss": -19.492416381835938, "global_step": 38450, "epoch": 463} {"train_loss": -19.4295654296875, "global_step": 38451, "epoch": 463} {"train_loss": -19.36118507385254, "global_step": 38452, "epoch": 463} {"train_loss": -19.640167236328125, "global_step": 38453, "epoch": 463} {"train_loss": -19.521137237548828, "global_step": 38454, "epoch": 463} {"train_loss": -19.621442794799805, "global_step": 38455, "epoch": 463} {"train_loss": -19.160490036010742, "global_step": 38456, "epoch": 463} {"train_loss": -19.13599395751953, "global_step": 38457, "epoch": 463} {"train_loss": -19.222715377807617, "global_step": 38458, "epoch": 463} {"train_loss": -18.83786964416504, "global_step": 38459, "epoch": 463} {"train_loss": -19.0128231048584, "global_step": 38460, "epoch": 463} {"train_loss": -19.138288497924805, "global_step": 38461, "epoch": 463} {"train_loss": -19.75206756591797, "global_step": 38462, "epoch": 463} {"train_loss": -19.39301872253418, "global_step": 38463, "epoch": 463} {"train_loss": -19.526988983154297, "global_step": 38464, "epoch": 463} {"train_loss": -19.755727767944336, "global_step": 38465, "epoch": 463} {"train_loss": -19.203664779663086, "global_step": 38466, "epoch": 463} {"train_loss": -19.203630447387695, "global_step": 38467, "epoch": 463} {"train_loss": -19.030866622924805, "global_step": 38468, "epoch": 463} {"train_loss": -19.3659610748291, "global_step": 38469, "epoch": 463} {"train_loss": -19.740827560424805, "global_step": 38470, "epoch": 463} {"train_loss": -19.508459091186523, "global_step": 38471, "epoch": 463} {"train_loss": -19.315765380859375, "global_step": 38472, "epoch": 463} {"train_loss": -19.432310104370117, "global_step": 38473, "epoch": 463} {"train_loss": -19.46302604675293, "global_step": 38474, "epoch": 463} {"train_loss": -19.397512435913086, "global_step": 38475, "epoch": 463} {"train_loss": -18.8353214263916, "global_step": 38476, "epoch": 463} {"train_loss": -19.33297348022461, "global_step": 38477, "epoch": 463} {"train_loss": -19.348539352416992, "global_step": 38478, "epoch": 463} {"train_loss": -19.28439712524414, "global_step": 38479, "epoch": 463} {"train_loss": -19.867223739624023, "global_step": 38480, "epoch": 463} {"train_loss": -19.636377334594727, "global_step": 38481, "epoch": 463} {"train_loss": -18.748458862304688, "global_step": 38482, "epoch": 463} {"train_loss": -19.12117576599121, "global_step": 38483, "epoch": 463} {"train_loss": -19.310476303100586, "global_step": 38484, "epoch": 463} {"train_loss": -19.078908920288086, "global_step": 38485, "epoch": 463} {"train_loss": -19.88421058654785, "global_step": 38486, "epoch": 463} {"train_loss": -19.38088035583496, "global_step": 38487, "epoch": 463} {"train_loss": -19.428800582885742, "global_step": 38488, "epoch": 463} {"train_loss": -19.391521453857422, "global_step": 38489, "epoch": 463} {"train_loss": -19.10890007019043, "global_step": 38490, "epoch": 463} {"train_loss": -19.508466720581055, "global_step": 38491, "epoch": 463} {"train_loss": -19.298358917236328, "global_step": 38492, "epoch": 463} {"train_loss": -19.406888961791992, "global_step": 38493, "epoch": 463} {"train_loss": -19.531455993652344, "global_step": 38494, "epoch": 463} {"train_loss": -19.09220314025879, "global_step": 38495, "epoch": 463} {"train_loss": -19.596643447875977, "global_step": 38496, "epoch": 463} {"train_loss": -19.4908504486084, "global_step": 38497, "epoch": 463} {"train_loss": -19.252479553222656, "global_step": 38498, "epoch": 463} {"train_loss": -19.284528732299805, "global_step": 38499, "epoch": 463} {"train_loss": -19.576509475708008, "global_step": 38500, "epoch": 463} {"train_loss": -19.48468589782715, "global_step": 38501, "epoch": 463} {"train_loss": -19.33332633972168, "global_step": 38502, "epoch": 463} {"train_loss": -19.402700424194336, "global_step": 38503, "epoch": 463} {"train_loss": -19.771514892578125, "global_step": 38504, "epoch": 463} {"train_loss": -19.368139266967773, "global_step": 38505, "epoch": 463} {"train_loss": -19.216222763061523, "global_step": 38506, "epoch": 463} {"train_loss": -19.348464965820312, "global_step": 38507, "epoch": 463} {"train_loss": -19.52644920349121, "global_step": 38508, "epoch": 463} {"train_loss": -19.311885833740234, "global_step": 38509, "epoch": 463} {"train_loss": -19.34990882873535, "global_step": 38510, "epoch": 463} {"train_loss": -19.32141216691718, "global_step": 38511, "epoch": 463, "val_loss": 6106422.5} {"train_loss": -19.175201416015625, "global_step": 38512, "epoch": 464} {"train_loss": -19.047574996948242, "global_step": 38513, "epoch": 464} {"train_loss": -19.415424346923828, "global_step": 38514, "epoch": 464} {"train_loss": -19.11215591430664, "global_step": 38515, "epoch": 464} {"train_loss": -18.84429931640625, "global_step": 38516, "epoch": 464} {"train_loss": -18.896459579467773, "global_step": 38517, "epoch": 464} {"train_loss": -19.254837036132812, "global_step": 38518, "epoch": 464} {"train_loss": -19.36933708190918, "global_step": 38519, "epoch": 464} {"train_loss": -19.329500198364258, "global_step": 38520, "epoch": 464} {"train_loss": -19.59579849243164, "global_step": 38521, "epoch": 464} {"train_loss": -18.97932243347168, "global_step": 38522, "epoch": 464} {"train_loss": -19.338134765625, "global_step": 38523, "epoch": 464} {"train_loss": -19.24262237548828, "global_step": 38524, "epoch": 464} {"train_loss": -19.135425567626953, "global_step": 38525, "epoch": 464} {"train_loss": -19.713224411010742, "global_step": 38526, "epoch": 464} {"train_loss": -19.353580474853516, "global_step": 38527, "epoch": 464} {"train_loss": -19.08418083190918, "global_step": 38528, "epoch": 464} {"train_loss": -19.28359031677246, "global_step": 38529, "epoch": 464} {"train_loss": -19.197904586791992, "global_step": 38530, "epoch": 464} {"train_loss": -19.400070190429688, "global_step": 38531, "epoch": 464} {"train_loss": -19.642196655273438, "global_step": 38532, "epoch": 464} {"train_loss": -19.1584529876709, "global_step": 38533, "epoch": 464} {"train_loss": -19.405033111572266, "global_step": 38534, "epoch": 464} {"train_loss": -19.603103637695312, "global_step": 38535, "epoch": 464} {"train_loss": -19.230783462524414, "global_step": 38536, "epoch": 464} {"train_loss": -19.37160301208496, "global_step": 38537, "epoch": 464} {"train_loss": -19.46329116821289, "global_step": 38538, "epoch": 464} {"train_loss": -19.35928726196289, "global_step": 38539, "epoch": 464} {"train_loss": -19.342546463012695, "global_step": 38540, "epoch": 464} {"train_loss": -19.26051139831543, "global_step": 38541, "epoch": 464} {"train_loss": -19.633514404296875, "global_step": 38542, "epoch": 464} {"train_loss": -19.52394676208496, "global_step": 38543, "epoch": 464} {"train_loss": -19.512968063354492, "global_step": 38544, "epoch": 464} {"train_loss": -19.497745513916016, "global_step": 38545, "epoch": 464} {"train_loss": -19.739500045776367, "global_step": 38546, "epoch": 464} {"train_loss": -19.24794578552246, "global_step": 38547, "epoch": 464} {"train_loss": -19.13797378540039, "global_step": 38548, "epoch": 464} {"train_loss": -19.223674774169922, "global_step": 38549, "epoch": 464} {"train_loss": -18.953222274780273, "global_step": 38550, "epoch": 464} {"train_loss": -19.507293701171875, "global_step": 38551, "epoch": 464} {"train_loss": -19.763513565063477, "global_step": 38552, "epoch": 464} {"train_loss": -19.18556785583496, "global_step": 38553, "epoch": 464} {"train_loss": -19.19516372680664, "global_step": 38554, "epoch": 464} {"train_loss": -19.33579444885254, "global_step": 38555, "epoch": 464} {"train_loss": -19.524812698364258, "global_step": 38556, "epoch": 464} {"train_loss": -19.10306167602539, "global_step": 38557, "epoch": 464} {"train_loss": -19.34762954711914, "global_step": 38558, "epoch": 464} {"train_loss": -19.54547691345215, "global_step": 38559, "epoch": 464} {"train_loss": -19.15718650817871, "global_step": 38560, "epoch": 464} {"train_loss": -19.50004768371582, "global_step": 38561, "epoch": 464} {"train_loss": -19.792394638061523, "global_step": 38562, "epoch": 464} {"train_loss": -19.147863388061523, "global_step": 38563, "epoch": 464} {"train_loss": -19.323833465576172, "global_step": 38564, "epoch": 464} {"train_loss": -19.342222213745117, "global_step": 38565, "epoch": 464} {"train_loss": -19.566259384155273, "global_step": 38566, "epoch": 464} {"train_loss": -19.152379989624023, "global_step": 38567, "epoch": 464} {"train_loss": -19.38142967224121, "global_step": 38568, "epoch": 464} {"train_loss": -19.356233596801758, "global_step": 38569, "epoch": 464} {"train_loss": -19.174421310424805, "global_step": 38570, "epoch": 464} {"train_loss": -19.280868530273438, "global_step": 38571, "epoch": 464} {"train_loss": -19.334049224853516, "global_step": 38572, "epoch": 464} {"train_loss": -19.73322105407715, "global_step": 38573, "epoch": 464} {"train_loss": -19.945337295532227, "global_step": 38574, "epoch": 464} {"train_loss": -19.316293716430664, "global_step": 38575, "epoch": 464} {"train_loss": -19.25433349609375, "global_step": 38576, "epoch": 464} {"train_loss": -19.276744842529297, "global_step": 38577, "epoch": 464} {"train_loss": -19.276233673095703, "global_step": 38578, "epoch": 464} {"train_loss": -19.363018035888672, "global_step": 38579, "epoch": 464} {"train_loss": -19.071308135986328, "global_step": 38580, "epoch": 464} {"train_loss": -19.662099838256836, "global_step": 38581, "epoch": 464} {"train_loss": -19.28350257873535, "global_step": 38582, "epoch": 464} {"train_loss": -19.005277633666992, "global_step": 38583, "epoch": 464} {"train_loss": -19.408594131469727, "global_step": 38584, "epoch": 464} {"train_loss": -19.448984146118164, "global_step": 38585, "epoch": 464} {"train_loss": -19.413333892822266, "global_step": 38586, "epoch": 464} {"train_loss": -19.45018768310547, "global_step": 38587, "epoch": 464} {"train_loss": -19.220373153686523, "global_step": 38588, "epoch": 464} {"train_loss": -18.927509307861328, "global_step": 38589, "epoch": 464} {"train_loss": -19.39340591430664, "global_step": 38590, "epoch": 464} {"train_loss": -19.561803817749023, "global_step": 38591, "epoch": 464} {"train_loss": -19.836965560913086, "global_step": 38592, "epoch": 464} {"train_loss": -19.402116775512695, "global_step": 38593, "epoch": 464} {"train_loss": -19.333804624626435, "global_step": 38594, "epoch": 464, "val_loss": 6038864.0} {"train_loss": -18.854293823242188, "global_step": 38595, "epoch": 465} {"train_loss": -19.11936378479004, "global_step": 38596, "epoch": 465} {"train_loss": -19.31852149963379, "global_step": 38597, "epoch": 465} {"train_loss": -19.012218475341797, "global_step": 38598, "epoch": 465} {"train_loss": -19.425703048706055, "global_step": 38599, "epoch": 465} {"train_loss": -19.148588180541992, "global_step": 38600, "epoch": 465} {"train_loss": -19.46344566345215, "global_step": 38601, "epoch": 465} {"train_loss": -19.352935791015625, "global_step": 38602, "epoch": 465} {"train_loss": -19.54969596862793, "global_step": 38603, "epoch": 465} {"train_loss": -18.81412696838379, "global_step": 38604, "epoch": 465} {"train_loss": -19.360000610351562, "global_step": 38605, "epoch": 465} {"train_loss": -19.246440887451172, "global_step": 38606, "epoch": 465} {"train_loss": -19.364028930664062, "global_step": 38607, "epoch": 465} {"train_loss": -19.247461318969727, "global_step": 38608, "epoch": 465} {"train_loss": -19.034212112426758, "global_step": 38609, "epoch": 465} {"train_loss": -19.322086334228516, "global_step": 38610, "epoch": 465} {"train_loss": -19.209829330444336, "global_step": 38611, "epoch": 465} {"train_loss": -19.190998077392578, "global_step": 38612, "epoch": 465} {"train_loss": -19.413259506225586, "global_step": 38613, "epoch": 465} {"train_loss": -19.409133911132812, "global_step": 38614, "epoch": 465} {"train_loss": -19.504486083984375, "global_step": 38615, "epoch": 465} {"train_loss": -19.38225746154785, "global_step": 38616, "epoch": 465} {"train_loss": -19.68691635131836, "global_step": 38617, "epoch": 465} {"train_loss": -19.12651252746582, "global_step": 38618, "epoch": 465} {"train_loss": -19.086698532104492, "global_step": 38619, "epoch": 465} {"train_loss": -19.6068115234375, "global_step": 38620, "epoch": 465} {"train_loss": -19.20610237121582, "global_step": 38621, "epoch": 465} {"train_loss": -19.294851303100586, "global_step": 38622, "epoch": 465} {"train_loss": -18.94549560546875, "global_step": 38623, "epoch": 465} {"train_loss": -19.206729888916016, "global_step": 38624, "epoch": 465} {"train_loss": -19.321565628051758, "global_step": 38625, "epoch": 465} {"train_loss": -19.580472946166992, "global_step": 38626, "epoch": 465} {"train_loss": -19.656082153320312, "global_step": 38627, "epoch": 465} {"train_loss": -19.219812393188477, "global_step": 38628, "epoch": 465} {"train_loss": -19.638635635375977, "global_step": 38629, "epoch": 465} {"train_loss": -19.49215316772461, "global_step": 38630, "epoch": 465} {"train_loss": -19.21839714050293, "global_step": 38631, "epoch": 465} {"train_loss": -19.2752742767334, "global_step": 38632, "epoch": 465} {"train_loss": -19.43994140625, "global_step": 38633, "epoch": 465} {"train_loss": -19.810636520385742, "global_step": 38634, "epoch": 465} {"train_loss": -19.150129318237305, "global_step": 38635, "epoch": 465} {"train_loss": -19.246816635131836, "global_step": 38636, "epoch": 465} {"train_loss": -19.270841598510742, "global_step": 38637, "epoch": 465} {"train_loss": -19.760700225830078, "global_step": 38638, "epoch": 465} {"train_loss": -19.336334228515625, "global_step": 38639, "epoch": 465} {"train_loss": -19.543212890625, "global_step": 38640, "epoch": 465} {"train_loss": -19.428089141845703, "global_step": 38641, "epoch": 465} {"train_loss": -19.446884155273438, "global_step": 38642, "epoch": 465} {"train_loss": -19.266376495361328, "global_step": 38643, "epoch": 465} {"train_loss": -18.948551177978516, "global_step": 38644, "epoch": 465} {"train_loss": -19.701692581176758, "global_step": 38645, "epoch": 465} {"train_loss": -19.468393325805664, "global_step": 38646, "epoch": 465} {"train_loss": -19.4409122467041, "global_step": 38647, "epoch": 465} {"train_loss": -18.876874923706055, "global_step": 38648, "epoch": 465} {"train_loss": -19.36808204650879, "global_step": 38649, "epoch": 465} {"train_loss": -19.37421226501465, "global_step": 38650, "epoch": 465} {"train_loss": -19.356935501098633, "global_step": 38651, "epoch": 465} {"train_loss": -19.52374839782715, "global_step": 38652, "epoch": 465} {"train_loss": -19.4310302734375, "global_step": 38653, "epoch": 465} {"train_loss": -19.203676223754883, "global_step": 38654, "epoch": 465} {"train_loss": -19.39322280883789, "global_step": 38655, "epoch": 465} {"train_loss": -19.5452938079834, "global_step": 38656, "epoch": 465} {"train_loss": -19.021297454833984, "global_step": 38657, "epoch": 465} {"train_loss": -19.59786033630371, "global_step": 38658, "epoch": 465} {"train_loss": -19.176164627075195, "global_step": 38659, "epoch": 465} {"train_loss": -19.193103790283203, "global_step": 38660, "epoch": 465} {"train_loss": -19.783435821533203, "global_step": 38661, "epoch": 465} {"train_loss": -19.481857299804688, "global_step": 38662, "epoch": 465} {"train_loss": -19.523517608642578, "global_step": 38663, "epoch": 465} {"train_loss": -19.24079704284668, "global_step": 38664, "epoch": 465} {"train_loss": -19.277469635009766, "global_step": 38665, "epoch": 465} {"train_loss": -19.692747116088867, "global_step": 38666, "epoch": 465} {"train_loss": -19.421979904174805, "global_step": 38667, "epoch": 465} {"train_loss": -19.929645538330078, "global_step": 38668, "epoch": 465} {"train_loss": -19.896299362182617, "global_step": 38669, "epoch": 465} {"train_loss": -19.442277908325195, "global_step": 38670, "epoch": 465} {"train_loss": -19.468862533569336, "global_step": 38671, "epoch": 465} {"train_loss": -19.54085922241211, "global_step": 38672, "epoch": 465} {"train_loss": -19.577442169189453, "global_step": 38673, "epoch": 465} {"train_loss": -19.427677154541016, "global_step": 38674, "epoch": 465} {"train_loss": -19.497121810913086, "global_step": 38675, "epoch": 465} {"train_loss": -19.33180809020996, "global_step": 38676, "epoch": 465} {"train_loss": -19.395644452198443, "global_step": 38677, "epoch": 465, "val_loss": 5976378.0} {"train_loss": -18.956090927124023, "global_step": 38678, "epoch": 466} {"train_loss": -19.426788330078125, "global_step": 38679, "epoch": 466} {"train_loss": -18.98412322998047, "global_step": 38680, "epoch": 466} {"train_loss": -19.435955047607422, "global_step": 38681, "epoch": 466} {"train_loss": -19.108421325683594, "global_step": 38682, "epoch": 466} {"train_loss": -19.177778244018555, "global_step": 38683, "epoch": 466} {"train_loss": -19.127399444580078, "global_step": 38684, "epoch": 466} {"train_loss": -19.236310958862305, "global_step": 38685, "epoch": 466} {"train_loss": -19.40558433532715, "global_step": 38686, "epoch": 466} {"train_loss": -19.25271987915039, "global_step": 38687, "epoch": 466} {"train_loss": -19.42167854309082, "global_step": 38688, "epoch": 466} {"train_loss": -19.39491844177246, "global_step": 38689, "epoch": 466} {"train_loss": -19.415470123291016, "global_step": 38690, "epoch": 466} {"train_loss": -19.12053680419922, "global_step": 38691, "epoch": 466} {"train_loss": -19.255094528198242, "global_step": 38692, "epoch": 466} {"train_loss": -19.364404678344727, "global_step": 38693, "epoch": 466} {"train_loss": -19.727676391601562, "global_step": 38694, "epoch": 466} {"train_loss": -19.395984649658203, "global_step": 38695, "epoch": 466} {"train_loss": -18.995553970336914, "global_step": 38696, "epoch": 466} {"train_loss": -19.34103775024414, "global_step": 38697, "epoch": 466} {"train_loss": -19.17876625061035, "global_step": 38698, "epoch": 466} {"train_loss": -19.10079574584961, "global_step": 38699, "epoch": 466} {"train_loss": -19.223974227905273, "global_step": 38700, "epoch": 466} {"train_loss": -19.10768699645996, "global_step": 38701, "epoch": 466} {"train_loss": -19.343353271484375, "global_step": 38702, "epoch": 466} {"train_loss": -18.92609214782715, "global_step": 38703, "epoch": 466} {"train_loss": -19.019411087036133, "global_step": 38704, "epoch": 466} {"train_loss": -19.61615753173828, "global_step": 38705, "epoch": 466} {"train_loss": -18.92182731628418, "global_step": 38706, "epoch": 466} {"train_loss": -19.55611228942871, "global_step": 38707, "epoch": 466} {"train_loss": -19.259923934936523, "global_step": 38708, "epoch": 466} {"train_loss": -19.412267684936523, "global_step": 38709, "epoch": 466} {"train_loss": -19.334125518798828, "global_step": 38710, "epoch": 466} {"train_loss": -19.266035079956055, "global_step": 38711, "epoch": 466} {"train_loss": -19.30670738220215, "global_step": 38712, "epoch": 466} {"train_loss": -19.464614868164062, "global_step": 38713, "epoch": 466} {"train_loss": -19.492961883544922, "global_step": 38714, "epoch": 466} {"train_loss": -19.31740379333496, "global_step": 38715, "epoch": 466} {"train_loss": -19.61182975769043, "global_step": 38716, "epoch": 466} {"train_loss": -19.52964973449707, "global_step": 38717, "epoch": 466} {"train_loss": -19.396581649780273, "global_step": 38718, "epoch": 466} {"train_loss": -19.120935440063477, "global_step": 38719, "epoch": 466} {"train_loss": -19.29953384399414, "global_step": 38720, "epoch": 466} {"train_loss": -19.76173973083496, "global_step": 38721, "epoch": 466} {"train_loss": -19.458894729614258, "global_step": 38722, "epoch": 466} {"train_loss": -19.41827392578125, "global_step": 38723, "epoch": 466} {"train_loss": -19.73384666442871, "global_step": 38724, "epoch": 466} {"train_loss": -19.763296127319336, "global_step": 38725, "epoch": 466} {"train_loss": -19.2737979888916, "global_step": 38726, "epoch": 466} {"train_loss": -19.180896759033203, "global_step": 38727, "epoch": 466} {"train_loss": -19.71906089782715, "global_step": 38728, "epoch": 466} {"train_loss": -19.833250045776367, "global_step": 38729, "epoch": 466} {"train_loss": -19.5709228515625, "global_step": 38730, "epoch": 466} {"train_loss": -19.18943977355957, "global_step": 38731, "epoch": 466} {"train_loss": -19.347375869750977, "global_step": 38732, "epoch": 466} {"train_loss": -19.512685775756836, "global_step": 38733, "epoch": 466} {"train_loss": -19.253698348999023, "global_step": 38734, "epoch": 466} {"train_loss": -19.351909637451172, "global_step": 38735, "epoch": 466} {"train_loss": -19.26936149597168, "global_step": 38736, "epoch": 466} {"train_loss": -19.169376373291016, "global_step": 38737, "epoch": 466} {"train_loss": -19.2229061126709, "global_step": 38738, "epoch": 466} {"train_loss": -19.25664710998535, "global_step": 38739, "epoch": 466} {"train_loss": -19.186067581176758, "global_step": 38740, "epoch": 466} {"train_loss": -19.449682235717773, "global_step": 38741, "epoch": 466} {"train_loss": -19.60123062133789, "global_step": 38742, "epoch": 466} {"train_loss": -19.596141815185547, "global_step": 38743, "epoch": 466} {"train_loss": -19.442224502563477, "global_step": 38744, "epoch": 466} {"train_loss": -19.524282455444336, "global_step": 38745, "epoch": 466} {"train_loss": -19.800556182861328, "global_step": 38746, "epoch": 466} {"train_loss": -19.27151870727539, "global_step": 38747, "epoch": 466} {"train_loss": -19.486295700073242, "global_step": 38748, "epoch": 466} {"train_loss": -19.33905029296875, "global_step": 38749, "epoch": 466} {"train_loss": -19.22863006591797, "global_step": 38750, "epoch": 466} {"train_loss": -19.64140510559082, "global_step": 38751, "epoch": 466} {"train_loss": -19.31491470336914, "global_step": 38752, "epoch": 466} {"train_loss": -19.545246124267578, "global_step": 38753, "epoch": 466} {"train_loss": -19.41543960571289, "global_step": 38754, "epoch": 466} {"train_loss": -19.194761276245117, "global_step": 38755, "epoch": 466} {"train_loss": -19.632482528686523, "global_step": 38756, "epoch": 466} {"train_loss": -19.501615524291992, "global_step": 38757, "epoch": 466} {"train_loss": -19.167098999023438, "global_step": 38758, "epoch": 466} {"train_loss": -19.354455947875977, "global_step": 38759, "epoch": 466} {"train_loss": -19.365048741719807, "global_step": 38760, "epoch": 466, "val_loss": 6084335.5} {"train_loss": -19.2811279296875, "global_step": 38761, "epoch": 467} {"train_loss": -19.247724533081055, "global_step": 38762, "epoch": 467} {"train_loss": -19.13723373413086, "global_step": 38763, "epoch": 467} {"train_loss": -19.18075942993164, "global_step": 38764, "epoch": 467} {"train_loss": -18.710681915283203, "global_step": 38765, "epoch": 467} {"train_loss": -18.849027633666992, "global_step": 38766, "epoch": 467} {"train_loss": -19.2462215423584, "global_step": 38767, "epoch": 467} {"train_loss": -19.033205032348633, "global_step": 38768, "epoch": 467} {"train_loss": -19.113821029663086, "global_step": 38769, "epoch": 467} {"train_loss": -19.29262924194336, "global_step": 38770, "epoch": 467} {"train_loss": -19.379703521728516, "global_step": 38771, "epoch": 467} {"train_loss": -19.18018913269043, "global_step": 38772, "epoch": 467} {"train_loss": -19.02039909362793, "global_step": 38773, "epoch": 467} {"train_loss": -19.606121063232422, "global_step": 38774, "epoch": 467} {"train_loss": -19.385334014892578, "global_step": 38775, "epoch": 467} {"train_loss": -19.853363037109375, "global_step": 38776, "epoch": 467} {"train_loss": -19.509119033813477, "global_step": 38777, "epoch": 467} {"train_loss": -19.3343505859375, "global_step": 38778, "epoch": 467} {"train_loss": -19.547740936279297, "global_step": 38779, "epoch": 467} {"train_loss": -19.413557052612305, "global_step": 38780, "epoch": 467} {"train_loss": -19.473806381225586, "global_step": 38781, "epoch": 467} {"train_loss": -19.297420501708984, "global_step": 38782, "epoch": 467} {"train_loss": -18.97759437561035, "global_step": 38783, "epoch": 467} {"train_loss": -19.513076782226562, "global_step": 38784, "epoch": 467} {"train_loss": -19.46244239807129, "global_step": 38785, "epoch": 467} {"train_loss": -19.34563636779785, "global_step": 38786, "epoch": 467} {"train_loss": -19.389684677124023, "global_step": 38787, "epoch": 467} {"train_loss": -19.299514770507812, "global_step": 38788, "epoch": 467} {"train_loss": -19.164716720581055, "global_step": 38789, "epoch": 467} {"train_loss": -19.307758331298828, "global_step": 38790, "epoch": 467} {"train_loss": -19.607694625854492, "global_step": 38791, "epoch": 467} {"train_loss": -19.1897029876709, "global_step": 38792, "epoch": 467} {"train_loss": -19.72629165649414, "global_step": 38793, "epoch": 467} {"train_loss": -19.54867935180664, "global_step": 38794, "epoch": 467} {"train_loss": -19.538618087768555, "global_step": 38795, "epoch": 467} {"train_loss": -19.402982711791992, "global_step": 38796, "epoch": 467} {"train_loss": -19.465147018432617, "global_step": 38797, "epoch": 467} {"train_loss": -19.77741813659668, "global_step": 38798, "epoch": 467} {"train_loss": -19.30038833618164, "global_step": 38799, "epoch": 467} {"train_loss": -19.54280662536621, "global_step": 38800, "epoch": 467} {"train_loss": -19.307527542114258, "global_step": 38801, "epoch": 467} {"train_loss": -19.512203216552734, "global_step": 38802, "epoch": 467} {"train_loss": -19.00862693786621, "global_step": 38803, "epoch": 467} {"train_loss": -19.596166610717773, "global_step": 38804, "epoch": 467} {"train_loss": -19.02120018005371, "global_step": 38805, "epoch": 467} {"train_loss": -19.279205322265625, "global_step": 38806, "epoch": 467} {"train_loss": -19.20539665222168, "global_step": 38807, "epoch": 467} {"train_loss": -19.3503360748291, "global_step": 38808, "epoch": 467} {"train_loss": -19.24611473083496, "global_step": 38809, "epoch": 467} {"train_loss": -19.751733779907227, "global_step": 38810, "epoch": 467} {"train_loss": -19.02145767211914, "global_step": 38811, "epoch": 467} {"train_loss": -19.298381805419922, "global_step": 38812, "epoch": 467} {"train_loss": -19.2906551361084, "global_step": 38813, "epoch": 467} {"train_loss": -19.521631240844727, "global_step": 38814, "epoch": 467} {"train_loss": -19.643951416015625, "global_step": 38815, "epoch": 467} {"train_loss": -19.101987838745117, "global_step": 38816, "epoch": 467} {"train_loss": -19.395185470581055, "global_step": 38817, "epoch": 467} {"train_loss": -19.317626953125, "global_step": 38818, "epoch": 467} {"train_loss": -19.3304500579834, "global_step": 38819, "epoch": 467} {"train_loss": -19.175703048706055, "global_step": 38820, "epoch": 467} {"train_loss": -19.182172775268555, "global_step": 38821, "epoch": 467} {"train_loss": -19.267967224121094, "global_step": 38822, "epoch": 467} {"train_loss": -19.37188148498535, "global_step": 38823, "epoch": 467} {"train_loss": -19.489652633666992, "global_step": 38824, "epoch": 467} {"train_loss": -18.917375564575195, "global_step": 38825, "epoch": 467} {"train_loss": -18.8111629486084, "global_step": 38826, "epoch": 467} {"train_loss": -19.532682418823242, "global_step": 38827, "epoch": 467} {"train_loss": -19.469806671142578, "global_step": 38828, "epoch": 467} {"train_loss": -18.958663940429688, "global_step": 38829, "epoch": 467} {"train_loss": -19.23664665222168, "global_step": 38830, "epoch": 467} {"train_loss": -19.433774948120117, "global_step": 38831, "epoch": 467} {"train_loss": -19.49074363708496, "global_step": 38832, "epoch": 467} {"train_loss": -19.5585994720459, "global_step": 38833, "epoch": 467} {"train_loss": -19.5736083984375, "global_step": 38834, "epoch": 467} {"train_loss": -19.529945373535156, "global_step": 38835, "epoch": 467} {"train_loss": -19.176279067993164, "global_step": 38836, "epoch": 467} {"train_loss": -19.537405014038086, "global_step": 38837, "epoch": 467} {"train_loss": -19.080799102783203, "global_step": 38838, "epoch": 467} {"train_loss": -19.370641708374023, "global_step": 38839, "epoch": 467} {"train_loss": -19.19293212890625, "global_step": 38840, "epoch": 467} {"train_loss": -19.48236846923828, "global_step": 38841, "epoch": 467} {"train_loss": -19.513038635253906, "global_step": 38842, "epoch": 467} {"train_loss": -19.355112420507226, "global_step": 38843, "epoch": 467, "val_loss": 6130834.0} {"train_loss": -18.635833740234375, "global_step": 38844, "epoch": 468} {"train_loss": -19.20962142944336, "global_step": 38845, "epoch": 468} {"train_loss": -19.101877212524414, "global_step": 38846, "epoch": 468} {"train_loss": -19.015966415405273, "global_step": 38847, "epoch": 468} {"train_loss": -19.085205078125, "global_step": 38848, "epoch": 468} {"train_loss": -19.106184005737305, "global_step": 38849, "epoch": 468} {"train_loss": -19.269865036010742, "global_step": 38850, "epoch": 468} {"train_loss": -19.22785758972168, "global_step": 38851, "epoch": 468} {"train_loss": -19.269933700561523, "global_step": 38852, "epoch": 468} {"train_loss": -19.24238395690918, "global_step": 38853, "epoch": 468} {"train_loss": -19.61710548400879, "global_step": 38854, "epoch": 468} {"train_loss": -19.868741989135742, "global_step": 38855, "epoch": 468} {"train_loss": -19.077943801879883, "global_step": 38856, "epoch": 468} {"train_loss": -19.101552963256836, "global_step": 38857, "epoch": 468} {"train_loss": -19.375394821166992, "global_step": 38858, "epoch": 468} {"train_loss": -19.28290367126465, "global_step": 38859, "epoch": 468} {"train_loss": -18.792865753173828, "global_step": 38860, "epoch": 468} {"train_loss": -19.063199996948242, "global_step": 38861, "epoch": 468} {"train_loss": -19.045639038085938, "global_step": 38862, "epoch": 468} {"train_loss": -18.961606979370117, "global_step": 38863, "epoch": 468} {"train_loss": -19.328990936279297, "global_step": 38864, "epoch": 468} {"train_loss": -19.308618545532227, "global_step": 38865, "epoch": 468} {"train_loss": -19.300466537475586, "global_step": 38866, "epoch": 468} {"train_loss": -19.234209060668945, "global_step": 38867, "epoch": 468} {"train_loss": -19.058835983276367, "global_step": 38868, "epoch": 468} {"train_loss": -18.937597274780273, "global_step": 38869, "epoch": 468} {"train_loss": -19.358530044555664, "global_step": 38870, "epoch": 468} {"train_loss": -19.304555892944336, "global_step": 38871, "epoch": 468} {"train_loss": -19.205434799194336, "global_step": 38872, "epoch": 468} {"train_loss": -19.16346549987793, "global_step": 38873, "epoch": 468} {"train_loss": -19.305749893188477, "global_step": 38874, "epoch": 468} {"train_loss": -19.456974029541016, "global_step": 38875, "epoch": 468} {"train_loss": -19.329702377319336, "global_step": 38876, "epoch": 468} {"train_loss": -19.339170455932617, "global_step": 38877, "epoch": 468} {"train_loss": -19.25483512878418, "global_step": 38878, "epoch": 468} {"train_loss": -19.158781051635742, "global_step": 38879, "epoch": 468} {"train_loss": -19.412633895874023, "global_step": 38880, "epoch": 468} {"train_loss": -19.641035079956055, "global_step": 38881, "epoch": 468} {"train_loss": -19.56954574584961, "global_step": 38882, "epoch": 468} {"train_loss": -19.417972564697266, "global_step": 38883, "epoch": 468} {"train_loss": -19.311655044555664, "global_step": 38884, "epoch": 468} {"train_loss": -19.501867294311523, "global_step": 38885, "epoch": 468} {"train_loss": -19.66374397277832, "global_step": 38886, "epoch": 468} {"train_loss": -19.612409591674805, "global_step": 38887, "epoch": 468} {"train_loss": -19.4554500579834, "global_step": 38888, "epoch": 468} {"train_loss": -19.25230598449707, "global_step": 38889, "epoch": 468} {"train_loss": -19.547992706298828, "global_step": 38890, "epoch": 468} {"train_loss": -19.645689010620117, "global_step": 38891, "epoch": 468} {"train_loss": -19.533370971679688, "global_step": 38892, "epoch": 468} {"train_loss": -19.36286735534668, "global_step": 38893, "epoch": 468} {"train_loss": -18.90813636779785, "global_step": 38894, "epoch": 468} {"train_loss": -19.577598571777344, "global_step": 38895, "epoch": 468} {"train_loss": -19.18817710876465, "global_step": 38896, "epoch": 468} {"train_loss": -19.528518676757812, "global_step": 38897, "epoch": 468} {"train_loss": -19.824722290039062, "global_step": 38898, "epoch": 468} {"train_loss": -19.858230590820312, "global_step": 38899, "epoch": 468} {"train_loss": -19.02072525024414, "global_step": 38900, "epoch": 468} {"train_loss": -19.58890151977539, "global_step": 38901, "epoch": 468} {"train_loss": -19.708356857299805, "global_step": 38902, "epoch": 468} {"train_loss": -19.35849952697754, "global_step": 38903, "epoch": 468} {"train_loss": -19.32040023803711, "global_step": 38904, "epoch": 468} {"train_loss": -19.631147384643555, "global_step": 38905, "epoch": 468} {"train_loss": -19.509521484375, "global_step": 38906, "epoch": 468} {"train_loss": -19.371103286743164, "global_step": 38907, "epoch": 468} {"train_loss": -19.64783477783203, "global_step": 38908, "epoch": 468} {"train_loss": -19.50477409362793, "global_step": 38909, "epoch": 468} {"train_loss": -19.676101684570312, "global_step": 38910, "epoch": 468} {"train_loss": -19.286033630371094, "global_step": 38911, "epoch": 468} {"train_loss": -19.403783798217773, "global_step": 38912, "epoch": 468} {"train_loss": -19.441009521484375, "global_step": 38913, "epoch": 468} {"train_loss": -19.467206954956055, "global_step": 38914, "epoch": 468} {"train_loss": -19.343229293823242, "global_step": 38915, "epoch": 468} {"train_loss": -19.863595962524414, "global_step": 38916, "epoch": 468} {"train_loss": -19.592281341552734, "global_step": 38917, "epoch": 468} {"train_loss": -19.6099910736084, "global_step": 38918, "epoch": 468} {"train_loss": -19.46230125427246, "global_step": 38919, "epoch": 468} {"train_loss": -19.94544792175293, "global_step": 38920, "epoch": 468} {"train_loss": -19.660091400146484, "global_step": 38921, "epoch": 468} {"train_loss": -18.96538734436035, "global_step": 38922, "epoch": 468} {"train_loss": -19.423686981201172, "global_step": 38923, "epoch": 468} {"train_loss": -19.406187057495117, "global_step": 38924, "epoch": 468} {"train_loss": -19.600576400756836, "global_step": 38925, "epoch": 468} {"train_loss": -19.365616534129682, "global_step": 38926, "epoch": 468, "val_loss": 5901317.5} {"train_loss": -19.295185089111328, "global_step": 38927, "epoch": 469} {"train_loss": -19.793546676635742, "global_step": 38928, "epoch": 469} {"train_loss": -19.3764591217041, "global_step": 38929, "epoch": 469} {"train_loss": -19.485036849975586, "global_step": 38930, "epoch": 469} {"train_loss": -19.246339797973633, "global_step": 38931, "epoch": 469} {"train_loss": -19.474668502807617, "global_step": 38932, "epoch": 469} {"train_loss": -19.5301570892334, "global_step": 38933, "epoch": 469} {"train_loss": -19.567920684814453, "global_step": 38934, "epoch": 469} {"train_loss": -19.545644760131836, "global_step": 38935, "epoch": 469} {"train_loss": -19.30342674255371, "global_step": 38936, "epoch": 469} {"train_loss": -19.514570236206055, "global_step": 38937, "epoch": 469} {"train_loss": -19.184988021850586, "global_step": 38938, "epoch": 469} {"train_loss": -19.514265060424805, "global_step": 38939, "epoch": 469} {"train_loss": -19.064228057861328, "global_step": 38940, "epoch": 469} {"train_loss": -19.354068756103516, "global_step": 38941, "epoch": 469} {"train_loss": -19.228973388671875, "global_step": 38942, "epoch": 469} {"train_loss": -19.48042869567871, "global_step": 38943, "epoch": 469} {"train_loss": -19.701583862304688, "global_step": 38944, "epoch": 469} {"train_loss": -19.093948364257812, "global_step": 38945, "epoch": 469} {"train_loss": -19.736562728881836, "global_step": 38946, "epoch": 469} {"train_loss": -19.149686813354492, "global_step": 38947, "epoch": 469} {"train_loss": -19.51521110534668, "global_step": 38948, "epoch": 469} {"train_loss": -19.204458236694336, "global_step": 38949, "epoch": 469} {"train_loss": -19.662694931030273, "global_step": 38950, "epoch": 469} {"train_loss": -19.710208892822266, "global_step": 38951, "epoch": 469} {"train_loss": -19.368457794189453, "global_step": 38952, "epoch": 469} {"train_loss": -19.493518829345703, "global_step": 38953, "epoch": 469} {"train_loss": -19.1087646484375, "global_step": 38954, "epoch": 469} {"train_loss": -19.45631980895996, "global_step": 38955, "epoch": 469} {"train_loss": -19.152708053588867, "global_step": 38956, "epoch": 469} {"train_loss": -19.504446029663086, "global_step": 38957, "epoch": 469} {"train_loss": -19.275861740112305, "global_step": 38958, "epoch": 469} {"train_loss": -19.464384078979492, "global_step": 38959, "epoch": 469} {"train_loss": -19.005863189697266, "global_step": 38960, "epoch": 469} {"train_loss": -18.977371215820312, "global_step": 38961, "epoch": 469} {"train_loss": -19.1656494140625, "global_step": 38962, "epoch": 469} {"train_loss": -19.599584579467773, "global_step": 38963, "epoch": 469} {"train_loss": -19.723112106323242, "global_step": 38964, "epoch": 469} {"train_loss": -19.39852523803711, "global_step": 38965, "epoch": 469} {"train_loss": -19.484472274780273, "global_step": 38966, "epoch": 469} {"train_loss": -19.084924697875977, "global_step": 38967, "epoch": 469} {"train_loss": -19.645374298095703, "global_step": 38968, "epoch": 469} {"train_loss": -19.22633171081543, "global_step": 38969, "epoch": 469} {"train_loss": -19.456998825073242, "global_step": 38970, "epoch": 469} {"train_loss": -19.488174438476562, "global_step": 38971, "epoch": 469} {"train_loss": -19.275409698486328, "global_step": 38972, "epoch": 469} {"train_loss": -19.297550201416016, "global_step": 38973, "epoch": 469} {"train_loss": -19.7116756439209, "global_step": 38974, "epoch": 469} {"train_loss": -19.234588623046875, "global_step": 38975, "epoch": 469} {"train_loss": -19.565031051635742, "global_step": 38976, "epoch": 469} {"train_loss": -19.728666305541992, "global_step": 38977, "epoch": 469} {"train_loss": -18.937368392944336, "global_step": 38978, "epoch": 469} {"train_loss": -19.32428550720215, "global_step": 38979, "epoch": 469} {"train_loss": -19.430845260620117, "global_step": 38980, "epoch": 469} {"train_loss": -19.586156845092773, "global_step": 38981, "epoch": 469} {"train_loss": -19.36054801940918, "global_step": 38982, "epoch": 469} {"train_loss": -19.643579483032227, "global_step": 38983, "epoch": 469} {"train_loss": -19.31381607055664, "global_step": 38984, "epoch": 469} {"train_loss": -19.690658569335938, "global_step": 38985, "epoch": 469} {"train_loss": -19.40225601196289, "global_step": 38986, "epoch": 469} {"train_loss": -19.476856231689453, "global_step": 38987, "epoch": 469} {"train_loss": -19.306068420410156, "global_step": 38988, "epoch": 469} {"train_loss": -19.408130645751953, "global_step": 38989, "epoch": 469} {"train_loss": -19.291461944580078, "global_step": 38990, "epoch": 469} {"train_loss": -19.139822006225586, "global_step": 38991, "epoch": 469} {"train_loss": -19.68320083618164, "global_step": 38992, "epoch": 469} {"train_loss": -19.270605087280273, "global_step": 38993, "epoch": 469} {"train_loss": -19.294567108154297, "global_step": 38994, "epoch": 469} {"train_loss": -18.953704833984375, "global_step": 38995, "epoch": 469} {"train_loss": -19.453489303588867, "global_step": 38996, "epoch": 469} {"train_loss": -19.219999313354492, "global_step": 38997, "epoch": 469} {"train_loss": -19.227323532104492, "global_step": 38998, "epoch": 469} {"train_loss": -19.337804794311523, "global_step": 38999, "epoch": 469} {"train_loss": -19.22439193725586, "global_step": 39000, "epoch": 469} {"train_loss": -19.153167724609375, "global_step": 39001, "epoch": 469} {"train_loss": -19.252897262573242, "global_step": 39002, "epoch": 469} {"train_loss": -19.7341251373291, "global_step": 39003, "epoch": 469} {"train_loss": -19.277006149291992, "global_step": 39004, "epoch": 469} {"train_loss": -19.3011474609375, "global_step": 39005, "epoch": 469} {"train_loss": -19.32636833190918, "global_step": 39006, "epoch": 469} {"train_loss": -19.238128662109375, "global_step": 39007, "epoch": 469} {"train_loss": -19.335556030273438, "global_step": 39008, "epoch": 469} {"train_loss": -19.37010264109416, "global_step": 39009, "epoch": 469, "val_loss": 6049823.0} {"train_loss": -18.86981773376465, "global_step": 39010, "epoch": 470} {"train_loss": -19.344425201416016, "global_step": 39011, "epoch": 470} {"train_loss": -19.48042106628418, "global_step": 39012, "epoch": 470} {"train_loss": -19.242494583129883, "global_step": 39013, "epoch": 470} {"train_loss": -18.980924606323242, "global_step": 39014, "epoch": 470} {"train_loss": -19.07986068725586, "global_step": 39015, "epoch": 470} {"train_loss": -19.24403190612793, "global_step": 39016, "epoch": 470} {"train_loss": -19.303775787353516, "global_step": 39017, "epoch": 470} {"train_loss": -19.09901237487793, "global_step": 39018, "epoch": 470} {"train_loss": -18.958255767822266, "global_step": 39019, "epoch": 470} {"train_loss": -19.870824813842773, "global_step": 39020, "epoch": 470} {"train_loss": -19.1442813873291, "global_step": 39021, "epoch": 470} {"train_loss": -19.018482208251953, "global_step": 39022, "epoch": 470} {"train_loss": -19.34014129638672, "global_step": 39023, "epoch": 470} {"train_loss": -19.04886245727539, "global_step": 39024, "epoch": 470} {"train_loss": -19.275772094726562, "global_step": 39025, "epoch": 470} {"train_loss": -19.623449325561523, "global_step": 39026, "epoch": 470} {"train_loss": -18.886829376220703, "global_step": 39027, "epoch": 470} {"train_loss": -19.219449996948242, "global_step": 39028, "epoch": 470} {"train_loss": -19.1303768157959, "global_step": 39029, "epoch": 470} {"train_loss": -19.44573402404785, "global_step": 39030, "epoch": 470} {"train_loss": -19.501121520996094, "global_step": 39031, "epoch": 470} {"train_loss": -19.287540435791016, "global_step": 39032, "epoch": 470} {"train_loss": -19.211618423461914, "global_step": 39033, "epoch": 470} {"train_loss": -19.740360260009766, "global_step": 39034, "epoch": 470} {"train_loss": -19.52402687072754, "global_step": 39035, "epoch": 470} {"train_loss": -19.27558708190918, "global_step": 39036, "epoch": 470} {"train_loss": -19.76508903503418, "global_step": 39037, "epoch": 470} {"train_loss": -19.208349227905273, "global_step": 39038, "epoch": 470} {"train_loss": -19.32901954650879, "global_step": 39039, "epoch": 470} {"train_loss": -19.403669357299805, "global_step": 39040, "epoch": 470} {"train_loss": -19.28970718383789, "global_step": 39041, "epoch": 470} {"train_loss": -19.016464233398438, "global_step": 39042, "epoch": 470} {"train_loss": -19.643728256225586, "global_step": 39043, "epoch": 470} {"train_loss": -19.185672760009766, "global_step": 39044, "epoch": 470} {"train_loss": -19.28272247314453, "global_step": 39045, "epoch": 470} {"train_loss": -19.77872657775879, "global_step": 39046, "epoch": 470} {"train_loss": -19.588102340698242, "global_step": 39047, "epoch": 470} {"train_loss": -19.36981201171875, "global_step": 39048, "epoch": 470} {"train_loss": -19.336925506591797, "global_step": 39049, "epoch": 470} {"train_loss": -19.47303009033203, "global_step": 39050, "epoch": 470} {"train_loss": -19.252439498901367, "global_step": 39051, "epoch": 470} {"train_loss": -19.337100982666016, "global_step": 39052, "epoch": 470} {"train_loss": -19.349523544311523, "global_step": 39053, "epoch": 470} {"train_loss": -19.6735782623291, "global_step": 39054, "epoch": 470} {"train_loss": -18.995397567749023, "global_step": 39055, "epoch": 470} {"train_loss": -19.26903533935547, "global_step": 39056, "epoch": 470} {"train_loss": -19.32973289489746, "global_step": 39057, "epoch": 470} {"train_loss": -19.396987915039062, "global_step": 39058, "epoch": 470} {"train_loss": -19.62518310546875, "global_step": 39059, "epoch": 470} {"train_loss": -18.92425537109375, "global_step": 39060, "epoch": 470} {"train_loss": -19.495302200317383, "global_step": 39061, "epoch": 470} {"train_loss": -19.317279815673828, "global_step": 39062, "epoch": 470} {"train_loss": -19.530681610107422, "global_step": 39063, "epoch": 470} {"train_loss": -19.56038475036621, "global_step": 39064, "epoch": 470} {"train_loss": -19.524198532104492, "global_step": 39065, "epoch": 470} {"train_loss": -19.15771484375, "global_step": 39066, "epoch": 470} {"train_loss": -19.335742950439453, "global_step": 39067, "epoch": 470} {"train_loss": -19.406644821166992, "global_step": 39068, "epoch": 470} {"train_loss": -19.34562110900879, "global_step": 39069, "epoch": 470} {"train_loss": -19.755468368530273, "global_step": 39070, "epoch": 470} {"train_loss": -19.664337158203125, "global_step": 39071, "epoch": 470} {"train_loss": -19.33970069885254, "global_step": 39072, "epoch": 470} {"train_loss": -19.54716682434082, "global_step": 39073, "epoch": 470} {"train_loss": -19.816038131713867, "global_step": 39074, "epoch": 470} {"train_loss": -19.549686431884766, "global_step": 39075, "epoch": 470} {"train_loss": -19.717304229736328, "global_step": 39076, "epoch": 470} {"train_loss": -19.225345611572266, "global_step": 39077, "epoch": 470} {"train_loss": -19.06825065612793, "global_step": 39078, "epoch": 470} {"train_loss": -19.41141700744629, "global_step": 39079, "epoch": 470} {"train_loss": -19.62705421447754, "global_step": 39080, "epoch": 470} {"train_loss": -19.88501739501953, "global_step": 39081, "epoch": 470} {"train_loss": -19.490610122680664, "global_step": 39082, "epoch": 470} {"train_loss": -19.313217163085938, "global_step": 39083, "epoch": 470} {"train_loss": -19.735340118408203, "global_step": 39084, "epoch": 470} {"train_loss": -19.606876373291016, "global_step": 39085, "epoch": 470} {"train_loss": -19.231557846069336, "global_step": 39086, "epoch": 470} {"train_loss": -19.360145568847656, "global_step": 39087, "epoch": 470} {"train_loss": -19.534717559814453, "global_step": 39088, "epoch": 470} {"train_loss": -19.52495574951172, "global_step": 39089, "epoch": 470} {"train_loss": -19.62879753112793, "global_step": 39090, "epoch": 470} {"train_loss": -19.175962448120117, "global_step": 39091, "epoch": 470} {"train_loss": -19.381915517600184, "global_step": 39092, "epoch": 470, "val_loss": 5921512.5} {"train_loss": -19.268707275390625, "global_step": 39093, "epoch": 471} {"train_loss": -18.917999267578125, "global_step": 39094, "epoch": 471} {"train_loss": -19.52785301208496, "global_step": 39095, "epoch": 471} {"train_loss": -19.287628173828125, "global_step": 39096, "epoch": 471} {"train_loss": -19.469663619995117, "global_step": 39097, "epoch": 471} {"train_loss": -18.9137020111084, "global_step": 39098, "epoch": 471} {"train_loss": -19.621450424194336, "global_step": 39099, "epoch": 471} {"train_loss": -19.312725067138672, "global_step": 39100, "epoch": 471} {"train_loss": -19.45494270324707, "global_step": 39101, "epoch": 471} {"train_loss": -19.468090057373047, "global_step": 39102, "epoch": 471} {"train_loss": -19.306161880493164, "global_step": 39103, "epoch": 471} {"train_loss": -19.48442840576172, "global_step": 39104, "epoch": 471} {"train_loss": -19.195066452026367, "global_step": 39105, "epoch": 471} {"train_loss": -19.363569259643555, "global_step": 39106, "epoch": 471} {"train_loss": -19.398212432861328, "global_step": 39107, "epoch": 471} {"train_loss": -19.56545066833496, "global_step": 39108, "epoch": 471} {"train_loss": -19.41650390625, "global_step": 39109, "epoch": 471} {"train_loss": -19.4080753326416, "global_step": 39110, "epoch": 471} {"train_loss": -19.337392807006836, "global_step": 39111, "epoch": 471} {"train_loss": -19.217300415039062, "global_step": 39112, "epoch": 471} {"train_loss": -19.639135360717773, "global_step": 39113, "epoch": 471} {"train_loss": -19.286020278930664, "global_step": 39114, "epoch": 471} {"train_loss": -19.715574264526367, "global_step": 39115, "epoch": 471} {"train_loss": -19.750059127807617, "global_step": 39116, "epoch": 471} {"train_loss": -19.238374710083008, "global_step": 39117, "epoch": 471} {"train_loss": -19.215848922729492, "global_step": 39118, "epoch": 471} {"train_loss": -19.30863380432129, "global_step": 39119, "epoch": 471} {"train_loss": -19.260272979736328, "global_step": 39120, "epoch": 471} {"train_loss": -19.293533325195312, "global_step": 39121, "epoch": 471} {"train_loss": -19.1413631439209, "global_step": 39122, "epoch": 471} {"train_loss": -19.1793155670166, "global_step": 39123, "epoch": 471} {"train_loss": -19.408920288085938, "global_step": 39124, "epoch": 471} {"train_loss": -19.4212646484375, "global_step": 39125, "epoch": 471} {"train_loss": -19.18949317932129, "global_step": 39126, "epoch": 471} {"train_loss": -19.46180534362793, "global_step": 39127, "epoch": 471} {"train_loss": -19.265838623046875, "global_step": 39128, "epoch": 471} {"train_loss": -19.48386001586914, "global_step": 39129, "epoch": 471} {"train_loss": -19.4846248626709, "global_step": 39130, "epoch": 471} {"train_loss": -19.46184730529785, "global_step": 39131, "epoch": 471} {"train_loss": -19.455739974975586, "global_step": 39132, "epoch": 471} {"train_loss": -19.415372848510742, "global_step": 39133, "epoch": 471} {"train_loss": -19.38205337524414, "global_step": 39134, "epoch": 471} {"train_loss": -19.53189468383789, "global_step": 39135, "epoch": 471} {"train_loss": -18.89699935913086, "global_step": 39136, "epoch": 471} {"train_loss": -19.510467529296875, "global_step": 39137, "epoch": 471} {"train_loss": -19.459333419799805, "global_step": 39138, "epoch": 471} {"train_loss": -19.56946563720703, "global_step": 39139, "epoch": 471} {"train_loss": -19.474937438964844, "global_step": 39140, "epoch": 471} {"train_loss": -19.293487548828125, "global_step": 39141, "epoch": 471} {"train_loss": -19.217370986938477, "global_step": 39142, "epoch": 471} {"train_loss": -19.612388610839844, "global_step": 39143, "epoch": 471} {"train_loss": -19.761667251586914, "global_step": 39144, "epoch": 471} {"train_loss": -19.219327926635742, "global_step": 39145, "epoch": 471} {"train_loss": -19.36374282836914, "global_step": 39146, "epoch": 471} {"train_loss": -19.52086639404297, "global_step": 39147, "epoch": 471} {"train_loss": -19.373397827148438, "global_step": 39148, "epoch": 471} {"train_loss": -19.650693893432617, "global_step": 39149, "epoch": 471} {"train_loss": -19.29043960571289, "global_step": 39150, "epoch": 471} {"train_loss": -19.461999893188477, "global_step": 39151, "epoch": 471} {"train_loss": -19.442129135131836, "global_step": 39152, "epoch": 471} {"train_loss": -19.38511085510254, "global_step": 39153, "epoch": 471} {"train_loss": -19.55437660217285, "global_step": 39154, "epoch": 471} {"train_loss": -19.6650447845459, "global_step": 39155, "epoch": 471} {"train_loss": -19.57355308532715, "global_step": 39156, "epoch": 471} {"train_loss": -19.379016876220703, "global_step": 39157, "epoch": 471} {"train_loss": -19.5377197265625, "global_step": 39158, "epoch": 471} {"train_loss": -19.42805290222168, "global_step": 39159, "epoch": 471} {"train_loss": -19.293397903442383, "global_step": 39160, "epoch": 471} {"train_loss": -19.31403160095215, "global_step": 39161, "epoch": 471} {"train_loss": -19.015029907226562, "global_step": 39162, "epoch": 471} {"train_loss": -19.424707412719727, "global_step": 39163, "epoch": 471} {"train_loss": -19.49506187438965, "global_step": 39164, "epoch": 471} {"train_loss": -19.59828758239746, "global_step": 39165, "epoch": 471} {"train_loss": -19.484893798828125, "global_step": 39166, "epoch": 471} {"train_loss": -19.03956413269043, "global_step": 39167, "epoch": 471} {"train_loss": -19.554624557495117, "global_step": 39168, "epoch": 471} {"train_loss": -19.46473503112793, "global_step": 39169, "epoch": 471} {"train_loss": -19.638275146484375, "global_step": 39170, "epoch": 471} {"train_loss": -19.508543014526367, "global_step": 39171, "epoch": 471} {"train_loss": -19.386198043823242, "global_step": 39172, "epoch": 471} {"train_loss": -19.724279403686523, "global_step": 39173, "epoch": 471} {"train_loss": -19.62116050720215, "global_step": 39174, "epoch": 471} {"train_loss": -19.409963837589125, "global_step": 39175, "epoch": 471, "val_loss": 6081453.5} {"train_loss": -19.054401397705078, "global_step": 39176, "epoch": 472} {"train_loss": -18.679039001464844, "global_step": 39177, "epoch": 472} {"train_loss": -18.938167572021484, "global_step": 39178, "epoch": 472} {"train_loss": -19.260929107666016, "global_step": 39179, "epoch": 472} {"train_loss": -19.49714469909668, "global_step": 39180, "epoch": 472} {"train_loss": -18.931060791015625, "global_step": 39181, "epoch": 472} {"train_loss": -19.38490104675293, "global_step": 39182, "epoch": 472} {"train_loss": -19.66916847229004, "global_step": 39183, "epoch": 472} {"train_loss": -19.069726943969727, "global_step": 39184, "epoch": 472} {"train_loss": -19.19895362854004, "global_step": 39185, "epoch": 472} {"train_loss": -19.118505477905273, "global_step": 39186, "epoch": 472} {"train_loss": -19.31815528869629, "global_step": 39187, "epoch": 472} {"train_loss": -19.436786651611328, "global_step": 39188, "epoch": 472} {"train_loss": -19.022974014282227, "global_step": 39189, "epoch": 472} {"train_loss": -19.29922866821289, "global_step": 39190, "epoch": 472} {"train_loss": -19.51789665222168, "global_step": 39191, "epoch": 472} {"train_loss": -19.577383041381836, "global_step": 39192, "epoch": 472} {"train_loss": -19.323265075683594, "global_step": 39193, "epoch": 472} {"train_loss": -19.54684829711914, "global_step": 39194, "epoch": 472} {"train_loss": -19.18227195739746, "global_step": 39195, "epoch": 472} {"train_loss": -18.918338775634766, "global_step": 39196, "epoch": 472} {"train_loss": -19.454471588134766, "global_step": 39197, "epoch": 472} {"train_loss": -19.4771785736084, "global_step": 39198, "epoch": 472} {"train_loss": -19.59052085876465, "global_step": 39199, "epoch": 472} {"train_loss": -19.414306640625, "global_step": 39200, "epoch": 472} {"train_loss": -19.392675399780273, "global_step": 39201, "epoch": 472} {"train_loss": -19.26064109802246, "global_step": 39202, "epoch": 472} {"train_loss": -19.3970890045166, "global_step": 39203, "epoch": 472} {"train_loss": -19.1241455078125, "global_step": 39204, "epoch": 472} {"train_loss": -19.635831832885742, "global_step": 39205, "epoch": 472} {"train_loss": -19.778379440307617, "global_step": 39206, "epoch": 472} {"train_loss": -19.205514907836914, "global_step": 39207, "epoch": 472} {"train_loss": -19.282217025756836, "global_step": 39208, "epoch": 472} {"train_loss": -19.534069061279297, "global_step": 39209, "epoch": 472} {"train_loss": -19.95454978942871, "global_step": 39210, "epoch": 472} {"train_loss": -19.01434898376465, "global_step": 39211, "epoch": 472} {"train_loss": -19.49188232421875, "global_step": 39212, "epoch": 472} {"train_loss": -19.363073348999023, "global_step": 39213, "epoch": 472} {"train_loss": -19.558792114257812, "global_step": 39214, "epoch": 472} {"train_loss": -19.474584579467773, "global_step": 39215, "epoch": 472} {"train_loss": -19.40764045715332, "global_step": 39216, "epoch": 472} {"train_loss": -19.190778732299805, "global_step": 39217, "epoch": 472} {"train_loss": -19.728775024414062, "global_step": 39218, "epoch": 472} {"train_loss": -19.4954891204834, "global_step": 39219, "epoch": 472} {"train_loss": -19.232898712158203, "global_step": 39220, "epoch": 472} {"train_loss": -19.056625366210938, "global_step": 39221, "epoch": 472} {"train_loss": -19.291845321655273, "global_step": 39222, "epoch": 472} {"train_loss": -19.3885440826416, "global_step": 39223, "epoch": 472} {"train_loss": -19.14863395690918, "global_step": 39224, "epoch": 472} {"train_loss": -19.57850456237793, "global_step": 39225, "epoch": 472} {"train_loss": -19.341352462768555, "global_step": 39226, "epoch": 472} {"train_loss": -19.532312393188477, "global_step": 39227, "epoch": 472} {"train_loss": -19.321744918823242, "global_step": 39228, "epoch": 472} {"train_loss": -18.99228858947754, "global_step": 39229, "epoch": 472} {"train_loss": -19.297147750854492, "global_step": 39230, "epoch": 472} {"train_loss": -18.92835807800293, "global_step": 39231, "epoch": 472} {"train_loss": -19.240766525268555, "global_step": 39232, "epoch": 472} {"train_loss": -18.89703941345215, "global_step": 39233, "epoch": 472} {"train_loss": -19.217437744140625, "global_step": 39234, "epoch": 472} {"train_loss": -19.64192771911621, "global_step": 39235, "epoch": 472} {"train_loss": -19.32950210571289, "global_step": 39236, "epoch": 472} {"train_loss": -19.210479736328125, "global_step": 39237, "epoch": 472} {"train_loss": -19.26917839050293, "global_step": 39238, "epoch": 472} {"train_loss": -19.28411865234375, "global_step": 39239, "epoch": 472} {"train_loss": -19.327316284179688, "global_step": 39240, "epoch": 472} {"train_loss": -19.823678970336914, "global_step": 39241, "epoch": 472} {"train_loss": -19.428983688354492, "global_step": 39242, "epoch": 472} {"train_loss": -19.676965713500977, "global_step": 39243, "epoch": 472} {"train_loss": -19.082530975341797, "global_step": 39244, "epoch": 472} {"train_loss": -19.232397079467773, "global_step": 39245, "epoch": 472} {"train_loss": -19.497343063354492, "global_step": 39246, "epoch": 472} {"train_loss": -19.509723663330078, "global_step": 39247, "epoch": 472} {"train_loss": -19.208707809448242, "global_step": 39248, "epoch": 472} {"train_loss": -19.376235961914062, "global_step": 39249, "epoch": 472} {"train_loss": -19.596668243408203, "global_step": 39250, "epoch": 472} {"train_loss": -19.341806411743164, "global_step": 39251, "epoch": 472} {"train_loss": -19.38225746154785, "global_step": 39252, "epoch": 472} {"train_loss": -19.677724838256836, "global_step": 39253, "epoch": 472} {"train_loss": -19.242788314819336, "global_step": 39254, "epoch": 472} {"train_loss": -19.358177185058594, "global_step": 39255, "epoch": 472} {"train_loss": -19.326656341552734, "global_step": 39256, "epoch": 472} {"train_loss": -19.311473846435547, "global_step": 39257, "epoch": 472} {"train_loss": -19.36840436544763, "global_step": 39258, "epoch": 472, "val_loss": 6206367.5} {"train_loss": -19.18950843811035, "global_step": 39259, "epoch": 473} {"train_loss": -19.265661239624023, "global_step": 39260, "epoch": 473} {"train_loss": -19.10611343383789, "global_step": 39261, "epoch": 473} {"train_loss": -19.00969886779785, "global_step": 39262, "epoch": 473} {"train_loss": -19.24944496154785, "global_step": 39263, "epoch": 473} {"train_loss": -19.220844268798828, "global_step": 39264, "epoch": 473} {"train_loss": -19.066749572753906, "global_step": 39265, "epoch": 473} {"train_loss": -19.326200485229492, "global_step": 39266, "epoch": 473} {"train_loss": -19.18401527404785, "global_step": 39267, "epoch": 473} {"train_loss": -19.279504776000977, "global_step": 39268, "epoch": 473} {"train_loss": -19.191869735717773, "global_step": 39269, "epoch": 473} {"train_loss": -19.195646286010742, "global_step": 39270, "epoch": 473} {"train_loss": -19.226667404174805, "global_step": 39271, "epoch": 473} {"train_loss": -19.39227867126465, "global_step": 39272, "epoch": 473} {"train_loss": -19.388534545898438, "global_step": 39273, "epoch": 473} {"train_loss": -19.557037353515625, "global_step": 39274, "epoch": 473} {"train_loss": -19.650774002075195, "global_step": 39275, "epoch": 473} {"train_loss": -19.526718139648438, "global_step": 39276, "epoch": 473} {"train_loss": -19.37351417541504, "global_step": 39277, "epoch": 473} {"train_loss": -19.234628677368164, "global_step": 39278, "epoch": 473} {"train_loss": -19.51694107055664, "global_step": 39279, "epoch": 473} {"train_loss": -19.552257537841797, "global_step": 39280, "epoch": 473} {"train_loss": -19.34004783630371, "global_step": 39281, "epoch": 473} {"train_loss": -19.665504455566406, "global_step": 39282, "epoch": 473} {"train_loss": -19.289392471313477, "global_step": 39283, "epoch": 473} {"train_loss": -19.672378540039062, "global_step": 39284, "epoch": 473} {"train_loss": -19.600719451904297, "global_step": 39285, "epoch": 473} {"train_loss": -19.37584114074707, "global_step": 39286, "epoch": 473} {"train_loss": -19.736928939819336, "global_step": 39287, "epoch": 473} {"train_loss": -19.431583404541016, "global_step": 39288, "epoch": 473} {"train_loss": -19.112672805786133, "global_step": 39289, "epoch": 473} {"train_loss": -19.428678512573242, "global_step": 39290, "epoch": 473} {"train_loss": -19.85310173034668, "global_step": 39291, "epoch": 473} {"train_loss": -19.401426315307617, "global_step": 39292, "epoch": 473} {"train_loss": -19.38298797607422, "global_step": 39293, "epoch": 473} {"train_loss": -19.489551544189453, "global_step": 39294, "epoch": 473} {"train_loss": -19.79046058654785, "global_step": 39295, "epoch": 473} {"train_loss": -19.135578155517578, "global_step": 39296, "epoch": 473} {"train_loss": -19.551395416259766, "global_step": 39297, "epoch": 473} {"train_loss": -19.314544677734375, "global_step": 39298, "epoch": 473} {"train_loss": -19.547088623046875, "global_step": 39299, "epoch": 473} {"train_loss": -19.16623306274414, "global_step": 39300, "epoch": 473} {"train_loss": -19.280405044555664, "global_step": 39301, "epoch": 473} {"train_loss": -19.29411506652832, "global_step": 39302, "epoch": 473} {"train_loss": -19.17805290222168, "global_step": 39303, "epoch": 473} {"train_loss": -19.503488540649414, "global_step": 39304, "epoch": 473} {"train_loss": -19.42372703552246, "global_step": 39305, "epoch": 473} {"train_loss": -19.2226619720459, "global_step": 39306, "epoch": 473} {"train_loss": -19.498929977416992, "global_step": 39307, "epoch": 473} {"train_loss": -19.4262638092041, "global_step": 39308, "epoch": 473} {"train_loss": -19.11299705505371, "global_step": 39309, "epoch": 473} {"train_loss": -19.74799919128418, "global_step": 39310, "epoch": 473} {"train_loss": -19.491851806640625, "global_step": 39311, "epoch": 473} {"train_loss": -19.53081703186035, "global_step": 39312, "epoch": 473} {"train_loss": -19.631147384643555, "global_step": 39313, "epoch": 473} {"train_loss": -19.588947296142578, "global_step": 39314, "epoch": 473} {"train_loss": -19.3572940826416, "global_step": 39315, "epoch": 473} {"train_loss": -19.38360023498535, "global_step": 39316, "epoch": 473} {"train_loss": -19.211673736572266, "global_step": 39317, "epoch": 473} {"train_loss": -19.75657081604004, "global_step": 39318, "epoch": 473} {"train_loss": -19.495521545410156, "global_step": 39319, "epoch": 473} {"train_loss": -19.33424186706543, "global_step": 39320, "epoch": 473} {"train_loss": -19.59065055847168, "global_step": 39321, "epoch": 473} {"train_loss": -19.1208438873291, "global_step": 39322, "epoch": 473} {"train_loss": -19.302310943603516, "global_step": 39323, "epoch": 473} {"train_loss": -19.235183715820312, "global_step": 39324, "epoch": 473} {"train_loss": -19.32069206237793, "global_step": 39325, "epoch": 473} {"train_loss": -19.338666915893555, "global_step": 39326, "epoch": 473} {"train_loss": -19.399045944213867, "global_step": 39327, "epoch": 473} {"train_loss": -19.366689682006836, "global_step": 39328, "epoch": 473} {"train_loss": -19.368392944335938, "global_step": 39329, "epoch": 473} {"train_loss": -19.51712989807129, "global_step": 39330, "epoch": 473} {"train_loss": -19.39386558532715, "global_step": 39331, "epoch": 473} {"train_loss": -19.556493759155273, "global_step": 39332, "epoch": 473} {"train_loss": -19.377094268798828, "global_step": 39333, "epoch": 473} {"train_loss": -19.288854598999023, "global_step": 39334, "epoch": 473} {"train_loss": -19.376876831054688, "global_step": 39335, "epoch": 473} {"train_loss": -19.597427368164062, "global_step": 39336, "epoch": 473} {"train_loss": -19.316204071044922, "global_step": 39337, "epoch": 473} {"train_loss": -19.261377334594727, "global_step": 39338, "epoch": 473} {"train_loss": -19.493040084838867, "global_step": 39339, "epoch": 473} {"train_loss": -19.14053726196289, "global_step": 39340, "epoch": 473} {"train_loss": -19.396576318396143, "global_step": 39341, "epoch": 473, "val_loss": 5981095.0} {"train_loss": -19.063207626342773, "global_step": 39342, "epoch": 474} {"train_loss": -19.108295440673828, "global_step": 39343, "epoch": 474} {"train_loss": -19.422718048095703, "global_step": 39344, "epoch": 474} {"train_loss": -19.212575912475586, "global_step": 39345, "epoch": 474} {"train_loss": -19.43024444580078, "global_step": 39346, "epoch": 474} {"train_loss": -19.32330322265625, "global_step": 39347, "epoch": 474} {"train_loss": -19.202177047729492, "global_step": 39348, "epoch": 474} {"train_loss": -19.107868194580078, "global_step": 39349, "epoch": 474} {"train_loss": -19.019866943359375, "global_step": 39350, "epoch": 474} {"train_loss": -19.340696334838867, "global_step": 39351, "epoch": 474} {"train_loss": -19.3857364654541, "global_step": 39352, "epoch": 474} {"train_loss": -19.254568099975586, "global_step": 39353, "epoch": 474} {"train_loss": -19.725271224975586, "global_step": 39354, "epoch": 474} {"train_loss": -19.35413932800293, "global_step": 39355, "epoch": 474} {"train_loss": -19.463247299194336, "global_step": 39356, "epoch": 474} {"train_loss": -19.49957847595215, "global_step": 39357, "epoch": 474} {"train_loss": -19.43364715576172, "global_step": 39358, "epoch": 474} {"train_loss": -19.08077049255371, "global_step": 39359, "epoch": 474} {"train_loss": -19.344165802001953, "global_step": 39360, "epoch": 474} {"train_loss": -19.367136001586914, "global_step": 39361, "epoch": 474} {"train_loss": -19.486164093017578, "global_step": 39362, "epoch": 474} {"train_loss": -19.051090240478516, "global_step": 39363, "epoch": 474} {"train_loss": -19.51108169555664, "global_step": 39364, "epoch": 474} {"train_loss": -19.386533737182617, "global_step": 39365, "epoch": 474} {"train_loss": -19.696271896362305, "global_step": 39366, "epoch": 474} {"train_loss": -19.289339065551758, "global_step": 39367, "epoch": 474} {"train_loss": -19.01031494140625, "global_step": 39368, "epoch": 474} {"train_loss": -19.283620834350586, "global_step": 39369, "epoch": 474} {"train_loss": -19.254154205322266, "global_step": 39370, "epoch": 474} {"train_loss": -18.85854148864746, "global_step": 39371, "epoch": 474} {"train_loss": -19.546045303344727, "global_step": 39372, "epoch": 474} {"train_loss": -19.418045043945312, "global_step": 39373, "epoch": 474} {"train_loss": -19.353403091430664, "global_step": 39374, "epoch": 474} {"train_loss": -19.674089431762695, "global_step": 39375, "epoch": 474} {"train_loss": -19.269319534301758, "global_step": 39376, "epoch": 474} {"train_loss": -19.249841690063477, "global_step": 39377, "epoch": 474} {"train_loss": -19.32452392578125, "global_step": 39378, "epoch": 474} {"train_loss": -19.84207534790039, "global_step": 39379, "epoch": 474} {"train_loss": -19.40557289123535, "global_step": 39380, "epoch": 474} {"train_loss": -19.16327476501465, "global_step": 39381, "epoch": 474} {"train_loss": -19.32879638671875, "global_step": 39382, "epoch": 474} {"train_loss": -19.65668487548828, "global_step": 39383, "epoch": 474} {"train_loss": -19.469009399414062, "global_step": 39384, "epoch": 474} {"train_loss": -19.424819946289062, "global_step": 39385, "epoch": 474} {"train_loss": -19.41701316833496, "global_step": 39386, "epoch": 474} {"train_loss": -19.327184677124023, "global_step": 39387, "epoch": 474} {"train_loss": -19.445783615112305, "global_step": 39388, "epoch": 474} {"train_loss": -19.447324752807617, "global_step": 39389, "epoch": 474} {"train_loss": -19.637298583984375, "global_step": 39390, "epoch": 474} {"train_loss": -19.151554107666016, "global_step": 39391, "epoch": 474} {"train_loss": -19.593734741210938, "global_step": 39392, "epoch": 474} {"train_loss": -19.706056594848633, "global_step": 39393, "epoch": 474} {"train_loss": -19.126291275024414, "global_step": 39394, "epoch": 474} {"train_loss": -19.448144912719727, "global_step": 39395, "epoch": 474} {"train_loss": -19.54766273498535, "global_step": 39396, "epoch": 474} {"train_loss": -19.285287857055664, "global_step": 39397, "epoch": 474} {"train_loss": -19.31979751586914, "global_step": 39398, "epoch": 474} {"train_loss": -19.53730583190918, "global_step": 39399, "epoch": 474} {"train_loss": -19.427833557128906, "global_step": 39400, "epoch": 474} {"train_loss": -19.43523597717285, "global_step": 39401, "epoch": 474} {"train_loss": -19.10052490234375, "global_step": 39402, "epoch": 474} {"train_loss": -19.463743209838867, "global_step": 39403, "epoch": 474} {"train_loss": -19.17384910583496, "global_step": 39404, "epoch": 474} {"train_loss": -19.40976333618164, "global_step": 39405, "epoch": 474} {"train_loss": -19.597803115844727, "global_step": 39406, "epoch": 474} {"train_loss": -19.561811447143555, "global_step": 39407, "epoch": 474} {"train_loss": -19.438316345214844, "global_step": 39408, "epoch": 474} {"train_loss": -19.376178741455078, "global_step": 39409, "epoch": 474} {"train_loss": -19.587963104248047, "global_step": 39410, "epoch": 474} {"train_loss": -19.657033920288086, "global_step": 39411, "epoch": 474} {"train_loss": -19.33376121520996, "global_step": 39412, "epoch": 474} {"train_loss": -19.442564010620117, "global_step": 39413, "epoch": 474} {"train_loss": -19.50619125366211, "global_step": 39414, "epoch": 474} {"train_loss": -19.608814239501953, "global_step": 39415, "epoch": 474} {"train_loss": -19.62101173400879, "global_step": 39416, "epoch": 474} {"train_loss": -19.452085494995117, "global_step": 39417, "epoch": 474} {"train_loss": -19.367443084716797, "global_step": 39418, "epoch": 474} {"train_loss": -19.342016220092773, "global_step": 39419, "epoch": 474} {"train_loss": -19.3133487701416, "global_step": 39420, "epoch": 474} {"train_loss": -19.72346305847168, "global_step": 39421, "epoch": 474} {"train_loss": -19.361791610717773, "global_step": 39422, "epoch": 474} {"train_loss": -19.626272201538086, "global_step": 39423, "epoch": 474} {"train_loss": -19.374934460743365, "global_step": 39424, "epoch": 474, "val_loss": 6100334.5} {"train_loss": -19.126012802124023, "global_step": 39425, "epoch": 475} {"train_loss": -19.255422592163086, "global_step": 39426, "epoch": 475} {"train_loss": -19.53131675720215, "global_step": 39427, "epoch": 475} {"train_loss": -18.872831344604492, "global_step": 39428, "epoch": 475} {"train_loss": -18.837753295898438, "global_step": 39429, "epoch": 475} {"train_loss": -19.002281188964844, "global_step": 39430, "epoch": 475} {"train_loss": -18.9932804107666, "global_step": 39431, "epoch": 475} {"train_loss": -19.246137619018555, "global_step": 39432, "epoch": 475} {"train_loss": -19.40439224243164, "global_step": 39433, "epoch": 475} {"train_loss": -19.372655868530273, "global_step": 39434, "epoch": 475} {"train_loss": -19.60655975341797, "global_step": 39435, "epoch": 475} {"train_loss": -19.18625831604004, "global_step": 39436, "epoch": 475} {"train_loss": -18.91067123413086, "global_step": 39437, "epoch": 475} {"train_loss": -19.475570678710938, "global_step": 39438, "epoch": 475} {"train_loss": -19.193288803100586, "global_step": 39439, "epoch": 475} {"train_loss": -19.474817276000977, "global_step": 39440, "epoch": 475} {"train_loss": -19.73105239868164, "global_step": 39441, "epoch": 475} {"train_loss": -19.318153381347656, "global_step": 39442, "epoch": 475} {"train_loss": -19.52435302734375, "global_step": 39443, "epoch": 475} {"train_loss": -18.688669204711914, "global_step": 39444, "epoch": 475} {"train_loss": -19.17542839050293, "global_step": 39445, "epoch": 475} {"train_loss": -19.4040584564209, "global_step": 39446, "epoch": 475} {"train_loss": -19.647241592407227, "global_step": 39447, "epoch": 475} {"train_loss": -19.22548484802246, "global_step": 39448, "epoch": 475} {"train_loss": -19.51362419128418, "global_step": 39449, "epoch": 475} {"train_loss": -19.479801177978516, "global_step": 39450, "epoch": 475} {"train_loss": -19.682374954223633, "global_step": 39451, "epoch": 475} {"train_loss": -19.21779441833496, "global_step": 39452, "epoch": 475} {"train_loss": -19.680206298828125, "global_step": 39453, "epoch": 475} {"train_loss": -19.550636291503906, "global_step": 39454, "epoch": 475} {"train_loss": -19.321420669555664, "global_step": 39455, "epoch": 475} {"train_loss": -19.384990692138672, "global_step": 39456, "epoch": 475} {"train_loss": -19.474760055541992, "global_step": 39457, "epoch": 475} {"train_loss": -19.57020378112793, "global_step": 39458, "epoch": 475} {"train_loss": -19.675323486328125, "global_step": 39459, "epoch": 475} {"train_loss": -19.689098358154297, "global_step": 39460, "epoch": 475} {"train_loss": -19.171401977539062, "global_step": 39461, "epoch": 475} {"train_loss": -19.443395614624023, "global_step": 39462, "epoch": 475} {"train_loss": -19.134811401367188, "global_step": 39463, "epoch": 475} {"train_loss": -19.188894271850586, "global_step": 39464, "epoch": 475} {"train_loss": -19.50006103515625, "global_step": 39465, "epoch": 475} {"train_loss": -19.382492065429688, "global_step": 39466, "epoch": 475} {"train_loss": -19.423315048217773, "global_step": 39467, "epoch": 475} {"train_loss": -19.33257293701172, "global_step": 39468, "epoch": 475} {"train_loss": -19.624460220336914, "global_step": 39469, "epoch": 475} {"train_loss": -19.001066207885742, "global_step": 39470, "epoch": 475} {"train_loss": -19.53753089904785, "global_step": 39471, "epoch": 475} {"train_loss": -19.012256622314453, "global_step": 39472, "epoch": 475} {"train_loss": -19.152862548828125, "global_step": 39473, "epoch": 475} {"train_loss": -19.033750534057617, "global_step": 39474, "epoch": 475} {"train_loss": -19.52942657470703, "global_step": 39475, "epoch": 475} {"train_loss": -19.421167373657227, "global_step": 39476, "epoch": 475} {"train_loss": -19.17644691467285, "global_step": 39477, "epoch": 475} {"train_loss": -19.595449447631836, "global_step": 39478, "epoch": 475} {"train_loss": -19.282514572143555, "global_step": 39479, "epoch": 475} {"train_loss": -19.667112350463867, "global_step": 39480, "epoch": 475} {"train_loss": -19.597131729125977, "global_step": 39481, "epoch": 475} {"train_loss": -19.212064743041992, "global_step": 39482, "epoch": 475} {"train_loss": -19.58106231689453, "global_step": 39483, "epoch": 475} {"train_loss": -19.525236129760742, "global_step": 39484, "epoch": 475} {"train_loss": -19.380680084228516, "global_step": 39485, "epoch": 475} {"train_loss": -19.446088790893555, "global_step": 39486, "epoch": 475} {"train_loss": -18.9842472076416, "global_step": 39487, "epoch": 475} {"train_loss": -19.579904556274414, "global_step": 39488, "epoch": 475} {"train_loss": -19.641109466552734, "global_step": 39489, "epoch": 475} {"train_loss": -19.490236282348633, "global_step": 39490, "epoch": 475} {"train_loss": -19.7694149017334, "global_step": 39491, "epoch": 475} {"train_loss": -19.501977920532227, "global_step": 39492, "epoch": 475} {"train_loss": -19.412321090698242, "global_step": 39493, "epoch": 475} {"train_loss": -19.495336532592773, "global_step": 39494, "epoch": 475} {"train_loss": -19.3975887298584, "global_step": 39495, "epoch": 475} {"train_loss": -19.34403419494629, "global_step": 39496, "epoch": 475} {"train_loss": -19.624916076660156, "global_step": 39497, "epoch": 475} {"train_loss": -19.674955368041992, "global_step": 39498, "epoch": 475} {"train_loss": -19.636245727539062, "global_step": 39499, "epoch": 475} {"train_loss": -19.842159271240234, "global_step": 39500, "epoch": 475} {"train_loss": -19.506330490112305, "global_step": 39501, "epoch": 475} {"train_loss": -19.591888427734375, "global_step": 39502, "epoch": 475} {"train_loss": -19.379657745361328, "global_step": 39503, "epoch": 475} {"train_loss": -19.688602447509766, "global_step": 39504, "epoch": 475} {"train_loss": -19.51435661315918, "global_step": 39505, "epoch": 475} {"train_loss": -19.32170867919922, "global_step": 39506, "epoch": 475} {"train_loss": -19.409683342439582, "global_step": 39507, "epoch": 475, "val_loss": 6052255.5} {"train_loss": -19.191593170166016, "global_step": 39508, "epoch": 476} {"train_loss": -19.271150588989258, "global_step": 39509, "epoch": 476} {"train_loss": -19.344257354736328, "global_step": 39510, "epoch": 476} {"train_loss": -19.256467819213867, "global_step": 39511, "epoch": 476} {"train_loss": -19.798852920532227, "global_step": 39512, "epoch": 476} {"train_loss": -19.21822166442871, "global_step": 39513, "epoch": 476} {"train_loss": -19.102182388305664, "global_step": 39514, "epoch": 476} {"train_loss": -19.24123764038086, "global_step": 39515, "epoch": 476} {"train_loss": -19.173887252807617, "global_step": 39516, "epoch": 476} {"train_loss": -19.46162223815918, "global_step": 39517, "epoch": 476} {"train_loss": -19.541187286376953, "global_step": 39518, "epoch": 476} {"train_loss": -19.714574813842773, "global_step": 39519, "epoch": 476} {"train_loss": -19.1333065032959, "global_step": 39520, "epoch": 476} {"train_loss": -19.248823165893555, "global_step": 39521, "epoch": 476} {"train_loss": -19.4248046875, "global_step": 39522, "epoch": 476} {"train_loss": -19.43073844909668, "global_step": 39523, "epoch": 476} {"train_loss": -19.261844635009766, "global_step": 39524, "epoch": 476} {"train_loss": -19.29317283630371, "global_step": 39525, "epoch": 476} {"train_loss": -19.782384872436523, "global_step": 39526, "epoch": 476} {"train_loss": -19.194616317749023, "global_step": 39527, "epoch": 476} {"train_loss": -19.276382446289062, "global_step": 39528, "epoch": 476} {"train_loss": -19.689184188842773, "global_step": 39529, "epoch": 476} {"train_loss": -19.551517486572266, "global_step": 39530, "epoch": 476} {"train_loss": -19.77718734741211, "global_step": 39531, "epoch": 476} {"train_loss": -19.405424118041992, "global_step": 39532, "epoch": 476} {"train_loss": -19.08519172668457, "global_step": 39533, "epoch": 476} {"train_loss": -19.516462326049805, "global_step": 39534, "epoch": 476} {"train_loss": -19.130146026611328, "global_step": 39535, "epoch": 476} {"train_loss": -19.415678024291992, "global_step": 39536, "epoch": 476} {"train_loss": -19.364757537841797, "global_step": 39537, "epoch": 476} {"train_loss": -19.66843605041504, "global_step": 39538, "epoch": 476} {"train_loss": -19.40015983581543, "global_step": 39539, "epoch": 476} {"train_loss": -19.685171127319336, "global_step": 39540, "epoch": 476} {"train_loss": -19.40360450744629, "global_step": 39541, "epoch": 476} {"train_loss": -19.290687561035156, "global_step": 39542, "epoch": 476} {"train_loss": -19.409381866455078, "global_step": 39543, "epoch": 476} {"train_loss": -19.484519958496094, "global_step": 39544, "epoch": 476} {"train_loss": -19.133325576782227, "global_step": 39545, "epoch": 476} {"train_loss": -18.995038986206055, "global_step": 39546, "epoch": 476} {"train_loss": -19.171003341674805, "global_step": 39547, "epoch": 476} {"train_loss": -19.875932693481445, "global_step": 39548, "epoch": 476} {"train_loss": -19.786407470703125, "global_step": 39549, "epoch": 476} {"train_loss": -18.94852066040039, "global_step": 39550, "epoch": 476} {"train_loss": -19.543731689453125, "global_step": 39551, "epoch": 476} {"train_loss": -19.275117874145508, "global_step": 39552, "epoch": 476} {"train_loss": -19.640336990356445, "global_step": 39553, "epoch": 476} {"train_loss": -19.203842163085938, "global_step": 39554, "epoch": 476} {"train_loss": -19.304227828979492, "global_step": 39555, "epoch": 476} {"train_loss": -19.48427391052246, "global_step": 39556, "epoch": 476} {"train_loss": -19.38669776916504, "global_step": 39557, "epoch": 476} {"train_loss": -19.600168228149414, "global_step": 39558, "epoch": 476} {"train_loss": -19.35999298095703, "global_step": 39559, "epoch": 476} {"train_loss": -19.16888999938965, "global_step": 39560, "epoch": 476} {"train_loss": -19.480541229248047, "global_step": 39561, "epoch": 476} {"train_loss": -19.45156478881836, "global_step": 39562, "epoch": 476} {"train_loss": -19.45380210876465, "global_step": 39563, "epoch": 476} {"train_loss": -19.205480575561523, "global_step": 39564, "epoch": 476} {"train_loss": -18.98337745666504, "global_step": 39565, "epoch": 476} {"train_loss": -19.61739158630371, "global_step": 39566, "epoch": 476} {"train_loss": -19.050039291381836, "global_step": 39567, "epoch": 476} {"train_loss": -19.13693618774414, "global_step": 39568, "epoch": 476} {"train_loss": -19.424285888671875, "global_step": 39569, "epoch": 476} {"train_loss": -19.348247528076172, "global_step": 39570, "epoch": 476} {"train_loss": -19.467227935791016, "global_step": 39571, "epoch": 476} {"train_loss": -19.687707901000977, "global_step": 39572, "epoch": 476} {"train_loss": -19.722457885742188, "global_step": 39573, "epoch": 476} {"train_loss": -19.514745712280273, "global_step": 39574, "epoch": 476} {"train_loss": -19.665884017944336, "global_step": 39575, "epoch": 476} {"train_loss": -19.419485092163086, "global_step": 39576, "epoch": 476} {"train_loss": -19.446256637573242, "global_step": 39577, "epoch": 476} {"train_loss": -19.223072052001953, "global_step": 39578, "epoch": 476} {"train_loss": -19.06827163696289, "global_step": 39579, "epoch": 476} {"train_loss": -19.33785057067871, "global_step": 39580, "epoch": 476} {"train_loss": -19.620141983032227, "global_step": 39581, "epoch": 476} {"train_loss": -19.255517959594727, "global_step": 39582, "epoch": 476} {"train_loss": -19.538606643676758, "global_step": 39583, "epoch": 476} {"train_loss": -19.37653160095215, "global_step": 39584, "epoch": 476} {"train_loss": -19.657485961914062, "global_step": 39585, "epoch": 476} {"train_loss": -19.639516830444336, "global_step": 39586, "epoch": 476} {"train_loss": -19.265941619873047, "global_step": 39587, "epoch": 476} {"train_loss": -19.37809181213379, "global_step": 39588, "epoch": 476} {"train_loss": -19.29630470275879, "global_step": 39589, "epoch": 476} {"train_loss": -19.395756066563617, "global_step": 39590, "epoch": 476, "val_loss": 5974117.0} {"train_loss": -19.281396865844727, "global_step": 39591, "epoch": 477} {"train_loss": -18.781803131103516, "global_step": 39592, "epoch": 477} {"train_loss": -19.32157325744629, "global_step": 39593, "epoch": 477} {"train_loss": -19.3244686126709, "global_step": 39594, "epoch": 477} {"train_loss": -19.080076217651367, "global_step": 39595, "epoch": 477} {"train_loss": -19.261207580566406, "global_step": 39596, "epoch": 477} {"train_loss": -19.262704849243164, "global_step": 39597, "epoch": 477} {"train_loss": -19.570322036743164, "global_step": 39598, "epoch": 477} {"train_loss": -19.343732833862305, "global_step": 39599, "epoch": 477} {"train_loss": -19.477163314819336, "global_step": 39600, "epoch": 477} {"train_loss": -19.50135612487793, "global_step": 39601, "epoch": 477} {"train_loss": -19.331069946289062, "global_step": 39602, "epoch": 477} {"train_loss": -19.186967849731445, "global_step": 39603, "epoch": 477} {"train_loss": -19.273380279541016, "global_step": 39604, "epoch": 477} {"train_loss": -19.642200469970703, "global_step": 39605, "epoch": 477} {"train_loss": -19.723520278930664, "global_step": 39606, "epoch": 477} {"train_loss": -19.726757049560547, "global_step": 39607, "epoch": 477} {"train_loss": -19.127843856811523, "global_step": 39608, "epoch": 477} {"train_loss": -19.266403198242188, "global_step": 39609, "epoch": 477} {"train_loss": -19.305959701538086, "global_step": 39610, "epoch": 477} {"train_loss": -19.87993049621582, "global_step": 39611, "epoch": 477} {"train_loss": -19.4736385345459, "global_step": 39612, "epoch": 477} {"train_loss": -19.484542846679688, "global_step": 39613, "epoch": 477} {"train_loss": -19.115873336791992, "global_step": 39614, "epoch": 477} {"train_loss": -19.305810928344727, "global_step": 39615, "epoch": 477} {"train_loss": -19.162893295288086, "global_step": 39616, "epoch": 477} {"train_loss": -19.243619918823242, "global_step": 39617, "epoch": 477} {"train_loss": -19.541728973388672, "global_step": 39618, "epoch": 477} {"train_loss": -19.52081871032715, "global_step": 39619, "epoch": 477} {"train_loss": -19.319204330444336, "global_step": 39620, "epoch": 477} {"train_loss": -19.479997634887695, "global_step": 39621, "epoch": 477} {"train_loss": -19.2729549407959, "global_step": 39622, "epoch": 477} {"train_loss": -19.334318161010742, "global_step": 39623, "epoch": 477} {"train_loss": -19.233383178710938, "global_step": 39624, "epoch": 477} {"train_loss": -19.5123348236084, "global_step": 39625, "epoch": 477} {"train_loss": -19.57640266418457, "global_step": 39626, "epoch": 477} {"train_loss": -19.29623031616211, "global_step": 39627, "epoch": 477} {"train_loss": -19.312381744384766, "global_step": 39628, "epoch": 477} {"train_loss": -19.55464744567871, "global_step": 39629, "epoch": 477} {"train_loss": -19.505046844482422, "global_step": 39630, "epoch": 477} {"train_loss": -19.488460540771484, "global_step": 39631, "epoch": 477} {"train_loss": -19.523591995239258, "global_step": 39632, "epoch": 477} {"train_loss": -19.335840225219727, "global_step": 39633, "epoch": 477} {"train_loss": -19.785825729370117, "global_step": 39634, "epoch": 477} {"train_loss": -19.3779354095459, "global_step": 39635, "epoch": 477} {"train_loss": -19.43992042541504, "global_step": 39636, "epoch": 477} {"train_loss": -19.21249771118164, "global_step": 39637, "epoch": 477} {"train_loss": -19.415266036987305, "global_step": 39638, "epoch": 477} {"train_loss": -19.512121200561523, "global_step": 39639, "epoch": 477} {"train_loss": -19.59615135192871, "global_step": 39640, "epoch": 477} {"train_loss": -19.040485382080078, "global_step": 39641, "epoch": 477} {"train_loss": -19.427244186401367, "global_step": 39642, "epoch": 477} {"train_loss": -19.471487045288086, "global_step": 39643, "epoch": 477} {"train_loss": -18.973670959472656, "global_step": 39644, "epoch": 477} {"train_loss": -19.55762481689453, "global_step": 39645, "epoch": 477} {"train_loss": -19.072019577026367, "global_step": 39646, "epoch": 477} {"train_loss": -19.154254913330078, "global_step": 39647, "epoch": 477} {"train_loss": -19.642072677612305, "global_step": 39648, "epoch": 477} {"train_loss": -19.373477935791016, "global_step": 39649, "epoch": 477} {"train_loss": -19.660236358642578, "global_step": 39650, "epoch": 477} {"train_loss": -19.40606117248535, "global_step": 39651, "epoch": 477} {"train_loss": -19.526803970336914, "global_step": 39652, "epoch": 477} {"train_loss": -19.554454803466797, "global_step": 39653, "epoch": 477} {"train_loss": -19.563711166381836, "global_step": 39654, "epoch": 477} {"train_loss": -19.666500091552734, "global_step": 39655, "epoch": 477} {"train_loss": -19.478185653686523, "global_step": 39656, "epoch": 477} {"train_loss": -19.451372146606445, "global_step": 39657, "epoch": 477} {"train_loss": -19.482091903686523, "global_step": 39658, "epoch": 477} {"train_loss": -19.54207420349121, "global_step": 39659, "epoch": 477} {"train_loss": -19.272565841674805, "global_step": 39660, "epoch": 477} {"train_loss": -19.549718856811523, "global_step": 39661, "epoch": 477} {"train_loss": -19.720285415649414, "global_step": 39662, "epoch": 477} {"train_loss": -19.431196212768555, "global_step": 39663, "epoch": 477} {"train_loss": -19.177988052368164, "global_step": 39664, "epoch": 477} {"train_loss": -19.582059860229492, "global_step": 39665, "epoch": 477} {"train_loss": -19.760284423828125, "global_step": 39666, "epoch": 477} {"train_loss": -19.446847915649414, "global_step": 39667, "epoch": 477} {"train_loss": -19.350610733032227, "global_step": 39668, "epoch": 477} {"train_loss": -19.60512351989746, "global_step": 39669, "epoch": 477} {"train_loss": -19.535703659057617, "global_step": 39670, "epoch": 477} {"train_loss": -19.448816299438477, "global_step": 39671, "epoch": 477} {"train_loss": -19.0986385345459, "global_step": 39672, "epoch": 477} {"train_loss": -19.41560030558023, "global_step": 39673, "epoch": 477, "val_loss": 5804911.0} {"train_loss": -18.551359176635742, "global_step": 39674, "epoch": 478} {"train_loss": -19.264928817749023, "global_step": 39675, "epoch": 478} {"train_loss": -18.70075035095215, "global_step": 39676, "epoch": 478} {"train_loss": -19.061059951782227, "global_step": 39677, "epoch": 478} {"train_loss": -19.40632438659668, "global_step": 39678, "epoch": 478} {"train_loss": -19.047021865844727, "global_step": 39679, "epoch": 478} {"train_loss": -19.38516616821289, "global_step": 39680, "epoch": 478} {"train_loss": -19.463518142700195, "global_step": 39681, "epoch": 478} {"train_loss": -19.52426528930664, "global_step": 39682, "epoch": 478} {"train_loss": -19.064199447631836, "global_step": 39683, "epoch": 478} {"train_loss": -19.38219451904297, "global_step": 39684, "epoch": 478} {"train_loss": -19.585811614990234, "global_step": 39685, "epoch": 478} {"train_loss": -19.60882568359375, "global_step": 39686, "epoch": 478} {"train_loss": -19.29275131225586, "global_step": 39687, "epoch": 478} {"train_loss": -19.523466110229492, "global_step": 39688, "epoch": 478} {"train_loss": -19.338171005249023, "global_step": 39689, "epoch": 478} {"train_loss": -19.34187126159668, "global_step": 39690, "epoch": 478} {"train_loss": -19.494794845581055, "global_step": 39691, "epoch": 478} {"train_loss": -19.622486114501953, "global_step": 39692, "epoch": 478} {"train_loss": -19.218917846679688, "global_step": 39693, "epoch": 478} {"train_loss": -19.29094696044922, "global_step": 39694, "epoch": 478} {"train_loss": -19.18657112121582, "global_step": 39695, "epoch": 478} {"train_loss": -19.34845733642578, "global_step": 39696, "epoch": 478} {"train_loss": -19.45238494873047, "global_step": 39697, "epoch": 478} {"train_loss": -19.159862518310547, "global_step": 39698, "epoch": 478} {"train_loss": -19.43730926513672, "global_step": 39699, "epoch": 478} {"train_loss": -19.331945419311523, "global_step": 39700, "epoch": 478} {"train_loss": -19.234037399291992, "global_step": 39701, "epoch": 478} {"train_loss": -19.55433464050293, "global_step": 39702, "epoch": 478} {"train_loss": -19.687803268432617, "global_step": 39703, "epoch": 478} {"train_loss": -19.44129180908203, "global_step": 39704, "epoch": 478} {"train_loss": -19.388608932495117, "global_step": 39705, "epoch": 478} {"train_loss": -19.57086753845215, "global_step": 39706, "epoch": 478} {"train_loss": -19.376617431640625, "global_step": 39707, "epoch": 478} {"train_loss": -19.521121978759766, "global_step": 39708, "epoch": 478} {"train_loss": -19.32868766784668, "global_step": 39709, "epoch": 478} {"train_loss": -19.361026763916016, "global_step": 39710, "epoch": 478} {"train_loss": -19.70790672302246, "global_step": 39711, "epoch": 478} {"train_loss": -19.078611373901367, "global_step": 39712, "epoch": 478} {"train_loss": -19.252262115478516, "global_step": 39713, "epoch": 478} {"train_loss": -19.3907413482666, "global_step": 39714, "epoch": 478} {"train_loss": -19.14460563659668, "global_step": 39715, "epoch": 478} {"train_loss": -19.772504806518555, "global_step": 39716, "epoch": 478} {"train_loss": -19.287946701049805, "global_step": 39717, "epoch": 478} {"train_loss": -19.59183120727539, "global_step": 39718, "epoch": 478} {"train_loss": -19.406585693359375, "global_step": 39719, "epoch": 478} {"train_loss": -19.618349075317383, "global_step": 39720, "epoch": 478} {"train_loss": -19.56984519958496, "global_step": 39721, "epoch": 478} {"train_loss": -19.227365493774414, "global_step": 39722, "epoch": 478} {"train_loss": -19.3367919921875, "global_step": 39723, "epoch": 478} {"train_loss": -19.453811645507812, "global_step": 39724, "epoch": 478} {"train_loss": -19.220083236694336, "global_step": 39725, "epoch": 478} {"train_loss": -19.553924560546875, "global_step": 39726, "epoch": 478} {"train_loss": -19.697824478149414, "global_step": 39727, "epoch": 478} {"train_loss": -19.76102638244629, "global_step": 39728, "epoch": 478} {"train_loss": -19.54401206970215, "global_step": 39729, "epoch": 478} {"train_loss": -19.555606842041016, "global_step": 39730, "epoch": 478} {"train_loss": -19.50419807434082, "global_step": 39731, "epoch": 478} {"train_loss": -19.58966827392578, "global_step": 39732, "epoch": 478} {"train_loss": -19.352951049804688, "global_step": 39733, "epoch": 478} {"train_loss": -19.250288009643555, "global_step": 39734, "epoch": 478} {"train_loss": -19.23140525817871, "global_step": 39735, "epoch": 478} {"train_loss": -19.585861206054688, "global_step": 39736, "epoch": 478} {"train_loss": -19.25509262084961, "global_step": 39737, "epoch": 478} {"train_loss": -19.209257125854492, "global_step": 39738, "epoch": 478} {"train_loss": -19.22492027282715, "global_step": 39739, "epoch": 478} {"train_loss": -19.54487419128418, "global_step": 39740, "epoch": 478} {"train_loss": -19.567264556884766, "global_step": 39741, "epoch": 478} {"train_loss": -19.32858657836914, "global_step": 39742, "epoch": 478} {"train_loss": -19.136075973510742, "global_step": 39743, "epoch": 478} {"train_loss": -19.39575958251953, "global_step": 39744, "epoch": 478} {"train_loss": -19.175386428833008, "global_step": 39745, "epoch": 478} {"train_loss": -19.553672790527344, "global_step": 39746, "epoch": 478} {"train_loss": -19.35700798034668, "global_step": 39747, "epoch": 478} {"train_loss": -19.143774032592773, "global_step": 39748, "epoch": 478} {"train_loss": -19.477741241455078, "global_step": 39749, "epoch": 478} {"train_loss": -19.68848991394043, "global_step": 39750, "epoch": 478} {"train_loss": -19.391027450561523, "global_step": 39751, "epoch": 478} {"train_loss": -19.070188522338867, "global_step": 39752, "epoch": 478} {"train_loss": -19.31837272644043, "global_step": 39753, "epoch": 478} {"train_loss": -19.952157974243164, "global_step": 39754, "epoch": 478} {"train_loss": -19.293540954589844, "global_step": 39755, "epoch": 478} {"train_loss": -19.386405048600164, "global_step": 39756, "epoch": 478, "val_loss": 6029935.5} {"train_loss": -19.347158432006836, "global_step": 39757, "epoch": 479} {"train_loss": -19.068021774291992, "global_step": 39758, "epoch": 479} {"train_loss": -19.0476131439209, "global_step": 39759, "epoch": 479} {"train_loss": -19.22761344909668, "global_step": 39760, "epoch": 479} {"train_loss": -19.384567260742188, "global_step": 39761, "epoch": 479} {"train_loss": -19.519819259643555, "global_step": 39762, "epoch": 479} {"train_loss": -19.01984977722168, "global_step": 39763, "epoch": 479} {"train_loss": -18.997467041015625, "global_step": 39764, "epoch": 479} {"train_loss": -19.310359954833984, "global_step": 39765, "epoch": 479} {"train_loss": -19.508779525756836, "global_step": 39766, "epoch": 479} {"train_loss": -19.296833038330078, "global_step": 39767, "epoch": 479} {"train_loss": -19.00795555114746, "global_step": 39768, "epoch": 479} {"train_loss": -19.175500869750977, "global_step": 39769, "epoch": 479} {"train_loss": -19.587982177734375, "global_step": 39770, "epoch": 479} {"train_loss": -19.051023483276367, "global_step": 39771, "epoch": 479} {"train_loss": -19.471332550048828, "global_step": 39772, "epoch": 479} {"train_loss": -19.174131393432617, "global_step": 39773, "epoch": 479} {"train_loss": -19.79923439025879, "global_step": 39774, "epoch": 479} {"train_loss": -19.629568099975586, "global_step": 39775, "epoch": 479} {"train_loss": -19.369617462158203, "global_step": 39776, "epoch": 479} {"train_loss": -19.676294326782227, "global_step": 39777, "epoch": 479} {"train_loss": -19.762237548828125, "global_step": 39778, "epoch": 479} {"train_loss": -19.83047866821289, "global_step": 39779, "epoch": 479} {"train_loss": -19.54408836364746, "global_step": 39780, "epoch": 479} {"train_loss": -19.664146423339844, "global_step": 39781, "epoch": 479} {"train_loss": -19.368967056274414, "global_step": 39782, "epoch": 479} {"train_loss": -19.1616268157959, "global_step": 39783, "epoch": 479} {"train_loss": -19.227434158325195, "global_step": 39784, "epoch": 479} {"train_loss": -19.214282989501953, "global_step": 39785, "epoch": 479} {"train_loss": -19.744356155395508, "global_step": 39786, "epoch": 479} {"train_loss": -19.36539077758789, "global_step": 39787, "epoch": 479} {"train_loss": -19.769805908203125, "global_step": 39788, "epoch": 479} {"train_loss": -19.151376724243164, "global_step": 39789, "epoch": 479} {"train_loss": -19.454378128051758, "global_step": 39790, "epoch": 479} {"train_loss": -19.08492088317871, "global_step": 39791, "epoch": 479} {"train_loss": -19.737102508544922, "global_step": 39792, "epoch": 479} {"train_loss": -19.310178756713867, "global_step": 39793, "epoch": 479} {"train_loss": -19.489898681640625, "global_step": 39794, "epoch": 479} {"train_loss": -20.13300132751465, "global_step": 39795, "epoch": 479} {"train_loss": -19.560312271118164, "global_step": 39796, "epoch": 479} {"train_loss": -19.414461135864258, "global_step": 39797, "epoch": 479} {"train_loss": -19.60886001586914, "global_step": 39798, "epoch": 479} {"train_loss": -19.12091827392578, "global_step": 39799, "epoch": 479} {"train_loss": -20.126916885375977, "global_step": 39800, "epoch": 479} {"train_loss": -19.42962646484375, "global_step": 39801, "epoch": 479} {"train_loss": -19.080957412719727, "global_step": 39802, "epoch": 479} {"train_loss": -19.373395919799805, "global_step": 39803, "epoch": 479} {"train_loss": -18.91058349609375, "global_step": 39804, "epoch": 479} {"train_loss": -19.27972984313965, "global_step": 39805, "epoch": 479} {"train_loss": -19.296085357666016, "global_step": 39806, "epoch": 479} {"train_loss": -19.29598617553711, "global_step": 39807, "epoch": 479} {"train_loss": -19.638202667236328, "global_step": 39808, "epoch": 479} {"train_loss": -19.410953521728516, "global_step": 39809, "epoch": 479} {"train_loss": -19.43585205078125, "global_step": 39810, "epoch": 479} {"train_loss": -19.57718849182129, "global_step": 39811, "epoch": 479} {"train_loss": -19.334104537963867, "global_step": 39812, "epoch": 479} {"train_loss": -19.492719650268555, "global_step": 39813, "epoch": 479} {"train_loss": -19.191543579101562, "global_step": 39814, "epoch": 479} {"train_loss": -19.408668518066406, "global_step": 39815, "epoch": 479} {"train_loss": -18.805166244506836, "global_step": 39816, "epoch": 479} {"train_loss": -19.160505294799805, "global_step": 39817, "epoch": 479} {"train_loss": -19.10499382019043, "global_step": 39818, "epoch": 479} {"train_loss": -19.34446144104004, "global_step": 39819, "epoch": 479} {"train_loss": -19.479801177978516, "global_step": 39820, "epoch": 479} {"train_loss": -19.273178100585938, "global_step": 39821, "epoch": 479} {"train_loss": -19.022180557250977, "global_step": 39822, "epoch": 479} {"train_loss": -19.49934959411621, "global_step": 39823, "epoch": 479} {"train_loss": -19.39252281188965, "global_step": 39824, "epoch": 479} {"train_loss": -19.33243751525879, "global_step": 39825, "epoch": 479} {"train_loss": -19.72491455078125, "global_step": 39826, "epoch": 479} {"train_loss": -19.321142196655273, "global_step": 39827, "epoch": 479} {"train_loss": -19.7935791015625, "global_step": 39828, "epoch": 479} {"train_loss": -19.57305335998535, "global_step": 39829, "epoch": 479} {"train_loss": -19.198654174804688, "global_step": 39830, "epoch": 479} {"train_loss": -19.042577743530273, "global_step": 39831, "epoch": 479} {"train_loss": -19.674955368041992, "global_step": 39832, "epoch": 479} {"train_loss": -19.315610885620117, "global_step": 39833, "epoch": 479} {"train_loss": -19.157276153564453, "global_step": 39834, "epoch": 479} {"train_loss": -19.253713607788086, "global_step": 39835, "epoch": 479} {"train_loss": -19.538419723510742, "global_step": 39836, "epoch": 479} {"train_loss": -19.675024032592773, "global_step": 39837, "epoch": 479} {"train_loss": -19.550973892211914, "global_step": 39838, "epoch": 479} {"train_loss": -19.391800960862493, "global_step": 39839, "epoch": 479, "val_loss": 6090901.0} {"train_loss": -19.41400146484375, "global_step": 39840, "epoch": 480} {"train_loss": -19.22271728515625, "global_step": 39841, "epoch": 480} {"train_loss": -19.524009704589844, "global_step": 39842, "epoch": 480} {"train_loss": -19.05051040649414, "global_step": 39843, "epoch": 480} {"train_loss": -19.508060455322266, "global_step": 39844, "epoch": 480} {"train_loss": -19.58817481994629, "global_step": 39845, "epoch": 480} {"train_loss": -19.31290054321289, "global_step": 39846, "epoch": 480} {"train_loss": -19.47694206237793, "global_step": 39847, "epoch": 480} {"train_loss": -19.205984115600586, "global_step": 39848, "epoch": 480} {"train_loss": -19.628366470336914, "global_step": 39849, "epoch": 480} {"train_loss": -19.189441680908203, "global_step": 39850, "epoch": 480} {"train_loss": -19.585224151611328, "global_step": 39851, "epoch": 480} {"train_loss": -19.677541732788086, "global_step": 39852, "epoch": 480} {"train_loss": -19.523588180541992, "global_step": 39853, "epoch": 480} {"train_loss": -19.649831771850586, "global_step": 39854, "epoch": 480} {"train_loss": -19.24653434753418, "global_step": 39855, "epoch": 480} {"train_loss": -19.275808334350586, "global_step": 39856, "epoch": 480} {"train_loss": -19.3082275390625, "global_step": 39857, "epoch": 480} {"train_loss": -19.318668365478516, "global_step": 39858, "epoch": 480} {"train_loss": -19.701784133911133, "global_step": 39859, "epoch": 480} {"train_loss": -19.48700714111328, "global_step": 39860, "epoch": 480} {"train_loss": -19.64581298828125, "global_step": 39861, "epoch": 480} {"train_loss": -19.212148666381836, "global_step": 39862, "epoch": 480} {"train_loss": -19.549909591674805, "global_step": 39863, "epoch": 480} {"train_loss": -19.450132369995117, "global_step": 39864, "epoch": 480} {"train_loss": -19.564212799072266, "global_step": 39865, "epoch": 480} {"train_loss": -19.25236701965332, "global_step": 39866, "epoch": 480} {"train_loss": -19.1640625, "global_step": 39867, "epoch": 480} {"train_loss": -19.465476989746094, "global_step": 39868, "epoch": 480} {"train_loss": -19.34375762939453, "global_step": 39869, "epoch": 480} {"train_loss": -19.746963500976562, "global_step": 39870, "epoch": 480} {"train_loss": -19.21952247619629, "global_step": 39871, "epoch": 480} {"train_loss": -19.499921798706055, "global_step": 39872, "epoch": 480} {"train_loss": -19.405723571777344, "global_step": 39873, "epoch": 480} {"train_loss": -19.461130142211914, "global_step": 39874, "epoch": 480} {"train_loss": -19.356470108032227, "global_step": 39875, "epoch": 480} {"train_loss": -19.333953857421875, "global_step": 39876, "epoch": 480} {"train_loss": -19.46539878845215, "global_step": 39877, "epoch": 480} {"train_loss": -19.796306610107422, "global_step": 39878, "epoch": 480} {"train_loss": -19.444461822509766, "global_step": 39879, "epoch": 480} {"train_loss": -19.4835147857666, "global_step": 39880, "epoch": 480} {"train_loss": -19.55706214904785, "global_step": 39881, "epoch": 480} {"train_loss": -19.27051544189453, "global_step": 39882, "epoch": 480} {"train_loss": -19.661245346069336, "global_step": 39883, "epoch": 480} {"train_loss": -19.511571884155273, "global_step": 39884, "epoch": 480} {"train_loss": -19.55885124206543, "global_step": 39885, "epoch": 480} {"train_loss": -19.61134910583496, "global_step": 39886, "epoch": 480} {"train_loss": -18.778005599975586, "global_step": 39887, "epoch": 480} {"train_loss": -19.729190826416016, "global_step": 39888, "epoch": 480} {"train_loss": -19.351926803588867, "global_step": 39889, "epoch": 480} {"train_loss": -19.73577880859375, "global_step": 39890, "epoch": 480} {"train_loss": -19.243946075439453, "global_step": 39891, "epoch": 480} {"train_loss": -19.244449615478516, "global_step": 39892, "epoch": 480} {"train_loss": -19.794279098510742, "global_step": 39893, "epoch": 480} {"train_loss": -19.501224517822266, "global_step": 39894, "epoch": 480} {"train_loss": -19.060117721557617, "global_step": 39895, "epoch": 480} {"train_loss": -19.28517723083496, "global_step": 39896, "epoch": 480} {"train_loss": -19.255306243896484, "global_step": 39897, "epoch": 480} {"train_loss": -19.068525314331055, "global_step": 39898, "epoch": 480} {"train_loss": -19.35630226135254, "global_step": 39899, "epoch": 480} {"train_loss": -19.380037307739258, "global_step": 39900, "epoch": 480} {"train_loss": -19.40924644470215, "global_step": 39901, "epoch": 480} {"train_loss": -19.351938247680664, "global_step": 39902, "epoch": 480} {"train_loss": -19.51650047302246, "global_step": 39903, "epoch": 480} {"train_loss": -19.330982208251953, "global_step": 39904, "epoch": 480} {"train_loss": -19.29204750061035, "global_step": 39905, "epoch": 480} {"train_loss": -19.60259437561035, "global_step": 39906, "epoch": 480} {"train_loss": -19.499858856201172, "global_step": 39907, "epoch": 480} {"train_loss": -19.633670806884766, "global_step": 39908, "epoch": 480} {"train_loss": -19.42176628112793, "global_step": 39909, "epoch": 480} {"train_loss": -19.215858459472656, "global_step": 39910, "epoch": 480} {"train_loss": -20.000680923461914, "global_step": 39911, "epoch": 480} {"train_loss": -19.77461051940918, "global_step": 39912, "epoch": 480} {"train_loss": -19.563194274902344, "global_step": 39913, "epoch": 480} {"train_loss": -19.73924446105957, "global_step": 39914, "epoch": 480} {"train_loss": -19.39676284790039, "global_step": 39915, "epoch": 480} {"train_loss": -19.619688034057617, "global_step": 39916, "epoch": 480} {"train_loss": -19.496002197265625, "global_step": 39917, "epoch": 480} {"train_loss": -19.347320556640625, "global_step": 39918, "epoch": 480} {"train_loss": -19.747331619262695, "global_step": 39919, "epoch": 480} {"train_loss": -19.585142135620117, "global_step": 39920, "epoch": 480} {"train_loss": -19.352930068969727, "global_step": 39921, "epoch": 480} {"train_loss": -19.459521925593, "global_step": 39922, "epoch": 480, "val_loss": 5976908.0} {"train_loss": -19.043214797973633, "global_step": 39923, "epoch": 481} {"train_loss": -19.153457641601562, "global_step": 39924, "epoch": 481} {"train_loss": -19.14190101623535, "global_step": 39925, "epoch": 481} {"train_loss": -19.24952507019043, "global_step": 39926, "epoch": 481} {"train_loss": -18.801477432250977, "global_step": 39927, "epoch": 481} {"train_loss": -19.09815788269043, "global_step": 39928, "epoch": 481} {"train_loss": -19.676219940185547, "global_step": 39929, "epoch": 481} {"train_loss": -19.126150131225586, "global_step": 39930, "epoch": 481} {"train_loss": -19.47711753845215, "global_step": 39931, "epoch": 481} {"train_loss": -19.234941482543945, "global_step": 39932, "epoch": 481} {"train_loss": -18.982709884643555, "global_step": 39933, "epoch": 481} {"train_loss": -19.192026138305664, "global_step": 39934, "epoch": 481} {"train_loss": -19.351573944091797, "global_step": 39935, "epoch": 481} {"train_loss": -19.318340301513672, "global_step": 39936, "epoch": 481} {"train_loss": -19.7857666015625, "global_step": 39937, "epoch": 481} {"train_loss": -19.480310440063477, "global_step": 39938, "epoch": 481} {"train_loss": -19.286352157592773, "global_step": 39939, "epoch": 481} {"train_loss": -19.486364364624023, "global_step": 39940, "epoch": 481} {"train_loss": -19.451597213745117, "global_step": 39941, "epoch": 481} {"train_loss": -19.364667892456055, "global_step": 39942, "epoch": 481} {"train_loss": -19.77680206298828, "global_step": 39943, "epoch": 481} {"train_loss": -19.65289306640625, "global_step": 39944, "epoch": 481} {"train_loss": -19.424739837646484, "global_step": 39945, "epoch": 481} {"train_loss": -19.385622024536133, "global_step": 39946, "epoch": 481} {"train_loss": -19.401504516601562, "global_step": 39947, "epoch": 481} {"train_loss": -19.23968505859375, "global_step": 39948, "epoch": 481} {"train_loss": -19.088266372680664, "global_step": 39949, "epoch": 481} {"train_loss": -19.133424758911133, "global_step": 39950, "epoch": 481} {"train_loss": -19.385812759399414, "global_step": 39951, "epoch": 481} {"train_loss": -19.856725692749023, "global_step": 39952, "epoch": 481} {"train_loss": -19.01503562927246, "global_step": 39953, "epoch": 481} {"train_loss": -19.340961456298828, "global_step": 39954, "epoch": 481} {"train_loss": -19.195144653320312, "global_step": 39955, "epoch": 481} {"train_loss": -19.68992805480957, "global_step": 39956, "epoch": 481} {"train_loss": -19.680618286132812, "global_step": 39957, "epoch": 481} {"train_loss": -19.2699031829834, "global_step": 39958, "epoch": 481} {"train_loss": -19.59160804748535, "global_step": 39959, "epoch": 481} {"train_loss": -19.023740768432617, "global_step": 39960, "epoch": 481} {"train_loss": -19.428516387939453, "global_step": 39961, "epoch": 481} {"train_loss": -19.543821334838867, "global_step": 39962, "epoch": 481} {"train_loss": -19.251220703125, "global_step": 39963, "epoch": 481} {"train_loss": -19.395977020263672, "global_step": 39964, "epoch": 481} {"train_loss": -19.86396598815918, "global_step": 39965, "epoch": 481} {"train_loss": -19.40666961669922, "global_step": 39966, "epoch": 481} {"train_loss": -19.387596130371094, "global_step": 39967, "epoch": 481} {"train_loss": -19.49226951599121, "global_step": 39968, "epoch": 481} {"train_loss": -19.17734718322754, "global_step": 39969, "epoch": 481} {"train_loss": -19.76698112487793, "global_step": 39970, "epoch": 481} {"train_loss": -19.529821395874023, "global_step": 39971, "epoch": 481} {"train_loss": -19.536340713500977, "global_step": 39972, "epoch": 481} {"train_loss": -19.470218658447266, "global_step": 39973, "epoch": 481} {"train_loss": -19.24216651916504, "global_step": 39974, "epoch": 481} {"train_loss": -19.342323303222656, "global_step": 39975, "epoch": 481} {"train_loss": -19.526575088500977, "global_step": 39976, "epoch": 481} {"train_loss": -19.501188278198242, "global_step": 39977, "epoch": 481} {"train_loss": -19.206329345703125, "global_step": 39978, "epoch": 481} {"train_loss": -19.494104385375977, "global_step": 39979, "epoch": 481} {"train_loss": -18.98110580444336, "global_step": 39980, "epoch": 481} {"train_loss": -19.591388702392578, "global_step": 39981, "epoch": 481} {"train_loss": -19.584735870361328, "global_step": 39982, "epoch": 481} {"train_loss": -19.660282135009766, "global_step": 39983, "epoch": 481} {"train_loss": -18.958921432495117, "global_step": 39984, "epoch": 481} {"train_loss": -19.768747329711914, "global_step": 39985, "epoch": 481} {"train_loss": -19.453201293945312, "global_step": 39986, "epoch": 481} {"train_loss": -19.3905086517334, "global_step": 39987, "epoch": 481} {"train_loss": -19.39832305908203, "global_step": 39988, "epoch": 481} {"train_loss": -19.712209701538086, "global_step": 39989, "epoch": 481} {"train_loss": -19.25908660888672, "global_step": 39990, "epoch": 481} {"train_loss": -19.574813842773438, "global_step": 39991, "epoch": 481} {"train_loss": -19.36112403869629, "global_step": 39992, "epoch": 481} {"train_loss": -19.275800704956055, "global_step": 39993, "epoch": 481} {"train_loss": -19.459171295166016, "global_step": 39994, "epoch": 481} {"train_loss": -19.471899032592773, "global_step": 39995, "epoch": 481} {"train_loss": -19.698331832885742, "global_step": 39996, "epoch": 481} {"train_loss": -19.246530532836914, "global_step": 39997, "epoch": 481} {"train_loss": -19.399564743041992, "global_step": 39998, "epoch": 481} {"train_loss": -19.55529022216797, "global_step": 39999, "epoch": 481} {"train_loss": -19.30429458618164, "global_step": 40000, "epoch": 481} {"train_loss": -19.616514205932617, "global_step": 40001, "epoch": 481} {"train_loss": -19.62308120727539, "global_step": 40002, "epoch": 481} {"train_loss": -19.4373779296875, "global_step": 40003, "epoch": 481} {"train_loss": -19.5030574798584, "global_step": 40004, "epoch": 481} {"train_loss": -19.362641139202807, "global_step": 40005, "epoch": 481, "val_loss": 5928002.5} {"train_loss": -19.631399154663086, "global_step": 40006, "epoch": 482} {"train_loss": -19.19237518310547, "global_step": 40007, "epoch": 482} {"train_loss": -19.44525146484375, "global_step": 40008, "epoch": 482} {"train_loss": -19.301538467407227, "global_step": 40009, "epoch": 482} {"train_loss": -19.23419189453125, "global_step": 40010, "epoch": 482} {"train_loss": -19.33893394470215, "global_step": 40011, "epoch": 482} {"train_loss": -19.278762817382812, "global_step": 40012, "epoch": 482} {"train_loss": -19.448822021484375, "global_step": 40013, "epoch": 482} {"train_loss": -19.492198944091797, "global_step": 40014, "epoch": 482} {"train_loss": -19.405437469482422, "global_step": 40015, "epoch": 482} {"train_loss": -19.394819259643555, "global_step": 40016, "epoch": 482} {"train_loss": -19.55945587158203, "global_step": 40017, "epoch": 482} {"train_loss": -19.380422592163086, "global_step": 40018, "epoch": 482} {"train_loss": -19.64545249938965, "global_step": 40019, "epoch": 482} {"train_loss": -19.27459144592285, "global_step": 40020, "epoch": 482} {"train_loss": -19.81353187561035, "global_step": 40021, "epoch": 482} {"train_loss": -19.356948852539062, "global_step": 40022, "epoch": 482} {"train_loss": -19.543315887451172, "global_step": 40023, "epoch": 482} {"train_loss": -19.321388244628906, "global_step": 40024, "epoch": 482} {"train_loss": -19.334829330444336, "global_step": 40025, "epoch": 482} {"train_loss": -19.501596450805664, "global_step": 40026, "epoch": 482} {"train_loss": -19.42856788635254, "global_step": 40027, "epoch": 482} {"train_loss": -19.434253692626953, "global_step": 40028, "epoch": 482} {"train_loss": -19.411439895629883, "global_step": 40029, "epoch": 482} {"train_loss": -19.42329216003418, "global_step": 40030, "epoch": 482} {"train_loss": -19.20172882080078, "global_step": 40031, "epoch": 482} {"train_loss": -19.203664779663086, "global_step": 40032, "epoch": 482} {"train_loss": -19.309572219848633, "global_step": 40033, "epoch": 482} {"train_loss": -19.188730239868164, "global_step": 40034, "epoch": 482} {"train_loss": -18.840295791625977, "global_step": 40035, "epoch": 482} {"train_loss": -19.773569107055664, "global_step": 40036, "epoch": 482} {"train_loss": -19.15862464904785, "global_step": 40037, "epoch": 482} {"train_loss": -19.159011840820312, "global_step": 40038, "epoch": 482} {"train_loss": -19.361614227294922, "global_step": 40039, "epoch": 482} {"train_loss": -19.317886352539062, "global_step": 40040, "epoch": 482} {"train_loss": -19.677934646606445, "global_step": 40041, "epoch": 482} {"train_loss": -19.434125900268555, "global_step": 40042, "epoch": 482} {"train_loss": -19.384214401245117, "global_step": 40043, "epoch": 482} {"train_loss": -19.5403995513916, "global_step": 40044, "epoch": 482} {"train_loss": -19.901020050048828, "global_step": 40045, "epoch": 482} {"train_loss": -19.363218307495117, "global_step": 40046, "epoch": 482} {"train_loss": -19.091323852539062, "global_step": 40047, "epoch": 482} {"train_loss": -19.251554489135742, "global_step": 40048, "epoch": 482} {"train_loss": -19.432003021240234, "global_step": 40049, "epoch": 482} {"train_loss": -19.385311126708984, "global_step": 40050, "epoch": 482} {"train_loss": -19.308393478393555, "global_step": 40051, "epoch": 482} {"train_loss": -19.282543182373047, "global_step": 40052, "epoch": 482} {"train_loss": -19.710111618041992, "global_step": 40053, "epoch": 482} {"train_loss": -19.153493881225586, "global_step": 40054, "epoch": 482} {"train_loss": -19.396671295166016, "global_step": 40055, "epoch": 482} {"train_loss": -19.529876708984375, "global_step": 40056, "epoch": 482} {"train_loss": -19.640283584594727, "global_step": 40057, "epoch": 482} {"train_loss": -19.226484298706055, "global_step": 40058, "epoch": 482} {"train_loss": -19.536779403686523, "global_step": 40059, "epoch": 482} {"train_loss": -19.42513656616211, "global_step": 40060, "epoch": 482} {"train_loss": -19.605810165405273, "global_step": 40061, "epoch": 482} {"train_loss": -19.50311851501465, "global_step": 40062, "epoch": 482} {"train_loss": -19.23685646057129, "global_step": 40063, "epoch": 482} {"train_loss": -19.52182388305664, "global_step": 40064, "epoch": 482} {"train_loss": -19.5244140625, "global_step": 40065, "epoch": 482} {"train_loss": -19.573339462280273, "global_step": 40066, "epoch": 482} {"train_loss": -19.34990119934082, "global_step": 40067, "epoch": 482} {"train_loss": -19.337453842163086, "global_step": 40068, "epoch": 482} {"train_loss": -19.222766876220703, "global_step": 40069, "epoch": 482} {"train_loss": -19.269132614135742, "global_step": 40070, "epoch": 482} {"train_loss": -19.633384704589844, "global_step": 40071, "epoch": 482} {"train_loss": -19.401935577392578, "global_step": 40072, "epoch": 482} {"train_loss": -20.034154891967773, "global_step": 40073, "epoch": 482} {"train_loss": -19.80775260925293, "global_step": 40074, "epoch": 482} {"train_loss": -19.80879783630371, "global_step": 40075, "epoch": 482} {"train_loss": -19.43987464904785, "global_step": 40076, "epoch": 482} {"train_loss": -19.533891677856445, "global_step": 40077, "epoch": 482} {"train_loss": -19.700782775878906, "global_step": 40078, "epoch": 482} {"train_loss": -19.398035049438477, "global_step": 40079, "epoch": 482} {"train_loss": -19.46693992614746, "global_step": 40080, "epoch": 482} {"train_loss": -19.519643783569336, "global_step": 40081, "epoch": 482} {"train_loss": -19.3978328704834, "global_step": 40082, "epoch": 482} {"train_loss": -19.3748779296875, "global_step": 40083, "epoch": 482} {"train_loss": -19.236135482788086, "global_step": 40084, "epoch": 482} {"train_loss": -19.54860496520996, "global_step": 40085, "epoch": 482} {"train_loss": -19.076324462890625, "global_step": 40086, "epoch": 482} {"train_loss": -19.533220291137695, "global_step": 40087, "epoch": 482} {"train_loss": -19.45398505337267, "global_step": 40088, "epoch": 482, "val_loss": 5922580.5} {"train_loss": -19.50337791442871, "global_step": 40089, "epoch": 483} {"train_loss": -19.632041931152344, "global_step": 40090, "epoch": 483} {"train_loss": -19.143896102905273, "global_step": 40091, "epoch": 483} {"train_loss": -19.155309677124023, "global_step": 40092, "epoch": 483} {"train_loss": -19.320077896118164, "global_step": 40093, "epoch": 483} {"train_loss": -19.45267677307129, "global_step": 40094, "epoch": 483} {"train_loss": -19.443849563598633, "global_step": 40095, "epoch": 483} {"train_loss": -19.214242935180664, "global_step": 40096, "epoch": 483} {"train_loss": -19.006071090698242, "global_step": 40097, "epoch": 483} {"train_loss": -18.8125, "global_step": 40098, "epoch": 483} {"train_loss": -19.32217025756836, "global_step": 40099, "epoch": 483} {"train_loss": -19.206689834594727, "global_step": 40100, "epoch": 483} {"train_loss": -19.111486434936523, "global_step": 40101, "epoch": 483} {"train_loss": -19.50370216369629, "global_step": 40102, "epoch": 483} {"train_loss": -19.159406661987305, "global_step": 40103, "epoch": 483} {"train_loss": -19.320560455322266, "global_step": 40104, "epoch": 483} {"train_loss": -19.646244049072266, "global_step": 40105, "epoch": 483} {"train_loss": -19.4023380279541, "global_step": 40106, "epoch": 483} {"train_loss": -19.223356246948242, "global_step": 40107, "epoch": 483} {"train_loss": -19.542484283447266, "global_step": 40108, "epoch": 483} {"train_loss": -19.47480583190918, "global_step": 40109, "epoch": 483} {"train_loss": -19.173643112182617, "global_step": 40110, "epoch": 483} {"train_loss": -19.024364471435547, "global_step": 40111, "epoch": 483} {"train_loss": -19.146759033203125, "global_step": 40112, "epoch": 483} {"train_loss": -19.34291648864746, "global_step": 40113, "epoch": 483} {"train_loss": -19.46632957458496, "global_step": 40114, "epoch": 483} {"train_loss": -19.49420928955078, "global_step": 40115, "epoch": 483} {"train_loss": -19.289878845214844, "global_step": 40116, "epoch": 483} {"train_loss": -19.36126136779785, "global_step": 40117, "epoch": 483} {"train_loss": -19.629858016967773, "global_step": 40118, "epoch": 483} {"train_loss": -19.0202693939209, "global_step": 40119, "epoch": 483} {"train_loss": -19.434494018554688, "global_step": 40120, "epoch": 483} {"train_loss": -19.388431549072266, "global_step": 40121, "epoch": 483} {"train_loss": -19.309003829956055, "global_step": 40122, "epoch": 483} {"train_loss": -19.135984420776367, "global_step": 40123, "epoch": 483} {"train_loss": -19.519418716430664, "global_step": 40124, "epoch": 483} {"train_loss": -19.021657943725586, "global_step": 40125, "epoch": 483} {"train_loss": -19.445457458496094, "global_step": 40126, "epoch": 483} {"train_loss": -18.97475242614746, "global_step": 40127, "epoch": 483} {"train_loss": -19.509607315063477, "global_step": 40128, "epoch": 483} {"train_loss": -19.597585678100586, "global_step": 40129, "epoch": 483} {"train_loss": -19.335418701171875, "global_step": 40130, "epoch": 483} {"train_loss": -19.1429500579834, "global_step": 40131, "epoch": 483} {"train_loss": -19.267498016357422, "global_step": 40132, "epoch": 483} {"train_loss": -19.563034057617188, "global_step": 40133, "epoch": 483} {"train_loss": -19.4091739654541, "global_step": 40134, "epoch": 483} {"train_loss": -19.443174362182617, "global_step": 40135, "epoch": 483} {"train_loss": -19.138574600219727, "global_step": 40136, "epoch": 483} {"train_loss": -19.58608627319336, "global_step": 40137, "epoch": 483} {"train_loss": -19.376148223876953, "global_step": 40138, "epoch": 483} {"train_loss": -19.576902389526367, "global_step": 40139, "epoch": 483} {"train_loss": -19.3118896484375, "global_step": 40140, "epoch": 483} {"train_loss": -19.520341873168945, "global_step": 40141, "epoch": 483} {"train_loss": -19.8588809967041, "global_step": 40142, "epoch": 483} {"train_loss": -19.340818405151367, "global_step": 40143, "epoch": 483} {"train_loss": -19.415449142456055, "global_step": 40144, "epoch": 483} {"train_loss": -19.4385929107666, "global_step": 40145, "epoch": 483} {"train_loss": -19.5135555267334, "global_step": 40146, "epoch": 483} {"train_loss": -19.483806610107422, "global_step": 40147, "epoch": 483} {"train_loss": -19.380023956298828, "global_step": 40148, "epoch": 483} {"train_loss": -19.277353286743164, "global_step": 40149, "epoch": 483} {"train_loss": -19.50259017944336, "global_step": 40150, "epoch": 483} {"train_loss": -19.511497497558594, "global_step": 40151, "epoch": 483} {"train_loss": -19.22024917602539, "global_step": 40152, "epoch": 483} {"train_loss": -19.639265060424805, "global_step": 40153, "epoch": 483} {"train_loss": -19.674224853515625, "global_step": 40154, "epoch": 483} {"train_loss": -19.461896896362305, "global_step": 40155, "epoch": 483} {"train_loss": -19.555118560791016, "global_step": 40156, "epoch": 483} {"train_loss": -19.486286163330078, "global_step": 40157, "epoch": 483} {"train_loss": -19.683210372924805, "global_step": 40158, "epoch": 483} {"train_loss": -19.558765411376953, "global_step": 40159, "epoch": 483} {"train_loss": -19.360334396362305, "global_step": 40160, "epoch": 483} {"train_loss": -19.714736938476562, "global_step": 40161, "epoch": 483} {"train_loss": -19.696455001831055, "global_step": 40162, "epoch": 483} {"train_loss": -19.529142379760742, "global_step": 40163, "epoch": 483} {"train_loss": -19.133678436279297, "global_step": 40164, "epoch": 483} {"train_loss": -19.398603439331055, "global_step": 40165, "epoch": 483} {"train_loss": -19.371761322021484, "global_step": 40166, "epoch": 483} {"train_loss": -19.465896606445312, "global_step": 40167, "epoch": 483} {"train_loss": -19.422348022460938, "global_step": 40168, "epoch": 483} {"train_loss": -19.38271141052246, "global_step": 40169, "epoch": 483} {"train_loss": -19.549970626831055, "global_step": 40170, "epoch": 483} {"train_loss": -19.378473075039416, "global_step": 40171, "epoch": 483, "val_loss": 6080784.5} {"train_loss": -19.43964958190918, "global_step": 40172, "epoch": 484} {"train_loss": -19.26935386657715, "global_step": 40173, "epoch": 484} {"train_loss": -19.572986602783203, "global_step": 40174, "epoch": 484} {"train_loss": -18.532081604003906, "global_step": 40175, "epoch": 484} {"train_loss": -19.797941207885742, "global_step": 40176, "epoch": 484} {"train_loss": -19.346649169921875, "global_step": 40177, "epoch": 484} {"train_loss": -19.206878662109375, "global_step": 40178, "epoch": 484} {"train_loss": -19.095035552978516, "global_step": 40179, "epoch": 484} {"train_loss": -19.49960708618164, "global_step": 40180, "epoch": 484} {"train_loss": -19.22199058532715, "global_step": 40181, "epoch": 484} {"train_loss": -19.469379425048828, "global_step": 40182, "epoch": 484} {"train_loss": -19.290822982788086, "global_step": 40183, "epoch": 484} {"train_loss": -19.321855545043945, "global_step": 40184, "epoch": 484} {"train_loss": -19.552608489990234, "global_step": 40185, "epoch": 484} {"train_loss": -19.54774284362793, "global_step": 40186, "epoch": 484} {"train_loss": -19.39952850341797, "global_step": 40187, "epoch": 484} {"train_loss": -19.338098526000977, "global_step": 40188, "epoch": 484} {"train_loss": -19.61956214904785, "global_step": 40189, "epoch": 484} {"train_loss": -19.86444664001465, "global_step": 40190, "epoch": 484} {"train_loss": -19.5885066986084, "global_step": 40191, "epoch": 484} {"train_loss": -19.572673797607422, "global_step": 40192, "epoch": 484} {"train_loss": -19.35051918029785, "global_step": 40193, "epoch": 484} {"train_loss": -19.677762985229492, "global_step": 40194, "epoch": 484} {"train_loss": -19.465513229370117, "global_step": 40195, "epoch": 484} {"train_loss": -19.730894088745117, "global_step": 40196, "epoch": 484} {"train_loss": -19.36275291442871, "global_step": 40197, "epoch": 484} {"train_loss": -19.692676544189453, "global_step": 40198, "epoch": 484} {"train_loss": -19.481901168823242, "global_step": 40199, "epoch": 484} {"train_loss": -19.648832321166992, "global_step": 40200, "epoch": 484} {"train_loss": -19.618669509887695, "global_step": 40201, "epoch": 484} {"train_loss": -19.526548385620117, "global_step": 40202, "epoch": 484} {"train_loss": -19.770992279052734, "global_step": 40203, "epoch": 484} {"train_loss": -19.389768600463867, "global_step": 40204, "epoch": 484} {"train_loss": -19.318891525268555, "global_step": 40205, "epoch": 484} {"train_loss": -19.00994873046875, "global_step": 40206, "epoch": 484} {"train_loss": -19.524253845214844, "global_step": 40207, "epoch": 484} {"train_loss": -19.5523681640625, "global_step": 40208, "epoch": 484} {"train_loss": -19.42755699157715, "global_step": 40209, "epoch": 484} {"train_loss": -19.722442626953125, "global_step": 40210, "epoch": 484} {"train_loss": -19.453527450561523, "global_step": 40211, "epoch": 484} {"train_loss": -19.435394287109375, "global_step": 40212, "epoch": 484} {"train_loss": -19.348188400268555, "global_step": 40213, "epoch": 484} {"train_loss": -19.316177368164062, "global_step": 40214, "epoch": 484} {"train_loss": -19.683181762695312, "global_step": 40215, "epoch": 484} {"train_loss": -19.686288833618164, "global_step": 40216, "epoch": 484} {"train_loss": -19.549009323120117, "global_step": 40217, "epoch": 484} {"train_loss": -19.105438232421875, "global_step": 40218, "epoch": 484} {"train_loss": -19.254150390625, "global_step": 40219, "epoch": 484} {"train_loss": -19.743432998657227, "global_step": 40220, "epoch": 484} {"train_loss": -19.257055282592773, "global_step": 40221, "epoch": 484} {"train_loss": -19.58069610595703, "global_step": 40222, "epoch": 484} {"train_loss": -19.48821449279785, "global_step": 40223, "epoch": 484} {"train_loss": -19.43681526184082, "global_step": 40224, "epoch": 484} {"train_loss": -19.592472076416016, "global_step": 40225, "epoch": 484} {"train_loss": -19.53464126586914, "global_step": 40226, "epoch": 484} {"train_loss": -19.248485565185547, "global_step": 40227, "epoch": 484} {"train_loss": -19.671951293945312, "global_step": 40228, "epoch": 484} {"train_loss": -19.44496726989746, "global_step": 40229, "epoch": 484} {"train_loss": -19.230255126953125, "global_step": 40230, "epoch": 484} {"train_loss": -19.59236717224121, "global_step": 40231, "epoch": 484} {"train_loss": -19.341428756713867, "global_step": 40232, "epoch": 484} {"train_loss": -19.554166793823242, "global_step": 40233, "epoch": 484} {"train_loss": -19.355640411376953, "global_step": 40234, "epoch": 484} {"train_loss": -19.49639129638672, "global_step": 40235, "epoch": 484} {"train_loss": -19.044477462768555, "global_step": 40236, "epoch": 484} {"train_loss": -19.774412155151367, "global_step": 40237, "epoch": 484} {"train_loss": -19.514476776123047, "global_step": 40238, "epoch": 484} {"train_loss": -19.49740219116211, "global_step": 40239, "epoch": 484} {"train_loss": -19.155622482299805, "global_step": 40240, "epoch": 484} {"train_loss": -19.530364990234375, "global_step": 40241, "epoch": 484} {"train_loss": -19.315961837768555, "global_step": 40242, "epoch": 484} {"train_loss": -19.31667137145996, "global_step": 40243, "epoch": 484} {"train_loss": -19.7164306640625, "global_step": 40244, "epoch": 484} {"train_loss": -19.57245445251465, "global_step": 40245, "epoch": 484} {"train_loss": -19.417936325073242, "global_step": 40246, "epoch": 484} {"train_loss": -19.55059814453125, "global_step": 40247, "epoch": 484} {"train_loss": -19.64617156982422, "global_step": 40248, "epoch": 484} {"train_loss": -19.789936065673828, "global_step": 40249, "epoch": 484} {"train_loss": -19.603147506713867, "global_step": 40250, "epoch": 484} {"train_loss": -19.378210067749023, "global_step": 40251, "epoch": 484} {"train_loss": -19.580286026000977, "global_step": 40252, "epoch": 484} {"train_loss": -19.292638778686523, "global_step": 40253, "epoch": 484} {"train_loss": -19.47365195492664, "global_step": 40254, "epoch": 484, "val_loss": 5920959.0} {"train_loss": -19.338483810424805, "global_step": 40255, "epoch": 485} {"train_loss": -19.518741607666016, "global_step": 40256, "epoch": 485} {"train_loss": -19.215938568115234, "global_step": 40257, "epoch": 485} {"train_loss": -19.597190856933594, "global_step": 40258, "epoch": 485} {"train_loss": -19.56203269958496, "global_step": 40259, "epoch": 485} {"train_loss": -19.540075302124023, "global_step": 40260, "epoch": 485} {"train_loss": -19.548049926757812, "global_step": 40261, "epoch": 485} {"train_loss": -19.2176570892334, "global_step": 40262, "epoch": 485} {"train_loss": -19.420560836791992, "global_step": 40263, "epoch": 485} {"train_loss": -19.35624122619629, "global_step": 40264, "epoch": 485} {"train_loss": -19.300153732299805, "global_step": 40265, "epoch": 485} {"train_loss": -19.560565948486328, "global_step": 40266, "epoch": 485} {"train_loss": -19.278783798217773, "global_step": 40267, "epoch": 485} {"train_loss": -19.5993709564209, "global_step": 40268, "epoch": 485} {"train_loss": -19.605819702148438, "global_step": 40269, "epoch": 485} {"train_loss": -19.464506149291992, "global_step": 40270, "epoch": 485} {"train_loss": -19.34592628479004, "global_step": 40271, "epoch": 485} {"train_loss": -19.64630699157715, "global_step": 40272, "epoch": 485} {"train_loss": -19.558176040649414, "global_step": 40273, "epoch": 485} {"train_loss": -19.5178279876709, "global_step": 40274, "epoch": 485} {"train_loss": -19.633270263671875, "global_step": 40275, "epoch": 485} {"train_loss": -19.212736129760742, "global_step": 40276, "epoch": 485} {"train_loss": -19.3846378326416, "global_step": 40277, "epoch": 485} {"train_loss": -19.80690574645996, "global_step": 40278, "epoch": 485} {"train_loss": -19.652912139892578, "global_step": 40279, "epoch": 485} {"train_loss": -19.776193618774414, "global_step": 40280, "epoch": 485} {"train_loss": -19.62431526184082, "global_step": 40281, "epoch": 485} {"train_loss": -19.346521377563477, "global_step": 40282, "epoch": 485} {"train_loss": -19.670297622680664, "global_step": 40283, "epoch": 485} {"train_loss": -19.750940322875977, "global_step": 40284, "epoch": 485} {"train_loss": -19.498910903930664, "global_step": 40285, "epoch": 485} {"train_loss": -19.415197372436523, "global_step": 40286, "epoch": 485} {"train_loss": -19.15788459777832, "global_step": 40287, "epoch": 485} {"train_loss": -19.606754302978516, "global_step": 40288, "epoch": 485} {"train_loss": -19.058923721313477, "global_step": 40289, "epoch": 485} {"train_loss": -19.49249267578125, "global_step": 40290, "epoch": 485} {"train_loss": -19.670974731445312, "global_step": 40291, "epoch": 485} {"train_loss": -19.575307846069336, "global_step": 40292, "epoch": 485} {"train_loss": -19.481130599975586, "global_step": 40293, "epoch": 485} {"train_loss": -19.252635955810547, "global_step": 40294, "epoch": 485} {"train_loss": -19.417524337768555, "global_step": 40295, "epoch": 485} {"train_loss": -19.255643844604492, "global_step": 40296, "epoch": 485} {"train_loss": -19.353918075561523, "global_step": 40297, "epoch": 485} {"train_loss": -19.636594772338867, "global_step": 40298, "epoch": 485} {"train_loss": -19.412805557250977, "global_step": 40299, "epoch": 485} {"train_loss": -19.48636817932129, "global_step": 40300, "epoch": 485} {"train_loss": -19.716772079467773, "global_step": 40301, "epoch": 485} {"train_loss": -19.630329132080078, "global_step": 40302, "epoch": 485} {"train_loss": -19.600276947021484, "global_step": 40303, "epoch": 485} {"train_loss": -19.46567726135254, "global_step": 40304, "epoch": 485} {"train_loss": -19.531131744384766, "global_step": 40305, "epoch": 485} {"train_loss": -19.365768432617188, "global_step": 40306, "epoch": 485} {"train_loss": -19.100217819213867, "global_step": 40307, "epoch": 485} {"train_loss": -19.104324340820312, "global_step": 40308, "epoch": 485} {"train_loss": -19.78338050842285, "global_step": 40309, "epoch": 485} {"train_loss": -19.442279815673828, "global_step": 40310, "epoch": 485} {"train_loss": -19.48373794555664, "global_step": 40311, "epoch": 485} {"train_loss": -19.21115493774414, "global_step": 40312, "epoch": 485} {"train_loss": -19.449995040893555, "global_step": 40313, "epoch": 485} {"train_loss": -19.34031105041504, "global_step": 40314, "epoch": 485} {"train_loss": -19.739667892456055, "global_step": 40315, "epoch": 485} {"train_loss": -19.374465942382812, "global_step": 40316, "epoch": 485} {"train_loss": -19.36222267150879, "global_step": 40317, "epoch": 485} {"train_loss": -19.495670318603516, "global_step": 40318, "epoch": 485} {"train_loss": -19.377105712890625, "global_step": 40319, "epoch": 485} {"train_loss": -19.732168197631836, "global_step": 40320, "epoch": 485} {"train_loss": -19.6186580657959, "global_step": 40321, "epoch": 485} {"train_loss": -19.16611671447754, "global_step": 40322, "epoch": 485} {"train_loss": -19.420190811157227, "global_step": 40323, "epoch": 485} {"train_loss": -19.592594146728516, "global_step": 40324, "epoch": 485} {"train_loss": -19.576730728149414, "global_step": 40325, "epoch": 485} {"train_loss": -19.437976837158203, "global_step": 40326, "epoch": 485} {"train_loss": -19.57485008239746, "global_step": 40327, "epoch": 485} {"train_loss": -19.487548828125, "global_step": 40328, "epoch": 485} {"train_loss": -19.26569938659668, "global_step": 40329, "epoch": 485} {"train_loss": -19.239892959594727, "global_step": 40330, "epoch": 485} {"train_loss": -19.217819213867188, "global_step": 40331, "epoch": 485} {"train_loss": -19.581815719604492, "global_step": 40332, "epoch": 485} {"train_loss": -19.12578773498535, "global_step": 40333, "epoch": 485} {"train_loss": -19.67579460144043, "global_step": 40334, "epoch": 485} {"train_loss": -18.924650192260742, "global_step": 40335, "epoch": 485} {"train_loss": -19.249801635742188, "global_step": 40336, "epoch": 485} {"train_loss": -19.46491436785962, "global_step": 40337, "epoch": 485, "val_loss": 5949461.0} {"train_loss": -19.557775497436523, "global_step": 40338, "epoch": 486} {"train_loss": -19.65614891052246, "global_step": 40339, "epoch": 486} {"train_loss": -19.91628074645996, "global_step": 40340, "epoch": 486} {"train_loss": -19.501693725585938, "global_step": 40341, "epoch": 486} {"train_loss": -19.068395614624023, "global_step": 40342, "epoch": 486} {"train_loss": -19.36695671081543, "global_step": 40343, "epoch": 486} {"train_loss": -19.217330932617188, "global_step": 40344, "epoch": 486} {"train_loss": -19.154449462890625, "global_step": 40345, "epoch": 486} {"train_loss": -19.42519187927246, "global_step": 40346, "epoch": 486} {"train_loss": -19.17633819580078, "global_step": 40347, "epoch": 486} {"train_loss": -19.67976188659668, "global_step": 40348, "epoch": 486} {"train_loss": -19.18037223815918, "global_step": 40349, "epoch": 486} {"train_loss": -19.756603240966797, "global_step": 40350, "epoch": 486} {"train_loss": -18.734020233154297, "global_step": 40351, "epoch": 486} {"train_loss": -19.025285720825195, "global_step": 40352, "epoch": 486} {"train_loss": -19.533777236938477, "global_step": 40353, "epoch": 486} {"train_loss": -19.342514038085938, "global_step": 40354, "epoch": 486} {"train_loss": -19.431427001953125, "global_step": 40355, "epoch": 486} {"train_loss": -19.539213180541992, "global_step": 40356, "epoch": 486} {"train_loss": -19.415813446044922, "global_step": 40357, "epoch": 486} {"train_loss": -19.778003692626953, "global_step": 40358, "epoch": 486} {"train_loss": -19.333200454711914, "global_step": 40359, "epoch": 486} {"train_loss": -19.46035385131836, "global_step": 40360, "epoch": 486} {"train_loss": -19.636388778686523, "global_step": 40361, "epoch": 486} {"train_loss": -19.38136100769043, "global_step": 40362, "epoch": 486} {"train_loss": -19.678335189819336, "global_step": 40363, "epoch": 486} {"train_loss": -19.50796890258789, "global_step": 40364, "epoch": 486} {"train_loss": -19.604583740234375, "global_step": 40365, "epoch": 486} {"train_loss": -19.36482810974121, "global_step": 40366, "epoch": 486} {"train_loss": -19.912233352661133, "global_step": 40367, "epoch": 486} {"train_loss": -19.287906646728516, "global_step": 40368, "epoch": 486} {"train_loss": -19.684680938720703, "global_step": 40369, "epoch": 486} {"train_loss": -19.52973175048828, "global_step": 40370, "epoch": 486} {"train_loss": -19.436264038085938, "global_step": 40371, "epoch": 486} {"train_loss": -18.875659942626953, "global_step": 40372, "epoch": 486} {"train_loss": -19.91355323791504, "global_step": 40373, "epoch": 486} {"train_loss": -19.75835609436035, "global_step": 40374, "epoch": 486} {"train_loss": -19.543859481811523, "global_step": 40375, "epoch": 486} {"train_loss": -19.826318740844727, "global_step": 40376, "epoch": 486} {"train_loss": -19.181259155273438, "global_step": 40377, "epoch": 486} {"train_loss": -19.257905960083008, "global_step": 40378, "epoch": 486} {"train_loss": -19.624048233032227, "global_step": 40379, "epoch": 486} {"train_loss": -19.687997817993164, "global_step": 40380, "epoch": 486} {"train_loss": -19.4934024810791, "global_step": 40381, "epoch": 486} {"train_loss": -19.59388542175293, "global_step": 40382, "epoch": 486} {"train_loss": -19.839284896850586, "global_step": 40383, "epoch": 486} {"train_loss": -19.383319854736328, "global_step": 40384, "epoch": 486} {"train_loss": -19.855756759643555, "global_step": 40385, "epoch": 486} {"train_loss": -19.716276168823242, "global_step": 40386, "epoch": 486} {"train_loss": -19.741214752197266, "global_step": 40387, "epoch": 486} {"train_loss": -19.961122512817383, "global_step": 40388, "epoch": 486} {"train_loss": -19.862165451049805, "global_step": 40389, "epoch": 486} {"train_loss": -19.25148582458496, "global_step": 40390, "epoch": 486} {"train_loss": -19.698471069335938, "global_step": 40391, "epoch": 486} {"train_loss": -19.570938110351562, "global_step": 40392, "epoch": 486} {"train_loss": -19.564538955688477, "global_step": 40393, "epoch": 486} {"train_loss": -19.43729019165039, "global_step": 40394, "epoch": 486} {"train_loss": -19.548337936401367, "global_step": 40395, "epoch": 486} {"train_loss": -19.084945678710938, "global_step": 40396, "epoch": 486} {"train_loss": -19.3939266204834, "global_step": 40397, "epoch": 486} {"train_loss": -19.437591552734375, "global_step": 40398, "epoch": 486} {"train_loss": -19.65884780883789, "global_step": 40399, "epoch": 486} {"train_loss": -19.6607666015625, "global_step": 40400, "epoch": 486} {"train_loss": -19.673368453979492, "global_step": 40401, "epoch": 486} {"train_loss": -19.455814361572266, "global_step": 40402, "epoch": 486} {"train_loss": -19.806455612182617, "global_step": 40403, "epoch": 486} {"train_loss": -19.5332088470459, "global_step": 40404, "epoch": 486} {"train_loss": -19.554433822631836, "global_step": 40405, "epoch": 486} {"train_loss": -19.317581176757812, "global_step": 40406, "epoch": 486} {"train_loss": -19.50019073486328, "global_step": 40407, "epoch": 486} {"train_loss": -19.320470809936523, "global_step": 40408, "epoch": 486} {"train_loss": -19.59600257873535, "global_step": 40409, "epoch": 486} {"train_loss": -19.408422470092773, "global_step": 40410, "epoch": 486} {"train_loss": -19.6044921875, "global_step": 40411, "epoch": 486} {"train_loss": -19.03639030456543, "global_step": 40412, "epoch": 486} {"train_loss": -19.27558708190918, "global_step": 40413, "epoch": 486} {"train_loss": -19.383026123046875, "global_step": 40414, "epoch": 486} {"train_loss": -19.19614028930664, "global_step": 40415, "epoch": 486} {"train_loss": -19.353654861450195, "global_step": 40416, "epoch": 486} {"train_loss": -19.465396881103516, "global_step": 40417, "epoch": 486} {"train_loss": -19.321378707885742, "global_step": 40418, "epoch": 486} {"train_loss": -19.3353214263916, "global_step": 40419, "epoch": 486} {"train_loss": -19.481390321111103, "global_step": 40420, "epoch": 486, "val_loss": 5950524.0} {"train_loss": -19.77496910095215, "global_step": 40421, "epoch": 487} {"train_loss": -19.413419723510742, "global_step": 40422, "epoch": 487} {"train_loss": -19.61639976501465, "global_step": 40423, "epoch": 487} {"train_loss": -19.443241119384766, "global_step": 40424, "epoch": 487} {"train_loss": -19.494155883789062, "global_step": 40425, "epoch": 487} {"train_loss": -19.982481002807617, "global_step": 40426, "epoch": 487} {"train_loss": -19.5667667388916, "global_step": 40427, "epoch": 487} {"train_loss": -19.561098098754883, "global_step": 40428, "epoch": 487} {"train_loss": -19.46918487548828, "global_step": 40429, "epoch": 487} {"train_loss": -19.301254272460938, "global_step": 40430, "epoch": 487} {"train_loss": -19.60506248474121, "global_step": 40431, "epoch": 487} {"train_loss": -19.10880470275879, "global_step": 40432, "epoch": 487} {"train_loss": -19.664230346679688, "global_step": 40433, "epoch": 487} {"train_loss": -19.65651512145996, "global_step": 40434, "epoch": 487} {"train_loss": -19.441692352294922, "global_step": 40435, "epoch": 487} {"train_loss": -19.37404441833496, "global_step": 40436, "epoch": 487} {"train_loss": -19.458999633789062, "global_step": 40437, "epoch": 487} {"train_loss": -19.90264320373535, "global_step": 40438, "epoch": 487} {"train_loss": -19.915550231933594, "global_step": 40439, "epoch": 487} {"train_loss": -19.326425552368164, "global_step": 40440, "epoch": 487} {"train_loss": -19.826162338256836, "global_step": 40441, "epoch": 487} {"train_loss": -19.615203857421875, "global_step": 40442, "epoch": 487} {"train_loss": -19.257484436035156, "global_step": 40443, "epoch": 487} {"train_loss": -19.139917373657227, "global_step": 40444, "epoch": 487} {"train_loss": -19.73080825805664, "global_step": 40445, "epoch": 487} {"train_loss": -19.030046463012695, "global_step": 40446, "epoch": 487} {"train_loss": -19.89370346069336, "global_step": 40447, "epoch": 487} {"train_loss": -19.529037475585938, "global_step": 40448, "epoch": 487} {"train_loss": -19.347009658813477, "global_step": 40449, "epoch": 487} {"train_loss": -19.39100456237793, "global_step": 40450, "epoch": 487} {"train_loss": -19.268171310424805, "global_step": 40451, "epoch": 487} {"train_loss": -19.49493980407715, "global_step": 40452, "epoch": 487} {"train_loss": -19.531511306762695, "global_step": 40453, "epoch": 487} {"train_loss": -19.534406661987305, "global_step": 40454, "epoch": 487} {"train_loss": -19.280750274658203, "global_step": 40455, "epoch": 487} {"train_loss": -19.406850814819336, "global_step": 40456, "epoch": 487} {"train_loss": -19.471588134765625, "global_step": 40457, "epoch": 487} {"train_loss": -19.34553337097168, "global_step": 40458, "epoch": 487} {"train_loss": -19.444961547851562, "global_step": 40459, "epoch": 487} {"train_loss": -19.691818237304688, "global_step": 40460, "epoch": 487} {"train_loss": -19.109663009643555, "global_step": 40461, "epoch": 487} {"train_loss": -19.271066665649414, "global_step": 40462, "epoch": 487} {"train_loss": -19.644203186035156, "global_step": 40463, "epoch": 487} {"train_loss": -19.110803604125977, "global_step": 40464, "epoch": 487} {"train_loss": -19.07429313659668, "global_step": 40465, "epoch": 487} {"train_loss": -19.861860275268555, "global_step": 40466, "epoch": 487} {"train_loss": -19.522106170654297, "global_step": 40467, "epoch": 487} {"train_loss": -19.357635498046875, "global_step": 40468, "epoch": 487} {"train_loss": -19.700265884399414, "global_step": 40469, "epoch": 487} {"train_loss": -19.315488815307617, "global_step": 40470, "epoch": 487} {"train_loss": -19.657541275024414, "global_step": 40471, "epoch": 487} {"train_loss": -19.572547912597656, "global_step": 40472, "epoch": 487} {"train_loss": -19.4979305267334, "global_step": 40473, "epoch": 487} {"train_loss": -19.347156524658203, "global_step": 40474, "epoch": 487} {"train_loss": -19.25733757019043, "global_step": 40475, "epoch": 487} {"train_loss": -19.815778732299805, "global_step": 40476, "epoch": 487} {"train_loss": -19.774900436401367, "global_step": 40477, "epoch": 487} {"train_loss": -19.527362823486328, "global_step": 40478, "epoch": 487} {"train_loss": -19.268075942993164, "global_step": 40479, "epoch": 487} {"train_loss": -19.758203506469727, "global_step": 40480, "epoch": 487} {"train_loss": -19.30635643005371, "global_step": 40481, "epoch": 487} {"train_loss": -19.954086303710938, "global_step": 40482, "epoch": 487} {"train_loss": -19.528722763061523, "global_step": 40483, "epoch": 487} {"train_loss": -19.605770111083984, "global_step": 40484, "epoch": 487} {"train_loss": -19.31195640563965, "global_step": 40485, "epoch": 487} {"train_loss": -19.045751571655273, "global_step": 40486, "epoch": 487} {"train_loss": -19.529022216796875, "global_step": 40487, "epoch": 487} {"train_loss": -19.501222610473633, "global_step": 40488, "epoch": 487} {"train_loss": -19.443937301635742, "global_step": 40489, "epoch": 487} {"train_loss": -19.859546661376953, "global_step": 40490, "epoch": 487} {"train_loss": -19.490360260009766, "global_step": 40491, "epoch": 487} {"train_loss": -19.300704956054688, "global_step": 40492, "epoch": 487} {"train_loss": -19.499374389648438, "global_step": 40493, "epoch": 487} {"train_loss": -19.186674118041992, "global_step": 40494, "epoch": 487} {"train_loss": -18.983932495117188, "global_step": 40495, "epoch": 487} {"train_loss": -19.538558959960938, "global_step": 40496, "epoch": 487} {"train_loss": -19.434417724609375, "global_step": 40497, "epoch": 487} {"train_loss": -19.7830867767334, "global_step": 40498, "epoch": 487} {"train_loss": -19.420654296875, "global_step": 40499, "epoch": 487} {"train_loss": -19.79235076904297, "global_step": 40500, "epoch": 487} {"train_loss": -19.51185417175293, "global_step": 40501, "epoch": 487} {"train_loss": -19.649555206298828, "global_step": 40502, "epoch": 487} {"train_loss": -19.496138055640532, "global_step": 40503, "epoch": 487, "val_loss": 5986276.0} {"train_loss": -19.503141403198242, "global_step": 40504, "epoch": 488} {"train_loss": -19.07706069946289, "global_step": 40505, "epoch": 488} {"train_loss": -19.33121109008789, "global_step": 40506, "epoch": 488} {"train_loss": -19.56318473815918, "global_step": 40507, "epoch": 488} {"train_loss": -19.084779739379883, "global_step": 40508, "epoch": 488} {"train_loss": -19.16741943359375, "global_step": 40509, "epoch": 488} {"train_loss": -19.547754287719727, "global_step": 40510, "epoch": 488} {"train_loss": -19.486316680908203, "global_step": 40511, "epoch": 488} {"train_loss": -19.974760055541992, "global_step": 40512, "epoch": 488} {"train_loss": -19.41230583190918, "global_step": 40513, "epoch": 488} {"train_loss": -19.351213455200195, "global_step": 40514, "epoch": 488} {"train_loss": -19.576261520385742, "global_step": 40515, "epoch": 488} {"train_loss": -19.367368698120117, "global_step": 40516, "epoch": 488} {"train_loss": -19.19670295715332, "global_step": 40517, "epoch": 488} {"train_loss": -19.483121871948242, "global_step": 40518, "epoch": 488} {"train_loss": -19.56719970703125, "global_step": 40519, "epoch": 488} {"train_loss": -19.405567169189453, "global_step": 40520, "epoch": 488} {"train_loss": -19.060956954956055, "global_step": 40521, "epoch": 488} {"train_loss": -19.321216583251953, "global_step": 40522, "epoch": 488} {"train_loss": -19.566614151000977, "global_step": 40523, "epoch": 488} {"train_loss": -19.595539093017578, "global_step": 40524, "epoch": 488} {"train_loss": -19.333911895751953, "global_step": 40525, "epoch": 488} {"train_loss": -19.392135620117188, "global_step": 40526, "epoch": 488} {"train_loss": -19.72261619567871, "global_step": 40527, "epoch": 488} {"train_loss": -19.27444076538086, "global_step": 40528, "epoch": 488} {"train_loss": -19.667428970336914, "global_step": 40529, "epoch": 488} {"train_loss": -19.296489715576172, "global_step": 40530, "epoch": 488} {"train_loss": -19.2940673828125, "global_step": 40531, "epoch": 488} {"train_loss": -19.370756149291992, "global_step": 40532, "epoch": 488} {"train_loss": -19.603857040405273, "global_step": 40533, "epoch": 488} {"train_loss": -19.541004180908203, "global_step": 40534, "epoch": 488} {"train_loss": -19.438474655151367, "global_step": 40535, "epoch": 488} {"train_loss": -19.245241165161133, "global_step": 40536, "epoch": 488} {"train_loss": -19.54397964477539, "global_step": 40537, "epoch": 488} {"train_loss": -19.578563690185547, "global_step": 40538, "epoch": 488} {"train_loss": -19.2274227142334, "global_step": 40539, "epoch": 488} {"train_loss": -19.295503616333008, "global_step": 40540, "epoch": 488} {"train_loss": -19.52445411682129, "global_step": 40541, "epoch": 488} {"train_loss": -19.35993003845215, "global_step": 40542, "epoch": 488} {"train_loss": -19.5752010345459, "global_step": 40543, "epoch": 488} {"train_loss": -19.57230567932129, "global_step": 40544, "epoch": 488} {"train_loss": -19.369359970092773, "global_step": 40545, "epoch": 488} {"train_loss": -19.408178329467773, "global_step": 40546, "epoch": 488} {"train_loss": -19.441570281982422, "global_step": 40547, "epoch": 488} {"train_loss": -18.91583824157715, "global_step": 40548, "epoch": 488} {"train_loss": -19.60162353515625, "global_step": 40549, "epoch": 488} {"train_loss": -19.50465965270996, "global_step": 40550, "epoch": 488} {"train_loss": -19.584150314331055, "global_step": 40551, "epoch": 488} {"train_loss": -19.562740325927734, "global_step": 40552, "epoch": 488} {"train_loss": -19.778419494628906, "global_step": 40553, "epoch": 488} {"train_loss": -19.57826805114746, "global_step": 40554, "epoch": 488} {"train_loss": -19.052093505859375, "global_step": 40555, "epoch": 488} {"train_loss": -19.021533966064453, "global_step": 40556, "epoch": 488} {"train_loss": -19.469390869140625, "global_step": 40557, "epoch": 488} {"train_loss": -19.66949462890625, "global_step": 40558, "epoch": 488} {"train_loss": -19.234323501586914, "global_step": 40559, "epoch": 488} {"train_loss": -19.16275405883789, "global_step": 40560, "epoch": 488} {"train_loss": -19.445459365844727, "global_step": 40561, "epoch": 488} {"train_loss": -19.53359603881836, "global_step": 40562, "epoch": 488} {"train_loss": -19.004377365112305, "global_step": 40563, "epoch": 488} {"train_loss": -19.430200576782227, "global_step": 40564, "epoch": 488} {"train_loss": -19.966602325439453, "global_step": 40565, "epoch": 488} {"train_loss": -19.829771041870117, "global_step": 40566, "epoch": 488} {"train_loss": -19.99005126953125, "global_step": 40567, "epoch": 488} {"train_loss": -19.471155166625977, "global_step": 40568, "epoch": 488} {"train_loss": -19.684206008911133, "global_step": 40569, "epoch": 488} {"train_loss": -19.46119499206543, "global_step": 40570, "epoch": 488} {"train_loss": -19.824953079223633, "global_step": 40571, "epoch": 488} {"train_loss": -19.635160446166992, "global_step": 40572, "epoch": 488} {"train_loss": -19.886455535888672, "global_step": 40573, "epoch": 488} {"train_loss": -19.22202491760254, "global_step": 40574, "epoch": 488} {"train_loss": -19.365697860717773, "global_step": 40575, "epoch": 488} {"train_loss": -19.42970085144043, "global_step": 40576, "epoch": 488} {"train_loss": -19.75654411315918, "global_step": 40577, "epoch": 488} {"train_loss": -19.948747634887695, "global_step": 40578, "epoch": 488} {"train_loss": -19.015134811401367, "global_step": 40579, "epoch": 488} {"train_loss": -19.60756492614746, "global_step": 40580, "epoch": 488} {"train_loss": -19.475051879882812, "global_step": 40581, "epoch": 488} {"train_loss": -19.70482635498047, "global_step": 40582, "epoch": 488} {"train_loss": -19.563135147094727, "global_step": 40583, "epoch": 488} {"train_loss": -19.469106674194336, "global_step": 40584, "epoch": 488} {"train_loss": -19.493061065673828, "global_step": 40585, "epoch": 488} {"train_loss": -19.462601397410932, "global_step": 40586, "epoch": 488, "val_loss": 5965358.0} {"train_loss": -19.22361183166504, "global_step": 40587, "epoch": 489} {"train_loss": -19.7402286529541, "global_step": 40588, "epoch": 489} {"train_loss": -18.754642486572266, "global_step": 40589, "epoch": 489} {"train_loss": -19.43876075744629, "global_step": 40590, "epoch": 489} {"train_loss": -19.199987411499023, "global_step": 40591, "epoch": 489} {"train_loss": -19.420358657836914, "global_step": 40592, "epoch": 489} {"train_loss": -19.592885971069336, "global_step": 40593, "epoch": 489} {"train_loss": -19.26318359375, "global_step": 40594, "epoch": 489} {"train_loss": -19.35564613342285, "global_step": 40595, "epoch": 489} {"train_loss": -19.2336368560791, "global_step": 40596, "epoch": 489} {"train_loss": -19.436246871948242, "global_step": 40597, "epoch": 489} {"train_loss": -19.603334426879883, "global_step": 40598, "epoch": 489} {"train_loss": -19.40364646911621, "global_step": 40599, "epoch": 489} {"train_loss": -19.155866622924805, "global_step": 40600, "epoch": 489} {"train_loss": -19.437490463256836, "global_step": 40601, "epoch": 489} {"train_loss": -19.683216094970703, "global_step": 40602, "epoch": 489} {"train_loss": -19.328699111938477, "global_step": 40603, "epoch": 489} {"train_loss": -19.7596435546875, "global_step": 40604, "epoch": 489} {"train_loss": -19.390439987182617, "global_step": 40605, "epoch": 489} {"train_loss": -19.430482864379883, "global_step": 40606, "epoch": 489} {"train_loss": -19.699886322021484, "global_step": 40607, "epoch": 489} {"train_loss": -19.567792892456055, "global_step": 40608, "epoch": 489} {"train_loss": -19.55522346496582, "global_step": 40609, "epoch": 489} {"train_loss": -19.438495635986328, "global_step": 40610, "epoch": 489} {"train_loss": -19.5036678314209, "global_step": 40611, "epoch": 489} {"train_loss": -19.31402587890625, "global_step": 40612, "epoch": 489} {"train_loss": -19.42043113708496, "global_step": 40613, "epoch": 489} {"train_loss": -19.639734268188477, "global_step": 40614, "epoch": 489} {"train_loss": -19.48792839050293, "global_step": 40615, "epoch": 489} {"train_loss": -19.531185150146484, "global_step": 40616, "epoch": 489} {"train_loss": -19.843738555908203, "global_step": 40617, "epoch": 489} {"train_loss": -19.29289436340332, "global_step": 40618, "epoch": 489} {"train_loss": -19.584264755249023, "global_step": 40619, "epoch": 489} {"train_loss": -18.717336654663086, "global_step": 40620, "epoch": 489} {"train_loss": -19.13932228088379, "global_step": 40621, "epoch": 489} {"train_loss": -19.406776428222656, "global_step": 40622, "epoch": 489} {"train_loss": -19.21106719970703, "global_step": 40623, "epoch": 489} {"train_loss": -19.556324005126953, "global_step": 40624, "epoch": 489} {"train_loss": -19.417139053344727, "global_step": 40625, "epoch": 489} {"train_loss": -19.676794052124023, "global_step": 40626, "epoch": 489} {"train_loss": -19.67841911315918, "global_step": 40627, "epoch": 489} {"train_loss": -19.569778442382812, "global_step": 40628, "epoch": 489} {"train_loss": -18.833986282348633, "global_step": 40629, "epoch": 489} {"train_loss": -19.425649642944336, "global_step": 40630, "epoch": 489} {"train_loss": -19.47115707397461, "global_step": 40631, "epoch": 489} {"train_loss": -20.045734405517578, "global_step": 40632, "epoch": 489} {"train_loss": -19.622859954833984, "global_step": 40633, "epoch": 489} {"train_loss": -19.187442779541016, "global_step": 40634, "epoch": 489} {"train_loss": -19.582595825195312, "global_step": 40635, "epoch": 489} {"train_loss": -19.50108528137207, "global_step": 40636, "epoch": 489} {"train_loss": -18.824003219604492, "global_step": 40637, "epoch": 489} {"train_loss": -19.47013282775879, "global_step": 40638, "epoch": 489} {"train_loss": -19.4444580078125, "global_step": 40639, "epoch": 489} {"train_loss": -19.806795120239258, "global_step": 40640, "epoch": 489} {"train_loss": -19.474084854125977, "global_step": 40641, "epoch": 489} {"train_loss": -19.79131507873535, "global_step": 40642, "epoch": 489} {"train_loss": -19.24648094177246, "global_step": 40643, "epoch": 489} {"train_loss": -18.888141632080078, "global_step": 40644, "epoch": 489} {"train_loss": -19.286405563354492, "global_step": 40645, "epoch": 489} {"train_loss": -19.509170532226562, "global_step": 40646, "epoch": 489} {"train_loss": -19.1616153717041, "global_step": 40647, "epoch": 489} {"train_loss": -19.661584854125977, "global_step": 40648, "epoch": 489} {"train_loss": -19.646020889282227, "global_step": 40649, "epoch": 489} {"train_loss": -19.472749710083008, "global_step": 40650, "epoch": 489} {"train_loss": -19.597387313842773, "global_step": 40651, "epoch": 489} {"train_loss": -19.250471115112305, "global_step": 40652, "epoch": 489} {"train_loss": -19.229280471801758, "global_step": 40653, "epoch": 489} {"train_loss": -19.610620498657227, "global_step": 40654, "epoch": 489} {"train_loss": -19.23419189453125, "global_step": 40655, "epoch": 489} {"train_loss": -19.741718292236328, "global_step": 40656, "epoch": 489} {"train_loss": -19.188064575195312, "global_step": 40657, "epoch": 489} {"train_loss": -19.540210723876953, "global_step": 40658, "epoch": 489} {"train_loss": -19.32654571533203, "global_step": 40659, "epoch": 489} {"train_loss": -19.34980583190918, "global_step": 40660, "epoch": 489} {"train_loss": -19.619596481323242, "global_step": 40661, "epoch": 489} {"train_loss": -19.48438835144043, "global_step": 40662, "epoch": 489} {"train_loss": -19.60602569580078, "global_step": 40663, "epoch": 489} {"train_loss": -19.30404281616211, "global_step": 40664, "epoch": 489} {"train_loss": -19.491811752319336, "global_step": 40665, "epoch": 489} {"train_loss": -19.43545150756836, "global_step": 40666, "epoch": 489} {"train_loss": -19.269102096557617, "global_step": 40667, "epoch": 489} {"train_loss": -19.739290237426758, "global_step": 40668, "epoch": 489} {"train_loss": -19.43519516450813, "global_step": 40669, "epoch": 489, "val_loss": 5955699.0} {"train_loss": -19.411558151245117, "global_step": 40670, "epoch": 490} {"train_loss": -19.347063064575195, "global_step": 40671, "epoch": 490} {"train_loss": -19.35398292541504, "global_step": 40672, "epoch": 490} {"train_loss": -19.207792282104492, "global_step": 40673, "epoch": 490} {"train_loss": -19.40974998474121, "global_step": 40674, "epoch": 490} {"train_loss": -19.414270401000977, "global_step": 40675, "epoch": 490} {"train_loss": -18.98415184020996, "global_step": 40676, "epoch": 490} {"train_loss": -19.3006534576416, "global_step": 40677, "epoch": 490} {"train_loss": -19.461740493774414, "global_step": 40678, "epoch": 490} {"train_loss": -19.398351669311523, "global_step": 40679, "epoch": 490} {"train_loss": -19.477502822875977, "global_step": 40680, "epoch": 490} {"train_loss": -19.275461196899414, "global_step": 40681, "epoch": 490} {"train_loss": -19.66448402404785, "global_step": 40682, "epoch": 490} {"train_loss": -19.27366828918457, "global_step": 40683, "epoch": 490} {"train_loss": -20.057180404663086, "global_step": 40684, "epoch": 490} {"train_loss": -19.529014587402344, "global_step": 40685, "epoch": 490} {"train_loss": -19.708789825439453, "global_step": 40686, "epoch": 490} {"train_loss": -19.8341007232666, "global_step": 40687, "epoch": 490} {"train_loss": -19.4107723236084, "global_step": 40688, "epoch": 490} {"train_loss": -19.184616088867188, "global_step": 40689, "epoch": 490} {"train_loss": -19.253711700439453, "global_step": 40690, "epoch": 490} {"train_loss": -19.19692039489746, "global_step": 40691, "epoch": 490} {"train_loss": -19.965835571289062, "global_step": 40692, "epoch": 490} {"train_loss": -19.43577003479004, "global_step": 40693, "epoch": 490} {"train_loss": -19.590116500854492, "global_step": 40694, "epoch": 490} {"train_loss": -19.21686363220215, "global_step": 40695, "epoch": 490} {"train_loss": -19.71425437927246, "global_step": 40696, "epoch": 490} {"train_loss": -19.122028350830078, "global_step": 40697, "epoch": 490} {"train_loss": -19.11835289001465, "global_step": 40698, "epoch": 490} {"train_loss": -19.06087875366211, "global_step": 40699, "epoch": 490} {"train_loss": -19.67865562438965, "global_step": 40700, "epoch": 490} {"train_loss": -19.360824584960938, "global_step": 40701, "epoch": 490} {"train_loss": -19.753787994384766, "global_step": 40702, "epoch": 490} {"train_loss": -19.335601806640625, "global_step": 40703, "epoch": 490} {"train_loss": -19.452974319458008, "global_step": 40704, "epoch": 490} {"train_loss": -19.529504776000977, "global_step": 40705, "epoch": 490} {"train_loss": -19.365928649902344, "global_step": 40706, "epoch": 490} {"train_loss": -19.689504623413086, "global_step": 40707, "epoch": 490} {"train_loss": -19.342439651489258, "global_step": 40708, "epoch": 490} {"train_loss": -19.348369598388672, "global_step": 40709, "epoch": 490} {"train_loss": -19.483976364135742, "global_step": 40710, "epoch": 490} {"train_loss": -19.739561080932617, "global_step": 40711, "epoch": 490} {"train_loss": -19.54826545715332, "global_step": 40712, "epoch": 490} {"train_loss": -19.51322364807129, "global_step": 40713, "epoch": 490} {"train_loss": -19.516401290893555, "global_step": 40714, "epoch": 490} {"train_loss": -19.679927825927734, "global_step": 40715, "epoch": 490} {"train_loss": -19.483800888061523, "global_step": 40716, "epoch": 490} {"train_loss": -19.435461044311523, "global_step": 40717, "epoch": 490} {"train_loss": -19.404783248901367, "global_step": 40718, "epoch": 490} {"train_loss": -19.84279441833496, "global_step": 40719, "epoch": 490} {"train_loss": -19.553922653198242, "global_step": 40720, "epoch": 490} {"train_loss": -19.725305557250977, "global_step": 40721, "epoch": 490} {"train_loss": -19.610563278198242, "global_step": 40722, "epoch": 490} {"train_loss": -19.583393096923828, "global_step": 40723, "epoch": 490} {"train_loss": -19.715919494628906, "global_step": 40724, "epoch": 490} {"train_loss": -19.771638870239258, "global_step": 40725, "epoch": 490} {"train_loss": -19.4339542388916, "global_step": 40726, "epoch": 490} {"train_loss": -19.966833114624023, "global_step": 40727, "epoch": 490} {"train_loss": -19.526782989501953, "global_step": 40728, "epoch": 490} {"train_loss": -19.82237434387207, "global_step": 40729, "epoch": 490} {"train_loss": -19.658628463745117, "global_step": 40730, "epoch": 490} {"train_loss": -19.5064754486084, "global_step": 40731, "epoch": 490} {"train_loss": -19.456066131591797, "global_step": 40732, "epoch": 490} {"train_loss": -19.580570220947266, "global_step": 40733, "epoch": 490} {"train_loss": -19.14940071105957, "global_step": 40734, "epoch": 490} {"train_loss": -19.447662353515625, "global_step": 40735, "epoch": 490} {"train_loss": -19.401212692260742, "global_step": 40736, "epoch": 490} {"train_loss": -19.6628360748291, "global_step": 40737, "epoch": 490} {"train_loss": -19.78118896484375, "global_step": 40738, "epoch": 490} {"train_loss": -19.2509708404541, "global_step": 40739, "epoch": 490} {"train_loss": -19.641407012939453, "global_step": 40740, "epoch": 490} {"train_loss": -19.42379379272461, "global_step": 40741, "epoch": 490} {"train_loss": -19.552045822143555, "global_step": 40742, "epoch": 490} {"train_loss": -19.95193099975586, "global_step": 40743, "epoch": 490} {"train_loss": -19.307554244995117, "global_step": 40744, "epoch": 490} {"train_loss": -19.63278579711914, "global_step": 40745, "epoch": 490} {"train_loss": -19.456323623657227, "global_step": 40746, "epoch": 490} {"train_loss": -19.6640625, "global_step": 40747, "epoch": 490} {"train_loss": -19.57862091064453, "global_step": 40748, "epoch": 490} {"train_loss": -19.406753540039062, "global_step": 40749, "epoch": 490} {"train_loss": -19.36754035949707, "global_step": 40750, "epoch": 490} {"train_loss": -19.38453483581543, "global_step": 40751, "epoch": 490} {"train_loss": -19.510265855904084, "global_step": 40752, "epoch": 490, "val_loss": 5846132.0} {"train_loss": -19.20735740661621, "global_step": 40753, "epoch": 491} {"train_loss": -19.340078353881836, "global_step": 40754, "epoch": 491} {"train_loss": -19.224706649780273, "global_step": 40755, "epoch": 491} {"train_loss": -19.53078269958496, "global_step": 40756, "epoch": 491} {"train_loss": -19.572050094604492, "global_step": 40757, "epoch": 491} {"train_loss": -19.17058753967285, "global_step": 40758, "epoch": 491} {"train_loss": -19.35662078857422, "global_step": 40759, "epoch": 491} {"train_loss": -19.290082931518555, "global_step": 40760, "epoch": 491} {"train_loss": -19.334060668945312, "global_step": 40761, "epoch": 491} {"train_loss": -19.525800704956055, "global_step": 40762, "epoch": 491} {"train_loss": -19.545541763305664, "global_step": 40763, "epoch": 491} {"train_loss": -19.72206687927246, "global_step": 40764, "epoch": 491} {"train_loss": -19.293376922607422, "global_step": 40765, "epoch": 491} {"train_loss": -19.2086238861084, "global_step": 40766, "epoch": 491} {"train_loss": -19.188512802124023, "global_step": 40767, "epoch": 491} {"train_loss": -19.779165267944336, "global_step": 40768, "epoch": 491} {"train_loss": -19.449148178100586, "global_step": 40769, "epoch": 491} {"train_loss": -19.873929977416992, "global_step": 40770, "epoch": 491} {"train_loss": -19.560468673706055, "global_step": 40771, "epoch": 491} {"train_loss": -19.659711837768555, "global_step": 40772, "epoch": 491} {"train_loss": -19.231937408447266, "global_step": 40773, "epoch": 491} {"train_loss": -19.14159393310547, "global_step": 40774, "epoch": 491} {"train_loss": -19.32476043701172, "global_step": 40775, "epoch": 491} {"train_loss": -19.389686584472656, "global_step": 40776, "epoch": 491} {"train_loss": -19.829904556274414, "global_step": 40777, "epoch": 491} {"train_loss": -19.306167602539062, "global_step": 40778, "epoch": 491} {"train_loss": -19.417558670043945, "global_step": 40779, "epoch": 491} {"train_loss": -19.472570419311523, "global_step": 40780, "epoch": 491} {"train_loss": -19.65061378479004, "global_step": 40781, "epoch": 491} {"train_loss": -19.383939743041992, "global_step": 40782, "epoch": 491} {"train_loss": -19.22355842590332, "global_step": 40783, "epoch": 491} {"train_loss": -19.477746963500977, "global_step": 40784, "epoch": 491} {"train_loss": -19.45352554321289, "global_step": 40785, "epoch": 491} {"train_loss": -19.0419921875, "global_step": 40786, "epoch": 491} {"train_loss": -19.391630172729492, "global_step": 40787, "epoch": 491} {"train_loss": -19.713781356811523, "global_step": 40788, "epoch": 491} {"train_loss": -19.336931228637695, "global_step": 40789, "epoch": 491} {"train_loss": -19.596508026123047, "global_step": 40790, "epoch": 491} {"train_loss": -19.3957576751709, "global_step": 40791, "epoch": 491} {"train_loss": -19.218170166015625, "global_step": 40792, "epoch": 491} {"train_loss": -19.602792739868164, "global_step": 40793, "epoch": 491} {"train_loss": -18.992162704467773, "global_step": 40794, "epoch": 491} {"train_loss": -19.560760498046875, "global_step": 40795, "epoch": 491} {"train_loss": -19.821760177612305, "global_step": 40796, "epoch": 491} {"train_loss": -19.36474609375, "global_step": 40797, "epoch": 491} {"train_loss": -19.225507736206055, "global_step": 40798, "epoch": 491} {"train_loss": -19.628591537475586, "global_step": 40799, "epoch": 491} {"train_loss": -19.87032127380371, "global_step": 40800, "epoch": 491} {"train_loss": -19.866647720336914, "global_step": 40801, "epoch": 491} {"train_loss": -19.11897850036621, "global_step": 40802, "epoch": 491} {"train_loss": -19.48426628112793, "global_step": 40803, "epoch": 491} {"train_loss": -19.3033447265625, "global_step": 40804, "epoch": 491} {"train_loss": -19.311908721923828, "global_step": 40805, "epoch": 491} {"train_loss": -19.67403221130371, "global_step": 40806, "epoch": 491} {"train_loss": -19.607763290405273, "global_step": 40807, "epoch": 491} {"train_loss": -19.712909698486328, "global_step": 40808, "epoch": 491} {"train_loss": -19.47650718688965, "global_step": 40809, "epoch": 491} {"train_loss": -19.093183517456055, "global_step": 40810, "epoch": 491} {"train_loss": -19.256933212280273, "global_step": 40811, "epoch": 491} {"train_loss": -19.12987518310547, "global_step": 40812, "epoch": 491} {"train_loss": -19.5118465423584, "global_step": 40813, "epoch": 491} {"train_loss": -19.402923583984375, "global_step": 40814, "epoch": 491} {"train_loss": -19.492267608642578, "global_step": 40815, "epoch": 491} {"train_loss": -19.45208168029785, "global_step": 40816, "epoch": 491} {"train_loss": -19.39613914489746, "global_step": 40817, "epoch": 491} {"train_loss": -19.590484619140625, "global_step": 40818, "epoch": 491} {"train_loss": -18.98091697692871, "global_step": 40819, "epoch": 491} {"train_loss": -19.262937545776367, "global_step": 40820, "epoch": 491} {"train_loss": -18.764833450317383, "global_step": 40821, "epoch": 491} {"train_loss": -19.455791473388672, "global_step": 40822, "epoch": 491} {"train_loss": -18.78810691833496, "global_step": 40823, "epoch": 491} {"train_loss": -19.512861251831055, "global_step": 40824, "epoch": 491} {"train_loss": -19.715599060058594, "global_step": 40825, "epoch": 491} {"train_loss": -19.321348190307617, "global_step": 40826, "epoch": 491} {"train_loss": -19.613494873046875, "global_step": 40827, "epoch": 491} {"train_loss": -19.101226806640625, "global_step": 40828, "epoch": 491} {"train_loss": -19.74785041809082, "global_step": 40829, "epoch": 491} {"train_loss": -19.51087188720703, "global_step": 40830, "epoch": 491} {"train_loss": -19.705068588256836, "global_step": 40831, "epoch": 491} {"train_loss": -19.307527542114258, "global_step": 40832, "epoch": 491} {"train_loss": -19.638296127319336, "global_step": 40833, "epoch": 491} {"train_loss": -19.395751953125, "global_step": 40834, "epoch": 491} {"train_loss": -19.424770217343987, "global_step": 40835, "epoch": 491, "val_loss": 6007020.5} {"train_loss": -19.497323989868164, "global_step": 40836, "epoch": 492} {"train_loss": -18.95901870727539, "global_step": 40837, "epoch": 492} {"train_loss": -19.694028854370117, "global_step": 40838, "epoch": 492} {"train_loss": -19.0886287689209, "global_step": 40839, "epoch": 492} {"train_loss": -19.32234764099121, "global_step": 40840, "epoch": 492} {"train_loss": -19.21480369567871, "global_step": 40841, "epoch": 492} {"train_loss": -19.187448501586914, "global_step": 40842, "epoch": 492} {"train_loss": -19.1489200592041, "global_step": 40843, "epoch": 492} {"train_loss": -19.70975685119629, "global_step": 40844, "epoch": 492} {"train_loss": -19.67386245727539, "global_step": 40845, "epoch": 492} {"train_loss": -19.67551612854004, "global_step": 40846, "epoch": 492} {"train_loss": -19.3665771484375, "global_step": 40847, "epoch": 492} {"train_loss": -19.47840118408203, "global_step": 40848, "epoch": 492} {"train_loss": -19.359100341796875, "global_step": 40849, "epoch": 492} {"train_loss": -19.562671661376953, "global_step": 40850, "epoch": 492} {"train_loss": -19.656476974487305, "global_step": 40851, "epoch": 492} {"train_loss": -19.738910675048828, "global_step": 40852, "epoch": 492} {"train_loss": -19.679346084594727, "global_step": 40853, "epoch": 492} {"train_loss": -19.472900390625, "global_step": 40854, "epoch": 492} {"train_loss": -19.331754684448242, "global_step": 40855, "epoch": 492} {"train_loss": -19.821273803710938, "global_step": 40856, "epoch": 492} {"train_loss": -19.36260986328125, "global_step": 40857, "epoch": 492} {"train_loss": -19.263593673706055, "global_step": 40858, "epoch": 492} {"train_loss": -19.44081687927246, "global_step": 40859, "epoch": 492} {"train_loss": -19.34214973449707, "global_step": 40860, "epoch": 492} {"train_loss": -19.55221176147461, "global_step": 40861, "epoch": 492} {"train_loss": -19.33057975769043, "global_step": 40862, "epoch": 492} {"train_loss": -19.485885620117188, "global_step": 40863, "epoch": 492} {"train_loss": -19.481138229370117, "global_step": 40864, "epoch": 492} {"train_loss": -19.676496505737305, "global_step": 40865, "epoch": 492} {"train_loss": -19.133777618408203, "global_step": 40866, "epoch": 492} {"train_loss": -19.396137237548828, "global_step": 40867, "epoch": 492} {"train_loss": -19.48224449157715, "global_step": 40868, "epoch": 492} {"train_loss": -19.368314743041992, "global_step": 40869, "epoch": 492} {"train_loss": -19.440601348876953, "global_step": 40870, "epoch": 492} {"train_loss": -19.236804962158203, "global_step": 40871, "epoch": 492} {"train_loss": -19.178186416625977, "global_step": 40872, "epoch": 492} {"train_loss": -19.535137176513672, "global_step": 40873, "epoch": 492} {"train_loss": -19.541959762573242, "global_step": 40874, "epoch": 492} {"train_loss": -19.267282485961914, "global_step": 40875, "epoch": 492} {"train_loss": -19.296337127685547, "global_step": 40876, "epoch": 492} {"train_loss": -19.41061782836914, "global_step": 40877, "epoch": 492} {"train_loss": -19.335290908813477, "global_step": 40878, "epoch": 492} {"train_loss": -19.3008975982666, "global_step": 40879, "epoch": 492} {"train_loss": -19.488496780395508, "global_step": 40880, "epoch": 492} {"train_loss": -19.375869750976562, "global_step": 40881, "epoch": 492} {"train_loss": -19.520645141601562, "global_step": 40882, "epoch": 492} {"train_loss": -19.352602005004883, "global_step": 40883, "epoch": 492} {"train_loss": -19.43463134765625, "global_step": 40884, "epoch": 492} {"train_loss": -19.60312271118164, "global_step": 40885, "epoch": 492} {"train_loss": -19.490039825439453, "global_step": 40886, "epoch": 492} {"train_loss": -19.640090942382812, "global_step": 40887, "epoch": 492} {"train_loss": -19.893259048461914, "global_step": 40888, "epoch": 492} {"train_loss": -19.448482513427734, "global_step": 40889, "epoch": 492} {"train_loss": -19.2005672454834, "global_step": 40890, "epoch": 492} {"train_loss": -19.538843154907227, "global_step": 40891, "epoch": 492} {"train_loss": -19.469167709350586, "global_step": 40892, "epoch": 492} {"train_loss": -19.48594856262207, "global_step": 40893, "epoch": 492} {"train_loss": -19.70737075805664, "global_step": 40894, "epoch": 492} {"train_loss": -19.77980613708496, "global_step": 40895, "epoch": 492} {"train_loss": -19.522329330444336, "global_step": 40896, "epoch": 492} {"train_loss": -19.6434383392334, "global_step": 40897, "epoch": 492} {"train_loss": -19.543554306030273, "global_step": 40898, "epoch": 492} {"train_loss": -19.558109283447266, "global_step": 40899, "epoch": 492} {"train_loss": -19.774688720703125, "global_step": 40900, "epoch": 492} {"train_loss": -19.48111915588379, "global_step": 40901, "epoch": 492} {"train_loss": -19.537935256958008, "global_step": 40902, "epoch": 492} {"train_loss": -19.79167366027832, "global_step": 40903, "epoch": 492} {"train_loss": -19.548171997070312, "global_step": 40904, "epoch": 492} {"train_loss": -19.35546875, "global_step": 40905, "epoch": 492} {"train_loss": -19.673534393310547, "global_step": 40906, "epoch": 492} {"train_loss": -19.598230361938477, "global_step": 40907, "epoch": 492} {"train_loss": -19.83188819885254, "global_step": 40908, "epoch": 492} {"train_loss": -19.547460556030273, "global_step": 40909, "epoch": 492} {"train_loss": -19.186203002929688, "global_step": 40910, "epoch": 492} {"train_loss": -19.390731811523438, "global_step": 40911, "epoch": 492} {"train_loss": -19.598363876342773, "global_step": 40912, "epoch": 492} {"train_loss": -19.529376983642578, "global_step": 40913, "epoch": 492} {"train_loss": -19.74203872680664, "global_step": 40914, "epoch": 492} {"train_loss": -19.346879959106445, "global_step": 40915, "epoch": 492} {"train_loss": -19.987112045288086, "global_step": 40916, "epoch": 492} {"train_loss": -19.44805335998535, "global_step": 40917, "epoch": 492} {"train_loss": -19.4667257975383, "global_step": 40918, "epoch": 492, "val_loss": 5949881.0} {"train_loss": -18.888460159301758, "global_step": 40919, "epoch": 493} {"train_loss": -19.544057846069336, "global_step": 40920, "epoch": 493} {"train_loss": -19.439712524414062, "global_step": 40921, "epoch": 493} {"train_loss": -19.690767288208008, "global_step": 40922, "epoch": 493} {"train_loss": -19.72878074645996, "global_step": 40923, "epoch": 493} {"train_loss": -19.036340713500977, "global_step": 40924, "epoch": 493} {"train_loss": -19.24721336364746, "global_step": 40925, "epoch": 493} {"train_loss": -19.780689239501953, "global_step": 40926, "epoch": 493} {"train_loss": -19.483469009399414, "global_step": 40927, "epoch": 493} {"train_loss": -19.33152198791504, "global_step": 40928, "epoch": 493} {"train_loss": -19.452421188354492, "global_step": 40929, "epoch": 493} {"train_loss": -19.344457626342773, "global_step": 40930, "epoch": 493} {"train_loss": -19.486387252807617, "global_step": 40931, "epoch": 493} {"train_loss": -19.660043716430664, "global_step": 40932, "epoch": 493} {"train_loss": -19.50357437133789, "global_step": 40933, "epoch": 493} {"train_loss": -19.709583282470703, "global_step": 40934, "epoch": 493} {"train_loss": -19.500537872314453, "global_step": 40935, "epoch": 493} {"train_loss": -19.116558074951172, "global_step": 40936, "epoch": 493} {"train_loss": -19.497793197631836, "global_step": 40937, "epoch": 493} {"train_loss": -19.387210845947266, "global_step": 40938, "epoch": 493} {"train_loss": -19.114377975463867, "global_step": 40939, "epoch": 493} {"train_loss": -19.578857421875, "global_step": 40940, "epoch": 493} {"train_loss": -19.262136459350586, "global_step": 40941, "epoch": 493} {"train_loss": -19.470443725585938, "global_step": 40942, "epoch": 493} {"train_loss": -19.72784423828125, "global_step": 40943, "epoch": 493} {"train_loss": -19.159191131591797, "global_step": 40944, "epoch": 493} {"train_loss": -19.54462242126465, "global_step": 40945, "epoch": 493} {"train_loss": -19.77634048461914, "global_step": 40946, "epoch": 493} {"train_loss": -19.26726722717285, "global_step": 40947, "epoch": 493} {"train_loss": -19.545724868774414, "global_step": 40948, "epoch": 493} {"train_loss": -19.500411987304688, "global_step": 40949, "epoch": 493} {"train_loss": -19.5672664642334, "global_step": 40950, "epoch": 493} {"train_loss": -19.530593872070312, "global_step": 40951, "epoch": 493} {"train_loss": -19.446216583251953, "global_step": 40952, "epoch": 493} {"train_loss": -19.529687881469727, "global_step": 40953, "epoch": 493} {"train_loss": -19.450660705566406, "global_step": 40954, "epoch": 493} {"train_loss": -19.762670516967773, "global_step": 40955, "epoch": 493} {"train_loss": -19.306814193725586, "global_step": 40956, "epoch": 493} {"train_loss": -19.634462356567383, "global_step": 40957, "epoch": 493} {"train_loss": -19.621347427368164, "global_step": 40958, "epoch": 493} {"train_loss": -19.476015090942383, "global_step": 40959, "epoch": 493} {"train_loss": -19.395116806030273, "global_step": 40960, "epoch": 493} {"train_loss": -19.49456214904785, "global_step": 40961, "epoch": 493} {"train_loss": -19.402664184570312, "global_step": 40962, "epoch": 493} {"train_loss": -19.534605026245117, "global_step": 40963, "epoch": 493} {"train_loss": -19.45560646057129, "global_step": 40964, "epoch": 493} {"train_loss": -18.980314254760742, "global_step": 40965, "epoch": 493} {"train_loss": -19.752038955688477, "global_step": 40966, "epoch": 493} {"train_loss": -19.42793083190918, "global_step": 40967, "epoch": 493} {"train_loss": -19.152860641479492, "global_step": 40968, "epoch": 493} {"train_loss": -19.66400146484375, "global_step": 40969, "epoch": 493} {"train_loss": -19.49294090270996, "global_step": 40970, "epoch": 493} {"train_loss": -19.303434371948242, "global_step": 40971, "epoch": 493} {"train_loss": -19.4592227935791, "global_step": 40972, "epoch": 493} {"train_loss": -19.606008529663086, "global_step": 40973, "epoch": 493} {"train_loss": -19.906431198120117, "global_step": 40974, "epoch": 493} {"train_loss": -19.481576919555664, "global_step": 40975, "epoch": 493} {"train_loss": -19.101890563964844, "global_step": 40976, "epoch": 493} {"train_loss": -19.621103286743164, "global_step": 40977, "epoch": 493} {"train_loss": -19.52426528930664, "global_step": 40978, "epoch": 493} {"train_loss": -19.487110137939453, "global_step": 40979, "epoch": 493} {"train_loss": -19.691648483276367, "global_step": 40980, "epoch": 493} {"train_loss": -19.436050415039062, "global_step": 40981, "epoch": 493} {"train_loss": -19.6861629486084, "global_step": 40982, "epoch": 493} {"train_loss": -19.353551864624023, "global_step": 40983, "epoch": 493} {"train_loss": -19.238935470581055, "global_step": 40984, "epoch": 493} {"train_loss": -19.245145797729492, "global_step": 40985, "epoch": 493} {"train_loss": -19.079883575439453, "global_step": 40986, "epoch": 493} {"train_loss": -19.59023094177246, "global_step": 40987, "epoch": 493} {"train_loss": -19.86054801940918, "global_step": 40988, "epoch": 493} {"train_loss": -19.558650970458984, "global_step": 40989, "epoch": 493} {"train_loss": -19.693113327026367, "global_step": 40990, "epoch": 493} {"train_loss": -19.243017196655273, "global_step": 40991, "epoch": 493} {"train_loss": -19.65299415588379, "global_step": 40992, "epoch": 493} {"train_loss": -19.14073371887207, "global_step": 40993, "epoch": 493} {"train_loss": -19.825523376464844, "global_step": 40994, "epoch": 493} {"train_loss": -19.339445114135742, "global_step": 40995, "epoch": 493} {"train_loss": -19.281461715698242, "global_step": 40996, "epoch": 493} {"train_loss": -19.407297134399414, "global_step": 40997, "epoch": 493} {"train_loss": -19.21318244934082, "global_step": 40998, "epoch": 493} {"train_loss": -19.65789222717285, "global_step": 40999, "epoch": 493} {"train_loss": -19.445768356323242, "global_step": 41000, "epoch": 493} {"train_loss": -19.4712596111987, "global_step": 41001, "epoch": 493, "val_loss": 5974564.5} {"train_loss": -19.024351119995117, "global_step": 41002, "epoch": 494} {"train_loss": -19.187002182006836, "global_step": 41003, "epoch": 494} {"train_loss": -18.925888061523438, "global_step": 41004, "epoch": 494} {"train_loss": -18.96613121032715, "global_step": 41005, "epoch": 494} {"train_loss": -19.354721069335938, "global_step": 41006, "epoch": 494} {"train_loss": -19.122209548950195, "global_step": 41007, "epoch": 494} {"train_loss": -19.010597229003906, "global_step": 41008, "epoch": 494} {"train_loss": -19.412405014038086, "global_step": 41009, "epoch": 494} {"train_loss": -18.96405601501465, "global_step": 41010, "epoch": 494} {"train_loss": -19.140552520751953, "global_step": 41011, "epoch": 494} {"train_loss": -19.540124893188477, "global_step": 41012, "epoch": 494} {"train_loss": -19.535385131835938, "global_step": 41013, "epoch": 494} {"train_loss": -19.444087982177734, "global_step": 41014, "epoch": 494} {"train_loss": -19.398820877075195, "global_step": 41015, "epoch": 494} {"train_loss": -19.530609130859375, "global_step": 41016, "epoch": 494} {"train_loss": -19.454259872436523, "global_step": 41017, "epoch": 494} {"train_loss": -19.46893882751465, "global_step": 41018, "epoch": 494} {"train_loss": -19.288681030273438, "global_step": 41019, "epoch": 494} {"train_loss": -19.357912063598633, "global_step": 41020, "epoch": 494} {"train_loss": -19.25152587890625, "global_step": 41021, "epoch": 494} {"train_loss": -19.494327545166016, "global_step": 41022, "epoch": 494} {"train_loss": -19.501012802124023, "global_step": 41023, "epoch": 494} {"train_loss": -19.691696166992188, "global_step": 41024, "epoch": 494} {"train_loss": -19.974966049194336, "global_step": 41025, "epoch": 494} {"train_loss": -19.034090042114258, "global_step": 41026, "epoch": 494} {"train_loss": -19.654483795166016, "global_step": 41027, "epoch": 494} {"train_loss": -19.782758712768555, "global_step": 41028, "epoch": 494} {"train_loss": -19.297941207885742, "global_step": 41029, "epoch": 494} {"train_loss": -19.59794044494629, "global_step": 41030, "epoch": 494} {"train_loss": -19.41115379333496, "global_step": 41031, "epoch": 494} {"train_loss": -19.675317764282227, "global_step": 41032, "epoch": 494} {"train_loss": -19.57282829284668, "global_step": 41033, "epoch": 494} {"train_loss": -19.750396728515625, "global_step": 41034, "epoch": 494} {"train_loss": -19.748916625976562, "global_step": 41035, "epoch": 494} {"train_loss": -19.483518600463867, "global_step": 41036, "epoch": 494} {"train_loss": -19.41594123840332, "global_step": 41037, "epoch": 494} {"train_loss": -19.42124366760254, "global_step": 41038, "epoch": 494} {"train_loss": -19.78267478942871, "global_step": 41039, "epoch": 494} {"train_loss": -19.25031089782715, "global_step": 41040, "epoch": 494} {"train_loss": -19.129165649414062, "global_step": 41041, "epoch": 494} {"train_loss": -19.370624542236328, "global_step": 41042, "epoch": 494} {"train_loss": -20.04265594482422, "global_step": 41043, "epoch": 494} {"train_loss": -19.464160919189453, "global_step": 41044, "epoch": 494} {"train_loss": -19.413206100463867, "global_step": 41045, "epoch": 494} {"train_loss": -19.348770141601562, "global_step": 41046, "epoch": 494} {"train_loss": -19.764896392822266, "global_step": 41047, "epoch": 494} {"train_loss": -19.497966766357422, "global_step": 41048, "epoch": 494} {"train_loss": -19.632749557495117, "global_step": 41049, "epoch": 494} {"train_loss": -19.593427658081055, "global_step": 41050, "epoch": 494} {"train_loss": -19.6944637298584, "global_step": 41051, "epoch": 494} {"train_loss": -19.62262535095215, "global_step": 41052, "epoch": 494} {"train_loss": -19.626131057739258, "global_step": 41053, "epoch": 494} {"train_loss": -19.376113891601562, "global_step": 41054, "epoch": 494} {"train_loss": -19.97516632080078, "global_step": 41055, "epoch": 494} {"train_loss": -19.513837814331055, "global_step": 41056, "epoch": 494} {"train_loss": -19.424352645874023, "global_step": 41057, "epoch": 494} {"train_loss": -19.84862518310547, "global_step": 41058, "epoch": 494} {"train_loss": -19.329669952392578, "global_step": 41059, "epoch": 494} {"train_loss": -19.63102912902832, "global_step": 41060, "epoch": 494} {"train_loss": -19.434755325317383, "global_step": 41061, "epoch": 494} {"train_loss": -19.60517692565918, "global_step": 41062, "epoch": 494} {"train_loss": -19.279993057250977, "global_step": 41063, "epoch": 494} {"train_loss": -19.580280303955078, "global_step": 41064, "epoch": 494} {"train_loss": -19.794086456298828, "global_step": 41065, "epoch": 494} {"train_loss": -19.44663429260254, "global_step": 41066, "epoch": 494} {"train_loss": -19.604421615600586, "global_step": 41067, "epoch": 494} {"train_loss": -19.42240333557129, "global_step": 41068, "epoch": 494} {"train_loss": -19.818740844726562, "global_step": 41069, "epoch": 494} {"train_loss": -19.303524017333984, "global_step": 41070, "epoch": 494} {"train_loss": -19.691110610961914, "global_step": 41071, "epoch": 494} {"train_loss": -19.854618072509766, "global_step": 41072, "epoch": 494} {"train_loss": -19.83420181274414, "global_step": 41073, "epoch": 494} {"train_loss": -19.648469924926758, "global_step": 41074, "epoch": 494} {"train_loss": -19.506494522094727, "global_step": 41075, "epoch": 494} {"train_loss": -19.5632381439209, "global_step": 41076, "epoch": 494} {"train_loss": -19.639759063720703, "global_step": 41077, "epoch": 494} {"train_loss": -19.244136810302734, "global_step": 41078, "epoch": 494} {"train_loss": -19.167911529541016, "global_step": 41079, "epoch": 494} {"train_loss": -19.492603302001953, "global_step": 41080, "epoch": 494} {"train_loss": -19.410573959350586, "global_step": 41081, "epoch": 494} {"train_loss": -19.101276397705078, "global_step": 41082, "epoch": 494} {"train_loss": -19.468168258666992, "global_step": 41083, "epoch": 494} {"train_loss": -19.488355268915015, "global_step": 41084, "epoch": 494, "val_loss": 6012316.0} {"train_loss": -19.066852569580078, "global_step": 41085, "epoch": 495} {"train_loss": -19.30922508239746, "global_step": 41086, "epoch": 495} {"train_loss": -19.287424087524414, "global_step": 41087, "epoch": 495} {"train_loss": -19.176774978637695, "global_step": 41088, "epoch": 495} {"train_loss": -19.568286895751953, "global_step": 41089, "epoch": 495} {"train_loss": -19.724855422973633, "global_step": 41090, "epoch": 495} {"train_loss": -19.594980239868164, "global_step": 41091, "epoch": 495} {"train_loss": -19.18637466430664, "global_step": 41092, "epoch": 495} {"train_loss": -19.359512329101562, "global_step": 41093, "epoch": 495} {"train_loss": -19.2861328125, "global_step": 41094, "epoch": 495} {"train_loss": -19.691312789916992, "global_step": 41095, "epoch": 495} {"train_loss": -19.527576446533203, "global_step": 41096, "epoch": 495} {"train_loss": -19.363195419311523, "global_step": 41097, "epoch": 495} {"train_loss": -19.736820220947266, "global_step": 41098, "epoch": 495} {"train_loss": -19.551685333251953, "global_step": 41099, "epoch": 495} {"train_loss": -19.305599212646484, "global_step": 41100, "epoch": 495} {"train_loss": -19.23015594482422, "global_step": 41101, "epoch": 495} {"train_loss": -19.72986602783203, "global_step": 41102, "epoch": 495} {"train_loss": -19.281829833984375, "global_step": 41103, "epoch": 495} {"train_loss": -19.803668975830078, "global_step": 41104, "epoch": 495} {"train_loss": -19.313291549682617, "global_step": 41105, "epoch": 495} {"train_loss": -19.577499389648438, "global_step": 41106, "epoch": 495} {"train_loss": -19.736434936523438, "global_step": 41107, "epoch": 495} {"train_loss": -19.530651092529297, "global_step": 41108, "epoch": 495} {"train_loss": -19.92391014099121, "global_step": 41109, "epoch": 495} {"train_loss": -19.497663497924805, "global_step": 41110, "epoch": 495} {"train_loss": -19.575363159179688, "global_step": 41111, "epoch": 495} {"train_loss": -19.258724212646484, "global_step": 41112, "epoch": 495} {"train_loss": -19.465192794799805, "global_step": 41113, "epoch": 495} {"train_loss": -19.345582962036133, "global_step": 41114, "epoch": 495} {"train_loss": -19.672876358032227, "global_step": 41115, "epoch": 495} {"train_loss": -19.41509437561035, "global_step": 41116, "epoch": 495} {"train_loss": -19.302030563354492, "global_step": 41117, "epoch": 495} {"train_loss": -19.455284118652344, "global_step": 41118, "epoch": 495} {"train_loss": -19.40351676940918, "global_step": 41119, "epoch": 495} {"train_loss": -19.594715118408203, "global_step": 41120, "epoch": 495} {"train_loss": -19.686365127563477, "global_step": 41121, "epoch": 495} {"train_loss": -19.22320556640625, "global_step": 41122, "epoch": 495} {"train_loss": -19.464338302612305, "global_step": 41123, "epoch": 495} {"train_loss": -19.29338264465332, "global_step": 41124, "epoch": 495} {"train_loss": -18.946157455444336, "global_step": 41125, "epoch": 495} {"train_loss": -19.630218505859375, "global_step": 41126, "epoch": 495} {"train_loss": -19.47430992126465, "global_step": 41127, "epoch": 495} {"train_loss": -19.458263397216797, "global_step": 41128, "epoch": 495} {"train_loss": -19.676633834838867, "global_step": 41129, "epoch": 495} {"train_loss": -19.376922607421875, "global_step": 41130, "epoch": 495} {"train_loss": -19.382837295532227, "global_step": 41131, "epoch": 495} {"train_loss": -19.2237548828125, "global_step": 41132, "epoch": 495} {"train_loss": -19.485639572143555, "global_step": 41133, "epoch": 495} {"train_loss": -19.575910568237305, "global_step": 41134, "epoch": 495} {"train_loss": -19.354459762573242, "global_step": 41135, "epoch": 495} {"train_loss": -19.603174209594727, "global_step": 41136, "epoch": 495} {"train_loss": -19.304224014282227, "global_step": 41137, "epoch": 495} {"train_loss": -19.671720504760742, "global_step": 41138, "epoch": 495} {"train_loss": -19.247451782226562, "global_step": 41139, "epoch": 495} {"train_loss": -19.647825241088867, "global_step": 41140, "epoch": 495} {"train_loss": -19.153528213500977, "global_step": 41141, "epoch": 495} {"train_loss": -19.403974533081055, "global_step": 41142, "epoch": 495} {"train_loss": -19.491125106811523, "global_step": 41143, "epoch": 495} {"train_loss": -19.602190017700195, "global_step": 41144, "epoch": 495} {"train_loss": -19.673770904541016, "global_step": 41145, "epoch": 495} {"train_loss": -19.748483657836914, "global_step": 41146, "epoch": 495} {"train_loss": -19.671199798583984, "global_step": 41147, "epoch": 495} {"train_loss": -19.500898361206055, "global_step": 41148, "epoch": 495} {"train_loss": -19.421133041381836, "global_step": 41149, "epoch": 495} {"train_loss": -19.609676361083984, "global_step": 41150, "epoch": 495} {"train_loss": -19.432573318481445, "global_step": 41151, "epoch": 495} {"train_loss": -19.366016387939453, "global_step": 41152, "epoch": 495} {"train_loss": -19.218555450439453, "global_step": 41153, "epoch": 495} {"train_loss": -19.41886329650879, "global_step": 41154, "epoch": 495} {"train_loss": -19.41446304321289, "global_step": 41155, "epoch": 495} {"train_loss": -19.342988967895508, "global_step": 41156, "epoch": 495} {"train_loss": -19.59895133972168, "global_step": 41157, "epoch": 495} {"train_loss": -19.724523544311523, "global_step": 41158, "epoch": 495} {"train_loss": -19.17177391052246, "global_step": 41159, "epoch": 495} {"train_loss": -19.49601173400879, "global_step": 41160, "epoch": 495} {"train_loss": -19.645151138305664, "global_step": 41161, "epoch": 495} {"train_loss": -19.337505340576172, "global_step": 41162, "epoch": 495} {"train_loss": -19.50653076171875, "global_step": 41163, "epoch": 495} {"train_loss": -19.57798194885254, "global_step": 41164, "epoch": 495} {"train_loss": -19.349302291870117, "global_step": 41165, "epoch": 495} {"train_loss": -19.206159591674805, "global_step": 41166, "epoch": 495} {"train_loss": -19.477097913443323, "global_step": 41167, "epoch": 495, "val_loss": 6029575.0} {"train_loss": -19.346738815307617, "global_step": 41168, "epoch": 496} {"train_loss": -19.467100143432617, "global_step": 41169, "epoch": 496} {"train_loss": -19.29355239868164, "global_step": 41170, "epoch": 496} {"train_loss": -19.630002975463867, "global_step": 41171, "epoch": 496} {"train_loss": -18.99318504333496, "global_step": 41172, "epoch": 496} {"train_loss": -19.412641525268555, "global_step": 41173, "epoch": 496} {"train_loss": -19.33173942565918, "global_step": 41174, "epoch": 496} {"train_loss": -19.519439697265625, "global_step": 41175, "epoch": 496} {"train_loss": -19.69175910949707, "global_step": 41176, "epoch": 496} {"train_loss": -19.313589096069336, "global_step": 41177, "epoch": 496} {"train_loss": -19.49547576904297, "global_step": 41178, "epoch": 496} {"train_loss": -19.177804946899414, "global_step": 41179, "epoch": 496} {"train_loss": -19.365629196166992, "global_step": 41180, "epoch": 496} {"train_loss": -19.32752799987793, "global_step": 41181, "epoch": 496} {"train_loss": -18.987119674682617, "global_step": 41182, "epoch": 496} {"train_loss": -19.284223556518555, "global_step": 41183, "epoch": 496} {"train_loss": -19.127012252807617, "global_step": 41184, "epoch": 496} {"train_loss": -19.627195358276367, "global_step": 41185, "epoch": 496} {"train_loss": -19.41248893737793, "global_step": 41186, "epoch": 496} {"train_loss": -19.504491806030273, "global_step": 41187, "epoch": 496} {"train_loss": -19.44691276550293, "global_step": 41188, "epoch": 496} {"train_loss": -19.467689514160156, "global_step": 41189, "epoch": 496} {"train_loss": -19.304121017456055, "global_step": 41190, "epoch": 496} {"train_loss": -19.595474243164062, "global_step": 41191, "epoch": 496} {"train_loss": -19.553409576416016, "global_step": 41192, "epoch": 496} {"train_loss": -19.420089721679688, "global_step": 41193, "epoch": 496} {"train_loss": -19.469257354736328, "global_step": 41194, "epoch": 496} {"train_loss": -20.085166931152344, "global_step": 41195, "epoch": 496} {"train_loss": -19.49993896484375, "global_step": 41196, "epoch": 496} {"train_loss": -19.453264236450195, "global_step": 41197, "epoch": 496} {"train_loss": -19.759794235229492, "global_step": 41198, "epoch": 496} {"train_loss": -19.352100372314453, "global_step": 41199, "epoch": 496} {"train_loss": -19.253250122070312, "global_step": 41200, "epoch": 496} {"train_loss": -19.06459617614746, "global_step": 41201, "epoch": 496} {"train_loss": -19.79473304748535, "global_step": 41202, "epoch": 496} {"train_loss": -19.682592391967773, "global_step": 41203, "epoch": 496} {"train_loss": -19.142948150634766, "global_step": 41204, "epoch": 496} {"train_loss": -19.73018455505371, "global_step": 41205, "epoch": 496} {"train_loss": -19.329750061035156, "global_step": 41206, "epoch": 496} {"train_loss": -19.263879776000977, "global_step": 41207, "epoch": 496} {"train_loss": -19.943464279174805, "global_step": 41208, "epoch": 496} {"train_loss": -19.506498336791992, "global_step": 41209, "epoch": 496} {"train_loss": -19.4713191986084, "global_step": 41210, "epoch": 496} {"train_loss": -19.59708595275879, "global_step": 41211, "epoch": 496} {"train_loss": -19.64211654663086, "global_step": 41212, "epoch": 496} {"train_loss": -19.23809814453125, "global_step": 41213, "epoch": 496} {"train_loss": -19.675308227539062, "global_step": 41214, "epoch": 496} {"train_loss": -19.591379165649414, "global_step": 41215, "epoch": 496} {"train_loss": -19.253347396850586, "global_step": 41216, "epoch": 496} {"train_loss": -19.16177749633789, "global_step": 41217, "epoch": 496} {"train_loss": -19.513505935668945, "global_step": 41218, "epoch": 496} {"train_loss": -19.221275329589844, "global_step": 41219, "epoch": 496} {"train_loss": -19.89493751525879, "global_step": 41220, "epoch": 496} {"train_loss": -19.25364112854004, "global_step": 41221, "epoch": 496} {"train_loss": -19.356552124023438, "global_step": 41222, "epoch": 496} {"train_loss": -19.32282829284668, "global_step": 41223, "epoch": 496} {"train_loss": -19.5488224029541, "global_step": 41224, "epoch": 496} {"train_loss": -19.436870574951172, "global_step": 41225, "epoch": 496} {"train_loss": -19.713708877563477, "global_step": 41226, "epoch": 496} {"train_loss": -19.557477951049805, "global_step": 41227, "epoch": 496} {"train_loss": -19.32563591003418, "global_step": 41228, "epoch": 496} {"train_loss": -19.225000381469727, "global_step": 41229, "epoch": 496} {"train_loss": -19.31296157836914, "global_step": 41230, "epoch": 496} {"train_loss": -19.61287498474121, "global_step": 41231, "epoch": 496} {"train_loss": -19.151748657226562, "global_step": 41232, "epoch": 496} {"train_loss": -19.497947692871094, "global_step": 41233, "epoch": 496} {"train_loss": -19.45713233947754, "global_step": 41234, "epoch": 496} {"train_loss": -19.750654220581055, "global_step": 41235, "epoch": 496} {"train_loss": -19.321212768554688, "global_step": 41236, "epoch": 496} {"train_loss": -19.192058563232422, "global_step": 41237, "epoch": 496} {"train_loss": -19.313404083251953, "global_step": 41238, "epoch": 496} {"train_loss": -19.715572357177734, "global_step": 41239, "epoch": 496} {"train_loss": -19.399051666259766, "global_step": 41240, "epoch": 496} {"train_loss": -19.627561569213867, "global_step": 41241, "epoch": 496} {"train_loss": -19.551862716674805, "global_step": 41242, "epoch": 496} {"train_loss": -19.44551658630371, "global_step": 41243, "epoch": 496} {"train_loss": -19.65479278564453, "global_step": 41244, "epoch": 496} {"train_loss": -19.18317985534668, "global_step": 41245, "epoch": 496} {"train_loss": -19.81589126586914, "global_step": 41246, "epoch": 496} {"train_loss": -19.408239364624023, "global_step": 41247, "epoch": 496} {"train_loss": -19.776508331298828, "global_step": 41248, "epoch": 496} {"train_loss": -19.398426055908203, "global_step": 41249, "epoch": 496} {"train_loss": -19.456684847912157, "global_step": 41250, "epoch": 496, "val_loss": 5972914.0} {"train_loss": -19.263385772705078, "global_step": 41251, "epoch": 497} {"train_loss": -19.547626495361328, "global_step": 41252, "epoch": 497} {"train_loss": -19.687841415405273, "global_step": 41253, "epoch": 497} {"train_loss": -19.899343490600586, "global_step": 41254, "epoch": 497} {"train_loss": -19.383193969726562, "global_step": 41255, "epoch": 497} {"train_loss": -19.296356201171875, "global_step": 41256, "epoch": 497} {"train_loss": -19.89716148376465, "global_step": 41257, "epoch": 497} {"train_loss": -19.067113876342773, "global_step": 41258, "epoch": 497} {"train_loss": -19.245214462280273, "global_step": 41259, "epoch": 497} {"train_loss": -19.18089485168457, "global_step": 41260, "epoch": 497} {"train_loss": -19.325769424438477, "global_step": 41261, "epoch": 497} {"train_loss": -19.273330688476562, "global_step": 41262, "epoch": 497} {"train_loss": -19.261381149291992, "global_step": 41263, "epoch": 497} {"train_loss": -19.369232177734375, "global_step": 41264, "epoch": 497} {"train_loss": -19.60379409790039, "global_step": 41265, "epoch": 497} {"train_loss": -19.66376304626465, "global_step": 41266, "epoch": 497} {"train_loss": -19.671236038208008, "global_step": 41267, "epoch": 497} {"train_loss": -19.323942184448242, "global_step": 41268, "epoch": 497} {"train_loss": -19.72556495666504, "global_step": 41269, "epoch": 497} {"train_loss": -19.609031677246094, "global_step": 41270, "epoch": 497} {"train_loss": -19.445499420166016, "global_step": 41271, "epoch": 497} {"train_loss": -19.39072036743164, "global_step": 41272, "epoch": 497} {"train_loss": -19.397844314575195, "global_step": 41273, "epoch": 497} {"train_loss": -19.26503562927246, "global_step": 41274, "epoch": 497} {"train_loss": -19.6200008392334, "global_step": 41275, "epoch": 497} {"train_loss": -19.620473861694336, "global_step": 41276, "epoch": 497} {"train_loss": -19.530372619628906, "global_step": 41277, "epoch": 497} {"train_loss": -19.47281265258789, "global_step": 41278, "epoch": 497} {"train_loss": -19.93826675415039, "global_step": 41279, "epoch": 497} {"train_loss": -19.482162475585938, "global_step": 41280, "epoch": 497} {"train_loss": -19.567672729492188, "global_step": 41281, "epoch": 497} {"train_loss": -19.670597076416016, "global_step": 41282, "epoch": 497} {"train_loss": -20.074817657470703, "global_step": 41283, "epoch": 497} {"train_loss": -19.422971725463867, "global_step": 41284, "epoch": 497} {"train_loss": -19.50190544128418, "global_step": 41285, "epoch": 497} {"train_loss": -19.800926208496094, "global_step": 41286, "epoch": 497} {"train_loss": -19.427019119262695, "global_step": 41287, "epoch": 497} {"train_loss": -19.214990615844727, "global_step": 41288, "epoch": 497} {"train_loss": -19.69878387451172, "global_step": 41289, "epoch": 497} {"train_loss": -19.536752700805664, "global_step": 41290, "epoch": 497} {"train_loss": -19.503820419311523, "global_step": 41291, "epoch": 497} {"train_loss": -19.040573120117188, "global_step": 41292, "epoch": 497} {"train_loss": -19.687088012695312, "global_step": 41293, "epoch": 497} {"train_loss": -19.430761337280273, "global_step": 41294, "epoch": 497} {"train_loss": -19.661550521850586, "global_step": 41295, "epoch": 497} {"train_loss": -19.63790512084961, "global_step": 41296, "epoch": 497} {"train_loss": -19.66362762451172, "global_step": 41297, "epoch": 497} {"train_loss": -19.38945960998535, "global_step": 41298, "epoch": 497} {"train_loss": -19.575223922729492, "global_step": 41299, "epoch": 497} {"train_loss": -19.605632781982422, "global_step": 41300, "epoch": 497} {"train_loss": -19.591514587402344, "global_step": 41301, "epoch": 497} {"train_loss": -19.3476619720459, "global_step": 41302, "epoch": 497} {"train_loss": -19.62601661682129, "global_step": 41303, "epoch": 497} {"train_loss": -19.056100845336914, "global_step": 41304, "epoch": 497} {"train_loss": -19.661813735961914, "global_step": 41305, "epoch": 497} {"train_loss": -19.297216415405273, "global_step": 41306, "epoch": 497} {"train_loss": -19.473058700561523, "global_step": 41307, "epoch": 497} {"train_loss": -19.5961971282959, "global_step": 41308, "epoch": 497} {"train_loss": -19.46925926208496, "global_step": 41309, "epoch": 497} {"train_loss": -19.684785842895508, "global_step": 41310, "epoch": 497} {"train_loss": -19.626953125, "global_step": 41311, "epoch": 497} {"train_loss": -19.669986724853516, "global_step": 41312, "epoch": 497} {"train_loss": -19.472272872924805, "global_step": 41313, "epoch": 497} {"train_loss": -19.97208023071289, "global_step": 41314, "epoch": 497} {"train_loss": -19.520742416381836, "global_step": 41315, "epoch": 497} {"train_loss": -19.760271072387695, "global_step": 41316, "epoch": 497} {"train_loss": -19.323284149169922, "global_step": 41317, "epoch": 497} {"train_loss": -19.283132553100586, "global_step": 41318, "epoch": 497} {"train_loss": -19.526702880859375, "global_step": 41319, "epoch": 497} {"train_loss": -19.594436645507812, "global_step": 41320, "epoch": 497} {"train_loss": -19.482107162475586, "global_step": 41321, "epoch": 497} {"train_loss": -19.550424575805664, "global_step": 41322, "epoch": 497} {"train_loss": -19.49428939819336, "global_step": 41323, "epoch": 497} {"train_loss": -19.321365356445312, "global_step": 41324, "epoch": 497} {"train_loss": -19.460580825805664, "global_step": 41325, "epoch": 497} {"train_loss": -19.50255012512207, "global_step": 41326, "epoch": 497} {"train_loss": -19.481412887573242, "global_step": 41327, "epoch": 497} {"train_loss": -19.349151611328125, "global_step": 41328, "epoch": 497} {"train_loss": -19.65036392211914, "global_step": 41329, "epoch": 497} {"train_loss": -19.407316207885742, "global_step": 41330, "epoch": 497} {"train_loss": -19.868066787719727, "global_step": 41331, "epoch": 497} {"train_loss": -19.341171264648438, "global_step": 41332, "epoch": 497} {"train_loss": -19.522616374923523, "global_step": 41333, "epoch": 497, "val_loss": 5959803.5} {"train_loss": -18.88347816467285, "global_step": 41334, "epoch": 498} {"train_loss": -19.35753631591797, "global_step": 41335, "epoch": 498} {"train_loss": -19.50482177734375, "global_step": 41336, "epoch": 498} {"train_loss": -19.64884376525879, "global_step": 41337, "epoch": 498} {"train_loss": -19.3101806640625, "global_step": 41338, "epoch": 498} {"train_loss": -19.225008010864258, "global_step": 41339, "epoch": 498} {"train_loss": -19.593141555786133, "global_step": 41340, "epoch": 498} {"train_loss": -19.486591339111328, "global_step": 41341, "epoch": 498} {"train_loss": -19.697175979614258, "global_step": 41342, "epoch": 498} {"train_loss": -19.207582473754883, "global_step": 41343, "epoch": 498} {"train_loss": -19.794172286987305, "global_step": 41344, "epoch": 498} {"train_loss": -19.432392120361328, "global_step": 41345, "epoch": 498} {"train_loss": -19.588308334350586, "global_step": 41346, "epoch": 498} {"train_loss": -19.66928482055664, "global_step": 41347, "epoch": 498} {"train_loss": -19.207401275634766, "global_step": 41348, "epoch": 498} {"train_loss": -19.32016372680664, "global_step": 41349, "epoch": 498} {"train_loss": -19.340192794799805, "global_step": 41350, "epoch": 498} {"train_loss": -19.544946670532227, "global_step": 41351, "epoch": 498} {"train_loss": -19.271427154541016, "global_step": 41352, "epoch": 498} {"train_loss": -19.360700607299805, "global_step": 41353, "epoch": 498} {"train_loss": -19.718679428100586, "global_step": 41354, "epoch": 498} {"train_loss": -18.920162200927734, "global_step": 41355, "epoch": 498} {"train_loss": -19.398914337158203, "global_step": 41356, "epoch": 498} {"train_loss": -19.263334274291992, "global_step": 41357, "epoch": 498} {"train_loss": -19.550382614135742, "global_step": 41358, "epoch": 498} {"train_loss": -19.335697174072266, "global_step": 41359, "epoch": 498} {"train_loss": -19.548505783081055, "global_step": 41360, "epoch": 498} {"train_loss": -19.706186294555664, "global_step": 41361, "epoch": 498} {"train_loss": -19.03885841369629, "global_step": 41362, "epoch": 498} {"train_loss": -19.619775772094727, "global_step": 41363, "epoch": 498} {"train_loss": -19.294862747192383, "global_step": 41364, "epoch": 498} {"train_loss": -19.2310791015625, "global_step": 41365, "epoch": 498} {"train_loss": -19.575563430786133, "global_step": 41366, "epoch": 498} {"train_loss": -19.620824813842773, "global_step": 41367, "epoch": 498} {"train_loss": -19.357303619384766, "global_step": 41368, "epoch": 498} {"train_loss": -19.792966842651367, "global_step": 41369, "epoch": 498} {"train_loss": -19.587129592895508, "global_step": 41370, "epoch": 498} {"train_loss": -19.539459228515625, "global_step": 41371, "epoch": 498} {"train_loss": -19.439212799072266, "global_step": 41372, "epoch": 498} {"train_loss": -19.551156997680664, "global_step": 41373, "epoch": 498} {"train_loss": -19.04502296447754, "global_step": 41374, "epoch": 498} {"train_loss": -19.484445571899414, "global_step": 41375, "epoch": 498} {"train_loss": -19.743703842163086, "global_step": 41376, "epoch": 498} {"train_loss": -19.772340774536133, "global_step": 41377, "epoch": 498} {"train_loss": -19.339078903198242, "global_step": 41378, "epoch": 498} {"train_loss": -19.265701293945312, "global_step": 41379, "epoch": 498} {"train_loss": -19.663570404052734, "global_step": 41380, "epoch": 498} {"train_loss": -19.60072135925293, "global_step": 41381, "epoch": 498} {"train_loss": -19.59385871887207, "global_step": 41382, "epoch": 498} {"train_loss": -19.48472785949707, "global_step": 41383, "epoch": 498} {"train_loss": -19.43765640258789, "global_step": 41384, "epoch": 498} {"train_loss": -19.738786697387695, "global_step": 41385, "epoch": 498} {"train_loss": -19.2872314453125, "global_step": 41386, "epoch": 498} {"train_loss": -19.158056259155273, "global_step": 41387, "epoch": 498} {"train_loss": -19.62199592590332, "global_step": 41388, "epoch": 498} {"train_loss": -19.43903923034668, "global_step": 41389, "epoch": 498} {"train_loss": -19.409889221191406, "global_step": 41390, "epoch": 498} {"train_loss": -19.55097770690918, "global_step": 41391, "epoch": 498} {"train_loss": -19.334049224853516, "global_step": 41392, "epoch": 498} {"train_loss": -19.462873458862305, "global_step": 41393, "epoch": 498} {"train_loss": -19.572240829467773, "global_step": 41394, "epoch": 498} {"train_loss": -19.51017189025879, "global_step": 41395, "epoch": 498} {"train_loss": -19.475461959838867, "global_step": 41396, "epoch": 498} {"train_loss": -19.588163375854492, "global_step": 41397, "epoch": 498} {"train_loss": -19.37478256225586, "global_step": 41398, "epoch": 498} {"train_loss": -19.465744018554688, "global_step": 41399, "epoch": 498} {"train_loss": -19.566726684570312, "global_step": 41400, "epoch": 498} {"train_loss": -19.260313034057617, "global_step": 41401, "epoch": 498} {"train_loss": -19.578481674194336, "global_step": 41402, "epoch": 498} {"train_loss": -19.522418975830078, "global_step": 41403, "epoch": 498} {"train_loss": -19.331796646118164, "global_step": 41404, "epoch": 498} {"train_loss": -19.789257049560547, "global_step": 41405, "epoch": 498} {"train_loss": -19.758176803588867, "global_step": 41406, "epoch": 498} {"train_loss": -19.829084396362305, "global_step": 41407, "epoch": 498} {"train_loss": -20.040876388549805, "global_step": 41408, "epoch": 498} {"train_loss": -19.830724716186523, "global_step": 41409, "epoch": 498} {"train_loss": -19.495569229125977, "global_step": 41410, "epoch": 498} {"train_loss": -19.52091407775879, "global_step": 41411, "epoch": 498} {"train_loss": -19.39303970336914, "global_step": 41412, "epoch": 498} {"train_loss": -19.361738204956055, "global_step": 41413, "epoch": 498} {"train_loss": -19.337568283081055, "global_step": 41414, "epoch": 498} {"train_loss": -19.76624870300293, "global_step": 41415, "epoch": 498} {"train_loss": -19.472399056675922, "global_step": 41416, "epoch": 498, "val_loss": 5998370.0} {"train_loss": -19.274179458618164, "global_step": 41417, "epoch": 499} {"train_loss": -19.466747283935547, "global_step": 41418, "epoch": 499} {"train_loss": -19.788915634155273, "global_step": 41419, "epoch": 499} {"train_loss": -19.20920181274414, "global_step": 41420, "epoch": 499} {"train_loss": -19.44304847717285, "global_step": 41421, "epoch": 499} {"train_loss": -19.40826416015625, "global_step": 41422, "epoch": 499} {"train_loss": -19.4632625579834, "global_step": 41423, "epoch": 499} {"train_loss": -19.58837890625, "global_step": 41424, "epoch": 499} {"train_loss": -19.781675338745117, "global_step": 41425, "epoch": 499} {"train_loss": -19.75912857055664, "global_step": 41426, "epoch": 499} {"train_loss": -19.447778701782227, "global_step": 41427, "epoch": 499} {"train_loss": -19.469724655151367, "global_step": 41428, "epoch": 499} {"train_loss": -19.330862045288086, "global_step": 41429, "epoch": 499} {"train_loss": -19.57262420654297, "global_step": 41430, "epoch": 499} {"train_loss": -19.542404174804688, "global_step": 41431, "epoch": 499} {"train_loss": -19.564804077148438, "global_step": 41432, "epoch": 499} {"train_loss": -19.314353942871094, "global_step": 41433, "epoch": 499} {"train_loss": -19.096302032470703, "global_step": 41434, "epoch": 499} {"train_loss": -19.732221603393555, "global_step": 41435, "epoch": 499} {"train_loss": -19.177845001220703, "global_step": 41436, "epoch": 499} {"train_loss": -19.402029037475586, "global_step": 41437, "epoch": 499} {"train_loss": -19.34934425354004, "global_step": 41438, "epoch": 499} {"train_loss": -19.500192642211914, "global_step": 41439, "epoch": 499} {"train_loss": -19.71134376525879, "global_step": 41440, "epoch": 499} {"train_loss": -19.251930236816406, "global_step": 41441, "epoch": 499} {"train_loss": -19.53215980529785, "global_step": 41442, "epoch": 499} {"train_loss": -19.430219650268555, "global_step": 41443, "epoch": 499} {"train_loss": -19.527563095092773, "global_step": 41444, "epoch": 499} {"train_loss": -19.18996238708496, "global_step": 41445, "epoch": 499} {"train_loss": -19.83760643005371, "global_step": 41446, "epoch": 499} {"train_loss": -19.31183433532715, "global_step": 41447, "epoch": 499} {"train_loss": -19.581607818603516, "global_step": 41448, "epoch": 499} {"train_loss": -19.353208541870117, "global_step": 41449, "epoch": 499} {"train_loss": -19.487266540527344, "global_step": 41450, "epoch": 499} {"train_loss": -19.17725372314453, "global_step": 41451, "epoch": 499} {"train_loss": -19.664085388183594, "global_step": 41452, "epoch": 499} {"train_loss": -19.266788482666016, "global_step": 41453, "epoch": 499} {"train_loss": -19.663822174072266, "global_step": 41454, "epoch": 499} {"train_loss": -19.276235580444336, "global_step": 41455, "epoch": 499} {"train_loss": -19.608171463012695, "global_step": 41456, "epoch": 499} {"train_loss": -19.32538604736328, "global_step": 41457, "epoch": 499} {"train_loss": -19.50843048095703, "global_step": 41458, "epoch": 499} {"train_loss": -18.996952056884766, "global_step": 41459, "epoch": 499} {"train_loss": -19.65152359008789, "global_step": 41460, "epoch": 499} {"train_loss": -19.376752853393555, "global_step": 41461, "epoch": 499} {"train_loss": -19.2911376953125, "global_step": 41462, "epoch": 499} {"train_loss": -19.44801139831543, "global_step": 41463, "epoch": 499} {"train_loss": -19.853923797607422, "global_step": 41464, "epoch": 499} {"train_loss": -19.743871688842773, "global_step": 41465, "epoch": 499} {"train_loss": -19.377090454101562, "global_step": 41466, "epoch": 499} {"train_loss": -19.357160568237305, "global_step": 41467, "epoch": 499} {"train_loss": -19.36567497253418, "global_step": 41468, "epoch": 499} {"train_loss": -19.815567016601562, "global_step": 41469, "epoch": 499} {"train_loss": -19.595077514648438, "global_step": 41470, "epoch": 499} {"train_loss": -19.564970016479492, "global_step": 41471, "epoch": 499} {"train_loss": -19.296293258666992, "global_step": 41472, "epoch": 499} {"train_loss": -19.2694034576416, "global_step": 41473, "epoch": 499} {"train_loss": -19.323705673217773, "global_step": 41474, "epoch": 499} {"train_loss": -19.188676834106445, "global_step": 41475, "epoch": 499} {"train_loss": -19.97100067138672, "global_step": 41476, "epoch": 499} {"train_loss": -19.735437393188477, "global_step": 41477, "epoch": 499} {"train_loss": -19.772336959838867, "global_step": 41478, "epoch": 499} {"train_loss": -19.30314826965332, "global_step": 41479, "epoch": 499} {"train_loss": -19.595142364501953, "global_step": 41480, "epoch": 499} {"train_loss": -19.790023803710938, "global_step": 41481, "epoch": 499} {"train_loss": -19.487960815429688, "global_step": 41482, "epoch": 499} {"train_loss": -20.078950881958008, "global_step": 41483, "epoch": 499} {"train_loss": -19.886798858642578, "global_step": 41484, "epoch": 499} {"train_loss": -19.516357421875, "global_step": 41485, "epoch": 499} {"train_loss": -19.096792221069336, "global_step": 41486, "epoch": 499} {"train_loss": -19.6131591796875, "global_step": 41487, "epoch": 499} {"train_loss": -19.611055374145508, "global_step": 41488, "epoch": 499} {"train_loss": -19.480854034423828, "global_step": 41489, "epoch": 499} {"train_loss": -19.335355758666992, "global_step": 41490, "epoch": 499} {"train_loss": -19.653152465820312, "global_step": 41491, "epoch": 499} {"train_loss": -19.409549713134766, "global_step": 41492, "epoch": 499} {"train_loss": -20.02338218688965, "global_step": 41493, "epoch": 499} {"train_loss": -19.558319091796875, "global_step": 41494, "epoch": 499} {"train_loss": -19.512331008911133, "global_step": 41495, "epoch": 499} {"train_loss": -19.626819610595703, "global_step": 41496, "epoch": 499} {"train_loss": -19.818130493164062, "global_step": 41497, "epoch": 499} {"train_loss": -19.81100845336914, "global_step": 41498, "epoch": 499} {"train_loss": -19.510868807873095, "global_step": 41499, "epoch": 499, "val_loss": 5897321.0} {"train_loss": -18.75358009338379, "global_step": 41500, "epoch": 500} {"train_loss": -19.41513442993164, "global_step": 41501, "epoch": 500} {"train_loss": -19.132375717163086, "global_step": 41502, "epoch": 500} {"train_loss": -19.217304229736328, "global_step": 41503, "epoch": 500} {"train_loss": -19.5833740234375, "global_step": 41504, "epoch": 500} {"train_loss": -19.39261245727539, "global_step": 41505, "epoch": 500} {"train_loss": -19.33048439025879, "global_step": 41506, "epoch": 500} {"train_loss": -19.180402755737305, "global_step": 41507, "epoch": 500} {"train_loss": -19.360363006591797, "global_step": 41508, "epoch": 500} {"train_loss": -19.745084762573242, "global_step": 41509, "epoch": 500} {"train_loss": -19.002262115478516, "global_step": 41510, "epoch": 500} {"train_loss": -19.472890853881836, "global_step": 41511, "epoch": 500} {"train_loss": -19.723861694335938, "global_step": 41512, "epoch": 500} {"train_loss": -19.268774032592773, "global_step": 41513, "epoch": 500} {"train_loss": -19.570981979370117, "global_step": 41514, "epoch": 500} {"train_loss": -19.518896102905273, "global_step": 41515, "epoch": 500} {"train_loss": -19.555490493774414, "global_step": 41516, "epoch": 500} {"train_loss": -19.489259719848633, "global_step": 41517, "epoch": 500} {"train_loss": -19.345136642456055, "global_step": 41518, "epoch": 500} {"train_loss": -19.384817123413086, "global_step": 41519, "epoch": 500} {"train_loss": -19.772064208984375, "global_step": 41520, "epoch": 500} {"train_loss": -19.17650604248047, "global_step": 41521, "epoch": 500} {"train_loss": -19.505802154541016, "global_step": 41522, "epoch": 500} {"train_loss": -19.43935203552246, "global_step": 41523, "epoch": 500} {"train_loss": -19.507837295532227, "global_step": 41524, "epoch": 500} {"train_loss": -19.535213470458984, "global_step": 41525, "epoch": 500} {"train_loss": -19.292253494262695, "global_step": 41526, "epoch": 500} {"train_loss": -19.4296875, "global_step": 41527, "epoch": 500} {"train_loss": -19.395889282226562, "global_step": 41528, "epoch": 500} {"train_loss": -19.369125366210938, "global_step": 41529, "epoch": 500} {"train_loss": -19.685108184814453, "global_step": 41530, "epoch": 500} {"train_loss": -19.316434860229492, "global_step": 41531, "epoch": 500} {"train_loss": -19.671445846557617, "global_step": 41532, "epoch": 500} {"train_loss": -19.397342681884766, "global_step": 41533, "epoch": 500} {"train_loss": -19.331724166870117, "global_step": 41534, "epoch": 500} {"train_loss": -18.82849884033203, "global_step": 41535, "epoch": 500} {"train_loss": -19.41522789001465, "global_step": 41536, "epoch": 500} {"train_loss": -19.832517623901367, "global_step": 41537, "epoch": 500} {"train_loss": -19.720136642456055, "global_step": 41538, "epoch": 500} {"train_loss": -19.54205894470215, "global_step": 41539, "epoch": 500} {"train_loss": -19.65207862854004, "global_step": 41540, "epoch": 500} {"train_loss": -19.351516723632812, "global_step": 41541, "epoch": 500} {"train_loss": -19.753910064697266, "global_step": 41542, "epoch": 500} {"train_loss": -19.66806983947754, "global_step": 41543, "epoch": 500} {"train_loss": -19.509014129638672, "global_step": 41544, "epoch": 500} {"train_loss": -19.40645408630371, "global_step": 41545, "epoch": 500} {"train_loss": -19.693115234375, "global_step": 41546, "epoch": 500} {"train_loss": -19.247411727905273, "global_step": 41547, "epoch": 500} {"train_loss": -19.4027042388916, "global_step": 41548, "epoch": 500} {"train_loss": -19.530414581298828, "global_step": 41549, "epoch": 500} {"train_loss": -19.600046157836914, "global_step": 41550, "epoch": 500} {"train_loss": -19.44675064086914, "global_step": 41551, "epoch": 500} {"train_loss": -19.67816162109375, "global_step": 41552, "epoch": 500} {"train_loss": -19.953245162963867, "global_step": 41553, "epoch": 500} {"train_loss": -19.62400245666504, "global_step": 41554, "epoch": 500} {"train_loss": -19.338972091674805, "global_step": 41555, "epoch": 500} {"train_loss": -19.7021541595459, "global_step": 41556, "epoch": 500} {"train_loss": -19.600624084472656, "global_step": 41557, "epoch": 500} {"train_loss": -19.303970336914062, "global_step": 41558, "epoch": 500} {"train_loss": -19.204212188720703, "global_step": 41559, "epoch": 500} {"train_loss": -19.86773681640625, "global_step": 41560, "epoch": 500} {"train_loss": -19.69717025756836, "global_step": 41561, "epoch": 500} {"train_loss": -19.4353084564209, "global_step": 41562, "epoch": 500} {"train_loss": -19.504018783569336, "global_step": 41563, "epoch": 500} {"train_loss": -19.756338119506836, "global_step": 41564, "epoch": 500} {"train_loss": -19.505624771118164, "global_step": 41565, "epoch": 500} {"train_loss": -19.49657440185547, "global_step": 41566, "epoch": 500} {"train_loss": -19.718673706054688, "global_step": 41567, "epoch": 500} {"train_loss": -19.522397994995117, "global_step": 41568, "epoch": 500} {"train_loss": -19.72321128845215, "global_step": 41569, "epoch": 500} {"train_loss": -19.451297760009766, "global_step": 41570, "epoch": 500} {"train_loss": -19.457365036010742, "global_step": 41571, "epoch": 500} {"train_loss": -19.659727096557617, "global_step": 41572, "epoch": 500} {"train_loss": -19.522260665893555, "global_step": 41573, "epoch": 500} {"train_loss": -19.604799270629883, "global_step": 41574, "epoch": 500} {"train_loss": -19.58485221862793, "global_step": 41575, "epoch": 500} {"train_loss": -19.513381958007812, "global_step": 41576, "epoch": 500} {"train_loss": -19.342952728271484, "global_step": 41577, "epoch": 500} {"train_loss": -19.36505126953125, "global_step": 41578, "epoch": 500} {"train_loss": -19.13187599182129, "global_step": 41579, "epoch": 500} {"train_loss": -19.61964988708496, "global_step": 41580, "epoch": 500} {"train_loss": -19.48567008972168, "global_step": 41581, "epoch": 500} {"train_loss": -19.485534185386566, "global_step": 41582, "epoch": 500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6024330.5} {"train_loss": -19.3133602142334, "global_step": 41583, "epoch": 501} {"train_loss": -19.20157814025879, "global_step": 41584, "epoch": 501} {"train_loss": -19.110309600830078, "global_step": 41585, "epoch": 501} {"train_loss": -19.016319274902344, "global_step": 41586, "epoch": 501} {"train_loss": -19.521507263183594, "global_step": 41587, "epoch": 501} {"train_loss": -19.15431022644043, "global_step": 41588, "epoch": 501} {"train_loss": -19.416337966918945, "global_step": 41589, "epoch": 501} {"train_loss": -19.222705841064453, "global_step": 41590, "epoch": 501} {"train_loss": -18.978628158569336, "global_step": 41591, "epoch": 501} {"train_loss": -19.533193588256836, "global_step": 41592, "epoch": 501} {"train_loss": -19.28175926208496, "global_step": 41593, "epoch": 501} {"train_loss": -19.77332878112793, "global_step": 41594, "epoch": 501} {"train_loss": -19.322677612304688, "global_step": 41595, "epoch": 501} {"train_loss": -19.19662094116211, "global_step": 41596, "epoch": 501} {"train_loss": -19.537748336791992, "global_step": 41597, "epoch": 501} {"train_loss": -19.36895179748535, "global_step": 41598, "epoch": 501} {"train_loss": -19.426748275756836, "global_step": 41599, "epoch": 501} {"train_loss": -19.864482879638672, "global_step": 41600, "epoch": 501} {"train_loss": -19.44637107849121, "global_step": 41601, "epoch": 501} {"train_loss": -19.474552154541016, "global_step": 41602, "epoch": 501} {"train_loss": -19.60202407836914, "global_step": 41603, "epoch": 501} {"train_loss": -19.7192325592041, "global_step": 41604, "epoch": 501} {"train_loss": -19.683385848999023, "global_step": 41605, "epoch": 501} {"train_loss": -19.654727935791016, "global_step": 41606, "epoch": 501} {"train_loss": -19.50401496887207, "global_step": 41607, "epoch": 501} {"train_loss": -19.598352432250977, "global_step": 41608, "epoch": 501} {"train_loss": -19.611169815063477, "global_step": 41609, "epoch": 501} {"train_loss": -19.756345748901367, "global_step": 41610, "epoch": 501} {"train_loss": -19.728944778442383, "global_step": 41611, "epoch": 501} {"train_loss": -19.68037223815918, "global_step": 41612, "epoch": 501} {"train_loss": -19.63560676574707, "global_step": 41613, "epoch": 501} {"train_loss": -19.71075439453125, "global_step": 41614, "epoch": 501} {"train_loss": -19.488866806030273, "global_step": 41615, "epoch": 501} {"train_loss": -19.293981552124023, "global_step": 41616, "epoch": 501} {"train_loss": -19.391172409057617, "global_step": 41617, "epoch": 501} {"train_loss": -19.486568450927734, "global_step": 41618, "epoch": 501} {"train_loss": -19.605527877807617, "global_step": 41619, "epoch": 501} {"train_loss": -19.320234298706055, "global_step": 41620, "epoch": 501} {"train_loss": -19.704572677612305, "global_step": 41621, "epoch": 501} {"train_loss": -19.487688064575195, "global_step": 41622, "epoch": 501} {"train_loss": -18.875667572021484, "global_step": 41623, "epoch": 501} {"train_loss": -19.477169036865234, "global_step": 41624, "epoch": 501} {"train_loss": -19.543615341186523, "global_step": 41625, "epoch": 501} {"train_loss": -19.555660247802734, "global_step": 41626, "epoch": 501} {"train_loss": -19.467937469482422, "global_step": 41627, "epoch": 501} {"train_loss": -19.6867733001709, "global_step": 41628, "epoch": 501} {"train_loss": -19.841449737548828, "global_step": 41629, "epoch": 501} {"train_loss": -19.577241897583008, "global_step": 41630, "epoch": 501} {"train_loss": -19.40041160583496, "global_step": 41631, "epoch": 501} {"train_loss": -19.409088134765625, "global_step": 41632, "epoch": 501} {"train_loss": -19.363656997680664, "global_step": 41633, "epoch": 501} {"train_loss": -19.122600555419922, "global_step": 41634, "epoch": 501} {"train_loss": -19.8470401763916, "global_step": 41635, "epoch": 501} {"train_loss": -19.405567169189453, "global_step": 41636, "epoch": 501} {"train_loss": -19.939794540405273, "global_step": 41637, "epoch": 501} {"train_loss": -19.530155181884766, "global_step": 41638, "epoch": 501} {"train_loss": -19.687162399291992, "global_step": 41639, "epoch": 501} {"train_loss": -19.588706970214844, "global_step": 41640, "epoch": 501} {"train_loss": -19.853635787963867, "global_step": 41641, "epoch": 501} {"train_loss": -19.699308395385742, "global_step": 41642, "epoch": 501} {"train_loss": -19.47672462463379, "global_step": 41643, "epoch": 501} {"train_loss": -19.534040451049805, "global_step": 41644, "epoch": 501} {"train_loss": -19.45773696899414, "global_step": 41645, "epoch": 501} {"train_loss": -19.579410552978516, "global_step": 41646, "epoch": 501} {"train_loss": -19.47744369506836, "global_step": 41647, "epoch": 501} {"train_loss": -19.502498626708984, "global_step": 41648, "epoch": 501} {"train_loss": -19.3914852142334, "global_step": 41649, "epoch": 501} {"train_loss": -19.513961791992188, "global_step": 41650, "epoch": 501} {"train_loss": -19.518997192382812, "global_step": 41651, "epoch": 501} {"train_loss": -19.381986618041992, "global_step": 41652, "epoch": 501} {"train_loss": -19.54514503479004, "global_step": 41653, "epoch": 501} {"train_loss": -19.3914737701416, "global_step": 41654, "epoch": 501} {"train_loss": -19.80963134765625, "global_step": 41655, "epoch": 501} {"train_loss": -19.773038864135742, "global_step": 41656, "epoch": 501} {"train_loss": -19.584177017211914, "global_step": 41657, "epoch": 501} {"train_loss": -19.14898681640625, "global_step": 41658, "epoch": 501} {"train_loss": -19.732101440429688, "global_step": 41659, "epoch": 501} {"train_loss": -19.775054931640625, "global_step": 41660, "epoch": 501} {"train_loss": -19.50594139099121, "global_step": 41661, "epoch": 501} {"train_loss": -19.931074142456055, "global_step": 41662, "epoch": 501} {"train_loss": -19.50788688659668, "global_step": 41663, "epoch": 501} {"train_loss": -19.456663131713867, "global_step": 41664, "epoch": 501} {"train_loss": -19.500852630799073, "global_step": 41665, "epoch": 501, "val_loss": 6146136.5} {"train_loss": -19.24268913269043, "global_step": 41666, "epoch": 502} {"train_loss": -19.00205421447754, "global_step": 41667, "epoch": 502} {"train_loss": -19.074697494506836, "global_step": 41668, "epoch": 502} {"train_loss": -19.183439254760742, "global_step": 41669, "epoch": 502} {"train_loss": -19.343088150024414, "global_step": 41670, "epoch": 502} {"train_loss": -19.059322357177734, "global_step": 41671, "epoch": 502} {"train_loss": -19.275455474853516, "global_step": 41672, "epoch": 502} {"train_loss": -19.251192092895508, "global_step": 41673, "epoch": 502} {"train_loss": -19.31515884399414, "global_step": 41674, "epoch": 502} {"train_loss": -19.579877853393555, "global_step": 41675, "epoch": 502} {"train_loss": -19.028268814086914, "global_step": 41676, "epoch": 502} {"train_loss": -19.109678268432617, "global_step": 41677, "epoch": 502} {"train_loss": -18.942867279052734, "global_step": 41678, "epoch": 502} {"train_loss": -19.52869415283203, "global_step": 41679, "epoch": 502} {"train_loss": -19.559083938598633, "global_step": 41680, "epoch": 502} {"train_loss": -19.720312118530273, "global_step": 41681, "epoch": 502} {"train_loss": -19.467008590698242, "global_step": 41682, "epoch": 502} {"train_loss": -19.594467163085938, "global_step": 41683, "epoch": 502} {"train_loss": -19.760107040405273, "global_step": 41684, "epoch": 502} {"train_loss": -19.67702293395996, "global_step": 41685, "epoch": 502} {"train_loss": -19.57236671447754, "global_step": 41686, "epoch": 502} {"train_loss": -19.30957794189453, "global_step": 41687, "epoch": 502} {"train_loss": -19.198755264282227, "global_step": 41688, "epoch": 502} {"train_loss": -19.21483612060547, "global_step": 41689, "epoch": 502} {"train_loss": -19.3240966796875, "global_step": 41690, "epoch": 502} {"train_loss": -18.98855209350586, "global_step": 41691, "epoch": 502} {"train_loss": -19.421993255615234, "global_step": 41692, "epoch": 502} {"train_loss": -19.468719482421875, "global_step": 41693, "epoch": 502} {"train_loss": -19.4365291595459, "global_step": 41694, "epoch": 502} {"train_loss": -19.561750411987305, "global_step": 41695, "epoch": 502} {"train_loss": -19.664316177368164, "global_step": 41696, "epoch": 502} {"train_loss": -19.564624786376953, "global_step": 41697, "epoch": 502} {"train_loss": -19.444904327392578, "global_step": 41698, "epoch": 502} {"train_loss": -19.323591232299805, "global_step": 41699, "epoch": 502} {"train_loss": -19.303884506225586, "global_step": 41700, "epoch": 502} {"train_loss": -19.49575424194336, "global_step": 41701, "epoch": 502} {"train_loss": -19.95151710510254, "global_step": 41702, "epoch": 502} {"train_loss": -19.69654655456543, "global_step": 41703, "epoch": 502} {"train_loss": -19.897790908813477, "global_step": 41704, "epoch": 502} {"train_loss": -19.425424575805664, "global_step": 41705, "epoch": 502} {"train_loss": -19.665090560913086, "global_step": 41706, "epoch": 502} {"train_loss": -19.772052764892578, "global_step": 41707, "epoch": 502} {"train_loss": -19.47909927368164, "global_step": 41708, "epoch": 502} {"train_loss": -19.8597469329834, "global_step": 41709, "epoch": 502} {"train_loss": -19.528921127319336, "global_step": 41710, "epoch": 502} {"train_loss": -19.464384078979492, "global_step": 41711, "epoch": 502} {"train_loss": -19.41373062133789, "global_step": 41712, "epoch": 502} {"train_loss": -19.153427124023438, "global_step": 41713, "epoch": 502} {"train_loss": -20.06898307800293, "global_step": 41714, "epoch": 502} {"train_loss": -19.652647018432617, "global_step": 41715, "epoch": 502} {"train_loss": -19.329023361206055, "global_step": 41716, "epoch": 502} {"train_loss": -19.261520385742188, "global_step": 41717, "epoch": 502} {"train_loss": -19.448537826538086, "global_step": 41718, "epoch": 502} {"train_loss": -19.44664764404297, "global_step": 41719, "epoch": 502} {"train_loss": -19.72237205505371, "global_step": 41720, "epoch": 502} {"train_loss": -19.46990203857422, "global_step": 41721, "epoch": 502} {"train_loss": -19.513248443603516, "global_step": 41722, "epoch": 502} {"train_loss": -19.6927547454834, "global_step": 41723, "epoch": 502} {"train_loss": -19.53278923034668, "global_step": 41724, "epoch": 502} {"train_loss": -19.301259994506836, "global_step": 41725, "epoch": 502} {"train_loss": -19.472219467163086, "global_step": 41726, "epoch": 502} {"train_loss": -19.424001693725586, "global_step": 41727, "epoch": 502} {"train_loss": -19.450613021850586, "global_step": 41728, "epoch": 502} {"train_loss": -19.734037399291992, "global_step": 41729, "epoch": 502} {"train_loss": -19.321731567382812, "global_step": 41730, "epoch": 502} {"train_loss": -19.590078353881836, "global_step": 41731, "epoch": 502} {"train_loss": -19.72374725341797, "global_step": 41732, "epoch": 502} {"train_loss": -19.357227325439453, "global_step": 41733, "epoch": 502} {"train_loss": -19.75494956970215, "global_step": 41734, "epoch": 502} {"train_loss": -19.55629539489746, "global_step": 41735, "epoch": 502} {"train_loss": -19.549936294555664, "global_step": 41736, "epoch": 502} {"train_loss": -19.398054122924805, "global_step": 41737, "epoch": 502} {"train_loss": -19.562620162963867, "global_step": 41738, "epoch": 502} {"train_loss": -19.480396270751953, "global_step": 41739, "epoch": 502} {"train_loss": -19.790420532226562, "global_step": 41740, "epoch": 502} {"train_loss": -19.707733154296875, "global_step": 41741, "epoch": 502} {"train_loss": -19.700260162353516, "global_step": 41742, "epoch": 502} {"train_loss": -19.482316970825195, "global_step": 41743, "epoch": 502} {"train_loss": -19.521665573120117, "global_step": 41744, "epoch": 502} {"train_loss": -19.470726013183594, "global_step": 41745, "epoch": 502} {"train_loss": -19.40411376953125, "global_step": 41746, "epoch": 502} {"train_loss": -19.817642211914062, "global_step": 41747, "epoch": 502} {"train_loss": -19.48696065236287, "global_step": 41748, "epoch": 502, "val_loss": 6111219.0} {"train_loss": -19.057493209838867, "global_step": 41749, "epoch": 503} {"train_loss": -19.107330322265625, "global_step": 41750, "epoch": 503} {"train_loss": -19.191221237182617, "global_step": 41751, "epoch": 503} {"train_loss": -18.753732681274414, "global_step": 41752, "epoch": 503} {"train_loss": -19.508895874023438, "global_step": 41753, "epoch": 503} {"train_loss": -19.300548553466797, "global_step": 41754, "epoch": 503} {"train_loss": -19.065841674804688, "global_step": 41755, "epoch": 503} {"train_loss": -19.201372146606445, "global_step": 41756, "epoch": 503} {"train_loss": -19.15943717956543, "global_step": 41757, "epoch": 503} {"train_loss": -19.196762084960938, "global_step": 41758, "epoch": 503} {"train_loss": -19.1655216217041, "global_step": 41759, "epoch": 503} {"train_loss": -19.392410278320312, "global_step": 41760, "epoch": 503} {"train_loss": -18.8663387298584, "global_step": 41761, "epoch": 503} {"train_loss": -19.153379440307617, "global_step": 41762, "epoch": 503} {"train_loss": -19.30989646911621, "global_step": 41763, "epoch": 503} {"train_loss": -19.498632431030273, "global_step": 41764, "epoch": 503} {"train_loss": -19.33663558959961, "global_step": 41765, "epoch": 503} {"train_loss": -19.26529312133789, "global_step": 41766, "epoch": 503} {"train_loss": -19.316669464111328, "global_step": 41767, "epoch": 503} {"train_loss": -19.73888397216797, "global_step": 41768, "epoch": 503} {"train_loss": -19.07115364074707, "global_step": 41769, "epoch": 503} {"train_loss": -19.627540588378906, "global_step": 41770, "epoch": 503} {"train_loss": -19.181772232055664, "global_step": 41771, "epoch": 503} {"train_loss": -19.45051383972168, "global_step": 41772, "epoch": 503} {"train_loss": -19.515403747558594, "global_step": 41773, "epoch": 503} {"train_loss": -19.75343132019043, "global_step": 41774, "epoch": 503} {"train_loss": -19.309240341186523, "global_step": 41775, "epoch": 503} {"train_loss": -19.508514404296875, "global_step": 41776, "epoch": 503} {"train_loss": -19.296621322631836, "global_step": 41777, "epoch": 503} {"train_loss": -19.35232925415039, "global_step": 41778, "epoch": 503} {"train_loss": -19.711515426635742, "global_step": 41779, "epoch": 503} {"train_loss": -19.616580963134766, "global_step": 41780, "epoch": 503} {"train_loss": -19.5602970123291, "global_step": 41781, "epoch": 503} {"train_loss": -19.601083755493164, "global_step": 41782, "epoch": 503} {"train_loss": -19.373416900634766, "global_step": 41783, "epoch": 503} {"train_loss": -19.456275939941406, "global_step": 41784, "epoch": 503} {"train_loss": -19.426427841186523, "global_step": 41785, "epoch": 503} {"train_loss": -19.3875675201416, "global_step": 41786, "epoch": 503} {"train_loss": -19.5509090423584, "global_step": 41787, "epoch": 503} {"train_loss": -19.5654354095459, "global_step": 41788, "epoch": 503} {"train_loss": -19.236631393432617, "global_step": 41789, "epoch": 503} {"train_loss": -19.183137893676758, "global_step": 41790, "epoch": 503} {"train_loss": -19.673818588256836, "global_step": 41791, "epoch": 503} {"train_loss": -19.646974563598633, "global_step": 41792, "epoch": 503} {"train_loss": -19.38865089416504, "global_step": 41793, "epoch": 503} {"train_loss": -19.84666633605957, "global_step": 41794, "epoch": 503} {"train_loss": -19.752790451049805, "global_step": 41795, "epoch": 503} {"train_loss": -19.670347213745117, "global_step": 41796, "epoch": 503} {"train_loss": -19.332767486572266, "global_step": 41797, "epoch": 503} {"train_loss": -19.63739585876465, "global_step": 41798, "epoch": 503} {"train_loss": -19.537519454956055, "global_step": 41799, "epoch": 503} {"train_loss": -19.65956687927246, "global_step": 41800, "epoch": 503} {"train_loss": -19.94458770751953, "global_step": 41801, "epoch": 503} {"train_loss": -19.214542388916016, "global_step": 41802, "epoch": 503} {"train_loss": -19.351381301879883, "global_step": 41803, "epoch": 503} {"train_loss": -19.327402114868164, "global_step": 41804, "epoch": 503} {"train_loss": -19.393762588500977, "global_step": 41805, "epoch": 503} {"train_loss": -19.532135009765625, "global_step": 41806, "epoch": 503} {"train_loss": -19.452131271362305, "global_step": 41807, "epoch": 503} {"train_loss": -19.298248291015625, "global_step": 41808, "epoch": 503} {"train_loss": -19.65630531311035, "global_step": 41809, "epoch": 503} {"train_loss": -19.619150161743164, "global_step": 41810, "epoch": 503} {"train_loss": -19.776630401611328, "global_step": 41811, "epoch": 503} {"train_loss": -19.783897399902344, "global_step": 41812, "epoch": 503} {"train_loss": -19.376314163208008, "global_step": 41813, "epoch": 503} {"train_loss": -19.582700729370117, "global_step": 41814, "epoch": 503} {"train_loss": -19.300519943237305, "global_step": 41815, "epoch": 503} {"train_loss": -19.673986434936523, "global_step": 41816, "epoch": 503} {"train_loss": -19.88226890563965, "global_step": 41817, "epoch": 503} {"train_loss": -19.805639266967773, "global_step": 41818, "epoch": 503} {"train_loss": -19.443265914916992, "global_step": 41819, "epoch": 503} {"train_loss": -20.038944244384766, "global_step": 41820, "epoch": 503} {"train_loss": -19.441951751708984, "global_step": 41821, "epoch": 503} {"train_loss": -19.720365524291992, "global_step": 41822, "epoch": 503} {"train_loss": -19.4759578704834, "global_step": 41823, "epoch": 503} {"train_loss": -19.260026931762695, "global_step": 41824, "epoch": 503} {"train_loss": -19.715011596679688, "global_step": 41825, "epoch": 503} {"train_loss": -19.494766235351562, "global_step": 41826, "epoch": 503} {"train_loss": -19.11637306213379, "global_step": 41827, "epoch": 503} {"train_loss": -19.440671920776367, "global_step": 41828, "epoch": 503} {"train_loss": -19.6949405670166, "global_step": 41829, "epoch": 503} {"train_loss": -19.536605834960938, "global_step": 41830, "epoch": 503} {"train_loss": -19.45947982604245, "global_step": 41831, "epoch": 503, "val_loss": 5897306.5} {"train_loss": -19.61067771911621, "global_step": 41832, "epoch": 504} {"train_loss": -19.415359497070312, "global_step": 41833, "epoch": 504} {"train_loss": -19.268558502197266, "global_step": 41834, "epoch": 504} {"train_loss": -19.610671997070312, "global_step": 41835, "epoch": 504} {"train_loss": -19.551422119140625, "global_step": 41836, "epoch": 504} {"train_loss": -19.397598266601562, "global_step": 41837, "epoch": 504} {"train_loss": -19.484216690063477, "global_step": 41838, "epoch": 504} {"train_loss": -19.271163940429688, "global_step": 41839, "epoch": 504} {"train_loss": -19.19939613342285, "global_step": 41840, "epoch": 504} {"train_loss": -19.681808471679688, "global_step": 41841, "epoch": 504} {"train_loss": -19.68196678161621, "global_step": 41842, "epoch": 504} {"train_loss": -19.51486587524414, "global_step": 41843, "epoch": 504} {"train_loss": -19.29874610900879, "global_step": 41844, "epoch": 504} {"train_loss": -19.279953002929688, "global_step": 41845, "epoch": 504} {"train_loss": -19.86166763305664, "global_step": 41846, "epoch": 504} {"train_loss": -19.404138565063477, "global_step": 41847, "epoch": 504} {"train_loss": -19.41029167175293, "global_step": 41848, "epoch": 504} {"train_loss": -19.15125846862793, "global_step": 41849, "epoch": 504} {"train_loss": -19.299272537231445, "global_step": 41850, "epoch": 504} {"train_loss": -19.38032341003418, "global_step": 41851, "epoch": 504} {"train_loss": -19.36625862121582, "global_step": 41852, "epoch": 504} {"train_loss": -19.503690719604492, "global_step": 41853, "epoch": 504} {"train_loss": -19.581777572631836, "global_step": 41854, "epoch": 504} {"train_loss": -19.770151138305664, "global_step": 41855, "epoch": 504} {"train_loss": -19.672279357910156, "global_step": 41856, "epoch": 504} {"train_loss": -19.613779067993164, "global_step": 41857, "epoch": 504} {"train_loss": -19.17988395690918, "global_step": 41858, "epoch": 504} {"train_loss": -19.722917556762695, "global_step": 41859, "epoch": 504} {"train_loss": -19.601810455322266, "global_step": 41860, "epoch": 504} {"train_loss": -19.4739990234375, "global_step": 41861, "epoch": 504} {"train_loss": -19.46072769165039, "global_step": 41862, "epoch": 504} {"train_loss": -19.647464752197266, "global_step": 41863, "epoch": 504} {"train_loss": -19.259559631347656, "global_step": 41864, "epoch": 504} {"train_loss": -19.61138916015625, "global_step": 41865, "epoch": 504} {"train_loss": -19.80579948425293, "global_step": 41866, "epoch": 504} {"train_loss": -19.316221237182617, "global_step": 41867, "epoch": 504} {"train_loss": -19.24295997619629, "global_step": 41868, "epoch": 504} {"train_loss": -19.069852828979492, "global_step": 41869, "epoch": 504} {"train_loss": -19.607009887695312, "global_step": 41870, "epoch": 504} {"train_loss": -19.64986228942871, "global_step": 41871, "epoch": 504} {"train_loss": -19.4606876373291, "global_step": 41872, "epoch": 504} {"train_loss": -19.779504776000977, "global_step": 41873, "epoch": 504} {"train_loss": -19.5102596282959, "global_step": 41874, "epoch": 504} {"train_loss": -19.83662223815918, "global_step": 41875, "epoch": 504} {"train_loss": -19.595401763916016, "global_step": 41876, "epoch": 504} {"train_loss": -20.223800659179688, "global_step": 41877, "epoch": 504} {"train_loss": -19.545610427856445, "global_step": 41878, "epoch": 504} {"train_loss": -19.844396591186523, "global_step": 41879, "epoch": 504} {"train_loss": -19.641765594482422, "global_step": 41880, "epoch": 504} {"train_loss": -19.42481803894043, "global_step": 41881, "epoch": 504} {"train_loss": -19.691801071166992, "global_step": 41882, "epoch": 504} {"train_loss": -19.73935317993164, "global_step": 41883, "epoch": 504} {"train_loss": -19.279951095581055, "global_step": 41884, "epoch": 504} {"train_loss": -19.50579833984375, "global_step": 41885, "epoch": 504} {"train_loss": -19.887113571166992, "global_step": 41886, "epoch": 504} {"train_loss": -19.646852493286133, "global_step": 41887, "epoch": 504} {"train_loss": -19.258991241455078, "global_step": 41888, "epoch": 504} {"train_loss": -19.772216796875, "global_step": 41889, "epoch": 504} {"train_loss": -20.055578231811523, "global_step": 41890, "epoch": 504} {"train_loss": -19.094350814819336, "global_step": 41891, "epoch": 504} {"train_loss": -19.47882652282715, "global_step": 41892, "epoch": 504} {"train_loss": -19.460744857788086, "global_step": 41893, "epoch": 504} {"train_loss": -19.246152877807617, "global_step": 41894, "epoch": 504} {"train_loss": -19.6561336517334, "global_step": 41895, "epoch": 504} {"train_loss": -19.537168502807617, "global_step": 41896, "epoch": 504} {"train_loss": -19.824230194091797, "global_step": 41897, "epoch": 504} {"train_loss": -19.791839599609375, "global_step": 41898, "epoch": 504} {"train_loss": -19.5783748626709, "global_step": 41899, "epoch": 504} {"train_loss": -19.393896102905273, "global_step": 41900, "epoch": 504} {"train_loss": -19.605398178100586, "global_step": 41901, "epoch": 504} {"train_loss": -19.68244743347168, "global_step": 41902, "epoch": 504} {"train_loss": -19.491910934448242, "global_step": 41903, "epoch": 504} {"train_loss": -19.66340446472168, "global_step": 41904, "epoch": 504} {"train_loss": -19.596193313598633, "global_step": 41905, "epoch": 504} {"train_loss": -19.54829978942871, "global_step": 41906, "epoch": 504} {"train_loss": -19.66889762878418, "global_step": 41907, "epoch": 504} {"train_loss": -19.546588897705078, "global_step": 41908, "epoch": 504} {"train_loss": -19.762557983398438, "global_step": 41909, "epoch": 504} {"train_loss": -19.40285873413086, "global_step": 41910, "epoch": 504} {"train_loss": -19.323089599609375, "global_step": 41911, "epoch": 504} {"train_loss": -19.525190353393555, "global_step": 41912, "epoch": 504} {"train_loss": -19.5203857421875, "global_step": 41913, "epoch": 504} {"train_loss": -19.548808385090656, "global_step": 41914, "epoch": 504, "val_loss": 5881707.5} {"train_loss": -18.762115478515625, "global_step": 41915, "epoch": 505} {"train_loss": -19.282682418823242, "global_step": 41916, "epoch": 505} {"train_loss": -19.41292953491211, "global_step": 41917, "epoch": 505} {"train_loss": -19.170005798339844, "global_step": 41918, "epoch": 505} {"train_loss": -19.18025016784668, "global_step": 41919, "epoch": 505} {"train_loss": -19.43256187438965, "global_step": 41920, "epoch": 505} {"train_loss": -18.88343048095703, "global_step": 41921, "epoch": 505} {"train_loss": -19.250757217407227, "global_step": 41922, "epoch": 505} {"train_loss": -19.290897369384766, "global_step": 41923, "epoch": 505} {"train_loss": -19.49140739440918, "global_step": 41924, "epoch": 505} {"train_loss": -19.709707260131836, "global_step": 41925, "epoch": 505} {"train_loss": -19.693042755126953, "global_step": 41926, "epoch": 505} {"train_loss": -19.521095275878906, "global_step": 41927, "epoch": 505} {"train_loss": -19.459152221679688, "global_step": 41928, "epoch": 505} {"train_loss": -19.40767478942871, "global_step": 41929, "epoch": 505} {"train_loss": -19.563711166381836, "global_step": 41930, "epoch": 505} {"train_loss": -19.511083602905273, "global_step": 41931, "epoch": 505} {"train_loss": -19.452606201171875, "global_step": 41932, "epoch": 505} {"train_loss": -19.767044067382812, "global_step": 41933, "epoch": 505} {"train_loss": -19.685789108276367, "global_step": 41934, "epoch": 505} {"train_loss": -19.434057235717773, "global_step": 41935, "epoch": 505} {"train_loss": -19.175708770751953, "global_step": 41936, "epoch": 505} {"train_loss": -19.20538902282715, "global_step": 41937, "epoch": 505} {"train_loss": -19.560224533081055, "global_step": 41938, "epoch": 505} {"train_loss": -19.542016983032227, "global_step": 41939, "epoch": 505} {"train_loss": -19.466083526611328, "global_step": 41940, "epoch": 505} {"train_loss": -19.450681686401367, "global_step": 41941, "epoch": 505} {"train_loss": -19.25667381286621, "global_step": 41942, "epoch": 505} {"train_loss": -19.54914665222168, "global_step": 41943, "epoch": 505} {"train_loss": -19.37040138244629, "global_step": 41944, "epoch": 505} {"train_loss": -19.40763282775879, "global_step": 41945, "epoch": 505} {"train_loss": -19.83030128479004, "global_step": 41946, "epoch": 505} {"train_loss": -19.561864852905273, "global_step": 41947, "epoch": 505} {"train_loss": -19.49580955505371, "global_step": 41948, "epoch": 505} {"train_loss": -19.901304244995117, "global_step": 41949, "epoch": 505} {"train_loss": -19.840330123901367, "global_step": 41950, "epoch": 505} {"train_loss": -19.392244338989258, "global_step": 41951, "epoch": 505} {"train_loss": -19.924348831176758, "global_step": 41952, "epoch": 505} {"train_loss": -19.38754653930664, "global_step": 41953, "epoch": 505} {"train_loss": -19.34861183166504, "global_step": 41954, "epoch": 505} {"train_loss": -19.868534088134766, "global_step": 41955, "epoch": 505} {"train_loss": -19.427356719970703, "global_step": 41956, "epoch": 505} {"train_loss": -19.394886016845703, "global_step": 41957, "epoch": 505} {"train_loss": -19.6107177734375, "global_step": 41958, "epoch": 505} {"train_loss": -19.552146911621094, "global_step": 41959, "epoch": 505} {"train_loss": -19.68784523010254, "global_step": 41960, "epoch": 505} {"train_loss": -19.529233932495117, "global_step": 41961, "epoch": 505} {"train_loss": -19.694801330566406, "global_step": 41962, "epoch": 505} {"train_loss": -19.787612915039062, "global_step": 41963, "epoch": 505} {"train_loss": -20.107513427734375, "global_step": 41964, "epoch": 505} {"train_loss": -19.1710262298584, "global_step": 41965, "epoch": 505} {"train_loss": -19.55837059020996, "global_step": 41966, "epoch": 505} {"train_loss": -19.836477279663086, "global_step": 41967, "epoch": 505} {"train_loss": -20.017333984375, "global_step": 41968, "epoch": 505} {"train_loss": -19.7202205657959, "global_step": 41969, "epoch": 505} {"train_loss": -19.78028678894043, "global_step": 41970, "epoch": 505} {"train_loss": -19.1442813873291, "global_step": 41971, "epoch": 505} {"train_loss": -19.299787521362305, "global_step": 41972, "epoch": 505} {"train_loss": -19.655000686645508, "global_step": 41973, "epoch": 505} {"train_loss": -19.883764266967773, "global_step": 41974, "epoch": 505} {"train_loss": -19.059480667114258, "global_step": 41975, "epoch": 505} {"train_loss": -19.596776962280273, "global_step": 41976, "epoch": 505} {"train_loss": -19.837196350097656, "global_step": 41977, "epoch": 505} {"train_loss": -19.30323600769043, "global_step": 41978, "epoch": 505} {"train_loss": -19.522863388061523, "global_step": 41979, "epoch": 505} {"train_loss": -19.63516616821289, "global_step": 41980, "epoch": 505} {"train_loss": -19.423234939575195, "global_step": 41981, "epoch": 505} {"train_loss": -19.310401916503906, "global_step": 41982, "epoch": 505} {"train_loss": -19.751432418823242, "global_step": 41983, "epoch": 505} {"train_loss": -19.613306045532227, "global_step": 41984, "epoch": 505} {"train_loss": -19.551137924194336, "global_step": 41985, "epoch": 505} {"train_loss": -19.32614517211914, "global_step": 41986, "epoch": 505} {"train_loss": -19.36075210571289, "global_step": 41987, "epoch": 505} {"train_loss": -19.9773006439209, "global_step": 41988, "epoch": 505} {"train_loss": -19.508726119995117, "global_step": 41989, "epoch": 505} {"train_loss": -19.162429809570312, "global_step": 41990, "epoch": 505} {"train_loss": -19.615459442138672, "global_step": 41991, "epoch": 505} {"train_loss": -19.462810516357422, "global_step": 41992, "epoch": 505} {"train_loss": -19.37141990661621, "global_step": 41993, "epoch": 505} {"train_loss": -19.99723243713379, "global_step": 41994, "epoch": 505} {"train_loss": -19.703947067260742, "global_step": 41995, "epoch": 505} {"train_loss": -19.49613380432129, "global_step": 41996, "epoch": 505} {"train_loss": -19.52950852175793, "global_step": 41997, "epoch": 505, "val_loss": 6083418.5} {"train_loss": -19.45896339416504, "global_step": 41998, "epoch": 506} {"train_loss": -19.601099014282227, "global_step": 41999, "epoch": 506} {"train_loss": -19.099172592163086, "global_step": 42000, "epoch": 506} {"train_loss": -19.374244689941406, "global_step": 42001, "epoch": 506} {"train_loss": -19.23728370666504, "global_step": 42002, "epoch": 506} {"train_loss": -19.66641616821289, "global_step": 42003, "epoch": 506} {"train_loss": -18.949512481689453, "global_step": 42004, "epoch": 506} {"train_loss": -19.305391311645508, "global_step": 42005, "epoch": 506} {"train_loss": -19.639999389648438, "global_step": 42006, "epoch": 506} {"train_loss": -19.36187744140625, "global_step": 42007, "epoch": 506} {"train_loss": -19.411710739135742, "global_step": 42008, "epoch": 506} {"train_loss": -19.564184188842773, "global_step": 42009, "epoch": 506} {"train_loss": -19.644058227539062, "global_step": 42010, "epoch": 506} {"train_loss": -19.90635871887207, "global_step": 42011, "epoch": 506} {"train_loss": -19.478515625, "global_step": 42012, "epoch": 506} {"train_loss": -19.600391387939453, "global_step": 42013, "epoch": 506} {"train_loss": -19.686113357543945, "global_step": 42014, "epoch": 506} {"train_loss": -19.464595794677734, "global_step": 42015, "epoch": 506} {"train_loss": -19.376371383666992, "global_step": 42016, "epoch": 506} {"train_loss": -19.231664657592773, "global_step": 42017, "epoch": 506} {"train_loss": -19.755216598510742, "global_step": 42018, "epoch": 506} {"train_loss": -19.85127067565918, "global_step": 42019, "epoch": 506} {"train_loss": -19.43071937561035, "global_step": 42020, "epoch": 506} {"train_loss": -19.769962310791016, "global_step": 42021, "epoch": 506} {"train_loss": -19.486690521240234, "global_step": 42022, "epoch": 506} {"train_loss": -19.377431869506836, "global_step": 42023, "epoch": 506} {"train_loss": -19.48267936706543, "global_step": 42024, "epoch": 506} {"train_loss": -19.57172203063965, "global_step": 42025, "epoch": 506} {"train_loss": -19.649444580078125, "global_step": 42026, "epoch": 506} {"train_loss": -19.449365615844727, "global_step": 42027, "epoch": 506} {"train_loss": -19.762243270874023, "global_step": 42028, "epoch": 506} {"train_loss": -19.560245513916016, "global_step": 42029, "epoch": 506} {"train_loss": -19.683813095092773, "global_step": 42030, "epoch": 506} {"train_loss": -19.348188400268555, "global_step": 42031, "epoch": 506} {"train_loss": -19.2894287109375, "global_step": 42032, "epoch": 506} {"train_loss": -19.852294921875, "global_step": 42033, "epoch": 506} {"train_loss": -19.3647403717041, "global_step": 42034, "epoch": 506} {"train_loss": -19.128719329833984, "global_step": 42035, "epoch": 506} {"train_loss": -19.366392135620117, "global_step": 42036, "epoch": 506} {"train_loss": -19.427324295043945, "global_step": 42037, "epoch": 506} {"train_loss": -19.97454261779785, "global_step": 42038, "epoch": 506} {"train_loss": -19.500110626220703, "global_step": 42039, "epoch": 506} {"train_loss": -19.775768280029297, "global_step": 42040, "epoch": 506} {"train_loss": -19.43634033203125, "global_step": 42041, "epoch": 506} {"train_loss": -19.582151412963867, "global_step": 42042, "epoch": 506} {"train_loss": -19.40777587890625, "global_step": 42043, "epoch": 506} {"train_loss": -19.533952713012695, "global_step": 42044, "epoch": 506} {"train_loss": -19.71440315246582, "global_step": 42045, "epoch": 506} {"train_loss": -19.33469009399414, "global_step": 42046, "epoch": 506} {"train_loss": -19.61626625061035, "global_step": 42047, "epoch": 506} {"train_loss": -19.3682861328125, "global_step": 42048, "epoch": 506} {"train_loss": -19.591670989990234, "global_step": 42049, "epoch": 506} {"train_loss": -19.27988624572754, "global_step": 42050, "epoch": 506} {"train_loss": -19.69232940673828, "global_step": 42051, "epoch": 506} {"train_loss": -19.812366485595703, "global_step": 42052, "epoch": 506} {"train_loss": -19.678293228149414, "global_step": 42053, "epoch": 506} {"train_loss": -19.59816551208496, "global_step": 42054, "epoch": 506} {"train_loss": -19.51102638244629, "global_step": 42055, "epoch": 506} {"train_loss": -19.806228637695312, "global_step": 42056, "epoch": 506} {"train_loss": -19.77495002746582, "global_step": 42057, "epoch": 506} {"train_loss": -19.6662654876709, "global_step": 42058, "epoch": 506} {"train_loss": -19.474821090698242, "global_step": 42059, "epoch": 506} {"train_loss": -19.769001007080078, "global_step": 42060, "epoch": 506} {"train_loss": -19.89449119567871, "global_step": 42061, "epoch": 506} {"train_loss": -19.50815200805664, "global_step": 42062, "epoch": 506} {"train_loss": -19.533742904663086, "global_step": 42063, "epoch": 506} {"train_loss": -19.58576774597168, "global_step": 42064, "epoch": 506} {"train_loss": -19.574474334716797, "global_step": 42065, "epoch": 506} {"train_loss": -19.455036163330078, "global_step": 42066, "epoch": 506} {"train_loss": -19.621915817260742, "global_step": 42067, "epoch": 506} {"train_loss": -19.474058151245117, "global_step": 42068, "epoch": 506} {"train_loss": -19.91014289855957, "global_step": 42069, "epoch": 506} {"train_loss": -19.528362274169922, "global_step": 42070, "epoch": 506} {"train_loss": -19.4368953704834, "global_step": 42071, "epoch": 506} {"train_loss": -19.467334747314453, "global_step": 42072, "epoch": 506} {"train_loss": -19.27457618713379, "global_step": 42073, "epoch": 506} {"train_loss": -19.46133804321289, "global_step": 42074, "epoch": 506} {"train_loss": -19.434926986694336, "global_step": 42075, "epoch": 506} {"train_loss": -19.49913787841797, "global_step": 42076, "epoch": 506} {"train_loss": -19.49066734313965, "global_step": 42077, "epoch": 506} {"train_loss": -19.316640853881836, "global_step": 42078, "epoch": 506} {"train_loss": -19.532835006713867, "global_step": 42079, "epoch": 506} {"train_loss": -19.545106658016344, "global_step": 42080, "epoch": 506, "val_loss": 6105192.0} {"train_loss": -18.252765655517578, "global_step": 42081, "epoch": 507} {"train_loss": -19.30681610107422, "global_step": 42082, "epoch": 507} {"train_loss": -18.824575424194336, "global_step": 42083, "epoch": 507} {"train_loss": -19.310420989990234, "global_step": 42084, "epoch": 507} {"train_loss": -19.41755485534668, "global_step": 42085, "epoch": 507} {"train_loss": -19.36988067626953, "global_step": 42086, "epoch": 507} {"train_loss": -19.304433822631836, "global_step": 42087, "epoch": 507} {"train_loss": -19.196578979492188, "global_step": 42088, "epoch": 507} {"train_loss": -19.15143394470215, "global_step": 42089, "epoch": 507} {"train_loss": -19.650121688842773, "global_step": 42090, "epoch": 507} {"train_loss": -19.797163009643555, "global_step": 42091, "epoch": 507} {"train_loss": -19.17255401611328, "global_step": 42092, "epoch": 507} {"train_loss": -19.48835563659668, "global_step": 42093, "epoch": 507} {"train_loss": -19.61643409729004, "global_step": 42094, "epoch": 507} {"train_loss": -19.309112548828125, "global_step": 42095, "epoch": 507} {"train_loss": -19.4499454498291, "global_step": 42096, "epoch": 507} {"train_loss": -19.62655258178711, "global_step": 42097, "epoch": 507} {"train_loss": -19.131744384765625, "global_step": 42098, "epoch": 507} {"train_loss": -19.51985740661621, "global_step": 42099, "epoch": 507} {"train_loss": -19.655029296875, "global_step": 42100, "epoch": 507} {"train_loss": -19.896787643432617, "global_step": 42101, "epoch": 507} {"train_loss": -19.351850509643555, "global_step": 42102, "epoch": 507} {"train_loss": -19.163925170898438, "global_step": 42103, "epoch": 507} {"train_loss": -19.42373275756836, "global_step": 42104, "epoch": 507} {"train_loss": -19.692548751831055, "global_step": 42105, "epoch": 507} {"train_loss": -19.28497886657715, "global_step": 42106, "epoch": 507} {"train_loss": -19.504358291625977, "global_step": 42107, "epoch": 507} {"train_loss": -19.485950469970703, "global_step": 42108, "epoch": 507} {"train_loss": -19.107023239135742, "global_step": 42109, "epoch": 507} {"train_loss": -19.54096794128418, "global_step": 42110, "epoch": 507} {"train_loss": -19.790618896484375, "global_step": 42111, "epoch": 507} {"train_loss": -19.262496948242188, "global_step": 42112, "epoch": 507} {"train_loss": -19.780441284179688, "global_step": 42113, "epoch": 507} {"train_loss": -19.536190032958984, "global_step": 42114, "epoch": 507} {"train_loss": -19.81957244873047, "global_step": 42115, "epoch": 507} {"train_loss": -19.604177474975586, "global_step": 42116, "epoch": 507} {"train_loss": -19.64924430847168, "global_step": 42117, "epoch": 507} {"train_loss": -19.120046615600586, "global_step": 42118, "epoch": 507} {"train_loss": -19.54593276977539, "global_step": 42119, "epoch": 507} {"train_loss": -19.361013412475586, "global_step": 42120, "epoch": 507} {"train_loss": -19.64386558532715, "global_step": 42121, "epoch": 507} {"train_loss": -19.390493392944336, "global_step": 42122, "epoch": 507} {"train_loss": -19.780088424682617, "global_step": 42123, "epoch": 507} {"train_loss": -19.200613021850586, "global_step": 42124, "epoch": 507} {"train_loss": -19.542648315429688, "global_step": 42125, "epoch": 507} {"train_loss": -19.695676803588867, "global_step": 42126, "epoch": 507} {"train_loss": -19.515241622924805, "global_step": 42127, "epoch": 507} {"train_loss": -19.623010635375977, "global_step": 42128, "epoch": 507} {"train_loss": -19.458322525024414, "global_step": 42129, "epoch": 507} {"train_loss": -19.139677047729492, "global_step": 42130, "epoch": 507} {"train_loss": -19.63358497619629, "global_step": 42131, "epoch": 507} {"train_loss": -19.30963134765625, "global_step": 42132, "epoch": 507} {"train_loss": -19.274580001831055, "global_step": 42133, "epoch": 507} {"train_loss": -19.50010871887207, "global_step": 42134, "epoch": 507} {"train_loss": -19.448022842407227, "global_step": 42135, "epoch": 507} {"train_loss": -19.604177474975586, "global_step": 42136, "epoch": 507} {"train_loss": -19.425697326660156, "global_step": 42137, "epoch": 507} {"train_loss": -19.8143310546875, "global_step": 42138, "epoch": 507} {"train_loss": -19.562042236328125, "global_step": 42139, "epoch": 507} {"train_loss": -19.328413009643555, "global_step": 42140, "epoch": 507} {"train_loss": -19.440414428710938, "global_step": 42141, "epoch": 507} {"train_loss": -19.929956436157227, "global_step": 42142, "epoch": 507} {"train_loss": -19.530574798583984, "global_step": 42143, "epoch": 507} {"train_loss": -19.290014266967773, "global_step": 42144, "epoch": 507} {"train_loss": -19.790922164916992, "global_step": 42145, "epoch": 507} {"train_loss": -20.069091796875, "global_step": 42146, "epoch": 507} {"train_loss": -19.4355525970459, "global_step": 42147, "epoch": 507} {"train_loss": -19.472503662109375, "global_step": 42148, "epoch": 507} {"train_loss": -19.882169723510742, "global_step": 42149, "epoch": 507} {"train_loss": -19.23349380493164, "global_step": 42150, "epoch": 507} {"train_loss": -20.044757843017578, "global_step": 42151, "epoch": 507} {"train_loss": -19.57028579711914, "global_step": 42152, "epoch": 507} {"train_loss": -19.626712799072266, "global_step": 42153, "epoch": 507} {"train_loss": -19.625293731689453, "global_step": 42154, "epoch": 507} {"train_loss": -19.703365325927734, "global_step": 42155, "epoch": 507} {"train_loss": -18.988811492919922, "global_step": 42156, "epoch": 507} {"train_loss": -19.38065528869629, "global_step": 42157, "epoch": 507} {"train_loss": -19.71057891845703, "global_step": 42158, "epoch": 507} {"train_loss": -19.594846725463867, "global_step": 42159, "epoch": 507} {"train_loss": -19.475446701049805, "global_step": 42160, "epoch": 507} {"train_loss": -19.895601272583008, "global_step": 42161, "epoch": 507} {"train_loss": -19.740400314331055, "global_step": 42162, "epoch": 507} {"train_loss": -19.498296324029027, "global_step": 42163, "epoch": 507, "val_loss": 6045000.0} {"train_loss": -19.019556045532227, "global_step": 42164, "epoch": 508} {"train_loss": -19.447553634643555, "global_step": 42165, "epoch": 508} {"train_loss": -19.505125045776367, "global_step": 42166, "epoch": 508} {"train_loss": -19.49188804626465, "global_step": 42167, "epoch": 508} {"train_loss": -19.762815475463867, "global_step": 42168, "epoch": 508} {"train_loss": -19.311767578125, "global_step": 42169, "epoch": 508} {"train_loss": -19.220809936523438, "global_step": 42170, "epoch": 508} {"train_loss": -19.73539924621582, "global_step": 42171, "epoch": 508} {"train_loss": -19.578628540039062, "global_step": 42172, "epoch": 508} {"train_loss": -19.30936622619629, "global_step": 42173, "epoch": 508} {"train_loss": -19.24199867248535, "global_step": 42174, "epoch": 508} {"train_loss": -19.345853805541992, "global_step": 42175, "epoch": 508} {"train_loss": -19.157548904418945, "global_step": 42176, "epoch": 508} {"train_loss": -19.289709091186523, "global_step": 42177, "epoch": 508} {"train_loss": -19.37916374206543, "global_step": 42178, "epoch": 508} {"train_loss": -19.441757202148438, "global_step": 42179, "epoch": 508} {"train_loss": -19.533771514892578, "global_step": 42180, "epoch": 508} {"train_loss": -19.272192001342773, "global_step": 42181, "epoch": 508} {"train_loss": -19.552560806274414, "global_step": 42182, "epoch": 508} {"train_loss": -19.76093292236328, "global_step": 42183, "epoch": 508} {"train_loss": -19.761734008789062, "global_step": 42184, "epoch": 508} {"train_loss": -19.624099731445312, "global_step": 42185, "epoch": 508} {"train_loss": -19.499380111694336, "global_step": 42186, "epoch": 508} {"train_loss": -19.58529281616211, "global_step": 42187, "epoch": 508} {"train_loss": -19.154705047607422, "global_step": 42188, "epoch": 508} {"train_loss": -19.753759384155273, "global_step": 42189, "epoch": 508} {"train_loss": -19.872480392456055, "global_step": 42190, "epoch": 508} {"train_loss": -19.45206642150879, "global_step": 42191, "epoch": 508} {"train_loss": -19.385204315185547, "global_step": 42192, "epoch": 508} {"train_loss": -19.598228454589844, "global_step": 42193, "epoch": 508} {"train_loss": -19.54011344909668, "global_step": 42194, "epoch": 508} {"train_loss": -19.62359619140625, "global_step": 42195, "epoch": 508} {"train_loss": -19.526220321655273, "global_step": 42196, "epoch": 508} {"train_loss": -19.42083740234375, "global_step": 42197, "epoch": 508} {"train_loss": -19.59036636352539, "global_step": 42198, "epoch": 508} {"train_loss": -19.580352783203125, "global_step": 42199, "epoch": 508} {"train_loss": -19.538972854614258, "global_step": 42200, "epoch": 508} {"train_loss": -19.73951530456543, "global_step": 42201, "epoch": 508} {"train_loss": -19.79817771911621, "global_step": 42202, "epoch": 508} {"train_loss": -19.492841720581055, "global_step": 42203, "epoch": 508} {"train_loss": -19.627111434936523, "global_step": 42204, "epoch": 508} {"train_loss": -19.545190811157227, "global_step": 42205, "epoch": 508} {"train_loss": -19.615070343017578, "global_step": 42206, "epoch": 508} {"train_loss": -19.50522232055664, "global_step": 42207, "epoch": 508} {"train_loss": -19.714120864868164, "global_step": 42208, "epoch": 508} {"train_loss": -19.711997985839844, "global_step": 42209, "epoch": 508} {"train_loss": -19.517053604125977, "global_step": 42210, "epoch": 508} {"train_loss": -19.446523666381836, "global_step": 42211, "epoch": 508} {"train_loss": -19.70735740661621, "global_step": 42212, "epoch": 508} {"train_loss": -19.467416763305664, "global_step": 42213, "epoch": 508} {"train_loss": -19.838979721069336, "global_step": 42214, "epoch": 508} {"train_loss": -19.582504272460938, "global_step": 42215, "epoch": 508} {"train_loss": -19.751001358032227, "global_step": 42216, "epoch": 508} {"train_loss": -19.553625106811523, "global_step": 42217, "epoch": 508} {"train_loss": -19.553518295288086, "global_step": 42218, "epoch": 508} {"train_loss": -19.589237213134766, "global_step": 42219, "epoch": 508} {"train_loss": -19.268869400024414, "global_step": 42220, "epoch": 508} {"train_loss": -19.480077743530273, "global_step": 42221, "epoch": 508} {"train_loss": -19.845746994018555, "global_step": 42222, "epoch": 508} {"train_loss": -19.634244918823242, "global_step": 42223, "epoch": 508} {"train_loss": -19.599689483642578, "global_step": 42224, "epoch": 508} {"train_loss": -19.292272567749023, "global_step": 42225, "epoch": 508} {"train_loss": -19.74608039855957, "global_step": 42226, "epoch": 508} {"train_loss": -19.7070255279541, "global_step": 42227, "epoch": 508} {"train_loss": -19.647947311401367, "global_step": 42228, "epoch": 508} {"train_loss": -19.250394821166992, "global_step": 42229, "epoch": 508} {"train_loss": -19.4547061920166, "global_step": 42230, "epoch": 508} {"train_loss": -19.415538787841797, "global_step": 42231, "epoch": 508} {"train_loss": -19.465396881103516, "global_step": 42232, "epoch": 508} {"train_loss": -19.44635772705078, "global_step": 42233, "epoch": 508} {"train_loss": -19.770675659179688, "global_step": 42234, "epoch": 508} {"train_loss": -19.5314998626709, "global_step": 42235, "epoch": 508} {"train_loss": -19.384326934814453, "global_step": 42236, "epoch": 508} {"train_loss": -19.43516731262207, "global_step": 42237, "epoch": 508} {"train_loss": -19.65920066833496, "global_step": 42238, "epoch": 508} {"train_loss": -19.482812881469727, "global_step": 42239, "epoch": 508} {"train_loss": -19.703567504882812, "global_step": 42240, "epoch": 508} {"train_loss": -19.21359634399414, "global_step": 42241, "epoch": 508} {"train_loss": -19.701566696166992, "global_step": 42242, "epoch": 508} {"train_loss": -19.826446533203125, "global_step": 42243, "epoch": 508} {"train_loss": -19.499286651611328, "global_step": 42244, "epoch": 508} {"train_loss": -19.380842208862305, "global_step": 42245, "epoch": 508} {"train_loss": -19.531282999429358, "global_step": 42246, "epoch": 508, "val_loss": 6002576.5} {"train_loss": -19.039785385131836, "global_step": 42247, "epoch": 509} {"train_loss": -19.49259376525879, "global_step": 42248, "epoch": 509} {"train_loss": -19.358564376831055, "global_step": 42249, "epoch": 509} {"train_loss": -19.457469940185547, "global_step": 42250, "epoch": 509} {"train_loss": -19.448251724243164, "global_step": 42251, "epoch": 509} {"train_loss": -19.443235397338867, "global_step": 42252, "epoch": 509} {"train_loss": -19.500070571899414, "global_step": 42253, "epoch": 509} {"train_loss": -19.253583908081055, "global_step": 42254, "epoch": 509} {"train_loss": -19.64485740661621, "global_step": 42255, "epoch": 509} {"train_loss": -19.136226654052734, "global_step": 42256, "epoch": 509} {"train_loss": -19.085206985473633, "global_step": 42257, "epoch": 509} {"train_loss": -19.565353393554688, "global_step": 42258, "epoch": 509} {"train_loss": -19.216787338256836, "global_step": 42259, "epoch": 509} {"train_loss": -19.636716842651367, "global_step": 42260, "epoch": 509} {"train_loss": -19.392560958862305, "global_step": 42261, "epoch": 509} {"train_loss": -19.391206741333008, "global_step": 42262, "epoch": 509} {"train_loss": -19.60362434387207, "global_step": 42263, "epoch": 509} {"train_loss": -19.49831199645996, "global_step": 42264, "epoch": 509} {"train_loss": -19.404945373535156, "global_step": 42265, "epoch": 509} {"train_loss": -19.487598419189453, "global_step": 42266, "epoch": 509} {"train_loss": -19.642261505126953, "global_step": 42267, "epoch": 509} {"train_loss": -19.397525787353516, "global_step": 42268, "epoch": 509} {"train_loss": -19.57686424255371, "global_step": 42269, "epoch": 509} {"train_loss": -19.741207122802734, "global_step": 42270, "epoch": 509} {"train_loss": -19.290494918823242, "global_step": 42271, "epoch": 509} {"train_loss": -19.454885482788086, "global_step": 42272, "epoch": 509} {"train_loss": -19.28786277770996, "global_step": 42273, "epoch": 509} {"train_loss": -19.73762321472168, "global_step": 42274, "epoch": 509} {"train_loss": -19.028766632080078, "global_step": 42275, "epoch": 509} {"train_loss": -19.449251174926758, "global_step": 42276, "epoch": 509} {"train_loss": -20.17720603942871, "global_step": 42277, "epoch": 509} {"train_loss": -19.556716918945312, "global_step": 42278, "epoch": 509} {"train_loss": -19.53050422668457, "global_step": 42279, "epoch": 509} {"train_loss": -19.689449310302734, "global_step": 42280, "epoch": 509} {"train_loss": -19.64423179626465, "global_step": 42281, "epoch": 509} {"train_loss": -19.51494789123535, "global_step": 42282, "epoch": 509} {"train_loss": -19.76199722290039, "global_step": 42283, "epoch": 509} {"train_loss": -19.600412368774414, "global_step": 42284, "epoch": 509} {"train_loss": -19.4934139251709, "global_step": 42285, "epoch": 509} {"train_loss": -19.761171340942383, "global_step": 42286, "epoch": 509} {"train_loss": -19.45339584350586, "global_step": 42287, "epoch": 509} {"train_loss": -19.5542049407959, "global_step": 42288, "epoch": 509} {"train_loss": -19.5947322845459, "global_step": 42289, "epoch": 509} {"train_loss": -19.470937728881836, "global_step": 42290, "epoch": 509} {"train_loss": -19.459226608276367, "global_step": 42291, "epoch": 509} {"train_loss": -19.61993408203125, "global_step": 42292, "epoch": 509} {"train_loss": -19.40070915222168, "global_step": 42293, "epoch": 509} {"train_loss": -19.7177734375, "global_step": 42294, "epoch": 509} {"train_loss": -19.76335906982422, "global_step": 42295, "epoch": 509} {"train_loss": -20.015321731567383, "global_step": 42296, "epoch": 509} {"train_loss": -19.51056671142578, "global_step": 42297, "epoch": 509} {"train_loss": -19.486459732055664, "global_step": 42298, "epoch": 509} {"train_loss": -19.967222213745117, "global_step": 42299, "epoch": 509} {"train_loss": -19.57562828063965, "global_step": 42300, "epoch": 509} {"train_loss": -19.6418399810791, "global_step": 42301, "epoch": 509} {"train_loss": -19.705509185791016, "global_step": 42302, "epoch": 509} {"train_loss": -19.537202835083008, "global_step": 42303, "epoch": 509} {"train_loss": -19.556432723999023, "global_step": 42304, "epoch": 509} {"train_loss": -19.1589412689209, "global_step": 42305, "epoch": 509} {"train_loss": -19.569923400878906, "global_step": 42306, "epoch": 509} {"train_loss": -19.748672485351562, "global_step": 42307, "epoch": 509} {"train_loss": -19.483007431030273, "global_step": 42308, "epoch": 509} {"train_loss": -19.415632247924805, "global_step": 42309, "epoch": 509} {"train_loss": -19.511795043945312, "global_step": 42310, "epoch": 509} {"train_loss": -19.670841217041016, "global_step": 42311, "epoch": 509} {"train_loss": -19.56268882751465, "global_step": 42312, "epoch": 509} {"train_loss": -19.710803985595703, "global_step": 42313, "epoch": 509} {"train_loss": -19.21980857849121, "global_step": 42314, "epoch": 509} {"train_loss": -19.528249740600586, "global_step": 42315, "epoch": 509} {"train_loss": -19.416366577148438, "global_step": 42316, "epoch": 509} {"train_loss": -19.52083396911621, "global_step": 42317, "epoch": 509} {"train_loss": -19.531721115112305, "global_step": 42318, "epoch": 509} {"train_loss": -19.85279655456543, "global_step": 42319, "epoch": 509} {"train_loss": -19.619754791259766, "global_step": 42320, "epoch": 509} {"train_loss": -19.335447311401367, "global_step": 42321, "epoch": 509} {"train_loss": -20.16890525817871, "global_step": 42322, "epoch": 509} {"train_loss": -19.912729263305664, "global_step": 42323, "epoch": 509} {"train_loss": -19.709440231323242, "global_step": 42324, "epoch": 509} {"train_loss": -19.593605041503906, "global_step": 42325, "epoch": 509} {"train_loss": -19.6402587890625, "global_step": 42326, "epoch": 509} {"train_loss": -19.673486709594727, "global_step": 42327, "epoch": 509} {"train_loss": -20.017757415771484, "global_step": 42328, "epoch": 509} {"train_loss": -19.54013654410121, "global_step": 42329, "epoch": 509, "val_loss": 5923861.0} {"train_loss": -18.969099044799805, "global_step": 42330, "epoch": 510} {"train_loss": -19.487112045288086, "global_step": 42331, "epoch": 510} {"train_loss": -19.57659912109375, "global_step": 42332, "epoch": 510} {"train_loss": -19.440584182739258, "global_step": 42333, "epoch": 510} {"train_loss": -19.29718017578125, "global_step": 42334, "epoch": 510} {"train_loss": -19.116573333740234, "global_step": 42335, "epoch": 510} {"train_loss": -19.257659912109375, "global_step": 42336, "epoch": 510} {"train_loss": -19.210586547851562, "global_step": 42337, "epoch": 510} {"train_loss": -19.490392684936523, "global_step": 42338, "epoch": 510} {"train_loss": -19.63545036315918, "global_step": 42339, "epoch": 510} {"train_loss": -19.68735122680664, "global_step": 42340, "epoch": 510} {"train_loss": -19.674596786499023, "global_step": 42341, "epoch": 510} {"train_loss": -19.223834991455078, "global_step": 42342, "epoch": 510} {"train_loss": -19.71296501159668, "global_step": 42343, "epoch": 510} {"train_loss": -19.642419815063477, "global_step": 42344, "epoch": 510} {"train_loss": -19.715103149414062, "global_step": 42345, "epoch": 510} {"train_loss": -19.269180297851562, "global_step": 42346, "epoch": 510} {"train_loss": -19.38983726501465, "global_step": 42347, "epoch": 510} {"train_loss": -19.496740341186523, "global_step": 42348, "epoch": 510} {"train_loss": -19.610702514648438, "global_step": 42349, "epoch": 510} {"train_loss": -19.431943893432617, "global_step": 42350, "epoch": 510} {"train_loss": -19.809297561645508, "global_step": 42351, "epoch": 510} {"train_loss": -19.461088180541992, "global_step": 42352, "epoch": 510} {"train_loss": -19.568693161010742, "global_step": 42353, "epoch": 510} {"train_loss": -19.513015747070312, "global_step": 42354, "epoch": 510} {"train_loss": -19.67776107788086, "global_step": 42355, "epoch": 510} {"train_loss": -19.502750396728516, "global_step": 42356, "epoch": 510} {"train_loss": -19.548810958862305, "global_step": 42357, "epoch": 510} {"train_loss": -19.502304077148438, "global_step": 42358, "epoch": 510} {"train_loss": -19.69085121154785, "global_step": 42359, "epoch": 510} {"train_loss": -19.515094757080078, "global_step": 42360, "epoch": 510} {"train_loss": -19.829097747802734, "global_step": 42361, "epoch": 510} {"train_loss": -18.9345760345459, "global_step": 42362, "epoch": 510} {"train_loss": -19.299610137939453, "global_step": 42363, "epoch": 510} {"train_loss": -19.62657356262207, "global_step": 42364, "epoch": 510} {"train_loss": -19.446203231811523, "global_step": 42365, "epoch": 510} {"train_loss": -19.221176147460938, "global_step": 42366, "epoch": 510} {"train_loss": -19.591690063476562, "global_step": 42367, "epoch": 510} {"train_loss": -19.652080535888672, "global_step": 42368, "epoch": 510} {"train_loss": -19.724225997924805, "global_step": 42369, "epoch": 510} {"train_loss": -19.497081756591797, "global_step": 42370, "epoch": 510} {"train_loss": -19.766096115112305, "global_step": 42371, "epoch": 510} {"train_loss": -19.64190673828125, "global_step": 42372, "epoch": 510} {"train_loss": -19.29820442199707, "global_step": 42373, "epoch": 510} {"train_loss": -19.824838638305664, "global_step": 42374, "epoch": 510} {"train_loss": -19.416784286499023, "global_step": 42375, "epoch": 510} {"train_loss": -19.58147621154785, "global_step": 42376, "epoch": 510} {"train_loss": -19.760358810424805, "global_step": 42377, "epoch": 510} {"train_loss": -19.150283813476562, "global_step": 42378, "epoch": 510} {"train_loss": -19.691328048706055, "global_step": 42379, "epoch": 510} {"train_loss": -19.614221572875977, "global_step": 42380, "epoch": 510} {"train_loss": -19.5706844329834, "global_step": 42381, "epoch": 510} {"train_loss": -19.124319076538086, "global_step": 42382, "epoch": 510} {"train_loss": -19.480117797851562, "global_step": 42383, "epoch": 510} {"train_loss": -19.385908126831055, "global_step": 42384, "epoch": 510} {"train_loss": -19.7589054107666, "global_step": 42385, "epoch": 510} {"train_loss": -19.539793014526367, "global_step": 42386, "epoch": 510} {"train_loss": -19.243589401245117, "global_step": 42387, "epoch": 510} {"train_loss": -19.735363006591797, "global_step": 42388, "epoch": 510} {"train_loss": -19.57912254333496, "global_step": 42389, "epoch": 510} {"train_loss": -19.686861038208008, "global_step": 42390, "epoch": 510} {"train_loss": -19.217283248901367, "global_step": 42391, "epoch": 510} {"train_loss": -19.976898193359375, "global_step": 42392, "epoch": 510} {"train_loss": -19.8262882232666, "global_step": 42393, "epoch": 510} {"train_loss": -19.6837158203125, "global_step": 42394, "epoch": 510} {"train_loss": -19.54561424255371, "global_step": 42395, "epoch": 510} {"train_loss": -19.710844039916992, "global_step": 42396, "epoch": 510} {"train_loss": -19.51910972595215, "global_step": 42397, "epoch": 510} {"train_loss": -19.662900924682617, "global_step": 42398, "epoch": 510} {"train_loss": -19.26836585998535, "global_step": 42399, "epoch": 510} {"train_loss": -19.461843490600586, "global_step": 42400, "epoch": 510} {"train_loss": -19.902700424194336, "global_step": 42401, "epoch": 510} {"train_loss": -19.526947021484375, "global_step": 42402, "epoch": 510} {"train_loss": -19.593597412109375, "global_step": 42403, "epoch": 510} {"train_loss": -19.739700317382812, "global_step": 42404, "epoch": 510} {"train_loss": -19.375900268554688, "global_step": 42405, "epoch": 510} {"train_loss": -19.320714950561523, "global_step": 42406, "epoch": 510} {"train_loss": -19.52142906188965, "global_step": 42407, "epoch": 510} {"train_loss": -19.57904624938965, "global_step": 42408, "epoch": 510} {"train_loss": -19.41082191467285, "global_step": 42409, "epoch": 510} {"train_loss": -19.21717071533203, "global_step": 42410, "epoch": 510} {"train_loss": -19.809293746948242, "global_step": 42411, "epoch": 510} {"train_loss": -19.53011623060847, "global_step": 42412, "epoch": 510, "val_loss": 5967676.5} {"train_loss": -19.293489456176758, "global_step": 42413, "epoch": 511} {"train_loss": -19.45549774169922, "global_step": 42414, "epoch": 511} {"train_loss": -19.428085327148438, "global_step": 42415, "epoch": 511} {"train_loss": -19.18159294128418, "global_step": 42416, "epoch": 511} {"train_loss": -19.427427291870117, "global_step": 42417, "epoch": 511} {"train_loss": -19.227994918823242, "global_step": 42418, "epoch": 511} {"train_loss": -19.097990036010742, "global_step": 42419, "epoch": 511} {"train_loss": -19.260997772216797, "global_step": 42420, "epoch": 511} {"train_loss": -19.577205657958984, "global_step": 42421, "epoch": 511} {"train_loss": -19.28671646118164, "global_step": 42422, "epoch": 511} {"train_loss": -19.482620239257812, "global_step": 42423, "epoch": 511} {"train_loss": -19.850671768188477, "global_step": 42424, "epoch": 511} {"train_loss": -19.34968376159668, "global_step": 42425, "epoch": 511} {"train_loss": -19.603675842285156, "global_step": 42426, "epoch": 511} {"train_loss": -19.213970184326172, "global_step": 42427, "epoch": 511} {"train_loss": -19.676403045654297, "global_step": 42428, "epoch": 511} {"train_loss": -19.673583984375, "global_step": 42429, "epoch": 511} {"train_loss": -19.731000900268555, "global_step": 42430, "epoch": 511} {"train_loss": -19.37568473815918, "global_step": 42431, "epoch": 511} {"train_loss": -19.503101348876953, "global_step": 42432, "epoch": 511} {"train_loss": -19.432926177978516, "global_step": 42433, "epoch": 511} {"train_loss": -19.62031364440918, "global_step": 42434, "epoch": 511} {"train_loss": -19.545148849487305, "global_step": 42435, "epoch": 511} {"train_loss": -19.86207389831543, "global_step": 42436, "epoch": 511} {"train_loss": -19.49702262878418, "global_step": 42437, "epoch": 511} {"train_loss": -19.867761611938477, "global_step": 42438, "epoch": 511} {"train_loss": -19.42307472229004, "global_step": 42439, "epoch": 511} {"train_loss": -19.47510528564453, "global_step": 42440, "epoch": 511} {"train_loss": -19.95411491394043, "global_step": 42441, "epoch": 511} {"train_loss": -19.506210327148438, "global_step": 42442, "epoch": 511} {"train_loss": -19.426288604736328, "global_step": 42443, "epoch": 511} {"train_loss": -19.6601505279541, "global_step": 42444, "epoch": 511} {"train_loss": -19.726730346679688, "global_step": 42445, "epoch": 511} {"train_loss": -19.71443748474121, "global_step": 42446, "epoch": 511} {"train_loss": -19.548425674438477, "global_step": 42447, "epoch": 511} {"train_loss": -19.80130958557129, "global_step": 42448, "epoch": 511} {"train_loss": -19.366987228393555, "global_step": 42449, "epoch": 511} {"train_loss": -19.608055114746094, "global_step": 42450, "epoch": 511} {"train_loss": -19.64641761779785, "global_step": 42451, "epoch": 511} {"train_loss": -19.276243209838867, "global_step": 42452, "epoch": 511} {"train_loss": -19.532114028930664, "global_step": 42453, "epoch": 511} {"train_loss": -19.5267333984375, "global_step": 42454, "epoch": 511} {"train_loss": -19.609683990478516, "global_step": 42455, "epoch": 511} {"train_loss": -19.37762451171875, "global_step": 42456, "epoch": 511} {"train_loss": -19.497756958007812, "global_step": 42457, "epoch": 511} {"train_loss": -19.6030216217041, "global_step": 42458, "epoch": 511} {"train_loss": -19.60264015197754, "global_step": 42459, "epoch": 511} {"train_loss": -19.54290008544922, "global_step": 42460, "epoch": 511} {"train_loss": -19.356063842773438, "global_step": 42461, "epoch": 511} {"train_loss": -19.511112213134766, "global_step": 42462, "epoch": 511} {"train_loss": -19.6346435546875, "global_step": 42463, "epoch": 511} {"train_loss": -19.7968692779541, "global_step": 42464, "epoch": 511} {"train_loss": -19.62000846862793, "global_step": 42465, "epoch": 511} {"train_loss": -19.3665714263916, "global_step": 42466, "epoch": 511} {"train_loss": -19.680021286010742, "global_step": 42467, "epoch": 511} {"train_loss": -19.56427574157715, "global_step": 42468, "epoch": 511} {"train_loss": -19.7230281829834, "global_step": 42469, "epoch": 511} {"train_loss": -19.65867805480957, "global_step": 42470, "epoch": 511} {"train_loss": -19.54328727722168, "global_step": 42471, "epoch": 511} {"train_loss": -19.576581954956055, "global_step": 42472, "epoch": 511} {"train_loss": -19.729127883911133, "global_step": 42473, "epoch": 511} {"train_loss": -19.84815788269043, "global_step": 42474, "epoch": 511} {"train_loss": -19.618711471557617, "global_step": 42475, "epoch": 511} {"train_loss": -19.49747657775879, "global_step": 42476, "epoch": 511} {"train_loss": -19.21491241455078, "global_step": 42477, "epoch": 511} {"train_loss": -19.504323959350586, "global_step": 42478, "epoch": 511} {"train_loss": -19.550119400024414, "global_step": 42479, "epoch": 511} {"train_loss": -19.695905685424805, "global_step": 42480, "epoch": 511} {"train_loss": -19.690677642822266, "global_step": 42481, "epoch": 511} {"train_loss": -19.69353675842285, "global_step": 42482, "epoch": 511} {"train_loss": -19.985843658447266, "global_step": 42483, "epoch": 511} {"train_loss": -19.57668685913086, "global_step": 42484, "epoch": 511} {"train_loss": -19.736543655395508, "global_step": 42485, "epoch": 511} {"train_loss": -19.460519790649414, "global_step": 42486, "epoch": 511} {"train_loss": -19.773056030273438, "global_step": 42487, "epoch": 511} {"train_loss": -19.384361267089844, "global_step": 42488, "epoch": 511} {"train_loss": -19.26205825805664, "global_step": 42489, "epoch": 511} {"train_loss": -19.671049118041992, "global_step": 42490, "epoch": 511} {"train_loss": -19.549701690673828, "global_step": 42491, "epoch": 511} {"train_loss": -19.352006912231445, "global_step": 42492, "epoch": 511} {"train_loss": -19.660146713256836, "global_step": 42493, "epoch": 511} {"train_loss": -19.260128021240234, "global_step": 42494, "epoch": 511} {"train_loss": -19.528741721647332, "global_step": 42495, "epoch": 511, "val_loss": 6084584.0} {"train_loss": -19.631847381591797, "global_step": 42496, "epoch": 512} {"train_loss": -19.003482818603516, "global_step": 42497, "epoch": 512} {"train_loss": -19.37112808227539, "global_step": 42498, "epoch": 512} {"train_loss": -19.32533836364746, "global_step": 42499, "epoch": 512} {"train_loss": -19.620426177978516, "global_step": 42500, "epoch": 512} {"train_loss": -19.58401870727539, "global_step": 42501, "epoch": 512} {"train_loss": -19.324552536010742, "global_step": 42502, "epoch": 512} {"train_loss": -19.583486557006836, "global_step": 42503, "epoch": 512} {"train_loss": -19.287158966064453, "global_step": 42504, "epoch": 512} {"train_loss": -19.3527889251709, "global_step": 42505, "epoch": 512} {"train_loss": -19.497329711914062, "global_step": 42506, "epoch": 512} {"train_loss": -19.802419662475586, "global_step": 42507, "epoch": 512} {"train_loss": -19.564332962036133, "global_step": 42508, "epoch": 512} {"train_loss": -19.8044376373291, "global_step": 42509, "epoch": 512} {"train_loss": -19.571508407592773, "global_step": 42510, "epoch": 512} {"train_loss": -19.2473201751709, "global_step": 42511, "epoch": 512} {"train_loss": -19.196386337280273, "global_step": 42512, "epoch": 512} {"train_loss": -19.368316650390625, "global_step": 42513, "epoch": 512} {"train_loss": -19.821144104003906, "global_step": 42514, "epoch": 512} {"train_loss": -19.154666900634766, "global_step": 42515, "epoch": 512} {"train_loss": -19.4908390045166, "global_step": 42516, "epoch": 512} {"train_loss": -19.459131240844727, "global_step": 42517, "epoch": 512} {"train_loss": -19.678150177001953, "global_step": 42518, "epoch": 512} {"train_loss": -19.607791900634766, "global_step": 42519, "epoch": 512} {"train_loss": -19.41851234436035, "global_step": 42520, "epoch": 512} {"train_loss": -19.182931900024414, "global_step": 42521, "epoch": 512} {"train_loss": -19.556137084960938, "global_step": 42522, "epoch": 512} {"train_loss": -19.459882736206055, "global_step": 42523, "epoch": 512} {"train_loss": -19.897085189819336, "global_step": 42524, "epoch": 512} {"train_loss": -19.859134674072266, "global_step": 42525, "epoch": 512} {"train_loss": -19.641315460205078, "global_step": 42526, "epoch": 512} {"train_loss": -19.43855857849121, "global_step": 42527, "epoch": 512} {"train_loss": -19.322824478149414, "global_step": 42528, "epoch": 512} {"train_loss": -19.678913116455078, "global_step": 42529, "epoch": 512} {"train_loss": -19.823766708374023, "global_step": 42530, "epoch": 512} {"train_loss": -19.85029411315918, "global_step": 42531, "epoch": 512} {"train_loss": -19.71673583984375, "global_step": 42532, "epoch": 512} {"train_loss": -19.755353927612305, "global_step": 42533, "epoch": 512} {"train_loss": -19.678415298461914, "global_step": 42534, "epoch": 512} {"train_loss": -19.26568603515625, "global_step": 42535, "epoch": 512} {"train_loss": -19.636442184448242, "global_step": 42536, "epoch": 512} {"train_loss": -19.437545776367188, "global_step": 42537, "epoch": 512} {"train_loss": -19.799291610717773, "global_step": 42538, "epoch": 512} {"train_loss": -19.49810791015625, "global_step": 42539, "epoch": 512} {"train_loss": -19.687740325927734, "global_step": 42540, "epoch": 512} {"train_loss": -19.610366821289062, "global_step": 42541, "epoch": 512} {"train_loss": -19.53334617614746, "global_step": 42542, "epoch": 512} {"train_loss": -19.61201286315918, "global_step": 42543, "epoch": 512} {"train_loss": -19.673070907592773, "global_step": 42544, "epoch": 512} {"train_loss": -19.786087036132812, "global_step": 42545, "epoch": 512} {"train_loss": -19.62331199645996, "global_step": 42546, "epoch": 512} {"train_loss": -19.7088680267334, "global_step": 42547, "epoch": 512} {"train_loss": -19.396833419799805, "global_step": 42548, "epoch": 512} {"train_loss": -19.958511352539062, "global_step": 42549, "epoch": 512} {"train_loss": -19.52739715576172, "global_step": 42550, "epoch": 512} {"train_loss": -19.68033218383789, "global_step": 42551, "epoch": 512} {"train_loss": -19.381370544433594, "global_step": 42552, "epoch": 512} {"train_loss": -19.649168014526367, "global_step": 42553, "epoch": 512} {"train_loss": -19.43979835510254, "global_step": 42554, "epoch": 512} {"train_loss": -19.26305389404297, "global_step": 42555, "epoch": 512} {"train_loss": -19.961076736450195, "global_step": 42556, "epoch": 512} {"train_loss": -19.623929977416992, "global_step": 42557, "epoch": 512} {"train_loss": -19.38472557067871, "global_step": 42558, "epoch": 512} {"train_loss": -19.663908004760742, "global_step": 42559, "epoch": 512} {"train_loss": -19.646543502807617, "global_step": 42560, "epoch": 512} {"train_loss": -19.650985717773438, "global_step": 42561, "epoch": 512} {"train_loss": -19.426973342895508, "global_step": 42562, "epoch": 512} {"train_loss": -19.416227340698242, "global_step": 42563, "epoch": 512} {"train_loss": -19.626155853271484, "global_step": 42564, "epoch": 512} {"train_loss": -19.36819839477539, "global_step": 42565, "epoch": 512} {"train_loss": -19.93167495727539, "global_step": 42566, "epoch": 512} {"train_loss": -19.417348861694336, "global_step": 42567, "epoch": 512} {"train_loss": -19.421903610229492, "global_step": 42568, "epoch": 512} {"train_loss": -19.4788761138916, "global_step": 42569, "epoch": 512} {"train_loss": -19.799612045288086, "global_step": 42570, "epoch": 512} {"train_loss": -19.363195419311523, "global_step": 42571, "epoch": 512} {"train_loss": -19.843799591064453, "global_step": 42572, "epoch": 512} {"train_loss": -19.676769256591797, "global_step": 42573, "epoch": 512} {"train_loss": -19.69343376159668, "global_step": 42574, "epoch": 512} {"train_loss": -19.686573028564453, "global_step": 42575, "epoch": 512} {"train_loss": -19.685321807861328, "global_step": 42576, "epoch": 512} {"train_loss": -19.72313117980957, "global_step": 42577, "epoch": 512} {"train_loss": -19.565386255103423, "global_step": 42578, "epoch": 512, "val_loss": 6207590.0} {"train_loss": -19.405603408813477, "global_step": 42579, "epoch": 513} {"train_loss": -19.29805564880371, "global_step": 42580, "epoch": 513} {"train_loss": -19.27315330505371, "global_step": 42581, "epoch": 513} {"train_loss": -19.70610809326172, "global_step": 42582, "epoch": 513} {"train_loss": -19.17893409729004, "global_step": 42583, "epoch": 513} {"train_loss": -19.564496994018555, "global_step": 42584, "epoch": 513} {"train_loss": -19.39444923400879, "global_step": 42585, "epoch": 513} {"train_loss": -19.351255416870117, "global_step": 42586, "epoch": 513} {"train_loss": -19.378768920898438, "global_step": 42587, "epoch": 513} {"train_loss": -19.23078727722168, "global_step": 42588, "epoch": 513} {"train_loss": -19.46018409729004, "global_step": 42589, "epoch": 513} {"train_loss": -19.556411743164062, "global_step": 42590, "epoch": 513} {"train_loss": -19.17542266845703, "global_step": 42591, "epoch": 513} {"train_loss": -19.57948112487793, "global_step": 42592, "epoch": 513} {"train_loss": -19.640708923339844, "global_step": 42593, "epoch": 513} {"train_loss": -19.73811912536621, "global_step": 42594, "epoch": 513} {"train_loss": -19.338735580444336, "global_step": 42595, "epoch": 513} {"train_loss": -19.56005096435547, "global_step": 42596, "epoch": 513} {"train_loss": -19.79927635192871, "global_step": 42597, "epoch": 513} {"train_loss": -19.41339111328125, "global_step": 42598, "epoch": 513} {"train_loss": -19.265851974487305, "global_step": 42599, "epoch": 513} {"train_loss": -19.325000762939453, "global_step": 42600, "epoch": 513} {"train_loss": -19.322065353393555, "global_step": 42601, "epoch": 513} {"train_loss": -19.9117431640625, "global_step": 42602, "epoch": 513} {"train_loss": -19.828964233398438, "global_step": 42603, "epoch": 513} {"train_loss": -19.467016220092773, "global_step": 42604, "epoch": 513} {"train_loss": -19.244993209838867, "global_step": 42605, "epoch": 513} {"train_loss": -19.524290084838867, "global_step": 42606, "epoch": 513} {"train_loss": -19.489694595336914, "global_step": 42607, "epoch": 513} {"train_loss": -19.766407012939453, "global_step": 42608, "epoch": 513} {"train_loss": -19.469141006469727, "global_step": 42609, "epoch": 513} {"train_loss": -19.571014404296875, "global_step": 42610, "epoch": 513} {"train_loss": -19.6322078704834, "global_step": 42611, "epoch": 513} {"train_loss": -19.68605613708496, "global_step": 42612, "epoch": 513} {"train_loss": -19.493408203125, "global_step": 42613, "epoch": 513} {"train_loss": -19.416059494018555, "global_step": 42614, "epoch": 513} {"train_loss": -19.808032989501953, "global_step": 42615, "epoch": 513} {"train_loss": -19.860153198242188, "global_step": 42616, "epoch": 513} {"train_loss": -19.485197067260742, "global_step": 42617, "epoch": 513} {"train_loss": -19.650197982788086, "global_step": 42618, "epoch": 513} {"train_loss": -19.804960250854492, "global_step": 42619, "epoch": 513} {"train_loss": -19.78969955444336, "global_step": 42620, "epoch": 513} {"train_loss": -19.632057189941406, "global_step": 42621, "epoch": 513} {"train_loss": -19.600257873535156, "global_step": 42622, "epoch": 513} {"train_loss": -19.72332191467285, "global_step": 42623, "epoch": 513} {"train_loss": -19.926441192626953, "global_step": 42624, "epoch": 513} {"train_loss": -19.320608139038086, "global_step": 42625, "epoch": 513} {"train_loss": -19.706544876098633, "global_step": 42626, "epoch": 513} {"train_loss": -19.97269058227539, "global_step": 42627, "epoch": 513} {"train_loss": -19.70816993713379, "global_step": 42628, "epoch": 513} {"train_loss": -19.772829055786133, "global_step": 42629, "epoch": 513} {"train_loss": -19.359149932861328, "global_step": 42630, "epoch": 513} {"train_loss": -19.544286727905273, "global_step": 42631, "epoch": 513} {"train_loss": -19.467926025390625, "global_step": 42632, "epoch": 513} {"train_loss": -19.660703659057617, "global_step": 42633, "epoch": 513} {"train_loss": -19.783401489257812, "global_step": 42634, "epoch": 513} {"train_loss": -19.56535530090332, "global_step": 42635, "epoch": 513} {"train_loss": -19.544031143188477, "global_step": 42636, "epoch": 513} {"train_loss": -19.061628341674805, "global_step": 42637, "epoch": 513} {"train_loss": -19.782638549804688, "global_step": 42638, "epoch": 513} {"train_loss": -19.266956329345703, "global_step": 42639, "epoch": 513} {"train_loss": -19.35945701599121, "global_step": 42640, "epoch": 513} {"train_loss": -19.37489891052246, "global_step": 42641, "epoch": 513} {"train_loss": -19.348493576049805, "global_step": 42642, "epoch": 513} {"train_loss": -19.280065536499023, "global_step": 42643, "epoch": 513} {"train_loss": -19.565982818603516, "global_step": 42644, "epoch": 513} {"train_loss": -19.735036849975586, "global_step": 42645, "epoch": 513} {"train_loss": -19.78938865661621, "global_step": 42646, "epoch": 513} {"train_loss": -19.65044593811035, "global_step": 42647, "epoch": 513} {"train_loss": -19.458879470825195, "global_step": 42648, "epoch": 513} {"train_loss": -19.52498435974121, "global_step": 42649, "epoch": 513} {"train_loss": -19.7782039642334, "global_step": 42650, "epoch": 513} {"train_loss": -19.471511840820312, "global_step": 42651, "epoch": 513} {"train_loss": -19.719144821166992, "global_step": 42652, "epoch": 513} {"train_loss": -19.541837692260742, "global_step": 42653, "epoch": 513} {"train_loss": -19.492170333862305, "global_step": 42654, "epoch": 513} {"train_loss": -19.228694915771484, "global_step": 42655, "epoch": 513} {"train_loss": -19.580312728881836, "global_step": 42656, "epoch": 513} {"train_loss": -19.33517837524414, "global_step": 42657, "epoch": 513} {"train_loss": -19.419750213623047, "global_step": 42658, "epoch": 513} {"train_loss": -19.786895751953125, "global_step": 42659, "epoch": 513} {"train_loss": -19.862064361572266, "global_step": 42660, "epoch": 513} {"train_loss": -19.52573500483869, "global_step": 42661, "epoch": 513, "val_loss": 5982489.0} {"train_loss": -18.383586883544922, "global_step": 42662, "epoch": 514} {"train_loss": -19.288589477539062, "global_step": 42663, "epoch": 514} {"train_loss": -19.425390243530273, "global_step": 42664, "epoch": 514} {"train_loss": -18.76263999938965, "global_step": 42665, "epoch": 514} {"train_loss": -19.022457122802734, "global_step": 42666, "epoch": 514} {"train_loss": -19.44774627685547, "global_step": 42667, "epoch": 514} {"train_loss": -19.38021469116211, "global_step": 42668, "epoch": 514} {"train_loss": -19.551733016967773, "global_step": 42669, "epoch": 514} {"train_loss": -19.5699405670166, "global_step": 42670, "epoch": 514} {"train_loss": -19.175710678100586, "global_step": 42671, "epoch": 514} {"train_loss": -19.48550033569336, "global_step": 42672, "epoch": 514} {"train_loss": -19.247425079345703, "global_step": 42673, "epoch": 514} {"train_loss": -18.999011993408203, "global_step": 42674, "epoch": 514} {"train_loss": -19.318151473999023, "global_step": 42675, "epoch": 514} {"train_loss": -19.230165481567383, "global_step": 42676, "epoch": 514} {"train_loss": -19.50029754638672, "global_step": 42677, "epoch": 514} {"train_loss": -19.60249137878418, "global_step": 42678, "epoch": 514} {"train_loss": -18.869361877441406, "global_step": 42679, "epoch": 514} {"train_loss": -19.718721389770508, "global_step": 42680, "epoch": 514} {"train_loss": -19.37173080444336, "global_step": 42681, "epoch": 514} {"train_loss": -19.614940643310547, "global_step": 42682, "epoch": 514} {"train_loss": -20.001203536987305, "global_step": 42683, "epoch": 514} {"train_loss": -19.685169219970703, "global_step": 42684, "epoch": 514} {"train_loss": -19.928197860717773, "global_step": 42685, "epoch": 514} {"train_loss": -19.59390640258789, "global_step": 42686, "epoch": 514} {"train_loss": -19.760427474975586, "global_step": 42687, "epoch": 514} {"train_loss": -19.92421531677246, "global_step": 42688, "epoch": 514} {"train_loss": -19.720413208007812, "global_step": 42689, "epoch": 514} {"train_loss": -19.22529411315918, "global_step": 42690, "epoch": 514} {"train_loss": -19.459455490112305, "global_step": 42691, "epoch": 514} {"train_loss": -19.399621963500977, "global_step": 42692, "epoch": 514} {"train_loss": -19.756385803222656, "global_step": 42693, "epoch": 514} {"train_loss": -19.67329216003418, "global_step": 42694, "epoch": 514} {"train_loss": -19.490386962890625, "global_step": 42695, "epoch": 514} {"train_loss": -19.797931671142578, "global_step": 42696, "epoch": 514} {"train_loss": -19.719919204711914, "global_step": 42697, "epoch": 514} {"train_loss": -19.69285011291504, "global_step": 42698, "epoch": 514} {"train_loss": -19.351016998291016, "global_step": 42699, "epoch": 514} {"train_loss": -19.391027450561523, "global_step": 42700, "epoch": 514} {"train_loss": -19.859176635742188, "global_step": 42701, "epoch": 514} {"train_loss": -19.7814998626709, "global_step": 42702, "epoch": 514} {"train_loss": -19.277936935424805, "global_step": 42703, "epoch": 514} {"train_loss": -19.711984634399414, "global_step": 42704, "epoch": 514} {"train_loss": -19.232580184936523, "global_step": 42705, "epoch": 514} {"train_loss": -19.585081100463867, "global_step": 42706, "epoch": 514} {"train_loss": -19.514066696166992, "global_step": 42707, "epoch": 514} {"train_loss": -19.516311645507812, "global_step": 42708, "epoch": 514} {"train_loss": -19.617877960205078, "global_step": 42709, "epoch": 514} {"train_loss": -19.76649284362793, "global_step": 42710, "epoch": 514} {"train_loss": -19.431257247924805, "global_step": 42711, "epoch": 514} {"train_loss": -19.69460678100586, "global_step": 42712, "epoch": 514} {"train_loss": -19.849857330322266, "global_step": 42713, "epoch": 514} {"train_loss": -19.684171676635742, "global_step": 42714, "epoch": 514} {"train_loss": -19.672414779663086, "global_step": 42715, "epoch": 514} {"train_loss": -19.756168365478516, "global_step": 42716, "epoch": 514} {"train_loss": -19.319578170776367, "global_step": 42717, "epoch": 514} {"train_loss": -19.491018295288086, "global_step": 42718, "epoch": 514} {"train_loss": -19.62056541442871, "global_step": 42719, "epoch": 514} {"train_loss": -19.72991371154785, "global_step": 42720, "epoch": 514} {"train_loss": -19.630796432495117, "global_step": 42721, "epoch": 514} {"train_loss": -19.74432945251465, "global_step": 42722, "epoch": 514} {"train_loss": -19.719593048095703, "global_step": 42723, "epoch": 514} {"train_loss": -19.50289535522461, "global_step": 42724, "epoch": 514} {"train_loss": -20.017366409301758, "global_step": 42725, "epoch": 514} {"train_loss": -19.460264205932617, "global_step": 42726, "epoch": 514} {"train_loss": -19.784290313720703, "global_step": 42727, "epoch": 514} {"train_loss": -19.77815055847168, "global_step": 42728, "epoch": 514} {"train_loss": -19.550090789794922, "global_step": 42729, "epoch": 514} {"train_loss": -19.425975799560547, "global_step": 42730, "epoch": 514} {"train_loss": -19.64963722229004, "global_step": 42731, "epoch": 514} {"train_loss": -20.31434440612793, "global_step": 42732, "epoch": 514} {"train_loss": -19.456480026245117, "global_step": 42733, "epoch": 514} {"train_loss": -19.78136444091797, "global_step": 42734, "epoch": 514} {"train_loss": -19.577924728393555, "global_step": 42735, "epoch": 514} {"train_loss": -19.458791732788086, "global_step": 42736, "epoch": 514} {"train_loss": -19.66248893737793, "global_step": 42737, "epoch": 514} {"train_loss": -19.679752349853516, "global_step": 42738, "epoch": 514} {"train_loss": -19.594711303710938, "global_step": 42739, "epoch": 514} {"train_loss": -19.70316505432129, "global_step": 42740, "epoch": 514} {"train_loss": -19.5192928314209, "global_step": 42741, "epoch": 514} {"train_loss": -19.321836471557617, "global_step": 42742, "epoch": 514} {"train_loss": -19.286376953125, "global_step": 42743, "epoch": 514} {"train_loss": -19.543972543923253, "global_step": 42744, "epoch": 514, "val_loss": 5917582.0} {"train_loss": -19.02605628967285, "global_step": 42745, "epoch": 515} {"train_loss": -19.297382354736328, "global_step": 42746, "epoch": 515} {"train_loss": -19.406265258789062, "global_step": 42747, "epoch": 515} {"train_loss": -19.17965316772461, "global_step": 42748, "epoch": 515} {"train_loss": -19.472314834594727, "global_step": 42749, "epoch": 515} {"train_loss": -18.666345596313477, "global_step": 42750, "epoch": 515} {"train_loss": -19.4921932220459, "global_step": 42751, "epoch": 515} {"train_loss": -19.507673263549805, "global_step": 42752, "epoch": 515} {"train_loss": -19.667890548706055, "global_step": 42753, "epoch": 515} {"train_loss": -19.331518173217773, "global_step": 42754, "epoch": 515} {"train_loss": -19.33487892150879, "global_step": 42755, "epoch": 515} {"train_loss": -19.28656005859375, "global_step": 42756, "epoch": 515} {"train_loss": -19.43941307067871, "global_step": 42757, "epoch": 515} {"train_loss": -19.423664093017578, "global_step": 42758, "epoch": 515} {"train_loss": -19.559024810791016, "global_step": 42759, "epoch": 515} {"train_loss": -19.22779655456543, "global_step": 42760, "epoch": 515} {"train_loss": -19.61969757080078, "global_step": 42761, "epoch": 515} {"train_loss": -19.70112419128418, "global_step": 42762, "epoch": 515} {"train_loss": -19.49595069885254, "global_step": 42763, "epoch": 515} {"train_loss": -19.771018981933594, "global_step": 42764, "epoch": 515} {"train_loss": -19.675586700439453, "global_step": 42765, "epoch": 515} {"train_loss": -19.547773361206055, "global_step": 42766, "epoch": 515} {"train_loss": -19.527496337890625, "global_step": 42767, "epoch": 515} {"train_loss": -19.439849853515625, "global_step": 42768, "epoch": 515} {"train_loss": -19.791601181030273, "global_step": 42769, "epoch": 515} {"train_loss": -19.484670639038086, "global_step": 42770, "epoch": 515} {"train_loss": -19.67824363708496, "global_step": 42771, "epoch": 515} {"train_loss": -19.569046020507812, "global_step": 42772, "epoch": 515} {"train_loss": -19.611820220947266, "global_step": 42773, "epoch": 515} {"train_loss": -19.43952178955078, "global_step": 42774, "epoch": 515} {"train_loss": -19.82333755493164, "global_step": 42775, "epoch": 515} {"train_loss": -19.51332664489746, "global_step": 42776, "epoch": 515} {"train_loss": -19.57192039489746, "global_step": 42777, "epoch": 515} {"train_loss": -19.56013298034668, "global_step": 42778, "epoch": 515} {"train_loss": -19.69948387145996, "global_step": 42779, "epoch": 515} {"train_loss": -19.81800651550293, "global_step": 42780, "epoch": 515} {"train_loss": -19.862892150878906, "global_step": 42781, "epoch": 515} {"train_loss": -19.362693786621094, "global_step": 42782, "epoch": 515} {"train_loss": -19.503767013549805, "global_step": 42783, "epoch": 515} {"train_loss": -19.47869873046875, "global_step": 42784, "epoch": 515} {"train_loss": -19.753217697143555, "global_step": 42785, "epoch": 515} {"train_loss": -19.3912353515625, "global_step": 42786, "epoch": 515} {"train_loss": -20.07742691040039, "global_step": 42787, "epoch": 515} {"train_loss": -19.73633575439453, "global_step": 42788, "epoch": 515} {"train_loss": -19.659500122070312, "global_step": 42789, "epoch": 515} {"train_loss": -19.518537521362305, "global_step": 42790, "epoch": 515} {"train_loss": -19.916858673095703, "global_step": 42791, "epoch": 515} {"train_loss": -19.81477928161621, "global_step": 42792, "epoch": 515} {"train_loss": -19.46764373779297, "global_step": 42793, "epoch": 515} {"train_loss": -19.534456253051758, "global_step": 42794, "epoch": 515} {"train_loss": -19.751502990722656, "global_step": 42795, "epoch": 515} {"train_loss": -19.894981384277344, "global_step": 42796, "epoch": 515} {"train_loss": -19.464323043823242, "global_step": 42797, "epoch": 515} {"train_loss": -19.4454345703125, "global_step": 42798, "epoch": 515} {"train_loss": -19.720579147338867, "global_step": 42799, "epoch": 515} {"train_loss": -19.269901275634766, "global_step": 42800, "epoch": 515} {"train_loss": -19.709243774414062, "global_step": 42801, "epoch": 515} {"train_loss": -19.834468841552734, "global_step": 42802, "epoch": 515} {"train_loss": -19.711668014526367, "global_step": 42803, "epoch": 515} {"train_loss": -19.314523696899414, "global_step": 42804, "epoch": 515} {"train_loss": -19.8126277923584, "global_step": 42805, "epoch": 515} {"train_loss": -20.011035919189453, "global_step": 42806, "epoch": 515} {"train_loss": -19.826858520507812, "global_step": 42807, "epoch": 515} {"train_loss": -19.32852554321289, "global_step": 42808, "epoch": 515} {"train_loss": -19.6781063079834, "global_step": 42809, "epoch": 515} {"train_loss": -19.417579650878906, "global_step": 42810, "epoch": 515} {"train_loss": -19.57881736755371, "global_step": 42811, "epoch": 515} {"train_loss": -20.068073272705078, "global_step": 42812, "epoch": 515} {"train_loss": -19.581159591674805, "global_step": 42813, "epoch": 515} {"train_loss": -19.025917053222656, "global_step": 42814, "epoch": 515} {"train_loss": -19.62771987915039, "global_step": 42815, "epoch": 515} {"train_loss": -19.776229858398438, "global_step": 42816, "epoch": 515} {"train_loss": -19.342933654785156, "global_step": 42817, "epoch": 515} {"train_loss": -19.606290817260742, "global_step": 42818, "epoch": 515} {"train_loss": -19.611486434936523, "global_step": 42819, "epoch": 515} {"train_loss": -19.415441513061523, "global_step": 42820, "epoch": 515} {"train_loss": -19.865478515625, "global_step": 42821, "epoch": 515} {"train_loss": -19.434581756591797, "global_step": 42822, "epoch": 515} {"train_loss": -19.88759422302246, "global_step": 42823, "epoch": 515} {"train_loss": -19.858427047729492, "global_step": 42824, "epoch": 515} {"train_loss": -19.660247802734375, "global_step": 42825, "epoch": 515} {"train_loss": -19.889997482299805, "global_step": 42826, "epoch": 515} {"train_loss": -19.566504834646203, "global_step": 42827, "epoch": 515, "val_loss": 5889099.0} {"train_loss": -19.423629760742188, "global_step": 42828, "epoch": 516} {"train_loss": -19.53427505493164, "global_step": 42829, "epoch": 516} {"train_loss": -19.45326042175293, "global_step": 42830, "epoch": 516} {"train_loss": -19.374052047729492, "global_step": 42831, "epoch": 516} {"train_loss": -19.326801300048828, "global_step": 42832, "epoch": 516} {"train_loss": -19.303207397460938, "global_step": 42833, "epoch": 516} {"train_loss": -19.532955169677734, "global_step": 42834, "epoch": 516} {"train_loss": -19.411836624145508, "global_step": 42835, "epoch": 516} {"train_loss": -19.43879508972168, "global_step": 42836, "epoch": 516} {"train_loss": -19.339218139648438, "global_step": 42837, "epoch": 516} {"train_loss": -19.464384078979492, "global_step": 42838, "epoch": 516} {"train_loss": -19.400949478149414, "global_step": 42839, "epoch": 516} {"train_loss": -19.286314010620117, "global_step": 42840, "epoch": 516} {"train_loss": -19.047225952148438, "global_step": 42841, "epoch": 516} {"train_loss": -19.405189514160156, "global_step": 42842, "epoch": 516} {"train_loss": -19.393613815307617, "global_step": 42843, "epoch": 516} {"train_loss": -19.278446197509766, "global_step": 42844, "epoch": 516} {"train_loss": -19.65350914001465, "global_step": 42845, "epoch": 516} {"train_loss": -19.525405883789062, "global_step": 42846, "epoch": 516} {"train_loss": -19.619190216064453, "global_step": 42847, "epoch": 516} {"train_loss": -19.656253814697266, "global_step": 42848, "epoch": 516} {"train_loss": -19.63336181640625, "global_step": 42849, "epoch": 516} {"train_loss": -19.391826629638672, "global_step": 42850, "epoch": 516} {"train_loss": -19.919469833374023, "global_step": 42851, "epoch": 516} {"train_loss": -19.74066162109375, "global_step": 42852, "epoch": 516} {"train_loss": -19.561100006103516, "global_step": 42853, "epoch": 516} {"train_loss": -19.564823150634766, "global_step": 42854, "epoch": 516} {"train_loss": -19.364439010620117, "global_step": 42855, "epoch": 516} {"train_loss": -19.950714111328125, "global_step": 42856, "epoch": 516} {"train_loss": -19.422922134399414, "global_step": 42857, "epoch": 516} {"train_loss": -19.701072692871094, "global_step": 42858, "epoch": 516} {"train_loss": -19.59549331665039, "global_step": 42859, "epoch": 516} {"train_loss": -19.5664119720459, "global_step": 42860, "epoch": 516} {"train_loss": -19.627981185913086, "global_step": 42861, "epoch": 516} {"train_loss": -19.858047485351562, "global_step": 42862, "epoch": 516} {"train_loss": -19.47344207763672, "global_step": 42863, "epoch": 516} {"train_loss": -19.298261642456055, "global_step": 42864, "epoch": 516} {"train_loss": -19.519041061401367, "global_step": 42865, "epoch": 516} {"train_loss": -19.38703727722168, "global_step": 42866, "epoch": 516} {"train_loss": -19.52094078063965, "global_step": 42867, "epoch": 516} {"train_loss": -19.868614196777344, "global_step": 42868, "epoch": 516} {"train_loss": -19.755247116088867, "global_step": 42869, "epoch": 516} {"train_loss": -19.34551239013672, "global_step": 42870, "epoch": 516} {"train_loss": -19.47823143005371, "global_step": 42871, "epoch": 516} {"train_loss": -19.65126609802246, "global_step": 42872, "epoch": 516} {"train_loss": -19.4554500579834, "global_step": 42873, "epoch": 516} {"train_loss": -19.245868682861328, "global_step": 42874, "epoch": 516} {"train_loss": -19.58870506286621, "global_step": 42875, "epoch": 516} {"train_loss": -19.411380767822266, "global_step": 42876, "epoch": 516} {"train_loss": -19.680103302001953, "global_step": 42877, "epoch": 516} {"train_loss": -19.72174644470215, "global_step": 42878, "epoch": 516} {"train_loss": -19.480485916137695, "global_step": 42879, "epoch": 516} {"train_loss": -19.840530395507812, "global_step": 42880, "epoch": 516} {"train_loss": -19.547889709472656, "global_step": 42881, "epoch": 516} {"train_loss": -19.532384872436523, "global_step": 42882, "epoch": 516} {"train_loss": -19.816930770874023, "global_step": 42883, "epoch": 516} {"train_loss": -19.37053871154785, "global_step": 42884, "epoch": 516} {"train_loss": -19.733020782470703, "global_step": 42885, "epoch": 516} {"train_loss": -19.11048698425293, "global_step": 42886, "epoch": 516} {"train_loss": -19.45307731628418, "global_step": 42887, "epoch": 516} {"train_loss": -19.563261032104492, "global_step": 42888, "epoch": 516} {"train_loss": -19.521085739135742, "global_step": 42889, "epoch": 516} {"train_loss": -19.513601303100586, "global_step": 42890, "epoch": 516} {"train_loss": -19.809423446655273, "global_step": 42891, "epoch": 516} {"train_loss": -19.913572311401367, "global_step": 42892, "epoch": 516} {"train_loss": -19.4176025390625, "global_step": 42893, "epoch": 516} {"train_loss": -19.891231536865234, "global_step": 42894, "epoch": 516} {"train_loss": -20.03697967529297, "global_step": 42895, "epoch": 516} {"train_loss": -19.453123092651367, "global_step": 42896, "epoch": 516} {"train_loss": -20.168500900268555, "global_step": 42897, "epoch": 516} {"train_loss": -19.713706970214844, "global_step": 42898, "epoch": 516} {"train_loss": -20.15970802307129, "global_step": 42899, "epoch": 516} {"train_loss": -19.310312271118164, "global_step": 42900, "epoch": 516} {"train_loss": -19.610492706298828, "global_step": 42901, "epoch": 516} {"train_loss": -19.545127868652344, "global_step": 42902, "epoch": 516} {"train_loss": -19.991331100463867, "global_step": 42903, "epoch": 516} {"train_loss": -19.56683349609375, "global_step": 42904, "epoch": 516} {"train_loss": -19.871347427368164, "global_step": 42905, "epoch": 516} {"train_loss": -19.486658096313477, "global_step": 42906, "epoch": 516} {"train_loss": -19.683700561523438, "global_step": 42907, "epoch": 516} {"train_loss": -19.49737548828125, "global_step": 42908, "epoch": 516} {"train_loss": -19.673139572143555, "global_step": 42909, "epoch": 516} {"train_loss": -19.57860234272049, "global_step": 42910, "epoch": 516, "val_loss": 6017328.0} {"train_loss": -19.30354881286621, "global_step": 42911, "epoch": 517} {"train_loss": -19.41115379333496, "global_step": 42912, "epoch": 517} {"train_loss": -19.230972290039062, "global_step": 42913, "epoch": 517} {"train_loss": -19.33820152282715, "global_step": 42914, "epoch": 517} {"train_loss": -19.526229858398438, "global_step": 42915, "epoch": 517} {"train_loss": -19.589284896850586, "global_step": 42916, "epoch": 517} {"train_loss": -19.53694725036621, "global_step": 42917, "epoch": 517} {"train_loss": -19.59189224243164, "global_step": 42918, "epoch": 517} {"train_loss": -19.806011199951172, "global_step": 42919, "epoch": 517} {"train_loss": -19.154916763305664, "global_step": 42920, "epoch": 517} {"train_loss": -19.45163917541504, "global_step": 42921, "epoch": 517} {"train_loss": -19.62535285949707, "global_step": 42922, "epoch": 517} {"train_loss": -19.57615089416504, "global_step": 42923, "epoch": 517} {"train_loss": -19.472183227539062, "global_step": 42924, "epoch": 517} {"train_loss": -19.50904655456543, "global_step": 42925, "epoch": 517} {"train_loss": -19.226154327392578, "global_step": 42926, "epoch": 517} {"train_loss": -19.371965408325195, "global_step": 42927, "epoch": 517} {"train_loss": -19.41364860534668, "global_step": 42928, "epoch": 517} {"train_loss": -19.405359268188477, "global_step": 42929, "epoch": 517} {"train_loss": -19.497026443481445, "global_step": 42930, "epoch": 517} {"train_loss": -19.66322135925293, "global_step": 42931, "epoch": 517} {"train_loss": -19.752416610717773, "global_step": 42932, "epoch": 517} {"train_loss": -19.61134910583496, "global_step": 42933, "epoch": 517} {"train_loss": -19.122821807861328, "global_step": 42934, "epoch": 517} {"train_loss": -19.85507583618164, "global_step": 42935, "epoch": 517} {"train_loss": -19.511337280273438, "global_step": 42936, "epoch": 517} {"train_loss": -19.55438232421875, "global_step": 42937, "epoch": 517} {"train_loss": -19.716629028320312, "global_step": 42938, "epoch": 517} {"train_loss": -19.715288162231445, "global_step": 42939, "epoch": 517} {"train_loss": -19.28107452392578, "global_step": 42940, "epoch": 517} {"train_loss": -19.66766929626465, "global_step": 42941, "epoch": 517} {"train_loss": -19.79732322692871, "global_step": 42942, "epoch": 517} {"train_loss": -19.941211700439453, "global_step": 42943, "epoch": 517} {"train_loss": -19.71932029724121, "global_step": 42944, "epoch": 517} {"train_loss": -19.251806259155273, "global_step": 42945, "epoch": 517} {"train_loss": -19.244211196899414, "global_step": 42946, "epoch": 517} {"train_loss": -19.745437622070312, "global_step": 42947, "epoch": 517} {"train_loss": -19.716217041015625, "global_step": 42948, "epoch": 517} {"train_loss": -19.350454330444336, "global_step": 42949, "epoch": 517} {"train_loss": -19.568891525268555, "global_step": 42950, "epoch": 517} {"train_loss": -19.90377426147461, "global_step": 42951, "epoch": 517} {"train_loss": -19.361066818237305, "global_step": 42952, "epoch": 517} {"train_loss": -19.46734046936035, "global_step": 42953, "epoch": 517} {"train_loss": -19.491418838500977, "global_step": 42954, "epoch": 517} {"train_loss": -19.91740608215332, "global_step": 42955, "epoch": 517} {"train_loss": -19.977415084838867, "global_step": 42956, "epoch": 517} {"train_loss": -19.608497619628906, "global_step": 42957, "epoch": 517} {"train_loss": -19.879499435424805, "global_step": 42958, "epoch": 517} {"train_loss": -19.535322189331055, "global_step": 42959, "epoch": 517} {"train_loss": -19.687986373901367, "global_step": 42960, "epoch": 517} {"train_loss": -19.743818283081055, "global_step": 42961, "epoch": 517} {"train_loss": -19.831298828125, "global_step": 42962, "epoch": 517} {"train_loss": -19.863147735595703, "global_step": 42963, "epoch": 517} {"train_loss": -20.248266220092773, "global_step": 42964, "epoch": 517} {"train_loss": -19.432737350463867, "global_step": 42965, "epoch": 517} {"train_loss": -19.589981079101562, "global_step": 42966, "epoch": 517} {"train_loss": -19.626096725463867, "global_step": 42967, "epoch": 517} {"train_loss": -19.4683895111084, "global_step": 42968, "epoch": 517} {"train_loss": -19.67262840270996, "global_step": 42969, "epoch": 517} {"train_loss": -19.269472122192383, "global_step": 42970, "epoch": 517} {"train_loss": -19.363386154174805, "global_step": 42971, "epoch": 517} {"train_loss": -19.535017013549805, "global_step": 42972, "epoch": 517} {"train_loss": -19.944660186767578, "global_step": 42973, "epoch": 517} {"train_loss": -19.86182975769043, "global_step": 42974, "epoch": 517} {"train_loss": -19.654409408569336, "global_step": 42975, "epoch": 517} {"train_loss": -19.53290367126465, "global_step": 42976, "epoch": 517} {"train_loss": -19.378799438476562, "global_step": 42977, "epoch": 517} {"train_loss": -19.606414794921875, "global_step": 42978, "epoch": 517} {"train_loss": -19.562484741210938, "global_step": 42979, "epoch": 517} {"train_loss": -19.794950485229492, "global_step": 42980, "epoch": 517} {"train_loss": -19.513578414916992, "global_step": 42981, "epoch": 517} {"train_loss": -19.602258682250977, "global_step": 42982, "epoch": 517} {"train_loss": -19.97495460510254, "global_step": 42983, "epoch": 517} {"train_loss": -19.51311683654785, "global_step": 42984, "epoch": 517} {"train_loss": -19.989755630493164, "global_step": 42985, "epoch": 517} {"train_loss": -19.24183464050293, "global_step": 42986, "epoch": 517} {"train_loss": -19.363937377929688, "global_step": 42987, "epoch": 517} {"train_loss": -19.367786407470703, "global_step": 42988, "epoch": 517} {"train_loss": -19.9555721282959, "global_step": 42989, "epoch": 517} {"train_loss": -19.510730743408203, "global_step": 42990, "epoch": 517} {"train_loss": -19.856348037719727, "global_step": 42991, "epoch": 517} {"train_loss": -19.693002700805664, "global_step": 42992, "epoch": 517} {"train_loss": -19.591863333460797, "global_step": 42993, "epoch": 517, "val_loss": 5894199.5} {"train_loss": -18.690052032470703, "global_step": 42994, "epoch": 518} {"train_loss": -19.13068962097168, "global_step": 42995, "epoch": 518} {"train_loss": -18.927656173706055, "global_step": 42996, "epoch": 518} {"train_loss": -19.2228946685791, "global_step": 42997, "epoch": 518} {"train_loss": -19.443998336791992, "global_step": 42998, "epoch": 518} {"train_loss": -19.402118682861328, "global_step": 42999, "epoch": 518} {"train_loss": -19.56550407409668, "global_step": 43000, "epoch": 518} {"train_loss": -18.790285110473633, "global_step": 43001, "epoch": 518} {"train_loss": -19.510845184326172, "global_step": 43002, "epoch": 518} {"train_loss": -19.453079223632812, "global_step": 43003, "epoch": 518} {"train_loss": -19.27011489868164, "global_step": 43004, "epoch": 518} {"train_loss": -19.307722091674805, "global_step": 43005, "epoch": 518} {"train_loss": -19.246950149536133, "global_step": 43006, "epoch": 518} {"train_loss": -19.4542236328125, "global_step": 43007, "epoch": 518} {"train_loss": -19.653329849243164, "global_step": 43008, "epoch": 518} {"train_loss": -19.312469482421875, "global_step": 43009, "epoch": 518} {"train_loss": -19.753955841064453, "global_step": 43010, "epoch": 518} {"train_loss": -20.104276657104492, "global_step": 43011, "epoch": 518} {"train_loss": -19.56037712097168, "global_step": 43012, "epoch": 518} {"train_loss": -19.34061622619629, "global_step": 43013, "epoch": 518} {"train_loss": -19.535932540893555, "global_step": 43014, "epoch": 518} {"train_loss": -19.377872467041016, "global_step": 43015, "epoch": 518} {"train_loss": -19.68446922302246, "global_step": 43016, "epoch": 518} {"train_loss": -19.51689338684082, "global_step": 43017, "epoch": 518} {"train_loss": -19.64129066467285, "global_step": 43018, "epoch": 518} {"train_loss": -19.955198287963867, "global_step": 43019, "epoch": 518} {"train_loss": -19.979232788085938, "global_step": 43020, "epoch": 518} {"train_loss": -19.337751388549805, "global_step": 43021, "epoch": 518} {"train_loss": -19.697952270507812, "global_step": 43022, "epoch": 518} {"train_loss": -19.329326629638672, "global_step": 43023, "epoch": 518} {"train_loss": -19.432218551635742, "global_step": 43024, "epoch": 518} {"train_loss": -19.52989959716797, "global_step": 43025, "epoch": 518} {"train_loss": -19.896333694458008, "global_step": 43026, "epoch": 518} {"train_loss": -19.876178741455078, "global_step": 43027, "epoch": 518} {"train_loss": -19.66360855102539, "global_step": 43028, "epoch": 518} {"train_loss": -19.63162612915039, "global_step": 43029, "epoch": 518} {"train_loss": -19.5865535736084, "global_step": 43030, "epoch": 518} {"train_loss": -19.40753746032715, "global_step": 43031, "epoch": 518} {"train_loss": -19.58380699157715, "global_step": 43032, "epoch": 518} {"train_loss": -19.585031509399414, "global_step": 43033, "epoch": 518} {"train_loss": -19.91645622253418, "global_step": 43034, "epoch": 518} {"train_loss": -19.713953018188477, "global_step": 43035, "epoch": 518} {"train_loss": -19.78272819519043, "global_step": 43036, "epoch": 518} {"train_loss": -19.726789474487305, "global_step": 43037, "epoch": 518} {"train_loss": -19.556318283081055, "global_step": 43038, "epoch": 518} {"train_loss": -19.50539207458496, "global_step": 43039, "epoch": 518} {"train_loss": -19.854948043823242, "global_step": 43040, "epoch": 518} {"train_loss": -19.43748664855957, "global_step": 43041, "epoch": 518} {"train_loss": -19.708608627319336, "global_step": 43042, "epoch": 518} {"train_loss": -19.529001235961914, "global_step": 43043, "epoch": 518} {"train_loss": -19.639371871948242, "global_step": 43044, "epoch": 518} {"train_loss": -19.835378646850586, "global_step": 43045, "epoch": 518} {"train_loss": -19.5131893157959, "global_step": 43046, "epoch": 518} {"train_loss": -19.749662399291992, "global_step": 43047, "epoch": 518} {"train_loss": -19.56520652770996, "global_step": 43048, "epoch": 518} {"train_loss": -19.962860107421875, "global_step": 43049, "epoch": 518} {"train_loss": -19.38849639892578, "global_step": 43050, "epoch": 518} {"train_loss": -19.73891830444336, "global_step": 43051, "epoch": 518} {"train_loss": -19.57801628112793, "global_step": 43052, "epoch": 518} {"train_loss": -19.468427658081055, "global_step": 43053, "epoch": 518} {"train_loss": -19.684371948242188, "global_step": 43054, "epoch": 518} {"train_loss": -19.862356185913086, "global_step": 43055, "epoch": 518} {"train_loss": -19.74439811706543, "global_step": 43056, "epoch": 518} {"train_loss": -19.529111862182617, "global_step": 43057, "epoch": 518} {"train_loss": -19.500473022460938, "global_step": 43058, "epoch": 518} {"train_loss": -19.68714714050293, "global_step": 43059, "epoch": 518} {"train_loss": -19.459524154663086, "global_step": 43060, "epoch": 518} {"train_loss": -19.71809959411621, "global_step": 43061, "epoch": 518} {"train_loss": -19.405563354492188, "global_step": 43062, "epoch": 518} {"train_loss": -19.451187133789062, "global_step": 43063, "epoch": 518} {"train_loss": -19.667423248291016, "global_step": 43064, "epoch": 518} {"train_loss": -19.770381927490234, "global_step": 43065, "epoch": 518} {"train_loss": -19.511003494262695, "global_step": 43066, "epoch": 518} {"train_loss": -19.800228118896484, "global_step": 43067, "epoch": 518} {"train_loss": -19.572357177734375, "global_step": 43068, "epoch": 518} {"train_loss": -19.6882381439209, "global_step": 43069, "epoch": 518} {"train_loss": -19.578968048095703, "global_step": 43070, "epoch": 518} {"train_loss": -19.72689437866211, "global_step": 43071, "epoch": 518} {"train_loss": -19.43507194519043, "global_step": 43072, "epoch": 518} {"train_loss": -19.46612548828125, "global_step": 43073, "epoch": 518} {"train_loss": -19.45785903930664, "global_step": 43074, "epoch": 518} {"train_loss": -19.444931030273438, "global_step": 43075, "epoch": 518} {"train_loss": -19.545797026301006, "global_step": 43076, "epoch": 518, "val_loss": 5929267.0} {"train_loss": -19.57284164428711, "global_step": 43077, "epoch": 519} {"train_loss": -19.329517364501953, "global_step": 43078, "epoch": 519} {"train_loss": -19.630186080932617, "global_step": 43079, "epoch": 519} {"train_loss": -19.40028190612793, "global_step": 43080, "epoch": 519} {"train_loss": -19.524658203125, "global_step": 43081, "epoch": 519} {"train_loss": -19.45216178894043, "global_step": 43082, "epoch": 519} {"train_loss": -19.612661361694336, "global_step": 43083, "epoch": 519} {"train_loss": -19.372032165527344, "global_step": 43084, "epoch": 519} {"train_loss": -20.03822135925293, "global_step": 43085, "epoch": 519} {"train_loss": -19.69819450378418, "global_step": 43086, "epoch": 519} {"train_loss": -19.528125762939453, "global_step": 43087, "epoch": 519} {"train_loss": -19.421194076538086, "global_step": 43088, "epoch": 519} {"train_loss": -19.53554344177246, "global_step": 43089, "epoch": 519} {"train_loss": -19.912954330444336, "global_step": 43090, "epoch": 519} {"train_loss": -19.805631637573242, "global_step": 43091, "epoch": 519} {"train_loss": -19.641910552978516, "global_step": 43092, "epoch": 519} {"train_loss": -19.28476333618164, "global_step": 43093, "epoch": 519} {"train_loss": -19.172611236572266, "global_step": 43094, "epoch": 519} {"train_loss": -19.649255752563477, "global_step": 43095, "epoch": 519} {"train_loss": -19.598264694213867, "global_step": 43096, "epoch": 519} {"train_loss": -19.74080467224121, "global_step": 43097, "epoch": 519} {"train_loss": -19.817520141601562, "global_step": 43098, "epoch": 519} {"train_loss": -19.61577796936035, "global_step": 43099, "epoch": 519} {"train_loss": -19.55971336364746, "global_step": 43100, "epoch": 519} {"train_loss": -19.370004653930664, "global_step": 43101, "epoch": 519} {"train_loss": -19.568689346313477, "global_step": 43102, "epoch": 519} {"train_loss": -19.328107833862305, "global_step": 43103, "epoch": 519} {"train_loss": -19.58417320251465, "global_step": 43104, "epoch": 519} {"train_loss": -19.606822967529297, "global_step": 43105, "epoch": 519} {"train_loss": -19.205280303955078, "global_step": 43106, "epoch": 519} {"train_loss": -19.38942527770996, "global_step": 43107, "epoch": 519} {"train_loss": -19.57697868347168, "global_step": 43108, "epoch": 519} {"train_loss": -19.291948318481445, "global_step": 43109, "epoch": 519} {"train_loss": -19.417922973632812, "global_step": 43110, "epoch": 519} {"train_loss": -19.441980361938477, "global_step": 43111, "epoch": 519} {"train_loss": -19.764509201049805, "global_step": 43112, "epoch": 519} {"train_loss": -19.622663497924805, "global_step": 43113, "epoch": 519} {"train_loss": -19.45900535583496, "global_step": 43114, "epoch": 519} {"train_loss": -19.04618263244629, "global_step": 43115, "epoch": 519} {"train_loss": -19.845447540283203, "global_step": 43116, "epoch": 519} {"train_loss": -19.762758255004883, "global_step": 43117, "epoch": 519} {"train_loss": -20.237009048461914, "global_step": 43118, "epoch": 519} {"train_loss": -20.067846298217773, "global_step": 43119, "epoch": 519} {"train_loss": -19.8359432220459, "global_step": 43120, "epoch": 519} {"train_loss": -19.37825584411621, "global_step": 43121, "epoch": 519} {"train_loss": -20.08307456970215, "global_step": 43122, "epoch": 519} {"train_loss": -19.576297760009766, "global_step": 43123, "epoch": 519} {"train_loss": -19.807064056396484, "global_step": 43124, "epoch": 519} {"train_loss": -19.819080352783203, "global_step": 43125, "epoch": 519} {"train_loss": -19.417882919311523, "global_step": 43126, "epoch": 519} {"train_loss": -19.63545799255371, "global_step": 43127, "epoch": 519} {"train_loss": -19.517202377319336, "global_step": 43128, "epoch": 519} {"train_loss": -19.6992130279541, "global_step": 43129, "epoch": 519} {"train_loss": -19.47582244873047, "global_step": 43130, "epoch": 519} {"train_loss": -19.419828414916992, "global_step": 43131, "epoch": 519} {"train_loss": -19.409379959106445, "global_step": 43132, "epoch": 519} {"train_loss": -20.224506378173828, "global_step": 43133, "epoch": 519} {"train_loss": -19.73406410217285, "global_step": 43134, "epoch": 519} {"train_loss": -19.37795066833496, "global_step": 43135, "epoch": 519} {"train_loss": -19.7792911529541, "global_step": 43136, "epoch": 519} {"train_loss": -19.66975212097168, "global_step": 43137, "epoch": 519} {"train_loss": -19.514179229736328, "global_step": 43138, "epoch": 519} {"train_loss": -19.7394962310791, "global_step": 43139, "epoch": 519} {"train_loss": -19.82948875427246, "global_step": 43140, "epoch": 519} {"train_loss": -19.227283477783203, "global_step": 43141, "epoch": 519} {"train_loss": -19.730823516845703, "global_step": 43142, "epoch": 519} {"train_loss": -19.659826278686523, "global_step": 43143, "epoch": 519} {"train_loss": -19.957866668701172, "global_step": 43144, "epoch": 519} {"train_loss": -19.586633682250977, "global_step": 43145, "epoch": 519} {"train_loss": -19.22735023498535, "global_step": 43146, "epoch": 519} {"train_loss": -19.692537307739258, "global_step": 43147, "epoch": 519} {"train_loss": -19.790491104125977, "global_step": 43148, "epoch": 519} {"train_loss": -19.780969619750977, "global_step": 43149, "epoch": 519} {"train_loss": -19.46651268005371, "global_step": 43150, "epoch": 519} {"train_loss": -19.908655166625977, "global_step": 43151, "epoch": 519} {"train_loss": -19.805524826049805, "global_step": 43152, "epoch": 519} {"train_loss": -19.464038848876953, "global_step": 43153, "epoch": 519} {"train_loss": -19.420339584350586, "global_step": 43154, "epoch": 519} {"train_loss": -19.755361557006836, "global_step": 43155, "epoch": 519} {"train_loss": -19.550981521606445, "global_step": 43156, "epoch": 519} {"train_loss": -19.771493911743164, "global_step": 43157, "epoch": 519} {"train_loss": -19.480026245117188, "global_step": 43158, "epoch": 519} {"train_loss": -19.59995083636548, "global_step": 43159, "epoch": 519, "val_loss": 6045019.5} {"train_loss": -19.651718139648438, "global_step": 43160, "epoch": 520} {"train_loss": -19.487897872924805, "global_step": 43161, "epoch": 520} {"train_loss": -19.18669891357422, "global_step": 43162, "epoch": 520} {"train_loss": -19.18971061706543, "global_step": 43163, "epoch": 520} {"train_loss": -19.369709014892578, "global_step": 43164, "epoch": 520} {"train_loss": -19.343990325927734, "global_step": 43165, "epoch": 520} {"train_loss": -19.11516571044922, "global_step": 43166, "epoch": 520} {"train_loss": -19.685644149780273, "global_step": 43167, "epoch": 520} {"train_loss": -19.696996688842773, "global_step": 43168, "epoch": 520} {"train_loss": -19.129362106323242, "global_step": 43169, "epoch": 520} {"train_loss": -19.49422264099121, "global_step": 43170, "epoch": 520} {"train_loss": -19.605783462524414, "global_step": 43171, "epoch": 520} {"train_loss": -19.292264938354492, "global_step": 43172, "epoch": 520} {"train_loss": -19.59305191040039, "global_step": 43173, "epoch": 520} {"train_loss": -19.537534713745117, "global_step": 43174, "epoch": 520} {"train_loss": -19.644058227539062, "global_step": 43175, "epoch": 520} {"train_loss": -19.735143661499023, "global_step": 43176, "epoch": 520} {"train_loss": -19.631391525268555, "global_step": 43177, "epoch": 520} {"train_loss": -19.337953567504883, "global_step": 43178, "epoch": 520} {"train_loss": -19.69391441345215, "global_step": 43179, "epoch": 520} {"train_loss": -19.499540328979492, "global_step": 43180, "epoch": 520} {"train_loss": -19.542470932006836, "global_step": 43181, "epoch": 520} {"train_loss": -19.64043617248535, "global_step": 43182, "epoch": 520} {"train_loss": -19.74567222595215, "global_step": 43183, "epoch": 520} {"train_loss": -19.604890823364258, "global_step": 43184, "epoch": 520} {"train_loss": -19.342453002929688, "global_step": 43185, "epoch": 520} {"train_loss": -19.85443115234375, "global_step": 43186, "epoch": 520} {"train_loss": -19.422592163085938, "global_step": 43187, "epoch": 520} {"train_loss": -19.571645736694336, "global_step": 43188, "epoch": 520} {"train_loss": -19.826276779174805, "global_step": 43189, "epoch": 520} {"train_loss": -19.400075912475586, "global_step": 43190, "epoch": 520} {"train_loss": -19.60007667541504, "global_step": 43191, "epoch": 520} {"train_loss": -19.375654220581055, "global_step": 43192, "epoch": 520} {"train_loss": -19.499286651611328, "global_step": 43193, "epoch": 520} {"train_loss": -19.726390838623047, "global_step": 43194, "epoch": 520} {"train_loss": -19.86865234375, "global_step": 43195, "epoch": 520} {"train_loss": -19.777145385742188, "global_step": 43196, "epoch": 520} {"train_loss": -19.7023868560791, "global_step": 43197, "epoch": 520} {"train_loss": -19.413896560668945, "global_step": 43198, "epoch": 520} {"train_loss": -19.405715942382812, "global_step": 43199, "epoch": 520} {"train_loss": -19.525009155273438, "global_step": 43200, "epoch": 520} {"train_loss": -19.63458824157715, "global_step": 43201, "epoch": 520} {"train_loss": -19.817617416381836, "global_step": 43202, "epoch": 520} {"train_loss": -19.49826431274414, "global_step": 43203, "epoch": 520} {"train_loss": -19.496234893798828, "global_step": 43204, "epoch": 520} {"train_loss": -19.574533462524414, "global_step": 43205, "epoch": 520} {"train_loss": -19.461400985717773, "global_step": 43206, "epoch": 520} {"train_loss": -19.59592056274414, "global_step": 43207, "epoch": 520} {"train_loss": -19.52718162536621, "global_step": 43208, "epoch": 520} {"train_loss": -19.50717544555664, "global_step": 43209, "epoch": 520} {"train_loss": -19.710163116455078, "global_step": 43210, "epoch": 520} {"train_loss": -19.80731201171875, "global_step": 43211, "epoch": 520} {"train_loss": -19.4581241607666, "global_step": 43212, "epoch": 520} {"train_loss": -19.6126651763916, "global_step": 43213, "epoch": 520} {"train_loss": -19.830049514770508, "global_step": 43214, "epoch": 520} {"train_loss": -19.574630737304688, "global_step": 43215, "epoch": 520} {"train_loss": -19.819561004638672, "global_step": 43216, "epoch": 520} {"train_loss": -19.177963256835938, "global_step": 43217, "epoch": 520} {"train_loss": -19.73632049560547, "global_step": 43218, "epoch": 520} {"train_loss": -19.585609436035156, "global_step": 43219, "epoch": 520} {"train_loss": -19.742429733276367, "global_step": 43220, "epoch": 520} {"train_loss": -19.65070915222168, "global_step": 43221, "epoch": 520} {"train_loss": -19.7758731842041, "global_step": 43222, "epoch": 520} {"train_loss": -19.69024085998535, "global_step": 43223, "epoch": 520} {"train_loss": -19.42535972595215, "global_step": 43224, "epoch": 520} {"train_loss": -19.44098472595215, "global_step": 43225, "epoch": 520} {"train_loss": -19.716476440429688, "global_step": 43226, "epoch": 520} {"train_loss": -20.033260345458984, "global_step": 43227, "epoch": 520} {"train_loss": -19.235822677612305, "global_step": 43228, "epoch": 520} {"train_loss": -19.802490234375, "global_step": 43229, "epoch": 520} {"train_loss": -19.815214157104492, "global_step": 43230, "epoch": 520} {"train_loss": -19.74989128112793, "global_step": 43231, "epoch": 520} {"train_loss": -19.45821189880371, "global_step": 43232, "epoch": 520} {"train_loss": -19.773801803588867, "global_step": 43233, "epoch": 520} {"train_loss": -19.503509521484375, "global_step": 43234, "epoch": 520} {"train_loss": -19.900409698486328, "global_step": 43235, "epoch": 520} {"train_loss": -19.707122802734375, "global_step": 43236, "epoch": 520} {"train_loss": -19.714401245117188, "global_step": 43237, "epoch": 520} {"train_loss": -19.8657283782959, "global_step": 43238, "epoch": 520} {"train_loss": -19.782583236694336, "global_step": 43239, "epoch": 520} {"train_loss": -19.083847045898438, "global_step": 43240, "epoch": 520} {"train_loss": -19.599782943725586, "global_step": 43241, "epoch": 520} {"train_loss": -19.602683147752142, "global_step": 43242, "epoch": 520, "val_loss": 6017877.0} {"train_loss": -18.982555389404297, "global_step": 43243, "epoch": 521} {"train_loss": -19.568456649780273, "global_step": 43244, "epoch": 521} {"train_loss": -19.68123435974121, "global_step": 43245, "epoch": 521} {"train_loss": -19.525619506835938, "global_step": 43246, "epoch": 521} {"train_loss": -19.31166648864746, "global_step": 43247, "epoch": 521} {"train_loss": -19.530872344970703, "global_step": 43248, "epoch": 521} {"train_loss": -19.554906845092773, "global_step": 43249, "epoch": 521} {"train_loss": -19.553701400756836, "global_step": 43250, "epoch": 521} {"train_loss": -19.377836227416992, "global_step": 43251, "epoch": 521} {"train_loss": -19.498825073242188, "global_step": 43252, "epoch": 521} {"train_loss": -19.355030059814453, "global_step": 43253, "epoch": 521} {"train_loss": -19.773147583007812, "global_step": 43254, "epoch": 521} {"train_loss": -19.465024948120117, "global_step": 43255, "epoch": 521} {"train_loss": -19.754098892211914, "global_step": 43256, "epoch": 521} {"train_loss": -19.585195541381836, "global_step": 43257, "epoch": 521} {"train_loss": -19.348913192749023, "global_step": 43258, "epoch": 521} {"train_loss": -19.6296329498291, "global_step": 43259, "epoch": 521} {"train_loss": -19.666427612304688, "global_step": 43260, "epoch": 521} {"train_loss": -19.723159790039062, "global_step": 43261, "epoch": 521} {"train_loss": -19.62226676940918, "global_step": 43262, "epoch": 521} {"train_loss": -19.80696678161621, "global_step": 43263, "epoch": 521} {"train_loss": -19.5755615234375, "global_step": 43264, "epoch": 521} {"train_loss": -19.790929794311523, "global_step": 43265, "epoch": 521} {"train_loss": -19.39399528503418, "global_step": 43266, "epoch": 521} {"train_loss": -19.476335525512695, "global_step": 43267, "epoch": 521} {"train_loss": -19.260419845581055, "global_step": 43268, "epoch": 521} {"train_loss": -19.608156204223633, "global_step": 43269, "epoch": 521} {"train_loss": -19.377439498901367, "global_step": 43270, "epoch": 521} {"train_loss": -19.12491798400879, "global_step": 43271, "epoch": 521} {"train_loss": -19.928543090820312, "global_step": 43272, "epoch": 521} {"train_loss": -19.71540641784668, "global_step": 43273, "epoch": 521} {"train_loss": -19.60228157043457, "global_step": 43274, "epoch": 521} {"train_loss": -19.551786422729492, "global_step": 43275, "epoch": 521} {"train_loss": -19.349699020385742, "global_step": 43276, "epoch": 521} {"train_loss": -19.67222023010254, "global_step": 43277, "epoch": 521} {"train_loss": -19.448646545410156, "global_step": 43278, "epoch": 521} {"train_loss": -19.254093170166016, "global_step": 43279, "epoch": 521} {"train_loss": -19.83698844909668, "global_step": 43280, "epoch": 521} {"train_loss": -19.224084854125977, "global_step": 43281, "epoch": 521} {"train_loss": -19.67574119567871, "global_step": 43282, "epoch": 521} {"train_loss": -19.181499481201172, "global_step": 43283, "epoch": 521} {"train_loss": -19.605819702148438, "global_step": 43284, "epoch": 521} {"train_loss": -19.521177291870117, "global_step": 43285, "epoch": 521} {"train_loss": -19.75318717956543, "global_step": 43286, "epoch": 521} {"train_loss": -19.208791732788086, "global_step": 43287, "epoch": 521} {"train_loss": -19.734865188598633, "global_step": 43288, "epoch": 521} {"train_loss": -19.627084732055664, "global_step": 43289, "epoch": 521} {"train_loss": -19.38149070739746, "global_step": 43290, "epoch": 521} {"train_loss": -19.829877853393555, "global_step": 43291, "epoch": 521} {"train_loss": -19.96770668029785, "global_step": 43292, "epoch": 521} {"train_loss": -19.80158042907715, "global_step": 43293, "epoch": 521} {"train_loss": -19.86248207092285, "global_step": 43294, "epoch": 521} {"train_loss": -19.63787841796875, "global_step": 43295, "epoch": 521} {"train_loss": -19.484655380249023, "global_step": 43296, "epoch": 521} {"train_loss": -19.811447143554688, "global_step": 43297, "epoch": 521} {"train_loss": -19.818586349487305, "global_step": 43298, "epoch": 521} {"train_loss": -19.56051254272461, "global_step": 43299, "epoch": 521} {"train_loss": -19.689777374267578, "global_step": 43300, "epoch": 521} {"train_loss": -19.482263565063477, "global_step": 43301, "epoch": 521} {"train_loss": -19.411794662475586, "global_step": 43302, "epoch": 521} {"train_loss": -19.474380493164062, "global_step": 43303, "epoch": 521} {"train_loss": -19.229963302612305, "global_step": 43304, "epoch": 521} {"train_loss": -19.359006881713867, "global_step": 43305, "epoch": 521} {"train_loss": -19.266372680664062, "global_step": 43306, "epoch": 521} {"train_loss": -19.592437744140625, "global_step": 43307, "epoch": 521} {"train_loss": -19.702909469604492, "global_step": 43308, "epoch": 521} {"train_loss": -19.479028701782227, "global_step": 43309, "epoch": 521} {"train_loss": -19.279478073120117, "global_step": 43310, "epoch": 521} {"train_loss": -19.60881233215332, "global_step": 43311, "epoch": 521} {"train_loss": -19.384695053100586, "global_step": 43312, "epoch": 521} {"train_loss": -19.771305084228516, "global_step": 43313, "epoch": 521} {"train_loss": -19.37436294555664, "global_step": 43314, "epoch": 521} {"train_loss": -19.59347915649414, "global_step": 43315, "epoch": 521} {"train_loss": -19.511198043823242, "global_step": 43316, "epoch": 521} {"train_loss": -19.981779098510742, "global_step": 43317, "epoch": 521} {"train_loss": -19.629146575927734, "global_step": 43318, "epoch": 521} {"train_loss": -19.47418212890625, "global_step": 43319, "epoch": 521} {"train_loss": -19.454153060913086, "global_step": 43320, "epoch": 521} {"train_loss": -19.800527572631836, "global_step": 43321, "epoch": 521} {"train_loss": -19.783761978149414, "global_step": 43322, "epoch": 521} {"train_loss": -19.558622360229492, "global_step": 43323, "epoch": 521} {"train_loss": -19.578746795654297, "global_step": 43324, "epoch": 521} {"train_loss": -19.525481741112397, "global_step": 43325, "epoch": 521, "val_loss": 6081037.0} {"train_loss": -19.08543586730957, "global_step": 43326, "epoch": 522} {"train_loss": -19.907424926757812, "global_step": 43327, "epoch": 522} {"train_loss": -19.199222564697266, "global_step": 43328, "epoch": 522} {"train_loss": -19.155969619750977, "global_step": 43329, "epoch": 522} {"train_loss": -19.42172622680664, "global_step": 43330, "epoch": 522} {"train_loss": -19.364389419555664, "global_step": 43331, "epoch": 522} {"train_loss": -19.204238891601562, "global_step": 43332, "epoch": 522} {"train_loss": -19.529434204101562, "global_step": 43333, "epoch": 522} {"train_loss": -19.54835319519043, "global_step": 43334, "epoch": 522} {"train_loss": -19.66307258605957, "global_step": 43335, "epoch": 522} {"train_loss": -19.883403778076172, "global_step": 43336, "epoch": 522} {"train_loss": -19.39967918395996, "global_step": 43337, "epoch": 522} {"train_loss": -19.462039947509766, "global_step": 43338, "epoch": 522} {"train_loss": -19.508939743041992, "global_step": 43339, "epoch": 522} {"train_loss": -19.58848762512207, "global_step": 43340, "epoch": 522} {"train_loss": -19.420795440673828, "global_step": 43341, "epoch": 522} {"train_loss": -20.03230094909668, "global_step": 43342, "epoch": 522} {"train_loss": -20.179466247558594, "global_step": 43343, "epoch": 522} {"train_loss": -19.8610897064209, "global_step": 43344, "epoch": 522} {"train_loss": -19.68173599243164, "global_step": 43345, "epoch": 522} {"train_loss": -19.283777236938477, "global_step": 43346, "epoch": 522} {"train_loss": -19.28798484802246, "global_step": 43347, "epoch": 522} {"train_loss": -19.45560646057129, "global_step": 43348, "epoch": 522} {"train_loss": -19.60072135925293, "global_step": 43349, "epoch": 522} {"train_loss": -19.894275665283203, "global_step": 43350, "epoch": 522} {"train_loss": -19.74112319946289, "global_step": 43351, "epoch": 522} {"train_loss": -19.564252853393555, "global_step": 43352, "epoch": 522} {"train_loss": -19.34657859802246, "global_step": 43353, "epoch": 522} {"train_loss": -19.65302848815918, "global_step": 43354, "epoch": 522} {"train_loss": -19.69257164001465, "global_step": 43355, "epoch": 522} {"train_loss": -19.780790328979492, "global_step": 43356, "epoch": 522} {"train_loss": -19.866674423217773, "global_step": 43357, "epoch": 522} {"train_loss": -19.682586669921875, "global_step": 43358, "epoch": 522} {"train_loss": -19.8391056060791, "global_step": 43359, "epoch": 522} {"train_loss": -19.460586547851562, "global_step": 43360, "epoch": 522} {"train_loss": -19.495710372924805, "global_step": 43361, "epoch": 522} {"train_loss": -19.926790237426758, "global_step": 43362, "epoch": 522} {"train_loss": -19.305084228515625, "global_step": 43363, "epoch": 522} {"train_loss": -19.399534225463867, "global_step": 43364, "epoch": 522} {"train_loss": -20.0037841796875, "global_step": 43365, "epoch": 522} {"train_loss": -19.651655197143555, "global_step": 43366, "epoch": 522} {"train_loss": -19.548377990722656, "global_step": 43367, "epoch": 522} {"train_loss": -19.209718704223633, "global_step": 43368, "epoch": 522} {"train_loss": -19.28873062133789, "global_step": 43369, "epoch": 522} {"train_loss": -19.78729248046875, "global_step": 43370, "epoch": 522} {"train_loss": -19.645099639892578, "global_step": 43371, "epoch": 522} {"train_loss": -19.532855987548828, "global_step": 43372, "epoch": 522} {"train_loss": -19.7354736328125, "global_step": 43373, "epoch": 522} {"train_loss": -19.59444236755371, "global_step": 43374, "epoch": 522} {"train_loss": -19.73893165588379, "global_step": 43375, "epoch": 522} {"train_loss": -19.921491622924805, "global_step": 43376, "epoch": 522} {"train_loss": -19.897306442260742, "global_step": 43377, "epoch": 522} {"train_loss": -19.77638816833496, "global_step": 43378, "epoch": 522} {"train_loss": -19.651447296142578, "global_step": 43379, "epoch": 522} {"train_loss": -19.4993953704834, "global_step": 43380, "epoch": 522} {"train_loss": -19.591123580932617, "global_step": 43381, "epoch": 522} {"train_loss": -19.614505767822266, "global_step": 43382, "epoch": 522} {"train_loss": -19.358963012695312, "global_step": 43383, "epoch": 522} {"train_loss": -19.25156593322754, "global_step": 43384, "epoch": 522} {"train_loss": -19.691455841064453, "global_step": 43385, "epoch": 522} {"train_loss": -19.752059936523438, "global_step": 43386, "epoch": 522} {"train_loss": -19.702966690063477, "global_step": 43387, "epoch": 522} {"train_loss": -19.782222747802734, "global_step": 43388, "epoch": 522} {"train_loss": -19.622562408447266, "global_step": 43389, "epoch": 522} {"train_loss": -19.462430953979492, "global_step": 43390, "epoch": 522} {"train_loss": -19.81104850769043, "global_step": 43391, "epoch": 522} {"train_loss": -19.60316276550293, "global_step": 43392, "epoch": 522} {"train_loss": -19.677474975585938, "global_step": 43393, "epoch": 522} {"train_loss": -19.606082916259766, "global_step": 43394, "epoch": 522} {"train_loss": -19.454980850219727, "global_step": 43395, "epoch": 522} {"train_loss": -19.27498435974121, "global_step": 43396, "epoch": 522} {"train_loss": -19.329801559448242, "global_step": 43397, "epoch": 522} {"train_loss": -19.46175193786621, "global_step": 43398, "epoch": 522} {"train_loss": -19.73017120361328, "global_step": 43399, "epoch": 522} {"train_loss": -19.954532623291016, "global_step": 43400, "epoch": 522} {"train_loss": -19.427988052368164, "global_step": 43401, "epoch": 522} {"train_loss": -19.608449935913086, "global_step": 43402, "epoch": 522} {"train_loss": -19.432477951049805, "global_step": 43403, "epoch": 522} {"train_loss": -19.61560821533203, "global_step": 43404, "epoch": 522} {"train_loss": -19.98050880432129, "global_step": 43405, "epoch": 522} {"train_loss": -19.584402084350586, "global_step": 43406, "epoch": 522} {"train_loss": -20.29191017150879, "global_step": 43407, "epoch": 522} {"train_loss": -19.61273009518543, "global_step": 43408, "epoch": 522, "val_loss": 6153573.5} {"train_loss": -19.1726131439209, "global_step": 43409, "epoch": 523} {"train_loss": -19.750293731689453, "global_step": 43410, "epoch": 523} {"train_loss": -19.276905059814453, "global_step": 43411, "epoch": 523} {"train_loss": -19.825056076049805, "global_step": 43412, "epoch": 523} {"train_loss": -19.65285301208496, "global_step": 43413, "epoch": 523} {"train_loss": -19.611684799194336, "global_step": 43414, "epoch": 523} {"train_loss": -19.30059242248535, "global_step": 43415, "epoch": 523} {"train_loss": -19.701139450073242, "global_step": 43416, "epoch": 523} {"train_loss": -19.38050079345703, "global_step": 43417, "epoch": 523} {"train_loss": -19.65926742553711, "global_step": 43418, "epoch": 523} {"train_loss": -19.45911979675293, "global_step": 43419, "epoch": 523} {"train_loss": -19.345739364624023, "global_step": 43420, "epoch": 523} {"train_loss": -19.564865112304688, "global_step": 43421, "epoch": 523} {"train_loss": -19.512529373168945, "global_step": 43422, "epoch": 523} {"train_loss": -19.878419876098633, "global_step": 43423, "epoch": 523} {"train_loss": -19.6726016998291, "global_step": 43424, "epoch": 523} {"train_loss": -19.49258804321289, "global_step": 43425, "epoch": 523} {"train_loss": -19.48200035095215, "global_step": 43426, "epoch": 523} {"train_loss": -19.432498931884766, "global_step": 43427, "epoch": 523} {"train_loss": -19.344999313354492, "global_step": 43428, "epoch": 523} {"train_loss": -19.90296745300293, "global_step": 43429, "epoch": 523} {"train_loss": -19.965688705444336, "global_step": 43430, "epoch": 523} {"train_loss": -19.479503631591797, "global_step": 43431, "epoch": 523} {"train_loss": -19.177087783813477, "global_step": 43432, "epoch": 523} {"train_loss": -19.466394424438477, "global_step": 43433, "epoch": 523} {"train_loss": -19.64387321472168, "global_step": 43434, "epoch": 523} {"train_loss": -19.49649429321289, "global_step": 43435, "epoch": 523} {"train_loss": -19.824172973632812, "global_step": 43436, "epoch": 523} {"train_loss": -19.378198623657227, "global_step": 43437, "epoch": 523} {"train_loss": -19.75363540649414, "global_step": 43438, "epoch": 523} {"train_loss": -19.68561363220215, "global_step": 43439, "epoch": 523} {"train_loss": -19.55756187438965, "global_step": 43440, "epoch": 523} {"train_loss": -19.48666000366211, "global_step": 43441, "epoch": 523} {"train_loss": -19.227731704711914, "global_step": 43442, "epoch": 523} {"train_loss": -19.178447723388672, "global_step": 43443, "epoch": 523} {"train_loss": -19.66657066345215, "global_step": 43444, "epoch": 523} {"train_loss": -19.84771156311035, "global_step": 43445, "epoch": 523} {"train_loss": -19.694236755371094, "global_step": 43446, "epoch": 523} {"train_loss": -19.727642059326172, "global_step": 43447, "epoch": 523} {"train_loss": -20.033084869384766, "global_step": 43448, "epoch": 523} {"train_loss": -19.831296920776367, "global_step": 43449, "epoch": 523} {"train_loss": -19.840662002563477, "global_step": 43450, "epoch": 523} {"train_loss": -19.516708374023438, "global_step": 43451, "epoch": 523} {"train_loss": -19.468191146850586, "global_step": 43452, "epoch": 523} {"train_loss": -19.35546875, "global_step": 43453, "epoch": 523} {"train_loss": -19.332937240600586, "global_step": 43454, "epoch": 523} {"train_loss": -19.27382469177246, "global_step": 43455, "epoch": 523} {"train_loss": -19.679054260253906, "global_step": 43456, "epoch": 523} {"train_loss": -19.525117874145508, "global_step": 43457, "epoch": 523} {"train_loss": -19.35357093811035, "global_step": 43458, "epoch": 523} {"train_loss": -19.789926528930664, "global_step": 43459, "epoch": 523} {"train_loss": -19.74298858642578, "global_step": 43460, "epoch": 523} {"train_loss": -19.814529418945312, "global_step": 43461, "epoch": 523} {"train_loss": -19.820837020874023, "global_step": 43462, "epoch": 523} {"train_loss": -19.698917388916016, "global_step": 43463, "epoch": 523} {"train_loss": -19.726049423217773, "global_step": 43464, "epoch": 523} {"train_loss": -19.90266990661621, "global_step": 43465, "epoch": 523} {"train_loss": -19.592212677001953, "global_step": 43466, "epoch": 523} {"train_loss": -19.64307975769043, "global_step": 43467, "epoch": 523} {"train_loss": -19.46337127685547, "global_step": 43468, "epoch": 523} {"train_loss": -19.953205108642578, "global_step": 43469, "epoch": 523} {"train_loss": -19.408418655395508, "global_step": 43470, "epoch": 523} {"train_loss": -19.755002975463867, "global_step": 43471, "epoch": 523} {"train_loss": -19.62287712097168, "global_step": 43472, "epoch": 523} {"train_loss": -19.541746139526367, "global_step": 43473, "epoch": 523} {"train_loss": -19.468244552612305, "global_step": 43474, "epoch": 523} {"train_loss": -19.701831817626953, "global_step": 43475, "epoch": 523} {"train_loss": -19.676801681518555, "global_step": 43476, "epoch": 523} {"train_loss": -19.79677391052246, "global_step": 43477, "epoch": 523} {"train_loss": -19.578229904174805, "global_step": 43478, "epoch": 523} {"train_loss": -19.488357543945312, "global_step": 43479, "epoch": 523} {"train_loss": -19.990020751953125, "global_step": 43480, "epoch": 523} {"train_loss": -19.29722023010254, "global_step": 43481, "epoch": 523} {"train_loss": -19.30816078186035, "global_step": 43482, "epoch": 523} {"train_loss": -19.073139190673828, "global_step": 43483, "epoch": 523} {"train_loss": -19.775548934936523, "global_step": 43484, "epoch": 523} {"train_loss": -19.6915340423584, "global_step": 43485, "epoch": 523} {"train_loss": -20.063722610473633, "global_step": 43486, "epoch": 523} {"train_loss": -19.47286605834961, "global_step": 43487, "epoch": 523} {"train_loss": -19.752567291259766, "global_step": 43488, "epoch": 523} {"train_loss": -19.473529815673828, "global_step": 43489, "epoch": 523} {"train_loss": -19.77241325378418, "global_step": 43490, "epoch": 523} {"train_loss": -19.594731227461114, "global_step": 43491, "epoch": 523, "val_loss": 6032571.5} {"train_loss": -19.2083683013916, "global_step": 43492, "epoch": 524} {"train_loss": -19.41022300720215, "global_step": 43493, "epoch": 524} {"train_loss": -19.702268600463867, "global_step": 43494, "epoch": 524} {"train_loss": -19.405750274658203, "global_step": 43495, "epoch": 524} {"train_loss": -19.433029174804688, "global_step": 43496, "epoch": 524} {"train_loss": -19.846817016601562, "global_step": 43497, "epoch": 524} {"train_loss": -19.47822380065918, "global_step": 43498, "epoch": 524} {"train_loss": -19.352134704589844, "global_step": 43499, "epoch": 524} {"train_loss": -19.53749656677246, "global_step": 43500, "epoch": 524} {"train_loss": -19.692129135131836, "global_step": 43501, "epoch": 524} {"train_loss": -19.578420639038086, "global_step": 43502, "epoch": 524} {"train_loss": -19.644210815429688, "global_step": 43503, "epoch": 524} {"train_loss": -19.74325180053711, "global_step": 43504, "epoch": 524} {"train_loss": -19.459686279296875, "global_step": 43505, "epoch": 524} {"train_loss": -19.749881744384766, "global_step": 43506, "epoch": 524} {"train_loss": -19.78169059753418, "global_step": 43507, "epoch": 524} {"train_loss": -19.654537200927734, "global_step": 43508, "epoch": 524} {"train_loss": -19.588552474975586, "global_step": 43509, "epoch": 524} {"train_loss": -19.411380767822266, "global_step": 43510, "epoch": 524} {"train_loss": -19.412063598632812, "global_step": 43511, "epoch": 524} {"train_loss": -19.86799430847168, "global_step": 43512, "epoch": 524} {"train_loss": -19.243284225463867, "global_step": 43513, "epoch": 524} {"train_loss": -19.51397132873535, "global_step": 43514, "epoch": 524} {"train_loss": -19.757566452026367, "global_step": 43515, "epoch": 524} {"train_loss": -19.75916862487793, "global_step": 43516, "epoch": 524} {"train_loss": -19.708642959594727, "global_step": 43517, "epoch": 524} {"train_loss": -19.42841148376465, "global_step": 43518, "epoch": 524} {"train_loss": -19.701034545898438, "global_step": 43519, "epoch": 524} {"train_loss": -19.56784439086914, "global_step": 43520, "epoch": 524} {"train_loss": -19.325719833374023, "global_step": 43521, "epoch": 524} {"train_loss": -19.439727783203125, "global_step": 43522, "epoch": 524} {"train_loss": -19.26424217224121, "global_step": 43523, "epoch": 524} {"train_loss": -19.846492767333984, "global_step": 43524, "epoch": 524} {"train_loss": -19.367956161499023, "global_step": 43525, "epoch": 524} {"train_loss": -19.51757049560547, "global_step": 43526, "epoch": 524} {"train_loss": -19.38858413696289, "global_step": 43527, "epoch": 524} {"train_loss": -19.724294662475586, "global_step": 43528, "epoch": 524} {"train_loss": -20.017038345336914, "global_step": 43529, "epoch": 524} {"train_loss": -19.349164962768555, "global_step": 43530, "epoch": 524} {"train_loss": -19.715848922729492, "global_step": 43531, "epoch": 524} {"train_loss": -19.510427474975586, "global_step": 43532, "epoch": 524} {"train_loss": -19.369400024414062, "global_step": 43533, "epoch": 524} {"train_loss": -19.596988677978516, "global_step": 43534, "epoch": 524} {"train_loss": -19.675228118896484, "global_step": 43535, "epoch": 524} {"train_loss": -19.647558212280273, "global_step": 43536, "epoch": 524} {"train_loss": -19.249704360961914, "global_step": 43537, "epoch": 524} {"train_loss": -19.632802963256836, "global_step": 43538, "epoch": 524} {"train_loss": -19.818140029907227, "global_step": 43539, "epoch": 524} {"train_loss": -19.51487159729004, "global_step": 43540, "epoch": 524} {"train_loss": -19.74835968017578, "global_step": 43541, "epoch": 524} {"train_loss": -19.7554874420166, "global_step": 43542, "epoch": 524} {"train_loss": -19.50641632080078, "global_step": 43543, "epoch": 524} {"train_loss": -19.64934730529785, "global_step": 43544, "epoch": 524} {"train_loss": -19.690237045288086, "global_step": 43545, "epoch": 524} {"train_loss": -19.838605880737305, "global_step": 43546, "epoch": 524} {"train_loss": -19.792558670043945, "global_step": 43547, "epoch": 524} {"train_loss": -19.51519775390625, "global_step": 43548, "epoch": 524} {"train_loss": -19.552419662475586, "global_step": 43549, "epoch": 524} {"train_loss": -19.629011154174805, "global_step": 43550, "epoch": 524} {"train_loss": -19.724435806274414, "global_step": 43551, "epoch": 524} {"train_loss": -19.844884872436523, "global_step": 43552, "epoch": 524} {"train_loss": -19.6395320892334, "global_step": 43553, "epoch": 524} {"train_loss": -19.733457565307617, "global_step": 43554, "epoch": 524} {"train_loss": -19.732318878173828, "global_step": 43555, "epoch": 524} {"train_loss": -19.81192398071289, "global_step": 43556, "epoch": 524} {"train_loss": -19.999982833862305, "global_step": 43557, "epoch": 524} {"train_loss": -19.74319839477539, "global_step": 43558, "epoch": 524} {"train_loss": -19.878437042236328, "global_step": 43559, "epoch": 524} {"train_loss": -19.519865036010742, "global_step": 43560, "epoch": 524} {"train_loss": -19.53989028930664, "global_step": 43561, "epoch": 524} {"train_loss": -19.6215877532959, "global_step": 43562, "epoch": 524} {"train_loss": -19.66612434387207, "global_step": 43563, "epoch": 524} {"train_loss": -19.641277313232422, "global_step": 43564, "epoch": 524} {"train_loss": -19.576160430908203, "global_step": 43565, "epoch": 524} {"train_loss": -19.982242584228516, "global_step": 43566, "epoch": 524} {"train_loss": -19.692047119140625, "global_step": 43567, "epoch": 524} {"train_loss": -19.900331497192383, "global_step": 43568, "epoch": 524} {"train_loss": -19.70331573486328, "global_step": 43569, "epoch": 524} {"train_loss": -19.67108154296875, "global_step": 43570, "epoch": 524} {"train_loss": -19.188230514526367, "global_step": 43571, "epoch": 524} {"train_loss": -19.356250762939453, "global_step": 43572, "epoch": 524} {"train_loss": -19.288881301879883, "global_step": 43573, "epoch": 524} {"train_loss": -19.609714462096434, "global_step": 43574, "epoch": 524, "val_loss": 6063960.0} {"train_loss": -19.21697998046875, "global_step": 43575, "epoch": 525} {"train_loss": -19.569629669189453, "global_step": 43576, "epoch": 525} {"train_loss": -19.25229835510254, "global_step": 43577, "epoch": 525} {"train_loss": -19.753400802612305, "global_step": 43578, "epoch": 525} {"train_loss": -19.770915985107422, "global_step": 43579, "epoch": 525} {"train_loss": -19.187271118164062, "global_step": 43580, "epoch": 525} {"train_loss": -19.805753707885742, "global_step": 43581, "epoch": 525} {"train_loss": -19.709375381469727, "global_step": 43582, "epoch": 525} {"train_loss": -19.7457275390625, "global_step": 43583, "epoch": 525} {"train_loss": -19.54368019104004, "global_step": 43584, "epoch": 525} {"train_loss": -19.396757125854492, "global_step": 43585, "epoch": 525} {"train_loss": -19.876567840576172, "global_step": 43586, "epoch": 525} {"train_loss": -19.898948669433594, "global_step": 43587, "epoch": 525} {"train_loss": -19.50848388671875, "global_step": 43588, "epoch": 525} {"train_loss": -19.535053253173828, "global_step": 43589, "epoch": 525} {"train_loss": -19.817319869995117, "global_step": 43590, "epoch": 525} {"train_loss": -19.647235870361328, "global_step": 43591, "epoch": 525} {"train_loss": -19.710193634033203, "global_step": 43592, "epoch": 525} {"train_loss": -19.364660263061523, "global_step": 43593, "epoch": 525} {"train_loss": -19.913738250732422, "global_step": 43594, "epoch": 525} {"train_loss": -19.519641876220703, "global_step": 43595, "epoch": 525} {"train_loss": -19.641942977905273, "global_step": 43596, "epoch": 525} {"train_loss": -19.95515251159668, "global_step": 43597, "epoch": 525} {"train_loss": -19.613534927368164, "global_step": 43598, "epoch": 525} {"train_loss": -20.052242279052734, "global_step": 43599, "epoch": 525} {"train_loss": -19.694366455078125, "global_step": 43600, "epoch": 525} {"train_loss": -19.59682273864746, "global_step": 43601, "epoch": 525} {"train_loss": -19.87579345703125, "global_step": 43602, "epoch": 525} {"train_loss": -19.640108108520508, "global_step": 43603, "epoch": 525} {"train_loss": -19.929767608642578, "global_step": 43604, "epoch": 525} {"train_loss": -19.48365592956543, "global_step": 43605, "epoch": 525} {"train_loss": -19.560850143432617, "global_step": 43606, "epoch": 525} {"train_loss": -19.533002853393555, "global_step": 43607, "epoch": 525} {"train_loss": -19.80661392211914, "global_step": 43608, "epoch": 525} {"train_loss": -19.960691452026367, "global_step": 43609, "epoch": 525} {"train_loss": -19.747648239135742, "global_step": 43610, "epoch": 525} {"train_loss": -19.80692481994629, "global_step": 43611, "epoch": 525} {"train_loss": -19.71868324279785, "global_step": 43612, "epoch": 525} {"train_loss": -19.708471298217773, "global_step": 43613, "epoch": 525} {"train_loss": -19.577484130859375, "global_step": 43614, "epoch": 525} {"train_loss": -19.629486083984375, "global_step": 43615, "epoch": 525} {"train_loss": -19.692480087280273, "global_step": 43616, "epoch": 525} {"train_loss": -19.79866600036621, "global_step": 43617, "epoch": 525} {"train_loss": -19.628772735595703, "global_step": 43618, "epoch": 525} {"train_loss": -19.68617057800293, "global_step": 43619, "epoch": 525} {"train_loss": -19.364789962768555, "global_step": 43620, "epoch": 525} {"train_loss": -19.386884689331055, "global_step": 43621, "epoch": 525} {"train_loss": -19.621849060058594, "global_step": 43622, "epoch": 525} {"train_loss": -19.244932174682617, "global_step": 43623, "epoch": 525} {"train_loss": -19.618743896484375, "global_step": 43624, "epoch": 525} {"train_loss": -19.782339096069336, "global_step": 43625, "epoch": 525} {"train_loss": -19.203702926635742, "global_step": 43626, "epoch": 525} {"train_loss": -19.834157943725586, "global_step": 43627, "epoch": 525} {"train_loss": -19.538612365722656, "global_step": 43628, "epoch": 525} {"train_loss": -19.656293869018555, "global_step": 43629, "epoch": 525} {"train_loss": -19.782711029052734, "global_step": 43630, "epoch": 525} {"train_loss": -19.53689956665039, "global_step": 43631, "epoch": 525} {"train_loss": -19.69319725036621, "global_step": 43632, "epoch": 525} {"train_loss": -19.591896057128906, "global_step": 43633, "epoch": 525} {"train_loss": -19.769344329833984, "global_step": 43634, "epoch": 525} {"train_loss": -19.698774337768555, "global_step": 43635, "epoch": 525} {"train_loss": -19.79161834716797, "global_step": 43636, "epoch": 525} {"train_loss": -19.715116500854492, "global_step": 43637, "epoch": 525} {"train_loss": -19.767297744750977, "global_step": 43638, "epoch": 525} {"train_loss": -19.580598831176758, "global_step": 43639, "epoch": 525} {"train_loss": -19.836566925048828, "global_step": 43640, "epoch": 525} {"train_loss": -19.315114974975586, "global_step": 43641, "epoch": 525} {"train_loss": -19.413333892822266, "global_step": 43642, "epoch": 525} {"train_loss": -19.842586517333984, "global_step": 43643, "epoch": 525} {"train_loss": -19.61150550842285, "global_step": 43644, "epoch": 525} {"train_loss": -19.623111724853516, "global_step": 43645, "epoch": 525} {"train_loss": -19.764801025390625, "global_step": 43646, "epoch": 525} {"train_loss": -19.33730125427246, "global_step": 43647, "epoch": 525} {"train_loss": -19.677352905273438, "global_step": 43648, "epoch": 525} {"train_loss": -19.308048248291016, "global_step": 43649, "epoch": 525} {"train_loss": -19.4919490814209, "global_step": 43650, "epoch": 525} {"train_loss": -19.326902389526367, "global_step": 43651, "epoch": 525} {"train_loss": -19.583288192749023, "global_step": 43652, "epoch": 525} {"train_loss": -19.385473251342773, "global_step": 43653, "epoch": 525} {"train_loss": -19.389057159423828, "global_step": 43654, "epoch": 525} {"train_loss": -19.6766300201416, "global_step": 43655, "epoch": 525} {"train_loss": -19.476472854614258, "global_step": 43656, "epoch": 525} {"train_loss": -19.638062189860516, "global_step": 43657, "epoch": 525, "val_loss": 6018900.0} {"train_loss": -19.40265464782715, "global_step": 43658, "epoch": 526} {"train_loss": -19.483060836791992, "global_step": 43659, "epoch": 526} {"train_loss": -19.844953536987305, "global_step": 43660, "epoch": 526} {"train_loss": -19.041868209838867, "global_step": 43661, "epoch": 526} {"train_loss": -19.525287628173828, "global_step": 43662, "epoch": 526} {"train_loss": -19.757383346557617, "global_step": 43663, "epoch": 526} {"train_loss": -19.758108139038086, "global_step": 43664, "epoch": 526} {"train_loss": -19.148426055908203, "global_step": 43665, "epoch": 526} {"train_loss": -19.622867584228516, "global_step": 43666, "epoch": 526} {"train_loss": -19.47434425354004, "global_step": 43667, "epoch": 526} {"train_loss": -19.21095085144043, "global_step": 43668, "epoch": 526} {"train_loss": -19.44309425354004, "global_step": 43669, "epoch": 526} {"train_loss": -19.71530532836914, "global_step": 43670, "epoch": 526} {"train_loss": -19.52947425842285, "global_step": 43671, "epoch": 526} {"train_loss": -19.54595184326172, "global_step": 43672, "epoch": 526} {"train_loss": -19.138206481933594, "global_step": 43673, "epoch": 526} {"train_loss": -19.467533111572266, "global_step": 43674, "epoch": 526} {"train_loss": -19.61136245727539, "global_step": 43675, "epoch": 526} {"train_loss": -20.005002975463867, "global_step": 43676, "epoch": 526} {"train_loss": -19.959753036499023, "global_step": 43677, "epoch": 526} {"train_loss": -19.72217559814453, "global_step": 43678, "epoch": 526} {"train_loss": -19.893102645874023, "global_step": 43679, "epoch": 526} {"train_loss": -19.81037712097168, "global_step": 43680, "epoch": 526} {"train_loss": -19.580322265625, "global_step": 43681, "epoch": 526} {"train_loss": -19.750919342041016, "global_step": 43682, "epoch": 526} {"train_loss": -19.532739639282227, "global_step": 43683, "epoch": 526} {"train_loss": -19.83038902282715, "global_step": 43684, "epoch": 526} {"train_loss": -19.744626998901367, "global_step": 43685, "epoch": 526} {"train_loss": -19.910276412963867, "global_step": 43686, "epoch": 526} {"train_loss": -19.95538330078125, "global_step": 43687, "epoch": 526} {"train_loss": -19.447786331176758, "global_step": 43688, "epoch": 526} {"train_loss": -19.465106964111328, "global_step": 43689, "epoch": 526} {"train_loss": -19.42093276977539, "global_step": 43690, "epoch": 526} {"train_loss": -19.347394943237305, "global_step": 43691, "epoch": 526} {"train_loss": -19.655317306518555, "global_step": 43692, "epoch": 526} {"train_loss": -19.577756881713867, "global_step": 43693, "epoch": 526} {"train_loss": -19.528249740600586, "global_step": 43694, "epoch": 526} {"train_loss": -19.978506088256836, "global_step": 43695, "epoch": 526} {"train_loss": -19.678808212280273, "global_step": 43696, "epoch": 526} {"train_loss": -19.245275497436523, "global_step": 43697, "epoch": 526} {"train_loss": -19.845932006835938, "global_step": 43698, "epoch": 526} {"train_loss": -19.637102127075195, "global_step": 43699, "epoch": 526} {"train_loss": -19.56904411315918, "global_step": 43700, "epoch": 526} {"train_loss": -19.418638229370117, "global_step": 43701, "epoch": 526} {"train_loss": -19.758071899414062, "global_step": 43702, "epoch": 526} {"train_loss": -19.492107391357422, "global_step": 43703, "epoch": 526} {"train_loss": -19.9803524017334, "global_step": 43704, "epoch": 526} {"train_loss": -20.003032684326172, "global_step": 43705, "epoch": 526} {"train_loss": -20.02080535888672, "global_step": 43706, "epoch": 526} {"train_loss": -19.42768669128418, "global_step": 43707, "epoch": 526} {"train_loss": -19.536319732666016, "global_step": 43708, "epoch": 526} {"train_loss": -19.654090881347656, "global_step": 43709, "epoch": 526} {"train_loss": -19.582260131835938, "global_step": 43710, "epoch": 526} {"train_loss": -19.760656356811523, "global_step": 43711, "epoch": 526} {"train_loss": -19.8546085357666, "global_step": 43712, "epoch": 526} {"train_loss": -19.584888458251953, "global_step": 43713, "epoch": 526} {"train_loss": -19.464340209960938, "global_step": 43714, "epoch": 526} {"train_loss": -19.682573318481445, "global_step": 43715, "epoch": 526} {"train_loss": -19.431127548217773, "global_step": 43716, "epoch": 526} {"train_loss": -19.527326583862305, "global_step": 43717, "epoch": 526} {"train_loss": -19.668760299682617, "global_step": 43718, "epoch": 526} {"train_loss": -19.09490394592285, "global_step": 43719, "epoch": 526} {"train_loss": -19.54347801208496, "global_step": 43720, "epoch": 526} {"train_loss": -19.265050888061523, "global_step": 43721, "epoch": 526} {"train_loss": -19.721633911132812, "global_step": 43722, "epoch": 526} {"train_loss": -19.54181480407715, "global_step": 43723, "epoch": 526} {"train_loss": -19.68002700805664, "global_step": 43724, "epoch": 526} {"train_loss": -19.851280212402344, "global_step": 43725, "epoch": 526} {"train_loss": -19.62845230102539, "global_step": 43726, "epoch": 526} {"train_loss": -19.505966186523438, "global_step": 43727, "epoch": 526} {"train_loss": -19.51557731628418, "global_step": 43728, "epoch": 526} {"train_loss": -19.32239532470703, "global_step": 43729, "epoch": 526} {"train_loss": -19.595069885253906, "global_step": 43730, "epoch": 526} {"train_loss": -19.523120880126953, "global_step": 43731, "epoch": 526} {"train_loss": -19.376081466674805, "global_step": 43732, "epoch": 526} {"train_loss": -19.676145553588867, "global_step": 43733, "epoch": 526} {"train_loss": -19.60664939880371, "global_step": 43734, "epoch": 526} {"train_loss": -19.682785034179688, "global_step": 43735, "epoch": 526} {"train_loss": -19.49102783203125, "global_step": 43736, "epoch": 526} {"train_loss": -19.337167739868164, "global_step": 43737, "epoch": 526} {"train_loss": -19.691455841064453, "global_step": 43738, "epoch": 526} {"train_loss": -19.675729751586914, "global_step": 43739, "epoch": 526} {"train_loss": -19.618040820202197, "global_step": 43740, "epoch": 526, "val_loss": 6069582.5} {"train_loss": -18.93165397644043, "global_step": 43741, "epoch": 527} {"train_loss": -19.64898109436035, "global_step": 43742, "epoch": 527} {"train_loss": -19.331567764282227, "global_step": 43743, "epoch": 527} {"train_loss": -19.437955856323242, "global_step": 43744, "epoch": 527} {"train_loss": -19.464574813842773, "global_step": 43745, "epoch": 527} {"train_loss": -19.153432846069336, "global_step": 43746, "epoch": 527} {"train_loss": -19.51665496826172, "global_step": 43747, "epoch": 527} {"train_loss": -19.4263973236084, "global_step": 43748, "epoch": 527} {"train_loss": -19.597789764404297, "global_step": 43749, "epoch": 527} {"train_loss": -19.747114181518555, "global_step": 43750, "epoch": 527} {"train_loss": -19.661518096923828, "global_step": 43751, "epoch": 527} {"train_loss": -19.40810203552246, "global_step": 43752, "epoch": 527} {"train_loss": -19.553577423095703, "global_step": 43753, "epoch": 527} {"train_loss": -19.55988883972168, "global_step": 43754, "epoch": 527} {"train_loss": -19.475683212280273, "global_step": 43755, "epoch": 527} {"train_loss": -19.684276580810547, "global_step": 43756, "epoch": 527} {"train_loss": -19.542118072509766, "global_step": 43757, "epoch": 527} {"train_loss": -19.31698989868164, "global_step": 43758, "epoch": 527} {"train_loss": -19.748367309570312, "global_step": 43759, "epoch": 527} {"train_loss": -19.3693790435791, "global_step": 43760, "epoch": 527} {"train_loss": -19.823095321655273, "global_step": 43761, "epoch": 527} {"train_loss": -19.49374771118164, "global_step": 43762, "epoch": 527} {"train_loss": -19.5975284576416, "global_step": 43763, "epoch": 527} {"train_loss": -19.585739135742188, "global_step": 43764, "epoch": 527} {"train_loss": -19.506956100463867, "global_step": 43765, "epoch": 527} {"train_loss": -19.654829025268555, "global_step": 43766, "epoch": 527} {"train_loss": -19.548933029174805, "global_step": 43767, "epoch": 527} {"train_loss": -19.40180778503418, "global_step": 43768, "epoch": 527} {"train_loss": -19.659616470336914, "global_step": 43769, "epoch": 527} {"train_loss": -19.516738891601562, "global_step": 43770, "epoch": 527} {"train_loss": -19.715993881225586, "global_step": 43771, "epoch": 527} {"train_loss": -19.97479820251465, "global_step": 43772, "epoch": 527} {"train_loss": -19.595426559448242, "global_step": 43773, "epoch": 527} {"train_loss": -19.562650680541992, "global_step": 43774, "epoch": 527} {"train_loss": -19.687314987182617, "global_step": 43775, "epoch": 527} {"train_loss": -19.532886505126953, "global_step": 43776, "epoch": 527} {"train_loss": -19.479280471801758, "global_step": 43777, "epoch": 527} {"train_loss": -19.42557716369629, "global_step": 43778, "epoch": 527} {"train_loss": -19.56931495666504, "global_step": 43779, "epoch": 527} {"train_loss": -19.994421005249023, "global_step": 43780, "epoch": 527} {"train_loss": -19.77937126159668, "global_step": 43781, "epoch": 527} {"train_loss": -20.00023651123047, "global_step": 43782, "epoch": 527} {"train_loss": -19.683137893676758, "global_step": 43783, "epoch": 527} {"train_loss": -19.538122177124023, "global_step": 43784, "epoch": 527} {"train_loss": -19.314682006835938, "global_step": 43785, "epoch": 527} {"train_loss": -19.94964027404785, "global_step": 43786, "epoch": 527} {"train_loss": -19.6646785736084, "global_step": 43787, "epoch": 527} {"train_loss": -19.69404411315918, "global_step": 43788, "epoch": 527} {"train_loss": -19.509042739868164, "global_step": 43789, "epoch": 527} {"train_loss": -19.866836547851562, "global_step": 43790, "epoch": 527} {"train_loss": -19.855100631713867, "global_step": 43791, "epoch": 527} {"train_loss": -19.727069854736328, "global_step": 43792, "epoch": 527} {"train_loss": -19.752212524414062, "global_step": 43793, "epoch": 527} {"train_loss": -19.615081787109375, "global_step": 43794, "epoch": 527} {"train_loss": -19.521955490112305, "global_step": 43795, "epoch": 527} {"train_loss": -20.189546585083008, "global_step": 43796, "epoch": 527} {"train_loss": -19.583436965942383, "global_step": 43797, "epoch": 527} {"train_loss": -19.602794647216797, "global_step": 43798, "epoch": 527} {"train_loss": -19.649921417236328, "global_step": 43799, "epoch": 527} {"train_loss": -19.356672286987305, "global_step": 43800, "epoch": 527} {"train_loss": -19.760465621948242, "global_step": 43801, "epoch": 527} {"train_loss": -19.372583389282227, "global_step": 43802, "epoch": 527} {"train_loss": -19.58664321899414, "global_step": 43803, "epoch": 527} {"train_loss": -19.671714782714844, "global_step": 43804, "epoch": 527} {"train_loss": -19.514984130859375, "global_step": 43805, "epoch": 527} {"train_loss": -19.62672233581543, "global_step": 43806, "epoch": 527} {"train_loss": -19.387723922729492, "global_step": 43807, "epoch": 527} {"train_loss": -19.698575973510742, "global_step": 43808, "epoch": 527} {"train_loss": -19.28626251220703, "global_step": 43809, "epoch": 527} {"train_loss": -19.72269630432129, "global_step": 43810, "epoch": 527} {"train_loss": -19.75209617614746, "global_step": 43811, "epoch": 527} {"train_loss": -19.777870178222656, "global_step": 43812, "epoch": 527} {"train_loss": -19.634401321411133, "global_step": 43813, "epoch": 527} {"train_loss": -19.70882797241211, "global_step": 43814, "epoch": 527} {"train_loss": -19.81647300720215, "global_step": 43815, "epoch": 527} {"train_loss": -19.566028594970703, "global_step": 43816, "epoch": 527} {"train_loss": -19.884305953979492, "global_step": 43817, "epoch": 527} {"train_loss": -20.032123565673828, "global_step": 43818, "epoch": 527} {"train_loss": -19.347288131713867, "global_step": 43819, "epoch": 527} {"train_loss": -20.09895896911621, "global_step": 43820, "epoch": 527} {"train_loss": -19.61857032775879, "global_step": 43821, "epoch": 527} {"train_loss": -19.113492965698242, "global_step": 43822, "epoch": 527} {"train_loss": -19.592611634587666, "global_step": 43823, "epoch": 527, "val_loss": 6037414.0} {"train_loss": -18.757123947143555, "global_step": 43824, "epoch": 528} {"train_loss": -19.675800323486328, "global_step": 43825, "epoch": 528} {"train_loss": -19.36271858215332, "global_step": 43826, "epoch": 528} {"train_loss": -19.299137115478516, "global_step": 43827, "epoch": 528} {"train_loss": -19.348981857299805, "global_step": 43828, "epoch": 528} {"train_loss": -19.274017333984375, "global_step": 43829, "epoch": 528} {"train_loss": -19.4681339263916, "global_step": 43830, "epoch": 528} {"train_loss": -19.541278839111328, "global_step": 43831, "epoch": 528} {"train_loss": -19.684112548828125, "global_step": 43832, "epoch": 528} {"train_loss": -19.11968421936035, "global_step": 43833, "epoch": 528} {"train_loss": -19.012435913085938, "global_step": 43834, "epoch": 528} {"train_loss": -19.157812118530273, "global_step": 43835, "epoch": 528} {"train_loss": -19.749784469604492, "global_step": 43836, "epoch": 528} {"train_loss": -19.34821891784668, "global_step": 43837, "epoch": 528} {"train_loss": -19.110807418823242, "global_step": 43838, "epoch": 528} {"train_loss": -19.420495986938477, "global_step": 43839, "epoch": 528} {"train_loss": -19.58521270751953, "global_step": 43840, "epoch": 528} {"train_loss": -19.616668701171875, "global_step": 43841, "epoch": 528} {"train_loss": -19.504505157470703, "global_step": 43842, "epoch": 528} {"train_loss": -19.580801010131836, "global_step": 43843, "epoch": 528} {"train_loss": -19.885663986206055, "global_step": 43844, "epoch": 528} {"train_loss": -19.987186431884766, "global_step": 43845, "epoch": 528} {"train_loss": -19.462793350219727, "global_step": 43846, "epoch": 528} {"train_loss": -19.70624351501465, "global_step": 43847, "epoch": 528} {"train_loss": -19.71445655822754, "global_step": 43848, "epoch": 528} {"train_loss": -19.630691528320312, "global_step": 43849, "epoch": 528} {"train_loss": -19.740192413330078, "global_step": 43850, "epoch": 528} {"train_loss": -19.563749313354492, "global_step": 43851, "epoch": 528} {"train_loss": -19.283767700195312, "global_step": 43852, "epoch": 528} {"train_loss": -19.93638038635254, "global_step": 43853, "epoch": 528} {"train_loss": -19.64008140563965, "global_step": 43854, "epoch": 528} {"train_loss": -19.68651008605957, "global_step": 43855, "epoch": 528} {"train_loss": -20.045562744140625, "global_step": 43856, "epoch": 528} {"train_loss": -19.7630672454834, "global_step": 43857, "epoch": 528} {"train_loss": -19.466779708862305, "global_step": 43858, "epoch": 528} {"train_loss": -19.662281036376953, "global_step": 43859, "epoch": 528} {"train_loss": -19.673500061035156, "global_step": 43860, "epoch": 528} {"train_loss": -19.910512924194336, "global_step": 43861, "epoch": 528} {"train_loss": -19.700910568237305, "global_step": 43862, "epoch": 528} {"train_loss": -19.84296989440918, "global_step": 43863, "epoch": 528} {"train_loss": -19.6109676361084, "global_step": 43864, "epoch": 528} {"train_loss": -19.83084487915039, "global_step": 43865, "epoch": 528} {"train_loss": -19.620948791503906, "global_step": 43866, "epoch": 528} {"train_loss": -19.666339874267578, "global_step": 43867, "epoch": 528} {"train_loss": -19.41226577758789, "global_step": 43868, "epoch": 528} {"train_loss": -19.539474487304688, "global_step": 43869, "epoch": 528} {"train_loss": -19.75922393798828, "global_step": 43870, "epoch": 528} {"train_loss": -19.598691940307617, "global_step": 43871, "epoch": 528} {"train_loss": -19.5811767578125, "global_step": 43872, "epoch": 528} {"train_loss": -19.639240264892578, "global_step": 43873, "epoch": 528} {"train_loss": -20.008384704589844, "global_step": 43874, "epoch": 528} {"train_loss": -19.747591018676758, "global_step": 43875, "epoch": 528} {"train_loss": -19.24698257446289, "global_step": 43876, "epoch": 528} {"train_loss": -19.779102325439453, "global_step": 43877, "epoch": 528} {"train_loss": -19.65688133239746, "global_step": 43878, "epoch": 528} {"train_loss": -19.50956153869629, "global_step": 43879, "epoch": 528} {"train_loss": -19.702106475830078, "global_step": 43880, "epoch": 528} {"train_loss": -19.749340057373047, "global_step": 43881, "epoch": 528} {"train_loss": -19.695837020874023, "global_step": 43882, "epoch": 528} {"train_loss": -19.36204719543457, "global_step": 43883, "epoch": 528} {"train_loss": -19.664987564086914, "global_step": 43884, "epoch": 528} {"train_loss": -19.83591651916504, "global_step": 43885, "epoch": 528} {"train_loss": -19.42902183532715, "global_step": 43886, "epoch": 528} {"train_loss": -19.557037353515625, "global_step": 43887, "epoch": 528} {"train_loss": -19.641454696655273, "global_step": 43888, "epoch": 528} {"train_loss": -19.50709342956543, "global_step": 43889, "epoch": 528} {"train_loss": -19.795475006103516, "global_step": 43890, "epoch": 528} {"train_loss": -19.74087142944336, "global_step": 43891, "epoch": 528} {"train_loss": -19.61927604675293, "global_step": 43892, "epoch": 528} {"train_loss": -19.61773109436035, "global_step": 43893, "epoch": 528} {"train_loss": -19.976083755493164, "global_step": 43894, "epoch": 528} {"train_loss": -19.450626373291016, "global_step": 43895, "epoch": 528} {"train_loss": -19.701904296875, "global_step": 43896, "epoch": 528} {"train_loss": -19.64512062072754, "global_step": 43897, "epoch": 528} {"train_loss": -19.807600021362305, "global_step": 43898, "epoch": 528} {"train_loss": -19.77356719970703, "global_step": 43899, "epoch": 528} {"train_loss": -19.412466049194336, "global_step": 43900, "epoch": 528} {"train_loss": -19.874113082885742, "global_step": 43901, "epoch": 528} {"train_loss": -19.51057243347168, "global_step": 43902, "epoch": 528} {"train_loss": -19.534658432006836, "global_step": 43903, "epoch": 528} {"train_loss": -19.499601364135742, "global_step": 43904, "epoch": 528} {"train_loss": -19.802297592163086, "global_step": 43905, "epoch": 528} {"train_loss": -19.5939763770046, "global_step": 43906, "epoch": 528, "val_loss": 5957712.0} {"train_loss": -19.528364181518555, "global_step": 43907, "epoch": 529} {"train_loss": -18.971393585205078, "global_step": 43908, "epoch": 529} {"train_loss": -19.347660064697266, "global_step": 43909, "epoch": 529} {"train_loss": -19.21146011352539, "global_step": 43910, "epoch": 529} {"train_loss": -19.297138214111328, "global_step": 43911, "epoch": 529} {"train_loss": -18.95001220703125, "global_step": 43912, "epoch": 529} {"train_loss": -19.334531784057617, "global_step": 43913, "epoch": 529} {"train_loss": -19.580432891845703, "global_step": 43914, "epoch": 529} {"train_loss": -19.085554122924805, "global_step": 43915, "epoch": 529} {"train_loss": -19.473308563232422, "global_step": 43916, "epoch": 529} {"train_loss": -19.637401580810547, "global_step": 43917, "epoch": 529} {"train_loss": -19.628124237060547, "global_step": 43918, "epoch": 529} {"train_loss": -19.686798095703125, "global_step": 43919, "epoch": 529} {"train_loss": -19.572546005249023, "global_step": 43920, "epoch": 529} {"train_loss": -19.773860931396484, "global_step": 43921, "epoch": 529} {"train_loss": -19.580141067504883, "global_step": 43922, "epoch": 529} {"train_loss": -19.6563777923584, "global_step": 43923, "epoch": 529} {"train_loss": -19.544076919555664, "global_step": 43924, "epoch": 529} {"train_loss": -19.892471313476562, "global_step": 43925, "epoch": 529} {"train_loss": -19.611000061035156, "global_step": 43926, "epoch": 529} {"train_loss": -19.44498634338379, "global_step": 43927, "epoch": 529} {"train_loss": -19.842348098754883, "global_step": 43928, "epoch": 529} {"train_loss": -19.564584732055664, "global_step": 43929, "epoch": 529} {"train_loss": -19.822742462158203, "global_step": 43930, "epoch": 529} {"train_loss": -19.58384132385254, "global_step": 43931, "epoch": 529} {"train_loss": -19.905536651611328, "global_step": 43932, "epoch": 529} {"train_loss": -19.8547420501709, "global_step": 43933, "epoch": 529} {"train_loss": -19.81111717224121, "global_step": 43934, "epoch": 529} {"train_loss": -19.339345932006836, "global_step": 43935, "epoch": 529} {"train_loss": -19.30018424987793, "global_step": 43936, "epoch": 529} {"train_loss": -19.52556037902832, "global_step": 43937, "epoch": 529} {"train_loss": -19.91468620300293, "global_step": 43938, "epoch": 529} {"train_loss": -19.958524703979492, "global_step": 43939, "epoch": 529} {"train_loss": -19.68244743347168, "global_step": 43940, "epoch": 529} {"train_loss": -19.633474349975586, "global_step": 43941, "epoch": 529} {"train_loss": -19.744565963745117, "global_step": 43942, "epoch": 529} {"train_loss": -19.663715362548828, "global_step": 43943, "epoch": 529} {"train_loss": -19.608882904052734, "global_step": 43944, "epoch": 529} {"train_loss": -19.608530044555664, "global_step": 43945, "epoch": 529} {"train_loss": -20.002716064453125, "global_step": 43946, "epoch": 529} {"train_loss": -19.26807975769043, "global_step": 43947, "epoch": 529} {"train_loss": -19.313413619995117, "global_step": 43948, "epoch": 529} {"train_loss": -20.07012176513672, "global_step": 43949, "epoch": 529} {"train_loss": -19.637266159057617, "global_step": 43950, "epoch": 529} {"train_loss": -19.782026290893555, "global_step": 43951, "epoch": 529} {"train_loss": -19.950164794921875, "global_step": 43952, "epoch": 529} {"train_loss": -19.484638214111328, "global_step": 43953, "epoch": 529} {"train_loss": -19.68400001525879, "global_step": 43954, "epoch": 529} {"train_loss": -19.461999893188477, "global_step": 43955, "epoch": 529} {"train_loss": -19.76410484313965, "global_step": 43956, "epoch": 529} {"train_loss": -20.089595794677734, "global_step": 43957, "epoch": 529} {"train_loss": -19.403289794921875, "global_step": 43958, "epoch": 529} {"train_loss": -19.880836486816406, "global_step": 43959, "epoch": 529} {"train_loss": -19.626310348510742, "global_step": 43960, "epoch": 529} {"train_loss": -19.45132064819336, "global_step": 43961, "epoch": 529} {"train_loss": -19.968765258789062, "global_step": 43962, "epoch": 529} {"train_loss": -19.639801025390625, "global_step": 43963, "epoch": 529} {"train_loss": -19.411991119384766, "global_step": 43964, "epoch": 529} {"train_loss": -19.48343276977539, "global_step": 43965, "epoch": 529} {"train_loss": -19.55182647705078, "global_step": 43966, "epoch": 529} {"train_loss": -19.480697631835938, "global_step": 43967, "epoch": 529} {"train_loss": -19.684539794921875, "global_step": 43968, "epoch": 529} {"train_loss": -19.78351402282715, "global_step": 43969, "epoch": 529} {"train_loss": -19.723129272460938, "global_step": 43970, "epoch": 529} {"train_loss": -19.52516746520996, "global_step": 43971, "epoch": 529} {"train_loss": -19.746971130371094, "global_step": 43972, "epoch": 529} {"train_loss": -19.179533004760742, "global_step": 43973, "epoch": 529} {"train_loss": -19.28723907470703, "global_step": 43974, "epoch": 529} {"train_loss": -19.5874080657959, "global_step": 43975, "epoch": 529} {"train_loss": -19.618467330932617, "global_step": 43976, "epoch": 529} {"train_loss": -19.748350143432617, "global_step": 43977, "epoch": 529} {"train_loss": -19.310781478881836, "global_step": 43978, "epoch": 529} {"train_loss": -19.354106903076172, "global_step": 43979, "epoch": 529} {"train_loss": -19.913869857788086, "global_step": 43980, "epoch": 529} {"train_loss": -19.820865631103516, "global_step": 43981, "epoch": 529} {"train_loss": -19.296627044677734, "global_step": 43982, "epoch": 529} {"train_loss": -19.41407585144043, "global_step": 43983, "epoch": 529} {"train_loss": -19.468860626220703, "global_step": 43984, "epoch": 529} {"train_loss": -19.54788589477539, "global_step": 43985, "epoch": 529} {"train_loss": -19.708724975585938, "global_step": 43986, "epoch": 529} {"train_loss": -19.596128463745117, "global_step": 43987, "epoch": 529} {"train_loss": -19.353559494018555, "global_step": 43988, "epoch": 529} {"train_loss": -19.585567244564196, "global_step": 43989, "epoch": 529, "val_loss": 6027184.5} {"train_loss": -19.54469871520996, "global_step": 43990, "epoch": 530} {"train_loss": -19.360126495361328, "global_step": 43991, "epoch": 530} {"train_loss": -19.59604835510254, "global_step": 43992, "epoch": 530} {"train_loss": -19.617786407470703, "global_step": 43993, "epoch": 530} {"train_loss": -19.649845123291016, "global_step": 43994, "epoch": 530} {"train_loss": -19.70281982421875, "global_step": 43995, "epoch": 530} {"train_loss": -19.802228927612305, "global_step": 43996, "epoch": 530} {"train_loss": -19.470050811767578, "global_step": 43997, "epoch": 530} {"train_loss": -19.3593807220459, "global_step": 43998, "epoch": 530} {"train_loss": -19.638046264648438, "global_step": 43999, "epoch": 530} {"train_loss": -19.582090377807617, "global_step": 44000, "epoch": 530} {"train_loss": -19.719890594482422, "global_step": 44001, "epoch": 530} {"train_loss": -19.9792537689209, "global_step": 44002, "epoch": 530} {"train_loss": -19.802486419677734, "global_step": 44003, "epoch": 530} {"train_loss": -19.474302291870117, "global_step": 44004, "epoch": 530} {"train_loss": -19.54958724975586, "global_step": 44005, "epoch": 530} {"train_loss": -19.33204460144043, "global_step": 44006, "epoch": 530} {"train_loss": -19.409629821777344, "global_step": 44007, "epoch": 530} {"train_loss": -19.96567153930664, "global_step": 44008, "epoch": 530} {"train_loss": -19.562152862548828, "global_step": 44009, "epoch": 530} {"train_loss": -19.677534103393555, "global_step": 44010, "epoch": 530} {"train_loss": -19.423776626586914, "global_step": 44011, "epoch": 530} {"train_loss": -19.74032974243164, "global_step": 44012, "epoch": 530} {"train_loss": -19.74405288696289, "global_step": 44013, "epoch": 530} {"train_loss": -19.576412200927734, "global_step": 44014, "epoch": 530} {"train_loss": -19.618850708007812, "global_step": 44015, "epoch": 530} {"train_loss": -19.1564998626709, "global_step": 44016, "epoch": 530} {"train_loss": -19.40250587463379, "global_step": 44017, "epoch": 530} {"train_loss": -19.65825653076172, "global_step": 44018, "epoch": 530} {"train_loss": -19.556411743164062, "global_step": 44019, "epoch": 530} {"train_loss": -19.87905502319336, "global_step": 44020, "epoch": 530} {"train_loss": -19.546436309814453, "global_step": 44021, "epoch": 530} {"train_loss": -19.5821590423584, "global_step": 44022, "epoch": 530} {"train_loss": -19.725522994995117, "global_step": 44023, "epoch": 530} {"train_loss": -19.44493293762207, "global_step": 44024, "epoch": 530} {"train_loss": -19.8774471282959, "global_step": 44025, "epoch": 530} {"train_loss": -19.805774688720703, "global_step": 44026, "epoch": 530} {"train_loss": -19.675275802612305, "global_step": 44027, "epoch": 530} {"train_loss": -19.25595474243164, "global_step": 44028, "epoch": 530} {"train_loss": -19.8249568939209, "global_step": 44029, "epoch": 530} {"train_loss": -20.00404167175293, "global_step": 44030, "epoch": 530} {"train_loss": -20.029949188232422, "global_step": 44031, "epoch": 530} {"train_loss": -19.566299438476562, "global_step": 44032, "epoch": 530} {"train_loss": -19.669357299804688, "global_step": 44033, "epoch": 530} {"train_loss": -20.12611198425293, "global_step": 44034, "epoch": 530} {"train_loss": -19.764677047729492, "global_step": 44035, "epoch": 530} {"train_loss": -19.64688491821289, "global_step": 44036, "epoch": 530} {"train_loss": -20.030349731445312, "global_step": 44037, "epoch": 530} {"train_loss": -19.107702255249023, "global_step": 44038, "epoch": 530} {"train_loss": -19.782827377319336, "global_step": 44039, "epoch": 530} {"train_loss": -20.02885627746582, "global_step": 44040, "epoch": 530} {"train_loss": -19.683277130126953, "global_step": 44041, "epoch": 530} {"train_loss": -19.457326889038086, "global_step": 44042, "epoch": 530} {"train_loss": -19.602025985717773, "global_step": 44043, "epoch": 530} {"train_loss": -19.328176498413086, "global_step": 44044, "epoch": 530} {"train_loss": -19.54279136657715, "global_step": 44045, "epoch": 530} {"train_loss": -19.763935089111328, "global_step": 44046, "epoch": 530} {"train_loss": -19.020732879638672, "global_step": 44047, "epoch": 530} {"train_loss": -19.634286880493164, "global_step": 44048, "epoch": 530} {"train_loss": -19.542287826538086, "global_step": 44049, "epoch": 530} {"train_loss": -19.50338363647461, "global_step": 44050, "epoch": 530} {"train_loss": -19.65209197998047, "global_step": 44051, "epoch": 530} {"train_loss": -19.825437545776367, "global_step": 44052, "epoch": 530} {"train_loss": -20.123443603515625, "global_step": 44053, "epoch": 530} {"train_loss": -19.47563362121582, "global_step": 44054, "epoch": 530} {"train_loss": -19.4400691986084, "global_step": 44055, "epoch": 530} {"train_loss": -19.492074966430664, "global_step": 44056, "epoch": 530} {"train_loss": -19.92864227294922, "global_step": 44057, "epoch": 530} {"train_loss": -19.238218307495117, "global_step": 44058, "epoch": 530} {"train_loss": -19.5179500579834, "global_step": 44059, "epoch": 530} {"train_loss": -19.848176956176758, "global_step": 44060, "epoch": 530} {"train_loss": -19.42181396484375, "global_step": 44061, "epoch": 530} {"train_loss": -19.568578720092773, "global_step": 44062, "epoch": 530} {"train_loss": -19.420557022094727, "global_step": 44063, "epoch": 530} {"train_loss": -20.087926864624023, "global_step": 44064, "epoch": 530} {"train_loss": -19.499765396118164, "global_step": 44065, "epoch": 530} {"train_loss": -19.740615844726562, "global_step": 44066, "epoch": 530} {"train_loss": -19.579919815063477, "global_step": 44067, "epoch": 530} {"train_loss": -19.37651252746582, "global_step": 44068, "epoch": 530} {"train_loss": -19.561010360717773, "global_step": 44069, "epoch": 530} {"train_loss": -19.476398468017578, "global_step": 44070, "epoch": 530} {"train_loss": -19.886173248291016, "global_step": 44071, "epoch": 530} {"train_loss": -19.623858233532275, "global_step": 44072, "epoch": 530, "val_loss": 6000782.0} {"train_loss": -19.182703018188477, "global_step": 44073, "epoch": 531} {"train_loss": -19.419662475585938, "global_step": 44074, "epoch": 531} {"train_loss": -19.776941299438477, "global_step": 44075, "epoch": 531} {"train_loss": -19.343473434448242, "global_step": 44076, "epoch": 531} {"train_loss": -19.47121238708496, "global_step": 44077, "epoch": 531} {"train_loss": -19.497922897338867, "global_step": 44078, "epoch": 531} {"train_loss": -19.682933807373047, "global_step": 44079, "epoch": 531} {"train_loss": -19.4085636138916, "global_step": 44080, "epoch": 531} {"train_loss": -19.658157348632812, "global_step": 44081, "epoch": 531} {"train_loss": -19.678573608398438, "global_step": 44082, "epoch": 531} {"train_loss": -19.765737533569336, "global_step": 44083, "epoch": 531} {"train_loss": -19.44733238220215, "global_step": 44084, "epoch": 531} {"train_loss": -19.732852935791016, "global_step": 44085, "epoch": 531} {"train_loss": -19.94183921813965, "global_step": 44086, "epoch": 531} {"train_loss": -19.510761260986328, "global_step": 44087, "epoch": 531} {"train_loss": -19.574935913085938, "global_step": 44088, "epoch": 531} {"train_loss": -19.5037841796875, "global_step": 44089, "epoch": 531} {"train_loss": -19.60967445373535, "global_step": 44090, "epoch": 531} {"train_loss": -19.892425537109375, "global_step": 44091, "epoch": 531} {"train_loss": -19.654582977294922, "global_step": 44092, "epoch": 531} {"train_loss": -19.363605499267578, "global_step": 44093, "epoch": 531} {"train_loss": -19.740306854248047, "global_step": 44094, "epoch": 531} {"train_loss": -19.497758865356445, "global_step": 44095, "epoch": 531} {"train_loss": -19.664213180541992, "global_step": 44096, "epoch": 531} {"train_loss": -19.666757583618164, "global_step": 44097, "epoch": 531} {"train_loss": -19.96259880065918, "global_step": 44098, "epoch": 531} {"train_loss": -19.609495162963867, "global_step": 44099, "epoch": 531} {"train_loss": -19.783830642700195, "global_step": 44100, "epoch": 531} {"train_loss": -19.07901382446289, "global_step": 44101, "epoch": 531} {"train_loss": -19.6533203125, "global_step": 44102, "epoch": 531} {"train_loss": -19.459863662719727, "global_step": 44103, "epoch": 531} {"train_loss": -19.29252815246582, "global_step": 44104, "epoch": 531} {"train_loss": -19.580354690551758, "global_step": 44105, "epoch": 531} {"train_loss": -19.969215393066406, "global_step": 44106, "epoch": 531} {"train_loss": -19.708364486694336, "global_step": 44107, "epoch": 531} {"train_loss": -19.520652770996094, "global_step": 44108, "epoch": 531} {"train_loss": -19.920835494995117, "global_step": 44109, "epoch": 531} {"train_loss": -19.56537628173828, "global_step": 44110, "epoch": 531} {"train_loss": -19.631250381469727, "global_step": 44111, "epoch": 531} {"train_loss": -19.606775283813477, "global_step": 44112, "epoch": 531} {"train_loss": -19.697904586791992, "global_step": 44113, "epoch": 531} {"train_loss": -19.617765426635742, "global_step": 44114, "epoch": 531} {"train_loss": -20.01122283935547, "global_step": 44115, "epoch": 531} {"train_loss": -19.315536499023438, "global_step": 44116, "epoch": 531} {"train_loss": -19.852853775024414, "global_step": 44117, "epoch": 531} {"train_loss": -19.10893440246582, "global_step": 44118, "epoch": 531} {"train_loss": -19.5492000579834, "global_step": 44119, "epoch": 531} {"train_loss": -19.382322311401367, "global_step": 44120, "epoch": 531} {"train_loss": -19.509611129760742, "global_step": 44121, "epoch": 531} {"train_loss": -19.535675048828125, "global_step": 44122, "epoch": 531} {"train_loss": -19.449893951416016, "global_step": 44123, "epoch": 531} {"train_loss": -19.56270408630371, "global_step": 44124, "epoch": 531} {"train_loss": -19.81279945373535, "global_step": 44125, "epoch": 531} {"train_loss": -19.493101119995117, "global_step": 44126, "epoch": 531} {"train_loss": -19.691694259643555, "global_step": 44127, "epoch": 531} {"train_loss": -19.829179763793945, "global_step": 44128, "epoch": 531} {"train_loss": -19.487457275390625, "global_step": 44129, "epoch": 531} {"train_loss": -19.573606491088867, "global_step": 44130, "epoch": 531} {"train_loss": -19.805971145629883, "global_step": 44131, "epoch": 531} {"train_loss": -19.48207664489746, "global_step": 44132, "epoch": 531} {"train_loss": -19.814260482788086, "global_step": 44133, "epoch": 531} {"train_loss": -19.623584747314453, "global_step": 44134, "epoch": 531} {"train_loss": -19.58624839782715, "global_step": 44135, "epoch": 531} {"train_loss": -19.719762802124023, "global_step": 44136, "epoch": 531} {"train_loss": -19.535860061645508, "global_step": 44137, "epoch": 531} {"train_loss": -19.792768478393555, "global_step": 44138, "epoch": 531} {"train_loss": -19.607831954956055, "global_step": 44139, "epoch": 531} {"train_loss": -19.723234176635742, "global_step": 44140, "epoch": 531} {"train_loss": -20.00634765625, "global_step": 44141, "epoch": 531} {"train_loss": -19.44260025024414, "global_step": 44142, "epoch": 531} {"train_loss": -19.77616310119629, "global_step": 44143, "epoch": 531} {"train_loss": -19.439905166625977, "global_step": 44144, "epoch": 531} {"train_loss": -19.958423614501953, "global_step": 44145, "epoch": 531} {"train_loss": -19.9180850982666, "global_step": 44146, "epoch": 531} {"train_loss": -19.621368408203125, "global_step": 44147, "epoch": 531} {"train_loss": -19.763486862182617, "global_step": 44148, "epoch": 531} {"train_loss": -19.9525089263916, "global_step": 44149, "epoch": 531} {"train_loss": -19.730575561523438, "global_step": 44150, "epoch": 531} {"train_loss": -19.370786666870117, "global_step": 44151, "epoch": 531} {"train_loss": -19.147748947143555, "global_step": 44152, "epoch": 531} {"train_loss": -19.499332427978516, "global_step": 44153, "epoch": 531} {"train_loss": -20.164766311645508, "global_step": 44154, "epoch": 531} {"train_loss": -19.631356963192125, "global_step": 44155, "epoch": 531, "val_loss": 5940982.0} {"train_loss": -18.699371337890625, "global_step": 44156, "epoch": 532} {"train_loss": -19.29715919494629, "global_step": 44157, "epoch": 532} {"train_loss": -19.137317657470703, "global_step": 44158, "epoch": 532} {"train_loss": -19.021244049072266, "global_step": 44159, "epoch": 532} {"train_loss": -19.08489990234375, "global_step": 44160, "epoch": 532} {"train_loss": -19.509031295776367, "global_step": 44161, "epoch": 532} {"train_loss": -19.511030197143555, "global_step": 44162, "epoch": 532} {"train_loss": -19.000455856323242, "global_step": 44163, "epoch": 532} {"train_loss": -19.334739685058594, "global_step": 44164, "epoch": 532} {"train_loss": -19.641788482666016, "global_step": 44165, "epoch": 532} {"train_loss": -19.222909927368164, "global_step": 44166, "epoch": 532} {"train_loss": -19.205463409423828, "global_step": 44167, "epoch": 532} {"train_loss": -19.339069366455078, "global_step": 44168, "epoch": 532} {"train_loss": -19.611515045166016, "global_step": 44169, "epoch": 532} {"train_loss": -19.147314071655273, "global_step": 44170, "epoch": 532} {"train_loss": -19.51089859008789, "global_step": 44171, "epoch": 532} {"train_loss": -19.542423248291016, "global_step": 44172, "epoch": 532} {"train_loss": -19.568527221679688, "global_step": 44173, "epoch": 532} {"train_loss": -19.60474395751953, "global_step": 44174, "epoch": 532} {"train_loss": -19.64362144470215, "global_step": 44175, "epoch": 532} {"train_loss": -19.52501678466797, "global_step": 44176, "epoch": 532} {"train_loss": -19.65015983581543, "global_step": 44177, "epoch": 532} {"train_loss": -19.4732666015625, "global_step": 44178, "epoch": 532} {"train_loss": -19.767921447753906, "global_step": 44179, "epoch": 532} {"train_loss": -19.607831954956055, "global_step": 44180, "epoch": 532} {"train_loss": -19.196664810180664, "global_step": 44181, "epoch": 532} {"train_loss": -19.620450973510742, "global_step": 44182, "epoch": 532} {"train_loss": -19.1622371673584, "global_step": 44183, "epoch": 532} {"train_loss": -19.6884765625, "global_step": 44184, "epoch": 532} {"train_loss": -19.662473678588867, "global_step": 44185, "epoch": 532} {"train_loss": -19.645164489746094, "global_step": 44186, "epoch": 532} {"train_loss": -19.562049865722656, "global_step": 44187, "epoch": 532} {"train_loss": -19.55769920349121, "global_step": 44188, "epoch": 532} {"train_loss": -19.627750396728516, "global_step": 44189, "epoch": 532} {"train_loss": -19.56119155883789, "global_step": 44190, "epoch": 532} {"train_loss": -19.396989822387695, "global_step": 44191, "epoch": 532} {"train_loss": -19.76447868347168, "global_step": 44192, "epoch": 532} {"train_loss": -19.794631958007812, "global_step": 44193, "epoch": 532} {"train_loss": -19.85663414001465, "global_step": 44194, "epoch": 532} {"train_loss": -19.65517807006836, "global_step": 44195, "epoch": 532} {"train_loss": -20.018415451049805, "global_step": 44196, "epoch": 532} {"train_loss": -19.4769229888916, "global_step": 44197, "epoch": 532} {"train_loss": -19.812965393066406, "global_step": 44198, "epoch": 532} {"train_loss": -19.66132164001465, "global_step": 44199, "epoch": 532} {"train_loss": -20.050397872924805, "global_step": 44200, "epoch": 532} {"train_loss": -19.646650314331055, "global_step": 44201, "epoch": 532} {"train_loss": -19.517683029174805, "global_step": 44202, "epoch": 532} {"train_loss": -19.758060455322266, "global_step": 44203, "epoch": 532} {"train_loss": -19.77926254272461, "global_step": 44204, "epoch": 532} {"train_loss": -19.925430297851562, "global_step": 44205, "epoch": 532} {"train_loss": -19.876972198486328, "global_step": 44206, "epoch": 532} {"train_loss": -19.675521850585938, "global_step": 44207, "epoch": 532} {"train_loss": -19.51227378845215, "global_step": 44208, "epoch": 532} {"train_loss": -19.553434371948242, "global_step": 44209, "epoch": 532} {"train_loss": -19.733320236206055, "global_step": 44210, "epoch": 532} {"train_loss": -19.454288482666016, "global_step": 44211, "epoch": 532} {"train_loss": -19.617088317871094, "global_step": 44212, "epoch": 532} {"train_loss": -19.48349952697754, "global_step": 44213, "epoch": 532} {"train_loss": -19.516172409057617, "global_step": 44214, "epoch": 532} {"train_loss": -19.133272171020508, "global_step": 44215, "epoch": 532} {"train_loss": -19.916099548339844, "global_step": 44216, "epoch": 532} {"train_loss": -19.59685707092285, "global_step": 44217, "epoch": 532} {"train_loss": -19.31463050842285, "global_step": 44218, "epoch": 532} {"train_loss": -19.34003448486328, "global_step": 44219, "epoch": 532} {"train_loss": -19.521738052368164, "global_step": 44220, "epoch": 532} {"train_loss": -19.303970336914062, "global_step": 44221, "epoch": 532} {"train_loss": -19.49806022644043, "global_step": 44222, "epoch": 532} {"train_loss": -19.553281784057617, "global_step": 44223, "epoch": 532} {"train_loss": -19.54774284362793, "global_step": 44224, "epoch": 532} {"train_loss": -20.010107040405273, "global_step": 44225, "epoch": 532} {"train_loss": -19.111366271972656, "global_step": 44226, "epoch": 532} {"train_loss": -19.57430076599121, "global_step": 44227, "epoch": 532} {"train_loss": -19.745370864868164, "global_step": 44228, "epoch": 532} {"train_loss": -19.719133377075195, "global_step": 44229, "epoch": 532} {"train_loss": -20.0184383392334, "global_step": 44230, "epoch": 532} {"train_loss": -19.65119171142578, "global_step": 44231, "epoch": 532} {"train_loss": -19.620826721191406, "global_step": 44232, "epoch": 532} {"train_loss": -19.629404067993164, "global_step": 44233, "epoch": 532} {"train_loss": -19.537382125854492, "global_step": 44234, "epoch": 532} {"train_loss": -19.675931930541992, "global_step": 44235, "epoch": 532} {"train_loss": -19.837186813354492, "global_step": 44236, "epoch": 532} {"train_loss": -19.723438262939453, "global_step": 44237, "epoch": 532} {"train_loss": -19.54198949882783, "global_step": 44238, "epoch": 532, "val_loss": 6032375.0} {"train_loss": -19.559677124023438, "global_step": 44239, "epoch": 533} {"train_loss": -19.75950050354004, "global_step": 44240, "epoch": 533} {"train_loss": -19.654420852661133, "global_step": 44241, "epoch": 533} {"train_loss": -19.472503662109375, "global_step": 44242, "epoch": 533} {"train_loss": -19.310876846313477, "global_step": 44243, "epoch": 533} {"train_loss": -19.297256469726562, "global_step": 44244, "epoch": 533} {"train_loss": -19.342166900634766, "global_step": 44245, "epoch": 533} {"train_loss": -19.576099395751953, "global_step": 44246, "epoch": 533} {"train_loss": -19.476171493530273, "global_step": 44247, "epoch": 533} {"train_loss": -19.498708724975586, "global_step": 44248, "epoch": 533} {"train_loss": -19.03839683532715, "global_step": 44249, "epoch": 533} {"train_loss": -19.717355728149414, "global_step": 44250, "epoch": 533} {"train_loss": -19.51289939880371, "global_step": 44251, "epoch": 533} {"train_loss": -19.570737838745117, "global_step": 44252, "epoch": 533} {"train_loss": -19.729257583618164, "global_step": 44253, "epoch": 533} {"train_loss": -19.641986846923828, "global_step": 44254, "epoch": 533} {"train_loss": -19.847686767578125, "global_step": 44255, "epoch": 533} {"train_loss": -19.743759155273438, "global_step": 44256, "epoch": 533} {"train_loss": -20.013050079345703, "global_step": 44257, "epoch": 533} {"train_loss": -19.507413864135742, "global_step": 44258, "epoch": 533} {"train_loss": -19.643163681030273, "global_step": 44259, "epoch": 533} {"train_loss": -20.084644317626953, "global_step": 44260, "epoch": 533} {"train_loss": -19.63294219970703, "global_step": 44261, "epoch": 533} {"train_loss": -19.69548988342285, "global_step": 44262, "epoch": 533} {"train_loss": -19.484764099121094, "global_step": 44263, "epoch": 533} {"train_loss": -19.750978469848633, "global_step": 44264, "epoch": 533} {"train_loss": -19.46885871887207, "global_step": 44265, "epoch": 533} {"train_loss": -19.470853805541992, "global_step": 44266, "epoch": 533} {"train_loss": -19.723112106323242, "global_step": 44267, "epoch": 533} {"train_loss": -19.592700958251953, "global_step": 44268, "epoch": 533} {"train_loss": -19.751663208007812, "global_step": 44269, "epoch": 533} {"train_loss": -19.668058395385742, "global_step": 44270, "epoch": 533} {"train_loss": -19.861042022705078, "global_step": 44271, "epoch": 533} {"train_loss": -19.263635635375977, "global_step": 44272, "epoch": 533} {"train_loss": -20.06662368774414, "global_step": 44273, "epoch": 533} {"train_loss": -19.767427444458008, "global_step": 44274, "epoch": 533} {"train_loss": -19.650096893310547, "global_step": 44275, "epoch": 533} {"train_loss": -19.595569610595703, "global_step": 44276, "epoch": 533} {"train_loss": -19.727182388305664, "global_step": 44277, "epoch": 533} {"train_loss": -19.935468673706055, "global_step": 44278, "epoch": 533} {"train_loss": -19.440799713134766, "global_step": 44279, "epoch": 533} {"train_loss": -19.96352195739746, "global_step": 44280, "epoch": 533} {"train_loss": -20.00042152404785, "global_step": 44281, "epoch": 533} {"train_loss": -19.57356834411621, "global_step": 44282, "epoch": 533} {"train_loss": -19.79391860961914, "global_step": 44283, "epoch": 533} {"train_loss": -19.84284019470215, "global_step": 44284, "epoch": 533} {"train_loss": -19.747915267944336, "global_step": 44285, "epoch": 533} {"train_loss": -19.756982803344727, "global_step": 44286, "epoch": 533} {"train_loss": -19.600217819213867, "global_step": 44287, "epoch": 533} {"train_loss": -19.41657066345215, "global_step": 44288, "epoch": 533} {"train_loss": -19.89373779296875, "global_step": 44289, "epoch": 533} {"train_loss": -19.834875106811523, "global_step": 44290, "epoch": 533} {"train_loss": -19.271575927734375, "global_step": 44291, "epoch": 533} {"train_loss": -19.989673614501953, "global_step": 44292, "epoch": 533} {"train_loss": -20.07270622253418, "global_step": 44293, "epoch": 533} {"train_loss": -19.855581283569336, "global_step": 44294, "epoch": 533} {"train_loss": -19.94663429260254, "global_step": 44295, "epoch": 533} {"train_loss": -20.086957931518555, "global_step": 44296, "epoch": 533} {"train_loss": -19.716947555541992, "global_step": 44297, "epoch": 533} {"train_loss": -19.649518966674805, "global_step": 44298, "epoch": 533} {"train_loss": -19.36481475830078, "global_step": 44299, "epoch": 533} {"train_loss": -19.755659103393555, "global_step": 44300, "epoch": 533} {"train_loss": -19.71297264099121, "global_step": 44301, "epoch": 533} {"train_loss": -19.503158569335938, "global_step": 44302, "epoch": 533} {"train_loss": -20.038400650024414, "global_step": 44303, "epoch": 533} {"train_loss": -19.302553176879883, "global_step": 44304, "epoch": 533} {"train_loss": -19.615909576416016, "global_step": 44305, "epoch": 533} {"train_loss": -19.33376121520996, "global_step": 44306, "epoch": 533} {"train_loss": -19.660581588745117, "global_step": 44307, "epoch": 533} {"train_loss": -19.799665451049805, "global_step": 44308, "epoch": 533} {"train_loss": -19.34572410583496, "global_step": 44309, "epoch": 533} {"train_loss": -19.480253219604492, "global_step": 44310, "epoch": 533} {"train_loss": -19.73900032043457, "global_step": 44311, "epoch": 533} {"train_loss": -19.6805419921875, "global_step": 44312, "epoch": 533} {"train_loss": -19.39179801940918, "global_step": 44313, "epoch": 533} {"train_loss": -19.678953170776367, "global_step": 44314, "epoch": 533} {"train_loss": -19.626615524291992, "global_step": 44315, "epoch": 533} {"train_loss": -19.705068588256836, "global_step": 44316, "epoch": 533} {"train_loss": -19.455530166625977, "global_step": 44317, "epoch": 533} {"train_loss": -19.881668090820312, "global_step": 44318, "epoch": 533} {"train_loss": -19.90496063232422, "global_step": 44319, "epoch": 533} {"train_loss": -19.40057945251465, "global_step": 44320, "epoch": 533} {"train_loss": -19.649309503026757, "global_step": 44321, "epoch": 533, "val_loss": 5914247.5} {"train_loss": -19.0217227935791, "global_step": 44322, "epoch": 534} {"train_loss": -19.31698226928711, "global_step": 44323, "epoch": 534} {"train_loss": -19.1639347076416, "global_step": 44324, "epoch": 534} {"train_loss": -19.063037872314453, "global_step": 44325, "epoch": 534} {"train_loss": -19.30496597290039, "global_step": 44326, "epoch": 534} {"train_loss": -19.54267692565918, "global_step": 44327, "epoch": 534} {"train_loss": -19.273542404174805, "global_step": 44328, "epoch": 534} {"train_loss": -19.32538414001465, "global_step": 44329, "epoch": 534} {"train_loss": -18.848112106323242, "global_step": 44330, "epoch": 534} {"train_loss": -19.161338806152344, "global_step": 44331, "epoch": 534} {"train_loss": -19.61590576171875, "global_step": 44332, "epoch": 534} {"train_loss": -19.435955047607422, "global_step": 44333, "epoch": 534} {"train_loss": -19.840269088745117, "global_step": 44334, "epoch": 534} {"train_loss": -19.496007919311523, "global_step": 44335, "epoch": 534} {"train_loss": -19.2767276763916, "global_step": 44336, "epoch": 534} {"train_loss": -19.2641658782959, "global_step": 44337, "epoch": 534} {"train_loss": -19.21109390258789, "global_step": 44338, "epoch": 534} {"train_loss": -19.54093360900879, "global_step": 44339, "epoch": 534} {"train_loss": -19.568044662475586, "global_step": 44340, "epoch": 534} {"train_loss": -19.550220489501953, "global_step": 44341, "epoch": 534} {"train_loss": -19.585201263427734, "global_step": 44342, "epoch": 534} {"train_loss": -19.84435272216797, "global_step": 44343, "epoch": 534} {"train_loss": -19.917652130126953, "global_step": 44344, "epoch": 534} {"train_loss": -19.45418357849121, "global_step": 44345, "epoch": 534} {"train_loss": -19.451566696166992, "global_step": 44346, "epoch": 534} {"train_loss": -19.75020408630371, "global_step": 44347, "epoch": 534} {"train_loss": -19.44166374206543, "global_step": 44348, "epoch": 534} {"train_loss": -19.726797103881836, "global_step": 44349, "epoch": 534} {"train_loss": -19.568115234375, "global_step": 44350, "epoch": 534} {"train_loss": -19.72025489807129, "global_step": 44351, "epoch": 534} {"train_loss": -19.120777130126953, "global_step": 44352, "epoch": 534} {"train_loss": -19.409265518188477, "global_step": 44353, "epoch": 534} {"train_loss": -19.763267517089844, "global_step": 44354, "epoch": 534} {"train_loss": -19.746307373046875, "global_step": 44355, "epoch": 534} {"train_loss": -19.62332534790039, "global_step": 44356, "epoch": 534} {"train_loss": -19.601402282714844, "global_step": 44357, "epoch": 534} {"train_loss": -19.537479400634766, "global_step": 44358, "epoch": 534} {"train_loss": -19.523727416992188, "global_step": 44359, "epoch": 534} {"train_loss": -19.514280319213867, "global_step": 44360, "epoch": 534} {"train_loss": -19.705753326416016, "global_step": 44361, "epoch": 534} {"train_loss": -19.91590690612793, "global_step": 44362, "epoch": 534} {"train_loss": -19.8355712890625, "global_step": 44363, "epoch": 534} {"train_loss": -19.676738739013672, "global_step": 44364, "epoch": 534} {"train_loss": -19.838239669799805, "global_step": 44365, "epoch": 534} {"train_loss": -19.62655258178711, "global_step": 44366, "epoch": 534} {"train_loss": -19.46770477294922, "global_step": 44367, "epoch": 534} {"train_loss": -19.74735450744629, "global_step": 44368, "epoch": 534} {"train_loss": -19.85150718688965, "global_step": 44369, "epoch": 534} {"train_loss": -19.954458236694336, "global_step": 44370, "epoch": 534} {"train_loss": -19.531396865844727, "global_step": 44371, "epoch": 534} {"train_loss": -19.434738159179688, "global_step": 44372, "epoch": 534} {"train_loss": -19.70905113220215, "global_step": 44373, "epoch": 534} {"train_loss": -19.538259506225586, "global_step": 44374, "epoch": 534} {"train_loss": -19.376012802124023, "global_step": 44375, "epoch": 534} {"train_loss": -19.293569564819336, "global_step": 44376, "epoch": 534} {"train_loss": -19.451946258544922, "global_step": 44377, "epoch": 534} {"train_loss": -19.81114387512207, "global_step": 44378, "epoch": 534} {"train_loss": -19.732770919799805, "global_step": 44379, "epoch": 534} {"train_loss": -19.537446975708008, "global_step": 44380, "epoch": 534} {"train_loss": -19.709484100341797, "global_step": 44381, "epoch": 534} {"train_loss": -19.723800659179688, "global_step": 44382, "epoch": 534} {"train_loss": -19.330415725708008, "global_step": 44383, "epoch": 534} {"train_loss": -19.420019149780273, "global_step": 44384, "epoch": 534} {"train_loss": -19.77692985534668, "global_step": 44385, "epoch": 534} {"train_loss": -19.43735694885254, "global_step": 44386, "epoch": 534} {"train_loss": -19.835159301757812, "global_step": 44387, "epoch": 534} {"train_loss": -19.579938888549805, "global_step": 44388, "epoch": 534} {"train_loss": -19.43524169921875, "global_step": 44389, "epoch": 534} {"train_loss": -19.78053855895996, "global_step": 44390, "epoch": 534} {"train_loss": -19.85147476196289, "global_step": 44391, "epoch": 534} {"train_loss": -19.647308349609375, "global_step": 44392, "epoch": 534} {"train_loss": -19.62495994567871, "global_step": 44393, "epoch": 534} {"train_loss": -19.493453979492188, "global_step": 44394, "epoch": 534} {"train_loss": -19.711254119873047, "global_step": 44395, "epoch": 534} {"train_loss": -19.85821533203125, "global_step": 44396, "epoch": 534} {"train_loss": -19.27277946472168, "global_step": 44397, "epoch": 534} {"train_loss": -19.74030876159668, "global_step": 44398, "epoch": 534} {"train_loss": -19.729265213012695, "global_step": 44399, "epoch": 534} {"train_loss": -19.583538055419922, "global_step": 44400, "epoch": 534} {"train_loss": -19.686288833618164, "global_step": 44401, "epoch": 534} {"train_loss": -19.791486740112305, "global_step": 44402, "epoch": 534} {"train_loss": -19.72902488708496, "global_step": 44403, "epoch": 534} {"train_loss": -19.56375096792198, "global_step": 44404, "epoch": 534, "val_loss": 6038028.0} {"train_loss": -19.408498764038086, "global_step": 44405, "epoch": 535} {"train_loss": -19.199060440063477, "global_step": 44406, "epoch": 535} {"train_loss": -19.64717674255371, "global_step": 44407, "epoch": 535} {"train_loss": -19.641950607299805, "global_step": 44408, "epoch": 535} {"train_loss": -19.557212829589844, "global_step": 44409, "epoch": 535} {"train_loss": -19.57021141052246, "global_step": 44410, "epoch": 535} {"train_loss": -19.52766227722168, "global_step": 44411, "epoch": 535} {"train_loss": -19.64607810974121, "global_step": 44412, "epoch": 535} {"train_loss": -19.96674156188965, "global_step": 44413, "epoch": 535} {"train_loss": -19.671295166015625, "global_step": 44414, "epoch": 535} {"train_loss": -19.63629722595215, "global_step": 44415, "epoch": 535} {"train_loss": -19.345605850219727, "global_step": 44416, "epoch": 535} {"train_loss": -19.667129516601562, "global_step": 44417, "epoch": 535} {"train_loss": -20.0333309173584, "global_step": 44418, "epoch": 535} {"train_loss": -19.823699951171875, "global_step": 44419, "epoch": 535} {"train_loss": -19.580602645874023, "global_step": 44420, "epoch": 535} {"train_loss": -19.58213233947754, "global_step": 44421, "epoch": 535} {"train_loss": -19.369943618774414, "global_step": 44422, "epoch": 535} {"train_loss": -19.208112716674805, "global_step": 44423, "epoch": 535} {"train_loss": -19.436695098876953, "global_step": 44424, "epoch": 535} {"train_loss": -19.702524185180664, "global_step": 44425, "epoch": 535} {"train_loss": -19.27161979675293, "global_step": 44426, "epoch": 535} {"train_loss": -19.483182907104492, "global_step": 44427, "epoch": 535} {"train_loss": -19.622060775756836, "global_step": 44428, "epoch": 535} {"train_loss": -19.868871688842773, "global_step": 44429, "epoch": 535} {"train_loss": -20.037525177001953, "global_step": 44430, "epoch": 535} {"train_loss": -19.833240509033203, "global_step": 44431, "epoch": 535} {"train_loss": -19.828153610229492, "global_step": 44432, "epoch": 535} {"train_loss": -19.691654205322266, "global_step": 44433, "epoch": 535} {"train_loss": -19.713865280151367, "global_step": 44434, "epoch": 535} {"train_loss": -19.57634925842285, "global_step": 44435, "epoch": 535} {"train_loss": -19.75874137878418, "global_step": 44436, "epoch": 535} {"train_loss": -19.525724411010742, "global_step": 44437, "epoch": 535} {"train_loss": -19.72944450378418, "global_step": 44438, "epoch": 535} {"train_loss": -19.3935489654541, "global_step": 44439, "epoch": 535} {"train_loss": -19.53614616394043, "global_step": 44440, "epoch": 535} {"train_loss": -19.547941207885742, "global_step": 44441, "epoch": 535} {"train_loss": -19.54999351501465, "global_step": 44442, "epoch": 535} {"train_loss": -19.719501495361328, "global_step": 44443, "epoch": 535} {"train_loss": -20.125776290893555, "global_step": 44444, "epoch": 535} {"train_loss": -19.236724853515625, "global_step": 44445, "epoch": 535} {"train_loss": -19.901193618774414, "global_step": 44446, "epoch": 535} {"train_loss": -19.551252365112305, "global_step": 44447, "epoch": 535} {"train_loss": -19.70476722717285, "global_step": 44448, "epoch": 535} {"train_loss": -20.257593154907227, "global_step": 44449, "epoch": 535} {"train_loss": -19.462158203125, "global_step": 44450, "epoch": 535} {"train_loss": -19.472997665405273, "global_step": 44451, "epoch": 535} {"train_loss": -19.49687385559082, "global_step": 44452, "epoch": 535} {"train_loss": -19.861703872680664, "global_step": 44453, "epoch": 535} {"train_loss": -19.403501510620117, "global_step": 44454, "epoch": 535} {"train_loss": -19.424991607666016, "global_step": 44455, "epoch": 535} {"train_loss": -19.411392211914062, "global_step": 44456, "epoch": 535} {"train_loss": -19.369962692260742, "global_step": 44457, "epoch": 535} {"train_loss": -19.43833351135254, "global_step": 44458, "epoch": 535} {"train_loss": -19.695837020874023, "global_step": 44459, "epoch": 535} {"train_loss": -19.598690032958984, "global_step": 44460, "epoch": 535} {"train_loss": -19.68813133239746, "global_step": 44461, "epoch": 535} {"train_loss": -19.531538009643555, "global_step": 44462, "epoch": 535} {"train_loss": -19.813901901245117, "global_step": 44463, "epoch": 535} {"train_loss": -19.962926864624023, "global_step": 44464, "epoch": 535} {"train_loss": -19.75241470336914, "global_step": 44465, "epoch": 535} {"train_loss": -19.600313186645508, "global_step": 44466, "epoch": 535} {"train_loss": -19.743799209594727, "global_step": 44467, "epoch": 535} {"train_loss": -19.704607009887695, "global_step": 44468, "epoch": 535} {"train_loss": -20.06928825378418, "global_step": 44469, "epoch": 535} {"train_loss": -19.66560173034668, "global_step": 44470, "epoch": 535} {"train_loss": -19.88028907775879, "global_step": 44471, "epoch": 535} {"train_loss": -19.847299575805664, "global_step": 44472, "epoch": 535} {"train_loss": -19.829437255859375, "global_step": 44473, "epoch": 535} {"train_loss": -19.890817642211914, "global_step": 44474, "epoch": 535} {"train_loss": -19.624977111816406, "global_step": 44475, "epoch": 535} {"train_loss": -19.91657829284668, "global_step": 44476, "epoch": 535} {"train_loss": -19.650251388549805, "global_step": 44477, "epoch": 535} {"train_loss": -19.819305419921875, "global_step": 44478, "epoch": 535} {"train_loss": -19.666234970092773, "global_step": 44479, "epoch": 535} {"train_loss": -19.4502010345459, "global_step": 44480, "epoch": 535} {"train_loss": -19.44696617126465, "global_step": 44481, "epoch": 535} {"train_loss": -19.627233505249023, "global_step": 44482, "epoch": 535} {"train_loss": -19.91950035095215, "global_step": 44483, "epoch": 535} {"train_loss": -19.827056884765625, "global_step": 44484, "epoch": 535} {"train_loss": -19.885770797729492, "global_step": 44485, "epoch": 535} {"train_loss": -19.746692657470703, "global_step": 44486, "epoch": 535} {"train_loss": -19.64807009409709, "global_step": 44487, "epoch": 535, "val_loss": 5990533.5} {"train_loss": -19.49789810180664, "global_step": 44488, "epoch": 536} {"train_loss": -19.21744728088379, "global_step": 44489, "epoch": 536} {"train_loss": -19.237682342529297, "global_step": 44490, "epoch": 536} {"train_loss": -19.360614776611328, "global_step": 44491, "epoch": 536} {"train_loss": -19.113067626953125, "global_step": 44492, "epoch": 536} {"train_loss": -19.181781768798828, "global_step": 44493, "epoch": 536} {"train_loss": -19.451934814453125, "global_step": 44494, "epoch": 536} {"train_loss": -19.371824264526367, "global_step": 44495, "epoch": 536} {"train_loss": -19.54252052307129, "global_step": 44496, "epoch": 536} {"train_loss": -19.26145362854004, "global_step": 44497, "epoch": 536} {"train_loss": -19.549238204956055, "global_step": 44498, "epoch": 536} {"train_loss": -18.92457389831543, "global_step": 44499, "epoch": 536} {"train_loss": -19.353952407836914, "global_step": 44500, "epoch": 536} {"train_loss": -19.72591209411621, "global_step": 44501, "epoch": 536} {"train_loss": -19.361249923706055, "global_step": 44502, "epoch": 536} {"train_loss": -19.710342407226562, "global_step": 44503, "epoch": 536} {"train_loss": -19.572696685791016, "global_step": 44504, "epoch": 536} {"train_loss": -19.91438865661621, "global_step": 44505, "epoch": 536} {"train_loss": -19.65683937072754, "global_step": 44506, "epoch": 536} {"train_loss": -19.583282470703125, "global_step": 44507, "epoch": 536} {"train_loss": -19.661529541015625, "global_step": 44508, "epoch": 536} {"train_loss": -19.392789840698242, "global_step": 44509, "epoch": 536} {"train_loss": -19.538883209228516, "global_step": 44510, "epoch": 536} {"train_loss": -19.5997257232666, "global_step": 44511, "epoch": 536} {"train_loss": -19.783130645751953, "global_step": 44512, "epoch": 536} {"train_loss": -19.48642349243164, "global_step": 44513, "epoch": 536} {"train_loss": -19.411386489868164, "global_step": 44514, "epoch": 536} {"train_loss": -20.052391052246094, "global_step": 44515, "epoch": 536} {"train_loss": -19.51692771911621, "global_step": 44516, "epoch": 536} {"train_loss": -19.905908584594727, "global_step": 44517, "epoch": 536} {"train_loss": -19.547513961791992, "global_step": 44518, "epoch": 536} {"train_loss": -19.55996322631836, "global_step": 44519, "epoch": 536} {"train_loss": -19.55577278137207, "global_step": 44520, "epoch": 536} {"train_loss": -19.52399253845215, "global_step": 44521, "epoch": 536} {"train_loss": -19.36724281311035, "global_step": 44522, "epoch": 536} {"train_loss": -19.263105392456055, "global_step": 44523, "epoch": 536} {"train_loss": -19.726428985595703, "global_step": 44524, "epoch": 536} {"train_loss": -19.764793395996094, "global_step": 44525, "epoch": 536} {"train_loss": -19.44462013244629, "global_step": 44526, "epoch": 536} {"train_loss": -19.455041885375977, "global_step": 44527, "epoch": 536} {"train_loss": -19.94329833984375, "global_step": 44528, "epoch": 536} {"train_loss": -19.36358642578125, "global_step": 44529, "epoch": 536} {"train_loss": -19.57821273803711, "global_step": 44530, "epoch": 536} {"train_loss": -19.713987350463867, "global_step": 44531, "epoch": 536} {"train_loss": -19.629850387573242, "global_step": 44532, "epoch": 536} {"train_loss": -19.622333526611328, "global_step": 44533, "epoch": 536} {"train_loss": -20.18732261657715, "global_step": 44534, "epoch": 536} {"train_loss": -19.67696189880371, "global_step": 44535, "epoch": 536} {"train_loss": -19.695798873901367, "global_step": 44536, "epoch": 536} {"train_loss": -19.640653610229492, "global_step": 44537, "epoch": 536} {"train_loss": -19.564733505249023, "global_step": 44538, "epoch": 536} {"train_loss": -19.6694393157959, "global_step": 44539, "epoch": 536} {"train_loss": -19.62064552307129, "global_step": 44540, "epoch": 536} {"train_loss": -20.356828689575195, "global_step": 44541, "epoch": 536} {"train_loss": -19.5140438079834, "global_step": 44542, "epoch": 536} {"train_loss": -19.920507431030273, "global_step": 44543, "epoch": 536} {"train_loss": -19.7631893157959, "global_step": 44544, "epoch": 536} {"train_loss": -19.811147689819336, "global_step": 44545, "epoch": 536} {"train_loss": -19.629770278930664, "global_step": 44546, "epoch": 536} {"train_loss": -20.006818771362305, "global_step": 44547, "epoch": 536} {"train_loss": -19.476957321166992, "global_step": 44548, "epoch": 536} {"train_loss": -19.504911422729492, "global_step": 44549, "epoch": 536} {"train_loss": -19.72541618347168, "global_step": 44550, "epoch": 536} {"train_loss": -19.86449432373047, "global_step": 44551, "epoch": 536} {"train_loss": -20.177608489990234, "global_step": 44552, "epoch": 536} {"train_loss": -19.58209228515625, "global_step": 44553, "epoch": 536} {"train_loss": -20.021713256835938, "global_step": 44554, "epoch": 536} {"train_loss": -19.30095100402832, "global_step": 44555, "epoch": 536} {"train_loss": -19.99134635925293, "global_step": 44556, "epoch": 536} {"train_loss": -19.57260513305664, "global_step": 44557, "epoch": 536} {"train_loss": -19.703489303588867, "global_step": 44558, "epoch": 536} {"train_loss": -19.979766845703125, "global_step": 44559, "epoch": 536} {"train_loss": -19.692705154418945, "global_step": 44560, "epoch": 536} {"train_loss": -19.762039184570312, "global_step": 44561, "epoch": 536} {"train_loss": -19.686920166015625, "global_step": 44562, "epoch": 536} {"train_loss": -19.606048583984375, "global_step": 44563, "epoch": 536} {"train_loss": -19.984508514404297, "global_step": 44564, "epoch": 536} {"train_loss": -19.701614379882812, "global_step": 44565, "epoch": 536} {"train_loss": -19.780271530151367, "global_step": 44566, "epoch": 536} {"train_loss": -19.811986923217773, "global_step": 44567, "epoch": 536} {"train_loss": -19.366971969604492, "global_step": 44568, "epoch": 536} {"train_loss": -19.62030601501465, "global_step": 44569, "epoch": 536} {"train_loss": -19.600555925484162, "global_step": 44570, "epoch": 536, "val_loss": 5815994.5} {"train_loss": -19.379446029663086, "global_step": 44571, "epoch": 537} {"train_loss": -19.97773551940918, "global_step": 44572, "epoch": 537} {"train_loss": -19.410446166992188, "global_step": 44573, "epoch": 537} {"train_loss": -19.424705505371094, "global_step": 44574, "epoch": 537} {"train_loss": -19.769588470458984, "global_step": 44575, "epoch": 537} {"train_loss": -19.724294662475586, "global_step": 44576, "epoch": 537} {"train_loss": -19.379104614257812, "global_step": 44577, "epoch": 537} {"train_loss": -19.94290542602539, "global_step": 44578, "epoch": 537} {"train_loss": -19.5844669342041, "global_step": 44579, "epoch": 537} {"train_loss": -19.529769897460938, "global_step": 44580, "epoch": 537} {"train_loss": -19.615468978881836, "global_step": 44581, "epoch": 537} {"train_loss": -19.65298843383789, "global_step": 44582, "epoch": 537} {"train_loss": -19.501718521118164, "global_step": 44583, "epoch": 537} {"train_loss": -19.783063888549805, "global_step": 44584, "epoch": 537} {"train_loss": -19.792762756347656, "global_step": 44585, "epoch": 537} {"train_loss": -19.832988739013672, "global_step": 44586, "epoch": 537} {"train_loss": -20.093765258789062, "global_step": 44587, "epoch": 537} {"train_loss": -19.571069717407227, "global_step": 44588, "epoch": 537} {"train_loss": -19.68331527709961, "global_step": 44589, "epoch": 537} {"train_loss": -19.481428146362305, "global_step": 44590, "epoch": 537} {"train_loss": -19.71830177307129, "global_step": 44591, "epoch": 537} {"train_loss": -19.45865821838379, "global_step": 44592, "epoch": 537} {"train_loss": -19.40983009338379, "global_step": 44593, "epoch": 537} {"train_loss": -19.520109176635742, "global_step": 44594, "epoch": 537} {"train_loss": -19.819759368896484, "global_step": 44595, "epoch": 537} {"train_loss": -19.251195907592773, "global_step": 44596, "epoch": 537} {"train_loss": -19.736906051635742, "global_step": 44597, "epoch": 537} {"train_loss": -19.290529251098633, "global_step": 44598, "epoch": 537} {"train_loss": -19.68802261352539, "global_step": 44599, "epoch": 537} {"train_loss": -19.501480102539062, "global_step": 44600, "epoch": 537} {"train_loss": -19.618240356445312, "global_step": 44601, "epoch": 537} {"train_loss": -19.662439346313477, "global_step": 44602, "epoch": 537} {"train_loss": -19.46788215637207, "global_step": 44603, "epoch": 537} {"train_loss": -19.504728317260742, "global_step": 44604, "epoch": 537} {"train_loss": -19.72562026977539, "global_step": 44605, "epoch": 537} {"train_loss": -19.64906883239746, "global_step": 44606, "epoch": 537} {"train_loss": -19.789812088012695, "global_step": 44607, "epoch": 537} {"train_loss": -19.520822525024414, "global_step": 44608, "epoch": 537} {"train_loss": -19.111331939697266, "global_step": 44609, "epoch": 537} {"train_loss": -19.918527603149414, "global_step": 44610, "epoch": 537} {"train_loss": -19.468883514404297, "global_step": 44611, "epoch": 537} {"train_loss": -19.423505783081055, "global_step": 44612, "epoch": 537} {"train_loss": -19.82063102722168, "global_step": 44613, "epoch": 537} {"train_loss": -19.497610092163086, "global_step": 44614, "epoch": 537} {"train_loss": -19.548521041870117, "global_step": 44615, "epoch": 537} {"train_loss": -19.497154235839844, "global_step": 44616, "epoch": 537} {"train_loss": -19.594778060913086, "global_step": 44617, "epoch": 537} {"train_loss": -19.779647827148438, "global_step": 44618, "epoch": 537} {"train_loss": -19.775075912475586, "global_step": 44619, "epoch": 537} {"train_loss": -19.933826446533203, "global_step": 44620, "epoch": 537} {"train_loss": -19.762954711914062, "global_step": 44621, "epoch": 537} {"train_loss": -19.78251075744629, "global_step": 44622, "epoch": 537} {"train_loss": -19.670608520507812, "global_step": 44623, "epoch": 537} {"train_loss": -19.07886505126953, "global_step": 44624, "epoch": 537} {"train_loss": -19.634016036987305, "global_step": 44625, "epoch": 537} {"train_loss": -19.037519454956055, "global_step": 44626, "epoch": 537} {"train_loss": -19.88260841369629, "global_step": 44627, "epoch": 537} {"train_loss": -19.54554557800293, "global_step": 44628, "epoch": 537} {"train_loss": -20.18891716003418, "global_step": 44629, "epoch": 537} {"train_loss": -20.008512496948242, "global_step": 44630, "epoch": 537} {"train_loss": -19.765092849731445, "global_step": 44631, "epoch": 537} {"train_loss": -19.775068283081055, "global_step": 44632, "epoch": 537} {"train_loss": -19.661439895629883, "global_step": 44633, "epoch": 537} {"train_loss": -19.763986587524414, "global_step": 44634, "epoch": 537} {"train_loss": -20.038061141967773, "global_step": 44635, "epoch": 537} {"train_loss": -19.407052993774414, "global_step": 44636, "epoch": 537} {"train_loss": -20.009084701538086, "global_step": 44637, "epoch": 537} {"train_loss": -19.71929359436035, "global_step": 44638, "epoch": 537} {"train_loss": -19.644577026367188, "global_step": 44639, "epoch": 537} {"train_loss": -19.564956665039062, "global_step": 44640, "epoch": 537} {"train_loss": -19.78000259399414, "global_step": 44641, "epoch": 537} {"train_loss": -19.70707130432129, "global_step": 44642, "epoch": 537} {"train_loss": -19.415220260620117, "global_step": 44643, "epoch": 537} {"train_loss": -19.439218521118164, "global_step": 44644, "epoch": 537} {"train_loss": -19.824542999267578, "global_step": 44645, "epoch": 537} {"train_loss": -19.548187255859375, "global_step": 44646, "epoch": 537} {"train_loss": -19.976682662963867, "global_step": 44647, "epoch": 537} {"train_loss": -20.121200561523438, "global_step": 44648, "epoch": 537} {"train_loss": -19.380748748779297, "global_step": 44649, "epoch": 537} {"train_loss": -19.73690414428711, "global_step": 44650, "epoch": 537} {"train_loss": -19.757497787475586, "global_step": 44651, "epoch": 537} {"train_loss": -19.87676239013672, "global_step": 44652, "epoch": 537} {"train_loss": -19.623364069375647, "global_step": 44653, "epoch": 537, "val_loss": 6013976.0} {"train_loss": -19.583839416503906, "global_step": 44654, "epoch": 538} {"train_loss": -19.55178451538086, "global_step": 44655, "epoch": 538} {"train_loss": -19.82379913330078, "global_step": 44656, "epoch": 538} {"train_loss": -19.106901168823242, "global_step": 44657, "epoch": 538} {"train_loss": -19.548641204833984, "global_step": 44658, "epoch": 538} {"train_loss": -19.2419490814209, "global_step": 44659, "epoch": 538} {"train_loss": -19.133995056152344, "global_step": 44660, "epoch": 538} {"train_loss": -19.88054084777832, "global_step": 44661, "epoch": 538} {"train_loss": -19.26411247253418, "global_step": 44662, "epoch": 538} {"train_loss": -19.609085083007812, "global_step": 44663, "epoch": 538} {"train_loss": -19.582685470581055, "global_step": 44664, "epoch": 538} {"train_loss": -19.367326736450195, "global_step": 44665, "epoch": 538} {"train_loss": -19.441434860229492, "global_step": 44666, "epoch": 538} {"train_loss": -19.542268753051758, "global_step": 44667, "epoch": 538} {"train_loss": -19.284177780151367, "global_step": 44668, "epoch": 538} {"train_loss": -19.81378173828125, "global_step": 44669, "epoch": 538} {"train_loss": -19.27918815612793, "global_step": 44670, "epoch": 538} {"train_loss": -19.451759338378906, "global_step": 44671, "epoch": 538} {"train_loss": -19.582807540893555, "global_step": 44672, "epoch": 538} {"train_loss": -19.417387008666992, "global_step": 44673, "epoch": 538} {"train_loss": -19.492782592773438, "global_step": 44674, "epoch": 538} {"train_loss": -20.00927734375, "global_step": 44675, "epoch": 538} {"train_loss": -19.82856559753418, "global_step": 44676, "epoch": 538} {"train_loss": -20.011770248413086, "global_step": 44677, "epoch": 538} {"train_loss": -19.47727394104004, "global_step": 44678, "epoch": 538} {"train_loss": -19.87604331970215, "global_step": 44679, "epoch": 538} {"train_loss": -19.81754493713379, "global_step": 44680, "epoch": 538} {"train_loss": -19.381528854370117, "global_step": 44681, "epoch": 538} {"train_loss": -19.694984436035156, "global_step": 44682, "epoch": 538} {"train_loss": -19.451383590698242, "global_step": 44683, "epoch": 538} {"train_loss": -19.545461654663086, "global_step": 44684, "epoch": 538} {"train_loss": -19.83397674560547, "global_step": 44685, "epoch": 538} {"train_loss": -19.686601638793945, "global_step": 44686, "epoch": 538} {"train_loss": -19.7000789642334, "global_step": 44687, "epoch": 538} {"train_loss": -19.40017318725586, "global_step": 44688, "epoch": 538} {"train_loss": -19.748220443725586, "global_step": 44689, "epoch": 538} {"train_loss": -19.98138999938965, "global_step": 44690, "epoch": 538} {"train_loss": -19.412757873535156, "global_step": 44691, "epoch": 538} {"train_loss": -19.921798706054688, "global_step": 44692, "epoch": 538} {"train_loss": -19.455015182495117, "global_step": 44693, "epoch": 538} {"train_loss": -19.692514419555664, "global_step": 44694, "epoch": 538} {"train_loss": -19.363447189331055, "global_step": 44695, "epoch": 538} {"train_loss": -19.519840240478516, "global_step": 44696, "epoch": 538} {"train_loss": -19.521770477294922, "global_step": 44697, "epoch": 538} {"train_loss": -20.12968635559082, "global_step": 44698, "epoch": 538} {"train_loss": -20.172300338745117, "global_step": 44699, "epoch": 538} {"train_loss": -19.937646865844727, "global_step": 44700, "epoch": 538} {"train_loss": -19.907678604125977, "global_step": 44701, "epoch": 538} {"train_loss": -19.827604293823242, "global_step": 44702, "epoch": 538} {"train_loss": -19.659570693969727, "global_step": 44703, "epoch": 538} {"train_loss": -19.75541877746582, "global_step": 44704, "epoch": 538} {"train_loss": -19.695804595947266, "global_step": 44705, "epoch": 538} {"train_loss": -19.857898712158203, "global_step": 44706, "epoch": 538} {"train_loss": -19.825464248657227, "global_step": 44707, "epoch": 538} {"train_loss": -19.720380783081055, "global_step": 44708, "epoch": 538} {"train_loss": -19.60887336730957, "global_step": 44709, "epoch": 538} {"train_loss": -19.539541244506836, "global_step": 44710, "epoch": 538} {"train_loss": -19.680879592895508, "global_step": 44711, "epoch": 538} {"train_loss": -19.758420944213867, "global_step": 44712, "epoch": 538} {"train_loss": -19.676977157592773, "global_step": 44713, "epoch": 538} {"train_loss": -19.98767852783203, "global_step": 44714, "epoch": 538} {"train_loss": -19.520803451538086, "global_step": 44715, "epoch": 538} {"train_loss": -19.78162384033203, "global_step": 44716, "epoch": 538} {"train_loss": -19.475317001342773, "global_step": 44717, "epoch": 538} {"train_loss": -19.66353988647461, "global_step": 44718, "epoch": 538} {"train_loss": -20.047269821166992, "global_step": 44719, "epoch": 538} {"train_loss": -19.904705047607422, "global_step": 44720, "epoch": 538} {"train_loss": -19.346206665039062, "global_step": 44721, "epoch": 538} {"train_loss": -19.75566864013672, "global_step": 44722, "epoch": 538} {"train_loss": -19.907440185546875, "global_step": 44723, "epoch": 538} {"train_loss": -19.535337448120117, "global_step": 44724, "epoch": 538} {"train_loss": -19.67807960510254, "global_step": 44725, "epoch": 538} {"train_loss": -19.909292221069336, "global_step": 44726, "epoch": 538} {"train_loss": -19.836017608642578, "global_step": 44727, "epoch": 538} {"train_loss": -19.5350399017334, "global_step": 44728, "epoch": 538} {"train_loss": -19.769027709960938, "global_step": 44729, "epoch": 538} {"train_loss": -19.595638275146484, "global_step": 44730, "epoch": 538} {"train_loss": -19.794042587280273, "global_step": 44731, "epoch": 538} {"train_loss": -19.632158279418945, "global_step": 44732, "epoch": 538} {"train_loss": -19.43739891052246, "global_step": 44733, "epoch": 538} {"train_loss": -19.535282135009766, "global_step": 44734, "epoch": 538} {"train_loss": -19.840295791625977, "global_step": 44735, "epoch": 538} {"train_loss": -19.661173694105035, "global_step": 44736, "epoch": 538, "val_loss": 5960821.0} {"train_loss": -19.462703704833984, "global_step": 44737, "epoch": 539} {"train_loss": -19.642026901245117, "global_step": 44738, "epoch": 539} {"train_loss": -19.913711547851562, "global_step": 44739, "epoch": 539} {"train_loss": -19.288434982299805, "global_step": 44740, "epoch": 539} {"train_loss": -19.77312660217285, "global_step": 44741, "epoch": 539} {"train_loss": -19.6783447265625, "global_step": 44742, "epoch": 539} {"train_loss": -19.474897384643555, "global_step": 44743, "epoch": 539} {"train_loss": -19.55352020263672, "global_step": 44744, "epoch": 539} {"train_loss": -19.853574752807617, "global_step": 44745, "epoch": 539} {"train_loss": -19.436084747314453, "global_step": 44746, "epoch": 539} {"train_loss": -19.92428970336914, "global_step": 44747, "epoch": 539} {"train_loss": -19.440433502197266, "global_step": 44748, "epoch": 539} {"train_loss": -19.380857467651367, "global_step": 44749, "epoch": 539} {"train_loss": -19.755102157592773, "global_step": 44750, "epoch": 539} {"train_loss": -19.4359130859375, "global_step": 44751, "epoch": 539} {"train_loss": -19.6657772064209, "global_step": 44752, "epoch": 539} {"train_loss": -19.697269439697266, "global_step": 44753, "epoch": 539} {"train_loss": -19.620670318603516, "global_step": 44754, "epoch": 539} {"train_loss": -19.469919204711914, "global_step": 44755, "epoch": 539} {"train_loss": -19.570764541625977, "global_step": 44756, "epoch": 539} {"train_loss": -19.4664363861084, "global_step": 44757, "epoch": 539} {"train_loss": -19.528499603271484, "global_step": 44758, "epoch": 539} {"train_loss": -19.530317306518555, "global_step": 44759, "epoch": 539} {"train_loss": -19.969358444213867, "global_step": 44760, "epoch": 539} {"train_loss": -19.720876693725586, "global_step": 44761, "epoch": 539} {"train_loss": -19.51898956298828, "global_step": 44762, "epoch": 539} {"train_loss": -19.662364959716797, "global_step": 44763, "epoch": 539} {"train_loss": -19.40195655822754, "global_step": 44764, "epoch": 539} {"train_loss": -19.849979400634766, "global_step": 44765, "epoch": 539} {"train_loss": -19.617290496826172, "global_step": 44766, "epoch": 539} {"train_loss": -20.12101173400879, "global_step": 44767, "epoch": 539} {"train_loss": -19.87171745300293, "global_step": 44768, "epoch": 539} {"train_loss": -19.56747817993164, "global_step": 44769, "epoch": 539} {"train_loss": -19.697195053100586, "global_step": 44770, "epoch": 539} {"train_loss": -19.92569923400879, "global_step": 44771, "epoch": 539} {"train_loss": -19.576025009155273, "global_step": 44772, "epoch": 539} {"train_loss": -19.718847274780273, "global_step": 44773, "epoch": 539} {"train_loss": -20.135717391967773, "global_step": 44774, "epoch": 539} {"train_loss": -19.80198860168457, "global_step": 44775, "epoch": 539} {"train_loss": -19.37955093383789, "global_step": 44776, "epoch": 539} {"train_loss": -19.434572219848633, "global_step": 44777, "epoch": 539} {"train_loss": -19.454730987548828, "global_step": 44778, "epoch": 539} {"train_loss": -19.74896240234375, "global_step": 44779, "epoch": 539} {"train_loss": -19.73933982849121, "global_step": 44780, "epoch": 539} {"train_loss": -19.548372268676758, "global_step": 44781, "epoch": 539} {"train_loss": -19.934228897094727, "global_step": 44782, "epoch": 539} {"train_loss": -19.772319793701172, "global_step": 44783, "epoch": 539} {"train_loss": -19.916927337646484, "global_step": 44784, "epoch": 539} {"train_loss": -19.350605010986328, "global_step": 44785, "epoch": 539} {"train_loss": -19.638883590698242, "global_step": 44786, "epoch": 539} {"train_loss": -19.861572265625, "global_step": 44787, "epoch": 539} {"train_loss": -19.795394897460938, "global_step": 44788, "epoch": 539} {"train_loss": -19.44679069519043, "global_step": 44789, "epoch": 539} {"train_loss": -19.68378257751465, "global_step": 44790, "epoch": 539} {"train_loss": -19.450254440307617, "global_step": 44791, "epoch": 539} {"train_loss": -19.743209838867188, "global_step": 44792, "epoch": 539} {"train_loss": -19.65740203857422, "global_step": 44793, "epoch": 539} {"train_loss": -19.32745361328125, "global_step": 44794, "epoch": 539} {"train_loss": -19.365264892578125, "global_step": 44795, "epoch": 539} {"train_loss": -19.72357177734375, "global_step": 44796, "epoch": 539} {"train_loss": -19.149564743041992, "global_step": 44797, "epoch": 539} {"train_loss": -19.7359676361084, "global_step": 44798, "epoch": 539} {"train_loss": -19.76279640197754, "global_step": 44799, "epoch": 539} {"train_loss": -19.637723922729492, "global_step": 44800, "epoch": 539} {"train_loss": -19.44099235534668, "global_step": 44801, "epoch": 539} {"train_loss": -19.598159790039062, "global_step": 44802, "epoch": 539} {"train_loss": -19.850149154663086, "global_step": 44803, "epoch": 539} {"train_loss": -19.614988327026367, "global_step": 44804, "epoch": 539} {"train_loss": -19.683605194091797, "global_step": 44805, "epoch": 539} {"train_loss": -19.988075256347656, "global_step": 44806, "epoch": 539} {"train_loss": -19.97203254699707, "global_step": 44807, "epoch": 539} {"train_loss": -19.69476890563965, "global_step": 44808, "epoch": 539} {"train_loss": -19.7335205078125, "global_step": 44809, "epoch": 539} {"train_loss": -19.7243709564209, "global_step": 44810, "epoch": 539} {"train_loss": -19.629974365234375, "global_step": 44811, "epoch": 539} {"train_loss": -20.077960968017578, "global_step": 44812, "epoch": 539} {"train_loss": -19.985458374023438, "global_step": 44813, "epoch": 539} {"train_loss": -19.840087890625, "global_step": 44814, "epoch": 539} {"train_loss": -19.84736442565918, "global_step": 44815, "epoch": 539} {"train_loss": -19.80765724182129, "global_step": 44816, "epoch": 539} {"train_loss": -19.757993698120117, "global_step": 44817, "epoch": 539} {"train_loss": -20.046201705932617, "global_step": 44818, "epoch": 539} {"train_loss": -19.652610801788697, "global_step": 44819, "epoch": 539, "val_loss": 6083012.0} {"train_loss": -19.614830017089844, "global_step": 44820, "epoch": 540} {"train_loss": -19.703405380249023, "global_step": 44821, "epoch": 540} {"train_loss": -19.440994262695312, "global_step": 44822, "epoch": 540} {"train_loss": -19.58742332458496, "global_step": 44823, "epoch": 540} {"train_loss": -19.558835983276367, "global_step": 44824, "epoch": 540} {"train_loss": -19.1513671875, "global_step": 44825, "epoch": 540} {"train_loss": -19.873456954956055, "global_step": 44826, "epoch": 540} {"train_loss": -19.854028701782227, "global_step": 44827, "epoch": 540} {"train_loss": -19.623315811157227, "global_step": 44828, "epoch": 540} {"train_loss": -19.915119171142578, "global_step": 44829, "epoch": 540} {"train_loss": -19.8618106842041, "global_step": 44830, "epoch": 540} {"train_loss": -19.71681785583496, "global_step": 44831, "epoch": 540} {"train_loss": -19.500015258789062, "global_step": 44832, "epoch": 540} {"train_loss": -19.488012313842773, "global_step": 44833, "epoch": 540} {"train_loss": -19.793272018432617, "global_step": 44834, "epoch": 540} {"train_loss": -19.600244522094727, "global_step": 44835, "epoch": 540} {"train_loss": -19.51034164428711, "global_step": 44836, "epoch": 540} {"train_loss": -19.734603881835938, "global_step": 44837, "epoch": 540} {"train_loss": -19.649412155151367, "global_step": 44838, "epoch": 540} {"train_loss": -19.548402786254883, "global_step": 44839, "epoch": 540} {"train_loss": -19.45050048828125, "global_step": 44840, "epoch": 540} {"train_loss": -19.56614112854004, "global_step": 44841, "epoch": 540} {"train_loss": -19.78545570373535, "global_step": 44842, "epoch": 540} {"train_loss": -19.624378204345703, "global_step": 44843, "epoch": 540} {"train_loss": -19.83063316345215, "global_step": 44844, "epoch": 540} {"train_loss": -19.652135848999023, "global_step": 44845, "epoch": 540} {"train_loss": -19.15236473083496, "global_step": 44846, "epoch": 540} {"train_loss": -19.91147804260254, "global_step": 44847, "epoch": 540} {"train_loss": -19.57285499572754, "global_step": 44848, "epoch": 540} {"train_loss": -19.958478927612305, "global_step": 44849, "epoch": 540} {"train_loss": -19.74823760986328, "global_step": 44850, "epoch": 540} {"train_loss": -19.394521713256836, "global_step": 44851, "epoch": 540} {"train_loss": -19.94870376586914, "global_step": 44852, "epoch": 540} {"train_loss": -19.911184310913086, "global_step": 44853, "epoch": 540} {"train_loss": -19.27631187438965, "global_step": 44854, "epoch": 540} {"train_loss": -20.05792808532715, "global_step": 44855, "epoch": 540} {"train_loss": -19.34113121032715, "global_step": 44856, "epoch": 540} {"train_loss": -19.660314559936523, "global_step": 44857, "epoch": 540} {"train_loss": -19.568824768066406, "global_step": 44858, "epoch": 540} {"train_loss": -19.87090492248535, "global_step": 44859, "epoch": 540} {"train_loss": -19.745927810668945, "global_step": 44860, "epoch": 540} {"train_loss": -19.62198257446289, "global_step": 44861, "epoch": 540} {"train_loss": -19.713623046875, "global_step": 44862, "epoch": 540} {"train_loss": -19.554218292236328, "global_step": 44863, "epoch": 540} {"train_loss": -19.829526901245117, "global_step": 44864, "epoch": 540} {"train_loss": -19.72873878479004, "global_step": 44865, "epoch": 540} {"train_loss": -19.63113021850586, "global_step": 44866, "epoch": 540} {"train_loss": -19.795801162719727, "global_step": 44867, "epoch": 540} {"train_loss": -19.52275276184082, "global_step": 44868, "epoch": 540} {"train_loss": -19.739912033081055, "global_step": 44869, "epoch": 540} {"train_loss": -19.279277801513672, "global_step": 44870, "epoch": 540} {"train_loss": -19.602087020874023, "global_step": 44871, "epoch": 540} {"train_loss": -19.41961669921875, "global_step": 44872, "epoch": 540} {"train_loss": -19.505569458007812, "global_step": 44873, "epoch": 540} {"train_loss": -19.61580467224121, "global_step": 44874, "epoch": 540} {"train_loss": -19.73917579650879, "global_step": 44875, "epoch": 540} {"train_loss": -20.114500045776367, "global_step": 44876, "epoch": 540} {"train_loss": -20.200143814086914, "global_step": 44877, "epoch": 540} {"train_loss": -19.667497634887695, "global_step": 44878, "epoch": 540} {"train_loss": -19.649282455444336, "global_step": 44879, "epoch": 540} {"train_loss": -19.466224670410156, "global_step": 44880, "epoch": 540} {"train_loss": -19.698974609375, "global_step": 44881, "epoch": 540} {"train_loss": -19.094629287719727, "global_step": 44882, "epoch": 540} {"train_loss": -19.467294692993164, "global_step": 44883, "epoch": 540} {"train_loss": -19.462785720825195, "global_step": 44884, "epoch": 540} {"train_loss": -19.786388397216797, "global_step": 44885, "epoch": 540} {"train_loss": -19.791547775268555, "global_step": 44886, "epoch": 540} {"train_loss": -19.74886131286621, "global_step": 44887, "epoch": 540} {"train_loss": -19.421972274780273, "global_step": 44888, "epoch": 540} {"train_loss": -19.569665908813477, "global_step": 44889, "epoch": 540} {"train_loss": -19.543899536132812, "global_step": 44890, "epoch": 540} {"train_loss": -19.426441192626953, "global_step": 44891, "epoch": 540} {"train_loss": -19.973066329956055, "global_step": 44892, "epoch": 540} {"train_loss": -19.68946647644043, "global_step": 44893, "epoch": 540} {"train_loss": -19.77584457397461, "global_step": 44894, "epoch": 540} {"train_loss": -19.616561889648438, "global_step": 44895, "epoch": 540} {"train_loss": -19.274259567260742, "global_step": 44896, "epoch": 540} {"train_loss": -19.74755859375, "global_step": 44897, "epoch": 540} {"train_loss": -19.714059829711914, "global_step": 44898, "epoch": 540} {"train_loss": -19.646642684936523, "global_step": 44899, "epoch": 540} {"train_loss": -19.816776275634766, "global_step": 44900, "epoch": 540} {"train_loss": -19.859363555908203, "global_step": 44901, "epoch": 540} {"train_loss": -19.661080578723585, "global_step": 44902, "epoch": 540, "val_loss": 6041480.0} {"train_loss": -19.353336334228516, "global_step": 44903, "epoch": 541} {"train_loss": -19.3287353515625, "global_step": 44904, "epoch": 541} {"train_loss": -19.440073013305664, "global_step": 44905, "epoch": 541} {"train_loss": -19.409231185913086, "global_step": 44906, "epoch": 541} {"train_loss": -19.692541122436523, "global_step": 44907, "epoch": 541} {"train_loss": -19.18535614013672, "global_step": 44908, "epoch": 541} {"train_loss": -19.397663116455078, "global_step": 44909, "epoch": 541} {"train_loss": -19.56266212463379, "global_step": 44910, "epoch": 541} {"train_loss": -19.431713104248047, "global_step": 44911, "epoch": 541} {"train_loss": -19.852567672729492, "global_step": 44912, "epoch": 541} {"train_loss": -19.821924209594727, "global_step": 44913, "epoch": 541} {"train_loss": -19.49283218383789, "global_step": 44914, "epoch": 541} {"train_loss": -19.782108306884766, "global_step": 44915, "epoch": 541} {"train_loss": -19.97234344482422, "global_step": 44916, "epoch": 541} {"train_loss": -19.757049560546875, "global_step": 44917, "epoch": 541} {"train_loss": -20.07709312438965, "global_step": 44918, "epoch": 541} {"train_loss": -19.53135108947754, "global_step": 44919, "epoch": 541} {"train_loss": -19.714269638061523, "global_step": 44920, "epoch": 541} {"train_loss": -19.549509048461914, "global_step": 44921, "epoch": 541} {"train_loss": -19.770936965942383, "global_step": 44922, "epoch": 541} {"train_loss": -19.894922256469727, "global_step": 44923, "epoch": 541} {"train_loss": -20.03076171875, "global_step": 44924, "epoch": 541} {"train_loss": -19.696870803833008, "global_step": 44925, "epoch": 541} {"train_loss": -19.688146591186523, "global_step": 44926, "epoch": 541} {"train_loss": -19.81137466430664, "global_step": 44927, "epoch": 541} {"train_loss": -19.578195571899414, "global_step": 44928, "epoch": 541} {"train_loss": -19.591474533081055, "global_step": 44929, "epoch": 541} {"train_loss": -19.702489852905273, "global_step": 44930, "epoch": 541} {"train_loss": -19.553281784057617, "global_step": 44931, "epoch": 541} {"train_loss": -19.989347457885742, "global_step": 44932, "epoch": 541} {"train_loss": -19.67978286743164, "global_step": 44933, "epoch": 541} {"train_loss": -19.746158599853516, "global_step": 44934, "epoch": 541} {"train_loss": -19.9287052154541, "global_step": 44935, "epoch": 541} {"train_loss": -19.576879501342773, "global_step": 44936, "epoch": 541} {"train_loss": -19.690994262695312, "global_step": 44937, "epoch": 541} {"train_loss": -19.837934494018555, "global_step": 44938, "epoch": 541} {"train_loss": -19.76584243774414, "global_step": 44939, "epoch": 541} {"train_loss": -19.729196548461914, "global_step": 44940, "epoch": 541} {"train_loss": -19.824460983276367, "global_step": 44941, "epoch": 541} {"train_loss": -19.411481857299805, "global_step": 44942, "epoch": 541} {"train_loss": -19.804349899291992, "global_step": 44943, "epoch": 541} {"train_loss": -19.92600440979004, "global_step": 44944, "epoch": 541} {"train_loss": -19.819494247436523, "global_step": 44945, "epoch": 541} {"train_loss": -19.583433151245117, "global_step": 44946, "epoch": 541} {"train_loss": -19.795156478881836, "global_step": 44947, "epoch": 541} {"train_loss": -19.728931427001953, "global_step": 44948, "epoch": 541} {"train_loss": -19.78456687927246, "global_step": 44949, "epoch": 541} {"train_loss": -19.805931091308594, "global_step": 44950, "epoch": 541} {"train_loss": -19.78493881225586, "global_step": 44951, "epoch": 541} {"train_loss": -19.989999771118164, "global_step": 44952, "epoch": 541} {"train_loss": -19.3493709564209, "global_step": 44953, "epoch": 541} {"train_loss": -19.69915199279785, "global_step": 44954, "epoch": 541} {"train_loss": -19.81806755065918, "global_step": 44955, "epoch": 541} {"train_loss": -20.031173706054688, "global_step": 44956, "epoch": 541} {"train_loss": -19.645309448242188, "global_step": 44957, "epoch": 541} {"train_loss": -19.595849990844727, "global_step": 44958, "epoch": 541} {"train_loss": -19.64462661743164, "global_step": 44959, "epoch": 541} {"train_loss": -19.942529678344727, "global_step": 44960, "epoch": 541} {"train_loss": -19.770978927612305, "global_step": 44961, "epoch": 541} {"train_loss": -19.827970504760742, "global_step": 44962, "epoch": 541} {"train_loss": -19.148151397705078, "global_step": 44963, "epoch": 541} {"train_loss": -19.7169246673584, "global_step": 44964, "epoch": 541} {"train_loss": -19.508560180664062, "global_step": 44965, "epoch": 541} {"train_loss": -19.76654052734375, "global_step": 44966, "epoch": 541} {"train_loss": -19.7052059173584, "global_step": 44967, "epoch": 541} {"train_loss": -19.797073364257812, "global_step": 44968, "epoch": 541} {"train_loss": -19.661344528198242, "global_step": 44969, "epoch": 541} {"train_loss": -19.735862731933594, "global_step": 44970, "epoch": 541} {"train_loss": -19.763465881347656, "global_step": 44971, "epoch": 541} {"train_loss": -19.814544677734375, "global_step": 44972, "epoch": 541} {"train_loss": -19.953121185302734, "global_step": 44973, "epoch": 541} {"train_loss": -19.74262046813965, "global_step": 44974, "epoch": 541} {"train_loss": -19.594505310058594, "global_step": 44975, "epoch": 541} {"train_loss": -19.701026916503906, "global_step": 44976, "epoch": 541} {"train_loss": -19.793834686279297, "global_step": 44977, "epoch": 541} {"train_loss": -19.681867599487305, "global_step": 44978, "epoch": 541} {"train_loss": -19.589059829711914, "global_step": 44979, "epoch": 541} {"train_loss": -20.064016342163086, "global_step": 44980, "epoch": 541} {"train_loss": -19.748075485229492, "global_step": 44981, "epoch": 541} {"train_loss": -19.545766830444336, "global_step": 44982, "epoch": 541} {"train_loss": -19.66065788269043, "global_step": 44983, "epoch": 541} {"train_loss": -19.845075607299805, "global_step": 44984, "epoch": 541} {"train_loss": -19.72347843216126, "global_step": 44985, "epoch": 541, "val_loss": 6018766.5} {"train_loss": -19.423110961914062, "global_step": 44986, "epoch": 542} {"train_loss": -19.07572364807129, "global_step": 44987, "epoch": 542} {"train_loss": -19.623699188232422, "global_step": 44988, "epoch": 542} {"train_loss": -19.42222023010254, "global_step": 44989, "epoch": 542} {"train_loss": -19.142675399780273, "global_step": 44990, "epoch": 542} {"train_loss": -19.630016326904297, "global_step": 44991, "epoch": 542} {"train_loss": -19.540935516357422, "global_step": 44992, "epoch": 542} {"train_loss": -19.74532699584961, "global_step": 44993, "epoch": 542} {"train_loss": -19.684091567993164, "global_step": 44994, "epoch": 542} {"train_loss": -19.890287399291992, "global_step": 44995, "epoch": 542} {"train_loss": -19.550643920898438, "global_step": 44996, "epoch": 542} {"train_loss": -19.57264518737793, "global_step": 44997, "epoch": 542} {"train_loss": -19.54936408996582, "global_step": 44998, "epoch": 542} {"train_loss": -19.307708740234375, "global_step": 44999, "epoch": 542} {"train_loss": -19.610078811645508, "global_step": 45000, "epoch": 542} {"train_loss": -19.822568893432617, "global_step": 45001, "epoch": 542} {"train_loss": -19.39984703063965, "global_step": 45002, "epoch": 542} {"train_loss": -19.818531036376953, "global_step": 45003, "epoch": 542} {"train_loss": -19.408037185668945, "global_step": 45004, "epoch": 542} {"train_loss": -19.76973533630371, "global_step": 45005, "epoch": 542} {"train_loss": -19.50459098815918, "global_step": 45006, "epoch": 542} {"train_loss": -19.934541702270508, "global_step": 45007, "epoch": 542} {"train_loss": -19.620159149169922, "global_step": 45008, "epoch": 542} {"train_loss": -19.512924194335938, "global_step": 45009, "epoch": 542} {"train_loss": -19.64179039001465, "global_step": 45010, "epoch": 542} {"train_loss": -19.380075454711914, "global_step": 45011, "epoch": 542} {"train_loss": -19.897083282470703, "global_step": 45012, "epoch": 542} {"train_loss": -19.3955078125, "global_step": 45013, "epoch": 542} {"train_loss": -19.99014663696289, "global_step": 45014, "epoch": 542} {"train_loss": -19.63068962097168, "global_step": 45015, "epoch": 542} {"train_loss": -19.32868766784668, "global_step": 45016, "epoch": 542} {"train_loss": -19.533727645874023, "global_step": 45017, "epoch": 542} {"train_loss": -19.869552612304688, "global_step": 45018, "epoch": 542} {"train_loss": -19.536054611206055, "global_step": 45019, "epoch": 542} {"train_loss": -19.714120864868164, "global_step": 45020, "epoch": 542} {"train_loss": -19.484678268432617, "global_step": 45021, "epoch": 542} {"train_loss": -19.627771377563477, "global_step": 45022, "epoch": 542} {"train_loss": -19.703113555908203, "global_step": 45023, "epoch": 542} {"train_loss": -19.315967559814453, "global_step": 45024, "epoch": 542} {"train_loss": -19.692977905273438, "global_step": 45025, "epoch": 542} {"train_loss": -19.630781173706055, "global_step": 45026, "epoch": 542} {"train_loss": -19.64592742919922, "global_step": 45027, "epoch": 542} {"train_loss": -19.67177391052246, "global_step": 45028, "epoch": 542} {"train_loss": -19.6511287689209, "global_step": 45029, "epoch": 542} {"train_loss": -19.693984985351562, "global_step": 45030, "epoch": 542} {"train_loss": -19.600563049316406, "global_step": 45031, "epoch": 542} {"train_loss": -19.796018600463867, "global_step": 45032, "epoch": 542} {"train_loss": -19.51766014099121, "global_step": 45033, "epoch": 542} {"train_loss": -19.651187896728516, "global_step": 45034, "epoch": 542} {"train_loss": -19.598196029663086, "global_step": 45035, "epoch": 542} {"train_loss": -19.666259765625, "global_step": 45036, "epoch": 542} {"train_loss": -19.070524215698242, "global_step": 45037, "epoch": 542} {"train_loss": -19.380704879760742, "global_step": 45038, "epoch": 542} {"train_loss": -19.649473190307617, "global_step": 45039, "epoch": 542} {"train_loss": -19.17576026916504, "global_step": 45040, "epoch": 542} {"train_loss": -19.87592887878418, "global_step": 45041, "epoch": 542} {"train_loss": -19.674875259399414, "global_step": 45042, "epoch": 542} {"train_loss": -19.822525024414062, "global_step": 45043, "epoch": 542} {"train_loss": -20.039884567260742, "global_step": 45044, "epoch": 542} {"train_loss": -19.88764762878418, "global_step": 45045, "epoch": 542} {"train_loss": -19.649486541748047, "global_step": 45046, "epoch": 542} {"train_loss": -20.011627197265625, "global_step": 45047, "epoch": 542} {"train_loss": -19.508514404296875, "global_step": 45048, "epoch": 542} {"train_loss": -19.311248779296875, "global_step": 45049, "epoch": 542} {"train_loss": -20.229787826538086, "global_step": 45050, "epoch": 542} {"train_loss": -19.621946334838867, "global_step": 45051, "epoch": 542} {"train_loss": -20.319564819335938, "global_step": 45052, "epoch": 542} {"train_loss": -19.859970092773438, "global_step": 45053, "epoch": 542} {"train_loss": -19.751646041870117, "global_step": 45054, "epoch": 542} {"train_loss": -19.850534439086914, "global_step": 45055, "epoch": 542} {"train_loss": -19.563079833984375, "global_step": 45056, "epoch": 542} {"train_loss": -19.790298461914062, "global_step": 45057, "epoch": 542} {"train_loss": -19.421510696411133, "global_step": 45058, "epoch": 542} {"train_loss": -19.90177345275879, "global_step": 45059, "epoch": 542} {"train_loss": -19.2480411529541, "global_step": 45060, "epoch": 542} {"train_loss": -19.945911407470703, "global_step": 45061, "epoch": 542} {"train_loss": -19.686399459838867, "global_step": 45062, "epoch": 542} {"train_loss": -19.763107299804688, "global_step": 45063, "epoch": 542} {"train_loss": -19.829452514648438, "global_step": 45064, "epoch": 542} {"train_loss": -19.488510131835938, "global_step": 45065, "epoch": 542} {"train_loss": -19.686491012573242, "global_step": 45066, "epoch": 542} {"train_loss": -19.442554473876953, "global_step": 45067, "epoch": 542} {"train_loss": -19.621501371084925, "global_step": 45068, "epoch": 542, "val_loss": 5954562.0} {"train_loss": -19.50453758239746, "global_step": 45069, "epoch": 543} {"train_loss": -19.249469757080078, "global_step": 45070, "epoch": 543} {"train_loss": -19.50680923461914, "global_step": 45071, "epoch": 543} {"train_loss": -19.39808464050293, "global_step": 45072, "epoch": 543} {"train_loss": -19.469642639160156, "global_step": 45073, "epoch": 543} {"train_loss": -19.22016143798828, "global_step": 45074, "epoch": 543} {"train_loss": -19.969839096069336, "global_step": 45075, "epoch": 543} {"train_loss": -19.578027725219727, "global_step": 45076, "epoch": 543} {"train_loss": -19.537643432617188, "global_step": 45077, "epoch": 543} {"train_loss": -19.518203735351562, "global_step": 45078, "epoch": 543} {"train_loss": -19.31813621520996, "global_step": 45079, "epoch": 543} {"train_loss": -19.597936630249023, "global_step": 45080, "epoch": 543} {"train_loss": -19.717607498168945, "global_step": 45081, "epoch": 543} {"train_loss": -19.695396423339844, "global_step": 45082, "epoch": 543} {"train_loss": -19.668386459350586, "global_step": 45083, "epoch": 543} {"train_loss": -19.688852310180664, "global_step": 45084, "epoch": 543} {"train_loss": -19.58396339416504, "global_step": 45085, "epoch": 543} {"train_loss": -19.69111442565918, "global_step": 45086, "epoch": 543} {"train_loss": -19.705671310424805, "global_step": 45087, "epoch": 543} {"train_loss": -19.760282516479492, "global_step": 45088, "epoch": 543} {"train_loss": -19.660123825073242, "global_step": 45089, "epoch": 543} {"train_loss": -19.76515769958496, "global_step": 45090, "epoch": 543} {"train_loss": -19.693330764770508, "global_step": 45091, "epoch": 543} {"train_loss": -19.77396011352539, "global_step": 45092, "epoch": 543} {"train_loss": -19.880268096923828, "global_step": 45093, "epoch": 543} {"train_loss": -19.470951080322266, "global_step": 45094, "epoch": 543} {"train_loss": -19.765422821044922, "global_step": 45095, "epoch": 543} {"train_loss": -19.892963409423828, "global_step": 45096, "epoch": 543} {"train_loss": -19.687143325805664, "global_step": 45097, "epoch": 543} {"train_loss": -19.886554718017578, "global_step": 45098, "epoch": 543} {"train_loss": -19.955066680908203, "global_step": 45099, "epoch": 543} {"train_loss": -19.912351608276367, "global_step": 45100, "epoch": 543} {"train_loss": -19.72426414489746, "global_step": 45101, "epoch": 543} {"train_loss": -19.89641761779785, "global_step": 45102, "epoch": 543} {"train_loss": -19.322216033935547, "global_step": 45103, "epoch": 543} {"train_loss": -19.558547973632812, "global_step": 45104, "epoch": 543} {"train_loss": -19.727073669433594, "global_step": 45105, "epoch": 543} {"train_loss": -19.875534057617188, "global_step": 45106, "epoch": 543} {"train_loss": -19.44522476196289, "global_step": 45107, "epoch": 543} {"train_loss": -19.496219635009766, "global_step": 45108, "epoch": 543} {"train_loss": -19.375995635986328, "global_step": 45109, "epoch": 543} {"train_loss": -19.377859115600586, "global_step": 45110, "epoch": 543} {"train_loss": -19.686147689819336, "global_step": 45111, "epoch": 543} {"train_loss": -19.63735008239746, "global_step": 45112, "epoch": 543} {"train_loss": -19.907594680786133, "global_step": 45113, "epoch": 543} {"train_loss": -19.797212600708008, "global_step": 45114, "epoch": 543} {"train_loss": -19.98552131652832, "global_step": 45115, "epoch": 543} {"train_loss": -19.617422103881836, "global_step": 45116, "epoch": 543} {"train_loss": -19.86149024963379, "global_step": 45117, "epoch": 543} {"train_loss": -19.518692016601562, "global_step": 45118, "epoch": 543} {"train_loss": -19.696308135986328, "global_step": 45119, "epoch": 543} {"train_loss": -19.840253829956055, "global_step": 45120, "epoch": 543} {"train_loss": -19.55116844177246, "global_step": 45121, "epoch": 543} {"train_loss": -19.8679256439209, "global_step": 45122, "epoch": 543} {"train_loss": -19.528772354125977, "global_step": 45123, "epoch": 543} {"train_loss": -19.926523208618164, "global_step": 45124, "epoch": 543} {"train_loss": -19.959157943725586, "global_step": 45125, "epoch": 543} {"train_loss": -19.406278610229492, "global_step": 45126, "epoch": 543} {"train_loss": -19.464191436767578, "global_step": 45127, "epoch": 543} {"train_loss": -19.61445426940918, "global_step": 45128, "epoch": 543} {"train_loss": -19.517332077026367, "global_step": 45129, "epoch": 543} {"train_loss": -19.487815856933594, "global_step": 45130, "epoch": 543} {"train_loss": -19.986318588256836, "global_step": 45131, "epoch": 543} {"train_loss": -19.46807861328125, "global_step": 45132, "epoch": 543} {"train_loss": -19.559329986572266, "global_step": 45133, "epoch": 543} {"train_loss": -19.85316276550293, "global_step": 45134, "epoch": 543} {"train_loss": -19.19642448425293, "global_step": 45135, "epoch": 543} {"train_loss": -19.808578491210938, "global_step": 45136, "epoch": 543} {"train_loss": -19.419994354248047, "global_step": 45137, "epoch": 543} {"train_loss": -19.760425567626953, "global_step": 45138, "epoch": 543} {"train_loss": -19.748065948486328, "global_step": 45139, "epoch": 543} {"train_loss": -19.687665939331055, "global_step": 45140, "epoch": 543} {"train_loss": -19.768686294555664, "global_step": 45141, "epoch": 543} {"train_loss": -19.97239875793457, "global_step": 45142, "epoch": 543} {"train_loss": -19.991235733032227, "global_step": 45143, "epoch": 543} {"train_loss": -19.468130111694336, "global_step": 45144, "epoch": 543} {"train_loss": -19.694183349609375, "global_step": 45145, "epoch": 543} {"train_loss": -19.872806549072266, "global_step": 45146, "epoch": 543} {"train_loss": -19.38726806640625, "global_step": 45147, "epoch": 543} {"train_loss": -19.529434204101562, "global_step": 45148, "epoch": 543} {"train_loss": -19.667736053466797, "global_step": 45149, "epoch": 543} {"train_loss": -19.59889793395996, "global_step": 45150, "epoch": 543} {"train_loss": -19.67008016195642, "global_step": 45151, "epoch": 543, "val_loss": 5938573.5} {"train_loss": -19.428457260131836, "global_step": 45152, "epoch": 544} {"train_loss": -19.459428787231445, "global_step": 45153, "epoch": 544} {"train_loss": -19.069625854492188, "global_step": 45154, "epoch": 544} {"train_loss": -19.675527572631836, "global_step": 45155, "epoch": 544} {"train_loss": -19.32416343688965, "global_step": 45156, "epoch": 544} {"train_loss": -19.08078384399414, "global_step": 45157, "epoch": 544} {"train_loss": -19.8255558013916, "global_step": 45158, "epoch": 544} {"train_loss": -19.078306198120117, "global_step": 45159, "epoch": 544} {"train_loss": -19.49940299987793, "global_step": 45160, "epoch": 544} {"train_loss": -19.154775619506836, "global_step": 45161, "epoch": 544} {"train_loss": -19.69390869140625, "global_step": 45162, "epoch": 544} {"train_loss": -19.811241149902344, "global_step": 45163, "epoch": 544} {"train_loss": -19.7819881439209, "global_step": 45164, "epoch": 544} {"train_loss": -19.940114974975586, "global_step": 45165, "epoch": 544} {"train_loss": -19.663923263549805, "global_step": 45166, "epoch": 544} {"train_loss": -19.649402618408203, "global_step": 45167, "epoch": 544} {"train_loss": -20.020462036132812, "global_step": 45168, "epoch": 544} {"train_loss": -19.596813201904297, "global_step": 45169, "epoch": 544} {"train_loss": -19.916969299316406, "global_step": 45170, "epoch": 544} {"train_loss": -19.771947860717773, "global_step": 45171, "epoch": 544} {"train_loss": -19.83054542541504, "global_step": 45172, "epoch": 544} {"train_loss": -19.85978889465332, "global_step": 45173, "epoch": 544} {"train_loss": -19.446958541870117, "global_step": 45174, "epoch": 544} {"train_loss": -19.694263458251953, "global_step": 45175, "epoch": 544} {"train_loss": -20.18536949157715, "global_step": 45176, "epoch": 544} {"train_loss": -19.873632431030273, "global_step": 45177, "epoch": 544} {"train_loss": -19.938940048217773, "global_step": 45178, "epoch": 544} {"train_loss": -19.38473892211914, "global_step": 45179, "epoch": 544} {"train_loss": -19.740636825561523, "global_step": 45180, "epoch": 544} {"train_loss": -19.630613327026367, "global_step": 45181, "epoch": 544} {"train_loss": -19.597518920898438, "global_step": 45182, "epoch": 544} {"train_loss": -19.53400993347168, "global_step": 45183, "epoch": 544} {"train_loss": -19.669330596923828, "global_step": 45184, "epoch": 544} {"train_loss": -19.824268341064453, "global_step": 45185, "epoch": 544} {"train_loss": -19.661834716796875, "global_step": 45186, "epoch": 544} {"train_loss": -19.982709884643555, "global_step": 45187, "epoch": 544} {"train_loss": -19.593626022338867, "global_step": 45188, "epoch": 544} {"train_loss": -19.95438575744629, "global_step": 45189, "epoch": 544} {"train_loss": -19.695051193237305, "global_step": 45190, "epoch": 544} {"train_loss": -19.58391761779785, "global_step": 45191, "epoch": 544} {"train_loss": -19.884498596191406, "global_step": 45192, "epoch": 544} {"train_loss": -19.659564971923828, "global_step": 45193, "epoch": 544} {"train_loss": -19.632593154907227, "global_step": 45194, "epoch": 544} {"train_loss": -19.710651397705078, "global_step": 45195, "epoch": 544} {"train_loss": -19.832548141479492, "global_step": 45196, "epoch": 544} {"train_loss": -20.09735107421875, "global_step": 45197, "epoch": 544} {"train_loss": -19.651798248291016, "global_step": 45198, "epoch": 544} {"train_loss": -19.8482666015625, "global_step": 45199, "epoch": 544} {"train_loss": -19.55852508544922, "global_step": 45200, "epoch": 544} {"train_loss": -19.521841049194336, "global_step": 45201, "epoch": 544} {"train_loss": -19.876041412353516, "global_step": 45202, "epoch": 544} {"train_loss": -19.785123825073242, "global_step": 45203, "epoch": 544} {"train_loss": -19.924772262573242, "global_step": 45204, "epoch": 544} {"train_loss": -19.334983825683594, "global_step": 45205, "epoch": 544} {"train_loss": -19.63072395324707, "global_step": 45206, "epoch": 544} {"train_loss": -19.31245231628418, "global_step": 45207, "epoch": 544} {"train_loss": -19.468297958374023, "global_step": 45208, "epoch": 544} {"train_loss": -19.40921401977539, "global_step": 45209, "epoch": 544} {"train_loss": -19.408416748046875, "global_step": 45210, "epoch": 544} {"train_loss": -19.202756881713867, "global_step": 45211, "epoch": 544} {"train_loss": -19.716543197631836, "global_step": 45212, "epoch": 544} {"train_loss": -19.796283721923828, "global_step": 45213, "epoch": 544} {"train_loss": -19.743207931518555, "global_step": 45214, "epoch": 544} {"train_loss": -19.437368392944336, "global_step": 45215, "epoch": 544} {"train_loss": -19.851465225219727, "global_step": 45216, "epoch": 544} {"train_loss": -19.777585983276367, "global_step": 45217, "epoch": 544} {"train_loss": -19.69569206237793, "global_step": 45218, "epoch": 544} {"train_loss": -19.624826431274414, "global_step": 45219, "epoch": 544} {"train_loss": -19.788156509399414, "global_step": 45220, "epoch": 544} {"train_loss": -19.42902183532715, "global_step": 45221, "epoch": 544} {"train_loss": -19.60017967224121, "global_step": 45222, "epoch": 544} {"train_loss": -19.82607650756836, "global_step": 45223, "epoch": 544} {"train_loss": -19.769582748413086, "global_step": 45224, "epoch": 544} {"train_loss": -19.667022705078125, "global_step": 45225, "epoch": 544} {"train_loss": -19.5537052154541, "global_step": 45226, "epoch": 544} {"train_loss": -19.799076080322266, "global_step": 45227, "epoch": 544} {"train_loss": -19.402868270874023, "global_step": 45228, "epoch": 544} {"train_loss": -19.89082908630371, "global_step": 45229, "epoch": 544} {"train_loss": -19.66631317138672, "global_step": 45230, "epoch": 544} {"train_loss": -19.51923942565918, "global_step": 45231, "epoch": 544} {"train_loss": -19.666574478149414, "global_step": 45232, "epoch": 544} {"train_loss": -19.776187896728516, "global_step": 45233, "epoch": 544} {"train_loss": -19.634786054312464, "global_step": 45234, "epoch": 544, "val_loss": 6004974.0} {"train_loss": -19.239728927612305, "global_step": 45235, "epoch": 545} {"train_loss": -19.55824089050293, "global_step": 45236, "epoch": 545} {"train_loss": -19.42807388305664, "global_step": 45237, "epoch": 545} {"train_loss": -19.5627498626709, "global_step": 45238, "epoch": 545} {"train_loss": -19.905805587768555, "global_step": 45239, "epoch": 545} {"train_loss": -19.678247451782227, "global_step": 45240, "epoch": 545} {"train_loss": -19.728107452392578, "global_step": 45241, "epoch": 545} {"train_loss": -19.344030380249023, "global_step": 45242, "epoch": 545} {"train_loss": -19.481801986694336, "global_step": 45243, "epoch": 545} {"train_loss": -19.8012752532959, "global_step": 45244, "epoch": 545} {"train_loss": -19.736572265625, "global_step": 45245, "epoch": 545} {"train_loss": -19.876874923706055, "global_step": 45246, "epoch": 545} {"train_loss": -19.743764877319336, "global_step": 45247, "epoch": 545} {"train_loss": -19.993921279907227, "global_step": 45248, "epoch": 545} {"train_loss": -19.729290008544922, "global_step": 45249, "epoch": 545} {"train_loss": -19.610380172729492, "global_step": 45250, "epoch": 545} {"train_loss": -19.78084373474121, "global_step": 45251, "epoch": 545} {"train_loss": -19.633434295654297, "global_step": 45252, "epoch": 545} {"train_loss": -19.802152633666992, "global_step": 45253, "epoch": 545} {"train_loss": -19.928930282592773, "global_step": 45254, "epoch": 545} {"train_loss": -19.263992309570312, "global_step": 45255, "epoch": 545} {"train_loss": -19.851119995117188, "global_step": 45256, "epoch": 545} {"train_loss": -19.68348503112793, "global_step": 45257, "epoch": 545} {"train_loss": -19.75225257873535, "global_step": 45258, "epoch": 545} {"train_loss": -19.7544002532959, "global_step": 45259, "epoch": 545} {"train_loss": -19.94378089904785, "global_step": 45260, "epoch": 545} {"train_loss": -19.722929000854492, "global_step": 45261, "epoch": 545} {"train_loss": -19.906963348388672, "global_step": 45262, "epoch": 545} {"train_loss": -19.591800689697266, "global_step": 45263, "epoch": 545} {"train_loss": -19.905927658081055, "global_step": 45264, "epoch": 545} {"train_loss": -19.712316513061523, "global_step": 45265, "epoch": 545} {"train_loss": -19.572162628173828, "global_step": 45266, "epoch": 545} {"train_loss": -19.716535568237305, "global_step": 45267, "epoch": 545} {"train_loss": -19.634098052978516, "global_step": 45268, "epoch": 545} {"train_loss": -20.01877784729004, "global_step": 45269, "epoch": 545} {"train_loss": -19.53881072998047, "global_step": 45270, "epoch": 545} {"train_loss": -19.930648803710938, "global_step": 45271, "epoch": 545} {"train_loss": -19.775161743164062, "global_step": 45272, "epoch": 545} {"train_loss": -19.471927642822266, "global_step": 45273, "epoch": 545} {"train_loss": -19.821752548217773, "global_step": 45274, "epoch": 545} {"train_loss": -19.953983306884766, "global_step": 45275, "epoch": 545} {"train_loss": -19.760318756103516, "global_step": 45276, "epoch": 545} {"train_loss": -19.523130416870117, "global_step": 45277, "epoch": 545} {"train_loss": -20.0637264251709, "global_step": 45278, "epoch": 545} {"train_loss": -19.86939811706543, "global_step": 45279, "epoch": 545} {"train_loss": -19.7325382232666, "global_step": 45280, "epoch": 545} {"train_loss": -19.802818298339844, "global_step": 45281, "epoch": 545} {"train_loss": -19.868696212768555, "global_step": 45282, "epoch": 545} {"train_loss": -19.861927032470703, "global_step": 45283, "epoch": 545} {"train_loss": -19.905073165893555, "global_step": 45284, "epoch": 545} {"train_loss": -19.67890739440918, "global_step": 45285, "epoch": 545} {"train_loss": -19.484968185424805, "global_step": 45286, "epoch": 545} {"train_loss": -19.733060836791992, "global_step": 45287, "epoch": 545} {"train_loss": -20.002756118774414, "global_step": 45288, "epoch": 545} {"train_loss": -19.641321182250977, "global_step": 45289, "epoch": 545} {"train_loss": -19.580678939819336, "global_step": 45290, "epoch": 545} {"train_loss": -19.69333839416504, "global_step": 45291, "epoch": 545} {"train_loss": -19.55487060546875, "global_step": 45292, "epoch": 545} {"train_loss": -19.6533203125, "global_step": 45293, "epoch": 545} {"train_loss": -19.939958572387695, "global_step": 45294, "epoch": 545} {"train_loss": -19.841814041137695, "global_step": 45295, "epoch": 545} {"train_loss": -20.125226974487305, "global_step": 45296, "epoch": 545} {"train_loss": -19.70513916015625, "global_step": 45297, "epoch": 545} {"train_loss": -19.50046157836914, "global_step": 45298, "epoch": 545} {"train_loss": -20.075563430786133, "global_step": 45299, "epoch": 545} {"train_loss": -19.907550811767578, "global_step": 45300, "epoch": 545} {"train_loss": -19.58609390258789, "global_step": 45301, "epoch": 545} {"train_loss": -19.893327713012695, "global_step": 45302, "epoch": 545} {"train_loss": -19.89048194885254, "global_step": 45303, "epoch": 545} {"train_loss": -20.31391716003418, "global_step": 45304, "epoch": 545} {"train_loss": -19.520862579345703, "global_step": 45305, "epoch": 545} {"train_loss": -19.798377990722656, "global_step": 45306, "epoch": 545} {"train_loss": -19.71735954284668, "global_step": 45307, "epoch": 545} {"train_loss": -19.678150177001953, "global_step": 45308, "epoch": 545} {"train_loss": -19.94540023803711, "global_step": 45309, "epoch": 545} {"train_loss": -19.65052604675293, "global_step": 45310, "epoch": 545} {"train_loss": -19.543842315673828, "global_step": 45311, "epoch": 545} {"train_loss": -19.759140014648438, "global_step": 45312, "epoch": 545} {"train_loss": -19.626996994018555, "global_step": 45313, "epoch": 545} {"train_loss": -19.55167007446289, "global_step": 45314, "epoch": 545} {"train_loss": -19.785797119140625, "global_step": 45315, "epoch": 545} {"train_loss": -19.507579803466797, "global_step": 45316, "epoch": 545} {"train_loss": -19.719930441982775, "global_step": 45317, "epoch": 545, "val_loss": 5926318.5} {"train_loss": -19.410093307495117, "global_step": 45318, "epoch": 546} {"train_loss": -19.316749572753906, "global_step": 45319, "epoch": 546} {"train_loss": -19.87105369567871, "global_step": 45320, "epoch": 546} {"train_loss": -19.43436050415039, "global_step": 45321, "epoch": 546} {"train_loss": -19.617734909057617, "global_step": 45322, "epoch": 546} {"train_loss": -19.62078857421875, "global_step": 45323, "epoch": 546} {"train_loss": -19.65424156188965, "global_step": 45324, "epoch": 546} {"train_loss": -20.149282455444336, "global_step": 45325, "epoch": 546} {"train_loss": -19.492746353149414, "global_step": 45326, "epoch": 546} {"train_loss": -19.623294830322266, "global_step": 45327, "epoch": 546} {"train_loss": -19.643333435058594, "global_step": 45328, "epoch": 546} {"train_loss": -19.43738555908203, "global_step": 45329, "epoch": 546} {"train_loss": -19.575857162475586, "global_step": 45330, "epoch": 546} {"train_loss": -19.69032096862793, "global_step": 45331, "epoch": 546} {"train_loss": -19.680328369140625, "global_step": 45332, "epoch": 546} {"train_loss": -19.91168975830078, "global_step": 45333, "epoch": 546} {"train_loss": -19.65358543395996, "global_step": 45334, "epoch": 546} {"train_loss": -19.546987533569336, "global_step": 45335, "epoch": 546} {"train_loss": -19.61860466003418, "global_step": 45336, "epoch": 546} {"train_loss": -19.661893844604492, "global_step": 45337, "epoch": 546} {"train_loss": -19.459917068481445, "global_step": 45338, "epoch": 546} {"train_loss": -19.56410026550293, "global_step": 45339, "epoch": 546} {"train_loss": -19.93489646911621, "global_step": 45340, "epoch": 546} {"train_loss": -19.425186157226562, "global_step": 45341, "epoch": 546} {"train_loss": -19.72330093383789, "global_step": 45342, "epoch": 546} {"train_loss": -19.705045700073242, "global_step": 45343, "epoch": 546} {"train_loss": -19.566205978393555, "global_step": 45344, "epoch": 546} {"train_loss": -19.691486358642578, "global_step": 45345, "epoch": 546} {"train_loss": -19.825849533081055, "global_step": 45346, "epoch": 546} {"train_loss": -19.778196334838867, "global_step": 45347, "epoch": 546} {"train_loss": -19.501178741455078, "global_step": 45348, "epoch": 546} {"train_loss": -19.88727378845215, "global_step": 45349, "epoch": 546} {"train_loss": -20.124004364013672, "global_step": 45350, "epoch": 546} {"train_loss": -19.559267044067383, "global_step": 45351, "epoch": 546} {"train_loss": -19.934419631958008, "global_step": 45352, "epoch": 546} {"train_loss": -19.79400634765625, "global_step": 45353, "epoch": 546} {"train_loss": -19.854476928710938, "global_step": 45354, "epoch": 546} {"train_loss": -19.799468994140625, "global_step": 45355, "epoch": 546} {"train_loss": -19.70369529724121, "global_step": 45356, "epoch": 546} {"train_loss": -19.63531494140625, "global_step": 45357, "epoch": 546} {"train_loss": -20.043188095092773, "global_step": 45358, "epoch": 546} {"train_loss": -19.64639663696289, "global_step": 45359, "epoch": 546} {"train_loss": -19.231290817260742, "global_step": 45360, "epoch": 546} {"train_loss": -19.633926391601562, "global_step": 45361, "epoch": 546} {"train_loss": -19.886911392211914, "global_step": 45362, "epoch": 546} {"train_loss": -19.81905174255371, "global_step": 45363, "epoch": 546} {"train_loss": -19.637229919433594, "global_step": 45364, "epoch": 546} {"train_loss": -19.94581413269043, "global_step": 45365, "epoch": 546} {"train_loss": -19.770307540893555, "global_step": 45366, "epoch": 546} {"train_loss": -19.795141220092773, "global_step": 45367, "epoch": 546} {"train_loss": -19.750280380249023, "global_step": 45368, "epoch": 546} {"train_loss": -19.683605194091797, "global_step": 45369, "epoch": 546} {"train_loss": -19.811199188232422, "global_step": 45370, "epoch": 546} {"train_loss": -19.573095321655273, "global_step": 45371, "epoch": 546} {"train_loss": -19.746904373168945, "global_step": 45372, "epoch": 546} {"train_loss": -19.413619995117188, "global_step": 45373, "epoch": 546} {"train_loss": -19.763683319091797, "global_step": 45374, "epoch": 546} {"train_loss": -19.62105369567871, "global_step": 45375, "epoch": 546} {"train_loss": -19.732624053955078, "global_step": 45376, "epoch": 546} {"train_loss": -19.7950382232666, "global_step": 45377, "epoch": 546} {"train_loss": -19.682050704956055, "global_step": 45378, "epoch": 546} {"train_loss": -20.35542869567871, "global_step": 45379, "epoch": 546} {"train_loss": -20.19705581665039, "global_step": 45380, "epoch": 546} {"train_loss": -19.703807830810547, "global_step": 45381, "epoch": 546} {"train_loss": -19.69740104675293, "global_step": 45382, "epoch": 546} {"train_loss": -19.785276412963867, "global_step": 45383, "epoch": 546} {"train_loss": -19.812440872192383, "global_step": 45384, "epoch": 546} {"train_loss": -19.666913986206055, "global_step": 45385, "epoch": 546} {"train_loss": -19.91426658630371, "global_step": 45386, "epoch": 546} {"train_loss": -19.73592758178711, "global_step": 45387, "epoch": 546} {"train_loss": -19.678903579711914, "global_step": 45388, "epoch": 546} {"train_loss": -19.76997184753418, "global_step": 45389, "epoch": 546} {"train_loss": -19.797544479370117, "global_step": 45390, "epoch": 546} {"train_loss": -19.376253128051758, "global_step": 45391, "epoch": 546} {"train_loss": -19.85955047607422, "global_step": 45392, "epoch": 546} {"train_loss": -19.680967330932617, "global_step": 45393, "epoch": 546} {"train_loss": -19.585824966430664, "global_step": 45394, "epoch": 546} {"train_loss": -19.99115562438965, "global_step": 45395, "epoch": 546} {"train_loss": -19.608701705932617, "global_step": 45396, "epoch": 546} {"train_loss": -19.816295623779297, "global_step": 45397, "epoch": 546} {"train_loss": -19.758129119873047, "global_step": 45398, "epoch": 546} {"train_loss": -19.57948112487793, "global_step": 45399, "epoch": 546} {"train_loss": -19.69021730537874, "global_step": 45400, "epoch": 546, "val_loss": 6031497.0} {"train_loss": -18.887664794921875, "global_step": 45401, "epoch": 547} {"train_loss": -19.68037223815918, "global_step": 45402, "epoch": 547} {"train_loss": -19.074460983276367, "global_step": 45403, "epoch": 547} {"train_loss": -18.958127975463867, "global_step": 45404, "epoch": 547} {"train_loss": -19.391464233398438, "global_step": 45405, "epoch": 547} {"train_loss": -19.297290802001953, "global_step": 45406, "epoch": 547} {"train_loss": -19.652896881103516, "global_step": 45407, "epoch": 547} {"train_loss": -19.446361541748047, "global_step": 45408, "epoch": 547} {"train_loss": -19.400320053100586, "global_step": 45409, "epoch": 547} {"train_loss": -19.372541427612305, "global_step": 45410, "epoch": 547} {"train_loss": -19.33401107788086, "global_step": 45411, "epoch": 547} {"train_loss": -19.386262893676758, "global_step": 45412, "epoch": 547} {"train_loss": -19.31610679626465, "global_step": 45413, "epoch": 547} {"train_loss": -19.912988662719727, "global_step": 45414, "epoch": 547} {"train_loss": -19.2814998626709, "global_step": 45415, "epoch": 547} {"train_loss": -19.712507247924805, "global_step": 45416, "epoch": 547} {"train_loss": -19.65547752380371, "global_step": 45417, "epoch": 547} {"train_loss": -19.34002685546875, "global_step": 45418, "epoch": 547} {"train_loss": -19.393796920776367, "global_step": 45419, "epoch": 547} {"train_loss": -19.255990982055664, "global_step": 45420, "epoch": 547} {"train_loss": -19.438749313354492, "global_step": 45421, "epoch": 547} {"train_loss": -19.49848747253418, "global_step": 45422, "epoch": 547} {"train_loss": -19.545270919799805, "global_step": 45423, "epoch": 547} {"train_loss": -19.608869552612305, "global_step": 45424, "epoch": 547} {"train_loss": -19.595401763916016, "global_step": 45425, "epoch": 547} {"train_loss": -19.765546798706055, "global_step": 45426, "epoch": 547} {"train_loss": -19.939558029174805, "global_step": 45427, "epoch": 547} {"train_loss": -19.673873901367188, "global_step": 45428, "epoch": 547} {"train_loss": -19.688194274902344, "global_step": 45429, "epoch": 547} {"train_loss": -19.421857833862305, "global_step": 45430, "epoch": 547} {"train_loss": -20.1229190826416, "global_step": 45431, "epoch": 547} {"train_loss": -19.560495376586914, "global_step": 45432, "epoch": 547} {"train_loss": -19.1392822265625, "global_step": 45433, "epoch": 547} {"train_loss": -19.85915756225586, "global_step": 45434, "epoch": 547} {"train_loss": -20.04060935974121, "global_step": 45435, "epoch": 547} {"train_loss": -19.570035934448242, "global_step": 45436, "epoch": 547} {"train_loss": -19.87446403503418, "global_step": 45437, "epoch": 547} {"train_loss": -19.93866539001465, "global_step": 45438, "epoch": 547} {"train_loss": -19.472463607788086, "global_step": 45439, "epoch": 547} {"train_loss": -19.96022605895996, "global_step": 45440, "epoch": 547} {"train_loss": -19.412748336791992, "global_step": 45441, "epoch": 547} {"train_loss": -19.783370971679688, "global_step": 45442, "epoch": 547} {"train_loss": -19.389495849609375, "global_step": 45443, "epoch": 547} {"train_loss": -19.7882080078125, "global_step": 45444, "epoch": 547} {"train_loss": -19.633140563964844, "global_step": 45445, "epoch": 547} {"train_loss": -20.13188362121582, "global_step": 45446, "epoch": 547} {"train_loss": -19.55777359008789, "global_step": 45447, "epoch": 547} {"train_loss": -19.846317291259766, "global_step": 45448, "epoch": 547} {"train_loss": -20.021987915039062, "global_step": 45449, "epoch": 547} {"train_loss": -19.47760009765625, "global_step": 45450, "epoch": 547} {"train_loss": -19.40601921081543, "global_step": 45451, "epoch": 547} {"train_loss": -19.917165756225586, "global_step": 45452, "epoch": 547} {"train_loss": -19.67686653137207, "global_step": 45453, "epoch": 547} {"train_loss": -19.64797592163086, "global_step": 45454, "epoch": 547} {"train_loss": -19.654499053955078, "global_step": 45455, "epoch": 547} {"train_loss": -19.54231834411621, "global_step": 45456, "epoch": 547} {"train_loss": -19.72041130065918, "global_step": 45457, "epoch": 547} {"train_loss": -19.734739303588867, "global_step": 45458, "epoch": 547} {"train_loss": -19.313373565673828, "global_step": 45459, "epoch": 547} {"train_loss": -19.812225341796875, "global_step": 45460, "epoch": 547} {"train_loss": -19.93050193786621, "global_step": 45461, "epoch": 547} {"train_loss": -19.687162399291992, "global_step": 45462, "epoch": 547} {"train_loss": -19.838834762573242, "global_step": 45463, "epoch": 547} {"train_loss": -19.769643783569336, "global_step": 45464, "epoch": 547} {"train_loss": -19.562559127807617, "global_step": 45465, "epoch": 547} {"train_loss": -19.710128784179688, "global_step": 45466, "epoch": 547} {"train_loss": -19.427947998046875, "global_step": 45467, "epoch": 547} {"train_loss": -19.626256942749023, "global_step": 45468, "epoch": 547} {"train_loss": -20.26369285583496, "global_step": 45469, "epoch": 547} {"train_loss": -20.0271053314209, "global_step": 45470, "epoch": 547} {"train_loss": -19.674774169921875, "global_step": 45471, "epoch": 547} {"train_loss": -19.62129783630371, "global_step": 45472, "epoch": 547} {"train_loss": -19.879104614257812, "global_step": 45473, "epoch": 547} {"train_loss": -19.294363021850586, "global_step": 45474, "epoch": 547} {"train_loss": -19.317663192749023, "global_step": 45475, "epoch": 547} {"train_loss": -19.641714096069336, "global_step": 45476, "epoch": 547} {"train_loss": -19.850616455078125, "global_step": 45477, "epoch": 547} {"train_loss": -19.904932022094727, "global_step": 45478, "epoch": 547} {"train_loss": -19.533329010009766, "global_step": 45479, "epoch": 547} {"train_loss": -19.842025756835938, "global_step": 45480, "epoch": 547} {"train_loss": -19.885461807250977, "global_step": 45481, "epoch": 547} {"train_loss": -19.49526023864746, "global_step": 45482, "epoch": 547} {"train_loss": -19.617236424641437, "global_step": 45483, "epoch": 547, "val_loss": 6030363.0} {"train_loss": -20.039627075195312, "global_step": 45484, "epoch": 548} {"train_loss": -19.35008430480957, "global_step": 45485, "epoch": 548} {"train_loss": -19.26950454711914, "global_step": 45486, "epoch": 548} {"train_loss": -19.457942962646484, "global_step": 45487, "epoch": 548} {"train_loss": -19.333845138549805, "global_step": 45488, "epoch": 548} {"train_loss": -20.01120376586914, "global_step": 45489, "epoch": 548} {"train_loss": -19.557329177856445, "global_step": 45490, "epoch": 548} {"train_loss": -19.605756759643555, "global_step": 45491, "epoch": 548} {"train_loss": -19.452329635620117, "global_step": 45492, "epoch": 548} {"train_loss": -19.45075225830078, "global_step": 45493, "epoch": 548} {"train_loss": -19.830041885375977, "global_step": 45494, "epoch": 548} {"train_loss": -19.581663131713867, "global_step": 45495, "epoch": 548} {"train_loss": -19.842880249023438, "global_step": 45496, "epoch": 548} {"train_loss": -19.754348754882812, "global_step": 45497, "epoch": 548} {"train_loss": -20.055208206176758, "global_step": 45498, "epoch": 548} {"train_loss": -19.87070083618164, "global_step": 45499, "epoch": 548} {"train_loss": -19.767641067504883, "global_step": 45500, "epoch": 548} {"train_loss": -19.340564727783203, "global_step": 45501, "epoch": 548} {"train_loss": -19.718517303466797, "global_step": 45502, "epoch": 548} {"train_loss": -19.656885147094727, "global_step": 45503, "epoch": 548} {"train_loss": -19.29108238220215, "global_step": 45504, "epoch": 548} {"train_loss": -19.6940975189209, "global_step": 45505, "epoch": 548} {"train_loss": -19.62965965270996, "global_step": 45506, "epoch": 548} {"train_loss": -19.708303451538086, "global_step": 45507, "epoch": 548} {"train_loss": -19.368793487548828, "global_step": 45508, "epoch": 548} {"train_loss": -19.7862491607666, "global_step": 45509, "epoch": 548} {"train_loss": -19.753904342651367, "global_step": 45510, "epoch": 548} {"train_loss": -19.68385124206543, "global_step": 45511, "epoch": 548} {"train_loss": -19.751916885375977, "global_step": 45512, "epoch": 548} {"train_loss": -19.55109214782715, "global_step": 45513, "epoch": 548} {"train_loss": -19.76542091369629, "global_step": 45514, "epoch": 548} {"train_loss": -19.638181686401367, "global_step": 45515, "epoch": 548} {"train_loss": -19.915189743041992, "global_step": 45516, "epoch": 548} {"train_loss": -19.855173110961914, "global_step": 45517, "epoch": 548} {"train_loss": -19.675161361694336, "global_step": 45518, "epoch": 548} {"train_loss": -19.720598220825195, "global_step": 45519, "epoch": 548} {"train_loss": -19.816282272338867, "global_step": 45520, "epoch": 548} {"train_loss": -19.825870513916016, "global_step": 45521, "epoch": 548} {"train_loss": -19.798809051513672, "global_step": 45522, "epoch": 548} {"train_loss": -19.645761489868164, "global_step": 45523, "epoch": 548} {"train_loss": -19.800596237182617, "global_step": 45524, "epoch": 548} {"train_loss": -19.900760650634766, "global_step": 45525, "epoch": 548} {"train_loss": -19.62872886657715, "global_step": 45526, "epoch": 548} {"train_loss": -19.79087257385254, "global_step": 45527, "epoch": 548} {"train_loss": -19.959178924560547, "global_step": 45528, "epoch": 548} {"train_loss": -19.698694229125977, "global_step": 45529, "epoch": 548} {"train_loss": -19.566476821899414, "global_step": 45530, "epoch": 548} {"train_loss": -19.975120544433594, "global_step": 45531, "epoch": 548} {"train_loss": -19.473773956298828, "global_step": 45532, "epoch": 548} {"train_loss": -19.579011917114258, "global_step": 45533, "epoch": 548} {"train_loss": -19.78481101989746, "global_step": 45534, "epoch": 548} {"train_loss": -19.902843475341797, "global_step": 45535, "epoch": 548} {"train_loss": -19.558317184448242, "global_step": 45536, "epoch": 548} {"train_loss": -19.6866512298584, "global_step": 45537, "epoch": 548} {"train_loss": -19.613393783569336, "global_step": 45538, "epoch": 548} {"train_loss": -19.916797637939453, "global_step": 45539, "epoch": 548} {"train_loss": -19.229848861694336, "global_step": 45540, "epoch": 548} {"train_loss": -19.790969848632812, "global_step": 45541, "epoch": 548} {"train_loss": -19.625715255737305, "global_step": 45542, "epoch": 548} {"train_loss": -19.95728874206543, "global_step": 45543, "epoch": 548} {"train_loss": -19.884572982788086, "global_step": 45544, "epoch": 548} {"train_loss": -19.701021194458008, "global_step": 45545, "epoch": 548} {"train_loss": -19.45473289489746, "global_step": 45546, "epoch": 548} {"train_loss": -19.697935104370117, "global_step": 45547, "epoch": 548} {"train_loss": -19.825002670288086, "global_step": 45548, "epoch": 548} {"train_loss": -19.21525764465332, "global_step": 45549, "epoch": 548} {"train_loss": -19.973812103271484, "global_step": 45550, "epoch": 548} {"train_loss": -19.810569763183594, "global_step": 45551, "epoch": 548} {"train_loss": -19.45383071899414, "global_step": 45552, "epoch": 548} {"train_loss": -19.464279174804688, "global_step": 45553, "epoch": 548} {"train_loss": -19.510683059692383, "global_step": 45554, "epoch": 548} {"train_loss": -19.737918853759766, "global_step": 45555, "epoch": 548} {"train_loss": -19.629676818847656, "global_step": 45556, "epoch": 548} {"train_loss": -19.86249351501465, "global_step": 45557, "epoch": 548} {"train_loss": -19.8648738861084, "global_step": 45558, "epoch": 548} {"train_loss": -19.679458618164062, "global_step": 45559, "epoch": 548} {"train_loss": -19.503196716308594, "global_step": 45560, "epoch": 548} {"train_loss": -19.661069869995117, "global_step": 45561, "epoch": 548} {"train_loss": -19.790212631225586, "global_step": 45562, "epoch": 548} {"train_loss": -19.684911727905273, "global_step": 45563, "epoch": 548} {"train_loss": -19.40809440612793, "global_step": 45564, "epoch": 548} {"train_loss": -19.817005157470703, "global_step": 45565, "epoch": 548} {"train_loss": -19.683668205536993, "global_step": 45566, "epoch": 548, "val_loss": 5895821.5} {"train_loss": -19.466672897338867, "global_step": 45567, "epoch": 549} {"train_loss": -19.878402709960938, "global_step": 45568, "epoch": 549} {"train_loss": -19.631855010986328, "global_step": 45569, "epoch": 549} {"train_loss": -19.57666015625, "global_step": 45570, "epoch": 549} {"train_loss": -19.377960205078125, "global_step": 45571, "epoch": 549} {"train_loss": -19.872802734375, "global_step": 45572, "epoch": 549} {"train_loss": -20.044301986694336, "global_step": 45573, "epoch": 549} {"train_loss": -19.654869079589844, "global_step": 45574, "epoch": 549} {"train_loss": -19.560041427612305, "global_step": 45575, "epoch": 549} {"train_loss": -19.46241569519043, "global_step": 45576, "epoch": 549} {"train_loss": -19.64497184753418, "global_step": 45577, "epoch": 549} {"train_loss": -19.66743278503418, "global_step": 45578, "epoch": 549} {"train_loss": -19.64179229736328, "global_step": 45579, "epoch": 549} {"train_loss": -19.72418785095215, "global_step": 45580, "epoch": 549} {"train_loss": -19.615650177001953, "global_step": 45581, "epoch": 549} {"train_loss": -19.475711822509766, "global_step": 45582, "epoch": 549} {"train_loss": -19.798070907592773, "global_step": 45583, "epoch": 549} {"train_loss": -19.50185775756836, "global_step": 45584, "epoch": 549} {"train_loss": -19.76715660095215, "global_step": 45585, "epoch": 549} {"train_loss": -20.05452537536621, "global_step": 45586, "epoch": 549} {"train_loss": -19.378597259521484, "global_step": 45587, "epoch": 549} {"train_loss": -19.441314697265625, "global_step": 45588, "epoch": 549} {"train_loss": -19.928359985351562, "global_step": 45589, "epoch": 549} {"train_loss": -19.55950355529785, "global_step": 45590, "epoch": 549} {"train_loss": -19.70714569091797, "global_step": 45591, "epoch": 549} {"train_loss": -19.39410400390625, "global_step": 45592, "epoch": 549} {"train_loss": -19.464492797851562, "global_step": 45593, "epoch": 549} {"train_loss": -19.96091079711914, "global_step": 45594, "epoch": 549} {"train_loss": -19.85945701599121, "global_step": 45595, "epoch": 549} {"train_loss": -19.808958053588867, "global_step": 45596, "epoch": 549} {"train_loss": -19.575963973999023, "global_step": 45597, "epoch": 549} {"train_loss": -19.8913631439209, "global_step": 45598, "epoch": 549} {"train_loss": -19.60692024230957, "global_step": 45599, "epoch": 549} {"train_loss": -19.896451950073242, "global_step": 45600, "epoch": 549} {"train_loss": -19.5557918548584, "global_step": 45601, "epoch": 549} {"train_loss": -19.27429962158203, "global_step": 45602, "epoch": 549} {"train_loss": -19.774612426757812, "global_step": 45603, "epoch": 549} {"train_loss": -19.686559677124023, "global_step": 45604, "epoch": 549} {"train_loss": -20.07600975036621, "global_step": 45605, "epoch": 549} {"train_loss": -19.735671997070312, "global_step": 45606, "epoch": 549} {"train_loss": -19.767105102539062, "global_step": 45607, "epoch": 549} {"train_loss": -19.945653915405273, "global_step": 45608, "epoch": 549} {"train_loss": -19.695301055908203, "global_step": 45609, "epoch": 549} {"train_loss": -19.56440544128418, "global_step": 45610, "epoch": 549} {"train_loss": -19.737071990966797, "global_step": 45611, "epoch": 549} {"train_loss": -19.863372802734375, "global_step": 45612, "epoch": 549} {"train_loss": -19.595855712890625, "global_step": 45613, "epoch": 549} {"train_loss": -19.795166015625, "global_step": 45614, "epoch": 549} {"train_loss": -19.892274856567383, "global_step": 45615, "epoch": 549} {"train_loss": -19.153837203979492, "global_step": 45616, "epoch": 549} {"train_loss": -19.783742904663086, "global_step": 45617, "epoch": 549} {"train_loss": -19.750835418701172, "global_step": 45618, "epoch": 549} {"train_loss": -19.825986862182617, "global_step": 45619, "epoch": 549} {"train_loss": -19.889902114868164, "global_step": 45620, "epoch": 549} {"train_loss": -19.64902114868164, "global_step": 45621, "epoch": 549} {"train_loss": -19.613399505615234, "global_step": 45622, "epoch": 549} {"train_loss": -19.279022216796875, "global_step": 45623, "epoch": 549} {"train_loss": -19.717634201049805, "global_step": 45624, "epoch": 549} {"train_loss": -19.397008895874023, "global_step": 45625, "epoch": 549} {"train_loss": -19.937849044799805, "global_step": 45626, "epoch": 549} {"train_loss": -19.394412994384766, "global_step": 45627, "epoch": 549} {"train_loss": -19.789770126342773, "global_step": 45628, "epoch": 549} {"train_loss": -19.680021286010742, "global_step": 45629, "epoch": 549} {"train_loss": -19.542980194091797, "global_step": 45630, "epoch": 549} {"train_loss": -19.732437133789062, "global_step": 45631, "epoch": 549} {"train_loss": -19.45228385925293, "global_step": 45632, "epoch": 549} {"train_loss": -19.917036056518555, "global_step": 45633, "epoch": 549} {"train_loss": -19.670989990234375, "global_step": 45634, "epoch": 549} {"train_loss": -19.60406494140625, "global_step": 45635, "epoch": 549} {"train_loss": -19.725862503051758, "global_step": 45636, "epoch": 549} {"train_loss": -19.93321418762207, "global_step": 45637, "epoch": 549} {"train_loss": -19.520565032958984, "global_step": 45638, "epoch": 549} {"train_loss": -20.06735610961914, "global_step": 45639, "epoch": 549} {"train_loss": -19.8796329498291, "global_step": 45640, "epoch": 549} {"train_loss": -19.956113815307617, "global_step": 45641, "epoch": 549} {"train_loss": -19.71309471130371, "global_step": 45642, "epoch": 549} {"train_loss": -19.58675193786621, "global_step": 45643, "epoch": 549} {"train_loss": -19.982954025268555, "global_step": 45644, "epoch": 549} {"train_loss": -19.780532836914062, "global_step": 45645, "epoch": 549} {"train_loss": -19.871999740600586, "global_step": 45646, "epoch": 549} {"train_loss": -19.708974838256836, "global_step": 45647, "epoch": 549} {"train_loss": -20.1629695892334, "global_step": 45648, "epoch": 549} {"train_loss": -19.708831074726152, "global_step": 45649, "epoch": 549, "val_loss": 6116909.0} {"train_loss": -19.259878158569336, "global_step": 45650, "epoch": 550} {"train_loss": -19.601285934448242, "global_step": 45651, "epoch": 550} {"train_loss": -19.312314987182617, "global_step": 45652, "epoch": 550} {"train_loss": -19.53315544128418, "global_step": 45653, "epoch": 550} {"train_loss": -19.811874389648438, "global_step": 45654, "epoch": 550} {"train_loss": -19.461109161376953, "global_step": 45655, "epoch": 550} {"train_loss": -19.576135635375977, "global_step": 45656, "epoch": 550} {"train_loss": -19.51116371154785, "global_step": 45657, "epoch": 550} {"train_loss": -19.9190616607666, "global_step": 45658, "epoch": 550} {"train_loss": -19.771512985229492, "global_step": 45659, "epoch": 550} {"train_loss": -19.58734130859375, "global_step": 45660, "epoch": 550} {"train_loss": -19.936298370361328, "global_step": 45661, "epoch": 550} {"train_loss": -19.47602081298828, "global_step": 45662, "epoch": 550} {"train_loss": -19.665834426879883, "global_step": 45663, "epoch": 550} {"train_loss": -19.664838790893555, "global_step": 45664, "epoch": 550} {"train_loss": -19.799978256225586, "global_step": 45665, "epoch": 550} {"train_loss": -19.57154083251953, "global_step": 45666, "epoch": 550} {"train_loss": -19.774690628051758, "global_step": 45667, "epoch": 550} {"train_loss": -19.652507781982422, "global_step": 45668, "epoch": 550} {"train_loss": -20.107011795043945, "global_step": 45669, "epoch": 550} {"train_loss": -19.791353225708008, "global_step": 45670, "epoch": 550} {"train_loss": -19.77187156677246, "global_step": 45671, "epoch": 550} {"train_loss": -19.708974838256836, "global_step": 45672, "epoch": 550} {"train_loss": -19.854053497314453, "global_step": 45673, "epoch": 550} {"train_loss": -19.98280906677246, "global_step": 45674, "epoch": 550} {"train_loss": -19.347211837768555, "global_step": 45675, "epoch": 550} {"train_loss": -19.532377243041992, "global_step": 45676, "epoch": 550} {"train_loss": -19.500396728515625, "global_step": 45677, "epoch": 550} {"train_loss": -19.30549430847168, "global_step": 45678, "epoch": 550} {"train_loss": -19.86006736755371, "global_step": 45679, "epoch": 550} {"train_loss": -19.9737491607666, "global_step": 45680, "epoch": 550} {"train_loss": -19.44899559020996, "global_step": 45681, "epoch": 550} {"train_loss": -19.373952865600586, "global_step": 45682, "epoch": 550} {"train_loss": -19.972225189208984, "global_step": 45683, "epoch": 550} {"train_loss": -19.51139259338379, "global_step": 45684, "epoch": 550} {"train_loss": -19.76886749267578, "global_step": 45685, "epoch": 550} {"train_loss": -19.527013778686523, "global_step": 45686, "epoch": 550} {"train_loss": -19.425527572631836, "global_step": 45687, "epoch": 550} {"train_loss": -19.74847412109375, "global_step": 45688, "epoch": 550} {"train_loss": -19.425416946411133, "global_step": 45689, "epoch": 550} {"train_loss": -19.64611053466797, "global_step": 45690, "epoch": 550} {"train_loss": -19.45170783996582, "global_step": 45691, "epoch": 550} {"train_loss": -19.80190086364746, "global_step": 45692, "epoch": 550} {"train_loss": -19.71717643737793, "global_step": 45693, "epoch": 550} {"train_loss": -19.713077545166016, "global_step": 45694, "epoch": 550} {"train_loss": -19.7745361328125, "global_step": 45695, "epoch": 550} {"train_loss": -19.65508460998535, "global_step": 45696, "epoch": 550} {"train_loss": -19.749387741088867, "global_step": 45697, "epoch": 550} {"train_loss": -19.78860855102539, "global_step": 45698, "epoch": 550} {"train_loss": -19.680490493774414, "global_step": 45699, "epoch": 550} {"train_loss": -19.643234252929688, "global_step": 45700, "epoch": 550} {"train_loss": -20.031705856323242, "global_step": 45701, "epoch": 550} {"train_loss": -20.083803176879883, "global_step": 45702, "epoch": 550} {"train_loss": -19.93608856201172, "global_step": 45703, "epoch": 550} {"train_loss": -19.991323471069336, "global_step": 45704, "epoch": 550} {"train_loss": -19.818634033203125, "global_step": 45705, "epoch": 550} {"train_loss": -20.098865509033203, "global_step": 45706, "epoch": 550} {"train_loss": -19.404165267944336, "global_step": 45707, "epoch": 550} {"train_loss": -19.6788272857666, "global_step": 45708, "epoch": 550} {"train_loss": -19.697816848754883, "global_step": 45709, "epoch": 550} {"train_loss": -19.981523513793945, "global_step": 45710, "epoch": 550} {"train_loss": -19.90824317932129, "global_step": 45711, "epoch": 550} {"train_loss": -19.81569480895996, "global_step": 45712, "epoch": 550} {"train_loss": -20.071407318115234, "global_step": 45713, "epoch": 550} {"train_loss": -19.665958404541016, "global_step": 45714, "epoch": 550} {"train_loss": -19.603361129760742, "global_step": 45715, "epoch": 550} {"train_loss": -19.87628173828125, "global_step": 45716, "epoch": 550} {"train_loss": -19.795166015625, "global_step": 45717, "epoch": 550} {"train_loss": -19.23594856262207, "global_step": 45718, "epoch": 550} {"train_loss": -19.565580368041992, "global_step": 45719, "epoch": 550} {"train_loss": -19.586816787719727, "global_step": 45720, "epoch": 550} {"train_loss": -19.839908599853516, "global_step": 45721, "epoch": 550} {"train_loss": -19.67070960998535, "global_step": 45722, "epoch": 550} {"train_loss": -19.556238174438477, "global_step": 45723, "epoch": 550} {"train_loss": -19.830245971679688, "global_step": 45724, "epoch": 550} {"train_loss": -19.89632225036621, "global_step": 45725, "epoch": 550} {"train_loss": -19.74773597717285, "global_step": 45726, "epoch": 550} {"train_loss": -19.476911544799805, "global_step": 45727, "epoch": 550} {"train_loss": -20.025344848632812, "global_step": 45728, "epoch": 550} {"train_loss": -19.301904678344727, "global_step": 45729, "epoch": 550} {"train_loss": -19.85256004333496, "global_step": 45730, "epoch": 550} {"train_loss": -20.064594268798828, "global_step": 45731, "epoch": 550} {"train_loss": -19.707389578761823, "global_step": 45732, "epoch": 550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 5897535.5} {"train_loss": -19.59282875061035, "global_step": 45733, "epoch": 551} {"train_loss": -19.576353073120117, "global_step": 45734, "epoch": 551} {"train_loss": -19.637765884399414, "global_step": 45735, "epoch": 551} {"train_loss": -19.63916015625, "global_step": 45736, "epoch": 551} {"train_loss": -19.461944580078125, "global_step": 45737, "epoch": 551} {"train_loss": -19.51788902282715, "global_step": 45738, "epoch": 551} {"train_loss": -19.54657554626465, "global_step": 45739, "epoch": 551} {"train_loss": -19.75087547302246, "global_step": 45740, "epoch": 551} {"train_loss": -19.764820098876953, "global_step": 45741, "epoch": 551} {"train_loss": -19.294363021850586, "global_step": 45742, "epoch": 551} {"train_loss": -19.582637786865234, "global_step": 45743, "epoch": 551} {"train_loss": -19.618467330932617, "global_step": 45744, "epoch": 551} {"train_loss": -19.702383041381836, "global_step": 45745, "epoch": 551} {"train_loss": -19.653722763061523, "global_step": 45746, "epoch": 551} {"train_loss": -19.71501922607422, "global_step": 45747, "epoch": 551} {"train_loss": -19.680097579956055, "global_step": 45748, "epoch": 551} {"train_loss": -19.712432861328125, "global_step": 45749, "epoch": 551} {"train_loss": -19.317792892456055, "global_step": 45750, "epoch": 551} {"train_loss": -19.903871536254883, "global_step": 45751, "epoch": 551} {"train_loss": -19.995115280151367, "global_step": 45752, "epoch": 551} {"train_loss": -19.29429054260254, "global_step": 45753, "epoch": 551} {"train_loss": -19.589649200439453, "global_step": 45754, "epoch": 551} {"train_loss": -19.64754867553711, "global_step": 45755, "epoch": 551} {"train_loss": -19.755422592163086, "global_step": 45756, "epoch": 551} {"train_loss": -19.52332878112793, "global_step": 45757, "epoch": 551} {"train_loss": -19.76026725769043, "global_step": 45758, "epoch": 551} {"train_loss": -19.792205810546875, "global_step": 45759, "epoch": 551} {"train_loss": -19.90229606628418, "global_step": 45760, "epoch": 551} {"train_loss": -19.817092895507812, "global_step": 45761, "epoch": 551} {"train_loss": -19.9500789642334, "global_step": 45762, "epoch": 551} {"train_loss": -19.577558517456055, "global_step": 45763, "epoch": 551} {"train_loss": -19.831186294555664, "global_step": 45764, "epoch": 551} {"train_loss": -19.439434051513672, "global_step": 45765, "epoch": 551} {"train_loss": -19.964481353759766, "global_step": 45766, "epoch": 551} {"train_loss": -19.84633445739746, "global_step": 45767, "epoch": 551} {"train_loss": -19.556833267211914, "global_step": 45768, "epoch": 551} {"train_loss": -19.827600479125977, "global_step": 45769, "epoch": 551} {"train_loss": -19.65842056274414, "global_step": 45770, "epoch": 551} {"train_loss": -20.27042007446289, "global_step": 45771, "epoch": 551} {"train_loss": -20.0565185546875, "global_step": 45772, "epoch": 551} {"train_loss": -20.07993507385254, "global_step": 45773, "epoch": 551} {"train_loss": -19.318668365478516, "global_step": 45774, "epoch": 551} {"train_loss": -19.943361282348633, "global_step": 45775, "epoch": 551} {"train_loss": -19.562971115112305, "global_step": 45776, "epoch": 551} {"train_loss": -19.613746643066406, "global_step": 45777, "epoch": 551} {"train_loss": -19.745487213134766, "global_step": 45778, "epoch": 551} {"train_loss": -19.659435272216797, "global_step": 45779, "epoch": 551} {"train_loss": -19.647680282592773, "global_step": 45780, "epoch": 551} {"train_loss": -19.757736206054688, "global_step": 45781, "epoch": 551} {"train_loss": -19.70863151550293, "global_step": 45782, "epoch": 551} {"train_loss": -19.83977699279785, "global_step": 45783, "epoch": 551} {"train_loss": -19.7835636138916, "global_step": 45784, "epoch": 551} {"train_loss": -19.602018356323242, "global_step": 45785, "epoch": 551} {"train_loss": -19.964035034179688, "global_step": 45786, "epoch": 551} {"train_loss": -19.653396606445312, "global_step": 45787, "epoch": 551} {"train_loss": -19.143280029296875, "global_step": 45788, "epoch": 551} {"train_loss": -19.746707916259766, "global_step": 45789, "epoch": 551} {"train_loss": -19.466535568237305, "global_step": 45790, "epoch": 551} {"train_loss": -19.7893123626709, "global_step": 45791, "epoch": 551} {"train_loss": -19.521045684814453, "global_step": 45792, "epoch": 551} {"train_loss": -19.567373275756836, "global_step": 45793, "epoch": 551} {"train_loss": -19.63688850402832, "global_step": 45794, "epoch": 551} {"train_loss": -19.34682273864746, "global_step": 45795, "epoch": 551} {"train_loss": -19.21007537841797, "global_step": 45796, "epoch": 551} {"train_loss": -19.965665817260742, "global_step": 45797, "epoch": 551} {"train_loss": -19.626771926879883, "global_step": 45798, "epoch": 551} {"train_loss": -19.51650047302246, "global_step": 45799, "epoch": 551} {"train_loss": -20.04347801208496, "global_step": 45800, "epoch": 551} {"train_loss": -19.464576721191406, "global_step": 45801, "epoch": 551} {"train_loss": -19.56599998474121, "global_step": 45802, "epoch": 551} {"train_loss": -19.838438034057617, "global_step": 45803, "epoch": 551} {"train_loss": -19.637929916381836, "global_step": 45804, "epoch": 551} {"train_loss": -20.218839645385742, "global_step": 45805, "epoch": 551} {"train_loss": -20.067886352539062, "global_step": 45806, "epoch": 551} {"train_loss": -20.09731101989746, "global_step": 45807, "epoch": 551} {"train_loss": -19.943601608276367, "global_step": 45808, "epoch": 551} {"train_loss": -19.835330963134766, "global_step": 45809, "epoch": 551} {"train_loss": -19.5165958404541, "global_step": 45810, "epoch": 551} {"train_loss": -20.035085678100586, "global_step": 45811, "epoch": 551} {"train_loss": -19.83241081237793, "global_step": 45812, "epoch": 551} {"train_loss": -19.839265823364258, "global_step": 45813, "epoch": 551} {"train_loss": -19.667421340942383, "global_step": 45814, "epoch": 551} {"train_loss": -19.720999430461102, "global_step": 45815, "epoch": 551, "val_loss": 5933025.0} {"train_loss": -19.73097801208496, "global_step": 45816, "epoch": 552} {"train_loss": -19.688831329345703, "global_step": 45817, "epoch": 552} {"train_loss": -19.18096351623535, "global_step": 45818, "epoch": 552} {"train_loss": -19.1003475189209, "global_step": 45819, "epoch": 552} {"train_loss": -19.8436222076416, "global_step": 45820, "epoch": 552} {"train_loss": -19.893177032470703, "global_step": 45821, "epoch": 552} {"train_loss": -19.661725997924805, "global_step": 45822, "epoch": 552} {"train_loss": -19.432584762573242, "global_step": 45823, "epoch": 552} {"train_loss": -19.574132919311523, "global_step": 45824, "epoch": 552} {"train_loss": -19.568937301635742, "global_step": 45825, "epoch": 552} {"train_loss": -19.932479858398438, "global_step": 45826, "epoch": 552} {"train_loss": -19.802654266357422, "global_step": 45827, "epoch": 552} {"train_loss": -19.71034812927246, "global_step": 45828, "epoch": 552} {"train_loss": -19.715044021606445, "global_step": 45829, "epoch": 552} {"train_loss": -19.643674850463867, "global_step": 45830, "epoch": 552} {"train_loss": -19.752721786499023, "global_step": 45831, "epoch": 552} {"train_loss": -19.648193359375, "global_step": 45832, "epoch": 552} {"train_loss": -19.48980140686035, "global_step": 45833, "epoch": 552} {"train_loss": -20.072961807250977, "global_step": 45834, "epoch": 552} {"train_loss": -19.583017349243164, "global_step": 45835, "epoch": 552} {"train_loss": -19.794958114624023, "global_step": 45836, "epoch": 552} {"train_loss": -19.879545211791992, "global_step": 45837, "epoch": 552} {"train_loss": -20.190134048461914, "global_step": 45838, "epoch": 552} {"train_loss": -19.52203941345215, "global_step": 45839, "epoch": 552} {"train_loss": -19.453794479370117, "global_step": 45840, "epoch": 552} {"train_loss": -19.561359405517578, "global_step": 45841, "epoch": 552} {"train_loss": -19.957311630249023, "global_step": 45842, "epoch": 552} {"train_loss": -19.86385154724121, "global_step": 45843, "epoch": 552} {"train_loss": -20.008289337158203, "global_step": 45844, "epoch": 552} {"train_loss": -20.234647750854492, "global_step": 45845, "epoch": 552} {"train_loss": -20.030370712280273, "global_step": 45846, "epoch": 552} {"train_loss": -19.98236083984375, "global_step": 45847, "epoch": 552} {"train_loss": -19.773244857788086, "global_step": 45848, "epoch": 552} {"train_loss": -19.774593353271484, "global_step": 45849, "epoch": 552} {"train_loss": -20.0240478515625, "global_step": 45850, "epoch": 552} {"train_loss": -19.554418563842773, "global_step": 45851, "epoch": 552} {"train_loss": -19.35465431213379, "global_step": 45852, "epoch": 552} {"train_loss": -19.427684783935547, "global_step": 45853, "epoch": 552} {"train_loss": -20.108755111694336, "global_step": 45854, "epoch": 552} {"train_loss": -19.72321128845215, "global_step": 45855, "epoch": 552} {"train_loss": -19.638477325439453, "global_step": 45856, "epoch": 552} {"train_loss": -19.533676147460938, "global_step": 45857, "epoch": 552} {"train_loss": -19.828962326049805, "global_step": 45858, "epoch": 552} {"train_loss": -19.402631759643555, "global_step": 45859, "epoch": 552} {"train_loss": -19.890850067138672, "global_step": 45860, "epoch": 552} {"train_loss": -19.845853805541992, "global_step": 45861, "epoch": 552} {"train_loss": -19.639501571655273, "global_step": 45862, "epoch": 552} {"train_loss": -19.731948852539062, "global_step": 45863, "epoch": 552} {"train_loss": -19.568037033081055, "global_step": 45864, "epoch": 552} {"train_loss": -19.61701774597168, "global_step": 45865, "epoch": 552} {"train_loss": -19.809894561767578, "global_step": 45866, "epoch": 552} {"train_loss": -19.731718063354492, "global_step": 45867, "epoch": 552} {"train_loss": -19.79080581665039, "global_step": 45868, "epoch": 552} {"train_loss": -19.907421112060547, "global_step": 45869, "epoch": 552} {"train_loss": -19.416128158569336, "global_step": 45870, "epoch": 552} {"train_loss": -19.688108444213867, "global_step": 45871, "epoch": 552} {"train_loss": -19.861236572265625, "global_step": 45872, "epoch": 552} {"train_loss": -19.76429557800293, "global_step": 45873, "epoch": 552} {"train_loss": -20.01396942138672, "global_step": 45874, "epoch": 552} {"train_loss": -19.40858268737793, "global_step": 45875, "epoch": 552} {"train_loss": -19.613189697265625, "global_step": 45876, "epoch": 552} {"train_loss": -19.556598663330078, "global_step": 45877, "epoch": 552} {"train_loss": -19.61988639831543, "global_step": 45878, "epoch": 552} {"train_loss": -19.82618522644043, "global_step": 45879, "epoch": 552} {"train_loss": -19.58900260925293, "global_step": 45880, "epoch": 552} {"train_loss": -19.90861701965332, "global_step": 45881, "epoch": 552} {"train_loss": -19.320119857788086, "global_step": 45882, "epoch": 552} {"train_loss": -19.381864547729492, "global_step": 45883, "epoch": 552} {"train_loss": -19.843494415283203, "global_step": 45884, "epoch": 552} {"train_loss": -19.733861923217773, "global_step": 45885, "epoch": 552} {"train_loss": -19.939180374145508, "global_step": 45886, "epoch": 552} {"train_loss": -19.86355972290039, "global_step": 45887, "epoch": 552} {"train_loss": -19.94036293029785, "global_step": 45888, "epoch": 552} {"train_loss": -19.455411911010742, "global_step": 45889, "epoch": 552} {"train_loss": -19.77521514892578, "global_step": 45890, "epoch": 552} {"train_loss": -19.57222557067871, "global_step": 45891, "epoch": 552} {"train_loss": -19.936725616455078, "global_step": 45892, "epoch": 552} {"train_loss": -20.01618766784668, "global_step": 45893, "epoch": 552} {"train_loss": -19.888051986694336, "global_step": 45894, "epoch": 552} {"train_loss": -19.930908203125, "global_step": 45895, "epoch": 552} {"train_loss": -19.932626724243164, "global_step": 45896, "epoch": 552} {"train_loss": -19.792964935302734, "global_step": 45897, "epoch": 552} {"train_loss": -19.7330883899367, "global_step": 45898, "epoch": 552, "val_loss": 5948656.5} {"train_loss": -19.57370376586914, "global_step": 45899, "epoch": 553} {"train_loss": -19.406780242919922, "global_step": 45900, "epoch": 553} {"train_loss": -19.443832397460938, "global_step": 45901, "epoch": 553} {"train_loss": -19.404632568359375, "global_step": 45902, "epoch": 553} {"train_loss": -19.35548973083496, "global_step": 45903, "epoch": 553} {"train_loss": -19.7375431060791, "global_step": 45904, "epoch": 553} {"train_loss": -19.499282836914062, "global_step": 45905, "epoch": 553} {"train_loss": -19.467756271362305, "global_step": 45906, "epoch": 553} {"train_loss": -19.83860206604004, "global_step": 45907, "epoch": 553} {"train_loss": -19.764739990234375, "global_step": 45908, "epoch": 553} {"train_loss": -20.0865478515625, "global_step": 45909, "epoch": 553} {"train_loss": -19.602222442626953, "global_step": 45910, "epoch": 553} {"train_loss": -19.769742965698242, "global_step": 45911, "epoch": 553} {"train_loss": -19.60969352722168, "global_step": 45912, "epoch": 553} {"train_loss": -19.55092430114746, "global_step": 45913, "epoch": 553} {"train_loss": -19.824542999267578, "global_step": 45914, "epoch": 553} {"train_loss": -19.503501892089844, "global_step": 45915, "epoch": 553} {"train_loss": -19.179208755493164, "global_step": 45916, "epoch": 553} {"train_loss": -19.560346603393555, "global_step": 45917, "epoch": 553} {"train_loss": -19.481155395507812, "global_step": 45918, "epoch": 553} {"train_loss": -19.779199600219727, "global_step": 45919, "epoch": 553} {"train_loss": -19.57698631286621, "global_step": 45920, "epoch": 553} {"train_loss": -19.40711212158203, "global_step": 45921, "epoch": 553} {"train_loss": -19.38555908203125, "global_step": 45922, "epoch": 553} {"train_loss": -19.525976181030273, "global_step": 45923, "epoch": 553} {"train_loss": -20.079145431518555, "global_step": 45924, "epoch": 553} {"train_loss": -19.77252197265625, "global_step": 45925, "epoch": 553} {"train_loss": -20.097190856933594, "global_step": 45926, "epoch": 553} {"train_loss": -19.64133644104004, "global_step": 45927, "epoch": 553} {"train_loss": -19.544958114624023, "global_step": 45928, "epoch": 553} {"train_loss": -19.690542221069336, "global_step": 45929, "epoch": 553} {"train_loss": -20.02864646911621, "global_step": 45930, "epoch": 553} {"train_loss": -19.924610137939453, "global_step": 45931, "epoch": 553} {"train_loss": -19.692686080932617, "global_step": 45932, "epoch": 553} {"train_loss": -19.747987747192383, "global_step": 45933, "epoch": 553} {"train_loss": -19.935049057006836, "global_step": 45934, "epoch": 553} {"train_loss": -19.636789321899414, "global_step": 45935, "epoch": 553} {"train_loss": -19.4279727935791, "global_step": 45936, "epoch": 553} {"train_loss": -19.706655502319336, "global_step": 45937, "epoch": 553} {"train_loss": -19.69207191467285, "global_step": 45938, "epoch": 553} {"train_loss": -19.70339012145996, "global_step": 45939, "epoch": 553} {"train_loss": -20.026233673095703, "global_step": 45940, "epoch": 553} {"train_loss": -19.72855567932129, "global_step": 45941, "epoch": 553} {"train_loss": -19.628326416015625, "global_step": 45942, "epoch": 553} {"train_loss": -19.91413688659668, "global_step": 45943, "epoch": 553} {"train_loss": -19.757984161376953, "global_step": 45944, "epoch": 553} {"train_loss": -19.706817626953125, "global_step": 45945, "epoch": 553} {"train_loss": -19.855661392211914, "global_step": 45946, "epoch": 553} {"train_loss": -19.948347091674805, "global_step": 45947, "epoch": 553} {"train_loss": -19.807723999023438, "global_step": 45948, "epoch": 553} {"train_loss": -19.672773361206055, "global_step": 45949, "epoch": 553} {"train_loss": -19.46258544921875, "global_step": 45950, "epoch": 553} {"train_loss": -19.98296356201172, "global_step": 45951, "epoch": 553} {"train_loss": -19.360654830932617, "global_step": 45952, "epoch": 553} {"train_loss": -19.86751365661621, "global_step": 45953, "epoch": 553} {"train_loss": -19.93897819519043, "global_step": 45954, "epoch": 553} {"train_loss": -19.55221939086914, "global_step": 45955, "epoch": 553} {"train_loss": -19.523717880249023, "global_step": 45956, "epoch": 553} {"train_loss": -19.85626792907715, "global_step": 45957, "epoch": 553} {"train_loss": -19.610584259033203, "global_step": 45958, "epoch": 553} {"train_loss": -20.01484489440918, "global_step": 45959, "epoch": 553} {"train_loss": -20.046314239501953, "global_step": 45960, "epoch": 553} {"train_loss": -19.983537673950195, "global_step": 45961, "epoch": 553} {"train_loss": -19.898916244506836, "global_step": 45962, "epoch": 553} {"train_loss": -19.56928825378418, "global_step": 45963, "epoch": 553} {"train_loss": -19.61553955078125, "global_step": 45964, "epoch": 553} {"train_loss": -19.637197494506836, "global_step": 45965, "epoch": 553} {"train_loss": -19.57543182373047, "global_step": 45966, "epoch": 553} {"train_loss": -20.234888076782227, "global_step": 45967, "epoch": 553} {"train_loss": -19.46201515197754, "global_step": 45968, "epoch": 553} {"train_loss": -20.025781631469727, "global_step": 45969, "epoch": 553} {"train_loss": -19.9582576751709, "global_step": 45970, "epoch": 553} {"train_loss": -19.811214447021484, "global_step": 45971, "epoch": 553} {"train_loss": -20.043331146240234, "global_step": 45972, "epoch": 553} {"train_loss": -19.82694435119629, "global_step": 45973, "epoch": 553} {"train_loss": -19.925277709960938, "global_step": 45974, "epoch": 553} {"train_loss": -19.922361373901367, "global_step": 45975, "epoch": 553} {"train_loss": -19.769245147705078, "global_step": 45976, "epoch": 553} {"train_loss": -19.344200134277344, "global_step": 45977, "epoch": 553} {"train_loss": -19.788602828979492, "global_step": 45978, "epoch": 553} {"train_loss": -19.602680206298828, "global_step": 45979, "epoch": 553} {"train_loss": -19.802127838134766, "global_step": 45980, "epoch": 553} {"train_loss": -19.710119615118188, "global_step": 45981, "epoch": 553, "val_loss": 5991326.0} {"train_loss": -19.2086181640625, "global_step": 45982, "epoch": 554} {"train_loss": -19.363298416137695, "global_step": 45983, "epoch": 554} {"train_loss": -19.52675437927246, "global_step": 45984, "epoch": 554} {"train_loss": -19.257247924804688, "global_step": 45985, "epoch": 554} {"train_loss": -19.213687896728516, "global_step": 45986, "epoch": 554} {"train_loss": -19.54849624633789, "global_step": 45987, "epoch": 554} {"train_loss": -19.555906295776367, "global_step": 45988, "epoch": 554} {"train_loss": -19.575212478637695, "global_step": 45989, "epoch": 554} {"train_loss": -19.750083923339844, "global_step": 45990, "epoch": 554} {"train_loss": -19.385507583618164, "global_step": 45991, "epoch": 554} {"train_loss": -19.094858169555664, "global_step": 45992, "epoch": 554} {"train_loss": -19.59758758544922, "global_step": 45993, "epoch": 554} {"train_loss": -19.88196563720703, "global_step": 45994, "epoch": 554} {"train_loss": -19.525495529174805, "global_step": 45995, "epoch": 554} {"train_loss": -19.2539119720459, "global_step": 45996, "epoch": 554} {"train_loss": -19.921220779418945, "global_step": 45997, "epoch": 554} {"train_loss": -19.76997947692871, "global_step": 45998, "epoch": 554} {"train_loss": -19.618579864501953, "global_step": 45999, "epoch": 554} {"train_loss": -19.56600570678711, "global_step": 46000, "epoch": 554} {"train_loss": -19.795156478881836, "global_step": 46001, "epoch": 554} {"train_loss": -19.603010177612305, "global_step": 46002, "epoch": 554} {"train_loss": -19.94114112854004, "global_step": 46003, "epoch": 554} {"train_loss": -19.898658752441406, "global_step": 46004, "epoch": 554} {"train_loss": -19.575780868530273, "global_step": 46005, "epoch": 554} {"train_loss": -19.547346115112305, "global_step": 46006, "epoch": 554} {"train_loss": -19.805999755859375, "global_step": 46007, "epoch": 554} {"train_loss": -19.807767868041992, "global_step": 46008, "epoch": 554} {"train_loss": -19.928335189819336, "global_step": 46009, "epoch": 554} {"train_loss": -19.614355087280273, "global_step": 46010, "epoch": 554} {"train_loss": -19.3349552154541, "global_step": 46011, "epoch": 554} {"train_loss": -19.842687606811523, "global_step": 46012, "epoch": 554} {"train_loss": -19.862993240356445, "global_step": 46013, "epoch": 554} {"train_loss": -19.893308639526367, "global_step": 46014, "epoch": 554} {"train_loss": -19.70540428161621, "global_step": 46015, "epoch": 554} {"train_loss": -19.60208511352539, "global_step": 46016, "epoch": 554} {"train_loss": -19.50713348388672, "global_step": 46017, "epoch": 554} {"train_loss": -19.959924697875977, "global_step": 46018, "epoch": 554} {"train_loss": -19.98785972595215, "global_step": 46019, "epoch": 554} {"train_loss": -19.618366241455078, "global_step": 46020, "epoch": 554} {"train_loss": -19.54424476623535, "global_step": 46021, "epoch": 554} {"train_loss": -19.607635498046875, "global_step": 46022, "epoch": 554} {"train_loss": -19.652847290039062, "global_step": 46023, "epoch": 554} {"train_loss": -19.675256729125977, "global_step": 46024, "epoch": 554} {"train_loss": -19.717504501342773, "global_step": 46025, "epoch": 554} {"train_loss": -19.639511108398438, "global_step": 46026, "epoch": 554} {"train_loss": -19.574337005615234, "global_step": 46027, "epoch": 554} {"train_loss": -19.727005004882812, "global_step": 46028, "epoch": 554} {"train_loss": -20.062597274780273, "global_step": 46029, "epoch": 554} {"train_loss": -19.706832885742188, "global_step": 46030, "epoch": 554} {"train_loss": -19.898313522338867, "global_step": 46031, "epoch": 554} {"train_loss": -19.723173141479492, "global_step": 46032, "epoch": 554} {"train_loss": -19.626169204711914, "global_step": 46033, "epoch": 554} {"train_loss": -19.987476348876953, "global_step": 46034, "epoch": 554} {"train_loss": -19.827903747558594, "global_step": 46035, "epoch": 554} {"train_loss": -19.43866729736328, "global_step": 46036, "epoch": 554} {"train_loss": -19.89590835571289, "global_step": 46037, "epoch": 554} {"train_loss": -19.765241622924805, "global_step": 46038, "epoch": 554} {"train_loss": -19.83370590209961, "global_step": 46039, "epoch": 554} {"train_loss": -20.149045944213867, "global_step": 46040, "epoch": 554} {"train_loss": -19.758256912231445, "global_step": 46041, "epoch": 554} {"train_loss": -20.026561737060547, "global_step": 46042, "epoch": 554} {"train_loss": -19.55085563659668, "global_step": 46043, "epoch": 554} {"train_loss": -20.15049171447754, "global_step": 46044, "epoch": 554} {"train_loss": -19.492782592773438, "global_step": 46045, "epoch": 554} {"train_loss": -19.659751892089844, "global_step": 46046, "epoch": 554} {"train_loss": -19.64956283569336, "global_step": 46047, "epoch": 554} {"train_loss": -19.89768409729004, "global_step": 46048, "epoch": 554} {"train_loss": -20.12811279296875, "global_step": 46049, "epoch": 554} {"train_loss": -19.7512149810791, "global_step": 46050, "epoch": 554} {"train_loss": -19.672574996948242, "global_step": 46051, "epoch": 554} {"train_loss": -19.375497817993164, "global_step": 46052, "epoch": 554} {"train_loss": -19.766298294067383, "global_step": 46053, "epoch": 554} {"train_loss": -19.64214515686035, "global_step": 46054, "epoch": 554} {"train_loss": -19.861867904663086, "global_step": 46055, "epoch": 554} {"train_loss": -19.541563034057617, "global_step": 46056, "epoch": 554} {"train_loss": -19.991958618164062, "global_step": 46057, "epoch": 554} {"train_loss": -19.70028305053711, "global_step": 46058, "epoch": 554} {"train_loss": -19.569732666015625, "global_step": 46059, "epoch": 554} {"train_loss": -19.555805206298828, "global_step": 46060, "epoch": 554} {"train_loss": -19.747037887573242, "global_step": 46061, "epoch": 554} {"train_loss": -19.96735191345215, "global_step": 46062, "epoch": 554} {"train_loss": -19.641691207885742, "global_step": 46063, "epoch": 554} {"train_loss": -19.688828663653638, "global_step": 46064, "epoch": 554, "val_loss": 6041411.0} {"train_loss": -19.294946670532227, "global_step": 46065, "epoch": 555} {"train_loss": -19.641212463378906, "global_step": 46066, "epoch": 555} {"train_loss": -19.602115631103516, "global_step": 46067, "epoch": 555} {"train_loss": -19.30394744873047, "global_step": 46068, "epoch": 555} {"train_loss": -19.1756591796875, "global_step": 46069, "epoch": 555} {"train_loss": -19.30537986755371, "global_step": 46070, "epoch": 555} {"train_loss": -19.834638595581055, "global_step": 46071, "epoch": 555} {"train_loss": -19.46955680847168, "global_step": 46072, "epoch": 555} {"train_loss": -19.65742301940918, "global_step": 46073, "epoch": 555} {"train_loss": -19.91629409790039, "global_step": 46074, "epoch": 555} {"train_loss": -19.71137809753418, "global_step": 46075, "epoch": 555} {"train_loss": -19.895654678344727, "global_step": 46076, "epoch": 555} {"train_loss": -19.579925537109375, "global_step": 46077, "epoch": 555} {"train_loss": -19.445308685302734, "global_step": 46078, "epoch": 555} {"train_loss": -19.755048751831055, "global_step": 46079, "epoch": 555} {"train_loss": -19.697402954101562, "global_step": 46080, "epoch": 555} {"train_loss": -19.86545753479004, "global_step": 46081, "epoch": 555} {"train_loss": -19.918790817260742, "global_step": 46082, "epoch": 555} {"train_loss": -19.671436309814453, "global_step": 46083, "epoch": 555} {"train_loss": -19.577219009399414, "global_step": 46084, "epoch": 555} {"train_loss": -20.043119430541992, "global_step": 46085, "epoch": 555} {"train_loss": -19.836217880249023, "global_step": 46086, "epoch": 555} {"train_loss": -19.861600875854492, "global_step": 46087, "epoch": 555} {"train_loss": -19.848541259765625, "global_step": 46088, "epoch": 555} {"train_loss": -19.50697898864746, "global_step": 46089, "epoch": 555} {"train_loss": -19.97434425354004, "global_step": 46090, "epoch": 555} {"train_loss": -19.24244499206543, "global_step": 46091, "epoch": 555} {"train_loss": -19.939208984375, "global_step": 46092, "epoch": 555} {"train_loss": -20.000036239624023, "global_step": 46093, "epoch": 555} {"train_loss": -19.80745506286621, "global_step": 46094, "epoch": 555} {"train_loss": -19.75270652770996, "global_step": 46095, "epoch": 555} {"train_loss": -19.665719985961914, "global_step": 46096, "epoch": 555} {"train_loss": -19.98019790649414, "global_step": 46097, "epoch": 555} {"train_loss": -20.179269790649414, "global_step": 46098, "epoch": 555} {"train_loss": -20.10856056213379, "global_step": 46099, "epoch": 555} {"train_loss": -19.760709762573242, "global_step": 46100, "epoch": 555} {"train_loss": -19.59771156311035, "global_step": 46101, "epoch": 555} {"train_loss": -19.751224517822266, "global_step": 46102, "epoch": 555} {"train_loss": -19.68528175354004, "global_step": 46103, "epoch": 555} {"train_loss": -19.397886276245117, "global_step": 46104, "epoch": 555} {"train_loss": -19.32403564453125, "global_step": 46105, "epoch": 555} {"train_loss": -19.688295364379883, "global_step": 46106, "epoch": 555} {"train_loss": -19.82280921936035, "global_step": 46107, "epoch": 555} {"train_loss": -19.374340057373047, "global_step": 46108, "epoch": 555} {"train_loss": -19.883041381835938, "global_step": 46109, "epoch": 555} {"train_loss": -19.67176628112793, "global_step": 46110, "epoch": 555} {"train_loss": -19.557514190673828, "global_step": 46111, "epoch": 555} {"train_loss": -19.642112731933594, "global_step": 46112, "epoch": 555} {"train_loss": -19.616817474365234, "global_step": 46113, "epoch": 555} {"train_loss": -19.736520767211914, "global_step": 46114, "epoch": 555} {"train_loss": -19.792306900024414, "global_step": 46115, "epoch": 555} {"train_loss": -19.987646102905273, "global_step": 46116, "epoch": 555} {"train_loss": -19.687862396240234, "global_step": 46117, "epoch": 555} {"train_loss": -19.751401901245117, "global_step": 46118, "epoch": 555} {"train_loss": -19.856842041015625, "global_step": 46119, "epoch": 555} {"train_loss": -19.847253799438477, "global_step": 46120, "epoch": 555} {"train_loss": -19.26557159423828, "global_step": 46121, "epoch": 555} {"train_loss": -19.374902725219727, "global_step": 46122, "epoch": 555} {"train_loss": -19.900955200195312, "global_step": 46123, "epoch": 555} {"train_loss": -19.89392852783203, "global_step": 46124, "epoch": 555} {"train_loss": -19.808603286743164, "global_step": 46125, "epoch": 555} {"train_loss": -19.943944931030273, "global_step": 46126, "epoch": 555} {"train_loss": -19.96816062927246, "global_step": 46127, "epoch": 555} {"train_loss": -19.834300994873047, "global_step": 46128, "epoch": 555} {"train_loss": -19.974075317382812, "global_step": 46129, "epoch": 555} {"train_loss": -19.807809829711914, "global_step": 46130, "epoch": 555} {"train_loss": -19.99410629272461, "global_step": 46131, "epoch": 555} {"train_loss": -19.86433219909668, "global_step": 46132, "epoch": 555} {"train_loss": -19.573144912719727, "global_step": 46133, "epoch": 555} {"train_loss": -19.70076560974121, "global_step": 46134, "epoch": 555} {"train_loss": -19.87688446044922, "global_step": 46135, "epoch": 555} {"train_loss": -19.633060455322266, "global_step": 46136, "epoch": 555} {"train_loss": -19.584121704101562, "global_step": 46137, "epoch": 555} {"train_loss": -19.706809997558594, "global_step": 46138, "epoch": 555} {"train_loss": -19.651887893676758, "global_step": 46139, "epoch": 555} {"train_loss": -19.327299118041992, "global_step": 46140, "epoch": 555} {"train_loss": -19.958206176757812, "global_step": 46141, "epoch": 555} {"train_loss": -19.52052879333496, "global_step": 46142, "epoch": 555} {"train_loss": -20.138830184936523, "global_step": 46143, "epoch": 555} {"train_loss": -19.468000411987305, "global_step": 46144, "epoch": 555} {"train_loss": -19.739784240722656, "global_step": 46145, "epoch": 555} {"train_loss": -19.444326400756836, "global_step": 46146, "epoch": 555} {"train_loss": -19.718147645513696, "global_step": 46147, "epoch": 555, "val_loss": 6113748.0} {"train_loss": -19.375829696655273, "global_step": 46148, "epoch": 556} {"train_loss": -19.608396530151367, "global_step": 46149, "epoch": 556} {"train_loss": -19.634418487548828, "global_step": 46150, "epoch": 556} {"train_loss": -19.60833168029785, "global_step": 46151, "epoch": 556} {"train_loss": -19.24020004272461, "global_step": 46152, "epoch": 556} {"train_loss": -19.88627052307129, "global_step": 46153, "epoch": 556} {"train_loss": -19.535093307495117, "global_step": 46154, "epoch": 556} {"train_loss": -19.442617416381836, "global_step": 46155, "epoch": 556} {"train_loss": -19.814807891845703, "global_step": 46156, "epoch": 556} {"train_loss": -19.797183990478516, "global_step": 46157, "epoch": 556} {"train_loss": -19.591516494750977, "global_step": 46158, "epoch": 556} {"train_loss": -19.527509689331055, "global_step": 46159, "epoch": 556} {"train_loss": -19.395742416381836, "global_step": 46160, "epoch": 556} {"train_loss": -19.512832641601562, "global_step": 46161, "epoch": 556} {"train_loss": -19.985401153564453, "global_step": 46162, "epoch": 556} {"train_loss": -19.091371536254883, "global_step": 46163, "epoch": 556} {"train_loss": -19.33329200744629, "global_step": 46164, "epoch": 556} {"train_loss": -19.355955123901367, "global_step": 46165, "epoch": 556} {"train_loss": -19.640487670898438, "global_step": 46166, "epoch": 556} {"train_loss": -19.779096603393555, "global_step": 46167, "epoch": 556} {"train_loss": -19.86343765258789, "global_step": 46168, "epoch": 556} {"train_loss": -19.5417537689209, "global_step": 46169, "epoch": 556} {"train_loss": -19.73664093017578, "global_step": 46170, "epoch": 556} {"train_loss": -19.810285568237305, "global_step": 46171, "epoch": 556} {"train_loss": -19.59456443786621, "global_step": 46172, "epoch": 556} {"train_loss": -19.558916091918945, "global_step": 46173, "epoch": 556} {"train_loss": -19.831716537475586, "global_step": 46174, "epoch": 556} {"train_loss": -19.294706344604492, "global_step": 46175, "epoch": 556} {"train_loss": -19.621877670288086, "global_step": 46176, "epoch": 556} {"train_loss": -19.91483497619629, "global_step": 46177, "epoch": 556} {"train_loss": -20.040241241455078, "global_step": 46178, "epoch": 556} {"train_loss": -19.31693458557129, "global_step": 46179, "epoch": 556} {"train_loss": -19.46526527404785, "global_step": 46180, "epoch": 556} {"train_loss": -19.850473403930664, "global_step": 46181, "epoch": 556} {"train_loss": -19.565847396850586, "global_step": 46182, "epoch": 556} {"train_loss": -20.075124740600586, "global_step": 46183, "epoch": 556} {"train_loss": -19.721097946166992, "global_step": 46184, "epoch": 556} {"train_loss": -19.97146224975586, "global_step": 46185, "epoch": 556} {"train_loss": -19.882484436035156, "global_step": 46186, "epoch": 556} {"train_loss": -20.138349533081055, "global_step": 46187, "epoch": 556} {"train_loss": -19.920087814331055, "global_step": 46188, "epoch": 556} {"train_loss": -20.00075340270996, "global_step": 46189, "epoch": 556} {"train_loss": -19.447309494018555, "global_step": 46190, "epoch": 556} {"train_loss": -19.716482162475586, "global_step": 46191, "epoch": 556} {"train_loss": -19.86347770690918, "global_step": 46192, "epoch": 556} {"train_loss": -19.614782333374023, "global_step": 46193, "epoch": 556} {"train_loss": -19.906587600708008, "global_step": 46194, "epoch": 556} {"train_loss": -19.945423126220703, "global_step": 46195, "epoch": 556} {"train_loss": -19.955400466918945, "global_step": 46196, "epoch": 556} {"train_loss": -19.812091827392578, "global_step": 46197, "epoch": 556} {"train_loss": -19.810026168823242, "global_step": 46198, "epoch": 556} {"train_loss": -19.74742317199707, "global_step": 46199, "epoch": 556} {"train_loss": -19.52927589416504, "global_step": 46200, "epoch": 556} {"train_loss": -20.24598503112793, "global_step": 46201, "epoch": 556} {"train_loss": -19.910995483398438, "global_step": 46202, "epoch": 556} {"train_loss": -19.825016021728516, "global_step": 46203, "epoch": 556} {"train_loss": -19.95712661743164, "global_step": 46204, "epoch": 556} {"train_loss": -19.947223663330078, "global_step": 46205, "epoch": 556} {"train_loss": -19.76252555847168, "global_step": 46206, "epoch": 556} {"train_loss": -20.017202377319336, "global_step": 46207, "epoch": 556} {"train_loss": -19.971479415893555, "global_step": 46208, "epoch": 556} {"train_loss": -19.69925308227539, "global_step": 46209, "epoch": 556} {"train_loss": -19.624576568603516, "global_step": 46210, "epoch": 556} {"train_loss": -20.007858276367188, "global_step": 46211, "epoch": 556} {"train_loss": -19.742996215820312, "global_step": 46212, "epoch": 556} {"train_loss": -19.842275619506836, "global_step": 46213, "epoch": 556} {"train_loss": -19.50262451171875, "global_step": 46214, "epoch": 556} {"train_loss": -19.718124389648438, "global_step": 46215, "epoch": 556} {"train_loss": -19.7486629486084, "global_step": 46216, "epoch": 556} {"train_loss": -19.783771514892578, "global_step": 46217, "epoch": 556} {"train_loss": -20.093435287475586, "global_step": 46218, "epoch": 556} {"train_loss": -20.30915641784668, "global_step": 46219, "epoch": 556} {"train_loss": -19.822429656982422, "global_step": 46220, "epoch": 556} {"train_loss": -19.585983276367188, "global_step": 46221, "epoch": 556} {"train_loss": -19.538726806640625, "global_step": 46222, "epoch": 556} {"train_loss": -19.83573341369629, "global_step": 46223, "epoch": 556} {"train_loss": -19.462343215942383, "global_step": 46224, "epoch": 556} {"train_loss": -19.81915283203125, "global_step": 46225, "epoch": 556} {"train_loss": -19.502817153930664, "global_step": 46226, "epoch": 556} {"train_loss": -19.88801383972168, "global_step": 46227, "epoch": 556} {"train_loss": -19.56144905090332, "global_step": 46228, "epoch": 556} {"train_loss": -19.71552085876465, "global_step": 46229, "epoch": 556} {"train_loss": -19.74493626514113, "global_step": 46230, "epoch": 556, "val_loss": 5976296.0} {"train_loss": -19.714492797851562, "global_step": 46231, "epoch": 557} {"train_loss": -19.573827743530273, "global_step": 46232, "epoch": 557} {"train_loss": -19.578474044799805, "global_step": 46233, "epoch": 557} {"train_loss": -19.371545791625977, "global_step": 46234, "epoch": 557} {"train_loss": -19.984506607055664, "global_step": 46235, "epoch": 557} {"train_loss": -19.2758731842041, "global_step": 46236, "epoch": 557} {"train_loss": -19.451574325561523, "global_step": 46237, "epoch": 557} {"train_loss": -19.491899490356445, "global_step": 46238, "epoch": 557} {"train_loss": -19.864423751831055, "global_step": 46239, "epoch": 557} {"train_loss": -19.57264518737793, "global_step": 46240, "epoch": 557} {"train_loss": -19.415485382080078, "global_step": 46241, "epoch": 557} {"train_loss": -19.7612361907959, "global_step": 46242, "epoch": 557} {"train_loss": -20.02461051940918, "global_step": 46243, "epoch": 557} {"train_loss": -19.786640167236328, "global_step": 46244, "epoch": 557} {"train_loss": -19.577184677124023, "global_step": 46245, "epoch": 557} {"train_loss": -20.018674850463867, "global_step": 46246, "epoch": 557} {"train_loss": -19.534494400024414, "global_step": 46247, "epoch": 557} {"train_loss": -19.77646827697754, "global_step": 46248, "epoch": 557} {"train_loss": -19.704145431518555, "global_step": 46249, "epoch": 557} {"train_loss": -19.765981674194336, "global_step": 46250, "epoch": 557} {"train_loss": -19.60698890686035, "global_step": 46251, "epoch": 557} {"train_loss": -19.4915771484375, "global_step": 46252, "epoch": 557} {"train_loss": -19.51039695739746, "global_step": 46253, "epoch": 557} {"train_loss": -19.598108291625977, "global_step": 46254, "epoch": 557} {"train_loss": -19.75710678100586, "global_step": 46255, "epoch": 557} {"train_loss": -19.880224227905273, "global_step": 46256, "epoch": 557} {"train_loss": -19.706995010375977, "global_step": 46257, "epoch": 557} {"train_loss": -19.951589584350586, "global_step": 46258, "epoch": 557} {"train_loss": -19.83363914489746, "global_step": 46259, "epoch": 557} {"train_loss": -19.535953521728516, "global_step": 46260, "epoch": 557} {"train_loss": -20.196189880371094, "global_step": 46261, "epoch": 557} {"train_loss": -19.472854614257812, "global_step": 46262, "epoch": 557} {"train_loss": -20.147794723510742, "global_step": 46263, "epoch": 557} {"train_loss": -19.8457088470459, "global_step": 46264, "epoch": 557} {"train_loss": -20.03143310546875, "global_step": 46265, "epoch": 557} {"train_loss": -19.646631240844727, "global_step": 46266, "epoch": 557} {"train_loss": -19.639785766601562, "global_step": 46267, "epoch": 557} {"train_loss": -20.006742477416992, "global_step": 46268, "epoch": 557} {"train_loss": -19.588584899902344, "global_step": 46269, "epoch": 557} {"train_loss": -19.935400009155273, "global_step": 46270, "epoch": 557} {"train_loss": -19.896591186523438, "global_step": 46271, "epoch": 557} {"train_loss": -19.768470764160156, "global_step": 46272, "epoch": 557} {"train_loss": -19.904083251953125, "global_step": 46273, "epoch": 557} {"train_loss": -19.87468910217285, "global_step": 46274, "epoch": 557} {"train_loss": -19.696950912475586, "global_step": 46275, "epoch": 557} {"train_loss": -19.586288452148438, "global_step": 46276, "epoch": 557} {"train_loss": -19.401548385620117, "global_step": 46277, "epoch": 557} {"train_loss": -20.119644165039062, "global_step": 46278, "epoch": 557} {"train_loss": -19.63624382019043, "global_step": 46279, "epoch": 557} {"train_loss": -19.651227951049805, "global_step": 46280, "epoch": 557} {"train_loss": -19.343952178955078, "global_step": 46281, "epoch": 557} {"train_loss": -19.752227783203125, "global_step": 46282, "epoch": 557} {"train_loss": -20.211339950561523, "global_step": 46283, "epoch": 557} {"train_loss": -19.52980613708496, "global_step": 46284, "epoch": 557} {"train_loss": -19.543962478637695, "global_step": 46285, "epoch": 557} {"train_loss": -19.50897789001465, "global_step": 46286, "epoch": 557} {"train_loss": -19.991342544555664, "global_step": 46287, "epoch": 557} {"train_loss": -19.767059326171875, "global_step": 46288, "epoch": 557} {"train_loss": -20.160358428955078, "global_step": 46289, "epoch": 557} {"train_loss": -19.638004302978516, "global_step": 46290, "epoch": 557} {"train_loss": -19.444055557250977, "global_step": 46291, "epoch": 557} {"train_loss": -19.8201847076416, "global_step": 46292, "epoch": 557} {"train_loss": -19.733732223510742, "global_step": 46293, "epoch": 557} {"train_loss": -19.538358688354492, "global_step": 46294, "epoch": 557} {"train_loss": -19.755949020385742, "global_step": 46295, "epoch": 557} {"train_loss": -19.838088989257812, "global_step": 46296, "epoch": 557} {"train_loss": -19.715349197387695, "global_step": 46297, "epoch": 557} {"train_loss": -19.43330192565918, "global_step": 46298, "epoch": 557} {"train_loss": -19.792814254760742, "global_step": 46299, "epoch": 557} {"train_loss": -19.52155303955078, "global_step": 46300, "epoch": 557} {"train_loss": -19.397628784179688, "global_step": 46301, "epoch": 557} {"train_loss": -19.837066650390625, "global_step": 46302, "epoch": 557} {"train_loss": -19.614871978759766, "global_step": 46303, "epoch": 557} {"train_loss": -19.38462257385254, "global_step": 46304, "epoch": 557} {"train_loss": -20.055978775024414, "global_step": 46305, "epoch": 557} {"train_loss": -19.790151596069336, "global_step": 46306, "epoch": 557} {"train_loss": -20.033395767211914, "global_step": 46307, "epoch": 557} {"train_loss": -19.827472686767578, "global_step": 46308, "epoch": 557} {"train_loss": -19.83411407470703, "global_step": 46309, "epoch": 557} {"train_loss": -19.928691864013672, "global_step": 46310, "epoch": 557} {"train_loss": -19.753629684448242, "global_step": 46311, "epoch": 557} {"train_loss": -19.62472915649414, "global_step": 46312, "epoch": 557} {"train_loss": -19.717975662415284, "global_step": 46313, "epoch": 557, "val_loss": 5906275.5} {"train_loss": -19.155181884765625, "global_step": 46314, "epoch": 558} {"train_loss": -19.734983444213867, "global_step": 46315, "epoch": 558} {"train_loss": -19.177488327026367, "global_step": 46316, "epoch": 558} {"train_loss": -19.72899627685547, "global_step": 46317, "epoch": 558} {"train_loss": -19.5718994140625, "global_step": 46318, "epoch": 558} {"train_loss": -19.749544143676758, "global_step": 46319, "epoch": 558} {"train_loss": -19.536828994750977, "global_step": 46320, "epoch": 558} {"train_loss": -19.36575698852539, "global_step": 46321, "epoch": 558} {"train_loss": -19.711822509765625, "global_step": 46322, "epoch": 558} {"train_loss": -19.846635818481445, "global_step": 46323, "epoch": 558} {"train_loss": -19.91872215270996, "global_step": 46324, "epoch": 558} {"train_loss": -19.9222412109375, "global_step": 46325, "epoch": 558} {"train_loss": -19.83078956604004, "global_step": 46326, "epoch": 558} {"train_loss": -20.006614685058594, "global_step": 46327, "epoch": 558} {"train_loss": -19.841392517089844, "global_step": 46328, "epoch": 558} {"train_loss": -19.891969680786133, "global_step": 46329, "epoch": 558} {"train_loss": -19.706531524658203, "global_step": 46330, "epoch": 558} {"train_loss": -19.477041244506836, "global_step": 46331, "epoch": 558} {"train_loss": -20.27035903930664, "global_step": 46332, "epoch": 558} {"train_loss": -19.782621383666992, "global_step": 46333, "epoch": 558} {"train_loss": -19.807722091674805, "global_step": 46334, "epoch": 558} {"train_loss": -19.82252311706543, "global_step": 46335, "epoch": 558} {"train_loss": -19.809417724609375, "global_step": 46336, "epoch": 558} {"train_loss": -19.888566970825195, "global_step": 46337, "epoch": 558} {"train_loss": -20.033111572265625, "global_step": 46338, "epoch": 558} {"train_loss": -19.93308448791504, "global_step": 46339, "epoch": 558} {"train_loss": -19.490785598754883, "global_step": 46340, "epoch": 558} {"train_loss": -19.727649688720703, "global_step": 46341, "epoch": 558} {"train_loss": -20.104022979736328, "global_step": 46342, "epoch": 558} {"train_loss": -19.425556182861328, "global_step": 46343, "epoch": 558} {"train_loss": -19.696380615234375, "global_step": 46344, "epoch": 558} {"train_loss": -20.007383346557617, "global_step": 46345, "epoch": 558} {"train_loss": -19.794315338134766, "global_step": 46346, "epoch": 558} {"train_loss": -19.85524559020996, "global_step": 46347, "epoch": 558} {"train_loss": -19.721172332763672, "global_step": 46348, "epoch": 558} {"train_loss": -19.631916046142578, "global_step": 46349, "epoch": 558} {"train_loss": -19.76453971862793, "global_step": 46350, "epoch": 558} {"train_loss": -19.645057678222656, "global_step": 46351, "epoch": 558} {"train_loss": -19.827789306640625, "global_step": 46352, "epoch": 558} {"train_loss": -19.88235855102539, "global_step": 46353, "epoch": 558} {"train_loss": -19.626787185668945, "global_step": 46354, "epoch": 558} {"train_loss": -19.438358306884766, "global_step": 46355, "epoch": 558} {"train_loss": -19.705257415771484, "global_step": 46356, "epoch": 558} {"train_loss": -19.622892379760742, "global_step": 46357, "epoch": 558} {"train_loss": -19.64277458190918, "global_step": 46358, "epoch": 558} {"train_loss": -19.874961853027344, "global_step": 46359, "epoch": 558} {"train_loss": -19.82801055908203, "global_step": 46360, "epoch": 558} {"train_loss": -20.018117904663086, "global_step": 46361, "epoch": 558} {"train_loss": -19.937358856201172, "global_step": 46362, "epoch": 558} {"train_loss": -19.86102867126465, "global_step": 46363, "epoch": 558} {"train_loss": -19.82295036315918, "global_step": 46364, "epoch": 558} {"train_loss": -19.802976608276367, "global_step": 46365, "epoch": 558} {"train_loss": -19.906335830688477, "global_step": 46366, "epoch": 558} {"train_loss": -19.695051193237305, "global_step": 46367, "epoch": 558} {"train_loss": -19.867252349853516, "global_step": 46368, "epoch": 558} {"train_loss": -20.039146423339844, "global_step": 46369, "epoch": 558} {"train_loss": -19.47600746154785, "global_step": 46370, "epoch": 558} {"train_loss": -19.761066436767578, "global_step": 46371, "epoch": 558} {"train_loss": -19.9007625579834, "global_step": 46372, "epoch": 558} {"train_loss": -19.787734985351562, "global_step": 46373, "epoch": 558} {"train_loss": -20.033506393432617, "global_step": 46374, "epoch": 558} {"train_loss": -19.843015670776367, "global_step": 46375, "epoch": 558} {"train_loss": -19.67437744140625, "global_step": 46376, "epoch": 558} {"train_loss": -19.566543579101562, "global_step": 46377, "epoch": 558} {"train_loss": -19.784635543823242, "global_step": 46378, "epoch": 558} {"train_loss": -20.00539207458496, "global_step": 46379, "epoch": 558} {"train_loss": -19.509349822998047, "global_step": 46380, "epoch": 558} {"train_loss": -19.947036743164062, "global_step": 46381, "epoch": 558} {"train_loss": -20.005277633666992, "global_step": 46382, "epoch": 558} {"train_loss": -19.870351791381836, "global_step": 46383, "epoch": 558} {"train_loss": -19.77987289428711, "global_step": 46384, "epoch": 558} {"train_loss": -19.843847274780273, "global_step": 46385, "epoch": 558} {"train_loss": -19.479028701782227, "global_step": 46386, "epoch": 558} {"train_loss": -19.667165756225586, "global_step": 46387, "epoch": 558} {"train_loss": -19.887359619140625, "global_step": 46388, "epoch": 558} {"train_loss": -19.768949508666992, "global_step": 46389, "epoch": 558} {"train_loss": -19.95649528503418, "global_step": 46390, "epoch": 558} {"train_loss": -19.61811637878418, "global_step": 46391, "epoch": 558} {"train_loss": -19.438865661621094, "global_step": 46392, "epoch": 558} {"train_loss": -19.798309326171875, "global_step": 46393, "epoch": 558} {"train_loss": -19.698240280151367, "global_step": 46394, "epoch": 558} {"train_loss": -20.008832931518555, "global_step": 46395, "epoch": 558} {"train_loss": -19.774963930428747, "global_step": 46396, "epoch": 558, "val_loss": 6022742.0} {"train_loss": -19.113285064697266, "global_step": 46397, "epoch": 559} {"train_loss": -19.635303497314453, "global_step": 46398, "epoch": 559} {"train_loss": -19.512723922729492, "global_step": 46399, "epoch": 559} {"train_loss": -19.81904411315918, "global_step": 46400, "epoch": 559} {"train_loss": -19.76683235168457, "global_step": 46401, "epoch": 559} {"train_loss": -19.643598556518555, "global_step": 46402, "epoch": 559} {"train_loss": -19.629003524780273, "global_step": 46403, "epoch": 559} {"train_loss": -19.803083419799805, "global_step": 46404, "epoch": 559} {"train_loss": -19.766027450561523, "global_step": 46405, "epoch": 559} {"train_loss": -19.889989852905273, "global_step": 46406, "epoch": 559} {"train_loss": -19.59438133239746, "global_step": 46407, "epoch": 559} {"train_loss": -19.564664840698242, "global_step": 46408, "epoch": 559} {"train_loss": -19.72611427307129, "global_step": 46409, "epoch": 559} {"train_loss": -19.75934410095215, "global_step": 46410, "epoch": 559} {"train_loss": -19.67399024963379, "global_step": 46411, "epoch": 559} {"train_loss": -19.88142204284668, "global_step": 46412, "epoch": 559} {"train_loss": -19.927154541015625, "global_step": 46413, "epoch": 559} {"train_loss": -19.685522079467773, "global_step": 46414, "epoch": 559} {"train_loss": -19.777135848999023, "global_step": 46415, "epoch": 559} {"train_loss": -19.728759765625, "global_step": 46416, "epoch": 559} {"train_loss": -19.883981704711914, "global_step": 46417, "epoch": 559} {"train_loss": -19.951339721679688, "global_step": 46418, "epoch": 559} {"train_loss": -19.627920150756836, "global_step": 46419, "epoch": 559} {"train_loss": -19.89627456665039, "global_step": 46420, "epoch": 559} {"train_loss": -19.93231964111328, "global_step": 46421, "epoch": 559} {"train_loss": -19.52968406677246, "global_step": 46422, "epoch": 559} {"train_loss": -20.119619369506836, "global_step": 46423, "epoch": 559} {"train_loss": -19.70773696899414, "global_step": 46424, "epoch": 559} {"train_loss": -20.17287826538086, "global_step": 46425, "epoch": 559} {"train_loss": -19.715333938598633, "global_step": 46426, "epoch": 559} {"train_loss": -19.669479370117188, "global_step": 46427, "epoch": 559} {"train_loss": -19.635318756103516, "global_step": 46428, "epoch": 559} {"train_loss": -19.609540939331055, "global_step": 46429, "epoch": 559} {"train_loss": -19.755212783813477, "global_step": 46430, "epoch": 559} {"train_loss": -19.78085708618164, "global_step": 46431, "epoch": 559} {"train_loss": -19.891664505004883, "global_step": 46432, "epoch": 559} {"train_loss": -19.437665939331055, "global_step": 46433, "epoch": 559} {"train_loss": -19.541288375854492, "global_step": 46434, "epoch": 559} {"train_loss": -19.56098747253418, "global_step": 46435, "epoch": 559} {"train_loss": -19.828393936157227, "global_step": 46436, "epoch": 559} {"train_loss": -20.109317779541016, "global_step": 46437, "epoch": 559} {"train_loss": -20.15345573425293, "global_step": 46438, "epoch": 559} {"train_loss": -19.9848690032959, "global_step": 46439, "epoch": 559} {"train_loss": -19.685224533081055, "global_step": 46440, "epoch": 559} {"train_loss": -19.87397575378418, "global_step": 46441, "epoch": 559} {"train_loss": -19.68916893005371, "global_step": 46442, "epoch": 559} {"train_loss": -19.89864158630371, "global_step": 46443, "epoch": 559} {"train_loss": -19.7852840423584, "global_step": 46444, "epoch": 559} {"train_loss": -19.047391891479492, "global_step": 46445, "epoch": 559} {"train_loss": -19.707202911376953, "global_step": 46446, "epoch": 559} {"train_loss": -19.83563804626465, "global_step": 46447, "epoch": 559} {"train_loss": -19.638307571411133, "global_step": 46448, "epoch": 559} {"train_loss": -19.438274383544922, "global_step": 46449, "epoch": 559} {"train_loss": -19.918338775634766, "global_step": 46450, "epoch": 559} {"train_loss": -19.515165328979492, "global_step": 46451, "epoch": 559} {"train_loss": -19.799457550048828, "global_step": 46452, "epoch": 559} {"train_loss": -19.727128982543945, "global_step": 46453, "epoch": 559} {"train_loss": -19.949399948120117, "global_step": 46454, "epoch": 559} {"train_loss": -20.165395736694336, "global_step": 46455, "epoch": 559} {"train_loss": -19.751821517944336, "global_step": 46456, "epoch": 559} {"train_loss": -19.621667861938477, "global_step": 46457, "epoch": 559} {"train_loss": -19.546798706054688, "global_step": 46458, "epoch": 559} {"train_loss": -19.81976890563965, "global_step": 46459, "epoch": 559} {"train_loss": -19.52855110168457, "global_step": 46460, "epoch": 559} {"train_loss": -19.84662437438965, "global_step": 46461, "epoch": 559} {"train_loss": -19.930648803710938, "global_step": 46462, "epoch": 559} {"train_loss": -19.63633155822754, "global_step": 46463, "epoch": 559} {"train_loss": -19.830068588256836, "global_step": 46464, "epoch": 559} {"train_loss": -19.693321228027344, "global_step": 46465, "epoch": 559} {"train_loss": -19.98639488220215, "global_step": 46466, "epoch": 559} {"train_loss": -19.70888900756836, "global_step": 46467, "epoch": 559} {"train_loss": -19.848941802978516, "global_step": 46468, "epoch": 559} {"train_loss": -19.408613204956055, "global_step": 46469, "epoch": 559} {"train_loss": -19.550853729248047, "global_step": 46470, "epoch": 559} {"train_loss": -20.062835693359375, "global_step": 46471, "epoch": 559} {"train_loss": -19.838239669799805, "global_step": 46472, "epoch": 559} {"train_loss": -19.928409576416016, "global_step": 46473, "epoch": 559} {"train_loss": -19.979429244995117, "global_step": 46474, "epoch": 559} {"train_loss": -19.918872833251953, "global_step": 46475, "epoch": 559} {"train_loss": -19.782215118408203, "global_step": 46476, "epoch": 559} {"train_loss": -19.6381893157959, "global_step": 46477, "epoch": 559} {"train_loss": -19.573833465576172, "global_step": 46478, "epoch": 559} {"train_loss": -19.763111987745905, "global_step": 46479, "epoch": 559, "val_loss": 6043028.0} {"train_loss": -19.72291374206543, "global_step": 46480, "epoch": 560} {"train_loss": -19.84492301940918, "global_step": 46481, "epoch": 560} {"train_loss": -19.648258209228516, "global_step": 46482, "epoch": 560} {"train_loss": -19.818214416503906, "global_step": 46483, "epoch": 560} {"train_loss": -19.686498641967773, "global_step": 46484, "epoch": 560} {"train_loss": -19.868576049804688, "global_step": 46485, "epoch": 560} {"train_loss": -19.867328643798828, "global_step": 46486, "epoch": 560} {"train_loss": -19.529497146606445, "global_step": 46487, "epoch": 560} {"train_loss": -19.795005798339844, "global_step": 46488, "epoch": 560} {"train_loss": -19.49125099182129, "global_step": 46489, "epoch": 560} {"train_loss": -19.72102928161621, "global_step": 46490, "epoch": 560} {"train_loss": -19.911874771118164, "global_step": 46491, "epoch": 560} {"train_loss": -19.59599494934082, "global_step": 46492, "epoch": 560} {"train_loss": -19.91060447692871, "global_step": 46493, "epoch": 560} {"train_loss": -19.93923568725586, "global_step": 46494, "epoch": 560} {"train_loss": -19.539793014526367, "global_step": 46495, "epoch": 560} {"train_loss": -19.560806274414062, "global_step": 46496, "epoch": 560} {"train_loss": -19.83892822265625, "global_step": 46497, "epoch": 560} {"train_loss": -19.449264526367188, "global_step": 46498, "epoch": 560} {"train_loss": -19.74228858947754, "global_step": 46499, "epoch": 560} {"train_loss": -19.82954978942871, "global_step": 46500, "epoch": 560} {"train_loss": -19.5367431640625, "global_step": 46501, "epoch": 560} {"train_loss": -19.7336368560791, "global_step": 46502, "epoch": 560} {"train_loss": -19.62826919555664, "global_step": 46503, "epoch": 560} {"train_loss": -19.61220359802246, "global_step": 46504, "epoch": 560} {"train_loss": -19.635879516601562, "global_step": 46505, "epoch": 560} {"train_loss": -19.697904586791992, "global_step": 46506, "epoch": 560} {"train_loss": -19.900238037109375, "global_step": 46507, "epoch": 560} {"train_loss": -19.649717330932617, "global_step": 46508, "epoch": 560} {"train_loss": -19.9262638092041, "global_step": 46509, "epoch": 560} {"train_loss": -19.5961971282959, "global_step": 46510, "epoch": 560} {"train_loss": -19.62261199951172, "global_step": 46511, "epoch": 560} {"train_loss": -19.935606002807617, "global_step": 46512, "epoch": 560} {"train_loss": -19.775442123413086, "global_step": 46513, "epoch": 560} {"train_loss": -19.642337799072266, "global_step": 46514, "epoch": 560} {"train_loss": -19.9509220123291, "global_step": 46515, "epoch": 560} {"train_loss": -19.5856990814209, "global_step": 46516, "epoch": 560} {"train_loss": -20.026132583618164, "global_step": 46517, "epoch": 560} {"train_loss": -19.863431930541992, "global_step": 46518, "epoch": 560} {"train_loss": -19.55129623413086, "global_step": 46519, "epoch": 560} {"train_loss": -19.442428588867188, "global_step": 46520, "epoch": 560} {"train_loss": -19.813955307006836, "global_step": 46521, "epoch": 560} {"train_loss": -20.02623748779297, "global_step": 46522, "epoch": 560} {"train_loss": -20.25501823425293, "global_step": 46523, "epoch": 560} {"train_loss": -19.728839874267578, "global_step": 46524, "epoch": 560} {"train_loss": -19.674100875854492, "global_step": 46525, "epoch": 560} {"train_loss": -19.562711715698242, "global_step": 46526, "epoch": 560} {"train_loss": -19.554672241210938, "global_step": 46527, "epoch": 560} {"train_loss": -19.45646095275879, "global_step": 46528, "epoch": 560} {"train_loss": -19.852994918823242, "global_step": 46529, "epoch": 560} {"train_loss": -19.782621383666992, "global_step": 46530, "epoch": 560} {"train_loss": -19.47217559814453, "global_step": 46531, "epoch": 560} {"train_loss": -20.180463790893555, "global_step": 46532, "epoch": 560} {"train_loss": -20.14743995666504, "global_step": 46533, "epoch": 560} {"train_loss": -19.813840866088867, "global_step": 46534, "epoch": 560} {"train_loss": -19.897817611694336, "global_step": 46535, "epoch": 560} {"train_loss": -20.227781295776367, "global_step": 46536, "epoch": 560} {"train_loss": -19.606998443603516, "global_step": 46537, "epoch": 560} {"train_loss": -19.746837615966797, "global_step": 46538, "epoch": 560} {"train_loss": -19.34906005859375, "global_step": 46539, "epoch": 560} {"train_loss": -19.94011878967285, "global_step": 46540, "epoch": 560} {"train_loss": -19.829992294311523, "global_step": 46541, "epoch": 560} {"train_loss": -19.942960739135742, "global_step": 46542, "epoch": 560} {"train_loss": -19.6964168548584, "global_step": 46543, "epoch": 560} {"train_loss": -19.94632911682129, "global_step": 46544, "epoch": 560} {"train_loss": -19.849517822265625, "global_step": 46545, "epoch": 560} {"train_loss": -19.742849349975586, "global_step": 46546, "epoch": 560} {"train_loss": -19.862754821777344, "global_step": 46547, "epoch": 560} {"train_loss": -19.92988395690918, "global_step": 46548, "epoch": 560} {"train_loss": -20.091306686401367, "global_step": 46549, "epoch": 560} {"train_loss": -19.641740798950195, "global_step": 46550, "epoch": 560} {"train_loss": -19.999929428100586, "global_step": 46551, "epoch": 560} {"train_loss": -19.4241886138916, "global_step": 46552, "epoch": 560} {"train_loss": -20.087812423706055, "global_step": 46553, "epoch": 560} {"train_loss": -19.522064208984375, "global_step": 46554, "epoch": 560} {"train_loss": -19.579153060913086, "global_step": 46555, "epoch": 560} {"train_loss": -19.67513084411621, "global_step": 46556, "epoch": 560} {"train_loss": -19.782108306884766, "global_step": 46557, "epoch": 560} {"train_loss": -20.075916290283203, "global_step": 46558, "epoch": 560} {"train_loss": -19.91413688659668, "global_step": 46559, "epoch": 560} {"train_loss": -19.95985221862793, "global_step": 46560, "epoch": 560} {"train_loss": -19.4932861328125, "global_step": 46561, "epoch": 560} {"train_loss": -19.776558565806194, "global_step": 46562, "epoch": 560, "val_loss": 5965738.0} {"train_loss": -19.439550399780273, "global_step": 46563, "epoch": 561} {"train_loss": -19.648775100708008, "global_step": 46564, "epoch": 561} {"train_loss": -19.642438888549805, "global_step": 46565, "epoch": 561} {"train_loss": -20.115161895751953, "global_step": 46566, "epoch": 561} {"train_loss": -19.36261558532715, "global_step": 46567, "epoch": 561} {"train_loss": -19.49806785583496, "global_step": 46568, "epoch": 561} {"train_loss": -19.906118392944336, "global_step": 46569, "epoch": 561} {"train_loss": -19.779388427734375, "global_step": 46570, "epoch": 561} {"train_loss": -19.62086296081543, "global_step": 46571, "epoch": 561} {"train_loss": -19.501863479614258, "global_step": 46572, "epoch": 561} {"train_loss": -19.5482177734375, "global_step": 46573, "epoch": 561} {"train_loss": -19.732725143432617, "global_step": 46574, "epoch": 561} {"train_loss": -19.782238006591797, "global_step": 46575, "epoch": 561} {"train_loss": -19.76394271850586, "global_step": 46576, "epoch": 561} {"train_loss": -19.63056755065918, "global_step": 46577, "epoch": 561} {"train_loss": -19.763776779174805, "global_step": 46578, "epoch": 561} {"train_loss": -19.526229858398438, "global_step": 46579, "epoch": 561} {"train_loss": -19.677570343017578, "global_step": 46580, "epoch": 561} {"train_loss": -19.824344635009766, "global_step": 46581, "epoch": 561} {"train_loss": -19.66598892211914, "global_step": 46582, "epoch": 561} {"train_loss": -19.755990982055664, "global_step": 46583, "epoch": 561} {"train_loss": -19.854507446289062, "global_step": 46584, "epoch": 561} {"train_loss": -19.58677864074707, "global_step": 46585, "epoch": 561} {"train_loss": -19.64371109008789, "global_step": 46586, "epoch": 561} {"train_loss": -19.487524032592773, "global_step": 46587, "epoch": 561} {"train_loss": -19.887311935424805, "global_step": 46588, "epoch": 561} {"train_loss": -19.775157928466797, "global_step": 46589, "epoch": 561} {"train_loss": -19.875904083251953, "global_step": 46590, "epoch": 561} {"train_loss": -19.70521354675293, "global_step": 46591, "epoch": 561} {"train_loss": -19.868000030517578, "global_step": 46592, "epoch": 561} {"train_loss": -19.924875259399414, "global_step": 46593, "epoch": 561} {"train_loss": -19.59838104248047, "global_step": 46594, "epoch": 561} {"train_loss": -19.943105697631836, "global_step": 46595, "epoch": 561} {"train_loss": -20.127405166625977, "global_step": 46596, "epoch": 561} {"train_loss": -19.853504180908203, "global_step": 46597, "epoch": 561} {"train_loss": -19.566953659057617, "global_step": 46598, "epoch": 561} {"train_loss": -20.031808853149414, "global_step": 46599, "epoch": 561} {"train_loss": -19.55910301208496, "global_step": 46600, "epoch": 561} {"train_loss": -19.830286026000977, "global_step": 46601, "epoch": 561} {"train_loss": -19.59053611755371, "global_step": 46602, "epoch": 561} {"train_loss": -19.91444969177246, "global_step": 46603, "epoch": 561} {"train_loss": -19.84543228149414, "global_step": 46604, "epoch": 561} {"train_loss": -19.4890193939209, "global_step": 46605, "epoch": 561} {"train_loss": -19.529203414916992, "global_step": 46606, "epoch": 561} {"train_loss": -19.670446395874023, "global_step": 46607, "epoch": 561} {"train_loss": -19.94375991821289, "global_step": 46608, "epoch": 561} {"train_loss": -19.9183406829834, "global_step": 46609, "epoch": 561} {"train_loss": -19.7164363861084, "global_step": 46610, "epoch": 561} {"train_loss": -19.79166030883789, "global_step": 46611, "epoch": 561} {"train_loss": -19.752119064331055, "global_step": 46612, "epoch": 561} {"train_loss": -19.697641372680664, "global_step": 46613, "epoch": 561} {"train_loss": -19.40846824645996, "global_step": 46614, "epoch": 561} {"train_loss": -19.946420669555664, "global_step": 46615, "epoch": 561} {"train_loss": -19.642728805541992, "global_step": 46616, "epoch": 561} {"train_loss": -20.043304443359375, "global_step": 46617, "epoch": 561} {"train_loss": -19.741979598999023, "global_step": 46618, "epoch": 561} {"train_loss": -19.727201461791992, "global_step": 46619, "epoch": 561} {"train_loss": -19.511966705322266, "global_step": 46620, "epoch": 561} {"train_loss": -20.093473434448242, "global_step": 46621, "epoch": 561} {"train_loss": -20.078535079956055, "global_step": 46622, "epoch": 561} {"train_loss": -19.645523071289062, "global_step": 46623, "epoch": 561} {"train_loss": -19.684293746948242, "global_step": 46624, "epoch": 561} {"train_loss": -19.144563674926758, "global_step": 46625, "epoch": 561} {"train_loss": -19.54294204711914, "global_step": 46626, "epoch": 561} {"train_loss": -20.055814743041992, "global_step": 46627, "epoch": 561} {"train_loss": -19.982995986938477, "global_step": 46628, "epoch": 561} {"train_loss": -19.86418914794922, "global_step": 46629, "epoch": 561} {"train_loss": -19.41220474243164, "global_step": 46630, "epoch": 561} {"train_loss": -19.795656204223633, "global_step": 46631, "epoch": 561} {"train_loss": -19.84929847717285, "global_step": 46632, "epoch": 561} {"train_loss": -19.967655181884766, "global_step": 46633, "epoch": 561} {"train_loss": -19.74521827697754, "global_step": 46634, "epoch": 561} {"train_loss": -20.000844955444336, "global_step": 46635, "epoch": 561} {"train_loss": -19.938459396362305, "global_step": 46636, "epoch": 561} {"train_loss": -20.376182556152344, "global_step": 46637, "epoch": 561} {"train_loss": -19.96070098876953, "global_step": 46638, "epoch": 561} {"train_loss": -19.91400718688965, "global_step": 46639, "epoch": 561} {"train_loss": -20.16758155822754, "global_step": 46640, "epoch": 561} {"train_loss": -19.841581344604492, "global_step": 46641, "epoch": 561} {"train_loss": -19.85146141052246, "global_step": 46642, "epoch": 561} {"train_loss": -19.6147518157959, "global_step": 46643, "epoch": 561} {"train_loss": -19.960420608520508, "global_step": 46644, "epoch": 561} {"train_loss": -19.783014665167016, "global_step": 46645, "epoch": 561, "val_loss": 6290506.0} {"train_loss": -19.81130027770996, "global_step": 46646, "epoch": 562} {"train_loss": -19.337553024291992, "global_step": 46647, "epoch": 562} {"train_loss": -19.622529983520508, "global_step": 46648, "epoch": 562} {"train_loss": -19.51328468322754, "global_step": 46649, "epoch": 562} {"train_loss": -19.291091918945312, "global_step": 46650, "epoch": 562} {"train_loss": -19.686185836791992, "global_step": 46651, "epoch": 562} {"train_loss": -19.567781448364258, "global_step": 46652, "epoch": 562} {"train_loss": -19.97136116027832, "global_step": 46653, "epoch": 562} {"train_loss": -19.802631378173828, "global_step": 46654, "epoch": 562} {"train_loss": -20.026304244995117, "global_step": 46655, "epoch": 562} {"train_loss": -19.38513946533203, "global_step": 46656, "epoch": 562} {"train_loss": -19.469221115112305, "global_step": 46657, "epoch": 562} {"train_loss": -19.620168685913086, "global_step": 46658, "epoch": 562} {"train_loss": -19.808897018432617, "global_step": 46659, "epoch": 562} {"train_loss": -19.924640655517578, "global_step": 46660, "epoch": 562} {"train_loss": -19.662490844726562, "global_step": 46661, "epoch": 562} {"train_loss": -19.96257781982422, "global_step": 46662, "epoch": 562} {"train_loss": -19.53626251220703, "global_step": 46663, "epoch": 562} {"train_loss": -20.06796646118164, "global_step": 46664, "epoch": 562} {"train_loss": -19.530292510986328, "global_step": 46665, "epoch": 562} {"train_loss": -19.90646743774414, "global_step": 46666, "epoch": 562} {"train_loss": -19.59151268005371, "global_step": 46667, "epoch": 562} {"train_loss": -19.38728904724121, "global_step": 46668, "epoch": 562} {"train_loss": -20.224151611328125, "global_step": 46669, "epoch": 562} {"train_loss": -19.85910415649414, "global_step": 46670, "epoch": 562} {"train_loss": -19.778711318969727, "global_step": 46671, "epoch": 562} {"train_loss": -19.68661880493164, "global_step": 46672, "epoch": 562} {"train_loss": -19.363046646118164, "global_step": 46673, "epoch": 562} {"train_loss": -19.959009170532227, "global_step": 46674, "epoch": 562} {"train_loss": -19.772003173828125, "global_step": 46675, "epoch": 562} {"train_loss": -20.057266235351562, "global_step": 46676, "epoch": 562} {"train_loss": -19.869659423828125, "global_step": 46677, "epoch": 562} {"train_loss": -19.7703914642334, "global_step": 46678, "epoch": 562} {"train_loss": -19.471466064453125, "global_step": 46679, "epoch": 562} {"train_loss": -19.969907760620117, "global_step": 46680, "epoch": 562} {"train_loss": -19.598644256591797, "global_step": 46681, "epoch": 562} {"train_loss": -19.615100860595703, "global_step": 46682, "epoch": 562} {"train_loss": -19.53937339782715, "global_step": 46683, "epoch": 562} {"train_loss": -19.741729736328125, "global_step": 46684, "epoch": 562} {"train_loss": -19.801944732666016, "global_step": 46685, "epoch": 562} {"train_loss": -19.606901168823242, "global_step": 46686, "epoch": 562} {"train_loss": -19.937671661376953, "global_step": 46687, "epoch": 562} {"train_loss": -19.606369018554688, "global_step": 46688, "epoch": 562} {"train_loss": -19.583599090576172, "global_step": 46689, "epoch": 562} {"train_loss": -19.673242568969727, "global_step": 46690, "epoch": 562} {"train_loss": -19.64685821533203, "global_step": 46691, "epoch": 562} {"train_loss": -19.918964385986328, "global_step": 46692, "epoch": 562} {"train_loss": -19.54897117614746, "global_step": 46693, "epoch": 562} {"train_loss": -19.411893844604492, "global_step": 46694, "epoch": 562} {"train_loss": -19.576614379882812, "global_step": 46695, "epoch": 562} {"train_loss": -19.333927154541016, "global_step": 46696, "epoch": 562} {"train_loss": -19.511831283569336, "global_step": 46697, "epoch": 562} {"train_loss": -19.851179122924805, "global_step": 46698, "epoch": 562} {"train_loss": -20.093963623046875, "global_step": 46699, "epoch": 562} {"train_loss": -19.732646942138672, "global_step": 46700, "epoch": 562} {"train_loss": -19.543745040893555, "global_step": 46701, "epoch": 562} {"train_loss": -19.740842819213867, "global_step": 46702, "epoch": 562} {"train_loss": -19.423381805419922, "global_step": 46703, "epoch": 562} {"train_loss": -20.116979598999023, "global_step": 46704, "epoch": 562} {"train_loss": -19.755849838256836, "global_step": 46705, "epoch": 562} {"train_loss": -19.709850311279297, "global_step": 46706, "epoch": 562} {"train_loss": -19.546865463256836, "global_step": 46707, "epoch": 562} {"train_loss": -19.43365478515625, "global_step": 46708, "epoch": 562} {"train_loss": -19.463722229003906, "global_step": 46709, "epoch": 562} {"train_loss": -19.51209259033203, "global_step": 46710, "epoch": 562} {"train_loss": -19.838117599487305, "global_step": 46711, "epoch": 562} {"train_loss": -19.75511932373047, "global_step": 46712, "epoch": 562} {"train_loss": -19.92824935913086, "global_step": 46713, "epoch": 562} {"train_loss": -19.67193603515625, "global_step": 46714, "epoch": 562} {"train_loss": -19.554807662963867, "global_step": 46715, "epoch": 562} {"train_loss": -19.847333908081055, "global_step": 46716, "epoch": 562} {"train_loss": -19.68428611755371, "global_step": 46717, "epoch": 562} {"train_loss": -19.91568946838379, "global_step": 46718, "epoch": 562} {"train_loss": -19.743492126464844, "global_step": 46719, "epoch": 562} {"train_loss": -19.57600975036621, "global_step": 46720, "epoch": 562} {"train_loss": -19.692182540893555, "global_step": 46721, "epoch": 562} {"train_loss": -19.441661834716797, "global_step": 46722, "epoch": 562} {"train_loss": -19.749732971191406, "global_step": 46723, "epoch": 562} {"train_loss": -19.780256271362305, "global_step": 46724, "epoch": 562} {"train_loss": -19.640727996826172, "global_step": 46725, "epoch": 562} {"train_loss": -19.745311737060547, "global_step": 46726, "epoch": 562} {"train_loss": -19.650150299072266, "global_step": 46727, "epoch": 562} {"train_loss": -19.680477578955962, "global_step": 46728, "epoch": 562, "val_loss": 6223566.0} {"train_loss": -19.71671485900879, "global_step": 46729, "epoch": 563} {"train_loss": -19.47013282775879, "global_step": 46730, "epoch": 563} {"train_loss": -19.657224655151367, "global_step": 46731, "epoch": 563} {"train_loss": -19.55975914001465, "global_step": 46732, "epoch": 563} {"train_loss": -19.835865020751953, "global_step": 46733, "epoch": 563} {"train_loss": -19.50996971130371, "global_step": 46734, "epoch": 563} {"train_loss": -19.808055877685547, "global_step": 46735, "epoch": 563} {"train_loss": -19.723642349243164, "global_step": 46736, "epoch": 563} {"train_loss": -19.642642974853516, "global_step": 46737, "epoch": 563} {"train_loss": -19.203649520874023, "global_step": 46738, "epoch": 563} {"train_loss": -19.52906608581543, "global_step": 46739, "epoch": 563} {"train_loss": -19.517669677734375, "global_step": 46740, "epoch": 563} {"train_loss": -19.748855590820312, "global_step": 46741, "epoch": 563} {"train_loss": -19.590238571166992, "global_step": 46742, "epoch": 563} {"train_loss": -19.47010040283203, "global_step": 46743, "epoch": 563} {"train_loss": -19.444252014160156, "global_step": 46744, "epoch": 563} {"train_loss": -19.60677146911621, "global_step": 46745, "epoch": 563} {"train_loss": -19.473491668701172, "global_step": 46746, "epoch": 563} {"train_loss": -19.89163589477539, "global_step": 46747, "epoch": 563} {"train_loss": -20.285470962524414, "global_step": 46748, "epoch": 563} {"train_loss": -19.962902069091797, "global_step": 46749, "epoch": 563} {"train_loss": -19.7501220703125, "global_step": 46750, "epoch": 563} {"train_loss": -19.533313751220703, "global_step": 46751, "epoch": 563} {"train_loss": -19.889909744262695, "global_step": 46752, "epoch": 563} {"train_loss": -19.747724533081055, "global_step": 46753, "epoch": 563} {"train_loss": -19.474430084228516, "global_step": 46754, "epoch": 563} {"train_loss": -19.776750564575195, "global_step": 46755, "epoch": 563} {"train_loss": -19.32108497619629, "global_step": 46756, "epoch": 563} {"train_loss": -19.908777236938477, "global_step": 46757, "epoch": 563} {"train_loss": -19.619291305541992, "global_step": 46758, "epoch": 563} {"train_loss": -19.116647720336914, "global_step": 46759, "epoch": 563} {"train_loss": -20.00507926940918, "global_step": 46760, "epoch": 563} {"train_loss": -19.83107566833496, "global_step": 46761, "epoch": 563} {"train_loss": -19.915420532226562, "global_step": 46762, "epoch": 563} {"train_loss": -19.74470329284668, "global_step": 46763, "epoch": 563} {"train_loss": -19.906492233276367, "global_step": 46764, "epoch": 563} {"train_loss": -20.114206314086914, "global_step": 46765, "epoch": 563} {"train_loss": -20.160137176513672, "global_step": 46766, "epoch": 563} {"train_loss": -19.44916534423828, "global_step": 46767, "epoch": 563} {"train_loss": -19.752126693725586, "global_step": 46768, "epoch": 563} {"train_loss": -19.96047019958496, "global_step": 46769, "epoch": 563} {"train_loss": -20.070432662963867, "global_step": 46770, "epoch": 563} {"train_loss": -19.93593406677246, "global_step": 46771, "epoch": 563} {"train_loss": -19.85890769958496, "global_step": 46772, "epoch": 563} {"train_loss": -19.74934196472168, "global_step": 46773, "epoch": 563} {"train_loss": -19.887683868408203, "global_step": 46774, "epoch": 563} {"train_loss": -20.132827758789062, "global_step": 46775, "epoch": 563} {"train_loss": -19.439285278320312, "global_step": 46776, "epoch": 563} {"train_loss": -19.780059814453125, "global_step": 46777, "epoch": 563} {"train_loss": -19.117990493774414, "global_step": 46778, "epoch": 563} {"train_loss": -19.527536392211914, "global_step": 46779, "epoch": 563} {"train_loss": -19.53482437133789, "global_step": 46780, "epoch": 563} {"train_loss": -20.06682777404785, "global_step": 46781, "epoch": 563} {"train_loss": -19.912555694580078, "global_step": 46782, "epoch": 563} {"train_loss": -19.715431213378906, "global_step": 46783, "epoch": 563} {"train_loss": -19.6135311126709, "global_step": 46784, "epoch": 563} {"train_loss": -19.499317169189453, "global_step": 46785, "epoch": 563} {"train_loss": -19.78110122680664, "global_step": 46786, "epoch": 563} {"train_loss": -19.739566802978516, "global_step": 46787, "epoch": 563} {"train_loss": -19.806690216064453, "global_step": 46788, "epoch": 563} {"train_loss": -19.729419708251953, "global_step": 46789, "epoch": 563} {"train_loss": -20.044113159179688, "global_step": 46790, "epoch": 563} {"train_loss": -19.967905044555664, "global_step": 46791, "epoch": 563} {"train_loss": -19.962491989135742, "global_step": 46792, "epoch": 563} {"train_loss": -19.94540786743164, "global_step": 46793, "epoch": 563} {"train_loss": -19.95828628540039, "global_step": 46794, "epoch": 563} {"train_loss": -20.165376663208008, "global_step": 46795, "epoch": 563} {"train_loss": -19.74830436706543, "global_step": 46796, "epoch": 563} {"train_loss": -19.894882202148438, "global_step": 46797, "epoch": 563} {"train_loss": -19.64320945739746, "global_step": 46798, "epoch": 563} {"train_loss": -19.84017562866211, "global_step": 46799, "epoch": 563} {"train_loss": -19.612714767456055, "global_step": 46800, "epoch": 563} {"train_loss": -19.80862045288086, "global_step": 46801, "epoch": 563} {"train_loss": -19.79925537109375, "global_step": 46802, "epoch": 563} {"train_loss": -19.766462326049805, "global_step": 46803, "epoch": 563} {"train_loss": -19.9074764251709, "global_step": 46804, "epoch": 563} {"train_loss": -19.802839279174805, "global_step": 46805, "epoch": 563} {"train_loss": -19.95267677307129, "global_step": 46806, "epoch": 563} {"train_loss": -19.74078941345215, "global_step": 46807, "epoch": 563} {"train_loss": -19.586618423461914, "global_step": 46808, "epoch": 563} {"train_loss": -19.837385177612305, "global_step": 46809, "epoch": 563} {"train_loss": -20.125547409057617, "global_step": 46810, "epoch": 563} {"train_loss": -19.755098825477692, "global_step": 46811, "epoch": 563, "val_loss": 5973997.5} {"train_loss": -19.44730567932129, "global_step": 46812, "epoch": 564} {"train_loss": -19.717681884765625, "global_step": 46813, "epoch": 564} {"train_loss": -19.84016990661621, "global_step": 46814, "epoch": 564} {"train_loss": -19.59352684020996, "global_step": 46815, "epoch": 564} {"train_loss": -19.384607315063477, "global_step": 46816, "epoch": 564} {"train_loss": -19.746347427368164, "global_step": 46817, "epoch": 564} {"train_loss": -20.11474609375, "global_step": 46818, "epoch": 564} {"train_loss": -19.927091598510742, "global_step": 46819, "epoch": 564} {"train_loss": -19.72548484802246, "global_step": 46820, "epoch": 564} {"train_loss": -19.888113021850586, "global_step": 46821, "epoch": 564} {"train_loss": -19.635549545288086, "global_step": 46822, "epoch": 564} {"train_loss": -19.5587215423584, "global_step": 46823, "epoch": 564} {"train_loss": -19.220840454101562, "global_step": 46824, "epoch": 564} {"train_loss": -19.96428108215332, "global_step": 46825, "epoch": 564} {"train_loss": -19.957807540893555, "global_step": 46826, "epoch": 564} {"train_loss": -19.665273666381836, "global_step": 46827, "epoch": 564} {"train_loss": -20.020051956176758, "global_step": 46828, "epoch": 564} {"train_loss": -19.746463775634766, "global_step": 46829, "epoch": 564} {"train_loss": -19.641653060913086, "global_step": 46830, "epoch": 564} {"train_loss": -19.745502471923828, "global_step": 46831, "epoch": 564} {"train_loss": -19.768129348754883, "global_step": 46832, "epoch": 564} {"train_loss": -19.88238525390625, "global_step": 46833, "epoch": 564} {"train_loss": -19.709463119506836, "global_step": 46834, "epoch": 564} {"train_loss": -19.754743576049805, "global_step": 46835, "epoch": 564} {"train_loss": -19.926498413085938, "global_step": 46836, "epoch": 564} {"train_loss": -19.667875289916992, "global_step": 46837, "epoch": 564} {"train_loss": -20.233728408813477, "global_step": 46838, "epoch": 564} {"train_loss": -19.868011474609375, "global_step": 46839, "epoch": 564} {"train_loss": -19.78411293029785, "global_step": 46840, "epoch": 564} {"train_loss": -19.645078659057617, "global_step": 46841, "epoch": 564} {"train_loss": -20.157838821411133, "global_step": 46842, "epoch": 564} {"train_loss": -19.876224517822266, "global_step": 46843, "epoch": 564} {"train_loss": -19.68263053894043, "global_step": 46844, "epoch": 564} {"train_loss": -19.781888961791992, "global_step": 46845, "epoch": 564} {"train_loss": -19.899351119995117, "global_step": 46846, "epoch": 564} {"train_loss": -19.793331146240234, "global_step": 46847, "epoch": 564} {"train_loss": -19.7168025970459, "global_step": 46848, "epoch": 564} {"train_loss": -19.890445709228516, "global_step": 46849, "epoch": 564} {"train_loss": -20.031396865844727, "global_step": 46850, "epoch": 564} {"train_loss": -19.736948013305664, "global_step": 46851, "epoch": 564} {"train_loss": -19.596012115478516, "global_step": 46852, "epoch": 564} {"train_loss": -19.850126266479492, "global_step": 46853, "epoch": 564} {"train_loss": -19.470273971557617, "global_step": 46854, "epoch": 564} {"train_loss": -19.760852813720703, "global_step": 46855, "epoch": 564} {"train_loss": -19.558475494384766, "global_step": 46856, "epoch": 564} {"train_loss": -19.80816078186035, "global_step": 46857, "epoch": 564} {"train_loss": -19.444028854370117, "global_step": 46858, "epoch": 564} {"train_loss": -19.385950088500977, "global_step": 46859, "epoch": 564} {"train_loss": -19.686634063720703, "global_step": 46860, "epoch": 564} {"train_loss": -19.970914840698242, "global_step": 46861, "epoch": 564} {"train_loss": -19.750762939453125, "global_step": 46862, "epoch": 564} {"train_loss": -19.400659561157227, "global_step": 46863, "epoch": 564} {"train_loss": -19.89510154724121, "global_step": 46864, "epoch": 564} {"train_loss": -19.86612319946289, "global_step": 46865, "epoch": 564} {"train_loss": -19.553436279296875, "global_step": 46866, "epoch": 564} {"train_loss": -19.96278953552246, "global_step": 46867, "epoch": 564} {"train_loss": -19.997112274169922, "global_step": 46868, "epoch": 564} {"train_loss": -19.737871170043945, "global_step": 46869, "epoch": 564} {"train_loss": -19.973861694335938, "global_step": 46870, "epoch": 564} {"train_loss": -19.87869644165039, "global_step": 46871, "epoch": 564} {"train_loss": -20.07110023498535, "global_step": 46872, "epoch": 564} {"train_loss": -19.631744384765625, "global_step": 46873, "epoch": 564} {"train_loss": -20.126684188842773, "global_step": 46874, "epoch": 564} {"train_loss": -19.537147521972656, "global_step": 46875, "epoch": 564} {"train_loss": -19.83937644958496, "global_step": 46876, "epoch": 564} {"train_loss": -20.222116470336914, "global_step": 46877, "epoch": 564} {"train_loss": -20.14229393005371, "global_step": 46878, "epoch": 564} {"train_loss": -19.82379722595215, "global_step": 46879, "epoch": 564} {"train_loss": -19.784597396850586, "global_step": 46880, "epoch": 564} {"train_loss": -19.72197723388672, "global_step": 46881, "epoch": 564} {"train_loss": -19.776622772216797, "global_step": 46882, "epoch": 564} {"train_loss": -19.65056037902832, "global_step": 46883, "epoch": 564} {"train_loss": -19.748727798461914, "global_step": 46884, "epoch": 564} {"train_loss": -19.500009536743164, "global_step": 46885, "epoch": 564} {"train_loss": -19.598388671875, "global_step": 46886, "epoch": 564} {"train_loss": -19.655492782592773, "global_step": 46887, "epoch": 564} {"train_loss": -19.650293350219727, "global_step": 46888, "epoch": 564} {"train_loss": -19.712478637695312, "global_step": 46889, "epoch": 564} {"train_loss": -19.606952667236328, "global_step": 46890, "epoch": 564} {"train_loss": -19.7924747467041, "global_step": 46891, "epoch": 564} {"train_loss": -19.695035934448242, "global_step": 46892, "epoch": 564} {"train_loss": -19.981618881225586, "global_step": 46893, "epoch": 564} {"train_loss": -19.77549734460302, "global_step": 46894, "epoch": 564, "val_loss": 5997337.0} {"train_loss": -19.807973861694336, "global_step": 46895, "epoch": 565} {"train_loss": -19.81707191467285, "global_step": 46896, "epoch": 565} {"train_loss": -19.745954513549805, "global_step": 46897, "epoch": 565} {"train_loss": -19.42315673828125, "global_step": 46898, "epoch": 565} {"train_loss": -19.996789932250977, "global_step": 46899, "epoch": 565} {"train_loss": -19.66272735595703, "global_step": 46900, "epoch": 565} {"train_loss": -19.66096305847168, "global_step": 46901, "epoch": 565} {"train_loss": -19.494815826416016, "global_step": 46902, "epoch": 565} {"train_loss": -19.4533634185791, "global_step": 46903, "epoch": 565} {"train_loss": -19.393869400024414, "global_step": 46904, "epoch": 565} {"train_loss": -19.963134765625, "global_step": 46905, "epoch": 565} {"train_loss": -19.699514389038086, "global_step": 46906, "epoch": 565} {"train_loss": -19.627147674560547, "global_step": 46907, "epoch": 565} {"train_loss": -19.829740524291992, "global_step": 46908, "epoch": 565} {"train_loss": -19.48915672302246, "global_step": 46909, "epoch": 565} {"train_loss": -19.78474235534668, "global_step": 46910, "epoch": 565} {"train_loss": -19.47908592224121, "global_step": 46911, "epoch": 565} {"train_loss": -19.371063232421875, "global_step": 46912, "epoch": 565} {"train_loss": -20.060171127319336, "global_step": 46913, "epoch": 565} {"train_loss": -19.805097579956055, "global_step": 46914, "epoch": 565} {"train_loss": -19.633285522460938, "global_step": 46915, "epoch": 565} {"train_loss": -19.76862335205078, "global_step": 46916, "epoch": 565} {"train_loss": -19.46851921081543, "global_step": 46917, "epoch": 565} {"train_loss": -19.58603286743164, "global_step": 46918, "epoch": 565} {"train_loss": -19.944082260131836, "global_step": 46919, "epoch": 565} {"train_loss": -19.852378845214844, "global_step": 46920, "epoch": 565} {"train_loss": -20.16249656677246, "global_step": 46921, "epoch": 565} {"train_loss": -19.810028076171875, "global_step": 46922, "epoch": 565} {"train_loss": -19.376802444458008, "global_step": 46923, "epoch": 565} {"train_loss": -19.910062789916992, "global_step": 46924, "epoch": 565} {"train_loss": -20.03717613220215, "global_step": 46925, "epoch": 565} {"train_loss": -19.772701263427734, "global_step": 46926, "epoch": 565} {"train_loss": -19.94371223449707, "global_step": 46927, "epoch": 565} {"train_loss": -19.57375717163086, "global_step": 46928, "epoch": 565} {"train_loss": -19.80579948425293, "global_step": 46929, "epoch": 565} {"train_loss": -20.00459861755371, "global_step": 46930, "epoch": 565} {"train_loss": -20.01604652404785, "global_step": 46931, "epoch": 565} {"train_loss": -19.98074722290039, "global_step": 46932, "epoch": 565} {"train_loss": -19.595279693603516, "global_step": 46933, "epoch": 565} {"train_loss": -19.876657485961914, "global_step": 46934, "epoch": 565} {"train_loss": -19.853092193603516, "global_step": 46935, "epoch": 565} {"train_loss": -19.66363525390625, "global_step": 46936, "epoch": 565} {"train_loss": -19.656126022338867, "global_step": 46937, "epoch": 565} {"train_loss": -19.57094383239746, "global_step": 46938, "epoch": 565} {"train_loss": -19.975021362304688, "global_step": 46939, "epoch": 565} {"train_loss": -19.95747947692871, "global_step": 46940, "epoch": 565} {"train_loss": -19.383047103881836, "global_step": 46941, "epoch": 565} {"train_loss": -19.282529830932617, "global_step": 46942, "epoch": 565} {"train_loss": -19.887845993041992, "global_step": 46943, "epoch": 565} {"train_loss": -20.051456451416016, "global_step": 46944, "epoch": 565} {"train_loss": -19.91102409362793, "global_step": 46945, "epoch": 565} {"train_loss": -20.12523078918457, "global_step": 46946, "epoch": 565} {"train_loss": -20.03786277770996, "global_step": 46947, "epoch": 565} {"train_loss": -19.837976455688477, "global_step": 46948, "epoch": 565} {"train_loss": -19.87502670288086, "global_step": 46949, "epoch": 565} {"train_loss": -19.854354858398438, "global_step": 46950, "epoch": 565} {"train_loss": -19.820140838623047, "global_step": 46951, "epoch": 565} {"train_loss": -19.801624298095703, "global_step": 46952, "epoch": 565} {"train_loss": -19.72199058532715, "global_step": 46953, "epoch": 565} {"train_loss": -20.096689224243164, "global_step": 46954, "epoch": 565} {"train_loss": -19.934450149536133, "global_step": 46955, "epoch": 565} {"train_loss": -19.653141021728516, "global_step": 46956, "epoch": 565} {"train_loss": -19.92104721069336, "global_step": 46957, "epoch": 565} {"train_loss": -19.685028076171875, "global_step": 46958, "epoch": 565} {"train_loss": -19.64173698425293, "global_step": 46959, "epoch": 565} {"train_loss": -19.765941619873047, "global_step": 46960, "epoch": 565} {"train_loss": -19.620529174804688, "global_step": 46961, "epoch": 565} {"train_loss": -20.25165367126465, "global_step": 46962, "epoch": 565} {"train_loss": -19.456954956054688, "global_step": 46963, "epoch": 565} {"train_loss": -20.230592727661133, "global_step": 46964, "epoch": 565} {"train_loss": -19.853595733642578, "global_step": 46965, "epoch": 565} {"train_loss": -20.015363693237305, "global_step": 46966, "epoch": 565} {"train_loss": -19.503780364990234, "global_step": 46967, "epoch": 565} {"train_loss": -19.785184860229492, "global_step": 46968, "epoch": 565} {"train_loss": -19.68784523010254, "global_step": 46969, "epoch": 565} {"train_loss": -19.741594314575195, "global_step": 46970, "epoch": 565} {"train_loss": -20.06570053100586, "global_step": 46971, "epoch": 565} {"train_loss": -19.99264144897461, "global_step": 46972, "epoch": 565} {"train_loss": -19.87251853942871, "global_step": 46973, "epoch": 565} {"train_loss": -19.752965927124023, "global_step": 46974, "epoch": 565} {"train_loss": -19.474721908569336, "global_step": 46975, "epoch": 565} {"train_loss": -20.1264591217041, "global_step": 46976, "epoch": 565} {"train_loss": -19.77574261125312, "global_step": 46977, "epoch": 565, "val_loss": 5914288.5} {"train_loss": -18.96278953552246, "global_step": 46978, "epoch": 566} {"train_loss": -19.64863395690918, "global_step": 46979, "epoch": 566} {"train_loss": -19.559743881225586, "global_step": 46980, "epoch": 566} {"train_loss": -19.72523307800293, "global_step": 46981, "epoch": 566} {"train_loss": -19.188190460205078, "global_step": 46982, "epoch": 566} {"train_loss": -19.25018882751465, "global_step": 46983, "epoch": 566} {"train_loss": -19.58624267578125, "global_step": 46984, "epoch": 566} {"train_loss": -19.467077255249023, "global_step": 46985, "epoch": 566} {"train_loss": -19.419401168823242, "global_step": 46986, "epoch": 566} {"train_loss": -19.535324096679688, "global_step": 46987, "epoch": 566} {"train_loss": -19.196428298950195, "global_step": 46988, "epoch": 566} {"train_loss": -19.363920211791992, "global_step": 46989, "epoch": 566} {"train_loss": -19.81633949279785, "global_step": 46990, "epoch": 566} {"train_loss": -19.690631866455078, "global_step": 46991, "epoch": 566} {"train_loss": -19.42693328857422, "global_step": 46992, "epoch": 566} {"train_loss": -19.594003677368164, "global_step": 46993, "epoch": 566} {"train_loss": -19.6501407623291, "global_step": 46994, "epoch": 566} {"train_loss": -19.98650550842285, "global_step": 46995, "epoch": 566} {"train_loss": -19.7230167388916, "global_step": 46996, "epoch": 566} {"train_loss": -19.39776611328125, "global_step": 46997, "epoch": 566} {"train_loss": -19.672542572021484, "global_step": 46998, "epoch": 566} {"train_loss": -19.61933708190918, "global_step": 46999, "epoch": 566} {"train_loss": -19.597463607788086, "global_step": 47000, "epoch": 566} {"train_loss": -19.850818634033203, "global_step": 47001, "epoch": 566} {"train_loss": -19.491445541381836, "global_step": 47002, "epoch": 566} {"train_loss": -19.74940299987793, "global_step": 47003, "epoch": 566} {"train_loss": -19.750816345214844, "global_step": 47004, "epoch": 566} {"train_loss": -19.653295516967773, "global_step": 47005, "epoch": 566} {"train_loss": -20.132856369018555, "global_step": 47006, "epoch": 566} {"train_loss": -19.67000961303711, "global_step": 47007, "epoch": 566} {"train_loss": -19.90021324157715, "global_step": 47008, "epoch": 566} {"train_loss": -19.90066146850586, "global_step": 47009, "epoch": 566} {"train_loss": -19.662696838378906, "global_step": 47010, "epoch": 566} {"train_loss": -20.079837799072266, "global_step": 47011, "epoch": 566} {"train_loss": -19.769819259643555, "global_step": 47012, "epoch": 566} {"train_loss": -19.699167251586914, "global_step": 47013, "epoch": 566} {"train_loss": -19.639692306518555, "global_step": 47014, "epoch": 566} {"train_loss": -20.061124801635742, "global_step": 47015, "epoch": 566} {"train_loss": -19.508508682250977, "global_step": 47016, "epoch": 566} {"train_loss": -19.733427047729492, "global_step": 47017, "epoch": 566} {"train_loss": -19.586332321166992, "global_step": 47018, "epoch": 566} {"train_loss": -20.013029098510742, "global_step": 47019, "epoch": 566} {"train_loss": -19.928129196166992, "global_step": 47020, "epoch": 566} {"train_loss": -19.584148406982422, "global_step": 47021, "epoch": 566} {"train_loss": -20.035776138305664, "global_step": 47022, "epoch": 566} {"train_loss": -20.281396865844727, "global_step": 47023, "epoch": 566} {"train_loss": -19.95101547241211, "global_step": 47024, "epoch": 566} {"train_loss": -19.608173370361328, "global_step": 47025, "epoch": 566} {"train_loss": -19.917905807495117, "global_step": 47026, "epoch": 566} {"train_loss": -19.9405517578125, "global_step": 47027, "epoch": 566} {"train_loss": -19.527114868164062, "global_step": 47028, "epoch": 566} {"train_loss": -19.526166915893555, "global_step": 47029, "epoch": 566} {"train_loss": -19.924209594726562, "global_step": 47030, "epoch": 566} {"train_loss": -19.881990432739258, "global_step": 47031, "epoch": 566} {"train_loss": -19.8343505859375, "global_step": 47032, "epoch": 566} {"train_loss": -19.89999008178711, "global_step": 47033, "epoch": 566} {"train_loss": -19.412399291992188, "global_step": 47034, "epoch": 566} {"train_loss": -19.488908767700195, "global_step": 47035, "epoch": 566} {"train_loss": -19.911561965942383, "global_step": 47036, "epoch": 566} {"train_loss": -19.506431579589844, "global_step": 47037, "epoch": 566} {"train_loss": -19.530677795410156, "global_step": 47038, "epoch": 566} {"train_loss": -20.061420440673828, "global_step": 47039, "epoch": 566} {"train_loss": -20.151472091674805, "global_step": 47040, "epoch": 566} {"train_loss": -19.877355575561523, "global_step": 47041, "epoch": 566} {"train_loss": -19.88665199279785, "global_step": 47042, "epoch": 566} {"train_loss": -19.8798885345459, "global_step": 47043, "epoch": 566} {"train_loss": -19.609542846679688, "global_step": 47044, "epoch": 566} {"train_loss": -20.2016658782959, "global_step": 47045, "epoch": 566} {"train_loss": -19.58265495300293, "global_step": 47046, "epoch": 566} {"train_loss": -19.836828231811523, "global_step": 47047, "epoch": 566} {"train_loss": -19.78629493713379, "global_step": 47048, "epoch": 566} {"train_loss": -19.410409927368164, "global_step": 47049, "epoch": 566} {"train_loss": -19.84000015258789, "global_step": 47050, "epoch": 566} {"train_loss": -19.75489616394043, "global_step": 47051, "epoch": 566} {"train_loss": -20.042627334594727, "global_step": 47052, "epoch": 566} {"train_loss": -19.946170806884766, "global_step": 47053, "epoch": 566} {"train_loss": -20.00962257385254, "global_step": 47054, "epoch": 566} {"train_loss": -19.70203399658203, "global_step": 47055, "epoch": 566} {"train_loss": -19.521154403686523, "global_step": 47056, "epoch": 566} {"train_loss": -19.47529411315918, "global_step": 47057, "epoch": 566} {"train_loss": -20.033117294311523, "global_step": 47058, "epoch": 566} {"train_loss": -19.825315475463867, "global_step": 47059, "epoch": 566} {"train_loss": -19.71617528616664, "global_step": 47060, "epoch": 566, "val_loss": 6034011.0} {"train_loss": -19.748210906982422, "global_step": 47061, "epoch": 567} {"train_loss": -19.31153678894043, "global_step": 47062, "epoch": 567} {"train_loss": -19.77487564086914, "global_step": 47063, "epoch": 567} {"train_loss": -19.31300926208496, "global_step": 47064, "epoch": 567} {"train_loss": -19.990901947021484, "global_step": 47065, "epoch": 567} {"train_loss": -19.563867568969727, "global_step": 47066, "epoch": 567} {"train_loss": -19.962310791015625, "global_step": 47067, "epoch": 567} {"train_loss": -19.2645206451416, "global_step": 47068, "epoch": 567} {"train_loss": -19.62415313720703, "global_step": 47069, "epoch": 567} {"train_loss": -19.365276336669922, "global_step": 47070, "epoch": 567} {"train_loss": -19.69025230407715, "global_step": 47071, "epoch": 567} {"train_loss": -19.515792846679688, "global_step": 47072, "epoch": 567} {"train_loss": -19.761083602905273, "global_step": 47073, "epoch": 567} {"train_loss": -19.596431732177734, "global_step": 47074, "epoch": 567} {"train_loss": -19.39124870300293, "global_step": 47075, "epoch": 567} {"train_loss": -19.5830020904541, "global_step": 47076, "epoch": 567} {"train_loss": -19.987218856811523, "global_step": 47077, "epoch": 567} {"train_loss": -19.779592514038086, "global_step": 47078, "epoch": 567} {"train_loss": -19.8442440032959, "global_step": 47079, "epoch": 567} {"train_loss": -19.737123489379883, "global_step": 47080, "epoch": 567} {"train_loss": -19.648006439208984, "global_step": 47081, "epoch": 567} {"train_loss": -19.830005645751953, "global_step": 47082, "epoch": 567} {"train_loss": -19.562152862548828, "global_step": 47083, "epoch": 567} {"train_loss": -19.700773239135742, "global_step": 47084, "epoch": 567} {"train_loss": -20.06633949279785, "global_step": 47085, "epoch": 567} {"train_loss": -20.05625343322754, "global_step": 47086, "epoch": 567} {"train_loss": -19.866958618164062, "global_step": 47087, "epoch": 567} {"train_loss": -19.9183406829834, "global_step": 47088, "epoch": 567} {"train_loss": -20.24391746520996, "global_step": 47089, "epoch": 567} {"train_loss": -19.83308219909668, "global_step": 47090, "epoch": 567} {"train_loss": -19.967620849609375, "global_step": 47091, "epoch": 567} {"train_loss": -19.810800552368164, "global_step": 47092, "epoch": 567} {"train_loss": -19.73284339904785, "global_step": 47093, "epoch": 567} {"train_loss": -19.833541870117188, "global_step": 47094, "epoch": 567} {"train_loss": -19.428672790527344, "global_step": 47095, "epoch": 567} {"train_loss": -19.9190616607666, "global_step": 47096, "epoch": 567} {"train_loss": -19.756803512573242, "global_step": 47097, "epoch": 567} {"train_loss": -19.867185592651367, "global_step": 47098, "epoch": 567} {"train_loss": -19.789623260498047, "global_step": 47099, "epoch": 567} {"train_loss": -19.522144317626953, "global_step": 47100, "epoch": 567} {"train_loss": -19.749835968017578, "global_step": 47101, "epoch": 567} {"train_loss": -19.213809967041016, "global_step": 47102, "epoch": 567} {"train_loss": -19.6052188873291, "global_step": 47103, "epoch": 567} {"train_loss": -19.61065673828125, "global_step": 47104, "epoch": 567} {"train_loss": -19.587493896484375, "global_step": 47105, "epoch": 567} {"train_loss": -20.275732040405273, "global_step": 47106, "epoch": 567} {"train_loss": -19.644628524780273, "global_step": 47107, "epoch": 567} {"train_loss": -19.81146240234375, "global_step": 47108, "epoch": 567} {"train_loss": -19.63135528564453, "global_step": 47109, "epoch": 567} {"train_loss": -20.33402442932129, "global_step": 47110, "epoch": 567} {"train_loss": -19.845136642456055, "global_step": 47111, "epoch": 567} {"train_loss": -19.727331161499023, "global_step": 47112, "epoch": 567} {"train_loss": -19.97187042236328, "global_step": 47113, "epoch": 567} {"train_loss": -20.12006187438965, "global_step": 47114, "epoch": 567} {"train_loss": -19.657150268554688, "global_step": 47115, "epoch": 567} {"train_loss": -19.40948486328125, "global_step": 47116, "epoch": 567} {"train_loss": -20.027196884155273, "global_step": 47117, "epoch": 567} {"train_loss": -19.41996955871582, "global_step": 47118, "epoch": 567} {"train_loss": -19.495046615600586, "global_step": 47119, "epoch": 567} {"train_loss": -19.662092208862305, "global_step": 47120, "epoch": 567} {"train_loss": -19.522287368774414, "global_step": 47121, "epoch": 567} {"train_loss": -19.996862411499023, "global_step": 47122, "epoch": 567} {"train_loss": -20.0642147064209, "global_step": 47123, "epoch": 567} {"train_loss": -19.757600784301758, "global_step": 47124, "epoch": 567} {"train_loss": -19.961896896362305, "global_step": 47125, "epoch": 567} {"train_loss": -19.730337142944336, "global_step": 47126, "epoch": 567} {"train_loss": -19.70478630065918, "global_step": 47127, "epoch": 567} {"train_loss": -19.93446922302246, "global_step": 47128, "epoch": 567} {"train_loss": -19.51755714416504, "global_step": 47129, "epoch": 567} {"train_loss": -19.93001937866211, "global_step": 47130, "epoch": 567} {"train_loss": -20.004899978637695, "global_step": 47131, "epoch": 567} {"train_loss": -20.104063034057617, "global_step": 47132, "epoch": 567} {"train_loss": -20.135597229003906, "global_step": 47133, "epoch": 567} {"train_loss": -19.838165283203125, "global_step": 47134, "epoch": 567} {"train_loss": -19.977476119995117, "global_step": 47135, "epoch": 567} {"train_loss": -20.08473777770996, "global_step": 47136, "epoch": 567} {"train_loss": -19.706960678100586, "global_step": 47137, "epoch": 567} {"train_loss": -19.732601165771484, "global_step": 47138, "epoch": 567} {"train_loss": -19.798934936523438, "global_step": 47139, "epoch": 567} {"train_loss": -19.594465255737305, "global_step": 47140, "epoch": 567} {"train_loss": -19.784719467163086, "global_step": 47141, "epoch": 567} {"train_loss": -19.638076782226562, "global_step": 47142, "epoch": 567} {"train_loss": -19.758724327547004, "global_step": 47143, "epoch": 567, "val_loss": 5861604.0} {"train_loss": -19.00594139099121, "global_step": 47144, "epoch": 568} {"train_loss": -19.1356201171875, "global_step": 47145, "epoch": 568} {"train_loss": -19.233495712280273, "global_step": 47146, "epoch": 568} {"train_loss": -19.400480270385742, "global_step": 47147, "epoch": 568} {"train_loss": -19.840763092041016, "global_step": 47148, "epoch": 568} {"train_loss": -19.422914505004883, "global_step": 47149, "epoch": 568} {"train_loss": -19.455419540405273, "global_step": 47150, "epoch": 568} {"train_loss": -19.932899475097656, "global_step": 47151, "epoch": 568} {"train_loss": -19.625402450561523, "global_step": 47152, "epoch": 568} {"train_loss": -19.598237991333008, "global_step": 47153, "epoch": 568} {"train_loss": -19.694194793701172, "global_step": 47154, "epoch": 568} {"train_loss": -19.512935638427734, "global_step": 47155, "epoch": 568} {"train_loss": -19.3770751953125, "global_step": 47156, "epoch": 568} {"train_loss": -19.436874389648438, "global_step": 47157, "epoch": 568} {"train_loss": -19.49996566772461, "global_step": 47158, "epoch": 568} {"train_loss": -18.845670700073242, "global_step": 47159, "epoch": 568} {"train_loss": -19.595151901245117, "global_step": 47160, "epoch": 568} {"train_loss": -19.731855392456055, "global_step": 47161, "epoch": 568} {"train_loss": -19.446043014526367, "global_step": 47162, "epoch": 568} {"train_loss": -19.62738800048828, "global_step": 47163, "epoch": 568} {"train_loss": -19.323827743530273, "global_step": 47164, "epoch": 568} {"train_loss": -19.433094024658203, "global_step": 47165, "epoch": 568} {"train_loss": -19.41751480102539, "global_step": 47166, "epoch": 568} {"train_loss": -19.724802017211914, "global_step": 47167, "epoch": 568} {"train_loss": -19.51371955871582, "global_step": 47168, "epoch": 568} {"train_loss": -19.679443359375, "global_step": 47169, "epoch": 568} {"train_loss": -19.557920455932617, "global_step": 47170, "epoch": 568} {"train_loss": -19.675500869750977, "global_step": 47171, "epoch": 568} {"train_loss": -19.405351638793945, "global_step": 47172, "epoch": 568} {"train_loss": -19.916336059570312, "global_step": 47173, "epoch": 568} {"train_loss": -19.374589920043945, "global_step": 47174, "epoch": 568} {"train_loss": -19.84282875061035, "global_step": 47175, "epoch": 568} {"train_loss": -19.936370849609375, "global_step": 47176, "epoch": 568} {"train_loss": -19.1961669921875, "global_step": 47177, "epoch": 568} {"train_loss": -19.691816329956055, "global_step": 47178, "epoch": 568} {"train_loss": -19.58767318725586, "global_step": 47179, "epoch": 568} {"train_loss": -19.728422164916992, "global_step": 47180, "epoch": 568} {"train_loss": -19.380136489868164, "global_step": 47181, "epoch": 568} {"train_loss": -19.87335777282715, "global_step": 47182, "epoch": 568} {"train_loss": -19.759321212768555, "global_step": 47183, "epoch": 568} {"train_loss": -19.720163345336914, "global_step": 47184, "epoch": 568} {"train_loss": -19.601301193237305, "global_step": 47185, "epoch": 568} {"train_loss": -19.333114624023438, "global_step": 47186, "epoch": 568} {"train_loss": -19.470447540283203, "global_step": 47187, "epoch": 568} {"train_loss": -19.99637794494629, "global_step": 47188, "epoch": 568} {"train_loss": -19.678098678588867, "global_step": 47189, "epoch": 568} {"train_loss": -19.663894653320312, "global_step": 47190, "epoch": 568} {"train_loss": -19.78714942932129, "global_step": 47191, "epoch": 568} {"train_loss": -19.712894439697266, "global_step": 47192, "epoch": 568} {"train_loss": -20.012529373168945, "global_step": 47193, "epoch": 568} {"train_loss": -19.951398849487305, "global_step": 47194, "epoch": 568} {"train_loss": -19.841901779174805, "global_step": 47195, "epoch": 568} {"train_loss": -19.81819725036621, "global_step": 47196, "epoch": 568} {"train_loss": -19.95978355407715, "global_step": 47197, "epoch": 568} {"train_loss": -19.813222885131836, "global_step": 47198, "epoch": 568} {"train_loss": -19.538057327270508, "global_step": 47199, "epoch": 568} {"train_loss": -19.979022979736328, "global_step": 47200, "epoch": 568} {"train_loss": -20.103599548339844, "global_step": 47201, "epoch": 568} {"train_loss": -20.225574493408203, "global_step": 47202, "epoch": 568} {"train_loss": -19.89753532409668, "global_step": 47203, "epoch": 568} {"train_loss": -19.554296493530273, "global_step": 47204, "epoch": 568} {"train_loss": -19.691604614257812, "global_step": 47205, "epoch": 568} {"train_loss": -19.5958309173584, "global_step": 47206, "epoch": 568} {"train_loss": -19.917747497558594, "global_step": 47207, "epoch": 568} {"train_loss": -19.580127716064453, "global_step": 47208, "epoch": 568} {"train_loss": -20.14997673034668, "global_step": 47209, "epoch": 568} {"train_loss": -19.576492309570312, "global_step": 47210, "epoch": 568} {"train_loss": -20.31373405456543, "global_step": 47211, "epoch": 568} {"train_loss": -20.023508071899414, "global_step": 47212, "epoch": 568} {"train_loss": -19.872852325439453, "global_step": 47213, "epoch": 568} {"train_loss": -19.881582260131836, "global_step": 47214, "epoch": 568} {"train_loss": -19.894386291503906, "global_step": 47215, "epoch": 568} {"train_loss": -20.06937026977539, "global_step": 47216, "epoch": 568} {"train_loss": -19.874048233032227, "global_step": 47217, "epoch": 568} {"train_loss": -19.68646240234375, "global_step": 47218, "epoch": 568} {"train_loss": -19.778371810913086, "global_step": 47219, "epoch": 568} {"train_loss": -19.761489868164062, "global_step": 47220, "epoch": 568} {"train_loss": -19.59840202331543, "global_step": 47221, "epoch": 568} {"train_loss": -19.83405876159668, "global_step": 47222, "epoch": 568} {"train_loss": -19.912609100341797, "global_step": 47223, "epoch": 568} {"train_loss": -20.036771774291992, "global_step": 47224, "epoch": 568} {"train_loss": -20.06705093383789, "global_step": 47225, "epoch": 568} {"train_loss": -19.682158550584173, "global_step": 47226, "epoch": 568, "val_loss": 5893483.0} {"train_loss": -19.933135986328125, "global_step": 47227, "epoch": 569} {"train_loss": -19.700040817260742, "global_step": 47228, "epoch": 569} {"train_loss": -19.97176742553711, "global_step": 47229, "epoch": 569} {"train_loss": -19.502307891845703, "global_step": 47230, "epoch": 569} {"train_loss": -20.047597885131836, "global_step": 47231, "epoch": 569} {"train_loss": -19.458763122558594, "global_step": 47232, "epoch": 569} {"train_loss": -20.107614517211914, "global_step": 47233, "epoch": 569} {"train_loss": -19.634559631347656, "global_step": 47234, "epoch": 569} {"train_loss": -19.64142417907715, "global_step": 47235, "epoch": 569} {"train_loss": -19.7343807220459, "global_step": 47236, "epoch": 569} {"train_loss": -19.739370346069336, "global_step": 47237, "epoch": 569} {"train_loss": -19.69022560119629, "global_step": 47238, "epoch": 569} {"train_loss": -19.869068145751953, "global_step": 47239, "epoch": 569} {"train_loss": -19.530256271362305, "global_step": 47240, "epoch": 569} {"train_loss": -20.089811325073242, "global_step": 47241, "epoch": 569} {"train_loss": -19.96242904663086, "global_step": 47242, "epoch": 569} {"train_loss": -19.535831451416016, "global_step": 47243, "epoch": 569} {"train_loss": -19.744943618774414, "global_step": 47244, "epoch": 569} {"train_loss": -19.898862838745117, "global_step": 47245, "epoch": 569} {"train_loss": -19.811872482299805, "global_step": 47246, "epoch": 569} {"train_loss": -19.89337158203125, "global_step": 47247, "epoch": 569} {"train_loss": -20.147659301757812, "global_step": 47248, "epoch": 569} {"train_loss": -20.00701332092285, "global_step": 47249, "epoch": 569} {"train_loss": -19.675220489501953, "global_step": 47250, "epoch": 569} {"train_loss": -19.86269187927246, "global_step": 47251, "epoch": 569} {"train_loss": -19.441436767578125, "global_step": 47252, "epoch": 569} {"train_loss": -19.959402084350586, "global_step": 47253, "epoch": 569} {"train_loss": -19.658634185791016, "global_step": 47254, "epoch": 569} {"train_loss": -19.68509292602539, "global_step": 47255, "epoch": 569} {"train_loss": -20.418201446533203, "global_step": 47256, "epoch": 569} {"train_loss": -19.802221298217773, "global_step": 47257, "epoch": 569} {"train_loss": -19.847503662109375, "global_step": 47258, "epoch": 569} {"train_loss": -20.320396423339844, "global_step": 47259, "epoch": 569} {"train_loss": -19.829574584960938, "global_step": 47260, "epoch": 569} {"train_loss": -19.420270919799805, "global_step": 47261, "epoch": 569} {"train_loss": -19.91591453552246, "global_step": 47262, "epoch": 569} {"train_loss": -19.793638229370117, "global_step": 47263, "epoch": 569} {"train_loss": -19.597991943359375, "global_step": 47264, "epoch": 569} {"train_loss": -19.431339263916016, "global_step": 47265, "epoch": 569} {"train_loss": -19.59827995300293, "global_step": 47266, "epoch": 569} {"train_loss": -20.173898696899414, "global_step": 47267, "epoch": 569} {"train_loss": -20.046649932861328, "global_step": 47268, "epoch": 569} {"train_loss": -19.739704132080078, "global_step": 47269, "epoch": 569} {"train_loss": -19.769638061523438, "global_step": 47270, "epoch": 569} {"train_loss": -19.9204044342041, "global_step": 47271, "epoch": 569} {"train_loss": -19.823638916015625, "global_step": 47272, "epoch": 569} {"train_loss": -19.758108139038086, "global_step": 47273, "epoch": 569} {"train_loss": -19.595056533813477, "global_step": 47274, "epoch": 569} {"train_loss": -19.72775650024414, "global_step": 47275, "epoch": 569} {"train_loss": -19.907068252563477, "global_step": 47276, "epoch": 569} {"train_loss": -19.420381546020508, "global_step": 47277, "epoch": 569} {"train_loss": -20.00021743774414, "global_step": 47278, "epoch": 569} {"train_loss": -19.656152725219727, "global_step": 47279, "epoch": 569} {"train_loss": -19.84720230102539, "global_step": 47280, "epoch": 569} {"train_loss": -19.696264266967773, "global_step": 47281, "epoch": 569} {"train_loss": -20.126697540283203, "global_step": 47282, "epoch": 569} {"train_loss": -20.044536590576172, "global_step": 47283, "epoch": 569} {"train_loss": -19.764102935791016, "global_step": 47284, "epoch": 569} {"train_loss": -19.42317771911621, "global_step": 47285, "epoch": 569} {"train_loss": -19.683311462402344, "global_step": 47286, "epoch": 569} {"train_loss": -19.912384033203125, "global_step": 47287, "epoch": 569} {"train_loss": -19.811233520507812, "global_step": 47288, "epoch": 569} {"train_loss": -19.660945892333984, "global_step": 47289, "epoch": 569} {"train_loss": -19.77699851989746, "global_step": 47290, "epoch": 569} {"train_loss": -19.757434844970703, "global_step": 47291, "epoch": 569} {"train_loss": -19.92156410217285, "global_step": 47292, "epoch": 569} {"train_loss": -19.6756534576416, "global_step": 47293, "epoch": 569} {"train_loss": -19.682849884033203, "global_step": 47294, "epoch": 569} {"train_loss": -20.381826400756836, "global_step": 47295, "epoch": 569} {"train_loss": -19.55204200744629, "global_step": 47296, "epoch": 569} {"train_loss": -19.9298038482666, "global_step": 47297, "epoch": 569} {"train_loss": -19.609294891357422, "global_step": 47298, "epoch": 569} {"train_loss": -19.78141212463379, "global_step": 47299, "epoch": 569} {"train_loss": -19.66603660583496, "global_step": 47300, "epoch": 569} {"train_loss": -19.916828155517578, "global_step": 47301, "epoch": 569} {"train_loss": -19.780790328979492, "global_step": 47302, "epoch": 569} {"train_loss": -19.368011474609375, "global_step": 47303, "epoch": 569} {"train_loss": -19.75455665588379, "global_step": 47304, "epoch": 569} {"train_loss": -20.077037811279297, "global_step": 47305, "epoch": 569} {"train_loss": -19.623388290405273, "global_step": 47306, "epoch": 569} {"train_loss": -19.87091064453125, "global_step": 47307, "epoch": 569} {"train_loss": -19.507190704345703, "global_step": 47308, "epoch": 569} {"train_loss": -19.780710679938995, "global_step": 47309, "epoch": 569, "val_loss": 6140876.5} {"train_loss": -19.2783203125, "global_step": 47310, "epoch": 570} {"train_loss": -19.591323852539062, "global_step": 47311, "epoch": 570} {"train_loss": -19.440584182739258, "global_step": 47312, "epoch": 570} {"train_loss": -19.459026336669922, "global_step": 47313, "epoch": 570} {"train_loss": -19.660795211791992, "global_step": 47314, "epoch": 570} {"train_loss": -19.520750045776367, "global_step": 47315, "epoch": 570} {"train_loss": -19.880229949951172, "global_step": 47316, "epoch": 570} {"train_loss": -19.943655014038086, "global_step": 47317, "epoch": 570} {"train_loss": -19.664899826049805, "global_step": 47318, "epoch": 570} {"train_loss": -19.41719627380371, "global_step": 47319, "epoch": 570} {"train_loss": -19.99146842956543, "global_step": 47320, "epoch": 570} {"train_loss": -19.91572380065918, "global_step": 47321, "epoch": 570} {"train_loss": -19.803804397583008, "global_step": 47322, "epoch": 570} {"train_loss": -19.70442771911621, "global_step": 47323, "epoch": 570} {"train_loss": -19.696725845336914, "global_step": 47324, "epoch": 570} {"train_loss": -19.61618423461914, "global_step": 47325, "epoch": 570} {"train_loss": -19.773441314697266, "global_step": 47326, "epoch": 570} {"train_loss": -19.557861328125, "global_step": 47327, "epoch": 570} {"train_loss": -19.755752563476562, "global_step": 47328, "epoch": 570} {"train_loss": -19.772680282592773, "global_step": 47329, "epoch": 570} {"train_loss": -20.118864059448242, "global_step": 47330, "epoch": 570} {"train_loss": -19.47650718688965, "global_step": 47331, "epoch": 570} {"train_loss": -19.86615753173828, "global_step": 47332, "epoch": 570} {"train_loss": -19.608577728271484, "global_step": 47333, "epoch": 570} {"train_loss": -19.73773765563965, "global_step": 47334, "epoch": 570} {"train_loss": -19.87711524963379, "global_step": 47335, "epoch": 570} {"train_loss": -19.929698944091797, "global_step": 47336, "epoch": 570} {"train_loss": -19.66333770751953, "global_step": 47337, "epoch": 570} {"train_loss": -19.594064712524414, "global_step": 47338, "epoch": 570} {"train_loss": -20.056535720825195, "global_step": 47339, "epoch": 570} {"train_loss": -19.8587589263916, "global_step": 47340, "epoch": 570} {"train_loss": -20.01734733581543, "global_step": 47341, "epoch": 570} {"train_loss": -19.663888931274414, "global_step": 47342, "epoch": 570} {"train_loss": -20.05854606628418, "global_step": 47343, "epoch": 570} {"train_loss": -19.912830352783203, "global_step": 47344, "epoch": 570} {"train_loss": -19.651538848876953, "global_step": 47345, "epoch": 570} {"train_loss": -19.678791046142578, "global_step": 47346, "epoch": 570} {"train_loss": -20.27228355407715, "global_step": 47347, "epoch": 570} {"train_loss": -19.773040771484375, "global_step": 47348, "epoch": 570} {"train_loss": -19.784589767456055, "global_step": 47349, "epoch": 570} {"train_loss": -19.778017044067383, "global_step": 47350, "epoch": 570} {"train_loss": -19.41445541381836, "global_step": 47351, "epoch": 570} {"train_loss": -19.75721549987793, "global_step": 47352, "epoch": 570} {"train_loss": -19.651185989379883, "global_step": 47353, "epoch": 570} {"train_loss": -19.581666946411133, "global_step": 47354, "epoch": 570} {"train_loss": -19.79254150390625, "global_step": 47355, "epoch": 570} {"train_loss": -19.942373275756836, "global_step": 47356, "epoch": 570} {"train_loss": -19.543699264526367, "global_step": 47357, "epoch": 570} {"train_loss": -19.787464141845703, "global_step": 47358, "epoch": 570} {"train_loss": -19.651235580444336, "global_step": 47359, "epoch": 570} {"train_loss": -19.473730087280273, "global_step": 47360, "epoch": 570} {"train_loss": -19.76195526123047, "global_step": 47361, "epoch": 570} {"train_loss": -19.715517044067383, "global_step": 47362, "epoch": 570} {"train_loss": -19.718002319335938, "global_step": 47363, "epoch": 570} {"train_loss": -19.76930809020996, "global_step": 47364, "epoch": 570} {"train_loss": -19.645681381225586, "global_step": 47365, "epoch": 570} {"train_loss": -19.8920841217041, "global_step": 47366, "epoch": 570} {"train_loss": -19.673330307006836, "global_step": 47367, "epoch": 570} {"train_loss": -19.949756622314453, "global_step": 47368, "epoch": 570} {"train_loss": -20.005451202392578, "global_step": 47369, "epoch": 570} {"train_loss": -19.8114070892334, "global_step": 47370, "epoch": 570} {"train_loss": -19.66030502319336, "global_step": 47371, "epoch": 570} {"train_loss": -20.08454704284668, "global_step": 47372, "epoch": 570} {"train_loss": -19.887577056884766, "global_step": 47373, "epoch": 570} {"train_loss": -19.6925048828125, "global_step": 47374, "epoch": 570} {"train_loss": -19.8204402923584, "global_step": 47375, "epoch": 570} {"train_loss": -19.916305541992188, "global_step": 47376, "epoch": 570} {"train_loss": -19.75826072692871, "global_step": 47377, "epoch": 570} {"train_loss": -19.9339542388916, "global_step": 47378, "epoch": 570} {"train_loss": -19.5377197265625, "global_step": 47379, "epoch": 570} {"train_loss": -19.91529655456543, "global_step": 47380, "epoch": 570} {"train_loss": -19.852325439453125, "global_step": 47381, "epoch": 570} {"train_loss": -20.03342628479004, "global_step": 47382, "epoch": 570} {"train_loss": -19.621646881103516, "global_step": 47383, "epoch": 570} {"train_loss": -19.466318130493164, "global_step": 47384, "epoch": 570} {"train_loss": -19.785497665405273, "global_step": 47385, "epoch": 570} {"train_loss": -19.975454330444336, "global_step": 47386, "epoch": 570} {"train_loss": -19.72063636779785, "global_step": 47387, "epoch": 570} {"train_loss": -19.586591720581055, "global_step": 47388, "epoch": 570} {"train_loss": -19.982261657714844, "global_step": 47389, "epoch": 570} {"train_loss": -19.744659423828125, "global_step": 47390, "epoch": 570} {"train_loss": -19.66033935546875, "global_step": 47391, "epoch": 570} {"train_loss": -19.753050218145532, "global_step": 47392, "epoch": 570, "val_loss": 5898433.5} {"train_loss": -18.629776000976562, "global_step": 47393, "epoch": 571} {"train_loss": -19.775165557861328, "global_step": 47394, "epoch": 571} {"train_loss": -19.356285095214844, "global_step": 47395, "epoch": 571} {"train_loss": -19.39264488220215, "global_step": 47396, "epoch": 571} {"train_loss": -19.372865676879883, "global_step": 47397, "epoch": 571} {"train_loss": -19.500324249267578, "global_step": 47398, "epoch": 571} {"train_loss": -19.8157958984375, "global_step": 47399, "epoch": 571} {"train_loss": -19.525897979736328, "global_step": 47400, "epoch": 571} {"train_loss": -19.31098747253418, "global_step": 47401, "epoch": 571} {"train_loss": -19.788349151611328, "global_step": 47402, "epoch": 571} {"train_loss": -19.435842514038086, "global_step": 47403, "epoch": 571} {"train_loss": -19.7000732421875, "global_step": 47404, "epoch": 571} {"train_loss": -19.42327880859375, "global_step": 47405, "epoch": 571} {"train_loss": -19.6231689453125, "global_step": 47406, "epoch": 571} {"train_loss": -19.098867416381836, "global_step": 47407, "epoch": 571} {"train_loss": -19.809667587280273, "global_step": 47408, "epoch": 571} {"train_loss": -20.074766159057617, "global_step": 47409, "epoch": 571} {"train_loss": -19.854473114013672, "global_step": 47410, "epoch": 571} {"train_loss": -19.599273681640625, "global_step": 47411, "epoch": 571} {"train_loss": -19.781557083129883, "global_step": 47412, "epoch": 571} {"train_loss": -19.62087631225586, "global_step": 47413, "epoch": 571} {"train_loss": -19.905363082885742, "global_step": 47414, "epoch": 571} {"train_loss": -19.545278549194336, "global_step": 47415, "epoch": 571} {"train_loss": -19.920642852783203, "global_step": 47416, "epoch": 571} {"train_loss": -19.875883102416992, "global_step": 47417, "epoch": 571} {"train_loss": -19.47256851196289, "global_step": 47418, "epoch": 571} {"train_loss": -19.72355079650879, "global_step": 47419, "epoch": 571} {"train_loss": -19.83978271484375, "global_step": 47420, "epoch": 571} {"train_loss": -20.035306930541992, "global_step": 47421, "epoch": 571} {"train_loss": -19.574193954467773, "global_step": 47422, "epoch": 571} {"train_loss": -19.777982711791992, "global_step": 47423, "epoch": 571} {"train_loss": -19.43111228942871, "global_step": 47424, "epoch": 571} {"train_loss": -20.249189376831055, "global_step": 47425, "epoch": 571} {"train_loss": -19.763212203979492, "global_step": 47426, "epoch": 571} {"train_loss": -19.912038803100586, "global_step": 47427, "epoch": 571} {"train_loss": -19.935388565063477, "global_step": 47428, "epoch": 571} {"train_loss": -19.91939353942871, "global_step": 47429, "epoch": 571} {"train_loss": -19.821765899658203, "global_step": 47430, "epoch": 571} {"train_loss": -19.816715240478516, "global_step": 47431, "epoch": 571} {"train_loss": -20.003026962280273, "global_step": 47432, "epoch": 571} {"train_loss": -19.76148796081543, "global_step": 47433, "epoch": 571} {"train_loss": -19.58936882019043, "global_step": 47434, "epoch": 571} {"train_loss": -19.667598724365234, "global_step": 47435, "epoch": 571} {"train_loss": -19.935678482055664, "global_step": 47436, "epoch": 571} {"train_loss": -19.37196159362793, "global_step": 47437, "epoch": 571} {"train_loss": -20.0869140625, "global_step": 47438, "epoch": 571} {"train_loss": -20.163103103637695, "global_step": 47439, "epoch": 571} {"train_loss": -19.825031280517578, "global_step": 47440, "epoch": 571} {"train_loss": -19.968652725219727, "global_step": 47441, "epoch": 571} {"train_loss": -19.963634490966797, "global_step": 47442, "epoch": 571} {"train_loss": -19.838119506835938, "global_step": 47443, "epoch": 571} {"train_loss": -19.51471710205078, "global_step": 47444, "epoch": 571} {"train_loss": -19.84981346130371, "global_step": 47445, "epoch": 571} {"train_loss": -20.320077896118164, "global_step": 47446, "epoch": 571} {"train_loss": -19.693349838256836, "global_step": 47447, "epoch": 571} {"train_loss": -19.406538009643555, "global_step": 47448, "epoch": 571} {"train_loss": -20.2237606048584, "global_step": 47449, "epoch": 571} {"train_loss": -19.875394821166992, "global_step": 47450, "epoch": 571} {"train_loss": -19.766983032226562, "global_step": 47451, "epoch": 571} {"train_loss": -19.79754638671875, "global_step": 47452, "epoch": 571} {"train_loss": -19.475086212158203, "global_step": 47453, "epoch": 571} {"train_loss": -20.251209259033203, "global_step": 47454, "epoch": 571} {"train_loss": -19.79933738708496, "global_step": 47455, "epoch": 571} {"train_loss": -19.509544372558594, "global_step": 47456, "epoch": 571} {"train_loss": -19.513656616210938, "global_step": 47457, "epoch": 571} {"train_loss": -19.673126220703125, "global_step": 47458, "epoch": 571} {"train_loss": -20.0867977142334, "global_step": 47459, "epoch": 571} {"train_loss": -19.44489288330078, "global_step": 47460, "epoch": 571} {"train_loss": -19.684181213378906, "global_step": 47461, "epoch": 571} {"train_loss": -20.164968490600586, "global_step": 47462, "epoch": 571} {"train_loss": -19.605918884277344, "global_step": 47463, "epoch": 571} {"train_loss": -19.45465087890625, "global_step": 47464, "epoch": 571} {"train_loss": -19.751358032226562, "global_step": 47465, "epoch": 571} {"train_loss": -20.06038475036621, "global_step": 47466, "epoch": 571} {"train_loss": -19.524316787719727, "global_step": 47467, "epoch": 571} {"train_loss": -20.079381942749023, "global_step": 47468, "epoch": 571} {"train_loss": -20.05690574645996, "global_step": 47469, "epoch": 571} {"train_loss": -20.20977210998535, "global_step": 47470, "epoch": 571} {"train_loss": -19.725067138671875, "global_step": 47471, "epoch": 571} {"train_loss": -19.900833129882812, "global_step": 47472, "epoch": 571} {"train_loss": -20.07310676574707, "global_step": 47473, "epoch": 571} {"train_loss": -19.532642364501953, "global_step": 47474, "epoch": 571} {"train_loss": -19.737246455916438, "global_step": 47475, "epoch": 571, "val_loss": 6059013.0} {"train_loss": -19.720596313476562, "global_step": 47476, "epoch": 572} {"train_loss": -20.322355270385742, "global_step": 47477, "epoch": 572} {"train_loss": -19.866165161132812, "global_step": 47478, "epoch": 572} {"train_loss": -19.694461822509766, "global_step": 47479, "epoch": 572} {"train_loss": -19.82222557067871, "global_step": 47480, "epoch": 572} {"train_loss": -19.742259979248047, "global_step": 47481, "epoch": 572} {"train_loss": -19.715654373168945, "global_step": 47482, "epoch": 572} {"train_loss": -19.683202743530273, "global_step": 47483, "epoch": 572} {"train_loss": -19.842599868774414, "global_step": 47484, "epoch": 572} {"train_loss": -20.151174545288086, "global_step": 47485, "epoch": 572} {"train_loss": -19.709867477416992, "global_step": 47486, "epoch": 572} {"train_loss": -19.308706283569336, "global_step": 47487, "epoch": 572} {"train_loss": -19.837793350219727, "global_step": 47488, "epoch": 572} {"train_loss": -19.972803115844727, "global_step": 47489, "epoch": 572} {"train_loss": -19.651687622070312, "global_step": 47490, "epoch": 572} {"train_loss": -19.73456382751465, "global_step": 47491, "epoch": 572} {"train_loss": -19.830852508544922, "global_step": 47492, "epoch": 572} {"train_loss": -19.891536712646484, "global_step": 47493, "epoch": 572} {"train_loss": -19.826066970825195, "global_step": 47494, "epoch": 572} {"train_loss": -20.163793563842773, "global_step": 47495, "epoch": 572} {"train_loss": -19.67588233947754, "global_step": 47496, "epoch": 572} {"train_loss": -19.599136352539062, "global_step": 47497, "epoch": 572} {"train_loss": -19.884525299072266, "global_step": 47498, "epoch": 572} {"train_loss": -19.692548751831055, "global_step": 47499, "epoch": 572} {"train_loss": -19.961267471313477, "global_step": 47500, "epoch": 572} {"train_loss": -19.436235427856445, "global_step": 47501, "epoch": 572} {"train_loss": -19.858083724975586, "global_step": 47502, "epoch": 572} {"train_loss": -19.552982330322266, "global_step": 47503, "epoch": 572} {"train_loss": -19.985092163085938, "global_step": 47504, "epoch": 572} {"train_loss": -19.932437896728516, "global_step": 47505, "epoch": 572} {"train_loss": -19.46845245361328, "global_step": 47506, "epoch": 572} {"train_loss": -19.7193660736084, "global_step": 47507, "epoch": 572} {"train_loss": -20.199270248413086, "global_step": 47508, "epoch": 572} {"train_loss": -19.5267333984375, "global_step": 47509, "epoch": 572} {"train_loss": -19.721195220947266, "global_step": 47510, "epoch": 572} {"train_loss": -20.13167381286621, "global_step": 47511, "epoch": 572} {"train_loss": -19.93492889404297, "global_step": 47512, "epoch": 572} {"train_loss": -19.59587287902832, "global_step": 47513, "epoch": 572} {"train_loss": -19.585573196411133, "global_step": 47514, "epoch": 572} {"train_loss": -20.008838653564453, "global_step": 47515, "epoch": 572} {"train_loss": -19.86689567565918, "global_step": 47516, "epoch": 572} {"train_loss": -20.260557174682617, "global_step": 47517, "epoch": 572} {"train_loss": -19.800973892211914, "global_step": 47518, "epoch": 572} {"train_loss": -19.796131134033203, "global_step": 47519, "epoch": 572} {"train_loss": -20.06415367126465, "global_step": 47520, "epoch": 572} {"train_loss": -19.84165382385254, "global_step": 47521, "epoch": 572} {"train_loss": -19.75319480895996, "global_step": 47522, "epoch": 572} {"train_loss": -19.653440475463867, "global_step": 47523, "epoch": 572} {"train_loss": -19.473438262939453, "global_step": 47524, "epoch": 572} {"train_loss": -19.702436447143555, "global_step": 47525, "epoch": 572} {"train_loss": -19.57820701599121, "global_step": 47526, "epoch": 572} {"train_loss": -19.445533752441406, "global_step": 47527, "epoch": 572} {"train_loss": -19.93523406982422, "global_step": 47528, "epoch": 572} {"train_loss": -19.547107696533203, "global_step": 47529, "epoch": 572} {"train_loss": -20.03754997253418, "global_step": 47530, "epoch": 572} {"train_loss": -19.984994888305664, "global_step": 47531, "epoch": 572} {"train_loss": -19.753726959228516, "global_step": 47532, "epoch": 572} {"train_loss": -19.878238677978516, "global_step": 47533, "epoch": 572} {"train_loss": -20.145732879638672, "global_step": 47534, "epoch": 572} {"train_loss": -19.970062255859375, "global_step": 47535, "epoch": 572} {"train_loss": -20.085086822509766, "global_step": 47536, "epoch": 572} {"train_loss": -19.551427841186523, "global_step": 47537, "epoch": 572} {"train_loss": -20.08143424987793, "global_step": 47538, "epoch": 572} {"train_loss": -19.77448081970215, "global_step": 47539, "epoch": 572} {"train_loss": -20.2101993560791, "global_step": 47540, "epoch": 572} {"train_loss": -19.542387008666992, "global_step": 47541, "epoch": 572} {"train_loss": -20.000045776367188, "global_step": 47542, "epoch": 572} {"train_loss": -20.143447875976562, "global_step": 47543, "epoch": 572} {"train_loss": -19.71799087524414, "global_step": 47544, "epoch": 572} {"train_loss": -19.75867462158203, "global_step": 47545, "epoch": 572} {"train_loss": -19.6610164642334, "global_step": 47546, "epoch": 572} {"train_loss": -19.940074920654297, "global_step": 47547, "epoch": 572} {"train_loss": -19.694631576538086, "global_step": 47548, "epoch": 572} {"train_loss": -19.990549087524414, "global_step": 47549, "epoch": 572} {"train_loss": -19.891590118408203, "global_step": 47550, "epoch": 572} {"train_loss": -19.948139190673828, "global_step": 47551, "epoch": 572} {"train_loss": -19.29819107055664, "global_step": 47552, "epoch": 572} {"train_loss": -19.923954010009766, "global_step": 47553, "epoch": 572} {"train_loss": -19.885663986206055, "global_step": 47554, "epoch": 572} {"train_loss": -19.642322540283203, "global_step": 47555, "epoch": 572} {"train_loss": -19.766834259033203, "global_step": 47556, "epoch": 572} {"train_loss": -19.639806747436523, "global_step": 47557, "epoch": 572} {"train_loss": -19.805325519607727, "global_step": 47558, "epoch": 572, "val_loss": 6191989.5} {"train_loss": -19.20355224609375, "global_step": 47559, "epoch": 573} {"train_loss": -19.50038719177246, "global_step": 47560, "epoch": 573} {"train_loss": -19.504926681518555, "global_step": 47561, "epoch": 573} {"train_loss": -19.741037368774414, "global_step": 47562, "epoch": 573} {"train_loss": -19.138763427734375, "global_step": 47563, "epoch": 573} {"train_loss": -19.416133880615234, "global_step": 47564, "epoch": 573} {"train_loss": -19.412443161010742, "global_step": 47565, "epoch": 573} {"train_loss": -19.538925170898438, "global_step": 47566, "epoch": 573} {"train_loss": -19.587711334228516, "global_step": 47567, "epoch": 573} {"train_loss": -19.82154655456543, "global_step": 47568, "epoch": 573} {"train_loss": -19.68906593322754, "global_step": 47569, "epoch": 573} {"train_loss": -19.556533813476562, "global_step": 47570, "epoch": 573} {"train_loss": -19.237415313720703, "global_step": 47571, "epoch": 573} {"train_loss": -19.26204490661621, "global_step": 47572, "epoch": 573} {"train_loss": -19.870508193969727, "global_step": 47573, "epoch": 573} {"train_loss": -19.36219024658203, "global_step": 47574, "epoch": 573} {"train_loss": -19.58612632751465, "global_step": 47575, "epoch": 573} {"train_loss": -19.863475799560547, "global_step": 47576, "epoch": 573} {"train_loss": -19.965417861938477, "global_step": 47577, "epoch": 573} {"train_loss": -19.890213012695312, "global_step": 47578, "epoch": 573} {"train_loss": -19.418954849243164, "global_step": 47579, "epoch": 573} {"train_loss": -19.64731788635254, "global_step": 47580, "epoch": 573} {"train_loss": -19.89847183227539, "global_step": 47581, "epoch": 573} {"train_loss": -19.55377769470215, "global_step": 47582, "epoch": 573} {"train_loss": -19.880340576171875, "global_step": 47583, "epoch": 573} {"train_loss": -19.69287109375, "global_step": 47584, "epoch": 573} {"train_loss": -19.527360916137695, "global_step": 47585, "epoch": 573} {"train_loss": -20.047317504882812, "global_step": 47586, "epoch": 573} {"train_loss": -19.853519439697266, "global_step": 47587, "epoch": 573} {"train_loss": -19.842121124267578, "global_step": 47588, "epoch": 573} {"train_loss": -19.203433990478516, "global_step": 47589, "epoch": 573} {"train_loss": -19.630027770996094, "global_step": 47590, "epoch": 573} {"train_loss": -19.914661407470703, "global_step": 47591, "epoch": 573} {"train_loss": -20.1577205657959, "global_step": 47592, "epoch": 573} {"train_loss": -19.983606338500977, "global_step": 47593, "epoch": 573} {"train_loss": -19.899457931518555, "global_step": 47594, "epoch": 573} {"train_loss": -20.023305892944336, "global_step": 47595, "epoch": 573} {"train_loss": -19.705839157104492, "global_step": 47596, "epoch": 573} {"train_loss": -19.76228141784668, "global_step": 47597, "epoch": 573} {"train_loss": -19.74749183654785, "global_step": 47598, "epoch": 573} {"train_loss": -19.962072372436523, "global_step": 47599, "epoch": 573} {"train_loss": -19.7348690032959, "global_step": 47600, "epoch": 573} {"train_loss": -19.83538818359375, "global_step": 47601, "epoch": 573} {"train_loss": -19.820852279663086, "global_step": 47602, "epoch": 573} {"train_loss": -20.075626373291016, "global_step": 47603, "epoch": 573} {"train_loss": -19.43669319152832, "global_step": 47604, "epoch": 573} {"train_loss": -19.922901153564453, "global_step": 47605, "epoch": 573} {"train_loss": -20.028362274169922, "global_step": 47606, "epoch": 573} {"train_loss": -19.89991569519043, "global_step": 47607, "epoch": 573} {"train_loss": -19.96197509765625, "global_step": 47608, "epoch": 573} {"train_loss": -19.495386123657227, "global_step": 47609, "epoch": 573} {"train_loss": -19.743520736694336, "global_step": 47610, "epoch": 573} {"train_loss": -19.672407150268555, "global_step": 47611, "epoch": 573} {"train_loss": -19.75351905822754, "global_step": 47612, "epoch": 573} {"train_loss": -19.608003616333008, "global_step": 47613, "epoch": 573} {"train_loss": -19.771459579467773, "global_step": 47614, "epoch": 573} {"train_loss": -19.694395065307617, "global_step": 47615, "epoch": 573} {"train_loss": -20.072357177734375, "global_step": 47616, "epoch": 573} {"train_loss": -19.809864044189453, "global_step": 47617, "epoch": 573} {"train_loss": -19.700054168701172, "global_step": 47618, "epoch": 573} {"train_loss": -19.864171981811523, "global_step": 47619, "epoch": 573} {"train_loss": -19.69894790649414, "global_step": 47620, "epoch": 573} {"train_loss": -19.906511306762695, "global_step": 47621, "epoch": 573} {"train_loss": -19.866491317749023, "global_step": 47622, "epoch": 573} {"train_loss": -19.77777671813965, "global_step": 47623, "epoch": 573} {"train_loss": -19.98715591430664, "global_step": 47624, "epoch": 573} {"train_loss": -19.489582061767578, "global_step": 47625, "epoch": 573} {"train_loss": -19.6861515045166, "global_step": 47626, "epoch": 573} {"train_loss": -19.732772827148438, "global_step": 47627, "epoch": 573} {"train_loss": -19.98025131225586, "global_step": 47628, "epoch": 573} {"train_loss": -19.974565505981445, "global_step": 47629, "epoch": 573} {"train_loss": -19.351770401000977, "global_step": 47630, "epoch": 573} {"train_loss": -19.861635208129883, "global_step": 47631, "epoch": 573} {"train_loss": -19.94571876525879, "global_step": 47632, "epoch": 573} {"train_loss": -20.024606704711914, "global_step": 47633, "epoch": 573} {"train_loss": -19.8221492767334, "global_step": 47634, "epoch": 573} {"train_loss": -19.671703338623047, "global_step": 47635, "epoch": 573} {"train_loss": -19.651447296142578, "global_step": 47636, "epoch": 573} {"train_loss": -19.8905086517334, "global_step": 47637, "epoch": 573} {"train_loss": -20.00884246826172, "global_step": 47638, "epoch": 573} {"train_loss": -19.665281295776367, "global_step": 47639, "epoch": 573} {"train_loss": -20.14794921875, "global_step": 47640, "epoch": 573} {"train_loss": -19.747073736535498, "global_step": 47641, "epoch": 573, "val_loss": 5965606.0} {"train_loss": -19.580759048461914, "global_step": 47642, "epoch": 574} {"train_loss": -19.58335304260254, "global_step": 47643, "epoch": 574} {"train_loss": -19.666582107543945, "global_step": 47644, "epoch": 574} {"train_loss": -19.660768508911133, "global_step": 47645, "epoch": 574} {"train_loss": -19.728443145751953, "global_step": 47646, "epoch": 574} {"train_loss": -19.717960357666016, "global_step": 47647, "epoch": 574} {"train_loss": -19.691030502319336, "global_step": 47648, "epoch": 574} {"train_loss": -19.40266227722168, "global_step": 47649, "epoch": 574} {"train_loss": -19.732954025268555, "global_step": 47650, "epoch": 574} {"train_loss": -19.92067527770996, "global_step": 47651, "epoch": 574} {"train_loss": -19.520858764648438, "global_step": 47652, "epoch": 574} {"train_loss": -19.644235610961914, "global_step": 47653, "epoch": 574} {"train_loss": -19.56379508972168, "global_step": 47654, "epoch": 574} {"train_loss": -19.820281982421875, "global_step": 47655, "epoch": 574} {"train_loss": -19.56241226196289, "global_step": 47656, "epoch": 574} {"train_loss": -19.439529418945312, "global_step": 47657, "epoch": 574} {"train_loss": -19.85291290283203, "global_step": 47658, "epoch": 574} {"train_loss": -19.793439865112305, "global_step": 47659, "epoch": 574} {"train_loss": -20.005170822143555, "global_step": 47660, "epoch": 574} {"train_loss": -20.1021785736084, "global_step": 47661, "epoch": 574} {"train_loss": -19.87787437438965, "global_step": 47662, "epoch": 574} {"train_loss": -20.0155086517334, "global_step": 47663, "epoch": 574} {"train_loss": -19.7092227935791, "global_step": 47664, "epoch": 574} {"train_loss": -20.236215591430664, "global_step": 47665, "epoch": 574} {"train_loss": -19.67865562438965, "global_step": 47666, "epoch": 574} {"train_loss": -19.99458885192871, "global_step": 47667, "epoch": 574} {"train_loss": -19.96650505065918, "global_step": 47668, "epoch": 574} {"train_loss": -20.274831771850586, "global_step": 47669, "epoch": 574} {"train_loss": -19.878355026245117, "global_step": 47670, "epoch": 574} {"train_loss": -20.060022354125977, "global_step": 47671, "epoch": 574} {"train_loss": -19.538511276245117, "global_step": 47672, "epoch": 574} {"train_loss": -19.9141845703125, "global_step": 47673, "epoch": 574} {"train_loss": -19.458282470703125, "global_step": 47674, "epoch": 574} {"train_loss": -19.852697372436523, "global_step": 47675, "epoch": 574} {"train_loss": -19.2106876373291, "global_step": 47676, "epoch": 574} {"train_loss": -19.710311889648438, "global_step": 47677, "epoch": 574} {"train_loss": -20.01220703125, "global_step": 47678, "epoch": 574} {"train_loss": -19.936481475830078, "global_step": 47679, "epoch": 574} {"train_loss": -19.927387237548828, "global_step": 47680, "epoch": 574} {"train_loss": -19.733747482299805, "global_step": 47681, "epoch": 574} {"train_loss": -19.7813720703125, "global_step": 47682, "epoch": 574} {"train_loss": -20.05525016784668, "global_step": 47683, "epoch": 574} {"train_loss": -19.8170166015625, "global_step": 47684, "epoch": 574} {"train_loss": -20.0523681640625, "global_step": 47685, "epoch": 574} {"train_loss": -19.714590072631836, "global_step": 47686, "epoch": 574} {"train_loss": -19.828815460205078, "global_step": 47687, "epoch": 574} {"train_loss": -19.83028793334961, "global_step": 47688, "epoch": 574} {"train_loss": -19.758468627929688, "global_step": 47689, "epoch": 574} {"train_loss": -19.793987274169922, "global_step": 47690, "epoch": 574} {"train_loss": -19.93255043029785, "global_step": 47691, "epoch": 574} {"train_loss": -19.79204750061035, "global_step": 47692, "epoch": 574} {"train_loss": -20.184324264526367, "global_step": 47693, "epoch": 574} {"train_loss": -19.960542678833008, "global_step": 47694, "epoch": 574} {"train_loss": -19.610593795776367, "global_step": 47695, "epoch": 574} {"train_loss": -19.871057510375977, "global_step": 47696, "epoch": 574} {"train_loss": -19.965559005737305, "global_step": 47697, "epoch": 574} {"train_loss": -19.865930557250977, "global_step": 47698, "epoch": 574} {"train_loss": -19.84937858581543, "global_step": 47699, "epoch": 574} {"train_loss": -20.308849334716797, "global_step": 47700, "epoch": 574} {"train_loss": -19.834760665893555, "global_step": 47701, "epoch": 574} {"train_loss": -19.721771240234375, "global_step": 47702, "epoch": 574} {"train_loss": -19.736581802368164, "global_step": 47703, "epoch": 574} {"train_loss": -19.744319915771484, "global_step": 47704, "epoch": 574} {"train_loss": -19.779300689697266, "global_step": 47705, "epoch": 574} {"train_loss": -20.016340255737305, "global_step": 47706, "epoch": 574} {"train_loss": -19.93947410583496, "global_step": 47707, "epoch": 574} {"train_loss": -19.690725326538086, "global_step": 47708, "epoch": 574} {"train_loss": -20.07465362548828, "global_step": 47709, "epoch": 574} {"train_loss": -19.812545776367188, "global_step": 47710, "epoch": 574} {"train_loss": -19.84178924560547, "global_step": 47711, "epoch": 574} {"train_loss": -19.738784790039062, "global_step": 47712, "epoch": 574} {"train_loss": -19.717235565185547, "global_step": 47713, "epoch": 574} {"train_loss": -19.88917350769043, "global_step": 47714, "epoch": 574} {"train_loss": -19.85025978088379, "global_step": 47715, "epoch": 574} {"train_loss": -19.94990348815918, "global_step": 47716, "epoch": 574} {"train_loss": -20.233747482299805, "global_step": 47717, "epoch": 574} {"train_loss": -19.871313095092773, "global_step": 47718, "epoch": 574} {"train_loss": -19.862384796142578, "global_step": 47719, "epoch": 574} {"train_loss": -20.04217529296875, "global_step": 47720, "epoch": 574} {"train_loss": -19.72639274597168, "global_step": 47721, "epoch": 574} {"train_loss": -20.262466430664062, "global_step": 47722, "epoch": 574} {"train_loss": -19.955453872680664, "global_step": 47723, "epoch": 574} {"train_loss": -19.84092202244035, "global_step": 47724, "epoch": 574, "val_loss": 5919207.0} {"train_loss": -19.577260971069336, "global_step": 47725, "epoch": 575} {"train_loss": -19.96856117248535, "global_step": 47726, "epoch": 575} {"train_loss": -19.96762466430664, "global_step": 47727, "epoch": 575} {"train_loss": -19.376798629760742, "global_step": 47728, "epoch": 575} {"train_loss": -19.632427215576172, "global_step": 47729, "epoch": 575} {"train_loss": -19.586692810058594, "global_step": 47730, "epoch": 575} {"train_loss": -19.635190963745117, "global_step": 47731, "epoch": 575} {"train_loss": -20.03496742248535, "global_step": 47732, "epoch": 575} {"train_loss": -19.635005950927734, "global_step": 47733, "epoch": 575} {"train_loss": -19.90540313720703, "global_step": 47734, "epoch": 575} {"train_loss": -19.384212493896484, "global_step": 47735, "epoch": 575} {"train_loss": -19.433866500854492, "global_step": 47736, "epoch": 575} {"train_loss": -19.7629337310791, "global_step": 47737, "epoch": 575} {"train_loss": -19.534046173095703, "global_step": 47738, "epoch": 575} {"train_loss": -19.719829559326172, "global_step": 47739, "epoch": 575} {"train_loss": -19.625329971313477, "global_step": 47740, "epoch": 575} {"train_loss": -19.976428985595703, "global_step": 47741, "epoch": 575} {"train_loss": -19.556039810180664, "global_step": 47742, "epoch": 575} {"train_loss": -19.603199005126953, "global_step": 47743, "epoch": 575} {"train_loss": -20.219053268432617, "global_step": 47744, "epoch": 575} {"train_loss": -19.58835220336914, "global_step": 47745, "epoch": 575} {"train_loss": -19.56808090209961, "global_step": 47746, "epoch": 575} {"train_loss": -19.873350143432617, "global_step": 47747, "epoch": 575} {"train_loss": -19.80230140686035, "global_step": 47748, "epoch": 575} {"train_loss": -19.89270782470703, "global_step": 47749, "epoch": 575} {"train_loss": -20.160673141479492, "global_step": 47750, "epoch": 575} {"train_loss": -19.692062377929688, "global_step": 47751, "epoch": 575} {"train_loss": -19.782224655151367, "global_step": 47752, "epoch": 575} {"train_loss": -20.222152709960938, "global_step": 47753, "epoch": 575} {"train_loss": -19.83066749572754, "global_step": 47754, "epoch": 575} {"train_loss": -19.54646110534668, "global_step": 47755, "epoch": 575} {"train_loss": -19.619592666625977, "global_step": 47756, "epoch": 575} {"train_loss": -19.6674747467041, "global_step": 47757, "epoch": 575} {"train_loss": -20.350723266601562, "global_step": 47758, "epoch": 575} {"train_loss": -20.084243774414062, "global_step": 47759, "epoch": 575} {"train_loss": -19.630712509155273, "global_step": 47760, "epoch": 575} {"train_loss": -19.756179809570312, "global_step": 47761, "epoch": 575} {"train_loss": -20.086652755737305, "global_step": 47762, "epoch": 575} {"train_loss": -19.916173934936523, "global_step": 47763, "epoch": 575} {"train_loss": -19.399951934814453, "global_step": 47764, "epoch": 575} {"train_loss": -19.957429885864258, "global_step": 47765, "epoch": 575} {"train_loss": -19.807802200317383, "global_step": 47766, "epoch": 575} {"train_loss": -20.15765953063965, "global_step": 47767, "epoch": 575} {"train_loss": -19.849302291870117, "global_step": 47768, "epoch": 575} {"train_loss": -19.811132431030273, "global_step": 47769, "epoch": 575} {"train_loss": -19.726713180541992, "global_step": 47770, "epoch": 575} {"train_loss": -19.743722915649414, "global_step": 47771, "epoch": 575} {"train_loss": -19.424890518188477, "global_step": 47772, "epoch": 575} {"train_loss": -19.50950813293457, "global_step": 47773, "epoch": 575} {"train_loss": -20.03565788269043, "global_step": 47774, "epoch": 575} {"train_loss": -19.744531631469727, "global_step": 47775, "epoch": 575} {"train_loss": -20.001018524169922, "global_step": 47776, "epoch": 575} {"train_loss": -19.901159286499023, "global_step": 47777, "epoch": 575} {"train_loss": -19.715225219726562, "global_step": 47778, "epoch": 575} {"train_loss": -19.8662052154541, "global_step": 47779, "epoch": 575} {"train_loss": -19.747940063476562, "global_step": 47780, "epoch": 575} {"train_loss": -19.97541618347168, "global_step": 47781, "epoch": 575} {"train_loss": -20.270782470703125, "global_step": 47782, "epoch": 575} {"train_loss": -19.871061325073242, "global_step": 47783, "epoch": 575} {"train_loss": -19.69627571105957, "global_step": 47784, "epoch": 575} {"train_loss": -20.152435302734375, "global_step": 47785, "epoch": 575} {"train_loss": -19.835468292236328, "global_step": 47786, "epoch": 575} {"train_loss": -19.82942008972168, "global_step": 47787, "epoch": 575} {"train_loss": -19.946691513061523, "global_step": 47788, "epoch": 575} {"train_loss": -20.02535057067871, "global_step": 47789, "epoch": 575} {"train_loss": -19.92707633972168, "global_step": 47790, "epoch": 575} {"train_loss": -19.735013961791992, "global_step": 47791, "epoch": 575} {"train_loss": -19.9272518157959, "global_step": 47792, "epoch": 575} {"train_loss": -19.652490615844727, "global_step": 47793, "epoch": 575} {"train_loss": -20.005451202392578, "global_step": 47794, "epoch": 575} {"train_loss": -20.247909545898438, "global_step": 47795, "epoch": 575} {"train_loss": -19.727294921875, "global_step": 47796, "epoch": 575} {"train_loss": -19.892494201660156, "global_step": 47797, "epoch": 575} {"train_loss": -19.734235763549805, "global_step": 47798, "epoch": 575} {"train_loss": -19.688833236694336, "global_step": 47799, "epoch": 575} {"train_loss": -19.975849151611328, "global_step": 47800, "epoch": 575} {"train_loss": -19.904953002929688, "global_step": 47801, "epoch": 575} {"train_loss": -20.037694931030273, "global_step": 47802, "epoch": 575} {"train_loss": -20.09543228149414, "global_step": 47803, "epoch": 575} {"train_loss": -20.05202293395996, "global_step": 47804, "epoch": 575} {"train_loss": -19.809762954711914, "global_step": 47805, "epoch": 575} {"train_loss": -20.075281143188477, "global_step": 47806, "epoch": 575} {"train_loss": -19.84558753507683, "global_step": 47807, "epoch": 575, "val_loss": 6030813.5} {"train_loss": -19.456501007080078, "global_step": 47808, "epoch": 576} {"train_loss": -19.835968017578125, "global_step": 47809, "epoch": 576} {"train_loss": -19.648441314697266, "global_step": 47810, "epoch": 576} {"train_loss": -19.65156364440918, "global_step": 47811, "epoch": 576} {"train_loss": -19.64264488220215, "global_step": 47812, "epoch": 576} {"train_loss": -19.997461318969727, "global_step": 47813, "epoch": 576} {"train_loss": -19.67304801940918, "global_step": 47814, "epoch": 576} {"train_loss": -19.67828941345215, "global_step": 47815, "epoch": 576} {"train_loss": -19.492788314819336, "global_step": 47816, "epoch": 576} {"train_loss": -19.788955688476562, "global_step": 47817, "epoch": 576} {"train_loss": -19.933616638183594, "global_step": 47818, "epoch": 576} {"train_loss": -19.611093521118164, "global_step": 47819, "epoch": 576} {"train_loss": -19.720914840698242, "global_step": 47820, "epoch": 576} {"train_loss": -19.74428367614746, "global_step": 47821, "epoch": 576} {"train_loss": -19.593542098999023, "global_step": 47822, "epoch": 576} {"train_loss": -19.657211303710938, "global_step": 47823, "epoch": 576} {"train_loss": -19.860036849975586, "global_step": 47824, "epoch": 576} {"train_loss": -19.71504783630371, "global_step": 47825, "epoch": 576} {"train_loss": -19.845279693603516, "global_step": 47826, "epoch": 576} {"train_loss": -19.464658737182617, "global_step": 47827, "epoch": 576} {"train_loss": -19.971227645874023, "global_step": 47828, "epoch": 576} {"train_loss": -19.472278594970703, "global_step": 47829, "epoch": 576} {"train_loss": -19.79327964782715, "global_step": 47830, "epoch": 576} {"train_loss": -20.003965377807617, "global_step": 47831, "epoch": 576} {"train_loss": -19.623624801635742, "global_step": 47832, "epoch": 576} {"train_loss": -19.826492309570312, "global_step": 47833, "epoch": 576} {"train_loss": -19.56888198852539, "global_step": 47834, "epoch": 576} {"train_loss": -19.774089813232422, "global_step": 47835, "epoch": 576} {"train_loss": -19.826868057250977, "global_step": 47836, "epoch": 576} {"train_loss": -19.7271728515625, "global_step": 47837, "epoch": 576} {"train_loss": -19.98017692565918, "global_step": 47838, "epoch": 576} {"train_loss": -19.742244720458984, "global_step": 47839, "epoch": 576} {"train_loss": -19.932973861694336, "global_step": 47840, "epoch": 576} {"train_loss": -19.839950561523438, "global_step": 47841, "epoch": 576} {"train_loss": -20.0371036529541, "global_step": 47842, "epoch": 576} {"train_loss": -20.158599853515625, "global_step": 47843, "epoch": 576} {"train_loss": -20.01744842529297, "global_step": 47844, "epoch": 576} {"train_loss": -20.144697189331055, "global_step": 47845, "epoch": 576} {"train_loss": -19.902860641479492, "global_step": 47846, "epoch": 576} {"train_loss": -19.69437026977539, "global_step": 47847, "epoch": 576} {"train_loss": -19.897083282470703, "global_step": 47848, "epoch": 576} {"train_loss": -19.834766387939453, "global_step": 47849, "epoch": 576} {"train_loss": -19.863910675048828, "global_step": 47850, "epoch": 576} {"train_loss": -19.86343765258789, "global_step": 47851, "epoch": 576} {"train_loss": -19.801671981811523, "global_step": 47852, "epoch": 576} {"train_loss": -20.220386505126953, "global_step": 47853, "epoch": 576} {"train_loss": -20.002403259277344, "global_step": 47854, "epoch": 576} {"train_loss": -19.52906608581543, "global_step": 47855, "epoch": 576} {"train_loss": -19.652328491210938, "global_step": 47856, "epoch": 576} {"train_loss": -20.034381866455078, "global_step": 47857, "epoch": 576} {"train_loss": -20.185150146484375, "global_step": 47858, "epoch": 576} {"train_loss": -19.71101188659668, "global_step": 47859, "epoch": 576} {"train_loss": -19.116397857666016, "global_step": 47860, "epoch": 576} {"train_loss": -20.114885330200195, "global_step": 47861, "epoch": 576} {"train_loss": -19.862905502319336, "global_step": 47862, "epoch": 576} {"train_loss": -19.824880599975586, "global_step": 47863, "epoch": 576} {"train_loss": -19.85251808166504, "global_step": 47864, "epoch": 576} {"train_loss": -19.64299201965332, "global_step": 47865, "epoch": 576} {"train_loss": -19.77837562561035, "global_step": 47866, "epoch": 576} {"train_loss": -19.916873931884766, "global_step": 47867, "epoch": 576} {"train_loss": -20.028425216674805, "global_step": 47868, "epoch": 576} {"train_loss": -19.86368179321289, "global_step": 47869, "epoch": 576} {"train_loss": -20.166549682617188, "global_step": 47870, "epoch": 576} {"train_loss": -19.59746742248535, "global_step": 47871, "epoch": 576} {"train_loss": -19.765714645385742, "global_step": 47872, "epoch": 576} {"train_loss": -19.91229820251465, "global_step": 47873, "epoch": 576} {"train_loss": -19.54610252380371, "global_step": 47874, "epoch": 576} {"train_loss": -19.821584701538086, "global_step": 47875, "epoch": 576} {"train_loss": -20.228851318359375, "global_step": 47876, "epoch": 576} {"train_loss": -20.189655303955078, "global_step": 47877, "epoch": 576} {"train_loss": -19.84755516052246, "global_step": 47878, "epoch": 576} {"train_loss": -19.8196964263916, "global_step": 47879, "epoch": 576} {"train_loss": -19.788333892822266, "global_step": 47880, "epoch": 576} {"train_loss": -20.013212203979492, "global_step": 47881, "epoch": 576} {"train_loss": -19.681381225585938, "global_step": 47882, "epoch": 576} {"train_loss": -19.66895294189453, "global_step": 47883, "epoch": 576} {"train_loss": -19.696033477783203, "global_step": 47884, "epoch": 576} {"train_loss": -19.981613159179688, "global_step": 47885, "epoch": 576} {"train_loss": -19.79779624938965, "global_step": 47886, "epoch": 576} {"train_loss": -19.685688018798828, "global_step": 47887, "epoch": 576} {"train_loss": -20.100040435791016, "global_step": 47888, "epoch": 576} {"train_loss": -19.736255645751953, "global_step": 47889, "epoch": 576} {"train_loss": -19.80571420508695, "global_step": 47890, "epoch": 576, "val_loss": 5912382.0} {"train_loss": -19.79020118713379, "global_step": 47891, "epoch": 577} {"train_loss": -20.058155059814453, "global_step": 47892, "epoch": 577} {"train_loss": -19.446744918823242, "global_step": 47893, "epoch": 577} {"train_loss": -19.750625610351562, "global_step": 47894, "epoch": 577} {"train_loss": -19.573593139648438, "global_step": 47895, "epoch": 577} {"train_loss": -19.81945037841797, "global_step": 47896, "epoch": 577} {"train_loss": -19.819902420043945, "global_step": 47897, "epoch": 577} {"train_loss": -19.913293838500977, "global_step": 47898, "epoch": 577} {"train_loss": -19.68023681640625, "global_step": 47899, "epoch": 577} {"train_loss": -19.82679557800293, "global_step": 47900, "epoch": 577} {"train_loss": -19.711191177368164, "global_step": 47901, "epoch": 577} {"train_loss": -19.711637496948242, "global_step": 47902, "epoch": 577} {"train_loss": -20.03447723388672, "global_step": 47903, "epoch": 577} {"train_loss": -19.809284210205078, "global_step": 47904, "epoch": 577} {"train_loss": -20.253971099853516, "global_step": 47905, "epoch": 577} {"train_loss": -19.744892120361328, "global_step": 47906, "epoch": 577} {"train_loss": -20.008426666259766, "global_step": 47907, "epoch": 577} {"train_loss": -19.688716888427734, "global_step": 47908, "epoch": 577} {"train_loss": -19.675273895263672, "global_step": 47909, "epoch": 577} {"train_loss": -19.494482040405273, "global_step": 47910, "epoch": 577} {"train_loss": -20.195871353149414, "global_step": 47911, "epoch": 577} {"train_loss": -19.675039291381836, "global_step": 47912, "epoch": 577} {"train_loss": -19.999692916870117, "global_step": 47913, "epoch": 577} {"train_loss": -19.827890396118164, "global_step": 47914, "epoch": 577} {"train_loss": -19.58974266052246, "global_step": 47915, "epoch": 577} {"train_loss": -19.418298721313477, "global_step": 47916, "epoch": 577} {"train_loss": -20.082809448242188, "global_step": 47917, "epoch": 577} {"train_loss": -20.10400390625, "global_step": 47918, "epoch": 577} {"train_loss": -19.628185272216797, "global_step": 47919, "epoch": 577} {"train_loss": -19.394582748413086, "global_step": 47920, "epoch": 577} {"train_loss": -19.716373443603516, "global_step": 47921, "epoch": 577} {"train_loss": -19.803796768188477, "global_step": 47922, "epoch": 577} {"train_loss": -19.661500930786133, "global_step": 47923, "epoch": 577} {"train_loss": -19.8407039642334, "global_step": 47924, "epoch": 577} {"train_loss": -19.863183975219727, "global_step": 47925, "epoch": 577} {"train_loss": -20.070077896118164, "global_step": 47926, "epoch": 577} {"train_loss": -19.659780502319336, "global_step": 47927, "epoch": 577} {"train_loss": -20.019521713256836, "global_step": 47928, "epoch": 577} {"train_loss": -19.901090621948242, "global_step": 47929, "epoch": 577} {"train_loss": -19.821027755737305, "global_step": 47930, "epoch": 577} {"train_loss": -19.70046043395996, "global_step": 47931, "epoch": 577} {"train_loss": -20.111940383911133, "global_step": 47932, "epoch": 577} {"train_loss": -19.976642608642578, "global_step": 47933, "epoch": 577} {"train_loss": -19.599031448364258, "global_step": 47934, "epoch": 577} {"train_loss": -19.762969970703125, "global_step": 47935, "epoch": 577} {"train_loss": -19.970426559448242, "global_step": 47936, "epoch": 577} {"train_loss": -19.848936080932617, "global_step": 47937, "epoch": 577} {"train_loss": -19.801151275634766, "global_step": 47938, "epoch": 577} {"train_loss": -19.82697868347168, "global_step": 47939, "epoch": 577} {"train_loss": -19.66640281677246, "global_step": 47940, "epoch": 577} {"train_loss": -19.690013885498047, "global_step": 47941, "epoch": 577} {"train_loss": -19.470754623413086, "global_step": 47942, "epoch": 577} {"train_loss": -20.112483978271484, "global_step": 47943, "epoch": 577} {"train_loss": -19.727645874023438, "global_step": 47944, "epoch": 577} {"train_loss": -19.739816665649414, "global_step": 47945, "epoch": 577} {"train_loss": -19.83510971069336, "global_step": 47946, "epoch": 577} {"train_loss": -19.661787033081055, "global_step": 47947, "epoch": 577} {"train_loss": -19.553783416748047, "global_step": 47948, "epoch": 577} {"train_loss": -19.903348922729492, "global_step": 47949, "epoch": 577} {"train_loss": -20.028043746948242, "global_step": 47950, "epoch": 577} {"train_loss": -19.952051162719727, "global_step": 47951, "epoch": 577} {"train_loss": -19.854089736938477, "global_step": 47952, "epoch": 577} {"train_loss": -19.63610076904297, "global_step": 47953, "epoch": 577} {"train_loss": -19.879592895507812, "global_step": 47954, "epoch": 577} {"train_loss": -20.135374069213867, "global_step": 47955, "epoch": 577} {"train_loss": -20.147842407226562, "global_step": 47956, "epoch": 577} {"train_loss": -20.1057071685791, "global_step": 47957, "epoch": 577} {"train_loss": -19.686016082763672, "global_step": 47958, "epoch": 577} {"train_loss": -19.72932243347168, "global_step": 47959, "epoch": 577} {"train_loss": -19.720792770385742, "global_step": 47960, "epoch": 577} {"train_loss": -19.59905433654785, "global_step": 47961, "epoch": 577} {"train_loss": -19.70265769958496, "global_step": 47962, "epoch": 577} {"train_loss": -20.18474578857422, "global_step": 47963, "epoch": 577} {"train_loss": -19.483409881591797, "global_step": 47964, "epoch": 577} {"train_loss": -19.65266227722168, "global_step": 47965, "epoch": 577} {"train_loss": -20.200439453125, "global_step": 47966, "epoch": 577} {"train_loss": -19.76795768737793, "global_step": 47967, "epoch": 577} {"train_loss": -19.845373153686523, "global_step": 47968, "epoch": 577} {"train_loss": -19.61446189880371, "global_step": 47969, "epoch": 577} {"train_loss": -19.81300163269043, "global_step": 47970, "epoch": 577} {"train_loss": -19.833877563476562, "global_step": 47971, "epoch": 577} {"train_loss": -19.760845184326172, "global_step": 47972, "epoch": 577} {"train_loss": -19.810298161334302, "global_step": 47973, "epoch": 577, "val_loss": 5932281.0} {"train_loss": -20.135595321655273, "global_step": 47974, "epoch": 578} {"train_loss": -19.83551597595215, "global_step": 47975, "epoch": 578} {"train_loss": -19.789688110351562, "global_step": 47976, "epoch": 578} {"train_loss": -19.896703720092773, "global_step": 47977, "epoch": 578} {"train_loss": -19.9990234375, "global_step": 47978, "epoch": 578} {"train_loss": -19.78571891784668, "global_step": 47979, "epoch": 578} {"train_loss": -20.12759780883789, "global_step": 47980, "epoch": 578} {"train_loss": -19.881744384765625, "global_step": 47981, "epoch": 578} {"train_loss": -19.6706485748291, "global_step": 47982, "epoch": 578} {"train_loss": -19.654680252075195, "global_step": 47983, "epoch": 578} {"train_loss": -19.81963348388672, "global_step": 47984, "epoch": 578} {"train_loss": -20.01265525817871, "global_step": 47985, "epoch": 578} {"train_loss": -19.835372924804688, "global_step": 47986, "epoch": 578} {"train_loss": -20.11457633972168, "global_step": 47987, "epoch": 578} {"train_loss": -19.7496395111084, "global_step": 47988, "epoch": 578} {"train_loss": -20.154651641845703, "global_step": 47989, "epoch": 578} {"train_loss": -19.8367862701416, "global_step": 47990, "epoch": 578} {"train_loss": -19.759231567382812, "global_step": 47991, "epoch": 578} {"train_loss": -19.87000846862793, "global_step": 47992, "epoch": 578} {"train_loss": -20.005239486694336, "global_step": 47993, "epoch": 578} {"train_loss": -20.060163497924805, "global_step": 47994, "epoch": 578} {"train_loss": -19.884199142456055, "global_step": 47995, "epoch": 578} {"train_loss": -19.445241928100586, "global_step": 47996, "epoch": 578} {"train_loss": -19.6551513671875, "global_step": 47997, "epoch": 578} {"train_loss": -19.67572593688965, "global_step": 47998, "epoch": 578} {"train_loss": -19.7125301361084, "global_step": 47999, "epoch": 578} {"train_loss": -19.735965728759766, "global_step": 48000, "epoch": 578} {"train_loss": -19.767576217651367, "global_step": 48001, "epoch": 578} {"train_loss": -19.49860191345215, "global_step": 48002, "epoch": 578} {"train_loss": -19.583236694335938, "global_step": 48003, "epoch": 578} {"train_loss": -20.005022048950195, "global_step": 48004, "epoch": 578} {"train_loss": -19.73053550720215, "global_step": 48005, "epoch": 578} {"train_loss": -19.697118759155273, "global_step": 48006, "epoch": 578} {"train_loss": -19.63376808166504, "global_step": 48007, "epoch": 578} {"train_loss": -19.740631103515625, "global_step": 48008, "epoch": 578} {"train_loss": -19.512832641601562, "global_step": 48009, "epoch": 578} {"train_loss": -19.886030197143555, "global_step": 48010, "epoch": 578} {"train_loss": -19.987546920776367, "global_step": 48011, "epoch": 578} {"train_loss": -19.3327693939209, "global_step": 48012, "epoch": 578} {"train_loss": -19.97952651977539, "global_step": 48013, "epoch": 578} {"train_loss": -19.70582389831543, "global_step": 48014, "epoch": 578} {"train_loss": -19.848051071166992, "global_step": 48015, "epoch": 578} {"train_loss": -19.66936683654785, "global_step": 48016, "epoch": 578} {"train_loss": -20.003215789794922, "global_step": 48017, "epoch": 578} {"train_loss": -19.846830368041992, "global_step": 48018, "epoch": 578} {"train_loss": -19.80687713623047, "global_step": 48019, "epoch": 578} {"train_loss": -19.543228149414062, "global_step": 48020, "epoch": 578} {"train_loss": -19.66103744506836, "global_step": 48021, "epoch": 578} {"train_loss": -19.473407745361328, "global_step": 48022, "epoch": 578} {"train_loss": -19.959075927734375, "global_step": 48023, "epoch": 578} {"train_loss": -19.62692642211914, "global_step": 48024, "epoch": 578} {"train_loss": -20.096435546875, "global_step": 48025, "epoch": 578} {"train_loss": -19.710325241088867, "global_step": 48026, "epoch": 578} {"train_loss": -20.090993881225586, "global_step": 48027, "epoch": 578} {"train_loss": -19.91621208190918, "global_step": 48028, "epoch": 578} {"train_loss": -20.070377349853516, "global_step": 48029, "epoch": 578} {"train_loss": -19.73702049255371, "global_step": 48030, "epoch": 578} {"train_loss": -19.68715476989746, "global_step": 48031, "epoch": 578} {"train_loss": -19.634424209594727, "global_step": 48032, "epoch": 578} {"train_loss": -19.862979888916016, "global_step": 48033, "epoch": 578} {"train_loss": -19.73794174194336, "global_step": 48034, "epoch": 578} {"train_loss": -19.862348556518555, "global_step": 48035, "epoch": 578} {"train_loss": -19.859350204467773, "global_step": 48036, "epoch": 578} {"train_loss": -19.48978042602539, "global_step": 48037, "epoch": 578} {"train_loss": -19.622995376586914, "global_step": 48038, "epoch": 578} {"train_loss": -19.718557357788086, "global_step": 48039, "epoch": 578} {"train_loss": -19.83534049987793, "global_step": 48040, "epoch": 578} {"train_loss": -19.820707321166992, "global_step": 48041, "epoch": 578} {"train_loss": -19.86983299255371, "global_step": 48042, "epoch": 578} {"train_loss": -19.618207931518555, "global_step": 48043, "epoch": 578} {"train_loss": -19.89858055114746, "global_step": 48044, "epoch": 578} {"train_loss": -19.909929275512695, "global_step": 48045, "epoch": 578} {"train_loss": -19.68186378479004, "global_step": 48046, "epoch": 578} {"train_loss": -19.794097900390625, "global_step": 48047, "epoch": 578} {"train_loss": -19.64757537841797, "global_step": 48048, "epoch": 578} {"train_loss": -19.645023345947266, "global_step": 48049, "epoch": 578} {"train_loss": -19.762937545776367, "global_step": 48050, "epoch": 578} {"train_loss": -19.894458770751953, "global_step": 48051, "epoch": 578} {"train_loss": -19.89752960205078, "global_step": 48052, "epoch": 578} {"train_loss": -19.790372848510742, "global_step": 48053, "epoch": 578} {"train_loss": -19.706777572631836, "global_step": 48054, "epoch": 578} {"train_loss": -19.696359634399414, "global_step": 48055, "epoch": 578} {"train_loss": -19.795907009078796, "global_step": 48056, "epoch": 578, "val_loss": 6164287.0} {"train_loss": -18.84820556640625, "global_step": 48057, "epoch": 579} {"train_loss": -19.491561889648438, "global_step": 48058, "epoch": 579} {"train_loss": -19.399505615234375, "global_step": 48059, "epoch": 579} {"train_loss": -18.948240280151367, "global_step": 48060, "epoch": 579} {"train_loss": -19.57487678527832, "global_step": 48061, "epoch": 579} {"train_loss": -18.76017951965332, "global_step": 48062, "epoch": 579} {"train_loss": -19.493972778320312, "global_step": 48063, "epoch": 579} {"train_loss": -19.894315719604492, "global_step": 48064, "epoch": 579} {"train_loss": -19.576261520385742, "global_step": 48065, "epoch": 579} {"train_loss": -19.843107223510742, "global_step": 48066, "epoch": 579} {"train_loss": -19.237977981567383, "global_step": 48067, "epoch": 579} {"train_loss": -19.33937644958496, "global_step": 48068, "epoch": 579} {"train_loss": -19.416706085205078, "global_step": 48069, "epoch": 579} {"train_loss": -19.48504066467285, "global_step": 48070, "epoch": 579} {"train_loss": -19.643312454223633, "global_step": 48071, "epoch": 579} {"train_loss": -19.70344352722168, "global_step": 48072, "epoch": 579} {"train_loss": -19.795063018798828, "global_step": 48073, "epoch": 579} {"train_loss": -19.64595603942871, "global_step": 48074, "epoch": 579} {"train_loss": -19.648603439331055, "global_step": 48075, "epoch": 579} {"train_loss": -19.81630516052246, "global_step": 48076, "epoch": 579} {"train_loss": -19.891904830932617, "global_step": 48077, "epoch": 579} {"train_loss": -19.928030014038086, "global_step": 48078, "epoch": 579} {"train_loss": -19.631454467773438, "global_step": 48079, "epoch": 579} {"train_loss": -19.582927703857422, "global_step": 48080, "epoch": 579} {"train_loss": -19.62568473815918, "global_step": 48081, "epoch": 579} {"train_loss": -19.527097702026367, "global_step": 48082, "epoch": 579} {"train_loss": -19.75752830505371, "global_step": 48083, "epoch": 579} {"train_loss": -19.616546630859375, "global_step": 48084, "epoch": 579} {"train_loss": -19.552457809448242, "global_step": 48085, "epoch": 579} {"train_loss": -19.61830711364746, "global_step": 48086, "epoch": 579} {"train_loss": -19.70536231994629, "global_step": 48087, "epoch": 579} {"train_loss": -19.56829833984375, "global_step": 48088, "epoch": 579} {"train_loss": -19.776405334472656, "global_step": 48089, "epoch": 579} {"train_loss": -19.915958404541016, "global_step": 48090, "epoch": 579} {"train_loss": -19.657901763916016, "global_step": 48091, "epoch": 579} {"train_loss": -20.07023048400879, "global_step": 48092, "epoch": 579} {"train_loss": -19.561208724975586, "global_step": 48093, "epoch": 579} {"train_loss": -19.790912628173828, "global_step": 48094, "epoch": 579} {"train_loss": -19.874799728393555, "global_step": 48095, "epoch": 579} {"train_loss": -19.4276180267334, "global_step": 48096, "epoch": 579} {"train_loss": -19.713973999023438, "global_step": 48097, "epoch": 579} {"train_loss": -19.891834259033203, "global_step": 48098, "epoch": 579} {"train_loss": -19.714645385742188, "global_step": 48099, "epoch": 579} {"train_loss": -19.83112907409668, "global_step": 48100, "epoch": 579} {"train_loss": -19.699731826782227, "global_step": 48101, "epoch": 579} {"train_loss": -19.81560707092285, "global_step": 48102, "epoch": 579} {"train_loss": -19.781530380249023, "global_step": 48103, "epoch": 579} {"train_loss": -19.88201904296875, "global_step": 48104, "epoch": 579} {"train_loss": -19.99236488342285, "global_step": 48105, "epoch": 579} {"train_loss": -19.8536319732666, "global_step": 48106, "epoch": 579} {"train_loss": -20.156038284301758, "global_step": 48107, "epoch": 579} {"train_loss": -19.858665466308594, "global_step": 48108, "epoch": 579} {"train_loss": -19.70029067993164, "global_step": 48109, "epoch": 579} {"train_loss": -19.694156646728516, "global_step": 48110, "epoch": 579} {"train_loss": -19.720605850219727, "global_step": 48111, "epoch": 579} {"train_loss": -19.710533142089844, "global_step": 48112, "epoch": 579} {"train_loss": -19.993722915649414, "global_step": 48113, "epoch": 579} {"train_loss": -19.686758041381836, "global_step": 48114, "epoch": 579} {"train_loss": -19.80122947692871, "global_step": 48115, "epoch": 579} {"train_loss": -19.84689712524414, "global_step": 48116, "epoch": 579} {"train_loss": -19.598636627197266, "global_step": 48117, "epoch": 579} {"train_loss": -20.074857711791992, "global_step": 48118, "epoch": 579} {"train_loss": -20.0909481048584, "global_step": 48119, "epoch": 579} {"train_loss": -20.319746017456055, "global_step": 48120, "epoch": 579} {"train_loss": -19.967992782592773, "global_step": 48121, "epoch": 579} {"train_loss": -20.037832260131836, "global_step": 48122, "epoch": 579} {"train_loss": -19.59063148498535, "global_step": 48123, "epoch": 579} {"train_loss": -19.877517700195312, "global_step": 48124, "epoch": 579} {"train_loss": -20.062021255493164, "global_step": 48125, "epoch": 579} {"train_loss": -20.016164779663086, "global_step": 48126, "epoch": 579} {"train_loss": -20.262800216674805, "global_step": 48127, "epoch": 579} {"train_loss": -19.970293045043945, "global_step": 48128, "epoch": 579} {"train_loss": -19.56842613220215, "global_step": 48129, "epoch": 579} {"train_loss": -19.545686721801758, "global_step": 48130, "epoch": 579} {"train_loss": -19.778562545776367, "global_step": 48131, "epoch": 579} {"train_loss": -19.96257209777832, "global_step": 48132, "epoch": 579} {"train_loss": -19.784181594848633, "global_step": 48133, "epoch": 579} {"train_loss": -20.036300659179688, "global_step": 48134, "epoch": 579} {"train_loss": -19.933393478393555, "global_step": 48135, "epoch": 579} {"train_loss": -19.79251480102539, "global_step": 48136, "epoch": 579} {"train_loss": -20.071918487548828, "global_step": 48137, "epoch": 579} {"train_loss": -19.73480796813965, "global_step": 48138, "epoch": 579} {"train_loss": -19.728260407964868, "global_step": 48139, "epoch": 579, "val_loss": 5902180.0} {"train_loss": -20.17321014404297, "global_step": 48140, "epoch": 580} {"train_loss": -19.52198600769043, "global_step": 48141, "epoch": 580} {"train_loss": -19.889432907104492, "global_step": 48142, "epoch": 580} {"train_loss": -19.380659103393555, "global_step": 48143, "epoch": 580} {"train_loss": -19.75335121154785, "global_step": 48144, "epoch": 580} {"train_loss": -19.697622299194336, "global_step": 48145, "epoch": 580} {"train_loss": -19.759811401367188, "global_step": 48146, "epoch": 580} {"train_loss": -19.743810653686523, "global_step": 48147, "epoch": 580} {"train_loss": -19.745439529418945, "global_step": 48148, "epoch": 580} {"train_loss": -19.90813636779785, "global_step": 48149, "epoch": 580} {"train_loss": -19.92890167236328, "global_step": 48150, "epoch": 580} {"train_loss": -19.691120147705078, "global_step": 48151, "epoch": 580} {"train_loss": -19.5610408782959, "global_step": 48152, "epoch": 580} {"train_loss": -19.73465919494629, "global_step": 48153, "epoch": 580} {"train_loss": -19.951303482055664, "global_step": 48154, "epoch": 580} {"train_loss": -19.781967163085938, "global_step": 48155, "epoch": 580} {"train_loss": -20.130952835083008, "global_step": 48156, "epoch": 580} {"train_loss": -19.502286911010742, "global_step": 48157, "epoch": 580} {"train_loss": -19.927305221557617, "global_step": 48158, "epoch": 580} {"train_loss": -19.94891357421875, "global_step": 48159, "epoch": 580} {"train_loss": -19.379758834838867, "global_step": 48160, "epoch": 580} {"train_loss": -20.093496322631836, "global_step": 48161, "epoch": 580} {"train_loss": -19.74944496154785, "global_step": 48162, "epoch": 580} {"train_loss": -19.528705596923828, "global_step": 48163, "epoch": 580} {"train_loss": -20.1704044342041, "global_step": 48164, "epoch": 580} {"train_loss": -19.78145980834961, "global_step": 48165, "epoch": 580} {"train_loss": -19.80706214904785, "global_step": 48166, "epoch": 580} {"train_loss": -19.846500396728516, "global_step": 48167, "epoch": 580} {"train_loss": -19.90652847290039, "global_step": 48168, "epoch": 580} {"train_loss": -19.80105972290039, "global_step": 48169, "epoch": 580} {"train_loss": -20.260862350463867, "global_step": 48170, "epoch": 580} {"train_loss": -19.686885833740234, "global_step": 48171, "epoch": 580} {"train_loss": -19.587350845336914, "global_step": 48172, "epoch": 580} {"train_loss": -20.529022216796875, "global_step": 48173, "epoch": 580} {"train_loss": -20.053287506103516, "global_step": 48174, "epoch": 580} {"train_loss": -20.17014503479004, "global_step": 48175, "epoch": 580} {"train_loss": -19.722198486328125, "global_step": 48176, "epoch": 580} {"train_loss": -19.774560928344727, "global_step": 48177, "epoch": 580} {"train_loss": -19.871896743774414, "global_step": 48178, "epoch": 580} {"train_loss": -19.8963623046875, "global_step": 48179, "epoch": 580} {"train_loss": -19.973331451416016, "global_step": 48180, "epoch": 580} {"train_loss": -19.817190170288086, "global_step": 48181, "epoch": 580} {"train_loss": -19.841758728027344, "global_step": 48182, "epoch": 580} {"train_loss": -19.750795364379883, "global_step": 48183, "epoch": 580} {"train_loss": -19.81793975830078, "global_step": 48184, "epoch": 580} {"train_loss": -19.63312339782715, "global_step": 48185, "epoch": 580} {"train_loss": -19.75831413269043, "global_step": 48186, "epoch": 580} {"train_loss": -19.740406036376953, "global_step": 48187, "epoch": 580} {"train_loss": -19.769336700439453, "global_step": 48188, "epoch": 580} {"train_loss": -19.826284408569336, "global_step": 48189, "epoch": 580} {"train_loss": -20.164081573486328, "global_step": 48190, "epoch": 580} {"train_loss": -19.837141036987305, "global_step": 48191, "epoch": 580} {"train_loss": -19.668447494506836, "global_step": 48192, "epoch": 580} {"train_loss": -19.861793518066406, "global_step": 48193, "epoch": 580} {"train_loss": -19.606578826904297, "global_step": 48194, "epoch": 580} {"train_loss": -20.020132064819336, "global_step": 48195, "epoch": 580} {"train_loss": -19.823501586914062, "global_step": 48196, "epoch": 580} {"train_loss": -20.084707260131836, "global_step": 48197, "epoch": 580} {"train_loss": -19.886934280395508, "global_step": 48198, "epoch": 580} {"train_loss": -19.70186424255371, "global_step": 48199, "epoch": 580} {"train_loss": -19.768884658813477, "global_step": 48200, "epoch": 580} {"train_loss": -19.973716735839844, "global_step": 48201, "epoch": 580} {"train_loss": -19.6187801361084, "global_step": 48202, "epoch": 580} {"train_loss": -19.840045928955078, "global_step": 48203, "epoch": 580} {"train_loss": -19.672298431396484, "global_step": 48204, "epoch": 580} {"train_loss": -19.738759994506836, "global_step": 48205, "epoch": 580} {"train_loss": -19.626638412475586, "global_step": 48206, "epoch": 580} {"train_loss": -20.023883819580078, "global_step": 48207, "epoch": 580} {"train_loss": -20.3122615814209, "global_step": 48208, "epoch": 580} {"train_loss": -19.67708396911621, "global_step": 48209, "epoch": 580} {"train_loss": -19.947200775146484, "global_step": 48210, "epoch": 580} {"train_loss": -19.775012969970703, "global_step": 48211, "epoch": 580} {"train_loss": -20.19801139831543, "global_step": 48212, "epoch": 580} {"train_loss": -20.18604850769043, "global_step": 48213, "epoch": 580} {"train_loss": -19.711353302001953, "global_step": 48214, "epoch": 580} {"train_loss": -19.496610641479492, "global_step": 48215, "epoch": 580} {"train_loss": -19.96919822692871, "global_step": 48216, "epoch": 580} {"train_loss": -19.965017318725586, "global_step": 48217, "epoch": 580} {"train_loss": -20.051977157592773, "global_step": 48218, "epoch": 580} {"train_loss": -19.734195709228516, "global_step": 48219, "epoch": 580} {"train_loss": -19.89781379699707, "global_step": 48220, "epoch": 580} {"train_loss": -19.883588790893555, "global_step": 48221, "epoch": 580} {"train_loss": -19.832823879747504, "global_step": 48222, "epoch": 580, "val_loss": 6003744.0} {"train_loss": -19.46101951599121, "global_step": 48223, "epoch": 581} {"train_loss": -19.645828247070312, "global_step": 48224, "epoch": 581} {"train_loss": -19.653135299682617, "global_step": 48225, "epoch": 581} {"train_loss": -19.2894229888916, "global_step": 48226, "epoch": 581} {"train_loss": -19.440719604492188, "global_step": 48227, "epoch": 581} {"train_loss": -19.89748764038086, "global_step": 48228, "epoch": 581} {"train_loss": -19.67898941040039, "global_step": 48229, "epoch": 581} {"train_loss": -19.84242820739746, "global_step": 48230, "epoch": 581} {"train_loss": -19.76636505126953, "global_step": 48231, "epoch": 581} {"train_loss": -19.791166305541992, "global_step": 48232, "epoch": 581} {"train_loss": -19.61082649230957, "global_step": 48233, "epoch": 581} {"train_loss": -19.642576217651367, "global_step": 48234, "epoch": 581} {"train_loss": -19.548124313354492, "global_step": 48235, "epoch": 581} {"train_loss": -19.80638313293457, "global_step": 48236, "epoch": 581} {"train_loss": -19.745107650756836, "global_step": 48237, "epoch": 581} {"train_loss": -19.471555709838867, "global_step": 48238, "epoch": 581} {"train_loss": -20.007421493530273, "global_step": 48239, "epoch": 581} {"train_loss": -19.997892379760742, "global_step": 48240, "epoch": 581} {"train_loss": -19.888320922851562, "global_step": 48241, "epoch": 581} {"train_loss": -20.116411209106445, "global_step": 48242, "epoch": 581} {"train_loss": -20.21637535095215, "global_step": 48243, "epoch": 581} {"train_loss": -19.740468978881836, "global_step": 48244, "epoch": 581} {"train_loss": -20.01828384399414, "global_step": 48245, "epoch": 581} {"train_loss": -19.744932174682617, "global_step": 48246, "epoch": 581} {"train_loss": -19.918292999267578, "global_step": 48247, "epoch": 581} {"train_loss": -19.6718807220459, "global_step": 48248, "epoch": 581} {"train_loss": -19.605976104736328, "global_step": 48249, "epoch": 581} {"train_loss": -19.743478775024414, "global_step": 48250, "epoch": 581} {"train_loss": -19.826841354370117, "global_step": 48251, "epoch": 581} {"train_loss": -19.955747604370117, "global_step": 48252, "epoch": 581} {"train_loss": -20.04918670654297, "global_step": 48253, "epoch": 581} {"train_loss": -19.68178367614746, "global_step": 48254, "epoch": 581} {"train_loss": -19.72005271911621, "global_step": 48255, "epoch": 581} {"train_loss": -19.779626846313477, "global_step": 48256, "epoch": 581} {"train_loss": -19.8905086517334, "global_step": 48257, "epoch": 581} {"train_loss": -19.789770126342773, "global_step": 48258, "epoch": 581} {"train_loss": -19.717185974121094, "global_step": 48259, "epoch": 581} {"train_loss": -19.687841415405273, "global_step": 48260, "epoch": 581} {"train_loss": -20.29683494567871, "global_step": 48261, "epoch": 581} {"train_loss": -20.00221824645996, "global_step": 48262, "epoch": 581} {"train_loss": -20.108224868774414, "global_step": 48263, "epoch": 581} {"train_loss": -20.13791847229004, "global_step": 48264, "epoch": 581} {"train_loss": -19.919782638549805, "global_step": 48265, "epoch": 581} {"train_loss": -20.099414825439453, "global_step": 48266, "epoch": 581} {"train_loss": -20.35951805114746, "global_step": 48267, "epoch": 581} {"train_loss": -19.863292694091797, "global_step": 48268, "epoch": 581} {"train_loss": -20.375890731811523, "global_step": 48269, "epoch": 581} {"train_loss": -20.212406158447266, "global_step": 48270, "epoch": 581} {"train_loss": -19.556398391723633, "global_step": 48271, "epoch": 581} {"train_loss": -20.03236961364746, "global_step": 48272, "epoch": 581} {"train_loss": -19.570880889892578, "global_step": 48273, "epoch": 581} {"train_loss": -19.9495906829834, "global_step": 48274, "epoch": 581} {"train_loss": -19.71394920349121, "global_step": 48275, "epoch": 581} {"train_loss": -19.941349029541016, "global_step": 48276, "epoch": 581} {"train_loss": -19.77879524230957, "global_step": 48277, "epoch": 581} {"train_loss": -19.897275924682617, "global_step": 48278, "epoch": 581} {"train_loss": -19.685487747192383, "global_step": 48279, "epoch": 581} {"train_loss": -19.86343765258789, "global_step": 48280, "epoch": 581} {"train_loss": -19.64852523803711, "global_step": 48281, "epoch": 581} {"train_loss": -19.39240837097168, "global_step": 48282, "epoch": 581} {"train_loss": -19.73771095275879, "global_step": 48283, "epoch": 581} {"train_loss": -19.65862464904785, "global_step": 48284, "epoch": 581} {"train_loss": -20.135669708251953, "global_step": 48285, "epoch": 581} {"train_loss": -19.86494255065918, "global_step": 48286, "epoch": 581} {"train_loss": -19.889631271362305, "global_step": 48287, "epoch": 581} {"train_loss": -19.78519058227539, "global_step": 48288, "epoch": 581} {"train_loss": -19.701101303100586, "global_step": 48289, "epoch": 581} {"train_loss": -20.014249801635742, "global_step": 48290, "epoch": 581} {"train_loss": -19.7531681060791, "global_step": 48291, "epoch": 581} {"train_loss": -19.518917083740234, "global_step": 48292, "epoch": 581} {"train_loss": -19.788959503173828, "global_step": 48293, "epoch": 581} {"train_loss": -19.730953216552734, "global_step": 48294, "epoch": 581} {"train_loss": -19.89980125427246, "global_step": 48295, "epoch": 581} {"train_loss": -20.184362411499023, "global_step": 48296, "epoch": 581} {"train_loss": -19.72574806213379, "global_step": 48297, "epoch": 581} {"train_loss": -20.01759147644043, "global_step": 48298, "epoch": 581} {"train_loss": -20.18999481201172, "global_step": 48299, "epoch": 581} {"train_loss": -20.021713256835938, "global_step": 48300, "epoch": 581} {"train_loss": -20.222944259643555, "global_step": 48301, "epoch": 581} {"train_loss": -19.844079971313477, "global_step": 48302, "epoch": 581} {"train_loss": -19.766845703125, "global_step": 48303, "epoch": 581} {"train_loss": -19.925968170166016, "global_step": 48304, "epoch": 581} {"train_loss": -19.847733945731658, "global_step": 48305, "epoch": 581, "val_loss": 6030072.0} {"train_loss": -19.611539840698242, "global_step": 48306, "epoch": 582} {"train_loss": -19.792369842529297, "global_step": 48307, "epoch": 582} {"train_loss": -19.847421646118164, "global_step": 48308, "epoch": 582} {"train_loss": -19.033592224121094, "global_step": 48309, "epoch": 582} {"train_loss": -19.692052841186523, "global_step": 48310, "epoch": 582} {"train_loss": -19.37566566467285, "global_step": 48311, "epoch": 582} {"train_loss": -19.431974411010742, "global_step": 48312, "epoch": 582} {"train_loss": -19.995115280151367, "global_step": 48313, "epoch": 582} {"train_loss": -19.57501983642578, "global_step": 48314, "epoch": 582} {"train_loss": -19.889408111572266, "global_step": 48315, "epoch": 582} {"train_loss": -19.763412475585938, "global_step": 48316, "epoch": 582} {"train_loss": -19.62247657775879, "global_step": 48317, "epoch": 582} {"train_loss": -19.71687889099121, "global_step": 48318, "epoch": 582} {"train_loss": -19.892385482788086, "global_step": 48319, "epoch": 582} {"train_loss": -19.494993209838867, "global_step": 48320, "epoch": 582} {"train_loss": -19.785337448120117, "global_step": 48321, "epoch": 582} {"train_loss": -19.872148513793945, "global_step": 48322, "epoch": 582} {"train_loss": -19.532846450805664, "global_step": 48323, "epoch": 582} {"train_loss": -19.751834869384766, "global_step": 48324, "epoch": 582} {"train_loss": -19.81186866760254, "global_step": 48325, "epoch": 582} {"train_loss": -19.71177101135254, "global_step": 48326, "epoch": 582} {"train_loss": -19.789941787719727, "global_step": 48327, "epoch": 582} {"train_loss": -20.144447326660156, "global_step": 48328, "epoch": 582} {"train_loss": -20.009599685668945, "global_step": 48329, "epoch": 582} {"train_loss": -20.145357131958008, "global_step": 48330, "epoch": 582} {"train_loss": -20.072214126586914, "global_step": 48331, "epoch": 582} {"train_loss": -19.489408493041992, "global_step": 48332, "epoch": 582} {"train_loss": -19.922565460205078, "global_step": 48333, "epoch": 582} {"train_loss": -19.806852340698242, "global_step": 48334, "epoch": 582} {"train_loss": -20.330570220947266, "global_step": 48335, "epoch": 582} {"train_loss": -19.867979049682617, "global_step": 48336, "epoch": 582} {"train_loss": -19.803903579711914, "global_step": 48337, "epoch": 582} {"train_loss": -19.97783660888672, "global_step": 48338, "epoch": 582} {"train_loss": -19.90950584411621, "global_step": 48339, "epoch": 582} {"train_loss": -19.6905460357666, "global_step": 48340, "epoch": 582} {"train_loss": -20.22808265686035, "global_step": 48341, "epoch": 582} {"train_loss": -19.2346248626709, "global_step": 48342, "epoch": 582} {"train_loss": -20.030668258666992, "global_step": 48343, "epoch": 582} {"train_loss": -20.100858688354492, "global_step": 48344, "epoch": 582} {"train_loss": -19.71864128112793, "global_step": 48345, "epoch": 582} {"train_loss": -20.11811637878418, "global_step": 48346, "epoch": 582} {"train_loss": -20.118627548217773, "global_step": 48347, "epoch": 582} {"train_loss": -19.814634323120117, "global_step": 48348, "epoch": 582} {"train_loss": -19.850805282592773, "global_step": 48349, "epoch": 582} {"train_loss": -19.80608558654785, "global_step": 48350, "epoch": 582} {"train_loss": -19.52158546447754, "global_step": 48351, "epoch": 582} {"train_loss": -19.4421443939209, "global_step": 48352, "epoch": 582} {"train_loss": -19.803632736206055, "global_step": 48353, "epoch": 582} {"train_loss": -19.578893661499023, "global_step": 48354, "epoch": 582} {"train_loss": -20.111072540283203, "global_step": 48355, "epoch": 582} {"train_loss": -19.739877700805664, "global_step": 48356, "epoch": 582} {"train_loss": -19.873512268066406, "global_step": 48357, "epoch": 582} {"train_loss": -19.65425682067871, "global_step": 48358, "epoch": 582} {"train_loss": -19.832059860229492, "global_step": 48359, "epoch": 582} {"train_loss": -19.22414207458496, "global_step": 48360, "epoch": 582} {"train_loss": -20.154340744018555, "global_step": 48361, "epoch": 582} {"train_loss": -19.693063735961914, "global_step": 48362, "epoch": 582} {"train_loss": -19.78175926208496, "global_step": 48363, "epoch": 582} {"train_loss": -19.429964065551758, "global_step": 48364, "epoch": 582} {"train_loss": -19.946645736694336, "global_step": 48365, "epoch": 582} {"train_loss": -19.79521942138672, "global_step": 48366, "epoch": 582} {"train_loss": -19.817052841186523, "global_step": 48367, "epoch": 582} {"train_loss": -19.736000061035156, "global_step": 48368, "epoch": 582} {"train_loss": -19.992603302001953, "global_step": 48369, "epoch": 582} {"train_loss": -20.3101863861084, "global_step": 48370, "epoch": 582} {"train_loss": -19.817041397094727, "global_step": 48371, "epoch": 582} {"train_loss": -19.694265365600586, "global_step": 48372, "epoch": 582} {"train_loss": -19.77178382873535, "global_step": 48373, "epoch": 582} {"train_loss": -19.69443702697754, "global_step": 48374, "epoch": 582} {"train_loss": -19.661256790161133, "global_step": 48375, "epoch": 582} {"train_loss": -19.69317054748535, "global_step": 48376, "epoch": 582} {"train_loss": -19.791940689086914, "global_step": 48377, "epoch": 582} {"train_loss": -19.6442928314209, "global_step": 48378, "epoch": 582} {"train_loss": -19.298782348632812, "global_step": 48379, "epoch": 582} {"train_loss": -20.04717254638672, "global_step": 48380, "epoch": 582} {"train_loss": -20.02386474609375, "global_step": 48381, "epoch": 582} {"train_loss": -20.051563262939453, "global_step": 48382, "epoch": 582} {"train_loss": -19.940706253051758, "global_step": 48383, "epoch": 582} {"train_loss": -19.47159767150879, "global_step": 48384, "epoch": 582} {"train_loss": -19.803955078125, "global_step": 48385, "epoch": 582} {"train_loss": -19.29906463623047, "global_step": 48386, "epoch": 582} {"train_loss": -19.959959030151367, "global_step": 48387, "epoch": 582} {"train_loss": -19.799769183239306, "global_step": 48388, "epoch": 582, "val_loss": 6062287.0} {"train_loss": -19.32080841064453, "global_step": 48389, "epoch": 583} {"train_loss": -19.697248458862305, "global_step": 48390, "epoch": 583} {"train_loss": -19.305049896240234, "global_step": 48391, "epoch": 583} {"train_loss": -19.86687660217285, "global_step": 48392, "epoch": 583} {"train_loss": -19.549020767211914, "global_step": 48393, "epoch": 583} {"train_loss": -19.263662338256836, "global_step": 48394, "epoch": 583} {"train_loss": -19.949453353881836, "global_step": 48395, "epoch": 583} {"train_loss": -19.46756935119629, "global_step": 48396, "epoch": 583} {"train_loss": -19.468555450439453, "global_step": 48397, "epoch": 583} {"train_loss": -19.69174575805664, "global_step": 48398, "epoch": 583} {"train_loss": -20.146461486816406, "global_step": 48399, "epoch": 583} {"train_loss": -19.526451110839844, "global_step": 48400, "epoch": 583} {"train_loss": -19.56733512878418, "global_step": 48401, "epoch": 583} {"train_loss": -19.756437301635742, "global_step": 48402, "epoch": 583} {"train_loss": -19.93147850036621, "global_step": 48403, "epoch": 583} {"train_loss": -19.83686065673828, "global_step": 48404, "epoch": 583} {"train_loss": -19.873693466186523, "global_step": 48405, "epoch": 583} {"train_loss": -19.74867820739746, "global_step": 48406, "epoch": 583} {"train_loss": -20.21723747253418, "global_step": 48407, "epoch": 583} {"train_loss": -19.999847412109375, "global_step": 48408, "epoch": 583} {"train_loss": -19.722471237182617, "global_step": 48409, "epoch": 583} {"train_loss": -19.962247848510742, "global_step": 48410, "epoch": 583} {"train_loss": -20.11502456665039, "global_step": 48411, "epoch": 583} {"train_loss": -19.868650436401367, "global_step": 48412, "epoch": 583} {"train_loss": -20.00286293029785, "global_step": 48413, "epoch": 583} {"train_loss": -19.866256713867188, "global_step": 48414, "epoch": 583} {"train_loss": -19.735261917114258, "global_step": 48415, "epoch": 583} {"train_loss": -19.554763793945312, "global_step": 48416, "epoch": 583} {"train_loss": -19.621667861938477, "global_step": 48417, "epoch": 583} {"train_loss": -19.921058654785156, "global_step": 48418, "epoch": 583} {"train_loss": -19.57088279724121, "global_step": 48419, "epoch": 583} {"train_loss": -19.873249053955078, "global_step": 48420, "epoch": 583} {"train_loss": -19.894420623779297, "global_step": 48421, "epoch": 583} {"train_loss": -19.736766815185547, "global_step": 48422, "epoch": 583} {"train_loss": -19.50775718688965, "global_step": 48423, "epoch": 583} {"train_loss": -19.962635040283203, "global_step": 48424, "epoch": 583} {"train_loss": -19.498647689819336, "global_step": 48425, "epoch": 583} {"train_loss": -20.066015243530273, "global_step": 48426, "epoch": 583} {"train_loss": -19.715900421142578, "global_step": 48427, "epoch": 583} {"train_loss": -20.298452377319336, "global_step": 48428, "epoch": 583} {"train_loss": -19.91914176940918, "global_step": 48429, "epoch": 583} {"train_loss": -19.52693748474121, "global_step": 48430, "epoch": 583} {"train_loss": -19.97965431213379, "global_step": 48431, "epoch": 583} {"train_loss": -19.843461990356445, "global_step": 48432, "epoch": 583} {"train_loss": -19.9344425201416, "global_step": 48433, "epoch": 583} {"train_loss": -19.795564651489258, "global_step": 48434, "epoch": 583} {"train_loss": -19.851337432861328, "global_step": 48435, "epoch": 583} {"train_loss": -20.040441513061523, "global_step": 48436, "epoch": 583} {"train_loss": -19.90595054626465, "global_step": 48437, "epoch": 583} {"train_loss": -20.252798080444336, "global_step": 48438, "epoch": 583} {"train_loss": -19.67061996459961, "global_step": 48439, "epoch": 583} {"train_loss": -19.947784423828125, "global_step": 48440, "epoch": 583} {"train_loss": -19.689138412475586, "global_step": 48441, "epoch": 583} {"train_loss": -20.0157527923584, "global_step": 48442, "epoch": 583} {"train_loss": -19.822824478149414, "global_step": 48443, "epoch": 583} {"train_loss": -20.373485565185547, "global_step": 48444, "epoch": 583} {"train_loss": -19.920949935913086, "global_step": 48445, "epoch": 583} {"train_loss": -20.008073806762695, "global_step": 48446, "epoch": 583} {"train_loss": -20.30752944946289, "global_step": 48447, "epoch": 583} {"train_loss": -19.956815719604492, "global_step": 48448, "epoch": 583} {"train_loss": -20.057523727416992, "global_step": 48449, "epoch": 583} {"train_loss": -19.56477165222168, "global_step": 48450, "epoch": 583} {"train_loss": -19.522865295410156, "global_step": 48451, "epoch": 583} {"train_loss": -20.330198287963867, "global_step": 48452, "epoch": 583} {"train_loss": -19.93886375427246, "global_step": 48453, "epoch": 583} {"train_loss": -19.661151885986328, "global_step": 48454, "epoch": 583} {"train_loss": -19.690038681030273, "global_step": 48455, "epoch": 583} {"train_loss": -19.951704025268555, "global_step": 48456, "epoch": 583} {"train_loss": -19.822402954101562, "global_step": 48457, "epoch": 583} {"train_loss": -19.528236389160156, "global_step": 48458, "epoch": 583} {"train_loss": -20.05183219909668, "global_step": 48459, "epoch": 583} {"train_loss": -20.05200958251953, "global_step": 48460, "epoch": 583} {"train_loss": -19.74709129333496, "global_step": 48461, "epoch": 583} {"train_loss": -20.092844009399414, "global_step": 48462, "epoch": 583} {"train_loss": -19.748239517211914, "global_step": 48463, "epoch": 583} {"train_loss": -19.705459594726562, "global_step": 48464, "epoch": 583} {"train_loss": -20.033185958862305, "global_step": 48465, "epoch": 583} {"train_loss": -19.762557983398438, "global_step": 48466, "epoch": 583} {"train_loss": -19.953771591186523, "global_step": 48467, "epoch": 583} {"train_loss": -19.767295837402344, "global_step": 48468, "epoch": 583} {"train_loss": -20.260034561157227, "global_step": 48469, "epoch": 583} {"train_loss": -19.815879821777344, "global_step": 48470, "epoch": 583} {"train_loss": -19.845146133239012, "global_step": 48471, "epoch": 583, "val_loss": 6082735.5} {"train_loss": -19.553909301757812, "global_step": 48472, "epoch": 584} {"train_loss": -19.702756881713867, "global_step": 48473, "epoch": 584} {"train_loss": -19.5396785736084, "global_step": 48474, "epoch": 584} {"train_loss": -19.86399269104004, "global_step": 48475, "epoch": 584} {"train_loss": -19.596813201904297, "global_step": 48476, "epoch": 584} {"train_loss": -19.41788101196289, "global_step": 48477, "epoch": 584} {"train_loss": -19.730642318725586, "global_step": 48478, "epoch": 584} {"train_loss": -19.758333206176758, "global_step": 48479, "epoch": 584} {"train_loss": -19.746313095092773, "global_step": 48480, "epoch": 584} {"train_loss": -19.68381118774414, "global_step": 48481, "epoch": 584} {"train_loss": -19.466903686523438, "global_step": 48482, "epoch": 584} {"train_loss": -19.854360580444336, "global_step": 48483, "epoch": 584} {"train_loss": -19.837270736694336, "global_step": 48484, "epoch": 584} {"train_loss": -19.887226104736328, "global_step": 48485, "epoch": 584} {"train_loss": -20.066198348999023, "global_step": 48486, "epoch": 584} {"train_loss": -19.941516876220703, "global_step": 48487, "epoch": 584} {"train_loss": -19.708097457885742, "global_step": 48488, "epoch": 584} {"train_loss": -19.841909408569336, "global_step": 48489, "epoch": 584} {"train_loss": -20.083478927612305, "global_step": 48490, "epoch": 584} {"train_loss": -20.205801010131836, "global_step": 48491, "epoch": 584} {"train_loss": -20.026472091674805, "global_step": 48492, "epoch": 584} {"train_loss": -19.675485610961914, "global_step": 48493, "epoch": 584} {"train_loss": -20.1304874420166, "global_step": 48494, "epoch": 584} {"train_loss": -20.145994186401367, "global_step": 48495, "epoch": 584} {"train_loss": -19.77021598815918, "global_step": 48496, "epoch": 584} {"train_loss": -20.142240524291992, "global_step": 48497, "epoch": 584} {"train_loss": -19.91153335571289, "global_step": 48498, "epoch": 584} {"train_loss": -20.172649383544922, "global_step": 48499, "epoch": 584} {"train_loss": -20.165494918823242, "global_step": 48500, "epoch": 584} {"train_loss": -20.097745895385742, "global_step": 48501, "epoch": 584} {"train_loss": -19.699726104736328, "global_step": 48502, "epoch": 584} {"train_loss": -19.915565490722656, "global_step": 48503, "epoch": 584} {"train_loss": -19.669050216674805, "global_step": 48504, "epoch": 584} {"train_loss": -19.623701095581055, "global_step": 48505, "epoch": 584} {"train_loss": -19.989978790283203, "global_step": 48506, "epoch": 584} {"train_loss": -19.87091827392578, "global_step": 48507, "epoch": 584} {"train_loss": -19.509469985961914, "global_step": 48508, "epoch": 584} {"train_loss": -19.928024291992188, "global_step": 48509, "epoch": 584} {"train_loss": -19.707046508789062, "global_step": 48510, "epoch": 584} {"train_loss": -19.686798095703125, "global_step": 48511, "epoch": 584} {"train_loss": -19.863367080688477, "global_step": 48512, "epoch": 584} {"train_loss": -19.849153518676758, "global_step": 48513, "epoch": 584} {"train_loss": -19.925283432006836, "global_step": 48514, "epoch": 584} {"train_loss": -20.423234939575195, "global_step": 48515, "epoch": 584} {"train_loss": -19.923797607421875, "global_step": 48516, "epoch": 584} {"train_loss": -19.88933563232422, "global_step": 48517, "epoch": 584} {"train_loss": -19.763349533081055, "global_step": 48518, "epoch": 584} {"train_loss": -20.16114044189453, "global_step": 48519, "epoch": 584} {"train_loss": -19.880496978759766, "global_step": 48520, "epoch": 584} {"train_loss": -19.733673095703125, "global_step": 48521, "epoch": 584} {"train_loss": -19.668989181518555, "global_step": 48522, "epoch": 584} {"train_loss": -19.94302749633789, "global_step": 48523, "epoch": 584} {"train_loss": -19.91920280456543, "global_step": 48524, "epoch": 584} {"train_loss": -19.505203247070312, "global_step": 48525, "epoch": 584} {"train_loss": -19.780160903930664, "global_step": 48526, "epoch": 584} {"train_loss": -19.58648109436035, "global_step": 48527, "epoch": 584} {"train_loss": -19.961898803710938, "global_step": 48528, "epoch": 584} {"train_loss": -19.810274124145508, "global_step": 48529, "epoch": 584} {"train_loss": -20.02821922302246, "global_step": 48530, "epoch": 584} {"train_loss": -19.577808380126953, "global_step": 48531, "epoch": 584} {"train_loss": -19.85134506225586, "global_step": 48532, "epoch": 584} {"train_loss": -19.501304626464844, "global_step": 48533, "epoch": 584} {"train_loss": -20.136804580688477, "global_step": 48534, "epoch": 584} {"train_loss": -19.813955307006836, "global_step": 48535, "epoch": 584} {"train_loss": -19.74018669128418, "global_step": 48536, "epoch": 584} {"train_loss": -19.98896598815918, "global_step": 48537, "epoch": 584} {"train_loss": -19.866561889648438, "global_step": 48538, "epoch": 584} {"train_loss": -19.54323959350586, "global_step": 48539, "epoch": 584} {"train_loss": -19.73994255065918, "global_step": 48540, "epoch": 584} {"train_loss": -19.703027725219727, "global_step": 48541, "epoch": 584} {"train_loss": -19.87625503540039, "global_step": 48542, "epoch": 584} {"train_loss": -19.79313087463379, "global_step": 48543, "epoch": 584} {"train_loss": -19.528364181518555, "global_step": 48544, "epoch": 584} {"train_loss": -19.992603302001953, "global_step": 48545, "epoch": 584} {"train_loss": -19.25589370727539, "global_step": 48546, "epoch": 584} {"train_loss": -20.076812744140625, "global_step": 48547, "epoch": 584} {"train_loss": -19.692726135253906, "global_step": 48548, "epoch": 584} {"train_loss": -20.076589584350586, "global_step": 48549, "epoch": 584} {"train_loss": -19.723949432373047, "global_step": 48550, "epoch": 584} {"train_loss": -19.835832595825195, "global_step": 48551, "epoch": 584} {"train_loss": -19.940876007080078, "global_step": 48552, "epoch": 584} {"train_loss": -19.96312713623047, "global_step": 48553, "epoch": 584} {"train_loss": -19.813304993043463, "global_step": 48554, "epoch": 584, "val_loss": 5873108.0} {"train_loss": -19.61931800842285, "global_step": 48555, "epoch": 585} {"train_loss": -19.728487014770508, "global_step": 48556, "epoch": 585} {"train_loss": -19.573728561401367, "global_step": 48557, "epoch": 585} {"train_loss": -20.034948348999023, "global_step": 48558, "epoch": 585} {"train_loss": -19.732595443725586, "global_step": 48559, "epoch": 585} {"train_loss": -20.192485809326172, "global_step": 48560, "epoch": 585} {"train_loss": -20.04008674621582, "global_step": 48561, "epoch": 585} {"train_loss": -19.773517608642578, "global_step": 48562, "epoch": 585} {"train_loss": -20.058685302734375, "global_step": 48563, "epoch": 585} {"train_loss": -19.7176456451416, "global_step": 48564, "epoch": 585} {"train_loss": -19.807605743408203, "global_step": 48565, "epoch": 585} {"train_loss": -19.746627807617188, "global_step": 48566, "epoch": 585} {"train_loss": -19.454299926757812, "global_step": 48567, "epoch": 585} {"train_loss": -20.09392738342285, "global_step": 48568, "epoch": 585} {"train_loss": -19.835683822631836, "global_step": 48569, "epoch": 585} {"train_loss": -19.768035888671875, "global_step": 48570, "epoch": 585} {"train_loss": -20.088157653808594, "global_step": 48571, "epoch": 585} {"train_loss": -19.72085952758789, "global_step": 48572, "epoch": 585} {"train_loss": -20.06038475036621, "global_step": 48573, "epoch": 585} {"train_loss": -19.960561752319336, "global_step": 48574, "epoch": 585} {"train_loss": -19.82631492614746, "global_step": 48575, "epoch": 585} {"train_loss": -19.760242462158203, "global_step": 48576, "epoch": 585} {"train_loss": -19.747543334960938, "global_step": 48577, "epoch": 585} {"train_loss": -19.731977462768555, "global_step": 48578, "epoch": 585} {"train_loss": -19.894025802612305, "global_step": 48579, "epoch": 585} {"train_loss": -20.20489501953125, "global_step": 48580, "epoch": 585} {"train_loss": -19.822309494018555, "global_step": 48581, "epoch": 585} {"train_loss": -19.756216049194336, "global_step": 48582, "epoch": 585} {"train_loss": -19.500015258789062, "global_step": 48583, "epoch": 585} {"train_loss": -19.848987579345703, "global_step": 48584, "epoch": 585} {"train_loss": -19.598447799682617, "global_step": 48585, "epoch": 585} {"train_loss": -19.50981903076172, "global_step": 48586, "epoch": 585} {"train_loss": -20.218143463134766, "global_step": 48587, "epoch": 585} {"train_loss": -19.769302368164062, "global_step": 48588, "epoch": 585} {"train_loss": -20.34564781188965, "global_step": 48589, "epoch": 585} {"train_loss": -19.865596771240234, "global_step": 48590, "epoch": 585} {"train_loss": -19.997352600097656, "global_step": 48591, "epoch": 585} {"train_loss": -20.11447525024414, "global_step": 48592, "epoch": 585} {"train_loss": -19.955610275268555, "global_step": 48593, "epoch": 585} {"train_loss": -19.95795249938965, "global_step": 48594, "epoch": 585} {"train_loss": -19.647388458251953, "global_step": 48595, "epoch": 585} {"train_loss": -19.326644897460938, "global_step": 48596, "epoch": 585} {"train_loss": -19.54767608642578, "global_step": 48597, "epoch": 585} {"train_loss": -19.91400909423828, "global_step": 48598, "epoch": 585} {"train_loss": -20.277048110961914, "global_step": 48599, "epoch": 585} {"train_loss": -19.700822830200195, "global_step": 48600, "epoch": 585} {"train_loss": -19.657270431518555, "global_step": 48601, "epoch": 585} {"train_loss": -19.65090560913086, "global_step": 48602, "epoch": 585} {"train_loss": -19.655813217163086, "global_step": 48603, "epoch": 585} {"train_loss": -20.026731491088867, "global_step": 48604, "epoch": 585} {"train_loss": -19.966310501098633, "global_step": 48605, "epoch": 585} {"train_loss": -20.040420532226562, "global_step": 48606, "epoch": 585} {"train_loss": -19.553617477416992, "global_step": 48607, "epoch": 585} {"train_loss": -19.914236068725586, "global_step": 48608, "epoch": 585} {"train_loss": -19.92978858947754, "global_step": 48609, "epoch": 585} {"train_loss": -19.7348690032959, "global_step": 48610, "epoch": 585} {"train_loss": -19.692655563354492, "global_step": 48611, "epoch": 585} {"train_loss": -19.542896270751953, "global_step": 48612, "epoch": 585} {"train_loss": -19.7078800201416, "global_step": 48613, "epoch": 585} {"train_loss": -19.67051124572754, "global_step": 48614, "epoch": 585} {"train_loss": -19.246397018432617, "global_step": 48615, "epoch": 585} {"train_loss": -19.791351318359375, "global_step": 48616, "epoch": 585} {"train_loss": -19.498685836791992, "global_step": 48617, "epoch": 585} {"train_loss": -19.502729415893555, "global_step": 48618, "epoch": 585} {"train_loss": -19.605493545532227, "global_step": 48619, "epoch": 585} {"train_loss": -19.604164123535156, "global_step": 48620, "epoch": 585} {"train_loss": -19.435089111328125, "global_step": 48621, "epoch": 585} {"train_loss": -19.92826271057129, "global_step": 48622, "epoch": 585} {"train_loss": -19.706151962280273, "global_step": 48623, "epoch": 585} {"train_loss": -20.184268951416016, "global_step": 48624, "epoch": 585} {"train_loss": -19.871479034423828, "global_step": 48625, "epoch": 585} {"train_loss": -19.866596221923828, "global_step": 48626, "epoch": 585} {"train_loss": -19.851200103759766, "global_step": 48627, "epoch": 585} {"train_loss": -19.98142433166504, "global_step": 48628, "epoch": 585} {"train_loss": -20.11775016784668, "global_step": 48629, "epoch": 585} {"train_loss": -19.88993263244629, "global_step": 48630, "epoch": 585} {"train_loss": -19.663480758666992, "global_step": 48631, "epoch": 585} {"train_loss": -19.8524227142334, "global_step": 48632, "epoch": 585} {"train_loss": -19.758075714111328, "global_step": 48633, "epoch": 585} {"train_loss": -19.787029266357422, "global_step": 48634, "epoch": 585} {"train_loss": -19.79276466369629, "global_step": 48635, "epoch": 585} {"train_loss": -20.397581100463867, "global_step": 48636, "epoch": 585} {"train_loss": -19.815186259258223, "global_step": 48637, "epoch": 585, "val_loss": 6050507.0} {"train_loss": -19.800546646118164, "global_step": 48638, "epoch": 586} {"train_loss": -19.828521728515625, "global_step": 48639, "epoch": 586} {"train_loss": -19.35442543029785, "global_step": 48640, "epoch": 586} {"train_loss": -19.34134292602539, "global_step": 48641, "epoch": 586} {"train_loss": -19.618988037109375, "global_step": 48642, "epoch": 586} {"train_loss": -19.73842430114746, "global_step": 48643, "epoch": 586} {"train_loss": -19.833892822265625, "global_step": 48644, "epoch": 586} {"train_loss": -19.441709518432617, "global_step": 48645, "epoch": 586} {"train_loss": -19.3944091796875, "global_step": 48646, "epoch": 586} {"train_loss": -19.566452026367188, "global_step": 48647, "epoch": 586} {"train_loss": -19.585763931274414, "global_step": 48648, "epoch": 586} {"train_loss": -19.52772331237793, "global_step": 48649, "epoch": 586} {"train_loss": -19.566802978515625, "global_step": 48650, "epoch": 586} {"train_loss": -19.369041442871094, "global_step": 48651, "epoch": 586} {"train_loss": -19.735910415649414, "global_step": 48652, "epoch": 586} {"train_loss": -19.696582794189453, "global_step": 48653, "epoch": 586} {"train_loss": -19.779224395751953, "global_step": 48654, "epoch": 586} {"train_loss": -19.805042266845703, "global_step": 48655, "epoch": 586} {"train_loss": -20.05232810974121, "global_step": 48656, "epoch": 586} {"train_loss": -19.770910263061523, "global_step": 48657, "epoch": 586} {"train_loss": -20.07504653930664, "global_step": 48658, "epoch": 586} {"train_loss": -19.847824096679688, "global_step": 48659, "epoch": 586} {"train_loss": -19.902496337890625, "global_step": 48660, "epoch": 586} {"train_loss": -20.158994674682617, "global_step": 48661, "epoch": 586} {"train_loss": -19.725370407104492, "global_step": 48662, "epoch": 586} {"train_loss": -19.873123168945312, "global_step": 48663, "epoch": 586} {"train_loss": -20.139617919921875, "global_step": 48664, "epoch": 586} {"train_loss": -19.923063278198242, "global_step": 48665, "epoch": 586} {"train_loss": -19.893678665161133, "global_step": 48666, "epoch": 586} {"train_loss": -19.901931762695312, "global_step": 48667, "epoch": 586} {"train_loss": -19.569929122924805, "global_step": 48668, "epoch": 586} {"train_loss": -19.7011661529541, "global_step": 48669, "epoch": 586} {"train_loss": -19.67380142211914, "global_step": 48670, "epoch": 586} {"train_loss": -20.122488021850586, "global_step": 48671, "epoch": 586} {"train_loss": -19.7028751373291, "global_step": 48672, "epoch": 586} {"train_loss": -20.09602165222168, "global_step": 48673, "epoch": 586} {"train_loss": -19.92547035217285, "global_step": 48674, "epoch": 586} {"train_loss": -20.069007873535156, "global_step": 48675, "epoch": 586} {"train_loss": -19.528501510620117, "global_step": 48676, "epoch": 586} {"train_loss": -19.931127548217773, "global_step": 48677, "epoch": 586} {"train_loss": -20.276384353637695, "global_step": 48678, "epoch": 586} {"train_loss": -19.86834716796875, "global_step": 48679, "epoch": 586} {"train_loss": -19.8681640625, "global_step": 48680, "epoch": 586} {"train_loss": -19.897613525390625, "global_step": 48681, "epoch": 586} {"train_loss": -20.047090530395508, "global_step": 48682, "epoch": 586} {"train_loss": -19.81093406677246, "global_step": 48683, "epoch": 586} {"train_loss": -19.951257705688477, "global_step": 48684, "epoch": 586} {"train_loss": -19.843046188354492, "global_step": 48685, "epoch": 586} {"train_loss": -19.61639404296875, "global_step": 48686, "epoch": 586} {"train_loss": -19.778242111206055, "global_step": 48687, "epoch": 586} {"train_loss": -19.71809959411621, "global_step": 48688, "epoch": 586} {"train_loss": -19.82408905029297, "global_step": 48689, "epoch": 586} {"train_loss": -19.76788330078125, "global_step": 48690, "epoch": 586} {"train_loss": -20.01377296447754, "global_step": 48691, "epoch": 586} {"train_loss": -19.947214126586914, "global_step": 48692, "epoch": 586} {"train_loss": -19.795156478881836, "global_step": 48693, "epoch": 586} {"train_loss": -20.05500602722168, "global_step": 48694, "epoch": 586} {"train_loss": -19.805280685424805, "global_step": 48695, "epoch": 586} {"train_loss": -19.80925941467285, "global_step": 48696, "epoch": 586} {"train_loss": -19.856664657592773, "global_step": 48697, "epoch": 586} {"train_loss": -19.722412109375, "global_step": 48698, "epoch": 586} {"train_loss": -19.887907028198242, "global_step": 48699, "epoch": 586} {"train_loss": -19.58331871032715, "global_step": 48700, "epoch": 586} {"train_loss": -20.192968368530273, "global_step": 48701, "epoch": 586} {"train_loss": -19.716894149780273, "global_step": 48702, "epoch": 586} {"train_loss": -19.69014549255371, "global_step": 48703, "epoch": 586} {"train_loss": -19.967023849487305, "global_step": 48704, "epoch": 586} {"train_loss": -19.761682510375977, "global_step": 48705, "epoch": 586} {"train_loss": -19.820621490478516, "global_step": 48706, "epoch": 586} {"train_loss": -20.064899444580078, "global_step": 48707, "epoch": 586} {"train_loss": -20.289783477783203, "global_step": 48708, "epoch": 586} {"train_loss": -19.97153663635254, "global_step": 48709, "epoch": 586} {"train_loss": -20.429441452026367, "global_step": 48710, "epoch": 586} {"train_loss": -19.560508728027344, "global_step": 48711, "epoch": 586} {"train_loss": -19.888317108154297, "global_step": 48712, "epoch": 586} {"train_loss": -20.094518661499023, "global_step": 48713, "epoch": 586} {"train_loss": -19.643381118774414, "global_step": 48714, "epoch": 586} {"train_loss": -19.9090518951416, "global_step": 48715, "epoch": 586} {"train_loss": -19.81416130065918, "global_step": 48716, "epoch": 586} {"train_loss": -19.920310974121094, "global_step": 48717, "epoch": 586} {"train_loss": -20.055295944213867, "global_step": 48718, "epoch": 586} {"train_loss": -19.53427505493164, "global_step": 48719, "epoch": 586} {"train_loss": -19.845656452408758, "global_step": 48720, "epoch": 586, "val_loss": 6042897.0} {"train_loss": -19.68153953552246, "global_step": 48721, "epoch": 587} {"train_loss": -19.433500289916992, "global_step": 48722, "epoch": 587} {"train_loss": -19.85483741760254, "global_step": 48723, "epoch": 587} {"train_loss": -19.1972599029541, "global_step": 48724, "epoch": 587} {"train_loss": -19.482816696166992, "global_step": 48725, "epoch": 587} {"train_loss": -19.78447151184082, "global_step": 48726, "epoch": 587} {"train_loss": -19.765966415405273, "global_step": 48727, "epoch": 587} {"train_loss": -19.5318603515625, "global_step": 48728, "epoch": 587} {"train_loss": -19.785324096679688, "global_step": 48729, "epoch": 587} {"train_loss": -19.852270126342773, "global_step": 48730, "epoch": 587} {"train_loss": -20.184812545776367, "global_step": 48731, "epoch": 587} {"train_loss": -19.914228439331055, "global_step": 48732, "epoch": 587} {"train_loss": -19.975156784057617, "global_step": 48733, "epoch": 587} {"train_loss": -19.784391403198242, "global_step": 48734, "epoch": 587} {"train_loss": -20.286718368530273, "global_step": 48735, "epoch": 587} {"train_loss": -19.85211944580078, "global_step": 48736, "epoch": 587} {"train_loss": -19.944944381713867, "global_step": 48737, "epoch": 587} {"train_loss": -19.752424240112305, "global_step": 48738, "epoch": 587} {"train_loss": -19.968303680419922, "global_step": 48739, "epoch": 587} {"train_loss": -20.023279190063477, "global_step": 48740, "epoch": 587} {"train_loss": -19.715604782104492, "global_step": 48741, "epoch": 587} {"train_loss": -19.668365478515625, "global_step": 48742, "epoch": 587} {"train_loss": -19.616140365600586, "global_step": 48743, "epoch": 587} {"train_loss": -19.987545013427734, "global_step": 48744, "epoch": 587} {"train_loss": -20.091659545898438, "global_step": 48745, "epoch": 587} {"train_loss": -20.0881404876709, "global_step": 48746, "epoch": 587} {"train_loss": -19.96047592163086, "global_step": 48747, "epoch": 587} {"train_loss": -19.70175552368164, "global_step": 48748, "epoch": 587} {"train_loss": -20.049596786499023, "global_step": 48749, "epoch": 587} {"train_loss": -19.76262855529785, "global_step": 48750, "epoch": 587} {"train_loss": -19.722030639648438, "global_step": 48751, "epoch": 587} {"train_loss": -19.900856018066406, "global_step": 48752, "epoch": 587} {"train_loss": -19.506961822509766, "global_step": 48753, "epoch": 587} {"train_loss": -19.861669540405273, "global_step": 48754, "epoch": 587} {"train_loss": -19.87293815612793, "global_step": 48755, "epoch": 587} {"train_loss": -20.234952926635742, "global_step": 48756, "epoch": 587} {"train_loss": -19.951913833618164, "global_step": 48757, "epoch": 587} {"train_loss": -19.900196075439453, "global_step": 48758, "epoch": 587} {"train_loss": -19.783855438232422, "global_step": 48759, "epoch": 587} {"train_loss": -20.015371322631836, "global_step": 48760, "epoch": 587} {"train_loss": -20.031362533569336, "global_step": 48761, "epoch": 587} {"train_loss": -19.8529109954834, "global_step": 48762, "epoch": 587} {"train_loss": -19.825332641601562, "global_step": 48763, "epoch": 587} {"train_loss": -19.784435272216797, "global_step": 48764, "epoch": 587} {"train_loss": -19.21528434753418, "global_step": 48765, "epoch": 587} {"train_loss": -19.961645126342773, "global_step": 48766, "epoch": 587} {"train_loss": -19.94183921813965, "global_step": 48767, "epoch": 587} {"train_loss": -20.122695922851562, "global_step": 48768, "epoch": 587} {"train_loss": -19.959829330444336, "global_step": 48769, "epoch": 587} {"train_loss": -19.817907333374023, "global_step": 48770, "epoch": 587} {"train_loss": -19.84050178527832, "global_step": 48771, "epoch": 587} {"train_loss": -19.868391036987305, "global_step": 48772, "epoch": 587} {"train_loss": -20.075075149536133, "global_step": 48773, "epoch": 587} {"train_loss": -20.261518478393555, "global_step": 48774, "epoch": 587} {"train_loss": -19.997873306274414, "global_step": 48775, "epoch": 587} {"train_loss": -19.80389976501465, "global_step": 48776, "epoch": 587} {"train_loss": -19.739965438842773, "global_step": 48777, "epoch": 587} {"train_loss": -19.569128036499023, "global_step": 48778, "epoch": 587} {"train_loss": -20.076282501220703, "global_step": 48779, "epoch": 587} {"train_loss": -19.523935317993164, "global_step": 48780, "epoch": 587} {"train_loss": -20.077167510986328, "global_step": 48781, "epoch": 587} {"train_loss": -20.05463218688965, "global_step": 48782, "epoch": 587} {"train_loss": -20.00813865661621, "global_step": 48783, "epoch": 587} {"train_loss": -19.933332443237305, "global_step": 48784, "epoch": 587} {"train_loss": -19.776653289794922, "global_step": 48785, "epoch": 587} {"train_loss": -20.00883674621582, "global_step": 48786, "epoch": 587} {"train_loss": -19.36127471923828, "global_step": 48787, "epoch": 587} {"train_loss": -20.182069778442383, "global_step": 48788, "epoch": 587} {"train_loss": -20.101667404174805, "global_step": 48789, "epoch": 587} {"train_loss": -19.875947952270508, "global_step": 48790, "epoch": 587} {"train_loss": -19.809799194335938, "global_step": 48791, "epoch": 587} {"train_loss": -19.44215965270996, "global_step": 48792, "epoch": 587} {"train_loss": -19.770292282104492, "global_step": 48793, "epoch": 587} {"train_loss": -19.96747398376465, "global_step": 48794, "epoch": 587} {"train_loss": -20.10207176208496, "global_step": 48795, "epoch": 587} {"train_loss": -19.844785690307617, "global_step": 48796, "epoch": 587} {"train_loss": -19.79018783569336, "global_step": 48797, "epoch": 587} {"train_loss": -20.221485137939453, "global_step": 48798, "epoch": 587} {"train_loss": -19.869415283203125, "global_step": 48799, "epoch": 587} {"train_loss": -19.71534538269043, "global_step": 48800, "epoch": 587} {"train_loss": -19.71437644958496, "global_step": 48801, "epoch": 587} {"train_loss": -19.633808135986328, "global_step": 48802, "epoch": 587} {"train_loss": -19.835927044052674, "global_step": 48803, "epoch": 587, "val_loss": 6131277.0} {"train_loss": -19.681596755981445, "global_step": 48804, "epoch": 588} {"train_loss": -20.26271629333496, "global_step": 48805, "epoch": 588} {"train_loss": -19.826032638549805, "global_step": 48806, "epoch": 588} {"train_loss": -19.702367782592773, "global_step": 48807, "epoch": 588} {"train_loss": -19.682010650634766, "global_step": 48808, "epoch": 588} {"train_loss": -20.040536880493164, "global_step": 48809, "epoch": 588} {"train_loss": -19.293811798095703, "global_step": 48810, "epoch": 588} {"train_loss": -20.011043548583984, "global_step": 48811, "epoch": 588} {"train_loss": -19.961362838745117, "global_step": 48812, "epoch": 588} {"train_loss": -19.967126846313477, "global_step": 48813, "epoch": 588} {"train_loss": -19.851734161376953, "global_step": 48814, "epoch": 588} {"train_loss": -19.792430877685547, "global_step": 48815, "epoch": 588} {"train_loss": -19.71528434753418, "global_step": 48816, "epoch": 588} {"train_loss": -19.77110481262207, "global_step": 48817, "epoch": 588} {"train_loss": -19.840898513793945, "global_step": 48818, "epoch": 588} {"train_loss": -19.77738380432129, "global_step": 48819, "epoch": 588} {"train_loss": -19.704727172851562, "global_step": 48820, "epoch": 588} {"train_loss": -19.975948333740234, "global_step": 48821, "epoch": 588} {"train_loss": -20.17290496826172, "global_step": 48822, "epoch": 588} {"train_loss": -19.625661849975586, "global_step": 48823, "epoch": 588} {"train_loss": -19.820756912231445, "global_step": 48824, "epoch": 588} {"train_loss": -19.874677658081055, "global_step": 48825, "epoch": 588} {"train_loss": -19.54510498046875, "global_step": 48826, "epoch": 588} {"train_loss": -19.600034713745117, "global_step": 48827, "epoch": 588} {"train_loss": -20.01930046081543, "global_step": 48828, "epoch": 588} {"train_loss": -19.640581130981445, "global_step": 48829, "epoch": 588} {"train_loss": -20.43648338317871, "global_step": 48830, "epoch": 588} {"train_loss": -19.841411590576172, "global_step": 48831, "epoch": 588} {"train_loss": -19.692716598510742, "global_step": 48832, "epoch": 588} {"train_loss": -20.056915283203125, "global_step": 48833, "epoch": 588} {"train_loss": -19.999788284301758, "global_step": 48834, "epoch": 588} {"train_loss": -19.8591365814209, "global_step": 48835, "epoch": 588} {"train_loss": -20.13904571533203, "global_step": 48836, "epoch": 588} {"train_loss": -19.987424850463867, "global_step": 48837, "epoch": 588} {"train_loss": -19.606515884399414, "global_step": 48838, "epoch": 588} {"train_loss": -20.061161041259766, "global_step": 48839, "epoch": 588} {"train_loss": -19.7601318359375, "global_step": 48840, "epoch": 588} {"train_loss": -20.330615997314453, "global_step": 48841, "epoch": 588} {"train_loss": -19.668989181518555, "global_step": 48842, "epoch": 588} {"train_loss": -19.74338150024414, "global_step": 48843, "epoch": 588} {"train_loss": -19.988340377807617, "global_step": 48844, "epoch": 588} {"train_loss": -19.983524322509766, "global_step": 48845, "epoch": 588} {"train_loss": -19.164358139038086, "global_step": 48846, "epoch": 588} {"train_loss": -20.072866439819336, "global_step": 48847, "epoch": 588} {"train_loss": -19.981718063354492, "global_step": 48848, "epoch": 588} {"train_loss": -19.656280517578125, "global_step": 48849, "epoch": 588} {"train_loss": -19.46546173095703, "global_step": 48850, "epoch": 588} {"train_loss": -19.50248908996582, "global_step": 48851, "epoch": 588} {"train_loss": -19.815284729003906, "global_step": 48852, "epoch": 588} {"train_loss": -20.169677734375, "global_step": 48853, "epoch": 588} {"train_loss": -20.09491729736328, "global_step": 48854, "epoch": 588} {"train_loss": -19.846189498901367, "global_step": 48855, "epoch": 588} {"train_loss": -19.67365837097168, "global_step": 48856, "epoch": 588} {"train_loss": -19.925739288330078, "global_step": 48857, "epoch": 588} {"train_loss": -19.401884078979492, "global_step": 48858, "epoch": 588} {"train_loss": -19.920942306518555, "global_step": 48859, "epoch": 588} {"train_loss": -19.719491958618164, "global_step": 48860, "epoch": 588} {"train_loss": -19.85297203063965, "global_step": 48861, "epoch": 588} {"train_loss": -19.996992111206055, "global_step": 48862, "epoch": 588} {"train_loss": -20.131439208984375, "global_step": 48863, "epoch": 588} {"train_loss": -20.236400604248047, "global_step": 48864, "epoch": 588} {"train_loss": -20.15825843811035, "global_step": 48865, "epoch": 588} {"train_loss": -20.02176856994629, "global_step": 48866, "epoch": 588} {"train_loss": -19.972185134887695, "global_step": 48867, "epoch": 588} {"train_loss": -20.104843139648438, "global_step": 48868, "epoch": 588} {"train_loss": -20.048490524291992, "global_step": 48869, "epoch": 588} {"train_loss": -20.149747848510742, "global_step": 48870, "epoch": 588} {"train_loss": -19.905210494995117, "global_step": 48871, "epoch": 588} {"train_loss": -19.74459457397461, "global_step": 48872, "epoch": 588} {"train_loss": -19.977460861206055, "global_step": 48873, "epoch": 588} {"train_loss": -19.717283248901367, "global_step": 48874, "epoch": 588} {"train_loss": -19.757434844970703, "global_step": 48875, "epoch": 588} {"train_loss": -20.068679809570312, "global_step": 48876, "epoch": 588} {"train_loss": -19.770004272460938, "global_step": 48877, "epoch": 588} {"train_loss": -20.026901245117188, "global_step": 48878, "epoch": 588} {"train_loss": -19.685230255126953, "global_step": 48879, "epoch": 588} {"train_loss": -19.761341094970703, "global_step": 48880, "epoch": 588} {"train_loss": -19.924657821655273, "global_step": 48881, "epoch": 588} {"train_loss": -20.113861083984375, "global_step": 48882, "epoch": 588} {"train_loss": -20.485136032104492, "global_step": 48883, "epoch": 588} {"train_loss": -19.864774703979492, "global_step": 48884, "epoch": 588} {"train_loss": -19.9674129486084, "global_step": 48885, "epoch": 588} {"train_loss": -19.882232091513025, "global_step": 48886, "epoch": 588, "val_loss": 6022293.0} {"train_loss": -19.458850860595703, "global_step": 48887, "epoch": 589} {"train_loss": -19.79100799560547, "global_step": 48888, "epoch": 589} {"train_loss": -20.12421989440918, "global_step": 48889, "epoch": 589} {"train_loss": -19.479907989501953, "global_step": 48890, "epoch": 589} {"train_loss": -19.701932907104492, "global_step": 48891, "epoch": 589} {"train_loss": -19.370405197143555, "global_step": 48892, "epoch": 589} {"train_loss": -19.94475746154785, "global_step": 48893, "epoch": 589} {"train_loss": -19.840229034423828, "global_step": 48894, "epoch": 589} {"train_loss": -19.6365966796875, "global_step": 48895, "epoch": 589} {"train_loss": -19.569019317626953, "global_step": 48896, "epoch": 589} {"train_loss": -19.719345092773438, "global_step": 48897, "epoch": 589} {"train_loss": -20.019548416137695, "global_step": 48898, "epoch": 589} {"train_loss": -19.820762634277344, "global_step": 48899, "epoch": 589} {"train_loss": -19.67333984375, "global_step": 48900, "epoch": 589} {"train_loss": -19.673187255859375, "global_step": 48901, "epoch": 589} {"train_loss": -19.930295944213867, "global_step": 48902, "epoch": 589} {"train_loss": -20.006866455078125, "global_step": 48903, "epoch": 589} {"train_loss": -19.855052947998047, "global_step": 48904, "epoch": 589} {"train_loss": -19.821842193603516, "global_step": 48905, "epoch": 589} {"train_loss": -19.73526954650879, "global_step": 48906, "epoch": 589} {"train_loss": -19.58892059326172, "global_step": 48907, "epoch": 589} {"train_loss": -20.112693786621094, "global_step": 48908, "epoch": 589} {"train_loss": -19.70256996154785, "global_step": 48909, "epoch": 589} {"train_loss": -19.946210861206055, "global_step": 48910, "epoch": 589} {"train_loss": -20.061120986938477, "global_step": 48911, "epoch": 589} {"train_loss": -19.772241592407227, "global_step": 48912, "epoch": 589} {"train_loss": -19.412839889526367, "global_step": 48913, "epoch": 589} {"train_loss": -20.07549476623535, "global_step": 48914, "epoch": 589} {"train_loss": -20.22934913635254, "global_step": 48915, "epoch": 589} {"train_loss": -19.800302505493164, "global_step": 48916, "epoch": 589} {"train_loss": -20.079267501831055, "global_step": 48917, "epoch": 589} {"train_loss": -19.965085983276367, "global_step": 48918, "epoch": 589} {"train_loss": -19.6664981842041, "global_step": 48919, "epoch": 589} {"train_loss": -19.889616012573242, "global_step": 48920, "epoch": 589} {"train_loss": -20.091842651367188, "global_step": 48921, "epoch": 589} {"train_loss": -19.697607040405273, "global_step": 48922, "epoch": 589} {"train_loss": -19.7282772064209, "global_step": 48923, "epoch": 589} {"train_loss": -19.9953670501709, "global_step": 48924, "epoch": 589} {"train_loss": -19.897693634033203, "global_step": 48925, "epoch": 589} {"train_loss": -19.491802215576172, "global_step": 48926, "epoch": 589} {"train_loss": -20.01742935180664, "global_step": 48927, "epoch": 589} {"train_loss": -19.957056045532227, "global_step": 48928, "epoch": 589} {"train_loss": -19.780216217041016, "global_step": 48929, "epoch": 589} {"train_loss": -20.12868881225586, "global_step": 48930, "epoch": 589} {"train_loss": -19.660791397094727, "global_step": 48931, "epoch": 589} {"train_loss": -19.51161766052246, "global_step": 48932, "epoch": 589} {"train_loss": -19.792213439941406, "global_step": 48933, "epoch": 589} {"train_loss": -19.838804244995117, "global_step": 48934, "epoch": 589} {"train_loss": -19.786142349243164, "global_step": 48935, "epoch": 589} {"train_loss": -19.8836669921875, "global_step": 48936, "epoch": 589} {"train_loss": -20.154462814331055, "global_step": 48937, "epoch": 589} {"train_loss": -19.51732063293457, "global_step": 48938, "epoch": 589} {"train_loss": -19.82939338684082, "global_step": 48939, "epoch": 589} {"train_loss": -19.903350830078125, "global_step": 48940, "epoch": 589} {"train_loss": -20.01219367980957, "global_step": 48941, "epoch": 589} {"train_loss": -20.017797470092773, "global_step": 48942, "epoch": 589} {"train_loss": -19.77945899963379, "global_step": 48943, "epoch": 589} {"train_loss": -20.181026458740234, "global_step": 48944, "epoch": 589} {"train_loss": -19.758464813232422, "global_step": 48945, "epoch": 589} {"train_loss": -19.7742862701416, "global_step": 48946, "epoch": 589} {"train_loss": -20.062082290649414, "global_step": 48947, "epoch": 589} {"train_loss": -19.998239517211914, "global_step": 48948, "epoch": 589} {"train_loss": -19.9375057220459, "global_step": 48949, "epoch": 589} {"train_loss": -19.9648380279541, "global_step": 48950, "epoch": 589} {"train_loss": -19.964611053466797, "global_step": 48951, "epoch": 589} {"train_loss": -20.15894889831543, "global_step": 48952, "epoch": 589} {"train_loss": -20.10701560974121, "global_step": 48953, "epoch": 589} {"train_loss": -19.607629776000977, "global_step": 48954, "epoch": 589} {"train_loss": -19.94038963317871, "global_step": 48955, "epoch": 589} {"train_loss": -19.918569564819336, "global_step": 48956, "epoch": 589} {"train_loss": -20.124353408813477, "global_step": 48957, "epoch": 589} {"train_loss": -19.767810821533203, "global_step": 48958, "epoch": 589} {"train_loss": -19.281450271606445, "global_step": 48959, "epoch": 589} {"train_loss": -19.83655548095703, "global_step": 48960, "epoch": 589} {"train_loss": -20.11506462097168, "global_step": 48961, "epoch": 589} {"train_loss": -19.716434478759766, "global_step": 48962, "epoch": 589} {"train_loss": -19.9868106842041, "global_step": 48963, "epoch": 589} {"train_loss": -19.844009399414062, "global_step": 48964, "epoch": 589} {"train_loss": -19.87526512145996, "global_step": 48965, "epoch": 589} {"train_loss": -20.17681884765625, "global_step": 48966, "epoch": 589} {"train_loss": -19.81855010986328, "global_step": 48967, "epoch": 589} {"train_loss": -19.766637802124023, "global_step": 48968, "epoch": 589} {"train_loss": -19.85581800162074, "global_step": 48969, "epoch": 589, "val_loss": 6218360.0} {"train_loss": -19.599632263183594, "global_step": 48970, "epoch": 590} {"train_loss": -19.452598571777344, "global_step": 48971, "epoch": 590} {"train_loss": -19.80814552307129, "global_step": 48972, "epoch": 590} {"train_loss": -19.655263900756836, "global_step": 48973, "epoch": 590} {"train_loss": -19.70929527282715, "global_step": 48974, "epoch": 590} {"train_loss": -19.62668228149414, "global_step": 48975, "epoch": 590} {"train_loss": -19.4527645111084, "global_step": 48976, "epoch": 590} {"train_loss": -19.668582916259766, "global_step": 48977, "epoch": 590} {"train_loss": -19.7869930267334, "global_step": 48978, "epoch": 590} {"train_loss": -19.605268478393555, "global_step": 48979, "epoch": 590} {"train_loss": -19.8250675201416, "global_step": 48980, "epoch": 590} {"train_loss": -19.87647819519043, "global_step": 48981, "epoch": 590} {"train_loss": -19.501012802124023, "global_step": 48982, "epoch": 590} {"train_loss": -19.656177520751953, "global_step": 48983, "epoch": 590} {"train_loss": -19.79994010925293, "global_step": 48984, "epoch": 590} {"train_loss": -20.10919761657715, "global_step": 48985, "epoch": 590} {"train_loss": -19.840957641601562, "global_step": 48986, "epoch": 590} {"train_loss": -19.832677841186523, "global_step": 48987, "epoch": 590} {"train_loss": -20.034006118774414, "global_step": 48988, "epoch": 590} {"train_loss": -19.920799255371094, "global_step": 48989, "epoch": 590} {"train_loss": -19.74403190612793, "global_step": 48990, "epoch": 590} {"train_loss": -19.985301971435547, "global_step": 48991, "epoch": 590} {"train_loss": -19.809345245361328, "global_step": 48992, "epoch": 590} {"train_loss": -19.414581298828125, "global_step": 48993, "epoch": 590} {"train_loss": -20.1084041595459, "global_step": 48994, "epoch": 590} {"train_loss": -19.752225875854492, "global_step": 48995, "epoch": 590} {"train_loss": -19.211532592773438, "global_step": 48996, "epoch": 590} {"train_loss": -19.646764755249023, "global_step": 48997, "epoch": 590} {"train_loss": -19.97446060180664, "global_step": 48998, "epoch": 590} {"train_loss": -19.811355590820312, "global_step": 48999, "epoch": 590} {"train_loss": -20.032394409179688, "global_step": 49000, "epoch": 590} {"train_loss": -20.25885009765625, "global_step": 49001, "epoch": 590} {"train_loss": -19.796945571899414, "global_step": 49002, "epoch": 590} {"train_loss": -19.65157127380371, "global_step": 49003, "epoch": 590} {"train_loss": -20.21379280090332, "global_step": 49004, "epoch": 590} {"train_loss": -20.05796241760254, "global_step": 49005, "epoch": 590} {"train_loss": -19.709346771240234, "global_step": 49006, "epoch": 590} {"train_loss": -20.034717559814453, "global_step": 49007, "epoch": 590} {"train_loss": -20.000030517578125, "global_step": 49008, "epoch": 590} {"train_loss": -20.212295532226562, "global_step": 49009, "epoch": 590} {"train_loss": -19.795316696166992, "global_step": 49010, "epoch": 590} {"train_loss": -19.714445114135742, "global_step": 49011, "epoch": 590} {"train_loss": -19.745004653930664, "global_step": 49012, "epoch": 590} {"train_loss": -19.806232452392578, "global_step": 49013, "epoch": 590} {"train_loss": -20.07112693786621, "global_step": 49014, "epoch": 590} {"train_loss": -19.821063995361328, "global_step": 49015, "epoch": 590} {"train_loss": -19.87226676940918, "global_step": 49016, "epoch": 590} {"train_loss": -19.616281509399414, "global_step": 49017, "epoch": 590} {"train_loss": -19.7944393157959, "global_step": 49018, "epoch": 590} {"train_loss": -19.767282485961914, "global_step": 49019, "epoch": 590} {"train_loss": -19.847217559814453, "global_step": 49020, "epoch": 590} {"train_loss": -20.2084903717041, "global_step": 49021, "epoch": 590} {"train_loss": -19.877643585205078, "global_step": 49022, "epoch": 590} {"train_loss": -19.786123275756836, "global_step": 49023, "epoch": 590} {"train_loss": -19.922142028808594, "global_step": 49024, "epoch": 590} {"train_loss": -20.051883697509766, "global_step": 49025, "epoch": 590} {"train_loss": -20.18458366394043, "global_step": 49026, "epoch": 590} {"train_loss": -19.55772590637207, "global_step": 49027, "epoch": 590} {"train_loss": -19.68375015258789, "global_step": 49028, "epoch": 590} {"train_loss": -20.06890296936035, "global_step": 49029, "epoch": 590} {"train_loss": -20.217979431152344, "global_step": 49030, "epoch": 590} {"train_loss": -19.69398307800293, "global_step": 49031, "epoch": 590} {"train_loss": -20.23853874206543, "global_step": 49032, "epoch": 590} {"train_loss": -19.87535285949707, "global_step": 49033, "epoch": 590} {"train_loss": -19.886144638061523, "global_step": 49034, "epoch": 590} {"train_loss": -20.108449935913086, "global_step": 49035, "epoch": 590} {"train_loss": -20.33241844177246, "global_step": 49036, "epoch": 590} {"train_loss": -19.790470123291016, "global_step": 49037, "epoch": 590} {"train_loss": -19.947187423706055, "global_step": 49038, "epoch": 590} {"train_loss": -19.860305786132812, "global_step": 49039, "epoch": 590} {"train_loss": -19.759780883789062, "global_step": 49040, "epoch": 590} {"train_loss": -19.79353904724121, "global_step": 49041, "epoch": 590} {"train_loss": -19.996129989624023, "global_step": 49042, "epoch": 590} {"train_loss": -19.809494018554688, "global_step": 49043, "epoch": 590} {"train_loss": -19.765594482421875, "global_step": 49044, "epoch": 590} {"train_loss": -19.735977172851562, "global_step": 49045, "epoch": 590} {"train_loss": -20.040512084960938, "global_step": 49046, "epoch": 590} {"train_loss": -20.032787322998047, "global_step": 49047, "epoch": 590} {"train_loss": -19.82465934753418, "global_step": 49048, "epoch": 590} {"train_loss": -20.01851463317871, "global_step": 49049, "epoch": 590} {"train_loss": -19.806413650512695, "global_step": 49050, "epoch": 590} {"train_loss": -19.786794662475586, "global_step": 49051, "epoch": 590} {"train_loss": -19.850595887885035, "global_step": 49052, "epoch": 590, "val_loss": 6022664.0} {"train_loss": -20.009838104248047, "global_step": 49053, "epoch": 591} {"train_loss": -19.738800048828125, "global_step": 49054, "epoch": 591} {"train_loss": -19.809242248535156, "global_step": 49055, "epoch": 591} {"train_loss": -19.851621627807617, "global_step": 49056, "epoch": 591} {"train_loss": -19.8070068359375, "global_step": 49057, "epoch": 591} {"train_loss": -19.690893173217773, "global_step": 49058, "epoch": 591} {"train_loss": -19.681716918945312, "global_step": 49059, "epoch": 591} {"train_loss": -19.466947555541992, "global_step": 49060, "epoch": 591} {"train_loss": -19.696170806884766, "global_step": 49061, "epoch": 591} {"train_loss": -19.772994995117188, "global_step": 49062, "epoch": 591} {"train_loss": -19.9613037109375, "global_step": 49063, "epoch": 591} {"train_loss": -20.144357681274414, "global_step": 49064, "epoch": 591} {"train_loss": -20.08301544189453, "global_step": 49065, "epoch": 591} {"train_loss": -20.114791870117188, "global_step": 49066, "epoch": 591} {"train_loss": -19.645158767700195, "global_step": 49067, "epoch": 591} {"train_loss": -19.69520378112793, "global_step": 49068, "epoch": 591} {"train_loss": -19.63734245300293, "global_step": 49069, "epoch": 591} {"train_loss": -19.891000747680664, "global_step": 49070, "epoch": 591} {"train_loss": -19.775876998901367, "global_step": 49071, "epoch": 591} {"train_loss": -19.68501853942871, "global_step": 49072, "epoch": 591} {"train_loss": -19.917089462280273, "global_step": 49073, "epoch": 591} {"train_loss": -19.835189819335938, "global_step": 49074, "epoch": 591} {"train_loss": -19.75681495666504, "global_step": 49075, "epoch": 591} {"train_loss": -20.253582000732422, "global_step": 49076, "epoch": 591} {"train_loss": -19.61480140686035, "global_step": 49077, "epoch": 591} {"train_loss": -19.606542587280273, "global_step": 49078, "epoch": 591} {"train_loss": -20.086467742919922, "global_step": 49079, "epoch": 591} {"train_loss": -19.638290405273438, "global_step": 49080, "epoch": 591} {"train_loss": -19.577383041381836, "global_step": 49081, "epoch": 591} {"train_loss": -20.096891403198242, "global_step": 49082, "epoch": 591} {"train_loss": -19.949058532714844, "global_step": 49083, "epoch": 591} {"train_loss": -20.155912399291992, "global_step": 49084, "epoch": 591} {"train_loss": -19.803770065307617, "global_step": 49085, "epoch": 591} {"train_loss": -19.388856887817383, "global_step": 49086, "epoch": 591} {"train_loss": -20.236120223999023, "global_step": 49087, "epoch": 591} {"train_loss": -19.640029907226562, "global_step": 49088, "epoch": 591} {"train_loss": -19.8681583404541, "global_step": 49089, "epoch": 591} {"train_loss": -20.070621490478516, "global_step": 49090, "epoch": 591} {"train_loss": -20.150009155273438, "global_step": 49091, "epoch": 591} {"train_loss": -20.030324935913086, "global_step": 49092, "epoch": 591} {"train_loss": -19.84922218322754, "global_step": 49093, "epoch": 591} {"train_loss": -20.150897979736328, "global_step": 49094, "epoch": 591} {"train_loss": -19.814268112182617, "global_step": 49095, "epoch": 591} {"train_loss": -19.52764320373535, "global_step": 49096, "epoch": 591} {"train_loss": -19.601383209228516, "global_step": 49097, "epoch": 591} {"train_loss": -19.808027267456055, "global_step": 49098, "epoch": 591} {"train_loss": -20.0332088470459, "global_step": 49099, "epoch": 591} {"train_loss": -19.82267189025879, "global_step": 49100, "epoch": 591} {"train_loss": -20.39240074157715, "global_step": 49101, "epoch": 591} {"train_loss": -19.587018966674805, "global_step": 49102, "epoch": 591} {"train_loss": -19.855066299438477, "global_step": 49103, "epoch": 591} {"train_loss": -20.04214859008789, "global_step": 49104, "epoch": 591} {"train_loss": -19.871408462524414, "global_step": 49105, "epoch": 591} {"train_loss": -19.9412784576416, "global_step": 49106, "epoch": 591} {"train_loss": -20.014184951782227, "global_step": 49107, "epoch": 591} {"train_loss": -19.85589599609375, "global_step": 49108, "epoch": 591} {"train_loss": -20.09345817565918, "global_step": 49109, "epoch": 591} {"train_loss": -20.21406364440918, "global_step": 49110, "epoch": 591} {"train_loss": -20.255929946899414, "global_step": 49111, "epoch": 591} {"train_loss": -20.1711483001709, "global_step": 49112, "epoch": 591} {"train_loss": -19.872873306274414, "global_step": 49113, "epoch": 591} {"train_loss": -19.73390007019043, "global_step": 49114, "epoch": 591} {"train_loss": -20.544872283935547, "global_step": 49115, "epoch": 591} {"train_loss": -19.9349308013916, "global_step": 49116, "epoch": 591} {"train_loss": -19.968717575073242, "global_step": 49117, "epoch": 591} {"train_loss": -20.136886596679688, "global_step": 49118, "epoch": 591} {"train_loss": -19.535255432128906, "global_step": 49119, "epoch": 591} {"train_loss": -19.863534927368164, "global_step": 49120, "epoch": 591} {"train_loss": -19.894323348999023, "global_step": 49121, "epoch": 591} {"train_loss": -20.018878936767578, "global_step": 49122, "epoch": 591} {"train_loss": -19.7188663482666, "global_step": 49123, "epoch": 591} {"train_loss": -19.62560272216797, "global_step": 49124, "epoch": 591} {"train_loss": -19.941389083862305, "global_step": 49125, "epoch": 591} {"train_loss": -19.815937042236328, "global_step": 49126, "epoch": 591} {"train_loss": -20.021371841430664, "global_step": 49127, "epoch": 591} {"train_loss": -20.140371322631836, "global_step": 49128, "epoch": 591} {"train_loss": -19.537260055541992, "global_step": 49129, "epoch": 591} {"train_loss": -19.80966567993164, "global_step": 49130, "epoch": 591} {"train_loss": -19.936481475830078, "global_step": 49131, "epoch": 591} {"train_loss": -20.144250869750977, "global_step": 49132, "epoch": 591} {"train_loss": -19.702077865600586, "global_step": 49133, "epoch": 591} {"train_loss": -19.525962829589844, "global_step": 49134, "epoch": 591} {"train_loss": -19.881599472229738, "global_step": 49135, "epoch": 591, "val_loss": 6059180.0} {"train_loss": -19.783475875854492, "global_step": 49136, "epoch": 592} {"train_loss": -19.02082061767578, "global_step": 49137, "epoch": 592} {"train_loss": -19.665267944335938, "global_step": 49138, "epoch": 592} {"train_loss": -19.586530685424805, "global_step": 49139, "epoch": 592} {"train_loss": -19.784086227416992, "global_step": 49140, "epoch": 592} {"train_loss": -19.752058029174805, "global_step": 49141, "epoch": 592} {"train_loss": -19.597692489624023, "global_step": 49142, "epoch": 592} {"train_loss": -19.791828155517578, "global_step": 49143, "epoch": 592} {"train_loss": -19.62140464782715, "global_step": 49144, "epoch": 592} {"train_loss": -19.699527740478516, "global_step": 49145, "epoch": 592} {"train_loss": -19.736644744873047, "global_step": 49146, "epoch": 592} {"train_loss": -19.7976016998291, "global_step": 49147, "epoch": 592} {"train_loss": -19.780324935913086, "global_step": 49148, "epoch": 592} {"train_loss": -19.849674224853516, "global_step": 49149, "epoch": 592} {"train_loss": -19.751127243041992, "global_step": 49150, "epoch": 592} {"train_loss": -20.046512603759766, "global_step": 49151, "epoch": 592} {"train_loss": -20.132394790649414, "global_step": 49152, "epoch": 592} {"train_loss": -19.66756248474121, "global_step": 49153, "epoch": 592} {"train_loss": -20.139205932617188, "global_step": 49154, "epoch": 592} {"train_loss": -19.720014572143555, "global_step": 49155, "epoch": 592} {"train_loss": -20.007726669311523, "global_step": 49156, "epoch": 592} {"train_loss": -19.65557098388672, "global_step": 49157, "epoch": 592} {"train_loss": -19.95522117614746, "global_step": 49158, "epoch": 592} {"train_loss": -19.941320419311523, "global_step": 49159, "epoch": 592} {"train_loss": -19.8284912109375, "global_step": 49160, "epoch": 592} {"train_loss": -20.007781982421875, "global_step": 49161, "epoch": 592} {"train_loss": -19.71266746520996, "global_step": 49162, "epoch": 592} {"train_loss": -19.952844619750977, "global_step": 49163, "epoch": 592} {"train_loss": -19.484899520874023, "global_step": 49164, "epoch": 592} {"train_loss": -19.72108268737793, "global_step": 49165, "epoch": 592} {"train_loss": -19.87806510925293, "global_step": 49166, "epoch": 592} {"train_loss": -20.125524520874023, "global_step": 49167, "epoch": 592} {"train_loss": -20.010019302368164, "global_step": 49168, "epoch": 592} {"train_loss": -19.72678565979004, "global_step": 49169, "epoch": 592} {"train_loss": -19.70863914489746, "global_step": 49170, "epoch": 592} {"train_loss": -19.680273056030273, "global_step": 49171, "epoch": 592} {"train_loss": -20.01369285583496, "global_step": 49172, "epoch": 592} {"train_loss": -20.247419357299805, "global_step": 49173, "epoch": 592} {"train_loss": -19.918495178222656, "global_step": 49174, "epoch": 592} {"train_loss": -19.80992317199707, "global_step": 49175, "epoch": 592} {"train_loss": -19.699186325073242, "global_step": 49176, "epoch": 592} {"train_loss": -19.947046279907227, "global_step": 49177, "epoch": 592} {"train_loss": -20.1356258392334, "global_step": 49178, "epoch": 592} {"train_loss": -19.83538246154785, "global_step": 49179, "epoch": 592} {"train_loss": -20.20882225036621, "global_step": 49180, "epoch": 592} {"train_loss": -19.878202438354492, "global_step": 49181, "epoch": 592} {"train_loss": -19.814645767211914, "global_step": 49182, "epoch": 592} {"train_loss": -20.066865921020508, "global_step": 49183, "epoch": 592} {"train_loss": -20.21377944946289, "global_step": 49184, "epoch": 592} {"train_loss": -19.700937271118164, "global_step": 49185, "epoch": 592} {"train_loss": -19.991174697875977, "global_step": 49186, "epoch": 592} {"train_loss": -20.048669815063477, "global_step": 49187, "epoch": 592} {"train_loss": -19.585386276245117, "global_step": 49188, "epoch": 592} {"train_loss": -19.650150299072266, "global_step": 49189, "epoch": 592} {"train_loss": -19.71003532409668, "global_step": 49190, "epoch": 592} {"train_loss": -19.909238815307617, "global_step": 49191, "epoch": 592} {"train_loss": -19.862369537353516, "global_step": 49192, "epoch": 592} {"train_loss": -19.884069442749023, "global_step": 49193, "epoch": 592} {"train_loss": -20.046173095703125, "global_step": 49194, "epoch": 592} {"train_loss": -19.722440719604492, "global_step": 49195, "epoch": 592} {"train_loss": -19.782180786132812, "global_step": 49196, "epoch": 592} {"train_loss": -19.821157455444336, "global_step": 49197, "epoch": 592} {"train_loss": -20.179706573486328, "global_step": 49198, "epoch": 592} {"train_loss": -20.14468765258789, "global_step": 49199, "epoch": 592} {"train_loss": -20.04433250427246, "global_step": 49200, "epoch": 592} {"train_loss": -19.550453186035156, "global_step": 49201, "epoch": 592} {"train_loss": -19.87038230895996, "global_step": 49202, "epoch": 592} {"train_loss": -19.89496612548828, "global_step": 49203, "epoch": 592} {"train_loss": -19.522279739379883, "global_step": 49204, "epoch": 592} {"train_loss": -20.01407814025879, "global_step": 49205, "epoch": 592} {"train_loss": -19.61385726928711, "global_step": 49206, "epoch": 592} {"train_loss": -20.115148544311523, "global_step": 49207, "epoch": 592} {"train_loss": -19.800796508789062, "global_step": 49208, "epoch": 592} {"train_loss": -20.055343627929688, "global_step": 49209, "epoch": 592} {"train_loss": -19.856781005859375, "global_step": 49210, "epoch": 592} {"train_loss": -19.761123657226562, "global_step": 49211, "epoch": 592} {"train_loss": -19.605031967163086, "global_step": 49212, "epoch": 592} {"train_loss": -20.11197853088379, "global_step": 49213, "epoch": 592} {"train_loss": -19.82707977294922, "global_step": 49214, "epoch": 592} {"train_loss": -19.63829231262207, "global_step": 49215, "epoch": 592} {"train_loss": -20.348737716674805, "global_step": 49216, "epoch": 592} {"train_loss": -19.61530876159668, "global_step": 49217, "epoch": 592} {"train_loss": -19.854662768812066, "global_step": 49218, "epoch": 592, "val_loss": 5955183.0} {"train_loss": -20.06618881225586, "global_step": 49219, "epoch": 593} {"train_loss": -19.914836883544922, "global_step": 49220, "epoch": 593} {"train_loss": -19.916746139526367, "global_step": 49221, "epoch": 593} {"train_loss": -20.02683448791504, "global_step": 49222, "epoch": 593} {"train_loss": -19.93645477294922, "global_step": 49223, "epoch": 593} {"train_loss": -19.63909149169922, "global_step": 49224, "epoch": 593} {"train_loss": -19.785917282104492, "global_step": 49225, "epoch": 593} {"train_loss": -19.708532333374023, "global_step": 49226, "epoch": 593} {"train_loss": -19.829174041748047, "global_step": 49227, "epoch": 593} {"train_loss": -20.072843551635742, "global_step": 49228, "epoch": 593} {"train_loss": -19.6970272064209, "global_step": 49229, "epoch": 593} {"train_loss": -19.779911041259766, "global_step": 49230, "epoch": 593} {"train_loss": -20.047271728515625, "global_step": 49231, "epoch": 593} {"train_loss": -19.6065731048584, "global_step": 49232, "epoch": 593} {"train_loss": -19.992334365844727, "global_step": 49233, "epoch": 593} {"train_loss": -19.940885543823242, "global_step": 49234, "epoch": 593} {"train_loss": -19.893964767456055, "global_step": 49235, "epoch": 593} {"train_loss": -20.067609786987305, "global_step": 49236, "epoch": 593} {"train_loss": -19.847389221191406, "global_step": 49237, "epoch": 593} {"train_loss": -20.05514144897461, "global_step": 49238, "epoch": 593} {"train_loss": -19.899045944213867, "global_step": 49239, "epoch": 593} {"train_loss": -19.417238235473633, "global_step": 49240, "epoch": 593} {"train_loss": -19.749799728393555, "global_step": 49241, "epoch": 593} {"train_loss": -19.561986923217773, "global_step": 49242, "epoch": 593} {"train_loss": -20.397207260131836, "global_step": 49243, "epoch": 593} {"train_loss": -20.085962295532227, "global_step": 49244, "epoch": 593} {"train_loss": -19.751745223999023, "global_step": 49245, "epoch": 593} {"train_loss": -19.934429168701172, "global_step": 49246, "epoch": 593} {"train_loss": -19.79495620727539, "global_step": 49247, "epoch": 593} {"train_loss": -19.6363582611084, "global_step": 49248, "epoch": 593} {"train_loss": -19.833913803100586, "global_step": 49249, "epoch": 593} {"train_loss": -20.364532470703125, "global_step": 49250, "epoch": 593} {"train_loss": -19.929035186767578, "global_step": 49251, "epoch": 593} {"train_loss": -20.03284454345703, "global_step": 49252, "epoch": 593} {"train_loss": -19.691423416137695, "global_step": 49253, "epoch": 593} {"train_loss": -19.461898803710938, "global_step": 49254, "epoch": 593} {"train_loss": -19.853281021118164, "global_step": 49255, "epoch": 593} {"train_loss": -20.138561248779297, "global_step": 49256, "epoch": 593} {"train_loss": -19.926809310913086, "global_step": 49257, "epoch": 593} {"train_loss": -19.81739616394043, "global_step": 49258, "epoch": 593} {"train_loss": -20.039262771606445, "global_step": 49259, "epoch": 593} {"train_loss": -19.929182052612305, "global_step": 49260, "epoch": 593} {"train_loss": -20.030324935913086, "global_step": 49261, "epoch": 593} {"train_loss": -19.964340209960938, "global_step": 49262, "epoch": 593} {"train_loss": -19.846641540527344, "global_step": 49263, "epoch": 593} {"train_loss": -20.051361083984375, "global_step": 49264, "epoch": 593} {"train_loss": -19.9987850189209, "global_step": 49265, "epoch": 593} {"train_loss": -20.08639144897461, "global_step": 49266, "epoch": 593} {"train_loss": -20.142614364624023, "global_step": 49267, "epoch": 593} {"train_loss": -20.308181762695312, "global_step": 49268, "epoch": 593} {"train_loss": -19.955961227416992, "global_step": 49269, "epoch": 593} {"train_loss": -20.138774871826172, "global_step": 49270, "epoch": 593} {"train_loss": -19.751506805419922, "global_step": 49271, "epoch": 593} {"train_loss": -19.888044357299805, "global_step": 49272, "epoch": 593} {"train_loss": -19.721384048461914, "global_step": 49273, "epoch": 593} {"train_loss": -19.806659698486328, "global_step": 49274, "epoch": 593} {"train_loss": -19.953266143798828, "global_step": 49275, "epoch": 593} {"train_loss": -20.323413848876953, "global_step": 49276, "epoch": 593} {"train_loss": -20.087749481201172, "global_step": 49277, "epoch": 593} {"train_loss": -19.818771362304688, "global_step": 49278, "epoch": 593} {"train_loss": -20.077957153320312, "global_step": 49279, "epoch": 593} {"train_loss": -20.067289352416992, "global_step": 49280, "epoch": 593} {"train_loss": -19.870107650756836, "global_step": 49281, "epoch": 593} {"train_loss": -19.93873405456543, "global_step": 49282, "epoch": 593} {"train_loss": -20.076217651367188, "global_step": 49283, "epoch": 593} {"train_loss": -19.645435333251953, "global_step": 49284, "epoch": 593} {"train_loss": -19.84649085998535, "global_step": 49285, "epoch": 593} {"train_loss": -20.038105010986328, "global_step": 49286, "epoch": 593} {"train_loss": -19.947086334228516, "global_step": 49287, "epoch": 593} {"train_loss": -19.919281005859375, "global_step": 49288, "epoch": 593} {"train_loss": -19.784337997436523, "global_step": 49289, "epoch": 593} {"train_loss": -19.839628219604492, "global_step": 49290, "epoch": 593} {"train_loss": -20.248760223388672, "global_step": 49291, "epoch": 593} {"train_loss": -19.857423782348633, "global_step": 49292, "epoch": 593} {"train_loss": -19.895627975463867, "global_step": 49293, "epoch": 593} {"train_loss": -20.20975112915039, "global_step": 49294, "epoch": 593} {"train_loss": -19.789276123046875, "global_step": 49295, "epoch": 593} {"train_loss": -20.11695671081543, "global_step": 49296, "epoch": 593} {"train_loss": -19.649930953979492, "global_step": 49297, "epoch": 593} {"train_loss": -20.033817291259766, "global_step": 49298, "epoch": 593} {"train_loss": -20.042924880981445, "global_step": 49299, "epoch": 593} {"train_loss": -20.346282958984375, "global_step": 49300, "epoch": 593} {"train_loss": -19.928685521504963, "global_step": 49301, "epoch": 593, "val_loss": 6071110.0} {"train_loss": -19.88123321533203, "global_step": 49302, "epoch": 594} {"train_loss": -19.81122398376465, "global_step": 49303, "epoch": 594} {"train_loss": -19.583206176757812, "global_step": 49304, "epoch": 594} {"train_loss": -19.34932518005371, "global_step": 49305, "epoch": 594} {"train_loss": -19.676292419433594, "global_step": 49306, "epoch": 594} {"train_loss": -20.06985855102539, "global_step": 49307, "epoch": 594} {"train_loss": -19.75337028503418, "global_step": 49308, "epoch": 594} {"train_loss": -19.9704647064209, "global_step": 49309, "epoch": 594} {"train_loss": -20.193891525268555, "global_step": 49310, "epoch": 594} {"train_loss": -19.898988723754883, "global_step": 49311, "epoch": 594} {"train_loss": -19.758071899414062, "global_step": 49312, "epoch": 594} {"train_loss": -19.78439712524414, "global_step": 49313, "epoch": 594} {"train_loss": -20.044544219970703, "global_step": 49314, "epoch": 594} {"train_loss": -19.950044631958008, "global_step": 49315, "epoch": 594} {"train_loss": -19.835647583007812, "global_step": 49316, "epoch": 594} {"train_loss": -20.031461715698242, "global_step": 49317, "epoch": 594} {"train_loss": -20.155881881713867, "global_step": 49318, "epoch": 594} {"train_loss": -20.237314224243164, "global_step": 49319, "epoch": 594} {"train_loss": -19.89725112915039, "global_step": 49320, "epoch": 594} {"train_loss": -19.748825073242188, "global_step": 49321, "epoch": 594} {"train_loss": -19.799570083618164, "global_step": 49322, "epoch": 594} {"train_loss": -19.926172256469727, "global_step": 49323, "epoch": 594} {"train_loss": -20.050052642822266, "global_step": 49324, "epoch": 594} {"train_loss": -19.571889877319336, "global_step": 49325, "epoch": 594} {"train_loss": -19.913419723510742, "global_step": 49326, "epoch": 594} {"train_loss": -19.90806007385254, "global_step": 49327, "epoch": 594} {"train_loss": -19.628341674804688, "global_step": 49328, "epoch": 594} {"train_loss": -19.997604370117188, "global_step": 49329, "epoch": 594} {"train_loss": -19.477874755859375, "global_step": 49330, "epoch": 594} {"train_loss": -19.682872772216797, "global_step": 49331, "epoch": 594} {"train_loss": -20.345605850219727, "global_step": 49332, "epoch": 594} {"train_loss": -19.728107452392578, "global_step": 49333, "epoch": 594} {"train_loss": -19.57636833190918, "global_step": 49334, "epoch": 594} {"train_loss": -19.838056564331055, "global_step": 49335, "epoch": 594} {"train_loss": -19.764453887939453, "global_step": 49336, "epoch": 594} {"train_loss": -19.872983932495117, "global_step": 49337, "epoch": 594} {"train_loss": -20.14713478088379, "global_step": 49338, "epoch": 594} {"train_loss": -19.970075607299805, "global_step": 49339, "epoch": 594} {"train_loss": -19.761449813842773, "global_step": 49340, "epoch": 594} {"train_loss": -19.824665069580078, "global_step": 49341, "epoch": 594} {"train_loss": -20.0297908782959, "global_step": 49342, "epoch": 594} {"train_loss": -20.08880615234375, "global_step": 49343, "epoch": 594} {"train_loss": -19.883758544921875, "global_step": 49344, "epoch": 594} {"train_loss": -19.9797420501709, "global_step": 49345, "epoch": 594} {"train_loss": -19.895343780517578, "global_step": 49346, "epoch": 594} {"train_loss": -19.673511505126953, "global_step": 49347, "epoch": 594} {"train_loss": -19.802473068237305, "global_step": 49348, "epoch": 594} {"train_loss": -19.96639633178711, "global_step": 49349, "epoch": 594} {"train_loss": -19.939239501953125, "global_step": 49350, "epoch": 594} {"train_loss": -20.08211326599121, "global_step": 49351, "epoch": 594} {"train_loss": -20.013071060180664, "global_step": 49352, "epoch": 594} {"train_loss": -19.85692596435547, "global_step": 49353, "epoch": 594} {"train_loss": -19.882490158081055, "global_step": 49354, "epoch": 594} {"train_loss": -20.04456329345703, "global_step": 49355, "epoch": 594} {"train_loss": -19.7457332611084, "global_step": 49356, "epoch": 594} {"train_loss": -19.502227783203125, "global_step": 49357, "epoch": 594} {"train_loss": -19.92051124572754, "global_step": 49358, "epoch": 594} {"train_loss": -19.75947380065918, "global_step": 49359, "epoch": 594} {"train_loss": -19.63721466064453, "global_step": 49360, "epoch": 594} {"train_loss": -20.057199478149414, "global_step": 49361, "epoch": 594} {"train_loss": -20.116622924804688, "global_step": 49362, "epoch": 594} {"train_loss": -20.115633010864258, "global_step": 49363, "epoch": 594} {"train_loss": -19.67197036743164, "global_step": 49364, "epoch": 594} {"train_loss": -20.49822998046875, "global_step": 49365, "epoch": 594} {"train_loss": -19.982097625732422, "global_step": 49366, "epoch": 594} {"train_loss": -19.83241844177246, "global_step": 49367, "epoch": 594} {"train_loss": -19.915189743041992, "global_step": 49368, "epoch": 594} {"train_loss": -19.836505889892578, "global_step": 49369, "epoch": 594} {"train_loss": -19.966299057006836, "global_step": 49370, "epoch": 594} {"train_loss": -20.361106872558594, "global_step": 49371, "epoch": 594} {"train_loss": -19.9378719329834, "global_step": 49372, "epoch": 594} {"train_loss": -19.855422973632812, "global_step": 49373, "epoch": 594} {"train_loss": -20.06282615661621, "global_step": 49374, "epoch": 594} {"train_loss": -19.497831344604492, "global_step": 49375, "epoch": 594} {"train_loss": -19.806964874267578, "global_step": 49376, "epoch": 594} {"train_loss": -19.9029598236084, "global_step": 49377, "epoch": 594} {"train_loss": -19.909561157226562, "global_step": 49378, "epoch": 594} {"train_loss": -20.011816024780273, "global_step": 49379, "epoch": 594} {"train_loss": -19.814838409423828, "global_step": 49380, "epoch": 594} {"train_loss": -20.0213565826416, "global_step": 49381, "epoch": 594} {"train_loss": -19.987192153930664, "global_step": 49382, "epoch": 594} {"train_loss": -19.935869216918945, "global_step": 49383, "epoch": 594} {"train_loss": -19.89280139969056, "global_step": 49384, "epoch": 594, "val_loss": 6195857.0} {"train_loss": -19.903182983398438, "global_step": 49385, "epoch": 595} {"train_loss": -20.05293846130371, "global_step": 49386, "epoch": 595} {"train_loss": -20.189538955688477, "global_step": 49387, "epoch": 595} {"train_loss": -19.848896026611328, "global_step": 49388, "epoch": 595} {"train_loss": -19.839874267578125, "global_step": 49389, "epoch": 595} {"train_loss": -19.602331161499023, "global_step": 49390, "epoch": 595} {"train_loss": -19.85582160949707, "global_step": 49391, "epoch": 595} {"train_loss": -19.848918914794922, "global_step": 49392, "epoch": 595} {"train_loss": -19.925006866455078, "global_step": 49393, "epoch": 595} {"train_loss": -20.073009490966797, "global_step": 49394, "epoch": 595} {"train_loss": -19.921987533569336, "global_step": 49395, "epoch": 595} {"train_loss": -19.537275314331055, "global_step": 49396, "epoch": 595} {"train_loss": -20.12391471862793, "global_step": 49397, "epoch": 595} {"train_loss": -19.722105026245117, "global_step": 49398, "epoch": 595} {"train_loss": -19.599573135375977, "global_step": 49399, "epoch": 595} {"train_loss": -19.873111724853516, "global_step": 49400, "epoch": 595} {"train_loss": -19.722854614257812, "global_step": 49401, "epoch": 595} {"train_loss": -20.035383224487305, "global_step": 49402, "epoch": 595} {"train_loss": -20.1292724609375, "global_step": 49403, "epoch": 595} {"train_loss": -20.09354591369629, "global_step": 49404, "epoch": 595} {"train_loss": -19.943641662597656, "global_step": 49405, "epoch": 595} {"train_loss": -20.145296096801758, "global_step": 49406, "epoch": 595} {"train_loss": -19.558013916015625, "global_step": 49407, "epoch": 595} {"train_loss": -19.92499351501465, "global_step": 49408, "epoch": 595} {"train_loss": -20.24090576171875, "global_step": 49409, "epoch": 595} {"train_loss": -19.67564582824707, "global_step": 49410, "epoch": 595} {"train_loss": -19.763029098510742, "global_step": 49411, "epoch": 595} {"train_loss": -20.088220596313477, "global_step": 49412, "epoch": 595} {"train_loss": -20.006942749023438, "global_step": 49413, "epoch": 595} {"train_loss": -19.95721435546875, "global_step": 49414, "epoch": 595} {"train_loss": -19.61768913269043, "global_step": 49415, "epoch": 595} {"train_loss": -20.002798080444336, "global_step": 49416, "epoch": 595} {"train_loss": -19.77734375, "global_step": 49417, "epoch": 595} {"train_loss": -19.824817657470703, "global_step": 49418, "epoch": 595} {"train_loss": -20.049575805664062, "global_step": 49419, "epoch": 595} {"train_loss": -19.77157974243164, "global_step": 49420, "epoch": 595} {"train_loss": -20.077896118164062, "global_step": 49421, "epoch": 595} {"train_loss": -20.139083862304688, "global_step": 49422, "epoch": 595} {"train_loss": -19.942481994628906, "global_step": 49423, "epoch": 595} {"train_loss": -19.632505416870117, "global_step": 49424, "epoch": 595} {"train_loss": -19.866872787475586, "global_step": 49425, "epoch": 595} {"train_loss": -19.959333419799805, "global_step": 49426, "epoch": 595} {"train_loss": -19.935895919799805, "global_step": 49427, "epoch": 595} {"train_loss": -19.9509334564209, "global_step": 49428, "epoch": 595} {"train_loss": -19.787643432617188, "global_step": 49429, "epoch": 595} {"train_loss": -19.945058822631836, "global_step": 49430, "epoch": 595} {"train_loss": -20.10176658630371, "global_step": 49431, "epoch": 595} {"train_loss": -19.940885543823242, "global_step": 49432, "epoch": 595} {"train_loss": -19.947660446166992, "global_step": 49433, "epoch": 595} {"train_loss": -20.247854232788086, "global_step": 49434, "epoch": 595} {"train_loss": -19.993017196655273, "global_step": 49435, "epoch": 595} {"train_loss": -20.0018367767334, "global_step": 49436, "epoch": 595} {"train_loss": -19.973325729370117, "global_step": 49437, "epoch": 595} {"train_loss": -19.780500411987305, "global_step": 49438, "epoch": 595} {"train_loss": -19.825895309448242, "global_step": 49439, "epoch": 595} {"train_loss": -20.03127670288086, "global_step": 49440, "epoch": 595} {"train_loss": -20.045530319213867, "global_step": 49441, "epoch": 595} {"train_loss": -19.864770889282227, "global_step": 49442, "epoch": 595} {"train_loss": -19.703367233276367, "global_step": 49443, "epoch": 595} {"train_loss": -19.884498596191406, "global_step": 49444, "epoch": 595} {"train_loss": -19.813291549682617, "global_step": 49445, "epoch": 595} {"train_loss": -20.001922607421875, "global_step": 49446, "epoch": 595} {"train_loss": -19.75876235961914, "global_step": 49447, "epoch": 595} {"train_loss": -20.117420196533203, "global_step": 49448, "epoch": 595} {"train_loss": -19.545089721679688, "global_step": 49449, "epoch": 595} {"train_loss": -20.008359909057617, "global_step": 49450, "epoch": 595} {"train_loss": -20.024513244628906, "global_step": 49451, "epoch": 595} {"train_loss": -19.498985290527344, "global_step": 49452, "epoch": 595} {"train_loss": -20.024200439453125, "global_step": 49453, "epoch": 595} {"train_loss": -19.756547927856445, "global_step": 49454, "epoch": 595} {"train_loss": -19.566837310791016, "global_step": 49455, "epoch": 595} {"train_loss": -19.957475662231445, "global_step": 49456, "epoch": 595} {"train_loss": -19.931468963623047, "global_step": 49457, "epoch": 595} {"train_loss": -19.8678035736084, "global_step": 49458, "epoch": 595} {"train_loss": -20.051895141601562, "global_step": 49459, "epoch": 595} {"train_loss": -20.186874389648438, "global_step": 49460, "epoch": 595} {"train_loss": -19.41676902770996, "global_step": 49461, "epoch": 595} {"train_loss": -19.794889450073242, "global_step": 49462, "epoch": 595} {"train_loss": -20.167491912841797, "global_step": 49463, "epoch": 595} {"train_loss": -19.710962295532227, "global_step": 49464, "epoch": 595} {"train_loss": -19.77411460876465, "global_step": 49465, "epoch": 595} {"train_loss": -19.879865646362305, "global_step": 49466, "epoch": 595} {"train_loss": -19.89126274384648, "global_step": 49467, "epoch": 595, "val_loss": 5954891.5} {"train_loss": -19.512929916381836, "global_step": 49468, "epoch": 596} {"train_loss": -19.41167640686035, "global_step": 49469, "epoch": 596} {"train_loss": -19.821123123168945, "global_step": 49470, "epoch": 596} {"train_loss": -19.866104125976562, "global_step": 49471, "epoch": 596} {"train_loss": -19.948766708374023, "global_step": 49472, "epoch": 596} {"train_loss": -19.29572105407715, "global_step": 49473, "epoch": 596} {"train_loss": -19.42232322692871, "global_step": 49474, "epoch": 596} {"train_loss": -19.40380859375, "global_step": 49475, "epoch": 596} {"train_loss": -19.851150512695312, "global_step": 49476, "epoch": 596} {"train_loss": -19.500791549682617, "global_step": 49477, "epoch": 596} {"train_loss": -19.714359283447266, "global_step": 49478, "epoch": 596} {"train_loss": -19.72052764892578, "global_step": 49479, "epoch": 596} {"train_loss": -19.74982452392578, "global_step": 49480, "epoch": 596} {"train_loss": -19.584386825561523, "global_step": 49481, "epoch": 596} {"train_loss": -19.7665958404541, "global_step": 49482, "epoch": 596} {"train_loss": -19.581092834472656, "global_step": 49483, "epoch": 596} {"train_loss": -19.858631134033203, "global_step": 49484, "epoch": 596} {"train_loss": -20.0109920501709, "global_step": 49485, "epoch": 596} {"train_loss": -19.967988967895508, "global_step": 49486, "epoch": 596} {"train_loss": -20.017133712768555, "global_step": 49487, "epoch": 596} {"train_loss": -19.629301071166992, "global_step": 49488, "epoch": 596} {"train_loss": -20.1165771484375, "global_step": 49489, "epoch": 596} {"train_loss": -20.149887084960938, "global_step": 49490, "epoch": 596} {"train_loss": -19.879985809326172, "global_step": 49491, "epoch": 596} {"train_loss": -19.520618438720703, "global_step": 49492, "epoch": 596} {"train_loss": -20.149580001831055, "global_step": 49493, "epoch": 596} {"train_loss": -19.876205444335938, "global_step": 49494, "epoch": 596} {"train_loss": -19.373563766479492, "global_step": 49495, "epoch": 596} {"train_loss": -19.79459571838379, "global_step": 49496, "epoch": 596} {"train_loss": -19.838438034057617, "global_step": 49497, "epoch": 596} {"train_loss": -19.528623580932617, "global_step": 49498, "epoch": 596} {"train_loss": -19.845638275146484, "global_step": 49499, "epoch": 596} {"train_loss": -20.0516414642334, "global_step": 49500, "epoch": 596} {"train_loss": -20.098464965820312, "global_step": 49501, "epoch": 596} {"train_loss": -19.75898551940918, "global_step": 49502, "epoch": 596} {"train_loss": -20.11117935180664, "global_step": 49503, "epoch": 596} {"train_loss": -19.724842071533203, "global_step": 49504, "epoch": 596} {"train_loss": -19.545644760131836, "global_step": 49505, "epoch": 596} {"train_loss": -20.03057289123535, "global_step": 49506, "epoch": 596} {"train_loss": -20.010883331298828, "global_step": 49507, "epoch": 596} {"train_loss": -20.072509765625, "global_step": 49508, "epoch": 596} {"train_loss": -20.347366333007812, "global_step": 49509, "epoch": 596} {"train_loss": -19.543350219726562, "global_step": 49510, "epoch": 596} {"train_loss": -19.63511085510254, "global_step": 49511, "epoch": 596} {"train_loss": -19.469797134399414, "global_step": 49512, "epoch": 596} {"train_loss": -19.948118209838867, "global_step": 49513, "epoch": 596} {"train_loss": -20.00227928161621, "global_step": 49514, "epoch": 596} {"train_loss": -19.8674373626709, "global_step": 49515, "epoch": 596} {"train_loss": -20.096982955932617, "global_step": 49516, "epoch": 596} {"train_loss": -20.152738571166992, "global_step": 49517, "epoch": 596} {"train_loss": -19.41778564453125, "global_step": 49518, "epoch": 596} {"train_loss": -19.953886032104492, "global_step": 49519, "epoch": 596} {"train_loss": -19.94586181640625, "global_step": 49520, "epoch": 596} {"train_loss": -20.210988998413086, "global_step": 49521, "epoch": 596} {"train_loss": -19.759382247924805, "global_step": 49522, "epoch": 596} {"train_loss": -19.660648345947266, "global_step": 49523, "epoch": 596} {"train_loss": -20.092283248901367, "global_step": 49524, "epoch": 596} {"train_loss": -20.117996215820312, "global_step": 49525, "epoch": 596} {"train_loss": -19.622756958007812, "global_step": 49526, "epoch": 596} {"train_loss": -19.899320602416992, "global_step": 49527, "epoch": 596} {"train_loss": -19.71577262878418, "global_step": 49528, "epoch": 596} {"train_loss": -20.144405364990234, "global_step": 49529, "epoch": 596} {"train_loss": -19.589052200317383, "global_step": 49530, "epoch": 596} {"train_loss": -20.098783493041992, "global_step": 49531, "epoch": 596} {"train_loss": -20.395828247070312, "global_step": 49532, "epoch": 596} {"train_loss": -19.952228546142578, "global_step": 49533, "epoch": 596} {"train_loss": -19.838735580444336, "global_step": 49534, "epoch": 596} {"train_loss": -19.950847625732422, "global_step": 49535, "epoch": 596} {"train_loss": -19.830490112304688, "global_step": 49536, "epoch": 596} {"train_loss": -19.826763153076172, "global_step": 49537, "epoch": 596} {"train_loss": -19.86521339416504, "global_step": 49538, "epoch": 596} {"train_loss": -19.99918556213379, "global_step": 49539, "epoch": 596} {"train_loss": -19.915725708007812, "global_step": 49540, "epoch": 596} {"train_loss": -20.11688804626465, "global_step": 49541, "epoch": 596} {"train_loss": -19.93694496154785, "global_step": 49542, "epoch": 596} {"train_loss": -19.889005661010742, "global_step": 49543, "epoch": 596} {"train_loss": -19.988386154174805, "global_step": 49544, "epoch": 596} {"train_loss": -19.582366943359375, "global_step": 49545, "epoch": 596} {"train_loss": -19.833053588867188, "global_step": 49546, "epoch": 596} {"train_loss": -20.05318260192871, "global_step": 49547, "epoch": 596} {"train_loss": -19.90138816833496, "global_step": 49548, "epoch": 596} {"train_loss": -19.98780632019043, "global_step": 49549, "epoch": 596} {"train_loss": -19.842603614531367, "global_step": 49550, "epoch": 596, "val_loss": 5944106.0} {"train_loss": -19.91864013671875, "global_step": 49551, "epoch": 597} {"train_loss": -19.76270866394043, "global_step": 49552, "epoch": 597} {"train_loss": -19.76763343811035, "global_step": 49553, "epoch": 597} {"train_loss": -19.9341983795166, "global_step": 49554, "epoch": 597} {"train_loss": -20.09761619567871, "global_step": 49555, "epoch": 597} {"train_loss": -19.73904800415039, "global_step": 49556, "epoch": 597} {"train_loss": -19.616147994995117, "global_step": 49557, "epoch": 597} {"train_loss": -19.84731101989746, "global_step": 49558, "epoch": 597} {"train_loss": -20.01308250427246, "global_step": 49559, "epoch": 597} {"train_loss": -20.14697265625, "global_step": 49560, "epoch": 597} {"train_loss": -19.628116607666016, "global_step": 49561, "epoch": 597} {"train_loss": -20.032695770263672, "global_step": 49562, "epoch": 597} {"train_loss": -19.486114501953125, "global_step": 49563, "epoch": 597} {"train_loss": -19.900747299194336, "global_step": 49564, "epoch": 597} {"train_loss": -19.67376708984375, "global_step": 49565, "epoch": 597} {"train_loss": -19.551074981689453, "global_step": 49566, "epoch": 597} {"train_loss": -19.9776554107666, "global_step": 49567, "epoch": 597} {"train_loss": -19.883214950561523, "global_step": 49568, "epoch": 597} {"train_loss": -19.805673599243164, "global_step": 49569, "epoch": 597} {"train_loss": -19.929306030273438, "global_step": 49570, "epoch": 597} {"train_loss": -19.8115234375, "global_step": 49571, "epoch": 597} {"train_loss": -20.00119400024414, "global_step": 49572, "epoch": 597} {"train_loss": -20.285295486450195, "global_step": 49573, "epoch": 597} {"train_loss": -20.041311264038086, "global_step": 49574, "epoch": 597} {"train_loss": -20.13698387145996, "global_step": 49575, "epoch": 597} {"train_loss": -20.04642677307129, "global_step": 49576, "epoch": 597} {"train_loss": -20.018564224243164, "global_step": 49577, "epoch": 597} {"train_loss": -19.702838897705078, "global_step": 49578, "epoch": 597} {"train_loss": -19.880325317382812, "global_step": 49579, "epoch": 597} {"train_loss": -19.905241012573242, "global_step": 49580, "epoch": 597} {"train_loss": -19.584272384643555, "global_step": 49581, "epoch": 597} {"train_loss": -19.988664627075195, "global_step": 49582, "epoch": 597} {"train_loss": -20.052061080932617, "global_step": 49583, "epoch": 597} {"train_loss": -19.8430233001709, "global_step": 49584, "epoch": 597} {"train_loss": -19.917678833007812, "global_step": 49585, "epoch": 597} {"train_loss": -19.798263549804688, "global_step": 49586, "epoch": 597} {"train_loss": -19.549835205078125, "global_step": 49587, "epoch": 597} {"train_loss": -19.677780151367188, "global_step": 49588, "epoch": 597} {"train_loss": -19.92571258544922, "global_step": 49589, "epoch": 597} {"train_loss": -20.285266876220703, "global_step": 49590, "epoch": 597} {"train_loss": -20.034494400024414, "global_step": 49591, "epoch": 597} {"train_loss": -19.990095138549805, "global_step": 49592, "epoch": 597} {"train_loss": -20.139394760131836, "global_step": 49593, "epoch": 597} {"train_loss": -20.112668991088867, "global_step": 49594, "epoch": 597} {"train_loss": -19.627634048461914, "global_step": 49595, "epoch": 597} {"train_loss": -19.929906845092773, "global_step": 49596, "epoch": 597} {"train_loss": -19.898359298706055, "global_step": 49597, "epoch": 597} {"train_loss": -19.702951431274414, "global_step": 49598, "epoch": 597} {"train_loss": -19.671911239624023, "global_step": 49599, "epoch": 597} {"train_loss": -19.74945068359375, "global_step": 49600, "epoch": 597} {"train_loss": -19.863683700561523, "global_step": 49601, "epoch": 597} {"train_loss": -20.030488967895508, "global_step": 49602, "epoch": 597} {"train_loss": -19.939790725708008, "global_step": 49603, "epoch": 597} {"train_loss": -19.63605308532715, "global_step": 49604, "epoch": 597} {"train_loss": -20.034378051757812, "global_step": 49605, "epoch": 597} {"train_loss": -20.110660552978516, "global_step": 49606, "epoch": 597} {"train_loss": -20.087520599365234, "global_step": 49607, "epoch": 597} {"train_loss": -20.232248306274414, "global_step": 49608, "epoch": 597} {"train_loss": -19.577102661132812, "global_step": 49609, "epoch": 597} {"train_loss": -20.05965232849121, "global_step": 49610, "epoch": 597} {"train_loss": -20.083444595336914, "global_step": 49611, "epoch": 597} {"train_loss": -19.800138473510742, "global_step": 49612, "epoch": 597} {"train_loss": -20.017175674438477, "global_step": 49613, "epoch": 597} {"train_loss": -19.8144588470459, "global_step": 49614, "epoch": 597} {"train_loss": -19.944091796875, "global_step": 49615, "epoch": 597} {"train_loss": -20.13518714904785, "global_step": 49616, "epoch": 597} {"train_loss": -20.14827537536621, "global_step": 49617, "epoch": 597} {"train_loss": -19.8289737701416, "global_step": 49618, "epoch": 597} {"train_loss": -20.05371856689453, "global_step": 49619, "epoch": 597} {"train_loss": -19.797800064086914, "global_step": 49620, "epoch": 597} {"train_loss": -19.786518096923828, "global_step": 49621, "epoch": 597} {"train_loss": -19.901247024536133, "global_step": 49622, "epoch": 597} {"train_loss": -20.082683563232422, "global_step": 49623, "epoch": 597} {"train_loss": -19.83222770690918, "global_step": 49624, "epoch": 597} {"train_loss": -19.738611221313477, "global_step": 49625, "epoch": 597} {"train_loss": -19.9658145904541, "global_step": 49626, "epoch": 597} {"train_loss": -19.848129272460938, "global_step": 49627, "epoch": 597} {"train_loss": -20.306962966918945, "global_step": 49628, "epoch": 597} {"train_loss": -20.112411499023438, "global_step": 49629, "epoch": 597} {"train_loss": -19.846784591674805, "global_step": 49630, "epoch": 597} {"train_loss": -19.789655685424805, "global_step": 49631, "epoch": 597} {"train_loss": -20.141040802001953, "global_step": 49632, "epoch": 597} {"train_loss": -19.911759640797076, "global_step": 49633, "epoch": 597, "val_loss": 6065705.0} {"train_loss": -19.87790870666504, "global_step": 49634, "epoch": 598} {"train_loss": -19.66452980041504, "global_step": 49635, "epoch": 598} {"train_loss": -19.640872955322266, "global_step": 49636, "epoch": 598} {"train_loss": -19.637052536010742, "global_step": 49637, "epoch": 598} {"train_loss": -19.729284286499023, "global_step": 49638, "epoch": 598} {"train_loss": -19.87908363342285, "global_step": 49639, "epoch": 598} {"train_loss": -19.553361892700195, "global_step": 49640, "epoch": 598} {"train_loss": -19.768646240234375, "global_step": 49641, "epoch": 598} {"train_loss": -19.845422744750977, "global_step": 49642, "epoch": 598} {"train_loss": -19.881757736206055, "global_step": 49643, "epoch": 598} {"train_loss": -19.826086044311523, "global_step": 49644, "epoch": 598} {"train_loss": -19.81048011779785, "global_step": 49645, "epoch": 598} {"train_loss": -19.65299415588379, "global_step": 49646, "epoch": 598} {"train_loss": -19.67976951599121, "global_step": 49647, "epoch": 598} {"train_loss": -20.065994262695312, "global_step": 49648, "epoch": 598} {"train_loss": -19.574106216430664, "global_step": 49649, "epoch": 598} {"train_loss": -19.809432983398438, "global_step": 49650, "epoch": 598} {"train_loss": -20.001333236694336, "global_step": 49651, "epoch": 598} {"train_loss": -19.493457794189453, "global_step": 49652, "epoch": 598} {"train_loss": -20.069368362426758, "global_step": 49653, "epoch": 598} {"train_loss": -19.877470016479492, "global_step": 49654, "epoch": 598} {"train_loss": -20.033960342407227, "global_step": 49655, "epoch": 598} {"train_loss": -20.038463592529297, "global_step": 49656, "epoch": 598} {"train_loss": -19.762435913085938, "global_step": 49657, "epoch": 598} {"train_loss": -20.209497451782227, "global_step": 49658, "epoch": 598} {"train_loss": -20.027557373046875, "global_step": 49659, "epoch": 598} {"train_loss": -19.964786529541016, "global_step": 49660, "epoch": 598} {"train_loss": -19.759441375732422, "global_step": 49661, "epoch": 598} {"train_loss": -20.181406021118164, "global_step": 49662, "epoch": 598} {"train_loss": -20.2979679107666, "global_step": 49663, "epoch": 598} {"train_loss": -19.974557876586914, "global_step": 49664, "epoch": 598} {"train_loss": -19.842641830444336, "global_step": 49665, "epoch": 598} {"train_loss": -20.27776336669922, "global_step": 49666, "epoch": 598} {"train_loss": -19.711057662963867, "global_step": 49667, "epoch": 598} {"train_loss": -19.936050415039062, "global_step": 49668, "epoch": 598} {"train_loss": -19.91818618774414, "global_step": 49669, "epoch": 598} {"train_loss": -19.580514907836914, "global_step": 49670, "epoch": 598} {"train_loss": -19.566600799560547, "global_step": 49671, "epoch": 598} {"train_loss": -19.872587203979492, "global_step": 49672, "epoch": 598} {"train_loss": -19.797475814819336, "global_step": 49673, "epoch": 598} {"train_loss": -20.050769805908203, "global_step": 49674, "epoch": 598} {"train_loss": -19.889753341674805, "global_step": 49675, "epoch": 598} {"train_loss": -20.116363525390625, "global_step": 49676, "epoch": 598} {"train_loss": -19.73213005065918, "global_step": 49677, "epoch": 598} {"train_loss": -20.150554656982422, "global_step": 49678, "epoch": 598} {"train_loss": -20.217323303222656, "global_step": 49679, "epoch": 598} {"train_loss": -20.236225128173828, "global_step": 49680, "epoch": 598} {"train_loss": -20.01277732849121, "global_step": 49681, "epoch": 598} {"train_loss": -19.6146240234375, "global_step": 49682, "epoch": 598} {"train_loss": -20.186262130737305, "global_step": 49683, "epoch": 598} {"train_loss": -19.96493911743164, "global_step": 49684, "epoch": 598} {"train_loss": -19.957069396972656, "global_step": 49685, "epoch": 598} {"train_loss": -19.97822380065918, "global_step": 49686, "epoch": 598} {"train_loss": -19.920557022094727, "global_step": 49687, "epoch": 598} {"train_loss": -19.792842864990234, "global_step": 49688, "epoch": 598} {"train_loss": -20.30803871154785, "global_step": 49689, "epoch": 598} {"train_loss": -20.1560115814209, "global_step": 49690, "epoch": 598} {"train_loss": -19.9332218170166, "global_step": 49691, "epoch": 598} {"train_loss": -20.101757049560547, "global_step": 49692, "epoch": 598} {"train_loss": -19.6456356048584, "global_step": 49693, "epoch": 598} {"train_loss": -20.219661712646484, "global_step": 49694, "epoch": 598} {"train_loss": -19.592649459838867, "global_step": 49695, "epoch": 598} {"train_loss": -19.831811904907227, "global_step": 49696, "epoch": 598} {"train_loss": -19.88483238220215, "global_step": 49697, "epoch": 598} {"train_loss": -20.18144989013672, "global_step": 49698, "epoch": 598} {"train_loss": -19.847156524658203, "global_step": 49699, "epoch": 598} {"train_loss": -20.054813385009766, "global_step": 49700, "epoch": 598} {"train_loss": -19.803247451782227, "global_step": 49701, "epoch": 598} {"train_loss": -20.124130249023438, "global_step": 49702, "epoch": 598} {"train_loss": -19.802839279174805, "global_step": 49703, "epoch": 598} {"train_loss": -20.048063278198242, "global_step": 49704, "epoch": 598} {"train_loss": -20.159122467041016, "global_step": 49705, "epoch": 598} {"train_loss": -19.860000610351562, "global_step": 49706, "epoch": 598} {"train_loss": -19.79969596862793, "global_step": 49707, "epoch": 598} {"train_loss": -19.614805221557617, "global_step": 49708, "epoch": 598} {"train_loss": -19.833271026611328, "global_step": 49709, "epoch": 598} {"train_loss": -19.982908248901367, "global_step": 49710, "epoch": 598} {"train_loss": -19.879878997802734, "global_step": 49711, "epoch": 598} {"train_loss": -19.774240493774414, "global_step": 49712, "epoch": 598} {"train_loss": -19.769058227539062, "global_step": 49713, "epoch": 598} {"train_loss": -20.02193260192871, "global_step": 49714, "epoch": 598} {"train_loss": -20.010507583618164, "global_step": 49715, "epoch": 598} {"train_loss": -19.891297099101973, "global_step": 49716, "epoch": 598, "val_loss": 6067185.0} {"train_loss": -19.682661056518555, "global_step": 49717, "epoch": 599} {"train_loss": -20.117780685424805, "global_step": 49718, "epoch": 599} {"train_loss": -19.629697799682617, "global_step": 49719, "epoch": 599} {"train_loss": -19.7138614654541, "global_step": 49720, "epoch": 599} {"train_loss": -19.987394332885742, "global_step": 49721, "epoch": 599} {"train_loss": -19.748090744018555, "global_step": 49722, "epoch": 599} {"train_loss": -19.600629806518555, "global_step": 49723, "epoch": 599} {"train_loss": -19.70954132080078, "global_step": 49724, "epoch": 599} {"train_loss": -20.1805477142334, "global_step": 49725, "epoch": 599} {"train_loss": -20.044706344604492, "global_step": 49726, "epoch": 599} {"train_loss": -19.97210693359375, "global_step": 49727, "epoch": 599} {"train_loss": -19.964588165283203, "global_step": 49728, "epoch": 599} {"train_loss": -19.844669342041016, "global_step": 49729, "epoch": 599} {"train_loss": -19.829668045043945, "global_step": 49730, "epoch": 599} {"train_loss": -19.99340057373047, "global_step": 49731, "epoch": 599} {"train_loss": -19.95570945739746, "global_step": 49732, "epoch": 599} {"train_loss": -19.8587703704834, "global_step": 49733, "epoch": 599} {"train_loss": -19.89804458618164, "global_step": 49734, "epoch": 599} {"train_loss": -19.861061096191406, "global_step": 49735, "epoch": 599} {"train_loss": -19.89046287536621, "global_step": 49736, "epoch": 599} {"train_loss": -19.885318756103516, "global_step": 49737, "epoch": 599} {"train_loss": -19.970914840698242, "global_step": 49738, "epoch": 599} {"train_loss": -20.162565231323242, "global_step": 49739, "epoch": 599} {"train_loss": -19.980419158935547, "global_step": 49740, "epoch": 599} {"train_loss": -19.52410316467285, "global_step": 49741, "epoch": 599} {"train_loss": -19.952327728271484, "global_step": 49742, "epoch": 599} {"train_loss": -19.507572174072266, "global_step": 49743, "epoch": 599} {"train_loss": -20.191131591796875, "global_step": 49744, "epoch": 599} {"train_loss": -19.63787269592285, "global_step": 49745, "epoch": 599} {"train_loss": -20.01857566833496, "global_step": 49746, "epoch": 599} {"train_loss": -19.816883087158203, "global_step": 49747, "epoch": 599} {"train_loss": -19.999963760375977, "global_step": 49748, "epoch": 599} {"train_loss": -19.986373901367188, "global_step": 49749, "epoch": 599} {"train_loss": -19.68027687072754, "global_step": 49750, "epoch": 599} {"train_loss": -20.163829803466797, "global_step": 49751, "epoch": 599} {"train_loss": -19.860441207885742, "global_step": 49752, "epoch": 599} {"train_loss": -19.867231369018555, "global_step": 49753, "epoch": 599} {"train_loss": -19.715700149536133, "global_step": 49754, "epoch": 599} {"train_loss": -19.935155868530273, "global_step": 49755, "epoch": 599} {"train_loss": -20.171663284301758, "global_step": 49756, "epoch": 599} {"train_loss": -19.686691284179688, "global_step": 49757, "epoch": 599} {"train_loss": -19.941442489624023, "global_step": 49758, "epoch": 599} {"train_loss": -19.734434127807617, "global_step": 49759, "epoch": 599} {"train_loss": -19.91695213317871, "global_step": 49760, "epoch": 599} {"train_loss": -19.877132415771484, "global_step": 49761, "epoch": 599} {"train_loss": -20.157556533813477, "global_step": 49762, "epoch": 599} {"train_loss": -20.024770736694336, "global_step": 49763, "epoch": 599} {"train_loss": -20.167341232299805, "global_step": 49764, "epoch": 599} {"train_loss": -20.08655548095703, "global_step": 49765, "epoch": 599} {"train_loss": -19.862096786499023, "global_step": 49766, "epoch": 599} {"train_loss": -19.830350875854492, "global_step": 49767, "epoch": 599} {"train_loss": -19.96322250366211, "global_step": 49768, "epoch": 599} {"train_loss": -20.139169692993164, "global_step": 49769, "epoch": 599} {"train_loss": -19.822986602783203, "global_step": 49770, "epoch": 599} {"train_loss": -19.810091018676758, "global_step": 49771, "epoch": 599} {"train_loss": -19.9168758392334, "global_step": 49772, "epoch": 599} {"train_loss": -19.816511154174805, "global_step": 49773, "epoch": 599} {"train_loss": -20.406599044799805, "global_step": 49774, "epoch": 599} {"train_loss": -20.28527069091797, "global_step": 49775, "epoch": 599} {"train_loss": -20.01078224182129, "global_step": 49776, "epoch": 599} {"train_loss": -19.5939884185791, "global_step": 49777, "epoch": 599} {"train_loss": -19.55841064453125, "global_step": 49778, "epoch": 599} {"train_loss": -19.90675163269043, "global_step": 49779, "epoch": 599} {"train_loss": -20.236669540405273, "global_step": 49780, "epoch": 599} {"train_loss": -20.109331130981445, "global_step": 49781, "epoch": 599} {"train_loss": -20.078397750854492, "global_step": 49782, "epoch": 599} {"train_loss": -19.839488983154297, "global_step": 49783, "epoch": 599} {"train_loss": -20.04629898071289, "global_step": 49784, "epoch": 599} {"train_loss": -19.534414291381836, "global_step": 49785, "epoch": 599} {"train_loss": -19.76112937927246, "global_step": 49786, "epoch": 599} {"train_loss": -19.9116268157959, "global_step": 49787, "epoch": 599} {"train_loss": -19.613561630249023, "global_step": 49788, "epoch": 599} {"train_loss": -19.80525779724121, "global_step": 49789, "epoch": 599} {"train_loss": -19.721702575683594, "global_step": 49790, "epoch": 599} {"train_loss": -19.89739990234375, "global_step": 49791, "epoch": 599} {"train_loss": -20.05409049987793, "global_step": 49792, "epoch": 599} {"train_loss": -20.03130531311035, "global_step": 49793, "epoch": 599} {"train_loss": -19.859556198120117, "global_step": 49794, "epoch": 599} {"train_loss": -19.816776275634766, "global_step": 49795, "epoch": 599} {"train_loss": -19.843585968017578, "global_step": 49796, "epoch": 599} {"train_loss": -19.950551986694336, "global_step": 49797, "epoch": 599} {"train_loss": -20.069522857666016, "global_step": 49798, "epoch": 599} {"train_loss": -19.901132238916603, "global_step": 49799, "epoch": 599, "val_loss": 6168287.0} {"train_loss": -19.73200035095215, "global_step": 49800, "epoch": 600} {"train_loss": -19.665348052978516, "global_step": 49801, "epoch": 600} {"train_loss": -19.729389190673828, "global_step": 49802, "epoch": 600} {"train_loss": -19.699247360229492, "global_step": 49803, "epoch": 600} {"train_loss": -19.456472396850586, "global_step": 49804, "epoch": 600} {"train_loss": -19.779232025146484, "global_step": 49805, "epoch": 600} {"train_loss": -19.37037467956543, "global_step": 49806, "epoch": 600} {"train_loss": -19.998563766479492, "global_step": 49807, "epoch": 600} {"train_loss": -19.912139892578125, "global_step": 49808, "epoch": 600} {"train_loss": -19.776294708251953, "global_step": 49809, "epoch": 600} {"train_loss": -19.600677490234375, "global_step": 49810, "epoch": 600} {"train_loss": -19.508535385131836, "global_step": 49811, "epoch": 600} {"train_loss": -19.5462703704834, "global_step": 49812, "epoch": 600} {"train_loss": -19.77687644958496, "global_step": 49813, "epoch": 600} {"train_loss": -19.982133865356445, "global_step": 49814, "epoch": 600} {"train_loss": -19.766925811767578, "global_step": 49815, "epoch": 600} {"train_loss": -19.948043823242188, "global_step": 49816, "epoch": 600} {"train_loss": -20.029376983642578, "global_step": 49817, "epoch": 600} {"train_loss": -20.079832077026367, "global_step": 49818, "epoch": 600} {"train_loss": -19.083301544189453, "global_step": 49819, "epoch": 600} {"train_loss": -20.028955459594727, "global_step": 49820, "epoch": 600} {"train_loss": -20.02033805847168, "global_step": 49821, "epoch": 600} {"train_loss": -19.662717819213867, "global_step": 49822, "epoch": 600} {"train_loss": -20.105449676513672, "global_step": 49823, "epoch": 600} {"train_loss": -20.066848754882812, "global_step": 49824, "epoch": 600} {"train_loss": -19.914438247680664, "global_step": 49825, "epoch": 600} {"train_loss": -19.92239761352539, "global_step": 49826, "epoch": 600} {"train_loss": -19.83098602294922, "global_step": 49827, "epoch": 600} {"train_loss": -20.058422088623047, "global_step": 49828, "epoch": 600} {"train_loss": -19.564611434936523, "global_step": 49829, "epoch": 600} {"train_loss": -19.98431968688965, "global_step": 49830, "epoch": 600} {"train_loss": -20.016849517822266, "global_step": 49831, "epoch": 600} {"train_loss": -19.669965744018555, "global_step": 49832, "epoch": 600} {"train_loss": -20.07073974609375, "global_step": 49833, "epoch": 600} {"train_loss": -19.765714645385742, "global_step": 49834, "epoch": 600} {"train_loss": -20.035907745361328, "global_step": 49835, "epoch": 600} {"train_loss": -19.534183502197266, "global_step": 49836, "epoch": 600} {"train_loss": -19.872787475585938, "global_step": 49837, "epoch": 600} {"train_loss": -20.005611419677734, "global_step": 49838, "epoch": 600} {"train_loss": -20.239635467529297, "global_step": 49839, "epoch": 600} {"train_loss": -20.002498626708984, "global_step": 49840, "epoch": 600} {"train_loss": -19.65181541442871, "global_step": 49841, "epoch": 600} {"train_loss": -19.91574478149414, "global_step": 49842, "epoch": 600} {"train_loss": -20.003803253173828, "global_step": 49843, "epoch": 600} {"train_loss": -19.78620147705078, "global_step": 49844, "epoch": 600} {"train_loss": -19.94378662109375, "global_step": 49845, "epoch": 600} {"train_loss": -19.950326919555664, "global_step": 49846, "epoch": 600} {"train_loss": -19.90863609313965, "global_step": 49847, "epoch": 600} {"train_loss": -19.814571380615234, "global_step": 49848, "epoch": 600} {"train_loss": -20.375059127807617, "global_step": 49849, "epoch": 600} {"train_loss": -20.078893661499023, "global_step": 49850, "epoch": 600} {"train_loss": -19.83168601989746, "global_step": 49851, "epoch": 600} {"train_loss": -20.252660751342773, "global_step": 49852, "epoch": 600} {"train_loss": -19.873563766479492, "global_step": 49853, "epoch": 600} {"train_loss": -19.6556453704834, "global_step": 49854, "epoch": 600} {"train_loss": -20.138526916503906, "global_step": 49855, "epoch": 600} {"train_loss": -19.638242721557617, "global_step": 49856, "epoch": 600} {"train_loss": -19.55892562866211, "global_step": 49857, "epoch": 600} {"train_loss": -20.220008850097656, "global_step": 49858, "epoch": 600} {"train_loss": -19.962181091308594, "global_step": 49859, "epoch": 600} {"train_loss": -20.18474769592285, "global_step": 49860, "epoch": 600} {"train_loss": -19.677555084228516, "global_step": 49861, "epoch": 600} {"train_loss": -20.07856559753418, "global_step": 49862, "epoch": 600} {"train_loss": -19.624759674072266, "global_step": 49863, "epoch": 600} {"train_loss": -19.961959838867188, "global_step": 49864, "epoch": 600} {"train_loss": -20.194814682006836, "global_step": 49865, "epoch": 600} {"train_loss": -20.118906021118164, "global_step": 49866, "epoch": 600} {"train_loss": -19.75290298461914, "global_step": 49867, "epoch": 600} {"train_loss": -19.833240509033203, "global_step": 49868, "epoch": 600} {"train_loss": -19.97730827331543, "global_step": 49869, "epoch": 600} {"train_loss": -19.861549377441406, "global_step": 49870, "epoch": 600} {"train_loss": -19.84290885925293, "global_step": 49871, "epoch": 600} {"train_loss": -19.972692489624023, "global_step": 49872, "epoch": 600} {"train_loss": -19.97279930114746, "global_step": 49873, "epoch": 600} {"train_loss": -20.04659652709961, "global_step": 49874, "epoch": 600} {"train_loss": -20.021955490112305, "global_step": 49875, "epoch": 600} {"train_loss": -20.135366439819336, "global_step": 49876, "epoch": 600} {"train_loss": -20.13724708557129, "global_step": 49877, "epoch": 600} {"train_loss": -19.911054611206055, "global_step": 49878, "epoch": 600} {"train_loss": -20.099653244018555, "global_step": 49879, "epoch": 600} {"train_loss": -19.588666915893555, "global_step": 49880, "epoch": 600} {"train_loss": -19.913719177246094, "global_step": 49881, "epoch": 600} {"train_loss": -19.87628403629165, "global_step": 49882, "epoch": 600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9545454545454546, "val_loss": 5932380.5} {"train_loss": -19.128448486328125, "global_step": 49883, "epoch": 601} {"train_loss": -19.412960052490234, "global_step": 49884, "epoch": 601} {"train_loss": -19.594924926757812, "global_step": 49885, "epoch": 601} {"train_loss": -19.563989639282227, "global_step": 49886, "epoch": 601} {"train_loss": -19.83440399169922, "global_step": 49887, "epoch": 601} {"train_loss": -19.75655174255371, "global_step": 49888, "epoch": 601} {"train_loss": -19.77460289001465, "global_step": 49889, "epoch": 601} {"train_loss": -19.709257125854492, "global_step": 49890, "epoch": 601} {"train_loss": -19.82744598388672, "global_step": 49891, "epoch": 601} {"train_loss": -19.61958122253418, "global_step": 49892, "epoch": 601} {"train_loss": -19.920818328857422, "global_step": 49893, "epoch": 601} {"train_loss": -19.995473861694336, "global_step": 49894, "epoch": 601} {"train_loss": -19.650989532470703, "global_step": 49895, "epoch": 601} {"train_loss": -19.9779109954834, "global_step": 49896, "epoch": 601} {"train_loss": -19.705032348632812, "global_step": 49897, "epoch": 601} {"train_loss": -19.803722381591797, "global_step": 49898, "epoch": 601} {"train_loss": -19.91254234313965, "global_step": 49899, "epoch": 601} {"train_loss": -19.77070426940918, "global_step": 49900, "epoch": 601} {"train_loss": -19.988632202148438, "global_step": 49901, "epoch": 601} {"train_loss": -19.46893310546875, "global_step": 49902, "epoch": 601} {"train_loss": -19.997037887573242, "global_step": 49903, "epoch": 601} {"train_loss": -19.974849700927734, "global_step": 49904, "epoch": 601} {"train_loss": -19.911144256591797, "global_step": 49905, "epoch": 601} {"train_loss": -19.21628761291504, "global_step": 49906, "epoch": 601} {"train_loss": -20.0942440032959, "global_step": 49907, "epoch": 601} {"train_loss": -19.536706924438477, "global_step": 49908, "epoch": 601} {"train_loss": -19.768224716186523, "global_step": 49909, "epoch": 601} {"train_loss": -19.730396270751953, "global_step": 49910, "epoch": 601} {"train_loss": -19.91243553161621, "global_step": 49911, "epoch": 601} {"train_loss": -19.990854263305664, "global_step": 49912, "epoch": 601} {"train_loss": -19.840423583984375, "global_step": 49913, "epoch": 601} {"train_loss": -19.991863250732422, "global_step": 49914, "epoch": 601} {"train_loss": -20.015106201171875, "global_step": 49915, "epoch": 601} {"train_loss": -19.822376251220703, "global_step": 49916, "epoch": 601} {"train_loss": -20.212432861328125, "global_step": 49917, "epoch": 601} {"train_loss": -20.016563415527344, "global_step": 49918, "epoch": 601} {"train_loss": -20.073631286621094, "global_step": 49919, "epoch": 601} {"train_loss": -19.646957397460938, "global_step": 49920, "epoch": 601} {"train_loss": -20.14450454711914, "global_step": 49921, "epoch": 601} {"train_loss": -20.38361930847168, "global_step": 49922, "epoch": 601} {"train_loss": -20.221515655517578, "global_step": 49923, "epoch": 601} {"train_loss": -19.741043090820312, "global_step": 49924, "epoch": 601} {"train_loss": -19.683059692382812, "global_step": 49925, "epoch": 601} {"train_loss": -20.0899600982666, "global_step": 49926, "epoch": 601} {"train_loss": -20.215248107910156, "global_step": 49927, "epoch": 601} {"train_loss": -19.84730339050293, "global_step": 49928, "epoch": 601} {"train_loss": -19.693267822265625, "global_step": 49929, "epoch": 601} {"train_loss": -20.096891403198242, "global_step": 49930, "epoch": 601} {"train_loss": -20.075925827026367, "global_step": 49931, "epoch": 601} {"train_loss": -19.830121994018555, "global_step": 49932, "epoch": 601} {"train_loss": -20.37071990966797, "global_step": 49933, "epoch": 601} {"train_loss": -19.5017032623291, "global_step": 49934, "epoch": 601} {"train_loss": -19.883955001831055, "global_step": 49935, "epoch": 601} {"train_loss": -20.04366683959961, "global_step": 49936, "epoch": 601} {"train_loss": -20.219268798828125, "global_step": 49937, "epoch": 601} {"train_loss": -19.837919235229492, "global_step": 49938, "epoch": 601} {"train_loss": -19.47981071472168, "global_step": 49939, "epoch": 601} {"train_loss": -19.772581100463867, "global_step": 49940, "epoch": 601} {"train_loss": -19.870908737182617, "global_step": 49941, "epoch": 601} {"train_loss": -20.350629806518555, "global_step": 49942, "epoch": 601} {"train_loss": -20.153518676757812, "global_step": 49943, "epoch": 601} {"train_loss": -20.274662017822266, "global_step": 49944, "epoch": 601} {"train_loss": -19.98192596435547, "global_step": 49945, "epoch": 601} {"train_loss": -19.50297737121582, "global_step": 49946, "epoch": 601} {"train_loss": -19.974384307861328, "global_step": 49947, "epoch": 601} {"train_loss": -19.948091506958008, "global_step": 49948, "epoch": 601} {"train_loss": -19.907682418823242, "global_step": 49949, "epoch": 601} {"train_loss": -19.963043212890625, "global_step": 49950, "epoch": 601} {"train_loss": -19.79094696044922, "global_step": 49951, "epoch": 601} {"train_loss": -19.843400955200195, "global_step": 49952, "epoch": 601} {"train_loss": -19.648069381713867, "global_step": 49953, "epoch": 601} {"train_loss": -19.875730514526367, "global_step": 49954, "epoch": 601} {"train_loss": -19.488819122314453, "global_step": 49955, "epoch": 601} {"train_loss": -20.19329261779785, "global_step": 49956, "epoch": 601} {"train_loss": -19.691003799438477, "global_step": 49957, "epoch": 601} {"train_loss": -20.041690826416016, "global_step": 49958, "epoch": 601} {"train_loss": -20.10820198059082, "global_step": 49959, "epoch": 601} {"train_loss": -20.021041870117188, "global_step": 49960, "epoch": 601} {"train_loss": -20.000728607177734, "global_step": 49961, "epoch": 601} {"train_loss": -19.830703735351562, "global_step": 49962, "epoch": 601} {"train_loss": -19.969995498657227, "global_step": 49963, "epoch": 601} {"train_loss": -20.153898239135742, "global_step": 49964, "epoch": 601} {"train_loss": -19.87868543418057, "global_step": 49965, "epoch": 601, "val_loss": 5975709.5} {"train_loss": -19.0373592376709, "global_step": 49966, "epoch": 602} {"train_loss": -19.339757919311523, "global_step": 49967, "epoch": 602} {"train_loss": -19.267438888549805, "global_step": 49968, "epoch": 602} {"train_loss": -19.15435791015625, "global_step": 49969, "epoch": 602} {"train_loss": -19.904678344726562, "global_step": 49970, "epoch": 602} {"train_loss": -19.225139617919922, "global_step": 49971, "epoch": 602} {"train_loss": -19.4217586517334, "global_step": 49972, "epoch": 602} {"train_loss": -19.73868179321289, "global_step": 49973, "epoch": 602} {"train_loss": -19.594839096069336, "global_step": 49974, "epoch": 602} {"train_loss": -19.449329376220703, "global_step": 49975, "epoch": 602} {"train_loss": -19.59090805053711, "global_step": 49976, "epoch": 602} {"train_loss": -19.663955688476562, "global_step": 49977, "epoch": 602} {"train_loss": -19.50935173034668, "global_step": 49978, "epoch": 602} {"train_loss": -19.721561431884766, "global_step": 49979, "epoch": 602} {"train_loss": -19.78070831298828, "global_step": 49980, "epoch": 602} {"train_loss": -19.512374877929688, "global_step": 49981, "epoch": 602} {"train_loss": -19.66484832763672, "global_step": 49982, "epoch": 602} {"train_loss": -19.491445541381836, "global_step": 49983, "epoch": 602} {"train_loss": -19.745441436767578, "global_step": 49984, "epoch": 602} {"train_loss": -19.84792137145996, "global_step": 49985, "epoch": 602} {"train_loss": -20.098058700561523, "global_step": 49986, "epoch": 602} {"train_loss": -19.486862182617188, "global_step": 49987, "epoch": 602} {"train_loss": -19.783893585205078, "global_step": 49988, "epoch": 602} {"train_loss": -20.14620590209961, "global_step": 49989, "epoch": 602} {"train_loss": -19.80664825439453, "global_step": 49990, "epoch": 602} {"train_loss": -19.690088272094727, "global_step": 49991, "epoch": 602} {"train_loss": -20.06744956970215, "global_step": 49992, "epoch": 602} {"train_loss": -19.7864933013916, "global_step": 49993, "epoch": 602} {"train_loss": -19.86468505859375, "global_step": 49994, "epoch": 602} {"train_loss": -19.59731101989746, "global_step": 49995, "epoch": 602} {"train_loss": -19.7475643157959, "global_step": 49996, "epoch": 602} {"train_loss": -20.12911033630371, "global_step": 49997, "epoch": 602} {"train_loss": -20.030689239501953, "global_step": 49998, "epoch": 602} {"train_loss": -20.1540470123291, "global_step": 49999, "epoch": 602} {"train_loss": -19.970569610595703, "global_step": 50000, "epoch": 602} {"train_loss": -19.584487915039062, "global_step": 50001, "epoch": 602} {"train_loss": -19.96241569519043, "global_step": 50002, "epoch": 602} {"train_loss": -20.185209274291992, "global_step": 50003, "epoch": 602} {"train_loss": -20.058822631835938, "global_step": 50004, "epoch": 602} {"train_loss": -19.758892059326172, "global_step": 50005, "epoch": 602} {"train_loss": -20.377166748046875, "global_step": 50006, "epoch": 602} {"train_loss": -19.926515579223633, "global_step": 50007, "epoch": 602} {"train_loss": -19.63477897644043, "global_step": 50008, "epoch": 602} {"train_loss": -19.898983001708984, "global_step": 50009, "epoch": 602} {"train_loss": -19.94993019104004, "global_step": 50010, "epoch": 602} {"train_loss": -20.048093795776367, "global_step": 50011, "epoch": 602} {"train_loss": -19.6527156829834, "global_step": 50012, "epoch": 602} {"train_loss": -20.22633171081543, "global_step": 50013, "epoch": 602} {"train_loss": -19.936391830444336, "global_step": 50014, "epoch": 602} {"train_loss": -19.707687377929688, "global_step": 50015, "epoch": 602} {"train_loss": -20.164390563964844, "global_step": 50016, "epoch": 602} {"train_loss": -19.68555450439453, "global_step": 50017, "epoch": 602} {"train_loss": -19.751684188842773, "global_step": 50018, "epoch": 602} {"train_loss": -20.126049041748047, "global_step": 50019, "epoch": 602} {"train_loss": -20.036151885986328, "global_step": 50020, "epoch": 602} {"train_loss": -19.983131408691406, "global_step": 50021, "epoch": 602} {"train_loss": -19.774429321289062, "global_step": 50022, "epoch": 602} {"train_loss": -20.16274070739746, "global_step": 50023, "epoch": 602} {"train_loss": -19.55364418029785, "global_step": 50024, "epoch": 602} {"train_loss": -20.255470275878906, "global_step": 50025, "epoch": 602} {"train_loss": -19.91176414489746, "global_step": 50026, "epoch": 602} {"train_loss": -19.991662979125977, "global_step": 50027, "epoch": 602} {"train_loss": -19.938589096069336, "global_step": 50028, "epoch": 602} {"train_loss": -20.094717025756836, "global_step": 50029, "epoch": 602} {"train_loss": -19.83381462097168, "global_step": 50030, "epoch": 602} {"train_loss": -19.945871353149414, "global_step": 50031, "epoch": 602} {"train_loss": -20.313308715820312, "global_step": 50032, "epoch": 602} {"train_loss": -19.96852684020996, "global_step": 50033, "epoch": 602} {"train_loss": -19.63797378540039, "global_step": 50034, "epoch": 602} {"train_loss": -20.116003036499023, "global_step": 50035, "epoch": 602} {"train_loss": -19.941329956054688, "global_step": 50036, "epoch": 602} {"train_loss": -19.895999908447266, "global_step": 50037, "epoch": 602} {"train_loss": -20.17701530456543, "global_step": 50038, "epoch": 602} {"train_loss": -20.065326690673828, "global_step": 50039, "epoch": 602} {"train_loss": -19.941532135009766, "global_step": 50040, "epoch": 602} {"train_loss": -19.698650360107422, "global_step": 50041, "epoch": 602} {"train_loss": -19.41290283203125, "global_step": 50042, "epoch": 602} {"train_loss": -20.20631217956543, "global_step": 50043, "epoch": 602} {"train_loss": -19.869918823242188, "global_step": 50044, "epoch": 602} {"train_loss": -19.935970306396484, "global_step": 50045, "epoch": 602} {"train_loss": -19.782264709472656, "global_step": 50046, "epoch": 602} {"train_loss": -20.07925796508789, "global_step": 50047, "epoch": 602} {"train_loss": -19.824223483901427, "global_step": 50048, "epoch": 602, "val_loss": 5960877.5} {"train_loss": -19.789154052734375, "global_step": 50049, "epoch": 603} {"train_loss": -19.681589126586914, "global_step": 50050, "epoch": 603} {"train_loss": -19.06983757019043, "global_step": 50051, "epoch": 603} {"train_loss": -19.419178009033203, "global_step": 50052, "epoch": 603} {"train_loss": -19.336875915527344, "global_step": 50053, "epoch": 603} {"train_loss": -19.72713279724121, "global_step": 50054, "epoch": 603} {"train_loss": -19.594715118408203, "global_step": 50055, "epoch": 603} {"train_loss": -19.591690063476562, "global_step": 50056, "epoch": 603} {"train_loss": -19.85542106628418, "global_step": 50057, "epoch": 603} {"train_loss": -19.869525909423828, "global_step": 50058, "epoch": 603} {"train_loss": -19.718748092651367, "global_step": 50059, "epoch": 603} {"train_loss": -19.947715759277344, "global_step": 50060, "epoch": 603} {"train_loss": -20.312271118164062, "global_step": 50061, "epoch": 603} {"train_loss": -19.811166763305664, "global_step": 50062, "epoch": 603} {"train_loss": -19.59372329711914, "global_step": 50063, "epoch": 603} {"train_loss": -19.775815963745117, "global_step": 50064, "epoch": 603} {"train_loss": -20.06609535217285, "global_step": 50065, "epoch": 603} {"train_loss": -19.833053588867188, "global_step": 50066, "epoch": 603} {"train_loss": -19.7679386138916, "global_step": 50067, "epoch": 603} {"train_loss": -20.10269546508789, "global_step": 50068, "epoch": 603} {"train_loss": -19.638471603393555, "global_step": 50069, "epoch": 603} {"train_loss": -20.110105514526367, "global_step": 50070, "epoch": 603} {"train_loss": -19.747713088989258, "global_step": 50071, "epoch": 603} {"train_loss": -19.855825424194336, "global_step": 50072, "epoch": 603} {"train_loss": -19.99123191833496, "global_step": 50073, "epoch": 603} {"train_loss": -19.90195655822754, "global_step": 50074, "epoch": 603} {"train_loss": -19.70077896118164, "global_step": 50075, "epoch": 603} {"train_loss": -20.03346824645996, "global_step": 50076, "epoch": 603} {"train_loss": -19.955366134643555, "global_step": 50077, "epoch": 603} {"train_loss": -20.32863426208496, "global_step": 50078, "epoch": 603} {"train_loss": -20.12599754333496, "global_step": 50079, "epoch": 603} {"train_loss": -19.835784912109375, "global_step": 50080, "epoch": 603} {"train_loss": -20.27469253540039, "global_step": 50081, "epoch": 603} {"train_loss": -19.927946090698242, "global_step": 50082, "epoch": 603} {"train_loss": -20.2813663482666, "global_step": 50083, "epoch": 603} {"train_loss": -20.242738723754883, "global_step": 50084, "epoch": 603} {"train_loss": -20.103309631347656, "global_step": 50085, "epoch": 603} {"train_loss": -20.10285758972168, "global_step": 50086, "epoch": 603} {"train_loss": -20.02815818786621, "global_step": 50087, "epoch": 603} {"train_loss": -19.908044815063477, "global_step": 50088, "epoch": 603} {"train_loss": -20.02897834777832, "global_step": 50089, "epoch": 603} {"train_loss": -20.102550506591797, "global_step": 50090, "epoch": 603} {"train_loss": -19.97438621520996, "global_step": 50091, "epoch": 603} {"train_loss": -19.9461669921875, "global_step": 50092, "epoch": 603} {"train_loss": -19.98206901550293, "global_step": 50093, "epoch": 603} {"train_loss": -19.68838882446289, "global_step": 50094, "epoch": 603} {"train_loss": -20.28779411315918, "global_step": 50095, "epoch": 603} {"train_loss": -19.828344345092773, "global_step": 50096, "epoch": 603} {"train_loss": -20.26409912109375, "global_step": 50097, "epoch": 603} {"train_loss": -20.153738021850586, "global_step": 50098, "epoch": 603} {"train_loss": -20.07732582092285, "global_step": 50099, "epoch": 603} {"train_loss": -20.145597457885742, "global_step": 50100, "epoch": 603} {"train_loss": -20.03684425354004, "global_step": 50101, "epoch": 603} {"train_loss": -19.990842819213867, "global_step": 50102, "epoch": 603} {"train_loss": -19.941925048828125, "global_step": 50103, "epoch": 603} {"train_loss": -20.208084106445312, "global_step": 50104, "epoch": 603} {"train_loss": -20.118667602539062, "global_step": 50105, "epoch": 603} {"train_loss": -19.743967056274414, "global_step": 50106, "epoch": 603} {"train_loss": -19.91517448425293, "global_step": 50107, "epoch": 603} {"train_loss": -19.872711181640625, "global_step": 50108, "epoch": 603} {"train_loss": -19.7180233001709, "global_step": 50109, "epoch": 603} {"train_loss": -19.52499771118164, "global_step": 50110, "epoch": 603} {"train_loss": -19.51023292541504, "global_step": 50111, "epoch": 603} {"train_loss": -19.615015029907227, "global_step": 50112, "epoch": 603} {"train_loss": -19.741891860961914, "global_step": 50113, "epoch": 603} {"train_loss": -20.33196449279785, "global_step": 50114, "epoch": 603} {"train_loss": -20.159278869628906, "global_step": 50115, "epoch": 603} {"train_loss": -19.96649169921875, "global_step": 50116, "epoch": 603} {"train_loss": -20.115476608276367, "global_step": 50117, "epoch": 603} {"train_loss": -19.93575668334961, "global_step": 50118, "epoch": 603} {"train_loss": -19.964170455932617, "global_step": 50119, "epoch": 603} {"train_loss": -20.175411224365234, "global_step": 50120, "epoch": 603} {"train_loss": -20.266000747680664, "global_step": 50121, "epoch": 603} {"train_loss": -19.995786666870117, "global_step": 50122, "epoch": 603} {"train_loss": -19.915178298950195, "global_step": 50123, "epoch": 603} {"train_loss": -20.048490524291992, "global_step": 50124, "epoch": 603} {"train_loss": -19.83110237121582, "global_step": 50125, "epoch": 603} {"train_loss": -20.07622718811035, "global_step": 50126, "epoch": 603} {"train_loss": -19.98573875427246, "global_step": 50127, "epoch": 603} {"train_loss": -19.89630699157715, "global_step": 50128, "epoch": 603} {"train_loss": -20.17732048034668, "global_step": 50129, "epoch": 603} {"train_loss": -20.167478561401367, "global_step": 50130, "epoch": 603} {"train_loss": -19.93826015886054, "global_step": 50131, "epoch": 603, "val_loss": 6083363.0} {"train_loss": -19.619155883789062, "global_step": 50132, "epoch": 604} {"train_loss": -20.174060821533203, "global_step": 50133, "epoch": 604} {"train_loss": -19.795637130737305, "global_step": 50134, "epoch": 604} {"train_loss": -19.441396713256836, "global_step": 50135, "epoch": 604} {"train_loss": -19.832990646362305, "global_step": 50136, "epoch": 604} {"train_loss": -19.7675838470459, "global_step": 50137, "epoch": 604} {"train_loss": -19.961912155151367, "global_step": 50138, "epoch": 604} {"train_loss": -19.906753540039062, "global_step": 50139, "epoch": 604} {"train_loss": -20.021642684936523, "global_step": 50140, "epoch": 604} {"train_loss": -19.875852584838867, "global_step": 50141, "epoch": 604} {"train_loss": -19.917329788208008, "global_step": 50142, "epoch": 604} {"train_loss": -19.957632064819336, "global_step": 50143, "epoch": 604} {"train_loss": -19.942310333251953, "global_step": 50144, "epoch": 604} {"train_loss": -19.86038589477539, "global_step": 50145, "epoch": 604} {"train_loss": -19.502277374267578, "global_step": 50146, "epoch": 604} {"train_loss": -20.06839942932129, "global_step": 50147, "epoch": 604} {"train_loss": -20.16704750061035, "global_step": 50148, "epoch": 604} {"train_loss": -19.3328914642334, "global_step": 50149, "epoch": 604} {"train_loss": -20.235788345336914, "global_step": 50150, "epoch": 604} {"train_loss": -19.89266014099121, "global_step": 50151, "epoch": 604} {"train_loss": -20.140653610229492, "global_step": 50152, "epoch": 604} {"train_loss": -19.71990966796875, "global_step": 50153, "epoch": 604} {"train_loss": -19.545211791992188, "global_step": 50154, "epoch": 604} {"train_loss": -19.72989273071289, "global_step": 50155, "epoch": 604} {"train_loss": -19.984350204467773, "global_step": 50156, "epoch": 604} {"train_loss": -19.777685165405273, "global_step": 50157, "epoch": 604} {"train_loss": -19.97185516357422, "global_step": 50158, "epoch": 604} {"train_loss": -20.160024642944336, "global_step": 50159, "epoch": 604} {"train_loss": -20.17011070251465, "global_step": 50160, "epoch": 604} {"train_loss": -19.945655822753906, "global_step": 50161, "epoch": 604} {"train_loss": -19.92214012145996, "global_step": 50162, "epoch": 604} {"train_loss": -20.135244369506836, "global_step": 50163, "epoch": 604} {"train_loss": -19.964357376098633, "global_step": 50164, "epoch": 604} {"train_loss": -20.11862564086914, "global_step": 50165, "epoch": 604} {"train_loss": -20.094032287597656, "global_step": 50166, "epoch": 604} {"train_loss": -20.299875259399414, "global_step": 50167, "epoch": 604} {"train_loss": -20.10403060913086, "global_step": 50168, "epoch": 604} {"train_loss": -20.227460861206055, "global_step": 50169, "epoch": 604} {"train_loss": -20.07708740234375, "global_step": 50170, "epoch": 604} {"train_loss": -19.793827056884766, "global_step": 50171, "epoch": 604} {"train_loss": -19.826444625854492, "global_step": 50172, "epoch": 604} {"train_loss": -19.99329948425293, "global_step": 50173, "epoch": 604} {"train_loss": -19.9263858795166, "global_step": 50174, "epoch": 604} {"train_loss": -19.553482055664062, "global_step": 50175, "epoch": 604} {"train_loss": -19.60828971862793, "global_step": 50176, "epoch": 604} {"train_loss": -19.943960189819336, "global_step": 50177, "epoch": 604} {"train_loss": -19.91343879699707, "global_step": 50178, "epoch": 604} {"train_loss": -19.744308471679688, "global_step": 50179, "epoch": 604} {"train_loss": -20.207157135009766, "global_step": 50180, "epoch": 604} {"train_loss": -20.087398529052734, "global_step": 50181, "epoch": 604} {"train_loss": -20.27497673034668, "global_step": 50182, "epoch": 604} {"train_loss": -20.208547592163086, "global_step": 50183, "epoch": 604} {"train_loss": -20.09151268005371, "global_step": 50184, "epoch": 604} {"train_loss": -19.803958892822266, "global_step": 50185, "epoch": 604} {"train_loss": -20.024089813232422, "global_step": 50186, "epoch": 604} {"train_loss": -19.908933639526367, "global_step": 50187, "epoch": 604} {"train_loss": -19.75682830810547, "global_step": 50188, "epoch": 604} {"train_loss": -20.03474235534668, "global_step": 50189, "epoch": 604} {"train_loss": -20.238908767700195, "global_step": 50190, "epoch": 604} {"train_loss": -20.456218719482422, "global_step": 50191, "epoch": 604} {"train_loss": -19.58796501159668, "global_step": 50192, "epoch": 604} {"train_loss": -19.851362228393555, "global_step": 50193, "epoch": 604} {"train_loss": -19.914962768554688, "global_step": 50194, "epoch": 604} {"train_loss": -20.111616134643555, "global_step": 50195, "epoch": 604} {"train_loss": -20.0094051361084, "global_step": 50196, "epoch": 604} {"train_loss": -19.936359405517578, "global_step": 50197, "epoch": 604} {"train_loss": -19.865379333496094, "global_step": 50198, "epoch": 604} {"train_loss": -20.38231086730957, "global_step": 50199, "epoch": 604} {"train_loss": -20.178770065307617, "global_step": 50200, "epoch": 604} {"train_loss": -19.97920799255371, "global_step": 50201, "epoch": 604} {"train_loss": -20.407560348510742, "global_step": 50202, "epoch": 604} {"train_loss": -19.607315063476562, "global_step": 50203, "epoch": 604} {"train_loss": -19.98319435119629, "global_step": 50204, "epoch": 604} {"train_loss": -20.119802474975586, "global_step": 50205, "epoch": 604} {"train_loss": -20.20755386352539, "global_step": 50206, "epoch": 604} {"train_loss": -19.94814682006836, "global_step": 50207, "epoch": 604} {"train_loss": -19.429187774658203, "global_step": 50208, "epoch": 604} {"train_loss": -20.180028915405273, "global_step": 50209, "epoch": 604} {"train_loss": -19.89573097229004, "global_step": 50210, "epoch": 604} {"train_loss": -19.917194366455078, "global_step": 50211, "epoch": 604} {"train_loss": -19.580509185791016, "global_step": 50212, "epoch": 604} {"train_loss": -20.10042381286621, "global_step": 50213, "epoch": 604} {"train_loss": -19.96530130685094, "global_step": 50214, "epoch": 604, "val_loss": 6201528.5} {"train_loss": -18.496273040771484, "global_step": 50215, "epoch": 605} {"train_loss": -19.098112106323242, "global_step": 50216, "epoch": 605} {"train_loss": -19.281024932861328, "global_step": 50217, "epoch": 605} {"train_loss": -19.12371253967285, "global_step": 50218, "epoch": 605} {"train_loss": -19.144407272338867, "global_step": 50219, "epoch": 605} {"train_loss": -19.687559127807617, "global_step": 50220, "epoch": 605} {"train_loss": -19.52288818359375, "global_step": 50221, "epoch": 605} {"train_loss": -19.377479553222656, "global_step": 50222, "epoch": 605} {"train_loss": -19.95915985107422, "global_step": 50223, "epoch": 605} {"train_loss": -19.819793701171875, "global_step": 50224, "epoch": 605} {"train_loss": -19.60967254638672, "global_step": 50225, "epoch": 605} {"train_loss": -19.436859130859375, "global_step": 50226, "epoch": 605} {"train_loss": -19.68158531188965, "global_step": 50227, "epoch": 605} {"train_loss": -19.477811813354492, "global_step": 50228, "epoch": 605} {"train_loss": -19.835065841674805, "global_step": 50229, "epoch": 605} {"train_loss": -19.952383041381836, "global_step": 50230, "epoch": 605} {"train_loss": -19.755239486694336, "global_step": 50231, "epoch": 605} {"train_loss": -19.751976013183594, "global_step": 50232, "epoch": 605} {"train_loss": -20.242740631103516, "global_step": 50233, "epoch": 605} {"train_loss": -19.830078125, "global_step": 50234, "epoch": 605} {"train_loss": -19.74556541442871, "global_step": 50235, "epoch": 605} {"train_loss": -20.143875122070312, "global_step": 50236, "epoch": 605} {"train_loss": -20.09783363342285, "global_step": 50237, "epoch": 605} {"train_loss": -19.926416397094727, "global_step": 50238, "epoch": 605} {"train_loss": -20.003036499023438, "global_step": 50239, "epoch": 605} {"train_loss": -20.212127685546875, "global_step": 50240, "epoch": 605} {"train_loss": -19.867597579956055, "global_step": 50241, "epoch": 605} {"train_loss": -19.726240158081055, "global_step": 50242, "epoch": 605} {"train_loss": -20.279890060424805, "global_step": 50243, "epoch": 605} {"train_loss": -19.765317916870117, "global_step": 50244, "epoch": 605} {"train_loss": -19.885805130004883, "global_step": 50245, "epoch": 605} {"train_loss": -20.177377700805664, "global_step": 50246, "epoch": 605} {"train_loss": -19.721933364868164, "global_step": 50247, "epoch": 605} {"train_loss": -19.75064468383789, "global_step": 50248, "epoch": 605} {"train_loss": -19.787153244018555, "global_step": 50249, "epoch": 605} {"train_loss": -20.275972366333008, "global_step": 50250, "epoch": 605} {"train_loss": -20.149765014648438, "global_step": 50251, "epoch": 605} {"train_loss": -19.996549606323242, "global_step": 50252, "epoch": 605} {"train_loss": -19.974042892456055, "global_step": 50253, "epoch": 605} {"train_loss": -19.892433166503906, "global_step": 50254, "epoch": 605} {"train_loss": -19.986377716064453, "global_step": 50255, "epoch": 605} {"train_loss": -20.031208038330078, "global_step": 50256, "epoch": 605} {"train_loss": -19.695573806762695, "global_step": 50257, "epoch": 605} {"train_loss": -20.036466598510742, "global_step": 50258, "epoch": 605} {"train_loss": -19.828550338745117, "global_step": 50259, "epoch": 605} {"train_loss": -19.777029037475586, "global_step": 50260, "epoch": 605} {"train_loss": -19.815078735351562, "global_step": 50261, "epoch": 605} {"train_loss": -19.99280548095703, "global_step": 50262, "epoch": 605} {"train_loss": -19.870237350463867, "global_step": 50263, "epoch": 605} {"train_loss": -19.89951515197754, "global_step": 50264, "epoch": 605} {"train_loss": -20.27754783630371, "global_step": 50265, "epoch": 605} {"train_loss": -19.7748966217041, "global_step": 50266, "epoch": 605} {"train_loss": -19.9902400970459, "global_step": 50267, "epoch": 605} {"train_loss": -20.021728515625, "global_step": 50268, "epoch": 605} {"train_loss": -20.016891479492188, "global_step": 50269, "epoch": 605} {"train_loss": -19.6231746673584, "global_step": 50270, "epoch": 605} {"train_loss": -19.75619888305664, "global_step": 50271, "epoch": 605} {"train_loss": -20.106409072875977, "global_step": 50272, "epoch": 605} {"train_loss": -19.86078453063965, "global_step": 50273, "epoch": 605} {"train_loss": -19.712697982788086, "global_step": 50274, "epoch": 605} {"train_loss": -19.754131317138672, "global_step": 50275, "epoch": 605} {"train_loss": -19.890092849731445, "global_step": 50276, "epoch": 605} {"train_loss": -20.05735969543457, "global_step": 50277, "epoch": 605} {"train_loss": -19.952138900756836, "global_step": 50278, "epoch": 605} {"train_loss": -19.72479820251465, "global_step": 50279, "epoch": 605} {"train_loss": -20.065088272094727, "global_step": 50280, "epoch": 605} {"train_loss": -20.31532859802246, "global_step": 50281, "epoch": 605} {"train_loss": -19.728734970092773, "global_step": 50282, "epoch": 605} {"train_loss": -19.887893676757812, "global_step": 50283, "epoch": 605} {"train_loss": -19.589698791503906, "global_step": 50284, "epoch": 605} {"train_loss": -19.916852951049805, "global_step": 50285, "epoch": 605} {"train_loss": -20.296045303344727, "global_step": 50286, "epoch": 605} {"train_loss": -20.14902114868164, "global_step": 50287, "epoch": 605} {"train_loss": -20.0012264251709, "global_step": 50288, "epoch": 605} {"train_loss": -20.02512550354004, "global_step": 50289, "epoch": 605} {"train_loss": -19.757587432861328, "global_step": 50290, "epoch": 605} {"train_loss": -19.56090545654297, "global_step": 50291, "epoch": 605} {"train_loss": -20.19135856628418, "global_step": 50292, "epoch": 605} {"train_loss": -20.122365951538086, "global_step": 50293, "epoch": 605} {"train_loss": -20.372465133666992, "global_step": 50294, "epoch": 605} {"train_loss": -19.83112144470215, "global_step": 50295, "epoch": 605} {"train_loss": -19.586488723754883, "global_step": 50296, "epoch": 605} {"train_loss": -19.860634861222234, "global_step": 50297, "epoch": 605, "val_loss": 6179924.5} {"train_loss": -19.523513793945312, "global_step": 50298, "epoch": 606} {"train_loss": -19.070131301879883, "global_step": 50299, "epoch": 606} {"train_loss": -19.658628463745117, "global_step": 50300, "epoch": 606} {"train_loss": -19.783294677734375, "global_step": 50301, "epoch": 606} {"train_loss": -20.0065860748291, "global_step": 50302, "epoch": 606} {"train_loss": -19.32394027709961, "global_step": 50303, "epoch": 606} {"train_loss": -20.003292083740234, "global_step": 50304, "epoch": 606} {"train_loss": -19.46780776977539, "global_step": 50305, "epoch": 606} {"train_loss": -20.31299591064453, "global_step": 50306, "epoch": 606} {"train_loss": -19.487154006958008, "global_step": 50307, "epoch": 606} {"train_loss": -19.31760597229004, "global_step": 50308, "epoch": 606} {"train_loss": -20.00600242614746, "global_step": 50309, "epoch": 606} {"train_loss": -19.798460006713867, "global_step": 50310, "epoch": 606} {"train_loss": -19.9292049407959, "global_step": 50311, "epoch": 606} {"train_loss": -19.9349422454834, "global_step": 50312, "epoch": 606} {"train_loss": -20.271072387695312, "global_step": 50313, "epoch": 606} {"train_loss": -19.60187339782715, "global_step": 50314, "epoch": 606} {"train_loss": -20.013402938842773, "global_step": 50315, "epoch": 606} {"train_loss": -20.06186294555664, "global_step": 50316, "epoch": 606} {"train_loss": -19.520261764526367, "global_step": 50317, "epoch": 606} {"train_loss": -19.599435806274414, "global_step": 50318, "epoch": 606} {"train_loss": -19.74887466430664, "global_step": 50319, "epoch": 606} {"train_loss": -19.896757125854492, "global_step": 50320, "epoch": 606} {"train_loss": -20.184803009033203, "global_step": 50321, "epoch": 606} {"train_loss": -19.57326316833496, "global_step": 50322, "epoch": 606} {"train_loss": -20.02654266357422, "global_step": 50323, "epoch": 606} {"train_loss": -19.81160545349121, "global_step": 50324, "epoch": 606} {"train_loss": -20.301822662353516, "global_step": 50325, "epoch": 606} {"train_loss": -19.955657958984375, "global_step": 50326, "epoch": 606} {"train_loss": -19.904123306274414, "global_step": 50327, "epoch": 606} {"train_loss": -19.57868003845215, "global_step": 50328, "epoch": 606} {"train_loss": -19.964393615722656, "global_step": 50329, "epoch": 606} {"train_loss": -20.002729415893555, "global_step": 50330, "epoch": 606} {"train_loss": -19.78589630126953, "global_step": 50331, "epoch": 606} {"train_loss": -19.956159591674805, "global_step": 50332, "epoch": 606} {"train_loss": -19.890390396118164, "global_step": 50333, "epoch": 606} {"train_loss": -19.938034057617188, "global_step": 50334, "epoch": 606} {"train_loss": -19.65771484375, "global_step": 50335, "epoch": 606} {"train_loss": -19.986717224121094, "global_step": 50336, "epoch": 606} {"train_loss": -19.619298934936523, "global_step": 50337, "epoch": 606} {"train_loss": -20.224742889404297, "global_step": 50338, "epoch": 606} {"train_loss": -20.179567337036133, "global_step": 50339, "epoch": 606} {"train_loss": -19.66370964050293, "global_step": 50340, "epoch": 606} {"train_loss": -20.141712188720703, "global_step": 50341, "epoch": 606} {"train_loss": -19.905607223510742, "global_step": 50342, "epoch": 606} {"train_loss": -20.085737228393555, "global_step": 50343, "epoch": 606} {"train_loss": -20.25148582458496, "global_step": 50344, "epoch": 606} {"train_loss": -20.133420944213867, "global_step": 50345, "epoch": 606} {"train_loss": -20.06807518005371, "global_step": 50346, "epoch": 606} {"train_loss": -19.98509407043457, "global_step": 50347, "epoch": 606} {"train_loss": -20.099695205688477, "global_step": 50348, "epoch": 606} {"train_loss": -19.83051300048828, "global_step": 50349, "epoch": 606} {"train_loss": -19.81720542907715, "global_step": 50350, "epoch": 606} {"train_loss": -19.873798370361328, "global_step": 50351, "epoch": 606} {"train_loss": -19.9388370513916, "global_step": 50352, "epoch": 606} {"train_loss": -19.93024253845215, "global_step": 50353, "epoch": 606} {"train_loss": -19.915742874145508, "global_step": 50354, "epoch": 606} {"train_loss": -19.934961318969727, "global_step": 50355, "epoch": 606} {"train_loss": -19.99203109741211, "global_step": 50356, "epoch": 606} {"train_loss": -19.886672973632812, "global_step": 50357, "epoch": 606} {"train_loss": -19.565784454345703, "global_step": 50358, "epoch": 606} {"train_loss": -20.345979690551758, "global_step": 50359, "epoch": 606} {"train_loss": -19.8245906829834, "global_step": 50360, "epoch": 606} {"train_loss": -19.951093673706055, "global_step": 50361, "epoch": 606} {"train_loss": -20.127851486206055, "global_step": 50362, "epoch": 606} {"train_loss": -20.04005241394043, "global_step": 50363, "epoch": 606} {"train_loss": -19.90896987915039, "global_step": 50364, "epoch": 606} {"train_loss": -19.58659553527832, "global_step": 50365, "epoch": 606} {"train_loss": -20.047264099121094, "global_step": 50366, "epoch": 606} {"train_loss": -20.186471939086914, "global_step": 50367, "epoch": 606} {"train_loss": -19.612350463867188, "global_step": 50368, "epoch": 606} {"train_loss": -19.80390739440918, "global_step": 50369, "epoch": 606} {"train_loss": -19.96216583251953, "global_step": 50370, "epoch": 606} {"train_loss": -19.965877532958984, "global_step": 50371, "epoch": 606} {"train_loss": -19.80609893798828, "global_step": 50372, "epoch": 606} {"train_loss": -20.124204635620117, "global_step": 50373, "epoch": 606} {"train_loss": -19.950443267822266, "global_step": 50374, "epoch": 606} {"train_loss": -20.02138900756836, "global_step": 50375, "epoch": 606} {"train_loss": -20.35263442993164, "global_step": 50376, "epoch": 606} {"train_loss": -20.40424919128418, "global_step": 50377, "epoch": 606} {"train_loss": -20.000646591186523, "global_step": 50378, "epoch": 606} {"train_loss": -20.05228042602539, "global_step": 50379, "epoch": 606} {"train_loss": -19.90639757822795, "global_step": 50380, "epoch": 606, "val_loss": 6025019.5} {"train_loss": -19.431324005126953, "global_step": 50381, "epoch": 607} {"train_loss": -19.81705665588379, "global_step": 50382, "epoch": 607} {"train_loss": -19.940122604370117, "global_step": 50383, "epoch": 607} {"train_loss": -19.867023468017578, "global_step": 50384, "epoch": 607} {"train_loss": -19.768238067626953, "global_step": 50385, "epoch": 607} {"train_loss": -19.85306167602539, "global_step": 50386, "epoch": 607} {"train_loss": -20.32181739807129, "global_step": 50387, "epoch": 607} {"train_loss": -19.861051559448242, "global_step": 50388, "epoch": 607} {"train_loss": -19.947118759155273, "global_step": 50389, "epoch": 607} {"train_loss": -19.565555572509766, "global_step": 50390, "epoch": 607} {"train_loss": -19.889596939086914, "global_step": 50391, "epoch": 607} {"train_loss": -19.55731773376465, "global_step": 50392, "epoch": 607} {"train_loss": -19.856689453125, "global_step": 50393, "epoch": 607} {"train_loss": -20.25339698791504, "global_step": 50394, "epoch": 607} {"train_loss": -19.934782028198242, "global_step": 50395, "epoch": 607} {"train_loss": -19.876724243164062, "global_step": 50396, "epoch": 607} {"train_loss": -19.98723602294922, "global_step": 50397, "epoch": 607} {"train_loss": -20.02301597595215, "global_step": 50398, "epoch": 607} {"train_loss": -19.4696044921875, "global_step": 50399, "epoch": 607} {"train_loss": -19.86639976501465, "global_step": 50400, "epoch": 607} {"train_loss": -20.05838966369629, "global_step": 50401, "epoch": 607} {"train_loss": -19.91837501525879, "global_step": 50402, "epoch": 607} {"train_loss": -19.805002212524414, "global_step": 50403, "epoch": 607} {"train_loss": -20.01392936706543, "global_step": 50404, "epoch": 607} {"train_loss": -19.864294052124023, "global_step": 50405, "epoch": 607} {"train_loss": -20.106260299682617, "global_step": 50406, "epoch": 607} {"train_loss": -19.65393829345703, "global_step": 50407, "epoch": 607} {"train_loss": -20.031558990478516, "global_step": 50408, "epoch": 607} {"train_loss": -20.017379760742188, "global_step": 50409, "epoch": 607} {"train_loss": -19.84418296813965, "global_step": 50410, "epoch": 607} {"train_loss": -19.953794479370117, "global_step": 50411, "epoch": 607} {"train_loss": -20.222803115844727, "global_step": 50412, "epoch": 607} {"train_loss": -20.085363388061523, "global_step": 50413, "epoch": 607} {"train_loss": -20.097732543945312, "global_step": 50414, "epoch": 607} {"train_loss": -19.5860652923584, "global_step": 50415, "epoch": 607} {"train_loss": -19.85474395751953, "global_step": 50416, "epoch": 607} {"train_loss": -20.049163818359375, "global_step": 50417, "epoch": 607} {"train_loss": -20.072614669799805, "global_step": 50418, "epoch": 607} {"train_loss": -20.057233810424805, "global_step": 50419, "epoch": 607} {"train_loss": -20.40563201904297, "global_step": 50420, "epoch": 607} {"train_loss": -19.814258575439453, "global_step": 50421, "epoch": 607} {"train_loss": -19.875547409057617, "global_step": 50422, "epoch": 607} {"train_loss": -20.017478942871094, "global_step": 50423, "epoch": 607} {"train_loss": -19.958356857299805, "global_step": 50424, "epoch": 607} {"train_loss": -19.990474700927734, "global_step": 50425, "epoch": 607} {"train_loss": -19.9564151763916, "global_step": 50426, "epoch": 607} {"train_loss": -20.126388549804688, "global_step": 50427, "epoch": 607} {"train_loss": -19.673206329345703, "global_step": 50428, "epoch": 607} {"train_loss": -20.238040924072266, "global_step": 50429, "epoch": 607} {"train_loss": -20.037567138671875, "global_step": 50430, "epoch": 607} {"train_loss": -20.036306381225586, "global_step": 50431, "epoch": 607} {"train_loss": -20.006362915039062, "global_step": 50432, "epoch": 607} {"train_loss": -20.230833053588867, "global_step": 50433, "epoch": 607} {"train_loss": -19.665891647338867, "global_step": 50434, "epoch": 607} {"train_loss": -19.776432037353516, "global_step": 50435, "epoch": 607} {"train_loss": -19.591773986816406, "global_step": 50436, "epoch": 607} {"train_loss": -19.93442726135254, "global_step": 50437, "epoch": 607} {"train_loss": -20.176345825195312, "global_step": 50438, "epoch": 607} {"train_loss": -19.888639450073242, "global_step": 50439, "epoch": 607} {"train_loss": -20.3509521484375, "global_step": 50440, "epoch": 607} {"train_loss": -19.971052169799805, "global_step": 50441, "epoch": 607} {"train_loss": -19.63883399963379, "global_step": 50442, "epoch": 607} {"train_loss": -19.734272003173828, "global_step": 50443, "epoch": 607} {"train_loss": -20.024778366088867, "global_step": 50444, "epoch": 607} {"train_loss": -20.148208618164062, "global_step": 50445, "epoch": 607} {"train_loss": -19.53069496154785, "global_step": 50446, "epoch": 607} {"train_loss": -19.99625587463379, "global_step": 50447, "epoch": 607} {"train_loss": -19.793115615844727, "global_step": 50448, "epoch": 607} {"train_loss": -20.027997970581055, "global_step": 50449, "epoch": 607} {"train_loss": -19.83717918395996, "global_step": 50450, "epoch": 607} {"train_loss": -20.200897216796875, "global_step": 50451, "epoch": 607} {"train_loss": -20.29658317565918, "global_step": 50452, "epoch": 607} {"train_loss": -20.420528411865234, "global_step": 50453, "epoch": 607} {"train_loss": -19.858182907104492, "global_step": 50454, "epoch": 607} {"train_loss": -20.010168075561523, "global_step": 50455, "epoch": 607} {"train_loss": -19.799001693725586, "global_step": 50456, "epoch": 607} {"train_loss": -20.205270767211914, "global_step": 50457, "epoch": 607} {"train_loss": -20.1444091796875, "global_step": 50458, "epoch": 607} {"train_loss": -19.65940284729004, "global_step": 50459, "epoch": 607} {"train_loss": -19.76824378967285, "global_step": 50460, "epoch": 607} {"train_loss": -19.475343704223633, "global_step": 50461, "epoch": 607} {"train_loss": -20.117416381835938, "global_step": 50462, "epoch": 607} {"train_loss": -19.945893207228327, "global_step": 50463, "epoch": 607, "val_loss": 5920907.5} {"train_loss": -19.402708053588867, "global_step": 50464, "epoch": 608} {"train_loss": -19.921283721923828, "global_step": 50465, "epoch": 608} {"train_loss": -19.83931541442871, "global_step": 50466, "epoch": 608} {"train_loss": -19.76264190673828, "global_step": 50467, "epoch": 608} {"train_loss": -19.664411544799805, "global_step": 50468, "epoch": 608} {"train_loss": -20.02814292907715, "global_step": 50469, "epoch": 608} {"train_loss": -19.651891708374023, "global_step": 50470, "epoch": 608} {"train_loss": -19.637292861938477, "global_step": 50471, "epoch": 608} {"train_loss": -19.875417709350586, "global_step": 50472, "epoch": 608} {"train_loss": -19.560976028442383, "global_step": 50473, "epoch": 608} {"train_loss": -19.698362350463867, "global_step": 50474, "epoch": 608} {"train_loss": -19.747220993041992, "global_step": 50475, "epoch": 608} {"train_loss": -19.892696380615234, "global_step": 50476, "epoch": 608} {"train_loss": -19.86878204345703, "global_step": 50477, "epoch": 608} {"train_loss": -20.257038116455078, "global_step": 50478, "epoch": 608} {"train_loss": -19.813718795776367, "global_step": 50479, "epoch": 608} {"train_loss": -19.941770553588867, "global_step": 50480, "epoch": 608} {"train_loss": -19.543350219726562, "global_step": 50481, "epoch": 608} {"train_loss": -19.903684616088867, "global_step": 50482, "epoch": 608} {"train_loss": -19.73495864868164, "global_step": 50483, "epoch": 608} {"train_loss": -19.963594436645508, "global_step": 50484, "epoch": 608} {"train_loss": -19.72429084777832, "global_step": 50485, "epoch": 608} {"train_loss": -19.566320419311523, "global_step": 50486, "epoch": 608} {"train_loss": -19.947240829467773, "global_step": 50487, "epoch": 608} {"train_loss": -19.847585678100586, "global_step": 50488, "epoch": 608} {"train_loss": -20.426992416381836, "global_step": 50489, "epoch": 608} {"train_loss": -20.030080795288086, "global_step": 50490, "epoch": 608} {"train_loss": -20.013395309448242, "global_step": 50491, "epoch": 608} {"train_loss": -20.042890548706055, "global_step": 50492, "epoch": 608} {"train_loss": -20.056467056274414, "global_step": 50493, "epoch": 608} {"train_loss": -20.083078384399414, "global_step": 50494, "epoch": 608} {"train_loss": -20.187549591064453, "global_step": 50495, "epoch": 608} {"train_loss": -20.105037689208984, "global_step": 50496, "epoch": 608} {"train_loss": -20.077451705932617, "global_step": 50497, "epoch": 608} {"train_loss": -19.928319931030273, "global_step": 50498, "epoch": 608} {"train_loss": -19.900136947631836, "global_step": 50499, "epoch": 608} {"train_loss": -19.965269088745117, "global_step": 50500, "epoch": 608} {"train_loss": -19.746692657470703, "global_step": 50501, "epoch": 608} {"train_loss": -20.046850204467773, "global_step": 50502, "epoch": 608} {"train_loss": -20.480932235717773, "global_step": 50503, "epoch": 608} {"train_loss": -19.716657638549805, "global_step": 50504, "epoch": 608} {"train_loss": -20.08795166015625, "global_step": 50505, "epoch": 608} {"train_loss": -19.993858337402344, "global_step": 50506, "epoch": 608} {"train_loss": -19.897035598754883, "global_step": 50507, "epoch": 608} {"train_loss": -19.71600914001465, "global_step": 50508, "epoch": 608} {"train_loss": -20.539752960205078, "global_step": 50509, "epoch": 608} {"train_loss": -19.84443473815918, "global_step": 50510, "epoch": 608} {"train_loss": -19.880544662475586, "global_step": 50511, "epoch": 608} {"train_loss": -19.76211929321289, "global_step": 50512, "epoch": 608} {"train_loss": -20.040237426757812, "global_step": 50513, "epoch": 608} {"train_loss": -19.956342697143555, "global_step": 50514, "epoch": 608} {"train_loss": -19.983503341674805, "global_step": 50515, "epoch": 608} {"train_loss": -20.335355758666992, "global_step": 50516, "epoch": 608} {"train_loss": -20.190671920776367, "global_step": 50517, "epoch": 608} {"train_loss": -20.06806755065918, "global_step": 50518, "epoch": 608} {"train_loss": -20.247116088867188, "global_step": 50519, "epoch": 608} {"train_loss": -19.877567291259766, "global_step": 50520, "epoch": 608} {"train_loss": -19.862951278686523, "global_step": 50521, "epoch": 608} {"train_loss": -20.209823608398438, "global_step": 50522, "epoch": 608} {"train_loss": -19.653274536132812, "global_step": 50523, "epoch": 608} {"train_loss": -19.828821182250977, "global_step": 50524, "epoch": 608} {"train_loss": -19.747486114501953, "global_step": 50525, "epoch": 608} {"train_loss": -19.82008171081543, "global_step": 50526, "epoch": 608} {"train_loss": -19.878734588623047, "global_step": 50527, "epoch": 608} {"train_loss": -20.062963485717773, "global_step": 50528, "epoch": 608} {"train_loss": -19.988840103149414, "global_step": 50529, "epoch": 608} {"train_loss": -20.009124755859375, "global_step": 50530, "epoch": 608} {"train_loss": -19.79014778137207, "global_step": 50531, "epoch": 608} {"train_loss": -19.765043258666992, "global_step": 50532, "epoch": 608} {"train_loss": -19.898574829101562, "global_step": 50533, "epoch": 608} {"train_loss": -19.974349975585938, "global_step": 50534, "epoch": 608} {"train_loss": -19.97757339477539, "global_step": 50535, "epoch": 608} {"train_loss": -20.11429214477539, "global_step": 50536, "epoch": 608} {"train_loss": -20.26291847229004, "global_step": 50537, "epoch": 608} {"train_loss": -19.746267318725586, "global_step": 50538, "epoch": 608} {"train_loss": -20.15165138244629, "global_step": 50539, "epoch": 608} {"train_loss": -19.902923583984375, "global_step": 50540, "epoch": 608} {"train_loss": -19.75733757019043, "global_step": 50541, "epoch": 608} {"train_loss": -19.70957374572754, "global_step": 50542, "epoch": 608} {"train_loss": -19.910104751586914, "global_step": 50543, "epoch": 608} {"train_loss": -20.469772338867188, "global_step": 50544, "epoch": 608} {"train_loss": -20.2191162109375, "global_step": 50545, "epoch": 608} {"train_loss": -19.932651473815184, "global_step": 50546, "epoch": 608, "val_loss": 6055976.5} {"train_loss": -19.085784912109375, "global_step": 50547, "epoch": 609} {"train_loss": -19.7559757232666, "global_step": 50548, "epoch": 609} {"train_loss": -19.788806915283203, "global_step": 50549, "epoch": 609} {"train_loss": -20.19740104675293, "global_step": 50550, "epoch": 609} {"train_loss": -19.52655601501465, "global_step": 50551, "epoch": 609} {"train_loss": -19.772300720214844, "global_step": 50552, "epoch": 609} {"train_loss": -19.793689727783203, "global_step": 50553, "epoch": 609} {"train_loss": -19.82145118713379, "global_step": 50554, "epoch": 609} {"train_loss": -19.718154907226562, "global_step": 50555, "epoch": 609} {"train_loss": -19.791170120239258, "global_step": 50556, "epoch": 609} {"train_loss": -19.724618911743164, "global_step": 50557, "epoch": 609} {"train_loss": -19.557226181030273, "global_step": 50558, "epoch": 609} {"train_loss": -19.407957077026367, "global_step": 50559, "epoch": 609} {"train_loss": -19.77488136291504, "global_step": 50560, "epoch": 609} {"train_loss": -19.918943405151367, "global_step": 50561, "epoch": 609} {"train_loss": -19.641921997070312, "global_step": 50562, "epoch": 609} {"train_loss": -19.824588775634766, "global_step": 50563, "epoch": 609} {"train_loss": -19.963504791259766, "global_step": 50564, "epoch": 609} {"train_loss": -19.716577529907227, "global_step": 50565, "epoch": 609} {"train_loss": -19.768829345703125, "global_step": 50566, "epoch": 609} {"train_loss": -20.01812171936035, "global_step": 50567, "epoch": 609} {"train_loss": -19.480863571166992, "global_step": 50568, "epoch": 609} {"train_loss": -19.855276107788086, "global_step": 50569, "epoch": 609} {"train_loss": -20.034847259521484, "global_step": 50570, "epoch": 609} {"train_loss": -19.45624351501465, "global_step": 50571, "epoch": 609} {"train_loss": -19.51240348815918, "global_step": 50572, "epoch": 609} {"train_loss": -19.95697593688965, "global_step": 50573, "epoch": 609} {"train_loss": -19.94471549987793, "global_step": 50574, "epoch": 609} {"train_loss": -19.98420524597168, "global_step": 50575, "epoch": 609} {"train_loss": -19.47336769104004, "global_step": 50576, "epoch": 609} {"train_loss": -19.76405143737793, "global_step": 50577, "epoch": 609} {"train_loss": -19.840673446655273, "global_step": 50578, "epoch": 609} {"train_loss": -20.36679458618164, "global_step": 50579, "epoch": 609} {"train_loss": -19.751188278198242, "global_step": 50580, "epoch": 609} {"train_loss": -19.869531631469727, "global_step": 50581, "epoch": 609} {"train_loss": -19.89995765686035, "global_step": 50582, "epoch": 609} {"train_loss": -19.840734481811523, "global_step": 50583, "epoch": 609} {"train_loss": -19.85988426208496, "global_step": 50584, "epoch": 609} {"train_loss": -19.826126098632812, "global_step": 50585, "epoch": 609} {"train_loss": -19.617328643798828, "global_step": 50586, "epoch": 609} {"train_loss": -20.155006408691406, "global_step": 50587, "epoch": 609} {"train_loss": -19.87504768371582, "global_step": 50588, "epoch": 609} {"train_loss": -20.15372085571289, "global_step": 50589, "epoch": 609} {"train_loss": -20.030254364013672, "global_step": 50590, "epoch": 609} {"train_loss": -19.76173210144043, "global_step": 50591, "epoch": 609} {"train_loss": -20.105810165405273, "global_step": 50592, "epoch": 609} {"train_loss": -20.001028060913086, "global_step": 50593, "epoch": 609} {"train_loss": -19.826452255249023, "global_step": 50594, "epoch": 609} {"train_loss": -19.840688705444336, "global_step": 50595, "epoch": 609} {"train_loss": -19.87677764892578, "global_step": 50596, "epoch": 609} {"train_loss": -19.742849349975586, "global_step": 50597, "epoch": 609} {"train_loss": -19.861799240112305, "global_step": 50598, "epoch": 609} {"train_loss": -20.261316299438477, "global_step": 50599, "epoch": 609} {"train_loss": -20.031721115112305, "global_step": 50600, "epoch": 609} {"train_loss": -20.002445220947266, "global_step": 50601, "epoch": 609} {"train_loss": -20.199539184570312, "global_step": 50602, "epoch": 609} {"train_loss": -20.068008422851562, "global_step": 50603, "epoch": 609} {"train_loss": -19.913169860839844, "global_step": 50604, "epoch": 609} {"train_loss": -20.02867317199707, "global_step": 50605, "epoch": 609} {"train_loss": -20.07546043395996, "global_step": 50606, "epoch": 609} {"train_loss": -19.67612648010254, "global_step": 50607, "epoch": 609} {"train_loss": -19.91029167175293, "global_step": 50608, "epoch": 609} {"train_loss": -19.957122802734375, "global_step": 50609, "epoch": 609} {"train_loss": -19.99045753479004, "global_step": 50610, "epoch": 609} {"train_loss": -19.894609451293945, "global_step": 50611, "epoch": 609} {"train_loss": -19.91803550720215, "global_step": 50612, "epoch": 609} {"train_loss": -19.74409294128418, "global_step": 50613, "epoch": 609} {"train_loss": -20.093381881713867, "global_step": 50614, "epoch": 609} {"train_loss": -19.917709350585938, "global_step": 50615, "epoch": 609} {"train_loss": -20.170835494995117, "global_step": 50616, "epoch": 609} {"train_loss": -19.896968841552734, "global_step": 50617, "epoch": 609} {"train_loss": -19.513778686523438, "global_step": 50618, "epoch": 609} {"train_loss": -19.919689178466797, "global_step": 50619, "epoch": 609} {"train_loss": -20.219873428344727, "global_step": 50620, "epoch": 609} {"train_loss": -20.055805206298828, "global_step": 50621, "epoch": 609} {"train_loss": -19.59630584716797, "global_step": 50622, "epoch": 609} {"train_loss": -19.66025733947754, "global_step": 50623, "epoch": 609} {"train_loss": -20.065509796142578, "global_step": 50624, "epoch": 609} {"train_loss": -19.797090530395508, "global_step": 50625, "epoch": 609} {"train_loss": -20.052595138549805, "global_step": 50626, "epoch": 609} {"train_loss": -20.081707000732422, "global_step": 50627, "epoch": 609} {"train_loss": -19.887380599975586, "global_step": 50628, "epoch": 609} {"train_loss": -19.8590070655547, "global_step": 50629, "epoch": 609, "val_loss": 5984815.0} {"train_loss": -20.01871681213379, "global_step": 50630, "epoch": 610} {"train_loss": -19.65206527709961, "global_step": 50631, "epoch": 610} {"train_loss": -19.7862606048584, "global_step": 50632, "epoch": 610} {"train_loss": -19.889169692993164, "global_step": 50633, "epoch": 610} {"train_loss": -20.284650802612305, "global_step": 50634, "epoch": 610} {"train_loss": -19.93010902404785, "global_step": 50635, "epoch": 610} {"train_loss": -20.105295181274414, "global_step": 50636, "epoch": 610} {"train_loss": -20.462324142456055, "global_step": 50637, "epoch": 610} {"train_loss": -20.046560287475586, "global_step": 50638, "epoch": 610} {"train_loss": -19.973100662231445, "global_step": 50639, "epoch": 610} {"train_loss": -19.949865341186523, "global_step": 50640, "epoch": 610} {"train_loss": -19.82533836364746, "global_step": 50641, "epoch": 610} {"train_loss": -19.9600887298584, "global_step": 50642, "epoch": 610} {"train_loss": -19.97494888305664, "global_step": 50643, "epoch": 610} {"train_loss": -19.82417869567871, "global_step": 50644, "epoch": 610} {"train_loss": -20.19472885131836, "global_step": 50645, "epoch": 610} {"train_loss": -19.741437911987305, "global_step": 50646, "epoch": 610} {"train_loss": -19.73497200012207, "global_step": 50647, "epoch": 610} {"train_loss": -19.821035385131836, "global_step": 50648, "epoch": 610} {"train_loss": -19.700902938842773, "global_step": 50649, "epoch": 610} {"train_loss": -20.03598403930664, "global_step": 50650, "epoch": 610} {"train_loss": -19.860347747802734, "global_step": 50651, "epoch": 610} {"train_loss": -19.682065963745117, "global_step": 50652, "epoch": 610} {"train_loss": -19.711957931518555, "global_step": 50653, "epoch": 610} {"train_loss": -20.187488555908203, "global_step": 50654, "epoch": 610} {"train_loss": -20.211048126220703, "global_step": 50655, "epoch": 610} {"train_loss": -19.939559936523438, "global_step": 50656, "epoch": 610} {"train_loss": -20.282499313354492, "global_step": 50657, "epoch": 610} {"train_loss": -20.066465377807617, "global_step": 50658, "epoch": 610} {"train_loss": -19.950803756713867, "global_step": 50659, "epoch": 610} {"train_loss": -19.99580192565918, "global_step": 50660, "epoch": 610} {"train_loss": -20.2890682220459, "global_step": 50661, "epoch": 610} {"train_loss": -19.87397575378418, "global_step": 50662, "epoch": 610} {"train_loss": -19.82840347290039, "global_step": 50663, "epoch": 610} {"train_loss": -20.137815475463867, "global_step": 50664, "epoch": 610} {"train_loss": -20.374094009399414, "global_step": 50665, "epoch": 610} {"train_loss": -19.42319107055664, "global_step": 50666, "epoch": 610} {"train_loss": -19.767107009887695, "global_step": 50667, "epoch": 610} {"train_loss": -20.051082611083984, "global_step": 50668, "epoch": 610} {"train_loss": -19.94532012939453, "global_step": 50669, "epoch": 610} {"train_loss": -20.055627822875977, "global_step": 50670, "epoch": 610} {"train_loss": -20.115102767944336, "global_step": 50671, "epoch": 610} {"train_loss": -19.993209838867188, "global_step": 50672, "epoch": 610} {"train_loss": -19.830564498901367, "global_step": 50673, "epoch": 610} {"train_loss": -19.838281631469727, "global_step": 50674, "epoch": 610} {"train_loss": -20.04510498046875, "global_step": 50675, "epoch": 610} {"train_loss": -20.26698875427246, "global_step": 50676, "epoch": 610} {"train_loss": -19.67160987854004, "global_step": 50677, "epoch": 610} {"train_loss": -19.828292846679688, "global_step": 50678, "epoch": 610} {"train_loss": -19.932331085205078, "global_step": 50679, "epoch": 610} {"train_loss": -20.141218185424805, "global_step": 50680, "epoch": 610} {"train_loss": -19.94985008239746, "global_step": 50681, "epoch": 610} {"train_loss": -20.050756454467773, "global_step": 50682, "epoch": 610} {"train_loss": -19.634933471679688, "global_step": 50683, "epoch": 610} {"train_loss": -19.96082878112793, "global_step": 50684, "epoch": 610} {"train_loss": -20.02188491821289, "global_step": 50685, "epoch": 610} {"train_loss": -20.357667922973633, "global_step": 50686, "epoch": 610} {"train_loss": -19.742074966430664, "global_step": 50687, "epoch": 610} {"train_loss": -19.842193603515625, "global_step": 50688, "epoch": 610} {"train_loss": -20.141971588134766, "global_step": 50689, "epoch": 610} {"train_loss": -20.042165756225586, "global_step": 50690, "epoch": 610} {"train_loss": -20.124929428100586, "global_step": 50691, "epoch": 610} {"train_loss": -20.273588180541992, "global_step": 50692, "epoch": 610} {"train_loss": -20.107751846313477, "global_step": 50693, "epoch": 610} {"train_loss": -20.069589614868164, "global_step": 50694, "epoch": 610} {"train_loss": -19.975343704223633, "global_step": 50695, "epoch": 610} {"train_loss": -19.82350730895996, "global_step": 50696, "epoch": 610} {"train_loss": -19.952713012695312, "global_step": 50697, "epoch": 610} {"train_loss": -20.082868576049805, "global_step": 50698, "epoch": 610} {"train_loss": -19.822988510131836, "global_step": 50699, "epoch": 610} {"train_loss": -20.013731002807617, "global_step": 50700, "epoch": 610} {"train_loss": -20.273221969604492, "global_step": 50701, "epoch": 610} {"train_loss": -20.289295196533203, "global_step": 50702, "epoch": 610} {"train_loss": -19.726600646972656, "global_step": 50703, "epoch": 610} {"train_loss": -20.305465698242188, "global_step": 50704, "epoch": 610} {"train_loss": -20.168012619018555, "global_step": 50705, "epoch": 610} {"train_loss": -19.832321166992188, "global_step": 50706, "epoch": 610} {"train_loss": -19.95397186279297, "global_step": 50707, "epoch": 610} {"train_loss": -19.843746185302734, "global_step": 50708, "epoch": 610} {"train_loss": -19.94187355041504, "global_step": 50709, "epoch": 610} {"train_loss": -19.431053161621094, "global_step": 50710, "epoch": 610} {"train_loss": -19.70456886291504, "global_step": 50711, "epoch": 610} {"train_loss": -19.99195287313806, "global_step": 50712, "epoch": 610, "val_loss": 6038708.5} {"train_loss": -19.203266143798828, "global_step": 50713, "epoch": 611} {"train_loss": -19.348312377929688, "global_step": 50714, "epoch": 611} {"train_loss": -19.749671936035156, "global_step": 50715, "epoch": 611} {"train_loss": -19.48114585876465, "global_step": 50716, "epoch": 611} {"train_loss": -19.834638595581055, "global_step": 50717, "epoch": 611} {"train_loss": -19.824684143066406, "global_step": 50718, "epoch": 611} {"train_loss": -19.846872329711914, "global_step": 50719, "epoch": 611} {"train_loss": -19.778518676757812, "global_step": 50720, "epoch": 611} {"train_loss": -19.584753036499023, "global_step": 50721, "epoch": 611} {"train_loss": -19.3341121673584, "global_step": 50722, "epoch": 611} {"train_loss": -19.557180404663086, "global_step": 50723, "epoch": 611} {"train_loss": -19.52316665649414, "global_step": 50724, "epoch": 611} {"train_loss": -19.714731216430664, "global_step": 50725, "epoch": 611} {"train_loss": -19.886259078979492, "global_step": 50726, "epoch": 611} {"train_loss": -19.51346778869629, "global_step": 50727, "epoch": 611} {"train_loss": -19.552263259887695, "global_step": 50728, "epoch": 611} {"train_loss": -19.418886184692383, "global_step": 50729, "epoch": 611} {"train_loss": -20.055727005004883, "global_step": 50730, "epoch": 611} {"train_loss": -19.89284324645996, "global_step": 50731, "epoch": 611} {"train_loss": -19.8323917388916, "global_step": 50732, "epoch": 611} {"train_loss": -19.977338790893555, "global_step": 50733, "epoch": 611} {"train_loss": -19.425931930541992, "global_step": 50734, "epoch": 611} {"train_loss": -19.91713523864746, "global_step": 50735, "epoch": 611} {"train_loss": -19.79111671447754, "global_step": 50736, "epoch": 611} {"train_loss": -20.31976318359375, "global_step": 50737, "epoch": 611} {"train_loss": -19.65144920349121, "global_step": 50738, "epoch": 611} {"train_loss": -19.85367202758789, "global_step": 50739, "epoch": 611} {"train_loss": -20.117252349853516, "global_step": 50740, "epoch": 611} {"train_loss": -19.835857391357422, "global_step": 50741, "epoch": 611} {"train_loss": -20.00409507751465, "global_step": 50742, "epoch": 611} {"train_loss": -20.011812210083008, "global_step": 50743, "epoch": 611} {"train_loss": -19.936033248901367, "global_step": 50744, "epoch": 611} {"train_loss": -20.18703269958496, "global_step": 50745, "epoch": 611} {"train_loss": -19.983869552612305, "global_step": 50746, "epoch": 611} {"train_loss": -19.59830665588379, "global_step": 50747, "epoch": 611} {"train_loss": -20.068790435791016, "global_step": 50748, "epoch": 611} {"train_loss": -19.946081161499023, "global_step": 50749, "epoch": 611} {"train_loss": -20.07872200012207, "global_step": 50750, "epoch": 611} {"train_loss": -19.724342346191406, "global_step": 50751, "epoch": 611} {"train_loss": -20.003219604492188, "global_step": 50752, "epoch": 611} {"train_loss": -20.13222312927246, "global_step": 50753, "epoch": 611} {"train_loss": -19.57480239868164, "global_step": 50754, "epoch": 611} {"train_loss": -20.201496124267578, "global_step": 50755, "epoch": 611} {"train_loss": -20.137746810913086, "global_step": 50756, "epoch": 611} {"train_loss": -20.100208282470703, "global_step": 50757, "epoch": 611} {"train_loss": -20.00367546081543, "global_step": 50758, "epoch": 611} {"train_loss": -20.10025978088379, "global_step": 50759, "epoch": 611} {"train_loss": -20.22182846069336, "global_step": 50760, "epoch": 611} {"train_loss": -19.971515655517578, "global_step": 50761, "epoch": 611} {"train_loss": -19.70967674255371, "global_step": 50762, "epoch": 611} {"train_loss": -20.038381576538086, "global_step": 50763, "epoch": 611} {"train_loss": -19.825803756713867, "global_step": 50764, "epoch": 611} {"train_loss": -19.841856002807617, "global_step": 50765, "epoch": 611} {"train_loss": -20.054521560668945, "global_step": 50766, "epoch": 611} {"train_loss": -19.887380599975586, "global_step": 50767, "epoch": 611} {"train_loss": -20.061450958251953, "global_step": 50768, "epoch": 611} {"train_loss": -19.782773971557617, "global_step": 50769, "epoch": 611} {"train_loss": -20.12525749206543, "global_step": 50770, "epoch": 611} {"train_loss": -20.03509521484375, "global_step": 50771, "epoch": 611} {"train_loss": -20.26228141784668, "global_step": 50772, "epoch": 611} {"train_loss": -20.017282485961914, "global_step": 50773, "epoch": 611} {"train_loss": -20.055700302124023, "global_step": 50774, "epoch": 611} {"train_loss": -19.939390182495117, "global_step": 50775, "epoch": 611} {"train_loss": -20.12228775024414, "global_step": 50776, "epoch": 611} {"train_loss": -20.243860244750977, "global_step": 50777, "epoch": 611} {"train_loss": -19.735992431640625, "global_step": 50778, "epoch": 611} {"train_loss": -19.893444061279297, "global_step": 50779, "epoch": 611} {"train_loss": -20.098512649536133, "global_step": 50780, "epoch": 611} {"train_loss": -19.90022087097168, "global_step": 50781, "epoch": 611} {"train_loss": -19.992557525634766, "global_step": 50782, "epoch": 611} {"train_loss": -19.685596466064453, "global_step": 50783, "epoch": 611} {"train_loss": -20.27530860900879, "global_step": 50784, "epoch": 611} {"train_loss": -20.306503295898438, "global_step": 50785, "epoch": 611} {"train_loss": -20.228179931640625, "global_step": 50786, "epoch": 611} {"train_loss": -20.32923698425293, "global_step": 50787, "epoch": 611} {"train_loss": -19.92079734802246, "global_step": 50788, "epoch": 611} {"train_loss": -19.721412658691406, "global_step": 50789, "epoch": 611} {"train_loss": -19.92893409729004, "global_step": 50790, "epoch": 611} {"train_loss": -19.910160064697266, "global_step": 50791, "epoch": 611} {"train_loss": -19.87188720703125, "global_step": 50792, "epoch": 611} {"train_loss": -19.997432708740234, "global_step": 50793, "epoch": 611} {"train_loss": -19.827848434448242, "global_step": 50794, "epoch": 611} {"train_loss": -19.912758884659734, "global_step": 50795, "epoch": 611, "val_loss": 6092636.0} {"train_loss": -19.699499130249023, "global_step": 50796, "epoch": 612} {"train_loss": -19.575122833251953, "global_step": 50797, "epoch": 612} {"train_loss": -19.646352767944336, "global_step": 50798, "epoch": 612} {"train_loss": -19.759519577026367, "global_step": 50799, "epoch": 612} {"train_loss": -19.57598304748535, "global_step": 50800, "epoch": 612} {"train_loss": -19.195688247680664, "global_step": 50801, "epoch": 612} {"train_loss": -20.065753936767578, "global_step": 50802, "epoch": 612} {"train_loss": -20.058027267456055, "global_step": 50803, "epoch": 612} {"train_loss": -19.90289878845215, "global_step": 50804, "epoch": 612} {"train_loss": -19.823957443237305, "global_step": 50805, "epoch": 612} {"train_loss": -19.63558006286621, "global_step": 50806, "epoch": 612} {"train_loss": -20.01492691040039, "global_step": 50807, "epoch": 612} {"train_loss": -20.315317153930664, "global_step": 50808, "epoch": 612} {"train_loss": -20.043018341064453, "global_step": 50809, "epoch": 612} {"train_loss": -20.088056564331055, "global_step": 50810, "epoch": 612} {"train_loss": -20.0355167388916, "global_step": 50811, "epoch": 612} {"train_loss": -20.151824951171875, "global_step": 50812, "epoch": 612} {"train_loss": -20.0240535736084, "global_step": 50813, "epoch": 612} {"train_loss": -19.70831298828125, "global_step": 50814, "epoch": 612} {"train_loss": -20.0224552154541, "global_step": 50815, "epoch": 612} {"train_loss": -20.341533660888672, "global_step": 50816, "epoch": 612} {"train_loss": -19.916975021362305, "global_step": 50817, "epoch": 612} {"train_loss": -20.145719528198242, "global_step": 50818, "epoch": 612} {"train_loss": -19.77953338623047, "global_step": 50819, "epoch": 612} {"train_loss": -20.07016944885254, "global_step": 50820, "epoch": 612} {"train_loss": -20.140241622924805, "global_step": 50821, "epoch": 612} {"train_loss": -20.085241317749023, "global_step": 50822, "epoch": 612} {"train_loss": -20.169727325439453, "global_step": 50823, "epoch": 612} {"train_loss": -20.31193733215332, "global_step": 50824, "epoch": 612} {"train_loss": -19.852210998535156, "global_step": 50825, "epoch": 612} {"train_loss": -19.827932357788086, "global_step": 50826, "epoch": 612} {"train_loss": -19.776350021362305, "global_step": 50827, "epoch": 612} {"train_loss": -20.28873062133789, "global_step": 50828, "epoch": 612} {"train_loss": -19.76387596130371, "global_step": 50829, "epoch": 612} {"train_loss": -20.08089256286621, "global_step": 50830, "epoch": 612} {"train_loss": -20.3991756439209, "global_step": 50831, "epoch": 612} {"train_loss": -20.00704002380371, "global_step": 50832, "epoch": 612} {"train_loss": -20.086273193359375, "global_step": 50833, "epoch": 612} {"train_loss": -20.058340072631836, "global_step": 50834, "epoch": 612} {"train_loss": -19.943103790283203, "global_step": 50835, "epoch": 612} {"train_loss": -19.7302303314209, "global_step": 50836, "epoch": 612} {"train_loss": -20.12775993347168, "global_step": 50837, "epoch": 612} {"train_loss": -19.993955612182617, "global_step": 50838, "epoch": 612} {"train_loss": -20.06281280517578, "global_step": 50839, "epoch": 612} {"train_loss": -19.738510131835938, "global_step": 50840, "epoch": 612} {"train_loss": -20.14915657043457, "global_step": 50841, "epoch": 612} {"train_loss": -20.026464462280273, "global_step": 50842, "epoch": 612} {"train_loss": -19.842185974121094, "global_step": 50843, "epoch": 612} {"train_loss": -20.012502670288086, "global_step": 50844, "epoch": 612} {"train_loss": -19.60468292236328, "global_step": 50845, "epoch": 612} {"train_loss": -19.793399810791016, "global_step": 50846, "epoch": 612} {"train_loss": -20.32938003540039, "global_step": 50847, "epoch": 612} {"train_loss": -20.192928314208984, "global_step": 50848, "epoch": 612} {"train_loss": -20.188385009765625, "global_step": 50849, "epoch": 612} {"train_loss": -20.13531494140625, "global_step": 50850, "epoch": 612} {"train_loss": -19.596317291259766, "global_step": 50851, "epoch": 612} {"train_loss": -20.070568084716797, "global_step": 50852, "epoch": 612} {"train_loss": -19.71971893310547, "global_step": 50853, "epoch": 612} {"train_loss": -20.31426429748535, "global_step": 50854, "epoch": 612} {"train_loss": -20.00996208190918, "global_step": 50855, "epoch": 612} {"train_loss": -19.94989585876465, "global_step": 50856, "epoch": 612} {"train_loss": -20.110822677612305, "global_step": 50857, "epoch": 612} {"train_loss": -20.20380973815918, "global_step": 50858, "epoch": 612} {"train_loss": -19.89765739440918, "global_step": 50859, "epoch": 612} {"train_loss": -20.318082809448242, "global_step": 50860, "epoch": 612} {"train_loss": -19.8377628326416, "global_step": 50861, "epoch": 612} {"train_loss": -20.0643253326416, "global_step": 50862, "epoch": 612} {"train_loss": -19.88067626953125, "global_step": 50863, "epoch": 612} {"train_loss": -20.182518005371094, "global_step": 50864, "epoch": 612} {"train_loss": -19.86345863342285, "global_step": 50865, "epoch": 612} {"train_loss": -19.585859298706055, "global_step": 50866, "epoch": 612} {"train_loss": -20.029081344604492, "global_step": 50867, "epoch": 612} {"train_loss": -19.77179527282715, "global_step": 50868, "epoch": 612} {"train_loss": -19.731460571289062, "global_step": 50869, "epoch": 612} {"train_loss": -20.06721305847168, "global_step": 50870, "epoch": 612} {"train_loss": -19.915273666381836, "global_step": 50871, "epoch": 612} {"train_loss": -19.961719512939453, "global_step": 50872, "epoch": 612} {"train_loss": -20.3105411529541, "global_step": 50873, "epoch": 612} {"train_loss": -19.87175750732422, "global_step": 50874, "epoch": 612} {"train_loss": -19.730215072631836, "global_step": 50875, "epoch": 612} {"train_loss": -19.942419052124023, "global_step": 50876, "epoch": 612} {"train_loss": -20.22426414489746, "global_step": 50877, "epoch": 612} {"train_loss": -19.962295210505108, "global_step": 50878, "epoch": 612, "val_loss": 6072836.0} {"train_loss": -19.3958797454834, "global_step": 50879, "epoch": 613} {"train_loss": -19.56466293334961, "global_step": 50880, "epoch": 613} {"train_loss": -19.49502944946289, "global_step": 50881, "epoch": 613} {"train_loss": -19.588834762573242, "global_step": 50882, "epoch": 613} {"train_loss": -19.687850952148438, "global_step": 50883, "epoch": 613} {"train_loss": -19.477458953857422, "global_step": 50884, "epoch": 613} {"train_loss": -20.100582122802734, "global_step": 50885, "epoch": 613} {"train_loss": -19.557315826416016, "global_step": 50886, "epoch": 613} {"train_loss": -19.89381217956543, "global_step": 50887, "epoch": 613} {"train_loss": -20.44955825805664, "global_step": 50888, "epoch": 613} {"train_loss": -19.66375732421875, "global_step": 50889, "epoch": 613} {"train_loss": -19.96550750732422, "global_step": 50890, "epoch": 613} {"train_loss": -19.931543350219727, "global_step": 50891, "epoch": 613} {"train_loss": -19.941312789916992, "global_step": 50892, "epoch": 613} {"train_loss": -19.595407485961914, "global_step": 50893, "epoch": 613} {"train_loss": -20.192136764526367, "global_step": 50894, "epoch": 613} {"train_loss": -19.862648010253906, "global_step": 50895, "epoch": 613} {"train_loss": -20.061105728149414, "global_step": 50896, "epoch": 613} {"train_loss": -20.384634017944336, "global_step": 50897, "epoch": 613} {"train_loss": -20.367311477661133, "global_step": 50898, "epoch": 613} {"train_loss": -19.76483917236328, "global_step": 50899, "epoch": 613} {"train_loss": -20.47314453125, "global_step": 50900, "epoch": 613} {"train_loss": -19.767587661743164, "global_step": 50901, "epoch": 613} {"train_loss": -19.84291648864746, "global_step": 50902, "epoch": 613} {"train_loss": -20.009057998657227, "global_step": 50903, "epoch": 613} {"train_loss": -19.885669708251953, "global_step": 50904, "epoch": 613} {"train_loss": -19.72838020324707, "global_step": 50905, "epoch": 613} {"train_loss": -20.02704429626465, "global_step": 50906, "epoch": 613} {"train_loss": -20.12888526916504, "global_step": 50907, "epoch": 613} {"train_loss": -19.804763793945312, "global_step": 50908, "epoch": 613} {"train_loss": -19.63693618774414, "global_step": 50909, "epoch": 613} {"train_loss": -20.236059188842773, "global_step": 50910, "epoch": 613} {"train_loss": -20.276084899902344, "global_step": 50911, "epoch": 613} {"train_loss": -19.928571701049805, "global_step": 50912, "epoch": 613} {"train_loss": -20.534826278686523, "global_step": 50913, "epoch": 613} {"train_loss": -20.034204483032227, "global_step": 50914, "epoch": 613} {"train_loss": -20.26727867126465, "global_step": 50915, "epoch": 613} {"train_loss": -19.798757553100586, "global_step": 50916, "epoch": 613} {"train_loss": -20.275178909301758, "global_step": 50917, "epoch": 613} {"train_loss": -20.013999938964844, "global_step": 50918, "epoch": 613} {"train_loss": -20.163578033447266, "global_step": 50919, "epoch": 613} {"train_loss": -19.572917938232422, "global_step": 50920, "epoch": 613} {"train_loss": -19.91697120666504, "global_step": 50921, "epoch": 613} {"train_loss": -20.34205436706543, "global_step": 50922, "epoch": 613} {"train_loss": -20.395429611206055, "global_step": 50923, "epoch": 613} {"train_loss": -19.645360946655273, "global_step": 50924, "epoch": 613} {"train_loss": -20.44405174255371, "global_step": 50925, "epoch": 613} {"train_loss": -19.54865074157715, "global_step": 50926, "epoch": 613} {"train_loss": -20.227880477905273, "global_step": 50927, "epoch": 613} {"train_loss": -19.950597763061523, "global_step": 50928, "epoch": 613} {"train_loss": -20.065048217773438, "global_step": 50929, "epoch": 613} {"train_loss": -19.71502113342285, "global_step": 50930, "epoch": 613} {"train_loss": -20.091768264770508, "global_step": 50931, "epoch": 613} {"train_loss": -19.94248390197754, "global_step": 50932, "epoch": 613} {"train_loss": -20.296478271484375, "global_step": 50933, "epoch": 613} {"train_loss": -19.690412521362305, "global_step": 50934, "epoch": 613} {"train_loss": -20.078960418701172, "global_step": 50935, "epoch": 613} {"train_loss": -19.96266746520996, "global_step": 50936, "epoch": 613} {"train_loss": -20.217336654663086, "global_step": 50937, "epoch": 613} {"train_loss": -19.755186080932617, "global_step": 50938, "epoch": 613} {"train_loss": -20.19303321838379, "global_step": 50939, "epoch": 613} {"train_loss": -20.0230655670166, "global_step": 50940, "epoch": 613} {"train_loss": -19.702428817749023, "global_step": 50941, "epoch": 613} {"train_loss": -19.9803466796875, "global_step": 50942, "epoch": 613} {"train_loss": -19.99003791809082, "global_step": 50943, "epoch": 613} {"train_loss": -20.16460609436035, "global_step": 50944, "epoch": 613} {"train_loss": -20.018857955932617, "global_step": 50945, "epoch": 613} {"train_loss": -19.862274169921875, "global_step": 50946, "epoch": 613} {"train_loss": -20.280723571777344, "global_step": 50947, "epoch": 613} {"train_loss": -19.724084854125977, "global_step": 50948, "epoch": 613} {"train_loss": -20.24802017211914, "global_step": 50949, "epoch": 613} {"train_loss": -20.014469146728516, "global_step": 50950, "epoch": 613} {"train_loss": -19.92661476135254, "global_step": 50951, "epoch": 613} {"train_loss": -19.64663314819336, "global_step": 50952, "epoch": 613} {"train_loss": -19.862462997436523, "global_step": 50953, "epoch": 613} {"train_loss": -20.157154083251953, "global_step": 50954, "epoch": 613} {"train_loss": -20.05832862854004, "global_step": 50955, "epoch": 613} {"train_loss": -20.151945114135742, "global_step": 50956, "epoch": 613} {"train_loss": -19.97206687927246, "global_step": 50957, "epoch": 613} {"train_loss": -19.775083541870117, "global_step": 50958, "epoch": 613} {"train_loss": -19.96146011352539, "global_step": 50959, "epoch": 613} {"train_loss": -20.273889541625977, "global_step": 50960, "epoch": 613} {"train_loss": -19.97633688133883, "global_step": 50961, "epoch": 613, "val_loss": 6029558.0} {"train_loss": -20.064647674560547, "global_step": 50962, "epoch": 614} {"train_loss": -19.665937423706055, "global_step": 50963, "epoch": 614} {"train_loss": -20.12305450439453, "global_step": 50964, "epoch": 614} {"train_loss": -19.760839462280273, "global_step": 50965, "epoch": 614} {"train_loss": -19.613847732543945, "global_step": 50966, "epoch": 614} {"train_loss": -20.093961715698242, "global_step": 50967, "epoch": 614} {"train_loss": -19.853742599487305, "global_step": 50968, "epoch": 614} {"train_loss": -20.179794311523438, "global_step": 50969, "epoch": 614} {"train_loss": -19.668848037719727, "global_step": 50970, "epoch": 614} {"train_loss": -19.844772338867188, "global_step": 50971, "epoch": 614} {"train_loss": -19.813640594482422, "global_step": 50972, "epoch": 614} {"train_loss": -20.029163360595703, "global_step": 50973, "epoch": 614} {"train_loss": -20.019153594970703, "global_step": 50974, "epoch": 614} {"train_loss": -19.893712997436523, "global_step": 50975, "epoch": 614} {"train_loss": -20.19227409362793, "global_step": 50976, "epoch": 614} {"train_loss": -19.839019775390625, "global_step": 50977, "epoch": 614} {"train_loss": -20.09532928466797, "global_step": 50978, "epoch": 614} {"train_loss": -20.132251739501953, "global_step": 50979, "epoch": 614} {"train_loss": -19.423168182373047, "global_step": 50980, "epoch": 614} {"train_loss": -20.071020126342773, "global_step": 50981, "epoch": 614} {"train_loss": -20.169797897338867, "global_step": 50982, "epoch": 614} {"train_loss": -19.901119232177734, "global_step": 50983, "epoch": 614} {"train_loss": -20.48018455505371, "global_step": 50984, "epoch": 614} {"train_loss": -19.939899444580078, "global_step": 50985, "epoch": 614} {"train_loss": -19.929433822631836, "global_step": 50986, "epoch": 614} {"train_loss": -19.786468505859375, "global_step": 50987, "epoch": 614} {"train_loss": -20.13290023803711, "global_step": 50988, "epoch": 614} {"train_loss": -19.828367233276367, "global_step": 50989, "epoch": 614} {"train_loss": -20.109342575073242, "global_step": 50990, "epoch": 614} {"train_loss": -20.290313720703125, "global_step": 50991, "epoch": 614} {"train_loss": -20.093978881835938, "global_step": 50992, "epoch": 614} {"train_loss": -20.082622528076172, "global_step": 50993, "epoch": 614} {"train_loss": -20.116060256958008, "global_step": 50994, "epoch": 614} {"train_loss": -20.041242599487305, "global_step": 50995, "epoch": 614} {"train_loss": -20.22540283203125, "global_step": 50996, "epoch": 614} {"train_loss": -20.187793731689453, "global_step": 50997, "epoch": 614} {"train_loss": -20.01494789123535, "global_step": 50998, "epoch": 614} {"train_loss": -19.865032196044922, "global_step": 50999, "epoch": 614} {"train_loss": -19.82429313659668, "global_step": 51000, "epoch": 614} {"train_loss": -20.221481323242188, "global_step": 51001, "epoch": 614} {"train_loss": -19.918445587158203, "global_step": 51002, "epoch": 614} {"train_loss": -20.19340705871582, "global_step": 51003, "epoch": 614} {"train_loss": -19.86226463317871, "global_step": 51004, "epoch": 614} {"train_loss": -20.065593719482422, "global_step": 51005, "epoch": 614} {"train_loss": -19.81165885925293, "global_step": 51006, "epoch": 614} {"train_loss": -20.166879653930664, "global_step": 51007, "epoch": 614} {"train_loss": -20.02803611755371, "global_step": 51008, "epoch": 614} {"train_loss": -19.520309448242188, "global_step": 51009, "epoch": 614} {"train_loss": -20.00271987915039, "global_step": 51010, "epoch": 614} {"train_loss": -19.92835235595703, "global_step": 51011, "epoch": 614} {"train_loss": -19.856962203979492, "global_step": 51012, "epoch": 614} {"train_loss": -20.127126693725586, "global_step": 51013, "epoch": 614} {"train_loss": -19.97828483581543, "global_step": 51014, "epoch": 614} {"train_loss": -19.064130783081055, "global_step": 51015, "epoch": 614} {"train_loss": -19.976835250854492, "global_step": 51016, "epoch": 614} {"train_loss": -19.732715606689453, "global_step": 51017, "epoch": 614} {"train_loss": -20.02381706237793, "global_step": 51018, "epoch": 614} {"train_loss": -19.74020004272461, "global_step": 51019, "epoch": 614} {"train_loss": -19.758769989013672, "global_step": 51020, "epoch": 614} {"train_loss": -19.431371688842773, "global_step": 51021, "epoch": 614} {"train_loss": -19.984027862548828, "global_step": 51022, "epoch": 614} {"train_loss": -20.128955841064453, "global_step": 51023, "epoch": 614} {"train_loss": -20.37906265258789, "global_step": 51024, "epoch": 614} {"train_loss": -19.715442657470703, "global_step": 51025, "epoch": 614} {"train_loss": -19.922504425048828, "global_step": 51026, "epoch": 614} {"train_loss": -19.97368621826172, "global_step": 51027, "epoch": 614} {"train_loss": -19.797788619995117, "global_step": 51028, "epoch": 614} {"train_loss": -20.225078582763672, "global_step": 51029, "epoch": 614} {"train_loss": -19.9367618560791, "global_step": 51030, "epoch": 614} {"train_loss": -19.8834285736084, "global_step": 51031, "epoch": 614} {"train_loss": -20.292755126953125, "global_step": 51032, "epoch": 614} {"train_loss": -19.980371475219727, "global_step": 51033, "epoch": 614} {"train_loss": -20.13750648498535, "global_step": 51034, "epoch": 614} {"train_loss": -20.208515167236328, "global_step": 51035, "epoch": 614} {"train_loss": -19.809947967529297, "global_step": 51036, "epoch": 614} {"train_loss": -19.94882583618164, "global_step": 51037, "epoch": 614} {"train_loss": -19.65004539489746, "global_step": 51038, "epoch": 614} {"train_loss": -20.093055725097656, "global_step": 51039, "epoch": 614} {"train_loss": -19.885400772094727, "global_step": 51040, "epoch": 614} {"train_loss": -19.9488468170166, "global_step": 51041, "epoch": 614} {"train_loss": -20.318344116210938, "global_step": 51042, "epoch": 614} {"train_loss": -20.270360946655273, "global_step": 51043, "epoch": 614} {"train_loss": -19.959704801260706, "global_step": 51044, "epoch": 614, "val_loss": 6008424.0} {"train_loss": -19.72627067565918, "global_step": 51045, "epoch": 615} {"train_loss": -20.095354080200195, "global_step": 51046, "epoch": 615} {"train_loss": -19.71425437927246, "global_step": 51047, "epoch": 615} {"train_loss": -19.6761474609375, "global_step": 51048, "epoch": 615} {"train_loss": -20.085119247436523, "global_step": 51049, "epoch": 615} {"train_loss": -19.850427627563477, "global_step": 51050, "epoch": 615} {"train_loss": -19.86321449279785, "global_step": 51051, "epoch": 615} {"train_loss": -20.040790557861328, "global_step": 51052, "epoch": 615} {"train_loss": -19.703744888305664, "global_step": 51053, "epoch": 615} {"train_loss": -19.781721115112305, "global_step": 51054, "epoch": 615} {"train_loss": -19.913602828979492, "global_step": 51055, "epoch": 615} {"train_loss": -19.67886734008789, "global_step": 51056, "epoch": 615} {"train_loss": -19.883750915527344, "global_step": 51057, "epoch": 615} {"train_loss": -20.193387985229492, "global_step": 51058, "epoch": 615} {"train_loss": -20.137619018554688, "global_step": 51059, "epoch": 615} {"train_loss": -20.084035873413086, "global_step": 51060, "epoch": 615} {"train_loss": -20.221176147460938, "global_step": 51061, "epoch": 615} {"train_loss": -19.951091766357422, "global_step": 51062, "epoch": 615} {"train_loss": -20.04683494567871, "global_step": 51063, "epoch": 615} {"train_loss": -20.081953048706055, "global_step": 51064, "epoch": 615} {"train_loss": -19.88612174987793, "global_step": 51065, "epoch": 615} {"train_loss": -19.76375961303711, "global_step": 51066, "epoch": 615} {"train_loss": -19.86484718322754, "global_step": 51067, "epoch": 615} {"train_loss": -20.086275100708008, "global_step": 51068, "epoch": 615} {"train_loss": -19.9390926361084, "global_step": 51069, "epoch": 615} {"train_loss": -19.839860916137695, "global_step": 51070, "epoch": 615} {"train_loss": -19.794775009155273, "global_step": 51071, "epoch": 615} {"train_loss": -19.839448928833008, "global_step": 51072, "epoch": 615} {"train_loss": -20.14645767211914, "global_step": 51073, "epoch": 615} {"train_loss": -20.066390991210938, "global_step": 51074, "epoch": 615} {"train_loss": -19.990976333618164, "global_step": 51075, "epoch": 615} {"train_loss": -19.876140594482422, "global_step": 51076, "epoch": 615} {"train_loss": -19.678552627563477, "global_step": 51077, "epoch": 615} {"train_loss": -19.9094295501709, "global_step": 51078, "epoch": 615} {"train_loss": -19.864652633666992, "global_step": 51079, "epoch": 615} {"train_loss": -19.9360408782959, "global_step": 51080, "epoch": 615} {"train_loss": -20.057937622070312, "global_step": 51081, "epoch": 615} {"train_loss": -20.030765533447266, "global_step": 51082, "epoch": 615} {"train_loss": -20.18006706237793, "global_step": 51083, "epoch": 615} {"train_loss": -19.95237159729004, "global_step": 51084, "epoch": 615} {"train_loss": -19.60987091064453, "global_step": 51085, "epoch": 615} {"train_loss": -19.95558738708496, "global_step": 51086, "epoch": 615} {"train_loss": -19.78363609313965, "global_step": 51087, "epoch": 615} {"train_loss": -20.010412216186523, "global_step": 51088, "epoch": 615} {"train_loss": -20.062625885009766, "global_step": 51089, "epoch": 615} {"train_loss": -20.025217056274414, "global_step": 51090, "epoch": 615} {"train_loss": -19.811689376831055, "global_step": 51091, "epoch": 615} {"train_loss": -20.228666305541992, "global_step": 51092, "epoch": 615} {"train_loss": -20.269580841064453, "global_step": 51093, "epoch": 615} {"train_loss": -19.837337493896484, "global_step": 51094, "epoch": 615} {"train_loss": -20.37051773071289, "global_step": 51095, "epoch": 615} {"train_loss": -20.045568466186523, "global_step": 51096, "epoch": 615} {"train_loss": -19.894031524658203, "global_step": 51097, "epoch": 615} {"train_loss": -19.644245147705078, "global_step": 51098, "epoch": 615} {"train_loss": -19.848299026489258, "global_step": 51099, "epoch": 615} {"train_loss": -19.897863388061523, "global_step": 51100, "epoch": 615} {"train_loss": -19.710783004760742, "global_step": 51101, "epoch": 615} {"train_loss": -20.16806411743164, "global_step": 51102, "epoch": 615} {"train_loss": -19.946504592895508, "global_step": 51103, "epoch": 615} {"train_loss": -19.8670654296875, "global_step": 51104, "epoch": 615} {"train_loss": -19.846900939941406, "global_step": 51105, "epoch": 615} {"train_loss": -20.125713348388672, "global_step": 51106, "epoch": 615} {"train_loss": -19.815471649169922, "global_step": 51107, "epoch": 615} {"train_loss": -20.15411376953125, "global_step": 51108, "epoch": 615} {"train_loss": -20.225980758666992, "global_step": 51109, "epoch": 615} {"train_loss": -19.930761337280273, "global_step": 51110, "epoch": 615} {"train_loss": -19.89448356628418, "global_step": 51111, "epoch": 615} {"train_loss": -20.059568405151367, "global_step": 51112, "epoch": 615} {"train_loss": -19.92485237121582, "global_step": 51113, "epoch": 615} {"train_loss": -19.57826042175293, "global_step": 51114, "epoch": 615} {"train_loss": -19.85588264465332, "global_step": 51115, "epoch": 615} {"train_loss": -20.14887046813965, "global_step": 51116, "epoch": 615} {"train_loss": -20.135848999023438, "global_step": 51117, "epoch": 615} {"train_loss": -20.100513458251953, "global_step": 51118, "epoch": 615} {"train_loss": -20.285451889038086, "global_step": 51119, "epoch": 615} {"train_loss": -20.086149215698242, "global_step": 51120, "epoch": 615} {"train_loss": -19.78767204284668, "global_step": 51121, "epoch": 615} {"train_loss": -20.254352569580078, "global_step": 51122, "epoch": 615} {"train_loss": -20.031352996826172, "global_step": 51123, "epoch": 615} {"train_loss": -20.15411949157715, "global_step": 51124, "epoch": 615} {"train_loss": -19.993165969848633, "global_step": 51125, "epoch": 615} {"train_loss": -20.035348892211914, "global_step": 51126, "epoch": 615} {"train_loss": -19.977338630032826, "global_step": 51127, "epoch": 615, "val_loss": 6228922.0} {"train_loss": -19.558446884155273, "global_step": 51128, "epoch": 616} {"train_loss": -19.6146240234375, "global_step": 51129, "epoch": 616} {"train_loss": -20.024078369140625, "global_step": 51130, "epoch": 616} {"train_loss": -19.875713348388672, "global_step": 51131, "epoch": 616} {"train_loss": -19.588760375976562, "global_step": 51132, "epoch": 616} {"train_loss": -20.268144607543945, "global_step": 51133, "epoch": 616} {"train_loss": -19.605077743530273, "global_step": 51134, "epoch": 616} {"train_loss": -20.1366024017334, "global_step": 51135, "epoch": 616} {"train_loss": -19.79864501953125, "global_step": 51136, "epoch": 616} {"train_loss": -19.45088005065918, "global_step": 51137, "epoch": 616} {"train_loss": -20.24519920349121, "global_step": 51138, "epoch": 616} {"train_loss": -19.734739303588867, "global_step": 51139, "epoch": 616} {"train_loss": -20.112462997436523, "global_step": 51140, "epoch": 616} {"train_loss": -19.559232711791992, "global_step": 51141, "epoch": 616} {"train_loss": -19.998289108276367, "global_step": 51142, "epoch": 616} {"train_loss": -19.668970108032227, "global_step": 51143, "epoch": 616} {"train_loss": -19.906536102294922, "global_step": 51144, "epoch": 616} {"train_loss": -19.873247146606445, "global_step": 51145, "epoch": 616} {"train_loss": -20.185049057006836, "global_step": 51146, "epoch": 616} {"train_loss": -19.73115348815918, "global_step": 51147, "epoch": 616} {"train_loss": -20.14605712890625, "global_step": 51148, "epoch": 616} {"train_loss": -19.86966323852539, "global_step": 51149, "epoch": 616} {"train_loss": -20.075057983398438, "global_step": 51150, "epoch": 616} {"train_loss": -20.160497665405273, "global_step": 51151, "epoch": 616} {"train_loss": -20.09381675720215, "global_step": 51152, "epoch": 616} {"train_loss": -19.802820205688477, "global_step": 51153, "epoch": 616} {"train_loss": -19.953088760375977, "global_step": 51154, "epoch": 616} {"train_loss": -19.93389892578125, "global_step": 51155, "epoch": 616} {"train_loss": -19.869543075561523, "global_step": 51156, "epoch": 616} {"train_loss": -19.70331382751465, "global_step": 51157, "epoch": 616} {"train_loss": -20.03208351135254, "global_step": 51158, "epoch": 616} {"train_loss": -19.738197326660156, "global_step": 51159, "epoch": 616} {"train_loss": -20.09709358215332, "global_step": 51160, "epoch": 616} {"train_loss": -19.923431396484375, "global_step": 51161, "epoch": 616} {"train_loss": -19.91135025024414, "global_step": 51162, "epoch": 616} {"train_loss": -19.988727569580078, "global_step": 51163, "epoch": 616} {"train_loss": -19.670007705688477, "global_step": 51164, "epoch": 616} {"train_loss": -20.1884708404541, "global_step": 51165, "epoch": 616} {"train_loss": -19.896686553955078, "global_step": 51166, "epoch": 616} {"train_loss": -19.58375358581543, "global_step": 51167, "epoch": 616} {"train_loss": -19.961685180664062, "global_step": 51168, "epoch": 616} {"train_loss": -19.59153175354004, "global_step": 51169, "epoch": 616} {"train_loss": -20.0284423828125, "global_step": 51170, "epoch": 616} {"train_loss": -20.04817008972168, "global_step": 51171, "epoch": 616} {"train_loss": -20.06698989868164, "global_step": 51172, "epoch": 616} {"train_loss": -20.332324981689453, "global_step": 51173, "epoch": 616} {"train_loss": -20.108240127563477, "global_step": 51174, "epoch": 616} {"train_loss": -20.11300277709961, "global_step": 51175, "epoch": 616} {"train_loss": -19.81288719177246, "global_step": 51176, "epoch": 616} {"train_loss": -19.694616317749023, "global_step": 51177, "epoch": 616} {"train_loss": -19.70135498046875, "global_step": 51178, "epoch": 616} {"train_loss": -20.052297592163086, "global_step": 51179, "epoch": 616} {"train_loss": -19.72464942932129, "global_step": 51180, "epoch": 616} {"train_loss": -19.959991455078125, "global_step": 51181, "epoch": 616} {"train_loss": -19.88243865966797, "global_step": 51182, "epoch": 616} {"train_loss": -19.937959671020508, "global_step": 51183, "epoch": 616} {"train_loss": -19.799413681030273, "global_step": 51184, "epoch": 616} {"train_loss": -19.859283447265625, "global_step": 51185, "epoch": 616} {"train_loss": -20.09322166442871, "global_step": 51186, "epoch": 616} {"train_loss": -19.96906852722168, "global_step": 51187, "epoch": 616} {"train_loss": -19.746784210205078, "global_step": 51188, "epoch": 616} {"train_loss": -20.08233642578125, "global_step": 51189, "epoch": 616} {"train_loss": -19.71555519104004, "global_step": 51190, "epoch": 616} {"train_loss": -20.272140502929688, "global_step": 51191, "epoch": 616} {"train_loss": -20.293750762939453, "global_step": 51192, "epoch": 616} {"train_loss": -19.95663833618164, "global_step": 51193, "epoch": 616} {"train_loss": -19.934844970703125, "global_step": 51194, "epoch": 616} {"train_loss": -20.030698776245117, "global_step": 51195, "epoch": 616} {"train_loss": -20.24412727355957, "global_step": 51196, "epoch": 616} {"train_loss": -20.077390670776367, "global_step": 51197, "epoch": 616} {"train_loss": -19.96949005126953, "global_step": 51198, "epoch": 616} {"train_loss": -19.669708251953125, "global_step": 51199, "epoch": 616} {"train_loss": -19.92593765258789, "global_step": 51200, "epoch": 616} {"train_loss": -20.022933959960938, "global_step": 51201, "epoch": 616} {"train_loss": -19.889562606811523, "global_step": 51202, "epoch": 616} {"train_loss": -20.070472717285156, "global_step": 51203, "epoch": 616} {"train_loss": -20.06855010986328, "global_step": 51204, "epoch": 616} {"train_loss": -19.983793258666992, "global_step": 51205, "epoch": 616} {"train_loss": -20.105655670166016, "global_step": 51206, "epoch": 616} {"train_loss": -20.01472282409668, "global_step": 51207, "epoch": 616} {"train_loss": -20.121036529541016, "global_step": 51208, "epoch": 616} {"train_loss": -19.560440063476562, "global_step": 51209, "epoch": 616} {"train_loss": -19.930690811341066, "global_step": 51210, "epoch": 616, "val_loss": 6058058.5} {"train_loss": -19.758466720581055, "global_step": 51211, "epoch": 617} {"train_loss": -19.471853256225586, "global_step": 51212, "epoch": 617} {"train_loss": -19.697160720825195, "global_step": 51213, "epoch": 617} {"train_loss": -19.509937286376953, "global_step": 51214, "epoch": 617} {"train_loss": -19.61163902282715, "global_step": 51215, "epoch": 617} {"train_loss": -19.473615646362305, "global_step": 51216, "epoch": 617} {"train_loss": -19.862031936645508, "global_step": 51217, "epoch": 617} {"train_loss": -19.77107810974121, "global_step": 51218, "epoch": 617} {"train_loss": -19.8244571685791, "global_step": 51219, "epoch": 617} {"train_loss": -19.88262367248535, "global_step": 51220, "epoch": 617} {"train_loss": -19.66410255432129, "global_step": 51221, "epoch": 617} {"train_loss": -19.71932029724121, "global_step": 51222, "epoch": 617} {"train_loss": -20.038105010986328, "global_step": 51223, "epoch": 617} {"train_loss": -20.25661277770996, "global_step": 51224, "epoch": 617} {"train_loss": -19.811811447143555, "global_step": 51225, "epoch": 617} {"train_loss": -20.005542755126953, "global_step": 51226, "epoch": 617} {"train_loss": -19.955793380737305, "global_step": 51227, "epoch": 617} {"train_loss": -19.77131462097168, "global_step": 51228, "epoch": 617} {"train_loss": -19.907135009765625, "global_step": 51229, "epoch": 617} {"train_loss": -19.98993492126465, "global_step": 51230, "epoch": 617} {"train_loss": -19.91972541809082, "global_step": 51231, "epoch": 617} {"train_loss": -20.179471969604492, "global_step": 51232, "epoch": 617} {"train_loss": -20.439058303833008, "global_step": 51233, "epoch": 617} {"train_loss": -20.18842124938965, "global_step": 51234, "epoch": 617} {"train_loss": -19.800962448120117, "global_step": 51235, "epoch": 617} {"train_loss": -19.951322555541992, "global_step": 51236, "epoch": 617} {"train_loss": -19.939855575561523, "global_step": 51237, "epoch": 617} {"train_loss": -19.885217666625977, "global_step": 51238, "epoch": 617} {"train_loss": -20.075841903686523, "global_step": 51239, "epoch": 617} {"train_loss": -20.153095245361328, "global_step": 51240, "epoch": 617} {"train_loss": -19.891407012939453, "global_step": 51241, "epoch": 617} {"train_loss": -19.976669311523438, "global_step": 51242, "epoch": 617} {"train_loss": -20.113567352294922, "global_step": 51243, "epoch": 617} {"train_loss": -19.64272117614746, "global_step": 51244, "epoch": 617} {"train_loss": -19.923341751098633, "global_step": 51245, "epoch": 617} {"train_loss": -20.482097625732422, "global_step": 51246, "epoch": 617} {"train_loss": -19.765974044799805, "global_step": 51247, "epoch": 617} {"train_loss": -19.92945671081543, "global_step": 51248, "epoch": 617} {"train_loss": -20.04970359802246, "global_step": 51249, "epoch": 617} {"train_loss": -19.9847354888916, "global_step": 51250, "epoch": 617} {"train_loss": -20.138229370117188, "global_step": 51251, "epoch": 617} {"train_loss": -19.97948455810547, "global_step": 51252, "epoch": 617} {"train_loss": -20.38690185546875, "global_step": 51253, "epoch": 617} {"train_loss": -20.000064849853516, "global_step": 51254, "epoch": 617} {"train_loss": -19.825361251831055, "global_step": 51255, "epoch": 617} {"train_loss": -20.102588653564453, "global_step": 51256, "epoch": 617} {"train_loss": -19.994876861572266, "global_step": 51257, "epoch": 617} {"train_loss": -20.233694076538086, "global_step": 51258, "epoch": 617} {"train_loss": -20.123764038085938, "global_step": 51259, "epoch": 617} {"train_loss": -20.171506881713867, "global_step": 51260, "epoch": 617} {"train_loss": -19.99704933166504, "global_step": 51261, "epoch": 617} {"train_loss": -19.616621017456055, "global_step": 51262, "epoch": 617} {"train_loss": -20.066253662109375, "global_step": 51263, "epoch": 617} {"train_loss": -20.214468002319336, "global_step": 51264, "epoch": 617} {"train_loss": -20.2547607421875, "global_step": 51265, "epoch": 617} {"train_loss": -19.5761661529541, "global_step": 51266, "epoch": 617} {"train_loss": -20.321714401245117, "global_step": 51267, "epoch": 617} {"train_loss": -19.959684371948242, "global_step": 51268, "epoch": 617} {"train_loss": -20.12575340270996, "global_step": 51269, "epoch": 617} {"train_loss": -19.960790634155273, "global_step": 51270, "epoch": 617} {"train_loss": -19.824403762817383, "global_step": 51271, "epoch": 617} {"train_loss": -20.053266525268555, "global_step": 51272, "epoch": 617} {"train_loss": -19.92250633239746, "global_step": 51273, "epoch": 617} {"train_loss": -19.798364639282227, "global_step": 51274, "epoch": 617} {"train_loss": -19.827848434448242, "global_step": 51275, "epoch": 617} {"train_loss": -19.87375259399414, "global_step": 51276, "epoch": 617} {"train_loss": -19.796871185302734, "global_step": 51277, "epoch": 617} {"train_loss": -20.223073959350586, "global_step": 51278, "epoch": 617} {"train_loss": -19.946630477905273, "global_step": 51279, "epoch": 617} {"train_loss": -20.25360679626465, "global_step": 51280, "epoch": 617} {"train_loss": -19.754776000976562, "global_step": 51281, "epoch": 617} {"train_loss": -19.7059268951416, "global_step": 51282, "epoch": 617} {"train_loss": -19.941434860229492, "global_step": 51283, "epoch": 617} {"train_loss": -19.840505599975586, "global_step": 51284, "epoch": 617} {"train_loss": -19.892597198486328, "global_step": 51285, "epoch": 617} {"train_loss": -20.149240493774414, "global_step": 51286, "epoch": 617} {"train_loss": -20.2471981048584, "global_step": 51287, "epoch": 617} {"train_loss": -20.019031524658203, "global_step": 51288, "epoch": 617} {"train_loss": -19.892995834350586, "global_step": 51289, "epoch": 617} {"train_loss": -20.217832565307617, "global_step": 51290, "epoch": 617} {"train_loss": -20.04478645324707, "global_step": 51291, "epoch": 617} {"train_loss": -20.46051597595215, "global_step": 51292, "epoch": 617} {"train_loss": -19.96099221562765, "global_step": 51293, "epoch": 617, "val_loss": 6089989.5} {"train_loss": -19.70613670349121, "global_step": 51294, "epoch": 618} {"train_loss": -19.966106414794922, "global_step": 51295, "epoch": 618} {"train_loss": -19.57309913635254, "global_step": 51296, "epoch": 618} {"train_loss": -19.823518753051758, "global_step": 51297, "epoch": 618} {"train_loss": -19.515066146850586, "global_step": 51298, "epoch": 618} {"train_loss": -19.778797149658203, "global_step": 51299, "epoch": 618} {"train_loss": -20.11286735534668, "global_step": 51300, "epoch": 618} {"train_loss": -20.03675651550293, "global_step": 51301, "epoch": 618} {"train_loss": -19.44479751586914, "global_step": 51302, "epoch": 618} {"train_loss": -20.189395904541016, "global_step": 51303, "epoch": 618} {"train_loss": -20.05023765563965, "global_step": 51304, "epoch": 618} {"train_loss": -20.03763198852539, "global_step": 51305, "epoch": 618} {"train_loss": -19.72890281677246, "global_step": 51306, "epoch": 618} {"train_loss": -20.262975692749023, "global_step": 51307, "epoch": 618} {"train_loss": -19.561477661132812, "global_step": 51308, "epoch": 618} {"train_loss": -19.678848266601562, "global_step": 51309, "epoch": 618} {"train_loss": -19.990270614624023, "global_step": 51310, "epoch": 618} {"train_loss": -19.788854598999023, "global_step": 51311, "epoch": 618} {"train_loss": -20.001985549926758, "global_step": 51312, "epoch": 618} {"train_loss": -19.834875106811523, "global_step": 51313, "epoch": 618} {"train_loss": -19.866117477416992, "global_step": 51314, "epoch": 618} {"train_loss": -19.616907119750977, "global_step": 51315, "epoch": 618} {"train_loss": -20.01036262512207, "global_step": 51316, "epoch": 618} {"train_loss": -20.04832649230957, "global_step": 51317, "epoch": 618} {"train_loss": -19.945892333984375, "global_step": 51318, "epoch": 618} {"train_loss": -20.026296615600586, "global_step": 51319, "epoch": 618} {"train_loss": -19.890668869018555, "global_step": 51320, "epoch": 618} {"train_loss": -19.914396286010742, "global_step": 51321, "epoch": 618} {"train_loss": -20.059497833251953, "global_step": 51322, "epoch": 618} {"train_loss": -19.712139129638672, "global_step": 51323, "epoch": 618} {"train_loss": -19.685375213623047, "global_step": 51324, "epoch": 618} {"train_loss": -20.215627670288086, "global_step": 51325, "epoch": 618} {"train_loss": -20.144399642944336, "global_step": 51326, "epoch": 618} {"train_loss": -20.23318862915039, "global_step": 51327, "epoch": 618} {"train_loss": -19.796634674072266, "global_step": 51328, "epoch": 618} {"train_loss": -20.065664291381836, "global_step": 51329, "epoch": 618} {"train_loss": -19.9681453704834, "global_step": 51330, "epoch": 618} {"train_loss": -19.64995765686035, "global_step": 51331, "epoch": 618} {"train_loss": -20.17223358154297, "global_step": 51332, "epoch": 618} {"train_loss": -19.915952682495117, "global_step": 51333, "epoch": 618} {"train_loss": -19.957902908325195, "global_step": 51334, "epoch": 618} {"train_loss": -20.122711181640625, "global_step": 51335, "epoch": 618} {"train_loss": -20.123563766479492, "global_step": 51336, "epoch": 618} {"train_loss": -20.077848434448242, "global_step": 51337, "epoch": 618} {"train_loss": -19.859128952026367, "global_step": 51338, "epoch": 618} {"train_loss": -19.87566375732422, "global_step": 51339, "epoch": 618} {"train_loss": -20.13251495361328, "global_step": 51340, "epoch": 618} {"train_loss": -20.31937026977539, "global_step": 51341, "epoch": 618} {"train_loss": -20.088926315307617, "global_step": 51342, "epoch": 618} {"train_loss": -20.335813522338867, "global_step": 51343, "epoch": 618} {"train_loss": -19.836183547973633, "global_step": 51344, "epoch": 618} {"train_loss": -19.832693099975586, "global_step": 51345, "epoch": 618} {"train_loss": -20.21048355102539, "global_step": 51346, "epoch": 618} {"train_loss": -20.00424575805664, "global_step": 51347, "epoch": 618} {"train_loss": -20.19134521484375, "global_step": 51348, "epoch": 618} {"train_loss": -20.213855743408203, "global_step": 51349, "epoch": 618} {"train_loss": -19.992326736450195, "global_step": 51350, "epoch": 618} {"train_loss": -19.667478561401367, "global_step": 51351, "epoch": 618} {"train_loss": -19.8873348236084, "global_step": 51352, "epoch": 618} {"train_loss": -20.463441848754883, "global_step": 51353, "epoch": 618} {"train_loss": -19.91687774658203, "global_step": 51354, "epoch": 618} {"train_loss": -20.291845321655273, "global_step": 51355, "epoch": 618} {"train_loss": -20.251279830932617, "global_step": 51356, "epoch": 618} {"train_loss": -20.158864974975586, "global_step": 51357, "epoch": 618} {"train_loss": -19.872838973999023, "global_step": 51358, "epoch": 618} {"train_loss": -19.712148666381836, "global_step": 51359, "epoch": 618} {"train_loss": -20.226627349853516, "global_step": 51360, "epoch": 618} {"train_loss": -20.03326988220215, "global_step": 51361, "epoch": 618} {"train_loss": -20.17881202697754, "global_step": 51362, "epoch": 618} {"train_loss": -20.12244987487793, "global_step": 51363, "epoch": 618} {"train_loss": -20.176572799682617, "global_step": 51364, "epoch": 618} {"train_loss": -20.312007904052734, "global_step": 51365, "epoch": 618} {"train_loss": -20.127700805664062, "global_step": 51366, "epoch": 618} {"train_loss": -19.80002212524414, "global_step": 51367, "epoch": 618} {"train_loss": -19.85127067565918, "global_step": 51368, "epoch": 618} {"train_loss": -20.222623825073242, "global_step": 51369, "epoch": 618} {"train_loss": -20.484033584594727, "global_step": 51370, "epoch": 618} {"train_loss": -19.996932983398438, "global_step": 51371, "epoch": 618} {"train_loss": -19.937803268432617, "global_step": 51372, "epoch": 618} {"train_loss": -20.21998405456543, "global_step": 51373, "epoch": 618} {"train_loss": -19.659912109375, "global_step": 51374, "epoch": 618} {"train_loss": -20.19880485534668, "global_step": 51375, "epoch": 618} {"train_loss": -19.98954023797828, "global_step": 51376, "epoch": 618, "val_loss": 6006606.0} {"train_loss": -19.55603790283203, "global_step": 51377, "epoch": 619} {"train_loss": -20.15838050842285, "global_step": 51378, "epoch": 619} {"train_loss": -19.679039001464844, "global_step": 51379, "epoch": 619} {"train_loss": -19.93203353881836, "global_step": 51380, "epoch": 619} {"train_loss": -19.49959373474121, "global_step": 51381, "epoch": 619} {"train_loss": -19.98530387878418, "global_step": 51382, "epoch": 619} {"train_loss": -19.794437408447266, "global_step": 51383, "epoch": 619} {"train_loss": -19.881973266601562, "global_step": 51384, "epoch": 619} {"train_loss": -19.809926986694336, "global_step": 51385, "epoch": 619} {"train_loss": -20.06574821472168, "global_step": 51386, "epoch": 619} {"train_loss": -20.036226272583008, "global_step": 51387, "epoch": 619} {"train_loss": -20.00955581665039, "global_step": 51388, "epoch": 619} {"train_loss": -19.947885513305664, "global_step": 51389, "epoch": 619} {"train_loss": -19.855741500854492, "global_step": 51390, "epoch": 619} {"train_loss": -20.2188777923584, "global_step": 51391, "epoch": 619} {"train_loss": -20.001428604125977, "global_step": 51392, "epoch": 619} {"train_loss": -19.823137283325195, "global_step": 51393, "epoch": 619} {"train_loss": -19.785114288330078, "global_step": 51394, "epoch": 619} {"train_loss": -20.188568115234375, "global_step": 51395, "epoch": 619} {"train_loss": -20.198841094970703, "global_step": 51396, "epoch": 619} {"train_loss": -20.226560592651367, "global_step": 51397, "epoch": 619} {"train_loss": -19.96826171875, "global_step": 51398, "epoch": 619} {"train_loss": -20.239948272705078, "global_step": 51399, "epoch": 619} {"train_loss": -20.298513412475586, "global_step": 51400, "epoch": 619} {"train_loss": -19.989089965820312, "global_step": 51401, "epoch": 619} {"train_loss": -20.002187728881836, "global_step": 51402, "epoch": 619} {"train_loss": -19.71925926208496, "global_step": 51403, "epoch": 619} {"train_loss": -20.224557876586914, "global_step": 51404, "epoch": 619} {"train_loss": -20.023788452148438, "global_step": 51405, "epoch": 619} {"train_loss": -19.937759399414062, "global_step": 51406, "epoch": 619} {"train_loss": -19.9199275970459, "global_step": 51407, "epoch": 619} {"train_loss": -19.68378257751465, "global_step": 51408, "epoch": 619} {"train_loss": -20.289785385131836, "global_step": 51409, "epoch": 619} {"train_loss": -20.014814376831055, "global_step": 51410, "epoch": 619} {"train_loss": -20.14154815673828, "global_step": 51411, "epoch": 619} {"train_loss": -20.1079158782959, "global_step": 51412, "epoch": 619} {"train_loss": -19.782093048095703, "global_step": 51413, "epoch": 619} {"train_loss": -19.913244247436523, "global_step": 51414, "epoch": 619} {"train_loss": -19.885339736938477, "global_step": 51415, "epoch": 619} {"train_loss": -20.10927391052246, "global_step": 51416, "epoch": 619} {"train_loss": -19.778024673461914, "global_step": 51417, "epoch": 619} {"train_loss": -19.924589157104492, "global_step": 51418, "epoch": 619} {"train_loss": -19.76051139831543, "global_step": 51419, "epoch": 619} {"train_loss": -20.142057418823242, "global_step": 51420, "epoch": 619} {"train_loss": -19.718719482421875, "global_step": 51421, "epoch": 619} {"train_loss": -19.826141357421875, "global_step": 51422, "epoch": 619} {"train_loss": -20.398752212524414, "global_step": 51423, "epoch": 619} {"train_loss": -20.439157485961914, "global_step": 51424, "epoch": 619} {"train_loss": -20.174354553222656, "global_step": 51425, "epoch": 619} {"train_loss": -20.18010139465332, "global_step": 51426, "epoch": 619} {"train_loss": -19.61772346496582, "global_step": 51427, "epoch": 619} {"train_loss": -20.385149002075195, "global_step": 51428, "epoch": 619} {"train_loss": -20.63504409790039, "global_step": 51429, "epoch": 619} {"train_loss": -20.08536148071289, "global_step": 51430, "epoch": 619} {"train_loss": -19.961509704589844, "global_step": 51431, "epoch": 619} {"train_loss": -20.015226364135742, "global_step": 51432, "epoch": 619} {"train_loss": -20.098478317260742, "global_step": 51433, "epoch": 619} {"train_loss": -19.71633529663086, "global_step": 51434, "epoch": 619} {"train_loss": -20.29825210571289, "global_step": 51435, "epoch": 619} {"train_loss": -20.109670639038086, "global_step": 51436, "epoch": 619} {"train_loss": -19.9020938873291, "global_step": 51437, "epoch": 619} {"train_loss": -19.809677124023438, "global_step": 51438, "epoch": 619} {"train_loss": -20.253389358520508, "global_step": 51439, "epoch": 619} {"train_loss": -19.878454208374023, "global_step": 51440, "epoch": 619} {"train_loss": -20.225976943969727, "global_step": 51441, "epoch": 619} {"train_loss": -20.122203826904297, "global_step": 51442, "epoch": 619} {"train_loss": -20.110937118530273, "global_step": 51443, "epoch": 619} {"train_loss": -19.861257553100586, "global_step": 51444, "epoch": 619} {"train_loss": -19.86017417907715, "global_step": 51445, "epoch": 619} {"train_loss": -20.01909828186035, "global_step": 51446, "epoch": 619} {"train_loss": -19.863943099975586, "global_step": 51447, "epoch": 619} {"train_loss": -19.8342227935791, "global_step": 51448, "epoch": 619} {"train_loss": -20.121137619018555, "global_step": 51449, "epoch": 619} {"train_loss": -19.93799591064453, "global_step": 51450, "epoch": 619} {"train_loss": -20.18058204650879, "global_step": 51451, "epoch": 619} {"train_loss": -19.583003997802734, "global_step": 51452, "epoch": 619} {"train_loss": -19.788511276245117, "global_step": 51453, "epoch": 619} {"train_loss": -20.116989135742188, "global_step": 51454, "epoch": 619} {"train_loss": -20.241918563842773, "global_step": 51455, "epoch": 619} {"train_loss": -20.151504516601562, "global_step": 51456, "epoch": 619} {"train_loss": -20.26823616027832, "global_step": 51457, "epoch": 619} {"train_loss": -20.117307662963867, "global_step": 51458, "epoch": 619} {"train_loss": -20.0081729659115, "global_step": 51459, "epoch": 619, "val_loss": 5927762.0} {"train_loss": -19.679115295410156, "global_step": 51460, "epoch": 620} {"train_loss": -19.83791160583496, "global_step": 51461, "epoch": 620} {"train_loss": -19.63688087463379, "global_step": 51462, "epoch": 620} {"train_loss": -19.713560104370117, "global_step": 51463, "epoch": 620} {"train_loss": -19.73470115661621, "global_step": 51464, "epoch": 620} {"train_loss": -19.81708335876465, "global_step": 51465, "epoch": 620} {"train_loss": -20.043190002441406, "global_step": 51466, "epoch": 620} {"train_loss": -19.9079647064209, "global_step": 51467, "epoch": 620} {"train_loss": -20.28008460998535, "global_step": 51468, "epoch": 620} {"train_loss": -20.251235961914062, "global_step": 51469, "epoch": 620} {"train_loss": -19.78803062438965, "global_step": 51470, "epoch": 620} {"train_loss": -20.274600982666016, "global_step": 51471, "epoch": 620} {"train_loss": -20.214841842651367, "global_step": 51472, "epoch": 620} {"train_loss": -19.91641616821289, "global_step": 51473, "epoch": 620} {"train_loss": -20.027175903320312, "global_step": 51474, "epoch": 620} {"train_loss": -19.87529754638672, "global_step": 51475, "epoch": 620} {"train_loss": -20.3084774017334, "global_step": 51476, "epoch": 620} {"train_loss": -20.418947219848633, "global_step": 51477, "epoch": 620} {"train_loss": -20.083852767944336, "global_step": 51478, "epoch": 620} {"train_loss": -19.7775936126709, "global_step": 51479, "epoch": 620} {"train_loss": -20.566612243652344, "global_step": 51480, "epoch": 620} {"train_loss": -20.233118057250977, "global_step": 51481, "epoch": 620} {"train_loss": -20.04875373840332, "global_step": 51482, "epoch": 620} {"train_loss": -19.984561920166016, "global_step": 51483, "epoch": 620} {"train_loss": -20.199644088745117, "global_step": 51484, "epoch": 620} {"train_loss": -19.983749389648438, "global_step": 51485, "epoch": 620} {"train_loss": -19.948558807373047, "global_step": 51486, "epoch": 620} {"train_loss": -19.887943267822266, "global_step": 51487, "epoch": 620} {"train_loss": -19.932231903076172, "global_step": 51488, "epoch": 620} {"train_loss": -19.83930778503418, "global_step": 51489, "epoch": 620} {"train_loss": -20.002405166625977, "global_step": 51490, "epoch": 620} {"train_loss": -19.8657283782959, "global_step": 51491, "epoch": 620} {"train_loss": -19.775453567504883, "global_step": 51492, "epoch": 620} {"train_loss": -20.204267501831055, "global_step": 51493, "epoch": 620} {"train_loss": -20.38215446472168, "global_step": 51494, "epoch": 620} {"train_loss": -19.83599853515625, "global_step": 51495, "epoch": 620} {"train_loss": -20.10080909729004, "global_step": 51496, "epoch": 620} {"train_loss": -20.12872314453125, "global_step": 51497, "epoch": 620} {"train_loss": -19.699609756469727, "global_step": 51498, "epoch": 620} {"train_loss": -20.09187126159668, "global_step": 51499, "epoch": 620} {"train_loss": -20.076025009155273, "global_step": 51500, "epoch": 620} {"train_loss": -19.81766700744629, "global_step": 51501, "epoch": 620} {"train_loss": -19.69938087463379, "global_step": 51502, "epoch": 620} {"train_loss": -20.16998291015625, "global_step": 51503, "epoch": 620} {"train_loss": -20.15186309814453, "global_step": 51504, "epoch": 620} {"train_loss": -20.03781509399414, "global_step": 51505, "epoch": 620} {"train_loss": -19.924835205078125, "global_step": 51506, "epoch": 620} {"train_loss": -19.82183265686035, "global_step": 51507, "epoch": 620} {"train_loss": -19.909507751464844, "global_step": 51508, "epoch": 620} {"train_loss": -20.008703231811523, "global_step": 51509, "epoch": 620} {"train_loss": -20.04859161376953, "global_step": 51510, "epoch": 620} {"train_loss": -20.23004913330078, "global_step": 51511, "epoch": 620} {"train_loss": -19.732372283935547, "global_step": 51512, "epoch": 620} {"train_loss": -20.108224868774414, "global_step": 51513, "epoch": 620} {"train_loss": -20.27143669128418, "global_step": 51514, "epoch": 620} {"train_loss": -20.249591827392578, "global_step": 51515, "epoch": 620} {"train_loss": -19.86984634399414, "global_step": 51516, "epoch": 620} {"train_loss": -19.901500701904297, "global_step": 51517, "epoch": 620} {"train_loss": -20.12860107421875, "global_step": 51518, "epoch": 620} {"train_loss": -20.10161781311035, "global_step": 51519, "epoch": 620} {"train_loss": -20.13167381286621, "global_step": 51520, "epoch": 620} {"train_loss": -19.832351684570312, "global_step": 51521, "epoch": 620} {"train_loss": -20.061756134033203, "global_step": 51522, "epoch": 620} {"train_loss": -19.97664451599121, "global_step": 51523, "epoch": 620} {"train_loss": -20.036718368530273, "global_step": 51524, "epoch": 620} {"train_loss": -19.8632869720459, "global_step": 51525, "epoch": 620} {"train_loss": -19.95747184753418, "global_step": 51526, "epoch": 620} {"train_loss": -20.241230010986328, "global_step": 51527, "epoch": 620} {"train_loss": -20.509904861450195, "global_step": 51528, "epoch": 620} {"train_loss": -20.10959243774414, "global_step": 51529, "epoch": 620} {"train_loss": -20.005849838256836, "global_step": 51530, "epoch": 620} {"train_loss": -20.073196411132812, "global_step": 51531, "epoch": 620} {"train_loss": -19.83940315246582, "global_step": 51532, "epoch": 620} {"train_loss": -19.863677978515625, "global_step": 51533, "epoch": 620} {"train_loss": -20.08831214904785, "global_step": 51534, "epoch": 620} {"train_loss": -20.099695205688477, "global_step": 51535, "epoch": 620} {"train_loss": -19.84474754333496, "global_step": 51536, "epoch": 620} {"train_loss": -19.8182373046875, "global_step": 51537, "epoch": 620} {"train_loss": -19.866662979125977, "global_step": 51538, "epoch": 620} {"train_loss": -19.831716537475586, "global_step": 51539, "epoch": 620} {"train_loss": -19.906705856323242, "global_step": 51540, "epoch": 620} {"train_loss": -19.9666748046875, "global_step": 51541, "epoch": 620} {"train_loss": -19.999171911952008, "global_step": 51542, "epoch": 620, "val_loss": 6116754.0} {"train_loss": -19.092050552368164, "global_step": 51543, "epoch": 621} {"train_loss": -19.75335693359375, "global_step": 51544, "epoch": 621} {"train_loss": -19.71651268005371, "global_step": 51545, "epoch": 621} {"train_loss": -19.870603561401367, "global_step": 51546, "epoch": 621} {"train_loss": -19.728809356689453, "global_step": 51547, "epoch": 621} {"train_loss": -19.83234977722168, "global_step": 51548, "epoch": 621} {"train_loss": -19.53787612915039, "global_step": 51549, "epoch": 621} {"train_loss": -19.913206100463867, "global_step": 51550, "epoch": 621} {"train_loss": -19.680601119995117, "global_step": 51551, "epoch": 621} {"train_loss": -20.085927963256836, "global_step": 51552, "epoch": 621} {"train_loss": -20.17713737487793, "global_step": 51553, "epoch": 621} {"train_loss": -19.73189353942871, "global_step": 51554, "epoch": 621} {"train_loss": -20.125507354736328, "global_step": 51555, "epoch": 621} {"train_loss": -19.70828628540039, "global_step": 51556, "epoch": 621} {"train_loss": -19.668962478637695, "global_step": 51557, "epoch": 621} {"train_loss": -20.010189056396484, "global_step": 51558, "epoch": 621} {"train_loss": -19.831388473510742, "global_step": 51559, "epoch": 621} {"train_loss": -19.601728439331055, "global_step": 51560, "epoch": 621} {"train_loss": -19.926868438720703, "global_step": 51561, "epoch": 621} {"train_loss": -20.31308364868164, "global_step": 51562, "epoch": 621} {"train_loss": -19.798749923706055, "global_step": 51563, "epoch": 621} {"train_loss": -19.902563095092773, "global_step": 51564, "epoch": 621} {"train_loss": -19.886926651000977, "global_step": 51565, "epoch": 621} {"train_loss": -20.22171974182129, "global_step": 51566, "epoch": 621} {"train_loss": -19.702062606811523, "global_step": 51567, "epoch": 621} {"train_loss": -19.782028198242188, "global_step": 51568, "epoch": 621} {"train_loss": -20.41818618774414, "global_step": 51569, "epoch": 621} {"train_loss": -20.267385482788086, "global_step": 51570, "epoch": 621} {"train_loss": -20.086347579956055, "global_step": 51571, "epoch": 621} {"train_loss": -19.91729164123535, "global_step": 51572, "epoch": 621} {"train_loss": -19.871414184570312, "global_step": 51573, "epoch": 621} {"train_loss": -19.881683349609375, "global_step": 51574, "epoch": 621} {"train_loss": -20.171585083007812, "global_step": 51575, "epoch": 621} {"train_loss": -20.20856285095215, "global_step": 51576, "epoch": 621} {"train_loss": -19.923215866088867, "global_step": 51577, "epoch": 621} {"train_loss": -19.801555633544922, "global_step": 51578, "epoch": 621} {"train_loss": -20.270986557006836, "global_step": 51579, "epoch": 621} {"train_loss": -20.13426971435547, "global_step": 51580, "epoch": 621} {"train_loss": -19.740808486938477, "global_step": 51581, "epoch": 621} {"train_loss": -19.80427360534668, "global_step": 51582, "epoch": 621} {"train_loss": -20.191381454467773, "global_step": 51583, "epoch": 621} {"train_loss": -20.076007843017578, "global_step": 51584, "epoch": 621} {"train_loss": -19.933719635009766, "global_step": 51585, "epoch": 621} {"train_loss": -20.03843116760254, "global_step": 51586, "epoch": 621} {"train_loss": -19.8363094329834, "global_step": 51587, "epoch": 621} {"train_loss": -20.005512237548828, "global_step": 51588, "epoch": 621} {"train_loss": -20.340673446655273, "global_step": 51589, "epoch": 621} {"train_loss": -19.949844360351562, "global_step": 51590, "epoch": 621} {"train_loss": -19.96518325805664, "global_step": 51591, "epoch": 621} {"train_loss": -19.651674270629883, "global_step": 51592, "epoch": 621} {"train_loss": -19.896530151367188, "global_step": 51593, "epoch": 621} {"train_loss": -19.84223747253418, "global_step": 51594, "epoch": 621} {"train_loss": -20.11037254333496, "global_step": 51595, "epoch": 621} {"train_loss": -19.991971969604492, "global_step": 51596, "epoch": 621} {"train_loss": -20.09673500061035, "global_step": 51597, "epoch": 621} {"train_loss": -20.197620391845703, "global_step": 51598, "epoch": 621} {"train_loss": -20.023635864257812, "global_step": 51599, "epoch": 621} {"train_loss": -19.652332305908203, "global_step": 51600, "epoch": 621} {"train_loss": -20.256614685058594, "global_step": 51601, "epoch": 621} {"train_loss": -19.799991607666016, "global_step": 51602, "epoch": 621} {"train_loss": -20.059900283813477, "global_step": 51603, "epoch": 621} {"train_loss": -19.238378524780273, "global_step": 51604, "epoch": 621} {"train_loss": -20.17934226989746, "global_step": 51605, "epoch": 621} {"train_loss": -20.26173210144043, "global_step": 51606, "epoch": 621} {"train_loss": -19.51564598083496, "global_step": 51607, "epoch": 621} {"train_loss": -19.900646209716797, "global_step": 51608, "epoch": 621} {"train_loss": -19.82875633239746, "global_step": 51609, "epoch": 621} {"train_loss": -20.23859977722168, "global_step": 51610, "epoch": 621} {"train_loss": -20.393545150756836, "global_step": 51611, "epoch": 621} {"train_loss": -20.039356231689453, "global_step": 51612, "epoch": 621} {"train_loss": -19.89235496520996, "global_step": 51613, "epoch": 621} {"train_loss": -19.88775634765625, "global_step": 51614, "epoch": 621} {"train_loss": -20.0351619720459, "global_step": 51615, "epoch": 621} {"train_loss": -19.86530876159668, "global_step": 51616, "epoch": 621} {"train_loss": -19.839345932006836, "global_step": 51617, "epoch": 621} {"train_loss": -20.37122917175293, "global_step": 51618, "epoch": 621} {"train_loss": -20.013595581054688, "global_step": 51619, "epoch": 621} {"train_loss": -20.246719360351562, "global_step": 51620, "epoch": 621} {"train_loss": -19.948104858398438, "global_step": 51621, "epoch": 621} {"train_loss": -19.651508331298828, "global_step": 51622, "epoch": 621} {"train_loss": -20.04261589050293, "global_step": 51623, "epoch": 621} {"train_loss": -20.153438568115234, "global_step": 51624, "epoch": 621} {"train_loss": -19.949799342327807, "global_step": 51625, "epoch": 621, "val_loss": 6065117.5} {"train_loss": -19.89748191833496, "global_step": 51626, "epoch": 622} {"train_loss": -20.266149520874023, "global_step": 51627, "epoch": 622} {"train_loss": -19.32398796081543, "global_step": 51628, "epoch": 622} {"train_loss": -19.585508346557617, "global_step": 51629, "epoch": 622} {"train_loss": -20.00678253173828, "global_step": 51630, "epoch": 622} {"train_loss": -19.329965591430664, "global_step": 51631, "epoch": 622} {"train_loss": -20.15114974975586, "global_step": 51632, "epoch": 622} {"train_loss": -19.628849029541016, "global_step": 51633, "epoch": 622} {"train_loss": -19.8598690032959, "global_step": 51634, "epoch": 622} {"train_loss": -19.814712524414062, "global_step": 51635, "epoch": 622} {"train_loss": -20.074583053588867, "global_step": 51636, "epoch": 622} {"train_loss": -19.727497100830078, "global_step": 51637, "epoch": 622} {"train_loss": -19.785036087036133, "global_step": 51638, "epoch": 622} {"train_loss": -20.09100914001465, "global_step": 51639, "epoch": 622} {"train_loss": -19.689149856567383, "global_step": 51640, "epoch": 622} {"train_loss": -20.03666114807129, "global_step": 51641, "epoch": 622} {"train_loss": -20.150503158569336, "global_step": 51642, "epoch": 622} {"train_loss": -20.118440628051758, "global_step": 51643, "epoch": 622} {"train_loss": -19.902414321899414, "global_step": 51644, "epoch": 622} {"train_loss": -19.92882537841797, "global_step": 51645, "epoch": 622} {"train_loss": -19.872953414916992, "global_step": 51646, "epoch": 622} {"train_loss": -20.00016212463379, "global_step": 51647, "epoch": 622} {"train_loss": -19.713214874267578, "global_step": 51648, "epoch": 622} {"train_loss": -19.749408721923828, "global_step": 51649, "epoch": 622} {"train_loss": -20.150012969970703, "global_step": 51650, "epoch": 622} {"train_loss": -20.086929321289062, "global_step": 51651, "epoch": 622} {"train_loss": -20.107053756713867, "global_step": 51652, "epoch": 622} {"train_loss": -20.002798080444336, "global_step": 51653, "epoch": 622} {"train_loss": -19.96291160583496, "global_step": 51654, "epoch": 622} {"train_loss": -19.75957679748535, "global_step": 51655, "epoch": 622} {"train_loss": -20.384214401245117, "global_step": 51656, "epoch": 622} {"train_loss": -20.00501823425293, "global_step": 51657, "epoch": 622} {"train_loss": -19.67024040222168, "global_step": 51658, "epoch": 622} {"train_loss": -20.109325408935547, "global_step": 51659, "epoch": 622} {"train_loss": -20.113859176635742, "global_step": 51660, "epoch": 622} {"train_loss": -19.685583114624023, "global_step": 51661, "epoch": 622} {"train_loss": -20.148162841796875, "global_step": 51662, "epoch": 622} {"train_loss": -19.66572380065918, "global_step": 51663, "epoch": 622} {"train_loss": -19.799270629882812, "global_step": 51664, "epoch": 622} {"train_loss": -20.288660049438477, "global_step": 51665, "epoch": 622} {"train_loss": -19.716388702392578, "global_step": 51666, "epoch": 622} {"train_loss": -20.204782485961914, "global_step": 51667, "epoch": 622} {"train_loss": -19.61524772644043, "global_step": 51668, "epoch": 622} {"train_loss": -20.239877700805664, "global_step": 51669, "epoch": 622} {"train_loss": -20.033430099487305, "global_step": 51670, "epoch": 622} {"train_loss": -19.922374725341797, "global_step": 51671, "epoch": 622} {"train_loss": -20.376306533813477, "global_step": 51672, "epoch": 622} {"train_loss": -19.883499145507812, "global_step": 51673, "epoch": 622} {"train_loss": -20.022031784057617, "global_step": 51674, "epoch": 622} {"train_loss": -19.989032745361328, "global_step": 51675, "epoch": 622} {"train_loss": -20.26549530029297, "global_step": 51676, "epoch": 622} {"train_loss": -19.67116355895996, "global_step": 51677, "epoch": 622} {"train_loss": -19.92606544494629, "global_step": 51678, "epoch": 622} {"train_loss": -19.954416275024414, "global_step": 51679, "epoch": 622} {"train_loss": -20.00437355041504, "global_step": 51680, "epoch": 622} {"train_loss": -20.004932403564453, "global_step": 51681, "epoch": 622} {"train_loss": -20.17939567565918, "global_step": 51682, "epoch": 622} {"train_loss": -20.378267288208008, "global_step": 51683, "epoch": 622} {"train_loss": -20.069501876831055, "global_step": 51684, "epoch": 622} {"train_loss": -19.963953018188477, "global_step": 51685, "epoch": 622} {"train_loss": -19.97287940979004, "global_step": 51686, "epoch": 622} {"train_loss": -19.86269187927246, "global_step": 51687, "epoch": 622} {"train_loss": -20.20462417602539, "global_step": 51688, "epoch": 622} {"train_loss": -20.316308975219727, "global_step": 51689, "epoch": 622} {"train_loss": -19.88522720336914, "global_step": 51690, "epoch": 622} {"train_loss": -20.230239868164062, "global_step": 51691, "epoch": 622} {"train_loss": -20.323434829711914, "global_step": 51692, "epoch": 622} {"train_loss": -19.72146987915039, "global_step": 51693, "epoch": 622} {"train_loss": -19.869211196899414, "global_step": 51694, "epoch": 622} {"train_loss": -19.899152755737305, "global_step": 51695, "epoch": 622} {"train_loss": -20.084514617919922, "global_step": 51696, "epoch": 622} {"train_loss": -20.243839263916016, "global_step": 51697, "epoch": 622} {"train_loss": -19.79884910583496, "global_step": 51698, "epoch": 622} {"train_loss": -19.944974899291992, "global_step": 51699, "epoch": 622} {"train_loss": -19.586050033569336, "global_step": 51700, "epoch": 622} {"train_loss": -19.859033584594727, "global_step": 51701, "epoch": 622} {"train_loss": -19.972930908203125, "global_step": 51702, "epoch": 622} {"train_loss": -20.06936264038086, "global_step": 51703, "epoch": 622} {"train_loss": -19.960655212402344, "global_step": 51704, "epoch": 622} {"train_loss": -20.04099464416504, "global_step": 51705, "epoch": 622} {"train_loss": -20.001108169555664, "global_step": 51706, "epoch": 622} {"train_loss": -20.15584373474121, "global_step": 51707, "epoch": 622} {"train_loss": -19.967796325683594, "global_step": 51708, "epoch": 622, "val_loss": 5996206.0} {"train_loss": -19.541139602661133, "global_step": 51709, "epoch": 623} {"train_loss": -19.813505172729492, "global_step": 51710, "epoch": 623} {"train_loss": -19.32057762145996, "global_step": 51711, "epoch": 623} {"train_loss": -20.0504207611084, "global_step": 51712, "epoch": 623} {"train_loss": -19.351224899291992, "global_step": 51713, "epoch": 623} {"train_loss": -19.726627349853516, "global_step": 51714, "epoch": 623} {"train_loss": -19.305299758911133, "global_step": 51715, "epoch": 623} {"train_loss": -19.8017520904541, "global_step": 51716, "epoch": 623} {"train_loss": -19.248788833618164, "global_step": 51717, "epoch": 623} {"train_loss": -19.1644287109375, "global_step": 51718, "epoch": 623} {"train_loss": -19.569774627685547, "global_step": 51719, "epoch": 623} {"train_loss": -19.764989852905273, "global_step": 51720, "epoch": 623} {"train_loss": -19.626569747924805, "global_step": 51721, "epoch": 623} {"train_loss": -19.70395851135254, "global_step": 51722, "epoch": 623} {"train_loss": -19.7401065826416, "global_step": 51723, "epoch": 623} {"train_loss": -19.89560317993164, "global_step": 51724, "epoch": 623} {"train_loss": -19.581008911132812, "global_step": 51725, "epoch": 623} {"train_loss": -19.740903854370117, "global_step": 51726, "epoch": 623} {"train_loss": -19.744220733642578, "global_step": 51727, "epoch": 623} {"train_loss": -19.67791175842285, "global_step": 51728, "epoch": 623} {"train_loss": -20.224458694458008, "global_step": 51729, "epoch": 623} {"train_loss": -19.775182723999023, "global_step": 51730, "epoch": 623} {"train_loss": -20.0263671875, "global_step": 51731, "epoch": 623} {"train_loss": -19.66432762145996, "global_step": 51732, "epoch": 623} {"train_loss": -19.94300651550293, "global_step": 51733, "epoch": 623} {"train_loss": -20.165210723876953, "global_step": 51734, "epoch": 623} {"train_loss": -20.104555130004883, "global_step": 51735, "epoch": 623} {"train_loss": -19.898290634155273, "global_step": 51736, "epoch": 623} {"train_loss": -20.0688533782959, "global_step": 51737, "epoch": 623} {"train_loss": -19.9848690032959, "global_step": 51738, "epoch": 623} {"train_loss": -19.7741756439209, "global_step": 51739, "epoch": 623} {"train_loss": -19.69927406311035, "global_step": 51740, "epoch": 623} {"train_loss": -19.614398956298828, "global_step": 51741, "epoch": 623} {"train_loss": -19.988676071166992, "global_step": 51742, "epoch": 623} {"train_loss": -19.8588924407959, "global_step": 51743, "epoch": 623} {"train_loss": -19.883268356323242, "global_step": 51744, "epoch": 623} {"train_loss": -20.332334518432617, "global_step": 51745, "epoch": 623} {"train_loss": -19.67251968383789, "global_step": 51746, "epoch": 623} {"train_loss": -19.64600944519043, "global_step": 51747, "epoch": 623} {"train_loss": -20.021610260009766, "global_step": 51748, "epoch": 623} {"train_loss": -20.245126724243164, "global_step": 51749, "epoch": 623} {"train_loss": -19.687427520751953, "global_step": 51750, "epoch": 623} {"train_loss": -20.214082717895508, "global_step": 51751, "epoch": 623} {"train_loss": -20.15082359313965, "global_step": 51752, "epoch": 623} {"train_loss": -19.920312881469727, "global_step": 51753, "epoch": 623} {"train_loss": -19.94871711730957, "global_step": 51754, "epoch": 623} {"train_loss": -19.66518211364746, "global_step": 51755, "epoch": 623} {"train_loss": -19.918792724609375, "global_step": 51756, "epoch": 623} {"train_loss": -19.466602325439453, "global_step": 51757, "epoch": 623} {"train_loss": -20.075794219970703, "global_step": 51758, "epoch": 623} {"train_loss": -20.050796508789062, "global_step": 51759, "epoch": 623} {"train_loss": -20.0494441986084, "global_step": 51760, "epoch": 623} {"train_loss": -19.998075485229492, "global_step": 51761, "epoch": 623} {"train_loss": -19.573957443237305, "global_step": 51762, "epoch": 623} {"train_loss": -19.998014450073242, "global_step": 51763, "epoch": 623} {"train_loss": -20.0430908203125, "global_step": 51764, "epoch": 623} {"train_loss": -20.1390438079834, "global_step": 51765, "epoch": 623} {"train_loss": -20.07893180847168, "global_step": 51766, "epoch": 623} {"train_loss": -20.083921432495117, "global_step": 51767, "epoch": 623} {"train_loss": -20.009906768798828, "global_step": 51768, "epoch": 623} {"train_loss": -19.774261474609375, "global_step": 51769, "epoch": 623} {"train_loss": -20.353052139282227, "global_step": 51770, "epoch": 623} {"train_loss": -19.96463966369629, "global_step": 51771, "epoch": 623} {"train_loss": -20.067705154418945, "global_step": 51772, "epoch": 623} {"train_loss": -20.391042709350586, "global_step": 51773, "epoch": 623} {"train_loss": -19.94771385192871, "global_step": 51774, "epoch": 623} {"train_loss": -20.09516716003418, "global_step": 51775, "epoch": 623} {"train_loss": -19.82893180847168, "global_step": 51776, "epoch": 623} {"train_loss": -19.517887115478516, "global_step": 51777, "epoch": 623} {"train_loss": -20.18065071105957, "global_step": 51778, "epoch": 623} {"train_loss": -20.212360382080078, "global_step": 51779, "epoch": 623} {"train_loss": -19.95257568359375, "global_step": 51780, "epoch": 623} {"train_loss": -19.856786727905273, "global_step": 51781, "epoch": 623} {"train_loss": -20.058074951171875, "global_step": 51782, "epoch": 623} {"train_loss": -19.882713317871094, "global_step": 51783, "epoch": 623} {"train_loss": -19.947723388671875, "global_step": 51784, "epoch": 623} {"train_loss": -19.767606735229492, "global_step": 51785, "epoch": 623} {"train_loss": -20.193328857421875, "global_step": 51786, "epoch": 623} {"train_loss": -19.929990768432617, "global_step": 51787, "epoch": 623} {"train_loss": -20.0347843170166, "global_step": 51788, "epoch": 623} {"train_loss": -20.0490779876709, "global_step": 51789, "epoch": 623} {"train_loss": -19.999954223632812, "global_step": 51790, "epoch": 623} {"train_loss": -19.88208221527467, "global_step": 51791, "epoch": 623, "val_loss": 6172125.5} {"train_loss": -19.518712997436523, "global_step": 51792, "epoch": 624} {"train_loss": -19.671466827392578, "global_step": 51793, "epoch": 624} {"train_loss": -19.6624755859375, "global_step": 51794, "epoch": 624} {"train_loss": -19.969167709350586, "global_step": 51795, "epoch": 624} {"train_loss": -19.849233627319336, "global_step": 51796, "epoch": 624} {"train_loss": -19.55316734313965, "global_step": 51797, "epoch": 624} {"train_loss": -20.002283096313477, "global_step": 51798, "epoch": 624} {"train_loss": -19.552154541015625, "global_step": 51799, "epoch": 624} {"train_loss": -19.82428741455078, "global_step": 51800, "epoch": 624} {"train_loss": -19.59766960144043, "global_step": 51801, "epoch": 624} {"train_loss": -19.527685165405273, "global_step": 51802, "epoch": 624} {"train_loss": -19.76214599609375, "global_step": 51803, "epoch": 624} {"train_loss": -19.996784210205078, "global_step": 51804, "epoch": 624} {"train_loss": -20.029407501220703, "global_step": 51805, "epoch": 624} {"train_loss": -19.80189323425293, "global_step": 51806, "epoch": 624} {"train_loss": -19.952178955078125, "global_step": 51807, "epoch": 624} {"train_loss": -20.364255905151367, "global_step": 51808, "epoch": 624} {"train_loss": -20.206876754760742, "global_step": 51809, "epoch": 624} {"train_loss": -19.867029190063477, "global_step": 51810, "epoch": 624} {"train_loss": -19.621816635131836, "global_step": 51811, "epoch": 624} {"train_loss": -19.84137725830078, "global_step": 51812, "epoch": 624} {"train_loss": -20.085390090942383, "global_step": 51813, "epoch": 624} {"train_loss": -19.996065139770508, "global_step": 51814, "epoch": 624} {"train_loss": -19.76742935180664, "global_step": 51815, "epoch": 624} {"train_loss": -19.87322998046875, "global_step": 51816, "epoch": 624} {"train_loss": -19.90274429321289, "global_step": 51817, "epoch": 624} {"train_loss": -19.884384155273438, "global_step": 51818, "epoch": 624} {"train_loss": -19.980772018432617, "global_step": 51819, "epoch": 624} {"train_loss": -19.7601318359375, "global_step": 51820, "epoch": 624} {"train_loss": -20.01658058166504, "global_step": 51821, "epoch": 624} {"train_loss": -19.70795249938965, "global_step": 51822, "epoch": 624} {"train_loss": -20.15903663635254, "global_step": 51823, "epoch": 624} {"train_loss": -20.22376823425293, "global_step": 51824, "epoch": 624} {"train_loss": -20.053144454956055, "global_step": 51825, "epoch": 624} {"train_loss": -20.03782844543457, "global_step": 51826, "epoch": 624} {"train_loss": -19.847375869750977, "global_step": 51827, "epoch": 624} {"train_loss": -19.93714141845703, "global_step": 51828, "epoch": 624} {"train_loss": -19.843372344970703, "global_step": 51829, "epoch": 624} {"train_loss": -20.209980010986328, "global_step": 51830, "epoch": 624} {"train_loss": -19.80767250061035, "global_step": 51831, "epoch": 624} {"train_loss": -20.063547134399414, "global_step": 51832, "epoch": 624} {"train_loss": -19.98898696899414, "global_step": 51833, "epoch": 624} {"train_loss": -19.894596099853516, "global_step": 51834, "epoch": 624} {"train_loss": -20.037227630615234, "global_step": 51835, "epoch": 624} {"train_loss": -20.400053024291992, "global_step": 51836, "epoch": 624} {"train_loss": -19.940671920776367, "global_step": 51837, "epoch": 624} {"train_loss": -19.92262840270996, "global_step": 51838, "epoch": 624} {"train_loss": -20.377286911010742, "global_step": 51839, "epoch": 624} {"train_loss": -19.936542510986328, "global_step": 51840, "epoch": 624} {"train_loss": -20.330717086791992, "global_step": 51841, "epoch": 624} {"train_loss": -19.99698257446289, "global_step": 51842, "epoch": 624} {"train_loss": -20.466276168823242, "global_step": 51843, "epoch": 624} {"train_loss": -20.078062057495117, "global_step": 51844, "epoch": 624} {"train_loss": -20.160980224609375, "global_step": 51845, "epoch": 624} {"train_loss": -20.421058654785156, "global_step": 51846, "epoch": 624} {"train_loss": -20.11432456970215, "global_step": 51847, "epoch": 624} {"train_loss": -20.0248966217041, "global_step": 51848, "epoch": 624} {"train_loss": -19.69028663635254, "global_step": 51849, "epoch": 624} {"train_loss": -20.159055709838867, "global_step": 51850, "epoch": 624} {"train_loss": -19.973142623901367, "global_step": 51851, "epoch": 624} {"train_loss": -20.177148818969727, "global_step": 51852, "epoch": 624} {"train_loss": -19.977188110351562, "global_step": 51853, "epoch": 624} {"train_loss": -20.129568099975586, "global_step": 51854, "epoch": 624} {"train_loss": -19.63361167907715, "global_step": 51855, "epoch": 624} {"train_loss": -19.96173667907715, "global_step": 51856, "epoch": 624} {"train_loss": -19.695432662963867, "global_step": 51857, "epoch": 624} {"train_loss": -20.37955093383789, "global_step": 51858, "epoch": 624} {"train_loss": -20.156696319580078, "global_step": 51859, "epoch": 624} {"train_loss": -19.832975387573242, "global_step": 51860, "epoch": 624} {"train_loss": -20.14753532409668, "global_step": 51861, "epoch": 624} {"train_loss": -19.912403106689453, "global_step": 51862, "epoch": 624} {"train_loss": -19.763639450073242, "global_step": 51863, "epoch": 624} {"train_loss": -20.195880889892578, "global_step": 51864, "epoch": 624} {"train_loss": -19.9165096282959, "global_step": 51865, "epoch": 624} {"train_loss": -20.38099479675293, "global_step": 51866, "epoch": 624} {"train_loss": -20.072317123413086, "global_step": 51867, "epoch": 624} {"train_loss": -20.412757873535156, "global_step": 51868, "epoch": 624} {"train_loss": -19.961339950561523, "global_step": 51869, "epoch": 624} {"train_loss": -19.67351722717285, "global_step": 51870, "epoch": 624} {"train_loss": -20.060012817382812, "global_step": 51871, "epoch": 624} {"train_loss": -20.444547653198242, "global_step": 51872, "epoch": 624} {"train_loss": -20.36994171142578, "global_step": 51873, "epoch": 624} {"train_loss": -19.98643385645855, "global_step": 51874, "epoch": 624, "val_loss": 5939031.0} {"train_loss": -20.163599014282227, "global_step": 51875, "epoch": 625} {"train_loss": -20.429494857788086, "global_step": 51876, "epoch": 625} {"train_loss": -19.553464889526367, "global_step": 51877, "epoch": 625} {"train_loss": -19.57526206970215, "global_step": 51878, "epoch": 625} {"train_loss": -19.733272552490234, "global_step": 51879, "epoch": 625} {"train_loss": -19.78935432434082, "global_step": 51880, "epoch": 625} {"train_loss": -19.90666961669922, "global_step": 51881, "epoch": 625} {"train_loss": -20.170705795288086, "global_step": 51882, "epoch": 625} {"train_loss": -19.870071411132812, "global_step": 51883, "epoch": 625} {"train_loss": -20.057525634765625, "global_step": 51884, "epoch": 625} {"train_loss": -19.81477165222168, "global_step": 51885, "epoch": 625} {"train_loss": -19.716585159301758, "global_step": 51886, "epoch": 625} {"train_loss": -20.207429885864258, "global_step": 51887, "epoch": 625} {"train_loss": -20.051441192626953, "global_step": 51888, "epoch": 625} {"train_loss": -19.848554611206055, "global_step": 51889, "epoch": 625} {"train_loss": -19.56917953491211, "global_step": 51890, "epoch": 625} {"train_loss": -20.045217514038086, "global_step": 51891, "epoch": 625} {"train_loss": -19.88812255859375, "global_step": 51892, "epoch": 625} {"train_loss": -19.938215255737305, "global_step": 51893, "epoch": 625} {"train_loss": -20.28435516357422, "global_step": 51894, "epoch": 625} {"train_loss": -20.052587509155273, "global_step": 51895, "epoch": 625} {"train_loss": -20.05087661743164, "global_step": 51896, "epoch": 625} {"train_loss": -20.15443992614746, "global_step": 51897, "epoch": 625} {"train_loss": -20.21122169494629, "global_step": 51898, "epoch": 625} {"train_loss": -20.014617919921875, "global_step": 51899, "epoch": 625} {"train_loss": -20.276771545410156, "global_step": 51900, "epoch": 625} {"train_loss": -19.887632369995117, "global_step": 51901, "epoch": 625} {"train_loss": -20.457612991333008, "global_step": 51902, "epoch": 625} {"train_loss": -20.113126754760742, "global_step": 51903, "epoch": 625} {"train_loss": -20.034875869750977, "global_step": 51904, "epoch": 625} {"train_loss": -20.450149536132812, "global_step": 51905, "epoch": 625} {"train_loss": -20.20108413696289, "global_step": 51906, "epoch": 625} {"train_loss": -19.719045639038086, "global_step": 51907, "epoch": 625} {"train_loss": -20.279590606689453, "global_step": 51908, "epoch": 625} {"train_loss": -20.077302932739258, "global_step": 51909, "epoch": 625} {"train_loss": -20.296857833862305, "global_step": 51910, "epoch": 625} {"train_loss": -19.85564422607422, "global_step": 51911, "epoch": 625} {"train_loss": -19.874929428100586, "global_step": 51912, "epoch": 625} {"train_loss": -19.847375869750977, "global_step": 51913, "epoch": 625} {"train_loss": -19.89798355102539, "global_step": 51914, "epoch": 625} {"train_loss": -20.119327545166016, "global_step": 51915, "epoch": 625} {"train_loss": -19.822967529296875, "global_step": 51916, "epoch": 625} {"train_loss": -20.15213966369629, "global_step": 51917, "epoch": 625} {"train_loss": -20.04060935974121, "global_step": 51918, "epoch": 625} {"train_loss": -20.097074508666992, "global_step": 51919, "epoch": 625} {"train_loss": -20.1152286529541, "global_step": 51920, "epoch": 625} {"train_loss": -20.066503524780273, "global_step": 51921, "epoch": 625} {"train_loss": -19.851356506347656, "global_step": 51922, "epoch": 625} {"train_loss": -19.580137252807617, "global_step": 51923, "epoch": 625} {"train_loss": -19.823410034179688, "global_step": 51924, "epoch": 625} {"train_loss": -19.802457809448242, "global_step": 51925, "epoch": 625} {"train_loss": -19.997970581054688, "global_step": 51926, "epoch": 625} {"train_loss": -20.238134384155273, "global_step": 51927, "epoch": 625} {"train_loss": -20.185705184936523, "global_step": 51928, "epoch": 625} {"train_loss": -20.482046127319336, "global_step": 51929, "epoch": 625} {"train_loss": -20.216480255126953, "global_step": 51930, "epoch": 625} {"train_loss": -20.164770126342773, "global_step": 51931, "epoch": 625} {"train_loss": -19.983211517333984, "global_step": 51932, "epoch": 625} {"train_loss": -20.005765914916992, "global_step": 51933, "epoch": 625} {"train_loss": -19.911405563354492, "global_step": 51934, "epoch": 625} {"train_loss": -19.624055862426758, "global_step": 51935, "epoch": 625} {"train_loss": -19.815221786499023, "global_step": 51936, "epoch": 625} {"train_loss": -19.910215377807617, "global_step": 51937, "epoch": 625} {"train_loss": -20.088104248046875, "global_step": 51938, "epoch": 625} {"train_loss": -19.78951072692871, "global_step": 51939, "epoch": 625} {"train_loss": -20.171430587768555, "global_step": 51940, "epoch": 625} {"train_loss": -20.33316421508789, "global_step": 51941, "epoch": 625} {"train_loss": -20.053695678710938, "global_step": 51942, "epoch": 625} {"train_loss": -19.744659423828125, "global_step": 51943, "epoch": 625} {"train_loss": -19.99732780456543, "global_step": 51944, "epoch": 625} {"train_loss": -20.17776870727539, "global_step": 51945, "epoch": 625} {"train_loss": -20.23597526550293, "global_step": 51946, "epoch": 625} {"train_loss": -20.326528549194336, "global_step": 51947, "epoch": 625} {"train_loss": -20.022552490234375, "global_step": 51948, "epoch": 625} {"train_loss": -20.320547103881836, "global_step": 51949, "epoch": 625} {"train_loss": -19.85239601135254, "global_step": 51950, "epoch": 625} {"train_loss": -20.100582122802734, "global_step": 51951, "epoch": 625} {"train_loss": -20.279956817626953, "global_step": 51952, "epoch": 625} {"train_loss": -20.000181198120117, "global_step": 51953, "epoch": 625} {"train_loss": -19.973968505859375, "global_step": 51954, "epoch": 625} {"train_loss": -19.94658851623535, "global_step": 51955, "epoch": 625} {"train_loss": -20.245262145996094, "global_step": 51956, "epoch": 625} {"train_loss": -20.02201227394931, "global_step": 51957, "epoch": 625, "val_loss": 6008160.0} {"train_loss": -19.71175193786621, "global_step": 51958, "epoch": 626} {"train_loss": -19.909957885742188, "global_step": 51959, "epoch": 626} {"train_loss": -19.789777755737305, "global_step": 51960, "epoch": 626} {"train_loss": -19.72713279724121, "global_step": 51961, "epoch": 626} {"train_loss": -19.55902862548828, "global_step": 51962, "epoch": 626} {"train_loss": -19.85284423828125, "global_step": 51963, "epoch": 626} {"train_loss": -19.933340072631836, "global_step": 51964, "epoch": 626} {"train_loss": -20.15880584716797, "global_step": 51965, "epoch": 626} {"train_loss": -19.861366271972656, "global_step": 51966, "epoch": 626} {"train_loss": -20.026294708251953, "global_step": 51967, "epoch": 626} {"train_loss": -19.797319412231445, "global_step": 51968, "epoch": 626} {"train_loss": -20.175230026245117, "global_step": 51969, "epoch": 626} {"train_loss": -20.02191925048828, "global_step": 51970, "epoch": 626} {"train_loss": -20.52591896057129, "global_step": 51971, "epoch": 626} {"train_loss": -19.926889419555664, "global_step": 51972, "epoch": 626} {"train_loss": -20.280200958251953, "global_step": 51973, "epoch": 626} {"train_loss": -19.95291519165039, "global_step": 51974, "epoch": 626} {"train_loss": -20.0899600982666, "global_step": 51975, "epoch": 626} {"train_loss": -19.878665924072266, "global_step": 51976, "epoch": 626} {"train_loss": -20.093647003173828, "global_step": 51977, "epoch": 626} {"train_loss": -20.368738174438477, "global_step": 51978, "epoch": 626} {"train_loss": -19.811185836791992, "global_step": 51979, "epoch": 626} {"train_loss": -20.34345054626465, "global_step": 51980, "epoch": 626} {"train_loss": -19.780546188354492, "global_step": 51981, "epoch": 626} {"train_loss": -19.834213256835938, "global_step": 51982, "epoch": 626} {"train_loss": -19.717870712280273, "global_step": 51983, "epoch": 626} {"train_loss": -19.98761558532715, "global_step": 51984, "epoch": 626} {"train_loss": -19.802600860595703, "global_step": 51985, "epoch": 626} {"train_loss": -19.917081832885742, "global_step": 51986, "epoch": 626} {"train_loss": -20.42584991455078, "global_step": 51987, "epoch": 626} {"train_loss": -20.319236755371094, "global_step": 51988, "epoch": 626} {"train_loss": -20.061315536499023, "global_step": 51989, "epoch": 626} {"train_loss": -19.85615348815918, "global_step": 51990, "epoch": 626} {"train_loss": -19.939687728881836, "global_step": 51991, "epoch": 626} {"train_loss": -19.790809631347656, "global_step": 51992, "epoch": 626} {"train_loss": -19.9154109954834, "global_step": 51993, "epoch": 626} {"train_loss": -20.254066467285156, "global_step": 51994, "epoch": 626} {"train_loss": -20.07518196105957, "global_step": 51995, "epoch": 626} {"train_loss": -19.636796951293945, "global_step": 51996, "epoch": 626} {"train_loss": -20.435667037963867, "global_step": 51997, "epoch": 626} {"train_loss": -20.055898666381836, "global_step": 51998, "epoch": 626} {"train_loss": -20.086055755615234, "global_step": 51999, "epoch": 626} {"train_loss": -20.211050033569336, "global_step": 52000, "epoch": 626} {"train_loss": -20.097244262695312, "global_step": 52001, "epoch": 626} {"train_loss": -20.08109474182129, "global_step": 52002, "epoch": 626} {"train_loss": -19.883914947509766, "global_step": 52003, "epoch": 626} {"train_loss": -20.088953018188477, "global_step": 52004, "epoch": 626} {"train_loss": -19.725269317626953, "global_step": 52005, "epoch": 626} {"train_loss": -19.812162399291992, "global_step": 52006, "epoch": 626} {"train_loss": -19.90883445739746, "global_step": 52007, "epoch": 626} {"train_loss": -19.883230209350586, "global_step": 52008, "epoch": 626} {"train_loss": -20.1196231842041, "global_step": 52009, "epoch": 626} {"train_loss": -20.146806716918945, "global_step": 52010, "epoch": 626} {"train_loss": -20.04215431213379, "global_step": 52011, "epoch": 626} {"train_loss": -20.055049896240234, "global_step": 52012, "epoch": 626} {"train_loss": -20.386493682861328, "global_step": 52013, "epoch": 626} {"train_loss": -19.85938262939453, "global_step": 52014, "epoch": 626} {"train_loss": -20.180341720581055, "global_step": 52015, "epoch": 626} {"train_loss": -20.107675552368164, "global_step": 52016, "epoch": 626} {"train_loss": -20.168874740600586, "global_step": 52017, "epoch": 626} {"train_loss": -19.78870964050293, "global_step": 52018, "epoch": 626} {"train_loss": -19.901535034179688, "global_step": 52019, "epoch": 626} {"train_loss": -20.108640670776367, "global_step": 52020, "epoch": 626} {"train_loss": -19.822040557861328, "global_step": 52021, "epoch": 626} {"train_loss": -19.76967430114746, "global_step": 52022, "epoch": 626} {"train_loss": -20.070280075073242, "global_step": 52023, "epoch": 626} {"train_loss": -19.828079223632812, "global_step": 52024, "epoch": 626} {"train_loss": -20.203292846679688, "global_step": 52025, "epoch": 626} {"train_loss": -20.000274658203125, "global_step": 52026, "epoch": 626} {"train_loss": -20.074928283691406, "global_step": 52027, "epoch": 626} {"train_loss": -20.229990005493164, "global_step": 52028, "epoch": 626} {"train_loss": -20.308547973632812, "global_step": 52029, "epoch": 626} {"train_loss": -20.166540145874023, "global_step": 52030, "epoch": 626} {"train_loss": -20.138288497924805, "global_step": 52031, "epoch": 626} {"train_loss": -19.621219635009766, "global_step": 52032, "epoch": 626} {"train_loss": -20.37691307067871, "global_step": 52033, "epoch": 626} {"train_loss": -20.119253158569336, "global_step": 52034, "epoch": 626} {"train_loss": -20.26469612121582, "global_step": 52035, "epoch": 626} {"train_loss": -20.009933471679688, "global_step": 52036, "epoch": 626} {"train_loss": -20.252281188964844, "global_step": 52037, "epoch": 626} {"train_loss": -19.809995651245117, "global_step": 52038, "epoch": 626} {"train_loss": -19.72088623046875, "global_step": 52039, "epoch": 626} {"train_loss": -19.999541730765838, "global_step": 52040, "epoch": 626, "val_loss": 5971817.0} {"train_loss": -19.594282150268555, "global_step": 52041, "epoch": 627} {"train_loss": -19.660375595092773, "global_step": 52042, "epoch": 627} {"train_loss": -20.218505859375, "global_step": 52043, "epoch": 627} {"train_loss": -20.094959259033203, "global_step": 52044, "epoch": 627} {"train_loss": -20.384002685546875, "global_step": 52045, "epoch": 627} {"train_loss": -19.51357078552246, "global_step": 52046, "epoch": 627} {"train_loss": -19.5367431640625, "global_step": 52047, "epoch": 627} {"train_loss": -19.935190200805664, "global_step": 52048, "epoch": 627} {"train_loss": -20.11158561706543, "global_step": 52049, "epoch": 627} {"train_loss": -19.995763778686523, "global_step": 52050, "epoch": 627} {"train_loss": -20.242481231689453, "global_step": 52051, "epoch": 627} {"train_loss": -19.700252532958984, "global_step": 52052, "epoch": 627} {"train_loss": -19.42444610595703, "global_step": 52053, "epoch": 627} {"train_loss": -20.29966163635254, "global_step": 52054, "epoch": 627} {"train_loss": -19.620141983032227, "global_step": 52055, "epoch": 627} {"train_loss": -19.86612892150879, "global_step": 52056, "epoch": 627} {"train_loss": -19.469955444335938, "global_step": 52057, "epoch": 627} {"train_loss": -19.844961166381836, "global_step": 52058, "epoch": 627} {"train_loss": -20.148649215698242, "global_step": 52059, "epoch": 627} {"train_loss": -20.215499877929688, "global_step": 52060, "epoch": 627} {"train_loss": -19.831214904785156, "global_step": 52061, "epoch": 627} {"train_loss": -20.34189796447754, "global_step": 52062, "epoch": 627} {"train_loss": -19.761789321899414, "global_step": 52063, "epoch": 627} {"train_loss": -19.964351654052734, "global_step": 52064, "epoch": 627} {"train_loss": -20.11041831970215, "global_step": 52065, "epoch": 627} {"train_loss": -20.065473556518555, "global_step": 52066, "epoch": 627} {"train_loss": -19.650705337524414, "global_step": 52067, "epoch": 627} {"train_loss": -20.18780517578125, "global_step": 52068, "epoch": 627} {"train_loss": -20.062997817993164, "global_step": 52069, "epoch": 627} {"train_loss": -20.312969207763672, "global_step": 52070, "epoch": 627} {"train_loss": -19.535886764526367, "global_step": 52071, "epoch": 627} {"train_loss": -20.039798736572266, "global_step": 52072, "epoch": 627} {"train_loss": -19.995420455932617, "global_step": 52073, "epoch": 627} {"train_loss": -20.26801872253418, "global_step": 52074, "epoch": 627} {"train_loss": -19.897998809814453, "global_step": 52075, "epoch": 627} {"train_loss": -20.102155685424805, "global_step": 52076, "epoch": 627} {"train_loss": -19.79865074157715, "global_step": 52077, "epoch": 627} {"train_loss": -20.040470123291016, "global_step": 52078, "epoch": 627} {"train_loss": -20.251184463500977, "global_step": 52079, "epoch": 627} {"train_loss": -20.14436912536621, "global_step": 52080, "epoch": 627} {"train_loss": -19.87264633178711, "global_step": 52081, "epoch": 627} {"train_loss": -19.78587532043457, "global_step": 52082, "epoch": 627} {"train_loss": -19.84664535522461, "global_step": 52083, "epoch": 627} {"train_loss": -20.0620059967041, "global_step": 52084, "epoch": 627} {"train_loss": -20.307889938354492, "global_step": 52085, "epoch": 627} {"train_loss": -20.10505485534668, "global_step": 52086, "epoch": 627} {"train_loss": -19.94887351989746, "global_step": 52087, "epoch": 627} {"train_loss": -19.95810317993164, "global_step": 52088, "epoch": 627} {"train_loss": -20.036598205566406, "global_step": 52089, "epoch": 627} {"train_loss": -20.015535354614258, "global_step": 52090, "epoch": 627} {"train_loss": -19.821043014526367, "global_step": 52091, "epoch": 627} {"train_loss": -20.111968994140625, "global_step": 52092, "epoch": 627} {"train_loss": -20.05387306213379, "global_step": 52093, "epoch": 627} {"train_loss": -20.00267791748047, "global_step": 52094, "epoch": 627} {"train_loss": -20.24578094482422, "global_step": 52095, "epoch": 627} {"train_loss": -20.0524959564209, "global_step": 52096, "epoch": 627} {"train_loss": -19.991872787475586, "global_step": 52097, "epoch": 627} {"train_loss": -20.021520614624023, "global_step": 52098, "epoch": 627} {"train_loss": -19.824344635009766, "global_step": 52099, "epoch": 627} {"train_loss": -20.124387741088867, "global_step": 52100, "epoch": 627} {"train_loss": -19.953231811523438, "global_step": 52101, "epoch": 627} {"train_loss": -20.05620765686035, "global_step": 52102, "epoch": 627} {"train_loss": -19.554990768432617, "global_step": 52103, "epoch": 627} {"train_loss": -19.888830184936523, "global_step": 52104, "epoch": 627} {"train_loss": -20.177165985107422, "global_step": 52105, "epoch": 627} {"train_loss": -19.819791793823242, "global_step": 52106, "epoch": 627} {"train_loss": -19.784143447875977, "global_step": 52107, "epoch": 627} {"train_loss": -19.779569625854492, "global_step": 52108, "epoch": 627} {"train_loss": -20.022201538085938, "global_step": 52109, "epoch": 627} {"train_loss": -20.47194480895996, "global_step": 52110, "epoch": 627} {"train_loss": -20.300312042236328, "global_step": 52111, "epoch": 627} {"train_loss": -20.307926177978516, "global_step": 52112, "epoch": 627} {"train_loss": -20.057279586791992, "global_step": 52113, "epoch": 627} {"train_loss": -20.491567611694336, "global_step": 52114, "epoch": 627} {"train_loss": -19.852880477905273, "global_step": 52115, "epoch": 627} {"train_loss": -19.81534194946289, "global_step": 52116, "epoch": 627} {"train_loss": -19.757787704467773, "global_step": 52117, "epoch": 627} {"train_loss": -20.033559799194336, "global_step": 52118, "epoch": 627} {"train_loss": -19.643476486206055, "global_step": 52119, "epoch": 627} {"train_loss": -20.060277938842773, "global_step": 52120, "epoch": 627} {"train_loss": -20.004674911499023, "global_step": 52121, "epoch": 627} {"train_loss": -20.024642944335938, "global_step": 52122, "epoch": 627} {"train_loss": -19.95119988774679, "global_step": 52123, "epoch": 627, "val_loss": 6029976.5} {"train_loss": -19.882596969604492, "global_step": 52124, "epoch": 628} {"train_loss": -20.060550689697266, "global_step": 52125, "epoch": 628} {"train_loss": -19.948984146118164, "global_step": 52126, "epoch": 628} {"train_loss": -19.923986434936523, "global_step": 52127, "epoch": 628} {"train_loss": -20.130107879638672, "global_step": 52128, "epoch": 628} {"train_loss": -19.490964889526367, "global_step": 52129, "epoch": 628} {"train_loss": -19.699756622314453, "global_step": 52130, "epoch": 628} {"train_loss": -19.85784912109375, "global_step": 52131, "epoch": 628} {"train_loss": -19.948022842407227, "global_step": 52132, "epoch": 628} {"train_loss": -19.984756469726562, "global_step": 52133, "epoch": 628} {"train_loss": -19.931005477905273, "global_step": 52134, "epoch": 628} {"train_loss": -20.030242919921875, "global_step": 52135, "epoch": 628} {"train_loss": -20.108366012573242, "global_step": 52136, "epoch": 628} {"train_loss": -20.115615844726562, "global_step": 52137, "epoch": 628} {"train_loss": -20.124481201171875, "global_step": 52138, "epoch": 628} {"train_loss": -19.909961700439453, "global_step": 52139, "epoch": 628} {"train_loss": -20.103567123413086, "global_step": 52140, "epoch": 628} {"train_loss": -19.89808464050293, "global_step": 52141, "epoch": 628} {"train_loss": -19.69203758239746, "global_step": 52142, "epoch": 628} {"train_loss": -20.249643325805664, "global_step": 52143, "epoch": 628} {"train_loss": -20.25884437561035, "global_step": 52144, "epoch": 628} {"train_loss": -20.29060935974121, "global_step": 52145, "epoch": 628} {"train_loss": -20.09805679321289, "global_step": 52146, "epoch": 628} {"train_loss": -20.23200225830078, "global_step": 52147, "epoch": 628} {"train_loss": -20.17396354675293, "global_step": 52148, "epoch": 628} {"train_loss": -19.80377769470215, "global_step": 52149, "epoch": 628} {"train_loss": -19.815866470336914, "global_step": 52150, "epoch": 628} {"train_loss": -19.485881805419922, "global_step": 52151, "epoch": 628} {"train_loss": -20.09332275390625, "global_step": 52152, "epoch": 628} {"train_loss": -20.127809524536133, "global_step": 52153, "epoch": 628} {"train_loss": -20.20728874206543, "global_step": 52154, "epoch": 628} {"train_loss": -19.87369155883789, "global_step": 52155, "epoch": 628} {"train_loss": -20.036996841430664, "global_step": 52156, "epoch": 628} {"train_loss": -19.741113662719727, "global_step": 52157, "epoch": 628} {"train_loss": -19.91254997253418, "global_step": 52158, "epoch": 628} {"train_loss": -19.858963012695312, "global_step": 52159, "epoch": 628} {"train_loss": -20.05653190612793, "global_step": 52160, "epoch": 628} {"train_loss": -20.211864471435547, "global_step": 52161, "epoch": 628} {"train_loss": -20.135353088378906, "global_step": 52162, "epoch": 628} {"train_loss": -19.87683868408203, "global_step": 52163, "epoch": 628} {"train_loss": -20.167865753173828, "global_step": 52164, "epoch": 628} {"train_loss": -20.314231872558594, "global_step": 52165, "epoch": 628} {"train_loss": -19.978239059448242, "global_step": 52166, "epoch": 628} {"train_loss": -19.963123321533203, "global_step": 52167, "epoch": 628} {"train_loss": -20.03029441833496, "global_step": 52168, "epoch": 628} {"train_loss": -19.766698837280273, "global_step": 52169, "epoch": 628} {"train_loss": -20.171052932739258, "global_step": 52170, "epoch": 628} {"train_loss": -19.907358169555664, "global_step": 52171, "epoch": 628} {"train_loss": -20.216209411621094, "global_step": 52172, "epoch": 628} {"train_loss": -19.876379013061523, "global_step": 52173, "epoch": 628} {"train_loss": -20.148252487182617, "global_step": 52174, "epoch": 628} {"train_loss": -20.183462142944336, "global_step": 52175, "epoch": 628} {"train_loss": -20.390472412109375, "global_step": 52176, "epoch": 628} {"train_loss": -19.999521255493164, "global_step": 52177, "epoch": 628} {"train_loss": -19.983266830444336, "global_step": 52178, "epoch": 628} {"train_loss": -20.365026473999023, "global_step": 52179, "epoch": 628} {"train_loss": -19.858625411987305, "global_step": 52180, "epoch": 628} {"train_loss": -20.141260147094727, "global_step": 52181, "epoch": 628} {"train_loss": -19.99028778076172, "global_step": 52182, "epoch": 628} {"train_loss": -19.918134689331055, "global_step": 52183, "epoch": 628} {"train_loss": -19.9034366607666, "global_step": 52184, "epoch": 628} {"train_loss": -20.20248794555664, "global_step": 52185, "epoch": 628} {"train_loss": -20.185834884643555, "global_step": 52186, "epoch": 628} {"train_loss": -19.952674865722656, "global_step": 52187, "epoch": 628} {"train_loss": -20.478971481323242, "global_step": 52188, "epoch": 628} {"train_loss": -20.192840576171875, "global_step": 52189, "epoch": 628} {"train_loss": -19.987564086914062, "global_step": 52190, "epoch": 628} {"train_loss": -19.601465225219727, "global_step": 52191, "epoch": 628} {"train_loss": -20.20159912109375, "global_step": 52192, "epoch": 628} {"train_loss": -20.470808029174805, "global_step": 52193, "epoch": 628} {"train_loss": -20.075986862182617, "global_step": 52194, "epoch": 628} {"train_loss": -19.951751708984375, "global_step": 52195, "epoch": 628} {"train_loss": -20.184532165527344, "global_step": 52196, "epoch": 628} {"train_loss": -20.4088191986084, "global_step": 52197, "epoch": 628} {"train_loss": -19.936538696289062, "global_step": 52198, "epoch": 628} {"train_loss": -19.820646286010742, "global_step": 52199, "epoch": 628} {"train_loss": -19.910507202148438, "global_step": 52200, "epoch": 628} {"train_loss": -19.73794937133789, "global_step": 52201, "epoch": 628} {"train_loss": -19.86851692199707, "global_step": 52202, "epoch": 628} {"train_loss": -19.541406631469727, "global_step": 52203, "epoch": 628} {"train_loss": -19.767873764038086, "global_step": 52204, "epoch": 628} {"train_loss": -20.318967819213867, "global_step": 52205, "epoch": 628} {"train_loss": -19.99316904918257, "global_step": 52206, "epoch": 628, "val_loss": 6063981.0} {"train_loss": -19.79298210144043, "global_step": 52207, "epoch": 629} {"train_loss": -19.603605270385742, "global_step": 52208, "epoch": 629} {"train_loss": -20.126794815063477, "global_step": 52209, "epoch": 629} {"train_loss": -19.56573486328125, "global_step": 52210, "epoch": 629} {"train_loss": -20.200157165527344, "global_step": 52211, "epoch": 629} {"train_loss": -19.715913772583008, "global_step": 52212, "epoch": 629} {"train_loss": -19.779226303100586, "global_step": 52213, "epoch": 629} {"train_loss": -19.536365509033203, "global_step": 52214, "epoch": 629} {"train_loss": -19.554784774780273, "global_step": 52215, "epoch": 629} {"train_loss": -19.445667266845703, "global_step": 52216, "epoch": 629} {"train_loss": -20.176549911499023, "global_step": 52217, "epoch": 629} {"train_loss": -19.65876579284668, "global_step": 52218, "epoch": 629} {"train_loss": -19.95436668395996, "global_step": 52219, "epoch": 629} {"train_loss": -19.492727279663086, "global_step": 52220, "epoch": 629} {"train_loss": -19.6231746673584, "global_step": 52221, "epoch": 629} {"train_loss": -19.95796775817871, "global_step": 52222, "epoch": 629} {"train_loss": -19.92864418029785, "global_step": 52223, "epoch": 629} {"train_loss": -19.474096298217773, "global_step": 52224, "epoch": 629} {"train_loss": -19.818784713745117, "global_step": 52225, "epoch": 629} {"train_loss": -20.0264835357666, "global_step": 52226, "epoch": 629} {"train_loss": -19.829580307006836, "global_step": 52227, "epoch": 629} {"train_loss": -19.676156997680664, "global_step": 52228, "epoch": 629} {"train_loss": -20.1446533203125, "global_step": 52229, "epoch": 629} {"train_loss": -19.901906967163086, "global_step": 52230, "epoch": 629} {"train_loss": -19.797269821166992, "global_step": 52231, "epoch": 629} {"train_loss": -20.030019760131836, "global_step": 52232, "epoch": 629} {"train_loss": -20.161468505859375, "global_step": 52233, "epoch": 629} {"train_loss": -19.961450576782227, "global_step": 52234, "epoch": 629} {"train_loss": -20.082136154174805, "global_step": 52235, "epoch": 629} {"train_loss": -20.036684036254883, "global_step": 52236, "epoch": 629} {"train_loss": -20.199569702148438, "global_step": 52237, "epoch": 629} {"train_loss": -19.389266967773438, "global_step": 52238, "epoch": 629} {"train_loss": -20.161054611206055, "global_step": 52239, "epoch": 629} {"train_loss": -19.95340347290039, "global_step": 52240, "epoch": 629} {"train_loss": -20.188344955444336, "global_step": 52241, "epoch": 629} {"train_loss": -20.46339225769043, "global_step": 52242, "epoch": 629} {"train_loss": -20.108537673950195, "global_step": 52243, "epoch": 629} {"train_loss": -20.2760066986084, "global_step": 52244, "epoch": 629} {"train_loss": -19.85892677307129, "global_step": 52245, "epoch": 629} {"train_loss": -20.22041893005371, "global_step": 52246, "epoch": 629} {"train_loss": -20.0489559173584, "global_step": 52247, "epoch": 629} {"train_loss": -20.23017692565918, "global_step": 52248, "epoch": 629} {"train_loss": -20.2429256439209, "global_step": 52249, "epoch": 629} {"train_loss": -19.994619369506836, "global_step": 52250, "epoch": 629} {"train_loss": -20.2242488861084, "global_step": 52251, "epoch": 629} {"train_loss": -19.949867248535156, "global_step": 52252, "epoch": 629} {"train_loss": -19.771390914916992, "global_step": 52253, "epoch": 629} {"train_loss": -20.50722312927246, "global_step": 52254, "epoch": 629} {"train_loss": -20.235124588012695, "global_step": 52255, "epoch": 629} {"train_loss": -19.94435691833496, "global_step": 52256, "epoch": 629} {"train_loss": -19.78473472595215, "global_step": 52257, "epoch": 629} {"train_loss": -20.06656265258789, "global_step": 52258, "epoch": 629} {"train_loss": -19.338367462158203, "global_step": 52259, "epoch": 629} {"train_loss": -20.00250244140625, "global_step": 52260, "epoch": 629} {"train_loss": -19.497379302978516, "global_step": 52261, "epoch": 629} {"train_loss": -19.97627067565918, "global_step": 52262, "epoch": 629} {"train_loss": -20.012359619140625, "global_step": 52263, "epoch": 629} {"train_loss": -19.974538803100586, "global_step": 52264, "epoch": 629} {"train_loss": -19.943124771118164, "global_step": 52265, "epoch": 629} {"train_loss": -19.81983757019043, "global_step": 52266, "epoch": 629} {"train_loss": -19.770910263061523, "global_step": 52267, "epoch": 629} {"train_loss": -20.45818519592285, "global_step": 52268, "epoch": 629} {"train_loss": -19.848440170288086, "global_step": 52269, "epoch": 629} {"train_loss": -19.63262176513672, "global_step": 52270, "epoch": 629} {"train_loss": -20.358150482177734, "global_step": 52271, "epoch": 629} {"train_loss": -19.966703414916992, "global_step": 52272, "epoch": 629} {"train_loss": -19.795215606689453, "global_step": 52273, "epoch": 629} {"train_loss": -20.077390670776367, "global_step": 52274, "epoch": 629} {"train_loss": -20.041513442993164, "global_step": 52275, "epoch": 629} {"train_loss": -20.245588302612305, "global_step": 52276, "epoch": 629} {"train_loss": -19.900224685668945, "global_step": 52277, "epoch": 629} {"train_loss": -19.711393356323242, "global_step": 52278, "epoch": 629} {"train_loss": -20.028549194335938, "global_step": 52279, "epoch": 629} {"train_loss": -20.0460205078125, "global_step": 52280, "epoch": 629} {"train_loss": -20.254703521728516, "global_step": 52281, "epoch": 629} {"train_loss": -20.337495803833008, "global_step": 52282, "epoch": 629} {"train_loss": -20.04081916809082, "global_step": 52283, "epoch": 629} {"train_loss": -20.05208396911621, "global_step": 52284, "epoch": 629} {"train_loss": -19.91947364807129, "global_step": 52285, "epoch": 629} {"train_loss": -19.775705337524414, "global_step": 52286, "epoch": 629} {"train_loss": -20.003982543945312, "global_step": 52287, "epoch": 629} {"train_loss": -19.80158805847168, "global_step": 52288, "epoch": 629} {"train_loss": -19.945683513779237, "global_step": 52289, "epoch": 629, "val_loss": 5945901.0} {"train_loss": -20.090803146362305, "global_step": 52290, "epoch": 630} {"train_loss": -20.06578254699707, "global_step": 52291, "epoch": 630} {"train_loss": -19.27115821838379, "global_step": 52292, "epoch": 630} {"train_loss": -19.988428115844727, "global_step": 52293, "epoch": 630} {"train_loss": -19.881778717041016, "global_step": 52294, "epoch": 630} {"train_loss": -19.899436950683594, "global_step": 52295, "epoch": 630} {"train_loss": -19.952667236328125, "global_step": 52296, "epoch": 630} {"train_loss": -19.822845458984375, "global_step": 52297, "epoch": 630} {"train_loss": -20.079946517944336, "global_step": 52298, "epoch": 630} {"train_loss": -19.951745986938477, "global_step": 52299, "epoch": 630} {"train_loss": -20.0407657623291, "global_step": 52300, "epoch": 630} {"train_loss": -20.124765396118164, "global_step": 52301, "epoch": 630} {"train_loss": -20.405363082885742, "global_step": 52302, "epoch": 630} {"train_loss": -19.972536087036133, "global_step": 52303, "epoch": 630} {"train_loss": -20.010007858276367, "global_step": 52304, "epoch": 630} {"train_loss": -20.313600540161133, "global_step": 52305, "epoch": 630} {"train_loss": -19.559741973876953, "global_step": 52306, "epoch": 630} {"train_loss": -20.163724899291992, "global_step": 52307, "epoch": 630} {"train_loss": -20.053720474243164, "global_step": 52308, "epoch": 630} {"train_loss": -20.15964126586914, "global_step": 52309, "epoch": 630} {"train_loss": -20.28143310546875, "global_step": 52310, "epoch": 630} {"train_loss": -20.017614364624023, "global_step": 52311, "epoch": 630} {"train_loss": -20.1602840423584, "global_step": 52312, "epoch": 630} {"train_loss": -20.31232261657715, "global_step": 52313, "epoch": 630} {"train_loss": -19.987394332885742, "global_step": 52314, "epoch": 630} {"train_loss": -19.992080688476562, "global_step": 52315, "epoch": 630} {"train_loss": -19.937971115112305, "global_step": 52316, "epoch": 630} {"train_loss": -19.730194091796875, "global_step": 52317, "epoch": 630} {"train_loss": -20.375274658203125, "global_step": 52318, "epoch": 630} {"train_loss": -19.73074722290039, "global_step": 52319, "epoch": 630} {"train_loss": -20.162691116333008, "global_step": 52320, "epoch": 630} {"train_loss": -19.85205078125, "global_step": 52321, "epoch": 630} {"train_loss": -19.87472915649414, "global_step": 52322, "epoch": 630} {"train_loss": -20.043792724609375, "global_step": 52323, "epoch": 630} {"train_loss": -20.25048828125, "global_step": 52324, "epoch": 630} {"train_loss": -20.180423736572266, "global_step": 52325, "epoch": 630} {"train_loss": -20.24798583984375, "global_step": 52326, "epoch": 630} {"train_loss": -20.280231475830078, "global_step": 52327, "epoch": 630} {"train_loss": -20.072904586791992, "global_step": 52328, "epoch": 630} {"train_loss": -19.866477966308594, "global_step": 52329, "epoch": 630} {"train_loss": -19.980031967163086, "global_step": 52330, "epoch": 630} {"train_loss": -20.296533584594727, "global_step": 52331, "epoch": 630} {"train_loss": -20.051021575927734, "global_step": 52332, "epoch": 630} {"train_loss": -19.946949005126953, "global_step": 52333, "epoch": 630} {"train_loss": -19.836095809936523, "global_step": 52334, "epoch": 630} {"train_loss": -19.953655242919922, "global_step": 52335, "epoch": 630} {"train_loss": -20.457059860229492, "global_step": 52336, "epoch": 630} {"train_loss": -19.915021896362305, "global_step": 52337, "epoch": 630} {"train_loss": -20.25429916381836, "global_step": 52338, "epoch": 630} {"train_loss": -20.23494529724121, "global_step": 52339, "epoch": 630} {"train_loss": -20.294178009033203, "global_step": 52340, "epoch": 630} {"train_loss": -20.089324951171875, "global_step": 52341, "epoch": 630} {"train_loss": -20.474607467651367, "global_step": 52342, "epoch": 630} {"train_loss": -19.590961456298828, "global_step": 52343, "epoch": 630} {"train_loss": -19.933666229248047, "global_step": 52344, "epoch": 630} {"train_loss": -20.016101837158203, "global_step": 52345, "epoch": 630} {"train_loss": -19.74272346496582, "global_step": 52346, "epoch": 630} {"train_loss": -19.82696533203125, "global_step": 52347, "epoch": 630} {"train_loss": -19.677507400512695, "global_step": 52348, "epoch": 630} {"train_loss": -20.229650497436523, "global_step": 52349, "epoch": 630} {"train_loss": -19.942049026489258, "global_step": 52350, "epoch": 630} {"train_loss": -19.98211669921875, "global_step": 52351, "epoch": 630} {"train_loss": -19.794681549072266, "global_step": 52352, "epoch": 630} {"train_loss": -20.101530075073242, "global_step": 52353, "epoch": 630} {"train_loss": -19.893028259277344, "global_step": 52354, "epoch": 630} {"train_loss": -20.081480026245117, "global_step": 52355, "epoch": 630} {"train_loss": -19.81995964050293, "global_step": 52356, "epoch": 630} {"train_loss": -19.913118362426758, "global_step": 52357, "epoch": 630} {"train_loss": -20.003713607788086, "global_step": 52358, "epoch": 630} {"train_loss": -20.017255783081055, "global_step": 52359, "epoch": 630} {"train_loss": -20.173490524291992, "global_step": 52360, "epoch": 630} {"train_loss": -20.033567428588867, "global_step": 52361, "epoch": 630} {"train_loss": -20.155229568481445, "global_step": 52362, "epoch": 630} {"train_loss": -19.75363540649414, "global_step": 52363, "epoch": 630} {"train_loss": -20.078292846679688, "global_step": 52364, "epoch": 630} {"train_loss": -20.241907119750977, "global_step": 52365, "epoch": 630} {"train_loss": -20.188562393188477, "global_step": 52366, "epoch": 630} {"train_loss": -20.015769958496094, "global_step": 52367, "epoch": 630} {"train_loss": -19.849843978881836, "global_step": 52368, "epoch": 630} {"train_loss": -19.77217674255371, "global_step": 52369, "epoch": 630} {"train_loss": -19.984561920166016, "global_step": 52370, "epoch": 630} {"train_loss": -20.018535614013672, "global_step": 52371, "epoch": 630} {"train_loss": -20.031198225825666, "global_step": 52372, "epoch": 630, "val_loss": 6035386.0} {"train_loss": -19.77314567565918, "global_step": 52373, "epoch": 631} {"train_loss": -19.996511459350586, "global_step": 52374, "epoch": 631} {"train_loss": -19.9146671295166, "global_step": 52375, "epoch": 631} {"train_loss": -20.036880493164062, "global_step": 52376, "epoch": 631} {"train_loss": -19.63736915588379, "global_step": 52377, "epoch": 631} {"train_loss": -19.555952072143555, "global_step": 52378, "epoch": 631} {"train_loss": -19.512786865234375, "global_step": 52379, "epoch": 631} {"train_loss": -19.747495651245117, "global_step": 52380, "epoch": 631} {"train_loss": -19.959609985351562, "global_step": 52381, "epoch": 631} {"train_loss": -19.79186248779297, "global_step": 52382, "epoch": 631} {"train_loss": -19.919769287109375, "global_step": 52383, "epoch": 631} {"train_loss": -20.202238082885742, "global_step": 52384, "epoch": 631} {"train_loss": -20.01767921447754, "global_step": 52385, "epoch": 631} {"train_loss": -20.247167587280273, "global_step": 52386, "epoch": 631} {"train_loss": -19.882068634033203, "global_step": 52387, "epoch": 631} {"train_loss": -19.764286041259766, "global_step": 52388, "epoch": 631} {"train_loss": -20.054601669311523, "global_step": 52389, "epoch": 631} {"train_loss": -20.052433013916016, "global_step": 52390, "epoch": 631} {"train_loss": -19.82932472229004, "global_step": 52391, "epoch": 631} {"train_loss": -20.045621871948242, "global_step": 52392, "epoch": 631} {"train_loss": -19.938955307006836, "global_step": 52393, "epoch": 631} {"train_loss": -20.016788482666016, "global_step": 52394, "epoch": 631} {"train_loss": -20.208969116210938, "global_step": 52395, "epoch": 631} {"train_loss": -20.115570068359375, "global_step": 52396, "epoch": 631} {"train_loss": -20.140945434570312, "global_step": 52397, "epoch": 631} {"train_loss": -19.92476463317871, "global_step": 52398, "epoch": 631} {"train_loss": -20.216480255126953, "global_step": 52399, "epoch": 631} {"train_loss": -20.30514144897461, "global_step": 52400, "epoch": 631} {"train_loss": -20.289289474487305, "global_step": 52401, "epoch": 631} {"train_loss": -20.101083755493164, "global_step": 52402, "epoch": 631} {"train_loss": -19.990375518798828, "global_step": 52403, "epoch": 631} {"train_loss": -19.706151962280273, "global_step": 52404, "epoch": 631} {"train_loss": -20.099380493164062, "global_step": 52405, "epoch": 631} {"train_loss": -19.80307960510254, "global_step": 52406, "epoch": 631} {"train_loss": -20.21396827697754, "global_step": 52407, "epoch": 631} {"train_loss": -20.301156997680664, "global_step": 52408, "epoch": 631} {"train_loss": -20.003293991088867, "global_step": 52409, "epoch": 631} {"train_loss": -20.123443603515625, "global_step": 52410, "epoch": 631} {"train_loss": -19.80470085144043, "global_step": 52411, "epoch": 631} {"train_loss": -20.347410202026367, "global_step": 52412, "epoch": 631} {"train_loss": -20.443368911743164, "global_step": 52413, "epoch": 631} {"train_loss": -19.9974422454834, "global_step": 52414, "epoch": 631} {"train_loss": -20.126333236694336, "global_step": 52415, "epoch": 631} {"train_loss": -20.16858673095703, "global_step": 52416, "epoch": 631} {"train_loss": -20.14052391052246, "global_step": 52417, "epoch": 631} {"train_loss": -19.94496726989746, "global_step": 52418, "epoch": 631} {"train_loss": -19.94339370727539, "global_step": 52419, "epoch": 631} {"train_loss": -20.035751342773438, "global_step": 52420, "epoch": 631} {"train_loss": -20.387624740600586, "global_step": 52421, "epoch": 631} {"train_loss": -20.12955665588379, "global_step": 52422, "epoch": 631} {"train_loss": -20.03510856628418, "global_step": 52423, "epoch": 631} {"train_loss": -19.866968154907227, "global_step": 52424, "epoch": 631} {"train_loss": -20.085233688354492, "global_step": 52425, "epoch": 631} {"train_loss": -20.00740623474121, "global_step": 52426, "epoch": 631} {"train_loss": -19.921384811401367, "global_step": 52427, "epoch": 631} {"train_loss": -19.907129287719727, "global_step": 52428, "epoch": 631} {"train_loss": -20.194448471069336, "global_step": 52429, "epoch": 631} {"train_loss": -20.317413330078125, "global_step": 52430, "epoch": 631} {"train_loss": -19.817373275756836, "global_step": 52431, "epoch": 631} {"train_loss": -20.185001373291016, "global_step": 52432, "epoch": 631} {"train_loss": -20.241886138916016, "global_step": 52433, "epoch": 631} {"train_loss": -20.16942024230957, "global_step": 52434, "epoch": 631} {"train_loss": -19.98105239868164, "global_step": 52435, "epoch": 631} {"train_loss": -19.78512954711914, "global_step": 52436, "epoch": 631} {"train_loss": -19.983997344970703, "global_step": 52437, "epoch": 631} {"train_loss": -19.82807731628418, "global_step": 52438, "epoch": 631} {"train_loss": -19.621822357177734, "global_step": 52439, "epoch": 631} {"train_loss": -20.10692596435547, "global_step": 52440, "epoch": 631} {"train_loss": -20.117551803588867, "global_step": 52441, "epoch": 631} {"train_loss": -20.06494140625, "global_step": 52442, "epoch": 631} {"train_loss": -20.259971618652344, "global_step": 52443, "epoch": 631} {"train_loss": -19.946121215820312, "global_step": 52444, "epoch": 631} {"train_loss": -20.027708053588867, "global_step": 52445, "epoch": 631} {"train_loss": -19.563735961914062, "global_step": 52446, "epoch": 631} {"train_loss": -19.907398223876953, "global_step": 52447, "epoch": 631} {"train_loss": -20.114330291748047, "global_step": 52448, "epoch": 631} {"train_loss": -19.944307327270508, "global_step": 52449, "epoch": 631} {"train_loss": -20.152694702148438, "global_step": 52450, "epoch": 631} {"train_loss": -20.193113327026367, "global_step": 52451, "epoch": 631} {"train_loss": -20.13057518005371, "global_step": 52452, "epoch": 631} {"train_loss": -20.12258529663086, "global_step": 52453, "epoch": 631} {"train_loss": -20.22467041015625, "global_step": 52454, "epoch": 631} {"train_loss": -20.019685906099987, "global_step": 52455, "epoch": 631, "val_loss": 5980127.0} {"train_loss": -20.13201904296875, "global_step": 52456, "epoch": 632} {"train_loss": -20.075712203979492, "global_step": 52457, "epoch": 632} {"train_loss": -19.892072677612305, "global_step": 52458, "epoch": 632} {"train_loss": -20.1393985748291, "global_step": 52459, "epoch": 632} {"train_loss": -19.68661880493164, "global_step": 52460, "epoch": 632} {"train_loss": -19.668310165405273, "global_step": 52461, "epoch": 632} {"train_loss": -20.092798233032227, "global_step": 52462, "epoch": 632} {"train_loss": -20.16114616394043, "global_step": 52463, "epoch": 632} {"train_loss": -20.089262008666992, "global_step": 52464, "epoch": 632} {"train_loss": -19.90398406982422, "global_step": 52465, "epoch": 632} {"train_loss": -20.390531539916992, "global_step": 52466, "epoch": 632} {"train_loss": -20.037063598632812, "global_step": 52467, "epoch": 632} {"train_loss": -19.9591121673584, "global_step": 52468, "epoch": 632} {"train_loss": -19.973621368408203, "global_step": 52469, "epoch": 632} {"train_loss": -19.823551177978516, "global_step": 52470, "epoch": 632} {"train_loss": -20.096111297607422, "global_step": 52471, "epoch": 632} {"train_loss": -20.350173950195312, "global_step": 52472, "epoch": 632} {"train_loss": -19.883161544799805, "global_step": 52473, "epoch": 632} {"train_loss": -20.0466365814209, "global_step": 52474, "epoch": 632} {"train_loss": -20.00192642211914, "global_step": 52475, "epoch": 632} {"train_loss": -20.522552490234375, "global_step": 52476, "epoch": 632} {"train_loss": -20.106061935424805, "global_step": 52477, "epoch": 632} {"train_loss": -19.84974479675293, "global_step": 52478, "epoch": 632} {"train_loss": -19.84815788269043, "global_step": 52479, "epoch": 632} {"train_loss": -20.10807991027832, "global_step": 52480, "epoch": 632} {"train_loss": -19.834806442260742, "global_step": 52481, "epoch": 632} {"train_loss": -20.25311851501465, "global_step": 52482, "epoch": 632} {"train_loss": -19.863826751708984, "global_step": 52483, "epoch": 632} {"train_loss": -20.117725372314453, "global_step": 52484, "epoch": 632} {"train_loss": -19.789358139038086, "global_step": 52485, "epoch": 632} {"train_loss": -20.15009117126465, "global_step": 52486, "epoch": 632} {"train_loss": -19.582046508789062, "global_step": 52487, "epoch": 632} {"train_loss": -19.76900291442871, "global_step": 52488, "epoch": 632} {"train_loss": -20.33967399597168, "global_step": 52489, "epoch": 632} {"train_loss": -20.01962661743164, "global_step": 52490, "epoch": 632} {"train_loss": -20.236194610595703, "global_step": 52491, "epoch": 632} {"train_loss": -20.46589469909668, "global_step": 52492, "epoch": 632} {"train_loss": -19.821456909179688, "global_step": 52493, "epoch": 632} {"train_loss": -20.097698211669922, "global_step": 52494, "epoch": 632} {"train_loss": -20.3643856048584, "global_step": 52495, "epoch": 632} {"train_loss": -19.868505477905273, "global_step": 52496, "epoch": 632} {"train_loss": -20.284250259399414, "global_step": 52497, "epoch": 632} {"train_loss": -20.139469146728516, "global_step": 52498, "epoch": 632} {"train_loss": -20.06682777404785, "global_step": 52499, "epoch": 632} {"train_loss": -20.080480575561523, "global_step": 52500, "epoch": 632} {"train_loss": -20.243457794189453, "global_step": 52501, "epoch": 632} {"train_loss": -20.39581298828125, "global_step": 52502, "epoch": 632} {"train_loss": -19.565229415893555, "global_step": 52503, "epoch": 632} {"train_loss": -20.223743438720703, "global_step": 52504, "epoch": 632} {"train_loss": -19.959247589111328, "global_step": 52505, "epoch": 632} {"train_loss": -19.3421573638916, "global_step": 52506, "epoch": 632} {"train_loss": -20.097518920898438, "global_step": 52507, "epoch": 632} {"train_loss": -19.91254234313965, "global_step": 52508, "epoch": 632} {"train_loss": -20.144245147705078, "global_step": 52509, "epoch": 632} {"train_loss": -19.988515853881836, "global_step": 52510, "epoch": 632} {"train_loss": -19.8750057220459, "global_step": 52511, "epoch": 632} {"train_loss": -19.998245239257812, "global_step": 52512, "epoch": 632} {"train_loss": -19.9280948638916, "global_step": 52513, "epoch": 632} {"train_loss": -19.8966064453125, "global_step": 52514, "epoch": 632} {"train_loss": -19.866777420043945, "global_step": 52515, "epoch": 632} {"train_loss": -20.135787963867188, "global_step": 52516, "epoch": 632} {"train_loss": -20.191312789916992, "global_step": 52517, "epoch": 632} {"train_loss": -19.893186569213867, "global_step": 52518, "epoch": 632} {"train_loss": -20.198410034179688, "global_step": 52519, "epoch": 632} {"train_loss": -19.774938583374023, "global_step": 52520, "epoch": 632} {"train_loss": -19.968393325805664, "global_step": 52521, "epoch": 632} {"train_loss": -19.374723434448242, "global_step": 52522, "epoch": 632} {"train_loss": -20.06732749938965, "global_step": 52523, "epoch": 632} {"train_loss": -19.951562881469727, "global_step": 52524, "epoch": 632} {"train_loss": -20.369932174682617, "global_step": 52525, "epoch": 632} {"train_loss": -20.186071395874023, "global_step": 52526, "epoch": 632} {"train_loss": -20.0133056640625, "global_step": 52527, "epoch": 632} {"train_loss": -20.171884536743164, "global_step": 52528, "epoch": 632} {"train_loss": -19.97941017150879, "global_step": 52529, "epoch": 632} {"train_loss": -20.017480850219727, "global_step": 52530, "epoch": 632} {"train_loss": -19.682126998901367, "global_step": 52531, "epoch": 632} {"train_loss": -20.018232345581055, "global_step": 52532, "epoch": 632} {"train_loss": -20.17742347717285, "global_step": 52533, "epoch": 632} {"train_loss": -19.9500732421875, "global_step": 52534, "epoch": 632} {"train_loss": -19.823711395263672, "global_step": 52535, "epoch": 632} {"train_loss": -20.40104866027832, "global_step": 52536, "epoch": 632} {"train_loss": -19.9271240234375, "global_step": 52537, "epoch": 632} {"train_loss": -20.02596379475421, "global_step": 52538, "epoch": 632, "val_loss": 6104868.5} {"train_loss": -19.90981101989746, "global_step": 52539, "epoch": 633} {"train_loss": -19.699970245361328, "global_step": 52540, "epoch": 633} {"train_loss": -19.751895904541016, "global_step": 52541, "epoch": 633} {"train_loss": -19.952177047729492, "global_step": 52542, "epoch": 633} {"train_loss": -20.07355308532715, "global_step": 52543, "epoch": 633} {"train_loss": -20.272329330444336, "global_step": 52544, "epoch": 633} {"train_loss": -20.51137351989746, "global_step": 52545, "epoch": 633} {"train_loss": -19.481809616088867, "global_step": 52546, "epoch": 633} {"train_loss": -20.479246139526367, "global_step": 52547, "epoch": 633} {"train_loss": -19.74136734008789, "global_step": 52548, "epoch": 633} {"train_loss": -19.722013473510742, "global_step": 52549, "epoch": 633} {"train_loss": -20.068544387817383, "global_step": 52550, "epoch": 633} {"train_loss": -20.51022720336914, "global_step": 52551, "epoch": 633} {"train_loss": -19.847360610961914, "global_step": 52552, "epoch": 633} {"train_loss": -20.372190475463867, "global_step": 52553, "epoch": 633} {"train_loss": -20.435476303100586, "global_step": 52554, "epoch": 633} {"train_loss": -20.393436431884766, "global_step": 52555, "epoch": 633} {"train_loss": -19.888898849487305, "global_step": 52556, "epoch": 633} {"train_loss": -19.89381980895996, "global_step": 52557, "epoch": 633} {"train_loss": -20.025516510009766, "global_step": 52558, "epoch": 633} {"train_loss": -20.221237182617188, "global_step": 52559, "epoch": 633} {"train_loss": -19.712039947509766, "global_step": 52560, "epoch": 633} {"train_loss": -20.093793869018555, "global_step": 52561, "epoch": 633} {"train_loss": -20.201032638549805, "global_step": 52562, "epoch": 633} {"train_loss": -20.005746841430664, "global_step": 52563, "epoch": 633} {"train_loss": -19.796964645385742, "global_step": 52564, "epoch": 633} {"train_loss": -20.005756378173828, "global_step": 52565, "epoch": 633} {"train_loss": -20.355674743652344, "global_step": 52566, "epoch": 633} {"train_loss": -19.914220809936523, "global_step": 52567, "epoch": 633} {"train_loss": -20.08268165588379, "global_step": 52568, "epoch": 633} {"train_loss": -20.207801818847656, "global_step": 52569, "epoch": 633} {"train_loss": -19.893840789794922, "global_step": 52570, "epoch": 633} {"train_loss": -20.00548553466797, "global_step": 52571, "epoch": 633} {"train_loss": -20.19789695739746, "global_step": 52572, "epoch": 633} {"train_loss": -20.104928970336914, "global_step": 52573, "epoch": 633} {"train_loss": -20.3692684173584, "global_step": 52574, "epoch": 633} {"train_loss": -20.315242767333984, "global_step": 52575, "epoch": 633} {"train_loss": -20.188220977783203, "global_step": 52576, "epoch": 633} {"train_loss": -20.651731491088867, "global_step": 52577, "epoch": 633} {"train_loss": -20.111257553100586, "global_step": 52578, "epoch": 633} {"train_loss": -19.969039916992188, "global_step": 52579, "epoch": 633} {"train_loss": -20.205930709838867, "global_step": 52580, "epoch": 633} {"train_loss": -20.454227447509766, "global_step": 52581, "epoch": 633} {"train_loss": -20.127370834350586, "global_step": 52582, "epoch": 633} {"train_loss": -20.31273078918457, "global_step": 52583, "epoch": 633} {"train_loss": -20.054096221923828, "global_step": 52584, "epoch": 633} {"train_loss": -20.16238021850586, "global_step": 52585, "epoch": 633} {"train_loss": -19.70526695251465, "global_step": 52586, "epoch": 633} {"train_loss": -19.870067596435547, "global_step": 52587, "epoch": 633} {"train_loss": -20.095703125, "global_step": 52588, "epoch": 633} {"train_loss": -20.253406524658203, "global_step": 52589, "epoch": 633} {"train_loss": -19.935531616210938, "global_step": 52590, "epoch": 633} {"train_loss": -19.86947250366211, "global_step": 52591, "epoch": 633} {"train_loss": -19.98956298828125, "global_step": 52592, "epoch": 633} {"train_loss": -19.784656524658203, "global_step": 52593, "epoch": 633} {"train_loss": -20.324237823486328, "global_step": 52594, "epoch": 633} {"train_loss": -19.852924346923828, "global_step": 52595, "epoch": 633} {"train_loss": -19.946706771850586, "global_step": 52596, "epoch": 633} {"train_loss": -19.761188507080078, "global_step": 52597, "epoch": 633} {"train_loss": -20.18671989440918, "global_step": 52598, "epoch": 633} {"train_loss": -19.901615142822266, "global_step": 52599, "epoch": 633} {"train_loss": -20.070327758789062, "global_step": 52600, "epoch": 633} {"train_loss": -19.787160873413086, "global_step": 52601, "epoch": 633} {"train_loss": -20.17787742614746, "global_step": 52602, "epoch": 633} {"train_loss": -19.920495986938477, "global_step": 52603, "epoch": 633} {"train_loss": -19.888813018798828, "global_step": 52604, "epoch": 633} {"train_loss": -20.37820053100586, "global_step": 52605, "epoch": 633} {"train_loss": -20.159677505493164, "global_step": 52606, "epoch": 633} {"train_loss": -20.08989906311035, "global_step": 52607, "epoch": 633} {"train_loss": -19.926076889038086, "global_step": 52608, "epoch": 633} {"train_loss": -20.10628318786621, "global_step": 52609, "epoch": 633} {"train_loss": -20.10404396057129, "global_step": 52610, "epoch": 633} {"train_loss": -20.20054817199707, "global_step": 52611, "epoch": 633} {"train_loss": -20.171756744384766, "global_step": 52612, "epoch": 633} {"train_loss": -20.174718856811523, "global_step": 52613, "epoch": 633} {"train_loss": -20.05759048461914, "global_step": 52614, "epoch": 633} {"train_loss": -20.34688949584961, "global_step": 52615, "epoch": 633} {"train_loss": -19.948436737060547, "global_step": 52616, "epoch": 633} {"train_loss": -20.022470474243164, "global_step": 52617, "epoch": 633} {"train_loss": -20.138303756713867, "global_step": 52618, "epoch": 633} {"train_loss": -20.089035034179688, "global_step": 52619, "epoch": 633} {"train_loss": -20.200716018676758, "global_step": 52620, "epoch": 633} {"train_loss": -20.06717661202672, "global_step": 52621, "epoch": 633, "val_loss": 6080358.5} {"train_loss": -19.136962890625, "global_step": 52622, "epoch": 634} {"train_loss": -20.356704711914062, "global_step": 52623, "epoch": 634} {"train_loss": -19.660688400268555, "global_step": 52624, "epoch": 634} {"train_loss": -19.853727340698242, "global_step": 52625, "epoch": 634} {"train_loss": -19.45587158203125, "global_step": 52626, "epoch": 634} {"train_loss": -19.91727638244629, "global_step": 52627, "epoch": 634} {"train_loss": -19.465715408325195, "global_step": 52628, "epoch": 634} {"train_loss": -19.89690589904785, "global_step": 52629, "epoch": 634} {"train_loss": -19.571195602416992, "global_step": 52630, "epoch": 634} {"train_loss": -20.093250274658203, "global_step": 52631, "epoch": 634} {"train_loss": -19.72319984436035, "global_step": 52632, "epoch": 634} {"train_loss": -20.01812744140625, "global_step": 52633, "epoch": 634} {"train_loss": -19.63779640197754, "global_step": 52634, "epoch": 634} {"train_loss": -19.563371658325195, "global_step": 52635, "epoch": 634} {"train_loss": -19.90250015258789, "global_step": 52636, "epoch": 634} {"train_loss": -20.114471435546875, "global_step": 52637, "epoch": 634} {"train_loss": -19.609365463256836, "global_step": 52638, "epoch": 634} {"train_loss": -19.8428897857666, "global_step": 52639, "epoch": 634} {"train_loss": -19.622760772705078, "global_step": 52640, "epoch": 634} {"train_loss": -20.264495849609375, "global_step": 52641, "epoch": 634} {"train_loss": -19.712474822998047, "global_step": 52642, "epoch": 634} {"train_loss": -19.827713012695312, "global_step": 52643, "epoch": 634} {"train_loss": -20.086822509765625, "global_step": 52644, "epoch": 634} {"train_loss": -20.182086944580078, "global_step": 52645, "epoch": 634} {"train_loss": -20.118602752685547, "global_step": 52646, "epoch": 634} {"train_loss": -19.779077529907227, "global_step": 52647, "epoch": 634} {"train_loss": -20.113971710205078, "global_step": 52648, "epoch": 634} {"train_loss": -19.770336151123047, "global_step": 52649, "epoch": 634} {"train_loss": -19.872011184692383, "global_step": 52650, "epoch": 634} {"train_loss": -20.294885635375977, "global_step": 52651, "epoch": 634} {"train_loss": -19.7032470703125, "global_step": 52652, "epoch": 634} {"train_loss": -19.84357261657715, "global_step": 52653, "epoch": 634} {"train_loss": -20.18710708618164, "global_step": 52654, "epoch": 634} {"train_loss": -19.938867568969727, "global_step": 52655, "epoch": 634} {"train_loss": -19.730085372924805, "global_step": 52656, "epoch": 634} {"train_loss": -19.96048355102539, "global_step": 52657, "epoch": 634} {"train_loss": -20.038190841674805, "global_step": 52658, "epoch": 634} {"train_loss": -19.82167625427246, "global_step": 52659, "epoch": 634} {"train_loss": -20.147329330444336, "global_step": 52660, "epoch": 634} {"train_loss": -20.075735092163086, "global_step": 52661, "epoch": 634} {"train_loss": -19.88894271850586, "global_step": 52662, "epoch": 634} {"train_loss": -19.894350051879883, "global_step": 52663, "epoch": 634} {"train_loss": -20.267698287963867, "global_step": 52664, "epoch": 634} {"train_loss": -20.16749382019043, "global_step": 52665, "epoch": 634} {"train_loss": -20.097253799438477, "global_step": 52666, "epoch": 634} {"train_loss": -20.24393653869629, "global_step": 52667, "epoch": 634} {"train_loss": -19.889493942260742, "global_step": 52668, "epoch": 634} {"train_loss": -20.304847717285156, "global_step": 52669, "epoch": 634} {"train_loss": -19.88748550415039, "global_step": 52670, "epoch": 634} {"train_loss": -20.114622116088867, "global_step": 52671, "epoch": 634} {"train_loss": -20.128828048706055, "global_step": 52672, "epoch": 634} {"train_loss": -19.75119972229004, "global_step": 52673, "epoch": 634} {"train_loss": -20.00508689880371, "global_step": 52674, "epoch": 634} {"train_loss": -19.921655654907227, "global_step": 52675, "epoch": 634} {"train_loss": -20.38918113708496, "global_step": 52676, "epoch": 634} {"train_loss": -19.692533493041992, "global_step": 52677, "epoch": 634} {"train_loss": -20.05067253112793, "global_step": 52678, "epoch": 634} {"train_loss": -19.8396053314209, "global_step": 52679, "epoch": 634} {"train_loss": -19.969379425048828, "global_step": 52680, "epoch": 634} {"train_loss": -20.074865341186523, "global_step": 52681, "epoch": 634} {"train_loss": -20.033079147338867, "global_step": 52682, "epoch": 634} {"train_loss": -20.238065719604492, "global_step": 52683, "epoch": 634} {"train_loss": -20.021133422851562, "global_step": 52684, "epoch": 634} {"train_loss": -19.717702865600586, "global_step": 52685, "epoch": 634} {"train_loss": -20.062868118286133, "global_step": 52686, "epoch": 634} {"train_loss": -19.89715003967285, "global_step": 52687, "epoch": 634} {"train_loss": -20.3856258392334, "global_step": 52688, "epoch": 634} {"train_loss": -20.12981414794922, "global_step": 52689, "epoch": 634} {"train_loss": -20.267507553100586, "global_step": 52690, "epoch": 634} {"train_loss": -20.026887893676758, "global_step": 52691, "epoch": 634} {"train_loss": -20.277185440063477, "global_step": 52692, "epoch": 634} {"train_loss": -20.48249626159668, "global_step": 52693, "epoch": 634} {"train_loss": -19.9023494720459, "global_step": 52694, "epoch": 634} {"train_loss": -19.96923828125, "global_step": 52695, "epoch": 634} {"train_loss": -20.035924911499023, "global_step": 52696, "epoch": 634} {"train_loss": -20.319955825805664, "global_step": 52697, "epoch": 634} {"train_loss": -20.21327018737793, "global_step": 52698, "epoch": 634} {"train_loss": -20.016977310180664, "global_step": 52699, "epoch": 634} {"train_loss": -19.813039779663086, "global_step": 52700, "epoch": 634} {"train_loss": -19.89993667602539, "global_step": 52701, "epoch": 634} {"train_loss": -20.0666446685791, "global_step": 52702, "epoch": 634} {"train_loss": -20.251731872558594, "global_step": 52703, "epoch": 634} {"train_loss": -19.966361011367248, "global_step": 52704, "epoch": 634, "val_loss": 6100602.0} {"train_loss": -20.12374496459961, "global_step": 52705, "epoch": 635} {"train_loss": -20.21772003173828, "global_step": 52706, "epoch": 635} {"train_loss": -19.822965621948242, "global_step": 52707, "epoch": 635} {"train_loss": -20.190555572509766, "global_step": 52708, "epoch": 635} {"train_loss": -20.148160934448242, "global_step": 52709, "epoch": 635} {"train_loss": -20.03307342529297, "global_step": 52710, "epoch": 635} {"train_loss": -19.98245620727539, "global_step": 52711, "epoch": 635} {"train_loss": -19.962480545043945, "global_step": 52712, "epoch": 635} {"train_loss": -19.93085289001465, "global_step": 52713, "epoch": 635} {"train_loss": -20.167390823364258, "global_step": 52714, "epoch": 635} {"train_loss": -20.483367919921875, "global_step": 52715, "epoch": 635} {"train_loss": -20.082929611206055, "global_step": 52716, "epoch": 635} {"train_loss": -19.91958999633789, "global_step": 52717, "epoch": 635} {"train_loss": -19.917760848999023, "global_step": 52718, "epoch": 635} {"train_loss": -19.795942306518555, "global_step": 52719, "epoch": 635} {"train_loss": -20.25023651123047, "global_step": 52720, "epoch": 635} {"train_loss": -19.794601440429688, "global_step": 52721, "epoch": 635} {"train_loss": -19.645050048828125, "global_step": 52722, "epoch": 635} {"train_loss": -19.638736724853516, "global_step": 52723, "epoch": 635} {"train_loss": -20.341354370117188, "global_step": 52724, "epoch": 635} {"train_loss": -20.26648712158203, "global_step": 52725, "epoch": 635} {"train_loss": -20.086938858032227, "global_step": 52726, "epoch": 635} {"train_loss": -20.225805282592773, "global_step": 52727, "epoch": 635} {"train_loss": -19.85173988342285, "global_step": 52728, "epoch": 635} {"train_loss": -19.83599281311035, "global_step": 52729, "epoch": 635} {"train_loss": -20.220144271850586, "global_step": 52730, "epoch": 635} {"train_loss": -20.336198806762695, "global_step": 52731, "epoch": 635} {"train_loss": -20.121763229370117, "global_step": 52732, "epoch": 635} {"train_loss": -20.00638771057129, "global_step": 52733, "epoch": 635} {"train_loss": -20.05274772644043, "global_step": 52734, "epoch": 635} {"train_loss": -20.26654052734375, "global_step": 52735, "epoch": 635} {"train_loss": -20.197147369384766, "global_step": 52736, "epoch": 635} {"train_loss": -20.31501579284668, "global_step": 52737, "epoch": 635} {"train_loss": -20.23788070678711, "global_step": 52738, "epoch": 635} {"train_loss": -20.194581985473633, "global_step": 52739, "epoch": 635} {"train_loss": -20.11769676208496, "global_step": 52740, "epoch": 635} {"train_loss": -20.20845603942871, "global_step": 52741, "epoch": 635} {"train_loss": -20.119237899780273, "global_step": 52742, "epoch": 635} {"train_loss": -20.36989402770996, "global_step": 52743, "epoch": 635} {"train_loss": -19.88309669494629, "global_step": 52744, "epoch": 635} {"train_loss": -19.874860763549805, "global_step": 52745, "epoch": 635} {"train_loss": -20.14297866821289, "global_step": 52746, "epoch": 635} {"train_loss": -20.329885482788086, "global_step": 52747, "epoch": 635} {"train_loss": -20.4069881439209, "global_step": 52748, "epoch": 635} {"train_loss": -19.69483757019043, "global_step": 52749, "epoch": 635} {"train_loss": -20.086627960205078, "global_step": 52750, "epoch": 635} {"train_loss": -20.1336727142334, "global_step": 52751, "epoch": 635} {"train_loss": -20.50074577331543, "global_step": 52752, "epoch": 635} {"train_loss": -19.968334197998047, "global_step": 52753, "epoch": 635} {"train_loss": -19.892824172973633, "global_step": 52754, "epoch": 635} {"train_loss": -19.761371612548828, "global_step": 52755, "epoch": 635} {"train_loss": -20.082443237304688, "global_step": 52756, "epoch": 635} {"train_loss": -20.04958152770996, "global_step": 52757, "epoch": 635} {"train_loss": -20.04154396057129, "global_step": 52758, "epoch": 635} {"train_loss": -19.79401969909668, "global_step": 52759, "epoch": 635} {"train_loss": -20.444868087768555, "global_step": 52760, "epoch": 635} {"train_loss": -20.027271270751953, "global_step": 52761, "epoch": 635} {"train_loss": -20.198810577392578, "global_step": 52762, "epoch": 635} {"train_loss": -19.889928817749023, "global_step": 52763, "epoch": 635} {"train_loss": -20.217769622802734, "global_step": 52764, "epoch": 635} {"train_loss": -20.21747398376465, "global_step": 52765, "epoch": 635} {"train_loss": -19.925636291503906, "global_step": 52766, "epoch": 635} {"train_loss": -19.9796199798584, "global_step": 52767, "epoch": 635} {"train_loss": -19.981857299804688, "global_step": 52768, "epoch": 635} {"train_loss": -20.200605392456055, "global_step": 52769, "epoch": 635} {"train_loss": -19.913389205932617, "global_step": 52770, "epoch": 635} {"train_loss": -20.207639694213867, "global_step": 52771, "epoch": 635} {"train_loss": -20.188169479370117, "global_step": 52772, "epoch": 635} {"train_loss": -20.01288604736328, "global_step": 52773, "epoch": 635} {"train_loss": -20.08977699279785, "global_step": 52774, "epoch": 635} {"train_loss": -19.89763641357422, "global_step": 52775, "epoch": 635} {"train_loss": -20.09016990661621, "global_step": 52776, "epoch": 635} {"train_loss": -20.16834831237793, "global_step": 52777, "epoch": 635} {"train_loss": -19.93760108947754, "global_step": 52778, "epoch": 635} {"train_loss": -20.13503074645996, "global_step": 52779, "epoch": 635} {"train_loss": -20.263504028320312, "global_step": 52780, "epoch": 635} {"train_loss": -20.07339859008789, "global_step": 52781, "epoch": 635} {"train_loss": -20.20341682434082, "global_step": 52782, "epoch": 635} {"train_loss": -19.709348678588867, "global_step": 52783, "epoch": 635} {"train_loss": -20.149751663208008, "global_step": 52784, "epoch": 635} {"train_loss": -19.840295791625977, "global_step": 52785, "epoch": 635} {"train_loss": -19.837024688720703, "global_step": 52786, "epoch": 635} {"train_loss": -20.06943702697754, "global_step": 52787, "epoch": 635, "val_loss": 5918437.5} {"train_loss": -20.019498825073242, "global_step": 52788, "epoch": 636} {"train_loss": -19.704702377319336, "global_step": 52789, "epoch": 636} {"train_loss": -19.755178451538086, "global_step": 52790, "epoch": 636} {"train_loss": -20.017728805541992, "global_step": 52791, "epoch": 636} {"train_loss": -20.063444137573242, "global_step": 52792, "epoch": 636} {"train_loss": -20.084457397460938, "global_step": 52793, "epoch": 636} {"train_loss": -19.651235580444336, "global_step": 52794, "epoch": 636} {"train_loss": -19.744720458984375, "global_step": 52795, "epoch": 636} {"train_loss": -19.80141258239746, "global_step": 52796, "epoch": 636} {"train_loss": -19.874608993530273, "global_step": 52797, "epoch": 636} {"train_loss": -19.765405654907227, "global_step": 52798, "epoch": 636} {"train_loss": -19.64496612548828, "global_step": 52799, "epoch": 636} {"train_loss": -20.034778594970703, "global_step": 52800, "epoch": 636} {"train_loss": -19.705923080444336, "global_step": 52801, "epoch": 636} {"train_loss": -19.658506393432617, "global_step": 52802, "epoch": 636} {"train_loss": -19.94905662536621, "global_step": 52803, "epoch": 636} {"train_loss": -20.13593864440918, "global_step": 52804, "epoch": 636} {"train_loss": -20.21675682067871, "global_step": 52805, "epoch": 636} {"train_loss": -19.957901000976562, "global_step": 52806, "epoch": 636} {"train_loss": -20.37421226501465, "global_step": 52807, "epoch": 636} {"train_loss": -19.961261749267578, "global_step": 52808, "epoch": 636} {"train_loss": -20.036470413208008, "global_step": 52809, "epoch": 636} {"train_loss": -19.99492835998535, "global_step": 52810, "epoch": 636} {"train_loss": -19.8062801361084, "global_step": 52811, "epoch": 636} {"train_loss": -20.008270263671875, "global_step": 52812, "epoch": 636} {"train_loss": -20.16924476623535, "global_step": 52813, "epoch": 636} {"train_loss": -20.297082901000977, "global_step": 52814, "epoch": 636} {"train_loss": -19.704999923706055, "global_step": 52815, "epoch": 636} {"train_loss": -20.022201538085938, "global_step": 52816, "epoch": 636} {"train_loss": -20.123159408569336, "global_step": 52817, "epoch": 636} {"train_loss": -20.137609481811523, "global_step": 52818, "epoch": 636} {"train_loss": -20.07084083557129, "global_step": 52819, "epoch": 636} {"train_loss": -19.804105758666992, "global_step": 52820, "epoch": 636} {"train_loss": -20.140628814697266, "global_step": 52821, "epoch": 636} {"train_loss": -20.255859375, "global_step": 52822, "epoch": 636} {"train_loss": -20.00006675720215, "global_step": 52823, "epoch": 636} {"train_loss": -19.91050910949707, "global_step": 52824, "epoch": 636} {"train_loss": -20.152990341186523, "global_step": 52825, "epoch": 636} {"train_loss": -19.979795455932617, "global_step": 52826, "epoch": 636} {"train_loss": -20.158470153808594, "global_step": 52827, "epoch": 636} {"train_loss": -20.139392852783203, "global_step": 52828, "epoch": 636} {"train_loss": -19.615751266479492, "global_step": 52829, "epoch": 636} {"train_loss": -19.81624984741211, "global_step": 52830, "epoch": 636} {"train_loss": -20.061553955078125, "global_step": 52831, "epoch": 636} {"train_loss": -20.119359970092773, "global_step": 52832, "epoch": 636} {"train_loss": -19.999053955078125, "global_step": 52833, "epoch": 636} {"train_loss": -20.268728256225586, "global_step": 52834, "epoch": 636} {"train_loss": -20.250051498413086, "global_step": 52835, "epoch": 636} {"train_loss": -19.964853286743164, "global_step": 52836, "epoch": 636} {"train_loss": -20.046804428100586, "global_step": 52837, "epoch": 636} {"train_loss": -20.123010635375977, "global_step": 52838, "epoch": 636} {"train_loss": -20.420738220214844, "global_step": 52839, "epoch": 636} {"train_loss": -20.436899185180664, "global_step": 52840, "epoch": 636} {"train_loss": -20.359689712524414, "global_step": 52841, "epoch": 636} {"train_loss": -19.774316787719727, "global_step": 52842, "epoch": 636} {"train_loss": -20.177091598510742, "global_step": 52843, "epoch": 636} {"train_loss": -19.984764099121094, "global_step": 52844, "epoch": 636} {"train_loss": -19.992399215698242, "global_step": 52845, "epoch": 636} {"train_loss": -19.98470115661621, "global_step": 52846, "epoch": 636} {"train_loss": -19.94203758239746, "global_step": 52847, "epoch": 636} {"train_loss": -19.98019790649414, "global_step": 52848, "epoch": 636} {"train_loss": -20.295196533203125, "global_step": 52849, "epoch": 636} {"train_loss": -20.277790069580078, "global_step": 52850, "epoch": 636} {"train_loss": -19.96330451965332, "global_step": 52851, "epoch": 636} {"train_loss": -20.038753509521484, "global_step": 52852, "epoch": 636} {"train_loss": -20.162702560424805, "global_step": 52853, "epoch": 636} {"train_loss": -19.83328628540039, "global_step": 52854, "epoch": 636} {"train_loss": -19.8013916015625, "global_step": 52855, "epoch": 636} {"train_loss": -19.65583610534668, "global_step": 52856, "epoch": 636} {"train_loss": -20.22138023376465, "global_step": 52857, "epoch": 636} {"train_loss": -20.29030418395996, "global_step": 52858, "epoch": 636} {"train_loss": -20.1846923828125, "global_step": 52859, "epoch": 636} {"train_loss": -20.014801025390625, "global_step": 52860, "epoch": 636} {"train_loss": -20.39043617248535, "global_step": 52861, "epoch": 636} {"train_loss": -20.165008544921875, "global_step": 52862, "epoch": 636} {"train_loss": -20.251182556152344, "global_step": 52863, "epoch": 636} {"train_loss": -20.118982315063477, "global_step": 52864, "epoch": 636} {"train_loss": -20.44313621520996, "global_step": 52865, "epoch": 636} {"train_loss": -20.07246971130371, "global_step": 52866, "epoch": 636} {"train_loss": -20.20943260192871, "global_step": 52867, "epoch": 636} {"train_loss": -20.146650314331055, "global_step": 52868, "epoch": 636} {"train_loss": -19.95753288269043, "global_step": 52869, "epoch": 636} {"train_loss": -20.01421087333955, "global_step": 52870, "epoch": 636, "val_loss": 6262939.0} {"train_loss": -20.135265350341797, "global_step": 52871, "epoch": 637} {"train_loss": -19.040130615234375, "global_step": 52872, "epoch": 637} {"train_loss": -19.951902389526367, "global_step": 52873, "epoch": 637} {"train_loss": -19.98000144958496, "global_step": 52874, "epoch": 637} {"train_loss": -19.738555908203125, "global_step": 52875, "epoch": 637} {"train_loss": -19.456357955932617, "global_step": 52876, "epoch": 637} {"train_loss": -19.56088638305664, "global_step": 52877, "epoch": 637} {"train_loss": -19.82988739013672, "global_step": 52878, "epoch": 637} {"train_loss": -19.436574935913086, "global_step": 52879, "epoch": 637} {"train_loss": -20.074953079223633, "global_step": 52880, "epoch": 637} {"train_loss": -19.823095321655273, "global_step": 52881, "epoch": 637} {"train_loss": -19.652252197265625, "global_step": 52882, "epoch": 637} {"train_loss": -19.87118911743164, "global_step": 52883, "epoch": 637} {"train_loss": -19.596464157104492, "global_step": 52884, "epoch": 637} {"train_loss": -19.4725284576416, "global_step": 52885, "epoch": 637} {"train_loss": -19.844491958618164, "global_step": 52886, "epoch": 637} {"train_loss": -19.93178367614746, "global_step": 52887, "epoch": 637} {"train_loss": -20.007965087890625, "global_step": 52888, "epoch": 637} {"train_loss": -19.89164161682129, "global_step": 52889, "epoch": 637} {"train_loss": -19.662912368774414, "global_step": 52890, "epoch": 637} {"train_loss": -19.78849220275879, "global_step": 52891, "epoch": 637} {"train_loss": -19.81153678894043, "global_step": 52892, "epoch": 637} {"train_loss": -19.95101547241211, "global_step": 52893, "epoch": 637} {"train_loss": -19.896413803100586, "global_step": 52894, "epoch": 637} {"train_loss": -19.998302459716797, "global_step": 52895, "epoch": 637} {"train_loss": -19.908044815063477, "global_step": 52896, "epoch": 637} {"train_loss": -19.829025268554688, "global_step": 52897, "epoch": 637} {"train_loss": -19.955564498901367, "global_step": 52898, "epoch": 637} {"train_loss": -19.572996139526367, "global_step": 52899, "epoch": 637} {"train_loss": -19.890100479125977, "global_step": 52900, "epoch": 637} {"train_loss": -19.991296768188477, "global_step": 52901, "epoch": 637} {"train_loss": -20.2506103515625, "global_step": 52902, "epoch": 637} {"train_loss": -20.54015350341797, "global_step": 52903, "epoch": 637} {"train_loss": -19.839670181274414, "global_step": 52904, "epoch": 637} {"train_loss": -20.356813430786133, "global_step": 52905, "epoch": 637} {"train_loss": -20.27225685119629, "global_step": 52906, "epoch": 637} {"train_loss": -20.31542205810547, "global_step": 52907, "epoch": 637} {"train_loss": -20.006559371948242, "global_step": 52908, "epoch": 637} {"train_loss": -19.980697631835938, "global_step": 52909, "epoch": 637} {"train_loss": -19.899688720703125, "global_step": 52910, "epoch": 637} {"train_loss": -19.96483039855957, "global_step": 52911, "epoch": 637} {"train_loss": -20.039443969726562, "global_step": 52912, "epoch": 637} {"train_loss": -19.78133773803711, "global_step": 52913, "epoch": 637} {"train_loss": -20.139541625976562, "global_step": 52914, "epoch": 637} {"train_loss": -19.839879989624023, "global_step": 52915, "epoch": 637} {"train_loss": -19.59535789489746, "global_step": 52916, "epoch": 637} {"train_loss": -19.60579490661621, "global_step": 52917, "epoch": 637} {"train_loss": -19.95929527282715, "global_step": 52918, "epoch": 637} {"train_loss": -20.360666275024414, "global_step": 52919, "epoch": 637} {"train_loss": -19.976099014282227, "global_step": 52920, "epoch": 637} {"train_loss": -19.994491577148438, "global_step": 52921, "epoch": 637} {"train_loss": -20.06064796447754, "global_step": 52922, "epoch": 637} {"train_loss": -20.03672218322754, "global_step": 52923, "epoch": 637} {"train_loss": -19.97186851501465, "global_step": 52924, "epoch": 637} {"train_loss": -20.32118034362793, "global_step": 52925, "epoch": 637} {"train_loss": -20.305526733398438, "global_step": 52926, "epoch": 637} {"train_loss": -19.94822883605957, "global_step": 52927, "epoch": 637} {"train_loss": -19.926801681518555, "global_step": 52928, "epoch": 637} {"train_loss": -20.263751983642578, "global_step": 52929, "epoch": 637} {"train_loss": -20.445526123046875, "global_step": 52930, "epoch": 637} {"train_loss": -20.184926986694336, "global_step": 52931, "epoch": 637} {"train_loss": -19.811979293823242, "global_step": 52932, "epoch": 637} {"train_loss": -19.84686851501465, "global_step": 52933, "epoch": 637} {"train_loss": -19.733184814453125, "global_step": 52934, "epoch": 637} {"train_loss": -20.406330108642578, "global_step": 52935, "epoch": 637} {"train_loss": -20.1402587890625, "global_step": 52936, "epoch": 637} {"train_loss": -20.364957809448242, "global_step": 52937, "epoch": 637} {"train_loss": -19.98378562927246, "global_step": 52938, "epoch": 637} {"train_loss": -19.94775390625, "global_step": 52939, "epoch": 637} {"train_loss": -20.301782608032227, "global_step": 52940, "epoch": 637} {"train_loss": -20.0694580078125, "global_step": 52941, "epoch": 637} {"train_loss": -20.079668045043945, "global_step": 52942, "epoch": 637} {"train_loss": -20.588058471679688, "global_step": 52943, "epoch": 637} {"train_loss": -19.767789840698242, "global_step": 52944, "epoch": 637} {"train_loss": -20.088716506958008, "global_step": 52945, "epoch": 637} {"train_loss": -19.98655128479004, "global_step": 52946, "epoch": 637} {"train_loss": -20.130674362182617, "global_step": 52947, "epoch": 637} {"train_loss": -20.026657104492188, "global_step": 52948, "epoch": 637} {"train_loss": -19.8951473236084, "global_step": 52949, "epoch": 637} {"train_loss": -19.949495315551758, "global_step": 52950, "epoch": 637} {"train_loss": -19.923730850219727, "global_step": 52951, "epoch": 637} {"train_loss": -20.05160903930664, "global_step": 52952, "epoch": 637} {"train_loss": -19.95423006724162, "global_step": 52953, "epoch": 637, "val_loss": 5878409.5} {"train_loss": -19.433679580688477, "global_step": 52954, "epoch": 638} {"train_loss": -19.51119041442871, "global_step": 52955, "epoch": 638} {"train_loss": -20.039682388305664, "global_step": 52956, "epoch": 638} {"train_loss": -19.93496322631836, "global_step": 52957, "epoch": 638} {"train_loss": -19.90032958984375, "global_step": 52958, "epoch": 638} {"train_loss": -19.78709602355957, "global_step": 52959, "epoch": 638} {"train_loss": -19.582876205444336, "global_step": 52960, "epoch": 638} {"train_loss": -19.9693546295166, "global_step": 52961, "epoch": 638} {"train_loss": -20.0045223236084, "global_step": 52962, "epoch": 638} {"train_loss": -19.707807540893555, "global_step": 52963, "epoch": 638} {"train_loss": -19.78602409362793, "global_step": 52964, "epoch": 638} {"train_loss": -19.961637496948242, "global_step": 52965, "epoch": 638} {"train_loss": -19.670255661010742, "global_step": 52966, "epoch": 638} {"train_loss": -20.173526763916016, "global_step": 52967, "epoch": 638} {"train_loss": -19.993614196777344, "global_step": 52968, "epoch": 638} {"train_loss": -19.844877243041992, "global_step": 52969, "epoch": 638} {"train_loss": -19.759981155395508, "global_step": 52970, "epoch": 638} {"train_loss": -19.908279418945312, "global_step": 52971, "epoch": 638} {"train_loss": -19.91631507873535, "global_step": 52972, "epoch": 638} {"train_loss": -19.79869270324707, "global_step": 52973, "epoch": 638} {"train_loss": -20.047576904296875, "global_step": 52974, "epoch": 638} {"train_loss": -19.615034103393555, "global_step": 52975, "epoch": 638} {"train_loss": -20.251699447631836, "global_step": 52976, "epoch": 638} {"train_loss": -19.72482681274414, "global_step": 52977, "epoch": 638} {"train_loss": -20.165746688842773, "global_step": 52978, "epoch": 638} {"train_loss": -20.056554794311523, "global_step": 52979, "epoch": 638} {"train_loss": -19.89754295349121, "global_step": 52980, "epoch": 638} {"train_loss": -19.972490310668945, "global_step": 52981, "epoch": 638} {"train_loss": -20.177066802978516, "global_step": 52982, "epoch": 638} {"train_loss": -20.0094051361084, "global_step": 52983, "epoch": 638} {"train_loss": -20.14153480529785, "global_step": 52984, "epoch": 638} {"train_loss": -20.190122604370117, "global_step": 52985, "epoch": 638} {"train_loss": -20.02386474609375, "global_step": 52986, "epoch": 638} {"train_loss": -20.325414657592773, "global_step": 52987, "epoch": 638} {"train_loss": -19.79522705078125, "global_step": 52988, "epoch": 638} {"train_loss": -20.169330596923828, "global_step": 52989, "epoch": 638} {"train_loss": -19.948999404907227, "global_step": 52990, "epoch": 638} {"train_loss": -20.3256893157959, "global_step": 52991, "epoch": 638} {"train_loss": -20.292112350463867, "global_step": 52992, "epoch": 638} {"train_loss": -20.123899459838867, "global_step": 52993, "epoch": 638} {"train_loss": -20.42354393005371, "global_step": 52994, "epoch": 638} {"train_loss": -20.106285095214844, "global_step": 52995, "epoch": 638} {"train_loss": -20.266645431518555, "global_step": 52996, "epoch": 638} {"train_loss": -20.259315490722656, "global_step": 52997, "epoch": 638} {"train_loss": -19.995939254760742, "global_step": 52998, "epoch": 638} {"train_loss": -19.861642837524414, "global_step": 52999, "epoch": 638} {"train_loss": -20.27721405029297, "global_step": 53000, "epoch": 638} {"train_loss": -20.1339054107666, "global_step": 53001, "epoch": 638} {"train_loss": -20.568632125854492, "global_step": 53002, "epoch": 638} {"train_loss": -20.246932983398438, "global_step": 53003, "epoch": 638} {"train_loss": -20.080184936523438, "global_step": 53004, "epoch": 638} {"train_loss": -20.031660079956055, "global_step": 53005, "epoch": 638} {"train_loss": -20.209081649780273, "global_step": 53006, "epoch": 638} {"train_loss": -20.180953979492188, "global_step": 53007, "epoch": 638} {"train_loss": -19.927322387695312, "global_step": 53008, "epoch": 638} {"train_loss": -20.277400970458984, "global_step": 53009, "epoch": 638} {"train_loss": -19.85859489440918, "global_step": 53010, "epoch": 638} {"train_loss": -20.135730743408203, "global_step": 53011, "epoch": 638} {"train_loss": -19.94504165649414, "global_step": 53012, "epoch": 638} {"train_loss": -19.875349044799805, "global_step": 53013, "epoch": 638} {"train_loss": -20.17634391784668, "global_step": 53014, "epoch": 638} {"train_loss": -20.006206512451172, "global_step": 53015, "epoch": 638} {"train_loss": -20.004823684692383, "global_step": 53016, "epoch": 638} {"train_loss": -19.976842880249023, "global_step": 53017, "epoch": 638} {"train_loss": -20.334638595581055, "global_step": 53018, "epoch": 638} {"train_loss": -20.17177391052246, "global_step": 53019, "epoch": 638} {"train_loss": -20.04400062561035, "global_step": 53020, "epoch": 638} {"train_loss": -20.068126678466797, "global_step": 53021, "epoch": 638} {"train_loss": -20.318984985351562, "global_step": 53022, "epoch": 638} {"train_loss": -20.113794326782227, "global_step": 53023, "epoch": 638} {"train_loss": -20.0850772857666, "global_step": 53024, "epoch": 638} {"train_loss": -20.333040237426758, "global_step": 53025, "epoch": 638} {"train_loss": -19.833391189575195, "global_step": 53026, "epoch": 638} {"train_loss": -20.11155891418457, "global_step": 53027, "epoch": 638} {"train_loss": -20.230762481689453, "global_step": 53028, "epoch": 638} {"train_loss": -20.03814697265625, "global_step": 53029, "epoch": 638} {"train_loss": -20.265533447265625, "global_step": 53030, "epoch": 638} {"train_loss": -19.79426383972168, "global_step": 53031, "epoch": 638} {"train_loss": -20.31328773498535, "global_step": 53032, "epoch": 638} {"train_loss": -20.131610870361328, "global_step": 53033, "epoch": 638} {"train_loss": -20.09811019897461, "global_step": 53034, "epoch": 638} {"train_loss": -20.31995391845703, "global_step": 53035, "epoch": 638} {"train_loss": -20.046388051596033, "global_step": 53036, "epoch": 638, "val_loss": 6166416.0} {"train_loss": -20.057767868041992, "global_step": 53037, "epoch": 639} {"train_loss": -20.406414031982422, "global_step": 53038, "epoch": 639} {"train_loss": -20.078580856323242, "global_step": 53039, "epoch": 639} {"train_loss": -20.06455421447754, "global_step": 53040, "epoch": 639} {"train_loss": -19.735898971557617, "global_step": 53041, "epoch": 639} {"train_loss": -19.993410110473633, "global_step": 53042, "epoch": 639} {"train_loss": -19.794702529907227, "global_step": 53043, "epoch": 639} {"train_loss": -19.875080108642578, "global_step": 53044, "epoch": 639} {"train_loss": -20.115476608276367, "global_step": 53045, "epoch": 639} {"train_loss": -20.288578033447266, "global_step": 53046, "epoch": 639} {"train_loss": -20.05687141418457, "global_step": 53047, "epoch": 639} {"train_loss": -19.829946517944336, "global_step": 53048, "epoch": 639} {"train_loss": -20.177400588989258, "global_step": 53049, "epoch": 639} {"train_loss": -19.992630004882812, "global_step": 53050, "epoch": 639} {"train_loss": -20.04050064086914, "global_step": 53051, "epoch": 639} {"train_loss": -20.051366806030273, "global_step": 53052, "epoch": 639} {"train_loss": -19.89296531677246, "global_step": 53053, "epoch": 639} {"train_loss": -19.954891204833984, "global_step": 53054, "epoch": 639} {"train_loss": -20.015117645263672, "global_step": 53055, "epoch": 639} {"train_loss": -20.1228084564209, "global_step": 53056, "epoch": 639} {"train_loss": -20.00938606262207, "global_step": 53057, "epoch": 639} {"train_loss": -19.856298446655273, "global_step": 53058, "epoch": 639} {"train_loss": -19.89885902404785, "global_step": 53059, "epoch": 639} {"train_loss": -19.943984985351562, "global_step": 53060, "epoch": 639} {"train_loss": -19.820602416992188, "global_step": 53061, "epoch": 639} {"train_loss": -20.12807273864746, "global_step": 53062, "epoch": 639} {"train_loss": -20.090118408203125, "global_step": 53063, "epoch": 639} {"train_loss": -20.107778549194336, "global_step": 53064, "epoch": 639} {"train_loss": -20.04823875427246, "global_step": 53065, "epoch": 639} {"train_loss": -20.05645751953125, "global_step": 53066, "epoch": 639} {"train_loss": -20.0185604095459, "global_step": 53067, "epoch": 639} {"train_loss": -19.75431251525879, "global_step": 53068, "epoch": 639} {"train_loss": -19.82171630859375, "global_step": 53069, "epoch": 639} {"train_loss": -19.880834579467773, "global_step": 53070, "epoch": 639} {"train_loss": -19.84329605102539, "global_step": 53071, "epoch": 639} {"train_loss": -20.438364028930664, "global_step": 53072, "epoch": 639} {"train_loss": -20.02448844909668, "global_step": 53073, "epoch": 639} {"train_loss": -20.300106048583984, "global_step": 53074, "epoch": 639} {"train_loss": -19.749719619750977, "global_step": 53075, "epoch": 639} {"train_loss": -20.31160545349121, "global_step": 53076, "epoch": 639} {"train_loss": -20.037677764892578, "global_step": 53077, "epoch": 639} {"train_loss": -19.808385848999023, "global_step": 53078, "epoch": 639} {"train_loss": -20.206863403320312, "global_step": 53079, "epoch": 639} {"train_loss": -20.120624542236328, "global_step": 53080, "epoch": 639} {"train_loss": -20.042325973510742, "global_step": 53081, "epoch": 639} {"train_loss": -19.81907081604004, "global_step": 53082, "epoch": 639} {"train_loss": -20.223329544067383, "global_step": 53083, "epoch": 639} {"train_loss": -19.95046043395996, "global_step": 53084, "epoch": 639} {"train_loss": -19.93967056274414, "global_step": 53085, "epoch": 639} {"train_loss": -19.792577743530273, "global_step": 53086, "epoch": 639} {"train_loss": -20.031938552856445, "global_step": 53087, "epoch": 639} {"train_loss": -19.946361541748047, "global_step": 53088, "epoch": 639} {"train_loss": -19.98219871520996, "global_step": 53089, "epoch": 639} {"train_loss": -19.99945640563965, "global_step": 53090, "epoch": 639} {"train_loss": -20.082775115966797, "global_step": 53091, "epoch": 639} {"train_loss": -19.794021606445312, "global_step": 53092, "epoch": 639} {"train_loss": -20.108715057373047, "global_step": 53093, "epoch": 639} {"train_loss": -20.085155487060547, "global_step": 53094, "epoch": 639} {"train_loss": -19.945499420166016, "global_step": 53095, "epoch": 639} {"train_loss": -19.871341705322266, "global_step": 53096, "epoch": 639} {"train_loss": -20.058691024780273, "global_step": 53097, "epoch": 639} {"train_loss": -20.092931747436523, "global_step": 53098, "epoch": 639} {"train_loss": -19.814245223999023, "global_step": 53099, "epoch": 639} {"train_loss": -20.472625732421875, "global_step": 53100, "epoch": 639} {"train_loss": -20.20132064819336, "global_step": 53101, "epoch": 639} {"train_loss": -20.282033920288086, "global_step": 53102, "epoch": 639} {"train_loss": -20.052093505859375, "global_step": 53103, "epoch": 639} {"train_loss": -20.12784194946289, "global_step": 53104, "epoch": 639} {"train_loss": -20.417062759399414, "global_step": 53105, "epoch": 639} {"train_loss": -20.06412696838379, "global_step": 53106, "epoch": 639} {"train_loss": -20.029033660888672, "global_step": 53107, "epoch": 639} {"train_loss": -20.124601364135742, "global_step": 53108, "epoch": 639} {"train_loss": -19.95371437072754, "global_step": 53109, "epoch": 639} {"train_loss": -20.009597778320312, "global_step": 53110, "epoch": 639} {"train_loss": -20.299270629882812, "global_step": 53111, "epoch": 639} {"train_loss": -20.0473575592041, "global_step": 53112, "epoch": 639} {"train_loss": -19.56672477722168, "global_step": 53113, "epoch": 639} {"train_loss": -20.02988624572754, "global_step": 53114, "epoch": 639} {"train_loss": -20.04888343811035, "global_step": 53115, "epoch": 639} {"train_loss": -19.92930030822754, "global_step": 53116, "epoch": 639} {"train_loss": -20.0506534576416, "global_step": 53117, "epoch": 639} {"train_loss": -20.011266708374023, "global_step": 53118, "epoch": 639} {"train_loss": -20.00190010990005, "global_step": 53119, "epoch": 639, "val_loss": 5809531.5} {"train_loss": -20.15312385559082, "global_step": 53120, "epoch": 640} {"train_loss": -19.91830825805664, "global_step": 53121, "epoch": 640} {"train_loss": -19.897985458374023, "global_step": 53122, "epoch": 640} {"train_loss": -19.52388572692871, "global_step": 53123, "epoch": 640} {"train_loss": -19.917057037353516, "global_step": 53124, "epoch": 640} {"train_loss": -19.68605613708496, "global_step": 53125, "epoch": 640} {"train_loss": -20.03839683532715, "global_step": 53126, "epoch": 640} {"train_loss": -19.92681884765625, "global_step": 53127, "epoch": 640} {"train_loss": -19.830007553100586, "global_step": 53128, "epoch": 640} {"train_loss": -19.907991409301758, "global_step": 53129, "epoch": 640} {"train_loss": -20.004194259643555, "global_step": 53130, "epoch": 640} {"train_loss": -20.549720764160156, "global_step": 53131, "epoch": 640} {"train_loss": -19.99408531188965, "global_step": 53132, "epoch": 640} {"train_loss": -20.393096923828125, "global_step": 53133, "epoch": 640} {"train_loss": -19.925365447998047, "global_step": 53134, "epoch": 640} {"train_loss": -19.959735870361328, "global_step": 53135, "epoch": 640} {"train_loss": -20.046546936035156, "global_step": 53136, "epoch": 640} {"train_loss": -20.023662567138672, "global_step": 53137, "epoch": 640} {"train_loss": -19.726064682006836, "global_step": 53138, "epoch": 640} {"train_loss": -19.775876998901367, "global_step": 53139, "epoch": 640} {"train_loss": -20.37489891052246, "global_step": 53140, "epoch": 640} {"train_loss": -19.96259117126465, "global_step": 53141, "epoch": 640} {"train_loss": -20.12302017211914, "global_step": 53142, "epoch": 640} {"train_loss": -20.381656646728516, "global_step": 53143, "epoch": 640} {"train_loss": -20.279165267944336, "global_step": 53144, "epoch": 640} {"train_loss": -20.269575119018555, "global_step": 53145, "epoch": 640} {"train_loss": -19.94509506225586, "global_step": 53146, "epoch": 640} {"train_loss": -20.376708984375, "global_step": 53147, "epoch": 640} {"train_loss": -20.387996673583984, "global_step": 53148, "epoch": 640} {"train_loss": -19.91047477722168, "global_step": 53149, "epoch": 640} {"train_loss": -20.05245018005371, "global_step": 53150, "epoch": 640} {"train_loss": -20.071020126342773, "global_step": 53151, "epoch": 640} {"train_loss": -19.66584587097168, "global_step": 53152, "epoch": 640} {"train_loss": -19.779041290283203, "global_step": 53153, "epoch": 640} {"train_loss": -19.985258102416992, "global_step": 53154, "epoch": 640} {"train_loss": -19.96558952331543, "global_step": 53155, "epoch": 640} {"train_loss": -20.335729598999023, "global_step": 53156, "epoch": 640} {"train_loss": -19.77458381652832, "global_step": 53157, "epoch": 640} {"train_loss": -20.12918472290039, "global_step": 53158, "epoch": 640} {"train_loss": -20.190364837646484, "global_step": 53159, "epoch": 640} {"train_loss": -20.18536376953125, "global_step": 53160, "epoch": 640} {"train_loss": -20.162450790405273, "global_step": 53161, "epoch": 640} {"train_loss": -19.749906539916992, "global_step": 53162, "epoch": 640} {"train_loss": -20.07364273071289, "global_step": 53163, "epoch": 640} {"train_loss": -20.317773818969727, "global_step": 53164, "epoch": 640} {"train_loss": -20.057754516601562, "global_step": 53165, "epoch": 640} {"train_loss": -20.241321563720703, "global_step": 53166, "epoch": 640} {"train_loss": -19.99134063720703, "global_step": 53167, "epoch": 640} {"train_loss": -20.13856315612793, "global_step": 53168, "epoch": 640} {"train_loss": -19.918399810791016, "global_step": 53169, "epoch": 640} {"train_loss": -20.116348266601562, "global_step": 53170, "epoch": 640} {"train_loss": -20.124347686767578, "global_step": 53171, "epoch": 640} {"train_loss": -20.0766658782959, "global_step": 53172, "epoch": 640} {"train_loss": -20.152027130126953, "global_step": 53173, "epoch": 640} {"train_loss": -20.348207473754883, "global_step": 53174, "epoch": 640} {"train_loss": -20.06821632385254, "global_step": 53175, "epoch": 640} {"train_loss": -20.016084671020508, "global_step": 53176, "epoch": 640} {"train_loss": -20.10501480102539, "global_step": 53177, "epoch": 640} {"train_loss": -20.545976638793945, "global_step": 53178, "epoch": 640} {"train_loss": -20.10051155090332, "global_step": 53179, "epoch": 640} {"train_loss": -20.23898696899414, "global_step": 53180, "epoch": 640} {"train_loss": -20.001256942749023, "global_step": 53181, "epoch": 640} {"train_loss": -19.88123893737793, "global_step": 53182, "epoch": 640} {"train_loss": -20.24866485595703, "global_step": 53183, "epoch": 640} {"train_loss": -20.132835388183594, "global_step": 53184, "epoch": 640} {"train_loss": -20.03861427307129, "global_step": 53185, "epoch": 640} {"train_loss": -20.135828018188477, "global_step": 53186, "epoch": 640} {"train_loss": -19.91854476928711, "global_step": 53187, "epoch": 640} {"train_loss": -20.168716430664062, "global_step": 53188, "epoch": 640} {"train_loss": -20.313146591186523, "global_step": 53189, "epoch": 640} {"train_loss": -20.07570457458496, "global_step": 53190, "epoch": 640} {"train_loss": -20.552406311035156, "global_step": 53191, "epoch": 640} {"train_loss": -20.41254997253418, "global_step": 53192, "epoch": 640} {"train_loss": -20.10915184020996, "global_step": 53193, "epoch": 640} {"train_loss": -20.22840690612793, "global_step": 53194, "epoch": 640} {"train_loss": -19.938413619995117, "global_step": 53195, "epoch": 640} {"train_loss": -19.902563095092773, "global_step": 53196, "epoch": 640} {"train_loss": -20.174070358276367, "global_step": 53197, "epoch": 640} {"train_loss": -20.313379287719727, "global_step": 53198, "epoch": 640} {"train_loss": -20.07517433166504, "global_step": 53199, "epoch": 640} {"train_loss": -19.82708168029785, "global_step": 53200, "epoch": 640} {"train_loss": -20.27374839782715, "global_step": 53201, "epoch": 640} {"train_loss": -20.08795984107328, "global_step": 53202, "epoch": 640, "val_loss": 5978498.5} {"train_loss": -20.08077049255371, "global_step": 53203, "epoch": 641} {"train_loss": -19.546239852905273, "global_step": 53204, "epoch": 641} {"train_loss": -19.86514663696289, "global_step": 53205, "epoch": 641} {"train_loss": -20.032604217529297, "global_step": 53206, "epoch": 641} {"train_loss": -19.5797061920166, "global_step": 53207, "epoch": 641} {"train_loss": -19.890411376953125, "global_step": 53208, "epoch": 641} {"train_loss": -19.962759017944336, "global_step": 53209, "epoch": 641} {"train_loss": -19.755584716796875, "global_step": 53210, "epoch": 641} {"train_loss": -19.54804039001465, "global_step": 53211, "epoch": 641} {"train_loss": -20.327911376953125, "global_step": 53212, "epoch": 641} {"train_loss": -20.411142349243164, "global_step": 53213, "epoch": 641} {"train_loss": -19.93865966796875, "global_step": 53214, "epoch": 641} {"train_loss": -20.323362350463867, "global_step": 53215, "epoch": 641} {"train_loss": -19.75482177734375, "global_step": 53216, "epoch": 641} {"train_loss": -19.73238182067871, "global_step": 53217, "epoch": 641} {"train_loss": -19.70690155029297, "global_step": 53218, "epoch": 641} {"train_loss": -20.10462188720703, "global_step": 53219, "epoch": 641} {"train_loss": -20.07697868347168, "global_step": 53220, "epoch": 641} {"train_loss": -19.961257934570312, "global_step": 53221, "epoch": 641} {"train_loss": -20.284170150756836, "global_step": 53222, "epoch": 641} {"train_loss": -19.962461471557617, "global_step": 53223, "epoch": 641} {"train_loss": -20.058462142944336, "global_step": 53224, "epoch": 641} {"train_loss": -20.089740753173828, "global_step": 53225, "epoch": 641} {"train_loss": -20.166196823120117, "global_step": 53226, "epoch": 641} {"train_loss": -19.89496612548828, "global_step": 53227, "epoch": 641} {"train_loss": -20.123626708984375, "global_step": 53228, "epoch": 641} {"train_loss": -20.104475021362305, "global_step": 53229, "epoch": 641} {"train_loss": -20.139429092407227, "global_step": 53230, "epoch": 641} {"train_loss": -20.235733032226562, "global_step": 53231, "epoch": 641} {"train_loss": -20.195568084716797, "global_step": 53232, "epoch": 641} {"train_loss": -20.134098052978516, "global_step": 53233, "epoch": 641} {"train_loss": -20.278533935546875, "global_step": 53234, "epoch": 641} {"train_loss": -20.183334350585938, "global_step": 53235, "epoch": 641} {"train_loss": -19.908964157104492, "global_step": 53236, "epoch": 641} {"train_loss": -20.165578842163086, "global_step": 53237, "epoch": 641} {"train_loss": -19.728544235229492, "global_step": 53238, "epoch": 641} {"train_loss": -20.472515106201172, "global_step": 53239, "epoch": 641} {"train_loss": -20.224435806274414, "global_step": 53240, "epoch": 641} {"train_loss": -20.268272399902344, "global_step": 53241, "epoch": 641} {"train_loss": -20.02681541442871, "global_step": 53242, "epoch": 641} {"train_loss": -19.91623878479004, "global_step": 53243, "epoch": 641} {"train_loss": -19.96904945373535, "global_step": 53244, "epoch": 641} {"train_loss": -20.235610961914062, "global_step": 53245, "epoch": 641} {"train_loss": -20.108623504638672, "global_step": 53246, "epoch": 641} {"train_loss": -20.085296630859375, "global_step": 53247, "epoch": 641} {"train_loss": -20.298961639404297, "global_step": 53248, "epoch": 641} {"train_loss": -19.896352767944336, "global_step": 53249, "epoch": 641} {"train_loss": -20.15912437438965, "global_step": 53250, "epoch": 641} {"train_loss": -20.291975021362305, "global_step": 53251, "epoch": 641} {"train_loss": -20.24066162109375, "global_step": 53252, "epoch": 641} {"train_loss": -20.125328063964844, "global_step": 53253, "epoch": 641} {"train_loss": -20.106048583984375, "global_step": 53254, "epoch": 641} {"train_loss": -20.280658721923828, "global_step": 53255, "epoch": 641} {"train_loss": -20.044023513793945, "global_step": 53256, "epoch": 641} {"train_loss": -20.057193756103516, "global_step": 53257, "epoch": 641} {"train_loss": -20.4290828704834, "global_step": 53258, "epoch": 641} {"train_loss": -20.0610408782959, "global_step": 53259, "epoch": 641} {"train_loss": -19.8889102935791, "global_step": 53260, "epoch": 641} {"train_loss": -20.030637741088867, "global_step": 53261, "epoch": 641} {"train_loss": -20.13446617126465, "global_step": 53262, "epoch": 641} {"train_loss": -20.157459259033203, "global_step": 53263, "epoch": 641} {"train_loss": -20.331741333007812, "global_step": 53264, "epoch": 641} {"train_loss": -19.71721076965332, "global_step": 53265, "epoch": 641} {"train_loss": -19.887073516845703, "global_step": 53266, "epoch": 641} {"train_loss": -20.05023956298828, "global_step": 53267, "epoch": 641} {"train_loss": -19.92520523071289, "global_step": 53268, "epoch": 641} {"train_loss": -20.07973861694336, "global_step": 53269, "epoch": 641} {"train_loss": -20.02434730529785, "global_step": 53270, "epoch": 641} {"train_loss": -20.035253524780273, "global_step": 53271, "epoch": 641} {"train_loss": -20.081300735473633, "global_step": 53272, "epoch": 641} {"train_loss": -20.060468673706055, "global_step": 53273, "epoch": 641} {"train_loss": -19.724491119384766, "global_step": 53274, "epoch": 641} {"train_loss": -20.16497230529785, "global_step": 53275, "epoch": 641} {"train_loss": -20.199758529663086, "global_step": 53276, "epoch": 641} {"train_loss": -19.986854553222656, "global_step": 53277, "epoch": 641} {"train_loss": -20.209266662597656, "global_step": 53278, "epoch": 641} {"train_loss": -20.16352081298828, "global_step": 53279, "epoch": 641} {"train_loss": -20.09339714050293, "global_step": 53280, "epoch": 641} {"train_loss": -20.121734619140625, "global_step": 53281, "epoch": 641} {"train_loss": -20.28386878967285, "global_step": 53282, "epoch": 641} {"train_loss": -19.973867416381836, "global_step": 53283, "epoch": 641} {"train_loss": -20.007654190063477, "global_step": 53284, "epoch": 641} {"train_loss": -20.054087144782745, "global_step": 53285, "epoch": 641, "val_loss": 5826627.0} {"train_loss": -19.01692008972168, "global_step": 53286, "epoch": 642} {"train_loss": -19.041229248046875, "global_step": 53287, "epoch": 642} {"train_loss": -19.636503219604492, "global_step": 53288, "epoch": 642} {"train_loss": -19.358570098876953, "global_step": 53289, "epoch": 642} {"train_loss": -20.087257385253906, "global_step": 53290, "epoch": 642} {"train_loss": -19.424367904663086, "global_step": 53291, "epoch": 642} {"train_loss": -19.691587448120117, "global_step": 53292, "epoch": 642} {"train_loss": -19.730398178100586, "global_step": 53293, "epoch": 642} {"train_loss": -19.938806533813477, "global_step": 53294, "epoch": 642} {"train_loss": -19.26465606689453, "global_step": 53295, "epoch": 642} {"train_loss": -19.861671447753906, "global_step": 53296, "epoch": 642} {"train_loss": -19.70354461669922, "global_step": 53297, "epoch": 642} {"train_loss": -19.702362060546875, "global_step": 53298, "epoch": 642} {"train_loss": -20.02617073059082, "global_step": 53299, "epoch": 642} {"train_loss": -19.781938552856445, "global_step": 53300, "epoch": 642} {"train_loss": -20.065587997436523, "global_step": 53301, "epoch": 642} {"train_loss": -20.295570373535156, "global_step": 53302, "epoch": 642} {"train_loss": -19.698034286499023, "global_step": 53303, "epoch": 642} {"train_loss": -19.798757553100586, "global_step": 53304, "epoch": 642} {"train_loss": -20.209680557250977, "global_step": 53305, "epoch": 642} {"train_loss": -19.82865333557129, "global_step": 53306, "epoch": 642} {"train_loss": -20.25813102722168, "global_step": 53307, "epoch": 642} {"train_loss": -20.040632247924805, "global_step": 53308, "epoch": 642} {"train_loss": -19.95416259765625, "global_step": 53309, "epoch": 642} {"train_loss": -20.06549644470215, "global_step": 53310, "epoch": 642} {"train_loss": -20.458599090576172, "global_step": 53311, "epoch": 642} {"train_loss": -20.241422653198242, "global_step": 53312, "epoch": 642} {"train_loss": -20.238792419433594, "global_step": 53313, "epoch": 642} {"train_loss": -20.069042205810547, "global_step": 53314, "epoch": 642} {"train_loss": -19.665822982788086, "global_step": 53315, "epoch": 642} {"train_loss": -20.066804885864258, "global_step": 53316, "epoch": 642} {"train_loss": -20.221969604492188, "global_step": 53317, "epoch": 642} {"train_loss": -20.337982177734375, "global_step": 53318, "epoch": 642} {"train_loss": -20.332387924194336, "global_step": 53319, "epoch": 642} {"train_loss": -20.01554298400879, "global_step": 53320, "epoch": 642} {"train_loss": -19.585290908813477, "global_step": 53321, "epoch": 642} {"train_loss": -20.182004928588867, "global_step": 53322, "epoch": 642} {"train_loss": -20.033063888549805, "global_step": 53323, "epoch": 642} {"train_loss": -20.19681167602539, "global_step": 53324, "epoch": 642} {"train_loss": -19.828907012939453, "global_step": 53325, "epoch": 642} {"train_loss": -19.823963165283203, "global_step": 53326, "epoch": 642} {"train_loss": -20.198715209960938, "global_step": 53327, "epoch": 642} {"train_loss": -19.6314640045166, "global_step": 53328, "epoch": 642} {"train_loss": -19.8846435546875, "global_step": 53329, "epoch": 642} {"train_loss": -20.32118797302246, "global_step": 53330, "epoch": 642} {"train_loss": -19.960529327392578, "global_step": 53331, "epoch": 642} {"train_loss": -20.490524291992188, "global_step": 53332, "epoch": 642} {"train_loss": -20.117155075073242, "global_step": 53333, "epoch": 642} {"train_loss": -19.89517593383789, "global_step": 53334, "epoch": 642} {"train_loss": -20.308942794799805, "global_step": 53335, "epoch": 642} {"train_loss": -20.35479164123535, "global_step": 53336, "epoch": 642} {"train_loss": -20.27020835876465, "global_step": 53337, "epoch": 642} {"train_loss": -20.26869773864746, "global_step": 53338, "epoch": 642} {"train_loss": -20.07967185974121, "global_step": 53339, "epoch": 642} {"train_loss": -19.94917869567871, "global_step": 53340, "epoch": 642} {"train_loss": -20.154043197631836, "global_step": 53341, "epoch": 642} {"train_loss": -20.52223014831543, "global_step": 53342, "epoch": 642} {"train_loss": -20.073896408081055, "global_step": 53343, "epoch": 642} {"train_loss": -19.86226463317871, "global_step": 53344, "epoch": 642} {"train_loss": -20.175617218017578, "global_step": 53345, "epoch": 642} {"train_loss": -20.462366104125977, "global_step": 53346, "epoch": 642} {"train_loss": -20.5419979095459, "global_step": 53347, "epoch": 642} {"train_loss": -20.137619018554688, "global_step": 53348, "epoch": 642} {"train_loss": -20.098264694213867, "global_step": 53349, "epoch": 642} {"train_loss": -20.18501853942871, "global_step": 53350, "epoch": 642} {"train_loss": -20.047521591186523, "global_step": 53351, "epoch": 642} {"train_loss": -20.061325073242188, "global_step": 53352, "epoch": 642} {"train_loss": -19.930845260620117, "global_step": 53353, "epoch": 642} {"train_loss": -20.22919273376465, "global_step": 53354, "epoch": 642} {"train_loss": -19.982572555541992, "global_step": 53355, "epoch": 642} {"train_loss": -19.605175018310547, "global_step": 53356, "epoch": 642} {"train_loss": -19.915006637573242, "global_step": 53357, "epoch": 642} {"train_loss": -19.921682357788086, "global_step": 53358, "epoch": 642} {"train_loss": -20.258533477783203, "global_step": 53359, "epoch": 642} {"train_loss": -20.223281860351562, "global_step": 53360, "epoch": 642} {"train_loss": -19.953258514404297, "global_step": 53361, "epoch": 642} {"train_loss": -20.03598976135254, "global_step": 53362, "epoch": 642} {"train_loss": -19.945873260498047, "global_step": 53363, "epoch": 642} {"train_loss": -20.32916259765625, "global_step": 53364, "epoch": 642} {"train_loss": -19.85817527770996, "global_step": 53365, "epoch": 642} {"train_loss": -19.873783111572266, "global_step": 53366, "epoch": 642} {"train_loss": -20.13993263244629, "global_step": 53367, "epoch": 642} {"train_loss": -20.012472819132977, "global_step": 53368, "epoch": 642, "val_loss": 6014846.5} {"train_loss": -19.839399337768555, "global_step": 53369, "epoch": 643} {"train_loss": -20.150794982910156, "global_step": 53370, "epoch": 643} {"train_loss": -20.0494384765625, "global_step": 53371, "epoch": 643} {"train_loss": -19.78171157836914, "global_step": 53372, "epoch": 643} {"train_loss": -19.715734481811523, "global_step": 53373, "epoch": 643} {"train_loss": -19.974868774414062, "global_step": 53374, "epoch": 643} {"train_loss": -19.994762420654297, "global_step": 53375, "epoch": 643} {"train_loss": -19.980422973632812, "global_step": 53376, "epoch": 643} {"train_loss": -19.906288146972656, "global_step": 53377, "epoch": 643} {"train_loss": -20.21809959411621, "global_step": 53378, "epoch": 643} {"train_loss": -20.093313217163086, "global_step": 53379, "epoch": 643} {"train_loss": -20.06036949157715, "global_step": 53380, "epoch": 643} {"train_loss": -20.039880752563477, "global_step": 53381, "epoch": 643} {"train_loss": -20.00294303894043, "global_step": 53382, "epoch": 643} {"train_loss": -20.01447105407715, "global_step": 53383, "epoch": 643} {"train_loss": -19.96266746520996, "global_step": 53384, "epoch": 643} {"train_loss": -19.960081100463867, "global_step": 53385, "epoch": 643} {"train_loss": -19.860618591308594, "global_step": 53386, "epoch": 643} {"train_loss": -20.064050674438477, "global_step": 53387, "epoch": 643} {"train_loss": -20.062978744506836, "global_step": 53388, "epoch": 643} {"train_loss": -20.21749496459961, "global_step": 53389, "epoch": 643} {"train_loss": -20.32289695739746, "global_step": 53390, "epoch": 643} {"train_loss": -20.045297622680664, "global_step": 53391, "epoch": 643} {"train_loss": -19.95086097717285, "global_step": 53392, "epoch": 643} {"train_loss": -20.062101364135742, "global_step": 53393, "epoch": 643} {"train_loss": -20.285818099975586, "global_step": 53394, "epoch": 643} {"train_loss": -20.263763427734375, "global_step": 53395, "epoch": 643} {"train_loss": -19.893590927124023, "global_step": 53396, "epoch": 643} {"train_loss": -20.168760299682617, "global_step": 53397, "epoch": 643} {"train_loss": -20.361434936523438, "global_step": 53398, "epoch": 643} {"train_loss": -19.81901741027832, "global_step": 53399, "epoch": 643} {"train_loss": -20.077260971069336, "global_step": 53400, "epoch": 643} {"train_loss": -20.198139190673828, "global_step": 53401, "epoch": 643} {"train_loss": -19.908315658569336, "global_step": 53402, "epoch": 643} {"train_loss": -19.433399200439453, "global_step": 53403, "epoch": 643} {"train_loss": -19.858211517333984, "global_step": 53404, "epoch": 643} {"train_loss": -20.0334415435791, "global_step": 53405, "epoch": 643} {"train_loss": -20.097814559936523, "global_step": 53406, "epoch": 643} {"train_loss": -20.156362533569336, "global_step": 53407, "epoch": 643} {"train_loss": -20.20621109008789, "global_step": 53408, "epoch": 643} {"train_loss": -20.12537956237793, "global_step": 53409, "epoch": 643} {"train_loss": -19.86358642578125, "global_step": 53410, "epoch": 643} {"train_loss": -20.396745681762695, "global_step": 53411, "epoch": 643} {"train_loss": -20.247400283813477, "global_step": 53412, "epoch": 643} {"train_loss": -20.38530731201172, "global_step": 53413, "epoch": 643} {"train_loss": -20.242164611816406, "global_step": 53414, "epoch": 643} {"train_loss": -19.977294921875, "global_step": 53415, "epoch": 643} {"train_loss": -20.10324478149414, "global_step": 53416, "epoch": 643} {"train_loss": -20.059354782104492, "global_step": 53417, "epoch": 643} {"train_loss": -20.028684616088867, "global_step": 53418, "epoch": 643} {"train_loss": -19.978548049926758, "global_step": 53419, "epoch": 643} {"train_loss": -20.256406784057617, "global_step": 53420, "epoch": 643} {"train_loss": -20.481475830078125, "global_step": 53421, "epoch": 643} {"train_loss": -20.164905548095703, "global_step": 53422, "epoch": 643} {"train_loss": -20.045700073242188, "global_step": 53423, "epoch": 643} {"train_loss": -20.31775665283203, "global_step": 53424, "epoch": 643} {"train_loss": -20.15993309020996, "global_step": 53425, "epoch": 643} {"train_loss": -19.965993881225586, "global_step": 53426, "epoch": 643} {"train_loss": -20.161420822143555, "global_step": 53427, "epoch": 643} {"train_loss": -19.92482566833496, "global_step": 53428, "epoch": 643} {"train_loss": -19.922775268554688, "global_step": 53429, "epoch": 643} {"train_loss": -19.83736228942871, "global_step": 53430, "epoch": 643} {"train_loss": -19.956342697143555, "global_step": 53431, "epoch": 643} {"train_loss": -19.982959747314453, "global_step": 53432, "epoch": 643} {"train_loss": -19.915332794189453, "global_step": 53433, "epoch": 643} {"train_loss": -19.795352935791016, "global_step": 53434, "epoch": 643} {"train_loss": -20.42113494873047, "global_step": 53435, "epoch": 643} {"train_loss": -19.72567367553711, "global_step": 53436, "epoch": 643} {"train_loss": -20.151622772216797, "global_step": 53437, "epoch": 643} {"train_loss": -19.8222713470459, "global_step": 53438, "epoch": 643} {"train_loss": -20.02033233642578, "global_step": 53439, "epoch": 643} {"train_loss": -20.539762496948242, "global_step": 53440, "epoch": 643} {"train_loss": -20.14906120300293, "global_step": 53441, "epoch": 643} {"train_loss": -20.39491844177246, "global_step": 53442, "epoch": 643} {"train_loss": -19.943580627441406, "global_step": 53443, "epoch": 643} {"train_loss": -20.037267684936523, "global_step": 53444, "epoch": 643} {"train_loss": -19.770904541015625, "global_step": 53445, "epoch": 643} {"train_loss": -20.052663803100586, "global_step": 53446, "epoch": 643} {"train_loss": -20.280704498291016, "global_step": 53447, "epoch": 643} {"train_loss": -19.981618881225586, "global_step": 53448, "epoch": 643} {"train_loss": -19.869831085205078, "global_step": 53449, "epoch": 643} {"train_loss": -19.856491088867188, "global_step": 53450, "epoch": 643} {"train_loss": -20.070791796029333, "global_step": 53451, "epoch": 643, "val_loss": 6022259.0} {"train_loss": -19.738142013549805, "global_step": 53452, "epoch": 644} {"train_loss": -19.85627555847168, "global_step": 53453, "epoch": 644} {"train_loss": -19.986364364624023, "global_step": 53454, "epoch": 644} {"train_loss": -19.742042541503906, "global_step": 53455, "epoch": 644} {"train_loss": -19.959224700927734, "global_step": 53456, "epoch": 644} {"train_loss": -19.762914657592773, "global_step": 53457, "epoch": 644} {"train_loss": -20.049463272094727, "global_step": 53458, "epoch": 644} {"train_loss": -20.43796157836914, "global_step": 53459, "epoch": 644} {"train_loss": -19.739643096923828, "global_step": 53460, "epoch": 644} {"train_loss": -19.80135154724121, "global_step": 53461, "epoch": 644} {"train_loss": -20.065113067626953, "global_step": 53462, "epoch": 644} {"train_loss": -19.99408531188965, "global_step": 53463, "epoch": 644} {"train_loss": -19.8081111907959, "global_step": 53464, "epoch": 644} {"train_loss": -20.040420532226562, "global_step": 53465, "epoch": 644} {"train_loss": -19.956541061401367, "global_step": 53466, "epoch": 644} {"train_loss": -19.932254791259766, "global_step": 53467, "epoch": 644} {"train_loss": -20.194644927978516, "global_step": 53468, "epoch": 644} {"train_loss": -19.904741287231445, "global_step": 53469, "epoch": 644} {"train_loss": -20.048608779907227, "global_step": 53470, "epoch": 644} {"train_loss": -20.430408477783203, "global_step": 53471, "epoch": 644} {"train_loss": -19.730154037475586, "global_step": 53472, "epoch": 644} {"train_loss": -20.104957580566406, "global_step": 53473, "epoch": 644} {"train_loss": -20.12883758544922, "global_step": 53474, "epoch": 644} {"train_loss": -19.982986450195312, "global_step": 53475, "epoch": 644} {"train_loss": -20.096323013305664, "global_step": 53476, "epoch": 644} {"train_loss": -19.705608367919922, "global_step": 53477, "epoch": 644} {"train_loss": -19.969568252563477, "global_step": 53478, "epoch": 644} {"train_loss": -19.857168197631836, "global_step": 53479, "epoch": 644} {"train_loss": -19.72321891784668, "global_step": 53480, "epoch": 644} {"train_loss": -19.776851654052734, "global_step": 53481, "epoch": 644} {"train_loss": -20.35260581970215, "global_step": 53482, "epoch": 644} {"train_loss": -20.103158950805664, "global_step": 53483, "epoch": 644} {"train_loss": -20.143211364746094, "global_step": 53484, "epoch": 644} {"train_loss": -19.917343139648438, "global_step": 53485, "epoch": 644} {"train_loss": -20.339313507080078, "global_step": 53486, "epoch": 644} {"train_loss": -19.93459129333496, "global_step": 53487, "epoch": 644} {"train_loss": -20.176435470581055, "global_step": 53488, "epoch": 644} {"train_loss": -19.642990112304688, "global_step": 53489, "epoch": 644} {"train_loss": -19.9376277923584, "global_step": 53490, "epoch": 644} {"train_loss": -19.936063766479492, "global_step": 53491, "epoch": 644} {"train_loss": -19.666784286499023, "global_step": 53492, "epoch": 644} {"train_loss": -20.23386001586914, "global_step": 53493, "epoch": 644} {"train_loss": -20.349002838134766, "global_step": 53494, "epoch": 644} {"train_loss": -20.056299209594727, "global_step": 53495, "epoch": 644} {"train_loss": -19.927534103393555, "global_step": 53496, "epoch": 644} {"train_loss": -20.192520141601562, "global_step": 53497, "epoch": 644} {"train_loss": -20.206266403198242, "global_step": 53498, "epoch": 644} {"train_loss": -20.156356811523438, "global_step": 53499, "epoch": 644} {"train_loss": -20.023334503173828, "global_step": 53500, "epoch": 644} {"train_loss": -20.032154083251953, "global_step": 53501, "epoch": 644} {"train_loss": -20.22725486755371, "global_step": 53502, "epoch": 644} {"train_loss": -20.011777877807617, "global_step": 53503, "epoch": 644} {"train_loss": -19.960412979125977, "global_step": 53504, "epoch": 644} {"train_loss": -19.65535545349121, "global_step": 53505, "epoch": 644} {"train_loss": -20.32661247253418, "global_step": 53506, "epoch": 644} {"train_loss": -20.15974998474121, "global_step": 53507, "epoch": 644} {"train_loss": -20.240726470947266, "global_step": 53508, "epoch": 644} {"train_loss": -20.02445411682129, "global_step": 53509, "epoch": 644} {"train_loss": -20.03268814086914, "global_step": 53510, "epoch": 644} {"train_loss": -20.224246978759766, "global_step": 53511, "epoch": 644} {"train_loss": -20.019001007080078, "global_step": 53512, "epoch": 644} {"train_loss": -20.05209732055664, "global_step": 53513, "epoch": 644} {"train_loss": -20.07088279724121, "global_step": 53514, "epoch": 644} {"train_loss": -20.376541137695312, "global_step": 53515, "epoch": 644} {"train_loss": -20.31793785095215, "global_step": 53516, "epoch": 644} {"train_loss": -19.71919059753418, "global_step": 53517, "epoch": 644} {"train_loss": -19.827625274658203, "global_step": 53518, "epoch": 644} {"train_loss": -20.13099479675293, "global_step": 53519, "epoch": 644} {"train_loss": -20.11904525756836, "global_step": 53520, "epoch": 644} {"train_loss": -20.046247482299805, "global_step": 53521, "epoch": 644} {"train_loss": -20.471609115600586, "global_step": 53522, "epoch": 644} {"train_loss": -20.38619041442871, "global_step": 53523, "epoch": 644} {"train_loss": -20.249692916870117, "global_step": 53524, "epoch": 644} {"train_loss": -20.151782989501953, "global_step": 53525, "epoch": 644} {"train_loss": -20.024343490600586, "global_step": 53526, "epoch": 644} {"train_loss": -20.248722076416016, "global_step": 53527, "epoch": 644} {"train_loss": -20.219974517822266, "global_step": 53528, "epoch": 644} {"train_loss": -20.32831382751465, "global_step": 53529, "epoch": 644} {"train_loss": -20.30765151977539, "global_step": 53530, "epoch": 644} {"train_loss": -20.058256149291992, "global_step": 53531, "epoch": 644} {"train_loss": -20.27484703063965, "global_step": 53532, "epoch": 644} {"train_loss": -20.291257858276367, "global_step": 53533, "epoch": 644} {"train_loss": -20.059017135436278, "global_step": 53534, "epoch": 644, "val_loss": 5884482.0} {"train_loss": -19.605010986328125, "global_step": 53535, "epoch": 645} {"train_loss": -19.813596725463867, "global_step": 53536, "epoch": 645} {"train_loss": -19.711002349853516, "global_step": 53537, "epoch": 645} {"train_loss": -20.032100677490234, "global_step": 53538, "epoch": 645} {"train_loss": -19.8179931640625, "global_step": 53539, "epoch": 645} {"train_loss": -19.86322784423828, "global_step": 53540, "epoch": 645} {"train_loss": -20.226110458374023, "global_step": 53541, "epoch": 645} {"train_loss": -20.14632225036621, "global_step": 53542, "epoch": 645} {"train_loss": -20.118125915527344, "global_step": 53543, "epoch": 645} {"train_loss": -19.419973373413086, "global_step": 53544, "epoch": 645} {"train_loss": -19.93216896057129, "global_step": 53545, "epoch": 645} {"train_loss": -19.850614547729492, "global_step": 53546, "epoch": 645} {"train_loss": -19.75986671447754, "global_step": 53547, "epoch": 645} {"train_loss": -19.777610778808594, "global_step": 53548, "epoch": 645} {"train_loss": -19.733928680419922, "global_step": 53549, "epoch": 645} {"train_loss": -20.29766845703125, "global_step": 53550, "epoch": 645} {"train_loss": -19.99970245361328, "global_step": 53551, "epoch": 645} {"train_loss": -19.932035446166992, "global_step": 53552, "epoch": 645} {"train_loss": -19.77754020690918, "global_step": 53553, "epoch": 645} {"train_loss": -19.88739585876465, "global_step": 53554, "epoch": 645} {"train_loss": -20.049774169921875, "global_step": 53555, "epoch": 645} {"train_loss": -19.92871856689453, "global_step": 53556, "epoch": 645} {"train_loss": -20.113523483276367, "global_step": 53557, "epoch": 645} {"train_loss": -20.255184173583984, "global_step": 53558, "epoch": 645} {"train_loss": -20.31300926208496, "global_step": 53559, "epoch": 645} {"train_loss": -20.112987518310547, "global_step": 53560, "epoch": 645} {"train_loss": -19.89927101135254, "global_step": 53561, "epoch": 645} {"train_loss": -20.256620407104492, "global_step": 53562, "epoch": 645} {"train_loss": -20.126436233520508, "global_step": 53563, "epoch": 645} {"train_loss": -20.743927001953125, "global_step": 53564, "epoch": 645} {"train_loss": -20.038549423217773, "global_step": 53565, "epoch": 645} {"train_loss": -20.309282302856445, "global_step": 53566, "epoch": 645} {"train_loss": -20.208303451538086, "global_step": 53567, "epoch": 645} {"train_loss": -20.014902114868164, "global_step": 53568, "epoch": 645} {"train_loss": -20.10004997253418, "global_step": 53569, "epoch": 645} {"train_loss": -19.974105834960938, "global_step": 53570, "epoch": 645} {"train_loss": -20.165029525756836, "global_step": 53571, "epoch": 645} {"train_loss": -20.142826080322266, "global_step": 53572, "epoch": 645} {"train_loss": -20.26557731628418, "global_step": 53573, "epoch": 645} {"train_loss": -19.816211700439453, "global_step": 53574, "epoch": 645} {"train_loss": -20.07831382751465, "global_step": 53575, "epoch": 645} {"train_loss": -20.212299346923828, "global_step": 53576, "epoch": 645} {"train_loss": -19.825681686401367, "global_step": 53577, "epoch": 645} {"train_loss": -20.32865333557129, "global_step": 53578, "epoch": 645} {"train_loss": -19.962942123413086, "global_step": 53579, "epoch": 645} {"train_loss": -19.984947204589844, "global_step": 53580, "epoch": 645} {"train_loss": -20.210914611816406, "global_step": 53581, "epoch": 645} {"train_loss": -20.29522132873535, "global_step": 53582, "epoch": 645} {"train_loss": -20.25946617126465, "global_step": 53583, "epoch": 645} {"train_loss": -20.108142852783203, "global_step": 53584, "epoch": 645} {"train_loss": -20.023832321166992, "global_step": 53585, "epoch": 645} {"train_loss": -19.890304565429688, "global_step": 53586, "epoch": 645} {"train_loss": -20.011829376220703, "global_step": 53587, "epoch": 645} {"train_loss": -20.317363739013672, "global_step": 53588, "epoch": 645} {"train_loss": -19.773529052734375, "global_step": 53589, "epoch": 645} {"train_loss": -20.04566764831543, "global_step": 53590, "epoch": 645} {"train_loss": -20.59559440612793, "global_step": 53591, "epoch": 645} {"train_loss": -19.751049041748047, "global_step": 53592, "epoch": 645} {"train_loss": -20.03168487548828, "global_step": 53593, "epoch": 645} {"train_loss": -20.392911911010742, "global_step": 53594, "epoch": 645} {"train_loss": -19.849454879760742, "global_step": 53595, "epoch": 645} {"train_loss": -20.391098022460938, "global_step": 53596, "epoch": 645} {"train_loss": -20.058542251586914, "global_step": 53597, "epoch": 645} {"train_loss": -20.068166732788086, "global_step": 53598, "epoch": 645} {"train_loss": -20.160932540893555, "global_step": 53599, "epoch": 645} {"train_loss": -20.011526107788086, "global_step": 53600, "epoch": 645} {"train_loss": -20.20002555847168, "global_step": 53601, "epoch": 645} {"train_loss": -20.135334014892578, "global_step": 53602, "epoch": 645} {"train_loss": -20.423999786376953, "global_step": 53603, "epoch": 645} {"train_loss": -19.846025466918945, "global_step": 53604, "epoch": 645} {"train_loss": -20.419538497924805, "global_step": 53605, "epoch": 645} {"train_loss": -20.350696563720703, "global_step": 53606, "epoch": 645} {"train_loss": -20.084484100341797, "global_step": 53607, "epoch": 645} {"train_loss": -20.267444610595703, "global_step": 53608, "epoch": 645} {"train_loss": -20.16446876525879, "global_step": 53609, "epoch": 645} {"train_loss": -19.787738800048828, "global_step": 53610, "epoch": 645} {"train_loss": -20.134109497070312, "global_step": 53611, "epoch": 645} {"train_loss": -20.32242774963379, "global_step": 53612, "epoch": 645} {"train_loss": -19.84610366821289, "global_step": 53613, "epoch": 645} {"train_loss": -20.08709716796875, "global_step": 53614, "epoch": 645} {"train_loss": -20.286954879760742, "global_step": 53615, "epoch": 645} {"train_loss": -19.849790573120117, "global_step": 53616, "epoch": 645} {"train_loss": -20.076884488025343, "global_step": 53617, "epoch": 645, "val_loss": 6187631.5} {"train_loss": -19.60158348083496, "global_step": 53618, "epoch": 646} {"train_loss": -20.0991268157959, "global_step": 53619, "epoch": 646} {"train_loss": -19.779050827026367, "global_step": 53620, "epoch": 646} {"train_loss": -20.086545944213867, "global_step": 53621, "epoch": 646} {"train_loss": -19.85841178894043, "global_step": 53622, "epoch": 646} {"train_loss": -20.13565444946289, "global_step": 53623, "epoch": 646} {"train_loss": -20.024246215820312, "global_step": 53624, "epoch": 646} {"train_loss": -20.2280330657959, "global_step": 53625, "epoch": 646} {"train_loss": -19.872501373291016, "global_step": 53626, "epoch": 646} {"train_loss": -20.34116554260254, "global_step": 53627, "epoch": 646} {"train_loss": -19.720266342163086, "global_step": 53628, "epoch": 646} {"train_loss": -20.281240463256836, "global_step": 53629, "epoch": 646} {"train_loss": -20.137598037719727, "global_step": 53630, "epoch": 646} {"train_loss": -20.007543563842773, "global_step": 53631, "epoch": 646} {"train_loss": -19.958913803100586, "global_step": 53632, "epoch": 646} {"train_loss": -20.423673629760742, "global_step": 53633, "epoch": 646} {"train_loss": -20.3837947845459, "global_step": 53634, "epoch": 646} {"train_loss": -20.1926326751709, "global_step": 53635, "epoch": 646} {"train_loss": -19.94832420349121, "global_step": 53636, "epoch": 646} {"train_loss": -20.19247055053711, "global_step": 53637, "epoch": 646} {"train_loss": -19.982446670532227, "global_step": 53638, "epoch": 646} {"train_loss": -20.107236862182617, "global_step": 53639, "epoch": 646} {"train_loss": -19.81049346923828, "global_step": 53640, "epoch": 646} {"train_loss": -20.235883712768555, "global_step": 53641, "epoch": 646} {"train_loss": -20.213571548461914, "global_step": 53642, "epoch": 646} {"train_loss": -20.443037033081055, "global_step": 53643, "epoch": 646} {"train_loss": -19.965900421142578, "global_step": 53644, "epoch": 646} {"train_loss": -20.064889907836914, "global_step": 53645, "epoch": 646} {"train_loss": -20.021726608276367, "global_step": 53646, "epoch": 646} {"train_loss": -19.9515380859375, "global_step": 53647, "epoch": 646} {"train_loss": -19.913694381713867, "global_step": 53648, "epoch": 646} {"train_loss": -19.840778350830078, "global_step": 53649, "epoch": 646} {"train_loss": -19.96671485900879, "global_step": 53650, "epoch": 646} {"train_loss": -19.73998260498047, "global_step": 53651, "epoch": 646} {"train_loss": -20.073835372924805, "global_step": 53652, "epoch": 646} {"train_loss": -20.663475036621094, "global_step": 53653, "epoch": 646} {"train_loss": -20.45998191833496, "global_step": 53654, "epoch": 646} {"train_loss": -19.92753791809082, "global_step": 53655, "epoch": 646} {"train_loss": -19.8797607421875, "global_step": 53656, "epoch": 646} {"train_loss": -20.405014038085938, "global_step": 53657, "epoch": 646} {"train_loss": -20.234027862548828, "global_step": 53658, "epoch": 646} {"train_loss": -20.336090087890625, "global_step": 53659, "epoch": 646} {"train_loss": -20.377241134643555, "global_step": 53660, "epoch": 646} {"train_loss": -19.852914810180664, "global_step": 53661, "epoch": 646} {"train_loss": -20.076953887939453, "global_step": 53662, "epoch": 646} {"train_loss": -20.410140991210938, "global_step": 53663, "epoch": 646} {"train_loss": -20.043237686157227, "global_step": 53664, "epoch": 646} {"train_loss": -20.08646583557129, "global_step": 53665, "epoch": 646} {"train_loss": -20.395549774169922, "global_step": 53666, "epoch": 646} {"train_loss": -19.761213302612305, "global_step": 53667, "epoch": 646} {"train_loss": -20.218164443969727, "global_step": 53668, "epoch": 646} {"train_loss": -20.24883270263672, "global_step": 53669, "epoch": 646} {"train_loss": -19.449941635131836, "global_step": 53670, "epoch": 646} {"train_loss": -20.065031051635742, "global_step": 53671, "epoch": 646} {"train_loss": -20.029346466064453, "global_step": 53672, "epoch": 646} {"train_loss": -20.256250381469727, "global_step": 53673, "epoch": 646} {"train_loss": -20.04376792907715, "global_step": 53674, "epoch": 646} {"train_loss": -20.087247848510742, "global_step": 53675, "epoch": 646} {"train_loss": -20.12917137145996, "global_step": 53676, "epoch": 646} {"train_loss": -19.945240020751953, "global_step": 53677, "epoch": 646} {"train_loss": -20.104690551757812, "global_step": 53678, "epoch": 646} {"train_loss": -19.724308013916016, "global_step": 53679, "epoch": 646} {"train_loss": -19.941335678100586, "global_step": 53680, "epoch": 646} {"train_loss": -19.918142318725586, "global_step": 53681, "epoch": 646} {"train_loss": -20.287078857421875, "global_step": 53682, "epoch": 646} {"train_loss": -20.41823387145996, "global_step": 53683, "epoch": 646} {"train_loss": -20.005022048950195, "global_step": 53684, "epoch": 646} {"train_loss": -19.813247680664062, "global_step": 53685, "epoch": 646} {"train_loss": -20.19550895690918, "global_step": 53686, "epoch": 646} {"train_loss": -20.199155807495117, "global_step": 53687, "epoch": 646} {"train_loss": -20.101171493530273, "global_step": 53688, "epoch": 646} {"train_loss": -19.8905086517334, "global_step": 53689, "epoch": 646} {"train_loss": -20.114831924438477, "global_step": 53690, "epoch": 646} {"train_loss": -20.43255043029785, "global_step": 53691, "epoch": 646} {"train_loss": -20.380189895629883, "global_step": 53692, "epoch": 646} {"train_loss": -20.07376480102539, "global_step": 53693, "epoch": 646} {"train_loss": -20.28956413269043, "global_step": 53694, "epoch": 646} {"train_loss": -20.193174362182617, "global_step": 53695, "epoch": 646} {"train_loss": -19.99248504638672, "global_step": 53696, "epoch": 646} {"train_loss": -20.559415817260742, "global_step": 53697, "epoch": 646} {"train_loss": -20.3696346282959, "global_step": 53698, "epoch": 646} {"train_loss": -20.3729248046875, "global_step": 53699, "epoch": 646} {"train_loss": -20.118241344589784, "global_step": 53700, "epoch": 646, "val_loss": 6023374.0} {"train_loss": -19.923032760620117, "global_step": 53701, "epoch": 647} {"train_loss": -19.72756004333496, "global_step": 53702, "epoch": 647} {"train_loss": -19.67213249206543, "global_step": 53703, "epoch": 647} {"train_loss": -19.799213409423828, "global_step": 53704, "epoch": 647} {"train_loss": -20.088668823242188, "global_step": 53705, "epoch": 647} {"train_loss": -19.61519432067871, "global_step": 53706, "epoch": 647} {"train_loss": -19.76924705505371, "global_step": 53707, "epoch": 647} {"train_loss": -19.364072799682617, "global_step": 53708, "epoch": 647} {"train_loss": -20.2290096282959, "global_step": 53709, "epoch": 647} {"train_loss": -20.119369506835938, "global_step": 53710, "epoch": 647} {"train_loss": -19.5709228515625, "global_step": 53711, "epoch": 647} {"train_loss": -19.746566772460938, "global_step": 53712, "epoch": 647} {"train_loss": -19.86419677734375, "global_step": 53713, "epoch": 647} {"train_loss": -20.17144775390625, "global_step": 53714, "epoch": 647} {"train_loss": -19.80592918395996, "global_step": 53715, "epoch": 647} {"train_loss": -20.069568634033203, "global_step": 53716, "epoch": 647} {"train_loss": -19.96082878112793, "global_step": 53717, "epoch": 647} {"train_loss": -20.180770874023438, "global_step": 53718, "epoch": 647} {"train_loss": -19.82875633239746, "global_step": 53719, "epoch": 647} {"train_loss": -20.350614547729492, "global_step": 53720, "epoch": 647} {"train_loss": -20.03037452697754, "global_step": 53721, "epoch": 647} {"train_loss": -20.410078048706055, "global_step": 53722, "epoch": 647} {"train_loss": -20.238447189331055, "global_step": 53723, "epoch": 647} {"train_loss": -20.0952091217041, "global_step": 53724, "epoch": 647} {"train_loss": -20.00107765197754, "global_step": 53725, "epoch": 647} {"train_loss": -19.91123390197754, "global_step": 53726, "epoch": 647} {"train_loss": -20.052797317504883, "global_step": 53727, "epoch": 647} {"train_loss": -20.00919532775879, "global_step": 53728, "epoch": 647} {"train_loss": -20.412038803100586, "global_step": 53729, "epoch": 647} {"train_loss": -20.383100509643555, "global_step": 53730, "epoch": 647} {"train_loss": -20.10020637512207, "global_step": 53731, "epoch": 647} {"train_loss": -20.078819274902344, "global_step": 53732, "epoch": 647} {"train_loss": -20.18111228942871, "global_step": 53733, "epoch": 647} {"train_loss": -20.04578399658203, "global_step": 53734, "epoch": 647} {"train_loss": -20.26263999938965, "global_step": 53735, "epoch": 647} {"train_loss": -19.99930191040039, "global_step": 53736, "epoch": 647} {"train_loss": -19.888320922851562, "global_step": 53737, "epoch": 647} {"train_loss": -20.25569725036621, "global_step": 53738, "epoch": 647} {"train_loss": -20.055940628051758, "global_step": 53739, "epoch": 647} {"train_loss": -20.085132598876953, "global_step": 53740, "epoch": 647} {"train_loss": -20.2714786529541, "global_step": 53741, "epoch": 647} {"train_loss": -19.845279693603516, "global_step": 53742, "epoch": 647} {"train_loss": -20.165136337280273, "global_step": 53743, "epoch": 647} {"train_loss": -20.111373901367188, "global_step": 53744, "epoch": 647} {"train_loss": -19.824419021606445, "global_step": 53745, "epoch": 647} {"train_loss": -20.04970359802246, "global_step": 53746, "epoch": 647} {"train_loss": -20.10104751586914, "global_step": 53747, "epoch": 647} {"train_loss": -20.0827579498291, "global_step": 53748, "epoch": 647} {"train_loss": -20.19302749633789, "global_step": 53749, "epoch": 647} {"train_loss": -20.086669921875, "global_step": 53750, "epoch": 647} {"train_loss": -20.524093627929688, "global_step": 53751, "epoch": 647} {"train_loss": -19.948347091674805, "global_step": 53752, "epoch": 647} {"train_loss": -20.28281021118164, "global_step": 53753, "epoch": 647} {"train_loss": -19.94516372680664, "global_step": 53754, "epoch": 647} {"train_loss": -20.23683738708496, "global_step": 53755, "epoch": 647} {"train_loss": -20.03910255432129, "global_step": 53756, "epoch": 647} {"train_loss": -20.28374671936035, "global_step": 53757, "epoch": 647} {"train_loss": -20.00691795349121, "global_step": 53758, "epoch": 647} {"train_loss": -20.01175880432129, "global_step": 53759, "epoch": 647} {"train_loss": -20.1386661529541, "global_step": 53760, "epoch": 647} {"train_loss": -20.14031982421875, "global_step": 53761, "epoch": 647} {"train_loss": -20.53864097595215, "global_step": 53762, "epoch": 647} {"train_loss": -20.348608016967773, "global_step": 53763, "epoch": 647} {"train_loss": -20.055068969726562, "global_step": 53764, "epoch": 647} {"train_loss": -20.523765563964844, "global_step": 53765, "epoch": 647} {"train_loss": -20.219970703125, "global_step": 53766, "epoch": 647} {"train_loss": -19.97162437438965, "global_step": 53767, "epoch": 647} {"train_loss": -20.084049224853516, "global_step": 53768, "epoch": 647} {"train_loss": -19.8714542388916, "global_step": 53769, "epoch": 647} {"train_loss": -20.226999282836914, "global_step": 53770, "epoch": 647} {"train_loss": -19.994131088256836, "global_step": 53771, "epoch": 647} {"train_loss": -20.05147361755371, "global_step": 53772, "epoch": 647} {"train_loss": -20.205102920532227, "global_step": 53773, "epoch": 647} {"train_loss": -20.174240112304688, "global_step": 53774, "epoch": 647} {"train_loss": -20.159603118896484, "global_step": 53775, "epoch": 647} {"train_loss": -19.922033309936523, "global_step": 53776, "epoch": 647} {"train_loss": -19.83437156677246, "global_step": 53777, "epoch": 647} {"train_loss": -20.252904891967773, "global_step": 53778, "epoch": 647} {"train_loss": -20.0136775970459, "global_step": 53779, "epoch": 647} {"train_loss": -20.07279396057129, "global_step": 53780, "epoch": 647} {"train_loss": -20.027189254760742, "global_step": 53781, "epoch": 647} {"train_loss": -20.066564559936523, "global_step": 53782, "epoch": 647} {"train_loss": -20.044752764414593, "global_step": 53783, "epoch": 647, "val_loss": 5963484.5} {"train_loss": -19.455318450927734, "global_step": 53784, "epoch": 648} {"train_loss": -20.14310073852539, "global_step": 53785, "epoch": 648} {"train_loss": -19.424306869506836, "global_step": 53786, "epoch": 648} {"train_loss": -19.956876754760742, "global_step": 53787, "epoch": 648} {"train_loss": -19.71076202392578, "global_step": 53788, "epoch": 648} {"train_loss": -19.783628463745117, "global_step": 53789, "epoch": 648} {"train_loss": -19.73016357421875, "global_step": 53790, "epoch": 648} {"train_loss": -19.778486251831055, "global_step": 53791, "epoch": 648} {"train_loss": -19.825902938842773, "global_step": 53792, "epoch": 648} {"train_loss": -19.760160446166992, "global_step": 53793, "epoch": 648} {"train_loss": -19.705352783203125, "global_step": 53794, "epoch": 648} {"train_loss": -19.675193786621094, "global_step": 53795, "epoch": 648} {"train_loss": -19.44464683532715, "global_step": 53796, "epoch": 648} {"train_loss": -19.788476943969727, "global_step": 53797, "epoch": 648} {"train_loss": -19.880374908447266, "global_step": 53798, "epoch": 648} {"train_loss": -20.051586151123047, "global_step": 53799, "epoch": 648} {"train_loss": -20.26105308532715, "global_step": 53800, "epoch": 648} {"train_loss": -19.840869903564453, "global_step": 53801, "epoch": 648} {"train_loss": -20.399600982666016, "global_step": 53802, "epoch": 648} {"train_loss": -19.9473819732666, "global_step": 53803, "epoch": 648} {"train_loss": -19.962345123291016, "global_step": 53804, "epoch": 648} {"train_loss": -19.91719627380371, "global_step": 53805, "epoch": 648} {"train_loss": -20.16415786743164, "global_step": 53806, "epoch": 648} {"train_loss": -20.31294059753418, "global_step": 53807, "epoch": 648} {"train_loss": -19.713134765625, "global_step": 53808, "epoch": 648} {"train_loss": -19.82716941833496, "global_step": 53809, "epoch": 648} {"train_loss": -20.431543350219727, "global_step": 53810, "epoch": 648} {"train_loss": -19.824602127075195, "global_step": 53811, "epoch": 648} {"train_loss": -20.02888298034668, "global_step": 53812, "epoch": 648} {"train_loss": -20.138778686523438, "global_step": 53813, "epoch": 648} {"train_loss": -20.12525749206543, "global_step": 53814, "epoch": 648} {"train_loss": -20.075939178466797, "global_step": 53815, "epoch": 648} {"train_loss": -20.267372131347656, "global_step": 53816, "epoch": 648} {"train_loss": -20.347810745239258, "global_step": 53817, "epoch": 648} {"train_loss": -20.281585693359375, "global_step": 53818, "epoch": 648} {"train_loss": -20.43558120727539, "global_step": 53819, "epoch": 648} {"train_loss": -20.265705108642578, "global_step": 53820, "epoch": 648} {"train_loss": -20.479578018188477, "global_step": 53821, "epoch": 648} {"train_loss": -20.442182540893555, "global_step": 53822, "epoch": 648} {"train_loss": -20.072460174560547, "global_step": 53823, "epoch": 648} {"train_loss": -20.105337142944336, "global_step": 53824, "epoch": 648} {"train_loss": -20.56526756286621, "global_step": 53825, "epoch": 648} {"train_loss": -19.684022903442383, "global_step": 53826, "epoch": 648} {"train_loss": -20.09493064880371, "global_step": 53827, "epoch": 648} {"train_loss": -20.222482681274414, "global_step": 53828, "epoch": 648} {"train_loss": -20.50251579284668, "global_step": 53829, "epoch": 648} {"train_loss": -20.112592697143555, "global_step": 53830, "epoch": 648} {"train_loss": -20.49911880493164, "global_step": 53831, "epoch": 648} {"train_loss": -20.371936798095703, "global_step": 53832, "epoch": 648} {"train_loss": -20.302412033081055, "global_step": 53833, "epoch": 648} {"train_loss": -20.160598754882812, "global_step": 53834, "epoch": 648} {"train_loss": -19.90639877319336, "global_step": 53835, "epoch": 648} {"train_loss": -20.142520904541016, "global_step": 53836, "epoch": 648} {"train_loss": -20.080387115478516, "global_step": 53837, "epoch": 648} {"train_loss": -20.058822631835938, "global_step": 53838, "epoch": 648} {"train_loss": -20.155548095703125, "global_step": 53839, "epoch": 648} {"train_loss": -19.91650390625, "global_step": 53840, "epoch": 648} {"train_loss": -20.040332794189453, "global_step": 53841, "epoch": 648} {"train_loss": -20.10002899169922, "global_step": 53842, "epoch": 648} {"train_loss": -19.60525894165039, "global_step": 53843, "epoch": 648} {"train_loss": -20.15916633605957, "global_step": 53844, "epoch": 648} {"train_loss": -19.992664337158203, "global_step": 53845, "epoch": 648} {"train_loss": -20.2081356048584, "global_step": 53846, "epoch": 648} {"train_loss": -20.291275024414062, "global_step": 53847, "epoch": 648} {"train_loss": -20.379560470581055, "global_step": 53848, "epoch": 648} {"train_loss": -20.317161560058594, "global_step": 53849, "epoch": 648} {"train_loss": -20.39847755432129, "global_step": 53850, "epoch": 648} {"train_loss": -20.161623001098633, "global_step": 53851, "epoch": 648} {"train_loss": -20.174951553344727, "global_step": 53852, "epoch": 648} {"train_loss": -20.218473434448242, "global_step": 53853, "epoch": 648} {"train_loss": -20.28666114807129, "global_step": 53854, "epoch": 648} {"train_loss": -19.931005477905273, "global_step": 53855, "epoch": 648} {"train_loss": -20.174306869506836, "global_step": 53856, "epoch": 648} {"train_loss": -19.636816024780273, "global_step": 53857, "epoch": 648} {"train_loss": -20.165433883666992, "global_step": 53858, "epoch": 648} {"train_loss": -19.812746047973633, "global_step": 53859, "epoch": 648} {"train_loss": -20.27588653564453, "global_step": 53860, "epoch": 648} {"train_loss": -20.250572204589844, "global_step": 53861, "epoch": 648} {"train_loss": -20.129728317260742, "global_step": 53862, "epoch": 648} {"train_loss": -20.009552001953125, "global_step": 53863, "epoch": 648} {"train_loss": -19.989871978759766, "global_step": 53864, "epoch": 648} {"train_loss": -20.077041625976562, "global_step": 53865, "epoch": 648} {"train_loss": -20.061302874461713, "global_step": 53866, "epoch": 648, "val_loss": 5855771.5} {"train_loss": -19.646284103393555, "global_step": 53867, "epoch": 649} {"train_loss": -19.71742820739746, "global_step": 53868, "epoch": 649} {"train_loss": -19.923593521118164, "global_step": 53869, "epoch": 649} {"train_loss": -19.932605743408203, "global_step": 53870, "epoch": 649} {"train_loss": -20.008848190307617, "global_step": 53871, "epoch": 649} {"train_loss": -19.780414581298828, "global_step": 53872, "epoch": 649} {"train_loss": -19.853200912475586, "global_step": 53873, "epoch": 649} {"train_loss": -19.78523063659668, "global_step": 53874, "epoch": 649} {"train_loss": -20.244293212890625, "global_step": 53875, "epoch": 649} {"train_loss": -19.99502182006836, "global_step": 53876, "epoch": 649} {"train_loss": -19.923120498657227, "global_step": 53877, "epoch": 649} {"train_loss": -19.915639877319336, "global_step": 53878, "epoch": 649} {"train_loss": -20.201719284057617, "global_step": 53879, "epoch": 649} {"train_loss": -19.685842514038086, "global_step": 53880, "epoch": 649} {"train_loss": -20.00608253479004, "global_step": 53881, "epoch": 649} {"train_loss": -19.67832374572754, "global_step": 53882, "epoch": 649} {"train_loss": -20.29865837097168, "global_step": 53883, "epoch": 649} {"train_loss": -20.181028366088867, "global_step": 53884, "epoch": 649} {"train_loss": -19.984983444213867, "global_step": 53885, "epoch": 649} {"train_loss": -19.88869285583496, "global_step": 53886, "epoch": 649} {"train_loss": -20.185956954956055, "global_step": 53887, "epoch": 649} {"train_loss": -20.450275421142578, "global_step": 53888, "epoch": 649} {"train_loss": -20.113235473632812, "global_step": 53889, "epoch": 649} {"train_loss": -20.214126586914062, "global_step": 53890, "epoch": 649} {"train_loss": -19.871885299682617, "global_step": 53891, "epoch": 649} {"train_loss": -20.078725814819336, "global_step": 53892, "epoch": 649} {"train_loss": -20.06881332397461, "global_step": 53893, "epoch": 649} {"train_loss": -19.942840576171875, "global_step": 53894, "epoch": 649} {"train_loss": -20.0024471282959, "global_step": 53895, "epoch": 649} {"train_loss": -19.935819625854492, "global_step": 53896, "epoch": 649} {"train_loss": -20.436159133911133, "global_step": 53897, "epoch": 649} {"train_loss": -19.733076095581055, "global_step": 53898, "epoch": 649} {"train_loss": -20.49264907836914, "global_step": 53899, "epoch": 649} {"train_loss": -20.14206886291504, "global_step": 53900, "epoch": 649} {"train_loss": -20.28500747680664, "global_step": 53901, "epoch": 649} {"train_loss": -20.12460708618164, "global_step": 53902, "epoch": 649} {"train_loss": -20.14179801940918, "global_step": 53903, "epoch": 649} {"train_loss": -19.363279342651367, "global_step": 53904, "epoch": 649} {"train_loss": -20.48883819580078, "global_step": 53905, "epoch": 649} {"train_loss": -20.255189895629883, "global_step": 53906, "epoch": 649} {"train_loss": -20.13313865661621, "global_step": 53907, "epoch": 649} {"train_loss": -19.7127685546875, "global_step": 53908, "epoch": 649} {"train_loss": -20.346271514892578, "global_step": 53909, "epoch": 649} {"train_loss": -20.30083656311035, "global_step": 53910, "epoch": 649} {"train_loss": -20.13387107849121, "global_step": 53911, "epoch": 649} {"train_loss": -20.290298461914062, "global_step": 53912, "epoch": 649} {"train_loss": -20.06653594970703, "global_step": 53913, "epoch": 649} {"train_loss": -20.219058990478516, "global_step": 53914, "epoch": 649} {"train_loss": -20.300504684448242, "global_step": 53915, "epoch": 649} {"train_loss": -19.93473243713379, "global_step": 53916, "epoch": 649} {"train_loss": -19.856277465820312, "global_step": 53917, "epoch": 649} {"train_loss": -19.80792236328125, "global_step": 53918, "epoch": 649} {"train_loss": -20.16261863708496, "global_step": 53919, "epoch": 649} {"train_loss": -19.990358352661133, "global_step": 53920, "epoch": 649} {"train_loss": -19.88996696472168, "global_step": 53921, "epoch": 649} {"train_loss": -20.045211791992188, "global_step": 53922, "epoch": 649} {"train_loss": -19.92656135559082, "global_step": 53923, "epoch": 649} {"train_loss": -19.891971588134766, "global_step": 53924, "epoch": 649} {"train_loss": -19.903106689453125, "global_step": 53925, "epoch": 649} {"train_loss": -20.13472557067871, "global_step": 53926, "epoch": 649} {"train_loss": -19.905811309814453, "global_step": 53927, "epoch": 649} {"train_loss": -20.08420181274414, "global_step": 53928, "epoch": 649} {"train_loss": -20.277433395385742, "global_step": 53929, "epoch": 649} {"train_loss": -20.154605865478516, "global_step": 53930, "epoch": 649} {"train_loss": -20.24967384338379, "global_step": 53931, "epoch": 649} {"train_loss": -20.17839813232422, "global_step": 53932, "epoch": 649} {"train_loss": -20.425302505493164, "global_step": 53933, "epoch": 649} {"train_loss": -19.949262619018555, "global_step": 53934, "epoch": 649} {"train_loss": -19.869062423706055, "global_step": 53935, "epoch": 649} {"train_loss": -20.01331901550293, "global_step": 53936, "epoch": 649} {"train_loss": -20.640783309936523, "global_step": 53937, "epoch": 649} {"train_loss": -20.294050216674805, "global_step": 53938, "epoch": 649} {"train_loss": -20.502763748168945, "global_step": 53939, "epoch": 649} {"train_loss": -20.22307586669922, "global_step": 53940, "epoch": 649} {"train_loss": -20.17340660095215, "global_step": 53941, "epoch": 649} {"train_loss": -20.320459365844727, "global_step": 53942, "epoch": 649} {"train_loss": -20.159791946411133, "global_step": 53943, "epoch": 649} {"train_loss": -20.36353874206543, "global_step": 53944, "epoch": 649} {"train_loss": -20.025522232055664, "global_step": 53945, "epoch": 649} {"train_loss": -20.155479431152344, "global_step": 53946, "epoch": 649} {"train_loss": -20.166160583496094, "global_step": 53947, "epoch": 649} {"train_loss": -20.315988540649414, "global_step": 53948, "epoch": 649} {"train_loss": -20.09014301989452, "global_step": 53949, "epoch": 649, "val_loss": 5999670.0} {"train_loss": -19.31965446472168, "global_step": 53950, "epoch": 650} {"train_loss": -19.74646759033203, "global_step": 53951, "epoch": 650} {"train_loss": -19.623069763183594, "global_step": 53952, "epoch": 650} {"train_loss": -20.18338966369629, "global_step": 53953, "epoch": 650} {"train_loss": -20.005619049072266, "global_step": 53954, "epoch": 650} {"train_loss": -20.124740600585938, "global_step": 53955, "epoch": 650} {"train_loss": -19.858556747436523, "global_step": 53956, "epoch": 650} {"train_loss": -20.32753562927246, "global_step": 53957, "epoch": 650} {"train_loss": -19.9269962310791, "global_step": 53958, "epoch": 650} {"train_loss": -20.04335594177246, "global_step": 53959, "epoch": 650} {"train_loss": -19.91006851196289, "global_step": 53960, "epoch": 650} {"train_loss": -19.88163948059082, "global_step": 53961, "epoch": 650} {"train_loss": -20.168567657470703, "global_step": 53962, "epoch": 650} {"train_loss": -20.17616844177246, "global_step": 53963, "epoch": 650} {"train_loss": -20.248798370361328, "global_step": 53964, "epoch": 650} {"train_loss": -19.729421615600586, "global_step": 53965, "epoch": 650} {"train_loss": -20.08803367614746, "global_step": 53966, "epoch": 650} {"train_loss": -20.007978439331055, "global_step": 53967, "epoch": 650} {"train_loss": -20.24560546875, "global_step": 53968, "epoch": 650} {"train_loss": -20.130935668945312, "global_step": 53969, "epoch": 650} {"train_loss": -19.908267974853516, "global_step": 53970, "epoch": 650} {"train_loss": -19.92072868347168, "global_step": 53971, "epoch": 650} {"train_loss": -20.10685920715332, "global_step": 53972, "epoch": 650} {"train_loss": -19.816938400268555, "global_step": 53973, "epoch": 650} {"train_loss": -20.127634048461914, "global_step": 53974, "epoch": 650} {"train_loss": -20.231943130493164, "global_step": 53975, "epoch": 650} {"train_loss": -19.94537353515625, "global_step": 53976, "epoch": 650} {"train_loss": -19.835081100463867, "global_step": 53977, "epoch": 650} {"train_loss": -19.862558364868164, "global_step": 53978, "epoch": 650} {"train_loss": -20.190950393676758, "global_step": 53979, "epoch": 650} {"train_loss": -20.47425651550293, "global_step": 53980, "epoch": 650} {"train_loss": -20.282743453979492, "global_step": 53981, "epoch": 650} {"train_loss": -20.195804595947266, "global_step": 53982, "epoch": 650} {"train_loss": -20.078624725341797, "global_step": 53983, "epoch": 650} {"train_loss": -20.33255958557129, "global_step": 53984, "epoch": 650} {"train_loss": -20.11502456665039, "global_step": 53985, "epoch": 650} {"train_loss": -20.222061157226562, "global_step": 53986, "epoch": 650} {"train_loss": -20.157079696655273, "global_step": 53987, "epoch": 650} {"train_loss": -19.927410125732422, "global_step": 53988, "epoch": 650} {"train_loss": -20.039703369140625, "global_step": 53989, "epoch": 650} {"train_loss": -19.932861328125, "global_step": 53990, "epoch": 650} {"train_loss": -20.283649444580078, "global_step": 53991, "epoch": 650} {"train_loss": -20.27345085144043, "global_step": 53992, "epoch": 650} {"train_loss": -19.89094352722168, "global_step": 53993, "epoch": 650} {"train_loss": -20.108922958374023, "global_step": 53994, "epoch": 650} {"train_loss": -20.44871711730957, "global_step": 53995, "epoch": 650} {"train_loss": -20.011159896850586, "global_step": 53996, "epoch": 650} {"train_loss": -19.943716049194336, "global_step": 53997, "epoch": 650} {"train_loss": -20.282255172729492, "global_step": 53998, "epoch": 650} {"train_loss": -20.447980880737305, "global_step": 53999, "epoch": 650} {"train_loss": -20.60273551940918, "global_step": 54000, "epoch": 650} {"train_loss": -20.05754852294922, "global_step": 54001, "epoch": 650} {"train_loss": -20.42713737487793, "global_step": 54002, "epoch": 650} {"train_loss": -20.06416893005371, "global_step": 54003, "epoch": 650} {"train_loss": -20.409290313720703, "global_step": 54004, "epoch": 650} {"train_loss": -20.13273048400879, "global_step": 54005, "epoch": 650} {"train_loss": -20.19347381591797, "global_step": 54006, "epoch": 650} {"train_loss": -20.1803035736084, "global_step": 54007, "epoch": 650} {"train_loss": -20.165739059448242, "global_step": 54008, "epoch": 650} {"train_loss": -20.111404418945312, "global_step": 54009, "epoch": 650} {"train_loss": -20.186969757080078, "global_step": 54010, "epoch": 650} {"train_loss": -20.0793514251709, "global_step": 54011, "epoch": 650} {"train_loss": -20.07781982421875, "global_step": 54012, "epoch": 650} {"train_loss": -19.815412521362305, "global_step": 54013, "epoch": 650} {"train_loss": -20.231266021728516, "global_step": 54014, "epoch": 650} {"train_loss": -20.007984161376953, "global_step": 54015, "epoch": 650} {"train_loss": -19.874805450439453, "global_step": 54016, "epoch": 650} {"train_loss": -20.352399826049805, "global_step": 54017, "epoch": 650} {"train_loss": -19.891616821289062, "global_step": 54018, "epoch": 650} {"train_loss": -19.83051300048828, "global_step": 54019, "epoch": 650} {"train_loss": -19.868375778198242, "global_step": 54020, "epoch": 650} {"train_loss": -20.235681533813477, "global_step": 54021, "epoch": 650} {"train_loss": -20.236642837524414, "global_step": 54022, "epoch": 650} {"train_loss": -19.761493682861328, "global_step": 54023, "epoch": 650} {"train_loss": -20.34786605834961, "global_step": 54024, "epoch": 650} {"train_loss": -20.283340454101562, "global_step": 54025, "epoch": 650} {"train_loss": -19.957197189331055, "global_step": 54026, "epoch": 650} {"train_loss": -19.979904174804688, "global_step": 54027, "epoch": 650} {"train_loss": -19.90131950378418, "global_step": 54028, "epoch": 650} {"train_loss": -20.13091468811035, "global_step": 54029, "epoch": 650} {"train_loss": -20.512271881103516, "global_step": 54030, "epoch": 650} {"train_loss": -20.197851181030273, "global_step": 54031, "epoch": 650} {"train_loss": -20.06756258585367, "global_step": 54032, "epoch": 650, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6110272.5} {"train_loss": -19.987863540649414, "global_step": 54033, "epoch": 651} {"train_loss": -20.09737205505371, "global_step": 54034, "epoch": 651} {"train_loss": -19.78047752380371, "global_step": 54035, "epoch": 651} {"train_loss": -19.963407516479492, "global_step": 54036, "epoch": 651} {"train_loss": -19.94292449951172, "global_step": 54037, "epoch": 651} {"train_loss": -19.976715087890625, "global_step": 54038, "epoch": 651} {"train_loss": -19.88300132751465, "global_step": 54039, "epoch": 651} {"train_loss": -20.328386306762695, "global_step": 54040, "epoch": 651} {"train_loss": -19.757526397705078, "global_step": 54041, "epoch": 651} {"train_loss": -20.10854148864746, "global_step": 54042, "epoch": 651} {"train_loss": -19.865726470947266, "global_step": 54043, "epoch": 651} {"train_loss": -19.79561424255371, "global_step": 54044, "epoch": 651} {"train_loss": -19.665542602539062, "global_step": 54045, "epoch": 651} {"train_loss": -19.764507293701172, "global_step": 54046, "epoch": 651} {"train_loss": -19.774641036987305, "global_step": 54047, "epoch": 651} {"train_loss": -20.13671875, "global_step": 54048, "epoch": 651} {"train_loss": -20.252944946289062, "global_step": 54049, "epoch": 651} {"train_loss": -20.230518341064453, "global_step": 54050, "epoch": 651} {"train_loss": -19.827716827392578, "global_step": 54051, "epoch": 651} {"train_loss": -20.03840446472168, "global_step": 54052, "epoch": 651} {"train_loss": -20.03278160095215, "global_step": 54053, "epoch": 651} {"train_loss": -20.111164093017578, "global_step": 54054, "epoch": 651} {"train_loss": -20.364011764526367, "global_step": 54055, "epoch": 651} {"train_loss": -19.734283447265625, "global_step": 54056, "epoch": 651} {"train_loss": -20.23264503479004, "global_step": 54057, "epoch": 651} {"train_loss": -20.06805419921875, "global_step": 54058, "epoch": 651} {"train_loss": -20.26263427734375, "global_step": 54059, "epoch": 651} {"train_loss": -20.010223388671875, "global_step": 54060, "epoch": 651} {"train_loss": -19.813220977783203, "global_step": 54061, "epoch": 651} {"train_loss": -20.266979217529297, "global_step": 54062, "epoch": 651} {"train_loss": -20.008991241455078, "global_step": 54063, "epoch": 651} {"train_loss": -19.917993545532227, "global_step": 54064, "epoch": 651} {"train_loss": -20.21917152404785, "global_step": 54065, "epoch": 651} {"train_loss": -20.09490966796875, "global_step": 54066, "epoch": 651} {"train_loss": -19.867536544799805, "global_step": 54067, "epoch": 651} {"train_loss": -19.8666934967041, "global_step": 54068, "epoch": 651} {"train_loss": -20.279586791992188, "global_step": 54069, "epoch": 651} {"train_loss": -20.327289581298828, "global_step": 54070, "epoch": 651} {"train_loss": -19.953828811645508, "global_step": 54071, "epoch": 651} {"train_loss": -20.236528396606445, "global_step": 54072, "epoch": 651} {"train_loss": -20.046184539794922, "global_step": 54073, "epoch": 651} {"train_loss": -20.238330841064453, "global_step": 54074, "epoch": 651} {"train_loss": -20.00640296936035, "global_step": 54075, "epoch": 651} {"train_loss": -20.29340362548828, "global_step": 54076, "epoch": 651} {"train_loss": -20.082746505737305, "global_step": 54077, "epoch": 651} {"train_loss": -20.057735443115234, "global_step": 54078, "epoch": 651} {"train_loss": -20.114749908447266, "global_step": 54079, "epoch": 651} {"train_loss": -19.913114547729492, "global_step": 54080, "epoch": 651} {"train_loss": -20.064857482910156, "global_step": 54081, "epoch": 651} {"train_loss": -20.14435386657715, "global_step": 54082, "epoch": 651} {"train_loss": -20.12860107421875, "global_step": 54083, "epoch": 651} {"train_loss": -20.433271408081055, "global_step": 54084, "epoch": 651} {"train_loss": -19.949941635131836, "global_step": 54085, "epoch": 651} {"train_loss": -20.522165298461914, "global_step": 54086, "epoch": 651} {"train_loss": -20.0971736907959, "global_step": 54087, "epoch": 651} {"train_loss": -20.15923500061035, "global_step": 54088, "epoch": 651} {"train_loss": -20.359315872192383, "global_step": 54089, "epoch": 651} {"train_loss": -20.267623901367188, "global_step": 54090, "epoch": 651} {"train_loss": -20.338308334350586, "global_step": 54091, "epoch": 651} {"train_loss": -19.87958526611328, "global_step": 54092, "epoch": 651} {"train_loss": -20.412878036499023, "global_step": 54093, "epoch": 651} {"train_loss": -19.737363815307617, "global_step": 54094, "epoch": 651} {"train_loss": -19.990407943725586, "global_step": 54095, "epoch": 651} {"train_loss": -19.968521118164062, "global_step": 54096, "epoch": 651} {"train_loss": -20.046018600463867, "global_step": 54097, "epoch": 651} {"train_loss": -20.460615158081055, "global_step": 54098, "epoch": 651} {"train_loss": -19.89581298828125, "global_step": 54099, "epoch": 651} {"train_loss": -19.845319747924805, "global_step": 54100, "epoch": 651} {"train_loss": -19.923215866088867, "global_step": 54101, "epoch": 651} {"train_loss": -19.9112491607666, "global_step": 54102, "epoch": 651} {"train_loss": -20.334829330444336, "global_step": 54103, "epoch": 651} {"train_loss": -20.530162811279297, "global_step": 54104, "epoch": 651} {"train_loss": -20.049701690673828, "global_step": 54105, "epoch": 651} {"train_loss": -20.084388732910156, "global_step": 54106, "epoch": 651} {"train_loss": -20.414342880249023, "global_step": 54107, "epoch": 651} {"train_loss": -20.202972412109375, "global_step": 54108, "epoch": 651} {"train_loss": -19.991552352905273, "global_step": 54109, "epoch": 651} {"train_loss": -20.637836456298828, "global_step": 54110, "epoch": 651} {"train_loss": -20.270906448364258, "global_step": 54111, "epoch": 651} {"train_loss": -20.3663387298584, "global_step": 54112, "epoch": 651} {"train_loss": -20.07541275024414, "global_step": 54113, "epoch": 651} {"train_loss": -20.26886749267578, "global_step": 54114, "epoch": 651} {"train_loss": -20.09994945755924, "global_step": 54115, "epoch": 651, "val_loss": 6215234.0} {"train_loss": -18.284116744995117, "global_step": 54116, "epoch": 652} {"train_loss": -18.309167861938477, "global_step": 54117, "epoch": 652} {"train_loss": -19.876680374145508, "global_step": 54118, "epoch": 652} {"train_loss": -18.796920776367188, "global_step": 54119, "epoch": 652} {"train_loss": -18.754709243774414, "global_step": 54120, "epoch": 652} {"train_loss": -19.282211303710938, "global_step": 54121, "epoch": 652} {"train_loss": -19.742816925048828, "global_step": 54122, "epoch": 652} {"train_loss": -19.091886520385742, "global_step": 54123, "epoch": 652} {"train_loss": -18.921152114868164, "global_step": 54124, "epoch": 652} {"train_loss": -19.395132064819336, "global_step": 54125, "epoch": 652} {"train_loss": -19.170522689819336, "global_step": 54126, "epoch": 652} {"train_loss": -19.32210350036621, "global_step": 54127, "epoch": 652} {"train_loss": -19.628347396850586, "global_step": 54128, "epoch": 652} {"train_loss": -19.492570877075195, "global_step": 54129, "epoch": 652} {"train_loss": -19.637969970703125, "global_step": 54130, "epoch": 652} {"train_loss": -19.182477951049805, "global_step": 54131, "epoch": 652} {"train_loss": -19.45766258239746, "global_step": 54132, "epoch": 652} {"train_loss": -19.470815658569336, "global_step": 54133, "epoch": 652} {"train_loss": -19.570804595947266, "global_step": 54134, "epoch": 652} {"train_loss": -19.77760887145996, "global_step": 54135, "epoch": 652} {"train_loss": -19.367374420166016, "global_step": 54136, "epoch": 652} {"train_loss": -19.703763961791992, "global_step": 54137, "epoch": 652} {"train_loss": -19.571638107299805, "global_step": 54138, "epoch": 652} {"train_loss": -19.67386245727539, "global_step": 54139, "epoch": 652} {"train_loss": -19.624845504760742, "global_step": 54140, "epoch": 652} {"train_loss": -19.821739196777344, "global_step": 54141, "epoch": 652} {"train_loss": -19.768537521362305, "global_step": 54142, "epoch": 652} {"train_loss": -19.85402488708496, "global_step": 54143, "epoch": 652} {"train_loss": -19.744779586791992, "global_step": 54144, "epoch": 652} {"train_loss": -19.893054962158203, "global_step": 54145, "epoch": 652} {"train_loss": -19.639995574951172, "global_step": 54146, "epoch": 652} {"train_loss": -19.79123878479004, "global_step": 54147, "epoch": 652} {"train_loss": -20.197031021118164, "global_step": 54148, "epoch": 652} {"train_loss": -20.081396102905273, "global_step": 54149, "epoch": 652} {"train_loss": -19.762496948242188, "global_step": 54150, "epoch": 652} {"train_loss": -19.695959091186523, "global_step": 54151, "epoch": 652} {"train_loss": -19.98522186279297, "global_step": 54152, "epoch": 652} {"train_loss": -20.419435501098633, "global_step": 54153, "epoch": 652} {"train_loss": -20.245595932006836, "global_step": 54154, "epoch": 652} {"train_loss": -19.880491256713867, "global_step": 54155, "epoch": 652} {"train_loss": -20.031333923339844, "global_step": 54156, "epoch": 652} {"train_loss": -19.8548641204834, "global_step": 54157, "epoch": 652} {"train_loss": -20.070241928100586, "global_step": 54158, "epoch": 652} {"train_loss": -20.14261817932129, "global_step": 54159, "epoch": 652} {"train_loss": -20.100664138793945, "global_step": 54160, "epoch": 652} {"train_loss": -19.90287971496582, "global_step": 54161, "epoch": 652} {"train_loss": -20.2542724609375, "global_step": 54162, "epoch": 652} {"train_loss": -19.889057159423828, "global_step": 54163, "epoch": 652} {"train_loss": -20.20223045349121, "global_step": 54164, "epoch": 652} {"train_loss": -19.719160079956055, "global_step": 54165, "epoch": 652} {"train_loss": -20.170434951782227, "global_step": 54166, "epoch": 652} {"train_loss": -20.009096145629883, "global_step": 54167, "epoch": 652} {"train_loss": -19.9145450592041, "global_step": 54168, "epoch": 652} {"train_loss": -20.37265396118164, "global_step": 54169, "epoch": 652} {"train_loss": -20.207828521728516, "global_step": 54170, "epoch": 652} {"train_loss": -19.795093536376953, "global_step": 54171, "epoch": 652} {"train_loss": -20.548643112182617, "global_step": 54172, "epoch": 652} {"train_loss": -20.109437942504883, "global_step": 54173, "epoch": 652} {"train_loss": -19.589834213256836, "global_step": 54174, "epoch": 652} {"train_loss": -20.206449508666992, "global_step": 54175, "epoch": 652} {"train_loss": -20.00074577331543, "global_step": 54176, "epoch": 652} {"train_loss": -19.963191986083984, "global_step": 54177, "epoch": 652} {"train_loss": -20.15095329284668, "global_step": 54178, "epoch": 652} {"train_loss": -19.807729721069336, "global_step": 54179, "epoch": 652} {"train_loss": -20.217308044433594, "global_step": 54180, "epoch": 652} {"train_loss": -20.19719886779785, "global_step": 54181, "epoch": 652} {"train_loss": -20.40797233581543, "global_step": 54182, "epoch": 652} {"train_loss": -20.342737197875977, "global_step": 54183, "epoch": 652} {"train_loss": -19.73214340209961, "global_step": 54184, "epoch": 652} {"train_loss": -20.077789306640625, "global_step": 54185, "epoch": 652} {"train_loss": -20.05612564086914, "global_step": 54186, "epoch": 652} {"train_loss": -20.282485961914062, "global_step": 54187, "epoch": 652} {"train_loss": -19.87845802307129, "global_step": 54188, "epoch": 652} {"train_loss": -19.646177291870117, "global_step": 54189, "epoch": 652} {"train_loss": -20.18564224243164, "global_step": 54190, "epoch": 652} {"train_loss": -19.904529571533203, "global_step": 54191, "epoch": 652} {"train_loss": -19.99527359008789, "global_step": 54192, "epoch": 652} {"train_loss": -19.48093605041504, "global_step": 54193, "epoch": 652} {"train_loss": -20.20107650756836, "global_step": 54194, "epoch": 652} {"train_loss": -20.0534725189209, "global_step": 54195, "epoch": 652} {"train_loss": -20.315759658813477, "global_step": 54196, "epoch": 652} {"train_loss": -20.31233024597168, "global_step": 54197, "epoch": 652} {"train_loss": -19.79088231741664, "global_step": 54198, "epoch": 652, "val_loss": 6068293.0} {"train_loss": -19.01203727722168, "global_step": 54199, "epoch": 653} {"train_loss": -20.271728515625, "global_step": 54200, "epoch": 653} {"train_loss": -19.419994354248047, "global_step": 54201, "epoch": 653} {"train_loss": -20.00282096862793, "global_step": 54202, "epoch": 653} {"train_loss": -20.282434463500977, "global_step": 54203, "epoch": 653} {"train_loss": -19.926284790039062, "global_step": 54204, "epoch": 653} {"train_loss": -19.90041160583496, "global_step": 54205, "epoch": 653} {"train_loss": -19.831632614135742, "global_step": 54206, "epoch": 653} {"train_loss": -20.212839126586914, "global_step": 54207, "epoch": 653} {"train_loss": -20.045320510864258, "global_step": 54208, "epoch": 653} {"train_loss": -20.396949768066406, "global_step": 54209, "epoch": 653} {"train_loss": -20.059736251831055, "global_step": 54210, "epoch": 653} {"train_loss": -19.727352142333984, "global_step": 54211, "epoch": 653} {"train_loss": -19.996238708496094, "global_step": 54212, "epoch": 653} {"train_loss": -19.911413192749023, "global_step": 54213, "epoch": 653} {"train_loss": -20.176679611206055, "global_step": 54214, "epoch": 653} {"train_loss": -20.11463737487793, "global_step": 54215, "epoch": 653} {"train_loss": -19.99598503112793, "global_step": 54216, "epoch": 653} {"train_loss": -20.128942489624023, "global_step": 54217, "epoch": 653} {"train_loss": -20.288427352905273, "global_step": 54218, "epoch": 653} {"train_loss": -20.098310470581055, "global_step": 54219, "epoch": 653} {"train_loss": -20.271093368530273, "global_step": 54220, "epoch": 653} {"train_loss": -20.1567440032959, "global_step": 54221, "epoch": 653} {"train_loss": -20.268829345703125, "global_step": 54222, "epoch": 653} {"train_loss": -20.126848220825195, "global_step": 54223, "epoch": 653} {"train_loss": -20.341983795166016, "global_step": 54224, "epoch": 653} {"train_loss": -20.246688842773438, "global_step": 54225, "epoch": 653} {"train_loss": -20.2347354888916, "global_step": 54226, "epoch": 653} {"train_loss": -20.349821090698242, "global_step": 54227, "epoch": 653} {"train_loss": -20.146865844726562, "global_step": 54228, "epoch": 653} {"train_loss": -20.437448501586914, "global_step": 54229, "epoch": 653} {"train_loss": -19.981321334838867, "global_step": 54230, "epoch": 653} {"train_loss": -20.471975326538086, "global_step": 54231, "epoch": 653} {"train_loss": -19.66887664794922, "global_step": 54232, "epoch": 653} {"train_loss": -20.167213439941406, "global_step": 54233, "epoch": 653} {"train_loss": -20.068269729614258, "global_step": 54234, "epoch": 653} {"train_loss": -20.306564331054688, "global_step": 54235, "epoch": 653} {"train_loss": -19.88521385192871, "global_step": 54236, "epoch": 653} {"train_loss": -20.041086196899414, "global_step": 54237, "epoch": 653} {"train_loss": -20.092870712280273, "global_step": 54238, "epoch": 653} {"train_loss": -20.07831382751465, "global_step": 54239, "epoch": 653} {"train_loss": -19.912118911743164, "global_step": 54240, "epoch": 653} {"train_loss": -20.322851181030273, "global_step": 54241, "epoch": 653} {"train_loss": -20.180612564086914, "global_step": 54242, "epoch": 653} {"train_loss": -20.33501625061035, "global_step": 54243, "epoch": 653} {"train_loss": -20.136377334594727, "global_step": 54244, "epoch": 653} {"train_loss": -20.11383628845215, "global_step": 54245, "epoch": 653} {"train_loss": -20.1146297454834, "global_step": 54246, "epoch": 653} {"train_loss": -20.21192741394043, "global_step": 54247, "epoch": 653} {"train_loss": -20.431621551513672, "global_step": 54248, "epoch": 653} {"train_loss": -20.453901290893555, "global_step": 54249, "epoch": 653} {"train_loss": -20.047143936157227, "global_step": 54250, "epoch": 653} {"train_loss": -20.396148681640625, "global_step": 54251, "epoch": 653} {"train_loss": -19.752004623413086, "global_step": 54252, "epoch": 653} {"train_loss": -20.1742000579834, "global_step": 54253, "epoch": 653} {"train_loss": -20.276845932006836, "global_step": 54254, "epoch": 653} {"train_loss": -19.990999221801758, "global_step": 54255, "epoch": 653} {"train_loss": -20.205183029174805, "global_step": 54256, "epoch": 653} {"train_loss": -20.072174072265625, "global_step": 54257, "epoch": 653} {"train_loss": -20.361371994018555, "global_step": 54258, "epoch": 653} {"train_loss": -20.481306076049805, "global_step": 54259, "epoch": 653} {"train_loss": -20.232454299926758, "global_step": 54260, "epoch": 653} {"train_loss": -20.194129943847656, "global_step": 54261, "epoch": 653} {"train_loss": -20.282102584838867, "global_step": 54262, "epoch": 653} {"train_loss": -20.114561080932617, "global_step": 54263, "epoch": 653} {"train_loss": -20.287458419799805, "global_step": 54264, "epoch": 653} {"train_loss": -20.1002140045166, "global_step": 54265, "epoch": 653} {"train_loss": -19.994531631469727, "global_step": 54266, "epoch": 653} {"train_loss": -20.210058212280273, "global_step": 54267, "epoch": 653} {"train_loss": -20.074552536010742, "global_step": 54268, "epoch": 653} {"train_loss": -20.210214614868164, "global_step": 54269, "epoch": 653} {"train_loss": -20.08086585998535, "global_step": 54270, "epoch": 653} {"train_loss": -20.0555477142334, "global_step": 54271, "epoch": 653} {"train_loss": -19.950651168823242, "global_step": 54272, "epoch": 653} {"train_loss": -20.308034896850586, "global_step": 54273, "epoch": 653} {"train_loss": -20.083072662353516, "global_step": 54274, "epoch": 653} {"train_loss": -20.33097267150879, "global_step": 54275, "epoch": 653} {"train_loss": -20.226322174072266, "global_step": 54276, "epoch": 653} {"train_loss": -19.898937225341797, "global_step": 54277, "epoch": 653} {"train_loss": -20.562292098999023, "global_step": 54278, "epoch": 653} {"train_loss": -19.834882736206055, "global_step": 54279, "epoch": 653} {"train_loss": -20.250642776489258, "global_step": 54280, "epoch": 653} {"train_loss": -20.1240423501256, "global_step": 54281, "epoch": 653, "val_loss": 6214645.0} {"train_loss": -18.9151554107666, "global_step": 54282, "epoch": 654} {"train_loss": -19.12836456298828, "global_step": 54283, "epoch": 654} {"train_loss": -19.734472274780273, "global_step": 54284, "epoch": 654} {"train_loss": -19.721837997436523, "global_step": 54285, "epoch": 654} {"train_loss": -19.896703720092773, "global_step": 54286, "epoch": 654} {"train_loss": -19.874067306518555, "global_step": 54287, "epoch": 654} {"train_loss": -19.943395614624023, "global_step": 54288, "epoch": 654} {"train_loss": -19.656240463256836, "global_step": 54289, "epoch": 654} {"train_loss": -19.718547821044922, "global_step": 54290, "epoch": 654} {"train_loss": -19.9768123626709, "global_step": 54291, "epoch": 654} {"train_loss": -19.87565040588379, "global_step": 54292, "epoch": 654} {"train_loss": -19.996179580688477, "global_step": 54293, "epoch": 654} {"train_loss": -19.30795669555664, "global_step": 54294, "epoch": 654} {"train_loss": -19.962337493896484, "global_step": 54295, "epoch": 654} {"train_loss": -19.907081604003906, "global_step": 54296, "epoch": 654} {"train_loss": -19.618223190307617, "global_step": 54297, "epoch": 654} {"train_loss": -20.121536254882812, "global_step": 54298, "epoch": 654} {"train_loss": -19.906423568725586, "global_step": 54299, "epoch": 654} {"train_loss": -20.180158615112305, "global_step": 54300, "epoch": 654} {"train_loss": -19.7569522857666, "global_step": 54301, "epoch": 654} {"train_loss": -19.994871139526367, "global_step": 54302, "epoch": 654} {"train_loss": -19.75660514831543, "global_step": 54303, "epoch": 654} {"train_loss": -20.250341415405273, "global_step": 54304, "epoch": 654} {"train_loss": -19.800352096557617, "global_step": 54305, "epoch": 654} {"train_loss": -19.908145904541016, "global_step": 54306, "epoch": 654} {"train_loss": -20.357187271118164, "global_step": 54307, "epoch": 654} {"train_loss": -19.947248458862305, "global_step": 54308, "epoch": 654} {"train_loss": -20.352659225463867, "global_step": 54309, "epoch": 654} {"train_loss": -19.991769790649414, "global_step": 54310, "epoch": 654} {"train_loss": -20.15042495727539, "global_step": 54311, "epoch": 654} {"train_loss": -20.17742347717285, "global_step": 54312, "epoch": 654} {"train_loss": -19.87595558166504, "global_step": 54313, "epoch": 654} {"train_loss": -20.112485885620117, "global_step": 54314, "epoch": 654} {"train_loss": -19.95118522644043, "global_step": 54315, "epoch": 654} {"train_loss": -20.501001358032227, "global_step": 54316, "epoch": 654} {"train_loss": -20.39972496032715, "global_step": 54317, "epoch": 654} {"train_loss": -19.780624389648438, "global_step": 54318, "epoch": 654} {"train_loss": -19.792922973632812, "global_step": 54319, "epoch": 654} {"train_loss": -20.054672241210938, "global_step": 54320, "epoch": 654} {"train_loss": -20.0687313079834, "global_step": 54321, "epoch": 654} {"train_loss": -19.965578079223633, "global_step": 54322, "epoch": 654} {"train_loss": -20.213346481323242, "global_step": 54323, "epoch": 654} {"train_loss": -19.990270614624023, "global_step": 54324, "epoch": 654} {"train_loss": -20.23457908630371, "global_step": 54325, "epoch": 654} {"train_loss": -20.33432388305664, "global_step": 54326, "epoch": 654} {"train_loss": -20.063453674316406, "global_step": 54327, "epoch": 654} {"train_loss": -20.304035186767578, "global_step": 54328, "epoch": 654} {"train_loss": -20.056049346923828, "global_step": 54329, "epoch": 654} {"train_loss": -20.18611717224121, "global_step": 54330, "epoch": 654} {"train_loss": -20.082170486450195, "global_step": 54331, "epoch": 654} {"train_loss": -19.774885177612305, "global_step": 54332, "epoch": 654} {"train_loss": -20.034475326538086, "global_step": 54333, "epoch": 654} {"train_loss": -20.273883819580078, "global_step": 54334, "epoch": 654} {"train_loss": -20.155227661132812, "global_step": 54335, "epoch": 654} {"train_loss": -20.672311782836914, "global_step": 54336, "epoch": 654} {"train_loss": -20.163516998291016, "global_step": 54337, "epoch": 654} {"train_loss": -20.525497436523438, "global_step": 54338, "epoch": 654} {"train_loss": -20.57806396484375, "global_step": 54339, "epoch": 654} {"train_loss": -20.31545066833496, "global_step": 54340, "epoch": 654} {"train_loss": -20.44923210144043, "global_step": 54341, "epoch": 654} {"train_loss": -20.18228530883789, "global_step": 54342, "epoch": 654} {"train_loss": -20.01730728149414, "global_step": 54343, "epoch": 654} {"train_loss": -19.8247127532959, "global_step": 54344, "epoch": 654} {"train_loss": -20.381696701049805, "global_step": 54345, "epoch": 654} {"train_loss": -20.019906997680664, "global_step": 54346, "epoch": 654} {"train_loss": -20.032703399658203, "global_step": 54347, "epoch": 654} {"train_loss": -20.051530838012695, "global_step": 54348, "epoch": 654} {"train_loss": -19.944686889648438, "global_step": 54349, "epoch": 654} {"train_loss": -20.338552474975586, "global_step": 54350, "epoch": 654} {"train_loss": -19.971017837524414, "global_step": 54351, "epoch": 654} {"train_loss": -20.33852195739746, "global_step": 54352, "epoch": 654} {"train_loss": -20.1656494140625, "global_step": 54353, "epoch": 654} {"train_loss": -20.265722274780273, "global_step": 54354, "epoch": 654} {"train_loss": -19.967973709106445, "global_step": 54355, "epoch": 654} {"train_loss": -20.44202423095703, "global_step": 54356, "epoch": 654} {"train_loss": -20.041133880615234, "global_step": 54357, "epoch": 654} {"train_loss": -20.089080810546875, "global_step": 54358, "epoch": 654} {"train_loss": -20.71290397644043, "global_step": 54359, "epoch": 654} {"train_loss": -19.587427139282227, "global_step": 54360, "epoch": 654} {"train_loss": -20.49097442626953, "global_step": 54361, "epoch": 654} {"train_loss": -20.42201042175293, "global_step": 54362, "epoch": 654} {"train_loss": -19.969499588012695, "global_step": 54363, "epoch": 654} {"train_loss": -20.04895139027791, "global_step": 54364, "epoch": 654, "val_loss": 6096602.0} {"train_loss": -19.80670738220215, "global_step": 54365, "epoch": 655} {"train_loss": -19.62004852294922, "global_step": 54366, "epoch": 655} {"train_loss": -20.09828758239746, "global_step": 54367, "epoch": 655} {"train_loss": -20.331472396850586, "global_step": 54368, "epoch": 655} {"train_loss": -20.565723419189453, "global_step": 54369, "epoch": 655} {"train_loss": -20.26410484313965, "global_step": 54370, "epoch": 655} {"train_loss": -20.353891372680664, "global_step": 54371, "epoch": 655} {"train_loss": -20.153928756713867, "global_step": 54372, "epoch": 655} {"train_loss": -19.641597747802734, "global_step": 54373, "epoch": 655} {"train_loss": -20.056411743164062, "global_step": 54374, "epoch": 655} {"train_loss": -19.817157745361328, "global_step": 54375, "epoch": 655} {"train_loss": -19.899932861328125, "global_step": 54376, "epoch": 655} {"train_loss": -19.98952293395996, "global_step": 54377, "epoch": 655} {"train_loss": -20.07718276977539, "global_step": 54378, "epoch": 655} {"train_loss": -20.004592895507812, "global_step": 54379, "epoch": 655} {"train_loss": -19.6702938079834, "global_step": 54380, "epoch": 655} {"train_loss": -19.81746482849121, "global_step": 54381, "epoch": 655} {"train_loss": -20.38397979736328, "global_step": 54382, "epoch": 655} {"train_loss": -20.172704696655273, "global_step": 54383, "epoch": 655} {"train_loss": -20.42933464050293, "global_step": 54384, "epoch": 655} {"train_loss": -20.270038604736328, "global_step": 54385, "epoch": 655} {"train_loss": -19.87165641784668, "global_step": 54386, "epoch": 655} {"train_loss": -20.050649642944336, "global_step": 54387, "epoch": 655} {"train_loss": -19.969629287719727, "global_step": 54388, "epoch": 655} {"train_loss": -20.295093536376953, "global_step": 54389, "epoch": 655} {"train_loss": -19.73537826538086, "global_step": 54390, "epoch": 655} {"train_loss": -19.968120574951172, "global_step": 54391, "epoch": 655} {"train_loss": -19.937021255493164, "global_step": 54392, "epoch": 655} {"train_loss": -20.228551864624023, "global_step": 54393, "epoch": 655} {"train_loss": -20.532140731811523, "global_step": 54394, "epoch": 655} {"train_loss": -20.26091957092285, "global_step": 54395, "epoch": 655} {"train_loss": -19.78266716003418, "global_step": 54396, "epoch": 655} {"train_loss": -20.041810989379883, "global_step": 54397, "epoch": 655} {"train_loss": -19.990102767944336, "global_step": 54398, "epoch": 655} {"train_loss": -20.350370407104492, "global_step": 54399, "epoch": 655} {"train_loss": -20.31568717956543, "global_step": 54400, "epoch": 655} {"train_loss": -20.172521591186523, "global_step": 54401, "epoch": 655} {"train_loss": -20.390336990356445, "global_step": 54402, "epoch": 655} {"train_loss": -20.00554656982422, "global_step": 54403, "epoch": 655} {"train_loss": -20.0670166015625, "global_step": 54404, "epoch": 655} {"train_loss": -20.0648250579834, "global_step": 54405, "epoch": 655} {"train_loss": -20.281574249267578, "global_step": 54406, "epoch": 655} {"train_loss": -20.14124870300293, "global_step": 54407, "epoch": 655} {"train_loss": -19.874122619628906, "global_step": 54408, "epoch": 655} {"train_loss": -20.473081588745117, "global_step": 54409, "epoch": 655} {"train_loss": -20.163772583007812, "global_step": 54410, "epoch": 655} {"train_loss": -20.069395065307617, "global_step": 54411, "epoch": 655} {"train_loss": -20.425607681274414, "global_step": 54412, "epoch": 655} {"train_loss": -20.214059829711914, "global_step": 54413, "epoch": 655} {"train_loss": -20.435117721557617, "global_step": 54414, "epoch": 655} {"train_loss": -20.449026107788086, "global_step": 54415, "epoch": 655} {"train_loss": -20.209997177124023, "global_step": 54416, "epoch": 655} {"train_loss": -20.033472061157227, "global_step": 54417, "epoch": 655} {"train_loss": -20.308609008789062, "global_step": 54418, "epoch": 655} {"train_loss": -19.826766967773438, "global_step": 54419, "epoch": 655} {"train_loss": -20.28583526611328, "global_step": 54420, "epoch": 655} {"train_loss": -20.315332412719727, "global_step": 54421, "epoch": 655} {"train_loss": -20.19781494140625, "global_step": 54422, "epoch": 655} {"train_loss": -20.19862937927246, "global_step": 54423, "epoch": 655} {"train_loss": -20.374101638793945, "global_step": 54424, "epoch": 655} {"train_loss": -19.971593856811523, "global_step": 54425, "epoch": 655} {"train_loss": -20.20880889892578, "global_step": 54426, "epoch": 655} {"train_loss": -20.102354049682617, "global_step": 54427, "epoch": 655} {"train_loss": -19.842275619506836, "global_step": 54428, "epoch": 655} {"train_loss": -20.013164520263672, "global_step": 54429, "epoch": 655} {"train_loss": -20.475507736206055, "global_step": 54430, "epoch": 655} {"train_loss": -20.098129272460938, "global_step": 54431, "epoch": 655} {"train_loss": -19.9238338470459, "global_step": 54432, "epoch": 655} {"train_loss": -20.248123168945312, "global_step": 54433, "epoch": 655} {"train_loss": -19.842979431152344, "global_step": 54434, "epoch": 655} {"train_loss": -20.40029525756836, "global_step": 54435, "epoch": 655} {"train_loss": -20.450069427490234, "global_step": 54436, "epoch": 655} {"train_loss": -20.059837341308594, "global_step": 54437, "epoch": 655} {"train_loss": -20.388622283935547, "global_step": 54438, "epoch": 655} {"train_loss": -20.08537483215332, "global_step": 54439, "epoch": 655} {"train_loss": -20.25602149963379, "global_step": 54440, "epoch": 655} {"train_loss": -20.553131103515625, "global_step": 54441, "epoch": 655} {"train_loss": -20.2755069732666, "global_step": 54442, "epoch": 655} {"train_loss": -20.329605102539062, "global_step": 54443, "epoch": 655} {"train_loss": -20.536203384399414, "global_step": 54444, "epoch": 655} {"train_loss": -19.938241958618164, "global_step": 54445, "epoch": 655} {"train_loss": -20.080461502075195, "global_step": 54446, "epoch": 655} {"train_loss": -20.150561780814666, "global_step": 54447, "epoch": 655, "val_loss": 6107469.0} {"train_loss": -19.334835052490234, "global_step": 54448, "epoch": 656} {"train_loss": -19.3154239654541, "global_step": 54449, "epoch": 656} {"train_loss": -20.204843521118164, "global_step": 54450, "epoch": 656} {"train_loss": -19.530227661132812, "global_step": 54451, "epoch": 656} {"train_loss": -19.8802490234375, "global_step": 54452, "epoch": 656} {"train_loss": -19.8132266998291, "global_step": 54453, "epoch": 656} {"train_loss": -19.887102127075195, "global_step": 54454, "epoch": 656} {"train_loss": -20.082401275634766, "global_step": 54455, "epoch": 656} {"train_loss": -20.13623046875, "global_step": 54456, "epoch": 656} {"train_loss": -19.85426139831543, "global_step": 54457, "epoch": 656} {"train_loss": -19.639591217041016, "global_step": 54458, "epoch": 656} {"train_loss": -20.1043643951416, "global_step": 54459, "epoch": 656} {"train_loss": -20.14133644104004, "global_step": 54460, "epoch": 656} {"train_loss": -20.117450714111328, "global_step": 54461, "epoch": 656} {"train_loss": -19.871158599853516, "global_step": 54462, "epoch": 656} {"train_loss": -19.958784103393555, "global_step": 54463, "epoch": 656} {"train_loss": -20.273656845092773, "global_step": 54464, "epoch": 656} {"train_loss": -20.146549224853516, "global_step": 54465, "epoch": 656} {"train_loss": -20.1726131439209, "global_step": 54466, "epoch": 656} {"train_loss": -19.965238571166992, "global_step": 54467, "epoch": 656} {"train_loss": -19.729856491088867, "global_step": 54468, "epoch": 656} {"train_loss": -20.1846981048584, "global_step": 54469, "epoch": 656} {"train_loss": -20.178396224975586, "global_step": 54470, "epoch": 656} {"train_loss": -20.34535789489746, "global_step": 54471, "epoch": 656} {"train_loss": -20.1052188873291, "global_step": 54472, "epoch": 656} {"train_loss": -20.014266967773438, "global_step": 54473, "epoch": 656} {"train_loss": -20.087888717651367, "global_step": 54474, "epoch": 656} {"train_loss": -19.88237953186035, "global_step": 54475, "epoch": 656} {"train_loss": -20.377582550048828, "global_step": 54476, "epoch": 656} {"train_loss": -20.240209579467773, "global_step": 54477, "epoch": 656} {"train_loss": -20.158613204956055, "global_step": 54478, "epoch": 656} {"train_loss": -20.55193328857422, "global_step": 54479, "epoch": 656} {"train_loss": -20.20692253112793, "global_step": 54480, "epoch": 656} {"train_loss": -20.27667808532715, "global_step": 54481, "epoch": 656} {"train_loss": -20.2469539642334, "global_step": 54482, "epoch": 656} {"train_loss": -20.23494529724121, "global_step": 54483, "epoch": 656} {"train_loss": -20.20151138305664, "global_step": 54484, "epoch": 656} {"train_loss": -20.289220809936523, "global_step": 54485, "epoch": 656} {"train_loss": -20.04659080505371, "global_step": 54486, "epoch": 656} {"train_loss": -20.012672424316406, "global_step": 54487, "epoch": 656} {"train_loss": -19.828088760375977, "global_step": 54488, "epoch": 656} {"train_loss": -20.1235408782959, "global_step": 54489, "epoch": 656} {"train_loss": -20.214202880859375, "global_step": 54490, "epoch": 656} {"train_loss": -19.73558235168457, "global_step": 54491, "epoch": 656} {"train_loss": -20.3465633392334, "global_step": 54492, "epoch": 656} {"train_loss": -19.918676376342773, "global_step": 54493, "epoch": 656} {"train_loss": -19.976337432861328, "global_step": 54494, "epoch": 656} {"train_loss": -19.902042388916016, "global_step": 54495, "epoch": 656} {"train_loss": -19.84716796875, "global_step": 54496, "epoch": 656} {"train_loss": -20.329082489013672, "global_step": 54497, "epoch": 656} {"train_loss": -20.288366317749023, "global_step": 54498, "epoch": 656} {"train_loss": -20.251110076904297, "global_step": 54499, "epoch": 656} {"train_loss": -20.216459274291992, "global_step": 54500, "epoch": 656} {"train_loss": -20.21199607849121, "global_step": 54501, "epoch": 656} {"train_loss": -20.516311645507812, "global_step": 54502, "epoch": 656} {"train_loss": -20.177783966064453, "global_step": 54503, "epoch": 656} {"train_loss": -20.6633243560791, "global_step": 54504, "epoch": 656} {"train_loss": -20.377429962158203, "global_step": 54505, "epoch": 656} {"train_loss": -20.10977554321289, "global_step": 54506, "epoch": 656} {"train_loss": -20.494855880737305, "global_step": 54507, "epoch": 656} {"train_loss": -20.291650772094727, "global_step": 54508, "epoch": 656} {"train_loss": -20.195104598999023, "global_step": 54509, "epoch": 656} {"train_loss": -19.86322593688965, "global_step": 54510, "epoch": 656} {"train_loss": -19.917695999145508, "global_step": 54511, "epoch": 656} {"train_loss": -20.262104034423828, "global_step": 54512, "epoch": 656} {"train_loss": -20.146472930908203, "global_step": 54513, "epoch": 656} {"train_loss": -20.041635513305664, "global_step": 54514, "epoch": 656} {"train_loss": -20.082603454589844, "global_step": 54515, "epoch": 656} {"train_loss": -20.014551162719727, "global_step": 54516, "epoch": 656} {"train_loss": -20.24859619140625, "global_step": 54517, "epoch": 656} {"train_loss": -20.022558212280273, "global_step": 54518, "epoch": 656} {"train_loss": -20.114395141601562, "global_step": 54519, "epoch": 656} {"train_loss": -20.292579650878906, "global_step": 54520, "epoch": 656} {"train_loss": -20.229219436645508, "global_step": 54521, "epoch": 656} {"train_loss": -20.35307502746582, "global_step": 54522, "epoch": 656} {"train_loss": -20.209232330322266, "global_step": 54523, "epoch": 656} {"train_loss": -19.7545223236084, "global_step": 54524, "epoch": 656} {"train_loss": -19.813980102539062, "global_step": 54525, "epoch": 656} {"train_loss": -20.237531661987305, "global_step": 54526, "epoch": 656} {"train_loss": -20.165904998779297, "global_step": 54527, "epoch": 656} {"train_loss": -19.85093116760254, "global_step": 54528, "epoch": 656} {"train_loss": -19.839466094970703, "global_step": 54529, "epoch": 656} {"train_loss": -20.096057156482374, "global_step": 54530, "epoch": 656, "val_loss": 5991145.0} {"train_loss": -18.94440269470215, "global_step": 54531, "epoch": 657} {"train_loss": -19.71605682373047, "global_step": 54532, "epoch": 657} {"train_loss": -19.271114349365234, "global_step": 54533, "epoch": 657} {"train_loss": -19.802064895629883, "global_step": 54534, "epoch": 657} {"train_loss": -19.853618621826172, "global_step": 54535, "epoch": 657} {"train_loss": -19.967548370361328, "global_step": 54536, "epoch": 657} {"train_loss": -20.02802848815918, "global_step": 54537, "epoch": 657} {"train_loss": -19.73176383972168, "global_step": 54538, "epoch": 657} {"train_loss": -19.989248275756836, "global_step": 54539, "epoch": 657} {"train_loss": -19.468185424804688, "global_step": 54540, "epoch": 657} {"train_loss": -20.12029457092285, "global_step": 54541, "epoch": 657} {"train_loss": -20.043325424194336, "global_step": 54542, "epoch": 657} {"train_loss": -20.20417022705078, "global_step": 54543, "epoch": 657} {"train_loss": -19.954113006591797, "global_step": 54544, "epoch": 657} {"train_loss": -20.029104232788086, "global_step": 54545, "epoch": 657} {"train_loss": -20.186941146850586, "global_step": 54546, "epoch": 657} {"train_loss": -19.908409118652344, "global_step": 54547, "epoch": 657} {"train_loss": -20.077274322509766, "global_step": 54548, "epoch": 657} {"train_loss": -19.786306381225586, "global_step": 54549, "epoch": 657} {"train_loss": -19.869281768798828, "global_step": 54550, "epoch": 657} {"train_loss": -19.799306869506836, "global_step": 54551, "epoch": 657} {"train_loss": -19.755783081054688, "global_step": 54552, "epoch": 657} {"train_loss": -19.882619857788086, "global_step": 54553, "epoch": 657} {"train_loss": -20.349428176879883, "global_step": 54554, "epoch": 657} {"train_loss": -19.9886531829834, "global_step": 54555, "epoch": 657} {"train_loss": -20.365781784057617, "global_step": 54556, "epoch": 657} {"train_loss": -19.924840927124023, "global_step": 54557, "epoch": 657} {"train_loss": -19.592453002929688, "global_step": 54558, "epoch": 657} {"train_loss": -20.156997680664062, "global_step": 54559, "epoch": 657} {"train_loss": -20.049280166625977, "global_step": 54560, "epoch": 657} {"train_loss": -20.13277244567871, "global_step": 54561, "epoch": 657} {"train_loss": -20.19738006591797, "global_step": 54562, "epoch": 657} {"train_loss": -20.107643127441406, "global_step": 54563, "epoch": 657} {"train_loss": -20.346059799194336, "global_step": 54564, "epoch": 657} {"train_loss": -20.26361846923828, "global_step": 54565, "epoch": 657} {"train_loss": -20.26899528503418, "global_step": 54566, "epoch": 657} {"train_loss": -20.160932540893555, "global_step": 54567, "epoch": 657} {"train_loss": -20.51175880432129, "global_step": 54568, "epoch": 657} {"train_loss": -19.954984664916992, "global_step": 54569, "epoch": 657} {"train_loss": -20.04384422302246, "global_step": 54570, "epoch": 657} {"train_loss": -20.039779663085938, "global_step": 54571, "epoch": 657} {"train_loss": -20.249404907226562, "global_step": 54572, "epoch": 657} {"train_loss": -20.40152931213379, "global_step": 54573, "epoch": 657} {"train_loss": -20.162338256835938, "global_step": 54574, "epoch": 657} {"train_loss": -20.041833877563477, "global_step": 54575, "epoch": 657} {"train_loss": -19.940956115722656, "global_step": 54576, "epoch": 657} {"train_loss": -20.0701847076416, "global_step": 54577, "epoch": 657} {"train_loss": -20.00192642211914, "global_step": 54578, "epoch": 657} {"train_loss": -20.139738082885742, "global_step": 54579, "epoch": 657} {"train_loss": -20.309326171875, "global_step": 54580, "epoch": 657} {"train_loss": -20.307418823242188, "global_step": 54581, "epoch": 657} {"train_loss": -20.374736785888672, "global_step": 54582, "epoch": 657} {"train_loss": -20.26346206665039, "global_step": 54583, "epoch": 657} {"train_loss": -20.190366744995117, "global_step": 54584, "epoch": 657} {"train_loss": -20.023395538330078, "global_step": 54585, "epoch": 657} {"train_loss": -20.266368865966797, "global_step": 54586, "epoch": 657} {"train_loss": -19.985280990600586, "global_step": 54587, "epoch": 657} {"train_loss": -19.971179962158203, "global_step": 54588, "epoch": 657} {"train_loss": -19.845022201538086, "global_step": 54589, "epoch": 657} {"train_loss": -20.4183406829834, "global_step": 54590, "epoch": 657} {"train_loss": -20.091217041015625, "global_step": 54591, "epoch": 657} {"train_loss": -20.08184814453125, "global_step": 54592, "epoch": 657} {"train_loss": -20.234079360961914, "global_step": 54593, "epoch": 657} {"train_loss": -19.90364646911621, "global_step": 54594, "epoch": 657} {"train_loss": -20.69685935974121, "global_step": 54595, "epoch": 657} {"train_loss": -20.067811965942383, "global_step": 54596, "epoch": 657} {"train_loss": -20.406509399414062, "global_step": 54597, "epoch": 657} {"train_loss": -20.155258178710938, "global_step": 54598, "epoch": 657} {"train_loss": -20.235767364501953, "global_step": 54599, "epoch": 657} {"train_loss": -20.125837326049805, "global_step": 54600, "epoch": 657} {"train_loss": -20.4119815826416, "global_step": 54601, "epoch": 657} {"train_loss": -20.067821502685547, "global_step": 54602, "epoch": 657} {"train_loss": -20.195343017578125, "global_step": 54603, "epoch": 657} {"train_loss": -20.13037109375, "global_step": 54604, "epoch": 657} {"train_loss": -20.401216506958008, "global_step": 54605, "epoch": 657} {"train_loss": -19.995685577392578, "global_step": 54606, "epoch": 657} {"train_loss": -20.107534408569336, "global_step": 54607, "epoch": 657} {"train_loss": -20.45222282409668, "global_step": 54608, "epoch": 657} {"train_loss": -19.955568313598633, "global_step": 54609, "epoch": 657} {"train_loss": -20.387081146240234, "global_step": 54610, "epoch": 657} {"train_loss": -20.47371482849121, "global_step": 54611, "epoch": 657} {"train_loss": -20.508636474609375, "global_step": 54612, "epoch": 657} {"train_loss": -20.09471194715385, "global_step": 54613, "epoch": 657, "val_loss": 5991448.0} {"train_loss": -19.952749252319336, "global_step": 54614, "epoch": 658} {"train_loss": -20.051076889038086, "global_step": 54615, "epoch": 658} {"train_loss": -19.82038116455078, "global_step": 54616, "epoch": 658} {"train_loss": -20.148361206054688, "global_step": 54617, "epoch": 658} {"train_loss": -19.94162368774414, "global_step": 54618, "epoch": 658} {"train_loss": -20.240182876586914, "global_step": 54619, "epoch": 658} {"train_loss": -20.381887435913086, "global_step": 54620, "epoch": 658} {"train_loss": -20.039579391479492, "global_step": 54621, "epoch": 658} {"train_loss": -20.18853759765625, "global_step": 54622, "epoch": 658} {"train_loss": -20.23701286315918, "global_step": 54623, "epoch": 658} {"train_loss": -20.283079147338867, "global_step": 54624, "epoch": 658} {"train_loss": -20.25541877746582, "global_step": 54625, "epoch": 658} {"train_loss": -19.95395278930664, "global_step": 54626, "epoch": 658} {"train_loss": -20.194120407104492, "global_step": 54627, "epoch": 658} {"train_loss": -20.33193588256836, "global_step": 54628, "epoch": 658} {"train_loss": -20.226852416992188, "global_step": 54629, "epoch": 658} {"train_loss": -20.0135555267334, "global_step": 54630, "epoch": 658} {"train_loss": -20.282123565673828, "global_step": 54631, "epoch": 658} {"train_loss": -20.29343032836914, "global_step": 54632, "epoch": 658} {"train_loss": -20.106197357177734, "global_step": 54633, "epoch": 658} {"train_loss": -20.098220825195312, "global_step": 54634, "epoch": 658} {"train_loss": -20.078033447265625, "global_step": 54635, "epoch": 658} {"train_loss": -19.8218994140625, "global_step": 54636, "epoch": 658} {"train_loss": -19.444580078125, "global_step": 54637, "epoch": 658} {"train_loss": -20.26827049255371, "global_step": 54638, "epoch": 658} {"train_loss": -20.19277000427246, "global_step": 54639, "epoch": 658} {"train_loss": -20.164295196533203, "global_step": 54640, "epoch": 658} {"train_loss": -20.3799991607666, "global_step": 54641, "epoch": 658} {"train_loss": -20.089624404907227, "global_step": 54642, "epoch": 658} {"train_loss": -20.23685073852539, "global_step": 54643, "epoch": 658} {"train_loss": -20.143308639526367, "global_step": 54644, "epoch": 658} {"train_loss": -19.864206314086914, "global_step": 54645, "epoch": 658} {"train_loss": -20.42110252380371, "global_step": 54646, "epoch": 658} {"train_loss": -19.802780151367188, "global_step": 54647, "epoch": 658} {"train_loss": -20.526592254638672, "global_step": 54648, "epoch": 658} {"train_loss": -19.959856033325195, "global_step": 54649, "epoch": 658} {"train_loss": -19.990692138671875, "global_step": 54650, "epoch": 658} {"train_loss": -19.93329429626465, "global_step": 54651, "epoch": 658} {"train_loss": -20.26621437072754, "global_step": 54652, "epoch": 658} {"train_loss": -20.18657112121582, "global_step": 54653, "epoch": 658} {"train_loss": -20.13106346130371, "global_step": 54654, "epoch": 658} {"train_loss": -19.995569229125977, "global_step": 54655, "epoch": 658} {"train_loss": -20.476028442382812, "global_step": 54656, "epoch": 658} {"train_loss": -20.2287654876709, "global_step": 54657, "epoch": 658} {"train_loss": -20.285871505737305, "global_step": 54658, "epoch": 658} {"train_loss": -20.02014923095703, "global_step": 54659, "epoch": 658} {"train_loss": -20.44830894470215, "global_step": 54660, "epoch": 658} {"train_loss": -19.97344970703125, "global_step": 54661, "epoch": 658} {"train_loss": -19.822423934936523, "global_step": 54662, "epoch": 658} {"train_loss": -20.179487228393555, "global_step": 54663, "epoch": 658} {"train_loss": -20.251333236694336, "global_step": 54664, "epoch": 658} {"train_loss": -20.315702438354492, "global_step": 54665, "epoch": 658} {"train_loss": -20.55543327331543, "global_step": 54666, "epoch": 658} {"train_loss": -19.9820613861084, "global_step": 54667, "epoch": 658} {"train_loss": -20.136579513549805, "global_step": 54668, "epoch": 658} {"train_loss": -20.197635650634766, "global_step": 54669, "epoch": 658} {"train_loss": -19.869619369506836, "global_step": 54670, "epoch": 658} {"train_loss": -20.033048629760742, "global_step": 54671, "epoch": 658} {"train_loss": -20.20559310913086, "global_step": 54672, "epoch": 658} {"train_loss": -19.909658432006836, "global_step": 54673, "epoch": 658} {"train_loss": -20.317127227783203, "global_step": 54674, "epoch": 658} {"train_loss": -20.270355224609375, "global_step": 54675, "epoch": 658} {"train_loss": -20.22276496887207, "global_step": 54676, "epoch": 658} {"train_loss": -19.768415451049805, "global_step": 54677, "epoch": 658} {"train_loss": -20.334394454956055, "global_step": 54678, "epoch": 658} {"train_loss": -20.14126205444336, "global_step": 54679, "epoch": 658} {"train_loss": -20.294233322143555, "global_step": 54680, "epoch": 658} {"train_loss": -20.482694625854492, "global_step": 54681, "epoch": 658} {"train_loss": -19.96131134033203, "global_step": 54682, "epoch": 658} {"train_loss": -20.192657470703125, "global_step": 54683, "epoch": 658} {"train_loss": -20.195846557617188, "global_step": 54684, "epoch": 658} {"train_loss": -20.77841567993164, "global_step": 54685, "epoch": 658} {"train_loss": -20.35504722595215, "global_step": 54686, "epoch": 658} {"train_loss": -20.111499786376953, "global_step": 54687, "epoch": 658} {"train_loss": -20.217844009399414, "global_step": 54688, "epoch": 658} {"train_loss": -20.180273056030273, "global_step": 54689, "epoch": 658} {"train_loss": -19.94073486328125, "global_step": 54690, "epoch": 658} {"train_loss": -20.3228816986084, "global_step": 54691, "epoch": 658} {"train_loss": -20.01430320739746, "global_step": 54692, "epoch": 658} {"train_loss": -20.37516212463379, "global_step": 54693, "epoch": 658} {"train_loss": -20.32297134399414, "global_step": 54694, "epoch": 658} {"train_loss": -20.00873565673828, "global_step": 54695, "epoch": 658} {"train_loss": -20.155887006277062, "global_step": 54696, "epoch": 658, "val_loss": 6098542.0} {"train_loss": -20.218992233276367, "global_step": 54697, "epoch": 659} {"train_loss": -19.83526611328125, "global_step": 54698, "epoch": 659} {"train_loss": -20.01180076599121, "global_step": 54699, "epoch": 659} {"train_loss": -19.925493240356445, "global_step": 54700, "epoch": 659} {"train_loss": -19.82211685180664, "global_step": 54701, "epoch": 659} {"train_loss": -20.43039321899414, "global_step": 54702, "epoch": 659} {"train_loss": -20.089567184448242, "global_step": 54703, "epoch": 659} {"train_loss": -20.14621353149414, "global_step": 54704, "epoch": 659} {"train_loss": -20.057294845581055, "global_step": 54705, "epoch": 659} {"train_loss": -19.717721939086914, "global_step": 54706, "epoch": 659} {"train_loss": -20.25604820251465, "global_step": 54707, "epoch": 659} {"train_loss": -19.93622589111328, "global_step": 54708, "epoch": 659} {"train_loss": -20.115915298461914, "global_step": 54709, "epoch": 659} {"train_loss": -20.01816749572754, "global_step": 54710, "epoch": 659} {"train_loss": -20.33782958984375, "global_step": 54711, "epoch": 659} {"train_loss": -19.574460983276367, "global_step": 54712, "epoch": 659} {"train_loss": -20.31168556213379, "global_step": 54713, "epoch": 659} {"train_loss": -20.4384765625, "global_step": 54714, "epoch": 659} {"train_loss": -19.87327003479004, "global_step": 54715, "epoch": 659} {"train_loss": -20.26136589050293, "global_step": 54716, "epoch": 659} {"train_loss": -19.871610641479492, "global_step": 54717, "epoch": 659} {"train_loss": -20.552494049072266, "global_step": 54718, "epoch": 659} {"train_loss": -20.21849822998047, "global_step": 54719, "epoch": 659} {"train_loss": -20.458812713623047, "global_step": 54720, "epoch": 659} {"train_loss": -20.25174331665039, "global_step": 54721, "epoch": 659} {"train_loss": -19.95088005065918, "global_step": 54722, "epoch": 659} {"train_loss": -20.294015884399414, "global_step": 54723, "epoch": 659} {"train_loss": -20.061233520507812, "global_step": 54724, "epoch": 659} {"train_loss": -20.04838752746582, "global_step": 54725, "epoch": 659} {"train_loss": -20.34052848815918, "global_step": 54726, "epoch": 659} {"train_loss": -20.090534210205078, "global_step": 54727, "epoch": 659} {"train_loss": -20.21832847595215, "global_step": 54728, "epoch": 659} {"train_loss": -20.093454360961914, "global_step": 54729, "epoch": 659} {"train_loss": -20.06296157836914, "global_step": 54730, "epoch": 659} {"train_loss": -20.33182144165039, "global_step": 54731, "epoch": 659} {"train_loss": -20.179706573486328, "global_step": 54732, "epoch": 659} {"train_loss": -20.12642478942871, "global_step": 54733, "epoch": 659} {"train_loss": -19.855188369750977, "global_step": 54734, "epoch": 659} {"train_loss": -20.14613151550293, "global_step": 54735, "epoch": 659} {"train_loss": -20.49399185180664, "global_step": 54736, "epoch": 659} {"train_loss": -20.32777976989746, "global_step": 54737, "epoch": 659} {"train_loss": -20.107526779174805, "global_step": 54738, "epoch": 659} {"train_loss": -20.164838790893555, "global_step": 54739, "epoch": 659} {"train_loss": -20.25733757019043, "global_step": 54740, "epoch": 659} {"train_loss": -20.364482879638672, "global_step": 54741, "epoch": 659} {"train_loss": -20.20955467224121, "global_step": 54742, "epoch": 659} {"train_loss": -20.3072566986084, "global_step": 54743, "epoch": 659} {"train_loss": -19.97882652282715, "global_step": 54744, "epoch": 659} {"train_loss": -20.280881881713867, "global_step": 54745, "epoch": 659} {"train_loss": -20.093454360961914, "global_step": 54746, "epoch": 659} {"train_loss": -20.055938720703125, "global_step": 54747, "epoch": 659} {"train_loss": -20.09060287475586, "global_step": 54748, "epoch": 659} {"train_loss": -20.323638916015625, "global_step": 54749, "epoch": 659} {"train_loss": -20.290021896362305, "global_step": 54750, "epoch": 659} {"train_loss": -20.098255157470703, "global_step": 54751, "epoch": 659} {"train_loss": -20.45787811279297, "global_step": 54752, "epoch": 659} {"train_loss": -20.22712516784668, "global_step": 54753, "epoch": 659} {"train_loss": -20.379697799682617, "global_step": 54754, "epoch": 659} {"train_loss": -19.660795211791992, "global_step": 54755, "epoch": 659} {"train_loss": -19.988245010375977, "global_step": 54756, "epoch": 659} {"train_loss": -20.008991241455078, "global_step": 54757, "epoch": 659} {"train_loss": -20.181377410888672, "global_step": 54758, "epoch": 659} {"train_loss": -20.2628173828125, "global_step": 54759, "epoch": 659} {"train_loss": -19.970251083374023, "global_step": 54760, "epoch": 659} {"train_loss": -20.151687622070312, "global_step": 54761, "epoch": 659} {"train_loss": -20.35729217529297, "global_step": 54762, "epoch": 659} {"train_loss": -20.224197387695312, "global_step": 54763, "epoch": 659} {"train_loss": -20.352869033813477, "global_step": 54764, "epoch": 659} {"train_loss": -20.38230323791504, "global_step": 54765, "epoch": 659} {"train_loss": -19.956104278564453, "global_step": 54766, "epoch": 659} {"train_loss": -20.107717514038086, "global_step": 54767, "epoch": 659} {"train_loss": -20.073829650878906, "global_step": 54768, "epoch": 659} {"train_loss": -20.211090087890625, "global_step": 54769, "epoch": 659} {"train_loss": -19.819868087768555, "global_step": 54770, "epoch": 659} {"train_loss": -20.03163719177246, "global_step": 54771, "epoch": 659} {"train_loss": -19.86288833618164, "global_step": 54772, "epoch": 659} {"train_loss": -20.18784523010254, "global_step": 54773, "epoch": 659} {"train_loss": -20.372343063354492, "global_step": 54774, "epoch": 659} {"train_loss": -20.1898136138916, "global_step": 54775, "epoch": 659} {"train_loss": -20.453155517578125, "global_step": 54776, "epoch": 659} {"train_loss": -20.053831100463867, "global_step": 54777, "epoch": 659} {"train_loss": -20.01311492919922, "global_step": 54778, "epoch": 659} {"train_loss": -20.147849186357245, "global_step": 54779, "epoch": 659, "val_loss": 6009887.5} {"train_loss": -19.646793365478516, "global_step": 54780, "epoch": 660} {"train_loss": -19.825979232788086, "global_step": 54781, "epoch": 660} {"train_loss": -19.794218063354492, "global_step": 54782, "epoch": 660} {"train_loss": -19.96125602722168, "global_step": 54783, "epoch": 660} {"train_loss": -20.223356246948242, "global_step": 54784, "epoch": 660} {"train_loss": -20.116180419921875, "global_step": 54785, "epoch": 660} {"train_loss": -19.773948669433594, "global_step": 54786, "epoch": 660} {"train_loss": -19.7503719329834, "global_step": 54787, "epoch": 660} {"train_loss": -19.96149253845215, "global_step": 54788, "epoch": 660} {"train_loss": -20.02680778503418, "global_step": 54789, "epoch": 660} {"train_loss": -20.61695671081543, "global_step": 54790, "epoch": 660} {"train_loss": -19.812267303466797, "global_step": 54791, "epoch": 660} {"train_loss": -19.91754913330078, "global_step": 54792, "epoch": 660} {"train_loss": -19.80689811706543, "global_step": 54793, "epoch": 660} {"train_loss": -20.3430233001709, "global_step": 54794, "epoch": 660} {"train_loss": -19.924711227416992, "global_step": 54795, "epoch": 660} {"train_loss": -20.0573787689209, "global_step": 54796, "epoch": 660} {"train_loss": -20.473716735839844, "global_step": 54797, "epoch": 660} {"train_loss": -20.353368759155273, "global_step": 54798, "epoch": 660} {"train_loss": -20.4804744720459, "global_step": 54799, "epoch": 660} {"train_loss": -20.043968200683594, "global_step": 54800, "epoch": 660} {"train_loss": -20.059961318969727, "global_step": 54801, "epoch": 660} {"train_loss": -20.1394100189209, "global_step": 54802, "epoch": 660} {"train_loss": -20.38629913330078, "global_step": 54803, "epoch": 660} {"train_loss": -20.02752685546875, "global_step": 54804, "epoch": 660} {"train_loss": -20.085634231567383, "global_step": 54805, "epoch": 660} {"train_loss": -20.468429565429688, "global_step": 54806, "epoch": 660} {"train_loss": -19.923887252807617, "global_step": 54807, "epoch": 660} {"train_loss": -20.397565841674805, "global_step": 54808, "epoch": 660} {"train_loss": -20.452632904052734, "global_step": 54809, "epoch": 660} {"train_loss": -20.185510635375977, "global_step": 54810, "epoch": 660} {"train_loss": -19.982284545898438, "global_step": 54811, "epoch": 660} {"train_loss": -20.03407859802246, "global_step": 54812, "epoch": 660} {"train_loss": -20.176151275634766, "global_step": 54813, "epoch": 660} {"train_loss": -20.304224014282227, "global_step": 54814, "epoch": 660} {"train_loss": -20.300424575805664, "global_step": 54815, "epoch": 660} {"train_loss": -19.921157836914062, "global_step": 54816, "epoch": 660} {"train_loss": -20.411298751831055, "global_step": 54817, "epoch": 660} {"train_loss": -20.377309799194336, "global_step": 54818, "epoch": 660} {"train_loss": -20.050201416015625, "global_step": 54819, "epoch": 660} {"train_loss": -19.97398567199707, "global_step": 54820, "epoch": 660} {"train_loss": -20.43983268737793, "global_step": 54821, "epoch": 660} {"train_loss": -20.03704261779785, "global_step": 54822, "epoch": 660} {"train_loss": -20.512670516967773, "global_step": 54823, "epoch": 660} {"train_loss": -20.135364532470703, "global_step": 54824, "epoch": 660} {"train_loss": -19.94312858581543, "global_step": 54825, "epoch": 660} {"train_loss": -20.000774383544922, "global_step": 54826, "epoch": 660} {"train_loss": -20.32200050354004, "global_step": 54827, "epoch": 660} {"train_loss": -20.41972541809082, "global_step": 54828, "epoch": 660} {"train_loss": -20.12009048461914, "global_step": 54829, "epoch": 660} {"train_loss": -20.500125885009766, "global_step": 54830, "epoch": 660} {"train_loss": -19.992122650146484, "global_step": 54831, "epoch": 660} {"train_loss": -20.079801559448242, "global_step": 54832, "epoch": 660} {"train_loss": -20.317380905151367, "global_step": 54833, "epoch": 660} {"train_loss": -20.114015579223633, "global_step": 54834, "epoch": 660} {"train_loss": -20.338382720947266, "global_step": 54835, "epoch": 660} {"train_loss": -20.169946670532227, "global_step": 54836, "epoch": 660} {"train_loss": -19.913694381713867, "global_step": 54837, "epoch": 660} {"train_loss": -20.156097412109375, "global_step": 54838, "epoch": 660} {"train_loss": -20.27092742919922, "global_step": 54839, "epoch": 660} {"train_loss": -20.219655990600586, "global_step": 54840, "epoch": 660} {"train_loss": -20.330228805541992, "global_step": 54841, "epoch": 660} {"train_loss": -19.879989624023438, "global_step": 54842, "epoch": 660} {"train_loss": -19.91187858581543, "global_step": 54843, "epoch": 660} {"train_loss": -20.210599899291992, "global_step": 54844, "epoch": 660} {"train_loss": -20.59529685974121, "global_step": 54845, "epoch": 660} {"train_loss": -20.01323699951172, "global_step": 54846, "epoch": 660} {"train_loss": -20.29335594177246, "global_step": 54847, "epoch": 660} {"train_loss": -19.88892936706543, "global_step": 54848, "epoch": 660} {"train_loss": -20.20746421813965, "global_step": 54849, "epoch": 660} {"train_loss": -20.10761833190918, "global_step": 54850, "epoch": 660} {"train_loss": -20.013320922851562, "global_step": 54851, "epoch": 660} {"train_loss": -20.091537475585938, "global_step": 54852, "epoch": 660} {"train_loss": -20.144210815429688, "global_step": 54853, "epoch": 660} {"train_loss": -20.191612243652344, "global_step": 54854, "epoch": 660} {"train_loss": -20.231042861938477, "global_step": 54855, "epoch": 660} {"train_loss": -20.420001983642578, "global_step": 54856, "epoch": 660} {"train_loss": -20.387216567993164, "global_step": 54857, "epoch": 660} {"train_loss": -20.10600471496582, "global_step": 54858, "epoch": 660} {"train_loss": -20.635150909423828, "global_step": 54859, "epoch": 660} {"train_loss": -20.34425926208496, "global_step": 54860, "epoch": 660} {"train_loss": -20.0649356842041, "global_step": 54861, "epoch": 660} {"train_loss": -20.141750082912214, "global_step": 54862, "epoch": 660, "val_loss": 6120056.0} {"train_loss": -19.36269187927246, "global_step": 54863, "epoch": 661} {"train_loss": -19.689075469970703, "global_step": 54864, "epoch": 661} {"train_loss": -19.39500617980957, "global_step": 54865, "epoch": 661} {"train_loss": -19.366790771484375, "global_step": 54866, "epoch": 661} {"train_loss": -19.911224365234375, "global_step": 54867, "epoch": 661} {"train_loss": -19.499557495117188, "global_step": 54868, "epoch": 661} {"train_loss": -20.20185661315918, "global_step": 54869, "epoch": 661} {"train_loss": -19.611085891723633, "global_step": 54870, "epoch": 661} {"train_loss": -19.571151733398438, "global_step": 54871, "epoch": 661} {"train_loss": -19.490032196044922, "global_step": 54872, "epoch": 661} {"train_loss": -20.02239227294922, "global_step": 54873, "epoch": 661} {"train_loss": -20.094131469726562, "global_step": 54874, "epoch": 661} {"train_loss": -19.736656188964844, "global_step": 54875, "epoch": 661} {"train_loss": -19.79066276550293, "global_step": 54876, "epoch": 661} {"train_loss": -20.045461654663086, "global_step": 54877, "epoch": 661} {"train_loss": -20.03900146484375, "global_step": 54878, "epoch": 661} {"train_loss": -19.763351440429688, "global_step": 54879, "epoch": 661} {"train_loss": -20.178869247436523, "global_step": 54880, "epoch": 661} {"train_loss": -20.090742111206055, "global_step": 54881, "epoch": 661} {"train_loss": -20.184825897216797, "global_step": 54882, "epoch": 661} {"train_loss": -19.543264389038086, "global_step": 54883, "epoch": 661} {"train_loss": -19.90802574157715, "global_step": 54884, "epoch": 661} {"train_loss": -20.041898727416992, "global_step": 54885, "epoch": 661} {"train_loss": -19.777902603149414, "global_step": 54886, "epoch": 661} {"train_loss": -20.0031681060791, "global_step": 54887, "epoch": 661} {"train_loss": -19.73590660095215, "global_step": 54888, "epoch": 661} {"train_loss": -19.812118530273438, "global_step": 54889, "epoch": 661} {"train_loss": -20.257007598876953, "global_step": 54890, "epoch": 661} {"train_loss": -19.86103630065918, "global_step": 54891, "epoch": 661} {"train_loss": -20.0638427734375, "global_step": 54892, "epoch": 661} {"train_loss": -19.640363693237305, "global_step": 54893, "epoch": 661} {"train_loss": -19.80866050720215, "global_step": 54894, "epoch": 661} {"train_loss": -19.935476303100586, "global_step": 54895, "epoch": 661} {"train_loss": -20.14699363708496, "global_step": 54896, "epoch": 661} {"train_loss": -20.165390014648438, "global_step": 54897, "epoch": 661} {"train_loss": -20.02016258239746, "global_step": 54898, "epoch": 661} {"train_loss": -19.979751586914062, "global_step": 54899, "epoch": 661} {"train_loss": -20.613224029541016, "global_step": 54900, "epoch": 661} {"train_loss": -20.2833251953125, "global_step": 54901, "epoch": 661} {"train_loss": -20.44841957092285, "global_step": 54902, "epoch": 661} {"train_loss": -20.39751434326172, "global_step": 54903, "epoch": 661} {"train_loss": -19.90350341796875, "global_step": 54904, "epoch": 661} {"train_loss": -20.309247970581055, "global_step": 54905, "epoch": 661} {"train_loss": -20.00227928161621, "global_step": 54906, "epoch": 661} {"train_loss": -20.128690719604492, "global_step": 54907, "epoch": 661} {"train_loss": -20.19574546813965, "global_step": 54908, "epoch": 661} {"train_loss": -20.437515258789062, "global_step": 54909, "epoch": 661} {"train_loss": -20.14352798461914, "global_step": 54910, "epoch": 661} {"train_loss": -20.442426681518555, "global_step": 54911, "epoch": 661} {"train_loss": -20.34629249572754, "global_step": 54912, "epoch": 661} {"train_loss": -20.200193405151367, "global_step": 54913, "epoch": 661} {"train_loss": -20.219335556030273, "global_step": 54914, "epoch": 661} {"train_loss": -20.2883358001709, "global_step": 54915, "epoch": 661} {"train_loss": -19.858091354370117, "global_step": 54916, "epoch": 661} {"train_loss": -20.40444564819336, "global_step": 54917, "epoch": 661} {"train_loss": -20.07221794128418, "global_step": 54918, "epoch": 661} {"train_loss": -20.328773498535156, "global_step": 54919, "epoch": 661} {"train_loss": -20.07725715637207, "global_step": 54920, "epoch": 661} {"train_loss": -19.931840896606445, "global_step": 54921, "epoch": 661} {"train_loss": -20.367197036743164, "global_step": 54922, "epoch": 661} {"train_loss": -20.38568687438965, "global_step": 54923, "epoch": 661} {"train_loss": -20.62787437438965, "global_step": 54924, "epoch": 661} {"train_loss": -20.63707733154297, "global_step": 54925, "epoch": 661} {"train_loss": -20.095230102539062, "global_step": 54926, "epoch": 661} {"train_loss": -20.009502410888672, "global_step": 54927, "epoch": 661} {"train_loss": -20.175445556640625, "global_step": 54928, "epoch": 661} {"train_loss": -20.293752670288086, "global_step": 54929, "epoch": 661} {"train_loss": -20.259275436401367, "global_step": 54930, "epoch": 661} {"train_loss": -20.421676635742188, "global_step": 54931, "epoch": 661} {"train_loss": -19.914249420166016, "global_step": 54932, "epoch": 661} {"train_loss": -19.83430290222168, "global_step": 54933, "epoch": 661} {"train_loss": -20.307052612304688, "global_step": 54934, "epoch": 661} {"train_loss": -20.07404327392578, "global_step": 54935, "epoch": 661} {"train_loss": -19.74673843383789, "global_step": 54936, "epoch": 661} {"train_loss": -20.059776306152344, "global_step": 54937, "epoch": 661} {"train_loss": -20.396106719970703, "global_step": 54938, "epoch": 661} {"train_loss": -20.103614807128906, "global_step": 54939, "epoch": 661} {"train_loss": -20.230653762817383, "global_step": 54940, "epoch": 661} {"train_loss": -20.810232162475586, "global_step": 54941, "epoch": 661} {"train_loss": -20.082651138305664, "global_step": 54942, "epoch": 661} {"train_loss": -20.135425567626953, "global_step": 54943, "epoch": 661} {"train_loss": -19.948881149291992, "global_step": 54944, "epoch": 661} {"train_loss": -20.06164527801146, "global_step": 54945, "epoch": 661, "val_loss": 6143046.0} {"train_loss": -20.152755737304688, "global_step": 54946, "epoch": 662} {"train_loss": -20.58768081665039, "global_step": 54947, "epoch": 662} {"train_loss": -20.05202293395996, "global_step": 54948, "epoch": 662} {"train_loss": -20.302698135375977, "global_step": 54949, "epoch": 662} {"train_loss": -20.068933486938477, "global_step": 54950, "epoch": 662} {"train_loss": -19.65251350402832, "global_step": 54951, "epoch": 662} {"train_loss": -20.298885345458984, "global_step": 54952, "epoch": 662} {"train_loss": -20.113723754882812, "global_step": 54953, "epoch": 662} {"train_loss": -20.35274314880371, "global_step": 54954, "epoch": 662} {"train_loss": -20.051464080810547, "global_step": 54955, "epoch": 662} {"train_loss": -20.650775909423828, "global_step": 54956, "epoch": 662} {"train_loss": -20.170129776000977, "global_step": 54957, "epoch": 662} {"train_loss": -19.90044403076172, "global_step": 54958, "epoch": 662} {"train_loss": -19.822952270507812, "global_step": 54959, "epoch": 662} {"train_loss": -20.02008628845215, "global_step": 54960, "epoch": 662} {"train_loss": -20.213735580444336, "global_step": 54961, "epoch": 662} {"train_loss": -20.02056884765625, "global_step": 54962, "epoch": 662} {"train_loss": -20.338706970214844, "global_step": 54963, "epoch": 662} {"train_loss": -20.176042556762695, "global_step": 54964, "epoch": 662} {"train_loss": -19.88484764099121, "global_step": 54965, "epoch": 662} {"train_loss": -20.497650146484375, "global_step": 54966, "epoch": 662} {"train_loss": -20.069059371948242, "global_step": 54967, "epoch": 662} {"train_loss": -20.061979293823242, "global_step": 54968, "epoch": 662} {"train_loss": -20.210580825805664, "global_step": 54969, "epoch": 662} {"train_loss": -20.11446189880371, "global_step": 54970, "epoch": 662} {"train_loss": -20.201461791992188, "global_step": 54971, "epoch": 662} {"train_loss": -20.13617515563965, "global_step": 54972, "epoch": 662} {"train_loss": -19.631921768188477, "global_step": 54973, "epoch": 662} {"train_loss": -19.779035568237305, "global_step": 54974, "epoch": 662} {"train_loss": -20.2083797454834, "global_step": 54975, "epoch": 662} {"train_loss": -20.29652976989746, "global_step": 54976, "epoch": 662} {"train_loss": -20.197742462158203, "global_step": 54977, "epoch": 662} {"train_loss": -20.097000122070312, "global_step": 54978, "epoch": 662} {"train_loss": -20.316022872924805, "global_step": 54979, "epoch": 662} {"train_loss": -20.08686637878418, "global_step": 54980, "epoch": 662} {"train_loss": -20.03301429748535, "global_step": 54981, "epoch": 662} {"train_loss": -20.310224533081055, "global_step": 54982, "epoch": 662} {"train_loss": -20.244464874267578, "global_step": 54983, "epoch": 662} {"train_loss": -20.269262313842773, "global_step": 54984, "epoch": 662} {"train_loss": -20.444791793823242, "global_step": 54985, "epoch": 662} {"train_loss": -19.784574508666992, "global_step": 54986, "epoch": 662} {"train_loss": -20.178213119506836, "global_step": 54987, "epoch": 662} {"train_loss": -19.628292083740234, "global_step": 54988, "epoch": 662} {"train_loss": -20.607847213745117, "global_step": 54989, "epoch": 662} {"train_loss": -20.066164016723633, "global_step": 54990, "epoch": 662} {"train_loss": -20.238534927368164, "global_step": 54991, "epoch": 662} {"train_loss": -20.189828872680664, "global_step": 54992, "epoch": 662} {"train_loss": -19.93514060974121, "global_step": 54993, "epoch": 662} {"train_loss": -20.05630874633789, "global_step": 54994, "epoch": 662} {"train_loss": -20.027210235595703, "global_step": 54995, "epoch": 662} {"train_loss": -20.11798667907715, "global_step": 54996, "epoch": 662} {"train_loss": -20.160120010375977, "global_step": 54997, "epoch": 662} {"train_loss": -20.340301513671875, "global_step": 54998, "epoch": 662} {"train_loss": -20.358922958374023, "global_step": 54999, "epoch": 662} {"train_loss": -19.878957748413086, "global_step": 55000, "epoch": 662} {"train_loss": -20.117490768432617, "global_step": 55001, "epoch": 662} {"train_loss": -20.136014938354492, "global_step": 55002, "epoch": 662} {"train_loss": -20.016407012939453, "global_step": 55003, "epoch": 662} {"train_loss": -19.723834991455078, "global_step": 55004, "epoch": 662} {"train_loss": -20.47938346862793, "global_step": 55005, "epoch": 662} {"train_loss": -20.21059226989746, "global_step": 55006, "epoch": 662} {"train_loss": -19.776456832885742, "global_step": 55007, "epoch": 662} {"train_loss": -20.223369598388672, "global_step": 55008, "epoch": 662} {"train_loss": -19.63288116455078, "global_step": 55009, "epoch": 662} {"train_loss": -20.26026725769043, "global_step": 55010, "epoch": 662} {"train_loss": -20.26198959350586, "global_step": 55011, "epoch": 662} {"train_loss": -20.24538230895996, "global_step": 55012, "epoch": 662} {"train_loss": -20.21819496154785, "global_step": 55013, "epoch": 662} {"train_loss": -20.102100372314453, "global_step": 55014, "epoch": 662} {"train_loss": -20.00057601928711, "global_step": 55015, "epoch": 662} {"train_loss": -20.03780746459961, "global_step": 55016, "epoch": 662} {"train_loss": -19.926870346069336, "global_step": 55017, "epoch": 662} {"train_loss": -19.8968563079834, "global_step": 55018, "epoch": 662} {"train_loss": -20.242816925048828, "global_step": 55019, "epoch": 662} {"train_loss": -20.148889541625977, "global_step": 55020, "epoch": 662} {"train_loss": -20.05974006652832, "global_step": 55021, "epoch": 662} {"train_loss": -20.424528121948242, "global_step": 55022, "epoch": 662} {"train_loss": -19.957521438598633, "global_step": 55023, "epoch": 662} {"train_loss": -20.161165237426758, "global_step": 55024, "epoch": 662} {"train_loss": -20.64076042175293, "global_step": 55025, "epoch": 662} {"train_loss": -19.969411849975586, "global_step": 55026, "epoch": 662} {"train_loss": -20.058883666992188, "global_step": 55027, "epoch": 662} {"train_loss": -20.13784723396761, "global_step": 55028, "epoch": 662, "val_loss": 6068498.0} {"train_loss": -19.89594078063965, "global_step": 55029, "epoch": 663} {"train_loss": -19.799238204956055, "global_step": 55030, "epoch": 663} {"train_loss": -19.47260284423828, "global_step": 55031, "epoch": 663} {"train_loss": -19.926416397094727, "global_step": 55032, "epoch": 663} {"train_loss": -19.222267150878906, "global_step": 55033, "epoch": 663} {"train_loss": -19.974048614501953, "global_step": 55034, "epoch": 663} {"train_loss": -19.8411922454834, "global_step": 55035, "epoch": 663} {"train_loss": -19.708181381225586, "global_step": 55036, "epoch": 663} {"train_loss": -20.44007682800293, "global_step": 55037, "epoch": 663} {"train_loss": -19.698810577392578, "global_step": 55038, "epoch": 663} {"train_loss": -20.015167236328125, "global_step": 55039, "epoch": 663} {"train_loss": -20.118635177612305, "global_step": 55040, "epoch": 663} {"train_loss": -20.374671936035156, "global_step": 55041, "epoch": 663} {"train_loss": -20.28853416442871, "global_step": 55042, "epoch": 663} {"train_loss": -20.121074676513672, "global_step": 55043, "epoch": 663} {"train_loss": -20.010009765625, "global_step": 55044, "epoch": 663} {"train_loss": -19.70128631591797, "global_step": 55045, "epoch": 663} {"train_loss": -19.706083297729492, "global_step": 55046, "epoch": 663} {"train_loss": -19.616418838500977, "global_step": 55047, "epoch": 663} {"train_loss": -20.168298721313477, "global_step": 55048, "epoch": 663} {"train_loss": -20.10785484313965, "global_step": 55049, "epoch": 663} {"train_loss": -19.717540740966797, "global_step": 55050, "epoch": 663} {"train_loss": -20.24464225769043, "global_step": 55051, "epoch": 663} {"train_loss": -20.425392150878906, "global_step": 55052, "epoch": 663} {"train_loss": -20.417043685913086, "global_step": 55053, "epoch": 663} {"train_loss": -20.349714279174805, "global_step": 55054, "epoch": 663} {"train_loss": -20.05177116394043, "global_step": 55055, "epoch": 663} {"train_loss": -20.205469131469727, "global_step": 55056, "epoch": 663} {"train_loss": -20.173519134521484, "global_step": 55057, "epoch": 663} {"train_loss": -20.11374855041504, "global_step": 55058, "epoch": 663} {"train_loss": -19.675504684448242, "global_step": 55059, "epoch": 663} {"train_loss": -20.328439712524414, "global_step": 55060, "epoch": 663} {"train_loss": -20.566532135009766, "global_step": 55061, "epoch": 663} {"train_loss": -20.073766708374023, "global_step": 55062, "epoch": 663} {"train_loss": -20.05984878540039, "global_step": 55063, "epoch": 663} {"train_loss": -20.086170196533203, "global_step": 55064, "epoch": 663} {"train_loss": -20.415847778320312, "global_step": 55065, "epoch": 663} {"train_loss": -20.039419174194336, "global_step": 55066, "epoch": 663} {"train_loss": -20.342498779296875, "global_step": 55067, "epoch": 663} {"train_loss": -20.917743682861328, "global_step": 55068, "epoch": 663} {"train_loss": -20.21564292907715, "global_step": 55069, "epoch": 663} {"train_loss": -20.025127410888672, "global_step": 55070, "epoch": 663} {"train_loss": -20.72454261779785, "global_step": 55071, "epoch": 663} {"train_loss": -20.281858444213867, "global_step": 55072, "epoch": 663} {"train_loss": -20.23824119567871, "global_step": 55073, "epoch": 663} {"train_loss": -20.1283016204834, "global_step": 55074, "epoch": 663} {"train_loss": -20.117494583129883, "global_step": 55075, "epoch": 663} {"train_loss": -20.328367233276367, "global_step": 55076, "epoch": 663} {"train_loss": -20.530736923217773, "global_step": 55077, "epoch": 663} {"train_loss": -20.335132598876953, "global_step": 55078, "epoch": 663} {"train_loss": -19.753217697143555, "global_step": 55079, "epoch": 663} {"train_loss": -20.007383346557617, "global_step": 55080, "epoch": 663} {"train_loss": -20.098222732543945, "global_step": 55081, "epoch": 663} {"train_loss": -19.911279678344727, "global_step": 55082, "epoch": 663} {"train_loss": -20.571680068969727, "global_step": 55083, "epoch": 663} {"train_loss": -20.296552658081055, "global_step": 55084, "epoch": 663} {"train_loss": -20.246793746948242, "global_step": 55085, "epoch": 663} {"train_loss": -20.364425659179688, "global_step": 55086, "epoch": 663} {"train_loss": -20.054912567138672, "global_step": 55087, "epoch": 663} {"train_loss": -19.928211212158203, "global_step": 55088, "epoch": 663} {"train_loss": -20.26125144958496, "global_step": 55089, "epoch": 663} {"train_loss": -20.243017196655273, "global_step": 55090, "epoch": 663} {"train_loss": -20.618772506713867, "global_step": 55091, "epoch": 663} {"train_loss": -20.532846450805664, "global_step": 55092, "epoch": 663} {"train_loss": -20.58778953552246, "global_step": 55093, "epoch": 663} {"train_loss": -19.933835983276367, "global_step": 55094, "epoch": 663} {"train_loss": -20.288455963134766, "global_step": 55095, "epoch": 663} {"train_loss": -20.330129623413086, "global_step": 55096, "epoch": 663} {"train_loss": -19.761093139648438, "global_step": 55097, "epoch": 663} {"train_loss": -19.801000595092773, "global_step": 55098, "epoch": 663} {"train_loss": -20.138803482055664, "global_step": 55099, "epoch": 663} {"train_loss": -20.22739601135254, "global_step": 55100, "epoch": 663} {"train_loss": -20.13207244873047, "global_step": 55101, "epoch": 663} {"train_loss": -20.104400634765625, "global_step": 55102, "epoch": 663} {"train_loss": -20.244993209838867, "global_step": 55103, "epoch": 663} {"train_loss": -20.186132431030273, "global_step": 55104, "epoch": 663} {"train_loss": -20.429222106933594, "global_step": 55105, "epoch": 663} {"train_loss": -20.146469116210938, "global_step": 55106, "epoch": 663} {"train_loss": -20.011817932128906, "global_step": 55107, "epoch": 663} {"train_loss": -20.4122314453125, "global_step": 55108, "epoch": 663} {"train_loss": -19.96503448486328, "global_step": 55109, "epoch": 663} {"train_loss": -20.316205978393555, "global_step": 55110, "epoch": 663} {"train_loss": -20.143098946077277, "global_step": 55111, "epoch": 663, "val_loss": 6030297.0} {"train_loss": -19.85498046875, "global_step": 55112, "epoch": 664} {"train_loss": -19.4652099609375, "global_step": 55113, "epoch": 664} {"train_loss": -19.780685424804688, "global_step": 55114, "epoch": 664} {"train_loss": -19.655406951904297, "global_step": 55115, "epoch": 664} {"train_loss": -19.74445152282715, "global_step": 55116, "epoch": 664} {"train_loss": -19.926666259765625, "global_step": 55117, "epoch": 664} {"train_loss": -19.89430046081543, "global_step": 55118, "epoch": 664} {"train_loss": -19.80423355102539, "global_step": 55119, "epoch": 664} {"train_loss": -19.644567489624023, "global_step": 55120, "epoch": 664} {"train_loss": -19.929899215698242, "global_step": 55121, "epoch": 664} {"train_loss": -20.080774307250977, "global_step": 55122, "epoch": 664} {"train_loss": -20.25653648376465, "global_step": 55123, "epoch": 664} {"train_loss": -20.012420654296875, "global_step": 55124, "epoch": 664} {"train_loss": -19.97021484375, "global_step": 55125, "epoch": 664} {"train_loss": -19.67518424987793, "global_step": 55126, "epoch": 664} {"train_loss": -20.07880210876465, "global_step": 55127, "epoch": 664} {"train_loss": -19.81572914123535, "global_step": 55128, "epoch": 664} {"train_loss": -20.065412521362305, "global_step": 55129, "epoch": 664} {"train_loss": -20.08641815185547, "global_step": 55130, "epoch": 664} {"train_loss": -20.028751373291016, "global_step": 55131, "epoch": 664} {"train_loss": -19.9210147857666, "global_step": 55132, "epoch": 664} {"train_loss": -19.74988555908203, "global_step": 55133, "epoch": 664} {"train_loss": -20.022415161132812, "global_step": 55134, "epoch": 664} {"train_loss": -19.850793838500977, "global_step": 55135, "epoch": 664} {"train_loss": -20.10003089904785, "global_step": 55136, "epoch": 664} {"train_loss": -19.972654342651367, "global_step": 55137, "epoch": 664} {"train_loss": -20.04145622253418, "global_step": 55138, "epoch": 664} {"train_loss": -20.07284927368164, "global_step": 55139, "epoch": 664} {"train_loss": -19.962202072143555, "global_step": 55140, "epoch": 664} {"train_loss": -19.85196304321289, "global_step": 55141, "epoch": 664} {"train_loss": -20.25119400024414, "global_step": 55142, "epoch": 664} {"train_loss": -20.224267959594727, "global_step": 55143, "epoch": 664} {"train_loss": -20.083711624145508, "global_step": 55144, "epoch": 664} {"train_loss": -20.0128173828125, "global_step": 55145, "epoch": 664} {"train_loss": -20.150861740112305, "global_step": 55146, "epoch": 664} {"train_loss": -20.035144805908203, "global_step": 55147, "epoch": 664} {"train_loss": -20.3150691986084, "global_step": 55148, "epoch": 664} {"train_loss": -20.361061096191406, "global_step": 55149, "epoch": 664} {"train_loss": -20.53062629699707, "global_step": 55150, "epoch": 664} {"train_loss": -20.21149253845215, "global_step": 55151, "epoch": 664} {"train_loss": -20.128950119018555, "global_step": 55152, "epoch": 664} {"train_loss": -20.159399032592773, "global_step": 55153, "epoch": 664} {"train_loss": -19.84351921081543, "global_step": 55154, "epoch": 664} {"train_loss": -20.112394332885742, "global_step": 55155, "epoch": 664} {"train_loss": -19.983003616333008, "global_step": 55156, "epoch": 664} {"train_loss": -20.175689697265625, "global_step": 55157, "epoch": 664} {"train_loss": -19.867645263671875, "global_step": 55158, "epoch": 664} {"train_loss": -20.09311866760254, "global_step": 55159, "epoch": 664} {"train_loss": -19.911149978637695, "global_step": 55160, "epoch": 664} {"train_loss": -20.309938430786133, "global_step": 55161, "epoch": 664} {"train_loss": -20.365863800048828, "global_step": 55162, "epoch": 664} {"train_loss": -20.277090072631836, "global_step": 55163, "epoch": 664} {"train_loss": -20.32411003112793, "global_step": 55164, "epoch": 664} {"train_loss": -20.167583465576172, "global_step": 55165, "epoch": 664} {"train_loss": -20.18670082092285, "global_step": 55166, "epoch": 664} {"train_loss": -20.2670841217041, "global_step": 55167, "epoch": 664} {"train_loss": -20.266788482666016, "global_step": 55168, "epoch": 664} {"train_loss": -20.25929832458496, "global_step": 55169, "epoch": 664} {"train_loss": -20.25408172607422, "global_step": 55170, "epoch": 664} {"train_loss": -20.43589210510254, "global_step": 55171, "epoch": 664} {"train_loss": -19.90906524658203, "global_step": 55172, "epoch": 664} {"train_loss": -20.460309982299805, "global_step": 55173, "epoch": 664} {"train_loss": -20.18025016784668, "global_step": 55174, "epoch": 664} {"train_loss": -19.8475284576416, "global_step": 55175, "epoch": 664} {"train_loss": -20.47273826599121, "global_step": 55176, "epoch": 664} {"train_loss": -19.96354103088379, "global_step": 55177, "epoch": 664} {"train_loss": -20.006607055664062, "global_step": 55178, "epoch": 664} {"train_loss": -20.264081954956055, "global_step": 55179, "epoch": 664} {"train_loss": -20.086606979370117, "global_step": 55180, "epoch": 664} {"train_loss": -19.9596004486084, "global_step": 55181, "epoch": 664} {"train_loss": -20.131847381591797, "global_step": 55182, "epoch": 664} {"train_loss": -19.993253707885742, "global_step": 55183, "epoch": 664} {"train_loss": -19.865713119506836, "global_step": 55184, "epoch": 664} {"train_loss": -20.23046875, "global_step": 55185, "epoch": 664} {"train_loss": -20.064313888549805, "global_step": 55186, "epoch": 664} {"train_loss": -20.037694931030273, "global_step": 55187, "epoch": 664} {"train_loss": -20.110923767089844, "global_step": 55188, "epoch": 664} {"train_loss": -20.34795570373535, "global_step": 55189, "epoch": 664} {"train_loss": -20.013700485229492, "global_step": 55190, "epoch": 664} {"train_loss": -20.066455841064453, "global_step": 55191, "epoch": 664} {"train_loss": -20.4859676361084, "global_step": 55192, "epoch": 664} {"train_loss": -20.093244552612305, "global_step": 55193, "epoch": 664} {"train_loss": -20.076959449124622, "global_step": 55194, "epoch": 664, "val_loss": 6019858.5} {"train_loss": -18.98518943786621, "global_step": 55195, "epoch": 665} {"train_loss": -20.03969383239746, "global_step": 55196, "epoch": 665} {"train_loss": -19.7630672454834, "global_step": 55197, "epoch": 665} {"train_loss": -19.212045669555664, "global_step": 55198, "epoch": 665} {"train_loss": -19.975378036499023, "global_step": 55199, "epoch": 665} {"train_loss": -19.945446014404297, "global_step": 55200, "epoch": 665} {"train_loss": -19.456298828125, "global_step": 55201, "epoch": 665} {"train_loss": -19.742019653320312, "global_step": 55202, "epoch": 665} {"train_loss": -20.01541519165039, "global_step": 55203, "epoch": 665} {"train_loss": -19.856170654296875, "global_step": 55204, "epoch": 665} {"train_loss": -19.795621871948242, "global_step": 55205, "epoch": 665} {"train_loss": -19.9483642578125, "global_step": 55206, "epoch": 665} {"train_loss": -19.8489933013916, "global_step": 55207, "epoch": 665} {"train_loss": -19.606483459472656, "global_step": 55208, "epoch": 665} {"train_loss": -19.93782615661621, "global_step": 55209, "epoch": 665} {"train_loss": -19.784122467041016, "global_step": 55210, "epoch": 665} {"train_loss": -20.053085327148438, "global_step": 55211, "epoch": 665} {"train_loss": -19.627546310424805, "global_step": 55212, "epoch": 665} {"train_loss": -19.892698287963867, "global_step": 55213, "epoch": 665} {"train_loss": -19.87091064453125, "global_step": 55214, "epoch": 665} {"train_loss": -19.70863914489746, "global_step": 55215, "epoch": 665} {"train_loss": -20.017446517944336, "global_step": 55216, "epoch": 665} {"train_loss": -20.312681198120117, "global_step": 55217, "epoch": 665} {"train_loss": -20.25177001953125, "global_step": 55218, "epoch": 665} {"train_loss": -19.95015525817871, "global_step": 55219, "epoch": 665} {"train_loss": -20.073339462280273, "global_step": 55220, "epoch": 665} {"train_loss": -19.96843147277832, "global_step": 55221, "epoch": 665} {"train_loss": -19.694154739379883, "global_step": 55222, "epoch": 665} {"train_loss": -20.107017517089844, "global_step": 55223, "epoch": 665} {"train_loss": -19.880592346191406, "global_step": 55224, "epoch": 665} {"train_loss": -20.165058135986328, "global_step": 55225, "epoch": 665} {"train_loss": -20.21980857849121, "global_step": 55226, "epoch": 665} {"train_loss": -19.75892448425293, "global_step": 55227, "epoch": 665} {"train_loss": -20.249454498291016, "global_step": 55228, "epoch": 665} {"train_loss": -19.775487899780273, "global_step": 55229, "epoch": 665} {"train_loss": -20.61355209350586, "global_step": 55230, "epoch": 665} {"train_loss": -19.94775390625, "global_step": 55231, "epoch": 665} {"train_loss": -20.04100799560547, "global_step": 55232, "epoch": 665} {"train_loss": -20.272933959960938, "global_step": 55233, "epoch": 665} {"train_loss": -20.076669692993164, "global_step": 55234, "epoch": 665} {"train_loss": -20.116287231445312, "global_step": 55235, "epoch": 665} {"train_loss": -20.068620681762695, "global_step": 55236, "epoch": 665} {"train_loss": -20.287412643432617, "global_step": 55237, "epoch": 665} {"train_loss": -20.224538803100586, "global_step": 55238, "epoch": 665} {"train_loss": -19.926837921142578, "global_step": 55239, "epoch": 665} {"train_loss": -20.276874542236328, "global_step": 55240, "epoch": 665} {"train_loss": -19.887922286987305, "global_step": 55241, "epoch": 665} {"train_loss": -20.408506393432617, "global_step": 55242, "epoch": 665} {"train_loss": -20.252277374267578, "global_step": 55243, "epoch": 665} {"train_loss": -20.179967880249023, "global_step": 55244, "epoch": 665} {"train_loss": -20.05732536315918, "global_step": 55245, "epoch": 665} {"train_loss": -20.453699111938477, "global_step": 55246, "epoch": 665} {"train_loss": -20.235868453979492, "global_step": 55247, "epoch": 665} {"train_loss": -19.954299926757812, "global_step": 55248, "epoch": 665} {"train_loss": -20.322193145751953, "global_step": 55249, "epoch": 665} {"train_loss": -20.24055290222168, "global_step": 55250, "epoch": 665} {"train_loss": -20.124601364135742, "global_step": 55251, "epoch": 665} {"train_loss": -20.10626983642578, "global_step": 55252, "epoch": 665} {"train_loss": -20.165058135986328, "global_step": 55253, "epoch": 665} {"train_loss": -20.029882431030273, "global_step": 55254, "epoch": 665} {"train_loss": -20.330657958984375, "global_step": 55255, "epoch": 665} {"train_loss": -20.895910263061523, "global_step": 55256, "epoch": 665} {"train_loss": -20.263809204101562, "global_step": 55257, "epoch": 665} {"train_loss": -19.820520401000977, "global_step": 55258, "epoch": 665} {"train_loss": -20.110944747924805, "global_step": 55259, "epoch": 665} {"train_loss": -20.45636749267578, "global_step": 55260, "epoch": 665} {"train_loss": -20.513349533081055, "global_step": 55261, "epoch": 665} {"train_loss": -20.270248413085938, "global_step": 55262, "epoch": 665} {"train_loss": -20.50514793395996, "global_step": 55263, "epoch": 665} {"train_loss": -20.41167640686035, "global_step": 55264, "epoch": 665} {"train_loss": -20.187070846557617, "global_step": 55265, "epoch": 665} {"train_loss": -20.35679054260254, "global_step": 55266, "epoch": 665} {"train_loss": -20.115610122680664, "global_step": 55267, "epoch": 665} {"train_loss": -19.85322380065918, "global_step": 55268, "epoch": 665} {"train_loss": -20.262868881225586, "global_step": 55269, "epoch": 665} {"train_loss": -20.009910583496094, "global_step": 55270, "epoch": 665} {"train_loss": -20.238433837890625, "global_step": 55271, "epoch": 665} {"train_loss": -20.14259910583496, "global_step": 55272, "epoch": 665} {"train_loss": -20.273014068603516, "global_step": 55273, "epoch": 665} {"train_loss": -20.317195892333984, "global_step": 55274, "epoch": 665} {"train_loss": -19.910404205322266, "global_step": 55275, "epoch": 665} {"train_loss": -20.282806396484375, "global_step": 55276, "epoch": 665} {"train_loss": -20.05878014162362, "global_step": 55277, "epoch": 665, "val_loss": 6056287.0} {"train_loss": -20.208372116088867, "global_step": 55278, "epoch": 666} {"train_loss": -19.981687545776367, "global_step": 55279, "epoch": 666} {"train_loss": -19.950551986694336, "global_step": 55280, "epoch": 666} {"train_loss": -19.962949752807617, "global_step": 55281, "epoch": 666} {"train_loss": -19.92159080505371, "global_step": 55282, "epoch": 666} {"train_loss": -20.40097999572754, "global_step": 55283, "epoch": 666} {"train_loss": -19.839353561401367, "global_step": 55284, "epoch": 666} {"train_loss": -20.47100257873535, "global_step": 55285, "epoch": 666} {"train_loss": -20.06495475769043, "global_step": 55286, "epoch": 666} {"train_loss": -20.06768798828125, "global_step": 55287, "epoch": 666} {"train_loss": -20.320993423461914, "global_step": 55288, "epoch": 666} {"train_loss": -20.224756240844727, "global_step": 55289, "epoch": 666} {"train_loss": -20.041847229003906, "global_step": 55290, "epoch": 666} {"train_loss": -20.468143463134766, "global_step": 55291, "epoch": 666} {"train_loss": -20.16892433166504, "global_step": 55292, "epoch": 666} {"train_loss": -20.378896713256836, "global_step": 55293, "epoch": 666} {"train_loss": -20.03553009033203, "global_step": 55294, "epoch": 666} {"train_loss": -19.955202102661133, "global_step": 55295, "epoch": 666} {"train_loss": -20.23088836669922, "global_step": 55296, "epoch": 666} {"train_loss": -20.246437072753906, "global_step": 55297, "epoch": 666} {"train_loss": -20.395719528198242, "global_step": 55298, "epoch": 666} {"train_loss": -20.07184410095215, "global_step": 55299, "epoch": 666} {"train_loss": -20.23964500427246, "global_step": 55300, "epoch": 666} {"train_loss": -20.124271392822266, "global_step": 55301, "epoch": 666} {"train_loss": -20.21531105041504, "global_step": 55302, "epoch": 666} {"train_loss": -19.83170509338379, "global_step": 55303, "epoch": 666} {"train_loss": -20.580062866210938, "global_step": 55304, "epoch": 666} {"train_loss": -20.117263793945312, "global_step": 55305, "epoch": 666} {"train_loss": -20.31804847717285, "global_step": 55306, "epoch": 666} {"train_loss": -20.18328857421875, "global_step": 55307, "epoch": 666} {"train_loss": -20.584125518798828, "global_step": 55308, "epoch": 666} {"train_loss": -20.310781478881836, "global_step": 55309, "epoch": 666} {"train_loss": -19.93845558166504, "global_step": 55310, "epoch": 666} {"train_loss": -20.108165740966797, "global_step": 55311, "epoch": 666} {"train_loss": -20.026371002197266, "global_step": 55312, "epoch": 666} {"train_loss": -20.16302490234375, "global_step": 55313, "epoch": 666} {"train_loss": -20.42025375366211, "global_step": 55314, "epoch": 666} {"train_loss": -20.169347763061523, "global_step": 55315, "epoch": 666} {"train_loss": -20.372785568237305, "global_step": 55316, "epoch": 666} {"train_loss": -20.132871627807617, "global_step": 55317, "epoch": 666} {"train_loss": -20.224103927612305, "global_step": 55318, "epoch": 666} {"train_loss": -19.836881637573242, "global_step": 55319, "epoch": 666} {"train_loss": -19.848529815673828, "global_step": 55320, "epoch": 666} {"train_loss": -19.904987335205078, "global_step": 55321, "epoch": 666} {"train_loss": -19.67264747619629, "global_step": 55322, "epoch": 666} {"train_loss": -20.05483055114746, "global_step": 55323, "epoch": 666} {"train_loss": -20.092500686645508, "global_step": 55324, "epoch": 666} {"train_loss": -19.972272872924805, "global_step": 55325, "epoch": 666} {"train_loss": -20.320714950561523, "global_step": 55326, "epoch": 666} {"train_loss": -20.282367706298828, "global_step": 55327, "epoch": 666} {"train_loss": -20.21034812927246, "global_step": 55328, "epoch": 666} {"train_loss": -20.38263511657715, "global_step": 55329, "epoch": 666} {"train_loss": -19.91937255859375, "global_step": 55330, "epoch": 666} {"train_loss": -20.184499740600586, "global_step": 55331, "epoch": 666} {"train_loss": -20.246326446533203, "global_step": 55332, "epoch": 666} {"train_loss": -20.220748901367188, "global_step": 55333, "epoch": 666} {"train_loss": -20.055456161499023, "global_step": 55334, "epoch": 666} {"train_loss": -20.221099853515625, "global_step": 55335, "epoch": 666} {"train_loss": -20.302099227905273, "global_step": 55336, "epoch": 666} {"train_loss": -20.155248641967773, "global_step": 55337, "epoch": 666} {"train_loss": -20.218679428100586, "global_step": 55338, "epoch": 666} {"train_loss": -20.043663024902344, "global_step": 55339, "epoch": 666} {"train_loss": -20.197969436645508, "global_step": 55340, "epoch": 666} {"train_loss": -19.925745010375977, "global_step": 55341, "epoch": 666} {"train_loss": -20.165145874023438, "global_step": 55342, "epoch": 666} {"train_loss": -20.27021598815918, "global_step": 55343, "epoch": 666} {"train_loss": -20.349145889282227, "global_step": 55344, "epoch": 666} {"train_loss": -20.460840225219727, "global_step": 55345, "epoch": 666} {"train_loss": -20.342649459838867, "global_step": 55346, "epoch": 666} {"train_loss": -19.953596115112305, "global_step": 55347, "epoch": 666} {"train_loss": -20.124799728393555, "global_step": 55348, "epoch": 666} {"train_loss": -20.0076847076416, "global_step": 55349, "epoch": 666} {"train_loss": -20.247222900390625, "global_step": 55350, "epoch": 666} {"train_loss": -20.376371383666992, "global_step": 55351, "epoch": 666} {"train_loss": -20.149755477905273, "global_step": 55352, "epoch": 666} {"train_loss": -19.97357749938965, "global_step": 55353, "epoch": 666} {"train_loss": -20.254674911499023, "global_step": 55354, "epoch": 666} {"train_loss": -20.439603805541992, "global_step": 55355, "epoch": 666} {"train_loss": -20.33837890625, "global_step": 55356, "epoch": 666} {"train_loss": -20.47749900817871, "global_step": 55357, "epoch": 666} {"train_loss": -20.262311935424805, "global_step": 55358, "epoch": 666} {"train_loss": -20.512964248657227, "global_step": 55359, "epoch": 666} {"train_loss": -20.1666208290192, "global_step": 55360, "epoch": 666, "val_loss": 6118084.0} {"train_loss": -19.698312759399414, "global_step": 55361, "epoch": 667} {"train_loss": -19.375696182250977, "global_step": 55362, "epoch": 667} {"train_loss": -20.41294288635254, "global_step": 55363, "epoch": 667} {"train_loss": -19.92353630065918, "global_step": 55364, "epoch": 667} {"train_loss": -20.336517333984375, "global_step": 55365, "epoch": 667} {"train_loss": -20.091873168945312, "global_step": 55366, "epoch": 667} {"train_loss": -20.333433151245117, "global_step": 55367, "epoch": 667} {"train_loss": -20.06891441345215, "global_step": 55368, "epoch": 667} {"train_loss": -20.034093856811523, "global_step": 55369, "epoch": 667} {"train_loss": -20.074432373046875, "global_step": 55370, "epoch": 667} {"train_loss": -20.179141998291016, "global_step": 55371, "epoch": 667} {"train_loss": -20.480295181274414, "global_step": 55372, "epoch": 667} {"train_loss": -20.175519943237305, "global_step": 55373, "epoch": 667} {"train_loss": -20.508516311645508, "global_step": 55374, "epoch": 667} {"train_loss": -20.2611141204834, "global_step": 55375, "epoch": 667} {"train_loss": -20.192707061767578, "global_step": 55376, "epoch": 667} {"train_loss": -19.78073501586914, "global_step": 55377, "epoch": 667} {"train_loss": -19.914886474609375, "global_step": 55378, "epoch": 667} {"train_loss": -19.76902198791504, "global_step": 55379, "epoch": 667} {"train_loss": -19.78159523010254, "global_step": 55380, "epoch": 667} {"train_loss": -19.693464279174805, "global_step": 55381, "epoch": 667} {"train_loss": -20.239341735839844, "global_step": 55382, "epoch": 667} {"train_loss": -20.11320686340332, "global_step": 55383, "epoch": 667} {"train_loss": -19.78110694885254, "global_step": 55384, "epoch": 667} {"train_loss": -20.076169967651367, "global_step": 55385, "epoch": 667} {"train_loss": -20.16863441467285, "global_step": 55386, "epoch": 667} {"train_loss": -20.39127540588379, "global_step": 55387, "epoch": 667} {"train_loss": -20.11280632019043, "global_step": 55388, "epoch": 667} {"train_loss": -19.976974487304688, "global_step": 55389, "epoch": 667} {"train_loss": -20.064374923706055, "global_step": 55390, "epoch": 667} {"train_loss": -19.960708618164062, "global_step": 55391, "epoch": 667} {"train_loss": -19.81296157836914, "global_step": 55392, "epoch": 667} {"train_loss": -20.169628143310547, "global_step": 55393, "epoch": 667} {"train_loss": -20.321035385131836, "global_step": 55394, "epoch": 667} {"train_loss": -20.165454864501953, "global_step": 55395, "epoch": 667} {"train_loss": -20.12251091003418, "global_step": 55396, "epoch": 667} {"train_loss": -20.41117286682129, "global_step": 55397, "epoch": 667} {"train_loss": -20.227216720581055, "global_step": 55398, "epoch": 667} {"train_loss": -19.861976623535156, "global_step": 55399, "epoch": 667} {"train_loss": -20.35767936706543, "global_step": 55400, "epoch": 667} {"train_loss": -20.529794692993164, "global_step": 55401, "epoch": 667} {"train_loss": -20.220136642456055, "global_step": 55402, "epoch": 667} {"train_loss": -20.24677085876465, "global_step": 55403, "epoch": 667} {"train_loss": -20.2685489654541, "global_step": 55404, "epoch": 667} {"train_loss": -20.039306640625, "global_step": 55405, "epoch": 667} {"train_loss": -20.05160903930664, "global_step": 55406, "epoch": 667} {"train_loss": -20.135677337646484, "global_step": 55407, "epoch": 667} {"train_loss": -20.3439998626709, "global_step": 55408, "epoch": 667} {"train_loss": -20.37325096130371, "global_step": 55409, "epoch": 667} {"train_loss": -20.052021026611328, "global_step": 55410, "epoch": 667} {"train_loss": -19.951181411743164, "global_step": 55411, "epoch": 667} {"train_loss": -20.340173721313477, "global_step": 55412, "epoch": 667} {"train_loss": -19.886259078979492, "global_step": 55413, "epoch": 667} {"train_loss": -20.449575424194336, "global_step": 55414, "epoch": 667} {"train_loss": -20.05449676513672, "global_step": 55415, "epoch": 667} {"train_loss": -19.99369239807129, "global_step": 55416, "epoch": 667} {"train_loss": -19.948566436767578, "global_step": 55417, "epoch": 667} {"train_loss": -20.462501525878906, "global_step": 55418, "epoch": 667} {"train_loss": -20.468219757080078, "global_step": 55419, "epoch": 667} {"train_loss": -20.282033920288086, "global_step": 55420, "epoch": 667} {"train_loss": -20.23969841003418, "global_step": 55421, "epoch": 667} {"train_loss": -20.23469352722168, "global_step": 55422, "epoch": 667} {"train_loss": -19.8864688873291, "global_step": 55423, "epoch": 667} {"train_loss": -20.336288452148438, "global_step": 55424, "epoch": 667} {"train_loss": -20.0194091796875, "global_step": 55425, "epoch": 667} {"train_loss": -20.42772102355957, "global_step": 55426, "epoch": 667} {"train_loss": -20.287153244018555, "global_step": 55427, "epoch": 667} {"train_loss": -20.19264793395996, "global_step": 55428, "epoch": 667} {"train_loss": -20.182891845703125, "global_step": 55429, "epoch": 667} {"train_loss": -20.507205963134766, "global_step": 55430, "epoch": 667} {"train_loss": -20.280380249023438, "global_step": 55431, "epoch": 667} {"train_loss": -20.276504516601562, "global_step": 55432, "epoch": 667} {"train_loss": -20.138931274414062, "global_step": 55433, "epoch": 667} {"train_loss": -20.384262084960938, "global_step": 55434, "epoch": 667} {"train_loss": -20.01076316833496, "global_step": 55435, "epoch": 667} {"train_loss": -19.86819839477539, "global_step": 55436, "epoch": 667} {"train_loss": -20.498462677001953, "global_step": 55437, "epoch": 667} {"train_loss": -20.066267013549805, "global_step": 55438, "epoch": 667} {"train_loss": -19.988473892211914, "global_step": 55439, "epoch": 667} {"train_loss": -20.327457427978516, "global_step": 55440, "epoch": 667} {"train_loss": -20.27657127380371, "global_step": 55441, "epoch": 667} {"train_loss": -20.17168426513672, "global_step": 55442, "epoch": 667} {"train_loss": -20.138982979648084, "global_step": 55443, "epoch": 667, "val_loss": 6104880.0} {"train_loss": -19.882068634033203, "global_step": 55444, "epoch": 668} {"train_loss": -19.782913208007812, "global_step": 55445, "epoch": 668} {"train_loss": -20.373685836791992, "global_step": 55446, "epoch": 668} {"train_loss": -20.0198917388916, "global_step": 55447, "epoch": 668} {"train_loss": -19.867111206054688, "global_step": 55448, "epoch": 668} {"train_loss": -20.26287078857422, "global_step": 55449, "epoch": 668} {"train_loss": -19.790386199951172, "global_step": 55450, "epoch": 668} {"train_loss": -20.16657066345215, "global_step": 55451, "epoch": 668} {"train_loss": -20.32697105407715, "global_step": 55452, "epoch": 668} {"train_loss": -20.399030685424805, "global_step": 55453, "epoch": 668} {"train_loss": -19.819242477416992, "global_step": 55454, "epoch": 668} {"train_loss": -19.846336364746094, "global_step": 55455, "epoch": 668} {"train_loss": -19.939077377319336, "global_step": 55456, "epoch": 668} {"train_loss": -19.82877540588379, "global_step": 55457, "epoch": 668} {"train_loss": -19.820363998413086, "global_step": 55458, "epoch": 668} {"train_loss": -20.55179786682129, "global_step": 55459, "epoch": 668} {"train_loss": -20.085172653198242, "global_step": 55460, "epoch": 668} {"train_loss": -20.223485946655273, "global_step": 55461, "epoch": 668} {"train_loss": -19.973501205444336, "global_step": 55462, "epoch": 668} {"train_loss": -20.704898834228516, "global_step": 55463, "epoch": 668} {"train_loss": -20.054275512695312, "global_step": 55464, "epoch": 668} {"train_loss": -20.402376174926758, "global_step": 55465, "epoch": 668} {"train_loss": -19.990997314453125, "global_step": 55466, "epoch": 668} {"train_loss": -20.15865135192871, "global_step": 55467, "epoch": 668} {"train_loss": -20.173490524291992, "global_step": 55468, "epoch": 668} {"train_loss": -19.982412338256836, "global_step": 55469, "epoch": 668} {"train_loss": -20.43596839904785, "global_step": 55470, "epoch": 668} {"train_loss": -20.110300064086914, "global_step": 55471, "epoch": 668} {"train_loss": -20.355316162109375, "global_step": 55472, "epoch": 668} {"train_loss": -20.038909912109375, "global_step": 55473, "epoch": 668} {"train_loss": -20.23257064819336, "global_step": 55474, "epoch": 668} {"train_loss": -20.547805786132812, "global_step": 55475, "epoch": 668} {"train_loss": -19.891799926757812, "global_step": 55476, "epoch": 668} {"train_loss": -20.196247100830078, "global_step": 55477, "epoch": 668} {"train_loss": -19.926523208618164, "global_step": 55478, "epoch": 668} {"train_loss": -20.33407974243164, "global_step": 55479, "epoch": 668} {"train_loss": -20.09834861755371, "global_step": 55480, "epoch": 668} {"train_loss": -20.221881866455078, "global_step": 55481, "epoch": 668} {"train_loss": -20.154815673828125, "global_step": 55482, "epoch": 668} {"train_loss": -20.57255744934082, "global_step": 55483, "epoch": 668} {"train_loss": -20.217716217041016, "global_step": 55484, "epoch": 668} {"train_loss": -20.809173583984375, "global_step": 55485, "epoch": 668} {"train_loss": -20.074647903442383, "global_step": 55486, "epoch": 668} {"train_loss": -20.11429786682129, "global_step": 55487, "epoch": 668} {"train_loss": -20.40065574645996, "global_step": 55488, "epoch": 668} {"train_loss": -20.38140296936035, "global_step": 55489, "epoch": 668} {"train_loss": -20.1915225982666, "global_step": 55490, "epoch": 668} {"train_loss": -19.791196823120117, "global_step": 55491, "epoch": 668} {"train_loss": -19.807260513305664, "global_step": 55492, "epoch": 668} {"train_loss": -20.460508346557617, "global_step": 55493, "epoch": 668} {"train_loss": -19.93058204650879, "global_step": 55494, "epoch": 668} {"train_loss": -20.31168556213379, "global_step": 55495, "epoch": 668} {"train_loss": -20.212839126586914, "global_step": 55496, "epoch": 668} {"train_loss": -20.206811904907227, "global_step": 55497, "epoch": 668} {"train_loss": -19.932647705078125, "global_step": 55498, "epoch": 668} {"train_loss": -20.155385971069336, "global_step": 55499, "epoch": 668} {"train_loss": -19.997020721435547, "global_step": 55500, "epoch": 668} {"train_loss": -20.110702514648438, "global_step": 55501, "epoch": 668} {"train_loss": -20.1353816986084, "global_step": 55502, "epoch": 668} {"train_loss": -20.41035270690918, "global_step": 55503, "epoch": 668} {"train_loss": -20.203195571899414, "global_step": 55504, "epoch": 668} {"train_loss": -20.321317672729492, "global_step": 55505, "epoch": 668} {"train_loss": -20.175344467163086, "global_step": 55506, "epoch": 668} {"train_loss": -20.144168853759766, "global_step": 55507, "epoch": 668} {"train_loss": -20.027143478393555, "global_step": 55508, "epoch": 668} {"train_loss": -19.829437255859375, "global_step": 55509, "epoch": 668} {"train_loss": -20.133193969726562, "global_step": 55510, "epoch": 668} {"train_loss": -20.037099838256836, "global_step": 55511, "epoch": 668} {"train_loss": -20.437423706054688, "global_step": 55512, "epoch": 668} {"train_loss": -20.630659103393555, "global_step": 55513, "epoch": 668} {"train_loss": -20.305932998657227, "global_step": 55514, "epoch": 668} {"train_loss": -20.42325210571289, "global_step": 55515, "epoch": 668} {"train_loss": -20.575008392333984, "global_step": 55516, "epoch": 668} {"train_loss": -20.065126419067383, "global_step": 55517, "epoch": 668} {"train_loss": -20.037479400634766, "global_step": 55518, "epoch": 668} {"train_loss": -20.554981231689453, "global_step": 55519, "epoch": 668} {"train_loss": -20.60962677001953, "global_step": 55520, "epoch": 668} {"train_loss": -20.231565475463867, "global_step": 55521, "epoch": 668} {"train_loss": -20.143888473510742, "global_step": 55522, "epoch": 668} {"train_loss": -20.30488395690918, "global_step": 55523, "epoch": 668} {"train_loss": -20.06168556213379, "global_step": 55524, "epoch": 668} {"train_loss": -19.914249420166016, "global_step": 55525, "epoch": 668} {"train_loss": -20.187136178993317, "global_step": 55526, "epoch": 668, "val_loss": 5952146.5} {"train_loss": -19.652753829956055, "global_step": 55527, "epoch": 669} {"train_loss": -20.086597442626953, "global_step": 55528, "epoch": 669} {"train_loss": -19.89934539794922, "global_step": 55529, "epoch": 669} {"train_loss": -19.89482879638672, "global_step": 55530, "epoch": 669} {"train_loss": -19.458616256713867, "global_step": 55531, "epoch": 669} {"train_loss": -20.21965980529785, "global_step": 55532, "epoch": 669} {"train_loss": -19.635122299194336, "global_step": 55533, "epoch": 669} {"train_loss": -19.720867156982422, "global_step": 55534, "epoch": 669} {"train_loss": -19.99155044555664, "global_step": 55535, "epoch": 669} {"train_loss": -19.691089630126953, "global_step": 55536, "epoch": 669} {"train_loss": -19.91225242614746, "global_step": 55537, "epoch": 669} {"train_loss": -19.982643127441406, "global_step": 55538, "epoch": 669} {"train_loss": -19.9164981842041, "global_step": 55539, "epoch": 669} {"train_loss": -20.100255966186523, "global_step": 55540, "epoch": 669} {"train_loss": -19.997102737426758, "global_step": 55541, "epoch": 669} {"train_loss": -19.935009002685547, "global_step": 55542, "epoch": 669} {"train_loss": -19.90810203552246, "global_step": 55543, "epoch": 669} {"train_loss": -20.260717391967773, "global_step": 55544, "epoch": 669} {"train_loss": -19.836959838867188, "global_step": 55545, "epoch": 669} {"train_loss": -20.007328033447266, "global_step": 55546, "epoch": 669} {"train_loss": -20.530187606811523, "global_step": 55547, "epoch": 669} {"train_loss": -20.133962631225586, "global_step": 55548, "epoch": 669} {"train_loss": -20.113779067993164, "global_step": 55549, "epoch": 669} {"train_loss": -20.14312744140625, "global_step": 55550, "epoch": 669} {"train_loss": -20.29062843322754, "global_step": 55551, "epoch": 669} {"train_loss": -20.064416885375977, "global_step": 55552, "epoch": 669} {"train_loss": -20.183551788330078, "global_step": 55553, "epoch": 669} {"train_loss": -20.358530044555664, "global_step": 55554, "epoch": 669} {"train_loss": -20.19805335998535, "global_step": 55555, "epoch": 669} {"train_loss": -20.17793846130371, "global_step": 55556, "epoch": 669} {"train_loss": -19.835391998291016, "global_step": 55557, "epoch": 669} {"train_loss": -19.813955307006836, "global_step": 55558, "epoch": 669} {"train_loss": -20.225234985351562, "global_step": 55559, "epoch": 669} {"train_loss": -20.320556640625, "global_step": 55560, "epoch": 669} {"train_loss": -19.976171493530273, "global_step": 55561, "epoch": 669} {"train_loss": -19.862340927124023, "global_step": 55562, "epoch": 669} {"train_loss": -20.010665893554688, "global_step": 55563, "epoch": 669} {"train_loss": -20.02023696899414, "global_step": 55564, "epoch": 669} {"train_loss": -20.010162353515625, "global_step": 55565, "epoch": 669} {"train_loss": -20.370620727539062, "global_step": 55566, "epoch": 669} {"train_loss": -19.973676681518555, "global_step": 55567, "epoch": 669} {"train_loss": -20.14841651916504, "global_step": 55568, "epoch": 669} {"train_loss": -20.12139129638672, "global_step": 55569, "epoch": 669} {"train_loss": -19.949241638183594, "global_step": 55570, "epoch": 669} {"train_loss": -20.24970817565918, "global_step": 55571, "epoch": 669} {"train_loss": -20.24933433532715, "global_step": 55572, "epoch": 669} {"train_loss": -20.12776756286621, "global_step": 55573, "epoch": 669} {"train_loss": -19.966976165771484, "global_step": 55574, "epoch": 669} {"train_loss": -20.17548179626465, "global_step": 55575, "epoch": 669} {"train_loss": -19.960433959960938, "global_step": 55576, "epoch": 669} {"train_loss": -19.776742935180664, "global_step": 55577, "epoch": 669} {"train_loss": -20.256912231445312, "global_step": 55578, "epoch": 669} {"train_loss": -19.969013214111328, "global_step": 55579, "epoch": 669} {"train_loss": -20.29534339904785, "global_step": 55580, "epoch": 669} {"train_loss": -20.000730514526367, "global_step": 55581, "epoch": 669} {"train_loss": -20.406070709228516, "global_step": 55582, "epoch": 669} {"train_loss": -20.3927001953125, "global_step": 55583, "epoch": 669} {"train_loss": -20.25172996520996, "global_step": 55584, "epoch": 669} {"train_loss": -20.119482040405273, "global_step": 55585, "epoch": 669} {"train_loss": -20.112863540649414, "global_step": 55586, "epoch": 669} {"train_loss": -20.303598403930664, "global_step": 55587, "epoch": 669} {"train_loss": -20.345373153686523, "global_step": 55588, "epoch": 669} {"train_loss": -20.28123664855957, "global_step": 55589, "epoch": 669} {"train_loss": -20.536725997924805, "global_step": 55590, "epoch": 669} {"train_loss": -20.26103401184082, "global_step": 55591, "epoch": 669} {"train_loss": -20.176504135131836, "global_step": 55592, "epoch": 669} {"train_loss": -20.381383895874023, "global_step": 55593, "epoch": 669} {"train_loss": -19.881683349609375, "global_step": 55594, "epoch": 669} {"train_loss": -20.227909088134766, "global_step": 55595, "epoch": 669} {"train_loss": -20.02583122253418, "global_step": 55596, "epoch": 669} {"train_loss": -20.153409957885742, "global_step": 55597, "epoch": 669} {"train_loss": -20.10552978515625, "global_step": 55598, "epoch": 669} {"train_loss": -20.346616744995117, "global_step": 55599, "epoch": 669} {"train_loss": -20.26460838317871, "global_step": 55600, "epoch": 669} {"train_loss": -20.28315544128418, "global_step": 55601, "epoch": 669} {"train_loss": -20.329429626464844, "global_step": 55602, "epoch": 669} {"train_loss": -20.56021499633789, "global_step": 55603, "epoch": 669} {"train_loss": -20.407333374023438, "global_step": 55604, "epoch": 669} {"train_loss": -20.15610694885254, "global_step": 55605, "epoch": 669} {"train_loss": -19.875368118286133, "global_step": 55606, "epoch": 669} {"train_loss": -20.232379913330078, "global_step": 55607, "epoch": 669} {"train_loss": -20.28909683227539, "global_step": 55608, "epoch": 669} {"train_loss": -20.110741511884942, "global_step": 55609, "epoch": 669, "val_loss": 6079062.5} {"train_loss": -19.81501579284668, "global_step": 55610, "epoch": 670} {"train_loss": -20.404584884643555, "global_step": 55611, "epoch": 670} {"train_loss": -19.7705135345459, "global_step": 55612, "epoch": 670} {"train_loss": -20.145071029663086, "global_step": 55613, "epoch": 670} {"train_loss": -20.365991592407227, "global_step": 55614, "epoch": 670} {"train_loss": -20.177682876586914, "global_step": 55615, "epoch": 670} {"train_loss": -19.590484619140625, "global_step": 55616, "epoch": 670} {"train_loss": -19.796743392944336, "global_step": 55617, "epoch": 670} {"train_loss": -19.999469757080078, "global_step": 55618, "epoch": 670} {"train_loss": -20.04817008972168, "global_step": 55619, "epoch": 670} {"train_loss": -20.299528121948242, "global_step": 55620, "epoch": 670} {"train_loss": -19.762035369873047, "global_step": 55621, "epoch": 670} {"train_loss": -20.30672264099121, "global_step": 55622, "epoch": 670} {"train_loss": -20.127714157104492, "global_step": 55623, "epoch": 670} {"train_loss": -20.380352020263672, "global_step": 55624, "epoch": 670} {"train_loss": -20.001384735107422, "global_step": 55625, "epoch": 670} {"train_loss": -20.119375228881836, "global_step": 55626, "epoch": 670} {"train_loss": -19.933889389038086, "global_step": 55627, "epoch": 670} {"train_loss": -20.151676177978516, "global_step": 55628, "epoch": 670} {"train_loss": -20.14749526977539, "global_step": 55629, "epoch": 670} {"train_loss": -20.53375816345215, "global_step": 55630, "epoch": 670} {"train_loss": -20.148801803588867, "global_step": 55631, "epoch": 670} {"train_loss": -19.822656631469727, "global_step": 55632, "epoch": 670} {"train_loss": -19.93682098388672, "global_step": 55633, "epoch": 670} {"train_loss": -20.364334106445312, "global_step": 55634, "epoch": 670} {"train_loss": -20.36270523071289, "global_step": 55635, "epoch": 670} {"train_loss": -20.246240615844727, "global_step": 55636, "epoch": 670} {"train_loss": -19.878822326660156, "global_step": 55637, "epoch": 670} {"train_loss": -20.266860961914062, "global_step": 55638, "epoch": 670} {"train_loss": -20.35881996154785, "global_step": 55639, "epoch": 670} {"train_loss": -20.211977005004883, "global_step": 55640, "epoch": 670} {"train_loss": -20.37935447692871, "global_step": 55641, "epoch": 670} {"train_loss": -20.165231704711914, "global_step": 55642, "epoch": 670} {"train_loss": -20.337940216064453, "global_step": 55643, "epoch": 670} {"train_loss": -20.368942260742188, "global_step": 55644, "epoch": 670} {"train_loss": -20.256946563720703, "global_step": 55645, "epoch": 670} {"train_loss": -20.053712844848633, "global_step": 55646, "epoch": 670} {"train_loss": -20.51104164123535, "global_step": 55647, "epoch": 670} {"train_loss": -19.88838768005371, "global_step": 55648, "epoch": 670} {"train_loss": -20.12032127380371, "global_step": 55649, "epoch": 670} {"train_loss": -19.754016876220703, "global_step": 55650, "epoch": 670} {"train_loss": -20.214780807495117, "global_step": 55651, "epoch": 670} {"train_loss": -20.01021385192871, "global_step": 55652, "epoch": 670} {"train_loss": -20.748334884643555, "global_step": 55653, "epoch": 670} {"train_loss": -20.522626876831055, "global_step": 55654, "epoch": 670} {"train_loss": -20.32573890686035, "global_step": 55655, "epoch": 670} {"train_loss": -20.11574363708496, "global_step": 55656, "epoch": 670} {"train_loss": -20.176130294799805, "global_step": 55657, "epoch": 670} {"train_loss": -20.17433738708496, "global_step": 55658, "epoch": 670} {"train_loss": -20.693649291992188, "global_step": 55659, "epoch": 670} {"train_loss": -19.89084815979004, "global_step": 55660, "epoch": 670} {"train_loss": -20.13262367248535, "global_step": 55661, "epoch": 670} {"train_loss": -20.03923797607422, "global_step": 55662, "epoch": 670} {"train_loss": -20.09323501586914, "global_step": 55663, "epoch": 670} {"train_loss": -19.639942169189453, "global_step": 55664, "epoch": 670} {"train_loss": -20.388507843017578, "global_step": 55665, "epoch": 670} {"train_loss": -20.075468063354492, "global_step": 55666, "epoch": 670} {"train_loss": -20.586767196655273, "global_step": 55667, "epoch": 670} {"train_loss": -19.968236923217773, "global_step": 55668, "epoch": 670} {"train_loss": -20.19649314880371, "global_step": 55669, "epoch": 670} {"train_loss": -20.038480758666992, "global_step": 55670, "epoch": 670} {"train_loss": -20.442659378051758, "global_step": 55671, "epoch": 670} {"train_loss": -20.386560440063477, "global_step": 55672, "epoch": 670} {"train_loss": -20.75712013244629, "global_step": 55673, "epoch": 670} {"train_loss": -19.871633529663086, "global_step": 55674, "epoch": 670} {"train_loss": -19.958892822265625, "global_step": 55675, "epoch": 670} {"train_loss": -20.20441436767578, "global_step": 55676, "epoch": 670} {"train_loss": -20.385770797729492, "global_step": 55677, "epoch": 670} {"train_loss": -20.092910766601562, "global_step": 55678, "epoch": 670} {"train_loss": -20.303977966308594, "global_step": 55679, "epoch": 670} {"train_loss": -19.995330810546875, "global_step": 55680, "epoch": 670} {"train_loss": -20.475278854370117, "global_step": 55681, "epoch": 670} {"train_loss": -20.232757568359375, "global_step": 55682, "epoch": 670} {"train_loss": -20.197324752807617, "global_step": 55683, "epoch": 670} {"train_loss": -20.357437133789062, "global_step": 55684, "epoch": 670} {"train_loss": -20.03767204284668, "global_step": 55685, "epoch": 670} {"train_loss": -20.248929977416992, "global_step": 55686, "epoch": 670} {"train_loss": -20.20137596130371, "global_step": 55687, "epoch": 670} {"train_loss": -20.32087516784668, "global_step": 55688, "epoch": 670} {"train_loss": -20.212757110595703, "global_step": 55689, "epoch": 670} {"train_loss": -20.597715377807617, "global_step": 55690, "epoch": 670} {"train_loss": -20.09634780883789, "global_step": 55691, "epoch": 670} {"train_loss": -20.176314089671674, "global_step": 55692, "epoch": 670, "val_loss": 6047459.0} {"train_loss": -19.501712799072266, "global_step": 55693, "epoch": 671} {"train_loss": -19.889022827148438, "global_step": 55694, "epoch": 671} {"train_loss": -19.614017486572266, "global_step": 55695, "epoch": 671} {"train_loss": -19.924348831176758, "global_step": 55696, "epoch": 671} {"train_loss": -19.870197296142578, "global_step": 55697, "epoch": 671} {"train_loss": -20.224180221557617, "global_step": 55698, "epoch": 671} {"train_loss": -20.114538192749023, "global_step": 55699, "epoch": 671} {"train_loss": -19.968921661376953, "global_step": 55700, "epoch": 671} {"train_loss": -20.132064819335938, "global_step": 55701, "epoch": 671} {"train_loss": -19.64697265625, "global_step": 55702, "epoch": 671} {"train_loss": -19.729944229125977, "global_step": 55703, "epoch": 671} {"train_loss": -20.044675827026367, "global_step": 55704, "epoch": 671} {"train_loss": -19.93424415588379, "global_step": 55705, "epoch": 671} {"train_loss": -19.82684898376465, "global_step": 55706, "epoch": 671} {"train_loss": -19.985280990600586, "global_step": 55707, "epoch": 671} {"train_loss": -20.22707176208496, "global_step": 55708, "epoch": 671} {"train_loss": -20.09041404724121, "global_step": 55709, "epoch": 671} {"train_loss": -20.286161422729492, "global_step": 55710, "epoch": 671} {"train_loss": -20.052799224853516, "global_step": 55711, "epoch": 671} {"train_loss": -20.094572067260742, "global_step": 55712, "epoch": 671} {"train_loss": -20.33741569519043, "global_step": 55713, "epoch": 671} {"train_loss": -20.370481491088867, "global_step": 55714, "epoch": 671} {"train_loss": -20.262454986572266, "global_step": 55715, "epoch": 671} {"train_loss": -19.9228458404541, "global_step": 55716, "epoch": 671} {"train_loss": -19.893508911132812, "global_step": 55717, "epoch": 671} {"train_loss": -20.39670753479004, "global_step": 55718, "epoch": 671} {"train_loss": -20.114421844482422, "global_step": 55719, "epoch": 671} {"train_loss": -19.962234497070312, "global_step": 55720, "epoch": 671} {"train_loss": -20.124683380126953, "global_step": 55721, "epoch": 671} {"train_loss": -20.42730140686035, "global_step": 55722, "epoch": 671} {"train_loss": -20.001066207885742, "global_step": 55723, "epoch": 671} {"train_loss": -20.189401626586914, "global_step": 55724, "epoch": 671} {"train_loss": -20.055892944335938, "global_step": 55725, "epoch": 671} {"train_loss": -20.444782257080078, "global_step": 55726, "epoch": 671} {"train_loss": -19.976346969604492, "global_step": 55727, "epoch": 671} {"train_loss": -20.23405647277832, "global_step": 55728, "epoch": 671} {"train_loss": -20.32571792602539, "global_step": 55729, "epoch": 671} {"train_loss": -19.93535804748535, "global_step": 55730, "epoch": 671} {"train_loss": -20.315481185913086, "global_step": 55731, "epoch": 671} {"train_loss": -19.961563110351562, "global_step": 55732, "epoch": 671} {"train_loss": -20.355756759643555, "global_step": 55733, "epoch": 671} {"train_loss": -20.08517837524414, "global_step": 55734, "epoch": 671} {"train_loss": -19.980926513671875, "global_step": 55735, "epoch": 671} {"train_loss": -20.328664779663086, "global_step": 55736, "epoch": 671} {"train_loss": -20.18075180053711, "global_step": 55737, "epoch": 671} {"train_loss": -20.209150314331055, "global_step": 55738, "epoch": 671} {"train_loss": -20.023656845092773, "global_step": 55739, "epoch": 671} {"train_loss": -20.266218185424805, "global_step": 55740, "epoch": 671} {"train_loss": -20.367767333984375, "global_step": 55741, "epoch": 671} {"train_loss": -20.37037467956543, "global_step": 55742, "epoch": 671} {"train_loss": -20.01826286315918, "global_step": 55743, "epoch": 671} {"train_loss": -20.556135177612305, "global_step": 55744, "epoch": 671} {"train_loss": -20.297937393188477, "global_step": 55745, "epoch": 671} {"train_loss": -20.140478134155273, "global_step": 55746, "epoch": 671} {"train_loss": -20.180057525634766, "global_step": 55747, "epoch": 671} {"train_loss": -20.222469329833984, "global_step": 55748, "epoch": 671} {"train_loss": -20.196969985961914, "global_step": 55749, "epoch": 671} {"train_loss": -20.093502044677734, "global_step": 55750, "epoch": 671} {"train_loss": -20.213504791259766, "global_step": 55751, "epoch": 671} {"train_loss": -20.207181930541992, "global_step": 55752, "epoch": 671} {"train_loss": -19.848907470703125, "global_step": 55753, "epoch": 671} {"train_loss": -20.442445755004883, "global_step": 55754, "epoch": 671} {"train_loss": -20.077489852905273, "global_step": 55755, "epoch": 671} {"train_loss": -20.113239288330078, "global_step": 55756, "epoch": 671} {"train_loss": -20.439035415649414, "global_step": 55757, "epoch": 671} {"train_loss": -20.556564331054688, "global_step": 55758, "epoch": 671} {"train_loss": -20.14569664001465, "global_step": 55759, "epoch": 671} {"train_loss": -20.504608154296875, "global_step": 55760, "epoch": 671} {"train_loss": -20.21785545349121, "global_step": 55761, "epoch": 671} {"train_loss": -20.113798141479492, "global_step": 55762, "epoch": 671} {"train_loss": -20.26007652282715, "global_step": 55763, "epoch": 671} {"train_loss": -20.177305221557617, "global_step": 55764, "epoch": 671} {"train_loss": -20.016637802124023, "global_step": 55765, "epoch": 671} {"train_loss": -20.596450805664062, "global_step": 55766, "epoch": 671} {"train_loss": -20.40694808959961, "global_step": 55767, "epoch": 671} {"train_loss": -19.994915008544922, "global_step": 55768, "epoch": 671} {"train_loss": -20.035110473632812, "global_step": 55769, "epoch": 671} {"train_loss": -20.018156051635742, "global_step": 55770, "epoch": 671} {"train_loss": -20.136932373046875, "global_step": 55771, "epoch": 671} {"train_loss": -20.216005325317383, "global_step": 55772, "epoch": 671} {"train_loss": -20.32979393005371, "global_step": 55773, "epoch": 671} {"train_loss": -20.10910987854004, "global_step": 55774, "epoch": 671} {"train_loss": -20.158786842621954, "global_step": 55775, "epoch": 671, "val_loss": 5925952.5} {"train_loss": -19.9747257232666, "global_step": 55776, "epoch": 672} {"train_loss": -19.774988174438477, "global_step": 55777, "epoch": 672} {"train_loss": -19.642223358154297, "global_step": 55778, "epoch": 672} {"train_loss": -19.701791763305664, "global_step": 55779, "epoch": 672} {"train_loss": -19.725263595581055, "global_step": 55780, "epoch": 672} {"train_loss": -19.965469360351562, "global_step": 55781, "epoch": 672} {"train_loss": -20.119688034057617, "global_step": 55782, "epoch": 672} {"train_loss": -20.091205596923828, "global_step": 55783, "epoch": 672} {"train_loss": -19.606990814208984, "global_step": 55784, "epoch": 672} {"train_loss": -19.93574333190918, "global_step": 55785, "epoch": 672} {"train_loss": -20.147504806518555, "global_step": 55786, "epoch": 672} {"train_loss": -19.784120559692383, "global_step": 55787, "epoch": 672} {"train_loss": -19.65772819519043, "global_step": 55788, "epoch": 672} {"train_loss": -19.43967628479004, "global_step": 55789, "epoch": 672} {"train_loss": -20.323713302612305, "global_step": 55790, "epoch": 672} {"train_loss": -20.273557662963867, "global_step": 55791, "epoch": 672} {"train_loss": -20.148895263671875, "global_step": 55792, "epoch": 672} {"train_loss": -20.023056030273438, "global_step": 55793, "epoch": 672} {"train_loss": -19.991697311401367, "global_step": 55794, "epoch": 672} {"train_loss": -19.973230361938477, "global_step": 55795, "epoch": 672} {"train_loss": -19.944740295410156, "global_step": 55796, "epoch": 672} {"train_loss": -20.421850204467773, "global_step": 55797, "epoch": 672} {"train_loss": -20.260419845581055, "global_step": 55798, "epoch": 672} {"train_loss": -19.874454498291016, "global_step": 55799, "epoch": 672} {"train_loss": -20.173049926757812, "global_step": 55800, "epoch": 672} {"train_loss": -20.111387252807617, "global_step": 55801, "epoch": 672} {"train_loss": -19.764856338500977, "global_step": 55802, "epoch": 672} {"train_loss": -20.1549072265625, "global_step": 55803, "epoch": 672} {"train_loss": -20.211965560913086, "global_step": 55804, "epoch": 672} {"train_loss": -20.133413314819336, "global_step": 55805, "epoch": 672} {"train_loss": -19.976070404052734, "global_step": 55806, "epoch": 672} {"train_loss": -20.22611427307129, "global_step": 55807, "epoch": 672} {"train_loss": -20.047889709472656, "global_step": 55808, "epoch": 672} {"train_loss": -20.073041915893555, "global_step": 55809, "epoch": 672} {"train_loss": -20.076047897338867, "global_step": 55810, "epoch": 672} {"train_loss": -20.10158348083496, "global_step": 55811, "epoch": 672} {"train_loss": -20.571434020996094, "global_step": 55812, "epoch": 672} {"train_loss": -20.23841667175293, "global_step": 55813, "epoch": 672} {"train_loss": -20.0643310546875, "global_step": 55814, "epoch": 672} {"train_loss": -20.103168487548828, "global_step": 55815, "epoch": 672} {"train_loss": -20.369583129882812, "global_step": 55816, "epoch": 672} {"train_loss": -20.34698486328125, "global_step": 55817, "epoch": 672} {"train_loss": -19.96013832092285, "global_step": 55818, "epoch": 672} {"train_loss": -20.31656837463379, "global_step": 55819, "epoch": 672} {"train_loss": -20.29147720336914, "global_step": 55820, "epoch": 672} {"train_loss": -20.178714752197266, "global_step": 55821, "epoch": 672} {"train_loss": -20.202953338623047, "global_step": 55822, "epoch": 672} {"train_loss": -20.188308715820312, "global_step": 55823, "epoch": 672} {"train_loss": -20.579946517944336, "global_step": 55824, "epoch": 672} {"train_loss": -20.491016387939453, "global_step": 55825, "epoch": 672} {"train_loss": -19.94556999206543, "global_step": 55826, "epoch": 672} {"train_loss": -20.30360984802246, "global_step": 55827, "epoch": 672} {"train_loss": -19.805288314819336, "global_step": 55828, "epoch": 672} {"train_loss": -20.422269821166992, "global_step": 55829, "epoch": 672} {"train_loss": -20.631567001342773, "global_step": 55830, "epoch": 672} {"train_loss": -19.939899444580078, "global_step": 55831, "epoch": 672} {"train_loss": -20.36799430847168, "global_step": 55832, "epoch": 672} {"train_loss": -20.063074111938477, "global_step": 55833, "epoch": 672} {"train_loss": -20.027376174926758, "global_step": 55834, "epoch": 672} {"train_loss": -20.202281951904297, "global_step": 55835, "epoch": 672} {"train_loss": -20.063749313354492, "global_step": 55836, "epoch": 672} {"train_loss": -20.093875885009766, "global_step": 55837, "epoch": 672} {"train_loss": -20.262100219726562, "global_step": 55838, "epoch": 672} {"train_loss": -19.84194564819336, "global_step": 55839, "epoch": 672} {"train_loss": -20.192062377929688, "global_step": 55840, "epoch": 672} {"train_loss": -20.184988021850586, "global_step": 55841, "epoch": 672} {"train_loss": -20.10517692565918, "global_step": 55842, "epoch": 672} {"train_loss": -20.0489444732666, "global_step": 55843, "epoch": 672} {"train_loss": -20.153165817260742, "global_step": 55844, "epoch": 672} {"train_loss": -19.86649513244629, "global_step": 55845, "epoch": 672} {"train_loss": -20.42576026916504, "global_step": 55846, "epoch": 672} {"train_loss": -20.424070358276367, "global_step": 55847, "epoch": 672} {"train_loss": -20.356990814208984, "global_step": 55848, "epoch": 672} {"train_loss": -20.061975479125977, "global_step": 55849, "epoch": 672} {"train_loss": -20.156869888305664, "global_step": 55850, "epoch": 672} {"train_loss": -20.393264770507812, "global_step": 55851, "epoch": 672} {"train_loss": -20.441091537475586, "global_step": 55852, "epoch": 672} {"train_loss": -20.029882431030273, "global_step": 55853, "epoch": 672} {"train_loss": -20.27760124206543, "global_step": 55854, "epoch": 672} {"train_loss": -20.26981544494629, "global_step": 55855, "epoch": 672} {"train_loss": -20.361228942871094, "global_step": 55856, "epoch": 672} {"train_loss": -20.271482467651367, "global_step": 55857, "epoch": 672} {"train_loss": -20.089618085378625, "global_step": 55858, "epoch": 672, "val_loss": 6050325.0} {"train_loss": -19.395721435546875, "global_step": 55859, "epoch": 673} {"train_loss": -19.435129165649414, "global_step": 55860, "epoch": 673} {"train_loss": -19.81594467163086, "global_step": 55861, "epoch": 673} {"train_loss": -19.72650146484375, "global_step": 55862, "epoch": 673} {"train_loss": -19.565101623535156, "global_step": 55863, "epoch": 673} {"train_loss": -20.018075942993164, "global_step": 55864, "epoch": 673} {"train_loss": -20.184167861938477, "global_step": 55865, "epoch": 673} {"train_loss": -20.237516403198242, "global_step": 55866, "epoch": 673} {"train_loss": -19.612470626831055, "global_step": 55867, "epoch": 673} {"train_loss": -19.603269577026367, "global_step": 55868, "epoch": 673} {"train_loss": -20.10071563720703, "global_step": 55869, "epoch": 673} {"train_loss": -19.434921264648438, "global_step": 55870, "epoch": 673} {"train_loss": -20.017135620117188, "global_step": 55871, "epoch": 673} {"train_loss": -19.903470993041992, "global_step": 55872, "epoch": 673} {"train_loss": -19.929330825805664, "global_step": 55873, "epoch": 673} {"train_loss": -19.75404930114746, "global_step": 55874, "epoch": 673} {"train_loss": -20.093759536743164, "global_step": 55875, "epoch": 673} {"train_loss": -20.303930282592773, "global_step": 55876, "epoch": 673} {"train_loss": -20.242069244384766, "global_step": 55877, "epoch": 673} {"train_loss": -20.00516128540039, "global_step": 55878, "epoch": 673} {"train_loss": -20.571155548095703, "global_step": 55879, "epoch": 673} {"train_loss": -20.023788452148438, "global_step": 55880, "epoch": 673} {"train_loss": -19.734344482421875, "global_step": 55881, "epoch": 673} {"train_loss": -20.227426528930664, "global_step": 55882, "epoch": 673} {"train_loss": -19.976083755493164, "global_step": 55883, "epoch": 673} {"train_loss": -20.261945724487305, "global_step": 55884, "epoch": 673} {"train_loss": -20.002334594726562, "global_step": 55885, "epoch": 673} {"train_loss": -20.485136032104492, "global_step": 55886, "epoch": 673} {"train_loss": -19.94742774963379, "global_step": 55887, "epoch": 673} {"train_loss": -20.462936401367188, "global_step": 55888, "epoch": 673} {"train_loss": -20.049232482910156, "global_step": 55889, "epoch": 673} {"train_loss": -20.184358596801758, "global_step": 55890, "epoch": 673} {"train_loss": -19.76496124267578, "global_step": 55891, "epoch": 673} {"train_loss": -20.26502799987793, "global_step": 55892, "epoch": 673} {"train_loss": -20.19092559814453, "global_step": 55893, "epoch": 673} {"train_loss": -19.548065185546875, "global_step": 55894, "epoch": 673} {"train_loss": -19.99912452697754, "global_step": 55895, "epoch": 673} {"train_loss": -20.015607833862305, "global_step": 55896, "epoch": 673} {"train_loss": -20.185962677001953, "global_step": 55897, "epoch": 673} {"train_loss": -20.593154907226562, "global_step": 55898, "epoch": 673} {"train_loss": -20.330549240112305, "global_step": 55899, "epoch": 673} {"train_loss": -20.170608520507812, "global_step": 55900, "epoch": 673} {"train_loss": -20.139570236206055, "global_step": 55901, "epoch": 673} {"train_loss": -20.121313095092773, "global_step": 55902, "epoch": 673} {"train_loss": -20.0130672454834, "global_step": 55903, "epoch": 673} {"train_loss": -20.30768394470215, "global_step": 55904, "epoch": 673} {"train_loss": -20.101585388183594, "global_step": 55905, "epoch": 673} {"train_loss": -20.19131088256836, "global_step": 55906, "epoch": 673} {"train_loss": -20.106666564941406, "global_step": 55907, "epoch": 673} {"train_loss": -20.221948623657227, "global_step": 55908, "epoch": 673} {"train_loss": -20.33770751953125, "global_step": 55909, "epoch": 673} {"train_loss": -20.37210464477539, "global_step": 55910, "epoch": 673} {"train_loss": -19.893661499023438, "global_step": 55911, "epoch": 673} {"train_loss": -20.46713638305664, "global_step": 55912, "epoch": 673} {"train_loss": -20.604589462280273, "global_step": 55913, "epoch": 673} {"train_loss": -20.311059951782227, "global_step": 55914, "epoch": 673} {"train_loss": -20.645776748657227, "global_step": 55915, "epoch": 673} {"train_loss": -20.249881744384766, "global_step": 55916, "epoch": 673} {"train_loss": -20.206998825073242, "global_step": 55917, "epoch": 673} {"train_loss": -20.516889572143555, "global_step": 55918, "epoch": 673} {"train_loss": -20.201826095581055, "global_step": 55919, "epoch": 673} {"train_loss": -20.327045440673828, "global_step": 55920, "epoch": 673} {"train_loss": -20.758939743041992, "global_step": 55921, "epoch": 673} {"train_loss": -20.345535278320312, "global_step": 55922, "epoch": 673} {"train_loss": -20.4450626373291, "global_step": 55923, "epoch": 673} {"train_loss": -20.20086669921875, "global_step": 55924, "epoch": 673} {"train_loss": -20.01150894165039, "global_step": 55925, "epoch": 673} {"train_loss": -20.363981246948242, "global_step": 55926, "epoch": 673} {"train_loss": -20.15771484375, "global_step": 55927, "epoch": 673} {"train_loss": -20.648202896118164, "global_step": 55928, "epoch": 673} {"train_loss": -20.226337432861328, "global_step": 55929, "epoch": 673} {"train_loss": -20.137401580810547, "global_step": 55930, "epoch": 673} {"train_loss": -20.386993408203125, "global_step": 55931, "epoch": 673} {"train_loss": -19.88886070251465, "global_step": 55932, "epoch": 673} {"train_loss": -20.319717407226562, "global_step": 55933, "epoch": 673} {"train_loss": -20.6004581451416, "global_step": 55934, "epoch": 673} {"train_loss": -20.09189224243164, "global_step": 55935, "epoch": 673} {"train_loss": -19.839176177978516, "global_step": 55936, "epoch": 673} {"train_loss": -20.22064781188965, "global_step": 55937, "epoch": 673} {"train_loss": -20.22597312927246, "global_step": 55938, "epoch": 673} {"train_loss": -20.22511863708496, "global_step": 55939, "epoch": 673} {"train_loss": -20.306970596313477, "global_step": 55940, "epoch": 673} {"train_loss": -20.1365187311747, "global_step": 55941, "epoch": 673, "val_loss": 6134806.0} {"train_loss": -19.992605209350586, "global_step": 55942, "epoch": 674} {"train_loss": -20.068052291870117, "global_step": 55943, "epoch": 674} {"train_loss": -19.882841110229492, "global_step": 55944, "epoch": 674} {"train_loss": -20.04330825805664, "global_step": 55945, "epoch": 674} {"train_loss": -19.694141387939453, "global_step": 55946, "epoch": 674} {"train_loss": -20.062747955322266, "global_step": 55947, "epoch": 674} {"train_loss": -20.031946182250977, "global_step": 55948, "epoch": 674} {"train_loss": -20.032804489135742, "global_step": 55949, "epoch": 674} {"train_loss": -20.162973403930664, "global_step": 55950, "epoch": 674} {"train_loss": -19.959821701049805, "global_step": 55951, "epoch": 674} {"train_loss": -19.9013671875, "global_step": 55952, "epoch": 674} {"train_loss": -19.837451934814453, "global_step": 55953, "epoch": 674} {"train_loss": -20.287302017211914, "global_step": 55954, "epoch": 674} {"train_loss": -19.8931827545166, "global_step": 55955, "epoch": 674} {"train_loss": -20.150976181030273, "global_step": 55956, "epoch": 674} {"train_loss": -19.870542526245117, "global_step": 55957, "epoch": 674} {"train_loss": -19.86549949645996, "global_step": 55958, "epoch": 674} {"train_loss": -20.211790084838867, "global_step": 55959, "epoch": 674} {"train_loss": -19.959199905395508, "global_step": 55960, "epoch": 674} {"train_loss": -20.142026901245117, "global_step": 55961, "epoch": 674} {"train_loss": -20.302173614501953, "global_step": 55962, "epoch": 674} {"train_loss": -20.378820419311523, "global_step": 55963, "epoch": 674} {"train_loss": -20.15522575378418, "global_step": 55964, "epoch": 674} {"train_loss": -19.98161506652832, "global_step": 55965, "epoch": 674} {"train_loss": -20.00945281982422, "global_step": 55966, "epoch": 674} {"train_loss": -20.179149627685547, "global_step": 55967, "epoch": 674} {"train_loss": -20.507558822631836, "global_step": 55968, "epoch": 674} {"train_loss": -20.17392921447754, "global_step": 55969, "epoch": 674} {"train_loss": -20.04646110534668, "global_step": 55970, "epoch": 674} {"train_loss": -19.837539672851562, "global_step": 55971, "epoch": 674} {"train_loss": -20.31033706665039, "global_step": 55972, "epoch": 674} {"train_loss": -20.366744995117188, "global_step": 55973, "epoch": 674} {"train_loss": -20.52473258972168, "global_step": 55974, "epoch": 674} {"train_loss": -20.091384887695312, "global_step": 55975, "epoch": 674} {"train_loss": -20.724042892456055, "global_step": 55976, "epoch": 674} {"train_loss": -20.306175231933594, "global_step": 55977, "epoch": 674} {"train_loss": -20.43158531188965, "global_step": 55978, "epoch": 674} {"train_loss": -20.178489685058594, "global_step": 55979, "epoch": 674} {"train_loss": -20.496973037719727, "global_step": 55980, "epoch": 674} {"train_loss": -20.055540084838867, "global_step": 55981, "epoch": 674} {"train_loss": -20.40631103515625, "global_step": 55982, "epoch": 674} {"train_loss": -20.016220092773438, "global_step": 55983, "epoch": 674} {"train_loss": -20.169965744018555, "global_step": 55984, "epoch": 674} {"train_loss": -20.225820541381836, "global_step": 55985, "epoch": 674} {"train_loss": -20.405324935913086, "global_step": 55986, "epoch": 674} {"train_loss": -20.065000534057617, "global_step": 55987, "epoch": 674} {"train_loss": -20.316452026367188, "global_step": 55988, "epoch": 674} {"train_loss": -20.338958740234375, "global_step": 55989, "epoch": 674} {"train_loss": -20.1439151763916, "global_step": 55990, "epoch": 674} {"train_loss": -20.629751205444336, "global_step": 55991, "epoch": 674} {"train_loss": -20.690139770507812, "global_step": 55992, "epoch": 674} {"train_loss": -20.43110466003418, "global_step": 55993, "epoch": 674} {"train_loss": -20.368820190429688, "global_step": 55994, "epoch": 674} {"train_loss": -20.108734130859375, "global_step": 55995, "epoch": 674} {"train_loss": -20.045438766479492, "global_step": 55996, "epoch": 674} {"train_loss": -20.194141387939453, "global_step": 55997, "epoch": 674} {"train_loss": -20.240739822387695, "global_step": 55998, "epoch": 674} {"train_loss": -19.993610382080078, "global_step": 55999, "epoch": 674} {"train_loss": -20.357324600219727, "global_step": 56000, "epoch": 674} {"train_loss": -20.327524185180664, "global_step": 56001, "epoch": 674} {"train_loss": -20.22739601135254, "global_step": 56002, "epoch": 674} {"train_loss": -20.074752807617188, "global_step": 56003, "epoch": 674} {"train_loss": -20.10135269165039, "global_step": 56004, "epoch": 674} {"train_loss": -20.31288719177246, "global_step": 56005, "epoch": 674} {"train_loss": -20.40346336364746, "global_step": 56006, "epoch": 674} {"train_loss": -20.07772445678711, "global_step": 56007, "epoch": 674} {"train_loss": -19.891841888427734, "global_step": 56008, "epoch": 674} {"train_loss": -20.26877784729004, "global_step": 56009, "epoch": 674} {"train_loss": -20.433340072631836, "global_step": 56010, "epoch": 674} {"train_loss": -20.317975997924805, "global_step": 56011, "epoch": 674} {"train_loss": -20.651931762695312, "global_step": 56012, "epoch": 674} {"train_loss": -20.01042366027832, "global_step": 56013, "epoch": 674} {"train_loss": -20.11148452758789, "global_step": 56014, "epoch": 674} {"train_loss": -19.74648094177246, "global_step": 56015, "epoch": 674} {"train_loss": -19.994937896728516, "global_step": 56016, "epoch": 674} {"train_loss": -20.030248641967773, "global_step": 56017, "epoch": 674} {"train_loss": -20.092262268066406, "global_step": 56018, "epoch": 674} {"train_loss": -20.37076187133789, "global_step": 56019, "epoch": 674} {"train_loss": -19.892539978027344, "global_step": 56020, "epoch": 674} {"train_loss": -20.097021102905273, "global_step": 56021, "epoch": 674} {"train_loss": -19.7093448638916, "global_step": 56022, "epoch": 674} {"train_loss": -20.335214614868164, "global_step": 56023, "epoch": 674} {"train_loss": -20.182544846132576, "global_step": 56024, "epoch": 674, "val_loss": 6060722.0} {"train_loss": -19.78852653503418, "global_step": 56025, "epoch": 675} {"train_loss": -20.23172950744629, "global_step": 56026, "epoch": 675} {"train_loss": -19.550010681152344, "global_step": 56027, "epoch": 675} {"train_loss": -19.94877052307129, "global_step": 56028, "epoch": 675} {"train_loss": -20.225215911865234, "global_step": 56029, "epoch": 675} {"train_loss": -20.1451416015625, "global_step": 56030, "epoch": 675} {"train_loss": -19.915977478027344, "global_step": 56031, "epoch": 675} {"train_loss": -19.92847442626953, "global_step": 56032, "epoch": 675} {"train_loss": -20.317365646362305, "global_step": 56033, "epoch": 675} {"train_loss": -20.016340255737305, "global_step": 56034, "epoch": 675} {"train_loss": -20.17479705810547, "global_step": 56035, "epoch": 675} {"train_loss": -20.410078048706055, "global_step": 56036, "epoch": 675} {"train_loss": -20.101058959960938, "global_step": 56037, "epoch": 675} {"train_loss": -19.885547637939453, "global_step": 56038, "epoch": 675} {"train_loss": -20.175992965698242, "global_step": 56039, "epoch": 675} {"train_loss": -20.250761032104492, "global_step": 56040, "epoch": 675} {"train_loss": -20.281131744384766, "global_step": 56041, "epoch": 675} {"train_loss": -20.17070960998535, "global_step": 56042, "epoch": 675} {"train_loss": -20.318283081054688, "global_step": 56043, "epoch": 675} {"train_loss": -20.179048538208008, "global_step": 56044, "epoch": 675} {"train_loss": -20.36578369140625, "global_step": 56045, "epoch": 675} {"train_loss": -20.126604080200195, "global_step": 56046, "epoch": 675} {"train_loss": -20.05927848815918, "global_step": 56047, "epoch": 675} {"train_loss": -20.320377349853516, "global_step": 56048, "epoch": 675} {"train_loss": -20.023929595947266, "global_step": 56049, "epoch": 675} {"train_loss": -20.32332420349121, "global_step": 56050, "epoch": 675} {"train_loss": -20.16157341003418, "global_step": 56051, "epoch": 675} {"train_loss": -20.30083656311035, "global_step": 56052, "epoch": 675} {"train_loss": -20.260334014892578, "global_step": 56053, "epoch": 675} {"train_loss": -20.12847328186035, "global_step": 56054, "epoch": 675} {"train_loss": -20.36414909362793, "global_step": 56055, "epoch": 675} {"train_loss": -20.43124008178711, "global_step": 56056, "epoch": 675} {"train_loss": -20.16077995300293, "global_step": 56057, "epoch": 675} {"train_loss": -20.023801803588867, "global_step": 56058, "epoch": 675} {"train_loss": -20.187589645385742, "global_step": 56059, "epoch": 675} {"train_loss": -20.366092681884766, "global_step": 56060, "epoch": 675} {"train_loss": -20.146060943603516, "global_step": 56061, "epoch": 675} {"train_loss": -20.38873291015625, "global_step": 56062, "epoch": 675} {"train_loss": -20.231658935546875, "global_step": 56063, "epoch": 675} {"train_loss": -20.183517456054688, "global_step": 56064, "epoch": 675} {"train_loss": -19.864416122436523, "global_step": 56065, "epoch": 675} {"train_loss": -20.381240844726562, "global_step": 56066, "epoch": 675} {"train_loss": -20.215560913085938, "global_step": 56067, "epoch": 675} {"train_loss": -20.146780014038086, "global_step": 56068, "epoch": 675} {"train_loss": -20.233549118041992, "global_step": 56069, "epoch": 675} {"train_loss": -19.843778610229492, "global_step": 56070, "epoch": 675} {"train_loss": -20.25311279296875, "global_step": 56071, "epoch": 675} {"train_loss": -20.45747947692871, "global_step": 56072, "epoch": 675} {"train_loss": -20.094280242919922, "global_step": 56073, "epoch": 675} {"train_loss": -20.150039672851562, "global_step": 56074, "epoch": 675} {"train_loss": -20.267227172851562, "global_step": 56075, "epoch": 675} {"train_loss": -19.920217514038086, "global_step": 56076, "epoch": 675} {"train_loss": -19.98598289489746, "global_step": 56077, "epoch": 675} {"train_loss": -20.339054107666016, "global_step": 56078, "epoch": 675} {"train_loss": -20.04764175415039, "global_step": 56079, "epoch": 675} {"train_loss": -20.243688583374023, "global_step": 56080, "epoch": 675} {"train_loss": -20.439550399780273, "global_step": 56081, "epoch": 675} {"train_loss": -20.312639236450195, "global_step": 56082, "epoch": 675} {"train_loss": -20.034391403198242, "global_step": 56083, "epoch": 675} {"train_loss": -20.647491455078125, "global_step": 56084, "epoch": 675} {"train_loss": -20.256534576416016, "global_step": 56085, "epoch": 675} {"train_loss": -20.244962692260742, "global_step": 56086, "epoch": 675} {"train_loss": -20.14764976501465, "global_step": 56087, "epoch": 675} {"train_loss": -20.21286964416504, "global_step": 56088, "epoch": 675} {"train_loss": -20.414634704589844, "global_step": 56089, "epoch": 675} {"train_loss": -20.261707305908203, "global_step": 56090, "epoch": 675} {"train_loss": -20.374164581298828, "global_step": 56091, "epoch": 675} {"train_loss": -20.225587844848633, "global_step": 56092, "epoch": 675} {"train_loss": -20.11815071105957, "global_step": 56093, "epoch": 675} {"train_loss": -19.99237060546875, "global_step": 56094, "epoch": 675} {"train_loss": -20.338911056518555, "global_step": 56095, "epoch": 675} {"train_loss": -20.24737548828125, "global_step": 56096, "epoch": 675} {"train_loss": -20.06450843811035, "global_step": 56097, "epoch": 675} {"train_loss": -20.174516677856445, "global_step": 56098, "epoch": 675} {"train_loss": -20.35755729675293, "global_step": 56099, "epoch": 675} {"train_loss": -20.224163055419922, "global_step": 56100, "epoch": 675} {"train_loss": -20.075439453125, "global_step": 56101, "epoch": 675} {"train_loss": -19.7674617767334, "global_step": 56102, "epoch": 675} {"train_loss": -20.26644515991211, "global_step": 56103, "epoch": 675} {"train_loss": -20.05317497253418, "global_step": 56104, "epoch": 675} {"train_loss": -20.416982650756836, "global_step": 56105, "epoch": 675} {"train_loss": -20.269136428833008, "global_step": 56106, "epoch": 675} {"train_loss": -20.185208010386273, "global_step": 56107, "epoch": 675, "val_loss": 6032331.5} {"train_loss": -20.125473022460938, "global_step": 56108, "epoch": 676} {"train_loss": -20.026470184326172, "global_step": 56109, "epoch": 676} {"train_loss": -20.188758850097656, "global_step": 56110, "epoch": 676} {"train_loss": -20.065153121948242, "global_step": 56111, "epoch": 676} {"train_loss": -20.290395736694336, "global_step": 56112, "epoch": 676} {"train_loss": -20.10040855407715, "global_step": 56113, "epoch": 676} {"train_loss": -20.349332809448242, "global_step": 56114, "epoch": 676} {"train_loss": -20.318037033081055, "global_step": 56115, "epoch": 676} {"train_loss": -20.439762115478516, "global_step": 56116, "epoch": 676} {"train_loss": -20.11940574645996, "global_step": 56117, "epoch": 676} {"train_loss": -20.251861572265625, "global_step": 56118, "epoch": 676} {"train_loss": -20.57703971862793, "global_step": 56119, "epoch": 676} {"train_loss": -20.2354679107666, "global_step": 56120, "epoch": 676} {"train_loss": -20.229333877563477, "global_step": 56121, "epoch": 676} {"train_loss": -20.99165916442871, "global_step": 56122, "epoch": 676} {"train_loss": -20.477811813354492, "global_step": 56123, "epoch": 676} {"train_loss": -20.483701705932617, "global_step": 56124, "epoch": 676} {"train_loss": -19.94569206237793, "global_step": 56125, "epoch": 676} {"train_loss": -20.06684112548828, "global_step": 56126, "epoch": 676} {"train_loss": -20.04530906677246, "global_step": 56127, "epoch": 676} {"train_loss": -20.351781845092773, "global_step": 56128, "epoch": 676} {"train_loss": -20.336151123046875, "global_step": 56129, "epoch": 676} {"train_loss": -20.170873641967773, "global_step": 56130, "epoch": 676} {"train_loss": -20.524532318115234, "global_step": 56131, "epoch": 676} {"train_loss": -20.42899513244629, "global_step": 56132, "epoch": 676} {"train_loss": -20.490291595458984, "global_step": 56133, "epoch": 676} {"train_loss": -20.314924240112305, "global_step": 56134, "epoch": 676} {"train_loss": -20.151037216186523, "global_step": 56135, "epoch": 676} {"train_loss": -20.38075828552246, "global_step": 56136, "epoch": 676} {"train_loss": -20.360387802124023, "global_step": 56137, "epoch": 676} {"train_loss": -20.029037475585938, "global_step": 56138, "epoch": 676} {"train_loss": -20.50050163269043, "global_step": 56139, "epoch": 676} {"train_loss": -20.351886749267578, "global_step": 56140, "epoch": 676} {"train_loss": -20.633291244506836, "global_step": 56141, "epoch": 676} {"train_loss": -20.509077072143555, "global_step": 56142, "epoch": 676} {"train_loss": -20.38148307800293, "global_step": 56143, "epoch": 676} {"train_loss": -20.261423110961914, "global_step": 56144, "epoch": 676} {"train_loss": -20.139554977416992, "global_step": 56145, "epoch": 676} {"train_loss": -20.187971115112305, "global_step": 56146, "epoch": 676} {"train_loss": -20.407461166381836, "global_step": 56147, "epoch": 676} {"train_loss": -20.34034538269043, "global_step": 56148, "epoch": 676} {"train_loss": -20.160846710205078, "global_step": 56149, "epoch": 676} {"train_loss": -20.2301082611084, "global_step": 56150, "epoch": 676} {"train_loss": -20.4028377532959, "global_step": 56151, "epoch": 676} {"train_loss": -20.1124267578125, "global_step": 56152, "epoch": 676} {"train_loss": -20.30684471130371, "global_step": 56153, "epoch": 676} {"train_loss": -20.751117706298828, "global_step": 56154, "epoch": 676} {"train_loss": -20.37145233154297, "global_step": 56155, "epoch": 676} {"train_loss": -20.06851577758789, "global_step": 56156, "epoch": 676} {"train_loss": -19.87674331665039, "global_step": 56157, "epoch": 676} {"train_loss": -20.280921936035156, "global_step": 56158, "epoch": 676} {"train_loss": -20.39712142944336, "global_step": 56159, "epoch": 676} {"train_loss": -20.230581283569336, "global_step": 56160, "epoch": 676} {"train_loss": -20.600210189819336, "global_step": 56161, "epoch": 676} {"train_loss": -19.96711540222168, "global_step": 56162, "epoch": 676} {"train_loss": -20.17336082458496, "global_step": 56163, "epoch": 676} {"train_loss": -20.206533432006836, "global_step": 56164, "epoch": 676} {"train_loss": -19.860706329345703, "global_step": 56165, "epoch": 676} {"train_loss": -20.336469650268555, "global_step": 56166, "epoch": 676} {"train_loss": -20.09110450744629, "global_step": 56167, "epoch": 676} {"train_loss": -20.381322860717773, "global_step": 56168, "epoch": 676} {"train_loss": -20.197294235229492, "global_step": 56169, "epoch": 676} {"train_loss": -19.92424964904785, "global_step": 56170, "epoch": 676} {"train_loss": -20.215518951416016, "global_step": 56171, "epoch": 676} {"train_loss": -20.134199142456055, "global_step": 56172, "epoch": 676} {"train_loss": -20.382028579711914, "global_step": 56173, "epoch": 676} {"train_loss": -19.984533309936523, "global_step": 56174, "epoch": 676} {"train_loss": -20.0638370513916, "global_step": 56175, "epoch": 676} {"train_loss": -19.991918563842773, "global_step": 56176, "epoch": 676} {"train_loss": -19.959104537963867, "global_step": 56177, "epoch": 676} {"train_loss": -19.902196884155273, "global_step": 56178, "epoch": 676} {"train_loss": -20.57027244567871, "global_step": 56179, "epoch": 676} {"train_loss": -20.24441909790039, "global_step": 56180, "epoch": 676} {"train_loss": -20.251693725585938, "global_step": 56181, "epoch": 676} {"train_loss": -20.08436393737793, "global_step": 56182, "epoch": 676} {"train_loss": -20.146595001220703, "global_step": 56183, "epoch": 676} {"train_loss": -20.51034927368164, "global_step": 56184, "epoch": 676} {"train_loss": -20.149301528930664, "global_step": 56185, "epoch": 676} {"train_loss": -20.475818634033203, "global_step": 56186, "epoch": 676} {"train_loss": -20.569820404052734, "global_step": 56187, "epoch": 676} {"train_loss": -20.361003875732422, "global_step": 56188, "epoch": 676} {"train_loss": -20.017446517944336, "global_step": 56189, "epoch": 676} {"train_loss": -20.28555346109781, "global_step": 56190, "epoch": 676, "val_loss": 5856961.0} {"train_loss": -19.2973690032959, "global_step": 56191, "epoch": 677} {"train_loss": -19.613126754760742, "global_step": 56192, "epoch": 677} {"train_loss": -19.72480583190918, "global_step": 56193, "epoch": 677} {"train_loss": -19.559499740600586, "global_step": 56194, "epoch": 677} {"train_loss": -19.915536880493164, "global_step": 56195, "epoch": 677} {"train_loss": -19.68545150756836, "global_step": 56196, "epoch": 677} {"train_loss": -19.394529342651367, "global_step": 56197, "epoch": 677} {"train_loss": -19.984806060791016, "global_step": 56198, "epoch": 677} {"train_loss": -19.649795532226562, "global_step": 56199, "epoch": 677} {"train_loss": -19.82649040222168, "global_step": 56200, "epoch": 677} {"train_loss": -19.953094482421875, "global_step": 56201, "epoch": 677} {"train_loss": -19.910497665405273, "global_step": 56202, "epoch": 677} {"train_loss": -19.812891006469727, "global_step": 56203, "epoch": 677} {"train_loss": -19.337385177612305, "global_step": 56204, "epoch": 677} {"train_loss": -19.952970504760742, "global_step": 56205, "epoch": 677} {"train_loss": -19.823959350585938, "global_step": 56206, "epoch": 677} {"train_loss": -20.034168243408203, "global_step": 56207, "epoch": 677} {"train_loss": -19.868106842041016, "global_step": 56208, "epoch": 677} {"train_loss": -19.817445755004883, "global_step": 56209, "epoch": 677} {"train_loss": -19.82711410522461, "global_step": 56210, "epoch": 677} {"train_loss": -19.662992477416992, "global_step": 56211, "epoch": 677} {"train_loss": -20.01270866394043, "global_step": 56212, "epoch": 677} {"train_loss": -20.321338653564453, "global_step": 56213, "epoch": 677} {"train_loss": -19.854110717773438, "global_step": 56214, "epoch": 677} {"train_loss": -19.965391159057617, "global_step": 56215, "epoch": 677} {"train_loss": -20.325178146362305, "global_step": 56216, "epoch": 677} {"train_loss": -20.223772048950195, "global_step": 56217, "epoch": 677} {"train_loss": -20.153284072875977, "global_step": 56218, "epoch": 677} {"train_loss": -20.373416900634766, "global_step": 56219, "epoch": 677} {"train_loss": -20.165151596069336, "global_step": 56220, "epoch": 677} {"train_loss": -20.009685516357422, "global_step": 56221, "epoch": 677} {"train_loss": -20.147567749023438, "global_step": 56222, "epoch": 677} {"train_loss": -20.14459800720215, "global_step": 56223, "epoch": 677} {"train_loss": -20.376079559326172, "global_step": 56224, "epoch": 677} {"train_loss": -20.133331298828125, "global_step": 56225, "epoch": 677} {"train_loss": -20.459915161132812, "global_step": 56226, "epoch": 677} {"train_loss": -20.22014808654785, "global_step": 56227, "epoch": 677} {"train_loss": -20.33469581604004, "global_step": 56228, "epoch": 677} {"train_loss": -20.090410232543945, "global_step": 56229, "epoch": 677} {"train_loss": -20.415393829345703, "global_step": 56230, "epoch": 677} {"train_loss": -20.383169174194336, "global_step": 56231, "epoch": 677} {"train_loss": -20.529184341430664, "global_step": 56232, "epoch": 677} {"train_loss": -20.204145431518555, "global_step": 56233, "epoch": 677} {"train_loss": -20.524477005004883, "global_step": 56234, "epoch": 677} {"train_loss": -20.170879364013672, "global_step": 56235, "epoch": 677} {"train_loss": -20.22736167907715, "global_step": 56236, "epoch": 677} {"train_loss": -20.491262435913086, "global_step": 56237, "epoch": 677} {"train_loss": -20.503225326538086, "global_step": 56238, "epoch": 677} {"train_loss": -20.077749252319336, "global_step": 56239, "epoch": 677} {"train_loss": -20.536882400512695, "global_step": 56240, "epoch": 677} {"train_loss": -20.372480392456055, "global_step": 56241, "epoch": 677} {"train_loss": -20.04571533203125, "global_step": 56242, "epoch": 677} {"train_loss": -20.533145904541016, "global_step": 56243, "epoch": 677} {"train_loss": -20.439435958862305, "global_step": 56244, "epoch": 677} {"train_loss": -20.20551872253418, "global_step": 56245, "epoch": 677} {"train_loss": -20.2899169921875, "global_step": 56246, "epoch": 677} {"train_loss": -20.2528133392334, "global_step": 56247, "epoch": 677} {"train_loss": -20.29402732849121, "global_step": 56248, "epoch": 677} {"train_loss": -20.3212890625, "global_step": 56249, "epoch": 677} {"train_loss": -20.181888580322266, "global_step": 56250, "epoch": 677} {"train_loss": -20.312108993530273, "global_step": 56251, "epoch": 677} {"train_loss": -20.361928939819336, "global_step": 56252, "epoch": 677} {"train_loss": -20.168245315551758, "global_step": 56253, "epoch": 677} {"train_loss": -20.37226676940918, "global_step": 56254, "epoch": 677} {"train_loss": -20.453144073486328, "global_step": 56255, "epoch": 677} {"train_loss": -20.23238182067871, "global_step": 56256, "epoch": 677} {"train_loss": -20.22208595275879, "global_step": 56257, "epoch": 677} {"train_loss": -20.440555572509766, "global_step": 56258, "epoch": 677} {"train_loss": -20.34653091430664, "global_step": 56259, "epoch": 677} {"train_loss": -20.342121124267578, "global_step": 56260, "epoch": 677} {"train_loss": -20.427152633666992, "global_step": 56261, "epoch": 677} {"train_loss": -20.11830711364746, "global_step": 56262, "epoch": 677} {"train_loss": -20.080835342407227, "global_step": 56263, "epoch": 677} {"train_loss": -20.217031478881836, "global_step": 56264, "epoch": 677} {"train_loss": -20.477243423461914, "global_step": 56265, "epoch": 677} {"train_loss": -20.384801864624023, "global_step": 56266, "epoch": 677} {"train_loss": -20.034896850585938, "global_step": 56267, "epoch": 677} {"train_loss": -20.298009872436523, "global_step": 56268, "epoch": 677} {"train_loss": -20.388486862182617, "global_step": 56269, "epoch": 677} {"train_loss": -20.16643714904785, "global_step": 56270, "epoch": 677} {"train_loss": -20.05191993713379, "global_step": 56271, "epoch": 677} {"train_loss": -20.43435287475586, "global_step": 56272, "epoch": 677} {"train_loss": -20.14728189950966, "global_step": 56273, "epoch": 677, "val_loss": 5807049.0} {"train_loss": -20.076303482055664, "global_step": 56274, "epoch": 678} {"train_loss": -20.363449096679688, "global_step": 56275, "epoch": 678} {"train_loss": -19.94448471069336, "global_step": 56276, "epoch": 678} {"train_loss": -20.060131072998047, "global_step": 56277, "epoch": 678} {"train_loss": -20.027536392211914, "global_step": 56278, "epoch": 678} {"train_loss": -19.962743759155273, "global_step": 56279, "epoch": 678} {"train_loss": -19.71556282043457, "global_step": 56280, "epoch": 678} {"train_loss": -20.281217575073242, "global_step": 56281, "epoch": 678} {"train_loss": -20.178438186645508, "global_step": 56282, "epoch": 678} {"train_loss": -19.895933151245117, "global_step": 56283, "epoch": 678} {"train_loss": -19.94537353515625, "global_step": 56284, "epoch": 678} {"train_loss": -20.047327041625977, "global_step": 56285, "epoch": 678} {"train_loss": -19.907520294189453, "global_step": 56286, "epoch": 678} {"train_loss": -20.318553924560547, "global_step": 56287, "epoch": 678} {"train_loss": -20.223758697509766, "global_step": 56288, "epoch": 678} {"train_loss": -20.2522029876709, "global_step": 56289, "epoch": 678} {"train_loss": -20.418928146362305, "global_step": 56290, "epoch": 678} {"train_loss": -20.268518447875977, "global_step": 56291, "epoch": 678} {"train_loss": -20.420764923095703, "global_step": 56292, "epoch": 678} {"train_loss": -20.227035522460938, "global_step": 56293, "epoch": 678} {"train_loss": -20.13642692565918, "global_step": 56294, "epoch": 678} {"train_loss": -20.91538429260254, "global_step": 56295, "epoch": 678} {"train_loss": -20.505979537963867, "global_step": 56296, "epoch": 678} {"train_loss": -20.449953079223633, "global_step": 56297, "epoch": 678} {"train_loss": -20.44563102722168, "global_step": 56298, "epoch": 678} {"train_loss": -20.45361328125, "global_step": 56299, "epoch": 678} {"train_loss": -20.168718338012695, "global_step": 56300, "epoch": 678} {"train_loss": -20.224641799926758, "global_step": 56301, "epoch": 678} {"train_loss": -19.875940322875977, "global_step": 56302, "epoch": 678} {"train_loss": -20.365087509155273, "global_step": 56303, "epoch": 678} {"train_loss": -20.33150291442871, "global_step": 56304, "epoch": 678} {"train_loss": -20.02345848083496, "global_step": 56305, "epoch": 678} {"train_loss": -20.472217559814453, "global_step": 56306, "epoch": 678} {"train_loss": -20.26279640197754, "global_step": 56307, "epoch": 678} {"train_loss": -20.4395809173584, "global_step": 56308, "epoch": 678} {"train_loss": -20.302438735961914, "global_step": 56309, "epoch": 678} {"train_loss": -19.911468505859375, "global_step": 56310, "epoch": 678} {"train_loss": -20.361083984375, "global_step": 56311, "epoch": 678} {"train_loss": -20.021068572998047, "global_step": 56312, "epoch": 678} {"train_loss": -20.2524471282959, "global_step": 56313, "epoch": 678} {"train_loss": -20.352252960205078, "global_step": 56314, "epoch": 678} {"train_loss": -20.346464157104492, "global_step": 56315, "epoch": 678} {"train_loss": -19.688201904296875, "global_step": 56316, "epoch": 678} {"train_loss": -20.1541690826416, "global_step": 56317, "epoch": 678} {"train_loss": -20.080896377563477, "global_step": 56318, "epoch": 678} {"train_loss": -20.152957916259766, "global_step": 56319, "epoch": 678} {"train_loss": -20.093017578125, "global_step": 56320, "epoch": 678} {"train_loss": -19.998796463012695, "global_step": 56321, "epoch": 678} {"train_loss": -20.346790313720703, "global_step": 56322, "epoch": 678} {"train_loss": -20.256559371948242, "global_step": 56323, "epoch": 678} {"train_loss": -20.20087242126465, "global_step": 56324, "epoch": 678} {"train_loss": -20.1674861907959, "global_step": 56325, "epoch": 678} {"train_loss": -20.117460250854492, "global_step": 56326, "epoch": 678} {"train_loss": -20.163909912109375, "global_step": 56327, "epoch": 678} {"train_loss": -20.29553985595703, "global_step": 56328, "epoch": 678} {"train_loss": -19.785715103149414, "global_step": 56329, "epoch": 678} {"train_loss": -20.245147705078125, "global_step": 56330, "epoch": 678} {"train_loss": -20.374326705932617, "global_step": 56331, "epoch": 678} {"train_loss": -20.054149627685547, "global_step": 56332, "epoch": 678} {"train_loss": -20.3619441986084, "global_step": 56333, "epoch": 678} {"train_loss": -20.307600021362305, "global_step": 56334, "epoch": 678} {"train_loss": -20.518146514892578, "global_step": 56335, "epoch": 678} {"train_loss": -20.190526962280273, "global_step": 56336, "epoch": 678} {"train_loss": -20.61789894104004, "global_step": 56337, "epoch": 678} {"train_loss": -20.41853904724121, "global_step": 56338, "epoch": 678} {"train_loss": -20.242782592773438, "global_step": 56339, "epoch": 678} {"train_loss": -20.48293685913086, "global_step": 56340, "epoch": 678} {"train_loss": -20.096952438354492, "global_step": 56341, "epoch": 678} {"train_loss": -20.011350631713867, "global_step": 56342, "epoch": 678} {"train_loss": -20.546571731567383, "global_step": 56343, "epoch": 678} {"train_loss": -20.35272216796875, "global_step": 56344, "epoch": 678} {"train_loss": -20.256418228149414, "global_step": 56345, "epoch": 678} {"train_loss": -20.26722526550293, "global_step": 56346, "epoch": 678} {"train_loss": -20.18667984008789, "global_step": 56347, "epoch": 678} {"train_loss": -20.596771240234375, "global_step": 56348, "epoch": 678} {"train_loss": -20.20136070251465, "global_step": 56349, "epoch": 678} {"train_loss": -20.036813735961914, "global_step": 56350, "epoch": 678} {"train_loss": -20.50008201599121, "global_step": 56351, "epoch": 678} {"train_loss": -20.19759750366211, "global_step": 56352, "epoch": 678} {"train_loss": -20.287830352783203, "global_step": 56353, "epoch": 678} {"train_loss": -19.84023666381836, "global_step": 56354, "epoch": 678} {"train_loss": -20.593162536621094, "global_step": 56355, "epoch": 678} {"train_loss": -20.237548322562713, "global_step": 56356, "epoch": 678, "val_loss": 6026665.0} {"train_loss": -19.966176986694336, "global_step": 56357, "epoch": 679} {"train_loss": -20.04090690612793, "global_step": 56358, "epoch": 679} {"train_loss": -20.160932540893555, "global_step": 56359, "epoch": 679} {"train_loss": -19.94829750061035, "global_step": 56360, "epoch": 679} {"train_loss": -19.884748458862305, "global_step": 56361, "epoch": 679} {"train_loss": -20.10400390625, "global_step": 56362, "epoch": 679} {"train_loss": -19.86545753479004, "global_step": 56363, "epoch": 679} {"train_loss": -20.058006286621094, "global_step": 56364, "epoch": 679} {"train_loss": -20.451181411743164, "global_step": 56365, "epoch": 679} {"train_loss": -20.286230087280273, "global_step": 56366, "epoch": 679} {"train_loss": -20.04098892211914, "global_step": 56367, "epoch": 679} {"train_loss": -20.055173873901367, "global_step": 56368, "epoch": 679} {"train_loss": -19.8892879486084, "global_step": 56369, "epoch": 679} {"train_loss": -19.992170333862305, "global_step": 56370, "epoch": 679} {"train_loss": -20.386491775512695, "global_step": 56371, "epoch": 679} {"train_loss": -20.200075149536133, "global_step": 56372, "epoch": 679} {"train_loss": -20.11512565612793, "global_step": 56373, "epoch": 679} {"train_loss": -20.23859214782715, "global_step": 56374, "epoch": 679} {"train_loss": -19.69662857055664, "global_step": 56375, "epoch": 679} {"train_loss": -20.37017250061035, "global_step": 56376, "epoch": 679} {"train_loss": -20.184955596923828, "global_step": 56377, "epoch": 679} {"train_loss": -20.069610595703125, "global_step": 56378, "epoch": 679} {"train_loss": -20.04874610900879, "global_step": 56379, "epoch": 679} {"train_loss": -19.98128318786621, "global_step": 56380, "epoch": 679} {"train_loss": -20.283721923828125, "global_step": 56381, "epoch": 679} {"train_loss": -20.330503463745117, "global_step": 56382, "epoch": 679} {"train_loss": -20.281898498535156, "global_step": 56383, "epoch": 679} {"train_loss": -20.297012329101562, "global_step": 56384, "epoch": 679} {"train_loss": -20.364294052124023, "global_step": 56385, "epoch": 679} {"train_loss": -20.20489501953125, "global_step": 56386, "epoch": 679} {"train_loss": -20.315702438354492, "global_step": 56387, "epoch": 679} {"train_loss": -20.556476593017578, "global_step": 56388, "epoch": 679} {"train_loss": -20.229984283447266, "global_step": 56389, "epoch": 679} {"train_loss": -20.239011764526367, "global_step": 56390, "epoch": 679} {"train_loss": -20.337085723876953, "global_step": 56391, "epoch": 679} {"train_loss": -20.30389404296875, "global_step": 56392, "epoch": 679} {"train_loss": -20.117481231689453, "global_step": 56393, "epoch": 679} {"train_loss": -19.86506462097168, "global_step": 56394, "epoch": 679} {"train_loss": -20.09937286376953, "global_step": 56395, "epoch": 679} {"train_loss": -20.381444931030273, "global_step": 56396, "epoch": 679} {"train_loss": -20.10718536376953, "global_step": 56397, "epoch": 679} {"train_loss": -20.042112350463867, "global_step": 56398, "epoch": 679} {"train_loss": -20.22528076171875, "global_step": 56399, "epoch": 679} {"train_loss": -20.15176773071289, "global_step": 56400, "epoch": 679} {"train_loss": -20.826801300048828, "global_step": 56401, "epoch": 679} {"train_loss": -20.111400604248047, "global_step": 56402, "epoch": 679} {"train_loss": -20.276077270507812, "global_step": 56403, "epoch": 679} {"train_loss": -20.305402755737305, "global_step": 56404, "epoch": 679} {"train_loss": -20.5513858795166, "global_step": 56405, "epoch": 679} {"train_loss": -20.20665740966797, "global_step": 56406, "epoch": 679} {"train_loss": -20.188140869140625, "global_step": 56407, "epoch": 679} {"train_loss": -20.28371238708496, "global_step": 56408, "epoch": 679} {"train_loss": -19.924606323242188, "global_step": 56409, "epoch": 679} {"train_loss": -20.48290252685547, "global_step": 56410, "epoch": 679} {"train_loss": -20.36060905456543, "global_step": 56411, "epoch": 679} {"train_loss": -20.26375389099121, "global_step": 56412, "epoch": 679} {"train_loss": -20.389436721801758, "global_step": 56413, "epoch": 679} {"train_loss": -20.209796905517578, "global_step": 56414, "epoch": 679} {"train_loss": -20.222827911376953, "global_step": 56415, "epoch": 679} {"train_loss": -20.246122360229492, "global_step": 56416, "epoch": 679} {"train_loss": -20.21415138244629, "global_step": 56417, "epoch": 679} {"train_loss": -20.501760482788086, "global_step": 56418, "epoch": 679} {"train_loss": -20.22909927368164, "global_step": 56419, "epoch": 679} {"train_loss": -20.274078369140625, "global_step": 56420, "epoch": 679} {"train_loss": -20.048646926879883, "global_step": 56421, "epoch": 679} {"train_loss": -20.39631462097168, "global_step": 56422, "epoch": 679} {"train_loss": -20.157928466796875, "global_step": 56423, "epoch": 679} {"train_loss": -20.333786010742188, "global_step": 56424, "epoch": 679} {"train_loss": -20.1400146484375, "global_step": 56425, "epoch": 679} {"train_loss": -20.533588409423828, "global_step": 56426, "epoch": 679} {"train_loss": -20.01568603515625, "global_step": 56427, "epoch": 679} {"train_loss": -20.301986694335938, "global_step": 56428, "epoch": 679} {"train_loss": -20.458967208862305, "global_step": 56429, "epoch": 679} {"train_loss": -19.980688095092773, "global_step": 56430, "epoch": 679} {"train_loss": -20.413766860961914, "global_step": 56431, "epoch": 679} {"train_loss": -19.939956665039062, "global_step": 56432, "epoch": 679} {"train_loss": -20.03135108947754, "global_step": 56433, "epoch": 679} {"train_loss": -20.312732696533203, "global_step": 56434, "epoch": 679} {"train_loss": -20.323450088500977, "global_step": 56435, "epoch": 679} {"train_loss": -20.330123901367188, "global_step": 56436, "epoch": 679} {"train_loss": -20.29244041442871, "global_step": 56437, "epoch": 679} {"train_loss": -20.622303009033203, "global_step": 56438, "epoch": 679} {"train_loss": -20.20193874405091, "global_step": 56439, "epoch": 679, "val_loss": 5888935.0} {"train_loss": -20.047605514526367, "global_step": 56440, "epoch": 680} {"train_loss": -19.979114532470703, "global_step": 56441, "epoch": 680} {"train_loss": -20.403339385986328, "global_step": 56442, "epoch": 680} {"train_loss": -20.163883209228516, "global_step": 56443, "epoch": 680} {"train_loss": -19.745162963867188, "global_step": 56444, "epoch": 680} {"train_loss": -19.7893009185791, "global_step": 56445, "epoch": 680} {"train_loss": -20.213163375854492, "global_step": 56446, "epoch": 680} {"train_loss": -20.11161231994629, "global_step": 56447, "epoch": 680} {"train_loss": -20.140722274780273, "global_step": 56448, "epoch": 680} {"train_loss": -20.194717407226562, "global_step": 56449, "epoch": 680} {"train_loss": -19.99051856994629, "global_step": 56450, "epoch": 680} {"train_loss": -20.242839813232422, "global_step": 56451, "epoch": 680} {"train_loss": -20.592777252197266, "global_step": 56452, "epoch": 680} {"train_loss": -20.228288650512695, "global_step": 56453, "epoch": 680} {"train_loss": -20.526165008544922, "global_step": 56454, "epoch": 680} {"train_loss": -20.026126861572266, "global_step": 56455, "epoch": 680} {"train_loss": -20.097614288330078, "global_step": 56456, "epoch": 680} {"train_loss": -20.18636131286621, "global_step": 56457, "epoch": 680} {"train_loss": -20.205446243286133, "global_step": 56458, "epoch": 680} {"train_loss": -20.23127555847168, "global_step": 56459, "epoch": 680} {"train_loss": -20.417495727539062, "global_step": 56460, "epoch": 680} {"train_loss": -20.618803024291992, "global_step": 56461, "epoch": 680} {"train_loss": -20.294477462768555, "global_step": 56462, "epoch": 680} {"train_loss": -20.20838165283203, "global_step": 56463, "epoch": 680} {"train_loss": -19.635087966918945, "global_step": 56464, "epoch": 680} {"train_loss": -20.242576599121094, "global_step": 56465, "epoch": 680} {"train_loss": -20.476118087768555, "global_step": 56466, "epoch": 680} {"train_loss": -20.16786003112793, "global_step": 56467, "epoch": 680} {"train_loss": -20.35454750061035, "global_step": 56468, "epoch": 680} {"train_loss": -20.308618545532227, "global_step": 56469, "epoch": 680} {"train_loss": -19.961511611938477, "global_step": 56470, "epoch": 680} {"train_loss": -20.644760131835938, "global_step": 56471, "epoch": 680} {"train_loss": -20.082080841064453, "global_step": 56472, "epoch": 680} {"train_loss": -20.45710563659668, "global_step": 56473, "epoch": 680} {"train_loss": -20.25184440612793, "global_step": 56474, "epoch": 680} {"train_loss": -19.972761154174805, "global_step": 56475, "epoch": 680} {"train_loss": -20.2266788482666, "global_step": 56476, "epoch": 680} {"train_loss": -20.611957550048828, "global_step": 56477, "epoch": 680} {"train_loss": -20.729406356811523, "global_step": 56478, "epoch": 680} {"train_loss": -20.28481101989746, "global_step": 56479, "epoch": 680} {"train_loss": -19.93072509765625, "global_step": 56480, "epoch": 680} {"train_loss": -20.343854904174805, "global_step": 56481, "epoch": 680} {"train_loss": -20.346805572509766, "global_step": 56482, "epoch": 680} {"train_loss": -20.26441764831543, "global_step": 56483, "epoch": 680} {"train_loss": -20.176254272460938, "global_step": 56484, "epoch": 680} {"train_loss": -20.23274040222168, "global_step": 56485, "epoch": 680} {"train_loss": -19.7786865234375, "global_step": 56486, "epoch": 680} {"train_loss": -20.3253173828125, "global_step": 56487, "epoch": 680} {"train_loss": -20.2288818359375, "global_step": 56488, "epoch": 680} {"train_loss": -20.453962326049805, "global_step": 56489, "epoch": 680} {"train_loss": -20.312339782714844, "global_step": 56490, "epoch": 680} {"train_loss": -20.47646713256836, "global_step": 56491, "epoch": 680} {"train_loss": -20.24823760986328, "global_step": 56492, "epoch": 680} {"train_loss": -19.99422264099121, "global_step": 56493, "epoch": 680} {"train_loss": -20.14103126525879, "global_step": 56494, "epoch": 680} {"train_loss": -20.161090850830078, "global_step": 56495, "epoch": 680} {"train_loss": -20.152509689331055, "global_step": 56496, "epoch": 680} {"train_loss": -20.376785278320312, "global_step": 56497, "epoch": 680} {"train_loss": -20.409168243408203, "global_step": 56498, "epoch": 680} {"train_loss": -20.173126220703125, "global_step": 56499, "epoch": 680} {"train_loss": -19.93996810913086, "global_step": 56500, "epoch": 680} {"train_loss": -20.4298152923584, "global_step": 56501, "epoch": 680} {"train_loss": -19.94928550720215, "global_step": 56502, "epoch": 680} {"train_loss": -19.635116577148438, "global_step": 56503, "epoch": 680} {"train_loss": -20.4792537689209, "global_step": 56504, "epoch": 680} {"train_loss": -20.25135612487793, "global_step": 56505, "epoch": 680} {"train_loss": -20.441349029541016, "global_step": 56506, "epoch": 680} {"train_loss": -20.343887329101562, "global_step": 56507, "epoch": 680} {"train_loss": -20.59184455871582, "global_step": 56508, "epoch": 680} {"train_loss": -20.06838035583496, "global_step": 56509, "epoch": 680} {"train_loss": -19.955093383789062, "global_step": 56510, "epoch": 680} {"train_loss": -20.181306838989258, "global_step": 56511, "epoch": 680} {"train_loss": -20.081119537353516, "global_step": 56512, "epoch": 680} {"train_loss": -20.150068283081055, "global_step": 56513, "epoch": 680} {"train_loss": -20.222858428955078, "global_step": 56514, "epoch": 680} {"train_loss": -20.099443435668945, "global_step": 56515, "epoch": 680} {"train_loss": -20.45062828063965, "global_step": 56516, "epoch": 680} {"train_loss": -20.024051666259766, "global_step": 56517, "epoch": 680} {"train_loss": -20.371862411499023, "global_step": 56518, "epoch": 680} {"train_loss": -20.12495231628418, "global_step": 56519, "epoch": 680} {"train_loss": -20.264631271362305, "global_step": 56520, "epoch": 680} {"train_loss": -19.901945114135742, "global_step": 56521, "epoch": 680} {"train_loss": -20.200167598494563, "global_step": 56522, "epoch": 680, "val_loss": 5989633.0} {"train_loss": -20.358469009399414, "global_step": 56523, "epoch": 681} {"train_loss": -20.123302459716797, "global_step": 56524, "epoch": 681} {"train_loss": -20.243318557739258, "global_step": 56525, "epoch": 681} {"train_loss": -20.76715660095215, "global_step": 56526, "epoch": 681} {"train_loss": -20.136905670166016, "global_step": 56527, "epoch": 681} {"train_loss": -19.900920867919922, "global_step": 56528, "epoch": 681} {"train_loss": -20.516019821166992, "global_step": 56529, "epoch": 681} {"train_loss": -19.941259384155273, "global_step": 56530, "epoch": 681} {"train_loss": -20.245908737182617, "global_step": 56531, "epoch": 681} {"train_loss": -19.676483154296875, "global_step": 56532, "epoch": 681} {"train_loss": -20.368494033813477, "global_step": 56533, "epoch": 681} {"train_loss": -20.160144805908203, "global_step": 56534, "epoch": 681} {"train_loss": -20.162668228149414, "global_step": 56535, "epoch": 681} {"train_loss": -20.248638153076172, "global_step": 56536, "epoch": 681} {"train_loss": -19.978195190429688, "global_step": 56537, "epoch": 681} {"train_loss": -20.263507843017578, "global_step": 56538, "epoch": 681} {"train_loss": -20.264968872070312, "global_step": 56539, "epoch": 681} {"train_loss": -20.462289810180664, "global_step": 56540, "epoch": 681} {"train_loss": -19.852798461914062, "global_step": 56541, "epoch": 681} {"train_loss": -20.387121200561523, "global_step": 56542, "epoch": 681} {"train_loss": -20.362192153930664, "global_step": 56543, "epoch": 681} {"train_loss": -20.156497955322266, "global_step": 56544, "epoch": 681} {"train_loss": -20.25099754333496, "global_step": 56545, "epoch": 681} {"train_loss": -20.259069442749023, "global_step": 56546, "epoch": 681} {"train_loss": -20.079792022705078, "global_step": 56547, "epoch": 681} {"train_loss": -19.983762741088867, "global_step": 56548, "epoch": 681} {"train_loss": -20.196622848510742, "global_step": 56549, "epoch": 681} {"train_loss": -20.4957218170166, "global_step": 56550, "epoch": 681} {"train_loss": -20.06614875793457, "global_step": 56551, "epoch": 681} {"train_loss": -19.948575973510742, "global_step": 56552, "epoch": 681} {"train_loss": -20.386388778686523, "global_step": 56553, "epoch": 681} {"train_loss": -20.27910614013672, "global_step": 56554, "epoch": 681} {"train_loss": -19.95599937438965, "global_step": 56555, "epoch": 681} {"train_loss": -20.42096519470215, "global_step": 56556, "epoch": 681} {"train_loss": -20.037580490112305, "global_step": 56557, "epoch": 681} {"train_loss": -20.159543991088867, "global_step": 56558, "epoch": 681} {"train_loss": -20.143844604492188, "global_step": 56559, "epoch": 681} {"train_loss": -20.2194881439209, "global_step": 56560, "epoch": 681} {"train_loss": -19.970767974853516, "global_step": 56561, "epoch": 681} {"train_loss": -20.217756271362305, "global_step": 56562, "epoch": 681} {"train_loss": -20.39565086364746, "global_step": 56563, "epoch": 681} {"train_loss": -20.25546646118164, "global_step": 56564, "epoch": 681} {"train_loss": -19.84662437438965, "global_step": 56565, "epoch": 681} {"train_loss": -19.925703048706055, "global_step": 56566, "epoch": 681} {"train_loss": -19.875720977783203, "global_step": 56567, "epoch": 681} {"train_loss": -20.1204891204834, "global_step": 56568, "epoch": 681} {"train_loss": -20.35636329650879, "global_step": 56569, "epoch": 681} {"train_loss": -20.337814331054688, "global_step": 56570, "epoch": 681} {"train_loss": -19.84787368774414, "global_step": 56571, "epoch": 681} {"train_loss": -20.103300094604492, "global_step": 56572, "epoch": 681} {"train_loss": -20.154560089111328, "global_step": 56573, "epoch": 681} {"train_loss": -20.73190689086914, "global_step": 56574, "epoch": 681} {"train_loss": -20.37101173400879, "global_step": 56575, "epoch": 681} {"train_loss": -20.01030921936035, "global_step": 56576, "epoch": 681} {"train_loss": -20.14957046508789, "global_step": 56577, "epoch": 681} {"train_loss": -20.046567916870117, "global_step": 56578, "epoch": 681} {"train_loss": -20.181716918945312, "global_step": 56579, "epoch": 681} {"train_loss": -20.13726806640625, "global_step": 56580, "epoch": 681} {"train_loss": -20.42411231994629, "global_step": 56581, "epoch": 681} {"train_loss": -20.194021224975586, "global_step": 56582, "epoch": 681} {"train_loss": -20.115964889526367, "global_step": 56583, "epoch": 681} {"train_loss": -20.187461853027344, "global_step": 56584, "epoch": 681} {"train_loss": -20.147798538208008, "global_step": 56585, "epoch": 681} {"train_loss": -20.428892135620117, "global_step": 56586, "epoch": 681} {"train_loss": -20.09242057800293, "global_step": 56587, "epoch": 681} {"train_loss": -20.261341094970703, "global_step": 56588, "epoch": 681} {"train_loss": -20.322113037109375, "global_step": 56589, "epoch": 681} {"train_loss": -20.43511199951172, "global_step": 56590, "epoch": 681} {"train_loss": -20.21698570251465, "global_step": 56591, "epoch": 681} {"train_loss": -20.16379165649414, "global_step": 56592, "epoch": 681} {"train_loss": -20.256473541259766, "global_step": 56593, "epoch": 681} {"train_loss": -20.272552490234375, "global_step": 56594, "epoch": 681} {"train_loss": -20.251134872436523, "global_step": 56595, "epoch": 681} {"train_loss": -20.460416793823242, "global_step": 56596, "epoch": 681} {"train_loss": -19.938169479370117, "global_step": 56597, "epoch": 681} {"train_loss": -20.203947067260742, "global_step": 56598, "epoch": 681} {"train_loss": -19.967838287353516, "global_step": 56599, "epoch": 681} {"train_loss": -20.273662567138672, "global_step": 56600, "epoch": 681} {"train_loss": -20.276567459106445, "global_step": 56601, "epoch": 681} {"train_loss": -20.099689483642578, "global_step": 56602, "epoch": 681} {"train_loss": -19.936697006225586, "global_step": 56603, "epoch": 681} {"train_loss": -20.297992706298828, "global_step": 56604, "epoch": 681} {"train_loss": -20.183213659079676, "global_step": 56605, "epoch": 681, "val_loss": 5975886.0} {"train_loss": -20.194629669189453, "global_step": 56606, "epoch": 682} {"train_loss": -20.286788940429688, "global_step": 56607, "epoch": 682} {"train_loss": -19.749095916748047, "global_step": 56608, "epoch": 682} {"train_loss": -20.202621459960938, "global_step": 56609, "epoch": 682} {"train_loss": -19.990285873413086, "global_step": 56610, "epoch": 682} {"train_loss": -19.769319534301758, "global_step": 56611, "epoch": 682} {"train_loss": -19.89729118347168, "global_step": 56612, "epoch": 682} {"train_loss": -20.151906967163086, "global_step": 56613, "epoch": 682} {"train_loss": -20.30315399169922, "global_step": 56614, "epoch": 682} {"train_loss": -20.18070411682129, "global_step": 56615, "epoch": 682} {"train_loss": -19.92886734008789, "global_step": 56616, "epoch": 682} {"train_loss": -20.574384689331055, "global_step": 56617, "epoch": 682} {"train_loss": -20.092731475830078, "global_step": 56618, "epoch": 682} {"train_loss": -20.529293060302734, "global_step": 56619, "epoch": 682} {"train_loss": -20.28183937072754, "global_step": 56620, "epoch": 682} {"train_loss": -20.32966423034668, "global_step": 56621, "epoch": 682} {"train_loss": -20.115495681762695, "global_step": 56622, "epoch": 682} {"train_loss": -20.162372589111328, "global_step": 56623, "epoch": 682} {"train_loss": -19.9593563079834, "global_step": 56624, "epoch": 682} {"train_loss": -20.055479049682617, "global_step": 56625, "epoch": 682} {"train_loss": -20.065439224243164, "global_step": 56626, "epoch": 682} {"train_loss": -20.40006446838379, "global_step": 56627, "epoch": 682} {"train_loss": -20.153173446655273, "global_step": 56628, "epoch": 682} {"train_loss": -20.264404296875, "global_step": 56629, "epoch": 682} {"train_loss": -20.218164443969727, "global_step": 56630, "epoch": 682} {"train_loss": -20.222078323364258, "global_step": 56631, "epoch": 682} {"train_loss": -20.298795700073242, "global_step": 56632, "epoch": 682} {"train_loss": -20.0493221282959, "global_step": 56633, "epoch": 682} {"train_loss": -20.19313621520996, "global_step": 56634, "epoch": 682} {"train_loss": -20.132131576538086, "global_step": 56635, "epoch": 682} {"train_loss": -20.362436294555664, "global_step": 56636, "epoch": 682} {"train_loss": -20.118146896362305, "global_step": 56637, "epoch": 682} {"train_loss": -20.397123336791992, "global_step": 56638, "epoch": 682} {"train_loss": -20.305702209472656, "global_step": 56639, "epoch": 682} {"train_loss": -20.254079818725586, "global_step": 56640, "epoch": 682} {"train_loss": -20.686809539794922, "global_step": 56641, "epoch": 682} {"train_loss": -20.144346237182617, "global_step": 56642, "epoch": 682} {"train_loss": -20.161880493164062, "global_step": 56643, "epoch": 682} {"train_loss": -20.203704833984375, "global_step": 56644, "epoch": 682} {"train_loss": -20.49771499633789, "global_step": 56645, "epoch": 682} {"train_loss": -20.38490867614746, "global_step": 56646, "epoch": 682} {"train_loss": -20.522106170654297, "global_step": 56647, "epoch": 682} {"train_loss": -20.291141510009766, "global_step": 56648, "epoch": 682} {"train_loss": -20.108373641967773, "global_step": 56649, "epoch": 682} {"train_loss": -19.941713333129883, "global_step": 56650, "epoch": 682} {"train_loss": -20.205204010009766, "global_step": 56651, "epoch": 682} {"train_loss": -20.259567260742188, "global_step": 56652, "epoch": 682} {"train_loss": -20.190595626831055, "global_step": 56653, "epoch": 682} {"train_loss": -20.490461349487305, "global_step": 56654, "epoch": 682} {"train_loss": -20.229238510131836, "global_step": 56655, "epoch": 682} {"train_loss": -20.134557723999023, "global_step": 56656, "epoch": 682} {"train_loss": -19.9655818939209, "global_step": 56657, "epoch": 682} {"train_loss": -20.315753936767578, "global_step": 56658, "epoch": 682} {"train_loss": -20.59793472290039, "global_step": 56659, "epoch": 682} {"train_loss": -19.838735580444336, "global_step": 56660, "epoch": 682} {"train_loss": -20.203664779663086, "global_step": 56661, "epoch": 682} {"train_loss": -20.404911041259766, "global_step": 56662, "epoch": 682} {"train_loss": -20.483728408813477, "global_step": 56663, "epoch": 682} {"train_loss": -20.72077178955078, "global_step": 56664, "epoch": 682} {"train_loss": -20.49800682067871, "global_step": 56665, "epoch": 682} {"train_loss": -20.004995346069336, "global_step": 56666, "epoch": 682} {"train_loss": -20.359600067138672, "global_step": 56667, "epoch": 682} {"train_loss": -20.4705810546875, "global_step": 56668, "epoch": 682} {"train_loss": -20.61034393310547, "global_step": 56669, "epoch": 682} {"train_loss": -20.16147232055664, "global_step": 56670, "epoch": 682} {"train_loss": -20.448516845703125, "global_step": 56671, "epoch": 682} {"train_loss": -20.618877410888672, "global_step": 56672, "epoch": 682} {"train_loss": -20.25063705444336, "global_step": 56673, "epoch": 682} {"train_loss": -20.245573043823242, "global_step": 56674, "epoch": 682} {"train_loss": -19.767797470092773, "global_step": 56675, "epoch": 682} {"train_loss": -20.258630752563477, "global_step": 56676, "epoch": 682} {"train_loss": -19.931184768676758, "global_step": 56677, "epoch": 682} {"train_loss": -20.300121307373047, "global_step": 56678, "epoch": 682} {"train_loss": -20.314022064208984, "global_step": 56679, "epoch": 682} {"train_loss": -20.218767166137695, "global_step": 56680, "epoch": 682} {"train_loss": -20.56271743774414, "global_step": 56681, "epoch": 682} {"train_loss": -20.383975982666016, "global_step": 56682, "epoch": 682} {"train_loss": -19.947843551635742, "global_step": 56683, "epoch": 682} {"train_loss": -20.226123809814453, "global_step": 56684, "epoch": 682} {"train_loss": -20.80413246154785, "global_step": 56685, "epoch": 682} {"train_loss": -20.16309928894043, "global_step": 56686, "epoch": 682} {"train_loss": -20.35640525817871, "global_step": 56687, "epoch": 682} {"train_loss": -20.245465933558453, "global_step": 56688, "epoch": 682, "val_loss": 6003919.0} {"train_loss": -20.07655906677246, "global_step": 56689, "epoch": 683} {"train_loss": -20.35995101928711, "global_step": 56690, "epoch": 683} {"train_loss": -20.01291275024414, "global_step": 56691, "epoch": 683} {"train_loss": -20.266016006469727, "global_step": 56692, "epoch": 683} {"train_loss": -20.229419708251953, "global_step": 56693, "epoch": 683} {"train_loss": -19.985193252563477, "global_step": 56694, "epoch": 683} {"train_loss": -20.241016387939453, "global_step": 56695, "epoch": 683} {"train_loss": -19.96569061279297, "global_step": 56696, "epoch": 683} {"train_loss": -20.2290096282959, "global_step": 56697, "epoch": 683} {"train_loss": -20.170875549316406, "global_step": 56698, "epoch": 683} {"train_loss": -20.347707748413086, "global_step": 56699, "epoch": 683} {"train_loss": -20.282257080078125, "global_step": 56700, "epoch": 683} {"train_loss": -19.995298385620117, "global_step": 56701, "epoch": 683} {"train_loss": -20.231586456298828, "global_step": 56702, "epoch": 683} {"train_loss": -20.50496482849121, "global_step": 56703, "epoch": 683} {"train_loss": -20.0400390625, "global_step": 56704, "epoch": 683} {"train_loss": -20.086166381835938, "global_step": 56705, "epoch": 683} {"train_loss": -20.345951080322266, "global_step": 56706, "epoch": 683} {"train_loss": -20.761438369750977, "global_step": 56707, "epoch": 683} {"train_loss": -20.298181533813477, "global_step": 56708, "epoch": 683} {"train_loss": -20.140766143798828, "global_step": 56709, "epoch": 683} {"train_loss": -20.3161678314209, "global_step": 56710, "epoch": 683} {"train_loss": -20.334278106689453, "global_step": 56711, "epoch": 683} {"train_loss": -20.114505767822266, "global_step": 56712, "epoch": 683} {"train_loss": -20.091815948486328, "global_step": 56713, "epoch": 683} {"train_loss": -20.370254516601562, "global_step": 56714, "epoch": 683} {"train_loss": -19.92144775390625, "global_step": 56715, "epoch": 683} {"train_loss": -20.173229217529297, "global_step": 56716, "epoch": 683} {"train_loss": -20.368743896484375, "global_step": 56717, "epoch": 683} {"train_loss": -20.06178092956543, "global_step": 56718, "epoch": 683} {"train_loss": -19.965795516967773, "global_step": 56719, "epoch": 683} {"train_loss": -20.36603355407715, "global_step": 56720, "epoch": 683} {"train_loss": -20.06374168395996, "global_step": 56721, "epoch": 683} {"train_loss": -20.01521110534668, "global_step": 56722, "epoch": 683} {"train_loss": -20.283714294433594, "global_step": 56723, "epoch": 683} {"train_loss": -20.19716453552246, "global_step": 56724, "epoch": 683} {"train_loss": -20.590116500854492, "global_step": 56725, "epoch": 683} {"train_loss": -20.156339645385742, "global_step": 56726, "epoch": 683} {"train_loss": -20.54775047302246, "global_step": 56727, "epoch": 683} {"train_loss": -20.28093910217285, "global_step": 56728, "epoch": 683} {"train_loss": -20.48468780517578, "global_step": 56729, "epoch": 683} {"train_loss": -20.27329444885254, "global_step": 56730, "epoch": 683} {"train_loss": -20.68263816833496, "global_step": 56731, "epoch": 683} {"train_loss": -19.88299560546875, "global_step": 56732, "epoch": 683} {"train_loss": -20.182863235473633, "global_step": 56733, "epoch": 683} {"train_loss": -20.529098510742188, "global_step": 56734, "epoch": 683} {"train_loss": -20.036869049072266, "global_step": 56735, "epoch": 683} {"train_loss": -20.366931915283203, "global_step": 56736, "epoch": 683} {"train_loss": -20.053730010986328, "global_step": 56737, "epoch": 683} {"train_loss": -20.393888473510742, "global_step": 56738, "epoch": 683} {"train_loss": -20.31460952758789, "global_step": 56739, "epoch": 683} {"train_loss": -20.096210479736328, "global_step": 56740, "epoch": 683} {"train_loss": -19.799314498901367, "global_step": 56741, "epoch": 683} {"train_loss": -20.203725814819336, "global_step": 56742, "epoch": 683} {"train_loss": -19.98630142211914, "global_step": 56743, "epoch": 683} {"train_loss": -20.189281463623047, "global_step": 56744, "epoch": 683} {"train_loss": -20.11310386657715, "global_step": 56745, "epoch": 683} {"train_loss": -20.150989532470703, "global_step": 56746, "epoch": 683} {"train_loss": -20.08266258239746, "global_step": 56747, "epoch": 683} {"train_loss": -20.354515075683594, "global_step": 56748, "epoch": 683} {"train_loss": -20.264694213867188, "global_step": 56749, "epoch": 683} {"train_loss": -20.257463455200195, "global_step": 56750, "epoch": 683} {"train_loss": -20.026193618774414, "global_step": 56751, "epoch": 683} {"train_loss": -20.461597442626953, "global_step": 56752, "epoch": 683} {"train_loss": -20.593692779541016, "global_step": 56753, "epoch": 683} {"train_loss": -20.528913497924805, "global_step": 56754, "epoch": 683} {"train_loss": -20.56462860107422, "global_step": 56755, "epoch": 683} {"train_loss": -20.196260452270508, "global_step": 56756, "epoch": 683} {"train_loss": -20.411243438720703, "global_step": 56757, "epoch": 683} {"train_loss": -20.07560157775879, "global_step": 56758, "epoch": 683} {"train_loss": -19.90547752380371, "global_step": 56759, "epoch": 683} {"train_loss": -20.110761642456055, "global_step": 56760, "epoch": 683} {"train_loss": -19.8227596282959, "global_step": 56761, "epoch": 683} {"train_loss": -20.05586814880371, "global_step": 56762, "epoch": 683} {"train_loss": -20.10367774963379, "global_step": 56763, "epoch": 683} {"train_loss": -20.00636863708496, "global_step": 56764, "epoch": 683} {"train_loss": -19.998624801635742, "global_step": 56765, "epoch": 683} {"train_loss": -19.984867095947266, "global_step": 56766, "epoch": 683} {"train_loss": -20.125415802001953, "global_step": 56767, "epoch": 683} {"train_loss": -19.987754821777344, "global_step": 56768, "epoch": 683} {"train_loss": -19.981586456298828, "global_step": 56769, "epoch": 683} {"train_loss": -20.154088973999023, "global_step": 56770, "epoch": 683} {"train_loss": -20.204355929271284, "global_step": 56771, "epoch": 683, "val_loss": 5962044.5} {"train_loss": -20.153018951416016, "global_step": 56772, "epoch": 684} {"train_loss": -19.668720245361328, "global_step": 56773, "epoch": 684} {"train_loss": -20.352792739868164, "global_step": 56774, "epoch": 684} {"train_loss": -20.268957138061523, "global_step": 56775, "epoch": 684} {"train_loss": -20.176170349121094, "global_step": 56776, "epoch": 684} {"train_loss": -19.93504524230957, "global_step": 56777, "epoch": 684} {"train_loss": -20.141328811645508, "global_step": 56778, "epoch": 684} {"train_loss": -20.274044036865234, "global_step": 56779, "epoch": 684} {"train_loss": -20.162952423095703, "global_step": 56780, "epoch": 684} {"train_loss": -20.480762481689453, "global_step": 56781, "epoch": 684} {"train_loss": -20.204103469848633, "global_step": 56782, "epoch": 684} {"train_loss": -20.148157119750977, "global_step": 56783, "epoch": 684} {"train_loss": -19.85546875, "global_step": 56784, "epoch": 684} {"train_loss": -20.1374568939209, "global_step": 56785, "epoch": 684} {"train_loss": -20.375350952148438, "global_step": 56786, "epoch": 684} {"train_loss": -20.04749298095703, "global_step": 56787, "epoch": 684} {"train_loss": -20.45487403869629, "global_step": 56788, "epoch": 684} {"train_loss": -20.40862464904785, "global_step": 56789, "epoch": 684} {"train_loss": -20.235212326049805, "global_step": 56790, "epoch": 684} {"train_loss": -20.19319725036621, "global_step": 56791, "epoch": 684} {"train_loss": -20.54015350341797, "global_step": 56792, "epoch": 684} {"train_loss": -20.555553436279297, "global_step": 56793, "epoch": 684} {"train_loss": -20.240230560302734, "global_step": 56794, "epoch": 684} {"train_loss": -20.050411224365234, "global_step": 56795, "epoch": 684} {"train_loss": -20.306610107421875, "global_step": 56796, "epoch": 684} {"train_loss": -20.72939109802246, "global_step": 56797, "epoch": 684} {"train_loss": -20.574365615844727, "global_step": 56798, "epoch": 684} {"train_loss": -20.495637893676758, "global_step": 56799, "epoch": 684} {"train_loss": -20.290502548217773, "global_step": 56800, "epoch": 684} {"train_loss": -20.358346939086914, "global_step": 56801, "epoch": 684} {"train_loss": -20.017181396484375, "global_step": 56802, "epoch": 684} {"train_loss": -20.268552780151367, "global_step": 56803, "epoch": 684} {"train_loss": -19.89961814880371, "global_step": 56804, "epoch": 684} {"train_loss": -20.379453659057617, "global_step": 56805, "epoch": 684} {"train_loss": -20.414453506469727, "global_step": 56806, "epoch": 684} {"train_loss": -20.29843521118164, "global_step": 56807, "epoch": 684} {"train_loss": -20.378854751586914, "global_step": 56808, "epoch": 684} {"train_loss": -20.161518096923828, "global_step": 56809, "epoch": 684} {"train_loss": -20.276966094970703, "global_step": 56810, "epoch": 684} {"train_loss": -20.141332626342773, "global_step": 56811, "epoch": 684} {"train_loss": -19.93727684020996, "global_step": 56812, "epoch": 684} {"train_loss": -20.220678329467773, "global_step": 56813, "epoch": 684} {"train_loss": -20.132099151611328, "global_step": 56814, "epoch": 684} {"train_loss": -20.248205184936523, "global_step": 56815, "epoch": 684} {"train_loss": -20.474620819091797, "global_step": 56816, "epoch": 684} {"train_loss": -20.16786003112793, "global_step": 56817, "epoch": 684} {"train_loss": -20.2667179107666, "global_step": 56818, "epoch": 684} {"train_loss": -20.045211791992188, "global_step": 56819, "epoch": 684} {"train_loss": -20.135011672973633, "global_step": 56820, "epoch": 684} {"train_loss": -20.056806564331055, "global_step": 56821, "epoch": 684} {"train_loss": -19.977460861206055, "global_step": 56822, "epoch": 684} {"train_loss": -20.538406372070312, "global_step": 56823, "epoch": 684} {"train_loss": -20.04819679260254, "global_step": 56824, "epoch": 684} {"train_loss": -20.0964412689209, "global_step": 56825, "epoch": 684} {"train_loss": -20.2156925201416, "global_step": 56826, "epoch": 684} {"train_loss": -20.136594772338867, "global_step": 56827, "epoch": 684} {"train_loss": -20.506763458251953, "global_step": 56828, "epoch": 684} {"train_loss": -20.382326126098633, "global_step": 56829, "epoch": 684} {"train_loss": -20.37476921081543, "global_step": 56830, "epoch": 684} {"train_loss": -19.771493911743164, "global_step": 56831, "epoch": 684} {"train_loss": -19.934926986694336, "global_step": 56832, "epoch": 684} {"train_loss": -20.262537002563477, "global_step": 56833, "epoch": 684} {"train_loss": -20.38588523864746, "global_step": 56834, "epoch": 684} {"train_loss": -19.813446044921875, "global_step": 56835, "epoch": 684} {"train_loss": -20.15549659729004, "global_step": 56836, "epoch": 684} {"train_loss": -20.00775718688965, "global_step": 56837, "epoch": 684} {"train_loss": -20.243146896362305, "global_step": 56838, "epoch": 684} {"train_loss": -20.355182647705078, "global_step": 56839, "epoch": 684} {"train_loss": -20.38935661315918, "global_step": 56840, "epoch": 684} {"train_loss": -20.508520126342773, "global_step": 56841, "epoch": 684} {"train_loss": -20.61097526550293, "global_step": 56842, "epoch": 684} {"train_loss": -20.1939640045166, "global_step": 56843, "epoch": 684} {"train_loss": -20.49380874633789, "global_step": 56844, "epoch": 684} {"train_loss": -20.56572723388672, "global_step": 56845, "epoch": 684} {"train_loss": -20.19329833984375, "global_step": 56846, "epoch": 684} {"train_loss": -20.42914390563965, "global_step": 56847, "epoch": 684} {"train_loss": -20.395849227905273, "global_step": 56848, "epoch": 684} {"train_loss": -20.106536865234375, "global_step": 56849, "epoch": 684} {"train_loss": -20.180978775024414, "global_step": 56850, "epoch": 684} {"train_loss": -19.965713500976562, "global_step": 56851, "epoch": 684} {"train_loss": -20.435211181640625, "global_step": 56852, "epoch": 684} {"train_loss": -20.3369140625, "global_step": 56853, "epoch": 684} {"train_loss": -20.24163073804005, "global_step": 56854, "epoch": 684, "val_loss": 5984084.0} {"train_loss": -20.284547805786133, "global_step": 56855, "epoch": 685} {"train_loss": -20.207937240600586, "global_step": 56856, "epoch": 685} {"train_loss": -20.450918197631836, "global_step": 56857, "epoch": 685} {"train_loss": -20.272174835205078, "global_step": 56858, "epoch": 685} {"train_loss": -20.122095108032227, "global_step": 56859, "epoch": 685} {"train_loss": -20.103696823120117, "global_step": 56860, "epoch": 685} {"train_loss": -19.903791427612305, "global_step": 56861, "epoch": 685} {"train_loss": -20.215505599975586, "global_step": 56862, "epoch": 685} {"train_loss": -20.12809181213379, "global_step": 56863, "epoch": 685} {"train_loss": -20.688203811645508, "global_step": 56864, "epoch": 685} {"train_loss": -20.030012130737305, "global_step": 56865, "epoch": 685} {"train_loss": -19.900976181030273, "global_step": 56866, "epoch": 685} {"train_loss": -20.220373153686523, "global_step": 56867, "epoch": 685} {"train_loss": -20.577009201049805, "global_step": 56868, "epoch": 685} {"train_loss": -19.969745635986328, "global_step": 56869, "epoch": 685} {"train_loss": -20.5185546875, "global_step": 56870, "epoch": 685} {"train_loss": -20.3403377532959, "global_step": 56871, "epoch": 685} {"train_loss": -20.672443389892578, "global_step": 56872, "epoch": 685} {"train_loss": -20.258703231811523, "global_step": 56873, "epoch": 685} {"train_loss": -20.21271324157715, "global_step": 56874, "epoch": 685} {"train_loss": -20.476268768310547, "global_step": 56875, "epoch": 685} {"train_loss": -20.357717514038086, "global_step": 56876, "epoch": 685} {"train_loss": -20.424449920654297, "global_step": 56877, "epoch": 685} {"train_loss": -20.13917350769043, "global_step": 56878, "epoch": 685} {"train_loss": -19.761152267456055, "global_step": 56879, "epoch": 685} {"train_loss": -20.108304977416992, "global_step": 56880, "epoch": 685} {"train_loss": -20.436222076416016, "global_step": 56881, "epoch": 685} {"train_loss": -20.491565704345703, "global_step": 56882, "epoch": 685} {"train_loss": -19.905776977539062, "global_step": 56883, "epoch": 685} {"train_loss": -20.54969596862793, "global_step": 56884, "epoch": 685} {"train_loss": -20.135513305664062, "global_step": 56885, "epoch": 685} {"train_loss": -20.35944175720215, "global_step": 56886, "epoch": 685} {"train_loss": -20.027551651000977, "global_step": 56887, "epoch": 685} {"train_loss": -20.481290817260742, "global_step": 56888, "epoch": 685} {"train_loss": -20.028684616088867, "global_step": 56889, "epoch": 685} {"train_loss": -20.055517196655273, "global_step": 56890, "epoch": 685} {"train_loss": -20.606826782226562, "global_step": 56891, "epoch": 685} {"train_loss": -20.276132583618164, "global_step": 56892, "epoch": 685} {"train_loss": -19.926700592041016, "global_step": 56893, "epoch": 685} {"train_loss": -20.152069091796875, "global_step": 56894, "epoch": 685} {"train_loss": -20.230558395385742, "global_step": 56895, "epoch": 685} {"train_loss": -20.191173553466797, "global_step": 56896, "epoch": 685} {"train_loss": -20.043455123901367, "global_step": 56897, "epoch": 685} {"train_loss": -20.392621994018555, "global_step": 56898, "epoch": 685} {"train_loss": -20.26465606689453, "global_step": 56899, "epoch": 685} {"train_loss": -20.095935821533203, "global_step": 56900, "epoch": 685} {"train_loss": -20.440568923950195, "global_step": 56901, "epoch": 685} {"train_loss": -20.067829132080078, "global_step": 56902, "epoch": 685} {"train_loss": -19.831735610961914, "global_step": 56903, "epoch": 685} {"train_loss": -20.28971290588379, "global_step": 56904, "epoch": 685} {"train_loss": -19.970869064331055, "global_step": 56905, "epoch": 685} {"train_loss": -20.036901473999023, "global_step": 56906, "epoch": 685} {"train_loss": -20.001447677612305, "global_step": 56907, "epoch": 685} {"train_loss": -20.40386390686035, "global_step": 56908, "epoch": 685} {"train_loss": -20.408153533935547, "global_step": 56909, "epoch": 685} {"train_loss": -20.209857940673828, "global_step": 56910, "epoch": 685} {"train_loss": -19.90477752685547, "global_step": 56911, "epoch": 685} {"train_loss": -20.13370132446289, "global_step": 56912, "epoch": 685} {"train_loss": -20.187192916870117, "global_step": 56913, "epoch": 685} {"train_loss": -20.031728744506836, "global_step": 56914, "epoch": 685} {"train_loss": -20.298171997070312, "global_step": 56915, "epoch": 685} {"train_loss": -20.30329704284668, "global_step": 56916, "epoch": 685} {"train_loss": -20.10280418395996, "global_step": 56917, "epoch": 685} {"train_loss": -20.22431755065918, "global_step": 56918, "epoch": 685} {"train_loss": -20.17531394958496, "global_step": 56919, "epoch": 685} {"train_loss": -20.174026489257812, "global_step": 56920, "epoch": 685} {"train_loss": -20.501672744750977, "global_step": 56921, "epoch": 685} {"train_loss": -20.376956939697266, "global_step": 56922, "epoch": 685} {"train_loss": -20.353410720825195, "global_step": 56923, "epoch": 685} {"train_loss": -20.42708396911621, "global_step": 56924, "epoch": 685} {"train_loss": -20.410104751586914, "global_step": 56925, "epoch": 685} {"train_loss": -20.377782821655273, "global_step": 56926, "epoch": 685} {"train_loss": -20.336206436157227, "global_step": 56927, "epoch": 685} {"train_loss": -19.8756160736084, "global_step": 56928, "epoch": 685} {"train_loss": -20.52311897277832, "global_step": 56929, "epoch": 685} {"train_loss": -20.266508102416992, "global_step": 56930, "epoch": 685} {"train_loss": -20.140348434448242, "global_step": 56931, "epoch": 685} {"train_loss": -20.459402084350586, "global_step": 56932, "epoch": 685} {"train_loss": -19.95115089416504, "global_step": 56933, "epoch": 685} {"train_loss": -20.387577056884766, "global_step": 56934, "epoch": 685} {"train_loss": -20.356260299682617, "global_step": 56935, "epoch": 685} {"train_loss": -20.228008270263672, "global_step": 56936, "epoch": 685} {"train_loss": -20.207010797707433, "global_step": 56937, "epoch": 685, "val_loss": 5916973.0} {"train_loss": -20.272075653076172, "global_step": 56938, "epoch": 686} {"train_loss": -20.1851863861084, "global_step": 56939, "epoch": 686} {"train_loss": -19.906169891357422, "global_step": 56940, "epoch": 686} {"train_loss": -20.372756958007812, "global_step": 56941, "epoch": 686} {"train_loss": -19.96401596069336, "global_step": 56942, "epoch": 686} {"train_loss": -20.207721710205078, "global_step": 56943, "epoch": 686} {"train_loss": -19.922107696533203, "global_step": 56944, "epoch": 686} {"train_loss": -20.043088912963867, "global_step": 56945, "epoch": 686} {"train_loss": -20.46358299255371, "global_step": 56946, "epoch": 686} {"train_loss": -20.285245895385742, "global_step": 56947, "epoch": 686} {"train_loss": -20.175621032714844, "global_step": 56948, "epoch": 686} {"train_loss": -20.06757926940918, "global_step": 56949, "epoch": 686} {"train_loss": -20.30539894104004, "global_step": 56950, "epoch": 686} {"train_loss": -20.210962295532227, "global_step": 56951, "epoch": 686} {"train_loss": -20.356632232666016, "global_step": 56952, "epoch": 686} {"train_loss": -20.18313217163086, "global_step": 56953, "epoch": 686} {"train_loss": -19.78754234313965, "global_step": 56954, "epoch": 686} {"train_loss": -20.098562240600586, "global_step": 56955, "epoch": 686} {"train_loss": -20.301485061645508, "global_step": 56956, "epoch": 686} {"train_loss": -20.734100341796875, "global_step": 56957, "epoch": 686} {"train_loss": -20.255231857299805, "global_step": 56958, "epoch": 686} {"train_loss": -20.0944766998291, "global_step": 56959, "epoch": 686} {"train_loss": -20.128265380859375, "global_step": 56960, "epoch": 686} {"train_loss": -20.239614486694336, "global_step": 56961, "epoch": 686} {"train_loss": -19.939237594604492, "global_step": 56962, "epoch": 686} {"train_loss": -20.389554977416992, "global_step": 56963, "epoch": 686} {"train_loss": -20.462295532226562, "global_step": 56964, "epoch": 686} {"train_loss": -20.098068237304688, "global_step": 56965, "epoch": 686} {"train_loss": -19.977649688720703, "global_step": 56966, "epoch": 686} {"train_loss": -20.318998336791992, "global_step": 56967, "epoch": 686} {"train_loss": -20.545988082885742, "global_step": 56968, "epoch": 686} {"train_loss": -20.345691680908203, "global_step": 56969, "epoch": 686} {"train_loss": -20.255327224731445, "global_step": 56970, "epoch": 686} {"train_loss": -20.09463882446289, "global_step": 56971, "epoch": 686} {"train_loss": -20.0789737701416, "global_step": 56972, "epoch": 686} {"train_loss": -20.213655471801758, "global_step": 56973, "epoch": 686} {"train_loss": -20.33125114440918, "global_step": 56974, "epoch": 686} {"train_loss": -20.064313888549805, "global_step": 56975, "epoch": 686} {"train_loss": -20.565195083618164, "global_step": 56976, "epoch": 686} {"train_loss": -19.640146255493164, "global_step": 56977, "epoch": 686} {"train_loss": -19.8092098236084, "global_step": 56978, "epoch": 686} {"train_loss": -20.491296768188477, "global_step": 56979, "epoch": 686} {"train_loss": -20.308834075927734, "global_step": 56980, "epoch": 686} {"train_loss": -19.989036560058594, "global_step": 56981, "epoch": 686} {"train_loss": -20.488662719726562, "global_step": 56982, "epoch": 686} {"train_loss": -20.22871971130371, "global_step": 56983, "epoch": 686} {"train_loss": -20.31415367126465, "global_step": 56984, "epoch": 686} {"train_loss": -19.96036148071289, "global_step": 56985, "epoch": 686} {"train_loss": -19.98257827758789, "global_step": 56986, "epoch": 686} {"train_loss": -20.51141929626465, "global_step": 56987, "epoch": 686} {"train_loss": -19.86276626586914, "global_step": 56988, "epoch": 686} {"train_loss": -20.536588668823242, "global_step": 56989, "epoch": 686} {"train_loss": -20.3537654876709, "global_step": 56990, "epoch": 686} {"train_loss": -20.225826263427734, "global_step": 56991, "epoch": 686} {"train_loss": -19.868896484375, "global_step": 56992, "epoch": 686} {"train_loss": -19.977346420288086, "global_step": 56993, "epoch": 686} {"train_loss": -20.355112075805664, "global_step": 56994, "epoch": 686} {"train_loss": -20.159391403198242, "global_step": 56995, "epoch": 686} {"train_loss": -20.235254287719727, "global_step": 56996, "epoch": 686} {"train_loss": -20.1790714263916, "global_step": 56997, "epoch": 686} {"train_loss": -20.638507843017578, "global_step": 56998, "epoch": 686} {"train_loss": -20.276660919189453, "global_step": 56999, "epoch": 686} {"train_loss": -20.068572998046875, "global_step": 57000, "epoch": 686} {"train_loss": -20.511383056640625, "global_step": 57001, "epoch": 686} {"train_loss": -19.934249877929688, "global_step": 57002, "epoch": 686} {"train_loss": -20.264062881469727, "global_step": 57003, "epoch": 686} {"train_loss": -20.152029037475586, "global_step": 57004, "epoch": 686} {"train_loss": -20.29236602783203, "global_step": 57005, "epoch": 686} {"train_loss": -19.761632919311523, "global_step": 57006, "epoch": 686} {"train_loss": -20.266332626342773, "global_step": 57007, "epoch": 686} {"train_loss": -20.05600929260254, "global_step": 57008, "epoch": 686} {"train_loss": -20.35931968688965, "global_step": 57009, "epoch": 686} {"train_loss": -20.080047607421875, "global_step": 57010, "epoch": 686} {"train_loss": -20.272794723510742, "global_step": 57011, "epoch": 686} {"train_loss": -20.14020347595215, "global_step": 57012, "epoch": 686} {"train_loss": -20.275020599365234, "global_step": 57013, "epoch": 686} {"train_loss": -20.00444221496582, "global_step": 57014, "epoch": 686} {"train_loss": -20.460983276367188, "global_step": 57015, "epoch": 686} {"train_loss": -20.017297744750977, "global_step": 57016, "epoch": 686} {"train_loss": -20.11175537109375, "global_step": 57017, "epoch": 686} {"train_loss": -20.677412033081055, "global_step": 57018, "epoch": 686} {"train_loss": -20.19109344482422, "global_step": 57019, "epoch": 686} {"train_loss": -20.20347700923322, "global_step": 57020, "epoch": 686, "val_loss": 6024162.0} {"train_loss": -19.035581588745117, "global_step": 57021, "epoch": 687} {"train_loss": -19.845853805541992, "global_step": 57022, "epoch": 687} {"train_loss": -19.25809669494629, "global_step": 57023, "epoch": 687} {"train_loss": -19.198148727416992, "global_step": 57024, "epoch": 687} {"train_loss": -19.64106559753418, "global_step": 57025, "epoch": 687} {"train_loss": -19.734020233154297, "global_step": 57026, "epoch": 687} {"train_loss": -19.948511123657227, "global_step": 57027, "epoch": 687} {"train_loss": -19.90534210205078, "global_step": 57028, "epoch": 687} {"train_loss": -19.879362106323242, "global_step": 57029, "epoch": 687} {"train_loss": -19.925703048706055, "global_step": 57030, "epoch": 687} {"train_loss": -20.056821823120117, "global_step": 57031, "epoch": 687} {"train_loss": -19.587249755859375, "global_step": 57032, "epoch": 687} {"train_loss": -20.071880340576172, "global_step": 57033, "epoch": 687} {"train_loss": -20.04323959350586, "global_step": 57034, "epoch": 687} {"train_loss": -20.19696617126465, "global_step": 57035, "epoch": 687} {"train_loss": -20.089338302612305, "global_step": 57036, "epoch": 687} {"train_loss": -20.060319900512695, "global_step": 57037, "epoch": 687} {"train_loss": -19.89539909362793, "global_step": 57038, "epoch": 687} {"train_loss": -20.199115753173828, "global_step": 57039, "epoch": 687} {"train_loss": -19.80695152282715, "global_step": 57040, "epoch": 687} {"train_loss": -20.23740005493164, "global_step": 57041, "epoch": 687} {"train_loss": -19.86594581604004, "global_step": 57042, "epoch": 687} {"train_loss": -20.278549194335938, "global_step": 57043, "epoch": 687} {"train_loss": -20.38520622253418, "global_step": 57044, "epoch": 687} {"train_loss": -20.469039916992188, "global_step": 57045, "epoch": 687} {"train_loss": -20.493574142456055, "global_step": 57046, "epoch": 687} {"train_loss": -20.25396156311035, "global_step": 57047, "epoch": 687} {"train_loss": -20.483793258666992, "global_step": 57048, "epoch": 687} {"train_loss": -20.207157135009766, "global_step": 57049, "epoch": 687} {"train_loss": -20.495159149169922, "global_step": 57050, "epoch": 687} {"train_loss": -20.38815689086914, "global_step": 57051, "epoch": 687} {"train_loss": -20.230070114135742, "global_step": 57052, "epoch": 687} {"train_loss": -19.88213348388672, "global_step": 57053, "epoch": 687} {"train_loss": -20.074399948120117, "global_step": 57054, "epoch": 687} {"train_loss": -19.77227783203125, "global_step": 57055, "epoch": 687} {"train_loss": -19.940078735351562, "global_step": 57056, "epoch": 687} {"train_loss": -20.116689682006836, "global_step": 57057, "epoch": 687} {"train_loss": -20.05086898803711, "global_step": 57058, "epoch": 687} {"train_loss": -20.160953521728516, "global_step": 57059, "epoch": 687} {"train_loss": -20.036081314086914, "global_step": 57060, "epoch": 687} {"train_loss": -20.054460525512695, "global_step": 57061, "epoch": 687} {"train_loss": -20.308395385742188, "global_step": 57062, "epoch": 687} {"train_loss": -20.105676651000977, "global_step": 57063, "epoch": 687} {"train_loss": -20.0631103515625, "global_step": 57064, "epoch": 687} {"train_loss": -20.22396469116211, "global_step": 57065, "epoch": 687} {"train_loss": -20.281593322753906, "global_step": 57066, "epoch": 687} {"train_loss": -20.30193328857422, "global_step": 57067, "epoch": 687} {"train_loss": -20.132823944091797, "global_step": 57068, "epoch": 687} {"train_loss": -20.313154220581055, "global_step": 57069, "epoch": 687} {"train_loss": -20.08196449279785, "global_step": 57070, "epoch": 687} {"train_loss": -20.390522003173828, "global_step": 57071, "epoch": 687} {"train_loss": -20.030445098876953, "global_step": 57072, "epoch": 687} {"train_loss": -20.367170333862305, "global_step": 57073, "epoch": 687} {"train_loss": -20.52503776550293, "global_step": 57074, "epoch": 687} {"train_loss": -20.077436447143555, "global_step": 57075, "epoch": 687} {"train_loss": -20.15558433532715, "global_step": 57076, "epoch": 687} {"train_loss": -20.244138717651367, "global_step": 57077, "epoch": 687} {"train_loss": -20.285430908203125, "global_step": 57078, "epoch": 687} {"train_loss": -20.044082641601562, "global_step": 57079, "epoch": 687} {"train_loss": -20.467985153198242, "global_step": 57080, "epoch": 687} {"train_loss": -20.53720474243164, "global_step": 57081, "epoch": 687} {"train_loss": -20.321317672729492, "global_step": 57082, "epoch": 687} {"train_loss": -20.11673355102539, "global_step": 57083, "epoch": 687} {"train_loss": -20.235258102416992, "global_step": 57084, "epoch": 687} {"train_loss": -20.44019889831543, "global_step": 57085, "epoch": 687} {"train_loss": -20.301509857177734, "global_step": 57086, "epoch": 687} {"train_loss": -20.313051223754883, "global_step": 57087, "epoch": 687} {"train_loss": -20.1846981048584, "global_step": 57088, "epoch": 687} {"train_loss": -20.403852462768555, "global_step": 57089, "epoch": 687} {"train_loss": -20.168649673461914, "global_step": 57090, "epoch": 687} {"train_loss": -20.307836532592773, "global_step": 57091, "epoch": 687} {"train_loss": -19.861011505126953, "global_step": 57092, "epoch": 687} {"train_loss": -20.49833106994629, "global_step": 57093, "epoch": 687} {"train_loss": -20.293424606323242, "global_step": 57094, "epoch": 687} {"train_loss": -20.1640567779541, "global_step": 57095, "epoch": 687} {"train_loss": -20.32429313659668, "global_step": 57096, "epoch": 687} {"train_loss": -20.342390060424805, "global_step": 57097, "epoch": 687} {"train_loss": -20.30817222595215, "global_step": 57098, "epoch": 687} {"train_loss": -19.952844619750977, "global_step": 57099, "epoch": 687} {"train_loss": -20.038190841674805, "global_step": 57100, "epoch": 687} {"train_loss": -20.516372680664062, "global_step": 57101, "epoch": 687} {"train_loss": -20.179819107055664, "global_step": 57102, "epoch": 687} {"train_loss": -20.13874357292451, "global_step": 57103, "epoch": 687, "val_loss": 5962673.0} {"train_loss": -20.487977981567383, "global_step": 57104, "epoch": 688} {"train_loss": -20.400590896606445, "global_step": 57105, "epoch": 688} {"train_loss": -20.285276412963867, "global_step": 57106, "epoch": 688} {"train_loss": -20.05447769165039, "global_step": 57107, "epoch": 688} {"train_loss": -20.29861831665039, "global_step": 57108, "epoch": 688} {"train_loss": -20.25366973876953, "global_step": 57109, "epoch": 688} {"train_loss": -20.02931022644043, "global_step": 57110, "epoch": 688} {"train_loss": -20.389848709106445, "global_step": 57111, "epoch": 688} {"train_loss": -20.18807029724121, "global_step": 57112, "epoch": 688} {"train_loss": -20.15765953063965, "global_step": 57113, "epoch": 688} {"train_loss": -20.026060104370117, "global_step": 57114, "epoch": 688} {"train_loss": -20.259214401245117, "global_step": 57115, "epoch": 688} {"train_loss": -20.327075958251953, "global_step": 57116, "epoch": 688} {"train_loss": -20.226179122924805, "global_step": 57117, "epoch": 688} {"train_loss": -20.358421325683594, "global_step": 57118, "epoch": 688} {"train_loss": -20.250207901000977, "global_step": 57119, "epoch": 688} {"train_loss": -20.458864212036133, "global_step": 57120, "epoch": 688} {"train_loss": -20.199350357055664, "global_step": 57121, "epoch": 688} {"train_loss": -20.658605575561523, "global_step": 57122, "epoch": 688} {"train_loss": -20.257247924804688, "global_step": 57123, "epoch": 688} {"train_loss": -20.001291275024414, "global_step": 57124, "epoch": 688} {"train_loss": -20.1927547454834, "global_step": 57125, "epoch": 688} {"train_loss": -20.292373657226562, "global_step": 57126, "epoch": 688} {"train_loss": -20.549331665039062, "global_step": 57127, "epoch": 688} {"train_loss": -20.37619972229004, "global_step": 57128, "epoch": 688} {"train_loss": -20.252132415771484, "global_step": 57129, "epoch": 688} {"train_loss": -20.52504539489746, "global_step": 57130, "epoch": 688} {"train_loss": -20.120412826538086, "global_step": 57131, "epoch": 688} {"train_loss": -20.67594337463379, "global_step": 57132, "epoch": 688} {"train_loss": -19.933853149414062, "global_step": 57133, "epoch": 688} {"train_loss": -20.189258575439453, "global_step": 57134, "epoch": 688} {"train_loss": -20.055082321166992, "global_step": 57135, "epoch": 688} {"train_loss": -20.21879768371582, "global_step": 57136, "epoch": 688} {"train_loss": -20.53239631652832, "global_step": 57137, "epoch": 688} {"train_loss": -20.432126998901367, "global_step": 57138, "epoch": 688} {"train_loss": -19.795957565307617, "global_step": 57139, "epoch": 688} {"train_loss": -20.65534019470215, "global_step": 57140, "epoch": 688} {"train_loss": -19.824748992919922, "global_step": 57141, "epoch": 688} {"train_loss": -20.355581283569336, "global_step": 57142, "epoch": 688} {"train_loss": -20.4807186126709, "global_step": 57143, "epoch": 688} {"train_loss": -20.08815574645996, "global_step": 57144, "epoch": 688} {"train_loss": -20.44806671142578, "global_step": 57145, "epoch": 688} {"train_loss": -20.21820068359375, "global_step": 57146, "epoch": 688} {"train_loss": -20.00160789489746, "global_step": 57147, "epoch": 688} {"train_loss": -20.120147705078125, "global_step": 57148, "epoch": 688} {"train_loss": -20.09644317626953, "global_step": 57149, "epoch": 688} {"train_loss": -20.031728744506836, "global_step": 57150, "epoch": 688} {"train_loss": -20.45990753173828, "global_step": 57151, "epoch": 688} {"train_loss": -19.878652572631836, "global_step": 57152, "epoch": 688} {"train_loss": -20.288362503051758, "global_step": 57153, "epoch": 688} {"train_loss": -20.07584571838379, "global_step": 57154, "epoch": 688} {"train_loss": -20.382463455200195, "global_step": 57155, "epoch": 688} {"train_loss": -20.159141540527344, "global_step": 57156, "epoch": 688} {"train_loss": -20.210233688354492, "global_step": 57157, "epoch": 688} {"train_loss": -20.396081924438477, "global_step": 57158, "epoch": 688} {"train_loss": -19.98988914489746, "global_step": 57159, "epoch": 688} {"train_loss": -20.31905746459961, "global_step": 57160, "epoch": 688} {"train_loss": -20.25581932067871, "global_step": 57161, "epoch": 688} {"train_loss": -19.93398094177246, "global_step": 57162, "epoch": 688} {"train_loss": -20.32801628112793, "global_step": 57163, "epoch": 688} {"train_loss": -20.423297882080078, "global_step": 57164, "epoch": 688} {"train_loss": -20.22454833984375, "global_step": 57165, "epoch": 688} {"train_loss": -20.212919235229492, "global_step": 57166, "epoch": 688} {"train_loss": -20.049760818481445, "global_step": 57167, "epoch": 688} {"train_loss": -20.103017807006836, "global_step": 57168, "epoch": 688} {"train_loss": -20.288516998291016, "global_step": 57169, "epoch": 688} {"train_loss": -20.08721923828125, "global_step": 57170, "epoch": 688} {"train_loss": -20.57442283630371, "global_step": 57171, "epoch": 688} {"train_loss": -20.144229888916016, "global_step": 57172, "epoch": 688} {"train_loss": -20.313161849975586, "global_step": 57173, "epoch": 688} {"train_loss": -20.65895652770996, "global_step": 57174, "epoch": 688} {"train_loss": -20.255634307861328, "global_step": 57175, "epoch": 688} {"train_loss": -20.442663192749023, "global_step": 57176, "epoch": 688} {"train_loss": -20.481590270996094, "global_step": 57177, "epoch": 688} {"train_loss": -20.497028350830078, "global_step": 57178, "epoch": 688} {"train_loss": -20.03309440612793, "global_step": 57179, "epoch": 688} {"train_loss": -20.353321075439453, "global_step": 57180, "epoch": 688} {"train_loss": -20.259855270385742, "global_step": 57181, "epoch": 688} {"train_loss": -20.43644905090332, "global_step": 57182, "epoch": 688} {"train_loss": -20.354652404785156, "global_step": 57183, "epoch": 688} {"train_loss": -20.302474975585938, "global_step": 57184, "epoch": 688} {"train_loss": -19.912145614624023, "global_step": 57185, "epoch": 688} {"train_loss": -20.252246075365917, "global_step": 57186, "epoch": 688, "val_loss": 5955036.5} {"train_loss": -19.78754997253418, "global_step": 57187, "epoch": 689} {"train_loss": -20.08176040649414, "global_step": 57188, "epoch": 689} {"train_loss": -19.852703094482422, "global_step": 57189, "epoch": 689} {"train_loss": -20.504791259765625, "global_step": 57190, "epoch": 689} {"train_loss": -20.100889205932617, "global_step": 57191, "epoch": 689} {"train_loss": -19.87306022644043, "global_step": 57192, "epoch": 689} {"train_loss": -20.252464294433594, "global_step": 57193, "epoch": 689} {"train_loss": -19.93243408203125, "global_step": 57194, "epoch": 689} {"train_loss": -20.444091796875, "global_step": 57195, "epoch": 689} {"train_loss": -20.19879913330078, "global_step": 57196, "epoch": 689} {"train_loss": -20.560758590698242, "global_step": 57197, "epoch": 689} {"train_loss": -20.17814064025879, "global_step": 57198, "epoch": 689} {"train_loss": -20.033843994140625, "global_step": 57199, "epoch": 689} {"train_loss": -20.09123992919922, "global_step": 57200, "epoch": 689} {"train_loss": -20.298093795776367, "global_step": 57201, "epoch": 689} {"train_loss": -19.998685836791992, "global_step": 57202, "epoch": 689} {"train_loss": -20.319684982299805, "global_step": 57203, "epoch": 689} {"train_loss": -19.916671752929688, "global_step": 57204, "epoch": 689} {"train_loss": -20.31118392944336, "global_step": 57205, "epoch": 689} {"train_loss": -20.093704223632812, "global_step": 57206, "epoch": 689} {"train_loss": -20.25446891784668, "global_step": 57207, "epoch": 689} {"train_loss": -20.438623428344727, "global_step": 57208, "epoch": 689} {"train_loss": -20.434654235839844, "global_step": 57209, "epoch": 689} {"train_loss": -19.914592742919922, "global_step": 57210, "epoch": 689} {"train_loss": -19.879384994506836, "global_step": 57211, "epoch": 689} {"train_loss": -20.404102325439453, "global_step": 57212, "epoch": 689} {"train_loss": -20.052885055541992, "global_step": 57213, "epoch": 689} {"train_loss": -20.149076461791992, "global_step": 57214, "epoch": 689} {"train_loss": -20.504444122314453, "global_step": 57215, "epoch": 689} {"train_loss": -20.60265350341797, "global_step": 57216, "epoch": 689} {"train_loss": -20.274755477905273, "global_step": 57217, "epoch": 689} {"train_loss": -20.117021560668945, "global_step": 57218, "epoch": 689} {"train_loss": -20.367115020751953, "global_step": 57219, "epoch": 689} {"train_loss": -20.52833366394043, "global_step": 57220, "epoch": 689} {"train_loss": -20.52986717224121, "global_step": 57221, "epoch": 689} {"train_loss": -20.3339900970459, "global_step": 57222, "epoch": 689} {"train_loss": -20.170337677001953, "global_step": 57223, "epoch": 689} {"train_loss": -20.252729415893555, "global_step": 57224, "epoch": 689} {"train_loss": -19.822385787963867, "global_step": 57225, "epoch": 689} {"train_loss": -20.456769943237305, "global_step": 57226, "epoch": 689} {"train_loss": -20.480609893798828, "global_step": 57227, "epoch": 689} {"train_loss": -20.10783576965332, "global_step": 57228, "epoch": 689} {"train_loss": -20.413610458374023, "global_step": 57229, "epoch": 689} {"train_loss": -20.054208755493164, "global_step": 57230, "epoch": 689} {"train_loss": -19.78767967224121, "global_step": 57231, "epoch": 689} {"train_loss": -20.23884391784668, "global_step": 57232, "epoch": 689} {"train_loss": -19.9564266204834, "global_step": 57233, "epoch": 689} {"train_loss": -20.042160034179688, "global_step": 57234, "epoch": 689} {"train_loss": -20.187774658203125, "global_step": 57235, "epoch": 689} {"train_loss": -19.98050308227539, "global_step": 57236, "epoch": 689} {"train_loss": -19.817855834960938, "global_step": 57237, "epoch": 689} {"train_loss": -20.268674850463867, "global_step": 57238, "epoch": 689} {"train_loss": -20.114633560180664, "global_step": 57239, "epoch": 689} {"train_loss": -20.264413833618164, "global_step": 57240, "epoch": 689} {"train_loss": -20.002269744873047, "global_step": 57241, "epoch": 689} {"train_loss": -20.361440658569336, "global_step": 57242, "epoch": 689} {"train_loss": -20.400005340576172, "global_step": 57243, "epoch": 689} {"train_loss": -20.06878662109375, "global_step": 57244, "epoch": 689} {"train_loss": -20.169828414916992, "global_step": 57245, "epoch": 689} {"train_loss": -19.8602237701416, "global_step": 57246, "epoch": 689} {"train_loss": -20.2911376953125, "global_step": 57247, "epoch": 689} {"train_loss": -20.256282806396484, "global_step": 57248, "epoch": 689} {"train_loss": -20.00636100769043, "global_step": 57249, "epoch": 689} {"train_loss": -20.685102462768555, "global_step": 57250, "epoch": 689} {"train_loss": -20.57917022705078, "global_step": 57251, "epoch": 689} {"train_loss": -20.295482635498047, "global_step": 57252, "epoch": 689} {"train_loss": -19.9948673248291, "global_step": 57253, "epoch": 689} {"train_loss": -20.0799617767334, "global_step": 57254, "epoch": 689} {"train_loss": -20.305362701416016, "global_step": 57255, "epoch": 689} {"train_loss": -19.99810791015625, "global_step": 57256, "epoch": 689} {"train_loss": -20.382190704345703, "global_step": 57257, "epoch": 689} {"train_loss": -20.616735458374023, "global_step": 57258, "epoch": 689} {"train_loss": -20.08675193786621, "global_step": 57259, "epoch": 689} {"train_loss": -20.33389663696289, "global_step": 57260, "epoch": 689} {"train_loss": -20.238550186157227, "global_step": 57261, "epoch": 689} {"train_loss": -20.4270076751709, "global_step": 57262, "epoch": 689} {"train_loss": -20.044498443603516, "global_step": 57263, "epoch": 689} {"train_loss": -20.41542625427246, "global_step": 57264, "epoch": 689} {"train_loss": -20.46430015563965, "global_step": 57265, "epoch": 689} {"train_loss": -20.1015567779541, "global_step": 57266, "epoch": 689} {"train_loss": -20.364002227783203, "global_step": 57267, "epoch": 689} {"train_loss": -20.284902572631836, "global_step": 57268, "epoch": 689} {"train_loss": -20.216436661869647, "global_step": 57269, "epoch": 689, "val_loss": 5977869.5} {"train_loss": -19.9256649017334, "global_step": 57270, "epoch": 690} {"train_loss": -20.497629165649414, "global_step": 57271, "epoch": 690} {"train_loss": -20.13825035095215, "global_step": 57272, "epoch": 690} {"train_loss": -20.085453033447266, "global_step": 57273, "epoch": 690} {"train_loss": -20.133996963500977, "global_step": 57274, "epoch": 690} {"train_loss": -19.988739013671875, "global_step": 57275, "epoch": 690} {"train_loss": -20.172683715820312, "global_step": 57276, "epoch": 690} {"train_loss": -20.102903366088867, "global_step": 57277, "epoch": 690} {"train_loss": -20.371612548828125, "global_step": 57278, "epoch": 690} {"train_loss": -20.19580078125, "global_step": 57279, "epoch": 690} {"train_loss": -20.041383743286133, "global_step": 57280, "epoch": 690} {"train_loss": -20.20991325378418, "global_step": 57281, "epoch": 690} {"train_loss": -19.900354385375977, "global_step": 57282, "epoch": 690} {"train_loss": -20.098743438720703, "global_step": 57283, "epoch": 690} {"train_loss": -20.296606063842773, "global_step": 57284, "epoch": 690} {"train_loss": -20.01839256286621, "global_step": 57285, "epoch": 690} {"train_loss": -20.313068389892578, "global_step": 57286, "epoch": 690} {"train_loss": -20.252653121948242, "global_step": 57287, "epoch": 690} {"train_loss": -19.89687156677246, "global_step": 57288, "epoch": 690} {"train_loss": -20.408735275268555, "global_step": 57289, "epoch": 690} {"train_loss": -20.768138885498047, "global_step": 57290, "epoch": 690} {"train_loss": -20.386247634887695, "global_step": 57291, "epoch": 690} {"train_loss": -20.27720832824707, "global_step": 57292, "epoch": 690} {"train_loss": -20.549989700317383, "global_step": 57293, "epoch": 690} {"train_loss": -20.168079376220703, "global_step": 57294, "epoch": 690} {"train_loss": -20.27070426940918, "global_step": 57295, "epoch": 690} {"train_loss": -19.999568939208984, "global_step": 57296, "epoch": 690} {"train_loss": -20.278982162475586, "global_step": 57297, "epoch": 690} {"train_loss": -20.356327056884766, "global_step": 57298, "epoch": 690} {"train_loss": -20.430662155151367, "global_step": 57299, "epoch": 690} {"train_loss": -20.222976684570312, "global_step": 57300, "epoch": 690} {"train_loss": -20.156986236572266, "global_step": 57301, "epoch": 690} {"train_loss": -20.24958610534668, "global_step": 57302, "epoch": 690} {"train_loss": -20.178672790527344, "global_step": 57303, "epoch": 690} {"train_loss": -20.16798210144043, "global_step": 57304, "epoch": 690} {"train_loss": -20.567623138427734, "global_step": 57305, "epoch": 690} {"train_loss": -20.128398895263672, "global_step": 57306, "epoch": 690} {"train_loss": -20.389469146728516, "global_step": 57307, "epoch": 690} {"train_loss": -20.162290573120117, "global_step": 57308, "epoch": 690} {"train_loss": -20.2598876953125, "global_step": 57309, "epoch": 690} {"train_loss": -20.287282943725586, "global_step": 57310, "epoch": 690} {"train_loss": -20.484378814697266, "global_step": 57311, "epoch": 690} {"train_loss": -20.408660888671875, "global_step": 57312, "epoch": 690} {"train_loss": -20.587379455566406, "global_step": 57313, "epoch": 690} {"train_loss": -20.689598083496094, "global_step": 57314, "epoch": 690} {"train_loss": -20.291837692260742, "global_step": 57315, "epoch": 690} {"train_loss": -20.55702781677246, "global_step": 57316, "epoch": 690} {"train_loss": -20.487241744995117, "global_step": 57317, "epoch": 690} {"train_loss": -20.512649536132812, "global_step": 57318, "epoch": 690} {"train_loss": -20.37552833557129, "global_step": 57319, "epoch": 690} {"train_loss": -20.584796905517578, "global_step": 57320, "epoch": 690} {"train_loss": -20.339414596557617, "global_step": 57321, "epoch": 690} {"train_loss": -20.13408851623535, "global_step": 57322, "epoch": 690} {"train_loss": -20.26222038269043, "global_step": 57323, "epoch": 690} {"train_loss": -20.617145538330078, "global_step": 57324, "epoch": 690} {"train_loss": -20.720932006835938, "global_step": 57325, "epoch": 690} {"train_loss": -20.068044662475586, "global_step": 57326, "epoch": 690} {"train_loss": -20.337913513183594, "global_step": 57327, "epoch": 690} {"train_loss": -20.08973503112793, "global_step": 57328, "epoch": 690} {"train_loss": -20.108043670654297, "global_step": 57329, "epoch": 690} {"train_loss": -19.835107803344727, "global_step": 57330, "epoch": 690} {"train_loss": -20.19808578491211, "global_step": 57331, "epoch": 690} {"train_loss": -20.041784286499023, "global_step": 57332, "epoch": 690} {"train_loss": -19.930755615234375, "global_step": 57333, "epoch": 690} {"train_loss": -20.314674377441406, "global_step": 57334, "epoch": 690} {"train_loss": -19.917776107788086, "global_step": 57335, "epoch": 690} {"train_loss": -20.3747501373291, "global_step": 57336, "epoch": 690} {"train_loss": -20.113000869750977, "global_step": 57337, "epoch": 690} {"train_loss": -20.238935470581055, "global_step": 57338, "epoch": 690} {"train_loss": -20.049253463745117, "global_step": 57339, "epoch": 690} {"train_loss": -19.995107650756836, "global_step": 57340, "epoch": 690} {"train_loss": -20.361927032470703, "global_step": 57341, "epoch": 690} {"train_loss": -20.458066940307617, "global_step": 57342, "epoch": 690} {"train_loss": -20.323837280273438, "global_step": 57343, "epoch": 690} {"train_loss": -20.030668258666992, "global_step": 57344, "epoch": 690} {"train_loss": -20.162132263183594, "global_step": 57345, "epoch": 690} {"train_loss": -19.99176788330078, "global_step": 57346, "epoch": 690} {"train_loss": -20.25578498840332, "global_step": 57347, "epoch": 690} {"train_loss": -20.287784576416016, "global_step": 57348, "epoch": 690} {"train_loss": -20.220508575439453, "global_step": 57349, "epoch": 690} {"train_loss": -20.327823638916016, "global_step": 57350, "epoch": 690} {"train_loss": -19.979028701782227, "global_step": 57351, "epoch": 690} {"train_loss": -20.241784428975667, "global_step": 57352, "epoch": 690, "val_loss": 5973040.0} {"train_loss": -20.103513717651367, "global_step": 57353, "epoch": 691} {"train_loss": -20.20018196105957, "global_step": 57354, "epoch": 691} {"train_loss": -20.688941955566406, "global_step": 57355, "epoch": 691} {"train_loss": -20.245153427124023, "global_step": 57356, "epoch": 691} {"train_loss": -20.254941940307617, "global_step": 57357, "epoch": 691} {"train_loss": -20.238086700439453, "global_step": 57358, "epoch": 691} {"train_loss": -20.314199447631836, "global_step": 57359, "epoch": 691} {"train_loss": -20.253662109375, "global_step": 57360, "epoch": 691} {"train_loss": -20.293502807617188, "global_step": 57361, "epoch": 691} {"train_loss": -20.55513572692871, "global_step": 57362, "epoch": 691} {"train_loss": -20.096113204956055, "global_step": 57363, "epoch": 691} {"train_loss": -20.163732528686523, "global_step": 57364, "epoch": 691} {"train_loss": -20.161832809448242, "global_step": 57365, "epoch": 691} {"train_loss": -20.291231155395508, "global_step": 57366, "epoch": 691} {"train_loss": -19.79319190979004, "global_step": 57367, "epoch": 691} {"train_loss": -20.257938385009766, "global_step": 57368, "epoch": 691} {"train_loss": -20.226821899414062, "global_step": 57369, "epoch": 691} {"train_loss": -20.1612606048584, "global_step": 57370, "epoch": 691} {"train_loss": -20.36444664001465, "global_step": 57371, "epoch": 691} {"train_loss": -20.113882064819336, "global_step": 57372, "epoch": 691} {"train_loss": -20.723526000976562, "global_step": 57373, "epoch": 691} {"train_loss": -20.133493423461914, "global_step": 57374, "epoch": 691} {"train_loss": -20.526628494262695, "global_step": 57375, "epoch": 691} {"train_loss": -20.339441299438477, "global_step": 57376, "epoch": 691} {"train_loss": -20.29336166381836, "global_step": 57377, "epoch": 691} {"train_loss": -20.10218620300293, "global_step": 57378, "epoch": 691} {"train_loss": -20.665420532226562, "global_step": 57379, "epoch": 691} {"train_loss": -19.588926315307617, "global_step": 57380, "epoch": 691} {"train_loss": -20.142929077148438, "global_step": 57381, "epoch": 691} {"train_loss": -20.50865364074707, "global_step": 57382, "epoch": 691} {"train_loss": -20.668516159057617, "global_step": 57383, "epoch": 691} {"train_loss": -20.159276962280273, "global_step": 57384, "epoch": 691} {"train_loss": -20.180883407592773, "global_step": 57385, "epoch": 691} {"train_loss": -20.635555267333984, "global_step": 57386, "epoch": 691} {"train_loss": -20.30696678161621, "global_step": 57387, "epoch": 691} {"train_loss": -20.58221435546875, "global_step": 57388, "epoch": 691} {"train_loss": -20.123382568359375, "global_step": 57389, "epoch": 691} {"train_loss": -19.982891082763672, "global_step": 57390, "epoch": 691} {"train_loss": -20.393999099731445, "global_step": 57391, "epoch": 691} {"train_loss": -20.09463119506836, "global_step": 57392, "epoch": 691} {"train_loss": -20.501340866088867, "global_step": 57393, "epoch": 691} {"train_loss": -20.11017417907715, "global_step": 57394, "epoch": 691} {"train_loss": -20.217660903930664, "global_step": 57395, "epoch": 691} {"train_loss": -20.549930572509766, "global_step": 57396, "epoch": 691} {"train_loss": -19.848508834838867, "global_step": 57397, "epoch": 691} {"train_loss": -20.261886596679688, "global_step": 57398, "epoch": 691} {"train_loss": -20.292978286743164, "global_step": 57399, "epoch": 691} {"train_loss": -20.191123962402344, "global_step": 57400, "epoch": 691} {"train_loss": -20.202362060546875, "global_step": 57401, "epoch": 691} {"train_loss": -20.54326820373535, "global_step": 57402, "epoch": 691} {"train_loss": -20.123491287231445, "global_step": 57403, "epoch": 691} {"train_loss": -20.0526123046875, "global_step": 57404, "epoch": 691} {"train_loss": -20.220264434814453, "global_step": 57405, "epoch": 691} {"train_loss": -20.30853843688965, "global_step": 57406, "epoch": 691} {"train_loss": -20.614276885986328, "global_step": 57407, "epoch": 691} {"train_loss": -20.19829750061035, "global_step": 57408, "epoch": 691} {"train_loss": -20.65171241760254, "global_step": 57409, "epoch": 691} {"train_loss": -20.145414352416992, "global_step": 57410, "epoch": 691} {"train_loss": -20.431604385375977, "global_step": 57411, "epoch": 691} {"train_loss": -20.467018127441406, "global_step": 57412, "epoch": 691} {"train_loss": -20.022476196289062, "global_step": 57413, "epoch": 691} {"train_loss": -20.460683822631836, "global_step": 57414, "epoch": 691} {"train_loss": -19.95271873474121, "global_step": 57415, "epoch": 691} {"train_loss": -19.96080780029297, "global_step": 57416, "epoch": 691} {"train_loss": -20.711210250854492, "global_step": 57417, "epoch": 691} {"train_loss": -20.251981735229492, "global_step": 57418, "epoch": 691} {"train_loss": -20.071990966796875, "global_step": 57419, "epoch": 691} {"train_loss": -20.017507553100586, "global_step": 57420, "epoch": 691} {"train_loss": -20.537738800048828, "global_step": 57421, "epoch": 691} {"train_loss": -20.443843841552734, "global_step": 57422, "epoch": 691} {"train_loss": -20.013519287109375, "global_step": 57423, "epoch": 691} {"train_loss": -20.105512619018555, "global_step": 57424, "epoch": 691} {"train_loss": -19.972370147705078, "global_step": 57425, "epoch": 691} {"train_loss": -20.328397750854492, "global_step": 57426, "epoch": 691} {"train_loss": -20.116430282592773, "global_step": 57427, "epoch": 691} {"train_loss": -20.165502548217773, "global_step": 57428, "epoch": 691} {"train_loss": -20.437482833862305, "global_step": 57429, "epoch": 691} {"train_loss": -20.40473747253418, "global_step": 57430, "epoch": 691} {"train_loss": -20.264480590820312, "global_step": 57431, "epoch": 691} {"train_loss": -20.553302764892578, "global_step": 57432, "epoch": 691} {"train_loss": -20.26790428161621, "global_step": 57433, "epoch": 691} {"train_loss": -19.83368492126465, "global_step": 57434, "epoch": 691} {"train_loss": -20.272339119968645, "global_step": 57435, "epoch": 691, "val_loss": 6017163.5} {"train_loss": -19.635522842407227, "global_step": 57436, "epoch": 692} {"train_loss": -19.978958129882812, "global_step": 57437, "epoch": 692} {"train_loss": -20.186155319213867, "global_step": 57438, "epoch": 692} {"train_loss": -19.816186904907227, "global_step": 57439, "epoch": 692} {"train_loss": -19.858671188354492, "global_step": 57440, "epoch": 692} {"train_loss": -20.410062789916992, "global_step": 57441, "epoch": 692} {"train_loss": -19.834407806396484, "global_step": 57442, "epoch": 692} {"train_loss": -19.95407485961914, "global_step": 57443, "epoch": 692} {"train_loss": -20.135507583618164, "global_step": 57444, "epoch": 692} {"train_loss": -20.107290267944336, "global_step": 57445, "epoch": 692} {"train_loss": -20.32752799987793, "global_step": 57446, "epoch": 692} {"train_loss": -19.975210189819336, "global_step": 57447, "epoch": 692} {"train_loss": -20.212797164916992, "global_step": 57448, "epoch": 692} {"train_loss": -19.99757194519043, "global_step": 57449, "epoch": 692} {"train_loss": -20.40174674987793, "global_step": 57450, "epoch": 692} {"train_loss": -20.16848373413086, "global_step": 57451, "epoch": 692} {"train_loss": -20.214460372924805, "global_step": 57452, "epoch": 692} {"train_loss": -20.165517807006836, "global_step": 57453, "epoch": 692} {"train_loss": -20.109277725219727, "global_step": 57454, "epoch": 692} {"train_loss": -20.462665557861328, "global_step": 57455, "epoch": 692} {"train_loss": -20.066280364990234, "global_step": 57456, "epoch": 692} {"train_loss": -20.345306396484375, "global_step": 57457, "epoch": 692} {"train_loss": -20.19077491760254, "global_step": 57458, "epoch": 692} {"train_loss": -20.30039405822754, "global_step": 57459, "epoch": 692} {"train_loss": -20.358322143554688, "global_step": 57460, "epoch": 692} {"train_loss": -20.259782791137695, "global_step": 57461, "epoch": 692} {"train_loss": -20.147123336791992, "global_step": 57462, "epoch": 692} {"train_loss": -20.11421775817871, "global_step": 57463, "epoch": 692} {"train_loss": -19.954519271850586, "global_step": 57464, "epoch": 692} {"train_loss": -20.132455825805664, "global_step": 57465, "epoch": 692} {"train_loss": -20.458242416381836, "global_step": 57466, "epoch": 692} {"train_loss": -20.211347579956055, "global_step": 57467, "epoch": 692} {"train_loss": -20.17665672302246, "global_step": 57468, "epoch": 692} {"train_loss": -20.43265724182129, "global_step": 57469, "epoch": 692} {"train_loss": -19.956050872802734, "global_step": 57470, "epoch": 692} {"train_loss": -20.16854476928711, "global_step": 57471, "epoch": 692} {"train_loss": -20.16365623474121, "global_step": 57472, "epoch": 692} {"train_loss": -20.7186222076416, "global_step": 57473, "epoch": 692} {"train_loss": -19.896276473999023, "global_step": 57474, "epoch": 692} {"train_loss": -20.731840133666992, "global_step": 57475, "epoch": 692} {"train_loss": -20.554367065429688, "global_step": 57476, "epoch": 692} {"train_loss": -20.020544052124023, "global_step": 57477, "epoch": 692} {"train_loss": -20.61273765563965, "global_step": 57478, "epoch": 692} {"train_loss": -20.728221893310547, "global_step": 57479, "epoch": 692} {"train_loss": -20.268831253051758, "global_step": 57480, "epoch": 692} {"train_loss": -20.40943717956543, "global_step": 57481, "epoch": 692} {"train_loss": -20.03521156311035, "global_step": 57482, "epoch": 692} {"train_loss": -20.253311157226562, "global_step": 57483, "epoch": 692} {"train_loss": -20.341344833374023, "global_step": 57484, "epoch": 692} {"train_loss": -20.322935104370117, "global_step": 57485, "epoch": 692} {"train_loss": -20.22955322265625, "global_step": 57486, "epoch": 692} {"train_loss": -20.145017623901367, "global_step": 57487, "epoch": 692} {"train_loss": -20.315109252929688, "global_step": 57488, "epoch": 692} {"train_loss": -20.209060668945312, "global_step": 57489, "epoch": 692} {"train_loss": -20.677289962768555, "global_step": 57490, "epoch": 692} {"train_loss": -19.852869033813477, "global_step": 57491, "epoch": 692} {"train_loss": -20.252273559570312, "global_step": 57492, "epoch": 692} {"train_loss": -20.242948532104492, "global_step": 57493, "epoch": 692} {"train_loss": -20.30426597595215, "global_step": 57494, "epoch": 692} {"train_loss": -20.13739013671875, "global_step": 57495, "epoch": 692} {"train_loss": -20.4679012298584, "global_step": 57496, "epoch": 692} {"train_loss": -20.26874351501465, "global_step": 57497, "epoch": 692} {"train_loss": -20.384183883666992, "global_step": 57498, "epoch": 692} {"train_loss": -20.49583625793457, "global_step": 57499, "epoch": 692} {"train_loss": -20.12755012512207, "global_step": 57500, "epoch": 692} {"train_loss": -20.186485290527344, "global_step": 57501, "epoch": 692} {"train_loss": -20.524429321289062, "global_step": 57502, "epoch": 692} {"train_loss": -20.066015243530273, "global_step": 57503, "epoch": 692} {"train_loss": -19.982816696166992, "global_step": 57504, "epoch": 692} {"train_loss": -20.326711654663086, "global_step": 57505, "epoch": 692} {"train_loss": -20.664098739624023, "global_step": 57506, "epoch": 692} {"train_loss": -20.224334716796875, "global_step": 57507, "epoch": 692} {"train_loss": -20.379941940307617, "global_step": 57508, "epoch": 692} {"train_loss": -20.607328414916992, "global_step": 57509, "epoch": 692} {"train_loss": -20.19061851501465, "global_step": 57510, "epoch": 692} {"train_loss": -20.319650650024414, "global_step": 57511, "epoch": 692} {"train_loss": -20.276185989379883, "global_step": 57512, "epoch": 692} {"train_loss": -20.253931045532227, "global_step": 57513, "epoch": 692} {"train_loss": -20.212778091430664, "global_step": 57514, "epoch": 692} {"train_loss": -20.46677589416504, "global_step": 57515, "epoch": 692} {"train_loss": -20.245988845825195, "global_step": 57516, "epoch": 692} {"train_loss": -20.23878288269043, "global_step": 57517, "epoch": 692} {"train_loss": -20.235225585569818, "global_step": 57518, "epoch": 692, "val_loss": 6116236.0} {"train_loss": -19.47481918334961, "global_step": 57519, "epoch": 693} {"train_loss": -20.094968795776367, "global_step": 57520, "epoch": 693} {"train_loss": -20.224212646484375, "global_step": 57521, "epoch": 693} {"train_loss": -19.922399520874023, "global_step": 57522, "epoch": 693} {"train_loss": -19.839033126831055, "global_step": 57523, "epoch": 693} {"train_loss": -19.99799346923828, "global_step": 57524, "epoch": 693} {"train_loss": -19.844213485717773, "global_step": 57525, "epoch": 693} {"train_loss": -19.850698471069336, "global_step": 57526, "epoch": 693} {"train_loss": -20.0798282623291, "global_step": 57527, "epoch": 693} {"train_loss": -19.9881591796875, "global_step": 57528, "epoch": 693} {"train_loss": -20.35157585144043, "global_step": 57529, "epoch": 693} {"train_loss": -20.066055297851562, "global_step": 57530, "epoch": 693} {"train_loss": -19.931188583374023, "global_step": 57531, "epoch": 693} {"train_loss": -20.29721450805664, "global_step": 57532, "epoch": 693} {"train_loss": -19.99152183532715, "global_step": 57533, "epoch": 693} {"train_loss": -19.760990142822266, "global_step": 57534, "epoch": 693} {"train_loss": -20.10743522644043, "global_step": 57535, "epoch": 693} {"train_loss": -20.150867462158203, "global_step": 57536, "epoch": 693} {"train_loss": -19.666955947875977, "global_step": 57537, "epoch": 693} {"train_loss": -20.3477725982666, "global_step": 57538, "epoch": 693} {"train_loss": -20.618314743041992, "global_step": 57539, "epoch": 693} {"train_loss": -20.037580490112305, "global_step": 57540, "epoch": 693} {"train_loss": -20.101919174194336, "global_step": 57541, "epoch": 693} {"train_loss": -20.23421287536621, "global_step": 57542, "epoch": 693} {"train_loss": -19.832616806030273, "global_step": 57543, "epoch": 693} {"train_loss": -20.58405113220215, "global_step": 57544, "epoch": 693} {"train_loss": -19.98011589050293, "global_step": 57545, "epoch": 693} {"train_loss": -20.449979782104492, "global_step": 57546, "epoch": 693} {"train_loss": -20.25998878479004, "global_step": 57547, "epoch": 693} {"train_loss": -20.06806182861328, "global_step": 57548, "epoch": 693} {"train_loss": -20.625761032104492, "global_step": 57549, "epoch": 693} {"train_loss": -20.518291473388672, "global_step": 57550, "epoch": 693} {"train_loss": -20.020444869995117, "global_step": 57551, "epoch": 693} {"train_loss": -20.21308135986328, "global_step": 57552, "epoch": 693} {"train_loss": -20.354833602905273, "global_step": 57553, "epoch": 693} {"train_loss": -20.262258529663086, "global_step": 57554, "epoch": 693} {"train_loss": -20.40741539001465, "global_step": 57555, "epoch": 693} {"train_loss": -20.25611686706543, "global_step": 57556, "epoch": 693} {"train_loss": -20.165740966796875, "global_step": 57557, "epoch": 693} {"train_loss": -20.069564819335938, "global_step": 57558, "epoch": 693} {"train_loss": -20.584758758544922, "global_step": 57559, "epoch": 693} {"train_loss": -20.33301544189453, "global_step": 57560, "epoch": 693} {"train_loss": -20.394773483276367, "global_step": 57561, "epoch": 693} {"train_loss": -20.344724655151367, "global_step": 57562, "epoch": 693} {"train_loss": -19.9877986907959, "global_step": 57563, "epoch": 693} {"train_loss": -20.27423095703125, "global_step": 57564, "epoch": 693} {"train_loss": -20.070104598999023, "global_step": 57565, "epoch": 693} {"train_loss": -20.192720413208008, "global_step": 57566, "epoch": 693} {"train_loss": -20.11246681213379, "global_step": 57567, "epoch": 693} {"train_loss": -20.43279457092285, "global_step": 57568, "epoch": 693} {"train_loss": -20.273679733276367, "global_step": 57569, "epoch": 693} {"train_loss": -20.298553466796875, "global_step": 57570, "epoch": 693} {"train_loss": -20.26080322265625, "global_step": 57571, "epoch": 693} {"train_loss": -20.161834716796875, "global_step": 57572, "epoch": 693} {"train_loss": -20.458181381225586, "global_step": 57573, "epoch": 693} {"train_loss": -20.79343032836914, "global_step": 57574, "epoch": 693} {"train_loss": -20.240596771240234, "global_step": 57575, "epoch": 693} {"train_loss": -20.207124710083008, "global_step": 57576, "epoch": 693} {"train_loss": -20.26679229736328, "global_step": 57577, "epoch": 693} {"train_loss": -20.564058303833008, "global_step": 57578, "epoch": 693} {"train_loss": -20.405303955078125, "global_step": 57579, "epoch": 693} {"train_loss": -20.216293334960938, "global_step": 57580, "epoch": 693} {"train_loss": -20.07122230529785, "global_step": 57581, "epoch": 693} {"train_loss": -20.30071449279785, "global_step": 57582, "epoch": 693} {"train_loss": -20.1870174407959, "global_step": 57583, "epoch": 693} {"train_loss": -20.451616287231445, "global_step": 57584, "epoch": 693} {"train_loss": -19.833322525024414, "global_step": 57585, "epoch": 693} {"train_loss": -20.21619987487793, "global_step": 57586, "epoch": 693} {"train_loss": -20.540002822875977, "global_step": 57587, "epoch": 693} {"train_loss": -20.345354080200195, "global_step": 57588, "epoch": 693} {"train_loss": -20.493375778198242, "global_step": 57589, "epoch": 693} {"train_loss": -20.578041076660156, "global_step": 57590, "epoch": 693} {"train_loss": -20.667224884033203, "global_step": 57591, "epoch": 693} {"train_loss": -20.36820411682129, "global_step": 57592, "epoch": 693} {"train_loss": -20.41826057434082, "global_step": 57593, "epoch": 693} {"train_loss": -20.514041900634766, "global_step": 57594, "epoch": 693} {"train_loss": -19.787948608398438, "global_step": 57595, "epoch": 693} {"train_loss": -20.45814323425293, "global_step": 57596, "epoch": 693} {"train_loss": -20.360078811645508, "global_step": 57597, "epoch": 693} {"train_loss": -20.180875778198242, "global_step": 57598, "epoch": 693} {"train_loss": -20.560461044311523, "global_step": 57599, "epoch": 693} {"train_loss": -20.08005142211914, "global_step": 57600, "epoch": 693} {"train_loss": -20.22131274119917, "global_step": 57601, "epoch": 693, "val_loss": 6008431.0} {"train_loss": -20.080829620361328, "global_step": 57602, "epoch": 694} {"train_loss": -20.382604598999023, "global_step": 57603, "epoch": 694} {"train_loss": -19.998746871948242, "global_step": 57604, "epoch": 694} {"train_loss": -19.948209762573242, "global_step": 57605, "epoch": 694} {"train_loss": -20.123197555541992, "global_step": 57606, "epoch": 694} {"train_loss": -20.164121627807617, "global_step": 57607, "epoch": 694} {"train_loss": -20.343765258789062, "global_step": 57608, "epoch": 694} {"train_loss": -20.192489624023438, "global_step": 57609, "epoch": 694} {"train_loss": -20.41257667541504, "global_step": 57610, "epoch": 694} {"train_loss": -20.281644821166992, "global_step": 57611, "epoch": 694} {"train_loss": -20.16599464416504, "global_step": 57612, "epoch": 694} {"train_loss": -20.409696578979492, "global_step": 57613, "epoch": 694} {"train_loss": -20.189594268798828, "global_step": 57614, "epoch": 694} {"train_loss": -20.142805099487305, "global_step": 57615, "epoch": 694} {"train_loss": -20.28798484802246, "global_step": 57616, "epoch": 694} {"train_loss": -20.710927963256836, "global_step": 57617, "epoch": 694} {"train_loss": -20.128942489624023, "global_step": 57618, "epoch": 694} {"train_loss": -20.34000587463379, "global_step": 57619, "epoch": 694} {"train_loss": -20.32694435119629, "global_step": 57620, "epoch": 694} {"train_loss": -20.20166778564453, "global_step": 57621, "epoch": 694} {"train_loss": -20.31789207458496, "global_step": 57622, "epoch": 694} {"train_loss": -20.379457473754883, "global_step": 57623, "epoch": 694} {"train_loss": -19.99896812438965, "global_step": 57624, "epoch": 694} {"train_loss": -20.273462295532227, "global_step": 57625, "epoch": 694} {"train_loss": -20.11728858947754, "global_step": 57626, "epoch": 694} {"train_loss": -20.09418296813965, "global_step": 57627, "epoch": 694} {"train_loss": -20.461545944213867, "global_step": 57628, "epoch": 694} {"train_loss": -20.354246139526367, "global_step": 57629, "epoch": 694} {"train_loss": -20.436809539794922, "global_step": 57630, "epoch": 694} {"train_loss": -20.123580932617188, "global_step": 57631, "epoch": 694} {"train_loss": -20.440988540649414, "global_step": 57632, "epoch": 694} {"train_loss": -20.17251968383789, "global_step": 57633, "epoch": 694} {"train_loss": -20.4423885345459, "global_step": 57634, "epoch": 694} {"train_loss": -19.910470962524414, "global_step": 57635, "epoch": 694} {"train_loss": -20.168643951416016, "global_step": 57636, "epoch": 694} {"train_loss": -20.712671279907227, "global_step": 57637, "epoch": 694} {"train_loss": -20.43763542175293, "global_step": 57638, "epoch": 694} {"train_loss": -20.48798942565918, "global_step": 57639, "epoch": 694} {"train_loss": -20.23843765258789, "global_step": 57640, "epoch": 694} {"train_loss": -20.46295738220215, "global_step": 57641, "epoch": 694} {"train_loss": -20.781278610229492, "global_step": 57642, "epoch": 694} {"train_loss": -20.684738159179688, "global_step": 57643, "epoch": 694} {"train_loss": -20.3970947265625, "global_step": 57644, "epoch": 694} {"train_loss": -20.55897331237793, "global_step": 57645, "epoch": 694} {"train_loss": -20.131500244140625, "global_step": 57646, "epoch": 694} {"train_loss": -20.389875411987305, "global_step": 57647, "epoch": 694} {"train_loss": -19.85828399658203, "global_step": 57648, "epoch": 694} {"train_loss": -20.37541389465332, "global_step": 57649, "epoch": 694} {"train_loss": -20.55006217956543, "global_step": 57650, "epoch": 694} {"train_loss": -20.276308059692383, "global_step": 57651, "epoch": 694} {"train_loss": -20.202302932739258, "global_step": 57652, "epoch": 694} {"train_loss": -20.029254913330078, "global_step": 57653, "epoch": 694} {"train_loss": -20.290132522583008, "global_step": 57654, "epoch": 694} {"train_loss": -20.44882583618164, "global_step": 57655, "epoch": 694} {"train_loss": -20.301950454711914, "global_step": 57656, "epoch": 694} {"train_loss": -20.282983779907227, "global_step": 57657, "epoch": 694} {"train_loss": -20.392560958862305, "global_step": 57658, "epoch": 694} {"train_loss": -20.36675453186035, "global_step": 57659, "epoch": 694} {"train_loss": -20.24404525756836, "global_step": 57660, "epoch": 694} {"train_loss": -20.408029556274414, "global_step": 57661, "epoch": 694} {"train_loss": -20.501976013183594, "global_step": 57662, "epoch": 694} {"train_loss": -20.329395294189453, "global_step": 57663, "epoch": 694} {"train_loss": -20.441499710083008, "global_step": 57664, "epoch": 694} {"train_loss": -19.974401473999023, "global_step": 57665, "epoch": 694} {"train_loss": -20.37040138244629, "global_step": 57666, "epoch": 694} {"train_loss": -20.507383346557617, "global_step": 57667, "epoch": 694} {"train_loss": -20.00018882751465, "global_step": 57668, "epoch": 694} {"train_loss": -20.05128288269043, "global_step": 57669, "epoch": 694} {"train_loss": -20.338438034057617, "global_step": 57670, "epoch": 694} {"train_loss": -20.104257583618164, "global_step": 57671, "epoch": 694} {"train_loss": -20.438579559326172, "global_step": 57672, "epoch": 694} {"train_loss": -20.070831298828125, "global_step": 57673, "epoch": 694} {"train_loss": -20.407575607299805, "global_step": 57674, "epoch": 694} {"train_loss": -20.422672271728516, "global_step": 57675, "epoch": 694} {"train_loss": -20.022525787353516, "global_step": 57676, "epoch": 694} {"train_loss": -20.15794563293457, "global_step": 57677, "epoch": 694} {"train_loss": -19.963525772094727, "global_step": 57678, "epoch": 694} {"train_loss": -20.119583129882812, "global_step": 57679, "epoch": 694} {"train_loss": -20.352249145507812, "global_step": 57680, "epoch": 694} {"train_loss": -20.176734924316406, "global_step": 57681, "epoch": 694} {"train_loss": -20.13277244567871, "global_step": 57682, "epoch": 694} {"train_loss": -20.17397117614746, "global_step": 57683, "epoch": 694} {"train_loss": -20.286085657326574, "global_step": 57684, "epoch": 694, "val_loss": 5899167.5} {"train_loss": -19.708860397338867, "global_step": 57685, "epoch": 695} {"train_loss": -20.65687370300293, "global_step": 57686, "epoch": 695} {"train_loss": -19.97222900390625, "global_step": 57687, "epoch": 695} {"train_loss": -19.999786376953125, "global_step": 57688, "epoch": 695} {"train_loss": -19.655797958374023, "global_step": 57689, "epoch": 695} {"train_loss": -20.033802032470703, "global_step": 57690, "epoch": 695} {"train_loss": -19.855764389038086, "global_step": 57691, "epoch": 695} {"train_loss": -20.240333557128906, "global_step": 57692, "epoch": 695} {"train_loss": -20.460424423217773, "global_step": 57693, "epoch": 695} {"train_loss": -20.297475814819336, "global_step": 57694, "epoch": 695} {"train_loss": -20.151941299438477, "global_step": 57695, "epoch": 695} {"train_loss": -20.121566772460938, "global_step": 57696, "epoch": 695} {"train_loss": -20.066308975219727, "global_step": 57697, "epoch": 695} {"train_loss": -20.18061637878418, "global_step": 57698, "epoch": 695} {"train_loss": -20.183408737182617, "global_step": 57699, "epoch": 695} {"train_loss": -20.319677352905273, "global_step": 57700, "epoch": 695} {"train_loss": -20.29903793334961, "global_step": 57701, "epoch": 695} {"train_loss": -20.11054229736328, "global_step": 57702, "epoch": 695} {"train_loss": -20.419286727905273, "global_step": 57703, "epoch": 695} {"train_loss": -20.46388053894043, "global_step": 57704, "epoch": 695} {"train_loss": -20.332700729370117, "global_step": 57705, "epoch": 695} {"train_loss": -20.07102394104004, "global_step": 57706, "epoch": 695} {"train_loss": -20.372907638549805, "global_step": 57707, "epoch": 695} {"train_loss": -20.39154624938965, "global_step": 57708, "epoch": 695} {"train_loss": -20.20552635192871, "global_step": 57709, "epoch": 695} {"train_loss": -19.845617294311523, "global_step": 57710, "epoch": 695} {"train_loss": -20.34493064880371, "global_step": 57711, "epoch": 695} {"train_loss": -20.18439483642578, "global_step": 57712, "epoch": 695} {"train_loss": -20.328245162963867, "global_step": 57713, "epoch": 695} {"train_loss": -19.933712005615234, "global_step": 57714, "epoch": 695} {"train_loss": -19.704320907592773, "global_step": 57715, "epoch": 695} {"train_loss": -20.396984100341797, "global_step": 57716, "epoch": 695} {"train_loss": -20.17549705505371, "global_step": 57717, "epoch": 695} {"train_loss": -20.234403610229492, "global_step": 57718, "epoch": 695} {"train_loss": -20.64046859741211, "global_step": 57719, "epoch": 695} {"train_loss": -20.269983291625977, "global_step": 57720, "epoch": 695} {"train_loss": -20.22621726989746, "global_step": 57721, "epoch": 695} {"train_loss": -20.454633712768555, "global_step": 57722, "epoch": 695} {"train_loss": -20.15971565246582, "global_step": 57723, "epoch": 695} {"train_loss": -20.04890251159668, "global_step": 57724, "epoch": 695} {"train_loss": -20.285139083862305, "global_step": 57725, "epoch": 695} {"train_loss": -19.976083755493164, "global_step": 57726, "epoch": 695} {"train_loss": -20.37790870666504, "global_step": 57727, "epoch": 695} {"train_loss": -20.215518951416016, "global_step": 57728, "epoch": 695} {"train_loss": -20.173120498657227, "global_step": 57729, "epoch": 695} {"train_loss": -20.46006202697754, "global_step": 57730, "epoch": 695} {"train_loss": -20.300498962402344, "global_step": 57731, "epoch": 695} {"train_loss": -20.499313354492188, "global_step": 57732, "epoch": 695} {"train_loss": -19.924230575561523, "global_step": 57733, "epoch": 695} {"train_loss": -20.51677894592285, "global_step": 57734, "epoch": 695} {"train_loss": -20.132951736450195, "global_step": 57735, "epoch": 695} {"train_loss": -20.18916130065918, "global_step": 57736, "epoch": 695} {"train_loss": -20.054677963256836, "global_step": 57737, "epoch": 695} {"train_loss": -20.45418930053711, "global_step": 57738, "epoch": 695} {"train_loss": -20.73811149597168, "global_step": 57739, "epoch": 695} {"train_loss": -20.566747665405273, "global_step": 57740, "epoch": 695} {"train_loss": -20.070165634155273, "global_step": 57741, "epoch": 695} {"train_loss": -20.48952293395996, "global_step": 57742, "epoch": 695} {"train_loss": -20.133756637573242, "global_step": 57743, "epoch": 695} {"train_loss": -20.125471115112305, "global_step": 57744, "epoch": 695} {"train_loss": -20.37689781188965, "global_step": 57745, "epoch": 695} {"train_loss": -20.261362075805664, "global_step": 57746, "epoch": 695} {"train_loss": -20.234594345092773, "global_step": 57747, "epoch": 695} {"train_loss": -20.331832885742188, "global_step": 57748, "epoch": 695} {"train_loss": -20.21175765991211, "global_step": 57749, "epoch": 695} {"train_loss": -20.381723403930664, "global_step": 57750, "epoch": 695} {"train_loss": -20.50592041015625, "global_step": 57751, "epoch": 695} {"train_loss": -20.45147705078125, "global_step": 57752, "epoch": 695} {"train_loss": -19.836637496948242, "global_step": 57753, "epoch": 695} {"train_loss": -20.63072967529297, "global_step": 57754, "epoch": 695} {"train_loss": -20.419952392578125, "global_step": 57755, "epoch": 695} {"train_loss": -20.08430290222168, "global_step": 57756, "epoch": 695} {"train_loss": -20.121265411376953, "global_step": 57757, "epoch": 695} {"train_loss": -19.92255973815918, "global_step": 57758, "epoch": 695} {"train_loss": -20.1065673828125, "global_step": 57759, "epoch": 695} {"train_loss": -20.22319793701172, "global_step": 57760, "epoch": 695} {"train_loss": -20.39678955078125, "global_step": 57761, "epoch": 695} {"train_loss": -20.098604202270508, "global_step": 57762, "epoch": 695} {"train_loss": -20.502622604370117, "global_step": 57763, "epoch": 695} {"train_loss": -20.101348876953125, "global_step": 57764, "epoch": 695} {"train_loss": -20.14436912536621, "global_step": 57765, "epoch": 695} {"train_loss": -20.16626739501953, "global_step": 57766, "epoch": 695} {"train_loss": -20.231748833713763, "global_step": 57767, "epoch": 695, "val_loss": 6039981.5} {"train_loss": -19.917593002319336, "global_step": 57768, "epoch": 696} {"train_loss": -19.697484970092773, "global_step": 57769, "epoch": 696} {"train_loss": -20.109167098999023, "global_step": 57770, "epoch": 696} {"train_loss": -20.141408920288086, "global_step": 57771, "epoch": 696} {"train_loss": -19.89972496032715, "global_step": 57772, "epoch": 696} {"train_loss": -19.612817764282227, "global_step": 57773, "epoch": 696} {"train_loss": -19.75373649597168, "global_step": 57774, "epoch": 696} {"train_loss": -20.29427146911621, "global_step": 57775, "epoch": 696} {"train_loss": -20.376964569091797, "global_step": 57776, "epoch": 696} {"train_loss": -20.42862892150879, "global_step": 57777, "epoch": 696} {"train_loss": -20.06035804748535, "global_step": 57778, "epoch": 696} {"train_loss": -20.258148193359375, "global_step": 57779, "epoch": 696} {"train_loss": -20.11396598815918, "global_step": 57780, "epoch": 696} {"train_loss": -20.3327579498291, "global_step": 57781, "epoch": 696} {"train_loss": -20.338001251220703, "global_step": 57782, "epoch": 696} {"train_loss": -20.858673095703125, "global_step": 57783, "epoch": 696} {"train_loss": -20.445343017578125, "global_step": 57784, "epoch": 696} {"train_loss": -20.13698959350586, "global_step": 57785, "epoch": 696} {"train_loss": -20.418210983276367, "global_step": 57786, "epoch": 696} {"train_loss": -20.43576431274414, "global_step": 57787, "epoch": 696} {"train_loss": -20.324615478515625, "global_step": 57788, "epoch": 696} {"train_loss": -19.866186141967773, "global_step": 57789, "epoch": 696} {"train_loss": -20.04227638244629, "global_step": 57790, "epoch": 696} {"train_loss": -20.581439971923828, "global_step": 57791, "epoch": 696} {"train_loss": -20.343366622924805, "global_step": 57792, "epoch": 696} {"train_loss": -20.137903213500977, "global_step": 57793, "epoch": 696} {"train_loss": -20.271635055541992, "global_step": 57794, "epoch": 696} {"train_loss": -19.82852554321289, "global_step": 57795, "epoch": 696} {"train_loss": -20.0634708404541, "global_step": 57796, "epoch": 696} {"train_loss": -20.378660202026367, "global_step": 57797, "epoch": 696} {"train_loss": -19.970670700073242, "global_step": 57798, "epoch": 696} {"train_loss": -20.170759201049805, "global_step": 57799, "epoch": 696} {"train_loss": -20.2534236907959, "global_step": 57800, "epoch": 696} {"train_loss": -20.50221061706543, "global_step": 57801, "epoch": 696} {"train_loss": -20.440261840820312, "global_step": 57802, "epoch": 696} {"train_loss": -20.095226287841797, "global_step": 57803, "epoch": 696} {"train_loss": -20.72133445739746, "global_step": 57804, "epoch": 696} {"train_loss": -20.015846252441406, "global_step": 57805, "epoch": 696} {"train_loss": -20.545194625854492, "global_step": 57806, "epoch": 696} {"train_loss": -20.059101104736328, "global_step": 57807, "epoch": 696} {"train_loss": -20.248313903808594, "global_step": 57808, "epoch": 696} {"train_loss": -20.32120132446289, "global_step": 57809, "epoch": 696} {"train_loss": -20.004369735717773, "global_step": 57810, "epoch": 696} {"train_loss": -20.566186904907227, "global_step": 57811, "epoch": 696} {"train_loss": -20.181394577026367, "global_step": 57812, "epoch": 696} {"train_loss": -20.504858016967773, "global_step": 57813, "epoch": 696} {"train_loss": -20.257190704345703, "global_step": 57814, "epoch": 696} {"train_loss": -20.449033737182617, "global_step": 57815, "epoch": 696} {"train_loss": -20.095382690429688, "global_step": 57816, "epoch": 696} {"train_loss": -20.346269607543945, "global_step": 57817, "epoch": 696} {"train_loss": -20.501157760620117, "global_step": 57818, "epoch": 696} {"train_loss": -20.440048217773438, "global_step": 57819, "epoch": 696} {"train_loss": -20.464155197143555, "global_step": 57820, "epoch": 696} {"train_loss": -20.37607765197754, "global_step": 57821, "epoch": 696} {"train_loss": -19.932567596435547, "global_step": 57822, "epoch": 696} {"train_loss": -20.36932373046875, "global_step": 57823, "epoch": 696} {"train_loss": -20.149808883666992, "global_step": 57824, "epoch": 696} {"train_loss": -20.323869705200195, "global_step": 57825, "epoch": 696} {"train_loss": -20.285221099853516, "global_step": 57826, "epoch": 696} {"train_loss": -20.22504234313965, "global_step": 57827, "epoch": 696} {"train_loss": -20.47792625427246, "global_step": 57828, "epoch": 696} {"train_loss": -19.968725204467773, "global_step": 57829, "epoch": 696} {"train_loss": -20.27079200744629, "global_step": 57830, "epoch": 696} {"train_loss": -20.314224243164062, "global_step": 57831, "epoch": 696} {"train_loss": -19.830039978027344, "global_step": 57832, "epoch": 696} {"train_loss": -20.138715744018555, "global_step": 57833, "epoch": 696} {"train_loss": -20.288131713867188, "global_step": 57834, "epoch": 696} {"train_loss": -20.000577926635742, "global_step": 57835, "epoch": 696} {"train_loss": -20.181249618530273, "global_step": 57836, "epoch": 696} {"train_loss": -20.15595245361328, "global_step": 57837, "epoch": 696} {"train_loss": -20.664234161376953, "global_step": 57838, "epoch": 696} {"train_loss": -19.936969757080078, "global_step": 57839, "epoch": 696} {"train_loss": -20.109228134155273, "global_step": 57840, "epoch": 696} {"train_loss": -20.104639053344727, "global_step": 57841, "epoch": 696} {"train_loss": -20.27044105529785, "global_step": 57842, "epoch": 696} {"train_loss": -20.171993255615234, "global_step": 57843, "epoch": 696} {"train_loss": -20.226057052612305, "global_step": 57844, "epoch": 696} {"train_loss": -20.484533309936523, "global_step": 57845, "epoch": 696} {"train_loss": -20.334854125976562, "global_step": 57846, "epoch": 696} {"train_loss": -20.32547950744629, "global_step": 57847, "epoch": 696} {"train_loss": -20.579137802124023, "global_step": 57848, "epoch": 696} {"train_loss": -20.634740829467773, "global_step": 57849, "epoch": 696} {"train_loss": -20.25152181142784, "global_step": 57850, "epoch": 696, "val_loss": 6156617.0} {"train_loss": -19.72150993347168, "global_step": 57851, "epoch": 697} {"train_loss": -19.922157287597656, "global_step": 57852, "epoch": 697} {"train_loss": -19.98115348815918, "global_step": 57853, "epoch": 697} {"train_loss": -19.62537956237793, "global_step": 57854, "epoch": 697} {"train_loss": -20.21484375, "global_step": 57855, "epoch": 697} {"train_loss": -20.165008544921875, "global_step": 57856, "epoch": 697} {"train_loss": -20.002042770385742, "global_step": 57857, "epoch": 697} {"train_loss": -20.15668487548828, "global_step": 57858, "epoch": 697} {"train_loss": -20.252660751342773, "global_step": 57859, "epoch": 697} {"train_loss": -19.856496810913086, "global_step": 57860, "epoch": 697} {"train_loss": -20.312057495117188, "global_step": 57861, "epoch": 697} {"train_loss": -19.80525779724121, "global_step": 57862, "epoch": 697} {"train_loss": -20.23402214050293, "global_step": 57863, "epoch": 697} {"train_loss": -20.314411163330078, "global_step": 57864, "epoch": 697} {"train_loss": -20.351648330688477, "global_step": 57865, "epoch": 697} {"train_loss": -20.095829010009766, "global_step": 57866, "epoch": 697} {"train_loss": -20.38068199157715, "global_step": 57867, "epoch": 697} {"train_loss": -20.07981300354004, "global_step": 57868, "epoch": 697} {"train_loss": -20.167184829711914, "global_step": 57869, "epoch": 697} {"train_loss": -20.54597282409668, "global_step": 57870, "epoch": 697} {"train_loss": -20.390905380249023, "global_step": 57871, "epoch": 697} {"train_loss": -20.36653709411621, "global_step": 57872, "epoch": 697} {"train_loss": -19.980085372924805, "global_step": 57873, "epoch": 697} {"train_loss": -20.34693717956543, "global_step": 57874, "epoch": 697} {"train_loss": -20.42342758178711, "global_step": 57875, "epoch": 697} {"train_loss": -20.37004280090332, "global_step": 57876, "epoch": 697} {"train_loss": -20.040790557861328, "global_step": 57877, "epoch": 697} {"train_loss": -20.08698081970215, "global_step": 57878, "epoch": 697} {"train_loss": -20.140867233276367, "global_step": 57879, "epoch": 697} {"train_loss": -20.152250289916992, "global_step": 57880, "epoch": 697} {"train_loss": -19.863916397094727, "global_step": 57881, "epoch": 697} {"train_loss": -20.424457550048828, "global_step": 57882, "epoch": 697} {"train_loss": -20.205081939697266, "global_step": 57883, "epoch": 697} {"train_loss": -20.366056442260742, "global_step": 57884, "epoch": 697} {"train_loss": -20.287818908691406, "global_step": 57885, "epoch": 697} {"train_loss": -20.336881637573242, "global_step": 57886, "epoch": 697} {"train_loss": -20.558401107788086, "global_step": 57887, "epoch": 697} {"train_loss": -20.149616241455078, "global_step": 57888, "epoch": 697} {"train_loss": -20.18173599243164, "global_step": 57889, "epoch": 697} {"train_loss": -20.17274284362793, "global_step": 57890, "epoch": 697} {"train_loss": -20.462385177612305, "global_step": 57891, "epoch": 697} {"train_loss": -20.646730422973633, "global_step": 57892, "epoch": 697} {"train_loss": -20.18743896484375, "global_step": 57893, "epoch": 697} {"train_loss": -20.17887306213379, "global_step": 57894, "epoch": 697} {"train_loss": -20.59743881225586, "global_step": 57895, "epoch": 697} {"train_loss": -20.271814346313477, "global_step": 57896, "epoch": 697} {"train_loss": -20.360036849975586, "global_step": 57897, "epoch": 697} {"train_loss": -20.633028030395508, "global_step": 57898, "epoch": 697} {"train_loss": -20.06211280822754, "global_step": 57899, "epoch": 697} {"train_loss": -20.26375389099121, "global_step": 57900, "epoch": 697} {"train_loss": -20.397634506225586, "global_step": 57901, "epoch": 697} {"train_loss": -20.369977951049805, "global_step": 57902, "epoch": 697} {"train_loss": -20.373876571655273, "global_step": 57903, "epoch": 697} {"train_loss": -20.42106056213379, "global_step": 57904, "epoch": 697} {"train_loss": -20.611196517944336, "global_step": 57905, "epoch": 697} {"train_loss": -20.161623001098633, "global_step": 57906, "epoch": 697} {"train_loss": -20.128782272338867, "global_step": 57907, "epoch": 697} {"train_loss": -20.5253963470459, "global_step": 57908, "epoch": 697} {"train_loss": -20.274839401245117, "global_step": 57909, "epoch": 697} {"train_loss": -20.13071632385254, "global_step": 57910, "epoch": 697} {"train_loss": -20.196958541870117, "global_step": 57911, "epoch": 697} {"train_loss": -20.524490356445312, "global_step": 57912, "epoch": 697} {"train_loss": -20.223552703857422, "global_step": 57913, "epoch": 697} {"train_loss": -19.828632354736328, "global_step": 57914, "epoch": 697} {"train_loss": -20.166709899902344, "global_step": 57915, "epoch": 697} {"train_loss": -20.282201766967773, "global_step": 57916, "epoch": 697} {"train_loss": -20.368408203125, "global_step": 57917, "epoch": 697} {"train_loss": -20.004196166992188, "global_step": 57918, "epoch": 697} {"train_loss": -20.593442916870117, "global_step": 57919, "epoch": 697} {"train_loss": -20.538074493408203, "global_step": 57920, "epoch": 697} {"train_loss": -20.275175094604492, "global_step": 57921, "epoch": 697} {"train_loss": -20.34406852722168, "global_step": 57922, "epoch": 697} {"train_loss": -20.56744956970215, "global_step": 57923, "epoch": 697} {"train_loss": -20.229040145874023, "global_step": 57924, "epoch": 697} {"train_loss": -20.37825584411621, "global_step": 57925, "epoch": 697} {"train_loss": -20.55512046813965, "global_step": 57926, "epoch": 697} {"train_loss": -20.49673080444336, "global_step": 57927, "epoch": 697} {"train_loss": -20.590539932250977, "global_step": 57928, "epoch": 697} {"train_loss": -20.30427360534668, "global_step": 57929, "epoch": 697} {"train_loss": -20.421733856201172, "global_step": 57930, "epoch": 697} {"train_loss": -20.709028244018555, "global_step": 57931, "epoch": 697} {"train_loss": -20.087949752807617, "global_step": 57932, "epoch": 697} {"train_loss": -20.268720213189184, "global_step": 57933, "epoch": 697, "val_loss": 5928841.0} {"train_loss": -19.95444679260254, "global_step": 57934, "epoch": 698} {"train_loss": -19.783151626586914, "global_step": 57935, "epoch": 698} {"train_loss": -20.191144943237305, "global_step": 57936, "epoch": 698} {"train_loss": -19.66745948791504, "global_step": 57937, "epoch": 698} {"train_loss": -19.586767196655273, "global_step": 57938, "epoch": 698} {"train_loss": -19.89802360534668, "global_step": 57939, "epoch": 698} {"train_loss": -19.63009262084961, "global_step": 57940, "epoch": 698} {"train_loss": -19.752771377563477, "global_step": 57941, "epoch": 698} {"train_loss": -20.209129333496094, "global_step": 57942, "epoch": 698} {"train_loss": -20.31062889099121, "global_step": 57943, "epoch": 698} {"train_loss": -20.033376693725586, "global_step": 57944, "epoch": 698} {"train_loss": -20.252517700195312, "global_step": 57945, "epoch": 698} {"train_loss": -20.24738883972168, "global_step": 57946, "epoch": 698} {"train_loss": -20.370189666748047, "global_step": 57947, "epoch": 698} {"train_loss": -20.293432235717773, "global_step": 57948, "epoch": 698} {"train_loss": -19.968008041381836, "global_step": 57949, "epoch": 698} {"train_loss": -20.002477645874023, "global_step": 57950, "epoch": 698} {"train_loss": -20.2907657623291, "global_step": 57951, "epoch": 698} {"train_loss": -20.458572387695312, "global_step": 57952, "epoch": 698} {"train_loss": -20.5562686920166, "global_step": 57953, "epoch": 698} {"train_loss": -20.218017578125, "global_step": 57954, "epoch": 698} {"train_loss": -20.56254768371582, "global_step": 57955, "epoch": 698} {"train_loss": -20.469152450561523, "global_step": 57956, "epoch": 698} {"train_loss": -20.22187614440918, "global_step": 57957, "epoch": 698} {"train_loss": -20.044666290283203, "global_step": 57958, "epoch": 698} {"train_loss": -20.584325790405273, "global_step": 57959, "epoch": 698} {"train_loss": -19.973318099975586, "global_step": 57960, "epoch": 698} {"train_loss": -20.295642852783203, "global_step": 57961, "epoch": 698} {"train_loss": -20.527511596679688, "global_step": 57962, "epoch": 698} {"train_loss": -20.231033325195312, "global_step": 57963, "epoch": 698} {"train_loss": -20.260953903198242, "global_step": 57964, "epoch": 698} {"train_loss": -20.519895553588867, "global_step": 57965, "epoch": 698} {"train_loss": -20.090051651000977, "global_step": 57966, "epoch": 698} {"train_loss": -20.31954002380371, "global_step": 57967, "epoch": 698} {"train_loss": -20.570964813232422, "global_step": 57968, "epoch": 698} {"train_loss": -20.31953239440918, "global_step": 57969, "epoch": 698} {"train_loss": -20.003446578979492, "global_step": 57970, "epoch": 698} {"train_loss": -20.436735153198242, "global_step": 57971, "epoch": 698} {"train_loss": -20.40212631225586, "global_step": 57972, "epoch": 698} {"train_loss": -20.461956024169922, "global_step": 57973, "epoch": 698} {"train_loss": -20.357084274291992, "global_step": 57974, "epoch": 698} {"train_loss": -20.43440055847168, "global_step": 57975, "epoch": 698} {"train_loss": -20.311025619506836, "global_step": 57976, "epoch": 698} {"train_loss": -20.31583595275879, "global_step": 57977, "epoch": 698} {"train_loss": -20.35697364807129, "global_step": 57978, "epoch": 698} {"train_loss": -20.23038101196289, "global_step": 57979, "epoch": 698} {"train_loss": -20.720285415649414, "global_step": 57980, "epoch": 698} {"train_loss": -20.200651168823242, "global_step": 57981, "epoch": 698} {"train_loss": -20.428564071655273, "global_step": 57982, "epoch": 698} {"train_loss": -20.336509704589844, "global_step": 57983, "epoch": 698} {"train_loss": -20.49408531188965, "global_step": 57984, "epoch": 698} {"train_loss": -20.278366088867188, "global_step": 57985, "epoch": 698} {"train_loss": -20.310260772705078, "global_step": 57986, "epoch": 698} {"train_loss": -20.212432861328125, "global_step": 57987, "epoch": 698} {"train_loss": -20.408248901367188, "global_step": 57988, "epoch": 698} {"train_loss": -20.06439781188965, "global_step": 57989, "epoch": 698} {"train_loss": -20.538467407226562, "global_step": 57990, "epoch": 698} {"train_loss": -20.560081481933594, "global_step": 57991, "epoch": 698} {"train_loss": -20.307538986206055, "global_step": 57992, "epoch": 698} {"train_loss": -19.858640670776367, "global_step": 57993, "epoch": 698} {"train_loss": -20.449859619140625, "global_step": 57994, "epoch": 698} {"train_loss": -20.477781295776367, "global_step": 57995, "epoch": 698} {"train_loss": -20.04120445251465, "global_step": 57996, "epoch": 698} {"train_loss": -20.0549373626709, "global_step": 57997, "epoch": 698} {"train_loss": -20.387197494506836, "global_step": 57998, "epoch": 698} {"train_loss": -20.041730880737305, "global_step": 57999, "epoch": 698} {"train_loss": -20.40876579284668, "global_step": 58000, "epoch": 698} {"train_loss": -20.296865463256836, "global_step": 58001, "epoch": 698} {"train_loss": -20.661996841430664, "global_step": 58002, "epoch": 698} {"train_loss": -20.566612243652344, "global_step": 58003, "epoch": 698} {"train_loss": -20.03510856628418, "global_step": 58004, "epoch": 698} {"train_loss": -20.536346435546875, "global_step": 58005, "epoch": 698} {"train_loss": -20.174610137939453, "global_step": 58006, "epoch": 698} {"train_loss": -20.421035766601562, "global_step": 58007, "epoch": 698} {"train_loss": -20.371309280395508, "global_step": 58008, "epoch": 698} {"train_loss": -20.093225479125977, "global_step": 58009, "epoch": 698} {"train_loss": -20.095762252807617, "global_step": 58010, "epoch": 698} {"train_loss": -20.2327823638916, "global_step": 58011, "epoch": 698} {"train_loss": -20.413793563842773, "global_step": 58012, "epoch": 698} {"train_loss": -20.183530807495117, "global_step": 58013, "epoch": 698} {"train_loss": -20.488676071166992, "global_step": 58014, "epoch": 698} {"train_loss": -20.301116943359375, "global_step": 58015, "epoch": 698} {"train_loss": -20.259792810463043, "global_step": 58016, "epoch": 698, "val_loss": 5881859.5} {"train_loss": -19.706769943237305, "global_step": 58017, "epoch": 699} {"train_loss": -20.06788444519043, "global_step": 58018, "epoch": 699} {"train_loss": -19.790332794189453, "global_step": 58019, "epoch": 699} {"train_loss": -19.646276473999023, "global_step": 58020, "epoch": 699} {"train_loss": -19.82781410217285, "global_step": 58021, "epoch": 699} {"train_loss": -19.717493057250977, "global_step": 58022, "epoch": 699} {"train_loss": -19.762420654296875, "global_step": 58023, "epoch": 699} {"train_loss": -19.954803466796875, "global_step": 58024, "epoch": 699} {"train_loss": -20.38076400756836, "global_step": 58025, "epoch": 699} {"train_loss": -19.509790420532227, "global_step": 58026, "epoch": 699} {"train_loss": -19.95172691345215, "global_step": 58027, "epoch": 699} {"train_loss": -19.861478805541992, "global_step": 58028, "epoch": 699} {"train_loss": -19.9997615814209, "global_step": 58029, "epoch": 699} {"train_loss": -19.957090377807617, "global_step": 58030, "epoch": 699} {"train_loss": -19.856719970703125, "global_step": 58031, "epoch": 699} {"train_loss": -20.546236038208008, "global_step": 58032, "epoch": 699} {"train_loss": -20.17378807067871, "global_step": 58033, "epoch": 699} {"train_loss": -20.133033752441406, "global_step": 58034, "epoch": 699} {"train_loss": -20.0352840423584, "global_step": 58035, "epoch": 699} {"train_loss": -20.32122039794922, "global_step": 58036, "epoch": 699} {"train_loss": -20.314922332763672, "global_step": 58037, "epoch": 699} {"train_loss": -20.520732879638672, "global_step": 58038, "epoch": 699} {"train_loss": -20.13741111755371, "global_step": 58039, "epoch": 699} {"train_loss": -20.396562576293945, "global_step": 58040, "epoch": 699} {"train_loss": -20.224700927734375, "global_step": 58041, "epoch": 699} {"train_loss": -20.26153564453125, "global_step": 58042, "epoch": 699} {"train_loss": -20.161054611206055, "global_step": 58043, "epoch": 699} {"train_loss": -19.97110939025879, "global_step": 58044, "epoch": 699} {"train_loss": -20.486968994140625, "global_step": 58045, "epoch": 699} {"train_loss": -20.456235885620117, "global_step": 58046, "epoch": 699} {"train_loss": -20.14156723022461, "global_step": 58047, "epoch": 699} {"train_loss": -20.27479362487793, "global_step": 58048, "epoch": 699} {"train_loss": -20.3502197265625, "global_step": 58049, "epoch": 699} {"train_loss": -19.676008224487305, "global_step": 58050, "epoch": 699} {"train_loss": -20.244722366333008, "global_step": 58051, "epoch": 699} {"train_loss": -20.465351104736328, "global_step": 58052, "epoch": 699} {"train_loss": -20.392942428588867, "global_step": 58053, "epoch": 699} {"train_loss": -19.927345275878906, "global_step": 58054, "epoch": 699} {"train_loss": -20.38918113708496, "global_step": 58055, "epoch": 699} {"train_loss": -20.50342559814453, "global_step": 58056, "epoch": 699} {"train_loss": -20.446117401123047, "global_step": 58057, "epoch": 699} {"train_loss": -20.376876831054688, "global_step": 58058, "epoch": 699} {"train_loss": -20.437456130981445, "global_step": 58059, "epoch": 699} {"train_loss": -20.2728214263916, "global_step": 58060, "epoch": 699} {"train_loss": -20.174734115600586, "global_step": 58061, "epoch": 699} {"train_loss": -20.561798095703125, "global_step": 58062, "epoch": 699} {"train_loss": -20.50935935974121, "global_step": 58063, "epoch": 699} {"train_loss": -20.15449333190918, "global_step": 58064, "epoch": 699} {"train_loss": -20.371824264526367, "global_step": 58065, "epoch": 699} {"train_loss": -20.45006561279297, "global_step": 58066, "epoch": 699} {"train_loss": -20.22812271118164, "global_step": 58067, "epoch": 699} {"train_loss": -20.631153106689453, "global_step": 58068, "epoch": 699} {"train_loss": -20.17386245727539, "global_step": 58069, "epoch": 699} {"train_loss": -20.450212478637695, "global_step": 58070, "epoch": 699} {"train_loss": -20.696943283081055, "global_step": 58071, "epoch": 699} {"train_loss": -20.15555763244629, "global_step": 58072, "epoch": 699} {"train_loss": -20.772472381591797, "global_step": 58073, "epoch": 699} {"train_loss": -20.191984176635742, "global_step": 58074, "epoch": 699} {"train_loss": -20.514949798583984, "global_step": 58075, "epoch": 699} {"train_loss": -20.06076431274414, "global_step": 58076, "epoch": 699} {"train_loss": -20.339393615722656, "global_step": 58077, "epoch": 699} {"train_loss": -20.4337215423584, "global_step": 58078, "epoch": 699} {"train_loss": -20.23353385925293, "global_step": 58079, "epoch": 699} {"train_loss": -20.10605812072754, "global_step": 58080, "epoch": 699} {"train_loss": -20.239620208740234, "global_step": 58081, "epoch": 699} {"train_loss": -20.309341430664062, "global_step": 58082, "epoch": 699} {"train_loss": -21.03858757019043, "global_step": 58083, "epoch": 699} {"train_loss": -20.441614151000977, "global_step": 58084, "epoch": 699} {"train_loss": -20.222118377685547, "global_step": 58085, "epoch": 699} {"train_loss": -19.700899124145508, "global_step": 58086, "epoch": 699} {"train_loss": -20.846532821655273, "global_step": 58087, "epoch": 699} {"train_loss": -20.298919677734375, "global_step": 58088, "epoch": 699} {"train_loss": -20.066869735717773, "global_step": 58089, "epoch": 699} {"train_loss": -20.20473289489746, "global_step": 58090, "epoch": 699} {"train_loss": -20.300594329833984, "global_step": 58091, "epoch": 699} {"train_loss": -19.640478134155273, "global_step": 58092, "epoch": 699} {"train_loss": -20.08587074279785, "global_step": 58093, "epoch": 699} {"train_loss": -20.14522933959961, "global_step": 58094, "epoch": 699} {"train_loss": -20.389612197875977, "global_step": 58095, "epoch": 699} {"train_loss": -20.075260162353516, "global_step": 58096, "epoch": 699} {"train_loss": -20.13037109375, "global_step": 58097, "epoch": 699} {"train_loss": -20.22410011291504, "global_step": 58098, "epoch": 699} {"train_loss": -20.20225051512201, "global_step": 58099, "epoch": 699, "val_loss": 5987564.0} {"train_loss": -19.62125587463379, "global_step": 58100, "epoch": 700} {"train_loss": -19.949827194213867, "global_step": 58101, "epoch": 700} {"train_loss": -19.837827682495117, "global_step": 58102, "epoch": 700} {"train_loss": -20.222248077392578, "global_step": 58103, "epoch": 700} {"train_loss": -20.003019332885742, "global_step": 58104, "epoch": 700} {"train_loss": -20.26236915588379, "global_step": 58105, "epoch": 700} {"train_loss": -19.966550827026367, "global_step": 58106, "epoch": 700} {"train_loss": -20.049169540405273, "global_step": 58107, "epoch": 700} {"train_loss": -20.60053825378418, "global_step": 58108, "epoch": 700} {"train_loss": -20.033777236938477, "global_step": 58109, "epoch": 700} {"train_loss": -20.310958862304688, "global_step": 58110, "epoch": 700} {"train_loss": -20.2265682220459, "global_step": 58111, "epoch": 700} {"train_loss": -20.22639274597168, "global_step": 58112, "epoch": 700} {"train_loss": -19.80198097229004, "global_step": 58113, "epoch": 700} {"train_loss": -20.259382247924805, "global_step": 58114, "epoch": 700} {"train_loss": -20.208284378051758, "global_step": 58115, "epoch": 700} {"train_loss": -20.151947021484375, "global_step": 58116, "epoch": 700} {"train_loss": -20.076383590698242, "global_step": 58117, "epoch": 700} {"train_loss": -20.687219619750977, "global_step": 58118, "epoch": 700} {"train_loss": -20.098630905151367, "global_step": 58119, "epoch": 700} {"train_loss": -20.1768741607666, "global_step": 58120, "epoch": 700} {"train_loss": -20.28741455078125, "global_step": 58121, "epoch": 700} {"train_loss": -20.457910537719727, "global_step": 58122, "epoch": 700} {"train_loss": -20.4188289642334, "global_step": 58123, "epoch": 700} {"train_loss": -20.289859771728516, "global_step": 58124, "epoch": 700} {"train_loss": -20.650793075561523, "global_step": 58125, "epoch": 700} {"train_loss": -20.32756996154785, "global_step": 58126, "epoch": 700} {"train_loss": -20.36988639831543, "global_step": 58127, "epoch": 700} {"train_loss": -20.366464614868164, "global_step": 58128, "epoch": 700} {"train_loss": -20.344959259033203, "global_step": 58129, "epoch": 700} {"train_loss": -20.037931442260742, "global_step": 58130, "epoch": 700} {"train_loss": -20.09381103515625, "global_step": 58131, "epoch": 700} {"train_loss": -20.237625122070312, "global_step": 58132, "epoch": 700} {"train_loss": -20.170211791992188, "global_step": 58133, "epoch": 700} {"train_loss": -20.098073959350586, "global_step": 58134, "epoch": 700} {"train_loss": -20.300405502319336, "global_step": 58135, "epoch": 700} {"train_loss": -20.310415267944336, "global_step": 58136, "epoch": 700} {"train_loss": -20.098499298095703, "global_step": 58137, "epoch": 700} {"train_loss": -20.21234130859375, "global_step": 58138, "epoch": 700} {"train_loss": -20.322021484375, "global_step": 58139, "epoch": 700} {"train_loss": -19.824037551879883, "global_step": 58140, "epoch": 700} {"train_loss": -20.417417526245117, "global_step": 58141, "epoch": 700} {"train_loss": -20.491962432861328, "global_step": 58142, "epoch": 700} {"train_loss": -20.344022750854492, "global_step": 58143, "epoch": 700} {"train_loss": -20.463415145874023, "global_step": 58144, "epoch": 700} {"train_loss": -20.301610946655273, "global_step": 58145, "epoch": 700} {"train_loss": -20.464624404907227, "global_step": 58146, "epoch": 700} {"train_loss": -20.27370262145996, "global_step": 58147, "epoch": 700} {"train_loss": -20.32199478149414, "global_step": 58148, "epoch": 700} {"train_loss": -20.64519691467285, "global_step": 58149, "epoch": 700} {"train_loss": -20.22665786743164, "global_step": 58150, "epoch": 700} {"train_loss": -20.632333755493164, "global_step": 58151, "epoch": 700} {"train_loss": -20.178924560546875, "global_step": 58152, "epoch": 700} {"train_loss": -20.53890609741211, "global_step": 58153, "epoch": 700} {"train_loss": -20.451744079589844, "global_step": 58154, "epoch": 700} {"train_loss": -20.298999786376953, "global_step": 58155, "epoch": 700} {"train_loss": -20.51360511779785, "global_step": 58156, "epoch": 700} {"train_loss": -20.619070053100586, "global_step": 58157, "epoch": 700} {"train_loss": -20.18009376525879, "global_step": 58158, "epoch": 700} {"train_loss": -20.34056854248047, "global_step": 58159, "epoch": 700} {"train_loss": -20.516536712646484, "global_step": 58160, "epoch": 700} {"train_loss": -20.479276657104492, "global_step": 58161, "epoch": 700} {"train_loss": -19.874454498291016, "global_step": 58162, "epoch": 700} {"train_loss": -20.27345085144043, "global_step": 58163, "epoch": 700} {"train_loss": -20.000471115112305, "global_step": 58164, "epoch": 700} {"train_loss": -20.105680465698242, "global_step": 58165, "epoch": 700} {"train_loss": -20.616418838500977, "global_step": 58166, "epoch": 700} {"train_loss": -20.54768943786621, "global_step": 58167, "epoch": 700} {"train_loss": -20.300527572631836, "global_step": 58168, "epoch": 700} {"train_loss": -20.714319229125977, "global_step": 58169, "epoch": 700} {"train_loss": -20.333288192749023, "global_step": 58170, "epoch": 700} {"train_loss": -19.968114852905273, "global_step": 58171, "epoch": 700} {"train_loss": -20.395347595214844, "global_step": 58172, "epoch": 700} {"train_loss": -20.407285690307617, "global_step": 58173, "epoch": 700} {"train_loss": -20.404769897460938, "global_step": 58174, "epoch": 700} {"train_loss": -20.352468490600586, "global_step": 58175, "epoch": 700} {"train_loss": -20.06816291809082, "global_step": 58176, "epoch": 700} {"train_loss": -20.41560173034668, "global_step": 58177, "epoch": 700} {"train_loss": -20.1901912689209, "global_step": 58178, "epoch": 700} {"train_loss": -20.334362030029297, "global_step": 58179, "epoch": 700} {"train_loss": -20.459829330444336, "global_step": 58180, "epoch": 700} {"train_loss": -20.23362159729004, "global_step": 58181, "epoch": 700} {"train_loss": -20.26837335149926, "global_step": 58182, "epoch": 700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6112840.0} {"train_loss": -19.553133010864258, "global_step": 58183, "epoch": 701} {"train_loss": -19.718791961669922, "global_step": 58184, "epoch": 701} {"train_loss": -19.342193603515625, "global_step": 58185, "epoch": 701} {"train_loss": -19.631168365478516, "global_step": 58186, "epoch": 701} {"train_loss": -19.87343406677246, "global_step": 58187, "epoch": 701} {"train_loss": -20.26901626586914, "global_step": 58188, "epoch": 701} {"train_loss": -20.208324432373047, "global_step": 58189, "epoch": 701} {"train_loss": -20.055240631103516, "global_step": 58190, "epoch": 701} {"train_loss": -19.964445114135742, "global_step": 58191, "epoch": 701} {"train_loss": -20.1086483001709, "global_step": 58192, "epoch": 701} {"train_loss": -19.70060157775879, "global_step": 58193, "epoch": 701} {"train_loss": -19.949535369873047, "global_step": 58194, "epoch": 701} {"train_loss": -20.412954330444336, "global_step": 58195, "epoch": 701} {"train_loss": -20.082853317260742, "global_step": 58196, "epoch": 701} {"train_loss": -19.912139892578125, "global_step": 58197, "epoch": 701} {"train_loss": -19.6319637298584, "global_step": 58198, "epoch": 701} {"train_loss": -20.03788948059082, "global_step": 58199, "epoch": 701} {"train_loss": -20.124038696289062, "global_step": 58200, "epoch": 701} {"train_loss": -20.34358024597168, "global_step": 58201, "epoch": 701} {"train_loss": -19.953123092651367, "global_step": 58202, "epoch": 701} {"train_loss": -20.303442001342773, "global_step": 58203, "epoch": 701} {"train_loss": -20.44634437561035, "global_step": 58204, "epoch": 701} {"train_loss": -20.36274528503418, "global_step": 58205, "epoch": 701} {"train_loss": -20.19788932800293, "global_step": 58206, "epoch": 701} {"train_loss": -20.192922592163086, "global_step": 58207, "epoch": 701} {"train_loss": -20.1669921875, "global_step": 58208, "epoch": 701} {"train_loss": -20.383220672607422, "global_step": 58209, "epoch": 701} {"train_loss": -19.982685089111328, "global_step": 58210, "epoch": 701} {"train_loss": -20.127758026123047, "global_step": 58211, "epoch": 701} {"train_loss": -20.639606475830078, "global_step": 58212, "epoch": 701} {"train_loss": -20.49344253540039, "global_step": 58213, "epoch": 701} {"train_loss": -20.187652587890625, "global_step": 58214, "epoch": 701} {"train_loss": -20.35737419128418, "global_step": 58215, "epoch": 701} {"train_loss": -20.213863372802734, "global_step": 58216, "epoch": 701} {"train_loss": -20.644277572631836, "global_step": 58217, "epoch": 701} {"train_loss": -20.31471824645996, "global_step": 58218, "epoch": 701} {"train_loss": -20.138147354125977, "global_step": 58219, "epoch": 701} {"train_loss": -20.181949615478516, "global_step": 58220, "epoch": 701} {"train_loss": -19.897958755493164, "global_step": 58221, "epoch": 701} {"train_loss": -20.09084129333496, "global_step": 58222, "epoch": 701} {"train_loss": -20.2567081451416, "global_step": 58223, "epoch": 701} {"train_loss": -20.609237670898438, "global_step": 58224, "epoch": 701} {"train_loss": -20.30382537841797, "global_step": 58225, "epoch": 701} {"train_loss": -20.15253257751465, "global_step": 58226, "epoch": 701} {"train_loss": -19.9837646484375, "global_step": 58227, "epoch": 701} {"train_loss": -20.30146598815918, "global_step": 58228, "epoch": 701} {"train_loss": -20.37306785583496, "global_step": 58229, "epoch": 701} {"train_loss": -20.687253952026367, "global_step": 58230, "epoch": 701} {"train_loss": -20.178359985351562, "global_step": 58231, "epoch": 701} {"train_loss": -20.100595474243164, "global_step": 58232, "epoch": 701} {"train_loss": -20.24909019470215, "global_step": 58233, "epoch": 701} {"train_loss": -20.045166015625, "global_step": 58234, "epoch": 701} {"train_loss": -20.51498794555664, "global_step": 58235, "epoch": 701} {"train_loss": -20.545377731323242, "global_step": 58236, "epoch": 701} {"train_loss": -20.738628387451172, "global_step": 58237, "epoch": 701} {"train_loss": -20.36801528930664, "global_step": 58238, "epoch": 701} {"train_loss": -20.29910659790039, "global_step": 58239, "epoch": 701} {"train_loss": -20.45637321472168, "global_step": 58240, "epoch": 701} {"train_loss": -20.193857192993164, "global_step": 58241, "epoch": 701} {"train_loss": -20.278799057006836, "global_step": 58242, "epoch": 701} {"train_loss": -20.439258575439453, "global_step": 58243, "epoch": 701} {"train_loss": -20.591136932373047, "global_step": 58244, "epoch": 701} {"train_loss": -20.076574325561523, "global_step": 58245, "epoch": 701} {"train_loss": -20.642255783081055, "global_step": 58246, "epoch": 701} {"train_loss": -20.035507202148438, "global_step": 58247, "epoch": 701} {"train_loss": -20.275957107543945, "global_step": 58248, "epoch": 701} {"train_loss": -20.02833366394043, "global_step": 58249, "epoch": 701} {"train_loss": -19.93466567993164, "global_step": 58250, "epoch": 701} {"train_loss": -20.42932891845703, "global_step": 58251, "epoch": 701} {"train_loss": -20.310754776000977, "global_step": 58252, "epoch": 701} {"train_loss": -20.75960350036621, "global_step": 58253, "epoch": 701} {"train_loss": -20.41082191467285, "global_step": 58254, "epoch": 701} {"train_loss": -19.934925079345703, "global_step": 58255, "epoch": 701} {"train_loss": -20.49924659729004, "global_step": 58256, "epoch": 701} {"train_loss": -20.420391082763672, "global_step": 58257, "epoch": 701} {"train_loss": -19.897016525268555, "global_step": 58258, "epoch": 701} {"train_loss": -20.1776123046875, "global_step": 58259, "epoch": 701} {"train_loss": -20.550586700439453, "global_step": 58260, "epoch": 701} {"train_loss": -20.33535385131836, "global_step": 58261, "epoch": 701} {"train_loss": -20.53827667236328, "global_step": 58262, "epoch": 701} {"train_loss": -20.546157836914062, "global_step": 58263, "epoch": 701} {"train_loss": -20.592008590698242, "global_step": 58264, "epoch": 701} {"train_loss": -20.217634476811053, "global_step": 58265, "epoch": 701, "val_loss": 6003541.0} {"train_loss": -20.278318405151367, "global_step": 58266, "epoch": 702} {"train_loss": -19.8875732421875, "global_step": 58267, "epoch": 702} {"train_loss": -19.879150390625, "global_step": 58268, "epoch": 702} {"train_loss": -20.15261459350586, "global_step": 58269, "epoch": 702} {"train_loss": -20.372257232666016, "global_step": 58270, "epoch": 702} {"train_loss": -20.254690170288086, "global_step": 58271, "epoch": 702} {"train_loss": -20.378358840942383, "global_step": 58272, "epoch": 702} {"train_loss": -20.07465171813965, "global_step": 58273, "epoch": 702} {"train_loss": -20.141416549682617, "global_step": 58274, "epoch": 702} {"train_loss": -20.170743942260742, "global_step": 58275, "epoch": 702} {"train_loss": -20.26936912536621, "global_step": 58276, "epoch": 702} {"train_loss": -20.04685401916504, "global_step": 58277, "epoch": 702} {"train_loss": -20.263259887695312, "global_step": 58278, "epoch": 702} {"train_loss": -19.954055786132812, "global_step": 58279, "epoch": 702} {"train_loss": -20.257793426513672, "global_step": 58280, "epoch": 702} {"train_loss": -20.328638076782227, "global_step": 58281, "epoch": 702} {"train_loss": -20.318878173828125, "global_step": 58282, "epoch": 702} {"train_loss": -20.21045684814453, "global_step": 58283, "epoch": 702} {"train_loss": -20.383331298828125, "global_step": 58284, "epoch": 702} {"train_loss": -20.201248168945312, "global_step": 58285, "epoch": 702} {"train_loss": -20.1966609954834, "global_step": 58286, "epoch": 702} {"train_loss": -20.55010986328125, "global_step": 58287, "epoch": 702} {"train_loss": -20.309106826782227, "global_step": 58288, "epoch": 702} {"train_loss": -20.459487915039062, "global_step": 58289, "epoch": 702} {"train_loss": -20.31159019470215, "global_step": 58290, "epoch": 702} {"train_loss": -20.451021194458008, "global_step": 58291, "epoch": 702} {"train_loss": -19.717992782592773, "global_step": 58292, "epoch": 702} {"train_loss": -20.244504928588867, "global_step": 58293, "epoch": 702} {"train_loss": -20.175031661987305, "global_step": 58294, "epoch": 702} {"train_loss": -20.253000259399414, "global_step": 58295, "epoch": 702} {"train_loss": -20.23610496520996, "global_step": 58296, "epoch": 702} {"train_loss": -20.086299896240234, "global_step": 58297, "epoch": 702} {"train_loss": -20.45611000061035, "global_step": 58298, "epoch": 702} {"train_loss": -20.3209285736084, "global_step": 58299, "epoch": 702} {"train_loss": -20.584087371826172, "global_step": 58300, "epoch": 702} {"train_loss": -20.31989097595215, "global_step": 58301, "epoch": 702} {"train_loss": -20.323331832885742, "global_step": 58302, "epoch": 702} {"train_loss": -20.01569938659668, "global_step": 58303, "epoch": 702} {"train_loss": -20.4119930267334, "global_step": 58304, "epoch": 702} {"train_loss": -20.610584259033203, "global_step": 58305, "epoch": 702} {"train_loss": -19.973114013671875, "global_step": 58306, "epoch": 702} {"train_loss": -20.27144432067871, "global_step": 58307, "epoch": 702} {"train_loss": -20.5561580657959, "global_step": 58308, "epoch": 702} {"train_loss": -20.06056785583496, "global_step": 58309, "epoch": 702} {"train_loss": -19.88348388671875, "global_step": 58310, "epoch": 702} {"train_loss": -20.24201774597168, "global_step": 58311, "epoch": 702} {"train_loss": -20.243942260742188, "global_step": 58312, "epoch": 702} {"train_loss": -20.184900283813477, "global_step": 58313, "epoch": 702} {"train_loss": -20.22953987121582, "global_step": 58314, "epoch": 702} {"train_loss": -20.207197189331055, "global_step": 58315, "epoch": 702} {"train_loss": -19.916357040405273, "global_step": 58316, "epoch": 702} {"train_loss": -19.78980827331543, "global_step": 58317, "epoch": 702} {"train_loss": -20.150959014892578, "global_step": 58318, "epoch": 702} {"train_loss": -20.492374420166016, "global_step": 58319, "epoch": 702} {"train_loss": -20.326534271240234, "global_step": 58320, "epoch": 702} {"train_loss": -20.073423385620117, "global_step": 58321, "epoch": 702} {"train_loss": -20.523893356323242, "global_step": 58322, "epoch": 702} {"train_loss": -19.89727020263672, "global_step": 58323, "epoch": 702} {"train_loss": -20.720844268798828, "global_step": 58324, "epoch": 702} {"train_loss": -20.213735580444336, "global_step": 58325, "epoch": 702} {"train_loss": -20.151487350463867, "global_step": 58326, "epoch": 702} {"train_loss": -19.840559005737305, "global_step": 58327, "epoch": 702} {"train_loss": -20.38823890686035, "global_step": 58328, "epoch": 702} {"train_loss": -20.354259490966797, "global_step": 58329, "epoch": 702} {"train_loss": -20.591001510620117, "global_step": 58330, "epoch": 702} {"train_loss": -20.420501708984375, "global_step": 58331, "epoch": 702} {"train_loss": -20.382869720458984, "global_step": 58332, "epoch": 702} {"train_loss": -20.4645938873291, "global_step": 58333, "epoch": 702} {"train_loss": -20.653961181640625, "global_step": 58334, "epoch": 702} {"train_loss": -20.271753311157227, "global_step": 58335, "epoch": 702} {"train_loss": -20.596582412719727, "global_step": 58336, "epoch": 702} {"train_loss": -20.69833755493164, "global_step": 58337, "epoch": 702} {"train_loss": -20.339527130126953, "global_step": 58338, "epoch": 702} {"train_loss": -20.269750595092773, "global_step": 58339, "epoch": 702} {"train_loss": -20.5174617767334, "global_step": 58340, "epoch": 702} {"train_loss": -20.165925979614258, "global_step": 58341, "epoch": 702} {"train_loss": -20.315139770507812, "global_step": 58342, "epoch": 702} {"train_loss": -20.264118194580078, "global_step": 58343, "epoch": 702} {"train_loss": -20.53667640686035, "global_step": 58344, "epoch": 702} {"train_loss": -20.32999610900879, "global_step": 58345, "epoch": 702} {"train_loss": -20.466033935546875, "global_step": 58346, "epoch": 702} {"train_loss": -20.3304386138916, "global_step": 58347, "epoch": 702} {"train_loss": -20.297290250479456, "global_step": 58348, "epoch": 702, "val_loss": 6080731.5} {"train_loss": -20.02949333190918, "global_step": 58349, "epoch": 703} {"train_loss": -20.0380916595459, "global_step": 58350, "epoch": 703} {"train_loss": -20.375532150268555, "global_step": 58351, "epoch": 703} {"train_loss": -20.084501266479492, "global_step": 58352, "epoch": 703} {"train_loss": -20.18497085571289, "global_step": 58353, "epoch": 703} {"train_loss": -19.986408233642578, "global_step": 58354, "epoch": 703} {"train_loss": -20.065597534179688, "global_step": 58355, "epoch": 703} {"train_loss": -19.845422744750977, "global_step": 58356, "epoch": 703} {"train_loss": -20.10295867919922, "global_step": 58357, "epoch": 703} {"train_loss": -20.145801544189453, "global_step": 58358, "epoch": 703} {"train_loss": -20.378339767456055, "global_step": 58359, "epoch": 703} {"train_loss": -20.32032585144043, "global_step": 58360, "epoch": 703} {"train_loss": -20.23713493347168, "global_step": 58361, "epoch": 703} {"train_loss": -20.481367111206055, "global_step": 58362, "epoch": 703} {"train_loss": -19.914499282836914, "global_step": 58363, "epoch": 703} {"train_loss": -20.3791446685791, "global_step": 58364, "epoch": 703} {"train_loss": -20.26980972290039, "global_step": 58365, "epoch": 703} {"train_loss": -20.4245548248291, "global_step": 58366, "epoch": 703} {"train_loss": -20.602262496948242, "global_step": 58367, "epoch": 703} {"train_loss": -20.166242599487305, "global_step": 58368, "epoch": 703} {"train_loss": -20.288148880004883, "global_step": 58369, "epoch": 703} {"train_loss": -20.354692459106445, "global_step": 58370, "epoch": 703} {"train_loss": -20.286224365234375, "global_step": 58371, "epoch": 703} {"train_loss": -20.41036605834961, "global_step": 58372, "epoch": 703} {"train_loss": -20.312997817993164, "global_step": 58373, "epoch": 703} {"train_loss": -20.07665252685547, "global_step": 58374, "epoch": 703} {"train_loss": -20.409942626953125, "global_step": 58375, "epoch": 703} {"train_loss": -19.989248275756836, "global_step": 58376, "epoch": 703} {"train_loss": -19.960132598876953, "global_step": 58377, "epoch": 703} {"train_loss": -20.501689910888672, "global_step": 58378, "epoch": 703} {"train_loss": -20.461599349975586, "global_step": 58379, "epoch": 703} {"train_loss": -20.14166831970215, "global_step": 58380, "epoch": 703} {"train_loss": -20.583303451538086, "global_step": 58381, "epoch": 703} {"train_loss": -20.332075119018555, "global_step": 58382, "epoch": 703} {"train_loss": -20.309547424316406, "global_step": 58383, "epoch": 703} {"train_loss": -19.9597225189209, "global_step": 58384, "epoch": 703} {"train_loss": -20.43143653869629, "global_step": 58385, "epoch": 703} {"train_loss": -20.494009017944336, "global_step": 58386, "epoch": 703} {"train_loss": -20.550209045410156, "global_step": 58387, "epoch": 703} {"train_loss": -20.846607208251953, "global_step": 58388, "epoch": 703} {"train_loss": -20.330829620361328, "global_step": 58389, "epoch": 703} {"train_loss": -20.44035530090332, "global_step": 58390, "epoch": 703} {"train_loss": -20.28525733947754, "global_step": 58391, "epoch": 703} {"train_loss": -20.569555282592773, "global_step": 58392, "epoch": 703} {"train_loss": -20.216909408569336, "global_step": 58393, "epoch": 703} {"train_loss": -20.266664505004883, "global_step": 58394, "epoch": 703} {"train_loss": -20.361783981323242, "global_step": 58395, "epoch": 703} {"train_loss": -20.59905433654785, "global_step": 58396, "epoch": 703} {"train_loss": -20.2022762298584, "global_step": 58397, "epoch": 703} {"train_loss": -20.5052433013916, "global_step": 58398, "epoch": 703} {"train_loss": -20.250951766967773, "global_step": 58399, "epoch": 703} {"train_loss": -20.205703735351562, "global_step": 58400, "epoch": 703} {"train_loss": -20.43025016784668, "global_step": 58401, "epoch": 703} {"train_loss": -19.977005004882812, "global_step": 58402, "epoch": 703} {"train_loss": -20.297903060913086, "global_step": 58403, "epoch": 703} {"train_loss": -20.276227951049805, "global_step": 58404, "epoch": 703} {"train_loss": -20.641321182250977, "global_step": 58405, "epoch": 703} {"train_loss": -20.557743072509766, "global_step": 58406, "epoch": 703} {"train_loss": -20.60683250427246, "global_step": 58407, "epoch": 703} {"train_loss": -20.397647857666016, "global_step": 58408, "epoch": 703} {"train_loss": -20.254377365112305, "global_step": 58409, "epoch": 703} {"train_loss": -20.704425811767578, "global_step": 58410, "epoch": 703} {"train_loss": -20.564870834350586, "global_step": 58411, "epoch": 703} {"train_loss": -20.5596981048584, "global_step": 58412, "epoch": 703} {"train_loss": -20.061437606811523, "global_step": 58413, "epoch": 703} {"train_loss": -20.296070098876953, "global_step": 58414, "epoch": 703} {"train_loss": -20.210309982299805, "global_step": 58415, "epoch": 703} {"train_loss": -20.397628784179688, "global_step": 58416, "epoch": 703} {"train_loss": -20.45368003845215, "global_step": 58417, "epoch": 703} {"train_loss": -20.419889450073242, "global_step": 58418, "epoch": 703} {"train_loss": -20.428075790405273, "global_step": 58419, "epoch": 703} {"train_loss": -20.39240837097168, "global_step": 58420, "epoch": 703} {"train_loss": -20.42728614807129, "global_step": 58421, "epoch": 703} {"train_loss": -20.381786346435547, "global_step": 58422, "epoch": 703} {"train_loss": -20.587417602539062, "global_step": 58423, "epoch": 703} {"train_loss": -20.364696502685547, "global_step": 58424, "epoch": 703} {"train_loss": -20.19765281677246, "global_step": 58425, "epoch": 703} {"train_loss": -20.303464889526367, "global_step": 58426, "epoch": 703} {"train_loss": -20.15302085876465, "global_step": 58427, "epoch": 703} {"train_loss": -20.419099807739258, "global_step": 58428, "epoch": 703} {"train_loss": -20.536224365234375, "global_step": 58429, "epoch": 703} {"train_loss": -19.882265090942383, "global_step": 58430, "epoch": 703} {"train_loss": -20.337228085621295, "global_step": 58431, "epoch": 703, "val_loss": 5997699.0} {"train_loss": -20.275314331054688, "global_step": 58432, "epoch": 704} {"train_loss": -20.198884963989258, "global_step": 58433, "epoch": 704} {"train_loss": -20.3537540435791, "global_step": 58434, "epoch": 704} {"train_loss": -20.317712783813477, "global_step": 58435, "epoch": 704} {"train_loss": -20.079679489135742, "global_step": 58436, "epoch": 704} {"train_loss": -20.6199951171875, "global_step": 58437, "epoch": 704} {"train_loss": -20.085620880126953, "global_step": 58438, "epoch": 704} {"train_loss": -20.04459571838379, "global_step": 58439, "epoch": 704} {"train_loss": -19.869735717773438, "global_step": 58440, "epoch": 704} {"train_loss": -19.876148223876953, "global_step": 58441, "epoch": 704} {"train_loss": -20.20552635192871, "global_step": 58442, "epoch": 704} {"train_loss": -20.176443099975586, "global_step": 58443, "epoch": 704} {"train_loss": -20.422719955444336, "global_step": 58444, "epoch": 704} {"train_loss": -20.163042068481445, "global_step": 58445, "epoch": 704} {"train_loss": -20.3525333404541, "global_step": 58446, "epoch": 704} {"train_loss": -20.021331787109375, "global_step": 58447, "epoch": 704} {"train_loss": -20.614431381225586, "global_step": 58448, "epoch": 704} {"train_loss": -19.974529266357422, "global_step": 58449, "epoch": 704} {"train_loss": -20.300161361694336, "global_step": 58450, "epoch": 704} {"train_loss": -20.364103317260742, "global_step": 58451, "epoch": 704} {"train_loss": -20.2819881439209, "global_step": 58452, "epoch": 704} {"train_loss": -20.17123794555664, "global_step": 58453, "epoch": 704} {"train_loss": -20.1688175201416, "global_step": 58454, "epoch": 704} {"train_loss": -20.47920036315918, "global_step": 58455, "epoch": 704} {"train_loss": -19.916799545288086, "global_step": 58456, "epoch": 704} {"train_loss": -20.612985610961914, "global_step": 58457, "epoch": 704} {"train_loss": -20.355243682861328, "global_step": 58458, "epoch": 704} {"train_loss": -20.504819869995117, "global_step": 58459, "epoch": 704} {"train_loss": -20.178285598754883, "global_step": 58460, "epoch": 704} {"train_loss": -20.494678497314453, "global_step": 58461, "epoch": 704} {"train_loss": -20.437713623046875, "global_step": 58462, "epoch": 704} {"train_loss": -20.163177490234375, "global_step": 58463, "epoch": 704} {"train_loss": -20.9443302154541, "global_step": 58464, "epoch": 704} {"train_loss": -20.3101863861084, "global_step": 58465, "epoch": 704} {"train_loss": -20.335973739624023, "global_step": 58466, "epoch": 704} {"train_loss": -20.66937828063965, "global_step": 58467, "epoch": 704} {"train_loss": -19.9107608795166, "global_step": 58468, "epoch": 704} {"train_loss": -20.298559188842773, "global_step": 58469, "epoch": 704} {"train_loss": -20.305484771728516, "global_step": 58470, "epoch": 704} {"train_loss": -20.467092514038086, "global_step": 58471, "epoch": 704} {"train_loss": -20.403676986694336, "global_step": 58472, "epoch": 704} {"train_loss": -20.29789161682129, "global_step": 58473, "epoch": 704} {"train_loss": -20.314199447631836, "global_step": 58474, "epoch": 704} {"train_loss": -20.816354751586914, "global_step": 58475, "epoch": 704} {"train_loss": -20.80244255065918, "global_step": 58476, "epoch": 704} {"train_loss": -20.603418350219727, "global_step": 58477, "epoch": 704} {"train_loss": -20.25739860534668, "global_step": 58478, "epoch": 704} {"train_loss": -20.349292755126953, "global_step": 58479, "epoch": 704} {"train_loss": -19.994596481323242, "global_step": 58480, "epoch": 704} {"train_loss": -20.289216995239258, "global_step": 58481, "epoch": 704} {"train_loss": -20.28394889831543, "global_step": 58482, "epoch": 704} {"train_loss": -20.181060791015625, "global_step": 58483, "epoch": 704} {"train_loss": -20.59942626953125, "global_step": 58484, "epoch": 704} {"train_loss": -20.698240280151367, "global_step": 58485, "epoch": 704} {"train_loss": -20.3122615814209, "global_step": 58486, "epoch": 704} {"train_loss": -20.285354614257812, "global_step": 58487, "epoch": 704} {"train_loss": -20.505390167236328, "global_step": 58488, "epoch": 704} {"train_loss": -20.235416412353516, "global_step": 58489, "epoch": 704} {"train_loss": -20.470014572143555, "global_step": 58490, "epoch": 704} {"train_loss": -20.281522750854492, "global_step": 58491, "epoch": 704} {"train_loss": -20.28922462463379, "global_step": 58492, "epoch": 704} {"train_loss": -20.408464431762695, "global_step": 58493, "epoch": 704} {"train_loss": -20.40087127685547, "global_step": 58494, "epoch": 704} {"train_loss": -20.380002975463867, "global_step": 58495, "epoch": 704} {"train_loss": -20.56903648376465, "global_step": 58496, "epoch": 704} {"train_loss": -20.502197265625, "global_step": 58497, "epoch": 704} {"train_loss": -20.479223251342773, "global_step": 58498, "epoch": 704} {"train_loss": -19.85258674621582, "global_step": 58499, "epoch": 704} {"train_loss": -20.34284782409668, "global_step": 58500, "epoch": 704} {"train_loss": -20.539392471313477, "global_step": 58501, "epoch": 704} {"train_loss": -20.29628562927246, "global_step": 58502, "epoch": 704} {"train_loss": -20.02170181274414, "global_step": 58503, "epoch": 704} {"train_loss": -20.048755645751953, "global_step": 58504, "epoch": 704} {"train_loss": -20.13901138305664, "global_step": 58505, "epoch": 704} {"train_loss": -20.39621353149414, "global_step": 58506, "epoch": 704} {"train_loss": -20.145801544189453, "global_step": 58507, "epoch": 704} {"train_loss": -20.192182540893555, "global_step": 58508, "epoch": 704} {"train_loss": -20.50437355041504, "global_step": 58509, "epoch": 704} {"train_loss": -19.634313583374023, "global_step": 58510, "epoch": 704} {"train_loss": -20.220544815063477, "global_step": 58511, "epoch": 704} {"train_loss": -20.242229461669922, "global_step": 58512, "epoch": 704} {"train_loss": -20.230344772338867, "global_step": 58513, "epoch": 704} {"train_loss": -20.31796142853886, "global_step": 58514, "epoch": 704, "val_loss": 5950583.5} {"train_loss": -20.225561141967773, "global_step": 58515, "epoch": 705} {"train_loss": -20.065093994140625, "global_step": 58516, "epoch": 705} {"train_loss": -20.342342376708984, "global_step": 58517, "epoch": 705} {"train_loss": -20.32783317565918, "global_step": 58518, "epoch": 705} {"train_loss": -20.080230712890625, "global_step": 58519, "epoch": 705} {"train_loss": -20.24129295349121, "global_step": 58520, "epoch": 705} {"train_loss": -20.193248748779297, "global_step": 58521, "epoch": 705} {"train_loss": -20.245206832885742, "global_step": 58522, "epoch": 705} {"train_loss": -20.511259078979492, "global_step": 58523, "epoch": 705} {"train_loss": -20.293609619140625, "global_step": 58524, "epoch": 705} {"train_loss": -20.05665397644043, "global_step": 58525, "epoch": 705} {"train_loss": -20.23337173461914, "global_step": 58526, "epoch": 705} {"train_loss": -20.332630157470703, "global_step": 58527, "epoch": 705} {"train_loss": -20.283132553100586, "global_step": 58528, "epoch": 705} {"train_loss": -20.425067901611328, "global_step": 58529, "epoch": 705} {"train_loss": -20.125017166137695, "global_step": 58530, "epoch": 705} {"train_loss": -20.033525466918945, "global_step": 58531, "epoch": 705} {"train_loss": -20.337894439697266, "global_step": 58532, "epoch": 705} {"train_loss": -20.288888931274414, "global_step": 58533, "epoch": 705} {"train_loss": -20.283466339111328, "global_step": 58534, "epoch": 705} {"train_loss": -20.327533721923828, "global_step": 58535, "epoch": 705} {"train_loss": -20.0446834564209, "global_step": 58536, "epoch": 705} {"train_loss": -19.993350982666016, "global_step": 58537, "epoch": 705} {"train_loss": -20.040380477905273, "global_step": 58538, "epoch": 705} {"train_loss": -20.252338409423828, "global_step": 58539, "epoch": 705} {"train_loss": -20.55243492126465, "global_step": 58540, "epoch": 705} {"train_loss": -20.190073013305664, "global_step": 58541, "epoch": 705} {"train_loss": -19.8668270111084, "global_step": 58542, "epoch": 705} {"train_loss": -20.621246337890625, "global_step": 58543, "epoch": 705} {"train_loss": -20.175125122070312, "global_step": 58544, "epoch": 705} {"train_loss": -20.22003746032715, "global_step": 58545, "epoch": 705} {"train_loss": -20.159927368164062, "global_step": 58546, "epoch": 705} {"train_loss": -20.161808013916016, "global_step": 58547, "epoch": 705} {"train_loss": -20.330106735229492, "global_step": 58548, "epoch": 705} {"train_loss": -19.972023010253906, "global_step": 58549, "epoch": 705} {"train_loss": -20.04315185546875, "global_step": 58550, "epoch": 705} {"train_loss": -20.23773956298828, "global_step": 58551, "epoch": 705} {"train_loss": -20.305753707885742, "global_step": 58552, "epoch": 705} {"train_loss": -20.73236083984375, "global_step": 58553, "epoch": 705} {"train_loss": -20.58565902709961, "global_step": 58554, "epoch": 705} {"train_loss": -20.54541015625, "global_step": 58555, "epoch": 705} {"train_loss": -20.300565719604492, "global_step": 58556, "epoch": 705} {"train_loss": -20.55691909790039, "global_step": 58557, "epoch": 705} {"train_loss": -20.736726760864258, "global_step": 58558, "epoch": 705} {"train_loss": -20.61191177368164, "global_step": 58559, "epoch": 705} {"train_loss": -20.61151695251465, "global_step": 58560, "epoch": 705} {"train_loss": -20.127025604248047, "global_step": 58561, "epoch": 705} {"train_loss": -20.060911178588867, "global_step": 58562, "epoch": 705} {"train_loss": -20.480327606201172, "global_step": 58563, "epoch": 705} {"train_loss": -20.010608673095703, "global_step": 58564, "epoch": 705} {"train_loss": -20.179725646972656, "global_step": 58565, "epoch": 705} {"train_loss": -20.161985397338867, "global_step": 58566, "epoch": 705} {"train_loss": -19.84827995300293, "global_step": 58567, "epoch": 705} {"train_loss": -20.50606346130371, "global_step": 58568, "epoch": 705} {"train_loss": -20.183353424072266, "global_step": 58569, "epoch": 705} {"train_loss": -20.008625030517578, "global_step": 58570, "epoch": 705} {"train_loss": -20.107667922973633, "global_step": 58571, "epoch": 705} {"train_loss": -20.071359634399414, "global_step": 58572, "epoch": 705} {"train_loss": -20.049327850341797, "global_step": 58573, "epoch": 705} {"train_loss": -20.394838333129883, "global_step": 58574, "epoch": 705} {"train_loss": -20.0985164642334, "global_step": 58575, "epoch": 705} {"train_loss": -20.543336868286133, "global_step": 58576, "epoch": 705} {"train_loss": -20.438383102416992, "global_step": 58577, "epoch": 705} {"train_loss": -20.216922760009766, "global_step": 58578, "epoch": 705} {"train_loss": -20.462844848632812, "global_step": 58579, "epoch": 705} {"train_loss": -20.38764190673828, "global_step": 58580, "epoch": 705} {"train_loss": -20.313444137573242, "global_step": 58581, "epoch": 705} {"train_loss": -20.309289932250977, "global_step": 58582, "epoch": 705} {"train_loss": -20.60149383544922, "global_step": 58583, "epoch": 705} {"train_loss": -20.010223388671875, "global_step": 58584, "epoch": 705} {"train_loss": -20.467395782470703, "global_step": 58585, "epoch": 705} {"train_loss": -20.24585723876953, "global_step": 58586, "epoch": 705} {"train_loss": -20.000391006469727, "global_step": 58587, "epoch": 705} {"train_loss": -20.3980770111084, "global_step": 58588, "epoch": 705} {"train_loss": -20.46103286743164, "global_step": 58589, "epoch": 705} {"train_loss": -20.431102752685547, "global_step": 58590, "epoch": 705} {"train_loss": -20.264251708984375, "global_step": 58591, "epoch": 705} {"train_loss": -20.498504638671875, "global_step": 58592, "epoch": 705} {"train_loss": -20.236236572265625, "global_step": 58593, "epoch": 705} {"train_loss": -20.353940963745117, "global_step": 58594, "epoch": 705} {"train_loss": -20.54368019104004, "global_step": 58595, "epoch": 705} {"train_loss": -20.5158634185791, "global_step": 58596, "epoch": 705} {"train_loss": -20.27251921504377, "global_step": 58597, "epoch": 705, "val_loss": 6000239.0} {"train_loss": -20.062049865722656, "global_step": 58598, "epoch": 706} {"train_loss": -20.40035629272461, "global_step": 58599, "epoch": 706} {"train_loss": -20.229522705078125, "global_step": 58600, "epoch": 706} {"train_loss": -19.99129295349121, "global_step": 58601, "epoch": 706} {"train_loss": -20.483884811401367, "global_step": 58602, "epoch": 706} {"train_loss": -20.084468841552734, "global_step": 58603, "epoch": 706} {"train_loss": -20.455745697021484, "global_step": 58604, "epoch": 706} {"train_loss": -20.082548141479492, "global_step": 58605, "epoch": 706} {"train_loss": -20.190113067626953, "global_step": 58606, "epoch": 706} {"train_loss": -20.57087516784668, "global_step": 58607, "epoch": 706} {"train_loss": -20.256610870361328, "global_step": 58608, "epoch": 706} {"train_loss": -20.78217124938965, "global_step": 58609, "epoch": 706} {"train_loss": -20.405174255371094, "global_step": 58610, "epoch": 706} {"train_loss": -20.26289176940918, "global_step": 58611, "epoch": 706} {"train_loss": -20.437835693359375, "global_step": 58612, "epoch": 706} {"train_loss": -20.063507080078125, "global_step": 58613, "epoch": 706} {"train_loss": -20.30537223815918, "global_step": 58614, "epoch": 706} {"train_loss": -20.255041122436523, "global_step": 58615, "epoch": 706} {"train_loss": -20.24192237854004, "global_step": 58616, "epoch": 706} {"train_loss": -20.302610397338867, "global_step": 58617, "epoch": 706} {"train_loss": -20.505441665649414, "global_step": 58618, "epoch": 706} {"train_loss": -20.263154983520508, "global_step": 58619, "epoch": 706} {"train_loss": -20.086078643798828, "global_step": 58620, "epoch": 706} {"train_loss": -19.908008575439453, "global_step": 58621, "epoch": 706} {"train_loss": -20.34238624572754, "global_step": 58622, "epoch": 706} {"train_loss": -20.22150230407715, "global_step": 58623, "epoch": 706} {"train_loss": -20.49867057800293, "global_step": 58624, "epoch": 706} {"train_loss": -20.528797149658203, "global_step": 58625, "epoch": 706} {"train_loss": -20.364551544189453, "global_step": 58626, "epoch": 706} {"train_loss": -20.199443817138672, "global_step": 58627, "epoch": 706} {"train_loss": -20.518781661987305, "global_step": 58628, "epoch": 706} {"train_loss": -19.977384567260742, "global_step": 58629, "epoch": 706} {"train_loss": -20.57684898376465, "global_step": 58630, "epoch": 706} {"train_loss": -20.361379623413086, "global_step": 58631, "epoch": 706} {"train_loss": -20.437149047851562, "global_step": 58632, "epoch": 706} {"train_loss": -20.326353073120117, "global_step": 58633, "epoch": 706} {"train_loss": -20.276456832885742, "global_step": 58634, "epoch": 706} {"train_loss": -20.23422622680664, "global_step": 58635, "epoch": 706} {"train_loss": -20.27876091003418, "global_step": 58636, "epoch": 706} {"train_loss": -20.59104347229004, "global_step": 58637, "epoch": 706} {"train_loss": -20.65032386779785, "global_step": 58638, "epoch": 706} {"train_loss": -20.196508407592773, "global_step": 58639, "epoch": 706} {"train_loss": -20.40645980834961, "global_step": 58640, "epoch": 706} {"train_loss": -20.346576690673828, "global_step": 58641, "epoch": 706} {"train_loss": -20.61494255065918, "global_step": 58642, "epoch": 706} {"train_loss": -20.53668212890625, "global_step": 58643, "epoch": 706} {"train_loss": -20.529985427856445, "global_step": 58644, "epoch": 706} {"train_loss": -20.627294540405273, "global_step": 58645, "epoch": 706} {"train_loss": -20.56606674194336, "global_step": 58646, "epoch": 706} {"train_loss": -20.22751808166504, "global_step": 58647, "epoch": 706} {"train_loss": -20.558500289916992, "global_step": 58648, "epoch": 706} {"train_loss": -20.587316513061523, "global_step": 58649, "epoch": 706} {"train_loss": -20.18585205078125, "global_step": 58650, "epoch": 706} {"train_loss": -20.75592613220215, "global_step": 58651, "epoch": 706} {"train_loss": -20.56978416442871, "global_step": 58652, "epoch": 706} {"train_loss": -20.286914825439453, "global_step": 58653, "epoch": 706} {"train_loss": -20.567331314086914, "global_step": 58654, "epoch": 706} {"train_loss": -20.507396697998047, "global_step": 58655, "epoch": 706} {"train_loss": -20.66180419921875, "global_step": 58656, "epoch": 706} {"train_loss": -20.323102951049805, "global_step": 58657, "epoch": 706} {"train_loss": -20.337360382080078, "global_step": 58658, "epoch": 706} {"train_loss": -20.35788917541504, "global_step": 58659, "epoch": 706} {"train_loss": -19.927907943725586, "global_step": 58660, "epoch": 706} {"train_loss": -20.209096908569336, "global_step": 58661, "epoch": 706} {"train_loss": -20.477773666381836, "global_step": 58662, "epoch": 706} {"train_loss": -20.114168167114258, "global_step": 58663, "epoch": 706} {"train_loss": -20.046785354614258, "global_step": 58664, "epoch": 706} {"train_loss": -20.587621688842773, "global_step": 58665, "epoch": 706} {"train_loss": -20.06123924255371, "global_step": 58666, "epoch": 706} {"train_loss": -20.418216705322266, "global_step": 58667, "epoch": 706} {"train_loss": -20.29674530029297, "global_step": 58668, "epoch": 706} {"train_loss": -20.731115341186523, "global_step": 58669, "epoch": 706} {"train_loss": -20.345600128173828, "global_step": 58670, "epoch": 706} {"train_loss": -20.565101623535156, "global_step": 58671, "epoch": 706} {"train_loss": -20.093082427978516, "global_step": 58672, "epoch": 706} {"train_loss": -20.77490234375, "global_step": 58673, "epoch": 706} {"train_loss": -20.471830368041992, "global_step": 58674, "epoch": 706} {"train_loss": -20.304861068725586, "global_step": 58675, "epoch": 706} {"train_loss": -20.23628807067871, "global_step": 58676, "epoch": 706} {"train_loss": -20.09552574157715, "global_step": 58677, "epoch": 706} {"train_loss": -20.45741844177246, "global_step": 58678, "epoch": 706} {"train_loss": -20.411571502685547, "global_step": 58679, "epoch": 706} {"train_loss": -20.370448238878364, "global_step": 58680, "epoch": 706, "val_loss": 6040045.0} {"train_loss": -20.578031539916992, "global_step": 58681, "epoch": 707} {"train_loss": -20.257078170776367, "global_step": 58682, "epoch": 707} {"train_loss": -20.216388702392578, "global_step": 58683, "epoch": 707} {"train_loss": -20.175321578979492, "global_step": 58684, "epoch": 707} {"train_loss": -20.42963218688965, "global_step": 58685, "epoch": 707} {"train_loss": -20.110639572143555, "global_step": 58686, "epoch": 707} {"train_loss": -20.44232749938965, "global_step": 58687, "epoch": 707} {"train_loss": -20.154361724853516, "global_step": 58688, "epoch": 707} {"train_loss": -20.074949264526367, "global_step": 58689, "epoch": 707} {"train_loss": -20.209814071655273, "global_step": 58690, "epoch": 707} {"train_loss": -20.25815773010254, "global_step": 58691, "epoch": 707} {"train_loss": -20.220361709594727, "global_step": 58692, "epoch": 707} {"train_loss": -20.277761459350586, "global_step": 58693, "epoch": 707} {"train_loss": -20.35767936706543, "global_step": 58694, "epoch": 707} {"train_loss": -20.241695404052734, "global_step": 58695, "epoch": 707} {"train_loss": -20.140018463134766, "global_step": 58696, "epoch": 707} {"train_loss": -20.567554473876953, "global_step": 58697, "epoch": 707} {"train_loss": -20.18120765686035, "global_step": 58698, "epoch": 707} {"train_loss": -20.393659591674805, "global_step": 58699, "epoch": 707} {"train_loss": -20.09504508972168, "global_step": 58700, "epoch": 707} {"train_loss": -20.14183807373047, "global_step": 58701, "epoch": 707} {"train_loss": -20.419994354248047, "global_step": 58702, "epoch": 707} {"train_loss": -20.274335861206055, "global_step": 58703, "epoch": 707} {"train_loss": -20.309030532836914, "global_step": 58704, "epoch": 707} {"train_loss": -20.21506690979004, "global_step": 58705, "epoch": 707} {"train_loss": -20.1484317779541, "global_step": 58706, "epoch": 707} {"train_loss": -20.42873191833496, "global_step": 58707, "epoch": 707} {"train_loss": -20.40204620361328, "global_step": 58708, "epoch": 707} {"train_loss": -20.733774185180664, "global_step": 58709, "epoch": 707} {"train_loss": -20.0870418548584, "global_step": 58710, "epoch": 707} {"train_loss": -20.301660537719727, "global_step": 58711, "epoch": 707} {"train_loss": -20.474458694458008, "global_step": 58712, "epoch": 707} {"train_loss": -20.094165802001953, "global_step": 58713, "epoch": 707} {"train_loss": -19.911151885986328, "global_step": 58714, "epoch": 707} {"train_loss": -20.140226364135742, "global_step": 58715, "epoch": 707} {"train_loss": -20.279706954956055, "global_step": 58716, "epoch": 707} {"train_loss": -20.21256446838379, "global_step": 58717, "epoch": 707} {"train_loss": -20.73142433166504, "global_step": 58718, "epoch": 707} {"train_loss": -20.75662612915039, "global_step": 58719, "epoch": 707} {"train_loss": -20.450178146362305, "global_step": 58720, "epoch": 707} {"train_loss": -20.21486473083496, "global_step": 58721, "epoch": 707} {"train_loss": -20.114973068237305, "global_step": 58722, "epoch": 707} {"train_loss": -20.358015060424805, "global_step": 58723, "epoch": 707} {"train_loss": -20.201040267944336, "global_step": 58724, "epoch": 707} {"train_loss": -20.23366355895996, "global_step": 58725, "epoch": 707} {"train_loss": -20.57367515563965, "global_step": 58726, "epoch": 707} {"train_loss": -20.241933822631836, "global_step": 58727, "epoch": 707} {"train_loss": -20.178281784057617, "global_step": 58728, "epoch": 707} {"train_loss": -20.368423461914062, "global_step": 58729, "epoch": 707} {"train_loss": -20.526426315307617, "global_step": 58730, "epoch": 707} {"train_loss": -20.584171295166016, "global_step": 58731, "epoch": 707} {"train_loss": -20.45553970336914, "global_step": 58732, "epoch": 707} {"train_loss": -20.411436080932617, "global_step": 58733, "epoch": 707} {"train_loss": -20.2373104095459, "global_step": 58734, "epoch": 707} {"train_loss": -19.926288604736328, "global_step": 58735, "epoch": 707} {"train_loss": -20.845827102661133, "global_step": 58736, "epoch": 707} {"train_loss": -20.749792098999023, "global_step": 58737, "epoch": 707} {"train_loss": -20.3941650390625, "global_step": 58738, "epoch": 707} {"train_loss": -20.23648452758789, "global_step": 58739, "epoch": 707} {"train_loss": -20.321256637573242, "global_step": 58740, "epoch": 707} {"train_loss": -20.257549285888672, "global_step": 58741, "epoch": 707} {"train_loss": -20.212509155273438, "global_step": 58742, "epoch": 707} {"train_loss": -20.508413314819336, "global_step": 58743, "epoch": 707} {"train_loss": -20.42314910888672, "global_step": 58744, "epoch": 707} {"train_loss": -20.6048641204834, "global_step": 58745, "epoch": 707} {"train_loss": -20.383737564086914, "global_step": 58746, "epoch": 707} {"train_loss": -20.396581649780273, "global_step": 58747, "epoch": 707} {"train_loss": -20.343734741210938, "global_step": 58748, "epoch": 707} {"train_loss": -20.408552169799805, "global_step": 58749, "epoch": 707} {"train_loss": -20.460187911987305, "global_step": 58750, "epoch": 707} {"train_loss": -20.24043846130371, "global_step": 58751, "epoch": 707} {"train_loss": -20.487335205078125, "global_step": 58752, "epoch": 707} {"train_loss": -20.261198043823242, "global_step": 58753, "epoch": 707} {"train_loss": -20.099796295166016, "global_step": 58754, "epoch": 707} {"train_loss": -20.679996490478516, "global_step": 58755, "epoch": 707} {"train_loss": -20.605640411376953, "global_step": 58756, "epoch": 707} {"train_loss": -20.40260124206543, "global_step": 58757, "epoch": 707} {"train_loss": -20.019750595092773, "global_step": 58758, "epoch": 707} {"train_loss": -20.5047664642334, "global_step": 58759, "epoch": 707} {"train_loss": -20.008167266845703, "global_step": 58760, "epoch": 707} {"train_loss": -20.45417594909668, "global_step": 58761, "epoch": 707} {"train_loss": -20.237882614135742, "global_step": 58762, "epoch": 707} {"train_loss": -20.335223117506647, "global_step": 58763, "epoch": 707, "val_loss": 6098854.5} {"train_loss": -19.42156410217285, "global_step": 58764, "epoch": 708} {"train_loss": -19.83368492126465, "global_step": 58765, "epoch": 708} {"train_loss": -19.44693946838379, "global_step": 58766, "epoch": 708} {"train_loss": -20.158292770385742, "global_step": 58767, "epoch": 708} {"train_loss": -20.25421714782715, "global_step": 58768, "epoch": 708} {"train_loss": -20.330717086791992, "global_step": 58769, "epoch": 708} {"train_loss": -20.114843368530273, "global_step": 58770, "epoch": 708} {"train_loss": -19.894357681274414, "global_step": 58771, "epoch": 708} {"train_loss": -20.138967514038086, "global_step": 58772, "epoch": 708} {"train_loss": -20.009458541870117, "global_step": 58773, "epoch": 708} {"train_loss": -20.08296775817871, "global_step": 58774, "epoch": 708} {"train_loss": -20.040821075439453, "global_step": 58775, "epoch": 708} {"train_loss": -19.597320556640625, "global_step": 58776, "epoch": 708} {"train_loss": -20.37619972229004, "global_step": 58777, "epoch": 708} {"train_loss": -19.918561935424805, "global_step": 58778, "epoch": 708} {"train_loss": -20.119455337524414, "global_step": 58779, "epoch": 708} {"train_loss": -20.36845588684082, "global_step": 58780, "epoch": 708} {"train_loss": -20.302011489868164, "global_step": 58781, "epoch": 708} {"train_loss": -20.191307067871094, "global_step": 58782, "epoch": 708} {"train_loss": -20.335153579711914, "global_step": 58783, "epoch": 708} {"train_loss": -19.910797119140625, "global_step": 58784, "epoch": 708} {"train_loss": -20.259862899780273, "global_step": 58785, "epoch": 708} {"train_loss": -20.65950584411621, "global_step": 58786, "epoch": 708} {"train_loss": -20.060102462768555, "global_step": 58787, "epoch": 708} {"train_loss": -19.78208351135254, "global_step": 58788, "epoch": 708} {"train_loss": -20.101520538330078, "global_step": 58789, "epoch": 708} {"train_loss": -20.595624923706055, "global_step": 58790, "epoch": 708} {"train_loss": -20.453420639038086, "global_step": 58791, "epoch": 708} {"train_loss": -20.182653427124023, "global_step": 58792, "epoch": 708} {"train_loss": -20.335874557495117, "global_step": 58793, "epoch": 708} {"train_loss": -20.072643280029297, "global_step": 58794, "epoch": 708} {"train_loss": -20.39156723022461, "global_step": 58795, "epoch": 708} {"train_loss": -20.22810173034668, "global_step": 58796, "epoch": 708} {"train_loss": -20.131240844726562, "global_step": 58797, "epoch": 708} {"train_loss": -20.287582397460938, "global_step": 58798, "epoch": 708} {"train_loss": -19.849441528320312, "global_step": 58799, "epoch": 708} {"train_loss": -20.435367584228516, "global_step": 58800, "epoch": 708} {"train_loss": -20.38923454284668, "global_step": 58801, "epoch": 708} {"train_loss": -20.225784301757812, "global_step": 58802, "epoch": 708} {"train_loss": -20.185306549072266, "global_step": 58803, "epoch": 708} {"train_loss": -20.471220016479492, "global_step": 58804, "epoch": 708} {"train_loss": -20.247961044311523, "global_step": 58805, "epoch": 708} {"train_loss": -20.05219078063965, "global_step": 58806, "epoch": 708} {"train_loss": -20.231359481811523, "global_step": 58807, "epoch": 708} {"train_loss": -20.41054344177246, "global_step": 58808, "epoch": 708} {"train_loss": -20.1466121673584, "global_step": 58809, "epoch": 708} {"train_loss": -20.661428451538086, "global_step": 58810, "epoch": 708} {"train_loss": -20.417011260986328, "global_step": 58811, "epoch": 708} {"train_loss": -20.31130599975586, "global_step": 58812, "epoch": 708} {"train_loss": -20.375396728515625, "global_step": 58813, "epoch": 708} {"train_loss": -20.57215690612793, "global_step": 58814, "epoch": 708} {"train_loss": -20.397493362426758, "global_step": 58815, "epoch": 708} {"train_loss": -20.2546443939209, "global_step": 58816, "epoch": 708} {"train_loss": -20.280363082885742, "global_step": 58817, "epoch": 708} {"train_loss": -20.617816925048828, "global_step": 58818, "epoch": 708} {"train_loss": -20.50603675842285, "global_step": 58819, "epoch": 708} {"train_loss": -20.433067321777344, "global_step": 58820, "epoch": 708} {"train_loss": -20.26816749572754, "global_step": 58821, "epoch": 708} {"train_loss": -20.319482803344727, "global_step": 58822, "epoch": 708} {"train_loss": -20.43182945251465, "global_step": 58823, "epoch": 708} {"train_loss": -20.2962589263916, "global_step": 58824, "epoch": 708} {"train_loss": -19.96188735961914, "global_step": 58825, "epoch": 708} {"train_loss": -20.085857391357422, "global_step": 58826, "epoch": 708} {"train_loss": -20.624311447143555, "global_step": 58827, "epoch": 708} {"train_loss": -20.53461456298828, "global_step": 58828, "epoch": 708} {"train_loss": -20.12821388244629, "global_step": 58829, "epoch": 708} {"train_loss": -20.50773811340332, "global_step": 58830, "epoch": 708} {"train_loss": -20.49245262145996, "global_step": 58831, "epoch": 708} {"train_loss": -19.954280853271484, "global_step": 58832, "epoch": 708} {"train_loss": -20.064119338989258, "global_step": 58833, "epoch": 708} {"train_loss": -19.99884033203125, "global_step": 58834, "epoch": 708} {"train_loss": -20.358762741088867, "global_step": 58835, "epoch": 708} {"train_loss": -20.679574966430664, "global_step": 58836, "epoch": 708} {"train_loss": -20.508466720581055, "global_step": 58837, "epoch": 708} {"train_loss": -20.557424545288086, "global_step": 58838, "epoch": 708} {"train_loss": -20.375858306884766, "global_step": 58839, "epoch": 708} {"train_loss": -20.281524658203125, "global_step": 58840, "epoch": 708} {"train_loss": -20.267301559448242, "global_step": 58841, "epoch": 708} {"train_loss": -20.515182495117188, "global_step": 58842, "epoch": 708} {"train_loss": -20.35993003845215, "global_step": 58843, "epoch": 708} {"train_loss": -20.17713165283203, "global_step": 58844, "epoch": 708} {"train_loss": -20.521268844604492, "global_step": 58845, "epoch": 708} {"train_loss": -20.227263255291675, "global_step": 58846, "epoch": 708, "val_loss": 5903836.0} {"train_loss": -20.06353759765625, "global_step": 58847, "epoch": 709} {"train_loss": -19.916723251342773, "global_step": 58848, "epoch": 709} {"train_loss": -20.11297035217285, "global_step": 58849, "epoch": 709} {"train_loss": -20.103866577148438, "global_step": 58850, "epoch": 709} {"train_loss": -20.380300521850586, "global_step": 58851, "epoch": 709} {"train_loss": -19.975431442260742, "global_step": 58852, "epoch": 709} {"train_loss": -19.651296615600586, "global_step": 58853, "epoch": 709} {"train_loss": -20.12110710144043, "global_step": 58854, "epoch": 709} {"train_loss": -20.062454223632812, "global_step": 58855, "epoch": 709} {"train_loss": -19.853368759155273, "global_step": 58856, "epoch": 709} {"train_loss": -19.9754695892334, "global_step": 58857, "epoch": 709} {"train_loss": -20.08492088317871, "global_step": 58858, "epoch": 709} {"train_loss": -20.02508544921875, "global_step": 58859, "epoch": 709} {"train_loss": -19.852737426757812, "global_step": 58860, "epoch": 709} {"train_loss": -20.327268600463867, "global_step": 58861, "epoch": 709} {"train_loss": -20.25661277770996, "global_step": 58862, "epoch": 709} {"train_loss": -20.29496955871582, "global_step": 58863, "epoch": 709} {"train_loss": -20.359594345092773, "global_step": 58864, "epoch": 709} {"train_loss": -19.963592529296875, "global_step": 58865, "epoch": 709} {"train_loss": -20.068017959594727, "global_step": 58866, "epoch": 709} {"train_loss": -20.418779373168945, "global_step": 58867, "epoch": 709} {"train_loss": -20.673063278198242, "global_step": 58868, "epoch": 709} {"train_loss": -19.948400497436523, "global_step": 58869, "epoch": 709} {"train_loss": -20.112741470336914, "global_step": 58870, "epoch": 709} {"train_loss": -20.35249900817871, "global_step": 58871, "epoch": 709} {"train_loss": -20.458667755126953, "global_step": 58872, "epoch": 709} {"train_loss": -20.30818748474121, "global_step": 58873, "epoch": 709} {"train_loss": -20.552030563354492, "global_step": 58874, "epoch": 709} {"train_loss": -20.463232040405273, "global_step": 58875, "epoch": 709} {"train_loss": -20.21892547607422, "global_step": 58876, "epoch": 709} {"train_loss": -20.39639663696289, "global_step": 58877, "epoch": 709} {"train_loss": -20.242807388305664, "global_step": 58878, "epoch": 709} {"train_loss": -20.30140495300293, "global_step": 58879, "epoch": 709} {"train_loss": -20.382383346557617, "global_step": 58880, "epoch": 709} {"train_loss": -20.21237564086914, "global_step": 58881, "epoch": 709} {"train_loss": -20.09645652770996, "global_step": 58882, "epoch": 709} {"train_loss": -20.31947898864746, "global_step": 58883, "epoch": 709} {"train_loss": -20.035184860229492, "global_step": 58884, "epoch": 709} {"train_loss": -20.281021118164062, "global_step": 58885, "epoch": 709} {"train_loss": -20.442014694213867, "global_step": 58886, "epoch": 709} {"train_loss": -20.218364715576172, "global_step": 58887, "epoch": 709} {"train_loss": -20.286741256713867, "global_step": 58888, "epoch": 709} {"train_loss": -20.473907470703125, "global_step": 58889, "epoch": 709} {"train_loss": -20.127901077270508, "global_step": 58890, "epoch": 709} {"train_loss": -20.570524215698242, "global_step": 58891, "epoch": 709} {"train_loss": -20.59187126159668, "global_step": 58892, "epoch": 709} {"train_loss": -20.33841896057129, "global_step": 58893, "epoch": 709} {"train_loss": -20.411710739135742, "global_step": 58894, "epoch": 709} {"train_loss": -20.339017868041992, "global_step": 58895, "epoch": 709} {"train_loss": -20.320003509521484, "global_step": 58896, "epoch": 709} {"train_loss": -20.15821647644043, "global_step": 58897, "epoch": 709} {"train_loss": -20.293231964111328, "global_step": 58898, "epoch": 709} {"train_loss": -20.697853088378906, "global_step": 58899, "epoch": 709} {"train_loss": -20.740501403808594, "global_step": 58900, "epoch": 709} {"train_loss": -20.160585403442383, "global_step": 58901, "epoch": 709} {"train_loss": -20.331649780273438, "global_step": 58902, "epoch": 709} {"train_loss": -20.052549362182617, "global_step": 58903, "epoch": 709} {"train_loss": -20.1756534576416, "global_step": 58904, "epoch": 709} {"train_loss": -20.279935836791992, "global_step": 58905, "epoch": 709} {"train_loss": -20.328882217407227, "global_step": 58906, "epoch": 709} {"train_loss": -20.762229919433594, "global_step": 58907, "epoch": 709} {"train_loss": -20.26190757751465, "global_step": 58908, "epoch": 709} {"train_loss": -20.0037841796875, "global_step": 58909, "epoch": 709} {"train_loss": -20.133207321166992, "global_step": 58910, "epoch": 709} {"train_loss": -19.855409622192383, "global_step": 58911, "epoch": 709} {"train_loss": -20.320571899414062, "global_step": 58912, "epoch": 709} {"train_loss": -20.35725212097168, "global_step": 58913, "epoch": 709} {"train_loss": -20.399322509765625, "global_step": 58914, "epoch": 709} {"train_loss": -20.34504508972168, "global_step": 58915, "epoch": 709} {"train_loss": -20.577125549316406, "global_step": 58916, "epoch": 709} {"train_loss": -20.36817741394043, "global_step": 58917, "epoch": 709} {"train_loss": -20.101787567138672, "global_step": 58918, "epoch": 709} {"train_loss": -20.17530632019043, "global_step": 58919, "epoch": 709} {"train_loss": -20.079504013061523, "global_step": 58920, "epoch": 709} {"train_loss": -20.277246475219727, "global_step": 58921, "epoch": 709} {"train_loss": -20.563440322875977, "global_step": 58922, "epoch": 709} {"train_loss": -20.594602584838867, "global_step": 58923, "epoch": 709} {"train_loss": -20.237411499023438, "global_step": 58924, "epoch": 709} {"train_loss": -20.2462215423584, "global_step": 58925, "epoch": 709} {"train_loss": -20.673828125, "global_step": 58926, "epoch": 709} {"train_loss": -20.212955474853516, "global_step": 58927, "epoch": 709} {"train_loss": -20.31713104248047, "global_step": 58928, "epoch": 709} {"train_loss": -20.25721722338573, "global_step": 58929, "epoch": 709, "val_loss": 5981529.5} {"train_loss": -20.231103897094727, "global_step": 58930, "epoch": 710} {"train_loss": -20.0766544342041, "global_step": 58931, "epoch": 710} {"train_loss": -20.44220733642578, "global_step": 58932, "epoch": 710} {"train_loss": -19.947805404663086, "global_step": 58933, "epoch": 710} {"train_loss": -20.375682830810547, "global_step": 58934, "epoch": 710} {"train_loss": -20.14771842956543, "global_step": 58935, "epoch": 710} {"train_loss": -20.465360641479492, "global_step": 58936, "epoch": 710} {"train_loss": -20.2329044342041, "global_step": 58937, "epoch": 710} {"train_loss": -19.790863037109375, "global_step": 58938, "epoch": 710} {"train_loss": -20.00766944885254, "global_step": 58939, "epoch": 710} {"train_loss": -19.656539916992188, "global_step": 58940, "epoch": 710} {"train_loss": -20.00205421447754, "global_step": 58941, "epoch": 710} {"train_loss": -20.239459991455078, "global_step": 58942, "epoch": 710} {"train_loss": -20.38104248046875, "global_step": 58943, "epoch": 710} {"train_loss": -20.502309799194336, "global_step": 58944, "epoch": 710} {"train_loss": -20.216642379760742, "global_step": 58945, "epoch": 710} {"train_loss": -20.13356590270996, "global_step": 58946, "epoch": 710} {"train_loss": -20.209245681762695, "global_step": 58947, "epoch": 710} {"train_loss": -20.401464462280273, "global_step": 58948, "epoch": 710} {"train_loss": -20.48164939880371, "global_step": 58949, "epoch": 710} {"train_loss": -20.163822174072266, "global_step": 58950, "epoch": 710} {"train_loss": -20.3571834564209, "global_step": 58951, "epoch": 710} {"train_loss": -19.784664154052734, "global_step": 58952, "epoch": 710} {"train_loss": -20.290145874023438, "global_step": 58953, "epoch": 710} {"train_loss": -20.135313034057617, "global_step": 58954, "epoch": 710} {"train_loss": -20.378360748291016, "global_step": 58955, "epoch": 710} {"train_loss": -20.303878784179688, "global_step": 58956, "epoch": 710} {"train_loss": -20.263383865356445, "global_step": 58957, "epoch": 710} {"train_loss": -20.54409408569336, "global_step": 58958, "epoch": 710} {"train_loss": -20.55961036682129, "global_step": 58959, "epoch": 710} {"train_loss": -20.236347198486328, "global_step": 58960, "epoch": 710} {"train_loss": -20.208791732788086, "global_step": 58961, "epoch": 710} {"train_loss": -20.38921546936035, "global_step": 58962, "epoch": 710} {"train_loss": -20.53896141052246, "global_step": 58963, "epoch": 710} {"train_loss": -20.458194732666016, "global_step": 58964, "epoch": 710} {"train_loss": -20.380096435546875, "global_step": 58965, "epoch": 710} {"train_loss": -20.406213760375977, "global_step": 58966, "epoch": 710} {"train_loss": -20.271469116210938, "global_step": 58967, "epoch": 710} {"train_loss": -20.425872802734375, "global_step": 58968, "epoch": 710} {"train_loss": -20.411832809448242, "global_step": 58969, "epoch": 710} {"train_loss": -20.06015396118164, "global_step": 58970, "epoch": 710} {"train_loss": -20.331541061401367, "global_step": 58971, "epoch": 710} {"train_loss": -20.608646392822266, "global_step": 58972, "epoch": 710} {"train_loss": -20.44222068786621, "global_step": 58973, "epoch": 710} {"train_loss": -20.631103515625, "global_step": 58974, "epoch": 710} {"train_loss": -20.319849014282227, "global_step": 58975, "epoch": 710} {"train_loss": -20.132314682006836, "global_step": 58976, "epoch": 710} {"train_loss": -20.576303482055664, "global_step": 58977, "epoch": 710} {"train_loss": -20.700252532958984, "global_step": 58978, "epoch": 710} {"train_loss": -20.301563262939453, "global_step": 58979, "epoch": 710} {"train_loss": -20.71393585205078, "global_step": 58980, "epoch": 710} {"train_loss": -20.225330352783203, "global_step": 58981, "epoch": 710} {"train_loss": -20.49187469482422, "global_step": 58982, "epoch": 710} {"train_loss": -20.345094680786133, "global_step": 58983, "epoch": 710} {"train_loss": -20.47926139831543, "global_step": 58984, "epoch": 710} {"train_loss": -20.460798263549805, "global_step": 58985, "epoch": 710} {"train_loss": -20.303874969482422, "global_step": 58986, "epoch": 710} {"train_loss": -20.68294334411621, "global_step": 58987, "epoch": 710} {"train_loss": -20.29256820678711, "global_step": 58988, "epoch": 710} {"train_loss": -20.41440200805664, "global_step": 58989, "epoch": 710} {"train_loss": -20.373647689819336, "global_step": 58990, "epoch": 710} {"train_loss": -20.361488342285156, "global_step": 58991, "epoch": 710} {"train_loss": -20.205127716064453, "global_step": 58992, "epoch": 710} {"train_loss": -20.535919189453125, "global_step": 58993, "epoch": 710} {"train_loss": -20.44825553894043, "global_step": 58994, "epoch": 710} {"train_loss": -20.186100006103516, "global_step": 58995, "epoch": 710} {"train_loss": -20.381607055664062, "global_step": 58996, "epoch": 710} {"train_loss": -20.661422729492188, "global_step": 58997, "epoch": 710} {"train_loss": -20.2511043548584, "global_step": 58998, "epoch": 710} {"train_loss": -20.44621467590332, "global_step": 58999, "epoch": 710} {"train_loss": -20.792810440063477, "global_step": 59000, "epoch": 710} {"train_loss": -20.196245193481445, "global_step": 59001, "epoch": 710} {"train_loss": -20.242385864257812, "global_step": 59002, "epoch": 710} {"train_loss": -20.3422794342041, "global_step": 59003, "epoch": 710} {"train_loss": -20.26723289489746, "global_step": 59004, "epoch": 710} {"train_loss": -20.000757217407227, "global_step": 59005, "epoch": 710} {"train_loss": -20.321044921875, "global_step": 59006, "epoch": 710} {"train_loss": -20.205062866210938, "global_step": 59007, "epoch": 710} {"train_loss": -20.2431640625, "global_step": 59008, "epoch": 710} {"train_loss": -20.109806060791016, "global_step": 59009, "epoch": 710} {"train_loss": -20.85507583618164, "global_step": 59010, "epoch": 710} {"train_loss": -20.422914505004883, "global_step": 59011, "epoch": 710} {"train_loss": -20.319066564720796, "global_step": 59012, "epoch": 710, "val_loss": 5855641.5} {"train_loss": -20.412221908569336, "global_step": 59013, "epoch": 711} {"train_loss": -20.353900909423828, "global_step": 59014, "epoch": 711} {"train_loss": -20.317289352416992, "global_step": 59015, "epoch": 711} {"train_loss": -19.77374839782715, "global_step": 59016, "epoch": 711} {"train_loss": -20.062416076660156, "global_step": 59017, "epoch": 711} {"train_loss": -20.479490280151367, "global_step": 59018, "epoch": 711} {"train_loss": -20.296552658081055, "global_step": 59019, "epoch": 711} {"train_loss": -20.310039520263672, "global_step": 59020, "epoch": 711} {"train_loss": -20.427427291870117, "global_step": 59021, "epoch": 711} {"train_loss": -19.984825134277344, "global_step": 59022, "epoch": 711} {"train_loss": -20.239728927612305, "global_step": 59023, "epoch": 711} {"train_loss": -19.973642349243164, "global_step": 59024, "epoch": 711} {"train_loss": -19.98533058166504, "global_step": 59025, "epoch": 711} {"train_loss": -20.193552017211914, "global_step": 59026, "epoch": 711} {"train_loss": -20.34565544128418, "global_step": 59027, "epoch": 711} {"train_loss": -19.992542266845703, "global_step": 59028, "epoch": 711} {"train_loss": -19.965993881225586, "global_step": 59029, "epoch": 711} {"train_loss": -19.756765365600586, "global_step": 59030, "epoch": 711} {"train_loss": -20.33662986755371, "global_step": 59031, "epoch": 711} {"train_loss": -20.47869300842285, "global_step": 59032, "epoch": 711} {"train_loss": -20.114261627197266, "global_step": 59033, "epoch": 711} {"train_loss": -19.890859603881836, "global_step": 59034, "epoch": 711} {"train_loss": -20.29228401184082, "global_step": 59035, "epoch": 711} {"train_loss": -19.927244186401367, "global_step": 59036, "epoch": 711} {"train_loss": -20.188140869140625, "global_step": 59037, "epoch": 711} {"train_loss": -20.177209854125977, "global_step": 59038, "epoch": 711} {"train_loss": -20.148160934448242, "global_step": 59039, "epoch": 711} {"train_loss": -20.069990158081055, "global_step": 59040, "epoch": 711} {"train_loss": -20.28627586364746, "global_step": 59041, "epoch": 711} {"train_loss": -20.521982192993164, "global_step": 59042, "epoch": 711} {"train_loss": -19.9617919921875, "global_step": 59043, "epoch": 711} {"train_loss": -20.471343994140625, "global_step": 59044, "epoch": 711} {"train_loss": -20.244686126708984, "global_step": 59045, "epoch": 711} {"train_loss": -20.725269317626953, "global_step": 59046, "epoch": 711} {"train_loss": -20.47841453552246, "global_step": 59047, "epoch": 711} {"train_loss": -20.282751083374023, "global_step": 59048, "epoch": 711} {"train_loss": -20.2108211517334, "global_step": 59049, "epoch": 711} {"train_loss": -20.50922966003418, "global_step": 59050, "epoch": 711} {"train_loss": -20.461261749267578, "global_step": 59051, "epoch": 711} {"train_loss": -20.196462631225586, "global_step": 59052, "epoch": 711} {"train_loss": -20.289350509643555, "global_step": 59053, "epoch": 711} {"train_loss": -20.408660888671875, "global_step": 59054, "epoch": 711} {"train_loss": -20.455326080322266, "global_step": 59055, "epoch": 711} {"train_loss": -20.102802276611328, "global_step": 59056, "epoch": 711} {"train_loss": -20.420717239379883, "global_step": 59057, "epoch": 711} {"train_loss": -20.541868209838867, "global_step": 59058, "epoch": 711} {"train_loss": -20.048002243041992, "global_step": 59059, "epoch": 711} {"train_loss": -20.342267990112305, "global_step": 59060, "epoch": 711} {"train_loss": -20.41230010986328, "global_step": 59061, "epoch": 711} {"train_loss": -20.398298263549805, "global_step": 59062, "epoch": 711} {"train_loss": -20.535776138305664, "global_step": 59063, "epoch": 711} {"train_loss": -20.579011917114258, "global_step": 59064, "epoch": 711} {"train_loss": -20.429351806640625, "global_step": 59065, "epoch": 711} {"train_loss": -20.519521713256836, "global_step": 59066, "epoch": 711} {"train_loss": -20.35906219482422, "global_step": 59067, "epoch": 711} {"train_loss": -19.85551643371582, "global_step": 59068, "epoch": 711} {"train_loss": -20.325891494750977, "global_step": 59069, "epoch": 711} {"train_loss": -20.039152145385742, "global_step": 59070, "epoch": 711} {"train_loss": -20.252195358276367, "global_step": 59071, "epoch": 711} {"train_loss": -20.30402946472168, "global_step": 59072, "epoch": 711} {"train_loss": -20.595609664916992, "global_step": 59073, "epoch": 711} {"train_loss": -20.287195205688477, "global_step": 59074, "epoch": 711} {"train_loss": -20.738405227661133, "global_step": 59075, "epoch": 711} {"train_loss": -20.265472412109375, "global_step": 59076, "epoch": 711} {"train_loss": -19.98198699951172, "global_step": 59077, "epoch": 711} {"train_loss": -20.40174674987793, "global_step": 59078, "epoch": 711} {"train_loss": -20.50901222229004, "global_step": 59079, "epoch": 711} {"train_loss": -20.445648193359375, "global_step": 59080, "epoch": 711} {"train_loss": -20.382095336914062, "global_step": 59081, "epoch": 711} {"train_loss": -20.26462173461914, "global_step": 59082, "epoch": 711} {"train_loss": -20.623971939086914, "global_step": 59083, "epoch": 711} {"train_loss": -20.377368927001953, "global_step": 59084, "epoch": 711} {"train_loss": -19.812965393066406, "global_step": 59085, "epoch": 711} {"train_loss": -20.269065856933594, "global_step": 59086, "epoch": 711} {"train_loss": -20.253103256225586, "global_step": 59087, "epoch": 711} {"train_loss": -20.377965927124023, "global_step": 59088, "epoch": 711} {"train_loss": -20.39980125427246, "global_step": 59089, "epoch": 711} {"train_loss": -20.479528427124023, "global_step": 59090, "epoch": 711} {"train_loss": -20.51369285583496, "global_step": 59091, "epoch": 711} {"train_loss": -20.249706268310547, "global_step": 59092, "epoch": 711} {"train_loss": -20.542783737182617, "global_step": 59093, "epoch": 711} {"train_loss": -20.26202964782715, "global_step": 59094, "epoch": 711} {"train_loss": -20.286436494574488, "global_step": 59095, "epoch": 711, "val_loss": 6061744.5} {"train_loss": -19.770376205444336, "global_step": 59096, "epoch": 712} {"train_loss": -20.30914878845215, "global_step": 59097, "epoch": 712} {"train_loss": -20.416717529296875, "global_step": 59098, "epoch": 712} {"train_loss": -20.026288986206055, "global_step": 59099, "epoch": 712} {"train_loss": -20.290311813354492, "global_step": 59100, "epoch": 712} {"train_loss": -20.2534236907959, "global_step": 59101, "epoch": 712} {"train_loss": -20.271167755126953, "global_step": 59102, "epoch": 712} {"train_loss": -19.876440048217773, "global_step": 59103, "epoch": 712} {"train_loss": -19.898780822753906, "global_step": 59104, "epoch": 712} {"train_loss": -20.02193832397461, "global_step": 59105, "epoch": 712} {"train_loss": -20.23053550720215, "global_step": 59106, "epoch": 712} {"train_loss": -20.399580001831055, "global_step": 59107, "epoch": 712} {"train_loss": -19.887563705444336, "global_step": 59108, "epoch": 712} {"train_loss": -20.045812606811523, "global_step": 59109, "epoch": 712} {"train_loss": -20.42233657836914, "global_step": 59110, "epoch": 712} {"train_loss": -20.461868286132812, "global_step": 59111, "epoch": 712} {"train_loss": -20.36610221862793, "global_step": 59112, "epoch": 712} {"train_loss": -20.279361724853516, "global_step": 59113, "epoch": 712} {"train_loss": -20.34041404724121, "global_step": 59114, "epoch": 712} {"train_loss": -20.220701217651367, "global_step": 59115, "epoch": 712} {"train_loss": -20.355588912963867, "global_step": 59116, "epoch": 712} {"train_loss": -19.8568172454834, "global_step": 59117, "epoch": 712} {"train_loss": -20.687122344970703, "global_step": 59118, "epoch": 712} {"train_loss": -20.311948776245117, "global_step": 59119, "epoch": 712} {"train_loss": -20.431119918823242, "global_step": 59120, "epoch": 712} {"train_loss": -20.609766006469727, "global_step": 59121, "epoch": 712} {"train_loss": -20.128751754760742, "global_step": 59122, "epoch": 712} {"train_loss": -20.353172302246094, "global_step": 59123, "epoch": 712} {"train_loss": -20.328414916992188, "global_step": 59124, "epoch": 712} {"train_loss": -20.206998825073242, "global_step": 59125, "epoch": 712} {"train_loss": -20.429903030395508, "global_step": 59126, "epoch": 712} {"train_loss": -20.551523208618164, "global_step": 59127, "epoch": 712} {"train_loss": -20.466638565063477, "global_step": 59128, "epoch": 712} {"train_loss": -20.455387115478516, "global_step": 59129, "epoch": 712} {"train_loss": -20.61982536315918, "global_step": 59130, "epoch": 712} {"train_loss": -20.374469757080078, "global_step": 59131, "epoch": 712} {"train_loss": -20.56342887878418, "global_step": 59132, "epoch": 712} {"train_loss": -20.322776794433594, "global_step": 59133, "epoch": 712} {"train_loss": -20.434274673461914, "global_step": 59134, "epoch": 712} {"train_loss": -20.283140182495117, "global_step": 59135, "epoch": 712} {"train_loss": -20.96588134765625, "global_step": 59136, "epoch": 712} {"train_loss": -20.62026023864746, "global_step": 59137, "epoch": 712} {"train_loss": -19.95895004272461, "global_step": 59138, "epoch": 712} {"train_loss": -20.311782836914062, "global_step": 59139, "epoch": 712} {"train_loss": -20.168859481811523, "global_step": 59140, "epoch": 712} {"train_loss": -20.266010284423828, "global_step": 59141, "epoch": 712} {"train_loss": -20.237794876098633, "global_step": 59142, "epoch": 712} {"train_loss": -20.164037704467773, "global_step": 59143, "epoch": 712} {"train_loss": -20.29082679748535, "global_step": 59144, "epoch": 712} {"train_loss": -20.33099365234375, "global_step": 59145, "epoch": 712} {"train_loss": -20.386615753173828, "global_step": 59146, "epoch": 712} {"train_loss": -20.20069122314453, "global_step": 59147, "epoch": 712} {"train_loss": -20.10921287536621, "global_step": 59148, "epoch": 712} {"train_loss": -20.298086166381836, "global_step": 59149, "epoch": 712} {"train_loss": -20.48123550415039, "global_step": 59150, "epoch": 712} {"train_loss": -20.43134117126465, "global_step": 59151, "epoch": 712} {"train_loss": -20.49798583984375, "global_step": 59152, "epoch": 712} {"train_loss": -20.46337890625, "global_step": 59153, "epoch": 712} {"train_loss": -20.143613815307617, "global_step": 59154, "epoch": 712} {"train_loss": -20.57893943786621, "global_step": 59155, "epoch": 712} {"train_loss": -20.101497650146484, "global_step": 59156, "epoch": 712} {"train_loss": -20.253931045532227, "global_step": 59157, "epoch": 712} {"train_loss": -20.53291893005371, "global_step": 59158, "epoch": 712} {"train_loss": -20.008955001831055, "global_step": 59159, "epoch": 712} {"train_loss": -20.214115142822266, "global_step": 59160, "epoch": 712} {"train_loss": -20.139005661010742, "global_step": 59161, "epoch": 712} {"train_loss": -20.338369369506836, "global_step": 59162, "epoch": 712} {"train_loss": -20.7197322845459, "global_step": 59163, "epoch": 712} {"train_loss": -20.331287384033203, "global_step": 59164, "epoch": 712} {"train_loss": -20.31133460998535, "global_step": 59165, "epoch": 712} {"train_loss": -20.131179809570312, "global_step": 59166, "epoch": 712} {"train_loss": -20.53639030456543, "global_step": 59167, "epoch": 712} {"train_loss": -20.080551147460938, "global_step": 59168, "epoch": 712} {"train_loss": -20.147432327270508, "global_step": 59169, "epoch": 712} {"train_loss": -20.62526512145996, "global_step": 59170, "epoch": 712} {"train_loss": -20.577878952026367, "global_step": 59171, "epoch": 712} {"train_loss": -20.19118309020996, "global_step": 59172, "epoch": 712} {"train_loss": -20.788284301757812, "global_step": 59173, "epoch": 712} {"train_loss": -20.518705368041992, "global_step": 59174, "epoch": 712} {"train_loss": -20.3519229888916, "global_step": 59175, "epoch": 712} {"train_loss": -20.17328453063965, "global_step": 59176, "epoch": 712} {"train_loss": -20.26607894897461, "global_step": 59177, "epoch": 712} {"train_loss": -20.308097632534533, "global_step": 59178, "epoch": 712, "val_loss": 5955943.0} {"train_loss": -20.19047737121582, "global_step": 59179, "epoch": 713} {"train_loss": -20.136884689331055, "global_step": 59180, "epoch": 713} {"train_loss": -20.24050521850586, "global_step": 59181, "epoch": 713} {"train_loss": -20.477638244628906, "global_step": 59182, "epoch": 713} {"train_loss": -19.78424644470215, "global_step": 59183, "epoch": 713} {"train_loss": -20.26378059387207, "global_step": 59184, "epoch": 713} {"train_loss": -20.319005966186523, "global_step": 59185, "epoch": 713} {"train_loss": -19.91090965270996, "global_step": 59186, "epoch": 713} {"train_loss": -20.242856979370117, "global_step": 59187, "epoch": 713} {"train_loss": -20.33085823059082, "global_step": 59188, "epoch": 713} {"train_loss": -20.15528678894043, "global_step": 59189, "epoch": 713} {"train_loss": -20.215444564819336, "global_step": 59190, "epoch": 713} {"train_loss": -20.65596580505371, "global_step": 59191, "epoch": 713} {"train_loss": -20.192087173461914, "global_step": 59192, "epoch": 713} {"train_loss": -20.24810218811035, "global_step": 59193, "epoch": 713} {"train_loss": -20.08884048461914, "global_step": 59194, "epoch": 713} {"train_loss": -20.491559982299805, "global_step": 59195, "epoch": 713} {"train_loss": -20.41877555847168, "global_step": 59196, "epoch": 713} {"train_loss": -20.491260528564453, "global_step": 59197, "epoch": 713} {"train_loss": -20.364208221435547, "global_step": 59198, "epoch": 713} {"train_loss": -20.428632736206055, "global_step": 59199, "epoch": 713} {"train_loss": -19.912612915039062, "global_step": 59200, "epoch": 713} {"train_loss": -20.526260375976562, "global_step": 59201, "epoch": 713} {"train_loss": -20.477529525756836, "global_step": 59202, "epoch": 713} {"train_loss": -20.21888542175293, "global_step": 59203, "epoch": 713} {"train_loss": -20.485416412353516, "global_step": 59204, "epoch": 713} {"train_loss": -20.264610290527344, "global_step": 59205, "epoch": 713} {"train_loss": -20.61260986328125, "global_step": 59206, "epoch": 713} {"train_loss": -20.316604614257812, "global_step": 59207, "epoch": 713} {"train_loss": -20.365249633789062, "global_step": 59208, "epoch": 713} {"train_loss": -20.496801376342773, "global_step": 59209, "epoch": 713} {"train_loss": -20.254850387573242, "global_step": 59210, "epoch": 713} {"train_loss": -20.459075927734375, "global_step": 59211, "epoch": 713} {"train_loss": -20.592573165893555, "global_step": 59212, "epoch": 713} {"train_loss": -20.475339889526367, "global_step": 59213, "epoch": 713} {"train_loss": -20.672407150268555, "global_step": 59214, "epoch": 713} {"train_loss": -20.5478572845459, "global_step": 59215, "epoch": 713} {"train_loss": -20.22964096069336, "global_step": 59216, "epoch": 713} {"train_loss": -20.346664428710938, "global_step": 59217, "epoch": 713} {"train_loss": -20.3807373046875, "global_step": 59218, "epoch": 713} {"train_loss": -20.394620895385742, "global_step": 59219, "epoch": 713} {"train_loss": -20.59967041015625, "global_step": 59220, "epoch": 713} {"train_loss": -20.62519645690918, "global_step": 59221, "epoch": 713} {"train_loss": -20.367494583129883, "global_step": 59222, "epoch": 713} {"train_loss": -20.176713943481445, "global_step": 59223, "epoch": 713} {"train_loss": -20.230947494506836, "global_step": 59224, "epoch": 713} {"train_loss": -20.219099044799805, "global_step": 59225, "epoch": 713} {"train_loss": -20.716594696044922, "global_step": 59226, "epoch": 713} {"train_loss": -20.387699127197266, "global_step": 59227, "epoch": 713} {"train_loss": -20.304473876953125, "global_step": 59228, "epoch": 713} {"train_loss": -20.33759880065918, "global_step": 59229, "epoch": 713} {"train_loss": -20.508634567260742, "global_step": 59230, "epoch": 713} {"train_loss": -20.521709442138672, "global_step": 59231, "epoch": 713} {"train_loss": -20.392911911010742, "global_step": 59232, "epoch": 713} {"train_loss": -20.14146614074707, "global_step": 59233, "epoch": 713} {"train_loss": -20.730487823486328, "global_step": 59234, "epoch": 713} {"train_loss": -20.433441162109375, "global_step": 59235, "epoch": 713} {"train_loss": -20.442964553833008, "global_step": 59236, "epoch": 713} {"train_loss": -20.35064697265625, "global_step": 59237, "epoch": 713} {"train_loss": -20.44944190979004, "global_step": 59238, "epoch": 713} {"train_loss": -20.174030303955078, "global_step": 59239, "epoch": 713} {"train_loss": -20.416217803955078, "global_step": 59240, "epoch": 713} {"train_loss": -20.12123680114746, "global_step": 59241, "epoch": 713} {"train_loss": -20.055509567260742, "global_step": 59242, "epoch": 713} {"train_loss": -20.54039192199707, "global_step": 59243, "epoch": 713} {"train_loss": -20.45765495300293, "global_step": 59244, "epoch": 713} {"train_loss": -20.681873321533203, "global_step": 59245, "epoch": 713} {"train_loss": -20.528379440307617, "global_step": 59246, "epoch": 713} {"train_loss": -20.3349666595459, "global_step": 59247, "epoch": 713} {"train_loss": -20.420928955078125, "global_step": 59248, "epoch": 713} {"train_loss": -20.456647872924805, "global_step": 59249, "epoch": 713} {"train_loss": -20.49359893798828, "global_step": 59250, "epoch": 713} {"train_loss": -20.27667999267578, "global_step": 59251, "epoch": 713} {"train_loss": -20.709630966186523, "global_step": 59252, "epoch": 713} {"train_loss": -20.674863815307617, "global_step": 59253, "epoch": 713} {"train_loss": -20.577194213867188, "global_step": 59254, "epoch": 713} {"train_loss": -20.218854904174805, "global_step": 59255, "epoch": 713} {"train_loss": -20.358768463134766, "global_step": 59256, "epoch": 713} {"train_loss": -20.385221481323242, "global_step": 59257, "epoch": 713} {"train_loss": -20.36896324157715, "global_step": 59258, "epoch": 713} {"train_loss": -20.58587646484375, "global_step": 59259, "epoch": 713} {"train_loss": -19.966398239135742, "global_step": 59260, "epoch": 713} {"train_loss": -20.37560485931764, "global_step": 59261, "epoch": 713, "val_loss": 6089951.5} {"train_loss": -19.98046875, "global_step": 59262, "epoch": 714} {"train_loss": -19.7705135345459, "global_step": 59263, "epoch": 714} {"train_loss": -19.624637603759766, "global_step": 59264, "epoch": 714} {"train_loss": -20.041696548461914, "global_step": 59265, "epoch": 714} {"train_loss": -20.070798873901367, "global_step": 59266, "epoch": 714} {"train_loss": -20.038509368896484, "global_step": 59267, "epoch": 714} {"train_loss": -19.923507690429688, "global_step": 59268, "epoch": 714} {"train_loss": -19.855697631835938, "global_step": 59269, "epoch": 714} {"train_loss": -19.82689094543457, "global_step": 59270, "epoch": 714} {"train_loss": -19.806509017944336, "global_step": 59271, "epoch": 714} {"train_loss": -20.034215927124023, "global_step": 59272, "epoch": 714} {"train_loss": -19.92445182800293, "global_step": 59273, "epoch": 714} {"train_loss": -20.162981033325195, "global_step": 59274, "epoch": 714} {"train_loss": -20.014877319335938, "global_step": 59275, "epoch": 714} {"train_loss": -20.264545440673828, "global_step": 59276, "epoch": 714} {"train_loss": -20.267457962036133, "global_step": 59277, "epoch": 714} {"train_loss": -20.101003646850586, "global_step": 59278, "epoch": 714} {"train_loss": -20.537109375, "global_step": 59279, "epoch": 714} {"train_loss": -20.09171485900879, "global_step": 59280, "epoch": 714} {"train_loss": -20.289447784423828, "global_step": 59281, "epoch": 714} {"train_loss": -20.279821395874023, "global_step": 59282, "epoch": 714} {"train_loss": -20.449846267700195, "global_step": 59283, "epoch": 714} {"train_loss": -20.382654190063477, "global_step": 59284, "epoch": 714} {"train_loss": -20.174890518188477, "global_step": 59285, "epoch": 714} {"train_loss": -20.28681755065918, "global_step": 59286, "epoch": 714} {"train_loss": -20.43106460571289, "global_step": 59287, "epoch": 714} {"train_loss": -20.1696834564209, "global_step": 59288, "epoch": 714} {"train_loss": -20.304609298706055, "global_step": 59289, "epoch": 714} {"train_loss": -20.250757217407227, "global_step": 59290, "epoch": 714} {"train_loss": -20.624967575073242, "global_step": 59291, "epoch": 714} {"train_loss": -20.442672729492188, "global_step": 59292, "epoch": 714} {"train_loss": -20.36243438720703, "global_step": 59293, "epoch": 714} {"train_loss": -20.136341094970703, "global_step": 59294, "epoch": 714} {"train_loss": -20.235502243041992, "global_step": 59295, "epoch": 714} {"train_loss": -20.452014923095703, "global_step": 59296, "epoch": 714} {"train_loss": -20.173185348510742, "global_step": 59297, "epoch": 714} {"train_loss": -20.31002426147461, "global_step": 59298, "epoch": 714} {"train_loss": -20.170734405517578, "global_step": 59299, "epoch": 714} {"train_loss": -20.196971893310547, "global_step": 59300, "epoch": 714} {"train_loss": -20.407211303710938, "global_step": 59301, "epoch": 714} {"train_loss": -20.442184448242188, "global_step": 59302, "epoch": 714} {"train_loss": -20.361257553100586, "global_step": 59303, "epoch": 714} {"train_loss": -20.667146682739258, "global_step": 59304, "epoch": 714} {"train_loss": -20.168424606323242, "global_step": 59305, "epoch": 714} {"train_loss": -20.386167526245117, "global_step": 59306, "epoch": 714} {"train_loss": -20.525634765625, "global_step": 59307, "epoch": 714} {"train_loss": -20.223478317260742, "global_step": 59308, "epoch": 714} {"train_loss": -20.520919799804688, "global_step": 59309, "epoch": 714} {"train_loss": -20.508304595947266, "global_step": 59310, "epoch": 714} {"train_loss": -20.48383140563965, "global_step": 59311, "epoch": 714} {"train_loss": -20.172941207885742, "global_step": 59312, "epoch": 714} {"train_loss": -20.315052032470703, "global_step": 59313, "epoch": 714} {"train_loss": -20.159330368041992, "global_step": 59314, "epoch": 714} {"train_loss": -20.270353317260742, "global_step": 59315, "epoch": 714} {"train_loss": -20.32523536682129, "global_step": 59316, "epoch": 714} {"train_loss": -20.755277633666992, "global_step": 59317, "epoch": 714} {"train_loss": -20.302465438842773, "global_step": 59318, "epoch": 714} {"train_loss": -20.464099884033203, "global_step": 59319, "epoch": 714} {"train_loss": -20.250356674194336, "global_step": 59320, "epoch": 714} {"train_loss": -20.194583892822266, "global_step": 59321, "epoch": 714} {"train_loss": -20.145618438720703, "global_step": 59322, "epoch": 714} {"train_loss": -20.472097396850586, "global_step": 59323, "epoch": 714} {"train_loss": -19.884340286254883, "global_step": 59324, "epoch": 714} {"train_loss": -20.614492416381836, "global_step": 59325, "epoch": 714} {"train_loss": -20.37717056274414, "global_step": 59326, "epoch": 714} {"train_loss": -20.26297950744629, "global_step": 59327, "epoch": 714} {"train_loss": -20.335525512695312, "global_step": 59328, "epoch": 714} {"train_loss": -20.146255493164062, "global_step": 59329, "epoch": 714} {"train_loss": -20.467599868774414, "global_step": 59330, "epoch": 714} {"train_loss": -20.141143798828125, "global_step": 59331, "epoch": 714} {"train_loss": -20.501432418823242, "global_step": 59332, "epoch": 714} {"train_loss": -20.047842025756836, "global_step": 59333, "epoch": 714} {"train_loss": -20.016704559326172, "global_step": 59334, "epoch": 714} {"train_loss": -20.262615203857422, "global_step": 59335, "epoch": 714} {"train_loss": -20.371618270874023, "global_step": 59336, "epoch": 714} {"train_loss": -20.134748458862305, "global_step": 59337, "epoch": 714} {"train_loss": -20.49605941772461, "global_step": 59338, "epoch": 714} {"train_loss": -20.491308212280273, "global_step": 59339, "epoch": 714} {"train_loss": -20.455421447753906, "global_step": 59340, "epoch": 714} {"train_loss": -20.291173934936523, "global_step": 59341, "epoch": 714} {"train_loss": -20.4298038482666, "global_step": 59342, "epoch": 714} {"train_loss": -20.381818771362305, "global_step": 59343, "epoch": 714} {"train_loss": -20.27062857294657, "global_step": 59344, "epoch": 714, "val_loss": 5861504.0} {"train_loss": -19.823057174682617, "global_step": 59345, "epoch": 715} {"train_loss": -20.174619674682617, "global_step": 59346, "epoch": 715} {"train_loss": -20.07063102722168, "global_step": 59347, "epoch": 715} {"train_loss": -20.53474998474121, "global_step": 59348, "epoch": 715} {"train_loss": -20.511457443237305, "global_step": 59349, "epoch": 715} {"train_loss": -20.040851593017578, "global_step": 59350, "epoch": 715} {"train_loss": -20.348539352416992, "global_step": 59351, "epoch": 715} {"train_loss": -20.00554847717285, "global_step": 59352, "epoch": 715} {"train_loss": -20.6121768951416, "global_step": 59353, "epoch": 715} {"train_loss": -20.308277130126953, "global_step": 59354, "epoch": 715} {"train_loss": -20.520313262939453, "global_step": 59355, "epoch": 715} {"train_loss": -20.28226089477539, "global_step": 59356, "epoch": 715} {"train_loss": -20.188400268554688, "global_step": 59357, "epoch": 715} {"train_loss": -20.18873405456543, "global_step": 59358, "epoch": 715} {"train_loss": -20.574359893798828, "global_step": 59359, "epoch": 715} {"train_loss": -20.522199630737305, "global_step": 59360, "epoch": 715} {"train_loss": -20.220230102539062, "global_step": 59361, "epoch": 715} {"train_loss": -20.384613037109375, "global_step": 59362, "epoch": 715} {"train_loss": -20.28753089904785, "global_step": 59363, "epoch": 715} {"train_loss": -20.44379234313965, "global_step": 59364, "epoch": 715} {"train_loss": -20.218997955322266, "global_step": 59365, "epoch": 715} {"train_loss": -20.25899887084961, "global_step": 59366, "epoch": 715} {"train_loss": -20.409210205078125, "global_step": 59367, "epoch": 715} {"train_loss": -20.3590145111084, "global_step": 59368, "epoch": 715} {"train_loss": -20.28021812438965, "global_step": 59369, "epoch": 715} {"train_loss": -20.600866317749023, "global_step": 59370, "epoch": 715} {"train_loss": -20.595279693603516, "global_step": 59371, "epoch": 715} {"train_loss": -20.078201293945312, "global_step": 59372, "epoch": 715} {"train_loss": -20.499664306640625, "global_step": 59373, "epoch": 715} {"train_loss": -20.34532928466797, "global_step": 59374, "epoch": 715} {"train_loss": -20.342859268188477, "global_step": 59375, "epoch": 715} {"train_loss": -20.672876358032227, "global_step": 59376, "epoch": 715} {"train_loss": -20.622539520263672, "global_step": 59377, "epoch": 715} {"train_loss": -20.497648239135742, "global_step": 59378, "epoch": 715} {"train_loss": -20.305585861206055, "global_step": 59379, "epoch": 715} {"train_loss": -20.38711929321289, "global_step": 59380, "epoch": 715} {"train_loss": -19.960935592651367, "global_step": 59381, "epoch": 715} {"train_loss": -20.031641006469727, "global_step": 59382, "epoch": 715} {"train_loss": -20.67777442932129, "global_step": 59383, "epoch": 715} {"train_loss": -19.9816837310791, "global_step": 59384, "epoch": 715} {"train_loss": -20.487430572509766, "global_step": 59385, "epoch": 715} {"train_loss": -20.580848693847656, "global_step": 59386, "epoch": 715} {"train_loss": -20.259408950805664, "global_step": 59387, "epoch": 715} {"train_loss": -20.588218688964844, "global_step": 59388, "epoch": 715} {"train_loss": -20.57839012145996, "global_step": 59389, "epoch": 715} {"train_loss": -20.2966365814209, "global_step": 59390, "epoch": 715} {"train_loss": -20.39314842224121, "global_step": 59391, "epoch": 715} {"train_loss": -20.18387222290039, "global_step": 59392, "epoch": 715} {"train_loss": -20.01642608642578, "global_step": 59393, "epoch": 715} {"train_loss": -20.467634201049805, "global_step": 59394, "epoch": 715} {"train_loss": -20.587242126464844, "global_step": 59395, "epoch": 715} {"train_loss": -20.504199981689453, "global_step": 59396, "epoch": 715} {"train_loss": -20.24738883972168, "global_step": 59397, "epoch": 715} {"train_loss": -20.471078872680664, "global_step": 59398, "epoch": 715} {"train_loss": -20.232179641723633, "global_step": 59399, "epoch": 715} {"train_loss": -20.089557647705078, "global_step": 59400, "epoch": 715} {"train_loss": -20.59267234802246, "global_step": 59401, "epoch": 715} {"train_loss": -20.36642074584961, "global_step": 59402, "epoch": 715} {"train_loss": -20.46436882019043, "global_step": 59403, "epoch": 715} {"train_loss": -20.122251510620117, "global_step": 59404, "epoch": 715} {"train_loss": -20.566892623901367, "global_step": 59405, "epoch": 715} {"train_loss": -20.2255916595459, "global_step": 59406, "epoch": 715} {"train_loss": -20.461706161499023, "global_step": 59407, "epoch": 715} {"train_loss": -20.507604598999023, "global_step": 59408, "epoch": 715} {"train_loss": -20.363157272338867, "global_step": 59409, "epoch": 715} {"train_loss": -20.267107009887695, "global_step": 59410, "epoch": 715} {"train_loss": -20.524391174316406, "global_step": 59411, "epoch": 715} {"train_loss": -20.72950553894043, "global_step": 59412, "epoch": 715} {"train_loss": -20.710716247558594, "global_step": 59413, "epoch": 715} {"train_loss": -20.255849838256836, "global_step": 59414, "epoch": 715} {"train_loss": -20.716249465942383, "global_step": 59415, "epoch": 715} {"train_loss": -20.958402633666992, "global_step": 59416, "epoch": 715} {"train_loss": -20.427762985229492, "global_step": 59417, "epoch": 715} {"train_loss": -20.5436954498291, "global_step": 59418, "epoch": 715} {"train_loss": -20.592201232910156, "global_step": 59419, "epoch": 715} {"train_loss": -20.0621337890625, "global_step": 59420, "epoch": 715} {"train_loss": -20.19356346130371, "global_step": 59421, "epoch": 715} {"train_loss": -20.60176658630371, "global_step": 59422, "epoch": 715} {"train_loss": -20.396902084350586, "global_step": 59423, "epoch": 715} {"train_loss": -20.398693084716797, "global_step": 59424, "epoch": 715} {"train_loss": -20.12398338317871, "global_step": 59425, "epoch": 715} {"train_loss": -20.402313232421875, "global_step": 59426, "epoch": 715} {"train_loss": -20.374801268060523, "global_step": 59427, "epoch": 715, "val_loss": 5897572.0} {"train_loss": -18.616724014282227, "global_step": 59428, "epoch": 716} {"train_loss": -18.128530502319336, "global_step": 59429, "epoch": 716} {"train_loss": -19.399396896362305, "global_step": 59430, "epoch": 716} {"train_loss": -19.265295028686523, "global_step": 59431, "epoch": 716} {"train_loss": -19.44329833984375, "global_step": 59432, "epoch": 716} {"train_loss": -19.61170768737793, "global_step": 59433, "epoch": 716} {"train_loss": -19.5858211517334, "global_step": 59434, "epoch": 716} {"train_loss": -19.475971221923828, "global_step": 59435, "epoch": 716} {"train_loss": -19.399030685424805, "global_step": 59436, "epoch": 716} {"train_loss": -19.76240348815918, "global_step": 59437, "epoch": 716} {"train_loss": -20.247983932495117, "global_step": 59438, "epoch": 716} {"train_loss": -20.12029457092285, "global_step": 59439, "epoch": 716} {"train_loss": -19.7830753326416, "global_step": 59440, "epoch": 716} {"train_loss": -19.564321517944336, "global_step": 59441, "epoch": 716} {"train_loss": -19.71120262145996, "global_step": 59442, "epoch": 716} {"train_loss": -19.728960037231445, "global_step": 59443, "epoch": 716} {"train_loss": -20.39275550842285, "global_step": 59444, "epoch": 716} {"train_loss": -20.344675064086914, "global_step": 59445, "epoch": 716} {"train_loss": -19.91524314880371, "global_step": 59446, "epoch": 716} {"train_loss": -19.8679141998291, "global_step": 59447, "epoch": 716} {"train_loss": -19.67940330505371, "global_step": 59448, "epoch": 716} {"train_loss": -19.64811134338379, "global_step": 59449, "epoch": 716} {"train_loss": -20.245861053466797, "global_step": 59450, "epoch": 716} {"train_loss": -20.249980926513672, "global_step": 59451, "epoch": 716} {"train_loss": -19.866424560546875, "global_step": 59452, "epoch": 716} {"train_loss": -19.875797271728516, "global_step": 59453, "epoch": 716} {"train_loss": -19.8726863861084, "global_step": 59454, "epoch": 716} {"train_loss": -19.858911514282227, "global_step": 59455, "epoch": 716} {"train_loss": -20.3045711517334, "global_step": 59456, "epoch": 716} {"train_loss": -20.340864181518555, "global_step": 59457, "epoch": 716} {"train_loss": -19.935890197753906, "global_step": 59458, "epoch": 716} {"train_loss": -20.364439010620117, "global_step": 59459, "epoch": 716} {"train_loss": -20.225114822387695, "global_step": 59460, "epoch": 716} {"train_loss": -20.134008407592773, "global_step": 59461, "epoch": 716} {"train_loss": -20.218719482421875, "global_step": 59462, "epoch": 716} {"train_loss": -20.228012084960938, "global_step": 59463, "epoch": 716} {"train_loss": -20.263395309448242, "global_step": 59464, "epoch": 716} {"train_loss": -20.48678970336914, "global_step": 59465, "epoch": 716} {"train_loss": -20.362462997436523, "global_step": 59466, "epoch": 716} {"train_loss": -20.30031394958496, "global_step": 59467, "epoch": 716} {"train_loss": -20.352773666381836, "global_step": 59468, "epoch": 716} {"train_loss": -20.366886138916016, "global_step": 59469, "epoch": 716} {"train_loss": -20.32893943786621, "global_step": 59470, "epoch": 716} {"train_loss": -20.268352508544922, "global_step": 59471, "epoch": 716} {"train_loss": -20.36818504333496, "global_step": 59472, "epoch": 716} {"train_loss": -20.41193199157715, "global_step": 59473, "epoch": 716} {"train_loss": -20.23731803894043, "global_step": 59474, "epoch": 716} {"train_loss": -20.014724731445312, "global_step": 59475, "epoch": 716} {"train_loss": -20.07377052307129, "global_step": 59476, "epoch": 716} {"train_loss": -20.478872299194336, "global_step": 59477, "epoch": 716} {"train_loss": -20.260936737060547, "global_step": 59478, "epoch": 716} {"train_loss": -20.297489166259766, "global_step": 59479, "epoch": 716} {"train_loss": -19.8004207611084, "global_step": 59480, "epoch": 716} {"train_loss": -20.13296890258789, "global_step": 59481, "epoch": 716} {"train_loss": -20.522613525390625, "global_step": 59482, "epoch": 716} {"train_loss": -20.29671287536621, "global_step": 59483, "epoch": 716} {"train_loss": -20.250051498413086, "global_step": 59484, "epoch": 716} {"train_loss": -20.156320571899414, "global_step": 59485, "epoch": 716} {"train_loss": -20.334945678710938, "global_step": 59486, "epoch": 716} {"train_loss": -20.260190963745117, "global_step": 59487, "epoch": 716} {"train_loss": -20.403982162475586, "global_step": 59488, "epoch": 716} {"train_loss": -20.405912399291992, "global_step": 59489, "epoch": 716} {"train_loss": -20.10887336730957, "global_step": 59490, "epoch": 716} {"train_loss": -20.47023582458496, "global_step": 59491, "epoch": 716} {"train_loss": -20.241491317749023, "global_step": 59492, "epoch": 716} {"train_loss": -20.504642486572266, "global_step": 59493, "epoch": 716} {"train_loss": -20.610971450805664, "global_step": 59494, "epoch": 716} {"train_loss": -20.483692169189453, "global_step": 59495, "epoch": 716} {"train_loss": -20.247817993164062, "global_step": 59496, "epoch": 716} {"train_loss": -20.18299102783203, "global_step": 59497, "epoch": 716} {"train_loss": -20.56804847717285, "global_step": 59498, "epoch": 716} {"train_loss": -20.592817306518555, "global_step": 59499, "epoch": 716} {"train_loss": -20.27405548095703, "global_step": 59500, "epoch": 716} {"train_loss": -20.388296127319336, "global_step": 59501, "epoch": 716} {"train_loss": -19.989755630493164, "global_step": 59502, "epoch": 716} {"train_loss": -20.760862350463867, "global_step": 59503, "epoch": 716} {"train_loss": -20.336400985717773, "global_step": 59504, "epoch": 716} {"train_loss": -20.741926193237305, "global_step": 59505, "epoch": 716} {"train_loss": -20.789941787719727, "global_step": 59506, "epoch": 716} {"train_loss": -20.290498733520508, "global_step": 59507, "epoch": 716} {"train_loss": -20.55939292907715, "global_step": 59508, "epoch": 716} {"train_loss": -20.168914794921875, "global_step": 59509, "epoch": 716} {"train_loss": -20.119604983961725, "global_step": 59510, "epoch": 716, "val_loss": 5900946.0} {"train_loss": -19.98985481262207, "global_step": 59511, "epoch": 717} {"train_loss": -20.90870475769043, "global_step": 59512, "epoch": 717} {"train_loss": -19.81822967529297, "global_step": 59513, "epoch": 717} {"train_loss": -20.183134078979492, "global_step": 59514, "epoch": 717} {"train_loss": -20.344589233398438, "global_step": 59515, "epoch": 717} {"train_loss": -20.62629508972168, "global_step": 59516, "epoch": 717} {"train_loss": -20.48781394958496, "global_step": 59517, "epoch": 717} {"train_loss": -20.032718658447266, "global_step": 59518, "epoch": 717} {"train_loss": -20.178171157836914, "global_step": 59519, "epoch": 717} {"train_loss": -20.368335723876953, "global_step": 59520, "epoch": 717} {"train_loss": -20.30901527404785, "global_step": 59521, "epoch": 717} {"train_loss": -20.019453048706055, "global_step": 59522, "epoch": 717} {"train_loss": -19.983774185180664, "global_step": 59523, "epoch": 717} {"train_loss": -20.435958862304688, "global_step": 59524, "epoch": 717} {"train_loss": -19.918481826782227, "global_step": 59525, "epoch": 717} {"train_loss": -20.213077545166016, "global_step": 59526, "epoch": 717} {"train_loss": -20.130735397338867, "global_step": 59527, "epoch": 717} {"train_loss": -20.23468589782715, "global_step": 59528, "epoch": 717} {"train_loss": -20.523740768432617, "global_step": 59529, "epoch": 717} {"train_loss": -20.426233291625977, "global_step": 59530, "epoch": 717} {"train_loss": -20.253576278686523, "global_step": 59531, "epoch": 717} {"train_loss": -20.417922973632812, "global_step": 59532, "epoch": 717} {"train_loss": -20.121854782104492, "global_step": 59533, "epoch": 717} {"train_loss": -20.738067626953125, "global_step": 59534, "epoch": 717} {"train_loss": -20.541719436645508, "global_step": 59535, "epoch": 717} {"train_loss": -20.59852409362793, "global_step": 59536, "epoch": 717} {"train_loss": -20.437795639038086, "global_step": 59537, "epoch": 717} {"train_loss": -20.42957878112793, "global_step": 59538, "epoch": 717} {"train_loss": -20.485088348388672, "global_step": 59539, "epoch": 717} {"train_loss": -20.1518611907959, "global_step": 59540, "epoch": 717} {"train_loss": -20.27865982055664, "global_step": 59541, "epoch": 717} {"train_loss": -20.236698150634766, "global_step": 59542, "epoch": 717} {"train_loss": -20.136085510253906, "global_step": 59543, "epoch": 717} {"train_loss": -20.173887252807617, "global_step": 59544, "epoch": 717} {"train_loss": -20.456918716430664, "global_step": 59545, "epoch": 717} {"train_loss": -20.417686462402344, "global_step": 59546, "epoch": 717} {"train_loss": -20.308927536010742, "global_step": 59547, "epoch": 717} {"train_loss": -20.323989868164062, "global_step": 59548, "epoch": 717} {"train_loss": -20.068523406982422, "global_step": 59549, "epoch": 717} {"train_loss": -20.602706909179688, "global_step": 59550, "epoch": 717} {"train_loss": -20.372283935546875, "global_step": 59551, "epoch": 717} {"train_loss": -20.09585952758789, "global_step": 59552, "epoch": 717} {"train_loss": -20.7406063079834, "global_step": 59553, "epoch": 717} {"train_loss": -20.33878517150879, "global_step": 59554, "epoch": 717} {"train_loss": -20.177671432495117, "global_step": 59555, "epoch": 717} {"train_loss": -20.2767276763916, "global_step": 59556, "epoch": 717} {"train_loss": -20.64948844909668, "global_step": 59557, "epoch": 717} {"train_loss": -20.260303497314453, "global_step": 59558, "epoch": 717} {"train_loss": -20.11372947692871, "global_step": 59559, "epoch": 717} {"train_loss": -20.628774642944336, "global_step": 59560, "epoch": 717} {"train_loss": -20.192188262939453, "global_step": 59561, "epoch": 717} {"train_loss": -20.169721603393555, "global_step": 59562, "epoch": 717} {"train_loss": -20.300649642944336, "global_step": 59563, "epoch": 717} {"train_loss": -20.540334701538086, "global_step": 59564, "epoch": 717} {"train_loss": -20.310300827026367, "global_step": 59565, "epoch": 717} {"train_loss": -20.4084529876709, "global_step": 59566, "epoch": 717} {"train_loss": -20.764312744140625, "global_step": 59567, "epoch": 717} {"train_loss": -20.22865104675293, "global_step": 59568, "epoch": 717} {"train_loss": -20.465621948242188, "global_step": 59569, "epoch": 717} {"train_loss": -20.456953048706055, "global_step": 59570, "epoch": 717} {"train_loss": -20.248931884765625, "global_step": 59571, "epoch": 717} {"train_loss": -19.92783546447754, "global_step": 59572, "epoch": 717} {"train_loss": -20.110553741455078, "global_step": 59573, "epoch": 717} {"train_loss": -20.683256149291992, "global_step": 59574, "epoch": 717} {"train_loss": -20.42854118347168, "global_step": 59575, "epoch": 717} {"train_loss": -20.588407516479492, "global_step": 59576, "epoch": 717} {"train_loss": -20.655929565429688, "global_step": 59577, "epoch": 717} {"train_loss": -20.726930618286133, "global_step": 59578, "epoch": 717} {"train_loss": -20.432941436767578, "global_step": 59579, "epoch": 717} {"train_loss": -20.2719783782959, "global_step": 59580, "epoch": 717} {"train_loss": -20.451797485351562, "global_step": 59581, "epoch": 717} {"train_loss": -20.39284324645996, "global_step": 59582, "epoch": 717} {"train_loss": -20.459556579589844, "global_step": 59583, "epoch": 717} {"train_loss": -20.119190216064453, "global_step": 59584, "epoch": 717} {"train_loss": -20.353818893432617, "global_step": 59585, "epoch": 717} {"train_loss": -20.310571670532227, "global_step": 59586, "epoch": 717} {"train_loss": -20.51207160949707, "global_step": 59587, "epoch": 717} {"train_loss": -20.631895065307617, "global_step": 59588, "epoch": 717} {"train_loss": -20.213666915893555, "global_step": 59589, "epoch": 717} {"train_loss": -20.408967971801758, "global_step": 59590, "epoch": 717} {"train_loss": -20.341777801513672, "global_step": 59591, "epoch": 717} {"train_loss": -20.829526901245117, "global_step": 59592, "epoch": 717} {"train_loss": -20.341447669339466, "global_step": 59593, "epoch": 717, "val_loss": 5960209.5} {"train_loss": -20.235746383666992, "global_step": 59594, "epoch": 718} {"train_loss": -20.055614471435547, "global_step": 59595, "epoch": 718} {"train_loss": -20.075279235839844, "global_step": 59596, "epoch": 718} {"train_loss": -20.129850387573242, "global_step": 59597, "epoch": 718} {"train_loss": -20.407583236694336, "global_step": 59598, "epoch": 718} {"train_loss": -20.261398315429688, "global_step": 59599, "epoch": 718} {"train_loss": -20.122760772705078, "global_step": 59600, "epoch": 718} {"train_loss": -20.265226364135742, "global_step": 59601, "epoch": 718} {"train_loss": -20.700204849243164, "global_step": 59602, "epoch": 718} {"train_loss": -20.45378303527832, "global_step": 59603, "epoch": 718} {"train_loss": -20.45891571044922, "global_step": 59604, "epoch": 718} {"train_loss": -20.4505615234375, "global_step": 59605, "epoch": 718} {"train_loss": -20.715713500976562, "global_step": 59606, "epoch": 718} {"train_loss": -20.451963424682617, "global_step": 59607, "epoch": 718} {"train_loss": -20.480045318603516, "global_step": 59608, "epoch": 718} {"train_loss": -20.604629516601562, "global_step": 59609, "epoch": 718} {"train_loss": -20.307897567749023, "global_step": 59610, "epoch": 718} {"train_loss": -20.298595428466797, "global_step": 59611, "epoch": 718} {"train_loss": -20.274389266967773, "global_step": 59612, "epoch": 718} {"train_loss": -20.435495376586914, "global_step": 59613, "epoch": 718} {"train_loss": -20.552745819091797, "global_step": 59614, "epoch": 718} {"train_loss": -20.285078048706055, "global_step": 59615, "epoch": 718} {"train_loss": -20.488876342773438, "global_step": 59616, "epoch": 718} {"train_loss": -20.388681411743164, "global_step": 59617, "epoch": 718} {"train_loss": -20.625747680664062, "global_step": 59618, "epoch": 718} {"train_loss": -20.254776000976562, "global_step": 59619, "epoch": 718} {"train_loss": -20.3656005859375, "global_step": 59620, "epoch": 718} {"train_loss": -20.136953353881836, "global_step": 59621, "epoch": 718} {"train_loss": -20.01642417907715, "global_step": 59622, "epoch": 718} {"train_loss": -20.52400779724121, "global_step": 59623, "epoch": 718} {"train_loss": -20.496957778930664, "global_step": 59624, "epoch": 718} {"train_loss": -20.634572982788086, "global_step": 59625, "epoch": 718} {"train_loss": -20.496545791625977, "global_step": 59626, "epoch": 718} {"train_loss": -20.18519401550293, "global_step": 59627, "epoch": 718} {"train_loss": -19.936880111694336, "global_step": 59628, "epoch": 718} {"train_loss": -20.290212631225586, "global_step": 59629, "epoch": 718} {"train_loss": -20.13915252685547, "global_step": 59630, "epoch": 718} {"train_loss": -20.420333862304688, "global_step": 59631, "epoch": 718} {"train_loss": -20.352752685546875, "global_step": 59632, "epoch": 718} {"train_loss": -20.65900993347168, "global_step": 59633, "epoch": 718} {"train_loss": -20.28567886352539, "global_step": 59634, "epoch": 718} {"train_loss": -20.060537338256836, "global_step": 59635, "epoch": 718} {"train_loss": -20.497983932495117, "global_step": 59636, "epoch": 718} {"train_loss": -20.469593048095703, "global_step": 59637, "epoch": 718} {"train_loss": -20.558048248291016, "global_step": 59638, "epoch": 718} {"train_loss": -20.527076721191406, "global_step": 59639, "epoch": 718} {"train_loss": -20.625782012939453, "global_step": 59640, "epoch": 718} {"train_loss": -20.46320915222168, "global_step": 59641, "epoch": 718} {"train_loss": -20.520294189453125, "global_step": 59642, "epoch": 718} {"train_loss": -20.1973876953125, "global_step": 59643, "epoch": 718} {"train_loss": -20.53143310546875, "global_step": 59644, "epoch": 718} {"train_loss": -20.232263565063477, "global_step": 59645, "epoch": 718} {"train_loss": -20.69384002685547, "global_step": 59646, "epoch": 718} {"train_loss": -20.309545516967773, "global_step": 59647, "epoch": 718} {"train_loss": -20.840513229370117, "global_step": 59648, "epoch": 718} {"train_loss": -20.609973907470703, "global_step": 59649, "epoch": 718} {"train_loss": -20.209537506103516, "global_step": 59650, "epoch": 718} {"train_loss": -20.669418334960938, "global_step": 59651, "epoch": 718} {"train_loss": -20.20879554748535, "global_step": 59652, "epoch": 718} {"train_loss": -20.35550308227539, "global_step": 59653, "epoch": 718} {"train_loss": -20.160795211791992, "global_step": 59654, "epoch": 718} {"train_loss": -20.423917770385742, "global_step": 59655, "epoch": 718} {"train_loss": -20.515165328979492, "global_step": 59656, "epoch": 718} {"train_loss": -20.64529800415039, "global_step": 59657, "epoch": 718} {"train_loss": -20.452016830444336, "global_step": 59658, "epoch": 718} {"train_loss": -19.814407348632812, "global_step": 59659, "epoch": 718} {"train_loss": -20.533641815185547, "global_step": 59660, "epoch": 718} {"train_loss": -20.86541175842285, "global_step": 59661, "epoch": 718} {"train_loss": -20.171491622924805, "global_step": 59662, "epoch": 718} {"train_loss": -20.5004940032959, "global_step": 59663, "epoch": 718} {"train_loss": -20.10496711730957, "global_step": 59664, "epoch": 718} {"train_loss": -19.938209533691406, "global_step": 59665, "epoch": 718} {"train_loss": -20.167993545532227, "global_step": 59666, "epoch": 718} {"train_loss": -20.40911293029785, "global_step": 59667, "epoch": 718} {"train_loss": -20.87476921081543, "global_step": 59668, "epoch": 718} {"train_loss": -20.141326904296875, "global_step": 59669, "epoch": 718} {"train_loss": -20.201160430908203, "global_step": 59670, "epoch": 718} {"train_loss": -20.48756980895996, "global_step": 59671, "epoch": 718} {"train_loss": -20.029020309448242, "global_step": 59672, "epoch": 718} {"train_loss": -20.411422729492188, "global_step": 59673, "epoch": 718} {"train_loss": -20.21319580078125, "global_step": 59674, "epoch": 718} {"train_loss": -19.766843795776367, "global_step": 59675, "epoch": 718} {"train_loss": -20.347856935248316, "global_step": 59676, "epoch": 718, "val_loss": 6016676.0} {"train_loss": -19.636062622070312, "global_step": 59677, "epoch": 719} {"train_loss": -20.488508224487305, "global_step": 59678, "epoch": 719} {"train_loss": -20.356142044067383, "global_step": 59679, "epoch": 719} {"train_loss": -20.115034103393555, "global_step": 59680, "epoch": 719} {"train_loss": -20.05198097229004, "global_step": 59681, "epoch": 719} {"train_loss": -19.887521743774414, "global_step": 59682, "epoch": 719} {"train_loss": -20.05319595336914, "global_step": 59683, "epoch": 719} {"train_loss": -19.970930099487305, "global_step": 59684, "epoch": 719} {"train_loss": -20.308429718017578, "global_step": 59685, "epoch": 719} {"train_loss": -20.070581436157227, "global_step": 59686, "epoch": 719} {"train_loss": -20.249061584472656, "global_step": 59687, "epoch": 719} {"train_loss": -20.290298461914062, "global_step": 59688, "epoch": 719} {"train_loss": -20.17637825012207, "global_step": 59689, "epoch": 719} {"train_loss": -20.21589469909668, "global_step": 59690, "epoch": 719} {"train_loss": -19.950469970703125, "global_step": 59691, "epoch": 719} {"train_loss": -20.443302154541016, "global_step": 59692, "epoch": 719} {"train_loss": -20.361125946044922, "global_step": 59693, "epoch": 719} {"train_loss": -20.47283363342285, "global_step": 59694, "epoch": 719} {"train_loss": -20.154932022094727, "global_step": 59695, "epoch": 719} {"train_loss": -20.195222854614258, "global_step": 59696, "epoch": 719} {"train_loss": -20.039945602416992, "global_step": 59697, "epoch": 719} {"train_loss": -20.50212860107422, "global_step": 59698, "epoch": 719} {"train_loss": -20.0427188873291, "global_step": 59699, "epoch": 719} {"train_loss": -20.156415939331055, "global_step": 59700, "epoch": 719} {"train_loss": -20.243131637573242, "global_step": 59701, "epoch": 719} {"train_loss": -20.36164665222168, "global_step": 59702, "epoch": 719} {"train_loss": -20.20264434814453, "global_step": 59703, "epoch": 719} {"train_loss": -20.65631675720215, "global_step": 59704, "epoch": 719} {"train_loss": -20.468830108642578, "global_step": 59705, "epoch": 719} {"train_loss": -20.292531967163086, "global_step": 59706, "epoch": 719} {"train_loss": -20.290895462036133, "global_step": 59707, "epoch": 719} {"train_loss": -20.649412155151367, "global_step": 59708, "epoch": 719} {"train_loss": -20.1563777923584, "global_step": 59709, "epoch": 719} {"train_loss": -20.426101684570312, "global_step": 59710, "epoch": 719} {"train_loss": -20.13868522644043, "global_step": 59711, "epoch": 719} {"train_loss": -20.463056564331055, "global_step": 59712, "epoch": 719} {"train_loss": -20.15894317626953, "global_step": 59713, "epoch": 719} {"train_loss": -20.40660285949707, "global_step": 59714, "epoch": 719} {"train_loss": -19.937870025634766, "global_step": 59715, "epoch": 719} {"train_loss": -19.887941360473633, "global_step": 59716, "epoch": 719} {"train_loss": -20.404781341552734, "global_step": 59717, "epoch": 719} {"train_loss": -20.421926498413086, "global_step": 59718, "epoch": 719} {"train_loss": -20.06599998474121, "global_step": 59719, "epoch": 719} {"train_loss": -20.42560386657715, "global_step": 59720, "epoch": 719} {"train_loss": -20.177087783813477, "global_step": 59721, "epoch": 719} {"train_loss": -20.440265655517578, "global_step": 59722, "epoch": 719} {"train_loss": -19.90315055847168, "global_step": 59723, "epoch": 719} {"train_loss": -20.28525733947754, "global_step": 59724, "epoch": 719} {"train_loss": -20.224868774414062, "global_step": 59725, "epoch": 719} {"train_loss": -20.3084659576416, "global_step": 59726, "epoch": 719} {"train_loss": -20.267545700073242, "global_step": 59727, "epoch": 719} {"train_loss": -20.44349479675293, "global_step": 59728, "epoch": 719} {"train_loss": -20.407913208007812, "global_step": 59729, "epoch": 719} {"train_loss": -20.22913360595703, "global_step": 59730, "epoch": 719} {"train_loss": -20.514551162719727, "global_step": 59731, "epoch": 719} {"train_loss": -20.225065231323242, "global_step": 59732, "epoch": 719} {"train_loss": -20.505990982055664, "global_step": 59733, "epoch": 719} {"train_loss": -20.539968490600586, "global_step": 59734, "epoch": 719} {"train_loss": -20.419418334960938, "global_step": 59735, "epoch": 719} {"train_loss": -20.526168823242188, "global_step": 59736, "epoch": 719} {"train_loss": -20.2365665435791, "global_step": 59737, "epoch": 719} {"train_loss": -20.482839584350586, "global_step": 59738, "epoch": 719} {"train_loss": -20.404523849487305, "global_step": 59739, "epoch": 719} {"train_loss": -20.560213088989258, "global_step": 59740, "epoch": 719} {"train_loss": -20.227094650268555, "global_step": 59741, "epoch": 719} {"train_loss": -20.212453842163086, "global_step": 59742, "epoch": 719} {"train_loss": -20.536264419555664, "global_step": 59743, "epoch": 719} {"train_loss": -20.55476951599121, "global_step": 59744, "epoch": 719} {"train_loss": -20.45845603942871, "global_step": 59745, "epoch": 719} {"train_loss": -20.462263107299805, "global_step": 59746, "epoch": 719} {"train_loss": -20.37366485595703, "global_step": 59747, "epoch": 719} {"train_loss": -20.354333877563477, "global_step": 59748, "epoch": 719} {"train_loss": -20.3751163482666, "global_step": 59749, "epoch": 719} {"train_loss": -20.247888565063477, "global_step": 59750, "epoch": 719} {"train_loss": -20.309295654296875, "global_step": 59751, "epoch": 719} {"train_loss": -20.26885986328125, "global_step": 59752, "epoch": 719} {"train_loss": -20.278976440429688, "global_step": 59753, "epoch": 719} {"train_loss": -20.656105041503906, "global_step": 59754, "epoch": 719} {"train_loss": -20.521459579467773, "global_step": 59755, "epoch": 719} {"train_loss": -20.45344352722168, "global_step": 59756, "epoch": 719} {"train_loss": -20.12647819519043, "global_step": 59757, "epoch": 719} {"train_loss": -20.158187866210938, "global_step": 59758, "epoch": 719} {"train_loss": -20.311390727399342, "global_step": 59759, "epoch": 719, "val_loss": 6001671.0} {"train_loss": -20.318695068359375, "global_step": 59760, "epoch": 720} {"train_loss": -20.647165298461914, "global_step": 59761, "epoch": 720} {"train_loss": -20.13040542602539, "global_step": 59762, "epoch": 720} {"train_loss": -20.0552921295166, "global_step": 59763, "epoch": 720} {"train_loss": -20.347999572753906, "global_step": 59764, "epoch": 720} {"train_loss": -20.10371208190918, "global_step": 59765, "epoch": 720} {"train_loss": -19.723180770874023, "global_step": 59766, "epoch": 720} {"train_loss": -20.34469985961914, "global_step": 59767, "epoch": 720} {"train_loss": -20.139476776123047, "global_step": 59768, "epoch": 720} {"train_loss": -20.381637573242188, "global_step": 59769, "epoch": 720} {"train_loss": -20.46484375, "global_step": 59770, "epoch": 720} {"train_loss": -20.264888763427734, "global_step": 59771, "epoch": 720} {"train_loss": -20.191360473632812, "global_step": 59772, "epoch": 720} {"train_loss": -20.278480529785156, "global_step": 59773, "epoch": 720} {"train_loss": -20.451648712158203, "global_step": 59774, "epoch": 720} {"train_loss": -20.023380279541016, "global_step": 59775, "epoch": 720} {"train_loss": -20.135038375854492, "global_step": 59776, "epoch": 720} {"train_loss": -20.198501586914062, "global_step": 59777, "epoch": 720} {"train_loss": -20.195199966430664, "global_step": 59778, "epoch": 720} {"train_loss": -20.072874069213867, "global_step": 59779, "epoch": 720} {"train_loss": -20.43415641784668, "global_step": 59780, "epoch": 720} {"train_loss": -20.50775718688965, "global_step": 59781, "epoch": 720} {"train_loss": -20.369272232055664, "global_step": 59782, "epoch": 720} {"train_loss": -20.32915687561035, "global_step": 59783, "epoch": 720} {"train_loss": -20.457294464111328, "global_step": 59784, "epoch": 720} {"train_loss": -20.324209213256836, "global_step": 59785, "epoch": 720} {"train_loss": -20.505268096923828, "global_step": 59786, "epoch": 720} {"train_loss": -20.348739624023438, "global_step": 59787, "epoch": 720} {"train_loss": -20.288610458374023, "global_step": 59788, "epoch": 720} {"train_loss": -20.026395797729492, "global_step": 59789, "epoch": 720} {"train_loss": -20.748828887939453, "global_step": 59790, "epoch": 720} {"train_loss": -20.435317993164062, "global_step": 59791, "epoch": 720} {"train_loss": -19.918027877807617, "global_step": 59792, "epoch": 720} {"train_loss": -20.334714889526367, "global_step": 59793, "epoch": 720} {"train_loss": -20.178049087524414, "global_step": 59794, "epoch": 720} {"train_loss": -20.27997398376465, "global_step": 59795, "epoch": 720} {"train_loss": -20.321109771728516, "global_step": 59796, "epoch": 720} {"train_loss": -20.409351348876953, "global_step": 59797, "epoch": 720} {"train_loss": -20.249603271484375, "global_step": 59798, "epoch": 720} {"train_loss": -20.430749893188477, "global_step": 59799, "epoch": 720} {"train_loss": -20.517499923706055, "global_step": 59800, "epoch": 720} {"train_loss": -20.444761276245117, "global_step": 59801, "epoch": 720} {"train_loss": -20.56024169921875, "global_step": 59802, "epoch": 720} {"train_loss": -20.403369903564453, "global_step": 59803, "epoch": 720} {"train_loss": -20.463144302368164, "global_step": 59804, "epoch": 720} {"train_loss": -20.089868545532227, "global_step": 59805, "epoch": 720} {"train_loss": -20.370468139648438, "global_step": 59806, "epoch": 720} {"train_loss": -20.423131942749023, "global_step": 59807, "epoch": 720} {"train_loss": -20.462156295776367, "global_step": 59808, "epoch": 720} {"train_loss": -20.38514518737793, "global_step": 59809, "epoch": 720} {"train_loss": -20.387346267700195, "global_step": 59810, "epoch": 720} {"train_loss": -20.116241455078125, "global_step": 59811, "epoch": 720} {"train_loss": -20.174903869628906, "global_step": 59812, "epoch": 720} {"train_loss": -20.317312240600586, "global_step": 59813, "epoch": 720} {"train_loss": -20.44309425354004, "global_step": 59814, "epoch": 720} {"train_loss": -20.56075096130371, "global_step": 59815, "epoch": 720} {"train_loss": -20.56653594970703, "global_step": 59816, "epoch": 720} {"train_loss": -20.396459579467773, "global_step": 59817, "epoch": 720} {"train_loss": -20.369428634643555, "global_step": 59818, "epoch": 720} {"train_loss": -20.12274742126465, "global_step": 59819, "epoch": 720} {"train_loss": -20.611093521118164, "global_step": 59820, "epoch": 720} {"train_loss": -20.601943969726562, "global_step": 59821, "epoch": 720} {"train_loss": -20.285552978515625, "global_step": 59822, "epoch": 720} {"train_loss": -20.519195556640625, "global_step": 59823, "epoch": 720} {"train_loss": -20.407007217407227, "global_step": 59824, "epoch": 720} {"train_loss": -20.410587310791016, "global_step": 59825, "epoch": 720} {"train_loss": -20.06032371520996, "global_step": 59826, "epoch": 720} {"train_loss": -20.149642944335938, "global_step": 59827, "epoch": 720} {"train_loss": -20.350717544555664, "global_step": 59828, "epoch": 720} {"train_loss": -20.589475631713867, "global_step": 59829, "epoch": 720} {"train_loss": -20.45309829711914, "global_step": 59830, "epoch": 720} {"train_loss": -20.39697265625, "global_step": 59831, "epoch": 720} {"train_loss": -20.669553756713867, "global_step": 59832, "epoch": 720} {"train_loss": -20.553253173828125, "global_step": 59833, "epoch": 720} {"train_loss": -20.2462100982666, "global_step": 59834, "epoch": 720} {"train_loss": -20.418216705322266, "global_step": 59835, "epoch": 720} {"train_loss": -20.349634170532227, "global_step": 59836, "epoch": 720} {"train_loss": -20.16997718811035, "global_step": 59837, "epoch": 720} {"train_loss": -20.231983184814453, "global_step": 59838, "epoch": 720} {"train_loss": -20.54884147644043, "global_step": 59839, "epoch": 720} {"train_loss": -20.51370620727539, "global_step": 59840, "epoch": 720} {"train_loss": -20.53787612915039, "global_step": 59841, "epoch": 720} {"train_loss": -20.33554327631571, "global_step": 59842, "epoch": 720, "val_loss": 6065149.5} {"train_loss": -19.46225929260254, "global_step": 59843, "epoch": 721} {"train_loss": -19.667194366455078, "global_step": 59844, "epoch": 721} {"train_loss": -20.196142196655273, "global_step": 59845, "epoch": 721} {"train_loss": -19.818378448486328, "global_step": 59846, "epoch": 721} {"train_loss": -20.141002655029297, "global_step": 59847, "epoch": 721} {"train_loss": -20.109689712524414, "global_step": 59848, "epoch": 721} {"train_loss": -20.09270668029785, "global_step": 59849, "epoch": 721} {"train_loss": -20.018980026245117, "global_step": 59850, "epoch": 721} {"train_loss": -20.35455894470215, "global_step": 59851, "epoch": 721} {"train_loss": -20.1400203704834, "global_step": 59852, "epoch": 721} {"train_loss": -20.201690673828125, "global_step": 59853, "epoch": 721} {"train_loss": -20.45372772216797, "global_step": 59854, "epoch": 721} {"train_loss": -20.177717208862305, "global_step": 59855, "epoch": 721} {"train_loss": -19.816055297851562, "global_step": 59856, "epoch": 721} {"train_loss": -20.341629028320312, "global_step": 59857, "epoch": 721} {"train_loss": -20.190671920776367, "global_step": 59858, "epoch": 721} {"train_loss": -20.483808517456055, "global_step": 59859, "epoch": 721} {"train_loss": -20.435731887817383, "global_step": 59860, "epoch": 721} {"train_loss": -20.339563369750977, "global_step": 59861, "epoch": 721} {"train_loss": -20.337615966796875, "global_step": 59862, "epoch": 721} {"train_loss": -20.46454620361328, "global_step": 59863, "epoch": 721} {"train_loss": -20.38783073425293, "global_step": 59864, "epoch": 721} {"train_loss": -20.3073673248291, "global_step": 59865, "epoch": 721} {"train_loss": -20.50726890563965, "global_step": 59866, "epoch": 721} {"train_loss": -20.31235694885254, "global_step": 59867, "epoch": 721} {"train_loss": -19.991840362548828, "global_step": 59868, "epoch": 721} {"train_loss": -20.423885345458984, "global_step": 59869, "epoch": 721} {"train_loss": -20.398818969726562, "global_step": 59870, "epoch": 721} {"train_loss": -20.426389694213867, "global_step": 59871, "epoch": 721} {"train_loss": -20.269317626953125, "global_step": 59872, "epoch": 721} {"train_loss": -20.105051040649414, "global_step": 59873, "epoch": 721} {"train_loss": -20.058095932006836, "global_step": 59874, "epoch": 721} {"train_loss": -20.348133087158203, "global_step": 59875, "epoch": 721} {"train_loss": -20.26784324645996, "global_step": 59876, "epoch": 721} {"train_loss": -19.95635986328125, "global_step": 59877, "epoch": 721} {"train_loss": -20.501371383666992, "global_step": 59878, "epoch": 721} {"train_loss": -20.529727935791016, "global_step": 59879, "epoch": 721} {"train_loss": -20.33150291442871, "global_step": 59880, "epoch": 721} {"train_loss": -20.15774917602539, "global_step": 59881, "epoch": 721} {"train_loss": -20.216739654541016, "global_step": 59882, "epoch": 721} {"train_loss": -20.51556968688965, "global_step": 59883, "epoch": 721} {"train_loss": -20.316299438476562, "global_step": 59884, "epoch": 721} {"train_loss": -20.31831169128418, "global_step": 59885, "epoch": 721} {"train_loss": -20.465091705322266, "global_step": 59886, "epoch": 721} {"train_loss": -20.324024200439453, "global_step": 59887, "epoch": 721} {"train_loss": -20.425697326660156, "global_step": 59888, "epoch": 721} {"train_loss": -20.111238479614258, "global_step": 59889, "epoch": 721} {"train_loss": -20.60719871520996, "global_step": 59890, "epoch": 721} {"train_loss": -20.245975494384766, "global_step": 59891, "epoch": 721} {"train_loss": -20.505178451538086, "global_step": 59892, "epoch": 721} {"train_loss": -20.686155319213867, "global_step": 59893, "epoch": 721} {"train_loss": -20.184537887573242, "global_step": 59894, "epoch": 721} {"train_loss": -20.642488479614258, "global_step": 59895, "epoch": 721} {"train_loss": -20.389448165893555, "global_step": 59896, "epoch": 721} {"train_loss": -20.147140502929688, "global_step": 59897, "epoch": 721} {"train_loss": -20.494430541992188, "global_step": 59898, "epoch": 721} {"train_loss": -20.253467559814453, "global_step": 59899, "epoch": 721} {"train_loss": -20.406484603881836, "global_step": 59900, "epoch": 721} {"train_loss": -20.158851623535156, "global_step": 59901, "epoch": 721} {"train_loss": -20.290863037109375, "global_step": 59902, "epoch": 721} {"train_loss": -20.281570434570312, "global_step": 59903, "epoch": 721} {"train_loss": -20.05243492126465, "global_step": 59904, "epoch": 721} {"train_loss": -20.52617835998535, "global_step": 59905, "epoch": 721} {"train_loss": -20.015522003173828, "global_step": 59906, "epoch": 721} {"train_loss": -20.176437377929688, "global_step": 59907, "epoch": 721} {"train_loss": -20.289710998535156, "global_step": 59908, "epoch": 721} {"train_loss": -20.105297088623047, "global_step": 59909, "epoch": 721} {"train_loss": -20.247949600219727, "global_step": 59910, "epoch": 721} {"train_loss": -20.607980728149414, "global_step": 59911, "epoch": 721} {"train_loss": -20.37656593322754, "global_step": 59912, "epoch": 721} {"train_loss": -20.54676628112793, "global_step": 59913, "epoch": 721} {"train_loss": -20.643611907958984, "global_step": 59914, "epoch": 721} {"train_loss": -20.658634185791016, "global_step": 59915, "epoch": 721} {"train_loss": -20.25550079345703, "global_step": 59916, "epoch": 721} {"train_loss": -19.97483253479004, "global_step": 59917, "epoch": 721} {"train_loss": -20.190046310424805, "global_step": 59918, "epoch": 721} {"train_loss": -20.12872314453125, "global_step": 59919, "epoch": 721} {"train_loss": -20.21961212158203, "global_step": 59920, "epoch": 721} {"train_loss": -20.25446128845215, "global_step": 59921, "epoch": 721} {"train_loss": -20.631423950195312, "global_step": 59922, "epoch": 721} {"train_loss": -19.995786666870117, "global_step": 59923, "epoch": 721} {"train_loss": -19.87238883972168, "global_step": 59924, "epoch": 721} {"train_loss": -20.276504355740833, "global_step": 59925, "epoch": 721, "val_loss": 6083666.0} {"train_loss": -19.83230209350586, "global_step": 59926, "epoch": 722} {"train_loss": -19.8829345703125, "global_step": 59927, "epoch": 722} {"train_loss": -19.82651138305664, "global_step": 59928, "epoch": 722} {"train_loss": -19.695316314697266, "global_step": 59929, "epoch": 722} {"train_loss": -20.359054565429688, "global_step": 59930, "epoch": 722} {"train_loss": -19.967538833618164, "global_step": 59931, "epoch": 722} {"train_loss": -20.54368019104004, "global_step": 59932, "epoch": 722} {"train_loss": -20.289920806884766, "global_step": 59933, "epoch": 722} {"train_loss": -20.177600860595703, "global_step": 59934, "epoch": 722} {"train_loss": -20.10988998413086, "global_step": 59935, "epoch": 722} {"train_loss": -20.034332275390625, "global_step": 59936, "epoch": 722} {"train_loss": -20.13266944885254, "global_step": 59937, "epoch": 722} {"train_loss": -20.416364669799805, "global_step": 59938, "epoch": 722} {"train_loss": -20.36040496826172, "global_step": 59939, "epoch": 722} {"train_loss": -20.74881935119629, "global_step": 59940, "epoch": 722} {"train_loss": -20.428354263305664, "global_step": 59941, "epoch": 722} {"train_loss": -20.273046493530273, "global_step": 59942, "epoch": 722} {"train_loss": -19.799840927124023, "global_step": 59943, "epoch": 722} {"train_loss": -20.0655517578125, "global_step": 59944, "epoch": 722} {"train_loss": -20.381521224975586, "global_step": 59945, "epoch": 722} {"train_loss": -20.110742568969727, "global_step": 59946, "epoch": 722} {"train_loss": -20.20058250427246, "global_step": 59947, "epoch": 722} {"train_loss": -20.67746925354004, "global_step": 59948, "epoch": 722} {"train_loss": -20.320707321166992, "global_step": 59949, "epoch": 722} {"train_loss": -20.6795711517334, "global_step": 59950, "epoch": 722} {"train_loss": -20.056272506713867, "global_step": 59951, "epoch": 722} {"train_loss": -20.023395538330078, "global_step": 59952, "epoch": 722} {"train_loss": -20.597579956054688, "global_step": 59953, "epoch": 722} {"train_loss": -20.050689697265625, "global_step": 59954, "epoch": 722} {"train_loss": -20.27488899230957, "global_step": 59955, "epoch": 722} {"train_loss": -20.270832061767578, "global_step": 59956, "epoch": 722} {"train_loss": -20.113101959228516, "global_step": 59957, "epoch": 722} {"train_loss": -20.71002197265625, "global_step": 59958, "epoch": 722} {"train_loss": -20.253957748413086, "global_step": 59959, "epoch": 722} {"train_loss": -20.401941299438477, "global_step": 59960, "epoch": 722} {"train_loss": -20.163375854492188, "global_step": 59961, "epoch": 722} {"train_loss": -20.3877010345459, "global_step": 59962, "epoch": 722} {"train_loss": -20.320466995239258, "global_step": 59963, "epoch": 722} {"train_loss": -20.344266891479492, "global_step": 59964, "epoch": 722} {"train_loss": -20.3858642578125, "global_step": 59965, "epoch": 722} {"train_loss": -20.468467712402344, "global_step": 59966, "epoch": 722} {"train_loss": -20.2879695892334, "global_step": 59967, "epoch": 722} {"train_loss": -20.421438217163086, "global_step": 59968, "epoch": 722} {"train_loss": -20.474477767944336, "global_step": 59969, "epoch": 722} {"train_loss": -20.64716911315918, "global_step": 59970, "epoch": 722} {"train_loss": -20.252180099487305, "global_step": 59971, "epoch": 722} {"train_loss": -20.664278030395508, "global_step": 59972, "epoch": 722} {"train_loss": -20.389917373657227, "global_step": 59973, "epoch": 722} {"train_loss": -20.149927139282227, "global_step": 59974, "epoch": 722} {"train_loss": -20.434741973876953, "global_step": 59975, "epoch": 722} {"train_loss": -20.36629295349121, "global_step": 59976, "epoch": 722} {"train_loss": -20.49753189086914, "global_step": 59977, "epoch": 722} {"train_loss": -20.460493087768555, "global_step": 59978, "epoch": 722} {"train_loss": -20.418859481811523, "global_step": 59979, "epoch": 722} {"train_loss": -20.434232711791992, "global_step": 59980, "epoch": 722} {"train_loss": -20.305465698242188, "global_step": 59981, "epoch": 722} {"train_loss": -20.67593765258789, "global_step": 59982, "epoch": 722} {"train_loss": -20.176897048950195, "global_step": 59983, "epoch": 722} {"train_loss": -20.48001480102539, "global_step": 59984, "epoch": 722} {"train_loss": -20.347749710083008, "global_step": 59985, "epoch": 722} {"train_loss": -20.48587417602539, "global_step": 59986, "epoch": 722} {"train_loss": -20.52264976501465, "global_step": 59987, "epoch": 722} {"train_loss": -20.494192123413086, "global_step": 59988, "epoch": 722} {"train_loss": -20.408493041992188, "global_step": 59989, "epoch": 722} {"train_loss": -20.603147506713867, "global_step": 59990, "epoch": 722} {"train_loss": -20.6450138092041, "global_step": 59991, "epoch": 722} {"train_loss": -20.694557189941406, "global_step": 59992, "epoch": 722} {"train_loss": -20.742618560791016, "global_step": 59993, "epoch": 722} {"train_loss": -20.42116355895996, "global_step": 59994, "epoch": 722} {"train_loss": -20.422048568725586, "global_step": 59995, "epoch": 722} {"train_loss": -20.268346786499023, "global_step": 59996, "epoch": 722} {"train_loss": -20.178150177001953, "global_step": 59997, "epoch": 722} {"train_loss": -20.28069496154785, "global_step": 59998, "epoch": 722} {"train_loss": -20.367374420166016, "global_step": 59999, "epoch": 722} {"train_loss": -20.36795425415039, "global_step": 60000, "epoch": 722} {"train_loss": -20.484880447387695, "global_step": 60001, "epoch": 722} {"train_loss": -20.568496704101562, "global_step": 60002, "epoch": 722} {"train_loss": -20.32826042175293, "global_step": 60003, "epoch": 722} {"train_loss": -20.24371337890625, "global_step": 60004, "epoch": 722} {"train_loss": -20.419715881347656, "global_step": 60005, "epoch": 722} {"train_loss": -20.46059226989746, "global_step": 60006, "epoch": 722} {"train_loss": -20.689416885375977, "global_step": 60007, "epoch": 722} {"train_loss": -20.3230977575463, "global_step": 60008, "epoch": 722, "val_loss": 6054292.0} {"train_loss": -20.43100929260254, "global_step": 60009, "epoch": 723} {"train_loss": -19.975046157836914, "global_step": 60010, "epoch": 723} {"train_loss": -20.333572387695312, "global_step": 60011, "epoch": 723} {"train_loss": -20.677059173583984, "global_step": 60012, "epoch": 723} {"train_loss": -20.459787368774414, "global_step": 60013, "epoch": 723} {"train_loss": -20.641130447387695, "global_step": 60014, "epoch": 723} {"train_loss": -19.90120506286621, "global_step": 60015, "epoch": 723} {"train_loss": -20.391586303710938, "global_step": 60016, "epoch": 723} {"train_loss": -20.438791275024414, "global_step": 60017, "epoch": 723} {"train_loss": -19.611433029174805, "global_step": 60018, "epoch": 723} {"train_loss": -20.58481216430664, "global_step": 60019, "epoch": 723} {"train_loss": -19.706680297851562, "global_step": 60020, "epoch": 723} {"train_loss": -20.210926055908203, "global_step": 60021, "epoch": 723} {"train_loss": -19.9907283782959, "global_step": 60022, "epoch": 723} {"train_loss": -20.165870666503906, "global_step": 60023, "epoch": 723} {"train_loss": -20.511810302734375, "global_step": 60024, "epoch": 723} {"train_loss": -20.240985870361328, "global_step": 60025, "epoch": 723} {"train_loss": -20.094533920288086, "global_step": 60026, "epoch": 723} {"train_loss": -20.446916580200195, "global_step": 60027, "epoch": 723} {"train_loss": -20.439350128173828, "global_step": 60028, "epoch": 723} {"train_loss": -20.503183364868164, "global_step": 60029, "epoch": 723} {"train_loss": -20.036121368408203, "global_step": 60030, "epoch": 723} {"train_loss": -19.93024444580078, "global_step": 60031, "epoch": 723} {"train_loss": -20.71221160888672, "global_step": 60032, "epoch": 723} {"train_loss": -20.414411544799805, "global_step": 60033, "epoch": 723} {"train_loss": -20.249494552612305, "global_step": 60034, "epoch": 723} {"train_loss": -20.161951065063477, "global_step": 60035, "epoch": 723} {"train_loss": -20.099735260009766, "global_step": 60036, "epoch": 723} {"train_loss": -20.376874923706055, "global_step": 60037, "epoch": 723} {"train_loss": -20.516511917114258, "global_step": 60038, "epoch": 723} {"train_loss": -20.181652069091797, "global_step": 60039, "epoch": 723} {"train_loss": -20.381620407104492, "global_step": 60040, "epoch": 723} {"train_loss": -20.743385314941406, "global_step": 60041, "epoch": 723} {"train_loss": -20.4298038482666, "global_step": 60042, "epoch": 723} {"train_loss": -20.362140655517578, "global_step": 60043, "epoch": 723} {"train_loss": -20.711759567260742, "global_step": 60044, "epoch": 723} {"train_loss": -20.203580856323242, "global_step": 60045, "epoch": 723} {"train_loss": -20.467737197875977, "global_step": 60046, "epoch": 723} {"train_loss": -20.85638999938965, "global_step": 60047, "epoch": 723} {"train_loss": -20.465810775756836, "global_step": 60048, "epoch": 723} {"train_loss": -20.64726448059082, "global_step": 60049, "epoch": 723} {"train_loss": -20.597753524780273, "global_step": 60050, "epoch": 723} {"train_loss": -20.475650787353516, "global_step": 60051, "epoch": 723} {"train_loss": -20.13687515258789, "global_step": 60052, "epoch": 723} {"train_loss": -20.218612670898438, "global_step": 60053, "epoch": 723} {"train_loss": -20.161298751831055, "global_step": 60054, "epoch": 723} {"train_loss": -20.4649715423584, "global_step": 60055, "epoch": 723} {"train_loss": -20.636486053466797, "global_step": 60056, "epoch": 723} {"train_loss": -20.462387084960938, "global_step": 60057, "epoch": 723} {"train_loss": -20.397903442382812, "global_step": 60058, "epoch": 723} {"train_loss": -20.632553100585938, "global_step": 60059, "epoch": 723} {"train_loss": -20.3284912109375, "global_step": 60060, "epoch": 723} {"train_loss": -20.57978057861328, "global_step": 60061, "epoch": 723} {"train_loss": -20.290132522583008, "global_step": 60062, "epoch": 723} {"train_loss": -19.909826278686523, "global_step": 60063, "epoch": 723} {"train_loss": -19.984848022460938, "global_step": 60064, "epoch": 723} {"train_loss": -20.76950454711914, "global_step": 60065, "epoch": 723} {"train_loss": -20.33845329284668, "global_step": 60066, "epoch": 723} {"train_loss": -20.636001586914062, "global_step": 60067, "epoch": 723} {"train_loss": -20.242752075195312, "global_step": 60068, "epoch": 723} {"train_loss": -20.61005973815918, "global_step": 60069, "epoch": 723} {"train_loss": -20.471485137939453, "global_step": 60070, "epoch": 723} {"train_loss": -20.323200225830078, "global_step": 60071, "epoch": 723} {"train_loss": -20.276769638061523, "global_step": 60072, "epoch": 723} {"train_loss": -20.582548141479492, "global_step": 60073, "epoch": 723} {"train_loss": -20.341047286987305, "global_step": 60074, "epoch": 723} {"train_loss": -20.4892578125, "global_step": 60075, "epoch": 723} {"train_loss": -20.630319595336914, "global_step": 60076, "epoch": 723} {"train_loss": -20.342544555664062, "global_step": 60077, "epoch": 723} {"train_loss": -20.61077308654785, "global_step": 60078, "epoch": 723} {"train_loss": -20.339813232421875, "global_step": 60079, "epoch": 723} {"train_loss": -20.41206932067871, "global_step": 60080, "epoch": 723} {"train_loss": -20.253454208374023, "global_step": 60081, "epoch": 723} {"train_loss": -20.161420822143555, "global_step": 60082, "epoch": 723} {"train_loss": -20.40543556213379, "global_step": 60083, "epoch": 723} {"train_loss": -20.127155303955078, "global_step": 60084, "epoch": 723} {"train_loss": -20.65165901184082, "global_step": 60085, "epoch": 723} {"train_loss": -20.314720153808594, "global_step": 60086, "epoch": 723} {"train_loss": -20.59602165222168, "global_step": 60087, "epoch": 723} {"train_loss": -20.832509994506836, "global_step": 60088, "epoch": 723} {"train_loss": -20.46837615966797, "global_step": 60089, "epoch": 723} {"train_loss": -20.576181411743164, "global_step": 60090, "epoch": 723} {"train_loss": -20.38621424479657, "global_step": 60091, "epoch": 723, "val_loss": 5978453.5} {"train_loss": -20.087568283081055, "global_step": 60092, "epoch": 724} {"train_loss": -20.32490348815918, "global_step": 60093, "epoch": 724} {"train_loss": -20.29631805419922, "global_step": 60094, "epoch": 724} {"train_loss": -20.19522476196289, "global_step": 60095, "epoch": 724} {"train_loss": -20.023033142089844, "global_step": 60096, "epoch": 724} {"train_loss": -20.195913314819336, "global_step": 60097, "epoch": 724} {"train_loss": -20.466169357299805, "global_step": 60098, "epoch": 724} {"train_loss": -20.608694076538086, "global_step": 60099, "epoch": 724} {"train_loss": -20.486637115478516, "global_step": 60100, "epoch": 724} {"train_loss": -20.4440975189209, "global_step": 60101, "epoch": 724} {"train_loss": -19.919479370117188, "global_step": 60102, "epoch": 724} {"train_loss": -20.583724975585938, "global_step": 60103, "epoch": 724} {"train_loss": -20.474872589111328, "global_step": 60104, "epoch": 724} {"train_loss": -20.205108642578125, "global_step": 60105, "epoch": 724} {"train_loss": -20.570627212524414, "global_step": 60106, "epoch": 724} {"train_loss": -19.942075729370117, "global_step": 60107, "epoch": 724} {"train_loss": -20.714086532592773, "global_step": 60108, "epoch": 724} {"train_loss": -20.06144142150879, "global_step": 60109, "epoch": 724} {"train_loss": -20.146509170532227, "global_step": 60110, "epoch": 724} {"train_loss": -20.50337028503418, "global_step": 60111, "epoch": 724} {"train_loss": -20.616168975830078, "global_step": 60112, "epoch": 724} {"train_loss": -20.44560432434082, "global_step": 60113, "epoch": 724} {"train_loss": -20.26645851135254, "global_step": 60114, "epoch": 724} {"train_loss": -20.90863037109375, "global_step": 60115, "epoch": 724} {"train_loss": -20.222021102905273, "global_step": 60116, "epoch": 724} {"train_loss": -20.17718505859375, "global_step": 60117, "epoch": 724} {"train_loss": -20.7250919342041, "global_step": 60118, "epoch": 724} {"train_loss": -20.373016357421875, "global_step": 60119, "epoch": 724} {"train_loss": -20.64849281311035, "global_step": 60120, "epoch": 724} {"train_loss": -20.382598876953125, "global_step": 60121, "epoch": 724} {"train_loss": -20.821552276611328, "global_step": 60122, "epoch": 724} {"train_loss": -20.49057388305664, "global_step": 60123, "epoch": 724} {"train_loss": -20.175565719604492, "global_step": 60124, "epoch": 724} {"train_loss": -20.42216682434082, "global_step": 60125, "epoch": 724} {"train_loss": -20.3940486907959, "global_step": 60126, "epoch": 724} {"train_loss": -20.500938415527344, "global_step": 60127, "epoch": 724} {"train_loss": -20.383726119995117, "global_step": 60128, "epoch": 724} {"train_loss": -21.005281448364258, "global_step": 60129, "epoch": 724} {"train_loss": -20.444721221923828, "global_step": 60130, "epoch": 724} {"train_loss": -20.38626480102539, "global_step": 60131, "epoch": 724} {"train_loss": -20.358549118041992, "global_step": 60132, "epoch": 724} {"train_loss": -20.619375228881836, "global_step": 60133, "epoch": 724} {"train_loss": -20.467363357543945, "global_step": 60134, "epoch": 724} {"train_loss": -20.1923828125, "global_step": 60135, "epoch": 724} {"train_loss": -20.418350219726562, "global_step": 60136, "epoch": 724} {"train_loss": -20.447635650634766, "global_step": 60137, "epoch": 724} {"train_loss": -20.321073532104492, "global_step": 60138, "epoch": 724} {"train_loss": -20.490970611572266, "global_step": 60139, "epoch": 724} {"train_loss": -20.312408447265625, "global_step": 60140, "epoch": 724} {"train_loss": -20.61899757385254, "global_step": 60141, "epoch": 724} {"train_loss": -20.858722686767578, "global_step": 60142, "epoch": 724} {"train_loss": -20.176090240478516, "global_step": 60143, "epoch": 724} {"train_loss": -20.483341217041016, "global_step": 60144, "epoch": 724} {"train_loss": -20.589609146118164, "global_step": 60145, "epoch": 724} {"train_loss": -20.161359786987305, "global_step": 60146, "epoch": 724} {"train_loss": -20.238340377807617, "global_step": 60147, "epoch": 724} {"train_loss": -20.162870407104492, "global_step": 60148, "epoch": 724} {"train_loss": -20.321125030517578, "global_step": 60149, "epoch": 724} {"train_loss": -20.452102661132812, "global_step": 60150, "epoch": 724} {"train_loss": -20.19245719909668, "global_step": 60151, "epoch": 724} {"train_loss": -20.31201171875, "global_step": 60152, "epoch": 724} {"train_loss": -20.09725570678711, "global_step": 60153, "epoch": 724} {"train_loss": -20.204591751098633, "global_step": 60154, "epoch": 724} {"train_loss": -20.631940841674805, "global_step": 60155, "epoch": 724} {"train_loss": -20.221969604492188, "global_step": 60156, "epoch": 724} {"train_loss": -20.492691040039062, "global_step": 60157, "epoch": 724} {"train_loss": -20.116470336914062, "global_step": 60158, "epoch": 724} {"train_loss": -20.250280380249023, "global_step": 60159, "epoch": 724} {"train_loss": -20.501001358032227, "global_step": 60160, "epoch": 724} {"train_loss": -20.548297882080078, "global_step": 60161, "epoch": 724} {"train_loss": -20.48110008239746, "global_step": 60162, "epoch": 724} {"train_loss": -20.35843849182129, "global_step": 60163, "epoch": 724} {"train_loss": -20.337356567382812, "global_step": 60164, "epoch": 724} {"train_loss": -20.41834259033203, "global_step": 60165, "epoch": 724} {"train_loss": -20.627525329589844, "global_step": 60166, "epoch": 724} {"train_loss": -20.291532516479492, "global_step": 60167, "epoch": 724} {"train_loss": -20.299238204956055, "global_step": 60168, "epoch": 724} {"train_loss": -20.455808639526367, "global_step": 60169, "epoch": 724} {"train_loss": -20.3437557220459, "global_step": 60170, "epoch": 724} {"train_loss": -20.344017028808594, "global_step": 60171, "epoch": 724} {"train_loss": -20.5511474609375, "global_step": 60172, "epoch": 724} {"train_loss": -20.847402572631836, "global_step": 60173, "epoch": 724} {"train_loss": -20.409506740340266, "global_step": 60174, "epoch": 724, "val_loss": 5932644.0} {"train_loss": -20.220548629760742, "global_step": 60175, "epoch": 725} {"train_loss": -20.310073852539062, "global_step": 60176, "epoch": 725} {"train_loss": -20.018051147460938, "global_step": 60177, "epoch": 725} {"train_loss": -20.6130428314209, "global_step": 60178, "epoch": 725} {"train_loss": -20.162809371948242, "global_step": 60179, "epoch": 725} {"train_loss": -20.711523056030273, "global_step": 60180, "epoch": 725} {"train_loss": -20.574060440063477, "global_step": 60181, "epoch": 725} {"train_loss": -20.364450454711914, "global_step": 60182, "epoch": 725} {"train_loss": -20.037643432617188, "global_step": 60183, "epoch": 725} {"train_loss": -20.391992568969727, "global_step": 60184, "epoch": 725} {"train_loss": -20.259626388549805, "global_step": 60185, "epoch": 725} {"train_loss": -20.338376998901367, "global_step": 60186, "epoch": 725} {"train_loss": -19.763914108276367, "global_step": 60187, "epoch": 725} {"train_loss": -20.46430778503418, "global_step": 60188, "epoch": 725} {"train_loss": -20.61445426940918, "global_step": 60189, "epoch": 725} {"train_loss": -20.30833625793457, "global_step": 60190, "epoch": 725} {"train_loss": -20.46824073791504, "global_step": 60191, "epoch": 725} {"train_loss": -20.161359786987305, "global_step": 60192, "epoch": 725} {"train_loss": -20.589391708374023, "global_step": 60193, "epoch": 725} {"train_loss": -20.264310836791992, "global_step": 60194, "epoch": 725} {"train_loss": -20.491025924682617, "global_step": 60195, "epoch": 725} {"train_loss": -20.30370330810547, "global_step": 60196, "epoch": 725} {"train_loss": -20.479841232299805, "global_step": 60197, "epoch": 725} {"train_loss": -20.733243942260742, "global_step": 60198, "epoch": 725} {"train_loss": -20.167537689208984, "global_step": 60199, "epoch": 725} {"train_loss": -20.461400985717773, "global_step": 60200, "epoch": 725} {"train_loss": -20.665210723876953, "global_step": 60201, "epoch": 725} {"train_loss": -20.670835494995117, "global_step": 60202, "epoch": 725} {"train_loss": -20.438138961791992, "global_step": 60203, "epoch": 725} {"train_loss": -19.90483283996582, "global_step": 60204, "epoch": 725} {"train_loss": -20.563196182250977, "global_step": 60205, "epoch": 725} {"train_loss": -20.242904663085938, "global_step": 60206, "epoch": 725} {"train_loss": -20.615142822265625, "global_step": 60207, "epoch": 725} {"train_loss": -20.236936569213867, "global_step": 60208, "epoch": 725} {"train_loss": -20.22340965270996, "global_step": 60209, "epoch": 725} {"train_loss": -20.391651153564453, "global_step": 60210, "epoch": 725} {"train_loss": -19.849864959716797, "global_step": 60211, "epoch": 725} {"train_loss": -20.277318954467773, "global_step": 60212, "epoch": 725} {"train_loss": -20.25754165649414, "global_step": 60213, "epoch": 725} {"train_loss": -20.190244674682617, "global_step": 60214, "epoch": 725} {"train_loss": -20.3219051361084, "global_step": 60215, "epoch": 725} {"train_loss": -20.455265045166016, "global_step": 60216, "epoch": 725} {"train_loss": -20.083833694458008, "global_step": 60217, "epoch": 725} {"train_loss": -20.1986026763916, "global_step": 60218, "epoch": 725} {"train_loss": -20.489736557006836, "global_step": 60219, "epoch": 725} {"train_loss": -20.22037696838379, "global_step": 60220, "epoch": 725} {"train_loss": -20.232994079589844, "global_step": 60221, "epoch": 725} {"train_loss": -20.21380043029785, "global_step": 60222, "epoch": 725} {"train_loss": -20.34113121032715, "global_step": 60223, "epoch": 725} {"train_loss": -20.429365158081055, "global_step": 60224, "epoch": 725} {"train_loss": -20.371601104736328, "global_step": 60225, "epoch": 725} {"train_loss": -20.622434616088867, "global_step": 60226, "epoch": 725} {"train_loss": -20.209646224975586, "global_step": 60227, "epoch": 725} {"train_loss": -20.687015533447266, "global_step": 60228, "epoch": 725} {"train_loss": -20.216392517089844, "global_step": 60229, "epoch": 725} {"train_loss": -20.601537704467773, "global_step": 60230, "epoch": 725} {"train_loss": -20.644271850585938, "global_step": 60231, "epoch": 725} {"train_loss": -20.294641494750977, "global_step": 60232, "epoch": 725} {"train_loss": -20.53156852722168, "global_step": 60233, "epoch": 725} {"train_loss": -20.12798500061035, "global_step": 60234, "epoch": 725} {"train_loss": -20.285429000854492, "global_step": 60235, "epoch": 725} {"train_loss": -20.36832618713379, "global_step": 60236, "epoch": 725} {"train_loss": -20.518943786621094, "global_step": 60237, "epoch": 725} {"train_loss": -20.147968292236328, "global_step": 60238, "epoch": 725} {"train_loss": -19.93705940246582, "global_step": 60239, "epoch": 725} {"train_loss": -20.300168991088867, "global_step": 60240, "epoch": 725} {"train_loss": -20.304540634155273, "global_step": 60241, "epoch": 725} {"train_loss": -20.3524227142334, "global_step": 60242, "epoch": 725} {"train_loss": -20.3767147064209, "global_step": 60243, "epoch": 725} {"train_loss": -20.46405601501465, "global_step": 60244, "epoch": 725} {"train_loss": -20.402395248413086, "global_step": 60245, "epoch": 725} {"train_loss": -20.237886428833008, "global_step": 60246, "epoch": 725} {"train_loss": -20.549514770507812, "global_step": 60247, "epoch": 725} {"train_loss": -20.33883285522461, "global_step": 60248, "epoch": 725} {"train_loss": -20.49994468688965, "global_step": 60249, "epoch": 725} {"train_loss": -20.44998550415039, "global_step": 60250, "epoch": 725} {"train_loss": -20.5030517578125, "global_step": 60251, "epoch": 725} {"train_loss": -20.041812896728516, "global_step": 60252, "epoch": 725} {"train_loss": -20.479215621948242, "global_step": 60253, "epoch": 725} {"train_loss": -20.44024085998535, "global_step": 60254, "epoch": 725} {"train_loss": -20.194616317749023, "global_step": 60255, "epoch": 725} {"train_loss": -20.370140075683594, "global_step": 60256, "epoch": 725} {"train_loss": -20.35051113726145, "global_step": 60257, "epoch": 725, "val_loss": 6004520.0} {"train_loss": -20.114700317382812, "global_step": 60258, "epoch": 726} {"train_loss": -20.192502975463867, "global_step": 60259, "epoch": 726} {"train_loss": -20.266752243041992, "global_step": 60260, "epoch": 726} {"train_loss": -20.255802154541016, "global_step": 60261, "epoch": 726} {"train_loss": -20.6148681640625, "global_step": 60262, "epoch": 726} {"train_loss": -20.19432258605957, "global_step": 60263, "epoch": 726} {"train_loss": -20.176698684692383, "global_step": 60264, "epoch": 726} {"train_loss": -19.955392837524414, "global_step": 60265, "epoch": 726} {"train_loss": -20.527597427368164, "global_step": 60266, "epoch": 726} {"train_loss": -20.013229370117188, "global_step": 60267, "epoch": 726} {"train_loss": -20.423398971557617, "global_step": 60268, "epoch": 726} {"train_loss": -20.407018661499023, "global_step": 60269, "epoch": 726} {"train_loss": -20.3717041015625, "global_step": 60270, "epoch": 726} {"train_loss": -20.40992546081543, "global_step": 60271, "epoch": 726} {"train_loss": -20.2724666595459, "global_step": 60272, "epoch": 726} {"train_loss": -20.4965877532959, "global_step": 60273, "epoch": 726} {"train_loss": -20.063756942749023, "global_step": 60274, "epoch": 726} {"train_loss": -20.2453556060791, "global_step": 60275, "epoch": 726} {"train_loss": -20.614458084106445, "global_step": 60276, "epoch": 726} {"train_loss": -20.456058502197266, "global_step": 60277, "epoch": 726} {"train_loss": -20.6339168548584, "global_step": 60278, "epoch": 726} {"train_loss": -20.535263061523438, "global_step": 60279, "epoch": 726} {"train_loss": -20.92804527282715, "global_step": 60280, "epoch": 726} {"train_loss": -20.14383888244629, "global_step": 60281, "epoch": 726} {"train_loss": -20.790836334228516, "global_step": 60282, "epoch": 726} {"train_loss": -20.506254196166992, "global_step": 60283, "epoch": 726} {"train_loss": -20.052717208862305, "global_step": 60284, "epoch": 726} {"train_loss": -20.44350242614746, "global_step": 60285, "epoch": 726} {"train_loss": -20.455310821533203, "global_step": 60286, "epoch": 726} {"train_loss": -20.238813400268555, "global_step": 60287, "epoch": 726} {"train_loss": -20.332292556762695, "global_step": 60288, "epoch": 726} {"train_loss": -20.616281509399414, "global_step": 60289, "epoch": 726} {"train_loss": -20.27254295349121, "global_step": 60290, "epoch": 726} {"train_loss": -20.698917388916016, "global_step": 60291, "epoch": 726} {"train_loss": -20.098817825317383, "global_step": 60292, "epoch": 726} {"train_loss": -20.105100631713867, "global_step": 60293, "epoch": 726} {"train_loss": -20.541181564331055, "global_step": 60294, "epoch": 726} {"train_loss": -20.584781646728516, "global_step": 60295, "epoch": 726} {"train_loss": -20.732492446899414, "global_step": 60296, "epoch": 726} {"train_loss": -20.199813842773438, "global_step": 60297, "epoch": 726} {"train_loss": -20.25520896911621, "global_step": 60298, "epoch": 726} {"train_loss": -20.41019058227539, "global_step": 60299, "epoch": 726} {"train_loss": -20.256168365478516, "global_step": 60300, "epoch": 726} {"train_loss": -19.986963272094727, "global_step": 60301, "epoch": 726} {"train_loss": -20.490985870361328, "global_step": 60302, "epoch": 726} {"train_loss": -20.095794677734375, "global_step": 60303, "epoch": 726} {"train_loss": -20.05979347229004, "global_step": 60304, "epoch": 726} {"train_loss": -20.16659164428711, "global_step": 60305, "epoch": 726} {"train_loss": -20.038179397583008, "global_step": 60306, "epoch": 726} {"train_loss": -20.442527770996094, "global_step": 60307, "epoch": 726} {"train_loss": -20.422292709350586, "global_step": 60308, "epoch": 726} {"train_loss": -20.42694664001465, "global_step": 60309, "epoch": 726} {"train_loss": -20.469892501831055, "global_step": 60310, "epoch": 726} {"train_loss": -20.423215866088867, "global_step": 60311, "epoch": 726} {"train_loss": -20.471351623535156, "global_step": 60312, "epoch": 726} {"train_loss": -20.191089630126953, "global_step": 60313, "epoch": 726} {"train_loss": -20.62255859375, "global_step": 60314, "epoch": 726} {"train_loss": -20.16497230529785, "global_step": 60315, "epoch": 726} {"train_loss": -19.93593978881836, "global_step": 60316, "epoch": 726} {"train_loss": -20.420867919921875, "global_step": 60317, "epoch": 726} {"train_loss": -20.685285568237305, "global_step": 60318, "epoch": 726} {"train_loss": -20.3629207611084, "global_step": 60319, "epoch": 726} {"train_loss": -20.506162643432617, "global_step": 60320, "epoch": 726} {"train_loss": -20.436670303344727, "global_step": 60321, "epoch": 726} {"train_loss": -20.509197235107422, "global_step": 60322, "epoch": 726} {"train_loss": -20.418973922729492, "global_step": 60323, "epoch": 726} {"train_loss": -20.430652618408203, "global_step": 60324, "epoch": 726} {"train_loss": -20.259546279907227, "global_step": 60325, "epoch": 726} {"train_loss": -20.34403419494629, "global_step": 60326, "epoch": 726} {"train_loss": -20.1366024017334, "global_step": 60327, "epoch": 726} {"train_loss": -20.55829429626465, "global_step": 60328, "epoch": 726} {"train_loss": -20.56095314025879, "global_step": 60329, "epoch": 726} {"train_loss": -20.108495712280273, "global_step": 60330, "epoch": 726} {"train_loss": -20.242435455322266, "global_step": 60331, "epoch": 726} {"train_loss": -20.839845657348633, "global_step": 60332, "epoch": 726} {"train_loss": -20.582229614257812, "global_step": 60333, "epoch": 726} {"train_loss": -20.34765625, "global_step": 60334, "epoch": 726} {"train_loss": -20.5229549407959, "global_step": 60335, "epoch": 726} {"train_loss": -20.528024673461914, "global_step": 60336, "epoch": 726} {"train_loss": -20.68500328063965, "global_step": 60337, "epoch": 726} {"train_loss": -20.93478775024414, "global_step": 60338, "epoch": 726} {"train_loss": -20.205820083618164, "global_step": 60339, "epoch": 726} {"train_loss": -20.400948604905462, "global_step": 60340, "epoch": 726, "val_loss": 5870624.0} {"train_loss": -20.136260986328125, "global_step": 60341, "epoch": 727} {"train_loss": -20.010610580444336, "global_step": 60342, "epoch": 727} {"train_loss": -20.02431297302246, "global_step": 60343, "epoch": 727} {"train_loss": -20.503381729125977, "global_step": 60344, "epoch": 727} {"train_loss": -20.565183639526367, "global_step": 60345, "epoch": 727} {"train_loss": -20.324247360229492, "global_step": 60346, "epoch": 727} {"train_loss": -19.841562271118164, "global_step": 60347, "epoch": 727} {"train_loss": -20.09722328186035, "global_step": 60348, "epoch": 727} {"train_loss": -20.076744079589844, "global_step": 60349, "epoch": 727} {"train_loss": -20.38860321044922, "global_step": 60350, "epoch": 727} {"train_loss": -19.686574935913086, "global_step": 60351, "epoch": 727} {"train_loss": -20.054668426513672, "global_step": 60352, "epoch": 727} {"train_loss": -20.53330421447754, "global_step": 60353, "epoch": 727} {"train_loss": -20.309364318847656, "global_step": 60354, "epoch": 727} {"train_loss": -20.413818359375, "global_step": 60355, "epoch": 727} {"train_loss": -20.203462600708008, "global_step": 60356, "epoch": 727} {"train_loss": -20.159652709960938, "global_step": 60357, "epoch": 727} {"train_loss": -20.265588760375977, "global_step": 60358, "epoch": 727} {"train_loss": -20.65228843688965, "global_step": 60359, "epoch": 727} {"train_loss": -20.331954956054688, "global_step": 60360, "epoch": 727} {"train_loss": -20.455291748046875, "global_step": 60361, "epoch": 727} {"train_loss": -20.420177459716797, "global_step": 60362, "epoch": 727} {"train_loss": -20.540618896484375, "global_step": 60363, "epoch": 727} {"train_loss": -20.585161209106445, "global_step": 60364, "epoch": 727} {"train_loss": -20.6416072845459, "global_step": 60365, "epoch": 727} {"train_loss": -20.185916900634766, "global_step": 60366, "epoch": 727} {"train_loss": -20.749454498291016, "global_step": 60367, "epoch": 727} {"train_loss": -20.32362174987793, "global_step": 60368, "epoch": 727} {"train_loss": -20.02510643005371, "global_step": 60369, "epoch": 727} {"train_loss": -20.212194442749023, "global_step": 60370, "epoch": 727} {"train_loss": -20.497804641723633, "global_step": 60371, "epoch": 727} {"train_loss": -20.390960693359375, "global_step": 60372, "epoch": 727} {"train_loss": -20.675968170166016, "global_step": 60373, "epoch": 727} {"train_loss": -20.29878807067871, "global_step": 60374, "epoch": 727} {"train_loss": -20.210886001586914, "global_step": 60375, "epoch": 727} {"train_loss": -20.299476623535156, "global_step": 60376, "epoch": 727} {"train_loss": -20.588098526000977, "global_step": 60377, "epoch": 727} {"train_loss": -20.549434661865234, "global_step": 60378, "epoch": 727} {"train_loss": -20.436370849609375, "global_step": 60379, "epoch": 727} {"train_loss": -20.01187515258789, "global_step": 60380, "epoch": 727} {"train_loss": -20.246051788330078, "global_step": 60381, "epoch": 727} {"train_loss": -19.9646053314209, "global_step": 60382, "epoch": 727} {"train_loss": -20.739946365356445, "global_step": 60383, "epoch": 727} {"train_loss": -20.24724769592285, "global_step": 60384, "epoch": 727} {"train_loss": -20.418540954589844, "global_step": 60385, "epoch": 727} {"train_loss": -20.379779815673828, "global_step": 60386, "epoch": 727} {"train_loss": -20.42806625366211, "global_step": 60387, "epoch": 727} {"train_loss": -20.217702865600586, "global_step": 60388, "epoch": 727} {"train_loss": -20.946321487426758, "global_step": 60389, "epoch": 727} {"train_loss": -20.258358001708984, "global_step": 60390, "epoch": 727} {"train_loss": -20.23990249633789, "global_step": 60391, "epoch": 727} {"train_loss": -20.435684204101562, "global_step": 60392, "epoch": 727} {"train_loss": -20.49909019470215, "global_step": 60393, "epoch": 727} {"train_loss": -20.375595092773438, "global_step": 60394, "epoch": 727} {"train_loss": -20.035797119140625, "global_step": 60395, "epoch": 727} {"train_loss": -20.059736251831055, "global_step": 60396, "epoch": 727} {"train_loss": -20.57733154296875, "global_step": 60397, "epoch": 727} {"train_loss": -20.283550262451172, "global_step": 60398, "epoch": 727} {"train_loss": -19.91998863220215, "global_step": 60399, "epoch": 727} {"train_loss": -20.318744659423828, "global_step": 60400, "epoch": 727} {"train_loss": -20.266202926635742, "global_step": 60401, "epoch": 727} {"train_loss": -20.34583854675293, "global_step": 60402, "epoch": 727} {"train_loss": -20.8559513092041, "global_step": 60403, "epoch": 727} {"train_loss": -20.466238021850586, "global_step": 60404, "epoch": 727} {"train_loss": -20.68427085876465, "global_step": 60405, "epoch": 727} {"train_loss": -20.52997398376465, "global_step": 60406, "epoch": 727} {"train_loss": -19.87225914001465, "global_step": 60407, "epoch": 727} {"train_loss": -20.148408889770508, "global_step": 60408, "epoch": 727} {"train_loss": -20.78603744506836, "global_step": 60409, "epoch": 727} {"train_loss": -20.435781478881836, "global_step": 60410, "epoch": 727} {"train_loss": -20.11161231994629, "global_step": 60411, "epoch": 727} {"train_loss": -20.574960708618164, "global_step": 60412, "epoch": 727} {"train_loss": -20.119457244873047, "global_step": 60413, "epoch": 727} {"train_loss": -20.748838424682617, "global_step": 60414, "epoch": 727} {"train_loss": -20.70920181274414, "global_step": 60415, "epoch": 727} {"train_loss": -20.377561569213867, "global_step": 60416, "epoch": 727} {"train_loss": -20.592802047729492, "global_step": 60417, "epoch": 727} {"train_loss": -20.263086318969727, "global_step": 60418, "epoch": 727} {"train_loss": -20.7111873626709, "global_step": 60419, "epoch": 727} {"train_loss": -20.321500778198242, "global_step": 60420, "epoch": 727} {"train_loss": -20.070056915283203, "global_step": 60421, "epoch": 727} {"train_loss": -20.039369583129883, "global_step": 60422, "epoch": 727} {"train_loss": -20.349702881043214, "global_step": 60423, "epoch": 727, "val_loss": 6036057.5} {"train_loss": -19.42916488647461, "global_step": 60424, "epoch": 728} {"train_loss": -19.911197662353516, "global_step": 60425, "epoch": 728} {"train_loss": -20.35689353942871, "global_step": 60426, "epoch": 728} {"train_loss": -19.658781051635742, "global_step": 60427, "epoch": 728} {"train_loss": -20.33688735961914, "global_step": 60428, "epoch": 728} {"train_loss": -20.389982223510742, "global_step": 60429, "epoch": 728} {"train_loss": -20.379941940307617, "global_step": 60430, "epoch": 728} {"train_loss": -20.135488510131836, "global_step": 60431, "epoch": 728} {"train_loss": -20.247732162475586, "global_step": 60432, "epoch": 728} {"train_loss": -20.08367347717285, "global_step": 60433, "epoch": 728} {"train_loss": -20.008811950683594, "global_step": 60434, "epoch": 728} {"train_loss": -20.284698486328125, "global_step": 60435, "epoch": 728} {"train_loss": -20.353473663330078, "global_step": 60436, "epoch": 728} {"train_loss": -19.971240997314453, "global_step": 60437, "epoch": 728} {"train_loss": -20.253164291381836, "global_step": 60438, "epoch": 728} {"train_loss": -20.544784545898438, "global_step": 60439, "epoch": 728} {"train_loss": -20.22531509399414, "global_step": 60440, "epoch": 728} {"train_loss": -20.61923599243164, "global_step": 60441, "epoch": 728} {"train_loss": -20.07436180114746, "global_step": 60442, "epoch": 728} {"train_loss": -20.317182540893555, "global_step": 60443, "epoch": 728} {"train_loss": -20.67025375366211, "global_step": 60444, "epoch": 728} {"train_loss": -20.42048454284668, "global_step": 60445, "epoch": 728} {"train_loss": -20.124940872192383, "global_step": 60446, "epoch": 728} {"train_loss": -20.532297134399414, "global_step": 60447, "epoch": 728} {"train_loss": -20.322860717773438, "global_step": 60448, "epoch": 728} {"train_loss": -20.589601516723633, "global_step": 60449, "epoch": 728} {"train_loss": -20.17810821533203, "global_step": 60450, "epoch": 728} {"train_loss": -20.90899085998535, "global_step": 60451, "epoch": 728} {"train_loss": -20.138965606689453, "global_step": 60452, "epoch": 728} {"train_loss": -20.67690086364746, "global_step": 60453, "epoch": 728} {"train_loss": -20.452478408813477, "global_step": 60454, "epoch": 728} {"train_loss": -20.57021713256836, "global_step": 60455, "epoch": 728} {"train_loss": -20.331716537475586, "global_step": 60456, "epoch": 728} {"train_loss": -20.50119972229004, "global_step": 60457, "epoch": 728} {"train_loss": -20.635021209716797, "global_step": 60458, "epoch": 728} {"train_loss": -20.54514503479004, "global_step": 60459, "epoch": 728} {"train_loss": -20.62578010559082, "global_step": 60460, "epoch": 728} {"train_loss": -20.49942398071289, "global_step": 60461, "epoch": 728} {"train_loss": -20.199277877807617, "global_step": 60462, "epoch": 728} {"train_loss": -20.349897384643555, "global_step": 60463, "epoch": 728} {"train_loss": -20.394392013549805, "global_step": 60464, "epoch": 728} {"train_loss": -20.409061431884766, "global_step": 60465, "epoch": 728} {"train_loss": -20.50739860534668, "global_step": 60466, "epoch": 728} {"train_loss": -20.23862075805664, "global_step": 60467, "epoch": 728} {"train_loss": -20.390724182128906, "global_step": 60468, "epoch": 728} {"train_loss": -20.379297256469727, "global_step": 60469, "epoch": 728} {"train_loss": -20.49399757385254, "global_step": 60470, "epoch": 728} {"train_loss": -20.488405227661133, "global_step": 60471, "epoch": 728} {"train_loss": -20.43361473083496, "global_step": 60472, "epoch": 728} {"train_loss": -20.432233810424805, "global_step": 60473, "epoch": 728} {"train_loss": -20.86767578125, "global_step": 60474, "epoch": 728} {"train_loss": -20.074827194213867, "global_step": 60475, "epoch": 728} {"train_loss": -20.135543823242188, "global_step": 60476, "epoch": 728} {"train_loss": -20.494998931884766, "global_step": 60477, "epoch": 728} {"train_loss": -20.87858009338379, "global_step": 60478, "epoch": 728} {"train_loss": -20.3966121673584, "global_step": 60479, "epoch": 728} {"train_loss": -20.2238826751709, "global_step": 60480, "epoch": 728} {"train_loss": -20.381500244140625, "global_step": 60481, "epoch": 728} {"train_loss": -20.510360717773438, "global_step": 60482, "epoch": 728} {"train_loss": -20.231687545776367, "global_step": 60483, "epoch": 728} {"train_loss": -20.784561157226562, "global_step": 60484, "epoch": 728} {"train_loss": -20.46889305114746, "global_step": 60485, "epoch": 728} {"train_loss": -20.15907859802246, "global_step": 60486, "epoch": 728} {"train_loss": -20.094114303588867, "global_step": 60487, "epoch": 728} {"train_loss": -20.495845794677734, "global_step": 60488, "epoch": 728} {"train_loss": -20.32950782775879, "global_step": 60489, "epoch": 728} {"train_loss": -20.335678100585938, "global_step": 60490, "epoch": 728} {"train_loss": -20.253299713134766, "global_step": 60491, "epoch": 728} {"train_loss": -20.077280044555664, "global_step": 60492, "epoch": 728} {"train_loss": -20.2061767578125, "global_step": 60493, "epoch": 728} {"train_loss": -20.275333404541016, "global_step": 60494, "epoch": 728} {"train_loss": -20.423709869384766, "global_step": 60495, "epoch": 728} {"train_loss": -19.551748275756836, "global_step": 60496, "epoch": 728} {"train_loss": -20.394384384155273, "global_step": 60497, "epoch": 728} {"train_loss": -20.251821517944336, "global_step": 60498, "epoch": 728} {"train_loss": -20.50404167175293, "global_step": 60499, "epoch": 728} {"train_loss": -20.38765525817871, "global_step": 60500, "epoch": 728} {"train_loss": -20.32954978942871, "global_step": 60501, "epoch": 728} {"train_loss": -20.1016902923584, "global_step": 60502, "epoch": 728} {"train_loss": -20.30791664123535, "global_step": 60503, "epoch": 728} {"train_loss": -20.665576934814453, "global_step": 60504, "epoch": 728} {"train_loss": -20.178136825561523, "global_step": 60505, "epoch": 728} {"train_loss": -20.325332067098962, "global_step": 60506, "epoch": 728, "val_loss": 5946560.5} {"train_loss": -20.374948501586914, "global_step": 60507, "epoch": 729} {"train_loss": -20.129507064819336, "global_step": 60508, "epoch": 729} {"train_loss": -19.662328720092773, "global_step": 60509, "epoch": 729} {"train_loss": -19.759069442749023, "global_step": 60510, "epoch": 729} {"train_loss": -19.99911117553711, "global_step": 60511, "epoch": 729} {"train_loss": -19.758176803588867, "global_step": 60512, "epoch": 729} {"train_loss": -20.28651237487793, "global_step": 60513, "epoch": 729} {"train_loss": -20.16084861755371, "global_step": 60514, "epoch": 729} {"train_loss": -19.968854904174805, "global_step": 60515, "epoch": 729} {"train_loss": -20.356948852539062, "global_step": 60516, "epoch": 729} {"train_loss": -20.34051513671875, "global_step": 60517, "epoch": 729} {"train_loss": -20.254056930541992, "global_step": 60518, "epoch": 729} {"train_loss": -19.87018394470215, "global_step": 60519, "epoch": 729} {"train_loss": -20.435882568359375, "global_step": 60520, "epoch": 729} {"train_loss": -20.393112182617188, "global_step": 60521, "epoch": 729} {"train_loss": -20.288188934326172, "global_step": 60522, "epoch": 729} {"train_loss": -20.191530227661133, "global_step": 60523, "epoch": 729} {"train_loss": -19.72078514099121, "global_step": 60524, "epoch": 729} {"train_loss": -20.229127883911133, "global_step": 60525, "epoch": 729} {"train_loss": -20.490673065185547, "global_step": 60526, "epoch": 729} {"train_loss": -19.75835418701172, "global_step": 60527, "epoch": 729} {"train_loss": -20.357229232788086, "global_step": 60528, "epoch": 729} {"train_loss": -20.187192916870117, "global_step": 60529, "epoch": 729} {"train_loss": -20.060632705688477, "global_step": 60530, "epoch": 729} {"train_loss": -20.461652755737305, "global_step": 60531, "epoch": 729} {"train_loss": -20.269243240356445, "global_step": 60532, "epoch": 729} {"train_loss": -20.184951782226562, "global_step": 60533, "epoch": 729} {"train_loss": -20.501379013061523, "global_step": 60534, "epoch": 729} {"train_loss": -20.424331665039062, "global_step": 60535, "epoch": 729} {"train_loss": -20.590457916259766, "global_step": 60536, "epoch": 729} {"train_loss": -20.8243408203125, "global_step": 60537, "epoch": 729} {"train_loss": -20.319128036499023, "global_step": 60538, "epoch": 729} {"train_loss": -20.589229583740234, "global_step": 60539, "epoch": 729} {"train_loss": -20.276472091674805, "global_step": 60540, "epoch": 729} {"train_loss": -19.892820358276367, "global_step": 60541, "epoch": 729} {"train_loss": -20.568159103393555, "global_step": 60542, "epoch": 729} {"train_loss": -20.228471755981445, "global_step": 60543, "epoch": 729} {"train_loss": -20.25204849243164, "global_step": 60544, "epoch": 729} {"train_loss": -20.334257125854492, "global_step": 60545, "epoch": 729} {"train_loss": -20.200265884399414, "global_step": 60546, "epoch": 729} {"train_loss": -20.57481575012207, "global_step": 60547, "epoch": 729} {"train_loss": -20.12727928161621, "global_step": 60548, "epoch": 729} {"train_loss": -20.2153377532959, "global_step": 60549, "epoch": 729} {"train_loss": -20.299833297729492, "global_step": 60550, "epoch": 729} {"train_loss": -20.594968795776367, "global_step": 60551, "epoch": 729} {"train_loss": -20.79927635192871, "global_step": 60552, "epoch": 729} {"train_loss": -20.14408302307129, "global_step": 60553, "epoch": 729} {"train_loss": -20.266971588134766, "global_step": 60554, "epoch": 729} {"train_loss": -20.202131271362305, "global_step": 60555, "epoch": 729} {"train_loss": -20.37334632873535, "global_step": 60556, "epoch": 729} {"train_loss": -20.400001525878906, "global_step": 60557, "epoch": 729} {"train_loss": -19.91384506225586, "global_step": 60558, "epoch": 729} {"train_loss": -20.724721908569336, "global_step": 60559, "epoch": 729} {"train_loss": -20.451770782470703, "global_step": 60560, "epoch": 729} {"train_loss": -20.291820526123047, "global_step": 60561, "epoch": 729} {"train_loss": -20.05274200439453, "global_step": 60562, "epoch": 729} {"train_loss": -20.459638595581055, "global_step": 60563, "epoch": 729} {"train_loss": -20.53205680847168, "global_step": 60564, "epoch": 729} {"train_loss": -20.760099411010742, "global_step": 60565, "epoch": 729} {"train_loss": -20.402475357055664, "global_step": 60566, "epoch": 729} {"train_loss": -20.582813262939453, "global_step": 60567, "epoch": 729} {"train_loss": -20.846920013427734, "global_step": 60568, "epoch": 729} {"train_loss": -20.664566040039062, "global_step": 60569, "epoch": 729} {"train_loss": -20.63001823425293, "global_step": 60570, "epoch": 729} {"train_loss": -20.378530502319336, "global_step": 60571, "epoch": 729} {"train_loss": -20.290302276611328, "global_step": 60572, "epoch": 729} {"train_loss": -20.36182975769043, "global_step": 60573, "epoch": 729} {"train_loss": -20.343170166015625, "global_step": 60574, "epoch": 729} {"train_loss": -20.530364990234375, "global_step": 60575, "epoch": 729} {"train_loss": -20.827211380004883, "global_step": 60576, "epoch": 729} {"train_loss": -20.841907501220703, "global_step": 60577, "epoch": 729} {"train_loss": -20.883520126342773, "global_step": 60578, "epoch": 729} {"train_loss": -20.259307861328125, "global_step": 60579, "epoch": 729} {"train_loss": -20.41927719116211, "global_step": 60580, "epoch": 729} {"train_loss": -20.599382400512695, "global_step": 60581, "epoch": 729} {"train_loss": -20.734174728393555, "global_step": 60582, "epoch": 729} {"train_loss": -20.063812255859375, "global_step": 60583, "epoch": 729} {"train_loss": -20.678525924682617, "global_step": 60584, "epoch": 729} {"train_loss": -20.367448806762695, "global_step": 60585, "epoch": 729} {"train_loss": -20.66520118713379, "global_step": 60586, "epoch": 729} {"train_loss": -20.32588768005371, "global_step": 60587, "epoch": 729} {"train_loss": -20.40359878540039, "global_step": 60588, "epoch": 729} {"train_loss": -20.336103301450432, "global_step": 60589, "epoch": 729, "val_loss": 5980615.5} {"train_loss": -20.04622459411621, "global_step": 60590, "epoch": 730} {"train_loss": -20.50955581665039, "global_step": 60591, "epoch": 730} {"train_loss": -20.50007438659668, "global_step": 60592, "epoch": 730} {"train_loss": -20.01080322265625, "global_step": 60593, "epoch": 730} {"train_loss": -20.314395904541016, "global_step": 60594, "epoch": 730} {"train_loss": -20.3426570892334, "global_step": 60595, "epoch": 730} {"train_loss": -20.220020294189453, "global_step": 60596, "epoch": 730} {"train_loss": -20.479429244995117, "global_step": 60597, "epoch": 730} {"train_loss": -20.199724197387695, "global_step": 60598, "epoch": 730} {"train_loss": -20.371679306030273, "global_step": 60599, "epoch": 730} {"train_loss": -20.206327438354492, "global_step": 60600, "epoch": 730} {"train_loss": -20.281503677368164, "global_step": 60601, "epoch": 730} {"train_loss": -20.22327995300293, "global_step": 60602, "epoch": 730} {"train_loss": -20.668466567993164, "global_step": 60603, "epoch": 730} {"train_loss": -20.487272262573242, "global_step": 60604, "epoch": 730} {"train_loss": -20.601062774658203, "global_step": 60605, "epoch": 730} {"train_loss": -20.5310115814209, "global_step": 60606, "epoch": 730} {"train_loss": -20.266706466674805, "global_step": 60607, "epoch": 730} {"train_loss": -20.66412353515625, "global_step": 60608, "epoch": 730} {"train_loss": -20.540237426757812, "global_step": 60609, "epoch": 730} {"train_loss": -19.962331771850586, "global_step": 60610, "epoch": 730} {"train_loss": -20.463787078857422, "global_step": 60611, "epoch": 730} {"train_loss": -20.519378662109375, "global_step": 60612, "epoch": 730} {"train_loss": -20.29543113708496, "global_step": 60613, "epoch": 730} {"train_loss": -20.506855010986328, "global_step": 60614, "epoch": 730} {"train_loss": -20.67176628112793, "global_step": 60615, "epoch": 730} {"train_loss": -20.16977882385254, "global_step": 60616, "epoch": 730} {"train_loss": -20.126419067382812, "global_step": 60617, "epoch": 730} {"train_loss": -20.313888549804688, "global_step": 60618, "epoch": 730} {"train_loss": -20.762664794921875, "global_step": 60619, "epoch": 730} {"train_loss": -20.516109466552734, "global_step": 60620, "epoch": 730} {"train_loss": -20.401336669921875, "global_step": 60621, "epoch": 730} {"train_loss": -20.47993278503418, "global_step": 60622, "epoch": 730} {"train_loss": -20.518890380859375, "global_step": 60623, "epoch": 730} {"train_loss": -20.20658302307129, "global_step": 60624, "epoch": 730} {"train_loss": -20.49627685546875, "global_step": 60625, "epoch": 730} {"train_loss": -19.999406814575195, "global_step": 60626, "epoch": 730} {"train_loss": -20.33089828491211, "global_step": 60627, "epoch": 730} {"train_loss": -20.67432975769043, "global_step": 60628, "epoch": 730} {"train_loss": -20.580129623413086, "global_step": 60629, "epoch": 730} {"train_loss": -20.639846801757812, "global_step": 60630, "epoch": 730} {"train_loss": -20.563936233520508, "global_step": 60631, "epoch": 730} {"train_loss": -20.360187530517578, "global_step": 60632, "epoch": 730} {"train_loss": -20.260009765625, "global_step": 60633, "epoch": 730} {"train_loss": -20.752256393432617, "global_step": 60634, "epoch": 730} {"train_loss": -20.241300582885742, "global_step": 60635, "epoch": 730} {"train_loss": -20.13275718688965, "global_step": 60636, "epoch": 730} {"train_loss": -20.261152267456055, "global_step": 60637, "epoch": 730} {"train_loss": -21.07990264892578, "global_step": 60638, "epoch": 730} {"train_loss": -20.786243438720703, "global_step": 60639, "epoch": 730} {"train_loss": -20.55891227722168, "global_step": 60640, "epoch": 730} {"train_loss": -20.5445556640625, "global_step": 60641, "epoch": 730} {"train_loss": -20.22629737854004, "global_step": 60642, "epoch": 730} {"train_loss": -20.47612953186035, "global_step": 60643, "epoch": 730} {"train_loss": -20.645505905151367, "global_step": 60644, "epoch": 730} {"train_loss": -20.44511604309082, "global_step": 60645, "epoch": 730} {"train_loss": -20.22821617126465, "global_step": 60646, "epoch": 730} {"train_loss": -20.589452743530273, "global_step": 60647, "epoch": 730} {"train_loss": -20.42038917541504, "global_step": 60648, "epoch": 730} {"train_loss": -20.511770248413086, "global_step": 60649, "epoch": 730} {"train_loss": -20.455718994140625, "global_step": 60650, "epoch": 730} {"train_loss": -20.36604118347168, "global_step": 60651, "epoch": 730} {"train_loss": -20.735445022583008, "global_step": 60652, "epoch": 730} {"train_loss": -20.293376922607422, "global_step": 60653, "epoch": 730} {"train_loss": -20.713512420654297, "global_step": 60654, "epoch": 730} {"train_loss": -20.664480209350586, "global_step": 60655, "epoch": 730} {"train_loss": -20.35371971130371, "global_step": 60656, "epoch": 730} {"train_loss": -20.60429573059082, "global_step": 60657, "epoch": 730} {"train_loss": -20.742279052734375, "global_step": 60658, "epoch": 730} {"train_loss": -20.50181770324707, "global_step": 60659, "epoch": 730} {"train_loss": -20.149694442749023, "global_step": 60660, "epoch": 730} {"train_loss": -20.406112670898438, "global_step": 60661, "epoch": 730} {"train_loss": -20.373916625976562, "global_step": 60662, "epoch": 730} {"train_loss": -20.1925106048584, "global_step": 60663, "epoch": 730} {"train_loss": -20.809642791748047, "global_step": 60664, "epoch": 730} {"train_loss": -20.474348068237305, "global_step": 60665, "epoch": 730} {"train_loss": -20.431074142456055, "global_step": 60666, "epoch": 730} {"train_loss": -20.4129695892334, "global_step": 60667, "epoch": 730} {"train_loss": -20.05974769592285, "global_step": 60668, "epoch": 730} {"train_loss": -20.55076026916504, "global_step": 60669, "epoch": 730} {"train_loss": -20.338193893432617, "global_step": 60670, "epoch": 730} {"train_loss": -20.41275978088379, "global_step": 60671, "epoch": 730} {"train_loss": -20.420316902987928, "global_step": 60672, "epoch": 730, "val_loss": 5879161.0} {"train_loss": -20.15607261657715, "global_step": 60673, "epoch": 731} {"train_loss": -20.283933639526367, "global_step": 60674, "epoch": 731} {"train_loss": -19.71681022644043, "global_step": 60675, "epoch": 731} {"train_loss": -20.30694007873535, "global_step": 60676, "epoch": 731} {"train_loss": -20.25177574157715, "global_step": 60677, "epoch": 731} {"train_loss": -20.080137252807617, "global_step": 60678, "epoch": 731} {"train_loss": -20.33914566040039, "global_step": 60679, "epoch": 731} {"train_loss": -20.527481079101562, "global_step": 60680, "epoch": 731} {"train_loss": -20.24848747253418, "global_step": 60681, "epoch": 731} {"train_loss": -20.482654571533203, "global_step": 60682, "epoch": 731} {"train_loss": -20.473342895507812, "global_step": 60683, "epoch": 731} {"train_loss": -20.63775062561035, "global_step": 60684, "epoch": 731} {"train_loss": -20.374347686767578, "global_step": 60685, "epoch": 731} {"train_loss": -20.59199333190918, "global_step": 60686, "epoch": 731} {"train_loss": -20.196701049804688, "global_step": 60687, "epoch": 731} {"train_loss": -20.729055404663086, "global_step": 60688, "epoch": 731} {"train_loss": -20.379535675048828, "global_step": 60689, "epoch": 731} {"train_loss": -19.969812393188477, "global_step": 60690, "epoch": 731} {"train_loss": -20.566940307617188, "global_step": 60691, "epoch": 731} {"train_loss": -20.531579971313477, "global_step": 60692, "epoch": 731} {"train_loss": -20.476287841796875, "global_step": 60693, "epoch": 731} {"train_loss": -20.27878189086914, "global_step": 60694, "epoch": 731} {"train_loss": -20.495912551879883, "global_step": 60695, "epoch": 731} {"train_loss": -20.438709259033203, "global_step": 60696, "epoch": 731} {"train_loss": -20.587703704833984, "global_step": 60697, "epoch": 731} {"train_loss": -20.61051368713379, "global_step": 60698, "epoch": 731} {"train_loss": -20.5477352142334, "global_step": 60699, "epoch": 731} {"train_loss": -20.468168258666992, "global_step": 60700, "epoch": 731} {"train_loss": -20.763017654418945, "global_step": 60701, "epoch": 731} {"train_loss": -20.724416732788086, "global_step": 60702, "epoch": 731} {"train_loss": -20.597232818603516, "global_step": 60703, "epoch": 731} {"train_loss": -20.552961349487305, "global_step": 60704, "epoch": 731} {"train_loss": -20.6446533203125, "global_step": 60705, "epoch": 731} {"train_loss": -20.194616317749023, "global_step": 60706, "epoch": 731} {"train_loss": -20.464496612548828, "global_step": 60707, "epoch": 731} {"train_loss": -20.33754539489746, "global_step": 60708, "epoch": 731} {"train_loss": -20.418270111083984, "global_step": 60709, "epoch": 731} {"train_loss": -20.3813419342041, "global_step": 60710, "epoch": 731} {"train_loss": -20.348020553588867, "global_step": 60711, "epoch": 731} {"train_loss": -20.615758895874023, "global_step": 60712, "epoch": 731} {"train_loss": -20.6890869140625, "global_step": 60713, "epoch": 731} {"train_loss": -20.392568588256836, "global_step": 60714, "epoch": 731} {"train_loss": -20.493783950805664, "global_step": 60715, "epoch": 731} {"train_loss": -20.53314208984375, "global_step": 60716, "epoch": 731} {"train_loss": -20.328418731689453, "global_step": 60717, "epoch": 731} {"train_loss": -20.54119300842285, "global_step": 60718, "epoch": 731} {"train_loss": -20.508914947509766, "global_step": 60719, "epoch": 731} {"train_loss": -20.324771881103516, "global_step": 60720, "epoch": 731} {"train_loss": -20.618940353393555, "global_step": 60721, "epoch": 731} {"train_loss": -20.498014450073242, "global_step": 60722, "epoch": 731} {"train_loss": -20.72244644165039, "global_step": 60723, "epoch": 731} {"train_loss": -20.183246612548828, "global_step": 60724, "epoch": 731} {"train_loss": -20.079574584960938, "global_step": 60725, "epoch": 731} {"train_loss": -20.421375274658203, "global_step": 60726, "epoch": 731} {"train_loss": -20.16953468322754, "global_step": 60727, "epoch": 731} {"train_loss": -19.981698989868164, "global_step": 60728, "epoch": 731} {"train_loss": -20.098432540893555, "global_step": 60729, "epoch": 731} {"train_loss": -20.7810001373291, "global_step": 60730, "epoch": 731} {"train_loss": -20.401891708374023, "global_step": 60731, "epoch": 731} {"train_loss": -20.668996810913086, "global_step": 60732, "epoch": 731} {"train_loss": -20.574186325073242, "global_step": 60733, "epoch": 731} {"train_loss": -20.594213485717773, "global_step": 60734, "epoch": 731} {"train_loss": -19.998353958129883, "global_step": 60735, "epoch": 731} {"train_loss": -20.679676055908203, "global_step": 60736, "epoch": 731} {"train_loss": -20.813644409179688, "global_step": 60737, "epoch": 731} {"train_loss": -20.41237449645996, "global_step": 60738, "epoch": 731} {"train_loss": -20.598556518554688, "global_step": 60739, "epoch": 731} {"train_loss": -20.401172637939453, "global_step": 60740, "epoch": 731} {"train_loss": -20.652379989624023, "global_step": 60741, "epoch": 731} {"train_loss": -20.000110626220703, "global_step": 60742, "epoch": 731} {"train_loss": -20.438230514526367, "global_step": 60743, "epoch": 731} {"train_loss": -20.578027725219727, "global_step": 60744, "epoch": 731} {"train_loss": -20.551950454711914, "global_step": 60745, "epoch": 731} {"train_loss": -20.45892333984375, "global_step": 60746, "epoch": 731} {"train_loss": -20.294208526611328, "global_step": 60747, "epoch": 731} {"train_loss": -20.317113876342773, "global_step": 60748, "epoch": 731} {"train_loss": -20.712841033935547, "global_step": 60749, "epoch": 731} {"train_loss": -20.268638610839844, "global_step": 60750, "epoch": 731} {"train_loss": -20.444915771484375, "global_step": 60751, "epoch": 731} {"train_loss": -20.865121841430664, "global_step": 60752, "epoch": 731} {"train_loss": -20.776569366455078, "global_step": 60753, "epoch": 731} {"train_loss": -20.452619552612305, "global_step": 60754, "epoch": 731} {"train_loss": -20.443061231130578, "global_step": 60755, "epoch": 731, "val_loss": 6021735.5} {"train_loss": -18.770769119262695, "global_step": 60756, "epoch": 732} {"train_loss": -19.906545639038086, "global_step": 60757, "epoch": 732} {"train_loss": -19.625516891479492, "global_step": 60758, "epoch": 732} {"train_loss": -19.94386100769043, "global_step": 60759, "epoch": 732} {"train_loss": -19.70265769958496, "global_step": 60760, "epoch": 732} {"train_loss": -20.0371150970459, "global_step": 60761, "epoch": 732} {"train_loss": -20.074726104736328, "global_step": 60762, "epoch": 732} {"train_loss": -19.997472763061523, "global_step": 60763, "epoch": 732} {"train_loss": -20.133609771728516, "global_step": 60764, "epoch": 732} {"train_loss": -19.40998649597168, "global_step": 60765, "epoch": 732} {"train_loss": -20.409605026245117, "global_step": 60766, "epoch": 732} {"train_loss": -19.770435333251953, "global_step": 60767, "epoch": 732} {"train_loss": -19.957929611206055, "global_step": 60768, "epoch": 732} {"train_loss": -19.994037628173828, "global_step": 60769, "epoch": 732} {"train_loss": -19.776121139526367, "global_step": 60770, "epoch": 732} {"train_loss": -20.031692504882812, "global_step": 60771, "epoch": 732} {"train_loss": -20.012929916381836, "global_step": 60772, "epoch": 732} {"train_loss": -20.234668731689453, "global_step": 60773, "epoch": 732} {"train_loss": -20.22585105895996, "global_step": 60774, "epoch": 732} {"train_loss": -20.311059951782227, "global_step": 60775, "epoch": 732} {"train_loss": -20.251983642578125, "global_step": 60776, "epoch": 732} {"train_loss": -19.987634658813477, "global_step": 60777, "epoch": 732} {"train_loss": -19.6455135345459, "global_step": 60778, "epoch": 732} {"train_loss": -20.645313262939453, "global_step": 60779, "epoch": 732} {"train_loss": -20.31330108642578, "global_step": 60780, "epoch": 732} {"train_loss": -19.92244529724121, "global_step": 60781, "epoch": 732} {"train_loss": -20.2100887298584, "global_step": 60782, "epoch": 732} {"train_loss": -20.313037872314453, "global_step": 60783, "epoch": 732} {"train_loss": -20.633222579956055, "global_step": 60784, "epoch": 732} {"train_loss": -20.38582992553711, "global_step": 60785, "epoch": 732} {"train_loss": -20.089096069335938, "global_step": 60786, "epoch": 732} {"train_loss": -20.052371978759766, "global_step": 60787, "epoch": 732} {"train_loss": -20.407676696777344, "global_step": 60788, "epoch": 732} {"train_loss": -20.386220932006836, "global_step": 60789, "epoch": 732} {"train_loss": -20.56736183166504, "global_step": 60790, "epoch": 732} {"train_loss": -20.296142578125, "global_step": 60791, "epoch": 732} {"train_loss": -20.400121688842773, "global_step": 60792, "epoch": 732} {"train_loss": -20.399816513061523, "global_step": 60793, "epoch": 732} {"train_loss": -20.405179977416992, "global_step": 60794, "epoch": 732} {"train_loss": -20.034975051879883, "global_step": 60795, "epoch": 732} {"train_loss": -20.80638885498047, "global_step": 60796, "epoch": 732} {"train_loss": -20.814420700073242, "global_step": 60797, "epoch": 732} {"train_loss": -20.72269630432129, "global_step": 60798, "epoch": 732} {"train_loss": -20.29596519470215, "global_step": 60799, "epoch": 732} {"train_loss": -20.662582397460938, "global_step": 60800, "epoch": 732} {"train_loss": -20.48077964782715, "global_step": 60801, "epoch": 732} {"train_loss": -20.662145614624023, "global_step": 60802, "epoch": 732} {"train_loss": -20.716201782226562, "global_step": 60803, "epoch": 732} {"train_loss": -20.292875289916992, "global_step": 60804, "epoch": 732} {"train_loss": -20.367795944213867, "global_step": 60805, "epoch": 732} {"train_loss": -20.579326629638672, "global_step": 60806, "epoch": 732} {"train_loss": -20.50434684753418, "global_step": 60807, "epoch": 732} {"train_loss": -20.570951461791992, "global_step": 60808, "epoch": 732} {"train_loss": -20.59071159362793, "global_step": 60809, "epoch": 732} {"train_loss": -20.674116134643555, "global_step": 60810, "epoch": 732} {"train_loss": -20.134057998657227, "global_step": 60811, "epoch": 732} {"train_loss": -20.206878662109375, "global_step": 60812, "epoch": 732} {"train_loss": -20.374282836914062, "global_step": 60813, "epoch": 732} {"train_loss": -20.57406234741211, "global_step": 60814, "epoch": 732} {"train_loss": -20.3671932220459, "global_step": 60815, "epoch": 732} {"train_loss": -20.740886688232422, "global_step": 60816, "epoch": 732} {"train_loss": -20.438648223876953, "global_step": 60817, "epoch": 732} {"train_loss": -20.587465286254883, "global_step": 60818, "epoch": 732} {"train_loss": -20.73930549621582, "global_step": 60819, "epoch": 732} {"train_loss": -20.47870445251465, "global_step": 60820, "epoch": 732} {"train_loss": -20.451215744018555, "global_step": 60821, "epoch": 732} {"train_loss": -20.799009323120117, "global_step": 60822, "epoch": 732} {"train_loss": -20.105247497558594, "global_step": 60823, "epoch": 732} {"train_loss": -20.30765151977539, "global_step": 60824, "epoch": 732} {"train_loss": -20.401779174804688, "global_step": 60825, "epoch": 732} {"train_loss": -20.537874221801758, "global_step": 60826, "epoch": 732} {"train_loss": -20.464853286743164, "global_step": 60827, "epoch": 732} {"train_loss": -20.623117446899414, "global_step": 60828, "epoch": 732} {"train_loss": -20.40007972717285, "global_step": 60829, "epoch": 732} {"train_loss": -20.44923973083496, "global_step": 60830, "epoch": 732} {"train_loss": -20.543630599975586, "global_step": 60831, "epoch": 732} {"train_loss": -20.588790893554688, "global_step": 60832, "epoch": 732} {"train_loss": -20.070667266845703, "global_step": 60833, "epoch": 732} {"train_loss": -20.223772048950195, "global_step": 60834, "epoch": 732} {"train_loss": -20.8094482421875, "global_step": 60835, "epoch": 732} {"train_loss": -20.08609962463379, "global_step": 60836, "epoch": 732} {"train_loss": -20.20631217956543, "global_step": 60837, "epoch": 732} {"train_loss": -20.296291741980127, "global_step": 60838, "epoch": 732, "val_loss": 6052217.5} {"train_loss": -19.838443756103516, "global_step": 60839, "epoch": 733} {"train_loss": -20.34430694580078, "global_step": 60840, "epoch": 733} {"train_loss": -20.045013427734375, "global_step": 60841, "epoch": 733} {"train_loss": -20.41181755065918, "global_step": 60842, "epoch": 733} {"train_loss": -20.287551879882812, "global_step": 60843, "epoch": 733} {"train_loss": -20.26667594909668, "global_step": 60844, "epoch": 733} {"train_loss": -20.249868392944336, "global_step": 60845, "epoch": 733} {"train_loss": -20.409549713134766, "global_step": 60846, "epoch": 733} {"train_loss": -20.605819702148438, "global_step": 60847, "epoch": 733} {"train_loss": -20.196001052856445, "global_step": 60848, "epoch": 733} {"train_loss": -20.448575973510742, "global_step": 60849, "epoch": 733} {"train_loss": -20.365217208862305, "global_step": 60850, "epoch": 733} {"train_loss": -20.487773895263672, "global_step": 60851, "epoch": 733} {"train_loss": -20.673269271850586, "global_step": 60852, "epoch": 733} {"train_loss": -20.106651306152344, "global_step": 60853, "epoch": 733} {"train_loss": -20.605161666870117, "global_step": 60854, "epoch": 733} {"train_loss": -20.504837036132812, "global_step": 60855, "epoch": 733} {"train_loss": -20.56914710998535, "global_step": 60856, "epoch": 733} {"train_loss": -20.387094497680664, "global_step": 60857, "epoch": 733} {"train_loss": -20.65478515625, "global_step": 60858, "epoch": 733} {"train_loss": -20.634328842163086, "global_step": 60859, "epoch": 733} {"train_loss": -20.512971878051758, "global_step": 60860, "epoch": 733} {"train_loss": -20.225296020507812, "global_step": 60861, "epoch": 733} {"train_loss": -20.188291549682617, "global_step": 60862, "epoch": 733} {"train_loss": -20.198118209838867, "global_step": 60863, "epoch": 733} {"train_loss": -20.506744384765625, "global_step": 60864, "epoch": 733} {"train_loss": -20.347620010375977, "global_step": 60865, "epoch": 733} {"train_loss": -20.606481552124023, "global_step": 60866, "epoch": 733} {"train_loss": -20.534631729125977, "global_step": 60867, "epoch": 733} {"train_loss": -20.77596092224121, "global_step": 60868, "epoch": 733} {"train_loss": -20.45624351501465, "global_step": 60869, "epoch": 733} {"train_loss": -20.26944923400879, "global_step": 60870, "epoch": 733} {"train_loss": -20.357358932495117, "global_step": 60871, "epoch": 733} {"train_loss": -20.236038208007812, "global_step": 60872, "epoch": 733} {"train_loss": -20.439725875854492, "global_step": 60873, "epoch": 733} {"train_loss": -20.15584373474121, "global_step": 60874, "epoch": 733} {"train_loss": -20.583127975463867, "global_step": 60875, "epoch": 733} {"train_loss": -20.607378005981445, "global_step": 60876, "epoch": 733} {"train_loss": -20.275049209594727, "global_step": 60877, "epoch": 733} {"train_loss": -20.399673461914062, "global_step": 60878, "epoch": 733} {"train_loss": -20.456701278686523, "global_step": 60879, "epoch": 733} {"train_loss": -20.24167823791504, "global_step": 60880, "epoch": 733} {"train_loss": -20.225065231323242, "global_step": 60881, "epoch": 733} {"train_loss": -20.70290184020996, "global_step": 60882, "epoch": 733} {"train_loss": -20.6434383392334, "global_step": 60883, "epoch": 733} {"train_loss": -19.91058921813965, "global_step": 60884, "epoch": 733} {"train_loss": -20.9685115814209, "global_step": 60885, "epoch": 733} {"train_loss": -20.4261417388916, "global_step": 60886, "epoch": 733} {"train_loss": -20.2833309173584, "global_step": 60887, "epoch": 733} {"train_loss": -20.152212142944336, "global_step": 60888, "epoch": 733} {"train_loss": -20.701231002807617, "global_step": 60889, "epoch": 733} {"train_loss": -20.26560401916504, "global_step": 60890, "epoch": 733} {"train_loss": -20.464618682861328, "global_step": 60891, "epoch": 733} {"train_loss": -20.581390380859375, "global_step": 60892, "epoch": 733} {"train_loss": -20.3393611907959, "global_step": 60893, "epoch": 733} {"train_loss": -20.219741821289062, "global_step": 60894, "epoch": 733} {"train_loss": -20.70878028869629, "global_step": 60895, "epoch": 733} {"train_loss": -20.68160629272461, "global_step": 60896, "epoch": 733} {"train_loss": -20.32225799560547, "global_step": 60897, "epoch": 733} {"train_loss": -20.182939529418945, "global_step": 60898, "epoch": 733} {"train_loss": -20.49687957763672, "global_step": 60899, "epoch": 733} {"train_loss": -20.822111129760742, "global_step": 60900, "epoch": 733} {"train_loss": -20.34101676940918, "global_step": 60901, "epoch": 733} {"train_loss": -20.574617385864258, "global_step": 60902, "epoch": 733} {"train_loss": -20.3801326751709, "global_step": 60903, "epoch": 733} {"train_loss": -20.347043991088867, "global_step": 60904, "epoch": 733} {"train_loss": -20.640235900878906, "global_step": 60905, "epoch": 733} {"train_loss": -20.104820251464844, "global_step": 60906, "epoch": 733} {"train_loss": -20.3067684173584, "global_step": 60907, "epoch": 733} {"train_loss": -20.278106689453125, "global_step": 60908, "epoch": 733} {"train_loss": -20.28126335144043, "global_step": 60909, "epoch": 733} {"train_loss": -20.402013778686523, "global_step": 60910, "epoch": 733} {"train_loss": -20.554365158081055, "global_step": 60911, "epoch": 733} {"train_loss": -20.803329467773438, "global_step": 60912, "epoch": 733} {"train_loss": -20.420324325561523, "global_step": 60913, "epoch": 733} {"train_loss": -20.409286499023438, "global_step": 60914, "epoch": 733} {"train_loss": -20.59195899963379, "global_step": 60915, "epoch": 733} {"train_loss": -20.241483688354492, "global_step": 60916, "epoch": 733} {"train_loss": -20.549100875854492, "global_step": 60917, "epoch": 733} {"train_loss": -20.747995376586914, "global_step": 60918, "epoch": 733} {"train_loss": -20.417739868164062, "global_step": 60919, "epoch": 733} {"train_loss": -20.550722122192383, "global_step": 60920, "epoch": 733} {"train_loss": -20.426044050469457, "global_step": 60921, "epoch": 733, "val_loss": 6004169.0} {"train_loss": -20.343244552612305, "global_step": 60922, "epoch": 734} {"train_loss": -20.375350952148438, "global_step": 60923, "epoch": 734} {"train_loss": -20.6497859954834, "global_step": 60924, "epoch": 734} {"train_loss": -20.151554107666016, "global_step": 60925, "epoch": 734} {"train_loss": -19.868438720703125, "global_step": 60926, "epoch": 734} {"train_loss": -20.134321212768555, "global_step": 60927, "epoch": 734} {"train_loss": -19.85724449157715, "global_step": 60928, "epoch": 734} {"train_loss": -20.401273727416992, "global_step": 60929, "epoch": 734} {"train_loss": -20.392141342163086, "global_step": 60930, "epoch": 734} {"train_loss": -20.40573501586914, "global_step": 60931, "epoch": 734} {"train_loss": -20.439321517944336, "global_step": 60932, "epoch": 734} {"train_loss": -20.196828842163086, "global_step": 60933, "epoch": 734} {"train_loss": -20.335235595703125, "global_step": 60934, "epoch": 734} {"train_loss": -20.489059448242188, "global_step": 60935, "epoch": 734} {"train_loss": -20.16902732849121, "global_step": 60936, "epoch": 734} {"train_loss": -20.470279693603516, "global_step": 60937, "epoch": 734} {"train_loss": -20.1754093170166, "global_step": 60938, "epoch": 734} {"train_loss": -20.160551071166992, "global_step": 60939, "epoch": 734} {"train_loss": -20.619831085205078, "global_step": 60940, "epoch": 734} {"train_loss": -20.33705711364746, "global_step": 60941, "epoch": 734} {"train_loss": -20.566022872924805, "global_step": 60942, "epoch": 734} {"train_loss": -20.75892448425293, "global_step": 60943, "epoch": 734} {"train_loss": -20.179725646972656, "global_step": 60944, "epoch": 734} {"train_loss": -20.171918869018555, "global_step": 60945, "epoch": 734} {"train_loss": -20.521398544311523, "global_step": 60946, "epoch": 734} {"train_loss": -20.16946792602539, "global_step": 60947, "epoch": 734} {"train_loss": -20.60765838623047, "global_step": 60948, "epoch": 734} {"train_loss": -20.398130416870117, "global_step": 60949, "epoch": 734} {"train_loss": -20.44655418395996, "global_step": 60950, "epoch": 734} {"train_loss": -20.131973266601562, "global_step": 60951, "epoch": 734} {"train_loss": -20.18659782409668, "global_step": 60952, "epoch": 734} {"train_loss": -20.809152603149414, "global_step": 60953, "epoch": 734} {"train_loss": -20.58913803100586, "global_step": 60954, "epoch": 734} {"train_loss": -20.404539108276367, "global_step": 60955, "epoch": 734} {"train_loss": -20.131500244140625, "global_step": 60956, "epoch": 734} {"train_loss": -20.34151268005371, "global_step": 60957, "epoch": 734} {"train_loss": -19.9998722076416, "global_step": 60958, "epoch": 734} {"train_loss": -20.334383010864258, "global_step": 60959, "epoch": 734} {"train_loss": -20.31730079650879, "global_step": 60960, "epoch": 734} {"train_loss": -20.42438316345215, "global_step": 60961, "epoch": 734} {"train_loss": -20.376358032226562, "global_step": 60962, "epoch": 734} {"train_loss": -20.30159568786621, "global_step": 60963, "epoch": 734} {"train_loss": -20.351484298706055, "global_step": 60964, "epoch": 734} {"train_loss": -20.73259735107422, "global_step": 60965, "epoch": 734} {"train_loss": -20.628385543823242, "global_step": 60966, "epoch": 734} {"train_loss": -20.344911575317383, "global_step": 60967, "epoch": 734} {"train_loss": -20.237295150756836, "global_step": 60968, "epoch": 734} {"train_loss": -20.154277801513672, "global_step": 60969, "epoch": 734} {"train_loss": -20.325401306152344, "global_step": 60970, "epoch": 734} {"train_loss": -20.498563766479492, "global_step": 60971, "epoch": 734} {"train_loss": -20.649831771850586, "global_step": 60972, "epoch": 734} {"train_loss": -19.95553970336914, "global_step": 60973, "epoch": 734} {"train_loss": -20.650310516357422, "global_step": 60974, "epoch": 734} {"train_loss": -20.570236206054688, "global_step": 60975, "epoch": 734} {"train_loss": -20.70159339904785, "global_step": 60976, "epoch": 734} {"train_loss": -20.5898494720459, "global_step": 60977, "epoch": 734} {"train_loss": -20.252939224243164, "global_step": 60978, "epoch": 734} {"train_loss": -20.54867935180664, "global_step": 60979, "epoch": 734} {"train_loss": -20.5856990814209, "global_step": 60980, "epoch": 734} {"train_loss": -20.63266944885254, "global_step": 60981, "epoch": 734} {"train_loss": -20.57855796813965, "global_step": 60982, "epoch": 734} {"train_loss": -20.104475021362305, "global_step": 60983, "epoch": 734} {"train_loss": -20.61392593383789, "global_step": 60984, "epoch": 734} {"train_loss": -20.40813636779785, "global_step": 60985, "epoch": 734} {"train_loss": -20.430471420288086, "global_step": 60986, "epoch": 734} {"train_loss": -20.48323631286621, "global_step": 60987, "epoch": 734} {"train_loss": -20.578170776367188, "global_step": 60988, "epoch": 734} {"train_loss": -20.588293075561523, "global_step": 60989, "epoch": 734} {"train_loss": -20.447154998779297, "global_step": 60990, "epoch": 734} {"train_loss": -20.404476165771484, "global_step": 60991, "epoch": 734} {"train_loss": -20.315847396850586, "global_step": 60992, "epoch": 734} {"train_loss": -20.462072372436523, "global_step": 60993, "epoch": 734} {"train_loss": -20.45697021484375, "global_step": 60994, "epoch": 734} {"train_loss": -20.650033950805664, "global_step": 60995, "epoch": 734} {"train_loss": -20.363786697387695, "global_step": 60996, "epoch": 734} {"train_loss": -20.110158920288086, "global_step": 60997, "epoch": 734} {"train_loss": -20.493839263916016, "global_step": 60998, "epoch": 734} {"train_loss": -20.477615356445312, "global_step": 60999, "epoch": 734} {"train_loss": -20.4238224029541, "global_step": 61000, "epoch": 734} {"train_loss": -20.170757293701172, "global_step": 61001, "epoch": 734} {"train_loss": -20.50714683532715, "global_step": 61002, "epoch": 734} {"train_loss": -20.656240463256836, "global_step": 61003, "epoch": 734} {"train_loss": -20.386846634278815, "global_step": 61004, "epoch": 734, "val_loss": 5875291.5} {"train_loss": -20.083486557006836, "global_step": 61005, "epoch": 735} {"train_loss": -20.415441513061523, "global_step": 61006, "epoch": 735} {"train_loss": -20.070247650146484, "global_step": 61007, "epoch": 735} {"train_loss": -20.386938095092773, "global_step": 61008, "epoch": 735} {"train_loss": -20.067481994628906, "global_step": 61009, "epoch": 735} {"train_loss": -20.207433700561523, "global_step": 61010, "epoch": 735} {"train_loss": -20.25922203063965, "global_step": 61011, "epoch": 735} {"train_loss": -20.25518798828125, "global_step": 61012, "epoch": 735} {"train_loss": -20.01536750793457, "global_step": 61013, "epoch": 735} {"train_loss": -20.42343521118164, "global_step": 61014, "epoch": 735} {"train_loss": -20.429147720336914, "global_step": 61015, "epoch": 735} {"train_loss": -20.4284725189209, "global_step": 61016, "epoch": 735} {"train_loss": -20.53346061706543, "global_step": 61017, "epoch": 735} {"train_loss": -20.452890396118164, "global_step": 61018, "epoch": 735} {"train_loss": -19.79034423828125, "global_step": 61019, "epoch": 735} {"train_loss": -20.34853172302246, "global_step": 61020, "epoch": 735} {"train_loss": -19.985563278198242, "global_step": 61021, "epoch": 735} {"train_loss": -20.413711547851562, "global_step": 61022, "epoch": 735} {"train_loss": -20.323589324951172, "global_step": 61023, "epoch": 735} {"train_loss": -20.152631759643555, "global_step": 61024, "epoch": 735} {"train_loss": -20.490158081054688, "global_step": 61025, "epoch": 735} {"train_loss": -20.421804428100586, "global_step": 61026, "epoch": 735} {"train_loss": -20.342432022094727, "global_step": 61027, "epoch": 735} {"train_loss": -20.466922760009766, "global_step": 61028, "epoch": 735} {"train_loss": -20.543058395385742, "global_step": 61029, "epoch": 735} {"train_loss": -20.363845825195312, "global_step": 61030, "epoch": 735} {"train_loss": -20.372812271118164, "global_step": 61031, "epoch": 735} {"train_loss": -20.186599731445312, "global_step": 61032, "epoch": 735} {"train_loss": -20.642751693725586, "global_step": 61033, "epoch": 735} {"train_loss": -20.442651748657227, "global_step": 61034, "epoch": 735} {"train_loss": -20.45222282409668, "global_step": 61035, "epoch": 735} {"train_loss": -20.393205642700195, "global_step": 61036, "epoch": 735} {"train_loss": -20.49635124206543, "global_step": 61037, "epoch": 735} {"train_loss": -20.58949089050293, "global_step": 61038, "epoch": 735} {"train_loss": -20.177839279174805, "global_step": 61039, "epoch": 735} {"train_loss": -20.275243759155273, "global_step": 61040, "epoch": 735} {"train_loss": -20.27621078491211, "global_step": 61041, "epoch": 735} {"train_loss": -20.344709396362305, "global_step": 61042, "epoch": 735} {"train_loss": -20.638845443725586, "global_step": 61043, "epoch": 735} {"train_loss": -20.218961715698242, "global_step": 61044, "epoch": 735} {"train_loss": -20.8543758392334, "global_step": 61045, "epoch": 735} {"train_loss": -20.47587013244629, "global_step": 61046, "epoch": 735} {"train_loss": -20.953481674194336, "global_step": 61047, "epoch": 735} {"train_loss": -20.871530532836914, "global_step": 61048, "epoch": 735} {"train_loss": -20.591106414794922, "global_step": 61049, "epoch": 735} {"train_loss": -20.272113800048828, "global_step": 61050, "epoch": 735} {"train_loss": -20.16168785095215, "global_step": 61051, "epoch": 735} {"train_loss": -20.55961799621582, "global_step": 61052, "epoch": 735} {"train_loss": -20.589323043823242, "global_step": 61053, "epoch": 735} {"train_loss": -20.510461807250977, "global_step": 61054, "epoch": 735} {"train_loss": -20.93549919128418, "global_step": 61055, "epoch": 735} {"train_loss": -20.85791015625, "global_step": 61056, "epoch": 735} {"train_loss": -20.586389541625977, "global_step": 61057, "epoch": 735} {"train_loss": -20.48809051513672, "global_step": 61058, "epoch": 735} {"train_loss": -20.548564910888672, "global_step": 61059, "epoch": 735} {"train_loss": -20.199071884155273, "global_step": 61060, "epoch": 735} {"train_loss": -20.600521087646484, "global_step": 61061, "epoch": 735} {"train_loss": -20.6910457611084, "global_step": 61062, "epoch": 735} {"train_loss": -20.5399169921875, "global_step": 61063, "epoch": 735} {"train_loss": -20.38702392578125, "global_step": 61064, "epoch": 735} {"train_loss": -20.528913497924805, "global_step": 61065, "epoch": 735} {"train_loss": -20.399580001831055, "global_step": 61066, "epoch": 735} {"train_loss": -20.184207916259766, "global_step": 61067, "epoch": 735} {"train_loss": -20.612773895263672, "global_step": 61068, "epoch": 735} {"train_loss": -20.454063415527344, "global_step": 61069, "epoch": 735} {"train_loss": -20.55714988708496, "global_step": 61070, "epoch": 735} {"train_loss": -20.244766235351562, "global_step": 61071, "epoch": 735} {"train_loss": -20.276718139648438, "global_step": 61072, "epoch": 735} {"train_loss": -20.506834030151367, "global_step": 61073, "epoch": 735} {"train_loss": -20.297222137451172, "global_step": 61074, "epoch": 735} {"train_loss": -20.74757957458496, "global_step": 61075, "epoch": 735} {"train_loss": -20.14728355407715, "global_step": 61076, "epoch": 735} {"train_loss": -20.43906021118164, "global_step": 61077, "epoch": 735} {"train_loss": -20.35577964782715, "global_step": 61078, "epoch": 735} {"train_loss": -20.51495933532715, "global_step": 61079, "epoch": 735} {"train_loss": -20.281850814819336, "global_step": 61080, "epoch": 735} {"train_loss": -20.030485153198242, "global_step": 61081, "epoch": 735} {"train_loss": -20.39554214477539, "global_step": 61082, "epoch": 735} {"train_loss": -20.430572509765625, "global_step": 61083, "epoch": 735} {"train_loss": -20.327619552612305, "global_step": 61084, "epoch": 735} {"train_loss": -20.649707794189453, "global_step": 61085, "epoch": 735} {"train_loss": -20.141061782836914, "global_step": 61086, "epoch": 735} {"train_loss": -20.4019202266831, "global_step": 61087, "epoch": 735, "val_loss": 6051885.5} {"train_loss": -19.253494262695312, "global_step": 61088, "epoch": 736} {"train_loss": -20.02837371826172, "global_step": 61089, "epoch": 736} {"train_loss": -20.10059928894043, "global_step": 61090, "epoch": 736} {"train_loss": -20.393545150756836, "global_step": 61091, "epoch": 736} {"train_loss": -20.313913345336914, "global_step": 61092, "epoch": 736} {"train_loss": -20.273916244506836, "global_step": 61093, "epoch": 736} {"train_loss": -20.328298568725586, "global_step": 61094, "epoch": 736} {"train_loss": -20.29201316833496, "global_step": 61095, "epoch": 736} {"train_loss": -20.292783737182617, "global_step": 61096, "epoch": 736} {"train_loss": -20.0632381439209, "global_step": 61097, "epoch": 736} {"train_loss": -19.92990493774414, "global_step": 61098, "epoch": 736} {"train_loss": -20.449865341186523, "global_step": 61099, "epoch": 736} {"train_loss": -20.11490249633789, "global_step": 61100, "epoch": 736} {"train_loss": -20.079504013061523, "global_step": 61101, "epoch": 736} {"train_loss": -20.423908233642578, "global_step": 61102, "epoch": 736} {"train_loss": -20.331645965576172, "global_step": 61103, "epoch": 736} {"train_loss": -20.45197868347168, "global_step": 61104, "epoch": 736} {"train_loss": -20.072113037109375, "global_step": 61105, "epoch": 736} {"train_loss": -20.229816436767578, "global_step": 61106, "epoch": 736} {"train_loss": -20.526065826416016, "global_step": 61107, "epoch": 736} {"train_loss": -20.342164993286133, "global_step": 61108, "epoch": 736} {"train_loss": -20.05843162536621, "global_step": 61109, "epoch": 736} {"train_loss": -20.30883026123047, "global_step": 61110, "epoch": 736} {"train_loss": -20.14609718322754, "global_step": 61111, "epoch": 736} {"train_loss": -19.99918556213379, "global_step": 61112, "epoch": 736} {"train_loss": -19.91218376159668, "global_step": 61113, "epoch": 736} {"train_loss": -20.679094314575195, "global_step": 61114, "epoch": 736} {"train_loss": -20.492856979370117, "global_step": 61115, "epoch": 736} {"train_loss": -20.417409896850586, "global_step": 61116, "epoch": 736} {"train_loss": -20.44891929626465, "global_step": 61117, "epoch": 736} {"train_loss": -20.391366958618164, "global_step": 61118, "epoch": 736} {"train_loss": -20.647815704345703, "global_step": 61119, "epoch": 736} {"train_loss": -20.347028732299805, "global_step": 61120, "epoch": 736} {"train_loss": -20.55689239501953, "global_step": 61121, "epoch": 736} {"train_loss": -20.29157257080078, "global_step": 61122, "epoch": 736} {"train_loss": -20.30313491821289, "global_step": 61123, "epoch": 736} {"train_loss": -20.180540084838867, "global_step": 61124, "epoch": 736} {"train_loss": -20.957685470581055, "global_step": 61125, "epoch": 736} {"train_loss": -20.408720016479492, "global_step": 61126, "epoch": 736} {"train_loss": -20.458723068237305, "global_step": 61127, "epoch": 736} {"train_loss": -20.282930374145508, "global_step": 61128, "epoch": 736} {"train_loss": -20.558496475219727, "global_step": 61129, "epoch": 736} {"train_loss": -20.966859817504883, "global_step": 61130, "epoch": 736} {"train_loss": -20.1678466796875, "global_step": 61131, "epoch": 736} {"train_loss": -20.5780086517334, "global_step": 61132, "epoch": 736} {"train_loss": -20.491973876953125, "global_step": 61133, "epoch": 736} {"train_loss": -20.056718826293945, "global_step": 61134, "epoch": 736} {"train_loss": -20.12543296813965, "global_step": 61135, "epoch": 736} {"train_loss": -20.329084396362305, "global_step": 61136, "epoch": 736} {"train_loss": -20.717741012573242, "global_step": 61137, "epoch": 736} {"train_loss": -20.433399200439453, "global_step": 61138, "epoch": 736} {"train_loss": -20.6898250579834, "global_step": 61139, "epoch": 736} {"train_loss": -20.3121337890625, "global_step": 61140, "epoch": 736} {"train_loss": -20.5528621673584, "global_step": 61141, "epoch": 736} {"train_loss": -20.12799644470215, "global_step": 61142, "epoch": 736} {"train_loss": -20.3729305267334, "global_step": 61143, "epoch": 736} {"train_loss": -20.071563720703125, "global_step": 61144, "epoch": 736} {"train_loss": -20.42615509033203, "global_step": 61145, "epoch": 736} {"train_loss": -20.62959861755371, "global_step": 61146, "epoch": 736} {"train_loss": -20.775379180908203, "global_step": 61147, "epoch": 736} {"train_loss": -20.8552188873291, "global_step": 61148, "epoch": 736} {"train_loss": -20.205427169799805, "global_step": 61149, "epoch": 736} {"train_loss": -20.897092819213867, "global_step": 61150, "epoch": 736} {"train_loss": -20.710397720336914, "global_step": 61151, "epoch": 736} {"train_loss": -20.685588836669922, "global_step": 61152, "epoch": 736} {"train_loss": -20.22859764099121, "global_step": 61153, "epoch": 736} {"train_loss": -20.5692195892334, "global_step": 61154, "epoch": 736} {"train_loss": -20.484561920166016, "global_step": 61155, "epoch": 736} {"train_loss": -20.451440811157227, "global_step": 61156, "epoch": 736} {"train_loss": -20.862207412719727, "global_step": 61157, "epoch": 736} {"train_loss": -20.200042724609375, "global_step": 61158, "epoch": 736} {"train_loss": -20.58246421813965, "global_step": 61159, "epoch": 736} {"train_loss": -20.697864532470703, "global_step": 61160, "epoch": 736} {"train_loss": -20.019804000854492, "global_step": 61161, "epoch": 736} {"train_loss": -20.231359481811523, "global_step": 61162, "epoch": 736} {"train_loss": -20.478515625, "global_step": 61163, "epoch": 736} {"train_loss": -20.547561645507812, "global_step": 61164, "epoch": 736} {"train_loss": -20.7299861907959, "global_step": 61165, "epoch": 736} {"train_loss": -20.0902156829834, "global_step": 61166, "epoch": 736} {"train_loss": -20.397857666015625, "global_step": 61167, "epoch": 736} {"train_loss": -20.580018997192383, "global_step": 61168, "epoch": 736} {"train_loss": -20.55291175842285, "global_step": 61169, "epoch": 736} {"train_loss": -20.371813900499458, "global_step": 61170, "epoch": 736, "val_loss": 6033314.5} {"train_loss": -19.97646141052246, "global_step": 61171, "epoch": 737} {"train_loss": -20.6545352935791, "global_step": 61172, "epoch": 737} {"train_loss": -20.198806762695312, "global_step": 61173, "epoch": 737} {"train_loss": -20.440027236938477, "global_step": 61174, "epoch": 737} {"train_loss": -20.4333553314209, "global_step": 61175, "epoch": 737} {"train_loss": -20.24704360961914, "global_step": 61176, "epoch": 737} {"train_loss": -20.345670700073242, "global_step": 61177, "epoch": 737} {"train_loss": -20.16171646118164, "global_step": 61178, "epoch": 737} {"train_loss": -20.12943458557129, "global_step": 61179, "epoch": 737} {"train_loss": -20.474897384643555, "global_step": 61180, "epoch": 737} {"train_loss": -19.9890193939209, "global_step": 61181, "epoch": 737} {"train_loss": -20.090763092041016, "global_step": 61182, "epoch": 737} {"train_loss": -20.534378051757812, "global_step": 61183, "epoch": 737} {"train_loss": -20.300588607788086, "global_step": 61184, "epoch": 737} {"train_loss": -20.39501953125, "global_step": 61185, "epoch": 737} {"train_loss": -20.336450576782227, "global_step": 61186, "epoch": 737} {"train_loss": -20.584915161132812, "global_step": 61187, "epoch": 737} {"train_loss": -20.53316307067871, "global_step": 61188, "epoch": 737} {"train_loss": -20.130468368530273, "global_step": 61189, "epoch": 737} {"train_loss": -20.44650650024414, "global_step": 61190, "epoch": 737} {"train_loss": -20.55867576599121, "global_step": 61191, "epoch": 737} {"train_loss": -19.997417449951172, "global_step": 61192, "epoch": 737} {"train_loss": -20.39552116394043, "global_step": 61193, "epoch": 737} {"train_loss": -20.730863571166992, "global_step": 61194, "epoch": 737} {"train_loss": -20.377744674682617, "global_step": 61195, "epoch": 737} {"train_loss": -20.498693466186523, "global_step": 61196, "epoch": 737} {"train_loss": -20.333209991455078, "global_step": 61197, "epoch": 737} {"train_loss": -20.38633918762207, "global_step": 61198, "epoch": 737} {"train_loss": -19.87312889099121, "global_step": 61199, "epoch": 737} {"train_loss": -19.872756958007812, "global_step": 61200, "epoch": 737} {"train_loss": -20.479448318481445, "global_step": 61201, "epoch": 737} {"train_loss": -20.297719955444336, "global_step": 61202, "epoch": 737} {"train_loss": -20.23171615600586, "global_step": 61203, "epoch": 737} {"train_loss": -20.53093147277832, "global_step": 61204, "epoch": 737} {"train_loss": -20.422069549560547, "global_step": 61205, "epoch": 737} {"train_loss": -20.530534744262695, "global_step": 61206, "epoch": 737} {"train_loss": -20.344377517700195, "global_step": 61207, "epoch": 737} {"train_loss": -20.63404655456543, "global_step": 61208, "epoch": 737} {"train_loss": -20.562856674194336, "global_step": 61209, "epoch": 737} {"train_loss": -20.558130264282227, "global_step": 61210, "epoch": 737} {"train_loss": -20.36911392211914, "global_step": 61211, "epoch": 737} {"train_loss": -20.073347091674805, "global_step": 61212, "epoch": 737} {"train_loss": -20.48590660095215, "global_step": 61213, "epoch": 737} {"train_loss": -21.033496856689453, "global_step": 61214, "epoch": 737} {"train_loss": -20.343887329101562, "global_step": 61215, "epoch": 737} {"train_loss": -20.53990936279297, "global_step": 61216, "epoch": 737} {"train_loss": -20.441818237304688, "global_step": 61217, "epoch": 737} {"train_loss": -20.65673065185547, "global_step": 61218, "epoch": 737} {"train_loss": -20.504268646240234, "global_step": 61219, "epoch": 737} {"train_loss": -20.32596778869629, "global_step": 61220, "epoch": 737} {"train_loss": -20.417448043823242, "global_step": 61221, "epoch": 737} {"train_loss": -20.68733787536621, "global_step": 61222, "epoch": 737} {"train_loss": -20.413738250732422, "global_step": 61223, "epoch": 737} {"train_loss": -20.779932022094727, "global_step": 61224, "epoch": 737} {"train_loss": -20.679853439331055, "global_step": 61225, "epoch": 737} {"train_loss": -20.4378719329834, "global_step": 61226, "epoch": 737} {"train_loss": -20.12856101989746, "global_step": 61227, "epoch": 737} {"train_loss": -20.3912296295166, "global_step": 61228, "epoch": 737} {"train_loss": -20.304670333862305, "global_step": 61229, "epoch": 737} {"train_loss": -20.38026237487793, "global_step": 61230, "epoch": 737} {"train_loss": -20.491849899291992, "global_step": 61231, "epoch": 737} {"train_loss": -20.658184051513672, "global_step": 61232, "epoch": 737} {"train_loss": -20.06618309020996, "global_step": 61233, "epoch": 737} {"train_loss": -20.749380111694336, "global_step": 61234, "epoch": 737} {"train_loss": -20.290592193603516, "global_step": 61235, "epoch": 737} {"train_loss": -20.9890079498291, "global_step": 61236, "epoch": 737} {"train_loss": -20.628948211669922, "global_step": 61237, "epoch": 737} {"train_loss": -20.338966369628906, "global_step": 61238, "epoch": 737} {"train_loss": -20.782718658447266, "global_step": 61239, "epoch": 737} {"train_loss": -20.13416862487793, "global_step": 61240, "epoch": 737} {"train_loss": -19.878812789916992, "global_step": 61241, "epoch": 737} {"train_loss": -20.469242095947266, "global_step": 61242, "epoch": 737} {"train_loss": -20.351337432861328, "global_step": 61243, "epoch": 737} {"train_loss": -20.5261287689209, "global_step": 61244, "epoch": 737} {"train_loss": -20.51924705505371, "global_step": 61245, "epoch": 737} {"train_loss": -20.526844024658203, "global_step": 61246, "epoch": 737} {"train_loss": -20.4328556060791, "global_step": 61247, "epoch": 737} {"train_loss": -20.3458309173584, "global_step": 61248, "epoch": 737} {"train_loss": -20.75954246520996, "global_step": 61249, "epoch": 737} {"train_loss": -19.99446678161621, "global_step": 61250, "epoch": 737} {"train_loss": -20.5363826751709, "global_step": 61251, "epoch": 737} {"train_loss": -20.248708724975586, "global_step": 61252, "epoch": 737} {"train_loss": -20.389210597578302, "global_step": 61253, "epoch": 737, "val_loss": 5950052.5} {"train_loss": -20.56083106994629, "global_step": 61254, "epoch": 738} {"train_loss": -20.055490493774414, "global_step": 61255, "epoch": 738} {"train_loss": -20.461278915405273, "global_step": 61256, "epoch": 738} {"train_loss": -20.19204330444336, "global_step": 61257, "epoch": 738} {"train_loss": -20.13450050354004, "global_step": 61258, "epoch": 738} {"train_loss": -20.0875301361084, "global_step": 61259, "epoch": 738} {"train_loss": -20.542648315429688, "global_step": 61260, "epoch": 738} {"train_loss": -20.247106552124023, "global_step": 61261, "epoch": 738} {"train_loss": -20.385700225830078, "global_step": 61262, "epoch": 738} {"train_loss": -20.38433265686035, "global_step": 61263, "epoch": 738} {"train_loss": -20.442834854125977, "global_step": 61264, "epoch": 738} {"train_loss": -20.437570571899414, "global_step": 61265, "epoch": 738} {"train_loss": -20.503372192382812, "global_step": 61266, "epoch": 738} {"train_loss": -20.160856246948242, "global_step": 61267, "epoch": 738} {"train_loss": -20.29488182067871, "global_step": 61268, "epoch": 738} {"train_loss": -20.559616088867188, "global_step": 61269, "epoch": 738} {"train_loss": -20.381004333496094, "global_step": 61270, "epoch": 738} {"train_loss": -20.712631225585938, "global_step": 61271, "epoch": 738} {"train_loss": -20.89523696899414, "global_step": 61272, "epoch": 738} {"train_loss": -20.46392250061035, "global_step": 61273, "epoch": 738} {"train_loss": -20.559539794921875, "global_step": 61274, "epoch": 738} {"train_loss": -20.37251091003418, "global_step": 61275, "epoch": 738} {"train_loss": -20.313735961914062, "global_step": 61276, "epoch": 738} {"train_loss": -20.759658813476562, "global_step": 61277, "epoch": 738} {"train_loss": -20.249807357788086, "global_step": 61278, "epoch": 738} {"train_loss": -21.102863311767578, "global_step": 61279, "epoch": 738} {"train_loss": -20.345144271850586, "global_step": 61280, "epoch": 738} {"train_loss": -20.16884422302246, "global_step": 61281, "epoch": 738} {"train_loss": -20.564346313476562, "global_step": 61282, "epoch": 738} {"train_loss": -20.694040298461914, "global_step": 61283, "epoch": 738} {"train_loss": -20.293928146362305, "global_step": 61284, "epoch": 738} {"train_loss": -20.50583267211914, "global_step": 61285, "epoch": 738} {"train_loss": -20.517526626586914, "global_step": 61286, "epoch": 738} {"train_loss": -20.280244827270508, "global_step": 61287, "epoch": 738} {"train_loss": -20.429162979125977, "global_step": 61288, "epoch": 738} {"train_loss": -20.782394409179688, "global_step": 61289, "epoch": 738} {"train_loss": -20.552778244018555, "global_step": 61290, "epoch": 738} {"train_loss": -20.334171295166016, "global_step": 61291, "epoch": 738} {"train_loss": -20.353628158569336, "global_step": 61292, "epoch": 738} {"train_loss": -20.375024795532227, "global_step": 61293, "epoch": 738} {"train_loss": -20.599851608276367, "global_step": 61294, "epoch": 738} {"train_loss": -20.691015243530273, "global_step": 61295, "epoch": 738} {"train_loss": -20.250492095947266, "global_step": 61296, "epoch": 738} {"train_loss": -20.565244674682617, "global_step": 61297, "epoch": 738} {"train_loss": -20.4586238861084, "global_step": 61298, "epoch": 738} {"train_loss": -20.132986068725586, "global_step": 61299, "epoch": 738} {"train_loss": -20.734399795532227, "global_step": 61300, "epoch": 738} {"train_loss": -20.5250186920166, "global_step": 61301, "epoch": 738} {"train_loss": -20.427282333374023, "global_step": 61302, "epoch": 738} {"train_loss": -20.49474334716797, "global_step": 61303, "epoch": 738} {"train_loss": -20.667552947998047, "global_step": 61304, "epoch": 738} {"train_loss": -20.4456729888916, "global_step": 61305, "epoch": 738} {"train_loss": -20.672523498535156, "global_step": 61306, "epoch": 738} {"train_loss": -20.33029556274414, "global_step": 61307, "epoch": 738} {"train_loss": -20.3490047454834, "global_step": 61308, "epoch": 738} {"train_loss": -20.967039108276367, "global_step": 61309, "epoch": 738} {"train_loss": -20.219533920288086, "global_step": 61310, "epoch": 738} {"train_loss": -20.501480102539062, "global_step": 61311, "epoch": 738} {"train_loss": -20.349872589111328, "global_step": 61312, "epoch": 738} {"train_loss": -20.673200607299805, "global_step": 61313, "epoch": 738} {"train_loss": -20.47764015197754, "global_step": 61314, "epoch": 738} {"train_loss": -20.562036514282227, "global_step": 61315, "epoch": 738} {"train_loss": -20.531787872314453, "global_step": 61316, "epoch": 738} {"train_loss": -20.46974754333496, "global_step": 61317, "epoch": 738} {"train_loss": -20.620101928710938, "global_step": 61318, "epoch": 738} {"train_loss": -20.548057556152344, "global_step": 61319, "epoch": 738} {"train_loss": -20.371076583862305, "global_step": 61320, "epoch": 738} {"train_loss": -20.394535064697266, "global_step": 61321, "epoch": 738} {"train_loss": -20.769285202026367, "global_step": 61322, "epoch": 738} {"train_loss": -20.315475463867188, "global_step": 61323, "epoch": 738} {"train_loss": -20.299144744873047, "global_step": 61324, "epoch": 738} {"train_loss": -20.406814575195312, "global_step": 61325, "epoch": 738} {"train_loss": -20.50227928161621, "global_step": 61326, "epoch": 738} {"train_loss": -20.404701232910156, "global_step": 61327, "epoch": 738} {"train_loss": -20.43994140625, "global_step": 61328, "epoch": 738} {"train_loss": -20.433109283447266, "global_step": 61329, "epoch": 738} {"train_loss": -20.40614128112793, "global_step": 61330, "epoch": 738} {"train_loss": -20.622377395629883, "global_step": 61331, "epoch": 738} {"train_loss": -20.191606521606445, "global_step": 61332, "epoch": 738} {"train_loss": -20.215961456298828, "global_step": 61333, "epoch": 738} {"train_loss": -20.273868560791016, "global_step": 61334, "epoch": 738} {"train_loss": -20.456518173217773, "global_step": 61335, "epoch": 738} {"train_loss": -20.456253626260413, "global_step": 61336, "epoch": 738, "val_loss": 5884124.0} {"train_loss": -19.707706451416016, "global_step": 61337, "epoch": 739} {"train_loss": -20.04755973815918, "global_step": 61338, "epoch": 739} {"train_loss": -19.894306182861328, "global_step": 61339, "epoch": 739} {"train_loss": -20.30100440979004, "global_step": 61340, "epoch": 739} {"train_loss": -20.025636672973633, "global_step": 61341, "epoch": 739} {"train_loss": -20.04792594909668, "global_step": 61342, "epoch": 739} {"train_loss": -19.804153442382812, "global_step": 61343, "epoch": 739} {"train_loss": -20.069425582885742, "global_step": 61344, "epoch": 739} {"train_loss": -19.887178421020508, "global_step": 61345, "epoch": 739} {"train_loss": -19.9805850982666, "global_step": 61346, "epoch": 739} {"train_loss": -20.472578048706055, "global_step": 61347, "epoch": 739} {"train_loss": -19.969175338745117, "global_step": 61348, "epoch": 739} {"train_loss": -20.085847854614258, "global_step": 61349, "epoch": 739} {"train_loss": -20.033044815063477, "global_step": 61350, "epoch": 739} {"train_loss": -20.1904354095459, "global_step": 61351, "epoch": 739} {"train_loss": -20.31463050842285, "global_step": 61352, "epoch": 739} {"train_loss": -20.147666931152344, "global_step": 61353, "epoch": 739} {"train_loss": -20.014341354370117, "global_step": 61354, "epoch": 739} {"train_loss": -20.462848663330078, "global_step": 61355, "epoch": 739} {"train_loss": -20.392868041992188, "global_step": 61356, "epoch": 739} {"train_loss": -20.30348014831543, "global_step": 61357, "epoch": 739} {"train_loss": -20.239133834838867, "global_step": 61358, "epoch": 739} {"train_loss": -20.219961166381836, "global_step": 61359, "epoch": 739} {"train_loss": -20.6105899810791, "global_step": 61360, "epoch": 739} {"train_loss": -20.289344787597656, "global_step": 61361, "epoch": 739} {"train_loss": -20.717918395996094, "global_step": 61362, "epoch": 739} {"train_loss": -20.426517486572266, "global_step": 61363, "epoch": 739} {"train_loss": -20.290067672729492, "global_step": 61364, "epoch": 739} {"train_loss": -20.851675033569336, "global_step": 61365, "epoch": 739} {"train_loss": -20.56009864807129, "global_step": 61366, "epoch": 739} {"train_loss": -20.603538513183594, "global_step": 61367, "epoch": 739} {"train_loss": -20.346555709838867, "global_step": 61368, "epoch": 739} {"train_loss": -20.466873168945312, "global_step": 61369, "epoch": 739} {"train_loss": -20.176830291748047, "global_step": 61370, "epoch": 739} {"train_loss": -20.50043296813965, "global_step": 61371, "epoch": 739} {"train_loss": -20.67562484741211, "global_step": 61372, "epoch": 739} {"train_loss": -20.485355377197266, "global_step": 61373, "epoch": 739} {"train_loss": -20.50797462463379, "global_step": 61374, "epoch": 739} {"train_loss": -20.426130294799805, "global_step": 61375, "epoch": 739} {"train_loss": -20.533597946166992, "global_step": 61376, "epoch": 739} {"train_loss": -20.471729278564453, "global_step": 61377, "epoch": 739} {"train_loss": -20.313053131103516, "global_step": 61378, "epoch": 739} {"train_loss": -19.97749900817871, "global_step": 61379, "epoch": 739} {"train_loss": -20.32148551940918, "global_step": 61380, "epoch": 739} {"train_loss": -20.56549072265625, "global_step": 61381, "epoch": 739} {"train_loss": -19.982059478759766, "global_step": 61382, "epoch": 739} {"train_loss": -20.189044952392578, "global_step": 61383, "epoch": 739} {"train_loss": -20.730384826660156, "global_step": 61384, "epoch": 739} {"train_loss": -20.45198631286621, "global_step": 61385, "epoch": 739} {"train_loss": -20.83088493347168, "global_step": 61386, "epoch": 739} {"train_loss": -20.07379150390625, "global_step": 61387, "epoch": 739} {"train_loss": -20.64626693725586, "global_step": 61388, "epoch": 739} {"train_loss": -20.589862823486328, "global_step": 61389, "epoch": 739} {"train_loss": -20.870227813720703, "global_step": 61390, "epoch": 739} {"train_loss": -20.39143180847168, "global_step": 61391, "epoch": 739} {"train_loss": -20.380388259887695, "global_step": 61392, "epoch": 739} {"train_loss": -20.232318878173828, "global_step": 61393, "epoch": 739} {"train_loss": -20.419692993164062, "global_step": 61394, "epoch": 739} {"train_loss": -20.61044692993164, "global_step": 61395, "epoch": 739} {"train_loss": -20.486692428588867, "global_step": 61396, "epoch": 739} {"train_loss": -20.738271713256836, "global_step": 61397, "epoch": 739} {"train_loss": -20.6112117767334, "global_step": 61398, "epoch": 739} {"train_loss": -20.639850616455078, "global_step": 61399, "epoch": 739} {"train_loss": -20.39711570739746, "global_step": 61400, "epoch": 739} {"train_loss": -20.553863525390625, "global_step": 61401, "epoch": 739} {"train_loss": -19.871702194213867, "global_step": 61402, "epoch": 739} {"train_loss": -20.121959686279297, "global_step": 61403, "epoch": 739} {"train_loss": -20.220251083374023, "global_step": 61404, "epoch": 739} {"train_loss": -20.812244415283203, "global_step": 61405, "epoch": 739} {"train_loss": -20.302465438842773, "global_step": 61406, "epoch": 739} {"train_loss": -20.928749084472656, "global_step": 61407, "epoch": 739} {"train_loss": -20.551965713500977, "global_step": 61408, "epoch": 739} {"train_loss": -20.459917068481445, "global_step": 61409, "epoch": 739} {"train_loss": -20.0555477142334, "global_step": 61410, "epoch": 739} {"train_loss": -20.42321014404297, "global_step": 61411, "epoch": 739} {"train_loss": -20.039045333862305, "global_step": 61412, "epoch": 739} {"train_loss": -20.576278686523438, "global_step": 61413, "epoch": 739} {"train_loss": -20.299299240112305, "global_step": 61414, "epoch": 739} {"train_loss": -20.39028549194336, "global_step": 61415, "epoch": 739} {"train_loss": -20.413436889648438, "global_step": 61416, "epoch": 739} {"train_loss": -20.597137451171875, "global_step": 61417, "epoch": 739} {"train_loss": -20.739131927490234, "global_step": 61418, "epoch": 739} {"train_loss": -20.380900394485657, "global_step": 61419, "epoch": 739, "val_loss": 5888607.5} {"train_loss": -20.451358795166016, "global_step": 61420, "epoch": 740} {"train_loss": -20.423343658447266, "global_step": 61421, "epoch": 740} {"train_loss": -20.40395164489746, "global_step": 61422, "epoch": 740} {"train_loss": -20.18084716796875, "global_step": 61423, "epoch": 740} {"train_loss": -20.265005111694336, "global_step": 61424, "epoch": 740} {"train_loss": -20.49617576599121, "global_step": 61425, "epoch": 740} {"train_loss": -20.288713455200195, "global_step": 61426, "epoch": 740} {"train_loss": -20.262332916259766, "global_step": 61427, "epoch": 740} {"train_loss": -20.543813705444336, "global_step": 61428, "epoch": 740} {"train_loss": -20.329574584960938, "global_step": 61429, "epoch": 740} {"train_loss": -19.949560165405273, "global_step": 61430, "epoch": 740} {"train_loss": -20.490982055664062, "global_step": 61431, "epoch": 740} {"train_loss": -20.777421951293945, "global_step": 61432, "epoch": 740} {"train_loss": -20.699466705322266, "global_step": 61433, "epoch": 740} {"train_loss": -20.498510360717773, "global_step": 61434, "epoch": 740} {"train_loss": -20.259918212890625, "global_step": 61435, "epoch": 740} {"train_loss": -20.337997436523438, "global_step": 61436, "epoch": 740} {"train_loss": -20.621591567993164, "global_step": 61437, "epoch": 740} {"train_loss": -20.76862335205078, "global_step": 61438, "epoch": 740} {"train_loss": -20.727949142456055, "global_step": 61439, "epoch": 740} {"train_loss": -20.39609718322754, "global_step": 61440, "epoch": 740} {"train_loss": -20.540496826171875, "global_step": 61441, "epoch": 740} {"train_loss": -20.47256851196289, "global_step": 61442, "epoch": 740} {"train_loss": -20.486373901367188, "global_step": 61443, "epoch": 740} {"train_loss": -20.22260093688965, "global_step": 61444, "epoch": 740} {"train_loss": -20.185932159423828, "global_step": 61445, "epoch": 740} {"train_loss": -20.432462692260742, "global_step": 61446, "epoch": 740} {"train_loss": -19.997329711914062, "global_step": 61447, "epoch": 740} {"train_loss": -20.48695945739746, "global_step": 61448, "epoch": 740} {"train_loss": -20.674192428588867, "global_step": 61449, "epoch": 740} {"train_loss": -20.596065521240234, "global_step": 61450, "epoch": 740} {"train_loss": -20.589853286743164, "global_step": 61451, "epoch": 740} {"train_loss": -20.10666847229004, "global_step": 61452, "epoch": 740} {"train_loss": -20.460268020629883, "global_step": 61453, "epoch": 740} {"train_loss": -20.42186737060547, "global_step": 61454, "epoch": 740} {"train_loss": -20.404211044311523, "global_step": 61455, "epoch": 740} {"train_loss": -20.5839786529541, "global_step": 61456, "epoch": 740} {"train_loss": -20.078054428100586, "global_step": 61457, "epoch": 740} {"train_loss": -20.539581298828125, "global_step": 61458, "epoch": 740} {"train_loss": -20.655914306640625, "global_step": 61459, "epoch": 740} {"train_loss": -20.450605392456055, "global_step": 61460, "epoch": 740} {"train_loss": -20.254961013793945, "global_step": 61461, "epoch": 740} {"train_loss": -21.078800201416016, "global_step": 61462, "epoch": 740} {"train_loss": -20.42774772644043, "global_step": 61463, "epoch": 740} {"train_loss": -20.490652084350586, "global_step": 61464, "epoch": 740} {"train_loss": -20.247848510742188, "global_step": 61465, "epoch": 740} {"train_loss": -20.538768768310547, "global_step": 61466, "epoch": 740} {"train_loss": -20.631803512573242, "global_step": 61467, "epoch": 740} {"train_loss": -20.432058334350586, "global_step": 61468, "epoch": 740} {"train_loss": -20.650251388549805, "global_step": 61469, "epoch": 740} {"train_loss": -20.59471893310547, "global_step": 61470, "epoch": 740} {"train_loss": -20.255422592163086, "global_step": 61471, "epoch": 740} {"train_loss": -20.346994400024414, "global_step": 61472, "epoch": 740} {"train_loss": -20.52164649963379, "global_step": 61473, "epoch": 740} {"train_loss": -20.368932723999023, "global_step": 61474, "epoch": 740} {"train_loss": -20.543001174926758, "global_step": 61475, "epoch": 740} {"train_loss": -20.58918571472168, "global_step": 61476, "epoch": 740} {"train_loss": -20.460376739501953, "global_step": 61477, "epoch": 740} {"train_loss": -20.150510787963867, "global_step": 61478, "epoch": 740} {"train_loss": -20.344921112060547, "global_step": 61479, "epoch": 740} {"train_loss": -20.58987808227539, "global_step": 61480, "epoch": 740} {"train_loss": -20.27449607849121, "global_step": 61481, "epoch": 740} {"train_loss": -20.26065444946289, "global_step": 61482, "epoch": 740} {"train_loss": -20.614553451538086, "global_step": 61483, "epoch": 740} {"train_loss": -20.75320816040039, "global_step": 61484, "epoch": 740} {"train_loss": -20.459003448486328, "global_step": 61485, "epoch": 740} {"train_loss": -20.352109909057617, "global_step": 61486, "epoch": 740} {"train_loss": -20.501575469970703, "global_step": 61487, "epoch": 740} {"train_loss": -20.61266326904297, "global_step": 61488, "epoch": 740} {"train_loss": -20.623897552490234, "global_step": 61489, "epoch": 740} {"train_loss": -20.675830841064453, "global_step": 61490, "epoch": 740} {"train_loss": -20.423093795776367, "global_step": 61491, "epoch": 740} {"train_loss": -20.47612190246582, "global_step": 61492, "epoch": 740} {"train_loss": -20.547378540039062, "global_step": 61493, "epoch": 740} {"train_loss": -20.125246047973633, "global_step": 61494, "epoch": 740} {"train_loss": -20.564878463745117, "global_step": 61495, "epoch": 740} {"train_loss": -20.35756492614746, "global_step": 61496, "epoch": 740} {"train_loss": -20.960166931152344, "global_step": 61497, "epoch": 740} {"train_loss": -20.633548736572266, "global_step": 61498, "epoch": 740} {"train_loss": -20.31585693359375, "global_step": 61499, "epoch": 740} {"train_loss": -20.450536727905273, "global_step": 61500, "epoch": 740} {"train_loss": -20.356191635131836, "global_step": 61501, "epoch": 740} {"train_loss": -20.45303480309176, "global_step": 61502, "epoch": 740, "val_loss": 5955151.5} {"train_loss": -20.37221908569336, "global_step": 61503, "epoch": 741} {"train_loss": -20.125364303588867, "global_step": 61504, "epoch": 741} {"train_loss": -20.08078384399414, "global_step": 61505, "epoch": 741} {"train_loss": -20.511587142944336, "global_step": 61506, "epoch": 741} {"train_loss": -19.863943099975586, "global_step": 61507, "epoch": 741} {"train_loss": -20.17238426208496, "global_step": 61508, "epoch": 741} {"train_loss": -20.439443588256836, "global_step": 61509, "epoch": 741} {"train_loss": -20.241147994995117, "global_step": 61510, "epoch": 741} {"train_loss": -20.353382110595703, "global_step": 61511, "epoch": 741} {"train_loss": -20.193897247314453, "global_step": 61512, "epoch": 741} {"train_loss": -20.2845516204834, "global_step": 61513, "epoch": 741} {"train_loss": -20.415807723999023, "global_step": 61514, "epoch": 741} {"train_loss": -20.215097427368164, "global_step": 61515, "epoch": 741} {"train_loss": -20.635251998901367, "global_step": 61516, "epoch": 741} {"train_loss": -20.155912399291992, "global_step": 61517, "epoch": 741} {"train_loss": -20.544889450073242, "global_step": 61518, "epoch": 741} {"train_loss": -20.597074508666992, "global_step": 61519, "epoch": 741} {"train_loss": -20.71686363220215, "global_step": 61520, "epoch": 741} {"train_loss": -20.362781524658203, "global_step": 61521, "epoch": 741} {"train_loss": -20.596271514892578, "global_step": 61522, "epoch": 741} {"train_loss": -20.511472702026367, "global_step": 61523, "epoch": 741} {"train_loss": -20.85961151123047, "global_step": 61524, "epoch": 741} {"train_loss": -20.269336700439453, "global_step": 61525, "epoch": 741} {"train_loss": -20.502283096313477, "global_step": 61526, "epoch": 741} {"train_loss": -20.724021911621094, "global_step": 61527, "epoch": 741} {"train_loss": -20.52274513244629, "global_step": 61528, "epoch": 741} {"train_loss": -20.1165714263916, "global_step": 61529, "epoch": 741} {"train_loss": -20.22697639465332, "global_step": 61530, "epoch": 741} {"train_loss": -20.7643985748291, "global_step": 61531, "epoch": 741} {"train_loss": -20.343103408813477, "global_step": 61532, "epoch": 741} {"train_loss": -20.343280792236328, "global_step": 61533, "epoch": 741} {"train_loss": -20.343420028686523, "global_step": 61534, "epoch": 741} {"train_loss": -20.404678344726562, "global_step": 61535, "epoch": 741} {"train_loss": -20.22882843017578, "global_step": 61536, "epoch": 741} {"train_loss": -20.284645080566406, "global_step": 61537, "epoch": 741} {"train_loss": -20.661376953125, "global_step": 61538, "epoch": 741} {"train_loss": -20.423818588256836, "global_step": 61539, "epoch": 741} {"train_loss": -20.5693302154541, "global_step": 61540, "epoch": 741} {"train_loss": -20.26200294494629, "global_step": 61541, "epoch": 741} {"train_loss": -20.632810592651367, "global_step": 61542, "epoch": 741} {"train_loss": -20.789772033691406, "global_step": 61543, "epoch": 741} {"train_loss": -20.809595108032227, "global_step": 61544, "epoch": 741} {"train_loss": -20.4470272064209, "global_step": 61545, "epoch": 741} {"train_loss": -20.814979553222656, "global_step": 61546, "epoch": 741} {"train_loss": -20.743284225463867, "global_step": 61547, "epoch": 741} {"train_loss": -20.045846939086914, "global_step": 61548, "epoch": 741} {"train_loss": -20.458593368530273, "global_step": 61549, "epoch": 741} {"train_loss": -19.971975326538086, "global_step": 61550, "epoch": 741} {"train_loss": -20.432849884033203, "global_step": 61551, "epoch": 741} {"train_loss": -20.20445442199707, "global_step": 61552, "epoch": 741} {"train_loss": -20.560951232910156, "global_step": 61553, "epoch": 741} {"train_loss": -20.7460994720459, "global_step": 61554, "epoch": 741} {"train_loss": -20.518047332763672, "global_step": 61555, "epoch": 741} {"train_loss": -20.03877830505371, "global_step": 61556, "epoch": 741} {"train_loss": -20.368471145629883, "global_step": 61557, "epoch": 741} {"train_loss": -20.441448211669922, "global_step": 61558, "epoch": 741} {"train_loss": -20.48680305480957, "global_step": 61559, "epoch": 741} {"train_loss": -20.31368637084961, "global_step": 61560, "epoch": 741} {"train_loss": -20.060840606689453, "global_step": 61561, "epoch": 741} {"train_loss": -20.477331161499023, "global_step": 61562, "epoch": 741} {"train_loss": -20.511457443237305, "global_step": 61563, "epoch": 741} {"train_loss": -20.440292358398438, "global_step": 61564, "epoch": 741} {"train_loss": -20.38063621520996, "global_step": 61565, "epoch": 741} {"train_loss": -20.913070678710938, "global_step": 61566, "epoch": 741} {"train_loss": -20.430620193481445, "global_step": 61567, "epoch": 741} {"train_loss": -20.476381301879883, "global_step": 61568, "epoch": 741} {"train_loss": -20.6203670501709, "global_step": 61569, "epoch": 741} {"train_loss": -20.29445457458496, "global_step": 61570, "epoch": 741} {"train_loss": -20.4100399017334, "global_step": 61571, "epoch": 741} {"train_loss": -19.98505210876465, "global_step": 61572, "epoch": 741} {"train_loss": -20.42593002319336, "global_step": 61573, "epoch": 741} {"train_loss": -20.571279525756836, "global_step": 61574, "epoch": 741} {"train_loss": -20.189924240112305, "global_step": 61575, "epoch": 741} {"train_loss": -20.357404708862305, "global_step": 61576, "epoch": 741} {"train_loss": -20.62264060974121, "global_step": 61577, "epoch": 741} {"train_loss": -20.605283737182617, "global_step": 61578, "epoch": 741} {"train_loss": -20.103527069091797, "global_step": 61579, "epoch": 741} {"train_loss": -20.682838439941406, "global_step": 61580, "epoch": 741} {"train_loss": -20.555313110351562, "global_step": 61581, "epoch": 741} {"train_loss": -20.3636531829834, "global_step": 61582, "epoch": 741} {"train_loss": -20.58909034729004, "global_step": 61583, "epoch": 741} {"train_loss": -20.589765548706055, "global_step": 61584, "epoch": 741} {"train_loss": -20.42635251240558, "global_step": 61585, "epoch": 741, "val_loss": 5962056.5} {"train_loss": -20.165836334228516, "global_step": 61586, "epoch": 742} {"train_loss": -20.43507194519043, "global_step": 61587, "epoch": 742} {"train_loss": -20.33129119873047, "global_step": 61588, "epoch": 742} {"train_loss": -20.22559928894043, "global_step": 61589, "epoch": 742} {"train_loss": -20.53853988647461, "global_step": 61590, "epoch": 742} {"train_loss": -20.060638427734375, "global_step": 61591, "epoch": 742} {"train_loss": -20.253610610961914, "global_step": 61592, "epoch": 742} {"train_loss": -20.3708553314209, "global_step": 61593, "epoch": 742} {"train_loss": -20.24466323852539, "global_step": 61594, "epoch": 742} {"train_loss": -20.488147735595703, "global_step": 61595, "epoch": 742} {"train_loss": -20.307077407836914, "global_step": 61596, "epoch": 742} {"train_loss": -20.302350997924805, "global_step": 61597, "epoch": 742} {"train_loss": -20.501358032226562, "global_step": 61598, "epoch": 742} {"train_loss": -20.169431686401367, "global_step": 61599, "epoch": 742} {"train_loss": -20.38629150390625, "global_step": 61600, "epoch": 742} {"train_loss": -20.8021183013916, "global_step": 61601, "epoch": 742} {"train_loss": -20.188892364501953, "global_step": 61602, "epoch": 742} {"train_loss": -20.66816520690918, "global_step": 61603, "epoch": 742} {"train_loss": -20.55852699279785, "global_step": 61604, "epoch": 742} {"train_loss": -20.77838706970215, "global_step": 61605, "epoch": 742} {"train_loss": -20.342357635498047, "global_step": 61606, "epoch": 742} {"train_loss": -20.213909149169922, "global_step": 61607, "epoch": 742} {"train_loss": -20.338459014892578, "global_step": 61608, "epoch": 742} {"train_loss": -20.517513275146484, "global_step": 61609, "epoch": 742} {"train_loss": -20.44844627380371, "global_step": 61610, "epoch": 742} {"train_loss": -20.664762496948242, "global_step": 61611, "epoch": 742} {"train_loss": -20.639753341674805, "global_step": 61612, "epoch": 742} {"train_loss": -20.669763565063477, "global_step": 61613, "epoch": 742} {"train_loss": -20.568435668945312, "global_step": 61614, "epoch": 742} {"train_loss": -20.446033477783203, "global_step": 61615, "epoch": 742} {"train_loss": -20.83805274963379, "global_step": 61616, "epoch": 742} {"train_loss": -20.091856002807617, "global_step": 61617, "epoch": 742} {"train_loss": -20.778011322021484, "global_step": 61618, "epoch": 742} {"train_loss": -20.292402267456055, "global_step": 61619, "epoch": 742} {"train_loss": -20.043989181518555, "global_step": 61620, "epoch": 742} {"train_loss": -20.033004760742188, "global_step": 61621, "epoch": 742} {"train_loss": -20.626386642456055, "global_step": 61622, "epoch": 742} {"train_loss": -20.242094039916992, "global_step": 61623, "epoch": 742} {"train_loss": -20.346006393432617, "global_step": 61624, "epoch": 742} {"train_loss": -20.07572364807129, "global_step": 61625, "epoch": 742} {"train_loss": -20.147113800048828, "global_step": 61626, "epoch": 742} {"train_loss": -20.40069007873535, "global_step": 61627, "epoch": 742} {"train_loss": -20.349029541015625, "global_step": 61628, "epoch": 742} {"train_loss": -20.416305541992188, "global_step": 61629, "epoch": 742} {"train_loss": -20.403535842895508, "global_step": 61630, "epoch": 742} {"train_loss": -20.27715492248535, "global_step": 61631, "epoch": 742} {"train_loss": -20.430166244506836, "global_step": 61632, "epoch": 742} {"train_loss": -20.260908126831055, "global_step": 61633, "epoch": 742} {"train_loss": -20.221097946166992, "global_step": 61634, "epoch": 742} {"train_loss": -20.43444061279297, "global_step": 61635, "epoch": 742} {"train_loss": -20.809906005859375, "global_step": 61636, "epoch": 742} {"train_loss": -20.7642765045166, "global_step": 61637, "epoch": 742} {"train_loss": -20.421545028686523, "global_step": 61638, "epoch": 742} {"train_loss": -20.42902183532715, "global_step": 61639, "epoch": 742} {"train_loss": -20.649328231811523, "global_step": 61640, "epoch": 742} {"train_loss": -20.18052101135254, "global_step": 61641, "epoch": 742} {"train_loss": -20.269041061401367, "global_step": 61642, "epoch": 742} {"train_loss": -20.708892822265625, "global_step": 61643, "epoch": 742} {"train_loss": -20.487985610961914, "global_step": 61644, "epoch": 742} {"train_loss": -20.196651458740234, "global_step": 61645, "epoch": 742} {"train_loss": -20.517236709594727, "global_step": 61646, "epoch": 742} {"train_loss": -20.681217193603516, "global_step": 61647, "epoch": 742} {"train_loss": -20.111515045166016, "global_step": 61648, "epoch": 742} {"train_loss": -20.53000259399414, "global_step": 61649, "epoch": 742} {"train_loss": -20.437284469604492, "global_step": 61650, "epoch": 742} {"train_loss": -20.240131378173828, "global_step": 61651, "epoch": 742} {"train_loss": -20.45328712463379, "global_step": 61652, "epoch": 742} {"train_loss": -20.426233291625977, "global_step": 61653, "epoch": 742} {"train_loss": -20.164737701416016, "global_step": 61654, "epoch": 742} {"train_loss": -20.4224910736084, "global_step": 61655, "epoch": 742} {"train_loss": -20.48067855834961, "global_step": 61656, "epoch": 742} {"train_loss": -20.291582107543945, "global_step": 61657, "epoch": 742} {"train_loss": -20.200469970703125, "global_step": 61658, "epoch": 742} {"train_loss": -20.626541137695312, "global_step": 61659, "epoch": 742} {"train_loss": -20.299074172973633, "global_step": 61660, "epoch": 742} {"train_loss": -20.295530319213867, "global_step": 61661, "epoch": 742} {"train_loss": -20.148656845092773, "global_step": 61662, "epoch": 742} {"train_loss": -20.390316009521484, "global_step": 61663, "epoch": 742} {"train_loss": -20.840211868286133, "global_step": 61664, "epoch": 742} {"train_loss": -20.22769546508789, "global_step": 61665, "epoch": 742} {"train_loss": -20.294227600097656, "global_step": 61666, "epoch": 742} {"train_loss": -20.5125675201416, "global_step": 61667, "epoch": 742} {"train_loss": -20.40182922547122, "global_step": 61668, "epoch": 742, "val_loss": 5938846.0} {"train_loss": -20.152362823486328, "global_step": 61669, "epoch": 743} {"train_loss": -20.1115779876709, "global_step": 61670, "epoch": 743} {"train_loss": -20.456201553344727, "global_step": 61671, "epoch": 743} {"train_loss": -20.294607162475586, "global_step": 61672, "epoch": 743} {"train_loss": -20.250974655151367, "global_step": 61673, "epoch": 743} {"train_loss": -20.553232192993164, "global_step": 61674, "epoch": 743} {"train_loss": -20.095325469970703, "global_step": 61675, "epoch": 743} {"train_loss": -20.5528621673584, "global_step": 61676, "epoch": 743} {"train_loss": -20.276010513305664, "global_step": 61677, "epoch": 743} {"train_loss": -20.51185417175293, "global_step": 61678, "epoch": 743} {"train_loss": -19.816558837890625, "global_step": 61679, "epoch": 743} {"train_loss": -20.12929344177246, "global_step": 61680, "epoch": 743} {"train_loss": -19.969778060913086, "global_step": 61681, "epoch": 743} {"train_loss": -20.29811668395996, "global_step": 61682, "epoch": 743} {"train_loss": -20.41273307800293, "global_step": 61683, "epoch": 743} {"train_loss": -20.55998420715332, "global_step": 61684, "epoch": 743} {"train_loss": -20.060741424560547, "global_step": 61685, "epoch": 743} {"train_loss": -20.11784553527832, "global_step": 61686, "epoch": 743} {"train_loss": -20.323667526245117, "global_step": 61687, "epoch": 743} {"train_loss": -20.379108428955078, "global_step": 61688, "epoch": 743} {"train_loss": -20.560583114624023, "global_step": 61689, "epoch": 743} {"train_loss": -20.41187858581543, "global_step": 61690, "epoch": 743} {"train_loss": -20.535629272460938, "global_step": 61691, "epoch": 743} {"train_loss": -20.343042373657227, "global_step": 61692, "epoch": 743} {"train_loss": -20.30396842956543, "global_step": 61693, "epoch": 743} {"train_loss": -20.98854637145996, "global_step": 61694, "epoch": 743} {"train_loss": -20.51618003845215, "global_step": 61695, "epoch": 743} {"train_loss": -20.218053817749023, "global_step": 61696, "epoch": 743} {"train_loss": -20.405237197875977, "global_step": 61697, "epoch": 743} {"train_loss": -19.9311580657959, "global_step": 61698, "epoch": 743} {"train_loss": -20.24129867553711, "global_step": 61699, "epoch": 743} {"train_loss": -20.557559967041016, "global_step": 61700, "epoch": 743} {"train_loss": -20.3740234375, "global_step": 61701, "epoch": 743} {"train_loss": -20.669721603393555, "global_step": 61702, "epoch": 743} {"train_loss": -20.173337936401367, "global_step": 61703, "epoch": 743} {"train_loss": -20.404687881469727, "global_step": 61704, "epoch": 743} {"train_loss": -20.504981994628906, "global_step": 61705, "epoch": 743} {"train_loss": -20.633872985839844, "global_step": 61706, "epoch": 743} {"train_loss": -20.066085815429688, "global_step": 61707, "epoch": 743} {"train_loss": -20.27412986755371, "global_step": 61708, "epoch": 743} {"train_loss": -20.853757858276367, "global_step": 61709, "epoch": 743} {"train_loss": -20.803606033325195, "global_step": 61710, "epoch": 743} {"train_loss": -20.40333366394043, "global_step": 61711, "epoch": 743} {"train_loss": -20.1838436126709, "global_step": 61712, "epoch": 743} {"train_loss": -20.576871871948242, "global_step": 61713, "epoch": 743} {"train_loss": -20.677562713623047, "global_step": 61714, "epoch": 743} {"train_loss": -20.1713809967041, "global_step": 61715, "epoch": 743} {"train_loss": -20.211280822753906, "global_step": 61716, "epoch": 743} {"train_loss": -20.44963264465332, "global_step": 61717, "epoch": 743} {"train_loss": -20.383869171142578, "global_step": 61718, "epoch": 743} {"train_loss": -20.617578506469727, "global_step": 61719, "epoch": 743} {"train_loss": -20.2155818939209, "global_step": 61720, "epoch": 743} {"train_loss": -20.352567672729492, "global_step": 61721, "epoch": 743} {"train_loss": -20.525503158569336, "global_step": 61722, "epoch": 743} {"train_loss": -20.529071807861328, "global_step": 61723, "epoch": 743} {"train_loss": -20.85259437561035, "global_step": 61724, "epoch": 743} {"train_loss": -20.44338035583496, "global_step": 61725, "epoch": 743} {"train_loss": -20.427122116088867, "global_step": 61726, "epoch": 743} {"train_loss": -20.513999938964844, "global_step": 61727, "epoch": 743} {"train_loss": -20.742544174194336, "global_step": 61728, "epoch": 743} {"train_loss": -20.60822296142578, "global_step": 61729, "epoch": 743} {"train_loss": -20.595401763916016, "global_step": 61730, "epoch": 743} {"train_loss": -20.49581527709961, "global_step": 61731, "epoch": 743} {"train_loss": -20.53388023376465, "global_step": 61732, "epoch": 743} {"train_loss": -20.438152313232422, "global_step": 61733, "epoch": 743} {"train_loss": -20.711763381958008, "global_step": 61734, "epoch": 743} {"train_loss": -20.525135040283203, "global_step": 61735, "epoch": 743} {"train_loss": -19.935016632080078, "global_step": 61736, "epoch": 743} {"train_loss": -20.361265182495117, "global_step": 61737, "epoch": 743} {"train_loss": -20.04297637939453, "global_step": 61738, "epoch": 743} {"train_loss": -20.107309341430664, "global_step": 61739, "epoch": 743} {"train_loss": -20.53265953063965, "global_step": 61740, "epoch": 743} {"train_loss": -20.26579475402832, "global_step": 61741, "epoch": 743} {"train_loss": -20.548221588134766, "global_step": 61742, "epoch": 743} {"train_loss": -20.33588218688965, "global_step": 61743, "epoch": 743} {"train_loss": -20.307981491088867, "global_step": 61744, "epoch": 743} {"train_loss": -20.600940704345703, "global_step": 61745, "epoch": 743} {"train_loss": -20.17730712890625, "global_step": 61746, "epoch": 743} {"train_loss": -20.6501407623291, "global_step": 61747, "epoch": 743} {"train_loss": -20.5152587890625, "global_step": 61748, "epoch": 743} {"train_loss": -20.640186309814453, "global_step": 61749, "epoch": 743} {"train_loss": -20.741125106811523, "global_step": 61750, "epoch": 743} {"train_loss": -20.403522652315807, "global_step": 61751, "epoch": 743, "val_loss": 5949896.0} {"train_loss": -20.08033561706543, "global_step": 61752, "epoch": 744} {"train_loss": -19.754497528076172, "global_step": 61753, "epoch": 744} {"train_loss": -19.671659469604492, "global_step": 61754, "epoch": 744} {"train_loss": -20.27837562561035, "global_step": 61755, "epoch": 744} {"train_loss": -20.15399742126465, "global_step": 61756, "epoch": 744} {"train_loss": -20.0493221282959, "global_step": 61757, "epoch": 744} {"train_loss": -20.25829315185547, "global_step": 61758, "epoch": 744} {"train_loss": -20.155330657958984, "global_step": 61759, "epoch": 744} {"train_loss": -20.304737091064453, "global_step": 61760, "epoch": 744} {"train_loss": -20.0699520111084, "global_step": 61761, "epoch": 744} {"train_loss": -20.19297218322754, "global_step": 61762, "epoch": 744} {"train_loss": -20.250288009643555, "global_step": 61763, "epoch": 744} {"train_loss": -20.05747413635254, "global_step": 61764, "epoch": 744} {"train_loss": -20.162145614624023, "global_step": 61765, "epoch": 744} {"train_loss": -20.375715255737305, "global_step": 61766, "epoch": 744} {"train_loss": -20.3933048248291, "global_step": 61767, "epoch": 744} {"train_loss": -20.51676368713379, "global_step": 61768, "epoch": 744} {"train_loss": -20.452062606811523, "global_step": 61769, "epoch": 744} {"train_loss": -20.585309982299805, "global_step": 61770, "epoch": 744} {"train_loss": -20.268545150756836, "global_step": 61771, "epoch": 744} {"train_loss": -20.026288986206055, "global_step": 61772, "epoch": 744} {"train_loss": -20.3541202545166, "global_step": 61773, "epoch": 744} {"train_loss": -20.802505493164062, "global_step": 61774, "epoch": 744} {"train_loss": -19.94209861755371, "global_step": 61775, "epoch": 744} {"train_loss": -20.577672958374023, "global_step": 61776, "epoch": 744} {"train_loss": -20.5673828125, "global_step": 61777, "epoch": 744} {"train_loss": -20.43858528137207, "global_step": 61778, "epoch": 744} {"train_loss": -20.61207389831543, "global_step": 61779, "epoch": 744} {"train_loss": -20.753314971923828, "global_step": 61780, "epoch": 744} {"train_loss": -20.525949478149414, "global_step": 61781, "epoch": 744} {"train_loss": -20.62000846862793, "global_step": 61782, "epoch": 744} {"train_loss": -20.544652938842773, "global_step": 61783, "epoch": 744} {"train_loss": -20.556161880493164, "global_step": 61784, "epoch": 744} {"train_loss": -20.45191764831543, "global_step": 61785, "epoch": 744} {"train_loss": -20.18004608154297, "global_step": 61786, "epoch": 744} {"train_loss": -20.14425277709961, "global_step": 61787, "epoch": 744} {"train_loss": -20.32349395751953, "global_step": 61788, "epoch": 744} {"train_loss": -20.755781173706055, "global_step": 61789, "epoch": 744} {"train_loss": -20.353408813476562, "global_step": 61790, "epoch": 744} {"train_loss": -20.90781021118164, "global_step": 61791, "epoch": 744} {"train_loss": -20.313932418823242, "global_step": 61792, "epoch": 744} {"train_loss": -20.673416137695312, "global_step": 61793, "epoch": 744} {"train_loss": -20.664867401123047, "global_step": 61794, "epoch": 744} {"train_loss": -20.354345321655273, "global_step": 61795, "epoch": 744} {"train_loss": -20.558631896972656, "global_step": 61796, "epoch": 744} {"train_loss": -20.88679313659668, "global_step": 61797, "epoch": 744} {"train_loss": -20.3914737701416, "global_step": 61798, "epoch": 744} {"train_loss": -20.58280372619629, "global_step": 61799, "epoch": 744} {"train_loss": -20.63671875, "global_step": 61800, "epoch": 744} {"train_loss": -20.366514205932617, "global_step": 61801, "epoch": 744} {"train_loss": -19.945035934448242, "global_step": 61802, "epoch": 744} {"train_loss": -20.200223922729492, "global_step": 61803, "epoch": 744} {"train_loss": -20.680727005004883, "global_step": 61804, "epoch": 744} {"train_loss": -20.722991943359375, "global_step": 61805, "epoch": 744} {"train_loss": -20.403600692749023, "global_step": 61806, "epoch": 744} {"train_loss": -20.52902603149414, "global_step": 61807, "epoch": 744} {"train_loss": -20.708967208862305, "global_step": 61808, "epoch": 744} {"train_loss": -20.294071197509766, "global_step": 61809, "epoch": 744} {"train_loss": -20.47979736328125, "global_step": 61810, "epoch": 744} {"train_loss": -20.572498321533203, "global_step": 61811, "epoch": 744} {"train_loss": -20.694395065307617, "global_step": 61812, "epoch": 744} {"train_loss": -20.5738582611084, "global_step": 61813, "epoch": 744} {"train_loss": -20.593154907226562, "global_step": 61814, "epoch": 744} {"train_loss": -20.498559951782227, "global_step": 61815, "epoch": 744} {"train_loss": -20.622861862182617, "global_step": 61816, "epoch": 744} {"train_loss": -20.48720359802246, "global_step": 61817, "epoch": 744} {"train_loss": -20.34203338623047, "global_step": 61818, "epoch": 744} {"train_loss": -20.415502548217773, "global_step": 61819, "epoch": 744} {"train_loss": -20.441116333007812, "global_step": 61820, "epoch": 744} {"train_loss": -20.215068817138672, "global_step": 61821, "epoch": 744} {"train_loss": -21.128995895385742, "global_step": 61822, "epoch": 744} {"train_loss": -20.34552764892578, "global_step": 61823, "epoch": 744} {"train_loss": -20.848331451416016, "global_step": 61824, "epoch": 744} {"train_loss": -20.628482818603516, "global_step": 61825, "epoch": 744} {"train_loss": -20.411449432373047, "global_step": 61826, "epoch": 744} {"train_loss": -20.625913619995117, "global_step": 61827, "epoch": 744} {"train_loss": -20.931928634643555, "global_step": 61828, "epoch": 744} {"train_loss": -20.735960006713867, "global_step": 61829, "epoch": 744} {"train_loss": -20.702505111694336, "global_step": 61830, "epoch": 744} {"train_loss": -20.53857421875, "global_step": 61831, "epoch": 744} {"train_loss": -20.233745574951172, "global_step": 61832, "epoch": 744} {"train_loss": -20.48313331604004, "global_step": 61833, "epoch": 744} {"train_loss": -20.4334699561797, "global_step": 61834, "epoch": 744, "val_loss": 6190052.0} {"train_loss": -19.640308380126953, "global_step": 61835, "epoch": 745} {"train_loss": -19.79682731628418, "global_step": 61836, "epoch": 745} {"train_loss": -20.34540367126465, "global_step": 61837, "epoch": 745} {"train_loss": -19.542083740234375, "global_step": 61838, "epoch": 745} {"train_loss": -20.284549713134766, "global_step": 61839, "epoch": 745} {"train_loss": -19.94246482849121, "global_step": 61840, "epoch": 745} {"train_loss": -20.341825485229492, "global_step": 61841, "epoch": 745} {"train_loss": -20.098352432250977, "global_step": 61842, "epoch": 745} {"train_loss": -20.308063507080078, "global_step": 61843, "epoch": 745} {"train_loss": -20.24477195739746, "global_step": 61844, "epoch": 745} {"train_loss": -20.32076072692871, "global_step": 61845, "epoch": 745} {"train_loss": -20.07822036743164, "global_step": 61846, "epoch": 745} {"train_loss": -20.231029510498047, "global_step": 61847, "epoch": 745} {"train_loss": -20.182016372680664, "global_step": 61848, "epoch": 745} {"train_loss": -20.25266456604004, "global_step": 61849, "epoch": 745} {"train_loss": -20.375818252563477, "global_step": 61850, "epoch": 745} {"train_loss": -20.390094757080078, "global_step": 61851, "epoch": 745} {"train_loss": -20.50812530517578, "global_step": 61852, "epoch": 745} {"train_loss": -20.51148796081543, "global_step": 61853, "epoch": 745} {"train_loss": -20.61289405822754, "global_step": 61854, "epoch": 745} {"train_loss": -20.49386978149414, "global_step": 61855, "epoch": 745} {"train_loss": -20.41594886779785, "global_step": 61856, "epoch": 745} {"train_loss": -20.328702926635742, "global_step": 61857, "epoch": 745} {"train_loss": -20.661108016967773, "global_step": 61858, "epoch": 745} {"train_loss": -20.16366958618164, "global_step": 61859, "epoch": 745} {"train_loss": -20.329483032226562, "global_step": 61860, "epoch": 745} {"train_loss": -20.733930587768555, "global_step": 61861, "epoch": 745} {"train_loss": -20.02126121520996, "global_step": 61862, "epoch": 745} {"train_loss": -20.449499130249023, "global_step": 61863, "epoch": 745} {"train_loss": -20.71554946899414, "global_step": 61864, "epoch": 745} {"train_loss": -20.232633590698242, "global_step": 61865, "epoch": 745} {"train_loss": -20.29529571533203, "global_step": 61866, "epoch": 745} {"train_loss": -20.46573257446289, "global_step": 61867, "epoch": 745} {"train_loss": -20.492305755615234, "global_step": 61868, "epoch": 745} {"train_loss": -20.408578872680664, "global_step": 61869, "epoch": 745} {"train_loss": -20.420072555541992, "global_step": 61870, "epoch": 745} {"train_loss": -20.476871490478516, "global_step": 61871, "epoch": 745} {"train_loss": -20.66792106628418, "global_step": 61872, "epoch": 745} {"train_loss": -20.44232749938965, "global_step": 61873, "epoch": 745} {"train_loss": -20.340900421142578, "global_step": 61874, "epoch": 745} {"train_loss": -20.060712814331055, "global_step": 61875, "epoch": 745} {"train_loss": -20.849523544311523, "global_step": 61876, "epoch": 745} {"train_loss": -20.298755645751953, "global_step": 61877, "epoch": 745} {"train_loss": -20.706954956054688, "global_step": 61878, "epoch": 745} {"train_loss": -20.311513900756836, "global_step": 61879, "epoch": 745} {"train_loss": -20.352930068969727, "global_step": 61880, "epoch": 745} {"train_loss": -20.44352149963379, "global_step": 61881, "epoch": 745} {"train_loss": -20.702228546142578, "global_step": 61882, "epoch": 745} {"train_loss": -20.411029815673828, "global_step": 61883, "epoch": 745} {"train_loss": -20.406253814697266, "global_step": 61884, "epoch": 745} {"train_loss": -20.792646408081055, "global_step": 61885, "epoch": 745} {"train_loss": -21.017723083496094, "global_step": 61886, "epoch": 745} {"train_loss": -20.569469451904297, "global_step": 61887, "epoch": 745} {"train_loss": -20.331274032592773, "global_step": 61888, "epoch": 745} {"train_loss": -20.66163444519043, "global_step": 61889, "epoch": 745} {"train_loss": -20.389371871948242, "global_step": 61890, "epoch": 745} {"train_loss": -20.260282516479492, "global_step": 61891, "epoch": 745} {"train_loss": -20.811033248901367, "global_step": 61892, "epoch": 745} {"train_loss": -20.712900161743164, "global_step": 61893, "epoch": 745} {"train_loss": -20.399076461791992, "global_step": 61894, "epoch": 745} {"train_loss": -20.994592666625977, "global_step": 61895, "epoch": 745} {"train_loss": -20.665258407592773, "global_step": 61896, "epoch": 745} {"train_loss": -20.44765281677246, "global_step": 61897, "epoch": 745} {"train_loss": -20.123151779174805, "global_step": 61898, "epoch": 745} {"train_loss": -20.285480499267578, "global_step": 61899, "epoch": 745} {"train_loss": -20.45795249938965, "global_step": 61900, "epoch": 745} {"train_loss": -20.522863388061523, "global_step": 61901, "epoch": 745} {"train_loss": -20.80044937133789, "global_step": 61902, "epoch": 745} {"train_loss": -20.397497177124023, "global_step": 61903, "epoch": 745} {"train_loss": -20.651636123657227, "global_step": 61904, "epoch": 745} {"train_loss": -20.822195053100586, "global_step": 61905, "epoch": 745} {"train_loss": -20.234268188476562, "global_step": 61906, "epoch": 745} {"train_loss": -20.610271453857422, "global_step": 61907, "epoch": 745} {"train_loss": -20.429441452026367, "global_step": 61908, "epoch": 745} {"train_loss": -20.53407096862793, "global_step": 61909, "epoch": 745} {"train_loss": -20.496854782104492, "global_step": 61910, "epoch": 745} {"train_loss": -20.516271591186523, "global_step": 61911, "epoch": 745} {"train_loss": -20.430089950561523, "global_step": 61912, "epoch": 745} {"train_loss": -20.43876075744629, "global_step": 61913, "epoch": 745} {"train_loss": -20.640588760375977, "global_step": 61914, "epoch": 745} {"train_loss": -20.568164825439453, "global_step": 61915, "epoch": 745} {"train_loss": -20.60463523864746, "global_step": 61916, "epoch": 745} {"train_loss": -20.417022268456147, "global_step": 61917, "epoch": 745, "val_loss": 5858698.0} {"train_loss": -20.285215377807617, "global_step": 61918, "epoch": 746} {"train_loss": -20.4672794342041, "global_step": 61919, "epoch": 746} {"train_loss": -19.401647567749023, "global_step": 61920, "epoch": 746} {"train_loss": -20.21247673034668, "global_step": 61921, "epoch": 746} {"train_loss": -20.12645721435547, "global_step": 61922, "epoch": 746} {"train_loss": -20.299772262573242, "global_step": 61923, "epoch": 746} {"train_loss": -20.212406158447266, "global_step": 61924, "epoch": 746} {"train_loss": -20.32905387878418, "global_step": 61925, "epoch": 746} {"train_loss": -20.434499740600586, "global_step": 61926, "epoch": 746} {"train_loss": -20.186424255371094, "global_step": 61927, "epoch": 746} {"train_loss": -20.48098373413086, "global_step": 61928, "epoch": 746} {"train_loss": -20.188718795776367, "global_step": 61929, "epoch": 746} {"train_loss": -20.233476638793945, "global_step": 61930, "epoch": 746} {"train_loss": -20.277156829833984, "global_step": 61931, "epoch": 746} {"train_loss": -20.56378746032715, "global_step": 61932, "epoch": 746} {"train_loss": -20.29215431213379, "global_step": 61933, "epoch": 746} {"train_loss": -20.605554580688477, "global_step": 61934, "epoch": 746} {"train_loss": -20.188739776611328, "global_step": 61935, "epoch": 746} {"train_loss": -20.607120513916016, "global_step": 61936, "epoch": 746} {"train_loss": -20.334131240844727, "global_step": 61937, "epoch": 746} {"train_loss": -20.082202911376953, "global_step": 61938, "epoch": 746} {"train_loss": -20.512331008911133, "global_step": 61939, "epoch": 746} {"train_loss": -20.2745361328125, "global_step": 61940, "epoch": 746} {"train_loss": -20.516359329223633, "global_step": 61941, "epoch": 746} {"train_loss": -20.044103622436523, "global_step": 61942, "epoch": 746} {"train_loss": -20.49441146850586, "global_step": 61943, "epoch": 746} {"train_loss": -20.378646850585938, "global_step": 61944, "epoch": 746} {"train_loss": -20.409482955932617, "global_step": 61945, "epoch": 746} {"train_loss": -20.715829849243164, "global_step": 61946, "epoch": 746} {"train_loss": -20.554773330688477, "global_step": 61947, "epoch": 746} {"train_loss": -20.606916427612305, "global_step": 61948, "epoch": 746} {"train_loss": -20.636310577392578, "global_step": 61949, "epoch": 746} {"train_loss": -20.64784812927246, "global_step": 61950, "epoch": 746} {"train_loss": -20.520288467407227, "global_step": 61951, "epoch": 746} {"train_loss": -20.45260238647461, "global_step": 61952, "epoch": 746} {"train_loss": -20.533109664916992, "global_step": 61953, "epoch": 746} {"train_loss": -20.55660629272461, "global_step": 61954, "epoch": 746} {"train_loss": -20.454782485961914, "global_step": 61955, "epoch": 746} {"train_loss": -20.728744506835938, "global_step": 61956, "epoch": 746} {"train_loss": -20.58323097229004, "global_step": 61957, "epoch": 746} {"train_loss": -20.504837036132812, "global_step": 61958, "epoch": 746} {"train_loss": -20.393381118774414, "global_step": 61959, "epoch": 746} {"train_loss": -20.661123275756836, "global_step": 61960, "epoch": 746} {"train_loss": -20.546554565429688, "global_step": 61961, "epoch": 746} {"train_loss": -20.555822372436523, "global_step": 61962, "epoch": 746} {"train_loss": -20.296466827392578, "global_step": 61963, "epoch": 746} {"train_loss": -20.5013370513916, "global_step": 61964, "epoch": 746} {"train_loss": -20.45182228088379, "global_step": 61965, "epoch": 746} {"train_loss": -20.65064239501953, "global_step": 61966, "epoch": 746} {"train_loss": -20.38154411315918, "global_step": 61967, "epoch": 746} {"train_loss": -20.642433166503906, "global_step": 61968, "epoch": 746} {"train_loss": -20.62697410583496, "global_step": 61969, "epoch": 746} {"train_loss": -20.207345962524414, "global_step": 61970, "epoch": 746} {"train_loss": -19.9930362701416, "global_step": 61971, "epoch": 746} {"train_loss": -20.398937225341797, "global_step": 61972, "epoch": 746} {"train_loss": -20.584623336791992, "global_step": 61973, "epoch": 746} {"train_loss": -20.22932243347168, "global_step": 61974, "epoch": 746} {"train_loss": -20.211496353149414, "global_step": 61975, "epoch": 746} {"train_loss": -20.494110107421875, "global_step": 61976, "epoch": 746} {"train_loss": -20.46184730529785, "global_step": 61977, "epoch": 746} {"train_loss": -20.804140090942383, "global_step": 61978, "epoch": 746} {"train_loss": -20.12319564819336, "global_step": 61979, "epoch": 746} {"train_loss": -20.364002227783203, "global_step": 61980, "epoch": 746} {"train_loss": -20.114370346069336, "global_step": 61981, "epoch": 746} {"train_loss": -20.663110733032227, "global_step": 61982, "epoch": 746} {"train_loss": -20.348264694213867, "global_step": 61983, "epoch": 746} {"train_loss": -20.46187400817871, "global_step": 61984, "epoch": 746} {"train_loss": -20.172561645507812, "global_step": 61985, "epoch": 746} {"train_loss": -20.73245620727539, "global_step": 61986, "epoch": 746} {"train_loss": -20.598072052001953, "global_step": 61987, "epoch": 746} {"train_loss": -19.892858505249023, "global_step": 61988, "epoch": 746} {"train_loss": -20.261533737182617, "global_step": 61989, "epoch": 746} {"train_loss": -20.170642852783203, "global_step": 61990, "epoch": 746} {"train_loss": -20.707029342651367, "global_step": 61991, "epoch": 746} {"train_loss": -20.635913848876953, "global_step": 61992, "epoch": 746} {"train_loss": -20.61602210998535, "global_step": 61993, "epoch": 746} {"train_loss": -20.056013107299805, "global_step": 61994, "epoch": 746} {"train_loss": -20.34661865234375, "global_step": 61995, "epoch": 746} {"train_loss": -20.15680503845215, "global_step": 61996, "epoch": 746} {"train_loss": -20.63229751586914, "global_step": 61997, "epoch": 746} {"train_loss": -20.7652645111084, "global_step": 61998, "epoch": 746} {"train_loss": -20.659549713134766, "global_step": 61999, "epoch": 746} {"train_loss": -20.41644275619323, "global_step": 62000, "epoch": 746, "val_loss": 5981009.5} {"train_loss": -20.512182235717773, "global_step": 62001, "epoch": 747} {"train_loss": -20.55841064453125, "global_step": 62002, "epoch": 747} {"train_loss": -20.187564849853516, "global_step": 62003, "epoch": 747} {"train_loss": -20.267942428588867, "global_step": 62004, "epoch": 747} {"train_loss": -20.06757164001465, "global_step": 62005, "epoch": 747} {"train_loss": -20.672739028930664, "global_step": 62006, "epoch": 747} {"train_loss": -20.52695083618164, "global_step": 62007, "epoch": 747} {"train_loss": -20.5176944732666, "global_step": 62008, "epoch": 747} {"train_loss": -20.652929306030273, "global_step": 62009, "epoch": 747} {"train_loss": -20.529172897338867, "global_step": 62010, "epoch": 747} {"train_loss": -20.277679443359375, "global_step": 62011, "epoch": 747} {"train_loss": -20.166730880737305, "global_step": 62012, "epoch": 747} {"train_loss": -20.54734230041504, "global_step": 62013, "epoch": 747} {"train_loss": -20.735010147094727, "global_step": 62014, "epoch": 747} {"train_loss": -20.33655548095703, "global_step": 62015, "epoch": 747} {"train_loss": -20.375947952270508, "global_step": 62016, "epoch": 747} {"train_loss": -20.529619216918945, "global_step": 62017, "epoch": 747} {"train_loss": -20.567750930786133, "global_step": 62018, "epoch": 747} {"train_loss": -20.5755558013916, "global_step": 62019, "epoch": 747} {"train_loss": -20.10483169555664, "global_step": 62020, "epoch": 747} {"train_loss": -20.10263442993164, "global_step": 62021, "epoch": 747} {"train_loss": -20.19496726989746, "global_step": 62022, "epoch": 747} {"train_loss": -20.255840301513672, "global_step": 62023, "epoch": 747} {"train_loss": -20.373165130615234, "global_step": 62024, "epoch": 747} {"train_loss": -20.63471794128418, "global_step": 62025, "epoch": 747} {"train_loss": -20.396617889404297, "global_step": 62026, "epoch": 747} {"train_loss": -20.544443130493164, "global_step": 62027, "epoch": 747} {"train_loss": -20.67767906188965, "global_step": 62028, "epoch": 747} {"train_loss": -20.565053939819336, "global_step": 62029, "epoch": 747} {"train_loss": -20.248517990112305, "global_step": 62030, "epoch": 747} {"train_loss": -20.217281341552734, "global_step": 62031, "epoch": 747} {"train_loss": -20.637819290161133, "global_step": 62032, "epoch": 747} {"train_loss": -20.22968101501465, "global_step": 62033, "epoch": 747} {"train_loss": -20.54532241821289, "global_step": 62034, "epoch": 747} {"train_loss": -20.548391342163086, "global_step": 62035, "epoch": 747} {"train_loss": -20.835403442382812, "global_step": 62036, "epoch": 747} {"train_loss": -20.729671478271484, "global_step": 62037, "epoch": 747} {"train_loss": -20.312604904174805, "global_step": 62038, "epoch": 747} {"train_loss": -20.218215942382812, "global_step": 62039, "epoch": 747} {"train_loss": -20.323719024658203, "global_step": 62040, "epoch": 747} {"train_loss": -20.358572006225586, "global_step": 62041, "epoch": 747} {"train_loss": -20.264249801635742, "global_step": 62042, "epoch": 747} {"train_loss": -20.579910278320312, "global_step": 62043, "epoch": 747} {"train_loss": -20.39237403869629, "global_step": 62044, "epoch": 747} {"train_loss": -20.577682495117188, "global_step": 62045, "epoch": 747} {"train_loss": -20.611814498901367, "global_step": 62046, "epoch": 747} {"train_loss": -20.780380249023438, "global_step": 62047, "epoch": 747} {"train_loss": -20.33763313293457, "global_step": 62048, "epoch": 747} {"train_loss": -20.45179557800293, "global_step": 62049, "epoch": 747} {"train_loss": -20.41072654724121, "global_step": 62050, "epoch": 747} {"train_loss": -20.584489822387695, "global_step": 62051, "epoch": 747} {"train_loss": -20.707321166992188, "global_step": 62052, "epoch": 747} {"train_loss": -20.584280014038086, "global_step": 62053, "epoch": 747} {"train_loss": -20.881855010986328, "global_step": 62054, "epoch": 747} {"train_loss": -20.237764358520508, "global_step": 62055, "epoch": 747} {"train_loss": -20.641815185546875, "global_step": 62056, "epoch": 747} {"train_loss": -20.29127311706543, "global_step": 62057, "epoch": 747} {"train_loss": -20.594831466674805, "global_step": 62058, "epoch": 747} {"train_loss": -20.44085121154785, "global_step": 62059, "epoch": 747} {"train_loss": -20.547998428344727, "global_step": 62060, "epoch": 747} {"train_loss": -20.75220489501953, "global_step": 62061, "epoch": 747} {"train_loss": -20.424646377563477, "global_step": 62062, "epoch": 747} {"train_loss": -20.391523361206055, "global_step": 62063, "epoch": 747} {"train_loss": -20.64471435546875, "global_step": 62064, "epoch": 747} {"train_loss": -20.51362419128418, "global_step": 62065, "epoch": 747} {"train_loss": -20.810834884643555, "global_step": 62066, "epoch": 747} {"train_loss": -20.717981338500977, "global_step": 62067, "epoch": 747} {"train_loss": -20.61355972290039, "global_step": 62068, "epoch": 747} {"train_loss": -20.604171752929688, "global_step": 62069, "epoch": 747} {"train_loss": -20.795551300048828, "global_step": 62070, "epoch": 747} {"train_loss": -20.26202392578125, "global_step": 62071, "epoch": 747} {"train_loss": -20.581899642944336, "global_step": 62072, "epoch": 747} {"train_loss": -20.753496170043945, "global_step": 62073, "epoch": 747} {"train_loss": -20.217302322387695, "global_step": 62074, "epoch": 747} {"train_loss": -20.22096061706543, "global_step": 62075, "epoch": 747} {"train_loss": -20.03387451171875, "global_step": 62076, "epoch": 747} {"train_loss": -20.882858276367188, "global_step": 62077, "epoch": 747} {"train_loss": -20.678298950195312, "global_step": 62078, "epoch": 747} {"train_loss": -20.69733428955078, "global_step": 62079, "epoch": 747} {"train_loss": -20.437284469604492, "global_step": 62080, "epoch": 747} {"train_loss": -20.161298751831055, "global_step": 62081, "epoch": 747} {"train_loss": -20.221372604370117, "global_step": 62082, "epoch": 747} {"train_loss": -20.46278408923781, "global_step": 62083, "epoch": 747, "val_loss": 5865455.0} {"train_loss": -19.810985565185547, "global_step": 62084, "epoch": 748} {"train_loss": -20.349905014038086, "global_step": 62085, "epoch": 748} {"train_loss": -20.3223934173584, "global_step": 62086, "epoch": 748} {"train_loss": -20.342092514038086, "global_step": 62087, "epoch": 748} {"train_loss": -20.0645809173584, "global_step": 62088, "epoch": 748} {"train_loss": -20.370586395263672, "global_step": 62089, "epoch": 748} {"train_loss": -20.339202880859375, "global_step": 62090, "epoch": 748} {"train_loss": -20.21242332458496, "global_step": 62091, "epoch": 748} {"train_loss": -20.06271743774414, "global_step": 62092, "epoch": 748} {"train_loss": -20.30149269104004, "global_step": 62093, "epoch": 748} {"train_loss": -20.404760360717773, "global_step": 62094, "epoch": 748} {"train_loss": -20.676969528198242, "global_step": 62095, "epoch": 748} {"train_loss": -20.334278106689453, "global_step": 62096, "epoch": 748} {"train_loss": -20.52231216430664, "global_step": 62097, "epoch": 748} {"train_loss": -20.371572494506836, "global_step": 62098, "epoch": 748} {"train_loss": -20.3922176361084, "global_step": 62099, "epoch": 748} {"train_loss": -20.376310348510742, "global_step": 62100, "epoch": 748} {"train_loss": -20.189220428466797, "global_step": 62101, "epoch": 748} {"train_loss": -20.2198429107666, "global_step": 62102, "epoch": 748} {"train_loss": -20.4512882232666, "global_step": 62103, "epoch": 748} {"train_loss": -20.317855834960938, "global_step": 62104, "epoch": 748} {"train_loss": -20.496334075927734, "global_step": 62105, "epoch": 748} {"train_loss": -20.4794864654541, "global_step": 62106, "epoch": 748} {"train_loss": -20.527414321899414, "global_step": 62107, "epoch": 748} {"train_loss": -20.547473907470703, "global_step": 62108, "epoch": 748} {"train_loss": -20.390037536621094, "global_step": 62109, "epoch": 748} {"train_loss": -20.54636001586914, "global_step": 62110, "epoch": 748} {"train_loss": -20.710582733154297, "global_step": 62111, "epoch": 748} {"train_loss": -20.113927841186523, "global_step": 62112, "epoch": 748} {"train_loss": -20.631725311279297, "global_step": 62113, "epoch": 748} {"train_loss": -20.484617233276367, "global_step": 62114, "epoch": 748} {"train_loss": -20.782949447631836, "global_step": 62115, "epoch": 748} {"train_loss": -20.784378051757812, "global_step": 62116, "epoch": 748} {"train_loss": -20.322019577026367, "global_step": 62117, "epoch": 748} {"train_loss": -20.58697509765625, "global_step": 62118, "epoch": 748} {"train_loss": -20.493972778320312, "global_step": 62119, "epoch": 748} {"train_loss": -20.303272247314453, "global_step": 62120, "epoch": 748} {"train_loss": -20.49269676208496, "global_step": 62121, "epoch": 748} {"train_loss": -20.468618392944336, "global_step": 62122, "epoch": 748} {"train_loss": -20.864694595336914, "global_step": 62123, "epoch": 748} {"train_loss": -20.905858993530273, "global_step": 62124, "epoch": 748} {"train_loss": -20.133840560913086, "global_step": 62125, "epoch": 748} {"train_loss": -20.490192413330078, "global_step": 62126, "epoch": 748} {"train_loss": -20.26370620727539, "global_step": 62127, "epoch": 748} {"train_loss": -20.884384155273438, "global_step": 62128, "epoch": 748} {"train_loss": -20.699298858642578, "global_step": 62129, "epoch": 748} {"train_loss": -20.371763229370117, "global_step": 62130, "epoch": 748} {"train_loss": -20.453500747680664, "global_step": 62131, "epoch": 748} {"train_loss": -20.28571891784668, "global_step": 62132, "epoch": 748} {"train_loss": -20.697021484375, "global_step": 62133, "epoch": 748} {"train_loss": -20.522628784179688, "global_step": 62134, "epoch": 748} {"train_loss": -20.31488037109375, "global_step": 62135, "epoch": 748} {"train_loss": -20.373794555664062, "global_step": 62136, "epoch": 748} {"train_loss": -20.313657760620117, "global_step": 62137, "epoch": 748} {"train_loss": -20.058582305908203, "global_step": 62138, "epoch": 748} {"train_loss": -20.52634620666504, "global_step": 62139, "epoch": 748} {"train_loss": -20.47882080078125, "global_step": 62140, "epoch": 748} {"train_loss": -20.32154655456543, "global_step": 62141, "epoch": 748} {"train_loss": -20.707517623901367, "global_step": 62142, "epoch": 748} {"train_loss": -20.777589797973633, "global_step": 62143, "epoch": 748} {"train_loss": -20.260101318359375, "global_step": 62144, "epoch": 748} {"train_loss": -20.400346755981445, "global_step": 62145, "epoch": 748} {"train_loss": -20.691482543945312, "global_step": 62146, "epoch": 748} {"train_loss": -20.655261993408203, "global_step": 62147, "epoch": 748} {"train_loss": -20.9761962890625, "global_step": 62148, "epoch": 748} {"train_loss": -20.4368839263916, "global_step": 62149, "epoch": 748} {"train_loss": -20.475330352783203, "global_step": 62150, "epoch": 748} {"train_loss": -20.89009666442871, "global_step": 62151, "epoch": 748} {"train_loss": -20.114076614379883, "global_step": 62152, "epoch": 748} {"train_loss": -20.4295654296875, "global_step": 62153, "epoch": 748} {"train_loss": -20.558645248413086, "global_step": 62154, "epoch": 748} {"train_loss": -20.437589645385742, "global_step": 62155, "epoch": 748} {"train_loss": -20.18024444580078, "global_step": 62156, "epoch": 748} {"train_loss": -19.85748863220215, "global_step": 62157, "epoch": 748} {"train_loss": -20.613861083984375, "global_step": 62158, "epoch": 748} {"train_loss": -20.55192756652832, "global_step": 62159, "epoch": 748} {"train_loss": -20.875505447387695, "global_step": 62160, "epoch": 748} {"train_loss": -20.6715145111084, "global_step": 62161, "epoch": 748} {"train_loss": -20.421567916870117, "global_step": 62162, "epoch": 748} {"train_loss": -20.93716812133789, "global_step": 62163, "epoch": 748} {"train_loss": -20.459396362304688, "global_step": 62164, "epoch": 748} {"train_loss": -20.639236450195312, "global_step": 62165, "epoch": 748} {"train_loss": -20.47815463054611, "global_step": 62166, "epoch": 748, "val_loss": 6051251.0} {"train_loss": -19.527450561523438, "global_step": 62167, "epoch": 749} {"train_loss": -20.62410545349121, "global_step": 62168, "epoch": 749} {"train_loss": -19.910953521728516, "global_step": 62169, "epoch": 749} {"train_loss": -20.201541900634766, "global_step": 62170, "epoch": 749} {"train_loss": -20.242095947265625, "global_step": 62171, "epoch": 749} {"train_loss": -20.01392936706543, "global_step": 62172, "epoch": 749} {"train_loss": -20.55315589904785, "global_step": 62173, "epoch": 749} {"train_loss": -20.137672424316406, "global_step": 62174, "epoch": 749} {"train_loss": -19.971742630004883, "global_step": 62175, "epoch": 749} {"train_loss": -20.6453914642334, "global_step": 62176, "epoch": 749} {"train_loss": -20.30432891845703, "global_step": 62177, "epoch": 749} {"train_loss": -20.5008602142334, "global_step": 62178, "epoch": 749} {"train_loss": -20.193666458129883, "global_step": 62179, "epoch": 749} {"train_loss": -20.153566360473633, "global_step": 62180, "epoch": 749} {"train_loss": -20.586286544799805, "global_step": 62181, "epoch": 749} {"train_loss": -20.10956382751465, "global_step": 62182, "epoch": 749} {"train_loss": -20.20256996154785, "global_step": 62183, "epoch": 749} {"train_loss": -20.556259155273438, "global_step": 62184, "epoch": 749} {"train_loss": -20.299360275268555, "global_step": 62185, "epoch": 749} {"train_loss": -20.47200584411621, "global_step": 62186, "epoch": 749} {"train_loss": -20.291975021362305, "global_step": 62187, "epoch": 749} {"train_loss": -20.376781463623047, "global_step": 62188, "epoch": 749} {"train_loss": -20.487728118896484, "global_step": 62189, "epoch": 749} {"train_loss": -20.383459091186523, "global_step": 62190, "epoch": 749} {"train_loss": -20.522729873657227, "global_step": 62191, "epoch": 749} {"train_loss": -20.702598571777344, "global_step": 62192, "epoch": 749} {"train_loss": -20.44041633605957, "global_step": 62193, "epoch": 749} {"train_loss": -20.819305419921875, "global_step": 62194, "epoch": 749} {"train_loss": -20.293853759765625, "global_step": 62195, "epoch": 749} {"train_loss": -20.570941925048828, "global_step": 62196, "epoch": 749} {"train_loss": -20.68659782409668, "global_step": 62197, "epoch": 749} {"train_loss": -20.488000869750977, "global_step": 62198, "epoch": 749} {"train_loss": -20.583791732788086, "global_step": 62199, "epoch": 749} {"train_loss": -20.49437141418457, "global_step": 62200, "epoch": 749} {"train_loss": -20.24324607849121, "global_step": 62201, "epoch": 749} {"train_loss": -20.44585609436035, "global_step": 62202, "epoch": 749} {"train_loss": -20.537824630737305, "global_step": 62203, "epoch": 749} {"train_loss": -20.42255401611328, "global_step": 62204, "epoch": 749} {"train_loss": -20.80531120300293, "global_step": 62205, "epoch": 749} {"train_loss": -20.16836929321289, "global_step": 62206, "epoch": 749} {"train_loss": -20.52717399597168, "global_step": 62207, "epoch": 749} {"train_loss": -20.50743865966797, "global_step": 62208, "epoch": 749} {"train_loss": -20.395715713500977, "global_step": 62209, "epoch": 749} {"train_loss": -20.48916244506836, "global_step": 62210, "epoch": 749} {"train_loss": -20.557573318481445, "global_step": 62211, "epoch": 749} {"train_loss": -20.62441062927246, "global_step": 62212, "epoch": 749} {"train_loss": -20.492948532104492, "global_step": 62213, "epoch": 749} {"train_loss": -20.42396354675293, "global_step": 62214, "epoch": 749} {"train_loss": -20.41291618347168, "global_step": 62215, "epoch": 749} {"train_loss": -20.338727951049805, "global_step": 62216, "epoch": 749} {"train_loss": -20.38749122619629, "global_step": 62217, "epoch": 749} {"train_loss": -20.34505844116211, "global_step": 62218, "epoch": 749} {"train_loss": -20.40199851989746, "global_step": 62219, "epoch": 749} {"train_loss": -20.55677604675293, "global_step": 62220, "epoch": 749} {"train_loss": -20.509565353393555, "global_step": 62221, "epoch": 749} {"train_loss": -20.44289207458496, "global_step": 62222, "epoch": 749} {"train_loss": -20.26513671875, "global_step": 62223, "epoch": 749} {"train_loss": -20.62957191467285, "global_step": 62224, "epoch": 749} {"train_loss": -20.341562271118164, "global_step": 62225, "epoch": 749} {"train_loss": -20.640506744384766, "global_step": 62226, "epoch": 749} {"train_loss": -20.583110809326172, "global_step": 62227, "epoch": 749} {"train_loss": -20.630399703979492, "global_step": 62228, "epoch": 749} {"train_loss": -19.84571647644043, "global_step": 62229, "epoch": 749} {"train_loss": -20.54046630859375, "global_step": 62230, "epoch": 749} {"train_loss": -20.169952392578125, "global_step": 62231, "epoch": 749} {"train_loss": -20.457015991210938, "global_step": 62232, "epoch": 749} {"train_loss": -20.450363159179688, "global_step": 62233, "epoch": 749} {"train_loss": -20.582965850830078, "global_step": 62234, "epoch": 749} {"train_loss": -20.491735458374023, "global_step": 62235, "epoch": 749} {"train_loss": -20.65012550354004, "global_step": 62236, "epoch": 749} {"train_loss": -20.64942741394043, "global_step": 62237, "epoch": 749} {"train_loss": -20.230445861816406, "global_step": 62238, "epoch": 749} {"train_loss": -20.2611026763916, "global_step": 62239, "epoch": 749} {"train_loss": -20.495832443237305, "global_step": 62240, "epoch": 749} {"train_loss": -20.35353660583496, "global_step": 62241, "epoch": 749} {"train_loss": -20.807035446166992, "global_step": 62242, "epoch": 749} {"train_loss": -20.630949020385742, "global_step": 62243, "epoch": 749} {"train_loss": -20.389860153198242, "global_step": 62244, "epoch": 749} {"train_loss": -20.818145751953125, "global_step": 62245, "epoch": 749} {"train_loss": -20.43890953063965, "global_step": 62246, "epoch": 749} {"train_loss": -20.814945220947266, "global_step": 62247, "epoch": 749} {"train_loss": -20.204389572143555, "global_step": 62248, "epoch": 749} {"train_loss": -20.4237117767334, "global_step": 62249, "epoch": 749, "val_loss": 5970577.0} {"train_loss": -20.18897819519043, "global_step": 62250, "epoch": 750} {"train_loss": -20.344085693359375, "global_step": 62251, "epoch": 750} {"train_loss": -19.916015625, "global_step": 62252, "epoch": 750} {"train_loss": -20.23616600036621, "global_step": 62253, "epoch": 750} {"train_loss": -20.315502166748047, "global_step": 62254, "epoch": 750} {"train_loss": -20.14550018310547, "global_step": 62255, "epoch": 750} {"train_loss": -20.072376251220703, "global_step": 62256, "epoch": 750} {"train_loss": -20.27048110961914, "global_step": 62257, "epoch": 750} {"train_loss": -20.158353805541992, "global_step": 62258, "epoch": 750} {"train_loss": -20.306365966796875, "global_step": 62259, "epoch": 750} {"train_loss": -20.08245277404785, "global_step": 62260, "epoch": 750} {"train_loss": -20.330852508544922, "global_step": 62261, "epoch": 750} {"train_loss": -20.541757583618164, "global_step": 62262, "epoch": 750} {"train_loss": -20.786514282226562, "global_step": 62263, "epoch": 750} {"train_loss": -20.531566619873047, "global_step": 62264, "epoch": 750} {"train_loss": -20.27931022644043, "global_step": 62265, "epoch": 750} {"train_loss": -20.518163681030273, "global_step": 62266, "epoch": 750} {"train_loss": -20.329063415527344, "global_step": 62267, "epoch": 750} {"train_loss": -20.676856994628906, "global_step": 62268, "epoch": 750} {"train_loss": -20.622467041015625, "global_step": 62269, "epoch": 750} {"train_loss": -20.47597312927246, "global_step": 62270, "epoch": 750} {"train_loss": -20.957015991210938, "global_step": 62271, "epoch": 750} {"train_loss": -20.480072021484375, "global_step": 62272, "epoch": 750} {"train_loss": -20.528974533081055, "global_step": 62273, "epoch": 750} {"train_loss": -20.371891021728516, "global_step": 62274, "epoch": 750} {"train_loss": -20.588851928710938, "global_step": 62275, "epoch": 750} {"train_loss": -20.44033432006836, "global_step": 62276, "epoch": 750} {"train_loss": -20.365341186523438, "global_step": 62277, "epoch": 750} {"train_loss": -20.087528228759766, "global_step": 62278, "epoch": 750} {"train_loss": -20.593358993530273, "global_step": 62279, "epoch": 750} {"train_loss": -20.441312789916992, "global_step": 62280, "epoch": 750} {"train_loss": -20.31298828125, "global_step": 62281, "epoch": 750} {"train_loss": -20.704282760620117, "global_step": 62282, "epoch": 750} {"train_loss": -20.585533142089844, "global_step": 62283, "epoch": 750} {"train_loss": -20.205472946166992, "global_step": 62284, "epoch": 750} {"train_loss": -20.430252075195312, "global_step": 62285, "epoch": 750} {"train_loss": -20.5367488861084, "global_step": 62286, "epoch": 750} {"train_loss": -20.389684677124023, "global_step": 62287, "epoch": 750} {"train_loss": -20.194568634033203, "global_step": 62288, "epoch": 750} {"train_loss": -20.71377944946289, "global_step": 62289, "epoch": 750} {"train_loss": -21.088376998901367, "global_step": 62290, "epoch": 750} {"train_loss": -20.628726959228516, "global_step": 62291, "epoch": 750} {"train_loss": -20.71600914001465, "global_step": 62292, "epoch": 750} {"train_loss": -20.52829933166504, "global_step": 62293, "epoch": 750} {"train_loss": -20.4851016998291, "global_step": 62294, "epoch": 750} {"train_loss": -20.131214141845703, "global_step": 62295, "epoch": 750} {"train_loss": -20.31217384338379, "global_step": 62296, "epoch": 750} {"train_loss": -20.51104736328125, "global_step": 62297, "epoch": 750} {"train_loss": -20.17823600769043, "global_step": 62298, "epoch": 750} {"train_loss": -20.485557556152344, "global_step": 62299, "epoch": 750} {"train_loss": -20.373779296875, "global_step": 62300, "epoch": 750} {"train_loss": -20.673646926879883, "global_step": 62301, "epoch": 750} {"train_loss": -20.45705223083496, "global_step": 62302, "epoch": 750} {"train_loss": -20.312252044677734, "global_step": 62303, "epoch": 750} {"train_loss": -20.791242599487305, "global_step": 62304, "epoch": 750} {"train_loss": -20.233675003051758, "global_step": 62305, "epoch": 750} {"train_loss": -20.7215633392334, "global_step": 62306, "epoch": 750} {"train_loss": -20.567529678344727, "global_step": 62307, "epoch": 750} {"train_loss": -20.43446922302246, "global_step": 62308, "epoch": 750} {"train_loss": -20.216764450073242, "global_step": 62309, "epoch": 750} {"train_loss": -20.674667358398438, "global_step": 62310, "epoch": 750} {"train_loss": -20.44834327697754, "global_step": 62311, "epoch": 750} {"train_loss": -20.418914794921875, "global_step": 62312, "epoch": 750} {"train_loss": -20.40679931640625, "global_step": 62313, "epoch": 750} {"train_loss": -20.277618408203125, "global_step": 62314, "epoch": 750} {"train_loss": -20.590177536010742, "global_step": 62315, "epoch": 750} {"train_loss": -20.469593048095703, "global_step": 62316, "epoch": 750} {"train_loss": -20.254812240600586, "global_step": 62317, "epoch": 750} {"train_loss": -20.62139320373535, "global_step": 62318, "epoch": 750} {"train_loss": -21.152389526367188, "global_step": 62319, "epoch": 750} {"train_loss": -20.374502182006836, "global_step": 62320, "epoch": 750} {"train_loss": -20.594894409179688, "global_step": 62321, "epoch": 750} {"train_loss": -20.193334579467773, "global_step": 62322, "epoch": 750} {"train_loss": -20.368772506713867, "global_step": 62323, "epoch": 750} {"train_loss": -20.940635681152344, "global_step": 62324, "epoch": 750} {"train_loss": -20.389419555664062, "global_step": 62325, "epoch": 750} {"train_loss": -20.637609481811523, "global_step": 62326, "epoch": 750} {"train_loss": -20.678760528564453, "global_step": 62327, "epoch": 750} {"train_loss": -20.66019630432129, "global_step": 62328, "epoch": 750} {"train_loss": -20.869428634643555, "global_step": 62329, "epoch": 750} {"train_loss": -21.14301109313965, "global_step": 62330, "epoch": 750} {"train_loss": -20.726409912109375, "global_step": 62331, "epoch": 750} {"train_loss": -20.475939325539464, "global_step": 62332, "epoch": 750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6032471.5} {"train_loss": -20.38722801208496, "global_step": 62333, "epoch": 751} {"train_loss": -20.298046112060547, "global_step": 62334, "epoch": 751} {"train_loss": -20.573856353759766, "global_step": 62335, "epoch": 751} {"train_loss": -20.417387008666992, "global_step": 62336, "epoch": 751} {"train_loss": -20.1291561126709, "global_step": 62337, "epoch": 751} {"train_loss": -20.85199546813965, "global_step": 62338, "epoch": 751} {"train_loss": -20.396404266357422, "global_step": 62339, "epoch": 751} {"train_loss": -20.34261131286621, "global_step": 62340, "epoch": 751} {"train_loss": -20.400543212890625, "global_step": 62341, "epoch": 751} {"train_loss": -20.421207427978516, "global_step": 62342, "epoch": 751} {"train_loss": -20.484031677246094, "global_step": 62343, "epoch": 751} {"train_loss": -20.30305290222168, "global_step": 62344, "epoch": 751} {"train_loss": -20.59235954284668, "global_step": 62345, "epoch": 751} {"train_loss": -20.352445602416992, "global_step": 62346, "epoch": 751} {"train_loss": -20.640695571899414, "global_step": 62347, "epoch": 751} {"train_loss": -20.41941261291504, "global_step": 62348, "epoch": 751} {"train_loss": -20.267553329467773, "global_step": 62349, "epoch": 751} {"train_loss": -20.540630340576172, "global_step": 62350, "epoch": 751} {"train_loss": -20.0756778717041, "global_step": 62351, "epoch": 751} {"train_loss": -20.49911880493164, "global_step": 62352, "epoch": 751} {"train_loss": -20.252485275268555, "global_step": 62353, "epoch": 751} {"train_loss": -20.54825210571289, "global_step": 62354, "epoch": 751} {"train_loss": -20.376367568969727, "global_step": 62355, "epoch": 751} {"train_loss": -20.366107940673828, "global_step": 62356, "epoch": 751} {"train_loss": -20.50471305847168, "global_step": 62357, "epoch": 751} {"train_loss": -20.37054443359375, "global_step": 62358, "epoch": 751} {"train_loss": -20.21407127380371, "global_step": 62359, "epoch": 751} {"train_loss": -20.201810836791992, "global_step": 62360, "epoch": 751} {"train_loss": -20.278833389282227, "global_step": 62361, "epoch": 751} {"train_loss": -20.751516342163086, "global_step": 62362, "epoch": 751} {"train_loss": -20.653644561767578, "global_step": 62363, "epoch": 751} {"train_loss": -20.45208740234375, "global_step": 62364, "epoch": 751} {"train_loss": -20.76692771911621, "global_step": 62365, "epoch": 751} {"train_loss": -20.80466079711914, "global_step": 62366, "epoch": 751} {"train_loss": -20.565866470336914, "global_step": 62367, "epoch": 751} {"train_loss": -20.594282150268555, "global_step": 62368, "epoch": 751} {"train_loss": -20.07659912109375, "global_step": 62369, "epoch": 751} {"train_loss": -20.45744514465332, "global_step": 62370, "epoch": 751} {"train_loss": -20.250043869018555, "global_step": 62371, "epoch": 751} {"train_loss": -20.375402450561523, "global_step": 62372, "epoch": 751} {"train_loss": -20.54347801208496, "global_step": 62373, "epoch": 751} {"train_loss": -20.402841567993164, "global_step": 62374, "epoch": 751} {"train_loss": -20.378570556640625, "global_step": 62375, "epoch": 751} {"train_loss": -20.62294578552246, "global_step": 62376, "epoch": 751} {"train_loss": -20.402847290039062, "global_step": 62377, "epoch": 751} {"train_loss": -20.413881301879883, "global_step": 62378, "epoch": 751} {"train_loss": -20.542112350463867, "global_step": 62379, "epoch": 751} {"train_loss": -20.41163444519043, "global_step": 62380, "epoch": 751} {"train_loss": -20.593994140625, "global_step": 62381, "epoch": 751} {"train_loss": -20.430158615112305, "global_step": 62382, "epoch": 751} {"train_loss": -20.56662940979004, "global_step": 62383, "epoch": 751} {"train_loss": -20.631853103637695, "global_step": 62384, "epoch": 751} {"train_loss": -20.294919967651367, "global_step": 62385, "epoch": 751} {"train_loss": -20.172361373901367, "global_step": 62386, "epoch": 751} {"train_loss": -20.549057006835938, "global_step": 62387, "epoch": 751} {"train_loss": -20.614978790283203, "global_step": 62388, "epoch": 751} {"train_loss": -20.65696144104004, "global_step": 62389, "epoch": 751} {"train_loss": -20.198501586914062, "global_step": 62390, "epoch": 751} {"train_loss": -20.595884323120117, "global_step": 62391, "epoch": 751} {"train_loss": -20.596467971801758, "global_step": 62392, "epoch": 751} {"train_loss": -20.21843147277832, "global_step": 62393, "epoch": 751} {"train_loss": -20.58339500427246, "global_step": 62394, "epoch": 751} {"train_loss": -20.70532989501953, "global_step": 62395, "epoch": 751} {"train_loss": -20.25912857055664, "global_step": 62396, "epoch": 751} {"train_loss": -20.736398696899414, "global_step": 62397, "epoch": 751} {"train_loss": -20.28379249572754, "global_step": 62398, "epoch": 751} {"train_loss": -20.290054321289062, "global_step": 62399, "epoch": 751} {"train_loss": -20.44350242614746, "global_step": 62400, "epoch": 751} {"train_loss": -20.27326011657715, "global_step": 62401, "epoch": 751} {"train_loss": -20.576780319213867, "global_step": 62402, "epoch": 751} {"train_loss": -20.755634307861328, "global_step": 62403, "epoch": 751} {"train_loss": -20.611156463623047, "global_step": 62404, "epoch": 751} {"train_loss": -20.385055541992188, "global_step": 62405, "epoch": 751} {"train_loss": -20.503936767578125, "global_step": 62406, "epoch": 751} {"train_loss": -20.706924438476562, "global_step": 62407, "epoch": 751} {"train_loss": -20.47732925415039, "global_step": 62408, "epoch": 751} {"train_loss": -20.464445114135742, "global_step": 62409, "epoch": 751} {"train_loss": -20.650882720947266, "global_step": 62410, "epoch": 751} {"train_loss": -20.473770141601562, "global_step": 62411, "epoch": 751} {"train_loss": -20.463912963867188, "global_step": 62412, "epoch": 751} {"train_loss": -20.6417179107666, "global_step": 62413, "epoch": 751} {"train_loss": -20.756786346435547, "global_step": 62414, "epoch": 751} {"train_loss": -20.47670341399779, "global_step": 62415, "epoch": 751, "val_loss": 5885759.0} {"train_loss": -19.889436721801758, "global_step": 62416, "epoch": 752} {"train_loss": -20.30988121032715, "global_step": 62417, "epoch": 752} {"train_loss": -20.54106903076172, "global_step": 62418, "epoch": 752} {"train_loss": -20.30793571472168, "global_step": 62419, "epoch": 752} {"train_loss": -20.173969268798828, "global_step": 62420, "epoch": 752} {"train_loss": -20.261077880859375, "global_step": 62421, "epoch": 752} {"train_loss": -20.2139835357666, "global_step": 62422, "epoch": 752} {"train_loss": -20.15947723388672, "global_step": 62423, "epoch": 752} {"train_loss": -20.153776168823242, "global_step": 62424, "epoch": 752} {"train_loss": -20.263500213623047, "global_step": 62425, "epoch": 752} {"train_loss": -20.338886260986328, "global_step": 62426, "epoch": 752} {"train_loss": -20.351163864135742, "global_step": 62427, "epoch": 752} {"train_loss": -20.390888214111328, "global_step": 62428, "epoch": 752} {"train_loss": -20.153167724609375, "global_step": 62429, "epoch": 752} {"train_loss": -20.50934410095215, "global_step": 62430, "epoch": 752} {"train_loss": -20.143165588378906, "global_step": 62431, "epoch": 752} {"train_loss": -20.53433609008789, "global_step": 62432, "epoch": 752} {"train_loss": -20.32650375366211, "global_step": 62433, "epoch": 752} {"train_loss": -20.198171615600586, "global_step": 62434, "epoch": 752} {"train_loss": -20.486021041870117, "global_step": 62435, "epoch": 752} {"train_loss": -20.64727783203125, "global_step": 62436, "epoch": 752} {"train_loss": -20.748428344726562, "global_step": 62437, "epoch": 752} {"train_loss": -20.750324249267578, "global_step": 62438, "epoch": 752} {"train_loss": -20.56324577331543, "global_step": 62439, "epoch": 752} {"train_loss": -21.07331085205078, "global_step": 62440, "epoch": 752} {"train_loss": -20.63545799255371, "global_step": 62441, "epoch": 752} {"train_loss": -20.208703994750977, "global_step": 62442, "epoch": 752} {"train_loss": -20.70464515686035, "global_step": 62443, "epoch": 752} {"train_loss": -20.45513153076172, "global_step": 62444, "epoch": 752} {"train_loss": -20.495868682861328, "global_step": 62445, "epoch": 752} {"train_loss": -20.175708770751953, "global_step": 62446, "epoch": 752} {"train_loss": -20.683168411254883, "global_step": 62447, "epoch": 752} {"train_loss": -20.42093849182129, "global_step": 62448, "epoch": 752} {"train_loss": -20.969112396240234, "global_step": 62449, "epoch": 752} {"train_loss": -20.801788330078125, "global_step": 62450, "epoch": 752} {"train_loss": -20.634016036987305, "global_step": 62451, "epoch": 752} {"train_loss": -20.70318603515625, "global_step": 62452, "epoch": 752} {"train_loss": -20.44087028503418, "global_step": 62453, "epoch": 752} {"train_loss": -20.85344886779785, "global_step": 62454, "epoch": 752} {"train_loss": -20.71073341369629, "global_step": 62455, "epoch": 752} {"train_loss": -20.572885513305664, "global_step": 62456, "epoch": 752} {"train_loss": -20.66357421875, "global_step": 62457, "epoch": 752} {"train_loss": -20.470407485961914, "global_step": 62458, "epoch": 752} {"train_loss": -20.426029205322266, "global_step": 62459, "epoch": 752} {"train_loss": -20.632266998291016, "global_step": 62460, "epoch": 752} {"train_loss": -20.31519889831543, "global_step": 62461, "epoch": 752} {"train_loss": -20.401283264160156, "global_step": 62462, "epoch": 752} {"train_loss": -20.58932876586914, "global_step": 62463, "epoch": 752} {"train_loss": -20.257272720336914, "global_step": 62464, "epoch": 752} {"train_loss": -20.448604583740234, "global_step": 62465, "epoch": 752} {"train_loss": -20.626920700073242, "global_step": 62466, "epoch": 752} {"train_loss": -20.720699310302734, "global_step": 62467, "epoch": 752} {"train_loss": -20.741504669189453, "global_step": 62468, "epoch": 752} {"train_loss": -20.613622665405273, "global_step": 62469, "epoch": 752} {"train_loss": -20.19724464416504, "global_step": 62470, "epoch": 752} {"train_loss": -20.316085815429688, "global_step": 62471, "epoch": 752} {"train_loss": -20.567296981811523, "global_step": 62472, "epoch": 752} {"train_loss": -20.37877082824707, "global_step": 62473, "epoch": 752} {"train_loss": -20.517667770385742, "global_step": 62474, "epoch": 752} {"train_loss": -20.5288143157959, "global_step": 62475, "epoch": 752} {"train_loss": -20.383825302124023, "global_step": 62476, "epoch": 752} {"train_loss": -20.500146865844727, "global_step": 62477, "epoch": 752} {"train_loss": -20.567506790161133, "global_step": 62478, "epoch": 752} {"train_loss": -20.53662872314453, "global_step": 62479, "epoch": 752} {"train_loss": -20.57283592224121, "global_step": 62480, "epoch": 752} {"train_loss": -20.45075798034668, "global_step": 62481, "epoch": 752} {"train_loss": -20.386390686035156, "global_step": 62482, "epoch": 752} {"train_loss": -20.571292877197266, "global_step": 62483, "epoch": 752} {"train_loss": -20.254638671875, "global_step": 62484, "epoch": 752} {"train_loss": -20.361759185791016, "global_step": 62485, "epoch": 752} {"train_loss": -20.55756187438965, "global_step": 62486, "epoch": 752} {"train_loss": -20.700809478759766, "global_step": 62487, "epoch": 752} {"train_loss": -20.809579849243164, "global_step": 62488, "epoch": 752} {"train_loss": -20.611194610595703, "global_step": 62489, "epoch": 752} {"train_loss": -20.843305587768555, "global_step": 62490, "epoch": 752} {"train_loss": -20.289602279663086, "global_step": 62491, "epoch": 752} {"train_loss": -20.0587215423584, "global_step": 62492, "epoch": 752} {"train_loss": -20.619516372680664, "global_step": 62493, "epoch": 752} {"train_loss": -20.778379440307617, "global_step": 62494, "epoch": 752} {"train_loss": -19.969982147216797, "global_step": 62495, "epoch": 752} {"train_loss": -20.585094451904297, "global_step": 62496, "epoch": 752} {"train_loss": -20.563467025756836, "global_step": 62497, "epoch": 752} {"train_loss": -20.491787898971374, "global_step": 62498, "epoch": 752, "val_loss": 5825801.5} {"train_loss": -20.44278907775879, "global_step": 62499, "epoch": 753} {"train_loss": -20.072858810424805, "global_step": 62500, "epoch": 753} {"train_loss": -20.441089630126953, "global_step": 62501, "epoch": 753} {"train_loss": -20.530929565429688, "global_step": 62502, "epoch": 753} {"train_loss": -20.40566062927246, "global_step": 62503, "epoch": 753} {"train_loss": -20.415220260620117, "global_step": 62504, "epoch": 753} {"train_loss": -20.120786666870117, "global_step": 62505, "epoch": 753} {"train_loss": -19.91261100769043, "global_step": 62506, "epoch": 753} {"train_loss": -20.48329734802246, "global_step": 62507, "epoch": 753} {"train_loss": -20.371509552001953, "global_step": 62508, "epoch": 753} {"train_loss": -20.357648849487305, "global_step": 62509, "epoch": 753} {"train_loss": -20.285547256469727, "global_step": 62510, "epoch": 753} {"train_loss": -20.527755737304688, "global_step": 62511, "epoch": 753} {"train_loss": -20.6322021484375, "global_step": 62512, "epoch": 753} {"train_loss": -20.60902976989746, "global_step": 62513, "epoch": 753} {"train_loss": -19.803688049316406, "global_step": 62514, "epoch": 753} {"train_loss": -20.454160690307617, "global_step": 62515, "epoch": 753} {"train_loss": -20.257415771484375, "global_step": 62516, "epoch": 753} {"train_loss": -20.127405166625977, "global_step": 62517, "epoch": 753} {"train_loss": -20.659957885742188, "global_step": 62518, "epoch": 753} {"train_loss": -20.421262741088867, "global_step": 62519, "epoch": 753} {"train_loss": -20.42002296447754, "global_step": 62520, "epoch": 753} {"train_loss": -20.268817901611328, "global_step": 62521, "epoch": 753} {"train_loss": -20.414119720458984, "global_step": 62522, "epoch": 753} {"train_loss": -20.54022789001465, "global_step": 62523, "epoch": 753} {"train_loss": -20.162622451782227, "global_step": 62524, "epoch": 753} {"train_loss": -20.200681686401367, "global_step": 62525, "epoch": 753} {"train_loss": -20.72666358947754, "global_step": 62526, "epoch": 753} {"train_loss": -20.303760528564453, "global_step": 62527, "epoch": 753} {"train_loss": -20.57065773010254, "global_step": 62528, "epoch": 753} {"train_loss": -20.586090087890625, "global_step": 62529, "epoch": 753} {"train_loss": -20.08747100830078, "global_step": 62530, "epoch": 753} {"train_loss": -20.698970794677734, "global_step": 62531, "epoch": 753} {"train_loss": -20.225528717041016, "global_step": 62532, "epoch": 753} {"train_loss": -20.62727928161621, "global_step": 62533, "epoch": 753} {"train_loss": -20.498849868774414, "global_step": 62534, "epoch": 753} {"train_loss": -20.742034912109375, "global_step": 62535, "epoch": 753} {"train_loss": -20.573776245117188, "global_step": 62536, "epoch": 753} {"train_loss": -20.054866790771484, "global_step": 62537, "epoch": 753} {"train_loss": -20.354389190673828, "global_step": 62538, "epoch": 753} {"train_loss": -20.20713233947754, "global_step": 62539, "epoch": 753} {"train_loss": -20.413358688354492, "global_step": 62540, "epoch": 753} {"train_loss": -20.262168884277344, "global_step": 62541, "epoch": 753} {"train_loss": -20.559001922607422, "global_step": 62542, "epoch": 753} {"train_loss": -20.564496994018555, "global_step": 62543, "epoch": 753} {"train_loss": -20.575349807739258, "global_step": 62544, "epoch": 753} {"train_loss": -20.653186798095703, "global_step": 62545, "epoch": 753} {"train_loss": -20.720901489257812, "global_step": 62546, "epoch": 753} {"train_loss": -20.500986099243164, "global_step": 62547, "epoch": 753} {"train_loss": -20.73110008239746, "global_step": 62548, "epoch": 753} {"train_loss": -20.548864364624023, "global_step": 62549, "epoch": 753} {"train_loss": -20.537616729736328, "global_step": 62550, "epoch": 753} {"train_loss": -20.590559005737305, "global_step": 62551, "epoch": 753} {"train_loss": -20.26873207092285, "global_step": 62552, "epoch": 753} {"train_loss": -20.288597106933594, "global_step": 62553, "epoch": 753} {"train_loss": -20.795621871948242, "global_step": 62554, "epoch": 753} {"train_loss": -20.382606506347656, "global_step": 62555, "epoch": 753} {"train_loss": -20.59889030456543, "global_step": 62556, "epoch": 753} {"train_loss": -20.44939613342285, "global_step": 62557, "epoch": 753} {"train_loss": -20.137351989746094, "global_step": 62558, "epoch": 753} {"train_loss": -20.62302589416504, "global_step": 62559, "epoch": 753} {"train_loss": -20.90064811706543, "global_step": 62560, "epoch": 753} {"train_loss": -20.501296997070312, "global_step": 62561, "epoch": 753} {"train_loss": -20.634607315063477, "global_step": 62562, "epoch": 753} {"train_loss": -20.156068801879883, "global_step": 62563, "epoch": 753} {"train_loss": -20.568593978881836, "global_step": 62564, "epoch": 753} {"train_loss": -20.339584350585938, "global_step": 62565, "epoch": 753} {"train_loss": -20.595487594604492, "global_step": 62566, "epoch": 753} {"train_loss": -20.268388748168945, "global_step": 62567, "epoch": 753} {"train_loss": -20.677288055419922, "global_step": 62568, "epoch": 753} {"train_loss": -20.591611862182617, "global_step": 62569, "epoch": 753} {"train_loss": -20.47800064086914, "global_step": 62570, "epoch": 753} {"train_loss": -20.54343032836914, "global_step": 62571, "epoch": 753} {"train_loss": -20.36844253540039, "global_step": 62572, "epoch": 753} {"train_loss": -20.566545486450195, "global_step": 62573, "epoch": 753} {"train_loss": -20.18610954284668, "global_step": 62574, "epoch": 753} {"train_loss": -20.62698745727539, "global_step": 62575, "epoch": 753} {"train_loss": -20.375152587890625, "global_step": 62576, "epoch": 753} {"train_loss": -20.46149444580078, "global_step": 62577, "epoch": 753} {"train_loss": -20.37491798400879, "global_step": 62578, "epoch": 753} {"train_loss": -20.506881713867188, "global_step": 62579, "epoch": 753} {"train_loss": -20.73093032836914, "global_step": 62580, "epoch": 753} {"train_loss": -20.453391753047345, "global_step": 62581, "epoch": 753, "val_loss": 5973598.5} {"train_loss": -20.248014450073242, "global_step": 62582, "epoch": 754} {"train_loss": -20.422473907470703, "global_step": 62583, "epoch": 754} {"train_loss": -20.3634033203125, "global_step": 62584, "epoch": 754} {"train_loss": -20.6020565032959, "global_step": 62585, "epoch": 754} {"train_loss": -20.299701690673828, "global_step": 62586, "epoch": 754} {"train_loss": -20.66261863708496, "global_step": 62587, "epoch": 754} {"train_loss": -20.40183448791504, "global_step": 62588, "epoch": 754} {"train_loss": -20.3413143157959, "global_step": 62589, "epoch": 754} {"train_loss": -20.192964553833008, "global_step": 62590, "epoch": 754} {"train_loss": -20.441442489624023, "global_step": 62591, "epoch": 754} {"train_loss": -20.43815803527832, "global_step": 62592, "epoch": 754} {"train_loss": -20.793867111206055, "global_step": 62593, "epoch": 754} {"train_loss": -20.446884155273438, "global_step": 62594, "epoch": 754} {"train_loss": -20.293062210083008, "global_step": 62595, "epoch": 754} {"train_loss": -20.218700408935547, "global_step": 62596, "epoch": 754} {"train_loss": -20.24268913269043, "global_step": 62597, "epoch": 754} {"train_loss": -20.60346794128418, "global_step": 62598, "epoch": 754} {"train_loss": -20.425012588500977, "global_step": 62599, "epoch": 754} {"train_loss": -20.373027801513672, "global_step": 62600, "epoch": 754} {"train_loss": -20.661954879760742, "global_step": 62601, "epoch": 754} {"train_loss": -20.184431076049805, "global_step": 62602, "epoch": 754} {"train_loss": -21.03272247314453, "global_step": 62603, "epoch": 754} {"train_loss": -20.774932861328125, "global_step": 62604, "epoch": 754} {"train_loss": -20.528959274291992, "global_step": 62605, "epoch": 754} {"train_loss": -20.29922866821289, "global_step": 62606, "epoch": 754} {"train_loss": -20.314680099487305, "global_step": 62607, "epoch": 754} {"train_loss": -20.795433044433594, "global_step": 62608, "epoch": 754} {"train_loss": -20.693328857421875, "global_step": 62609, "epoch": 754} {"train_loss": -20.26880645751953, "global_step": 62610, "epoch": 754} {"train_loss": -20.199251174926758, "global_step": 62611, "epoch": 754} {"train_loss": -20.306379318237305, "global_step": 62612, "epoch": 754} {"train_loss": -20.759967803955078, "global_step": 62613, "epoch": 754} {"train_loss": -20.820972442626953, "global_step": 62614, "epoch": 754} {"train_loss": -20.161039352416992, "global_step": 62615, "epoch": 754} {"train_loss": -20.80141258239746, "global_step": 62616, "epoch": 754} {"train_loss": -20.461647033691406, "global_step": 62617, "epoch": 754} {"train_loss": -20.48975944519043, "global_step": 62618, "epoch": 754} {"train_loss": -20.401456832885742, "global_step": 62619, "epoch": 754} {"train_loss": -20.348968505859375, "global_step": 62620, "epoch": 754} {"train_loss": -20.572324752807617, "global_step": 62621, "epoch": 754} {"train_loss": -20.505613327026367, "global_step": 62622, "epoch": 754} {"train_loss": -20.565353393554688, "global_step": 62623, "epoch": 754} {"train_loss": -20.495319366455078, "global_step": 62624, "epoch": 754} {"train_loss": -20.594741821289062, "global_step": 62625, "epoch": 754} {"train_loss": -20.530807495117188, "global_step": 62626, "epoch": 754} {"train_loss": -20.321332931518555, "global_step": 62627, "epoch": 754} {"train_loss": -20.445457458496094, "global_step": 62628, "epoch": 754} {"train_loss": -20.69887351989746, "global_step": 62629, "epoch": 754} {"train_loss": -20.455474853515625, "global_step": 62630, "epoch": 754} {"train_loss": -20.2730712890625, "global_step": 62631, "epoch": 754} {"train_loss": -20.5686092376709, "global_step": 62632, "epoch": 754} {"train_loss": -20.669469833374023, "global_step": 62633, "epoch": 754} {"train_loss": -20.52988624572754, "global_step": 62634, "epoch": 754} {"train_loss": -20.758569717407227, "global_step": 62635, "epoch": 754} {"train_loss": -20.63404655456543, "global_step": 62636, "epoch": 754} {"train_loss": -20.476964950561523, "global_step": 62637, "epoch": 754} {"train_loss": -20.43255043029785, "global_step": 62638, "epoch": 754} {"train_loss": -20.66203498840332, "global_step": 62639, "epoch": 754} {"train_loss": -20.189064025878906, "global_step": 62640, "epoch": 754} {"train_loss": -20.71742820739746, "global_step": 62641, "epoch": 754} {"train_loss": -20.35877799987793, "global_step": 62642, "epoch": 754} {"train_loss": -20.501768112182617, "global_step": 62643, "epoch": 754} {"train_loss": -20.573379516601562, "global_step": 62644, "epoch": 754} {"train_loss": -20.204172134399414, "global_step": 62645, "epoch": 754} {"train_loss": -20.600330352783203, "global_step": 62646, "epoch": 754} {"train_loss": -20.14227867126465, "global_step": 62647, "epoch": 754} {"train_loss": -19.974760055541992, "global_step": 62648, "epoch": 754} {"train_loss": -20.059606552124023, "global_step": 62649, "epoch": 754} {"train_loss": -20.676488876342773, "global_step": 62650, "epoch": 754} {"train_loss": -20.3316707611084, "global_step": 62651, "epoch": 754} {"train_loss": -20.833890914916992, "global_step": 62652, "epoch": 754} {"train_loss": -20.762155532836914, "global_step": 62653, "epoch": 754} {"train_loss": -20.39727020263672, "global_step": 62654, "epoch": 754} {"train_loss": -20.467906951904297, "global_step": 62655, "epoch": 754} {"train_loss": -20.34566879272461, "global_step": 62656, "epoch": 754} {"train_loss": -20.38731575012207, "global_step": 62657, "epoch": 754} {"train_loss": -20.748708724975586, "global_step": 62658, "epoch": 754} {"train_loss": -20.63163185119629, "global_step": 62659, "epoch": 754} {"train_loss": -20.50774574279785, "global_step": 62660, "epoch": 754} {"train_loss": -20.619911193847656, "global_step": 62661, "epoch": 754} {"train_loss": -20.733415603637695, "global_step": 62662, "epoch": 754} {"train_loss": -20.212839126586914, "global_step": 62663, "epoch": 754} {"train_loss": -20.48163627716432, "global_step": 62664, "epoch": 754, "val_loss": 6049691.0} {"train_loss": -20.02565574645996, "global_step": 62665, "epoch": 755} {"train_loss": -19.969257354736328, "global_step": 62666, "epoch": 755} {"train_loss": -19.946626663208008, "global_step": 62667, "epoch": 755} {"train_loss": -19.998342514038086, "global_step": 62668, "epoch": 755} {"train_loss": -19.992626190185547, "global_step": 62669, "epoch": 755} {"train_loss": -20.260562896728516, "global_step": 62670, "epoch": 755} {"train_loss": -20.412553787231445, "global_step": 62671, "epoch": 755} {"train_loss": -20.12945556640625, "global_step": 62672, "epoch": 755} {"train_loss": -20.124359130859375, "global_step": 62673, "epoch": 755} {"train_loss": -20.50093650817871, "global_step": 62674, "epoch": 755} {"train_loss": -20.130138397216797, "global_step": 62675, "epoch": 755} {"train_loss": -20.2340087890625, "global_step": 62676, "epoch": 755} {"train_loss": -19.994632720947266, "global_step": 62677, "epoch": 755} {"train_loss": -20.404998779296875, "global_step": 62678, "epoch": 755} {"train_loss": -20.223175048828125, "global_step": 62679, "epoch": 755} {"train_loss": -20.29895782470703, "global_step": 62680, "epoch": 755} {"train_loss": -20.388690948486328, "global_step": 62681, "epoch": 755} {"train_loss": -19.96274757385254, "global_step": 62682, "epoch": 755} {"train_loss": -20.453977584838867, "global_step": 62683, "epoch": 755} {"train_loss": -20.396224975585938, "global_step": 62684, "epoch": 755} {"train_loss": -20.250364303588867, "global_step": 62685, "epoch": 755} {"train_loss": -20.659093856811523, "global_step": 62686, "epoch": 755} {"train_loss": -20.17654800415039, "global_step": 62687, "epoch": 755} {"train_loss": -20.79198455810547, "global_step": 62688, "epoch": 755} {"train_loss": -20.375402450561523, "global_step": 62689, "epoch": 755} {"train_loss": -19.919614791870117, "global_step": 62690, "epoch": 755} {"train_loss": -20.52471351623535, "global_step": 62691, "epoch": 755} {"train_loss": -20.491724014282227, "global_step": 62692, "epoch": 755} {"train_loss": -20.647001266479492, "global_step": 62693, "epoch": 755} {"train_loss": -20.133195877075195, "global_step": 62694, "epoch": 755} {"train_loss": -20.71091651916504, "global_step": 62695, "epoch": 755} {"train_loss": -20.131099700927734, "global_step": 62696, "epoch": 755} {"train_loss": -20.758502960205078, "global_step": 62697, "epoch": 755} {"train_loss": -20.81597900390625, "global_step": 62698, "epoch": 755} {"train_loss": -20.611631393432617, "global_step": 62699, "epoch": 755} {"train_loss": -20.444217681884766, "global_step": 62700, "epoch": 755} {"train_loss": -19.969579696655273, "global_step": 62701, "epoch": 755} {"train_loss": -20.4956111907959, "global_step": 62702, "epoch": 755} {"train_loss": -20.4977970123291, "global_step": 62703, "epoch": 755} {"train_loss": -20.184057235717773, "global_step": 62704, "epoch": 755} {"train_loss": -20.087284088134766, "global_step": 62705, "epoch": 755} {"train_loss": -20.30586814880371, "global_step": 62706, "epoch": 755} {"train_loss": -20.537967681884766, "global_step": 62707, "epoch": 755} {"train_loss": -20.331668853759766, "global_step": 62708, "epoch": 755} {"train_loss": -20.728710174560547, "global_step": 62709, "epoch": 755} {"train_loss": -20.50304412841797, "global_step": 62710, "epoch": 755} {"train_loss": -20.40006446838379, "global_step": 62711, "epoch": 755} {"train_loss": -20.82012939453125, "global_step": 62712, "epoch": 755} {"train_loss": -20.6180362701416, "global_step": 62713, "epoch": 755} {"train_loss": -20.677967071533203, "global_step": 62714, "epoch": 755} {"train_loss": -20.694509506225586, "global_step": 62715, "epoch": 755} {"train_loss": -20.554611206054688, "global_step": 62716, "epoch": 755} {"train_loss": -20.07635498046875, "global_step": 62717, "epoch": 755} {"train_loss": -20.531160354614258, "global_step": 62718, "epoch": 755} {"train_loss": -20.87877655029297, "global_step": 62719, "epoch": 755} {"train_loss": -20.927921295166016, "global_step": 62720, "epoch": 755} {"train_loss": -20.77271842956543, "global_step": 62721, "epoch": 755} {"train_loss": -20.748781204223633, "global_step": 62722, "epoch": 755} {"train_loss": -20.567014694213867, "global_step": 62723, "epoch": 755} {"train_loss": -20.466632843017578, "global_step": 62724, "epoch": 755} {"train_loss": -21.09026527404785, "global_step": 62725, "epoch": 755} {"train_loss": -20.036977767944336, "global_step": 62726, "epoch": 755} {"train_loss": -20.475561141967773, "global_step": 62727, "epoch": 755} {"train_loss": -20.550888061523438, "global_step": 62728, "epoch": 755} {"train_loss": -20.58481788635254, "global_step": 62729, "epoch": 755} {"train_loss": -20.781064987182617, "global_step": 62730, "epoch": 755} {"train_loss": -21.083829879760742, "global_step": 62731, "epoch": 755} {"train_loss": -20.409772872924805, "global_step": 62732, "epoch": 755} {"train_loss": -20.70704460144043, "global_step": 62733, "epoch": 755} {"train_loss": -20.466644287109375, "global_step": 62734, "epoch": 755} {"train_loss": -20.4879093170166, "global_step": 62735, "epoch": 755} {"train_loss": -20.412946701049805, "global_step": 62736, "epoch": 755} {"train_loss": -20.8675479888916, "global_step": 62737, "epoch": 755} {"train_loss": -20.74605369567871, "global_step": 62738, "epoch": 755} {"train_loss": -20.886999130249023, "global_step": 62739, "epoch": 755} {"train_loss": -20.522857666015625, "global_step": 62740, "epoch": 755} {"train_loss": -20.49449920654297, "global_step": 62741, "epoch": 755} {"train_loss": -20.454282760620117, "global_step": 62742, "epoch": 755} {"train_loss": -20.814420700073242, "global_step": 62743, "epoch": 755} {"train_loss": -20.830175399780273, "global_step": 62744, "epoch": 755} {"train_loss": -20.532886505126953, "global_step": 62745, "epoch": 755} {"train_loss": -20.334224700927734, "global_step": 62746, "epoch": 755} {"train_loss": -20.440257152879095, "global_step": 62747, "epoch": 755, "val_loss": 6144201.0} {"train_loss": -20.28983497619629, "global_step": 62748, "epoch": 756} {"train_loss": -20.233930587768555, "global_step": 62749, "epoch": 756} {"train_loss": -20.3326473236084, "global_step": 62750, "epoch": 756} {"train_loss": -20.481306076049805, "global_step": 62751, "epoch": 756} {"train_loss": -20.319116592407227, "global_step": 62752, "epoch": 756} {"train_loss": -20.649497985839844, "global_step": 62753, "epoch": 756} {"train_loss": -20.651023864746094, "global_step": 62754, "epoch": 756} {"train_loss": -20.45340919494629, "global_step": 62755, "epoch": 756} {"train_loss": -20.110013961791992, "global_step": 62756, "epoch": 756} {"train_loss": -20.398046493530273, "global_step": 62757, "epoch": 756} {"train_loss": -20.155797958374023, "global_step": 62758, "epoch": 756} {"train_loss": -20.522489547729492, "global_step": 62759, "epoch": 756} {"train_loss": -20.573633193969727, "global_step": 62760, "epoch": 756} {"train_loss": -20.093997955322266, "global_step": 62761, "epoch": 756} {"train_loss": -20.699636459350586, "global_step": 62762, "epoch": 756} {"train_loss": -20.234045028686523, "global_step": 62763, "epoch": 756} {"train_loss": -20.278533935546875, "global_step": 62764, "epoch": 756} {"train_loss": -20.25080680847168, "global_step": 62765, "epoch": 756} {"train_loss": -20.469167709350586, "global_step": 62766, "epoch": 756} {"train_loss": -20.510456085205078, "global_step": 62767, "epoch": 756} {"train_loss": -20.44561767578125, "global_step": 62768, "epoch": 756} {"train_loss": -20.6584529876709, "global_step": 62769, "epoch": 756} {"train_loss": -20.731735229492188, "global_step": 62770, "epoch": 756} {"train_loss": -20.70154571533203, "global_step": 62771, "epoch": 756} {"train_loss": -19.87958335876465, "global_step": 62772, "epoch": 756} {"train_loss": -20.404905319213867, "global_step": 62773, "epoch": 756} {"train_loss": -20.376310348510742, "global_step": 62774, "epoch": 756} {"train_loss": -20.24207878112793, "global_step": 62775, "epoch": 756} {"train_loss": -20.370208740234375, "global_step": 62776, "epoch": 756} {"train_loss": -20.740034103393555, "global_step": 62777, "epoch": 756} {"train_loss": -20.585952758789062, "global_step": 62778, "epoch": 756} {"train_loss": -20.241849899291992, "global_step": 62779, "epoch": 756} {"train_loss": -20.774381637573242, "global_step": 62780, "epoch": 756} {"train_loss": -20.375812530517578, "global_step": 62781, "epoch": 756} {"train_loss": -20.376388549804688, "global_step": 62782, "epoch": 756} {"train_loss": -20.437265396118164, "global_step": 62783, "epoch": 756} {"train_loss": -20.59967613220215, "global_step": 62784, "epoch": 756} {"train_loss": -20.50063705444336, "global_step": 62785, "epoch": 756} {"train_loss": -20.649932861328125, "global_step": 62786, "epoch": 756} {"train_loss": -20.80389976501465, "global_step": 62787, "epoch": 756} {"train_loss": -20.55695915222168, "global_step": 62788, "epoch": 756} {"train_loss": -20.5871524810791, "global_step": 62789, "epoch": 756} {"train_loss": -20.761117935180664, "global_step": 62790, "epoch": 756} {"train_loss": -20.40667724609375, "global_step": 62791, "epoch": 756} {"train_loss": -20.8145751953125, "global_step": 62792, "epoch": 756} {"train_loss": -20.232877731323242, "global_step": 62793, "epoch": 756} {"train_loss": -20.558195114135742, "global_step": 62794, "epoch": 756} {"train_loss": -20.53781509399414, "global_step": 62795, "epoch": 756} {"train_loss": -20.812517166137695, "global_step": 62796, "epoch": 756} {"train_loss": -20.603696823120117, "global_step": 62797, "epoch": 756} {"train_loss": -20.443622589111328, "global_step": 62798, "epoch": 756} {"train_loss": -20.53615951538086, "global_step": 62799, "epoch": 756} {"train_loss": -20.823043823242188, "global_step": 62800, "epoch": 756} {"train_loss": -20.312213897705078, "global_step": 62801, "epoch": 756} {"train_loss": -20.555084228515625, "global_step": 62802, "epoch": 756} {"train_loss": -20.668067932128906, "global_step": 62803, "epoch": 756} {"train_loss": -20.35334587097168, "global_step": 62804, "epoch": 756} {"train_loss": -20.838680267333984, "global_step": 62805, "epoch": 756} {"train_loss": -20.60633659362793, "global_step": 62806, "epoch": 756} {"train_loss": -20.626800537109375, "global_step": 62807, "epoch": 756} {"train_loss": -20.72637176513672, "global_step": 62808, "epoch": 756} {"train_loss": -20.55908966064453, "global_step": 62809, "epoch": 756} {"train_loss": -20.45009422302246, "global_step": 62810, "epoch": 756} {"train_loss": -20.47857093811035, "global_step": 62811, "epoch": 756} {"train_loss": -20.47456932067871, "global_step": 62812, "epoch": 756} {"train_loss": -20.479663848876953, "global_step": 62813, "epoch": 756} {"train_loss": -20.68815803527832, "global_step": 62814, "epoch": 756} {"train_loss": -20.730161666870117, "global_step": 62815, "epoch": 756} {"train_loss": -20.471704483032227, "global_step": 62816, "epoch": 756} {"train_loss": -20.248960494995117, "global_step": 62817, "epoch": 756} {"train_loss": -20.741878509521484, "global_step": 62818, "epoch": 756} {"train_loss": -20.58338737487793, "global_step": 62819, "epoch": 756} {"train_loss": -20.72819709777832, "global_step": 62820, "epoch": 756} {"train_loss": -20.700454711914062, "global_step": 62821, "epoch": 756} {"train_loss": -20.607925415039062, "global_step": 62822, "epoch": 756} {"train_loss": -20.70857810974121, "global_step": 62823, "epoch": 756} {"train_loss": -20.373533248901367, "global_step": 62824, "epoch": 756} {"train_loss": -20.370798110961914, "global_step": 62825, "epoch": 756} {"train_loss": -20.375141143798828, "global_step": 62826, "epoch": 756} {"train_loss": -20.41473960876465, "global_step": 62827, "epoch": 756} {"train_loss": -20.33700942993164, "global_step": 62828, "epoch": 756} {"train_loss": -20.580896377563477, "global_step": 62829, "epoch": 756} {"train_loss": -20.49671487923128, "global_step": 62830, "epoch": 756, "val_loss": 5983991.5} {"train_loss": -20.43007469177246, "global_step": 62831, "epoch": 757} {"train_loss": -19.89226722717285, "global_step": 62832, "epoch": 757} {"train_loss": -20.560754776000977, "global_step": 62833, "epoch": 757} {"train_loss": -20.485931396484375, "global_step": 62834, "epoch": 757} {"train_loss": -19.845417022705078, "global_step": 62835, "epoch": 757} {"train_loss": -20.37769317626953, "global_step": 62836, "epoch": 757} {"train_loss": -19.88429832458496, "global_step": 62837, "epoch": 757} {"train_loss": -20.3182430267334, "global_step": 62838, "epoch": 757} {"train_loss": -19.863203048706055, "global_step": 62839, "epoch": 757} {"train_loss": -20.368337631225586, "global_step": 62840, "epoch": 757} {"train_loss": -20.193368911743164, "global_step": 62841, "epoch": 757} {"train_loss": -20.29701042175293, "global_step": 62842, "epoch": 757} {"train_loss": -20.14241600036621, "global_step": 62843, "epoch": 757} {"train_loss": -20.79956817626953, "global_step": 62844, "epoch": 757} {"train_loss": -20.432039260864258, "global_step": 62845, "epoch": 757} {"train_loss": -19.939329147338867, "global_step": 62846, "epoch": 757} {"train_loss": -20.26535415649414, "global_step": 62847, "epoch": 757} {"train_loss": -20.763532638549805, "global_step": 62848, "epoch": 757} {"train_loss": -20.97432518005371, "global_step": 62849, "epoch": 757} {"train_loss": -20.682449340820312, "global_step": 62850, "epoch": 757} {"train_loss": -20.14679527282715, "global_step": 62851, "epoch": 757} {"train_loss": -20.341638565063477, "global_step": 62852, "epoch": 757} {"train_loss": -20.446435928344727, "global_step": 62853, "epoch": 757} {"train_loss": -20.40581512451172, "global_step": 62854, "epoch": 757} {"train_loss": -20.44556999206543, "global_step": 62855, "epoch": 757} {"train_loss": -20.354551315307617, "global_step": 62856, "epoch": 757} {"train_loss": -20.428586959838867, "global_step": 62857, "epoch": 757} {"train_loss": -20.58211326599121, "global_step": 62858, "epoch": 757} {"train_loss": -20.537538528442383, "global_step": 62859, "epoch": 757} {"train_loss": -20.394519805908203, "global_step": 62860, "epoch": 757} {"train_loss": -20.822484970092773, "global_step": 62861, "epoch": 757} {"train_loss": -20.58364486694336, "global_step": 62862, "epoch": 757} {"train_loss": -20.410858154296875, "global_step": 62863, "epoch": 757} {"train_loss": -20.521686553955078, "global_step": 62864, "epoch": 757} {"train_loss": -20.48606300354004, "global_step": 62865, "epoch": 757} {"train_loss": -20.14626121520996, "global_step": 62866, "epoch": 757} {"train_loss": -20.487361907958984, "global_step": 62867, "epoch": 757} {"train_loss": -20.732879638671875, "global_step": 62868, "epoch": 757} {"train_loss": -20.434804916381836, "global_step": 62869, "epoch": 757} {"train_loss": -20.41873550415039, "global_step": 62870, "epoch": 757} {"train_loss": -20.445419311523438, "global_step": 62871, "epoch": 757} {"train_loss": -20.514299392700195, "global_step": 62872, "epoch": 757} {"train_loss": -20.19769859313965, "global_step": 62873, "epoch": 757} {"train_loss": -20.502685546875, "global_step": 62874, "epoch": 757} {"train_loss": -20.28200340270996, "global_step": 62875, "epoch": 757} {"train_loss": -20.873369216918945, "global_step": 62876, "epoch": 757} {"train_loss": -20.7224178314209, "global_step": 62877, "epoch": 757} {"train_loss": -20.149520874023438, "global_step": 62878, "epoch": 757} {"train_loss": -20.65609359741211, "global_step": 62879, "epoch": 757} {"train_loss": -20.472991943359375, "global_step": 62880, "epoch": 757} {"train_loss": -20.276914596557617, "global_step": 62881, "epoch": 757} {"train_loss": -20.585708618164062, "global_step": 62882, "epoch": 757} {"train_loss": -20.637414932250977, "global_step": 62883, "epoch": 757} {"train_loss": -20.275943756103516, "global_step": 62884, "epoch": 757} {"train_loss": -20.40131950378418, "global_step": 62885, "epoch": 757} {"train_loss": -20.488113403320312, "global_step": 62886, "epoch": 757} {"train_loss": -20.45552635192871, "global_step": 62887, "epoch": 757} {"train_loss": -20.471813201904297, "global_step": 62888, "epoch": 757} {"train_loss": -20.576597213745117, "global_step": 62889, "epoch": 757} {"train_loss": -20.7726993560791, "global_step": 62890, "epoch": 757} {"train_loss": -20.837783813476562, "global_step": 62891, "epoch": 757} {"train_loss": -20.891706466674805, "global_step": 62892, "epoch": 757} {"train_loss": -20.925451278686523, "global_step": 62893, "epoch": 757} {"train_loss": -20.520437240600586, "global_step": 62894, "epoch": 757} {"train_loss": -20.545623779296875, "global_step": 62895, "epoch": 757} {"train_loss": -20.510562896728516, "global_step": 62896, "epoch": 757} {"train_loss": -20.97097396850586, "global_step": 62897, "epoch": 757} {"train_loss": -20.53925895690918, "global_step": 62898, "epoch": 757} {"train_loss": -20.72150993347168, "global_step": 62899, "epoch": 757} {"train_loss": -21.03937530517578, "global_step": 62900, "epoch": 757} {"train_loss": -20.97215461730957, "global_step": 62901, "epoch": 757} {"train_loss": -20.435583114624023, "global_step": 62902, "epoch": 757} {"train_loss": -20.621824264526367, "global_step": 62903, "epoch": 757} {"train_loss": -20.470916748046875, "global_step": 62904, "epoch": 757} {"train_loss": -20.28841209411621, "global_step": 62905, "epoch": 757} {"train_loss": -20.39834213256836, "global_step": 62906, "epoch": 757} {"train_loss": -20.68610191345215, "global_step": 62907, "epoch": 757} {"train_loss": -20.566492080688477, "global_step": 62908, "epoch": 757} {"train_loss": -20.597248077392578, "global_step": 62909, "epoch": 757} {"train_loss": -20.67934226989746, "global_step": 62910, "epoch": 757} {"train_loss": -20.434762954711914, "global_step": 62911, "epoch": 757} {"train_loss": -20.80426597595215, "global_step": 62912, "epoch": 757} {"train_loss": -20.476527800042945, "global_step": 62913, "epoch": 757, "val_loss": 6046915.5} {"train_loss": -19.807756423950195, "global_step": 62914, "epoch": 758} {"train_loss": -20.45107078552246, "global_step": 62915, "epoch": 758} {"train_loss": -19.7976131439209, "global_step": 62916, "epoch": 758} {"train_loss": -19.950668334960938, "global_step": 62917, "epoch": 758} {"train_loss": -20.137908935546875, "global_step": 62918, "epoch": 758} {"train_loss": -20.494810104370117, "global_step": 62919, "epoch": 758} {"train_loss": -20.41834831237793, "global_step": 62920, "epoch": 758} {"train_loss": -20.18659019470215, "global_step": 62921, "epoch": 758} {"train_loss": -20.156951904296875, "global_step": 62922, "epoch": 758} {"train_loss": -20.152297973632812, "global_step": 62923, "epoch": 758} {"train_loss": -20.132766723632812, "global_step": 62924, "epoch": 758} {"train_loss": -20.20783233642578, "global_step": 62925, "epoch": 758} {"train_loss": -20.5316219329834, "global_step": 62926, "epoch": 758} {"train_loss": -20.507545471191406, "global_step": 62927, "epoch": 758} {"train_loss": -20.40785789489746, "global_step": 62928, "epoch": 758} {"train_loss": -20.3276424407959, "global_step": 62929, "epoch": 758} {"train_loss": -20.00187873840332, "global_step": 62930, "epoch": 758} {"train_loss": -20.40291404724121, "global_step": 62931, "epoch": 758} {"train_loss": -20.68511962890625, "global_step": 62932, "epoch": 758} {"train_loss": -20.25237464904785, "global_step": 62933, "epoch": 758} {"train_loss": -20.28104019165039, "global_step": 62934, "epoch": 758} {"train_loss": -20.335859298706055, "global_step": 62935, "epoch": 758} {"train_loss": -20.463638305664062, "global_step": 62936, "epoch": 758} {"train_loss": -20.29197120666504, "global_step": 62937, "epoch": 758} {"train_loss": -20.83601188659668, "global_step": 62938, "epoch": 758} {"train_loss": -20.362241744995117, "global_step": 62939, "epoch": 758} {"train_loss": -20.24957847595215, "global_step": 62940, "epoch": 758} {"train_loss": -20.518964767456055, "global_step": 62941, "epoch": 758} {"train_loss": -20.207143783569336, "global_step": 62942, "epoch": 758} {"train_loss": -20.477163314819336, "global_step": 62943, "epoch": 758} {"train_loss": -20.80037498474121, "global_step": 62944, "epoch": 758} {"train_loss": -20.355283737182617, "global_step": 62945, "epoch": 758} {"train_loss": -20.34551239013672, "global_step": 62946, "epoch": 758} {"train_loss": -20.36672592163086, "global_step": 62947, "epoch": 758} {"train_loss": -20.548721313476562, "global_step": 62948, "epoch": 758} {"train_loss": -20.48567008972168, "global_step": 62949, "epoch": 758} {"train_loss": -20.551048278808594, "global_step": 62950, "epoch": 758} {"train_loss": -20.686037063598633, "global_step": 62951, "epoch": 758} {"train_loss": -20.793079376220703, "global_step": 62952, "epoch": 758} {"train_loss": -20.599271774291992, "global_step": 62953, "epoch": 758} {"train_loss": -20.2545166015625, "global_step": 62954, "epoch": 758} {"train_loss": -20.44685935974121, "global_step": 62955, "epoch": 758} {"train_loss": -20.71929359436035, "global_step": 62956, "epoch": 758} {"train_loss": -20.813634872436523, "global_step": 62957, "epoch": 758} {"train_loss": -20.823617935180664, "global_step": 62958, "epoch": 758} {"train_loss": -20.959259033203125, "global_step": 62959, "epoch": 758} {"train_loss": -20.275365829467773, "global_step": 62960, "epoch": 758} {"train_loss": -20.5394344329834, "global_step": 62961, "epoch": 758} {"train_loss": -20.556068420410156, "global_step": 62962, "epoch": 758} {"train_loss": -20.327116012573242, "global_step": 62963, "epoch": 758} {"train_loss": -20.587291717529297, "global_step": 62964, "epoch": 758} {"train_loss": -21.00763511657715, "global_step": 62965, "epoch": 758} {"train_loss": -19.892196655273438, "global_step": 62966, "epoch": 758} {"train_loss": -20.487667083740234, "global_step": 62967, "epoch": 758} {"train_loss": -20.79054832458496, "global_step": 62968, "epoch": 758} {"train_loss": -20.388051986694336, "global_step": 62969, "epoch": 758} {"train_loss": -20.066226959228516, "global_step": 62970, "epoch": 758} {"train_loss": -20.641443252563477, "global_step": 62971, "epoch": 758} {"train_loss": -20.607091903686523, "global_step": 62972, "epoch": 758} {"train_loss": -20.491222381591797, "global_step": 62973, "epoch": 758} {"train_loss": -20.627914428710938, "global_step": 62974, "epoch": 758} {"train_loss": -20.651588439941406, "global_step": 62975, "epoch": 758} {"train_loss": -20.612329483032227, "global_step": 62976, "epoch": 758} {"train_loss": -20.63642120361328, "global_step": 62977, "epoch": 758} {"train_loss": -20.690282821655273, "global_step": 62978, "epoch": 758} {"train_loss": -20.513019561767578, "global_step": 62979, "epoch": 758} {"train_loss": -20.352643966674805, "global_step": 62980, "epoch": 758} {"train_loss": -20.616262435913086, "global_step": 62981, "epoch": 758} {"train_loss": -20.5655460357666, "global_step": 62982, "epoch": 758} {"train_loss": -20.775232315063477, "global_step": 62983, "epoch": 758} {"train_loss": -20.513940811157227, "global_step": 62984, "epoch": 758} {"train_loss": -20.560577392578125, "global_step": 62985, "epoch": 758} {"train_loss": -20.37986183166504, "global_step": 62986, "epoch": 758} {"train_loss": -20.460481643676758, "global_step": 62987, "epoch": 758} {"train_loss": -20.580392837524414, "global_step": 62988, "epoch": 758} {"train_loss": -20.3928279876709, "global_step": 62989, "epoch": 758} {"train_loss": -20.47178840637207, "global_step": 62990, "epoch": 758} {"train_loss": -20.81178092956543, "global_step": 62991, "epoch": 758} {"train_loss": -20.56312370300293, "global_step": 62992, "epoch": 758} {"train_loss": -20.515106201171875, "global_step": 62993, "epoch": 758} {"train_loss": -20.549978256225586, "global_step": 62994, "epoch": 758} {"train_loss": -20.03931999206543, "global_step": 62995, "epoch": 758} {"train_loss": -20.463423579572193, "global_step": 62996, "epoch": 758, "val_loss": 6003606.5} {"train_loss": -19.92059898376465, "global_step": 62997, "epoch": 759} {"train_loss": -20.22873306274414, "global_step": 62998, "epoch": 759} {"train_loss": -20.099716186523438, "global_step": 62999, "epoch": 759} {"train_loss": -20.501440048217773, "global_step": 63000, "epoch": 759} {"train_loss": -20.405248641967773, "global_step": 63001, "epoch": 759} {"train_loss": -20.29609489440918, "global_step": 63002, "epoch": 759} {"train_loss": -20.405424118041992, "global_step": 63003, "epoch": 759} {"train_loss": -19.828527450561523, "global_step": 63004, "epoch": 759} {"train_loss": -20.343931198120117, "global_step": 63005, "epoch": 759} {"train_loss": -19.86333656311035, "global_step": 63006, "epoch": 759} {"train_loss": -20.448108673095703, "global_step": 63007, "epoch": 759} {"train_loss": -20.663293838500977, "global_step": 63008, "epoch": 759} {"train_loss": -20.786130905151367, "global_step": 63009, "epoch": 759} {"train_loss": -20.56553840637207, "global_step": 63010, "epoch": 759} {"train_loss": -20.490243911743164, "global_step": 63011, "epoch": 759} {"train_loss": -20.226181030273438, "global_step": 63012, "epoch": 759} {"train_loss": -20.975238800048828, "global_step": 63013, "epoch": 759} {"train_loss": -20.74240493774414, "global_step": 63014, "epoch": 759} {"train_loss": -20.641738891601562, "global_step": 63015, "epoch": 759} {"train_loss": -20.349355697631836, "global_step": 63016, "epoch": 759} {"train_loss": -20.471445083618164, "global_step": 63017, "epoch": 759} {"train_loss": -20.532983779907227, "global_step": 63018, "epoch": 759} {"train_loss": -20.010730743408203, "global_step": 63019, "epoch": 759} {"train_loss": -20.550535202026367, "global_step": 63020, "epoch": 759} {"train_loss": -20.15376091003418, "global_step": 63021, "epoch": 759} {"train_loss": -20.584657669067383, "global_step": 63022, "epoch": 759} {"train_loss": -20.687589645385742, "global_step": 63023, "epoch": 759} {"train_loss": -20.645877838134766, "global_step": 63024, "epoch": 759} {"train_loss": -20.77571678161621, "global_step": 63025, "epoch": 759} {"train_loss": -20.397907257080078, "global_step": 63026, "epoch": 759} {"train_loss": -20.597686767578125, "global_step": 63027, "epoch": 759} {"train_loss": -20.151151657104492, "global_step": 63028, "epoch": 759} {"train_loss": -20.26151466369629, "global_step": 63029, "epoch": 759} {"train_loss": -20.48298454284668, "global_step": 63030, "epoch": 759} {"train_loss": -20.753671646118164, "global_step": 63031, "epoch": 759} {"train_loss": -20.3963680267334, "global_step": 63032, "epoch": 759} {"train_loss": -20.14361572265625, "global_step": 63033, "epoch": 759} {"train_loss": -19.974262237548828, "global_step": 63034, "epoch": 759} {"train_loss": -20.36126136779785, "global_step": 63035, "epoch": 759} {"train_loss": -20.274269104003906, "global_step": 63036, "epoch": 759} {"train_loss": -20.477794647216797, "global_step": 63037, "epoch": 759} {"train_loss": -20.54714012145996, "global_step": 63038, "epoch": 759} {"train_loss": -20.648351669311523, "global_step": 63039, "epoch": 759} {"train_loss": -20.304061889648438, "global_step": 63040, "epoch": 759} {"train_loss": -20.52754020690918, "global_step": 63041, "epoch": 759} {"train_loss": -20.350820541381836, "global_step": 63042, "epoch": 759} {"train_loss": -20.48914909362793, "global_step": 63043, "epoch": 759} {"train_loss": -20.3400936126709, "global_step": 63044, "epoch": 759} {"train_loss": -20.29624366760254, "global_step": 63045, "epoch": 759} {"train_loss": -20.76338768005371, "global_step": 63046, "epoch": 759} {"train_loss": -20.34335708618164, "global_step": 63047, "epoch": 759} {"train_loss": -20.59819221496582, "global_step": 63048, "epoch": 759} {"train_loss": -20.531452178955078, "global_step": 63049, "epoch": 759} {"train_loss": -20.661535263061523, "global_step": 63050, "epoch": 759} {"train_loss": -20.52635383605957, "global_step": 63051, "epoch": 759} {"train_loss": -20.429792404174805, "global_step": 63052, "epoch": 759} {"train_loss": -20.261972427368164, "global_step": 63053, "epoch": 759} {"train_loss": -20.511388778686523, "global_step": 63054, "epoch": 759} {"train_loss": -20.687097549438477, "global_step": 63055, "epoch": 759} {"train_loss": -20.561376571655273, "global_step": 63056, "epoch": 759} {"train_loss": -20.114717483520508, "global_step": 63057, "epoch": 759} {"train_loss": -20.295143127441406, "global_step": 63058, "epoch": 759} {"train_loss": -20.69978904724121, "global_step": 63059, "epoch": 759} {"train_loss": -20.643407821655273, "global_step": 63060, "epoch": 759} {"train_loss": -20.566303253173828, "global_step": 63061, "epoch": 759} {"train_loss": -20.4593563079834, "global_step": 63062, "epoch": 759} {"train_loss": -20.694429397583008, "global_step": 63063, "epoch": 759} {"train_loss": -20.777212142944336, "global_step": 63064, "epoch": 759} {"train_loss": -20.392118453979492, "global_step": 63065, "epoch": 759} {"train_loss": -20.766080856323242, "global_step": 63066, "epoch": 759} {"train_loss": -20.8013916015625, "global_step": 63067, "epoch": 759} {"train_loss": -20.41446304321289, "global_step": 63068, "epoch": 759} {"train_loss": -20.775415420532227, "global_step": 63069, "epoch": 759} {"train_loss": -20.729848861694336, "global_step": 63070, "epoch": 759} {"train_loss": -20.1957950592041, "global_step": 63071, "epoch": 759} {"train_loss": -20.440628051757812, "global_step": 63072, "epoch": 759} {"train_loss": -20.477739334106445, "global_step": 63073, "epoch": 759} {"train_loss": -20.257352828979492, "global_step": 63074, "epoch": 759} {"train_loss": -20.847448348999023, "global_step": 63075, "epoch": 759} {"train_loss": -20.61895751953125, "global_step": 63076, "epoch": 759} {"train_loss": -20.37700653076172, "global_step": 63077, "epoch": 759} {"train_loss": -21.112335205078125, "global_step": 63078, "epoch": 759} {"train_loss": -20.474848460002118, "global_step": 63079, "epoch": 759, "val_loss": 5951246.0} {"train_loss": -19.702239990234375, "global_step": 63080, "epoch": 760} {"train_loss": -20.69343376159668, "global_step": 63081, "epoch": 760} {"train_loss": -20.204862594604492, "global_step": 63082, "epoch": 760} {"train_loss": -20.038394927978516, "global_step": 63083, "epoch": 760} {"train_loss": -20.3132381439209, "global_step": 63084, "epoch": 760} {"train_loss": -20.261503219604492, "global_step": 63085, "epoch": 760} {"train_loss": -20.132993698120117, "global_step": 63086, "epoch": 760} {"train_loss": -20.595693588256836, "global_step": 63087, "epoch": 760} {"train_loss": -20.37250518798828, "global_step": 63088, "epoch": 760} {"train_loss": -20.106916427612305, "global_step": 63089, "epoch": 760} {"train_loss": -20.066646575927734, "global_step": 63090, "epoch": 760} {"train_loss": -20.387155532836914, "global_step": 63091, "epoch": 760} {"train_loss": -20.322004318237305, "global_step": 63092, "epoch": 760} {"train_loss": -20.609846115112305, "global_step": 63093, "epoch": 760} {"train_loss": -20.158933639526367, "global_step": 63094, "epoch": 760} {"train_loss": -20.245370864868164, "global_step": 63095, "epoch": 760} {"train_loss": -20.62343978881836, "global_step": 63096, "epoch": 760} {"train_loss": -20.528966903686523, "global_step": 63097, "epoch": 760} {"train_loss": -20.539581298828125, "global_step": 63098, "epoch": 760} {"train_loss": -20.63716697692871, "global_step": 63099, "epoch": 760} {"train_loss": -20.608261108398438, "global_step": 63100, "epoch": 760} {"train_loss": -20.214635848999023, "global_step": 63101, "epoch": 760} {"train_loss": -20.839866638183594, "global_step": 63102, "epoch": 760} {"train_loss": -20.374223709106445, "global_step": 63103, "epoch": 760} {"train_loss": -20.31463050842285, "global_step": 63104, "epoch": 760} {"train_loss": -20.690879821777344, "global_step": 63105, "epoch": 760} {"train_loss": -20.53470802307129, "global_step": 63106, "epoch": 760} {"train_loss": -20.403465270996094, "global_step": 63107, "epoch": 760} {"train_loss": -20.719717025756836, "global_step": 63108, "epoch": 760} {"train_loss": -20.33556365966797, "global_step": 63109, "epoch": 760} {"train_loss": -20.484848022460938, "global_step": 63110, "epoch": 760} {"train_loss": -20.329177856445312, "global_step": 63111, "epoch": 760} {"train_loss": -20.446208953857422, "global_step": 63112, "epoch": 760} {"train_loss": -20.652441024780273, "global_step": 63113, "epoch": 760} {"train_loss": -20.72709846496582, "global_step": 63114, "epoch": 760} {"train_loss": -20.502750396728516, "global_step": 63115, "epoch": 760} {"train_loss": -20.426427841186523, "global_step": 63116, "epoch": 760} {"train_loss": -20.50626564025879, "global_step": 63117, "epoch": 760} {"train_loss": -20.93560791015625, "global_step": 63118, "epoch": 760} {"train_loss": -20.901687622070312, "global_step": 63119, "epoch": 760} {"train_loss": -20.497419357299805, "global_step": 63120, "epoch": 760} {"train_loss": -20.79729652404785, "global_step": 63121, "epoch": 760} {"train_loss": -20.3455753326416, "global_step": 63122, "epoch": 760} {"train_loss": -20.66053581237793, "global_step": 63123, "epoch": 760} {"train_loss": -20.353246688842773, "global_step": 63124, "epoch": 760} {"train_loss": -20.728899002075195, "global_step": 63125, "epoch": 760} {"train_loss": -20.67571449279785, "global_step": 63126, "epoch": 760} {"train_loss": -20.60426139831543, "global_step": 63127, "epoch": 760} {"train_loss": -20.4431209564209, "global_step": 63128, "epoch": 760} {"train_loss": -20.37010955810547, "global_step": 63129, "epoch": 760} {"train_loss": -20.954172134399414, "global_step": 63130, "epoch": 760} {"train_loss": -20.42441177368164, "global_step": 63131, "epoch": 760} {"train_loss": -20.317659378051758, "global_step": 63132, "epoch": 760} {"train_loss": -20.398101806640625, "global_step": 63133, "epoch": 760} {"train_loss": -20.471647262573242, "global_step": 63134, "epoch": 760} {"train_loss": -20.083097457885742, "global_step": 63135, "epoch": 760} {"train_loss": -20.543704986572266, "global_step": 63136, "epoch": 760} {"train_loss": -20.82941436767578, "global_step": 63137, "epoch": 760} {"train_loss": -20.192581176757812, "global_step": 63138, "epoch": 760} {"train_loss": -20.24982261657715, "global_step": 63139, "epoch": 760} {"train_loss": -20.036693572998047, "global_step": 63140, "epoch": 760} {"train_loss": -20.42453384399414, "global_step": 63141, "epoch": 760} {"train_loss": -20.63275146484375, "global_step": 63142, "epoch": 760} {"train_loss": -20.354293823242188, "global_step": 63143, "epoch": 760} {"train_loss": -20.271108627319336, "global_step": 63144, "epoch": 760} {"train_loss": -20.34047508239746, "global_step": 63145, "epoch": 760} {"train_loss": -20.413389205932617, "global_step": 63146, "epoch": 760} {"train_loss": -20.44451332092285, "global_step": 63147, "epoch": 760} {"train_loss": -20.546218872070312, "global_step": 63148, "epoch": 760} {"train_loss": -20.420988082885742, "global_step": 63149, "epoch": 760} {"train_loss": -20.469205856323242, "global_step": 63150, "epoch": 760} {"train_loss": -20.893428802490234, "global_step": 63151, "epoch": 760} {"train_loss": -20.752777099609375, "global_step": 63152, "epoch": 760} {"train_loss": -20.716445922851562, "global_step": 63153, "epoch": 760} {"train_loss": -20.83376693725586, "global_step": 63154, "epoch": 760} {"train_loss": -20.44771957397461, "global_step": 63155, "epoch": 760} {"train_loss": -20.479206085205078, "global_step": 63156, "epoch": 760} {"train_loss": -20.500640869140625, "global_step": 63157, "epoch": 760} {"train_loss": -20.51997947692871, "global_step": 63158, "epoch": 760} {"train_loss": -20.400484085083008, "global_step": 63159, "epoch": 760} {"train_loss": -20.73609733581543, "global_step": 63160, "epoch": 760} {"train_loss": -20.477970123291016, "global_step": 63161, "epoch": 760} {"train_loss": -20.455403385392156, "global_step": 63162, "epoch": 760, "val_loss": 5970399.0} {"train_loss": -20.111570358276367, "global_step": 63163, "epoch": 761} {"train_loss": -20.211938858032227, "global_step": 63164, "epoch": 761} {"train_loss": -20.210790634155273, "global_step": 63165, "epoch": 761} {"train_loss": -20.467178344726562, "global_step": 63166, "epoch": 761} {"train_loss": -20.710355758666992, "global_step": 63167, "epoch": 761} {"train_loss": -20.206851959228516, "global_step": 63168, "epoch": 761} {"train_loss": -20.391603469848633, "global_step": 63169, "epoch": 761} {"train_loss": -20.885908126831055, "global_step": 63170, "epoch": 761} {"train_loss": -20.2359676361084, "global_step": 63171, "epoch": 761} {"train_loss": -20.167165756225586, "global_step": 63172, "epoch": 761} {"train_loss": -20.037012100219727, "global_step": 63173, "epoch": 761} {"train_loss": -20.40450096130371, "global_step": 63174, "epoch": 761} {"train_loss": -20.282339096069336, "global_step": 63175, "epoch": 761} {"train_loss": -20.62987518310547, "global_step": 63176, "epoch": 761} {"train_loss": -20.612329483032227, "global_step": 63177, "epoch": 761} {"train_loss": -20.204944610595703, "global_step": 63178, "epoch": 761} {"train_loss": -20.382675170898438, "global_step": 63179, "epoch": 761} {"train_loss": -20.338281631469727, "global_step": 63180, "epoch": 761} {"train_loss": -20.373023986816406, "global_step": 63181, "epoch": 761} {"train_loss": -20.71685791015625, "global_step": 63182, "epoch": 761} {"train_loss": -20.41468620300293, "global_step": 63183, "epoch": 761} {"train_loss": -20.626869201660156, "global_step": 63184, "epoch": 761} {"train_loss": -20.59465217590332, "global_step": 63185, "epoch": 761} {"train_loss": -20.14400291442871, "global_step": 63186, "epoch": 761} {"train_loss": -20.45465660095215, "global_step": 63187, "epoch": 761} {"train_loss": -20.397897720336914, "global_step": 63188, "epoch": 761} {"train_loss": -20.297529220581055, "global_step": 63189, "epoch": 761} {"train_loss": -20.6471004486084, "global_step": 63190, "epoch": 761} {"train_loss": -20.47420883178711, "global_step": 63191, "epoch": 761} {"train_loss": -20.6054744720459, "global_step": 63192, "epoch": 761} {"train_loss": -20.439123153686523, "global_step": 63193, "epoch": 761} {"train_loss": -20.419200897216797, "global_step": 63194, "epoch": 761} {"train_loss": -20.433547973632812, "global_step": 63195, "epoch": 761} {"train_loss": -20.856515884399414, "global_step": 63196, "epoch": 761} {"train_loss": -20.59556770324707, "global_step": 63197, "epoch": 761} {"train_loss": -20.619274139404297, "global_step": 63198, "epoch": 761} {"train_loss": -20.378583908081055, "global_step": 63199, "epoch": 761} {"train_loss": -20.718379974365234, "global_step": 63200, "epoch": 761} {"train_loss": -20.44831657409668, "global_step": 63201, "epoch": 761} {"train_loss": -20.906463623046875, "global_step": 63202, "epoch": 761} {"train_loss": -20.730960845947266, "global_step": 63203, "epoch": 761} {"train_loss": -20.807775497436523, "global_step": 63204, "epoch": 761} {"train_loss": -20.676538467407227, "global_step": 63205, "epoch": 761} {"train_loss": -20.80865478515625, "global_step": 63206, "epoch": 761} {"train_loss": -20.908308029174805, "global_step": 63207, "epoch": 761} {"train_loss": -20.578840255737305, "global_step": 63208, "epoch": 761} {"train_loss": -20.453887939453125, "global_step": 63209, "epoch": 761} {"train_loss": -20.532190322875977, "global_step": 63210, "epoch": 761} {"train_loss": -20.57978630065918, "global_step": 63211, "epoch": 761} {"train_loss": -20.20825958251953, "global_step": 63212, "epoch": 761} {"train_loss": -20.528461456298828, "global_step": 63213, "epoch": 761} {"train_loss": -20.330976486206055, "global_step": 63214, "epoch": 761} {"train_loss": -20.795743942260742, "global_step": 63215, "epoch": 761} {"train_loss": -20.55466079711914, "global_step": 63216, "epoch": 761} {"train_loss": -20.20383071899414, "global_step": 63217, "epoch": 761} {"train_loss": -20.574369430541992, "global_step": 63218, "epoch": 761} {"train_loss": -20.54751968383789, "global_step": 63219, "epoch": 761} {"train_loss": -20.875696182250977, "global_step": 63220, "epoch": 761} {"train_loss": -20.508989334106445, "global_step": 63221, "epoch": 761} {"train_loss": -20.531280517578125, "global_step": 63222, "epoch": 761} {"train_loss": -20.410219192504883, "global_step": 63223, "epoch": 761} {"train_loss": -20.54952049255371, "global_step": 63224, "epoch": 761} {"train_loss": -20.434995651245117, "global_step": 63225, "epoch": 761} {"train_loss": -20.30649185180664, "global_step": 63226, "epoch": 761} {"train_loss": -20.18398094177246, "global_step": 63227, "epoch": 761} {"train_loss": -20.755373001098633, "global_step": 63228, "epoch": 761} {"train_loss": -20.47657585144043, "global_step": 63229, "epoch": 761} {"train_loss": -20.6781005859375, "global_step": 63230, "epoch": 761} {"train_loss": -20.573993682861328, "global_step": 63231, "epoch": 761} {"train_loss": -20.919858932495117, "global_step": 63232, "epoch": 761} {"train_loss": -20.255643844604492, "global_step": 63233, "epoch": 761} {"train_loss": -20.57637596130371, "global_step": 63234, "epoch": 761} {"train_loss": -20.518617630004883, "global_step": 63235, "epoch": 761} {"train_loss": -20.785968780517578, "global_step": 63236, "epoch": 761} {"train_loss": -20.306825637817383, "global_step": 63237, "epoch": 761} {"train_loss": -21.191692352294922, "global_step": 63238, "epoch": 761} {"train_loss": -20.526700973510742, "global_step": 63239, "epoch": 761} {"train_loss": -20.504919052124023, "global_step": 63240, "epoch": 761} {"train_loss": -20.397680282592773, "global_step": 63241, "epoch": 761} {"train_loss": -20.409347534179688, "global_step": 63242, "epoch": 761} {"train_loss": -20.97218894958496, "global_step": 63243, "epoch": 761} {"train_loss": -20.56740379333496, "global_step": 63244, "epoch": 761} {"train_loss": -20.518425539315466, "global_step": 63245, "epoch": 761, "val_loss": 5977230.5} {"train_loss": -19.781335830688477, "global_step": 63246, "epoch": 762} {"train_loss": -20.520009994506836, "global_step": 63247, "epoch": 762} {"train_loss": -20.020105361938477, "global_step": 63248, "epoch": 762} {"train_loss": -19.964447021484375, "global_step": 63249, "epoch": 762} {"train_loss": -20.127275466918945, "global_step": 63250, "epoch": 762} {"train_loss": -20.245861053466797, "global_step": 63251, "epoch": 762} {"train_loss": -20.248504638671875, "global_step": 63252, "epoch": 762} {"train_loss": -20.36884307861328, "global_step": 63253, "epoch": 762} {"train_loss": -20.225095748901367, "global_step": 63254, "epoch": 762} {"train_loss": -20.34149742126465, "global_step": 63255, "epoch": 762} {"train_loss": -20.71400260925293, "global_step": 63256, "epoch": 762} {"train_loss": -20.6599178314209, "global_step": 63257, "epoch": 762} {"train_loss": -20.073272705078125, "global_step": 63258, "epoch": 762} {"train_loss": -20.145334243774414, "global_step": 63259, "epoch": 762} {"train_loss": -20.314786911010742, "global_step": 63260, "epoch": 762} {"train_loss": -20.744558334350586, "global_step": 63261, "epoch": 762} {"train_loss": -20.2926082611084, "global_step": 63262, "epoch": 762} {"train_loss": -20.50543212890625, "global_step": 63263, "epoch": 762} {"train_loss": -20.55323600769043, "global_step": 63264, "epoch": 762} {"train_loss": -20.556100845336914, "global_step": 63265, "epoch": 762} {"train_loss": -20.576650619506836, "global_step": 63266, "epoch": 762} {"train_loss": -20.715688705444336, "global_step": 63267, "epoch": 762} {"train_loss": -20.536882400512695, "global_step": 63268, "epoch": 762} {"train_loss": -20.67793083190918, "global_step": 63269, "epoch": 762} {"train_loss": -20.416248321533203, "global_step": 63270, "epoch": 762} {"train_loss": -20.550825119018555, "global_step": 63271, "epoch": 762} {"train_loss": -20.389158248901367, "global_step": 63272, "epoch": 762} {"train_loss": -20.455015182495117, "global_step": 63273, "epoch": 762} {"train_loss": -20.214582443237305, "global_step": 63274, "epoch": 762} {"train_loss": -20.65471839904785, "global_step": 63275, "epoch": 762} {"train_loss": -20.37679672241211, "global_step": 63276, "epoch": 762} {"train_loss": -20.632171630859375, "global_step": 63277, "epoch": 762} {"train_loss": -20.147499084472656, "global_step": 63278, "epoch": 762} {"train_loss": -20.4688777923584, "global_step": 63279, "epoch": 762} {"train_loss": -20.654632568359375, "global_step": 63280, "epoch": 762} {"train_loss": -20.461515426635742, "global_step": 63281, "epoch": 762} {"train_loss": -20.55889892578125, "global_step": 63282, "epoch": 762} {"train_loss": -20.797880172729492, "global_step": 63283, "epoch": 762} {"train_loss": -20.429365158081055, "global_step": 63284, "epoch": 762} {"train_loss": -20.506799697875977, "global_step": 63285, "epoch": 762} {"train_loss": -20.63920021057129, "global_step": 63286, "epoch": 762} {"train_loss": -20.49347496032715, "global_step": 63287, "epoch": 762} {"train_loss": -20.66312599182129, "global_step": 63288, "epoch": 762} {"train_loss": -20.68842124938965, "global_step": 63289, "epoch": 762} {"train_loss": -20.45378875732422, "global_step": 63290, "epoch": 762} {"train_loss": -20.2636775970459, "global_step": 63291, "epoch": 762} {"train_loss": -20.45460319519043, "global_step": 63292, "epoch": 762} {"train_loss": -20.69484519958496, "global_step": 63293, "epoch": 762} {"train_loss": -20.52191162109375, "global_step": 63294, "epoch": 762} {"train_loss": -20.600370407104492, "global_step": 63295, "epoch": 762} {"train_loss": -20.655237197875977, "global_step": 63296, "epoch": 762} {"train_loss": -20.403369903564453, "global_step": 63297, "epoch": 762} {"train_loss": -20.561288833618164, "global_step": 63298, "epoch": 762} {"train_loss": -20.573514938354492, "global_step": 63299, "epoch": 762} {"train_loss": -20.493104934692383, "global_step": 63300, "epoch": 762} {"train_loss": -20.621931076049805, "global_step": 63301, "epoch": 762} {"train_loss": -20.74543571472168, "global_step": 63302, "epoch": 762} {"train_loss": -20.37214469909668, "global_step": 63303, "epoch": 762} {"train_loss": -20.667978286743164, "global_step": 63304, "epoch": 762} {"train_loss": -20.697233200073242, "global_step": 63305, "epoch": 762} {"train_loss": -20.359455108642578, "global_step": 63306, "epoch": 762} {"train_loss": -20.696557998657227, "global_step": 63307, "epoch": 762} {"train_loss": -20.4235897064209, "global_step": 63308, "epoch": 762} {"train_loss": -20.584732055664062, "global_step": 63309, "epoch": 762} {"train_loss": -20.6092586517334, "global_step": 63310, "epoch": 762} {"train_loss": -20.552560806274414, "global_step": 63311, "epoch": 762} {"train_loss": -20.392101287841797, "global_step": 63312, "epoch": 762} {"train_loss": -20.79189109802246, "global_step": 63313, "epoch": 762} {"train_loss": -20.7412109375, "global_step": 63314, "epoch": 762} {"train_loss": -20.335956573486328, "global_step": 63315, "epoch": 762} {"train_loss": -20.679096221923828, "global_step": 63316, "epoch": 762} {"train_loss": -20.174274444580078, "global_step": 63317, "epoch": 762} {"train_loss": -20.427471160888672, "global_step": 63318, "epoch": 762} {"train_loss": -20.598188400268555, "global_step": 63319, "epoch": 762} {"train_loss": -20.44745445251465, "global_step": 63320, "epoch": 762} {"train_loss": -20.321805953979492, "global_step": 63321, "epoch": 762} {"train_loss": -20.32638931274414, "global_step": 63322, "epoch": 762} {"train_loss": -20.33681297302246, "global_step": 63323, "epoch": 762} {"train_loss": -21.01021385192871, "global_step": 63324, "epoch": 762} {"train_loss": -20.13312339782715, "global_step": 63325, "epoch": 762} {"train_loss": -20.44288444519043, "global_step": 63326, "epoch": 762} {"train_loss": -20.536645889282227, "global_step": 63327, "epoch": 762} {"train_loss": -20.48068170662386, "global_step": 63328, "epoch": 762, "val_loss": 5978711.0} {"train_loss": -19.562204360961914, "global_step": 63329, "epoch": 763} {"train_loss": -19.92923927307129, "global_step": 63330, "epoch": 763} {"train_loss": -20.86774444580078, "global_step": 63331, "epoch": 763} {"train_loss": -20.313764572143555, "global_step": 63332, "epoch": 763} {"train_loss": -20.3361759185791, "global_step": 63333, "epoch": 763} {"train_loss": -20.299955368041992, "global_step": 63334, "epoch": 763} {"train_loss": -20.36016845703125, "global_step": 63335, "epoch": 763} {"train_loss": -20.291446685791016, "global_step": 63336, "epoch": 763} {"train_loss": -20.626441955566406, "global_step": 63337, "epoch": 763} {"train_loss": -20.531028747558594, "global_step": 63338, "epoch": 763} {"train_loss": -20.3528995513916, "global_step": 63339, "epoch": 763} {"train_loss": -20.50482749938965, "global_step": 63340, "epoch": 763} {"train_loss": -20.68470573425293, "global_step": 63341, "epoch": 763} {"train_loss": -20.304462432861328, "global_step": 63342, "epoch": 763} {"train_loss": -20.495220184326172, "global_step": 63343, "epoch": 763} {"train_loss": -20.781261444091797, "global_step": 63344, "epoch": 763} {"train_loss": -20.56641960144043, "global_step": 63345, "epoch": 763} {"train_loss": -20.38446617126465, "global_step": 63346, "epoch": 763} {"train_loss": -20.559221267700195, "global_step": 63347, "epoch": 763} {"train_loss": -20.765460968017578, "global_step": 63348, "epoch": 763} {"train_loss": -20.416364669799805, "global_step": 63349, "epoch": 763} {"train_loss": -20.468839645385742, "global_step": 63350, "epoch": 763} {"train_loss": -20.754974365234375, "global_step": 63351, "epoch": 763} {"train_loss": -20.636585235595703, "global_step": 63352, "epoch": 763} {"train_loss": -21.0090274810791, "global_step": 63353, "epoch": 763} {"train_loss": -20.770462036132812, "global_step": 63354, "epoch": 763} {"train_loss": -20.478397369384766, "global_step": 63355, "epoch": 763} {"train_loss": -20.460203170776367, "global_step": 63356, "epoch": 763} {"train_loss": -20.371957778930664, "global_step": 63357, "epoch": 763} {"train_loss": -20.831117630004883, "global_step": 63358, "epoch": 763} {"train_loss": -20.482364654541016, "global_step": 63359, "epoch": 763} {"train_loss": -20.3248348236084, "global_step": 63360, "epoch": 763} {"train_loss": -20.230836868286133, "global_step": 63361, "epoch": 763} {"train_loss": -20.364194869995117, "global_step": 63362, "epoch": 763} {"train_loss": -20.81573486328125, "global_step": 63363, "epoch": 763} {"train_loss": -20.23701286315918, "global_step": 63364, "epoch": 763} {"train_loss": -20.514484405517578, "global_step": 63365, "epoch": 763} {"train_loss": -20.331073760986328, "global_step": 63366, "epoch": 763} {"train_loss": -20.51964569091797, "global_step": 63367, "epoch": 763} {"train_loss": -20.71188735961914, "global_step": 63368, "epoch": 763} {"train_loss": -20.19574546813965, "global_step": 63369, "epoch": 763} {"train_loss": -20.284038543701172, "global_step": 63370, "epoch": 763} {"train_loss": -20.608394622802734, "global_step": 63371, "epoch": 763} {"train_loss": -20.363300323486328, "global_step": 63372, "epoch": 763} {"train_loss": -20.590089797973633, "global_step": 63373, "epoch": 763} {"train_loss": -21.06242561340332, "global_step": 63374, "epoch": 763} {"train_loss": -20.769729614257812, "global_step": 63375, "epoch": 763} {"train_loss": -20.67259979248047, "global_step": 63376, "epoch": 763} {"train_loss": -20.7127742767334, "global_step": 63377, "epoch": 763} {"train_loss": -20.236299514770508, "global_step": 63378, "epoch": 763} {"train_loss": -20.692285537719727, "global_step": 63379, "epoch": 763} {"train_loss": -20.838834762573242, "global_step": 63380, "epoch": 763} {"train_loss": -20.527984619140625, "global_step": 63381, "epoch": 763} {"train_loss": -20.701204299926758, "global_step": 63382, "epoch": 763} {"train_loss": -20.520105361938477, "global_step": 63383, "epoch": 763} {"train_loss": -20.572370529174805, "global_step": 63384, "epoch": 763} {"train_loss": -20.867490768432617, "global_step": 63385, "epoch": 763} {"train_loss": -20.957111358642578, "global_step": 63386, "epoch": 763} {"train_loss": -20.532888412475586, "global_step": 63387, "epoch": 763} {"train_loss": -20.630966186523438, "global_step": 63388, "epoch": 763} {"train_loss": -20.436649322509766, "global_step": 63389, "epoch": 763} {"train_loss": -20.599624633789062, "global_step": 63390, "epoch": 763} {"train_loss": -20.249181747436523, "global_step": 63391, "epoch": 763} {"train_loss": -20.611242294311523, "global_step": 63392, "epoch": 763} {"train_loss": -20.493165969848633, "global_step": 63393, "epoch": 763} {"train_loss": -20.672992706298828, "global_step": 63394, "epoch": 763} {"train_loss": -19.85004997253418, "global_step": 63395, "epoch": 763} {"train_loss": -20.391000747680664, "global_step": 63396, "epoch": 763} {"train_loss": -20.631439208984375, "global_step": 63397, "epoch": 763} {"train_loss": -20.67827606201172, "global_step": 63398, "epoch": 763} {"train_loss": -20.53824806213379, "global_step": 63399, "epoch": 763} {"train_loss": -20.481569290161133, "global_step": 63400, "epoch": 763} {"train_loss": -20.15728187561035, "global_step": 63401, "epoch": 763} {"train_loss": -20.299787521362305, "global_step": 63402, "epoch": 763} {"train_loss": -20.547903060913086, "global_step": 63403, "epoch": 763} {"train_loss": -20.72017478942871, "global_step": 63404, "epoch": 763} {"train_loss": -20.440223693847656, "global_step": 63405, "epoch": 763} {"train_loss": -20.415788650512695, "global_step": 63406, "epoch": 763} {"train_loss": -20.358612060546875, "global_step": 63407, "epoch": 763} {"train_loss": -20.599624633789062, "global_step": 63408, "epoch": 763} {"train_loss": -20.405174255371094, "global_step": 63409, "epoch": 763} {"train_loss": -20.4088191986084, "global_step": 63410, "epoch": 763} {"train_loss": -20.51509563032403, "global_step": 63411, "epoch": 763, "val_loss": 5926251.0} {"train_loss": -20.32830810546875, "global_step": 63412, "epoch": 764} {"train_loss": -20.305940628051758, "global_step": 63413, "epoch": 764} {"train_loss": -20.371015548706055, "global_step": 63414, "epoch": 764} {"train_loss": -19.99651336669922, "global_step": 63415, "epoch": 764} {"train_loss": -19.945825576782227, "global_step": 63416, "epoch": 764} {"train_loss": -20.432170867919922, "global_step": 63417, "epoch": 764} {"train_loss": -20.25589942932129, "global_step": 63418, "epoch": 764} {"train_loss": -20.2806453704834, "global_step": 63419, "epoch": 764} {"train_loss": -20.430068969726562, "global_step": 63420, "epoch": 764} {"train_loss": -20.52179718017578, "global_step": 63421, "epoch": 764} {"train_loss": -20.386333465576172, "global_step": 63422, "epoch": 764} {"train_loss": -20.511438369750977, "global_step": 63423, "epoch": 764} {"train_loss": -20.586824417114258, "global_step": 63424, "epoch": 764} {"train_loss": -20.415149688720703, "global_step": 63425, "epoch": 764} {"train_loss": -20.36443519592285, "global_step": 63426, "epoch": 764} {"train_loss": -20.56496238708496, "global_step": 63427, "epoch": 764} {"train_loss": -20.58132553100586, "global_step": 63428, "epoch": 764} {"train_loss": -20.430715560913086, "global_step": 63429, "epoch": 764} {"train_loss": -20.625905990600586, "global_step": 63430, "epoch": 764} {"train_loss": -20.397886276245117, "global_step": 63431, "epoch": 764} {"train_loss": -20.18148422241211, "global_step": 63432, "epoch": 764} {"train_loss": -20.59668731689453, "global_step": 63433, "epoch": 764} {"train_loss": -20.515607833862305, "global_step": 63434, "epoch": 764} {"train_loss": -20.68893814086914, "global_step": 63435, "epoch": 764} {"train_loss": -20.595497131347656, "global_step": 63436, "epoch": 764} {"train_loss": -20.717214584350586, "global_step": 63437, "epoch": 764} {"train_loss": -20.376686096191406, "global_step": 63438, "epoch": 764} {"train_loss": -20.60150718688965, "global_step": 63439, "epoch": 764} {"train_loss": -20.649860382080078, "global_step": 63440, "epoch": 764} {"train_loss": -20.545881271362305, "global_step": 63441, "epoch": 764} {"train_loss": -20.911630630493164, "global_step": 63442, "epoch": 764} {"train_loss": -20.684125900268555, "global_step": 63443, "epoch": 764} {"train_loss": -20.147130966186523, "global_step": 63444, "epoch": 764} {"train_loss": -20.43476104736328, "global_step": 63445, "epoch": 764} {"train_loss": -20.562244415283203, "global_step": 63446, "epoch": 764} {"train_loss": -20.341604232788086, "global_step": 63447, "epoch": 764} {"train_loss": -20.93524742126465, "global_step": 63448, "epoch": 764} {"train_loss": -20.867525100708008, "global_step": 63449, "epoch": 764} {"train_loss": -20.725725173950195, "global_step": 63450, "epoch": 764} {"train_loss": -20.62190818786621, "global_step": 63451, "epoch": 764} {"train_loss": -20.53551483154297, "global_step": 63452, "epoch": 764} {"train_loss": -20.291812896728516, "global_step": 63453, "epoch": 764} {"train_loss": -20.781667709350586, "global_step": 63454, "epoch": 764} {"train_loss": -20.05210304260254, "global_step": 63455, "epoch": 764} {"train_loss": -20.46456527709961, "global_step": 63456, "epoch": 764} {"train_loss": -20.586584091186523, "global_step": 63457, "epoch": 764} {"train_loss": -20.710174560546875, "global_step": 63458, "epoch": 764} {"train_loss": -20.35517692565918, "global_step": 63459, "epoch": 764} {"train_loss": -20.569232940673828, "global_step": 63460, "epoch": 764} {"train_loss": -20.407983779907227, "global_step": 63461, "epoch": 764} {"train_loss": -20.605533599853516, "global_step": 63462, "epoch": 764} {"train_loss": -20.7452392578125, "global_step": 63463, "epoch": 764} {"train_loss": -20.353322982788086, "global_step": 63464, "epoch": 764} {"train_loss": -20.443674087524414, "global_step": 63465, "epoch": 764} {"train_loss": -20.752222061157227, "global_step": 63466, "epoch": 764} {"train_loss": -20.824317932128906, "global_step": 63467, "epoch": 764} {"train_loss": -20.52414321899414, "global_step": 63468, "epoch": 764} {"train_loss": -20.69370460510254, "global_step": 63469, "epoch": 764} {"train_loss": -20.414337158203125, "global_step": 63470, "epoch": 764} {"train_loss": -20.62660789489746, "global_step": 63471, "epoch": 764} {"train_loss": -20.290740966796875, "global_step": 63472, "epoch": 764} {"train_loss": -20.827001571655273, "global_step": 63473, "epoch": 764} {"train_loss": -20.4835147857666, "global_step": 63474, "epoch": 764} {"train_loss": -20.67989158630371, "global_step": 63475, "epoch": 764} {"train_loss": -20.9290828704834, "global_step": 63476, "epoch": 764} {"train_loss": -20.912458419799805, "global_step": 63477, "epoch": 764} {"train_loss": -20.790197372436523, "global_step": 63478, "epoch": 764} {"train_loss": -20.346586227416992, "global_step": 63479, "epoch": 764} {"train_loss": -20.55303955078125, "global_step": 63480, "epoch": 764} {"train_loss": -20.638519287109375, "global_step": 63481, "epoch": 764} {"train_loss": -20.7736873626709, "global_step": 63482, "epoch": 764} {"train_loss": -20.673046112060547, "global_step": 63483, "epoch": 764} {"train_loss": -20.680648803710938, "global_step": 63484, "epoch": 764} {"train_loss": -20.883787155151367, "global_step": 63485, "epoch": 764} {"train_loss": -20.589874267578125, "global_step": 63486, "epoch": 764} {"train_loss": -20.63368034362793, "global_step": 63487, "epoch": 764} {"train_loss": -20.40093231201172, "global_step": 63488, "epoch": 764} {"train_loss": -20.57147216796875, "global_step": 63489, "epoch": 764} {"train_loss": -20.77540397644043, "global_step": 63490, "epoch": 764} {"train_loss": -20.56442642211914, "global_step": 63491, "epoch": 764} {"train_loss": -20.8886661529541, "global_step": 63492, "epoch": 764} {"train_loss": -20.613309860229492, "global_step": 63493, "epoch": 764} {"train_loss": -20.53523642758289, "global_step": 63494, "epoch": 764, "val_loss": 6026429.0} {"train_loss": -20.106534957885742, "global_step": 63495, "epoch": 765} {"train_loss": -20.38926887512207, "global_step": 63496, "epoch": 765} {"train_loss": -20.525304794311523, "global_step": 63497, "epoch": 765} {"train_loss": -20.494428634643555, "global_step": 63498, "epoch": 765} {"train_loss": -20.122522354125977, "global_step": 63499, "epoch": 765} {"train_loss": -20.165369033813477, "global_step": 63500, "epoch": 765} {"train_loss": -20.192306518554688, "global_step": 63501, "epoch": 765} {"train_loss": -20.30497932434082, "global_step": 63502, "epoch": 765} {"train_loss": -20.35638999938965, "global_step": 63503, "epoch": 765} {"train_loss": -20.64186668395996, "global_step": 63504, "epoch": 765} {"train_loss": -20.46571159362793, "global_step": 63505, "epoch": 765} {"train_loss": -20.47771644592285, "global_step": 63506, "epoch": 765} {"train_loss": -20.131330490112305, "global_step": 63507, "epoch": 765} {"train_loss": -20.28392791748047, "global_step": 63508, "epoch": 765} {"train_loss": -20.82155418395996, "global_step": 63509, "epoch": 765} {"train_loss": -20.13040542602539, "global_step": 63510, "epoch": 765} {"train_loss": -20.204435348510742, "global_step": 63511, "epoch": 765} {"train_loss": -20.755584716796875, "global_step": 63512, "epoch": 765} {"train_loss": -20.360795974731445, "global_step": 63513, "epoch": 765} {"train_loss": -20.134767532348633, "global_step": 63514, "epoch": 765} {"train_loss": -20.13746452331543, "global_step": 63515, "epoch": 765} {"train_loss": -20.544679641723633, "global_step": 63516, "epoch": 765} {"train_loss": -20.194395065307617, "global_step": 63517, "epoch": 765} {"train_loss": -20.493240356445312, "global_step": 63518, "epoch": 765} {"train_loss": -20.7761287689209, "global_step": 63519, "epoch": 765} {"train_loss": -20.82405662536621, "global_step": 63520, "epoch": 765} {"train_loss": -20.653852462768555, "global_step": 63521, "epoch": 765} {"train_loss": -20.467992782592773, "global_step": 63522, "epoch": 765} {"train_loss": -20.33528709411621, "global_step": 63523, "epoch": 765} {"train_loss": -20.305070877075195, "global_step": 63524, "epoch": 765} {"train_loss": -20.507450103759766, "global_step": 63525, "epoch": 765} {"train_loss": -20.842077255249023, "global_step": 63526, "epoch": 765} {"train_loss": -20.82372283935547, "global_step": 63527, "epoch": 765} {"train_loss": -20.79205322265625, "global_step": 63528, "epoch": 765} {"train_loss": -20.703903198242188, "global_step": 63529, "epoch": 765} {"train_loss": -20.229869842529297, "global_step": 63530, "epoch": 765} {"train_loss": -20.560157775878906, "global_step": 63531, "epoch": 765} {"train_loss": -20.545812606811523, "global_step": 63532, "epoch": 765} {"train_loss": -20.719078063964844, "global_step": 63533, "epoch": 765} {"train_loss": -20.981517791748047, "global_step": 63534, "epoch": 765} {"train_loss": -20.89838981628418, "global_step": 63535, "epoch": 765} {"train_loss": -20.491708755493164, "global_step": 63536, "epoch": 765} {"train_loss": -20.617542266845703, "global_step": 63537, "epoch": 765} {"train_loss": -20.78902244567871, "global_step": 63538, "epoch": 765} {"train_loss": -20.755008697509766, "global_step": 63539, "epoch": 765} {"train_loss": -20.8741512298584, "global_step": 63540, "epoch": 765} {"train_loss": -20.488014221191406, "global_step": 63541, "epoch": 765} {"train_loss": -21.094472885131836, "global_step": 63542, "epoch": 765} {"train_loss": -20.713001251220703, "global_step": 63543, "epoch": 765} {"train_loss": -20.907917022705078, "global_step": 63544, "epoch": 765} {"train_loss": -20.231931686401367, "global_step": 63545, "epoch": 765} {"train_loss": -20.28460121154785, "global_step": 63546, "epoch": 765} {"train_loss": -20.919218063354492, "global_step": 63547, "epoch": 765} {"train_loss": -20.30908203125, "global_step": 63548, "epoch": 765} {"train_loss": -20.667448043823242, "global_step": 63549, "epoch": 765} {"train_loss": -20.510412216186523, "global_step": 63550, "epoch": 765} {"train_loss": -20.636886596679688, "global_step": 63551, "epoch": 765} {"train_loss": -20.86084747314453, "global_step": 63552, "epoch": 765} {"train_loss": -21.05773162841797, "global_step": 63553, "epoch": 765} {"train_loss": -20.651920318603516, "global_step": 63554, "epoch": 765} {"train_loss": -19.59004020690918, "global_step": 63555, "epoch": 765} {"train_loss": -20.271963119506836, "global_step": 63556, "epoch": 765} {"train_loss": -20.75130844116211, "global_step": 63557, "epoch": 765} {"train_loss": -20.572660446166992, "global_step": 63558, "epoch": 765} {"train_loss": -20.569448471069336, "global_step": 63559, "epoch": 765} {"train_loss": -20.581878662109375, "global_step": 63560, "epoch": 765} {"train_loss": -20.83814811706543, "global_step": 63561, "epoch": 765} {"train_loss": -20.66280174255371, "global_step": 63562, "epoch": 765} {"train_loss": -20.536457061767578, "global_step": 63563, "epoch": 765} {"train_loss": -20.374677658081055, "global_step": 63564, "epoch": 765} {"train_loss": -20.5259952545166, "global_step": 63565, "epoch": 765} {"train_loss": -20.517440795898438, "global_step": 63566, "epoch": 765} {"train_loss": -20.580228805541992, "global_step": 63567, "epoch": 765} {"train_loss": -20.67001724243164, "global_step": 63568, "epoch": 765} {"train_loss": -20.423480987548828, "global_step": 63569, "epoch": 765} {"train_loss": -20.9326114654541, "global_step": 63570, "epoch": 765} {"train_loss": -20.78328514099121, "global_step": 63571, "epoch": 765} {"train_loss": -19.925586700439453, "global_step": 63572, "epoch": 765} {"train_loss": -20.659744262695312, "global_step": 63573, "epoch": 765} {"train_loss": -20.706022262573242, "global_step": 63574, "epoch": 765} {"train_loss": -20.38614273071289, "global_step": 63575, "epoch": 765} {"train_loss": -20.32013702392578, "global_step": 63576, "epoch": 765} {"train_loss": -20.521449514182216, "global_step": 63577, "epoch": 765, "val_loss": 5917715.0} {"train_loss": -20.2593994140625, "global_step": 63578, "epoch": 766} {"train_loss": -19.89662742614746, "global_step": 63579, "epoch": 766} {"train_loss": -20.64317512512207, "global_step": 63580, "epoch": 766} {"train_loss": -20.06954002380371, "global_step": 63581, "epoch": 766} {"train_loss": -19.971776962280273, "global_step": 63582, "epoch": 766} {"train_loss": -20.347620010375977, "global_step": 63583, "epoch": 766} {"train_loss": -20.066505432128906, "global_step": 63584, "epoch": 766} {"train_loss": -20.163619995117188, "global_step": 63585, "epoch": 766} {"train_loss": -20.680768966674805, "global_step": 63586, "epoch": 766} {"train_loss": -20.197284698486328, "global_step": 63587, "epoch": 766} {"train_loss": -20.593862533569336, "global_step": 63588, "epoch": 766} {"train_loss": -20.503448486328125, "global_step": 63589, "epoch": 766} {"train_loss": -20.25571632385254, "global_step": 63590, "epoch": 766} {"train_loss": -20.56410026550293, "global_step": 63591, "epoch": 766} {"train_loss": -20.2650203704834, "global_step": 63592, "epoch": 766} {"train_loss": -20.675186157226562, "global_step": 63593, "epoch": 766} {"train_loss": -20.15852165222168, "global_step": 63594, "epoch": 766} {"train_loss": -20.431344985961914, "global_step": 63595, "epoch": 766} {"train_loss": -20.504425048828125, "global_step": 63596, "epoch": 766} {"train_loss": -20.719213485717773, "global_step": 63597, "epoch": 766} {"train_loss": -20.30944061279297, "global_step": 63598, "epoch": 766} {"train_loss": -20.191192626953125, "global_step": 63599, "epoch": 766} {"train_loss": -20.598997116088867, "global_step": 63600, "epoch": 766} {"train_loss": -20.71120262145996, "global_step": 63601, "epoch": 766} {"train_loss": -20.80126190185547, "global_step": 63602, "epoch": 766} {"train_loss": -20.689481735229492, "global_step": 63603, "epoch": 766} {"train_loss": -20.63330841064453, "global_step": 63604, "epoch": 766} {"train_loss": -20.901386260986328, "global_step": 63605, "epoch": 766} {"train_loss": -20.912582397460938, "global_step": 63606, "epoch": 766} {"train_loss": -20.297224044799805, "global_step": 63607, "epoch": 766} {"train_loss": -20.47010612487793, "global_step": 63608, "epoch": 766} {"train_loss": -20.444997787475586, "global_step": 63609, "epoch": 766} {"train_loss": -20.613515853881836, "global_step": 63610, "epoch": 766} {"train_loss": -20.613962173461914, "global_step": 63611, "epoch": 766} {"train_loss": -20.417133331298828, "global_step": 63612, "epoch": 766} {"train_loss": -20.37226676940918, "global_step": 63613, "epoch": 766} {"train_loss": -20.781320571899414, "global_step": 63614, "epoch": 766} {"train_loss": -20.460590362548828, "global_step": 63615, "epoch": 766} {"train_loss": -20.693599700927734, "global_step": 63616, "epoch": 766} {"train_loss": -20.52024269104004, "global_step": 63617, "epoch": 766} {"train_loss": -20.529752731323242, "global_step": 63618, "epoch": 766} {"train_loss": -20.66310691833496, "global_step": 63619, "epoch": 766} {"train_loss": -20.50316047668457, "global_step": 63620, "epoch": 766} {"train_loss": -20.69808006286621, "global_step": 63621, "epoch": 766} {"train_loss": -20.70895767211914, "global_step": 63622, "epoch": 766} {"train_loss": -20.630868911743164, "global_step": 63623, "epoch": 766} {"train_loss": -20.743732452392578, "global_step": 63624, "epoch": 766} {"train_loss": -20.84859275817871, "global_step": 63625, "epoch": 766} {"train_loss": -20.542724609375, "global_step": 63626, "epoch": 766} {"train_loss": -20.467844009399414, "global_step": 63627, "epoch": 766} {"train_loss": -20.659040451049805, "global_step": 63628, "epoch": 766} {"train_loss": -20.54157066345215, "global_step": 63629, "epoch": 766} {"train_loss": -20.465545654296875, "global_step": 63630, "epoch": 766} {"train_loss": -20.856611251831055, "global_step": 63631, "epoch": 766} {"train_loss": -20.403499603271484, "global_step": 63632, "epoch": 766} {"train_loss": -20.641843795776367, "global_step": 63633, "epoch": 766} {"train_loss": -20.519575119018555, "global_step": 63634, "epoch": 766} {"train_loss": -20.554594039916992, "global_step": 63635, "epoch": 766} {"train_loss": -20.891082763671875, "global_step": 63636, "epoch": 766} {"train_loss": -20.43828773498535, "global_step": 63637, "epoch": 766} {"train_loss": -20.85646629333496, "global_step": 63638, "epoch": 766} {"train_loss": -20.730918884277344, "global_step": 63639, "epoch": 766} {"train_loss": -20.761377334594727, "global_step": 63640, "epoch": 766} {"train_loss": -20.616683959960938, "global_step": 63641, "epoch": 766} {"train_loss": -20.80243492126465, "global_step": 63642, "epoch": 766} {"train_loss": -20.613264083862305, "global_step": 63643, "epoch": 766} {"train_loss": -20.724735260009766, "global_step": 63644, "epoch": 766} {"train_loss": -20.263517379760742, "global_step": 63645, "epoch": 766} {"train_loss": -20.775310516357422, "global_step": 63646, "epoch": 766} {"train_loss": -20.787662506103516, "global_step": 63647, "epoch": 766} {"train_loss": -20.64267921447754, "global_step": 63648, "epoch": 766} {"train_loss": -20.7171688079834, "global_step": 63649, "epoch": 766} {"train_loss": -20.31850242614746, "global_step": 63650, "epoch": 766} {"train_loss": -20.542333602905273, "global_step": 63651, "epoch": 766} {"train_loss": -20.661497116088867, "global_step": 63652, "epoch": 766} {"train_loss": -20.257247924804688, "global_step": 63653, "epoch": 766} {"train_loss": -20.593143463134766, "global_step": 63654, "epoch": 766} {"train_loss": -20.65705108642578, "global_step": 63655, "epoch": 766} {"train_loss": -20.742429733276367, "global_step": 63656, "epoch": 766} {"train_loss": -20.53993034362793, "global_step": 63657, "epoch": 766} {"train_loss": -20.6553955078125, "global_step": 63658, "epoch": 766} {"train_loss": -20.753530502319336, "global_step": 63659, "epoch": 766} {"train_loss": -20.551615427775555, "global_step": 63660, "epoch": 766, "val_loss": 5962977.0} {"train_loss": -19.880836486816406, "global_step": 63661, "epoch": 767} {"train_loss": -19.890661239624023, "global_step": 63662, "epoch": 767} {"train_loss": -20.66852378845215, "global_step": 63663, "epoch": 767} {"train_loss": -20.461511611938477, "global_step": 63664, "epoch": 767} {"train_loss": -20.326948165893555, "global_step": 63665, "epoch": 767} {"train_loss": -20.42946434020996, "global_step": 63666, "epoch": 767} {"train_loss": -20.711444854736328, "global_step": 63667, "epoch": 767} {"train_loss": -20.13502311706543, "global_step": 63668, "epoch": 767} {"train_loss": -20.207181930541992, "global_step": 63669, "epoch": 767} {"train_loss": -20.13716697692871, "global_step": 63670, "epoch": 767} {"train_loss": -20.344181060791016, "global_step": 63671, "epoch": 767} {"train_loss": -20.29457664489746, "global_step": 63672, "epoch": 767} {"train_loss": -20.261632919311523, "global_step": 63673, "epoch": 767} {"train_loss": -20.29330062866211, "global_step": 63674, "epoch": 767} {"train_loss": -19.995323181152344, "global_step": 63675, "epoch": 767} {"train_loss": -19.98381996154785, "global_step": 63676, "epoch": 767} {"train_loss": -20.73445701599121, "global_step": 63677, "epoch": 767} {"train_loss": -20.357187271118164, "global_step": 63678, "epoch": 767} {"train_loss": -20.29867935180664, "global_step": 63679, "epoch": 767} {"train_loss": -20.144933700561523, "global_step": 63680, "epoch": 767} {"train_loss": -20.81903648376465, "global_step": 63681, "epoch": 767} {"train_loss": -20.72096824645996, "global_step": 63682, "epoch": 767} {"train_loss": -20.621545791625977, "global_step": 63683, "epoch": 767} {"train_loss": -20.567474365234375, "global_step": 63684, "epoch": 767} {"train_loss": -20.876001358032227, "global_step": 63685, "epoch": 767} {"train_loss": -20.67568016052246, "global_step": 63686, "epoch": 767} {"train_loss": -20.31466293334961, "global_step": 63687, "epoch": 767} {"train_loss": -20.226985931396484, "global_step": 63688, "epoch": 767} {"train_loss": -20.708282470703125, "global_step": 63689, "epoch": 767} {"train_loss": -20.508852005004883, "global_step": 63690, "epoch": 767} {"train_loss": -20.360301971435547, "global_step": 63691, "epoch": 767} {"train_loss": -20.661767959594727, "global_step": 63692, "epoch": 767} {"train_loss": -20.398365020751953, "global_step": 63693, "epoch": 767} {"train_loss": -20.888723373413086, "global_step": 63694, "epoch": 767} {"train_loss": -21.028921127319336, "global_step": 63695, "epoch": 767} {"train_loss": -20.8001766204834, "global_step": 63696, "epoch": 767} {"train_loss": -20.574899673461914, "global_step": 63697, "epoch": 767} {"train_loss": -20.592716217041016, "global_step": 63698, "epoch": 767} {"train_loss": -20.514577865600586, "global_step": 63699, "epoch": 767} {"train_loss": -20.514074325561523, "global_step": 63700, "epoch": 767} {"train_loss": -20.50861167907715, "global_step": 63701, "epoch": 767} {"train_loss": -20.98849868774414, "global_step": 63702, "epoch": 767} {"train_loss": -20.889432907104492, "global_step": 63703, "epoch": 767} {"train_loss": -20.517377853393555, "global_step": 63704, "epoch": 767} {"train_loss": -20.48899269104004, "global_step": 63705, "epoch": 767} {"train_loss": -20.654489517211914, "global_step": 63706, "epoch": 767} {"train_loss": -20.3702335357666, "global_step": 63707, "epoch": 767} {"train_loss": -20.557201385498047, "global_step": 63708, "epoch": 767} {"train_loss": -20.569622039794922, "global_step": 63709, "epoch": 767} {"train_loss": -20.48607635498047, "global_step": 63710, "epoch": 767} {"train_loss": -20.7912654876709, "global_step": 63711, "epoch": 767} {"train_loss": -20.730600357055664, "global_step": 63712, "epoch": 767} {"train_loss": -20.540494918823242, "global_step": 63713, "epoch": 767} {"train_loss": -20.318490982055664, "global_step": 63714, "epoch": 767} {"train_loss": -20.514680862426758, "global_step": 63715, "epoch": 767} {"train_loss": -20.37381362915039, "global_step": 63716, "epoch": 767} {"train_loss": -20.094396591186523, "global_step": 63717, "epoch": 767} {"train_loss": -20.382490158081055, "global_step": 63718, "epoch": 767} {"train_loss": -20.48818016052246, "global_step": 63719, "epoch": 767} {"train_loss": -20.511905670166016, "global_step": 63720, "epoch": 767} {"train_loss": -20.453208923339844, "global_step": 63721, "epoch": 767} {"train_loss": -20.6124267578125, "global_step": 63722, "epoch": 767} {"train_loss": -20.411273956298828, "global_step": 63723, "epoch": 767} {"train_loss": -20.560089111328125, "global_step": 63724, "epoch": 767} {"train_loss": -20.882537841796875, "global_step": 63725, "epoch": 767} {"train_loss": -20.595470428466797, "global_step": 63726, "epoch": 767} {"train_loss": -20.76643180847168, "global_step": 63727, "epoch": 767} {"train_loss": -20.355993270874023, "global_step": 63728, "epoch": 767} {"train_loss": -20.825895309448242, "global_step": 63729, "epoch": 767} {"train_loss": -20.661151885986328, "global_step": 63730, "epoch": 767} {"train_loss": -20.36846351623535, "global_step": 63731, "epoch": 767} {"train_loss": -20.602109909057617, "global_step": 63732, "epoch": 767} {"train_loss": -20.555091857910156, "global_step": 63733, "epoch": 767} {"train_loss": -20.581594467163086, "global_step": 63734, "epoch": 767} {"train_loss": -20.502126693725586, "global_step": 63735, "epoch": 767} {"train_loss": -20.88385009765625, "global_step": 63736, "epoch": 767} {"train_loss": -20.427188873291016, "global_step": 63737, "epoch": 767} {"train_loss": -20.639724731445312, "global_step": 63738, "epoch": 767} {"train_loss": -20.311691284179688, "global_step": 63739, "epoch": 767} {"train_loss": -20.631988525390625, "global_step": 63740, "epoch": 767} {"train_loss": -20.381837844848633, "global_step": 63741, "epoch": 767} {"train_loss": -20.35076904296875, "global_step": 63742, "epoch": 767} {"train_loss": -20.499833463186242, "global_step": 63743, "epoch": 767, "val_loss": 5990954.0} {"train_loss": -19.8834171295166, "global_step": 63744, "epoch": 768} {"train_loss": -20.62794303894043, "global_step": 63745, "epoch": 768} {"train_loss": -19.792591094970703, "global_step": 63746, "epoch": 768} {"train_loss": -20.28145408630371, "global_step": 63747, "epoch": 768} {"train_loss": -20.266023635864258, "global_step": 63748, "epoch": 768} {"train_loss": -20.43997573852539, "global_step": 63749, "epoch": 768} {"train_loss": -20.258060455322266, "global_step": 63750, "epoch": 768} {"train_loss": -20.276290893554688, "global_step": 63751, "epoch": 768} {"train_loss": -20.561948776245117, "global_step": 63752, "epoch": 768} {"train_loss": -20.365095138549805, "global_step": 63753, "epoch": 768} {"train_loss": -20.58269691467285, "global_step": 63754, "epoch": 768} {"train_loss": -20.569379806518555, "global_step": 63755, "epoch": 768} {"train_loss": -20.600183486938477, "global_step": 63756, "epoch": 768} {"train_loss": -20.498706817626953, "global_step": 63757, "epoch": 768} {"train_loss": -20.73650550842285, "global_step": 63758, "epoch": 768} {"train_loss": -20.34988784790039, "global_step": 63759, "epoch": 768} {"train_loss": -20.524730682373047, "global_step": 63760, "epoch": 768} {"train_loss": -20.74612808227539, "global_step": 63761, "epoch": 768} {"train_loss": -20.11858367919922, "global_step": 63762, "epoch": 768} {"train_loss": -20.331602096557617, "global_step": 63763, "epoch": 768} {"train_loss": -20.26540184020996, "global_step": 63764, "epoch": 768} {"train_loss": -20.537038803100586, "global_step": 63765, "epoch": 768} {"train_loss": -20.297176361083984, "global_step": 63766, "epoch": 768} {"train_loss": -20.42822265625, "global_step": 63767, "epoch": 768} {"train_loss": -20.657337188720703, "global_step": 63768, "epoch": 768} {"train_loss": -20.3595027923584, "global_step": 63769, "epoch": 768} {"train_loss": -20.283884048461914, "global_step": 63770, "epoch": 768} {"train_loss": -20.683568954467773, "global_step": 63771, "epoch": 768} {"train_loss": -20.34949493408203, "global_step": 63772, "epoch": 768} {"train_loss": -20.40865135192871, "global_step": 63773, "epoch": 768} {"train_loss": -20.598981857299805, "global_step": 63774, "epoch": 768} {"train_loss": -20.542282104492188, "global_step": 63775, "epoch": 768} {"train_loss": -20.6279354095459, "global_step": 63776, "epoch": 768} {"train_loss": -20.394725799560547, "global_step": 63777, "epoch": 768} {"train_loss": -20.709842681884766, "global_step": 63778, "epoch": 768} {"train_loss": -20.415037155151367, "global_step": 63779, "epoch": 768} {"train_loss": -20.520675659179688, "global_step": 63780, "epoch": 768} {"train_loss": -20.41933250427246, "global_step": 63781, "epoch": 768} {"train_loss": -20.326887130737305, "global_step": 63782, "epoch": 768} {"train_loss": -20.714242935180664, "global_step": 63783, "epoch": 768} {"train_loss": -20.36317253112793, "global_step": 63784, "epoch": 768} {"train_loss": -20.372114181518555, "global_step": 63785, "epoch": 768} {"train_loss": -20.62417221069336, "global_step": 63786, "epoch": 768} {"train_loss": -20.661481857299805, "global_step": 63787, "epoch": 768} {"train_loss": -20.860788345336914, "global_step": 63788, "epoch": 768} {"train_loss": -20.927566528320312, "global_step": 63789, "epoch": 768} {"train_loss": -20.797073364257812, "global_step": 63790, "epoch": 768} {"train_loss": -20.585025787353516, "global_step": 63791, "epoch": 768} {"train_loss": -20.758663177490234, "global_step": 63792, "epoch": 768} {"train_loss": -20.530057907104492, "global_step": 63793, "epoch": 768} {"train_loss": -20.52887535095215, "global_step": 63794, "epoch": 768} {"train_loss": -20.475418090820312, "global_step": 63795, "epoch": 768} {"train_loss": -20.097564697265625, "global_step": 63796, "epoch": 768} {"train_loss": -20.14620018005371, "global_step": 63797, "epoch": 768} {"train_loss": -20.46073341369629, "global_step": 63798, "epoch": 768} {"train_loss": -20.420669555664062, "global_step": 63799, "epoch": 768} {"train_loss": -20.876684188842773, "global_step": 63800, "epoch": 768} {"train_loss": -20.868667602539062, "global_step": 63801, "epoch": 768} {"train_loss": -20.671762466430664, "global_step": 63802, "epoch": 768} {"train_loss": -20.629209518432617, "global_step": 63803, "epoch": 768} {"train_loss": -20.408912658691406, "global_step": 63804, "epoch": 768} {"train_loss": -20.800626754760742, "global_step": 63805, "epoch": 768} {"train_loss": -20.3807373046875, "global_step": 63806, "epoch": 768} {"train_loss": -20.637304306030273, "global_step": 63807, "epoch": 768} {"train_loss": -20.154529571533203, "global_step": 63808, "epoch": 768} {"train_loss": -20.689090728759766, "global_step": 63809, "epoch": 768} {"train_loss": -21.0856876373291, "global_step": 63810, "epoch": 768} {"train_loss": -20.617904663085938, "global_step": 63811, "epoch": 768} {"train_loss": -20.529321670532227, "global_step": 63812, "epoch": 768} {"train_loss": -20.740629196166992, "global_step": 63813, "epoch": 768} {"train_loss": -20.216772079467773, "global_step": 63814, "epoch": 768} {"train_loss": -20.52509880065918, "global_step": 63815, "epoch": 768} {"train_loss": -20.8271427154541, "global_step": 63816, "epoch": 768} {"train_loss": -21.028905868530273, "global_step": 63817, "epoch": 768} {"train_loss": -20.3507022857666, "global_step": 63818, "epoch": 768} {"train_loss": -20.219213485717773, "global_step": 63819, "epoch": 768} {"train_loss": -20.862478256225586, "global_step": 63820, "epoch": 768} {"train_loss": -20.199575424194336, "global_step": 63821, "epoch": 768} {"train_loss": -20.4626407623291, "global_step": 63822, "epoch": 768} {"train_loss": -20.640268325805664, "global_step": 63823, "epoch": 768} {"train_loss": -20.479541778564453, "global_step": 63824, "epoch": 768} {"train_loss": -20.731754302978516, "global_step": 63825, "epoch": 768} {"train_loss": -20.49631789793451, "global_step": 63826, "epoch": 768, "val_loss": 5911038.5} {"train_loss": -20.180023193359375, "global_step": 63827, "epoch": 769} {"train_loss": -20.608118057250977, "global_step": 63828, "epoch": 769} {"train_loss": -19.889936447143555, "global_step": 63829, "epoch": 769} {"train_loss": -19.928802490234375, "global_step": 63830, "epoch": 769} {"train_loss": -20.488088607788086, "global_step": 63831, "epoch": 769} {"train_loss": -19.967191696166992, "global_step": 63832, "epoch": 769} {"train_loss": -20.348474502563477, "global_step": 63833, "epoch": 769} {"train_loss": -19.79159927368164, "global_step": 63834, "epoch": 769} {"train_loss": -20.28843879699707, "global_step": 63835, "epoch": 769} {"train_loss": -20.680322647094727, "global_step": 63836, "epoch": 769} {"train_loss": -20.184606552124023, "global_step": 63837, "epoch": 769} {"train_loss": -20.51041030883789, "global_step": 63838, "epoch": 769} {"train_loss": -20.42033576965332, "global_step": 63839, "epoch": 769} {"train_loss": -20.727310180664062, "global_step": 63840, "epoch": 769} {"train_loss": -20.184078216552734, "global_step": 63841, "epoch": 769} {"train_loss": -20.53989028930664, "global_step": 63842, "epoch": 769} {"train_loss": -20.666366577148438, "global_step": 63843, "epoch": 769} {"train_loss": -20.551204681396484, "global_step": 63844, "epoch": 769} {"train_loss": -20.398130416870117, "global_step": 63845, "epoch": 769} {"train_loss": -20.20660400390625, "global_step": 63846, "epoch": 769} {"train_loss": -20.525434494018555, "global_step": 63847, "epoch": 769} {"train_loss": -20.100677490234375, "global_step": 63848, "epoch": 769} {"train_loss": -20.512939453125, "global_step": 63849, "epoch": 769} {"train_loss": -20.1518611907959, "global_step": 63850, "epoch": 769} {"train_loss": -20.213119506835938, "global_step": 63851, "epoch": 769} {"train_loss": -20.501880645751953, "global_step": 63852, "epoch": 769} {"train_loss": -20.746984481811523, "global_step": 63853, "epoch": 769} {"train_loss": -20.395090103149414, "global_step": 63854, "epoch": 769} {"train_loss": -20.31477165222168, "global_step": 63855, "epoch": 769} {"train_loss": -20.40328025817871, "global_step": 63856, "epoch": 769} {"train_loss": -20.619951248168945, "global_step": 63857, "epoch": 769} {"train_loss": -20.805809020996094, "global_step": 63858, "epoch": 769} {"train_loss": -20.752466201782227, "global_step": 63859, "epoch": 769} {"train_loss": -20.692861557006836, "global_step": 63860, "epoch": 769} {"train_loss": -20.42072868347168, "global_step": 63861, "epoch": 769} {"train_loss": -20.50892448425293, "global_step": 63862, "epoch": 769} {"train_loss": -20.372417449951172, "global_step": 63863, "epoch": 769} {"train_loss": -20.627798080444336, "global_step": 63864, "epoch": 769} {"train_loss": -20.72972297668457, "global_step": 63865, "epoch": 769} {"train_loss": -20.67241668701172, "global_step": 63866, "epoch": 769} {"train_loss": -20.15296745300293, "global_step": 63867, "epoch": 769} {"train_loss": -20.55607795715332, "global_step": 63868, "epoch": 769} {"train_loss": -20.645099639892578, "global_step": 63869, "epoch": 769} {"train_loss": -20.539485931396484, "global_step": 63870, "epoch": 769} {"train_loss": -20.71647071838379, "global_step": 63871, "epoch": 769} {"train_loss": -20.741392135620117, "global_step": 63872, "epoch": 769} {"train_loss": -20.723926544189453, "global_step": 63873, "epoch": 769} {"train_loss": -20.490005493164062, "global_step": 63874, "epoch": 769} {"train_loss": -20.452726364135742, "global_step": 63875, "epoch": 769} {"train_loss": -20.566707611083984, "global_step": 63876, "epoch": 769} {"train_loss": -20.515151977539062, "global_step": 63877, "epoch": 769} {"train_loss": -20.83989906311035, "global_step": 63878, "epoch": 769} {"train_loss": -20.487934112548828, "global_step": 63879, "epoch": 769} {"train_loss": -20.37007713317871, "global_step": 63880, "epoch": 769} {"train_loss": -20.278772354125977, "global_step": 63881, "epoch": 769} {"train_loss": -20.453205108642578, "global_step": 63882, "epoch": 769} {"train_loss": -20.396738052368164, "global_step": 63883, "epoch": 769} {"train_loss": -20.638654708862305, "global_step": 63884, "epoch": 769} {"train_loss": -20.29279136657715, "global_step": 63885, "epoch": 769} {"train_loss": -20.652257919311523, "global_step": 63886, "epoch": 769} {"train_loss": -20.46712875366211, "global_step": 63887, "epoch": 769} {"train_loss": -20.339481353759766, "global_step": 63888, "epoch": 769} {"train_loss": -20.86128807067871, "global_step": 63889, "epoch": 769} {"train_loss": -20.485807418823242, "global_step": 63890, "epoch": 769} {"train_loss": -20.683034896850586, "global_step": 63891, "epoch": 769} {"train_loss": -20.898895263671875, "global_step": 63892, "epoch": 769} {"train_loss": -20.517057418823242, "global_step": 63893, "epoch": 769} {"train_loss": -20.70652198791504, "global_step": 63894, "epoch": 769} {"train_loss": -20.474151611328125, "global_step": 63895, "epoch": 769} {"train_loss": -20.576248168945312, "global_step": 63896, "epoch": 769} {"train_loss": -20.23368263244629, "global_step": 63897, "epoch": 769} {"train_loss": -20.663808822631836, "global_step": 63898, "epoch": 769} {"train_loss": -20.55290985107422, "global_step": 63899, "epoch": 769} {"train_loss": -20.565725326538086, "global_step": 63900, "epoch": 769} {"train_loss": -20.49394989013672, "global_step": 63901, "epoch": 769} {"train_loss": -20.505964279174805, "global_step": 63902, "epoch": 769} {"train_loss": -20.458158493041992, "global_step": 63903, "epoch": 769} {"train_loss": -20.6140079498291, "global_step": 63904, "epoch": 769} {"train_loss": -20.207294464111328, "global_step": 63905, "epoch": 769} {"train_loss": -20.43722152709961, "global_step": 63906, "epoch": 769} {"train_loss": -20.47784996032715, "global_step": 63907, "epoch": 769} {"train_loss": -20.210067749023438, "global_step": 63908, "epoch": 769} {"train_loss": -20.476487722741552, "global_step": 63909, "epoch": 769, "val_loss": 5969231.0} {"train_loss": -19.975309371948242, "global_step": 63910, "epoch": 770} {"train_loss": -20.38661003112793, "global_step": 63911, "epoch": 770} {"train_loss": -20.600141525268555, "global_step": 63912, "epoch": 770} {"train_loss": -20.21833610534668, "global_step": 63913, "epoch": 770} {"train_loss": -20.78580665588379, "global_step": 63914, "epoch": 770} {"train_loss": -20.419681549072266, "global_step": 63915, "epoch": 770} {"train_loss": -20.639690399169922, "global_step": 63916, "epoch": 770} {"train_loss": -20.139646530151367, "global_step": 63917, "epoch": 770} {"train_loss": -20.338485717773438, "global_step": 63918, "epoch": 770} {"train_loss": -20.847707748413086, "global_step": 63919, "epoch": 770} {"train_loss": -20.47305679321289, "global_step": 63920, "epoch": 770} {"train_loss": -20.464147567749023, "global_step": 63921, "epoch": 770} {"train_loss": -20.59889793395996, "global_step": 63922, "epoch": 770} {"train_loss": -20.552608489990234, "global_step": 63923, "epoch": 770} {"train_loss": -20.402956008911133, "global_step": 63924, "epoch": 770} {"train_loss": -20.468732833862305, "global_step": 63925, "epoch": 770} {"train_loss": -20.574464797973633, "global_step": 63926, "epoch": 770} {"train_loss": -20.3942813873291, "global_step": 63927, "epoch": 770} {"train_loss": -20.59663963317871, "global_step": 63928, "epoch": 770} {"train_loss": -20.211875915527344, "global_step": 63929, "epoch": 770} {"train_loss": -20.389081954956055, "global_step": 63930, "epoch": 770} {"train_loss": -20.36396598815918, "global_step": 63931, "epoch": 770} {"train_loss": -20.449369430541992, "global_step": 63932, "epoch": 770} {"train_loss": -20.44024658203125, "global_step": 63933, "epoch": 770} {"train_loss": -20.36021614074707, "global_step": 63934, "epoch": 770} {"train_loss": -20.761577606201172, "global_step": 63935, "epoch": 770} {"train_loss": -20.36444664001465, "global_step": 63936, "epoch": 770} {"train_loss": -20.638822555541992, "global_step": 63937, "epoch": 770} {"train_loss": -20.31137466430664, "global_step": 63938, "epoch": 770} {"train_loss": -20.546728134155273, "global_step": 63939, "epoch": 770} {"train_loss": -20.68598747253418, "global_step": 63940, "epoch": 770} {"train_loss": -20.461339950561523, "global_step": 63941, "epoch": 770} {"train_loss": -20.577138900756836, "global_step": 63942, "epoch": 770} {"train_loss": -20.618268966674805, "global_step": 63943, "epoch": 770} {"train_loss": -20.72434425354004, "global_step": 63944, "epoch": 770} {"train_loss": -20.42579460144043, "global_step": 63945, "epoch": 770} {"train_loss": -20.37970542907715, "global_step": 63946, "epoch": 770} {"train_loss": -20.595739364624023, "global_step": 63947, "epoch": 770} {"train_loss": -20.94548988342285, "global_step": 63948, "epoch": 770} {"train_loss": -20.6983585357666, "global_step": 63949, "epoch": 770} {"train_loss": -21.01624870300293, "global_step": 63950, "epoch": 770} {"train_loss": -20.380952835083008, "global_step": 63951, "epoch": 770} {"train_loss": -20.88983726501465, "global_step": 63952, "epoch": 770} {"train_loss": -20.56519889831543, "global_step": 63953, "epoch": 770} {"train_loss": -20.39142417907715, "global_step": 63954, "epoch": 770} {"train_loss": -20.25490951538086, "global_step": 63955, "epoch": 770} {"train_loss": -20.74775505065918, "global_step": 63956, "epoch": 770} {"train_loss": -20.743942260742188, "global_step": 63957, "epoch": 770} {"train_loss": -20.57419204711914, "global_step": 63958, "epoch": 770} {"train_loss": -20.793668746948242, "global_step": 63959, "epoch": 770} {"train_loss": -20.5430850982666, "global_step": 63960, "epoch": 770} {"train_loss": -20.50661277770996, "global_step": 63961, "epoch": 770} {"train_loss": -20.907644271850586, "global_step": 63962, "epoch": 770} {"train_loss": -20.365083694458008, "global_step": 63963, "epoch": 770} {"train_loss": -20.906265258789062, "global_step": 63964, "epoch": 770} {"train_loss": -20.42949867248535, "global_step": 63965, "epoch": 770} {"train_loss": -20.660268783569336, "global_step": 63966, "epoch": 770} {"train_loss": -20.57683753967285, "global_step": 63967, "epoch": 770} {"train_loss": -20.595285415649414, "global_step": 63968, "epoch": 770} {"train_loss": -20.827707290649414, "global_step": 63969, "epoch": 770} {"train_loss": -20.22990608215332, "global_step": 63970, "epoch": 770} {"train_loss": -21.070280075073242, "global_step": 63971, "epoch": 770} {"train_loss": -20.450363159179688, "global_step": 63972, "epoch": 770} {"train_loss": -20.343616485595703, "global_step": 63973, "epoch": 770} {"train_loss": -20.523557662963867, "global_step": 63974, "epoch": 770} {"train_loss": -20.457475662231445, "global_step": 63975, "epoch": 770} {"train_loss": -20.92474937438965, "global_step": 63976, "epoch": 770} {"train_loss": -20.652755737304688, "global_step": 63977, "epoch": 770} {"train_loss": -20.298633575439453, "global_step": 63978, "epoch": 770} {"train_loss": -20.640939712524414, "global_step": 63979, "epoch": 770} {"train_loss": -20.49525260925293, "global_step": 63980, "epoch": 770} {"train_loss": -20.72372817993164, "global_step": 63981, "epoch": 770} {"train_loss": -20.79119110107422, "global_step": 63982, "epoch": 770} {"train_loss": -20.6481990814209, "global_step": 63983, "epoch": 770} {"train_loss": -20.491411209106445, "global_step": 63984, "epoch": 770} {"train_loss": -20.53134536743164, "global_step": 63985, "epoch": 770} {"train_loss": -20.584060668945312, "global_step": 63986, "epoch": 770} {"train_loss": -20.852767944335938, "global_step": 63987, "epoch": 770} {"train_loss": -20.75057601928711, "global_step": 63988, "epoch": 770} {"train_loss": -20.481609344482422, "global_step": 63989, "epoch": 770} {"train_loss": -20.80315399169922, "global_step": 63990, "epoch": 770} {"train_loss": -20.472402572631836, "global_step": 63991, "epoch": 770} {"train_loss": -20.546454946678804, "global_step": 63992, "epoch": 770, "val_loss": 5945377.0} {"train_loss": -20.411455154418945, "global_step": 63993, "epoch": 771} {"train_loss": -20.455493927001953, "global_step": 63994, "epoch": 771} {"train_loss": -20.16071128845215, "global_step": 63995, "epoch": 771} {"train_loss": -20.328718185424805, "global_step": 63996, "epoch": 771} {"train_loss": -20.296279907226562, "global_step": 63997, "epoch": 771} {"train_loss": -20.540491104125977, "global_step": 63998, "epoch": 771} {"train_loss": -20.22351837158203, "global_step": 63999, "epoch": 771} {"train_loss": -20.81178855895996, "global_step": 64000, "epoch": 771} {"train_loss": -20.22170066833496, "global_step": 64001, "epoch": 771} {"train_loss": -20.415693283081055, "global_step": 64002, "epoch": 771} {"train_loss": -20.132463455200195, "global_step": 64003, "epoch": 771} {"train_loss": -20.455671310424805, "global_step": 64004, "epoch": 771} {"train_loss": -20.415250778198242, "global_step": 64005, "epoch": 771} {"train_loss": -20.66928482055664, "global_step": 64006, "epoch": 771} {"train_loss": -20.301233291625977, "global_step": 64007, "epoch": 771} {"train_loss": -20.580463409423828, "global_step": 64008, "epoch": 771} {"train_loss": -20.473907470703125, "global_step": 64009, "epoch": 771} {"train_loss": -20.321563720703125, "global_step": 64010, "epoch": 771} {"train_loss": -20.763830184936523, "global_step": 64011, "epoch": 771} {"train_loss": -20.180479049682617, "global_step": 64012, "epoch": 771} {"train_loss": -20.702634811401367, "global_step": 64013, "epoch": 771} {"train_loss": -20.799543380737305, "global_step": 64014, "epoch": 771} {"train_loss": -20.459012985229492, "global_step": 64015, "epoch": 771} {"train_loss": -20.825056076049805, "global_step": 64016, "epoch": 771} {"train_loss": -20.813465118408203, "global_step": 64017, "epoch": 771} {"train_loss": -20.57277488708496, "global_step": 64018, "epoch": 771} {"train_loss": -20.337677001953125, "global_step": 64019, "epoch": 771} {"train_loss": -20.427799224853516, "global_step": 64020, "epoch": 771} {"train_loss": -20.400684356689453, "global_step": 64021, "epoch": 771} {"train_loss": -20.568029403686523, "global_step": 64022, "epoch": 771} {"train_loss": -20.590024948120117, "global_step": 64023, "epoch": 771} {"train_loss": -20.52806854248047, "global_step": 64024, "epoch": 771} {"train_loss": -20.431299209594727, "global_step": 64025, "epoch": 771} {"train_loss": -20.931859970092773, "global_step": 64026, "epoch": 771} {"train_loss": -20.48517417907715, "global_step": 64027, "epoch": 771} {"train_loss": -20.363842010498047, "global_step": 64028, "epoch": 771} {"train_loss": -20.670654296875, "global_step": 64029, "epoch": 771} {"train_loss": -20.583120346069336, "global_step": 64030, "epoch": 771} {"train_loss": -20.703227996826172, "global_step": 64031, "epoch": 771} {"train_loss": -20.48541259765625, "global_step": 64032, "epoch": 771} {"train_loss": -20.500499725341797, "global_step": 64033, "epoch": 771} {"train_loss": -20.96112632751465, "global_step": 64034, "epoch": 771} {"train_loss": -20.685951232910156, "global_step": 64035, "epoch": 771} {"train_loss": -20.77248764038086, "global_step": 64036, "epoch": 771} {"train_loss": -20.593547821044922, "global_step": 64037, "epoch": 771} {"train_loss": -20.32598304748535, "global_step": 64038, "epoch": 771} {"train_loss": -20.57710838317871, "global_step": 64039, "epoch": 771} {"train_loss": -20.198335647583008, "global_step": 64040, "epoch": 771} {"train_loss": -20.51834487915039, "global_step": 64041, "epoch": 771} {"train_loss": -20.479366302490234, "global_step": 64042, "epoch": 771} {"train_loss": -20.52467155456543, "global_step": 64043, "epoch": 771} {"train_loss": -20.74928092956543, "global_step": 64044, "epoch": 771} {"train_loss": -20.354087829589844, "global_step": 64045, "epoch": 771} {"train_loss": -20.513425827026367, "global_step": 64046, "epoch": 771} {"train_loss": -20.5277156829834, "global_step": 64047, "epoch": 771} {"train_loss": -20.830570220947266, "global_step": 64048, "epoch": 771} {"train_loss": -20.847911834716797, "global_step": 64049, "epoch": 771} {"train_loss": -20.297428131103516, "global_step": 64050, "epoch": 771} {"train_loss": -20.550142288208008, "global_step": 64051, "epoch": 771} {"train_loss": -20.818418502807617, "global_step": 64052, "epoch": 771} {"train_loss": -20.39649200439453, "global_step": 64053, "epoch": 771} {"train_loss": -20.62349510192871, "global_step": 64054, "epoch": 771} {"train_loss": -21.174894332885742, "global_step": 64055, "epoch": 771} {"train_loss": -20.53466796875, "global_step": 64056, "epoch": 771} {"train_loss": -20.317790985107422, "global_step": 64057, "epoch": 771} {"train_loss": -20.63608169555664, "global_step": 64058, "epoch": 771} {"train_loss": -20.780643463134766, "global_step": 64059, "epoch": 771} {"train_loss": -20.759185791015625, "global_step": 64060, "epoch": 771} {"train_loss": -20.381732940673828, "global_step": 64061, "epoch": 771} {"train_loss": -20.69160270690918, "global_step": 64062, "epoch": 771} {"train_loss": -20.290342330932617, "global_step": 64063, "epoch": 771} {"train_loss": -20.95303726196289, "global_step": 64064, "epoch": 771} {"train_loss": -20.767688751220703, "global_step": 64065, "epoch": 771} {"train_loss": -20.811817169189453, "global_step": 64066, "epoch": 771} {"train_loss": -20.69623374938965, "global_step": 64067, "epoch": 771} {"train_loss": -20.422853469848633, "global_step": 64068, "epoch": 771} {"train_loss": -20.689332962036133, "global_step": 64069, "epoch": 771} {"train_loss": -20.749221801757812, "global_step": 64070, "epoch": 771} {"train_loss": -20.506000518798828, "global_step": 64071, "epoch": 771} {"train_loss": -20.897144317626953, "global_step": 64072, "epoch": 771} {"train_loss": -20.206838607788086, "global_step": 64073, "epoch": 771} {"train_loss": -20.455421447753906, "global_step": 64074, "epoch": 771} {"train_loss": -20.568534506372657, "global_step": 64075, "epoch": 771, "val_loss": 5997424.5} {"train_loss": -19.930736541748047, "global_step": 64076, "epoch": 772} {"train_loss": -20.212366104125977, "global_step": 64077, "epoch": 772} {"train_loss": -20.365854263305664, "global_step": 64078, "epoch": 772} {"train_loss": -20.216665267944336, "global_step": 64079, "epoch": 772} {"train_loss": -20.46196937561035, "global_step": 64080, "epoch": 772} {"train_loss": -20.018056869506836, "global_step": 64081, "epoch": 772} {"train_loss": -20.559446334838867, "global_step": 64082, "epoch": 772} {"train_loss": -20.46784019470215, "global_step": 64083, "epoch": 772} {"train_loss": -20.307931900024414, "global_step": 64084, "epoch": 772} {"train_loss": -20.276403427124023, "global_step": 64085, "epoch": 772} {"train_loss": -20.078580856323242, "global_step": 64086, "epoch": 772} {"train_loss": -20.192852020263672, "global_step": 64087, "epoch": 772} {"train_loss": -20.36513328552246, "global_step": 64088, "epoch": 772} {"train_loss": -20.37366485595703, "global_step": 64089, "epoch": 772} {"train_loss": -20.398916244506836, "global_step": 64090, "epoch": 772} {"train_loss": -20.271299362182617, "global_step": 64091, "epoch": 772} {"train_loss": -20.39923667907715, "global_step": 64092, "epoch": 772} {"train_loss": -20.70838737487793, "global_step": 64093, "epoch": 772} {"train_loss": -20.660566329956055, "global_step": 64094, "epoch": 772} {"train_loss": -20.564111709594727, "global_step": 64095, "epoch": 772} {"train_loss": -20.331201553344727, "global_step": 64096, "epoch": 772} {"train_loss": -20.642166137695312, "global_step": 64097, "epoch": 772} {"train_loss": -20.513154983520508, "global_step": 64098, "epoch": 772} {"train_loss": -20.71327018737793, "global_step": 64099, "epoch": 772} {"train_loss": -20.2340145111084, "global_step": 64100, "epoch": 772} {"train_loss": -20.565216064453125, "global_step": 64101, "epoch": 772} {"train_loss": -20.446945190429688, "global_step": 64102, "epoch": 772} {"train_loss": -20.6649112701416, "global_step": 64103, "epoch": 772} {"train_loss": -20.725568771362305, "global_step": 64104, "epoch": 772} {"train_loss": -20.392305374145508, "global_step": 64105, "epoch": 772} {"train_loss": -20.620908737182617, "global_step": 64106, "epoch": 772} {"train_loss": -20.458189010620117, "global_step": 64107, "epoch": 772} {"train_loss": -20.5651798248291, "global_step": 64108, "epoch": 772} {"train_loss": -20.656911849975586, "global_step": 64109, "epoch": 772} {"train_loss": -20.45076560974121, "global_step": 64110, "epoch": 772} {"train_loss": -20.54473304748535, "global_step": 64111, "epoch": 772} {"train_loss": -20.554641723632812, "global_step": 64112, "epoch": 772} {"train_loss": -20.780630111694336, "global_step": 64113, "epoch": 772} {"train_loss": -20.75311279296875, "global_step": 64114, "epoch": 772} {"train_loss": -20.641117095947266, "global_step": 64115, "epoch": 772} {"train_loss": -20.756254196166992, "global_step": 64116, "epoch": 772} {"train_loss": -20.278432846069336, "global_step": 64117, "epoch": 772} {"train_loss": -20.641677856445312, "global_step": 64118, "epoch": 772} {"train_loss": -20.25294303894043, "global_step": 64119, "epoch": 772} {"train_loss": -20.614765167236328, "global_step": 64120, "epoch": 772} {"train_loss": -20.533727645874023, "global_step": 64121, "epoch": 772} {"train_loss": -20.921375274658203, "global_step": 64122, "epoch": 772} {"train_loss": -20.766569137573242, "global_step": 64123, "epoch": 772} {"train_loss": -20.134658813476562, "global_step": 64124, "epoch": 772} {"train_loss": -20.610332489013672, "global_step": 64125, "epoch": 772} {"train_loss": -20.671531677246094, "global_step": 64126, "epoch": 772} {"train_loss": -20.606218338012695, "global_step": 64127, "epoch": 772} {"train_loss": -20.53997230529785, "global_step": 64128, "epoch": 772} {"train_loss": -20.661779403686523, "global_step": 64129, "epoch": 772} {"train_loss": -20.39942741394043, "global_step": 64130, "epoch": 772} {"train_loss": -20.558612823486328, "global_step": 64131, "epoch": 772} {"train_loss": -20.878173828125, "global_step": 64132, "epoch": 772} {"train_loss": -20.97824478149414, "global_step": 64133, "epoch": 772} {"train_loss": -20.608469009399414, "global_step": 64134, "epoch": 772} {"train_loss": -20.625226974487305, "global_step": 64135, "epoch": 772} {"train_loss": -20.8179931640625, "global_step": 64136, "epoch": 772} {"train_loss": -20.376611709594727, "global_step": 64137, "epoch": 772} {"train_loss": -20.249502182006836, "global_step": 64138, "epoch": 772} {"train_loss": -20.63912582397461, "global_step": 64139, "epoch": 772} {"train_loss": -20.493389129638672, "global_step": 64140, "epoch": 772} {"train_loss": -20.6781063079834, "global_step": 64141, "epoch": 772} {"train_loss": -20.398639678955078, "global_step": 64142, "epoch": 772} {"train_loss": -20.625717163085938, "global_step": 64143, "epoch": 772} {"train_loss": -21.086210250854492, "global_step": 64144, "epoch": 772} {"train_loss": -20.6890926361084, "global_step": 64145, "epoch": 772} {"train_loss": -20.67852783203125, "global_step": 64146, "epoch": 772} {"train_loss": -20.610074996948242, "global_step": 64147, "epoch": 772} {"train_loss": -20.615970611572266, "global_step": 64148, "epoch": 772} {"train_loss": -20.49789810180664, "global_step": 64149, "epoch": 772} {"train_loss": -20.379732131958008, "global_step": 64150, "epoch": 772} {"train_loss": -20.401155471801758, "global_step": 64151, "epoch": 772} {"train_loss": -20.653451919555664, "global_step": 64152, "epoch": 772} {"train_loss": -20.703237533569336, "global_step": 64153, "epoch": 772} {"train_loss": -20.179153442382812, "global_step": 64154, "epoch": 772} {"train_loss": -20.30050277709961, "global_step": 64155, "epoch": 772} {"train_loss": -20.246177673339844, "global_step": 64156, "epoch": 772} {"train_loss": -20.856748580932617, "global_step": 64157, "epoch": 772} {"train_loss": -20.498025756284417, "global_step": 64158, "epoch": 772, "val_loss": 6088216.0} {"train_loss": -19.918359756469727, "global_step": 64159, "epoch": 773} {"train_loss": -20.156057357788086, "global_step": 64160, "epoch": 773} {"train_loss": -20.028430938720703, "global_step": 64161, "epoch": 773} {"train_loss": -20.282182693481445, "global_step": 64162, "epoch": 773} {"train_loss": -20.423887252807617, "global_step": 64163, "epoch": 773} {"train_loss": -20.034011840820312, "global_step": 64164, "epoch": 773} {"train_loss": -20.303373336791992, "global_step": 64165, "epoch": 773} {"train_loss": -20.602964401245117, "global_step": 64166, "epoch": 773} {"train_loss": -20.319700241088867, "global_step": 64167, "epoch": 773} {"train_loss": -20.54426383972168, "global_step": 64168, "epoch": 773} {"train_loss": -20.211196899414062, "global_step": 64169, "epoch": 773} {"train_loss": -20.591245651245117, "global_step": 64170, "epoch": 773} {"train_loss": -20.604665756225586, "global_step": 64171, "epoch": 773} {"train_loss": -20.478212356567383, "global_step": 64172, "epoch": 773} {"train_loss": -20.456077575683594, "global_step": 64173, "epoch": 773} {"train_loss": -20.63868522644043, "global_step": 64174, "epoch": 773} {"train_loss": -20.55156707763672, "global_step": 64175, "epoch": 773} {"train_loss": -20.373531341552734, "global_step": 64176, "epoch": 773} {"train_loss": -20.371057510375977, "global_step": 64177, "epoch": 773} {"train_loss": -20.525606155395508, "global_step": 64178, "epoch": 773} {"train_loss": -20.343976974487305, "global_step": 64179, "epoch": 773} {"train_loss": -20.018651962280273, "global_step": 64180, "epoch": 773} {"train_loss": -20.634017944335938, "global_step": 64181, "epoch": 773} {"train_loss": -20.389326095581055, "global_step": 64182, "epoch": 773} {"train_loss": -21.080739974975586, "global_step": 64183, "epoch": 773} {"train_loss": -20.006681442260742, "global_step": 64184, "epoch": 773} {"train_loss": -19.929155349731445, "global_step": 64185, "epoch": 773} {"train_loss": -20.257633209228516, "global_step": 64186, "epoch": 773} {"train_loss": -20.57448959350586, "global_step": 64187, "epoch": 773} {"train_loss": -20.33510398864746, "global_step": 64188, "epoch": 773} {"train_loss": -20.896629333496094, "global_step": 64189, "epoch": 773} {"train_loss": -20.67296028137207, "global_step": 64190, "epoch": 773} {"train_loss": -20.48301124572754, "global_step": 64191, "epoch": 773} {"train_loss": -20.194339752197266, "global_step": 64192, "epoch": 773} {"train_loss": -20.376007080078125, "global_step": 64193, "epoch": 773} {"train_loss": -20.72324562072754, "global_step": 64194, "epoch": 773} {"train_loss": -20.3609676361084, "global_step": 64195, "epoch": 773} {"train_loss": -20.9420223236084, "global_step": 64196, "epoch": 773} {"train_loss": -21.062021255493164, "global_step": 64197, "epoch": 773} {"train_loss": -20.5284423828125, "global_step": 64198, "epoch": 773} {"train_loss": -20.68631362915039, "global_step": 64199, "epoch": 773} {"train_loss": -20.692174911499023, "global_step": 64200, "epoch": 773} {"train_loss": -20.55925941467285, "global_step": 64201, "epoch": 773} {"train_loss": -20.554439544677734, "global_step": 64202, "epoch": 773} {"train_loss": -20.454591751098633, "global_step": 64203, "epoch": 773} {"train_loss": -20.624011993408203, "global_step": 64204, "epoch": 773} {"train_loss": -20.47022247314453, "global_step": 64205, "epoch": 773} {"train_loss": -20.70154571533203, "global_step": 64206, "epoch": 773} {"train_loss": -20.49736785888672, "global_step": 64207, "epoch": 773} {"train_loss": -20.52000617980957, "global_step": 64208, "epoch": 773} {"train_loss": -20.754486083984375, "global_step": 64209, "epoch": 773} {"train_loss": -20.128889083862305, "global_step": 64210, "epoch": 773} {"train_loss": -20.9140682220459, "global_step": 64211, "epoch": 773} {"train_loss": -20.5854549407959, "global_step": 64212, "epoch": 773} {"train_loss": -20.715085983276367, "global_step": 64213, "epoch": 773} {"train_loss": -20.82135772705078, "global_step": 64214, "epoch": 773} {"train_loss": -20.990793228149414, "global_step": 64215, "epoch": 773} {"train_loss": -20.351713180541992, "global_step": 64216, "epoch": 773} {"train_loss": -20.451684951782227, "global_step": 64217, "epoch": 773} {"train_loss": -20.324350357055664, "global_step": 64218, "epoch": 773} {"train_loss": -20.871837615966797, "global_step": 64219, "epoch": 773} {"train_loss": -20.58595085144043, "global_step": 64220, "epoch": 773} {"train_loss": -20.743410110473633, "global_step": 64221, "epoch": 773} {"train_loss": -20.738977432250977, "global_step": 64222, "epoch": 773} {"train_loss": -20.682706832885742, "global_step": 64223, "epoch": 773} {"train_loss": -20.470617294311523, "global_step": 64224, "epoch": 773} {"train_loss": -20.79348373413086, "global_step": 64225, "epoch": 773} {"train_loss": -20.579740524291992, "global_step": 64226, "epoch": 773} {"train_loss": -20.648691177368164, "global_step": 64227, "epoch": 773} {"train_loss": -20.46856117248535, "global_step": 64228, "epoch": 773} {"train_loss": -21.005455017089844, "global_step": 64229, "epoch": 773} {"train_loss": -20.44950294494629, "global_step": 64230, "epoch": 773} {"train_loss": -20.7650146484375, "global_step": 64231, "epoch": 773} {"train_loss": -20.811410903930664, "global_step": 64232, "epoch": 773} {"train_loss": -20.478511810302734, "global_step": 64233, "epoch": 773} {"train_loss": -20.501300811767578, "global_step": 64234, "epoch": 773} {"train_loss": -20.533634185791016, "global_step": 64235, "epoch": 773} {"train_loss": -20.344892501831055, "global_step": 64236, "epoch": 773} {"train_loss": -20.618223190307617, "global_step": 64237, "epoch": 773} {"train_loss": -20.861238479614258, "global_step": 64238, "epoch": 773} {"train_loss": -20.844205856323242, "global_step": 64239, "epoch": 773} {"train_loss": -20.671064376831055, "global_step": 64240, "epoch": 773} {"train_loss": -20.51671887593097, "global_step": 64241, "epoch": 773, "val_loss": 6112123.5} {"train_loss": -20.385929107666016, "global_step": 64242, "epoch": 774} {"train_loss": -20.39383888244629, "global_step": 64243, "epoch": 774} {"train_loss": -20.091337203979492, "global_step": 64244, "epoch": 774} {"train_loss": -20.124547958374023, "global_step": 64245, "epoch": 774} {"train_loss": -20.4625244140625, "global_step": 64246, "epoch": 774} {"train_loss": -20.311594009399414, "global_step": 64247, "epoch": 774} {"train_loss": -20.238622665405273, "global_step": 64248, "epoch": 774} {"train_loss": -20.369455337524414, "global_step": 64249, "epoch": 774} {"train_loss": -20.57185935974121, "global_step": 64250, "epoch": 774} {"train_loss": -20.140493392944336, "global_step": 64251, "epoch": 774} {"train_loss": -20.833799362182617, "global_step": 64252, "epoch": 774} {"train_loss": -20.398765563964844, "global_step": 64253, "epoch": 774} {"train_loss": -20.196796417236328, "global_step": 64254, "epoch": 774} {"train_loss": -20.6844539642334, "global_step": 64255, "epoch": 774} {"train_loss": -20.308242797851562, "global_step": 64256, "epoch": 774} {"train_loss": -20.65004539489746, "global_step": 64257, "epoch": 774} {"train_loss": -20.42460060119629, "global_step": 64258, "epoch": 774} {"train_loss": -20.503843307495117, "global_step": 64259, "epoch": 774} {"train_loss": -20.63532066345215, "global_step": 64260, "epoch": 774} {"train_loss": -20.858783721923828, "global_step": 64261, "epoch": 774} {"train_loss": -20.49248504638672, "global_step": 64262, "epoch": 774} {"train_loss": -20.687332153320312, "global_step": 64263, "epoch": 774} {"train_loss": -19.894208908081055, "global_step": 64264, "epoch": 774} {"train_loss": -20.577085494995117, "global_step": 64265, "epoch": 774} {"train_loss": -20.887840270996094, "global_step": 64266, "epoch": 774} {"train_loss": -20.433719635009766, "global_step": 64267, "epoch": 774} {"train_loss": -20.770694732666016, "global_step": 64268, "epoch": 774} {"train_loss": -20.380786895751953, "global_step": 64269, "epoch": 774} {"train_loss": -20.68391990661621, "global_step": 64270, "epoch": 774} {"train_loss": -20.049222946166992, "global_step": 64271, "epoch": 774} {"train_loss": -20.637964248657227, "global_step": 64272, "epoch": 774} {"train_loss": -20.498035430908203, "global_step": 64273, "epoch": 774} {"train_loss": -20.518753051757812, "global_step": 64274, "epoch": 774} {"train_loss": -20.759777069091797, "global_step": 64275, "epoch": 774} {"train_loss": -20.340620040893555, "global_step": 64276, "epoch": 774} {"train_loss": -20.6253662109375, "global_step": 64277, "epoch": 774} {"train_loss": -20.572097778320312, "global_step": 64278, "epoch": 774} {"train_loss": -20.837827682495117, "global_step": 64279, "epoch": 774} {"train_loss": -20.401575088500977, "global_step": 64280, "epoch": 774} {"train_loss": -20.639646530151367, "global_step": 64281, "epoch": 774} {"train_loss": -20.43265724182129, "global_step": 64282, "epoch": 774} {"train_loss": -20.870664596557617, "global_step": 64283, "epoch": 774} {"train_loss": -20.440683364868164, "global_step": 64284, "epoch": 774} {"train_loss": -20.828577041625977, "global_step": 64285, "epoch": 774} {"train_loss": -20.756866455078125, "global_step": 64286, "epoch": 774} {"train_loss": -20.528390884399414, "global_step": 64287, "epoch": 774} {"train_loss": -20.68392562866211, "global_step": 64288, "epoch": 774} {"train_loss": -20.255569458007812, "global_step": 64289, "epoch": 774} {"train_loss": -21.00726318359375, "global_step": 64290, "epoch": 774} {"train_loss": -20.372526168823242, "global_step": 64291, "epoch": 774} {"train_loss": -20.514022827148438, "global_step": 64292, "epoch": 774} {"train_loss": -21.063140869140625, "global_step": 64293, "epoch": 774} {"train_loss": -20.64995574951172, "global_step": 64294, "epoch": 774} {"train_loss": -20.702695846557617, "global_step": 64295, "epoch": 774} {"train_loss": -20.686922073364258, "global_step": 64296, "epoch": 774} {"train_loss": -20.566917419433594, "global_step": 64297, "epoch": 774} {"train_loss": -20.50056266784668, "global_step": 64298, "epoch": 774} {"train_loss": -20.684961318969727, "global_step": 64299, "epoch": 774} {"train_loss": -20.756200790405273, "global_step": 64300, "epoch": 774} {"train_loss": -20.681964874267578, "global_step": 64301, "epoch": 774} {"train_loss": -20.43855094909668, "global_step": 64302, "epoch": 774} {"train_loss": -20.484378814697266, "global_step": 64303, "epoch": 774} {"train_loss": -20.308088302612305, "global_step": 64304, "epoch": 774} {"train_loss": -20.640045166015625, "global_step": 64305, "epoch": 774} {"train_loss": -20.46900749206543, "global_step": 64306, "epoch": 774} {"train_loss": -20.549440383911133, "global_step": 64307, "epoch": 774} {"train_loss": -20.5136775970459, "global_step": 64308, "epoch": 774} {"train_loss": -20.5318603515625, "global_step": 64309, "epoch": 774} {"train_loss": -20.5677433013916, "global_step": 64310, "epoch": 774} {"train_loss": -20.330581665039062, "global_step": 64311, "epoch": 774} {"train_loss": -20.452068328857422, "global_step": 64312, "epoch": 774} {"train_loss": -20.494291305541992, "global_step": 64313, "epoch": 774} {"train_loss": -20.594114303588867, "global_step": 64314, "epoch": 774} {"train_loss": -20.767444610595703, "global_step": 64315, "epoch": 774} {"train_loss": -20.600975036621094, "global_step": 64316, "epoch": 774} {"train_loss": -20.630964279174805, "global_step": 64317, "epoch": 774} {"train_loss": -20.44830322265625, "global_step": 64318, "epoch": 774} {"train_loss": -20.718982696533203, "global_step": 64319, "epoch": 774} {"train_loss": -20.29451560974121, "global_step": 64320, "epoch": 774} {"train_loss": -20.671422958374023, "global_step": 64321, "epoch": 774} {"train_loss": -20.765165328979492, "global_step": 64322, "epoch": 774} {"train_loss": -20.49617576599121, "global_step": 64323, "epoch": 774} {"train_loss": -20.551734120012767, "global_step": 64324, "epoch": 774, "val_loss": 5948863.0} {"train_loss": -19.925397872924805, "global_step": 64325, "epoch": 775} {"train_loss": -20.065673828125, "global_step": 64326, "epoch": 775} {"train_loss": -20.320215225219727, "global_step": 64327, "epoch": 775} {"train_loss": -20.4022159576416, "global_step": 64328, "epoch": 775} {"train_loss": -20.66587257385254, "global_step": 64329, "epoch": 775} {"train_loss": -20.356521606445312, "global_step": 64330, "epoch": 775} {"train_loss": -20.208097457885742, "global_step": 64331, "epoch": 775} {"train_loss": -20.480525970458984, "global_step": 64332, "epoch": 775} {"train_loss": -20.298919677734375, "global_step": 64333, "epoch": 775} {"train_loss": -20.727956771850586, "global_step": 64334, "epoch": 775} {"train_loss": -20.296253204345703, "global_step": 64335, "epoch": 775} {"train_loss": -20.555225372314453, "global_step": 64336, "epoch": 775} {"train_loss": -20.54231071472168, "global_step": 64337, "epoch": 775} {"train_loss": -20.600812911987305, "global_step": 64338, "epoch": 775} {"train_loss": -20.347665786743164, "global_step": 64339, "epoch": 775} {"train_loss": -20.421600341796875, "global_step": 64340, "epoch": 775} {"train_loss": -20.523305892944336, "global_step": 64341, "epoch": 775} {"train_loss": -20.51272964477539, "global_step": 64342, "epoch": 775} {"train_loss": -20.8439998626709, "global_step": 64343, "epoch": 775} {"train_loss": -20.159032821655273, "global_step": 64344, "epoch": 775} {"train_loss": -20.37445640563965, "global_step": 64345, "epoch": 775} {"train_loss": -20.37348747253418, "global_step": 64346, "epoch": 775} {"train_loss": -20.347681045532227, "global_step": 64347, "epoch": 775} {"train_loss": -20.150983810424805, "global_step": 64348, "epoch": 775} {"train_loss": -20.508955001831055, "global_step": 64349, "epoch": 775} {"train_loss": -20.643850326538086, "global_step": 64350, "epoch": 775} {"train_loss": -20.686195373535156, "global_step": 64351, "epoch": 775} {"train_loss": -20.90325927734375, "global_step": 64352, "epoch": 775} {"train_loss": -20.716867446899414, "global_step": 64353, "epoch": 775} {"train_loss": -20.097166061401367, "global_step": 64354, "epoch": 775} {"train_loss": -20.447134017944336, "global_step": 64355, "epoch": 775} {"train_loss": -20.6640567779541, "global_step": 64356, "epoch": 775} {"train_loss": -20.371646881103516, "global_step": 64357, "epoch": 775} {"train_loss": -20.5961971282959, "global_step": 64358, "epoch": 775} {"train_loss": -20.6915340423584, "global_step": 64359, "epoch": 775} {"train_loss": -21.097318649291992, "global_step": 64360, "epoch": 775} {"train_loss": -20.335376739501953, "global_step": 64361, "epoch": 775} {"train_loss": -20.68233299255371, "global_step": 64362, "epoch": 775} {"train_loss": -20.653348922729492, "global_step": 64363, "epoch": 775} {"train_loss": -20.80866050720215, "global_step": 64364, "epoch": 775} {"train_loss": -20.61421775817871, "global_step": 64365, "epoch": 775} {"train_loss": -20.551095962524414, "global_step": 64366, "epoch": 775} {"train_loss": -20.528921127319336, "global_step": 64367, "epoch": 775} {"train_loss": -20.581933975219727, "global_step": 64368, "epoch": 775} {"train_loss": -20.967681884765625, "global_step": 64369, "epoch": 775} {"train_loss": -20.86684226989746, "global_step": 64370, "epoch": 775} {"train_loss": -20.61130714416504, "global_step": 64371, "epoch": 775} {"train_loss": -20.85056495666504, "global_step": 64372, "epoch": 775} {"train_loss": -20.48120880126953, "global_step": 64373, "epoch": 775} {"train_loss": -20.683359146118164, "global_step": 64374, "epoch": 775} {"train_loss": -20.6662654876709, "global_step": 64375, "epoch": 775} {"train_loss": -20.60133934020996, "global_step": 64376, "epoch": 775} {"train_loss": -20.702655792236328, "global_step": 64377, "epoch": 775} {"train_loss": -20.241605758666992, "global_step": 64378, "epoch": 775} {"train_loss": -20.577884674072266, "global_step": 64379, "epoch": 775} {"train_loss": -20.483461380004883, "global_step": 64380, "epoch": 775} {"train_loss": -20.260326385498047, "global_step": 64381, "epoch": 775} {"train_loss": -20.523374557495117, "global_step": 64382, "epoch": 775} {"train_loss": -20.646493911743164, "global_step": 64383, "epoch": 775} {"train_loss": -20.44166374206543, "global_step": 64384, "epoch": 775} {"train_loss": -20.71462059020996, "global_step": 64385, "epoch": 775} {"train_loss": -20.49410057067871, "global_step": 64386, "epoch": 775} {"train_loss": -20.62221336364746, "global_step": 64387, "epoch": 775} {"train_loss": -20.414648056030273, "global_step": 64388, "epoch": 775} {"train_loss": -20.470054626464844, "global_step": 64389, "epoch": 775} {"train_loss": -20.792694091796875, "global_step": 64390, "epoch": 775} {"train_loss": -20.22046661376953, "global_step": 64391, "epoch": 775} {"train_loss": -20.418216705322266, "global_step": 64392, "epoch": 775} {"train_loss": -20.975391387939453, "global_step": 64393, "epoch": 775} {"train_loss": -20.915250778198242, "global_step": 64394, "epoch": 775} {"train_loss": -20.49986457824707, "global_step": 64395, "epoch": 775} {"train_loss": -20.467313766479492, "global_step": 64396, "epoch": 775} {"train_loss": -20.78013038635254, "global_step": 64397, "epoch": 775} {"train_loss": -20.920734405517578, "global_step": 64398, "epoch": 775} {"train_loss": -20.692325592041016, "global_step": 64399, "epoch": 775} {"train_loss": -20.67228889465332, "global_step": 64400, "epoch": 775} {"train_loss": -20.545753479003906, "global_step": 64401, "epoch": 775} {"train_loss": -20.70175552368164, "global_step": 64402, "epoch": 775} {"train_loss": -20.482465744018555, "global_step": 64403, "epoch": 775} {"train_loss": -20.47586441040039, "global_step": 64404, "epoch": 775} {"train_loss": -20.644777297973633, "global_step": 64405, "epoch": 775} {"train_loss": -20.5109806060791, "global_step": 64406, "epoch": 775} {"train_loss": -20.540903160370977, "global_step": 64407, "epoch": 775, "val_loss": 6045450.0} {"train_loss": -20.20826530456543, "global_step": 64408, "epoch": 776} {"train_loss": -19.91016960144043, "global_step": 64409, "epoch": 776} {"train_loss": -20.035018920898438, "global_step": 64410, "epoch": 776} {"train_loss": -20.170812606811523, "global_step": 64411, "epoch": 776} {"train_loss": -20.428159713745117, "global_step": 64412, "epoch": 776} {"train_loss": -20.418081283569336, "global_step": 64413, "epoch": 776} {"train_loss": -20.388660430908203, "global_step": 64414, "epoch": 776} {"train_loss": -20.475305557250977, "global_step": 64415, "epoch": 776} {"train_loss": -20.590177536010742, "global_step": 64416, "epoch": 776} {"train_loss": -20.19936752319336, "global_step": 64417, "epoch": 776} {"train_loss": -20.29435920715332, "global_step": 64418, "epoch": 776} {"train_loss": -19.909086227416992, "global_step": 64419, "epoch": 776} {"train_loss": -20.3707332611084, "global_step": 64420, "epoch": 776} {"train_loss": -20.06158447265625, "global_step": 64421, "epoch": 776} {"train_loss": -20.499717712402344, "global_step": 64422, "epoch": 776} {"train_loss": -20.35434913635254, "global_step": 64423, "epoch": 776} {"train_loss": -20.654481887817383, "global_step": 64424, "epoch": 776} {"train_loss": -20.403812408447266, "global_step": 64425, "epoch": 776} {"train_loss": -20.487043380737305, "global_step": 64426, "epoch": 776} {"train_loss": -20.36583137512207, "global_step": 64427, "epoch": 776} {"train_loss": -20.64376449584961, "global_step": 64428, "epoch": 776} {"train_loss": -20.425352096557617, "global_step": 64429, "epoch": 776} {"train_loss": -20.664634704589844, "global_step": 64430, "epoch": 776} {"train_loss": -20.732053756713867, "global_step": 64431, "epoch": 776} {"train_loss": -20.843358993530273, "global_step": 64432, "epoch": 776} {"train_loss": -20.5861759185791, "global_step": 64433, "epoch": 776} {"train_loss": -20.89260482788086, "global_step": 64434, "epoch": 776} {"train_loss": -20.594736099243164, "global_step": 64435, "epoch": 776} {"train_loss": -20.4104061126709, "global_step": 64436, "epoch": 776} {"train_loss": -20.72942543029785, "global_step": 64437, "epoch": 776} {"train_loss": -20.604066848754883, "global_step": 64438, "epoch": 776} {"train_loss": -20.416196823120117, "global_step": 64439, "epoch": 776} {"train_loss": -20.708799362182617, "global_step": 64440, "epoch": 776} {"train_loss": -20.750288009643555, "global_step": 64441, "epoch": 776} {"train_loss": -20.749340057373047, "global_step": 64442, "epoch": 776} {"train_loss": -20.56947898864746, "global_step": 64443, "epoch": 776} {"train_loss": -20.791091918945312, "global_step": 64444, "epoch": 776} {"train_loss": -20.36104393005371, "global_step": 64445, "epoch": 776} {"train_loss": -20.884790420532227, "global_step": 64446, "epoch": 776} {"train_loss": -20.713396072387695, "global_step": 64447, "epoch": 776} {"train_loss": -20.371522903442383, "global_step": 64448, "epoch": 776} {"train_loss": -20.5284366607666, "global_step": 64449, "epoch": 776} {"train_loss": -20.40858268737793, "global_step": 64450, "epoch": 776} {"train_loss": -20.75534439086914, "global_step": 64451, "epoch": 776} {"train_loss": -20.303220748901367, "global_step": 64452, "epoch": 776} {"train_loss": -20.526071548461914, "global_step": 64453, "epoch": 776} {"train_loss": -20.609285354614258, "global_step": 64454, "epoch": 776} {"train_loss": -20.523597717285156, "global_step": 64455, "epoch": 776} {"train_loss": -20.5322265625, "global_step": 64456, "epoch": 776} {"train_loss": -20.40504264831543, "global_step": 64457, "epoch": 776} {"train_loss": -20.295618057250977, "global_step": 64458, "epoch": 776} {"train_loss": -20.345916748046875, "global_step": 64459, "epoch": 776} {"train_loss": -20.44811248779297, "global_step": 64460, "epoch": 776} {"train_loss": -20.299976348876953, "global_step": 64461, "epoch": 776} {"train_loss": -20.620351791381836, "global_step": 64462, "epoch": 776} {"train_loss": -20.499563217163086, "global_step": 64463, "epoch": 776} {"train_loss": -20.410776138305664, "global_step": 64464, "epoch": 776} {"train_loss": -20.284976959228516, "global_step": 64465, "epoch": 776} {"train_loss": -20.564451217651367, "global_step": 64466, "epoch": 776} {"train_loss": -20.571874618530273, "global_step": 64467, "epoch": 776} {"train_loss": -20.533384323120117, "global_step": 64468, "epoch": 776} {"train_loss": -20.194995880126953, "global_step": 64469, "epoch": 776} {"train_loss": -20.563159942626953, "global_step": 64470, "epoch": 776} {"train_loss": -20.8021240234375, "global_step": 64471, "epoch": 776} {"train_loss": -20.755353927612305, "global_step": 64472, "epoch": 776} {"train_loss": -20.905475616455078, "global_step": 64473, "epoch": 776} {"train_loss": -20.4657039642334, "global_step": 64474, "epoch": 776} {"train_loss": -20.509531021118164, "global_step": 64475, "epoch": 776} {"train_loss": -20.642990112304688, "global_step": 64476, "epoch": 776} {"train_loss": -20.59036636352539, "global_step": 64477, "epoch": 776} {"train_loss": -21.044771194458008, "global_step": 64478, "epoch": 776} {"train_loss": -20.67974281311035, "global_step": 64479, "epoch": 776} {"train_loss": -21.065479278564453, "global_step": 64480, "epoch": 776} {"train_loss": -20.682321548461914, "global_step": 64481, "epoch": 776} {"train_loss": -20.6431941986084, "global_step": 64482, "epoch": 776} {"train_loss": -20.73956871032715, "global_step": 64483, "epoch": 776} {"train_loss": -20.60455322265625, "global_step": 64484, "epoch": 776} {"train_loss": -20.537349700927734, "global_step": 64485, "epoch": 776} {"train_loss": -20.623645782470703, "global_step": 64486, "epoch": 776} {"train_loss": -20.743650436401367, "global_step": 64487, "epoch": 776} {"train_loss": -20.371660232543945, "global_step": 64488, "epoch": 776} {"train_loss": -20.878952026367188, "global_step": 64489, "epoch": 776} {"train_loss": -20.551069765205842, "global_step": 64490, "epoch": 776, "val_loss": 5921336.5} {"train_loss": -19.974241256713867, "global_step": 64491, "epoch": 777} {"train_loss": -20.592546463012695, "global_step": 64492, "epoch": 777} {"train_loss": -19.92347526550293, "global_step": 64493, "epoch": 777} {"train_loss": -20.09950828552246, "global_step": 64494, "epoch": 777} {"train_loss": -20.495132446289062, "global_step": 64495, "epoch": 777} {"train_loss": -20.29225730895996, "global_step": 64496, "epoch": 777} {"train_loss": -19.940610885620117, "global_step": 64497, "epoch": 777} {"train_loss": -20.686994552612305, "global_step": 64498, "epoch": 777} {"train_loss": -20.422142028808594, "global_step": 64499, "epoch": 777} {"train_loss": -20.6582088470459, "global_step": 64500, "epoch": 777} {"train_loss": -20.4011173248291, "global_step": 64501, "epoch": 777} {"train_loss": -20.604873657226562, "global_step": 64502, "epoch": 777} {"train_loss": -20.501474380493164, "global_step": 64503, "epoch": 777} {"train_loss": -20.28888511657715, "global_step": 64504, "epoch": 777} {"train_loss": -20.671287536621094, "global_step": 64505, "epoch": 777} {"train_loss": -20.477048873901367, "global_step": 64506, "epoch": 777} {"train_loss": -20.313352584838867, "global_step": 64507, "epoch": 777} {"train_loss": -20.572168350219727, "global_step": 64508, "epoch": 777} {"train_loss": -20.45501708984375, "global_step": 64509, "epoch": 777} {"train_loss": -20.6715145111084, "global_step": 64510, "epoch": 777} {"train_loss": -20.084623336791992, "global_step": 64511, "epoch": 777} {"train_loss": -20.599071502685547, "global_step": 64512, "epoch": 777} {"train_loss": -20.380979537963867, "global_step": 64513, "epoch": 777} {"train_loss": -20.858810424804688, "global_step": 64514, "epoch": 777} {"train_loss": -20.4901123046875, "global_step": 64515, "epoch": 777} {"train_loss": -20.502187728881836, "global_step": 64516, "epoch": 777} {"train_loss": -20.473073959350586, "global_step": 64517, "epoch": 777} {"train_loss": -20.264453887939453, "global_step": 64518, "epoch": 777} {"train_loss": -20.729480743408203, "global_step": 64519, "epoch": 777} {"train_loss": -20.20728302001953, "global_step": 64520, "epoch": 777} {"train_loss": -20.48908042907715, "global_step": 64521, "epoch": 777} {"train_loss": -20.660551071166992, "global_step": 64522, "epoch": 777} {"train_loss": -20.499784469604492, "global_step": 64523, "epoch": 777} {"train_loss": -20.4674129486084, "global_step": 64524, "epoch": 777} {"train_loss": -20.53900909423828, "global_step": 64525, "epoch": 777} {"train_loss": -20.63916015625, "global_step": 64526, "epoch": 777} {"train_loss": -20.464570999145508, "global_step": 64527, "epoch": 777} {"train_loss": -20.616918563842773, "global_step": 64528, "epoch": 777} {"train_loss": -20.561656951904297, "global_step": 64529, "epoch": 777} {"train_loss": -20.64961814880371, "global_step": 64530, "epoch": 777} {"train_loss": -20.98981285095215, "global_step": 64531, "epoch": 777} {"train_loss": -20.446298599243164, "global_step": 64532, "epoch": 777} {"train_loss": -20.741186141967773, "global_step": 64533, "epoch": 777} {"train_loss": -20.62655258178711, "global_step": 64534, "epoch": 777} {"train_loss": -20.8741512298584, "global_step": 64535, "epoch": 777} {"train_loss": -20.824987411499023, "global_step": 64536, "epoch": 777} {"train_loss": -20.737770080566406, "global_step": 64537, "epoch": 777} {"train_loss": -21.051626205444336, "global_step": 64538, "epoch": 777} {"train_loss": -20.52803611755371, "global_step": 64539, "epoch": 777} {"train_loss": -20.40669059753418, "global_step": 64540, "epoch": 777} {"train_loss": -20.60540771484375, "global_step": 64541, "epoch": 777} {"train_loss": -20.626060485839844, "global_step": 64542, "epoch": 777} {"train_loss": -20.608800888061523, "global_step": 64543, "epoch": 777} {"train_loss": -20.713544845581055, "global_step": 64544, "epoch": 777} {"train_loss": -20.740713119506836, "global_step": 64545, "epoch": 777} {"train_loss": -20.665861129760742, "global_step": 64546, "epoch": 777} {"train_loss": -20.61384391784668, "global_step": 64547, "epoch": 777} {"train_loss": -20.380836486816406, "global_step": 64548, "epoch": 777} {"train_loss": -21.10710906982422, "global_step": 64549, "epoch": 777} {"train_loss": -20.676315307617188, "global_step": 64550, "epoch": 777} {"train_loss": -21.054813385009766, "global_step": 64551, "epoch": 777} {"train_loss": -20.294281005859375, "global_step": 64552, "epoch": 777} {"train_loss": -20.56878662109375, "global_step": 64553, "epoch": 777} {"train_loss": -20.356000900268555, "global_step": 64554, "epoch": 777} {"train_loss": -20.63120460510254, "global_step": 64555, "epoch": 777} {"train_loss": -20.513315200805664, "global_step": 64556, "epoch": 777} {"train_loss": -20.941640853881836, "global_step": 64557, "epoch": 777} {"train_loss": -20.759540557861328, "global_step": 64558, "epoch": 777} {"train_loss": -20.668827056884766, "global_step": 64559, "epoch": 777} {"train_loss": -20.620512008666992, "global_step": 64560, "epoch": 777} {"train_loss": -20.38435935974121, "global_step": 64561, "epoch": 777} {"train_loss": -20.60169219970703, "global_step": 64562, "epoch": 777} {"train_loss": -20.516820907592773, "global_step": 64563, "epoch": 777} {"train_loss": -20.50381088256836, "global_step": 64564, "epoch": 777} {"train_loss": -20.629322052001953, "global_step": 64565, "epoch": 777} {"train_loss": -20.984140396118164, "global_step": 64566, "epoch": 777} {"train_loss": -20.368947982788086, "global_step": 64567, "epoch": 777} {"train_loss": -20.70680809020996, "global_step": 64568, "epoch": 777} {"train_loss": -20.304723739624023, "global_step": 64569, "epoch": 777} {"train_loss": -20.692617416381836, "global_step": 64570, "epoch": 777} {"train_loss": -20.0692081451416, "global_step": 64571, "epoch": 777} {"train_loss": -20.50739097595215, "global_step": 64572, "epoch": 777} {"train_loss": -20.543085282107434, "global_step": 64573, "epoch": 777, "val_loss": 6170349.5} {"train_loss": -20.443159103393555, "global_step": 64574, "epoch": 778} {"train_loss": -20.52732276916504, "global_step": 64575, "epoch": 778} {"train_loss": -20.402437210083008, "global_step": 64576, "epoch": 778} {"train_loss": -20.49240493774414, "global_step": 64577, "epoch": 778} {"train_loss": -20.40753746032715, "global_step": 64578, "epoch": 778} {"train_loss": -20.705217361450195, "global_step": 64579, "epoch": 778} {"train_loss": -20.067813873291016, "global_step": 64580, "epoch": 778} {"train_loss": -20.52632713317871, "global_step": 64581, "epoch": 778} {"train_loss": -20.770679473876953, "global_step": 64582, "epoch": 778} {"train_loss": -20.37898826599121, "global_step": 64583, "epoch": 778} {"train_loss": -21.021686553955078, "global_step": 64584, "epoch": 778} {"train_loss": -20.735675811767578, "global_step": 64585, "epoch": 778} {"train_loss": -20.74349021911621, "global_step": 64586, "epoch": 778} {"train_loss": -20.45477294921875, "global_step": 64587, "epoch": 778} {"train_loss": -20.110654830932617, "global_step": 64588, "epoch": 778} {"train_loss": -20.433759689331055, "global_step": 64589, "epoch": 778} {"train_loss": -20.143970489501953, "global_step": 64590, "epoch": 778} {"train_loss": -20.561792373657227, "global_step": 64591, "epoch": 778} {"train_loss": -20.46180534362793, "global_step": 64592, "epoch": 778} {"train_loss": -20.77118492126465, "global_step": 64593, "epoch": 778} {"train_loss": -20.733739852905273, "global_step": 64594, "epoch": 778} {"train_loss": -20.69633674621582, "global_step": 64595, "epoch": 778} {"train_loss": -20.60910987854004, "global_step": 64596, "epoch": 778} {"train_loss": -20.711170196533203, "global_step": 64597, "epoch": 778} {"train_loss": -20.653757095336914, "global_step": 64598, "epoch": 778} {"train_loss": -20.72006607055664, "global_step": 64599, "epoch": 778} {"train_loss": -20.770936965942383, "global_step": 64600, "epoch": 778} {"train_loss": -20.81191635131836, "global_step": 64601, "epoch": 778} {"train_loss": -21.0894775390625, "global_step": 64602, "epoch": 778} {"train_loss": -20.743268966674805, "global_step": 64603, "epoch": 778} {"train_loss": -20.650449752807617, "global_step": 64604, "epoch": 778} {"train_loss": -20.739486694335938, "global_step": 64605, "epoch": 778} {"train_loss": -20.316909790039062, "global_step": 64606, "epoch": 778} {"train_loss": -20.85470962524414, "global_step": 64607, "epoch": 778} {"train_loss": -20.885921478271484, "global_step": 64608, "epoch": 778} {"train_loss": -20.94110107421875, "global_step": 64609, "epoch": 778} {"train_loss": -20.42898941040039, "global_step": 64610, "epoch": 778} {"train_loss": -20.525585174560547, "global_step": 64611, "epoch": 778} {"train_loss": -20.638242721557617, "global_step": 64612, "epoch": 778} {"train_loss": -20.833650588989258, "global_step": 64613, "epoch": 778} {"train_loss": -20.581220626831055, "global_step": 64614, "epoch": 778} {"train_loss": -20.654691696166992, "global_step": 64615, "epoch": 778} {"train_loss": -20.618715286254883, "global_step": 64616, "epoch": 778} {"train_loss": -20.650938034057617, "global_step": 64617, "epoch": 778} {"train_loss": -20.539993286132812, "global_step": 64618, "epoch": 778} {"train_loss": -20.53253173828125, "global_step": 64619, "epoch": 778} {"train_loss": -20.386402130126953, "global_step": 64620, "epoch": 778} {"train_loss": -20.65584373474121, "global_step": 64621, "epoch": 778} {"train_loss": -20.877161026000977, "global_step": 64622, "epoch": 778} {"train_loss": -20.842451095581055, "global_step": 64623, "epoch": 778} {"train_loss": -20.868894577026367, "global_step": 64624, "epoch": 778} {"train_loss": -20.469602584838867, "global_step": 64625, "epoch": 778} {"train_loss": -20.74457359313965, "global_step": 64626, "epoch": 778} {"train_loss": -20.480697631835938, "global_step": 64627, "epoch": 778} {"train_loss": -20.286685943603516, "global_step": 64628, "epoch": 778} {"train_loss": -20.987659454345703, "global_step": 64629, "epoch": 778} {"train_loss": -20.641401290893555, "global_step": 64630, "epoch": 778} {"train_loss": -20.40048599243164, "global_step": 64631, "epoch": 778} {"train_loss": -20.636844635009766, "global_step": 64632, "epoch": 778} {"train_loss": -20.64520835876465, "global_step": 64633, "epoch": 778} {"train_loss": -20.295297622680664, "global_step": 64634, "epoch": 778} {"train_loss": -20.641359329223633, "global_step": 64635, "epoch": 778} {"train_loss": -20.686893463134766, "global_step": 64636, "epoch": 778} {"train_loss": -20.30611228942871, "global_step": 64637, "epoch": 778} {"train_loss": -20.78665542602539, "global_step": 64638, "epoch": 778} {"train_loss": -20.4372615814209, "global_step": 64639, "epoch": 778} {"train_loss": -20.287845611572266, "global_step": 64640, "epoch": 778} {"train_loss": -20.604772567749023, "global_step": 64641, "epoch": 778} {"train_loss": -20.473657608032227, "global_step": 64642, "epoch": 778} {"train_loss": -20.801603317260742, "global_step": 64643, "epoch": 778} {"train_loss": -20.693235397338867, "global_step": 64644, "epoch": 778} {"train_loss": -20.277311325073242, "global_step": 64645, "epoch": 778} {"train_loss": -20.694686889648438, "global_step": 64646, "epoch": 778} {"train_loss": -20.291908264160156, "global_step": 64647, "epoch": 778} {"train_loss": -20.713825225830078, "global_step": 64648, "epoch": 778} {"train_loss": -20.618432998657227, "global_step": 64649, "epoch": 778} {"train_loss": -20.633838653564453, "global_step": 64650, "epoch": 778} {"train_loss": -20.51737403869629, "global_step": 64651, "epoch": 778} {"train_loss": -20.77155876159668, "global_step": 64652, "epoch": 778} {"train_loss": -21.020339965820312, "global_step": 64653, "epoch": 778} {"train_loss": -20.446182250976562, "global_step": 64654, "epoch": 778} {"train_loss": -20.245145797729492, "global_step": 64655, "epoch": 778} {"train_loss": -20.616697702063135, "global_step": 64656, "epoch": 778, "val_loss": 5950059.5} {"train_loss": -20.24067497253418, "global_step": 64657, "epoch": 779} {"train_loss": -20.13204002380371, "global_step": 64658, "epoch": 779} {"train_loss": -20.412626266479492, "global_step": 64659, "epoch": 779} {"train_loss": -20.479524612426758, "global_step": 64660, "epoch": 779} {"train_loss": -20.352725982666016, "global_step": 64661, "epoch": 779} {"train_loss": -20.504079818725586, "global_step": 64662, "epoch": 779} {"train_loss": -20.067319869995117, "global_step": 64663, "epoch": 779} {"train_loss": -19.998388290405273, "global_step": 64664, "epoch": 779} {"train_loss": -20.28328514099121, "global_step": 64665, "epoch": 779} {"train_loss": -20.181846618652344, "global_step": 64666, "epoch": 779} {"train_loss": -20.517398834228516, "global_step": 64667, "epoch": 779} {"train_loss": -20.679187774658203, "global_step": 64668, "epoch": 779} {"train_loss": -20.662057876586914, "global_step": 64669, "epoch": 779} {"train_loss": -20.14229393005371, "global_step": 64670, "epoch": 779} {"train_loss": -20.514022827148438, "global_step": 64671, "epoch": 779} {"train_loss": -20.549453735351562, "global_step": 64672, "epoch": 779} {"train_loss": -20.245603561401367, "global_step": 64673, "epoch": 779} {"train_loss": -20.810789108276367, "global_step": 64674, "epoch": 779} {"train_loss": -20.331628799438477, "global_step": 64675, "epoch": 779} {"train_loss": -20.499860763549805, "global_step": 64676, "epoch": 779} {"train_loss": -20.63483238220215, "global_step": 64677, "epoch": 779} {"train_loss": -20.24614906311035, "global_step": 64678, "epoch": 779} {"train_loss": -20.61389923095703, "global_step": 64679, "epoch": 779} {"train_loss": -20.30079460144043, "global_step": 64680, "epoch": 779} {"train_loss": -20.39204978942871, "global_step": 64681, "epoch": 779} {"train_loss": -20.651823043823242, "global_step": 64682, "epoch": 779} {"train_loss": -20.132171630859375, "global_step": 64683, "epoch": 779} {"train_loss": -20.78399085998535, "global_step": 64684, "epoch": 779} {"train_loss": -20.378686904907227, "global_step": 64685, "epoch": 779} {"train_loss": -20.704832077026367, "global_step": 64686, "epoch": 779} {"train_loss": -20.409753799438477, "global_step": 64687, "epoch": 779} {"train_loss": -20.67650032043457, "global_step": 64688, "epoch": 779} {"train_loss": -20.50611686706543, "global_step": 64689, "epoch": 779} {"train_loss": -20.705930709838867, "global_step": 64690, "epoch": 779} {"train_loss": -20.70855140686035, "global_step": 64691, "epoch": 779} {"train_loss": -20.342336654663086, "global_step": 64692, "epoch": 779} {"train_loss": -20.77337646484375, "global_step": 64693, "epoch": 779} {"train_loss": -20.240793228149414, "global_step": 64694, "epoch": 779} {"train_loss": -20.370283126831055, "global_step": 64695, "epoch": 779} {"train_loss": -20.568628311157227, "global_step": 64696, "epoch": 779} {"train_loss": -20.720701217651367, "global_step": 64697, "epoch": 779} {"train_loss": -20.22165298461914, "global_step": 64698, "epoch": 779} {"train_loss": -20.653440475463867, "global_step": 64699, "epoch": 779} {"train_loss": -20.248510360717773, "global_step": 64700, "epoch": 779} {"train_loss": -20.68259048461914, "global_step": 64701, "epoch": 779} {"train_loss": -20.827604293823242, "global_step": 64702, "epoch": 779} {"train_loss": -20.792282104492188, "global_step": 64703, "epoch": 779} {"train_loss": -20.653772354125977, "global_step": 64704, "epoch": 779} {"train_loss": -20.62787437438965, "global_step": 64705, "epoch": 779} {"train_loss": -20.864652633666992, "global_step": 64706, "epoch": 779} {"train_loss": -20.2250919342041, "global_step": 64707, "epoch": 779} {"train_loss": -20.47811508178711, "global_step": 64708, "epoch": 779} {"train_loss": -20.72430419921875, "global_step": 64709, "epoch": 779} {"train_loss": -20.5928897857666, "global_step": 64710, "epoch": 779} {"train_loss": -21.090482711791992, "global_step": 64711, "epoch": 779} {"train_loss": -20.373035430908203, "global_step": 64712, "epoch": 779} {"train_loss": -20.223623275756836, "global_step": 64713, "epoch": 779} {"train_loss": -20.574514389038086, "global_step": 64714, "epoch": 779} {"train_loss": -20.508316040039062, "global_step": 64715, "epoch": 779} {"train_loss": -20.466140747070312, "global_step": 64716, "epoch": 779} {"train_loss": -20.548171997070312, "global_step": 64717, "epoch": 779} {"train_loss": -20.45235252380371, "global_step": 64718, "epoch": 779} {"train_loss": -20.73729705810547, "global_step": 64719, "epoch": 779} {"train_loss": -20.629419326782227, "global_step": 64720, "epoch": 779} {"train_loss": -20.39223289489746, "global_step": 64721, "epoch": 779} {"train_loss": -20.659732818603516, "global_step": 64722, "epoch": 779} {"train_loss": -20.596181869506836, "global_step": 64723, "epoch": 779} {"train_loss": -20.97191619873047, "global_step": 64724, "epoch": 779} {"train_loss": -20.487224578857422, "global_step": 64725, "epoch": 779} {"train_loss": -20.975967407226562, "global_step": 64726, "epoch": 779} {"train_loss": -20.598674774169922, "global_step": 64727, "epoch": 779} {"train_loss": -20.620819091796875, "global_step": 64728, "epoch": 779} {"train_loss": -20.667409896850586, "global_step": 64729, "epoch": 779} {"train_loss": -20.59534454345703, "global_step": 64730, "epoch": 779} {"train_loss": -20.45357322692871, "global_step": 64731, "epoch": 779} {"train_loss": -20.480224609375, "global_step": 64732, "epoch": 779} {"train_loss": -20.7560977935791, "global_step": 64733, "epoch": 779} {"train_loss": -21.021150588989258, "global_step": 64734, "epoch": 779} {"train_loss": -20.915374755859375, "global_step": 64735, "epoch": 779} {"train_loss": -20.57204246520996, "global_step": 64736, "epoch": 779} {"train_loss": -20.620973587036133, "global_step": 64737, "epoch": 779} {"train_loss": -20.630619049072266, "global_step": 64738, "epoch": 779} {"train_loss": -20.542877381106457, "global_step": 64739, "epoch": 779, "val_loss": 6165767.0} {"train_loss": -20.5445499420166, "global_step": 64740, "epoch": 780} {"train_loss": -20.533063888549805, "global_step": 64741, "epoch": 780} {"train_loss": -20.347110748291016, "global_step": 64742, "epoch": 780} {"train_loss": -20.198423385620117, "global_step": 64743, "epoch": 780} {"train_loss": -20.433523178100586, "global_step": 64744, "epoch": 780} {"train_loss": -20.899499893188477, "global_step": 64745, "epoch": 780} {"train_loss": -20.437536239624023, "global_step": 64746, "epoch": 780} {"train_loss": -20.62763023376465, "global_step": 64747, "epoch": 780} {"train_loss": -20.6297607421875, "global_step": 64748, "epoch": 780} {"train_loss": -20.571760177612305, "global_step": 64749, "epoch": 780} {"train_loss": -20.612401962280273, "global_step": 64750, "epoch": 780} {"train_loss": -20.685022354125977, "global_step": 64751, "epoch": 780} {"train_loss": -20.87058448791504, "global_step": 64752, "epoch": 780} {"train_loss": -20.698720932006836, "global_step": 64753, "epoch": 780} {"train_loss": -20.48052215576172, "global_step": 64754, "epoch": 780} {"train_loss": -20.680757522583008, "global_step": 64755, "epoch": 780} {"train_loss": -20.874616622924805, "global_step": 64756, "epoch": 780} {"train_loss": -20.933717727661133, "global_step": 64757, "epoch": 780} {"train_loss": -20.786314010620117, "global_step": 64758, "epoch": 780} {"train_loss": -20.51605224609375, "global_step": 64759, "epoch": 780} {"train_loss": -20.490585327148438, "global_step": 64760, "epoch": 780} {"train_loss": -20.669517517089844, "global_step": 64761, "epoch": 780} {"train_loss": -20.569183349609375, "global_step": 64762, "epoch": 780} {"train_loss": -20.692337036132812, "global_step": 64763, "epoch": 780} {"train_loss": -20.668983459472656, "global_step": 64764, "epoch": 780} {"train_loss": -20.41131591796875, "global_step": 64765, "epoch": 780} {"train_loss": -20.583770751953125, "global_step": 64766, "epoch": 780} {"train_loss": -20.926738739013672, "global_step": 64767, "epoch": 780} {"train_loss": -20.431415557861328, "global_step": 64768, "epoch": 780} {"train_loss": -20.335800170898438, "global_step": 64769, "epoch": 780} {"train_loss": -20.526493072509766, "global_step": 64770, "epoch": 780} {"train_loss": -20.254602432250977, "global_step": 64771, "epoch": 780} {"train_loss": -20.279218673706055, "global_step": 64772, "epoch": 780} {"train_loss": -20.348783493041992, "global_step": 64773, "epoch": 780} {"train_loss": -20.6414794921875, "global_step": 64774, "epoch": 780} {"train_loss": -20.489852905273438, "global_step": 64775, "epoch": 780} {"train_loss": -20.680612564086914, "global_step": 64776, "epoch": 780} {"train_loss": -20.58218002319336, "global_step": 64777, "epoch": 780} {"train_loss": -20.63038444519043, "global_step": 64778, "epoch": 780} {"train_loss": -20.839496612548828, "global_step": 64779, "epoch": 780} {"train_loss": -20.383970260620117, "global_step": 64780, "epoch": 780} {"train_loss": -20.739471435546875, "global_step": 64781, "epoch": 780} {"train_loss": -20.491191864013672, "global_step": 64782, "epoch": 780} {"train_loss": -20.727632522583008, "global_step": 64783, "epoch": 780} {"train_loss": -20.742246627807617, "global_step": 64784, "epoch": 780} {"train_loss": -20.827054977416992, "global_step": 64785, "epoch": 780} {"train_loss": -20.93930435180664, "global_step": 64786, "epoch": 780} {"train_loss": -20.38726806640625, "global_step": 64787, "epoch": 780} {"train_loss": -20.70274543762207, "global_step": 64788, "epoch": 780} {"train_loss": -20.488265991210938, "global_step": 64789, "epoch": 780} {"train_loss": -20.780290603637695, "global_step": 64790, "epoch": 780} {"train_loss": -20.40862464904785, "global_step": 64791, "epoch": 780} {"train_loss": -20.224748611450195, "global_step": 64792, "epoch": 780} {"train_loss": -20.82656478881836, "global_step": 64793, "epoch": 780} {"train_loss": -20.5643253326416, "global_step": 64794, "epoch": 780} {"train_loss": -20.55388641357422, "global_step": 64795, "epoch": 780} {"train_loss": -20.87919807434082, "global_step": 64796, "epoch": 780} {"train_loss": -20.32777976989746, "global_step": 64797, "epoch": 780} {"train_loss": -20.71231460571289, "global_step": 64798, "epoch": 780} {"train_loss": -20.998859405517578, "global_step": 64799, "epoch": 780} {"train_loss": -20.600156784057617, "global_step": 64800, "epoch": 780} {"train_loss": -20.5682430267334, "global_step": 64801, "epoch": 780} {"train_loss": -20.477140426635742, "global_step": 64802, "epoch": 780} {"train_loss": -20.829282760620117, "global_step": 64803, "epoch": 780} {"train_loss": -20.389402389526367, "global_step": 64804, "epoch": 780} {"train_loss": -21.018735885620117, "global_step": 64805, "epoch": 780} {"train_loss": -20.124256134033203, "global_step": 64806, "epoch": 780} {"train_loss": -20.622358322143555, "global_step": 64807, "epoch": 780} {"train_loss": -20.529966354370117, "global_step": 64808, "epoch": 780} {"train_loss": -20.705036163330078, "global_step": 64809, "epoch": 780} {"train_loss": -20.447372436523438, "global_step": 64810, "epoch": 780} {"train_loss": -20.648847579956055, "global_step": 64811, "epoch": 780} {"train_loss": -20.60625648498535, "global_step": 64812, "epoch": 780} {"train_loss": -20.384706497192383, "global_step": 64813, "epoch": 780} {"train_loss": -20.4122371673584, "global_step": 64814, "epoch": 780} {"train_loss": -20.498977661132812, "global_step": 64815, "epoch": 780} {"train_loss": -20.38157081604004, "global_step": 64816, "epoch": 780} {"train_loss": -20.709819793701172, "global_step": 64817, "epoch": 780} {"train_loss": -20.3304386138916, "global_step": 64818, "epoch": 780} {"train_loss": -20.19764518737793, "global_step": 64819, "epoch": 780} {"train_loss": -20.411579132080078, "global_step": 64820, "epoch": 780} {"train_loss": -20.17073631286621, "global_step": 64821, "epoch": 780} {"train_loss": -20.574708088334784, "global_step": 64822, "epoch": 780, "val_loss": 5880983.5} {"train_loss": -19.435155868530273, "global_step": 64823, "epoch": 781} {"train_loss": -19.984622955322266, "global_step": 64824, "epoch": 781} {"train_loss": -20.007253646850586, "global_step": 64825, "epoch": 781} {"train_loss": -19.516376495361328, "global_step": 64826, "epoch": 781} {"train_loss": -19.745752334594727, "global_step": 64827, "epoch": 781} {"train_loss": -20.056087493896484, "global_step": 64828, "epoch": 781} {"train_loss": -20.00848960876465, "global_step": 64829, "epoch": 781} {"train_loss": -19.810300827026367, "global_step": 64830, "epoch": 781} {"train_loss": -20.543994903564453, "global_step": 64831, "epoch": 781} {"train_loss": -20.407337188720703, "global_step": 64832, "epoch": 781} {"train_loss": -20.55476188659668, "global_step": 64833, "epoch": 781} {"train_loss": -19.962352752685547, "global_step": 64834, "epoch": 781} {"train_loss": -20.445098876953125, "global_step": 64835, "epoch": 781} {"train_loss": -20.222816467285156, "global_step": 64836, "epoch": 781} {"train_loss": -20.382293701171875, "global_step": 64837, "epoch": 781} {"train_loss": -20.419687271118164, "global_step": 64838, "epoch": 781} {"train_loss": -20.660646438598633, "global_step": 64839, "epoch": 781} {"train_loss": -20.143909454345703, "global_step": 64840, "epoch": 781} {"train_loss": -20.12359619140625, "global_step": 64841, "epoch": 781} {"train_loss": -20.278356552124023, "global_step": 64842, "epoch": 781} {"train_loss": -20.27952003479004, "global_step": 64843, "epoch": 781} {"train_loss": -20.572927474975586, "global_step": 64844, "epoch": 781} {"train_loss": -20.47962760925293, "global_step": 64845, "epoch": 781} {"train_loss": -20.647275924682617, "global_step": 64846, "epoch": 781} {"train_loss": -20.423179626464844, "global_step": 64847, "epoch": 781} {"train_loss": -20.357389450073242, "global_step": 64848, "epoch": 781} {"train_loss": -20.530420303344727, "global_step": 64849, "epoch": 781} {"train_loss": -20.73463249206543, "global_step": 64850, "epoch": 781} {"train_loss": -20.355987548828125, "global_step": 64851, "epoch": 781} {"train_loss": -20.80331802368164, "global_step": 64852, "epoch": 781} {"train_loss": -20.20985221862793, "global_step": 64853, "epoch": 781} {"train_loss": -20.301284790039062, "global_step": 64854, "epoch": 781} {"train_loss": -20.63055419921875, "global_step": 64855, "epoch": 781} {"train_loss": -20.453886032104492, "global_step": 64856, "epoch": 781} {"train_loss": -20.701248168945312, "global_step": 64857, "epoch": 781} {"train_loss": -20.542251586914062, "global_step": 64858, "epoch": 781} {"train_loss": -20.735340118408203, "global_step": 64859, "epoch": 781} {"train_loss": -20.415943145751953, "global_step": 64860, "epoch": 781} {"train_loss": -20.694486618041992, "global_step": 64861, "epoch": 781} {"train_loss": -20.740476608276367, "global_step": 64862, "epoch": 781} {"train_loss": -20.398630142211914, "global_step": 64863, "epoch": 781} {"train_loss": -20.262121200561523, "global_step": 64864, "epoch": 781} {"train_loss": -20.435047149658203, "global_step": 64865, "epoch": 781} {"train_loss": -20.731693267822266, "global_step": 64866, "epoch": 781} {"train_loss": -20.495298385620117, "global_step": 64867, "epoch": 781} {"train_loss": -20.25807762145996, "global_step": 64868, "epoch": 781} {"train_loss": -20.756336212158203, "global_step": 64869, "epoch": 781} {"train_loss": -20.39255142211914, "global_step": 64870, "epoch": 781} {"train_loss": -20.602460861206055, "global_step": 64871, "epoch": 781} {"train_loss": -20.718481063842773, "global_step": 64872, "epoch": 781} {"train_loss": -20.701608657836914, "global_step": 64873, "epoch": 781} {"train_loss": -20.659809112548828, "global_step": 64874, "epoch": 781} {"train_loss": -20.473779678344727, "global_step": 64875, "epoch": 781} {"train_loss": -20.57792854309082, "global_step": 64876, "epoch": 781} {"train_loss": -20.409292221069336, "global_step": 64877, "epoch": 781} {"train_loss": -20.376550674438477, "global_step": 64878, "epoch": 781} {"train_loss": -20.75929832458496, "global_step": 64879, "epoch": 781} {"train_loss": -20.86028289794922, "global_step": 64880, "epoch": 781} {"train_loss": -20.875991821289062, "global_step": 64881, "epoch": 781} {"train_loss": -20.758100509643555, "global_step": 64882, "epoch": 781} {"train_loss": -20.806726455688477, "global_step": 64883, "epoch": 781} {"train_loss": -20.642532348632812, "global_step": 64884, "epoch": 781} {"train_loss": -21.171247482299805, "global_step": 64885, "epoch": 781} {"train_loss": -20.539793014526367, "global_step": 64886, "epoch": 781} {"train_loss": -20.421262741088867, "global_step": 64887, "epoch": 781} {"train_loss": -20.900894165039062, "global_step": 64888, "epoch": 781} {"train_loss": -20.489154815673828, "global_step": 64889, "epoch": 781} {"train_loss": -20.612611770629883, "global_step": 64890, "epoch": 781} {"train_loss": -20.495370864868164, "global_step": 64891, "epoch": 781} {"train_loss": -20.374231338500977, "global_step": 64892, "epoch": 781} {"train_loss": -20.352840423583984, "global_step": 64893, "epoch": 781} {"train_loss": -20.49640464782715, "global_step": 64894, "epoch": 781} {"train_loss": -20.563695907592773, "global_step": 64895, "epoch": 781} {"train_loss": -20.894262313842773, "global_step": 64896, "epoch": 781} {"train_loss": -20.815933227539062, "global_step": 64897, "epoch": 781} {"train_loss": -20.31451416015625, "global_step": 64898, "epoch": 781} {"train_loss": -20.590246200561523, "global_step": 64899, "epoch": 781} {"train_loss": -20.655210494995117, "global_step": 64900, "epoch": 781} {"train_loss": -20.761411666870117, "global_step": 64901, "epoch": 781} {"train_loss": -20.48270034790039, "global_step": 64902, "epoch": 781} {"train_loss": -20.25234603881836, "global_step": 64903, "epoch": 781} {"train_loss": -20.580020904541016, "global_step": 64904, "epoch": 781} {"train_loss": -20.47824436785227, "global_step": 64905, "epoch": 781, "val_loss": 6058253.5} {"train_loss": -20.031614303588867, "global_step": 64906, "epoch": 782} {"train_loss": -20.118507385253906, "global_step": 64907, "epoch": 782} {"train_loss": -20.348495483398438, "global_step": 64908, "epoch": 782} {"train_loss": -20.41733741760254, "global_step": 64909, "epoch": 782} {"train_loss": -20.605052947998047, "global_step": 64910, "epoch": 782} {"train_loss": -20.560514450073242, "global_step": 64911, "epoch": 782} {"train_loss": -20.504619598388672, "global_step": 64912, "epoch": 782} {"train_loss": -20.32990837097168, "global_step": 64913, "epoch": 782} {"train_loss": -20.38932228088379, "global_step": 64914, "epoch": 782} {"train_loss": -20.59432029724121, "global_step": 64915, "epoch": 782} {"train_loss": -20.246580123901367, "global_step": 64916, "epoch": 782} {"train_loss": -20.712879180908203, "global_step": 64917, "epoch": 782} {"train_loss": -20.482755661010742, "global_step": 64918, "epoch": 782} {"train_loss": -20.757150650024414, "global_step": 64919, "epoch": 782} {"train_loss": -20.27288818359375, "global_step": 64920, "epoch": 782} {"train_loss": -20.305343627929688, "global_step": 64921, "epoch": 782} {"train_loss": -20.51796531677246, "global_step": 64922, "epoch": 782} {"train_loss": -20.59507179260254, "global_step": 64923, "epoch": 782} {"train_loss": -20.56305503845215, "global_step": 64924, "epoch": 782} {"train_loss": -20.444551467895508, "global_step": 64925, "epoch": 782} {"train_loss": -20.63606071472168, "global_step": 64926, "epoch": 782} {"train_loss": -20.455167770385742, "global_step": 64927, "epoch": 782} {"train_loss": -20.69524574279785, "global_step": 64928, "epoch": 782} {"train_loss": -20.444398880004883, "global_step": 64929, "epoch": 782} {"train_loss": -20.4739933013916, "global_step": 64930, "epoch": 782} {"train_loss": -20.997623443603516, "global_step": 64931, "epoch": 782} {"train_loss": -20.736913681030273, "global_step": 64932, "epoch": 782} {"train_loss": -20.700510025024414, "global_step": 64933, "epoch": 782} {"train_loss": -20.60610008239746, "global_step": 64934, "epoch": 782} {"train_loss": -20.67029571533203, "global_step": 64935, "epoch": 782} {"train_loss": -20.550411224365234, "global_step": 64936, "epoch": 782} {"train_loss": -20.671499252319336, "global_step": 64937, "epoch": 782} {"train_loss": -20.798986434936523, "global_step": 64938, "epoch": 782} {"train_loss": -20.365915298461914, "global_step": 64939, "epoch": 782} {"train_loss": -20.62032127380371, "global_step": 64940, "epoch": 782} {"train_loss": -20.67159080505371, "global_step": 64941, "epoch": 782} {"train_loss": -20.584707260131836, "global_step": 64942, "epoch": 782} {"train_loss": -20.365507125854492, "global_step": 64943, "epoch": 782} {"train_loss": -20.458608627319336, "global_step": 64944, "epoch": 782} {"train_loss": -20.71689224243164, "global_step": 64945, "epoch": 782} {"train_loss": -20.927961349487305, "global_step": 64946, "epoch": 782} {"train_loss": -20.461986541748047, "global_step": 64947, "epoch": 782} {"train_loss": -20.160980224609375, "global_step": 64948, "epoch": 782} {"train_loss": -20.36858558654785, "global_step": 64949, "epoch": 782} {"train_loss": -20.854297637939453, "global_step": 64950, "epoch": 782} {"train_loss": -20.663755416870117, "global_step": 64951, "epoch": 782} {"train_loss": -20.674560546875, "global_step": 64952, "epoch": 782} {"train_loss": -20.853206634521484, "global_step": 64953, "epoch": 782} {"train_loss": -20.65934944152832, "global_step": 64954, "epoch": 782} {"train_loss": -20.845508575439453, "global_step": 64955, "epoch": 782} {"train_loss": -20.29991912841797, "global_step": 64956, "epoch": 782} {"train_loss": -20.876861572265625, "global_step": 64957, "epoch": 782} {"train_loss": -20.721155166625977, "global_step": 64958, "epoch": 782} {"train_loss": -20.826175689697266, "global_step": 64959, "epoch": 782} {"train_loss": -20.59120750427246, "global_step": 64960, "epoch": 782} {"train_loss": -20.429288864135742, "global_step": 64961, "epoch": 782} {"train_loss": -20.668197631835938, "global_step": 64962, "epoch": 782} {"train_loss": -20.838207244873047, "global_step": 64963, "epoch": 782} {"train_loss": -20.512893676757812, "global_step": 64964, "epoch": 782} {"train_loss": -20.760412216186523, "global_step": 64965, "epoch": 782} {"train_loss": -20.44279670715332, "global_step": 64966, "epoch": 782} {"train_loss": -20.704954147338867, "global_step": 64967, "epoch": 782} {"train_loss": -20.499330520629883, "global_step": 64968, "epoch": 782} {"train_loss": -20.513568878173828, "global_step": 64969, "epoch": 782} {"train_loss": -20.79518699645996, "global_step": 64970, "epoch": 782} {"train_loss": -21.118362426757812, "global_step": 64971, "epoch": 782} {"train_loss": -20.65005874633789, "global_step": 64972, "epoch": 782} {"train_loss": -20.414445877075195, "global_step": 64973, "epoch": 782} {"train_loss": -20.84255027770996, "global_step": 64974, "epoch": 782} {"train_loss": -20.376052856445312, "global_step": 64975, "epoch": 782} {"train_loss": -20.753141403198242, "global_step": 64976, "epoch": 782} {"train_loss": -20.845487594604492, "global_step": 64977, "epoch": 782} {"train_loss": -20.461978912353516, "global_step": 64978, "epoch": 782} {"train_loss": -20.981494903564453, "global_step": 64979, "epoch": 782} {"train_loss": -20.54438591003418, "global_step": 64980, "epoch": 782} {"train_loss": -20.43328285217285, "global_step": 64981, "epoch": 782} {"train_loss": -20.507598876953125, "global_step": 64982, "epoch": 782} {"train_loss": -20.64252471923828, "global_step": 64983, "epoch": 782} {"train_loss": -20.875019073486328, "global_step": 64984, "epoch": 782} {"train_loss": -20.54250144958496, "global_step": 64985, "epoch": 782} {"train_loss": -20.52530860900879, "global_step": 64986, "epoch": 782} {"train_loss": -20.605993270874023, "global_step": 64987, "epoch": 782} {"train_loss": -20.587827383753766, "global_step": 64988, "epoch": 782, "val_loss": 5991405.0} {"train_loss": -20.304365158081055, "global_step": 64989, "epoch": 783} {"train_loss": -20.482816696166992, "global_step": 64990, "epoch": 783} {"train_loss": -20.60204315185547, "global_step": 64991, "epoch": 783} {"train_loss": -20.296262741088867, "global_step": 64992, "epoch": 783} {"train_loss": -20.56206703186035, "global_step": 64993, "epoch": 783} {"train_loss": -20.590269088745117, "global_step": 64994, "epoch": 783} {"train_loss": -20.21393585205078, "global_step": 64995, "epoch": 783} {"train_loss": -20.61125373840332, "global_step": 64996, "epoch": 783} {"train_loss": -20.216598510742188, "global_step": 64997, "epoch": 783} {"train_loss": -20.208927154541016, "global_step": 64998, "epoch": 783} {"train_loss": -20.36884117126465, "global_step": 64999, "epoch": 783} {"train_loss": -20.628734588623047, "global_step": 65000, "epoch": 783} {"train_loss": -20.30191421508789, "global_step": 65001, "epoch": 783} {"train_loss": -20.84384536743164, "global_step": 65002, "epoch": 783} {"train_loss": -20.216320037841797, "global_step": 65003, "epoch": 783} {"train_loss": -20.259740829467773, "global_step": 65004, "epoch": 783} {"train_loss": -20.40044403076172, "global_step": 65005, "epoch": 783} {"train_loss": -20.475427627563477, "global_step": 65006, "epoch": 783} {"train_loss": -20.6472110748291, "global_step": 65007, "epoch": 783} {"train_loss": -20.821569442749023, "global_step": 65008, "epoch": 783} {"train_loss": -20.867679595947266, "global_step": 65009, "epoch": 783} {"train_loss": -20.24368667602539, "global_step": 65010, "epoch": 783} {"train_loss": -20.441118240356445, "global_step": 65011, "epoch": 783} {"train_loss": -20.553932189941406, "global_step": 65012, "epoch": 783} {"train_loss": -20.375272750854492, "global_step": 65013, "epoch": 783} {"train_loss": -20.152664184570312, "global_step": 65014, "epoch": 783} {"train_loss": -20.696439743041992, "global_step": 65015, "epoch": 783} {"train_loss": -20.50876808166504, "global_step": 65016, "epoch": 783} {"train_loss": -20.36307716369629, "global_step": 65017, "epoch": 783} {"train_loss": -20.524749755859375, "global_step": 65018, "epoch": 783} {"train_loss": -20.79297637939453, "global_step": 65019, "epoch": 783} {"train_loss": -20.450735092163086, "global_step": 65020, "epoch": 783} {"train_loss": -20.60957145690918, "global_step": 65021, "epoch": 783} {"train_loss": -20.62739372253418, "global_step": 65022, "epoch": 783} {"train_loss": -20.601774215698242, "global_step": 65023, "epoch": 783} {"train_loss": -20.90471076965332, "global_step": 65024, "epoch": 783} {"train_loss": -20.748659133911133, "global_step": 65025, "epoch": 783} {"train_loss": -20.65460777282715, "global_step": 65026, "epoch": 783} {"train_loss": -21.314870834350586, "global_step": 65027, "epoch": 783} {"train_loss": -20.41019630432129, "global_step": 65028, "epoch": 783} {"train_loss": -20.931737899780273, "global_step": 65029, "epoch": 783} {"train_loss": -20.67569923400879, "global_step": 65030, "epoch": 783} {"train_loss": -20.606061935424805, "global_step": 65031, "epoch": 783} {"train_loss": -20.876026153564453, "global_step": 65032, "epoch": 783} {"train_loss": -20.64752769470215, "global_step": 65033, "epoch": 783} {"train_loss": -20.55201530456543, "global_step": 65034, "epoch": 783} {"train_loss": -20.54582977294922, "global_step": 65035, "epoch": 783} {"train_loss": -20.474050521850586, "global_step": 65036, "epoch": 783} {"train_loss": -20.886173248291016, "global_step": 65037, "epoch": 783} {"train_loss": -20.76798439025879, "global_step": 65038, "epoch": 783} {"train_loss": -20.532896041870117, "global_step": 65039, "epoch": 783} {"train_loss": -20.766376495361328, "global_step": 65040, "epoch": 783} {"train_loss": -19.941402435302734, "global_step": 65041, "epoch": 783} {"train_loss": -20.5364990234375, "global_step": 65042, "epoch": 783} {"train_loss": -20.51809310913086, "global_step": 65043, "epoch": 783} {"train_loss": -20.532241821289062, "global_step": 65044, "epoch": 783} {"train_loss": -20.469141006469727, "global_step": 65045, "epoch": 783} {"train_loss": -20.321943283081055, "global_step": 65046, "epoch": 783} {"train_loss": -20.8983211517334, "global_step": 65047, "epoch": 783} {"train_loss": -20.170995712280273, "global_step": 65048, "epoch": 783} {"train_loss": -20.607864379882812, "global_step": 65049, "epoch": 783} {"train_loss": -20.944936752319336, "global_step": 65050, "epoch": 783} {"train_loss": -20.333158493041992, "global_step": 65051, "epoch": 783} {"train_loss": -20.884502410888672, "global_step": 65052, "epoch": 783} {"train_loss": -20.829410552978516, "global_step": 65053, "epoch": 783} {"train_loss": -20.68097496032715, "global_step": 65054, "epoch": 783} {"train_loss": -20.781105041503906, "global_step": 65055, "epoch": 783} {"train_loss": -20.637632369995117, "global_step": 65056, "epoch": 783} {"train_loss": -20.981721878051758, "global_step": 65057, "epoch": 783} {"train_loss": -20.609020233154297, "global_step": 65058, "epoch": 783} {"train_loss": -20.655860900878906, "global_step": 65059, "epoch": 783} {"train_loss": -20.340335845947266, "global_step": 65060, "epoch": 783} {"train_loss": -20.632551193237305, "global_step": 65061, "epoch": 783} {"train_loss": -20.70586395263672, "global_step": 65062, "epoch": 783} {"train_loss": -20.938770294189453, "global_step": 65063, "epoch": 783} {"train_loss": -20.640989303588867, "global_step": 65064, "epoch": 783} {"train_loss": -20.66168785095215, "global_step": 65065, "epoch": 783} {"train_loss": -20.853628158569336, "global_step": 65066, "epoch": 783} {"train_loss": -20.167936325073242, "global_step": 65067, "epoch": 783} {"train_loss": -20.803552627563477, "global_step": 65068, "epoch": 783} {"train_loss": -20.62967300415039, "global_step": 65069, "epoch": 783} {"train_loss": -20.47566795349121, "global_step": 65070, "epoch": 783} {"train_loss": -20.59652098690171, "global_step": 65071, "epoch": 783, "val_loss": 5924410.5} {"train_loss": -19.8077335357666, "global_step": 65072, "epoch": 784} {"train_loss": -20.584707260131836, "global_step": 65073, "epoch": 784} {"train_loss": -19.919845581054688, "global_step": 65074, "epoch": 784} {"train_loss": -20.437074661254883, "global_step": 65075, "epoch": 784} {"train_loss": -19.77283477783203, "global_step": 65076, "epoch": 784} {"train_loss": -20.578397750854492, "global_step": 65077, "epoch": 784} {"train_loss": -20.326719284057617, "global_step": 65078, "epoch": 784} {"train_loss": -20.76546287536621, "global_step": 65079, "epoch": 784} {"train_loss": -20.49712562561035, "global_step": 65080, "epoch": 784} {"train_loss": -20.374067306518555, "global_step": 65081, "epoch": 784} {"train_loss": -20.353574752807617, "global_step": 65082, "epoch": 784} {"train_loss": -20.08217430114746, "global_step": 65083, "epoch": 784} {"train_loss": -20.701374053955078, "global_step": 65084, "epoch": 784} {"train_loss": -20.3303279876709, "global_step": 65085, "epoch": 784} {"train_loss": -20.796979904174805, "global_step": 65086, "epoch": 784} {"train_loss": -20.291791915893555, "global_step": 65087, "epoch": 784} {"train_loss": -20.18286895751953, "global_step": 65088, "epoch": 784} {"train_loss": -20.50462532043457, "global_step": 65089, "epoch": 784} {"train_loss": -20.621763229370117, "global_step": 65090, "epoch": 784} {"train_loss": -20.803909301757812, "global_step": 65091, "epoch": 784} {"train_loss": -20.80935287475586, "global_step": 65092, "epoch": 784} {"train_loss": -20.930662155151367, "global_step": 65093, "epoch": 784} {"train_loss": -20.484373092651367, "global_step": 65094, "epoch": 784} {"train_loss": -20.878433227539062, "global_step": 65095, "epoch": 784} {"train_loss": -20.744800567626953, "global_step": 65096, "epoch": 784} {"train_loss": -20.657516479492188, "global_step": 65097, "epoch": 784} {"train_loss": -20.327152252197266, "global_step": 65098, "epoch": 784} {"train_loss": -20.427196502685547, "global_step": 65099, "epoch": 784} {"train_loss": -20.602752685546875, "global_step": 65100, "epoch": 784} {"train_loss": -20.803020477294922, "global_step": 65101, "epoch": 784} {"train_loss": -20.3684024810791, "global_step": 65102, "epoch": 784} {"train_loss": -20.4652099609375, "global_step": 65103, "epoch": 784} {"train_loss": -20.616195678710938, "global_step": 65104, "epoch": 784} {"train_loss": -20.508304595947266, "global_step": 65105, "epoch": 784} {"train_loss": -20.82120132446289, "global_step": 65106, "epoch": 784} {"train_loss": -20.853363037109375, "global_step": 65107, "epoch": 784} {"train_loss": -20.826400756835938, "global_step": 65108, "epoch": 784} {"train_loss": -20.413970947265625, "global_step": 65109, "epoch": 784} {"train_loss": -20.383913040161133, "global_step": 65110, "epoch": 784} {"train_loss": -20.26881217956543, "global_step": 65111, "epoch": 784} {"train_loss": -20.495052337646484, "global_step": 65112, "epoch": 784} {"train_loss": -20.65416717529297, "global_step": 65113, "epoch": 784} {"train_loss": -20.737735748291016, "global_step": 65114, "epoch": 784} {"train_loss": -20.641103744506836, "global_step": 65115, "epoch": 784} {"train_loss": -20.42037010192871, "global_step": 65116, "epoch": 784} {"train_loss": -20.34450340270996, "global_step": 65117, "epoch": 784} {"train_loss": -20.695051193237305, "global_step": 65118, "epoch": 784} {"train_loss": -20.980283737182617, "global_step": 65119, "epoch": 784} {"train_loss": -20.638687133789062, "global_step": 65120, "epoch": 784} {"train_loss": -20.62619400024414, "global_step": 65121, "epoch": 784} {"train_loss": -20.275571823120117, "global_step": 65122, "epoch": 784} {"train_loss": -20.737442016601562, "global_step": 65123, "epoch": 784} {"train_loss": -20.210519790649414, "global_step": 65124, "epoch": 784} {"train_loss": -21.19251823425293, "global_step": 65125, "epoch": 784} {"train_loss": -21.02338218688965, "global_step": 65126, "epoch": 784} {"train_loss": -20.489416122436523, "global_step": 65127, "epoch": 784} {"train_loss": -20.634672164916992, "global_step": 65128, "epoch": 784} {"train_loss": -20.8441104888916, "global_step": 65129, "epoch": 784} {"train_loss": -20.621240615844727, "global_step": 65130, "epoch": 784} {"train_loss": -20.64130210876465, "global_step": 65131, "epoch": 784} {"train_loss": -20.604400634765625, "global_step": 65132, "epoch": 784} {"train_loss": -20.761051177978516, "global_step": 65133, "epoch": 784} {"train_loss": -20.596572875976562, "global_step": 65134, "epoch": 784} {"train_loss": -20.334260940551758, "global_step": 65135, "epoch": 784} {"train_loss": -20.419921875, "global_step": 65136, "epoch": 784} {"train_loss": -20.73383903503418, "global_step": 65137, "epoch": 784} {"train_loss": -20.82283592224121, "global_step": 65138, "epoch": 784} {"train_loss": -20.9677677154541, "global_step": 65139, "epoch": 784} {"train_loss": -20.78245735168457, "global_step": 65140, "epoch": 784} {"train_loss": -20.907995223999023, "global_step": 65141, "epoch": 784} {"train_loss": -20.652881622314453, "global_step": 65142, "epoch": 784} {"train_loss": -20.518123626708984, "global_step": 65143, "epoch": 784} {"train_loss": -21.152982711791992, "global_step": 65144, "epoch": 784} {"train_loss": -20.865478515625, "global_step": 65145, "epoch": 784} {"train_loss": -20.769739151000977, "global_step": 65146, "epoch": 784} {"train_loss": -20.819732666015625, "global_step": 65147, "epoch": 784} {"train_loss": -20.433109283447266, "global_step": 65148, "epoch": 784} {"train_loss": -20.601686477661133, "global_step": 65149, "epoch": 784} {"train_loss": -20.8397159576416, "global_step": 65150, "epoch": 784} {"train_loss": -20.778152465820312, "global_step": 65151, "epoch": 784} {"train_loss": -20.5305233001709, "global_step": 65152, "epoch": 784} {"train_loss": -20.432716369628906, "global_step": 65153, "epoch": 784} {"train_loss": -20.60993325566671, "global_step": 65154, "epoch": 784, "val_loss": 5962632.0} {"train_loss": -19.465925216674805, "global_step": 65155, "epoch": 785} {"train_loss": -19.529315948486328, "global_step": 65156, "epoch": 785} {"train_loss": -20.234067916870117, "global_step": 65157, "epoch": 785} {"train_loss": -20.134761810302734, "global_step": 65158, "epoch": 785} {"train_loss": -19.871610641479492, "global_step": 65159, "epoch": 785} {"train_loss": -20.522449493408203, "global_step": 65160, "epoch": 785} {"train_loss": -20.515796661376953, "global_step": 65161, "epoch": 785} {"train_loss": -20.628347396850586, "global_step": 65162, "epoch": 785} {"train_loss": -20.286239624023438, "global_step": 65163, "epoch": 785} {"train_loss": -20.2742977142334, "global_step": 65164, "epoch": 785} {"train_loss": -20.303003311157227, "global_step": 65165, "epoch": 785} {"train_loss": -20.27536392211914, "global_step": 65166, "epoch": 785} {"train_loss": -20.43830108642578, "global_step": 65167, "epoch": 785} {"train_loss": -20.696569442749023, "global_step": 65168, "epoch": 785} {"train_loss": -20.52147102355957, "global_step": 65169, "epoch": 785} {"train_loss": -20.664302825927734, "global_step": 65170, "epoch": 785} {"train_loss": -20.62221908569336, "global_step": 65171, "epoch": 785} {"train_loss": -20.625696182250977, "global_step": 65172, "epoch": 785} {"train_loss": -20.74936866760254, "global_step": 65173, "epoch": 785} {"train_loss": -20.274436950683594, "global_step": 65174, "epoch": 785} {"train_loss": -20.730375289916992, "global_step": 65175, "epoch": 785} {"train_loss": -20.29212760925293, "global_step": 65176, "epoch": 785} {"train_loss": -20.80768585205078, "global_step": 65177, "epoch": 785} {"train_loss": -20.509807586669922, "global_step": 65178, "epoch": 785} {"train_loss": -20.74884796142578, "global_step": 65179, "epoch": 785} {"train_loss": -20.664512634277344, "global_step": 65180, "epoch": 785} {"train_loss": -20.6527099609375, "global_step": 65181, "epoch": 785} {"train_loss": -20.58121109008789, "global_step": 65182, "epoch": 785} {"train_loss": -20.4633731842041, "global_step": 65183, "epoch": 785} {"train_loss": -20.76566505432129, "global_step": 65184, "epoch": 785} {"train_loss": -20.921390533447266, "global_step": 65185, "epoch": 785} {"train_loss": -20.53253936767578, "global_step": 65186, "epoch": 785} {"train_loss": -20.525266647338867, "global_step": 65187, "epoch": 785} {"train_loss": -20.718015670776367, "global_step": 65188, "epoch": 785} {"train_loss": -20.112747192382812, "global_step": 65189, "epoch": 785} {"train_loss": -20.699758529663086, "global_step": 65190, "epoch": 785} {"train_loss": -21.078975677490234, "global_step": 65191, "epoch": 785} {"train_loss": -20.72316551208496, "global_step": 65192, "epoch": 785} {"train_loss": -20.43056297302246, "global_step": 65193, "epoch": 785} {"train_loss": -20.323535919189453, "global_step": 65194, "epoch": 785} {"train_loss": -20.70549964904785, "global_step": 65195, "epoch": 785} {"train_loss": -20.671293258666992, "global_step": 65196, "epoch": 785} {"train_loss": -20.650741577148438, "global_step": 65197, "epoch": 785} {"train_loss": -20.207258224487305, "global_step": 65198, "epoch": 785} {"train_loss": -20.714218139648438, "global_step": 65199, "epoch": 785} {"train_loss": -20.270309448242188, "global_step": 65200, "epoch": 785} {"train_loss": -20.913318634033203, "global_step": 65201, "epoch": 785} {"train_loss": -20.919103622436523, "global_step": 65202, "epoch": 785} {"train_loss": -20.28223991394043, "global_step": 65203, "epoch": 785} {"train_loss": -20.904573440551758, "global_step": 65204, "epoch": 785} {"train_loss": -20.505342483520508, "global_step": 65205, "epoch": 785} {"train_loss": -20.724716186523438, "global_step": 65206, "epoch": 785} {"train_loss": -20.576797485351562, "global_step": 65207, "epoch": 785} {"train_loss": -20.769311904907227, "global_step": 65208, "epoch": 785} {"train_loss": -20.942609786987305, "global_step": 65209, "epoch": 785} {"train_loss": -20.600706100463867, "global_step": 65210, "epoch": 785} {"train_loss": -20.406503677368164, "global_step": 65211, "epoch": 785} {"train_loss": -20.52124786376953, "global_step": 65212, "epoch": 785} {"train_loss": -20.123632431030273, "global_step": 65213, "epoch": 785} {"train_loss": -20.097251892089844, "global_step": 65214, "epoch": 785} {"train_loss": -20.69666290283203, "global_step": 65215, "epoch": 785} {"train_loss": -20.356199264526367, "global_step": 65216, "epoch": 785} {"train_loss": -21.06242561340332, "global_step": 65217, "epoch": 785} {"train_loss": -20.659343719482422, "global_step": 65218, "epoch": 785} {"train_loss": -20.790693283081055, "global_step": 65219, "epoch": 785} {"train_loss": -20.97662925720215, "global_step": 65220, "epoch": 785} {"train_loss": -21.114233016967773, "global_step": 65221, "epoch": 785} {"train_loss": -20.638961791992188, "global_step": 65222, "epoch": 785} {"train_loss": -20.275638580322266, "global_step": 65223, "epoch": 785} {"train_loss": -20.806074142456055, "global_step": 65224, "epoch": 785} {"train_loss": -20.554967880249023, "global_step": 65225, "epoch": 785} {"train_loss": -20.302001953125, "global_step": 65226, "epoch": 785} {"train_loss": -20.453840255737305, "global_step": 65227, "epoch": 785} {"train_loss": -20.446308135986328, "global_step": 65228, "epoch": 785} {"train_loss": -20.67043113708496, "global_step": 65229, "epoch": 785} {"train_loss": -20.35404396057129, "global_step": 65230, "epoch": 785} {"train_loss": -20.460651397705078, "global_step": 65231, "epoch": 785} {"train_loss": -20.656660079956055, "global_step": 65232, "epoch": 785} {"train_loss": -20.319610595703125, "global_step": 65233, "epoch": 785} {"train_loss": -20.40657615661621, "global_step": 65234, "epoch": 785} {"train_loss": -20.903791427612305, "global_step": 65235, "epoch": 785} {"train_loss": -20.451753616333008, "global_step": 65236, "epoch": 785} {"train_loss": -20.54605798836214, "global_step": 65237, "epoch": 785, "val_loss": 5936513.0} {"train_loss": -19.7912654876709, "global_step": 65238, "epoch": 786} {"train_loss": -20.30602264404297, "global_step": 65239, "epoch": 786} {"train_loss": -20.19902801513672, "global_step": 65240, "epoch": 786} {"train_loss": -20.592100143432617, "global_step": 65241, "epoch": 786} {"train_loss": -20.284366607666016, "global_step": 65242, "epoch": 786} {"train_loss": -20.11105728149414, "global_step": 65243, "epoch": 786} {"train_loss": -20.507369995117188, "global_step": 65244, "epoch": 786} {"train_loss": -20.649667739868164, "global_step": 65245, "epoch": 786} {"train_loss": -20.3885555267334, "global_step": 65246, "epoch": 786} {"train_loss": -20.370643615722656, "global_step": 65247, "epoch": 786} {"train_loss": -20.3979434967041, "global_step": 65248, "epoch": 786} {"train_loss": -20.450883865356445, "global_step": 65249, "epoch": 786} {"train_loss": -20.574193954467773, "global_step": 65250, "epoch": 786} {"train_loss": -20.59065055847168, "global_step": 65251, "epoch": 786} {"train_loss": -20.8214111328125, "global_step": 65252, "epoch": 786} {"train_loss": -20.377391815185547, "global_step": 65253, "epoch": 786} {"train_loss": -20.6296329498291, "global_step": 65254, "epoch": 786} {"train_loss": -20.713720321655273, "global_step": 65255, "epoch": 786} {"train_loss": -20.698928833007812, "global_step": 65256, "epoch": 786} {"train_loss": -20.811689376831055, "global_step": 65257, "epoch": 786} {"train_loss": -20.46735191345215, "global_step": 65258, "epoch": 786} {"train_loss": -20.553264617919922, "global_step": 65259, "epoch": 786} {"train_loss": -20.59063148498535, "global_step": 65260, "epoch": 786} {"train_loss": -20.85060691833496, "global_step": 65261, "epoch": 786} {"train_loss": -20.420196533203125, "global_step": 65262, "epoch": 786} {"train_loss": -20.5830135345459, "global_step": 65263, "epoch": 786} {"train_loss": -20.85860252380371, "global_step": 65264, "epoch": 786} {"train_loss": -20.32423210144043, "global_step": 65265, "epoch": 786} {"train_loss": -20.62779998779297, "global_step": 65266, "epoch": 786} {"train_loss": -20.646738052368164, "global_step": 65267, "epoch": 786} {"train_loss": -20.478607177734375, "global_step": 65268, "epoch": 786} {"train_loss": -20.64595603942871, "global_step": 65269, "epoch": 786} {"train_loss": -20.56172752380371, "global_step": 65270, "epoch": 786} {"train_loss": -20.866708755493164, "global_step": 65271, "epoch": 786} {"train_loss": -20.697967529296875, "global_step": 65272, "epoch": 786} {"train_loss": -20.676374435424805, "global_step": 65273, "epoch": 786} {"train_loss": -20.959699630737305, "global_step": 65274, "epoch": 786} {"train_loss": -20.708545684814453, "global_step": 65275, "epoch": 786} {"train_loss": -20.78497886657715, "global_step": 65276, "epoch": 786} {"train_loss": -20.644758224487305, "global_step": 65277, "epoch": 786} {"train_loss": -20.509756088256836, "global_step": 65278, "epoch": 786} {"train_loss": -20.853662490844727, "global_step": 65279, "epoch": 786} {"train_loss": -20.816791534423828, "global_step": 65280, "epoch": 786} {"train_loss": -20.749170303344727, "global_step": 65281, "epoch": 786} {"train_loss": -20.26565170288086, "global_step": 65282, "epoch": 786} {"train_loss": -20.618864059448242, "global_step": 65283, "epoch": 786} {"train_loss": -20.652271270751953, "global_step": 65284, "epoch": 786} {"train_loss": -20.647464752197266, "global_step": 65285, "epoch": 786} {"train_loss": -20.564823150634766, "global_step": 65286, "epoch": 786} {"train_loss": -20.870140075683594, "global_step": 65287, "epoch": 786} {"train_loss": -20.877954483032227, "global_step": 65288, "epoch": 786} {"train_loss": -20.970489501953125, "global_step": 65289, "epoch": 786} {"train_loss": -20.635282516479492, "global_step": 65290, "epoch": 786} {"train_loss": -20.43684959411621, "global_step": 65291, "epoch": 786} {"train_loss": -20.595304489135742, "global_step": 65292, "epoch": 786} {"train_loss": -20.538490295410156, "global_step": 65293, "epoch": 786} {"train_loss": -20.48426628112793, "global_step": 65294, "epoch": 786} {"train_loss": -20.829391479492188, "global_step": 65295, "epoch": 786} {"train_loss": -20.474365234375, "global_step": 65296, "epoch": 786} {"train_loss": -21.148618698120117, "global_step": 65297, "epoch": 786} {"train_loss": -20.64571189880371, "global_step": 65298, "epoch": 786} {"train_loss": -20.445526123046875, "global_step": 65299, "epoch": 786} {"train_loss": -20.18653678894043, "global_step": 65300, "epoch": 786} {"train_loss": -20.78574562072754, "global_step": 65301, "epoch": 786} {"train_loss": -20.370718002319336, "global_step": 65302, "epoch": 786} {"train_loss": -20.699050903320312, "global_step": 65303, "epoch": 786} {"train_loss": -20.494409561157227, "global_step": 65304, "epoch": 786} {"train_loss": -20.308929443359375, "global_step": 65305, "epoch": 786} {"train_loss": -20.48207664489746, "global_step": 65306, "epoch": 786} {"train_loss": -20.82022476196289, "global_step": 65307, "epoch": 786} {"train_loss": -20.71478843688965, "global_step": 65308, "epoch": 786} {"train_loss": -20.973196029663086, "global_step": 65309, "epoch": 786} {"train_loss": -20.768136978149414, "global_step": 65310, "epoch": 786} {"train_loss": -20.723661422729492, "global_step": 65311, "epoch": 786} {"train_loss": -20.505290985107422, "global_step": 65312, "epoch": 786} {"train_loss": -20.45549964904785, "global_step": 65313, "epoch": 786} {"train_loss": -20.68590545654297, "global_step": 65314, "epoch": 786} {"train_loss": -20.841754913330078, "global_step": 65315, "epoch": 786} {"train_loss": -20.21656036376953, "global_step": 65316, "epoch": 786} {"train_loss": -20.540637969970703, "global_step": 65317, "epoch": 786} {"train_loss": -20.644521713256836, "global_step": 65318, "epoch": 786} {"train_loss": -20.801435470581055, "global_step": 65319, "epoch": 786} {"train_loss": -20.604985271591737, "global_step": 65320, "epoch": 786, "val_loss": 5916958.5} {"train_loss": -20.736373901367188, "global_step": 65321, "epoch": 787} {"train_loss": -20.63574981689453, "global_step": 65322, "epoch": 787} {"train_loss": -20.817564010620117, "global_step": 65323, "epoch": 787} {"train_loss": -20.59846305847168, "global_step": 65324, "epoch": 787} {"train_loss": -20.59455680847168, "global_step": 65325, "epoch": 787} {"train_loss": -20.83859634399414, "global_step": 65326, "epoch": 787} {"train_loss": -20.711681365966797, "global_step": 65327, "epoch": 787} {"train_loss": -20.821693420410156, "global_step": 65328, "epoch": 787} {"train_loss": -20.608396530151367, "global_step": 65329, "epoch": 787} {"train_loss": -20.960050582885742, "global_step": 65330, "epoch": 787} {"train_loss": -20.454177856445312, "global_step": 65331, "epoch": 787} {"train_loss": -20.65519142150879, "global_step": 65332, "epoch": 787} {"train_loss": -20.69346046447754, "global_step": 65333, "epoch": 787} {"train_loss": -20.585081100463867, "global_step": 65334, "epoch": 787} {"train_loss": -20.446809768676758, "global_step": 65335, "epoch": 787} {"train_loss": -20.24910545349121, "global_step": 65336, "epoch": 787} {"train_loss": -20.816741943359375, "global_step": 65337, "epoch": 787} {"train_loss": -20.63924217224121, "global_step": 65338, "epoch": 787} {"train_loss": -20.45248794555664, "global_step": 65339, "epoch": 787} {"train_loss": -20.66290855407715, "global_step": 65340, "epoch": 787} {"train_loss": -20.520456314086914, "global_step": 65341, "epoch": 787} {"train_loss": -20.57038688659668, "global_step": 65342, "epoch": 787} {"train_loss": -20.673009872436523, "global_step": 65343, "epoch": 787} {"train_loss": -20.65899085998535, "global_step": 65344, "epoch": 787} {"train_loss": -20.795398712158203, "global_step": 65345, "epoch": 787} {"train_loss": -20.291763305664062, "global_step": 65346, "epoch": 787} {"train_loss": -20.557205200195312, "global_step": 65347, "epoch": 787} {"train_loss": -20.80110740661621, "global_step": 65348, "epoch": 787} {"train_loss": -20.916425704956055, "global_step": 65349, "epoch": 787} {"train_loss": -20.634449005126953, "global_step": 65350, "epoch": 787} {"train_loss": -20.746597290039062, "global_step": 65351, "epoch": 787} {"train_loss": -20.831315994262695, "global_step": 65352, "epoch": 787} {"train_loss": -20.6600284576416, "global_step": 65353, "epoch": 787} {"train_loss": -20.5634765625, "global_step": 65354, "epoch": 787} {"train_loss": -20.53667640686035, "global_step": 65355, "epoch": 787} {"train_loss": -20.618528366088867, "global_step": 65356, "epoch": 787} {"train_loss": -20.69622230529785, "global_step": 65357, "epoch": 787} {"train_loss": -20.389301300048828, "global_step": 65358, "epoch": 787} {"train_loss": -21.045976638793945, "global_step": 65359, "epoch": 787} {"train_loss": -20.622344970703125, "global_step": 65360, "epoch": 787} {"train_loss": -20.650341033935547, "global_step": 65361, "epoch": 787} {"train_loss": -20.368871688842773, "global_step": 65362, "epoch": 787} {"train_loss": -20.567869186401367, "global_step": 65363, "epoch": 787} {"train_loss": -20.841663360595703, "global_step": 65364, "epoch": 787} {"train_loss": -20.817785263061523, "global_step": 65365, "epoch": 787} {"train_loss": -20.54193878173828, "global_step": 65366, "epoch": 787} {"train_loss": -20.622955322265625, "global_step": 65367, "epoch": 787} {"train_loss": -20.7556209564209, "global_step": 65368, "epoch": 787} {"train_loss": -20.317617416381836, "global_step": 65369, "epoch": 787} {"train_loss": -20.85175132751465, "global_step": 65370, "epoch": 787} {"train_loss": -20.41630744934082, "global_step": 65371, "epoch": 787} {"train_loss": -20.698917388916016, "global_step": 65372, "epoch": 787} {"train_loss": -20.432462692260742, "global_step": 65373, "epoch": 787} {"train_loss": -20.801361083984375, "global_step": 65374, "epoch": 787} {"train_loss": -20.705820083618164, "global_step": 65375, "epoch": 787} {"train_loss": -20.986989974975586, "global_step": 65376, "epoch": 787} {"train_loss": -20.54149627685547, "global_step": 65377, "epoch": 787} {"train_loss": -20.77524757385254, "global_step": 65378, "epoch": 787} {"train_loss": -20.347681045532227, "global_step": 65379, "epoch": 787} {"train_loss": -20.883127212524414, "global_step": 65380, "epoch": 787} {"train_loss": -20.537357330322266, "global_step": 65381, "epoch": 787} {"train_loss": -20.559423446655273, "global_step": 65382, "epoch": 787} {"train_loss": -20.404651641845703, "global_step": 65383, "epoch": 787} {"train_loss": -20.587413787841797, "global_step": 65384, "epoch": 787} {"train_loss": -20.47350311279297, "global_step": 65385, "epoch": 787} {"train_loss": -20.466716766357422, "global_step": 65386, "epoch": 787} {"train_loss": -20.93807029724121, "global_step": 65387, "epoch": 787} {"train_loss": -20.381513595581055, "global_step": 65388, "epoch": 787} {"train_loss": -20.60025405883789, "global_step": 65389, "epoch": 787} {"train_loss": -20.809083938598633, "global_step": 65390, "epoch": 787} {"train_loss": -21.03789710998535, "global_step": 65391, "epoch": 787} {"train_loss": -20.656665802001953, "global_step": 65392, "epoch": 787} {"train_loss": -20.5611629486084, "global_step": 65393, "epoch": 787} {"train_loss": -20.986074447631836, "global_step": 65394, "epoch": 787} {"train_loss": -20.501998901367188, "global_step": 65395, "epoch": 787} {"train_loss": -20.56641960144043, "global_step": 65396, "epoch": 787} {"train_loss": -20.502933502197266, "global_step": 65397, "epoch": 787} {"train_loss": -20.587833404541016, "global_step": 65398, "epoch": 787} {"train_loss": -20.18433380126953, "global_step": 65399, "epoch": 787} {"train_loss": -20.48247718811035, "global_step": 65400, "epoch": 787} {"train_loss": -20.794973373413086, "global_step": 65401, "epoch": 787} {"train_loss": -20.53595542907715, "global_step": 65402, "epoch": 787} {"train_loss": -20.627734517476643, "global_step": 65403, "epoch": 787, "val_loss": 5947917.0} {"train_loss": -19.895938873291016, "global_step": 65404, "epoch": 788} {"train_loss": -20.472187042236328, "global_step": 65405, "epoch": 788} {"train_loss": -20.2392635345459, "global_step": 65406, "epoch": 788} {"train_loss": -20.020193099975586, "global_step": 65407, "epoch": 788} {"train_loss": -20.511655807495117, "global_step": 65408, "epoch": 788} {"train_loss": -20.3023681640625, "global_step": 65409, "epoch": 788} {"train_loss": -20.439105987548828, "global_step": 65410, "epoch": 788} {"train_loss": -20.452482223510742, "global_step": 65411, "epoch": 788} {"train_loss": -20.4481201171875, "global_step": 65412, "epoch": 788} {"train_loss": -20.565797805786133, "global_step": 65413, "epoch": 788} {"train_loss": -20.707738876342773, "global_step": 65414, "epoch": 788} {"train_loss": -20.42609214782715, "global_step": 65415, "epoch": 788} {"train_loss": -20.6304931640625, "global_step": 65416, "epoch": 788} {"train_loss": -20.666723251342773, "global_step": 65417, "epoch": 788} {"train_loss": -20.5922908782959, "global_step": 65418, "epoch": 788} {"train_loss": -20.2558650970459, "global_step": 65419, "epoch": 788} {"train_loss": -20.297061920166016, "global_step": 65420, "epoch": 788} {"train_loss": -20.78842544555664, "global_step": 65421, "epoch": 788} {"train_loss": -20.542316436767578, "global_step": 65422, "epoch": 788} {"train_loss": -20.598373413085938, "global_step": 65423, "epoch": 788} {"train_loss": -20.868335723876953, "global_step": 65424, "epoch": 788} {"train_loss": -20.93210220336914, "global_step": 65425, "epoch": 788} {"train_loss": -20.511398315429688, "global_step": 65426, "epoch": 788} {"train_loss": -20.494165420532227, "global_step": 65427, "epoch": 788} {"train_loss": -20.497068405151367, "global_step": 65428, "epoch": 788} {"train_loss": -20.468969345092773, "global_step": 65429, "epoch": 788} {"train_loss": -20.415538787841797, "global_step": 65430, "epoch": 788} {"train_loss": -20.532041549682617, "global_step": 65431, "epoch": 788} {"train_loss": -20.577180862426758, "global_step": 65432, "epoch": 788} {"train_loss": -20.58998680114746, "global_step": 65433, "epoch": 788} {"train_loss": -20.385217666625977, "global_step": 65434, "epoch": 788} {"train_loss": -20.518644332885742, "global_step": 65435, "epoch": 788} {"train_loss": -20.773332595825195, "global_step": 65436, "epoch": 788} {"train_loss": -20.546024322509766, "global_step": 65437, "epoch": 788} {"train_loss": -20.730976104736328, "global_step": 65438, "epoch": 788} {"train_loss": -20.587818145751953, "global_step": 65439, "epoch": 788} {"train_loss": -21.079296112060547, "global_step": 65440, "epoch": 788} {"train_loss": -20.86213493347168, "global_step": 65441, "epoch": 788} {"train_loss": -20.788272857666016, "global_step": 65442, "epoch": 788} {"train_loss": -21.021108627319336, "global_step": 65443, "epoch": 788} {"train_loss": -20.386022567749023, "global_step": 65444, "epoch": 788} {"train_loss": -20.905996322631836, "global_step": 65445, "epoch": 788} {"train_loss": -20.619985580444336, "global_step": 65446, "epoch": 788} {"train_loss": -20.49676513671875, "global_step": 65447, "epoch": 788} {"train_loss": -20.879911422729492, "global_step": 65448, "epoch": 788} {"train_loss": -20.248268127441406, "global_step": 65449, "epoch": 788} {"train_loss": -20.65583610534668, "global_step": 65450, "epoch": 788} {"train_loss": -20.67987823486328, "global_step": 65451, "epoch": 788} {"train_loss": -20.074026107788086, "global_step": 65452, "epoch": 788} {"train_loss": -20.807859420776367, "global_step": 65453, "epoch": 788} {"train_loss": -20.576406478881836, "global_step": 65454, "epoch": 788} {"train_loss": -20.29607582092285, "global_step": 65455, "epoch": 788} {"train_loss": -20.566659927368164, "global_step": 65456, "epoch": 788} {"train_loss": -20.297189712524414, "global_step": 65457, "epoch": 788} {"train_loss": -21.006135940551758, "global_step": 65458, "epoch": 788} {"train_loss": -20.7078857421875, "global_step": 65459, "epoch": 788} {"train_loss": -20.61250877380371, "global_step": 65460, "epoch": 788} {"train_loss": -20.573652267456055, "global_step": 65461, "epoch": 788} {"train_loss": -20.564186096191406, "global_step": 65462, "epoch": 788} {"train_loss": -21.03587532043457, "global_step": 65463, "epoch": 788} {"train_loss": -20.597074508666992, "global_step": 65464, "epoch": 788} {"train_loss": -20.968698501586914, "global_step": 65465, "epoch": 788} {"train_loss": -20.50528335571289, "global_step": 65466, "epoch": 788} {"train_loss": -20.456317901611328, "global_step": 65467, "epoch": 788} {"train_loss": -20.584857940673828, "global_step": 65468, "epoch": 788} {"train_loss": -20.652952194213867, "global_step": 65469, "epoch": 788} {"train_loss": -20.676382064819336, "global_step": 65470, "epoch": 788} {"train_loss": -20.52744483947754, "global_step": 65471, "epoch": 788} {"train_loss": -20.863216400146484, "global_step": 65472, "epoch": 788} {"train_loss": -20.888315200805664, "global_step": 65473, "epoch": 788} {"train_loss": -21.15089988708496, "global_step": 65474, "epoch": 788} {"train_loss": -20.74881935119629, "global_step": 65475, "epoch": 788} {"train_loss": -20.606538772583008, "global_step": 65476, "epoch": 788} {"train_loss": -20.932661056518555, "global_step": 65477, "epoch": 788} {"train_loss": -21.029138565063477, "global_step": 65478, "epoch": 788} {"train_loss": -21.017337799072266, "global_step": 65479, "epoch": 788} {"train_loss": -20.31476402282715, "global_step": 65480, "epoch": 788} {"train_loss": -20.24416160583496, "global_step": 65481, "epoch": 788} {"train_loss": -20.578229904174805, "global_step": 65482, "epoch": 788} {"train_loss": -20.535167694091797, "global_step": 65483, "epoch": 788} {"train_loss": -20.565893173217773, "global_step": 65484, "epoch": 788} {"train_loss": -20.57166862487793, "global_step": 65485, "epoch": 788} {"train_loss": -20.615375495818725, "global_step": 65486, "epoch": 788, "val_loss": 5956863.5} {"train_loss": -19.845243453979492, "global_step": 65487, "epoch": 789} {"train_loss": -20.027587890625, "global_step": 65488, "epoch": 789} {"train_loss": -20.523807525634766, "global_step": 65489, "epoch": 789} {"train_loss": -20.20564079284668, "global_step": 65490, "epoch": 789} {"train_loss": -20.159936904907227, "global_step": 65491, "epoch": 789} {"train_loss": -20.45674705505371, "global_step": 65492, "epoch": 789} {"train_loss": -20.2121639251709, "global_step": 65493, "epoch": 789} {"train_loss": -20.69532585144043, "global_step": 65494, "epoch": 789} {"train_loss": -20.345722198486328, "global_step": 65495, "epoch": 789} {"train_loss": -20.2586612701416, "global_step": 65496, "epoch": 789} {"train_loss": -20.143218994140625, "global_step": 65497, "epoch": 789} {"train_loss": -20.405118942260742, "global_step": 65498, "epoch": 789} {"train_loss": -20.050588607788086, "global_step": 65499, "epoch": 789} {"train_loss": -20.31624412536621, "global_step": 65500, "epoch": 789} {"train_loss": -20.268112182617188, "global_step": 65501, "epoch": 789} {"train_loss": -20.33197021484375, "global_step": 65502, "epoch": 789} {"train_loss": -20.25592613220215, "global_step": 65503, "epoch": 789} {"train_loss": -20.431806564331055, "global_step": 65504, "epoch": 789} {"train_loss": -20.528730392456055, "global_step": 65505, "epoch": 789} {"train_loss": -20.26417350769043, "global_step": 65506, "epoch": 789} {"train_loss": -20.5676326751709, "global_step": 65507, "epoch": 789} {"train_loss": -20.347713470458984, "global_step": 65508, "epoch": 789} {"train_loss": -20.6540584564209, "global_step": 65509, "epoch": 789} {"train_loss": -20.58445167541504, "global_step": 65510, "epoch": 789} {"train_loss": -20.731292724609375, "global_step": 65511, "epoch": 789} {"train_loss": -20.624666213989258, "global_step": 65512, "epoch": 789} {"train_loss": -20.535551071166992, "global_step": 65513, "epoch": 789} {"train_loss": -20.987869262695312, "global_step": 65514, "epoch": 789} {"train_loss": -20.616764068603516, "global_step": 65515, "epoch": 789} {"train_loss": -20.537342071533203, "global_step": 65516, "epoch": 789} {"train_loss": -20.583059310913086, "global_step": 65517, "epoch": 789} {"train_loss": -20.533483505249023, "global_step": 65518, "epoch": 789} {"train_loss": -20.69939422607422, "global_step": 65519, "epoch": 789} {"train_loss": -20.556264877319336, "global_step": 65520, "epoch": 789} {"train_loss": -20.744171142578125, "global_step": 65521, "epoch": 789} {"train_loss": -20.57758140563965, "global_step": 65522, "epoch": 789} {"train_loss": -20.33003807067871, "global_step": 65523, "epoch": 789} {"train_loss": -20.426504135131836, "global_step": 65524, "epoch": 789} {"train_loss": -20.57560920715332, "global_step": 65525, "epoch": 789} {"train_loss": -20.408044815063477, "global_step": 65526, "epoch": 789} {"train_loss": -20.481698989868164, "global_step": 65527, "epoch": 789} {"train_loss": -20.53635597229004, "global_step": 65528, "epoch": 789} {"train_loss": -20.486875534057617, "global_step": 65529, "epoch": 789} {"train_loss": -20.771024703979492, "global_step": 65530, "epoch": 789} {"train_loss": -20.60615348815918, "global_step": 65531, "epoch": 789} {"train_loss": -20.427629470825195, "global_step": 65532, "epoch": 789} {"train_loss": -20.778715133666992, "global_step": 65533, "epoch": 789} {"train_loss": -20.80647850036621, "global_step": 65534, "epoch": 789} {"train_loss": -20.932058334350586, "global_step": 65535, "epoch": 789} {"train_loss": -20.35004234313965, "global_step": 65536, "epoch": 789} {"train_loss": -20.832849502563477, "global_step": 65537, "epoch": 789} {"train_loss": -20.047927856445312, "global_step": 65538, "epoch": 789} {"train_loss": -20.40427017211914, "global_step": 65539, "epoch": 789} {"train_loss": -20.6264705657959, "global_step": 65540, "epoch": 789} {"train_loss": -20.95791244506836, "global_step": 65541, "epoch": 789} {"train_loss": -20.786550521850586, "global_step": 65542, "epoch": 789} {"train_loss": -20.996248245239258, "global_step": 65543, "epoch": 789} {"train_loss": -21.058032989501953, "global_step": 65544, "epoch": 789} {"train_loss": -20.321226119995117, "global_step": 65545, "epoch": 789} {"train_loss": -20.965543746948242, "global_step": 65546, "epoch": 789} {"train_loss": -20.547025680541992, "global_step": 65547, "epoch": 789} {"train_loss": -20.660659790039062, "global_step": 65548, "epoch": 789} {"train_loss": -20.522815704345703, "global_step": 65549, "epoch": 789} {"train_loss": -20.5969295501709, "global_step": 65550, "epoch": 789} {"train_loss": -20.7181396484375, "global_step": 65551, "epoch": 789} {"train_loss": -20.863496780395508, "global_step": 65552, "epoch": 789} {"train_loss": -20.54926300048828, "global_step": 65553, "epoch": 789} {"train_loss": -20.528676986694336, "global_step": 65554, "epoch": 789} {"train_loss": -20.75491714477539, "global_step": 65555, "epoch": 789} {"train_loss": -20.93438720703125, "global_step": 65556, "epoch": 789} {"train_loss": -20.669784545898438, "global_step": 65557, "epoch": 789} {"train_loss": -20.501012802124023, "global_step": 65558, "epoch": 789} {"train_loss": -20.527982711791992, "global_step": 65559, "epoch": 789} {"train_loss": -20.682706832885742, "global_step": 65560, "epoch": 789} {"train_loss": -20.737565994262695, "global_step": 65561, "epoch": 789} {"train_loss": -20.688108444213867, "global_step": 65562, "epoch": 789} {"train_loss": -20.2997989654541, "global_step": 65563, "epoch": 789} {"train_loss": -20.67232322692871, "global_step": 65564, "epoch": 789} {"train_loss": -20.692703247070312, "global_step": 65565, "epoch": 789} {"train_loss": -20.738019943237305, "global_step": 65566, "epoch": 789} {"train_loss": -20.73256492614746, "global_step": 65567, "epoch": 789} {"train_loss": -20.44600486755371, "global_step": 65568, "epoch": 789} {"train_loss": -20.549083089253987, "global_step": 65569, "epoch": 789, "val_loss": 5921054.5} {"train_loss": -20.2446231842041, "global_step": 65570, "epoch": 790} {"train_loss": -19.959327697753906, "global_step": 65571, "epoch": 790} {"train_loss": -20.36102294921875, "global_step": 65572, "epoch": 790} {"train_loss": -20.43235206604004, "global_step": 65573, "epoch": 790} {"train_loss": -20.3268985748291, "global_step": 65574, "epoch": 790} {"train_loss": -20.748207092285156, "global_step": 65575, "epoch": 790} {"train_loss": -20.445539474487305, "global_step": 65576, "epoch": 790} {"train_loss": -20.52225685119629, "global_step": 65577, "epoch": 790} {"train_loss": -20.01566505432129, "global_step": 65578, "epoch": 790} {"train_loss": -20.750761032104492, "global_step": 65579, "epoch": 790} {"train_loss": -20.354801177978516, "global_step": 65580, "epoch": 790} {"train_loss": -20.487695693969727, "global_step": 65581, "epoch": 790} {"train_loss": -20.838890075683594, "global_step": 65582, "epoch": 790} {"train_loss": -20.40653419494629, "global_step": 65583, "epoch": 790} {"train_loss": -20.54323387145996, "global_step": 65584, "epoch": 790} {"train_loss": -20.586483001708984, "global_step": 65585, "epoch": 790} {"train_loss": -20.035003662109375, "global_step": 65586, "epoch": 790} {"train_loss": -20.473791122436523, "global_step": 65587, "epoch": 790} {"train_loss": -20.337942123413086, "global_step": 65588, "epoch": 790} {"train_loss": -20.727670669555664, "global_step": 65589, "epoch": 790} {"train_loss": -20.514057159423828, "global_step": 65590, "epoch": 790} {"train_loss": -20.402202606201172, "global_step": 65591, "epoch": 790} {"train_loss": -20.391860961914062, "global_step": 65592, "epoch": 790} {"train_loss": -20.151151657104492, "global_step": 65593, "epoch": 790} {"train_loss": -20.54085922241211, "global_step": 65594, "epoch": 790} {"train_loss": -20.739519119262695, "global_step": 65595, "epoch": 790} {"train_loss": -20.69121742248535, "global_step": 65596, "epoch": 790} {"train_loss": -20.554906845092773, "global_step": 65597, "epoch": 790} {"train_loss": -20.756032943725586, "global_step": 65598, "epoch": 790} {"train_loss": -20.72542381286621, "global_step": 65599, "epoch": 790} {"train_loss": -20.50055503845215, "global_step": 65600, "epoch": 790} {"train_loss": -20.493886947631836, "global_step": 65601, "epoch": 790} {"train_loss": -21.232900619506836, "global_step": 65602, "epoch": 790} {"train_loss": -20.78915786743164, "global_step": 65603, "epoch": 790} {"train_loss": -20.823307037353516, "global_step": 65604, "epoch": 790} {"train_loss": -20.776958465576172, "global_step": 65605, "epoch": 790} {"train_loss": -20.93079948425293, "global_step": 65606, "epoch": 790} {"train_loss": -20.741527557373047, "global_step": 65607, "epoch": 790} {"train_loss": -21.180212020874023, "global_step": 65608, "epoch": 790} {"train_loss": -20.22781753540039, "global_step": 65609, "epoch": 790} {"train_loss": -20.553213119506836, "global_step": 65610, "epoch": 790} {"train_loss": -20.71846580505371, "global_step": 65611, "epoch": 790} {"train_loss": -20.160175323486328, "global_step": 65612, "epoch": 790} {"train_loss": -20.60425567626953, "global_step": 65613, "epoch": 790} {"train_loss": -20.72258186340332, "global_step": 65614, "epoch": 790} {"train_loss": -21.103845596313477, "global_step": 65615, "epoch": 790} {"train_loss": -20.70938491821289, "global_step": 65616, "epoch": 790} {"train_loss": -20.770599365234375, "global_step": 65617, "epoch": 790} {"train_loss": -20.737167358398438, "global_step": 65618, "epoch": 790} {"train_loss": -20.734891891479492, "global_step": 65619, "epoch": 790} {"train_loss": -20.73752212524414, "global_step": 65620, "epoch": 790} {"train_loss": -20.469348907470703, "global_step": 65621, "epoch": 790} {"train_loss": -20.500871658325195, "global_step": 65622, "epoch": 790} {"train_loss": -20.28606414794922, "global_step": 65623, "epoch": 790} {"train_loss": -20.625049591064453, "global_step": 65624, "epoch": 790} {"train_loss": -20.405208587646484, "global_step": 65625, "epoch": 790} {"train_loss": -20.08487319946289, "global_step": 65626, "epoch": 790} {"train_loss": -20.568662643432617, "global_step": 65627, "epoch": 790} {"train_loss": -20.594985961914062, "global_step": 65628, "epoch": 790} {"train_loss": -20.536375045776367, "global_step": 65629, "epoch": 790} {"train_loss": -20.604154586791992, "global_step": 65630, "epoch": 790} {"train_loss": -20.325115203857422, "global_step": 65631, "epoch": 790} {"train_loss": -20.87249183654785, "global_step": 65632, "epoch": 790} {"train_loss": -20.52756118774414, "global_step": 65633, "epoch": 790} {"train_loss": -20.567405700683594, "global_step": 65634, "epoch": 790} {"train_loss": -20.677820205688477, "global_step": 65635, "epoch": 790} {"train_loss": -20.568754196166992, "global_step": 65636, "epoch": 790} {"train_loss": -20.858829498291016, "global_step": 65637, "epoch": 790} {"train_loss": -20.763126373291016, "global_step": 65638, "epoch": 790} {"train_loss": -20.538896560668945, "global_step": 65639, "epoch": 790} {"train_loss": -20.378055572509766, "global_step": 65640, "epoch": 790} {"train_loss": -20.5660343170166, "global_step": 65641, "epoch": 790} {"train_loss": -20.859058380126953, "global_step": 65642, "epoch": 790} {"train_loss": -20.6490478515625, "global_step": 65643, "epoch": 790} {"train_loss": -20.653873443603516, "global_step": 65644, "epoch": 790} {"train_loss": -20.669998168945312, "global_step": 65645, "epoch": 790} {"train_loss": -20.824459075927734, "global_step": 65646, "epoch": 790} {"train_loss": -20.737730026245117, "global_step": 65647, "epoch": 790} {"train_loss": -20.60238265991211, "global_step": 65648, "epoch": 790} {"train_loss": -20.77570152282715, "global_step": 65649, "epoch": 790} {"train_loss": -20.71759796142578, "global_step": 65650, "epoch": 790} {"train_loss": -20.469493865966797, "global_step": 65651, "epoch": 790} {"train_loss": -20.581534672932452, "global_step": 65652, "epoch": 790, "val_loss": 6065202.5} {"train_loss": -20.52919578552246, "global_step": 65653, "epoch": 791} {"train_loss": -20.220966339111328, "global_step": 65654, "epoch": 791} {"train_loss": -20.123851776123047, "global_step": 65655, "epoch": 791} {"train_loss": -20.53327751159668, "global_step": 65656, "epoch": 791} {"train_loss": -20.322858810424805, "global_step": 65657, "epoch": 791} {"train_loss": -20.711742401123047, "global_step": 65658, "epoch": 791} {"train_loss": -20.489980697631836, "global_step": 65659, "epoch": 791} {"train_loss": -20.44437026977539, "global_step": 65660, "epoch": 791} {"train_loss": -20.37578773498535, "global_step": 65661, "epoch": 791} {"train_loss": -20.7113037109375, "global_step": 65662, "epoch": 791} {"train_loss": -20.216947555541992, "global_step": 65663, "epoch": 791} {"train_loss": -20.28254508972168, "global_step": 65664, "epoch": 791} {"train_loss": -20.304275512695312, "global_step": 65665, "epoch": 791} {"train_loss": -20.264841079711914, "global_step": 65666, "epoch": 791} {"train_loss": -20.788908004760742, "global_step": 65667, "epoch": 791} {"train_loss": -20.718843460083008, "global_step": 65668, "epoch": 791} {"train_loss": -20.607213973999023, "global_step": 65669, "epoch": 791} {"train_loss": -20.4915828704834, "global_step": 65670, "epoch": 791} {"train_loss": -20.39816665649414, "global_step": 65671, "epoch": 791} {"train_loss": -20.47425651550293, "global_step": 65672, "epoch": 791} {"train_loss": -20.649423599243164, "global_step": 65673, "epoch": 791} {"train_loss": -20.829267501831055, "global_step": 65674, "epoch": 791} {"train_loss": -20.5970516204834, "global_step": 65675, "epoch": 791} {"train_loss": -20.85580062866211, "global_step": 65676, "epoch": 791} {"train_loss": -20.588821411132812, "global_step": 65677, "epoch": 791} {"train_loss": -20.85145378112793, "global_step": 65678, "epoch": 791} {"train_loss": -20.470264434814453, "global_step": 65679, "epoch": 791} {"train_loss": -20.597517013549805, "global_step": 65680, "epoch": 791} {"train_loss": -20.53924560546875, "global_step": 65681, "epoch": 791} {"train_loss": -20.72064971923828, "global_step": 65682, "epoch": 791} {"train_loss": -20.18805503845215, "global_step": 65683, "epoch": 791} {"train_loss": -20.649133682250977, "global_step": 65684, "epoch": 791} {"train_loss": -20.758142471313477, "global_step": 65685, "epoch": 791} {"train_loss": -20.532440185546875, "global_step": 65686, "epoch": 791} {"train_loss": -20.62940788269043, "global_step": 65687, "epoch": 791} {"train_loss": -20.81524658203125, "global_step": 65688, "epoch": 791} {"train_loss": -20.769437789916992, "global_step": 65689, "epoch": 791} {"train_loss": -20.285200119018555, "global_step": 65690, "epoch": 791} {"train_loss": -20.438993453979492, "global_step": 65691, "epoch": 791} {"train_loss": -20.805463790893555, "global_step": 65692, "epoch": 791} {"train_loss": -20.73795509338379, "global_step": 65693, "epoch": 791} {"train_loss": -21.073719024658203, "global_step": 65694, "epoch": 791} {"train_loss": -20.494550704956055, "global_step": 65695, "epoch": 791} {"train_loss": -20.523422241210938, "global_step": 65696, "epoch": 791} {"train_loss": -20.53609275817871, "global_step": 65697, "epoch": 791} {"train_loss": -20.570287704467773, "global_step": 65698, "epoch": 791} {"train_loss": -20.45786476135254, "global_step": 65699, "epoch": 791} {"train_loss": -21.196022033691406, "global_step": 65700, "epoch": 791} {"train_loss": -20.916563034057617, "global_step": 65701, "epoch": 791} {"train_loss": -20.473739624023438, "global_step": 65702, "epoch": 791} {"train_loss": -20.90882682800293, "global_step": 65703, "epoch": 791} {"train_loss": -20.76920509338379, "global_step": 65704, "epoch": 791} {"train_loss": -20.688215255737305, "global_step": 65705, "epoch": 791} {"train_loss": -20.485877990722656, "global_step": 65706, "epoch": 791} {"train_loss": -21.099760055541992, "global_step": 65707, "epoch": 791} {"train_loss": -20.61472511291504, "global_step": 65708, "epoch": 791} {"train_loss": -20.573514938354492, "global_step": 65709, "epoch": 791} {"train_loss": -20.520700454711914, "global_step": 65710, "epoch": 791} {"train_loss": -20.881134033203125, "global_step": 65711, "epoch": 791} {"train_loss": -20.843994140625, "global_step": 65712, "epoch": 791} {"train_loss": -20.797189712524414, "global_step": 65713, "epoch": 791} {"train_loss": -20.36820411682129, "global_step": 65714, "epoch": 791} {"train_loss": -20.72504997253418, "global_step": 65715, "epoch": 791} {"train_loss": -20.89594078063965, "global_step": 65716, "epoch": 791} {"train_loss": -20.336153030395508, "global_step": 65717, "epoch": 791} {"train_loss": -20.573577880859375, "global_step": 65718, "epoch": 791} {"train_loss": -20.614139556884766, "global_step": 65719, "epoch": 791} {"train_loss": -20.899274826049805, "global_step": 65720, "epoch": 791} {"train_loss": -20.644254684448242, "global_step": 65721, "epoch": 791} {"train_loss": -20.648273468017578, "global_step": 65722, "epoch": 791} {"train_loss": -20.579816818237305, "global_step": 65723, "epoch": 791} {"train_loss": -20.61823081970215, "global_step": 65724, "epoch": 791} {"train_loss": -21.010114669799805, "global_step": 65725, "epoch": 791} {"train_loss": -20.68316650390625, "global_step": 65726, "epoch": 791} {"train_loss": -20.856962203979492, "global_step": 65727, "epoch": 791} {"train_loss": -20.907825469970703, "global_step": 65728, "epoch": 791} {"train_loss": -20.563575744628906, "global_step": 65729, "epoch": 791} {"train_loss": -20.628854751586914, "global_step": 65730, "epoch": 791} {"train_loss": -20.45523452758789, "global_step": 65731, "epoch": 791} {"train_loss": -20.488834381103516, "global_step": 65732, "epoch": 791} {"train_loss": -20.57293128967285, "global_step": 65733, "epoch": 791} {"train_loss": -20.742963790893555, "global_step": 65734, "epoch": 791} {"train_loss": -20.597784134278815, "global_step": 65735, "epoch": 791, "val_loss": 6071470.0} {"train_loss": -20.182828903198242, "global_step": 65736, "epoch": 792} {"train_loss": -20.481346130371094, "global_step": 65737, "epoch": 792} {"train_loss": -20.481958389282227, "global_step": 65738, "epoch": 792} {"train_loss": -20.416305541992188, "global_step": 65739, "epoch": 792} {"train_loss": -20.609220504760742, "global_step": 65740, "epoch": 792} {"train_loss": -20.3352108001709, "global_step": 65741, "epoch": 792} {"train_loss": -20.661611557006836, "global_step": 65742, "epoch": 792} {"train_loss": -20.115474700927734, "global_step": 65743, "epoch": 792} {"train_loss": -20.800281524658203, "global_step": 65744, "epoch": 792} {"train_loss": -20.5040283203125, "global_step": 65745, "epoch": 792} {"train_loss": -20.561594009399414, "global_step": 65746, "epoch": 792} {"train_loss": -20.707061767578125, "global_step": 65747, "epoch": 792} {"train_loss": -20.70882225036621, "global_step": 65748, "epoch": 792} {"train_loss": -20.686946868896484, "global_step": 65749, "epoch": 792} {"train_loss": -20.640663146972656, "global_step": 65750, "epoch": 792} {"train_loss": -20.66034698486328, "global_step": 65751, "epoch": 792} {"train_loss": -20.754262924194336, "global_step": 65752, "epoch": 792} {"train_loss": -20.589685440063477, "global_step": 65753, "epoch": 792} {"train_loss": -20.748844146728516, "global_step": 65754, "epoch": 792} {"train_loss": -20.643056869506836, "global_step": 65755, "epoch": 792} {"train_loss": -21.024948120117188, "global_step": 65756, "epoch": 792} {"train_loss": -20.763111114501953, "global_step": 65757, "epoch": 792} {"train_loss": -20.605852127075195, "global_step": 65758, "epoch": 792} {"train_loss": -20.527475357055664, "global_step": 65759, "epoch": 792} {"train_loss": -20.59539794921875, "global_step": 65760, "epoch": 792} {"train_loss": -20.456106185913086, "global_step": 65761, "epoch": 792} {"train_loss": -20.85721778869629, "global_step": 65762, "epoch": 792} {"train_loss": -20.611129760742188, "global_step": 65763, "epoch": 792} {"train_loss": -20.609743118286133, "global_step": 65764, "epoch": 792} {"train_loss": -20.906797409057617, "global_step": 65765, "epoch": 792} {"train_loss": -20.619192123413086, "global_step": 65766, "epoch": 792} {"train_loss": -20.47854995727539, "global_step": 65767, "epoch": 792} {"train_loss": -20.708738327026367, "global_step": 65768, "epoch": 792} {"train_loss": -20.547657012939453, "global_step": 65769, "epoch": 792} {"train_loss": -20.331253051757812, "global_step": 65770, "epoch": 792} {"train_loss": -20.855594635009766, "global_step": 65771, "epoch": 792} {"train_loss": -20.595752716064453, "global_step": 65772, "epoch": 792} {"train_loss": -20.643798828125, "global_step": 65773, "epoch": 792} {"train_loss": -20.85053062438965, "global_step": 65774, "epoch": 792} {"train_loss": -20.582664489746094, "global_step": 65775, "epoch": 792} {"train_loss": -20.54329490661621, "global_step": 65776, "epoch": 792} {"train_loss": -20.44806480407715, "global_step": 65777, "epoch": 792} {"train_loss": -20.608734130859375, "global_step": 65778, "epoch": 792} {"train_loss": -20.611581802368164, "global_step": 65779, "epoch": 792} {"train_loss": -20.439273834228516, "global_step": 65780, "epoch": 792} {"train_loss": -20.584243774414062, "global_step": 65781, "epoch": 792} {"train_loss": -20.38054847717285, "global_step": 65782, "epoch": 792} {"train_loss": -20.33339500427246, "global_step": 65783, "epoch": 792} {"train_loss": -20.592632293701172, "global_step": 65784, "epoch": 792} {"train_loss": -20.561704635620117, "global_step": 65785, "epoch": 792} {"train_loss": -20.502927780151367, "global_step": 65786, "epoch": 792} {"train_loss": -20.48013687133789, "global_step": 65787, "epoch": 792} {"train_loss": -20.651355743408203, "global_step": 65788, "epoch": 792} {"train_loss": -20.581924438476562, "global_step": 65789, "epoch": 792} {"train_loss": -20.71746063232422, "global_step": 65790, "epoch": 792} {"train_loss": -20.647520065307617, "global_step": 65791, "epoch": 792} {"train_loss": -20.8951416015625, "global_step": 65792, "epoch": 792} {"train_loss": -20.881423950195312, "global_step": 65793, "epoch": 792} {"train_loss": -20.542478561401367, "global_step": 65794, "epoch": 792} {"train_loss": -20.813114166259766, "global_step": 65795, "epoch": 792} {"train_loss": -20.656396865844727, "global_step": 65796, "epoch": 792} {"train_loss": -20.4692440032959, "global_step": 65797, "epoch": 792} {"train_loss": -20.817577362060547, "global_step": 65798, "epoch": 792} {"train_loss": -20.34260368347168, "global_step": 65799, "epoch": 792} {"train_loss": -20.506750106811523, "global_step": 65800, "epoch": 792} {"train_loss": -20.68877601623535, "global_step": 65801, "epoch": 792} {"train_loss": -20.749393463134766, "global_step": 65802, "epoch": 792} {"train_loss": -20.451465606689453, "global_step": 65803, "epoch": 792} {"train_loss": -20.732248306274414, "global_step": 65804, "epoch": 792} {"train_loss": -20.47568130493164, "global_step": 65805, "epoch": 792} {"train_loss": -20.283649444580078, "global_step": 65806, "epoch": 792} {"train_loss": -20.868005752563477, "global_step": 65807, "epoch": 792} {"train_loss": -20.412921905517578, "global_step": 65808, "epoch": 792} {"train_loss": -20.89188003540039, "global_step": 65809, "epoch": 792} {"train_loss": -20.44642448425293, "global_step": 65810, "epoch": 792} {"train_loss": -20.806814193725586, "global_step": 65811, "epoch": 792} {"train_loss": -20.57259750366211, "global_step": 65812, "epoch": 792} {"train_loss": -20.68558120727539, "global_step": 65813, "epoch": 792} {"train_loss": -20.7880802154541, "global_step": 65814, "epoch": 792} {"train_loss": -20.822994232177734, "global_step": 65815, "epoch": 792} {"train_loss": -20.643091201782227, "global_step": 65816, "epoch": 792} {"train_loss": -20.580432891845703, "global_step": 65817, "epoch": 792} {"train_loss": -20.61697723204831, "global_step": 65818, "epoch": 792, "val_loss": 5963909.0} {"train_loss": -19.8941593170166, "global_step": 65819, "epoch": 793} {"train_loss": -20.556474685668945, "global_step": 65820, "epoch": 793} {"train_loss": -19.787195205688477, "global_step": 65821, "epoch": 793} {"train_loss": -19.67024803161621, "global_step": 65822, "epoch": 793} {"train_loss": -20.57331657409668, "global_step": 65823, "epoch": 793} {"train_loss": -20.176223754882812, "global_step": 65824, "epoch": 793} {"train_loss": -20.23362922668457, "global_step": 65825, "epoch": 793} {"train_loss": -20.49273681640625, "global_step": 65826, "epoch": 793} {"train_loss": -20.372526168823242, "global_step": 65827, "epoch": 793} {"train_loss": -20.27435302734375, "global_step": 65828, "epoch": 793} {"train_loss": -20.46616554260254, "global_step": 65829, "epoch": 793} {"train_loss": -20.495925903320312, "global_step": 65830, "epoch": 793} {"train_loss": -20.49993324279785, "global_step": 65831, "epoch": 793} {"train_loss": -20.262895584106445, "global_step": 65832, "epoch": 793} {"train_loss": -20.96663475036621, "global_step": 65833, "epoch": 793} {"train_loss": -20.675113677978516, "global_step": 65834, "epoch": 793} {"train_loss": -20.391361236572266, "global_step": 65835, "epoch": 793} {"train_loss": -20.318960189819336, "global_step": 65836, "epoch": 793} {"train_loss": -20.691970825195312, "global_step": 65837, "epoch": 793} {"train_loss": -20.73009490966797, "global_step": 65838, "epoch": 793} {"train_loss": -20.701231002807617, "global_step": 65839, "epoch": 793} {"train_loss": -20.610280990600586, "global_step": 65840, "epoch": 793} {"train_loss": -20.688339233398438, "global_step": 65841, "epoch": 793} {"train_loss": -20.362102508544922, "global_step": 65842, "epoch": 793} {"train_loss": -20.688291549682617, "global_step": 65843, "epoch": 793} {"train_loss": -20.420087814331055, "global_step": 65844, "epoch": 793} {"train_loss": -20.59349250793457, "global_step": 65845, "epoch": 793} {"train_loss": -20.49244499206543, "global_step": 65846, "epoch": 793} {"train_loss": -20.571563720703125, "global_step": 65847, "epoch": 793} {"train_loss": -20.786985397338867, "global_step": 65848, "epoch": 793} {"train_loss": -20.289844512939453, "global_step": 65849, "epoch": 793} {"train_loss": -20.957651138305664, "global_step": 65850, "epoch": 793} {"train_loss": -20.609670639038086, "global_step": 65851, "epoch": 793} {"train_loss": -20.426525115966797, "global_step": 65852, "epoch": 793} {"train_loss": -21.03110694885254, "global_step": 65853, "epoch": 793} {"train_loss": -20.569353103637695, "global_step": 65854, "epoch": 793} {"train_loss": -20.959182739257812, "global_step": 65855, "epoch": 793} {"train_loss": -20.259124755859375, "global_step": 65856, "epoch": 793} {"train_loss": -20.78144645690918, "global_step": 65857, "epoch": 793} {"train_loss": -20.818632125854492, "global_step": 65858, "epoch": 793} {"train_loss": -20.567066192626953, "global_step": 65859, "epoch": 793} {"train_loss": -20.58253288269043, "global_step": 65860, "epoch": 793} {"train_loss": -20.92975425720215, "global_step": 65861, "epoch": 793} {"train_loss": -20.512521743774414, "global_step": 65862, "epoch": 793} {"train_loss": -20.465604782104492, "global_step": 65863, "epoch": 793} {"train_loss": -20.53786277770996, "global_step": 65864, "epoch": 793} {"train_loss": -20.630168914794922, "global_step": 65865, "epoch": 793} {"train_loss": -20.70686912536621, "global_step": 65866, "epoch": 793} {"train_loss": -20.998350143432617, "global_step": 65867, "epoch": 793} {"train_loss": -20.4136962890625, "global_step": 65868, "epoch": 793} {"train_loss": -20.58697509765625, "global_step": 65869, "epoch": 793} {"train_loss": -20.954435348510742, "global_step": 65870, "epoch": 793} {"train_loss": -20.457401275634766, "global_step": 65871, "epoch": 793} {"train_loss": -20.68333625793457, "global_step": 65872, "epoch": 793} {"train_loss": -20.50095558166504, "global_step": 65873, "epoch": 793} {"train_loss": -20.438894271850586, "global_step": 65874, "epoch": 793} {"train_loss": -20.598630905151367, "global_step": 65875, "epoch": 793} {"train_loss": -20.654943466186523, "global_step": 65876, "epoch": 793} {"train_loss": -20.23545265197754, "global_step": 65877, "epoch": 793} {"train_loss": -20.676542282104492, "global_step": 65878, "epoch": 793} {"train_loss": -20.52809715270996, "global_step": 65879, "epoch": 793} {"train_loss": -20.58821678161621, "global_step": 65880, "epoch": 793} {"train_loss": -20.78867530822754, "global_step": 65881, "epoch": 793} {"train_loss": -21.015226364135742, "global_step": 65882, "epoch": 793} {"train_loss": -20.709514617919922, "global_step": 65883, "epoch": 793} {"train_loss": -20.79173469543457, "global_step": 65884, "epoch": 793} {"train_loss": -20.648603439331055, "global_step": 65885, "epoch": 793} {"train_loss": -20.45218849182129, "global_step": 65886, "epoch": 793} {"train_loss": -20.901348114013672, "global_step": 65887, "epoch": 793} {"train_loss": -20.59571075439453, "global_step": 65888, "epoch": 793} {"train_loss": -20.60207748413086, "global_step": 65889, "epoch": 793} {"train_loss": -20.621084213256836, "global_step": 65890, "epoch": 793} {"train_loss": -20.59947967529297, "global_step": 65891, "epoch": 793} {"train_loss": -20.617633819580078, "global_step": 65892, "epoch": 793} {"train_loss": -20.736902236938477, "global_step": 65893, "epoch": 793} {"train_loss": -20.27980613708496, "global_step": 65894, "epoch": 793} {"train_loss": -20.454975128173828, "global_step": 65895, "epoch": 793} {"train_loss": -20.548160552978516, "global_step": 65896, "epoch": 793} {"train_loss": -20.808603286743164, "global_step": 65897, "epoch": 793} {"train_loss": -20.875837326049805, "global_step": 65898, "epoch": 793} {"train_loss": -20.429349899291992, "global_step": 65899, "epoch": 793} {"train_loss": -20.75739860534668, "global_step": 65900, "epoch": 793} {"train_loss": -20.57964021613799, "global_step": 65901, "epoch": 793, "val_loss": 5897137.0} {"train_loss": -20.54207420349121, "global_step": 65902, "epoch": 794} {"train_loss": -20.744731903076172, "global_step": 65903, "epoch": 794} {"train_loss": -20.90681266784668, "global_step": 65904, "epoch": 794} {"train_loss": -20.875667572021484, "global_step": 65905, "epoch": 794} {"train_loss": -20.863473892211914, "global_step": 65906, "epoch": 794} {"train_loss": -20.673828125, "global_step": 65907, "epoch": 794} {"train_loss": -20.681753158569336, "global_step": 65908, "epoch": 794} {"train_loss": -20.66373062133789, "global_step": 65909, "epoch": 794} {"train_loss": -20.408538818359375, "global_step": 65910, "epoch": 794} {"train_loss": -20.79401397705078, "global_step": 65911, "epoch": 794} {"train_loss": -20.66229248046875, "global_step": 65912, "epoch": 794} {"train_loss": -20.579038619995117, "global_step": 65913, "epoch": 794} {"train_loss": -20.382001876831055, "global_step": 65914, "epoch": 794} {"train_loss": -20.75945472717285, "global_step": 65915, "epoch": 794} {"train_loss": -20.29111671447754, "global_step": 65916, "epoch": 794} {"train_loss": -20.715200424194336, "global_step": 65917, "epoch": 794} {"train_loss": -20.875280380249023, "global_step": 65918, "epoch": 794} {"train_loss": -20.827146530151367, "global_step": 65919, "epoch": 794} {"train_loss": -20.929651260375977, "global_step": 65920, "epoch": 794} {"train_loss": -20.7081356048584, "global_step": 65921, "epoch": 794} {"train_loss": -20.934324264526367, "global_step": 65922, "epoch": 794} {"train_loss": -20.827810287475586, "global_step": 65923, "epoch": 794} {"train_loss": -20.409515380859375, "global_step": 65924, "epoch": 794} {"train_loss": -20.466684341430664, "global_step": 65925, "epoch": 794} {"train_loss": -20.57325553894043, "global_step": 65926, "epoch": 794} {"train_loss": -20.218612670898438, "global_step": 65927, "epoch": 794} {"train_loss": -20.722421646118164, "global_step": 65928, "epoch": 794} {"train_loss": -20.43313980102539, "global_step": 65929, "epoch": 794} {"train_loss": -20.92585563659668, "global_step": 65930, "epoch": 794} {"train_loss": -20.747873306274414, "global_step": 65931, "epoch": 794} {"train_loss": -20.567874908447266, "global_step": 65932, "epoch": 794} {"train_loss": -20.722309112548828, "global_step": 65933, "epoch": 794} {"train_loss": -20.568159103393555, "global_step": 65934, "epoch": 794} {"train_loss": -20.55970573425293, "global_step": 65935, "epoch": 794} {"train_loss": -20.364652633666992, "global_step": 65936, "epoch": 794} {"train_loss": -20.735519409179688, "global_step": 65937, "epoch": 794} {"train_loss": -20.791671752929688, "global_step": 65938, "epoch": 794} {"train_loss": -20.621976852416992, "global_step": 65939, "epoch": 794} {"train_loss": -20.41855239868164, "global_step": 65940, "epoch": 794} {"train_loss": -20.86237907409668, "global_step": 65941, "epoch": 794} {"train_loss": -20.97840690612793, "global_step": 65942, "epoch": 794} {"train_loss": -20.581134796142578, "global_step": 65943, "epoch": 794} {"train_loss": -20.61809539794922, "global_step": 65944, "epoch": 794} {"train_loss": -20.51068687438965, "global_step": 65945, "epoch": 794} {"train_loss": -20.81831932067871, "global_step": 65946, "epoch": 794} {"train_loss": -20.90785789489746, "global_step": 65947, "epoch": 794} {"train_loss": -20.562957763671875, "global_step": 65948, "epoch": 794} {"train_loss": -20.793415069580078, "global_step": 65949, "epoch": 794} {"train_loss": -20.861713409423828, "global_step": 65950, "epoch": 794} {"train_loss": -20.929685592651367, "global_step": 65951, "epoch": 794} {"train_loss": -20.881439208984375, "global_step": 65952, "epoch": 794} {"train_loss": -20.643978118896484, "global_step": 65953, "epoch": 794} {"train_loss": -20.81782341003418, "global_step": 65954, "epoch": 794} {"train_loss": -20.4395694732666, "global_step": 65955, "epoch": 794} {"train_loss": -20.58782386779785, "global_step": 65956, "epoch": 794} {"train_loss": -20.566404342651367, "global_step": 65957, "epoch": 794} {"train_loss": -20.64349937438965, "global_step": 65958, "epoch": 794} {"train_loss": -20.990785598754883, "global_step": 65959, "epoch": 794} {"train_loss": -20.845579147338867, "global_step": 65960, "epoch": 794} {"train_loss": -20.739843368530273, "global_step": 65961, "epoch": 794} {"train_loss": -20.766416549682617, "global_step": 65962, "epoch": 794} {"train_loss": -20.65200424194336, "global_step": 65963, "epoch": 794} {"train_loss": -20.923446655273438, "global_step": 65964, "epoch": 794} {"train_loss": -20.68404769897461, "global_step": 65965, "epoch": 794} {"train_loss": -20.8547420501709, "global_step": 65966, "epoch": 794} {"train_loss": -20.794416427612305, "global_step": 65967, "epoch": 794} {"train_loss": -20.666242599487305, "global_step": 65968, "epoch": 794} {"train_loss": -20.570270538330078, "global_step": 65969, "epoch": 794} {"train_loss": -20.464710235595703, "global_step": 65970, "epoch": 794} {"train_loss": -20.424142837524414, "global_step": 65971, "epoch": 794} {"train_loss": -20.282608032226562, "global_step": 65972, "epoch": 794} {"train_loss": -20.52412986755371, "global_step": 65973, "epoch": 794} {"train_loss": -20.613527297973633, "global_step": 65974, "epoch": 794} {"train_loss": -21.285215377807617, "global_step": 65975, "epoch": 794} {"train_loss": -21.18269920349121, "global_step": 65976, "epoch": 794} {"train_loss": -20.804946899414062, "global_step": 65977, "epoch": 794} {"train_loss": -20.800161361694336, "global_step": 65978, "epoch": 794} {"train_loss": -20.240123748779297, "global_step": 65979, "epoch": 794} {"train_loss": -20.6772403717041, "global_step": 65980, "epoch": 794} {"train_loss": -20.80853843688965, "global_step": 65981, "epoch": 794} {"train_loss": -20.657529830932617, "global_step": 65982, "epoch": 794} {"train_loss": -20.412961959838867, "global_step": 65983, "epoch": 794} {"train_loss": -20.678801226328655, "global_step": 65984, "epoch": 794, "val_loss": 5923196.5} {"train_loss": -19.999256134033203, "global_step": 65985, "epoch": 795} {"train_loss": -20.341886520385742, "global_step": 65986, "epoch": 795} {"train_loss": -20.284076690673828, "global_step": 65987, "epoch": 795} {"train_loss": -20.59876823425293, "global_step": 65988, "epoch": 795} {"train_loss": -20.591148376464844, "global_step": 65989, "epoch": 795} {"train_loss": -20.297096252441406, "global_step": 65990, "epoch": 795} {"train_loss": -20.426870346069336, "global_step": 65991, "epoch": 795} {"train_loss": -20.454374313354492, "global_step": 65992, "epoch": 795} {"train_loss": -20.66471290588379, "global_step": 65993, "epoch": 795} {"train_loss": -20.762775421142578, "global_step": 65994, "epoch": 795} {"train_loss": -20.400920867919922, "global_step": 65995, "epoch": 795} {"train_loss": -20.52306365966797, "global_step": 65996, "epoch": 795} {"train_loss": -20.691633224487305, "global_step": 65997, "epoch": 795} {"train_loss": -20.7349796295166, "global_step": 65998, "epoch": 795} {"train_loss": -20.505582809448242, "global_step": 65999, "epoch": 795} {"train_loss": -20.65399742126465, "global_step": 66000, "epoch": 795} {"train_loss": -20.659982681274414, "global_step": 66001, "epoch": 795} {"train_loss": -20.187910079956055, "global_step": 66002, "epoch": 795} {"train_loss": -20.501340866088867, "global_step": 66003, "epoch": 795} {"train_loss": -20.66468620300293, "global_step": 66004, "epoch": 795} {"train_loss": -20.555570602416992, "global_step": 66005, "epoch": 795} {"train_loss": -20.790218353271484, "global_step": 66006, "epoch": 795} {"train_loss": -20.613391876220703, "global_step": 66007, "epoch": 795} {"train_loss": -20.4006404876709, "global_step": 66008, "epoch": 795} {"train_loss": -20.743844985961914, "global_step": 66009, "epoch": 795} {"train_loss": -20.973365783691406, "global_step": 66010, "epoch": 795} {"train_loss": -20.265424728393555, "global_step": 66011, "epoch": 795} {"train_loss": -20.479145050048828, "global_step": 66012, "epoch": 795} {"train_loss": -20.682889938354492, "global_step": 66013, "epoch": 795} {"train_loss": -20.66913414001465, "global_step": 66014, "epoch": 795} {"train_loss": -20.57636833190918, "global_step": 66015, "epoch": 795} {"train_loss": -20.58504295349121, "global_step": 66016, "epoch": 795} {"train_loss": -20.523971557617188, "global_step": 66017, "epoch": 795} {"train_loss": -20.76938819885254, "global_step": 66018, "epoch": 795} {"train_loss": -20.552663803100586, "global_step": 66019, "epoch": 795} {"train_loss": -20.83844757080078, "global_step": 66020, "epoch": 795} {"train_loss": -21.04319190979004, "global_step": 66021, "epoch": 795} {"train_loss": -20.62275505065918, "global_step": 66022, "epoch": 795} {"train_loss": -20.767324447631836, "global_step": 66023, "epoch": 795} {"train_loss": -20.730056762695312, "global_step": 66024, "epoch": 795} {"train_loss": -20.557273864746094, "global_step": 66025, "epoch": 795} {"train_loss": -20.94260597229004, "global_step": 66026, "epoch": 795} {"train_loss": -20.793298721313477, "global_step": 66027, "epoch": 795} {"train_loss": -20.437551498413086, "global_step": 66028, "epoch": 795} {"train_loss": -20.698932647705078, "global_step": 66029, "epoch": 795} {"train_loss": -20.47357749938965, "global_step": 66030, "epoch": 795} {"train_loss": -20.50607681274414, "global_step": 66031, "epoch": 795} {"train_loss": -20.445737838745117, "global_step": 66032, "epoch": 795} {"train_loss": -20.26093864440918, "global_step": 66033, "epoch": 795} {"train_loss": -20.813831329345703, "global_step": 66034, "epoch": 795} {"train_loss": -20.352710723876953, "global_step": 66035, "epoch": 795} {"train_loss": -20.734989166259766, "global_step": 66036, "epoch": 795} {"train_loss": -20.5145320892334, "global_step": 66037, "epoch": 795} {"train_loss": -20.710371017456055, "global_step": 66038, "epoch": 795} {"train_loss": -20.26980972290039, "global_step": 66039, "epoch": 795} {"train_loss": -20.421619415283203, "global_step": 66040, "epoch": 795} {"train_loss": -20.910268783569336, "global_step": 66041, "epoch": 795} {"train_loss": -20.419187545776367, "global_step": 66042, "epoch": 795} {"train_loss": -20.604597091674805, "global_step": 66043, "epoch": 795} {"train_loss": -20.615995407104492, "global_step": 66044, "epoch": 795} {"train_loss": -20.603158950805664, "global_step": 66045, "epoch": 795} {"train_loss": -20.551956176757812, "global_step": 66046, "epoch": 795} {"train_loss": -20.806228637695312, "global_step": 66047, "epoch": 795} {"train_loss": -20.59117317199707, "global_step": 66048, "epoch": 795} {"train_loss": -20.76795768737793, "global_step": 66049, "epoch": 795} {"train_loss": -20.91027069091797, "global_step": 66050, "epoch": 795} {"train_loss": -20.518678665161133, "global_step": 66051, "epoch": 795} {"train_loss": -20.676485061645508, "global_step": 66052, "epoch": 795} {"train_loss": -20.302566528320312, "global_step": 66053, "epoch": 795} {"train_loss": -20.82700538635254, "global_step": 66054, "epoch": 795} {"train_loss": -20.44217300415039, "global_step": 66055, "epoch": 795} {"train_loss": -20.61345100402832, "global_step": 66056, "epoch": 795} {"train_loss": -20.672550201416016, "global_step": 66057, "epoch": 795} {"train_loss": -20.538192749023438, "global_step": 66058, "epoch": 795} {"train_loss": -21.03267478942871, "global_step": 66059, "epoch": 795} {"train_loss": -20.358301162719727, "global_step": 66060, "epoch": 795} {"train_loss": -20.728750228881836, "global_step": 66061, "epoch": 795} {"train_loss": -20.831579208374023, "global_step": 66062, "epoch": 795} {"train_loss": -20.589406967163086, "global_step": 66063, "epoch": 795} {"train_loss": -20.57081413269043, "global_step": 66064, "epoch": 795} {"train_loss": -20.22598648071289, "global_step": 66065, "epoch": 795} {"train_loss": -20.640411376953125, "global_step": 66066, "epoch": 795} {"train_loss": -20.590905545705773, "global_step": 66067, "epoch": 795, "val_loss": 5898640.0} {"train_loss": -20.915973663330078, "global_step": 66068, "epoch": 796} {"train_loss": -20.298261642456055, "global_step": 66069, "epoch": 796} {"train_loss": -20.41130256652832, "global_step": 66070, "epoch": 796} {"train_loss": -20.451181411743164, "global_step": 66071, "epoch": 796} {"train_loss": -20.723621368408203, "global_step": 66072, "epoch": 796} {"train_loss": -21.07032585144043, "global_step": 66073, "epoch": 796} {"train_loss": -20.597185134887695, "global_step": 66074, "epoch": 796} {"train_loss": -20.467960357666016, "global_step": 66075, "epoch": 796} {"train_loss": -20.482370376586914, "global_step": 66076, "epoch": 796} {"train_loss": -20.382652282714844, "global_step": 66077, "epoch": 796} {"train_loss": -20.606054306030273, "global_step": 66078, "epoch": 796} {"train_loss": -20.71918296813965, "global_step": 66079, "epoch": 796} {"train_loss": -20.879291534423828, "global_step": 66080, "epoch": 796} {"train_loss": -20.068132400512695, "global_step": 66081, "epoch": 796} {"train_loss": -20.436315536499023, "global_step": 66082, "epoch": 796} {"train_loss": -20.64764976501465, "global_step": 66083, "epoch": 796} {"train_loss": -20.339887619018555, "global_step": 66084, "epoch": 796} {"train_loss": -20.50252914428711, "global_step": 66085, "epoch": 796} {"train_loss": -20.89512062072754, "global_step": 66086, "epoch": 796} {"train_loss": -20.479206085205078, "global_step": 66087, "epoch": 796} {"train_loss": -20.6730899810791, "global_step": 66088, "epoch": 796} {"train_loss": -20.49088478088379, "global_step": 66089, "epoch": 796} {"train_loss": -20.29396629333496, "global_step": 66090, "epoch": 796} {"train_loss": -20.635967254638672, "global_step": 66091, "epoch": 796} {"train_loss": -20.60774040222168, "global_step": 66092, "epoch": 796} {"train_loss": -20.69110870361328, "global_step": 66093, "epoch": 796} {"train_loss": -21.093814849853516, "global_step": 66094, "epoch": 796} {"train_loss": -20.831623077392578, "global_step": 66095, "epoch": 796} {"train_loss": -20.781539916992188, "global_step": 66096, "epoch": 796} {"train_loss": -20.677946090698242, "global_step": 66097, "epoch": 796} {"train_loss": -20.5876522064209, "global_step": 66098, "epoch": 796} {"train_loss": -20.432796478271484, "global_step": 66099, "epoch": 796} {"train_loss": -20.351776123046875, "global_step": 66100, "epoch": 796} {"train_loss": -20.240690231323242, "global_step": 66101, "epoch": 796} {"train_loss": -20.574535369873047, "global_step": 66102, "epoch": 796} {"train_loss": -20.548526763916016, "global_step": 66103, "epoch": 796} {"train_loss": -21.069377899169922, "global_step": 66104, "epoch": 796} {"train_loss": -20.4052791595459, "global_step": 66105, "epoch": 796} {"train_loss": -20.9007625579834, "global_step": 66106, "epoch": 796} {"train_loss": -20.58689308166504, "global_step": 66107, "epoch": 796} {"train_loss": -20.947927474975586, "global_step": 66108, "epoch": 796} {"train_loss": -20.49392318725586, "global_step": 66109, "epoch": 796} {"train_loss": -20.946447372436523, "global_step": 66110, "epoch": 796} {"train_loss": -20.70686149597168, "global_step": 66111, "epoch": 796} {"train_loss": -20.71907615661621, "global_step": 66112, "epoch": 796} {"train_loss": -20.595685958862305, "global_step": 66113, "epoch": 796} {"train_loss": -20.79868507385254, "global_step": 66114, "epoch": 796} {"train_loss": -20.2369441986084, "global_step": 66115, "epoch": 796} {"train_loss": -20.65873908996582, "global_step": 66116, "epoch": 796} {"train_loss": -20.284116744995117, "global_step": 66117, "epoch": 796} {"train_loss": -20.42714500427246, "global_step": 66118, "epoch": 796} {"train_loss": -21.05980682373047, "global_step": 66119, "epoch": 796} {"train_loss": -20.51700210571289, "global_step": 66120, "epoch": 796} {"train_loss": -20.7777156829834, "global_step": 66121, "epoch": 796} {"train_loss": -20.82929801940918, "global_step": 66122, "epoch": 796} {"train_loss": -20.595930099487305, "global_step": 66123, "epoch": 796} {"train_loss": -20.594839096069336, "global_step": 66124, "epoch": 796} {"train_loss": -20.937652587890625, "global_step": 66125, "epoch": 796} {"train_loss": -20.733320236206055, "global_step": 66126, "epoch": 796} {"train_loss": -20.39393424987793, "global_step": 66127, "epoch": 796} {"train_loss": -20.62896728515625, "global_step": 66128, "epoch": 796} {"train_loss": -20.995094299316406, "global_step": 66129, "epoch": 796} {"train_loss": -20.734159469604492, "global_step": 66130, "epoch": 796} {"train_loss": -20.969911575317383, "global_step": 66131, "epoch": 796} {"train_loss": -20.78291893005371, "global_step": 66132, "epoch": 796} {"train_loss": -20.69040298461914, "global_step": 66133, "epoch": 796} {"train_loss": -20.625478744506836, "global_step": 66134, "epoch": 796} {"train_loss": -20.767271041870117, "global_step": 66135, "epoch": 796} {"train_loss": -20.475130081176758, "global_step": 66136, "epoch": 796} {"train_loss": -20.57229232788086, "global_step": 66137, "epoch": 796} {"train_loss": -21.063276290893555, "global_step": 66138, "epoch": 796} {"train_loss": -20.808246612548828, "global_step": 66139, "epoch": 796} {"train_loss": -20.812002182006836, "global_step": 66140, "epoch": 796} {"train_loss": -20.887849807739258, "global_step": 66141, "epoch": 796} {"train_loss": -20.985191345214844, "global_step": 66142, "epoch": 796} {"train_loss": -20.970800399780273, "global_step": 66143, "epoch": 796} {"train_loss": -20.892276763916016, "global_step": 66144, "epoch": 796} {"train_loss": -20.62241554260254, "global_step": 66145, "epoch": 796} {"train_loss": -20.60861587524414, "global_step": 66146, "epoch": 796} {"train_loss": -20.559598922729492, "global_step": 66147, "epoch": 796} {"train_loss": -20.724084854125977, "global_step": 66148, "epoch": 796} {"train_loss": -20.53386116027832, "global_step": 66149, "epoch": 796} {"train_loss": -20.669407718152886, "global_step": 66150, "epoch": 796, "val_loss": 5929023.0} {"train_loss": -20.758474349975586, "global_step": 66151, "epoch": 797} {"train_loss": -20.352874755859375, "global_step": 66152, "epoch": 797} {"train_loss": -20.634611129760742, "global_step": 66153, "epoch": 797} {"train_loss": -20.542673110961914, "global_step": 66154, "epoch": 797} {"train_loss": -20.553451538085938, "global_step": 66155, "epoch": 797} {"train_loss": -20.63926124572754, "global_step": 66156, "epoch": 797} {"train_loss": -20.50648307800293, "global_step": 66157, "epoch": 797} {"train_loss": -20.288454055786133, "global_step": 66158, "epoch": 797} {"train_loss": -20.681442260742188, "global_step": 66159, "epoch": 797} {"train_loss": -20.80112075805664, "global_step": 66160, "epoch": 797} {"train_loss": -20.719482421875, "global_step": 66161, "epoch": 797} {"train_loss": -20.7669677734375, "global_step": 66162, "epoch": 797} {"train_loss": -20.465444564819336, "global_step": 66163, "epoch": 797} {"train_loss": -20.47541618347168, "global_step": 66164, "epoch": 797} {"train_loss": -20.64710235595703, "global_step": 66165, "epoch": 797} {"train_loss": -20.955854415893555, "global_step": 66166, "epoch": 797} {"train_loss": -20.643842697143555, "global_step": 66167, "epoch": 797} {"train_loss": -20.74090003967285, "global_step": 66168, "epoch": 797} {"train_loss": -20.80378532409668, "global_step": 66169, "epoch": 797} {"train_loss": -20.61648178100586, "global_step": 66170, "epoch": 797} {"train_loss": -20.53272247314453, "global_step": 66171, "epoch": 797} {"train_loss": -20.55088233947754, "global_step": 66172, "epoch": 797} {"train_loss": -20.55044937133789, "global_step": 66173, "epoch": 797} {"train_loss": -20.748981475830078, "global_step": 66174, "epoch": 797} {"train_loss": -20.544361114501953, "global_step": 66175, "epoch": 797} {"train_loss": -20.476791381835938, "global_step": 66176, "epoch": 797} {"train_loss": -20.554052352905273, "global_step": 66177, "epoch": 797} {"train_loss": -20.53571128845215, "global_step": 66178, "epoch": 797} {"train_loss": -20.33777618408203, "global_step": 66179, "epoch": 797} {"train_loss": -20.954442977905273, "global_step": 66180, "epoch": 797} {"train_loss": -20.672597885131836, "global_step": 66181, "epoch": 797} {"train_loss": -20.886911392211914, "global_step": 66182, "epoch": 797} {"train_loss": -20.960554122924805, "global_step": 66183, "epoch": 797} {"train_loss": -20.659543991088867, "global_step": 66184, "epoch": 797} {"train_loss": -20.525793075561523, "global_step": 66185, "epoch": 797} {"train_loss": -20.341672897338867, "global_step": 66186, "epoch": 797} {"train_loss": -20.907499313354492, "global_step": 66187, "epoch": 797} {"train_loss": -20.056772232055664, "global_step": 66188, "epoch": 797} {"train_loss": -20.276653289794922, "global_step": 66189, "epoch": 797} {"train_loss": -20.716035842895508, "global_step": 66190, "epoch": 797} {"train_loss": -20.50371742248535, "global_step": 66191, "epoch": 797} {"train_loss": -20.42363929748535, "global_step": 66192, "epoch": 797} {"train_loss": -20.839466094970703, "global_step": 66193, "epoch": 797} {"train_loss": -20.52069091796875, "global_step": 66194, "epoch": 797} {"train_loss": -20.769832611083984, "global_step": 66195, "epoch": 797} {"train_loss": -20.762863159179688, "global_step": 66196, "epoch": 797} {"train_loss": -20.46445655822754, "global_step": 66197, "epoch": 797} {"train_loss": -20.913930892944336, "global_step": 66198, "epoch": 797} {"train_loss": -20.77118492126465, "global_step": 66199, "epoch": 797} {"train_loss": -20.76393699645996, "global_step": 66200, "epoch": 797} {"train_loss": -20.240859985351562, "global_step": 66201, "epoch": 797} {"train_loss": -20.47121810913086, "global_step": 66202, "epoch": 797} {"train_loss": -20.80173110961914, "global_step": 66203, "epoch": 797} {"train_loss": -20.440900802612305, "global_step": 66204, "epoch": 797} {"train_loss": -20.55989646911621, "global_step": 66205, "epoch": 797} {"train_loss": -20.721498489379883, "global_step": 66206, "epoch": 797} {"train_loss": -20.966386795043945, "global_step": 66207, "epoch": 797} {"train_loss": -20.760986328125, "global_step": 66208, "epoch": 797} {"train_loss": -20.4990177154541, "global_step": 66209, "epoch": 797} {"train_loss": -20.37103843688965, "global_step": 66210, "epoch": 797} {"train_loss": -20.634187698364258, "global_step": 66211, "epoch": 797} {"train_loss": -20.63848304748535, "global_step": 66212, "epoch": 797} {"train_loss": -20.77315330505371, "global_step": 66213, "epoch": 797} {"train_loss": -20.866796493530273, "global_step": 66214, "epoch": 797} {"train_loss": -20.413105010986328, "global_step": 66215, "epoch": 797} {"train_loss": -20.609601974487305, "global_step": 66216, "epoch": 797} {"train_loss": -20.715423583984375, "global_step": 66217, "epoch": 797} {"train_loss": -20.211257934570312, "global_step": 66218, "epoch": 797} {"train_loss": -20.499412536621094, "global_step": 66219, "epoch": 797} {"train_loss": -20.296951293945312, "global_step": 66220, "epoch": 797} {"train_loss": -20.620725631713867, "global_step": 66221, "epoch": 797} {"train_loss": -20.401708602905273, "global_step": 66222, "epoch": 797} {"train_loss": -20.91457748413086, "global_step": 66223, "epoch": 797} {"train_loss": -20.48050308227539, "global_step": 66224, "epoch": 797} {"train_loss": -20.653430938720703, "global_step": 66225, "epoch": 797} {"train_loss": -20.745145797729492, "global_step": 66226, "epoch": 797} {"train_loss": -20.556123733520508, "global_step": 66227, "epoch": 797} {"train_loss": -20.673521041870117, "global_step": 66228, "epoch": 797} {"train_loss": -20.667360305786133, "global_step": 66229, "epoch": 797} {"train_loss": -20.251800537109375, "global_step": 66230, "epoch": 797} {"train_loss": -20.34967613220215, "global_step": 66231, "epoch": 797} {"train_loss": -20.86964225769043, "global_step": 66232, "epoch": 797} {"train_loss": -20.61848877136966, "global_step": 66233, "epoch": 797, "val_loss": 6159694.5} {"train_loss": -20.40367317199707, "global_step": 66234, "epoch": 798} {"train_loss": -20.549177169799805, "global_step": 66235, "epoch": 798} {"train_loss": -20.004045486450195, "global_step": 66236, "epoch": 798} {"train_loss": -20.477035522460938, "global_step": 66237, "epoch": 798} {"train_loss": -20.570703506469727, "global_step": 66238, "epoch": 798} {"train_loss": -20.35874366760254, "global_step": 66239, "epoch": 798} {"train_loss": -20.38877296447754, "global_step": 66240, "epoch": 798} {"train_loss": -20.52243423461914, "global_step": 66241, "epoch": 798} {"train_loss": -20.327268600463867, "global_step": 66242, "epoch": 798} {"train_loss": -20.585355758666992, "global_step": 66243, "epoch": 798} {"train_loss": -20.318798065185547, "global_step": 66244, "epoch": 798} {"train_loss": -19.877378463745117, "global_step": 66245, "epoch": 798} {"train_loss": -20.548994064331055, "global_step": 66246, "epoch": 798} {"train_loss": -20.370473861694336, "global_step": 66247, "epoch": 798} {"train_loss": -20.401351928710938, "global_step": 66248, "epoch": 798} {"train_loss": -20.57538414001465, "global_step": 66249, "epoch": 798} {"train_loss": -20.844297409057617, "global_step": 66250, "epoch": 798} {"train_loss": -20.492685317993164, "global_step": 66251, "epoch": 798} {"train_loss": -21.133235931396484, "global_step": 66252, "epoch": 798} {"train_loss": -21.061065673828125, "global_step": 66253, "epoch": 798} {"train_loss": -20.969480514526367, "global_step": 66254, "epoch": 798} {"train_loss": -20.596649169921875, "global_step": 66255, "epoch": 798} {"train_loss": -20.999284744262695, "global_step": 66256, "epoch": 798} {"train_loss": -20.57046890258789, "global_step": 66257, "epoch": 798} {"train_loss": -20.92319679260254, "global_step": 66258, "epoch": 798} {"train_loss": -20.714584350585938, "global_step": 66259, "epoch": 798} {"train_loss": -20.76518440246582, "global_step": 66260, "epoch": 798} {"train_loss": -20.605566024780273, "global_step": 66261, "epoch": 798} {"train_loss": -20.489398956298828, "global_step": 66262, "epoch": 798} {"train_loss": -20.4725284576416, "global_step": 66263, "epoch": 798} {"train_loss": -20.758426666259766, "global_step": 66264, "epoch": 798} {"train_loss": -21.007959365844727, "global_step": 66265, "epoch": 798} {"train_loss": -20.784555435180664, "global_step": 66266, "epoch": 798} {"train_loss": -20.678457260131836, "global_step": 66267, "epoch": 798} {"train_loss": -20.95417594909668, "global_step": 66268, "epoch": 798} {"train_loss": -20.7169132232666, "global_step": 66269, "epoch": 798} {"train_loss": -20.248109817504883, "global_step": 66270, "epoch": 798} {"train_loss": -20.380470275878906, "global_step": 66271, "epoch": 798} {"train_loss": -20.980579376220703, "global_step": 66272, "epoch": 798} {"train_loss": -20.241064071655273, "global_step": 66273, "epoch": 798} {"train_loss": -20.745899200439453, "global_step": 66274, "epoch": 798} {"train_loss": -20.507055282592773, "global_step": 66275, "epoch": 798} {"train_loss": -20.399160385131836, "global_step": 66276, "epoch": 798} {"train_loss": -20.509611129760742, "global_step": 66277, "epoch": 798} {"train_loss": -20.536056518554688, "global_step": 66278, "epoch": 798} {"train_loss": -20.336200714111328, "global_step": 66279, "epoch": 798} {"train_loss": -20.470321655273438, "global_step": 66280, "epoch": 798} {"train_loss": -20.432424545288086, "global_step": 66281, "epoch": 798} {"train_loss": -20.50827407836914, "global_step": 66282, "epoch": 798} {"train_loss": -20.506057739257812, "global_step": 66283, "epoch": 798} {"train_loss": -20.25424575805664, "global_step": 66284, "epoch": 798} {"train_loss": -20.951263427734375, "global_step": 66285, "epoch": 798} {"train_loss": -20.752111434936523, "global_step": 66286, "epoch": 798} {"train_loss": -20.603330612182617, "global_step": 66287, "epoch": 798} {"train_loss": -20.884675979614258, "global_step": 66288, "epoch": 798} {"train_loss": -20.978635787963867, "global_step": 66289, "epoch": 798} {"train_loss": -20.65679359436035, "global_step": 66290, "epoch": 798} {"train_loss": -20.708051681518555, "global_step": 66291, "epoch": 798} {"train_loss": -21.04250144958496, "global_step": 66292, "epoch": 798} {"train_loss": -20.711782455444336, "global_step": 66293, "epoch": 798} {"train_loss": -20.749731063842773, "global_step": 66294, "epoch": 798} {"train_loss": -20.823495864868164, "global_step": 66295, "epoch": 798} {"train_loss": -20.82853126525879, "global_step": 66296, "epoch": 798} {"train_loss": -20.70258331298828, "global_step": 66297, "epoch": 798} {"train_loss": -21.05832862854004, "global_step": 66298, "epoch": 798} {"train_loss": -20.752138137817383, "global_step": 66299, "epoch": 798} {"train_loss": -21.261152267456055, "global_step": 66300, "epoch": 798} {"train_loss": -20.703216552734375, "global_step": 66301, "epoch": 798} {"train_loss": -20.589426040649414, "global_step": 66302, "epoch": 798} {"train_loss": -20.74761962890625, "global_step": 66303, "epoch": 798} {"train_loss": -20.12541389465332, "global_step": 66304, "epoch": 798} {"train_loss": -20.401182174682617, "global_step": 66305, "epoch": 798} {"train_loss": -20.465787887573242, "global_step": 66306, "epoch": 798} {"train_loss": -20.865379333496094, "global_step": 66307, "epoch": 798} {"train_loss": -20.900787353515625, "global_step": 66308, "epoch": 798} {"train_loss": -20.56490135192871, "global_step": 66309, "epoch": 798} {"train_loss": -20.50449562072754, "global_step": 66310, "epoch": 798} {"train_loss": -20.488805770874023, "global_step": 66311, "epoch": 798} {"train_loss": -20.850605010986328, "global_step": 66312, "epoch": 798} {"train_loss": -20.69571304321289, "global_step": 66313, "epoch": 798} {"train_loss": -20.740610122680664, "global_step": 66314, "epoch": 798} {"train_loss": -21.011234283447266, "global_step": 66315, "epoch": 798} {"train_loss": -20.62288360136101, "global_step": 66316, "epoch": 798, "val_loss": 5977221.0} {"train_loss": -20.333749771118164, "global_step": 66317, "epoch": 799} {"train_loss": -20.736270904541016, "global_step": 66318, "epoch": 799} {"train_loss": -20.502553939819336, "global_step": 66319, "epoch": 799} {"train_loss": -20.59646224975586, "global_step": 66320, "epoch": 799} {"train_loss": -20.519487380981445, "global_step": 66321, "epoch": 799} {"train_loss": -20.680139541625977, "global_step": 66322, "epoch": 799} {"train_loss": -20.412736892700195, "global_step": 66323, "epoch": 799} {"train_loss": -20.812849044799805, "global_step": 66324, "epoch": 799} {"train_loss": -20.752363204956055, "global_step": 66325, "epoch": 799} {"train_loss": -20.17945671081543, "global_step": 66326, "epoch": 799} {"train_loss": -20.364809036254883, "global_step": 66327, "epoch": 799} {"train_loss": -20.149524688720703, "global_step": 66328, "epoch": 799} {"train_loss": -20.925016403198242, "global_step": 66329, "epoch": 799} {"train_loss": -20.39435386657715, "global_step": 66330, "epoch": 799} {"train_loss": -20.644943237304688, "global_step": 66331, "epoch": 799} {"train_loss": -20.571561813354492, "global_step": 66332, "epoch": 799} {"train_loss": -20.849660873413086, "global_step": 66333, "epoch": 799} {"train_loss": -20.895986557006836, "global_step": 66334, "epoch": 799} {"train_loss": -20.358478546142578, "global_step": 66335, "epoch": 799} {"train_loss": -21.059560775756836, "global_step": 66336, "epoch": 799} {"train_loss": -20.734411239624023, "global_step": 66337, "epoch": 799} {"train_loss": -20.7830867767334, "global_step": 66338, "epoch": 799} {"train_loss": -20.72799301147461, "global_step": 66339, "epoch": 799} {"train_loss": -20.688264846801758, "global_step": 66340, "epoch": 799} {"train_loss": -20.517776489257812, "global_step": 66341, "epoch": 799} {"train_loss": -20.73119354248047, "global_step": 66342, "epoch": 799} {"train_loss": -20.426605224609375, "global_step": 66343, "epoch": 799} {"train_loss": -20.94791603088379, "global_step": 66344, "epoch": 799} {"train_loss": -20.4467716217041, "global_step": 66345, "epoch": 799} {"train_loss": -20.479419708251953, "global_step": 66346, "epoch": 799} {"train_loss": -20.466022491455078, "global_step": 66347, "epoch": 799} {"train_loss": -20.55621910095215, "global_step": 66348, "epoch": 799} {"train_loss": -20.812397003173828, "global_step": 66349, "epoch": 799} {"train_loss": -20.8961238861084, "global_step": 66350, "epoch": 799} {"train_loss": -21.012157440185547, "global_step": 66351, "epoch": 799} {"train_loss": -20.793598175048828, "global_step": 66352, "epoch": 799} {"train_loss": -20.753347396850586, "global_step": 66353, "epoch": 799} {"train_loss": -20.897417068481445, "global_step": 66354, "epoch": 799} {"train_loss": -20.54691505432129, "global_step": 66355, "epoch": 799} {"train_loss": -20.53079605102539, "global_step": 66356, "epoch": 799} {"train_loss": -20.728635787963867, "global_step": 66357, "epoch": 799} {"train_loss": -20.27132797241211, "global_step": 66358, "epoch": 799} {"train_loss": -20.42548942565918, "global_step": 66359, "epoch": 799} {"train_loss": -20.461313247680664, "global_step": 66360, "epoch": 799} {"train_loss": -20.577640533447266, "global_step": 66361, "epoch": 799} {"train_loss": -20.56390380859375, "global_step": 66362, "epoch": 799} {"train_loss": -20.527868270874023, "global_step": 66363, "epoch": 799} {"train_loss": -20.59124183654785, "global_step": 66364, "epoch": 799} {"train_loss": -20.854337692260742, "global_step": 66365, "epoch": 799} {"train_loss": -20.59015464782715, "global_step": 66366, "epoch": 799} {"train_loss": -20.327396392822266, "global_step": 66367, "epoch": 799} {"train_loss": -20.34752655029297, "global_step": 66368, "epoch": 799} {"train_loss": -20.699298858642578, "global_step": 66369, "epoch": 799} {"train_loss": -20.557607650756836, "global_step": 66370, "epoch": 799} {"train_loss": -20.682973861694336, "global_step": 66371, "epoch": 799} {"train_loss": -20.715002059936523, "global_step": 66372, "epoch": 799} {"train_loss": -21.003877639770508, "global_step": 66373, "epoch": 799} {"train_loss": -20.43254280090332, "global_step": 66374, "epoch": 799} {"train_loss": -20.64971923828125, "global_step": 66375, "epoch": 799} {"train_loss": -20.959911346435547, "global_step": 66376, "epoch": 799} {"train_loss": -20.573047637939453, "global_step": 66377, "epoch": 799} {"train_loss": -20.565526962280273, "global_step": 66378, "epoch": 799} {"train_loss": -20.821908950805664, "global_step": 66379, "epoch": 799} {"train_loss": -21.096227645874023, "global_step": 66380, "epoch": 799} {"train_loss": -20.473047256469727, "global_step": 66381, "epoch": 799} {"train_loss": -20.887958526611328, "global_step": 66382, "epoch": 799} {"train_loss": -20.255456924438477, "global_step": 66383, "epoch": 799} {"train_loss": -20.72201919555664, "global_step": 66384, "epoch": 799} {"train_loss": -19.948213577270508, "global_step": 66385, "epoch": 799} {"train_loss": -21.131338119506836, "global_step": 66386, "epoch": 799} {"train_loss": -20.670148849487305, "global_step": 66387, "epoch": 799} {"train_loss": -20.32539176940918, "global_step": 66388, "epoch": 799} {"train_loss": -20.071325302124023, "global_step": 66389, "epoch": 799} {"train_loss": -21.09454917907715, "global_step": 66390, "epoch": 799} {"train_loss": -20.837566375732422, "global_step": 66391, "epoch": 799} {"train_loss": -20.489492416381836, "global_step": 66392, "epoch": 799} {"train_loss": -20.63312339782715, "global_step": 66393, "epoch": 799} {"train_loss": -20.213850021362305, "global_step": 66394, "epoch": 799} {"train_loss": -20.308345794677734, "global_step": 66395, "epoch": 799} {"train_loss": -20.61168670654297, "global_step": 66396, "epoch": 799} {"train_loss": -20.64689064025879, "global_step": 66397, "epoch": 799} {"train_loss": -20.42945671081543, "global_step": 66398, "epoch": 799} {"train_loss": -20.598826465836492, "global_step": 66399, "epoch": 799, "val_loss": 5742748.5} {"train_loss": -19.78365707397461, "global_step": 66400, "epoch": 800} {"train_loss": -20.296672821044922, "global_step": 66401, "epoch": 800} {"train_loss": -20.24196434020996, "global_step": 66402, "epoch": 800} {"train_loss": -20.08772087097168, "global_step": 66403, "epoch": 800} {"train_loss": -20.302047729492188, "global_step": 66404, "epoch": 800} {"train_loss": -20.102659225463867, "global_step": 66405, "epoch": 800} {"train_loss": -19.93202018737793, "global_step": 66406, "epoch": 800} {"train_loss": -20.347091674804688, "global_step": 66407, "epoch": 800} {"train_loss": -20.476675033569336, "global_step": 66408, "epoch": 800} {"train_loss": -19.999723434448242, "global_step": 66409, "epoch": 800} {"train_loss": -20.274322509765625, "global_step": 66410, "epoch": 800} {"train_loss": -20.01093864440918, "global_step": 66411, "epoch": 800} {"train_loss": -20.449039459228516, "global_step": 66412, "epoch": 800} {"train_loss": -20.296348571777344, "global_step": 66413, "epoch": 800} {"train_loss": -20.13474464416504, "global_step": 66414, "epoch": 800} {"train_loss": -20.4407958984375, "global_step": 66415, "epoch": 800} {"train_loss": -20.608083724975586, "global_step": 66416, "epoch": 800} {"train_loss": -20.96109962463379, "global_step": 66417, "epoch": 800} {"train_loss": -20.345373153686523, "global_step": 66418, "epoch": 800} {"train_loss": -20.90018653869629, "global_step": 66419, "epoch": 800} {"train_loss": -20.589786529541016, "global_step": 66420, "epoch": 800} {"train_loss": -20.86222267150879, "global_step": 66421, "epoch": 800} {"train_loss": -20.58186912536621, "global_step": 66422, "epoch": 800} {"train_loss": -20.633556365966797, "global_step": 66423, "epoch": 800} {"train_loss": -20.79780387878418, "global_step": 66424, "epoch": 800} {"train_loss": -20.857786178588867, "global_step": 66425, "epoch": 800} {"train_loss": -20.48080825805664, "global_step": 66426, "epoch": 800} {"train_loss": -20.717655181884766, "global_step": 66427, "epoch": 800} {"train_loss": -20.898544311523438, "global_step": 66428, "epoch": 800} {"train_loss": -20.91286849975586, "global_step": 66429, "epoch": 800} {"train_loss": -20.647079467773438, "global_step": 66430, "epoch": 800} {"train_loss": -20.697153091430664, "global_step": 66431, "epoch": 800} {"train_loss": -20.655485153198242, "global_step": 66432, "epoch": 800} {"train_loss": -20.67946434020996, "global_step": 66433, "epoch": 800} {"train_loss": -20.804187774658203, "global_step": 66434, "epoch": 800} {"train_loss": -20.544031143188477, "global_step": 66435, "epoch": 800} {"train_loss": -20.385873794555664, "global_step": 66436, "epoch": 800} {"train_loss": -20.484130859375, "global_step": 66437, "epoch": 800} {"train_loss": -20.831317901611328, "global_step": 66438, "epoch": 800} {"train_loss": -20.607271194458008, "global_step": 66439, "epoch": 800} {"train_loss": -20.615755081176758, "global_step": 66440, "epoch": 800} {"train_loss": -20.487268447875977, "global_step": 66441, "epoch": 800} {"train_loss": -20.785215377807617, "global_step": 66442, "epoch": 800} {"train_loss": -20.846649169921875, "global_step": 66443, "epoch": 800} {"train_loss": -20.775327682495117, "global_step": 66444, "epoch": 800} {"train_loss": -21.045743942260742, "global_step": 66445, "epoch": 800} {"train_loss": -20.878339767456055, "global_step": 66446, "epoch": 800} {"train_loss": -20.827606201171875, "global_step": 66447, "epoch": 800} {"train_loss": -20.779088973999023, "global_step": 66448, "epoch": 800} {"train_loss": -20.932729721069336, "global_step": 66449, "epoch": 800} {"train_loss": -20.672842025756836, "global_step": 66450, "epoch": 800} {"train_loss": -20.496397018432617, "global_step": 66451, "epoch": 800} {"train_loss": -20.596378326416016, "global_step": 66452, "epoch": 800} {"train_loss": -20.716894149780273, "global_step": 66453, "epoch": 800} {"train_loss": -20.37810707092285, "global_step": 66454, "epoch": 800} {"train_loss": -20.246967315673828, "global_step": 66455, "epoch": 800} {"train_loss": -20.832475662231445, "global_step": 66456, "epoch": 800} {"train_loss": -20.37425422668457, "global_step": 66457, "epoch": 800} {"train_loss": -20.701698303222656, "global_step": 66458, "epoch": 800} {"train_loss": -20.70103645324707, "global_step": 66459, "epoch": 800} {"train_loss": -20.324188232421875, "global_step": 66460, "epoch": 800} {"train_loss": -20.41855812072754, "global_step": 66461, "epoch": 800} {"train_loss": -20.470783233642578, "global_step": 66462, "epoch": 800} {"train_loss": -20.699783325195312, "global_step": 66463, "epoch": 800} {"train_loss": -20.4045467376709, "global_step": 66464, "epoch": 800} {"train_loss": -20.91728973388672, "global_step": 66465, "epoch": 800} {"train_loss": -20.609004974365234, "global_step": 66466, "epoch": 800} {"train_loss": -20.67557716369629, "global_step": 66467, "epoch": 800} {"train_loss": -20.94654655456543, "global_step": 66468, "epoch": 800} {"train_loss": -20.273056030273438, "global_step": 66469, "epoch": 800} {"train_loss": -20.763193130493164, "global_step": 66470, "epoch": 800} {"train_loss": -20.72795867919922, "global_step": 66471, "epoch": 800} {"train_loss": -20.32819366455078, "global_step": 66472, "epoch": 800} {"train_loss": -20.508419036865234, "global_step": 66473, "epoch": 800} {"train_loss": -20.39046287536621, "global_step": 66474, "epoch": 800} {"train_loss": -20.7612361907959, "global_step": 66475, "epoch": 800} {"train_loss": -20.632394790649414, "global_step": 66476, "epoch": 800} {"train_loss": -20.945781707763672, "global_step": 66477, "epoch": 800} {"train_loss": -20.502485275268555, "global_step": 66478, "epoch": 800} {"train_loss": -20.323741912841797, "global_step": 66479, "epoch": 800} {"train_loss": -20.9522762298584, "global_step": 66480, "epoch": 800} {"train_loss": -20.561771392822266, "global_step": 66481, "epoch": 800} {"train_loss": -20.569010792008367, "global_step": 66482, "epoch": 800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9090909090909091, "val_loss": 5983249.0} {"train_loss": -20.825132369995117, "global_step": 66483, "epoch": 801} {"train_loss": -20.409170150756836, "global_step": 66484, "epoch": 801} {"train_loss": -20.522491455078125, "global_step": 66485, "epoch": 801} {"train_loss": -20.25541114807129, "global_step": 66486, "epoch": 801} {"train_loss": -20.279685974121094, "global_step": 66487, "epoch": 801} {"train_loss": -20.78408432006836, "global_step": 66488, "epoch": 801} {"train_loss": -20.610679626464844, "global_step": 66489, "epoch": 801} {"train_loss": -21.03424644470215, "global_step": 66490, "epoch": 801} {"train_loss": -20.605918884277344, "global_step": 66491, "epoch": 801} {"train_loss": -20.65781593322754, "global_step": 66492, "epoch": 801} {"train_loss": -20.3236141204834, "global_step": 66493, "epoch": 801} {"train_loss": -20.22081184387207, "global_step": 66494, "epoch": 801} {"train_loss": -20.513328552246094, "global_step": 66495, "epoch": 801} {"train_loss": -20.77438735961914, "global_step": 66496, "epoch": 801} {"train_loss": -21.014123916625977, "global_step": 66497, "epoch": 801} {"train_loss": -20.585010528564453, "global_step": 66498, "epoch": 801} {"train_loss": -20.7177791595459, "global_step": 66499, "epoch": 801} {"train_loss": -20.147974014282227, "global_step": 66500, "epoch": 801} {"train_loss": -20.656827926635742, "global_step": 66501, "epoch": 801} {"train_loss": -20.610830307006836, "global_step": 66502, "epoch": 801} {"train_loss": -20.69546890258789, "global_step": 66503, "epoch": 801} {"train_loss": -20.58341407775879, "global_step": 66504, "epoch": 801} {"train_loss": -20.959959030151367, "global_step": 66505, "epoch": 801} {"train_loss": -20.74202537536621, "global_step": 66506, "epoch": 801} {"train_loss": -20.726425170898438, "global_step": 66507, "epoch": 801} {"train_loss": -20.626920700073242, "global_step": 66508, "epoch": 801} {"train_loss": -20.640127182006836, "global_step": 66509, "epoch": 801} {"train_loss": -21.106040954589844, "global_step": 66510, "epoch": 801} {"train_loss": -20.847806930541992, "global_step": 66511, "epoch": 801} {"train_loss": -20.499441146850586, "global_step": 66512, "epoch": 801} {"train_loss": -20.87059783935547, "global_step": 66513, "epoch": 801} {"train_loss": -20.578380584716797, "global_step": 66514, "epoch": 801} {"train_loss": -20.74795913696289, "global_step": 66515, "epoch": 801} {"train_loss": -20.753013610839844, "global_step": 66516, "epoch": 801} {"train_loss": -20.94217300415039, "global_step": 66517, "epoch": 801} {"train_loss": -20.420547485351562, "global_step": 66518, "epoch": 801} {"train_loss": -20.895811080932617, "global_step": 66519, "epoch": 801} {"train_loss": -20.42580223083496, "global_step": 66520, "epoch": 801} {"train_loss": -20.39115333557129, "global_step": 66521, "epoch": 801} {"train_loss": -20.39479637145996, "global_step": 66522, "epoch": 801} {"train_loss": -20.83049964904785, "global_step": 66523, "epoch": 801} {"train_loss": -20.626544952392578, "global_step": 66524, "epoch": 801} {"train_loss": -20.563541412353516, "global_step": 66525, "epoch": 801} {"train_loss": -20.63197898864746, "global_step": 66526, "epoch": 801} {"train_loss": -20.60203742980957, "global_step": 66527, "epoch": 801} {"train_loss": -20.749847412109375, "global_step": 66528, "epoch": 801} {"train_loss": -20.689401626586914, "global_step": 66529, "epoch": 801} {"train_loss": -20.613229751586914, "global_step": 66530, "epoch": 801} {"train_loss": -20.66929054260254, "global_step": 66531, "epoch": 801} {"train_loss": -20.902347564697266, "global_step": 66532, "epoch": 801} {"train_loss": -20.4683780670166, "global_step": 66533, "epoch": 801} {"train_loss": -20.70315933227539, "global_step": 66534, "epoch": 801} {"train_loss": -20.396413803100586, "global_step": 66535, "epoch": 801} {"train_loss": -20.467145919799805, "global_step": 66536, "epoch": 801} {"train_loss": -20.753067016601562, "global_step": 66537, "epoch": 801} {"train_loss": -20.763721466064453, "global_step": 66538, "epoch": 801} {"train_loss": -20.786718368530273, "global_step": 66539, "epoch": 801} {"train_loss": -20.58785629272461, "global_step": 66540, "epoch": 801} {"train_loss": -20.55958366394043, "global_step": 66541, "epoch": 801} {"train_loss": -20.759992599487305, "global_step": 66542, "epoch": 801} {"train_loss": -20.93659782409668, "global_step": 66543, "epoch": 801} {"train_loss": -20.401199340820312, "global_step": 66544, "epoch": 801} {"train_loss": -20.7979736328125, "global_step": 66545, "epoch": 801} {"train_loss": -20.8414306640625, "global_step": 66546, "epoch": 801} {"train_loss": -20.52744483947754, "global_step": 66547, "epoch": 801} {"train_loss": -20.990034103393555, "global_step": 66548, "epoch": 801} {"train_loss": -20.95386505126953, "global_step": 66549, "epoch": 801} {"train_loss": -20.69919204711914, "global_step": 66550, "epoch": 801} {"train_loss": -20.666601181030273, "global_step": 66551, "epoch": 801} {"train_loss": -20.710647583007812, "global_step": 66552, "epoch": 801} {"train_loss": -20.697383880615234, "global_step": 66553, "epoch": 801} {"train_loss": -20.91643714904785, "global_step": 66554, "epoch": 801} {"train_loss": -20.676639556884766, "global_step": 66555, "epoch": 801} {"train_loss": -20.6223087310791, "global_step": 66556, "epoch": 801} {"train_loss": -20.991392135620117, "global_step": 66557, "epoch": 801} {"train_loss": -20.50689125061035, "global_step": 66558, "epoch": 801} {"train_loss": -20.81119728088379, "global_step": 66559, "epoch": 801} {"train_loss": -20.443904876708984, "global_step": 66560, "epoch": 801} {"train_loss": -20.9464111328125, "global_step": 66561, "epoch": 801} {"train_loss": -20.621335983276367, "global_step": 66562, "epoch": 801} {"train_loss": -20.861541748046875, "global_step": 66563, "epoch": 801} {"train_loss": -20.86290740966797, "global_step": 66564, "epoch": 801} {"train_loss": -20.67321060364505, "global_step": 66565, "epoch": 801, "val_loss": 6042446.0} {"train_loss": -20.004837036132812, "global_step": 66566, "epoch": 802} {"train_loss": -20.63435173034668, "global_step": 66567, "epoch": 802} {"train_loss": -20.35381507873535, "global_step": 66568, "epoch": 802} {"train_loss": -20.178930282592773, "global_step": 66569, "epoch": 802} {"train_loss": -20.28959846496582, "global_step": 66570, "epoch": 802} {"train_loss": -20.41171646118164, "global_step": 66571, "epoch": 802} {"train_loss": -20.815732955932617, "global_step": 66572, "epoch": 802} {"train_loss": -20.637664794921875, "global_step": 66573, "epoch": 802} {"train_loss": -20.424392700195312, "global_step": 66574, "epoch": 802} {"train_loss": -20.266660690307617, "global_step": 66575, "epoch": 802} {"train_loss": -20.373044967651367, "global_step": 66576, "epoch": 802} {"train_loss": -20.221521377563477, "global_step": 66577, "epoch": 802} {"train_loss": -20.18849754333496, "global_step": 66578, "epoch": 802} {"train_loss": -20.35503578186035, "global_step": 66579, "epoch": 802} {"train_loss": -20.913593292236328, "global_step": 66580, "epoch": 802} {"train_loss": -20.526437759399414, "global_step": 66581, "epoch": 802} {"train_loss": -20.63270378112793, "global_step": 66582, "epoch": 802} {"train_loss": -20.887680053710938, "global_step": 66583, "epoch": 802} {"train_loss": -20.576061248779297, "global_step": 66584, "epoch": 802} {"train_loss": -20.24896812438965, "global_step": 66585, "epoch": 802} {"train_loss": -20.738323211669922, "global_step": 66586, "epoch": 802} {"train_loss": -21.031282424926758, "global_step": 66587, "epoch": 802} {"train_loss": -20.86903953552246, "global_step": 66588, "epoch": 802} {"train_loss": -21.00965118408203, "global_step": 66589, "epoch": 802} {"train_loss": -20.870262145996094, "global_step": 66590, "epoch": 802} {"train_loss": -20.601947784423828, "global_step": 66591, "epoch": 802} {"train_loss": -20.491287231445312, "global_step": 66592, "epoch": 802} {"train_loss": -20.97430419921875, "global_step": 66593, "epoch": 802} {"train_loss": -20.186399459838867, "global_step": 66594, "epoch": 802} {"train_loss": -20.903738021850586, "global_step": 66595, "epoch": 802} {"train_loss": -20.757749557495117, "global_step": 66596, "epoch": 802} {"train_loss": -20.537107467651367, "global_step": 66597, "epoch": 802} {"train_loss": -20.81157112121582, "global_step": 66598, "epoch": 802} {"train_loss": -20.505338668823242, "global_step": 66599, "epoch": 802} {"train_loss": -20.991056442260742, "global_step": 66600, "epoch": 802} {"train_loss": -20.58980369567871, "global_step": 66601, "epoch": 802} {"train_loss": -20.567569732666016, "global_step": 66602, "epoch": 802} {"train_loss": -20.703454971313477, "global_step": 66603, "epoch": 802} {"train_loss": -20.498367309570312, "global_step": 66604, "epoch": 802} {"train_loss": -20.94278907775879, "global_step": 66605, "epoch": 802} {"train_loss": -20.59525489807129, "global_step": 66606, "epoch": 802} {"train_loss": -20.660995483398438, "global_step": 66607, "epoch": 802} {"train_loss": -20.74959373474121, "global_step": 66608, "epoch": 802} {"train_loss": -20.437042236328125, "global_step": 66609, "epoch": 802} {"train_loss": -21.0570011138916, "global_step": 66610, "epoch": 802} {"train_loss": -20.710294723510742, "global_step": 66611, "epoch": 802} {"train_loss": -20.09442710876465, "global_step": 66612, "epoch": 802} {"train_loss": -20.706838607788086, "global_step": 66613, "epoch": 802} {"train_loss": -20.79193687438965, "global_step": 66614, "epoch": 802} {"train_loss": -20.62074089050293, "global_step": 66615, "epoch": 802} {"train_loss": -20.968456268310547, "global_step": 66616, "epoch": 802} {"train_loss": -20.673320770263672, "global_step": 66617, "epoch": 802} {"train_loss": -20.90212631225586, "global_step": 66618, "epoch": 802} {"train_loss": -20.880565643310547, "global_step": 66619, "epoch": 802} {"train_loss": -20.6212215423584, "global_step": 66620, "epoch": 802} {"train_loss": -20.885648727416992, "global_step": 66621, "epoch": 802} {"train_loss": -21.13201141357422, "global_step": 66622, "epoch": 802} {"train_loss": -20.59616470336914, "global_step": 66623, "epoch": 802} {"train_loss": -20.896780014038086, "global_step": 66624, "epoch": 802} {"train_loss": -20.942047119140625, "global_step": 66625, "epoch": 802} {"train_loss": -21.05413818359375, "global_step": 66626, "epoch": 802} {"train_loss": -20.595380783081055, "global_step": 66627, "epoch": 802} {"train_loss": -20.52030372619629, "global_step": 66628, "epoch": 802} {"train_loss": -20.64235496520996, "global_step": 66629, "epoch": 802} {"train_loss": -21.00876235961914, "global_step": 66630, "epoch": 802} {"train_loss": -21.06861686706543, "global_step": 66631, "epoch": 802} {"train_loss": -20.646991729736328, "global_step": 66632, "epoch": 802} {"train_loss": -20.253751754760742, "global_step": 66633, "epoch": 802} {"train_loss": -20.186927795410156, "global_step": 66634, "epoch": 802} {"train_loss": -20.9390926361084, "global_step": 66635, "epoch": 802} {"train_loss": -20.58440589904785, "global_step": 66636, "epoch": 802} {"train_loss": -20.45197868347168, "global_step": 66637, "epoch": 802} {"train_loss": -20.691911697387695, "global_step": 66638, "epoch": 802} {"train_loss": -20.81441307067871, "global_step": 66639, "epoch": 802} {"train_loss": -21.11693000793457, "global_step": 66640, "epoch": 802} {"train_loss": -21.18655776977539, "global_step": 66641, "epoch": 802} {"train_loss": -20.83831214904785, "global_step": 66642, "epoch": 802} {"train_loss": -21.17977523803711, "global_step": 66643, "epoch": 802} {"train_loss": -20.78244400024414, "global_step": 66644, "epoch": 802} {"train_loss": -20.874521255493164, "global_step": 66645, "epoch": 802} {"train_loss": -20.837282180786133, "global_step": 66646, "epoch": 802} {"train_loss": -21.0490665435791, "global_step": 66647, "epoch": 802} {"train_loss": -20.70543201860175, "global_step": 66648, "epoch": 802, "val_loss": 5912829.5} {"train_loss": -20.86690902709961, "global_step": 66649, "epoch": 803} {"train_loss": -20.557729721069336, "global_step": 66650, "epoch": 803} {"train_loss": -20.430612564086914, "global_step": 66651, "epoch": 803} {"train_loss": -20.348844528198242, "global_step": 66652, "epoch": 803} {"train_loss": -20.64589500427246, "global_step": 66653, "epoch": 803} {"train_loss": -20.6333065032959, "global_step": 66654, "epoch": 803} {"train_loss": -20.037351608276367, "global_step": 66655, "epoch": 803} {"train_loss": -20.783550262451172, "global_step": 66656, "epoch": 803} {"train_loss": -20.649511337280273, "global_step": 66657, "epoch": 803} {"train_loss": -20.201187133789062, "global_step": 66658, "epoch": 803} {"train_loss": -20.514469146728516, "global_step": 66659, "epoch": 803} {"train_loss": -20.67770767211914, "global_step": 66660, "epoch": 803} {"train_loss": -20.74758529663086, "global_step": 66661, "epoch": 803} {"train_loss": -20.6022891998291, "global_step": 66662, "epoch": 803} {"train_loss": -20.494977951049805, "global_step": 66663, "epoch": 803} {"train_loss": -20.568449020385742, "global_step": 66664, "epoch": 803} {"train_loss": -20.572317123413086, "global_step": 66665, "epoch": 803} {"train_loss": -20.67256736755371, "global_step": 66666, "epoch": 803} {"train_loss": -20.26539421081543, "global_step": 66667, "epoch": 803} {"train_loss": -20.804807662963867, "global_step": 66668, "epoch": 803} {"train_loss": -20.93614387512207, "global_step": 66669, "epoch": 803} {"train_loss": -20.6478214263916, "global_step": 66670, "epoch": 803} {"train_loss": -20.65380859375, "global_step": 66671, "epoch": 803} {"train_loss": -20.29473304748535, "global_step": 66672, "epoch": 803} {"train_loss": -20.872861862182617, "global_step": 66673, "epoch": 803} {"train_loss": -20.8841609954834, "global_step": 66674, "epoch": 803} {"train_loss": -21.0103816986084, "global_step": 66675, "epoch": 803} {"train_loss": -20.411033630371094, "global_step": 66676, "epoch": 803} {"train_loss": -20.713956832885742, "global_step": 66677, "epoch": 803} {"train_loss": -20.808513641357422, "global_step": 66678, "epoch": 803} {"train_loss": -20.756881713867188, "global_step": 66679, "epoch": 803} {"train_loss": -20.337541580200195, "global_step": 66680, "epoch": 803} {"train_loss": -20.594409942626953, "global_step": 66681, "epoch": 803} {"train_loss": -20.59770965576172, "global_step": 66682, "epoch": 803} {"train_loss": -20.601642608642578, "global_step": 66683, "epoch": 803} {"train_loss": -20.550861358642578, "global_step": 66684, "epoch": 803} {"train_loss": -20.361032485961914, "global_step": 66685, "epoch": 803} {"train_loss": -20.613988876342773, "global_step": 66686, "epoch": 803} {"train_loss": -20.798337936401367, "global_step": 66687, "epoch": 803} {"train_loss": -20.58320426940918, "global_step": 66688, "epoch": 803} {"train_loss": -20.634824752807617, "global_step": 66689, "epoch": 803} {"train_loss": -20.60301971435547, "global_step": 66690, "epoch": 803} {"train_loss": -20.48084259033203, "global_step": 66691, "epoch": 803} {"train_loss": -20.36310386657715, "global_step": 66692, "epoch": 803} {"train_loss": -20.676502227783203, "global_step": 66693, "epoch": 803} {"train_loss": -20.71656608581543, "global_step": 66694, "epoch": 803} {"train_loss": -20.71784782409668, "global_step": 66695, "epoch": 803} {"train_loss": -20.52409553527832, "global_step": 66696, "epoch": 803} {"train_loss": -20.512975692749023, "global_step": 66697, "epoch": 803} {"train_loss": -20.511066436767578, "global_step": 66698, "epoch": 803} {"train_loss": -20.822803497314453, "global_step": 66699, "epoch": 803} {"train_loss": -20.78438377380371, "global_step": 66700, "epoch": 803} {"train_loss": -20.93528175354004, "global_step": 66701, "epoch": 803} {"train_loss": -20.560840606689453, "global_step": 66702, "epoch": 803} {"train_loss": -21.00764274597168, "global_step": 66703, "epoch": 803} {"train_loss": -20.727313995361328, "global_step": 66704, "epoch": 803} {"train_loss": -20.911230087280273, "global_step": 66705, "epoch": 803} {"train_loss": -20.523483276367188, "global_step": 66706, "epoch": 803} {"train_loss": -20.960580825805664, "global_step": 66707, "epoch": 803} {"train_loss": -20.479711532592773, "global_step": 66708, "epoch": 803} {"train_loss": -20.764389038085938, "global_step": 66709, "epoch": 803} {"train_loss": -20.396835327148438, "global_step": 66710, "epoch": 803} {"train_loss": -20.693204879760742, "global_step": 66711, "epoch": 803} {"train_loss": -20.860095977783203, "global_step": 66712, "epoch": 803} {"train_loss": -20.762990951538086, "global_step": 66713, "epoch": 803} {"train_loss": -20.624773025512695, "global_step": 66714, "epoch": 803} {"train_loss": -20.448942184448242, "global_step": 66715, "epoch": 803} {"train_loss": -20.68621253967285, "global_step": 66716, "epoch": 803} {"train_loss": -20.65632438659668, "global_step": 66717, "epoch": 803} {"train_loss": -20.58588981628418, "global_step": 66718, "epoch": 803} {"train_loss": -20.799680709838867, "global_step": 66719, "epoch": 803} {"train_loss": -20.636091232299805, "global_step": 66720, "epoch": 803} {"train_loss": -20.84322738647461, "global_step": 66721, "epoch": 803} {"train_loss": -20.729616165161133, "global_step": 66722, "epoch": 803} {"train_loss": -20.76323890686035, "global_step": 66723, "epoch": 803} {"train_loss": -20.612319946289062, "global_step": 66724, "epoch": 803} {"train_loss": -21.0595760345459, "global_step": 66725, "epoch": 803} {"train_loss": -20.593332290649414, "global_step": 66726, "epoch": 803} {"train_loss": -20.796545028686523, "global_step": 66727, "epoch": 803} {"train_loss": -20.94657325744629, "global_step": 66728, "epoch": 803} {"train_loss": -20.63617515563965, "global_step": 66729, "epoch": 803} {"train_loss": -20.596961975097656, "global_step": 66730, "epoch": 803} {"train_loss": -20.642682845333972, "global_step": 66731, "epoch": 803, "val_loss": 5963598.0} {"train_loss": -20.63105583190918, "global_step": 66732, "epoch": 804} {"train_loss": -20.10325050354004, "global_step": 66733, "epoch": 804} {"train_loss": -20.465717315673828, "global_step": 66734, "epoch": 804} {"train_loss": -20.301895141601562, "global_step": 66735, "epoch": 804} {"train_loss": -20.44000816345215, "global_step": 66736, "epoch": 804} {"train_loss": -20.53192901611328, "global_step": 66737, "epoch": 804} {"train_loss": -20.421415328979492, "global_step": 66738, "epoch": 804} {"train_loss": -20.307538986206055, "global_step": 66739, "epoch": 804} {"train_loss": -20.528322219848633, "global_step": 66740, "epoch": 804} {"train_loss": -20.696014404296875, "global_step": 66741, "epoch": 804} {"train_loss": -20.35824966430664, "global_step": 66742, "epoch": 804} {"train_loss": -20.7071533203125, "global_step": 66743, "epoch": 804} {"train_loss": -20.685705184936523, "global_step": 66744, "epoch": 804} {"train_loss": -20.52413558959961, "global_step": 66745, "epoch": 804} {"train_loss": -20.616352081298828, "global_step": 66746, "epoch": 804} {"train_loss": -20.32050132751465, "global_step": 66747, "epoch": 804} {"train_loss": -20.614622116088867, "global_step": 66748, "epoch": 804} {"train_loss": -20.70539093017578, "global_step": 66749, "epoch": 804} {"train_loss": -20.815378189086914, "global_step": 66750, "epoch": 804} {"train_loss": -21.060476303100586, "global_step": 66751, "epoch": 804} {"train_loss": -20.580034255981445, "global_step": 66752, "epoch": 804} {"train_loss": -20.612524032592773, "global_step": 66753, "epoch": 804} {"train_loss": -20.957321166992188, "global_step": 66754, "epoch": 804} {"train_loss": -20.345956802368164, "global_step": 66755, "epoch": 804} {"train_loss": -20.656259536743164, "global_step": 66756, "epoch": 804} {"train_loss": -20.8624324798584, "global_step": 66757, "epoch": 804} {"train_loss": -20.236143112182617, "global_step": 66758, "epoch": 804} {"train_loss": -20.759721755981445, "global_step": 66759, "epoch": 804} {"train_loss": -20.731050491333008, "global_step": 66760, "epoch": 804} {"train_loss": -20.490976333618164, "global_step": 66761, "epoch": 804} {"train_loss": -20.466039657592773, "global_step": 66762, "epoch": 804} {"train_loss": -20.585453033447266, "global_step": 66763, "epoch": 804} {"train_loss": -20.425498962402344, "global_step": 66764, "epoch": 804} {"train_loss": -20.74559211730957, "global_step": 66765, "epoch": 804} {"train_loss": -20.611942291259766, "global_step": 66766, "epoch": 804} {"train_loss": -20.963144302368164, "global_step": 66767, "epoch": 804} {"train_loss": -20.674880981445312, "global_step": 66768, "epoch": 804} {"train_loss": -20.36646270751953, "global_step": 66769, "epoch": 804} {"train_loss": -20.758779525756836, "global_step": 66770, "epoch": 804} {"train_loss": -20.550800323486328, "global_step": 66771, "epoch": 804} {"train_loss": -20.444820404052734, "global_step": 66772, "epoch": 804} {"train_loss": -21.123769760131836, "global_step": 66773, "epoch": 804} {"train_loss": -20.851459503173828, "global_step": 66774, "epoch": 804} {"train_loss": -20.55629539489746, "global_step": 66775, "epoch": 804} {"train_loss": -21.116188049316406, "global_step": 66776, "epoch": 804} {"train_loss": -20.520071029663086, "global_step": 66777, "epoch": 804} {"train_loss": -20.995450973510742, "global_step": 66778, "epoch": 804} {"train_loss": -20.803495407104492, "global_step": 66779, "epoch": 804} {"train_loss": -20.95513153076172, "global_step": 66780, "epoch": 804} {"train_loss": -20.819169998168945, "global_step": 66781, "epoch": 804} {"train_loss": -21.016061782836914, "global_step": 66782, "epoch": 804} {"train_loss": -20.983320236206055, "global_step": 66783, "epoch": 804} {"train_loss": -20.749319076538086, "global_step": 66784, "epoch": 804} {"train_loss": -20.537492752075195, "global_step": 66785, "epoch": 804} {"train_loss": -20.952558517456055, "global_step": 66786, "epoch": 804} {"train_loss": -20.60943031311035, "global_step": 66787, "epoch": 804} {"train_loss": -20.44471549987793, "global_step": 66788, "epoch": 804} {"train_loss": -20.77684211730957, "global_step": 66789, "epoch": 804} {"train_loss": -20.672819137573242, "global_step": 66790, "epoch": 804} {"train_loss": -20.741378784179688, "global_step": 66791, "epoch": 804} {"train_loss": -20.550573348999023, "global_step": 66792, "epoch": 804} {"train_loss": -20.715810775756836, "global_step": 66793, "epoch": 804} {"train_loss": -20.538541793823242, "global_step": 66794, "epoch": 804} {"train_loss": -20.701627731323242, "global_step": 66795, "epoch": 804} {"train_loss": -20.605178833007812, "global_step": 66796, "epoch": 804} {"train_loss": -20.22515296936035, "global_step": 66797, "epoch": 804} {"train_loss": -20.713064193725586, "global_step": 66798, "epoch": 804} {"train_loss": -20.78116226196289, "global_step": 66799, "epoch": 804} {"train_loss": -20.78035545349121, "global_step": 66800, "epoch": 804} {"train_loss": -20.673721313476562, "global_step": 66801, "epoch": 804} {"train_loss": -20.883451461791992, "global_step": 66802, "epoch": 804} {"train_loss": -20.860952377319336, "global_step": 66803, "epoch": 804} {"train_loss": -21.24495506286621, "global_step": 66804, "epoch": 804} {"train_loss": -20.656021118164062, "global_step": 66805, "epoch": 804} {"train_loss": -21.03961181640625, "global_step": 66806, "epoch": 804} {"train_loss": -20.674795150756836, "global_step": 66807, "epoch": 804} {"train_loss": -20.760164260864258, "global_step": 66808, "epoch": 804} {"train_loss": -20.575551986694336, "global_step": 66809, "epoch": 804} {"train_loss": -20.609525680541992, "global_step": 66810, "epoch": 804} {"train_loss": -20.536176681518555, "global_step": 66811, "epoch": 804} {"train_loss": -20.754329681396484, "global_step": 66812, "epoch": 804} {"train_loss": -20.694795608520508, "global_step": 66813, "epoch": 804} {"train_loss": -20.659927092402814, "global_step": 66814, "epoch": 804, "val_loss": 6021565.0} {"train_loss": -20.266836166381836, "global_step": 66815, "epoch": 805} {"train_loss": -19.775840759277344, "global_step": 66816, "epoch": 805} {"train_loss": -20.446195602416992, "global_step": 66817, "epoch": 805} {"train_loss": -20.290212631225586, "global_step": 66818, "epoch": 805} {"train_loss": -19.542001724243164, "global_step": 66819, "epoch": 805} {"train_loss": -20.619644165039062, "global_step": 66820, "epoch": 805} {"train_loss": -19.980955123901367, "global_step": 66821, "epoch": 805} {"train_loss": -20.302417755126953, "global_step": 66822, "epoch": 805} {"train_loss": -20.21819305419922, "global_step": 66823, "epoch": 805} {"train_loss": -20.21626091003418, "global_step": 66824, "epoch": 805} {"train_loss": -19.858596801757812, "global_step": 66825, "epoch": 805} {"train_loss": -20.57496452331543, "global_step": 66826, "epoch": 805} {"train_loss": -19.861928939819336, "global_step": 66827, "epoch": 805} {"train_loss": -20.379444122314453, "global_step": 66828, "epoch": 805} {"train_loss": -20.2823543548584, "global_step": 66829, "epoch": 805} {"train_loss": -20.688928604125977, "global_step": 66830, "epoch": 805} {"train_loss": -20.632953643798828, "global_step": 66831, "epoch": 805} {"train_loss": -21.05694580078125, "global_step": 66832, "epoch": 805} {"train_loss": -20.573741912841797, "global_step": 66833, "epoch": 805} {"train_loss": -20.769277572631836, "global_step": 66834, "epoch": 805} {"train_loss": -20.458621978759766, "global_step": 66835, "epoch": 805} {"train_loss": -20.692691802978516, "global_step": 66836, "epoch": 805} {"train_loss": -20.383819580078125, "global_step": 66837, "epoch": 805} {"train_loss": -20.530221939086914, "global_step": 66838, "epoch": 805} {"train_loss": -20.52425193786621, "global_step": 66839, "epoch": 805} {"train_loss": -20.646188735961914, "global_step": 66840, "epoch": 805} {"train_loss": -20.470067977905273, "global_step": 66841, "epoch": 805} {"train_loss": -20.8961124420166, "global_step": 66842, "epoch": 805} {"train_loss": -20.407270431518555, "global_step": 66843, "epoch": 805} {"train_loss": -20.499059677124023, "global_step": 66844, "epoch": 805} {"train_loss": -20.604705810546875, "global_step": 66845, "epoch": 805} {"train_loss": -20.83790397644043, "global_step": 66846, "epoch": 805} {"train_loss": -20.605972290039062, "global_step": 66847, "epoch": 805} {"train_loss": -20.5047607421875, "global_step": 66848, "epoch": 805} {"train_loss": -20.785764694213867, "global_step": 66849, "epoch": 805} {"train_loss": -20.935163497924805, "global_step": 66850, "epoch": 805} {"train_loss": -20.52745246887207, "global_step": 66851, "epoch": 805} {"train_loss": -20.775867462158203, "global_step": 66852, "epoch": 805} {"train_loss": -20.75518798828125, "global_step": 66853, "epoch": 805} {"train_loss": -20.697072982788086, "global_step": 66854, "epoch": 805} {"train_loss": -20.575780868530273, "global_step": 66855, "epoch": 805} {"train_loss": -20.584857940673828, "global_step": 66856, "epoch": 805} {"train_loss": -20.52872085571289, "global_step": 66857, "epoch": 805} {"train_loss": -20.574308395385742, "global_step": 66858, "epoch": 805} {"train_loss": -20.75338363647461, "global_step": 66859, "epoch": 805} {"train_loss": -20.56814193725586, "global_step": 66860, "epoch": 805} {"train_loss": -20.807174682617188, "global_step": 66861, "epoch": 805} {"train_loss": -20.484729766845703, "global_step": 66862, "epoch": 805} {"train_loss": -20.54512596130371, "global_step": 66863, "epoch": 805} {"train_loss": -20.539165496826172, "global_step": 66864, "epoch": 805} {"train_loss": -20.97220802307129, "global_step": 66865, "epoch": 805} {"train_loss": -20.861242294311523, "global_step": 66866, "epoch": 805} {"train_loss": -21.067007064819336, "global_step": 66867, "epoch": 805} {"train_loss": -20.847841262817383, "global_step": 66868, "epoch": 805} {"train_loss": -20.572359085083008, "global_step": 66869, "epoch": 805} {"train_loss": -20.594018936157227, "global_step": 66870, "epoch": 805} {"train_loss": -20.762109756469727, "global_step": 66871, "epoch": 805} {"train_loss": -20.97279930114746, "global_step": 66872, "epoch": 805} {"train_loss": -20.87116813659668, "global_step": 66873, "epoch": 805} {"train_loss": -20.80841636657715, "global_step": 66874, "epoch": 805} {"train_loss": -20.574188232421875, "global_step": 66875, "epoch": 805} {"train_loss": -20.68446922302246, "global_step": 66876, "epoch": 805} {"train_loss": -21.023696899414062, "global_step": 66877, "epoch": 805} {"train_loss": -20.451932907104492, "global_step": 66878, "epoch": 805} {"train_loss": -20.45586585998535, "global_step": 66879, "epoch": 805} {"train_loss": -20.859275817871094, "global_step": 66880, "epoch": 805} {"train_loss": -20.764638900756836, "global_step": 66881, "epoch": 805} {"train_loss": -20.7052059173584, "global_step": 66882, "epoch": 805} {"train_loss": -20.41282081604004, "global_step": 66883, "epoch": 805} {"train_loss": -20.533164978027344, "global_step": 66884, "epoch": 805} {"train_loss": -20.98565673828125, "global_step": 66885, "epoch": 805} {"train_loss": -20.637985229492188, "global_step": 66886, "epoch": 805} {"train_loss": -20.491077423095703, "global_step": 66887, "epoch": 805} {"train_loss": -20.623552322387695, "global_step": 66888, "epoch": 805} {"train_loss": -20.882417678833008, "global_step": 66889, "epoch": 805} {"train_loss": -20.651853561401367, "global_step": 66890, "epoch": 805} {"train_loss": -20.421579360961914, "global_step": 66891, "epoch": 805} {"train_loss": -20.955995559692383, "global_step": 66892, "epoch": 805} {"train_loss": -20.93289566040039, "global_step": 66893, "epoch": 805} {"train_loss": -20.819852828979492, "global_step": 66894, "epoch": 805} {"train_loss": -20.800931930541992, "global_step": 66895, "epoch": 805} {"train_loss": -20.375146865844727, "global_step": 66896, "epoch": 805} {"train_loss": -20.571179424423768, "global_step": 66897, "epoch": 805, "val_loss": 5965893.0} {"train_loss": -20.412952423095703, "global_step": 66898, "epoch": 806} {"train_loss": -20.4930419921875, "global_step": 66899, "epoch": 806} {"train_loss": -20.420146942138672, "global_step": 66900, "epoch": 806} {"train_loss": -20.442991256713867, "global_step": 66901, "epoch": 806} {"train_loss": -20.150312423706055, "global_step": 66902, "epoch": 806} {"train_loss": -20.619749069213867, "global_step": 66903, "epoch": 806} {"train_loss": -20.71534538269043, "global_step": 66904, "epoch": 806} {"train_loss": -20.41098403930664, "global_step": 66905, "epoch": 806} {"train_loss": -20.327016830444336, "global_step": 66906, "epoch": 806} {"train_loss": -20.774656295776367, "global_step": 66907, "epoch": 806} {"train_loss": -20.53203582763672, "global_step": 66908, "epoch": 806} {"train_loss": -20.56307029724121, "global_step": 66909, "epoch": 806} {"train_loss": -20.616748809814453, "global_step": 66910, "epoch": 806} {"train_loss": -20.656240463256836, "global_step": 66911, "epoch": 806} {"train_loss": -20.404924392700195, "global_step": 66912, "epoch": 806} {"train_loss": -20.956119537353516, "global_step": 66913, "epoch": 806} {"train_loss": -20.33029556274414, "global_step": 66914, "epoch": 806} {"train_loss": -20.8244686126709, "global_step": 66915, "epoch": 806} {"train_loss": -20.817493438720703, "global_step": 66916, "epoch": 806} {"train_loss": -20.771087646484375, "global_step": 66917, "epoch": 806} {"train_loss": -20.851886749267578, "global_step": 66918, "epoch": 806} {"train_loss": -20.606857299804688, "global_step": 66919, "epoch": 806} {"train_loss": -20.669601440429688, "global_step": 66920, "epoch": 806} {"train_loss": -20.719730377197266, "global_step": 66921, "epoch": 806} {"train_loss": -20.8950252532959, "global_step": 66922, "epoch": 806} {"train_loss": -20.46271324157715, "global_step": 66923, "epoch": 806} {"train_loss": -20.76972198486328, "global_step": 66924, "epoch": 806} {"train_loss": -20.482818603515625, "global_step": 66925, "epoch": 806} {"train_loss": -20.587034225463867, "global_step": 66926, "epoch": 806} {"train_loss": -20.828474044799805, "global_step": 66927, "epoch": 806} {"train_loss": -20.570005416870117, "global_step": 66928, "epoch": 806} {"train_loss": -20.583951950073242, "global_step": 66929, "epoch": 806} {"train_loss": -20.55183219909668, "global_step": 66930, "epoch": 806} {"train_loss": -20.925701141357422, "global_step": 66931, "epoch": 806} {"train_loss": -20.842161178588867, "global_step": 66932, "epoch": 806} {"train_loss": -20.730571746826172, "global_step": 66933, "epoch": 806} {"train_loss": -20.71407127380371, "global_step": 66934, "epoch": 806} {"train_loss": -20.498172760009766, "global_step": 66935, "epoch": 806} {"train_loss": -20.465726852416992, "global_step": 66936, "epoch": 806} {"train_loss": -21.02811622619629, "global_step": 66937, "epoch": 806} {"train_loss": -21.127456665039062, "global_step": 66938, "epoch": 806} {"train_loss": -20.8801212310791, "global_step": 66939, "epoch": 806} {"train_loss": -20.666296005249023, "global_step": 66940, "epoch": 806} {"train_loss": -20.6965389251709, "global_step": 66941, "epoch": 806} {"train_loss": -20.936105728149414, "global_step": 66942, "epoch": 806} {"train_loss": -21.119138717651367, "global_step": 66943, "epoch": 806} {"train_loss": -20.478750228881836, "global_step": 66944, "epoch": 806} {"train_loss": -20.60487937927246, "global_step": 66945, "epoch": 806} {"train_loss": -20.406492233276367, "global_step": 66946, "epoch": 806} {"train_loss": -20.666322708129883, "global_step": 66947, "epoch": 806} {"train_loss": -20.64740562438965, "global_step": 66948, "epoch": 806} {"train_loss": -20.97553825378418, "global_step": 66949, "epoch": 806} {"train_loss": -20.279325485229492, "global_step": 66950, "epoch": 806} {"train_loss": -20.771764755249023, "global_step": 66951, "epoch": 806} {"train_loss": -20.639726638793945, "global_step": 66952, "epoch": 806} {"train_loss": -20.87542152404785, "global_step": 66953, "epoch": 806} {"train_loss": -20.812101364135742, "global_step": 66954, "epoch": 806} {"train_loss": -20.949626922607422, "global_step": 66955, "epoch": 806} {"train_loss": -20.69120979309082, "global_step": 66956, "epoch": 806} {"train_loss": -20.788116455078125, "global_step": 66957, "epoch": 806} {"train_loss": -20.52766227722168, "global_step": 66958, "epoch": 806} {"train_loss": -21.080585479736328, "global_step": 66959, "epoch": 806} {"train_loss": -20.738088607788086, "global_step": 66960, "epoch": 806} {"train_loss": -20.767881393432617, "global_step": 66961, "epoch": 806} {"train_loss": -20.567825317382812, "global_step": 66962, "epoch": 806} {"train_loss": -20.873703002929688, "global_step": 66963, "epoch": 806} {"train_loss": -20.964984893798828, "global_step": 66964, "epoch": 806} {"train_loss": -20.798994064331055, "global_step": 66965, "epoch": 806} {"train_loss": -20.692914962768555, "global_step": 66966, "epoch": 806} {"train_loss": -20.926834106445312, "global_step": 66967, "epoch": 806} {"train_loss": -20.83478355407715, "global_step": 66968, "epoch": 806} {"train_loss": -20.510791778564453, "global_step": 66969, "epoch": 806} {"train_loss": -20.754276275634766, "global_step": 66970, "epoch": 806} {"train_loss": -20.283836364746094, "global_step": 66971, "epoch": 806} {"train_loss": -20.468931198120117, "global_step": 66972, "epoch": 806} {"train_loss": -20.595874786376953, "global_step": 66973, "epoch": 806} {"train_loss": -20.667530059814453, "global_step": 66974, "epoch": 806} {"train_loss": -20.637134552001953, "global_step": 66975, "epoch": 806} {"train_loss": -20.66055679321289, "global_step": 66976, "epoch": 806} {"train_loss": -20.547143936157227, "global_step": 66977, "epoch": 806} {"train_loss": -20.184598922729492, "global_step": 66978, "epoch": 806} {"train_loss": -20.888662338256836, "global_step": 66979, "epoch": 806} {"train_loss": -20.684065324714386, "global_step": 66980, "epoch": 806, "val_loss": 6023077.0} {"train_loss": -19.998779296875, "global_step": 66981, "epoch": 807} {"train_loss": -20.750768661499023, "global_step": 66982, "epoch": 807} {"train_loss": -20.1318302154541, "global_step": 66983, "epoch": 807} {"train_loss": -20.406204223632812, "global_step": 66984, "epoch": 807} {"train_loss": -20.264062881469727, "global_step": 66985, "epoch": 807} {"train_loss": -20.546415328979492, "global_step": 66986, "epoch": 807} {"train_loss": -20.449132919311523, "global_step": 66987, "epoch": 807} {"train_loss": -20.492984771728516, "global_step": 66988, "epoch": 807} {"train_loss": -20.509984970092773, "global_step": 66989, "epoch": 807} {"train_loss": -20.504032135009766, "global_step": 66990, "epoch": 807} {"train_loss": -20.46782112121582, "global_step": 66991, "epoch": 807} {"train_loss": -20.325302124023438, "global_step": 66992, "epoch": 807} {"train_loss": -20.312761306762695, "global_step": 66993, "epoch": 807} {"train_loss": -20.75722312927246, "global_step": 66994, "epoch": 807} {"train_loss": -20.764711380004883, "global_step": 66995, "epoch": 807} {"train_loss": -20.639158248901367, "global_step": 66996, "epoch": 807} {"train_loss": -20.647897720336914, "global_step": 66997, "epoch": 807} {"train_loss": -20.858579635620117, "global_step": 66998, "epoch": 807} {"train_loss": -20.379287719726562, "global_step": 66999, "epoch": 807} {"train_loss": -20.5700740814209, "global_step": 67000, "epoch": 807} {"train_loss": -20.787900924682617, "global_step": 67001, "epoch": 807} {"train_loss": -20.873525619506836, "global_step": 67002, "epoch": 807} {"train_loss": -20.50497055053711, "global_step": 67003, "epoch": 807} {"train_loss": -20.494342803955078, "global_step": 67004, "epoch": 807} {"train_loss": -20.70950698852539, "global_step": 67005, "epoch": 807} {"train_loss": -20.34837532043457, "global_step": 67006, "epoch": 807} {"train_loss": -20.6431827545166, "global_step": 67007, "epoch": 807} {"train_loss": -20.930034637451172, "global_step": 67008, "epoch": 807} {"train_loss": -20.664213180541992, "global_step": 67009, "epoch": 807} {"train_loss": -20.88627052307129, "global_step": 67010, "epoch": 807} {"train_loss": -20.462459564208984, "global_step": 67011, "epoch": 807} {"train_loss": -20.86346435546875, "global_step": 67012, "epoch": 807} {"train_loss": -21.18690299987793, "global_step": 67013, "epoch": 807} {"train_loss": -20.609447479248047, "global_step": 67014, "epoch": 807} {"train_loss": -20.533750534057617, "global_step": 67015, "epoch": 807} {"train_loss": -20.8138484954834, "global_step": 67016, "epoch": 807} {"train_loss": -20.711572647094727, "global_step": 67017, "epoch": 807} {"train_loss": -20.747461318969727, "global_step": 67018, "epoch": 807} {"train_loss": -21.184316635131836, "global_step": 67019, "epoch": 807} {"train_loss": -21.26008415222168, "global_step": 67020, "epoch": 807} {"train_loss": -20.605178833007812, "global_step": 67021, "epoch": 807} {"train_loss": -20.26972770690918, "global_step": 67022, "epoch": 807} {"train_loss": -21.097715377807617, "global_step": 67023, "epoch": 807} {"train_loss": -21.00215721130371, "global_step": 67024, "epoch": 807} {"train_loss": -20.32368278503418, "global_step": 67025, "epoch": 807} {"train_loss": -20.264793395996094, "global_step": 67026, "epoch": 807} {"train_loss": -20.737878799438477, "global_step": 67027, "epoch": 807} {"train_loss": -21.01422691345215, "global_step": 67028, "epoch": 807} {"train_loss": -20.731372833251953, "global_step": 67029, "epoch": 807} {"train_loss": -20.79098892211914, "global_step": 67030, "epoch": 807} {"train_loss": -20.896940231323242, "global_step": 67031, "epoch": 807} {"train_loss": -20.442415237426758, "global_step": 67032, "epoch": 807} {"train_loss": -20.927549362182617, "global_step": 67033, "epoch": 807} {"train_loss": -20.618717193603516, "global_step": 67034, "epoch": 807} {"train_loss": -20.7071533203125, "global_step": 67035, "epoch": 807} {"train_loss": -20.664566040039062, "global_step": 67036, "epoch": 807} {"train_loss": -20.530344009399414, "global_step": 67037, "epoch": 807} {"train_loss": -20.969144821166992, "global_step": 67038, "epoch": 807} {"train_loss": -20.296756744384766, "global_step": 67039, "epoch": 807} {"train_loss": -20.854021072387695, "global_step": 67040, "epoch": 807} {"train_loss": -21.09657859802246, "global_step": 67041, "epoch": 807} {"train_loss": -20.64218521118164, "global_step": 67042, "epoch": 807} {"train_loss": -20.616931915283203, "global_step": 67043, "epoch": 807} {"train_loss": -20.522438049316406, "global_step": 67044, "epoch": 807} {"train_loss": -20.47144889831543, "global_step": 67045, "epoch": 807} {"train_loss": -20.734825134277344, "global_step": 67046, "epoch": 807} {"train_loss": -20.916269302368164, "global_step": 67047, "epoch": 807} {"train_loss": -20.793701171875, "global_step": 67048, "epoch": 807} {"train_loss": -20.67110252380371, "global_step": 67049, "epoch": 807} {"train_loss": -20.694442749023438, "global_step": 67050, "epoch": 807} {"train_loss": -20.563739776611328, "global_step": 67051, "epoch": 807} {"train_loss": -20.68902015686035, "global_step": 67052, "epoch": 807} {"train_loss": -20.72817039489746, "global_step": 67053, "epoch": 807} {"train_loss": -20.627643585205078, "global_step": 67054, "epoch": 807} {"train_loss": -20.702505111694336, "global_step": 67055, "epoch": 807} {"train_loss": -21.061010360717773, "global_step": 67056, "epoch": 807} {"train_loss": -20.698041915893555, "global_step": 67057, "epoch": 807} {"train_loss": -20.6927433013916, "global_step": 67058, "epoch": 807} {"train_loss": -21.075927734375, "global_step": 67059, "epoch": 807} {"train_loss": -20.698780059814453, "global_step": 67060, "epoch": 807} {"train_loss": -20.75646209716797, "global_step": 67061, "epoch": 807} {"train_loss": -20.534242630004883, "global_step": 67062, "epoch": 807} {"train_loss": -20.656459095966387, "global_step": 67063, "epoch": 807, "val_loss": 5941907.5} {"train_loss": -20.582040786743164, "global_step": 67064, "epoch": 808} {"train_loss": -20.456695556640625, "global_step": 67065, "epoch": 808} {"train_loss": -20.72193145751953, "global_step": 67066, "epoch": 808} {"train_loss": -20.274839401245117, "global_step": 67067, "epoch": 808} {"train_loss": -20.60176658630371, "global_step": 67068, "epoch": 808} {"train_loss": -20.533456802368164, "global_step": 67069, "epoch": 808} {"train_loss": -20.285053253173828, "global_step": 67070, "epoch": 808} {"train_loss": -20.35098648071289, "global_step": 67071, "epoch": 808} {"train_loss": -20.413150787353516, "global_step": 67072, "epoch": 808} {"train_loss": -20.608251571655273, "global_step": 67073, "epoch": 808} {"train_loss": -20.691810607910156, "global_step": 67074, "epoch": 808} {"train_loss": -20.647323608398438, "global_step": 67075, "epoch": 808} {"train_loss": -20.856449127197266, "global_step": 67076, "epoch": 808} {"train_loss": -20.73036003112793, "global_step": 67077, "epoch": 808} {"train_loss": -20.455459594726562, "global_step": 67078, "epoch": 808} {"train_loss": -20.52993392944336, "global_step": 67079, "epoch": 808} {"train_loss": -20.96077537536621, "global_step": 67080, "epoch": 808} {"train_loss": -21.0290470123291, "global_step": 67081, "epoch": 808} {"train_loss": -20.89383316040039, "global_step": 67082, "epoch": 808} {"train_loss": -21.096620559692383, "global_step": 67083, "epoch": 808} {"train_loss": -20.184001922607422, "global_step": 67084, "epoch": 808} {"train_loss": -20.581022262573242, "global_step": 67085, "epoch": 808} {"train_loss": -20.8499755859375, "global_step": 67086, "epoch": 808} {"train_loss": -20.91245460510254, "global_step": 67087, "epoch": 808} {"train_loss": -20.91896629333496, "global_step": 67088, "epoch": 808} {"train_loss": -20.712295532226562, "global_step": 67089, "epoch": 808} {"train_loss": -20.7526912689209, "global_step": 67090, "epoch": 808} {"train_loss": -20.47145652770996, "global_step": 67091, "epoch": 808} {"train_loss": -20.49397087097168, "global_step": 67092, "epoch": 808} {"train_loss": -21.27605628967285, "global_step": 67093, "epoch": 808} {"train_loss": -20.64542007446289, "global_step": 67094, "epoch": 808} {"train_loss": -20.56807518005371, "global_step": 67095, "epoch": 808} {"train_loss": -20.516019821166992, "global_step": 67096, "epoch": 808} {"train_loss": -20.768667221069336, "global_step": 67097, "epoch": 808} {"train_loss": -20.42508888244629, "global_step": 67098, "epoch": 808} {"train_loss": -20.62572479248047, "global_step": 67099, "epoch": 808} {"train_loss": -20.525602340698242, "global_step": 67100, "epoch": 808} {"train_loss": -20.57682991027832, "global_step": 67101, "epoch": 808} {"train_loss": -20.691679000854492, "global_step": 67102, "epoch": 808} {"train_loss": -20.932697296142578, "global_step": 67103, "epoch": 808} {"train_loss": -20.73398208618164, "global_step": 67104, "epoch": 808} {"train_loss": -20.72948455810547, "global_step": 67105, "epoch": 808} {"train_loss": -20.65811538696289, "global_step": 67106, "epoch": 808} {"train_loss": -20.577043533325195, "global_step": 67107, "epoch": 808} {"train_loss": -20.52685546875, "global_step": 67108, "epoch": 808} {"train_loss": -20.651376724243164, "global_step": 67109, "epoch": 808} {"train_loss": -20.598783493041992, "global_step": 67110, "epoch": 808} {"train_loss": -20.837116241455078, "global_step": 67111, "epoch": 808} {"train_loss": -20.747400283813477, "global_step": 67112, "epoch": 808} {"train_loss": -20.826025009155273, "global_step": 67113, "epoch": 808} {"train_loss": -20.548627853393555, "global_step": 67114, "epoch": 808} {"train_loss": -20.438390731811523, "global_step": 67115, "epoch": 808} {"train_loss": -20.45951271057129, "global_step": 67116, "epoch": 808} {"train_loss": -20.502552032470703, "global_step": 67117, "epoch": 808} {"train_loss": -20.767770767211914, "global_step": 67118, "epoch": 808} {"train_loss": -20.634305953979492, "global_step": 67119, "epoch": 808} {"train_loss": -20.875349044799805, "global_step": 67120, "epoch": 808} {"train_loss": -20.680509567260742, "global_step": 67121, "epoch": 808} {"train_loss": -20.432546615600586, "global_step": 67122, "epoch": 808} {"train_loss": -20.616483688354492, "global_step": 67123, "epoch": 808} {"train_loss": -20.95313835144043, "global_step": 67124, "epoch": 808} {"train_loss": -20.71729850769043, "global_step": 67125, "epoch": 808} {"train_loss": -20.688566207885742, "global_step": 67126, "epoch": 808} {"train_loss": -20.783353805541992, "global_step": 67127, "epoch": 808} {"train_loss": -20.56912612915039, "global_step": 67128, "epoch": 808} {"train_loss": -20.713369369506836, "global_step": 67129, "epoch": 808} {"train_loss": -20.770902633666992, "global_step": 67130, "epoch": 808} {"train_loss": -21.007415771484375, "global_step": 67131, "epoch": 808} {"train_loss": -20.839527130126953, "global_step": 67132, "epoch": 808} {"train_loss": -20.53322982788086, "global_step": 67133, "epoch": 808} {"train_loss": -20.857187271118164, "global_step": 67134, "epoch": 808} {"train_loss": -20.98457908630371, "global_step": 67135, "epoch": 808} {"train_loss": -20.736143112182617, "global_step": 67136, "epoch": 808} {"train_loss": -20.811172485351562, "global_step": 67137, "epoch": 808} {"train_loss": -20.715747833251953, "global_step": 67138, "epoch": 808} {"train_loss": -20.60980224609375, "global_step": 67139, "epoch": 808} {"train_loss": -20.58540153503418, "global_step": 67140, "epoch": 808} {"train_loss": -20.56525421142578, "global_step": 67141, "epoch": 808} {"train_loss": -20.701017379760742, "global_step": 67142, "epoch": 808} {"train_loss": -20.979352951049805, "global_step": 67143, "epoch": 808} {"train_loss": -20.935346603393555, "global_step": 67144, "epoch": 808} {"train_loss": -20.841732025146484, "global_step": 67145, "epoch": 808} {"train_loss": -20.693171259868574, "global_step": 67146, "epoch": 808, "val_loss": 6012738.5} {"train_loss": -20.291650772094727, "global_step": 67147, "epoch": 809} {"train_loss": -20.383962631225586, "global_step": 67148, "epoch": 809} {"train_loss": -20.26996421813965, "global_step": 67149, "epoch": 809} {"train_loss": -20.283071517944336, "global_step": 67150, "epoch": 809} {"train_loss": -20.4008846282959, "global_step": 67151, "epoch": 809} {"train_loss": -20.381671905517578, "global_step": 67152, "epoch": 809} {"train_loss": -20.515226364135742, "global_step": 67153, "epoch": 809} {"train_loss": -20.525680541992188, "global_step": 67154, "epoch": 809} {"train_loss": -20.29837989807129, "global_step": 67155, "epoch": 809} {"train_loss": -21.076881408691406, "global_step": 67156, "epoch": 809} {"train_loss": -20.347944259643555, "global_step": 67157, "epoch": 809} {"train_loss": -20.665830612182617, "global_step": 67158, "epoch": 809} {"train_loss": -20.376245498657227, "global_step": 67159, "epoch": 809} {"train_loss": -20.94478416442871, "global_step": 67160, "epoch": 809} {"train_loss": -20.827322006225586, "global_step": 67161, "epoch": 809} {"train_loss": -20.67605972290039, "global_step": 67162, "epoch": 809} {"train_loss": -20.37153434753418, "global_step": 67163, "epoch": 809} {"train_loss": -20.585798263549805, "global_step": 67164, "epoch": 809} {"train_loss": -20.57014274597168, "global_step": 67165, "epoch": 809} {"train_loss": -20.49906349182129, "global_step": 67166, "epoch": 809} {"train_loss": -21.06125831604004, "global_step": 67167, "epoch": 809} {"train_loss": -20.781095504760742, "global_step": 67168, "epoch": 809} {"train_loss": -21.119918823242188, "global_step": 67169, "epoch": 809} {"train_loss": -20.764612197875977, "global_step": 67170, "epoch": 809} {"train_loss": -20.608688354492188, "global_step": 67171, "epoch": 809} {"train_loss": -20.71650505065918, "global_step": 67172, "epoch": 809} {"train_loss": -21.092153549194336, "global_step": 67173, "epoch": 809} {"train_loss": -20.867965698242188, "global_step": 67174, "epoch": 809} {"train_loss": -21.067235946655273, "global_step": 67175, "epoch": 809} {"train_loss": -20.9677734375, "global_step": 67176, "epoch": 809} {"train_loss": -20.444997787475586, "global_step": 67177, "epoch": 809} {"train_loss": -20.416584014892578, "global_step": 67178, "epoch": 809} {"train_loss": -20.815711975097656, "global_step": 67179, "epoch": 809} {"train_loss": -20.67230796813965, "global_step": 67180, "epoch": 809} {"train_loss": -20.636220932006836, "global_step": 67181, "epoch": 809} {"train_loss": -20.57181167602539, "global_step": 67182, "epoch": 809} {"train_loss": -20.689085006713867, "global_step": 67183, "epoch": 809} {"train_loss": -20.481420516967773, "global_step": 67184, "epoch": 809} {"train_loss": -20.254196166992188, "global_step": 67185, "epoch": 809} {"train_loss": -20.6782283782959, "global_step": 67186, "epoch": 809} {"train_loss": -20.505109786987305, "global_step": 67187, "epoch": 809} {"train_loss": -20.54217529296875, "global_step": 67188, "epoch": 809} {"train_loss": -20.31871223449707, "global_step": 67189, "epoch": 809} {"train_loss": -20.4366512298584, "global_step": 67190, "epoch": 809} {"train_loss": -20.944711685180664, "global_step": 67191, "epoch": 809} {"train_loss": -20.492156982421875, "global_step": 67192, "epoch": 809} {"train_loss": -20.64998435974121, "global_step": 67193, "epoch": 809} {"train_loss": -20.47406768798828, "global_step": 67194, "epoch": 809} {"train_loss": -20.470603942871094, "global_step": 67195, "epoch": 809} {"train_loss": -20.72065544128418, "global_step": 67196, "epoch": 809} {"train_loss": -20.584232330322266, "global_step": 67197, "epoch": 809} {"train_loss": -20.424100875854492, "global_step": 67198, "epoch": 809} {"train_loss": -20.65308952331543, "global_step": 67199, "epoch": 809} {"train_loss": -20.481435775756836, "global_step": 67200, "epoch": 809} {"train_loss": -20.647869110107422, "global_step": 67201, "epoch": 809} {"train_loss": -20.638519287109375, "global_step": 67202, "epoch": 809} {"train_loss": -20.80560302734375, "global_step": 67203, "epoch": 809} {"train_loss": -20.50095558166504, "global_step": 67204, "epoch": 809} {"train_loss": -20.510021209716797, "global_step": 67205, "epoch": 809} {"train_loss": -20.654788970947266, "global_step": 67206, "epoch": 809} {"train_loss": -20.64493179321289, "global_step": 67207, "epoch": 809} {"train_loss": -20.45265007019043, "global_step": 67208, "epoch": 809} {"train_loss": -20.89398193359375, "global_step": 67209, "epoch": 809} {"train_loss": -20.792434692382812, "global_step": 67210, "epoch": 809} {"train_loss": -20.484272003173828, "global_step": 67211, "epoch": 809} {"train_loss": -20.40053939819336, "global_step": 67212, "epoch": 809} {"train_loss": -20.777036666870117, "global_step": 67213, "epoch": 809} {"train_loss": -20.488327026367188, "global_step": 67214, "epoch": 809} {"train_loss": -20.562158584594727, "global_step": 67215, "epoch": 809} {"train_loss": -20.469322204589844, "global_step": 67216, "epoch": 809} {"train_loss": -20.707908630371094, "global_step": 67217, "epoch": 809} {"train_loss": -20.952993392944336, "global_step": 67218, "epoch": 809} {"train_loss": -20.65375328063965, "global_step": 67219, "epoch": 809} {"train_loss": -20.67840576171875, "global_step": 67220, "epoch": 809} {"train_loss": -20.728124618530273, "global_step": 67221, "epoch": 809} {"train_loss": -20.747970581054688, "global_step": 67222, "epoch": 809} {"train_loss": -20.65181541442871, "global_step": 67223, "epoch": 809} {"train_loss": -21.11499786376953, "global_step": 67224, "epoch": 809} {"train_loss": -20.496702194213867, "global_step": 67225, "epoch": 809} {"train_loss": -20.61111831665039, "global_step": 67226, "epoch": 809} {"train_loss": -20.642885208129883, "global_step": 67227, "epoch": 809} {"train_loss": -20.554296493530273, "global_step": 67228, "epoch": 809} {"train_loss": -20.61517837248653, "global_step": 67229, "epoch": 809, "val_loss": 5996758.0} {"train_loss": -20.823286056518555, "global_step": 67230, "epoch": 810} {"train_loss": -20.548139572143555, "global_step": 67231, "epoch": 810} {"train_loss": -21.083127975463867, "global_step": 67232, "epoch": 810} {"train_loss": -20.42745590209961, "global_step": 67233, "epoch": 810} {"train_loss": -20.49091339111328, "global_step": 67234, "epoch": 810} {"train_loss": -20.871551513671875, "global_step": 67235, "epoch": 810} {"train_loss": -20.299654006958008, "global_step": 67236, "epoch": 810} {"train_loss": -20.751367568969727, "global_step": 67237, "epoch": 810} {"train_loss": -20.612104415893555, "global_step": 67238, "epoch": 810} {"train_loss": -20.71657371520996, "global_step": 67239, "epoch": 810} {"train_loss": -20.307344436645508, "global_step": 67240, "epoch": 810} {"train_loss": -20.2977237701416, "global_step": 67241, "epoch": 810} {"train_loss": -20.934818267822266, "global_step": 67242, "epoch": 810} {"train_loss": -20.795209884643555, "global_step": 67243, "epoch": 810} {"train_loss": -20.133344650268555, "global_step": 67244, "epoch": 810} {"train_loss": -20.6767520904541, "global_step": 67245, "epoch": 810} {"train_loss": -20.508092880249023, "global_step": 67246, "epoch": 810} {"train_loss": -20.681583404541016, "global_step": 67247, "epoch": 810} {"train_loss": -20.667219161987305, "global_step": 67248, "epoch": 810} {"train_loss": -20.78415298461914, "global_step": 67249, "epoch": 810} {"train_loss": -20.88857078552246, "global_step": 67250, "epoch": 810} {"train_loss": -20.609943389892578, "global_step": 67251, "epoch": 810} {"train_loss": -20.80260467529297, "global_step": 67252, "epoch": 810} {"train_loss": -20.854455947875977, "global_step": 67253, "epoch": 810} {"train_loss": -20.86330223083496, "global_step": 67254, "epoch": 810} {"train_loss": -20.5924129486084, "global_step": 67255, "epoch": 810} {"train_loss": -20.263517379760742, "global_step": 67256, "epoch": 810} {"train_loss": -21.228458404541016, "global_step": 67257, "epoch": 810} {"train_loss": -20.51806640625, "global_step": 67258, "epoch": 810} {"train_loss": -20.960742950439453, "global_step": 67259, "epoch": 810} {"train_loss": -20.514999389648438, "global_step": 67260, "epoch": 810} {"train_loss": -20.8410701751709, "global_step": 67261, "epoch": 810} {"train_loss": -20.536832809448242, "global_step": 67262, "epoch": 810} {"train_loss": -20.497770309448242, "global_step": 67263, "epoch": 810} {"train_loss": -20.490633010864258, "global_step": 67264, "epoch": 810} {"train_loss": -20.481849670410156, "global_step": 67265, "epoch": 810} {"train_loss": -20.76784324645996, "global_step": 67266, "epoch": 810} {"train_loss": -20.629117965698242, "global_step": 67267, "epoch": 810} {"train_loss": -21.036069869995117, "global_step": 67268, "epoch": 810} {"train_loss": -20.39994239807129, "global_step": 67269, "epoch": 810} {"train_loss": -20.64914321899414, "global_step": 67270, "epoch": 810} {"train_loss": -20.790611267089844, "global_step": 67271, "epoch": 810} {"train_loss": -20.72884178161621, "global_step": 67272, "epoch": 810} {"train_loss": -20.935882568359375, "global_step": 67273, "epoch": 810} {"train_loss": -20.86220932006836, "global_step": 67274, "epoch": 810} {"train_loss": -20.742307662963867, "global_step": 67275, "epoch": 810} {"train_loss": -20.8126277923584, "global_step": 67276, "epoch": 810} {"train_loss": -20.898839950561523, "global_step": 67277, "epoch": 810} {"train_loss": -20.77821922302246, "global_step": 67278, "epoch": 810} {"train_loss": -20.527780532836914, "global_step": 67279, "epoch": 810} {"train_loss": -21.06987190246582, "global_step": 67280, "epoch": 810} {"train_loss": -20.741361618041992, "global_step": 67281, "epoch": 810} {"train_loss": -20.851552963256836, "global_step": 67282, "epoch": 810} {"train_loss": -20.59856414794922, "global_step": 67283, "epoch": 810} {"train_loss": -20.570688247680664, "global_step": 67284, "epoch": 810} {"train_loss": -20.86634063720703, "global_step": 67285, "epoch": 810} {"train_loss": -20.945985794067383, "global_step": 67286, "epoch": 810} {"train_loss": -21.069433212280273, "global_step": 67287, "epoch": 810} {"train_loss": -21.070114135742188, "global_step": 67288, "epoch": 810} {"train_loss": -21.1114444732666, "global_step": 67289, "epoch": 810} {"train_loss": -20.408910751342773, "global_step": 67290, "epoch": 810} {"train_loss": -20.67405891418457, "global_step": 67291, "epoch": 810} {"train_loss": -20.631439208984375, "global_step": 67292, "epoch": 810} {"train_loss": -20.687313079833984, "global_step": 67293, "epoch": 810} {"train_loss": -20.832786560058594, "global_step": 67294, "epoch": 810} {"train_loss": -20.820125579833984, "global_step": 67295, "epoch": 810} {"train_loss": -20.498716354370117, "global_step": 67296, "epoch": 810} {"train_loss": -20.831830978393555, "global_step": 67297, "epoch": 810} {"train_loss": -20.68842887878418, "global_step": 67298, "epoch": 810} {"train_loss": -20.78529167175293, "global_step": 67299, "epoch": 810} {"train_loss": -20.739551544189453, "global_step": 67300, "epoch": 810} {"train_loss": -20.614643096923828, "global_step": 67301, "epoch": 810} {"train_loss": -20.625699996948242, "global_step": 67302, "epoch": 810} {"train_loss": -20.91010093688965, "global_step": 67303, "epoch": 810} {"train_loss": -20.652435302734375, "global_step": 67304, "epoch": 810} {"train_loss": -20.916364669799805, "global_step": 67305, "epoch": 810} {"train_loss": -20.659894943237305, "global_step": 67306, "epoch": 810} {"train_loss": -20.36781883239746, "global_step": 67307, "epoch": 810} {"train_loss": -20.72832679748535, "global_step": 67308, "epoch": 810} {"train_loss": -20.38648796081543, "global_step": 67309, "epoch": 810} {"train_loss": -20.816137313842773, "global_step": 67310, "epoch": 810} {"train_loss": -20.71906852722168, "global_step": 67311, "epoch": 810} {"train_loss": -20.702502790703832, "global_step": 67312, "epoch": 810, "val_loss": 6002923.0} {"train_loss": -20.15204620361328, "global_step": 67313, "epoch": 811} {"train_loss": -20.2445125579834, "global_step": 67314, "epoch": 811} {"train_loss": -20.717252731323242, "global_step": 67315, "epoch": 811} {"train_loss": -20.39179039001465, "global_step": 67316, "epoch": 811} {"train_loss": -20.557355880737305, "global_step": 67317, "epoch": 811} {"train_loss": -20.327695846557617, "global_step": 67318, "epoch": 811} {"train_loss": -20.008468627929688, "global_step": 67319, "epoch": 811} {"train_loss": -20.605701446533203, "global_step": 67320, "epoch": 811} {"train_loss": -20.608749389648438, "global_step": 67321, "epoch": 811} {"train_loss": -20.600278854370117, "global_step": 67322, "epoch": 811} {"train_loss": -20.531660079956055, "global_step": 67323, "epoch": 811} {"train_loss": -20.64472770690918, "global_step": 67324, "epoch": 811} {"train_loss": -20.28980827331543, "global_step": 67325, "epoch": 811} {"train_loss": -20.427013397216797, "global_step": 67326, "epoch": 811} {"train_loss": -20.482927322387695, "global_step": 67327, "epoch": 811} {"train_loss": -20.541181564331055, "global_step": 67328, "epoch": 811} {"train_loss": -20.36516761779785, "global_step": 67329, "epoch": 811} {"train_loss": -20.759708404541016, "global_step": 67330, "epoch": 811} {"train_loss": -20.797006607055664, "global_step": 67331, "epoch": 811} {"train_loss": -20.63759422302246, "global_step": 67332, "epoch": 811} {"train_loss": -20.47157096862793, "global_step": 67333, "epoch": 811} {"train_loss": -20.42957878112793, "global_step": 67334, "epoch": 811} {"train_loss": -20.467777252197266, "global_step": 67335, "epoch": 811} {"train_loss": -20.613239288330078, "global_step": 67336, "epoch": 811} {"train_loss": -20.66225242614746, "global_step": 67337, "epoch": 811} {"train_loss": -20.94516372680664, "global_step": 67338, "epoch": 811} {"train_loss": -20.826784133911133, "global_step": 67339, "epoch": 811} {"train_loss": -21.060760498046875, "global_step": 67340, "epoch": 811} {"train_loss": -20.703575134277344, "global_step": 67341, "epoch": 811} {"train_loss": -20.548690795898438, "global_step": 67342, "epoch": 811} {"train_loss": -20.642597198486328, "global_step": 67343, "epoch": 811} {"train_loss": -20.7362117767334, "global_step": 67344, "epoch": 811} {"train_loss": -20.840286254882812, "global_step": 67345, "epoch": 811} {"train_loss": -20.52530288696289, "global_step": 67346, "epoch": 811} {"train_loss": -20.69790267944336, "global_step": 67347, "epoch": 811} {"train_loss": -20.733448028564453, "global_step": 67348, "epoch": 811} {"train_loss": -20.713088989257812, "global_step": 67349, "epoch": 811} {"train_loss": -20.90437126159668, "global_step": 67350, "epoch": 811} {"train_loss": -20.654802322387695, "global_step": 67351, "epoch": 811} {"train_loss": -21.092195510864258, "global_step": 67352, "epoch": 811} {"train_loss": -20.654434204101562, "global_step": 67353, "epoch": 811} {"train_loss": -20.475168228149414, "global_step": 67354, "epoch": 811} {"train_loss": -20.788179397583008, "global_step": 67355, "epoch": 811} {"train_loss": -20.70716667175293, "global_step": 67356, "epoch": 811} {"train_loss": -20.683767318725586, "global_step": 67357, "epoch": 811} {"train_loss": -20.980573654174805, "global_step": 67358, "epoch": 811} {"train_loss": -20.558561325073242, "global_step": 67359, "epoch": 811} {"train_loss": -20.852529525756836, "global_step": 67360, "epoch": 811} {"train_loss": -20.632986068725586, "global_step": 67361, "epoch": 811} {"train_loss": -20.709257125854492, "global_step": 67362, "epoch": 811} {"train_loss": -20.6306209564209, "global_step": 67363, "epoch": 811} {"train_loss": -21.055418014526367, "global_step": 67364, "epoch": 811} {"train_loss": -20.579940795898438, "global_step": 67365, "epoch": 811} {"train_loss": -20.914539337158203, "global_step": 67366, "epoch": 811} {"train_loss": -20.89645767211914, "global_step": 67367, "epoch": 811} {"train_loss": -20.651416778564453, "global_step": 67368, "epoch": 811} {"train_loss": -20.334566116333008, "global_step": 67369, "epoch": 811} {"train_loss": -20.798669815063477, "global_step": 67370, "epoch": 811} {"train_loss": -20.616867065429688, "global_step": 67371, "epoch": 811} {"train_loss": -20.476932525634766, "global_step": 67372, "epoch": 811} {"train_loss": -20.59736442565918, "global_step": 67373, "epoch": 811} {"train_loss": -20.648130416870117, "global_step": 67374, "epoch": 811} {"train_loss": -20.397642135620117, "global_step": 67375, "epoch": 811} {"train_loss": -20.728118896484375, "global_step": 67376, "epoch": 811} {"train_loss": -21.03165626525879, "global_step": 67377, "epoch": 811} {"train_loss": -20.709945678710938, "global_step": 67378, "epoch": 811} {"train_loss": -20.657350540161133, "global_step": 67379, "epoch": 811} {"train_loss": -21.13878059387207, "global_step": 67380, "epoch": 811} {"train_loss": -20.877365112304688, "global_step": 67381, "epoch": 811} {"train_loss": -20.6872615814209, "global_step": 67382, "epoch": 811} {"train_loss": -20.92873191833496, "global_step": 67383, "epoch": 811} {"train_loss": -20.950971603393555, "global_step": 67384, "epoch": 811} {"train_loss": -20.92041015625, "global_step": 67385, "epoch": 811} {"train_loss": -20.898862838745117, "global_step": 67386, "epoch": 811} {"train_loss": -20.356658935546875, "global_step": 67387, "epoch": 811} {"train_loss": -20.228504180908203, "global_step": 67388, "epoch": 811} {"train_loss": -21.145967483520508, "global_step": 67389, "epoch": 811} {"train_loss": -20.69797706604004, "global_step": 67390, "epoch": 811} {"train_loss": -20.74968147277832, "global_step": 67391, "epoch": 811} {"train_loss": -20.6646728515625, "global_step": 67392, "epoch": 811} {"train_loss": -20.646726608276367, "global_step": 67393, "epoch": 811} {"train_loss": -21.069204330444336, "global_step": 67394, "epoch": 811} {"train_loss": -20.64988423542804, "global_step": 67395, "epoch": 811, "val_loss": 6005232.5} {"train_loss": -19.839885711669922, "global_step": 67396, "epoch": 812} {"train_loss": -20.381053924560547, "global_step": 67397, "epoch": 812} {"train_loss": -20.160184860229492, "global_step": 67398, "epoch": 812} {"train_loss": -20.5872859954834, "global_step": 67399, "epoch": 812} {"train_loss": -20.319791793823242, "global_step": 67400, "epoch": 812} {"train_loss": -20.72592544555664, "global_step": 67401, "epoch": 812} {"train_loss": -20.687204360961914, "global_step": 67402, "epoch": 812} {"train_loss": -20.662023544311523, "global_step": 67403, "epoch": 812} {"train_loss": -20.429807662963867, "global_step": 67404, "epoch": 812} {"train_loss": -20.705364227294922, "global_step": 67405, "epoch": 812} {"train_loss": -20.499191284179688, "global_step": 67406, "epoch": 812} {"train_loss": -20.032772064208984, "global_step": 67407, "epoch": 812} {"train_loss": -20.228796005249023, "global_step": 67408, "epoch": 812} {"train_loss": -20.531925201416016, "global_step": 67409, "epoch": 812} {"train_loss": -20.767431259155273, "global_step": 67410, "epoch": 812} {"train_loss": -20.483572006225586, "global_step": 67411, "epoch": 812} {"train_loss": -20.870038986206055, "global_step": 67412, "epoch": 812} {"train_loss": -20.736631393432617, "global_step": 67413, "epoch": 812} {"train_loss": -20.673873901367188, "global_step": 67414, "epoch": 812} {"train_loss": -20.480920791625977, "global_step": 67415, "epoch": 812} {"train_loss": -20.411157608032227, "global_step": 67416, "epoch": 812} {"train_loss": -20.627567291259766, "global_step": 67417, "epoch": 812} {"train_loss": -20.849912643432617, "global_step": 67418, "epoch": 812} {"train_loss": -20.600536346435547, "global_step": 67419, "epoch": 812} {"train_loss": -19.925710678100586, "global_step": 67420, "epoch": 812} {"train_loss": -20.765249252319336, "global_step": 67421, "epoch": 812} {"train_loss": -20.746795654296875, "global_step": 67422, "epoch": 812} {"train_loss": -20.951324462890625, "global_step": 67423, "epoch": 812} {"train_loss": -20.50117301940918, "global_step": 67424, "epoch": 812} {"train_loss": -20.505651473999023, "global_step": 67425, "epoch": 812} {"train_loss": -20.64980125427246, "global_step": 67426, "epoch": 812} {"train_loss": -21.0135498046875, "global_step": 67427, "epoch": 812} {"train_loss": -20.811769485473633, "global_step": 67428, "epoch": 812} {"train_loss": -20.767667770385742, "global_step": 67429, "epoch": 812} {"train_loss": -20.51954460144043, "global_step": 67430, "epoch": 812} {"train_loss": -20.574132919311523, "global_step": 67431, "epoch": 812} {"train_loss": -20.807889938354492, "global_step": 67432, "epoch": 812} {"train_loss": -20.547992706298828, "global_step": 67433, "epoch": 812} {"train_loss": -20.784399032592773, "global_step": 67434, "epoch": 812} {"train_loss": -20.48505973815918, "global_step": 67435, "epoch": 812} {"train_loss": -20.526765823364258, "global_step": 67436, "epoch": 812} {"train_loss": -20.677587509155273, "global_step": 67437, "epoch": 812} {"train_loss": -20.840045928955078, "global_step": 67438, "epoch": 812} {"train_loss": -20.767179489135742, "global_step": 67439, "epoch": 812} {"train_loss": -20.810962677001953, "global_step": 67440, "epoch": 812} {"train_loss": -20.81780433654785, "global_step": 67441, "epoch": 812} {"train_loss": -20.718786239624023, "global_step": 67442, "epoch": 812} {"train_loss": -20.665740966796875, "global_step": 67443, "epoch": 812} {"train_loss": -20.687206268310547, "global_step": 67444, "epoch": 812} {"train_loss": -21.102285385131836, "global_step": 67445, "epoch": 812} {"train_loss": -20.530776977539062, "global_step": 67446, "epoch": 812} {"train_loss": -20.66493797302246, "global_step": 67447, "epoch": 812} {"train_loss": -20.687414169311523, "global_step": 67448, "epoch": 812} {"train_loss": -20.726484298706055, "global_step": 67449, "epoch": 812} {"train_loss": -20.982318878173828, "global_step": 67450, "epoch": 812} {"train_loss": -20.90812110900879, "global_step": 67451, "epoch": 812} {"train_loss": -20.6058349609375, "global_step": 67452, "epoch": 812} {"train_loss": -20.60938262939453, "global_step": 67453, "epoch": 812} {"train_loss": -20.751493453979492, "global_step": 67454, "epoch": 812} {"train_loss": -21.007495880126953, "global_step": 67455, "epoch": 812} {"train_loss": -20.724699020385742, "global_step": 67456, "epoch": 812} {"train_loss": -20.806058883666992, "global_step": 67457, "epoch": 812} {"train_loss": -20.675100326538086, "global_step": 67458, "epoch": 812} {"train_loss": -20.297250747680664, "global_step": 67459, "epoch": 812} {"train_loss": -20.471405029296875, "global_step": 67460, "epoch": 812} {"train_loss": -20.71124839782715, "global_step": 67461, "epoch": 812} {"train_loss": -20.965314865112305, "global_step": 67462, "epoch": 812} {"train_loss": -20.69283103942871, "global_step": 67463, "epoch": 812} {"train_loss": -20.82423210144043, "global_step": 67464, "epoch": 812} {"train_loss": -20.68949317932129, "global_step": 67465, "epoch": 812} {"train_loss": -20.60896873474121, "global_step": 67466, "epoch": 812} {"train_loss": -21.041038513183594, "global_step": 67467, "epoch": 812} {"train_loss": -20.901700973510742, "global_step": 67468, "epoch": 812} {"train_loss": -20.917226791381836, "global_step": 67469, "epoch": 812} {"train_loss": -20.348669052124023, "global_step": 67470, "epoch": 812} {"train_loss": -20.828840255737305, "global_step": 67471, "epoch": 812} {"train_loss": -21.064741134643555, "global_step": 67472, "epoch": 812} {"train_loss": -20.630491256713867, "global_step": 67473, "epoch": 812} {"train_loss": -20.65387535095215, "global_step": 67474, "epoch": 812} {"train_loss": -20.579288482666016, "global_step": 67475, "epoch": 812} {"train_loss": -20.824203491210938, "global_step": 67476, "epoch": 812} {"train_loss": -20.881439208984375, "global_step": 67477, "epoch": 812} {"train_loss": -20.669325127659075, "global_step": 67478, "epoch": 812, "val_loss": 5913437.0} {"train_loss": -20.476789474487305, "global_step": 67479, "epoch": 813} {"train_loss": -20.55529022216797, "global_step": 67480, "epoch": 813} {"train_loss": -20.849889755249023, "global_step": 67481, "epoch": 813} {"train_loss": -20.73380470275879, "global_step": 67482, "epoch": 813} {"train_loss": -20.658889770507812, "global_step": 67483, "epoch": 813} {"train_loss": -20.35112953186035, "global_step": 67484, "epoch": 813} {"train_loss": -20.753324508666992, "global_step": 67485, "epoch": 813} {"train_loss": -20.54535484313965, "global_step": 67486, "epoch": 813} {"train_loss": -20.4966983795166, "global_step": 67487, "epoch": 813} {"train_loss": -20.743324279785156, "global_step": 67488, "epoch": 813} {"train_loss": -20.839357376098633, "global_step": 67489, "epoch": 813} {"train_loss": -20.64374351501465, "global_step": 67490, "epoch": 813} {"train_loss": -20.652563095092773, "global_step": 67491, "epoch": 813} {"train_loss": -20.562002182006836, "global_step": 67492, "epoch": 813} {"train_loss": -20.509809494018555, "global_step": 67493, "epoch": 813} {"train_loss": -20.44440269470215, "global_step": 67494, "epoch": 813} {"train_loss": -20.53714942932129, "global_step": 67495, "epoch": 813} {"train_loss": -20.719099044799805, "global_step": 67496, "epoch": 813} {"train_loss": -20.459394454956055, "global_step": 67497, "epoch": 813} {"train_loss": -20.83400535583496, "global_step": 67498, "epoch": 813} {"train_loss": -20.60025978088379, "global_step": 67499, "epoch": 813} {"train_loss": -20.804790496826172, "global_step": 67500, "epoch": 813} {"train_loss": -20.905109405517578, "global_step": 67501, "epoch": 813} {"train_loss": -20.576766967773438, "global_step": 67502, "epoch": 813} {"train_loss": -20.68830680847168, "global_step": 67503, "epoch": 813} {"train_loss": -20.915063858032227, "global_step": 67504, "epoch": 813} {"train_loss": -20.761333465576172, "global_step": 67505, "epoch": 813} {"train_loss": -21.00715446472168, "global_step": 67506, "epoch": 813} {"train_loss": -20.691341400146484, "global_step": 67507, "epoch": 813} {"train_loss": -21.1304988861084, "global_step": 67508, "epoch": 813} {"train_loss": -21.099384307861328, "global_step": 67509, "epoch": 813} {"train_loss": -20.79056167602539, "global_step": 67510, "epoch": 813} {"train_loss": -20.545827865600586, "global_step": 67511, "epoch": 813} {"train_loss": -20.857685089111328, "global_step": 67512, "epoch": 813} {"train_loss": -20.592945098876953, "global_step": 67513, "epoch": 813} {"train_loss": -20.759296417236328, "global_step": 67514, "epoch": 813} {"train_loss": -20.81689453125, "global_step": 67515, "epoch": 813} {"train_loss": -21.043989181518555, "global_step": 67516, "epoch": 813} {"train_loss": -20.619367599487305, "global_step": 67517, "epoch": 813} {"train_loss": -20.916725158691406, "global_step": 67518, "epoch": 813} {"train_loss": -20.514915466308594, "global_step": 67519, "epoch": 813} {"train_loss": -21.10087776184082, "global_step": 67520, "epoch": 813} {"train_loss": -20.750869750976562, "global_step": 67521, "epoch": 813} {"train_loss": -20.704166412353516, "global_step": 67522, "epoch": 813} {"train_loss": -20.787405014038086, "global_step": 67523, "epoch": 813} {"train_loss": -20.611608505249023, "global_step": 67524, "epoch": 813} {"train_loss": -20.577367782592773, "global_step": 67525, "epoch": 813} {"train_loss": -20.437238693237305, "global_step": 67526, "epoch": 813} {"train_loss": -20.696767807006836, "global_step": 67527, "epoch": 813} {"train_loss": -20.577829360961914, "global_step": 67528, "epoch": 813} {"train_loss": -20.426158905029297, "global_step": 67529, "epoch": 813} {"train_loss": -20.629470825195312, "global_step": 67530, "epoch": 813} {"train_loss": -20.581409454345703, "global_step": 67531, "epoch": 813} {"train_loss": -20.801271438598633, "global_step": 67532, "epoch": 813} {"train_loss": -20.956634521484375, "global_step": 67533, "epoch": 813} {"train_loss": -20.99372100830078, "global_step": 67534, "epoch": 813} {"train_loss": -20.794511795043945, "global_step": 67535, "epoch": 813} {"train_loss": -20.809614181518555, "global_step": 67536, "epoch": 813} {"train_loss": -20.43509292602539, "global_step": 67537, "epoch": 813} {"train_loss": -20.674091339111328, "global_step": 67538, "epoch": 813} {"train_loss": -20.512195587158203, "global_step": 67539, "epoch": 813} {"train_loss": -20.73212242126465, "global_step": 67540, "epoch": 813} {"train_loss": -20.885425567626953, "global_step": 67541, "epoch": 813} {"train_loss": -20.759008407592773, "global_step": 67542, "epoch": 813} {"train_loss": -20.53818702697754, "global_step": 67543, "epoch": 813} {"train_loss": -20.704954147338867, "global_step": 67544, "epoch": 813} {"train_loss": -20.505163192749023, "global_step": 67545, "epoch": 813} {"train_loss": -20.888259887695312, "global_step": 67546, "epoch": 813} {"train_loss": -21.025711059570312, "global_step": 67547, "epoch": 813} {"train_loss": -20.395185470581055, "global_step": 67548, "epoch": 813} {"train_loss": -20.480735778808594, "global_step": 67549, "epoch": 813} {"train_loss": -20.475187301635742, "global_step": 67550, "epoch": 813} {"train_loss": -20.710407257080078, "global_step": 67551, "epoch": 813} {"train_loss": -20.61236000061035, "global_step": 67552, "epoch": 813} {"train_loss": -20.1937198638916, "global_step": 67553, "epoch": 813} {"train_loss": -20.80140495300293, "global_step": 67554, "epoch": 813} {"train_loss": -20.595630645751953, "global_step": 67555, "epoch": 813} {"train_loss": -20.610443115234375, "global_step": 67556, "epoch": 813} {"train_loss": -20.30670928955078, "global_step": 67557, "epoch": 813} {"train_loss": -20.357547760009766, "global_step": 67558, "epoch": 813} {"train_loss": -20.376598358154297, "global_step": 67559, "epoch": 813} {"train_loss": -20.637439727783203, "global_step": 67560, "epoch": 813} {"train_loss": -20.674835825540935, "global_step": 67561, "epoch": 813, "val_loss": 5828401.0} {"train_loss": -20.611209869384766, "global_step": 67562, "epoch": 814} {"train_loss": -20.766752243041992, "global_step": 67563, "epoch": 814} {"train_loss": -20.48692512512207, "global_step": 67564, "epoch": 814} {"train_loss": -20.265777587890625, "global_step": 67565, "epoch": 814} {"train_loss": -20.561847686767578, "global_step": 67566, "epoch": 814} {"train_loss": -20.451610565185547, "global_step": 67567, "epoch": 814} {"train_loss": -20.37946319580078, "global_step": 67568, "epoch": 814} {"train_loss": -20.560800552368164, "global_step": 67569, "epoch": 814} {"train_loss": -20.32999038696289, "global_step": 67570, "epoch": 814} {"train_loss": -20.59038543701172, "global_step": 67571, "epoch": 814} {"train_loss": -20.93761444091797, "global_step": 67572, "epoch": 814} {"train_loss": -20.414234161376953, "global_step": 67573, "epoch": 814} {"train_loss": -20.58963966369629, "global_step": 67574, "epoch": 814} {"train_loss": -20.785627365112305, "global_step": 67575, "epoch": 814} {"train_loss": -20.67384147644043, "global_step": 67576, "epoch": 814} {"train_loss": -20.471792221069336, "global_step": 67577, "epoch": 814} {"train_loss": -20.882863998413086, "global_step": 67578, "epoch": 814} {"train_loss": -20.678598403930664, "global_step": 67579, "epoch": 814} {"train_loss": -20.488203048706055, "global_step": 67580, "epoch": 814} {"train_loss": -20.601470947265625, "global_step": 67581, "epoch": 814} {"train_loss": -20.78299903869629, "global_step": 67582, "epoch": 814} {"train_loss": -21.067304611206055, "global_step": 67583, "epoch": 814} {"train_loss": -20.78249168395996, "global_step": 67584, "epoch": 814} {"train_loss": -20.865636825561523, "global_step": 67585, "epoch": 814} {"train_loss": -20.421142578125, "global_step": 67586, "epoch": 814} {"train_loss": -20.824872970581055, "global_step": 67587, "epoch": 814} {"train_loss": -20.451040267944336, "global_step": 67588, "epoch": 814} {"train_loss": -20.618614196777344, "global_step": 67589, "epoch": 814} {"train_loss": -20.68247413635254, "global_step": 67590, "epoch": 814} {"train_loss": -20.817951202392578, "global_step": 67591, "epoch": 814} {"train_loss": -20.80164909362793, "global_step": 67592, "epoch": 814} {"train_loss": -20.697998046875, "global_step": 67593, "epoch": 814} {"train_loss": -20.75235366821289, "global_step": 67594, "epoch": 814} {"train_loss": -21.209070205688477, "global_step": 67595, "epoch": 814} {"train_loss": -20.269336700439453, "global_step": 67596, "epoch": 814} {"train_loss": -20.436416625976562, "global_step": 67597, "epoch": 814} {"train_loss": -20.6441593170166, "global_step": 67598, "epoch": 814} {"train_loss": -20.499526977539062, "global_step": 67599, "epoch": 814} {"train_loss": -20.84395408630371, "global_step": 67600, "epoch": 814} {"train_loss": -20.652326583862305, "global_step": 67601, "epoch": 814} {"train_loss": -20.874515533447266, "global_step": 67602, "epoch": 814} {"train_loss": -20.428211212158203, "global_step": 67603, "epoch": 814} {"train_loss": -20.692731857299805, "global_step": 67604, "epoch": 814} {"train_loss": -20.798526763916016, "global_step": 67605, "epoch": 814} {"train_loss": -20.877477645874023, "global_step": 67606, "epoch": 814} {"train_loss": -20.426475524902344, "global_step": 67607, "epoch": 814} {"train_loss": -20.780094146728516, "global_step": 67608, "epoch": 814} {"train_loss": -20.58125114440918, "global_step": 67609, "epoch": 814} {"train_loss": -20.99649429321289, "global_step": 67610, "epoch": 814} {"train_loss": -21.188318252563477, "global_step": 67611, "epoch": 814} {"train_loss": -20.740238189697266, "global_step": 67612, "epoch": 814} {"train_loss": -20.74617576599121, "global_step": 67613, "epoch": 814} {"train_loss": -20.813692092895508, "global_step": 67614, "epoch": 814} {"train_loss": -20.615079879760742, "global_step": 67615, "epoch": 814} {"train_loss": -20.670915603637695, "global_step": 67616, "epoch": 814} {"train_loss": -21.03948402404785, "global_step": 67617, "epoch": 814} {"train_loss": -20.616796493530273, "global_step": 67618, "epoch": 814} {"train_loss": -20.35750961303711, "global_step": 67619, "epoch": 814} {"train_loss": -21.049697875976562, "global_step": 67620, "epoch": 814} {"train_loss": -20.691120147705078, "global_step": 67621, "epoch": 814} {"train_loss": -20.536283493041992, "global_step": 67622, "epoch": 814} {"train_loss": -20.764114379882812, "global_step": 67623, "epoch": 814} {"train_loss": -20.423490524291992, "global_step": 67624, "epoch": 814} {"train_loss": -20.696083068847656, "global_step": 67625, "epoch": 814} {"train_loss": -20.955076217651367, "global_step": 67626, "epoch": 814} {"train_loss": -20.85658836364746, "global_step": 67627, "epoch": 814} {"train_loss": -20.489282608032227, "global_step": 67628, "epoch": 814} {"train_loss": -21.11444664001465, "global_step": 67629, "epoch": 814} {"train_loss": -20.944904327392578, "global_step": 67630, "epoch": 814} {"train_loss": -20.672677993774414, "global_step": 67631, "epoch": 814} {"train_loss": -20.700613021850586, "global_step": 67632, "epoch": 814} {"train_loss": -20.4884033203125, "global_step": 67633, "epoch": 814} {"train_loss": -20.517000198364258, "global_step": 67634, "epoch": 814} {"train_loss": -20.51980972290039, "global_step": 67635, "epoch": 814} {"train_loss": -21.029403686523438, "global_step": 67636, "epoch": 814} {"train_loss": -20.737213134765625, "global_step": 67637, "epoch": 814} {"train_loss": -20.460201263427734, "global_step": 67638, "epoch": 814} {"train_loss": -20.90018653869629, "global_step": 67639, "epoch": 814} {"train_loss": -20.83108139038086, "global_step": 67640, "epoch": 814} {"train_loss": -20.661300659179688, "global_step": 67641, "epoch": 814} {"train_loss": -20.83778953552246, "global_step": 67642, "epoch": 814} {"train_loss": -20.86893081665039, "global_step": 67643, "epoch": 814} {"train_loss": -20.68276007778673, "global_step": 67644, "epoch": 814, "val_loss": 5767155.0} {"train_loss": -20.323392868041992, "global_step": 67645, "epoch": 815} {"train_loss": -20.480459213256836, "global_step": 67646, "epoch": 815} {"train_loss": -20.667308807373047, "global_step": 67647, "epoch": 815} {"train_loss": -20.523365020751953, "global_step": 67648, "epoch": 815} {"train_loss": -20.744291305541992, "global_step": 67649, "epoch": 815} {"train_loss": -20.206979751586914, "global_step": 67650, "epoch": 815} {"train_loss": -20.726652145385742, "global_step": 67651, "epoch": 815} {"train_loss": -20.64183235168457, "global_step": 67652, "epoch": 815} {"train_loss": -20.448116302490234, "global_step": 67653, "epoch": 815} {"train_loss": -20.578922271728516, "global_step": 67654, "epoch": 815} {"train_loss": -20.390024185180664, "global_step": 67655, "epoch": 815} {"train_loss": -20.651884078979492, "global_step": 67656, "epoch": 815} {"train_loss": -20.22068977355957, "global_step": 67657, "epoch": 815} {"train_loss": -20.58427619934082, "global_step": 67658, "epoch": 815} {"train_loss": -20.858068466186523, "global_step": 67659, "epoch": 815} {"train_loss": -20.554903030395508, "global_step": 67660, "epoch": 815} {"train_loss": -20.706003189086914, "global_step": 67661, "epoch": 815} {"train_loss": -20.375370025634766, "global_step": 67662, "epoch": 815} {"train_loss": -20.348072052001953, "global_step": 67663, "epoch": 815} {"train_loss": -20.840639114379883, "global_step": 67664, "epoch": 815} {"train_loss": -20.642011642456055, "global_step": 67665, "epoch": 815} {"train_loss": -20.68043327331543, "global_step": 67666, "epoch": 815} {"train_loss": -20.41391944885254, "global_step": 67667, "epoch": 815} {"train_loss": -20.556734085083008, "global_step": 67668, "epoch": 815} {"train_loss": -20.40418243408203, "global_step": 67669, "epoch": 815} {"train_loss": -21.013324737548828, "global_step": 67670, "epoch": 815} {"train_loss": -20.74473762512207, "global_step": 67671, "epoch": 815} {"train_loss": -20.8778133392334, "global_step": 67672, "epoch": 815} {"train_loss": -20.516530990600586, "global_step": 67673, "epoch": 815} {"train_loss": -21.096464157104492, "global_step": 67674, "epoch": 815} {"train_loss": -20.56192398071289, "global_step": 67675, "epoch": 815} {"train_loss": -20.68694496154785, "global_step": 67676, "epoch": 815} {"train_loss": -20.51741600036621, "global_step": 67677, "epoch": 815} {"train_loss": -20.704687118530273, "global_step": 67678, "epoch": 815} {"train_loss": -20.694196701049805, "global_step": 67679, "epoch": 815} {"train_loss": -20.829753875732422, "global_step": 67680, "epoch": 815} {"train_loss": -20.654619216918945, "global_step": 67681, "epoch": 815} {"train_loss": -20.673933029174805, "global_step": 67682, "epoch": 815} {"train_loss": -20.506122589111328, "global_step": 67683, "epoch": 815} {"train_loss": -21.080286026000977, "global_step": 67684, "epoch": 815} {"train_loss": -20.538942337036133, "global_step": 67685, "epoch": 815} {"train_loss": -20.809921264648438, "global_step": 67686, "epoch": 815} {"train_loss": -20.882577896118164, "global_step": 67687, "epoch": 815} {"train_loss": -20.842199325561523, "global_step": 67688, "epoch": 815} {"train_loss": -20.723798751831055, "global_step": 67689, "epoch": 815} {"train_loss": -20.7761287689209, "global_step": 67690, "epoch": 815} {"train_loss": -20.753067016601562, "global_step": 67691, "epoch": 815} {"train_loss": -20.826101303100586, "global_step": 67692, "epoch": 815} {"train_loss": -20.63850212097168, "global_step": 67693, "epoch": 815} {"train_loss": -20.691225051879883, "global_step": 67694, "epoch": 815} {"train_loss": -20.64828872680664, "global_step": 67695, "epoch": 815} {"train_loss": -21.048723220825195, "global_step": 67696, "epoch": 815} {"train_loss": -20.884695053100586, "global_step": 67697, "epoch": 815} {"train_loss": -20.843801498413086, "global_step": 67698, "epoch": 815} {"train_loss": -20.90091896057129, "global_step": 67699, "epoch": 815} {"train_loss": -20.574243545532227, "global_step": 67700, "epoch": 815} {"train_loss": -20.60012435913086, "global_step": 67701, "epoch": 815} {"train_loss": -20.185861587524414, "global_step": 67702, "epoch": 815} {"train_loss": -20.64223289489746, "global_step": 67703, "epoch": 815} {"train_loss": -20.860214233398438, "global_step": 67704, "epoch": 815} {"train_loss": -20.621540069580078, "global_step": 67705, "epoch": 815} {"train_loss": -20.7412052154541, "global_step": 67706, "epoch": 815} {"train_loss": -20.576093673706055, "global_step": 67707, "epoch": 815} {"train_loss": -20.939525604248047, "global_step": 67708, "epoch": 815} {"train_loss": -20.921445846557617, "global_step": 67709, "epoch": 815} {"train_loss": -20.543691635131836, "global_step": 67710, "epoch": 815} {"train_loss": -20.79264259338379, "global_step": 67711, "epoch": 815} {"train_loss": -20.4147891998291, "global_step": 67712, "epoch": 815} {"train_loss": -20.73078727722168, "global_step": 67713, "epoch": 815} {"train_loss": -20.7609806060791, "global_step": 67714, "epoch": 815} {"train_loss": -20.871444702148438, "global_step": 67715, "epoch": 815} {"train_loss": -20.649045944213867, "global_step": 67716, "epoch": 815} {"train_loss": -20.504690170288086, "global_step": 67717, "epoch": 815} {"train_loss": -20.772871017456055, "global_step": 67718, "epoch": 815} {"train_loss": -21.220273971557617, "global_step": 67719, "epoch": 815} {"train_loss": -20.71290397644043, "global_step": 67720, "epoch": 815} {"train_loss": -20.685077667236328, "global_step": 67721, "epoch": 815} {"train_loss": -20.678695678710938, "global_step": 67722, "epoch": 815} {"train_loss": -20.76178550720215, "global_step": 67723, "epoch": 815} {"train_loss": -20.65898323059082, "global_step": 67724, "epoch": 815} {"train_loss": -20.47121238708496, "global_step": 67725, "epoch": 815} {"train_loss": -20.83926773071289, "global_step": 67726, "epoch": 815} {"train_loss": -20.70158657395696, "global_step": 67727, "epoch": 815, "val_loss": 6103439.5} {"train_loss": -20.443605422973633, "global_step": 67728, "epoch": 816} {"train_loss": -20.331342697143555, "global_step": 67729, "epoch": 816} {"train_loss": -20.463027954101562, "global_step": 67730, "epoch": 816} {"train_loss": -20.829954147338867, "global_step": 67731, "epoch": 816} {"train_loss": -20.84803581237793, "global_step": 67732, "epoch": 816} {"train_loss": -20.21826934814453, "global_step": 67733, "epoch": 816} {"train_loss": -20.832733154296875, "global_step": 67734, "epoch": 816} {"train_loss": -20.98459243774414, "global_step": 67735, "epoch": 816} {"train_loss": -20.52792739868164, "global_step": 67736, "epoch": 816} {"train_loss": -20.65645980834961, "global_step": 67737, "epoch": 816} {"train_loss": -20.336320877075195, "global_step": 67738, "epoch": 816} {"train_loss": -20.767255783081055, "global_step": 67739, "epoch": 816} {"train_loss": -20.467483520507812, "global_step": 67740, "epoch": 816} {"train_loss": -20.738691329956055, "global_step": 67741, "epoch": 816} {"train_loss": -20.576114654541016, "global_step": 67742, "epoch": 816} {"train_loss": -20.296222686767578, "global_step": 67743, "epoch": 816} {"train_loss": -20.42974853515625, "global_step": 67744, "epoch": 816} {"train_loss": -20.705930709838867, "global_step": 67745, "epoch": 816} {"train_loss": -20.787137985229492, "global_step": 67746, "epoch": 816} {"train_loss": -20.38784408569336, "global_step": 67747, "epoch": 816} {"train_loss": -20.61979103088379, "global_step": 67748, "epoch": 816} {"train_loss": -20.67610740661621, "global_step": 67749, "epoch": 816} {"train_loss": -20.801767349243164, "global_step": 67750, "epoch": 816} {"train_loss": -20.508604049682617, "global_step": 67751, "epoch": 816} {"train_loss": -21.125730514526367, "global_step": 67752, "epoch": 816} {"train_loss": -20.622587203979492, "global_step": 67753, "epoch": 816} {"train_loss": -20.67866325378418, "global_step": 67754, "epoch": 816} {"train_loss": -20.59524917602539, "global_step": 67755, "epoch": 816} {"train_loss": -21.05854606628418, "global_step": 67756, "epoch": 816} {"train_loss": -20.737253189086914, "global_step": 67757, "epoch": 816} {"train_loss": -20.76797866821289, "global_step": 67758, "epoch": 816} {"train_loss": -20.66400718688965, "global_step": 67759, "epoch": 816} {"train_loss": -20.895248413085938, "global_step": 67760, "epoch": 816} {"train_loss": -20.4846248626709, "global_step": 67761, "epoch": 816} {"train_loss": -21.163753509521484, "global_step": 67762, "epoch": 816} {"train_loss": -20.610807418823242, "global_step": 67763, "epoch": 816} {"train_loss": -20.828649520874023, "global_step": 67764, "epoch": 816} {"train_loss": -20.986051559448242, "global_step": 67765, "epoch": 816} {"train_loss": -20.555171966552734, "global_step": 67766, "epoch": 816} {"train_loss": -20.54199981689453, "global_step": 67767, "epoch": 816} {"train_loss": -20.437580108642578, "global_step": 67768, "epoch": 816} {"train_loss": -20.437450408935547, "global_step": 67769, "epoch": 816} {"train_loss": -20.84235954284668, "global_step": 67770, "epoch": 816} {"train_loss": -20.812002182006836, "global_step": 67771, "epoch": 816} {"train_loss": -20.47540855407715, "global_step": 67772, "epoch": 816} {"train_loss": -20.726755142211914, "global_step": 67773, "epoch": 816} {"train_loss": -20.485456466674805, "global_step": 67774, "epoch": 816} {"train_loss": -20.563344955444336, "global_step": 67775, "epoch": 816} {"train_loss": -20.718355178833008, "global_step": 67776, "epoch": 816} {"train_loss": -20.85890769958496, "global_step": 67777, "epoch": 816} {"train_loss": -20.602319717407227, "global_step": 67778, "epoch": 816} {"train_loss": -20.8576602935791, "global_step": 67779, "epoch": 816} {"train_loss": -20.852441787719727, "global_step": 67780, "epoch": 816} {"train_loss": -20.64735984802246, "global_step": 67781, "epoch": 816} {"train_loss": -21.1254940032959, "global_step": 67782, "epoch": 816} {"train_loss": -21.087772369384766, "global_step": 67783, "epoch": 816} {"train_loss": -20.5602970123291, "global_step": 67784, "epoch": 816} {"train_loss": -20.666601181030273, "global_step": 67785, "epoch": 816} {"train_loss": -20.924421310424805, "global_step": 67786, "epoch": 816} {"train_loss": -20.847501754760742, "global_step": 67787, "epoch": 816} {"train_loss": -20.80292510986328, "global_step": 67788, "epoch": 816} {"train_loss": -20.63496971130371, "global_step": 67789, "epoch": 816} {"train_loss": -20.341096878051758, "global_step": 67790, "epoch": 816} {"train_loss": -20.69386863708496, "global_step": 67791, "epoch": 816} {"train_loss": -20.94037628173828, "global_step": 67792, "epoch": 816} {"train_loss": -20.537694931030273, "global_step": 67793, "epoch": 816} {"train_loss": -20.875682830810547, "global_step": 67794, "epoch": 816} {"train_loss": -20.818740844726562, "global_step": 67795, "epoch": 816} {"train_loss": -20.435504913330078, "global_step": 67796, "epoch": 816} {"train_loss": -21.203699111938477, "global_step": 67797, "epoch": 816} {"train_loss": -20.96820068359375, "global_step": 67798, "epoch": 816} {"train_loss": -20.953571319580078, "global_step": 67799, "epoch": 816} {"train_loss": -20.7987060546875, "global_step": 67800, "epoch": 816} {"train_loss": -21.263425827026367, "global_step": 67801, "epoch": 816} {"train_loss": -20.50080680847168, "global_step": 67802, "epoch": 816} {"train_loss": -20.869089126586914, "global_step": 67803, "epoch": 816} {"train_loss": -20.527753829956055, "global_step": 67804, "epoch": 816} {"train_loss": -20.71210289001465, "global_step": 67805, "epoch": 816} {"train_loss": -20.922061920166016, "global_step": 67806, "epoch": 816} {"train_loss": -20.60328483581543, "global_step": 67807, "epoch": 816} {"train_loss": -20.936248779296875, "global_step": 67808, "epoch": 816} {"train_loss": -20.625783920288086, "global_step": 67809, "epoch": 816} {"train_loss": -20.713874449212867, "global_step": 67810, "epoch": 816, "val_loss": 5869263.5} {"train_loss": -19.614988327026367, "global_step": 67811, "epoch": 817} {"train_loss": -20.590911865234375, "global_step": 67812, "epoch": 817} {"train_loss": -19.89845085144043, "global_step": 67813, "epoch": 817} {"train_loss": -20.61067008972168, "global_step": 67814, "epoch": 817} {"train_loss": -20.6147403717041, "global_step": 67815, "epoch": 817} {"train_loss": -20.04471778869629, "global_step": 67816, "epoch": 817} {"train_loss": -20.140167236328125, "global_step": 67817, "epoch": 817} {"train_loss": -20.423940658569336, "global_step": 67818, "epoch": 817} {"train_loss": -20.355972290039062, "global_step": 67819, "epoch": 817} {"train_loss": -20.684080123901367, "global_step": 67820, "epoch": 817} {"train_loss": -20.445758819580078, "global_step": 67821, "epoch": 817} {"train_loss": -20.543893814086914, "global_step": 67822, "epoch": 817} {"train_loss": -20.511474609375, "global_step": 67823, "epoch": 817} {"train_loss": -20.704362869262695, "global_step": 67824, "epoch": 817} {"train_loss": -20.3261661529541, "global_step": 67825, "epoch": 817} {"train_loss": -20.224266052246094, "global_step": 67826, "epoch": 817} {"train_loss": -20.663496017456055, "global_step": 67827, "epoch": 817} {"train_loss": -20.698143005371094, "global_step": 67828, "epoch": 817} {"train_loss": -20.431472778320312, "global_step": 67829, "epoch": 817} {"train_loss": -20.559532165527344, "global_step": 67830, "epoch": 817} {"train_loss": -21.10200309753418, "global_step": 67831, "epoch": 817} {"train_loss": -20.788970947265625, "global_step": 67832, "epoch": 817} {"train_loss": -20.84894561767578, "global_step": 67833, "epoch": 817} {"train_loss": -20.73464012145996, "global_step": 67834, "epoch": 817} {"train_loss": -20.596755981445312, "global_step": 67835, "epoch": 817} {"train_loss": -20.796478271484375, "global_step": 67836, "epoch": 817} {"train_loss": -20.830774307250977, "global_step": 67837, "epoch": 817} {"train_loss": -20.516183853149414, "global_step": 67838, "epoch": 817} {"train_loss": -20.613950729370117, "global_step": 67839, "epoch": 817} {"train_loss": -20.612844467163086, "global_step": 67840, "epoch": 817} {"train_loss": -20.677249908447266, "global_step": 67841, "epoch": 817} {"train_loss": -20.72983169555664, "global_step": 67842, "epoch": 817} {"train_loss": -20.52260398864746, "global_step": 67843, "epoch": 817} {"train_loss": -20.9797420501709, "global_step": 67844, "epoch": 817} {"train_loss": -20.634672164916992, "global_step": 67845, "epoch": 817} {"train_loss": -20.648527145385742, "global_step": 67846, "epoch": 817} {"train_loss": -20.593629837036133, "global_step": 67847, "epoch": 817} {"train_loss": -20.87312889099121, "global_step": 67848, "epoch": 817} {"train_loss": -20.69219970703125, "global_step": 67849, "epoch": 817} {"train_loss": -20.499963760375977, "global_step": 67850, "epoch": 817} {"train_loss": -20.487585067749023, "global_step": 67851, "epoch": 817} {"train_loss": -20.879880905151367, "global_step": 67852, "epoch": 817} {"train_loss": -20.565263748168945, "global_step": 67853, "epoch": 817} {"train_loss": -20.885141372680664, "global_step": 67854, "epoch": 817} {"train_loss": -20.523193359375, "global_step": 67855, "epoch": 817} {"train_loss": -20.647504806518555, "global_step": 67856, "epoch": 817} {"train_loss": -20.611982345581055, "global_step": 67857, "epoch": 817} {"train_loss": -21.1756591796875, "global_step": 67858, "epoch": 817} {"train_loss": -20.58525848388672, "global_step": 67859, "epoch": 817} {"train_loss": -20.429149627685547, "global_step": 67860, "epoch": 817} {"train_loss": -20.750829696655273, "global_step": 67861, "epoch": 817} {"train_loss": -21.123449325561523, "global_step": 67862, "epoch": 817} {"train_loss": -20.738943099975586, "global_step": 67863, "epoch": 817} {"train_loss": -20.9371280670166, "global_step": 67864, "epoch": 817} {"train_loss": -20.386688232421875, "global_step": 67865, "epoch": 817} {"train_loss": -20.70924186706543, "global_step": 67866, "epoch": 817} {"train_loss": -20.653669357299805, "global_step": 67867, "epoch": 817} {"train_loss": -20.438264846801758, "global_step": 67868, "epoch": 817} {"train_loss": -20.88014793395996, "global_step": 67869, "epoch": 817} {"train_loss": -20.801654815673828, "global_step": 67870, "epoch": 817} {"train_loss": -20.8604679107666, "global_step": 67871, "epoch": 817} {"train_loss": -20.587093353271484, "global_step": 67872, "epoch": 817} {"train_loss": -20.9085693359375, "global_step": 67873, "epoch": 817} {"train_loss": -20.63739013671875, "global_step": 67874, "epoch": 817} {"train_loss": -21.053932189941406, "global_step": 67875, "epoch": 817} {"train_loss": -20.607385635375977, "global_step": 67876, "epoch": 817} {"train_loss": -20.743680953979492, "global_step": 67877, "epoch": 817} {"train_loss": -20.65938377380371, "global_step": 67878, "epoch": 817} {"train_loss": -20.792417526245117, "global_step": 67879, "epoch": 817} {"train_loss": -20.963224411010742, "global_step": 67880, "epoch": 817} {"train_loss": -20.780454635620117, "global_step": 67881, "epoch": 817} {"train_loss": -20.764728546142578, "global_step": 67882, "epoch": 817} {"train_loss": -20.4249324798584, "global_step": 67883, "epoch": 817} {"train_loss": -20.583341598510742, "global_step": 67884, "epoch": 817} {"train_loss": -20.708499908447266, "global_step": 67885, "epoch": 817} {"train_loss": -20.980077743530273, "global_step": 67886, "epoch": 817} {"train_loss": -20.54237937927246, "global_step": 67887, "epoch": 817} {"train_loss": -20.61581802368164, "global_step": 67888, "epoch": 817} {"train_loss": -20.60064125061035, "global_step": 67889, "epoch": 817} {"train_loss": -20.498857498168945, "global_step": 67890, "epoch": 817} {"train_loss": -20.683574676513672, "global_step": 67891, "epoch": 817} {"train_loss": -20.560680389404297, "global_step": 67892, "epoch": 817} {"train_loss": -20.618220662496174, "global_step": 67893, "epoch": 817, "val_loss": 5990564.0} {"train_loss": -20.265827178955078, "global_step": 67894, "epoch": 818} {"train_loss": -20.283506393432617, "global_step": 67895, "epoch": 818} {"train_loss": -20.67892074584961, "global_step": 67896, "epoch": 818} {"train_loss": -20.327007293701172, "global_step": 67897, "epoch": 818} {"train_loss": -20.06913185119629, "global_step": 67898, "epoch": 818} {"train_loss": -20.415563583374023, "global_step": 67899, "epoch": 818} {"train_loss": -20.37690544128418, "global_step": 67900, "epoch": 818} {"train_loss": -20.479108810424805, "global_step": 67901, "epoch": 818} {"train_loss": -20.73525619506836, "global_step": 67902, "epoch": 818} {"train_loss": -20.455951690673828, "global_step": 67903, "epoch": 818} {"train_loss": -20.35603141784668, "global_step": 67904, "epoch": 818} {"train_loss": -20.123783111572266, "global_step": 67905, "epoch": 818} {"train_loss": -20.833070755004883, "global_step": 67906, "epoch": 818} {"train_loss": -20.130163192749023, "global_step": 67907, "epoch": 818} {"train_loss": -20.794044494628906, "global_step": 67908, "epoch": 818} {"train_loss": -20.760467529296875, "global_step": 67909, "epoch": 818} {"train_loss": -20.557647705078125, "global_step": 67910, "epoch": 818} {"train_loss": -20.865575790405273, "global_step": 67911, "epoch": 818} {"train_loss": -20.67698097229004, "global_step": 67912, "epoch": 818} {"train_loss": -20.434019088745117, "global_step": 67913, "epoch": 818} {"train_loss": -20.78285789489746, "global_step": 67914, "epoch": 818} {"train_loss": -20.835119247436523, "global_step": 67915, "epoch": 818} {"train_loss": -20.402795791625977, "global_step": 67916, "epoch": 818} {"train_loss": -20.594938278198242, "global_step": 67917, "epoch": 818} {"train_loss": -20.946643829345703, "global_step": 67918, "epoch": 818} {"train_loss": -20.5263671875, "global_step": 67919, "epoch": 818} {"train_loss": -20.616376876831055, "global_step": 67920, "epoch": 818} {"train_loss": -20.742368698120117, "global_step": 67921, "epoch": 818} {"train_loss": -20.617290496826172, "global_step": 67922, "epoch": 818} {"train_loss": -20.613388061523438, "global_step": 67923, "epoch": 818} {"train_loss": -20.452735900878906, "global_step": 67924, "epoch": 818} {"train_loss": -20.732990264892578, "global_step": 67925, "epoch": 818} {"train_loss": -21.065153121948242, "global_step": 67926, "epoch": 818} {"train_loss": -20.734827041625977, "global_step": 67927, "epoch": 818} {"train_loss": -21.047840118408203, "global_step": 67928, "epoch": 818} {"train_loss": -20.74482536315918, "global_step": 67929, "epoch": 818} {"train_loss": -20.649866104125977, "global_step": 67930, "epoch": 818} {"train_loss": -20.593748092651367, "global_step": 67931, "epoch": 818} {"train_loss": -20.8314151763916, "global_step": 67932, "epoch": 818} {"train_loss": -20.952579498291016, "global_step": 67933, "epoch": 818} {"train_loss": -20.898969650268555, "global_step": 67934, "epoch": 818} {"train_loss": -20.918622970581055, "global_step": 67935, "epoch": 818} {"train_loss": -20.438669204711914, "global_step": 67936, "epoch": 818} {"train_loss": -20.525373458862305, "global_step": 67937, "epoch": 818} {"train_loss": -20.68848991394043, "global_step": 67938, "epoch": 818} {"train_loss": -20.650060653686523, "global_step": 67939, "epoch": 818} {"train_loss": -20.8062686920166, "global_step": 67940, "epoch": 818} {"train_loss": -21.07001495361328, "global_step": 67941, "epoch": 818} {"train_loss": -21.411176681518555, "global_step": 67942, "epoch": 818} {"train_loss": -20.55476951599121, "global_step": 67943, "epoch": 818} {"train_loss": -20.638141632080078, "global_step": 67944, "epoch": 818} {"train_loss": -20.63818359375, "global_step": 67945, "epoch": 818} {"train_loss": -20.890932083129883, "global_step": 67946, "epoch": 818} {"train_loss": -20.57240867614746, "global_step": 67947, "epoch": 818} {"train_loss": -20.50066375732422, "global_step": 67948, "epoch": 818} {"train_loss": -20.514678955078125, "global_step": 67949, "epoch": 818} {"train_loss": -20.42873191833496, "global_step": 67950, "epoch": 818} {"train_loss": -20.95582389831543, "global_step": 67951, "epoch": 818} {"train_loss": -21.0992488861084, "global_step": 67952, "epoch": 818} {"train_loss": -20.734758377075195, "global_step": 67953, "epoch": 818} {"train_loss": -20.861608505249023, "global_step": 67954, "epoch": 818} {"train_loss": -21.085304260253906, "global_step": 67955, "epoch": 818} {"train_loss": -20.77696418762207, "global_step": 67956, "epoch": 818} {"train_loss": -20.710046768188477, "global_step": 67957, "epoch": 818} {"train_loss": -20.671588897705078, "global_step": 67958, "epoch": 818} {"train_loss": -20.554960250854492, "global_step": 67959, "epoch": 818} {"train_loss": -20.65139389038086, "global_step": 67960, "epoch": 818} {"train_loss": -20.91361427307129, "global_step": 67961, "epoch": 818} {"train_loss": -21.054336547851562, "global_step": 67962, "epoch": 818} {"train_loss": -20.522863388061523, "global_step": 67963, "epoch": 818} {"train_loss": -21.143163681030273, "global_step": 67964, "epoch": 818} {"train_loss": -20.69921875, "global_step": 67965, "epoch": 818} {"train_loss": -20.711973190307617, "global_step": 67966, "epoch": 818} {"train_loss": -20.444116592407227, "global_step": 67967, "epoch": 818} {"train_loss": -20.7091007232666, "global_step": 67968, "epoch": 818} {"train_loss": -20.501026153564453, "global_step": 67969, "epoch": 818} {"train_loss": -20.988983154296875, "global_step": 67970, "epoch": 818} {"train_loss": -20.490039825439453, "global_step": 67971, "epoch": 818} {"train_loss": -21.07359504699707, "global_step": 67972, "epoch": 818} {"train_loss": -20.445117950439453, "global_step": 67973, "epoch": 818} {"train_loss": -20.891796112060547, "global_step": 67974, "epoch": 818} {"train_loss": -20.407917022705078, "global_step": 67975, "epoch": 818} {"train_loss": -20.675354762249682, "global_step": 67976, "epoch": 818, "val_loss": 6075652.0} {"train_loss": -20.754304885864258, "global_step": 67977, "epoch": 819} {"train_loss": -20.94261932373047, "global_step": 67978, "epoch": 819} {"train_loss": -20.50530433654785, "global_step": 67979, "epoch": 819} {"train_loss": -20.453662872314453, "global_step": 67980, "epoch": 819} {"train_loss": -20.7995548248291, "global_step": 67981, "epoch": 819} {"train_loss": -20.930099487304688, "global_step": 67982, "epoch": 819} {"train_loss": -20.538785934448242, "global_step": 67983, "epoch": 819} {"train_loss": -20.997011184692383, "global_step": 67984, "epoch": 819} {"train_loss": -20.28256607055664, "global_step": 67985, "epoch": 819} {"train_loss": -20.92001724243164, "global_step": 67986, "epoch": 819} {"train_loss": -20.960092544555664, "global_step": 67987, "epoch": 819} {"train_loss": -20.95377540588379, "global_step": 67988, "epoch": 819} {"train_loss": -20.348072052001953, "global_step": 67989, "epoch": 819} {"train_loss": -20.767154693603516, "global_step": 67990, "epoch": 819} {"train_loss": -20.933887481689453, "global_step": 67991, "epoch": 819} {"train_loss": -20.78364372253418, "global_step": 67992, "epoch": 819} {"train_loss": -20.972286224365234, "global_step": 67993, "epoch": 819} {"train_loss": -20.421751022338867, "global_step": 67994, "epoch": 819} {"train_loss": -20.491714477539062, "global_step": 67995, "epoch": 819} {"train_loss": -20.147048950195312, "global_step": 67996, "epoch": 819} {"train_loss": -20.201509475708008, "global_step": 67997, "epoch": 819} {"train_loss": -20.75905990600586, "global_step": 67998, "epoch": 819} {"train_loss": -20.548643112182617, "global_step": 67999, "epoch": 819} {"train_loss": -20.818838119506836, "global_step": 68000, "epoch": 819} {"train_loss": -20.75044059753418, "global_step": 68001, "epoch": 819} {"train_loss": -20.58771324157715, "global_step": 68002, "epoch": 819} {"train_loss": -20.513519287109375, "global_step": 68003, "epoch": 819} {"train_loss": -20.773832321166992, "global_step": 68004, "epoch": 819} {"train_loss": -20.547163009643555, "global_step": 68005, "epoch": 819} {"train_loss": -20.690553665161133, "global_step": 68006, "epoch": 819} {"train_loss": -20.531675338745117, "global_step": 68007, "epoch": 819} {"train_loss": -20.703353881835938, "global_step": 68008, "epoch": 819} {"train_loss": -20.629806518554688, "global_step": 68009, "epoch": 819} {"train_loss": -20.633575439453125, "global_step": 68010, "epoch": 819} {"train_loss": -20.712615966796875, "global_step": 68011, "epoch": 819} {"train_loss": -21.05756950378418, "global_step": 68012, "epoch": 819} {"train_loss": -20.982620239257812, "global_step": 68013, "epoch": 819} {"train_loss": -20.37360191345215, "global_step": 68014, "epoch": 819} {"train_loss": -20.900554656982422, "global_step": 68015, "epoch": 819} {"train_loss": -21.198755264282227, "global_step": 68016, "epoch": 819} {"train_loss": -20.470422744750977, "global_step": 68017, "epoch": 819} {"train_loss": -20.839330673217773, "global_step": 68018, "epoch": 819} {"train_loss": -20.798044204711914, "global_step": 68019, "epoch": 819} {"train_loss": -21.0175724029541, "global_step": 68020, "epoch": 819} {"train_loss": -20.8344783782959, "global_step": 68021, "epoch": 819} {"train_loss": -20.55060386657715, "global_step": 68022, "epoch": 819} {"train_loss": -20.477455139160156, "global_step": 68023, "epoch": 819} {"train_loss": -21.070112228393555, "global_step": 68024, "epoch": 819} {"train_loss": -20.770618438720703, "global_step": 68025, "epoch": 819} {"train_loss": -20.731273651123047, "global_step": 68026, "epoch": 819} {"train_loss": -20.552169799804688, "global_step": 68027, "epoch": 819} {"train_loss": -20.503854751586914, "global_step": 68028, "epoch": 819} {"train_loss": -20.681133270263672, "global_step": 68029, "epoch": 819} {"train_loss": -20.64784049987793, "global_step": 68030, "epoch": 819} {"train_loss": -20.873733520507812, "global_step": 68031, "epoch": 819} {"train_loss": -20.906721115112305, "global_step": 68032, "epoch": 819} {"train_loss": -20.840194702148438, "global_step": 68033, "epoch": 819} {"train_loss": -20.70284652709961, "global_step": 68034, "epoch": 819} {"train_loss": -20.512218475341797, "global_step": 68035, "epoch": 819} {"train_loss": -20.77821159362793, "global_step": 68036, "epoch": 819} {"train_loss": -20.767606735229492, "global_step": 68037, "epoch": 819} {"train_loss": -20.824478149414062, "global_step": 68038, "epoch": 819} {"train_loss": -20.617883682250977, "global_step": 68039, "epoch": 819} {"train_loss": -20.469846725463867, "global_step": 68040, "epoch": 819} {"train_loss": -20.838199615478516, "global_step": 68041, "epoch": 819} {"train_loss": -20.289339065551758, "global_step": 68042, "epoch": 819} {"train_loss": -20.347837448120117, "global_step": 68043, "epoch": 819} {"train_loss": -20.72365379333496, "global_step": 68044, "epoch": 819} {"train_loss": -20.470678329467773, "global_step": 68045, "epoch": 819} {"train_loss": -20.825307846069336, "global_step": 68046, "epoch": 819} {"train_loss": -20.538969039916992, "global_step": 68047, "epoch": 819} {"train_loss": -20.42412757873535, "global_step": 68048, "epoch": 819} {"train_loss": -20.88919448852539, "global_step": 68049, "epoch": 819} {"train_loss": -21.030315399169922, "global_step": 68050, "epoch": 819} {"train_loss": -20.849365234375, "global_step": 68051, "epoch": 819} {"train_loss": -20.791671752929688, "global_step": 68052, "epoch": 819} {"train_loss": -20.367950439453125, "global_step": 68053, "epoch": 819} {"train_loss": -20.749174118041992, "global_step": 68054, "epoch": 819} {"train_loss": -20.908151626586914, "global_step": 68055, "epoch": 819} {"train_loss": -20.95237922668457, "global_step": 68056, "epoch": 819} {"train_loss": -20.652469635009766, "global_step": 68057, "epoch": 819} {"train_loss": -20.712217330932617, "global_step": 68058, "epoch": 819} {"train_loss": -20.700675504753388, "global_step": 68059, "epoch": 819, "val_loss": 5896706.5} {"train_loss": -19.463781356811523, "global_step": 68060, "epoch": 820} {"train_loss": -20.355167388916016, "global_step": 68061, "epoch": 820} {"train_loss": -20.408714294433594, "global_step": 68062, "epoch": 820} {"train_loss": -19.946908950805664, "global_step": 68063, "epoch": 820} {"train_loss": -20.610239028930664, "global_step": 68064, "epoch": 820} {"train_loss": -19.989713668823242, "global_step": 68065, "epoch": 820} {"train_loss": -20.520009994506836, "global_step": 68066, "epoch": 820} {"train_loss": -20.337207794189453, "global_step": 68067, "epoch": 820} {"train_loss": -20.792774200439453, "global_step": 68068, "epoch": 820} {"train_loss": -20.480215072631836, "global_step": 68069, "epoch": 820} {"train_loss": -20.435270309448242, "global_step": 68070, "epoch": 820} {"train_loss": -20.427358627319336, "global_step": 68071, "epoch": 820} {"train_loss": -20.535140991210938, "global_step": 68072, "epoch": 820} {"train_loss": -20.492780685424805, "global_step": 68073, "epoch": 820} {"train_loss": -20.578107833862305, "global_step": 68074, "epoch": 820} {"train_loss": -20.376798629760742, "global_step": 68075, "epoch": 820} {"train_loss": -20.621912002563477, "global_step": 68076, "epoch": 820} {"train_loss": -20.836212158203125, "global_step": 68077, "epoch": 820} {"train_loss": -20.433744430541992, "global_step": 68078, "epoch": 820} {"train_loss": -20.380041122436523, "global_step": 68079, "epoch": 820} {"train_loss": -20.783187866210938, "global_step": 68080, "epoch": 820} {"train_loss": -20.83960723876953, "global_step": 68081, "epoch": 820} {"train_loss": -20.8790283203125, "global_step": 68082, "epoch": 820} {"train_loss": -20.585668563842773, "global_step": 68083, "epoch": 820} {"train_loss": -20.68561363220215, "global_step": 68084, "epoch": 820} {"train_loss": -20.747970581054688, "global_step": 68085, "epoch": 820} {"train_loss": -20.956396102905273, "global_step": 68086, "epoch": 820} {"train_loss": -21.2023983001709, "global_step": 68087, "epoch": 820} {"train_loss": -20.727275848388672, "global_step": 68088, "epoch": 820} {"train_loss": -20.735551834106445, "global_step": 68089, "epoch": 820} {"train_loss": -20.76766014099121, "global_step": 68090, "epoch": 820} {"train_loss": -20.96607208251953, "global_step": 68091, "epoch": 820} {"train_loss": -20.8815975189209, "global_step": 68092, "epoch": 820} {"train_loss": -20.632253646850586, "global_step": 68093, "epoch": 820} {"train_loss": -20.89798927307129, "global_step": 68094, "epoch": 820} {"train_loss": -21.10157585144043, "global_step": 68095, "epoch": 820} {"train_loss": -20.93739128112793, "global_step": 68096, "epoch": 820} {"train_loss": -20.91055679321289, "global_step": 68097, "epoch": 820} {"train_loss": -20.63294792175293, "global_step": 68098, "epoch": 820} {"train_loss": -20.731809616088867, "global_step": 68099, "epoch": 820} {"train_loss": -21.467803955078125, "global_step": 68100, "epoch": 820} {"train_loss": -20.885656356811523, "global_step": 68101, "epoch": 820} {"train_loss": -20.775959014892578, "global_step": 68102, "epoch": 820} {"train_loss": -21.103199005126953, "global_step": 68103, "epoch": 820} {"train_loss": -20.647022247314453, "global_step": 68104, "epoch": 820} {"train_loss": -20.819643020629883, "global_step": 68105, "epoch": 820} {"train_loss": -20.7872314453125, "global_step": 68106, "epoch": 820} {"train_loss": -21.069318771362305, "global_step": 68107, "epoch": 820} {"train_loss": -20.745407104492188, "global_step": 68108, "epoch": 820} {"train_loss": -20.92917823791504, "global_step": 68109, "epoch": 820} {"train_loss": -20.824325561523438, "global_step": 68110, "epoch": 820} {"train_loss": -20.583698272705078, "global_step": 68111, "epoch": 820} {"train_loss": -20.480329513549805, "global_step": 68112, "epoch": 820} {"train_loss": -20.624168395996094, "global_step": 68113, "epoch": 820} {"train_loss": -20.587900161743164, "global_step": 68114, "epoch": 820} {"train_loss": -20.6376953125, "global_step": 68115, "epoch": 820} {"train_loss": -20.555072784423828, "global_step": 68116, "epoch": 820} {"train_loss": -20.53679656982422, "global_step": 68117, "epoch": 820} {"train_loss": -21.0598087310791, "global_step": 68118, "epoch": 820} {"train_loss": -20.623031616210938, "global_step": 68119, "epoch": 820} {"train_loss": -20.367979049682617, "global_step": 68120, "epoch": 820} {"train_loss": -20.77853775024414, "global_step": 68121, "epoch": 820} {"train_loss": -20.862533569335938, "global_step": 68122, "epoch": 820} {"train_loss": -21.01519203186035, "global_step": 68123, "epoch": 820} {"train_loss": -21.018033981323242, "global_step": 68124, "epoch": 820} {"train_loss": -20.507482528686523, "global_step": 68125, "epoch": 820} {"train_loss": -20.67267417907715, "global_step": 68126, "epoch": 820} {"train_loss": -21.01643180847168, "global_step": 68127, "epoch": 820} {"train_loss": -20.928754806518555, "global_step": 68128, "epoch": 820} {"train_loss": -21.028867721557617, "global_step": 68129, "epoch": 820} {"train_loss": -20.777456283569336, "global_step": 68130, "epoch": 820} {"train_loss": -20.540029525756836, "global_step": 68131, "epoch": 820} {"train_loss": -20.454225540161133, "global_step": 68132, "epoch": 820} {"train_loss": -20.823108673095703, "global_step": 68133, "epoch": 820} {"train_loss": -20.989303588867188, "global_step": 68134, "epoch": 820} {"train_loss": -20.313161849975586, "global_step": 68135, "epoch": 820} {"train_loss": -20.86801528930664, "global_step": 68136, "epoch": 820} {"train_loss": -20.658327102661133, "global_step": 68137, "epoch": 820} {"train_loss": -21.043964385986328, "global_step": 68138, "epoch": 820} {"train_loss": -20.726667404174805, "global_step": 68139, "epoch": 820} {"train_loss": -20.472759246826172, "global_step": 68140, "epoch": 820} {"train_loss": -20.672657012939453, "global_step": 68141, "epoch": 820} {"train_loss": -20.70730308165033, "global_step": 68142, "epoch": 820, "val_loss": 6305372.0} {"train_loss": -20.000247955322266, "global_step": 68143, "epoch": 821} {"train_loss": -19.917646408081055, "global_step": 68144, "epoch": 821} {"train_loss": -20.58642578125, "global_step": 68145, "epoch": 821} {"train_loss": -19.827098846435547, "global_step": 68146, "epoch": 821} {"train_loss": -20.59560203552246, "global_step": 68147, "epoch": 821} {"train_loss": -20.277141571044922, "global_step": 68148, "epoch": 821} {"train_loss": -20.215856552124023, "global_step": 68149, "epoch": 821} {"train_loss": -20.626853942871094, "global_step": 68150, "epoch": 821} {"train_loss": -20.734237670898438, "global_step": 68151, "epoch": 821} {"train_loss": -20.536678314208984, "global_step": 68152, "epoch": 821} {"train_loss": -20.314939498901367, "global_step": 68153, "epoch": 821} {"train_loss": -20.815963745117188, "global_step": 68154, "epoch": 821} {"train_loss": -20.72670555114746, "global_step": 68155, "epoch": 821} {"train_loss": -20.472900390625, "global_step": 68156, "epoch": 821} {"train_loss": -20.52935218811035, "global_step": 68157, "epoch": 821} {"train_loss": -20.52555274963379, "global_step": 68158, "epoch": 821} {"train_loss": -20.633142471313477, "global_step": 68159, "epoch": 821} {"train_loss": -20.603919982910156, "global_step": 68160, "epoch": 821} {"train_loss": -20.876291275024414, "global_step": 68161, "epoch": 821} {"train_loss": -20.622892379760742, "global_step": 68162, "epoch": 821} {"train_loss": -20.75881004333496, "global_step": 68163, "epoch": 821} {"train_loss": -20.885061264038086, "global_step": 68164, "epoch": 821} {"train_loss": -20.43360710144043, "global_step": 68165, "epoch": 821} {"train_loss": -20.663244247436523, "global_step": 68166, "epoch": 821} {"train_loss": -20.38022804260254, "global_step": 68167, "epoch": 821} {"train_loss": -20.840673446655273, "global_step": 68168, "epoch": 821} {"train_loss": -20.864206314086914, "global_step": 68169, "epoch": 821} {"train_loss": -20.593643188476562, "global_step": 68170, "epoch": 821} {"train_loss": -20.696903228759766, "global_step": 68171, "epoch": 821} {"train_loss": -20.850069046020508, "global_step": 68172, "epoch": 821} {"train_loss": -20.794845581054688, "global_step": 68173, "epoch": 821} {"train_loss": -20.865219116210938, "global_step": 68174, "epoch": 821} {"train_loss": -20.684988021850586, "global_step": 68175, "epoch": 821} {"train_loss": -20.481496810913086, "global_step": 68176, "epoch": 821} {"train_loss": -20.634153366088867, "global_step": 68177, "epoch": 821} {"train_loss": -20.75323486328125, "global_step": 68178, "epoch": 821} {"train_loss": -20.539697647094727, "global_step": 68179, "epoch": 821} {"train_loss": -20.718664169311523, "global_step": 68180, "epoch": 821} {"train_loss": -20.735485076904297, "global_step": 68181, "epoch": 821} {"train_loss": -21.193403244018555, "global_step": 68182, "epoch": 821} {"train_loss": -20.873929977416992, "global_step": 68183, "epoch": 821} {"train_loss": -20.761503219604492, "global_step": 68184, "epoch": 821} {"train_loss": -20.78171730041504, "global_step": 68185, "epoch": 821} {"train_loss": -20.985013961791992, "global_step": 68186, "epoch": 821} {"train_loss": -20.673030853271484, "global_step": 68187, "epoch": 821} {"train_loss": -20.918380737304688, "global_step": 68188, "epoch": 821} {"train_loss": -20.775527954101562, "global_step": 68189, "epoch": 821} {"train_loss": -20.654687881469727, "global_step": 68190, "epoch": 821} {"train_loss": -21.11131477355957, "global_step": 68191, "epoch": 821} {"train_loss": -20.433189392089844, "global_step": 68192, "epoch": 821} {"train_loss": -20.5947265625, "global_step": 68193, "epoch": 821} {"train_loss": -20.935667037963867, "global_step": 68194, "epoch": 821} {"train_loss": -21.00679588317871, "global_step": 68195, "epoch": 821} {"train_loss": -20.716150283813477, "global_step": 68196, "epoch": 821} {"train_loss": -20.906513214111328, "global_step": 68197, "epoch": 821} {"train_loss": -20.995609283447266, "global_step": 68198, "epoch": 821} {"train_loss": -20.631032943725586, "global_step": 68199, "epoch": 821} {"train_loss": -20.56757164001465, "global_step": 68200, "epoch": 821} {"train_loss": -20.640302658081055, "global_step": 68201, "epoch": 821} {"train_loss": -20.772031784057617, "global_step": 68202, "epoch": 821} {"train_loss": -20.956295013427734, "global_step": 68203, "epoch": 821} {"train_loss": -20.88225746154785, "global_step": 68204, "epoch": 821} {"train_loss": -21.142072677612305, "global_step": 68205, "epoch": 821} {"train_loss": -21.045917510986328, "global_step": 68206, "epoch": 821} {"train_loss": -21.260251998901367, "global_step": 68207, "epoch": 821} {"train_loss": -20.554025650024414, "global_step": 68208, "epoch": 821} {"train_loss": -20.483478546142578, "global_step": 68209, "epoch": 821} {"train_loss": -21.065900802612305, "global_step": 68210, "epoch": 821} {"train_loss": -20.56257438659668, "global_step": 68211, "epoch": 821} {"train_loss": -20.568811416625977, "global_step": 68212, "epoch": 821} {"train_loss": -21.0757999420166, "global_step": 68213, "epoch": 821} {"train_loss": -20.606348037719727, "global_step": 68214, "epoch": 821} {"train_loss": -20.39847755432129, "global_step": 68215, "epoch": 821} {"train_loss": -20.642431259155273, "global_step": 68216, "epoch": 821} {"train_loss": -20.589868545532227, "global_step": 68217, "epoch": 821} {"train_loss": -20.541250228881836, "global_step": 68218, "epoch": 821} {"train_loss": -20.833953857421875, "global_step": 68219, "epoch": 821} {"train_loss": -20.587583541870117, "global_step": 68220, "epoch": 821} {"train_loss": -20.6124324798584, "global_step": 68221, "epoch": 821} {"train_loss": -20.34218406677246, "global_step": 68222, "epoch": 821} {"train_loss": -20.774484634399414, "global_step": 68223, "epoch": 821} {"train_loss": -20.218624114990234, "global_step": 68224, "epoch": 821} {"train_loss": -20.6830332652632, "global_step": 68225, "epoch": 821, "val_loss": 5955888.0} {"train_loss": -20.573270797729492, "global_step": 68226, "epoch": 822} {"train_loss": -20.404460906982422, "global_step": 68227, "epoch": 822} {"train_loss": -20.628849029541016, "global_step": 68228, "epoch": 822} {"train_loss": -20.723567962646484, "global_step": 68229, "epoch": 822} {"train_loss": -20.274763107299805, "global_step": 68230, "epoch": 822} {"train_loss": -20.78074073791504, "global_step": 68231, "epoch": 822} {"train_loss": -20.302169799804688, "global_step": 68232, "epoch": 822} {"train_loss": -20.8467960357666, "global_step": 68233, "epoch": 822} {"train_loss": -20.571386337280273, "global_step": 68234, "epoch": 822} {"train_loss": -20.805166244506836, "global_step": 68235, "epoch": 822} {"train_loss": -20.782461166381836, "global_step": 68236, "epoch": 822} {"train_loss": -20.472204208374023, "global_step": 68237, "epoch": 822} {"train_loss": -20.510374069213867, "global_step": 68238, "epoch": 822} {"train_loss": -20.832096099853516, "global_step": 68239, "epoch": 822} {"train_loss": -20.617280960083008, "global_step": 68240, "epoch": 822} {"train_loss": -20.556699752807617, "global_step": 68241, "epoch": 822} {"train_loss": -20.51004981994629, "global_step": 68242, "epoch": 822} {"train_loss": -20.804908752441406, "global_step": 68243, "epoch": 822} {"train_loss": -20.77950096130371, "global_step": 68244, "epoch": 822} {"train_loss": -20.93204116821289, "global_step": 68245, "epoch": 822} {"train_loss": -20.309371948242188, "global_step": 68246, "epoch": 822} {"train_loss": -20.750959396362305, "global_step": 68247, "epoch": 822} {"train_loss": -20.76462173461914, "global_step": 68248, "epoch": 822} {"train_loss": -20.749950408935547, "global_step": 68249, "epoch": 822} {"train_loss": -20.97313117980957, "global_step": 68250, "epoch": 822} {"train_loss": -20.425657272338867, "global_step": 68251, "epoch": 822} {"train_loss": -20.843725204467773, "global_step": 68252, "epoch": 822} {"train_loss": -20.98204803466797, "global_step": 68253, "epoch": 822} {"train_loss": -20.691247940063477, "global_step": 68254, "epoch": 822} {"train_loss": -20.916772842407227, "global_step": 68255, "epoch": 822} {"train_loss": -20.733278274536133, "global_step": 68256, "epoch": 822} {"train_loss": -20.88343048095703, "global_step": 68257, "epoch": 822} {"train_loss": -20.68723487854004, "global_step": 68258, "epoch": 822} {"train_loss": -20.824499130249023, "global_step": 68259, "epoch": 822} {"train_loss": -20.344396591186523, "global_step": 68260, "epoch": 822} {"train_loss": -20.562849044799805, "global_step": 68261, "epoch": 822} {"train_loss": -20.799606323242188, "global_step": 68262, "epoch": 822} {"train_loss": -20.570180892944336, "global_step": 68263, "epoch": 822} {"train_loss": -20.884986877441406, "global_step": 68264, "epoch": 822} {"train_loss": -20.974531173706055, "global_step": 68265, "epoch": 822} {"train_loss": -20.52567481994629, "global_step": 68266, "epoch": 822} {"train_loss": -21.090654373168945, "global_step": 68267, "epoch": 822} {"train_loss": -20.671430587768555, "global_step": 68268, "epoch": 822} {"train_loss": -20.39487648010254, "global_step": 68269, "epoch": 822} {"train_loss": -20.640409469604492, "global_step": 68270, "epoch": 822} {"train_loss": -20.799203872680664, "global_step": 68271, "epoch": 822} {"train_loss": -20.58570671081543, "global_step": 68272, "epoch": 822} {"train_loss": -20.457595825195312, "global_step": 68273, "epoch": 822} {"train_loss": -20.73308563232422, "global_step": 68274, "epoch": 822} {"train_loss": -20.51250648498535, "global_step": 68275, "epoch": 822} {"train_loss": -20.439367294311523, "global_step": 68276, "epoch": 822} {"train_loss": -20.716886520385742, "global_step": 68277, "epoch": 822} {"train_loss": -21.186872482299805, "global_step": 68278, "epoch": 822} {"train_loss": -20.66036605834961, "global_step": 68279, "epoch": 822} {"train_loss": -20.83861541748047, "global_step": 68280, "epoch": 822} {"train_loss": -20.862436294555664, "global_step": 68281, "epoch": 822} {"train_loss": -20.58880615234375, "global_step": 68282, "epoch": 822} {"train_loss": -20.744752883911133, "global_step": 68283, "epoch": 822} {"train_loss": -20.858692169189453, "global_step": 68284, "epoch": 822} {"train_loss": -20.723739624023438, "global_step": 68285, "epoch": 822} {"train_loss": -20.70450210571289, "global_step": 68286, "epoch": 822} {"train_loss": -20.77113151550293, "global_step": 68287, "epoch": 822} {"train_loss": -20.85912322998047, "global_step": 68288, "epoch": 822} {"train_loss": -20.763259887695312, "global_step": 68289, "epoch": 822} {"train_loss": -20.74439239501953, "global_step": 68290, "epoch": 822} {"train_loss": -20.957624435424805, "global_step": 68291, "epoch": 822} {"train_loss": -20.838199615478516, "global_step": 68292, "epoch": 822} {"train_loss": -20.65990447998047, "global_step": 68293, "epoch": 822} {"train_loss": -20.516733169555664, "global_step": 68294, "epoch": 822} {"train_loss": -20.67544937133789, "global_step": 68295, "epoch": 822} {"train_loss": -20.967849731445312, "global_step": 68296, "epoch": 822} {"train_loss": -20.679798126220703, "global_step": 68297, "epoch": 822} {"train_loss": -20.524940490722656, "global_step": 68298, "epoch": 822} {"train_loss": -21.011747360229492, "global_step": 68299, "epoch": 822} {"train_loss": -20.786731719970703, "global_step": 68300, "epoch": 822} {"train_loss": -20.9337215423584, "global_step": 68301, "epoch": 822} {"train_loss": -20.676738739013672, "global_step": 68302, "epoch": 822} {"train_loss": -20.31467628479004, "global_step": 68303, "epoch": 822} {"train_loss": -20.960905075073242, "global_step": 68304, "epoch": 822} {"train_loss": -21.111480712890625, "global_step": 68305, "epoch": 822} {"train_loss": -20.724027633666992, "global_step": 68306, "epoch": 822} {"train_loss": -20.763561248779297, "global_step": 68307, "epoch": 822} {"train_loss": -20.71404151456902, "global_step": 68308, "epoch": 822, "val_loss": 5986389.5} {"train_loss": -20.711889266967773, "global_step": 68309, "epoch": 823} {"train_loss": -21.00252342224121, "global_step": 68310, "epoch": 823} {"train_loss": -20.497140884399414, "global_step": 68311, "epoch": 823} {"train_loss": -20.725238800048828, "global_step": 68312, "epoch": 823} {"train_loss": -20.746061325073242, "global_step": 68313, "epoch": 823} {"train_loss": -20.573022842407227, "global_step": 68314, "epoch": 823} {"train_loss": -20.91939926147461, "global_step": 68315, "epoch": 823} {"train_loss": -20.821378707885742, "global_step": 68316, "epoch": 823} {"train_loss": -20.603967666625977, "global_step": 68317, "epoch": 823} {"train_loss": -20.685110092163086, "global_step": 68318, "epoch": 823} {"train_loss": -20.94467544555664, "global_step": 68319, "epoch": 823} {"train_loss": -20.778942108154297, "global_step": 68320, "epoch": 823} {"train_loss": -20.702985763549805, "global_step": 68321, "epoch": 823} {"train_loss": -20.914541244506836, "global_step": 68322, "epoch": 823} {"train_loss": -20.541244506835938, "global_step": 68323, "epoch": 823} {"train_loss": -20.2226619720459, "global_step": 68324, "epoch": 823} {"train_loss": -20.83321189880371, "global_step": 68325, "epoch": 823} {"train_loss": -20.433124542236328, "global_step": 68326, "epoch": 823} {"train_loss": -20.873218536376953, "global_step": 68327, "epoch": 823} {"train_loss": -20.46773338317871, "global_step": 68328, "epoch": 823} {"train_loss": -20.713415145874023, "global_step": 68329, "epoch": 823} {"train_loss": -20.66902732849121, "global_step": 68330, "epoch": 823} {"train_loss": -20.813297271728516, "global_step": 68331, "epoch": 823} {"train_loss": -20.784910202026367, "global_step": 68332, "epoch": 823} {"train_loss": -20.972944259643555, "global_step": 68333, "epoch": 823} {"train_loss": -20.56947135925293, "global_step": 68334, "epoch": 823} {"train_loss": -20.905168533325195, "global_step": 68335, "epoch": 823} {"train_loss": -20.785757064819336, "global_step": 68336, "epoch": 823} {"train_loss": -20.810537338256836, "global_step": 68337, "epoch": 823} {"train_loss": -20.2934627532959, "global_step": 68338, "epoch": 823} {"train_loss": -20.81153106689453, "global_step": 68339, "epoch": 823} {"train_loss": -20.39303970336914, "global_step": 68340, "epoch": 823} {"train_loss": -20.137210845947266, "global_step": 68341, "epoch": 823} {"train_loss": -20.874998092651367, "global_step": 68342, "epoch": 823} {"train_loss": -20.4385986328125, "global_step": 68343, "epoch": 823} {"train_loss": -20.99074363708496, "global_step": 68344, "epoch": 823} {"train_loss": -20.759729385375977, "global_step": 68345, "epoch": 823} {"train_loss": -21.050918579101562, "global_step": 68346, "epoch": 823} {"train_loss": -20.83237075805664, "global_step": 68347, "epoch": 823} {"train_loss": -20.921573638916016, "global_step": 68348, "epoch": 823} {"train_loss": -20.745365142822266, "global_step": 68349, "epoch": 823} {"train_loss": -20.916616439819336, "global_step": 68350, "epoch": 823} {"train_loss": -20.83623695373535, "global_step": 68351, "epoch": 823} {"train_loss": -20.94626235961914, "global_step": 68352, "epoch": 823} {"train_loss": -20.235795974731445, "global_step": 68353, "epoch": 823} {"train_loss": -20.397825241088867, "global_step": 68354, "epoch": 823} {"train_loss": -21.042295455932617, "global_step": 68355, "epoch": 823} {"train_loss": -20.275236129760742, "global_step": 68356, "epoch": 823} {"train_loss": -20.695880889892578, "global_step": 68357, "epoch": 823} {"train_loss": -20.56439971923828, "global_step": 68358, "epoch": 823} {"train_loss": -20.4410400390625, "global_step": 68359, "epoch": 823} {"train_loss": -20.662452697753906, "global_step": 68360, "epoch": 823} {"train_loss": -20.5474796295166, "global_step": 68361, "epoch": 823} {"train_loss": -20.777685165405273, "global_step": 68362, "epoch": 823} {"train_loss": -20.450387954711914, "global_step": 68363, "epoch": 823} {"train_loss": -20.683025360107422, "global_step": 68364, "epoch": 823} {"train_loss": -20.74355125427246, "global_step": 68365, "epoch": 823} {"train_loss": -20.751724243164062, "global_step": 68366, "epoch": 823} {"train_loss": -21.132844924926758, "global_step": 68367, "epoch": 823} {"train_loss": -20.38555335998535, "global_step": 68368, "epoch": 823} {"train_loss": -20.652910232543945, "global_step": 68369, "epoch": 823} {"train_loss": -20.567331314086914, "global_step": 68370, "epoch": 823} {"train_loss": -20.62395477294922, "global_step": 68371, "epoch": 823} {"train_loss": -20.71060562133789, "global_step": 68372, "epoch": 823} {"train_loss": -20.570117950439453, "global_step": 68373, "epoch": 823} {"train_loss": -20.67133903503418, "global_step": 68374, "epoch": 823} {"train_loss": -20.408926010131836, "global_step": 68375, "epoch": 823} {"train_loss": -20.945466995239258, "global_step": 68376, "epoch": 823} {"train_loss": -20.764135360717773, "global_step": 68377, "epoch": 823} {"train_loss": -20.7418270111084, "global_step": 68378, "epoch": 823} {"train_loss": -21.075122833251953, "global_step": 68379, "epoch": 823} {"train_loss": -20.71780014038086, "global_step": 68380, "epoch": 823} {"train_loss": -20.84369468688965, "global_step": 68381, "epoch": 823} {"train_loss": -21.031423568725586, "global_step": 68382, "epoch": 823} {"train_loss": -21.007461547851562, "global_step": 68383, "epoch": 823} {"train_loss": -20.63216209411621, "global_step": 68384, "epoch": 823} {"train_loss": -20.79038429260254, "global_step": 68385, "epoch": 823} {"train_loss": -20.880538940429688, "global_step": 68386, "epoch": 823} {"train_loss": -20.780136108398438, "global_step": 68387, "epoch": 823} {"train_loss": -20.897214889526367, "global_step": 68388, "epoch": 823} {"train_loss": -20.76358985900879, "global_step": 68389, "epoch": 823} {"train_loss": -20.88273048400879, "global_step": 68390, "epoch": 823} {"train_loss": -20.713515270187195, "global_step": 68391, "epoch": 823, "val_loss": 5884471.5} {"train_loss": -20.194303512573242, "global_step": 68392, "epoch": 824} {"train_loss": -20.243444442749023, "global_step": 68393, "epoch": 824} {"train_loss": -20.456552505493164, "global_step": 68394, "epoch": 824} {"train_loss": -20.360841751098633, "global_step": 68395, "epoch": 824} {"train_loss": -20.66365623474121, "global_step": 68396, "epoch": 824} {"train_loss": -20.581575393676758, "global_step": 68397, "epoch": 824} {"train_loss": -20.77461814880371, "global_step": 68398, "epoch": 824} {"train_loss": -20.83686637878418, "global_step": 68399, "epoch": 824} {"train_loss": -20.913129806518555, "global_step": 68400, "epoch": 824} {"train_loss": -20.622072219848633, "global_step": 68401, "epoch": 824} {"train_loss": -20.7855281829834, "global_step": 68402, "epoch": 824} {"train_loss": -20.8061580657959, "global_step": 68403, "epoch": 824} {"train_loss": -20.688989639282227, "global_step": 68404, "epoch": 824} {"train_loss": -20.670156478881836, "global_step": 68405, "epoch": 824} {"train_loss": -20.416921615600586, "global_step": 68406, "epoch": 824} {"train_loss": -20.831497192382812, "global_step": 68407, "epoch": 824} {"train_loss": -20.925113677978516, "global_step": 68408, "epoch": 824} {"train_loss": -21.107580184936523, "global_step": 68409, "epoch": 824} {"train_loss": -20.49965476989746, "global_step": 68410, "epoch": 824} {"train_loss": -20.625181198120117, "global_step": 68411, "epoch": 824} {"train_loss": -21.442523956298828, "global_step": 68412, "epoch": 824} {"train_loss": -20.716596603393555, "global_step": 68413, "epoch": 824} {"train_loss": -20.253244400024414, "global_step": 68414, "epoch": 824} {"train_loss": -20.99091911315918, "global_step": 68415, "epoch": 824} {"train_loss": -20.669845581054688, "global_step": 68416, "epoch": 824} {"train_loss": -20.914451599121094, "global_step": 68417, "epoch": 824} {"train_loss": -20.854883193969727, "global_step": 68418, "epoch": 824} {"train_loss": -20.51608657836914, "global_step": 68419, "epoch": 824} {"train_loss": -20.888273239135742, "global_step": 68420, "epoch": 824} {"train_loss": -20.83208656311035, "global_step": 68421, "epoch": 824} {"train_loss": -20.722476959228516, "global_step": 68422, "epoch": 824} {"train_loss": -20.862565994262695, "global_step": 68423, "epoch": 824} {"train_loss": -20.422649383544922, "global_step": 68424, "epoch": 824} {"train_loss": -21.038663864135742, "global_step": 68425, "epoch": 824} {"train_loss": -20.383947372436523, "global_step": 68426, "epoch": 824} {"train_loss": -20.790884017944336, "global_step": 68427, "epoch": 824} {"train_loss": -20.52589988708496, "global_step": 68428, "epoch": 824} {"train_loss": -20.701772689819336, "global_step": 68429, "epoch": 824} {"train_loss": -20.558286666870117, "global_step": 68430, "epoch": 824} {"train_loss": -20.53833770751953, "global_step": 68431, "epoch": 824} {"train_loss": -20.473848342895508, "global_step": 68432, "epoch": 824} {"train_loss": -20.812759399414062, "global_step": 68433, "epoch": 824} {"train_loss": -20.58101463317871, "global_step": 68434, "epoch": 824} {"train_loss": -20.743247985839844, "global_step": 68435, "epoch": 824} {"train_loss": -20.8772029876709, "global_step": 68436, "epoch": 824} {"train_loss": -20.576065063476562, "global_step": 68437, "epoch": 824} {"train_loss": -20.536338806152344, "global_step": 68438, "epoch": 824} {"train_loss": -20.53435707092285, "global_step": 68439, "epoch": 824} {"train_loss": -20.61124610900879, "global_step": 68440, "epoch": 824} {"train_loss": -20.547109603881836, "global_step": 68441, "epoch": 824} {"train_loss": -20.754850387573242, "global_step": 68442, "epoch": 824} {"train_loss": -20.802865982055664, "global_step": 68443, "epoch": 824} {"train_loss": -20.483184814453125, "global_step": 68444, "epoch": 824} {"train_loss": -20.950088500976562, "global_step": 68445, "epoch": 824} {"train_loss": -20.7565975189209, "global_step": 68446, "epoch": 824} {"train_loss": -20.83734703063965, "global_step": 68447, "epoch": 824} {"train_loss": -20.5311336517334, "global_step": 68448, "epoch": 824} {"train_loss": -20.725980758666992, "global_step": 68449, "epoch": 824} {"train_loss": -20.69179916381836, "global_step": 68450, "epoch": 824} {"train_loss": -20.67682456970215, "global_step": 68451, "epoch": 824} {"train_loss": -20.462202072143555, "global_step": 68452, "epoch": 824} {"train_loss": -20.637311935424805, "global_step": 68453, "epoch": 824} {"train_loss": -20.66966438293457, "global_step": 68454, "epoch": 824} {"train_loss": -20.725969314575195, "global_step": 68455, "epoch": 824} {"train_loss": -20.782623291015625, "global_step": 68456, "epoch": 824} {"train_loss": -20.78076934814453, "global_step": 68457, "epoch": 824} {"train_loss": -20.74222755432129, "global_step": 68458, "epoch": 824} {"train_loss": -20.610910415649414, "global_step": 68459, "epoch": 824} {"train_loss": -20.650564193725586, "global_step": 68460, "epoch": 824} {"train_loss": -20.725784301757812, "global_step": 68461, "epoch": 824} {"train_loss": -20.718477249145508, "global_step": 68462, "epoch": 824} {"train_loss": -21.20526695251465, "global_step": 68463, "epoch": 824} {"train_loss": -21.00201988220215, "global_step": 68464, "epoch": 824} {"train_loss": -20.606428146362305, "global_step": 68465, "epoch": 824} {"train_loss": -20.810712814331055, "global_step": 68466, "epoch": 824} {"train_loss": -20.830705642700195, "global_step": 68467, "epoch": 824} {"train_loss": -20.718128204345703, "global_step": 68468, "epoch": 824} {"train_loss": -21.043842315673828, "global_step": 68469, "epoch": 824} {"train_loss": -20.684566497802734, "global_step": 68470, "epoch": 824} {"train_loss": -21.003559112548828, "global_step": 68471, "epoch": 824} {"train_loss": -20.86213493347168, "global_step": 68472, "epoch": 824} {"train_loss": -20.641542434692383, "global_step": 68473, "epoch": 824} {"train_loss": -20.712404664740504, "global_step": 68474, "epoch": 824, "val_loss": 6129793.5} {"train_loss": -19.859569549560547, "global_step": 68475, "epoch": 825} {"train_loss": -20.646997451782227, "global_step": 68476, "epoch": 825} {"train_loss": -20.219575881958008, "global_step": 68477, "epoch": 825} {"train_loss": -20.672521591186523, "global_step": 68478, "epoch": 825} {"train_loss": -20.383926391601562, "global_step": 68479, "epoch": 825} {"train_loss": -20.879026412963867, "global_step": 68480, "epoch": 825} {"train_loss": -19.85371208190918, "global_step": 68481, "epoch": 825} {"train_loss": -20.562177658081055, "global_step": 68482, "epoch": 825} {"train_loss": -20.1731014251709, "global_step": 68483, "epoch": 825} {"train_loss": -21.09228515625, "global_step": 68484, "epoch": 825} {"train_loss": -20.588973999023438, "global_step": 68485, "epoch": 825} {"train_loss": -20.49448585510254, "global_step": 68486, "epoch": 825} {"train_loss": -20.48699378967285, "global_step": 68487, "epoch": 825} {"train_loss": -20.587787628173828, "global_step": 68488, "epoch": 825} {"train_loss": -20.558319091796875, "global_step": 68489, "epoch": 825} {"train_loss": -20.485280990600586, "global_step": 68490, "epoch": 825} {"train_loss": -20.340726852416992, "global_step": 68491, "epoch": 825} {"train_loss": -20.7470703125, "global_step": 68492, "epoch": 825} {"train_loss": -20.70212173461914, "global_step": 68493, "epoch": 825} {"train_loss": -20.862659454345703, "global_step": 68494, "epoch": 825} {"train_loss": -20.58792495727539, "global_step": 68495, "epoch": 825} {"train_loss": -20.231952667236328, "global_step": 68496, "epoch": 825} {"train_loss": -20.55156135559082, "global_step": 68497, "epoch": 825} {"train_loss": -20.693002700805664, "global_step": 68498, "epoch": 825} {"train_loss": -20.4499568939209, "global_step": 68499, "epoch": 825} {"train_loss": -20.718952178955078, "global_step": 68500, "epoch": 825} {"train_loss": -21.053598403930664, "global_step": 68501, "epoch": 825} {"train_loss": -20.6214656829834, "global_step": 68502, "epoch": 825} {"train_loss": -20.44453239440918, "global_step": 68503, "epoch": 825} {"train_loss": -21.013675689697266, "global_step": 68504, "epoch": 825} {"train_loss": -20.7063045501709, "global_step": 68505, "epoch": 825} {"train_loss": -20.843860626220703, "global_step": 68506, "epoch": 825} {"train_loss": -20.909889221191406, "global_step": 68507, "epoch": 825} {"train_loss": -20.765832901000977, "global_step": 68508, "epoch": 825} {"train_loss": -20.340375900268555, "global_step": 68509, "epoch": 825} {"train_loss": -20.42448616027832, "global_step": 68510, "epoch": 825} {"train_loss": -20.56880760192871, "global_step": 68511, "epoch": 825} {"train_loss": -21.11895751953125, "global_step": 68512, "epoch": 825} {"train_loss": -20.70625114440918, "global_step": 68513, "epoch": 825} {"train_loss": -20.951440811157227, "global_step": 68514, "epoch": 825} {"train_loss": -20.56024742126465, "global_step": 68515, "epoch": 825} {"train_loss": -20.772998809814453, "global_step": 68516, "epoch": 825} {"train_loss": -20.721881866455078, "global_step": 68517, "epoch": 825} {"train_loss": -21.06226348876953, "global_step": 68518, "epoch": 825} {"train_loss": -20.3359432220459, "global_step": 68519, "epoch": 825} {"train_loss": -20.645811080932617, "global_step": 68520, "epoch": 825} {"train_loss": -20.88445472717285, "global_step": 68521, "epoch": 825} {"train_loss": -20.714677810668945, "global_step": 68522, "epoch": 825} {"train_loss": -20.88471031188965, "global_step": 68523, "epoch": 825} {"train_loss": -20.71974754333496, "global_step": 68524, "epoch": 825} {"train_loss": -20.80548095703125, "global_step": 68525, "epoch": 825} {"train_loss": -21.124013900756836, "global_step": 68526, "epoch": 825} {"train_loss": -20.998918533325195, "global_step": 68527, "epoch": 825} {"train_loss": -20.520042419433594, "global_step": 68528, "epoch": 825} {"train_loss": -20.972806930541992, "global_step": 68529, "epoch": 825} {"train_loss": -20.869932174682617, "global_step": 68530, "epoch": 825} {"train_loss": -20.577810287475586, "global_step": 68531, "epoch": 825} {"train_loss": -20.535491943359375, "global_step": 68532, "epoch": 825} {"train_loss": -20.60901641845703, "global_step": 68533, "epoch": 825} {"train_loss": -20.654294967651367, "global_step": 68534, "epoch": 825} {"train_loss": -20.938196182250977, "global_step": 68535, "epoch": 825} {"train_loss": -20.5694580078125, "global_step": 68536, "epoch": 825} {"train_loss": -20.742290496826172, "global_step": 68537, "epoch": 825} {"train_loss": -20.660079956054688, "global_step": 68538, "epoch": 825} {"train_loss": -20.48238182067871, "global_step": 68539, "epoch": 825} {"train_loss": -20.341632843017578, "global_step": 68540, "epoch": 825} {"train_loss": -21.09402847290039, "global_step": 68541, "epoch": 825} {"train_loss": -20.87519645690918, "global_step": 68542, "epoch": 825} {"train_loss": -20.87240982055664, "global_step": 68543, "epoch": 825} {"train_loss": -20.814970016479492, "global_step": 68544, "epoch": 825} {"train_loss": -20.517438888549805, "global_step": 68545, "epoch": 825} {"train_loss": -20.84186363220215, "global_step": 68546, "epoch": 825} {"train_loss": -21.000171661376953, "global_step": 68547, "epoch": 825} {"train_loss": -20.627363204956055, "global_step": 68548, "epoch": 825} {"train_loss": -20.887256622314453, "global_step": 68549, "epoch": 825} {"train_loss": -20.27805519104004, "global_step": 68550, "epoch": 825} {"train_loss": -20.69002342224121, "global_step": 68551, "epoch": 825} {"train_loss": -20.994979858398438, "global_step": 68552, "epoch": 825} {"train_loss": -20.553939819335938, "global_step": 68553, "epoch": 825} {"train_loss": -20.666349411010742, "global_step": 68554, "epoch": 825} {"train_loss": -20.825239181518555, "global_step": 68555, "epoch": 825} {"train_loss": -20.891111373901367, "global_step": 68556, "epoch": 825} {"train_loss": -20.683585178421204, "global_step": 68557, "epoch": 825, "val_loss": 5949947.5} {"train_loss": -20.523998260498047, "global_step": 68558, "epoch": 826} {"train_loss": -20.418079376220703, "global_step": 68559, "epoch": 826} {"train_loss": -20.45725440979004, "global_step": 68560, "epoch": 826} {"train_loss": -20.395360946655273, "global_step": 68561, "epoch": 826} {"train_loss": -20.57172203063965, "global_step": 68562, "epoch": 826} {"train_loss": -20.360782623291016, "global_step": 68563, "epoch": 826} {"train_loss": -20.58363914489746, "global_step": 68564, "epoch": 826} {"train_loss": -20.87806510925293, "global_step": 68565, "epoch": 826} {"train_loss": -20.394290924072266, "global_step": 68566, "epoch": 826} {"train_loss": -20.519529342651367, "global_step": 68567, "epoch": 826} {"train_loss": -21.057615280151367, "global_step": 68568, "epoch": 826} {"train_loss": -20.541032791137695, "global_step": 68569, "epoch": 826} {"train_loss": -20.82413101196289, "global_step": 68570, "epoch": 826} {"train_loss": -20.728805541992188, "global_step": 68571, "epoch": 826} {"train_loss": -20.909854888916016, "global_step": 68572, "epoch": 826} {"train_loss": -20.55124282836914, "global_step": 68573, "epoch": 826} {"train_loss": -21.00021743774414, "global_step": 68574, "epoch": 826} {"train_loss": -20.666915893554688, "global_step": 68575, "epoch": 826} {"train_loss": -20.969972610473633, "global_step": 68576, "epoch": 826} {"train_loss": -20.773181915283203, "global_step": 68577, "epoch": 826} {"train_loss": -20.86256217956543, "global_step": 68578, "epoch": 826} {"train_loss": -20.843435287475586, "global_step": 68579, "epoch": 826} {"train_loss": -20.80767250061035, "global_step": 68580, "epoch": 826} {"train_loss": -20.749210357666016, "global_step": 68581, "epoch": 826} {"train_loss": -20.614316940307617, "global_step": 68582, "epoch": 826} {"train_loss": -21.03480339050293, "global_step": 68583, "epoch": 826} {"train_loss": -20.74639129638672, "global_step": 68584, "epoch": 826} {"train_loss": -21.096899032592773, "global_step": 68585, "epoch": 826} {"train_loss": -20.615041732788086, "global_step": 68586, "epoch": 826} {"train_loss": -20.405179977416992, "global_step": 68587, "epoch": 826} {"train_loss": -20.71288299560547, "global_step": 68588, "epoch": 826} {"train_loss": -20.777015686035156, "global_step": 68589, "epoch": 826} {"train_loss": -20.589025497436523, "global_step": 68590, "epoch": 826} {"train_loss": -20.85444450378418, "global_step": 68591, "epoch": 826} {"train_loss": -20.7938289642334, "global_step": 68592, "epoch": 826} {"train_loss": -20.66292953491211, "global_step": 68593, "epoch": 826} {"train_loss": -20.716636657714844, "global_step": 68594, "epoch": 826} {"train_loss": -20.578269958496094, "global_step": 68595, "epoch": 826} {"train_loss": -20.58784294128418, "global_step": 68596, "epoch": 826} {"train_loss": -20.8530216217041, "global_step": 68597, "epoch": 826} {"train_loss": -20.983259201049805, "global_step": 68598, "epoch": 826} {"train_loss": -20.97712516784668, "global_step": 68599, "epoch": 826} {"train_loss": -20.628713607788086, "global_step": 68600, "epoch": 826} {"train_loss": -20.58146095275879, "global_step": 68601, "epoch": 826} {"train_loss": -20.973508834838867, "global_step": 68602, "epoch": 826} {"train_loss": -21.17671775817871, "global_step": 68603, "epoch": 826} {"train_loss": -20.636564254760742, "global_step": 68604, "epoch": 826} {"train_loss": -20.70958709716797, "global_step": 68605, "epoch": 826} {"train_loss": -20.426061630249023, "global_step": 68606, "epoch": 826} {"train_loss": -20.404401779174805, "global_step": 68607, "epoch": 826} {"train_loss": -20.97620964050293, "global_step": 68608, "epoch": 826} {"train_loss": -20.86362648010254, "global_step": 68609, "epoch": 826} {"train_loss": -20.53757667541504, "global_step": 68610, "epoch": 826} {"train_loss": -20.638748168945312, "global_step": 68611, "epoch": 826} {"train_loss": -20.838090896606445, "global_step": 68612, "epoch": 826} {"train_loss": -20.820646286010742, "global_step": 68613, "epoch": 826} {"train_loss": -20.964487075805664, "global_step": 68614, "epoch": 826} {"train_loss": -20.46116065979004, "global_step": 68615, "epoch": 826} {"train_loss": -20.53196144104004, "global_step": 68616, "epoch": 826} {"train_loss": -20.64859962463379, "global_step": 68617, "epoch": 826} {"train_loss": -20.903234481811523, "global_step": 68618, "epoch": 826} {"train_loss": -20.571163177490234, "global_step": 68619, "epoch": 826} {"train_loss": -20.34401512145996, "global_step": 68620, "epoch": 826} {"train_loss": -20.554967880249023, "global_step": 68621, "epoch": 826} {"train_loss": -20.63673210144043, "global_step": 68622, "epoch": 826} {"train_loss": -20.538818359375, "global_step": 68623, "epoch": 826} {"train_loss": -20.61626625061035, "global_step": 68624, "epoch": 826} {"train_loss": -20.803131103515625, "global_step": 68625, "epoch": 826} {"train_loss": -20.94899559020996, "global_step": 68626, "epoch": 826} {"train_loss": -20.5423641204834, "global_step": 68627, "epoch": 826} {"train_loss": -21.038419723510742, "global_step": 68628, "epoch": 826} {"train_loss": -20.91219711303711, "global_step": 68629, "epoch": 826} {"train_loss": -20.617971420288086, "global_step": 68630, "epoch": 826} {"train_loss": -20.733854293823242, "global_step": 68631, "epoch": 826} {"train_loss": -20.865209579467773, "global_step": 68632, "epoch": 826} {"train_loss": -20.799806594848633, "global_step": 68633, "epoch": 826} {"train_loss": -21.046045303344727, "global_step": 68634, "epoch": 826} {"train_loss": -20.30531120300293, "global_step": 68635, "epoch": 826} {"train_loss": -20.71517562866211, "global_step": 68636, "epoch": 826} {"train_loss": -20.683107376098633, "global_step": 68637, "epoch": 826} {"train_loss": -20.716245651245117, "global_step": 68638, "epoch": 826} {"train_loss": -20.933263778686523, "global_step": 68639, "epoch": 826} {"train_loss": -20.724453799695855, "global_step": 68640, "epoch": 826, "val_loss": 5943430.5} {"train_loss": -20.643949508666992, "global_step": 68641, "epoch": 827} {"train_loss": -20.511302947998047, "global_step": 68642, "epoch": 827} {"train_loss": -20.184049606323242, "global_step": 68643, "epoch": 827} {"train_loss": -20.629026412963867, "global_step": 68644, "epoch": 827} {"train_loss": -20.469144821166992, "global_step": 68645, "epoch": 827} {"train_loss": -20.557302474975586, "global_step": 68646, "epoch": 827} {"train_loss": -20.51416015625, "global_step": 68647, "epoch": 827} {"train_loss": -20.77425193786621, "global_step": 68648, "epoch": 827} {"train_loss": -20.980802536010742, "global_step": 68649, "epoch": 827} {"train_loss": -20.85811424255371, "global_step": 68650, "epoch": 827} {"train_loss": -20.73772621154785, "global_step": 68651, "epoch": 827} {"train_loss": -20.661346435546875, "global_step": 68652, "epoch": 827} {"train_loss": -20.732614517211914, "global_step": 68653, "epoch": 827} {"train_loss": -20.85149383544922, "global_step": 68654, "epoch": 827} {"train_loss": -20.395421981811523, "global_step": 68655, "epoch": 827} {"train_loss": -20.727466583251953, "global_step": 68656, "epoch": 827} {"train_loss": -20.586761474609375, "global_step": 68657, "epoch": 827} {"train_loss": -20.93397331237793, "global_step": 68658, "epoch": 827} {"train_loss": -20.62959098815918, "global_step": 68659, "epoch": 827} {"train_loss": -20.87872314453125, "global_step": 68660, "epoch": 827} {"train_loss": -20.662424087524414, "global_step": 68661, "epoch": 827} {"train_loss": -20.575349807739258, "global_step": 68662, "epoch": 827} {"train_loss": -20.699548721313477, "global_step": 68663, "epoch": 827} {"train_loss": -20.745296478271484, "global_step": 68664, "epoch": 827} {"train_loss": -20.8658504486084, "global_step": 68665, "epoch": 827} {"train_loss": -20.55791664123535, "global_step": 68666, "epoch": 827} {"train_loss": -20.765823364257812, "global_step": 68667, "epoch": 827} {"train_loss": -20.906484603881836, "global_step": 68668, "epoch": 827} {"train_loss": -20.606552124023438, "global_step": 68669, "epoch": 827} {"train_loss": -20.606721878051758, "global_step": 68670, "epoch": 827} {"train_loss": -20.863595962524414, "global_step": 68671, "epoch": 827} {"train_loss": -20.598684310913086, "global_step": 68672, "epoch": 827} {"train_loss": -20.45533561706543, "global_step": 68673, "epoch": 827} {"train_loss": -20.856325149536133, "global_step": 68674, "epoch": 827} {"train_loss": -20.745189666748047, "global_step": 68675, "epoch": 827} {"train_loss": -20.43762969970703, "global_step": 68676, "epoch": 827} {"train_loss": -20.826017379760742, "global_step": 68677, "epoch": 827} {"train_loss": -21.025192260742188, "global_step": 68678, "epoch": 827} {"train_loss": -20.48988151550293, "global_step": 68679, "epoch": 827} {"train_loss": -20.689420700073242, "global_step": 68680, "epoch": 827} {"train_loss": -20.954980850219727, "global_step": 68681, "epoch": 827} {"train_loss": -20.7232723236084, "global_step": 68682, "epoch": 827} {"train_loss": -20.714750289916992, "global_step": 68683, "epoch": 827} {"train_loss": -20.716007232666016, "global_step": 68684, "epoch": 827} {"train_loss": -20.698686599731445, "global_step": 68685, "epoch": 827} {"train_loss": -20.602598190307617, "global_step": 68686, "epoch": 827} {"train_loss": -20.71025848388672, "global_step": 68687, "epoch": 827} {"train_loss": -20.67327880859375, "global_step": 68688, "epoch": 827} {"train_loss": -20.336252212524414, "global_step": 68689, "epoch": 827} {"train_loss": -20.754697799682617, "global_step": 68690, "epoch": 827} {"train_loss": -20.474470138549805, "global_step": 68691, "epoch": 827} {"train_loss": -21.0423526763916, "global_step": 68692, "epoch": 827} {"train_loss": -20.580293655395508, "global_step": 68693, "epoch": 827} {"train_loss": -20.392595291137695, "global_step": 68694, "epoch": 827} {"train_loss": -20.616727828979492, "global_step": 68695, "epoch": 827} {"train_loss": -21.230602264404297, "global_step": 68696, "epoch": 827} {"train_loss": -20.776824951171875, "global_step": 68697, "epoch": 827} {"train_loss": -20.47501564025879, "global_step": 68698, "epoch": 827} {"train_loss": -20.91847801208496, "global_step": 68699, "epoch": 827} {"train_loss": -20.4245548248291, "global_step": 68700, "epoch": 827} {"train_loss": -20.915882110595703, "global_step": 68701, "epoch": 827} {"train_loss": -20.570234298706055, "global_step": 68702, "epoch": 827} {"train_loss": -20.731719970703125, "global_step": 68703, "epoch": 827} {"train_loss": -20.967615127563477, "global_step": 68704, "epoch": 827} {"train_loss": -20.41375160217285, "global_step": 68705, "epoch": 827} {"train_loss": -20.728437423706055, "global_step": 68706, "epoch": 827} {"train_loss": -20.60586929321289, "global_step": 68707, "epoch": 827} {"train_loss": -20.681528091430664, "global_step": 68708, "epoch": 827} {"train_loss": -20.826852798461914, "global_step": 68709, "epoch": 827} {"train_loss": -20.891199111938477, "global_step": 68710, "epoch": 827} {"train_loss": -20.827470779418945, "global_step": 68711, "epoch": 827} {"train_loss": -21.236297607421875, "global_step": 68712, "epoch": 827} {"train_loss": -20.677650451660156, "global_step": 68713, "epoch": 827} {"train_loss": -20.806015014648438, "global_step": 68714, "epoch": 827} {"train_loss": -20.378171920776367, "global_step": 68715, "epoch": 827} {"train_loss": -20.94965934753418, "global_step": 68716, "epoch": 827} {"train_loss": -20.455663681030273, "global_step": 68717, "epoch": 827} {"train_loss": -21.077810287475586, "global_step": 68718, "epoch": 827} {"train_loss": -20.885648727416992, "global_step": 68719, "epoch": 827} {"train_loss": -20.739843368530273, "global_step": 68720, "epoch": 827} {"train_loss": -20.631010055541992, "global_step": 68721, "epoch": 827} {"train_loss": -20.69329261779785, "global_step": 68722, "epoch": 827} {"train_loss": -20.703662045030708, "global_step": 68723, "epoch": 827, "val_loss": 6174661.0} {"train_loss": -20.178434371948242, "global_step": 68724, "epoch": 828} {"train_loss": -19.966283798217773, "global_step": 68725, "epoch": 828} {"train_loss": -20.44782829284668, "global_step": 68726, "epoch": 828} {"train_loss": -20.222835540771484, "global_step": 68727, "epoch": 828} {"train_loss": -20.349475860595703, "global_step": 68728, "epoch": 828} {"train_loss": -20.49295997619629, "global_step": 68729, "epoch": 828} {"train_loss": -20.37641143798828, "global_step": 68730, "epoch": 828} {"train_loss": -20.298866271972656, "global_step": 68731, "epoch": 828} {"train_loss": -20.440128326416016, "global_step": 68732, "epoch": 828} {"train_loss": -20.707853317260742, "global_step": 68733, "epoch": 828} {"train_loss": -20.66143035888672, "global_step": 68734, "epoch": 828} {"train_loss": -20.48328971862793, "global_step": 68735, "epoch": 828} {"train_loss": -20.519330978393555, "global_step": 68736, "epoch": 828} {"train_loss": -20.477081298828125, "global_step": 68737, "epoch": 828} {"train_loss": -20.57895851135254, "global_step": 68738, "epoch": 828} {"train_loss": -20.612220764160156, "global_step": 68739, "epoch": 828} {"train_loss": -20.712003707885742, "global_step": 68740, "epoch": 828} {"train_loss": -20.740570068359375, "global_step": 68741, "epoch": 828} {"train_loss": -20.622060775756836, "global_step": 68742, "epoch": 828} {"train_loss": -20.65000343322754, "global_step": 68743, "epoch": 828} {"train_loss": -20.50851821899414, "global_step": 68744, "epoch": 828} {"train_loss": -20.895326614379883, "global_step": 68745, "epoch": 828} {"train_loss": -20.354995727539062, "global_step": 68746, "epoch": 828} {"train_loss": -21.03156852722168, "global_step": 68747, "epoch": 828} {"train_loss": -20.957141876220703, "global_step": 68748, "epoch": 828} {"train_loss": -20.745288848876953, "global_step": 68749, "epoch": 828} {"train_loss": -20.919509887695312, "global_step": 68750, "epoch": 828} {"train_loss": -20.58424949645996, "global_step": 68751, "epoch": 828} {"train_loss": -20.7189998626709, "global_step": 68752, "epoch": 828} {"train_loss": -20.70240592956543, "global_step": 68753, "epoch": 828} {"train_loss": -20.954486846923828, "global_step": 68754, "epoch": 828} {"train_loss": -21.015094757080078, "global_step": 68755, "epoch": 828} {"train_loss": -20.67279624938965, "global_step": 68756, "epoch": 828} {"train_loss": -20.6652774810791, "global_step": 68757, "epoch": 828} {"train_loss": -21.003646850585938, "global_step": 68758, "epoch": 828} {"train_loss": -20.963022232055664, "global_step": 68759, "epoch": 828} {"train_loss": -20.78386878967285, "global_step": 68760, "epoch": 828} {"train_loss": -20.665119171142578, "global_step": 68761, "epoch": 828} {"train_loss": -20.80439567565918, "global_step": 68762, "epoch": 828} {"train_loss": -20.800687789916992, "global_step": 68763, "epoch": 828} {"train_loss": -20.667390823364258, "global_step": 68764, "epoch": 828} {"train_loss": -20.433914184570312, "global_step": 68765, "epoch": 828} {"train_loss": -20.825082778930664, "global_step": 68766, "epoch": 828} {"train_loss": -21.079591751098633, "global_step": 68767, "epoch": 828} {"train_loss": -20.533544540405273, "global_step": 68768, "epoch": 828} {"train_loss": -20.905447006225586, "global_step": 68769, "epoch": 828} {"train_loss": -20.477916717529297, "global_step": 68770, "epoch": 828} {"train_loss": -21.275197982788086, "global_step": 68771, "epoch": 828} {"train_loss": -20.49464225769043, "global_step": 68772, "epoch": 828} {"train_loss": -20.822267532348633, "global_step": 68773, "epoch": 828} {"train_loss": -20.947797775268555, "global_step": 68774, "epoch": 828} {"train_loss": -20.86097526550293, "global_step": 68775, "epoch": 828} {"train_loss": -21.266019821166992, "global_step": 68776, "epoch": 828} {"train_loss": -20.500890731811523, "global_step": 68777, "epoch": 828} {"train_loss": -20.959854125976562, "global_step": 68778, "epoch": 828} {"train_loss": -20.76101303100586, "global_step": 68779, "epoch": 828} {"train_loss": -20.63788414001465, "global_step": 68780, "epoch": 828} {"train_loss": -20.817129135131836, "global_step": 68781, "epoch": 828} {"train_loss": -20.8956241607666, "global_step": 68782, "epoch": 828} {"train_loss": -20.765966415405273, "global_step": 68783, "epoch": 828} {"train_loss": -20.783405303955078, "global_step": 68784, "epoch": 828} {"train_loss": -20.709632873535156, "global_step": 68785, "epoch": 828} {"train_loss": -20.3035945892334, "global_step": 68786, "epoch": 828} {"train_loss": -20.401086807250977, "global_step": 68787, "epoch": 828} {"train_loss": -20.716449737548828, "global_step": 68788, "epoch": 828} {"train_loss": -20.836679458618164, "global_step": 68789, "epoch": 828} {"train_loss": -20.988910675048828, "global_step": 68790, "epoch": 828} {"train_loss": -21.437280654907227, "global_step": 68791, "epoch": 828} {"train_loss": -20.834789276123047, "global_step": 68792, "epoch": 828} {"train_loss": -20.859342575073242, "global_step": 68793, "epoch": 828} {"train_loss": -21.00538444519043, "global_step": 68794, "epoch": 828} {"train_loss": -20.970670700073242, "global_step": 68795, "epoch": 828} {"train_loss": -20.94683837890625, "global_step": 68796, "epoch": 828} {"train_loss": -20.943227767944336, "global_step": 68797, "epoch": 828} {"train_loss": -20.918720245361328, "global_step": 68798, "epoch": 828} {"train_loss": -20.58156394958496, "global_step": 68799, "epoch": 828} {"train_loss": -20.965045928955078, "global_step": 68800, "epoch": 828} {"train_loss": -20.885730743408203, "global_step": 68801, "epoch": 828} {"train_loss": -20.763397216796875, "global_step": 68802, "epoch": 828} {"train_loss": -21.0974063873291, "global_step": 68803, "epoch": 828} {"train_loss": -21.20233917236328, "global_step": 68804, "epoch": 828} {"train_loss": -20.63431739807129, "global_step": 68805, "epoch": 828} {"train_loss": -20.746222346662037, "global_step": 68806, "epoch": 828, "val_loss": 5952920.5} {"train_loss": -20.549076080322266, "global_step": 68807, "epoch": 829} {"train_loss": -20.9122314453125, "global_step": 68808, "epoch": 829} {"train_loss": -20.853546142578125, "global_step": 68809, "epoch": 829} {"train_loss": -20.820337295532227, "global_step": 68810, "epoch": 829} {"train_loss": -20.896015167236328, "global_step": 68811, "epoch": 829} {"train_loss": -20.88492202758789, "global_step": 68812, "epoch": 829} {"train_loss": -20.70570945739746, "global_step": 68813, "epoch": 829} {"train_loss": -21.081113815307617, "global_step": 68814, "epoch": 829} {"train_loss": -20.92158317565918, "global_step": 68815, "epoch": 829} {"train_loss": -20.880943298339844, "global_step": 68816, "epoch": 829} {"train_loss": -20.672225952148438, "global_step": 68817, "epoch": 829} {"train_loss": -20.910064697265625, "global_step": 68818, "epoch": 829} {"train_loss": -20.39531898498535, "global_step": 68819, "epoch": 829} {"train_loss": -20.56821632385254, "global_step": 68820, "epoch": 829} {"train_loss": -20.71668815612793, "global_step": 68821, "epoch": 829} {"train_loss": -20.49945640563965, "global_step": 68822, "epoch": 829} {"train_loss": -20.83819007873535, "global_step": 68823, "epoch": 829} {"train_loss": -20.77395248413086, "global_step": 68824, "epoch": 829} {"train_loss": -20.60230827331543, "global_step": 68825, "epoch": 829} {"train_loss": -21.190641403198242, "global_step": 68826, "epoch": 829} {"train_loss": -21.053607940673828, "global_step": 68827, "epoch": 829} {"train_loss": -20.77878761291504, "global_step": 68828, "epoch": 829} {"train_loss": -20.754220962524414, "global_step": 68829, "epoch": 829} {"train_loss": -20.539777755737305, "global_step": 68830, "epoch": 829} {"train_loss": -20.55722999572754, "global_step": 68831, "epoch": 829} {"train_loss": -20.93592643737793, "global_step": 68832, "epoch": 829} {"train_loss": -21.0811767578125, "global_step": 68833, "epoch": 829} {"train_loss": -20.65826988220215, "global_step": 68834, "epoch": 829} {"train_loss": -20.55773162841797, "global_step": 68835, "epoch": 829} {"train_loss": -20.80450439453125, "global_step": 68836, "epoch": 829} {"train_loss": -20.9121150970459, "global_step": 68837, "epoch": 829} {"train_loss": -20.73053550720215, "global_step": 68838, "epoch": 829} {"train_loss": -20.569923400878906, "global_step": 68839, "epoch": 829} {"train_loss": -20.911426544189453, "global_step": 68840, "epoch": 829} {"train_loss": -20.78977394104004, "global_step": 68841, "epoch": 829} {"train_loss": -20.568561553955078, "global_step": 68842, "epoch": 829} {"train_loss": -20.81760025024414, "global_step": 68843, "epoch": 829} {"train_loss": -21.112546920776367, "global_step": 68844, "epoch": 829} {"train_loss": -20.903045654296875, "global_step": 68845, "epoch": 829} {"train_loss": -21.08368492126465, "global_step": 68846, "epoch": 829} {"train_loss": -20.6192684173584, "global_step": 68847, "epoch": 829} {"train_loss": -20.80970573425293, "global_step": 68848, "epoch": 829} {"train_loss": -20.56403160095215, "global_step": 68849, "epoch": 829} {"train_loss": -20.95695686340332, "global_step": 68850, "epoch": 829} {"train_loss": -20.953277587890625, "global_step": 68851, "epoch": 829} {"train_loss": -20.74188232421875, "global_step": 68852, "epoch": 829} {"train_loss": -20.71638298034668, "global_step": 68853, "epoch": 829} {"train_loss": -20.804645538330078, "global_step": 68854, "epoch": 829} {"train_loss": -21.086931228637695, "global_step": 68855, "epoch": 829} {"train_loss": -21.10958480834961, "global_step": 68856, "epoch": 829} {"train_loss": -20.614192962646484, "global_step": 68857, "epoch": 829} {"train_loss": -21.02325439453125, "global_step": 68858, "epoch": 829} {"train_loss": -20.698911666870117, "global_step": 68859, "epoch": 829} {"train_loss": -20.572111129760742, "global_step": 68860, "epoch": 829} {"train_loss": -20.777240753173828, "global_step": 68861, "epoch": 829} {"train_loss": -20.78300666809082, "global_step": 68862, "epoch": 829} {"train_loss": -20.896686553955078, "global_step": 68863, "epoch": 829} {"train_loss": -20.697280883789062, "global_step": 68864, "epoch": 829} {"train_loss": -20.50116539001465, "global_step": 68865, "epoch": 829} {"train_loss": -20.785062789916992, "global_step": 68866, "epoch": 829} {"train_loss": -20.38395118713379, "global_step": 68867, "epoch": 829} {"train_loss": -21.219324111938477, "global_step": 68868, "epoch": 829} {"train_loss": -20.40142250061035, "global_step": 68869, "epoch": 829} {"train_loss": -21.100507736206055, "global_step": 68870, "epoch": 829} {"train_loss": -20.696613311767578, "global_step": 68871, "epoch": 829} {"train_loss": -20.947677612304688, "global_step": 68872, "epoch": 829} {"train_loss": -20.455373764038086, "global_step": 68873, "epoch": 829} {"train_loss": -20.681745529174805, "global_step": 68874, "epoch": 829} {"train_loss": -21.02048683166504, "global_step": 68875, "epoch": 829} {"train_loss": -20.75459861755371, "global_step": 68876, "epoch": 829} {"train_loss": -21.186935424804688, "global_step": 68877, "epoch": 829} {"train_loss": -20.261404037475586, "global_step": 68878, "epoch": 829} {"train_loss": -20.68333625793457, "global_step": 68879, "epoch": 829} {"train_loss": -21.020599365234375, "global_step": 68880, "epoch": 829} {"train_loss": -20.63755989074707, "global_step": 68881, "epoch": 829} {"train_loss": -20.617046356201172, "global_step": 68882, "epoch": 829} {"train_loss": -20.60640525817871, "global_step": 68883, "epoch": 829} {"train_loss": -20.649539947509766, "global_step": 68884, "epoch": 829} {"train_loss": -20.97163963317871, "global_step": 68885, "epoch": 829} {"train_loss": -20.898019790649414, "global_step": 68886, "epoch": 829} {"train_loss": -21.23870277404785, "global_step": 68887, "epoch": 829} {"train_loss": -20.567127227783203, "global_step": 68888, "epoch": 829} {"train_loss": -20.777161931417073, "global_step": 68889, "epoch": 829, "val_loss": 5936458.0} {"train_loss": -20.433500289916992, "global_step": 68890, "epoch": 830} {"train_loss": -20.046873092651367, "global_step": 68891, "epoch": 830} {"train_loss": -20.36566162109375, "global_step": 68892, "epoch": 830} {"train_loss": -20.573902130126953, "global_step": 68893, "epoch": 830} {"train_loss": -20.26932716369629, "global_step": 68894, "epoch": 830} {"train_loss": -20.924354553222656, "global_step": 68895, "epoch": 830} {"train_loss": -20.465469360351562, "global_step": 68896, "epoch": 830} {"train_loss": -20.50533103942871, "global_step": 68897, "epoch": 830} {"train_loss": -20.880197525024414, "global_step": 68898, "epoch": 830} {"train_loss": -20.608362197875977, "global_step": 68899, "epoch": 830} {"train_loss": -20.823183059692383, "global_step": 68900, "epoch": 830} {"train_loss": -20.70600700378418, "global_step": 68901, "epoch": 830} {"train_loss": -20.609521865844727, "global_step": 68902, "epoch": 830} {"train_loss": -20.629867553710938, "global_step": 68903, "epoch": 830} {"train_loss": -20.47930335998535, "global_step": 68904, "epoch": 830} {"train_loss": -20.683218002319336, "global_step": 68905, "epoch": 830} {"train_loss": -20.964975357055664, "global_step": 68906, "epoch": 830} {"train_loss": -20.67741584777832, "global_step": 68907, "epoch": 830} {"train_loss": -20.59034538269043, "global_step": 68908, "epoch": 830} {"train_loss": -20.998767852783203, "global_step": 68909, "epoch": 830} {"train_loss": -20.755664825439453, "global_step": 68910, "epoch": 830} {"train_loss": -20.84518051147461, "global_step": 68911, "epoch": 830} {"train_loss": -21.002994537353516, "global_step": 68912, "epoch": 830} {"train_loss": -20.969375610351562, "global_step": 68913, "epoch": 830} {"train_loss": -20.627887725830078, "global_step": 68914, "epoch": 830} {"train_loss": -20.76920509338379, "global_step": 68915, "epoch": 830} {"train_loss": -20.74264144897461, "global_step": 68916, "epoch": 830} {"train_loss": -20.823505401611328, "global_step": 68917, "epoch": 830} {"train_loss": -20.999296188354492, "global_step": 68918, "epoch": 830} {"train_loss": -21.007837295532227, "global_step": 68919, "epoch": 830} {"train_loss": -21.01736831665039, "global_step": 68920, "epoch": 830} {"train_loss": -20.86189842224121, "global_step": 68921, "epoch": 830} {"train_loss": -20.647506713867188, "global_step": 68922, "epoch": 830} {"train_loss": -21.16059112548828, "global_step": 68923, "epoch": 830} {"train_loss": -20.61508560180664, "global_step": 68924, "epoch": 830} {"train_loss": -20.942285537719727, "global_step": 68925, "epoch": 830} {"train_loss": -20.71359634399414, "global_step": 68926, "epoch": 830} {"train_loss": -20.5883846282959, "global_step": 68927, "epoch": 830} {"train_loss": -20.554250717163086, "global_step": 68928, "epoch": 830} {"train_loss": -20.803068161010742, "global_step": 68929, "epoch": 830} {"train_loss": -21.325037002563477, "global_step": 68930, "epoch": 830} {"train_loss": -20.71337890625, "global_step": 68931, "epoch": 830} {"train_loss": -20.918285369873047, "global_step": 68932, "epoch": 830} {"train_loss": -20.821828842163086, "global_step": 68933, "epoch": 830} {"train_loss": -20.689855575561523, "global_step": 68934, "epoch": 830} {"train_loss": -20.928518295288086, "global_step": 68935, "epoch": 830} {"train_loss": -20.806795120239258, "global_step": 68936, "epoch": 830} {"train_loss": -21.018917083740234, "global_step": 68937, "epoch": 830} {"train_loss": -20.661911010742188, "global_step": 68938, "epoch": 830} {"train_loss": -20.43467140197754, "global_step": 68939, "epoch": 830} {"train_loss": -20.962350845336914, "global_step": 68940, "epoch": 830} {"train_loss": -20.602100372314453, "global_step": 68941, "epoch": 830} {"train_loss": -20.986520767211914, "global_step": 68942, "epoch": 830} {"train_loss": -21.08219337463379, "global_step": 68943, "epoch": 830} {"train_loss": -20.63273048400879, "global_step": 68944, "epoch": 830} {"train_loss": -21.117624282836914, "global_step": 68945, "epoch": 830} {"train_loss": -20.525794982910156, "global_step": 68946, "epoch": 830} {"train_loss": -20.87384605407715, "global_step": 68947, "epoch": 830} {"train_loss": -21.196149826049805, "global_step": 68948, "epoch": 830} {"train_loss": -20.920461654663086, "global_step": 68949, "epoch": 830} {"train_loss": -20.451745986938477, "global_step": 68950, "epoch": 830} {"train_loss": -20.85120391845703, "global_step": 68951, "epoch": 830} {"train_loss": -20.83782386779785, "global_step": 68952, "epoch": 830} {"train_loss": -20.82533836364746, "global_step": 68953, "epoch": 830} {"train_loss": -20.730859756469727, "global_step": 68954, "epoch": 830} {"train_loss": -20.72416114807129, "global_step": 68955, "epoch": 830} {"train_loss": -20.56468963623047, "global_step": 68956, "epoch": 830} {"train_loss": -20.826200485229492, "global_step": 68957, "epoch": 830} {"train_loss": -20.73956871032715, "global_step": 68958, "epoch": 830} {"train_loss": -20.987964630126953, "global_step": 68959, "epoch": 830} {"train_loss": -20.475200653076172, "global_step": 68960, "epoch": 830} {"train_loss": -20.87269401550293, "global_step": 68961, "epoch": 830} {"train_loss": -20.733842849731445, "global_step": 68962, "epoch": 830} {"train_loss": -20.721405029296875, "global_step": 68963, "epoch": 830} {"train_loss": -20.930789947509766, "global_step": 68964, "epoch": 830} {"train_loss": -20.76235580444336, "global_step": 68965, "epoch": 830} {"train_loss": -20.92457389831543, "global_step": 68966, "epoch": 830} {"train_loss": -20.921993255615234, "global_step": 68967, "epoch": 830} {"train_loss": -20.599971771240234, "global_step": 68968, "epoch": 830} {"train_loss": -20.584524154663086, "global_step": 68969, "epoch": 830} {"train_loss": -21.084049224853516, "global_step": 68970, "epoch": 830} {"train_loss": -20.448593139648438, "global_step": 68971, "epoch": 830} {"train_loss": -20.768666830407568, "global_step": 68972, "epoch": 830, "val_loss": 6065464.0} {"train_loss": -20.626073837280273, "global_step": 68973, "epoch": 831} {"train_loss": -20.815488815307617, "global_step": 68974, "epoch": 831} {"train_loss": -20.694852828979492, "global_step": 68975, "epoch": 831} {"train_loss": -20.533878326416016, "global_step": 68976, "epoch": 831} {"train_loss": -20.56599998474121, "global_step": 68977, "epoch": 831} {"train_loss": -20.903623580932617, "global_step": 68978, "epoch": 831} {"train_loss": -20.653799057006836, "global_step": 68979, "epoch": 831} {"train_loss": -20.523630142211914, "global_step": 68980, "epoch": 831} {"train_loss": -20.848339080810547, "global_step": 68981, "epoch": 831} {"train_loss": -21.046361923217773, "global_step": 68982, "epoch": 831} {"train_loss": -20.664234161376953, "global_step": 68983, "epoch": 831} {"train_loss": -20.981693267822266, "global_step": 68984, "epoch": 831} {"train_loss": -21.078641891479492, "global_step": 68985, "epoch": 831} {"train_loss": -20.540996551513672, "global_step": 68986, "epoch": 831} {"train_loss": -20.7908992767334, "global_step": 68987, "epoch": 831} {"train_loss": -20.964344024658203, "global_step": 68988, "epoch": 831} {"train_loss": -20.663095474243164, "global_step": 68989, "epoch": 831} {"train_loss": -20.970495223999023, "global_step": 68990, "epoch": 831} {"train_loss": -20.54632568359375, "global_step": 68991, "epoch": 831} {"train_loss": -20.68430519104004, "global_step": 68992, "epoch": 831} {"train_loss": -21.049436569213867, "global_step": 68993, "epoch": 831} {"train_loss": -21.070764541625977, "global_step": 68994, "epoch": 831} {"train_loss": -20.87579917907715, "global_step": 68995, "epoch": 831} {"train_loss": -20.56800651550293, "global_step": 68996, "epoch": 831} {"train_loss": -20.84467887878418, "global_step": 68997, "epoch": 831} {"train_loss": -20.803281784057617, "global_step": 68998, "epoch": 831} {"train_loss": -20.48966407775879, "global_step": 68999, "epoch": 831} {"train_loss": -20.706005096435547, "global_step": 69000, "epoch": 831} {"train_loss": -21.081350326538086, "global_step": 69001, "epoch": 831} {"train_loss": -20.660104751586914, "global_step": 69002, "epoch": 831} {"train_loss": -20.723730087280273, "global_step": 69003, "epoch": 831} {"train_loss": -20.591388702392578, "global_step": 69004, "epoch": 831} {"train_loss": -20.83644676208496, "global_step": 69005, "epoch": 831} {"train_loss": -20.86604118347168, "global_step": 69006, "epoch": 831} {"train_loss": -20.750173568725586, "global_step": 69007, "epoch": 831} {"train_loss": -20.840402603149414, "global_step": 69008, "epoch": 831} {"train_loss": -20.647327423095703, "global_step": 69009, "epoch": 831} {"train_loss": -21.223175048828125, "global_step": 69010, "epoch": 831} {"train_loss": -20.93772315979004, "global_step": 69011, "epoch": 831} {"train_loss": -20.836450576782227, "global_step": 69012, "epoch": 831} {"train_loss": -20.653839111328125, "global_step": 69013, "epoch": 831} {"train_loss": -20.721670150756836, "global_step": 69014, "epoch": 831} {"train_loss": -20.853837966918945, "global_step": 69015, "epoch": 831} {"train_loss": -20.998579025268555, "global_step": 69016, "epoch": 831} {"train_loss": -20.830808639526367, "global_step": 69017, "epoch": 831} {"train_loss": -20.418701171875, "global_step": 69018, "epoch": 831} {"train_loss": -20.44959259033203, "global_step": 69019, "epoch": 831} {"train_loss": -20.737897872924805, "global_step": 69020, "epoch": 831} {"train_loss": -20.756397247314453, "global_step": 69021, "epoch": 831} {"train_loss": -20.722402572631836, "global_step": 69022, "epoch": 831} {"train_loss": -21.178295135498047, "global_step": 69023, "epoch": 831} {"train_loss": -20.595932006835938, "global_step": 69024, "epoch": 831} {"train_loss": -20.76742172241211, "global_step": 69025, "epoch": 831} {"train_loss": -21.378034591674805, "global_step": 69026, "epoch": 831} {"train_loss": -20.5950927734375, "global_step": 69027, "epoch": 831} {"train_loss": -20.470701217651367, "global_step": 69028, "epoch": 831} {"train_loss": -20.617584228515625, "global_step": 69029, "epoch": 831} {"train_loss": -20.386571884155273, "global_step": 69030, "epoch": 831} {"train_loss": -20.494653701782227, "global_step": 69031, "epoch": 831} {"train_loss": -20.70834732055664, "global_step": 69032, "epoch": 831} {"train_loss": -20.868896484375, "global_step": 69033, "epoch": 831} {"train_loss": -20.738628387451172, "global_step": 69034, "epoch": 831} {"train_loss": -20.33407211303711, "global_step": 69035, "epoch": 831} {"train_loss": -20.851165771484375, "global_step": 69036, "epoch": 831} {"train_loss": -20.54955291748047, "global_step": 69037, "epoch": 831} {"train_loss": -20.46748924255371, "global_step": 69038, "epoch": 831} {"train_loss": -21.11236572265625, "global_step": 69039, "epoch": 831} {"train_loss": -20.193313598632812, "global_step": 69040, "epoch": 831} {"train_loss": -21.08403205871582, "global_step": 69041, "epoch": 831} {"train_loss": -20.852495193481445, "global_step": 69042, "epoch": 831} {"train_loss": -20.576650619506836, "global_step": 69043, "epoch": 831} {"train_loss": -20.800861358642578, "global_step": 69044, "epoch": 831} {"train_loss": -20.459747314453125, "global_step": 69045, "epoch": 831} {"train_loss": -20.722814559936523, "global_step": 69046, "epoch": 831} {"train_loss": -20.57672882080078, "global_step": 69047, "epoch": 831} {"train_loss": -20.6136531829834, "global_step": 69048, "epoch": 831} {"train_loss": -20.531299591064453, "global_step": 69049, "epoch": 831} {"train_loss": -20.789234161376953, "global_step": 69050, "epoch": 831} {"train_loss": -20.64884376525879, "global_step": 69051, "epoch": 831} {"train_loss": -20.857709884643555, "global_step": 69052, "epoch": 831} {"train_loss": -20.469751358032227, "global_step": 69053, "epoch": 831} {"train_loss": -20.63299560546875, "global_step": 69054, "epoch": 831} {"train_loss": -20.738310641553028, "global_step": 69055, "epoch": 831, "val_loss": 5877617.5} {"train_loss": -20.797616958618164, "global_step": 69056, "epoch": 832} {"train_loss": -20.554590225219727, "global_step": 69057, "epoch": 832} {"train_loss": -20.634777069091797, "global_step": 69058, "epoch": 832} {"train_loss": -20.576879501342773, "global_step": 69059, "epoch": 832} {"train_loss": -20.738662719726562, "global_step": 69060, "epoch": 832} {"train_loss": -20.7572078704834, "global_step": 69061, "epoch": 832} {"train_loss": -20.708995819091797, "global_step": 69062, "epoch": 832} {"train_loss": -20.841764450073242, "global_step": 69063, "epoch": 832} {"train_loss": -20.785627365112305, "global_step": 69064, "epoch": 832} {"train_loss": -20.620742797851562, "global_step": 69065, "epoch": 832} {"train_loss": -20.687589645385742, "global_step": 69066, "epoch": 832} {"train_loss": -20.718069076538086, "global_step": 69067, "epoch": 832} {"train_loss": -20.52952003479004, "global_step": 69068, "epoch": 832} {"train_loss": -20.50202751159668, "global_step": 69069, "epoch": 832} {"train_loss": -20.760086059570312, "global_step": 69070, "epoch": 832} {"train_loss": -20.784231185913086, "global_step": 69071, "epoch": 832} {"train_loss": -20.894027709960938, "global_step": 69072, "epoch": 832} {"train_loss": -20.64607810974121, "global_step": 69073, "epoch": 832} {"train_loss": -20.642301559448242, "global_step": 69074, "epoch": 832} {"train_loss": -21.179458618164062, "global_step": 69075, "epoch": 832} {"train_loss": -20.6378173828125, "global_step": 69076, "epoch": 832} {"train_loss": -20.472326278686523, "global_step": 69077, "epoch": 832} {"train_loss": -20.7780704498291, "global_step": 69078, "epoch": 832} {"train_loss": -20.974773406982422, "global_step": 69079, "epoch": 832} {"train_loss": -21.092985153198242, "global_step": 69080, "epoch": 832} {"train_loss": -20.8819637298584, "global_step": 69081, "epoch": 832} {"train_loss": -20.722715377807617, "global_step": 69082, "epoch": 832} {"train_loss": -20.92679214477539, "global_step": 69083, "epoch": 832} {"train_loss": -21.064062118530273, "global_step": 69084, "epoch": 832} {"train_loss": -20.742164611816406, "global_step": 69085, "epoch": 832} {"train_loss": -20.46378517150879, "global_step": 69086, "epoch": 832} {"train_loss": -20.932971954345703, "global_step": 69087, "epoch": 832} {"train_loss": -20.87689208984375, "global_step": 69088, "epoch": 832} {"train_loss": -20.573169708251953, "global_step": 69089, "epoch": 832} {"train_loss": -20.59209632873535, "global_step": 69090, "epoch": 832} {"train_loss": -20.744125366210938, "global_step": 69091, "epoch": 832} {"train_loss": -20.826337814331055, "global_step": 69092, "epoch": 832} {"train_loss": -20.613636016845703, "global_step": 69093, "epoch": 832} {"train_loss": -20.772106170654297, "global_step": 69094, "epoch": 832} {"train_loss": -20.907058715820312, "global_step": 69095, "epoch": 832} {"train_loss": -20.645498275756836, "global_step": 69096, "epoch": 832} {"train_loss": -21.06886863708496, "global_step": 69097, "epoch": 832} {"train_loss": -20.700071334838867, "global_step": 69098, "epoch": 832} {"train_loss": -20.82788848876953, "global_step": 69099, "epoch": 832} {"train_loss": -20.354516983032227, "global_step": 69100, "epoch": 832} {"train_loss": -20.49751091003418, "global_step": 69101, "epoch": 832} {"train_loss": -21.20821189880371, "global_step": 69102, "epoch": 832} {"train_loss": -20.785476684570312, "global_step": 69103, "epoch": 832} {"train_loss": -20.97964859008789, "global_step": 69104, "epoch": 832} {"train_loss": -20.850248336791992, "global_step": 69105, "epoch": 832} {"train_loss": -20.50373649597168, "global_step": 69106, "epoch": 832} {"train_loss": -20.937299728393555, "global_step": 69107, "epoch": 832} {"train_loss": -20.700956344604492, "global_step": 69108, "epoch": 832} {"train_loss": -20.658218383789062, "global_step": 69109, "epoch": 832} {"train_loss": -20.714628219604492, "global_step": 69110, "epoch": 832} {"train_loss": -20.69476318359375, "global_step": 69111, "epoch": 832} {"train_loss": -20.948108673095703, "global_step": 69112, "epoch": 832} {"train_loss": -21.050575256347656, "global_step": 69113, "epoch": 832} {"train_loss": -20.53737449645996, "global_step": 69114, "epoch": 832} {"train_loss": -20.712112426757812, "global_step": 69115, "epoch": 832} {"train_loss": -20.52205467224121, "global_step": 69116, "epoch": 832} {"train_loss": -20.932607650756836, "global_step": 69117, "epoch": 832} {"train_loss": -20.848453521728516, "global_step": 69118, "epoch": 832} {"train_loss": -20.767210006713867, "global_step": 69119, "epoch": 832} {"train_loss": -20.563688278198242, "global_step": 69120, "epoch": 832} {"train_loss": -20.992889404296875, "global_step": 69121, "epoch": 832} {"train_loss": -20.731002807617188, "global_step": 69122, "epoch": 832} {"train_loss": -20.5532169342041, "global_step": 69123, "epoch": 832} {"train_loss": -20.95083999633789, "global_step": 69124, "epoch": 832} {"train_loss": -21.019689559936523, "global_step": 69125, "epoch": 832} {"train_loss": -21.090688705444336, "global_step": 69126, "epoch": 832} {"train_loss": -20.856201171875, "global_step": 69127, "epoch": 832} {"train_loss": -20.942251205444336, "global_step": 69128, "epoch": 832} {"train_loss": -20.55600357055664, "global_step": 69129, "epoch": 832} {"train_loss": -20.8114013671875, "global_step": 69130, "epoch": 832} {"train_loss": -20.712310791015625, "global_step": 69131, "epoch": 832} {"train_loss": -20.594772338867188, "global_step": 69132, "epoch": 832} {"train_loss": -20.839902877807617, "global_step": 69133, "epoch": 832} {"train_loss": -20.837766647338867, "global_step": 69134, "epoch": 832} {"train_loss": -20.60866355895996, "global_step": 69135, "epoch": 832} {"train_loss": -20.824695587158203, "global_step": 69136, "epoch": 832} {"train_loss": -20.50860023498535, "global_step": 69137, "epoch": 832} {"train_loss": -20.750027920826373, "global_step": 69138, "epoch": 832, "val_loss": 6010366.0} {"train_loss": -20.412830352783203, "global_step": 69139, "epoch": 833} {"train_loss": -20.71996307373047, "global_step": 69140, "epoch": 833} {"train_loss": -20.5578556060791, "global_step": 69141, "epoch": 833} {"train_loss": -20.632062911987305, "global_step": 69142, "epoch": 833} {"train_loss": -20.449588775634766, "global_step": 69143, "epoch": 833} {"train_loss": -20.721731185913086, "global_step": 69144, "epoch": 833} {"train_loss": -20.64302635192871, "global_step": 69145, "epoch": 833} {"train_loss": -20.720932006835938, "global_step": 69146, "epoch": 833} {"train_loss": -20.338239669799805, "global_step": 69147, "epoch": 833} {"train_loss": -20.71427345275879, "global_step": 69148, "epoch": 833} {"train_loss": -20.78474235534668, "global_step": 69149, "epoch": 833} {"train_loss": -20.6312198638916, "global_step": 69150, "epoch": 833} {"train_loss": -20.6241512298584, "global_step": 69151, "epoch": 833} {"train_loss": -20.8930606842041, "global_step": 69152, "epoch": 833} {"train_loss": -20.989471435546875, "global_step": 69153, "epoch": 833} {"train_loss": -20.300607681274414, "global_step": 69154, "epoch": 833} {"train_loss": -21.09537124633789, "global_step": 69155, "epoch": 833} {"train_loss": -20.473039627075195, "global_step": 69156, "epoch": 833} {"train_loss": -20.54433250427246, "global_step": 69157, "epoch": 833} {"train_loss": -20.658851623535156, "global_step": 69158, "epoch": 833} {"train_loss": -20.704843521118164, "global_step": 69159, "epoch": 833} {"train_loss": -20.832124710083008, "global_step": 69160, "epoch": 833} {"train_loss": -20.704496383666992, "global_step": 69161, "epoch": 833} {"train_loss": -20.558847427368164, "global_step": 69162, "epoch": 833} {"train_loss": -20.791046142578125, "global_step": 69163, "epoch": 833} {"train_loss": -20.754261016845703, "global_step": 69164, "epoch": 833} {"train_loss": -20.582324981689453, "global_step": 69165, "epoch": 833} {"train_loss": -20.80078125, "global_step": 69166, "epoch": 833} {"train_loss": -21.077716827392578, "global_step": 69167, "epoch": 833} {"train_loss": -20.86277961730957, "global_step": 69168, "epoch": 833} {"train_loss": -21.067649841308594, "global_step": 69169, "epoch": 833} {"train_loss": -20.723966598510742, "global_step": 69170, "epoch": 833} {"train_loss": -21.082151412963867, "global_step": 69171, "epoch": 833} {"train_loss": -20.81561279296875, "global_step": 69172, "epoch": 833} {"train_loss": -20.61027717590332, "global_step": 69173, "epoch": 833} {"train_loss": -21.154071807861328, "global_step": 69174, "epoch": 833} {"train_loss": -21.02090835571289, "global_step": 69175, "epoch": 833} {"train_loss": -20.58720588684082, "global_step": 69176, "epoch": 833} {"train_loss": -20.509571075439453, "global_step": 69177, "epoch": 833} {"train_loss": -20.899368286132812, "global_step": 69178, "epoch": 833} {"train_loss": -20.904653549194336, "global_step": 69179, "epoch": 833} {"train_loss": -20.739212036132812, "global_step": 69180, "epoch": 833} {"train_loss": -20.726003646850586, "global_step": 69181, "epoch": 833} {"train_loss": -20.807798385620117, "global_step": 69182, "epoch": 833} {"train_loss": -20.911914825439453, "global_step": 69183, "epoch": 833} {"train_loss": -20.314598083496094, "global_step": 69184, "epoch": 833} {"train_loss": -20.766735076904297, "global_step": 69185, "epoch": 833} {"train_loss": -20.525480270385742, "global_step": 69186, "epoch": 833} {"train_loss": -20.840686798095703, "global_step": 69187, "epoch": 833} {"train_loss": -20.601810455322266, "global_step": 69188, "epoch": 833} {"train_loss": -20.547025680541992, "global_step": 69189, "epoch": 833} {"train_loss": -20.979642868041992, "global_step": 69190, "epoch": 833} {"train_loss": -20.848600387573242, "global_step": 69191, "epoch": 833} {"train_loss": -20.91287612915039, "global_step": 69192, "epoch": 833} {"train_loss": -20.945051193237305, "global_step": 69193, "epoch": 833} {"train_loss": -21.200347900390625, "global_step": 69194, "epoch": 833} {"train_loss": -20.5400447845459, "global_step": 69195, "epoch": 833} {"train_loss": -20.860593795776367, "global_step": 69196, "epoch": 833} {"train_loss": -20.968017578125, "global_step": 69197, "epoch": 833} {"train_loss": -20.954206466674805, "global_step": 69198, "epoch": 833} {"train_loss": -20.714895248413086, "global_step": 69199, "epoch": 833} {"train_loss": -20.729413986206055, "global_step": 69200, "epoch": 833} {"train_loss": -20.858617782592773, "global_step": 69201, "epoch": 833} {"train_loss": -21.05100440979004, "global_step": 69202, "epoch": 833} {"train_loss": -21.11579704284668, "global_step": 69203, "epoch": 833} {"train_loss": -20.692764282226562, "global_step": 69204, "epoch": 833} {"train_loss": -21.024198532104492, "global_step": 69205, "epoch": 833} {"train_loss": -20.62684440612793, "global_step": 69206, "epoch": 833} {"train_loss": -20.7031307220459, "global_step": 69207, "epoch": 833} {"train_loss": -20.73060417175293, "global_step": 69208, "epoch": 833} {"train_loss": -20.752744674682617, "global_step": 69209, "epoch": 833} {"train_loss": -21.048622131347656, "global_step": 69210, "epoch": 833} {"train_loss": -21.066415786743164, "global_step": 69211, "epoch": 833} {"train_loss": -21.204198837280273, "global_step": 69212, "epoch": 833} {"train_loss": -20.674915313720703, "global_step": 69213, "epoch": 833} {"train_loss": -20.614526748657227, "global_step": 69214, "epoch": 833} {"train_loss": -20.7714900970459, "global_step": 69215, "epoch": 833} {"train_loss": -20.640836715698242, "global_step": 69216, "epoch": 833} {"train_loss": -20.86799430847168, "global_step": 69217, "epoch": 833} {"train_loss": -21.037748336791992, "global_step": 69218, "epoch": 833} {"train_loss": -21.05011749267578, "global_step": 69219, "epoch": 833} {"train_loss": -20.77065086364746, "global_step": 69220, "epoch": 833} {"train_loss": -20.773150731282062, "global_step": 69221, "epoch": 833, "val_loss": 5992107.0} {"train_loss": -20.22114372253418, "global_step": 69222, "epoch": 834} {"train_loss": -20.20949363708496, "global_step": 69223, "epoch": 834} {"train_loss": -20.361204147338867, "global_step": 69224, "epoch": 834} {"train_loss": -20.234678268432617, "global_step": 69225, "epoch": 834} {"train_loss": -20.174571990966797, "global_step": 69226, "epoch": 834} {"train_loss": -20.6265926361084, "global_step": 69227, "epoch": 834} {"train_loss": -20.515644073486328, "global_step": 69228, "epoch": 834} {"train_loss": -20.579957962036133, "global_step": 69229, "epoch": 834} {"train_loss": -20.110275268554688, "global_step": 69230, "epoch": 834} {"train_loss": -20.42567253112793, "global_step": 69231, "epoch": 834} {"train_loss": -19.626829147338867, "global_step": 69232, "epoch": 834} {"train_loss": -20.34381675720215, "global_step": 69233, "epoch": 834} {"train_loss": -20.05206298828125, "global_step": 69234, "epoch": 834} {"train_loss": -20.416362762451172, "global_step": 69235, "epoch": 834} {"train_loss": -20.464567184448242, "global_step": 69236, "epoch": 834} {"train_loss": -20.555749893188477, "global_step": 69237, "epoch": 834} {"train_loss": -20.470685958862305, "global_step": 69238, "epoch": 834} {"train_loss": -20.3022518157959, "global_step": 69239, "epoch": 834} {"train_loss": -20.72342300415039, "global_step": 69240, "epoch": 834} {"train_loss": -20.611791610717773, "global_step": 69241, "epoch": 834} {"train_loss": -20.525409698486328, "global_step": 69242, "epoch": 834} {"train_loss": -20.229631423950195, "global_step": 69243, "epoch": 834} {"train_loss": -20.522714614868164, "global_step": 69244, "epoch": 834} {"train_loss": -20.561330795288086, "global_step": 69245, "epoch": 834} {"train_loss": -20.853342056274414, "global_step": 69246, "epoch": 834} {"train_loss": -20.410404205322266, "global_step": 69247, "epoch": 834} {"train_loss": -20.787410736083984, "global_step": 69248, "epoch": 834} {"train_loss": -20.91513442993164, "global_step": 69249, "epoch": 834} {"train_loss": -21.128141403198242, "global_step": 69250, "epoch": 834} {"train_loss": -20.837827682495117, "global_step": 69251, "epoch": 834} {"train_loss": -20.92268943786621, "global_step": 69252, "epoch": 834} {"train_loss": -20.45997428894043, "global_step": 69253, "epoch": 834} {"train_loss": -20.771808624267578, "global_step": 69254, "epoch": 834} {"train_loss": -20.735889434814453, "global_step": 69255, "epoch": 834} {"train_loss": -20.888477325439453, "global_step": 69256, "epoch": 834} {"train_loss": -20.339895248413086, "global_step": 69257, "epoch": 834} {"train_loss": -20.92958641052246, "global_step": 69258, "epoch": 834} {"train_loss": -21.040414810180664, "global_step": 69259, "epoch": 834} {"train_loss": -20.735776901245117, "global_step": 69260, "epoch": 834} {"train_loss": -20.850400924682617, "global_step": 69261, "epoch": 834} {"train_loss": -21.112314224243164, "global_step": 69262, "epoch": 834} {"train_loss": -20.70926284790039, "global_step": 69263, "epoch": 834} {"train_loss": -20.76462745666504, "global_step": 69264, "epoch": 834} {"train_loss": -20.3416690826416, "global_step": 69265, "epoch": 834} {"train_loss": -20.827329635620117, "global_step": 69266, "epoch": 834} {"train_loss": -20.862607955932617, "global_step": 69267, "epoch": 834} {"train_loss": -20.687528610229492, "global_step": 69268, "epoch": 834} {"train_loss": -20.60219955444336, "global_step": 69269, "epoch": 834} {"train_loss": -20.589597702026367, "global_step": 69270, "epoch": 834} {"train_loss": -21.04087257385254, "global_step": 69271, "epoch": 834} {"train_loss": -20.457080841064453, "global_step": 69272, "epoch": 834} {"train_loss": -20.379465103149414, "global_step": 69273, "epoch": 834} {"train_loss": -20.58622169494629, "global_step": 69274, "epoch": 834} {"train_loss": -20.615568161010742, "global_step": 69275, "epoch": 834} {"train_loss": -20.654693603515625, "global_step": 69276, "epoch": 834} {"train_loss": -20.35483169555664, "global_step": 69277, "epoch": 834} {"train_loss": -20.47040367126465, "global_step": 69278, "epoch": 834} {"train_loss": -20.806642532348633, "global_step": 69279, "epoch": 834} {"train_loss": -20.529394149780273, "global_step": 69280, "epoch": 834} {"train_loss": -20.804719924926758, "global_step": 69281, "epoch": 834} {"train_loss": -20.576751708984375, "global_step": 69282, "epoch": 834} {"train_loss": -20.58774757385254, "global_step": 69283, "epoch": 834} {"train_loss": -20.639698028564453, "global_step": 69284, "epoch": 834} {"train_loss": -20.686349868774414, "global_step": 69285, "epoch": 834} {"train_loss": -20.738035202026367, "global_step": 69286, "epoch": 834} {"train_loss": -20.61874771118164, "global_step": 69287, "epoch": 834} {"train_loss": -20.768844604492188, "global_step": 69288, "epoch": 834} {"train_loss": -20.960058212280273, "global_step": 69289, "epoch": 834} {"train_loss": -20.905502319335938, "global_step": 69290, "epoch": 834} {"train_loss": -21.031543731689453, "global_step": 69291, "epoch": 834} {"train_loss": -20.5324764251709, "global_step": 69292, "epoch": 834} {"train_loss": -20.916501998901367, "global_step": 69293, "epoch": 834} {"train_loss": -20.92298698425293, "global_step": 69294, "epoch": 834} {"train_loss": -20.900842666625977, "global_step": 69295, "epoch": 834} {"train_loss": -21.11301612854004, "global_step": 69296, "epoch": 834} {"train_loss": -20.760395050048828, "global_step": 69297, "epoch": 834} {"train_loss": -21.013423919677734, "global_step": 69298, "epoch": 834} {"train_loss": -21.187366485595703, "global_step": 69299, "epoch": 834} {"train_loss": -20.671955108642578, "global_step": 69300, "epoch": 834} {"train_loss": -20.950748443603516, "global_step": 69301, "epoch": 834} {"train_loss": -20.915287017822266, "global_step": 69302, "epoch": 834} {"train_loss": -20.854700088500977, "global_step": 69303, "epoch": 834} {"train_loss": -20.637486859976526, "global_step": 69304, "epoch": 834, "val_loss": 6003235.0} {"train_loss": -20.31842041015625, "global_step": 69305, "epoch": 835} {"train_loss": -20.107389450073242, "global_step": 69306, "epoch": 835} {"train_loss": -20.885663986206055, "global_step": 69307, "epoch": 835} {"train_loss": -20.148427963256836, "global_step": 69308, "epoch": 835} {"train_loss": -20.57979965209961, "global_step": 69309, "epoch": 835} {"train_loss": -20.396623611450195, "global_step": 69310, "epoch": 835} {"train_loss": -20.3668270111084, "global_step": 69311, "epoch": 835} {"train_loss": -20.591283798217773, "global_step": 69312, "epoch": 835} {"train_loss": -20.378164291381836, "global_step": 69313, "epoch": 835} {"train_loss": -20.515899658203125, "global_step": 69314, "epoch": 835} {"train_loss": -20.8519287109375, "global_step": 69315, "epoch": 835} {"train_loss": -20.599882125854492, "global_step": 69316, "epoch": 835} {"train_loss": -20.979276657104492, "global_step": 69317, "epoch": 835} {"train_loss": -20.620290756225586, "global_step": 69318, "epoch": 835} {"train_loss": -20.3403263092041, "global_step": 69319, "epoch": 835} {"train_loss": -20.79628562927246, "global_step": 69320, "epoch": 835} {"train_loss": -20.739866256713867, "global_step": 69321, "epoch": 835} {"train_loss": -20.46993064880371, "global_step": 69322, "epoch": 835} {"train_loss": -20.798063278198242, "global_step": 69323, "epoch": 835} {"train_loss": -20.91382598876953, "global_step": 69324, "epoch": 835} {"train_loss": -20.92986488342285, "global_step": 69325, "epoch": 835} {"train_loss": -20.6834716796875, "global_step": 69326, "epoch": 835} {"train_loss": -20.697193145751953, "global_step": 69327, "epoch": 835} {"train_loss": -20.673778533935547, "global_step": 69328, "epoch": 835} {"train_loss": -20.26711082458496, "global_step": 69329, "epoch": 835} {"train_loss": -20.705665588378906, "global_step": 69330, "epoch": 835} {"train_loss": -20.824201583862305, "global_step": 69331, "epoch": 835} {"train_loss": -20.540327072143555, "global_step": 69332, "epoch": 835} {"train_loss": -20.54859733581543, "global_step": 69333, "epoch": 835} {"train_loss": -20.536577224731445, "global_step": 69334, "epoch": 835} {"train_loss": -20.635915756225586, "global_step": 69335, "epoch": 835} {"train_loss": -20.77788734436035, "global_step": 69336, "epoch": 835} {"train_loss": -20.53785514831543, "global_step": 69337, "epoch": 835} {"train_loss": -20.490276336669922, "global_step": 69338, "epoch": 835} {"train_loss": -20.851428985595703, "global_step": 69339, "epoch": 835} {"train_loss": -20.740224838256836, "global_step": 69340, "epoch": 835} {"train_loss": -20.669340133666992, "global_step": 69341, "epoch": 835} {"train_loss": -20.730865478515625, "global_step": 69342, "epoch": 835} {"train_loss": -20.844532012939453, "global_step": 69343, "epoch": 835} {"train_loss": -20.7330322265625, "global_step": 69344, "epoch": 835} {"train_loss": -20.77316665649414, "global_step": 69345, "epoch": 835} {"train_loss": -20.281108856201172, "global_step": 69346, "epoch": 835} {"train_loss": -20.634334564208984, "global_step": 69347, "epoch": 835} {"train_loss": -21.055316925048828, "global_step": 69348, "epoch": 835} {"train_loss": -20.462539672851562, "global_step": 69349, "epoch": 835} {"train_loss": -20.862504959106445, "global_step": 69350, "epoch": 835} {"train_loss": -20.483144760131836, "global_step": 69351, "epoch": 835} {"train_loss": -20.430822372436523, "global_step": 69352, "epoch": 835} {"train_loss": -20.716154098510742, "global_step": 69353, "epoch": 835} {"train_loss": -20.781164169311523, "global_step": 69354, "epoch": 835} {"train_loss": -20.506948471069336, "global_step": 69355, "epoch": 835} {"train_loss": -20.641748428344727, "global_step": 69356, "epoch": 835} {"train_loss": -20.665023803710938, "global_step": 69357, "epoch": 835} {"train_loss": -20.87384605407715, "global_step": 69358, "epoch": 835} {"train_loss": -20.887548446655273, "global_step": 69359, "epoch": 835} {"train_loss": -20.575572967529297, "global_step": 69360, "epoch": 835} {"train_loss": -20.881519317626953, "global_step": 69361, "epoch": 835} {"train_loss": -20.88702964782715, "global_step": 69362, "epoch": 835} {"train_loss": -20.996749877929688, "global_step": 69363, "epoch": 835} {"train_loss": -20.879776000976562, "global_step": 69364, "epoch": 835} {"train_loss": -20.670114517211914, "global_step": 69365, "epoch": 835} {"train_loss": -20.895166397094727, "global_step": 69366, "epoch": 835} {"train_loss": -20.728391647338867, "global_step": 69367, "epoch": 835} {"train_loss": -20.866455078125, "global_step": 69368, "epoch": 835} {"train_loss": -21.005170822143555, "global_step": 69369, "epoch": 835} {"train_loss": -20.93889617919922, "global_step": 69370, "epoch": 835} {"train_loss": -20.885669708251953, "global_step": 69371, "epoch": 835} {"train_loss": -21.100008010864258, "global_step": 69372, "epoch": 835} {"train_loss": -20.735464096069336, "global_step": 69373, "epoch": 835} {"train_loss": -21.107580184936523, "global_step": 69374, "epoch": 835} {"train_loss": -20.77910614013672, "global_step": 69375, "epoch": 835} {"train_loss": -20.69569969177246, "global_step": 69376, "epoch": 835} {"train_loss": -20.757022857666016, "global_step": 69377, "epoch": 835} {"train_loss": -21.046142578125, "global_step": 69378, "epoch": 835} {"train_loss": -20.701162338256836, "global_step": 69379, "epoch": 835} {"train_loss": -21.053083419799805, "global_step": 69380, "epoch": 835} {"train_loss": -20.664154052734375, "global_step": 69381, "epoch": 835} {"train_loss": -20.810012817382812, "global_step": 69382, "epoch": 835} {"train_loss": -20.72196388244629, "global_step": 69383, "epoch": 835} {"train_loss": -20.93506622314453, "global_step": 69384, "epoch": 835} {"train_loss": -20.62919044494629, "global_step": 69385, "epoch": 835} {"train_loss": -21.3710994720459, "global_step": 69386, "epoch": 835} {"train_loss": -20.70319479057588, "global_step": 69387, "epoch": 835, "val_loss": 5975318.5} {"train_loss": -20.731483459472656, "global_step": 69388, "epoch": 836} {"train_loss": -20.646923065185547, "global_step": 69389, "epoch": 836} {"train_loss": -20.42548179626465, "global_step": 69390, "epoch": 836} {"train_loss": -20.84187889099121, "global_step": 69391, "epoch": 836} {"train_loss": -20.681379318237305, "global_step": 69392, "epoch": 836} {"train_loss": -20.706388473510742, "global_step": 69393, "epoch": 836} {"train_loss": -20.460468292236328, "global_step": 69394, "epoch": 836} {"train_loss": -20.653766632080078, "global_step": 69395, "epoch": 836} {"train_loss": -20.7014217376709, "global_step": 69396, "epoch": 836} {"train_loss": -20.973867416381836, "global_step": 69397, "epoch": 836} {"train_loss": -20.915348052978516, "global_step": 69398, "epoch": 836} {"train_loss": -20.526582717895508, "global_step": 69399, "epoch": 836} {"train_loss": -20.760669708251953, "global_step": 69400, "epoch": 836} {"train_loss": -20.217437744140625, "global_step": 69401, "epoch": 836} {"train_loss": -20.63508415222168, "global_step": 69402, "epoch": 836} {"train_loss": -20.735809326171875, "global_step": 69403, "epoch": 836} {"train_loss": -21.127607345581055, "global_step": 69404, "epoch": 836} {"train_loss": -20.527175903320312, "global_step": 69405, "epoch": 836} {"train_loss": -20.75341033935547, "global_step": 69406, "epoch": 836} {"train_loss": -20.39409828186035, "global_step": 69407, "epoch": 836} {"train_loss": -21.10565757751465, "global_step": 69408, "epoch": 836} {"train_loss": -20.945497512817383, "global_step": 69409, "epoch": 836} {"train_loss": -20.953662872314453, "global_step": 69410, "epoch": 836} {"train_loss": -20.348735809326172, "global_step": 69411, "epoch": 836} {"train_loss": -20.8204402923584, "global_step": 69412, "epoch": 836} {"train_loss": -20.839506149291992, "global_step": 69413, "epoch": 836} {"train_loss": -21.130247116088867, "global_step": 69414, "epoch": 836} {"train_loss": -20.686813354492188, "global_step": 69415, "epoch": 836} {"train_loss": -20.84220314025879, "global_step": 69416, "epoch": 836} {"train_loss": -20.693540573120117, "global_step": 69417, "epoch": 836} {"train_loss": -21.025400161743164, "global_step": 69418, "epoch": 836} {"train_loss": -20.919538497924805, "global_step": 69419, "epoch": 836} {"train_loss": -21.320341110229492, "global_step": 69420, "epoch": 836} {"train_loss": -20.40999412536621, "global_step": 69421, "epoch": 836} {"train_loss": -20.414953231811523, "global_step": 69422, "epoch": 836} {"train_loss": -20.82826805114746, "global_step": 69423, "epoch": 836} {"train_loss": -20.747095108032227, "global_step": 69424, "epoch": 836} {"train_loss": -20.697145462036133, "global_step": 69425, "epoch": 836} {"train_loss": -20.78765869140625, "global_step": 69426, "epoch": 836} {"train_loss": -20.753860473632812, "global_step": 69427, "epoch": 836} {"train_loss": -20.8020076751709, "global_step": 69428, "epoch": 836} {"train_loss": -21.011627197265625, "global_step": 69429, "epoch": 836} {"train_loss": -20.854455947875977, "global_step": 69430, "epoch": 836} {"train_loss": -20.622121810913086, "global_step": 69431, "epoch": 836} {"train_loss": -20.654346466064453, "global_step": 69432, "epoch": 836} {"train_loss": -20.838598251342773, "global_step": 69433, "epoch": 836} {"train_loss": -20.85293197631836, "global_step": 69434, "epoch": 836} {"train_loss": -20.80094337463379, "global_step": 69435, "epoch": 836} {"train_loss": -20.911733627319336, "global_step": 69436, "epoch": 836} {"train_loss": -21.090415954589844, "global_step": 69437, "epoch": 836} {"train_loss": -20.639713287353516, "global_step": 69438, "epoch": 836} {"train_loss": -20.707300186157227, "global_step": 69439, "epoch": 836} {"train_loss": -20.89938735961914, "global_step": 69440, "epoch": 836} {"train_loss": -20.815319061279297, "global_step": 69441, "epoch": 836} {"train_loss": -21.104047775268555, "global_step": 69442, "epoch": 836} {"train_loss": -20.646249771118164, "global_step": 69443, "epoch": 836} {"train_loss": -20.811368942260742, "global_step": 69444, "epoch": 836} {"train_loss": -20.62485122680664, "global_step": 69445, "epoch": 836} {"train_loss": -20.88055419921875, "global_step": 69446, "epoch": 836} {"train_loss": -21.065876007080078, "global_step": 69447, "epoch": 836} {"train_loss": -20.954456329345703, "global_step": 69448, "epoch": 836} {"train_loss": -20.556562423706055, "global_step": 69449, "epoch": 836} {"train_loss": -20.654348373413086, "global_step": 69450, "epoch": 836} {"train_loss": -20.7860164642334, "global_step": 69451, "epoch": 836} {"train_loss": -20.600065231323242, "global_step": 69452, "epoch": 836} {"train_loss": -20.822399139404297, "global_step": 69453, "epoch": 836} {"train_loss": -21.05978012084961, "global_step": 69454, "epoch": 836} {"train_loss": -20.82982063293457, "global_step": 69455, "epoch": 836} {"train_loss": -20.85804557800293, "global_step": 69456, "epoch": 836} {"train_loss": -21.157047271728516, "global_step": 69457, "epoch": 836} {"train_loss": -20.725021362304688, "global_step": 69458, "epoch": 836} {"train_loss": -20.80299949645996, "global_step": 69459, "epoch": 836} {"train_loss": -20.706632614135742, "global_step": 69460, "epoch": 836} {"train_loss": -20.796613693237305, "global_step": 69461, "epoch": 836} {"train_loss": -20.833248138427734, "global_step": 69462, "epoch": 836} {"train_loss": -20.6905574798584, "global_step": 69463, "epoch": 836} {"train_loss": -21.007558822631836, "global_step": 69464, "epoch": 836} {"train_loss": -20.669675827026367, "global_step": 69465, "epoch": 836} {"train_loss": -20.493860244750977, "global_step": 69466, "epoch": 836} {"train_loss": -20.714059829711914, "global_step": 69467, "epoch": 836} {"train_loss": -20.637653350830078, "global_step": 69468, "epoch": 836} {"train_loss": -20.870298385620117, "global_step": 69469, "epoch": 836} {"train_loss": -20.76728664536074, "global_step": 69470, "epoch": 836, "val_loss": 6068720.0} {"train_loss": -20.594867706298828, "global_step": 69471, "epoch": 837} {"train_loss": -20.644399642944336, "global_step": 69472, "epoch": 837} {"train_loss": -20.513166427612305, "global_step": 69473, "epoch": 837} {"train_loss": -20.963430404663086, "global_step": 69474, "epoch": 837} {"train_loss": -20.789587020874023, "global_step": 69475, "epoch": 837} {"train_loss": -20.87105369567871, "global_step": 69476, "epoch": 837} {"train_loss": -21.005598068237305, "global_step": 69477, "epoch": 837} {"train_loss": -20.368249893188477, "global_step": 69478, "epoch": 837} {"train_loss": -20.437759399414062, "global_step": 69479, "epoch": 837} {"train_loss": -20.973922729492188, "global_step": 69480, "epoch": 837} {"train_loss": -20.735990524291992, "global_step": 69481, "epoch": 837} {"train_loss": -20.491750717163086, "global_step": 69482, "epoch": 837} {"train_loss": -20.747756958007812, "global_step": 69483, "epoch": 837} {"train_loss": -20.672271728515625, "global_step": 69484, "epoch": 837} {"train_loss": -20.8271541595459, "global_step": 69485, "epoch": 837} {"train_loss": -20.570316314697266, "global_step": 69486, "epoch": 837} {"train_loss": -20.69771385192871, "global_step": 69487, "epoch": 837} {"train_loss": -20.75127410888672, "global_step": 69488, "epoch": 837} {"train_loss": -20.880935668945312, "global_step": 69489, "epoch": 837} {"train_loss": -21.137266159057617, "global_step": 69490, "epoch": 837} {"train_loss": -20.837427139282227, "global_step": 69491, "epoch": 837} {"train_loss": -21.055484771728516, "global_step": 69492, "epoch": 837} {"train_loss": -21.00586700439453, "global_step": 69493, "epoch": 837} {"train_loss": -20.951194763183594, "global_step": 69494, "epoch": 837} {"train_loss": -20.6063289642334, "global_step": 69495, "epoch": 837} {"train_loss": -20.892858505249023, "global_step": 69496, "epoch": 837} {"train_loss": -20.945316314697266, "global_step": 69497, "epoch": 837} {"train_loss": -20.72892189025879, "global_step": 69498, "epoch": 837} {"train_loss": -20.831531524658203, "global_step": 69499, "epoch": 837} {"train_loss": -20.893051147460938, "global_step": 69500, "epoch": 837} {"train_loss": -20.712995529174805, "global_step": 69501, "epoch": 837} {"train_loss": -20.825597763061523, "global_step": 69502, "epoch": 837} {"train_loss": -21.13395881652832, "global_step": 69503, "epoch": 837} {"train_loss": -20.695968627929688, "global_step": 69504, "epoch": 837} {"train_loss": -21.128549575805664, "global_step": 69505, "epoch": 837} {"train_loss": -20.834598541259766, "global_step": 69506, "epoch": 837} {"train_loss": -21.048917770385742, "global_step": 69507, "epoch": 837} {"train_loss": -20.920135498046875, "global_step": 69508, "epoch": 837} {"train_loss": -20.328678131103516, "global_step": 69509, "epoch": 837} {"train_loss": -20.852277755737305, "global_step": 69510, "epoch": 837} {"train_loss": -20.6984806060791, "global_step": 69511, "epoch": 837} {"train_loss": -20.818408966064453, "global_step": 69512, "epoch": 837} {"train_loss": -20.64832878112793, "global_step": 69513, "epoch": 837} {"train_loss": -21.189207077026367, "global_step": 69514, "epoch": 837} {"train_loss": -21.210399627685547, "global_step": 69515, "epoch": 837} {"train_loss": -20.839279174804688, "global_step": 69516, "epoch": 837} {"train_loss": -20.927616119384766, "global_step": 69517, "epoch": 837} {"train_loss": -20.527734756469727, "global_step": 69518, "epoch": 837} {"train_loss": -20.753402709960938, "global_step": 69519, "epoch": 837} {"train_loss": -20.675613403320312, "global_step": 69520, "epoch": 837} {"train_loss": -20.708749771118164, "global_step": 69521, "epoch": 837} {"train_loss": -21.10744285583496, "global_step": 69522, "epoch": 837} {"train_loss": -20.67043113708496, "global_step": 69523, "epoch": 837} {"train_loss": -21.01858901977539, "global_step": 69524, "epoch": 837} {"train_loss": -20.6237850189209, "global_step": 69525, "epoch": 837} {"train_loss": -21.134336471557617, "global_step": 69526, "epoch": 837} {"train_loss": -20.8732967376709, "global_step": 69527, "epoch": 837} {"train_loss": -20.70442771911621, "global_step": 69528, "epoch": 837} {"train_loss": -20.693716049194336, "global_step": 69529, "epoch": 837} {"train_loss": -20.663480758666992, "global_step": 69530, "epoch": 837} {"train_loss": -21.114933013916016, "global_step": 69531, "epoch": 837} {"train_loss": -20.714691162109375, "global_step": 69532, "epoch": 837} {"train_loss": -20.743864059448242, "global_step": 69533, "epoch": 837} {"train_loss": -20.694931030273438, "global_step": 69534, "epoch": 837} {"train_loss": -20.58794403076172, "global_step": 69535, "epoch": 837} {"train_loss": -21.070453643798828, "global_step": 69536, "epoch": 837} {"train_loss": -20.477338790893555, "global_step": 69537, "epoch": 837} {"train_loss": -20.70181655883789, "global_step": 69538, "epoch": 837} {"train_loss": -20.887836456298828, "global_step": 69539, "epoch": 837} {"train_loss": -21.038129806518555, "global_step": 69540, "epoch": 837} {"train_loss": -20.6762638092041, "global_step": 69541, "epoch": 837} {"train_loss": -20.692060470581055, "global_step": 69542, "epoch": 837} {"train_loss": -20.882932662963867, "global_step": 69543, "epoch": 837} {"train_loss": -20.58735466003418, "global_step": 69544, "epoch": 837} {"train_loss": -20.58579444885254, "global_step": 69545, "epoch": 837} {"train_loss": -20.90229606628418, "global_step": 69546, "epoch": 837} {"train_loss": -20.509199142456055, "global_step": 69547, "epoch": 837} {"train_loss": -20.873483657836914, "global_step": 69548, "epoch": 837} {"train_loss": -20.723388671875, "global_step": 69549, "epoch": 837} {"train_loss": -20.873600006103516, "global_step": 69550, "epoch": 837} {"train_loss": -20.774255752563477, "global_step": 69551, "epoch": 837} {"train_loss": -20.688831329345703, "global_step": 69552, "epoch": 837} {"train_loss": -20.793897651764283, "global_step": 69553, "epoch": 837, "val_loss": 6087278.0} {"train_loss": -20.274612426757812, "global_step": 69554, "epoch": 838} {"train_loss": -20.384796142578125, "global_step": 69555, "epoch": 838} {"train_loss": -20.842599868774414, "global_step": 69556, "epoch": 838} {"train_loss": -20.63587760925293, "global_step": 69557, "epoch": 838} {"train_loss": -20.820730209350586, "global_step": 69558, "epoch": 838} {"train_loss": -20.60369300842285, "global_step": 69559, "epoch": 838} {"train_loss": -20.7636775970459, "global_step": 69560, "epoch": 838} {"train_loss": -20.375133514404297, "global_step": 69561, "epoch": 838} {"train_loss": -20.828184127807617, "global_step": 69562, "epoch": 838} {"train_loss": -20.868148803710938, "global_step": 69563, "epoch": 838} {"train_loss": -20.400924682617188, "global_step": 69564, "epoch": 838} {"train_loss": -20.555389404296875, "global_step": 69565, "epoch": 838} {"train_loss": -20.65452766418457, "global_step": 69566, "epoch": 838} {"train_loss": -20.63368797302246, "global_step": 69567, "epoch": 838} {"train_loss": -20.455846786499023, "global_step": 69568, "epoch": 838} {"train_loss": -21.020004272460938, "global_step": 69569, "epoch": 838} {"train_loss": -21.034788131713867, "global_step": 69570, "epoch": 838} {"train_loss": -20.791942596435547, "global_step": 69571, "epoch": 838} {"train_loss": -20.911211013793945, "global_step": 69572, "epoch": 838} {"train_loss": -20.60031509399414, "global_step": 69573, "epoch": 838} {"train_loss": -20.567079544067383, "global_step": 69574, "epoch": 838} {"train_loss": -20.818063735961914, "global_step": 69575, "epoch": 838} {"train_loss": -20.62727165222168, "global_step": 69576, "epoch": 838} {"train_loss": -21.157583236694336, "global_step": 69577, "epoch": 838} {"train_loss": -21.115570068359375, "global_step": 69578, "epoch": 838} {"train_loss": -20.944902420043945, "global_step": 69579, "epoch": 838} {"train_loss": -20.853382110595703, "global_step": 69580, "epoch": 838} {"train_loss": -21.123186111450195, "global_step": 69581, "epoch": 838} {"train_loss": -20.967451095581055, "global_step": 69582, "epoch": 838} {"train_loss": -20.930492401123047, "global_step": 69583, "epoch": 838} {"train_loss": -20.93927574157715, "global_step": 69584, "epoch": 838} {"train_loss": -20.774105072021484, "global_step": 69585, "epoch": 838} {"train_loss": -21.049856185913086, "global_step": 69586, "epoch": 838} {"train_loss": -21.03791618347168, "global_step": 69587, "epoch": 838} {"train_loss": -20.752527236938477, "global_step": 69588, "epoch": 838} {"train_loss": -21.205936431884766, "global_step": 69589, "epoch": 838} {"train_loss": -20.945768356323242, "global_step": 69590, "epoch": 838} {"train_loss": -20.942203521728516, "global_step": 69591, "epoch": 838} {"train_loss": -20.906436920166016, "global_step": 69592, "epoch": 838} {"train_loss": -20.610082626342773, "global_step": 69593, "epoch": 838} {"train_loss": -20.932422637939453, "global_step": 69594, "epoch": 838} {"train_loss": -20.805482864379883, "global_step": 69595, "epoch": 838} {"train_loss": -20.758440017700195, "global_step": 69596, "epoch": 838} {"train_loss": -21.035747528076172, "global_step": 69597, "epoch": 838} {"train_loss": -20.532032012939453, "global_step": 69598, "epoch": 838} {"train_loss": -20.96607780456543, "global_step": 69599, "epoch": 838} {"train_loss": -20.70394515991211, "global_step": 69600, "epoch": 838} {"train_loss": -20.824331283569336, "global_step": 69601, "epoch": 838} {"train_loss": -20.639677047729492, "global_step": 69602, "epoch": 838} {"train_loss": -20.76055335998535, "global_step": 69603, "epoch": 838} {"train_loss": -20.595584869384766, "global_step": 69604, "epoch": 838} {"train_loss": -20.859052658081055, "global_step": 69605, "epoch": 838} {"train_loss": -20.513288497924805, "global_step": 69606, "epoch": 838} {"train_loss": -20.57174301147461, "global_step": 69607, "epoch": 838} {"train_loss": -20.908588409423828, "global_step": 69608, "epoch": 838} {"train_loss": -20.73090934753418, "global_step": 69609, "epoch": 838} {"train_loss": -20.734050750732422, "global_step": 69610, "epoch": 838} {"train_loss": -20.628192901611328, "global_step": 69611, "epoch": 838} {"train_loss": -20.555557250976562, "global_step": 69612, "epoch": 838} {"train_loss": -20.70790672302246, "global_step": 69613, "epoch": 838} {"train_loss": -21.05055809020996, "global_step": 69614, "epoch": 838} {"train_loss": -20.78708267211914, "global_step": 69615, "epoch": 838} {"train_loss": -21.12690544128418, "global_step": 69616, "epoch": 838} {"train_loss": -20.922977447509766, "global_step": 69617, "epoch": 838} {"train_loss": -20.39393424987793, "global_step": 69618, "epoch": 838} {"train_loss": -20.88351821899414, "global_step": 69619, "epoch": 838} {"train_loss": -20.4704647064209, "global_step": 69620, "epoch": 838} {"train_loss": -20.741453170776367, "global_step": 69621, "epoch": 838} {"train_loss": -20.822965621948242, "global_step": 69622, "epoch": 838} {"train_loss": -21.024986267089844, "global_step": 69623, "epoch": 838} {"train_loss": -21.004104614257812, "global_step": 69624, "epoch": 838} {"train_loss": -20.563642501831055, "global_step": 69625, "epoch": 838} {"train_loss": -20.538148880004883, "global_step": 69626, "epoch": 838} {"train_loss": -20.853271484375, "global_step": 69627, "epoch": 838} {"train_loss": -21.011672973632812, "global_step": 69628, "epoch": 838} {"train_loss": -20.862045288085938, "global_step": 69629, "epoch": 838} {"train_loss": -20.702417373657227, "global_step": 69630, "epoch": 838} {"train_loss": -20.60245704650879, "global_step": 69631, "epoch": 838} {"train_loss": -20.48716163635254, "global_step": 69632, "epoch": 838} {"train_loss": -20.727357864379883, "global_step": 69633, "epoch": 838} {"train_loss": -20.961698532104492, "global_step": 69634, "epoch": 838} {"train_loss": -20.591222763061523, "global_step": 69635, "epoch": 838} {"train_loss": -20.78425437283803, "global_step": 69636, "epoch": 838, "val_loss": 5939971.0} {"train_loss": -20.191558837890625, "global_step": 69637, "epoch": 839} {"train_loss": -20.482498168945312, "global_step": 69638, "epoch": 839} {"train_loss": -20.962242126464844, "global_step": 69639, "epoch": 839} {"train_loss": -20.285892486572266, "global_step": 69640, "epoch": 839} {"train_loss": -20.776155471801758, "global_step": 69641, "epoch": 839} {"train_loss": -20.580265045166016, "global_step": 69642, "epoch": 839} {"train_loss": -20.603708267211914, "global_step": 69643, "epoch": 839} {"train_loss": -21.11226463317871, "global_step": 69644, "epoch": 839} {"train_loss": -20.62141227722168, "global_step": 69645, "epoch": 839} {"train_loss": -20.51462173461914, "global_step": 69646, "epoch": 839} {"train_loss": -20.76508903503418, "global_step": 69647, "epoch": 839} {"train_loss": -20.63616180419922, "global_step": 69648, "epoch": 839} {"train_loss": -20.993146896362305, "global_step": 69649, "epoch": 839} {"train_loss": -20.818387985229492, "global_step": 69650, "epoch": 839} {"train_loss": -20.52651023864746, "global_step": 69651, "epoch": 839} {"train_loss": -20.783641815185547, "global_step": 69652, "epoch": 839} {"train_loss": -20.211488723754883, "global_step": 69653, "epoch": 839} {"train_loss": -20.611379623413086, "global_step": 69654, "epoch": 839} {"train_loss": -21.016130447387695, "global_step": 69655, "epoch": 839} {"train_loss": -20.896221160888672, "global_step": 69656, "epoch": 839} {"train_loss": -20.790098190307617, "global_step": 69657, "epoch": 839} {"train_loss": -20.5993595123291, "global_step": 69658, "epoch": 839} {"train_loss": -20.758981704711914, "global_step": 69659, "epoch": 839} {"train_loss": -21.121978759765625, "global_step": 69660, "epoch": 839} {"train_loss": -20.73809242248535, "global_step": 69661, "epoch": 839} {"train_loss": -20.870885848999023, "global_step": 69662, "epoch": 839} {"train_loss": -20.86066246032715, "global_step": 69663, "epoch": 839} {"train_loss": -20.96196937561035, "global_step": 69664, "epoch": 839} {"train_loss": -21.204607009887695, "global_step": 69665, "epoch": 839} {"train_loss": -20.864904403686523, "global_step": 69666, "epoch": 839} {"train_loss": -21.116926193237305, "global_step": 69667, "epoch": 839} {"train_loss": -21.23896598815918, "global_step": 69668, "epoch": 839} {"train_loss": -20.944360733032227, "global_step": 69669, "epoch": 839} {"train_loss": -20.930532455444336, "global_step": 69670, "epoch": 839} {"train_loss": -21.047788619995117, "global_step": 69671, "epoch": 839} {"train_loss": -20.723983764648438, "global_step": 69672, "epoch": 839} {"train_loss": -20.87647819519043, "global_step": 69673, "epoch": 839} {"train_loss": -20.908672332763672, "global_step": 69674, "epoch": 839} {"train_loss": -21.034788131713867, "global_step": 69675, "epoch": 839} {"train_loss": -20.985626220703125, "global_step": 69676, "epoch": 839} {"train_loss": -20.683637619018555, "global_step": 69677, "epoch": 839} {"train_loss": -20.99361228942871, "global_step": 69678, "epoch": 839} {"train_loss": -20.92932891845703, "global_step": 69679, "epoch": 839} {"train_loss": -20.931133270263672, "global_step": 69680, "epoch": 839} {"train_loss": -20.92456817626953, "global_step": 69681, "epoch": 839} {"train_loss": -21.14054298400879, "global_step": 69682, "epoch": 839} {"train_loss": -20.897903442382812, "global_step": 69683, "epoch": 839} {"train_loss": -20.7930908203125, "global_step": 69684, "epoch": 839} {"train_loss": -20.382604598999023, "global_step": 69685, "epoch": 839} {"train_loss": -21.096603393554688, "global_step": 69686, "epoch": 839} {"train_loss": -20.801435470581055, "global_step": 69687, "epoch": 839} {"train_loss": -20.54897117614746, "global_step": 69688, "epoch": 839} {"train_loss": -20.902250289916992, "global_step": 69689, "epoch": 839} {"train_loss": -20.549182891845703, "global_step": 69690, "epoch": 839} {"train_loss": -20.324222564697266, "global_step": 69691, "epoch": 839} {"train_loss": -20.25748634338379, "global_step": 69692, "epoch": 839} {"train_loss": -21.003156661987305, "global_step": 69693, "epoch": 839} {"train_loss": -20.662532806396484, "global_step": 69694, "epoch": 839} {"train_loss": -20.669723510742188, "global_step": 69695, "epoch": 839} {"train_loss": -20.856252670288086, "global_step": 69696, "epoch": 839} {"train_loss": -20.816192626953125, "global_step": 69697, "epoch": 839} {"train_loss": -20.96539878845215, "global_step": 69698, "epoch": 839} {"train_loss": -21.040525436401367, "global_step": 69699, "epoch": 839} {"train_loss": -20.361806869506836, "global_step": 69700, "epoch": 839} {"train_loss": -20.787290573120117, "global_step": 69701, "epoch": 839} {"train_loss": -20.633493423461914, "global_step": 69702, "epoch": 839} {"train_loss": -20.743703842163086, "global_step": 69703, "epoch": 839} {"train_loss": -20.860990524291992, "global_step": 69704, "epoch": 839} {"train_loss": -20.886783599853516, "global_step": 69705, "epoch": 839} {"train_loss": -20.675260543823242, "global_step": 69706, "epoch": 839} {"train_loss": -20.901105880737305, "global_step": 69707, "epoch": 839} {"train_loss": -20.938854217529297, "global_step": 69708, "epoch": 839} {"train_loss": -20.756256103515625, "global_step": 69709, "epoch": 839} {"train_loss": -20.796281814575195, "global_step": 69710, "epoch": 839} {"train_loss": -21.062936782836914, "global_step": 69711, "epoch": 839} {"train_loss": -21.2691650390625, "global_step": 69712, "epoch": 839} {"train_loss": -20.280210494995117, "global_step": 69713, "epoch": 839} {"train_loss": -21.27358055114746, "global_step": 69714, "epoch": 839} {"train_loss": -20.93027114868164, "global_step": 69715, "epoch": 839} {"train_loss": -20.684179306030273, "global_step": 69716, "epoch": 839} {"train_loss": -21.091882705688477, "global_step": 69717, "epoch": 839} {"train_loss": -20.889745712280273, "global_step": 69718, "epoch": 839} {"train_loss": -20.81801242138966, "global_step": 69719, "epoch": 839, "val_loss": 5895864.5} {"train_loss": -20.71465301513672, "global_step": 69720, "epoch": 840} {"train_loss": -20.878278732299805, "global_step": 69721, "epoch": 840} {"train_loss": -20.506372451782227, "global_step": 69722, "epoch": 840} {"train_loss": -20.660818099975586, "global_step": 69723, "epoch": 840} {"train_loss": -20.56753158569336, "global_step": 69724, "epoch": 840} {"train_loss": -20.267087936401367, "global_step": 69725, "epoch": 840} {"train_loss": -20.656064987182617, "global_step": 69726, "epoch": 840} {"train_loss": -20.831960678100586, "global_step": 69727, "epoch": 840} {"train_loss": -20.749942779541016, "global_step": 69728, "epoch": 840} {"train_loss": -20.823286056518555, "global_step": 69729, "epoch": 840} {"train_loss": -20.757688522338867, "global_step": 69730, "epoch": 840} {"train_loss": -20.902606964111328, "global_step": 69731, "epoch": 840} {"train_loss": -20.454675674438477, "global_step": 69732, "epoch": 840} {"train_loss": -20.806055068969727, "global_step": 69733, "epoch": 840} {"train_loss": -20.377714157104492, "global_step": 69734, "epoch": 840} {"train_loss": -20.40207290649414, "global_step": 69735, "epoch": 840} {"train_loss": -20.751554489135742, "global_step": 69736, "epoch": 840} {"train_loss": -21.153182983398438, "global_step": 69737, "epoch": 840} {"train_loss": -20.82962417602539, "global_step": 69738, "epoch": 840} {"train_loss": -21.217559814453125, "global_step": 69739, "epoch": 840} {"train_loss": -20.501829147338867, "global_step": 69740, "epoch": 840} {"train_loss": -20.89393424987793, "global_step": 69741, "epoch": 840} {"train_loss": -20.650609970092773, "global_step": 69742, "epoch": 840} {"train_loss": -20.80801010131836, "global_step": 69743, "epoch": 840} {"train_loss": -20.721982955932617, "global_step": 69744, "epoch": 840} {"train_loss": -21.19647979736328, "global_step": 69745, "epoch": 840} {"train_loss": -20.645933151245117, "global_step": 69746, "epoch": 840} {"train_loss": -20.839372634887695, "global_step": 69747, "epoch": 840} {"train_loss": -20.99726676940918, "global_step": 69748, "epoch": 840} {"train_loss": -20.92466926574707, "global_step": 69749, "epoch": 840} {"train_loss": -21.170364379882812, "global_step": 69750, "epoch": 840} {"train_loss": -20.80953025817871, "global_step": 69751, "epoch": 840} {"train_loss": -20.85831642150879, "global_step": 69752, "epoch": 840} {"train_loss": -20.49701690673828, "global_step": 69753, "epoch": 840} {"train_loss": -20.89840316772461, "global_step": 69754, "epoch": 840} {"train_loss": -21.065587997436523, "global_step": 69755, "epoch": 840} {"train_loss": -20.771894454956055, "global_step": 69756, "epoch": 840} {"train_loss": -21.036365509033203, "global_step": 69757, "epoch": 840} {"train_loss": -20.71028709411621, "global_step": 69758, "epoch": 840} {"train_loss": -20.681949615478516, "global_step": 69759, "epoch": 840} {"train_loss": -21.32227325439453, "global_step": 69760, "epoch": 840} {"train_loss": -20.81399154663086, "global_step": 69761, "epoch": 840} {"train_loss": -20.890243530273438, "global_step": 69762, "epoch": 840} {"train_loss": -20.75507926940918, "global_step": 69763, "epoch": 840} {"train_loss": -20.677387237548828, "global_step": 69764, "epoch": 840} {"train_loss": -21.017276763916016, "global_step": 69765, "epoch": 840} {"train_loss": -20.87704849243164, "global_step": 69766, "epoch": 840} {"train_loss": -20.44867515563965, "global_step": 69767, "epoch": 840} {"train_loss": -20.791563034057617, "global_step": 69768, "epoch": 840} {"train_loss": -20.861295700073242, "global_step": 69769, "epoch": 840} {"train_loss": -20.887062072753906, "global_step": 69770, "epoch": 840} {"train_loss": -20.79279327392578, "global_step": 69771, "epoch": 840} {"train_loss": -20.81011390686035, "global_step": 69772, "epoch": 840} {"train_loss": -20.87813377380371, "global_step": 69773, "epoch": 840} {"train_loss": -20.73157501220703, "global_step": 69774, "epoch": 840} {"train_loss": -20.702768325805664, "global_step": 69775, "epoch": 840} {"train_loss": -20.64773941040039, "global_step": 69776, "epoch": 840} {"train_loss": -20.92449951171875, "global_step": 69777, "epoch": 840} {"train_loss": -20.7766170501709, "global_step": 69778, "epoch": 840} {"train_loss": -20.746488571166992, "global_step": 69779, "epoch": 840} {"train_loss": -20.88789176940918, "global_step": 69780, "epoch": 840} {"train_loss": -21.066770553588867, "global_step": 69781, "epoch": 840} {"train_loss": -21.080286026000977, "global_step": 69782, "epoch": 840} {"train_loss": -20.78384780883789, "global_step": 69783, "epoch": 840} {"train_loss": -20.770549774169922, "global_step": 69784, "epoch": 840} {"train_loss": -21.140073776245117, "global_step": 69785, "epoch": 840} {"train_loss": -20.5787353515625, "global_step": 69786, "epoch": 840} {"train_loss": -20.951749801635742, "global_step": 69787, "epoch": 840} {"train_loss": -21.036319732666016, "global_step": 69788, "epoch": 840} {"train_loss": -21.17299461364746, "global_step": 69789, "epoch": 840} {"train_loss": -20.748043060302734, "global_step": 69790, "epoch": 840} {"train_loss": -21.114349365234375, "global_step": 69791, "epoch": 840} {"train_loss": -20.86870574951172, "global_step": 69792, "epoch": 840} {"train_loss": -20.9399356842041, "global_step": 69793, "epoch": 840} {"train_loss": -20.747446060180664, "global_step": 69794, "epoch": 840} {"train_loss": -20.673465728759766, "global_step": 69795, "epoch": 840} {"train_loss": -20.99188804626465, "global_step": 69796, "epoch": 840} {"train_loss": -20.69345474243164, "global_step": 69797, "epoch": 840} {"train_loss": -20.76981544494629, "global_step": 69798, "epoch": 840} {"train_loss": -21.0155086517334, "global_step": 69799, "epoch": 840} {"train_loss": -21.100557327270508, "global_step": 69800, "epoch": 840} {"train_loss": -20.911848068237305, "global_step": 69801, "epoch": 840} {"train_loss": -20.82017650374447, "global_step": 69802, "epoch": 840, "val_loss": 6035867.5} {"train_loss": -20.326196670532227, "global_step": 69803, "epoch": 841} {"train_loss": -20.43337631225586, "global_step": 69804, "epoch": 841} {"train_loss": -20.694568634033203, "global_step": 69805, "epoch": 841} {"train_loss": -20.252334594726562, "global_step": 69806, "epoch": 841} {"train_loss": -20.662389755249023, "global_step": 69807, "epoch": 841} {"train_loss": -20.39812660217285, "global_step": 69808, "epoch": 841} {"train_loss": -20.67195701599121, "global_step": 69809, "epoch": 841} {"train_loss": -20.609548568725586, "global_step": 69810, "epoch": 841} {"train_loss": -20.28980827331543, "global_step": 69811, "epoch": 841} {"train_loss": -20.672420501708984, "global_step": 69812, "epoch": 841} {"train_loss": -20.743061065673828, "global_step": 69813, "epoch": 841} {"train_loss": -21.047372817993164, "global_step": 69814, "epoch": 841} {"train_loss": -20.868412017822266, "global_step": 69815, "epoch": 841} {"train_loss": -20.759990692138672, "global_step": 69816, "epoch": 841} {"train_loss": -20.641141891479492, "global_step": 69817, "epoch": 841} {"train_loss": -20.698074340820312, "global_step": 69818, "epoch": 841} {"train_loss": -20.57181739807129, "global_step": 69819, "epoch": 841} {"train_loss": -20.845434188842773, "global_step": 69820, "epoch": 841} {"train_loss": -20.823522567749023, "global_step": 69821, "epoch": 841} {"train_loss": -20.743637084960938, "global_step": 69822, "epoch": 841} {"train_loss": -21.039392471313477, "global_step": 69823, "epoch": 841} {"train_loss": -20.589574813842773, "global_step": 69824, "epoch": 841} {"train_loss": -20.867292404174805, "global_step": 69825, "epoch": 841} {"train_loss": -20.654544830322266, "global_step": 69826, "epoch": 841} {"train_loss": -21.021406173706055, "global_step": 69827, "epoch": 841} {"train_loss": -20.511083602905273, "global_step": 69828, "epoch": 841} {"train_loss": -20.666799545288086, "global_step": 69829, "epoch": 841} {"train_loss": -20.571882247924805, "global_step": 69830, "epoch": 841} {"train_loss": -20.529739379882812, "global_step": 69831, "epoch": 841} {"train_loss": -20.817720413208008, "global_step": 69832, "epoch": 841} {"train_loss": -20.846511840820312, "global_step": 69833, "epoch": 841} {"train_loss": -20.725080490112305, "global_step": 69834, "epoch": 841} {"train_loss": -20.961219787597656, "global_step": 69835, "epoch": 841} {"train_loss": -20.983617782592773, "global_step": 69836, "epoch": 841} {"train_loss": -21.06155776977539, "global_step": 69837, "epoch": 841} {"train_loss": -20.998594284057617, "global_step": 69838, "epoch": 841} {"train_loss": -21.28716468811035, "global_step": 69839, "epoch": 841} {"train_loss": -21.069793701171875, "global_step": 69840, "epoch": 841} {"train_loss": -20.7760009765625, "global_step": 69841, "epoch": 841} {"train_loss": -21.1396484375, "global_step": 69842, "epoch": 841} {"train_loss": -20.642913818359375, "global_step": 69843, "epoch": 841} {"train_loss": -20.7465763092041, "global_step": 69844, "epoch": 841} {"train_loss": -20.97089958190918, "global_step": 69845, "epoch": 841} {"train_loss": -21.24993324279785, "global_step": 69846, "epoch": 841} {"train_loss": -20.51378631591797, "global_step": 69847, "epoch": 841} {"train_loss": -20.92146873474121, "global_step": 69848, "epoch": 841} {"train_loss": -21.20221519470215, "global_step": 69849, "epoch": 841} {"train_loss": -20.40766716003418, "global_step": 69850, "epoch": 841} {"train_loss": -20.75503921508789, "global_step": 69851, "epoch": 841} {"train_loss": -20.501184463500977, "global_step": 69852, "epoch": 841} {"train_loss": -21.268386840820312, "global_step": 69853, "epoch": 841} {"train_loss": -20.531784057617188, "global_step": 69854, "epoch": 841} {"train_loss": -20.96790885925293, "global_step": 69855, "epoch": 841} {"train_loss": -21.024250030517578, "global_step": 69856, "epoch": 841} {"train_loss": -20.471330642700195, "global_step": 69857, "epoch": 841} {"train_loss": -21.149700164794922, "global_step": 69858, "epoch": 841} {"train_loss": -21.154199600219727, "global_step": 69859, "epoch": 841} {"train_loss": -20.754531860351562, "global_step": 69860, "epoch": 841} {"train_loss": -20.654956817626953, "global_step": 69861, "epoch": 841} {"train_loss": -20.360536575317383, "global_step": 69862, "epoch": 841} {"train_loss": -20.78565788269043, "global_step": 69863, "epoch": 841} {"train_loss": -20.628889083862305, "global_step": 69864, "epoch": 841} {"train_loss": -20.832992553710938, "global_step": 69865, "epoch": 841} {"train_loss": -20.08247947692871, "global_step": 69866, "epoch": 841} {"train_loss": -21.370983123779297, "global_step": 69867, "epoch": 841} {"train_loss": -21.082626342773438, "global_step": 69868, "epoch": 841} {"train_loss": -20.437236785888672, "global_step": 69869, "epoch": 841} {"train_loss": -20.785913467407227, "global_step": 69870, "epoch": 841} {"train_loss": -20.953161239624023, "global_step": 69871, "epoch": 841} {"train_loss": -20.557798385620117, "global_step": 69872, "epoch": 841} {"train_loss": -20.740982055664062, "global_step": 69873, "epoch": 841} {"train_loss": -20.243032455444336, "global_step": 69874, "epoch": 841} {"train_loss": -20.86934471130371, "global_step": 69875, "epoch": 841} {"train_loss": -20.421010971069336, "global_step": 69876, "epoch": 841} {"train_loss": -20.382654190063477, "global_step": 69877, "epoch": 841} {"train_loss": -20.759756088256836, "global_step": 69878, "epoch": 841} {"train_loss": -21.145496368408203, "global_step": 69879, "epoch": 841} {"train_loss": -20.534208297729492, "global_step": 69880, "epoch": 841} {"train_loss": -20.639360427856445, "global_step": 69881, "epoch": 841} {"train_loss": -20.4464054107666, "global_step": 69882, "epoch": 841} {"train_loss": -21.108657836914062, "global_step": 69883, "epoch": 841} {"train_loss": -20.529388427734375, "global_step": 69884, "epoch": 841} {"train_loss": -20.738604786884355, "global_step": 69885, "epoch": 841, "val_loss": 6056596.0} {"train_loss": -20.41342544555664, "global_step": 69886, "epoch": 842} {"train_loss": -20.395761489868164, "global_step": 69887, "epoch": 842} {"train_loss": -21.05373191833496, "global_step": 69888, "epoch": 842} {"train_loss": -20.799121856689453, "global_step": 69889, "epoch": 842} {"train_loss": -20.676687240600586, "global_step": 69890, "epoch": 842} {"train_loss": -20.9213924407959, "global_step": 69891, "epoch": 842} {"train_loss": -20.529895782470703, "global_step": 69892, "epoch": 842} {"train_loss": -20.513671875, "global_step": 69893, "epoch": 842} {"train_loss": -20.781330108642578, "global_step": 69894, "epoch": 842} {"train_loss": -20.819440841674805, "global_step": 69895, "epoch": 842} {"train_loss": -20.656627655029297, "global_step": 69896, "epoch": 842} {"train_loss": -20.67123031616211, "global_step": 69897, "epoch": 842} {"train_loss": -20.69126319885254, "global_step": 69898, "epoch": 842} {"train_loss": -20.815006256103516, "global_step": 69899, "epoch": 842} {"train_loss": -21.425153732299805, "global_step": 69900, "epoch": 842} {"train_loss": -20.738168716430664, "global_step": 69901, "epoch": 842} {"train_loss": -20.745187759399414, "global_step": 69902, "epoch": 842} {"train_loss": -20.338682174682617, "global_step": 69903, "epoch": 842} {"train_loss": -20.63765525817871, "global_step": 69904, "epoch": 842} {"train_loss": -20.36678123474121, "global_step": 69905, "epoch": 842} {"train_loss": -20.827810287475586, "global_step": 69906, "epoch": 842} {"train_loss": -20.747695922851562, "global_step": 69907, "epoch": 842} {"train_loss": -20.993192672729492, "global_step": 69908, "epoch": 842} {"train_loss": -20.984128952026367, "global_step": 69909, "epoch": 842} {"train_loss": -20.288564682006836, "global_step": 69910, "epoch": 842} {"train_loss": -20.756763458251953, "global_step": 69911, "epoch": 842} {"train_loss": -20.955799102783203, "global_step": 69912, "epoch": 842} {"train_loss": -20.951566696166992, "global_step": 69913, "epoch": 842} {"train_loss": -20.604442596435547, "global_step": 69914, "epoch": 842} {"train_loss": -20.656965255737305, "global_step": 69915, "epoch": 842} {"train_loss": -21.401477813720703, "global_step": 69916, "epoch": 842} {"train_loss": -20.695371627807617, "global_step": 69917, "epoch": 842} {"train_loss": -20.80524253845215, "global_step": 69918, "epoch": 842} {"train_loss": -20.882978439331055, "global_step": 69919, "epoch": 842} {"train_loss": -20.927597045898438, "global_step": 69920, "epoch": 842} {"train_loss": -21.03152847290039, "global_step": 69921, "epoch": 842} {"train_loss": -20.773435592651367, "global_step": 69922, "epoch": 842} {"train_loss": -20.929895401000977, "global_step": 69923, "epoch": 842} {"train_loss": -20.727827072143555, "global_step": 69924, "epoch": 842} {"train_loss": -20.852645874023438, "global_step": 69925, "epoch": 842} {"train_loss": -20.67860984802246, "global_step": 69926, "epoch": 842} {"train_loss": -20.340171813964844, "global_step": 69927, "epoch": 842} {"train_loss": -20.90797233581543, "global_step": 69928, "epoch": 842} {"train_loss": -21.200733184814453, "global_step": 69929, "epoch": 842} {"train_loss": -20.981149673461914, "global_step": 69930, "epoch": 842} {"train_loss": -20.94166374206543, "global_step": 69931, "epoch": 842} {"train_loss": -20.987380981445312, "global_step": 69932, "epoch": 842} {"train_loss": -20.938724517822266, "global_step": 69933, "epoch": 842} {"train_loss": -20.659799575805664, "global_step": 69934, "epoch": 842} {"train_loss": -20.63259506225586, "global_step": 69935, "epoch": 842} {"train_loss": -20.506555557250977, "global_step": 69936, "epoch": 842} {"train_loss": -21.084882736206055, "global_step": 69937, "epoch": 842} {"train_loss": -21.151763916015625, "global_step": 69938, "epoch": 842} {"train_loss": -20.93572235107422, "global_step": 69939, "epoch": 842} {"train_loss": -20.70998191833496, "global_step": 69940, "epoch": 842} {"train_loss": -20.97170066833496, "global_step": 69941, "epoch": 842} {"train_loss": -21.029111862182617, "global_step": 69942, "epoch": 842} {"train_loss": -21.04637336730957, "global_step": 69943, "epoch": 842} {"train_loss": -20.773340225219727, "global_step": 69944, "epoch": 842} {"train_loss": -21.122426986694336, "global_step": 69945, "epoch": 842} {"train_loss": -20.925668716430664, "global_step": 69946, "epoch": 842} {"train_loss": -20.81450843811035, "global_step": 69947, "epoch": 842} {"train_loss": -21.06026268005371, "global_step": 69948, "epoch": 842} {"train_loss": -21.049335479736328, "global_step": 69949, "epoch": 842} {"train_loss": -20.77063751220703, "global_step": 69950, "epoch": 842} {"train_loss": -20.911954879760742, "global_step": 69951, "epoch": 842} {"train_loss": -20.819210052490234, "global_step": 69952, "epoch": 842} {"train_loss": -20.74069595336914, "global_step": 69953, "epoch": 842} {"train_loss": -20.767858505249023, "global_step": 69954, "epoch": 842} {"train_loss": -20.812416076660156, "global_step": 69955, "epoch": 842} {"train_loss": -21.024078369140625, "global_step": 69956, "epoch": 842} {"train_loss": -20.879465103149414, "global_step": 69957, "epoch": 842} {"train_loss": -20.683958053588867, "global_step": 69958, "epoch": 842} {"train_loss": -20.677688598632812, "global_step": 69959, "epoch": 842} {"train_loss": -20.819223403930664, "global_step": 69960, "epoch": 842} {"train_loss": -20.68329429626465, "global_step": 69961, "epoch": 842} {"train_loss": -20.843875885009766, "global_step": 69962, "epoch": 842} {"train_loss": -20.957014083862305, "global_step": 69963, "epoch": 842} {"train_loss": -20.582439422607422, "global_step": 69964, "epoch": 842} {"train_loss": -20.666990280151367, "global_step": 69965, "epoch": 842} {"train_loss": -20.512741088867188, "global_step": 69966, "epoch": 842} {"train_loss": -20.462814331054688, "global_step": 69967, "epoch": 842} {"train_loss": -20.811632501073632, "global_step": 69968, "epoch": 842, "val_loss": 6023901.5} {"train_loss": -20.17305564880371, "global_step": 69969, "epoch": 843} {"train_loss": -20.495023727416992, "global_step": 69970, "epoch": 843} {"train_loss": -20.816316604614258, "global_step": 69971, "epoch": 843} {"train_loss": -20.888216018676758, "global_step": 69972, "epoch": 843} {"train_loss": -20.79014778137207, "global_step": 69973, "epoch": 843} {"train_loss": -21.03672218322754, "global_step": 69974, "epoch": 843} {"train_loss": -20.39698600769043, "global_step": 69975, "epoch": 843} {"train_loss": -20.189977645874023, "global_step": 69976, "epoch": 843} {"train_loss": -21.02668571472168, "global_step": 69977, "epoch": 843} {"train_loss": -20.612743377685547, "global_step": 69978, "epoch": 843} {"train_loss": -20.398317337036133, "global_step": 69979, "epoch": 843} {"train_loss": -20.627288818359375, "global_step": 69980, "epoch": 843} {"train_loss": -20.85329246520996, "global_step": 69981, "epoch": 843} {"train_loss": -21.06690788269043, "global_step": 69982, "epoch": 843} {"train_loss": -20.4660701751709, "global_step": 69983, "epoch": 843} {"train_loss": -20.631208419799805, "global_step": 69984, "epoch": 843} {"train_loss": -20.402542114257812, "global_step": 69985, "epoch": 843} {"train_loss": -20.976787567138672, "global_step": 69986, "epoch": 843} {"train_loss": -20.78963279724121, "global_step": 69987, "epoch": 843} {"train_loss": -20.5307674407959, "global_step": 69988, "epoch": 843} {"train_loss": -20.889394760131836, "global_step": 69989, "epoch": 843} {"train_loss": -21.125545501708984, "global_step": 69990, "epoch": 843} {"train_loss": -20.87333869934082, "global_step": 69991, "epoch": 843} {"train_loss": -20.900976181030273, "global_step": 69992, "epoch": 843} {"train_loss": -20.866544723510742, "global_step": 69993, "epoch": 843} {"train_loss": -20.978775024414062, "global_step": 69994, "epoch": 843} {"train_loss": -20.9211483001709, "global_step": 69995, "epoch": 843} {"train_loss": -20.580244064331055, "global_step": 69996, "epoch": 843} {"train_loss": -21.083532333374023, "global_step": 69997, "epoch": 843} {"train_loss": -20.676956176757812, "global_step": 69998, "epoch": 843} {"train_loss": -20.65859031677246, "global_step": 69999, "epoch": 843} {"train_loss": -20.5560359954834, "global_step": 70000, "epoch": 843} {"train_loss": -21.220346450805664, "global_step": 70001, "epoch": 843} {"train_loss": -20.802703857421875, "global_step": 70002, "epoch": 843} {"train_loss": -20.865005493164062, "global_step": 70003, "epoch": 843} {"train_loss": -21.02494239807129, "global_step": 70004, "epoch": 843} {"train_loss": -20.999807357788086, "global_step": 70005, "epoch": 843} {"train_loss": -20.898059844970703, "global_step": 70006, "epoch": 843} {"train_loss": -21.02103042602539, "global_step": 70007, "epoch": 843} {"train_loss": -21.053401947021484, "global_step": 70008, "epoch": 843} {"train_loss": -20.594717025756836, "global_step": 70009, "epoch": 843} {"train_loss": -21.030216217041016, "global_step": 70010, "epoch": 843} {"train_loss": -20.87356948852539, "global_step": 70011, "epoch": 843} {"train_loss": -20.568435668945312, "global_step": 70012, "epoch": 843} {"train_loss": -20.828338623046875, "global_step": 70013, "epoch": 843} {"train_loss": -21.160058975219727, "global_step": 70014, "epoch": 843} {"train_loss": -20.92034912109375, "global_step": 70015, "epoch": 843} {"train_loss": -21.006244659423828, "global_step": 70016, "epoch": 843} {"train_loss": -20.697101593017578, "global_step": 70017, "epoch": 843} {"train_loss": -20.781532287597656, "global_step": 70018, "epoch": 843} {"train_loss": -20.880348205566406, "global_step": 70019, "epoch": 843} {"train_loss": -21.10769271850586, "global_step": 70020, "epoch": 843} {"train_loss": -20.574077606201172, "global_step": 70021, "epoch": 843} {"train_loss": -21.403156280517578, "global_step": 70022, "epoch": 843} {"train_loss": -20.312246322631836, "global_step": 70023, "epoch": 843} {"train_loss": -21.05606460571289, "global_step": 70024, "epoch": 843} {"train_loss": -20.871845245361328, "global_step": 70025, "epoch": 843} {"train_loss": -20.99835777282715, "global_step": 70026, "epoch": 843} {"train_loss": -20.953603744506836, "global_step": 70027, "epoch": 843} {"train_loss": -21.20039176940918, "global_step": 70028, "epoch": 843} {"train_loss": -20.959957122802734, "global_step": 70029, "epoch": 843} {"train_loss": -20.914703369140625, "global_step": 70030, "epoch": 843} {"train_loss": -20.896825790405273, "global_step": 70031, "epoch": 843} {"train_loss": -20.78223991394043, "global_step": 70032, "epoch": 843} {"train_loss": -21.17681884765625, "global_step": 70033, "epoch": 843} {"train_loss": -20.959348678588867, "global_step": 70034, "epoch": 843} {"train_loss": -20.896169662475586, "global_step": 70035, "epoch": 843} {"train_loss": -20.64313316345215, "global_step": 70036, "epoch": 843} {"train_loss": -20.969343185424805, "global_step": 70037, "epoch": 843} {"train_loss": -20.730527877807617, "global_step": 70038, "epoch": 843} {"train_loss": -20.81041145324707, "global_step": 70039, "epoch": 843} {"train_loss": -20.980934143066406, "global_step": 70040, "epoch": 843} {"train_loss": -20.746150970458984, "global_step": 70041, "epoch": 843} {"train_loss": -20.349079132080078, "global_step": 70042, "epoch": 843} {"train_loss": -20.952322006225586, "global_step": 70043, "epoch": 843} {"train_loss": -20.716306686401367, "global_step": 70044, "epoch": 843} {"train_loss": -20.62531852722168, "global_step": 70045, "epoch": 843} {"train_loss": -20.5272216796875, "global_step": 70046, "epoch": 843} {"train_loss": -20.654165267944336, "global_step": 70047, "epoch": 843} {"train_loss": -20.722824096679688, "global_step": 70048, "epoch": 843} {"train_loss": -20.276670455932617, "global_step": 70049, "epoch": 843} {"train_loss": -20.351757049560547, "global_step": 70050, "epoch": 843} {"train_loss": -20.798312244645086, "global_step": 70051, "epoch": 843, "val_loss": 6128177.0} {"train_loss": -20.5675106048584, "global_step": 70052, "epoch": 844} {"train_loss": -20.398366928100586, "global_step": 70053, "epoch": 844} {"train_loss": -20.863428115844727, "global_step": 70054, "epoch": 844} {"train_loss": -20.545425415039062, "global_step": 70055, "epoch": 844} {"train_loss": -20.58218002319336, "global_step": 70056, "epoch": 844} {"train_loss": -20.785058975219727, "global_step": 70057, "epoch": 844} {"train_loss": -20.806472778320312, "global_step": 70058, "epoch": 844} {"train_loss": -20.80426025390625, "global_step": 70059, "epoch": 844} {"train_loss": -20.36042594909668, "global_step": 70060, "epoch": 844} {"train_loss": -20.24728012084961, "global_step": 70061, "epoch": 844} {"train_loss": -20.655258178710938, "global_step": 70062, "epoch": 844} {"train_loss": -20.85352897644043, "global_step": 70063, "epoch": 844} {"train_loss": -20.79585075378418, "global_step": 70064, "epoch": 844} {"train_loss": -20.713224411010742, "global_step": 70065, "epoch": 844} {"train_loss": -20.11138153076172, "global_step": 70066, "epoch": 844} {"train_loss": -21.30478858947754, "global_step": 70067, "epoch": 844} {"train_loss": -20.88568878173828, "global_step": 70068, "epoch": 844} {"train_loss": -20.874290466308594, "global_step": 70069, "epoch": 844} {"train_loss": -21.274301528930664, "global_step": 70070, "epoch": 844} {"train_loss": -21.15821647644043, "global_step": 70071, "epoch": 844} {"train_loss": -21.088037490844727, "global_step": 70072, "epoch": 844} {"train_loss": -21.131269454956055, "global_step": 70073, "epoch": 844} {"train_loss": -20.879484176635742, "global_step": 70074, "epoch": 844} {"train_loss": -20.891300201416016, "global_step": 70075, "epoch": 844} {"train_loss": -20.536806106567383, "global_step": 70076, "epoch": 844} {"train_loss": -20.79559326171875, "global_step": 70077, "epoch": 844} {"train_loss": -20.382768630981445, "global_step": 70078, "epoch": 844} {"train_loss": -20.73947525024414, "global_step": 70079, "epoch": 844} {"train_loss": -21.21516227722168, "global_step": 70080, "epoch": 844} {"train_loss": -20.512409210205078, "global_step": 70081, "epoch": 844} {"train_loss": -20.70149803161621, "global_step": 70082, "epoch": 844} {"train_loss": -20.81110954284668, "global_step": 70083, "epoch": 844} {"train_loss": -20.656755447387695, "global_step": 70084, "epoch": 844} {"train_loss": -20.762622833251953, "global_step": 70085, "epoch": 844} {"train_loss": -20.784582138061523, "global_step": 70086, "epoch": 844} {"train_loss": -20.558856964111328, "global_step": 70087, "epoch": 844} {"train_loss": -20.619138717651367, "global_step": 70088, "epoch": 844} {"train_loss": -20.59372901916504, "global_step": 70089, "epoch": 844} {"train_loss": -20.84103775024414, "global_step": 70090, "epoch": 844} {"train_loss": -20.62688636779785, "global_step": 70091, "epoch": 844} {"train_loss": -20.40631866455078, "global_step": 70092, "epoch": 844} {"train_loss": -20.718257904052734, "global_step": 70093, "epoch": 844} {"train_loss": -20.51359748840332, "global_step": 70094, "epoch": 844} {"train_loss": -20.676218032836914, "global_step": 70095, "epoch": 844} {"train_loss": -20.563199996948242, "global_step": 70096, "epoch": 844} {"train_loss": -20.983230590820312, "global_step": 70097, "epoch": 844} {"train_loss": -20.70397186279297, "global_step": 70098, "epoch": 844} {"train_loss": -20.753637313842773, "global_step": 70099, "epoch": 844} {"train_loss": -21.024507522583008, "global_step": 70100, "epoch": 844} {"train_loss": -20.9737491607666, "global_step": 70101, "epoch": 844} {"train_loss": -21.00627899169922, "global_step": 70102, "epoch": 844} {"train_loss": -21.143646240234375, "global_step": 70103, "epoch": 844} {"train_loss": -20.80695343017578, "global_step": 70104, "epoch": 844} {"train_loss": -20.7768611907959, "global_step": 70105, "epoch": 844} {"train_loss": -20.942537307739258, "global_step": 70106, "epoch": 844} {"train_loss": -21.142120361328125, "global_step": 70107, "epoch": 844} {"train_loss": -20.824535369873047, "global_step": 70108, "epoch": 844} {"train_loss": -21.068349838256836, "global_step": 70109, "epoch": 844} {"train_loss": -20.383934020996094, "global_step": 70110, "epoch": 844} {"train_loss": -21.04192352294922, "global_step": 70111, "epoch": 844} {"train_loss": -21.10853385925293, "global_step": 70112, "epoch": 844} {"train_loss": -20.8678035736084, "global_step": 70113, "epoch": 844} {"train_loss": -20.70960807800293, "global_step": 70114, "epoch": 844} {"train_loss": -20.759199142456055, "global_step": 70115, "epoch": 844} {"train_loss": -21.113391876220703, "global_step": 70116, "epoch": 844} {"train_loss": -21.054672241210938, "global_step": 70117, "epoch": 844} {"train_loss": -20.635787963867188, "global_step": 70118, "epoch": 844} {"train_loss": -21.125839233398438, "global_step": 70119, "epoch": 844} {"train_loss": -21.094392776489258, "global_step": 70120, "epoch": 844} {"train_loss": -20.968276977539062, "global_step": 70121, "epoch": 844} {"train_loss": -20.958724975585938, "global_step": 70122, "epoch": 844} {"train_loss": -20.9449520111084, "global_step": 70123, "epoch": 844} {"train_loss": -20.83344078063965, "global_step": 70124, "epoch": 844} {"train_loss": -20.376821517944336, "global_step": 70125, "epoch": 844} {"train_loss": -20.73079490661621, "global_step": 70126, "epoch": 844} {"train_loss": -20.542959213256836, "global_step": 70127, "epoch": 844} {"train_loss": -21.120223999023438, "global_step": 70128, "epoch": 844} {"train_loss": -20.794418334960938, "global_step": 70129, "epoch": 844} {"train_loss": -21.05109214782715, "global_step": 70130, "epoch": 844} {"train_loss": -20.552175521850586, "global_step": 70131, "epoch": 844} {"train_loss": -20.767961502075195, "global_step": 70132, "epoch": 844} {"train_loss": -20.88832664489746, "global_step": 70133, "epoch": 844} {"train_loss": -20.789734323340728, "global_step": 70134, "epoch": 844, "val_loss": 6064901.0} {"train_loss": -20.74810218811035, "global_step": 70135, "epoch": 845} {"train_loss": -20.842376708984375, "global_step": 70136, "epoch": 845} {"train_loss": -20.6331844329834, "global_step": 70137, "epoch": 845} {"train_loss": -20.34351921081543, "global_step": 70138, "epoch": 845} {"train_loss": -20.661996841430664, "global_step": 70139, "epoch": 845} {"train_loss": -20.659639358520508, "global_step": 70140, "epoch": 845} {"train_loss": -20.400686264038086, "global_step": 70141, "epoch": 845} {"train_loss": -20.584184646606445, "global_step": 70142, "epoch": 845} {"train_loss": -20.699325561523438, "global_step": 70143, "epoch": 845} {"train_loss": -20.47020721435547, "global_step": 70144, "epoch": 845} {"train_loss": -20.324087142944336, "global_step": 70145, "epoch": 845} {"train_loss": -20.778234481811523, "global_step": 70146, "epoch": 845} {"train_loss": -20.644123077392578, "global_step": 70147, "epoch": 845} {"train_loss": -20.67743492126465, "global_step": 70148, "epoch": 845} {"train_loss": -21.263898849487305, "global_step": 70149, "epoch": 845} {"train_loss": -20.818880081176758, "global_step": 70150, "epoch": 845} {"train_loss": -20.570148468017578, "global_step": 70151, "epoch": 845} {"train_loss": -21.0334415435791, "global_step": 70152, "epoch": 845} {"train_loss": -20.836393356323242, "global_step": 70153, "epoch": 845} {"train_loss": -20.903860092163086, "global_step": 70154, "epoch": 845} {"train_loss": -20.926897048950195, "global_step": 70155, "epoch": 845} {"train_loss": -20.8765811920166, "global_step": 70156, "epoch": 845} {"train_loss": -21.16695785522461, "global_step": 70157, "epoch": 845} {"train_loss": -21.050825119018555, "global_step": 70158, "epoch": 845} {"train_loss": -21.115970611572266, "global_step": 70159, "epoch": 845} {"train_loss": -21.05952262878418, "global_step": 70160, "epoch": 845} {"train_loss": -21.0668888092041, "global_step": 70161, "epoch": 845} {"train_loss": -21.19154930114746, "global_step": 70162, "epoch": 845} {"train_loss": -21.258703231811523, "global_step": 70163, "epoch": 845} {"train_loss": -21.459901809692383, "global_step": 70164, "epoch": 845} {"train_loss": -20.891462326049805, "global_step": 70165, "epoch": 845} {"train_loss": -21.017492294311523, "global_step": 70166, "epoch": 845} {"train_loss": -20.800451278686523, "global_step": 70167, "epoch": 845} {"train_loss": -21.292348861694336, "global_step": 70168, "epoch": 845} {"train_loss": -20.793603897094727, "global_step": 70169, "epoch": 845} {"train_loss": -20.895923614501953, "global_step": 70170, "epoch": 845} {"train_loss": -20.940542221069336, "global_step": 70171, "epoch": 845} {"train_loss": -21.00883674621582, "global_step": 70172, "epoch": 845} {"train_loss": -20.492399215698242, "global_step": 70173, "epoch": 845} {"train_loss": -21.006559371948242, "global_step": 70174, "epoch": 845} {"train_loss": -20.688217163085938, "global_step": 70175, "epoch": 845} {"train_loss": -20.872478485107422, "global_step": 70176, "epoch": 845} {"train_loss": -20.758766174316406, "global_step": 70177, "epoch": 845} {"train_loss": -20.97797203063965, "global_step": 70178, "epoch": 845} {"train_loss": -20.746015548706055, "global_step": 70179, "epoch": 845} {"train_loss": -20.876806259155273, "global_step": 70180, "epoch": 845} {"train_loss": -21.191104888916016, "global_step": 70181, "epoch": 845} {"train_loss": -20.920455932617188, "global_step": 70182, "epoch": 845} {"train_loss": -20.617368698120117, "global_step": 70183, "epoch": 845} {"train_loss": -20.675565719604492, "global_step": 70184, "epoch": 845} {"train_loss": -20.836761474609375, "global_step": 70185, "epoch": 845} {"train_loss": -20.708251953125, "global_step": 70186, "epoch": 845} {"train_loss": -20.846542358398438, "global_step": 70187, "epoch": 845} {"train_loss": -20.712461471557617, "global_step": 70188, "epoch": 845} {"train_loss": -20.590757369995117, "global_step": 70189, "epoch": 845} {"train_loss": -20.707916259765625, "global_step": 70190, "epoch": 845} {"train_loss": -21.165573120117188, "global_step": 70191, "epoch": 845} {"train_loss": -20.732038497924805, "global_step": 70192, "epoch": 845} {"train_loss": -20.527793884277344, "global_step": 70193, "epoch": 845} {"train_loss": -20.597272872924805, "global_step": 70194, "epoch": 845} {"train_loss": -20.779634475708008, "global_step": 70195, "epoch": 845} {"train_loss": -21.054813385009766, "global_step": 70196, "epoch": 845} {"train_loss": -20.67507553100586, "global_step": 70197, "epoch": 845} {"train_loss": -20.736236572265625, "global_step": 70198, "epoch": 845} {"train_loss": -21.162879943847656, "global_step": 70199, "epoch": 845} {"train_loss": -21.051374435424805, "global_step": 70200, "epoch": 845} {"train_loss": -21.022266387939453, "global_step": 70201, "epoch": 845} {"train_loss": -20.768299102783203, "global_step": 70202, "epoch": 845} {"train_loss": -21.038101196289062, "global_step": 70203, "epoch": 845} {"train_loss": -20.616188049316406, "global_step": 70204, "epoch": 845} {"train_loss": -20.860782623291016, "global_step": 70205, "epoch": 845} {"train_loss": -21.02161407470703, "global_step": 70206, "epoch": 845} {"train_loss": -20.899084091186523, "global_step": 70207, "epoch": 845} {"train_loss": -20.88736343383789, "global_step": 70208, "epoch": 845} {"train_loss": -21.105369567871094, "global_step": 70209, "epoch": 845} {"train_loss": -20.72928237915039, "global_step": 70210, "epoch": 845} {"train_loss": -21.434125900268555, "global_step": 70211, "epoch": 845} {"train_loss": -20.689151763916016, "global_step": 70212, "epoch": 845} {"train_loss": -20.34047508239746, "global_step": 70213, "epoch": 845} {"train_loss": -20.547441482543945, "global_step": 70214, "epoch": 845} {"train_loss": -20.485904693603516, "global_step": 70215, "epoch": 845} {"train_loss": -20.936399459838867, "global_step": 70216, "epoch": 845} {"train_loss": -20.8352113746735, "global_step": 70217, "epoch": 845, "val_loss": 5942663.5} {"train_loss": -20.600038528442383, "global_step": 70218, "epoch": 846} {"train_loss": -20.094953536987305, "global_step": 70219, "epoch": 846} {"train_loss": -20.571638107299805, "global_step": 70220, "epoch": 846} {"train_loss": -20.493955612182617, "global_step": 70221, "epoch": 846} {"train_loss": -20.66937828063965, "global_step": 70222, "epoch": 846} {"train_loss": -20.399477005004883, "global_step": 70223, "epoch": 846} {"train_loss": -20.68082618713379, "global_step": 70224, "epoch": 846} {"train_loss": -20.545124053955078, "global_step": 70225, "epoch": 846} {"train_loss": -20.44380760192871, "global_step": 70226, "epoch": 846} {"train_loss": -20.431310653686523, "global_step": 70227, "epoch": 846} {"train_loss": -20.605390548706055, "global_step": 70228, "epoch": 846} {"train_loss": -20.865888595581055, "global_step": 70229, "epoch": 846} {"train_loss": -20.443052291870117, "global_step": 70230, "epoch": 846} {"train_loss": -20.931015014648438, "global_step": 70231, "epoch": 846} {"train_loss": -20.379791259765625, "global_step": 70232, "epoch": 846} {"train_loss": -20.625425338745117, "global_step": 70233, "epoch": 846} {"train_loss": -20.45753288269043, "global_step": 70234, "epoch": 846} {"train_loss": -20.655498504638672, "global_step": 70235, "epoch": 846} {"train_loss": -20.53013038635254, "global_step": 70236, "epoch": 846} {"train_loss": -20.737979888916016, "global_step": 70237, "epoch": 846} {"train_loss": -20.128604888916016, "global_step": 70238, "epoch": 846} {"train_loss": -20.586835861206055, "global_step": 70239, "epoch": 846} {"train_loss": -20.681283950805664, "global_step": 70240, "epoch": 846} {"train_loss": -20.596454620361328, "global_step": 70241, "epoch": 846} {"train_loss": -20.69191551208496, "global_step": 70242, "epoch": 846} {"train_loss": -20.738845825195312, "global_step": 70243, "epoch": 846} {"train_loss": -20.443479537963867, "global_step": 70244, "epoch": 846} {"train_loss": -20.220046997070312, "global_step": 70245, "epoch": 846} {"train_loss": -20.356870651245117, "global_step": 70246, "epoch": 846} {"train_loss": -20.89767837524414, "global_step": 70247, "epoch": 846} {"train_loss": -20.384918212890625, "global_step": 70248, "epoch": 846} {"train_loss": -20.5794620513916, "global_step": 70249, "epoch": 846} {"train_loss": -21.22247886657715, "global_step": 70250, "epoch": 846} {"train_loss": -21.075538635253906, "global_step": 70251, "epoch": 846} {"train_loss": -20.860179901123047, "global_step": 70252, "epoch": 846} {"train_loss": -21.153278350830078, "global_step": 70253, "epoch": 846} {"train_loss": -20.706348419189453, "global_step": 70254, "epoch": 846} {"train_loss": -20.634136199951172, "global_step": 70255, "epoch": 846} {"train_loss": -20.67452049255371, "global_step": 70256, "epoch": 846} {"train_loss": -20.639354705810547, "global_step": 70257, "epoch": 846} {"train_loss": -20.95232582092285, "global_step": 70258, "epoch": 846} {"train_loss": -20.776165008544922, "global_step": 70259, "epoch": 846} {"train_loss": -21.12965965270996, "global_step": 70260, "epoch": 846} {"train_loss": -21.111644744873047, "global_step": 70261, "epoch": 846} {"train_loss": -20.908140182495117, "global_step": 70262, "epoch": 846} {"train_loss": -20.9921932220459, "global_step": 70263, "epoch": 846} {"train_loss": -20.86444664001465, "global_step": 70264, "epoch": 846} {"train_loss": -20.78246307373047, "global_step": 70265, "epoch": 846} {"train_loss": -20.40412712097168, "global_step": 70266, "epoch": 846} {"train_loss": -20.84415054321289, "global_step": 70267, "epoch": 846} {"train_loss": -20.828258514404297, "global_step": 70268, "epoch": 846} {"train_loss": -20.93959617614746, "global_step": 70269, "epoch": 846} {"train_loss": -20.9439640045166, "global_step": 70270, "epoch": 846} {"train_loss": -21.106203079223633, "global_step": 70271, "epoch": 846} {"train_loss": -20.935861587524414, "global_step": 70272, "epoch": 846} {"train_loss": -20.707265853881836, "global_step": 70273, "epoch": 846} {"train_loss": -21.2131290435791, "global_step": 70274, "epoch": 846} {"train_loss": -20.960315704345703, "global_step": 70275, "epoch": 846} {"train_loss": -20.70051383972168, "global_step": 70276, "epoch": 846} {"train_loss": -20.485736846923828, "global_step": 70277, "epoch": 846} {"train_loss": -20.650348663330078, "global_step": 70278, "epoch": 846} {"train_loss": -21.00026512145996, "global_step": 70279, "epoch": 846} {"train_loss": -20.799711227416992, "global_step": 70280, "epoch": 846} {"train_loss": -21.05384635925293, "global_step": 70281, "epoch": 846} {"train_loss": -21.209081649780273, "global_step": 70282, "epoch": 846} {"train_loss": -20.97470474243164, "global_step": 70283, "epoch": 846} {"train_loss": -20.958345413208008, "global_step": 70284, "epoch": 846} {"train_loss": -20.54601287841797, "global_step": 70285, "epoch": 846} {"train_loss": -20.696271896362305, "global_step": 70286, "epoch": 846} {"train_loss": -20.806425094604492, "global_step": 70287, "epoch": 846} {"train_loss": -20.955419540405273, "global_step": 70288, "epoch": 846} {"train_loss": -21.089542388916016, "global_step": 70289, "epoch": 846} {"train_loss": -20.885190963745117, "global_step": 70290, "epoch": 846} {"train_loss": -21.089824676513672, "global_step": 70291, "epoch": 846} {"train_loss": -20.689762115478516, "global_step": 70292, "epoch": 846} {"train_loss": -20.958221435546875, "global_step": 70293, "epoch": 846} {"train_loss": -20.791065216064453, "global_step": 70294, "epoch": 846} {"train_loss": -21.012187957763672, "global_step": 70295, "epoch": 846} {"train_loss": -20.900712966918945, "global_step": 70296, "epoch": 846} {"train_loss": -20.713329315185547, "global_step": 70297, "epoch": 846} {"train_loss": -20.62116813659668, "global_step": 70298, "epoch": 846} {"train_loss": -20.718534469604492, "global_step": 70299, "epoch": 846} {"train_loss": -20.734472389680793, "global_step": 70300, "epoch": 846, "val_loss": 5951530.5} {"train_loss": -20.651573181152344, "global_step": 70301, "epoch": 847} {"train_loss": -20.852815628051758, "global_step": 70302, "epoch": 847} {"train_loss": -20.468061447143555, "global_step": 70303, "epoch": 847} {"train_loss": -20.53533363342285, "global_step": 70304, "epoch": 847} {"train_loss": -19.98756980895996, "global_step": 70305, "epoch": 847} {"train_loss": -20.811965942382812, "global_step": 70306, "epoch": 847} {"train_loss": -20.68982696533203, "global_step": 70307, "epoch": 847} {"train_loss": -20.591014862060547, "global_step": 70308, "epoch": 847} {"train_loss": -21.00592041015625, "global_step": 70309, "epoch": 847} {"train_loss": -20.615497589111328, "global_step": 70310, "epoch": 847} {"train_loss": -20.92110824584961, "global_step": 70311, "epoch": 847} {"train_loss": -21.05044174194336, "global_step": 70312, "epoch": 847} {"train_loss": -20.737497329711914, "global_step": 70313, "epoch": 847} {"train_loss": -21.042043685913086, "global_step": 70314, "epoch": 847} {"train_loss": -20.922109603881836, "global_step": 70315, "epoch": 847} {"train_loss": -21.192461013793945, "global_step": 70316, "epoch": 847} {"train_loss": -21.0067195892334, "global_step": 70317, "epoch": 847} {"train_loss": -21.013504028320312, "global_step": 70318, "epoch": 847} {"train_loss": -20.70429801940918, "global_step": 70319, "epoch": 847} {"train_loss": -21.226333618164062, "global_step": 70320, "epoch": 847} {"train_loss": -21.1162109375, "global_step": 70321, "epoch": 847} {"train_loss": -20.97212028503418, "global_step": 70322, "epoch": 847} {"train_loss": -20.76295280456543, "global_step": 70323, "epoch": 847} {"train_loss": -20.880762100219727, "global_step": 70324, "epoch": 847} {"train_loss": -21.35450553894043, "global_step": 70325, "epoch": 847} {"train_loss": -21.014284133911133, "global_step": 70326, "epoch": 847} {"train_loss": -20.8668270111084, "global_step": 70327, "epoch": 847} {"train_loss": -20.665924072265625, "global_step": 70328, "epoch": 847} {"train_loss": -20.674596786499023, "global_step": 70329, "epoch": 847} {"train_loss": -20.628833770751953, "global_step": 70330, "epoch": 847} {"train_loss": -20.83974266052246, "global_step": 70331, "epoch": 847} {"train_loss": -20.92703628540039, "global_step": 70332, "epoch": 847} {"train_loss": -20.894794464111328, "global_step": 70333, "epoch": 847} {"train_loss": -20.718595504760742, "global_step": 70334, "epoch": 847} {"train_loss": -20.5180606842041, "global_step": 70335, "epoch": 847} {"train_loss": -20.737756729125977, "global_step": 70336, "epoch": 847} {"train_loss": -20.709575653076172, "global_step": 70337, "epoch": 847} {"train_loss": -20.91162109375, "global_step": 70338, "epoch": 847} {"train_loss": -20.598800659179688, "global_step": 70339, "epoch": 847} {"train_loss": -20.720937728881836, "global_step": 70340, "epoch": 847} {"train_loss": -20.722850799560547, "global_step": 70341, "epoch": 847} {"train_loss": -21.135902404785156, "global_step": 70342, "epoch": 847} {"train_loss": -21.211944580078125, "global_step": 70343, "epoch": 847} {"train_loss": -20.91193962097168, "global_step": 70344, "epoch": 847} {"train_loss": -20.701343536376953, "global_step": 70345, "epoch": 847} {"train_loss": -20.90071678161621, "global_step": 70346, "epoch": 847} {"train_loss": -20.995410919189453, "global_step": 70347, "epoch": 847} {"train_loss": -20.950775146484375, "global_step": 70348, "epoch": 847} {"train_loss": -20.752731323242188, "global_step": 70349, "epoch": 847} {"train_loss": -20.466814041137695, "global_step": 70350, "epoch": 847} {"train_loss": -20.718189239501953, "global_step": 70351, "epoch": 847} {"train_loss": -21.439746856689453, "global_step": 70352, "epoch": 847} {"train_loss": -20.70826530456543, "global_step": 70353, "epoch": 847} {"train_loss": -20.722265243530273, "global_step": 70354, "epoch": 847} {"train_loss": -20.712894439697266, "global_step": 70355, "epoch": 847} {"train_loss": -20.68520736694336, "global_step": 70356, "epoch": 847} {"train_loss": -20.412769317626953, "global_step": 70357, "epoch": 847} {"train_loss": -20.705652236938477, "global_step": 70358, "epoch": 847} {"train_loss": -20.600915908813477, "global_step": 70359, "epoch": 847} {"train_loss": -20.6947021484375, "global_step": 70360, "epoch": 847} {"train_loss": -21.36039161682129, "global_step": 70361, "epoch": 847} {"train_loss": -20.55909538269043, "global_step": 70362, "epoch": 847} {"train_loss": -20.754796981811523, "global_step": 70363, "epoch": 847} {"train_loss": -20.906726837158203, "global_step": 70364, "epoch": 847} {"train_loss": -20.692472457885742, "global_step": 70365, "epoch": 847} {"train_loss": -20.791196823120117, "global_step": 70366, "epoch": 847} {"train_loss": -20.537351608276367, "global_step": 70367, "epoch": 847} {"train_loss": -20.963848114013672, "global_step": 70368, "epoch": 847} {"train_loss": -20.814184188842773, "global_step": 70369, "epoch": 847} {"train_loss": -21.12968635559082, "global_step": 70370, "epoch": 847} {"train_loss": -20.7242431640625, "global_step": 70371, "epoch": 847} {"train_loss": -20.709720611572266, "global_step": 70372, "epoch": 847} {"train_loss": -20.918149948120117, "global_step": 70373, "epoch": 847} {"train_loss": -20.781864166259766, "global_step": 70374, "epoch": 847} {"train_loss": -20.546689987182617, "global_step": 70375, "epoch": 847} {"train_loss": -21.136215209960938, "global_step": 70376, "epoch": 847} {"train_loss": -20.726104736328125, "global_step": 70377, "epoch": 847} {"train_loss": -21.130220413208008, "global_step": 70378, "epoch": 847} {"train_loss": -20.90522575378418, "global_step": 70379, "epoch": 847} {"train_loss": -20.527759552001953, "global_step": 70380, "epoch": 847} {"train_loss": -20.929338455200195, "global_step": 70381, "epoch": 847} {"train_loss": -20.73194694519043, "global_step": 70382, "epoch": 847} {"train_loss": -20.817163858068994, "global_step": 70383, "epoch": 847, "val_loss": 6207769.0} {"train_loss": -20.938074111938477, "global_step": 70384, "epoch": 848} {"train_loss": -20.633817672729492, "global_step": 70385, "epoch": 848} {"train_loss": -21.03383445739746, "global_step": 70386, "epoch": 848} {"train_loss": -20.585859298706055, "global_step": 70387, "epoch": 848} {"train_loss": -20.746444702148438, "global_step": 70388, "epoch": 848} {"train_loss": -20.905282974243164, "global_step": 70389, "epoch": 848} {"train_loss": -20.7972469329834, "global_step": 70390, "epoch": 848} {"train_loss": -20.69662857055664, "global_step": 70391, "epoch": 848} {"train_loss": -20.340238571166992, "global_step": 70392, "epoch": 848} {"train_loss": -20.60996437072754, "global_step": 70393, "epoch": 848} {"train_loss": -20.999311447143555, "global_step": 70394, "epoch": 848} {"train_loss": -20.83586311340332, "global_step": 70395, "epoch": 848} {"train_loss": -21.033363342285156, "global_step": 70396, "epoch": 848} {"train_loss": -20.83499526977539, "global_step": 70397, "epoch": 848} {"train_loss": -20.678287506103516, "global_step": 70398, "epoch": 848} {"train_loss": -21.031694412231445, "global_step": 70399, "epoch": 848} {"train_loss": -20.6981258392334, "global_step": 70400, "epoch": 848} {"train_loss": -20.7362003326416, "global_step": 70401, "epoch": 848} {"train_loss": -20.585378646850586, "global_step": 70402, "epoch": 848} {"train_loss": -20.793109893798828, "global_step": 70403, "epoch": 848} {"train_loss": -20.891727447509766, "global_step": 70404, "epoch": 848} {"train_loss": -20.3520565032959, "global_step": 70405, "epoch": 848} {"train_loss": -20.733678817749023, "global_step": 70406, "epoch": 848} {"train_loss": -21.082792282104492, "global_step": 70407, "epoch": 848} {"train_loss": -21.1687068939209, "global_step": 70408, "epoch": 848} {"train_loss": -21.154748916625977, "global_step": 70409, "epoch": 848} {"train_loss": -20.825210571289062, "global_step": 70410, "epoch": 848} {"train_loss": -21.004446029663086, "global_step": 70411, "epoch": 848} {"train_loss": -20.839908599853516, "global_step": 70412, "epoch": 848} {"train_loss": -20.776105880737305, "global_step": 70413, "epoch": 848} {"train_loss": -21.05862808227539, "global_step": 70414, "epoch": 848} {"train_loss": -21.061378479003906, "global_step": 70415, "epoch": 848} {"train_loss": -20.508703231811523, "global_step": 70416, "epoch": 848} {"train_loss": -20.80847930908203, "global_step": 70417, "epoch": 848} {"train_loss": -20.86879539489746, "global_step": 70418, "epoch": 848} {"train_loss": -20.753000259399414, "global_step": 70419, "epoch": 848} {"train_loss": -20.953044891357422, "global_step": 70420, "epoch": 848} {"train_loss": -20.886798858642578, "global_step": 70421, "epoch": 848} {"train_loss": -21.02838706970215, "global_step": 70422, "epoch": 848} {"train_loss": -20.575042724609375, "global_step": 70423, "epoch": 848} {"train_loss": -20.63273048400879, "global_step": 70424, "epoch": 848} {"train_loss": -20.40475082397461, "global_step": 70425, "epoch": 848} {"train_loss": -20.916160583496094, "global_step": 70426, "epoch": 848} {"train_loss": -20.996755599975586, "global_step": 70427, "epoch": 848} {"train_loss": -20.359771728515625, "global_step": 70428, "epoch": 848} {"train_loss": -20.514606475830078, "global_step": 70429, "epoch": 848} {"train_loss": -20.246484756469727, "global_step": 70430, "epoch": 848} {"train_loss": -20.486143112182617, "global_step": 70431, "epoch": 848} {"train_loss": -20.47865867614746, "global_step": 70432, "epoch": 848} {"train_loss": -20.415557861328125, "global_step": 70433, "epoch": 848} {"train_loss": -20.917638778686523, "global_step": 70434, "epoch": 848} {"train_loss": -20.6937313079834, "global_step": 70435, "epoch": 848} {"train_loss": -20.775699615478516, "global_step": 70436, "epoch": 848} {"train_loss": -20.810056686401367, "global_step": 70437, "epoch": 848} {"train_loss": -20.773420333862305, "global_step": 70438, "epoch": 848} {"train_loss": -20.516942977905273, "global_step": 70439, "epoch": 848} {"train_loss": -20.618040084838867, "global_step": 70440, "epoch": 848} {"train_loss": -20.695865631103516, "global_step": 70441, "epoch": 848} {"train_loss": -20.750829696655273, "global_step": 70442, "epoch": 848} {"train_loss": -20.775388717651367, "global_step": 70443, "epoch": 848} {"train_loss": -21.008750915527344, "global_step": 70444, "epoch": 848} {"train_loss": -20.511085510253906, "global_step": 70445, "epoch": 848} {"train_loss": -20.77113914489746, "global_step": 70446, "epoch": 848} {"train_loss": -20.871965408325195, "global_step": 70447, "epoch": 848} {"train_loss": -20.454904556274414, "global_step": 70448, "epoch": 848} {"train_loss": -20.830673217773438, "global_step": 70449, "epoch": 848} {"train_loss": -20.843313217163086, "global_step": 70450, "epoch": 848} {"train_loss": -20.81737518310547, "global_step": 70451, "epoch": 848} {"train_loss": -20.68426513671875, "global_step": 70452, "epoch": 848} {"train_loss": -20.727418899536133, "global_step": 70453, "epoch": 848} {"train_loss": -20.60110092163086, "global_step": 70454, "epoch": 848} {"train_loss": -20.982419967651367, "global_step": 70455, "epoch": 848} {"train_loss": -20.95200538635254, "global_step": 70456, "epoch": 848} {"train_loss": -20.991840362548828, "global_step": 70457, "epoch": 848} {"train_loss": -20.662715911865234, "global_step": 70458, "epoch": 848} {"train_loss": -20.375869750976562, "global_step": 70459, "epoch": 848} {"train_loss": -20.694660186767578, "global_step": 70460, "epoch": 848} {"train_loss": -20.921934127807617, "global_step": 70461, "epoch": 848} {"train_loss": -20.81170082092285, "global_step": 70462, "epoch": 848} {"train_loss": -20.465070724487305, "global_step": 70463, "epoch": 848} {"train_loss": -20.770288467407227, "global_step": 70464, "epoch": 848} {"train_loss": -20.76752281188965, "global_step": 70465, "epoch": 848} {"train_loss": -20.746195069278578, "global_step": 70466, "epoch": 848, "val_loss": 6057483.0} {"train_loss": -20.540281295776367, "global_step": 70467, "epoch": 849} {"train_loss": -20.631689071655273, "global_step": 70468, "epoch": 849} {"train_loss": -20.695119857788086, "global_step": 70469, "epoch": 849} {"train_loss": -20.999250411987305, "global_step": 70470, "epoch": 849} {"train_loss": -20.845766067504883, "global_step": 70471, "epoch": 849} {"train_loss": -20.821075439453125, "global_step": 70472, "epoch": 849} {"train_loss": -20.601224899291992, "global_step": 70473, "epoch": 849} {"train_loss": -20.72085189819336, "global_step": 70474, "epoch": 849} {"train_loss": -20.974964141845703, "global_step": 70475, "epoch": 849} {"train_loss": -20.775775909423828, "global_step": 70476, "epoch": 849} {"train_loss": -20.778154373168945, "global_step": 70477, "epoch": 849} {"train_loss": -20.8582763671875, "global_step": 70478, "epoch": 849} {"train_loss": -20.797311782836914, "global_step": 70479, "epoch": 849} {"train_loss": -20.59056282043457, "global_step": 70480, "epoch": 849} {"train_loss": -20.864240646362305, "global_step": 70481, "epoch": 849} {"train_loss": -20.783464431762695, "global_step": 70482, "epoch": 849} {"train_loss": -20.581777572631836, "global_step": 70483, "epoch": 849} {"train_loss": -20.885746002197266, "global_step": 70484, "epoch": 849} {"train_loss": -20.871524810791016, "global_step": 70485, "epoch": 849} {"train_loss": -20.56658172607422, "global_step": 70486, "epoch": 849} {"train_loss": -20.601713180541992, "global_step": 70487, "epoch": 849} {"train_loss": -20.504825592041016, "global_step": 70488, "epoch": 849} {"train_loss": -20.863744735717773, "global_step": 70489, "epoch": 849} {"train_loss": -20.85788345336914, "global_step": 70490, "epoch": 849} {"train_loss": -20.63729476928711, "global_step": 70491, "epoch": 849} {"train_loss": -20.628847122192383, "global_step": 70492, "epoch": 849} {"train_loss": -21.022565841674805, "global_step": 70493, "epoch": 849} {"train_loss": -20.930835723876953, "global_step": 70494, "epoch": 849} {"train_loss": -20.748258590698242, "global_step": 70495, "epoch": 849} {"train_loss": -20.9488468170166, "global_step": 70496, "epoch": 849} {"train_loss": -21.169891357421875, "global_step": 70497, "epoch": 849} {"train_loss": -20.546117782592773, "global_step": 70498, "epoch": 849} {"train_loss": -20.980520248413086, "global_step": 70499, "epoch": 849} {"train_loss": -21.343568801879883, "global_step": 70500, "epoch": 849} {"train_loss": -20.666446685791016, "global_step": 70501, "epoch": 849} {"train_loss": -20.965225219726562, "global_step": 70502, "epoch": 849} {"train_loss": -20.853971481323242, "global_step": 70503, "epoch": 849} {"train_loss": -20.702686309814453, "global_step": 70504, "epoch": 849} {"train_loss": -20.869789123535156, "global_step": 70505, "epoch": 849} {"train_loss": -20.87391471862793, "global_step": 70506, "epoch": 849} {"train_loss": -20.91707992553711, "global_step": 70507, "epoch": 849} {"train_loss": -20.952552795410156, "global_step": 70508, "epoch": 849} {"train_loss": -20.869657516479492, "global_step": 70509, "epoch": 849} {"train_loss": -20.74200439453125, "global_step": 70510, "epoch": 849} {"train_loss": -20.817197799682617, "global_step": 70511, "epoch": 849} {"train_loss": -20.61868667602539, "global_step": 70512, "epoch": 849} {"train_loss": -20.734724044799805, "global_step": 70513, "epoch": 849} {"train_loss": -20.786340713500977, "global_step": 70514, "epoch": 849} {"train_loss": -21.165904998779297, "global_step": 70515, "epoch": 849} {"train_loss": -20.554086685180664, "global_step": 70516, "epoch": 849} {"train_loss": -20.732559204101562, "global_step": 70517, "epoch": 849} {"train_loss": -20.71059799194336, "global_step": 70518, "epoch": 849} {"train_loss": -20.55960464477539, "global_step": 70519, "epoch": 849} {"train_loss": -21.014812469482422, "global_step": 70520, "epoch": 849} {"train_loss": -21.020151138305664, "global_step": 70521, "epoch": 849} {"train_loss": -21.00258445739746, "global_step": 70522, "epoch": 849} {"train_loss": -20.785184860229492, "global_step": 70523, "epoch": 849} {"train_loss": -21.226106643676758, "global_step": 70524, "epoch": 849} {"train_loss": -20.396337509155273, "global_step": 70525, "epoch": 849} {"train_loss": -20.908926010131836, "global_step": 70526, "epoch": 849} {"train_loss": -21.0076961517334, "global_step": 70527, "epoch": 849} {"train_loss": -20.671222686767578, "global_step": 70528, "epoch": 849} {"train_loss": -20.800573348999023, "global_step": 70529, "epoch": 849} {"train_loss": -21.040054321289062, "global_step": 70530, "epoch": 849} {"train_loss": -20.759214401245117, "global_step": 70531, "epoch": 849} {"train_loss": -20.728391647338867, "global_step": 70532, "epoch": 849} {"train_loss": -20.77251625061035, "global_step": 70533, "epoch": 849} {"train_loss": -20.683629989624023, "global_step": 70534, "epoch": 849} {"train_loss": -20.719385147094727, "global_step": 70535, "epoch": 849} {"train_loss": -20.510854721069336, "global_step": 70536, "epoch": 849} {"train_loss": -21.0993709564209, "global_step": 70537, "epoch": 849} {"train_loss": -21.066787719726562, "global_step": 70538, "epoch": 849} {"train_loss": -20.677902221679688, "global_step": 70539, "epoch": 849} {"train_loss": -20.46555519104004, "global_step": 70540, "epoch": 849} {"train_loss": -20.958528518676758, "global_step": 70541, "epoch": 849} {"train_loss": -20.85502815246582, "global_step": 70542, "epoch": 849} {"train_loss": -21.006704330444336, "global_step": 70543, "epoch": 849} {"train_loss": -20.84586524963379, "global_step": 70544, "epoch": 849} {"train_loss": -20.723142623901367, "global_step": 70545, "epoch": 849} {"train_loss": -21.26755142211914, "global_step": 70546, "epoch": 849} {"train_loss": -21.01810646057129, "global_step": 70547, "epoch": 849} {"train_loss": -20.80689811706543, "global_step": 70548, "epoch": 849} {"train_loss": -20.814518985978093, "global_step": 70549, "epoch": 849, "val_loss": 5998624.0} {"train_loss": -20.975391387939453, "global_step": 70550, "epoch": 850} {"train_loss": -20.741657257080078, "global_step": 70551, "epoch": 850} {"train_loss": -20.346593856811523, "global_step": 70552, "epoch": 850} {"train_loss": -21.129179000854492, "global_step": 70553, "epoch": 850} {"train_loss": -20.53385353088379, "global_step": 70554, "epoch": 850} {"train_loss": -20.970993041992188, "global_step": 70555, "epoch": 850} {"train_loss": -20.884763717651367, "global_step": 70556, "epoch": 850} {"train_loss": -20.516605377197266, "global_step": 70557, "epoch": 850} {"train_loss": -20.623693466186523, "global_step": 70558, "epoch": 850} {"train_loss": -20.82925033569336, "global_step": 70559, "epoch": 850} {"train_loss": -20.809858322143555, "global_step": 70560, "epoch": 850} {"train_loss": -20.621688842773438, "global_step": 70561, "epoch": 850} {"train_loss": -20.887310028076172, "global_step": 70562, "epoch": 850} {"train_loss": -20.717365264892578, "global_step": 70563, "epoch": 850} {"train_loss": -21.144729614257812, "global_step": 70564, "epoch": 850} {"train_loss": -20.95290184020996, "global_step": 70565, "epoch": 850} {"train_loss": -20.699447631835938, "global_step": 70566, "epoch": 850} {"train_loss": -20.946945190429688, "global_step": 70567, "epoch": 850} {"train_loss": -21.022607803344727, "global_step": 70568, "epoch": 850} {"train_loss": -20.84479331970215, "global_step": 70569, "epoch": 850} {"train_loss": -20.77579689025879, "global_step": 70570, "epoch": 850} {"train_loss": -20.79693031311035, "global_step": 70571, "epoch": 850} {"train_loss": -20.53944206237793, "global_step": 70572, "epoch": 850} {"train_loss": -20.692174911499023, "global_step": 70573, "epoch": 850} {"train_loss": -21.206655502319336, "global_step": 70574, "epoch": 850} {"train_loss": -20.801633834838867, "global_step": 70575, "epoch": 850} {"train_loss": -21.069751739501953, "global_step": 70576, "epoch": 850} {"train_loss": -20.73170280456543, "global_step": 70577, "epoch": 850} {"train_loss": -20.632471084594727, "global_step": 70578, "epoch": 850} {"train_loss": -20.96193504333496, "global_step": 70579, "epoch": 850} {"train_loss": -20.78244400024414, "global_step": 70580, "epoch": 850} {"train_loss": -20.487672805786133, "global_step": 70581, "epoch": 850} {"train_loss": -21.028287887573242, "global_step": 70582, "epoch": 850} {"train_loss": -20.70476531982422, "global_step": 70583, "epoch": 850} {"train_loss": -20.899267196655273, "global_step": 70584, "epoch": 850} {"train_loss": -21.0872859954834, "global_step": 70585, "epoch": 850} {"train_loss": -20.99266815185547, "global_step": 70586, "epoch": 850} {"train_loss": -21.030492782592773, "global_step": 70587, "epoch": 850} {"train_loss": -21.260223388671875, "global_step": 70588, "epoch": 850} {"train_loss": -20.783449172973633, "global_step": 70589, "epoch": 850} {"train_loss": -20.74185562133789, "global_step": 70590, "epoch": 850} {"train_loss": -21.1441707611084, "global_step": 70591, "epoch": 850} {"train_loss": -21.031038284301758, "global_step": 70592, "epoch": 850} {"train_loss": -21.238317489624023, "global_step": 70593, "epoch": 850} {"train_loss": -20.960620880126953, "global_step": 70594, "epoch": 850} {"train_loss": -20.526382446289062, "global_step": 70595, "epoch": 850} {"train_loss": -20.84097671508789, "global_step": 70596, "epoch": 850} {"train_loss": -20.853696823120117, "global_step": 70597, "epoch": 850} {"train_loss": -20.48567008972168, "global_step": 70598, "epoch": 850} {"train_loss": -21.28285026550293, "global_step": 70599, "epoch": 850} {"train_loss": -21.093854904174805, "global_step": 70600, "epoch": 850} {"train_loss": -20.99469566345215, "global_step": 70601, "epoch": 850} {"train_loss": -20.73052978515625, "global_step": 70602, "epoch": 850} {"train_loss": -20.51706314086914, "global_step": 70603, "epoch": 850} {"train_loss": -20.479511260986328, "global_step": 70604, "epoch": 850} {"train_loss": -20.68934440612793, "global_step": 70605, "epoch": 850} {"train_loss": -20.587711334228516, "global_step": 70606, "epoch": 850} {"train_loss": -20.827402114868164, "global_step": 70607, "epoch": 850} {"train_loss": -20.80836296081543, "global_step": 70608, "epoch": 850} {"train_loss": -20.95819091796875, "global_step": 70609, "epoch": 850} {"train_loss": -20.762353897094727, "global_step": 70610, "epoch": 850} {"train_loss": -20.75807762145996, "global_step": 70611, "epoch": 850} {"train_loss": -20.874982833862305, "global_step": 70612, "epoch": 850} {"train_loss": -21.039865493774414, "global_step": 70613, "epoch": 850} {"train_loss": -20.916805267333984, "global_step": 70614, "epoch": 850} {"train_loss": -21.11632537841797, "global_step": 70615, "epoch": 850} {"train_loss": -20.76161003112793, "global_step": 70616, "epoch": 850} {"train_loss": -20.78741455078125, "global_step": 70617, "epoch": 850} {"train_loss": -21.02957534790039, "global_step": 70618, "epoch": 850} {"train_loss": -21.07156753540039, "global_step": 70619, "epoch": 850} {"train_loss": -21.1362361907959, "global_step": 70620, "epoch": 850} {"train_loss": -20.916059494018555, "global_step": 70621, "epoch": 850} {"train_loss": -20.569860458374023, "global_step": 70622, "epoch": 850} {"train_loss": -20.95964241027832, "global_step": 70623, "epoch": 850} {"train_loss": -20.858814239501953, "global_step": 70624, "epoch": 850} {"train_loss": -20.92880630493164, "global_step": 70625, "epoch": 850} {"train_loss": -20.695240020751953, "global_step": 70626, "epoch": 850} {"train_loss": -21.112464904785156, "global_step": 70627, "epoch": 850} {"train_loss": -20.608129501342773, "global_step": 70628, "epoch": 850} {"train_loss": -20.733243942260742, "global_step": 70629, "epoch": 850} {"train_loss": -20.842756271362305, "global_step": 70630, "epoch": 850} {"train_loss": -20.52919578552246, "global_step": 70631, "epoch": 850} {"train_loss": -20.837244033813477, "global_step": 70632, "epoch": 850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6063430.0} {"train_loss": -20.123321533203125, "global_step": 70633, "epoch": 851} {"train_loss": -19.93886375427246, "global_step": 70634, "epoch": 851} {"train_loss": -20.096616744995117, "global_step": 70635, "epoch": 851} {"train_loss": -20.5440731048584, "global_step": 70636, "epoch": 851} {"train_loss": -20.10856056213379, "global_step": 70637, "epoch": 851} {"train_loss": -20.420621871948242, "global_step": 70638, "epoch": 851} {"train_loss": -20.845388412475586, "global_step": 70639, "epoch": 851} {"train_loss": -20.390785217285156, "global_step": 70640, "epoch": 851} {"train_loss": -21.02020263671875, "global_step": 70641, "epoch": 851} {"train_loss": -20.675363540649414, "global_step": 70642, "epoch": 851} {"train_loss": -20.494911193847656, "global_step": 70643, "epoch": 851} {"train_loss": -20.325321197509766, "global_step": 70644, "epoch": 851} {"train_loss": -20.89400291442871, "global_step": 70645, "epoch": 851} {"train_loss": -20.65340805053711, "global_step": 70646, "epoch": 851} {"train_loss": -20.594213485717773, "global_step": 70647, "epoch": 851} {"train_loss": -20.535871505737305, "global_step": 70648, "epoch": 851} {"train_loss": -21.07286834716797, "global_step": 70649, "epoch": 851} {"train_loss": -20.644826889038086, "global_step": 70650, "epoch": 851} {"train_loss": -21.223295211791992, "global_step": 70651, "epoch": 851} {"train_loss": -20.689346313476562, "global_step": 70652, "epoch": 851} {"train_loss": -20.868215560913086, "global_step": 70653, "epoch": 851} {"train_loss": -20.97144889831543, "global_step": 70654, "epoch": 851} {"train_loss": -20.86067008972168, "global_step": 70655, "epoch": 851} {"train_loss": -20.820194244384766, "global_step": 70656, "epoch": 851} {"train_loss": -20.87599754333496, "global_step": 70657, "epoch": 851} {"train_loss": -20.8872127532959, "global_step": 70658, "epoch": 851} {"train_loss": -20.584264755249023, "global_step": 70659, "epoch": 851} {"train_loss": -20.73761749267578, "global_step": 70660, "epoch": 851} {"train_loss": -21.092252731323242, "global_step": 70661, "epoch": 851} {"train_loss": -20.898714065551758, "global_step": 70662, "epoch": 851} {"train_loss": -20.565092086791992, "global_step": 70663, "epoch": 851} {"train_loss": -20.646488189697266, "global_step": 70664, "epoch": 851} {"train_loss": -21.037017822265625, "global_step": 70665, "epoch": 851} {"train_loss": -20.594940185546875, "global_step": 70666, "epoch": 851} {"train_loss": -20.786367416381836, "global_step": 70667, "epoch": 851} {"train_loss": -20.839712142944336, "global_step": 70668, "epoch": 851} {"train_loss": -20.829879760742188, "global_step": 70669, "epoch": 851} {"train_loss": -20.766069412231445, "global_step": 70670, "epoch": 851} {"train_loss": -21.316184997558594, "global_step": 70671, "epoch": 851} {"train_loss": -20.462553024291992, "global_step": 70672, "epoch": 851} {"train_loss": -21.21474266052246, "global_step": 70673, "epoch": 851} {"train_loss": -21.16635513305664, "global_step": 70674, "epoch": 851} {"train_loss": -20.90241813659668, "global_step": 70675, "epoch": 851} {"train_loss": -20.949920654296875, "global_step": 70676, "epoch": 851} {"train_loss": -20.82136344909668, "global_step": 70677, "epoch": 851} {"train_loss": -21.070154190063477, "global_step": 70678, "epoch": 851} {"train_loss": -20.722204208374023, "global_step": 70679, "epoch": 851} {"train_loss": -21.103422164916992, "global_step": 70680, "epoch": 851} {"train_loss": -20.650379180908203, "global_step": 70681, "epoch": 851} {"train_loss": -21.015487670898438, "global_step": 70682, "epoch": 851} {"train_loss": -20.632911682128906, "global_step": 70683, "epoch": 851} {"train_loss": -21.126371383666992, "global_step": 70684, "epoch": 851} {"train_loss": -20.873157501220703, "global_step": 70685, "epoch": 851} {"train_loss": -20.994064331054688, "global_step": 70686, "epoch": 851} {"train_loss": -21.13098907470703, "global_step": 70687, "epoch": 851} {"train_loss": -21.191316604614258, "global_step": 70688, "epoch": 851} {"train_loss": -20.838741302490234, "global_step": 70689, "epoch": 851} {"train_loss": -21.084836959838867, "global_step": 70690, "epoch": 851} {"train_loss": -20.933368682861328, "global_step": 70691, "epoch": 851} {"train_loss": -20.672544479370117, "global_step": 70692, "epoch": 851} {"train_loss": -20.931596755981445, "global_step": 70693, "epoch": 851} {"train_loss": -20.632213592529297, "global_step": 70694, "epoch": 851} {"train_loss": -20.49847412109375, "global_step": 70695, "epoch": 851} {"train_loss": -20.719385147094727, "global_step": 70696, "epoch": 851} {"train_loss": -21.088214874267578, "global_step": 70697, "epoch": 851} {"train_loss": -20.831228256225586, "global_step": 70698, "epoch": 851} {"train_loss": -20.965557098388672, "global_step": 70699, "epoch": 851} {"train_loss": -20.72352409362793, "global_step": 70700, "epoch": 851} {"train_loss": -20.722402572631836, "global_step": 70701, "epoch": 851} {"train_loss": -20.694299697875977, "global_step": 70702, "epoch": 851} {"train_loss": -20.5427303314209, "global_step": 70703, "epoch": 851} {"train_loss": -21.220693588256836, "global_step": 70704, "epoch": 851} {"train_loss": -21.143980026245117, "global_step": 70705, "epoch": 851} {"train_loss": -20.638309478759766, "global_step": 70706, "epoch": 851} {"train_loss": -20.98457908630371, "global_step": 70707, "epoch": 851} {"train_loss": -20.822919845581055, "global_step": 70708, "epoch": 851} {"train_loss": -20.733022689819336, "global_step": 70709, "epoch": 851} {"train_loss": -21.02541160583496, "global_step": 70710, "epoch": 851} {"train_loss": -21.1866397857666, "global_step": 70711, "epoch": 851} {"train_loss": -21.028818130493164, "global_step": 70712, "epoch": 851} {"train_loss": -20.658966064453125, "global_step": 70713, "epoch": 851} {"train_loss": -20.84682273864746, "global_step": 70714, "epoch": 851} {"train_loss": -20.805115228675934, "global_step": 70715, "epoch": 851, "val_loss": 5894373.0} {"train_loss": -20.047332763671875, "global_step": 70716, "epoch": 852} {"train_loss": -19.869827270507812, "global_step": 70717, "epoch": 852} {"train_loss": -20.310791015625, "global_step": 70718, "epoch": 852} {"train_loss": -20.176137924194336, "global_step": 70719, "epoch": 852} {"train_loss": -20.425506591796875, "global_step": 70720, "epoch": 852} {"train_loss": -20.875988006591797, "global_step": 70721, "epoch": 852} {"train_loss": -20.114521026611328, "global_step": 70722, "epoch": 852} {"train_loss": -20.539886474609375, "global_step": 70723, "epoch": 852} {"train_loss": -20.57131004333496, "global_step": 70724, "epoch": 852} {"train_loss": -20.5635986328125, "global_step": 70725, "epoch": 852} {"train_loss": -20.177871704101562, "global_step": 70726, "epoch": 852} {"train_loss": -20.662574768066406, "global_step": 70727, "epoch": 852} {"train_loss": -20.6778564453125, "global_step": 70728, "epoch": 852} {"train_loss": -20.357959747314453, "global_step": 70729, "epoch": 852} {"train_loss": -20.49226188659668, "global_step": 70730, "epoch": 852} {"train_loss": -20.54446029663086, "global_step": 70731, "epoch": 852} {"train_loss": -20.490049362182617, "global_step": 70732, "epoch": 852} {"train_loss": -20.961183547973633, "global_step": 70733, "epoch": 852} {"train_loss": -20.92839241027832, "global_step": 70734, "epoch": 852} {"train_loss": -20.679059982299805, "global_step": 70735, "epoch": 852} {"train_loss": -21.288204193115234, "global_step": 70736, "epoch": 852} {"train_loss": -20.677515029907227, "global_step": 70737, "epoch": 852} {"train_loss": -21.12586784362793, "global_step": 70738, "epoch": 852} {"train_loss": -20.595367431640625, "global_step": 70739, "epoch": 852} {"train_loss": -20.696640014648438, "global_step": 70740, "epoch": 852} {"train_loss": -20.760526657104492, "global_step": 70741, "epoch": 852} {"train_loss": -20.63401985168457, "global_step": 70742, "epoch": 852} {"train_loss": -20.672565460205078, "global_step": 70743, "epoch": 852} {"train_loss": -20.949737548828125, "global_step": 70744, "epoch": 852} {"train_loss": -20.585058212280273, "global_step": 70745, "epoch": 852} {"train_loss": -20.8818302154541, "global_step": 70746, "epoch": 852} {"train_loss": -20.599952697753906, "global_step": 70747, "epoch": 852} {"train_loss": -20.71601676940918, "global_step": 70748, "epoch": 852} {"train_loss": -20.873245239257812, "global_step": 70749, "epoch": 852} {"train_loss": -20.466989517211914, "global_step": 70750, "epoch": 852} {"train_loss": -20.50645637512207, "global_step": 70751, "epoch": 852} {"train_loss": -20.74845314025879, "global_step": 70752, "epoch": 852} {"train_loss": -20.74337387084961, "global_step": 70753, "epoch": 852} {"train_loss": -20.701629638671875, "global_step": 70754, "epoch": 852} {"train_loss": -20.813907623291016, "global_step": 70755, "epoch": 852} {"train_loss": -20.513591766357422, "global_step": 70756, "epoch": 852} {"train_loss": -20.75773048400879, "global_step": 70757, "epoch": 852} {"train_loss": -20.69510841369629, "global_step": 70758, "epoch": 852} {"train_loss": -21.041601181030273, "global_step": 70759, "epoch": 852} {"train_loss": -20.692317962646484, "global_step": 70760, "epoch": 852} {"train_loss": -20.762149810791016, "global_step": 70761, "epoch": 852} {"train_loss": -20.836305618286133, "global_step": 70762, "epoch": 852} {"train_loss": -20.591421127319336, "global_step": 70763, "epoch": 852} {"train_loss": -20.67436408996582, "global_step": 70764, "epoch": 852} {"train_loss": -21.046842575073242, "global_step": 70765, "epoch": 852} {"train_loss": -20.951871871948242, "global_step": 70766, "epoch": 852} {"train_loss": -20.654376983642578, "global_step": 70767, "epoch": 852} {"train_loss": -20.5523738861084, "global_step": 70768, "epoch": 852} {"train_loss": -20.83283042907715, "global_step": 70769, "epoch": 852} {"train_loss": -20.92084503173828, "global_step": 70770, "epoch": 852} {"train_loss": -21.35944175720215, "global_step": 70771, "epoch": 852} {"train_loss": -20.89000129699707, "global_step": 70772, "epoch": 852} {"train_loss": -20.942914962768555, "global_step": 70773, "epoch": 852} {"train_loss": -20.267602920532227, "global_step": 70774, "epoch": 852} {"train_loss": -20.65055274963379, "global_step": 70775, "epoch": 852} {"train_loss": -20.886974334716797, "global_step": 70776, "epoch": 852} {"train_loss": -20.574180603027344, "global_step": 70777, "epoch": 852} {"train_loss": -21.126922607421875, "global_step": 70778, "epoch": 852} {"train_loss": -21.221097946166992, "global_step": 70779, "epoch": 852} {"train_loss": -21.207077026367188, "global_step": 70780, "epoch": 852} {"train_loss": -20.567230224609375, "global_step": 70781, "epoch": 852} {"train_loss": -20.62042999267578, "global_step": 70782, "epoch": 852} {"train_loss": -20.81574058532715, "global_step": 70783, "epoch": 852} {"train_loss": -20.984220504760742, "global_step": 70784, "epoch": 852} {"train_loss": -20.62375831604004, "global_step": 70785, "epoch": 852} {"train_loss": -21.041433334350586, "global_step": 70786, "epoch": 852} {"train_loss": -21.22088623046875, "global_step": 70787, "epoch": 852} {"train_loss": -20.918071746826172, "global_step": 70788, "epoch": 852} {"train_loss": -20.980188369750977, "global_step": 70789, "epoch": 852} {"train_loss": -20.897302627563477, "global_step": 70790, "epoch": 852} {"train_loss": -20.893299102783203, "global_step": 70791, "epoch": 852} {"train_loss": -20.862478256225586, "global_step": 70792, "epoch": 852} {"train_loss": -20.75316619873047, "global_step": 70793, "epoch": 852} {"train_loss": -20.850236892700195, "global_step": 70794, "epoch": 852} {"train_loss": -21.2271671295166, "global_step": 70795, "epoch": 852} {"train_loss": -21.074308395385742, "global_step": 70796, "epoch": 852} {"train_loss": -21.08609962463379, "global_step": 70797, "epoch": 852} {"train_loss": -20.73630755780691, "global_step": 70798, "epoch": 852, "val_loss": 6113444.0} {"train_loss": -20.65103530883789, "global_step": 70799, "epoch": 853} {"train_loss": -20.440889358520508, "global_step": 70800, "epoch": 853} {"train_loss": -20.279382705688477, "global_step": 70801, "epoch": 853} {"train_loss": -20.93918228149414, "global_step": 70802, "epoch": 853} {"train_loss": -20.51509666442871, "global_step": 70803, "epoch": 853} {"train_loss": -20.573078155517578, "global_step": 70804, "epoch": 853} {"train_loss": -20.639280319213867, "global_step": 70805, "epoch": 853} {"train_loss": -20.618385314941406, "global_step": 70806, "epoch": 853} {"train_loss": -21.038406372070312, "global_step": 70807, "epoch": 853} {"train_loss": -20.62415313720703, "global_step": 70808, "epoch": 853} {"train_loss": -20.358413696289062, "global_step": 70809, "epoch": 853} {"train_loss": -20.324920654296875, "global_step": 70810, "epoch": 853} {"train_loss": -20.744585037231445, "global_step": 70811, "epoch": 853} {"train_loss": -20.6070499420166, "global_step": 70812, "epoch": 853} {"train_loss": -20.897979736328125, "global_step": 70813, "epoch": 853} {"train_loss": -21.07546615600586, "global_step": 70814, "epoch": 853} {"train_loss": -21.157773971557617, "global_step": 70815, "epoch": 853} {"train_loss": -21.151090621948242, "global_step": 70816, "epoch": 853} {"train_loss": -20.774980545043945, "global_step": 70817, "epoch": 853} {"train_loss": -20.87815284729004, "global_step": 70818, "epoch": 853} {"train_loss": -20.73704719543457, "global_step": 70819, "epoch": 853} {"train_loss": -20.9036922454834, "global_step": 70820, "epoch": 853} {"train_loss": -20.890005111694336, "global_step": 70821, "epoch": 853} {"train_loss": -20.62154197692871, "global_step": 70822, "epoch": 853} {"train_loss": -20.925683975219727, "global_step": 70823, "epoch": 853} {"train_loss": -20.883302688598633, "global_step": 70824, "epoch": 853} {"train_loss": -20.868186950683594, "global_step": 70825, "epoch": 853} {"train_loss": -21.12773323059082, "global_step": 70826, "epoch": 853} {"train_loss": -20.80195426940918, "global_step": 70827, "epoch": 853} {"train_loss": -20.8688907623291, "global_step": 70828, "epoch": 853} {"train_loss": -20.75665855407715, "global_step": 70829, "epoch": 853} {"train_loss": -20.350366592407227, "global_step": 70830, "epoch": 853} {"train_loss": -20.75800132751465, "global_step": 70831, "epoch": 853} {"train_loss": -20.852584838867188, "global_step": 70832, "epoch": 853} {"train_loss": -20.967966079711914, "global_step": 70833, "epoch": 853} {"train_loss": -20.844038009643555, "global_step": 70834, "epoch": 853} {"train_loss": -21.047544479370117, "global_step": 70835, "epoch": 853} {"train_loss": -20.778644561767578, "global_step": 70836, "epoch": 853} {"train_loss": -20.854612350463867, "global_step": 70837, "epoch": 853} {"train_loss": -20.838359832763672, "global_step": 70838, "epoch": 853} {"train_loss": -20.811691284179688, "global_step": 70839, "epoch": 853} {"train_loss": -20.633697509765625, "global_step": 70840, "epoch": 853} {"train_loss": -20.93660545349121, "global_step": 70841, "epoch": 853} {"train_loss": -20.61805534362793, "global_step": 70842, "epoch": 853} {"train_loss": -20.684053421020508, "global_step": 70843, "epoch": 853} {"train_loss": -20.5439395904541, "global_step": 70844, "epoch": 853} {"train_loss": -20.868194580078125, "global_step": 70845, "epoch": 853} {"train_loss": -20.65619659423828, "global_step": 70846, "epoch": 853} {"train_loss": -20.500850677490234, "global_step": 70847, "epoch": 853} {"train_loss": -21.090621948242188, "global_step": 70848, "epoch": 853} {"train_loss": -20.832365036010742, "global_step": 70849, "epoch": 853} {"train_loss": -20.73952293395996, "global_step": 70850, "epoch": 853} {"train_loss": -20.907995223999023, "global_step": 70851, "epoch": 853} {"train_loss": -20.99416160583496, "global_step": 70852, "epoch": 853} {"train_loss": -20.9190673828125, "global_step": 70853, "epoch": 853} {"train_loss": -21.24429702758789, "global_step": 70854, "epoch": 853} {"train_loss": -20.542011260986328, "global_step": 70855, "epoch": 853} {"train_loss": -21.09762954711914, "global_step": 70856, "epoch": 853} {"train_loss": -21.034841537475586, "global_step": 70857, "epoch": 853} {"train_loss": -20.814599990844727, "global_step": 70858, "epoch": 853} {"train_loss": -20.952184677124023, "global_step": 70859, "epoch": 853} {"train_loss": -20.613306045532227, "global_step": 70860, "epoch": 853} {"train_loss": -20.579017639160156, "global_step": 70861, "epoch": 853} {"train_loss": -20.997350692749023, "global_step": 70862, "epoch": 853} {"train_loss": -20.92909049987793, "global_step": 70863, "epoch": 853} {"train_loss": -20.839946746826172, "global_step": 70864, "epoch": 853} {"train_loss": -20.925893783569336, "global_step": 70865, "epoch": 853} {"train_loss": -20.673105239868164, "global_step": 70866, "epoch": 853} {"train_loss": -20.88223648071289, "global_step": 70867, "epoch": 853} {"train_loss": -20.6458683013916, "global_step": 70868, "epoch": 853} {"train_loss": -20.75599479675293, "global_step": 70869, "epoch": 853} {"train_loss": -20.8572998046875, "global_step": 70870, "epoch": 853} {"train_loss": -21.442964553833008, "global_step": 70871, "epoch": 853} {"train_loss": -20.533334732055664, "global_step": 70872, "epoch": 853} {"train_loss": -21.083328247070312, "global_step": 70873, "epoch": 853} {"train_loss": -21.22859001159668, "global_step": 70874, "epoch": 853} {"train_loss": -20.443513870239258, "global_step": 70875, "epoch": 853} {"train_loss": -20.978084564208984, "global_step": 70876, "epoch": 853} {"train_loss": -21.101104736328125, "global_step": 70877, "epoch": 853} {"train_loss": -20.92036247253418, "global_step": 70878, "epoch": 853} {"train_loss": -20.823083877563477, "global_step": 70879, "epoch": 853} {"train_loss": -21.16358757019043, "global_step": 70880, "epoch": 853} {"train_loss": -20.83097600362387, "global_step": 70881, "epoch": 853, "val_loss": 6073300.0} {"train_loss": -20.13987159729004, "global_step": 70882, "epoch": 854} {"train_loss": -20.681241989135742, "global_step": 70883, "epoch": 854} {"train_loss": -19.89959144592285, "global_step": 70884, "epoch": 854} {"train_loss": -20.523420333862305, "global_step": 70885, "epoch": 854} {"train_loss": -20.615970611572266, "global_step": 70886, "epoch": 854} {"train_loss": -20.836156845092773, "global_step": 70887, "epoch": 854} {"train_loss": -20.555744171142578, "global_step": 70888, "epoch": 854} {"train_loss": -20.603689193725586, "global_step": 70889, "epoch": 854} {"train_loss": -20.413162231445312, "global_step": 70890, "epoch": 854} {"train_loss": -20.555923461914062, "global_step": 70891, "epoch": 854} {"train_loss": -20.649005889892578, "global_step": 70892, "epoch": 854} {"train_loss": -20.87200164794922, "global_step": 70893, "epoch": 854} {"train_loss": -20.6655330657959, "global_step": 70894, "epoch": 854} {"train_loss": -20.462385177612305, "global_step": 70895, "epoch": 854} {"train_loss": -20.533254623413086, "global_step": 70896, "epoch": 854} {"train_loss": -20.663597106933594, "global_step": 70897, "epoch": 854} {"train_loss": -20.65630531311035, "global_step": 70898, "epoch": 854} {"train_loss": -20.892187118530273, "global_step": 70899, "epoch": 854} {"train_loss": -21.12335777282715, "global_step": 70900, "epoch": 854} {"train_loss": -20.82201385498047, "global_step": 70901, "epoch": 854} {"train_loss": -20.627714157104492, "global_step": 70902, "epoch": 854} {"train_loss": -20.788419723510742, "global_step": 70903, "epoch": 854} {"train_loss": -20.753482818603516, "global_step": 70904, "epoch": 854} {"train_loss": -20.760347366333008, "global_step": 70905, "epoch": 854} {"train_loss": -20.712289810180664, "global_step": 70906, "epoch": 854} {"train_loss": -20.50152015686035, "global_step": 70907, "epoch": 854} {"train_loss": -21.0250301361084, "global_step": 70908, "epoch": 854} {"train_loss": -21.047794342041016, "global_step": 70909, "epoch": 854} {"train_loss": -21.014753341674805, "global_step": 70910, "epoch": 854} {"train_loss": -20.596616744995117, "global_step": 70911, "epoch": 854} {"train_loss": -21.033918380737305, "global_step": 70912, "epoch": 854} {"train_loss": -21.040292739868164, "global_step": 70913, "epoch": 854} {"train_loss": -21.121435165405273, "global_step": 70914, "epoch": 854} {"train_loss": -20.646169662475586, "global_step": 70915, "epoch": 854} {"train_loss": -20.69370460510254, "global_step": 70916, "epoch": 854} {"train_loss": -20.78244972229004, "global_step": 70917, "epoch": 854} {"train_loss": -21.092260360717773, "global_step": 70918, "epoch": 854} {"train_loss": -20.81720542907715, "global_step": 70919, "epoch": 854} {"train_loss": -20.94451332092285, "global_step": 70920, "epoch": 854} {"train_loss": -20.49233055114746, "global_step": 70921, "epoch": 854} {"train_loss": -20.978092193603516, "global_step": 70922, "epoch": 854} {"train_loss": -20.70941162109375, "global_step": 70923, "epoch": 854} {"train_loss": -21.01920509338379, "global_step": 70924, "epoch": 854} {"train_loss": -20.744428634643555, "global_step": 70925, "epoch": 854} {"train_loss": -20.272424697875977, "global_step": 70926, "epoch": 854} {"train_loss": -20.655683517456055, "global_step": 70927, "epoch": 854} {"train_loss": -20.760730743408203, "global_step": 70928, "epoch": 854} {"train_loss": -20.827499389648438, "global_step": 70929, "epoch": 854} {"train_loss": -21.130599975585938, "global_step": 70930, "epoch": 854} {"train_loss": -21.140310287475586, "global_step": 70931, "epoch": 854} {"train_loss": -20.87698745727539, "global_step": 70932, "epoch": 854} {"train_loss": -20.75672721862793, "global_step": 70933, "epoch": 854} {"train_loss": -20.87458610534668, "global_step": 70934, "epoch": 854} {"train_loss": -20.66686248779297, "global_step": 70935, "epoch": 854} {"train_loss": -20.671918869018555, "global_step": 70936, "epoch": 854} {"train_loss": -20.894132614135742, "global_step": 70937, "epoch": 854} {"train_loss": -20.58156967163086, "global_step": 70938, "epoch": 854} {"train_loss": -20.88658332824707, "global_step": 70939, "epoch": 854} {"train_loss": -21.17356300354004, "global_step": 70940, "epoch": 854} {"train_loss": -20.8656063079834, "global_step": 70941, "epoch": 854} {"train_loss": -21.062999725341797, "global_step": 70942, "epoch": 854} {"train_loss": -20.753381729125977, "global_step": 70943, "epoch": 854} {"train_loss": -21.193357467651367, "global_step": 70944, "epoch": 854} {"train_loss": -20.907255172729492, "global_step": 70945, "epoch": 854} {"train_loss": -20.589319229125977, "global_step": 70946, "epoch": 854} {"train_loss": -20.89484977722168, "global_step": 70947, "epoch": 854} {"train_loss": -20.898265838623047, "global_step": 70948, "epoch": 854} {"train_loss": -20.772626876831055, "global_step": 70949, "epoch": 854} {"train_loss": -20.933082580566406, "global_step": 70950, "epoch": 854} {"train_loss": -20.49268913269043, "global_step": 70951, "epoch": 854} {"train_loss": -20.70081901550293, "global_step": 70952, "epoch": 854} {"train_loss": -21.11653709411621, "global_step": 70953, "epoch": 854} {"train_loss": -20.25715446472168, "global_step": 70954, "epoch": 854} {"train_loss": -20.67316246032715, "global_step": 70955, "epoch": 854} {"train_loss": -20.819658279418945, "global_step": 70956, "epoch": 854} {"train_loss": -20.538496017456055, "global_step": 70957, "epoch": 854} {"train_loss": -21.085073471069336, "global_step": 70958, "epoch": 854} {"train_loss": -21.19537353515625, "global_step": 70959, "epoch": 854} {"train_loss": -20.692615509033203, "global_step": 70960, "epoch": 854} {"train_loss": -20.74714469909668, "global_step": 70961, "epoch": 854} {"train_loss": -20.815853118896484, "global_step": 70962, "epoch": 854} {"train_loss": -21.100187301635742, "global_step": 70963, "epoch": 854} {"train_loss": -20.78209272637425, "global_step": 70964, "epoch": 854, "val_loss": 5991836.0} {"train_loss": -20.186620712280273, "global_step": 70965, "epoch": 855} {"train_loss": -20.310726165771484, "global_step": 70966, "epoch": 855} {"train_loss": -20.54548454284668, "global_step": 70967, "epoch": 855} {"train_loss": -20.06690788269043, "global_step": 70968, "epoch": 855} {"train_loss": -20.29432487487793, "global_step": 70969, "epoch": 855} {"train_loss": -20.497251510620117, "global_step": 70970, "epoch": 855} {"train_loss": -20.233888626098633, "global_step": 70971, "epoch": 855} {"train_loss": -20.800626754760742, "global_step": 70972, "epoch": 855} {"train_loss": -20.5870304107666, "global_step": 70973, "epoch": 855} {"train_loss": -20.61672019958496, "global_step": 70974, "epoch": 855} {"train_loss": -20.585723876953125, "global_step": 70975, "epoch": 855} {"train_loss": -21.08405876159668, "global_step": 70976, "epoch": 855} {"train_loss": -20.62164878845215, "global_step": 70977, "epoch": 855} {"train_loss": -20.425369262695312, "global_step": 70978, "epoch": 855} {"train_loss": -20.639240264892578, "global_step": 70979, "epoch": 855} {"train_loss": -20.56987953186035, "global_step": 70980, "epoch": 855} {"train_loss": -20.60877799987793, "global_step": 70981, "epoch": 855} {"train_loss": -20.858041763305664, "global_step": 70982, "epoch": 855} {"train_loss": -20.685171127319336, "global_step": 70983, "epoch": 855} {"train_loss": -20.433080673217773, "global_step": 70984, "epoch": 855} {"train_loss": -20.8941707611084, "global_step": 70985, "epoch": 855} {"train_loss": -20.82330322265625, "global_step": 70986, "epoch": 855} {"train_loss": -20.91790771484375, "global_step": 70987, "epoch": 855} {"train_loss": -21.015764236450195, "global_step": 70988, "epoch": 855} {"train_loss": -20.74208641052246, "global_step": 70989, "epoch": 855} {"train_loss": -20.4708194732666, "global_step": 70990, "epoch": 855} {"train_loss": -20.782949447631836, "global_step": 70991, "epoch": 855} {"train_loss": -21.035690307617188, "global_step": 70992, "epoch": 855} {"train_loss": -20.641386032104492, "global_step": 70993, "epoch": 855} {"train_loss": -20.311279296875, "global_step": 70994, "epoch": 855} {"train_loss": -20.605161666870117, "global_step": 70995, "epoch": 855} {"train_loss": -20.713478088378906, "global_step": 70996, "epoch": 855} {"train_loss": -20.744136810302734, "global_step": 70997, "epoch": 855} {"train_loss": -20.736251831054688, "global_step": 70998, "epoch": 855} {"train_loss": -21.121137619018555, "global_step": 70999, "epoch": 855} {"train_loss": -20.995010375976562, "global_step": 71000, "epoch": 855} {"train_loss": -20.865907669067383, "global_step": 71001, "epoch": 855} {"train_loss": -20.709226608276367, "global_step": 71002, "epoch": 855} {"train_loss": -20.94916343688965, "global_step": 71003, "epoch": 855} {"train_loss": -20.86451530456543, "global_step": 71004, "epoch": 855} {"train_loss": -20.31665802001953, "global_step": 71005, "epoch": 855} {"train_loss": -20.86117172241211, "global_step": 71006, "epoch": 855} {"train_loss": -20.818449020385742, "global_step": 71007, "epoch": 855} {"train_loss": -20.782873153686523, "global_step": 71008, "epoch": 855} {"train_loss": -20.760284423828125, "global_step": 71009, "epoch": 855} {"train_loss": -20.983448028564453, "global_step": 71010, "epoch": 855} {"train_loss": -20.830427169799805, "global_step": 71011, "epoch": 855} {"train_loss": -20.80725860595703, "global_step": 71012, "epoch": 855} {"train_loss": -20.93650245666504, "global_step": 71013, "epoch": 855} {"train_loss": -20.742238998413086, "global_step": 71014, "epoch": 855} {"train_loss": -20.561996459960938, "global_step": 71015, "epoch": 855} {"train_loss": -20.806222915649414, "global_step": 71016, "epoch": 855} {"train_loss": -21.106252670288086, "global_step": 71017, "epoch": 855} {"train_loss": -21.166088104248047, "global_step": 71018, "epoch": 855} {"train_loss": -20.80082130432129, "global_step": 71019, "epoch": 855} {"train_loss": -20.8021183013916, "global_step": 71020, "epoch": 855} {"train_loss": -21.18796730041504, "global_step": 71021, "epoch": 855} {"train_loss": -20.643041610717773, "global_step": 71022, "epoch": 855} {"train_loss": -20.64051055908203, "global_step": 71023, "epoch": 855} {"train_loss": -21.167373657226562, "global_step": 71024, "epoch": 855} {"train_loss": -20.830381393432617, "global_step": 71025, "epoch": 855} {"train_loss": -21.057157516479492, "global_step": 71026, "epoch": 855} {"train_loss": -21.027198791503906, "global_step": 71027, "epoch": 855} {"train_loss": -21.28471565246582, "global_step": 71028, "epoch": 855} {"train_loss": -20.656444549560547, "global_step": 71029, "epoch": 855} {"train_loss": -20.859195709228516, "global_step": 71030, "epoch": 855} {"train_loss": -20.798532485961914, "global_step": 71031, "epoch": 855} {"train_loss": -21.274499893188477, "global_step": 71032, "epoch": 855} {"train_loss": -20.88528823852539, "global_step": 71033, "epoch": 855} {"train_loss": -20.709692001342773, "global_step": 71034, "epoch": 855} {"train_loss": -21.030536651611328, "global_step": 71035, "epoch": 855} {"train_loss": -20.571517944335938, "global_step": 71036, "epoch": 855} {"train_loss": -20.886310577392578, "global_step": 71037, "epoch": 855} {"train_loss": -21.09226417541504, "global_step": 71038, "epoch": 855} {"train_loss": -20.812044143676758, "global_step": 71039, "epoch": 855} {"train_loss": -20.76826286315918, "global_step": 71040, "epoch": 855} {"train_loss": -21.142446517944336, "global_step": 71041, "epoch": 855} {"train_loss": -20.88095474243164, "global_step": 71042, "epoch": 855} {"train_loss": -20.8106689453125, "global_step": 71043, "epoch": 855} {"train_loss": -20.7657527923584, "global_step": 71044, "epoch": 855} {"train_loss": -20.8731746673584, "global_step": 71045, "epoch": 855} {"train_loss": -20.81203269958496, "global_step": 71046, "epoch": 855} {"train_loss": -20.78882879234222, "global_step": 71047, "epoch": 855, "val_loss": 5977633.0} {"train_loss": -20.5308895111084, "global_step": 71048, "epoch": 856} {"train_loss": -20.472532272338867, "global_step": 71049, "epoch": 856} {"train_loss": -20.400625228881836, "global_step": 71050, "epoch": 856} {"train_loss": -20.615629196166992, "global_step": 71051, "epoch": 856} {"train_loss": -20.512128829956055, "global_step": 71052, "epoch": 856} {"train_loss": -20.33860206604004, "global_step": 71053, "epoch": 856} {"train_loss": -20.510557174682617, "global_step": 71054, "epoch": 856} {"train_loss": -20.608057022094727, "global_step": 71055, "epoch": 856} {"train_loss": -20.753698348999023, "global_step": 71056, "epoch": 856} {"train_loss": -20.221391677856445, "global_step": 71057, "epoch": 856} {"train_loss": -20.82131004333496, "global_step": 71058, "epoch": 856} {"train_loss": -20.640901565551758, "global_step": 71059, "epoch": 856} {"train_loss": -20.434995651245117, "global_step": 71060, "epoch": 856} {"train_loss": -21.004240036010742, "global_step": 71061, "epoch": 856} {"train_loss": -20.792089462280273, "global_step": 71062, "epoch": 856} {"train_loss": -20.775793075561523, "global_step": 71063, "epoch": 856} {"train_loss": -20.888671875, "global_step": 71064, "epoch": 856} {"train_loss": -20.766551971435547, "global_step": 71065, "epoch": 856} {"train_loss": -20.62887954711914, "global_step": 71066, "epoch": 856} {"train_loss": -20.94742774963379, "global_step": 71067, "epoch": 856} {"train_loss": -21.140865325927734, "global_step": 71068, "epoch": 856} {"train_loss": -20.88791847229004, "global_step": 71069, "epoch": 856} {"train_loss": -20.5205020904541, "global_step": 71070, "epoch": 856} {"train_loss": -21.013246536254883, "global_step": 71071, "epoch": 856} {"train_loss": -20.943002700805664, "global_step": 71072, "epoch": 856} {"train_loss": -21.20771598815918, "global_step": 71073, "epoch": 856} {"train_loss": -21.198734283447266, "global_step": 71074, "epoch": 856} {"train_loss": -20.606712341308594, "global_step": 71075, "epoch": 856} {"train_loss": -20.71036720275879, "global_step": 71076, "epoch": 856} {"train_loss": -20.691144943237305, "global_step": 71077, "epoch": 856} {"train_loss": -21.019506454467773, "global_step": 71078, "epoch": 856} {"train_loss": -20.8909854888916, "global_step": 71079, "epoch": 856} {"train_loss": -20.991779327392578, "global_step": 71080, "epoch": 856} {"train_loss": -20.63370132446289, "global_step": 71081, "epoch": 856} {"train_loss": -20.63943862915039, "global_step": 71082, "epoch": 856} {"train_loss": -20.999889373779297, "global_step": 71083, "epoch": 856} {"train_loss": -20.743335723876953, "global_step": 71084, "epoch": 856} {"train_loss": -20.946680068969727, "global_step": 71085, "epoch": 856} {"train_loss": -21.0184383392334, "global_step": 71086, "epoch": 856} {"train_loss": -20.909637451171875, "global_step": 71087, "epoch": 856} {"train_loss": -20.794370651245117, "global_step": 71088, "epoch": 856} {"train_loss": -21.180185317993164, "global_step": 71089, "epoch": 856} {"train_loss": -20.937583923339844, "global_step": 71090, "epoch": 856} {"train_loss": -20.84242057800293, "global_step": 71091, "epoch": 856} {"train_loss": -20.52869987487793, "global_step": 71092, "epoch": 856} {"train_loss": -20.764694213867188, "global_step": 71093, "epoch": 856} {"train_loss": -21.28912353515625, "global_step": 71094, "epoch": 856} {"train_loss": -20.938432693481445, "global_step": 71095, "epoch": 856} {"train_loss": -20.810890197753906, "global_step": 71096, "epoch": 856} {"train_loss": -20.89057731628418, "global_step": 71097, "epoch": 856} {"train_loss": -20.75926971435547, "global_step": 71098, "epoch": 856} {"train_loss": -20.928466796875, "global_step": 71099, "epoch": 856} {"train_loss": -20.759540557861328, "global_step": 71100, "epoch": 856} {"train_loss": -20.96947479248047, "global_step": 71101, "epoch": 856} {"train_loss": -20.783376693725586, "global_step": 71102, "epoch": 856} {"train_loss": -21.033445358276367, "global_step": 71103, "epoch": 856} {"train_loss": -20.81878662109375, "global_step": 71104, "epoch": 856} {"train_loss": -20.765161514282227, "global_step": 71105, "epoch": 856} {"train_loss": -20.96137809753418, "global_step": 71106, "epoch": 856} {"train_loss": -20.848255157470703, "global_step": 71107, "epoch": 856} {"train_loss": -20.697431564331055, "global_step": 71108, "epoch": 856} {"train_loss": -21.162216186523438, "global_step": 71109, "epoch": 856} {"train_loss": -20.590482711791992, "global_step": 71110, "epoch": 856} {"train_loss": -20.725406646728516, "global_step": 71111, "epoch": 856} {"train_loss": -20.738208770751953, "global_step": 71112, "epoch": 856} {"train_loss": -21.079914093017578, "global_step": 71113, "epoch": 856} {"train_loss": -21.16535758972168, "global_step": 71114, "epoch": 856} {"train_loss": -20.76991081237793, "global_step": 71115, "epoch": 856} {"train_loss": -20.59700584411621, "global_step": 71116, "epoch": 856} {"train_loss": -20.99639320373535, "global_step": 71117, "epoch": 856} {"train_loss": -20.95172691345215, "global_step": 71118, "epoch": 856} {"train_loss": -20.714738845825195, "global_step": 71119, "epoch": 856} {"train_loss": -21.00998306274414, "global_step": 71120, "epoch": 856} {"train_loss": -20.701955795288086, "global_step": 71121, "epoch": 856} {"train_loss": -20.646255493164062, "global_step": 71122, "epoch": 856} {"train_loss": -21.151193618774414, "global_step": 71123, "epoch": 856} {"train_loss": -20.93771743774414, "global_step": 71124, "epoch": 856} {"train_loss": -20.589344024658203, "global_step": 71125, "epoch": 856} {"train_loss": -20.9233455657959, "global_step": 71126, "epoch": 856} {"train_loss": -20.97983169555664, "global_step": 71127, "epoch": 856} {"train_loss": -20.759836196899414, "global_step": 71128, "epoch": 856} {"train_loss": -20.95359230041504, "global_step": 71129, "epoch": 856} {"train_loss": -20.804364353777416, "global_step": 71130, "epoch": 856, "val_loss": 6018261.0} {"train_loss": -20.582656860351562, "global_step": 71131, "epoch": 857} {"train_loss": -20.75237464904785, "global_step": 71132, "epoch": 857} {"train_loss": -20.495729446411133, "global_step": 71133, "epoch": 857} {"train_loss": -20.83363151550293, "global_step": 71134, "epoch": 857} {"train_loss": -20.627561569213867, "global_step": 71135, "epoch": 857} {"train_loss": -20.649375915527344, "global_step": 71136, "epoch": 857} {"train_loss": -20.804014205932617, "global_step": 71137, "epoch": 857} {"train_loss": -20.756309509277344, "global_step": 71138, "epoch": 857} {"train_loss": -20.939687728881836, "global_step": 71139, "epoch": 857} {"train_loss": -20.766555786132812, "global_step": 71140, "epoch": 857} {"train_loss": -21.095481872558594, "global_step": 71141, "epoch": 857} {"train_loss": -20.60841178894043, "global_step": 71142, "epoch": 857} {"train_loss": -21.041730880737305, "global_step": 71143, "epoch": 857} {"train_loss": -21.007251739501953, "global_step": 71144, "epoch": 857} {"train_loss": -20.93189811706543, "global_step": 71145, "epoch": 857} {"train_loss": -21.074031829833984, "global_step": 71146, "epoch": 857} {"train_loss": -20.62192726135254, "global_step": 71147, "epoch": 857} {"train_loss": -20.763362884521484, "global_step": 71148, "epoch": 857} {"train_loss": -21.145662307739258, "global_step": 71149, "epoch": 857} {"train_loss": -20.70564079284668, "global_step": 71150, "epoch": 857} {"train_loss": -20.85978889465332, "global_step": 71151, "epoch": 857} {"train_loss": -20.84016990661621, "global_step": 71152, "epoch": 857} {"train_loss": -21.09495735168457, "global_step": 71153, "epoch": 857} {"train_loss": -21.006690979003906, "global_step": 71154, "epoch": 857} {"train_loss": -20.99796485900879, "global_step": 71155, "epoch": 857} {"train_loss": -20.60587501525879, "global_step": 71156, "epoch": 857} {"train_loss": -20.806669235229492, "global_step": 71157, "epoch": 857} {"train_loss": -20.812196731567383, "global_step": 71158, "epoch": 857} {"train_loss": -20.85787010192871, "global_step": 71159, "epoch": 857} {"train_loss": -21.061628341674805, "global_step": 71160, "epoch": 857} {"train_loss": -20.9270076751709, "global_step": 71161, "epoch": 857} {"train_loss": -20.833322525024414, "global_step": 71162, "epoch": 857} {"train_loss": -20.89297103881836, "global_step": 71163, "epoch": 857} {"train_loss": -21.167985916137695, "global_step": 71164, "epoch": 857} {"train_loss": -21.02229118347168, "global_step": 71165, "epoch": 857} {"train_loss": -20.742101669311523, "global_step": 71166, "epoch": 857} {"train_loss": -21.0458984375, "global_step": 71167, "epoch": 857} {"train_loss": -20.96726417541504, "global_step": 71168, "epoch": 857} {"train_loss": -21.163728713989258, "global_step": 71169, "epoch": 857} {"train_loss": -20.895856857299805, "global_step": 71170, "epoch": 857} {"train_loss": -20.6839599609375, "global_step": 71171, "epoch": 857} {"train_loss": -20.997299194335938, "global_step": 71172, "epoch": 857} {"train_loss": -20.585214614868164, "global_step": 71173, "epoch": 857} {"train_loss": -20.624380111694336, "global_step": 71174, "epoch": 857} {"train_loss": -21.2439022064209, "global_step": 71175, "epoch": 857} {"train_loss": -20.88395118713379, "global_step": 71176, "epoch": 857} {"train_loss": -20.426883697509766, "global_step": 71177, "epoch": 857} {"train_loss": -20.947998046875, "global_step": 71178, "epoch": 857} {"train_loss": -20.47450828552246, "global_step": 71179, "epoch": 857} {"train_loss": -20.863311767578125, "global_step": 71180, "epoch": 857} {"train_loss": -20.98655128479004, "global_step": 71181, "epoch": 857} {"train_loss": -21.100854873657227, "global_step": 71182, "epoch": 857} {"train_loss": -20.651782989501953, "global_step": 71183, "epoch": 857} {"train_loss": -20.672544479370117, "global_step": 71184, "epoch": 857} {"train_loss": -21.153461456298828, "global_step": 71185, "epoch": 857} {"train_loss": -20.66621208190918, "global_step": 71186, "epoch": 857} {"train_loss": -20.85519027709961, "global_step": 71187, "epoch": 857} {"train_loss": -21.03959083557129, "global_step": 71188, "epoch": 857} {"train_loss": -20.96039390563965, "global_step": 71189, "epoch": 857} {"train_loss": -20.927587509155273, "global_step": 71190, "epoch": 857} {"train_loss": -21.267492294311523, "global_step": 71191, "epoch": 857} {"train_loss": -21.00069808959961, "global_step": 71192, "epoch": 857} {"train_loss": -20.82318115234375, "global_step": 71193, "epoch": 857} {"train_loss": -21.085111618041992, "global_step": 71194, "epoch": 857} {"train_loss": -21.1322021484375, "global_step": 71195, "epoch": 857} {"train_loss": -21.020771026611328, "global_step": 71196, "epoch": 857} {"train_loss": -20.78299331665039, "global_step": 71197, "epoch": 857} {"train_loss": -20.74090576171875, "global_step": 71198, "epoch": 857} {"train_loss": -21.014570236206055, "global_step": 71199, "epoch": 857} {"train_loss": -21.097095489501953, "global_step": 71200, "epoch": 857} {"train_loss": -20.898283004760742, "global_step": 71201, "epoch": 857} {"train_loss": -20.760543823242188, "global_step": 71202, "epoch": 857} {"train_loss": -20.960750579833984, "global_step": 71203, "epoch": 857} {"train_loss": -20.943836212158203, "global_step": 71204, "epoch": 857} {"train_loss": -20.943912506103516, "global_step": 71205, "epoch": 857} {"train_loss": -20.944013595581055, "global_step": 71206, "epoch": 857} {"train_loss": -20.744232177734375, "global_step": 71207, "epoch": 857} {"train_loss": -20.912925720214844, "global_step": 71208, "epoch": 857} {"train_loss": -20.60001564025879, "global_step": 71209, "epoch": 857} {"train_loss": -20.592849731445312, "global_step": 71210, "epoch": 857} {"train_loss": -20.622434616088867, "global_step": 71211, "epoch": 857} {"train_loss": -20.696584701538086, "global_step": 71212, "epoch": 857} {"train_loss": -20.85130385892937, "global_step": 71213, "epoch": 857, "val_loss": 6024168.5} {"train_loss": -20.36252212524414, "global_step": 71214, "epoch": 858} {"train_loss": -20.87682342529297, "global_step": 71215, "epoch": 858} {"train_loss": -20.808055877685547, "global_step": 71216, "epoch": 858} {"train_loss": -20.673879623413086, "global_step": 71217, "epoch": 858} {"train_loss": -20.933027267456055, "global_step": 71218, "epoch": 858} {"train_loss": -20.830825805664062, "global_step": 71219, "epoch": 858} {"train_loss": -20.37607765197754, "global_step": 71220, "epoch": 858} {"train_loss": -20.836395263671875, "global_step": 71221, "epoch": 858} {"train_loss": -20.511266708374023, "global_step": 71222, "epoch": 858} {"train_loss": -20.970834732055664, "global_step": 71223, "epoch": 858} {"train_loss": -21.155363082885742, "global_step": 71224, "epoch": 858} {"train_loss": -20.746044158935547, "global_step": 71225, "epoch": 858} {"train_loss": -20.795696258544922, "global_step": 71226, "epoch": 858} {"train_loss": -20.65146255493164, "global_step": 71227, "epoch": 858} {"train_loss": -21.372772216796875, "global_step": 71228, "epoch": 858} {"train_loss": -20.793420791625977, "global_step": 71229, "epoch": 858} {"train_loss": -20.87172508239746, "global_step": 71230, "epoch": 858} {"train_loss": -20.866636276245117, "global_step": 71231, "epoch": 858} {"train_loss": -20.9349365234375, "global_step": 71232, "epoch": 858} {"train_loss": -20.816116333007812, "global_step": 71233, "epoch": 858} {"train_loss": -20.69607925415039, "global_step": 71234, "epoch": 858} {"train_loss": -20.741052627563477, "global_step": 71235, "epoch": 858} {"train_loss": -21.087661743164062, "global_step": 71236, "epoch": 858} {"train_loss": -20.777610778808594, "global_step": 71237, "epoch": 858} {"train_loss": -20.950464248657227, "global_step": 71238, "epoch": 858} {"train_loss": -20.693408966064453, "global_step": 71239, "epoch": 858} {"train_loss": -20.865365982055664, "global_step": 71240, "epoch": 858} {"train_loss": -20.895915985107422, "global_step": 71241, "epoch": 858} {"train_loss": -20.884973526000977, "global_step": 71242, "epoch": 858} {"train_loss": -20.908248901367188, "global_step": 71243, "epoch": 858} {"train_loss": -21.051259994506836, "global_step": 71244, "epoch": 858} {"train_loss": -21.052404403686523, "global_step": 71245, "epoch": 858} {"train_loss": -20.792743682861328, "global_step": 71246, "epoch": 858} {"train_loss": -20.990942001342773, "global_step": 71247, "epoch": 858} {"train_loss": -20.766088485717773, "global_step": 71248, "epoch": 858} {"train_loss": -21.17304801940918, "global_step": 71249, "epoch": 858} {"train_loss": -20.938283920288086, "global_step": 71250, "epoch": 858} {"train_loss": -20.919218063354492, "global_step": 71251, "epoch": 858} {"train_loss": -20.889995574951172, "global_step": 71252, "epoch": 858} {"train_loss": -20.790754318237305, "global_step": 71253, "epoch": 858} {"train_loss": -20.549213409423828, "global_step": 71254, "epoch": 858} {"train_loss": -20.866336822509766, "global_step": 71255, "epoch": 858} {"train_loss": -21.087125778198242, "global_step": 71256, "epoch": 858} {"train_loss": -20.79754066467285, "global_step": 71257, "epoch": 858} {"train_loss": -21.008886337280273, "global_step": 71258, "epoch": 858} {"train_loss": -20.919132232666016, "global_step": 71259, "epoch": 858} {"train_loss": -20.88969612121582, "global_step": 71260, "epoch": 858} {"train_loss": -21.03766441345215, "global_step": 71261, "epoch": 858} {"train_loss": -20.79067039489746, "global_step": 71262, "epoch": 858} {"train_loss": -21.196653366088867, "global_step": 71263, "epoch": 858} {"train_loss": -21.036453247070312, "global_step": 71264, "epoch": 858} {"train_loss": -20.506446838378906, "global_step": 71265, "epoch": 858} {"train_loss": -20.81483268737793, "global_step": 71266, "epoch": 858} {"train_loss": -21.27570915222168, "global_step": 71267, "epoch": 858} {"train_loss": -21.04593849182129, "global_step": 71268, "epoch": 858} {"train_loss": -21.078336715698242, "global_step": 71269, "epoch": 858} {"train_loss": -20.987632751464844, "global_step": 71270, "epoch": 858} {"train_loss": -20.464475631713867, "global_step": 71271, "epoch": 858} {"train_loss": -20.837230682373047, "global_step": 71272, "epoch": 858} {"train_loss": -20.71497917175293, "global_step": 71273, "epoch": 858} {"train_loss": -20.948667526245117, "global_step": 71274, "epoch": 858} {"train_loss": -20.743436813354492, "global_step": 71275, "epoch": 858} {"train_loss": -20.802885055541992, "global_step": 71276, "epoch": 858} {"train_loss": -20.78067970275879, "global_step": 71277, "epoch": 858} {"train_loss": -20.640188217163086, "global_step": 71278, "epoch": 858} {"train_loss": -20.943618774414062, "global_step": 71279, "epoch": 858} {"train_loss": -21.225942611694336, "global_step": 71280, "epoch": 858} {"train_loss": -21.00602912902832, "global_step": 71281, "epoch": 858} {"train_loss": -21.022302627563477, "global_step": 71282, "epoch": 858} {"train_loss": -20.53313636779785, "global_step": 71283, "epoch": 858} {"train_loss": -20.820480346679688, "global_step": 71284, "epoch": 858} {"train_loss": -20.93621826171875, "global_step": 71285, "epoch": 858} {"train_loss": -20.899677276611328, "global_step": 71286, "epoch": 858} {"train_loss": -21.06842803955078, "global_step": 71287, "epoch": 858} {"train_loss": -20.994043350219727, "global_step": 71288, "epoch": 858} {"train_loss": -20.85858726501465, "global_step": 71289, "epoch": 858} {"train_loss": -21.189411163330078, "global_step": 71290, "epoch": 858} {"train_loss": -20.918851852416992, "global_step": 71291, "epoch": 858} {"train_loss": -20.920682907104492, "global_step": 71292, "epoch": 858} {"train_loss": -20.99179458618164, "global_step": 71293, "epoch": 858} {"train_loss": -20.523542404174805, "global_step": 71294, "epoch": 858} {"train_loss": -20.715560913085938, "global_step": 71295, "epoch": 858} {"train_loss": -20.85378412453525, "global_step": 71296, "epoch": 858, "val_loss": 5962135.0} {"train_loss": -20.746328353881836, "global_step": 71297, "epoch": 859} {"train_loss": -20.548410415649414, "global_step": 71298, "epoch": 859} {"train_loss": -20.546438217163086, "global_step": 71299, "epoch": 859} {"train_loss": -20.389175415039062, "global_step": 71300, "epoch": 859} {"train_loss": -20.614782333374023, "global_step": 71301, "epoch": 859} {"train_loss": -20.864748001098633, "global_step": 71302, "epoch": 859} {"train_loss": -20.689014434814453, "global_step": 71303, "epoch": 859} {"train_loss": -20.980867385864258, "global_step": 71304, "epoch": 859} {"train_loss": -21.047372817993164, "global_step": 71305, "epoch": 859} {"train_loss": -20.701135635375977, "global_step": 71306, "epoch": 859} {"train_loss": -20.967899322509766, "global_step": 71307, "epoch": 859} {"train_loss": -20.922786712646484, "global_step": 71308, "epoch": 859} {"train_loss": -20.798486709594727, "global_step": 71309, "epoch": 859} {"train_loss": -20.63204574584961, "global_step": 71310, "epoch": 859} {"train_loss": -20.813419342041016, "global_step": 71311, "epoch": 859} {"train_loss": -20.351394653320312, "global_step": 71312, "epoch": 859} {"train_loss": -20.740341186523438, "global_step": 71313, "epoch": 859} {"train_loss": -20.7271785736084, "global_step": 71314, "epoch": 859} {"train_loss": -21.033233642578125, "global_step": 71315, "epoch": 859} {"train_loss": -21.256418228149414, "global_step": 71316, "epoch": 859} {"train_loss": -21.142343521118164, "global_step": 71317, "epoch": 859} {"train_loss": -21.020957946777344, "global_step": 71318, "epoch": 859} {"train_loss": -20.620229721069336, "global_step": 71319, "epoch": 859} {"train_loss": -21.05866813659668, "global_step": 71320, "epoch": 859} {"train_loss": -20.592714309692383, "global_step": 71321, "epoch": 859} {"train_loss": -20.296772003173828, "global_step": 71322, "epoch": 859} {"train_loss": -20.56886100769043, "global_step": 71323, "epoch": 859} {"train_loss": -21.063568115234375, "global_step": 71324, "epoch": 859} {"train_loss": -20.795597076416016, "global_step": 71325, "epoch": 859} {"train_loss": -20.686521530151367, "global_step": 71326, "epoch": 859} {"train_loss": -20.954513549804688, "global_step": 71327, "epoch": 859} {"train_loss": -20.777219772338867, "global_step": 71328, "epoch": 859} {"train_loss": -20.58588218688965, "global_step": 71329, "epoch": 859} {"train_loss": -20.914525985717773, "global_step": 71330, "epoch": 859} {"train_loss": -20.830209732055664, "global_step": 71331, "epoch": 859} {"train_loss": -21.057764053344727, "global_step": 71332, "epoch": 859} {"train_loss": -20.815134048461914, "global_step": 71333, "epoch": 859} {"train_loss": -21.350671768188477, "global_step": 71334, "epoch": 859} {"train_loss": -20.55388641357422, "global_step": 71335, "epoch": 859} {"train_loss": -20.93755531311035, "global_step": 71336, "epoch": 859} {"train_loss": -20.804141998291016, "global_step": 71337, "epoch": 859} {"train_loss": -20.89037322998047, "global_step": 71338, "epoch": 859} {"train_loss": -20.754369735717773, "global_step": 71339, "epoch": 859} {"train_loss": -21.34332847595215, "global_step": 71340, "epoch": 859} {"train_loss": -20.680604934692383, "global_step": 71341, "epoch": 859} {"train_loss": -20.61905860900879, "global_step": 71342, "epoch": 859} {"train_loss": -21.011503219604492, "global_step": 71343, "epoch": 859} {"train_loss": -21.145349502563477, "global_step": 71344, "epoch": 859} {"train_loss": -20.701597213745117, "global_step": 71345, "epoch": 859} {"train_loss": -21.08094596862793, "global_step": 71346, "epoch": 859} {"train_loss": -20.34963035583496, "global_step": 71347, "epoch": 859} {"train_loss": -20.883373260498047, "global_step": 71348, "epoch": 859} {"train_loss": -21.000547409057617, "global_step": 71349, "epoch": 859} {"train_loss": -20.859060287475586, "global_step": 71350, "epoch": 859} {"train_loss": -20.682697296142578, "global_step": 71351, "epoch": 859} {"train_loss": -20.778013229370117, "global_step": 71352, "epoch": 859} {"train_loss": -21.060802459716797, "global_step": 71353, "epoch": 859} {"train_loss": -21.12451171875, "global_step": 71354, "epoch": 859} {"train_loss": -21.0049991607666, "global_step": 71355, "epoch": 859} {"train_loss": -21.0849552154541, "global_step": 71356, "epoch": 859} {"train_loss": -20.81850242614746, "global_step": 71357, "epoch": 859} {"train_loss": -20.793655395507812, "global_step": 71358, "epoch": 859} {"train_loss": -20.672666549682617, "global_step": 71359, "epoch": 859} {"train_loss": -21.142227172851562, "global_step": 71360, "epoch": 859} {"train_loss": -20.922513961791992, "global_step": 71361, "epoch": 859} {"train_loss": -20.795642852783203, "global_step": 71362, "epoch": 859} {"train_loss": -21.04800796508789, "global_step": 71363, "epoch": 859} {"train_loss": -20.850753784179688, "global_step": 71364, "epoch": 859} {"train_loss": -21.01996421813965, "global_step": 71365, "epoch": 859} {"train_loss": -20.775217056274414, "global_step": 71366, "epoch": 859} {"train_loss": -20.37102508544922, "global_step": 71367, "epoch": 859} {"train_loss": -20.88527488708496, "global_step": 71368, "epoch": 859} {"train_loss": -20.641746520996094, "global_step": 71369, "epoch": 859} {"train_loss": -21.256084442138672, "global_step": 71370, "epoch": 859} {"train_loss": -20.807762145996094, "global_step": 71371, "epoch": 859} {"train_loss": -21.16761589050293, "global_step": 71372, "epoch": 859} {"train_loss": -20.962940216064453, "global_step": 71373, "epoch": 859} {"train_loss": -20.772014617919922, "global_step": 71374, "epoch": 859} {"train_loss": -21.00957489013672, "global_step": 71375, "epoch": 859} {"train_loss": -21.082307815551758, "global_step": 71376, "epoch": 859} {"train_loss": -20.763126373291016, "global_step": 71377, "epoch": 859} {"train_loss": -20.82402801513672, "global_step": 71378, "epoch": 859} {"train_loss": -20.84902802432876, "global_step": 71379, "epoch": 859, "val_loss": 5956463.0} {"train_loss": -20.529598236083984, "global_step": 71380, "epoch": 860} {"train_loss": -20.53520965576172, "global_step": 71381, "epoch": 860} {"train_loss": -20.76641082763672, "global_step": 71382, "epoch": 860} {"train_loss": -20.25168228149414, "global_step": 71383, "epoch": 860} {"train_loss": -20.541614532470703, "global_step": 71384, "epoch": 860} {"train_loss": -20.868581771850586, "global_step": 71385, "epoch": 860} {"train_loss": -20.52050018310547, "global_step": 71386, "epoch": 860} {"train_loss": -20.494871139526367, "global_step": 71387, "epoch": 860} {"train_loss": -20.72767448425293, "global_step": 71388, "epoch": 860} {"train_loss": -20.6513729095459, "global_step": 71389, "epoch": 860} {"train_loss": -20.46431541442871, "global_step": 71390, "epoch": 860} {"train_loss": -20.5717830657959, "global_step": 71391, "epoch": 860} {"train_loss": -20.620431900024414, "global_step": 71392, "epoch": 860} {"train_loss": -20.48599624633789, "global_step": 71393, "epoch": 860} {"train_loss": -20.676206588745117, "global_step": 71394, "epoch": 860} {"train_loss": -21.07270050048828, "global_step": 71395, "epoch": 860} {"train_loss": -20.53643798828125, "global_step": 71396, "epoch": 860} {"train_loss": -20.523061752319336, "global_step": 71397, "epoch": 860} {"train_loss": -20.894697189331055, "global_step": 71398, "epoch": 860} {"train_loss": -20.492677688598633, "global_step": 71399, "epoch": 860} {"train_loss": -20.708118438720703, "global_step": 71400, "epoch": 860} {"train_loss": -20.57204246520996, "global_step": 71401, "epoch": 860} {"train_loss": -20.45638084411621, "global_step": 71402, "epoch": 860} {"train_loss": -20.47679328918457, "global_step": 71403, "epoch": 860} {"train_loss": -20.814870834350586, "global_step": 71404, "epoch": 860} {"train_loss": -20.874923706054688, "global_step": 71405, "epoch": 860} {"train_loss": -20.591012954711914, "global_step": 71406, "epoch": 860} {"train_loss": -20.882375717163086, "global_step": 71407, "epoch": 860} {"train_loss": -20.874664306640625, "global_step": 71408, "epoch": 860} {"train_loss": -20.942468643188477, "global_step": 71409, "epoch": 860} {"train_loss": -20.58225440979004, "global_step": 71410, "epoch": 860} {"train_loss": -20.738880157470703, "global_step": 71411, "epoch": 860} {"train_loss": -21.010038375854492, "global_step": 71412, "epoch": 860} {"train_loss": -21.042268753051758, "global_step": 71413, "epoch": 860} {"train_loss": -20.934171676635742, "global_step": 71414, "epoch": 860} {"train_loss": -20.984914779663086, "global_step": 71415, "epoch": 860} {"train_loss": -20.59647560119629, "global_step": 71416, "epoch": 860} {"train_loss": -20.958349227905273, "global_step": 71417, "epoch": 860} {"train_loss": -20.715906143188477, "global_step": 71418, "epoch": 860} {"train_loss": -20.804258346557617, "global_step": 71419, "epoch": 860} {"train_loss": -21.072736740112305, "global_step": 71420, "epoch": 860} {"train_loss": -20.976835250854492, "global_step": 71421, "epoch": 860} {"train_loss": -20.690637588500977, "global_step": 71422, "epoch": 860} {"train_loss": -21.047012329101562, "global_step": 71423, "epoch": 860} {"train_loss": -20.884323120117188, "global_step": 71424, "epoch": 860} {"train_loss": -21.08311653137207, "global_step": 71425, "epoch": 860} {"train_loss": -21.04779624938965, "global_step": 71426, "epoch": 860} {"train_loss": -20.632827758789062, "global_step": 71427, "epoch": 860} {"train_loss": -20.657289505004883, "global_step": 71428, "epoch": 860} {"train_loss": -20.63827896118164, "global_step": 71429, "epoch": 860} {"train_loss": -20.5865535736084, "global_step": 71430, "epoch": 860} {"train_loss": -21.026174545288086, "global_step": 71431, "epoch": 860} {"train_loss": -20.773605346679688, "global_step": 71432, "epoch": 860} {"train_loss": -20.626251220703125, "global_step": 71433, "epoch": 860} {"train_loss": -21.38007926940918, "global_step": 71434, "epoch": 860} {"train_loss": -20.90895652770996, "global_step": 71435, "epoch": 860} {"train_loss": -20.88205909729004, "global_step": 71436, "epoch": 860} {"train_loss": -20.922000885009766, "global_step": 71437, "epoch": 860} {"train_loss": -20.798982620239258, "global_step": 71438, "epoch": 860} {"train_loss": -20.457107543945312, "global_step": 71439, "epoch": 860} {"train_loss": -21.461549758911133, "global_step": 71440, "epoch": 860} {"train_loss": -20.707416534423828, "global_step": 71441, "epoch": 860} {"train_loss": -21.174701690673828, "global_step": 71442, "epoch": 860} {"train_loss": -20.669767379760742, "global_step": 71443, "epoch": 860} {"train_loss": -20.870441436767578, "global_step": 71444, "epoch": 860} {"train_loss": -20.991662979125977, "global_step": 71445, "epoch": 860} {"train_loss": -20.959836959838867, "global_step": 71446, "epoch": 860} {"train_loss": -20.73297119140625, "global_step": 71447, "epoch": 860} {"train_loss": -20.955320358276367, "global_step": 71448, "epoch": 860} {"train_loss": -21.041648864746094, "global_step": 71449, "epoch": 860} {"train_loss": -20.628597259521484, "global_step": 71450, "epoch": 860} {"train_loss": -21.10707664489746, "global_step": 71451, "epoch": 860} {"train_loss": -20.86216163635254, "global_step": 71452, "epoch": 860} {"train_loss": -20.547834396362305, "global_step": 71453, "epoch": 860} {"train_loss": -20.7806396484375, "global_step": 71454, "epoch": 860} {"train_loss": -20.80234146118164, "global_step": 71455, "epoch": 860} {"train_loss": -20.849111557006836, "global_step": 71456, "epoch": 860} {"train_loss": -20.767621994018555, "global_step": 71457, "epoch": 860} {"train_loss": -20.7294921875, "global_step": 71458, "epoch": 860} {"train_loss": -21.326923370361328, "global_step": 71459, "epoch": 860} {"train_loss": -20.753002166748047, "global_step": 71460, "epoch": 860} {"train_loss": -20.69672203063965, "global_step": 71461, "epoch": 860} {"train_loss": -20.800066384924463, "global_step": 71462, "epoch": 860, "val_loss": 5903828.5} {"train_loss": -20.07318878173828, "global_step": 71463, "epoch": 861} {"train_loss": -20.584936141967773, "global_step": 71464, "epoch": 861} {"train_loss": -20.906558990478516, "global_step": 71465, "epoch": 861} {"train_loss": -20.139522552490234, "global_step": 71466, "epoch": 861} {"train_loss": -20.890487670898438, "global_step": 71467, "epoch": 861} {"train_loss": -20.417713165283203, "global_step": 71468, "epoch": 861} {"train_loss": -20.6157169342041, "global_step": 71469, "epoch": 861} {"train_loss": -20.804920196533203, "global_step": 71470, "epoch": 861} {"train_loss": -20.594594955444336, "global_step": 71471, "epoch": 861} {"train_loss": -20.453325271606445, "global_step": 71472, "epoch": 861} {"train_loss": -20.879369735717773, "global_step": 71473, "epoch": 861} {"train_loss": -20.64628791809082, "global_step": 71474, "epoch": 861} {"train_loss": -20.408000946044922, "global_step": 71475, "epoch": 861} {"train_loss": -20.669065475463867, "global_step": 71476, "epoch": 861} {"train_loss": -20.91660499572754, "global_step": 71477, "epoch": 861} {"train_loss": -20.4601993560791, "global_step": 71478, "epoch": 861} {"train_loss": -20.77861976623535, "global_step": 71479, "epoch": 861} {"train_loss": -20.461349487304688, "global_step": 71480, "epoch": 861} {"train_loss": -20.878707885742188, "global_step": 71481, "epoch": 861} {"train_loss": -21.107275009155273, "global_step": 71482, "epoch": 861} {"train_loss": -20.85078239440918, "global_step": 71483, "epoch": 861} {"train_loss": -20.685104370117188, "global_step": 71484, "epoch": 861} {"train_loss": -21.03078842163086, "global_step": 71485, "epoch": 861} {"train_loss": -20.606502532958984, "global_step": 71486, "epoch": 861} {"train_loss": -21.082382202148438, "global_step": 71487, "epoch": 861} {"train_loss": -21.045122146606445, "global_step": 71488, "epoch": 861} {"train_loss": -20.880605697631836, "global_step": 71489, "epoch": 861} {"train_loss": -20.834400177001953, "global_step": 71490, "epoch": 861} {"train_loss": -20.746667861938477, "global_step": 71491, "epoch": 861} {"train_loss": -21.100976943969727, "global_step": 71492, "epoch": 861} {"train_loss": -20.564498901367188, "global_step": 71493, "epoch": 861} {"train_loss": -20.85462760925293, "global_step": 71494, "epoch": 861} {"train_loss": -20.9803409576416, "global_step": 71495, "epoch": 861} {"train_loss": -20.801645278930664, "global_step": 71496, "epoch": 861} {"train_loss": -20.922592163085938, "global_step": 71497, "epoch": 861} {"train_loss": -20.656219482421875, "global_step": 71498, "epoch": 861} {"train_loss": -20.565637588500977, "global_step": 71499, "epoch": 861} {"train_loss": -21.06905746459961, "global_step": 71500, "epoch": 861} {"train_loss": -20.752042770385742, "global_step": 71501, "epoch": 861} {"train_loss": -20.91919708251953, "global_step": 71502, "epoch": 861} {"train_loss": -21.143125534057617, "global_step": 71503, "epoch": 861} {"train_loss": -21.00796890258789, "global_step": 71504, "epoch": 861} {"train_loss": -20.71550178527832, "global_step": 71505, "epoch": 861} {"train_loss": -20.63750648498535, "global_step": 71506, "epoch": 861} {"train_loss": -20.761964797973633, "global_step": 71507, "epoch": 861} {"train_loss": -20.54120445251465, "global_step": 71508, "epoch": 861} {"train_loss": -21.23538589477539, "global_step": 71509, "epoch": 861} {"train_loss": -20.866060256958008, "global_step": 71510, "epoch": 861} {"train_loss": -20.745450973510742, "global_step": 71511, "epoch": 861} {"train_loss": -21.09507942199707, "global_step": 71512, "epoch": 861} {"train_loss": -20.924100875854492, "global_step": 71513, "epoch": 861} {"train_loss": -20.930694580078125, "global_step": 71514, "epoch": 861} {"train_loss": -20.628202438354492, "global_step": 71515, "epoch": 861} {"train_loss": -20.86515235900879, "global_step": 71516, "epoch": 861} {"train_loss": -20.85956382751465, "global_step": 71517, "epoch": 861} {"train_loss": -21.11574935913086, "global_step": 71518, "epoch": 861} {"train_loss": -21.072561264038086, "global_step": 71519, "epoch": 861} {"train_loss": -20.891569137573242, "global_step": 71520, "epoch": 861} {"train_loss": -20.899545669555664, "global_step": 71521, "epoch": 861} {"train_loss": -20.987546920776367, "global_step": 71522, "epoch": 861} {"train_loss": -21.00901222229004, "global_step": 71523, "epoch": 861} {"train_loss": -21.01789665222168, "global_step": 71524, "epoch": 861} {"train_loss": -20.825122833251953, "global_step": 71525, "epoch": 861} {"train_loss": -20.96114730834961, "global_step": 71526, "epoch": 861} {"train_loss": -20.94614601135254, "global_step": 71527, "epoch": 861} {"train_loss": -20.650583267211914, "global_step": 71528, "epoch": 861} {"train_loss": -20.840490341186523, "global_step": 71529, "epoch": 861} {"train_loss": -20.969226837158203, "global_step": 71530, "epoch": 861} {"train_loss": -20.636951446533203, "global_step": 71531, "epoch": 861} {"train_loss": -20.826045989990234, "global_step": 71532, "epoch": 861} {"train_loss": -20.995960235595703, "global_step": 71533, "epoch": 861} {"train_loss": -20.477209091186523, "global_step": 71534, "epoch": 861} {"train_loss": -20.96542739868164, "global_step": 71535, "epoch": 861} {"train_loss": -20.858884811401367, "global_step": 71536, "epoch": 861} {"train_loss": -20.98737907409668, "global_step": 71537, "epoch": 861} {"train_loss": -20.712833404541016, "global_step": 71538, "epoch": 861} {"train_loss": -20.95827293395996, "global_step": 71539, "epoch": 861} {"train_loss": -21.027616500854492, "global_step": 71540, "epoch": 861} {"train_loss": -20.834957122802734, "global_step": 71541, "epoch": 861} {"train_loss": -20.956737518310547, "global_step": 71542, "epoch": 861} {"train_loss": -21.002485275268555, "global_step": 71543, "epoch": 861} {"train_loss": -20.98493766784668, "global_step": 71544, "epoch": 861} {"train_loss": -20.82313450273261, "global_step": 71545, "epoch": 861, "val_loss": 5953474.0} {"train_loss": -20.79155158996582, "global_step": 71546, "epoch": 862} {"train_loss": -21.133848190307617, "global_step": 71547, "epoch": 862} {"train_loss": -20.29368019104004, "global_step": 71548, "epoch": 862} {"train_loss": -20.865631103515625, "global_step": 71549, "epoch": 862} {"train_loss": -20.635528564453125, "global_step": 71550, "epoch": 862} {"train_loss": -20.894926071166992, "global_step": 71551, "epoch": 862} {"train_loss": -20.39950180053711, "global_step": 71552, "epoch": 862} {"train_loss": -20.455663681030273, "global_step": 71553, "epoch": 862} {"train_loss": -20.64609146118164, "global_step": 71554, "epoch": 862} {"train_loss": -20.92275047302246, "global_step": 71555, "epoch": 862} {"train_loss": -20.998905181884766, "global_step": 71556, "epoch": 862} {"train_loss": -20.454374313354492, "global_step": 71557, "epoch": 862} {"train_loss": -20.59920310974121, "global_step": 71558, "epoch": 862} {"train_loss": -20.380380630493164, "global_step": 71559, "epoch": 862} {"train_loss": -20.827651977539062, "global_step": 71560, "epoch": 862} {"train_loss": -20.755916595458984, "global_step": 71561, "epoch": 862} {"train_loss": -20.567325592041016, "global_step": 71562, "epoch": 862} {"train_loss": -20.92669677734375, "global_step": 71563, "epoch": 862} {"train_loss": -20.440168380737305, "global_step": 71564, "epoch": 862} {"train_loss": -20.368566513061523, "global_step": 71565, "epoch": 862} {"train_loss": -20.652284622192383, "global_step": 71566, "epoch": 862} {"train_loss": -20.62299919128418, "global_step": 71567, "epoch": 862} {"train_loss": -20.81032371520996, "global_step": 71568, "epoch": 862} {"train_loss": -20.833683013916016, "global_step": 71569, "epoch": 862} {"train_loss": -20.790985107421875, "global_step": 71570, "epoch": 862} {"train_loss": -21.11800193786621, "global_step": 71571, "epoch": 862} {"train_loss": -20.84571647644043, "global_step": 71572, "epoch": 862} {"train_loss": -20.925790786743164, "global_step": 71573, "epoch": 862} {"train_loss": -21.084760665893555, "global_step": 71574, "epoch": 862} {"train_loss": -20.641653060913086, "global_step": 71575, "epoch": 862} {"train_loss": -20.576602935791016, "global_step": 71576, "epoch": 862} {"train_loss": -20.817798614501953, "global_step": 71577, "epoch": 862} {"train_loss": -21.035390853881836, "global_step": 71578, "epoch": 862} {"train_loss": -21.213560104370117, "global_step": 71579, "epoch": 862} {"train_loss": -20.997323989868164, "global_step": 71580, "epoch": 862} {"train_loss": -20.823163986206055, "global_step": 71581, "epoch": 862} {"train_loss": -21.013111114501953, "global_step": 71582, "epoch": 862} {"train_loss": -20.686725616455078, "global_step": 71583, "epoch": 862} {"train_loss": -20.888158798217773, "global_step": 71584, "epoch": 862} {"train_loss": -20.716022491455078, "global_step": 71585, "epoch": 862} {"train_loss": -21.053171157836914, "global_step": 71586, "epoch": 862} {"train_loss": -20.90991973876953, "global_step": 71587, "epoch": 862} {"train_loss": -20.968826293945312, "global_step": 71588, "epoch": 862} {"train_loss": -21.13687515258789, "global_step": 71589, "epoch": 862} {"train_loss": -20.883615493774414, "global_step": 71590, "epoch": 862} {"train_loss": -20.828378677368164, "global_step": 71591, "epoch": 862} {"train_loss": -20.9267635345459, "global_step": 71592, "epoch": 862} {"train_loss": -21.03229331970215, "global_step": 71593, "epoch": 862} {"train_loss": -20.887710571289062, "global_step": 71594, "epoch": 862} {"train_loss": -21.041749954223633, "global_step": 71595, "epoch": 862} {"train_loss": -20.61021614074707, "global_step": 71596, "epoch": 862} {"train_loss": -20.731447219848633, "global_step": 71597, "epoch": 862} {"train_loss": -20.97443389892578, "global_step": 71598, "epoch": 862} {"train_loss": -20.82856559753418, "global_step": 71599, "epoch": 862} {"train_loss": -20.841739654541016, "global_step": 71600, "epoch": 862} {"train_loss": -21.04488182067871, "global_step": 71601, "epoch": 862} {"train_loss": -20.907384872436523, "global_step": 71602, "epoch": 862} {"train_loss": -21.07649040222168, "global_step": 71603, "epoch": 862} {"train_loss": -20.86181640625, "global_step": 71604, "epoch": 862} {"train_loss": -21.385114669799805, "global_step": 71605, "epoch": 862} {"train_loss": -20.80080223083496, "global_step": 71606, "epoch": 862} {"train_loss": -20.890424728393555, "global_step": 71607, "epoch": 862} {"train_loss": -20.87037467956543, "global_step": 71608, "epoch": 862} {"train_loss": -20.965961456298828, "global_step": 71609, "epoch": 862} {"train_loss": -20.606746673583984, "global_step": 71610, "epoch": 862} {"train_loss": -20.820688247680664, "global_step": 71611, "epoch": 862} {"train_loss": -20.5650634765625, "global_step": 71612, "epoch": 862} {"train_loss": -21.109708786010742, "global_step": 71613, "epoch": 862} {"train_loss": -21.088844299316406, "global_step": 71614, "epoch": 862} {"train_loss": -20.580121994018555, "global_step": 71615, "epoch": 862} {"train_loss": -21.009977340698242, "global_step": 71616, "epoch": 862} {"train_loss": -20.885894775390625, "global_step": 71617, "epoch": 862} {"train_loss": -21.225189208984375, "global_step": 71618, "epoch": 862} {"train_loss": -21.1124267578125, "global_step": 71619, "epoch": 862} {"train_loss": -21.013212203979492, "global_step": 71620, "epoch": 862} {"train_loss": -21.13880729675293, "global_step": 71621, "epoch": 862} {"train_loss": -20.891029357910156, "global_step": 71622, "epoch": 862} {"train_loss": -20.627405166625977, "global_step": 71623, "epoch": 862} {"train_loss": -21.186124801635742, "global_step": 71624, "epoch": 862} {"train_loss": -20.859710693359375, "global_step": 71625, "epoch": 862} {"train_loss": -21.148733139038086, "global_step": 71626, "epoch": 862} {"train_loss": -20.880491256713867, "global_step": 71627, "epoch": 862} {"train_loss": -20.871948219207397, "global_step": 71628, "epoch": 862, "val_loss": 5958840.0} {"train_loss": -20.357046127319336, "global_step": 71629, "epoch": 863} {"train_loss": -20.602113723754883, "global_step": 71630, "epoch": 863} {"train_loss": -20.569995880126953, "global_step": 71631, "epoch": 863} {"train_loss": -20.720022201538086, "global_step": 71632, "epoch": 863} {"train_loss": -20.71834945678711, "global_step": 71633, "epoch": 863} {"train_loss": -20.56619644165039, "global_step": 71634, "epoch": 863} {"train_loss": -20.497159957885742, "global_step": 71635, "epoch": 863} {"train_loss": -20.1546573638916, "global_step": 71636, "epoch": 863} {"train_loss": -20.556493759155273, "global_step": 71637, "epoch": 863} {"train_loss": -20.78714370727539, "global_step": 71638, "epoch": 863} {"train_loss": -20.987138748168945, "global_step": 71639, "epoch": 863} {"train_loss": -20.826190948486328, "global_step": 71640, "epoch": 863} {"train_loss": -20.52021598815918, "global_step": 71641, "epoch": 863} {"train_loss": -21.209278106689453, "global_step": 71642, "epoch": 863} {"train_loss": -20.798574447631836, "global_step": 71643, "epoch": 863} {"train_loss": -20.855472564697266, "global_step": 71644, "epoch": 863} {"train_loss": -20.51041603088379, "global_step": 71645, "epoch": 863} {"train_loss": -20.629796981811523, "global_step": 71646, "epoch": 863} {"train_loss": -20.427194595336914, "global_step": 71647, "epoch": 863} {"train_loss": -20.631933212280273, "global_step": 71648, "epoch": 863} {"train_loss": -20.678319931030273, "global_step": 71649, "epoch": 863} {"train_loss": -20.87501335144043, "global_step": 71650, "epoch": 863} {"train_loss": -20.597869873046875, "global_step": 71651, "epoch": 863} {"train_loss": -20.740453720092773, "global_step": 71652, "epoch": 863} {"train_loss": -20.96897315979004, "global_step": 71653, "epoch": 863} {"train_loss": -21.148263931274414, "global_step": 71654, "epoch": 863} {"train_loss": -21.0924129486084, "global_step": 71655, "epoch": 863} {"train_loss": -20.9405574798584, "global_step": 71656, "epoch": 863} {"train_loss": -20.82184410095215, "global_step": 71657, "epoch": 863} {"train_loss": -21.067758560180664, "global_step": 71658, "epoch": 863} {"train_loss": -21.050437927246094, "global_step": 71659, "epoch": 863} {"train_loss": -20.7785587310791, "global_step": 71660, "epoch": 863} {"train_loss": -20.938434600830078, "global_step": 71661, "epoch": 863} {"train_loss": -20.750085830688477, "global_step": 71662, "epoch": 863} {"train_loss": -20.80317497253418, "global_step": 71663, "epoch": 863} {"train_loss": -21.08989143371582, "global_step": 71664, "epoch": 863} {"train_loss": -20.724966049194336, "global_step": 71665, "epoch": 863} {"train_loss": -20.896024703979492, "global_step": 71666, "epoch": 863} {"train_loss": -20.70516014099121, "global_step": 71667, "epoch": 863} {"train_loss": -20.875375747680664, "global_step": 71668, "epoch": 863} {"train_loss": -20.990766525268555, "global_step": 71669, "epoch": 863} {"train_loss": -21.408994674682617, "global_step": 71670, "epoch": 863} {"train_loss": -20.811981201171875, "global_step": 71671, "epoch": 863} {"train_loss": -20.942625045776367, "global_step": 71672, "epoch": 863} {"train_loss": -21.055173873901367, "global_step": 71673, "epoch": 863} {"train_loss": -20.95852279663086, "global_step": 71674, "epoch": 863} {"train_loss": -20.742292404174805, "global_step": 71675, "epoch": 863} {"train_loss": -20.688270568847656, "global_step": 71676, "epoch": 863} {"train_loss": -20.69473648071289, "global_step": 71677, "epoch": 863} {"train_loss": -21.190195083618164, "global_step": 71678, "epoch": 863} {"train_loss": -20.753225326538086, "global_step": 71679, "epoch": 863} {"train_loss": -21.283008575439453, "global_step": 71680, "epoch": 863} {"train_loss": -20.710615158081055, "global_step": 71681, "epoch": 863} {"train_loss": -21.029483795166016, "global_step": 71682, "epoch": 863} {"train_loss": -20.918350219726562, "global_step": 71683, "epoch": 863} {"train_loss": -21.025175094604492, "global_step": 71684, "epoch": 863} {"train_loss": -21.036710739135742, "global_step": 71685, "epoch": 863} {"train_loss": -20.808942794799805, "global_step": 71686, "epoch": 863} {"train_loss": -20.92844009399414, "global_step": 71687, "epoch": 863} {"train_loss": -20.583250045776367, "global_step": 71688, "epoch": 863} {"train_loss": -20.548385620117188, "global_step": 71689, "epoch": 863} {"train_loss": -20.516592025756836, "global_step": 71690, "epoch": 863} {"train_loss": -21.061603546142578, "global_step": 71691, "epoch": 863} {"train_loss": -20.877885818481445, "global_step": 71692, "epoch": 863} {"train_loss": -20.924320220947266, "global_step": 71693, "epoch": 863} {"train_loss": -20.95979118347168, "global_step": 71694, "epoch": 863} {"train_loss": -20.756141662597656, "global_step": 71695, "epoch": 863} {"train_loss": -20.664724349975586, "global_step": 71696, "epoch": 863} {"train_loss": -21.065977096557617, "global_step": 71697, "epoch": 863} {"train_loss": -20.6551513671875, "global_step": 71698, "epoch": 863} {"train_loss": -20.77292823791504, "global_step": 71699, "epoch": 863} {"train_loss": -20.46659278869629, "global_step": 71700, "epoch": 863} {"train_loss": -21.017072677612305, "global_step": 71701, "epoch": 863} {"train_loss": -20.903900146484375, "global_step": 71702, "epoch": 863} {"train_loss": -20.778579711914062, "global_step": 71703, "epoch": 863} {"train_loss": -20.91690444946289, "global_step": 71704, "epoch": 863} {"train_loss": -20.69135284423828, "global_step": 71705, "epoch": 863} {"train_loss": -20.925642013549805, "global_step": 71706, "epoch": 863} {"train_loss": -21.136899948120117, "global_step": 71707, "epoch": 863} {"train_loss": -21.112873077392578, "global_step": 71708, "epoch": 863} {"train_loss": -20.649473190307617, "global_step": 71709, "epoch": 863} {"train_loss": -20.914472579956055, "global_step": 71710, "epoch": 863} {"train_loss": -20.819249716149756, "global_step": 71711, "epoch": 863, "val_loss": 5956316.0} {"train_loss": -20.321332931518555, "global_step": 71712, "epoch": 864} {"train_loss": -20.570646286010742, "global_step": 71713, "epoch": 864} {"train_loss": -20.861007690429688, "global_step": 71714, "epoch": 864} {"train_loss": -20.758684158325195, "global_step": 71715, "epoch": 864} {"train_loss": -20.6921329498291, "global_step": 71716, "epoch": 864} {"train_loss": -20.435970306396484, "global_step": 71717, "epoch": 864} {"train_loss": -20.92706871032715, "global_step": 71718, "epoch": 864} {"train_loss": -21.039621353149414, "global_step": 71719, "epoch": 864} {"train_loss": -20.50827980041504, "global_step": 71720, "epoch": 864} {"train_loss": -20.858322143554688, "global_step": 71721, "epoch": 864} {"train_loss": -20.857885360717773, "global_step": 71722, "epoch": 864} {"train_loss": -20.508647918701172, "global_step": 71723, "epoch": 864} {"train_loss": -21.101160049438477, "global_step": 71724, "epoch": 864} {"train_loss": -21.3631591796875, "global_step": 71725, "epoch": 864} {"train_loss": -20.54616355895996, "global_step": 71726, "epoch": 864} {"train_loss": -20.719335556030273, "global_step": 71727, "epoch": 864} {"train_loss": -20.705839157104492, "global_step": 71728, "epoch": 864} {"train_loss": -20.901691436767578, "global_step": 71729, "epoch": 864} {"train_loss": -21.07684898376465, "global_step": 71730, "epoch": 864} {"train_loss": -20.266279220581055, "global_step": 71731, "epoch": 864} {"train_loss": -20.92544174194336, "global_step": 71732, "epoch": 864} {"train_loss": -20.639690399169922, "global_step": 71733, "epoch": 864} {"train_loss": -20.786779403686523, "global_step": 71734, "epoch": 864} {"train_loss": -20.749223709106445, "global_step": 71735, "epoch": 864} {"train_loss": -21.118637084960938, "global_step": 71736, "epoch": 864} {"train_loss": -20.951143264770508, "global_step": 71737, "epoch": 864} {"train_loss": -20.978866577148438, "global_step": 71738, "epoch": 864} {"train_loss": -20.45476722717285, "global_step": 71739, "epoch": 864} {"train_loss": -21.248159408569336, "global_step": 71740, "epoch": 864} {"train_loss": -21.218013763427734, "global_step": 71741, "epoch": 864} {"train_loss": -20.785856246948242, "global_step": 71742, "epoch": 864} {"train_loss": -20.771095275878906, "global_step": 71743, "epoch": 864} {"train_loss": -21.238880157470703, "global_step": 71744, "epoch": 864} {"train_loss": -20.91042137145996, "global_step": 71745, "epoch": 864} {"train_loss": -21.36539649963379, "global_step": 71746, "epoch": 864} {"train_loss": -20.88508415222168, "global_step": 71747, "epoch": 864} {"train_loss": -20.817983627319336, "global_step": 71748, "epoch": 864} {"train_loss": -21.275705337524414, "global_step": 71749, "epoch": 864} {"train_loss": -21.016088485717773, "global_step": 71750, "epoch": 864} {"train_loss": -20.97892189025879, "global_step": 71751, "epoch": 864} {"train_loss": -20.73212432861328, "global_step": 71752, "epoch": 864} {"train_loss": -20.89398765563965, "global_step": 71753, "epoch": 864} {"train_loss": -20.927234649658203, "global_step": 71754, "epoch": 864} {"train_loss": -20.33146858215332, "global_step": 71755, "epoch": 864} {"train_loss": -21.0339412689209, "global_step": 71756, "epoch": 864} {"train_loss": -20.804044723510742, "global_step": 71757, "epoch": 864} {"train_loss": -21.085790634155273, "global_step": 71758, "epoch": 864} {"train_loss": -20.950483322143555, "global_step": 71759, "epoch": 864} {"train_loss": -20.78426170349121, "global_step": 71760, "epoch": 864} {"train_loss": -21.006750106811523, "global_step": 71761, "epoch": 864} {"train_loss": -20.82282066345215, "global_step": 71762, "epoch": 864} {"train_loss": -20.899967193603516, "global_step": 71763, "epoch": 864} {"train_loss": -21.006210327148438, "global_step": 71764, "epoch": 864} {"train_loss": -20.898061752319336, "global_step": 71765, "epoch": 864} {"train_loss": -20.724103927612305, "global_step": 71766, "epoch": 864} {"train_loss": -21.192808151245117, "global_step": 71767, "epoch": 864} {"train_loss": -20.766761779785156, "global_step": 71768, "epoch": 864} {"train_loss": -20.440967559814453, "global_step": 71769, "epoch": 864} {"train_loss": -20.89009666442871, "global_step": 71770, "epoch": 864} {"train_loss": -20.839529037475586, "global_step": 71771, "epoch": 864} {"train_loss": -21.163646697998047, "global_step": 71772, "epoch": 864} {"train_loss": -20.921772003173828, "global_step": 71773, "epoch": 864} {"train_loss": -21.21254539489746, "global_step": 71774, "epoch": 864} {"train_loss": -20.359155654907227, "global_step": 71775, "epoch": 864} {"train_loss": -21.005996704101562, "global_step": 71776, "epoch": 864} {"train_loss": -20.973861694335938, "global_step": 71777, "epoch": 864} {"train_loss": -21.194177627563477, "global_step": 71778, "epoch": 864} {"train_loss": -21.19098663330078, "global_step": 71779, "epoch": 864} {"train_loss": -20.78301239013672, "global_step": 71780, "epoch": 864} {"train_loss": -20.634885787963867, "global_step": 71781, "epoch": 864} {"train_loss": -20.547212600708008, "global_step": 71782, "epoch": 864} {"train_loss": -21.119665145874023, "global_step": 71783, "epoch": 864} {"train_loss": -20.953826904296875, "global_step": 71784, "epoch": 864} {"train_loss": -20.941360473632812, "global_step": 71785, "epoch": 864} {"train_loss": -20.977811813354492, "global_step": 71786, "epoch": 864} {"train_loss": -21.01322364807129, "global_step": 71787, "epoch": 864} {"train_loss": -21.065641403198242, "global_step": 71788, "epoch": 864} {"train_loss": -20.740339279174805, "global_step": 71789, "epoch": 864} {"train_loss": -20.959409713745117, "global_step": 71790, "epoch": 864} {"train_loss": -20.815853118896484, "global_step": 71791, "epoch": 864} {"train_loss": -20.87820053100586, "global_step": 71792, "epoch": 864} {"train_loss": -20.592445373535156, "global_step": 71793, "epoch": 864} {"train_loss": -20.868369481649744, "global_step": 71794, "epoch": 864, "val_loss": 5986544.5} {"train_loss": -20.24714469909668, "global_step": 71795, "epoch": 865} {"train_loss": -20.193939208984375, "global_step": 71796, "epoch": 865} {"train_loss": -20.162540435791016, "global_step": 71797, "epoch": 865} {"train_loss": -20.438322067260742, "global_step": 71798, "epoch": 865} {"train_loss": -20.839136123657227, "global_step": 71799, "epoch": 865} {"train_loss": -20.441741943359375, "global_step": 71800, "epoch": 865} {"train_loss": -20.5024471282959, "global_step": 71801, "epoch": 865} {"train_loss": -20.5623722076416, "global_step": 71802, "epoch": 865} {"train_loss": -20.393335342407227, "global_step": 71803, "epoch": 865} {"train_loss": -20.72332763671875, "global_step": 71804, "epoch": 865} {"train_loss": -20.797468185424805, "global_step": 71805, "epoch": 865} {"train_loss": -20.61402130126953, "global_step": 71806, "epoch": 865} {"train_loss": -20.72535514831543, "global_step": 71807, "epoch": 865} {"train_loss": -21.1661434173584, "global_step": 71808, "epoch": 865} {"train_loss": -20.379159927368164, "global_step": 71809, "epoch": 865} {"train_loss": -20.783767700195312, "global_step": 71810, "epoch": 865} {"train_loss": -20.789947509765625, "global_step": 71811, "epoch": 865} {"train_loss": -20.757213592529297, "global_step": 71812, "epoch": 865} {"train_loss": -20.75436782836914, "global_step": 71813, "epoch": 865} {"train_loss": -20.98171043395996, "global_step": 71814, "epoch": 865} {"train_loss": -20.776145935058594, "global_step": 71815, "epoch": 865} {"train_loss": -20.847259521484375, "global_step": 71816, "epoch": 865} {"train_loss": -20.888154983520508, "global_step": 71817, "epoch": 865} {"train_loss": -21.044946670532227, "global_step": 71818, "epoch": 865} {"train_loss": -20.811229705810547, "global_step": 71819, "epoch": 865} {"train_loss": -20.82108497619629, "global_step": 71820, "epoch": 865} {"train_loss": -20.973981857299805, "global_step": 71821, "epoch": 865} {"train_loss": -20.920169830322266, "global_step": 71822, "epoch": 865} {"train_loss": -20.935461044311523, "global_step": 71823, "epoch": 865} {"train_loss": -20.93292808532715, "global_step": 71824, "epoch": 865} {"train_loss": -20.646249771118164, "global_step": 71825, "epoch": 865} {"train_loss": -20.78019905090332, "global_step": 71826, "epoch": 865} {"train_loss": -20.67661476135254, "global_step": 71827, "epoch": 865} {"train_loss": -21.101531982421875, "global_step": 71828, "epoch": 865} {"train_loss": -21.090904235839844, "global_step": 71829, "epoch": 865} {"train_loss": -20.75699234008789, "global_step": 71830, "epoch": 865} {"train_loss": -21.124052047729492, "global_step": 71831, "epoch": 865} {"train_loss": -21.038251876831055, "global_step": 71832, "epoch": 865} {"train_loss": -20.796470642089844, "global_step": 71833, "epoch": 865} {"train_loss": -21.023345947265625, "global_step": 71834, "epoch": 865} {"train_loss": -20.801233291625977, "global_step": 71835, "epoch": 865} {"train_loss": -20.856403350830078, "global_step": 71836, "epoch": 865} {"train_loss": -20.93479347229004, "global_step": 71837, "epoch": 865} {"train_loss": -20.748519897460938, "global_step": 71838, "epoch": 865} {"train_loss": -20.983234405517578, "global_step": 71839, "epoch": 865} {"train_loss": -21.096311569213867, "global_step": 71840, "epoch": 865} {"train_loss": -20.796001434326172, "global_step": 71841, "epoch": 865} {"train_loss": -20.822874069213867, "global_step": 71842, "epoch": 865} {"train_loss": -20.945524215698242, "global_step": 71843, "epoch": 865} {"train_loss": -21.047779083251953, "global_step": 71844, "epoch": 865} {"train_loss": -21.153732299804688, "global_step": 71845, "epoch": 865} {"train_loss": -20.74298667907715, "global_step": 71846, "epoch": 865} {"train_loss": -20.957019805908203, "global_step": 71847, "epoch": 865} {"train_loss": -20.912673950195312, "global_step": 71848, "epoch": 865} {"train_loss": -21.002933502197266, "global_step": 71849, "epoch": 865} {"train_loss": -20.90032386779785, "global_step": 71850, "epoch": 865} {"train_loss": -20.84897232055664, "global_step": 71851, "epoch": 865} {"train_loss": -20.78749656677246, "global_step": 71852, "epoch": 865} {"train_loss": -20.939863204956055, "global_step": 71853, "epoch": 865} {"train_loss": -20.963369369506836, "global_step": 71854, "epoch": 865} {"train_loss": -21.083086013793945, "global_step": 71855, "epoch": 865} {"train_loss": -20.942419052124023, "global_step": 71856, "epoch": 865} {"train_loss": -20.953332901000977, "global_step": 71857, "epoch": 865} {"train_loss": -20.864126205444336, "global_step": 71858, "epoch": 865} {"train_loss": -21.19732093811035, "global_step": 71859, "epoch": 865} {"train_loss": -21.333709716796875, "global_step": 71860, "epoch": 865} {"train_loss": -21.233415603637695, "global_step": 71861, "epoch": 865} {"train_loss": -21.235671997070312, "global_step": 71862, "epoch": 865} {"train_loss": -21.304031372070312, "global_step": 71863, "epoch": 865} {"train_loss": -20.894193649291992, "global_step": 71864, "epoch": 865} {"train_loss": -21.19654655456543, "global_step": 71865, "epoch": 865} {"train_loss": -20.61527442932129, "global_step": 71866, "epoch": 865} {"train_loss": -20.517702102661133, "global_step": 71867, "epoch": 865} {"train_loss": -20.69700050354004, "global_step": 71868, "epoch": 865} {"train_loss": -21.040157318115234, "global_step": 71869, "epoch": 865} {"train_loss": -20.833423614501953, "global_step": 71870, "epoch": 865} {"train_loss": -20.645437240600586, "global_step": 71871, "epoch": 865} {"train_loss": -20.873807907104492, "global_step": 71872, "epoch": 865} {"train_loss": -21.071834564208984, "global_step": 71873, "epoch": 865} {"train_loss": -20.6560001373291, "global_step": 71874, "epoch": 865} {"train_loss": -20.73508644104004, "global_step": 71875, "epoch": 865} {"train_loss": -20.7222900390625, "global_step": 71876, "epoch": 865} {"train_loss": -20.842494642878155, "global_step": 71877, "epoch": 865, "val_loss": 5985268.0} {"train_loss": -20.90727424621582, "global_step": 71878, "epoch": 866} {"train_loss": -20.86916160583496, "global_step": 71879, "epoch": 866} {"train_loss": -21.17542266845703, "global_step": 71880, "epoch": 866} {"train_loss": -21.084518432617188, "global_step": 71881, "epoch": 866} {"train_loss": -21.029470443725586, "global_step": 71882, "epoch": 866} {"train_loss": -20.582687377929688, "global_step": 71883, "epoch": 866} {"train_loss": -20.570297241210938, "global_step": 71884, "epoch": 866} {"train_loss": -20.825571060180664, "global_step": 71885, "epoch": 866} {"train_loss": -20.796390533447266, "global_step": 71886, "epoch": 866} {"train_loss": -20.82620620727539, "global_step": 71887, "epoch": 866} {"train_loss": -20.978544235229492, "global_step": 71888, "epoch": 866} {"train_loss": -20.61813735961914, "global_step": 71889, "epoch": 866} {"train_loss": -20.85089111328125, "global_step": 71890, "epoch": 866} {"train_loss": -20.8868465423584, "global_step": 71891, "epoch": 866} {"train_loss": -21.172048568725586, "global_step": 71892, "epoch": 866} {"train_loss": -20.686447143554688, "global_step": 71893, "epoch": 866} {"train_loss": -20.96478271484375, "global_step": 71894, "epoch": 866} {"train_loss": -21.12066650390625, "global_step": 71895, "epoch": 866} {"train_loss": -20.776519775390625, "global_step": 71896, "epoch": 866} {"train_loss": -21.427867889404297, "global_step": 71897, "epoch": 866} {"train_loss": -20.586231231689453, "global_step": 71898, "epoch": 866} {"train_loss": -21.343748092651367, "global_step": 71899, "epoch": 866} {"train_loss": -20.804046630859375, "global_step": 71900, "epoch": 866} {"train_loss": -21.076292037963867, "global_step": 71901, "epoch": 866} {"train_loss": -21.000280380249023, "global_step": 71902, "epoch": 866} {"train_loss": -20.96758460998535, "global_step": 71903, "epoch": 866} {"train_loss": -20.79356575012207, "global_step": 71904, "epoch": 866} {"train_loss": -20.95716667175293, "global_step": 71905, "epoch": 866} {"train_loss": -20.997196197509766, "global_step": 71906, "epoch": 866} {"train_loss": -20.813922882080078, "global_step": 71907, "epoch": 866} {"train_loss": -21.039142608642578, "global_step": 71908, "epoch": 866} {"train_loss": -20.903411865234375, "global_step": 71909, "epoch": 866} {"train_loss": -20.991596221923828, "global_step": 71910, "epoch": 866} {"train_loss": -20.77137565612793, "global_step": 71911, "epoch": 866} {"train_loss": -21.3205509185791, "global_step": 71912, "epoch": 866} {"train_loss": -20.83692741394043, "global_step": 71913, "epoch": 866} {"train_loss": -20.872453689575195, "global_step": 71914, "epoch": 866} {"train_loss": -20.96199607849121, "global_step": 71915, "epoch": 866} {"train_loss": -20.8885555267334, "global_step": 71916, "epoch": 866} {"train_loss": -21.28888702392578, "global_step": 71917, "epoch": 866} {"train_loss": -20.775619506835938, "global_step": 71918, "epoch": 866} {"train_loss": -21.02640724182129, "global_step": 71919, "epoch": 866} {"train_loss": -20.761884689331055, "global_step": 71920, "epoch": 866} {"train_loss": -20.796342849731445, "global_step": 71921, "epoch": 866} {"train_loss": -20.861242294311523, "global_step": 71922, "epoch": 866} {"train_loss": -20.8864688873291, "global_step": 71923, "epoch": 866} {"train_loss": -20.883691787719727, "global_step": 71924, "epoch": 866} {"train_loss": -20.657621383666992, "global_step": 71925, "epoch": 866} {"train_loss": -21.026466369628906, "global_step": 71926, "epoch": 866} {"train_loss": -20.76639175415039, "global_step": 71927, "epoch": 866} {"train_loss": -20.9880428314209, "global_step": 71928, "epoch": 866} {"train_loss": -20.86472511291504, "global_step": 71929, "epoch": 866} {"train_loss": -20.62663459777832, "global_step": 71930, "epoch": 866} {"train_loss": -20.818687438964844, "global_step": 71931, "epoch": 866} {"train_loss": -20.8977108001709, "global_step": 71932, "epoch": 866} {"train_loss": -21.00873374938965, "global_step": 71933, "epoch": 866} {"train_loss": -20.951026916503906, "global_step": 71934, "epoch": 866} {"train_loss": -20.88054847717285, "global_step": 71935, "epoch": 866} {"train_loss": -21.037099838256836, "global_step": 71936, "epoch": 866} {"train_loss": -20.814537048339844, "global_step": 71937, "epoch": 866} {"train_loss": -21.065872192382812, "global_step": 71938, "epoch": 866} {"train_loss": -20.911733627319336, "global_step": 71939, "epoch": 866} {"train_loss": -20.701644897460938, "global_step": 71940, "epoch": 866} {"train_loss": -20.922101974487305, "global_step": 71941, "epoch": 866} {"train_loss": -20.728036880493164, "global_step": 71942, "epoch": 866} {"train_loss": -20.58938980102539, "global_step": 71943, "epoch": 866} {"train_loss": -20.841262817382812, "global_step": 71944, "epoch": 866} {"train_loss": -20.91851806640625, "global_step": 71945, "epoch": 866} {"train_loss": -20.996843338012695, "global_step": 71946, "epoch": 866} {"train_loss": -20.687711715698242, "global_step": 71947, "epoch": 866} {"train_loss": -20.885141372680664, "global_step": 71948, "epoch": 866} {"train_loss": -20.694416046142578, "global_step": 71949, "epoch": 866} {"train_loss": -21.243478775024414, "global_step": 71950, "epoch": 866} {"train_loss": -20.78483009338379, "global_step": 71951, "epoch": 866} {"train_loss": -20.916500091552734, "global_step": 71952, "epoch": 866} {"train_loss": -21.20013999938965, "global_step": 71953, "epoch": 866} {"train_loss": -20.913297653198242, "global_step": 71954, "epoch": 866} {"train_loss": -20.816938400268555, "global_step": 71955, "epoch": 866} {"train_loss": -20.85910987854004, "global_step": 71956, "epoch": 866} {"train_loss": -21.096242904663086, "global_step": 71957, "epoch": 866} {"train_loss": -20.789613723754883, "global_step": 71958, "epoch": 866} {"train_loss": -21.131681442260742, "global_step": 71959, "epoch": 866} {"train_loss": -20.902589338371552, "global_step": 71960, "epoch": 866, "val_loss": 6018728.5} {"train_loss": -20.443532943725586, "global_step": 71961, "epoch": 867} {"train_loss": -20.567489624023438, "global_step": 71962, "epoch": 867} {"train_loss": -20.798261642456055, "global_step": 71963, "epoch": 867} {"train_loss": -20.470182418823242, "global_step": 71964, "epoch": 867} {"train_loss": -20.568164825439453, "global_step": 71965, "epoch": 867} {"train_loss": -21.13688087463379, "global_step": 71966, "epoch": 867} {"train_loss": -20.39134979248047, "global_step": 71967, "epoch": 867} {"train_loss": -21.18548011779785, "global_step": 71968, "epoch": 867} {"train_loss": -20.33187484741211, "global_step": 71969, "epoch": 867} {"train_loss": -21.1771297454834, "global_step": 71970, "epoch": 867} {"train_loss": -20.717432022094727, "global_step": 71971, "epoch": 867} {"train_loss": -20.99921226501465, "global_step": 71972, "epoch": 867} {"train_loss": -20.94748878479004, "global_step": 71973, "epoch": 867} {"train_loss": -20.621570587158203, "global_step": 71974, "epoch": 867} {"train_loss": -20.669910430908203, "global_step": 71975, "epoch": 867} {"train_loss": -20.803255081176758, "global_step": 71976, "epoch": 867} {"train_loss": -21.003820419311523, "global_step": 71977, "epoch": 867} {"train_loss": -20.969242095947266, "global_step": 71978, "epoch": 867} {"train_loss": -20.74711036682129, "global_step": 71979, "epoch": 867} {"train_loss": -20.924455642700195, "global_step": 71980, "epoch": 867} {"train_loss": -20.801776885986328, "global_step": 71981, "epoch": 867} {"train_loss": -20.530866622924805, "global_step": 71982, "epoch": 867} {"train_loss": -21.021570205688477, "global_step": 71983, "epoch": 867} {"train_loss": -20.531389236450195, "global_step": 71984, "epoch": 867} {"train_loss": -20.873188018798828, "global_step": 71985, "epoch": 867} {"train_loss": -21.057010650634766, "global_step": 71986, "epoch": 867} {"train_loss": -20.812999725341797, "global_step": 71987, "epoch": 867} {"train_loss": -20.804141998291016, "global_step": 71988, "epoch": 867} {"train_loss": -20.608701705932617, "global_step": 71989, "epoch": 867} {"train_loss": -21.190275192260742, "global_step": 71990, "epoch": 867} {"train_loss": -20.766836166381836, "global_step": 71991, "epoch": 867} {"train_loss": -21.03377914428711, "global_step": 71992, "epoch": 867} {"train_loss": -20.85829734802246, "global_step": 71993, "epoch": 867} {"train_loss": -21.256052017211914, "global_step": 71994, "epoch": 867} {"train_loss": -20.79163932800293, "global_step": 71995, "epoch": 867} {"train_loss": -20.83698081970215, "global_step": 71996, "epoch": 867} {"train_loss": -20.897451400756836, "global_step": 71997, "epoch": 867} {"train_loss": -20.879018783569336, "global_step": 71998, "epoch": 867} {"train_loss": -21.052045822143555, "global_step": 71999, "epoch": 867} {"train_loss": -21.11835289001465, "global_step": 72000, "epoch": 867} {"train_loss": -20.91254234313965, "global_step": 72001, "epoch": 867} {"train_loss": -20.92660903930664, "global_step": 72002, "epoch": 867} {"train_loss": -20.63765525817871, "global_step": 72003, "epoch": 867} {"train_loss": -20.83011245727539, "global_step": 72004, "epoch": 867} {"train_loss": -20.833059310913086, "global_step": 72005, "epoch": 867} {"train_loss": -20.922727584838867, "global_step": 72006, "epoch": 867} {"train_loss": -21.118240356445312, "global_step": 72007, "epoch": 867} {"train_loss": -21.045734405517578, "global_step": 72008, "epoch": 867} {"train_loss": -21.05660057067871, "global_step": 72009, "epoch": 867} {"train_loss": -21.02327537536621, "global_step": 72010, "epoch": 867} {"train_loss": -21.03076171875, "global_step": 72011, "epoch": 867} {"train_loss": -20.753883361816406, "global_step": 72012, "epoch": 867} {"train_loss": -20.755260467529297, "global_step": 72013, "epoch": 867} {"train_loss": -20.984045028686523, "global_step": 72014, "epoch": 867} {"train_loss": -20.829687118530273, "global_step": 72015, "epoch": 867} {"train_loss": -20.832622528076172, "global_step": 72016, "epoch": 867} {"train_loss": -20.72455406188965, "global_step": 72017, "epoch": 867} {"train_loss": -21.010549545288086, "global_step": 72018, "epoch": 867} {"train_loss": -21.20673942565918, "global_step": 72019, "epoch": 867} {"train_loss": -20.78873634338379, "global_step": 72020, "epoch": 867} {"train_loss": -20.791101455688477, "global_step": 72021, "epoch": 867} {"train_loss": -21.386756896972656, "global_step": 72022, "epoch": 867} {"train_loss": -20.81918716430664, "global_step": 72023, "epoch": 867} {"train_loss": -21.00916862487793, "global_step": 72024, "epoch": 867} {"train_loss": -21.141395568847656, "global_step": 72025, "epoch": 867} {"train_loss": -20.897382736206055, "global_step": 72026, "epoch": 867} {"train_loss": -20.8143367767334, "global_step": 72027, "epoch": 867} {"train_loss": -20.96308708190918, "global_step": 72028, "epoch": 867} {"train_loss": -20.131826400756836, "global_step": 72029, "epoch": 867} {"train_loss": -20.978778839111328, "global_step": 72030, "epoch": 867} {"train_loss": -20.963029861450195, "global_step": 72031, "epoch": 867} {"train_loss": -20.87363624572754, "global_step": 72032, "epoch": 867} {"train_loss": -21.267484664916992, "global_step": 72033, "epoch": 867} {"train_loss": -21.052474975585938, "global_step": 72034, "epoch": 867} {"train_loss": -20.69914436340332, "global_step": 72035, "epoch": 867} {"train_loss": -21.045072555541992, "global_step": 72036, "epoch": 867} {"train_loss": -20.622602462768555, "global_step": 72037, "epoch": 867} {"train_loss": -20.446319580078125, "global_step": 72038, "epoch": 867} {"train_loss": -20.88254737854004, "global_step": 72039, "epoch": 867} {"train_loss": -21.051921844482422, "global_step": 72040, "epoch": 867} {"train_loss": -20.812623977661133, "global_step": 72041, "epoch": 867} {"train_loss": -21.06099510192871, "global_step": 72042, "epoch": 867} {"train_loss": -20.852385601365423, "global_step": 72043, "epoch": 867, "val_loss": 6174714.5} {"train_loss": -20.56167984008789, "global_step": 72044, "epoch": 868} {"train_loss": -20.95256996154785, "global_step": 72045, "epoch": 868} {"train_loss": -20.26896858215332, "global_step": 72046, "epoch": 868} {"train_loss": -20.24648666381836, "global_step": 72047, "epoch": 868} {"train_loss": -20.867460250854492, "global_step": 72048, "epoch": 868} {"train_loss": -20.812801361083984, "global_step": 72049, "epoch": 868} {"train_loss": -20.627382278442383, "global_step": 72050, "epoch": 868} {"train_loss": -21.029499053955078, "global_step": 72051, "epoch": 868} {"train_loss": -20.913171768188477, "global_step": 72052, "epoch": 868} {"train_loss": -20.83627700805664, "global_step": 72053, "epoch": 868} {"train_loss": -20.768264770507812, "global_step": 72054, "epoch": 868} {"train_loss": -20.992055892944336, "global_step": 72055, "epoch": 868} {"train_loss": -20.95221519470215, "global_step": 72056, "epoch": 868} {"train_loss": -20.714872360229492, "global_step": 72057, "epoch": 868} {"train_loss": -20.885665893554688, "global_step": 72058, "epoch": 868} {"train_loss": -20.934078216552734, "global_step": 72059, "epoch": 868} {"train_loss": -20.99289321899414, "global_step": 72060, "epoch": 868} {"train_loss": -20.886388778686523, "global_step": 72061, "epoch": 868} {"train_loss": -20.634565353393555, "global_step": 72062, "epoch": 868} {"train_loss": -21.020870208740234, "global_step": 72063, "epoch": 868} {"train_loss": -20.89644432067871, "global_step": 72064, "epoch": 868} {"train_loss": -21.102975845336914, "global_step": 72065, "epoch": 868} {"train_loss": -20.828475952148438, "global_step": 72066, "epoch": 868} {"train_loss": -20.703771591186523, "global_step": 72067, "epoch": 868} {"train_loss": -20.902084350585938, "global_step": 72068, "epoch": 868} {"train_loss": -21.22635269165039, "global_step": 72069, "epoch": 868} {"train_loss": -20.785001754760742, "global_step": 72070, "epoch": 868} {"train_loss": -20.723203659057617, "global_step": 72071, "epoch": 868} {"train_loss": -20.91758918762207, "global_step": 72072, "epoch": 868} {"train_loss": -20.774478912353516, "global_step": 72073, "epoch": 868} {"train_loss": -20.746137619018555, "global_step": 72074, "epoch": 868} {"train_loss": -21.178762435913086, "global_step": 72075, "epoch": 868} {"train_loss": -20.974872589111328, "global_step": 72076, "epoch": 868} {"train_loss": -21.052749633789062, "global_step": 72077, "epoch": 868} {"train_loss": -20.85700035095215, "global_step": 72078, "epoch": 868} {"train_loss": -20.537275314331055, "global_step": 72079, "epoch": 868} {"train_loss": -20.660018920898438, "global_step": 72080, "epoch": 868} {"train_loss": -20.49825096130371, "global_step": 72081, "epoch": 868} {"train_loss": -20.636661529541016, "global_step": 72082, "epoch": 868} {"train_loss": -21.2091064453125, "global_step": 72083, "epoch": 868} {"train_loss": -21.01712417602539, "global_step": 72084, "epoch": 868} {"train_loss": -20.875368118286133, "global_step": 72085, "epoch": 868} {"train_loss": -21.15524673461914, "global_step": 72086, "epoch": 868} {"train_loss": -20.82400894165039, "global_step": 72087, "epoch": 868} {"train_loss": -21.112598419189453, "global_step": 72088, "epoch": 868} {"train_loss": -20.46463394165039, "global_step": 72089, "epoch": 868} {"train_loss": -20.612964630126953, "global_step": 72090, "epoch": 868} {"train_loss": -20.561359405517578, "global_step": 72091, "epoch": 868} {"train_loss": -20.970111846923828, "global_step": 72092, "epoch": 868} {"train_loss": -20.841943740844727, "global_step": 72093, "epoch": 868} {"train_loss": -20.80218505859375, "global_step": 72094, "epoch": 868} {"train_loss": -21.20135498046875, "global_step": 72095, "epoch": 868} {"train_loss": -20.990039825439453, "global_step": 72096, "epoch": 868} {"train_loss": -21.00593376159668, "global_step": 72097, "epoch": 868} {"train_loss": -20.911758422851562, "global_step": 72098, "epoch": 868} {"train_loss": -21.47468376159668, "global_step": 72099, "epoch": 868} {"train_loss": -20.658308029174805, "global_step": 72100, "epoch": 868} {"train_loss": -21.060361862182617, "global_step": 72101, "epoch": 868} {"train_loss": -21.037677764892578, "global_step": 72102, "epoch": 868} {"train_loss": -21.139585494995117, "global_step": 72103, "epoch": 868} {"train_loss": -20.978891372680664, "global_step": 72104, "epoch": 868} {"train_loss": -20.680456161499023, "global_step": 72105, "epoch": 868} {"train_loss": -20.812429428100586, "global_step": 72106, "epoch": 868} {"train_loss": -20.649988174438477, "global_step": 72107, "epoch": 868} {"train_loss": -20.892765045166016, "global_step": 72108, "epoch": 868} {"train_loss": -21.058502197265625, "global_step": 72109, "epoch": 868} {"train_loss": -20.871063232421875, "global_step": 72110, "epoch": 868} {"train_loss": -21.15718650817871, "global_step": 72111, "epoch": 868} {"train_loss": -20.972936630249023, "global_step": 72112, "epoch": 868} {"train_loss": -20.64345932006836, "global_step": 72113, "epoch": 868} {"train_loss": -21.03597068786621, "global_step": 72114, "epoch": 868} {"train_loss": -21.168746948242188, "global_step": 72115, "epoch": 868} {"train_loss": -21.110889434814453, "global_step": 72116, "epoch": 868} {"train_loss": -20.886333465576172, "global_step": 72117, "epoch": 868} {"train_loss": -20.9171085357666, "global_step": 72118, "epoch": 868} {"train_loss": -21.41742515563965, "global_step": 72119, "epoch": 868} {"train_loss": -21.111862182617188, "global_step": 72120, "epoch": 868} {"train_loss": -20.610074996948242, "global_step": 72121, "epoch": 868} {"train_loss": -20.726200103759766, "global_step": 72122, "epoch": 868} {"train_loss": -21.034711837768555, "global_step": 72123, "epoch": 868} {"train_loss": -20.81867218017578, "global_step": 72124, "epoch": 868} {"train_loss": -21.24494171142578, "global_step": 72125, "epoch": 868} {"train_loss": -20.88592333965991, "global_step": 72126, "epoch": 868, "val_loss": 5957050.5} {"train_loss": -20.90814971923828, "global_step": 72127, "epoch": 869} {"train_loss": -20.792465209960938, "global_step": 72128, "epoch": 869} {"train_loss": -20.511316299438477, "global_step": 72129, "epoch": 869} {"train_loss": -20.456790924072266, "global_step": 72130, "epoch": 869} {"train_loss": -21.039798736572266, "global_step": 72131, "epoch": 869} {"train_loss": -20.513479232788086, "global_step": 72132, "epoch": 869} {"train_loss": -21.035633087158203, "global_step": 72133, "epoch": 869} {"train_loss": -20.820466995239258, "global_step": 72134, "epoch": 869} {"train_loss": -20.526172637939453, "global_step": 72135, "epoch": 869} {"train_loss": -20.945697784423828, "global_step": 72136, "epoch": 869} {"train_loss": -21.07289695739746, "global_step": 72137, "epoch": 869} {"train_loss": -20.821338653564453, "global_step": 72138, "epoch": 869} {"train_loss": -21.011550903320312, "global_step": 72139, "epoch": 869} {"train_loss": -20.569616317749023, "global_step": 72140, "epoch": 869} {"train_loss": -20.8183536529541, "global_step": 72141, "epoch": 869} {"train_loss": -20.54897117614746, "global_step": 72142, "epoch": 869} {"train_loss": -20.673664093017578, "global_step": 72143, "epoch": 869} {"train_loss": -21.05190086364746, "global_step": 72144, "epoch": 869} {"train_loss": -20.701053619384766, "global_step": 72145, "epoch": 869} {"train_loss": -20.743070602416992, "global_step": 72146, "epoch": 869} {"train_loss": -20.691442489624023, "global_step": 72147, "epoch": 869} {"train_loss": -20.97734832763672, "global_step": 72148, "epoch": 869} {"train_loss": -20.714309692382812, "global_step": 72149, "epoch": 869} {"train_loss": -21.148862838745117, "global_step": 72150, "epoch": 869} {"train_loss": -21.147489547729492, "global_step": 72151, "epoch": 869} {"train_loss": -20.77681541442871, "global_step": 72152, "epoch": 869} {"train_loss": -20.824832916259766, "global_step": 72153, "epoch": 869} {"train_loss": -20.7589054107666, "global_step": 72154, "epoch": 869} {"train_loss": -20.717926025390625, "global_step": 72155, "epoch": 869} {"train_loss": -20.91077995300293, "global_step": 72156, "epoch": 869} {"train_loss": -20.993825912475586, "global_step": 72157, "epoch": 869} {"train_loss": -20.68781852722168, "global_step": 72158, "epoch": 869} {"train_loss": -20.622812271118164, "global_step": 72159, "epoch": 869} {"train_loss": -20.9442081451416, "global_step": 72160, "epoch": 869} {"train_loss": -20.998579025268555, "global_step": 72161, "epoch": 869} {"train_loss": -21.088245391845703, "global_step": 72162, "epoch": 869} {"train_loss": -20.608783721923828, "global_step": 72163, "epoch": 869} {"train_loss": -21.069570541381836, "global_step": 72164, "epoch": 869} {"train_loss": -20.90077018737793, "global_step": 72165, "epoch": 869} {"train_loss": -20.89328384399414, "global_step": 72166, "epoch": 869} {"train_loss": -20.577829360961914, "global_step": 72167, "epoch": 869} {"train_loss": -21.24732780456543, "global_step": 72168, "epoch": 869} {"train_loss": -20.830537796020508, "global_step": 72169, "epoch": 869} {"train_loss": -20.978300094604492, "global_step": 72170, "epoch": 869} {"train_loss": -21.00298500061035, "global_step": 72171, "epoch": 869} {"train_loss": -20.80649185180664, "global_step": 72172, "epoch": 869} {"train_loss": -20.948644638061523, "global_step": 72173, "epoch": 869} {"train_loss": -21.196107864379883, "global_step": 72174, "epoch": 869} {"train_loss": -21.336572647094727, "global_step": 72175, "epoch": 869} {"train_loss": -20.559783935546875, "global_step": 72176, "epoch": 869} {"train_loss": -20.485065460205078, "global_step": 72177, "epoch": 869} {"train_loss": -20.87136459350586, "global_step": 72178, "epoch": 869} {"train_loss": -20.861103057861328, "global_step": 72179, "epoch": 869} {"train_loss": -21.066009521484375, "global_step": 72180, "epoch": 869} {"train_loss": -20.9213809967041, "global_step": 72181, "epoch": 869} {"train_loss": -21.335973739624023, "global_step": 72182, "epoch": 869} {"train_loss": -21.107074737548828, "global_step": 72183, "epoch": 869} {"train_loss": -21.100589752197266, "global_step": 72184, "epoch": 869} {"train_loss": -21.20596694946289, "global_step": 72185, "epoch": 869} {"train_loss": -20.99531364440918, "global_step": 72186, "epoch": 869} {"train_loss": -21.310068130493164, "global_step": 72187, "epoch": 869} {"train_loss": -20.817665100097656, "global_step": 72188, "epoch": 869} {"train_loss": -20.601049423217773, "global_step": 72189, "epoch": 869} {"train_loss": -21.104543685913086, "global_step": 72190, "epoch": 869} {"train_loss": -20.875701904296875, "global_step": 72191, "epoch": 869} {"train_loss": -20.371505737304688, "global_step": 72192, "epoch": 869} {"train_loss": -21.09734535217285, "global_step": 72193, "epoch": 869} {"train_loss": -20.862462997436523, "global_step": 72194, "epoch": 869} {"train_loss": -20.870595932006836, "global_step": 72195, "epoch": 869} {"train_loss": -21.050561904907227, "global_step": 72196, "epoch": 869} {"train_loss": -21.11610984802246, "global_step": 72197, "epoch": 869} {"train_loss": -20.74851417541504, "global_step": 72198, "epoch": 869} {"train_loss": -21.07935333251953, "global_step": 72199, "epoch": 869} {"train_loss": -20.877201080322266, "global_step": 72200, "epoch": 869} {"train_loss": -20.96568489074707, "global_step": 72201, "epoch": 869} {"train_loss": -20.905841827392578, "global_step": 72202, "epoch": 869} {"train_loss": -20.931209564208984, "global_step": 72203, "epoch": 869} {"train_loss": -20.90876579284668, "global_step": 72204, "epoch": 869} {"train_loss": -21.057584762573242, "global_step": 72205, "epoch": 869} {"train_loss": -21.096973419189453, "global_step": 72206, "epoch": 869} {"train_loss": -21.15120506286621, "global_step": 72207, "epoch": 869} {"train_loss": -21.133275985717773, "global_step": 72208, "epoch": 869} {"train_loss": -20.878248927104902, "global_step": 72209, "epoch": 869, "val_loss": 6011386.0} {"train_loss": -20.608205795288086, "global_step": 72210, "epoch": 870} {"train_loss": -21.145212173461914, "global_step": 72211, "epoch": 870} {"train_loss": -20.958820343017578, "global_step": 72212, "epoch": 870} {"train_loss": -21.039749145507812, "global_step": 72213, "epoch": 870} {"train_loss": -20.108707427978516, "global_step": 72214, "epoch": 870} {"train_loss": -20.877782821655273, "global_step": 72215, "epoch": 870} {"train_loss": -20.087839126586914, "global_step": 72216, "epoch": 870} {"train_loss": -20.653352737426758, "global_step": 72217, "epoch": 870} {"train_loss": -21.057119369506836, "global_step": 72218, "epoch": 870} {"train_loss": -21.01949691772461, "global_step": 72219, "epoch": 870} {"train_loss": -20.75873565673828, "global_step": 72220, "epoch": 870} {"train_loss": -20.82550048828125, "global_step": 72221, "epoch": 870} {"train_loss": -20.43619155883789, "global_step": 72222, "epoch": 870} {"train_loss": -20.706527709960938, "global_step": 72223, "epoch": 870} {"train_loss": -20.589229583740234, "global_step": 72224, "epoch": 870} {"train_loss": -20.839767456054688, "global_step": 72225, "epoch": 870} {"train_loss": -21.108802795410156, "global_step": 72226, "epoch": 870} {"train_loss": -20.52324867248535, "global_step": 72227, "epoch": 870} {"train_loss": -21.092605590820312, "global_step": 72228, "epoch": 870} {"train_loss": -21.00091552734375, "global_step": 72229, "epoch": 870} {"train_loss": -21.143451690673828, "global_step": 72230, "epoch": 870} {"train_loss": -20.87763023376465, "global_step": 72231, "epoch": 870} {"train_loss": -20.834617614746094, "global_step": 72232, "epoch": 870} {"train_loss": -20.52859115600586, "global_step": 72233, "epoch": 870} {"train_loss": -20.996688842773438, "global_step": 72234, "epoch": 870} {"train_loss": -20.9998836517334, "global_step": 72235, "epoch": 870} {"train_loss": -20.60814094543457, "global_step": 72236, "epoch": 870} {"train_loss": -21.012128829956055, "global_step": 72237, "epoch": 870} {"train_loss": -21.245027542114258, "global_step": 72238, "epoch": 870} {"train_loss": -21.41166877746582, "global_step": 72239, "epoch": 870} {"train_loss": -20.82899284362793, "global_step": 72240, "epoch": 870} {"train_loss": -20.704954147338867, "global_step": 72241, "epoch": 870} {"train_loss": -20.43552017211914, "global_step": 72242, "epoch": 870} {"train_loss": -20.898252487182617, "global_step": 72243, "epoch": 870} {"train_loss": -20.78818130493164, "global_step": 72244, "epoch": 870} {"train_loss": -20.930622100830078, "global_step": 72245, "epoch": 870} {"train_loss": -21.104665756225586, "global_step": 72246, "epoch": 870} {"train_loss": -21.05012321472168, "global_step": 72247, "epoch": 870} {"train_loss": -20.664880752563477, "global_step": 72248, "epoch": 870} {"train_loss": -20.78018569946289, "global_step": 72249, "epoch": 870} {"train_loss": -21.17051124572754, "global_step": 72250, "epoch": 870} {"train_loss": -20.740793228149414, "global_step": 72251, "epoch": 870} {"train_loss": -20.995126724243164, "global_step": 72252, "epoch": 870} {"train_loss": -21.076406478881836, "global_step": 72253, "epoch": 870} {"train_loss": -21.111948013305664, "global_step": 72254, "epoch": 870} {"train_loss": -20.568225860595703, "global_step": 72255, "epoch": 870} {"train_loss": -20.56228256225586, "global_step": 72256, "epoch": 870} {"train_loss": -21.234804153442383, "global_step": 72257, "epoch": 870} {"train_loss": -20.86774253845215, "global_step": 72258, "epoch": 870} {"train_loss": -21.046239852905273, "global_step": 72259, "epoch": 870} {"train_loss": -21.04939842224121, "global_step": 72260, "epoch": 870} {"train_loss": -20.757537841796875, "global_step": 72261, "epoch": 870} {"train_loss": -21.251075744628906, "global_step": 72262, "epoch": 870} {"train_loss": -20.962661743164062, "global_step": 72263, "epoch": 870} {"train_loss": -21.060258865356445, "global_step": 72264, "epoch": 870} {"train_loss": -20.94373893737793, "global_step": 72265, "epoch": 870} {"train_loss": -21.11771583557129, "global_step": 72266, "epoch": 870} {"train_loss": -20.750452041625977, "global_step": 72267, "epoch": 870} {"train_loss": -21.5523738861084, "global_step": 72268, "epoch": 870} {"train_loss": -21.191974639892578, "global_step": 72269, "epoch": 870} {"train_loss": -21.244922637939453, "global_step": 72270, "epoch": 870} {"train_loss": -20.97989845275879, "global_step": 72271, "epoch": 870} {"train_loss": -20.79373550415039, "global_step": 72272, "epoch": 870} {"train_loss": -20.809860229492188, "global_step": 72273, "epoch": 870} {"train_loss": -20.867490768432617, "global_step": 72274, "epoch": 870} {"train_loss": -21.014022827148438, "global_step": 72275, "epoch": 870} {"train_loss": -20.633081436157227, "global_step": 72276, "epoch": 870} {"train_loss": -20.970014572143555, "global_step": 72277, "epoch": 870} {"train_loss": -21.039461135864258, "global_step": 72278, "epoch": 870} {"train_loss": -21.037328720092773, "global_step": 72279, "epoch": 870} {"train_loss": -21.220487594604492, "global_step": 72280, "epoch": 870} {"train_loss": -20.964197158813477, "global_step": 72281, "epoch": 870} {"train_loss": -20.81772232055664, "global_step": 72282, "epoch": 870} {"train_loss": -20.848573684692383, "global_step": 72283, "epoch": 870} {"train_loss": -20.249155044555664, "global_step": 72284, "epoch": 870} {"train_loss": -21.004056930541992, "global_step": 72285, "epoch": 870} {"train_loss": -20.852752685546875, "global_step": 72286, "epoch": 870} {"train_loss": -20.953889846801758, "global_step": 72287, "epoch": 870} {"train_loss": -20.572601318359375, "global_step": 72288, "epoch": 870} {"train_loss": -20.963960647583008, "global_step": 72289, "epoch": 870} {"train_loss": -21.103330612182617, "global_step": 72290, "epoch": 870} {"train_loss": -21.06830406188965, "global_step": 72291, "epoch": 870} {"train_loss": -20.889151171029333, "global_step": 72292, "epoch": 870, "val_loss": 5906174.5} {"train_loss": -21.18564224243164, "global_step": 72293, "epoch": 871} {"train_loss": -20.855379104614258, "global_step": 72294, "epoch": 871} {"train_loss": -20.768335342407227, "global_step": 72295, "epoch": 871} {"train_loss": -20.904016494750977, "global_step": 72296, "epoch": 871} {"train_loss": -20.639211654663086, "global_step": 72297, "epoch": 871} {"train_loss": -20.80292320251465, "global_step": 72298, "epoch": 871} {"train_loss": -20.90971565246582, "global_step": 72299, "epoch": 871} {"train_loss": -21.21393394470215, "global_step": 72300, "epoch": 871} {"train_loss": -21.14618492126465, "global_step": 72301, "epoch": 871} {"train_loss": -20.697629928588867, "global_step": 72302, "epoch": 871} {"train_loss": -20.804885864257812, "global_step": 72303, "epoch": 871} {"train_loss": -20.822874069213867, "global_step": 72304, "epoch": 871} {"train_loss": -20.670604705810547, "global_step": 72305, "epoch": 871} {"train_loss": -20.782577514648438, "global_step": 72306, "epoch": 871} {"train_loss": -20.95020866394043, "global_step": 72307, "epoch": 871} {"train_loss": -20.95931053161621, "global_step": 72308, "epoch": 871} {"train_loss": -20.9338436126709, "global_step": 72309, "epoch": 871} {"train_loss": -20.77022361755371, "global_step": 72310, "epoch": 871} {"train_loss": -20.990530014038086, "global_step": 72311, "epoch": 871} {"train_loss": -20.82844352722168, "global_step": 72312, "epoch": 871} {"train_loss": -21.18800926208496, "global_step": 72313, "epoch": 871} {"train_loss": -21.222562789916992, "global_step": 72314, "epoch": 871} {"train_loss": -21.08462905883789, "global_step": 72315, "epoch": 871} {"train_loss": -21.196496963500977, "global_step": 72316, "epoch": 871} {"train_loss": -21.131465911865234, "global_step": 72317, "epoch": 871} {"train_loss": -21.232057571411133, "global_step": 72318, "epoch": 871} {"train_loss": -20.982927322387695, "global_step": 72319, "epoch": 871} {"train_loss": -20.9505558013916, "global_step": 72320, "epoch": 871} {"train_loss": -20.944059371948242, "global_step": 72321, "epoch": 871} {"train_loss": -21.121936798095703, "global_step": 72322, "epoch": 871} {"train_loss": -21.16486930847168, "global_step": 72323, "epoch": 871} {"train_loss": -20.641374588012695, "global_step": 72324, "epoch": 871} {"train_loss": -21.29485511779785, "global_step": 72325, "epoch": 871} {"train_loss": -21.01118278503418, "global_step": 72326, "epoch": 871} {"train_loss": -20.790563583374023, "global_step": 72327, "epoch": 871} {"train_loss": -21.17213249206543, "global_step": 72328, "epoch": 871} {"train_loss": -21.1641902923584, "global_step": 72329, "epoch": 871} {"train_loss": -21.071542739868164, "global_step": 72330, "epoch": 871} {"train_loss": -20.96394157409668, "global_step": 72331, "epoch": 871} {"train_loss": -20.85677719116211, "global_step": 72332, "epoch": 871} {"train_loss": -20.86248779296875, "global_step": 72333, "epoch": 871} {"train_loss": -21.253372192382812, "global_step": 72334, "epoch": 871} {"train_loss": -20.861703872680664, "global_step": 72335, "epoch": 871} {"train_loss": -21.276399612426758, "global_step": 72336, "epoch": 871} {"train_loss": -20.768924713134766, "global_step": 72337, "epoch": 871} {"train_loss": -20.739627838134766, "global_step": 72338, "epoch": 871} {"train_loss": -21.01389503479004, "global_step": 72339, "epoch": 871} {"train_loss": -21.059354782104492, "global_step": 72340, "epoch": 871} {"train_loss": -20.810901641845703, "global_step": 72341, "epoch": 871} {"train_loss": -20.968128204345703, "global_step": 72342, "epoch": 871} {"train_loss": -20.844650268554688, "global_step": 72343, "epoch": 871} {"train_loss": -20.843618392944336, "global_step": 72344, "epoch": 871} {"train_loss": -21.024927139282227, "global_step": 72345, "epoch": 871} {"train_loss": -20.945537567138672, "global_step": 72346, "epoch": 871} {"train_loss": -21.148218154907227, "global_step": 72347, "epoch": 871} {"train_loss": -20.84364891052246, "global_step": 72348, "epoch": 871} {"train_loss": -20.991064071655273, "global_step": 72349, "epoch": 871} {"train_loss": -20.930437088012695, "global_step": 72350, "epoch": 871} {"train_loss": -21.042295455932617, "global_step": 72351, "epoch": 871} {"train_loss": -21.099929809570312, "global_step": 72352, "epoch": 871} {"train_loss": -20.97525405883789, "global_step": 72353, "epoch": 871} {"train_loss": -20.921106338500977, "global_step": 72354, "epoch": 871} {"train_loss": -20.940275192260742, "global_step": 72355, "epoch": 871} {"train_loss": -20.927087783813477, "global_step": 72356, "epoch": 871} {"train_loss": -20.971818923950195, "global_step": 72357, "epoch": 871} {"train_loss": -20.926877975463867, "global_step": 72358, "epoch": 871} {"train_loss": -20.62088394165039, "global_step": 72359, "epoch": 871} {"train_loss": -20.89011001586914, "global_step": 72360, "epoch": 871} {"train_loss": -20.749086380004883, "global_step": 72361, "epoch": 871} {"train_loss": -21.101438522338867, "global_step": 72362, "epoch": 871} {"train_loss": -21.13240623474121, "global_step": 72363, "epoch": 871} {"train_loss": -21.281660079956055, "global_step": 72364, "epoch": 871} {"train_loss": -20.764631271362305, "global_step": 72365, "epoch": 871} {"train_loss": -20.951032638549805, "global_step": 72366, "epoch": 871} {"train_loss": -20.40130615234375, "global_step": 72367, "epoch": 871} {"train_loss": -20.695926666259766, "global_step": 72368, "epoch": 871} {"train_loss": -20.61003875732422, "global_step": 72369, "epoch": 871} {"train_loss": -20.992597579956055, "global_step": 72370, "epoch": 871} {"train_loss": -20.849496841430664, "global_step": 72371, "epoch": 871} {"train_loss": -20.8310604095459, "global_step": 72372, "epoch": 871} {"train_loss": -20.814680099487305, "global_step": 72373, "epoch": 871} {"train_loss": -21.08683204650879, "global_step": 72374, "epoch": 871} {"train_loss": -20.9442173142031, "global_step": 72375, "epoch": 871, "val_loss": 5919615.5} {"train_loss": -20.150375366210938, "global_step": 72376, "epoch": 872} {"train_loss": -20.739355087280273, "global_step": 72377, "epoch": 872} {"train_loss": -20.772733688354492, "global_step": 72378, "epoch": 872} {"train_loss": -20.589263916015625, "global_step": 72379, "epoch": 872} {"train_loss": -21.272388458251953, "global_step": 72380, "epoch": 872} {"train_loss": -20.850173950195312, "global_step": 72381, "epoch": 872} {"train_loss": -20.473234176635742, "global_step": 72382, "epoch": 872} {"train_loss": -20.461910247802734, "global_step": 72383, "epoch": 872} {"train_loss": -20.573936462402344, "global_step": 72384, "epoch": 872} {"train_loss": -20.902578353881836, "global_step": 72385, "epoch": 872} {"train_loss": -20.845108032226562, "global_step": 72386, "epoch": 872} {"train_loss": -21.07503318786621, "global_step": 72387, "epoch": 872} {"train_loss": -20.684680938720703, "global_step": 72388, "epoch": 872} {"train_loss": -20.75519561767578, "global_step": 72389, "epoch": 872} {"train_loss": -20.393362045288086, "global_step": 72390, "epoch": 872} {"train_loss": -20.9161319732666, "global_step": 72391, "epoch": 872} {"train_loss": -20.59685516357422, "global_step": 72392, "epoch": 872} {"train_loss": -20.994016647338867, "global_step": 72393, "epoch": 872} {"train_loss": -20.926471710205078, "global_step": 72394, "epoch": 872} {"train_loss": -21.17575454711914, "global_step": 72395, "epoch": 872} {"train_loss": -21.076772689819336, "global_step": 72396, "epoch": 872} {"train_loss": -20.39204978942871, "global_step": 72397, "epoch": 872} {"train_loss": -20.640695571899414, "global_step": 72398, "epoch": 872} {"train_loss": -21.349985122680664, "global_step": 72399, "epoch": 872} {"train_loss": -21.149295806884766, "global_step": 72400, "epoch": 872} {"train_loss": -21.155033111572266, "global_step": 72401, "epoch": 872} {"train_loss": -21.282386779785156, "global_step": 72402, "epoch": 872} {"train_loss": -20.849349975585938, "global_step": 72403, "epoch": 872} {"train_loss": -21.080785751342773, "global_step": 72404, "epoch": 872} {"train_loss": -20.831857681274414, "global_step": 72405, "epoch": 872} {"train_loss": -21.082860946655273, "global_step": 72406, "epoch": 872} {"train_loss": -20.77610206604004, "global_step": 72407, "epoch": 872} {"train_loss": -21.30342674255371, "global_step": 72408, "epoch": 872} {"train_loss": -20.980514526367188, "global_step": 72409, "epoch": 872} {"train_loss": -20.546051025390625, "global_step": 72410, "epoch": 872} {"train_loss": -21.178098678588867, "global_step": 72411, "epoch": 872} {"train_loss": -20.852018356323242, "global_step": 72412, "epoch": 872} {"train_loss": -20.368942260742188, "global_step": 72413, "epoch": 872} {"train_loss": -20.845073699951172, "global_step": 72414, "epoch": 872} {"train_loss": -21.349445343017578, "global_step": 72415, "epoch": 872} {"train_loss": -20.720212936401367, "global_step": 72416, "epoch": 872} {"train_loss": -20.63813018798828, "global_step": 72417, "epoch": 872} {"train_loss": -20.853654861450195, "global_step": 72418, "epoch": 872} {"train_loss": -20.82069969177246, "global_step": 72419, "epoch": 872} {"train_loss": -20.75339126586914, "global_step": 72420, "epoch": 872} {"train_loss": -20.907865524291992, "global_step": 72421, "epoch": 872} {"train_loss": -20.952049255371094, "global_step": 72422, "epoch": 872} {"train_loss": -21.411008834838867, "global_step": 72423, "epoch": 872} {"train_loss": -20.891084671020508, "global_step": 72424, "epoch": 872} {"train_loss": -21.4833927154541, "global_step": 72425, "epoch": 872} {"train_loss": -20.871164321899414, "global_step": 72426, "epoch": 872} {"train_loss": -20.92449188232422, "global_step": 72427, "epoch": 872} {"train_loss": -20.850421905517578, "global_step": 72428, "epoch": 872} {"train_loss": -21.209522247314453, "global_step": 72429, "epoch": 872} {"train_loss": -21.140186309814453, "global_step": 72430, "epoch": 872} {"train_loss": -21.069204330444336, "global_step": 72431, "epoch": 872} {"train_loss": -20.559789657592773, "global_step": 72432, "epoch": 872} {"train_loss": -21.07341766357422, "global_step": 72433, "epoch": 872} {"train_loss": -21.051868438720703, "global_step": 72434, "epoch": 872} {"train_loss": -20.743209838867188, "global_step": 72435, "epoch": 872} {"train_loss": -21.07457733154297, "global_step": 72436, "epoch": 872} {"train_loss": -20.508146286010742, "global_step": 72437, "epoch": 872} {"train_loss": -21.158193588256836, "global_step": 72438, "epoch": 872} {"train_loss": -21.021451950073242, "global_step": 72439, "epoch": 872} {"train_loss": -20.984027862548828, "global_step": 72440, "epoch": 872} {"train_loss": -21.011625289916992, "global_step": 72441, "epoch": 872} {"train_loss": -20.913009643554688, "global_step": 72442, "epoch": 872} {"train_loss": -20.994115829467773, "global_step": 72443, "epoch": 872} {"train_loss": -20.531444549560547, "global_step": 72444, "epoch": 872} {"train_loss": -21.034555435180664, "global_step": 72445, "epoch": 872} {"train_loss": -20.386367797851562, "global_step": 72446, "epoch": 872} {"train_loss": -20.874107360839844, "global_step": 72447, "epoch": 872} {"train_loss": -21.040451049804688, "global_step": 72448, "epoch": 872} {"train_loss": -20.692914962768555, "global_step": 72449, "epoch": 872} {"train_loss": -20.94270133972168, "global_step": 72450, "epoch": 872} {"train_loss": -20.880783081054688, "global_step": 72451, "epoch": 872} {"train_loss": -21.345489501953125, "global_step": 72452, "epoch": 872} {"train_loss": -20.878524780273438, "global_step": 72453, "epoch": 872} {"train_loss": -21.17558479309082, "global_step": 72454, "epoch": 872} {"train_loss": -20.818931579589844, "global_step": 72455, "epoch": 872} {"train_loss": -20.88401222229004, "global_step": 72456, "epoch": 872} {"train_loss": -20.659549713134766, "global_step": 72457, "epoch": 872} {"train_loss": -20.887600473610753, "global_step": 72458, "epoch": 872, "val_loss": 6112169.0} {"train_loss": -20.07472038269043, "global_step": 72459, "epoch": 873} {"train_loss": -20.351652145385742, "global_step": 72460, "epoch": 873} {"train_loss": -20.516233444213867, "global_step": 72461, "epoch": 873} {"train_loss": -20.86176109313965, "global_step": 72462, "epoch": 873} {"train_loss": -20.416717529296875, "global_step": 72463, "epoch": 873} {"train_loss": -20.208877563476562, "global_step": 72464, "epoch": 873} {"train_loss": -20.647001266479492, "global_step": 72465, "epoch": 873} {"train_loss": -20.843952178955078, "global_step": 72466, "epoch": 873} {"train_loss": -20.83487319946289, "global_step": 72467, "epoch": 873} {"train_loss": -20.61518669128418, "global_step": 72468, "epoch": 873} {"train_loss": -20.930877685546875, "global_step": 72469, "epoch": 873} {"train_loss": -20.997238159179688, "global_step": 72470, "epoch": 873} {"train_loss": -20.448144912719727, "global_step": 72471, "epoch": 873} {"train_loss": -21.021944046020508, "global_step": 72472, "epoch": 873} {"train_loss": -21.040863037109375, "global_step": 72473, "epoch": 873} {"train_loss": -20.5666561126709, "global_step": 72474, "epoch": 873} {"train_loss": -20.648975372314453, "global_step": 72475, "epoch": 873} {"train_loss": -20.80867576599121, "global_step": 72476, "epoch": 873} {"train_loss": -20.584623336791992, "global_step": 72477, "epoch": 873} {"train_loss": -20.722623825073242, "global_step": 72478, "epoch": 873} {"train_loss": -20.613191604614258, "global_step": 72479, "epoch": 873} {"train_loss": -20.8546199798584, "global_step": 72480, "epoch": 873} {"train_loss": -21.03529930114746, "global_step": 72481, "epoch": 873} {"train_loss": -20.885244369506836, "global_step": 72482, "epoch": 873} {"train_loss": -20.966053009033203, "global_step": 72483, "epoch": 873} {"train_loss": -20.753713607788086, "global_step": 72484, "epoch": 873} {"train_loss": -21.045255661010742, "global_step": 72485, "epoch": 873} {"train_loss": -20.84766960144043, "global_step": 72486, "epoch": 873} {"train_loss": -20.85205841064453, "global_step": 72487, "epoch": 873} {"train_loss": -20.621252059936523, "global_step": 72488, "epoch": 873} {"train_loss": -20.90744400024414, "global_step": 72489, "epoch": 873} {"train_loss": -20.834447860717773, "global_step": 72490, "epoch": 873} {"train_loss": -21.046119689941406, "global_step": 72491, "epoch": 873} {"train_loss": -20.68477439880371, "global_step": 72492, "epoch": 873} {"train_loss": -20.92825698852539, "global_step": 72493, "epoch": 873} {"train_loss": -20.90630340576172, "global_step": 72494, "epoch": 873} {"train_loss": -20.641895294189453, "global_step": 72495, "epoch": 873} {"train_loss": -21.02313804626465, "global_step": 72496, "epoch": 873} {"train_loss": -21.444046020507812, "global_step": 72497, "epoch": 873} {"train_loss": -21.07942771911621, "global_step": 72498, "epoch": 873} {"train_loss": -20.78371238708496, "global_step": 72499, "epoch": 873} {"train_loss": -21.035425186157227, "global_step": 72500, "epoch": 873} {"train_loss": -20.60161590576172, "global_step": 72501, "epoch": 873} {"train_loss": -21.08987808227539, "global_step": 72502, "epoch": 873} {"train_loss": -21.217517852783203, "global_step": 72503, "epoch": 873} {"train_loss": -21.25771713256836, "global_step": 72504, "epoch": 873} {"train_loss": -20.961515426635742, "global_step": 72505, "epoch": 873} {"train_loss": -20.90293312072754, "global_step": 72506, "epoch": 873} {"train_loss": -20.61121940612793, "global_step": 72507, "epoch": 873} {"train_loss": -21.16848373413086, "global_step": 72508, "epoch": 873} {"train_loss": -20.932435989379883, "global_step": 72509, "epoch": 873} {"train_loss": -20.851808547973633, "global_step": 72510, "epoch": 873} {"train_loss": -20.779552459716797, "global_step": 72511, "epoch": 873} {"train_loss": -20.657827377319336, "global_step": 72512, "epoch": 873} {"train_loss": -20.843671798706055, "global_step": 72513, "epoch": 873} {"train_loss": -20.649301528930664, "global_step": 72514, "epoch": 873} {"train_loss": -20.91773796081543, "global_step": 72515, "epoch": 873} {"train_loss": -20.949399948120117, "global_step": 72516, "epoch": 873} {"train_loss": -21.130483627319336, "global_step": 72517, "epoch": 873} {"train_loss": -20.497312545776367, "global_step": 72518, "epoch": 873} {"train_loss": -20.95021629333496, "global_step": 72519, "epoch": 873} {"train_loss": -20.885360717773438, "global_step": 72520, "epoch": 873} {"train_loss": -20.726390838623047, "global_step": 72521, "epoch": 873} {"train_loss": -20.904129028320312, "global_step": 72522, "epoch": 873} {"train_loss": -21.238155364990234, "global_step": 72523, "epoch": 873} {"train_loss": -20.626623153686523, "global_step": 72524, "epoch": 873} {"train_loss": -20.540494918823242, "global_step": 72525, "epoch": 873} {"train_loss": -21.098251342773438, "global_step": 72526, "epoch": 873} {"train_loss": -20.52286720275879, "global_step": 72527, "epoch": 873} {"train_loss": -20.891555786132812, "global_step": 72528, "epoch": 873} {"train_loss": -20.909879684448242, "global_step": 72529, "epoch": 873} {"train_loss": -21.006511688232422, "global_step": 72530, "epoch": 873} {"train_loss": -20.842679977416992, "global_step": 72531, "epoch": 873} {"train_loss": -20.691862106323242, "global_step": 72532, "epoch": 873} {"train_loss": -20.409284591674805, "global_step": 72533, "epoch": 873} {"train_loss": -21.112884521484375, "global_step": 72534, "epoch": 873} {"train_loss": -20.93710708618164, "global_step": 72535, "epoch": 873} {"train_loss": -20.446500778198242, "global_step": 72536, "epoch": 873} {"train_loss": -20.746612548828125, "global_step": 72537, "epoch": 873} {"train_loss": -20.951465606689453, "global_step": 72538, "epoch": 873} {"train_loss": -20.95655632019043, "global_step": 72539, "epoch": 873} {"train_loss": -20.996423721313477, "global_step": 72540, "epoch": 873} {"train_loss": -20.81728399805276, "global_step": 72541, "epoch": 873, "val_loss": 5899256.0} {"train_loss": -21.004364013671875, "global_step": 72542, "epoch": 874} {"train_loss": -21.065067291259766, "global_step": 72543, "epoch": 874} {"train_loss": -20.635639190673828, "global_step": 72544, "epoch": 874} {"train_loss": -20.680530548095703, "global_step": 72545, "epoch": 874} {"train_loss": -20.865097045898438, "global_step": 72546, "epoch": 874} {"train_loss": -20.783777236938477, "global_step": 72547, "epoch": 874} {"train_loss": -20.8399600982666, "global_step": 72548, "epoch": 874} {"train_loss": -20.81513214111328, "global_step": 72549, "epoch": 874} {"train_loss": -21.072174072265625, "global_step": 72550, "epoch": 874} {"train_loss": -20.955474853515625, "global_step": 72551, "epoch": 874} {"train_loss": -20.455156326293945, "global_step": 72552, "epoch": 874} {"train_loss": -20.806636810302734, "global_step": 72553, "epoch": 874} {"train_loss": -20.845199584960938, "global_step": 72554, "epoch": 874} {"train_loss": -20.743627548217773, "global_step": 72555, "epoch": 874} {"train_loss": -21.08856201171875, "global_step": 72556, "epoch": 874} {"train_loss": -21.066232681274414, "global_step": 72557, "epoch": 874} {"train_loss": -21.279556274414062, "global_step": 72558, "epoch": 874} {"train_loss": -20.93740463256836, "global_step": 72559, "epoch": 874} {"train_loss": -20.960208892822266, "global_step": 72560, "epoch": 874} {"train_loss": -20.836294174194336, "global_step": 72561, "epoch": 874} {"train_loss": -20.707746505737305, "global_step": 72562, "epoch": 874} {"train_loss": -20.348474502563477, "global_step": 72563, "epoch": 874} {"train_loss": -20.77446937561035, "global_step": 72564, "epoch": 874} {"train_loss": -20.74310302734375, "global_step": 72565, "epoch": 874} {"train_loss": -20.552412033081055, "global_step": 72566, "epoch": 874} {"train_loss": -20.94330406188965, "global_step": 72567, "epoch": 874} {"train_loss": -20.834264755249023, "global_step": 72568, "epoch": 874} {"train_loss": -20.668094635009766, "global_step": 72569, "epoch": 874} {"train_loss": -20.8332576751709, "global_step": 72570, "epoch": 874} {"train_loss": -20.816495895385742, "global_step": 72571, "epoch": 874} {"train_loss": -20.86093521118164, "global_step": 72572, "epoch": 874} {"train_loss": -20.95144271850586, "global_step": 72573, "epoch": 874} {"train_loss": -20.78367805480957, "global_step": 72574, "epoch": 874} {"train_loss": -21.03350257873535, "global_step": 72575, "epoch": 874} {"train_loss": -20.655603408813477, "global_step": 72576, "epoch": 874} {"train_loss": -21.010822296142578, "global_step": 72577, "epoch": 874} {"train_loss": -21.225858688354492, "global_step": 72578, "epoch": 874} {"train_loss": -20.7406063079834, "global_step": 72579, "epoch": 874} {"train_loss": -21.08928108215332, "global_step": 72580, "epoch": 874} {"train_loss": -20.922815322875977, "global_step": 72581, "epoch": 874} {"train_loss": -21.09010887145996, "global_step": 72582, "epoch": 874} {"train_loss": -21.233051300048828, "global_step": 72583, "epoch": 874} {"train_loss": -21.04866600036621, "global_step": 72584, "epoch": 874} {"train_loss": -21.16511344909668, "global_step": 72585, "epoch": 874} {"train_loss": -21.132869720458984, "global_step": 72586, "epoch": 874} {"train_loss": -20.754108428955078, "global_step": 72587, "epoch": 874} {"train_loss": -20.95199966430664, "global_step": 72588, "epoch": 874} {"train_loss": -21.051706314086914, "global_step": 72589, "epoch": 874} {"train_loss": -21.1639461517334, "global_step": 72590, "epoch": 874} {"train_loss": -20.979917526245117, "global_step": 72591, "epoch": 874} {"train_loss": -21.262847900390625, "global_step": 72592, "epoch": 874} {"train_loss": -20.85207176208496, "global_step": 72593, "epoch": 874} {"train_loss": -21.016141891479492, "global_step": 72594, "epoch": 874} {"train_loss": -20.893768310546875, "global_step": 72595, "epoch": 874} {"train_loss": -20.87727165222168, "global_step": 72596, "epoch": 874} {"train_loss": -20.888023376464844, "global_step": 72597, "epoch": 874} {"train_loss": -20.95832633972168, "global_step": 72598, "epoch": 874} {"train_loss": -21.106727600097656, "global_step": 72599, "epoch": 874} {"train_loss": -21.27426528930664, "global_step": 72600, "epoch": 874} {"train_loss": -20.952823638916016, "global_step": 72601, "epoch": 874} {"train_loss": -20.79957389831543, "global_step": 72602, "epoch": 874} {"train_loss": -21.145483016967773, "global_step": 72603, "epoch": 874} {"train_loss": -21.035531997680664, "global_step": 72604, "epoch": 874} {"train_loss": -20.930973052978516, "global_step": 72605, "epoch": 874} {"train_loss": -20.679277420043945, "global_step": 72606, "epoch": 874} {"train_loss": -20.446409225463867, "global_step": 72607, "epoch": 874} {"train_loss": -20.885583877563477, "global_step": 72608, "epoch": 874} {"train_loss": -20.95021629333496, "global_step": 72609, "epoch": 874} {"train_loss": -20.94038200378418, "global_step": 72610, "epoch": 874} {"train_loss": -21.020627975463867, "global_step": 72611, "epoch": 874} {"train_loss": -20.68985939025879, "global_step": 72612, "epoch": 874} {"train_loss": -20.863920211791992, "global_step": 72613, "epoch": 874} {"train_loss": -20.75363540649414, "global_step": 72614, "epoch": 874} {"train_loss": -20.769075393676758, "global_step": 72615, "epoch": 874} {"train_loss": -20.816608428955078, "global_step": 72616, "epoch": 874} {"train_loss": -21.301246643066406, "global_step": 72617, "epoch": 874} {"train_loss": -20.81174659729004, "global_step": 72618, "epoch": 874} {"train_loss": -21.15837287902832, "global_step": 72619, "epoch": 874} {"train_loss": -21.55170249938965, "global_step": 72620, "epoch": 874} {"train_loss": -20.682235717773438, "global_step": 72621, "epoch": 874} {"train_loss": -21.099424362182617, "global_step": 72622, "epoch": 874} {"train_loss": -21.249692916870117, "global_step": 72623, "epoch": 874} {"train_loss": -20.918731620512812, "global_step": 72624, "epoch": 874, "val_loss": 5790705.5} {"train_loss": -20.656248092651367, "global_step": 72625, "epoch": 875} {"train_loss": -20.609399795532227, "global_step": 72626, "epoch": 875} {"train_loss": -20.760154724121094, "global_step": 72627, "epoch": 875} {"train_loss": -21.01417350769043, "global_step": 72628, "epoch": 875} {"train_loss": -20.63751983642578, "global_step": 72629, "epoch": 875} {"train_loss": -20.896411895751953, "global_step": 72630, "epoch": 875} {"train_loss": -20.594045639038086, "global_step": 72631, "epoch": 875} {"train_loss": -20.736446380615234, "global_step": 72632, "epoch": 875} {"train_loss": -21.179616928100586, "global_step": 72633, "epoch": 875} {"train_loss": -20.62842559814453, "global_step": 72634, "epoch": 875} {"train_loss": -20.689716339111328, "global_step": 72635, "epoch": 875} {"train_loss": -21.31980323791504, "global_step": 72636, "epoch": 875} {"train_loss": -20.8587589263916, "global_step": 72637, "epoch": 875} {"train_loss": -20.603347778320312, "global_step": 72638, "epoch": 875} {"train_loss": -20.838056564331055, "global_step": 72639, "epoch": 875} {"train_loss": -20.620067596435547, "global_step": 72640, "epoch": 875} {"train_loss": -21.07284927368164, "global_step": 72641, "epoch": 875} {"train_loss": -20.725217819213867, "global_step": 72642, "epoch": 875} {"train_loss": -21.133060455322266, "global_step": 72643, "epoch": 875} {"train_loss": -21.05149269104004, "global_step": 72644, "epoch": 875} {"train_loss": -20.59906768798828, "global_step": 72645, "epoch": 875} {"train_loss": -20.63495445251465, "global_step": 72646, "epoch": 875} {"train_loss": -21.270597457885742, "global_step": 72647, "epoch": 875} {"train_loss": -20.748029708862305, "global_step": 72648, "epoch": 875} {"train_loss": -20.770919799804688, "global_step": 72649, "epoch": 875} {"train_loss": -20.9383602142334, "global_step": 72650, "epoch": 875} {"train_loss": -20.966413497924805, "global_step": 72651, "epoch": 875} {"train_loss": -20.6279354095459, "global_step": 72652, "epoch": 875} {"train_loss": -21.2146053314209, "global_step": 72653, "epoch": 875} {"train_loss": -20.857421875, "global_step": 72654, "epoch": 875} {"train_loss": -20.906009674072266, "global_step": 72655, "epoch": 875} {"train_loss": -20.871932983398438, "global_step": 72656, "epoch": 875} {"train_loss": -20.92353630065918, "global_step": 72657, "epoch": 875} {"train_loss": -20.706396102905273, "global_step": 72658, "epoch": 875} {"train_loss": -21.169355392456055, "global_step": 72659, "epoch": 875} {"train_loss": -21.05049705505371, "global_step": 72660, "epoch": 875} {"train_loss": -20.657529830932617, "global_step": 72661, "epoch": 875} {"train_loss": -20.807586669921875, "global_step": 72662, "epoch": 875} {"train_loss": -21.035661697387695, "global_step": 72663, "epoch": 875} {"train_loss": -21.084287643432617, "global_step": 72664, "epoch": 875} {"train_loss": -20.865110397338867, "global_step": 72665, "epoch": 875} {"train_loss": -20.608850479125977, "global_step": 72666, "epoch": 875} {"train_loss": -21.30671501159668, "global_step": 72667, "epoch": 875} {"train_loss": -21.135465621948242, "global_step": 72668, "epoch": 875} {"train_loss": -20.748737335205078, "global_step": 72669, "epoch": 875} {"train_loss": -21.078813552856445, "global_step": 72670, "epoch": 875} {"train_loss": -20.929378509521484, "global_step": 72671, "epoch": 875} {"train_loss": -21.056838989257812, "global_step": 72672, "epoch": 875} {"train_loss": -20.656982421875, "global_step": 72673, "epoch": 875} {"train_loss": -20.780790328979492, "global_step": 72674, "epoch": 875} {"train_loss": -20.95638084411621, "global_step": 72675, "epoch": 875} {"train_loss": -21.024871826171875, "global_step": 72676, "epoch": 875} {"train_loss": -21.034955978393555, "global_step": 72677, "epoch": 875} {"train_loss": -20.932220458984375, "global_step": 72678, "epoch": 875} {"train_loss": -20.889007568359375, "global_step": 72679, "epoch": 875} {"train_loss": -20.535724639892578, "global_step": 72680, "epoch": 875} {"train_loss": -20.959781646728516, "global_step": 72681, "epoch": 875} {"train_loss": -21.095304489135742, "global_step": 72682, "epoch": 875} {"train_loss": -20.906953811645508, "global_step": 72683, "epoch": 875} {"train_loss": -20.993436813354492, "global_step": 72684, "epoch": 875} {"train_loss": -20.7844181060791, "global_step": 72685, "epoch": 875} {"train_loss": -21.345130920410156, "global_step": 72686, "epoch": 875} {"train_loss": -20.52213478088379, "global_step": 72687, "epoch": 875} {"train_loss": -20.830312728881836, "global_step": 72688, "epoch": 875} {"train_loss": -20.67902183532715, "global_step": 72689, "epoch": 875} {"train_loss": -21.127981185913086, "global_step": 72690, "epoch": 875} {"train_loss": -20.804536819458008, "global_step": 72691, "epoch": 875} {"train_loss": -20.73282814025879, "global_step": 72692, "epoch": 875} {"train_loss": -20.806034088134766, "global_step": 72693, "epoch": 875} {"train_loss": -20.807409286499023, "global_step": 72694, "epoch": 875} {"train_loss": -21.49362564086914, "global_step": 72695, "epoch": 875} {"train_loss": -20.82667350769043, "global_step": 72696, "epoch": 875} {"train_loss": -20.766712188720703, "global_step": 72697, "epoch": 875} {"train_loss": -20.528226852416992, "global_step": 72698, "epoch": 875} {"train_loss": -20.971166610717773, "global_step": 72699, "epoch": 875} {"train_loss": -20.84992790222168, "global_step": 72700, "epoch": 875} {"train_loss": -20.68932342529297, "global_step": 72701, "epoch": 875} {"train_loss": -20.987384796142578, "global_step": 72702, "epoch": 875} {"train_loss": -20.767866134643555, "global_step": 72703, "epoch": 875} {"train_loss": -20.78435516357422, "global_step": 72704, "epoch": 875} {"train_loss": -21.053621292114258, "global_step": 72705, "epoch": 875} {"train_loss": -20.859113693237305, "global_step": 72706, "epoch": 875} {"train_loss": -20.878121778189417, "global_step": 72707, "epoch": 875, "val_loss": 6116760.0} {"train_loss": -20.316707611083984, "global_step": 72708, "epoch": 876} {"train_loss": -20.759233474731445, "global_step": 72709, "epoch": 876} {"train_loss": -20.86183738708496, "global_step": 72710, "epoch": 876} {"train_loss": -20.548429489135742, "global_step": 72711, "epoch": 876} {"train_loss": -20.507577896118164, "global_step": 72712, "epoch": 876} {"train_loss": -20.853660583496094, "global_step": 72713, "epoch": 876} {"train_loss": -20.903881072998047, "global_step": 72714, "epoch": 876} {"train_loss": -20.84893226623535, "global_step": 72715, "epoch": 876} {"train_loss": -20.235807418823242, "global_step": 72716, "epoch": 876} {"train_loss": -20.744487762451172, "global_step": 72717, "epoch": 876} {"train_loss": -20.78461456298828, "global_step": 72718, "epoch": 876} {"train_loss": -20.730762481689453, "global_step": 72719, "epoch": 876} {"train_loss": -20.644506454467773, "global_step": 72720, "epoch": 876} {"train_loss": -20.72183609008789, "global_step": 72721, "epoch": 876} {"train_loss": -20.7193546295166, "global_step": 72722, "epoch": 876} {"train_loss": -20.353200912475586, "global_step": 72723, "epoch": 876} {"train_loss": -20.638172149658203, "global_step": 72724, "epoch": 876} {"train_loss": -20.79242515563965, "global_step": 72725, "epoch": 876} {"train_loss": -21.050500869750977, "global_step": 72726, "epoch": 876} {"train_loss": -20.96988868713379, "global_step": 72727, "epoch": 876} {"train_loss": -20.94744300842285, "global_step": 72728, "epoch": 876} {"train_loss": -21.06452751159668, "global_step": 72729, "epoch": 876} {"train_loss": -20.804643630981445, "global_step": 72730, "epoch": 876} {"train_loss": -21.13071632385254, "global_step": 72731, "epoch": 876} {"train_loss": -20.837167739868164, "global_step": 72732, "epoch": 876} {"train_loss": -21.16248321533203, "global_step": 72733, "epoch": 876} {"train_loss": -20.77741241455078, "global_step": 72734, "epoch": 876} {"train_loss": -20.404895782470703, "global_step": 72735, "epoch": 876} {"train_loss": -20.877777099609375, "global_step": 72736, "epoch": 876} {"train_loss": -21.116012573242188, "global_step": 72737, "epoch": 876} {"train_loss": -21.263839721679688, "global_step": 72738, "epoch": 876} {"train_loss": -20.91969871520996, "global_step": 72739, "epoch": 876} {"train_loss": -21.087993621826172, "global_step": 72740, "epoch": 876} {"train_loss": -21.05232810974121, "global_step": 72741, "epoch": 876} {"train_loss": -21.162649154663086, "global_step": 72742, "epoch": 876} {"train_loss": -20.96135902404785, "global_step": 72743, "epoch": 876} {"train_loss": -20.94430160522461, "global_step": 72744, "epoch": 876} {"train_loss": -20.653127670288086, "global_step": 72745, "epoch": 876} {"train_loss": -21.015226364135742, "global_step": 72746, "epoch": 876} {"train_loss": -20.717674255371094, "global_step": 72747, "epoch": 876} {"train_loss": -21.25376319885254, "global_step": 72748, "epoch": 876} {"train_loss": -20.941463470458984, "global_step": 72749, "epoch": 876} {"train_loss": -21.23781967163086, "global_step": 72750, "epoch": 876} {"train_loss": -20.80440330505371, "global_step": 72751, "epoch": 876} {"train_loss": -21.167312622070312, "global_step": 72752, "epoch": 876} {"train_loss": -20.81414031982422, "global_step": 72753, "epoch": 876} {"train_loss": -20.76888084411621, "global_step": 72754, "epoch": 876} {"train_loss": -20.821918487548828, "global_step": 72755, "epoch": 876} {"train_loss": -20.87055015563965, "global_step": 72756, "epoch": 876} {"train_loss": -20.858417510986328, "global_step": 72757, "epoch": 876} {"train_loss": -20.691307067871094, "global_step": 72758, "epoch": 876} {"train_loss": -20.86187171936035, "global_step": 72759, "epoch": 876} {"train_loss": -20.89291763305664, "global_step": 72760, "epoch": 876} {"train_loss": -20.769262313842773, "global_step": 72761, "epoch": 876} {"train_loss": -20.855541229248047, "global_step": 72762, "epoch": 876} {"train_loss": -20.814708709716797, "global_step": 72763, "epoch": 876} {"train_loss": -20.748889923095703, "global_step": 72764, "epoch": 876} {"train_loss": -20.859222412109375, "global_step": 72765, "epoch": 876} {"train_loss": -20.86554527282715, "global_step": 72766, "epoch": 876} {"train_loss": -20.8599853515625, "global_step": 72767, "epoch": 876} {"train_loss": -21.236906051635742, "global_step": 72768, "epoch": 876} {"train_loss": -20.929492950439453, "global_step": 72769, "epoch": 876} {"train_loss": -20.958587646484375, "global_step": 72770, "epoch": 876} {"train_loss": -21.045316696166992, "global_step": 72771, "epoch": 876} {"train_loss": -20.98456382751465, "global_step": 72772, "epoch": 876} {"train_loss": -21.425846099853516, "global_step": 72773, "epoch": 876} {"train_loss": -21.150192260742188, "global_step": 72774, "epoch": 876} {"train_loss": -20.72027587890625, "global_step": 72775, "epoch": 876} {"train_loss": -20.9781551361084, "global_step": 72776, "epoch": 876} {"train_loss": -21.22299575805664, "global_step": 72777, "epoch": 876} {"train_loss": -21.17621421813965, "global_step": 72778, "epoch": 876} {"train_loss": -21.037511825561523, "global_step": 72779, "epoch": 876} {"train_loss": -21.369430541992188, "global_step": 72780, "epoch": 876} {"train_loss": -20.705610275268555, "global_step": 72781, "epoch": 876} {"train_loss": -20.490177154541016, "global_step": 72782, "epoch": 876} {"train_loss": -21.23410415649414, "global_step": 72783, "epoch": 876} {"train_loss": -20.561246871948242, "global_step": 72784, "epoch": 876} {"train_loss": -20.676410675048828, "global_step": 72785, "epoch": 876} {"train_loss": -20.71652603149414, "global_step": 72786, "epoch": 876} {"train_loss": -20.652612686157227, "global_step": 72787, "epoch": 876} {"train_loss": -20.982145309448242, "global_step": 72788, "epoch": 876} {"train_loss": -20.65860366821289, "global_step": 72789, "epoch": 876} {"train_loss": -20.881928570299262, "global_step": 72790, "epoch": 876, "val_loss": 5906007.5} {"train_loss": -20.608444213867188, "global_step": 72791, "epoch": 877} {"train_loss": -20.505035400390625, "global_step": 72792, "epoch": 877} {"train_loss": -20.426237106323242, "global_step": 72793, "epoch": 877} {"train_loss": -20.18490982055664, "global_step": 72794, "epoch": 877} {"train_loss": -20.560861587524414, "global_step": 72795, "epoch": 877} {"train_loss": -20.960941314697266, "global_step": 72796, "epoch": 877} {"train_loss": -20.81758689880371, "global_step": 72797, "epoch": 877} {"train_loss": -20.51313591003418, "global_step": 72798, "epoch": 877} {"train_loss": -20.877796173095703, "global_step": 72799, "epoch": 877} {"train_loss": -20.566659927368164, "global_step": 72800, "epoch": 877} {"train_loss": -20.79954719543457, "global_step": 72801, "epoch": 877} {"train_loss": -20.535993576049805, "global_step": 72802, "epoch": 877} {"train_loss": -20.63914680480957, "global_step": 72803, "epoch": 877} {"train_loss": -20.927427291870117, "global_step": 72804, "epoch": 877} {"train_loss": -21.025447845458984, "global_step": 72805, "epoch": 877} {"train_loss": -20.8780460357666, "global_step": 72806, "epoch": 877} {"train_loss": -20.90846061706543, "global_step": 72807, "epoch": 877} {"train_loss": -21.107824325561523, "global_step": 72808, "epoch": 877} {"train_loss": -20.86760711669922, "global_step": 72809, "epoch": 877} {"train_loss": -20.985607147216797, "global_step": 72810, "epoch": 877} {"train_loss": -20.89836883544922, "global_step": 72811, "epoch": 877} {"train_loss": -20.91468620300293, "global_step": 72812, "epoch": 877} {"train_loss": -20.991281509399414, "global_step": 72813, "epoch": 877} {"train_loss": -20.69480323791504, "global_step": 72814, "epoch": 877} {"train_loss": -21.13971710205078, "global_step": 72815, "epoch": 877} {"train_loss": -20.765424728393555, "global_step": 72816, "epoch": 877} {"train_loss": -20.85030746459961, "global_step": 72817, "epoch": 877} {"train_loss": -20.849058151245117, "global_step": 72818, "epoch": 877} {"train_loss": -20.88527488708496, "global_step": 72819, "epoch": 877} {"train_loss": -21.099117279052734, "global_step": 72820, "epoch": 877} {"train_loss": -21.387821197509766, "global_step": 72821, "epoch": 877} {"train_loss": -20.766820907592773, "global_step": 72822, "epoch": 877} {"train_loss": -21.26556968688965, "global_step": 72823, "epoch": 877} {"train_loss": -20.878841400146484, "global_step": 72824, "epoch": 877} {"train_loss": -20.9226131439209, "global_step": 72825, "epoch": 877} {"train_loss": -20.951391220092773, "global_step": 72826, "epoch": 877} {"train_loss": -20.735183715820312, "global_step": 72827, "epoch": 877} {"train_loss": -20.792694091796875, "global_step": 72828, "epoch": 877} {"train_loss": -20.996337890625, "global_step": 72829, "epoch": 877} {"train_loss": -21.064868927001953, "global_step": 72830, "epoch": 877} {"train_loss": -20.526273727416992, "global_step": 72831, "epoch": 877} {"train_loss": -20.883941650390625, "global_step": 72832, "epoch": 877} {"train_loss": -20.8201961517334, "global_step": 72833, "epoch": 877} {"train_loss": -20.787519454956055, "global_step": 72834, "epoch": 877} {"train_loss": -20.73294448852539, "global_step": 72835, "epoch": 877} {"train_loss": -21.388395309448242, "global_step": 72836, "epoch": 877} {"train_loss": -21.440725326538086, "global_step": 72837, "epoch": 877} {"train_loss": -21.191221237182617, "global_step": 72838, "epoch": 877} {"train_loss": -21.149206161499023, "global_step": 72839, "epoch": 877} {"train_loss": -20.62168312072754, "global_step": 72840, "epoch": 877} {"train_loss": -20.892810821533203, "global_step": 72841, "epoch": 877} {"train_loss": -20.653593063354492, "global_step": 72842, "epoch": 877} {"train_loss": -20.64332389831543, "global_step": 72843, "epoch": 877} {"train_loss": -20.98883819580078, "global_step": 72844, "epoch": 877} {"train_loss": -21.113962173461914, "global_step": 72845, "epoch": 877} {"train_loss": -20.96748161315918, "global_step": 72846, "epoch": 877} {"train_loss": -21.037378311157227, "global_step": 72847, "epoch": 877} {"train_loss": -21.255407333374023, "global_step": 72848, "epoch": 877} {"train_loss": -20.89492416381836, "global_step": 72849, "epoch": 877} {"train_loss": -20.604780197143555, "global_step": 72850, "epoch": 877} {"train_loss": -20.42852783203125, "global_step": 72851, "epoch": 877} {"train_loss": -20.589523315429688, "global_step": 72852, "epoch": 877} {"train_loss": -21.275184631347656, "global_step": 72853, "epoch": 877} {"train_loss": -20.891021728515625, "global_step": 72854, "epoch": 877} {"train_loss": -20.68980598449707, "global_step": 72855, "epoch": 877} {"train_loss": -20.92042350769043, "global_step": 72856, "epoch": 877} {"train_loss": -20.919818878173828, "global_step": 72857, "epoch": 877} {"train_loss": -20.731739044189453, "global_step": 72858, "epoch": 877} {"train_loss": -20.915395736694336, "global_step": 72859, "epoch": 877} {"train_loss": -21.05500602722168, "global_step": 72860, "epoch": 877} {"train_loss": -20.83057975769043, "global_step": 72861, "epoch": 877} {"train_loss": -20.838876724243164, "global_step": 72862, "epoch": 877} {"train_loss": -21.235458374023438, "global_step": 72863, "epoch": 877} {"train_loss": -20.334745407104492, "global_step": 72864, "epoch": 877} {"train_loss": -21.187597274780273, "global_step": 72865, "epoch": 877} {"train_loss": -20.989044189453125, "global_step": 72866, "epoch": 877} {"train_loss": -20.997480392456055, "global_step": 72867, "epoch": 877} {"train_loss": -20.968595504760742, "global_step": 72868, "epoch": 877} {"train_loss": -20.95887565612793, "global_step": 72869, "epoch": 877} {"train_loss": -21.276578903198242, "global_step": 72870, "epoch": 877} {"train_loss": -21.428125381469727, "global_step": 72871, "epoch": 877} {"train_loss": -21.36258888244629, "global_step": 72872, "epoch": 877} {"train_loss": -20.895567216068866, "global_step": 72873, "epoch": 877, "val_loss": 6209147.0} {"train_loss": -20.575754165649414, "global_step": 72874, "epoch": 878} {"train_loss": -20.299909591674805, "global_step": 72875, "epoch": 878} {"train_loss": -20.661407470703125, "global_step": 72876, "epoch": 878} {"train_loss": -20.430370330810547, "global_step": 72877, "epoch": 878} {"train_loss": -20.798582077026367, "global_step": 72878, "epoch": 878} {"train_loss": -19.994556427001953, "global_step": 72879, "epoch": 878} {"train_loss": -20.355810165405273, "global_step": 72880, "epoch": 878} {"train_loss": -20.518239974975586, "global_step": 72881, "epoch": 878} {"train_loss": -20.964889526367188, "global_step": 72882, "epoch": 878} {"train_loss": -20.69587516784668, "global_step": 72883, "epoch": 878} {"train_loss": -20.866703033447266, "global_step": 72884, "epoch": 878} {"train_loss": -20.706674575805664, "global_step": 72885, "epoch": 878} {"train_loss": -21.028352737426758, "global_step": 72886, "epoch": 878} {"train_loss": -20.59547233581543, "global_step": 72887, "epoch": 878} {"train_loss": -20.778579711914062, "global_step": 72888, "epoch": 878} {"train_loss": -20.29530906677246, "global_step": 72889, "epoch": 878} {"train_loss": -20.95680809020996, "global_step": 72890, "epoch": 878} {"train_loss": -20.786182403564453, "global_step": 72891, "epoch": 878} {"train_loss": -20.80219841003418, "global_step": 72892, "epoch": 878} {"train_loss": -21.09665298461914, "global_step": 72893, "epoch": 878} {"train_loss": -20.88292694091797, "global_step": 72894, "epoch": 878} {"train_loss": -21.0026912689209, "global_step": 72895, "epoch": 878} {"train_loss": -20.644657135009766, "global_step": 72896, "epoch": 878} {"train_loss": -20.59227180480957, "global_step": 72897, "epoch": 878} {"train_loss": -20.7760066986084, "global_step": 72898, "epoch": 878} {"train_loss": -20.794145584106445, "global_step": 72899, "epoch": 878} {"train_loss": -20.704288482666016, "global_step": 72900, "epoch": 878} {"train_loss": -20.859506607055664, "global_step": 72901, "epoch": 878} {"train_loss": -21.1929988861084, "global_step": 72902, "epoch": 878} {"train_loss": -20.973800659179688, "global_step": 72903, "epoch": 878} {"train_loss": -21.373971939086914, "global_step": 72904, "epoch": 878} {"train_loss": -20.970020294189453, "global_step": 72905, "epoch": 878} {"train_loss": -20.890045166015625, "global_step": 72906, "epoch": 878} {"train_loss": -20.807661056518555, "global_step": 72907, "epoch": 878} {"train_loss": -21.137718200683594, "global_step": 72908, "epoch": 878} {"train_loss": -20.900026321411133, "global_step": 72909, "epoch": 878} {"train_loss": -20.992910385131836, "global_step": 72910, "epoch": 878} {"train_loss": -20.778654098510742, "global_step": 72911, "epoch": 878} {"train_loss": -21.243778228759766, "global_step": 72912, "epoch": 878} {"train_loss": -21.25705909729004, "global_step": 72913, "epoch": 878} {"train_loss": -20.82378578186035, "global_step": 72914, "epoch": 878} {"train_loss": -20.902755737304688, "global_step": 72915, "epoch": 878} {"train_loss": -21.12059783935547, "global_step": 72916, "epoch": 878} {"train_loss": -20.92923355102539, "global_step": 72917, "epoch": 878} {"train_loss": -20.91596031188965, "global_step": 72918, "epoch": 878} {"train_loss": -20.951847076416016, "global_step": 72919, "epoch": 878} {"train_loss": -20.718183517456055, "global_step": 72920, "epoch": 878} {"train_loss": -20.64015769958496, "global_step": 72921, "epoch": 878} {"train_loss": -21.009906768798828, "global_step": 72922, "epoch": 878} {"train_loss": -21.237293243408203, "global_step": 72923, "epoch": 878} {"train_loss": -21.07307243347168, "global_step": 72924, "epoch": 878} {"train_loss": -21.086702346801758, "global_step": 72925, "epoch": 878} {"train_loss": -20.94379234313965, "global_step": 72926, "epoch": 878} {"train_loss": -20.819684982299805, "global_step": 72927, "epoch": 878} {"train_loss": -21.26666831970215, "global_step": 72928, "epoch": 878} {"train_loss": -21.22977066040039, "global_step": 72929, "epoch": 878} {"train_loss": -20.74868392944336, "global_step": 72930, "epoch": 878} {"train_loss": -21.044858932495117, "global_step": 72931, "epoch": 878} {"train_loss": -20.537038803100586, "global_step": 72932, "epoch": 878} {"train_loss": -21.230762481689453, "global_step": 72933, "epoch": 878} {"train_loss": -21.212278366088867, "global_step": 72934, "epoch": 878} {"train_loss": -20.974979400634766, "global_step": 72935, "epoch": 878} {"train_loss": -21.009763717651367, "global_step": 72936, "epoch": 878} {"train_loss": -20.919885635375977, "global_step": 72937, "epoch": 878} {"train_loss": -20.6571102142334, "global_step": 72938, "epoch": 878} {"train_loss": -21.24648666381836, "global_step": 72939, "epoch": 878} {"train_loss": -21.444684982299805, "global_step": 72940, "epoch": 878} {"train_loss": -21.202661514282227, "global_step": 72941, "epoch": 878} {"train_loss": -21.01163101196289, "global_step": 72942, "epoch": 878} {"train_loss": -20.946365356445312, "global_step": 72943, "epoch": 878} {"train_loss": -20.93814468383789, "global_step": 72944, "epoch": 878} {"train_loss": -20.90809440612793, "global_step": 72945, "epoch": 878} {"train_loss": -20.540271759033203, "global_step": 72946, "epoch": 878} {"train_loss": -20.86618423461914, "global_step": 72947, "epoch": 878} {"train_loss": -20.68488883972168, "global_step": 72948, "epoch": 878} {"train_loss": -21.127553939819336, "global_step": 72949, "epoch": 878} {"train_loss": -20.987272262573242, "global_step": 72950, "epoch": 878} {"train_loss": -20.948396682739258, "global_step": 72951, "epoch": 878} {"train_loss": -20.734838485717773, "global_step": 72952, "epoch": 878} {"train_loss": -20.757139205932617, "global_step": 72953, "epoch": 878} {"train_loss": -20.74693489074707, "global_step": 72954, "epoch": 878} {"train_loss": -20.82503318786621, "global_step": 72955, "epoch": 878} {"train_loss": -20.878054009862694, "global_step": 72956, "epoch": 878, "val_loss": 6063549.0} {"train_loss": -20.714183807373047, "global_step": 72957, "epoch": 879} {"train_loss": -20.662729263305664, "global_step": 72958, "epoch": 879} {"train_loss": -20.797964096069336, "global_step": 72959, "epoch": 879} {"train_loss": -20.48429298400879, "global_step": 72960, "epoch": 879} {"train_loss": -20.57139015197754, "global_step": 72961, "epoch": 879} {"train_loss": -20.277738571166992, "global_step": 72962, "epoch": 879} {"train_loss": -20.47402000427246, "global_step": 72963, "epoch": 879} {"train_loss": -20.506258010864258, "global_step": 72964, "epoch": 879} {"train_loss": -20.337936401367188, "global_step": 72965, "epoch": 879} {"train_loss": -20.632986068725586, "global_step": 72966, "epoch": 879} {"train_loss": -20.946319580078125, "global_step": 72967, "epoch": 879} {"train_loss": -20.50603675842285, "global_step": 72968, "epoch": 879} {"train_loss": -20.64803123474121, "global_step": 72969, "epoch": 879} {"train_loss": -20.848865509033203, "global_step": 72970, "epoch": 879} {"train_loss": -20.645803451538086, "global_step": 72971, "epoch": 879} {"train_loss": -20.783414840698242, "global_step": 72972, "epoch": 879} {"train_loss": -20.939783096313477, "global_step": 72973, "epoch": 879} {"train_loss": -20.710744857788086, "global_step": 72974, "epoch": 879} {"train_loss": -20.76832389831543, "global_step": 72975, "epoch": 879} {"train_loss": -20.55596351623535, "global_step": 72976, "epoch": 879} {"train_loss": -20.894193649291992, "global_step": 72977, "epoch": 879} {"train_loss": -20.829965591430664, "global_step": 72978, "epoch": 879} {"train_loss": -21.15828514099121, "global_step": 72979, "epoch": 879} {"train_loss": -21.113967895507812, "global_step": 72980, "epoch": 879} {"train_loss": -21.210744857788086, "global_step": 72981, "epoch": 879} {"train_loss": -20.559219360351562, "global_step": 72982, "epoch": 879} {"train_loss": -20.97936248779297, "global_step": 72983, "epoch": 879} {"train_loss": -21.128217697143555, "global_step": 72984, "epoch": 879} {"train_loss": -20.966150283813477, "global_step": 72985, "epoch": 879} {"train_loss": -20.814855575561523, "global_step": 72986, "epoch": 879} {"train_loss": -21.122081756591797, "global_step": 72987, "epoch": 879} {"train_loss": -20.335002899169922, "global_step": 72988, "epoch": 879} {"train_loss": -21.13343620300293, "global_step": 72989, "epoch": 879} {"train_loss": -21.07388687133789, "global_step": 72990, "epoch": 879} {"train_loss": -20.849946975708008, "global_step": 72991, "epoch": 879} {"train_loss": -21.078126907348633, "global_step": 72992, "epoch": 879} {"train_loss": -20.80167579650879, "global_step": 72993, "epoch": 879} {"train_loss": -20.824539184570312, "global_step": 72994, "epoch": 879} {"train_loss": -20.785417556762695, "global_step": 72995, "epoch": 879} {"train_loss": -21.216238021850586, "global_step": 72996, "epoch": 879} {"train_loss": -21.095876693725586, "global_step": 72997, "epoch": 879} {"train_loss": -20.741758346557617, "global_step": 72998, "epoch": 879} {"train_loss": -20.88197898864746, "global_step": 72999, "epoch": 879} {"train_loss": -21.1409969329834, "global_step": 73000, "epoch": 879} {"train_loss": -20.686176300048828, "global_step": 73001, "epoch": 879} {"train_loss": -20.750125885009766, "global_step": 73002, "epoch": 879} {"train_loss": -20.886127471923828, "global_step": 73003, "epoch": 879} {"train_loss": -21.121061325073242, "global_step": 73004, "epoch": 879} {"train_loss": -20.839723587036133, "global_step": 73005, "epoch": 879} {"train_loss": -21.154123306274414, "global_step": 73006, "epoch": 879} {"train_loss": -21.612098693847656, "global_step": 73007, "epoch": 879} {"train_loss": -21.171070098876953, "global_step": 73008, "epoch": 879} {"train_loss": -21.02533531188965, "global_step": 73009, "epoch": 879} {"train_loss": -21.063322067260742, "global_step": 73010, "epoch": 879} {"train_loss": -20.75324058532715, "global_step": 73011, "epoch": 879} {"train_loss": -21.42556381225586, "global_step": 73012, "epoch": 879} {"train_loss": -20.98679542541504, "global_step": 73013, "epoch": 879} {"train_loss": -20.777679443359375, "global_step": 73014, "epoch": 879} {"train_loss": -21.341495513916016, "global_step": 73015, "epoch": 879} {"train_loss": -20.948179244995117, "global_step": 73016, "epoch": 879} {"train_loss": -21.091516494750977, "global_step": 73017, "epoch": 879} {"train_loss": -20.88801383972168, "global_step": 73018, "epoch": 879} {"train_loss": -20.891674041748047, "global_step": 73019, "epoch": 879} {"train_loss": -20.80504608154297, "global_step": 73020, "epoch": 879} {"train_loss": -21.152515411376953, "global_step": 73021, "epoch": 879} {"train_loss": -21.17594337463379, "global_step": 73022, "epoch": 879} {"train_loss": -21.392065048217773, "global_step": 73023, "epoch": 879} {"train_loss": -20.86673355102539, "global_step": 73024, "epoch": 879} {"train_loss": -21.374454498291016, "global_step": 73025, "epoch": 879} {"train_loss": -20.77554702758789, "global_step": 73026, "epoch": 879} {"train_loss": -21.135255813598633, "global_step": 73027, "epoch": 879} {"train_loss": -20.84976577758789, "global_step": 73028, "epoch": 879} {"train_loss": -21.35104751586914, "global_step": 73029, "epoch": 879} {"train_loss": -20.73471450805664, "global_step": 73030, "epoch": 879} {"train_loss": -21.031919479370117, "global_step": 73031, "epoch": 879} {"train_loss": -20.701148986816406, "global_step": 73032, "epoch": 879} {"train_loss": -21.16413688659668, "global_step": 73033, "epoch": 879} {"train_loss": -20.92518424987793, "global_step": 73034, "epoch": 879} {"train_loss": -20.827543258666992, "global_step": 73035, "epoch": 879} {"train_loss": -21.03108787536621, "global_step": 73036, "epoch": 879} {"train_loss": -21.19984245300293, "global_step": 73037, "epoch": 879} {"train_loss": -21.00093650817871, "global_step": 73038, "epoch": 879} {"train_loss": -20.895176301519555, "global_step": 73039, "epoch": 879, "val_loss": 6071213.0} {"train_loss": -20.842191696166992, "global_step": 73040, "epoch": 880} {"train_loss": -20.90328025817871, "global_step": 73041, "epoch": 880} {"train_loss": -20.759361267089844, "global_step": 73042, "epoch": 880} {"train_loss": -21.150053024291992, "global_step": 73043, "epoch": 880} {"train_loss": -20.556732177734375, "global_step": 73044, "epoch": 880} {"train_loss": -20.819608688354492, "global_step": 73045, "epoch": 880} {"train_loss": -20.608915328979492, "global_step": 73046, "epoch": 880} {"train_loss": -20.637807846069336, "global_step": 73047, "epoch": 880} {"train_loss": -20.480573654174805, "global_step": 73048, "epoch": 880} {"train_loss": -20.875858306884766, "global_step": 73049, "epoch": 880} {"train_loss": -20.499080657958984, "global_step": 73050, "epoch": 880} {"train_loss": -21.142398834228516, "global_step": 73051, "epoch": 880} {"train_loss": -20.755836486816406, "global_step": 73052, "epoch": 880} {"train_loss": -20.98213768005371, "global_step": 73053, "epoch": 880} {"train_loss": -20.745899200439453, "global_step": 73054, "epoch": 880} {"train_loss": -20.79292106628418, "global_step": 73055, "epoch": 880} {"train_loss": -20.69598960876465, "global_step": 73056, "epoch": 880} {"train_loss": -20.826391220092773, "global_step": 73057, "epoch": 880} {"train_loss": -20.69361686706543, "global_step": 73058, "epoch": 880} {"train_loss": -21.088607788085938, "global_step": 73059, "epoch": 880} {"train_loss": -20.480741500854492, "global_step": 73060, "epoch": 880} {"train_loss": -20.8225154876709, "global_step": 73061, "epoch": 880} {"train_loss": -21.006301879882812, "global_step": 73062, "epoch": 880} {"train_loss": -20.70265007019043, "global_step": 73063, "epoch": 880} {"train_loss": -21.49039649963379, "global_step": 73064, "epoch": 880} {"train_loss": -20.60012435913086, "global_step": 73065, "epoch": 880} {"train_loss": -20.930204391479492, "global_step": 73066, "epoch": 880} {"train_loss": -20.745161056518555, "global_step": 73067, "epoch": 880} {"train_loss": -20.333250045776367, "global_step": 73068, "epoch": 880} {"train_loss": -20.817434310913086, "global_step": 73069, "epoch": 880} {"train_loss": -20.82908058166504, "global_step": 73070, "epoch": 880} {"train_loss": -20.998624801635742, "global_step": 73071, "epoch": 880} {"train_loss": -20.8149471282959, "global_step": 73072, "epoch": 880} {"train_loss": -20.535503387451172, "global_step": 73073, "epoch": 880} {"train_loss": -20.970687866210938, "global_step": 73074, "epoch": 880} {"train_loss": -20.856470108032227, "global_step": 73075, "epoch": 880} {"train_loss": -20.670637130737305, "global_step": 73076, "epoch": 880} {"train_loss": -21.041339874267578, "global_step": 73077, "epoch": 880} {"train_loss": -21.05091667175293, "global_step": 73078, "epoch": 880} {"train_loss": -20.824316024780273, "global_step": 73079, "epoch": 880} {"train_loss": -20.865894317626953, "global_step": 73080, "epoch": 880} {"train_loss": -21.393949508666992, "global_step": 73081, "epoch": 880} {"train_loss": -21.41796875, "global_step": 73082, "epoch": 880} {"train_loss": -21.157976150512695, "global_step": 73083, "epoch": 880} {"train_loss": -21.0198917388916, "global_step": 73084, "epoch": 880} {"train_loss": -20.9194393157959, "global_step": 73085, "epoch": 880} {"train_loss": -21.079504013061523, "global_step": 73086, "epoch": 880} {"train_loss": -21.062849044799805, "global_step": 73087, "epoch": 880} {"train_loss": -20.62842559814453, "global_step": 73088, "epoch": 880} {"train_loss": -20.743995666503906, "global_step": 73089, "epoch": 880} {"train_loss": -21.030065536499023, "global_step": 73090, "epoch": 880} {"train_loss": -21.197160720825195, "global_step": 73091, "epoch": 880} {"train_loss": -20.843467712402344, "global_step": 73092, "epoch": 880} {"train_loss": -21.442371368408203, "global_step": 73093, "epoch": 880} {"train_loss": -20.696441650390625, "global_step": 73094, "epoch": 880} {"train_loss": -20.989694595336914, "global_step": 73095, "epoch": 880} {"train_loss": -21.0035400390625, "global_step": 73096, "epoch": 880} {"train_loss": -20.595666885375977, "global_step": 73097, "epoch": 880} {"train_loss": -20.81015396118164, "global_step": 73098, "epoch": 880} {"train_loss": -20.86684226989746, "global_step": 73099, "epoch": 880} {"train_loss": -20.90108299255371, "global_step": 73100, "epoch": 880} {"train_loss": -20.913677215576172, "global_step": 73101, "epoch": 880} {"train_loss": -20.943939208984375, "global_step": 73102, "epoch": 880} {"train_loss": -20.84558868408203, "global_step": 73103, "epoch": 880} {"train_loss": -20.929141998291016, "global_step": 73104, "epoch": 880} {"train_loss": -20.808597564697266, "global_step": 73105, "epoch": 880} {"train_loss": -21.13715362548828, "global_step": 73106, "epoch": 880} {"train_loss": -20.987709045410156, "global_step": 73107, "epoch": 880} {"train_loss": -20.783321380615234, "global_step": 73108, "epoch": 880} {"train_loss": -20.897823333740234, "global_step": 73109, "epoch": 880} {"train_loss": -20.87163734436035, "global_step": 73110, "epoch": 880} {"train_loss": -21.091373443603516, "global_step": 73111, "epoch": 880} {"train_loss": -21.04193687438965, "global_step": 73112, "epoch": 880} {"train_loss": -21.29105567932129, "global_step": 73113, "epoch": 880} {"train_loss": -20.63730812072754, "global_step": 73114, "epoch": 880} {"train_loss": -20.607025146484375, "global_step": 73115, "epoch": 880} {"train_loss": -20.803709030151367, "global_step": 73116, "epoch": 880} {"train_loss": -20.78166389465332, "global_step": 73117, "epoch": 880} {"train_loss": -20.468400955200195, "global_step": 73118, "epoch": 880} {"train_loss": -21.058076858520508, "global_step": 73119, "epoch": 880} {"train_loss": -20.801191329956055, "global_step": 73120, "epoch": 880} {"train_loss": -20.94453239440918, "global_step": 73121, "epoch": 880} {"train_loss": -20.88756143041404, "global_step": 73122, "epoch": 880, "val_loss": 5935717.5} {"train_loss": -20.882043838500977, "global_step": 73123, "epoch": 881} {"train_loss": -20.495874404907227, "global_step": 73124, "epoch": 881} {"train_loss": -20.126651763916016, "global_step": 73125, "epoch": 881} {"train_loss": -20.79183006286621, "global_step": 73126, "epoch": 881} {"train_loss": -20.417964935302734, "global_step": 73127, "epoch": 881} {"train_loss": -20.667375564575195, "global_step": 73128, "epoch": 881} {"train_loss": -20.248701095581055, "global_step": 73129, "epoch": 881} {"train_loss": -20.713125228881836, "global_step": 73130, "epoch": 881} {"train_loss": -20.577796936035156, "global_step": 73131, "epoch": 881} {"train_loss": -20.805408477783203, "global_step": 73132, "epoch": 881} {"train_loss": -20.62472915649414, "global_step": 73133, "epoch": 881} {"train_loss": -21.030630111694336, "global_step": 73134, "epoch": 881} {"train_loss": -20.763864517211914, "global_step": 73135, "epoch": 881} {"train_loss": -20.893918991088867, "global_step": 73136, "epoch": 881} {"train_loss": -20.24286460876465, "global_step": 73137, "epoch": 881} {"train_loss": -20.6937313079834, "global_step": 73138, "epoch": 881} {"train_loss": -20.947052001953125, "global_step": 73139, "epoch": 881} {"train_loss": -20.476776123046875, "global_step": 73140, "epoch": 881} {"train_loss": -20.53458595275879, "global_step": 73141, "epoch": 881} {"train_loss": -21.192140579223633, "global_step": 73142, "epoch": 881} {"train_loss": -21.253385543823242, "global_step": 73143, "epoch": 881} {"train_loss": -21.11797332763672, "global_step": 73144, "epoch": 881} {"train_loss": -21.0413761138916, "global_step": 73145, "epoch": 881} {"train_loss": -21.043859481811523, "global_step": 73146, "epoch": 881} {"train_loss": -21.007282257080078, "global_step": 73147, "epoch": 881} {"train_loss": -21.25304412841797, "global_step": 73148, "epoch": 881} {"train_loss": -20.587919235229492, "global_step": 73149, "epoch": 881} {"train_loss": -20.9475154876709, "global_step": 73150, "epoch": 881} {"train_loss": -21.36665153503418, "global_step": 73151, "epoch": 881} {"train_loss": -20.9566593170166, "global_step": 73152, "epoch": 881} {"train_loss": -20.694610595703125, "global_step": 73153, "epoch": 881} {"train_loss": -20.845172882080078, "global_step": 73154, "epoch": 881} {"train_loss": -20.905868530273438, "global_step": 73155, "epoch": 881} {"train_loss": -21.220563888549805, "global_step": 73156, "epoch": 881} {"train_loss": -21.071378707885742, "global_step": 73157, "epoch": 881} {"train_loss": -21.02040672302246, "global_step": 73158, "epoch": 881} {"train_loss": -20.78261375427246, "global_step": 73159, "epoch": 881} {"train_loss": -20.851274490356445, "global_step": 73160, "epoch": 881} {"train_loss": -20.5548038482666, "global_step": 73161, "epoch": 881} {"train_loss": -20.869583129882812, "global_step": 73162, "epoch": 881} {"train_loss": -20.961538314819336, "global_step": 73163, "epoch": 881} {"train_loss": -21.10072135925293, "global_step": 73164, "epoch": 881} {"train_loss": -20.645132064819336, "global_step": 73165, "epoch": 881} {"train_loss": -20.947643280029297, "global_step": 73166, "epoch": 881} {"train_loss": -20.809017181396484, "global_step": 73167, "epoch": 881} {"train_loss": -21.186635971069336, "global_step": 73168, "epoch": 881} {"train_loss": -21.180648803710938, "global_step": 73169, "epoch": 881} {"train_loss": -20.649877548217773, "global_step": 73170, "epoch": 881} {"train_loss": -21.214452743530273, "global_step": 73171, "epoch": 881} {"train_loss": -20.93218231201172, "global_step": 73172, "epoch": 881} {"train_loss": -21.305532455444336, "global_step": 73173, "epoch": 881} {"train_loss": -20.630216598510742, "global_step": 73174, "epoch": 881} {"train_loss": -20.890155792236328, "global_step": 73175, "epoch": 881} {"train_loss": -20.864042282104492, "global_step": 73176, "epoch": 881} {"train_loss": -21.15201187133789, "global_step": 73177, "epoch": 881} {"train_loss": -20.867053985595703, "global_step": 73178, "epoch": 881} {"train_loss": -20.967741012573242, "global_step": 73179, "epoch": 881} {"train_loss": -21.12798500061035, "global_step": 73180, "epoch": 881} {"train_loss": -20.924760818481445, "global_step": 73181, "epoch": 881} {"train_loss": -21.144041061401367, "global_step": 73182, "epoch": 881} {"train_loss": -20.90802574157715, "global_step": 73183, "epoch": 881} {"train_loss": -21.123769760131836, "global_step": 73184, "epoch": 881} {"train_loss": -20.862377166748047, "global_step": 73185, "epoch": 881} {"train_loss": -21.152210235595703, "global_step": 73186, "epoch": 881} {"train_loss": -21.115293502807617, "global_step": 73187, "epoch": 881} {"train_loss": -20.99477195739746, "global_step": 73188, "epoch": 881} {"train_loss": -21.207508087158203, "global_step": 73189, "epoch": 881} {"train_loss": -20.78706169128418, "global_step": 73190, "epoch": 881} {"train_loss": -21.094135284423828, "global_step": 73191, "epoch": 881} {"train_loss": -20.941930770874023, "global_step": 73192, "epoch": 881} {"train_loss": -21.065906524658203, "global_step": 73193, "epoch": 881} {"train_loss": -20.955142974853516, "global_step": 73194, "epoch": 881} {"train_loss": -20.905332565307617, "global_step": 73195, "epoch": 881} {"train_loss": -21.111352920532227, "global_step": 73196, "epoch": 881} {"train_loss": -21.000402450561523, "global_step": 73197, "epoch": 881} {"train_loss": -21.063451766967773, "global_step": 73198, "epoch": 881} {"train_loss": -20.9298152923584, "global_step": 73199, "epoch": 881} {"train_loss": -21.013519287109375, "global_step": 73200, "epoch": 881} {"train_loss": -20.657846450805664, "global_step": 73201, "epoch": 881} {"train_loss": -20.985523223876953, "global_step": 73202, "epoch": 881} {"train_loss": -20.932279586791992, "global_step": 73203, "epoch": 881} {"train_loss": -21.036466598510742, "global_step": 73204, "epoch": 881} {"train_loss": -20.90553552558623, "global_step": 73205, "epoch": 881, "val_loss": 6006277.0} {"train_loss": -20.68317985534668, "global_step": 73206, "epoch": 882} {"train_loss": -21.08441734313965, "global_step": 73207, "epoch": 882} {"train_loss": -20.56790542602539, "global_step": 73208, "epoch": 882} {"train_loss": -20.561506271362305, "global_step": 73209, "epoch": 882} {"train_loss": -20.998632431030273, "global_step": 73210, "epoch": 882} {"train_loss": -20.960376739501953, "global_step": 73211, "epoch": 882} {"train_loss": -20.931447982788086, "global_step": 73212, "epoch": 882} {"train_loss": -20.702695846557617, "global_step": 73213, "epoch": 882} {"train_loss": -20.544187545776367, "global_step": 73214, "epoch": 882} {"train_loss": -20.71392059326172, "global_step": 73215, "epoch": 882} {"train_loss": -21.002878189086914, "global_step": 73216, "epoch": 882} {"train_loss": -21.152366638183594, "global_step": 73217, "epoch": 882} {"train_loss": -20.851612091064453, "global_step": 73218, "epoch": 882} {"train_loss": -20.990732192993164, "global_step": 73219, "epoch": 882} {"train_loss": -20.67935562133789, "global_step": 73220, "epoch": 882} {"train_loss": -20.985233306884766, "global_step": 73221, "epoch": 882} {"train_loss": -21.01787757873535, "global_step": 73222, "epoch": 882} {"train_loss": -20.78376579284668, "global_step": 73223, "epoch": 882} {"train_loss": -20.80168914794922, "global_step": 73224, "epoch": 882} {"train_loss": -21.209890365600586, "global_step": 73225, "epoch": 882} {"train_loss": -20.823307037353516, "global_step": 73226, "epoch": 882} {"train_loss": -21.390356063842773, "global_step": 73227, "epoch": 882} {"train_loss": -20.83536148071289, "global_step": 73228, "epoch": 882} {"train_loss": -21.009563446044922, "global_step": 73229, "epoch": 882} {"train_loss": -21.099590301513672, "global_step": 73230, "epoch": 882} {"train_loss": -20.90140151977539, "global_step": 73231, "epoch": 882} {"train_loss": -20.980260848999023, "global_step": 73232, "epoch": 882} {"train_loss": -21.228376388549805, "global_step": 73233, "epoch": 882} {"train_loss": -21.18747329711914, "global_step": 73234, "epoch": 882} {"train_loss": -20.8419246673584, "global_step": 73235, "epoch": 882} {"train_loss": -21.090078353881836, "global_step": 73236, "epoch": 882} {"train_loss": -21.178586959838867, "global_step": 73237, "epoch": 882} {"train_loss": -20.54111671447754, "global_step": 73238, "epoch": 882} {"train_loss": -20.754898071289062, "global_step": 73239, "epoch": 882} {"train_loss": -21.314023971557617, "global_step": 73240, "epoch": 882} {"train_loss": -20.842374801635742, "global_step": 73241, "epoch": 882} {"train_loss": -20.965803146362305, "global_step": 73242, "epoch": 882} {"train_loss": -21.173383712768555, "global_step": 73243, "epoch": 882} {"train_loss": -21.120960235595703, "global_step": 73244, "epoch": 882} {"train_loss": -20.969213485717773, "global_step": 73245, "epoch": 882} {"train_loss": -21.200712203979492, "global_step": 73246, "epoch": 882} {"train_loss": -21.195680618286133, "global_step": 73247, "epoch": 882} {"train_loss": -21.100147247314453, "global_step": 73248, "epoch": 882} {"train_loss": -20.909635543823242, "global_step": 73249, "epoch": 882} {"train_loss": -20.545181274414062, "global_step": 73250, "epoch": 882} {"train_loss": -21.039209365844727, "global_step": 73251, "epoch": 882} {"train_loss": -21.05756187438965, "global_step": 73252, "epoch": 882} {"train_loss": -21.04741859436035, "global_step": 73253, "epoch": 882} {"train_loss": -20.716232299804688, "global_step": 73254, "epoch": 882} {"train_loss": -20.985107421875, "global_step": 73255, "epoch": 882} {"train_loss": -20.35709571838379, "global_step": 73256, "epoch": 882} {"train_loss": -20.68588638305664, "global_step": 73257, "epoch": 882} {"train_loss": -20.767894744873047, "global_step": 73258, "epoch": 882} {"train_loss": -20.6763916015625, "global_step": 73259, "epoch": 882} {"train_loss": -20.881689071655273, "global_step": 73260, "epoch": 882} {"train_loss": -20.883413314819336, "global_step": 73261, "epoch": 882} {"train_loss": -20.874338150024414, "global_step": 73262, "epoch": 882} {"train_loss": -20.68671417236328, "global_step": 73263, "epoch": 882} {"train_loss": -20.784900665283203, "global_step": 73264, "epoch": 882} {"train_loss": -20.882017135620117, "global_step": 73265, "epoch": 882} {"train_loss": -20.66167449951172, "global_step": 73266, "epoch": 882} {"train_loss": -20.9620418548584, "global_step": 73267, "epoch": 882} {"train_loss": -20.70356559753418, "global_step": 73268, "epoch": 882} {"train_loss": -20.725088119506836, "global_step": 73269, "epoch": 882} {"train_loss": -21.065580368041992, "global_step": 73270, "epoch": 882} {"train_loss": -20.669795989990234, "global_step": 73271, "epoch": 882} {"train_loss": -20.866443634033203, "global_step": 73272, "epoch": 882} {"train_loss": -21.21140480041504, "global_step": 73273, "epoch": 882} {"train_loss": -20.944189071655273, "global_step": 73274, "epoch": 882} {"train_loss": -21.135852813720703, "global_step": 73275, "epoch": 882} {"train_loss": -20.916139602661133, "global_step": 73276, "epoch": 882} {"train_loss": -20.93604850769043, "global_step": 73277, "epoch": 882} {"train_loss": -21.125699996948242, "global_step": 73278, "epoch": 882} {"train_loss": -20.773359298706055, "global_step": 73279, "epoch": 882} {"train_loss": -20.703792572021484, "global_step": 73280, "epoch": 882} {"train_loss": -20.77415657043457, "global_step": 73281, "epoch": 882} {"train_loss": -20.806827545166016, "global_step": 73282, "epoch": 882} {"train_loss": -20.734392166137695, "global_step": 73283, "epoch": 882} {"train_loss": -20.89177131652832, "global_step": 73284, "epoch": 882} {"train_loss": -20.85434913635254, "global_step": 73285, "epoch": 882} {"train_loss": -20.672765731811523, "global_step": 73286, "epoch": 882} {"train_loss": -20.88661766052246, "global_step": 73287, "epoch": 882} {"train_loss": -20.907579766698632, "global_step": 73288, "epoch": 882, "val_loss": 5913267.0} {"train_loss": -21.022924423217773, "global_step": 73289, "epoch": 883} {"train_loss": -20.881484985351562, "global_step": 73290, "epoch": 883} {"train_loss": -20.830114364624023, "global_step": 73291, "epoch": 883} {"train_loss": -20.609113693237305, "global_step": 73292, "epoch": 883} {"train_loss": -20.594009399414062, "global_step": 73293, "epoch": 883} {"train_loss": -20.567285537719727, "global_step": 73294, "epoch": 883} {"train_loss": -20.529605865478516, "global_step": 73295, "epoch": 883} {"train_loss": -20.64544677734375, "global_step": 73296, "epoch": 883} {"train_loss": -20.97606086730957, "global_step": 73297, "epoch": 883} {"train_loss": -20.69268226623535, "global_step": 73298, "epoch": 883} {"train_loss": -21.024301528930664, "global_step": 73299, "epoch": 883} {"train_loss": -21.01727867126465, "global_step": 73300, "epoch": 883} {"train_loss": -20.90911293029785, "global_step": 73301, "epoch": 883} {"train_loss": -20.82430076599121, "global_step": 73302, "epoch": 883} {"train_loss": -20.706838607788086, "global_step": 73303, "epoch": 883} {"train_loss": -21.09359359741211, "global_step": 73304, "epoch": 883} {"train_loss": -21.078786849975586, "global_step": 73305, "epoch": 883} {"train_loss": -21.154096603393555, "global_step": 73306, "epoch": 883} {"train_loss": -21.19464111328125, "global_step": 73307, "epoch": 883} {"train_loss": -21.018640518188477, "global_step": 73308, "epoch": 883} {"train_loss": -20.750680923461914, "global_step": 73309, "epoch": 883} {"train_loss": -20.79030418395996, "global_step": 73310, "epoch": 883} {"train_loss": -21.046749114990234, "global_step": 73311, "epoch": 883} {"train_loss": -21.009510040283203, "global_step": 73312, "epoch": 883} {"train_loss": -21.073806762695312, "global_step": 73313, "epoch": 883} {"train_loss": -21.022703170776367, "global_step": 73314, "epoch": 883} {"train_loss": -20.751432418823242, "global_step": 73315, "epoch": 883} {"train_loss": -20.561832427978516, "global_step": 73316, "epoch": 883} {"train_loss": -20.929162979125977, "global_step": 73317, "epoch": 883} {"train_loss": -20.780277252197266, "global_step": 73318, "epoch": 883} {"train_loss": -21.06316566467285, "global_step": 73319, "epoch": 883} {"train_loss": -20.790966033935547, "global_step": 73320, "epoch": 883} {"train_loss": -20.906808853149414, "global_step": 73321, "epoch": 883} {"train_loss": -20.874921798706055, "global_step": 73322, "epoch": 883} {"train_loss": -20.962392807006836, "global_step": 73323, "epoch": 883} {"train_loss": -20.870634078979492, "global_step": 73324, "epoch": 883} {"train_loss": -20.951580047607422, "global_step": 73325, "epoch": 883} {"train_loss": -21.310638427734375, "global_step": 73326, "epoch": 883} {"train_loss": -20.820669174194336, "global_step": 73327, "epoch": 883} {"train_loss": -21.061477661132812, "global_step": 73328, "epoch": 883} {"train_loss": -20.86488914489746, "global_step": 73329, "epoch": 883} {"train_loss": -20.96181297302246, "global_step": 73330, "epoch": 883} {"train_loss": -20.882888793945312, "global_step": 73331, "epoch": 883} {"train_loss": -20.976966857910156, "global_step": 73332, "epoch": 883} {"train_loss": -21.02638053894043, "global_step": 73333, "epoch": 883} {"train_loss": -20.76786231994629, "global_step": 73334, "epoch": 883} {"train_loss": -20.77028465270996, "global_step": 73335, "epoch": 883} {"train_loss": -20.894887924194336, "global_step": 73336, "epoch": 883} {"train_loss": -20.761526107788086, "global_step": 73337, "epoch": 883} {"train_loss": -20.76114273071289, "global_step": 73338, "epoch": 883} {"train_loss": -21.060958862304688, "global_step": 73339, "epoch": 883} {"train_loss": -20.77579116821289, "global_step": 73340, "epoch": 883} {"train_loss": -21.122507095336914, "global_step": 73341, "epoch": 883} {"train_loss": -20.900192260742188, "global_step": 73342, "epoch": 883} {"train_loss": -21.012434005737305, "global_step": 73343, "epoch": 883} {"train_loss": -21.191831588745117, "global_step": 73344, "epoch": 883} {"train_loss": -20.736988067626953, "global_step": 73345, "epoch": 883} {"train_loss": -20.84443473815918, "global_step": 73346, "epoch": 883} {"train_loss": -21.045623779296875, "global_step": 73347, "epoch": 883} {"train_loss": -20.723466873168945, "global_step": 73348, "epoch": 883} {"train_loss": -20.761199951171875, "global_step": 73349, "epoch": 883} {"train_loss": -21.099884033203125, "global_step": 73350, "epoch": 883} {"train_loss": -20.953672409057617, "global_step": 73351, "epoch": 883} {"train_loss": -21.06663703918457, "global_step": 73352, "epoch": 883} {"train_loss": -21.269704818725586, "global_step": 73353, "epoch": 883} {"train_loss": -20.938175201416016, "global_step": 73354, "epoch": 883} {"train_loss": -20.53809928894043, "global_step": 73355, "epoch": 883} {"train_loss": -20.915246963500977, "global_step": 73356, "epoch": 883} {"train_loss": -20.966110229492188, "global_step": 73357, "epoch": 883} {"train_loss": -21.19562530517578, "global_step": 73358, "epoch": 883} {"train_loss": -21.007598876953125, "global_step": 73359, "epoch": 883} {"train_loss": -21.139846801757812, "global_step": 73360, "epoch": 883} {"train_loss": -21.079679489135742, "global_step": 73361, "epoch": 883} {"train_loss": -20.952274322509766, "global_step": 73362, "epoch": 883} {"train_loss": -21.307659149169922, "global_step": 73363, "epoch": 883} {"train_loss": -21.159774780273438, "global_step": 73364, "epoch": 883} {"train_loss": -20.673551559448242, "global_step": 73365, "epoch": 883} {"train_loss": -21.05765724182129, "global_step": 73366, "epoch": 883} {"train_loss": -21.106916427612305, "global_step": 73367, "epoch": 883} {"train_loss": -20.842477798461914, "global_step": 73368, "epoch": 883} {"train_loss": -21.00901222229004, "global_step": 73369, "epoch": 883} {"train_loss": -21.162473678588867, "global_step": 73370, "epoch": 883} {"train_loss": -20.927463899175805, "global_step": 73371, "epoch": 883, "val_loss": 6091087.0} {"train_loss": -20.46780776977539, "global_step": 73372, "epoch": 884} {"train_loss": -20.606128692626953, "global_step": 73373, "epoch": 884} {"train_loss": -20.94451904296875, "global_step": 73374, "epoch": 884} {"train_loss": -20.483707427978516, "global_step": 73375, "epoch": 884} {"train_loss": -20.75669288635254, "global_step": 73376, "epoch": 884} {"train_loss": -20.05848503112793, "global_step": 73377, "epoch": 884} {"train_loss": -20.5833740234375, "global_step": 73378, "epoch": 884} {"train_loss": -20.531503677368164, "global_step": 73379, "epoch": 884} {"train_loss": -20.796157836914062, "global_step": 73380, "epoch": 884} {"train_loss": -21.041500091552734, "global_step": 73381, "epoch": 884} {"train_loss": -20.60383415222168, "global_step": 73382, "epoch": 884} {"train_loss": -20.94205665588379, "global_step": 73383, "epoch": 884} {"train_loss": -20.93097496032715, "global_step": 73384, "epoch": 884} {"train_loss": -20.533082962036133, "global_step": 73385, "epoch": 884} {"train_loss": -20.89266586303711, "global_step": 73386, "epoch": 884} {"train_loss": -20.767271041870117, "global_step": 73387, "epoch": 884} {"train_loss": -20.537078857421875, "global_step": 73388, "epoch": 884} {"train_loss": -20.57977294921875, "global_step": 73389, "epoch": 884} {"train_loss": -20.907007217407227, "global_step": 73390, "epoch": 884} {"train_loss": -20.669971466064453, "global_step": 73391, "epoch": 884} {"train_loss": -20.447479248046875, "global_step": 73392, "epoch": 884} {"train_loss": -21.183773040771484, "global_step": 73393, "epoch": 884} {"train_loss": -20.821645736694336, "global_step": 73394, "epoch": 884} {"train_loss": -20.87546730041504, "global_step": 73395, "epoch": 884} {"train_loss": -20.618682861328125, "global_step": 73396, "epoch": 884} {"train_loss": -20.96620750427246, "global_step": 73397, "epoch": 884} {"train_loss": -20.759119033813477, "global_step": 73398, "epoch": 884} {"train_loss": -20.46358871459961, "global_step": 73399, "epoch": 884} {"train_loss": -21.233379364013672, "global_step": 73400, "epoch": 884} {"train_loss": -20.530029296875, "global_step": 73401, "epoch": 884} {"train_loss": -21.095266342163086, "global_step": 73402, "epoch": 884} {"train_loss": -20.982290267944336, "global_step": 73403, "epoch": 884} {"train_loss": -20.575035095214844, "global_step": 73404, "epoch": 884} {"train_loss": -20.944665908813477, "global_step": 73405, "epoch": 884} {"train_loss": -21.043439865112305, "global_step": 73406, "epoch": 884} {"train_loss": -20.884931564331055, "global_step": 73407, "epoch": 884} {"train_loss": -20.472509384155273, "global_step": 73408, "epoch": 884} {"train_loss": -20.97171974182129, "global_step": 73409, "epoch": 884} {"train_loss": -21.188566207885742, "global_step": 73410, "epoch": 884} {"train_loss": -20.73033905029297, "global_step": 73411, "epoch": 884} {"train_loss": -20.97710609436035, "global_step": 73412, "epoch": 884} {"train_loss": -20.942115783691406, "global_step": 73413, "epoch": 884} {"train_loss": -20.511566162109375, "global_step": 73414, "epoch": 884} {"train_loss": -20.81123161315918, "global_step": 73415, "epoch": 884} {"train_loss": -20.803640365600586, "global_step": 73416, "epoch": 884} {"train_loss": -20.807157516479492, "global_step": 73417, "epoch": 884} {"train_loss": -20.9219913482666, "global_step": 73418, "epoch": 884} {"train_loss": -21.01510238647461, "global_step": 73419, "epoch": 884} {"train_loss": -21.129987716674805, "global_step": 73420, "epoch": 884} {"train_loss": -21.055204391479492, "global_step": 73421, "epoch": 884} {"train_loss": -20.907148361206055, "global_step": 73422, "epoch": 884} {"train_loss": -20.938674926757812, "global_step": 73423, "epoch": 884} {"train_loss": -20.561262130737305, "global_step": 73424, "epoch": 884} {"train_loss": -20.94782829284668, "global_step": 73425, "epoch": 884} {"train_loss": -21.22223472595215, "global_step": 73426, "epoch": 884} {"train_loss": -21.034780502319336, "global_step": 73427, "epoch": 884} {"train_loss": -20.913127899169922, "global_step": 73428, "epoch": 884} {"train_loss": -20.755229949951172, "global_step": 73429, "epoch": 884} {"train_loss": -20.64365577697754, "global_step": 73430, "epoch": 884} {"train_loss": -20.823028564453125, "global_step": 73431, "epoch": 884} {"train_loss": -21.113069534301758, "global_step": 73432, "epoch": 884} {"train_loss": -20.63851547241211, "global_step": 73433, "epoch": 884} {"train_loss": -20.903228759765625, "global_step": 73434, "epoch": 884} {"train_loss": -21.217649459838867, "global_step": 73435, "epoch": 884} {"train_loss": -20.880929946899414, "global_step": 73436, "epoch": 884} {"train_loss": -21.135934829711914, "global_step": 73437, "epoch": 884} {"train_loss": -20.886260986328125, "global_step": 73438, "epoch": 884} {"train_loss": -21.430885314941406, "global_step": 73439, "epoch": 884} {"train_loss": -21.4591121673584, "global_step": 73440, "epoch": 884} {"train_loss": -21.082372665405273, "global_step": 73441, "epoch": 884} {"train_loss": -21.020845413208008, "global_step": 73442, "epoch": 884} {"train_loss": -20.88506507873535, "global_step": 73443, "epoch": 884} {"train_loss": -20.931638717651367, "global_step": 73444, "epoch": 884} {"train_loss": -21.168861389160156, "global_step": 73445, "epoch": 884} {"train_loss": -20.72274398803711, "global_step": 73446, "epoch": 884} {"train_loss": -21.216243743896484, "global_step": 73447, "epoch": 884} {"train_loss": -21.04886817932129, "global_step": 73448, "epoch": 884} {"train_loss": -20.843229293823242, "global_step": 73449, "epoch": 884} {"train_loss": -20.803232192993164, "global_step": 73450, "epoch": 884} {"train_loss": -21.01301383972168, "global_step": 73451, "epoch": 884} {"train_loss": -20.8055477142334, "global_step": 73452, "epoch": 884} {"train_loss": -21.049530029296875, "global_step": 73453, "epoch": 884} {"train_loss": -20.872239009443536, "global_step": 73454, "epoch": 884, "val_loss": 5980173.0} {"train_loss": -20.67974853515625, "global_step": 73455, "epoch": 885} {"train_loss": -20.45989990234375, "global_step": 73456, "epoch": 885} {"train_loss": -20.789466857910156, "global_step": 73457, "epoch": 885} {"train_loss": -20.45444107055664, "global_step": 73458, "epoch": 885} {"train_loss": -20.516721725463867, "global_step": 73459, "epoch": 885} {"train_loss": -20.67305564880371, "global_step": 73460, "epoch": 885} {"train_loss": -20.690153121948242, "global_step": 73461, "epoch": 885} {"train_loss": -20.580102920532227, "global_step": 73462, "epoch": 885} {"train_loss": -20.493507385253906, "global_step": 73463, "epoch": 885} {"train_loss": -20.7978515625, "global_step": 73464, "epoch": 885} {"train_loss": -20.751667022705078, "global_step": 73465, "epoch": 885} {"train_loss": -20.318281173706055, "global_step": 73466, "epoch": 885} {"train_loss": -21.420957565307617, "global_step": 73467, "epoch": 885} {"train_loss": -20.42655372619629, "global_step": 73468, "epoch": 885} {"train_loss": -20.70514488220215, "global_step": 73469, "epoch": 885} {"train_loss": -20.605716705322266, "global_step": 73470, "epoch": 885} {"train_loss": -20.90955352783203, "global_step": 73471, "epoch": 885} {"train_loss": -20.877695083618164, "global_step": 73472, "epoch": 885} {"train_loss": -21.047842025756836, "global_step": 73473, "epoch": 885} {"train_loss": -21.2741756439209, "global_step": 73474, "epoch": 885} {"train_loss": -20.515913009643555, "global_step": 73475, "epoch": 885} {"train_loss": -20.549245834350586, "global_step": 73476, "epoch": 885} {"train_loss": -20.95199203491211, "global_step": 73477, "epoch": 885} {"train_loss": -20.792463302612305, "global_step": 73478, "epoch": 885} {"train_loss": -21.414165496826172, "global_step": 73479, "epoch": 885} {"train_loss": -20.857938766479492, "global_step": 73480, "epoch": 885} {"train_loss": -20.758718490600586, "global_step": 73481, "epoch": 885} {"train_loss": -21.082794189453125, "global_step": 73482, "epoch": 885} {"train_loss": -20.97881317138672, "global_step": 73483, "epoch": 885} {"train_loss": -21.18045425415039, "global_step": 73484, "epoch": 885} {"train_loss": -21.071544647216797, "global_step": 73485, "epoch": 885} {"train_loss": -20.774206161499023, "global_step": 73486, "epoch": 885} {"train_loss": -21.179616928100586, "global_step": 73487, "epoch": 885} {"train_loss": -21.320348739624023, "global_step": 73488, "epoch": 885} {"train_loss": -21.00741958618164, "global_step": 73489, "epoch": 885} {"train_loss": -20.867488861083984, "global_step": 73490, "epoch": 885} {"train_loss": -20.77500343322754, "global_step": 73491, "epoch": 885} {"train_loss": -21.043973922729492, "global_step": 73492, "epoch": 885} {"train_loss": -20.835012435913086, "global_step": 73493, "epoch": 885} {"train_loss": -21.1368408203125, "global_step": 73494, "epoch": 885} {"train_loss": -21.214385986328125, "global_step": 73495, "epoch": 885} {"train_loss": -20.8656063079834, "global_step": 73496, "epoch": 885} {"train_loss": -21.14114761352539, "global_step": 73497, "epoch": 885} {"train_loss": -21.250707626342773, "global_step": 73498, "epoch": 885} {"train_loss": -21.30731964111328, "global_step": 73499, "epoch": 885} {"train_loss": -21.242483139038086, "global_step": 73500, "epoch": 885} {"train_loss": -21.01893424987793, "global_step": 73501, "epoch": 885} {"train_loss": -21.029897689819336, "global_step": 73502, "epoch": 885} {"train_loss": -20.770919799804688, "global_step": 73503, "epoch": 885} {"train_loss": -20.743141174316406, "global_step": 73504, "epoch": 885} {"train_loss": -20.658008575439453, "global_step": 73505, "epoch": 885} {"train_loss": -21.425413131713867, "global_step": 73506, "epoch": 885} {"train_loss": -21.059783935546875, "global_step": 73507, "epoch": 885} {"train_loss": -21.1528377532959, "global_step": 73508, "epoch": 885} {"train_loss": -21.04408836364746, "global_step": 73509, "epoch": 885} {"train_loss": -20.80189323425293, "global_step": 73510, "epoch": 885} {"train_loss": -21.039342880249023, "global_step": 73511, "epoch": 885} {"train_loss": -21.04729652404785, "global_step": 73512, "epoch": 885} {"train_loss": -20.829071044921875, "global_step": 73513, "epoch": 885} {"train_loss": -20.839359283447266, "global_step": 73514, "epoch": 885} {"train_loss": -20.97650718688965, "global_step": 73515, "epoch": 885} {"train_loss": -20.623943328857422, "global_step": 73516, "epoch": 885} {"train_loss": -21.11610221862793, "global_step": 73517, "epoch": 885} {"train_loss": -21.162860870361328, "global_step": 73518, "epoch": 885} {"train_loss": -21.073530197143555, "global_step": 73519, "epoch": 885} {"train_loss": -20.995590209960938, "global_step": 73520, "epoch": 885} {"train_loss": -20.800283432006836, "global_step": 73521, "epoch": 885} {"train_loss": -21.101726531982422, "global_step": 73522, "epoch": 885} {"train_loss": -21.142194747924805, "global_step": 73523, "epoch": 885} {"train_loss": -21.255813598632812, "global_step": 73524, "epoch": 885} {"train_loss": -21.029951095581055, "global_step": 73525, "epoch": 885} {"train_loss": -20.88490867614746, "global_step": 73526, "epoch": 885} {"train_loss": -20.81578254699707, "global_step": 73527, "epoch": 885} {"train_loss": -21.451074600219727, "global_step": 73528, "epoch": 885} {"train_loss": -21.144445419311523, "global_step": 73529, "epoch": 885} {"train_loss": -21.17327117919922, "global_step": 73530, "epoch": 885} {"train_loss": -21.046573638916016, "global_step": 73531, "epoch": 885} {"train_loss": -20.989919662475586, "global_step": 73532, "epoch": 885} {"train_loss": -21.190906524658203, "global_step": 73533, "epoch": 885} {"train_loss": -20.859668731689453, "global_step": 73534, "epoch": 885} {"train_loss": -20.831159591674805, "global_step": 73535, "epoch": 885} {"train_loss": -20.71755027770996, "global_step": 73536, "epoch": 885} {"train_loss": -20.914793060486573, "global_step": 73537, "epoch": 885, "val_loss": 6035989.5} {"train_loss": -20.659509658813477, "global_step": 73538, "epoch": 886} {"train_loss": -20.618669509887695, "global_step": 73539, "epoch": 886} {"train_loss": -20.872533798217773, "global_step": 73540, "epoch": 886} {"train_loss": -20.845794677734375, "global_step": 73541, "epoch": 886} {"train_loss": -21.010684967041016, "global_step": 73542, "epoch": 886} {"train_loss": -20.788267135620117, "global_step": 73543, "epoch": 886} {"train_loss": -20.965667724609375, "global_step": 73544, "epoch": 886} {"train_loss": -20.629106521606445, "global_step": 73545, "epoch": 886} {"train_loss": -20.717042922973633, "global_step": 73546, "epoch": 886} {"train_loss": -20.741989135742188, "global_step": 73547, "epoch": 886} {"train_loss": -20.749189376831055, "global_step": 73548, "epoch": 886} {"train_loss": -20.759614944458008, "global_step": 73549, "epoch": 886} {"train_loss": -20.770824432373047, "global_step": 73550, "epoch": 886} {"train_loss": -20.77166748046875, "global_step": 73551, "epoch": 886} {"train_loss": -20.575878143310547, "global_step": 73552, "epoch": 886} {"train_loss": -21.053861618041992, "global_step": 73553, "epoch": 886} {"train_loss": -20.807376861572266, "global_step": 73554, "epoch": 886} {"train_loss": -21.164255142211914, "global_step": 73555, "epoch": 886} {"train_loss": -20.778100967407227, "global_step": 73556, "epoch": 886} {"train_loss": -21.132160186767578, "global_step": 73557, "epoch": 886} {"train_loss": -21.216354370117188, "global_step": 73558, "epoch": 886} {"train_loss": -20.949377059936523, "global_step": 73559, "epoch": 886} {"train_loss": -21.07380485534668, "global_step": 73560, "epoch": 886} {"train_loss": -21.113401412963867, "global_step": 73561, "epoch": 886} {"train_loss": -20.985408782958984, "global_step": 73562, "epoch": 886} {"train_loss": -21.06618309020996, "global_step": 73563, "epoch": 886} {"train_loss": -21.272043228149414, "global_step": 73564, "epoch": 886} {"train_loss": -21.182697296142578, "global_step": 73565, "epoch": 886} {"train_loss": -21.122486114501953, "global_step": 73566, "epoch": 886} {"train_loss": -21.17872428894043, "global_step": 73567, "epoch": 886} {"train_loss": -21.321996688842773, "global_step": 73568, "epoch": 886} {"train_loss": -21.00898551940918, "global_step": 73569, "epoch": 886} {"train_loss": -20.84456443786621, "global_step": 73570, "epoch": 886} {"train_loss": -21.257455825805664, "global_step": 73571, "epoch": 886} {"train_loss": -20.820667266845703, "global_step": 73572, "epoch": 886} {"train_loss": -21.115140914916992, "global_step": 73573, "epoch": 886} {"train_loss": -20.637678146362305, "global_step": 73574, "epoch": 886} {"train_loss": -20.870389938354492, "global_step": 73575, "epoch": 886} {"train_loss": -21.03413200378418, "global_step": 73576, "epoch": 886} {"train_loss": -20.551639556884766, "global_step": 73577, "epoch": 886} {"train_loss": -21.012460708618164, "global_step": 73578, "epoch": 886} {"train_loss": -20.887706756591797, "global_step": 73579, "epoch": 886} {"train_loss": -20.99822998046875, "global_step": 73580, "epoch": 886} {"train_loss": -21.19487953186035, "global_step": 73581, "epoch": 886} {"train_loss": -21.216623306274414, "global_step": 73582, "epoch": 886} {"train_loss": -20.703903198242188, "global_step": 73583, "epoch": 886} {"train_loss": -20.903474807739258, "global_step": 73584, "epoch": 886} {"train_loss": -20.867252349853516, "global_step": 73585, "epoch": 886} {"train_loss": -21.1101131439209, "global_step": 73586, "epoch": 886} {"train_loss": -20.828615188598633, "global_step": 73587, "epoch": 886} {"train_loss": -20.898956298828125, "global_step": 73588, "epoch": 886} {"train_loss": -21.268003463745117, "global_step": 73589, "epoch": 886} {"train_loss": -20.946805953979492, "global_step": 73590, "epoch": 886} {"train_loss": -21.618223190307617, "global_step": 73591, "epoch": 886} {"train_loss": -20.841123580932617, "global_step": 73592, "epoch": 886} {"train_loss": -21.126516342163086, "global_step": 73593, "epoch": 886} {"train_loss": -21.41254234313965, "global_step": 73594, "epoch": 886} {"train_loss": -20.971113204956055, "global_step": 73595, "epoch": 886} {"train_loss": -20.758596420288086, "global_step": 73596, "epoch": 886} {"train_loss": -20.914199829101562, "global_step": 73597, "epoch": 886} {"train_loss": -20.93743896484375, "global_step": 73598, "epoch": 886} {"train_loss": -20.888839721679688, "global_step": 73599, "epoch": 886} {"train_loss": -20.982818603515625, "global_step": 73600, "epoch": 886} {"train_loss": -21.364233016967773, "global_step": 73601, "epoch": 886} {"train_loss": -21.2423095703125, "global_step": 73602, "epoch": 886} {"train_loss": -20.865930557250977, "global_step": 73603, "epoch": 886} {"train_loss": -20.974258422851562, "global_step": 73604, "epoch": 886} {"train_loss": -21.08026123046875, "global_step": 73605, "epoch": 886} {"train_loss": -20.763761520385742, "global_step": 73606, "epoch": 886} {"train_loss": -20.85911750793457, "global_step": 73607, "epoch": 886} {"train_loss": -20.86945915222168, "global_step": 73608, "epoch": 886} {"train_loss": -21.35324478149414, "global_step": 73609, "epoch": 886} {"train_loss": -20.931066513061523, "global_step": 73610, "epoch": 886} {"train_loss": -21.067279815673828, "global_step": 73611, "epoch": 886} {"train_loss": -21.42027473449707, "global_step": 73612, "epoch": 886} {"train_loss": -21.194965362548828, "global_step": 73613, "epoch": 886} {"train_loss": -20.927322387695312, "global_step": 73614, "epoch": 886} {"train_loss": -20.763565063476562, "global_step": 73615, "epoch": 886} {"train_loss": -21.023672103881836, "global_step": 73616, "epoch": 886} {"train_loss": -21.22260856628418, "global_step": 73617, "epoch": 886} {"train_loss": -21.277448654174805, "global_step": 73618, "epoch": 886} {"train_loss": -20.375186920166016, "global_step": 73619, "epoch": 886} {"train_loss": -20.9653194151729, "global_step": 73620, "epoch": 886, "val_loss": 5996482.5} {"train_loss": -20.51979637145996, "global_step": 73621, "epoch": 887} {"train_loss": -20.655973434448242, "global_step": 73622, "epoch": 887} {"train_loss": -20.782445907592773, "global_step": 73623, "epoch": 887} {"train_loss": -20.6685848236084, "global_step": 73624, "epoch": 887} {"train_loss": -21.035306930541992, "global_step": 73625, "epoch": 887} {"train_loss": -20.81525230407715, "global_step": 73626, "epoch": 887} {"train_loss": -20.896636962890625, "global_step": 73627, "epoch": 887} {"train_loss": -21.151424407958984, "global_step": 73628, "epoch": 887} {"train_loss": -20.548002243041992, "global_step": 73629, "epoch": 887} {"train_loss": -20.879562377929688, "global_step": 73630, "epoch": 887} {"train_loss": -20.380556106567383, "global_step": 73631, "epoch": 887} {"train_loss": -20.808502197265625, "global_step": 73632, "epoch": 887} {"train_loss": -20.842947006225586, "global_step": 73633, "epoch": 887} {"train_loss": -20.610124588012695, "global_step": 73634, "epoch": 887} {"train_loss": -21.400455474853516, "global_step": 73635, "epoch": 887} {"train_loss": -21.04825210571289, "global_step": 73636, "epoch": 887} {"train_loss": -20.82673454284668, "global_step": 73637, "epoch": 887} {"train_loss": -21.27373695373535, "global_step": 73638, "epoch": 887} {"train_loss": -20.629213333129883, "global_step": 73639, "epoch": 887} {"train_loss": -21.08357810974121, "global_step": 73640, "epoch": 887} {"train_loss": -20.717315673828125, "global_step": 73641, "epoch": 887} {"train_loss": -20.695093154907227, "global_step": 73642, "epoch": 887} {"train_loss": -20.716466903686523, "global_step": 73643, "epoch": 887} {"train_loss": -20.812471389770508, "global_step": 73644, "epoch": 887} {"train_loss": -20.954864501953125, "global_step": 73645, "epoch": 887} {"train_loss": -21.26761245727539, "global_step": 73646, "epoch": 887} {"train_loss": -20.935049057006836, "global_step": 73647, "epoch": 887} {"train_loss": -21.047321319580078, "global_step": 73648, "epoch": 887} {"train_loss": -20.917518615722656, "global_step": 73649, "epoch": 887} {"train_loss": -21.31722068786621, "global_step": 73650, "epoch": 887} {"train_loss": -20.878253936767578, "global_step": 73651, "epoch": 887} {"train_loss": -21.09856605529785, "global_step": 73652, "epoch": 887} {"train_loss": -21.4471378326416, "global_step": 73653, "epoch": 887} {"train_loss": -20.961503982543945, "global_step": 73654, "epoch": 887} {"train_loss": -21.349790573120117, "global_step": 73655, "epoch": 887} {"train_loss": -20.734960556030273, "global_step": 73656, "epoch": 887} {"train_loss": -21.04506492614746, "global_step": 73657, "epoch": 887} {"train_loss": -20.8073787689209, "global_step": 73658, "epoch": 887} {"train_loss": -20.706357955932617, "global_step": 73659, "epoch": 887} {"train_loss": -20.817123413085938, "global_step": 73660, "epoch": 887} {"train_loss": -20.835046768188477, "global_step": 73661, "epoch": 887} {"train_loss": -21.057178497314453, "global_step": 73662, "epoch": 887} {"train_loss": -20.901792526245117, "global_step": 73663, "epoch": 887} {"train_loss": -20.785131454467773, "global_step": 73664, "epoch": 887} {"train_loss": -20.649023056030273, "global_step": 73665, "epoch": 887} {"train_loss": -21.049970626831055, "global_step": 73666, "epoch": 887} {"train_loss": -21.02107048034668, "global_step": 73667, "epoch": 887} {"train_loss": -20.947736740112305, "global_step": 73668, "epoch": 887} {"train_loss": -20.937429428100586, "global_step": 73669, "epoch": 887} {"train_loss": -20.960895538330078, "global_step": 73670, "epoch": 887} {"train_loss": -20.70453453063965, "global_step": 73671, "epoch": 887} {"train_loss": -20.790138244628906, "global_step": 73672, "epoch": 887} {"train_loss": -20.61098289489746, "global_step": 73673, "epoch": 887} {"train_loss": -20.8653621673584, "global_step": 73674, "epoch": 887} {"train_loss": -21.35685157775879, "global_step": 73675, "epoch": 887} {"train_loss": -20.636310577392578, "global_step": 73676, "epoch": 887} {"train_loss": -20.95977783203125, "global_step": 73677, "epoch": 887} {"train_loss": -20.905210494995117, "global_step": 73678, "epoch": 887} {"train_loss": -20.995746612548828, "global_step": 73679, "epoch": 887} {"train_loss": -20.610614776611328, "global_step": 73680, "epoch": 887} {"train_loss": -21.21271514892578, "global_step": 73681, "epoch": 887} {"train_loss": -20.837614059448242, "global_step": 73682, "epoch": 887} {"train_loss": -20.612607955932617, "global_step": 73683, "epoch": 887} {"train_loss": -21.011682510375977, "global_step": 73684, "epoch": 887} {"train_loss": -20.697538375854492, "global_step": 73685, "epoch": 887} {"train_loss": -21.07463264465332, "global_step": 73686, "epoch": 887} {"train_loss": -20.927101135253906, "global_step": 73687, "epoch": 887} {"train_loss": -20.983346939086914, "global_step": 73688, "epoch": 887} {"train_loss": -20.779146194458008, "global_step": 73689, "epoch": 887} {"train_loss": -20.964811325073242, "global_step": 73690, "epoch": 887} {"train_loss": -20.87080192565918, "global_step": 73691, "epoch": 887} {"train_loss": -21.077369689941406, "global_step": 73692, "epoch": 887} {"train_loss": -21.387447357177734, "global_step": 73693, "epoch": 887} {"train_loss": -20.586185455322266, "global_step": 73694, "epoch": 887} {"train_loss": -21.180051803588867, "global_step": 73695, "epoch": 887} {"train_loss": -20.938440322875977, "global_step": 73696, "epoch": 887} {"train_loss": -21.17415428161621, "global_step": 73697, "epoch": 887} {"train_loss": -20.86275291442871, "global_step": 73698, "epoch": 887} {"train_loss": -21.10735511779785, "global_step": 73699, "epoch": 887} {"train_loss": -20.92008399963379, "global_step": 73700, "epoch": 887} {"train_loss": -21.188491821289062, "global_step": 73701, "epoch": 887} {"train_loss": -21.23170280456543, "global_step": 73702, "epoch": 887} {"train_loss": -20.92352880914527, "global_step": 73703, "epoch": 887, "val_loss": 5911304.5} {"train_loss": -20.175556182861328, "global_step": 73704, "epoch": 888} {"train_loss": -20.204519271850586, "global_step": 73705, "epoch": 888} {"train_loss": -20.277301788330078, "global_step": 73706, "epoch": 888} {"train_loss": -20.887577056884766, "global_step": 73707, "epoch": 888} {"train_loss": -20.45570945739746, "global_step": 73708, "epoch": 888} {"train_loss": -20.372121810913086, "global_step": 73709, "epoch": 888} {"train_loss": -20.30264663696289, "global_step": 73710, "epoch": 888} {"train_loss": -19.841907501220703, "global_step": 73711, "epoch": 888} {"train_loss": -20.252286911010742, "global_step": 73712, "epoch": 888} {"train_loss": -20.52815818786621, "global_step": 73713, "epoch": 888} {"train_loss": -20.998987197875977, "global_step": 73714, "epoch": 888} {"train_loss": -20.49320411682129, "global_step": 73715, "epoch": 888} {"train_loss": -20.853174209594727, "global_step": 73716, "epoch": 888} {"train_loss": -20.69827651977539, "global_step": 73717, "epoch": 888} {"train_loss": -20.605289459228516, "global_step": 73718, "epoch": 888} {"train_loss": -20.497547149658203, "global_step": 73719, "epoch": 888} {"train_loss": -20.571229934692383, "global_step": 73720, "epoch": 888} {"train_loss": -20.721609115600586, "global_step": 73721, "epoch": 888} {"train_loss": -20.813840866088867, "global_step": 73722, "epoch": 888} {"train_loss": -20.522287368774414, "global_step": 73723, "epoch": 888} {"train_loss": -21.095483779907227, "global_step": 73724, "epoch": 888} {"train_loss": -20.978744506835938, "global_step": 73725, "epoch": 888} {"train_loss": -20.875436782836914, "global_step": 73726, "epoch": 888} {"train_loss": -20.6656436920166, "global_step": 73727, "epoch": 888} {"train_loss": -20.853622436523438, "global_step": 73728, "epoch": 888} {"train_loss": -20.911542892456055, "global_step": 73729, "epoch": 888} {"train_loss": -20.783401489257812, "global_step": 73730, "epoch": 888} {"train_loss": -21.21242332458496, "global_step": 73731, "epoch": 888} {"train_loss": -21.271455764770508, "global_step": 73732, "epoch": 888} {"train_loss": -21.02933120727539, "global_step": 73733, "epoch": 888} {"train_loss": -20.922515869140625, "global_step": 73734, "epoch": 888} {"train_loss": -20.77271842956543, "global_step": 73735, "epoch": 888} {"train_loss": -20.9855899810791, "global_step": 73736, "epoch": 888} {"train_loss": -20.789289474487305, "global_step": 73737, "epoch": 888} {"train_loss": -20.953229904174805, "global_step": 73738, "epoch": 888} {"train_loss": -20.926862716674805, "global_step": 73739, "epoch": 888} {"train_loss": -21.228212356567383, "global_step": 73740, "epoch": 888} {"train_loss": -20.869604110717773, "global_step": 73741, "epoch": 888} {"train_loss": -20.827133178710938, "global_step": 73742, "epoch": 888} {"train_loss": -21.077436447143555, "global_step": 73743, "epoch": 888} {"train_loss": -21.06864356994629, "global_step": 73744, "epoch": 888} {"train_loss": -21.125741958618164, "global_step": 73745, "epoch": 888} {"train_loss": -21.104415893554688, "global_step": 73746, "epoch": 888} {"train_loss": -21.175310134887695, "global_step": 73747, "epoch": 888} {"train_loss": -20.782129287719727, "global_step": 73748, "epoch": 888} {"train_loss": -21.081884384155273, "global_step": 73749, "epoch": 888} {"train_loss": -20.871349334716797, "global_step": 73750, "epoch": 888} {"train_loss": -21.13077735900879, "global_step": 73751, "epoch": 888} {"train_loss": -20.661785125732422, "global_step": 73752, "epoch": 888} {"train_loss": -21.109329223632812, "global_step": 73753, "epoch": 888} {"train_loss": -20.761079788208008, "global_step": 73754, "epoch": 888} {"train_loss": -20.642831802368164, "global_step": 73755, "epoch": 888} {"train_loss": -21.17034912109375, "global_step": 73756, "epoch": 888} {"train_loss": -20.903263092041016, "global_step": 73757, "epoch": 888} {"train_loss": -21.016138076782227, "global_step": 73758, "epoch": 888} {"train_loss": -20.67384910583496, "global_step": 73759, "epoch": 888} {"train_loss": -20.998764038085938, "global_step": 73760, "epoch": 888} {"train_loss": -20.76019859313965, "global_step": 73761, "epoch": 888} {"train_loss": -20.92974090576172, "global_step": 73762, "epoch": 888} {"train_loss": -20.933481216430664, "global_step": 73763, "epoch": 888} {"train_loss": -21.061660766601562, "global_step": 73764, "epoch": 888} {"train_loss": -21.155323028564453, "global_step": 73765, "epoch": 888} {"train_loss": -20.7365779876709, "global_step": 73766, "epoch": 888} {"train_loss": -20.760791778564453, "global_step": 73767, "epoch": 888} {"train_loss": -20.96512222290039, "global_step": 73768, "epoch": 888} {"train_loss": -20.985578536987305, "global_step": 73769, "epoch": 888} {"train_loss": -20.991365432739258, "global_step": 73770, "epoch": 888} {"train_loss": -20.724403381347656, "global_step": 73771, "epoch": 888} {"train_loss": -20.768400192260742, "global_step": 73772, "epoch": 888} {"train_loss": -21.390777587890625, "global_step": 73773, "epoch": 888} {"train_loss": -21.082244873046875, "global_step": 73774, "epoch": 888} {"train_loss": -21.29198455810547, "global_step": 73775, "epoch": 888} {"train_loss": -20.948307037353516, "global_step": 73776, "epoch": 888} {"train_loss": -20.9639892578125, "global_step": 73777, "epoch": 888} {"train_loss": -20.903833389282227, "global_step": 73778, "epoch": 888} {"train_loss": -21.034265518188477, "global_step": 73779, "epoch": 888} {"train_loss": -20.839094161987305, "global_step": 73780, "epoch": 888} {"train_loss": -21.158493041992188, "global_step": 73781, "epoch": 888} {"train_loss": -20.793216705322266, "global_step": 73782, "epoch": 888} {"train_loss": -20.807844161987305, "global_step": 73783, "epoch": 888} {"train_loss": -21.014070510864258, "global_step": 73784, "epoch": 888} {"train_loss": -21.07728385925293, "global_step": 73785, "epoch": 888} {"train_loss": -20.85535302219621, "global_step": 73786, "epoch": 888, "val_loss": 5941894.0} {"train_loss": -20.923492431640625, "global_step": 73787, "epoch": 889} {"train_loss": -21.019197463989258, "global_step": 73788, "epoch": 889} {"train_loss": -20.673843383789062, "global_step": 73789, "epoch": 889} {"train_loss": -20.74528694152832, "global_step": 73790, "epoch": 889} {"train_loss": -20.787797927856445, "global_step": 73791, "epoch": 889} {"train_loss": -20.489702224731445, "global_step": 73792, "epoch": 889} {"train_loss": -20.611621856689453, "global_step": 73793, "epoch": 889} {"train_loss": -20.83087730407715, "global_step": 73794, "epoch": 889} {"train_loss": -21.219261169433594, "global_step": 73795, "epoch": 889} {"train_loss": -20.895523071289062, "global_step": 73796, "epoch": 889} {"train_loss": -21.157909393310547, "global_step": 73797, "epoch": 889} {"train_loss": -20.671619415283203, "global_step": 73798, "epoch": 889} {"train_loss": -21.132543563842773, "global_step": 73799, "epoch": 889} {"train_loss": -20.979713439941406, "global_step": 73800, "epoch": 889} {"train_loss": -20.949050903320312, "global_step": 73801, "epoch": 889} {"train_loss": -21.32281494140625, "global_step": 73802, "epoch": 889} {"train_loss": -20.658363342285156, "global_step": 73803, "epoch": 889} {"train_loss": -20.61016845703125, "global_step": 73804, "epoch": 889} {"train_loss": -20.76242446899414, "global_step": 73805, "epoch": 889} {"train_loss": -21.210403442382812, "global_step": 73806, "epoch": 889} {"train_loss": -21.2690486907959, "global_step": 73807, "epoch": 889} {"train_loss": -21.01081085205078, "global_step": 73808, "epoch": 889} {"train_loss": -20.996206283569336, "global_step": 73809, "epoch": 889} {"train_loss": -21.016361236572266, "global_step": 73810, "epoch": 889} {"train_loss": -21.113418579101562, "global_step": 73811, "epoch": 889} {"train_loss": -21.18039321899414, "global_step": 73812, "epoch": 889} {"train_loss": -20.859159469604492, "global_step": 73813, "epoch": 889} {"train_loss": -21.230419158935547, "global_step": 73814, "epoch": 889} {"train_loss": -21.062429428100586, "global_step": 73815, "epoch": 889} {"train_loss": -20.855388641357422, "global_step": 73816, "epoch": 889} {"train_loss": -21.02840232849121, "global_step": 73817, "epoch": 889} {"train_loss": -21.23956298828125, "global_step": 73818, "epoch": 889} {"train_loss": -21.065784454345703, "global_step": 73819, "epoch": 889} {"train_loss": -21.17444610595703, "global_step": 73820, "epoch": 889} {"train_loss": -20.864377975463867, "global_step": 73821, "epoch": 889} {"train_loss": -21.050209045410156, "global_step": 73822, "epoch": 889} {"train_loss": -20.95032501220703, "global_step": 73823, "epoch": 889} {"train_loss": -20.99185562133789, "global_step": 73824, "epoch": 889} {"train_loss": -20.6756649017334, "global_step": 73825, "epoch": 889} {"train_loss": -21.373153686523438, "global_step": 73826, "epoch": 889} {"train_loss": -21.2393741607666, "global_step": 73827, "epoch": 889} {"train_loss": -21.058433532714844, "global_step": 73828, "epoch": 889} {"train_loss": -20.985414505004883, "global_step": 73829, "epoch": 889} {"train_loss": -21.01310157775879, "global_step": 73830, "epoch": 889} {"train_loss": -21.176855087280273, "global_step": 73831, "epoch": 889} {"train_loss": -20.86817741394043, "global_step": 73832, "epoch": 889} {"train_loss": -20.756061553955078, "global_step": 73833, "epoch": 889} {"train_loss": -21.07484245300293, "global_step": 73834, "epoch": 889} {"train_loss": -21.239511489868164, "global_step": 73835, "epoch": 889} {"train_loss": -21.05352783203125, "global_step": 73836, "epoch": 889} {"train_loss": -21.07668113708496, "global_step": 73837, "epoch": 889} {"train_loss": -21.0427303314209, "global_step": 73838, "epoch": 889} {"train_loss": -20.930185317993164, "global_step": 73839, "epoch": 889} {"train_loss": -21.0640811920166, "global_step": 73840, "epoch": 889} {"train_loss": -21.23076820373535, "global_step": 73841, "epoch": 889} {"train_loss": -21.025190353393555, "global_step": 73842, "epoch": 889} {"train_loss": -21.1146183013916, "global_step": 73843, "epoch": 889} {"train_loss": -21.405515670776367, "global_step": 73844, "epoch": 889} {"train_loss": -20.802278518676758, "global_step": 73845, "epoch": 889} {"train_loss": -20.974706649780273, "global_step": 73846, "epoch": 889} {"train_loss": -21.44139862060547, "global_step": 73847, "epoch": 889} {"train_loss": -20.865018844604492, "global_step": 73848, "epoch": 889} {"train_loss": -20.593618392944336, "global_step": 73849, "epoch": 889} {"train_loss": -21.04168128967285, "global_step": 73850, "epoch": 889} {"train_loss": -20.740140914916992, "global_step": 73851, "epoch": 889} {"train_loss": -20.73537254333496, "global_step": 73852, "epoch": 889} {"train_loss": -21.03761100769043, "global_step": 73853, "epoch": 889} {"train_loss": -21.051816940307617, "global_step": 73854, "epoch": 889} {"train_loss": -20.849958419799805, "global_step": 73855, "epoch": 889} {"train_loss": -21.116403579711914, "global_step": 73856, "epoch": 889} {"train_loss": -21.107955932617188, "global_step": 73857, "epoch": 889} {"train_loss": -21.190553665161133, "global_step": 73858, "epoch": 889} {"train_loss": -20.9649658203125, "global_step": 73859, "epoch": 889} {"train_loss": -20.844249725341797, "global_step": 73860, "epoch": 889} {"train_loss": -20.90595817565918, "global_step": 73861, "epoch": 889} {"train_loss": -20.91620445251465, "global_step": 73862, "epoch": 889} {"train_loss": -20.69986915588379, "global_step": 73863, "epoch": 889} {"train_loss": -21.264305114746094, "global_step": 73864, "epoch": 889} {"train_loss": -21.03435516357422, "global_step": 73865, "epoch": 889} {"train_loss": -20.604902267456055, "global_step": 73866, "epoch": 889} {"train_loss": -20.854089736938477, "global_step": 73867, "epoch": 889} {"train_loss": -20.8369083404541, "global_step": 73868, "epoch": 889} {"train_loss": -20.96707059101886, "global_step": 73869, "epoch": 889, "val_loss": 5956989.0} {"train_loss": -21.15829849243164, "global_step": 73870, "epoch": 890} {"train_loss": -20.878190994262695, "global_step": 73871, "epoch": 890} {"train_loss": -20.90235710144043, "global_step": 73872, "epoch": 890} {"train_loss": -20.688329696655273, "global_step": 73873, "epoch": 890} {"train_loss": -21.078344345092773, "global_step": 73874, "epoch": 890} {"train_loss": -20.890544891357422, "global_step": 73875, "epoch": 890} {"train_loss": -21.097631454467773, "global_step": 73876, "epoch": 890} {"train_loss": -20.70662498474121, "global_step": 73877, "epoch": 890} {"train_loss": -20.781099319458008, "global_step": 73878, "epoch": 890} {"train_loss": -21.143457412719727, "global_step": 73879, "epoch": 890} {"train_loss": -21.15538215637207, "global_step": 73880, "epoch": 890} {"train_loss": -20.847698211669922, "global_step": 73881, "epoch": 890} {"train_loss": -21.090694427490234, "global_step": 73882, "epoch": 890} {"train_loss": -20.811508178710938, "global_step": 73883, "epoch": 890} {"train_loss": -21.32440757751465, "global_step": 73884, "epoch": 890} {"train_loss": -20.671911239624023, "global_step": 73885, "epoch": 890} {"train_loss": -20.84413719177246, "global_step": 73886, "epoch": 890} {"train_loss": -21.256742477416992, "global_step": 73887, "epoch": 890} {"train_loss": -20.982376098632812, "global_step": 73888, "epoch": 890} {"train_loss": -21.137958526611328, "global_step": 73889, "epoch": 890} {"train_loss": -21.105337142944336, "global_step": 73890, "epoch": 890} {"train_loss": -20.950864791870117, "global_step": 73891, "epoch": 890} {"train_loss": -20.858203887939453, "global_step": 73892, "epoch": 890} {"train_loss": -20.824100494384766, "global_step": 73893, "epoch": 890} {"train_loss": -21.274412155151367, "global_step": 73894, "epoch": 890} {"train_loss": -20.785669326782227, "global_step": 73895, "epoch": 890} {"train_loss": -20.871463775634766, "global_step": 73896, "epoch": 890} {"train_loss": -21.098419189453125, "global_step": 73897, "epoch": 890} {"train_loss": -20.91547203063965, "global_step": 73898, "epoch": 890} {"train_loss": -20.694477081298828, "global_step": 73899, "epoch": 890} {"train_loss": -20.74644660949707, "global_step": 73900, "epoch": 890} {"train_loss": -20.73055076599121, "global_step": 73901, "epoch": 890} {"train_loss": -21.23862075805664, "global_step": 73902, "epoch": 890} {"train_loss": -20.917821884155273, "global_step": 73903, "epoch": 890} {"train_loss": -20.560794830322266, "global_step": 73904, "epoch": 890} {"train_loss": -20.779605865478516, "global_step": 73905, "epoch": 890} {"train_loss": -20.73099136352539, "global_step": 73906, "epoch": 890} {"train_loss": -20.411401748657227, "global_step": 73907, "epoch": 890} {"train_loss": -21.12360191345215, "global_step": 73908, "epoch": 890} {"train_loss": -21.041982650756836, "global_step": 73909, "epoch": 890} {"train_loss": -20.95075798034668, "global_step": 73910, "epoch": 890} {"train_loss": -21.025487899780273, "global_step": 73911, "epoch": 890} {"train_loss": -21.040693283081055, "global_step": 73912, "epoch": 890} {"train_loss": -21.13275146484375, "global_step": 73913, "epoch": 890} {"train_loss": -21.170028686523438, "global_step": 73914, "epoch": 890} {"train_loss": -20.917749404907227, "global_step": 73915, "epoch": 890} {"train_loss": -21.080608367919922, "global_step": 73916, "epoch": 890} {"train_loss": -21.10297966003418, "global_step": 73917, "epoch": 890} {"train_loss": -21.038257598876953, "global_step": 73918, "epoch": 890} {"train_loss": -21.089069366455078, "global_step": 73919, "epoch": 890} {"train_loss": -21.046606063842773, "global_step": 73920, "epoch": 890} {"train_loss": -21.45709991455078, "global_step": 73921, "epoch": 890} {"train_loss": -20.70485496520996, "global_step": 73922, "epoch": 890} {"train_loss": -20.87876319885254, "global_step": 73923, "epoch": 890} {"train_loss": -21.16192626953125, "global_step": 73924, "epoch": 890} {"train_loss": -21.16227149963379, "global_step": 73925, "epoch": 890} {"train_loss": -20.748220443725586, "global_step": 73926, "epoch": 890} {"train_loss": -20.904773712158203, "global_step": 73927, "epoch": 890} {"train_loss": -20.977094650268555, "global_step": 73928, "epoch": 890} {"train_loss": -21.30817985534668, "global_step": 73929, "epoch": 890} {"train_loss": -21.46125602722168, "global_step": 73930, "epoch": 890} {"train_loss": -21.177539825439453, "global_step": 73931, "epoch": 890} {"train_loss": -21.22395133972168, "global_step": 73932, "epoch": 890} {"train_loss": -20.64997673034668, "global_step": 73933, "epoch": 890} {"train_loss": -21.107236862182617, "global_step": 73934, "epoch": 890} {"train_loss": -21.080589294433594, "global_step": 73935, "epoch": 890} {"train_loss": -21.033018112182617, "global_step": 73936, "epoch": 890} {"train_loss": -20.668739318847656, "global_step": 73937, "epoch": 890} {"train_loss": -21.146255493164062, "global_step": 73938, "epoch": 890} {"train_loss": -20.662960052490234, "global_step": 73939, "epoch": 890} {"train_loss": -21.141164779663086, "global_step": 73940, "epoch": 890} {"train_loss": -20.991559982299805, "global_step": 73941, "epoch": 890} {"train_loss": -21.034168243408203, "global_step": 73942, "epoch": 890} {"train_loss": -21.066360473632812, "global_step": 73943, "epoch": 890} {"train_loss": -21.206493377685547, "global_step": 73944, "epoch": 890} {"train_loss": -21.188871383666992, "global_step": 73945, "epoch": 890} {"train_loss": -21.437091827392578, "global_step": 73946, "epoch": 890} {"train_loss": -21.035493850708008, "global_step": 73947, "epoch": 890} {"train_loss": -20.75725555419922, "global_step": 73948, "epoch": 890} {"train_loss": -21.25196647644043, "global_step": 73949, "epoch": 890} {"train_loss": -21.023008346557617, "global_step": 73950, "epoch": 890} {"train_loss": -20.978727340698242, "global_step": 73951, "epoch": 890} {"train_loss": -20.98949377220797, "global_step": 73952, "epoch": 890, "val_loss": 5952868.0} {"train_loss": -20.813650131225586, "global_step": 73953, "epoch": 891} {"train_loss": -20.861970901489258, "global_step": 73954, "epoch": 891} {"train_loss": -21.27597427368164, "global_step": 73955, "epoch": 891} {"train_loss": -20.28924560546875, "global_step": 73956, "epoch": 891} {"train_loss": -20.794198989868164, "global_step": 73957, "epoch": 891} {"train_loss": -20.70330238342285, "global_step": 73958, "epoch": 891} {"train_loss": -20.6333065032959, "global_step": 73959, "epoch": 891} {"train_loss": -20.80484962463379, "global_step": 73960, "epoch": 891} {"train_loss": -20.743318557739258, "global_step": 73961, "epoch": 891} {"train_loss": -21.08716583251953, "global_step": 73962, "epoch": 891} {"train_loss": -20.971708297729492, "global_step": 73963, "epoch": 891} {"train_loss": -21.089933395385742, "global_step": 73964, "epoch": 891} {"train_loss": -20.97031593322754, "global_step": 73965, "epoch": 891} {"train_loss": -20.8072566986084, "global_step": 73966, "epoch": 891} {"train_loss": -20.81045913696289, "global_step": 73967, "epoch": 891} {"train_loss": -20.938793182373047, "global_step": 73968, "epoch": 891} {"train_loss": -20.62113380432129, "global_step": 73969, "epoch": 891} {"train_loss": -20.704551696777344, "global_step": 73970, "epoch": 891} {"train_loss": -20.64185905456543, "global_step": 73971, "epoch": 891} {"train_loss": -20.777873992919922, "global_step": 73972, "epoch": 891} {"train_loss": -20.76737403869629, "global_step": 73973, "epoch": 891} {"train_loss": -20.754858016967773, "global_step": 73974, "epoch": 891} {"train_loss": -21.069944381713867, "global_step": 73975, "epoch": 891} {"train_loss": -20.942703247070312, "global_step": 73976, "epoch": 891} {"train_loss": -21.126401901245117, "global_step": 73977, "epoch": 891} {"train_loss": -20.7180233001709, "global_step": 73978, "epoch": 891} {"train_loss": -21.467065811157227, "global_step": 73979, "epoch": 891} {"train_loss": -21.041494369506836, "global_step": 73980, "epoch": 891} {"train_loss": -20.89571189880371, "global_step": 73981, "epoch": 891} {"train_loss": -21.23697280883789, "global_step": 73982, "epoch": 891} {"train_loss": -20.96738052368164, "global_step": 73983, "epoch": 891} {"train_loss": -20.513137817382812, "global_step": 73984, "epoch": 891} {"train_loss": -20.8266658782959, "global_step": 73985, "epoch": 891} {"train_loss": -20.85175323486328, "global_step": 73986, "epoch": 891} {"train_loss": -21.159353256225586, "global_step": 73987, "epoch": 891} {"train_loss": -21.046493530273438, "global_step": 73988, "epoch": 891} {"train_loss": -20.90382194519043, "global_step": 73989, "epoch": 891} {"train_loss": -21.150968551635742, "global_step": 73990, "epoch": 891} {"train_loss": -20.965946197509766, "global_step": 73991, "epoch": 891} {"train_loss": -21.190549850463867, "global_step": 73992, "epoch": 891} {"train_loss": -20.984607696533203, "global_step": 73993, "epoch": 891} {"train_loss": -20.621023178100586, "global_step": 73994, "epoch": 891} {"train_loss": -21.000974655151367, "global_step": 73995, "epoch": 891} {"train_loss": -20.755258560180664, "global_step": 73996, "epoch": 891} {"train_loss": -21.192434310913086, "global_step": 73997, "epoch": 891} {"train_loss": -21.004541397094727, "global_step": 73998, "epoch": 891} {"train_loss": -20.95336151123047, "global_step": 73999, "epoch": 891} {"train_loss": -20.667566299438477, "global_step": 74000, "epoch": 891} {"train_loss": -21.44025993347168, "global_step": 74001, "epoch": 891} {"train_loss": -20.9957218170166, "global_step": 74002, "epoch": 891} {"train_loss": -20.621662139892578, "global_step": 74003, "epoch": 891} {"train_loss": -20.972753524780273, "global_step": 74004, "epoch": 891} {"train_loss": -21.09111976623535, "global_step": 74005, "epoch": 891} {"train_loss": -20.97536277770996, "global_step": 74006, "epoch": 891} {"train_loss": -20.658811569213867, "global_step": 74007, "epoch": 891} {"train_loss": -20.431243896484375, "global_step": 74008, "epoch": 891} {"train_loss": -20.842973709106445, "global_step": 74009, "epoch": 891} {"train_loss": -20.806333541870117, "global_step": 74010, "epoch": 891} {"train_loss": -20.56919288635254, "global_step": 74011, "epoch": 891} {"train_loss": -21.112638473510742, "global_step": 74012, "epoch": 891} {"train_loss": -20.9713191986084, "global_step": 74013, "epoch": 891} {"train_loss": -21.53525161743164, "global_step": 74014, "epoch": 891} {"train_loss": -20.73405647277832, "global_step": 74015, "epoch": 891} {"train_loss": -21.127979278564453, "global_step": 74016, "epoch": 891} {"train_loss": -21.03843116760254, "global_step": 74017, "epoch": 891} {"train_loss": -21.0103816986084, "global_step": 74018, "epoch": 891} {"train_loss": -20.79080581665039, "global_step": 74019, "epoch": 891} {"train_loss": -20.93902587890625, "global_step": 74020, "epoch": 891} {"train_loss": -20.822616577148438, "global_step": 74021, "epoch": 891} {"train_loss": -21.031707763671875, "global_step": 74022, "epoch": 891} {"train_loss": -21.453168869018555, "global_step": 74023, "epoch": 891} {"train_loss": -21.085264205932617, "global_step": 74024, "epoch": 891} {"train_loss": -20.702116012573242, "global_step": 74025, "epoch": 891} {"train_loss": -20.928377151489258, "global_step": 74026, "epoch": 891} {"train_loss": -20.72109031677246, "global_step": 74027, "epoch": 891} {"train_loss": -20.57553482055664, "global_step": 74028, "epoch": 891} {"train_loss": -20.837369918823242, "global_step": 74029, "epoch": 891} {"train_loss": -20.525285720825195, "global_step": 74030, "epoch": 891} {"train_loss": -20.90285301208496, "global_step": 74031, "epoch": 891} {"train_loss": -20.937149047851562, "global_step": 74032, "epoch": 891} {"train_loss": -20.933469772338867, "global_step": 74033, "epoch": 891} {"train_loss": -20.68665313720703, "global_step": 74034, "epoch": 891} {"train_loss": -20.895141969244165, "global_step": 74035, "epoch": 891, "val_loss": 6177152.0} {"train_loss": -20.381149291992188, "global_step": 74036, "epoch": 892} {"train_loss": -20.69561195373535, "global_step": 74037, "epoch": 892} {"train_loss": -20.905561447143555, "global_step": 74038, "epoch": 892} {"train_loss": -20.799030303955078, "global_step": 74039, "epoch": 892} {"train_loss": -20.95970344543457, "global_step": 74040, "epoch": 892} {"train_loss": -20.62163734436035, "global_step": 74041, "epoch": 892} {"train_loss": -20.86297607421875, "global_step": 74042, "epoch": 892} {"train_loss": -20.660171508789062, "global_step": 74043, "epoch": 892} {"train_loss": -20.773075103759766, "global_step": 74044, "epoch": 892} {"train_loss": -20.60997772216797, "global_step": 74045, "epoch": 892} {"train_loss": -20.766672134399414, "global_step": 74046, "epoch": 892} {"train_loss": -20.892574310302734, "global_step": 74047, "epoch": 892} {"train_loss": -21.000385284423828, "global_step": 74048, "epoch": 892} {"train_loss": -20.993026733398438, "global_step": 74049, "epoch": 892} {"train_loss": -20.82306480407715, "global_step": 74050, "epoch": 892} {"train_loss": -20.82184410095215, "global_step": 74051, "epoch": 892} {"train_loss": -20.48118019104004, "global_step": 74052, "epoch": 892} {"train_loss": -20.848651885986328, "global_step": 74053, "epoch": 892} {"train_loss": -21.1520938873291, "global_step": 74054, "epoch": 892} {"train_loss": -20.697673797607422, "global_step": 74055, "epoch": 892} {"train_loss": -20.93246841430664, "global_step": 74056, "epoch": 892} {"train_loss": -21.145902633666992, "global_step": 74057, "epoch": 892} {"train_loss": -20.923978805541992, "global_step": 74058, "epoch": 892} {"train_loss": -20.90105628967285, "global_step": 74059, "epoch": 892} {"train_loss": -21.2382869720459, "global_step": 74060, "epoch": 892} {"train_loss": -21.355024337768555, "global_step": 74061, "epoch": 892} {"train_loss": -20.795846939086914, "global_step": 74062, "epoch": 892} {"train_loss": -20.931249618530273, "global_step": 74063, "epoch": 892} {"train_loss": -20.927106857299805, "global_step": 74064, "epoch": 892} {"train_loss": -20.99955177307129, "global_step": 74065, "epoch": 892} {"train_loss": -20.7403564453125, "global_step": 74066, "epoch": 892} {"train_loss": -21.063879013061523, "global_step": 74067, "epoch": 892} {"train_loss": -20.860971450805664, "global_step": 74068, "epoch": 892} {"train_loss": -21.078327178955078, "global_step": 74069, "epoch": 892} {"train_loss": -21.001718521118164, "global_step": 74070, "epoch": 892} {"train_loss": -20.410741806030273, "global_step": 74071, "epoch": 892} {"train_loss": -21.10919189453125, "global_step": 74072, "epoch": 892} {"train_loss": -20.832965850830078, "global_step": 74073, "epoch": 892} {"train_loss": -20.913368225097656, "global_step": 74074, "epoch": 892} {"train_loss": -21.206836700439453, "global_step": 74075, "epoch": 892} {"train_loss": -20.85834503173828, "global_step": 74076, "epoch": 892} {"train_loss": -20.81278419494629, "global_step": 74077, "epoch": 892} {"train_loss": -21.306852340698242, "global_step": 74078, "epoch": 892} {"train_loss": -21.141490936279297, "global_step": 74079, "epoch": 892} {"train_loss": -21.387569427490234, "global_step": 74080, "epoch": 892} {"train_loss": -20.59699249267578, "global_step": 74081, "epoch": 892} {"train_loss": -21.023527145385742, "global_step": 74082, "epoch": 892} {"train_loss": -20.77447509765625, "global_step": 74083, "epoch": 892} {"train_loss": -20.90533447265625, "global_step": 74084, "epoch": 892} {"train_loss": -21.062204360961914, "global_step": 74085, "epoch": 892} {"train_loss": -21.112834930419922, "global_step": 74086, "epoch": 892} {"train_loss": -21.31148338317871, "global_step": 74087, "epoch": 892} {"train_loss": -21.031110763549805, "global_step": 74088, "epoch": 892} {"train_loss": -21.09646987915039, "global_step": 74089, "epoch": 892} {"train_loss": -21.040180206298828, "global_step": 74090, "epoch": 892} {"train_loss": -21.101171493530273, "global_step": 74091, "epoch": 892} {"train_loss": -20.960205078125, "global_step": 74092, "epoch": 892} {"train_loss": -20.970064163208008, "global_step": 74093, "epoch": 892} {"train_loss": -21.068527221679688, "global_step": 74094, "epoch": 892} {"train_loss": -21.173460006713867, "global_step": 74095, "epoch": 892} {"train_loss": -20.936403274536133, "global_step": 74096, "epoch": 892} {"train_loss": -21.23166275024414, "global_step": 74097, "epoch": 892} {"train_loss": -21.12595558166504, "global_step": 74098, "epoch": 892} {"train_loss": -21.023481369018555, "global_step": 74099, "epoch": 892} {"train_loss": -21.26702308654785, "global_step": 74100, "epoch": 892} {"train_loss": -20.798851013183594, "global_step": 74101, "epoch": 892} {"train_loss": -20.85688591003418, "global_step": 74102, "epoch": 892} {"train_loss": -20.736597061157227, "global_step": 74103, "epoch": 892} {"train_loss": -21.14442253112793, "global_step": 74104, "epoch": 892} {"train_loss": -20.77452278137207, "global_step": 74105, "epoch": 892} {"train_loss": -20.45738983154297, "global_step": 74106, "epoch": 892} {"train_loss": -20.79219627380371, "global_step": 74107, "epoch": 892} {"train_loss": -20.898618698120117, "global_step": 74108, "epoch": 892} {"train_loss": -21.153335571289062, "global_step": 74109, "epoch": 892} {"train_loss": -21.06593894958496, "global_step": 74110, "epoch": 892} {"train_loss": -21.25448989868164, "global_step": 74111, "epoch": 892} {"train_loss": -20.830244064331055, "global_step": 74112, "epoch": 892} {"train_loss": -20.72194480895996, "global_step": 74113, "epoch": 892} {"train_loss": -21.095544815063477, "global_step": 74114, "epoch": 892} {"train_loss": -21.195167541503906, "global_step": 74115, "epoch": 892} {"train_loss": -21.13585662841797, "global_step": 74116, "epoch": 892} {"train_loss": -20.905515670776367, "global_step": 74117, "epoch": 892} {"train_loss": -20.937050945787544, "global_step": 74118, "epoch": 892, "val_loss": 6045939.0} {"train_loss": -20.701141357421875, "global_step": 74119, "epoch": 893} {"train_loss": -20.714508056640625, "global_step": 74120, "epoch": 893} {"train_loss": -21.202306747436523, "global_step": 74121, "epoch": 893} {"train_loss": -20.673458099365234, "global_step": 74122, "epoch": 893} {"train_loss": -20.141897201538086, "global_step": 74123, "epoch": 893} {"train_loss": -20.778568267822266, "global_step": 74124, "epoch": 893} {"train_loss": -20.240537643432617, "global_step": 74125, "epoch": 893} {"train_loss": -20.780561447143555, "global_step": 74126, "epoch": 893} {"train_loss": -20.35004234313965, "global_step": 74127, "epoch": 893} {"train_loss": -20.241018295288086, "global_step": 74128, "epoch": 893} {"train_loss": -20.961158752441406, "global_step": 74129, "epoch": 893} {"train_loss": -21.006479263305664, "global_step": 74130, "epoch": 893} {"train_loss": -20.709049224853516, "global_step": 74131, "epoch": 893} {"train_loss": -20.817420959472656, "global_step": 74132, "epoch": 893} {"train_loss": -20.414304733276367, "global_step": 74133, "epoch": 893} {"train_loss": -20.53116798400879, "global_step": 74134, "epoch": 893} {"train_loss": -20.663307189941406, "global_step": 74135, "epoch": 893} {"train_loss": -20.94391441345215, "global_step": 74136, "epoch": 893} {"train_loss": -20.8157901763916, "global_step": 74137, "epoch": 893} {"train_loss": -20.749271392822266, "global_step": 74138, "epoch": 893} {"train_loss": -20.58265495300293, "global_step": 74139, "epoch": 893} {"train_loss": -20.907678604125977, "global_step": 74140, "epoch": 893} {"train_loss": -20.633710861206055, "global_step": 74141, "epoch": 893} {"train_loss": -21.085580825805664, "global_step": 74142, "epoch": 893} {"train_loss": -20.690244674682617, "global_step": 74143, "epoch": 893} {"train_loss": -20.755950927734375, "global_step": 74144, "epoch": 893} {"train_loss": -21.116737365722656, "global_step": 74145, "epoch": 893} {"train_loss": -20.867643356323242, "global_step": 74146, "epoch": 893} {"train_loss": -21.125877380371094, "global_step": 74147, "epoch": 893} {"train_loss": -20.62825584411621, "global_step": 74148, "epoch": 893} {"train_loss": -20.702617645263672, "global_step": 74149, "epoch": 893} {"train_loss": -21.183149337768555, "global_step": 74150, "epoch": 893} {"train_loss": -20.772830963134766, "global_step": 74151, "epoch": 893} {"train_loss": -21.072378158569336, "global_step": 74152, "epoch": 893} {"train_loss": -20.91791343688965, "global_step": 74153, "epoch": 893} {"train_loss": -20.66231346130371, "global_step": 74154, "epoch": 893} {"train_loss": -21.235549926757812, "global_step": 74155, "epoch": 893} {"train_loss": -21.00680923461914, "global_step": 74156, "epoch": 893} {"train_loss": -20.551450729370117, "global_step": 74157, "epoch": 893} {"train_loss": -20.951980590820312, "global_step": 74158, "epoch": 893} {"train_loss": -21.177656173706055, "global_step": 74159, "epoch": 893} {"train_loss": -21.09452247619629, "global_step": 74160, "epoch": 893} {"train_loss": -21.20815658569336, "global_step": 74161, "epoch": 893} {"train_loss": -20.783958435058594, "global_step": 74162, "epoch": 893} {"train_loss": -21.28847312927246, "global_step": 74163, "epoch": 893} {"train_loss": -21.214765548706055, "global_step": 74164, "epoch": 893} {"train_loss": -21.145231246948242, "global_step": 74165, "epoch": 893} {"train_loss": -21.478307723999023, "global_step": 74166, "epoch": 893} {"train_loss": -20.999601364135742, "global_step": 74167, "epoch": 893} {"train_loss": -20.980405807495117, "global_step": 74168, "epoch": 893} {"train_loss": -21.122718811035156, "global_step": 74169, "epoch": 893} {"train_loss": -21.185392379760742, "global_step": 74170, "epoch": 893} {"train_loss": -20.831499099731445, "global_step": 74171, "epoch": 893} {"train_loss": -20.92278480529785, "global_step": 74172, "epoch": 893} {"train_loss": -21.023351669311523, "global_step": 74173, "epoch": 893} {"train_loss": -21.385726928710938, "global_step": 74174, "epoch": 893} {"train_loss": -20.947805404663086, "global_step": 74175, "epoch": 893} {"train_loss": -20.64447593688965, "global_step": 74176, "epoch": 893} {"train_loss": -21.345083236694336, "global_step": 74177, "epoch": 893} {"train_loss": -20.918439865112305, "global_step": 74178, "epoch": 893} {"train_loss": -21.08979606628418, "global_step": 74179, "epoch": 893} {"train_loss": -20.947059631347656, "global_step": 74180, "epoch": 893} {"train_loss": -20.866117477416992, "global_step": 74181, "epoch": 893} {"train_loss": -20.9373722076416, "global_step": 74182, "epoch": 893} {"train_loss": -21.486141204833984, "global_step": 74183, "epoch": 893} {"train_loss": -21.356271743774414, "global_step": 74184, "epoch": 893} {"train_loss": -21.188114166259766, "global_step": 74185, "epoch": 893} {"train_loss": -20.72133445739746, "global_step": 74186, "epoch": 893} {"train_loss": -21.213424682617188, "global_step": 74187, "epoch": 893} {"train_loss": -21.17207145690918, "global_step": 74188, "epoch": 893} {"train_loss": -20.742158889770508, "global_step": 74189, "epoch": 893} {"train_loss": -21.155126571655273, "global_step": 74190, "epoch": 893} {"train_loss": -20.98859214782715, "global_step": 74191, "epoch": 893} {"train_loss": -20.809404373168945, "global_step": 74192, "epoch": 893} {"train_loss": -21.065092086791992, "global_step": 74193, "epoch": 893} {"train_loss": -21.35262107849121, "global_step": 74194, "epoch": 893} {"train_loss": -21.092863082885742, "global_step": 74195, "epoch": 893} {"train_loss": -20.939443588256836, "global_step": 74196, "epoch": 893} {"train_loss": -21.251445770263672, "global_step": 74197, "epoch": 893} {"train_loss": -20.59308433532715, "global_step": 74198, "epoch": 893} {"train_loss": -21.10726547241211, "global_step": 74199, "epoch": 893} {"train_loss": -21.215618133544922, "global_step": 74200, "epoch": 893} {"train_loss": -20.91402816772461, "global_step": 74201, "epoch": 893, "val_loss": 5975583.0} {"train_loss": -19.7945556640625, "global_step": 74202, "epoch": 894} {"train_loss": -20.515270233154297, "global_step": 74203, "epoch": 894} {"train_loss": -20.364398956298828, "global_step": 74204, "epoch": 894} {"train_loss": -20.05582046508789, "global_step": 74205, "epoch": 894} {"train_loss": -20.753559112548828, "global_step": 74206, "epoch": 894} {"train_loss": -19.891881942749023, "global_step": 74207, "epoch": 894} {"train_loss": -19.983051300048828, "global_step": 74208, "epoch": 894} {"train_loss": -20.5011043548584, "global_step": 74209, "epoch": 894} {"train_loss": -20.080591201782227, "global_step": 74210, "epoch": 894} {"train_loss": -20.310802459716797, "global_step": 74211, "epoch": 894} {"train_loss": -20.36503791809082, "global_step": 74212, "epoch": 894} {"train_loss": -20.253311157226562, "global_step": 74213, "epoch": 894} {"train_loss": -20.195653915405273, "global_step": 74214, "epoch": 894} {"train_loss": -20.656574249267578, "global_step": 74215, "epoch": 894} {"train_loss": -20.656362533569336, "global_step": 74216, "epoch": 894} {"train_loss": -20.452306747436523, "global_step": 74217, "epoch": 894} {"train_loss": -20.41570281982422, "global_step": 74218, "epoch": 894} {"train_loss": -20.855695724487305, "global_step": 74219, "epoch": 894} {"train_loss": -20.653451919555664, "global_step": 74220, "epoch": 894} {"train_loss": -20.52761459350586, "global_step": 74221, "epoch": 894} {"train_loss": -20.795507431030273, "global_step": 74222, "epoch": 894} {"train_loss": -20.613718032836914, "global_step": 74223, "epoch": 894} {"train_loss": -20.832416534423828, "global_step": 74224, "epoch": 894} {"train_loss": -20.762571334838867, "global_step": 74225, "epoch": 894} {"train_loss": -20.707666397094727, "global_step": 74226, "epoch": 894} {"train_loss": -20.846546173095703, "global_step": 74227, "epoch": 894} {"train_loss": -20.798612594604492, "global_step": 74228, "epoch": 894} {"train_loss": -20.85371208190918, "global_step": 74229, "epoch": 894} {"train_loss": -20.50731086730957, "global_step": 74230, "epoch": 894} {"train_loss": -20.777372360229492, "global_step": 74231, "epoch": 894} {"train_loss": -21.008859634399414, "global_step": 74232, "epoch": 894} {"train_loss": -20.835813522338867, "global_step": 74233, "epoch": 894} {"train_loss": -20.981962203979492, "global_step": 74234, "epoch": 894} {"train_loss": -20.604618072509766, "global_step": 74235, "epoch": 894} {"train_loss": -20.603525161743164, "global_step": 74236, "epoch": 894} {"train_loss": -20.550500869750977, "global_step": 74237, "epoch": 894} {"train_loss": -20.92424964904785, "global_step": 74238, "epoch": 894} {"train_loss": -20.56254768371582, "global_step": 74239, "epoch": 894} {"train_loss": -20.775362014770508, "global_step": 74240, "epoch": 894} {"train_loss": -20.865467071533203, "global_step": 74241, "epoch": 894} {"train_loss": -20.922033309936523, "global_step": 74242, "epoch": 894} {"train_loss": -20.931583404541016, "global_step": 74243, "epoch": 894} {"train_loss": -20.7442626953125, "global_step": 74244, "epoch": 894} {"train_loss": -20.906274795532227, "global_step": 74245, "epoch": 894} {"train_loss": -21.37409210205078, "global_step": 74246, "epoch": 894} {"train_loss": -20.83199119567871, "global_step": 74247, "epoch": 894} {"train_loss": -20.71442222595215, "global_step": 74248, "epoch": 894} {"train_loss": -21.000394821166992, "global_step": 74249, "epoch": 894} {"train_loss": -21.056079864501953, "global_step": 74250, "epoch": 894} {"train_loss": -20.99199867248535, "global_step": 74251, "epoch": 894} {"train_loss": -20.71404266357422, "global_step": 74252, "epoch": 894} {"train_loss": -20.978595733642578, "global_step": 74253, "epoch": 894} {"train_loss": -20.987802505493164, "global_step": 74254, "epoch": 894} {"train_loss": -21.0200252532959, "global_step": 74255, "epoch": 894} {"train_loss": -21.542158126831055, "global_step": 74256, "epoch": 894} {"train_loss": -21.37091636657715, "global_step": 74257, "epoch": 894} {"train_loss": -20.84330177307129, "global_step": 74258, "epoch": 894} {"train_loss": -21.157007217407227, "global_step": 74259, "epoch": 894} {"train_loss": -20.915451049804688, "global_step": 74260, "epoch": 894} {"train_loss": -20.814634323120117, "global_step": 74261, "epoch": 894} {"train_loss": -21.33510398864746, "global_step": 74262, "epoch": 894} {"train_loss": -21.082386016845703, "global_step": 74263, "epoch": 894} {"train_loss": -21.101926803588867, "global_step": 74264, "epoch": 894} {"train_loss": -21.018718719482422, "global_step": 74265, "epoch": 894} {"train_loss": -20.98482322692871, "global_step": 74266, "epoch": 894} {"train_loss": -21.05461883544922, "global_step": 74267, "epoch": 894} {"train_loss": -21.148244857788086, "global_step": 74268, "epoch": 894} {"train_loss": -21.117895126342773, "global_step": 74269, "epoch": 894} {"train_loss": -21.239643096923828, "global_step": 74270, "epoch": 894} {"train_loss": -20.905582427978516, "global_step": 74271, "epoch": 894} {"train_loss": -20.90168571472168, "global_step": 74272, "epoch": 894} {"train_loss": -21.324487686157227, "global_step": 74273, "epoch": 894} {"train_loss": -21.139760971069336, "global_step": 74274, "epoch": 894} {"train_loss": -21.190820693969727, "global_step": 74275, "epoch": 894} {"train_loss": -20.887298583984375, "global_step": 74276, "epoch": 894} {"train_loss": -20.822065353393555, "global_step": 74277, "epoch": 894} {"train_loss": -20.873397827148438, "global_step": 74278, "epoch": 894} {"train_loss": -20.87190055847168, "global_step": 74279, "epoch": 894} {"train_loss": -21.207843780517578, "global_step": 74280, "epoch": 894} {"train_loss": -20.826963424682617, "global_step": 74281, "epoch": 894} {"train_loss": -20.722850799560547, "global_step": 74282, "epoch": 894} {"train_loss": -21.18635368347168, "global_step": 74283, "epoch": 894} {"train_loss": -20.811133809836512, "global_step": 74284, "epoch": 894, "val_loss": 5925615.5} {"train_loss": -20.527265548706055, "global_step": 74285, "epoch": 895} {"train_loss": -20.590848922729492, "global_step": 74286, "epoch": 895} {"train_loss": -21.028310775756836, "global_step": 74287, "epoch": 895} {"train_loss": -20.921100616455078, "global_step": 74288, "epoch": 895} {"train_loss": -20.753347396850586, "global_step": 74289, "epoch": 895} {"train_loss": -20.8602352142334, "global_step": 74290, "epoch": 895} {"train_loss": -20.28413200378418, "global_step": 74291, "epoch": 895} {"train_loss": -20.667743682861328, "global_step": 74292, "epoch": 895} {"train_loss": -20.75826072692871, "global_step": 74293, "epoch": 895} {"train_loss": -20.911130905151367, "global_step": 74294, "epoch": 895} {"train_loss": -20.695148468017578, "global_step": 74295, "epoch": 895} {"train_loss": -20.883459091186523, "global_step": 74296, "epoch": 895} {"train_loss": -21.230998992919922, "global_step": 74297, "epoch": 895} {"train_loss": -20.773754119873047, "global_step": 74298, "epoch": 895} {"train_loss": -20.965356826782227, "global_step": 74299, "epoch": 895} {"train_loss": -20.703556060791016, "global_step": 74300, "epoch": 895} {"train_loss": -20.87921142578125, "global_step": 74301, "epoch": 895} {"train_loss": -20.796981811523438, "global_step": 74302, "epoch": 895} {"train_loss": -20.767364501953125, "global_step": 74303, "epoch": 895} {"train_loss": -20.853071212768555, "global_step": 74304, "epoch": 895} {"train_loss": -20.863981246948242, "global_step": 74305, "epoch": 895} {"train_loss": -20.94986343383789, "global_step": 74306, "epoch": 895} {"train_loss": -20.914175033569336, "global_step": 74307, "epoch": 895} {"train_loss": -20.78026580810547, "global_step": 74308, "epoch": 895} {"train_loss": -21.070926666259766, "global_step": 74309, "epoch": 895} {"train_loss": -20.837270736694336, "global_step": 74310, "epoch": 895} {"train_loss": -20.938018798828125, "global_step": 74311, "epoch": 895} {"train_loss": -21.320043563842773, "global_step": 74312, "epoch": 895} {"train_loss": -20.705886840820312, "global_step": 74313, "epoch": 895} {"train_loss": -20.734542846679688, "global_step": 74314, "epoch": 895} {"train_loss": -20.79636573791504, "global_step": 74315, "epoch": 895} {"train_loss": -20.947683334350586, "global_step": 74316, "epoch": 895} {"train_loss": -21.206207275390625, "global_step": 74317, "epoch": 895} {"train_loss": -20.535884857177734, "global_step": 74318, "epoch": 895} {"train_loss": -21.081296920776367, "global_step": 74319, "epoch": 895} {"train_loss": -20.91973304748535, "global_step": 74320, "epoch": 895} {"train_loss": -21.154312133789062, "global_step": 74321, "epoch": 895} {"train_loss": -20.8690242767334, "global_step": 74322, "epoch": 895} {"train_loss": -21.0277156829834, "global_step": 74323, "epoch": 895} {"train_loss": -20.942420959472656, "global_step": 74324, "epoch": 895} {"train_loss": -20.732465744018555, "global_step": 74325, "epoch": 895} {"train_loss": -20.883792877197266, "global_step": 74326, "epoch": 895} {"train_loss": -21.192411422729492, "global_step": 74327, "epoch": 895} {"train_loss": -21.327301025390625, "global_step": 74328, "epoch": 895} {"train_loss": -20.973987579345703, "global_step": 74329, "epoch": 895} {"train_loss": -21.213659286499023, "global_step": 74330, "epoch": 895} {"train_loss": -20.65884780883789, "global_step": 74331, "epoch": 895} {"train_loss": -20.906095504760742, "global_step": 74332, "epoch": 895} {"train_loss": -21.037275314331055, "global_step": 74333, "epoch": 895} {"train_loss": -20.9759578704834, "global_step": 74334, "epoch": 895} {"train_loss": -21.02203941345215, "global_step": 74335, "epoch": 895} {"train_loss": -21.224674224853516, "global_step": 74336, "epoch": 895} {"train_loss": -21.370939254760742, "global_step": 74337, "epoch": 895} {"train_loss": -21.127222061157227, "global_step": 74338, "epoch": 895} {"train_loss": -21.139297485351562, "global_step": 74339, "epoch": 895} {"train_loss": -20.926435470581055, "global_step": 74340, "epoch": 895} {"train_loss": -20.608413696289062, "global_step": 74341, "epoch": 895} {"train_loss": -21.114627838134766, "global_step": 74342, "epoch": 895} {"train_loss": -20.987504959106445, "global_step": 74343, "epoch": 895} {"train_loss": -21.112316131591797, "global_step": 74344, "epoch": 895} {"train_loss": -20.912511825561523, "global_step": 74345, "epoch": 895} {"train_loss": -21.006305694580078, "global_step": 74346, "epoch": 895} {"train_loss": -21.056631088256836, "global_step": 74347, "epoch": 895} {"train_loss": -21.18189811706543, "global_step": 74348, "epoch": 895} {"train_loss": -21.285694122314453, "global_step": 74349, "epoch": 895} {"train_loss": -21.15637969970703, "global_step": 74350, "epoch": 895} {"train_loss": -20.52313232421875, "global_step": 74351, "epoch": 895} {"train_loss": -21.00539207458496, "global_step": 74352, "epoch": 895} {"train_loss": -20.998397827148438, "global_step": 74353, "epoch": 895} {"train_loss": -20.967885971069336, "global_step": 74354, "epoch": 895} {"train_loss": -21.18559455871582, "global_step": 74355, "epoch": 895} {"train_loss": -20.948633193969727, "global_step": 74356, "epoch": 895} {"train_loss": -20.984703063964844, "global_step": 74357, "epoch": 895} {"train_loss": -21.04640769958496, "global_step": 74358, "epoch": 895} {"train_loss": -21.125831604003906, "global_step": 74359, "epoch": 895} {"train_loss": -20.970415115356445, "global_step": 74360, "epoch": 895} {"train_loss": -21.17449951171875, "global_step": 74361, "epoch": 895} {"train_loss": -21.27316665649414, "global_step": 74362, "epoch": 895} {"train_loss": -21.18488883972168, "global_step": 74363, "epoch": 895} {"train_loss": -20.83827781677246, "global_step": 74364, "epoch": 895} {"train_loss": -21.359256744384766, "global_step": 74365, "epoch": 895} {"train_loss": -21.220653533935547, "global_step": 74366, "epoch": 895} {"train_loss": -20.9748449210661, "global_step": 74367, "epoch": 895, "val_loss": 6050560.5} {"train_loss": -20.694379806518555, "global_step": 74368, "epoch": 896} {"train_loss": -20.599821090698242, "global_step": 74369, "epoch": 896} {"train_loss": -20.511262893676758, "global_step": 74370, "epoch": 896} {"train_loss": -20.567819595336914, "global_step": 74371, "epoch": 896} {"train_loss": -20.85040283203125, "global_step": 74372, "epoch": 896} {"train_loss": -20.641164779663086, "global_step": 74373, "epoch": 896} {"train_loss": -20.628759384155273, "global_step": 74374, "epoch": 896} {"train_loss": -20.80794334411621, "global_step": 74375, "epoch": 896} {"train_loss": -20.75584602355957, "global_step": 74376, "epoch": 896} {"train_loss": -20.684553146362305, "global_step": 74377, "epoch": 896} {"train_loss": -20.91419792175293, "global_step": 74378, "epoch": 896} {"train_loss": -20.60051918029785, "global_step": 74379, "epoch": 896} {"train_loss": -20.612598419189453, "global_step": 74380, "epoch": 896} {"train_loss": -20.849994659423828, "global_step": 74381, "epoch": 896} {"train_loss": -21.133649826049805, "global_step": 74382, "epoch": 896} {"train_loss": -20.446327209472656, "global_step": 74383, "epoch": 896} {"train_loss": -20.392364501953125, "global_step": 74384, "epoch": 896} {"train_loss": -20.584930419921875, "global_step": 74385, "epoch": 896} {"train_loss": -20.72983741760254, "global_step": 74386, "epoch": 896} {"train_loss": -20.468265533447266, "global_step": 74387, "epoch": 896} {"train_loss": -20.842788696289062, "global_step": 74388, "epoch": 896} {"train_loss": -20.522789001464844, "global_step": 74389, "epoch": 896} {"train_loss": -21.226425170898438, "global_step": 74390, "epoch": 896} {"train_loss": -20.68750762939453, "global_step": 74391, "epoch": 896} {"train_loss": -20.952404022216797, "global_step": 74392, "epoch": 896} {"train_loss": -20.89776039123535, "global_step": 74393, "epoch": 896} {"train_loss": -21.061283111572266, "global_step": 74394, "epoch": 896} {"train_loss": -20.911306381225586, "global_step": 74395, "epoch": 896} {"train_loss": -20.34296417236328, "global_step": 74396, "epoch": 896} {"train_loss": -21.070114135742188, "global_step": 74397, "epoch": 896} {"train_loss": -21.189062118530273, "global_step": 74398, "epoch": 896} {"train_loss": -20.586944580078125, "global_step": 74399, "epoch": 896} {"train_loss": -21.065690994262695, "global_step": 74400, "epoch": 896} {"train_loss": -21.07954978942871, "global_step": 74401, "epoch": 896} {"train_loss": -21.04585838317871, "global_step": 74402, "epoch": 896} {"train_loss": -20.810535430908203, "global_step": 74403, "epoch": 896} {"train_loss": -20.85672950744629, "global_step": 74404, "epoch": 896} {"train_loss": -20.668193817138672, "global_step": 74405, "epoch": 896} {"train_loss": -21.15753936767578, "global_step": 74406, "epoch": 896} {"train_loss": -20.862051010131836, "global_step": 74407, "epoch": 896} {"train_loss": -21.206769943237305, "global_step": 74408, "epoch": 896} {"train_loss": -20.814977645874023, "global_step": 74409, "epoch": 896} {"train_loss": -20.861583709716797, "global_step": 74410, "epoch": 896} {"train_loss": -20.97928237915039, "global_step": 74411, "epoch": 896} {"train_loss": -21.094202041625977, "global_step": 74412, "epoch": 896} {"train_loss": -20.8459529876709, "global_step": 74413, "epoch": 896} {"train_loss": -20.648405075073242, "global_step": 74414, "epoch": 896} {"train_loss": -20.866491317749023, "global_step": 74415, "epoch": 896} {"train_loss": -21.053192138671875, "global_step": 74416, "epoch": 896} {"train_loss": -21.351163864135742, "global_step": 74417, "epoch": 896} {"train_loss": -21.340900421142578, "global_step": 74418, "epoch": 896} {"train_loss": -21.086172103881836, "global_step": 74419, "epoch": 896} {"train_loss": -21.324983596801758, "global_step": 74420, "epoch": 896} {"train_loss": -20.98221778869629, "global_step": 74421, "epoch": 896} {"train_loss": -21.193042755126953, "global_step": 74422, "epoch": 896} {"train_loss": -21.107616424560547, "global_step": 74423, "epoch": 896} {"train_loss": -21.081939697265625, "global_step": 74424, "epoch": 896} {"train_loss": -21.07521629333496, "global_step": 74425, "epoch": 896} {"train_loss": -21.356061935424805, "global_step": 74426, "epoch": 896} {"train_loss": -20.90389060974121, "global_step": 74427, "epoch": 896} {"train_loss": -21.147464752197266, "global_step": 74428, "epoch": 896} {"train_loss": -20.99433708190918, "global_step": 74429, "epoch": 896} {"train_loss": -21.237905502319336, "global_step": 74430, "epoch": 896} {"train_loss": -21.17026138305664, "global_step": 74431, "epoch": 896} {"train_loss": -20.55318832397461, "global_step": 74432, "epoch": 896} {"train_loss": -20.921899795532227, "global_step": 74433, "epoch": 896} {"train_loss": -20.524202346801758, "global_step": 74434, "epoch": 896} {"train_loss": -20.802032470703125, "global_step": 74435, "epoch": 896} {"train_loss": -20.78887939453125, "global_step": 74436, "epoch": 896} {"train_loss": -20.8621768951416, "global_step": 74437, "epoch": 896} {"train_loss": -20.888776779174805, "global_step": 74438, "epoch": 896} {"train_loss": -20.9473819732666, "global_step": 74439, "epoch": 896} {"train_loss": -20.85628890991211, "global_step": 74440, "epoch": 896} {"train_loss": -20.871898651123047, "global_step": 74441, "epoch": 896} {"train_loss": -21.113178253173828, "global_step": 74442, "epoch": 896} {"train_loss": -20.73267364501953, "global_step": 74443, "epoch": 896} {"train_loss": -21.084218978881836, "global_step": 74444, "epoch": 896} {"train_loss": -20.72755241394043, "global_step": 74445, "epoch": 896} {"train_loss": -20.915409088134766, "global_step": 74446, "epoch": 896} {"train_loss": -21.045623779296875, "global_step": 74447, "epoch": 896} {"train_loss": -21.267921447753906, "global_step": 74448, "epoch": 896} {"train_loss": -21.49823570251465, "global_step": 74449, "epoch": 896} {"train_loss": -20.89415210126394, "global_step": 74450, "epoch": 896, "val_loss": 6068115.0} {"train_loss": -20.261493682861328, "global_step": 74451, "epoch": 897} {"train_loss": -20.77461051940918, "global_step": 74452, "epoch": 897} {"train_loss": -20.52583885192871, "global_step": 74453, "epoch": 897} {"train_loss": -20.683250427246094, "global_step": 74454, "epoch": 897} {"train_loss": -21.088638305664062, "global_step": 74455, "epoch": 897} {"train_loss": -20.844268798828125, "global_step": 74456, "epoch": 897} {"train_loss": -20.58986473083496, "global_step": 74457, "epoch": 897} {"train_loss": -21.08272361755371, "global_step": 74458, "epoch": 897} {"train_loss": -20.822107315063477, "global_step": 74459, "epoch": 897} {"train_loss": -20.804933547973633, "global_step": 74460, "epoch": 897} {"train_loss": -20.667705535888672, "global_step": 74461, "epoch": 897} {"train_loss": -20.67289924621582, "global_step": 74462, "epoch": 897} {"train_loss": -20.70513153076172, "global_step": 74463, "epoch": 897} {"train_loss": -20.92106819152832, "global_step": 74464, "epoch": 897} {"train_loss": -20.910140991210938, "global_step": 74465, "epoch": 897} {"train_loss": -20.478498458862305, "global_step": 74466, "epoch": 897} {"train_loss": -20.728788375854492, "global_step": 74467, "epoch": 897} {"train_loss": -20.941274642944336, "global_step": 74468, "epoch": 897} {"train_loss": -20.93438720703125, "global_step": 74469, "epoch": 897} {"train_loss": -20.85103416442871, "global_step": 74470, "epoch": 897} {"train_loss": -21.09743309020996, "global_step": 74471, "epoch": 897} {"train_loss": -20.641788482666016, "global_step": 74472, "epoch": 897} {"train_loss": -21.241619110107422, "global_step": 74473, "epoch": 897} {"train_loss": -20.82375144958496, "global_step": 74474, "epoch": 897} {"train_loss": -21.08905601501465, "global_step": 74475, "epoch": 897} {"train_loss": -20.690685272216797, "global_step": 74476, "epoch": 897} {"train_loss": -21.12978172302246, "global_step": 74477, "epoch": 897} {"train_loss": -20.8209228515625, "global_step": 74478, "epoch": 897} {"train_loss": -21.257293701171875, "global_step": 74479, "epoch": 897} {"train_loss": -20.661508560180664, "global_step": 74480, "epoch": 897} {"train_loss": -20.817724227905273, "global_step": 74481, "epoch": 897} {"train_loss": -21.08913230895996, "global_step": 74482, "epoch": 897} {"train_loss": -20.979520797729492, "global_step": 74483, "epoch": 897} {"train_loss": -20.865625381469727, "global_step": 74484, "epoch": 897} {"train_loss": -20.934675216674805, "global_step": 74485, "epoch": 897} {"train_loss": -21.031301498413086, "global_step": 74486, "epoch": 897} {"train_loss": -21.31459617614746, "global_step": 74487, "epoch": 897} {"train_loss": -21.01521873474121, "global_step": 74488, "epoch": 897} {"train_loss": -20.73573875427246, "global_step": 74489, "epoch": 897} {"train_loss": -21.3475284576416, "global_step": 74490, "epoch": 897} {"train_loss": -21.09718132019043, "global_step": 74491, "epoch": 897} {"train_loss": -21.1143856048584, "global_step": 74492, "epoch": 897} {"train_loss": -21.3280086517334, "global_step": 74493, "epoch": 897} {"train_loss": -20.832197189331055, "global_step": 74494, "epoch": 897} {"train_loss": -21.18938636779785, "global_step": 74495, "epoch": 897} {"train_loss": -20.65913963317871, "global_step": 74496, "epoch": 897} {"train_loss": -21.145767211914062, "global_step": 74497, "epoch": 897} {"train_loss": -20.8214168548584, "global_step": 74498, "epoch": 897} {"train_loss": -21.22317886352539, "global_step": 74499, "epoch": 897} {"train_loss": -20.97859001159668, "global_step": 74500, "epoch": 897} {"train_loss": -20.826086044311523, "global_step": 74501, "epoch": 897} {"train_loss": -21.111682891845703, "global_step": 74502, "epoch": 897} {"train_loss": -21.157962799072266, "global_step": 74503, "epoch": 897} {"train_loss": -21.091703414916992, "global_step": 74504, "epoch": 897} {"train_loss": -21.139591217041016, "global_step": 74505, "epoch": 897} {"train_loss": -21.09212303161621, "global_step": 74506, "epoch": 897} {"train_loss": -21.23444938659668, "global_step": 74507, "epoch": 897} {"train_loss": -20.824548721313477, "global_step": 74508, "epoch": 897} {"train_loss": -21.026540756225586, "global_step": 74509, "epoch": 897} {"train_loss": -21.219816207885742, "global_step": 74510, "epoch": 897} {"train_loss": -20.51896095275879, "global_step": 74511, "epoch": 897} {"train_loss": -20.86158561706543, "global_step": 74512, "epoch": 897} {"train_loss": -21.1307430267334, "global_step": 74513, "epoch": 897} {"train_loss": -20.82900047302246, "global_step": 74514, "epoch": 897} {"train_loss": -21.189544677734375, "global_step": 74515, "epoch": 897} {"train_loss": -20.997726440429688, "global_step": 74516, "epoch": 897} {"train_loss": -21.39693260192871, "global_step": 74517, "epoch": 897} {"train_loss": -20.93501853942871, "global_step": 74518, "epoch": 897} {"train_loss": -20.776065826416016, "global_step": 74519, "epoch": 897} {"train_loss": -21.070661544799805, "global_step": 74520, "epoch": 897} {"train_loss": -21.29766082763672, "global_step": 74521, "epoch": 897} {"train_loss": -20.62776756286621, "global_step": 74522, "epoch": 897} {"train_loss": -21.149227142333984, "global_step": 74523, "epoch": 897} {"train_loss": -20.940900802612305, "global_step": 74524, "epoch": 897} {"train_loss": -20.83510398864746, "global_step": 74525, "epoch": 897} {"train_loss": -21.254518508911133, "global_step": 74526, "epoch": 897} {"train_loss": -20.923948287963867, "global_step": 74527, "epoch": 897} {"train_loss": -20.87776756286621, "global_step": 74528, "epoch": 897} {"train_loss": -20.78449821472168, "global_step": 74529, "epoch": 897} {"train_loss": -21.09316062927246, "global_step": 74530, "epoch": 897} {"train_loss": -21.081892013549805, "global_step": 74531, "epoch": 897} {"train_loss": -20.868757247924805, "global_step": 74532, "epoch": 897} {"train_loss": -20.9618435595409, "global_step": 74533, "epoch": 897, "val_loss": 6154373.0} {"train_loss": -20.4366512298584, "global_step": 74534, "epoch": 898} {"train_loss": -19.648529052734375, "global_step": 74535, "epoch": 898} {"train_loss": -20.737668991088867, "global_step": 74536, "epoch": 898} {"train_loss": -20.64906883239746, "global_step": 74537, "epoch": 898} {"train_loss": -20.914087295532227, "global_step": 74538, "epoch": 898} {"train_loss": -20.864416122436523, "global_step": 74539, "epoch": 898} {"train_loss": -20.282352447509766, "global_step": 74540, "epoch": 898} {"train_loss": -20.726478576660156, "global_step": 74541, "epoch": 898} {"train_loss": -20.62493133544922, "global_step": 74542, "epoch": 898} {"train_loss": -20.810937881469727, "global_step": 74543, "epoch": 898} {"train_loss": -20.69861602783203, "global_step": 74544, "epoch": 898} {"train_loss": -20.9075984954834, "global_step": 74545, "epoch": 898} {"train_loss": -20.440412521362305, "global_step": 74546, "epoch": 898} {"train_loss": -20.501272201538086, "global_step": 74547, "epoch": 898} {"train_loss": -20.884252548217773, "global_step": 74548, "epoch": 898} {"train_loss": -20.840927124023438, "global_step": 74549, "epoch": 898} {"train_loss": -20.899017333984375, "global_step": 74550, "epoch": 898} {"train_loss": -20.988218307495117, "global_step": 74551, "epoch": 898} {"train_loss": -20.976131439208984, "global_step": 74552, "epoch": 898} {"train_loss": -20.798105239868164, "global_step": 74553, "epoch": 898} {"train_loss": -21.038755416870117, "global_step": 74554, "epoch": 898} {"train_loss": -20.592676162719727, "global_step": 74555, "epoch": 898} {"train_loss": -20.992782592773438, "global_step": 74556, "epoch": 898} {"train_loss": -21.114240646362305, "global_step": 74557, "epoch": 898} {"train_loss": -21.098005294799805, "global_step": 74558, "epoch": 898} {"train_loss": -21.031330108642578, "global_step": 74559, "epoch": 898} {"train_loss": -20.984872817993164, "global_step": 74560, "epoch": 898} {"train_loss": -21.0769100189209, "global_step": 74561, "epoch": 898} {"train_loss": -21.066587448120117, "global_step": 74562, "epoch": 898} {"train_loss": -20.756540298461914, "global_step": 74563, "epoch": 898} {"train_loss": -20.930891036987305, "global_step": 74564, "epoch": 898} {"train_loss": -21.214521408081055, "global_step": 74565, "epoch": 898} {"train_loss": -20.85609245300293, "global_step": 74566, "epoch": 898} {"train_loss": -20.8775691986084, "global_step": 74567, "epoch": 898} {"train_loss": -20.913923263549805, "global_step": 74568, "epoch": 898} {"train_loss": -21.223581314086914, "global_step": 74569, "epoch": 898} {"train_loss": -20.79155731201172, "global_step": 74570, "epoch": 898} {"train_loss": -20.92955207824707, "global_step": 74571, "epoch": 898} {"train_loss": -21.363183975219727, "global_step": 74572, "epoch": 898} {"train_loss": -20.947912216186523, "global_step": 74573, "epoch": 898} {"train_loss": -21.249582290649414, "global_step": 74574, "epoch": 898} {"train_loss": -21.26235008239746, "global_step": 74575, "epoch": 898} {"train_loss": -21.002511978149414, "global_step": 74576, "epoch": 898} {"train_loss": -21.03085708618164, "global_step": 74577, "epoch": 898} {"train_loss": -21.031837463378906, "global_step": 74578, "epoch": 898} {"train_loss": -21.2463321685791, "global_step": 74579, "epoch": 898} {"train_loss": -20.843847274780273, "global_step": 74580, "epoch": 898} {"train_loss": -21.45258903503418, "global_step": 74581, "epoch": 898} {"train_loss": -20.61530876159668, "global_step": 74582, "epoch": 898} {"train_loss": -20.603891372680664, "global_step": 74583, "epoch": 898} {"train_loss": -21.41446304321289, "global_step": 74584, "epoch": 898} {"train_loss": -20.49639892578125, "global_step": 74585, "epoch": 898} {"train_loss": -20.89826774597168, "global_step": 74586, "epoch": 898} {"train_loss": -21.234027862548828, "global_step": 74587, "epoch": 898} {"train_loss": -20.6523380279541, "global_step": 74588, "epoch": 898} {"train_loss": -20.98579216003418, "global_step": 74589, "epoch": 898} {"train_loss": -20.882566452026367, "global_step": 74590, "epoch": 898} {"train_loss": -21.068235397338867, "global_step": 74591, "epoch": 898} {"train_loss": -21.033889770507812, "global_step": 74592, "epoch": 898} {"train_loss": -21.094141006469727, "global_step": 74593, "epoch": 898} {"train_loss": -21.533695220947266, "global_step": 74594, "epoch": 898} {"train_loss": -20.873310089111328, "global_step": 74595, "epoch": 898} {"train_loss": -20.977258682250977, "global_step": 74596, "epoch": 898} {"train_loss": -20.906410217285156, "global_step": 74597, "epoch": 898} {"train_loss": -21.104795455932617, "global_step": 74598, "epoch": 898} {"train_loss": -20.925825119018555, "global_step": 74599, "epoch": 898} {"train_loss": -20.806196212768555, "global_step": 74600, "epoch": 898} {"train_loss": -20.76250457763672, "global_step": 74601, "epoch": 898} {"train_loss": -21.727798461914062, "global_step": 74602, "epoch": 898} {"train_loss": -21.02313804626465, "global_step": 74603, "epoch": 898} {"train_loss": -20.87094497680664, "global_step": 74604, "epoch": 898} {"train_loss": -20.91010093688965, "global_step": 74605, "epoch": 898} {"train_loss": -21.029890060424805, "global_step": 74606, "epoch": 898} {"train_loss": -21.005834579467773, "global_step": 74607, "epoch": 898} {"train_loss": -20.63492202758789, "global_step": 74608, "epoch": 898} {"train_loss": -21.047122955322266, "global_step": 74609, "epoch": 898} {"train_loss": -20.839933395385742, "global_step": 74610, "epoch": 898} {"train_loss": -21.0579833984375, "global_step": 74611, "epoch": 898} {"train_loss": -20.820093154907227, "global_step": 74612, "epoch": 898} {"train_loss": -20.646299362182617, "global_step": 74613, "epoch": 898} {"train_loss": -21.098676681518555, "global_step": 74614, "epoch": 898} {"train_loss": -20.794496536254883, "global_step": 74615, "epoch": 898} {"train_loss": -20.90428306395749, "global_step": 74616, "epoch": 898, "val_loss": 5976798.0} {"train_loss": -20.51732635498047, "global_step": 74617, "epoch": 899} {"train_loss": -20.863569259643555, "global_step": 74618, "epoch": 899} {"train_loss": -20.33185386657715, "global_step": 74619, "epoch": 899} {"train_loss": -21.05684471130371, "global_step": 74620, "epoch": 899} {"train_loss": -20.492856979370117, "global_step": 74621, "epoch": 899} {"train_loss": -20.733686447143555, "global_step": 74622, "epoch": 899} {"train_loss": -20.48160743713379, "global_step": 74623, "epoch": 899} {"train_loss": -20.5498046875, "global_step": 74624, "epoch": 899} {"train_loss": -20.936925888061523, "global_step": 74625, "epoch": 899} {"train_loss": -20.871076583862305, "global_step": 74626, "epoch": 899} {"train_loss": -20.5892276763916, "global_step": 74627, "epoch": 899} {"train_loss": -20.630512237548828, "global_step": 74628, "epoch": 899} {"train_loss": -21.214462280273438, "global_step": 74629, "epoch": 899} {"train_loss": -20.68967056274414, "global_step": 74630, "epoch": 899} {"train_loss": -20.733455657958984, "global_step": 74631, "epoch": 899} {"train_loss": -21.407535552978516, "global_step": 74632, "epoch": 899} {"train_loss": -20.8787784576416, "global_step": 74633, "epoch": 899} {"train_loss": -20.381271362304688, "global_step": 74634, "epoch": 899} {"train_loss": -20.586246490478516, "global_step": 74635, "epoch": 899} {"train_loss": -21.23843765258789, "global_step": 74636, "epoch": 899} {"train_loss": -20.787229537963867, "global_step": 74637, "epoch": 899} {"train_loss": -20.709890365600586, "global_step": 74638, "epoch": 899} {"train_loss": -20.52182388305664, "global_step": 74639, "epoch": 899} {"train_loss": -20.516462326049805, "global_step": 74640, "epoch": 899} {"train_loss": -20.559568405151367, "global_step": 74641, "epoch": 899} {"train_loss": -21.04010581970215, "global_step": 74642, "epoch": 899} {"train_loss": -20.999496459960938, "global_step": 74643, "epoch": 899} {"train_loss": -20.892505645751953, "global_step": 74644, "epoch": 899} {"train_loss": -20.721515655517578, "global_step": 74645, "epoch": 899} {"train_loss": -20.967418670654297, "global_step": 74646, "epoch": 899} {"train_loss": -21.002424240112305, "global_step": 74647, "epoch": 899} {"train_loss": -20.727413177490234, "global_step": 74648, "epoch": 899} {"train_loss": -20.950450897216797, "global_step": 74649, "epoch": 899} {"train_loss": -21.224781036376953, "global_step": 74650, "epoch": 899} {"train_loss": -20.931808471679688, "global_step": 74651, "epoch": 899} {"train_loss": -20.921735763549805, "global_step": 74652, "epoch": 899} {"train_loss": -21.1035213470459, "global_step": 74653, "epoch": 899} {"train_loss": -20.671613693237305, "global_step": 74654, "epoch": 899} {"train_loss": -20.973846435546875, "global_step": 74655, "epoch": 899} {"train_loss": -21.077835083007812, "global_step": 74656, "epoch": 899} {"train_loss": -20.768857955932617, "global_step": 74657, "epoch": 899} {"train_loss": -20.903684616088867, "global_step": 74658, "epoch": 899} {"train_loss": -21.205982208251953, "global_step": 74659, "epoch": 899} {"train_loss": -21.39208984375, "global_step": 74660, "epoch": 899} {"train_loss": -21.088693618774414, "global_step": 74661, "epoch": 899} {"train_loss": -21.085336685180664, "global_step": 74662, "epoch": 899} {"train_loss": -20.980390548706055, "global_step": 74663, "epoch": 899} {"train_loss": -20.935049057006836, "global_step": 74664, "epoch": 899} {"train_loss": -21.231321334838867, "global_step": 74665, "epoch": 899} {"train_loss": -20.889720916748047, "global_step": 74666, "epoch": 899} {"train_loss": -20.818578720092773, "global_step": 74667, "epoch": 899} {"train_loss": -21.156436920166016, "global_step": 74668, "epoch": 899} {"train_loss": -21.146677017211914, "global_step": 74669, "epoch": 899} {"train_loss": -21.05568504333496, "global_step": 74670, "epoch": 899} {"train_loss": -21.11579704284668, "global_step": 74671, "epoch": 899} {"train_loss": -21.473840713500977, "global_step": 74672, "epoch": 899} {"train_loss": -20.94948387145996, "global_step": 74673, "epoch": 899} {"train_loss": -20.94679832458496, "global_step": 74674, "epoch": 899} {"train_loss": -21.268585205078125, "global_step": 74675, "epoch": 899} {"train_loss": -21.423704147338867, "global_step": 74676, "epoch": 899} {"train_loss": -21.172229766845703, "global_step": 74677, "epoch": 899} {"train_loss": -21.2352352142334, "global_step": 74678, "epoch": 899} {"train_loss": -21.053190231323242, "global_step": 74679, "epoch": 899} {"train_loss": -20.77748680114746, "global_step": 74680, "epoch": 899} {"train_loss": -21.112714767456055, "global_step": 74681, "epoch": 899} {"train_loss": -20.958791732788086, "global_step": 74682, "epoch": 899} {"train_loss": -20.927762985229492, "global_step": 74683, "epoch": 899} {"train_loss": -21.154857635498047, "global_step": 74684, "epoch": 899} {"train_loss": -21.017288208007812, "global_step": 74685, "epoch": 899} {"train_loss": -20.991514205932617, "global_step": 74686, "epoch": 899} {"train_loss": -21.034311294555664, "global_step": 74687, "epoch": 899} {"train_loss": -20.92901039123535, "global_step": 74688, "epoch": 899} {"train_loss": -20.512081146240234, "global_step": 74689, "epoch": 899} {"train_loss": -20.919599533081055, "global_step": 74690, "epoch": 899} {"train_loss": -20.848142623901367, "global_step": 74691, "epoch": 899} {"train_loss": -20.822172164916992, "global_step": 74692, "epoch": 899} {"train_loss": -21.245580673217773, "global_step": 74693, "epoch": 899} {"train_loss": -20.744373321533203, "global_step": 74694, "epoch": 899} {"train_loss": -21.54244041442871, "global_step": 74695, "epoch": 899} {"train_loss": -21.182159423828125, "global_step": 74696, "epoch": 899} {"train_loss": -20.977680206298828, "global_step": 74697, "epoch": 899} {"train_loss": -20.888843536376953, "global_step": 74698, "epoch": 899} {"train_loss": -20.924768034234106, "global_step": 74699, "epoch": 899, "val_loss": 6019714.5} {"train_loss": -21.05368995666504, "global_step": 74700, "epoch": 900} {"train_loss": -20.993179321289062, "global_step": 74701, "epoch": 900} {"train_loss": -20.91012954711914, "global_step": 74702, "epoch": 900} {"train_loss": -20.87027931213379, "global_step": 74703, "epoch": 900} {"train_loss": -20.960359573364258, "global_step": 74704, "epoch": 900} {"train_loss": -21.030834197998047, "global_step": 74705, "epoch": 900} {"train_loss": -20.931907653808594, "global_step": 74706, "epoch": 900} {"train_loss": -21.051715850830078, "global_step": 74707, "epoch": 900} {"train_loss": -21.089651107788086, "global_step": 74708, "epoch": 900} {"train_loss": -20.8701229095459, "global_step": 74709, "epoch": 900} {"train_loss": -20.789670944213867, "global_step": 74710, "epoch": 900} {"train_loss": -21.252674102783203, "global_step": 74711, "epoch": 900} {"train_loss": -20.797887802124023, "global_step": 74712, "epoch": 900} {"train_loss": -20.979461669921875, "global_step": 74713, "epoch": 900} {"train_loss": -21.01446533203125, "global_step": 74714, "epoch": 900} {"train_loss": -20.92095375061035, "global_step": 74715, "epoch": 900} {"train_loss": -21.101318359375, "global_step": 74716, "epoch": 900} {"train_loss": -20.661651611328125, "global_step": 74717, "epoch": 900} {"train_loss": -20.977392196655273, "global_step": 74718, "epoch": 900} {"train_loss": -20.955322265625, "global_step": 74719, "epoch": 900} {"train_loss": -21.089757919311523, "global_step": 74720, "epoch": 900} {"train_loss": -20.78337287902832, "global_step": 74721, "epoch": 900} {"train_loss": -20.972543716430664, "global_step": 74722, "epoch": 900} {"train_loss": -21.0660457611084, "global_step": 74723, "epoch": 900} {"train_loss": -21.129547119140625, "global_step": 74724, "epoch": 900} {"train_loss": -21.02789878845215, "global_step": 74725, "epoch": 900} {"train_loss": -21.031105041503906, "global_step": 74726, "epoch": 900} {"train_loss": -20.711462020874023, "global_step": 74727, "epoch": 900} {"train_loss": -21.152219772338867, "global_step": 74728, "epoch": 900} {"train_loss": -21.06325340270996, "global_step": 74729, "epoch": 900} {"train_loss": -20.869291305541992, "global_step": 74730, "epoch": 900} {"train_loss": -20.9439697265625, "global_step": 74731, "epoch": 900} {"train_loss": -21.037670135498047, "global_step": 74732, "epoch": 900} {"train_loss": -21.01930046081543, "global_step": 74733, "epoch": 900} {"train_loss": -21.23628807067871, "global_step": 74734, "epoch": 900} {"train_loss": -20.744260787963867, "global_step": 74735, "epoch": 900} {"train_loss": -20.56678009033203, "global_step": 74736, "epoch": 900} {"train_loss": -20.651708602905273, "global_step": 74737, "epoch": 900} {"train_loss": -21.143985748291016, "global_step": 74738, "epoch": 900} {"train_loss": -20.92574119567871, "global_step": 74739, "epoch": 900} {"train_loss": -21.20779800415039, "global_step": 74740, "epoch": 900} {"train_loss": -21.091115951538086, "global_step": 74741, "epoch": 900} {"train_loss": -20.827056884765625, "global_step": 74742, "epoch": 900} {"train_loss": -20.996585845947266, "global_step": 74743, "epoch": 900} {"train_loss": -21.098926544189453, "global_step": 74744, "epoch": 900} {"train_loss": -20.868391036987305, "global_step": 74745, "epoch": 900} {"train_loss": -21.13868522644043, "global_step": 74746, "epoch": 900} {"train_loss": -21.20920753479004, "global_step": 74747, "epoch": 900} {"train_loss": -21.046445846557617, "global_step": 74748, "epoch": 900} {"train_loss": -21.316572189331055, "global_step": 74749, "epoch": 900} {"train_loss": -21.034177780151367, "global_step": 74750, "epoch": 900} {"train_loss": -20.987144470214844, "global_step": 74751, "epoch": 900} {"train_loss": -20.992416381835938, "global_step": 74752, "epoch": 900} {"train_loss": -21.118196487426758, "global_step": 74753, "epoch": 900} {"train_loss": -21.30933952331543, "global_step": 74754, "epoch": 900} {"train_loss": -20.997587203979492, "global_step": 74755, "epoch": 900} {"train_loss": -20.828636169433594, "global_step": 74756, "epoch": 900} {"train_loss": -20.76898765563965, "global_step": 74757, "epoch": 900} {"train_loss": -20.939208984375, "global_step": 74758, "epoch": 900} {"train_loss": -20.893835067749023, "global_step": 74759, "epoch": 900} {"train_loss": -21.18052864074707, "global_step": 74760, "epoch": 900} {"train_loss": -21.269187927246094, "global_step": 74761, "epoch": 900} {"train_loss": -21.027677536010742, "global_step": 74762, "epoch": 900} {"train_loss": -20.621545791625977, "global_step": 74763, "epoch": 900} {"train_loss": -21.204160690307617, "global_step": 74764, "epoch": 900} {"train_loss": -21.18995475769043, "global_step": 74765, "epoch": 900} {"train_loss": -21.01600456237793, "global_step": 74766, "epoch": 900} {"train_loss": -20.910078048706055, "global_step": 74767, "epoch": 900} {"train_loss": -20.930561065673828, "global_step": 74768, "epoch": 900} {"train_loss": -20.40106964111328, "global_step": 74769, "epoch": 900} {"train_loss": -20.66046905517578, "global_step": 74770, "epoch": 900} {"train_loss": -20.98823356628418, "global_step": 74771, "epoch": 900} {"train_loss": -21.09186363220215, "global_step": 74772, "epoch": 900} {"train_loss": -21.09966468811035, "global_step": 74773, "epoch": 900} {"train_loss": -21.03919792175293, "global_step": 74774, "epoch": 900} {"train_loss": -20.430849075317383, "global_step": 74775, "epoch": 900} {"train_loss": -21.155853271484375, "global_step": 74776, "epoch": 900} {"train_loss": -20.906208038330078, "global_step": 74777, "epoch": 900} {"train_loss": -20.4949893951416, "global_step": 74778, "epoch": 900} {"train_loss": -21.17249870300293, "global_step": 74779, "epoch": 900} {"train_loss": -21.165868759155273, "global_step": 74780, "epoch": 900} {"train_loss": -20.8740234375, "global_step": 74781, "epoch": 900} {"train_loss": -20.965019478855364, "global_step": 74782, "epoch": 900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6084892.0} {"train_loss": -20.365453720092773, "global_step": 74783, "epoch": 901} {"train_loss": -20.85041618347168, "global_step": 74784, "epoch": 901} {"train_loss": -20.20467185974121, "global_step": 74785, "epoch": 901} {"train_loss": -20.53632164001465, "global_step": 74786, "epoch": 901} {"train_loss": -20.31892967224121, "global_step": 74787, "epoch": 901} {"train_loss": -20.50885009765625, "global_step": 74788, "epoch": 901} {"train_loss": -20.81277084350586, "global_step": 74789, "epoch": 901} {"train_loss": -20.64397430419922, "global_step": 74790, "epoch": 901} {"train_loss": -20.800189971923828, "global_step": 74791, "epoch": 901} {"train_loss": -20.727136611938477, "global_step": 74792, "epoch": 901} {"train_loss": -20.507436752319336, "global_step": 74793, "epoch": 901} {"train_loss": -20.412273406982422, "global_step": 74794, "epoch": 901} {"train_loss": -21.185134887695312, "global_step": 74795, "epoch": 901} {"train_loss": -20.939573287963867, "global_step": 74796, "epoch": 901} {"train_loss": -20.876495361328125, "global_step": 74797, "epoch": 901} {"train_loss": -21.109216690063477, "global_step": 74798, "epoch": 901} {"train_loss": -21.025745391845703, "global_step": 74799, "epoch": 901} {"train_loss": -20.823978424072266, "global_step": 74800, "epoch": 901} {"train_loss": -21.07806396484375, "global_step": 74801, "epoch": 901} {"train_loss": -21.176687240600586, "global_step": 74802, "epoch": 901} {"train_loss": -21.2315616607666, "global_step": 74803, "epoch": 901} {"train_loss": -20.880273818969727, "global_step": 74804, "epoch": 901} {"train_loss": -21.001739501953125, "global_step": 74805, "epoch": 901} {"train_loss": -20.858484268188477, "global_step": 74806, "epoch": 901} {"train_loss": -20.827768325805664, "global_step": 74807, "epoch": 901} {"train_loss": -20.95372772216797, "global_step": 74808, "epoch": 901} {"train_loss": -20.855947494506836, "global_step": 74809, "epoch": 901} {"train_loss": -21.023109436035156, "global_step": 74810, "epoch": 901} {"train_loss": -20.77350616455078, "global_step": 74811, "epoch": 901} {"train_loss": -21.138341903686523, "global_step": 74812, "epoch": 901} {"train_loss": -21.0658016204834, "global_step": 74813, "epoch": 901} {"train_loss": -20.710498809814453, "global_step": 74814, "epoch": 901} {"train_loss": -20.85359764099121, "global_step": 74815, "epoch": 901} {"train_loss": -21.01606559753418, "global_step": 74816, "epoch": 901} {"train_loss": -20.941831588745117, "global_step": 74817, "epoch": 901} {"train_loss": -20.990882873535156, "global_step": 74818, "epoch": 901} {"train_loss": -20.635242462158203, "global_step": 74819, "epoch": 901} {"train_loss": -20.899076461791992, "global_step": 74820, "epoch": 901} {"train_loss": -20.634571075439453, "global_step": 74821, "epoch": 901} {"train_loss": -20.45890235900879, "global_step": 74822, "epoch": 901} {"train_loss": -21.190994262695312, "global_step": 74823, "epoch": 901} {"train_loss": -20.93231201171875, "global_step": 74824, "epoch": 901} {"train_loss": -20.853609085083008, "global_step": 74825, "epoch": 901} {"train_loss": -21.029834747314453, "global_step": 74826, "epoch": 901} {"train_loss": -21.084026336669922, "global_step": 74827, "epoch": 901} {"train_loss": -21.21780776977539, "global_step": 74828, "epoch": 901} {"train_loss": -21.122364044189453, "global_step": 74829, "epoch": 901} {"train_loss": -20.884300231933594, "global_step": 74830, "epoch": 901} {"train_loss": -21.078414916992188, "global_step": 74831, "epoch": 901} {"train_loss": -21.021329879760742, "global_step": 74832, "epoch": 901} {"train_loss": -21.060102462768555, "global_step": 74833, "epoch": 901} {"train_loss": -21.105981826782227, "global_step": 74834, "epoch": 901} {"train_loss": -20.971921920776367, "global_step": 74835, "epoch": 901} {"train_loss": -20.767852783203125, "global_step": 74836, "epoch": 901} {"train_loss": -20.80191993713379, "global_step": 74837, "epoch": 901} {"train_loss": -21.27680778503418, "global_step": 74838, "epoch": 901} {"train_loss": -20.903974533081055, "global_step": 74839, "epoch": 901} {"train_loss": -20.95686149597168, "global_step": 74840, "epoch": 901} {"train_loss": -21.230560302734375, "global_step": 74841, "epoch": 901} {"train_loss": -21.106645584106445, "global_step": 74842, "epoch": 901} {"train_loss": -21.194793701171875, "global_step": 74843, "epoch": 901} {"train_loss": -20.804601669311523, "global_step": 74844, "epoch": 901} {"train_loss": -20.8729248046875, "global_step": 74845, "epoch": 901} {"train_loss": -21.088682174682617, "global_step": 74846, "epoch": 901} {"train_loss": -20.69963836669922, "global_step": 74847, "epoch": 901} {"train_loss": -20.917320251464844, "global_step": 74848, "epoch": 901} {"train_loss": -21.206192016601562, "global_step": 74849, "epoch": 901} {"train_loss": -20.977441787719727, "global_step": 74850, "epoch": 901} {"train_loss": -20.741222381591797, "global_step": 74851, "epoch": 901} {"train_loss": -21.03155517578125, "global_step": 74852, "epoch": 901} {"train_loss": -21.24234962463379, "global_step": 74853, "epoch": 901} {"train_loss": -20.90205192565918, "global_step": 74854, "epoch": 901} {"train_loss": -20.9411678314209, "global_step": 74855, "epoch": 901} {"train_loss": -21.22210693359375, "global_step": 74856, "epoch": 901} {"train_loss": -21.484296798706055, "global_step": 74857, "epoch": 901} {"train_loss": -20.78757095336914, "global_step": 74858, "epoch": 901} {"train_loss": -20.74144172668457, "global_step": 74859, "epoch": 901} {"train_loss": -21.10114860534668, "global_step": 74860, "epoch": 901} {"train_loss": -21.288131713867188, "global_step": 74861, "epoch": 901} {"train_loss": -21.157133102416992, "global_step": 74862, "epoch": 901} {"train_loss": -21.159564971923828, "global_step": 74863, "epoch": 901} {"train_loss": -21.02658462524414, "global_step": 74864, "epoch": 901} {"train_loss": -20.92126391307417, "global_step": 74865, "epoch": 901, "val_loss": 5901338.5} {"train_loss": -20.599266052246094, "global_step": 74866, "epoch": 902} {"train_loss": -21.0025691986084, "global_step": 74867, "epoch": 902} {"train_loss": -20.28632926940918, "global_step": 74868, "epoch": 902} {"train_loss": -21.023401260375977, "global_step": 74869, "epoch": 902} {"train_loss": -20.575193405151367, "global_step": 74870, "epoch": 902} {"train_loss": -20.6035099029541, "global_step": 74871, "epoch": 902} {"train_loss": -21.107152938842773, "global_step": 74872, "epoch": 902} {"train_loss": -20.6662654876709, "global_step": 74873, "epoch": 902} {"train_loss": -20.689884185791016, "global_step": 74874, "epoch": 902} {"train_loss": -21.09478759765625, "global_step": 74875, "epoch": 902} {"train_loss": -20.38197898864746, "global_step": 74876, "epoch": 902} {"train_loss": -20.681806564331055, "global_step": 74877, "epoch": 902} {"train_loss": -20.620817184448242, "global_step": 74878, "epoch": 902} {"train_loss": -20.741619110107422, "global_step": 74879, "epoch": 902} {"train_loss": -20.884916305541992, "global_step": 74880, "epoch": 902} {"train_loss": -20.99944496154785, "global_step": 74881, "epoch": 902} {"train_loss": -21.167266845703125, "global_step": 74882, "epoch": 902} {"train_loss": -21.053424835205078, "global_step": 74883, "epoch": 902} {"train_loss": -20.961957931518555, "global_step": 74884, "epoch": 902} {"train_loss": -20.995624542236328, "global_step": 74885, "epoch": 902} {"train_loss": -21.318994522094727, "global_step": 74886, "epoch": 902} {"train_loss": -21.019662857055664, "global_step": 74887, "epoch": 902} {"train_loss": -20.815725326538086, "global_step": 74888, "epoch": 902} {"train_loss": -20.782093048095703, "global_step": 74889, "epoch": 902} {"train_loss": -20.931304931640625, "global_step": 74890, "epoch": 902} {"train_loss": -21.142032623291016, "global_step": 74891, "epoch": 902} {"train_loss": -20.98801040649414, "global_step": 74892, "epoch": 902} {"train_loss": -20.9879207611084, "global_step": 74893, "epoch": 902} {"train_loss": -21.270645141601562, "global_step": 74894, "epoch": 902} {"train_loss": -21.218494415283203, "global_step": 74895, "epoch": 902} {"train_loss": -21.716665267944336, "global_step": 74896, "epoch": 902} {"train_loss": -20.918804168701172, "global_step": 74897, "epoch": 902} {"train_loss": -20.89621925354004, "global_step": 74898, "epoch": 902} {"train_loss": -21.078367233276367, "global_step": 74899, "epoch": 902} {"train_loss": -21.38429832458496, "global_step": 74900, "epoch": 902} {"train_loss": -21.027193069458008, "global_step": 74901, "epoch": 902} {"train_loss": -20.939355850219727, "global_step": 74902, "epoch": 902} {"train_loss": -20.782718658447266, "global_step": 74903, "epoch": 902} {"train_loss": -21.43642807006836, "global_step": 74904, "epoch": 902} {"train_loss": -21.0288143157959, "global_step": 74905, "epoch": 902} {"train_loss": -21.010772705078125, "global_step": 74906, "epoch": 902} {"train_loss": -21.130334854125977, "global_step": 74907, "epoch": 902} {"train_loss": -21.02461814880371, "global_step": 74908, "epoch": 902} {"train_loss": -20.8671932220459, "global_step": 74909, "epoch": 902} {"train_loss": -21.37262535095215, "global_step": 74910, "epoch": 902} {"train_loss": -20.923925399780273, "global_step": 74911, "epoch": 902} {"train_loss": -20.346006393432617, "global_step": 74912, "epoch": 902} {"train_loss": -20.736251831054688, "global_step": 74913, "epoch": 902} {"train_loss": -21.11629295349121, "global_step": 74914, "epoch": 902} {"train_loss": -21.156278610229492, "global_step": 74915, "epoch": 902} {"train_loss": -20.744403839111328, "global_step": 74916, "epoch": 902} {"train_loss": -21.374998092651367, "global_step": 74917, "epoch": 902} {"train_loss": -21.14472198486328, "global_step": 74918, "epoch": 902} {"train_loss": -21.200916290283203, "global_step": 74919, "epoch": 902} {"train_loss": -21.30830955505371, "global_step": 74920, "epoch": 902} {"train_loss": -21.248655319213867, "global_step": 74921, "epoch": 902} {"train_loss": -20.803747177124023, "global_step": 74922, "epoch": 902} {"train_loss": -20.978824615478516, "global_step": 74923, "epoch": 902} {"train_loss": -20.85907554626465, "global_step": 74924, "epoch": 902} {"train_loss": -21.049238204956055, "global_step": 74925, "epoch": 902} {"train_loss": -21.131061553955078, "global_step": 74926, "epoch": 902} {"train_loss": -21.023113250732422, "global_step": 74927, "epoch": 902} {"train_loss": -21.23196792602539, "global_step": 74928, "epoch": 902} {"train_loss": -20.963865280151367, "global_step": 74929, "epoch": 902} {"train_loss": -20.750843048095703, "global_step": 74930, "epoch": 902} {"train_loss": -21.320959091186523, "global_step": 74931, "epoch": 902} {"train_loss": -21.095876693725586, "global_step": 74932, "epoch": 902} {"train_loss": -20.884017944335938, "global_step": 74933, "epoch": 902} {"train_loss": -21.28712272644043, "global_step": 74934, "epoch": 902} {"train_loss": -20.709165573120117, "global_step": 74935, "epoch": 902} {"train_loss": -21.32402992248535, "global_step": 74936, "epoch": 902} {"train_loss": -21.243133544921875, "global_step": 74937, "epoch": 902} {"train_loss": -21.08499526977539, "global_step": 74938, "epoch": 902} {"train_loss": -21.199615478515625, "global_step": 74939, "epoch": 902} {"train_loss": -21.062314987182617, "global_step": 74940, "epoch": 902} {"train_loss": -21.20245933532715, "global_step": 74941, "epoch": 902} {"train_loss": -20.744970321655273, "global_step": 74942, "epoch": 902} {"train_loss": -21.197900772094727, "global_step": 74943, "epoch": 902} {"train_loss": -20.9528751373291, "global_step": 74944, "epoch": 902} {"train_loss": -20.948026657104492, "global_step": 74945, "epoch": 902} {"train_loss": -21.09113121032715, "global_step": 74946, "epoch": 902} {"train_loss": -20.781116485595703, "global_step": 74947, "epoch": 902} {"train_loss": -20.9964072445789, "global_step": 74948, "epoch": 902, "val_loss": 6008303.0} {"train_loss": -20.982955932617188, "global_step": 74949, "epoch": 903} {"train_loss": -20.903432846069336, "global_step": 74950, "epoch": 903} {"train_loss": -20.88106918334961, "global_step": 74951, "epoch": 903} {"train_loss": -21.03983497619629, "global_step": 74952, "epoch": 903} {"train_loss": -20.74842643737793, "global_step": 74953, "epoch": 903} {"train_loss": -21.186330795288086, "global_step": 74954, "epoch": 903} {"train_loss": -20.76634979248047, "global_step": 74955, "epoch": 903} {"train_loss": -20.8690242767334, "global_step": 74956, "epoch": 903} {"train_loss": -20.789993286132812, "global_step": 74957, "epoch": 903} {"train_loss": -20.474702835083008, "global_step": 74958, "epoch": 903} {"train_loss": -20.493906021118164, "global_step": 74959, "epoch": 903} {"train_loss": -20.9185791015625, "global_step": 74960, "epoch": 903} {"train_loss": -20.680570602416992, "global_step": 74961, "epoch": 903} {"train_loss": -21.03484535217285, "global_step": 74962, "epoch": 903} {"train_loss": -21.20766258239746, "global_step": 74963, "epoch": 903} {"train_loss": -21.05634880065918, "global_step": 74964, "epoch": 903} {"train_loss": -20.968276977539062, "global_step": 74965, "epoch": 903} {"train_loss": -21.221683502197266, "global_step": 74966, "epoch": 903} {"train_loss": -21.137968063354492, "global_step": 74967, "epoch": 903} {"train_loss": -21.131847381591797, "global_step": 74968, "epoch": 903} {"train_loss": -20.854284286499023, "global_step": 74969, "epoch": 903} {"train_loss": -21.010465621948242, "global_step": 74970, "epoch": 903} {"train_loss": -20.80853271484375, "global_step": 74971, "epoch": 903} {"train_loss": -20.915205001831055, "global_step": 74972, "epoch": 903} {"train_loss": -20.85579490661621, "global_step": 74973, "epoch": 903} {"train_loss": -20.749900817871094, "global_step": 74974, "epoch": 903} {"train_loss": -21.103946685791016, "global_step": 74975, "epoch": 903} {"train_loss": -20.906208038330078, "global_step": 74976, "epoch": 903} {"train_loss": -20.71718406677246, "global_step": 74977, "epoch": 903} {"train_loss": -21.331945419311523, "global_step": 74978, "epoch": 903} {"train_loss": -20.862133026123047, "global_step": 74979, "epoch": 903} {"train_loss": -20.770214080810547, "global_step": 74980, "epoch": 903} {"train_loss": -20.7060604095459, "global_step": 74981, "epoch": 903} {"train_loss": -20.36471939086914, "global_step": 74982, "epoch": 903} {"train_loss": -21.439136505126953, "global_step": 74983, "epoch": 903} {"train_loss": -20.90358543395996, "global_step": 74984, "epoch": 903} {"train_loss": -20.994775772094727, "global_step": 74985, "epoch": 903} {"train_loss": -21.24181365966797, "global_step": 74986, "epoch": 903} {"train_loss": -20.962467193603516, "global_step": 74987, "epoch": 903} {"train_loss": -21.18974494934082, "global_step": 74988, "epoch": 903} {"train_loss": -20.986087799072266, "global_step": 74989, "epoch": 903} {"train_loss": -21.106369018554688, "global_step": 74990, "epoch": 903} {"train_loss": -20.826797485351562, "global_step": 74991, "epoch": 903} {"train_loss": -21.271244049072266, "global_step": 74992, "epoch": 903} {"train_loss": -21.04081916809082, "global_step": 74993, "epoch": 903} {"train_loss": -21.403905868530273, "global_step": 74994, "epoch": 903} {"train_loss": -21.032976150512695, "global_step": 74995, "epoch": 903} {"train_loss": -20.886449813842773, "global_step": 74996, "epoch": 903} {"train_loss": -20.992856979370117, "global_step": 74997, "epoch": 903} {"train_loss": -20.94002342224121, "global_step": 74998, "epoch": 903} {"train_loss": -20.80369758605957, "global_step": 74999, "epoch": 903} {"train_loss": -20.830595016479492, "global_step": 75000, "epoch": 903} {"train_loss": -21.0145206451416, "global_step": 75001, "epoch": 903} {"train_loss": -21.034366607666016, "global_step": 75002, "epoch": 903} {"train_loss": -20.918485641479492, "global_step": 75003, "epoch": 903} {"train_loss": -21.388765335083008, "global_step": 75004, "epoch": 903} {"train_loss": -20.719547271728516, "global_step": 75005, "epoch": 903} {"train_loss": -20.84987449645996, "global_step": 75006, "epoch": 903} {"train_loss": -20.912715911865234, "global_step": 75007, "epoch": 903} {"train_loss": -20.98396110534668, "global_step": 75008, "epoch": 903} {"train_loss": -21.435712814331055, "global_step": 75009, "epoch": 903} {"train_loss": -21.06264877319336, "global_step": 75010, "epoch": 903} {"train_loss": -21.114294052124023, "global_step": 75011, "epoch": 903} {"train_loss": -21.018779754638672, "global_step": 75012, "epoch": 903} {"train_loss": -21.264646530151367, "global_step": 75013, "epoch": 903} {"train_loss": -21.3839168548584, "global_step": 75014, "epoch": 903} {"train_loss": -20.771459579467773, "global_step": 75015, "epoch": 903} {"train_loss": -21.13714599609375, "global_step": 75016, "epoch": 903} {"train_loss": -21.112546920776367, "global_step": 75017, "epoch": 903} {"train_loss": -20.861989974975586, "global_step": 75018, "epoch": 903} {"train_loss": -20.835275650024414, "global_step": 75019, "epoch": 903} {"train_loss": -20.936960220336914, "global_step": 75020, "epoch": 903} {"train_loss": -20.931730270385742, "global_step": 75021, "epoch": 903} {"train_loss": -21.064220428466797, "global_step": 75022, "epoch": 903} {"train_loss": -21.055932998657227, "global_step": 75023, "epoch": 903} {"train_loss": -21.133798599243164, "global_step": 75024, "epoch": 903} {"train_loss": -21.67899513244629, "global_step": 75025, "epoch": 903} {"train_loss": -20.902408599853516, "global_step": 75026, "epoch": 903} {"train_loss": -20.869871139526367, "global_step": 75027, "epoch": 903} {"train_loss": -20.83393669128418, "global_step": 75028, "epoch": 903} {"train_loss": -20.941770553588867, "global_step": 75029, "epoch": 903} {"train_loss": -21.106679916381836, "global_step": 75030, "epoch": 903} {"train_loss": -20.983441548175122, "global_step": 75031, "epoch": 903, "val_loss": 6066942.5} {"train_loss": -20.78965950012207, "global_step": 75032, "epoch": 904} {"train_loss": -21.110740661621094, "global_step": 75033, "epoch": 904} {"train_loss": -21.041400909423828, "global_step": 75034, "epoch": 904} {"train_loss": -21.241010665893555, "global_step": 75035, "epoch": 904} {"train_loss": -20.82322120666504, "global_step": 75036, "epoch": 904} {"train_loss": -21.168338775634766, "global_step": 75037, "epoch": 904} {"train_loss": -20.939743041992188, "global_step": 75038, "epoch": 904} {"train_loss": -21.199724197387695, "global_step": 75039, "epoch": 904} {"train_loss": -21.00286865234375, "global_step": 75040, "epoch": 904} {"train_loss": -20.744840621948242, "global_step": 75041, "epoch": 904} {"train_loss": -20.871294021606445, "global_step": 75042, "epoch": 904} {"train_loss": -21.27058219909668, "global_step": 75043, "epoch": 904} {"train_loss": -21.01232147216797, "global_step": 75044, "epoch": 904} {"train_loss": -20.79244041442871, "global_step": 75045, "epoch": 904} {"train_loss": -20.681577682495117, "global_step": 75046, "epoch": 904} {"train_loss": -21.016454696655273, "global_step": 75047, "epoch": 904} {"train_loss": -21.119049072265625, "global_step": 75048, "epoch": 904} {"train_loss": -21.17768669128418, "global_step": 75049, "epoch": 904} {"train_loss": -20.653404235839844, "global_step": 75050, "epoch": 904} {"train_loss": -21.144113540649414, "global_step": 75051, "epoch": 904} {"train_loss": -21.32500457763672, "global_step": 75052, "epoch": 904} {"train_loss": -20.545791625976562, "global_step": 75053, "epoch": 904} {"train_loss": -20.656314849853516, "global_step": 75054, "epoch": 904} {"train_loss": -20.93033218383789, "global_step": 75055, "epoch": 904} {"train_loss": -21.01112937927246, "global_step": 75056, "epoch": 904} {"train_loss": -21.218915939331055, "global_step": 75057, "epoch": 904} {"train_loss": -20.97673988342285, "global_step": 75058, "epoch": 904} {"train_loss": -21.457639694213867, "global_step": 75059, "epoch": 904} {"train_loss": -21.160383224487305, "global_step": 75060, "epoch": 904} {"train_loss": -21.225400924682617, "global_step": 75061, "epoch": 904} {"train_loss": -21.28985595703125, "global_step": 75062, "epoch": 904} {"train_loss": -21.122798919677734, "global_step": 75063, "epoch": 904} {"train_loss": -21.256576538085938, "global_step": 75064, "epoch": 904} {"train_loss": -20.985933303833008, "global_step": 75065, "epoch": 904} {"train_loss": -20.904932022094727, "global_step": 75066, "epoch": 904} {"train_loss": -21.002548217773438, "global_step": 75067, "epoch": 904} {"train_loss": -21.28550148010254, "global_step": 75068, "epoch": 904} {"train_loss": -21.160268783569336, "global_step": 75069, "epoch": 904} {"train_loss": -21.322986602783203, "global_step": 75070, "epoch": 904} {"train_loss": -20.90382957458496, "global_step": 75071, "epoch": 904} {"train_loss": -20.874265670776367, "global_step": 75072, "epoch": 904} {"train_loss": -21.0841007232666, "global_step": 75073, "epoch": 904} {"train_loss": -21.303787231445312, "global_step": 75074, "epoch": 904} {"train_loss": -21.46886444091797, "global_step": 75075, "epoch": 904} {"train_loss": -20.92788314819336, "global_step": 75076, "epoch": 904} {"train_loss": -20.723459243774414, "global_step": 75077, "epoch": 904} {"train_loss": -20.805627822875977, "global_step": 75078, "epoch": 904} {"train_loss": -21.220243453979492, "global_step": 75079, "epoch": 904} {"train_loss": -21.19668197631836, "global_step": 75080, "epoch": 904} {"train_loss": -21.426790237426758, "global_step": 75081, "epoch": 904} {"train_loss": -20.980422973632812, "global_step": 75082, "epoch": 904} {"train_loss": -21.42095947265625, "global_step": 75083, "epoch": 904} {"train_loss": -20.952512741088867, "global_step": 75084, "epoch": 904} {"train_loss": -20.840240478515625, "global_step": 75085, "epoch": 904} {"train_loss": -20.722185134887695, "global_step": 75086, "epoch": 904} {"train_loss": -20.908884048461914, "global_step": 75087, "epoch": 904} {"train_loss": -20.982885360717773, "global_step": 75088, "epoch": 904} {"train_loss": -21.000883102416992, "global_step": 75089, "epoch": 904} {"train_loss": -21.180051803588867, "global_step": 75090, "epoch": 904} {"train_loss": -21.0382022857666, "global_step": 75091, "epoch": 904} {"train_loss": -21.190786361694336, "global_step": 75092, "epoch": 904} {"train_loss": -20.983991622924805, "global_step": 75093, "epoch": 904} {"train_loss": -21.11840057373047, "global_step": 75094, "epoch": 904} {"train_loss": -20.80878257751465, "global_step": 75095, "epoch": 904} {"train_loss": -20.61692237854004, "global_step": 75096, "epoch": 904} {"train_loss": -20.885282516479492, "global_step": 75097, "epoch": 904} {"train_loss": -20.954875946044922, "global_step": 75098, "epoch": 904} {"train_loss": -21.000720977783203, "global_step": 75099, "epoch": 904} {"train_loss": -21.307111740112305, "global_step": 75100, "epoch": 904} {"train_loss": -20.64143943786621, "global_step": 75101, "epoch": 904} {"train_loss": -20.814533233642578, "global_step": 75102, "epoch": 904} {"train_loss": -20.887426376342773, "global_step": 75103, "epoch": 904} {"train_loss": -21.192190170288086, "global_step": 75104, "epoch": 904} {"train_loss": -21.097578048706055, "global_step": 75105, "epoch": 904} {"train_loss": -20.939428329467773, "global_step": 75106, "epoch": 904} {"train_loss": -21.37759017944336, "global_step": 75107, "epoch": 904} {"train_loss": -21.408376693725586, "global_step": 75108, "epoch": 904} {"train_loss": -20.87458610534668, "global_step": 75109, "epoch": 904} {"train_loss": -20.901363372802734, "global_step": 75110, "epoch": 904} {"train_loss": -20.944068908691406, "global_step": 75111, "epoch": 904} {"train_loss": -20.65516471862793, "global_step": 75112, "epoch": 904} {"train_loss": -20.93235206604004, "global_step": 75113, "epoch": 904} {"train_loss": -21.023372029683674, "global_step": 75114, "epoch": 904, "val_loss": 5957805.5} {"train_loss": -20.35916519165039, "global_step": 75115, "epoch": 905} {"train_loss": -20.623252868652344, "global_step": 75116, "epoch": 905} {"train_loss": -20.22393035888672, "global_step": 75117, "epoch": 905} {"train_loss": -20.8216609954834, "global_step": 75118, "epoch": 905} {"train_loss": -20.72369384765625, "global_step": 75119, "epoch": 905} {"train_loss": -20.728097915649414, "global_step": 75120, "epoch": 905} {"train_loss": -20.397159576416016, "global_step": 75121, "epoch": 905} {"train_loss": -20.707853317260742, "global_step": 75122, "epoch": 905} {"train_loss": -20.630502700805664, "global_step": 75123, "epoch": 905} {"train_loss": -20.818872451782227, "global_step": 75124, "epoch": 905} {"train_loss": -20.63910484313965, "global_step": 75125, "epoch": 905} {"train_loss": -20.732553482055664, "global_step": 75126, "epoch": 905} {"train_loss": -20.87327766418457, "global_step": 75127, "epoch": 905} {"train_loss": -20.64876365661621, "global_step": 75128, "epoch": 905} {"train_loss": -20.602378845214844, "global_step": 75129, "epoch": 905} {"train_loss": -20.784521102905273, "global_step": 75130, "epoch": 905} {"train_loss": -21.001012802124023, "global_step": 75131, "epoch": 905} {"train_loss": -21.15213394165039, "global_step": 75132, "epoch": 905} {"train_loss": -21.226863861083984, "global_step": 75133, "epoch": 905} {"train_loss": -20.460269927978516, "global_step": 75134, "epoch": 905} {"train_loss": -21.01934242248535, "global_step": 75135, "epoch": 905} {"train_loss": -20.841299057006836, "global_step": 75136, "epoch": 905} {"train_loss": -20.944774627685547, "global_step": 75137, "epoch": 905} {"train_loss": -20.988605499267578, "global_step": 75138, "epoch": 905} {"train_loss": -20.758026123046875, "global_step": 75139, "epoch": 905} {"train_loss": -20.755537033081055, "global_step": 75140, "epoch": 905} {"train_loss": -20.951501846313477, "global_step": 75141, "epoch": 905} {"train_loss": -21.115070343017578, "global_step": 75142, "epoch": 905} {"train_loss": -20.7509822845459, "global_step": 75143, "epoch": 905} {"train_loss": -21.16167640686035, "global_step": 75144, "epoch": 905} {"train_loss": -21.0689754486084, "global_step": 75145, "epoch": 905} {"train_loss": -20.824954986572266, "global_step": 75146, "epoch": 905} {"train_loss": -21.06092643737793, "global_step": 75147, "epoch": 905} {"train_loss": -21.06833839416504, "global_step": 75148, "epoch": 905} {"train_loss": -21.333072662353516, "global_step": 75149, "epoch": 905} {"train_loss": -20.901294708251953, "global_step": 75150, "epoch": 905} {"train_loss": -20.909343719482422, "global_step": 75151, "epoch": 905} {"train_loss": -21.056398391723633, "global_step": 75152, "epoch": 905} {"train_loss": -21.39909553527832, "global_step": 75153, "epoch": 905} {"train_loss": -20.998062133789062, "global_step": 75154, "epoch": 905} {"train_loss": -21.33641815185547, "global_step": 75155, "epoch": 905} {"train_loss": -20.985971450805664, "global_step": 75156, "epoch": 905} {"train_loss": -20.99161720275879, "global_step": 75157, "epoch": 905} {"train_loss": -21.169767379760742, "global_step": 75158, "epoch": 905} {"train_loss": -21.169584274291992, "global_step": 75159, "epoch": 905} {"train_loss": -21.09573745727539, "global_step": 75160, "epoch": 905} {"train_loss": -20.865644454956055, "global_step": 75161, "epoch": 905} {"train_loss": -20.94536781311035, "global_step": 75162, "epoch": 905} {"train_loss": -21.037925720214844, "global_step": 75163, "epoch": 905} {"train_loss": -20.830379486083984, "global_step": 75164, "epoch": 905} {"train_loss": -20.773828506469727, "global_step": 75165, "epoch": 905} {"train_loss": -21.242755889892578, "global_step": 75166, "epoch": 905} {"train_loss": -20.5427303314209, "global_step": 75167, "epoch": 905} {"train_loss": -20.981061935424805, "global_step": 75168, "epoch": 905} {"train_loss": -20.827497482299805, "global_step": 75169, "epoch": 905} {"train_loss": -21.08619499206543, "global_step": 75170, "epoch": 905} {"train_loss": -20.6871395111084, "global_step": 75171, "epoch": 905} {"train_loss": -21.35694694519043, "global_step": 75172, "epoch": 905} {"train_loss": -21.41628074645996, "global_step": 75173, "epoch": 905} {"train_loss": -20.810224533081055, "global_step": 75174, "epoch": 905} {"train_loss": -20.894142150878906, "global_step": 75175, "epoch": 905} {"train_loss": -21.01842498779297, "global_step": 75176, "epoch": 905} {"train_loss": -21.138465881347656, "global_step": 75177, "epoch": 905} {"train_loss": -20.96113395690918, "global_step": 75178, "epoch": 905} {"train_loss": -21.376367568969727, "global_step": 75179, "epoch": 905} {"train_loss": -20.90064239501953, "global_step": 75180, "epoch": 905} {"train_loss": -21.096525192260742, "global_step": 75181, "epoch": 905} {"train_loss": -21.39643669128418, "global_step": 75182, "epoch": 905} {"train_loss": -21.0856876373291, "global_step": 75183, "epoch": 905} {"train_loss": -21.044198989868164, "global_step": 75184, "epoch": 905} {"train_loss": -20.969221115112305, "global_step": 75185, "epoch": 905} {"train_loss": -20.965171813964844, "global_step": 75186, "epoch": 905} {"train_loss": -20.851110458374023, "global_step": 75187, "epoch": 905} {"train_loss": -21.032381057739258, "global_step": 75188, "epoch": 905} {"train_loss": -20.877960205078125, "global_step": 75189, "epoch": 905} {"train_loss": -21.364267349243164, "global_step": 75190, "epoch": 905} {"train_loss": -21.586984634399414, "global_step": 75191, "epoch": 905} {"train_loss": -20.897560119628906, "global_step": 75192, "epoch": 905} {"train_loss": -21.246780395507812, "global_step": 75193, "epoch": 905} {"train_loss": -20.782882690429688, "global_step": 75194, "epoch": 905} {"train_loss": -21.099510192871094, "global_step": 75195, "epoch": 905} {"train_loss": -20.813501358032227, "global_step": 75196, "epoch": 905} {"train_loss": -20.950985644237104, "global_step": 75197, "epoch": 905, "val_loss": 5991898.0} {"train_loss": -20.641536712646484, "global_step": 75198, "epoch": 906} {"train_loss": -21.16180992126465, "global_step": 75199, "epoch": 906} {"train_loss": -20.192304611206055, "global_step": 75200, "epoch": 906} {"train_loss": -20.63526725769043, "global_step": 75201, "epoch": 906} {"train_loss": -20.910581588745117, "global_step": 75202, "epoch": 906} {"train_loss": -20.83014488220215, "global_step": 75203, "epoch": 906} {"train_loss": -20.754806518554688, "global_step": 75204, "epoch": 906} {"train_loss": -20.610727310180664, "global_step": 75205, "epoch": 906} {"train_loss": -20.725027084350586, "global_step": 75206, "epoch": 906} {"train_loss": -21.2450008392334, "global_step": 75207, "epoch": 906} {"train_loss": -20.631328582763672, "global_step": 75208, "epoch": 906} {"train_loss": -20.783926010131836, "global_step": 75209, "epoch": 906} {"train_loss": -20.679067611694336, "global_step": 75210, "epoch": 906} {"train_loss": -20.86714744567871, "global_step": 75211, "epoch": 906} {"train_loss": -20.759122848510742, "global_step": 75212, "epoch": 906} {"train_loss": -20.766990661621094, "global_step": 75213, "epoch": 906} {"train_loss": -21.152353286743164, "global_step": 75214, "epoch": 906} {"train_loss": -20.695165634155273, "global_step": 75215, "epoch": 906} {"train_loss": -21.052602767944336, "global_step": 75216, "epoch": 906} {"train_loss": -20.853269577026367, "global_step": 75217, "epoch": 906} {"train_loss": -20.578123092651367, "global_step": 75218, "epoch": 906} {"train_loss": -21.072420120239258, "global_step": 75219, "epoch": 906} {"train_loss": -20.971603393554688, "global_step": 75220, "epoch": 906} {"train_loss": -21.07293701171875, "global_step": 75221, "epoch": 906} {"train_loss": -20.81752586364746, "global_step": 75222, "epoch": 906} {"train_loss": -20.874805450439453, "global_step": 75223, "epoch": 906} {"train_loss": -20.90943717956543, "global_step": 75224, "epoch": 906} {"train_loss": -21.02109146118164, "global_step": 75225, "epoch": 906} {"train_loss": -20.809280395507812, "global_step": 75226, "epoch": 906} {"train_loss": -21.22121238708496, "global_step": 75227, "epoch": 906} {"train_loss": -21.036121368408203, "global_step": 75228, "epoch": 906} {"train_loss": -20.819835662841797, "global_step": 75229, "epoch": 906} {"train_loss": -21.082672119140625, "global_step": 75230, "epoch": 906} {"train_loss": -21.064556121826172, "global_step": 75231, "epoch": 906} {"train_loss": -21.153091430664062, "global_step": 75232, "epoch": 906} {"train_loss": -21.250051498413086, "global_step": 75233, "epoch": 906} {"train_loss": -21.028078079223633, "global_step": 75234, "epoch": 906} {"train_loss": -21.050573348999023, "global_step": 75235, "epoch": 906} {"train_loss": -21.19075584411621, "global_step": 75236, "epoch": 906} {"train_loss": -21.13434600830078, "global_step": 75237, "epoch": 906} {"train_loss": -20.967390060424805, "global_step": 75238, "epoch": 906} {"train_loss": -21.19009780883789, "global_step": 75239, "epoch": 906} {"train_loss": -20.878509521484375, "global_step": 75240, "epoch": 906} {"train_loss": -21.308687210083008, "global_step": 75241, "epoch": 906} {"train_loss": -21.16950798034668, "global_step": 75242, "epoch": 906} {"train_loss": -21.290151596069336, "global_step": 75243, "epoch": 906} {"train_loss": -20.797639846801758, "global_step": 75244, "epoch": 906} {"train_loss": -20.793203353881836, "global_step": 75245, "epoch": 906} {"train_loss": -20.858510971069336, "global_step": 75246, "epoch": 906} {"train_loss": -21.19054412841797, "global_step": 75247, "epoch": 906} {"train_loss": -21.03269386291504, "global_step": 75248, "epoch": 906} {"train_loss": -21.193204879760742, "global_step": 75249, "epoch": 906} {"train_loss": -21.227033615112305, "global_step": 75250, "epoch": 906} {"train_loss": -21.21429443359375, "global_step": 75251, "epoch": 906} {"train_loss": -21.132959365844727, "global_step": 75252, "epoch": 906} {"train_loss": -21.047199249267578, "global_step": 75253, "epoch": 906} {"train_loss": -21.019819259643555, "global_step": 75254, "epoch": 906} {"train_loss": -20.787351608276367, "global_step": 75255, "epoch": 906} {"train_loss": -21.31776237487793, "global_step": 75256, "epoch": 906} {"train_loss": -21.349775314331055, "global_step": 75257, "epoch": 906} {"train_loss": -21.07807731628418, "global_step": 75258, "epoch": 906} {"train_loss": -21.07245445251465, "global_step": 75259, "epoch": 906} {"train_loss": -21.200223922729492, "global_step": 75260, "epoch": 906} {"train_loss": -20.99358367919922, "global_step": 75261, "epoch": 906} {"train_loss": -21.11233901977539, "global_step": 75262, "epoch": 906} {"train_loss": -20.78966522216797, "global_step": 75263, "epoch": 906} {"train_loss": -21.18943214416504, "global_step": 75264, "epoch": 906} {"train_loss": -21.29414176940918, "global_step": 75265, "epoch": 906} {"train_loss": -21.13360595703125, "global_step": 75266, "epoch": 906} {"train_loss": -20.932910919189453, "global_step": 75267, "epoch": 906} {"train_loss": -21.346603393554688, "global_step": 75268, "epoch": 906} {"train_loss": -21.28885841369629, "global_step": 75269, "epoch": 906} {"train_loss": -20.88429832458496, "global_step": 75270, "epoch": 906} {"train_loss": -20.86220359802246, "global_step": 75271, "epoch": 906} {"train_loss": -21.132099151611328, "global_step": 75272, "epoch": 906} {"train_loss": -21.035593032836914, "global_step": 75273, "epoch": 906} {"train_loss": -21.096481323242188, "global_step": 75274, "epoch": 906} {"train_loss": -20.851388931274414, "global_step": 75275, "epoch": 906} {"train_loss": -21.224992752075195, "global_step": 75276, "epoch": 906} {"train_loss": -21.045265197753906, "global_step": 75277, "epoch": 906} {"train_loss": -21.53148651123047, "global_step": 75278, "epoch": 906} {"train_loss": -20.933324813842773, "global_step": 75279, "epoch": 906} {"train_loss": -21.003917671111694, "global_step": 75280, "epoch": 906, "val_loss": 6036879.0} {"train_loss": -20.86849021911621, "global_step": 75281, "epoch": 907} {"train_loss": -20.959848403930664, "global_step": 75282, "epoch": 907} {"train_loss": -20.71772575378418, "global_step": 75283, "epoch": 907} {"train_loss": -20.870386123657227, "global_step": 75284, "epoch": 907} {"train_loss": -20.718568801879883, "global_step": 75285, "epoch": 907} {"train_loss": -21.22495460510254, "global_step": 75286, "epoch": 907} {"train_loss": -20.932924270629883, "global_step": 75287, "epoch": 907} {"train_loss": -21.126108169555664, "global_step": 75288, "epoch": 907} {"train_loss": -20.903112411499023, "global_step": 75289, "epoch": 907} {"train_loss": -21.15964698791504, "global_step": 75290, "epoch": 907} {"train_loss": -20.911901473999023, "global_step": 75291, "epoch": 907} {"train_loss": -20.991992950439453, "global_step": 75292, "epoch": 907} {"train_loss": -21.060985565185547, "global_step": 75293, "epoch": 907} {"train_loss": -20.8848876953125, "global_step": 75294, "epoch": 907} {"train_loss": -20.74982452392578, "global_step": 75295, "epoch": 907} {"train_loss": -20.840606689453125, "global_step": 75296, "epoch": 907} {"train_loss": -20.969083786010742, "global_step": 75297, "epoch": 907} {"train_loss": -20.89754295349121, "global_step": 75298, "epoch": 907} {"train_loss": -21.1696834564209, "global_step": 75299, "epoch": 907} {"train_loss": -20.805274963378906, "global_step": 75300, "epoch": 907} {"train_loss": -21.150196075439453, "global_step": 75301, "epoch": 907} {"train_loss": -20.568342208862305, "global_step": 75302, "epoch": 907} {"train_loss": -20.96537208557129, "global_step": 75303, "epoch": 907} {"train_loss": -21.19034767150879, "global_step": 75304, "epoch": 907} {"train_loss": -21.06207275390625, "global_step": 75305, "epoch": 907} {"train_loss": -21.201566696166992, "global_step": 75306, "epoch": 907} {"train_loss": -21.083410263061523, "global_step": 75307, "epoch": 907} {"train_loss": -21.01578712463379, "global_step": 75308, "epoch": 907} {"train_loss": -21.17597770690918, "global_step": 75309, "epoch": 907} {"train_loss": -21.133441925048828, "global_step": 75310, "epoch": 907} {"train_loss": -20.581933975219727, "global_step": 75311, "epoch": 907} {"train_loss": -21.057355880737305, "global_step": 75312, "epoch": 907} {"train_loss": -20.814416885375977, "global_step": 75313, "epoch": 907} {"train_loss": -21.24317169189453, "global_step": 75314, "epoch": 907} {"train_loss": -20.96327781677246, "global_step": 75315, "epoch": 907} {"train_loss": -21.24530029296875, "global_step": 75316, "epoch": 907} {"train_loss": -21.150156021118164, "global_step": 75317, "epoch": 907} {"train_loss": -21.039411544799805, "global_step": 75318, "epoch": 907} {"train_loss": -21.058530807495117, "global_step": 75319, "epoch": 907} {"train_loss": -20.911670684814453, "global_step": 75320, "epoch": 907} {"train_loss": -21.102136611938477, "global_step": 75321, "epoch": 907} {"train_loss": -20.643115997314453, "global_step": 75322, "epoch": 907} {"train_loss": -20.910654067993164, "global_step": 75323, "epoch": 907} {"train_loss": -21.196992874145508, "global_step": 75324, "epoch": 907} {"train_loss": -21.114179611206055, "global_step": 75325, "epoch": 907} {"train_loss": -21.353282928466797, "global_step": 75326, "epoch": 907} {"train_loss": -20.958375930786133, "global_step": 75327, "epoch": 907} {"train_loss": -20.988590240478516, "global_step": 75328, "epoch": 907} {"train_loss": -21.184005737304688, "global_step": 75329, "epoch": 907} {"train_loss": -21.14826774597168, "global_step": 75330, "epoch": 907} {"train_loss": -21.203359603881836, "global_step": 75331, "epoch": 907} {"train_loss": -21.318483352661133, "global_step": 75332, "epoch": 907} {"train_loss": -21.208683013916016, "global_step": 75333, "epoch": 907} {"train_loss": -20.645044326782227, "global_step": 75334, "epoch": 907} {"train_loss": -21.182830810546875, "global_step": 75335, "epoch": 907} {"train_loss": -21.09923553466797, "global_step": 75336, "epoch": 907} {"train_loss": -21.23200035095215, "global_step": 75337, "epoch": 907} {"train_loss": -20.915037155151367, "global_step": 75338, "epoch": 907} {"train_loss": -21.227928161621094, "global_step": 75339, "epoch": 907} {"train_loss": -21.29513931274414, "global_step": 75340, "epoch": 907} {"train_loss": -20.920286178588867, "global_step": 75341, "epoch": 907} {"train_loss": -20.428348541259766, "global_step": 75342, "epoch": 907} {"train_loss": -20.93643569946289, "global_step": 75343, "epoch": 907} {"train_loss": -21.267152786254883, "global_step": 75344, "epoch": 907} {"train_loss": -21.132465362548828, "global_step": 75345, "epoch": 907} {"train_loss": -20.734886169433594, "global_step": 75346, "epoch": 907} {"train_loss": -20.753725051879883, "global_step": 75347, "epoch": 907} {"train_loss": -21.30870819091797, "global_step": 75348, "epoch": 907} {"train_loss": -21.00107765197754, "global_step": 75349, "epoch": 907} {"train_loss": -21.308897018432617, "global_step": 75350, "epoch": 907} {"train_loss": -21.35875701904297, "global_step": 75351, "epoch": 907} {"train_loss": -20.700246810913086, "global_step": 75352, "epoch": 907} {"train_loss": -20.94723892211914, "global_step": 75353, "epoch": 907} {"train_loss": -21.41202735900879, "global_step": 75354, "epoch": 907} {"train_loss": -21.23956298828125, "global_step": 75355, "epoch": 907} {"train_loss": -20.780710220336914, "global_step": 75356, "epoch": 907} {"train_loss": -20.871740341186523, "global_step": 75357, "epoch": 907} {"train_loss": -21.01031494140625, "global_step": 75358, "epoch": 907} {"train_loss": -21.041400909423828, "global_step": 75359, "epoch": 907} {"train_loss": -20.891515731811523, "global_step": 75360, "epoch": 907} {"train_loss": -21.059873580932617, "global_step": 75361, "epoch": 907} {"train_loss": -20.785953521728516, "global_step": 75362, "epoch": 907} {"train_loss": -21.011914770287202, "global_step": 75363, "epoch": 907, "val_loss": 5983262.5} {"train_loss": -20.065811157226562, "global_step": 75364, "epoch": 908} {"train_loss": -20.931516647338867, "global_step": 75365, "epoch": 908} {"train_loss": -20.680749893188477, "global_step": 75366, "epoch": 908} {"train_loss": -20.743101119995117, "global_step": 75367, "epoch": 908} {"train_loss": -21.045562744140625, "global_step": 75368, "epoch": 908} {"train_loss": -21.054271697998047, "global_step": 75369, "epoch": 908} {"train_loss": -20.776365280151367, "global_step": 75370, "epoch": 908} {"train_loss": -20.800186157226562, "global_step": 75371, "epoch": 908} {"train_loss": -20.789955139160156, "global_step": 75372, "epoch": 908} {"train_loss": -21.029953002929688, "global_step": 75373, "epoch": 908} {"train_loss": -20.948280334472656, "global_step": 75374, "epoch": 908} {"train_loss": -20.88419532775879, "global_step": 75375, "epoch": 908} {"train_loss": -20.992292404174805, "global_step": 75376, "epoch": 908} {"train_loss": -21.166555404663086, "global_step": 75377, "epoch": 908} {"train_loss": -20.59871482849121, "global_step": 75378, "epoch": 908} {"train_loss": -21.086139678955078, "global_step": 75379, "epoch": 908} {"train_loss": -20.896535873413086, "global_step": 75380, "epoch": 908} {"train_loss": -20.829849243164062, "global_step": 75381, "epoch": 908} {"train_loss": -20.60336685180664, "global_step": 75382, "epoch": 908} {"train_loss": -21.03752326965332, "global_step": 75383, "epoch": 908} {"train_loss": -20.829755783081055, "global_step": 75384, "epoch": 908} {"train_loss": -21.159605026245117, "global_step": 75385, "epoch": 908} {"train_loss": -21.185773849487305, "global_step": 75386, "epoch": 908} {"train_loss": -21.360355377197266, "global_step": 75387, "epoch": 908} {"train_loss": -20.787181854248047, "global_step": 75388, "epoch": 908} {"train_loss": -21.080114364624023, "global_step": 75389, "epoch": 908} {"train_loss": -21.16023826599121, "global_step": 75390, "epoch": 908} {"train_loss": -20.809391021728516, "global_step": 75391, "epoch": 908} {"train_loss": -21.095670700073242, "global_step": 75392, "epoch": 908} {"train_loss": -20.830833435058594, "global_step": 75393, "epoch": 908} {"train_loss": -20.776697158813477, "global_step": 75394, "epoch": 908} {"train_loss": -20.766010284423828, "global_step": 75395, "epoch": 908} {"train_loss": -21.126184463500977, "global_step": 75396, "epoch": 908} {"train_loss": -21.09541893005371, "global_step": 75397, "epoch": 908} {"train_loss": -20.95924949645996, "global_step": 75398, "epoch": 908} {"train_loss": -21.02257537841797, "global_step": 75399, "epoch": 908} {"train_loss": -20.93488121032715, "global_step": 75400, "epoch": 908} {"train_loss": -21.1826229095459, "global_step": 75401, "epoch": 908} {"train_loss": -21.153623580932617, "global_step": 75402, "epoch": 908} {"train_loss": -21.219635009765625, "global_step": 75403, "epoch": 908} {"train_loss": -21.30104637145996, "global_step": 75404, "epoch": 908} {"train_loss": -21.06486701965332, "global_step": 75405, "epoch": 908} {"train_loss": -21.050270080566406, "global_step": 75406, "epoch": 908} {"train_loss": -21.1713809967041, "global_step": 75407, "epoch": 908} {"train_loss": -21.22407341003418, "global_step": 75408, "epoch": 908} {"train_loss": -21.166154861450195, "global_step": 75409, "epoch": 908} {"train_loss": -21.074918746948242, "global_step": 75410, "epoch": 908} {"train_loss": -21.188230514526367, "global_step": 75411, "epoch": 908} {"train_loss": -21.032073974609375, "global_step": 75412, "epoch": 908} {"train_loss": -21.021713256835938, "global_step": 75413, "epoch": 908} {"train_loss": -21.09516716003418, "global_step": 75414, "epoch": 908} {"train_loss": -21.005001068115234, "global_step": 75415, "epoch": 908} {"train_loss": -21.13457489013672, "global_step": 75416, "epoch": 908} {"train_loss": -21.066781997680664, "global_step": 75417, "epoch": 908} {"train_loss": -21.1569766998291, "global_step": 75418, "epoch": 908} {"train_loss": -21.207632064819336, "global_step": 75419, "epoch": 908} {"train_loss": -20.991308212280273, "global_step": 75420, "epoch": 908} {"train_loss": -21.04566192626953, "global_step": 75421, "epoch": 908} {"train_loss": -21.39303207397461, "global_step": 75422, "epoch": 908} {"train_loss": -21.33888816833496, "global_step": 75423, "epoch": 908} {"train_loss": -20.790016174316406, "global_step": 75424, "epoch": 908} {"train_loss": -21.30677032470703, "global_step": 75425, "epoch": 908} {"train_loss": -21.050094604492188, "global_step": 75426, "epoch": 908} {"train_loss": -20.868183135986328, "global_step": 75427, "epoch": 908} {"train_loss": -21.15679931640625, "global_step": 75428, "epoch": 908} {"train_loss": -21.110797882080078, "global_step": 75429, "epoch": 908} {"train_loss": -20.954269409179688, "global_step": 75430, "epoch": 908} {"train_loss": -21.184057235717773, "global_step": 75431, "epoch": 908} {"train_loss": -20.9986515045166, "global_step": 75432, "epoch": 908} {"train_loss": -21.61367416381836, "global_step": 75433, "epoch": 908} {"train_loss": -21.121845245361328, "global_step": 75434, "epoch": 908} {"train_loss": -21.08717918395996, "global_step": 75435, "epoch": 908} {"train_loss": -21.004846572875977, "global_step": 75436, "epoch": 908} {"train_loss": -21.1931209564209, "global_step": 75437, "epoch": 908} {"train_loss": -21.15852928161621, "global_step": 75438, "epoch": 908} {"train_loss": -20.909526824951172, "global_step": 75439, "epoch": 908} {"train_loss": -21.10976791381836, "global_step": 75440, "epoch": 908} {"train_loss": -21.021759033203125, "global_step": 75441, "epoch": 908} {"train_loss": -20.898639678955078, "global_step": 75442, "epoch": 908} {"train_loss": -21.239320755004883, "global_step": 75443, "epoch": 908} {"train_loss": -20.965505599975586, "global_step": 75444, "epoch": 908} {"train_loss": -20.94008445739746, "global_step": 75445, "epoch": 908} {"train_loss": -21.00695366457284, "global_step": 75446, "epoch": 908, "val_loss": 5882748.5} {"train_loss": -21.03798484802246, "global_step": 75447, "epoch": 909} {"train_loss": -20.344627380371094, "global_step": 75448, "epoch": 909} {"train_loss": -20.218873977661133, "global_step": 75449, "epoch": 909} {"train_loss": -20.17337417602539, "global_step": 75450, "epoch": 909} {"train_loss": -20.90083122253418, "global_step": 75451, "epoch": 909} {"train_loss": -20.326772689819336, "global_step": 75452, "epoch": 909} {"train_loss": -20.765546798706055, "global_step": 75453, "epoch": 909} {"train_loss": -20.61948585510254, "global_step": 75454, "epoch": 909} {"train_loss": -21.145408630371094, "global_step": 75455, "epoch": 909} {"train_loss": -21.25646209716797, "global_step": 75456, "epoch": 909} {"train_loss": -20.54313087463379, "global_step": 75457, "epoch": 909} {"train_loss": -20.97818946838379, "global_step": 75458, "epoch": 909} {"train_loss": -20.920364379882812, "global_step": 75459, "epoch": 909} {"train_loss": -21.05535316467285, "global_step": 75460, "epoch": 909} {"train_loss": -21.17915916442871, "global_step": 75461, "epoch": 909} {"train_loss": -21.018274307250977, "global_step": 75462, "epoch": 909} {"train_loss": -21.064252853393555, "global_step": 75463, "epoch": 909} {"train_loss": -21.008481979370117, "global_step": 75464, "epoch": 909} {"train_loss": -21.010339736938477, "global_step": 75465, "epoch": 909} {"train_loss": -20.786405563354492, "global_step": 75466, "epoch": 909} {"train_loss": -21.22260856628418, "global_step": 75467, "epoch": 909} {"train_loss": -20.8049259185791, "global_step": 75468, "epoch": 909} {"train_loss": -20.870397567749023, "global_step": 75469, "epoch": 909} {"train_loss": -21.002634048461914, "global_step": 75470, "epoch": 909} {"train_loss": -21.13697624206543, "global_step": 75471, "epoch": 909} {"train_loss": -21.42926025390625, "global_step": 75472, "epoch": 909} {"train_loss": -21.086284637451172, "global_step": 75473, "epoch": 909} {"train_loss": -21.01258659362793, "global_step": 75474, "epoch": 909} {"train_loss": -20.93692970275879, "global_step": 75475, "epoch": 909} {"train_loss": -21.260295867919922, "global_step": 75476, "epoch": 909} {"train_loss": -20.874303817749023, "global_step": 75477, "epoch": 909} {"train_loss": -21.141225814819336, "global_step": 75478, "epoch": 909} {"train_loss": -20.949161529541016, "global_step": 75479, "epoch": 909} {"train_loss": -21.00738525390625, "global_step": 75480, "epoch": 909} {"train_loss": -21.13431739807129, "global_step": 75481, "epoch": 909} {"train_loss": -20.993101119995117, "global_step": 75482, "epoch": 909} {"train_loss": -21.00516128540039, "global_step": 75483, "epoch": 909} {"train_loss": -21.14910888671875, "global_step": 75484, "epoch": 909} {"train_loss": -20.69620132446289, "global_step": 75485, "epoch": 909} {"train_loss": -21.355131149291992, "global_step": 75486, "epoch": 909} {"train_loss": -21.444704055786133, "global_step": 75487, "epoch": 909} {"train_loss": -21.240285873413086, "global_step": 75488, "epoch": 909} {"train_loss": -21.077478408813477, "global_step": 75489, "epoch": 909} {"train_loss": -20.844314575195312, "global_step": 75490, "epoch": 909} {"train_loss": -21.31020164489746, "global_step": 75491, "epoch": 909} {"train_loss": -21.082345962524414, "global_step": 75492, "epoch": 909} {"train_loss": -20.982900619506836, "global_step": 75493, "epoch": 909} {"train_loss": -21.043603897094727, "global_step": 75494, "epoch": 909} {"train_loss": -21.11150360107422, "global_step": 75495, "epoch": 909} {"train_loss": -20.80445671081543, "global_step": 75496, "epoch": 909} {"train_loss": -21.283117294311523, "global_step": 75497, "epoch": 909} {"train_loss": -21.13216209411621, "global_step": 75498, "epoch": 909} {"train_loss": -21.0645809173584, "global_step": 75499, "epoch": 909} {"train_loss": -20.887409210205078, "global_step": 75500, "epoch": 909} {"train_loss": -20.82892417907715, "global_step": 75501, "epoch": 909} {"train_loss": -20.871597290039062, "global_step": 75502, "epoch": 909} {"train_loss": -21.36647605895996, "global_step": 75503, "epoch": 909} {"train_loss": -20.95025634765625, "global_step": 75504, "epoch": 909} {"train_loss": -20.851593017578125, "global_step": 75505, "epoch": 909} {"train_loss": -21.36916732788086, "global_step": 75506, "epoch": 909} {"train_loss": -21.360071182250977, "global_step": 75507, "epoch": 909} {"train_loss": -20.914386749267578, "global_step": 75508, "epoch": 909} {"train_loss": -21.27448081970215, "global_step": 75509, "epoch": 909} {"train_loss": -20.81659507751465, "global_step": 75510, "epoch": 909} {"train_loss": -20.96108055114746, "global_step": 75511, "epoch": 909} {"train_loss": -20.900609970092773, "global_step": 75512, "epoch": 909} {"train_loss": -21.009384155273438, "global_step": 75513, "epoch": 909} {"train_loss": -20.81893539428711, "global_step": 75514, "epoch": 909} {"train_loss": -21.490421295166016, "global_step": 75515, "epoch": 909} {"train_loss": -20.78364372253418, "global_step": 75516, "epoch": 909} {"train_loss": -21.02023696899414, "global_step": 75517, "epoch": 909} {"train_loss": -21.12514305114746, "global_step": 75518, "epoch": 909} {"train_loss": -21.268789291381836, "global_step": 75519, "epoch": 909} {"train_loss": -20.983869552612305, "global_step": 75520, "epoch": 909} {"train_loss": -20.989492416381836, "global_step": 75521, "epoch": 909} {"train_loss": -20.881967544555664, "global_step": 75522, "epoch": 909} {"train_loss": -21.219350814819336, "global_step": 75523, "epoch": 909} {"train_loss": -21.064340591430664, "global_step": 75524, "epoch": 909} {"train_loss": -20.906347274780273, "global_step": 75525, "epoch": 909} {"train_loss": -21.23945426940918, "global_step": 75526, "epoch": 909} {"train_loss": -20.808189392089844, "global_step": 75527, "epoch": 909} {"train_loss": -21.10016632080078, "global_step": 75528, "epoch": 909} {"train_loss": -20.992124534515014, "global_step": 75529, "epoch": 909, "val_loss": 5891125.0} {"train_loss": -20.253259658813477, "global_step": 75530, "epoch": 910} {"train_loss": -21.00935935974121, "global_step": 75531, "epoch": 910} {"train_loss": -20.122390747070312, "global_step": 75532, "epoch": 910} {"train_loss": -20.703243255615234, "global_step": 75533, "epoch": 910} {"train_loss": -20.583486557006836, "global_step": 75534, "epoch": 910} {"train_loss": -20.764867782592773, "global_step": 75535, "epoch": 910} {"train_loss": -20.67067527770996, "global_step": 75536, "epoch": 910} {"train_loss": -20.84742546081543, "global_step": 75537, "epoch": 910} {"train_loss": -21.029003143310547, "global_step": 75538, "epoch": 910} {"train_loss": -20.351308822631836, "global_step": 75539, "epoch": 910} {"train_loss": -20.571191787719727, "global_step": 75540, "epoch": 910} {"train_loss": -20.89800453186035, "global_step": 75541, "epoch": 910} {"train_loss": -20.65595054626465, "global_step": 75542, "epoch": 910} {"train_loss": -20.918848037719727, "global_step": 75543, "epoch": 910} {"train_loss": -20.975187301635742, "global_step": 75544, "epoch": 910} {"train_loss": -20.930883407592773, "global_step": 75545, "epoch": 910} {"train_loss": -20.947036743164062, "global_step": 75546, "epoch": 910} {"train_loss": -21.405384063720703, "global_step": 75547, "epoch": 910} {"train_loss": -20.748647689819336, "global_step": 75548, "epoch": 910} {"train_loss": -20.891197204589844, "global_step": 75549, "epoch": 910} {"train_loss": -21.007749557495117, "global_step": 75550, "epoch": 910} {"train_loss": -20.875822067260742, "global_step": 75551, "epoch": 910} {"train_loss": -20.738019943237305, "global_step": 75552, "epoch": 910} {"train_loss": -20.638505935668945, "global_step": 75553, "epoch": 910} {"train_loss": -21.04842185974121, "global_step": 75554, "epoch": 910} {"train_loss": -21.349271774291992, "global_step": 75555, "epoch": 910} {"train_loss": -21.201513290405273, "global_step": 75556, "epoch": 910} {"train_loss": -20.66777992248535, "global_step": 75557, "epoch": 910} {"train_loss": -21.21493911743164, "global_step": 75558, "epoch": 910} {"train_loss": -21.100061416625977, "global_step": 75559, "epoch": 910} {"train_loss": -21.023155212402344, "global_step": 75560, "epoch": 910} {"train_loss": -21.039113998413086, "global_step": 75561, "epoch": 910} {"train_loss": -20.834083557128906, "global_step": 75562, "epoch": 910} {"train_loss": -21.124826431274414, "global_step": 75563, "epoch": 910} {"train_loss": -20.764333724975586, "global_step": 75564, "epoch": 910} {"train_loss": -20.873891830444336, "global_step": 75565, "epoch": 910} {"train_loss": -21.1478271484375, "global_step": 75566, "epoch": 910} {"train_loss": -20.997655868530273, "global_step": 75567, "epoch": 910} {"train_loss": -21.008115768432617, "global_step": 75568, "epoch": 910} {"train_loss": -21.051610946655273, "global_step": 75569, "epoch": 910} {"train_loss": -21.302562713623047, "global_step": 75570, "epoch": 910} {"train_loss": -20.85084342956543, "global_step": 75571, "epoch": 910} {"train_loss": -21.19258689880371, "global_step": 75572, "epoch": 910} {"train_loss": -20.837982177734375, "global_step": 75573, "epoch": 910} {"train_loss": -21.05587387084961, "global_step": 75574, "epoch": 910} {"train_loss": -21.18381690979004, "global_step": 75575, "epoch": 910} {"train_loss": -20.767642974853516, "global_step": 75576, "epoch": 910} {"train_loss": -21.42729949951172, "global_step": 75577, "epoch": 910} {"train_loss": -20.95594596862793, "global_step": 75578, "epoch": 910} {"train_loss": -21.16914176940918, "global_step": 75579, "epoch": 910} {"train_loss": -20.86488151550293, "global_step": 75580, "epoch": 910} {"train_loss": -20.693565368652344, "global_step": 75581, "epoch": 910} {"train_loss": -21.368871688842773, "global_step": 75582, "epoch": 910} {"train_loss": -21.520395278930664, "global_step": 75583, "epoch": 910} {"train_loss": -21.160537719726562, "global_step": 75584, "epoch": 910} {"train_loss": -21.10147476196289, "global_step": 75585, "epoch": 910} {"train_loss": -21.163923263549805, "global_step": 75586, "epoch": 910} {"train_loss": -20.802154541015625, "global_step": 75587, "epoch": 910} {"train_loss": -21.066694259643555, "global_step": 75588, "epoch": 910} {"train_loss": -21.08539390563965, "global_step": 75589, "epoch": 910} {"train_loss": -20.93975830078125, "global_step": 75590, "epoch": 910} {"train_loss": -21.01105308532715, "global_step": 75591, "epoch": 910} {"train_loss": -21.08278465270996, "global_step": 75592, "epoch": 910} {"train_loss": -21.182897567749023, "global_step": 75593, "epoch": 910} {"train_loss": -21.009302139282227, "global_step": 75594, "epoch": 910} {"train_loss": -20.745901107788086, "global_step": 75595, "epoch": 910} {"train_loss": -20.90266990661621, "global_step": 75596, "epoch": 910} {"train_loss": -21.18440818786621, "global_step": 75597, "epoch": 910} {"train_loss": -21.065631866455078, "global_step": 75598, "epoch": 910} {"train_loss": -20.954181671142578, "global_step": 75599, "epoch": 910} {"train_loss": -21.035154342651367, "global_step": 75600, "epoch": 910} {"train_loss": -21.018009185791016, "global_step": 75601, "epoch": 910} {"train_loss": -21.000843048095703, "global_step": 75602, "epoch": 910} {"train_loss": -20.899507522583008, "global_step": 75603, "epoch": 910} {"train_loss": -20.79436683654785, "global_step": 75604, "epoch": 910} {"train_loss": -21.053621292114258, "global_step": 75605, "epoch": 910} {"train_loss": -21.46260643005371, "global_step": 75606, "epoch": 910} {"train_loss": -21.18324851989746, "global_step": 75607, "epoch": 910} {"train_loss": -21.086483001708984, "global_step": 75608, "epoch": 910} {"train_loss": -21.211576461791992, "global_step": 75609, "epoch": 910} {"train_loss": -20.852140426635742, "global_step": 75610, "epoch": 910} {"train_loss": -21.284658432006836, "global_step": 75611, "epoch": 910} {"train_loss": -20.953443320400744, "global_step": 75612, "epoch": 910, "val_loss": 6014639.0} {"train_loss": -20.958982467651367, "global_step": 75613, "epoch": 911} {"train_loss": -20.413084030151367, "global_step": 75614, "epoch": 911} {"train_loss": -20.530527114868164, "global_step": 75615, "epoch": 911} {"train_loss": -21.067153930664062, "global_step": 75616, "epoch": 911} {"train_loss": -20.56143569946289, "global_step": 75617, "epoch": 911} {"train_loss": -20.487550735473633, "global_step": 75618, "epoch": 911} {"train_loss": -20.633869171142578, "global_step": 75619, "epoch": 911} {"train_loss": -20.974328994750977, "global_step": 75620, "epoch": 911} {"train_loss": -20.734716415405273, "global_step": 75621, "epoch": 911} {"train_loss": -21.017141342163086, "global_step": 75622, "epoch": 911} {"train_loss": -20.695941925048828, "global_step": 75623, "epoch": 911} {"train_loss": -20.908445358276367, "global_step": 75624, "epoch": 911} {"train_loss": -20.78194236755371, "global_step": 75625, "epoch": 911} {"train_loss": -20.60841941833496, "global_step": 75626, "epoch": 911} {"train_loss": -20.581050872802734, "global_step": 75627, "epoch": 911} {"train_loss": -20.69232177734375, "global_step": 75628, "epoch": 911} {"train_loss": -20.732059478759766, "global_step": 75629, "epoch": 911} {"train_loss": -21.130842208862305, "global_step": 75630, "epoch": 911} {"train_loss": -21.003467559814453, "global_step": 75631, "epoch": 911} {"train_loss": -21.272937774658203, "global_step": 75632, "epoch": 911} {"train_loss": -20.559680938720703, "global_step": 75633, "epoch": 911} {"train_loss": -20.97867202758789, "global_step": 75634, "epoch": 911} {"train_loss": -21.068506240844727, "global_step": 75635, "epoch": 911} {"train_loss": -20.843114852905273, "global_step": 75636, "epoch": 911} {"train_loss": -20.731428146362305, "global_step": 75637, "epoch": 911} {"train_loss": -20.763700485229492, "global_step": 75638, "epoch": 911} {"train_loss": -20.71029281616211, "global_step": 75639, "epoch": 911} {"train_loss": -21.071203231811523, "global_step": 75640, "epoch": 911} {"train_loss": -20.782987594604492, "global_step": 75641, "epoch": 911} {"train_loss": -20.581762313842773, "global_step": 75642, "epoch": 911} {"train_loss": -21.2352294921875, "global_step": 75643, "epoch": 911} {"train_loss": -20.91000747680664, "global_step": 75644, "epoch": 911} {"train_loss": -21.250652313232422, "global_step": 75645, "epoch": 911} {"train_loss": -21.19968605041504, "global_step": 75646, "epoch": 911} {"train_loss": -21.44881820678711, "global_step": 75647, "epoch": 911} {"train_loss": -21.075305938720703, "global_step": 75648, "epoch": 911} {"train_loss": -21.001876831054688, "global_step": 75649, "epoch": 911} {"train_loss": -21.0681209564209, "global_step": 75650, "epoch": 911} {"train_loss": -21.14314842224121, "global_step": 75651, "epoch": 911} {"train_loss": -21.051557540893555, "global_step": 75652, "epoch": 911} {"train_loss": -21.240577697753906, "global_step": 75653, "epoch": 911} {"train_loss": -21.033071517944336, "global_step": 75654, "epoch": 911} {"train_loss": -21.13527488708496, "global_step": 75655, "epoch": 911} {"train_loss": -21.000423431396484, "global_step": 75656, "epoch": 911} {"train_loss": -21.625457763671875, "global_step": 75657, "epoch": 911} {"train_loss": -21.12068748474121, "global_step": 75658, "epoch": 911} {"train_loss": -21.521942138671875, "global_step": 75659, "epoch": 911} {"train_loss": -21.496601104736328, "global_step": 75660, "epoch": 911} {"train_loss": -21.101118087768555, "global_step": 75661, "epoch": 911} {"train_loss": -21.34335708618164, "global_step": 75662, "epoch": 911} {"train_loss": -20.87137794494629, "global_step": 75663, "epoch": 911} {"train_loss": -20.86551284790039, "global_step": 75664, "epoch": 911} {"train_loss": -21.01311683654785, "global_step": 75665, "epoch": 911} {"train_loss": -21.09882926940918, "global_step": 75666, "epoch": 911} {"train_loss": -21.468063354492188, "global_step": 75667, "epoch": 911} {"train_loss": -21.19395637512207, "global_step": 75668, "epoch": 911} {"train_loss": -20.8804988861084, "global_step": 75669, "epoch": 911} {"train_loss": -21.349393844604492, "global_step": 75670, "epoch": 911} {"train_loss": -20.98195457458496, "global_step": 75671, "epoch": 911} {"train_loss": -21.163461685180664, "global_step": 75672, "epoch": 911} {"train_loss": -21.065004348754883, "global_step": 75673, "epoch": 911} {"train_loss": -21.36128807067871, "global_step": 75674, "epoch": 911} {"train_loss": -20.887968063354492, "global_step": 75675, "epoch": 911} {"train_loss": -21.260700225830078, "global_step": 75676, "epoch": 911} {"train_loss": -21.08547019958496, "global_step": 75677, "epoch": 911} {"train_loss": -20.70305824279785, "global_step": 75678, "epoch": 911} {"train_loss": -21.09803581237793, "global_step": 75679, "epoch": 911} {"train_loss": -21.4697208404541, "global_step": 75680, "epoch": 911} {"train_loss": -20.643558502197266, "global_step": 75681, "epoch": 911} {"train_loss": -20.897354125976562, "global_step": 75682, "epoch": 911} {"train_loss": -20.839632034301758, "global_step": 75683, "epoch": 911} {"train_loss": -21.262195587158203, "global_step": 75684, "epoch": 911} {"train_loss": -21.135406494140625, "global_step": 75685, "epoch": 911} {"train_loss": -20.954999923706055, "global_step": 75686, "epoch": 911} {"train_loss": -21.029436111450195, "global_step": 75687, "epoch": 911} {"train_loss": -21.197620391845703, "global_step": 75688, "epoch": 911} {"train_loss": -20.960281372070312, "global_step": 75689, "epoch": 911} {"train_loss": -20.804609298706055, "global_step": 75690, "epoch": 911} {"train_loss": -21.38042449951172, "global_step": 75691, "epoch": 911} {"train_loss": -21.2183780670166, "global_step": 75692, "epoch": 911} {"train_loss": -21.064733505249023, "global_step": 75693, "epoch": 911} {"train_loss": -21.19576644897461, "global_step": 75694, "epoch": 911} {"train_loss": -20.988401734685322, "global_step": 75695, "epoch": 911, "val_loss": 5975291.0} {"train_loss": -20.576662063598633, "global_step": 75696, "epoch": 912} {"train_loss": -20.783044815063477, "global_step": 75697, "epoch": 912} {"train_loss": -20.411643981933594, "global_step": 75698, "epoch": 912} {"train_loss": -21.121896743774414, "global_step": 75699, "epoch": 912} {"train_loss": -20.90476417541504, "global_step": 75700, "epoch": 912} {"train_loss": -20.971904754638672, "global_step": 75701, "epoch": 912} {"train_loss": -20.7808895111084, "global_step": 75702, "epoch": 912} {"train_loss": -20.831737518310547, "global_step": 75703, "epoch": 912} {"train_loss": -20.765745162963867, "global_step": 75704, "epoch": 912} {"train_loss": -20.408992767333984, "global_step": 75705, "epoch": 912} {"train_loss": -20.79237937927246, "global_step": 75706, "epoch": 912} {"train_loss": -20.425533294677734, "global_step": 75707, "epoch": 912} {"train_loss": -21.02386474609375, "global_step": 75708, "epoch": 912} {"train_loss": -21.171756744384766, "global_step": 75709, "epoch": 912} {"train_loss": -21.222179412841797, "global_step": 75710, "epoch": 912} {"train_loss": -20.961334228515625, "global_step": 75711, "epoch": 912} {"train_loss": -20.680072784423828, "global_step": 75712, "epoch": 912} {"train_loss": -21.071691513061523, "global_step": 75713, "epoch": 912} {"train_loss": -20.750852584838867, "global_step": 75714, "epoch": 912} {"train_loss": -20.985523223876953, "global_step": 75715, "epoch": 912} {"train_loss": -21.256668090820312, "global_step": 75716, "epoch": 912} {"train_loss": -21.062501907348633, "global_step": 75717, "epoch": 912} {"train_loss": -21.30439567565918, "global_step": 75718, "epoch": 912} {"train_loss": -20.865615844726562, "global_step": 75719, "epoch": 912} {"train_loss": -21.22125816345215, "global_step": 75720, "epoch": 912} {"train_loss": -21.127887725830078, "global_step": 75721, "epoch": 912} {"train_loss": -20.921110153198242, "global_step": 75722, "epoch": 912} {"train_loss": -20.96058464050293, "global_step": 75723, "epoch": 912} {"train_loss": -20.815366744995117, "global_step": 75724, "epoch": 912} {"train_loss": -21.130674362182617, "global_step": 75725, "epoch": 912} {"train_loss": -21.109914779663086, "global_step": 75726, "epoch": 912} {"train_loss": -21.154869079589844, "global_step": 75727, "epoch": 912} {"train_loss": -20.99357795715332, "global_step": 75728, "epoch": 912} {"train_loss": -20.799673080444336, "global_step": 75729, "epoch": 912} {"train_loss": -21.542217254638672, "global_step": 75730, "epoch": 912} {"train_loss": -21.412992477416992, "global_step": 75731, "epoch": 912} {"train_loss": -21.100370407104492, "global_step": 75732, "epoch": 912} {"train_loss": -20.87531852722168, "global_step": 75733, "epoch": 912} {"train_loss": -21.254013061523438, "global_step": 75734, "epoch": 912} {"train_loss": -20.80525779724121, "global_step": 75735, "epoch": 912} {"train_loss": -21.12882423400879, "global_step": 75736, "epoch": 912} {"train_loss": -21.210453033447266, "global_step": 75737, "epoch": 912} {"train_loss": -20.638498306274414, "global_step": 75738, "epoch": 912} {"train_loss": -21.128677368164062, "global_step": 75739, "epoch": 912} {"train_loss": -20.897836685180664, "global_step": 75740, "epoch": 912} {"train_loss": -20.849109649658203, "global_step": 75741, "epoch": 912} {"train_loss": -20.891006469726562, "global_step": 75742, "epoch": 912} {"train_loss": -20.83241081237793, "global_step": 75743, "epoch": 912} {"train_loss": -21.222379684448242, "global_step": 75744, "epoch": 912} {"train_loss": -20.6402645111084, "global_step": 75745, "epoch": 912} {"train_loss": -21.263105392456055, "global_step": 75746, "epoch": 912} {"train_loss": -20.830093383789062, "global_step": 75747, "epoch": 912} {"train_loss": -21.080310821533203, "global_step": 75748, "epoch": 912} {"train_loss": -20.902219772338867, "global_step": 75749, "epoch": 912} {"train_loss": -21.480432510375977, "global_step": 75750, "epoch": 912} {"train_loss": -21.09303092956543, "global_step": 75751, "epoch": 912} {"train_loss": -21.078948974609375, "global_step": 75752, "epoch": 912} {"train_loss": -21.18603515625, "global_step": 75753, "epoch": 912} {"train_loss": -21.17051887512207, "global_step": 75754, "epoch": 912} {"train_loss": -21.052982330322266, "global_step": 75755, "epoch": 912} {"train_loss": -21.06980323791504, "global_step": 75756, "epoch": 912} {"train_loss": -20.990503311157227, "global_step": 75757, "epoch": 912} {"train_loss": -20.925687789916992, "global_step": 75758, "epoch": 912} {"train_loss": -20.815214157104492, "global_step": 75759, "epoch": 912} {"train_loss": -21.160913467407227, "global_step": 75760, "epoch": 912} {"train_loss": -21.16441535949707, "global_step": 75761, "epoch": 912} {"train_loss": -20.950302124023438, "global_step": 75762, "epoch": 912} {"train_loss": -21.550668716430664, "global_step": 75763, "epoch": 912} {"train_loss": -20.968814849853516, "global_step": 75764, "epoch": 912} {"train_loss": -21.207151412963867, "global_step": 75765, "epoch": 912} {"train_loss": -20.899490356445312, "global_step": 75766, "epoch": 912} {"train_loss": -20.954187393188477, "global_step": 75767, "epoch": 912} {"train_loss": -20.650474548339844, "global_step": 75768, "epoch": 912} {"train_loss": -20.869144439697266, "global_step": 75769, "epoch": 912} {"train_loss": -21.02914810180664, "global_step": 75770, "epoch": 912} {"train_loss": -20.44654655456543, "global_step": 75771, "epoch": 912} {"train_loss": -20.598556518554688, "global_step": 75772, "epoch": 912} {"train_loss": -21.00923728942871, "global_step": 75773, "epoch": 912} {"train_loss": -21.25422477722168, "global_step": 75774, "epoch": 912} {"train_loss": -20.615657806396484, "global_step": 75775, "epoch": 912} {"train_loss": -20.826730728149414, "global_step": 75776, "epoch": 912} {"train_loss": -20.575824737548828, "global_step": 75777, "epoch": 912} {"train_loss": -20.973437366715398, "global_step": 75778, "epoch": 912, "val_loss": 5989555.5} {"train_loss": -20.97507095336914, "global_step": 75779, "epoch": 913} {"train_loss": -20.75606346130371, "global_step": 75780, "epoch": 913} {"train_loss": -20.943933486938477, "global_step": 75781, "epoch": 913} {"train_loss": -21.230148315429688, "global_step": 75782, "epoch": 913} {"train_loss": -21.138364791870117, "global_step": 75783, "epoch": 913} {"train_loss": -20.787586212158203, "global_step": 75784, "epoch": 913} {"train_loss": -21.17392349243164, "global_step": 75785, "epoch": 913} {"train_loss": -20.690282821655273, "global_step": 75786, "epoch": 913} {"train_loss": -20.97185516357422, "global_step": 75787, "epoch": 913} {"train_loss": -21.223438262939453, "global_step": 75788, "epoch": 913} {"train_loss": -21.16157341003418, "global_step": 75789, "epoch": 913} {"train_loss": -20.861248016357422, "global_step": 75790, "epoch": 913} {"train_loss": -20.78828239440918, "global_step": 75791, "epoch": 913} {"train_loss": -21.0161190032959, "global_step": 75792, "epoch": 913} {"train_loss": -21.348129272460938, "global_step": 75793, "epoch": 913} {"train_loss": -21.196216583251953, "global_step": 75794, "epoch": 913} {"train_loss": -21.54366111755371, "global_step": 75795, "epoch": 913} {"train_loss": -20.920330047607422, "global_step": 75796, "epoch": 913} {"train_loss": -21.387670516967773, "global_step": 75797, "epoch": 913} {"train_loss": -21.181503295898438, "global_step": 75798, "epoch": 913} {"train_loss": -21.38507080078125, "global_step": 75799, "epoch": 913} {"train_loss": -21.37424087524414, "global_step": 75800, "epoch": 913} {"train_loss": -21.32326316833496, "global_step": 75801, "epoch": 913} {"train_loss": -21.138708114624023, "global_step": 75802, "epoch": 913} {"train_loss": -21.118497848510742, "global_step": 75803, "epoch": 913} {"train_loss": -21.051782608032227, "global_step": 75804, "epoch": 913} {"train_loss": -21.072269439697266, "global_step": 75805, "epoch": 913} {"train_loss": -21.14893913269043, "global_step": 75806, "epoch": 913} {"train_loss": -20.977354049682617, "global_step": 75807, "epoch": 913} {"train_loss": -21.23723602294922, "global_step": 75808, "epoch": 913} {"train_loss": -21.23531723022461, "global_step": 75809, "epoch": 913} {"train_loss": -21.266881942749023, "global_step": 75810, "epoch": 913} {"train_loss": -21.077777862548828, "global_step": 75811, "epoch": 913} {"train_loss": -21.04401206970215, "global_step": 75812, "epoch": 913} {"train_loss": -21.0304012298584, "global_step": 75813, "epoch": 913} {"train_loss": -21.365558624267578, "global_step": 75814, "epoch": 913} {"train_loss": -21.28696632385254, "global_step": 75815, "epoch": 913} {"train_loss": -20.843151092529297, "global_step": 75816, "epoch": 913} {"train_loss": -20.7360897064209, "global_step": 75817, "epoch": 913} {"train_loss": -20.976022720336914, "global_step": 75818, "epoch": 913} {"train_loss": -20.813817977905273, "global_step": 75819, "epoch": 913} {"train_loss": -21.070905685424805, "global_step": 75820, "epoch": 913} {"train_loss": -20.906917572021484, "global_step": 75821, "epoch": 913} {"train_loss": -21.253870010375977, "global_step": 75822, "epoch": 913} {"train_loss": -21.078161239624023, "global_step": 75823, "epoch": 913} {"train_loss": -21.131187438964844, "global_step": 75824, "epoch": 913} {"train_loss": -20.977331161499023, "global_step": 75825, "epoch": 913} {"train_loss": -20.9345760345459, "global_step": 75826, "epoch": 913} {"train_loss": -20.800567626953125, "global_step": 75827, "epoch": 913} {"train_loss": -21.075439453125, "global_step": 75828, "epoch": 913} {"train_loss": -21.33003044128418, "global_step": 75829, "epoch": 913} {"train_loss": -20.780832290649414, "global_step": 75830, "epoch": 913} {"train_loss": -20.89889907836914, "global_step": 75831, "epoch": 913} {"train_loss": -20.68082618713379, "global_step": 75832, "epoch": 913} {"train_loss": -21.11297035217285, "global_step": 75833, "epoch": 913} {"train_loss": -20.72942352294922, "global_step": 75834, "epoch": 913} {"train_loss": -20.969850540161133, "global_step": 75835, "epoch": 913} {"train_loss": -21.179101943969727, "global_step": 75836, "epoch": 913} {"train_loss": -21.10263442993164, "global_step": 75837, "epoch": 913} {"train_loss": -20.864501953125, "global_step": 75838, "epoch": 913} {"train_loss": -20.664255142211914, "global_step": 75839, "epoch": 913} {"train_loss": -21.258956909179688, "global_step": 75840, "epoch": 913} {"train_loss": -21.15420913696289, "global_step": 75841, "epoch": 913} {"train_loss": -20.78032875061035, "global_step": 75842, "epoch": 913} {"train_loss": -20.967145919799805, "global_step": 75843, "epoch": 913} {"train_loss": -21.175199508666992, "global_step": 75844, "epoch": 913} {"train_loss": -21.01749610900879, "global_step": 75845, "epoch": 913} {"train_loss": -21.265819549560547, "global_step": 75846, "epoch": 913} {"train_loss": -20.950103759765625, "global_step": 75847, "epoch": 913} {"train_loss": -20.652612686157227, "global_step": 75848, "epoch": 913} {"train_loss": -20.99485206604004, "global_step": 75849, "epoch": 913} {"train_loss": -20.70061683654785, "global_step": 75850, "epoch": 913} {"train_loss": -21.415451049804688, "global_step": 75851, "epoch": 913} {"train_loss": -21.164047241210938, "global_step": 75852, "epoch": 913} {"train_loss": -21.436538696289062, "global_step": 75853, "epoch": 913} {"train_loss": -20.99810791015625, "global_step": 75854, "epoch": 913} {"train_loss": -20.886985778808594, "global_step": 75855, "epoch": 913} {"train_loss": -21.063634872436523, "global_step": 75856, "epoch": 913} {"train_loss": -21.029783248901367, "global_step": 75857, "epoch": 913} {"train_loss": -20.786046981811523, "global_step": 75858, "epoch": 913} {"train_loss": -20.66719627380371, "global_step": 75859, "epoch": 913} {"train_loss": -20.829811096191406, "global_step": 75860, "epoch": 913} {"train_loss": -21.047548983470502, "global_step": 75861, "epoch": 913, "val_loss": 5984549.0} {"train_loss": -20.701066970825195, "global_step": 75862, "epoch": 914} {"train_loss": -21.032005310058594, "global_step": 75863, "epoch": 914} {"train_loss": -20.772178649902344, "global_step": 75864, "epoch": 914} {"train_loss": -20.7547550201416, "global_step": 75865, "epoch": 914} {"train_loss": -20.573654174804688, "global_step": 75866, "epoch": 914} {"train_loss": -20.684720993041992, "global_step": 75867, "epoch": 914} {"train_loss": -21.059457778930664, "global_step": 75868, "epoch": 914} {"train_loss": -20.823949813842773, "global_step": 75869, "epoch": 914} {"train_loss": -21.356367111206055, "global_step": 75870, "epoch": 914} {"train_loss": -20.83908462524414, "global_step": 75871, "epoch": 914} {"train_loss": -21.229883193969727, "global_step": 75872, "epoch": 914} {"train_loss": -20.43264389038086, "global_step": 75873, "epoch": 914} {"train_loss": -20.801965713500977, "global_step": 75874, "epoch": 914} {"train_loss": -21.148662567138672, "global_step": 75875, "epoch": 914} {"train_loss": -20.761436462402344, "global_step": 75876, "epoch": 914} {"train_loss": -20.898265838623047, "global_step": 75877, "epoch": 914} {"train_loss": -20.891935348510742, "global_step": 75878, "epoch": 914} {"train_loss": -20.836511611938477, "global_step": 75879, "epoch": 914} {"train_loss": -20.89081382751465, "global_step": 75880, "epoch": 914} {"train_loss": -20.791107177734375, "global_step": 75881, "epoch": 914} {"train_loss": -21.189334869384766, "global_step": 75882, "epoch": 914} {"train_loss": -21.031330108642578, "global_step": 75883, "epoch": 914} {"train_loss": -20.97066879272461, "global_step": 75884, "epoch": 914} {"train_loss": -21.433101654052734, "global_step": 75885, "epoch": 914} {"train_loss": -21.165369033813477, "global_step": 75886, "epoch": 914} {"train_loss": -20.913419723510742, "global_step": 75887, "epoch": 914} {"train_loss": -21.416610717773438, "global_step": 75888, "epoch": 914} {"train_loss": -20.82278823852539, "global_step": 75889, "epoch": 914} {"train_loss": -20.85533332824707, "global_step": 75890, "epoch": 914} {"train_loss": -21.26323890686035, "global_step": 75891, "epoch": 914} {"train_loss": -20.882444381713867, "global_step": 75892, "epoch": 914} {"train_loss": -21.420827865600586, "global_step": 75893, "epoch": 914} {"train_loss": -20.681745529174805, "global_step": 75894, "epoch": 914} {"train_loss": -21.480030059814453, "global_step": 75895, "epoch": 914} {"train_loss": -21.0045108795166, "global_step": 75896, "epoch": 914} {"train_loss": -21.105907440185547, "global_step": 75897, "epoch": 914} {"train_loss": -21.16817283630371, "global_step": 75898, "epoch": 914} {"train_loss": -21.11342430114746, "global_step": 75899, "epoch": 914} {"train_loss": -21.082307815551758, "global_step": 75900, "epoch": 914} {"train_loss": -21.028661727905273, "global_step": 75901, "epoch": 914} {"train_loss": -21.224611282348633, "global_step": 75902, "epoch": 914} {"train_loss": -21.324811935424805, "global_step": 75903, "epoch": 914} {"train_loss": -20.816274642944336, "global_step": 75904, "epoch": 914} {"train_loss": -20.813873291015625, "global_step": 75905, "epoch": 914} {"train_loss": -21.067861557006836, "global_step": 75906, "epoch": 914} {"train_loss": -21.02374267578125, "global_step": 75907, "epoch": 914} {"train_loss": -21.263111114501953, "global_step": 75908, "epoch": 914} {"train_loss": -20.987607955932617, "global_step": 75909, "epoch": 914} {"train_loss": -21.140499114990234, "global_step": 75910, "epoch": 914} {"train_loss": -20.913410186767578, "global_step": 75911, "epoch": 914} {"train_loss": -21.219959259033203, "global_step": 75912, "epoch": 914} {"train_loss": -21.138025283813477, "global_step": 75913, "epoch": 914} {"train_loss": -20.86573600769043, "global_step": 75914, "epoch": 914} {"train_loss": -21.148893356323242, "global_step": 75915, "epoch": 914} {"train_loss": -21.057119369506836, "global_step": 75916, "epoch": 914} {"train_loss": -21.88136100769043, "global_step": 75917, "epoch": 914} {"train_loss": -21.45097541809082, "global_step": 75918, "epoch": 914} {"train_loss": -21.040647506713867, "global_step": 75919, "epoch": 914} {"train_loss": -21.159168243408203, "global_step": 75920, "epoch": 914} {"train_loss": -21.194242477416992, "global_step": 75921, "epoch": 914} {"train_loss": -21.14887809753418, "global_step": 75922, "epoch": 914} {"train_loss": -21.084228515625, "global_step": 75923, "epoch": 914} {"train_loss": -20.77894401550293, "global_step": 75924, "epoch": 914} {"train_loss": -21.126239776611328, "global_step": 75925, "epoch": 914} {"train_loss": -20.83208465576172, "global_step": 75926, "epoch": 914} {"train_loss": -21.08232879638672, "global_step": 75927, "epoch": 914} {"train_loss": -21.068607330322266, "global_step": 75928, "epoch": 914} {"train_loss": -21.017566680908203, "global_step": 75929, "epoch": 914} {"train_loss": -21.23953628540039, "global_step": 75930, "epoch": 914} {"train_loss": -21.178951263427734, "global_step": 75931, "epoch": 914} {"train_loss": -21.13062858581543, "global_step": 75932, "epoch": 914} {"train_loss": -20.926097869873047, "global_step": 75933, "epoch": 914} {"train_loss": -21.05303955078125, "global_step": 75934, "epoch": 914} {"train_loss": -20.838041305541992, "global_step": 75935, "epoch": 914} {"train_loss": -20.93973731994629, "global_step": 75936, "epoch": 914} {"train_loss": -21.281156539916992, "global_step": 75937, "epoch": 914} {"train_loss": -20.7230281829834, "global_step": 75938, "epoch": 914} {"train_loss": -20.825016021728516, "global_step": 75939, "epoch": 914} {"train_loss": -21.131948471069336, "global_step": 75940, "epoch": 914} {"train_loss": -20.909244537353516, "global_step": 75941, "epoch": 914} {"train_loss": -21.130720138549805, "global_step": 75942, "epoch": 914} {"train_loss": -20.93062973022461, "global_step": 75943, "epoch": 914} {"train_loss": -21.04660029583667, "global_step": 75944, "epoch": 914, "val_loss": 5887323.5} {"train_loss": -20.6058406829834, "global_step": 75945, "epoch": 915} {"train_loss": -21.301267623901367, "global_step": 75946, "epoch": 915} {"train_loss": -20.712987899780273, "global_step": 75947, "epoch": 915} {"train_loss": -20.5229434967041, "global_step": 75948, "epoch": 915} {"train_loss": -20.442655563354492, "global_step": 75949, "epoch": 915} {"train_loss": -21.054250717163086, "global_step": 75950, "epoch": 915} {"train_loss": -20.93088150024414, "global_step": 75951, "epoch": 915} {"train_loss": -20.831689834594727, "global_step": 75952, "epoch": 915} {"train_loss": -20.846601486206055, "global_step": 75953, "epoch": 915} {"train_loss": -20.722030639648438, "global_step": 75954, "epoch": 915} {"train_loss": -20.822351455688477, "global_step": 75955, "epoch": 915} {"train_loss": -20.607303619384766, "global_step": 75956, "epoch": 915} {"train_loss": -20.634946823120117, "global_step": 75957, "epoch": 915} {"train_loss": -20.814437866210938, "global_step": 75958, "epoch": 915} {"train_loss": -20.661893844604492, "global_step": 75959, "epoch": 915} {"train_loss": -20.796579360961914, "global_step": 75960, "epoch": 915} {"train_loss": -21.028942108154297, "global_step": 75961, "epoch": 915} {"train_loss": -21.172330856323242, "global_step": 75962, "epoch": 915} {"train_loss": -20.43116569519043, "global_step": 75963, "epoch": 915} {"train_loss": -21.084314346313477, "global_step": 75964, "epoch": 915} {"train_loss": -21.13427734375, "global_step": 75965, "epoch": 915} {"train_loss": -21.104496002197266, "global_step": 75966, "epoch": 915} {"train_loss": -21.12741470336914, "global_step": 75967, "epoch": 915} {"train_loss": -21.05573081970215, "global_step": 75968, "epoch": 915} {"train_loss": -21.090818405151367, "global_step": 75969, "epoch": 915} {"train_loss": -21.11903190612793, "global_step": 75970, "epoch": 915} {"train_loss": -20.989727020263672, "global_step": 75971, "epoch": 915} {"train_loss": -21.043264389038086, "global_step": 75972, "epoch": 915} {"train_loss": -21.225553512573242, "global_step": 75973, "epoch": 915} {"train_loss": -20.95755958557129, "global_step": 75974, "epoch": 915} {"train_loss": -20.982816696166992, "global_step": 75975, "epoch": 915} {"train_loss": -20.99361801147461, "global_step": 75976, "epoch": 915} {"train_loss": -21.152555465698242, "global_step": 75977, "epoch": 915} {"train_loss": -21.38544273376465, "global_step": 75978, "epoch": 915} {"train_loss": -20.85216522216797, "global_step": 75979, "epoch": 915} {"train_loss": -20.678152084350586, "global_step": 75980, "epoch": 915} {"train_loss": -20.9537410736084, "global_step": 75981, "epoch": 915} {"train_loss": -20.907983779907227, "global_step": 75982, "epoch": 915} {"train_loss": -21.20575523376465, "global_step": 75983, "epoch": 915} {"train_loss": -21.067153930664062, "global_step": 75984, "epoch": 915} {"train_loss": -21.433425903320312, "global_step": 75985, "epoch": 915} {"train_loss": -20.62264633178711, "global_step": 75986, "epoch": 915} {"train_loss": -21.327085494995117, "global_step": 75987, "epoch": 915} {"train_loss": -21.04652214050293, "global_step": 75988, "epoch": 915} {"train_loss": -21.265609741210938, "global_step": 75989, "epoch": 915} {"train_loss": -21.036720275878906, "global_step": 75990, "epoch": 915} {"train_loss": -21.0501766204834, "global_step": 75991, "epoch": 915} {"train_loss": -20.98953628540039, "global_step": 75992, "epoch": 915} {"train_loss": -21.013246536254883, "global_step": 75993, "epoch": 915} {"train_loss": -21.155780792236328, "global_step": 75994, "epoch": 915} {"train_loss": -20.91267967224121, "global_step": 75995, "epoch": 915} {"train_loss": -21.118732452392578, "global_step": 75996, "epoch": 915} {"train_loss": -20.94293975830078, "global_step": 75997, "epoch": 915} {"train_loss": -21.34785270690918, "global_step": 75998, "epoch": 915} {"train_loss": -21.45288848876953, "global_step": 75999, "epoch": 915} {"train_loss": -21.2088680267334, "global_step": 76000, "epoch": 915} {"train_loss": -21.474727630615234, "global_step": 76001, "epoch": 915} {"train_loss": -21.625476837158203, "global_step": 76002, "epoch": 915} {"train_loss": -20.536027908325195, "global_step": 76003, "epoch": 915} {"train_loss": -20.98981285095215, "global_step": 76004, "epoch": 915} {"train_loss": -21.296781539916992, "global_step": 76005, "epoch": 915} {"train_loss": -20.868484497070312, "global_step": 76006, "epoch": 915} {"train_loss": -21.218050003051758, "global_step": 76007, "epoch": 915} {"train_loss": -21.062864303588867, "global_step": 76008, "epoch": 915} {"train_loss": -21.361303329467773, "global_step": 76009, "epoch": 915} {"train_loss": -20.807769775390625, "global_step": 76010, "epoch": 915} {"train_loss": -21.099834442138672, "global_step": 76011, "epoch": 915} {"train_loss": -20.923242568969727, "global_step": 76012, "epoch": 915} {"train_loss": -20.977405548095703, "global_step": 76013, "epoch": 915} {"train_loss": -21.320388793945312, "global_step": 76014, "epoch": 915} {"train_loss": -21.356048583984375, "global_step": 76015, "epoch": 915} {"train_loss": -21.331220626831055, "global_step": 76016, "epoch": 915} {"train_loss": -20.856054306030273, "global_step": 76017, "epoch": 915} {"train_loss": -21.062870025634766, "global_step": 76018, "epoch": 915} {"train_loss": -20.675216674804688, "global_step": 76019, "epoch": 915} {"train_loss": -21.224706649780273, "global_step": 76020, "epoch": 915} {"train_loss": -20.949691772460938, "global_step": 76021, "epoch": 915} {"train_loss": -20.961740493774414, "global_step": 76022, "epoch": 915} {"train_loss": -20.919713973999023, "global_step": 76023, "epoch": 915} {"train_loss": -21.044513702392578, "global_step": 76024, "epoch": 915} {"train_loss": -21.081344604492188, "global_step": 76025, "epoch": 915} {"train_loss": -21.070465087890625, "global_step": 76026, "epoch": 915} {"train_loss": -21.00804485183164, "global_step": 76027, "epoch": 915, "val_loss": 6077398.5} {"train_loss": -20.924936294555664, "global_step": 76028, "epoch": 916} {"train_loss": -20.76302146911621, "global_step": 76029, "epoch": 916} {"train_loss": -20.849695205688477, "global_step": 76030, "epoch": 916} {"train_loss": -20.993860244750977, "global_step": 76031, "epoch": 916} {"train_loss": -21.07923126220703, "global_step": 76032, "epoch": 916} {"train_loss": -20.87122344970703, "global_step": 76033, "epoch": 916} {"train_loss": -20.874155044555664, "global_step": 76034, "epoch": 916} {"train_loss": -21.045225143432617, "global_step": 76035, "epoch": 916} {"train_loss": -21.08843994140625, "global_step": 76036, "epoch": 916} {"train_loss": -20.641380310058594, "global_step": 76037, "epoch": 916} {"train_loss": -20.873106002807617, "global_step": 76038, "epoch": 916} {"train_loss": -21.133819580078125, "global_step": 76039, "epoch": 916} {"train_loss": -20.81325340270996, "global_step": 76040, "epoch": 916} {"train_loss": -21.32608413696289, "global_step": 76041, "epoch": 916} {"train_loss": -21.05990982055664, "global_step": 76042, "epoch": 916} {"train_loss": -21.4854736328125, "global_step": 76043, "epoch": 916} {"train_loss": -21.03920555114746, "global_step": 76044, "epoch": 916} {"train_loss": -21.173242568969727, "global_step": 76045, "epoch": 916} {"train_loss": -20.923770904541016, "global_step": 76046, "epoch": 916} {"train_loss": -20.877622604370117, "global_step": 76047, "epoch": 916} {"train_loss": -21.096487045288086, "global_step": 76048, "epoch": 916} {"train_loss": -21.42716407775879, "global_step": 76049, "epoch": 916} {"train_loss": -20.942337036132812, "global_step": 76050, "epoch": 916} {"train_loss": -20.9888973236084, "global_step": 76051, "epoch": 916} {"train_loss": -21.00978660583496, "global_step": 76052, "epoch": 916} {"train_loss": -21.02031898498535, "global_step": 76053, "epoch": 916} {"train_loss": -21.203296661376953, "global_step": 76054, "epoch": 916} {"train_loss": -20.83542251586914, "global_step": 76055, "epoch": 916} {"train_loss": -21.101072311401367, "global_step": 76056, "epoch": 916} {"train_loss": -20.991024017333984, "global_step": 76057, "epoch": 916} {"train_loss": -20.72078514099121, "global_step": 76058, "epoch": 916} {"train_loss": -20.995691299438477, "global_step": 76059, "epoch": 916} {"train_loss": -20.866355895996094, "global_step": 76060, "epoch": 916} {"train_loss": -20.999120712280273, "global_step": 76061, "epoch": 916} {"train_loss": -20.881305694580078, "global_step": 76062, "epoch": 916} {"train_loss": -20.905275344848633, "global_step": 76063, "epoch": 916} {"train_loss": -20.9447021484375, "global_step": 76064, "epoch": 916} {"train_loss": -20.92640495300293, "global_step": 76065, "epoch": 916} {"train_loss": -21.039688110351562, "global_step": 76066, "epoch": 916} {"train_loss": -20.903854370117188, "global_step": 76067, "epoch": 916} {"train_loss": -21.047224044799805, "global_step": 76068, "epoch": 916} {"train_loss": -21.32390785217285, "global_step": 76069, "epoch": 916} {"train_loss": -20.960018157958984, "global_step": 76070, "epoch": 916} {"train_loss": -20.545124053955078, "global_step": 76071, "epoch": 916} {"train_loss": -21.121402740478516, "global_step": 76072, "epoch": 916} {"train_loss": -21.536529541015625, "global_step": 76073, "epoch": 916} {"train_loss": -21.202632904052734, "global_step": 76074, "epoch": 916} {"train_loss": -20.840229034423828, "global_step": 76075, "epoch": 916} {"train_loss": -21.180356979370117, "global_step": 76076, "epoch": 916} {"train_loss": -21.186269760131836, "global_step": 76077, "epoch": 916} {"train_loss": -20.94242286682129, "global_step": 76078, "epoch": 916} {"train_loss": -21.14052963256836, "global_step": 76079, "epoch": 916} {"train_loss": -20.84163475036621, "global_step": 76080, "epoch": 916} {"train_loss": -21.293254852294922, "global_step": 76081, "epoch": 916} {"train_loss": -21.14081382751465, "global_step": 76082, "epoch": 916} {"train_loss": -20.45008659362793, "global_step": 76083, "epoch": 916} {"train_loss": -20.901702880859375, "global_step": 76084, "epoch": 916} {"train_loss": -20.9945011138916, "global_step": 76085, "epoch": 916} {"train_loss": -21.0041446685791, "global_step": 76086, "epoch": 916} {"train_loss": -21.131000518798828, "global_step": 76087, "epoch": 916} {"train_loss": -20.997594833374023, "global_step": 76088, "epoch": 916} {"train_loss": -20.751218795776367, "global_step": 76089, "epoch": 916} {"train_loss": -21.100032806396484, "global_step": 76090, "epoch": 916} {"train_loss": -21.388492584228516, "global_step": 76091, "epoch": 916} {"train_loss": -21.015811920166016, "global_step": 76092, "epoch": 916} {"train_loss": -21.075420379638672, "global_step": 76093, "epoch": 916} {"train_loss": -21.066007614135742, "global_step": 76094, "epoch": 916} {"train_loss": -21.297597885131836, "global_step": 76095, "epoch": 916} {"train_loss": -21.287832260131836, "global_step": 76096, "epoch": 916} {"train_loss": -21.54183006286621, "global_step": 76097, "epoch": 916} {"train_loss": -21.251134872436523, "global_step": 76098, "epoch": 916} {"train_loss": -21.04171371459961, "global_step": 76099, "epoch": 916} {"train_loss": -21.28732681274414, "global_step": 76100, "epoch": 916} {"train_loss": -20.834089279174805, "global_step": 76101, "epoch": 916} {"train_loss": -20.926584243774414, "global_step": 76102, "epoch": 916} {"train_loss": -20.967824935913086, "global_step": 76103, "epoch": 916} {"train_loss": -20.839263916015625, "global_step": 76104, "epoch": 916} {"train_loss": -20.974496841430664, "global_step": 76105, "epoch": 916} {"train_loss": -21.202966690063477, "global_step": 76106, "epoch": 916} {"train_loss": -20.784696578979492, "global_step": 76107, "epoch": 916} {"train_loss": -21.172456741333008, "global_step": 76108, "epoch": 916} {"train_loss": -21.062116622924805, "global_step": 76109, "epoch": 916} {"train_loss": -21.03717282306717, "global_step": 76110, "epoch": 916, "val_loss": 6081129.0} {"train_loss": -20.90988540649414, "global_step": 76111, "epoch": 917} {"train_loss": -21.06547737121582, "global_step": 76112, "epoch": 917} {"train_loss": -20.51273536682129, "global_step": 76113, "epoch": 917} {"train_loss": -20.614519119262695, "global_step": 76114, "epoch": 917} {"train_loss": -20.76454734802246, "global_step": 76115, "epoch": 917} {"train_loss": -20.704797744750977, "global_step": 76116, "epoch": 917} {"train_loss": -20.356168746948242, "global_step": 76117, "epoch": 917} {"train_loss": -21.115774154663086, "global_step": 76118, "epoch": 917} {"train_loss": -21.087371826171875, "global_step": 76119, "epoch": 917} {"train_loss": -20.792774200439453, "global_step": 76120, "epoch": 917} {"train_loss": -21.110944747924805, "global_step": 76121, "epoch": 917} {"train_loss": -21.09515953063965, "global_step": 76122, "epoch": 917} {"train_loss": -20.751760482788086, "global_step": 76123, "epoch": 917} {"train_loss": -20.737079620361328, "global_step": 76124, "epoch": 917} {"train_loss": -20.947620391845703, "global_step": 76125, "epoch": 917} {"train_loss": -20.89117431640625, "global_step": 76126, "epoch": 917} {"train_loss": -20.72454071044922, "global_step": 76127, "epoch": 917} {"train_loss": -21.132558822631836, "global_step": 76128, "epoch": 917} {"train_loss": -21.344568252563477, "global_step": 76129, "epoch": 917} {"train_loss": -20.694040298461914, "global_step": 76130, "epoch": 917} {"train_loss": -21.007503509521484, "global_step": 76131, "epoch": 917} {"train_loss": -21.169584274291992, "global_step": 76132, "epoch": 917} {"train_loss": -20.805709838867188, "global_step": 76133, "epoch": 917} {"train_loss": -20.888334274291992, "global_step": 76134, "epoch": 917} {"train_loss": -21.06081199645996, "global_step": 76135, "epoch": 917} {"train_loss": -21.064964294433594, "global_step": 76136, "epoch": 917} {"train_loss": -20.913959503173828, "global_step": 76137, "epoch": 917} {"train_loss": -21.316818237304688, "global_step": 76138, "epoch": 917} {"train_loss": -21.125534057617188, "global_step": 76139, "epoch": 917} {"train_loss": -21.278411865234375, "global_step": 76140, "epoch": 917} {"train_loss": -21.32640266418457, "global_step": 76141, "epoch": 917} {"train_loss": -21.123111724853516, "global_step": 76142, "epoch": 917} {"train_loss": -20.748641967773438, "global_step": 76143, "epoch": 917} {"train_loss": -21.50456428527832, "global_step": 76144, "epoch": 917} {"train_loss": -21.366527557373047, "global_step": 76145, "epoch": 917} {"train_loss": -20.80238914489746, "global_step": 76146, "epoch": 917} {"train_loss": -21.25798988342285, "global_step": 76147, "epoch": 917} {"train_loss": -20.606454849243164, "global_step": 76148, "epoch": 917} {"train_loss": -21.275989532470703, "global_step": 76149, "epoch": 917} {"train_loss": -21.099273681640625, "global_step": 76150, "epoch": 917} {"train_loss": -21.264114379882812, "global_step": 76151, "epoch": 917} {"train_loss": -21.12959861755371, "global_step": 76152, "epoch": 917} {"train_loss": -21.284164428710938, "global_step": 76153, "epoch": 917} {"train_loss": -20.792072296142578, "global_step": 76154, "epoch": 917} {"train_loss": -20.940645217895508, "global_step": 76155, "epoch": 917} {"train_loss": -21.198843002319336, "global_step": 76156, "epoch": 917} {"train_loss": -21.1363525390625, "global_step": 76157, "epoch": 917} {"train_loss": -21.422090530395508, "global_step": 76158, "epoch": 917} {"train_loss": -20.976985931396484, "global_step": 76159, "epoch": 917} {"train_loss": -21.22321319580078, "global_step": 76160, "epoch": 917} {"train_loss": -21.23702049255371, "global_step": 76161, "epoch": 917} {"train_loss": -21.15231704711914, "global_step": 76162, "epoch": 917} {"train_loss": -21.37862205505371, "global_step": 76163, "epoch": 917} {"train_loss": -21.249982833862305, "global_step": 76164, "epoch": 917} {"train_loss": -21.069456100463867, "global_step": 76165, "epoch": 917} {"train_loss": -20.78615951538086, "global_step": 76166, "epoch": 917} {"train_loss": -21.4387149810791, "global_step": 76167, "epoch": 917} {"train_loss": -21.0058650970459, "global_step": 76168, "epoch": 917} {"train_loss": -21.07779884338379, "global_step": 76169, "epoch": 917} {"train_loss": -20.97500991821289, "global_step": 76170, "epoch": 917} {"train_loss": -20.829965591430664, "global_step": 76171, "epoch": 917} {"train_loss": -21.06365394592285, "global_step": 76172, "epoch": 917} {"train_loss": -20.930631637573242, "global_step": 76173, "epoch": 917} {"train_loss": -20.921449661254883, "global_step": 76174, "epoch": 917} {"train_loss": -21.04817008972168, "global_step": 76175, "epoch": 917} {"train_loss": -20.97821044921875, "global_step": 76176, "epoch": 917} {"train_loss": -21.38402557373047, "global_step": 76177, "epoch": 917} {"train_loss": -21.13856315612793, "global_step": 76178, "epoch": 917} {"train_loss": -21.219377517700195, "global_step": 76179, "epoch": 917} {"train_loss": -20.83158302307129, "global_step": 76180, "epoch": 917} {"train_loss": -21.139766693115234, "global_step": 76181, "epoch": 917} {"train_loss": -21.105087280273438, "global_step": 76182, "epoch": 917} {"train_loss": -21.29429054260254, "global_step": 76183, "epoch": 917} {"train_loss": -20.95008659362793, "global_step": 76184, "epoch": 917} {"train_loss": -20.91615867614746, "global_step": 76185, "epoch": 917} {"train_loss": -21.20370864868164, "global_step": 76186, "epoch": 917} {"train_loss": -21.201852798461914, "global_step": 76187, "epoch": 917} {"train_loss": -20.772151947021484, "global_step": 76188, "epoch": 917} {"train_loss": -21.268009185791016, "global_step": 76189, "epoch": 917} {"train_loss": -21.34212303161621, "global_step": 76190, "epoch": 917} {"train_loss": -21.2504940032959, "global_step": 76191, "epoch": 917} {"train_loss": -21.298599243164062, "global_step": 76192, "epoch": 917} {"train_loss": -21.044652686061628, "global_step": 76193, "epoch": 917, "val_loss": 6213709.0} {"train_loss": -20.581296920776367, "global_step": 76194, "epoch": 918} {"train_loss": -21.107297897338867, "global_step": 76195, "epoch": 918} {"train_loss": -21.120920181274414, "global_step": 76196, "epoch": 918} {"train_loss": -20.653217315673828, "global_step": 76197, "epoch": 918} {"train_loss": -20.738807678222656, "global_step": 76198, "epoch": 918} {"train_loss": -20.763898849487305, "global_step": 76199, "epoch": 918} {"train_loss": -20.99007797241211, "global_step": 76200, "epoch": 918} {"train_loss": -21.191394805908203, "global_step": 76201, "epoch": 918} {"train_loss": -20.808176040649414, "global_step": 76202, "epoch": 918} {"train_loss": -20.70623779296875, "global_step": 76203, "epoch": 918} {"train_loss": -21.244918823242188, "global_step": 76204, "epoch": 918} {"train_loss": -21.023984909057617, "global_step": 76205, "epoch": 918} {"train_loss": -21.185415267944336, "global_step": 76206, "epoch": 918} {"train_loss": -21.006420135498047, "global_step": 76207, "epoch": 918} {"train_loss": -21.098949432373047, "global_step": 76208, "epoch": 918} {"train_loss": -20.729215621948242, "global_step": 76209, "epoch": 918} {"train_loss": -20.984405517578125, "global_step": 76210, "epoch": 918} {"train_loss": -21.03898048400879, "global_step": 76211, "epoch": 918} {"train_loss": -21.04935073852539, "global_step": 76212, "epoch": 918} {"train_loss": -20.370933532714844, "global_step": 76213, "epoch": 918} {"train_loss": -21.13270378112793, "global_step": 76214, "epoch": 918} {"train_loss": -21.425128936767578, "global_step": 76215, "epoch": 918} {"train_loss": -21.000091552734375, "global_step": 76216, "epoch": 918} {"train_loss": -20.965160369873047, "global_step": 76217, "epoch": 918} {"train_loss": -21.30450439453125, "global_step": 76218, "epoch": 918} {"train_loss": -20.575958251953125, "global_step": 76219, "epoch": 918} {"train_loss": -21.194833755493164, "global_step": 76220, "epoch": 918} {"train_loss": -21.118642807006836, "global_step": 76221, "epoch": 918} {"train_loss": -20.881183624267578, "global_step": 76222, "epoch": 918} {"train_loss": -20.785417556762695, "global_step": 76223, "epoch": 918} {"train_loss": -21.189035415649414, "global_step": 76224, "epoch": 918} {"train_loss": -21.057357788085938, "global_step": 76225, "epoch": 918} {"train_loss": -21.279932022094727, "global_step": 76226, "epoch": 918} {"train_loss": -21.356985092163086, "global_step": 76227, "epoch": 918} {"train_loss": -21.142698287963867, "global_step": 76228, "epoch": 918} {"train_loss": -21.245819091796875, "global_step": 76229, "epoch": 918} {"train_loss": -21.143993377685547, "global_step": 76230, "epoch": 918} {"train_loss": -21.176973342895508, "global_step": 76231, "epoch": 918} {"train_loss": -20.901588439941406, "global_step": 76232, "epoch": 918} {"train_loss": -21.1407470703125, "global_step": 76233, "epoch": 918} {"train_loss": -21.333209991455078, "global_step": 76234, "epoch": 918} {"train_loss": -21.149017333984375, "global_step": 76235, "epoch": 918} {"train_loss": -21.21187400817871, "global_step": 76236, "epoch": 918} {"train_loss": -21.075010299682617, "global_step": 76237, "epoch": 918} {"train_loss": -21.023727416992188, "global_step": 76238, "epoch": 918} {"train_loss": -20.913150787353516, "global_step": 76239, "epoch": 918} {"train_loss": -21.438528060913086, "global_step": 76240, "epoch": 918} {"train_loss": -20.900938034057617, "global_step": 76241, "epoch": 918} {"train_loss": -20.84589958190918, "global_step": 76242, "epoch": 918} {"train_loss": -20.922468185424805, "global_step": 76243, "epoch": 918} {"train_loss": -20.732669830322266, "global_step": 76244, "epoch": 918} {"train_loss": -20.872390747070312, "global_step": 76245, "epoch": 918} {"train_loss": -20.916645050048828, "global_step": 76246, "epoch": 918} {"train_loss": -20.763029098510742, "global_step": 76247, "epoch": 918} {"train_loss": -21.114107131958008, "global_step": 76248, "epoch": 918} {"train_loss": -21.027814865112305, "global_step": 76249, "epoch": 918} {"train_loss": -20.606046676635742, "global_step": 76250, "epoch": 918} {"train_loss": -20.827922821044922, "global_step": 76251, "epoch": 918} {"train_loss": -20.878931045532227, "global_step": 76252, "epoch": 918} {"train_loss": -20.718475341796875, "global_step": 76253, "epoch": 918} {"train_loss": -21.0216121673584, "global_step": 76254, "epoch": 918} {"train_loss": -21.122421264648438, "global_step": 76255, "epoch": 918} {"train_loss": -20.783138275146484, "global_step": 76256, "epoch": 918} {"train_loss": -21.251527786254883, "global_step": 76257, "epoch": 918} {"train_loss": -20.699642181396484, "global_step": 76258, "epoch": 918} {"train_loss": -21.148481369018555, "global_step": 76259, "epoch": 918} {"train_loss": -20.652456283569336, "global_step": 76260, "epoch": 918} {"train_loss": -20.94410514831543, "global_step": 76261, "epoch": 918} {"train_loss": -21.252050399780273, "global_step": 76262, "epoch": 918} {"train_loss": -21.38751792907715, "global_step": 76263, "epoch": 918} {"train_loss": -21.307668685913086, "global_step": 76264, "epoch": 918} {"train_loss": -21.038333892822266, "global_step": 76265, "epoch": 918} {"train_loss": -20.957183837890625, "global_step": 76266, "epoch": 918} {"train_loss": -21.33134651184082, "global_step": 76267, "epoch": 918} {"train_loss": -21.139524459838867, "global_step": 76268, "epoch": 918} {"train_loss": -21.156719207763672, "global_step": 76269, "epoch": 918} {"train_loss": -21.074504852294922, "global_step": 76270, "epoch": 918} {"train_loss": -21.258705139160156, "global_step": 76271, "epoch": 918} {"train_loss": -21.125717163085938, "global_step": 76272, "epoch": 918} {"train_loss": -21.2480525970459, "global_step": 76273, "epoch": 918} {"train_loss": -21.052715301513672, "global_step": 76274, "epoch": 918} {"train_loss": -21.29270362854004, "global_step": 76275, "epoch": 918} {"train_loss": -21.024317247321807, "global_step": 76276, "epoch": 918, "val_loss": 6047248.5} {"train_loss": -20.40190887451172, "global_step": 76277, "epoch": 919} {"train_loss": -20.308563232421875, "global_step": 76278, "epoch": 919} {"train_loss": -21.161495208740234, "global_step": 76279, "epoch": 919} {"train_loss": -20.477428436279297, "global_step": 76280, "epoch": 919} {"train_loss": -20.717016220092773, "global_step": 76281, "epoch": 919} {"train_loss": -21.255186080932617, "global_step": 76282, "epoch": 919} {"train_loss": -20.755210876464844, "global_step": 76283, "epoch": 919} {"train_loss": -20.755126953125, "global_step": 76284, "epoch": 919} {"train_loss": -21.082035064697266, "global_step": 76285, "epoch": 919} {"train_loss": -20.81524658203125, "global_step": 76286, "epoch": 919} {"train_loss": -21.237884521484375, "global_step": 76287, "epoch": 919} {"train_loss": -21.013988494873047, "global_step": 76288, "epoch": 919} {"train_loss": -20.727474212646484, "global_step": 76289, "epoch": 919} {"train_loss": -20.9396915435791, "global_step": 76290, "epoch": 919} {"train_loss": -20.36244773864746, "global_step": 76291, "epoch": 919} {"train_loss": -21.125011444091797, "global_step": 76292, "epoch": 919} {"train_loss": -21.16297721862793, "global_step": 76293, "epoch": 919} {"train_loss": -20.793468475341797, "global_step": 76294, "epoch": 919} {"train_loss": -21.02016830444336, "global_step": 76295, "epoch": 919} {"train_loss": -20.92254638671875, "global_step": 76296, "epoch": 919} {"train_loss": -20.624765396118164, "global_step": 76297, "epoch": 919} {"train_loss": -21.31156349182129, "global_step": 76298, "epoch": 919} {"train_loss": -21.323562622070312, "global_step": 76299, "epoch": 919} {"train_loss": -21.014249801635742, "global_step": 76300, "epoch": 919} {"train_loss": -21.064971923828125, "global_step": 76301, "epoch": 919} {"train_loss": -20.9914608001709, "global_step": 76302, "epoch": 919} {"train_loss": -21.166006088256836, "global_step": 76303, "epoch": 919} {"train_loss": -21.026357650756836, "global_step": 76304, "epoch": 919} {"train_loss": -21.287372589111328, "global_step": 76305, "epoch": 919} {"train_loss": -20.872102737426758, "global_step": 76306, "epoch": 919} {"train_loss": -21.047922134399414, "global_step": 76307, "epoch": 919} {"train_loss": -21.43222427368164, "global_step": 76308, "epoch": 919} {"train_loss": -21.398120880126953, "global_step": 76309, "epoch": 919} {"train_loss": -21.049724578857422, "global_step": 76310, "epoch": 919} {"train_loss": -20.642269134521484, "global_step": 76311, "epoch": 919} {"train_loss": -20.942703247070312, "global_step": 76312, "epoch": 919} {"train_loss": -21.428455352783203, "global_step": 76313, "epoch": 919} {"train_loss": -21.158653259277344, "global_step": 76314, "epoch": 919} {"train_loss": -20.98952293395996, "global_step": 76315, "epoch": 919} {"train_loss": -20.828168869018555, "global_step": 76316, "epoch": 919} {"train_loss": -21.046253204345703, "global_step": 76317, "epoch": 919} {"train_loss": -20.605192184448242, "global_step": 76318, "epoch": 919} {"train_loss": -20.973583221435547, "global_step": 76319, "epoch": 919} {"train_loss": -20.858051300048828, "global_step": 76320, "epoch": 919} {"train_loss": -20.942434310913086, "global_step": 76321, "epoch": 919} {"train_loss": -21.2486515045166, "global_step": 76322, "epoch": 919} {"train_loss": -20.6568660736084, "global_step": 76323, "epoch": 919} {"train_loss": -21.374582290649414, "global_step": 76324, "epoch": 919} {"train_loss": -21.365156173706055, "global_step": 76325, "epoch": 919} {"train_loss": -21.206207275390625, "global_step": 76326, "epoch": 919} {"train_loss": -20.966779708862305, "global_step": 76327, "epoch": 919} {"train_loss": -21.302186965942383, "global_step": 76328, "epoch": 919} {"train_loss": -20.989540100097656, "global_step": 76329, "epoch": 919} {"train_loss": -21.164539337158203, "global_step": 76330, "epoch": 919} {"train_loss": -21.240636825561523, "global_step": 76331, "epoch": 919} {"train_loss": -21.080467224121094, "global_step": 76332, "epoch": 919} {"train_loss": -21.132160186767578, "global_step": 76333, "epoch": 919} {"train_loss": -21.100858688354492, "global_step": 76334, "epoch": 919} {"train_loss": -20.919281005859375, "global_step": 76335, "epoch": 919} {"train_loss": -21.434125900268555, "global_step": 76336, "epoch": 919} {"train_loss": -21.165008544921875, "global_step": 76337, "epoch": 919} {"train_loss": -20.73779296875, "global_step": 76338, "epoch": 919} {"train_loss": -21.08319091796875, "global_step": 76339, "epoch": 919} {"train_loss": -20.880287170410156, "global_step": 76340, "epoch": 919} {"train_loss": -20.93433380126953, "global_step": 76341, "epoch": 919} {"train_loss": -21.224655151367188, "global_step": 76342, "epoch": 919} {"train_loss": -21.177989959716797, "global_step": 76343, "epoch": 919} {"train_loss": -20.817413330078125, "global_step": 76344, "epoch": 919} {"train_loss": -21.29043960571289, "global_step": 76345, "epoch": 919} {"train_loss": -20.797962188720703, "global_step": 76346, "epoch": 919} {"train_loss": -20.72356414794922, "global_step": 76347, "epoch": 919} {"train_loss": -20.835548400878906, "global_step": 76348, "epoch": 919} {"train_loss": -21.114181518554688, "global_step": 76349, "epoch": 919} {"train_loss": -21.129987716674805, "global_step": 76350, "epoch": 919} {"train_loss": -21.005634307861328, "global_step": 76351, "epoch": 919} {"train_loss": -21.13435173034668, "global_step": 76352, "epoch": 919} {"train_loss": -21.049240112304688, "global_step": 76353, "epoch": 919} {"train_loss": -21.168689727783203, "global_step": 76354, "epoch": 919} {"train_loss": -21.2239933013916, "global_step": 76355, "epoch": 919} {"train_loss": -20.971328735351562, "global_step": 76356, "epoch": 919} {"train_loss": -20.930421829223633, "global_step": 76357, "epoch": 919} {"train_loss": -21.18229103088379, "global_step": 76358, "epoch": 919} {"train_loss": -20.98529916786286, "global_step": 76359, "epoch": 919, "val_loss": 5894753.0} {"train_loss": -20.624113082885742, "global_step": 76360, "epoch": 920} {"train_loss": -20.461759567260742, "global_step": 76361, "epoch": 920} {"train_loss": -20.455183029174805, "global_step": 76362, "epoch": 920} {"train_loss": -19.800546646118164, "global_step": 76363, "epoch": 920} {"train_loss": -20.79837989807129, "global_step": 76364, "epoch": 920} {"train_loss": -20.29377555847168, "global_step": 76365, "epoch": 920} {"train_loss": -20.71063804626465, "global_step": 76366, "epoch": 920} {"train_loss": -20.30921173095703, "global_step": 76367, "epoch": 920} {"train_loss": -20.403841018676758, "global_step": 76368, "epoch": 920} {"train_loss": -20.388120651245117, "global_step": 76369, "epoch": 920} {"train_loss": -21.225875854492188, "global_step": 76370, "epoch": 920} {"train_loss": -20.55264663696289, "global_step": 76371, "epoch": 920} {"train_loss": -20.762157440185547, "global_step": 76372, "epoch": 920} {"train_loss": -21.13348388671875, "global_step": 76373, "epoch": 920} {"train_loss": -20.58477020263672, "global_step": 76374, "epoch": 920} {"train_loss": -20.647573471069336, "global_step": 76375, "epoch": 920} {"train_loss": -20.632766723632812, "global_step": 76376, "epoch": 920} {"train_loss": -20.74671173095703, "global_step": 76377, "epoch": 920} {"train_loss": -21.11781120300293, "global_step": 76378, "epoch": 920} {"train_loss": -20.835657119750977, "global_step": 76379, "epoch": 920} {"train_loss": -20.958829879760742, "global_step": 76380, "epoch": 920} {"train_loss": -20.850305557250977, "global_step": 76381, "epoch": 920} {"train_loss": -20.692848205566406, "global_step": 76382, "epoch": 920} {"train_loss": -21.33224868774414, "global_step": 76383, "epoch": 920} {"train_loss": -20.94515037536621, "global_step": 76384, "epoch": 920} {"train_loss": -20.937437057495117, "global_step": 76385, "epoch": 920} {"train_loss": -21.409391403198242, "global_step": 76386, "epoch": 920} {"train_loss": -20.935693740844727, "global_step": 76387, "epoch": 920} {"train_loss": -21.055326461791992, "global_step": 76388, "epoch": 920} {"train_loss": -20.956830978393555, "global_step": 76389, "epoch": 920} {"train_loss": -21.086015701293945, "global_step": 76390, "epoch": 920} {"train_loss": -21.54298210144043, "global_step": 76391, "epoch": 920} {"train_loss": -20.7474365234375, "global_step": 76392, "epoch": 920} {"train_loss": -21.149839401245117, "global_step": 76393, "epoch": 920} {"train_loss": -21.179094314575195, "global_step": 76394, "epoch": 920} {"train_loss": -21.157800674438477, "global_step": 76395, "epoch": 920} {"train_loss": -20.8746337890625, "global_step": 76396, "epoch": 920} {"train_loss": -21.08809471130371, "global_step": 76397, "epoch": 920} {"train_loss": -21.259525299072266, "global_step": 76398, "epoch": 920} {"train_loss": -21.098690032958984, "global_step": 76399, "epoch": 920} {"train_loss": -20.854740142822266, "global_step": 76400, "epoch": 920} {"train_loss": -20.989398956298828, "global_step": 76401, "epoch": 920} {"train_loss": -21.427968978881836, "global_step": 76402, "epoch": 920} {"train_loss": -21.55711555480957, "global_step": 76403, "epoch": 920} {"train_loss": -21.296323776245117, "global_step": 76404, "epoch": 920} {"train_loss": -21.393918991088867, "global_step": 76405, "epoch": 920} {"train_loss": -21.379058837890625, "global_step": 76406, "epoch": 920} {"train_loss": -21.283361434936523, "global_step": 76407, "epoch": 920} {"train_loss": -21.0324649810791, "global_step": 76408, "epoch": 920} {"train_loss": -21.034690856933594, "global_step": 76409, "epoch": 920} {"train_loss": -20.718122482299805, "global_step": 76410, "epoch": 920} {"train_loss": -20.889713287353516, "global_step": 76411, "epoch": 920} {"train_loss": -21.0716495513916, "global_step": 76412, "epoch": 920} {"train_loss": -21.249549865722656, "global_step": 76413, "epoch": 920} {"train_loss": -21.059894561767578, "global_step": 76414, "epoch": 920} {"train_loss": -20.6910400390625, "global_step": 76415, "epoch": 920} {"train_loss": -21.039968490600586, "global_step": 76416, "epoch": 920} {"train_loss": -21.1026554107666, "global_step": 76417, "epoch": 920} {"train_loss": -20.79258155822754, "global_step": 76418, "epoch": 920} {"train_loss": -21.2889461517334, "global_step": 76419, "epoch": 920} {"train_loss": -20.71588706970215, "global_step": 76420, "epoch": 920} {"train_loss": -21.215417861938477, "global_step": 76421, "epoch": 920} {"train_loss": -20.908004760742188, "global_step": 76422, "epoch": 920} {"train_loss": -21.314794540405273, "global_step": 76423, "epoch": 920} {"train_loss": -21.108015060424805, "global_step": 76424, "epoch": 920} {"train_loss": -20.93662452697754, "global_step": 76425, "epoch": 920} {"train_loss": -20.775297164916992, "global_step": 76426, "epoch": 920} {"train_loss": -20.758649826049805, "global_step": 76427, "epoch": 920} {"train_loss": -20.935077667236328, "global_step": 76428, "epoch": 920} {"train_loss": -20.905630111694336, "global_step": 76429, "epoch": 920} {"train_loss": -21.049253463745117, "global_step": 76430, "epoch": 920} {"train_loss": -21.128305435180664, "global_step": 76431, "epoch": 920} {"train_loss": -21.212366104125977, "global_step": 76432, "epoch": 920} {"train_loss": -20.740501403808594, "global_step": 76433, "epoch": 920} {"train_loss": -20.975616455078125, "global_step": 76434, "epoch": 920} {"train_loss": -20.912399291992188, "global_step": 76435, "epoch": 920} {"train_loss": -21.242788314819336, "global_step": 76436, "epoch": 920} {"train_loss": -20.988571166992188, "global_step": 76437, "epoch": 920} {"train_loss": -20.84784507751465, "global_step": 76438, "epoch": 920} {"train_loss": -21.169790267944336, "global_step": 76439, "epoch": 920} {"train_loss": -21.233928680419922, "global_step": 76440, "epoch": 920} {"train_loss": -21.001619338989258, "global_step": 76441, "epoch": 920} {"train_loss": -20.962696420141015, "global_step": 76442, "epoch": 920, "val_loss": 6273388.0} {"train_loss": -20.99187660217285, "global_step": 76443, "epoch": 921} {"train_loss": -21.020788192749023, "global_step": 76444, "epoch": 921} {"train_loss": -20.788768768310547, "global_step": 76445, "epoch": 921} {"train_loss": -20.91524314880371, "global_step": 76446, "epoch": 921} {"train_loss": -20.683774948120117, "global_step": 76447, "epoch": 921} {"train_loss": -21.334951400756836, "global_step": 76448, "epoch": 921} {"train_loss": -21.042320251464844, "global_step": 76449, "epoch": 921} {"train_loss": -21.189096450805664, "global_step": 76450, "epoch": 921} {"train_loss": -21.3137149810791, "global_step": 76451, "epoch": 921} {"train_loss": -20.60736083984375, "global_step": 76452, "epoch": 921} {"train_loss": -20.921344757080078, "global_step": 76453, "epoch": 921} {"train_loss": -21.10986328125, "global_step": 76454, "epoch": 921} {"train_loss": -20.857431411743164, "global_step": 76455, "epoch": 921} {"train_loss": -20.942747116088867, "global_step": 76456, "epoch": 921} {"train_loss": -21.02876091003418, "global_step": 76457, "epoch": 921} {"train_loss": -20.810123443603516, "global_step": 76458, "epoch": 921} {"train_loss": -21.123741149902344, "global_step": 76459, "epoch": 921} {"train_loss": -21.239255905151367, "global_step": 76460, "epoch": 921} {"train_loss": -20.471691131591797, "global_step": 76461, "epoch": 921} {"train_loss": -20.962270736694336, "global_step": 76462, "epoch": 921} {"train_loss": -21.094640731811523, "global_step": 76463, "epoch": 921} {"train_loss": -21.04572868347168, "global_step": 76464, "epoch": 921} {"train_loss": -21.141036987304688, "global_step": 76465, "epoch": 921} {"train_loss": -20.88187599182129, "global_step": 76466, "epoch": 921} {"train_loss": -20.961362838745117, "global_step": 76467, "epoch": 921} {"train_loss": -21.181007385253906, "global_step": 76468, "epoch": 921} {"train_loss": -20.84039306640625, "global_step": 76469, "epoch": 921} {"train_loss": -20.78957748413086, "global_step": 76470, "epoch": 921} {"train_loss": -20.984338760375977, "global_step": 76471, "epoch": 921} {"train_loss": -20.724863052368164, "global_step": 76472, "epoch": 921} {"train_loss": -21.088354110717773, "global_step": 76473, "epoch": 921} {"train_loss": -20.856464385986328, "global_step": 76474, "epoch": 921} {"train_loss": -21.08223533630371, "global_step": 76475, "epoch": 921} {"train_loss": -21.37552261352539, "global_step": 76476, "epoch": 921} {"train_loss": -21.11079978942871, "global_step": 76477, "epoch": 921} {"train_loss": -21.263259887695312, "global_step": 76478, "epoch": 921} {"train_loss": -21.00164222717285, "global_step": 76479, "epoch": 921} {"train_loss": -21.492122650146484, "global_step": 76480, "epoch": 921} {"train_loss": -20.758007049560547, "global_step": 76481, "epoch": 921} {"train_loss": -21.226163864135742, "global_step": 76482, "epoch": 921} {"train_loss": -21.08009147644043, "global_step": 76483, "epoch": 921} {"train_loss": -20.553815841674805, "global_step": 76484, "epoch": 921} {"train_loss": -20.86277198791504, "global_step": 76485, "epoch": 921} {"train_loss": -21.267566680908203, "global_step": 76486, "epoch": 921} {"train_loss": -20.91878318786621, "global_step": 76487, "epoch": 921} {"train_loss": -21.19573402404785, "global_step": 76488, "epoch": 921} {"train_loss": -20.773828506469727, "global_step": 76489, "epoch": 921} {"train_loss": -21.032934188842773, "global_step": 76490, "epoch": 921} {"train_loss": -21.612226486206055, "global_step": 76491, "epoch": 921} {"train_loss": -21.383758544921875, "global_step": 76492, "epoch": 921} {"train_loss": -20.910381317138672, "global_step": 76493, "epoch": 921} {"train_loss": -21.291963577270508, "global_step": 76494, "epoch": 921} {"train_loss": -20.600040435791016, "global_step": 76495, "epoch": 921} {"train_loss": -21.010055541992188, "global_step": 76496, "epoch": 921} {"train_loss": -21.02428436279297, "global_step": 76497, "epoch": 921} {"train_loss": -20.92695426940918, "global_step": 76498, "epoch": 921} {"train_loss": -21.08201026916504, "global_step": 76499, "epoch": 921} {"train_loss": -21.203624725341797, "global_step": 76500, "epoch": 921} {"train_loss": -21.177156448364258, "global_step": 76501, "epoch": 921} {"train_loss": -20.907608032226562, "global_step": 76502, "epoch": 921} {"train_loss": -21.198274612426758, "global_step": 76503, "epoch": 921} {"train_loss": -21.129104614257812, "global_step": 76504, "epoch": 921} {"train_loss": -21.220399856567383, "global_step": 76505, "epoch": 921} {"train_loss": -21.289243698120117, "global_step": 76506, "epoch": 921} {"train_loss": -20.984851837158203, "global_step": 76507, "epoch": 921} {"train_loss": -21.322568893432617, "global_step": 76508, "epoch": 921} {"train_loss": -21.1972599029541, "global_step": 76509, "epoch": 921} {"train_loss": -21.329017639160156, "global_step": 76510, "epoch": 921} {"train_loss": -21.35268211364746, "global_step": 76511, "epoch": 921} {"train_loss": -21.20970344543457, "global_step": 76512, "epoch": 921} {"train_loss": -21.187421798706055, "global_step": 76513, "epoch": 921} {"train_loss": -21.063278198242188, "global_step": 76514, "epoch": 921} {"train_loss": -21.10108184814453, "global_step": 76515, "epoch": 921} {"train_loss": -21.182727813720703, "global_step": 76516, "epoch": 921} {"train_loss": -21.08246421813965, "global_step": 76517, "epoch": 921} {"train_loss": -20.934391021728516, "global_step": 76518, "epoch": 921} {"train_loss": -21.10540199279785, "global_step": 76519, "epoch": 921} {"train_loss": -21.18048095703125, "global_step": 76520, "epoch": 921} {"train_loss": -21.05782127380371, "global_step": 76521, "epoch": 921} {"train_loss": -20.864973068237305, "global_step": 76522, "epoch": 921} {"train_loss": -20.921354293823242, "global_step": 76523, "epoch": 921} {"train_loss": -20.686037063598633, "global_step": 76524, "epoch": 921} {"train_loss": -21.03553254920316, "global_step": 76525, "epoch": 921, "val_loss": 6043103.5} {"train_loss": -20.990976333618164, "global_step": 76526, "epoch": 922} {"train_loss": -21.233606338500977, "global_step": 76527, "epoch": 922} {"train_loss": -21.014333724975586, "global_step": 76528, "epoch": 922} {"train_loss": -20.82491111755371, "global_step": 76529, "epoch": 922} {"train_loss": -20.882535934448242, "global_step": 76530, "epoch": 922} {"train_loss": -21.286457061767578, "global_step": 76531, "epoch": 922} {"train_loss": -20.82094383239746, "global_step": 76532, "epoch": 922} {"train_loss": -20.818204879760742, "global_step": 76533, "epoch": 922} {"train_loss": -20.903690338134766, "global_step": 76534, "epoch": 922} {"train_loss": -20.711450576782227, "global_step": 76535, "epoch": 922} {"train_loss": -21.016433715820312, "global_step": 76536, "epoch": 922} {"train_loss": -21.116254806518555, "global_step": 76537, "epoch": 922} {"train_loss": -21.345111846923828, "global_step": 76538, "epoch": 922} {"train_loss": -20.82745361328125, "global_step": 76539, "epoch": 922} {"train_loss": -21.08871841430664, "global_step": 76540, "epoch": 922} {"train_loss": -21.241270065307617, "global_step": 76541, "epoch": 922} {"train_loss": -20.755117416381836, "global_step": 76542, "epoch": 922} {"train_loss": -21.05777359008789, "global_step": 76543, "epoch": 922} {"train_loss": -21.18707275390625, "global_step": 76544, "epoch": 922} {"train_loss": -21.085058212280273, "global_step": 76545, "epoch": 922} {"train_loss": -21.054906845092773, "global_step": 76546, "epoch": 922} {"train_loss": -21.073118209838867, "global_step": 76547, "epoch": 922} {"train_loss": -21.01369285583496, "global_step": 76548, "epoch": 922} {"train_loss": -21.255435943603516, "global_step": 76549, "epoch": 922} {"train_loss": -21.151233673095703, "global_step": 76550, "epoch": 922} {"train_loss": -21.038755416870117, "global_step": 76551, "epoch": 922} {"train_loss": -21.077253341674805, "global_step": 76552, "epoch": 922} {"train_loss": -21.077505111694336, "global_step": 76553, "epoch": 922} {"train_loss": -21.237735748291016, "global_step": 76554, "epoch": 922} {"train_loss": -21.28297233581543, "global_step": 76555, "epoch": 922} {"train_loss": -21.39153289794922, "global_step": 76556, "epoch": 922} {"train_loss": -20.897903442382812, "global_step": 76557, "epoch": 922} {"train_loss": -21.449748992919922, "global_step": 76558, "epoch": 922} {"train_loss": -20.922544479370117, "global_step": 76559, "epoch": 922} {"train_loss": -21.253509521484375, "global_step": 76560, "epoch": 922} {"train_loss": -20.989377975463867, "global_step": 76561, "epoch": 922} {"train_loss": -21.43089485168457, "global_step": 76562, "epoch": 922} {"train_loss": -21.037918090820312, "global_step": 76563, "epoch": 922} {"train_loss": -21.019580841064453, "global_step": 76564, "epoch": 922} {"train_loss": -21.430326461791992, "global_step": 76565, "epoch": 922} {"train_loss": -21.142871856689453, "global_step": 76566, "epoch": 922} {"train_loss": -21.145069122314453, "global_step": 76567, "epoch": 922} {"train_loss": -21.222169876098633, "global_step": 76568, "epoch": 922} {"train_loss": -21.0825138092041, "global_step": 76569, "epoch": 922} {"train_loss": -21.212820053100586, "global_step": 76570, "epoch": 922} {"train_loss": -21.24492835998535, "global_step": 76571, "epoch": 922} {"train_loss": -21.0622501373291, "global_step": 76572, "epoch": 922} {"train_loss": -21.47962760925293, "global_step": 76573, "epoch": 922} {"train_loss": -21.10470962524414, "global_step": 76574, "epoch": 922} {"train_loss": -20.69270896911621, "global_step": 76575, "epoch": 922} {"train_loss": -20.68460464477539, "global_step": 76576, "epoch": 922} {"train_loss": -21.11054801940918, "global_step": 76577, "epoch": 922} {"train_loss": -21.026500701904297, "global_step": 76578, "epoch": 922} {"train_loss": -21.08528709411621, "global_step": 76579, "epoch": 922} {"train_loss": -21.177227020263672, "global_step": 76580, "epoch": 922} {"train_loss": -20.940288543701172, "global_step": 76581, "epoch": 922} {"train_loss": -21.11100196838379, "global_step": 76582, "epoch": 922} {"train_loss": -21.27201271057129, "global_step": 76583, "epoch": 922} {"train_loss": -20.826597213745117, "global_step": 76584, "epoch": 922} {"train_loss": -20.96042251586914, "global_step": 76585, "epoch": 922} {"train_loss": -21.31768226623535, "global_step": 76586, "epoch": 922} {"train_loss": -21.055110931396484, "global_step": 76587, "epoch": 922} {"train_loss": -20.78742218017578, "global_step": 76588, "epoch": 922} {"train_loss": -20.95387077331543, "global_step": 76589, "epoch": 922} {"train_loss": -21.30272102355957, "global_step": 76590, "epoch": 922} {"train_loss": -21.09563636779785, "global_step": 76591, "epoch": 922} {"train_loss": -21.116315841674805, "global_step": 76592, "epoch": 922} {"train_loss": -21.273788452148438, "global_step": 76593, "epoch": 922} {"train_loss": -21.16054344177246, "global_step": 76594, "epoch": 922} {"train_loss": -21.07073974609375, "global_step": 76595, "epoch": 922} {"train_loss": -20.95088005065918, "global_step": 76596, "epoch": 922} {"train_loss": -20.91908836364746, "global_step": 76597, "epoch": 922} {"train_loss": -21.240671157836914, "global_step": 76598, "epoch": 922} {"train_loss": -20.679121017456055, "global_step": 76599, "epoch": 922} {"train_loss": -20.515417098999023, "global_step": 76600, "epoch": 922} {"train_loss": -21.3408145904541, "global_step": 76601, "epoch": 922} {"train_loss": -20.967321395874023, "global_step": 76602, "epoch": 922} {"train_loss": -20.905912399291992, "global_step": 76603, "epoch": 922} {"train_loss": -21.013824462890625, "global_step": 76604, "epoch": 922} {"train_loss": -21.06686019897461, "global_step": 76605, "epoch": 922} {"train_loss": -20.866796493530273, "global_step": 76606, "epoch": 922} {"train_loss": -20.952350616455078, "global_step": 76607, "epoch": 922} {"train_loss": -21.076589285609234, "global_step": 76608, "epoch": 922, "val_loss": 6031061.5} {"train_loss": -20.87502670288086, "global_step": 76609, "epoch": 923} {"train_loss": -20.783981323242188, "global_step": 76610, "epoch": 923} {"train_loss": -20.910905838012695, "global_step": 76611, "epoch": 923} {"train_loss": -20.966001510620117, "global_step": 76612, "epoch": 923} {"train_loss": -20.970752716064453, "global_step": 76613, "epoch": 923} {"train_loss": -20.78728675842285, "global_step": 76614, "epoch": 923} {"train_loss": -20.73606300354004, "global_step": 76615, "epoch": 923} {"train_loss": -20.867530822753906, "global_step": 76616, "epoch": 923} {"train_loss": -20.955432891845703, "global_step": 76617, "epoch": 923} {"train_loss": -20.86500358581543, "global_step": 76618, "epoch": 923} {"train_loss": -20.966062545776367, "global_step": 76619, "epoch": 923} {"train_loss": -20.9660701751709, "global_step": 76620, "epoch": 923} {"train_loss": -21.004064559936523, "global_step": 76621, "epoch": 923} {"train_loss": -20.9536190032959, "global_step": 76622, "epoch": 923} {"train_loss": -20.945051193237305, "global_step": 76623, "epoch": 923} {"train_loss": -20.875497817993164, "global_step": 76624, "epoch": 923} {"train_loss": -21.18654441833496, "global_step": 76625, "epoch": 923} {"train_loss": -20.892793655395508, "global_step": 76626, "epoch": 923} {"train_loss": -21.279726028442383, "global_step": 76627, "epoch": 923} {"train_loss": -21.265432357788086, "global_step": 76628, "epoch": 923} {"train_loss": -21.254789352416992, "global_step": 76629, "epoch": 923} {"train_loss": -20.986068725585938, "global_step": 76630, "epoch": 923} {"train_loss": -21.220869064331055, "global_step": 76631, "epoch": 923} {"train_loss": -21.198986053466797, "global_step": 76632, "epoch": 923} {"train_loss": -20.405887603759766, "global_step": 76633, "epoch": 923} {"train_loss": -21.428497314453125, "global_step": 76634, "epoch": 923} {"train_loss": -20.963733673095703, "global_step": 76635, "epoch": 923} {"train_loss": -20.506107330322266, "global_step": 76636, "epoch": 923} {"train_loss": -21.192419052124023, "global_step": 76637, "epoch": 923} {"train_loss": -21.213151931762695, "global_step": 76638, "epoch": 923} {"train_loss": -20.96318244934082, "global_step": 76639, "epoch": 923} {"train_loss": -20.936100006103516, "global_step": 76640, "epoch": 923} {"train_loss": -21.036909103393555, "global_step": 76641, "epoch": 923} {"train_loss": -20.895944595336914, "global_step": 76642, "epoch": 923} {"train_loss": -20.690580368041992, "global_step": 76643, "epoch": 923} {"train_loss": -21.129358291625977, "global_step": 76644, "epoch": 923} {"train_loss": -21.111791610717773, "global_step": 76645, "epoch": 923} {"train_loss": -21.1580867767334, "global_step": 76646, "epoch": 923} {"train_loss": -21.261442184448242, "global_step": 76647, "epoch": 923} {"train_loss": -20.960168838500977, "global_step": 76648, "epoch": 923} {"train_loss": -20.92371940612793, "global_step": 76649, "epoch": 923} {"train_loss": -20.96717643737793, "global_step": 76650, "epoch": 923} {"train_loss": -21.167789459228516, "global_step": 76651, "epoch": 923} {"train_loss": -21.386655807495117, "global_step": 76652, "epoch": 923} {"train_loss": -20.97914695739746, "global_step": 76653, "epoch": 923} {"train_loss": -20.838733673095703, "global_step": 76654, "epoch": 923} {"train_loss": -20.782400131225586, "global_step": 76655, "epoch": 923} {"train_loss": -20.919498443603516, "global_step": 76656, "epoch": 923} {"train_loss": -21.07489585876465, "global_step": 76657, "epoch": 923} {"train_loss": -21.160715103149414, "global_step": 76658, "epoch": 923} {"train_loss": -21.031919479370117, "global_step": 76659, "epoch": 923} {"train_loss": -21.11054801940918, "global_step": 76660, "epoch": 923} {"train_loss": -21.058679580688477, "global_step": 76661, "epoch": 923} {"train_loss": -20.87616539001465, "global_step": 76662, "epoch": 923} {"train_loss": -21.057199478149414, "global_step": 76663, "epoch": 923} {"train_loss": -21.0593204498291, "global_step": 76664, "epoch": 923} {"train_loss": -21.081750869750977, "global_step": 76665, "epoch": 923} {"train_loss": -21.209716796875, "global_step": 76666, "epoch": 923} {"train_loss": -21.323740005493164, "global_step": 76667, "epoch": 923} {"train_loss": -21.0720272064209, "global_step": 76668, "epoch": 923} {"train_loss": -21.155521392822266, "global_step": 76669, "epoch": 923} {"train_loss": -20.984342575073242, "global_step": 76670, "epoch": 923} {"train_loss": -20.797346115112305, "global_step": 76671, "epoch": 923} {"train_loss": -20.882034301757812, "global_step": 76672, "epoch": 923} {"train_loss": -21.163497924804688, "global_step": 76673, "epoch": 923} {"train_loss": -20.918752670288086, "global_step": 76674, "epoch": 923} {"train_loss": -21.549758911132812, "global_step": 76675, "epoch": 923} {"train_loss": -20.853927612304688, "global_step": 76676, "epoch": 923} {"train_loss": -21.110746383666992, "global_step": 76677, "epoch": 923} {"train_loss": -20.935302734375, "global_step": 76678, "epoch": 923} {"train_loss": -20.97355079650879, "global_step": 76679, "epoch": 923} {"train_loss": -21.204469680786133, "global_step": 76680, "epoch": 923} {"train_loss": -21.170150756835938, "global_step": 76681, "epoch": 923} {"train_loss": -20.881671905517578, "global_step": 76682, "epoch": 923} {"train_loss": -21.175668716430664, "global_step": 76683, "epoch": 923} {"train_loss": -21.013113021850586, "global_step": 76684, "epoch": 923} {"train_loss": -20.80023765563965, "global_step": 76685, "epoch": 923} {"train_loss": -21.364776611328125, "global_step": 76686, "epoch": 923} {"train_loss": -21.166139602661133, "global_step": 76687, "epoch": 923} {"train_loss": -21.17267608642578, "global_step": 76688, "epoch": 923} {"train_loss": -21.142492294311523, "global_step": 76689, "epoch": 923} {"train_loss": -20.911691665649414, "global_step": 76690, "epoch": 923} {"train_loss": -21.029827117919922, "global_step": 76691, "epoch": 923, "val_loss": 6010286.0} {"train_loss": -20.422826766967773, "global_step": 76692, "epoch": 924} {"train_loss": -20.50847816467285, "global_step": 76693, "epoch": 924} {"train_loss": -19.603713989257812, "global_step": 76694, "epoch": 924} {"train_loss": -20.452146530151367, "global_step": 76695, "epoch": 924} {"train_loss": -20.090261459350586, "global_step": 76696, "epoch": 924} {"train_loss": -20.758970260620117, "global_step": 76697, "epoch": 924} {"train_loss": -19.89902687072754, "global_step": 76698, "epoch": 924} {"train_loss": -20.8665771484375, "global_step": 76699, "epoch": 924} {"train_loss": -20.766464233398438, "global_step": 76700, "epoch": 924} {"train_loss": -20.228330612182617, "global_step": 76701, "epoch": 924} {"train_loss": -20.531583786010742, "global_step": 76702, "epoch": 924} {"train_loss": -20.43610954284668, "global_step": 76703, "epoch": 924} {"train_loss": -20.83294105529785, "global_step": 76704, "epoch": 924} {"train_loss": -20.689437866210938, "global_step": 76705, "epoch": 924} {"train_loss": -20.78218650817871, "global_step": 76706, "epoch": 924} {"train_loss": -20.664331436157227, "global_step": 76707, "epoch": 924} {"train_loss": -20.643239974975586, "global_step": 76708, "epoch": 924} {"train_loss": -20.662403106689453, "global_step": 76709, "epoch": 924} {"train_loss": -20.83922004699707, "global_step": 76710, "epoch": 924} {"train_loss": -20.673696517944336, "global_step": 76711, "epoch": 924} {"train_loss": -20.968017578125, "global_step": 76712, "epoch": 924} {"train_loss": -20.992061614990234, "global_step": 76713, "epoch": 924} {"train_loss": -20.98292350769043, "global_step": 76714, "epoch": 924} {"train_loss": -20.946399688720703, "global_step": 76715, "epoch": 924} {"train_loss": -20.712038040161133, "global_step": 76716, "epoch": 924} {"train_loss": -20.868499755859375, "global_step": 76717, "epoch": 924} {"train_loss": -21.14145851135254, "global_step": 76718, "epoch": 924} {"train_loss": -20.911911010742188, "global_step": 76719, "epoch": 924} {"train_loss": -21.319766998291016, "global_step": 76720, "epoch": 924} {"train_loss": -21.362043380737305, "global_step": 76721, "epoch": 924} {"train_loss": -21.156843185424805, "global_step": 76722, "epoch": 924} {"train_loss": -21.207168579101562, "global_step": 76723, "epoch": 924} {"train_loss": -20.83225440979004, "global_step": 76724, "epoch": 924} {"train_loss": -20.969709396362305, "global_step": 76725, "epoch": 924} {"train_loss": -20.861927032470703, "global_step": 76726, "epoch": 924} {"train_loss": -21.16440773010254, "global_step": 76727, "epoch": 924} {"train_loss": -21.258087158203125, "global_step": 76728, "epoch": 924} {"train_loss": -21.120052337646484, "global_step": 76729, "epoch": 924} {"train_loss": -20.87568473815918, "global_step": 76730, "epoch": 924} {"train_loss": -20.825021743774414, "global_step": 76731, "epoch": 924} {"train_loss": -21.3261661529541, "global_step": 76732, "epoch": 924} {"train_loss": -21.089513778686523, "global_step": 76733, "epoch": 924} {"train_loss": -21.30317497253418, "global_step": 76734, "epoch": 924} {"train_loss": -21.025684356689453, "global_step": 76735, "epoch": 924} {"train_loss": -21.073596954345703, "global_step": 76736, "epoch": 924} {"train_loss": -20.8038272857666, "global_step": 76737, "epoch": 924} {"train_loss": -21.156606674194336, "global_step": 76738, "epoch": 924} {"train_loss": -20.94587516784668, "global_step": 76739, "epoch": 924} {"train_loss": -20.934263229370117, "global_step": 76740, "epoch": 924} {"train_loss": -21.09316062927246, "global_step": 76741, "epoch": 924} {"train_loss": -21.082355499267578, "global_step": 76742, "epoch": 924} {"train_loss": -21.30034828186035, "global_step": 76743, "epoch": 924} {"train_loss": -20.897342681884766, "global_step": 76744, "epoch": 924} {"train_loss": -21.203445434570312, "global_step": 76745, "epoch": 924} {"train_loss": -21.267324447631836, "global_step": 76746, "epoch": 924} {"train_loss": -20.881141662597656, "global_step": 76747, "epoch": 924} {"train_loss": -21.055932998657227, "global_step": 76748, "epoch": 924} {"train_loss": -21.26456642150879, "global_step": 76749, "epoch": 924} {"train_loss": -21.258386611938477, "global_step": 76750, "epoch": 924} {"train_loss": -21.241790771484375, "global_step": 76751, "epoch": 924} {"train_loss": -21.125654220581055, "global_step": 76752, "epoch": 924} {"train_loss": -21.01992416381836, "global_step": 76753, "epoch": 924} {"train_loss": -21.06130027770996, "global_step": 76754, "epoch": 924} {"train_loss": -21.305761337280273, "global_step": 76755, "epoch": 924} {"train_loss": -21.098764419555664, "global_step": 76756, "epoch": 924} {"train_loss": -20.99033546447754, "global_step": 76757, "epoch": 924} {"train_loss": -20.93024253845215, "global_step": 76758, "epoch": 924} {"train_loss": -21.054386138916016, "global_step": 76759, "epoch": 924} {"train_loss": -21.315744400024414, "global_step": 76760, "epoch": 924} {"train_loss": -20.875244140625, "global_step": 76761, "epoch": 924} {"train_loss": -21.153966903686523, "global_step": 76762, "epoch": 924} {"train_loss": -20.944578170776367, "global_step": 76763, "epoch": 924} {"train_loss": -21.093984603881836, "global_step": 76764, "epoch": 924} {"train_loss": -20.841266632080078, "global_step": 76765, "epoch": 924} {"train_loss": -21.071563720703125, "global_step": 76766, "epoch": 924} {"train_loss": -20.740957260131836, "global_step": 76767, "epoch": 924} {"train_loss": -21.389942169189453, "global_step": 76768, "epoch": 924} {"train_loss": -20.887237548828125, "global_step": 76769, "epoch": 924} {"train_loss": -21.2290096282959, "global_step": 76770, "epoch": 924} {"train_loss": -20.898502349853516, "global_step": 76771, "epoch": 924} {"train_loss": -21.0383358001709, "global_step": 76772, "epoch": 924} {"train_loss": -20.869417190551758, "global_step": 76773, "epoch": 924} {"train_loss": -20.92980773190418, "global_step": 76774, "epoch": 924, "val_loss": 5922339.5} {"train_loss": -20.242090225219727, "global_step": 76775, "epoch": 925} {"train_loss": -20.52060890197754, "global_step": 76776, "epoch": 925} {"train_loss": -20.976425170898438, "global_step": 76777, "epoch": 925} {"train_loss": -20.26313591003418, "global_step": 76778, "epoch": 925} {"train_loss": -20.664636611938477, "global_step": 76779, "epoch": 925} {"train_loss": -20.724853515625, "global_step": 76780, "epoch": 925} {"train_loss": -21.1417179107666, "global_step": 76781, "epoch": 925} {"train_loss": -20.666629791259766, "global_step": 76782, "epoch": 925} {"train_loss": -20.92870330810547, "global_step": 76783, "epoch": 925} {"train_loss": -20.97043228149414, "global_step": 76784, "epoch": 925} {"train_loss": -21.08853530883789, "global_step": 76785, "epoch": 925} {"train_loss": -20.682050704956055, "global_step": 76786, "epoch": 925} {"train_loss": -20.794940948486328, "global_step": 76787, "epoch": 925} {"train_loss": -20.54449462890625, "global_step": 76788, "epoch": 925} {"train_loss": -21.264007568359375, "global_step": 76789, "epoch": 925} {"train_loss": -21.184402465820312, "global_step": 76790, "epoch": 925} {"train_loss": -20.994029998779297, "global_step": 76791, "epoch": 925} {"train_loss": -20.882423400878906, "global_step": 76792, "epoch": 925} {"train_loss": -21.291521072387695, "global_step": 76793, "epoch": 925} {"train_loss": -21.111774444580078, "global_step": 76794, "epoch": 925} {"train_loss": -20.72178077697754, "global_step": 76795, "epoch": 925} {"train_loss": -20.98261833190918, "global_step": 76796, "epoch": 925} {"train_loss": -21.343976974487305, "global_step": 76797, "epoch": 925} {"train_loss": -21.167993545532227, "global_step": 76798, "epoch": 925} {"train_loss": -21.134756088256836, "global_step": 76799, "epoch": 925} {"train_loss": -21.00086784362793, "global_step": 76800, "epoch": 925} {"train_loss": -21.123449325561523, "global_step": 76801, "epoch": 925} {"train_loss": -21.189062118530273, "global_step": 76802, "epoch": 925} {"train_loss": -21.250669479370117, "global_step": 76803, "epoch": 925} {"train_loss": -20.822126388549805, "global_step": 76804, "epoch": 925} {"train_loss": -20.965164184570312, "global_step": 76805, "epoch": 925} {"train_loss": -21.104310989379883, "global_step": 76806, "epoch": 925} {"train_loss": -20.788219451904297, "global_step": 76807, "epoch": 925} {"train_loss": -21.21822166442871, "global_step": 76808, "epoch": 925} {"train_loss": -20.996755599975586, "global_step": 76809, "epoch": 925} {"train_loss": -21.26055335998535, "global_step": 76810, "epoch": 925} {"train_loss": -20.941869735717773, "global_step": 76811, "epoch": 925} {"train_loss": -20.94939613342285, "global_step": 76812, "epoch": 925} {"train_loss": -21.112031936645508, "global_step": 76813, "epoch": 925} {"train_loss": -21.30162239074707, "global_step": 76814, "epoch": 925} {"train_loss": -21.37860107421875, "global_step": 76815, "epoch": 925} {"train_loss": -21.1098690032959, "global_step": 76816, "epoch": 925} {"train_loss": -21.1143798828125, "global_step": 76817, "epoch": 925} {"train_loss": -20.976327896118164, "global_step": 76818, "epoch": 925} {"train_loss": -21.326208114624023, "global_step": 76819, "epoch": 925} {"train_loss": -21.048620223999023, "global_step": 76820, "epoch": 925} {"train_loss": -21.247678756713867, "global_step": 76821, "epoch": 925} {"train_loss": -21.05390167236328, "global_step": 76822, "epoch": 925} {"train_loss": -20.965167999267578, "global_step": 76823, "epoch": 925} {"train_loss": -21.141151428222656, "global_step": 76824, "epoch": 925} {"train_loss": -20.7153263092041, "global_step": 76825, "epoch": 925} {"train_loss": -21.02845573425293, "global_step": 76826, "epoch": 925} {"train_loss": -21.16043472290039, "global_step": 76827, "epoch": 925} {"train_loss": -20.947206497192383, "global_step": 76828, "epoch": 925} {"train_loss": -20.9548282623291, "global_step": 76829, "epoch": 925} {"train_loss": -21.175474166870117, "global_step": 76830, "epoch": 925} {"train_loss": -21.258712768554688, "global_step": 76831, "epoch": 925} {"train_loss": -20.411392211914062, "global_step": 76832, "epoch": 925} {"train_loss": -21.344161987304688, "global_step": 76833, "epoch": 925} {"train_loss": -21.107213973999023, "global_step": 76834, "epoch": 925} {"train_loss": -20.838932037353516, "global_step": 76835, "epoch": 925} {"train_loss": -21.15134048461914, "global_step": 76836, "epoch": 925} {"train_loss": -20.898529052734375, "global_step": 76837, "epoch": 925} {"train_loss": -20.868392944335938, "global_step": 76838, "epoch": 925} {"train_loss": -21.386816024780273, "global_step": 76839, "epoch": 925} {"train_loss": -21.31353759765625, "global_step": 76840, "epoch": 925} {"train_loss": -21.318681716918945, "global_step": 76841, "epoch": 925} {"train_loss": -21.054807662963867, "global_step": 76842, "epoch": 925} {"train_loss": -21.54286766052246, "global_step": 76843, "epoch": 925} {"train_loss": -21.083168029785156, "global_step": 76844, "epoch": 925} {"train_loss": -21.4338321685791, "global_step": 76845, "epoch": 925} {"train_loss": -21.330533981323242, "global_step": 76846, "epoch": 925} {"train_loss": -20.99031639099121, "global_step": 76847, "epoch": 925} {"train_loss": -21.303340911865234, "global_step": 76848, "epoch": 925} {"train_loss": -21.31428337097168, "global_step": 76849, "epoch": 925} {"train_loss": -21.437734603881836, "global_step": 76850, "epoch": 925} {"train_loss": -21.083738327026367, "global_step": 76851, "epoch": 925} {"train_loss": -21.01474380493164, "global_step": 76852, "epoch": 925} {"train_loss": -21.62613296508789, "global_step": 76853, "epoch": 925} {"train_loss": -20.939298629760742, "global_step": 76854, "epoch": 925} {"train_loss": -21.11090660095215, "global_step": 76855, "epoch": 925} {"train_loss": -21.283781051635742, "global_step": 76856, "epoch": 925} {"train_loss": -21.022197516567736, "global_step": 76857, "epoch": 925, "val_loss": 5943375.0} {"train_loss": -20.8145751953125, "global_step": 76858, "epoch": 926} {"train_loss": -21.29347801208496, "global_step": 76859, "epoch": 926} {"train_loss": -21.24738121032715, "global_step": 76860, "epoch": 926} {"train_loss": -21.049650192260742, "global_step": 76861, "epoch": 926} {"train_loss": -21.043994903564453, "global_step": 76862, "epoch": 926} {"train_loss": -21.1728572845459, "global_step": 76863, "epoch": 926} {"train_loss": -21.049272537231445, "global_step": 76864, "epoch": 926} {"train_loss": -21.323026657104492, "global_step": 76865, "epoch": 926} {"train_loss": -21.0266170501709, "global_step": 76866, "epoch": 926} {"train_loss": -21.072509765625, "global_step": 76867, "epoch": 926} {"train_loss": -21.026832580566406, "global_step": 76868, "epoch": 926} {"train_loss": -21.25006675720215, "global_step": 76869, "epoch": 926} {"train_loss": -21.145872116088867, "global_step": 76870, "epoch": 926} {"train_loss": -21.128326416015625, "global_step": 76871, "epoch": 926} {"train_loss": -21.16956901550293, "global_step": 76872, "epoch": 926} {"train_loss": -20.701866149902344, "global_step": 76873, "epoch": 926} {"train_loss": -21.068029403686523, "global_step": 76874, "epoch": 926} {"train_loss": -20.989667892456055, "global_step": 76875, "epoch": 926} {"train_loss": -20.850961685180664, "global_step": 76876, "epoch": 926} {"train_loss": -21.04608154296875, "global_step": 76877, "epoch": 926} {"train_loss": -21.097951889038086, "global_step": 76878, "epoch": 926} {"train_loss": -21.048114776611328, "global_step": 76879, "epoch": 926} {"train_loss": -21.312376022338867, "global_step": 76880, "epoch": 926} {"train_loss": -21.316770553588867, "global_step": 76881, "epoch": 926} {"train_loss": -20.71561622619629, "global_step": 76882, "epoch": 926} {"train_loss": -20.79029655456543, "global_step": 76883, "epoch": 926} {"train_loss": -20.872543334960938, "global_step": 76884, "epoch": 926} {"train_loss": -21.006366729736328, "global_step": 76885, "epoch": 926} {"train_loss": -21.14575958251953, "global_step": 76886, "epoch": 926} {"train_loss": -21.278583526611328, "global_step": 76887, "epoch": 926} {"train_loss": -20.90339469909668, "global_step": 76888, "epoch": 926} {"train_loss": -21.06307601928711, "global_step": 76889, "epoch": 926} {"train_loss": -21.264047622680664, "global_step": 76890, "epoch": 926} {"train_loss": -21.151575088500977, "global_step": 76891, "epoch": 926} {"train_loss": -21.028850555419922, "global_step": 76892, "epoch": 926} {"train_loss": -21.011953353881836, "global_step": 76893, "epoch": 926} {"train_loss": -21.046457290649414, "global_step": 76894, "epoch": 926} {"train_loss": -20.8065242767334, "global_step": 76895, "epoch": 926} {"train_loss": -20.751432418823242, "global_step": 76896, "epoch": 926} {"train_loss": -21.266027450561523, "global_step": 76897, "epoch": 926} {"train_loss": -21.1156005859375, "global_step": 76898, "epoch": 926} {"train_loss": -20.906116485595703, "global_step": 76899, "epoch": 926} {"train_loss": -21.02667808532715, "global_step": 76900, "epoch": 926} {"train_loss": -21.034177780151367, "global_step": 76901, "epoch": 926} {"train_loss": -21.056182861328125, "global_step": 76902, "epoch": 926} {"train_loss": -21.158926010131836, "global_step": 76903, "epoch": 926} {"train_loss": -20.788436889648438, "global_step": 76904, "epoch": 926} {"train_loss": -21.09629249572754, "global_step": 76905, "epoch": 926} {"train_loss": -20.88080406188965, "global_step": 76906, "epoch": 926} {"train_loss": -21.082054138183594, "global_step": 76907, "epoch": 926} {"train_loss": -21.016170501708984, "global_step": 76908, "epoch": 926} {"train_loss": -20.9692325592041, "global_step": 76909, "epoch": 926} {"train_loss": -21.223445892333984, "global_step": 76910, "epoch": 926} {"train_loss": -21.089618682861328, "global_step": 76911, "epoch": 926} {"train_loss": -21.200389862060547, "global_step": 76912, "epoch": 926} {"train_loss": -21.243335723876953, "global_step": 76913, "epoch": 926} {"train_loss": -21.12337303161621, "global_step": 76914, "epoch": 926} {"train_loss": -21.24211883544922, "global_step": 76915, "epoch": 926} {"train_loss": -20.92972755432129, "global_step": 76916, "epoch": 926} {"train_loss": -21.060565948486328, "global_step": 76917, "epoch": 926} {"train_loss": -21.382638931274414, "global_step": 76918, "epoch": 926} {"train_loss": -21.36557960510254, "global_step": 76919, "epoch": 926} {"train_loss": -21.101057052612305, "global_step": 76920, "epoch": 926} {"train_loss": -20.808856964111328, "global_step": 76921, "epoch": 926} {"train_loss": -21.187204360961914, "global_step": 76922, "epoch": 926} {"train_loss": -21.182737350463867, "global_step": 76923, "epoch": 926} {"train_loss": -21.0004940032959, "global_step": 76924, "epoch": 926} {"train_loss": -20.776409149169922, "global_step": 76925, "epoch": 926} {"train_loss": -21.735740661621094, "global_step": 76926, "epoch": 926} {"train_loss": -20.716032028198242, "global_step": 76927, "epoch": 926} {"train_loss": -21.224721908569336, "global_step": 76928, "epoch": 926} {"train_loss": -21.196378707885742, "global_step": 76929, "epoch": 926} {"train_loss": -21.33124351501465, "global_step": 76930, "epoch": 926} {"train_loss": -21.008941650390625, "global_step": 76931, "epoch": 926} {"train_loss": -20.780351638793945, "global_step": 76932, "epoch": 926} {"train_loss": -20.999027252197266, "global_step": 76933, "epoch": 926} {"train_loss": -20.838132858276367, "global_step": 76934, "epoch": 926} {"train_loss": -21.03607940673828, "global_step": 76935, "epoch": 926} {"train_loss": -20.91737937927246, "global_step": 76936, "epoch": 926} {"train_loss": -21.174482345581055, "global_step": 76937, "epoch": 926} {"train_loss": -21.264589309692383, "global_step": 76938, "epoch": 926} {"train_loss": -21.177047729492188, "global_step": 76939, "epoch": 926} {"train_loss": -21.073333556393543, "global_step": 76940, "epoch": 926, "val_loss": 6068422.0} {"train_loss": -20.467531204223633, "global_step": 76941, "epoch": 927} {"train_loss": -20.7252197265625, "global_step": 76942, "epoch": 927} {"train_loss": -20.730905532836914, "global_step": 76943, "epoch": 927} {"train_loss": -20.93489646911621, "global_step": 76944, "epoch": 927} {"train_loss": -21.230422973632812, "global_step": 76945, "epoch": 927} {"train_loss": -20.395498275756836, "global_step": 76946, "epoch": 927} {"train_loss": -21.054006576538086, "global_step": 76947, "epoch": 927} {"train_loss": -20.5570011138916, "global_step": 76948, "epoch": 927} {"train_loss": -21.155858993530273, "global_step": 76949, "epoch": 927} {"train_loss": -21.32637596130371, "global_step": 76950, "epoch": 927} {"train_loss": -20.415788650512695, "global_step": 76951, "epoch": 927} {"train_loss": -20.769742965698242, "global_step": 76952, "epoch": 927} {"train_loss": -21.225679397583008, "global_step": 76953, "epoch": 927} {"train_loss": -20.93482780456543, "global_step": 76954, "epoch": 927} {"train_loss": -21.16573143005371, "global_step": 76955, "epoch": 927} {"train_loss": -20.922685623168945, "global_step": 76956, "epoch": 927} {"train_loss": -20.97566795349121, "global_step": 76957, "epoch": 927} {"train_loss": -20.694225311279297, "global_step": 76958, "epoch": 927} {"train_loss": -21.037221908569336, "global_step": 76959, "epoch": 927} {"train_loss": -21.257518768310547, "global_step": 76960, "epoch": 927} {"train_loss": -21.024354934692383, "global_step": 76961, "epoch": 927} {"train_loss": -20.859554290771484, "global_step": 76962, "epoch": 927} {"train_loss": -21.100811004638672, "global_step": 76963, "epoch": 927} {"train_loss": -21.202621459960938, "global_step": 76964, "epoch": 927} {"train_loss": -20.846220016479492, "global_step": 76965, "epoch": 927} {"train_loss": -20.84528923034668, "global_step": 76966, "epoch": 927} {"train_loss": -21.16111183166504, "global_step": 76967, "epoch": 927} {"train_loss": -21.108306884765625, "global_step": 76968, "epoch": 927} {"train_loss": -21.411285400390625, "global_step": 76969, "epoch": 927} {"train_loss": -21.06700897216797, "global_step": 76970, "epoch": 927} {"train_loss": -21.206859588623047, "global_step": 76971, "epoch": 927} {"train_loss": -20.995119094848633, "global_step": 76972, "epoch": 927} {"train_loss": -21.23050880432129, "global_step": 76973, "epoch": 927} {"train_loss": -20.982894897460938, "global_step": 76974, "epoch": 927} {"train_loss": -21.267948150634766, "global_step": 76975, "epoch": 927} {"train_loss": -21.283790588378906, "global_step": 76976, "epoch": 927} {"train_loss": -21.154478073120117, "global_step": 76977, "epoch": 927} {"train_loss": -21.051692962646484, "global_step": 76978, "epoch": 927} {"train_loss": -21.19422149658203, "global_step": 76979, "epoch": 927} {"train_loss": -21.118947982788086, "global_step": 76980, "epoch": 927} {"train_loss": -20.76755142211914, "global_step": 76981, "epoch": 927} {"train_loss": -21.209518432617188, "global_step": 76982, "epoch": 927} {"train_loss": -20.481748580932617, "global_step": 76983, "epoch": 927} {"train_loss": -21.238996505737305, "global_step": 76984, "epoch": 927} {"train_loss": -20.840198516845703, "global_step": 76985, "epoch": 927} {"train_loss": -21.085834503173828, "global_step": 76986, "epoch": 927} {"train_loss": -21.05265235900879, "global_step": 76987, "epoch": 927} {"train_loss": -21.5039005279541, "global_step": 76988, "epoch": 927} {"train_loss": -21.048086166381836, "global_step": 76989, "epoch": 927} {"train_loss": -20.97882652282715, "global_step": 76990, "epoch": 927} {"train_loss": -21.12074851989746, "global_step": 76991, "epoch": 927} {"train_loss": -21.0059814453125, "global_step": 76992, "epoch": 927} {"train_loss": -20.9749813079834, "global_step": 76993, "epoch": 927} {"train_loss": -20.935932159423828, "global_step": 76994, "epoch": 927} {"train_loss": -21.595365524291992, "global_step": 76995, "epoch": 927} {"train_loss": -20.747848510742188, "global_step": 76996, "epoch": 927} {"train_loss": -21.18039894104004, "global_step": 76997, "epoch": 927} {"train_loss": -21.074609756469727, "global_step": 76998, "epoch": 927} {"train_loss": -21.244720458984375, "global_step": 76999, "epoch": 927} {"train_loss": -20.728925704956055, "global_step": 77000, "epoch": 927} {"train_loss": -21.15656852722168, "global_step": 77001, "epoch": 927} {"train_loss": -21.48061180114746, "global_step": 77002, "epoch": 927} {"train_loss": -21.334558486938477, "global_step": 77003, "epoch": 927} {"train_loss": -21.4781494140625, "global_step": 77004, "epoch": 927} {"train_loss": -21.03401756286621, "global_step": 77005, "epoch": 927} {"train_loss": -21.323057174682617, "global_step": 77006, "epoch": 927} {"train_loss": -21.286178588867188, "global_step": 77007, "epoch": 927} {"train_loss": -20.951017379760742, "global_step": 77008, "epoch": 927} {"train_loss": -20.942626953125, "global_step": 77009, "epoch": 927} {"train_loss": -21.456024169921875, "global_step": 77010, "epoch": 927} {"train_loss": -21.040847778320312, "global_step": 77011, "epoch": 927} {"train_loss": -21.375938415527344, "global_step": 77012, "epoch": 927} {"train_loss": -21.42024803161621, "global_step": 77013, "epoch": 927} {"train_loss": -21.094669342041016, "global_step": 77014, "epoch": 927} {"train_loss": -21.152341842651367, "global_step": 77015, "epoch": 927} {"train_loss": -21.243223190307617, "global_step": 77016, "epoch": 927} {"train_loss": -21.494779586791992, "global_step": 77017, "epoch": 927} {"train_loss": -21.019359588623047, "global_step": 77018, "epoch": 927} {"train_loss": -20.881977081298828, "global_step": 77019, "epoch": 927} {"train_loss": -21.089176177978516, "global_step": 77020, "epoch": 927} {"train_loss": -21.070980072021484, "global_step": 77021, "epoch": 927} {"train_loss": -21.086030960083008, "global_step": 77022, "epoch": 927} {"train_loss": -21.068578260490693, "global_step": 77023, "epoch": 927, "val_loss": 6100441.0} {"train_loss": -20.881879806518555, "global_step": 77024, "epoch": 928} {"train_loss": -20.77859878540039, "global_step": 77025, "epoch": 928} {"train_loss": -21.13330841064453, "global_step": 77026, "epoch": 928} {"train_loss": -21.11610984802246, "global_step": 77027, "epoch": 928} {"train_loss": -20.844589233398438, "global_step": 77028, "epoch": 928} {"train_loss": -20.89768409729004, "global_step": 77029, "epoch": 928} {"train_loss": -21.53456687927246, "global_step": 77030, "epoch": 928} {"train_loss": -21.001663208007812, "global_step": 77031, "epoch": 928} {"train_loss": -20.82135009765625, "global_step": 77032, "epoch": 928} {"train_loss": -20.586151123046875, "global_step": 77033, "epoch": 928} {"train_loss": -20.935529708862305, "global_step": 77034, "epoch": 928} {"train_loss": -21.270627975463867, "global_step": 77035, "epoch": 928} {"train_loss": -20.991943359375, "global_step": 77036, "epoch": 928} {"train_loss": -20.610361099243164, "global_step": 77037, "epoch": 928} {"train_loss": -21.081642150878906, "global_step": 77038, "epoch": 928} {"train_loss": -21.240636825561523, "global_step": 77039, "epoch": 928} {"train_loss": -20.878597259521484, "global_step": 77040, "epoch": 928} {"train_loss": -20.979639053344727, "global_step": 77041, "epoch": 928} {"train_loss": -21.030805587768555, "global_step": 77042, "epoch": 928} {"train_loss": -21.61418914794922, "global_step": 77043, "epoch": 928} {"train_loss": -20.89735984802246, "global_step": 77044, "epoch": 928} {"train_loss": -20.786855697631836, "global_step": 77045, "epoch": 928} {"train_loss": -21.1921443939209, "global_step": 77046, "epoch": 928} {"train_loss": -21.342395782470703, "global_step": 77047, "epoch": 928} {"train_loss": -21.281299591064453, "global_step": 77048, "epoch": 928} {"train_loss": -21.159244537353516, "global_step": 77049, "epoch": 928} {"train_loss": -21.095373153686523, "global_step": 77050, "epoch": 928} {"train_loss": -20.93459129333496, "global_step": 77051, "epoch": 928} {"train_loss": -21.040685653686523, "global_step": 77052, "epoch": 928} {"train_loss": -20.747711181640625, "global_step": 77053, "epoch": 928} {"train_loss": -20.6179141998291, "global_step": 77054, "epoch": 928} {"train_loss": -21.049280166625977, "global_step": 77055, "epoch": 928} {"train_loss": -21.161436080932617, "global_step": 77056, "epoch": 928} {"train_loss": -20.839340209960938, "global_step": 77057, "epoch": 928} {"train_loss": -21.511859893798828, "global_step": 77058, "epoch": 928} {"train_loss": -21.03254508972168, "global_step": 77059, "epoch": 928} {"train_loss": -20.93610191345215, "global_step": 77060, "epoch": 928} {"train_loss": -21.27174949645996, "global_step": 77061, "epoch": 928} {"train_loss": -21.339866638183594, "global_step": 77062, "epoch": 928} {"train_loss": -20.929670333862305, "global_step": 77063, "epoch": 928} {"train_loss": -21.243759155273438, "global_step": 77064, "epoch": 928} {"train_loss": -20.914709091186523, "global_step": 77065, "epoch": 928} {"train_loss": -21.242345809936523, "global_step": 77066, "epoch": 928} {"train_loss": -20.8105525970459, "global_step": 77067, "epoch": 928} {"train_loss": -21.142562866210938, "global_step": 77068, "epoch": 928} {"train_loss": -21.04440689086914, "global_step": 77069, "epoch": 928} {"train_loss": -21.105178833007812, "global_step": 77070, "epoch": 928} {"train_loss": -21.46223258972168, "global_step": 77071, "epoch": 928} {"train_loss": -21.225662231445312, "global_step": 77072, "epoch": 928} {"train_loss": -21.307790756225586, "global_step": 77073, "epoch": 928} {"train_loss": -21.166446685791016, "global_step": 77074, "epoch": 928} {"train_loss": -20.836889266967773, "global_step": 77075, "epoch": 928} {"train_loss": -21.283061981201172, "global_step": 77076, "epoch": 928} {"train_loss": -21.068674087524414, "global_step": 77077, "epoch": 928} {"train_loss": -21.444290161132812, "global_step": 77078, "epoch": 928} {"train_loss": -20.82904052734375, "global_step": 77079, "epoch": 928} {"train_loss": -21.011133193969727, "global_step": 77080, "epoch": 928} {"train_loss": -21.033828735351562, "global_step": 77081, "epoch": 928} {"train_loss": -21.032079696655273, "global_step": 77082, "epoch": 928} {"train_loss": -20.6638126373291, "global_step": 77083, "epoch": 928} {"train_loss": -21.21534538269043, "global_step": 77084, "epoch": 928} {"train_loss": -21.296741485595703, "global_step": 77085, "epoch": 928} {"train_loss": -20.751075744628906, "global_step": 77086, "epoch": 928} {"train_loss": -21.444543838500977, "global_step": 77087, "epoch": 928} {"train_loss": -20.758502960205078, "global_step": 77088, "epoch": 928} {"train_loss": -21.247350692749023, "global_step": 77089, "epoch": 928} {"train_loss": -21.36753273010254, "global_step": 77090, "epoch": 928} {"train_loss": -21.08933448791504, "global_step": 77091, "epoch": 928} {"train_loss": -21.049436569213867, "global_step": 77092, "epoch": 928} {"train_loss": -21.06778907775879, "global_step": 77093, "epoch": 928} {"train_loss": -21.291406631469727, "global_step": 77094, "epoch": 928} {"train_loss": -20.68023109436035, "global_step": 77095, "epoch": 928} {"train_loss": -21.5743408203125, "global_step": 77096, "epoch": 928} {"train_loss": -21.35054588317871, "global_step": 77097, "epoch": 928} {"train_loss": -21.130294799804688, "global_step": 77098, "epoch": 928} {"train_loss": -21.17396354675293, "global_step": 77099, "epoch": 928} {"train_loss": -20.760297775268555, "global_step": 77100, "epoch": 928} {"train_loss": -21.094093322753906, "global_step": 77101, "epoch": 928} {"train_loss": -21.255126953125, "global_step": 77102, "epoch": 928} {"train_loss": -21.464101791381836, "global_step": 77103, "epoch": 928} {"train_loss": -21.10992431640625, "global_step": 77104, "epoch": 928} {"train_loss": -21.11818504333496, "global_step": 77105, "epoch": 928} {"train_loss": -21.07088449776891, "global_step": 77106, "epoch": 928, "val_loss": 6015820.5} {"train_loss": -20.690977096557617, "global_step": 77107, "epoch": 929} {"train_loss": -21.045312881469727, "global_step": 77108, "epoch": 929} {"train_loss": -20.83856964111328, "global_step": 77109, "epoch": 929} {"train_loss": -21.032550811767578, "global_step": 77110, "epoch": 929} {"train_loss": -21.215435028076172, "global_step": 77111, "epoch": 929} {"train_loss": -20.89227867126465, "global_step": 77112, "epoch": 929} {"train_loss": -20.872236251831055, "global_step": 77113, "epoch": 929} {"train_loss": -20.94708824157715, "global_step": 77114, "epoch": 929} {"train_loss": -21.005277633666992, "global_step": 77115, "epoch": 929} {"train_loss": -20.98509979248047, "global_step": 77116, "epoch": 929} {"train_loss": -21.428693771362305, "global_step": 77117, "epoch": 929} {"train_loss": -21.381114959716797, "global_step": 77118, "epoch": 929} {"train_loss": -20.852205276489258, "global_step": 77119, "epoch": 929} {"train_loss": -20.965917587280273, "global_step": 77120, "epoch": 929} {"train_loss": -21.166587829589844, "global_step": 77121, "epoch": 929} {"train_loss": -21.35513687133789, "global_step": 77122, "epoch": 929} {"train_loss": -20.916141510009766, "global_step": 77123, "epoch": 929} {"train_loss": -21.140111923217773, "global_step": 77124, "epoch": 929} {"train_loss": -21.28675651550293, "global_step": 77125, "epoch": 929} {"train_loss": -21.027286529541016, "global_step": 77126, "epoch": 929} {"train_loss": -21.089948654174805, "global_step": 77127, "epoch": 929} {"train_loss": -21.099796295166016, "global_step": 77128, "epoch": 929} {"train_loss": -20.80455780029297, "global_step": 77129, "epoch": 929} {"train_loss": -20.58198356628418, "global_step": 77130, "epoch": 929} {"train_loss": -21.106882095336914, "global_step": 77131, "epoch": 929} {"train_loss": -21.08064079284668, "global_step": 77132, "epoch": 929} {"train_loss": -21.253652572631836, "global_step": 77133, "epoch": 929} {"train_loss": -21.26299285888672, "global_step": 77134, "epoch": 929} {"train_loss": -21.26749610900879, "global_step": 77135, "epoch": 929} {"train_loss": -20.841644287109375, "global_step": 77136, "epoch": 929} {"train_loss": -21.147268295288086, "global_step": 77137, "epoch": 929} {"train_loss": -21.0982723236084, "global_step": 77138, "epoch": 929} {"train_loss": -21.31777000427246, "global_step": 77139, "epoch": 929} {"train_loss": -21.03846549987793, "global_step": 77140, "epoch": 929} {"train_loss": -21.047256469726562, "global_step": 77141, "epoch": 929} {"train_loss": -21.07598304748535, "global_step": 77142, "epoch": 929} {"train_loss": -21.217395782470703, "global_step": 77143, "epoch": 929} {"train_loss": -21.400686264038086, "global_step": 77144, "epoch": 929} {"train_loss": -21.047422409057617, "global_step": 77145, "epoch": 929} {"train_loss": -21.160924911499023, "global_step": 77146, "epoch": 929} {"train_loss": -21.222524642944336, "global_step": 77147, "epoch": 929} {"train_loss": -20.902441024780273, "global_step": 77148, "epoch": 929} {"train_loss": -21.190465927124023, "global_step": 77149, "epoch": 929} {"train_loss": -21.42362403869629, "global_step": 77150, "epoch": 929} {"train_loss": -20.80142593383789, "global_step": 77151, "epoch": 929} {"train_loss": -21.56760025024414, "global_step": 77152, "epoch": 929} {"train_loss": -20.97578239440918, "global_step": 77153, "epoch": 929} {"train_loss": -20.722023010253906, "global_step": 77154, "epoch": 929} {"train_loss": -21.408151626586914, "global_step": 77155, "epoch": 929} {"train_loss": -20.930143356323242, "global_step": 77156, "epoch": 929} {"train_loss": -21.196819305419922, "global_step": 77157, "epoch": 929} {"train_loss": -21.122608184814453, "global_step": 77158, "epoch": 929} {"train_loss": -21.100744247436523, "global_step": 77159, "epoch": 929} {"train_loss": -21.23105239868164, "global_step": 77160, "epoch": 929} {"train_loss": -20.79880142211914, "global_step": 77161, "epoch": 929} {"train_loss": -21.126571655273438, "global_step": 77162, "epoch": 929} {"train_loss": -20.88968276977539, "global_step": 77163, "epoch": 929} {"train_loss": -21.028717041015625, "global_step": 77164, "epoch": 929} {"train_loss": -21.374622344970703, "global_step": 77165, "epoch": 929} {"train_loss": -21.360336303710938, "global_step": 77166, "epoch": 929} {"train_loss": -20.745317459106445, "global_step": 77167, "epoch": 929} {"train_loss": -21.308557510375977, "global_step": 77168, "epoch": 929} {"train_loss": -21.10065269470215, "global_step": 77169, "epoch": 929} {"train_loss": -21.251556396484375, "global_step": 77170, "epoch": 929} {"train_loss": -21.05537986755371, "global_step": 77171, "epoch": 929} {"train_loss": -20.908201217651367, "global_step": 77172, "epoch": 929} {"train_loss": -21.384733200073242, "global_step": 77173, "epoch": 929} {"train_loss": -21.28783416748047, "global_step": 77174, "epoch": 929} {"train_loss": -21.255735397338867, "global_step": 77175, "epoch": 929} {"train_loss": -20.916433334350586, "global_step": 77176, "epoch": 929} {"train_loss": -21.181135177612305, "global_step": 77177, "epoch": 929} {"train_loss": -20.7542724609375, "global_step": 77178, "epoch": 929} {"train_loss": -20.66008758544922, "global_step": 77179, "epoch": 929} {"train_loss": -21.337736129760742, "global_step": 77180, "epoch": 929} {"train_loss": -21.176767349243164, "global_step": 77181, "epoch": 929} {"train_loss": -20.96624755859375, "global_step": 77182, "epoch": 929} {"train_loss": -21.088546752929688, "global_step": 77183, "epoch": 929} {"train_loss": -20.708707809448242, "global_step": 77184, "epoch": 929} {"train_loss": -21.46681022644043, "global_step": 77185, "epoch": 929} {"train_loss": -21.059904098510742, "global_step": 77186, "epoch": 929} {"train_loss": -21.142438888549805, "global_step": 77187, "epoch": 929} {"train_loss": -20.923128128051758, "global_step": 77188, "epoch": 929} {"train_loss": -21.08356806743576, "global_step": 77189, "epoch": 929, "val_loss": 5995666.0} {"train_loss": -20.866180419921875, "global_step": 77190, "epoch": 930} {"train_loss": -21.085559844970703, "global_step": 77191, "epoch": 930} {"train_loss": -21.340389251708984, "global_step": 77192, "epoch": 930} {"train_loss": -20.848379135131836, "global_step": 77193, "epoch": 930} {"train_loss": -20.88188934326172, "global_step": 77194, "epoch": 930} {"train_loss": -20.629497528076172, "global_step": 77195, "epoch": 930} {"train_loss": -21.123336791992188, "global_step": 77196, "epoch": 930} {"train_loss": -21.136035919189453, "global_step": 77197, "epoch": 930} {"train_loss": -20.809850692749023, "global_step": 77198, "epoch": 930} {"train_loss": -21.25360107421875, "global_step": 77199, "epoch": 930} {"train_loss": -20.971433639526367, "global_step": 77200, "epoch": 930} {"train_loss": -21.051618576049805, "global_step": 77201, "epoch": 930} {"train_loss": -21.54450035095215, "global_step": 77202, "epoch": 930} {"train_loss": -21.4481143951416, "global_step": 77203, "epoch": 930} {"train_loss": -21.165149688720703, "global_step": 77204, "epoch": 930} {"train_loss": -21.21026611328125, "global_step": 77205, "epoch": 930} {"train_loss": -21.228540420532227, "global_step": 77206, "epoch": 930} {"train_loss": -21.041654586791992, "global_step": 77207, "epoch": 930} {"train_loss": -21.51116371154785, "global_step": 77208, "epoch": 930} {"train_loss": -20.980016708374023, "global_step": 77209, "epoch": 930} {"train_loss": -21.34412384033203, "global_step": 77210, "epoch": 930} {"train_loss": -20.9046688079834, "global_step": 77211, "epoch": 930} {"train_loss": -21.4027042388916, "global_step": 77212, "epoch": 930} {"train_loss": -21.2222843170166, "global_step": 77213, "epoch": 930} {"train_loss": -20.85105323791504, "global_step": 77214, "epoch": 930} {"train_loss": -20.691959381103516, "global_step": 77215, "epoch": 930} {"train_loss": -21.21913719177246, "global_step": 77216, "epoch": 930} {"train_loss": -21.192102432250977, "global_step": 77217, "epoch": 930} {"train_loss": -21.07303237915039, "global_step": 77218, "epoch": 930} {"train_loss": -21.12923240661621, "global_step": 77219, "epoch": 930} {"train_loss": -21.52606964111328, "global_step": 77220, "epoch": 930} {"train_loss": -21.144283294677734, "global_step": 77221, "epoch": 930} {"train_loss": -21.214645385742188, "global_step": 77222, "epoch": 930} {"train_loss": -21.308061599731445, "global_step": 77223, "epoch": 930} {"train_loss": -21.224319458007812, "global_step": 77224, "epoch": 930} {"train_loss": -21.08348846435547, "global_step": 77225, "epoch": 930} {"train_loss": -20.76138687133789, "global_step": 77226, "epoch": 930} {"train_loss": -20.83023452758789, "global_step": 77227, "epoch": 930} {"train_loss": -21.286142349243164, "global_step": 77228, "epoch": 930} {"train_loss": -21.22218894958496, "global_step": 77229, "epoch": 930} {"train_loss": -21.149038314819336, "global_step": 77230, "epoch": 930} {"train_loss": -21.41147232055664, "global_step": 77231, "epoch": 930} {"train_loss": -21.01338768005371, "global_step": 77232, "epoch": 930} {"train_loss": -21.181884765625, "global_step": 77233, "epoch": 930} {"train_loss": -21.326496124267578, "global_step": 77234, "epoch": 930} {"train_loss": -21.1043758392334, "global_step": 77235, "epoch": 930} {"train_loss": -20.61077308654785, "global_step": 77236, "epoch": 930} {"train_loss": -21.09853172302246, "global_step": 77237, "epoch": 930} {"train_loss": -21.103134155273438, "global_step": 77238, "epoch": 930} {"train_loss": -20.968181610107422, "global_step": 77239, "epoch": 930} {"train_loss": -21.31923484802246, "global_step": 77240, "epoch": 930} {"train_loss": -20.502857208251953, "global_step": 77241, "epoch": 930} {"train_loss": -21.13542366027832, "global_step": 77242, "epoch": 930} {"train_loss": -20.855621337890625, "global_step": 77243, "epoch": 930} {"train_loss": -21.193130493164062, "global_step": 77244, "epoch": 930} {"train_loss": -20.64023780822754, "global_step": 77245, "epoch": 930} {"train_loss": -21.023481369018555, "global_step": 77246, "epoch": 930} {"train_loss": -21.25948143005371, "global_step": 77247, "epoch": 930} {"train_loss": -20.794326782226562, "global_step": 77248, "epoch": 930} {"train_loss": -21.01789665222168, "global_step": 77249, "epoch": 930} {"train_loss": -21.08828353881836, "global_step": 77250, "epoch": 930} {"train_loss": -21.091510772705078, "global_step": 77251, "epoch": 930} {"train_loss": -21.323049545288086, "global_step": 77252, "epoch": 930} {"train_loss": -21.272422790527344, "global_step": 77253, "epoch": 930} {"train_loss": -20.654592514038086, "global_step": 77254, "epoch": 930} {"train_loss": -20.981382369995117, "global_step": 77255, "epoch": 930} {"train_loss": -21.104999542236328, "global_step": 77256, "epoch": 930} {"train_loss": -21.2515811920166, "global_step": 77257, "epoch": 930} {"train_loss": -20.852916717529297, "global_step": 77258, "epoch": 930} {"train_loss": -21.440189361572266, "global_step": 77259, "epoch": 930} {"train_loss": -21.052444458007812, "global_step": 77260, "epoch": 930} {"train_loss": -21.20098304748535, "global_step": 77261, "epoch": 930} {"train_loss": -21.2060604095459, "global_step": 77262, "epoch": 930} {"train_loss": -21.01163673400879, "global_step": 77263, "epoch": 930} {"train_loss": -21.25216293334961, "global_step": 77264, "epoch": 930} {"train_loss": -21.035757064819336, "global_step": 77265, "epoch": 930} {"train_loss": -21.12713623046875, "global_step": 77266, "epoch": 930} {"train_loss": -21.620447158813477, "global_step": 77267, "epoch": 930} {"train_loss": -21.204206466674805, "global_step": 77268, "epoch": 930} {"train_loss": -21.10486602783203, "global_step": 77269, "epoch": 930} {"train_loss": -21.164958953857422, "global_step": 77270, "epoch": 930} {"train_loss": -21.03866958618164, "global_step": 77271, "epoch": 930} {"train_loss": -21.105555775653887, "global_step": 77272, "epoch": 930, "val_loss": 6144520.5} {"train_loss": -20.98409080505371, "global_step": 77273, "epoch": 931} {"train_loss": -20.961597442626953, "global_step": 77274, "epoch": 931} {"train_loss": -20.427457809448242, "global_step": 77275, "epoch": 931} {"train_loss": -20.939725875854492, "global_step": 77276, "epoch": 931} {"train_loss": -21.071386337280273, "global_step": 77277, "epoch": 931} {"train_loss": -21.092069625854492, "global_step": 77278, "epoch": 931} {"train_loss": -20.741209030151367, "global_step": 77279, "epoch": 931} {"train_loss": -20.97043800354004, "global_step": 77280, "epoch": 931} {"train_loss": -21.07703399658203, "global_step": 77281, "epoch": 931} {"train_loss": -21.185972213745117, "global_step": 77282, "epoch": 931} {"train_loss": -21.010025024414062, "global_step": 77283, "epoch": 931} {"train_loss": -21.0413761138916, "global_step": 77284, "epoch": 931} {"train_loss": -21.093990325927734, "global_step": 77285, "epoch": 931} {"train_loss": -20.7413330078125, "global_step": 77286, "epoch": 931} {"train_loss": -20.936019897460938, "global_step": 77287, "epoch": 931} {"train_loss": -21.045026779174805, "global_step": 77288, "epoch": 931} {"train_loss": -21.00564193725586, "global_step": 77289, "epoch": 931} {"train_loss": -21.071304321289062, "global_step": 77290, "epoch": 931} {"train_loss": -21.432064056396484, "global_step": 77291, "epoch": 931} {"train_loss": -21.197866439819336, "global_step": 77292, "epoch": 931} {"train_loss": -21.097782135009766, "global_step": 77293, "epoch": 931} {"train_loss": -20.975257873535156, "global_step": 77294, "epoch": 931} {"train_loss": -21.293771743774414, "global_step": 77295, "epoch": 931} {"train_loss": -21.023162841796875, "global_step": 77296, "epoch": 931} {"train_loss": -21.135204315185547, "global_step": 77297, "epoch": 931} {"train_loss": -21.080289840698242, "global_step": 77298, "epoch": 931} {"train_loss": -21.20284080505371, "global_step": 77299, "epoch": 931} {"train_loss": -21.227190017700195, "global_step": 77300, "epoch": 931} {"train_loss": -21.0293025970459, "global_step": 77301, "epoch": 931} {"train_loss": -21.46798324584961, "global_step": 77302, "epoch": 931} {"train_loss": -21.31388282775879, "global_step": 77303, "epoch": 931} {"train_loss": -21.206937789916992, "global_step": 77304, "epoch": 931} {"train_loss": -21.124204635620117, "global_step": 77305, "epoch": 931} {"train_loss": -21.279804229736328, "global_step": 77306, "epoch": 931} {"train_loss": -21.01730728149414, "global_step": 77307, "epoch": 931} {"train_loss": -21.42294692993164, "global_step": 77308, "epoch": 931} {"train_loss": -21.333751678466797, "global_step": 77309, "epoch": 931} {"train_loss": -20.96877098083496, "global_step": 77310, "epoch": 931} {"train_loss": -20.755163192749023, "global_step": 77311, "epoch": 931} {"train_loss": -20.8197078704834, "global_step": 77312, "epoch": 931} {"train_loss": -21.02902603149414, "global_step": 77313, "epoch": 931} {"train_loss": -20.901403427124023, "global_step": 77314, "epoch": 931} {"train_loss": -21.330177307128906, "global_step": 77315, "epoch": 931} {"train_loss": -21.086515426635742, "global_step": 77316, "epoch": 931} {"train_loss": -21.237913131713867, "global_step": 77317, "epoch": 931} {"train_loss": -21.133766174316406, "global_step": 77318, "epoch": 931} {"train_loss": -21.412315368652344, "global_step": 77319, "epoch": 931} {"train_loss": -20.92559051513672, "global_step": 77320, "epoch": 931} {"train_loss": -21.1163387298584, "global_step": 77321, "epoch": 931} {"train_loss": -20.94855308532715, "global_step": 77322, "epoch": 931} {"train_loss": -21.31051254272461, "global_step": 77323, "epoch": 931} {"train_loss": -20.856159210205078, "global_step": 77324, "epoch": 931} {"train_loss": -20.953550338745117, "global_step": 77325, "epoch": 931} {"train_loss": -21.297025680541992, "global_step": 77326, "epoch": 931} {"train_loss": -21.408967971801758, "global_step": 77327, "epoch": 931} {"train_loss": -20.75682258605957, "global_step": 77328, "epoch": 931} {"train_loss": -21.268808364868164, "global_step": 77329, "epoch": 931} {"train_loss": -20.64754295349121, "global_step": 77330, "epoch": 931} {"train_loss": -20.962289810180664, "global_step": 77331, "epoch": 931} {"train_loss": -20.975873947143555, "global_step": 77332, "epoch": 931} {"train_loss": -20.950952529907227, "global_step": 77333, "epoch": 931} {"train_loss": -21.277124404907227, "global_step": 77334, "epoch": 931} {"train_loss": -20.905324935913086, "global_step": 77335, "epoch": 931} {"train_loss": -21.496139526367188, "global_step": 77336, "epoch": 931} {"train_loss": -20.986391067504883, "global_step": 77337, "epoch": 931} {"train_loss": -21.032800674438477, "global_step": 77338, "epoch": 931} {"train_loss": -21.244287490844727, "global_step": 77339, "epoch": 931} {"train_loss": -21.15983009338379, "global_step": 77340, "epoch": 931} {"train_loss": -21.145336151123047, "global_step": 77341, "epoch": 931} {"train_loss": -21.055063247680664, "global_step": 77342, "epoch": 931} {"train_loss": -21.097333908081055, "global_step": 77343, "epoch": 931} {"train_loss": -20.955795288085938, "global_step": 77344, "epoch": 931} {"train_loss": -21.31611442565918, "global_step": 77345, "epoch": 931} {"train_loss": -21.071735382080078, "global_step": 77346, "epoch": 931} {"train_loss": -21.002342224121094, "global_step": 77347, "epoch": 931} {"train_loss": -21.2926025390625, "global_step": 77348, "epoch": 931} {"train_loss": -21.396846771240234, "global_step": 77349, "epoch": 931} {"train_loss": -20.981225967407227, "global_step": 77350, "epoch": 931} {"train_loss": -20.78167152404785, "global_step": 77351, "epoch": 931} {"train_loss": -21.059484481811523, "global_step": 77352, "epoch": 931} {"train_loss": -21.25746726989746, "global_step": 77353, "epoch": 931} {"train_loss": -21.355104446411133, "global_step": 77354, "epoch": 931} {"train_loss": -21.103351179375707, "global_step": 77355, "epoch": 931, "val_loss": 6121582.5} {"train_loss": -20.618772506713867, "global_step": 77356, "epoch": 932} {"train_loss": -21.060558319091797, "global_step": 77357, "epoch": 932} {"train_loss": -20.743467330932617, "global_step": 77358, "epoch": 932} {"train_loss": -20.984468460083008, "global_step": 77359, "epoch": 932} {"train_loss": -21.0050106048584, "global_step": 77360, "epoch": 932} {"train_loss": -21.149202346801758, "global_step": 77361, "epoch": 932} {"train_loss": -21.18840789794922, "global_step": 77362, "epoch": 932} {"train_loss": -20.943511962890625, "global_step": 77363, "epoch": 932} {"train_loss": -21.1616153717041, "global_step": 77364, "epoch": 932} {"train_loss": -21.096843719482422, "global_step": 77365, "epoch": 932} {"train_loss": -21.191755294799805, "global_step": 77366, "epoch": 932} {"train_loss": -20.958282470703125, "global_step": 77367, "epoch": 932} {"train_loss": -21.13775062561035, "global_step": 77368, "epoch": 932} {"train_loss": -20.917861938476562, "global_step": 77369, "epoch": 932} {"train_loss": -20.828689575195312, "global_step": 77370, "epoch": 932} {"train_loss": -21.151897430419922, "global_step": 77371, "epoch": 932} {"train_loss": -21.10544776916504, "global_step": 77372, "epoch": 932} {"train_loss": -20.922183990478516, "global_step": 77373, "epoch": 932} {"train_loss": -21.326725006103516, "global_step": 77374, "epoch": 932} {"train_loss": -21.015384674072266, "global_step": 77375, "epoch": 932} {"train_loss": -20.79898452758789, "global_step": 77376, "epoch": 932} {"train_loss": -21.082199096679688, "global_step": 77377, "epoch": 932} {"train_loss": -20.765647888183594, "global_step": 77378, "epoch": 932} {"train_loss": -21.108182907104492, "global_step": 77379, "epoch": 932} {"train_loss": -20.967037200927734, "global_step": 77380, "epoch": 932} {"train_loss": -21.198373794555664, "global_step": 77381, "epoch": 932} {"train_loss": -21.355527877807617, "global_step": 77382, "epoch": 932} {"train_loss": -21.286895751953125, "global_step": 77383, "epoch": 932} {"train_loss": -21.146541595458984, "global_step": 77384, "epoch": 932} {"train_loss": -21.047937393188477, "global_step": 77385, "epoch": 932} {"train_loss": -20.99343490600586, "global_step": 77386, "epoch": 932} {"train_loss": -21.1181697845459, "global_step": 77387, "epoch": 932} {"train_loss": -21.129240036010742, "global_step": 77388, "epoch": 932} {"train_loss": -21.08600425720215, "global_step": 77389, "epoch": 932} {"train_loss": -20.955045700073242, "global_step": 77390, "epoch": 932} {"train_loss": -20.933059692382812, "global_step": 77391, "epoch": 932} {"train_loss": -21.322324752807617, "global_step": 77392, "epoch": 932} {"train_loss": -21.11981201171875, "global_step": 77393, "epoch": 932} {"train_loss": -21.20424461364746, "global_step": 77394, "epoch": 932} {"train_loss": -21.13254165649414, "global_step": 77395, "epoch": 932} {"train_loss": -20.943490982055664, "global_step": 77396, "epoch": 932} {"train_loss": -20.995710372924805, "global_step": 77397, "epoch": 932} {"train_loss": -21.100933074951172, "global_step": 77398, "epoch": 932} {"train_loss": -21.328834533691406, "global_step": 77399, "epoch": 932} {"train_loss": -21.06292152404785, "global_step": 77400, "epoch": 932} {"train_loss": -21.169221878051758, "global_step": 77401, "epoch": 932} {"train_loss": -21.05299186706543, "global_step": 77402, "epoch": 932} {"train_loss": -21.38693618774414, "global_step": 77403, "epoch": 932} {"train_loss": -21.1841983795166, "global_step": 77404, "epoch": 932} {"train_loss": -21.175521850585938, "global_step": 77405, "epoch": 932} {"train_loss": -21.08318328857422, "global_step": 77406, "epoch": 932} {"train_loss": -21.324682235717773, "global_step": 77407, "epoch": 932} {"train_loss": -21.102691650390625, "global_step": 77408, "epoch": 932} {"train_loss": -21.226484298706055, "global_step": 77409, "epoch": 932} {"train_loss": -21.398832321166992, "global_step": 77410, "epoch": 932} {"train_loss": -21.133764266967773, "global_step": 77411, "epoch": 932} {"train_loss": -20.92595100402832, "global_step": 77412, "epoch": 932} {"train_loss": -21.012714385986328, "global_step": 77413, "epoch": 932} {"train_loss": -21.437286376953125, "global_step": 77414, "epoch": 932} {"train_loss": -21.426149368286133, "global_step": 77415, "epoch": 932} {"train_loss": -21.135089874267578, "global_step": 77416, "epoch": 932} {"train_loss": -21.136611938476562, "global_step": 77417, "epoch": 932} {"train_loss": -21.191787719726562, "global_step": 77418, "epoch": 932} {"train_loss": -21.010251998901367, "global_step": 77419, "epoch": 932} {"train_loss": -21.283430099487305, "global_step": 77420, "epoch": 932} {"train_loss": -21.124176025390625, "global_step": 77421, "epoch": 932} {"train_loss": -21.44553565979004, "global_step": 77422, "epoch": 932} {"train_loss": -21.164396286010742, "global_step": 77423, "epoch": 932} {"train_loss": -21.395429611206055, "global_step": 77424, "epoch": 932} {"train_loss": -21.059661865234375, "global_step": 77425, "epoch": 932} {"train_loss": -21.01313591003418, "global_step": 77426, "epoch": 932} {"train_loss": -20.869985580444336, "global_step": 77427, "epoch": 932} {"train_loss": -21.352527618408203, "global_step": 77428, "epoch": 932} {"train_loss": -20.941261291503906, "global_step": 77429, "epoch": 932} {"train_loss": -20.655765533447266, "global_step": 77430, "epoch": 932} {"train_loss": -21.369937896728516, "global_step": 77431, "epoch": 932} {"train_loss": -20.98950958251953, "global_step": 77432, "epoch": 932} {"train_loss": -21.008024215698242, "global_step": 77433, "epoch": 932} {"train_loss": -20.908798217773438, "global_step": 77434, "epoch": 932} {"train_loss": -20.9597225189209, "global_step": 77435, "epoch": 932} {"train_loss": -21.212509155273438, "global_step": 77436, "epoch": 932} {"train_loss": -20.993507385253906, "global_step": 77437, "epoch": 932} {"train_loss": -21.094123679471302, "global_step": 77438, "epoch": 932, "val_loss": 6006499.5} {"train_loss": -20.90989112854004, "global_step": 77439, "epoch": 933} {"train_loss": -20.906845092773438, "global_step": 77440, "epoch": 933} {"train_loss": -20.81984519958496, "global_step": 77441, "epoch": 933} {"train_loss": -20.531232833862305, "global_step": 77442, "epoch": 933} {"train_loss": -20.749042510986328, "global_step": 77443, "epoch": 933} {"train_loss": -20.7785587310791, "global_step": 77444, "epoch": 933} {"train_loss": -21.444665908813477, "global_step": 77445, "epoch": 933} {"train_loss": -20.716163635253906, "global_step": 77446, "epoch": 933} {"train_loss": -21.033475875854492, "global_step": 77447, "epoch": 933} {"train_loss": -20.717655181884766, "global_step": 77448, "epoch": 933} {"train_loss": -20.998855590820312, "global_step": 77449, "epoch": 933} {"train_loss": -20.3696231842041, "global_step": 77450, "epoch": 933} {"train_loss": -21.315933227539062, "global_step": 77451, "epoch": 933} {"train_loss": -20.96269989013672, "global_step": 77452, "epoch": 933} {"train_loss": -20.864944458007812, "global_step": 77453, "epoch": 933} {"train_loss": -20.945743560791016, "global_step": 77454, "epoch": 933} {"train_loss": -20.813535690307617, "global_step": 77455, "epoch": 933} {"train_loss": -20.764806747436523, "global_step": 77456, "epoch": 933} {"train_loss": -20.777372360229492, "global_step": 77457, "epoch": 933} {"train_loss": -21.17203712463379, "global_step": 77458, "epoch": 933} {"train_loss": -21.38057518005371, "global_step": 77459, "epoch": 933} {"train_loss": -21.527555465698242, "global_step": 77460, "epoch": 933} {"train_loss": -21.040861129760742, "global_step": 77461, "epoch": 933} {"train_loss": -21.113107681274414, "global_step": 77462, "epoch": 933} {"train_loss": -21.2490177154541, "global_step": 77463, "epoch": 933} {"train_loss": -21.443241119384766, "global_step": 77464, "epoch": 933} {"train_loss": -21.21107292175293, "global_step": 77465, "epoch": 933} {"train_loss": -20.989736557006836, "global_step": 77466, "epoch": 933} {"train_loss": -21.27777099609375, "global_step": 77467, "epoch": 933} {"train_loss": -21.073598861694336, "global_step": 77468, "epoch": 933} {"train_loss": -21.249237060546875, "global_step": 77469, "epoch": 933} {"train_loss": -21.407506942749023, "global_step": 77470, "epoch": 933} {"train_loss": -21.34711265563965, "global_step": 77471, "epoch": 933} {"train_loss": -21.439205169677734, "global_step": 77472, "epoch": 933} {"train_loss": -21.235355377197266, "global_step": 77473, "epoch": 933} {"train_loss": -21.006752014160156, "global_step": 77474, "epoch": 933} {"train_loss": -21.095714569091797, "global_step": 77475, "epoch": 933} {"train_loss": -21.274015426635742, "global_step": 77476, "epoch": 933} {"train_loss": -21.230371475219727, "global_step": 77477, "epoch": 933} {"train_loss": -20.836450576782227, "global_step": 77478, "epoch": 933} {"train_loss": -21.014158248901367, "global_step": 77479, "epoch": 933} {"train_loss": -21.14446258544922, "global_step": 77480, "epoch": 933} {"train_loss": -20.919078826904297, "global_step": 77481, "epoch": 933} {"train_loss": -20.969274520874023, "global_step": 77482, "epoch": 933} {"train_loss": -20.8692626953125, "global_step": 77483, "epoch": 933} {"train_loss": -21.340978622436523, "global_step": 77484, "epoch": 933} {"train_loss": -21.35088539123535, "global_step": 77485, "epoch": 933} {"train_loss": -21.038349151611328, "global_step": 77486, "epoch": 933} {"train_loss": -21.349882125854492, "global_step": 77487, "epoch": 933} {"train_loss": -21.087751388549805, "global_step": 77488, "epoch": 933} {"train_loss": -21.232017517089844, "global_step": 77489, "epoch": 933} {"train_loss": -21.162626266479492, "global_step": 77490, "epoch": 933} {"train_loss": -21.200448989868164, "global_step": 77491, "epoch": 933} {"train_loss": -21.189470291137695, "global_step": 77492, "epoch": 933} {"train_loss": -21.145673751831055, "global_step": 77493, "epoch": 933} {"train_loss": -21.08857536315918, "global_step": 77494, "epoch": 933} {"train_loss": -21.303403854370117, "global_step": 77495, "epoch": 933} {"train_loss": -21.454334259033203, "global_step": 77496, "epoch": 933} {"train_loss": -21.10175895690918, "global_step": 77497, "epoch": 933} {"train_loss": -20.68401527404785, "global_step": 77498, "epoch": 933} {"train_loss": -21.551111221313477, "global_step": 77499, "epoch": 933} {"train_loss": -21.29569435119629, "global_step": 77500, "epoch": 933} {"train_loss": -21.069517135620117, "global_step": 77501, "epoch": 933} {"train_loss": -20.797849655151367, "global_step": 77502, "epoch": 933} {"train_loss": -21.09589958190918, "global_step": 77503, "epoch": 933} {"train_loss": -21.045408248901367, "global_step": 77504, "epoch": 933} {"train_loss": -21.2481746673584, "global_step": 77505, "epoch": 933} {"train_loss": -21.115324020385742, "global_step": 77506, "epoch": 933} {"train_loss": -20.799896240234375, "global_step": 77507, "epoch": 933} {"train_loss": -21.11170768737793, "global_step": 77508, "epoch": 933} {"train_loss": -21.079492568969727, "global_step": 77509, "epoch": 933} {"train_loss": -20.61994171142578, "global_step": 77510, "epoch": 933} {"train_loss": -20.990726470947266, "global_step": 77511, "epoch": 933} {"train_loss": -20.889747619628906, "global_step": 77512, "epoch": 933} {"train_loss": -21.440988540649414, "global_step": 77513, "epoch": 933} {"train_loss": -21.274633407592773, "global_step": 77514, "epoch": 933} {"train_loss": -21.201335906982422, "global_step": 77515, "epoch": 933} {"train_loss": -21.017637252807617, "global_step": 77516, "epoch": 933} {"train_loss": -21.034109115600586, "global_step": 77517, "epoch": 933} {"train_loss": -21.143199920654297, "global_step": 77518, "epoch": 933} {"train_loss": -21.35505485534668, "global_step": 77519, "epoch": 933} {"train_loss": -21.213117599487305, "global_step": 77520, "epoch": 933} {"train_loss": -21.06758460079331, "global_step": 77521, "epoch": 933, "val_loss": 5809130.0} {"train_loss": -20.772035598754883, "global_step": 77522, "epoch": 934} {"train_loss": -20.837854385375977, "global_step": 77523, "epoch": 934} {"train_loss": -21.231060028076172, "global_step": 77524, "epoch": 934} {"train_loss": -20.72066307067871, "global_step": 77525, "epoch": 934} {"train_loss": -20.641481399536133, "global_step": 77526, "epoch": 934} {"train_loss": -20.942602157592773, "global_step": 77527, "epoch": 934} {"train_loss": -20.73595428466797, "global_step": 77528, "epoch": 934} {"train_loss": -20.70263671875, "global_step": 77529, "epoch": 934} {"train_loss": -21.156686782836914, "global_step": 77530, "epoch": 934} {"train_loss": -21.152170181274414, "global_step": 77531, "epoch": 934} {"train_loss": -20.91153907775879, "global_step": 77532, "epoch": 934} {"train_loss": -20.93653106689453, "global_step": 77533, "epoch": 934} {"train_loss": -20.810134887695312, "global_step": 77534, "epoch": 934} {"train_loss": -20.925317764282227, "global_step": 77535, "epoch": 934} {"train_loss": -20.7951602935791, "global_step": 77536, "epoch": 934} {"train_loss": -21.29924964904785, "global_step": 77537, "epoch": 934} {"train_loss": -21.115116119384766, "global_step": 77538, "epoch": 934} {"train_loss": -20.889074325561523, "global_step": 77539, "epoch": 934} {"train_loss": -20.9764404296875, "global_step": 77540, "epoch": 934} {"train_loss": -20.907499313354492, "global_step": 77541, "epoch": 934} {"train_loss": -20.92171287536621, "global_step": 77542, "epoch": 934} {"train_loss": -20.97620964050293, "global_step": 77543, "epoch": 934} {"train_loss": -21.29555320739746, "global_step": 77544, "epoch": 934} {"train_loss": -21.39986228942871, "global_step": 77545, "epoch": 934} {"train_loss": -21.430063247680664, "global_step": 77546, "epoch": 934} {"train_loss": -21.59793472290039, "global_step": 77547, "epoch": 934} {"train_loss": -21.219711303710938, "global_step": 77548, "epoch": 934} {"train_loss": -20.942655563354492, "global_step": 77549, "epoch": 934} {"train_loss": -20.841552734375, "global_step": 77550, "epoch": 934} {"train_loss": -21.270355224609375, "global_step": 77551, "epoch": 934} {"train_loss": -21.171234130859375, "global_step": 77552, "epoch": 934} {"train_loss": -21.07243537902832, "global_step": 77553, "epoch": 934} {"train_loss": -21.240156173706055, "global_step": 77554, "epoch": 934} {"train_loss": -21.028226852416992, "global_step": 77555, "epoch": 934} {"train_loss": -21.250764846801758, "global_step": 77556, "epoch": 934} {"train_loss": -21.19423484802246, "global_step": 77557, "epoch": 934} {"train_loss": -20.664886474609375, "global_step": 77558, "epoch": 934} {"train_loss": -21.642017364501953, "global_step": 77559, "epoch": 934} {"train_loss": -21.090078353881836, "global_step": 77560, "epoch": 934} {"train_loss": -21.198530197143555, "global_step": 77561, "epoch": 934} {"train_loss": -21.152099609375, "global_step": 77562, "epoch": 934} {"train_loss": -21.17057228088379, "global_step": 77563, "epoch": 934} {"train_loss": -21.125192642211914, "global_step": 77564, "epoch": 934} {"train_loss": -21.00589942932129, "global_step": 77565, "epoch": 934} {"train_loss": -21.112403869628906, "global_step": 77566, "epoch": 934} {"train_loss": -21.0620174407959, "global_step": 77567, "epoch": 934} {"train_loss": -21.166624069213867, "global_step": 77568, "epoch": 934} {"train_loss": -21.15749168395996, "global_step": 77569, "epoch": 934} {"train_loss": -20.603864669799805, "global_step": 77570, "epoch": 934} {"train_loss": -21.233861923217773, "global_step": 77571, "epoch": 934} {"train_loss": -20.715269088745117, "global_step": 77572, "epoch": 934} {"train_loss": -21.027637481689453, "global_step": 77573, "epoch": 934} {"train_loss": -21.314218521118164, "global_step": 77574, "epoch": 934} {"train_loss": -20.968856811523438, "global_step": 77575, "epoch": 934} {"train_loss": -21.12288475036621, "global_step": 77576, "epoch": 934} {"train_loss": -21.306949615478516, "global_step": 77577, "epoch": 934} {"train_loss": -21.359601974487305, "global_step": 77578, "epoch": 934} {"train_loss": -21.156307220458984, "global_step": 77579, "epoch": 934} {"train_loss": -21.12215805053711, "global_step": 77580, "epoch": 934} {"train_loss": -21.312511444091797, "global_step": 77581, "epoch": 934} {"train_loss": -21.69233512878418, "global_step": 77582, "epoch": 934} {"train_loss": -21.457517623901367, "global_step": 77583, "epoch": 934} {"train_loss": -20.954147338867188, "global_step": 77584, "epoch": 934} {"train_loss": -21.24469566345215, "global_step": 77585, "epoch": 934} {"train_loss": -21.166107177734375, "global_step": 77586, "epoch": 934} {"train_loss": -21.262475967407227, "global_step": 77587, "epoch": 934} {"train_loss": -21.39829444885254, "global_step": 77588, "epoch": 934} {"train_loss": -21.19252586364746, "global_step": 77589, "epoch": 934} {"train_loss": -21.09819984436035, "global_step": 77590, "epoch": 934} {"train_loss": -21.365955352783203, "global_step": 77591, "epoch": 934} {"train_loss": -21.04913330078125, "global_step": 77592, "epoch": 934} {"train_loss": -21.387109756469727, "global_step": 77593, "epoch": 934} {"train_loss": -21.057268142700195, "global_step": 77594, "epoch": 934} {"train_loss": -21.15726661682129, "global_step": 77595, "epoch": 934} {"train_loss": -21.152292251586914, "global_step": 77596, "epoch": 934} {"train_loss": -21.124900817871094, "global_step": 77597, "epoch": 934} {"train_loss": -20.63817596435547, "global_step": 77598, "epoch": 934} {"train_loss": -21.260122299194336, "global_step": 77599, "epoch": 934} {"train_loss": -21.105783462524414, "global_step": 77600, "epoch": 934} {"train_loss": -20.953067779541016, "global_step": 77601, "epoch": 934} {"train_loss": -21.140134811401367, "global_step": 77602, "epoch": 934} {"train_loss": -20.816709518432617, "global_step": 77603, "epoch": 934} {"train_loss": -21.08550161338714, "global_step": 77604, "epoch": 934, "val_loss": 5972898.0} {"train_loss": -20.310592651367188, "global_step": 77605, "epoch": 935} {"train_loss": -20.543785095214844, "global_step": 77606, "epoch": 935} {"train_loss": -21.110111236572266, "global_step": 77607, "epoch": 935} {"train_loss": -20.599822998046875, "global_step": 77608, "epoch": 935} {"train_loss": -20.956151962280273, "global_step": 77609, "epoch": 935} {"train_loss": -20.416040420532227, "global_step": 77610, "epoch": 935} {"train_loss": -20.79713249206543, "global_step": 77611, "epoch": 935} {"train_loss": -20.52118492126465, "global_step": 77612, "epoch": 935} {"train_loss": -20.724088668823242, "global_step": 77613, "epoch": 935} {"train_loss": -20.67084312438965, "global_step": 77614, "epoch": 935} {"train_loss": -21.069082260131836, "global_step": 77615, "epoch": 935} {"train_loss": -20.870874404907227, "global_step": 77616, "epoch": 935} {"train_loss": -21.21792221069336, "global_step": 77617, "epoch": 935} {"train_loss": -21.04527473449707, "global_step": 77618, "epoch": 935} {"train_loss": -21.1505069732666, "global_step": 77619, "epoch": 935} {"train_loss": -20.86630630493164, "global_step": 77620, "epoch": 935} {"train_loss": -21.057392120361328, "global_step": 77621, "epoch": 935} {"train_loss": -21.34524154663086, "global_step": 77622, "epoch": 935} {"train_loss": -21.13800621032715, "global_step": 77623, "epoch": 935} {"train_loss": -21.204792022705078, "global_step": 77624, "epoch": 935} {"train_loss": -21.27924919128418, "global_step": 77625, "epoch": 935} {"train_loss": -20.817123413085938, "global_step": 77626, "epoch": 935} {"train_loss": -21.281583786010742, "global_step": 77627, "epoch": 935} {"train_loss": -21.081178665161133, "global_step": 77628, "epoch": 935} {"train_loss": -21.02425193786621, "global_step": 77629, "epoch": 935} {"train_loss": -21.282928466796875, "global_step": 77630, "epoch": 935} {"train_loss": -21.466527938842773, "global_step": 77631, "epoch": 935} {"train_loss": -21.193620681762695, "global_step": 77632, "epoch": 935} {"train_loss": -21.273300170898438, "global_step": 77633, "epoch": 935} {"train_loss": -21.26664161682129, "global_step": 77634, "epoch": 935} {"train_loss": -21.14784049987793, "global_step": 77635, "epoch": 935} {"train_loss": -21.215686798095703, "global_step": 77636, "epoch": 935} {"train_loss": -21.233856201171875, "global_step": 77637, "epoch": 935} {"train_loss": -20.663450241088867, "global_step": 77638, "epoch": 935} {"train_loss": -21.18613052368164, "global_step": 77639, "epoch": 935} {"train_loss": -21.393789291381836, "global_step": 77640, "epoch": 935} {"train_loss": -21.02895164489746, "global_step": 77641, "epoch": 935} {"train_loss": -20.979055404663086, "global_step": 77642, "epoch": 935} {"train_loss": -21.29645347595215, "global_step": 77643, "epoch": 935} {"train_loss": -21.046253204345703, "global_step": 77644, "epoch": 935} {"train_loss": -21.01967430114746, "global_step": 77645, "epoch": 935} {"train_loss": -21.074209213256836, "global_step": 77646, "epoch": 935} {"train_loss": -21.1115779876709, "global_step": 77647, "epoch": 935} {"train_loss": -21.671987533569336, "global_step": 77648, "epoch": 935} {"train_loss": -21.134057998657227, "global_step": 77649, "epoch": 935} {"train_loss": -21.133228302001953, "global_step": 77650, "epoch": 935} {"train_loss": -21.440410614013672, "global_step": 77651, "epoch": 935} {"train_loss": -21.42024803161621, "global_step": 77652, "epoch": 935} {"train_loss": -21.009830474853516, "global_step": 77653, "epoch": 935} {"train_loss": -20.95413589477539, "global_step": 77654, "epoch": 935} {"train_loss": -20.912004470825195, "global_step": 77655, "epoch": 935} {"train_loss": -21.286191940307617, "global_step": 77656, "epoch": 935} {"train_loss": -21.064178466796875, "global_step": 77657, "epoch": 935} {"train_loss": -20.802431106567383, "global_step": 77658, "epoch": 935} {"train_loss": -21.443965911865234, "global_step": 77659, "epoch": 935} {"train_loss": -20.971349716186523, "global_step": 77660, "epoch": 935} {"train_loss": -21.392770767211914, "global_step": 77661, "epoch": 935} {"train_loss": -21.105356216430664, "global_step": 77662, "epoch": 935} {"train_loss": -21.222328186035156, "global_step": 77663, "epoch": 935} {"train_loss": -21.368005752563477, "global_step": 77664, "epoch": 935} {"train_loss": -21.117536544799805, "global_step": 77665, "epoch": 935} {"train_loss": -21.417112350463867, "global_step": 77666, "epoch": 935} {"train_loss": -21.554031372070312, "global_step": 77667, "epoch": 935} {"train_loss": -21.104806900024414, "global_step": 77668, "epoch": 935} {"train_loss": -21.144285202026367, "global_step": 77669, "epoch": 935} {"train_loss": -21.36834716796875, "global_step": 77670, "epoch": 935} {"train_loss": -21.116683959960938, "global_step": 77671, "epoch": 935} {"train_loss": -20.853666305541992, "global_step": 77672, "epoch": 935} {"train_loss": -21.338804244995117, "global_step": 77673, "epoch": 935} {"train_loss": -20.9935359954834, "global_step": 77674, "epoch": 935} {"train_loss": -21.05447769165039, "global_step": 77675, "epoch": 935} {"train_loss": -21.37872886657715, "global_step": 77676, "epoch": 935} {"train_loss": -21.018049240112305, "global_step": 77677, "epoch": 935} {"train_loss": -21.2304630279541, "global_step": 77678, "epoch": 935} {"train_loss": -21.287200927734375, "global_step": 77679, "epoch": 935} {"train_loss": -21.179723739624023, "global_step": 77680, "epoch": 935} {"train_loss": -21.24751853942871, "global_step": 77681, "epoch": 935} {"train_loss": -21.020601272583008, "global_step": 77682, "epoch": 935} {"train_loss": -21.059446334838867, "global_step": 77683, "epoch": 935} {"train_loss": -21.1376953125, "global_step": 77684, "epoch": 935} {"train_loss": -20.96600914001465, "global_step": 77685, "epoch": 935} {"train_loss": -20.917593002319336, "global_step": 77686, "epoch": 935} {"train_loss": -21.09669372834355, "global_step": 77687, "epoch": 935, "val_loss": 5986278.0} {"train_loss": -21.09363555908203, "global_step": 77688, "epoch": 936} {"train_loss": -20.99098014831543, "global_step": 77689, "epoch": 936} {"train_loss": -21.137319564819336, "global_step": 77690, "epoch": 936} {"train_loss": -20.61909294128418, "global_step": 77691, "epoch": 936} {"train_loss": -20.974321365356445, "global_step": 77692, "epoch": 936} {"train_loss": -21.262039184570312, "global_step": 77693, "epoch": 936} {"train_loss": -20.98637580871582, "global_step": 77694, "epoch": 936} {"train_loss": -20.6594295501709, "global_step": 77695, "epoch": 936} {"train_loss": -20.978389739990234, "global_step": 77696, "epoch": 936} {"train_loss": -20.795133590698242, "global_step": 77697, "epoch": 936} {"train_loss": -21.146886825561523, "global_step": 77698, "epoch": 936} {"train_loss": -20.781261444091797, "global_step": 77699, "epoch": 936} {"train_loss": -20.809600830078125, "global_step": 77700, "epoch": 936} {"train_loss": -21.271133422851562, "global_step": 77701, "epoch": 936} {"train_loss": -21.10271453857422, "global_step": 77702, "epoch": 936} {"train_loss": -21.240938186645508, "global_step": 77703, "epoch": 936} {"train_loss": -21.166336059570312, "global_step": 77704, "epoch": 936} {"train_loss": -21.543180465698242, "global_step": 77705, "epoch": 936} {"train_loss": -21.4450740814209, "global_step": 77706, "epoch": 936} {"train_loss": -20.714685440063477, "global_step": 77707, "epoch": 936} {"train_loss": -21.181894302368164, "global_step": 77708, "epoch": 936} {"train_loss": -21.61220359802246, "global_step": 77709, "epoch": 936} {"train_loss": -21.279647827148438, "global_step": 77710, "epoch": 936} {"train_loss": -21.273778915405273, "global_step": 77711, "epoch": 936} {"train_loss": -21.325658798217773, "global_step": 77712, "epoch": 936} {"train_loss": -20.952411651611328, "global_step": 77713, "epoch": 936} {"train_loss": -21.156421661376953, "global_step": 77714, "epoch": 936} {"train_loss": -21.313682556152344, "global_step": 77715, "epoch": 936} {"train_loss": -21.05426597595215, "global_step": 77716, "epoch": 936} {"train_loss": -21.221708297729492, "global_step": 77717, "epoch": 936} {"train_loss": -21.06471061706543, "global_step": 77718, "epoch": 936} {"train_loss": -21.1250057220459, "global_step": 77719, "epoch": 936} {"train_loss": -20.97441291809082, "global_step": 77720, "epoch": 936} {"train_loss": -21.05807876586914, "global_step": 77721, "epoch": 936} {"train_loss": -21.286216735839844, "global_step": 77722, "epoch": 936} {"train_loss": -21.284992218017578, "global_step": 77723, "epoch": 936} {"train_loss": -21.362276077270508, "global_step": 77724, "epoch": 936} {"train_loss": -21.2138671875, "global_step": 77725, "epoch": 936} {"train_loss": -21.379871368408203, "global_step": 77726, "epoch": 936} {"train_loss": -20.82575035095215, "global_step": 77727, "epoch": 936} {"train_loss": -21.27532196044922, "global_step": 77728, "epoch": 936} {"train_loss": -21.49482536315918, "global_step": 77729, "epoch": 936} {"train_loss": -21.30604362487793, "global_step": 77730, "epoch": 936} {"train_loss": -21.11627197265625, "global_step": 77731, "epoch": 936} {"train_loss": -21.431365966796875, "global_step": 77732, "epoch": 936} {"train_loss": -20.955781936645508, "global_step": 77733, "epoch": 936} {"train_loss": -20.698545455932617, "global_step": 77734, "epoch": 936} {"train_loss": -21.264007568359375, "global_step": 77735, "epoch": 936} {"train_loss": -21.488767623901367, "global_step": 77736, "epoch": 936} {"train_loss": -21.220050811767578, "global_step": 77737, "epoch": 936} {"train_loss": -20.993337631225586, "global_step": 77738, "epoch": 936} {"train_loss": -21.216676712036133, "global_step": 77739, "epoch": 936} {"train_loss": -21.1874942779541, "global_step": 77740, "epoch": 936} {"train_loss": -21.322479248046875, "global_step": 77741, "epoch": 936} {"train_loss": -21.074010848999023, "global_step": 77742, "epoch": 936} {"train_loss": -20.93244743347168, "global_step": 77743, "epoch": 936} {"train_loss": -21.031131744384766, "global_step": 77744, "epoch": 936} {"train_loss": -21.493436813354492, "global_step": 77745, "epoch": 936} {"train_loss": -21.240079879760742, "global_step": 77746, "epoch": 936} {"train_loss": -21.094812393188477, "global_step": 77747, "epoch": 936} {"train_loss": -21.397676467895508, "global_step": 77748, "epoch": 936} {"train_loss": -20.864110946655273, "global_step": 77749, "epoch": 936} {"train_loss": -20.796138763427734, "global_step": 77750, "epoch": 936} {"train_loss": -21.473384857177734, "global_step": 77751, "epoch": 936} {"train_loss": -21.092578887939453, "global_step": 77752, "epoch": 936} {"train_loss": -21.133520126342773, "global_step": 77753, "epoch": 936} {"train_loss": -21.063833236694336, "global_step": 77754, "epoch": 936} {"train_loss": -21.321531295776367, "global_step": 77755, "epoch": 936} {"train_loss": -20.888147354125977, "global_step": 77756, "epoch": 936} {"train_loss": -20.83625602722168, "global_step": 77757, "epoch": 936} {"train_loss": -21.220861434936523, "global_step": 77758, "epoch": 936} {"train_loss": -21.269662857055664, "global_step": 77759, "epoch": 936} {"train_loss": -20.979450225830078, "global_step": 77760, "epoch": 936} {"train_loss": -20.946168899536133, "global_step": 77761, "epoch": 936} {"train_loss": -21.105836868286133, "global_step": 77762, "epoch": 936} {"train_loss": -21.343595504760742, "global_step": 77763, "epoch": 936} {"train_loss": -20.9520206451416, "global_step": 77764, "epoch": 936} {"train_loss": -21.3441162109375, "global_step": 77765, "epoch": 936} {"train_loss": -21.220903396606445, "global_step": 77766, "epoch": 936} {"train_loss": -20.9438533782959, "global_step": 77767, "epoch": 936} {"train_loss": -20.987558364868164, "global_step": 77768, "epoch": 936} {"train_loss": -20.920612335205078, "global_step": 77769, "epoch": 936} {"train_loss": -21.124906562897095, "global_step": 77770, "epoch": 936, "val_loss": 5914169.0} {"train_loss": -20.494609832763672, "global_step": 77771, "epoch": 937} {"train_loss": -21.053220748901367, "global_step": 77772, "epoch": 937} {"train_loss": -21.06621551513672, "global_step": 77773, "epoch": 937} {"train_loss": -20.898151397705078, "global_step": 77774, "epoch": 937} {"train_loss": -20.638113021850586, "global_step": 77775, "epoch": 937} {"train_loss": -20.905933380126953, "global_step": 77776, "epoch": 937} {"train_loss": -21.135560989379883, "global_step": 77777, "epoch": 937} {"train_loss": -21.058076858520508, "global_step": 77778, "epoch": 937} {"train_loss": -20.817468643188477, "global_step": 77779, "epoch": 937} {"train_loss": -21.158796310424805, "global_step": 77780, "epoch": 937} {"train_loss": -20.78151512145996, "global_step": 77781, "epoch": 937} {"train_loss": -21.281675338745117, "global_step": 77782, "epoch": 937} {"train_loss": -20.896324157714844, "global_step": 77783, "epoch": 937} {"train_loss": -21.13278579711914, "global_step": 77784, "epoch": 937} {"train_loss": -20.850284576416016, "global_step": 77785, "epoch": 937} {"train_loss": -20.99460220336914, "global_step": 77786, "epoch": 937} {"train_loss": -20.967641830444336, "global_step": 77787, "epoch": 937} {"train_loss": -21.137577056884766, "global_step": 77788, "epoch": 937} {"train_loss": -20.879240036010742, "global_step": 77789, "epoch": 937} {"train_loss": -20.937732696533203, "global_step": 77790, "epoch": 937} {"train_loss": -20.889602661132812, "global_step": 77791, "epoch": 937} {"train_loss": -21.050094604492188, "global_step": 77792, "epoch": 937} {"train_loss": -21.352338790893555, "global_step": 77793, "epoch": 937} {"train_loss": -21.17529296875, "global_step": 77794, "epoch": 937} {"train_loss": -21.175878524780273, "global_step": 77795, "epoch": 937} {"train_loss": -21.1278018951416, "global_step": 77796, "epoch": 937} {"train_loss": -21.111879348754883, "global_step": 77797, "epoch": 937} {"train_loss": -21.072080612182617, "global_step": 77798, "epoch": 937} {"train_loss": -20.820608139038086, "global_step": 77799, "epoch": 937} {"train_loss": -21.376129150390625, "global_step": 77800, "epoch": 937} {"train_loss": -21.489118576049805, "global_step": 77801, "epoch": 937} {"train_loss": -20.90352439880371, "global_step": 77802, "epoch": 937} {"train_loss": -21.062849044799805, "global_step": 77803, "epoch": 937} {"train_loss": -21.258955001831055, "global_step": 77804, "epoch": 937} {"train_loss": -21.114572525024414, "global_step": 77805, "epoch": 937} {"train_loss": -21.078109741210938, "global_step": 77806, "epoch": 937} {"train_loss": -21.252145767211914, "global_step": 77807, "epoch": 937} {"train_loss": -21.12272834777832, "global_step": 77808, "epoch": 937} {"train_loss": -21.325912475585938, "global_step": 77809, "epoch": 937} {"train_loss": -21.175338745117188, "global_step": 77810, "epoch": 937} {"train_loss": -20.96835708618164, "global_step": 77811, "epoch": 937} {"train_loss": -21.671689987182617, "global_step": 77812, "epoch": 937} {"train_loss": -21.027212142944336, "global_step": 77813, "epoch": 937} {"train_loss": -21.37298583984375, "global_step": 77814, "epoch": 937} {"train_loss": -21.18596839904785, "global_step": 77815, "epoch": 937} {"train_loss": -21.36106300354004, "global_step": 77816, "epoch": 937} {"train_loss": -21.164541244506836, "global_step": 77817, "epoch": 937} {"train_loss": -21.47113037109375, "global_step": 77818, "epoch": 937} {"train_loss": -21.181461334228516, "global_step": 77819, "epoch": 937} {"train_loss": -20.975975036621094, "global_step": 77820, "epoch": 937} {"train_loss": -21.243093490600586, "global_step": 77821, "epoch": 937} {"train_loss": -20.719623565673828, "global_step": 77822, "epoch": 937} {"train_loss": -21.18593406677246, "global_step": 77823, "epoch": 937} {"train_loss": -20.913785934448242, "global_step": 77824, "epoch": 937} {"train_loss": -21.339174270629883, "global_step": 77825, "epoch": 937} {"train_loss": -21.281232833862305, "global_step": 77826, "epoch": 937} {"train_loss": -20.718942642211914, "global_step": 77827, "epoch": 937} {"train_loss": -20.951093673706055, "global_step": 77828, "epoch": 937} {"train_loss": -21.214759826660156, "global_step": 77829, "epoch": 937} {"train_loss": -20.939212799072266, "global_step": 77830, "epoch": 937} {"train_loss": -20.896047592163086, "global_step": 77831, "epoch": 937} {"train_loss": -21.33854103088379, "global_step": 77832, "epoch": 937} {"train_loss": -20.89775848388672, "global_step": 77833, "epoch": 937} {"train_loss": -21.09354019165039, "global_step": 77834, "epoch": 937} {"train_loss": -21.03999900817871, "global_step": 77835, "epoch": 937} {"train_loss": -20.8640079498291, "global_step": 77836, "epoch": 937} {"train_loss": -20.882070541381836, "global_step": 77837, "epoch": 937} {"train_loss": -21.155948638916016, "global_step": 77838, "epoch": 937} {"train_loss": -21.117033004760742, "global_step": 77839, "epoch": 937} {"train_loss": -21.16522216796875, "global_step": 77840, "epoch": 937} {"train_loss": -21.368452072143555, "global_step": 77841, "epoch": 937} {"train_loss": -20.8763370513916, "global_step": 77842, "epoch": 937} {"train_loss": -21.009336471557617, "global_step": 77843, "epoch": 937} {"train_loss": -20.63985824584961, "global_step": 77844, "epoch": 937} {"train_loss": -20.948896408081055, "global_step": 77845, "epoch": 937} {"train_loss": -21.256877899169922, "global_step": 77846, "epoch": 937} {"train_loss": -21.019012451171875, "global_step": 77847, "epoch": 937} {"train_loss": -21.18160057067871, "global_step": 77848, "epoch": 937} {"train_loss": -21.24051284790039, "global_step": 77849, "epoch": 937} {"train_loss": -21.21930694580078, "global_step": 77850, "epoch": 937} {"train_loss": -21.238950729370117, "global_step": 77851, "epoch": 937} {"train_loss": -21.245481491088867, "global_step": 77852, "epoch": 937} {"train_loss": -21.099690793508508, "global_step": 77853, "epoch": 937, "val_loss": 6107749.0} {"train_loss": -20.156551361083984, "global_step": 77854, "epoch": 938} {"train_loss": -21.250843048095703, "global_step": 77855, "epoch": 938} {"train_loss": -20.454971313476562, "global_step": 77856, "epoch": 938} {"train_loss": -20.437116622924805, "global_step": 77857, "epoch": 938} {"train_loss": -20.54879379272461, "global_step": 77858, "epoch": 938} {"train_loss": -20.548925399780273, "global_step": 77859, "epoch": 938} {"train_loss": -20.671072006225586, "global_step": 77860, "epoch": 938} {"train_loss": -20.990272521972656, "global_step": 77861, "epoch": 938} {"train_loss": -21.16216468811035, "global_step": 77862, "epoch": 938} {"train_loss": -21.108245849609375, "global_step": 77863, "epoch": 938} {"train_loss": -20.788297653198242, "global_step": 77864, "epoch": 938} {"train_loss": -20.747095108032227, "global_step": 77865, "epoch": 938} {"train_loss": -21.145645141601562, "global_step": 77866, "epoch": 938} {"train_loss": -20.877988815307617, "global_step": 77867, "epoch": 938} {"train_loss": -21.47313117980957, "global_step": 77868, "epoch": 938} {"train_loss": -21.020584106445312, "global_step": 77869, "epoch": 938} {"train_loss": -21.062482833862305, "global_step": 77870, "epoch": 938} {"train_loss": -20.76544761657715, "global_step": 77871, "epoch": 938} {"train_loss": -20.955432891845703, "global_step": 77872, "epoch": 938} {"train_loss": -20.641698837280273, "global_step": 77873, "epoch": 938} {"train_loss": -21.251855850219727, "global_step": 77874, "epoch": 938} {"train_loss": -21.055253982543945, "global_step": 77875, "epoch": 938} {"train_loss": -20.887189865112305, "global_step": 77876, "epoch": 938} {"train_loss": -21.351486206054688, "global_step": 77877, "epoch": 938} {"train_loss": -20.8252010345459, "global_step": 77878, "epoch": 938} {"train_loss": -20.9232234954834, "global_step": 77879, "epoch": 938} {"train_loss": -21.58461570739746, "global_step": 77880, "epoch": 938} {"train_loss": -20.991064071655273, "global_step": 77881, "epoch": 938} {"train_loss": -21.186443328857422, "global_step": 77882, "epoch": 938} {"train_loss": -21.29843521118164, "global_step": 77883, "epoch": 938} {"train_loss": -21.141679763793945, "global_step": 77884, "epoch": 938} {"train_loss": -21.192642211914062, "global_step": 77885, "epoch": 938} {"train_loss": -21.179208755493164, "global_step": 77886, "epoch": 938} {"train_loss": -21.45503044128418, "global_step": 77887, "epoch": 938} {"train_loss": -21.135189056396484, "global_step": 77888, "epoch": 938} {"train_loss": -21.071640014648438, "global_step": 77889, "epoch": 938} {"train_loss": -21.3631591796875, "global_step": 77890, "epoch": 938} {"train_loss": -21.282678604125977, "global_step": 77891, "epoch": 938} {"train_loss": -20.89004135131836, "global_step": 77892, "epoch": 938} {"train_loss": -21.097318649291992, "global_step": 77893, "epoch": 938} {"train_loss": -21.262893676757812, "global_step": 77894, "epoch": 938} {"train_loss": -21.416818618774414, "global_step": 77895, "epoch": 938} {"train_loss": -20.892593383789062, "global_step": 77896, "epoch": 938} {"train_loss": -21.130807876586914, "global_step": 77897, "epoch": 938} {"train_loss": -21.21624183654785, "global_step": 77898, "epoch": 938} {"train_loss": -21.23982048034668, "global_step": 77899, "epoch": 938} {"train_loss": -21.307357788085938, "global_step": 77900, "epoch": 938} {"train_loss": -21.25644302368164, "global_step": 77901, "epoch": 938} {"train_loss": -21.204744338989258, "global_step": 77902, "epoch": 938} {"train_loss": -21.123260498046875, "global_step": 77903, "epoch": 938} {"train_loss": -21.134817123413086, "global_step": 77904, "epoch": 938} {"train_loss": -21.67849349975586, "global_step": 77905, "epoch": 938} {"train_loss": -20.849647521972656, "global_step": 77906, "epoch": 938} {"train_loss": -21.067197799682617, "global_step": 77907, "epoch": 938} {"train_loss": -21.359790802001953, "global_step": 77908, "epoch": 938} {"train_loss": -21.035144805908203, "global_step": 77909, "epoch": 938} {"train_loss": -21.572065353393555, "global_step": 77910, "epoch": 938} {"train_loss": -21.37738800048828, "global_step": 77911, "epoch": 938} {"train_loss": -21.19343376159668, "global_step": 77912, "epoch": 938} {"train_loss": -21.224184036254883, "global_step": 77913, "epoch": 938} {"train_loss": -21.215246200561523, "global_step": 77914, "epoch": 938} {"train_loss": -21.25619888305664, "global_step": 77915, "epoch": 938} {"train_loss": -20.92130470275879, "global_step": 77916, "epoch": 938} {"train_loss": -21.25322914123535, "global_step": 77917, "epoch": 938} {"train_loss": -21.24116325378418, "global_step": 77918, "epoch": 938} {"train_loss": -21.15674591064453, "global_step": 77919, "epoch": 938} {"train_loss": -20.98333168029785, "global_step": 77920, "epoch": 938} {"train_loss": -21.166587829589844, "global_step": 77921, "epoch": 938} {"train_loss": -21.190397262573242, "global_step": 77922, "epoch": 938} {"train_loss": -21.272132873535156, "global_step": 77923, "epoch": 938} {"train_loss": -21.343740463256836, "global_step": 77924, "epoch": 938} {"train_loss": -21.216550827026367, "global_step": 77925, "epoch": 938} {"train_loss": -21.570261001586914, "global_step": 77926, "epoch": 938} {"train_loss": -20.96544075012207, "global_step": 77927, "epoch": 938} {"train_loss": -21.144346237182617, "global_step": 77928, "epoch": 938} {"train_loss": -21.498708724975586, "global_step": 77929, "epoch": 938} {"train_loss": -20.997465133666992, "global_step": 77930, "epoch": 938} {"train_loss": -21.012380599975586, "global_step": 77931, "epoch": 938} {"train_loss": -21.626317977905273, "global_step": 77932, "epoch": 938} {"train_loss": -21.1420955657959, "global_step": 77933, "epoch": 938} {"train_loss": -21.219253540039062, "global_step": 77934, "epoch": 938} {"train_loss": -20.867704391479492, "global_step": 77935, "epoch": 938} {"train_loss": -21.114176692732844, "global_step": 77936, "epoch": 938, "val_loss": 6176965.0} {"train_loss": -21.00678825378418, "global_step": 77937, "epoch": 939} {"train_loss": -21.32503318786621, "global_step": 77938, "epoch": 939} {"train_loss": -20.94815444946289, "global_step": 77939, "epoch": 939} {"train_loss": -20.960546493530273, "global_step": 77940, "epoch": 939} {"train_loss": -20.734758377075195, "global_step": 77941, "epoch": 939} {"train_loss": -21.198925018310547, "global_step": 77942, "epoch": 939} {"train_loss": -20.89165496826172, "global_step": 77943, "epoch": 939} {"train_loss": -21.363719940185547, "global_step": 77944, "epoch": 939} {"train_loss": -21.34058952331543, "global_step": 77945, "epoch": 939} {"train_loss": -21.24920082092285, "global_step": 77946, "epoch": 939} {"train_loss": -21.03896713256836, "global_step": 77947, "epoch": 939} {"train_loss": -20.987966537475586, "global_step": 77948, "epoch": 939} {"train_loss": -21.103376388549805, "global_step": 77949, "epoch": 939} {"train_loss": -20.833831787109375, "global_step": 77950, "epoch": 939} {"train_loss": -20.836139678955078, "global_step": 77951, "epoch": 939} {"train_loss": -21.49932289123535, "global_step": 77952, "epoch": 939} {"train_loss": -20.67352867126465, "global_step": 77953, "epoch": 939} {"train_loss": -21.285058975219727, "global_step": 77954, "epoch": 939} {"train_loss": -21.107351303100586, "global_step": 77955, "epoch": 939} {"train_loss": -21.03468132019043, "global_step": 77956, "epoch": 939} {"train_loss": -21.349502563476562, "global_step": 77957, "epoch": 939} {"train_loss": -21.246747970581055, "global_step": 77958, "epoch": 939} {"train_loss": -21.04281234741211, "global_step": 77959, "epoch": 939} {"train_loss": -21.14464569091797, "global_step": 77960, "epoch": 939} {"train_loss": -21.51405906677246, "global_step": 77961, "epoch": 939} {"train_loss": -21.12604331970215, "global_step": 77962, "epoch": 939} {"train_loss": -21.395732879638672, "global_step": 77963, "epoch": 939} {"train_loss": -21.54163932800293, "global_step": 77964, "epoch": 939} {"train_loss": -20.94782829284668, "global_step": 77965, "epoch": 939} {"train_loss": -20.96072769165039, "global_step": 77966, "epoch": 939} {"train_loss": -20.911130905151367, "global_step": 77967, "epoch": 939} {"train_loss": -21.271406173706055, "global_step": 77968, "epoch": 939} {"train_loss": -20.95884132385254, "global_step": 77969, "epoch": 939} {"train_loss": -21.159725189208984, "global_step": 77970, "epoch": 939} {"train_loss": -21.309064865112305, "global_step": 77971, "epoch": 939} {"train_loss": -20.970111846923828, "global_step": 77972, "epoch": 939} {"train_loss": -20.487783432006836, "global_step": 77973, "epoch": 939} {"train_loss": -20.839696884155273, "global_step": 77974, "epoch": 939} {"train_loss": -20.989187240600586, "global_step": 77975, "epoch": 939} {"train_loss": -21.245683670043945, "global_step": 77976, "epoch": 939} {"train_loss": -21.079069137573242, "global_step": 77977, "epoch": 939} {"train_loss": -21.235300064086914, "global_step": 77978, "epoch": 939} {"train_loss": -21.191024780273438, "global_step": 77979, "epoch": 939} {"train_loss": -21.095718383789062, "global_step": 77980, "epoch": 939} {"train_loss": -21.2303409576416, "global_step": 77981, "epoch": 939} {"train_loss": -21.17746353149414, "global_step": 77982, "epoch": 939} {"train_loss": -21.200090408325195, "global_step": 77983, "epoch": 939} {"train_loss": -21.267602920532227, "global_step": 77984, "epoch": 939} {"train_loss": -21.106718063354492, "global_step": 77985, "epoch": 939} {"train_loss": -20.551725387573242, "global_step": 77986, "epoch": 939} {"train_loss": -21.2636661529541, "global_step": 77987, "epoch": 939} {"train_loss": -20.963794708251953, "global_step": 77988, "epoch": 939} {"train_loss": -20.965778350830078, "global_step": 77989, "epoch": 939} {"train_loss": -21.58016014099121, "global_step": 77990, "epoch": 939} {"train_loss": -21.13979148864746, "global_step": 77991, "epoch": 939} {"train_loss": -21.393156051635742, "global_step": 77992, "epoch": 939} {"train_loss": -20.68178367614746, "global_step": 77993, "epoch": 939} {"train_loss": -20.90789222717285, "global_step": 77994, "epoch": 939} {"train_loss": -21.265575408935547, "global_step": 77995, "epoch": 939} {"train_loss": -21.30014419555664, "global_step": 77996, "epoch": 939} {"train_loss": -21.185514450073242, "global_step": 77997, "epoch": 939} {"train_loss": -21.32485580444336, "global_step": 77998, "epoch": 939} {"train_loss": -20.955862045288086, "global_step": 77999, "epoch": 939} {"train_loss": -21.18833351135254, "global_step": 78000, "epoch": 939} {"train_loss": -21.239320755004883, "global_step": 78001, "epoch": 939} {"train_loss": -21.239744186401367, "global_step": 78002, "epoch": 939} {"train_loss": -21.141672134399414, "global_step": 78003, "epoch": 939} {"train_loss": -21.177976608276367, "global_step": 78004, "epoch": 939} {"train_loss": -21.130735397338867, "global_step": 78005, "epoch": 939} {"train_loss": -20.783384323120117, "global_step": 78006, "epoch": 939} {"train_loss": -21.12250328063965, "global_step": 78007, "epoch": 939} {"train_loss": -21.40082359313965, "global_step": 78008, "epoch": 939} {"train_loss": -21.003955841064453, "global_step": 78009, "epoch": 939} {"train_loss": -21.208450317382812, "global_step": 78010, "epoch": 939} {"train_loss": -21.141286849975586, "global_step": 78011, "epoch": 939} {"train_loss": -21.08932876586914, "global_step": 78012, "epoch": 939} {"train_loss": -20.9378604888916, "global_step": 78013, "epoch": 939} {"train_loss": -20.807138442993164, "global_step": 78014, "epoch": 939} {"train_loss": -21.39836883544922, "global_step": 78015, "epoch": 939} {"train_loss": -21.07845687866211, "global_step": 78016, "epoch": 939} {"train_loss": -20.950559616088867, "global_step": 78017, "epoch": 939} {"train_loss": -21.117027282714844, "global_step": 78018, "epoch": 939} {"train_loss": -21.12055291325213, "global_step": 78019, "epoch": 939, "val_loss": 6308225.0} {"train_loss": -20.176374435424805, "global_step": 78020, "epoch": 940} {"train_loss": -20.867191314697266, "global_step": 78021, "epoch": 940} {"train_loss": -20.775680541992188, "global_step": 78022, "epoch": 940} {"train_loss": -20.360986709594727, "global_step": 78023, "epoch": 940} {"train_loss": -20.862333297729492, "global_step": 78024, "epoch": 940} {"train_loss": -20.46330451965332, "global_step": 78025, "epoch": 940} {"train_loss": -20.797447204589844, "global_step": 78026, "epoch": 940} {"train_loss": -20.806232452392578, "global_step": 78027, "epoch": 940} {"train_loss": -20.726734161376953, "global_step": 78028, "epoch": 940} {"train_loss": -20.568769454956055, "global_step": 78029, "epoch": 940} {"train_loss": -20.55653190612793, "global_step": 78030, "epoch": 940} {"train_loss": -21.007736206054688, "global_step": 78031, "epoch": 940} {"train_loss": -21.075544357299805, "global_step": 78032, "epoch": 940} {"train_loss": -20.627492904663086, "global_step": 78033, "epoch": 940} {"train_loss": -20.92709732055664, "global_step": 78034, "epoch": 940} {"train_loss": -21.01472282409668, "global_step": 78035, "epoch": 940} {"train_loss": -20.80857276916504, "global_step": 78036, "epoch": 940} {"train_loss": -20.7047176361084, "global_step": 78037, "epoch": 940} {"train_loss": -21.05109214782715, "global_step": 78038, "epoch": 940} {"train_loss": -21.26344871520996, "global_step": 78039, "epoch": 940} {"train_loss": -20.872039794921875, "global_step": 78040, "epoch": 940} {"train_loss": -20.935300827026367, "global_step": 78041, "epoch": 940} {"train_loss": -20.866384506225586, "global_step": 78042, "epoch": 940} {"train_loss": -21.39224624633789, "global_step": 78043, "epoch": 940} {"train_loss": -21.303146362304688, "global_step": 78044, "epoch": 940} {"train_loss": -21.086673736572266, "global_step": 78045, "epoch": 940} {"train_loss": -20.770177841186523, "global_step": 78046, "epoch": 940} {"train_loss": -21.071102142333984, "global_step": 78047, "epoch": 940} {"train_loss": -21.26736831665039, "global_step": 78048, "epoch": 940} {"train_loss": -20.997146606445312, "global_step": 78049, "epoch": 940} {"train_loss": -21.013774871826172, "global_step": 78050, "epoch": 940} {"train_loss": -20.961984634399414, "global_step": 78051, "epoch": 940} {"train_loss": -21.170509338378906, "global_step": 78052, "epoch": 940} {"train_loss": -21.206192016601562, "global_step": 78053, "epoch": 940} {"train_loss": -21.21076011657715, "global_step": 78054, "epoch": 940} {"train_loss": -21.418624877929688, "global_step": 78055, "epoch": 940} {"train_loss": -21.205982208251953, "global_step": 78056, "epoch": 940} {"train_loss": -20.94746971130371, "global_step": 78057, "epoch": 940} {"train_loss": -21.141324996948242, "global_step": 78058, "epoch": 940} {"train_loss": -21.151456832885742, "global_step": 78059, "epoch": 940} {"train_loss": -20.856237411499023, "global_step": 78060, "epoch": 940} {"train_loss": -21.30536460876465, "global_step": 78061, "epoch": 940} {"train_loss": -20.69829559326172, "global_step": 78062, "epoch": 940} {"train_loss": -21.075164794921875, "global_step": 78063, "epoch": 940} {"train_loss": -20.756784439086914, "global_step": 78064, "epoch": 940} {"train_loss": -20.949247360229492, "global_step": 78065, "epoch": 940} {"train_loss": -21.04579734802246, "global_step": 78066, "epoch": 940} {"train_loss": -21.392480850219727, "global_step": 78067, "epoch": 940} {"train_loss": -21.049449920654297, "global_step": 78068, "epoch": 940} {"train_loss": -21.023517608642578, "global_step": 78069, "epoch": 940} {"train_loss": -21.07697105407715, "global_step": 78070, "epoch": 940} {"train_loss": -20.642173767089844, "global_step": 78071, "epoch": 940} {"train_loss": -20.859128952026367, "global_step": 78072, "epoch": 940} {"train_loss": -21.109312057495117, "global_step": 78073, "epoch": 940} {"train_loss": -20.807058334350586, "global_step": 78074, "epoch": 940} {"train_loss": -21.297779083251953, "global_step": 78075, "epoch": 940} {"train_loss": -21.680757522583008, "global_step": 78076, "epoch": 940} {"train_loss": -21.148900985717773, "global_step": 78077, "epoch": 940} {"train_loss": -21.20391845703125, "global_step": 78078, "epoch": 940} {"train_loss": -20.87637710571289, "global_step": 78079, "epoch": 940} {"train_loss": -20.960783004760742, "global_step": 78080, "epoch": 940} {"train_loss": -21.081470489501953, "global_step": 78081, "epoch": 940} {"train_loss": -21.197111129760742, "global_step": 78082, "epoch": 940} {"train_loss": -21.126663208007812, "global_step": 78083, "epoch": 940} {"train_loss": -20.875934600830078, "global_step": 78084, "epoch": 940} {"train_loss": -21.26859474182129, "global_step": 78085, "epoch": 940} {"train_loss": -20.90130615234375, "global_step": 78086, "epoch": 940} {"train_loss": -21.36734390258789, "global_step": 78087, "epoch": 940} {"train_loss": -21.218204498291016, "global_step": 78088, "epoch": 940} {"train_loss": -21.3281307220459, "global_step": 78089, "epoch": 940} {"train_loss": -21.081466674804688, "global_step": 78090, "epoch": 940} {"train_loss": -21.120718002319336, "global_step": 78091, "epoch": 940} {"train_loss": -21.160255432128906, "global_step": 78092, "epoch": 940} {"train_loss": -21.703266143798828, "global_step": 78093, "epoch": 940} {"train_loss": -20.910354614257812, "global_step": 78094, "epoch": 940} {"train_loss": -21.2064266204834, "global_step": 78095, "epoch": 940} {"train_loss": -20.978256225585938, "global_step": 78096, "epoch": 940} {"train_loss": -21.22651481628418, "global_step": 78097, "epoch": 940} {"train_loss": -21.09333610534668, "global_step": 78098, "epoch": 940} {"train_loss": -21.00211524963379, "global_step": 78099, "epoch": 940} {"train_loss": -21.455703735351562, "global_step": 78100, "epoch": 940} {"train_loss": -21.450838088989258, "global_step": 78101, "epoch": 940} {"train_loss": -21.01157742236034, "global_step": 78102, "epoch": 940, "val_loss": 6020451.5} {"train_loss": -21.22144889831543, "global_step": 78103, "epoch": 941} {"train_loss": -21.4274959564209, "global_step": 78104, "epoch": 941} {"train_loss": -21.43153953552246, "global_step": 78105, "epoch": 941} {"train_loss": -21.336318969726562, "global_step": 78106, "epoch": 941} {"train_loss": -21.14173698425293, "global_step": 78107, "epoch": 941} {"train_loss": -21.395654678344727, "global_step": 78108, "epoch": 941} {"train_loss": -21.211994171142578, "global_step": 78109, "epoch": 941} {"train_loss": -21.192262649536133, "global_step": 78110, "epoch": 941} {"train_loss": -20.962310791015625, "global_step": 78111, "epoch": 941} {"train_loss": -21.09902000427246, "global_step": 78112, "epoch": 941} {"train_loss": -21.27796173095703, "global_step": 78113, "epoch": 941} {"train_loss": -21.095720291137695, "global_step": 78114, "epoch": 941} {"train_loss": -21.241056442260742, "global_step": 78115, "epoch": 941} {"train_loss": -21.196439743041992, "global_step": 78116, "epoch": 941} {"train_loss": -21.497928619384766, "global_step": 78117, "epoch": 941} {"train_loss": -21.180150985717773, "global_step": 78118, "epoch": 941} {"train_loss": -21.2531795501709, "global_step": 78119, "epoch": 941} {"train_loss": -21.182600021362305, "global_step": 78120, "epoch": 941} {"train_loss": -20.918771743774414, "global_step": 78121, "epoch": 941} {"train_loss": -21.110275268554688, "global_step": 78122, "epoch": 941} {"train_loss": -20.92099380493164, "global_step": 78123, "epoch": 941} {"train_loss": -20.896697998046875, "global_step": 78124, "epoch": 941} {"train_loss": -21.138671875, "global_step": 78125, "epoch": 941} {"train_loss": -20.889196395874023, "global_step": 78126, "epoch": 941} {"train_loss": -20.782928466796875, "global_step": 78127, "epoch": 941} {"train_loss": -21.1114501953125, "global_step": 78128, "epoch": 941} {"train_loss": -21.26505470275879, "global_step": 78129, "epoch": 941} {"train_loss": -21.12165641784668, "global_step": 78130, "epoch": 941} {"train_loss": -21.304128646850586, "global_step": 78131, "epoch": 941} {"train_loss": -21.065414428710938, "global_step": 78132, "epoch": 941} {"train_loss": -20.928817749023438, "global_step": 78133, "epoch": 941} {"train_loss": -21.10757064819336, "global_step": 78134, "epoch": 941} {"train_loss": -21.013397216796875, "global_step": 78135, "epoch": 941} {"train_loss": -21.140043258666992, "global_step": 78136, "epoch": 941} {"train_loss": -21.2758731842041, "global_step": 78137, "epoch": 941} {"train_loss": -21.00600242614746, "global_step": 78138, "epoch": 941} {"train_loss": -21.183942794799805, "global_step": 78139, "epoch": 941} {"train_loss": -21.280977249145508, "global_step": 78140, "epoch": 941} {"train_loss": -20.9896240234375, "global_step": 78141, "epoch": 941} {"train_loss": -21.31987190246582, "global_step": 78142, "epoch": 941} {"train_loss": -21.076536178588867, "global_step": 78143, "epoch": 941} {"train_loss": -21.317481994628906, "global_step": 78144, "epoch": 941} {"train_loss": -21.05986976623535, "global_step": 78145, "epoch": 941} {"train_loss": -21.1981258392334, "global_step": 78146, "epoch": 941} {"train_loss": -21.3013858795166, "global_step": 78147, "epoch": 941} {"train_loss": -21.477100372314453, "global_step": 78148, "epoch": 941} {"train_loss": -21.479944229125977, "global_step": 78149, "epoch": 941} {"train_loss": -20.879783630371094, "global_step": 78150, "epoch": 941} {"train_loss": -21.023893356323242, "global_step": 78151, "epoch": 941} {"train_loss": -21.21773910522461, "global_step": 78152, "epoch": 941} {"train_loss": -21.391239166259766, "global_step": 78153, "epoch": 941} {"train_loss": -21.195720672607422, "global_step": 78154, "epoch": 941} {"train_loss": -21.317487716674805, "global_step": 78155, "epoch": 941} {"train_loss": -20.729534149169922, "global_step": 78156, "epoch": 941} {"train_loss": -20.683135986328125, "global_step": 78157, "epoch": 941} {"train_loss": -20.8452205657959, "global_step": 78158, "epoch": 941} {"train_loss": -21.123517990112305, "global_step": 78159, "epoch": 941} {"train_loss": -20.728403091430664, "global_step": 78160, "epoch": 941} {"train_loss": -21.1298828125, "global_step": 78161, "epoch": 941} {"train_loss": -20.428279876708984, "global_step": 78162, "epoch": 941} {"train_loss": -21.15071678161621, "global_step": 78163, "epoch": 941} {"train_loss": -20.86940574645996, "global_step": 78164, "epoch": 941} {"train_loss": -20.979204177856445, "global_step": 78165, "epoch": 941} {"train_loss": -21.259628295898438, "global_step": 78166, "epoch": 941} {"train_loss": -21.152238845825195, "global_step": 78167, "epoch": 941} {"train_loss": -20.889188766479492, "global_step": 78168, "epoch": 941} {"train_loss": -21.165355682373047, "global_step": 78169, "epoch": 941} {"train_loss": -20.85736083984375, "global_step": 78170, "epoch": 941} {"train_loss": -21.376253128051758, "global_step": 78171, "epoch": 941} {"train_loss": -21.06593894958496, "global_step": 78172, "epoch": 941} {"train_loss": -21.04524040222168, "global_step": 78173, "epoch": 941} {"train_loss": -21.28452491760254, "global_step": 78174, "epoch": 941} {"train_loss": -21.18525505065918, "global_step": 78175, "epoch": 941} {"train_loss": -21.33864402770996, "global_step": 78176, "epoch": 941} {"train_loss": -21.043004989624023, "global_step": 78177, "epoch": 941} {"train_loss": -21.329538345336914, "global_step": 78178, "epoch": 941} {"train_loss": -20.806594848632812, "global_step": 78179, "epoch": 941} {"train_loss": -20.676115036010742, "global_step": 78180, "epoch": 941} {"train_loss": -21.437362670898438, "global_step": 78181, "epoch": 941} {"train_loss": -21.084598541259766, "global_step": 78182, "epoch": 941} {"train_loss": -21.23615837097168, "global_step": 78183, "epoch": 941} {"train_loss": -21.523466110229492, "global_step": 78184, "epoch": 941} {"train_loss": -21.11508771597621, "global_step": 78185, "epoch": 941, "val_loss": 6216586.5} {"train_loss": -20.547876358032227, "global_step": 78186, "epoch": 942} {"train_loss": -20.320615768432617, "global_step": 78187, "epoch": 942} {"train_loss": -20.602415084838867, "global_step": 78188, "epoch": 942} {"train_loss": -20.39586067199707, "global_step": 78189, "epoch": 942} {"train_loss": -20.7592830657959, "global_step": 78190, "epoch": 942} {"train_loss": -20.492799758911133, "global_step": 78191, "epoch": 942} {"train_loss": -20.378223419189453, "global_step": 78192, "epoch": 942} {"train_loss": -20.714853286743164, "global_step": 78193, "epoch": 942} {"train_loss": -20.755970001220703, "global_step": 78194, "epoch": 942} {"train_loss": -20.914133071899414, "global_step": 78195, "epoch": 942} {"train_loss": -20.597360610961914, "global_step": 78196, "epoch": 942} {"train_loss": -20.747777938842773, "global_step": 78197, "epoch": 942} {"train_loss": -20.631389617919922, "global_step": 78198, "epoch": 942} {"train_loss": -21.049039840698242, "global_step": 78199, "epoch": 942} {"train_loss": -20.81005096435547, "global_step": 78200, "epoch": 942} {"train_loss": -21.281909942626953, "global_step": 78201, "epoch": 942} {"train_loss": -20.521276473999023, "global_step": 78202, "epoch": 942} {"train_loss": -20.974863052368164, "global_step": 78203, "epoch": 942} {"train_loss": -20.9672908782959, "global_step": 78204, "epoch": 942} {"train_loss": -20.985979080200195, "global_step": 78205, "epoch": 942} {"train_loss": -21.0755558013916, "global_step": 78206, "epoch": 942} {"train_loss": -21.06379508972168, "global_step": 78207, "epoch": 942} {"train_loss": -20.71161460876465, "global_step": 78208, "epoch": 942} {"train_loss": -20.706161499023438, "global_step": 78209, "epoch": 942} {"train_loss": -21.02495765686035, "global_step": 78210, "epoch": 942} {"train_loss": -21.269943237304688, "global_step": 78211, "epoch": 942} {"train_loss": -21.170917510986328, "global_step": 78212, "epoch": 942} {"train_loss": -20.821319580078125, "global_step": 78213, "epoch": 942} {"train_loss": -20.853010177612305, "global_step": 78214, "epoch": 942} {"train_loss": -21.063810348510742, "global_step": 78215, "epoch": 942} {"train_loss": -21.037233352661133, "global_step": 78216, "epoch": 942} {"train_loss": -20.93829345703125, "global_step": 78217, "epoch": 942} {"train_loss": -21.079675674438477, "global_step": 78218, "epoch": 942} {"train_loss": -20.855390548706055, "global_step": 78219, "epoch": 942} {"train_loss": -21.146488189697266, "global_step": 78220, "epoch": 942} {"train_loss": -21.446420669555664, "global_step": 78221, "epoch": 942} {"train_loss": -20.991621017456055, "global_step": 78222, "epoch": 942} {"train_loss": -21.020986557006836, "global_step": 78223, "epoch": 942} {"train_loss": -21.435596466064453, "global_step": 78224, "epoch": 942} {"train_loss": -20.828426361083984, "global_step": 78225, "epoch": 942} {"train_loss": -20.950849533081055, "global_step": 78226, "epoch": 942} {"train_loss": -21.341754913330078, "global_step": 78227, "epoch": 942} {"train_loss": -20.858503341674805, "global_step": 78228, "epoch": 942} {"train_loss": -20.958162307739258, "global_step": 78229, "epoch": 942} {"train_loss": -21.1771183013916, "global_step": 78230, "epoch": 942} {"train_loss": -21.28558349609375, "global_step": 78231, "epoch": 942} {"train_loss": -21.074100494384766, "global_step": 78232, "epoch": 942} {"train_loss": -21.032007217407227, "global_step": 78233, "epoch": 942} {"train_loss": -20.970111846923828, "global_step": 78234, "epoch": 942} {"train_loss": -21.014501571655273, "global_step": 78235, "epoch": 942} {"train_loss": -21.34430503845215, "global_step": 78236, "epoch": 942} {"train_loss": -21.201251983642578, "global_step": 78237, "epoch": 942} {"train_loss": -21.57172966003418, "global_step": 78238, "epoch": 942} {"train_loss": -21.258764266967773, "global_step": 78239, "epoch": 942} {"train_loss": -20.79003143310547, "global_step": 78240, "epoch": 942} {"train_loss": -21.02655029296875, "global_step": 78241, "epoch": 942} {"train_loss": -21.082822799682617, "global_step": 78242, "epoch": 942} {"train_loss": -20.999786376953125, "global_step": 78243, "epoch": 942} {"train_loss": -20.780153274536133, "global_step": 78244, "epoch": 942} {"train_loss": -21.667285919189453, "global_step": 78245, "epoch": 942} {"train_loss": -20.823144912719727, "global_step": 78246, "epoch": 942} {"train_loss": -21.178831100463867, "global_step": 78247, "epoch": 942} {"train_loss": -21.28468132019043, "global_step": 78248, "epoch": 942} {"train_loss": -21.178653717041016, "global_step": 78249, "epoch": 942} {"train_loss": -21.024084091186523, "global_step": 78250, "epoch": 942} {"train_loss": -21.315689086914062, "global_step": 78251, "epoch": 942} {"train_loss": -21.371267318725586, "global_step": 78252, "epoch": 942} {"train_loss": -21.504032135009766, "global_step": 78253, "epoch": 942} {"train_loss": -21.10029411315918, "global_step": 78254, "epoch": 942} {"train_loss": -21.25611686706543, "global_step": 78255, "epoch": 942} {"train_loss": -21.386857986450195, "global_step": 78256, "epoch": 942} {"train_loss": -21.680402755737305, "global_step": 78257, "epoch": 942} {"train_loss": -21.284353256225586, "global_step": 78258, "epoch": 942} {"train_loss": -21.322181701660156, "global_step": 78259, "epoch": 942} {"train_loss": -20.981809616088867, "global_step": 78260, "epoch": 942} {"train_loss": -21.5283203125, "global_step": 78261, "epoch": 942} {"train_loss": -21.285253524780273, "global_step": 78262, "epoch": 942} {"train_loss": -21.70326805114746, "global_step": 78263, "epoch": 942} {"train_loss": -21.396854400634766, "global_step": 78264, "epoch": 942} {"train_loss": -20.83695411682129, "global_step": 78265, "epoch": 942} {"train_loss": -21.023202896118164, "global_step": 78266, "epoch": 942} {"train_loss": -21.30286979675293, "global_step": 78267, "epoch": 942} {"train_loss": -21.0455700518137, "global_step": 78268, "epoch": 942, "val_loss": 6196508.0} {"train_loss": -21.018951416015625, "global_step": 78269, "epoch": 943} {"train_loss": -20.718679428100586, "global_step": 78270, "epoch": 943} {"train_loss": -20.904438018798828, "global_step": 78271, "epoch": 943} {"train_loss": -21.18949317932129, "global_step": 78272, "epoch": 943} {"train_loss": -20.804723739624023, "global_step": 78273, "epoch": 943} {"train_loss": -20.955398559570312, "global_step": 78274, "epoch": 943} {"train_loss": -20.96108055114746, "global_step": 78275, "epoch": 943} {"train_loss": -21.02328109741211, "global_step": 78276, "epoch": 943} {"train_loss": -21.2925968170166, "global_step": 78277, "epoch": 943} {"train_loss": -20.731313705444336, "global_step": 78278, "epoch": 943} {"train_loss": -21.33392906188965, "global_step": 78279, "epoch": 943} {"train_loss": -21.059345245361328, "global_step": 78280, "epoch": 943} {"train_loss": -21.173349380493164, "global_step": 78281, "epoch": 943} {"train_loss": -20.90395164489746, "global_step": 78282, "epoch": 943} {"train_loss": -20.991008758544922, "global_step": 78283, "epoch": 943} {"train_loss": -21.016067504882812, "global_step": 78284, "epoch": 943} {"train_loss": -20.92830467224121, "global_step": 78285, "epoch": 943} {"train_loss": -21.187326431274414, "global_step": 78286, "epoch": 943} {"train_loss": -21.358402252197266, "global_step": 78287, "epoch": 943} {"train_loss": -21.228561401367188, "global_step": 78288, "epoch": 943} {"train_loss": -20.909452438354492, "global_step": 78289, "epoch": 943} {"train_loss": -21.286514282226562, "global_step": 78290, "epoch": 943} {"train_loss": -21.402969360351562, "global_step": 78291, "epoch": 943} {"train_loss": -21.493207931518555, "global_step": 78292, "epoch": 943} {"train_loss": -21.003650665283203, "global_step": 78293, "epoch": 943} {"train_loss": -21.272748947143555, "global_step": 78294, "epoch": 943} {"train_loss": -21.0847225189209, "global_step": 78295, "epoch": 943} {"train_loss": -20.99553871154785, "global_step": 78296, "epoch": 943} {"train_loss": -20.8743839263916, "global_step": 78297, "epoch": 943} {"train_loss": -20.997343063354492, "global_step": 78298, "epoch": 943} {"train_loss": -20.993070602416992, "global_step": 78299, "epoch": 943} {"train_loss": -21.35460090637207, "global_step": 78300, "epoch": 943} {"train_loss": -20.847869873046875, "global_step": 78301, "epoch": 943} {"train_loss": -20.84191131591797, "global_step": 78302, "epoch": 943} {"train_loss": -21.225507736206055, "global_step": 78303, "epoch": 943} {"train_loss": -20.994281768798828, "global_step": 78304, "epoch": 943} {"train_loss": -21.10582160949707, "global_step": 78305, "epoch": 943} {"train_loss": -21.1497859954834, "global_step": 78306, "epoch": 943} {"train_loss": -21.464447021484375, "global_step": 78307, "epoch": 943} {"train_loss": -21.544261932373047, "global_step": 78308, "epoch": 943} {"train_loss": -21.040197372436523, "global_step": 78309, "epoch": 943} {"train_loss": -21.101743698120117, "global_step": 78310, "epoch": 943} {"train_loss": -20.794498443603516, "global_step": 78311, "epoch": 943} {"train_loss": -20.946029663085938, "global_step": 78312, "epoch": 943} {"train_loss": -20.92584800720215, "global_step": 78313, "epoch": 943} {"train_loss": -21.353342056274414, "global_step": 78314, "epoch": 943} {"train_loss": -21.020116806030273, "global_step": 78315, "epoch": 943} {"train_loss": -21.163904190063477, "global_step": 78316, "epoch": 943} {"train_loss": -21.172632217407227, "global_step": 78317, "epoch": 943} {"train_loss": -21.210859298706055, "global_step": 78318, "epoch": 943} {"train_loss": -21.16446304321289, "global_step": 78319, "epoch": 943} {"train_loss": -21.512495040893555, "global_step": 78320, "epoch": 943} {"train_loss": -20.920978546142578, "global_step": 78321, "epoch": 943} {"train_loss": -21.084192276000977, "global_step": 78322, "epoch": 943} {"train_loss": -21.182092666625977, "global_step": 78323, "epoch": 943} {"train_loss": -20.764724731445312, "global_step": 78324, "epoch": 943} {"train_loss": -21.225055694580078, "global_step": 78325, "epoch": 943} {"train_loss": -21.204479217529297, "global_step": 78326, "epoch": 943} {"train_loss": -21.123966217041016, "global_step": 78327, "epoch": 943} {"train_loss": -21.384601593017578, "global_step": 78328, "epoch": 943} {"train_loss": -21.348464965820312, "global_step": 78329, "epoch": 943} {"train_loss": -21.093595504760742, "global_step": 78330, "epoch": 943} {"train_loss": -21.698110580444336, "global_step": 78331, "epoch": 943} {"train_loss": -21.17608070373535, "global_step": 78332, "epoch": 943} {"train_loss": -21.166208267211914, "global_step": 78333, "epoch": 943} {"train_loss": -21.41635513305664, "global_step": 78334, "epoch": 943} {"train_loss": -21.08039093017578, "global_step": 78335, "epoch": 943} {"train_loss": -21.092323303222656, "global_step": 78336, "epoch": 943} {"train_loss": -21.167160034179688, "global_step": 78337, "epoch": 943} {"train_loss": -21.165494918823242, "global_step": 78338, "epoch": 943} {"train_loss": -21.290075302124023, "global_step": 78339, "epoch": 943} {"train_loss": -20.965194702148438, "global_step": 78340, "epoch": 943} {"train_loss": -21.337892532348633, "global_step": 78341, "epoch": 943} {"train_loss": -21.201004028320312, "global_step": 78342, "epoch": 943} {"train_loss": -20.93422508239746, "global_step": 78343, "epoch": 943} {"train_loss": -20.865488052368164, "global_step": 78344, "epoch": 943} {"train_loss": -21.554180145263672, "global_step": 78345, "epoch": 943} {"train_loss": -21.325143814086914, "global_step": 78346, "epoch": 943} {"train_loss": -21.080686569213867, "global_step": 78347, "epoch": 943} {"train_loss": -21.51615333557129, "global_step": 78348, "epoch": 943} {"train_loss": -21.177343368530273, "global_step": 78349, "epoch": 943} {"train_loss": -21.25343132019043, "global_step": 78350, "epoch": 943} {"train_loss": -21.121961088065643, "global_step": 78351, "epoch": 943, "val_loss": 6102714.0} {"train_loss": -20.476348876953125, "global_step": 78352, "epoch": 944} {"train_loss": -20.713098526000977, "global_step": 78353, "epoch": 944} {"train_loss": -20.603254318237305, "global_step": 78354, "epoch": 944} {"train_loss": -21.063573837280273, "global_step": 78355, "epoch": 944} {"train_loss": -20.359907150268555, "global_step": 78356, "epoch": 944} {"train_loss": -20.764192581176758, "global_step": 78357, "epoch": 944} {"train_loss": -20.874561309814453, "global_step": 78358, "epoch": 944} {"train_loss": -21.056352615356445, "global_step": 78359, "epoch": 944} {"train_loss": -21.062164306640625, "global_step": 78360, "epoch": 944} {"train_loss": -20.854320526123047, "global_step": 78361, "epoch": 944} {"train_loss": -21.12555503845215, "global_step": 78362, "epoch": 944} {"train_loss": -20.908884048461914, "global_step": 78363, "epoch": 944} {"train_loss": -20.789907455444336, "global_step": 78364, "epoch": 944} {"train_loss": -21.255521774291992, "global_step": 78365, "epoch": 944} {"train_loss": -20.537277221679688, "global_step": 78366, "epoch": 944} {"train_loss": -21.299097061157227, "global_step": 78367, "epoch": 944} {"train_loss": -21.22871971130371, "global_step": 78368, "epoch": 944} {"train_loss": -20.65363121032715, "global_step": 78369, "epoch": 944} {"train_loss": -21.11671257019043, "global_step": 78370, "epoch": 944} {"train_loss": -20.860570907592773, "global_step": 78371, "epoch": 944} {"train_loss": -21.1618595123291, "global_step": 78372, "epoch": 944} {"train_loss": -20.960840225219727, "global_step": 78373, "epoch": 944} {"train_loss": -20.946531295776367, "global_step": 78374, "epoch": 944} {"train_loss": -20.92476463317871, "global_step": 78375, "epoch": 944} {"train_loss": -20.82114601135254, "global_step": 78376, "epoch": 944} {"train_loss": -21.037763595581055, "global_step": 78377, "epoch": 944} {"train_loss": -20.973941802978516, "global_step": 78378, "epoch": 944} {"train_loss": -21.03969383239746, "global_step": 78379, "epoch": 944} {"train_loss": -21.20912742614746, "global_step": 78380, "epoch": 944} {"train_loss": -21.1740779876709, "global_step": 78381, "epoch": 944} {"train_loss": -21.09991455078125, "global_step": 78382, "epoch": 944} {"train_loss": -21.662092208862305, "global_step": 78383, "epoch": 944} {"train_loss": -20.7468204498291, "global_step": 78384, "epoch": 944} {"train_loss": -20.709701538085938, "global_step": 78385, "epoch": 944} {"train_loss": -21.150909423828125, "global_step": 78386, "epoch": 944} {"train_loss": -20.853378295898438, "global_step": 78387, "epoch": 944} {"train_loss": -21.09442901611328, "global_step": 78388, "epoch": 944} {"train_loss": -21.07674217224121, "global_step": 78389, "epoch": 944} {"train_loss": -20.8769474029541, "global_step": 78390, "epoch": 944} {"train_loss": -21.158708572387695, "global_step": 78391, "epoch": 944} {"train_loss": -21.25672721862793, "global_step": 78392, "epoch": 944} {"train_loss": -21.18450927734375, "global_step": 78393, "epoch": 944} {"train_loss": -20.8267822265625, "global_step": 78394, "epoch": 944} {"train_loss": -21.100854873657227, "global_step": 78395, "epoch": 944} {"train_loss": -21.223100662231445, "global_step": 78396, "epoch": 944} {"train_loss": -21.087791442871094, "global_step": 78397, "epoch": 944} {"train_loss": -20.985431671142578, "global_step": 78398, "epoch": 944} {"train_loss": -21.136314392089844, "global_step": 78399, "epoch": 944} {"train_loss": -21.092390060424805, "global_step": 78400, "epoch": 944} {"train_loss": -21.159616470336914, "global_step": 78401, "epoch": 944} {"train_loss": -21.247787475585938, "global_step": 78402, "epoch": 944} {"train_loss": -21.1993465423584, "global_step": 78403, "epoch": 944} {"train_loss": -21.042404174804688, "global_step": 78404, "epoch": 944} {"train_loss": -21.166898727416992, "global_step": 78405, "epoch": 944} {"train_loss": -21.075271606445312, "global_step": 78406, "epoch": 944} {"train_loss": -21.320789337158203, "global_step": 78407, "epoch": 944} {"train_loss": -21.3823184967041, "global_step": 78408, "epoch": 944} {"train_loss": -20.577316284179688, "global_step": 78409, "epoch": 944} {"train_loss": -21.330644607543945, "global_step": 78410, "epoch": 944} {"train_loss": -21.137048721313477, "global_step": 78411, "epoch": 944} {"train_loss": -21.240493774414062, "global_step": 78412, "epoch": 944} {"train_loss": -21.386566162109375, "global_step": 78413, "epoch": 944} {"train_loss": -21.215238571166992, "global_step": 78414, "epoch": 944} {"train_loss": -20.587373733520508, "global_step": 78415, "epoch": 944} {"train_loss": -20.906837463378906, "global_step": 78416, "epoch": 944} {"train_loss": -21.363767623901367, "global_step": 78417, "epoch": 944} {"train_loss": -20.772348403930664, "global_step": 78418, "epoch": 944} {"train_loss": -21.326374053955078, "global_step": 78419, "epoch": 944} {"train_loss": -21.18094825744629, "global_step": 78420, "epoch": 944} {"train_loss": -21.14592170715332, "global_step": 78421, "epoch": 944} {"train_loss": -21.374605178833008, "global_step": 78422, "epoch": 944} {"train_loss": -21.345205307006836, "global_step": 78423, "epoch": 944} {"train_loss": -21.216060638427734, "global_step": 78424, "epoch": 944} {"train_loss": -21.024534225463867, "global_step": 78425, "epoch": 944} {"train_loss": -21.24192237854004, "global_step": 78426, "epoch": 944} {"train_loss": -21.335660934448242, "global_step": 78427, "epoch": 944} {"train_loss": -21.178319931030273, "global_step": 78428, "epoch": 944} {"train_loss": -20.939321517944336, "global_step": 78429, "epoch": 944} {"train_loss": -21.09286117553711, "global_step": 78430, "epoch": 944} {"train_loss": -20.6649112701416, "global_step": 78431, "epoch": 944} {"train_loss": -20.826065063476562, "global_step": 78432, "epoch": 944} {"train_loss": -20.995710372924805, "global_step": 78433, "epoch": 944} {"train_loss": -21.032833788768354, "global_step": 78434, "epoch": 944, "val_loss": 6059304.0} {"train_loss": -20.525863647460938, "global_step": 78435, "epoch": 945} {"train_loss": -20.462583541870117, "global_step": 78436, "epoch": 945} {"train_loss": -20.748172760009766, "global_step": 78437, "epoch": 945} {"train_loss": -20.115659713745117, "global_step": 78438, "epoch": 945} {"train_loss": -20.994182586669922, "global_step": 78439, "epoch": 945} {"train_loss": -20.543701171875, "global_step": 78440, "epoch": 945} {"train_loss": -20.724149703979492, "global_step": 78441, "epoch": 945} {"train_loss": -20.916147232055664, "global_step": 78442, "epoch": 945} {"train_loss": -20.727874755859375, "global_step": 78443, "epoch": 945} {"train_loss": -20.600482940673828, "global_step": 78444, "epoch": 945} {"train_loss": -20.52772331237793, "global_step": 78445, "epoch": 945} {"train_loss": -21.194326400756836, "global_step": 78446, "epoch": 945} {"train_loss": -21.344825744628906, "global_step": 78447, "epoch": 945} {"train_loss": -21.109643936157227, "global_step": 78448, "epoch": 945} {"train_loss": -21.140792846679688, "global_step": 78449, "epoch": 945} {"train_loss": -20.979583740234375, "global_step": 78450, "epoch": 945} {"train_loss": -21.042844772338867, "global_step": 78451, "epoch": 945} {"train_loss": -21.052852630615234, "global_step": 78452, "epoch": 945} {"train_loss": -20.936399459838867, "global_step": 78453, "epoch": 945} {"train_loss": -21.426794052124023, "global_step": 78454, "epoch": 945} {"train_loss": -21.048152923583984, "global_step": 78455, "epoch": 945} {"train_loss": -21.000463485717773, "global_step": 78456, "epoch": 945} {"train_loss": -21.257186889648438, "global_step": 78457, "epoch": 945} {"train_loss": -21.211538314819336, "global_step": 78458, "epoch": 945} {"train_loss": -20.933568954467773, "global_step": 78459, "epoch": 945} {"train_loss": -20.644887924194336, "global_step": 78460, "epoch": 945} {"train_loss": -21.027847290039062, "global_step": 78461, "epoch": 945} {"train_loss": -21.16531753540039, "global_step": 78462, "epoch": 945} {"train_loss": -21.09470558166504, "global_step": 78463, "epoch": 945} {"train_loss": -21.086172103881836, "global_step": 78464, "epoch": 945} {"train_loss": -21.07765769958496, "global_step": 78465, "epoch": 945} {"train_loss": -20.714799880981445, "global_step": 78466, "epoch": 945} {"train_loss": -20.682565689086914, "global_step": 78467, "epoch": 945} {"train_loss": -21.26043128967285, "global_step": 78468, "epoch": 945} {"train_loss": -21.114669799804688, "global_step": 78469, "epoch": 945} {"train_loss": -21.30535316467285, "global_step": 78470, "epoch": 945} {"train_loss": -21.114606857299805, "global_step": 78471, "epoch": 945} {"train_loss": -20.816526412963867, "global_step": 78472, "epoch": 945} {"train_loss": -20.951435089111328, "global_step": 78473, "epoch": 945} {"train_loss": -20.800994873046875, "global_step": 78474, "epoch": 945} {"train_loss": -21.111936569213867, "global_step": 78475, "epoch": 945} {"train_loss": -20.967559814453125, "global_step": 78476, "epoch": 945} {"train_loss": -21.20712661743164, "global_step": 78477, "epoch": 945} {"train_loss": -21.08429527282715, "global_step": 78478, "epoch": 945} {"train_loss": -21.330366134643555, "global_step": 78479, "epoch": 945} {"train_loss": -21.3062686920166, "global_step": 78480, "epoch": 945} {"train_loss": -21.125473022460938, "global_step": 78481, "epoch": 945} {"train_loss": -21.371524810791016, "global_step": 78482, "epoch": 945} {"train_loss": -21.294464111328125, "global_step": 78483, "epoch": 945} {"train_loss": -21.36870574951172, "global_step": 78484, "epoch": 945} {"train_loss": -21.032140731811523, "global_step": 78485, "epoch": 945} {"train_loss": -21.543197631835938, "global_step": 78486, "epoch": 945} {"train_loss": -21.413938522338867, "global_step": 78487, "epoch": 945} {"train_loss": -21.43765640258789, "global_step": 78488, "epoch": 945} {"train_loss": -20.907514572143555, "global_step": 78489, "epoch": 945} {"train_loss": -21.1119441986084, "global_step": 78490, "epoch": 945} {"train_loss": -20.628835678100586, "global_step": 78491, "epoch": 945} {"train_loss": -21.152786254882812, "global_step": 78492, "epoch": 945} {"train_loss": -21.06784439086914, "global_step": 78493, "epoch": 945} {"train_loss": -21.125783920288086, "global_step": 78494, "epoch": 945} {"train_loss": -20.711700439453125, "global_step": 78495, "epoch": 945} {"train_loss": -20.89804458618164, "global_step": 78496, "epoch": 945} {"train_loss": -21.128646850585938, "global_step": 78497, "epoch": 945} {"train_loss": -21.262495040893555, "global_step": 78498, "epoch": 945} {"train_loss": -21.245582580566406, "global_step": 78499, "epoch": 945} {"train_loss": -21.430984497070312, "global_step": 78500, "epoch": 945} {"train_loss": -20.965147018432617, "global_step": 78501, "epoch": 945} {"train_loss": -21.056995391845703, "global_step": 78502, "epoch": 945} {"train_loss": -21.231916427612305, "global_step": 78503, "epoch": 945} {"train_loss": -21.268754959106445, "global_step": 78504, "epoch": 945} {"train_loss": -20.85087013244629, "global_step": 78505, "epoch": 945} {"train_loss": -21.113601684570312, "global_step": 78506, "epoch": 945} {"train_loss": -21.092931747436523, "global_step": 78507, "epoch": 945} {"train_loss": -21.35700035095215, "global_step": 78508, "epoch": 945} {"train_loss": -21.38065528869629, "global_step": 78509, "epoch": 945} {"train_loss": -20.937231063842773, "global_step": 78510, "epoch": 945} {"train_loss": -21.492090225219727, "global_step": 78511, "epoch": 945} {"train_loss": -20.913557052612305, "global_step": 78512, "epoch": 945} {"train_loss": -21.15818977355957, "global_step": 78513, "epoch": 945} {"train_loss": -21.01018524169922, "global_step": 78514, "epoch": 945} {"train_loss": -21.443246841430664, "global_step": 78515, "epoch": 945} {"train_loss": -20.966575622558594, "global_step": 78516, "epoch": 945} {"train_loss": -21.035516922732434, "global_step": 78517, "epoch": 945, "val_loss": 6052156.0} {"train_loss": -20.067609786987305, "global_step": 78518, "epoch": 946} {"train_loss": -20.660982131958008, "global_step": 78519, "epoch": 946} {"train_loss": -20.14335060119629, "global_step": 78520, "epoch": 946} {"train_loss": -21.04425048828125, "global_step": 78521, "epoch": 946} {"train_loss": -20.148366928100586, "global_step": 78522, "epoch": 946} {"train_loss": -20.443435668945312, "global_step": 78523, "epoch": 946} {"train_loss": -20.436323165893555, "global_step": 78524, "epoch": 946} {"train_loss": -20.44179344177246, "global_step": 78525, "epoch": 946} {"train_loss": -20.64971160888672, "global_step": 78526, "epoch": 946} {"train_loss": -20.464000701904297, "global_step": 78527, "epoch": 946} {"train_loss": -20.795330047607422, "global_step": 78528, "epoch": 946} {"train_loss": -20.605623245239258, "global_step": 78529, "epoch": 946} {"train_loss": -20.453283309936523, "global_step": 78530, "epoch": 946} {"train_loss": -20.415058135986328, "global_step": 78531, "epoch": 946} {"train_loss": -20.399860382080078, "global_step": 78532, "epoch": 946} {"train_loss": -21.08060646057129, "global_step": 78533, "epoch": 946} {"train_loss": -20.584251403808594, "global_step": 78534, "epoch": 946} {"train_loss": -20.85634422302246, "global_step": 78535, "epoch": 946} {"train_loss": -20.82037353515625, "global_step": 78536, "epoch": 946} {"train_loss": -21.017343521118164, "global_step": 78537, "epoch": 946} {"train_loss": -20.36594009399414, "global_step": 78538, "epoch": 946} {"train_loss": -20.908477783203125, "global_step": 78539, "epoch": 946} {"train_loss": -21.004711151123047, "global_step": 78540, "epoch": 946} {"train_loss": -20.760242462158203, "global_step": 78541, "epoch": 946} {"train_loss": -21.098974227905273, "global_step": 78542, "epoch": 946} {"train_loss": -20.77044105529785, "global_step": 78543, "epoch": 946} {"train_loss": -20.885419845581055, "global_step": 78544, "epoch": 946} {"train_loss": -20.697101593017578, "global_step": 78545, "epoch": 946} {"train_loss": -20.314123153686523, "global_step": 78546, "epoch": 946} {"train_loss": -20.640445709228516, "global_step": 78547, "epoch": 946} {"train_loss": -21.077091217041016, "global_step": 78548, "epoch": 946} {"train_loss": -21.21622657775879, "global_step": 78549, "epoch": 946} {"train_loss": -21.156064987182617, "global_step": 78550, "epoch": 946} {"train_loss": -20.9372615814209, "global_step": 78551, "epoch": 946} {"train_loss": -21.132186889648438, "global_step": 78552, "epoch": 946} {"train_loss": -20.99376106262207, "global_step": 78553, "epoch": 946} {"train_loss": -20.966711044311523, "global_step": 78554, "epoch": 946} {"train_loss": -21.203460693359375, "global_step": 78555, "epoch": 946} {"train_loss": -21.186559677124023, "global_step": 78556, "epoch": 946} {"train_loss": -21.079248428344727, "global_step": 78557, "epoch": 946} {"train_loss": -20.80976676940918, "global_step": 78558, "epoch": 946} {"train_loss": -20.896526336669922, "global_step": 78559, "epoch": 946} {"train_loss": -21.03853416442871, "global_step": 78560, "epoch": 946} {"train_loss": -21.182966232299805, "global_step": 78561, "epoch": 946} {"train_loss": -21.154048919677734, "global_step": 78562, "epoch": 946} {"train_loss": -21.133188247680664, "global_step": 78563, "epoch": 946} {"train_loss": -20.91214370727539, "global_step": 78564, "epoch": 946} {"train_loss": -20.95391273498535, "global_step": 78565, "epoch": 946} {"train_loss": -21.541004180908203, "global_step": 78566, "epoch": 946} {"train_loss": -21.09354591369629, "global_step": 78567, "epoch": 946} {"train_loss": -21.345102310180664, "global_step": 78568, "epoch": 946} {"train_loss": -21.10440444946289, "global_step": 78569, "epoch": 946} {"train_loss": -20.6911678314209, "global_step": 78570, "epoch": 946} {"train_loss": -20.888559341430664, "global_step": 78571, "epoch": 946} {"train_loss": -21.321279525756836, "global_step": 78572, "epoch": 946} {"train_loss": -21.408950805664062, "global_step": 78573, "epoch": 946} {"train_loss": -21.154821395874023, "global_step": 78574, "epoch": 946} {"train_loss": -21.474342346191406, "global_step": 78575, "epoch": 946} {"train_loss": -21.14411735534668, "global_step": 78576, "epoch": 946} {"train_loss": -21.199466705322266, "global_step": 78577, "epoch": 946} {"train_loss": -21.628870010375977, "global_step": 78578, "epoch": 946} {"train_loss": -21.05631446838379, "global_step": 78579, "epoch": 946} {"train_loss": -21.156538009643555, "global_step": 78580, "epoch": 946} {"train_loss": -21.08106803894043, "global_step": 78581, "epoch": 946} {"train_loss": -21.190845489501953, "global_step": 78582, "epoch": 946} {"train_loss": -20.850378036499023, "global_step": 78583, "epoch": 946} {"train_loss": -21.117185592651367, "global_step": 78584, "epoch": 946} {"train_loss": -21.265581130981445, "global_step": 78585, "epoch": 946} {"train_loss": -20.68058204650879, "global_step": 78586, "epoch": 946} {"train_loss": -21.199262619018555, "global_step": 78587, "epoch": 946} {"train_loss": -21.366018295288086, "global_step": 78588, "epoch": 946} {"train_loss": -20.77573585510254, "global_step": 78589, "epoch": 946} {"train_loss": -21.329864501953125, "global_step": 78590, "epoch": 946} {"train_loss": -21.153690338134766, "global_step": 78591, "epoch": 946} {"train_loss": -21.147947311401367, "global_step": 78592, "epoch": 946} {"train_loss": -20.915332794189453, "global_step": 78593, "epoch": 946} {"train_loss": -21.219318389892578, "global_step": 78594, "epoch": 946} {"train_loss": -20.99532127380371, "global_step": 78595, "epoch": 946} {"train_loss": -21.220102310180664, "global_step": 78596, "epoch": 946} {"train_loss": -21.254592895507812, "global_step": 78597, "epoch": 946} {"train_loss": -20.894346237182617, "global_step": 78598, "epoch": 946} {"train_loss": -20.7314510345459, "global_step": 78599, "epoch": 946} {"train_loss": -20.945675585643354, "global_step": 78600, "epoch": 946, "val_loss": 6080303.0} {"train_loss": -19.741718292236328, "global_step": 78601, "epoch": 947} {"train_loss": -20.81947898864746, "global_step": 78602, "epoch": 947} {"train_loss": -20.79248046875, "global_step": 78603, "epoch": 947} {"train_loss": -20.625141143798828, "global_step": 78604, "epoch": 947} {"train_loss": -20.75253677368164, "global_step": 78605, "epoch": 947} {"train_loss": -20.736509323120117, "global_step": 78606, "epoch": 947} {"train_loss": -20.928714752197266, "global_step": 78607, "epoch": 947} {"train_loss": -20.804824829101562, "global_step": 78608, "epoch": 947} {"train_loss": -20.611635208129883, "global_step": 78609, "epoch": 947} {"train_loss": -20.968420028686523, "global_step": 78610, "epoch": 947} {"train_loss": -20.847675323486328, "global_step": 78611, "epoch": 947} {"train_loss": -20.501245498657227, "global_step": 78612, "epoch": 947} {"train_loss": -21.112844467163086, "global_step": 78613, "epoch": 947} {"train_loss": -20.90336036682129, "global_step": 78614, "epoch": 947} {"train_loss": -21.085683822631836, "global_step": 78615, "epoch": 947} {"train_loss": -20.556318283081055, "global_step": 78616, "epoch": 947} {"train_loss": -20.594064712524414, "global_step": 78617, "epoch": 947} {"train_loss": -20.856582641601562, "global_step": 78618, "epoch": 947} {"train_loss": -20.99359893798828, "global_step": 78619, "epoch": 947} {"train_loss": -20.807907104492188, "global_step": 78620, "epoch": 947} {"train_loss": -21.191207885742188, "global_step": 78621, "epoch": 947} {"train_loss": -20.560354232788086, "global_step": 78622, "epoch": 947} {"train_loss": -21.020404815673828, "global_step": 78623, "epoch": 947} {"train_loss": -20.923158645629883, "global_step": 78624, "epoch": 947} {"train_loss": -21.05991554260254, "global_step": 78625, "epoch": 947} {"train_loss": -21.255847930908203, "global_step": 78626, "epoch": 947} {"train_loss": -21.3287353515625, "global_step": 78627, "epoch": 947} {"train_loss": -20.93868064880371, "global_step": 78628, "epoch": 947} {"train_loss": -21.213109970092773, "global_step": 78629, "epoch": 947} {"train_loss": -20.915639877319336, "global_step": 78630, "epoch": 947} {"train_loss": -21.336387634277344, "global_step": 78631, "epoch": 947} {"train_loss": -21.419198989868164, "global_step": 78632, "epoch": 947} {"train_loss": -21.06386375427246, "global_step": 78633, "epoch": 947} {"train_loss": -21.050369262695312, "global_step": 78634, "epoch": 947} {"train_loss": -20.865049362182617, "global_step": 78635, "epoch": 947} {"train_loss": -21.011198043823242, "global_step": 78636, "epoch": 947} {"train_loss": -21.07846450805664, "global_step": 78637, "epoch": 947} {"train_loss": -21.286062240600586, "global_step": 78638, "epoch": 947} {"train_loss": -21.15851402282715, "global_step": 78639, "epoch": 947} {"train_loss": -21.111209869384766, "global_step": 78640, "epoch": 947} {"train_loss": -21.113994598388672, "global_step": 78641, "epoch": 947} {"train_loss": -21.2440185546875, "global_step": 78642, "epoch": 947} {"train_loss": -21.073545455932617, "global_step": 78643, "epoch": 947} {"train_loss": -20.789316177368164, "global_step": 78644, "epoch": 947} {"train_loss": -20.91559410095215, "global_step": 78645, "epoch": 947} {"train_loss": -21.198749542236328, "global_step": 78646, "epoch": 947} {"train_loss": -21.168041229248047, "global_step": 78647, "epoch": 947} {"train_loss": -21.23174476623535, "global_step": 78648, "epoch": 947} {"train_loss": -21.324493408203125, "global_step": 78649, "epoch": 947} {"train_loss": -21.10418128967285, "global_step": 78650, "epoch": 947} {"train_loss": -20.940977096557617, "global_step": 78651, "epoch": 947} {"train_loss": -21.360361099243164, "global_step": 78652, "epoch": 947} {"train_loss": -21.00874137878418, "global_step": 78653, "epoch": 947} {"train_loss": -21.220489501953125, "global_step": 78654, "epoch": 947} {"train_loss": -21.614166259765625, "global_step": 78655, "epoch": 947} {"train_loss": -21.011192321777344, "global_step": 78656, "epoch": 947} {"train_loss": -21.19841766357422, "global_step": 78657, "epoch": 947} {"train_loss": -21.031482696533203, "global_step": 78658, "epoch": 947} {"train_loss": -21.254575729370117, "global_step": 78659, "epoch": 947} {"train_loss": -21.503477096557617, "global_step": 78660, "epoch": 947} {"train_loss": -21.326873779296875, "global_step": 78661, "epoch": 947} {"train_loss": -21.271286010742188, "global_step": 78662, "epoch": 947} {"train_loss": -20.9920711517334, "global_step": 78663, "epoch": 947} {"train_loss": -20.992393493652344, "global_step": 78664, "epoch": 947} {"train_loss": -21.181089401245117, "global_step": 78665, "epoch": 947} {"train_loss": -21.142017364501953, "global_step": 78666, "epoch": 947} {"train_loss": -21.1191349029541, "global_step": 78667, "epoch": 947} {"train_loss": -20.92317008972168, "global_step": 78668, "epoch": 947} {"train_loss": -21.18946075439453, "global_step": 78669, "epoch": 947} {"train_loss": -21.437101364135742, "global_step": 78670, "epoch": 947} {"train_loss": -21.36410140991211, "global_step": 78671, "epoch": 947} {"train_loss": -21.096548080444336, "global_step": 78672, "epoch": 947} {"train_loss": -21.143125534057617, "global_step": 78673, "epoch": 947} {"train_loss": -21.166486740112305, "global_step": 78674, "epoch": 947} {"train_loss": -21.17294692993164, "global_step": 78675, "epoch": 947} {"train_loss": -21.152189254760742, "global_step": 78676, "epoch": 947} {"train_loss": -21.018606185913086, "global_step": 78677, "epoch": 947} {"train_loss": -21.056293487548828, "global_step": 78678, "epoch": 947} {"train_loss": -20.78424072265625, "global_step": 78679, "epoch": 947} {"train_loss": -21.743741989135742, "global_step": 78680, "epoch": 947} {"train_loss": -21.11859703063965, "global_step": 78681, "epoch": 947} {"train_loss": -21.37361717224121, "global_step": 78682, "epoch": 947} {"train_loss": -21.054256278348255, "global_step": 78683, "epoch": 947, "val_loss": 6084100.5} {"train_loss": -20.771106719970703, "global_step": 78684, "epoch": 948} {"train_loss": -21.0251522064209, "global_step": 78685, "epoch": 948} {"train_loss": -20.97513198852539, "global_step": 78686, "epoch": 948} {"train_loss": -20.593351364135742, "global_step": 78687, "epoch": 948} {"train_loss": -21.112611770629883, "global_step": 78688, "epoch": 948} {"train_loss": -20.782907485961914, "global_step": 78689, "epoch": 948} {"train_loss": -20.806901931762695, "global_step": 78690, "epoch": 948} {"train_loss": -21.361242294311523, "global_step": 78691, "epoch": 948} {"train_loss": -20.979557037353516, "global_step": 78692, "epoch": 948} {"train_loss": -21.1837215423584, "global_step": 78693, "epoch": 948} {"train_loss": -21.050588607788086, "global_step": 78694, "epoch": 948} {"train_loss": -20.928537368774414, "global_step": 78695, "epoch": 948} {"train_loss": -21.29152488708496, "global_step": 78696, "epoch": 948} {"train_loss": -21.2469539642334, "global_step": 78697, "epoch": 948} {"train_loss": -21.044431686401367, "global_step": 78698, "epoch": 948} {"train_loss": -21.248937606811523, "global_step": 78699, "epoch": 948} {"train_loss": -21.024795532226562, "global_step": 78700, "epoch": 948} {"train_loss": -20.989925384521484, "global_step": 78701, "epoch": 948} {"train_loss": -20.78075408935547, "global_step": 78702, "epoch": 948} {"train_loss": -21.669605255126953, "global_step": 78703, "epoch": 948} {"train_loss": -21.44541358947754, "global_step": 78704, "epoch": 948} {"train_loss": -20.944950103759766, "global_step": 78705, "epoch": 948} {"train_loss": -21.25686264038086, "global_step": 78706, "epoch": 948} {"train_loss": -20.74173927307129, "global_step": 78707, "epoch": 948} {"train_loss": -21.300031661987305, "global_step": 78708, "epoch": 948} {"train_loss": -21.123167037963867, "global_step": 78709, "epoch": 948} {"train_loss": -21.41261863708496, "global_step": 78710, "epoch": 948} {"train_loss": -21.128097534179688, "global_step": 78711, "epoch": 948} {"train_loss": -21.180368423461914, "global_step": 78712, "epoch": 948} {"train_loss": -21.36556053161621, "global_step": 78713, "epoch": 948} {"train_loss": -21.36525535583496, "global_step": 78714, "epoch": 948} {"train_loss": -21.335840225219727, "global_step": 78715, "epoch": 948} {"train_loss": -21.500141143798828, "global_step": 78716, "epoch": 948} {"train_loss": -21.043949127197266, "global_step": 78717, "epoch": 948} {"train_loss": -21.389066696166992, "global_step": 78718, "epoch": 948} {"train_loss": -21.040302276611328, "global_step": 78719, "epoch": 948} {"train_loss": -21.069360733032227, "global_step": 78720, "epoch": 948} {"train_loss": -21.10232925415039, "global_step": 78721, "epoch": 948} {"train_loss": -21.020313262939453, "global_step": 78722, "epoch": 948} {"train_loss": -21.415395736694336, "global_step": 78723, "epoch": 948} {"train_loss": -21.283109664916992, "global_step": 78724, "epoch": 948} {"train_loss": -21.410974502563477, "global_step": 78725, "epoch": 948} {"train_loss": -21.28025245666504, "global_step": 78726, "epoch": 948} {"train_loss": -21.302555084228516, "global_step": 78727, "epoch": 948} {"train_loss": -21.109777450561523, "global_step": 78728, "epoch": 948} {"train_loss": -21.321096420288086, "global_step": 78729, "epoch": 948} {"train_loss": -21.262372970581055, "global_step": 78730, "epoch": 948} {"train_loss": -20.85210609436035, "global_step": 78731, "epoch": 948} {"train_loss": -21.002267837524414, "global_step": 78732, "epoch": 948} {"train_loss": -21.18168830871582, "global_step": 78733, "epoch": 948} {"train_loss": -21.532194137573242, "global_step": 78734, "epoch": 948} {"train_loss": -21.15389060974121, "global_step": 78735, "epoch": 948} {"train_loss": -21.366796493530273, "global_step": 78736, "epoch": 948} {"train_loss": -21.3404483795166, "global_step": 78737, "epoch": 948} {"train_loss": -21.18218231201172, "global_step": 78738, "epoch": 948} {"train_loss": -21.3772029876709, "global_step": 78739, "epoch": 948} {"train_loss": -20.959157943725586, "global_step": 78740, "epoch": 948} {"train_loss": -21.119516372680664, "global_step": 78741, "epoch": 948} {"train_loss": -21.441715240478516, "global_step": 78742, "epoch": 948} {"train_loss": -21.281585693359375, "global_step": 78743, "epoch": 948} {"train_loss": -20.890478134155273, "global_step": 78744, "epoch": 948} {"train_loss": -21.592538833618164, "global_step": 78745, "epoch": 948} {"train_loss": -21.44428062438965, "global_step": 78746, "epoch": 948} {"train_loss": -21.367942810058594, "global_step": 78747, "epoch": 948} {"train_loss": -21.242841720581055, "global_step": 78748, "epoch": 948} {"train_loss": -21.288602828979492, "global_step": 78749, "epoch": 948} {"train_loss": -21.393129348754883, "global_step": 78750, "epoch": 948} {"train_loss": -20.89060401916504, "global_step": 78751, "epoch": 948} {"train_loss": -21.031667709350586, "global_step": 78752, "epoch": 948} {"train_loss": -21.210906982421875, "global_step": 78753, "epoch": 948} {"train_loss": -20.847780227661133, "global_step": 78754, "epoch": 948} {"train_loss": -21.203289031982422, "global_step": 78755, "epoch": 948} {"train_loss": -21.434804916381836, "global_step": 78756, "epoch": 948} {"train_loss": -21.22807502746582, "global_step": 78757, "epoch": 948} {"train_loss": -20.939294815063477, "global_step": 78758, "epoch": 948} {"train_loss": -21.049055099487305, "global_step": 78759, "epoch": 948} {"train_loss": -21.237167358398438, "global_step": 78760, "epoch": 948} {"train_loss": -20.853971481323242, "global_step": 78761, "epoch": 948} {"train_loss": -21.18523597717285, "global_step": 78762, "epoch": 948} {"train_loss": -21.154518127441406, "global_step": 78763, "epoch": 948} {"train_loss": -21.236989974975586, "global_step": 78764, "epoch": 948} {"train_loss": -21.20134735107422, "global_step": 78765, "epoch": 948} {"train_loss": -21.176711944212396, "global_step": 78766, "epoch": 948, "val_loss": 6045439.5} {"train_loss": -21.220029830932617, "global_step": 78767, "epoch": 949} {"train_loss": -20.833965301513672, "global_step": 78768, "epoch": 949} {"train_loss": -21.148319244384766, "global_step": 78769, "epoch": 949} {"train_loss": -20.44434356689453, "global_step": 78770, "epoch": 949} {"train_loss": -21.19205093383789, "global_step": 78771, "epoch": 949} {"train_loss": -20.859914779663086, "global_step": 78772, "epoch": 949} {"train_loss": -20.9769344329834, "global_step": 78773, "epoch": 949} {"train_loss": -21.324743270874023, "global_step": 78774, "epoch": 949} {"train_loss": -20.87465476989746, "global_step": 78775, "epoch": 949} {"train_loss": -20.928375244140625, "global_step": 78776, "epoch": 949} {"train_loss": -21.25018882751465, "global_step": 78777, "epoch": 949} {"train_loss": -21.1744441986084, "global_step": 78778, "epoch": 949} {"train_loss": -21.166664123535156, "global_step": 78779, "epoch": 949} {"train_loss": -20.887561798095703, "global_step": 78780, "epoch": 949} {"train_loss": -21.162424087524414, "global_step": 78781, "epoch": 949} {"train_loss": -20.908954620361328, "global_step": 78782, "epoch": 949} {"train_loss": -20.870649337768555, "global_step": 78783, "epoch": 949} {"train_loss": -21.3207950592041, "global_step": 78784, "epoch": 949} {"train_loss": -20.954618453979492, "global_step": 78785, "epoch": 949} {"train_loss": -21.14301872253418, "global_step": 78786, "epoch": 949} {"train_loss": -20.853849411010742, "global_step": 78787, "epoch": 949} {"train_loss": -21.106840133666992, "global_step": 78788, "epoch": 949} {"train_loss": -21.277748107910156, "global_step": 78789, "epoch": 949} {"train_loss": -21.117218017578125, "global_step": 78790, "epoch": 949} {"train_loss": -20.988821029663086, "global_step": 78791, "epoch": 949} {"train_loss": -20.775400161743164, "global_step": 78792, "epoch": 949} {"train_loss": -21.133085250854492, "global_step": 78793, "epoch": 949} {"train_loss": -21.378807067871094, "global_step": 78794, "epoch": 949} {"train_loss": -21.271636962890625, "global_step": 78795, "epoch": 949} {"train_loss": -21.107715606689453, "global_step": 78796, "epoch": 949} {"train_loss": -20.82511329650879, "global_step": 78797, "epoch": 949} {"train_loss": -21.23939323425293, "global_step": 78798, "epoch": 949} {"train_loss": -21.097936630249023, "global_step": 78799, "epoch": 949} {"train_loss": -21.10855484008789, "global_step": 78800, "epoch": 949} {"train_loss": -21.528669357299805, "global_step": 78801, "epoch": 949} {"train_loss": -21.5048828125, "global_step": 78802, "epoch": 949} {"train_loss": -21.361984252929688, "global_step": 78803, "epoch": 949} {"train_loss": -21.259679794311523, "global_step": 78804, "epoch": 949} {"train_loss": -21.27534294128418, "global_step": 78805, "epoch": 949} {"train_loss": -21.251893997192383, "global_step": 78806, "epoch": 949} {"train_loss": -21.199560165405273, "global_step": 78807, "epoch": 949} {"train_loss": -21.106111526489258, "global_step": 78808, "epoch": 949} {"train_loss": -21.066497802734375, "global_step": 78809, "epoch": 949} {"train_loss": -20.93146514892578, "global_step": 78810, "epoch": 949} {"train_loss": -20.90041732788086, "global_step": 78811, "epoch": 949} {"train_loss": -21.073471069335938, "global_step": 78812, "epoch": 949} {"train_loss": -21.23482322692871, "global_step": 78813, "epoch": 949} {"train_loss": -21.07623863220215, "global_step": 78814, "epoch": 949} {"train_loss": -21.163467407226562, "global_step": 78815, "epoch": 949} {"train_loss": -21.381376266479492, "global_step": 78816, "epoch": 949} {"train_loss": -21.05852699279785, "global_step": 78817, "epoch": 949} {"train_loss": -21.2235050201416, "global_step": 78818, "epoch": 949} {"train_loss": -20.74946403503418, "global_step": 78819, "epoch": 949} {"train_loss": -21.177186965942383, "global_step": 78820, "epoch": 949} {"train_loss": -21.447769165039062, "global_step": 78821, "epoch": 949} {"train_loss": -20.958698272705078, "global_step": 78822, "epoch": 949} {"train_loss": -21.6975154876709, "global_step": 78823, "epoch": 949} {"train_loss": -20.982458114624023, "global_step": 78824, "epoch": 949} {"train_loss": -21.17138671875, "global_step": 78825, "epoch": 949} {"train_loss": -21.576284408569336, "global_step": 78826, "epoch": 949} {"train_loss": -20.666654586791992, "global_step": 78827, "epoch": 949} {"train_loss": -21.304851531982422, "global_step": 78828, "epoch": 949} {"train_loss": -21.278873443603516, "global_step": 78829, "epoch": 949} {"train_loss": -21.646902084350586, "global_step": 78830, "epoch": 949} {"train_loss": -21.351816177368164, "global_step": 78831, "epoch": 949} {"train_loss": -20.668058395385742, "global_step": 78832, "epoch": 949} {"train_loss": -21.298736572265625, "global_step": 78833, "epoch": 949} {"train_loss": -21.259931564331055, "global_step": 78834, "epoch": 949} {"train_loss": -21.372173309326172, "global_step": 78835, "epoch": 949} {"train_loss": -21.089773178100586, "global_step": 78836, "epoch": 949} {"train_loss": -21.23783302307129, "global_step": 78837, "epoch": 949} {"train_loss": -21.13945960998535, "global_step": 78838, "epoch": 949} {"train_loss": -21.37244987487793, "global_step": 78839, "epoch": 949} {"train_loss": -21.62796974182129, "global_step": 78840, "epoch": 949} {"train_loss": -21.135913848876953, "global_step": 78841, "epoch": 949} {"train_loss": -21.091093063354492, "global_step": 78842, "epoch": 949} {"train_loss": -21.1877384185791, "global_step": 78843, "epoch": 949} {"train_loss": -21.4737548828125, "global_step": 78844, "epoch": 949} {"train_loss": -21.314579010009766, "global_step": 78845, "epoch": 949} {"train_loss": -21.547531127929688, "global_step": 78846, "epoch": 949} {"train_loss": -21.090042114257812, "global_step": 78847, "epoch": 949} {"train_loss": -21.623573303222656, "global_step": 78848, "epoch": 949} {"train_loss": -21.14010744209749, "global_step": 78849, "epoch": 949, "val_loss": 6101102.5} {"train_loss": -20.934499740600586, "global_step": 78850, "epoch": 950} {"train_loss": -20.669403076171875, "global_step": 78851, "epoch": 950} {"train_loss": -20.72086524963379, "global_step": 78852, "epoch": 950} {"train_loss": -21.12912368774414, "global_step": 78853, "epoch": 950} {"train_loss": -20.442075729370117, "global_step": 78854, "epoch": 950} {"train_loss": -20.800445556640625, "global_step": 78855, "epoch": 950} {"train_loss": -21.093358993530273, "global_step": 78856, "epoch": 950} {"train_loss": -21.209110260009766, "global_step": 78857, "epoch": 950} {"train_loss": -20.585163116455078, "global_step": 78858, "epoch": 950} {"train_loss": -21.06372833251953, "global_step": 78859, "epoch": 950} {"train_loss": -20.961164474487305, "global_step": 78860, "epoch": 950} {"train_loss": -20.816499710083008, "global_step": 78861, "epoch": 950} {"train_loss": -20.822494506835938, "global_step": 78862, "epoch": 950} {"train_loss": -20.978527069091797, "global_step": 78863, "epoch": 950} {"train_loss": -20.873220443725586, "global_step": 78864, "epoch": 950} {"train_loss": -21.23760414123535, "global_step": 78865, "epoch": 950} {"train_loss": -21.02069091796875, "global_step": 78866, "epoch": 950} {"train_loss": -20.924245834350586, "global_step": 78867, "epoch": 950} {"train_loss": -21.123172760009766, "global_step": 78868, "epoch": 950} {"train_loss": -21.330686569213867, "global_step": 78869, "epoch": 950} {"train_loss": -21.11678123474121, "global_step": 78870, "epoch": 950} {"train_loss": -20.9077205657959, "global_step": 78871, "epoch": 950} {"train_loss": -20.87623405456543, "global_step": 78872, "epoch": 950} {"train_loss": -20.9499568939209, "global_step": 78873, "epoch": 950} {"train_loss": -21.168289184570312, "global_step": 78874, "epoch": 950} {"train_loss": -20.882444381713867, "global_step": 78875, "epoch": 950} {"train_loss": -21.166091918945312, "global_step": 78876, "epoch": 950} {"train_loss": -21.05489158630371, "global_step": 78877, "epoch": 950} {"train_loss": -21.12113380432129, "global_step": 78878, "epoch": 950} {"train_loss": -21.288434982299805, "global_step": 78879, "epoch": 950} {"train_loss": -21.666120529174805, "global_step": 78880, "epoch": 950} {"train_loss": -20.94197654724121, "global_step": 78881, "epoch": 950} {"train_loss": -21.202838897705078, "global_step": 78882, "epoch": 950} {"train_loss": -21.22013282775879, "global_step": 78883, "epoch": 950} {"train_loss": -21.38861656188965, "global_step": 78884, "epoch": 950} {"train_loss": -21.24394989013672, "global_step": 78885, "epoch": 950} {"train_loss": -21.37378692626953, "global_step": 78886, "epoch": 950} {"train_loss": -21.645841598510742, "global_step": 78887, "epoch": 950} {"train_loss": -21.28396987915039, "global_step": 78888, "epoch": 950} {"train_loss": -21.287073135375977, "global_step": 78889, "epoch": 950} {"train_loss": -21.387161254882812, "global_step": 78890, "epoch": 950} {"train_loss": -21.051403045654297, "global_step": 78891, "epoch": 950} {"train_loss": -21.50456428527832, "global_step": 78892, "epoch": 950} {"train_loss": -21.02712059020996, "global_step": 78893, "epoch": 950} {"train_loss": -20.730375289916992, "global_step": 78894, "epoch": 950} {"train_loss": -20.788251876831055, "global_step": 78895, "epoch": 950} {"train_loss": -20.83791160583496, "global_step": 78896, "epoch": 950} {"train_loss": -21.138154983520508, "global_step": 78897, "epoch": 950} {"train_loss": -21.395044326782227, "global_step": 78898, "epoch": 950} {"train_loss": -21.51704216003418, "global_step": 78899, "epoch": 950} {"train_loss": -20.883304595947266, "global_step": 78900, "epoch": 950} {"train_loss": -21.442251205444336, "global_step": 78901, "epoch": 950} {"train_loss": -20.897207260131836, "global_step": 78902, "epoch": 950} {"train_loss": -21.035898208618164, "global_step": 78903, "epoch": 950} {"train_loss": -21.082849502563477, "global_step": 78904, "epoch": 950} {"train_loss": -21.051929473876953, "global_step": 78905, "epoch": 950} {"train_loss": -21.386531829833984, "global_step": 78906, "epoch": 950} {"train_loss": -20.889392852783203, "global_step": 78907, "epoch": 950} {"train_loss": -21.10601234436035, "global_step": 78908, "epoch": 950} {"train_loss": -21.194982528686523, "global_step": 78909, "epoch": 950} {"train_loss": -20.913047790527344, "global_step": 78910, "epoch": 950} {"train_loss": -21.5106143951416, "global_step": 78911, "epoch": 950} {"train_loss": -21.29422378540039, "global_step": 78912, "epoch": 950} {"train_loss": -21.407730102539062, "global_step": 78913, "epoch": 950} {"train_loss": -21.20755386352539, "global_step": 78914, "epoch": 950} {"train_loss": -21.165660858154297, "global_step": 78915, "epoch": 950} {"train_loss": -21.17597770690918, "global_step": 78916, "epoch": 950} {"train_loss": -21.310277938842773, "global_step": 78917, "epoch": 950} {"train_loss": -21.420690536499023, "global_step": 78918, "epoch": 950} {"train_loss": -21.366744995117188, "global_step": 78919, "epoch": 950} {"train_loss": -21.3542537689209, "global_step": 78920, "epoch": 950} {"train_loss": -21.492637634277344, "global_step": 78921, "epoch": 950} {"train_loss": -21.076223373413086, "global_step": 78922, "epoch": 950} {"train_loss": -21.162288665771484, "global_step": 78923, "epoch": 950} {"train_loss": -21.347082138061523, "global_step": 78924, "epoch": 950} {"train_loss": -21.397573471069336, "global_step": 78925, "epoch": 950} {"train_loss": -21.54334831237793, "global_step": 78926, "epoch": 950} {"train_loss": -20.81271743774414, "global_step": 78927, "epoch": 950} {"train_loss": -21.484638214111328, "global_step": 78928, "epoch": 950} {"train_loss": -21.003637313842773, "global_step": 78929, "epoch": 950} {"train_loss": -21.302465438842773, "global_step": 78930, "epoch": 950} {"train_loss": -21.239320755004883, "global_step": 78931, "epoch": 950} {"train_loss": -21.134688136089277, "global_step": 78932, "epoch": 950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6000260.0} {"train_loss": -20.99665641784668, "global_step": 78933, "epoch": 951} {"train_loss": -21.094640731811523, "global_step": 78934, "epoch": 951} {"train_loss": -20.90228271484375, "global_step": 78935, "epoch": 951} {"train_loss": -21.159936904907227, "global_step": 78936, "epoch": 951} {"train_loss": -21.24041175842285, "global_step": 78937, "epoch": 951} {"train_loss": -21.074308395385742, "global_step": 78938, "epoch": 951} {"train_loss": -20.957860946655273, "global_step": 78939, "epoch": 951} {"train_loss": -21.090734481811523, "global_step": 78940, "epoch": 951} {"train_loss": -20.7611141204834, "global_step": 78941, "epoch": 951} {"train_loss": -20.623958587646484, "global_step": 78942, "epoch": 951} {"train_loss": -21.06035614013672, "global_step": 78943, "epoch": 951} {"train_loss": -21.475444793701172, "global_step": 78944, "epoch": 951} {"train_loss": -21.102298736572266, "global_step": 78945, "epoch": 951} {"train_loss": -20.76804542541504, "global_step": 78946, "epoch": 951} {"train_loss": -20.915586471557617, "global_step": 78947, "epoch": 951} {"train_loss": -21.1826229095459, "global_step": 78948, "epoch": 951} {"train_loss": -21.228742599487305, "global_step": 78949, "epoch": 951} {"train_loss": -21.04176139831543, "global_step": 78950, "epoch": 951} {"train_loss": -20.954023361206055, "global_step": 78951, "epoch": 951} {"train_loss": -21.13254737854004, "global_step": 78952, "epoch": 951} {"train_loss": -21.108482360839844, "global_step": 78953, "epoch": 951} {"train_loss": -21.169401168823242, "global_step": 78954, "epoch": 951} {"train_loss": -21.30161476135254, "global_step": 78955, "epoch": 951} {"train_loss": -21.115495681762695, "global_step": 78956, "epoch": 951} {"train_loss": -20.80817985534668, "global_step": 78957, "epoch": 951} {"train_loss": -20.85097312927246, "global_step": 78958, "epoch": 951} {"train_loss": -20.945470809936523, "global_step": 78959, "epoch": 951} {"train_loss": -21.065805435180664, "global_step": 78960, "epoch": 951} {"train_loss": -20.873214721679688, "global_step": 78961, "epoch": 951} {"train_loss": -21.061800003051758, "global_step": 78962, "epoch": 951} {"train_loss": -21.10271644592285, "global_step": 78963, "epoch": 951} {"train_loss": -21.34309196472168, "global_step": 78964, "epoch": 951} {"train_loss": -21.091672897338867, "global_step": 78965, "epoch": 951} {"train_loss": -21.424118041992188, "global_step": 78966, "epoch": 951} {"train_loss": -20.95001792907715, "global_step": 78967, "epoch": 951} {"train_loss": -21.41196060180664, "global_step": 78968, "epoch": 951} {"train_loss": -21.18450927734375, "global_step": 78969, "epoch": 951} {"train_loss": -20.942731857299805, "global_step": 78970, "epoch": 951} {"train_loss": -21.07792854309082, "global_step": 78971, "epoch": 951} {"train_loss": -20.989604949951172, "global_step": 78972, "epoch": 951} {"train_loss": -21.262243270874023, "global_step": 78973, "epoch": 951} {"train_loss": -21.548444747924805, "global_step": 78974, "epoch": 951} {"train_loss": -20.534605026245117, "global_step": 78975, "epoch": 951} {"train_loss": -21.362117767333984, "global_step": 78976, "epoch": 951} {"train_loss": -21.081037521362305, "global_step": 78977, "epoch": 951} {"train_loss": -21.341751098632812, "global_step": 78978, "epoch": 951} {"train_loss": -21.281362533569336, "global_step": 78979, "epoch": 951} {"train_loss": -20.991785049438477, "global_step": 78980, "epoch": 951} {"train_loss": -21.32842445373535, "global_step": 78981, "epoch": 951} {"train_loss": -21.237747192382812, "global_step": 78982, "epoch": 951} {"train_loss": -20.715574264526367, "global_step": 78983, "epoch": 951} {"train_loss": -21.04709243774414, "global_step": 78984, "epoch": 951} {"train_loss": -21.328523635864258, "global_step": 78985, "epoch": 951} {"train_loss": -21.29448890686035, "global_step": 78986, "epoch": 951} {"train_loss": -20.957063674926758, "global_step": 78987, "epoch": 951} {"train_loss": -21.47238540649414, "global_step": 78988, "epoch": 951} {"train_loss": -21.56087875366211, "global_step": 78989, "epoch": 951} {"train_loss": -21.38804054260254, "global_step": 78990, "epoch": 951} {"train_loss": -21.067380905151367, "global_step": 78991, "epoch": 951} {"train_loss": -20.828771591186523, "global_step": 78992, "epoch": 951} {"train_loss": -20.978546142578125, "global_step": 78993, "epoch": 951} {"train_loss": -21.3006534576416, "global_step": 78994, "epoch": 951} {"train_loss": -21.07834815979004, "global_step": 78995, "epoch": 951} {"train_loss": -20.901540756225586, "global_step": 78996, "epoch": 951} {"train_loss": -21.136709213256836, "global_step": 78997, "epoch": 951} {"train_loss": -21.048276901245117, "global_step": 78998, "epoch": 951} {"train_loss": -21.557079315185547, "global_step": 78999, "epoch": 951} {"train_loss": -21.4163818359375, "global_step": 79000, "epoch": 951} {"train_loss": -21.116817474365234, "global_step": 79001, "epoch": 951} {"train_loss": -21.101545333862305, "global_step": 79002, "epoch": 951} {"train_loss": -21.518646240234375, "global_step": 79003, "epoch": 951} {"train_loss": -21.113908767700195, "global_step": 79004, "epoch": 951} {"train_loss": -21.203388214111328, "global_step": 79005, "epoch": 951} {"train_loss": -21.02103042602539, "global_step": 79006, "epoch": 951} {"train_loss": -20.942569732666016, "global_step": 79007, "epoch": 951} {"train_loss": -21.331668853759766, "global_step": 79008, "epoch": 951} {"train_loss": -20.90083885192871, "global_step": 79009, "epoch": 951} {"train_loss": -21.25956153869629, "global_step": 79010, "epoch": 951} {"train_loss": -20.8955135345459, "global_step": 79011, "epoch": 951} {"train_loss": -21.231977462768555, "global_step": 79012, "epoch": 951} {"train_loss": -21.071781158447266, "global_step": 79013, "epoch": 951} {"train_loss": -20.914899826049805, "global_step": 79014, "epoch": 951} {"train_loss": -21.11998686733016, "global_step": 79015, "epoch": 951, "val_loss": 6154303.0} {"train_loss": -21.13858985900879, "global_step": 79016, "epoch": 952} {"train_loss": -20.56764793395996, "global_step": 79017, "epoch": 952} {"train_loss": -20.954130172729492, "global_step": 79018, "epoch": 952} {"train_loss": -21.055679321289062, "global_step": 79019, "epoch": 952} {"train_loss": -21.189664840698242, "global_step": 79020, "epoch": 952} {"train_loss": -20.939477920532227, "global_step": 79021, "epoch": 952} {"train_loss": -20.8748836517334, "global_step": 79022, "epoch": 952} {"train_loss": -20.968122482299805, "global_step": 79023, "epoch": 952} {"train_loss": -20.799570083618164, "global_step": 79024, "epoch": 952} {"train_loss": -20.910696029663086, "global_step": 79025, "epoch": 952} {"train_loss": -21.045019149780273, "global_step": 79026, "epoch": 952} {"train_loss": -20.9340763092041, "global_step": 79027, "epoch": 952} {"train_loss": -21.430418014526367, "global_step": 79028, "epoch": 952} {"train_loss": -21.1386661529541, "global_step": 79029, "epoch": 952} {"train_loss": -21.1005859375, "global_step": 79030, "epoch": 952} {"train_loss": -21.107410430908203, "global_step": 79031, "epoch": 952} {"train_loss": -21.12740707397461, "global_step": 79032, "epoch": 952} {"train_loss": -20.817340850830078, "global_step": 79033, "epoch": 952} {"train_loss": -21.255023956298828, "global_step": 79034, "epoch": 952} {"train_loss": -21.440549850463867, "global_step": 79035, "epoch": 952} {"train_loss": -21.037479400634766, "global_step": 79036, "epoch": 952} {"train_loss": -21.287397384643555, "global_step": 79037, "epoch": 952} {"train_loss": -21.287595748901367, "global_step": 79038, "epoch": 952} {"train_loss": -21.342350006103516, "global_step": 79039, "epoch": 952} {"train_loss": -20.80427360534668, "global_step": 79040, "epoch": 952} {"train_loss": -20.989303588867188, "global_step": 79041, "epoch": 952} {"train_loss": -20.86248779296875, "global_step": 79042, "epoch": 952} {"train_loss": -21.170358657836914, "global_step": 79043, "epoch": 952} {"train_loss": -21.260141372680664, "global_step": 79044, "epoch": 952} {"train_loss": -21.619741439819336, "global_step": 79045, "epoch": 952} {"train_loss": -21.24437141418457, "global_step": 79046, "epoch": 952} {"train_loss": -21.541540145874023, "global_step": 79047, "epoch": 952} {"train_loss": -21.39802360534668, "global_step": 79048, "epoch": 952} {"train_loss": -21.24923324584961, "global_step": 79049, "epoch": 952} {"train_loss": -21.02703285217285, "global_step": 79050, "epoch": 952} {"train_loss": -21.365522384643555, "global_step": 79051, "epoch": 952} {"train_loss": -21.178815841674805, "global_step": 79052, "epoch": 952} {"train_loss": -21.288705825805664, "global_step": 79053, "epoch": 952} {"train_loss": -21.05903434753418, "global_step": 79054, "epoch": 952} {"train_loss": -21.379104614257812, "global_step": 79055, "epoch": 952} {"train_loss": -21.085920333862305, "global_step": 79056, "epoch": 952} {"train_loss": -21.405759811401367, "global_step": 79057, "epoch": 952} {"train_loss": -21.302818298339844, "global_step": 79058, "epoch": 952} {"train_loss": -21.50843620300293, "global_step": 79059, "epoch": 952} {"train_loss": -21.521190643310547, "global_step": 79060, "epoch": 952} {"train_loss": -21.037870407104492, "global_step": 79061, "epoch": 952} {"train_loss": -21.02565574645996, "global_step": 79062, "epoch": 952} {"train_loss": -21.246435165405273, "global_step": 79063, "epoch": 952} {"train_loss": -21.119382858276367, "global_step": 79064, "epoch": 952} {"train_loss": -21.252119064331055, "global_step": 79065, "epoch": 952} {"train_loss": -21.08746337890625, "global_step": 79066, "epoch": 952} {"train_loss": -21.153837203979492, "global_step": 79067, "epoch": 952} {"train_loss": -21.071630477905273, "global_step": 79068, "epoch": 952} {"train_loss": -21.218748092651367, "global_step": 79069, "epoch": 952} {"train_loss": -20.957263946533203, "global_step": 79070, "epoch": 952} {"train_loss": -20.961145401000977, "global_step": 79071, "epoch": 952} {"train_loss": -21.160974502563477, "global_step": 79072, "epoch": 952} {"train_loss": -21.179956436157227, "global_step": 79073, "epoch": 952} {"train_loss": -21.401010513305664, "global_step": 79074, "epoch": 952} {"train_loss": -21.01199722290039, "global_step": 79075, "epoch": 952} {"train_loss": -21.215763092041016, "global_step": 79076, "epoch": 952} {"train_loss": -21.536441802978516, "global_step": 79077, "epoch": 952} {"train_loss": -21.482297897338867, "global_step": 79078, "epoch": 952} {"train_loss": -21.406509399414062, "global_step": 79079, "epoch": 952} {"train_loss": -21.399213790893555, "global_step": 79080, "epoch": 952} {"train_loss": -21.31391716003418, "global_step": 79081, "epoch": 952} {"train_loss": -21.419965744018555, "global_step": 79082, "epoch": 952} {"train_loss": -21.283422470092773, "global_step": 79083, "epoch": 952} {"train_loss": -20.997156143188477, "global_step": 79084, "epoch": 952} {"train_loss": -21.322683334350586, "global_step": 79085, "epoch": 952} {"train_loss": -21.1152400970459, "global_step": 79086, "epoch": 952} {"train_loss": -21.026962280273438, "global_step": 79087, "epoch": 952} {"train_loss": -21.3763484954834, "global_step": 79088, "epoch": 952} {"train_loss": -21.18992042541504, "global_step": 79089, "epoch": 952} {"train_loss": -21.411529541015625, "global_step": 79090, "epoch": 952} {"train_loss": -21.208328247070312, "global_step": 79091, "epoch": 952} {"train_loss": -21.1989688873291, "global_step": 79092, "epoch": 952} {"train_loss": -20.986825942993164, "global_step": 79093, "epoch": 952} {"train_loss": -21.053831100463867, "global_step": 79094, "epoch": 952} {"train_loss": -21.2049560546875, "global_step": 79095, "epoch": 952} {"train_loss": -20.985279083251953, "global_step": 79096, "epoch": 952} {"train_loss": -21.204214096069336, "global_step": 79097, "epoch": 952} {"train_loss": -21.197879630399036, "global_step": 79098, "epoch": 952, "val_loss": 5880858.5} {"train_loss": -20.799978256225586, "global_step": 79099, "epoch": 953} {"train_loss": -20.95097541809082, "global_step": 79100, "epoch": 953} {"train_loss": -20.84084129333496, "global_step": 79101, "epoch": 953} {"train_loss": -21.06731605529785, "global_step": 79102, "epoch": 953} {"train_loss": -21.147092819213867, "global_step": 79103, "epoch": 953} {"train_loss": -21.111249923706055, "global_step": 79104, "epoch": 953} {"train_loss": -21.187667846679688, "global_step": 79105, "epoch": 953} {"train_loss": -21.045303344726562, "global_step": 79106, "epoch": 953} {"train_loss": -21.137813568115234, "global_step": 79107, "epoch": 953} {"train_loss": -21.12428092956543, "global_step": 79108, "epoch": 953} {"train_loss": -21.036109924316406, "global_step": 79109, "epoch": 953} {"train_loss": -21.087589263916016, "global_step": 79110, "epoch": 953} {"train_loss": -21.244949340820312, "global_step": 79111, "epoch": 953} {"train_loss": -21.049396514892578, "global_step": 79112, "epoch": 953} {"train_loss": -20.9339542388916, "global_step": 79113, "epoch": 953} {"train_loss": -20.855459213256836, "global_step": 79114, "epoch": 953} {"train_loss": -20.988693237304688, "global_step": 79115, "epoch": 953} {"train_loss": -21.064489364624023, "global_step": 79116, "epoch": 953} {"train_loss": -21.10764503479004, "global_step": 79117, "epoch": 953} {"train_loss": -20.831745147705078, "global_step": 79118, "epoch": 953} {"train_loss": -21.220062255859375, "global_step": 79119, "epoch": 953} {"train_loss": -21.031583786010742, "global_step": 79120, "epoch": 953} {"train_loss": -20.854528427124023, "global_step": 79121, "epoch": 953} {"train_loss": -20.766502380371094, "global_step": 79122, "epoch": 953} {"train_loss": -21.411100387573242, "global_step": 79123, "epoch": 953} {"train_loss": -21.185874938964844, "global_step": 79124, "epoch": 953} {"train_loss": -21.4632625579834, "global_step": 79125, "epoch": 953} {"train_loss": -21.069446563720703, "global_step": 79126, "epoch": 953} {"train_loss": -20.998546600341797, "global_step": 79127, "epoch": 953} {"train_loss": -21.20987892150879, "global_step": 79128, "epoch": 953} {"train_loss": -20.880905151367188, "global_step": 79129, "epoch": 953} {"train_loss": -21.46335220336914, "global_step": 79130, "epoch": 953} {"train_loss": -20.982967376708984, "global_step": 79131, "epoch": 953} {"train_loss": -21.177122116088867, "global_step": 79132, "epoch": 953} {"train_loss": -21.402145385742188, "global_step": 79133, "epoch": 953} {"train_loss": -21.29086685180664, "global_step": 79134, "epoch": 953} {"train_loss": -21.221332550048828, "global_step": 79135, "epoch": 953} {"train_loss": -21.023160934448242, "global_step": 79136, "epoch": 953} {"train_loss": -21.39092445373535, "global_step": 79137, "epoch": 953} {"train_loss": -21.134489059448242, "global_step": 79138, "epoch": 953} {"train_loss": -21.1337833404541, "global_step": 79139, "epoch": 953} {"train_loss": -20.773725509643555, "global_step": 79140, "epoch": 953} {"train_loss": -20.95658302307129, "global_step": 79141, "epoch": 953} {"train_loss": -21.193544387817383, "global_step": 79142, "epoch": 953} {"train_loss": -21.21116065979004, "global_step": 79143, "epoch": 953} {"train_loss": -21.351560592651367, "global_step": 79144, "epoch": 953} {"train_loss": -21.536575317382812, "global_step": 79145, "epoch": 953} {"train_loss": -21.154111862182617, "global_step": 79146, "epoch": 953} {"train_loss": -21.101022720336914, "global_step": 79147, "epoch": 953} {"train_loss": -20.89961814880371, "global_step": 79148, "epoch": 953} {"train_loss": -21.202930450439453, "global_step": 79149, "epoch": 953} {"train_loss": -21.12593650817871, "global_step": 79150, "epoch": 953} {"train_loss": -21.387924194335938, "global_step": 79151, "epoch": 953} {"train_loss": -21.260086059570312, "global_step": 79152, "epoch": 953} {"train_loss": -21.308683395385742, "global_step": 79153, "epoch": 953} {"train_loss": -21.344953536987305, "global_step": 79154, "epoch": 953} {"train_loss": -21.29817771911621, "global_step": 79155, "epoch": 953} {"train_loss": -21.265714645385742, "global_step": 79156, "epoch": 953} {"train_loss": -21.002214431762695, "global_step": 79157, "epoch": 953} {"train_loss": -21.207426071166992, "global_step": 79158, "epoch": 953} {"train_loss": -21.40058708190918, "global_step": 79159, "epoch": 953} {"train_loss": -21.188833236694336, "global_step": 79160, "epoch": 953} {"train_loss": -21.28469467163086, "global_step": 79161, "epoch": 953} {"train_loss": -21.320730209350586, "global_step": 79162, "epoch": 953} {"train_loss": -20.99043846130371, "global_step": 79163, "epoch": 953} {"train_loss": -21.41692543029785, "global_step": 79164, "epoch": 953} {"train_loss": -21.05618667602539, "global_step": 79165, "epoch": 953} {"train_loss": -21.03533172607422, "global_step": 79166, "epoch": 953} {"train_loss": -21.12030601501465, "global_step": 79167, "epoch": 953} {"train_loss": -21.395614624023438, "global_step": 79168, "epoch": 953} {"train_loss": -21.329572677612305, "global_step": 79169, "epoch": 953} {"train_loss": -21.019683837890625, "global_step": 79170, "epoch": 953} {"train_loss": -21.39983558654785, "global_step": 79171, "epoch": 953} {"train_loss": -21.222137451171875, "global_step": 79172, "epoch": 953} {"train_loss": -20.88981056213379, "global_step": 79173, "epoch": 953} {"train_loss": -21.03323745727539, "global_step": 79174, "epoch": 953} {"train_loss": -21.24738883972168, "global_step": 79175, "epoch": 953} {"train_loss": -21.260950088500977, "global_step": 79176, "epoch": 953} {"train_loss": -21.26328468322754, "global_step": 79177, "epoch": 953} {"train_loss": -21.07648277282715, "global_step": 79178, "epoch": 953} {"train_loss": -21.029836654663086, "global_step": 79179, "epoch": 953} {"train_loss": -21.35255241394043, "global_step": 79180, "epoch": 953} {"train_loss": -21.14623405272702, "global_step": 79181, "epoch": 953, "val_loss": 6016246.0} {"train_loss": -20.886402130126953, "global_step": 79182, "epoch": 954} {"train_loss": -21.273527145385742, "global_step": 79183, "epoch": 954} {"train_loss": -21.017841339111328, "global_step": 79184, "epoch": 954} {"train_loss": -21.04244041442871, "global_step": 79185, "epoch": 954} {"train_loss": -21.23371696472168, "global_step": 79186, "epoch": 954} {"train_loss": -21.236316680908203, "global_step": 79187, "epoch": 954} {"train_loss": -21.346181869506836, "global_step": 79188, "epoch": 954} {"train_loss": -21.32817840576172, "global_step": 79189, "epoch": 954} {"train_loss": -21.10287857055664, "global_step": 79190, "epoch": 954} {"train_loss": -21.2148494720459, "global_step": 79191, "epoch": 954} {"train_loss": -21.317174911499023, "global_step": 79192, "epoch": 954} {"train_loss": -21.118223190307617, "global_step": 79193, "epoch": 954} {"train_loss": -21.06268882751465, "global_step": 79194, "epoch": 954} {"train_loss": -21.287500381469727, "global_step": 79195, "epoch": 954} {"train_loss": -21.31565284729004, "global_step": 79196, "epoch": 954} {"train_loss": -21.024688720703125, "global_step": 79197, "epoch": 954} {"train_loss": -21.399261474609375, "global_step": 79198, "epoch": 954} {"train_loss": -21.318220138549805, "global_step": 79199, "epoch": 954} {"train_loss": -21.052490234375, "global_step": 79200, "epoch": 954} {"train_loss": -21.20606803894043, "global_step": 79201, "epoch": 954} {"train_loss": -20.985078811645508, "global_step": 79202, "epoch": 954} {"train_loss": -21.332387924194336, "global_step": 79203, "epoch": 954} {"train_loss": -20.738235473632812, "global_step": 79204, "epoch": 954} {"train_loss": -20.825300216674805, "global_step": 79205, "epoch": 954} {"train_loss": -21.323888778686523, "global_step": 79206, "epoch": 954} {"train_loss": -20.84669303894043, "global_step": 79207, "epoch": 954} {"train_loss": -21.229211807250977, "global_step": 79208, "epoch": 954} {"train_loss": -21.282339096069336, "global_step": 79209, "epoch": 954} {"train_loss": -21.10416603088379, "global_step": 79210, "epoch": 954} {"train_loss": -21.515100479125977, "global_step": 79211, "epoch": 954} {"train_loss": -21.362730026245117, "global_step": 79212, "epoch": 954} {"train_loss": -21.564483642578125, "global_step": 79213, "epoch": 954} {"train_loss": -21.0402774810791, "global_step": 79214, "epoch": 954} {"train_loss": -21.29564666748047, "global_step": 79215, "epoch": 954} {"train_loss": -21.36275291442871, "global_step": 79216, "epoch": 954} {"train_loss": -21.17563819885254, "global_step": 79217, "epoch": 954} {"train_loss": -21.125173568725586, "global_step": 79218, "epoch": 954} {"train_loss": -20.978744506835938, "global_step": 79219, "epoch": 954} {"train_loss": -21.57895851135254, "global_step": 79220, "epoch": 954} {"train_loss": -21.067657470703125, "global_step": 79221, "epoch": 954} {"train_loss": -21.06483268737793, "global_step": 79222, "epoch": 954} {"train_loss": -21.06587791442871, "global_step": 79223, "epoch": 954} {"train_loss": -21.522417068481445, "global_step": 79224, "epoch": 954} {"train_loss": -21.575658798217773, "global_step": 79225, "epoch": 954} {"train_loss": -21.338912963867188, "global_step": 79226, "epoch": 954} {"train_loss": -20.985076904296875, "global_step": 79227, "epoch": 954} {"train_loss": -20.754003524780273, "global_step": 79228, "epoch": 954} {"train_loss": -21.82094383239746, "global_step": 79229, "epoch": 954} {"train_loss": -20.946992874145508, "global_step": 79230, "epoch": 954} {"train_loss": -21.000362396240234, "global_step": 79231, "epoch": 954} {"train_loss": -20.92023277282715, "global_step": 79232, "epoch": 954} {"train_loss": -21.470962524414062, "global_step": 79233, "epoch": 954} {"train_loss": -21.085996627807617, "global_step": 79234, "epoch": 954} {"train_loss": -21.153682708740234, "global_step": 79235, "epoch": 954} {"train_loss": -21.1497859954834, "global_step": 79236, "epoch": 954} {"train_loss": -21.216352462768555, "global_step": 79237, "epoch": 954} {"train_loss": -21.324209213256836, "global_step": 79238, "epoch": 954} {"train_loss": -21.2036190032959, "global_step": 79239, "epoch": 954} {"train_loss": -21.094375610351562, "global_step": 79240, "epoch": 954} {"train_loss": -21.31318473815918, "global_step": 79241, "epoch": 954} {"train_loss": -21.185922622680664, "global_step": 79242, "epoch": 954} {"train_loss": -20.89564323425293, "global_step": 79243, "epoch": 954} {"train_loss": -21.071008682250977, "global_step": 79244, "epoch": 954} {"train_loss": -21.331998825073242, "global_step": 79245, "epoch": 954} {"train_loss": -21.164627075195312, "global_step": 79246, "epoch": 954} {"train_loss": -21.513797760009766, "global_step": 79247, "epoch": 954} {"train_loss": -21.010257720947266, "global_step": 79248, "epoch": 954} {"train_loss": -21.1232967376709, "global_step": 79249, "epoch": 954} {"train_loss": -21.31302833557129, "global_step": 79250, "epoch": 954} {"train_loss": -20.80032730102539, "global_step": 79251, "epoch": 954} {"train_loss": -20.95401382446289, "global_step": 79252, "epoch": 954} {"train_loss": -21.454973220825195, "global_step": 79253, "epoch": 954} {"train_loss": -21.202245712280273, "global_step": 79254, "epoch": 954} {"train_loss": -21.39967155456543, "global_step": 79255, "epoch": 954} {"train_loss": -21.078306198120117, "global_step": 79256, "epoch": 954} {"train_loss": -20.99099349975586, "global_step": 79257, "epoch": 954} {"train_loss": -21.107419967651367, "global_step": 79258, "epoch": 954} {"train_loss": -21.06294059753418, "global_step": 79259, "epoch": 954} {"train_loss": -20.631284713745117, "global_step": 79260, "epoch": 954} {"train_loss": -21.19266700744629, "global_step": 79261, "epoch": 954} {"train_loss": -21.04632568359375, "global_step": 79262, "epoch": 954} {"train_loss": -20.947874069213867, "global_step": 79263, "epoch": 954} {"train_loss": -21.176260959671204, "global_step": 79264, "epoch": 954, "val_loss": 6069736.5} {"train_loss": -20.582477569580078, "global_step": 79265, "epoch": 955} {"train_loss": -20.82443618774414, "global_step": 79266, "epoch": 955} {"train_loss": -20.933557510375977, "global_step": 79267, "epoch": 955} {"train_loss": -20.873666763305664, "global_step": 79268, "epoch": 955} {"train_loss": -20.639408111572266, "global_step": 79269, "epoch": 955} {"train_loss": -20.772438049316406, "global_step": 79270, "epoch": 955} {"train_loss": -21.087665557861328, "global_step": 79271, "epoch": 955} {"train_loss": -20.96098518371582, "global_step": 79272, "epoch": 955} {"train_loss": -21.096933364868164, "global_step": 79273, "epoch": 955} {"train_loss": -21.09354019165039, "global_step": 79274, "epoch": 955} {"train_loss": -20.599185943603516, "global_step": 79275, "epoch": 955} {"train_loss": -21.060728073120117, "global_step": 79276, "epoch": 955} {"train_loss": -21.33853530883789, "global_step": 79277, "epoch": 955} {"train_loss": -21.536096572875977, "global_step": 79278, "epoch": 955} {"train_loss": -21.196134567260742, "global_step": 79279, "epoch": 955} {"train_loss": -20.917816162109375, "global_step": 79280, "epoch": 955} {"train_loss": -21.10162353515625, "global_step": 79281, "epoch": 955} {"train_loss": -20.82915496826172, "global_step": 79282, "epoch": 955} {"train_loss": -21.285715103149414, "global_step": 79283, "epoch": 955} {"train_loss": -21.33534812927246, "global_step": 79284, "epoch": 955} {"train_loss": -21.678281784057617, "global_step": 79285, "epoch": 955} {"train_loss": -20.931543350219727, "global_step": 79286, "epoch": 955} {"train_loss": -20.818706512451172, "global_step": 79287, "epoch": 955} {"train_loss": -21.288679122924805, "global_step": 79288, "epoch": 955} {"train_loss": -20.968168258666992, "global_step": 79289, "epoch": 955} {"train_loss": -21.03854751586914, "global_step": 79290, "epoch": 955} {"train_loss": -21.115236282348633, "global_step": 79291, "epoch": 955} {"train_loss": -21.064069747924805, "global_step": 79292, "epoch": 955} {"train_loss": -20.846166610717773, "global_step": 79293, "epoch": 955} {"train_loss": -21.10048484802246, "global_step": 79294, "epoch": 955} {"train_loss": -21.29306411743164, "global_step": 79295, "epoch": 955} {"train_loss": -21.27130126953125, "global_step": 79296, "epoch": 955} {"train_loss": -21.1474552154541, "global_step": 79297, "epoch": 955} {"train_loss": -21.133581161499023, "global_step": 79298, "epoch": 955} {"train_loss": -21.119571685791016, "global_step": 79299, "epoch": 955} {"train_loss": -21.117385864257812, "global_step": 79300, "epoch": 955} {"train_loss": -21.167264938354492, "global_step": 79301, "epoch": 955} {"train_loss": -20.953542709350586, "global_step": 79302, "epoch": 955} {"train_loss": -20.853736877441406, "global_step": 79303, "epoch": 955} {"train_loss": -21.10091781616211, "global_step": 79304, "epoch": 955} {"train_loss": -21.108808517456055, "global_step": 79305, "epoch": 955} {"train_loss": -21.520238876342773, "global_step": 79306, "epoch": 955} {"train_loss": -21.564163208007812, "global_step": 79307, "epoch": 955} {"train_loss": -21.31956672668457, "global_step": 79308, "epoch": 955} {"train_loss": -21.38900375366211, "global_step": 79309, "epoch": 955} {"train_loss": -21.175254821777344, "global_step": 79310, "epoch": 955} {"train_loss": -21.340957641601562, "global_step": 79311, "epoch": 955} {"train_loss": -21.614309310913086, "global_step": 79312, "epoch": 955} {"train_loss": -21.256444931030273, "global_step": 79313, "epoch": 955} {"train_loss": -21.013980865478516, "global_step": 79314, "epoch": 955} {"train_loss": -21.45490837097168, "global_step": 79315, "epoch": 955} {"train_loss": -21.555150985717773, "global_step": 79316, "epoch": 955} {"train_loss": -20.932096481323242, "global_step": 79317, "epoch": 955} {"train_loss": -21.05459976196289, "global_step": 79318, "epoch": 955} {"train_loss": -20.974096298217773, "global_step": 79319, "epoch": 955} {"train_loss": -21.318269729614258, "global_step": 79320, "epoch": 955} {"train_loss": -21.186193466186523, "global_step": 79321, "epoch": 955} {"train_loss": -21.304468154907227, "global_step": 79322, "epoch": 955} {"train_loss": -21.246198654174805, "global_step": 79323, "epoch": 955} {"train_loss": -21.187776565551758, "global_step": 79324, "epoch": 955} {"train_loss": -21.41938591003418, "global_step": 79325, "epoch": 955} {"train_loss": -21.25784683227539, "global_step": 79326, "epoch": 955} {"train_loss": -21.50117301940918, "global_step": 79327, "epoch": 955} {"train_loss": -21.012853622436523, "global_step": 79328, "epoch": 955} {"train_loss": -21.164398193359375, "global_step": 79329, "epoch": 955} {"train_loss": -21.592084884643555, "global_step": 79330, "epoch": 955} {"train_loss": -21.254919052124023, "global_step": 79331, "epoch": 955} {"train_loss": -20.90984344482422, "global_step": 79332, "epoch": 955} {"train_loss": -21.00053596496582, "global_step": 79333, "epoch": 955} {"train_loss": -21.13587760925293, "global_step": 79334, "epoch": 955} {"train_loss": -21.0645809173584, "global_step": 79335, "epoch": 955} {"train_loss": -21.360794067382812, "global_step": 79336, "epoch": 955} {"train_loss": -21.27522087097168, "global_step": 79337, "epoch": 955} {"train_loss": -21.12853240966797, "global_step": 79338, "epoch": 955} {"train_loss": -21.25165367126465, "global_step": 79339, "epoch": 955} {"train_loss": -21.03645896911621, "global_step": 79340, "epoch": 955} {"train_loss": -20.88407325744629, "global_step": 79341, "epoch": 955} {"train_loss": -21.26242446899414, "global_step": 79342, "epoch": 955} {"train_loss": -20.773862838745117, "global_step": 79343, "epoch": 955} {"train_loss": -21.118085861206055, "global_step": 79344, "epoch": 955} {"train_loss": -21.85350799560547, "global_step": 79345, "epoch": 955} {"train_loss": -21.126230239868164, "global_step": 79346, "epoch": 955} {"train_loss": -21.156032263514508, "global_step": 79347, "epoch": 955, "val_loss": 5891352.0} {"train_loss": -20.850141525268555, "global_step": 79348, "epoch": 956} {"train_loss": -20.82427978515625, "global_step": 79349, "epoch": 956} {"train_loss": -21.196950912475586, "global_step": 79350, "epoch": 956} {"train_loss": -20.852624893188477, "global_step": 79351, "epoch": 956} {"train_loss": -21.39036750793457, "global_step": 79352, "epoch": 956} {"train_loss": -20.695852279663086, "global_step": 79353, "epoch": 956} {"train_loss": -20.897958755493164, "global_step": 79354, "epoch": 956} {"train_loss": -20.936918258666992, "global_step": 79355, "epoch": 956} {"train_loss": -21.131322860717773, "global_step": 79356, "epoch": 956} {"train_loss": -20.804502487182617, "global_step": 79357, "epoch": 956} {"train_loss": -21.296100616455078, "global_step": 79358, "epoch": 956} {"train_loss": -20.932905197143555, "global_step": 79359, "epoch": 956} {"train_loss": -21.209871292114258, "global_step": 79360, "epoch": 956} {"train_loss": -20.405942916870117, "global_step": 79361, "epoch": 956} {"train_loss": -20.7268009185791, "global_step": 79362, "epoch": 956} {"train_loss": -20.728132247924805, "global_step": 79363, "epoch": 956} {"train_loss": -21.104948043823242, "global_step": 79364, "epoch": 956} {"train_loss": -21.161666870117188, "global_step": 79365, "epoch": 956} {"train_loss": -21.07145118713379, "global_step": 79366, "epoch": 956} {"train_loss": -20.83901023864746, "global_step": 79367, "epoch": 956} {"train_loss": -21.089059829711914, "global_step": 79368, "epoch": 956} {"train_loss": -21.224145889282227, "global_step": 79369, "epoch": 956} {"train_loss": -20.7558650970459, "global_step": 79370, "epoch": 956} {"train_loss": -20.934873580932617, "global_step": 79371, "epoch": 956} {"train_loss": -21.142732620239258, "global_step": 79372, "epoch": 956} {"train_loss": -21.238649368286133, "global_step": 79373, "epoch": 956} {"train_loss": -21.04105567932129, "global_step": 79374, "epoch": 956} {"train_loss": -21.37240982055664, "global_step": 79375, "epoch": 956} {"train_loss": -21.013565063476562, "global_step": 79376, "epoch": 956} {"train_loss": -21.259445190429688, "global_step": 79377, "epoch": 956} {"train_loss": -21.045446395874023, "global_step": 79378, "epoch": 956} {"train_loss": -21.15830421447754, "global_step": 79379, "epoch": 956} {"train_loss": -21.427576065063477, "global_step": 79380, "epoch": 956} {"train_loss": -20.857736587524414, "global_step": 79381, "epoch": 956} {"train_loss": -20.913572311401367, "global_step": 79382, "epoch": 956} {"train_loss": -21.208707809448242, "global_step": 79383, "epoch": 956} {"train_loss": -20.78887939453125, "global_step": 79384, "epoch": 956} {"train_loss": -21.29019546508789, "global_step": 79385, "epoch": 956} {"train_loss": -21.220081329345703, "global_step": 79386, "epoch": 956} {"train_loss": -21.096067428588867, "global_step": 79387, "epoch": 956} {"train_loss": -21.100175857543945, "global_step": 79388, "epoch": 956} {"train_loss": -21.254627227783203, "global_step": 79389, "epoch": 956} {"train_loss": -21.20943832397461, "global_step": 79390, "epoch": 956} {"train_loss": -20.942569732666016, "global_step": 79391, "epoch": 956} {"train_loss": -21.302560806274414, "global_step": 79392, "epoch": 956} {"train_loss": -21.48554039001465, "global_step": 79393, "epoch": 956} {"train_loss": -20.858726501464844, "global_step": 79394, "epoch": 956} {"train_loss": -21.546051025390625, "global_step": 79395, "epoch": 956} {"train_loss": -20.836124420166016, "global_step": 79396, "epoch": 956} {"train_loss": -21.215988159179688, "global_step": 79397, "epoch": 956} {"train_loss": -21.246593475341797, "global_step": 79398, "epoch": 956} {"train_loss": -21.16147804260254, "global_step": 79399, "epoch": 956} {"train_loss": -21.232398986816406, "global_step": 79400, "epoch": 956} {"train_loss": -21.126392364501953, "global_step": 79401, "epoch": 956} {"train_loss": -20.87517738342285, "global_step": 79402, "epoch": 956} {"train_loss": -21.144453048706055, "global_step": 79403, "epoch": 956} {"train_loss": -20.800840377807617, "global_step": 79404, "epoch": 956} {"train_loss": -21.03634262084961, "global_step": 79405, "epoch": 956} {"train_loss": -20.902881622314453, "global_step": 79406, "epoch": 956} {"train_loss": -21.37447166442871, "global_step": 79407, "epoch": 956} {"train_loss": -21.34901237487793, "global_step": 79408, "epoch": 956} {"train_loss": -21.001977920532227, "global_step": 79409, "epoch": 956} {"train_loss": -21.0521240234375, "global_step": 79410, "epoch": 956} {"train_loss": -21.271146774291992, "global_step": 79411, "epoch": 956} {"train_loss": -21.087568283081055, "global_step": 79412, "epoch": 956} {"train_loss": -21.283071517944336, "global_step": 79413, "epoch": 956} {"train_loss": -21.1964168548584, "global_step": 79414, "epoch": 956} {"train_loss": -21.18403434753418, "global_step": 79415, "epoch": 956} {"train_loss": -21.293027877807617, "global_step": 79416, "epoch": 956} {"train_loss": -21.40751075744629, "global_step": 79417, "epoch": 956} {"train_loss": -21.157255172729492, "global_step": 79418, "epoch": 956} {"train_loss": -20.95481300354004, "global_step": 79419, "epoch": 956} {"train_loss": -21.37202262878418, "global_step": 79420, "epoch": 956} {"train_loss": -20.834875106811523, "global_step": 79421, "epoch": 956} {"train_loss": -21.53861427307129, "global_step": 79422, "epoch": 956} {"train_loss": -21.18867301940918, "global_step": 79423, "epoch": 956} {"train_loss": -21.02898597717285, "global_step": 79424, "epoch": 956} {"train_loss": -21.156747817993164, "global_step": 79425, "epoch": 956} {"train_loss": -21.30777359008789, "global_step": 79426, "epoch": 956} {"train_loss": -21.092248916625977, "global_step": 79427, "epoch": 956} {"train_loss": -21.036218643188477, "global_step": 79428, "epoch": 956} {"train_loss": -21.32599449157715, "global_step": 79429, "epoch": 956} {"train_loss": -21.10207417499588, "global_step": 79430, "epoch": 956, "val_loss": 6102209.5} {"train_loss": -20.660755157470703, "global_step": 79431, "epoch": 957} {"train_loss": -21.086233139038086, "global_step": 79432, "epoch": 957} {"train_loss": -20.949718475341797, "global_step": 79433, "epoch": 957} {"train_loss": -20.872827529907227, "global_step": 79434, "epoch": 957} {"train_loss": -20.941457748413086, "global_step": 79435, "epoch": 957} {"train_loss": -20.975210189819336, "global_step": 79436, "epoch": 957} {"train_loss": -21.129568099975586, "global_step": 79437, "epoch": 957} {"train_loss": -21.36507225036621, "global_step": 79438, "epoch": 957} {"train_loss": -20.915828704833984, "global_step": 79439, "epoch": 957} {"train_loss": -21.332351684570312, "global_step": 79440, "epoch": 957} {"train_loss": -21.217437744140625, "global_step": 79441, "epoch": 957} {"train_loss": -21.11444091796875, "global_step": 79442, "epoch": 957} {"train_loss": -21.10454559326172, "global_step": 79443, "epoch": 957} {"train_loss": -21.154953002929688, "global_step": 79444, "epoch": 957} {"train_loss": -21.302404403686523, "global_step": 79445, "epoch": 957} {"train_loss": -21.067626953125, "global_step": 79446, "epoch": 957} {"train_loss": -21.387357711791992, "global_step": 79447, "epoch": 957} {"train_loss": -20.869539260864258, "global_step": 79448, "epoch": 957} {"train_loss": -21.367542266845703, "global_step": 79449, "epoch": 957} {"train_loss": -21.36533546447754, "global_step": 79450, "epoch": 957} {"train_loss": -21.22805404663086, "global_step": 79451, "epoch": 957} {"train_loss": -21.122655868530273, "global_step": 79452, "epoch": 957} {"train_loss": -20.961936950683594, "global_step": 79453, "epoch": 957} {"train_loss": -21.391698837280273, "global_step": 79454, "epoch": 957} {"train_loss": -21.16585350036621, "global_step": 79455, "epoch": 957} {"train_loss": -21.010099411010742, "global_step": 79456, "epoch": 957} {"train_loss": -20.995214462280273, "global_step": 79457, "epoch": 957} {"train_loss": -21.410871505737305, "global_step": 79458, "epoch": 957} {"train_loss": -21.327756881713867, "global_step": 79459, "epoch": 957} {"train_loss": -21.17217445373535, "global_step": 79460, "epoch": 957} {"train_loss": -21.029804229736328, "global_step": 79461, "epoch": 957} {"train_loss": -21.144529342651367, "global_step": 79462, "epoch": 957} {"train_loss": -21.51283073425293, "global_step": 79463, "epoch": 957} {"train_loss": -21.26725196838379, "global_step": 79464, "epoch": 957} {"train_loss": -21.399381637573242, "global_step": 79465, "epoch": 957} {"train_loss": -21.08035659790039, "global_step": 79466, "epoch": 957} {"train_loss": -21.033727645874023, "global_step": 79467, "epoch": 957} {"train_loss": -21.213205337524414, "global_step": 79468, "epoch": 957} {"train_loss": -21.118473052978516, "global_step": 79469, "epoch": 957} {"train_loss": -21.163114547729492, "global_step": 79470, "epoch": 957} {"train_loss": -21.232175827026367, "global_step": 79471, "epoch": 957} {"train_loss": -20.81999397277832, "global_step": 79472, "epoch": 957} {"train_loss": -21.2248477935791, "global_step": 79473, "epoch": 957} {"train_loss": -21.031911849975586, "global_step": 79474, "epoch": 957} {"train_loss": -20.894681930541992, "global_step": 79475, "epoch": 957} {"train_loss": -21.364330291748047, "global_step": 79476, "epoch": 957} {"train_loss": -21.267770767211914, "global_step": 79477, "epoch": 957} {"train_loss": -20.967905044555664, "global_step": 79478, "epoch": 957} {"train_loss": -21.4610652923584, "global_step": 79479, "epoch": 957} {"train_loss": -21.21225357055664, "global_step": 79480, "epoch": 957} {"train_loss": -21.31358528137207, "global_step": 79481, "epoch": 957} {"train_loss": -20.974790573120117, "global_step": 79482, "epoch": 957} {"train_loss": -21.232284545898438, "global_step": 79483, "epoch": 957} {"train_loss": -21.264251708984375, "global_step": 79484, "epoch": 957} {"train_loss": -21.386051177978516, "global_step": 79485, "epoch": 957} {"train_loss": -21.08575439453125, "global_step": 79486, "epoch": 957} {"train_loss": -20.918004989624023, "global_step": 79487, "epoch": 957} {"train_loss": -20.997817993164062, "global_step": 79488, "epoch": 957} {"train_loss": -20.854827880859375, "global_step": 79489, "epoch": 957} {"train_loss": -21.34479522705078, "global_step": 79490, "epoch": 957} {"train_loss": -21.113637924194336, "global_step": 79491, "epoch": 957} {"train_loss": -21.12539291381836, "global_step": 79492, "epoch": 957} {"train_loss": -21.310176849365234, "global_step": 79493, "epoch": 957} {"train_loss": -20.90926742553711, "global_step": 79494, "epoch": 957} {"train_loss": -21.180017471313477, "global_step": 79495, "epoch": 957} {"train_loss": -21.4827938079834, "global_step": 79496, "epoch": 957} {"train_loss": -20.919904708862305, "global_step": 79497, "epoch": 957} {"train_loss": -21.26727867126465, "global_step": 79498, "epoch": 957} {"train_loss": -21.009489059448242, "global_step": 79499, "epoch": 957} {"train_loss": -21.377809524536133, "global_step": 79500, "epoch": 957} {"train_loss": -21.350025177001953, "global_step": 79501, "epoch": 957} {"train_loss": -21.365936279296875, "global_step": 79502, "epoch": 957} {"train_loss": -21.220489501953125, "global_step": 79503, "epoch": 957} {"train_loss": -21.222578048706055, "global_step": 79504, "epoch": 957} {"train_loss": -20.98394012451172, "global_step": 79505, "epoch": 957} {"train_loss": -21.035276412963867, "global_step": 79506, "epoch": 957} {"train_loss": -21.43729019165039, "global_step": 79507, "epoch": 957} {"train_loss": -21.1337890625, "global_step": 79508, "epoch": 957} {"train_loss": -21.107240676879883, "global_step": 79509, "epoch": 957} {"train_loss": -21.54188346862793, "global_step": 79510, "epoch": 957} {"train_loss": -21.265897750854492, "global_step": 79511, "epoch": 957} {"train_loss": -21.40073013305664, "global_step": 79512, "epoch": 957} {"train_loss": -21.170341767460467, "global_step": 79513, "epoch": 957, "val_loss": 6087264.0} {"train_loss": -20.254638671875, "global_step": 79514, "epoch": 958} {"train_loss": -20.506338119506836, "global_step": 79515, "epoch": 958} {"train_loss": -20.94172477722168, "global_step": 79516, "epoch": 958} {"train_loss": -20.2967529296875, "global_step": 79517, "epoch": 958} {"train_loss": -20.719327926635742, "global_step": 79518, "epoch": 958} {"train_loss": -21.172590255737305, "global_step": 79519, "epoch": 958} {"train_loss": -20.723791122436523, "global_step": 79520, "epoch": 958} {"train_loss": -20.898366928100586, "global_step": 79521, "epoch": 958} {"train_loss": -20.74001693725586, "global_step": 79522, "epoch": 958} {"train_loss": -21.341379165649414, "global_step": 79523, "epoch": 958} {"train_loss": -20.565893173217773, "global_step": 79524, "epoch": 958} {"train_loss": -20.82979393005371, "global_step": 79525, "epoch": 958} {"train_loss": -21.216400146484375, "global_step": 79526, "epoch": 958} {"train_loss": -20.8104248046875, "global_step": 79527, "epoch": 958} {"train_loss": -21.067468643188477, "global_step": 79528, "epoch": 958} {"train_loss": -21.080610275268555, "global_step": 79529, "epoch": 958} {"train_loss": -21.189361572265625, "global_step": 79530, "epoch": 958} {"train_loss": -20.861618041992188, "global_step": 79531, "epoch": 958} {"train_loss": -21.067258834838867, "global_step": 79532, "epoch": 958} {"train_loss": -21.170570373535156, "global_step": 79533, "epoch": 958} {"train_loss": -21.476621627807617, "global_step": 79534, "epoch": 958} {"train_loss": -20.921056747436523, "global_step": 79535, "epoch": 958} {"train_loss": -21.118444442749023, "global_step": 79536, "epoch": 958} {"train_loss": -20.877965927124023, "global_step": 79537, "epoch": 958} {"train_loss": -21.18219566345215, "global_step": 79538, "epoch": 958} {"train_loss": -21.566848754882812, "global_step": 79539, "epoch": 958} {"train_loss": -21.0723934173584, "global_step": 79540, "epoch": 958} {"train_loss": -21.29975700378418, "global_step": 79541, "epoch": 958} {"train_loss": -21.151941299438477, "global_step": 79542, "epoch": 958} {"train_loss": -21.069913864135742, "global_step": 79543, "epoch": 958} {"train_loss": -21.105518341064453, "global_step": 79544, "epoch": 958} {"train_loss": -21.384658813476562, "global_step": 79545, "epoch": 958} {"train_loss": -21.2236270904541, "global_step": 79546, "epoch": 958} {"train_loss": -21.25481414794922, "global_step": 79547, "epoch": 958} {"train_loss": -20.926740646362305, "global_step": 79548, "epoch": 958} {"train_loss": -21.127058029174805, "global_step": 79549, "epoch": 958} {"train_loss": -21.061683654785156, "global_step": 79550, "epoch": 958} {"train_loss": -21.11277198791504, "global_step": 79551, "epoch": 958} {"train_loss": -20.97286033630371, "global_step": 79552, "epoch": 958} {"train_loss": -21.005773544311523, "global_step": 79553, "epoch": 958} {"train_loss": -21.2983455657959, "global_step": 79554, "epoch": 958} {"train_loss": -21.4801025390625, "global_step": 79555, "epoch": 958} {"train_loss": -20.912771224975586, "global_step": 79556, "epoch": 958} {"train_loss": -21.185611724853516, "global_step": 79557, "epoch": 958} {"train_loss": -21.195934295654297, "global_step": 79558, "epoch": 958} {"train_loss": -21.053997039794922, "global_step": 79559, "epoch": 958} {"train_loss": -20.911008834838867, "global_step": 79560, "epoch": 958} {"train_loss": -21.372941970825195, "global_step": 79561, "epoch": 958} {"train_loss": -20.9672794342041, "global_step": 79562, "epoch": 958} {"train_loss": -21.049327850341797, "global_step": 79563, "epoch": 958} {"train_loss": -21.27130699157715, "global_step": 79564, "epoch": 958} {"train_loss": -21.282325744628906, "global_step": 79565, "epoch": 958} {"train_loss": -21.363208770751953, "global_step": 79566, "epoch": 958} {"train_loss": -21.255573272705078, "global_step": 79567, "epoch": 958} {"train_loss": -21.14822006225586, "global_step": 79568, "epoch": 958} {"train_loss": -21.144498825073242, "global_step": 79569, "epoch": 958} {"train_loss": -21.179365158081055, "global_step": 79570, "epoch": 958} {"train_loss": -21.131383895874023, "global_step": 79571, "epoch": 958} {"train_loss": -20.960758209228516, "global_step": 79572, "epoch": 958} {"train_loss": -21.49750518798828, "global_step": 79573, "epoch": 958} {"train_loss": -21.089075088500977, "global_step": 79574, "epoch": 958} {"train_loss": -21.12999725341797, "global_step": 79575, "epoch": 958} {"train_loss": -21.216083526611328, "global_step": 79576, "epoch": 958} {"train_loss": -21.549728393554688, "global_step": 79577, "epoch": 958} {"train_loss": -21.193288803100586, "global_step": 79578, "epoch": 958} {"train_loss": -21.168893814086914, "global_step": 79579, "epoch": 958} {"train_loss": -21.051898956298828, "global_step": 79580, "epoch": 958} {"train_loss": -21.355199813842773, "global_step": 79581, "epoch": 958} {"train_loss": -21.01132583618164, "global_step": 79582, "epoch": 958} {"train_loss": -21.185546875, "global_step": 79583, "epoch": 958} {"train_loss": -21.42486572265625, "global_step": 79584, "epoch": 958} {"train_loss": -21.275531768798828, "global_step": 79585, "epoch": 958} {"train_loss": -21.48653793334961, "global_step": 79586, "epoch": 958} {"train_loss": -21.192886352539062, "global_step": 79587, "epoch": 958} {"train_loss": -21.246448516845703, "global_step": 79588, "epoch": 958} {"train_loss": -21.413982391357422, "global_step": 79589, "epoch": 958} {"train_loss": -20.82651710510254, "global_step": 79590, "epoch": 958} {"train_loss": -21.262182235717773, "global_step": 79591, "epoch": 958} {"train_loss": -20.92324447631836, "global_step": 79592, "epoch": 958} {"train_loss": -21.38779067993164, "global_step": 79593, "epoch": 958} {"train_loss": -21.242345809936523, "global_step": 79594, "epoch": 958} {"train_loss": -21.28380584716797, "global_step": 79595, "epoch": 958} {"train_loss": -21.114058138376258, "global_step": 79596, "epoch": 958, "val_loss": 5958275.0} {"train_loss": -20.650501251220703, "global_step": 79597, "epoch": 959} {"train_loss": -21.31337547302246, "global_step": 79598, "epoch": 959} {"train_loss": -20.9560604095459, "global_step": 79599, "epoch": 959} {"train_loss": -21.23143768310547, "global_step": 79600, "epoch": 959} {"train_loss": -20.77106285095215, "global_step": 79601, "epoch": 959} {"train_loss": -20.962966918945312, "global_step": 79602, "epoch": 959} {"train_loss": -20.971303939819336, "global_step": 79603, "epoch": 959} {"train_loss": -21.28948211669922, "global_step": 79604, "epoch": 959} {"train_loss": -21.006431579589844, "global_step": 79605, "epoch": 959} {"train_loss": -20.93216323852539, "global_step": 79606, "epoch": 959} {"train_loss": -21.002059936523438, "global_step": 79607, "epoch": 959} {"train_loss": -21.089059829711914, "global_step": 79608, "epoch": 959} {"train_loss": -20.820798873901367, "global_step": 79609, "epoch": 959} {"train_loss": -20.85015106201172, "global_step": 79610, "epoch": 959} {"train_loss": -21.44434928894043, "global_step": 79611, "epoch": 959} {"train_loss": -20.945556640625, "global_step": 79612, "epoch": 959} {"train_loss": -21.123096466064453, "global_step": 79613, "epoch": 959} {"train_loss": -21.005979537963867, "global_step": 79614, "epoch": 959} {"train_loss": -21.023025512695312, "global_step": 79615, "epoch": 959} {"train_loss": -21.0695743560791, "global_step": 79616, "epoch": 959} {"train_loss": -21.09223747253418, "global_step": 79617, "epoch": 959} {"train_loss": -21.24530601501465, "global_step": 79618, "epoch": 959} {"train_loss": -21.141620635986328, "global_step": 79619, "epoch": 959} {"train_loss": -21.06460952758789, "global_step": 79620, "epoch": 959} {"train_loss": -21.26493263244629, "global_step": 79621, "epoch": 959} {"train_loss": -20.905170440673828, "global_step": 79622, "epoch": 959} {"train_loss": -21.239469528198242, "global_step": 79623, "epoch": 959} {"train_loss": -21.130937576293945, "global_step": 79624, "epoch": 959} {"train_loss": -21.249204635620117, "global_step": 79625, "epoch": 959} {"train_loss": -21.114303588867188, "global_step": 79626, "epoch": 959} {"train_loss": -20.929975509643555, "global_step": 79627, "epoch": 959} {"train_loss": -21.27991485595703, "global_step": 79628, "epoch": 959} {"train_loss": -20.98172950744629, "global_step": 79629, "epoch": 959} {"train_loss": -21.32680320739746, "global_step": 79630, "epoch": 959} {"train_loss": -21.4008846282959, "global_step": 79631, "epoch": 959} {"train_loss": -21.136640548706055, "global_step": 79632, "epoch": 959} {"train_loss": -21.336088180541992, "global_step": 79633, "epoch": 959} {"train_loss": -21.309606552124023, "global_step": 79634, "epoch": 959} {"train_loss": -21.1319637298584, "global_step": 79635, "epoch": 959} {"train_loss": -21.264135360717773, "global_step": 79636, "epoch": 959} {"train_loss": -21.30428123474121, "global_step": 79637, "epoch": 959} {"train_loss": -21.254789352416992, "global_step": 79638, "epoch": 959} {"train_loss": -21.30438804626465, "global_step": 79639, "epoch": 959} {"train_loss": -21.31020164489746, "global_step": 79640, "epoch": 959} {"train_loss": -21.428022384643555, "global_step": 79641, "epoch": 959} {"train_loss": -21.29683494567871, "global_step": 79642, "epoch": 959} {"train_loss": -21.313648223876953, "global_step": 79643, "epoch": 959} {"train_loss": -21.020423889160156, "global_step": 79644, "epoch": 959} {"train_loss": -21.618864059448242, "global_step": 79645, "epoch": 959} {"train_loss": -21.1112003326416, "global_step": 79646, "epoch": 959} {"train_loss": -21.054929733276367, "global_step": 79647, "epoch": 959} {"train_loss": -21.185291290283203, "global_step": 79648, "epoch": 959} {"train_loss": -21.087326049804688, "global_step": 79649, "epoch": 959} {"train_loss": -21.054662704467773, "global_step": 79650, "epoch": 959} {"train_loss": -21.381614685058594, "global_step": 79651, "epoch": 959} {"train_loss": -21.495832443237305, "global_step": 79652, "epoch": 959} {"train_loss": -21.021774291992188, "global_step": 79653, "epoch": 959} {"train_loss": -21.18979835510254, "global_step": 79654, "epoch": 959} {"train_loss": -21.203378677368164, "global_step": 79655, "epoch": 959} {"train_loss": -20.812332153320312, "global_step": 79656, "epoch": 959} {"train_loss": -21.292726516723633, "global_step": 79657, "epoch": 959} {"train_loss": -21.308752059936523, "global_step": 79658, "epoch": 959} {"train_loss": -21.33576011657715, "global_step": 79659, "epoch": 959} {"train_loss": -21.264625549316406, "global_step": 79660, "epoch": 959} {"train_loss": -20.865018844604492, "global_step": 79661, "epoch": 959} {"train_loss": -21.607358932495117, "global_step": 79662, "epoch": 959} {"train_loss": -21.502357482910156, "global_step": 79663, "epoch": 959} {"train_loss": -20.876306533813477, "global_step": 79664, "epoch": 959} {"train_loss": -20.802005767822266, "global_step": 79665, "epoch": 959} {"train_loss": -21.142423629760742, "global_step": 79666, "epoch": 959} {"train_loss": -20.998626708984375, "global_step": 79667, "epoch": 959} {"train_loss": -21.278728485107422, "global_step": 79668, "epoch": 959} {"train_loss": -21.2072811126709, "global_step": 79669, "epoch": 959} {"train_loss": -21.237808227539062, "global_step": 79670, "epoch": 959} {"train_loss": -20.893545150756836, "global_step": 79671, "epoch": 959} {"train_loss": -21.460737228393555, "global_step": 79672, "epoch": 959} {"train_loss": -21.52923011779785, "global_step": 79673, "epoch": 959} {"train_loss": -21.05978012084961, "global_step": 79674, "epoch": 959} {"train_loss": -21.83949089050293, "global_step": 79675, "epoch": 959} {"train_loss": -21.14385986328125, "global_step": 79676, "epoch": 959} {"train_loss": -21.123519897460938, "global_step": 79677, "epoch": 959} {"train_loss": -21.092798233032227, "global_step": 79678, "epoch": 959} {"train_loss": -21.15896328386054, "global_step": 79679, "epoch": 959, "val_loss": 6126414.5} {"train_loss": -19.620473861694336, "global_step": 79680, "epoch": 960} {"train_loss": -20.76710319519043, "global_step": 79681, "epoch": 960} {"train_loss": -20.363807678222656, "global_step": 79682, "epoch": 960} {"train_loss": -20.20682716369629, "global_step": 79683, "epoch": 960} {"train_loss": -20.20086097717285, "global_step": 79684, "epoch": 960} {"train_loss": -20.27782440185547, "global_step": 79685, "epoch": 960} {"train_loss": -20.458803176879883, "global_step": 79686, "epoch": 960} {"train_loss": -20.9440860748291, "global_step": 79687, "epoch": 960} {"train_loss": -20.388364791870117, "global_step": 79688, "epoch": 960} {"train_loss": -20.853055953979492, "global_step": 79689, "epoch": 960} {"train_loss": -20.67203140258789, "global_step": 79690, "epoch": 960} {"train_loss": -20.654150009155273, "global_step": 79691, "epoch": 960} {"train_loss": -20.7202205657959, "global_step": 79692, "epoch": 960} {"train_loss": -20.771696090698242, "global_step": 79693, "epoch": 960} {"train_loss": -20.748136520385742, "global_step": 79694, "epoch": 960} {"train_loss": -20.54924774169922, "global_step": 79695, "epoch": 960} {"train_loss": -20.744544982910156, "global_step": 79696, "epoch": 960} {"train_loss": -20.952016830444336, "global_step": 79697, "epoch": 960} {"train_loss": -20.719877243041992, "global_step": 79698, "epoch": 960} {"train_loss": -20.758787155151367, "global_step": 79699, "epoch": 960} {"train_loss": -21.053335189819336, "global_step": 79700, "epoch": 960} {"train_loss": -21.25804901123047, "global_step": 79701, "epoch": 960} {"train_loss": -21.04397964477539, "global_step": 79702, "epoch": 960} {"train_loss": -20.765233993530273, "global_step": 79703, "epoch": 960} {"train_loss": -21.079853057861328, "global_step": 79704, "epoch": 960} {"train_loss": -20.924680709838867, "global_step": 79705, "epoch": 960} {"train_loss": -21.12660789489746, "global_step": 79706, "epoch": 960} {"train_loss": -20.946626663208008, "global_step": 79707, "epoch": 960} {"train_loss": -21.182554244995117, "global_step": 79708, "epoch": 960} {"train_loss": -21.00309181213379, "global_step": 79709, "epoch": 960} {"train_loss": -21.36528778076172, "global_step": 79710, "epoch": 960} {"train_loss": -21.45255470275879, "global_step": 79711, "epoch": 960} {"train_loss": -21.33011245727539, "global_step": 79712, "epoch": 960} {"train_loss": -21.687376022338867, "global_step": 79713, "epoch": 960} {"train_loss": -21.25459861755371, "global_step": 79714, "epoch": 960} {"train_loss": -21.026918411254883, "global_step": 79715, "epoch": 960} {"train_loss": -20.8572998046875, "global_step": 79716, "epoch": 960} {"train_loss": -20.9210262298584, "global_step": 79717, "epoch": 960} {"train_loss": -21.156753540039062, "global_step": 79718, "epoch": 960} {"train_loss": -21.385766983032227, "global_step": 79719, "epoch": 960} {"train_loss": -21.490224838256836, "global_step": 79720, "epoch": 960} {"train_loss": -20.87001609802246, "global_step": 79721, "epoch": 960} {"train_loss": -21.308298110961914, "global_step": 79722, "epoch": 960} {"train_loss": -21.03485679626465, "global_step": 79723, "epoch": 960} {"train_loss": -21.33677101135254, "global_step": 79724, "epoch": 960} {"train_loss": -20.955312728881836, "global_step": 79725, "epoch": 960} {"train_loss": -20.982147216796875, "global_step": 79726, "epoch": 960} {"train_loss": -21.29473876953125, "global_step": 79727, "epoch": 960} {"train_loss": -21.28146743774414, "global_step": 79728, "epoch": 960} {"train_loss": -21.498022079467773, "global_step": 79729, "epoch": 960} {"train_loss": -21.556421279907227, "global_step": 79730, "epoch": 960} {"train_loss": -20.9908447265625, "global_step": 79731, "epoch": 960} {"train_loss": -21.24399757385254, "global_step": 79732, "epoch": 960} {"train_loss": -21.23616600036621, "global_step": 79733, "epoch": 960} {"train_loss": -21.417247772216797, "global_step": 79734, "epoch": 960} {"train_loss": -21.438684463500977, "global_step": 79735, "epoch": 960} {"train_loss": -21.206628799438477, "global_step": 79736, "epoch": 960} {"train_loss": -21.49112892150879, "global_step": 79737, "epoch": 960} {"train_loss": -21.35414695739746, "global_step": 79738, "epoch": 960} {"train_loss": -21.018306732177734, "global_step": 79739, "epoch": 960} {"train_loss": -21.140148162841797, "global_step": 79740, "epoch": 960} {"train_loss": -21.324359893798828, "global_step": 79741, "epoch": 960} {"train_loss": -21.113815307617188, "global_step": 79742, "epoch": 960} {"train_loss": -20.849369049072266, "global_step": 79743, "epoch": 960} {"train_loss": -21.131759643554688, "global_step": 79744, "epoch": 960} {"train_loss": -21.47041130065918, "global_step": 79745, "epoch": 960} {"train_loss": -20.98303985595703, "global_step": 79746, "epoch": 960} {"train_loss": -21.52402687072754, "global_step": 79747, "epoch": 960} {"train_loss": -21.341754913330078, "global_step": 79748, "epoch": 960} {"train_loss": -20.997751235961914, "global_step": 79749, "epoch": 960} {"train_loss": -21.2957763671875, "global_step": 79750, "epoch": 960} {"train_loss": -20.861677169799805, "global_step": 79751, "epoch": 960} {"train_loss": -21.27134132385254, "global_step": 79752, "epoch": 960} {"train_loss": -21.019899368286133, "global_step": 79753, "epoch": 960} {"train_loss": -21.295988082885742, "global_step": 79754, "epoch": 960} {"train_loss": -21.224294662475586, "global_step": 79755, "epoch": 960} {"train_loss": -21.32924461364746, "global_step": 79756, "epoch": 960} {"train_loss": -21.092700958251953, "global_step": 79757, "epoch": 960} {"train_loss": -21.17375946044922, "global_step": 79758, "epoch": 960} {"train_loss": -21.00275993347168, "global_step": 79759, "epoch": 960} {"train_loss": -21.308279037475586, "global_step": 79760, "epoch": 960} {"train_loss": -21.446205139160156, "global_step": 79761, "epoch": 960} {"train_loss": -21.051697099065205, "global_step": 79762, "epoch": 960, "val_loss": 6196412.5} {"train_loss": -20.531583786010742, "global_step": 79763, "epoch": 961} {"train_loss": -20.969409942626953, "global_step": 79764, "epoch": 961} {"train_loss": -21.05135154724121, "global_step": 79765, "epoch": 961} {"train_loss": -20.827011108398438, "global_step": 79766, "epoch": 961} {"train_loss": -20.50641632080078, "global_step": 79767, "epoch": 961} {"train_loss": -21.256210327148438, "global_step": 79768, "epoch": 961} {"train_loss": -21.211322784423828, "global_step": 79769, "epoch": 961} {"train_loss": -20.811426162719727, "global_step": 79770, "epoch": 961} {"train_loss": -21.332660675048828, "global_step": 79771, "epoch": 961} {"train_loss": -21.445520401000977, "global_step": 79772, "epoch": 961} {"train_loss": -20.9052791595459, "global_step": 79773, "epoch": 961} {"train_loss": -20.816984176635742, "global_step": 79774, "epoch": 961} {"train_loss": -21.12334442138672, "global_step": 79775, "epoch": 961} {"train_loss": -20.9002742767334, "global_step": 79776, "epoch": 961} {"train_loss": -21.201705932617188, "global_step": 79777, "epoch": 961} {"train_loss": -20.8531436920166, "global_step": 79778, "epoch": 961} {"train_loss": -21.119531631469727, "global_step": 79779, "epoch": 961} {"train_loss": -21.036285400390625, "global_step": 79780, "epoch": 961} {"train_loss": -21.215120315551758, "global_step": 79781, "epoch": 961} {"train_loss": -21.488393783569336, "global_step": 79782, "epoch": 961} {"train_loss": -21.067363739013672, "global_step": 79783, "epoch": 961} {"train_loss": -21.104206085205078, "global_step": 79784, "epoch": 961} {"train_loss": -21.263830184936523, "global_step": 79785, "epoch": 961} {"train_loss": -21.170673370361328, "global_step": 79786, "epoch": 961} {"train_loss": -21.19515609741211, "global_step": 79787, "epoch": 961} {"train_loss": -21.246007919311523, "global_step": 79788, "epoch": 961} {"train_loss": -21.296070098876953, "global_step": 79789, "epoch": 961} {"train_loss": -20.968326568603516, "global_step": 79790, "epoch": 961} {"train_loss": -21.050369262695312, "global_step": 79791, "epoch": 961} {"train_loss": -21.54836082458496, "global_step": 79792, "epoch": 961} {"train_loss": -21.408340454101562, "global_step": 79793, "epoch": 961} {"train_loss": -21.235198974609375, "global_step": 79794, "epoch": 961} {"train_loss": -20.992645263671875, "global_step": 79795, "epoch": 961} {"train_loss": -21.301599502563477, "global_step": 79796, "epoch": 961} {"train_loss": -21.334421157836914, "global_step": 79797, "epoch": 961} {"train_loss": -20.985639572143555, "global_step": 79798, "epoch": 961} {"train_loss": -21.326618194580078, "global_step": 79799, "epoch": 961} {"train_loss": -20.901309967041016, "global_step": 79800, "epoch": 961} {"train_loss": -21.254653930664062, "global_step": 79801, "epoch": 961} {"train_loss": -21.223947525024414, "global_step": 79802, "epoch": 961} {"train_loss": -20.517715454101562, "global_step": 79803, "epoch": 961} {"train_loss": -21.21537971496582, "global_step": 79804, "epoch": 961} {"train_loss": -21.50638198852539, "global_step": 79805, "epoch": 961} {"train_loss": -21.054092407226562, "global_step": 79806, "epoch": 961} {"train_loss": -21.29780387878418, "global_step": 79807, "epoch": 961} {"train_loss": -21.01808738708496, "global_step": 79808, "epoch": 961} {"train_loss": -20.90005874633789, "global_step": 79809, "epoch": 961} {"train_loss": -21.16963005065918, "global_step": 79810, "epoch": 961} {"train_loss": -20.630523681640625, "global_step": 79811, "epoch": 961} {"train_loss": -20.902433395385742, "global_step": 79812, "epoch": 961} {"train_loss": -20.962568283081055, "global_step": 79813, "epoch": 961} {"train_loss": -21.0050048828125, "global_step": 79814, "epoch": 961} {"train_loss": -21.207651138305664, "global_step": 79815, "epoch": 961} {"train_loss": -21.391826629638672, "global_step": 79816, "epoch": 961} {"train_loss": -20.756662368774414, "global_step": 79817, "epoch": 961} {"train_loss": -21.08314323425293, "global_step": 79818, "epoch": 961} {"train_loss": -21.179479598999023, "global_step": 79819, "epoch": 961} {"train_loss": -21.052997589111328, "global_step": 79820, "epoch": 961} {"train_loss": -21.019865036010742, "global_step": 79821, "epoch": 961} {"train_loss": -21.299863815307617, "global_step": 79822, "epoch": 961} {"train_loss": -21.528066635131836, "global_step": 79823, "epoch": 961} {"train_loss": -21.55927085876465, "global_step": 79824, "epoch": 961} {"train_loss": -21.294530868530273, "global_step": 79825, "epoch": 961} {"train_loss": -21.303844451904297, "global_step": 79826, "epoch": 961} {"train_loss": -21.856592178344727, "global_step": 79827, "epoch": 961} {"train_loss": -21.243722915649414, "global_step": 79828, "epoch": 961} {"train_loss": -21.218124389648438, "global_step": 79829, "epoch": 961} {"train_loss": -21.003210067749023, "global_step": 79830, "epoch": 961} {"train_loss": -21.059253692626953, "global_step": 79831, "epoch": 961} {"train_loss": -21.29542350769043, "global_step": 79832, "epoch": 961} {"train_loss": -21.416921615600586, "global_step": 79833, "epoch": 961} {"train_loss": -21.118066787719727, "global_step": 79834, "epoch": 961} {"train_loss": -21.357072830200195, "global_step": 79835, "epoch": 961} {"train_loss": -21.024642944335938, "global_step": 79836, "epoch": 961} {"train_loss": -21.273366928100586, "global_step": 79837, "epoch": 961} {"train_loss": -21.2277774810791, "global_step": 79838, "epoch": 961} {"train_loss": -21.437772750854492, "global_step": 79839, "epoch": 961} {"train_loss": -21.058759689331055, "global_step": 79840, "epoch": 961} {"train_loss": -21.244882583618164, "global_step": 79841, "epoch": 961} {"train_loss": -21.069503784179688, "global_step": 79842, "epoch": 961} {"train_loss": -20.8901424407959, "global_step": 79843, "epoch": 961} {"train_loss": -21.059619903564453, "global_step": 79844, "epoch": 961} {"train_loss": -21.12662696838379, "global_step": 79845, "epoch": 961, "val_loss": 6029167.0} {"train_loss": -20.57961082458496, "global_step": 79846, "epoch": 962} {"train_loss": -21.00249481201172, "global_step": 79847, "epoch": 962} {"train_loss": -20.908533096313477, "global_step": 79848, "epoch": 962} {"train_loss": -21.05027198791504, "global_step": 79849, "epoch": 962} {"train_loss": -20.984891891479492, "global_step": 79850, "epoch": 962} {"train_loss": -21.162569046020508, "global_step": 79851, "epoch": 962} {"train_loss": -20.778491973876953, "global_step": 79852, "epoch": 962} {"train_loss": -20.80083465576172, "global_step": 79853, "epoch": 962} {"train_loss": -20.686017990112305, "global_step": 79854, "epoch": 962} {"train_loss": -20.77534294128418, "global_step": 79855, "epoch": 962} {"train_loss": -21.14656639099121, "global_step": 79856, "epoch": 962} {"train_loss": -20.745960235595703, "global_step": 79857, "epoch": 962} {"train_loss": -21.339990615844727, "global_step": 79858, "epoch": 962} {"train_loss": -20.76102638244629, "global_step": 79859, "epoch": 962} {"train_loss": -21.25758171081543, "global_step": 79860, "epoch": 962} {"train_loss": -21.2001895904541, "global_step": 79861, "epoch": 962} {"train_loss": -20.947458267211914, "global_step": 79862, "epoch": 962} {"train_loss": -20.861623764038086, "global_step": 79863, "epoch": 962} {"train_loss": -20.996320724487305, "global_step": 79864, "epoch": 962} {"train_loss": -21.10090446472168, "global_step": 79865, "epoch": 962} {"train_loss": -21.378433227539062, "global_step": 79866, "epoch": 962} {"train_loss": -21.105485916137695, "global_step": 79867, "epoch": 962} {"train_loss": -20.80757713317871, "global_step": 79868, "epoch": 962} {"train_loss": -21.140806198120117, "global_step": 79869, "epoch": 962} {"train_loss": -20.831525802612305, "global_step": 79870, "epoch": 962} {"train_loss": -21.46198844909668, "global_step": 79871, "epoch": 962} {"train_loss": -21.170503616333008, "global_step": 79872, "epoch": 962} {"train_loss": -21.17292594909668, "global_step": 79873, "epoch": 962} {"train_loss": -21.168685913085938, "global_step": 79874, "epoch": 962} {"train_loss": -21.160085678100586, "global_step": 79875, "epoch": 962} {"train_loss": -21.1329345703125, "global_step": 79876, "epoch": 962} {"train_loss": -21.134313583374023, "global_step": 79877, "epoch": 962} {"train_loss": -21.30893898010254, "global_step": 79878, "epoch": 962} {"train_loss": -21.275110244750977, "global_step": 79879, "epoch": 962} {"train_loss": -21.34779167175293, "global_step": 79880, "epoch": 962} {"train_loss": -21.19215965270996, "global_step": 79881, "epoch": 962} {"train_loss": -21.303274154663086, "global_step": 79882, "epoch": 962} {"train_loss": -21.43019676208496, "global_step": 79883, "epoch": 962} {"train_loss": -21.489212036132812, "global_step": 79884, "epoch": 962} {"train_loss": -21.0196533203125, "global_step": 79885, "epoch": 962} {"train_loss": -21.16185760498047, "global_step": 79886, "epoch": 962} {"train_loss": -21.20281219482422, "global_step": 79887, "epoch": 962} {"train_loss": -21.488229751586914, "global_step": 79888, "epoch": 962} {"train_loss": -20.85841178894043, "global_step": 79889, "epoch": 962} {"train_loss": -21.249786376953125, "global_step": 79890, "epoch": 962} {"train_loss": -21.03758430480957, "global_step": 79891, "epoch": 962} {"train_loss": -21.381315231323242, "global_step": 79892, "epoch": 962} {"train_loss": -21.626922607421875, "global_step": 79893, "epoch": 962} {"train_loss": -21.580366134643555, "global_step": 79894, "epoch": 962} {"train_loss": -21.040796279907227, "global_step": 79895, "epoch": 962} {"train_loss": -20.847806930541992, "global_step": 79896, "epoch": 962} {"train_loss": -21.289793014526367, "global_step": 79897, "epoch": 962} {"train_loss": -20.977163314819336, "global_step": 79898, "epoch": 962} {"train_loss": -20.970712661743164, "global_step": 79899, "epoch": 962} {"train_loss": -21.2611141204834, "global_step": 79900, "epoch": 962} {"train_loss": -21.0145206451416, "global_step": 79901, "epoch": 962} {"train_loss": -21.420560836791992, "global_step": 79902, "epoch": 962} {"train_loss": -21.15187644958496, "global_step": 79903, "epoch": 962} {"train_loss": -20.983118057250977, "global_step": 79904, "epoch": 962} {"train_loss": -21.039518356323242, "global_step": 79905, "epoch": 962} {"train_loss": -21.01072883605957, "global_step": 79906, "epoch": 962} {"train_loss": -21.1442928314209, "global_step": 79907, "epoch": 962} {"train_loss": -21.62788200378418, "global_step": 79908, "epoch": 962} {"train_loss": -21.041128158569336, "global_step": 79909, "epoch": 962} {"train_loss": -21.24662971496582, "global_step": 79910, "epoch": 962} {"train_loss": -21.280485153198242, "global_step": 79911, "epoch": 962} {"train_loss": -21.08359718322754, "global_step": 79912, "epoch": 962} {"train_loss": -21.288570404052734, "global_step": 79913, "epoch": 962} {"train_loss": -21.185361862182617, "global_step": 79914, "epoch": 962} {"train_loss": -21.06434440612793, "global_step": 79915, "epoch": 962} {"train_loss": -21.43222427368164, "global_step": 79916, "epoch": 962} {"train_loss": -21.201213836669922, "global_step": 79917, "epoch": 962} {"train_loss": -21.265756607055664, "global_step": 79918, "epoch": 962} {"train_loss": -20.596433639526367, "global_step": 79919, "epoch": 962} {"train_loss": -21.153629302978516, "global_step": 79920, "epoch": 962} {"train_loss": -21.596790313720703, "global_step": 79921, "epoch": 962} {"train_loss": -21.07683753967285, "global_step": 79922, "epoch": 962} {"train_loss": -20.81954002380371, "global_step": 79923, "epoch": 962} {"train_loss": -21.4090576171875, "global_step": 79924, "epoch": 962} {"train_loss": -21.146169662475586, "global_step": 79925, "epoch": 962} {"train_loss": -21.413124084472656, "global_step": 79926, "epoch": 962} {"train_loss": -21.10483169555664, "global_step": 79927, "epoch": 962} {"train_loss": -21.12693834879312, "global_step": 79928, "epoch": 962, "val_loss": 6104272.0} {"train_loss": -21.01826286315918, "global_step": 79929, "epoch": 963} {"train_loss": -20.533945083618164, "global_step": 79930, "epoch": 963} {"train_loss": -21.283802032470703, "global_step": 79931, "epoch": 963} {"train_loss": -20.815961837768555, "global_step": 79932, "epoch": 963} {"train_loss": -20.686471939086914, "global_step": 79933, "epoch": 963} {"train_loss": -20.766626358032227, "global_step": 79934, "epoch": 963} {"train_loss": -21.10634422302246, "global_step": 79935, "epoch": 963} {"train_loss": -21.323949813842773, "global_step": 79936, "epoch": 963} {"train_loss": -20.750869750976562, "global_step": 79937, "epoch": 963} {"train_loss": -21.02414321899414, "global_step": 79938, "epoch": 963} {"train_loss": -20.974699020385742, "global_step": 79939, "epoch": 963} {"train_loss": -20.963455200195312, "global_step": 79940, "epoch": 963} {"train_loss": -21.19370460510254, "global_step": 79941, "epoch": 963} {"train_loss": -21.05001449584961, "global_step": 79942, "epoch": 963} {"train_loss": -21.240331649780273, "global_step": 79943, "epoch": 963} {"train_loss": -21.011144638061523, "global_step": 79944, "epoch": 963} {"train_loss": -21.268613815307617, "global_step": 79945, "epoch": 963} {"train_loss": -21.177352905273438, "global_step": 79946, "epoch": 963} {"train_loss": -20.948408126831055, "global_step": 79947, "epoch": 963} {"train_loss": -21.34660530090332, "global_step": 79948, "epoch": 963} {"train_loss": -21.130142211914062, "global_step": 79949, "epoch": 963} {"train_loss": -20.83852195739746, "global_step": 79950, "epoch": 963} {"train_loss": -20.823951721191406, "global_step": 79951, "epoch": 963} {"train_loss": -20.86794090270996, "global_step": 79952, "epoch": 963} {"train_loss": -20.966094970703125, "global_step": 79953, "epoch": 963} {"train_loss": -21.242807388305664, "global_step": 79954, "epoch": 963} {"train_loss": -20.988384246826172, "global_step": 79955, "epoch": 963} {"train_loss": -20.94439697265625, "global_step": 79956, "epoch": 963} {"train_loss": -21.326324462890625, "global_step": 79957, "epoch": 963} {"train_loss": -21.757291793823242, "global_step": 79958, "epoch": 963} {"train_loss": -21.30430030822754, "global_step": 79959, "epoch": 963} {"train_loss": -21.106210708618164, "global_step": 79960, "epoch": 963} {"train_loss": -20.871679306030273, "global_step": 79961, "epoch": 963} {"train_loss": -21.399948120117188, "global_step": 79962, "epoch": 963} {"train_loss": -21.149030685424805, "global_step": 79963, "epoch": 963} {"train_loss": -21.234403610229492, "global_step": 79964, "epoch": 963} {"train_loss": -21.436176300048828, "global_step": 79965, "epoch": 963} {"train_loss": -21.426267623901367, "global_step": 79966, "epoch": 963} {"train_loss": -21.371475219726562, "global_step": 79967, "epoch": 963} {"train_loss": -21.130840301513672, "global_step": 79968, "epoch": 963} {"train_loss": -21.209012985229492, "global_step": 79969, "epoch": 963} {"train_loss": -21.5775203704834, "global_step": 79970, "epoch": 963} {"train_loss": -21.593164443969727, "global_step": 79971, "epoch": 963} {"train_loss": -21.2745418548584, "global_step": 79972, "epoch": 963} {"train_loss": -21.076385498046875, "global_step": 79973, "epoch": 963} {"train_loss": -21.289264678955078, "global_step": 79974, "epoch": 963} {"train_loss": -21.273101806640625, "global_step": 79975, "epoch": 963} {"train_loss": -20.84805679321289, "global_step": 79976, "epoch": 963} {"train_loss": -20.927623748779297, "global_step": 79977, "epoch": 963} {"train_loss": -20.9636173248291, "global_step": 79978, "epoch": 963} {"train_loss": -21.185495376586914, "global_step": 79979, "epoch": 963} {"train_loss": -21.160438537597656, "global_step": 79980, "epoch": 963} {"train_loss": -21.135910034179688, "global_step": 79981, "epoch": 963} {"train_loss": -20.971088409423828, "global_step": 79982, "epoch": 963} {"train_loss": -21.349822998046875, "global_step": 79983, "epoch": 963} {"train_loss": -21.45656394958496, "global_step": 79984, "epoch": 963} {"train_loss": -21.1682186126709, "global_step": 79985, "epoch": 963} {"train_loss": -21.26972198486328, "global_step": 79986, "epoch": 963} {"train_loss": -21.639118194580078, "global_step": 79987, "epoch": 963} {"train_loss": -21.26882553100586, "global_step": 79988, "epoch": 963} {"train_loss": -21.35872459411621, "global_step": 79989, "epoch": 963} {"train_loss": -21.526935577392578, "global_step": 79990, "epoch": 963} {"train_loss": -21.072132110595703, "global_step": 79991, "epoch": 963} {"train_loss": -21.089492797851562, "global_step": 79992, "epoch": 963} {"train_loss": -21.392122268676758, "global_step": 79993, "epoch": 963} {"train_loss": -21.172042846679688, "global_step": 79994, "epoch": 963} {"train_loss": -21.329315185546875, "global_step": 79995, "epoch": 963} {"train_loss": -20.890640258789062, "global_step": 79996, "epoch": 963} {"train_loss": -20.921913146972656, "global_step": 79997, "epoch": 963} {"train_loss": -21.492313385009766, "global_step": 79998, "epoch": 963} {"train_loss": -20.877599716186523, "global_step": 79999, "epoch": 963} {"train_loss": -21.56332015991211, "global_step": 80000, "epoch": 963} {"train_loss": -21.299915313720703, "global_step": 80001, "epoch": 963} {"train_loss": -21.191030502319336, "global_step": 80002, "epoch": 963} {"train_loss": -21.313098907470703, "global_step": 80003, "epoch": 963} {"train_loss": -21.110876083374023, "global_step": 80004, "epoch": 963} {"train_loss": -21.419824600219727, "global_step": 80005, "epoch": 963} {"train_loss": -21.28314781188965, "global_step": 80006, "epoch": 963} {"train_loss": -21.284666061401367, "global_step": 80007, "epoch": 963} {"train_loss": -21.350473403930664, "global_step": 80008, "epoch": 963} {"train_loss": -21.024642944335938, "global_step": 80009, "epoch": 963} {"train_loss": -21.222776412963867, "global_step": 80010, "epoch": 963} {"train_loss": -21.18324537162321, "global_step": 80011, "epoch": 963, "val_loss": 6231501.0} {"train_loss": -21.25439453125, "global_step": 80012, "epoch": 964} {"train_loss": -20.96651268005371, "global_step": 80013, "epoch": 964} {"train_loss": -20.4075984954834, "global_step": 80014, "epoch": 964} {"train_loss": -20.83385467529297, "global_step": 80015, "epoch": 964} {"train_loss": -21.2417049407959, "global_step": 80016, "epoch": 964} {"train_loss": -20.497737884521484, "global_step": 80017, "epoch": 964} {"train_loss": -20.98395347595215, "global_step": 80018, "epoch": 964} {"train_loss": -21.000782012939453, "global_step": 80019, "epoch": 964} {"train_loss": -21.166181564331055, "global_step": 80020, "epoch": 964} {"train_loss": -21.43321990966797, "global_step": 80021, "epoch": 964} {"train_loss": -20.892324447631836, "global_step": 80022, "epoch": 964} {"train_loss": -21.27960205078125, "global_step": 80023, "epoch": 964} {"train_loss": -20.792959213256836, "global_step": 80024, "epoch": 964} {"train_loss": -20.974000930786133, "global_step": 80025, "epoch": 964} {"train_loss": -20.61482810974121, "global_step": 80026, "epoch": 964} {"train_loss": -20.915918350219727, "global_step": 80027, "epoch": 964} {"train_loss": -21.051513671875, "global_step": 80028, "epoch": 964} {"train_loss": -20.764698028564453, "global_step": 80029, "epoch": 964} {"train_loss": -21.264928817749023, "global_step": 80030, "epoch": 964} {"train_loss": -21.365203857421875, "global_step": 80031, "epoch": 964} {"train_loss": -21.307117462158203, "global_step": 80032, "epoch": 964} {"train_loss": -21.139707565307617, "global_step": 80033, "epoch": 964} {"train_loss": -21.352783203125, "global_step": 80034, "epoch": 964} {"train_loss": -21.341398239135742, "global_step": 80035, "epoch": 964} {"train_loss": -21.303743362426758, "global_step": 80036, "epoch": 964} {"train_loss": -21.144582748413086, "global_step": 80037, "epoch": 964} {"train_loss": -21.41904640197754, "global_step": 80038, "epoch": 964} {"train_loss": -21.065786361694336, "global_step": 80039, "epoch": 964} {"train_loss": -20.930587768554688, "global_step": 80040, "epoch": 964} {"train_loss": -21.221345901489258, "global_step": 80041, "epoch": 964} {"train_loss": -21.041784286499023, "global_step": 80042, "epoch": 964} {"train_loss": -21.334562301635742, "global_step": 80043, "epoch": 964} {"train_loss": -21.163150787353516, "global_step": 80044, "epoch": 964} {"train_loss": -21.232349395751953, "global_step": 80045, "epoch": 964} {"train_loss": -21.39528465270996, "global_step": 80046, "epoch": 964} {"train_loss": -20.682430267333984, "global_step": 80047, "epoch": 964} {"train_loss": -21.198453903198242, "global_step": 80048, "epoch": 964} {"train_loss": -21.297321319580078, "global_step": 80049, "epoch": 964} {"train_loss": -21.24652671813965, "global_step": 80050, "epoch": 964} {"train_loss": -21.204992294311523, "global_step": 80051, "epoch": 964} {"train_loss": -21.149656295776367, "global_step": 80052, "epoch": 964} {"train_loss": -21.18794059753418, "global_step": 80053, "epoch": 964} {"train_loss": -20.990720748901367, "global_step": 80054, "epoch": 964} {"train_loss": -21.305145263671875, "global_step": 80055, "epoch": 964} {"train_loss": -21.62325096130371, "global_step": 80056, "epoch": 964} {"train_loss": -21.17998695373535, "global_step": 80057, "epoch": 964} {"train_loss": -21.383682250976562, "global_step": 80058, "epoch": 964} {"train_loss": -21.18869972229004, "global_step": 80059, "epoch": 964} {"train_loss": -20.995391845703125, "global_step": 80060, "epoch": 964} {"train_loss": -21.22688102722168, "global_step": 80061, "epoch": 964} {"train_loss": -21.071849822998047, "global_step": 80062, "epoch": 964} {"train_loss": -21.009654998779297, "global_step": 80063, "epoch": 964} {"train_loss": -21.511062622070312, "global_step": 80064, "epoch": 964} {"train_loss": -21.106355667114258, "global_step": 80065, "epoch": 964} {"train_loss": -21.098026275634766, "global_step": 80066, "epoch": 964} {"train_loss": -20.95378303527832, "global_step": 80067, "epoch": 964} {"train_loss": -21.308094024658203, "global_step": 80068, "epoch": 964} {"train_loss": -21.373477935791016, "global_step": 80069, "epoch": 964} {"train_loss": -21.377099990844727, "global_step": 80070, "epoch": 964} {"train_loss": -21.07343864440918, "global_step": 80071, "epoch": 964} {"train_loss": -21.21754264831543, "global_step": 80072, "epoch": 964} {"train_loss": -21.31876564025879, "global_step": 80073, "epoch": 964} {"train_loss": -21.144329071044922, "global_step": 80074, "epoch": 964} {"train_loss": -21.09783935546875, "global_step": 80075, "epoch": 964} {"train_loss": -21.371288299560547, "global_step": 80076, "epoch": 964} {"train_loss": -21.288606643676758, "global_step": 80077, "epoch": 964} {"train_loss": -21.5830078125, "global_step": 80078, "epoch": 964} {"train_loss": -21.312284469604492, "global_step": 80079, "epoch": 964} {"train_loss": -21.43951416015625, "global_step": 80080, "epoch": 964} {"train_loss": -21.296823501586914, "global_step": 80081, "epoch": 964} {"train_loss": -21.324621200561523, "global_step": 80082, "epoch": 964} {"train_loss": -21.09921646118164, "global_step": 80083, "epoch": 964} {"train_loss": -21.53837013244629, "global_step": 80084, "epoch": 964} {"train_loss": -20.967817306518555, "global_step": 80085, "epoch": 964} {"train_loss": -20.93726348876953, "global_step": 80086, "epoch": 964} {"train_loss": -21.4062442779541, "global_step": 80087, "epoch": 964} {"train_loss": -20.974401473999023, "global_step": 80088, "epoch": 964} {"train_loss": -21.09138298034668, "global_step": 80089, "epoch": 964} {"train_loss": -20.862295150756836, "global_step": 80090, "epoch": 964} {"train_loss": -21.03337287902832, "global_step": 80091, "epoch": 964} {"train_loss": -21.156354904174805, "global_step": 80092, "epoch": 964} {"train_loss": -21.312543869018555, "global_step": 80093, "epoch": 964} {"train_loss": -21.165378593536744, "global_step": 80094, "epoch": 964, "val_loss": 5968646.5} {"train_loss": -20.90838050842285, "global_step": 80095, "epoch": 965} {"train_loss": -20.756134033203125, "global_step": 80096, "epoch": 965} {"train_loss": -20.724702835083008, "global_step": 80097, "epoch": 965} {"train_loss": -20.611242294311523, "global_step": 80098, "epoch": 965} {"train_loss": -20.918241500854492, "global_step": 80099, "epoch": 965} {"train_loss": -20.923059463500977, "global_step": 80100, "epoch": 965} {"train_loss": -21.234447479248047, "global_step": 80101, "epoch": 965} {"train_loss": -20.90688133239746, "global_step": 80102, "epoch": 965} {"train_loss": -21.225553512573242, "global_step": 80103, "epoch": 965} {"train_loss": -20.89927101135254, "global_step": 80104, "epoch": 965} {"train_loss": -20.886579513549805, "global_step": 80105, "epoch": 965} {"train_loss": -21.2913818359375, "global_step": 80106, "epoch": 965} {"train_loss": -21.142635345458984, "global_step": 80107, "epoch": 965} {"train_loss": -21.451704025268555, "global_step": 80108, "epoch": 965} {"train_loss": -21.29925537109375, "global_step": 80109, "epoch": 965} {"train_loss": -21.365863800048828, "global_step": 80110, "epoch": 965} {"train_loss": -20.82284164428711, "global_step": 80111, "epoch": 965} {"train_loss": -20.856552124023438, "global_step": 80112, "epoch": 965} {"train_loss": -20.85587501525879, "global_step": 80113, "epoch": 965} {"train_loss": -21.15411949157715, "global_step": 80114, "epoch": 965} {"train_loss": -21.610509872436523, "global_step": 80115, "epoch": 965} {"train_loss": -21.28498077392578, "global_step": 80116, "epoch": 965} {"train_loss": -21.21611976623535, "global_step": 80117, "epoch": 965} {"train_loss": -20.93138313293457, "global_step": 80118, "epoch": 965} {"train_loss": -21.381942749023438, "global_step": 80119, "epoch": 965} {"train_loss": -21.241933822631836, "global_step": 80120, "epoch": 965} {"train_loss": -20.646989822387695, "global_step": 80121, "epoch": 965} {"train_loss": -21.19138526916504, "global_step": 80122, "epoch": 965} {"train_loss": -20.985090255737305, "global_step": 80123, "epoch": 965} {"train_loss": -21.033065795898438, "global_step": 80124, "epoch": 965} {"train_loss": -21.349388122558594, "global_step": 80125, "epoch": 965} {"train_loss": -21.05219078063965, "global_step": 80126, "epoch": 965} {"train_loss": -21.403860092163086, "global_step": 80127, "epoch": 965} {"train_loss": -21.35621452331543, "global_step": 80128, "epoch": 965} {"train_loss": -20.874265670776367, "global_step": 80129, "epoch": 965} {"train_loss": -21.212614059448242, "global_step": 80130, "epoch": 965} {"train_loss": -21.544811248779297, "global_step": 80131, "epoch": 965} {"train_loss": -21.354055404663086, "global_step": 80132, "epoch": 965} {"train_loss": -21.243803024291992, "global_step": 80133, "epoch": 965} {"train_loss": -21.547443389892578, "global_step": 80134, "epoch": 965} {"train_loss": -21.074922561645508, "global_step": 80135, "epoch": 965} {"train_loss": -21.403676986694336, "global_step": 80136, "epoch": 965} {"train_loss": -21.236974716186523, "global_step": 80137, "epoch": 965} {"train_loss": -21.581928253173828, "global_step": 80138, "epoch": 965} {"train_loss": -21.11187171936035, "global_step": 80139, "epoch": 965} {"train_loss": -21.16767692565918, "global_step": 80140, "epoch": 965} {"train_loss": -20.980224609375, "global_step": 80141, "epoch": 965} {"train_loss": -21.168819427490234, "global_step": 80142, "epoch": 965} {"train_loss": -21.411762237548828, "global_step": 80143, "epoch": 965} {"train_loss": -21.106403350830078, "global_step": 80144, "epoch": 965} {"train_loss": -21.463991165161133, "global_step": 80145, "epoch": 965} {"train_loss": -21.085412979125977, "global_step": 80146, "epoch": 965} {"train_loss": -21.403364181518555, "global_step": 80147, "epoch": 965} {"train_loss": -21.430654525756836, "global_step": 80148, "epoch": 965} {"train_loss": -21.104520797729492, "global_step": 80149, "epoch": 965} {"train_loss": -21.534250259399414, "global_step": 80150, "epoch": 965} {"train_loss": -21.497724533081055, "global_step": 80151, "epoch": 965} {"train_loss": -21.06134033203125, "global_step": 80152, "epoch": 965} {"train_loss": -21.626813888549805, "global_step": 80153, "epoch": 965} {"train_loss": -21.25335121154785, "global_step": 80154, "epoch": 965} {"train_loss": -21.081846237182617, "global_step": 80155, "epoch": 965} {"train_loss": -21.425588607788086, "global_step": 80156, "epoch": 965} {"train_loss": -21.21541404724121, "global_step": 80157, "epoch": 965} {"train_loss": -21.26381492614746, "global_step": 80158, "epoch": 965} {"train_loss": -21.333810806274414, "global_step": 80159, "epoch": 965} {"train_loss": -21.435834884643555, "global_step": 80160, "epoch": 965} {"train_loss": -21.222368240356445, "global_step": 80161, "epoch": 965} {"train_loss": -21.51363182067871, "global_step": 80162, "epoch": 965} {"train_loss": -21.370197296142578, "global_step": 80163, "epoch": 965} {"train_loss": -21.235532760620117, "global_step": 80164, "epoch": 965} {"train_loss": -21.368316650390625, "global_step": 80165, "epoch": 965} {"train_loss": -21.565710067749023, "global_step": 80166, "epoch": 965} {"train_loss": -21.420278549194336, "global_step": 80167, "epoch": 965} {"train_loss": -21.126258850097656, "global_step": 80168, "epoch": 965} {"train_loss": -21.45828628540039, "global_step": 80169, "epoch": 965} {"train_loss": -21.124326705932617, "global_step": 80170, "epoch": 965} {"train_loss": -21.58418846130371, "global_step": 80171, "epoch": 965} {"train_loss": -21.077150344848633, "global_step": 80172, "epoch": 965} {"train_loss": -21.215229034423828, "global_step": 80173, "epoch": 965} {"train_loss": -21.239831924438477, "global_step": 80174, "epoch": 965} {"train_loss": -21.12296485900879, "global_step": 80175, "epoch": 965} {"train_loss": -21.103666305541992, "global_step": 80176, "epoch": 965} {"train_loss": -21.20947277115052, "global_step": 80177, "epoch": 965, "val_loss": 6091729.5} {"train_loss": -20.866256713867188, "global_step": 80178, "epoch": 966} {"train_loss": -21.101234436035156, "global_step": 80179, "epoch": 966} {"train_loss": -21.181928634643555, "global_step": 80180, "epoch": 966} {"train_loss": -21.290800094604492, "global_step": 80181, "epoch": 966} {"train_loss": -21.1717472076416, "global_step": 80182, "epoch": 966} {"train_loss": -21.188291549682617, "global_step": 80183, "epoch": 966} {"train_loss": -21.092782974243164, "global_step": 80184, "epoch": 966} {"train_loss": -21.262548446655273, "global_step": 80185, "epoch": 966} {"train_loss": -20.966888427734375, "global_step": 80186, "epoch": 966} {"train_loss": -21.319093704223633, "global_step": 80187, "epoch": 966} {"train_loss": -21.2933292388916, "global_step": 80188, "epoch": 966} {"train_loss": -21.159210205078125, "global_step": 80189, "epoch": 966} {"train_loss": -21.20224380493164, "global_step": 80190, "epoch": 966} {"train_loss": -21.27288246154785, "global_step": 80191, "epoch": 966} {"train_loss": -21.18505859375, "global_step": 80192, "epoch": 966} {"train_loss": -21.29521369934082, "global_step": 80193, "epoch": 966} {"train_loss": -21.492795944213867, "global_step": 80194, "epoch": 966} {"train_loss": -21.013452529907227, "global_step": 80195, "epoch": 966} {"train_loss": -21.247617721557617, "global_step": 80196, "epoch": 966} {"train_loss": -21.18825340270996, "global_step": 80197, "epoch": 966} {"train_loss": -21.078083038330078, "global_step": 80198, "epoch": 966} {"train_loss": -21.315078735351562, "global_step": 80199, "epoch": 966} {"train_loss": -21.30500602722168, "global_step": 80200, "epoch": 966} {"train_loss": -21.4717960357666, "global_step": 80201, "epoch": 966} {"train_loss": -21.655752182006836, "global_step": 80202, "epoch": 966} {"train_loss": -21.35085105895996, "global_step": 80203, "epoch": 966} {"train_loss": -21.74635124206543, "global_step": 80204, "epoch": 966} {"train_loss": -21.18311882019043, "global_step": 80205, "epoch": 966} {"train_loss": -21.395477294921875, "global_step": 80206, "epoch": 966} {"train_loss": -21.273832321166992, "global_step": 80207, "epoch": 966} {"train_loss": -20.87506675720215, "global_step": 80208, "epoch": 966} {"train_loss": -21.078582763671875, "global_step": 80209, "epoch": 966} {"train_loss": -21.06976318359375, "global_step": 80210, "epoch": 966} {"train_loss": -20.767297744750977, "global_step": 80211, "epoch": 966} {"train_loss": -21.020023345947266, "global_step": 80212, "epoch": 966} {"train_loss": -21.53785514831543, "global_step": 80213, "epoch": 966} {"train_loss": -21.532522201538086, "global_step": 80214, "epoch": 966} {"train_loss": -21.278284072875977, "global_step": 80215, "epoch": 966} {"train_loss": -21.391267776489258, "global_step": 80216, "epoch": 966} {"train_loss": -20.931562423706055, "global_step": 80217, "epoch": 966} {"train_loss": -21.263015747070312, "global_step": 80218, "epoch": 966} {"train_loss": -21.037433624267578, "global_step": 80219, "epoch": 966} {"train_loss": -20.743680953979492, "global_step": 80220, "epoch": 966} {"train_loss": -21.07411766052246, "global_step": 80221, "epoch": 966} {"train_loss": -21.157527923583984, "global_step": 80222, "epoch": 966} {"train_loss": -21.20581817626953, "global_step": 80223, "epoch": 966} {"train_loss": -21.261594772338867, "global_step": 80224, "epoch": 966} {"train_loss": -20.958831787109375, "global_step": 80225, "epoch": 966} {"train_loss": -21.771503448486328, "global_step": 80226, "epoch": 966} {"train_loss": -21.759458541870117, "global_step": 80227, "epoch": 966} {"train_loss": -21.548280715942383, "global_step": 80228, "epoch": 966} {"train_loss": -20.662992477416992, "global_step": 80229, "epoch": 966} {"train_loss": -21.16822624206543, "global_step": 80230, "epoch": 966} {"train_loss": -20.597082138061523, "global_step": 80231, "epoch": 966} {"train_loss": -21.266576766967773, "global_step": 80232, "epoch": 966} {"train_loss": -20.93938636779785, "global_step": 80233, "epoch": 966} {"train_loss": -21.09872055053711, "global_step": 80234, "epoch": 966} {"train_loss": -20.921537399291992, "global_step": 80235, "epoch": 966} {"train_loss": -20.803739547729492, "global_step": 80236, "epoch": 966} {"train_loss": -20.874399185180664, "global_step": 80237, "epoch": 966} {"train_loss": -21.50946617126465, "global_step": 80238, "epoch": 966} {"train_loss": -20.848745346069336, "global_step": 80239, "epoch": 966} {"train_loss": -21.263137817382812, "global_step": 80240, "epoch": 966} {"train_loss": -21.127416610717773, "global_step": 80241, "epoch": 966} {"train_loss": -21.590030670166016, "global_step": 80242, "epoch": 966} {"train_loss": -20.812612533569336, "global_step": 80243, "epoch": 966} {"train_loss": -21.366819381713867, "global_step": 80244, "epoch": 966} {"train_loss": -21.39322853088379, "global_step": 80245, "epoch": 966} {"train_loss": -21.073965072631836, "global_step": 80246, "epoch": 966} {"train_loss": -21.08688735961914, "global_step": 80247, "epoch": 966} {"train_loss": -21.220504760742188, "global_step": 80248, "epoch": 966} {"train_loss": -20.949384689331055, "global_step": 80249, "epoch": 966} {"train_loss": -21.116519927978516, "global_step": 80250, "epoch": 966} {"train_loss": -21.415151596069336, "global_step": 80251, "epoch": 966} {"train_loss": -21.123014450073242, "global_step": 80252, "epoch": 966} {"train_loss": -21.486610412597656, "global_step": 80253, "epoch": 966} {"train_loss": -20.86139488220215, "global_step": 80254, "epoch": 966} {"train_loss": -20.76317024230957, "global_step": 80255, "epoch": 966} {"train_loss": -21.30852508544922, "global_step": 80256, "epoch": 966} {"train_loss": -21.149595260620117, "global_step": 80257, "epoch": 966} {"train_loss": -21.282485961914062, "global_step": 80258, "epoch": 966} {"train_loss": -21.15937042236328, "global_step": 80259, "epoch": 966} {"train_loss": -21.17792538562453, "global_step": 80260, "epoch": 966, "val_loss": 5928835.5} {"train_loss": -20.96792221069336, "global_step": 80261, "epoch": 967} {"train_loss": -20.817148208618164, "global_step": 80262, "epoch": 967} {"train_loss": -20.657852172851562, "global_step": 80263, "epoch": 967} {"train_loss": -20.492294311523438, "global_step": 80264, "epoch": 967} {"train_loss": -21.075714111328125, "global_step": 80265, "epoch": 967} {"train_loss": -20.656225204467773, "global_step": 80266, "epoch": 967} {"train_loss": -20.527257919311523, "global_step": 80267, "epoch": 967} {"train_loss": -20.844715118408203, "global_step": 80268, "epoch": 967} {"train_loss": -20.962615966796875, "global_step": 80269, "epoch": 967} {"train_loss": -20.63180923461914, "global_step": 80270, "epoch": 967} {"train_loss": -21.07494354248047, "global_step": 80271, "epoch": 967} {"train_loss": -21.027637481689453, "global_step": 80272, "epoch": 967} {"train_loss": -20.881332397460938, "global_step": 80273, "epoch": 967} {"train_loss": -21.003244400024414, "global_step": 80274, "epoch": 967} {"train_loss": -21.087665557861328, "global_step": 80275, "epoch": 967} {"train_loss": -21.285642623901367, "global_step": 80276, "epoch": 967} {"train_loss": -20.8686466217041, "global_step": 80277, "epoch": 967} {"train_loss": -20.976776123046875, "global_step": 80278, "epoch": 967} {"train_loss": -21.21061134338379, "global_step": 80279, "epoch": 967} {"train_loss": -21.09714126586914, "global_step": 80280, "epoch": 967} {"train_loss": -21.119937896728516, "global_step": 80281, "epoch": 967} {"train_loss": -21.19501304626465, "global_step": 80282, "epoch": 967} {"train_loss": -21.10671043395996, "global_step": 80283, "epoch": 967} {"train_loss": -21.036670684814453, "global_step": 80284, "epoch": 967} {"train_loss": -21.363571166992188, "global_step": 80285, "epoch": 967} {"train_loss": -21.231292724609375, "global_step": 80286, "epoch": 967} {"train_loss": -21.647907257080078, "global_step": 80287, "epoch": 967} {"train_loss": -21.197935104370117, "global_step": 80288, "epoch": 967} {"train_loss": -21.27229118347168, "global_step": 80289, "epoch": 967} {"train_loss": -21.0, "global_step": 80290, "epoch": 967} {"train_loss": -21.39813804626465, "global_step": 80291, "epoch": 967} {"train_loss": -21.169340133666992, "global_step": 80292, "epoch": 967} {"train_loss": -21.288860321044922, "global_step": 80293, "epoch": 967} {"train_loss": -21.280956268310547, "global_step": 80294, "epoch": 967} {"train_loss": -21.309091567993164, "global_step": 80295, "epoch": 967} {"train_loss": -21.335418701171875, "global_step": 80296, "epoch": 967} {"train_loss": -21.292407989501953, "global_step": 80297, "epoch": 967} {"train_loss": -21.68929672241211, "global_step": 80298, "epoch": 967} {"train_loss": -21.212522506713867, "global_step": 80299, "epoch": 967} {"train_loss": -21.02164077758789, "global_step": 80300, "epoch": 967} {"train_loss": -20.856910705566406, "global_step": 80301, "epoch": 967} {"train_loss": -21.08199119567871, "global_step": 80302, "epoch": 967} {"train_loss": -21.07822036743164, "global_step": 80303, "epoch": 967} {"train_loss": -21.304059982299805, "global_step": 80304, "epoch": 967} {"train_loss": -21.446842193603516, "global_step": 80305, "epoch": 967} {"train_loss": -21.002138137817383, "global_step": 80306, "epoch": 967} {"train_loss": -21.584699630737305, "global_step": 80307, "epoch": 967} {"train_loss": -20.877965927124023, "global_step": 80308, "epoch": 967} {"train_loss": -21.149133682250977, "global_step": 80309, "epoch": 967} {"train_loss": -21.524686813354492, "global_step": 80310, "epoch": 967} {"train_loss": -21.282140731811523, "global_step": 80311, "epoch": 967} {"train_loss": -21.061203002929688, "global_step": 80312, "epoch": 967} {"train_loss": -20.986679077148438, "global_step": 80313, "epoch": 967} {"train_loss": -21.366247177124023, "global_step": 80314, "epoch": 967} {"train_loss": -21.171735763549805, "global_step": 80315, "epoch": 967} {"train_loss": -21.462636947631836, "global_step": 80316, "epoch": 967} {"train_loss": -21.42726707458496, "global_step": 80317, "epoch": 967} {"train_loss": -21.610471725463867, "global_step": 80318, "epoch": 967} {"train_loss": -20.73477554321289, "global_step": 80319, "epoch": 967} {"train_loss": -21.3901424407959, "global_step": 80320, "epoch": 967} {"train_loss": -20.957059860229492, "global_step": 80321, "epoch": 967} {"train_loss": -21.205076217651367, "global_step": 80322, "epoch": 967} {"train_loss": -20.989826202392578, "global_step": 80323, "epoch": 967} {"train_loss": -21.1740779876709, "global_step": 80324, "epoch": 967} {"train_loss": -20.812957763671875, "global_step": 80325, "epoch": 967} {"train_loss": -20.895456314086914, "global_step": 80326, "epoch": 967} {"train_loss": -21.237157821655273, "global_step": 80327, "epoch": 967} {"train_loss": -20.692533493041992, "global_step": 80328, "epoch": 967} {"train_loss": -21.02545738220215, "global_step": 80329, "epoch": 967} {"train_loss": -20.88361358642578, "global_step": 80330, "epoch": 967} {"train_loss": -21.193937301635742, "global_step": 80331, "epoch": 967} {"train_loss": -21.21565818786621, "global_step": 80332, "epoch": 967} {"train_loss": -21.41383934020996, "global_step": 80333, "epoch": 967} {"train_loss": -21.630035400390625, "global_step": 80334, "epoch": 967} {"train_loss": -21.38837432861328, "global_step": 80335, "epoch": 967} {"train_loss": -21.15285301208496, "global_step": 80336, "epoch": 967} {"train_loss": -21.4840145111084, "global_step": 80337, "epoch": 967} {"train_loss": -21.57312774658203, "global_step": 80338, "epoch": 967} {"train_loss": -21.200986862182617, "global_step": 80339, "epoch": 967} {"train_loss": -21.29041862487793, "global_step": 80340, "epoch": 967} {"train_loss": -21.080081939697266, "global_step": 80341, "epoch": 967} {"train_loss": -21.410633087158203, "global_step": 80342, "epoch": 967} {"train_loss": -21.1164390150323, "global_step": 80343, "epoch": 967, "val_loss": 5948663.0} {"train_loss": -20.861391067504883, "global_step": 80344, "epoch": 968} {"train_loss": -21.230493545532227, "global_step": 80345, "epoch": 968} {"train_loss": -21.260013580322266, "global_step": 80346, "epoch": 968} {"train_loss": -20.96818733215332, "global_step": 80347, "epoch": 968} {"train_loss": -21.092668533325195, "global_step": 80348, "epoch": 968} {"train_loss": -21.033552169799805, "global_step": 80349, "epoch": 968} {"train_loss": -21.025114059448242, "global_step": 80350, "epoch": 968} {"train_loss": -21.506261825561523, "global_step": 80351, "epoch": 968} {"train_loss": -21.038496017456055, "global_step": 80352, "epoch": 968} {"train_loss": -21.261423110961914, "global_step": 80353, "epoch": 968} {"train_loss": -21.272329330444336, "global_step": 80354, "epoch": 968} {"train_loss": -20.7587833404541, "global_step": 80355, "epoch": 968} {"train_loss": -20.8906192779541, "global_step": 80356, "epoch": 968} {"train_loss": -21.007917404174805, "global_step": 80357, "epoch": 968} {"train_loss": -21.014429092407227, "global_step": 80358, "epoch": 968} {"train_loss": -21.70110321044922, "global_step": 80359, "epoch": 968} {"train_loss": -21.221288681030273, "global_step": 80360, "epoch": 968} {"train_loss": -21.56971549987793, "global_step": 80361, "epoch": 968} {"train_loss": -21.1707763671875, "global_step": 80362, "epoch": 968} {"train_loss": -21.705270767211914, "global_step": 80363, "epoch": 968} {"train_loss": -21.504955291748047, "global_step": 80364, "epoch": 968} {"train_loss": -21.12456703186035, "global_step": 80365, "epoch": 968} {"train_loss": -21.101062774658203, "global_step": 80366, "epoch": 968} {"train_loss": -21.360055923461914, "global_step": 80367, "epoch": 968} {"train_loss": -21.479162216186523, "global_step": 80368, "epoch": 968} {"train_loss": -21.103147506713867, "global_step": 80369, "epoch": 968} {"train_loss": -20.825481414794922, "global_step": 80370, "epoch": 968} {"train_loss": -21.233991622924805, "global_step": 80371, "epoch": 968} {"train_loss": -21.21368980407715, "global_step": 80372, "epoch": 968} {"train_loss": -21.196823120117188, "global_step": 80373, "epoch": 968} {"train_loss": -20.997310638427734, "global_step": 80374, "epoch": 968} {"train_loss": -21.347965240478516, "global_step": 80375, "epoch": 968} {"train_loss": -21.064584732055664, "global_step": 80376, "epoch": 968} {"train_loss": -21.176546096801758, "global_step": 80377, "epoch": 968} {"train_loss": -21.27528953552246, "global_step": 80378, "epoch": 968} {"train_loss": -21.330184936523438, "global_step": 80379, "epoch": 968} {"train_loss": -21.102115631103516, "global_step": 80380, "epoch": 968} {"train_loss": -21.062171936035156, "global_step": 80381, "epoch": 968} {"train_loss": -20.977346420288086, "global_step": 80382, "epoch": 968} {"train_loss": -21.352806091308594, "global_step": 80383, "epoch": 968} {"train_loss": -21.34632682800293, "global_step": 80384, "epoch": 968} {"train_loss": -20.86775016784668, "global_step": 80385, "epoch": 968} {"train_loss": -21.422321319580078, "global_step": 80386, "epoch": 968} {"train_loss": -21.658842086791992, "global_step": 80387, "epoch": 968} {"train_loss": -21.25907325744629, "global_step": 80388, "epoch": 968} {"train_loss": -21.412145614624023, "global_step": 80389, "epoch": 968} {"train_loss": -21.364200592041016, "global_step": 80390, "epoch": 968} {"train_loss": -21.091440200805664, "global_step": 80391, "epoch": 968} {"train_loss": -21.124082565307617, "global_step": 80392, "epoch": 968} {"train_loss": -21.376766204833984, "global_step": 80393, "epoch": 968} {"train_loss": -21.45716667175293, "global_step": 80394, "epoch": 968} {"train_loss": -21.08099365234375, "global_step": 80395, "epoch": 968} {"train_loss": -21.091398239135742, "global_step": 80396, "epoch": 968} {"train_loss": -21.187808990478516, "global_step": 80397, "epoch": 968} {"train_loss": -21.21378517150879, "global_step": 80398, "epoch": 968} {"train_loss": -20.821420669555664, "global_step": 80399, "epoch": 968} {"train_loss": -21.224828720092773, "global_step": 80400, "epoch": 968} {"train_loss": -21.398401260375977, "global_step": 80401, "epoch": 968} {"train_loss": -21.129413604736328, "global_step": 80402, "epoch": 968} {"train_loss": -20.659292221069336, "global_step": 80403, "epoch": 968} {"train_loss": -21.26943016052246, "global_step": 80404, "epoch": 968} {"train_loss": -21.20588493347168, "global_step": 80405, "epoch": 968} {"train_loss": -21.097774505615234, "global_step": 80406, "epoch": 968} {"train_loss": -21.170034408569336, "global_step": 80407, "epoch": 968} {"train_loss": -21.488740921020508, "global_step": 80408, "epoch": 968} {"train_loss": -21.2724552154541, "global_step": 80409, "epoch": 968} {"train_loss": -21.308521270751953, "global_step": 80410, "epoch": 968} {"train_loss": -21.38329315185547, "global_step": 80411, "epoch": 968} {"train_loss": -20.820810317993164, "global_step": 80412, "epoch": 968} {"train_loss": -20.99860954284668, "global_step": 80413, "epoch": 968} {"train_loss": -21.572477340698242, "global_step": 80414, "epoch": 968} {"train_loss": -21.355403900146484, "global_step": 80415, "epoch": 968} {"train_loss": -21.53706932067871, "global_step": 80416, "epoch": 968} {"train_loss": -21.429813385009766, "global_step": 80417, "epoch": 968} {"train_loss": -21.09325408935547, "global_step": 80418, "epoch": 968} {"train_loss": -21.01384735107422, "global_step": 80419, "epoch": 968} {"train_loss": -21.25786781311035, "global_step": 80420, "epoch": 968} {"train_loss": -20.865079879760742, "global_step": 80421, "epoch": 968} {"train_loss": -21.25104331970215, "global_step": 80422, "epoch": 968} {"train_loss": -21.439529418945312, "global_step": 80423, "epoch": 968} {"train_loss": -21.569128036499023, "global_step": 80424, "epoch": 968} {"train_loss": -21.174840927124023, "global_step": 80425, "epoch": 968} {"train_loss": -21.220874119953937, "global_step": 80426, "epoch": 968, "val_loss": 6145846.0} {"train_loss": -20.348892211914062, "global_step": 80427, "epoch": 969} {"train_loss": -20.41756248474121, "global_step": 80428, "epoch": 969} {"train_loss": -20.63071632385254, "global_step": 80429, "epoch": 969} {"train_loss": -20.82520866394043, "global_step": 80430, "epoch": 969} {"train_loss": -20.4895076751709, "global_step": 80431, "epoch": 969} {"train_loss": -20.953393936157227, "global_step": 80432, "epoch": 969} {"train_loss": -20.44539451599121, "global_step": 80433, "epoch": 969} {"train_loss": -20.612632751464844, "global_step": 80434, "epoch": 969} {"train_loss": -20.956876754760742, "global_step": 80435, "epoch": 969} {"train_loss": -20.959836959838867, "global_step": 80436, "epoch": 969} {"train_loss": -20.718067169189453, "global_step": 80437, "epoch": 969} {"train_loss": -20.69937515258789, "global_step": 80438, "epoch": 969} {"train_loss": -20.866750717163086, "global_step": 80439, "epoch": 969} {"train_loss": -20.9099178314209, "global_step": 80440, "epoch": 969} {"train_loss": -21.21797752380371, "global_step": 80441, "epoch": 969} {"train_loss": -21.002445220947266, "global_step": 80442, "epoch": 969} {"train_loss": -20.90675926208496, "global_step": 80443, "epoch": 969} {"train_loss": -20.887666702270508, "global_step": 80444, "epoch": 969} {"train_loss": -21.179197311401367, "global_step": 80445, "epoch": 969} {"train_loss": -20.96271324157715, "global_step": 80446, "epoch": 969} {"train_loss": -21.313140869140625, "global_step": 80447, "epoch": 969} {"train_loss": -20.966894149780273, "global_step": 80448, "epoch": 969} {"train_loss": -20.93606948852539, "global_step": 80449, "epoch": 969} {"train_loss": -21.009668350219727, "global_step": 80450, "epoch": 969} {"train_loss": -21.175268173217773, "global_step": 80451, "epoch": 969} {"train_loss": -21.155771255493164, "global_step": 80452, "epoch": 969} {"train_loss": -21.028268814086914, "global_step": 80453, "epoch": 969} {"train_loss": -21.29745864868164, "global_step": 80454, "epoch": 969} {"train_loss": -20.849597930908203, "global_step": 80455, "epoch": 969} {"train_loss": -21.778635025024414, "global_step": 80456, "epoch": 969} {"train_loss": -20.739395141601562, "global_step": 80457, "epoch": 969} {"train_loss": -21.244001388549805, "global_step": 80458, "epoch": 969} {"train_loss": -21.378992080688477, "global_step": 80459, "epoch": 969} {"train_loss": -21.11885643005371, "global_step": 80460, "epoch": 969} {"train_loss": -21.159406661987305, "global_step": 80461, "epoch": 969} {"train_loss": -21.544307708740234, "global_step": 80462, "epoch": 969} {"train_loss": -20.88397216796875, "global_step": 80463, "epoch": 969} {"train_loss": -21.26340103149414, "global_step": 80464, "epoch": 969} {"train_loss": -21.555803298950195, "global_step": 80465, "epoch": 969} {"train_loss": -21.28035545349121, "global_step": 80466, "epoch": 969} {"train_loss": -21.459171295166016, "global_step": 80467, "epoch": 969} {"train_loss": -21.195236206054688, "global_step": 80468, "epoch": 969} {"train_loss": -20.93781852722168, "global_step": 80469, "epoch": 969} {"train_loss": -21.492115020751953, "global_step": 80470, "epoch": 969} {"train_loss": -21.337787628173828, "global_step": 80471, "epoch": 969} {"train_loss": -20.960561752319336, "global_step": 80472, "epoch": 969} {"train_loss": -21.030622482299805, "global_step": 80473, "epoch": 969} {"train_loss": -21.317455291748047, "global_step": 80474, "epoch": 969} {"train_loss": -21.2984561920166, "global_step": 80475, "epoch": 969} {"train_loss": -21.204442977905273, "global_step": 80476, "epoch": 969} {"train_loss": -21.414457321166992, "global_step": 80477, "epoch": 969} {"train_loss": -21.33578109741211, "global_step": 80478, "epoch": 969} {"train_loss": -21.418682098388672, "global_step": 80479, "epoch": 969} {"train_loss": -21.242664337158203, "global_step": 80480, "epoch": 969} {"train_loss": -21.28182029724121, "global_step": 80481, "epoch": 969} {"train_loss": -20.8870849609375, "global_step": 80482, "epoch": 969} {"train_loss": -21.05521011352539, "global_step": 80483, "epoch": 969} {"train_loss": -21.354169845581055, "global_step": 80484, "epoch": 969} {"train_loss": -21.208059310913086, "global_step": 80485, "epoch": 969} {"train_loss": -21.05728530883789, "global_step": 80486, "epoch": 969} {"train_loss": -21.39746856689453, "global_step": 80487, "epoch": 969} {"train_loss": -21.234182357788086, "global_step": 80488, "epoch": 969} {"train_loss": -21.159473419189453, "global_step": 80489, "epoch": 969} {"train_loss": -21.203527450561523, "global_step": 80490, "epoch": 969} {"train_loss": -20.97456932067871, "global_step": 80491, "epoch": 969} {"train_loss": -21.510480880737305, "global_step": 80492, "epoch": 969} {"train_loss": -20.936304092407227, "global_step": 80493, "epoch": 969} {"train_loss": -21.267011642456055, "global_step": 80494, "epoch": 969} {"train_loss": -21.114482879638672, "global_step": 80495, "epoch": 969} {"train_loss": -21.421457290649414, "global_step": 80496, "epoch": 969} {"train_loss": -20.795936584472656, "global_step": 80497, "epoch": 969} {"train_loss": -21.219091415405273, "global_step": 80498, "epoch": 969} {"train_loss": -21.377363204956055, "global_step": 80499, "epoch": 969} {"train_loss": -21.24948501586914, "global_step": 80500, "epoch": 969} {"train_loss": -21.36899757385254, "global_step": 80501, "epoch": 969} {"train_loss": -21.421964645385742, "global_step": 80502, "epoch": 969} {"train_loss": -21.384056091308594, "global_step": 80503, "epoch": 969} {"train_loss": -21.055334091186523, "global_step": 80504, "epoch": 969} {"train_loss": -21.492027282714844, "global_step": 80505, "epoch": 969} {"train_loss": -21.403213500976562, "global_step": 80506, "epoch": 969} {"train_loss": -21.270639419555664, "global_step": 80507, "epoch": 969} {"train_loss": -21.328706741333008, "global_step": 80508, "epoch": 969} {"train_loss": -21.127238974513777, "global_step": 80509, "epoch": 969, "val_loss": 5998686.5} {"train_loss": -19.372045516967773, "global_step": 80510, "epoch": 970} {"train_loss": -20.75604820251465, "global_step": 80511, "epoch": 970} {"train_loss": -20.178876876831055, "global_step": 80512, "epoch": 970} {"train_loss": -20.8901424407959, "global_step": 80513, "epoch": 970} {"train_loss": -20.253793716430664, "global_step": 80514, "epoch": 970} {"train_loss": -20.566614151000977, "global_step": 80515, "epoch": 970} {"train_loss": -20.6949520111084, "global_step": 80516, "epoch": 970} {"train_loss": -20.58553123474121, "global_step": 80517, "epoch": 970} {"train_loss": -20.420881271362305, "global_step": 80518, "epoch": 970} {"train_loss": -20.378263473510742, "global_step": 80519, "epoch": 970} {"train_loss": -20.678607940673828, "global_step": 80520, "epoch": 970} {"train_loss": -20.639257431030273, "global_step": 80521, "epoch": 970} {"train_loss": -20.820798873901367, "global_step": 80522, "epoch": 970} {"train_loss": -20.644617080688477, "global_step": 80523, "epoch": 970} {"train_loss": -20.590782165527344, "global_step": 80524, "epoch": 970} {"train_loss": -20.49930191040039, "global_step": 80525, "epoch": 970} {"train_loss": -20.415830612182617, "global_step": 80526, "epoch": 970} {"train_loss": -20.797945022583008, "global_step": 80527, "epoch": 970} {"train_loss": -20.508207321166992, "global_step": 80528, "epoch": 970} {"train_loss": -20.830907821655273, "global_step": 80529, "epoch": 970} {"train_loss": -21.1044864654541, "global_step": 80530, "epoch": 970} {"train_loss": -20.877765655517578, "global_step": 80531, "epoch": 970} {"train_loss": -21.210922241210938, "global_step": 80532, "epoch": 970} {"train_loss": -20.661041259765625, "global_step": 80533, "epoch": 970} {"train_loss": -21.36639976501465, "global_step": 80534, "epoch": 970} {"train_loss": -21.210830688476562, "global_step": 80535, "epoch": 970} {"train_loss": -21.11790657043457, "global_step": 80536, "epoch": 970} {"train_loss": -21.27449607849121, "global_step": 80537, "epoch": 970} {"train_loss": -21.009979248046875, "global_step": 80538, "epoch": 970} {"train_loss": -21.44765281677246, "global_step": 80539, "epoch": 970} {"train_loss": -21.08652687072754, "global_step": 80540, "epoch": 970} {"train_loss": -21.45794677734375, "global_step": 80541, "epoch": 970} {"train_loss": -21.439584732055664, "global_step": 80542, "epoch": 970} {"train_loss": -21.1888370513916, "global_step": 80543, "epoch": 970} {"train_loss": -20.974180221557617, "global_step": 80544, "epoch": 970} {"train_loss": -21.559900283813477, "global_step": 80545, "epoch": 970} {"train_loss": -21.740346908569336, "global_step": 80546, "epoch": 970} {"train_loss": -20.973388671875, "global_step": 80547, "epoch": 970} {"train_loss": -21.388153076171875, "global_step": 80548, "epoch": 970} {"train_loss": -21.19538688659668, "global_step": 80549, "epoch": 970} {"train_loss": -21.36751365661621, "global_step": 80550, "epoch": 970} {"train_loss": -21.411930084228516, "global_step": 80551, "epoch": 970} {"train_loss": -21.15724754333496, "global_step": 80552, "epoch": 970} {"train_loss": -21.014911651611328, "global_step": 80553, "epoch": 970} {"train_loss": -21.25836944580078, "global_step": 80554, "epoch": 970} {"train_loss": -20.74739646911621, "global_step": 80555, "epoch": 970} {"train_loss": -21.125341415405273, "global_step": 80556, "epoch": 970} {"train_loss": -21.46438980102539, "global_step": 80557, "epoch": 970} {"train_loss": -21.57172203063965, "global_step": 80558, "epoch": 970} {"train_loss": -21.194059371948242, "global_step": 80559, "epoch": 970} {"train_loss": -21.398649215698242, "global_step": 80560, "epoch": 970} {"train_loss": -21.045705795288086, "global_step": 80561, "epoch": 970} {"train_loss": -21.414159774780273, "global_step": 80562, "epoch": 970} {"train_loss": -21.465534210205078, "global_step": 80563, "epoch": 970} {"train_loss": -21.27811622619629, "global_step": 80564, "epoch": 970} {"train_loss": -21.33324432373047, "global_step": 80565, "epoch": 970} {"train_loss": -21.51105308532715, "global_step": 80566, "epoch": 970} {"train_loss": -21.45246696472168, "global_step": 80567, "epoch": 970} {"train_loss": -20.98821449279785, "global_step": 80568, "epoch": 970} {"train_loss": -21.36660385131836, "global_step": 80569, "epoch": 970} {"train_loss": -21.210586547851562, "global_step": 80570, "epoch": 970} {"train_loss": -21.76479721069336, "global_step": 80571, "epoch": 970} {"train_loss": -21.15734100341797, "global_step": 80572, "epoch": 970} {"train_loss": -21.637815475463867, "global_step": 80573, "epoch": 970} {"train_loss": -21.496597290039062, "global_step": 80574, "epoch": 970} {"train_loss": -21.180418014526367, "global_step": 80575, "epoch": 970} {"train_loss": -21.227521896362305, "global_step": 80576, "epoch": 970} {"train_loss": -21.32986068725586, "global_step": 80577, "epoch": 970} {"train_loss": -21.077442169189453, "global_step": 80578, "epoch": 970} {"train_loss": -21.509571075439453, "global_step": 80579, "epoch": 970} {"train_loss": -21.11130714416504, "global_step": 80580, "epoch": 970} {"train_loss": -21.373008728027344, "global_step": 80581, "epoch": 970} {"train_loss": -21.422712326049805, "global_step": 80582, "epoch": 970} {"train_loss": -21.102399826049805, "global_step": 80583, "epoch": 970} {"train_loss": -21.409582138061523, "global_step": 80584, "epoch": 970} {"train_loss": -21.470548629760742, "global_step": 80585, "epoch": 970} {"train_loss": -21.100727081298828, "global_step": 80586, "epoch": 970} {"train_loss": -21.306598663330078, "global_step": 80587, "epoch": 970} {"train_loss": -21.210342407226562, "global_step": 80588, "epoch": 970} {"train_loss": -20.908727645874023, "global_step": 80589, "epoch": 970} {"train_loss": -20.910383224487305, "global_step": 80590, "epoch": 970} {"train_loss": -20.9781436920166, "global_step": 80591, "epoch": 970} {"train_loss": -21.077362520148956, "global_step": 80592, "epoch": 970, "val_loss": 6056305.0} {"train_loss": -21.428834915161133, "global_step": 80593, "epoch": 971} {"train_loss": -21.234365463256836, "global_step": 80594, "epoch": 971} {"train_loss": -20.8707218170166, "global_step": 80595, "epoch": 971} {"train_loss": -21.226329803466797, "global_step": 80596, "epoch": 971} {"train_loss": -20.702014923095703, "global_step": 80597, "epoch": 971} {"train_loss": -21.079601287841797, "global_step": 80598, "epoch": 971} {"train_loss": -21.212202072143555, "global_step": 80599, "epoch": 971} {"train_loss": -20.710269927978516, "global_step": 80600, "epoch": 971} {"train_loss": -20.9711856842041, "global_step": 80601, "epoch": 971} {"train_loss": -20.778867721557617, "global_step": 80602, "epoch": 971} {"train_loss": -21.16416358947754, "global_step": 80603, "epoch": 971} {"train_loss": -20.910377502441406, "global_step": 80604, "epoch": 971} {"train_loss": -21.28498649597168, "global_step": 80605, "epoch": 971} {"train_loss": -21.031858444213867, "global_step": 80606, "epoch": 971} {"train_loss": -20.673994064331055, "global_step": 80607, "epoch": 971} {"train_loss": -21.284276962280273, "global_step": 80608, "epoch": 971} {"train_loss": -21.277713775634766, "global_step": 80609, "epoch": 971} {"train_loss": -20.95512580871582, "global_step": 80610, "epoch": 971} {"train_loss": -21.446462631225586, "global_step": 80611, "epoch": 971} {"train_loss": -21.29438018798828, "global_step": 80612, "epoch": 971} {"train_loss": -21.002593994140625, "global_step": 80613, "epoch": 971} {"train_loss": -21.060651779174805, "global_step": 80614, "epoch": 971} {"train_loss": -21.079994201660156, "global_step": 80615, "epoch": 971} {"train_loss": -20.893667221069336, "global_step": 80616, "epoch": 971} {"train_loss": -21.144451141357422, "global_step": 80617, "epoch": 971} {"train_loss": -21.23700523376465, "global_step": 80618, "epoch": 971} {"train_loss": -21.133831024169922, "global_step": 80619, "epoch": 971} {"train_loss": -21.24909019470215, "global_step": 80620, "epoch": 971} {"train_loss": -21.243778228759766, "global_step": 80621, "epoch": 971} {"train_loss": -20.841236114501953, "global_step": 80622, "epoch": 971} {"train_loss": -21.248777389526367, "global_step": 80623, "epoch": 971} {"train_loss": -21.085966110229492, "global_step": 80624, "epoch": 971} {"train_loss": -20.961544036865234, "global_step": 80625, "epoch": 971} {"train_loss": -21.15839195251465, "global_step": 80626, "epoch": 971} {"train_loss": -20.890079498291016, "global_step": 80627, "epoch": 971} {"train_loss": -21.089628219604492, "global_step": 80628, "epoch": 971} {"train_loss": -21.24856948852539, "global_step": 80629, "epoch": 971} {"train_loss": -21.35000228881836, "global_step": 80630, "epoch": 971} {"train_loss": -21.24407958984375, "global_step": 80631, "epoch": 971} {"train_loss": -20.887826919555664, "global_step": 80632, "epoch": 971} {"train_loss": -20.99454689025879, "global_step": 80633, "epoch": 971} {"train_loss": -21.338472366333008, "global_step": 80634, "epoch": 971} {"train_loss": -20.98064422607422, "global_step": 80635, "epoch": 971} {"train_loss": -21.004384994506836, "global_step": 80636, "epoch": 971} {"train_loss": -21.815963745117188, "global_step": 80637, "epoch": 971} {"train_loss": -21.318561553955078, "global_step": 80638, "epoch": 971} {"train_loss": -21.617395401000977, "global_step": 80639, "epoch": 971} {"train_loss": -21.49601173400879, "global_step": 80640, "epoch": 971} {"train_loss": -21.095550537109375, "global_step": 80641, "epoch": 971} {"train_loss": -21.387704849243164, "global_step": 80642, "epoch": 971} {"train_loss": -21.174245834350586, "global_step": 80643, "epoch": 971} {"train_loss": -21.254417419433594, "global_step": 80644, "epoch": 971} {"train_loss": -21.64751625061035, "global_step": 80645, "epoch": 971} {"train_loss": -21.265981674194336, "global_step": 80646, "epoch": 971} {"train_loss": -21.358489990234375, "global_step": 80647, "epoch": 971} {"train_loss": -21.42764663696289, "global_step": 80648, "epoch": 971} {"train_loss": -21.224763870239258, "global_step": 80649, "epoch": 971} {"train_loss": -21.469200134277344, "global_step": 80650, "epoch": 971} {"train_loss": -21.354101181030273, "global_step": 80651, "epoch": 971} {"train_loss": -21.832014083862305, "global_step": 80652, "epoch": 971} {"train_loss": -21.19993782043457, "global_step": 80653, "epoch": 971} {"train_loss": -21.352331161499023, "global_step": 80654, "epoch": 971} {"train_loss": -21.2010555267334, "global_step": 80655, "epoch": 971} {"train_loss": -21.298171997070312, "global_step": 80656, "epoch": 971} {"train_loss": -21.432722091674805, "global_step": 80657, "epoch": 971} {"train_loss": -21.346960067749023, "global_step": 80658, "epoch": 971} {"train_loss": -21.667789459228516, "global_step": 80659, "epoch": 971} {"train_loss": -21.031147003173828, "global_step": 80660, "epoch": 971} {"train_loss": -21.777860641479492, "global_step": 80661, "epoch": 971} {"train_loss": -21.229341506958008, "global_step": 80662, "epoch": 971} {"train_loss": -21.439014434814453, "global_step": 80663, "epoch": 971} {"train_loss": -21.219802856445312, "global_step": 80664, "epoch": 971} {"train_loss": -21.53510284423828, "global_step": 80665, "epoch": 971} {"train_loss": -21.25264549255371, "global_step": 80666, "epoch": 971} {"train_loss": -21.4102725982666, "global_step": 80667, "epoch": 971} {"train_loss": -21.2750186920166, "global_step": 80668, "epoch": 971} {"train_loss": -21.373945236206055, "global_step": 80669, "epoch": 971} {"train_loss": -21.371170043945312, "global_step": 80670, "epoch": 971} {"train_loss": -21.416400909423828, "global_step": 80671, "epoch": 971} {"train_loss": -21.33584976196289, "global_step": 80672, "epoch": 971} {"train_loss": -21.282522201538086, "global_step": 80673, "epoch": 971} {"train_loss": -21.37020492553711, "global_step": 80674, "epoch": 971} {"train_loss": -21.23277450469603, "global_step": 80675, "epoch": 971, "val_loss": 5923988.5} {"train_loss": -20.9665470123291, "global_step": 80676, "epoch": 972} {"train_loss": -20.18534278869629, "global_step": 80677, "epoch": 972} {"train_loss": -20.73227882385254, "global_step": 80678, "epoch": 972} {"train_loss": -20.672597885131836, "global_step": 80679, "epoch": 972} {"train_loss": -20.771297454833984, "global_step": 80680, "epoch": 972} {"train_loss": -20.73282814025879, "global_step": 80681, "epoch": 972} {"train_loss": -20.775699615478516, "global_step": 80682, "epoch": 972} {"train_loss": -20.7794132232666, "global_step": 80683, "epoch": 972} {"train_loss": -21.118013381958008, "global_step": 80684, "epoch": 972} {"train_loss": -20.83563804626465, "global_step": 80685, "epoch": 972} {"train_loss": -21.1373291015625, "global_step": 80686, "epoch": 972} {"train_loss": -21.386215209960938, "global_step": 80687, "epoch": 972} {"train_loss": -21.349384307861328, "global_step": 80688, "epoch": 972} {"train_loss": -20.581647872924805, "global_step": 80689, "epoch": 972} {"train_loss": -21.10689353942871, "global_step": 80690, "epoch": 972} {"train_loss": -20.79905128479004, "global_step": 80691, "epoch": 972} {"train_loss": -21.097684860229492, "global_step": 80692, "epoch": 972} {"train_loss": -20.818540573120117, "global_step": 80693, "epoch": 972} {"train_loss": -20.78057289123535, "global_step": 80694, "epoch": 972} {"train_loss": -21.08112907409668, "global_step": 80695, "epoch": 972} {"train_loss": -21.225778579711914, "global_step": 80696, "epoch": 972} {"train_loss": -20.970561981201172, "global_step": 80697, "epoch": 972} {"train_loss": -21.559133529663086, "global_step": 80698, "epoch": 972} {"train_loss": -20.372909545898438, "global_step": 80699, "epoch": 972} {"train_loss": -20.953798294067383, "global_step": 80700, "epoch": 972} {"train_loss": -21.18758773803711, "global_step": 80701, "epoch": 972} {"train_loss": -21.37203025817871, "global_step": 80702, "epoch": 972} {"train_loss": -21.23664665222168, "global_step": 80703, "epoch": 972} {"train_loss": -21.511335372924805, "global_step": 80704, "epoch": 972} {"train_loss": -21.50994110107422, "global_step": 80705, "epoch": 972} {"train_loss": -21.375852584838867, "global_step": 80706, "epoch": 972} {"train_loss": -21.27256965637207, "global_step": 80707, "epoch": 972} {"train_loss": -21.232046127319336, "global_step": 80708, "epoch": 972} {"train_loss": -21.471208572387695, "global_step": 80709, "epoch": 972} {"train_loss": -21.42911720275879, "global_step": 80710, "epoch": 972} {"train_loss": -21.235631942749023, "global_step": 80711, "epoch": 972} {"train_loss": -21.470136642456055, "global_step": 80712, "epoch": 972} {"train_loss": -21.207155227661133, "global_step": 80713, "epoch": 972} {"train_loss": -21.793411254882812, "global_step": 80714, "epoch": 972} {"train_loss": -20.985212326049805, "global_step": 80715, "epoch": 972} {"train_loss": -21.550365447998047, "global_step": 80716, "epoch": 972} {"train_loss": -21.354076385498047, "global_step": 80717, "epoch": 972} {"train_loss": -21.509580612182617, "global_step": 80718, "epoch": 972} {"train_loss": -21.21278190612793, "global_step": 80719, "epoch": 972} {"train_loss": -21.05597496032715, "global_step": 80720, "epoch": 972} {"train_loss": -21.290233612060547, "global_step": 80721, "epoch": 972} {"train_loss": -21.373046875, "global_step": 80722, "epoch": 972} {"train_loss": -21.4829158782959, "global_step": 80723, "epoch": 972} {"train_loss": -21.159204483032227, "global_step": 80724, "epoch": 972} {"train_loss": -21.284469604492188, "global_step": 80725, "epoch": 972} {"train_loss": -21.640783309936523, "global_step": 80726, "epoch": 972} {"train_loss": -21.4476261138916, "global_step": 80727, "epoch": 972} {"train_loss": -21.449966430664062, "global_step": 80728, "epoch": 972} {"train_loss": -21.255231857299805, "global_step": 80729, "epoch": 972} {"train_loss": -21.145185470581055, "global_step": 80730, "epoch": 972} {"train_loss": -21.49887466430664, "global_step": 80731, "epoch": 972} {"train_loss": -21.013233184814453, "global_step": 80732, "epoch": 972} {"train_loss": -20.845048904418945, "global_step": 80733, "epoch": 972} {"train_loss": -21.629491806030273, "global_step": 80734, "epoch": 972} {"train_loss": -21.470972061157227, "global_step": 80735, "epoch": 972} {"train_loss": -21.200048446655273, "global_step": 80736, "epoch": 972} {"train_loss": -21.146841049194336, "global_step": 80737, "epoch": 972} {"train_loss": -20.97480010986328, "global_step": 80738, "epoch": 972} {"train_loss": -21.52707862854004, "global_step": 80739, "epoch": 972} {"train_loss": -21.272287368774414, "global_step": 80740, "epoch": 972} {"train_loss": -21.24708366394043, "global_step": 80741, "epoch": 972} {"train_loss": -21.18695640563965, "global_step": 80742, "epoch": 972} {"train_loss": -21.455015182495117, "global_step": 80743, "epoch": 972} {"train_loss": -21.336484909057617, "global_step": 80744, "epoch": 972} {"train_loss": -21.27618980407715, "global_step": 80745, "epoch": 972} {"train_loss": -21.45484161376953, "global_step": 80746, "epoch": 972} {"train_loss": -21.28325653076172, "global_step": 80747, "epoch": 972} {"train_loss": -21.29880142211914, "global_step": 80748, "epoch": 972} {"train_loss": -21.044208526611328, "global_step": 80749, "epoch": 972} {"train_loss": -21.333724975585938, "global_step": 80750, "epoch": 972} {"train_loss": -21.300928115844727, "global_step": 80751, "epoch": 972} {"train_loss": -20.811113357543945, "global_step": 80752, "epoch": 972} {"train_loss": -21.240001678466797, "global_step": 80753, "epoch": 972} {"train_loss": -21.32596206665039, "global_step": 80754, "epoch": 972} {"train_loss": -21.12178611755371, "global_step": 80755, "epoch": 972} {"train_loss": -20.71527671813965, "global_step": 80756, "epoch": 972} {"train_loss": -21.104116439819336, "global_step": 80757, "epoch": 972} {"train_loss": -21.193228135626, "global_step": 80758, "epoch": 972, "val_loss": 5980867.5} {"train_loss": -20.920608520507812, "global_step": 80759, "epoch": 973} {"train_loss": -20.561538696289062, "global_step": 80760, "epoch": 973} {"train_loss": -21.09949493408203, "global_step": 80761, "epoch": 973} {"train_loss": -20.73720932006836, "global_step": 80762, "epoch": 973} {"train_loss": -21.20676612854004, "global_step": 80763, "epoch": 973} {"train_loss": -20.681365966796875, "global_step": 80764, "epoch": 973} {"train_loss": -20.782114028930664, "global_step": 80765, "epoch": 973} {"train_loss": -21.119277954101562, "global_step": 80766, "epoch": 973} {"train_loss": -21.147838592529297, "global_step": 80767, "epoch": 973} {"train_loss": -20.6921443939209, "global_step": 80768, "epoch": 973} {"train_loss": -21.178049087524414, "global_step": 80769, "epoch": 973} {"train_loss": -20.86348533630371, "global_step": 80770, "epoch": 973} {"train_loss": -20.81258201599121, "global_step": 80771, "epoch": 973} {"train_loss": -21.14004898071289, "global_step": 80772, "epoch": 973} {"train_loss": -21.201221466064453, "global_step": 80773, "epoch": 973} {"train_loss": -21.3161678314209, "global_step": 80774, "epoch": 973} {"train_loss": -21.639591217041016, "global_step": 80775, "epoch": 973} {"train_loss": -20.941312789916992, "global_step": 80776, "epoch": 973} {"train_loss": -21.246366500854492, "global_step": 80777, "epoch": 973} {"train_loss": -21.199316024780273, "global_step": 80778, "epoch": 973} {"train_loss": -21.47942543029785, "global_step": 80779, "epoch": 973} {"train_loss": -21.16572380065918, "global_step": 80780, "epoch": 973} {"train_loss": -21.29237174987793, "global_step": 80781, "epoch": 973} {"train_loss": -20.879709243774414, "global_step": 80782, "epoch": 973} {"train_loss": -21.200271606445312, "global_step": 80783, "epoch": 973} {"train_loss": -21.359420776367188, "global_step": 80784, "epoch": 973} {"train_loss": -21.03720474243164, "global_step": 80785, "epoch": 973} {"train_loss": -21.342376708984375, "global_step": 80786, "epoch": 973} {"train_loss": -21.108102798461914, "global_step": 80787, "epoch": 973} {"train_loss": -21.48354721069336, "global_step": 80788, "epoch": 973} {"train_loss": -20.832265853881836, "global_step": 80789, "epoch": 973} {"train_loss": -21.304731369018555, "global_step": 80790, "epoch": 973} {"train_loss": -21.277225494384766, "global_step": 80791, "epoch": 973} {"train_loss": -21.318464279174805, "global_step": 80792, "epoch": 973} {"train_loss": -21.130569458007812, "global_step": 80793, "epoch": 973} {"train_loss": -21.250328063964844, "global_step": 80794, "epoch": 973} {"train_loss": -21.386014938354492, "global_step": 80795, "epoch": 973} {"train_loss": -21.52288818359375, "global_step": 80796, "epoch": 973} {"train_loss": -21.3417911529541, "global_step": 80797, "epoch": 973} {"train_loss": -21.29619598388672, "global_step": 80798, "epoch": 973} {"train_loss": -21.62807273864746, "global_step": 80799, "epoch": 973} {"train_loss": -21.35550308227539, "global_step": 80800, "epoch": 973} {"train_loss": -21.052427291870117, "global_step": 80801, "epoch": 973} {"train_loss": -21.54974365234375, "global_step": 80802, "epoch": 973} {"train_loss": -21.25672149658203, "global_step": 80803, "epoch": 973} {"train_loss": -21.15595817565918, "global_step": 80804, "epoch": 973} {"train_loss": -21.315650939941406, "global_step": 80805, "epoch": 973} {"train_loss": -21.2650203704834, "global_step": 80806, "epoch": 973} {"train_loss": -20.956266403198242, "global_step": 80807, "epoch": 973} {"train_loss": -21.20368003845215, "global_step": 80808, "epoch": 973} {"train_loss": -21.328088760375977, "global_step": 80809, "epoch": 973} {"train_loss": -21.194074630737305, "global_step": 80810, "epoch": 973} {"train_loss": -21.397764205932617, "global_step": 80811, "epoch": 973} {"train_loss": -21.52915382385254, "global_step": 80812, "epoch": 973} {"train_loss": -21.197967529296875, "global_step": 80813, "epoch": 973} {"train_loss": -21.598121643066406, "global_step": 80814, "epoch": 973} {"train_loss": -21.646528244018555, "global_step": 80815, "epoch": 973} {"train_loss": -21.33749771118164, "global_step": 80816, "epoch": 973} {"train_loss": -21.180402755737305, "global_step": 80817, "epoch": 973} {"train_loss": -21.281208038330078, "global_step": 80818, "epoch": 973} {"train_loss": -21.2294921875, "global_step": 80819, "epoch": 973} {"train_loss": -21.272216796875, "global_step": 80820, "epoch": 973} {"train_loss": -21.362668991088867, "global_step": 80821, "epoch": 973} {"train_loss": -21.184507369995117, "global_step": 80822, "epoch": 973} {"train_loss": -21.4080867767334, "global_step": 80823, "epoch": 973} {"train_loss": -21.62748908996582, "global_step": 80824, "epoch": 973} {"train_loss": -21.329391479492188, "global_step": 80825, "epoch": 973} {"train_loss": -21.243555068969727, "global_step": 80826, "epoch": 973} {"train_loss": -20.915687561035156, "global_step": 80827, "epoch": 973} {"train_loss": -21.332792282104492, "global_step": 80828, "epoch": 973} {"train_loss": -21.23215103149414, "global_step": 80829, "epoch": 973} {"train_loss": -21.451772689819336, "global_step": 80830, "epoch": 973} {"train_loss": -20.692583084106445, "global_step": 80831, "epoch": 973} {"train_loss": -21.045591354370117, "global_step": 80832, "epoch": 973} {"train_loss": -21.12613868713379, "global_step": 80833, "epoch": 973} {"train_loss": -21.25092887878418, "global_step": 80834, "epoch": 973} {"train_loss": -21.083984375, "global_step": 80835, "epoch": 973} {"train_loss": -21.240467071533203, "global_step": 80836, "epoch": 973} {"train_loss": -21.352548599243164, "global_step": 80837, "epoch": 973} {"train_loss": -21.03462791442871, "global_step": 80838, "epoch": 973} {"train_loss": -21.31298828125, "global_step": 80839, "epoch": 973} {"train_loss": -21.217737197875977, "global_step": 80840, "epoch": 973} {"train_loss": -21.215233446603797, "global_step": 80841, "epoch": 973, "val_loss": 6059122.5} {"train_loss": -19.78371238708496, "global_step": 80842, "epoch": 974} {"train_loss": -20.29347038269043, "global_step": 80843, "epoch": 974} {"train_loss": -20.572593688964844, "global_step": 80844, "epoch": 974} {"train_loss": -19.97224998474121, "global_step": 80845, "epoch": 974} {"train_loss": -20.741809844970703, "global_step": 80846, "epoch": 974} {"train_loss": -20.7840633392334, "global_step": 80847, "epoch": 974} {"train_loss": -20.611663818359375, "global_step": 80848, "epoch": 974} {"train_loss": -20.551227569580078, "global_step": 80849, "epoch": 974} {"train_loss": -20.76590347290039, "global_step": 80850, "epoch": 974} {"train_loss": -20.969907760620117, "global_step": 80851, "epoch": 974} {"train_loss": -20.973087310791016, "global_step": 80852, "epoch": 974} {"train_loss": -20.963729858398438, "global_step": 80853, "epoch": 974} {"train_loss": -21.208776473999023, "global_step": 80854, "epoch": 974} {"train_loss": -20.957386016845703, "global_step": 80855, "epoch": 974} {"train_loss": -20.988840103149414, "global_step": 80856, "epoch": 974} {"train_loss": -21.2165584564209, "global_step": 80857, "epoch": 974} {"train_loss": -20.773157119750977, "global_step": 80858, "epoch": 974} {"train_loss": -20.8256893157959, "global_step": 80859, "epoch": 974} {"train_loss": -20.804031372070312, "global_step": 80860, "epoch": 974} {"train_loss": -20.67938232421875, "global_step": 80861, "epoch": 974} {"train_loss": -21.102651596069336, "global_step": 80862, "epoch": 974} {"train_loss": -21.356582641601562, "global_step": 80863, "epoch": 974} {"train_loss": -21.19245719909668, "global_step": 80864, "epoch": 974} {"train_loss": -21.389944076538086, "global_step": 80865, "epoch": 974} {"train_loss": -21.157062530517578, "global_step": 80866, "epoch": 974} {"train_loss": -21.0305233001709, "global_step": 80867, "epoch": 974} {"train_loss": -21.430349349975586, "global_step": 80868, "epoch": 974} {"train_loss": -21.431074142456055, "global_step": 80869, "epoch": 974} {"train_loss": -21.20745277404785, "global_step": 80870, "epoch": 974} {"train_loss": -21.058685302734375, "global_step": 80871, "epoch": 974} {"train_loss": -21.186864852905273, "global_step": 80872, "epoch": 974} {"train_loss": -21.417007446289062, "global_step": 80873, "epoch": 974} {"train_loss": -21.466907501220703, "global_step": 80874, "epoch": 974} {"train_loss": -21.649173736572266, "global_step": 80875, "epoch": 974} {"train_loss": -21.431745529174805, "global_step": 80876, "epoch": 974} {"train_loss": -21.111984252929688, "global_step": 80877, "epoch": 974} {"train_loss": -21.250015258789062, "global_step": 80878, "epoch": 974} {"train_loss": -21.21013641357422, "global_step": 80879, "epoch": 974} {"train_loss": -21.575788497924805, "global_step": 80880, "epoch": 974} {"train_loss": -21.018007278442383, "global_step": 80881, "epoch": 974} {"train_loss": -21.446413040161133, "global_step": 80882, "epoch": 974} {"train_loss": -21.1823673248291, "global_step": 80883, "epoch": 974} {"train_loss": -21.40279769897461, "global_step": 80884, "epoch": 974} {"train_loss": -21.225086212158203, "global_step": 80885, "epoch": 974} {"train_loss": -21.403776168823242, "global_step": 80886, "epoch": 974} {"train_loss": -21.483057022094727, "global_step": 80887, "epoch": 974} {"train_loss": -21.58285903930664, "global_step": 80888, "epoch": 974} {"train_loss": -21.161283493041992, "global_step": 80889, "epoch": 974} {"train_loss": -21.456281661987305, "global_step": 80890, "epoch": 974} {"train_loss": -21.352624893188477, "global_step": 80891, "epoch": 974} {"train_loss": -21.545303344726562, "global_step": 80892, "epoch": 974} {"train_loss": -21.262653350830078, "global_step": 80893, "epoch": 974} {"train_loss": -21.58280372619629, "global_step": 80894, "epoch": 974} {"train_loss": -21.3408203125, "global_step": 80895, "epoch": 974} {"train_loss": -21.615571975708008, "global_step": 80896, "epoch": 974} {"train_loss": -21.291898727416992, "global_step": 80897, "epoch": 974} {"train_loss": -21.226770401000977, "global_step": 80898, "epoch": 974} {"train_loss": -21.122295379638672, "global_step": 80899, "epoch": 974} {"train_loss": -21.325590133666992, "global_step": 80900, "epoch": 974} {"train_loss": -21.466327667236328, "global_step": 80901, "epoch": 974} {"train_loss": -21.14939308166504, "global_step": 80902, "epoch": 974} {"train_loss": -21.22841453552246, "global_step": 80903, "epoch": 974} {"train_loss": -21.183259963989258, "global_step": 80904, "epoch": 974} {"train_loss": -21.086545944213867, "global_step": 80905, "epoch": 974} {"train_loss": -21.189498901367188, "global_step": 80906, "epoch": 974} {"train_loss": -21.712270736694336, "global_step": 80907, "epoch": 974} {"train_loss": -21.488525390625, "global_step": 80908, "epoch": 974} {"train_loss": -21.288816452026367, "global_step": 80909, "epoch": 974} {"train_loss": -21.3211669921875, "global_step": 80910, "epoch": 974} {"train_loss": -21.0217342376709, "global_step": 80911, "epoch": 974} {"train_loss": -21.3089542388916, "global_step": 80912, "epoch": 974} {"train_loss": -21.486318588256836, "global_step": 80913, "epoch": 974} {"train_loss": -21.295345306396484, "global_step": 80914, "epoch": 974} {"train_loss": -20.4124755859375, "global_step": 80915, "epoch": 974} {"train_loss": -21.306533813476562, "global_step": 80916, "epoch": 974} {"train_loss": -21.596250534057617, "global_step": 80917, "epoch": 974} {"train_loss": -21.169897079467773, "global_step": 80918, "epoch": 974} {"train_loss": -21.4511661529541, "global_step": 80919, "epoch": 974} {"train_loss": -21.053285598754883, "global_step": 80920, "epoch": 974} {"train_loss": -21.411935806274414, "global_step": 80921, "epoch": 974} {"train_loss": -21.322568893432617, "global_step": 80922, "epoch": 974} {"train_loss": -21.014314651489258, "global_step": 80923, "epoch": 974} {"train_loss": -21.145519348512213, "global_step": 80924, "epoch": 974, "val_loss": 6242128.0} {"train_loss": -20.810239791870117, "global_step": 80925, "epoch": 975} {"train_loss": -20.521224975585938, "global_step": 80926, "epoch": 975} {"train_loss": -20.5422306060791, "global_step": 80927, "epoch": 975} {"train_loss": -20.786741256713867, "global_step": 80928, "epoch": 975} {"train_loss": -20.693151473999023, "global_step": 80929, "epoch": 975} {"train_loss": -20.602462768554688, "global_step": 80930, "epoch": 975} {"train_loss": -20.829914093017578, "global_step": 80931, "epoch": 975} {"train_loss": -21.00969886779785, "global_step": 80932, "epoch": 975} {"train_loss": -20.680112838745117, "global_step": 80933, "epoch": 975} {"train_loss": -20.8889102935791, "global_step": 80934, "epoch": 975} {"train_loss": -21.112720489501953, "global_step": 80935, "epoch": 975} {"train_loss": -20.868778228759766, "global_step": 80936, "epoch": 975} {"train_loss": -20.87353515625, "global_step": 80937, "epoch": 975} {"train_loss": -21.355558395385742, "global_step": 80938, "epoch": 975} {"train_loss": -21.076358795166016, "global_step": 80939, "epoch": 975} {"train_loss": -20.876188278198242, "global_step": 80940, "epoch": 975} {"train_loss": -20.781530380249023, "global_step": 80941, "epoch": 975} {"train_loss": -21.164655685424805, "global_step": 80942, "epoch": 975} {"train_loss": -21.204633712768555, "global_step": 80943, "epoch": 975} {"train_loss": -21.211362838745117, "global_step": 80944, "epoch": 975} {"train_loss": -20.880891799926758, "global_step": 80945, "epoch": 975} {"train_loss": -20.95184898376465, "global_step": 80946, "epoch": 975} {"train_loss": -20.89024543762207, "global_step": 80947, "epoch": 975} {"train_loss": -21.63128089904785, "global_step": 80948, "epoch": 975} {"train_loss": -21.319738388061523, "global_step": 80949, "epoch": 975} {"train_loss": -21.316734313964844, "global_step": 80950, "epoch": 975} {"train_loss": -21.448001861572266, "global_step": 80951, "epoch": 975} {"train_loss": -20.99338722229004, "global_step": 80952, "epoch": 975} {"train_loss": -21.409025192260742, "global_step": 80953, "epoch": 975} {"train_loss": -21.427570343017578, "global_step": 80954, "epoch": 975} {"train_loss": -21.30167007446289, "global_step": 80955, "epoch": 975} {"train_loss": -21.373210906982422, "global_step": 80956, "epoch": 975} {"train_loss": -21.39877700805664, "global_step": 80957, "epoch": 975} {"train_loss": -20.873729705810547, "global_step": 80958, "epoch": 975} {"train_loss": -20.813199996948242, "global_step": 80959, "epoch": 975} {"train_loss": -21.19451332092285, "global_step": 80960, "epoch": 975} {"train_loss": -21.069332122802734, "global_step": 80961, "epoch": 975} {"train_loss": -20.857126235961914, "global_step": 80962, "epoch": 975} {"train_loss": -21.229379653930664, "global_step": 80963, "epoch": 975} {"train_loss": -21.0975399017334, "global_step": 80964, "epoch": 975} {"train_loss": -21.15859031677246, "global_step": 80965, "epoch": 975} {"train_loss": -21.41227149963379, "global_step": 80966, "epoch": 975} {"train_loss": -21.378767013549805, "global_step": 80967, "epoch": 975} {"train_loss": -21.209657669067383, "global_step": 80968, "epoch": 975} {"train_loss": -21.259265899658203, "global_step": 80969, "epoch": 975} {"train_loss": -21.369632720947266, "global_step": 80970, "epoch": 975} {"train_loss": -21.270999908447266, "global_step": 80971, "epoch": 975} {"train_loss": -21.33376121520996, "global_step": 80972, "epoch": 975} {"train_loss": -21.18556022644043, "global_step": 80973, "epoch": 975} {"train_loss": -21.714115142822266, "global_step": 80974, "epoch": 975} {"train_loss": -21.443601608276367, "global_step": 80975, "epoch": 975} {"train_loss": -21.111722946166992, "global_step": 80976, "epoch": 975} {"train_loss": -21.087862014770508, "global_step": 80977, "epoch": 975} {"train_loss": -21.179494857788086, "global_step": 80978, "epoch": 975} {"train_loss": -21.789226531982422, "global_step": 80979, "epoch": 975} {"train_loss": -21.274490356445312, "global_step": 80980, "epoch": 975} {"train_loss": -21.00463104248047, "global_step": 80981, "epoch": 975} {"train_loss": -21.40590476989746, "global_step": 80982, "epoch": 975} {"train_loss": -21.288330078125, "global_step": 80983, "epoch": 975} {"train_loss": -21.03811264038086, "global_step": 80984, "epoch": 975} {"train_loss": -21.123327255249023, "global_step": 80985, "epoch": 975} {"train_loss": -21.00723648071289, "global_step": 80986, "epoch": 975} {"train_loss": -21.366012573242188, "global_step": 80987, "epoch": 975} {"train_loss": -21.24442481994629, "global_step": 80988, "epoch": 975} {"train_loss": -21.27637481689453, "global_step": 80989, "epoch": 975} {"train_loss": -21.28083610534668, "global_step": 80990, "epoch": 975} {"train_loss": -21.144760131835938, "global_step": 80991, "epoch": 975} {"train_loss": -21.137174606323242, "global_step": 80992, "epoch": 975} {"train_loss": -21.10688591003418, "global_step": 80993, "epoch": 975} {"train_loss": -21.152639389038086, "global_step": 80994, "epoch": 975} {"train_loss": -21.612136840820312, "global_step": 80995, "epoch": 975} {"train_loss": -21.608463287353516, "global_step": 80996, "epoch": 975} {"train_loss": -21.695560455322266, "global_step": 80997, "epoch": 975} {"train_loss": -21.185148239135742, "global_step": 80998, "epoch": 975} {"train_loss": -21.256851196289062, "global_step": 80999, "epoch": 975} {"train_loss": -21.62415885925293, "global_step": 81000, "epoch": 975} {"train_loss": -21.38117218017578, "global_step": 81001, "epoch": 975} {"train_loss": -21.56950569152832, "global_step": 81002, "epoch": 975} {"train_loss": -21.16791534423828, "global_step": 81003, "epoch": 975} {"train_loss": -20.9931640625, "global_step": 81004, "epoch": 975} {"train_loss": -20.82118034362793, "global_step": 81005, "epoch": 975} {"train_loss": -21.003156661987305, "global_step": 81006, "epoch": 975} {"train_loss": -21.165224488959254, "global_step": 81007, "epoch": 975, "val_loss": 6264915.0} {"train_loss": -20.99433708190918, "global_step": 81008, "epoch": 976} {"train_loss": -21.044401168823242, "global_step": 81009, "epoch": 976} {"train_loss": -20.5388126373291, "global_step": 81010, "epoch": 976} {"train_loss": -21.362869262695312, "global_step": 81011, "epoch": 976} {"train_loss": -21.296621322631836, "global_step": 81012, "epoch": 976} {"train_loss": -20.96957778930664, "global_step": 81013, "epoch": 976} {"train_loss": -21.083831787109375, "global_step": 81014, "epoch": 976} {"train_loss": -20.750028610229492, "global_step": 81015, "epoch": 976} {"train_loss": -21.182886123657227, "global_step": 81016, "epoch": 976} {"train_loss": -21.11897850036621, "global_step": 81017, "epoch": 976} {"train_loss": -20.991270065307617, "global_step": 81018, "epoch": 976} {"train_loss": -21.432430267333984, "global_step": 81019, "epoch": 976} {"train_loss": -21.22637939453125, "global_step": 81020, "epoch": 976} {"train_loss": -21.02186393737793, "global_step": 81021, "epoch": 976} {"train_loss": -21.31165885925293, "global_step": 81022, "epoch": 976} {"train_loss": -20.89826774597168, "global_step": 81023, "epoch": 976} {"train_loss": -21.185317993164062, "global_step": 81024, "epoch": 976} {"train_loss": -21.002408981323242, "global_step": 81025, "epoch": 976} {"train_loss": -21.302621841430664, "global_step": 81026, "epoch": 976} {"train_loss": -21.585325241088867, "global_step": 81027, "epoch": 976} {"train_loss": -20.920408248901367, "global_step": 81028, "epoch": 976} {"train_loss": -21.527074813842773, "global_step": 81029, "epoch": 976} {"train_loss": -21.157861709594727, "global_step": 81030, "epoch": 976} {"train_loss": -21.15766716003418, "global_step": 81031, "epoch": 976} {"train_loss": -20.999135971069336, "global_step": 81032, "epoch": 976} {"train_loss": -21.27040672302246, "global_step": 81033, "epoch": 976} {"train_loss": -21.365367889404297, "global_step": 81034, "epoch": 976} {"train_loss": -21.06998062133789, "global_step": 81035, "epoch": 976} {"train_loss": -21.66728401184082, "global_step": 81036, "epoch": 976} {"train_loss": -21.46843147277832, "global_step": 81037, "epoch": 976} {"train_loss": -21.224668502807617, "global_step": 81038, "epoch": 976} {"train_loss": -21.158428192138672, "global_step": 81039, "epoch": 976} {"train_loss": -21.26820182800293, "global_step": 81040, "epoch": 976} {"train_loss": -20.890911102294922, "global_step": 81041, "epoch": 976} {"train_loss": -20.8996639251709, "global_step": 81042, "epoch": 976} {"train_loss": -21.36676025390625, "global_step": 81043, "epoch": 976} {"train_loss": -21.03577995300293, "global_step": 81044, "epoch": 976} {"train_loss": -21.27177619934082, "global_step": 81045, "epoch": 976} {"train_loss": -21.241443634033203, "global_step": 81046, "epoch": 976} {"train_loss": -21.105825424194336, "global_step": 81047, "epoch": 976} {"train_loss": -21.24286460876465, "global_step": 81048, "epoch": 976} {"train_loss": -21.361143112182617, "global_step": 81049, "epoch": 976} {"train_loss": -21.478927612304688, "global_step": 81050, "epoch": 976} {"train_loss": -21.436880111694336, "global_step": 81051, "epoch": 976} {"train_loss": -21.288118362426758, "global_step": 81052, "epoch": 976} {"train_loss": -21.5982723236084, "global_step": 81053, "epoch": 976} {"train_loss": -21.225055694580078, "global_step": 81054, "epoch": 976} {"train_loss": -21.203622817993164, "global_step": 81055, "epoch": 976} {"train_loss": -21.28507423400879, "global_step": 81056, "epoch": 976} {"train_loss": -21.299222946166992, "global_step": 81057, "epoch": 976} {"train_loss": -21.56415367126465, "global_step": 81058, "epoch": 976} {"train_loss": -21.143075942993164, "global_step": 81059, "epoch": 976} {"train_loss": -21.093812942504883, "global_step": 81060, "epoch": 976} {"train_loss": -21.510597229003906, "global_step": 81061, "epoch": 976} {"train_loss": -21.433706283569336, "global_step": 81062, "epoch": 976} {"train_loss": -21.409582138061523, "global_step": 81063, "epoch": 976} {"train_loss": -21.332660675048828, "global_step": 81064, "epoch": 976} {"train_loss": -21.583847045898438, "global_step": 81065, "epoch": 976} {"train_loss": -21.315902709960938, "global_step": 81066, "epoch": 976} {"train_loss": -21.435073852539062, "global_step": 81067, "epoch": 976} {"train_loss": -21.320131301879883, "global_step": 81068, "epoch": 976} {"train_loss": -20.98382568359375, "global_step": 81069, "epoch": 976} {"train_loss": -21.20065689086914, "global_step": 81070, "epoch": 976} {"train_loss": -21.324691772460938, "global_step": 81071, "epoch": 976} {"train_loss": -21.221267700195312, "global_step": 81072, "epoch": 976} {"train_loss": -21.508586883544922, "global_step": 81073, "epoch": 976} {"train_loss": -21.359386444091797, "global_step": 81074, "epoch": 976} {"train_loss": -21.55135154724121, "global_step": 81075, "epoch": 976} {"train_loss": -21.216064453125, "global_step": 81076, "epoch": 976} {"train_loss": -21.160907745361328, "global_step": 81077, "epoch": 976} {"train_loss": -21.547739028930664, "global_step": 81078, "epoch": 976} {"train_loss": -21.322391510009766, "global_step": 81079, "epoch": 976} {"train_loss": -21.658849716186523, "global_step": 81080, "epoch": 976} {"train_loss": -21.572406768798828, "global_step": 81081, "epoch": 976} {"train_loss": -21.288307189941406, "global_step": 81082, "epoch": 976} {"train_loss": -21.693723678588867, "global_step": 81083, "epoch": 976} {"train_loss": -20.85355567932129, "global_step": 81084, "epoch": 976} {"train_loss": -21.36151885986328, "global_step": 81085, "epoch": 976} {"train_loss": -21.210861206054688, "global_step": 81086, "epoch": 976} {"train_loss": -21.276098251342773, "global_step": 81087, "epoch": 976} {"train_loss": -20.968534469604492, "global_step": 81088, "epoch": 976} {"train_loss": -20.91546630859375, "global_step": 81089, "epoch": 976} {"train_loss": -21.241340246545263, "global_step": 81090, "epoch": 976, "val_loss": 6080288.5} {"train_loss": -20.58058738708496, "global_step": 81091, "epoch": 977} {"train_loss": -20.569046020507812, "global_step": 81092, "epoch": 977} {"train_loss": -21.072566986083984, "global_step": 81093, "epoch": 977} {"train_loss": -20.955400466918945, "global_step": 81094, "epoch": 977} {"train_loss": -21.23555564880371, "global_step": 81095, "epoch": 977} {"train_loss": -20.81403923034668, "global_step": 81096, "epoch": 977} {"train_loss": -21.031896591186523, "global_step": 81097, "epoch": 977} {"train_loss": -21.293249130249023, "global_step": 81098, "epoch": 977} {"train_loss": -21.070178985595703, "global_step": 81099, "epoch": 977} {"train_loss": -20.678314208984375, "global_step": 81100, "epoch": 977} {"train_loss": -21.55609703063965, "global_step": 81101, "epoch": 977} {"train_loss": -20.70791244506836, "global_step": 81102, "epoch": 977} {"train_loss": -21.182249069213867, "global_step": 81103, "epoch": 977} {"train_loss": -20.945226669311523, "global_step": 81104, "epoch": 977} {"train_loss": -21.538862228393555, "global_step": 81105, "epoch": 977} {"train_loss": -21.13182830810547, "global_step": 81106, "epoch": 977} {"train_loss": -21.232534408569336, "global_step": 81107, "epoch": 977} {"train_loss": -21.018709182739258, "global_step": 81108, "epoch": 977} {"train_loss": -21.3430233001709, "global_step": 81109, "epoch": 977} {"train_loss": -21.22011375427246, "global_step": 81110, "epoch": 977} {"train_loss": -21.31505584716797, "global_step": 81111, "epoch": 977} {"train_loss": -21.238691329956055, "global_step": 81112, "epoch": 977} {"train_loss": -21.048917770385742, "global_step": 81113, "epoch": 977} {"train_loss": -21.33081817626953, "global_step": 81114, "epoch": 977} {"train_loss": -21.48731803894043, "global_step": 81115, "epoch": 977} {"train_loss": -21.228519439697266, "global_step": 81116, "epoch": 977} {"train_loss": -21.303983688354492, "global_step": 81117, "epoch": 977} {"train_loss": -21.017284393310547, "global_step": 81118, "epoch": 977} {"train_loss": -21.562036514282227, "global_step": 81119, "epoch": 977} {"train_loss": -21.44944953918457, "global_step": 81120, "epoch": 977} {"train_loss": -21.19097900390625, "global_step": 81121, "epoch": 977} {"train_loss": -21.26743507385254, "global_step": 81122, "epoch": 977} {"train_loss": -21.318561553955078, "global_step": 81123, "epoch": 977} {"train_loss": -21.557769775390625, "global_step": 81124, "epoch": 977} {"train_loss": -21.280349731445312, "global_step": 81125, "epoch": 977} {"train_loss": -21.469423294067383, "global_step": 81126, "epoch": 977} {"train_loss": -21.50876235961914, "global_step": 81127, "epoch": 977} {"train_loss": -20.9309139251709, "global_step": 81128, "epoch": 977} {"train_loss": -21.258390426635742, "global_step": 81129, "epoch": 977} {"train_loss": -21.267932891845703, "global_step": 81130, "epoch": 977} {"train_loss": -21.248884201049805, "global_step": 81131, "epoch": 977} {"train_loss": -21.269033432006836, "global_step": 81132, "epoch": 977} {"train_loss": -21.263898849487305, "global_step": 81133, "epoch": 977} {"train_loss": -21.597585678100586, "global_step": 81134, "epoch": 977} {"train_loss": -21.426610946655273, "global_step": 81135, "epoch": 977} {"train_loss": -21.199800491333008, "global_step": 81136, "epoch": 977} {"train_loss": -21.28548240661621, "global_step": 81137, "epoch": 977} {"train_loss": -21.213804244995117, "global_step": 81138, "epoch": 977} {"train_loss": -21.511098861694336, "global_step": 81139, "epoch": 977} {"train_loss": -21.150981903076172, "global_step": 81140, "epoch": 977} {"train_loss": -21.238447189331055, "global_step": 81141, "epoch": 977} {"train_loss": -21.595190048217773, "global_step": 81142, "epoch": 977} {"train_loss": -21.67350196838379, "global_step": 81143, "epoch": 977} {"train_loss": -21.218854904174805, "global_step": 81144, "epoch": 977} {"train_loss": -21.0739803314209, "global_step": 81145, "epoch": 977} {"train_loss": -20.99653434753418, "global_step": 81146, "epoch": 977} {"train_loss": -21.46261978149414, "global_step": 81147, "epoch": 977} {"train_loss": -21.410032272338867, "global_step": 81148, "epoch": 977} {"train_loss": -21.11151123046875, "global_step": 81149, "epoch": 977} {"train_loss": -21.260578155517578, "global_step": 81150, "epoch": 977} {"train_loss": -21.552955627441406, "global_step": 81151, "epoch": 977} {"train_loss": -21.279861450195312, "global_step": 81152, "epoch": 977} {"train_loss": -21.350339889526367, "global_step": 81153, "epoch": 977} {"train_loss": -21.123003005981445, "global_step": 81154, "epoch": 977} {"train_loss": -21.146615982055664, "global_step": 81155, "epoch": 977} {"train_loss": -21.403501510620117, "global_step": 81156, "epoch": 977} {"train_loss": -21.031005859375, "global_step": 81157, "epoch": 977} {"train_loss": -21.63897705078125, "global_step": 81158, "epoch": 977} {"train_loss": -21.217023849487305, "global_step": 81159, "epoch": 977} {"train_loss": -21.592084884643555, "global_step": 81160, "epoch": 977} {"train_loss": -21.178848266601562, "global_step": 81161, "epoch": 977} {"train_loss": -21.06475830078125, "global_step": 81162, "epoch": 977} {"train_loss": -21.2437744140625, "global_step": 81163, "epoch": 977} {"train_loss": -21.384735107421875, "global_step": 81164, "epoch": 977} {"train_loss": -21.198888778686523, "global_step": 81165, "epoch": 977} {"train_loss": -20.807090759277344, "global_step": 81166, "epoch": 977} {"train_loss": -21.29718780517578, "global_step": 81167, "epoch": 977} {"train_loss": -21.034509658813477, "global_step": 81168, "epoch": 977} {"train_loss": -21.329914093017578, "global_step": 81169, "epoch": 977} {"train_loss": -21.433103561401367, "global_step": 81170, "epoch": 977} {"train_loss": -21.09299659729004, "global_step": 81171, "epoch": 977} {"train_loss": -21.123050689697266, "global_step": 81172, "epoch": 977} {"train_loss": -21.238421175853315, "global_step": 81173, "epoch": 977, "val_loss": 5964296.5} {"train_loss": -20.738222122192383, "global_step": 81174, "epoch": 978} {"train_loss": -20.98700523376465, "global_step": 81175, "epoch": 978} {"train_loss": -21.234228134155273, "global_step": 81176, "epoch": 978} {"train_loss": -20.575544357299805, "global_step": 81177, "epoch": 978} {"train_loss": -20.63329315185547, "global_step": 81178, "epoch": 978} {"train_loss": -20.630117416381836, "global_step": 81179, "epoch": 978} {"train_loss": -20.300127029418945, "global_step": 81180, "epoch": 978} {"train_loss": -20.4360294342041, "global_step": 81181, "epoch": 978} {"train_loss": -20.788471221923828, "global_step": 81182, "epoch": 978} {"train_loss": -20.919347763061523, "global_step": 81183, "epoch": 978} {"train_loss": -21.21767234802246, "global_step": 81184, "epoch": 978} {"train_loss": -20.91145896911621, "global_step": 81185, "epoch": 978} {"train_loss": -20.818023681640625, "global_step": 81186, "epoch": 978} {"train_loss": -20.792509078979492, "global_step": 81187, "epoch": 978} {"train_loss": -21.206375122070312, "global_step": 81188, "epoch": 978} {"train_loss": -21.2836971282959, "global_step": 81189, "epoch": 978} {"train_loss": -21.28513526916504, "global_step": 81190, "epoch": 978} {"train_loss": -21.345434188842773, "global_step": 81191, "epoch": 978} {"train_loss": -21.228038787841797, "global_step": 81192, "epoch": 978} {"train_loss": -21.329864501953125, "global_step": 81193, "epoch": 978} {"train_loss": -21.027250289916992, "global_step": 81194, "epoch": 978} {"train_loss": -21.17344093322754, "global_step": 81195, "epoch": 978} {"train_loss": -21.07417106628418, "global_step": 81196, "epoch": 978} {"train_loss": -21.18377113342285, "global_step": 81197, "epoch": 978} {"train_loss": -21.491106033325195, "global_step": 81198, "epoch": 978} {"train_loss": -21.39151954650879, "global_step": 81199, "epoch": 978} {"train_loss": -21.085329055786133, "global_step": 81200, "epoch": 978} {"train_loss": -21.591367721557617, "global_step": 81201, "epoch": 978} {"train_loss": -21.134931564331055, "global_step": 81202, "epoch": 978} {"train_loss": -21.362302780151367, "global_step": 81203, "epoch": 978} {"train_loss": -21.09413719177246, "global_step": 81204, "epoch": 978} {"train_loss": -21.07761001586914, "global_step": 81205, "epoch": 978} {"train_loss": -21.48274040222168, "global_step": 81206, "epoch": 978} {"train_loss": -21.237503051757812, "global_step": 81207, "epoch": 978} {"train_loss": -21.437421798706055, "global_step": 81208, "epoch": 978} {"train_loss": -21.1218318939209, "global_step": 81209, "epoch": 978} {"train_loss": -21.025039672851562, "global_step": 81210, "epoch": 978} {"train_loss": -21.2539119720459, "global_step": 81211, "epoch": 978} {"train_loss": -20.92664337158203, "global_step": 81212, "epoch": 978} {"train_loss": -21.224586486816406, "global_step": 81213, "epoch": 978} {"train_loss": -20.9422550201416, "global_step": 81214, "epoch": 978} {"train_loss": -21.41790199279785, "global_step": 81215, "epoch": 978} {"train_loss": -21.383743286132812, "global_step": 81216, "epoch": 978} {"train_loss": -21.120805740356445, "global_step": 81217, "epoch": 978} {"train_loss": -21.52020835876465, "global_step": 81218, "epoch": 978} {"train_loss": -21.534521102905273, "global_step": 81219, "epoch": 978} {"train_loss": -21.21979331970215, "global_step": 81220, "epoch": 978} {"train_loss": -21.049274444580078, "global_step": 81221, "epoch": 978} {"train_loss": -21.04659080505371, "global_step": 81222, "epoch": 978} {"train_loss": -21.37906265258789, "global_step": 81223, "epoch": 978} {"train_loss": -21.399686813354492, "global_step": 81224, "epoch": 978} {"train_loss": -21.283998489379883, "global_step": 81225, "epoch": 978} {"train_loss": -20.986005783081055, "global_step": 81226, "epoch": 978} {"train_loss": -21.155715942382812, "global_step": 81227, "epoch": 978} {"train_loss": -21.28009033203125, "global_step": 81228, "epoch": 978} {"train_loss": -21.395498275756836, "global_step": 81229, "epoch": 978} {"train_loss": -20.917287826538086, "global_step": 81230, "epoch": 978} {"train_loss": -21.175281524658203, "global_step": 81231, "epoch": 978} {"train_loss": -20.745824813842773, "global_step": 81232, "epoch": 978} {"train_loss": -21.28006362915039, "global_step": 81233, "epoch": 978} {"train_loss": -21.027816772460938, "global_step": 81234, "epoch": 978} {"train_loss": -21.265043258666992, "global_step": 81235, "epoch": 978} {"train_loss": -21.27939796447754, "global_step": 81236, "epoch": 978} {"train_loss": -21.06953239440918, "global_step": 81237, "epoch": 978} {"train_loss": -21.356487274169922, "global_step": 81238, "epoch": 978} {"train_loss": -21.11213493347168, "global_step": 81239, "epoch": 978} {"train_loss": -21.16798210144043, "global_step": 81240, "epoch": 978} {"train_loss": -21.179258346557617, "global_step": 81241, "epoch": 978} {"train_loss": -21.357948303222656, "global_step": 81242, "epoch": 978} {"train_loss": -20.739805221557617, "global_step": 81243, "epoch": 978} {"train_loss": -21.070232391357422, "global_step": 81244, "epoch": 978} {"train_loss": -21.658687591552734, "global_step": 81245, "epoch": 978} {"train_loss": -20.823984146118164, "global_step": 81246, "epoch": 978} {"train_loss": -20.93800926208496, "global_step": 81247, "epoch": 978} {"train_loss": -20.857709884643555, "global_step": 81248, "epoch": 978} {"train_loss": -21.456260681152344, "global_step": 81249, "epoch": 978} {"train_loss": -21.452138900756836, "global_step": 81250, "epoch": 978} {"train_loss": -21.541379928588867, "global_step": 81251, "epoch": 978} {"train_loss": -21.486141204833984, "global_step": 81252, "epoch": 978} {"train_loss": -21.586122512817383, "global_step": 81253, "epoch": 978} {"train_loss": -21.06580924987793, "global_step": 81254, "epoch": 978} {"train_loss": -21.235990524291992, "global_step": 81255, "epoch": 978} {"train_loss": -21.129398437867682, "global_step": 81256, "epoch": 978, "val_loss": 5894356.5} {"train_loss": -20.854413986206055, "global_step": 81257, "epoch": 979} {"train_loss": -21.009000778198242, "global_step": 81258, "epoch": 979} {"train_loss": -21.25533103942871, "global_step": 81259, "epoch": 979} {"train_loss": -21.024545669555664, "global_step": 81260, "epoch": 979} {"train_loss": -20.694746017456055, "global_step": 81261, "epoch": 979} {"train_loss": -20.986188888549805, "global_step": 81262, "epoch": 979} {"train_loss": -20.781885147094727, "global_step": 81263, "epoch": 979} {"train_loss": -20.776960372924805, "global_step": 81264, "epoch": 979} {"train_loss": -21.012731552124023, "global_step": 81265, "epoch": 979} {"train_loss": -20.559104919433594, "global_step": 81266, "epoch": 979} {"train_loss": -20.893644332885742, "global_step": 81267, "epoch": 979} {"train_loss": -21.304288864135742, "global_step": 81268, "epoch": 979} {"train_loss": -20.863712310791016, "global_step": 81269, "epoch": 979} {"train_loss": -20.88506317138672, "global_step": 81270, "epoch": 979} {"train_loss": -21.18281364440918, "global_step": 81271, "epoch": 979} {"train_loss": -20.901565551757812, "global_step": 81272, "epoch": 979} {"train_loss": -20.933584213256836, "global_step": 81273, "epoch": 979} {"train_loss": -21.20448112487793, "global_step": 81274, "epoch": 979} {"train_loss": -21.38236427307129, "global_step": 81275, "epoch": 979} {"train_loss": -21.00628662109375, "global_step": 81276, "epoch": 979} {"train_loss": -21.252439498901367, "global_step": 81277, "epoch": 979} {"train_loss": -20.907257080078125, "global_step": 81278, "epoch": 979} {"train_loss": -21.22834587097168, "global_step": 81279, "epoch": 979} {"train_loss": -21.090909957885742, "global_step": 81280, "epoch": 979} {"train_loss": -21.141788482666016, "global_step": 81281, "epoch": 979} {"train_loss": -21.428955078125, "global_step": 81282, "epoch": 979} {"train_loss": -21.116804122924805, "global_step": 81283, "epoch": 979} {"train_loss": -21.256776809692383, "global_step": 81284, "epoch": 979} {"train_loss": -21.302291870117188, "global_step": 81285, "epoch": 979} {"train_loss": -21.39008140563965, "global_step": 81286, "epoch": 979} {"train_loss": -21.497472763061523, "global_step": 81287, "epoch": 979} {"train_loss": -21.258886337280273, "global_step": 81288, "epoch": 979} {"train_loss": -21.29971694946289, "global_step": 81289, "epoch": 979} {"train_loss": -21.544321060180664, "global_step": 81290, "epoch": 979} {"train_loss": -21.391376495361328, "global_step": 81291, "epoch": 979} {"train_loss": -20.989694595336914, "global_step": 81292, "epoch": 979} {"train_loss": -21.106964111328125, "global_step": 81293, "epoch": 979} {"train_loss": -21.101694107055664, "global_step": 81294, "epoch": 979} {"train_loss": -21.152769088745117, "global_step": 81295, "epoch": 979} {"train_loss": -21.130197525024414, "global_step": 81296, "epoch": 979} {"train_loss": -21.239486694335938, "global_step": 81297, "epoch": 979} {"train_loss": -21.419008255004883, "global_step": 81298, "epoch": 979} {"train_loss": -21.526283264160156, "global_step": 81299, "epoch": 979} {"train_loss": -20.84409523010254, "global_step": 81300, "epoch": 979} {"train_loss": -21.307859420776367, "global_step": 81301, "epoch": 979} {"train_loss": -21.127355575561523, "global_step": 81302, "epoch": 979} {"train_loss": -21.13492774963379, "global_step": 81303, "epoch": 979} {"train_loss": -21.396970748901367, "global_step": 81304, "epoch": 979} {"train_loss": -21.102874755859375, "global_step": 81305, "epoch": 979} {"train_loss": -21.14031982421875, "global_step": 81306, "epoch": 979} {"train_loss": -21.031814575195312, "global_step": 81307, "epoch": 979} {"train_loss": -21.27774429321289, "global_step": 81308, "epoch": 979} {"train_loss": -21.076862335205078, "global_step": 81309, "epoch": 979} {"train_loss": -21.18869400024414, "global_step": 81310, "epoch": 979} {"train_loss": -21.366682052612305, "global_step": 81311, "epoch": 979} {"train_loss": -21.232851028442383, "global_step": 81312, "epoch": 979} {"train_loss": -21.418489456176758, "global_step": 81313, "epoch": 979} {"train_loss": -20.974376678466797, "global_step": 81314, "epoch": 979} {"train_loss": -20.78072738647461, "global_step": 81315, "epoch": 979} {"train_loss": -21.136098861694336, "global_step": 81316, "epoch": 979} {"train_loss": -20.87293815612793, "global_step": 81317, "epoch": 979} {"train_loss": -21.159109115600586, "global_step": 81318, "epoch": 979} {"train_loss": -21.24483871459961, "global_step": 81319, "epoch": 979} {"train_loss": -20.854568481445312, "global_step": 81320, "epoch": 979} {"train_loss": -21.428009033203125, "global_step": 81321, "epoch": 979} {"train_loss": -21.241302490234375, "global_step": 81322, "epoch": 979} {"train_loss": -20.834720611572266, "global_step": 81323, "epoch": 979} {"train_loss": -21.41621208190918, "global_step": 81324, "epoch": 979} {"train_loss": -21.013111114501953, "global_step": 81325, "epoch": 979} {"train_loss": -21.30069923400879, "global_step": 81326, "epoch": 979} {"train_loss": -21.652883529663086, "global_step": 81327, "epoch": 979} {"train_loss": -20.829334259033203, "global_step": 81328, "epoch": 979} {"train_loss": -21.03989028930664, "global_step": 81329, "epoch": 979} {"train_loss": -21.309415817260742, "global_step": 81330, "epoch": 979} {"train_loss": -21.0306396484375, "global_step": 81331, "epoch": 979} {"train_loss": -21.20430564880371, "global_step": 81332, "epoch": 979} {"train_loss": -21.726409912109375, "global_step": 81333, "epoch": 979} {"train_loss": -21.279882431030273, "global_step": 81334, "epoch": 979} {"train_loss": -21.304672241210938, "global_step": 81335, "epoch": 979} {"train_loss": -21.683446884155273, "global_step": 81336, "epoch": 979} {"train_loss": -21.23441505432129, "global_step": 81337, "epoch": 979} {"train_loss": -21.396451950073242, "global_step": 81338, "epoch": 979} {"train_loss": -21.171034571636152, "global_step": 81339, "epoch": 979, "val_loss": 6133538.0} {"train_loss": -20.585851669311523, "global_step": 81340, "epoch": 980} {"train_loss": -20.675918579101562, "global_step": 81341, "epoch": 980} {"train_loss": -21.007789611816406, "global_step": 81342, "epoch": 980} {"train_loss": -20.74420738220215, "global_step": 81343, "epoch": 980} {"train_loss": -20.838163375854492, "global_step": 81344, "epoch": 980} {"train_loss": -20.89197540283203, "global_step": 81345, "epoch": 980} {"train_loss": -21.00604820251465, "global_step": 81346, "epoch": 980} {"train_loss": -20.940305709838867, "global_step": 81347, "epoch": 980} {"train_loss": -21.265588760375977, "global_step": 81348, "epoch": 980} {"train_loss": -21.246204376220703, "global_step": 81349, "epoch": 980} {"train_loss": -21.215272903442383, "global_step": 81350, "epoch": 980} {"train_loss": -21.433561325073242, "global_step": 81351, "epoch": 980} {"train_loss": -21.319852828979492, "global_step": 81352, "epoch": 980} {"train_loss": -20.95331382751465, "global_step": 81353, "epoch": 980} {"train_loss": -20.761625289916992, "global_step": 81354, "epoch": 980} {"train_loss": -21.431081771850586, "global_step": 81355, "epoch": 980} {"train_loss": -20.956899642944336, "global_step": 81356, "epoch": 980} {"train_loss": -21.732561111450195, "global_step": 81357, "epoch": 980} {"train_loss": -21.158140182495117, "global_step": 81358, "epoch": 980} {"train_loss": -21.597564697265625, "global_step": 81359, "epoch": 980} {"train_loss": -21.418603897094727, "global_step": 81360, "epoch": 980} {"train_loss": -21.412973403930664, "global_step": 81361, "epoch": 980} {"train_loss": -21.29410743713379, "global_step": 81362, "epoch": 980} {"train_loss": -21.45070457458496, "global_step": 81363, "epoch": 980} {"train_loss": -21.302820205688477, "global_step": 81364, "epoch": 980} {"train_loss": -21.43372917175293, "global_step": 81365, "epoch": 980} {"train_loss": -21.54775047302246, "global_step": 81366, "epoch": 980} {"train_loss": -21.569028854370117, "global_step": 81367, "epoch": 980} {"train_loss": -20.9367618560791, "global_step": 81368, "epoch": 980} {"train_loss": -21.42754554748535, "global_step": 81369, "epoch": 980} {"train_loss": -21.293092727661133, "global_step": 81370, "epoch": 980} {"train_loss": -21.324405670166016, "global_step": 81371, "epoch": 980} {"train_loss": -21.367813110351562, "global_step": 81372, "epoch": 980} {"train_loss": -21.57254981994629, "global_step": 81373, "epoch": 980} {"train_loss": -21.501399993896484, "global_step": 81374, "epoch": 980} {"train_loss": -20.933881759643555, "global_step": 81375, "epoch": 980} {"train_loss": -21.095731735229492, "global_step": 81376, "epoch": 980} {"train_loss": -21.335105895996094, "global_step": 81377, "epoch": 980} {"train_loss": -21.26746940612793, "global_step": 81378, "epoch": 980} {"train_loss": -21.184621810913086, "global_step": 81379, "epoch": 980} {"train_loss": -21.367679595947266, "global_step": 81380, "epoch": 980} {"train_loss": -21.162582397460938, "global_step": 81381, "epoch": 980} {"train_loss": -21.406530380249023, "global_step": 81382, "epoch": 980} {"train_loss": -21.470008850097656, "global_step": 81383, "epoch": 980} {"train_loss": -21.501012802124023, "global_step": 81384, "epoch": 980} {"train_loss": -21.224742889404297, "global_step": 81385, "epoch": 980} {"train_loss": -21.052579879760742, "global_step": 81386, "epoch": 980} {"train_loss": -20.707168579101562, "global_step": 81387, "epoch": 980} {"train_loss": -21.221927642822266, "global_step": 81388, "epoch": 980} {"train_loss": -21.121356964111328, "global_step": 81389, "epoch": 980} {"train_loss": -21.183252334594727, "global_step": 81390, "epoch": 980} {"train_loss": -21.370054244995117, "global_step": 81391, "epoch": 980} {"train_loss": -21.24342155456543, "global_step": 81392, "epoch": 980} {"train_loss": -21.219045639038086, "global_step": 81393, "epoch": 980} {"train_loss": -21.02650260925293, "global_step": 81394, "epoch": 980} {"train_loss": -21.175464630126953, "global_step": 81395, "epoch": 980} {"train_loss": -21.105833053588867, "global_step": 81396, "epoch": 980} {"train_loss": -21.295162200927734, "global_step": 81397, "epoch": 980} {"train_loss": -21.482839584350586, "global_step": 81398, "epoch": 980} {"train_loss": -21.501483917236328, "global_step": 81399, "epoch": 980} {"train_loss": -21.36977767944336, "global_step": 81400, "epoch": 980} {"train_loss": -21.166231155395508, "global_step": 81401, "epoch": 980} {"train_loss": -21.358428955078125, "global_step": 81402, "epoch": 980} {"train_loss": -21.332029342651367, "global_step": 81403, "epoch": 980} {"train_loss": -21.11066246032715, "global_step": 81404, "epoch": 980} {"train_loss": -21.257932662963867, "global_step": 81405, "epoch": 980} {"train_loss": -21.082923889160156, "global_step": 81406, "epoch": 980} {"train_loss": -21.154327392578125, "global_step": 81407, "epoch": 980} {"train_loss": -21.396255493164062, "global_step": 81408, "epoch": 980} {"train_loss": -21.06545066833496, "global_step": 81409, "epoch": 980} {"train_loss": -21.31044578552246, "global_step": 81410, "epoch": 980} {"train_loss": -20.98457145690918, "global_step": 81411, "epoch": 980} {"train_loss": -21.652109146118164, "global_step": 81412, "epoch": 980} {"train_loss": -21.214025497436523, "global_step": 81413, "epoch": 980} {"train_loss": -21.180631637573242, "global_step": 81414, "epoch": 980} {"train_loss": -21.507497787475586, "global_step": 81415, "epoch": 980} {"train_loss": -21.38117027282715, "global_step": 81416, "epoch": 980} {"train_loss": -21.2796688079834, "global_step": 81417, "epoch": 980} {"train_loss": -21.404464721679688, "global_step": 81418, "epoch": 980} {"train_loss": -21.274099349975586, "global_step": 81419, "epoch": 980} {"train_loss": -21.357160568237305, "global_step": 81420, "epoch": 980} {"train_loss": -21.26068687438965, "global_step": 81421, "epoch": 980} {"train_loss": -21.25069854920169, "global_step": 81422, "epoch": 980, "val_loss": 5982275.0} {"train_loss": -20.980619430541992, "global_step": 81423, "epoch": 981} {"train_loss": -20.166757583618164, "global_step": 81424, "epoch": 981} {"train_loss": -21.20326042175293, "global_step": 81425, "epoch": 981} {"train_loss": -21.052509307861328, "global_step": 81426, "epoch": 981} {"train_loss": -20.769773483276367, "global_step": 81427, "epoch": 981} {"train_loss": -21.0722599029541, "global_step": 81428, "epoch": 981} {"train_loss": -21.29544448852539, "global_step": 81429, "epoch": 981} {"train_loss": -21.301362991333008, "global_step": 81430, "epoch": 981} {"train_loss": -20.8896427154541, "global_step": 81431, "epoch": 981} {"train_loss": -21.353864669799805, "global_step": 81432, "epoch": 981} {"train_loss": -21.5837345123291, "global_step": 81433, "epoch": 981} {"train_loss": -20.98960304260254, "global_step": 81434, "epoch": 981} {"train_loss": -21.321638107299805, "global_step": 81435, "epoch": 981} {"train_loss": -20.6254825592041, "global_step": 81436, "epoch": 981} {"train_loss": -21.49614715576172, "global_step": 81437, "epoch": 981} {"train_loss": -20.626209259033203, "global_step": 81438, "epoch": 981} {"train_loss": -21.036970138549805, "global_step": 81439, "epoch": 981} {"train_loss": -20.915624618530273, "global_step": 81440, "epoch": 981} {"train_loss": -20.466480255126953, "global_step": 81441, "epoch": 981} {"train_loss": -21.178197860717773, "global_step": 81442, "epoch": 981} {"train_loss": -21.2553653717041, "global_step": 81443, "epoch": 981} {"train_loss": -21.088987350463867, "global_step": 81444, "epoch": 981} {"train_loss": -21.328535079956055, "global_step": 81445, "epoch": 981} {"train_loss": -20.97139549255371, "global_step": 81446, "epoch": 981} {"train_loss": -21.382970809936523, "global_step": 81447, "epoch": 981} {"train_loss": -21.40289878845215, "global_step": 81448, "epoch": 981} {"train_loss": -21.211212158203125, "global_step": 81449, "epoch": 981} {"train_loss": -21.300617218017578, "global_step": 81450, "epoch": 981} {"train_loss": -21.080446243286133, "global_step": 81451, "epoch": 981} {"train_loss": -21.277387619018555, "global_step": 81452, "epoch": 981} {"train_loss": -21.702497482299805, "global_step": 81453, "epoch": 981} {"train_loss": -21.51424217224121, "global_step": 81454, "epoch": 981} {"train_loss": -21.257368087768555, "global_step": 81455, "epoch": 981} {"train_loss": -21.272859573364258, "global_step": 81456, "epoch": 981} {"train_loss": -21.320606231689453, "global_step": 81457, "epoch": 981} {"train_loss": -21.29796028137207, "global_step": 81458, "epoch": 981} {"train_loss": -21.197813034057617, "global_step": 81459, "epoch": 981} {"train_loss": -21.21419334411621, "global_step": 81460, "epoch": 981} {"train_loss": -21.24184799194336, "global_step": 81461, "epoch": 981} {"train_loss": -21.4715518951416, "global_step": 81462, "epoch": 981} {"train_loss": -21.435773849487305, "global_step": 81463, "epoch": 981} {"train_loss": -21.41411590576172, "global_step": 81464, "epoch": 981} {"train_loss": -21.297088623046875, "global_step": 81465, "epoch": 981} {"train_loss": -20.994747161865234, "global_step": 81466, "epoch": 981} {"train_loss": -21.195249557495117, "global_step": 81467, "epoch": 981} {"train_loss": -21.19919204711914, "global_step": 81468, "epoch": 981} {"train_loss": -21.417789459228516, "global_step": 81469, "epoch": 981} {"train_loss": -21.43658447265625, "global_step": 81470, "epoch": 981} {"train_loss": -21.32869529724121, "global_step": 81471, "epoch": 981} {"train_loss": -21.4046573638916, "global_step": 81472, "epoch": 981} {"train_loss": -21.199684143066406, "global_step": 81473, "epoch": 981} {"train_loss": -21.68514060974121, "global_step": 81474, "epoch": 981} {"train_loss": -21.205209732055664, "global_step": 81475, "epoch": 981} {"train_loss": -21.349103927612305, "global_step": 81476, "epoch": 981} {"train_loss": -21.088788986206055, "global_step": 81477, "epoch": 981} {"train_loss": -21.475133895874023, "global_step": 81478, "epoch": 981} {"train_loss": -21.45180320739746, "global_step": 81479, "epoch": 981} {"train_loss": -21.15605354309082, "global_step": 81480, "epoch": 981} {"train_loss": -21.49644660949707, "global_step": 81481, "epoch": 981} {"train_loss": -20.969879150390625, "global_step": 81482, "epoch": 981} {"train_loss": -20.96044921875, "global_step": 81483, "epoch": 981} {"train_loss": -21.563934326171875, "global_step": 81484, "epoch": 981} {"train_loss": -21.440885543823242, "global_step": 81485, "epoch": 981} {"train_loss": -20.92697525024414, "global_step": 81486, "epoch": 981} {"train_loss": -21.45017433166504, "global_step": 81487, "epoch": 981} {"train_loss": -21.557241439819336, "global_step": 81488, "epoch": 981} {"train_loss": -21.418359756469727, "global_step": 81489, "epoch": 981} {"train_loss": -21.161699295043945, "global_step": 81490, "epoch": 981} {"train_loss": -21.6102237701416, "global_step": 81491, "epoch": 981} {"train_loss": -21.65030288696289, "global_step": 81492, "epoch": 981} {"train_loss": -21.400163650512695, "global_step": 81493, "epoch": 981} {"train_loss": -21.469539642333984, "global_step": 81494, "epoch": 981} {"train_loss": -21.391754150390625, "global_step": 81495, "epoch": 981} {"train_loss": -20.824960708618164, "global_step": 81496, "epoch": 981} {"train_loss": -21.310073852539062, "global_step": 81497, "epoch": 981} {"train_loss": -21.339197158813477, "global_step": 81498, "epoch": 981} {"train_loss": -21.170568466186523, "global_step": 81499, "epoch": 981} {"train_loss": -21.422218322753906, "global_step": 81500, "epoch": 981} {"train_loss": -21.08802604675293, "global_step": 81501, "epoch": 981} {"train_loss": -20.797870635986328, "global_step": 81502, "epoch": 981} {"train_loss": -21.270841598510742, "global_step": 81503, "epoch": 981} {"train_loss": -20.96109962463379, "global_step": 81504, "epoch": 981} {"train_loss": -21.238231589995234, "global_step": 81505, "epoch": 981, "val_loss": 5954441.0} {"train_loss": -20.934223175048828, "global_step": 81506, "epoch": 982} {"train_loss": -20.326522827148438, "global_step": 81507, "epoch": 982} {"train_loss": -20.954914093017578, "global_step": 81508, "epoch": 982} {"train_loss": -20.294620513916016, "global_step": 81509, "epoch": 982} {"train_loss": -20.803253173828125, "global_step": 81510, "epoch": 982} {"train_loss": -20.60346031188965, "global_step": 81511, "epoch": 982} {"train_loss": -20.771921157836914, "global_step": 81512, "epoch": 982} {"train_loss": -20.54022789001465, "global_step": 81513, "epoch": 982} {"train_loss": -20.53548240661621, "global_step": 81514, "epoch": 982} {"train_loss": -21.222824096679688, "global_step": 81515, "epoch": 982} {"train_loss": -20.694808959960938, "global_step": 81516, "epoch": 982} {"train_loss": -20.7769718170166, "global_step": 81517, "epoch": 982} {"train_loss": -21.19235610961914, "global_step": 81518, "epoch": 982} {"train_loss": -20.61522674560547, "global_step": 81519, "epoch": 982} {"train_loss": -20.917621612548828, "global_step": 81520, "epoch": 982} {"train_loss": -20.90566062927246, "global_step": 81521, "epoch": 982} {"train_loss": -21.087919235229492, "global_step": 81522, "epoch": 982} {"train_loss": -20.984094619750977, "global_step": 81523, "epoch": 982} {"train_loss": -21.03537368774414, "global_step": 81524, "epoch": 982} {"train_loss": -21.07550811767578, "global_step": 81525, "epoch": 982} {"train_loss": -20.926424026489258, "global_step": 81526, "epoch": 982} {"train_loss": -21.067289352416992, "global_step": 81527, "epoch": 982} {"train_loss": -21.150985717773438, "global_step": 81528, "epoch": 982} {"train_loss": -20.97160530090332, "global_step": 81529, "epoch": 982} {"train_loss": -21.1872615814209, "global_step": 81530, "epoch": 982} {"train_loss": -20.865530014038086, "global_step": 81531, "epoch": 982} {"train_loss": -21.374441146850586, "global_step": 81532, "epoch": 982} {"train_loss": -20.656274795532227, "global_step": 81533, "epoch": 982} {"train_loss": -20.981287002563477, "global_step": 81534, "epoch": 982} {"train_loss": -21.591520309448242, "global_step": 81535, "epoch": 982} {"train_loss": -21.55905532836914, "global_step": 81536, "epoch": 982} {"train_loss": -21.06987953186035, "global_step": 81537, "epoch": 982} {"train_loss": -21.4299259185791, "global_step": 81538, "epoch": 982} {"train_loss": -21.357587814331055, "global_step": 81539, "epoch": 982} {"train_loss": -21.621692657470703, "global_step": 81540, "epoch": 982} {"train_loss": -21.297260284423828, "global_step": 81541, "epoch": 982} {"train_loss": -21.476327896118164, "global_step": 81542, "epoch": 982} {"train_loss": -21.487585067749023, "global_step": 81543, "epoch": 982} {"train_loss": -21.283803939819336, "global_step": 81544, "epoch": 982} {"train_loss": -21.502084732055664, "global_step": 81545, "epoch": 982} {"train_loss": -21.033124923706055, "global_step": 81546, "epoch": 982} {"train_loss": -21.756301879882812, "global_step": 81547, "epoch": 982} {"train_loss": -21.405521392822266, "global_step": 81548, "epoch": 982} {"train_loss": -21.296859741210938, "global_step": 81549, "epoch": 982} {"train_loss": -21.377790451049805, "global_step": 81550, "epoch": 982} {"train_loss": -21.878446578979492, "global_step": 81551, "epoch": 982} {"train_loss": -21.653215408325195, "global_step": 81552, "epoch": 982} {"train_loss": -21.4122314453125, "global_step": 81553, "epoch": 982} {"train_loss": -21.135204315185547, "global_step": 81554, "epoch": 982} {"train_loss": -21.566761016845703, "global_step": 81555, "epoch": 982} {"train_loss": -21.02147674560547, "global_step": 81556, "epoch": 982} {"train_loss": -21.23142433166504, "global_step": 81557, "epoch": 982} {"train_loss": -21.122180938720703, "global_step": 81558, "epoch": 982} {"train_loss": -21.614187240600586, "global_step": 81559, "epoch": 982} {"train_loss": -21.305936813354492, "global_step": 81560, "epoch": 982} {"train_loss": -21.048460006713867, "global_step": 81561, "epoch": 982} {"train_loss": -21.412212371826172, "global_step": 81562, "epoch": 982} {"train_loss": -21.1016845703125, "global_step": 81563, "epoch": 982} {"train_loss": -21.110198974609375, "global_step": 81564, "epoch": 982} {"train_loss": -21.02522087097168, "global_step": 81565, "epoch": 982} {"train_loss": -21.117685317993164, "global_step": 81566, "epoch": 982} {"train_loss": -20.9871883392334, "global_step": 81567, "epoch": 982} {"train_loss": -21.544572830200195, "global_step": 81568, "epoch": 982} {"train_loss": -21.29740333557129, "global_step": 81569, "epoch": 982} {"train_loss": -21.65076446533203, "global_step": 81570, "epoch": 982} {"train_loss": -21.316526412963867, "global_step": 81571, "epoch": 982} {"train_loss": -21.32754135131836, "global_step": 81572, "epoch": 982} {"train_loss": -21.641035079956055, "global_step": 81573, "epoch": 982} {"train_loss": -20.840198516845703, "global_step": 81574, "epoch": 982} {"train_loss": -21.418899536132812, "global_step": 81575, "epoch": 982} {"train_loss": -20.989521026611328, "global_step": 81576, "epoch": 982} {"train_loss": -21.568588256835938, "global_step": 81577, "epoch": 982} {"train_loss": -21.22174644470215, "global_step": 81578, "epoch": 982} {"train_loss": -21.71693229675293, "global_step": 81579, "epoch": 982} {"train_loss": -21.116987228393555, "global_step": 81580, "epoch": 982} {"train_loss": -21.202468872070312, "global_step": 81581, "epoch": 982} {"train_loss": -21.4145450592041, "global_step": 81582, "epoch": 982} {"train_loss": -21.441120147705078, "global_step": 81583, "epoch": 982} {"train_loss": -21.333721160888672, "global_step": 81584, "epoch": 982} {"train_loss": -21.362918853759766, "global_step": 81585, "epoch": 982} {"train_loss": -21.058374404907227, "global_step": 81586, "epoch": 982} {"train_loss": -21.267059326171875, "global_step": 81587, "epoch": 982} {"train_loss": -21.204804615802075, "global_step": 81588, "epoch": 982, "val_loss": 6047649.0} {"train_loss": -20.95670509338379, "global_step": 81589, "epoch": 983} {"train_loss": -20.943145751953125, "global_step": 81590, "epoch": 983} {"train_loss": -21.141748428344727, "global_step": 81591, "epoch": 983} {"train_loss": -20.93170738220215, "global_step": 81592, "epoch": 983} {"train_loss": -20.562509536743164, "global_step": 81593, "epoch": 983} {"train_loss": -20.922992706298828, "global_step": 81594, "epoch": 983} {"train_loss": -20.859304428100586, "global_step": 81595, "epoch": 983} {"train_loss": -20.851728439331055, "global_step": 81596, "epoch": 983} {"train_loss": -21.029251098632812, "global_step": 81597, "epoch": 983} {"train_loss": -21.162290573120117, "global_step": 81598, "epoch": 983} {"train_loss": -20.956815719604492, "global_step": 81599, "epoch": 983} {"train_loss": -21.29499053955078, "global_step": 81600, "epoch": 983} {"train_loss": -21.28671646118164, "global_step": 81601, "epoch": 983} {"train_loss": -20.984342575073242, "global_step": 81602, "epoch": 983} {"train_loss": -21.3907527923584, "global_step": 81603, "epoch": 983} {"train_loss": -20.705656051635742, "global_step": 81604, "epoch": 983} {"train_loss": -21.33875846862793, "global_step": 81605, "epoch": 983} {"train_loss": -21.466299057006836, "global_step": 81606, "epoch": 983} {"train_loss": -21.12386131286621, "global_step": 81607, "epoch": 983} {"train_loss": -21.52286148071289, "global_step": 81608, "epoch": 983} {"train_loss": -21.16434097290039, "global_step": 81609, "epoch": 983} {"train_loss": -21.41609001159668, "global_step": 81610, "epoch": 983} {"train_loss": -21.462387084960938, "global_step": 81611, "epoch": 983} {"train_loss": -20.91818618774414, "global_step": 81612, "epoch": 983} {"train_loss": -21.205280303955078, "global_step": 81613, "epoch": 983} {"train_loss": -20.842809677124023, "global_step": 81614, "epoch": 983} {"train_loss": -20.947589874267578, "global_step": 81615, "epoch": 983} {"train_loss": -21.278064727783203, "global_step": 81616, "epoch": 983} {"train_loss": -21.196353912353516, "global_step": 81617, "epoch": 983} {"train_loss": -21.09969139099121, "global_step": 81618, "epoch": 983} {"train_loss": -21.272968292236328, "global_step": 81619, "epoch": 983} {"train_loss": -21.545780181884766, "global_step": 81620, "epoch": 983} {"train_loss": -21.307701110839844, "global_step": 81621, "epoch": 983} {"train_loss": -21.077260971069336, "global_step": 81622, "epoch": 983} {"train_loss": -21.618154525756836, "global_step": 81623, "epoch": 983} {"train_loss": -21.313634872436523, "global_step": 81624, "epoch": 983} {"train_loss": -21.15743064880371, "global_step": 81625, "epoch": 983} {"train_loss": -21.45068359375, "global_step": 81626, "epoch": 983} {"train_loss": -21.480234146118164, "global_step": 81627, "epoch": 983} {"train_loss": -20.916410446166992, "global_step": 81628, "epoch": 983} {"train_loss": -21.232946395874023, "global_step": 81629, "epoch": 983} {"train_loss": -21.260379791259766, "global_step": 81630, "epoch": 983} {"train_loss": -21.389652252197266, "global_step": 81631, "epoch": 983} {"train_loss": -21.08323097229004, "global_step": 81632, "epoch": 983} {"train_loss": -21.298120498657227, "global_step": 81633, "epoch": 983} {"train_loss": -21.08810043334961, "global_step": 81634, "epoch": 983} {"train_loss": -21.397932052612305, "global_step": 81635, "epoch": 983} {"train_loss": -21.64565086364746, "global_step": 81636, "epoch": 983} {"train_loss": -21.41986083984375, "global_step": 81637, "epoch": 983} {"train_loss": -21.508834838867188, "global_step": 81638, "epoch": 983} {"train_loss": -21.30246925354004, "global_step": 81639, "epoch": 983} {"train_loss": -21.300020217895508, "global_step": 81640, "epoch": 983} {"train_loss": -21.417814254760742, "global_step": 81641, "epoch": 983} {"train_loss": -21.66132926940918, "global_step": 81642, "epoch": 983} {"train_loss": -21.714414596557617, "global_step": 81643, "epoch": 983} {"train_loss": -21.1551456451416, "global_step": 81644, "epoch": 983} {"train_loss": -21.31325340270996, "global_step": 81645, "epoch": 983} {"train_loss": -21.304492950439453, "global_step": 81646, "epoch": 983} {"train_loss": -21.28580093383789, "global_step": 81647, "epoch": 983} {"train_loss": -21.669239044189453, "global_step": 81648, "epoch": 983} {"train_loss": -21.571853637695312, "global_step": 81649, "epoch": 983} {"train_loss": -21.575088500976562, "global_step": 81650, "epoch": 983} {"train_loss": -21.171934127807617, "global_step": 81651, "epoch": 983} {"train_loss": -21.257286071777344, "global_step": 81652, "epoch": 983} {"train_loss": -21.893817901611328, "global_step": 81653, "epoch": 983} {"train_loss": -21.19208335876465, "global_step": 81654, "epoch": 983} {"train_loss": -21.219968795776367, "global_step": 81655, "epoch": 983} {"train_loss": -21.14801788330078, "global_step": 81656, "epoch": 983} {"train_loss": -21.683948516845703, "global_step": 81657, "epoch": 983} {"train_loss": -21.414688110351562, "global_step": 81658, "epoch": 983} {"train_loss": -21.442628860473633, "global_step": 81659, "epoch": 983} {"train_loss": -21.60660743713379, "global_step": 81660, "epoch": 983} {"train_loss": -20.959583282470703, "global_step": 81661, "epoch": 983} {"train_loss": -21.281362533569336, "global_step": 81662, "epoch": 983} {"train_loss": -21.4043025970459, "global_step": 81663, "epoch": 983} {"train_loss": -21.370412826538086, "global_step": 81664, "epoch": 983} {"train_loss": -21.00196647644043, "global_step": 81665, "epoch": 983} {"train_loss": -21.45947265625, "global_step": 81666, "epoch": 983} {"train_loss": -21.11060905456543, "global_step": 81667, "epoch": 983} {"train_loss": -21.199777603149414, "global_step": 81668, "epoch": 983} {"train_loss": -20.8585262298584, "global_step": 81669, "epoch": 983} {"train_loss": -21.315866470336914, "global_step": 81670, "epoch": 983} {"train_loss": -21.246303765170545, "global_step": 81671, "epoch": 983, "val_loss": 6114636.5} {"train_loss": -20.527822494506836, "global_step": 81672, "epoch": 984} {"train_loss": -21.11567497253418, "global_step": 81673, "epoch": 984} {"train_loss": -21.1028995513916, "global_step": 81674, "epoch": 984} {"train_loss": -21.072202682495117, "global_step": 81675, "epoch": 984} {"train_loss": -21.051177978515625, "global_step": 81676, "epoch": 984} {"train_loss": -20.97023582458496, "global_step": 81677, "epoch": 984} {"train_loss": -20.825841903686523, "global_step": 81678, "epoch": 984} {"train_loss": -20.947269439697266, "global_step": 81679, "epoch": 984} {"train_loss": -21.376821517944336, "global_step": 81680, "epoch": 984} {"train_loss": -21.14625358581543, "global_step": 81681, "epoch": 984} {"train_loss": -21.11266326904297, "global_step": 81682, "epoch": 984} {"train_loss": -21.520299911499023, "global_step": 81683, "epoch": 984} {"train_loss": -21.304983139038086, "global_step": 81684, "epoch": 984} {"train_loss": -20.96820640563965, "global_step": 81685, "epoch": 984} {"train_loss": -20.97412109375, "global_step": 81686, "epoch": 984} {"train_loss": -21.208593368530273, "global_step": 81687, "epoch": 984} {"train_loss": -21.376028060913086, "global_step": 81688, "epoch": 984} {"train_loss": -21.11794090270996, "global_step": 81689, "epoch": 984} {"train_loss": -21.428571701049805, "global_step": 81690, "epoch": 984} {"train_loss": -21.603097915649414, "global_step": 81691, "epoch": 984} {"train_loss": -20.975622177124023, "global_step": 81692, "epoch": 984} {"train_loss": -21.235614776611328, "global_step": 81693, "epoch": 984} {"train_loss": -21.434894561767578, "global_step": 81694, "epoch": 984} {"train_loss": -21.10001564025879, "global_step": 81695, "epoch": 984} {"train_loss": -21.032358169555664, "global_step": 81696, "epoch": 984} {"train_loss": -21.231355667114258, "global_step": 81697, "epoch": 984} {"train_loss": -21.142765045166016, "global_step": 81698, "epoch": 984} {"train_loss": -21.346158981323242, "global_step": 81699, "epoch": 984} {"train_loss": -21.37129020690918, "global_step": 81700, "epoch": 984} {"train_loss": -21.19887351989746, "global_step": 81701, "epoch": 984} {"train_loss": -21.157278060913086, "global_step": 81702, "epoch": 984} {"train_loss": -21.47763442993164, "global_step": 81703, "epoch": 984} {"train_loss": -21.291677474975586, "global_step": 81704, "epoch": 984} {"train_loss": -21.307540893554688, "global_step": 81705, "epoch": 984} {"train_loss": -21.2850341796875, "global_step": 81706, "epoch": 984} {"train_loss": -20.776844024658203, "global_step": 81707, "epoch": 984} {"train_loss": -21.209503173828125, "global_step": 81708, "epoch": 984} {"train_loss": -21.409711837768555, "global_step": 81709, "epoch": 984} {"train_loss": -21.62023162841797, "global_step": 81710, "epoch": 984} {"train_loss": -21.027013778686523, "global_step": 81711, "epoch": 984} {"train_loss": -21.42056655883789, "global_step": 81712, "epoch": 984} {"train_loss": -21.61826515197754, "global_step": 81713, "epoch": 984} {"train_loss": -21.435640335083008, "global_step": 81714, "epoch": 984} {"train_loss": -21.38252067565918, "global_step": 81715, "epoch": 984} {"train_loss": -21.21796989440918, "global_step": 81716, "epoch": 984} {"train_loss": -20.705398559570312, "global_step": 81717, "epoch": 984} {"train_loss": -21.155643463134766, "global_step": 81718, "epoch": 984} {"train_loss": -21.318979263305664, "global_step": 81719, "epoch": 984} {"train_loss": -21.269733428955078, "global_step": 81720, "epoch": 984} {"train_loss": -21.32411766052246, "global_step": 81721, "epoch": 984} {"train_loss": -21.026123046875, "global_step": 81722, "epoch": 984} {"train_loss": -20.905790328979492, "global_step": 81723, "epoch": 984} {"train_loss": -21.557661056518555, "global_step": 81724, "epoch": 984} {"train_loss": -21.682254791259766, "global_step": 81725, "epoch": 984} {"train_loss": -21.267309188842773, "global_step": 81726, "epoch": 984} {"train_loss": -20.964691162109375, "global_step": 81727, "epoch": 984} {"train_loss": -21.2838191986084, "global_step": 81728, "epoch": 984} {"train_loss": -21.342500686645508, "global_step": 81729, "epoch": 984} {"train_loss": -21.293684005737305, "global_step": 81730, "epoch": 984} {"train_loss": -21.388914108276367, "global_step": 81731, "epoch": 984} {"train_loss": -21.191577911376953, "global_step": 81732, "epoch": 984} {"train_loss": -20.941547393798828, "global_step": 81733, "epoch": 984} {"train_loss": -21.163463592529297, "global_step": 81734, "epoch": 984} {"train_loss": -21.33853530883789, "global_step": 81735, "epoch": 984} {"train_loss": -21.174949645996094, "global_step": 81736, "epoch": 984} {"train_loss": -21.369781494140625, "global_step": 81737, "epoch": 984} {"train_loss": -21.376728057861328, "global_step": 81738, "epoch": 984} {"train_loss": -21.36830711364746, "global_step": 81739, "epoch": 984} {"train_loss": -21.52198600769043, "global_step": 81740, "epoch": 984} {"train_loss": -21.289657592773438, "global_step": 81741, "epoch": 984} {"train_loss": -21.485788345336914, "global_step": 81742, "epoch": 984} {"train_loss": -21.0538387298584, "global_step": 81743, "epoch": 984} {"train_loss": -21.189298629760742, "global_step": 81744, "epoch": 984} {"train_loss": -21.200803756713867, "global_step": 81745, "epoch": 984} {"train_loss": -21.062015533447266, "global_step": 81746, "epoch": 984} {"train_loss": -21.34421730041504, "global_step": 81747, "epoch": 984} {"train_loss": -21.41681480407715, "global_step": 81748, "epoch": 984} {"train_loss": -21.383848190307617, "global_step": 81749, "epoch": 984} {"train_loss": -21.454017639160156, "global_step": 81750, "epoch": 984} {"train_loss": -21.373098373413086, "global_step": 81751, "epoch": 984} {"train_loss": -21.1268253326416, "global_step": 81752, "epoch": 984} {"train_loss": -21.404376983642578, "global_step": 81753, "epoch": 984} {"train_loss": -21.23673967568271, "global_step": 81754, "epoch": 984, "val_loss": 6205953.5} {"train_loss": -20.973142623901367, "global_step": 81755, "epoch": 985} {"train_loss": -21.173242568969727, "global_step": 81756, "epoch": 985} {"train_loss": -21.194929122924805, "global_step": 81757, "epoch": 985} {"train_loss": -21.071203231811523, "global_step": 81758, "epoch": 985} {"train_loss": -20.777820587158203, "global_step": 81759, "epoch": 985} {"train_loss": -20.863073348999023, "global_step": 81760, "epoch": 985} {"train_loss": -21.19221305847168, "global_step": 81761, "epoch": 985} {"train_loss": -20.997730255126953, "global_step": 81762, "epoch": 985} {"train_loss": -20.914024353027344, "global_step": 81763, "epoch": 985} {"train_loss": -20.908170700073242, "global_step": 81764, "epoch": 985} {"train_loss": -21.360570907592773, "global_step": 81765, "epoch": 985} {"train_loss": -21.470388412475586, "global_step": 81766, "epoch": 985} {"train_loss": -21.13235855102539, "global_step": 81767, "epoch": 985} {"train_loss": -21.246763229370117, "global_step": 81768, "epoch": 985} {"train_loss": -21.651657104492188, "global_step": 81769, "epoch": 985} {"train_loss": -21.3553466796875, "global_step": 81770, "epoch": 985} {"train_loss": -20.960391998291016, "global_step": 81771, "epoch": 985} {"train_loss": -20.798748016357422, "global_step": 81772, "epoch": 985} {"train_loss": -21.469192504882812, "global_step": 81773, "epoch": 985} {"train_loss": -21.17677879333496, "global_step": 81774, "epoch": 985} {"train_loss": -21.170759201049805, "global_step": 81775, "epoch": 985} {"train_loss": -21.0579891204834, "global_step": 81776, "epoch": 985} {"train_loss": -21.282197952270508, "global_step": 81777, "epoch": 985} {"train_loss": -21.23900032043457, "global_step": 81778, "epoch": 985} {"train_loss": -21.163267135620117, "global_step": 81779, "epoch": 985} {"train_loss": -21.221567153930664, "global_step": 81780, "epoch": 985} {"train_loss": -21.078418731689453, "global_step": 81781, "epoch": 985} {"train_loss": -21.308618545532227, "global_step": 81782, "epoch": 985} {"train_loss": -20.934492111206055, "global_step": 81783, "epoch": 985} {"train_loss": -21.412891387939453, "global_step": 81784, "epoch": 985} {"train_loss": -21.34916114807129, "global_step": 81785, "epoch": 985} {"train_loss": -21.00168800354004, "global_step": 81786, "epoch": 985} {"train_loss": -21.13776206970215, "global_step": 81787, "epoch": 985} {"train_loss": -21.50724220275879, "global_step": 81788, "epoch": 985} {"train_loss": -20.852689743041992, "global_step": 81789, "epoch": 985} {"train_loss": -21.31977653503418, "global_step": 81790, "epoch": 985} {"train_loss": -21.29217529296875, "global_step": 81791, "epoch": 985} {"train_loss": -21.89139747619629, "global_step": 81792, "epoch": 985} {"train_loss": -20.978160858154297, "global_step": 81793, "epoch": 985} {"train_loss": -21.374019622802734, "global_step": 81794, "epoch": 985} {"train_loss": -21.12214469909668, "global_step": 81795, "epoch": 985} {"train_loss": -21.53505516052246, "global_step": 81796, "epoch": 985} {"train_loss": -21.367826461791992, "global_step": 81797, "epoch": 985} {"train_loss": -21.204547882080078, "global_step": 81798, "epoch": 985} {"train_loss": -21.07917594909668, "global_step": 81799, "epoch": 985} {"train_loss": -21.544025421142578, "global_step": 81800, "epoch": 985} {"train_loss": -21.527456283569336, "global_step": 81801, "epoch": 985} {"train_loss": -21.235776901245117, "global_step": 81802, "epoch": 985} {"train_loss": -21.36275863647461, "global_step": 81803, "epoch": 985} {"train_loss": -21.51877784729004, "global_step": 81804, "epoch": 985} {"train_loss": -21.49072265625, "global_step": 81805, "epoch": 985} {"train_loss": -21.376510620117188, "global_step": 81806, "epoch": 985} {"train_loss": -21.22710609436035, "global_step": 81807, "epoch": 985} {"train_loss": -21.294095993041992, "global_step": 81808, "epoch": 985} {"train_loss": -20.998136520385742, "global_step": 81809, "epoch": 985} {"train_loss": -21.277055740356445, "global_step": 81810, "epoch": 985} {"train_loss": -21.466388702392578, "global_step": 81811, "epoch": 985} {"train_loss": -21.262680053710938, "global_step": 81812, "epoch": 985} {"train_loss": -21.16191291809082, "global_step": 81813, "epoch": 985} {"train_loss": -21.57621955871582, "global_step": 81814, "epoch": 985} {"train_loss": -21.20522117614746, "global_step": 81815, "epoch": 985} {"train_loss": -21.534486770629883, "global_step": 81816, "epoch": 985} {"train_loss": -21.458253860473633, "global_step": 81817, "epoch": 985} {"train_loss": -21.43670082092285, "global_step": 81818, "epoch": 985} {"train_loss": -21.37676429748535, "global_step": 81819, "epoch": 985} {"train_loss": -21.250953674316406, "global_step": 81820, "epoch": 985} {"train_loss": -21.45872688293457, "global_step": 81821, "epoch": 985} {"train_loss": -21.623632431030273, "global_step": 81822, "epoch": 985} {"train_loss": -21.040515899658203, "global_step": 81823, "epoch": 985} {"train_loss": -21.415695190429688, "global_step": 81824, "epoch": 985} {"train_loss": -21.455991744995117, "global_step": 81825, "epoch": 985} {"train_loss": -21.35530662536621, "global_step": 81826, "epoch": 985} {"train_loss": -21.30926513671875, "global_step": 81827, "epoch": 985} {"train_loss": -21.486459732055664, "global_step": 81828, "epoch": 985} {"train_loss": -21.230255126953125, "global_step": 81829, "epoch": 985} {"train_loss": -21.57786750793457, "global_step": 81830, "epoch": 985} {"train_loss": -21.46786117553711, "global_step": 81831, "epoch": 985} {"train_loss": -21.321081161499023, "global_step": 81832, "epoch": 985} {"train_loss": -21.241743087768555, "global_step": 81833, "epoch": 985} {"train_loss": -21.387956619262695, "global_step": 81834, "epoch": 985} {"train_loss": -21.53580093383789, "global_step": 81835, "epoch": 985} {"train_loss": -21.512861251831055, "global_step": 81836, "epoch": 985} {"train_loss": -21.278173216854235, "global_step": 81837, "epoch": 985, "val_loss": 6065858.0} {"train_loss": -21.033235549926758, "global_step": 81838, "epoch": 986} {"train_loss": -20.794864654541016, "global_step": 81839, "epoch": 986} {"train_loss": -20.94794273376465, "global_step": 81840, "epoch": 986} {"train_loss": -20.80658531188965, "global_step": 81841, "epoch": 986} {"train_loss": -21.162443161010742, "global_step": 81842, "epoch": 986} {"train_loss": -21.24800682067871, "global_step": 81843, "epoch": 986} {"train_loss": -21.423892974853516, "global_step": 81844, "epoch": 986} {"train_loss": -20.892322540283203, "global_step": 81845, "epoch": 986} {"train_loss": -21.252838134765625, "global_step": 81846, "epoch": 986} {"train_loss": -21.479740142822266, "global_step": 81847, "epoch": 986} {"train_loss": -21.287490844726562, "global_step": 81848, "epoch": 986} {"train_loss": -21.4019718170166, "global_step": 81849, "epoch": 986} {"train_loss": -21.224994659423828, "global_step": 81850, "epoch": 986} {"train_loss": -21.129770278930664, "global_step": 81851, "epoch": 986} {"train_loss": -21.396787643432617, "global_step": 81852, "epoch": 986} {"train_loss": -21.35032081604004, "global_step": 81853, "epoch": 986} {"train_loss": -21.2203311920166, "global_step": 81854, "epoch": 986} {"train_loss": -21.23597526550293, "global_step": 81855, "epoch": 986} {"train_loss": -21.460973739624023, "global_step": 81856, "epoch": 986} {"train_loss": -21.140836715698242, "global_step": 81857, "epoch": 986} {"train_loss": -21.62493324279785, "global_step": 81858, "epoch": 986} {"train_loss": -21.27505111694336, "global_step": 81859, "epoch": 986} {"train_loss": -21.61261558532715, "global_step": 81860, "epoch": 986} {"train_loss": -20.820058822631836, "global_step": 81861, "epoch": 986} {"train_loss": -21.80277442932129, "global_step": 81862, "epoch": 986} {"train_loss": -21.147104263305664, "global_step": 81863, "epoch": 986} {"train_loss": -21.1815185546875, "global_step": 81864, "epoch": 986} {"train_loss": -21.67816734313965, "global_step": 81865, "epoch": 986} {"train_loss": -21.158811569213867, "global_step": 81866, "epoch": 986} {"train_loss": -21.17119598388672, "global_step": 81867, "epoch": 986} {"train_loss": -21.312292098999023, "global_step": 81868, "epoch": 986} {"train_loss": -21.245071411132812, "global_step": 81869, "epoch": 986} {"train_loss": -21.443832397460938, "global_step": 81870, "epoch": 986} {"train_loss": -21.753665924072266, "global_step": 81871, "epoch": 986} {"train_loss": -21.248838424682617, "global_step": 81872, "epoch": 986} {"train_loss": -21.323257446289062, "global_step": 81873, "epoch": 986} {"train_loss": -21.37640953063965, "global_step": 81874, "epoch": 986} {"train_loss": -21.367477416992188, "global_step": 81875, "epoch": 986} {"train_loss": -21.274045944213867, "global_step": 81876, "epoch": 986} {"train_loss": -21.387605667114258, "global_step": 81877, "epoch": 986} {"train_loss": -21.548389434814453, "global_step": 81878, "epoch": 986} {"train_loss": -21.303363800048828, "global_step": 81879, "epoch": 986} {"train_loss": -21.330148696899414, "global_step": 81880, "epoch": 986} {"train_loss": -21.65428924560547, "global_step": 81881, "epoch": 986} {"train_loss": -21.53559684753418, "global_step": 81882, "epoch": 986} {"train_loss": -21.33833885192871, "global_step": 81883, "epoch": 986} {"train_loss": -21.132780075073242, "global_step": 81884, "epoch": 986} {"train_loss": -21.424501419067383, "global_step": 81885, "epoch": 986} {"train_loss": -21.133651733398438, "global_step": 81886, "epoch": 986} {"train_loss": -21.393075942993164, "global_step": 81887, "epoch": 986} {"train_loss": -21.290212631225586, "global_step": 81888, "epoch": 986} {"train_loss": -21.363292694091797, "global_step": 81889, "epoch": 986} {"train_loss": -21.21420669555664, "global_step": 81890, "epoch": 986} {"train_loss": -21.240449905395508, "global_step": 81891, "epoch": 986} {"train_loss": -21.1419677734375, "global_step": 81892, "epoch": 986} {"train_loss": -21.185617446899414, "global_step": 81893, "epoch": 986} {"train_loss": -21.510459899902344, "global_step": 81894, "epoch": 986} {"train_loss": -21.24300765991211, "global_step": 81895, "epoch": 986} {"train_loss": -21.6966609954834, "global_step": 81896, "epoch": 986} {"train_loss": -21.057876586914062, "global_step": 81897, "epoch": 986} {"train_loss": -21.27601432800293, "global_step": 81898, "epoch": 986} {"train_loss": -21.28223419189453, "global_step": 81899, "epoch": 986} {"train_loss": -21.49388885498047, "global_step": 81900, "epoch": 986} {"train_loss": -21.322343826293945, "global_step": 81901, "epoch": 986} {"train_loss": -21.04673957824707, "global_step": 81902, "epoch": 986} {"train_loss": -21.35097312927246, "global_step": 81903, "epoch": 986} {"train_loss": -21.488344192504883, "global_step": 81904, "epoch": 986} {"train_loss": -21.22699546813965, "global_step": 81905, "epoch": 986} {"train_loss": -21.422163009643555, "global_step": 81906, "epoch": 986} {"train_loss": -21.34481430053711, "global_step": 81907, "epoch": 986} {"train_loss": -21.22141456604004, "global_step": 81908, "epoch": 986} {"train_loss": -21.320188522338867, "global_step": 81909, "epoch": 986} {"train_loss": -21.379894256591797, "global_step": 81910, "epoch": 986} {"train_loss": -21.082380294799805, "global_step": 81911, "epoch": 986} {"train_loss": -21.067495346069336, "global_step": 81912, "epoch": 986} {"train_loss": -21.38985252380371, "global_step": 81913, "epoch": 986} {"train_loss": -21.403928756713867, "global_step": 81914, "epoch": 986} {"train_loss": -21.63565444946289, "global_step": 81915, "epoch": 986} {"train_loss": -21.358768463134766, "global_step": 81916, "epoch": 986} {"train_loss": -21.37776756286621, "global_step": 81917, "epoch": 986} {"train_loss": -21.42157554626465, "global_step": 81918, "epoch": 986} {"train_loss": -21.031021118164062, "global_step": 81919, "epoch": 986} {"train_loss": -21.294857898390436, "global_step": 81920, "epoch": 986, "val_loss": 5986093.0} {"train_loss": -21.087745666503906, "global_step": 81921, "epoch": 987} {"train_loss": -21.29001235961914, "global_step": 81922, "epoch": 987} {"train_loss": -21.009124755859375, "global_step": 81923, "epoch": 987} {"train_loss": -21.042356491088867, "global_step": 81924, "epoch": 987} {"train_loss": -21.391372680664062, "global_step": 81925, "epoch": 987} {"train_loss": -21.406034469604492, "global_step": 81926, "epoch": 987} {"train_loss": -21.062753677368164, "global_step": 81927, "epoch": 987} {"train_loss": -21.227909088134766, "global_step": 81928, "epoch": 987} {"train_loss": -21.149860382080078, "global_step": 81929, "epoch": 987} {"train_loss": -20.984817504882812, "global_step": 81930, "epoch": 987} {"train_loss": -21.358911514282227, "global_step": 81931, "epoch": 987} {"train_loss": -21.24460792541504, "global_step": 81932, "epoch": 987} {"train_loss": -21.2092342376709, "global_step": 81933, "epoch": 987} {"train_loss": -21.030303955078125, "global_step": 81934, "epoch": 987} {"train_loss": -21.100698471069336, "global_step": 81935, "epoch": 987} {"train_loss": -21.299591064453125, "global_step": 81936, "epoch": 987} {"train_loss": -21.356962203979492, "global_step": 81937, "epoch": 987} {"train_loss": -21.063703536987305, "global_step": 81938, "epoch": 987} {"train_loss": -21.081436157226562, "global_step": 81939, "epoch": 987} {"train_loss": -21.5801944732666, "global_step": 81940, "epoch": 987} {"train_loss": -21.33455467224121, "global_step": 81941, "epoch": 987} {"train_loss": -21.435651779174805, "global_step": 81942, "epoch": 987} {"train_loss": -21.32883071899414, "global_step": 81943, "epoch": 987} {"train_loss": -21.489730834960938, "global_step": 81944, "epoch": 987} {"train_loss": -21.709854125976562, "global_step": 81945, "epoch": 987} {"train_loss": -21.568115234375, "global_step": 81946, "epoch": 987} {"train_loss": -21.30647850036621, "global_step": 81947, "epoch": 987} {"train_loss": -21.188302993774414, "global_step": 81948, "epoch": 987} {"train_loss": -21.082447052001953, "global_step": 81949, "epoch": 987} {"train_loss": -21.263198852539062, "global_step": 81950, "epoch": 987} {"train_loss": -21.323345184326172, "global_step": 81951, "epoch": 987} {"train_loss": -21.235721588134766, "global_step": 81952, "epoch": 987} {"train_loss": -21.248769760131836, "global_step": 81953, "epoch": 987} {"train_loss": -21.734710693359375, "global_step": 81954, "epoch": 987} {"train_loss": -21.566598892211914, "global_step": 81955, "epoch": 987} {"train_loss": -21.24576187133789, "global_step": 81956, "epoch": 987} {"train_loss": -21.40222930908203, "global_step": 81957, "epoch": 987} {"train_loss": -21.079179763793945, "global_step": 81958, "epoch": 987} {"train_loss": -21.613040924072266, "global_step": 81959, "epoch": 987} {"train_loss": -21.148399353027344, "global_step": 81960, "epoch": 987} {"train_loss": -21.182472229003906, "global_step": 81961, "epoch": 987} {"train_loss": -21.24286460876465, "global_step": 81962, "epoch": 987} {"train_loss": -21.56495475769043, "global_step": 81963, "epoch": 987} {"train_loss": -20.831212997436523, "global_step": 81964, "epoch": 987} {"train_loss": -21.00934410095215, "global_step": 81965, "epoch": 987} {"train_loss": -20.844627380371094, "global_step": 81966, "epoch": 987} {"train_loss": -21.463918685913086, "global_step": 81967, "epoch": 987} {"train_loss": -21.289575576782227, "global_step": 81968, "epoch": 987} {"train_loss": -21.033605575561523, "global_step": 81969, "epoch": 987} {"train_loss": -21.37419891357422, "global_step": 81970, "epoch": 987} {"train_loss": -21.38059425354004, "global_step": 81971, "epoch": 987} {"train_loss": -21.11722755432129, "global_step": 81972, "epoch": 987} {"train_loss": -21.275733947753906, "global_step": 81973, "epoch": 987} {"train_loss": -21.383102416992188, "global_step": 81974, "epoch": 987} {"train_loss": -21.49778175354004, "global_step": 81975, "epoch": 987} {"train_loss": -21.066591262817383, "global_step": 81976, "epoch": 987} {"train_loss": -21.561281204223633, "global_step": 81977, "epoch": 987} {"train_loss": -21.205617904663086, "global_step": 81978, "epoch": 987} {"train_loss": -21.379764556884766, "global_step": 81979, "epoch": 987} {"train_loss": -21.440277099609375, "global_step": 81980, "epoch": 987} {"train_loss": -21.41932487487793, "global_step": 81981, "epoch": 987} {"train_loss": -21.080732345581055, "global_step": 81982, "epoch": 987} {"train_loss": -21.071069717407227, "global_step": 81983, "epoch": 987} {"train_loss": -21.384952545166016, "global_step": 81984, "epoch": 987} {"train_loss": -21.59031867980957, "global_step": 81985, "epoch": 987} {"train_loss": -21.48744773864746, "global_step": 81986, "epoch": 987} {"train_loss": -21.61850929260254, "global_step": 81987, "epoch": 987} {"train_loss": -21.668493270874023, "global_step": 81988, "epoch": 987} {"train_loss": -21.331850051879883, "global_step": 81989, "epoch": 987} {"train_loss": -21.649106979370117, "global_step": 81990, "epoch": 987} {"train_loss": -21.143789291381836, "global_step": 81991, "epoch": 987} {"train_loss": -21.422040939331055, "global_step": 81992, "epoch": 987} {"train_loss": -21.465927124023438, "global_step": 81993, "epoch": 987} {"train_loss": -21.092466354370117, "global_step": 81994, "epoch": 987} {"train_loss": -21.343826293945312, "global_step": 81995, "epoch": 987} {"train_loss": -21.405099868774414, "global_step": 81996, "epoch": 987} {"train_loss": -21.18739128112793, "global_step": 81997, "epoch": 987} {"train_loss": -21.498750686645508, "global_step": 81998, "epoch": 987} {"train_loss": -21.210378646850586, "global_step": 81999, "epoch": 987} {"train_loss": -20.95660972595215, "global_step": 82000, "epoch": 987} {"train_loss": -21.173484802246094, "global_step": 82001, "epoch": 987} {"train_loss": -20.919424057006836, "global_step": 82002, "epoch": 987} {"train_loss": -21.280793086591974, "global_step": 82003, "epoch": 987, "val_loss": 6062729.0} {"train_loss": -21.63252067565918, "global_step": 82004, "epoch": 988} {"train_loss": -20.85594367980957, "global_step": 82005, "epoch": 988} {"train_loss": -21.04571533203125, "global_step": 82006, "epoch": 988} {"train_loss": -20.95806312561035, "global_step": 82007, "epoch": 988} {"train_loss": -20.973852157592773, "global_step": 82008, "epoch": 988} {"train_loss": -20.723840713500977, "global_step": 82009, "epoch": 988} {"train_loss": -21.014545440673828, "global_step": 82010, "epoch": 988} {"train_loss": -21.145557403564453, "global_step": 82011, "epoch": 988} {"train_loss": -21.114288330078125, "global_step": 82012, "epoch": 988} {"train_loss": -21.38241195678711, "global_step": 82013, "epoch": 988} {"train_loss": -21.253828048706055, "global_step": 82014, "epoch": 988} {"train_loss": -21.42374610900879, "global_step": 82015, "epoch": 988} {"train_loss": -21.402109146118164, "global_step": 82016, "epoch": 988} {"train_loss": -21.07619857788086, "global_step": 82017, "epoch": 988} {"train_loss": -21.48879051208496, "global_step": 82018, "epoch": 988} {"train_loss": -20.855802536010742, "global_step": 82019, "epoch": 988} {"train_loss": -21.147872924804688, "global_step": 82020, "epoch": 988} {"train_loss": -21.366235733032227, "global_step": 82021, "epoch": 988} {"train_loss": -21.33736801147461, "global_step": 82022, "epoch": 988} {"train_loss": -21.516836166381836, "global_step": 82023, "epoch": 988} {"train_loss": -21.03736686706543, "global_step": 82024, "epoch": 988} {"train_loss": -21.453699111938477, "global_step": 82025, "epoch": 988} {"train_loss": -21.190067291259766, "global_step": 82026, "epoch": 988} {"train_loss": -21.237489700317383, "global_step": 82027, "epoch": 988} {"train_loss": -20.936574935913086, "global_step": 82028, "epoch": 988} {"train_loss": -21.320022583007812, "global_step": 82029, "epoch": 988} {"train_loss": -21.264551162719727, "global_step": 82030, "epoch": 988} {"train_loss": -21.287368774414062, "global_step": 82031, "epoch": 988} {"train_loss": -21.267148971557617, "global_step": 82032, "epoch": 988} {"train_loss": -21.44195556640625, "global_step": 82033, "epoch": 988} {"train_loss": -21.49724578857422, "global_step": 82034, "epoch": 988} {"train_loss": -20.92532730102539, "global_step": 82035, "epoch": 988} {"train_loss": -21.53342056274414, "global_step": 82036, "epoch": 988} {"train_loss": -21.39554214477539, "global_step": 82037, "epoch": 988} {"train_loss": -21.262474060058594, "global_step": 82038, "epoch": 988} {"train_loss": -20.978958129882812, "global_step": 82039, "epoch": 988} {"train_loss": -21.41412353515625, "global_step": 82040, "epoch": 988} {"train_loss": -21.105690002441406, "global_step": 82041, "epoch": 988} {"train_loss": -21.025846481323242, "global_step": 82042, "epoch": 988} {"train_loss": -21.107860565185547, "global_step": 82043, "epoch": 988} {"train_loss": -21.66009521484375, "global_step": 82044, "epoch": 988} {"train_loss": -21.384946823120117, "global_step": 82045, "epoch": 988} {"train_loss": -21.473237991333008, "global_step": 82046, "epoch": 988} {"train_loss": -20.991716384887695, "global_step": 82047, "epoch": 988} {"train_loss": -21.37735939025879, "global_step": 82048, "epoch": 988} {"train_loss": -21.4265193939209, "global_step": 82049, "epoch": 988} {"train_loss": -21.3729190826416, "global_step": 82050, "epoch": 988} {"train_loss": -21.519922256469727, "global_step": 82051, "epoch": 988} {"train_loss": -21.22327995300293, "global_step": 82052, "epoch": 988} {"train_loss": -21.4378662109375, "global_step": 82053, "epoch": 988} {"train_loss": -20.873014450073242, "global_step": 82054, "epoch": 988} {"train_loss": -20.85521697998047, "global_step": 82055, "epoch": 988} {"train_loss": -21.177085876464844, "global_step": 82056, "epoch": 988} {"train_loss": -21.155033111572266, "global_step": 82057, "epoch": 988} {"train_loss": -21.519363403320312, "global_step": 82058, "epoch": 988} {"train_loss": -21.52027130126953, "global_step": 82059, "epoch": 988} {"train_loss": -21.49072265625, "global_step": 82060, "epoch": 988} {"train_loss": -21.11494255065918, "global_step": 82061, "epoch": 988} {"train_loss": -21.33955955505371, "global_step": 82062, "epoch": 988} {"train_loss": -21.395963668823242, "global_step": 82063, "epoch": 988} {"train_loss": -20.843862533569336, "global_step": 82064, "epoch": 988} {"train_loss": -21.326730728149414, "global_step": 82065, "epoch": 988} {"train_loss": -20.917123794555664, "global_step": 82066, "epoch": 988} {"train_loss": -21.172658920288086, "global_step": 82067, "epoch": 988} {"train_loss": -21.299320220947266, "global_step": 82068, "epoch": 988} {"train_loss": -21.364858627319336, "global_step": 82069, "epoch": 988} {"train_loss": -21.161535263061523, "global_step": 82070, "epoch": 988} {"train_loss": -21.161184310913086, "global_step": 82071, "epoch": 988} {"train_loss": -21.270099639892578, "global_step": 82072, "epoch": 988} {"train_loss": -21.245058059692383, "global_step": 82073, "epoch": 988} {"train_loss": -21.189603805541992, "global_step": 82074, "epoch": 988} {"train_loss": -21.31839942932129, "global_step": 82075, "epoch": 988} {"train_loss": -21.2568302154541, "global_step": 82076, "epoch": 988} {"train_loss": -21.27760124206543, "global_step": 82077, "epoch": 988} {"train_loss": -21.547489166259766, "global_step": 82078, "epoch": 988} {"train_loss": -21.44685935974121, "global_step": 82079, "epoch": 988} {"train_loss": -21.37554359436035, "global_step": 82080, "epoch": 988} {"train_loss": -21.317235946655273, "global_step": 82081, "epoch": 988} {"train_loss": -21.31711769104004, "global_step": 82082, "epoch": 988} {"train_loss": -21.19656753540039, "global_step": 82083, "epoch": 988} {"train_loss": -21.20490837097168, "global_step": 82084, "epoch": 988} {"train_loss": -21.10424041748047, "global_step": 82085, "epoch": 988} {"train_loss": -21.2474835177502, "global_step": 82086, "epoch": 988, "val_loss": 6085658.5} {"train_loss": -20.85361099243164, "global_step": 82087, "epoch": 989} {"train_loss": -20.986045837402344, "global_step": 82088, "epoch": 989} {"train_loss": -20.97811508178711, "global_step": 82089, "epoch": 989} {"train_loss": -20.903867721557617, "global_step": 82090, "epoch": 989} {"train_loss": -20.7357234954834, "global_step": 82091, "epoch": 989} {"train_loss": -21.414329528808594, "global_step": 82092, "epoch": 989} {"train_loss": -20.759796142578125, "global_step": 82093, "epoch": 989} {"train_loss": -21.409147262573242, "global_step": 82094, "epoch": 989} {"train_loss": -21.17542839050293, "global_step": 82095, "epoch": 989} {"train_loss": -21.16720199584961, "global_step": 82096, "epoch": 989} {"train_loss": -21.120298385620117, "global_step": 82097, "epoch": 989} {"train_loss": -20.92804718017578, "global_step": 82098, "epoch": 989} {"train_loss": -21.018863677978516, "global_step": 82099, "epoch": 989} {"train_loss": -21.398962020874023, "global_step": 82100, "epoch": 989} {"train_loss": -21.380081176757812, "global_step": 82101, "epoch": 989} {"train_loss": -21.36240005493164, "global_step": 82102, "epoch": 989} {"train_loss": -21.29043960571289, "global_step": 82103, "epoch": 989} {"train_loss": -21.456220626831055, "global_step": 82104, "epoch": 989} {"train_loss": -21.145559310913086, "global_step": 82105, "epoch": 989} {"train_loss": -21.468175888061523, "global_step": 82106, "epoch": 989} {"train_loss": -21.15003776550293, "global_step": 82107, "epoch": 989} {"train_loss": -21.187929153442383, "global_step": 82108, "epoch": 989} {"train_loss": -21.59693145751953, "global_step": 82109, "epoch": 989} {"train_loss": -21.44757652282715, "global_step": 82110, "epoch": 989} {"train_loss": -21.06256675720215, "global_step": 82111, "epoch": 989} {"train_loss": -21.598142623901367, "global_step": 82112, "epoch": 989} {"train_loss": -21.11411476135254, "global_step": 82113, "epoch": 989} {"train_loss": -21.068593978881836, "global_step": 82114, "epoch": 989} {"train_loss": -21.3126220703125, "global_step": 82115, "epoch": 989} {"train_loss": -21.53376007080078, "global_step": 82116, "epoch": 989} {"train_loss": -20.97515869140625, "global_step": 82117, "epoch": 989} {"train_loss": -21.444658279418945, "global_step": 82118, "epoch": 989} {"train_loss": -21.12175750732422, "global_step": 82119, "epoch": 989} {"train_loss": -21.26800537109375, "global_step": 82120, "epoch": 989} {"train_loss": -21.36744499206543, "global_step": 82121, "epoch": 989} {"train_loss": -20.819414138793945, "global_step": 82122, "epoch": 989} {"train_loss": -21.309858322143555, "global_step": 82123, "epoch": 989} {"train_loss": -21.326141357421875, "global_step": 82124, "epoch": 989} {"train_loss": -21.383852005004883, "global_step": 82125, "epoch": 989} {"train_loss": -20.968984603881836, "global_step": 82126, "epoch": 989} {"train_loss": -21.1903076171875, "global_step": 82127, "epoch": 989} {"train_loss": -21.196420669555664, "global_step": 82128, "epoch": 989} {"train_loss": -21.324533462524414, "global_step": 82129, "epoch": 989} {"train_loss": -21.207122802734375, "global_step": 82130, "epoch": 989} {"train_loss": -21.43120574951172, "global_step": 82131, "epoch": 989} {"train_loss": -21.309947967529297, "global_step": 82132, "epoch": 989} {"train_loss": -21.23432159423828, "global_step": 82133, "epoch": 989} {"train_loss": -21.748546600341797, "global_step": 82134, "epoch": 989} {"train_loss": -21.57817840576172, "global_step": 82135, "epoch": 989} {"train_loss": -21.205825805664062, "global_step": 82136, "epoch": 989} {"train_loss": -21.171506881713867, "global_step": 82137, "epoch": 989} {"train_loss": -21.278669357299805, "global_step": 82138, "epoch": 989} {"train_loss": -21.338422775268555, "global_step": 82139, "epoch": 989} {"train_loss": -21.10767936706543, "global_step": 82140, "epoch": 989} {"train_loss": -21.035486221313477, "global_step": 82141, "epoch": 989} {"train_loss": -21.201536178588867, "global_step": 82142, "epoch": 989} {"train_loss": -21.208602905273438, "global_step": 82143, "epoch": 989} {"train_loss": -21.161823272705078, "global_step": 82144, "epoch": 989} {"train_loss": -20.745271682739258, "global_step": 82145, "epoch": 989} {"train_loss": -20.829282760620117, "global_step": 82146, "epoch": 989} {"train_loss": -21.798490524291992, "global_step": 82147, "epoch": 989} {"train_loss": -20.967456817626953, "global_step": 82148, "epoch": 989} {"train_loss": -21.509998321533203, "global_step": 82149, "epoch": 989} {"train_loss": -21.364988327026367, "global_step": 82150, "epoch": 989} {"train_loss": -20.81551170349121, "global_step": 82151, "epoch": 989} {"train_loss": -21.572553634643555, "global_step": 82152, "epoch": 989} {"train_loss": -21.399402618408203, "global_step": 82153, "epoch": 989} {"train_loss": -21.211606979370117, "global_step": 82154, "epoch": 989} {"train_loss": -21.05533218383789, "global_step": 82155, "epoch": 989} {"train_loss": -21.35748863220215, "global_step": 82156, "epoch": 989} {"train_loss": -21.0749568939209, "global_step": 82157, "epoch": 989} {"train_loss": -21.457366943359375, "global_step": 82158, "epoch": 989} {"train_loss": -21.442367553710938, "global_step": 82159, "epoch": 989} {"train_loss": -21.12419891357422, "global_step": 82160, "epoch": 989} {"train_loss": -21.348329544067383, "global_step": 82161, "epoch": 989} {"train_loss": -21.273193359375, "global_step": 82162, "epoch": 989} {"train_loss": -21.459274291992188, "global_step": 82163, "epoch": 989} {"train_loss": -21.604799270629883, "global_step": 82164, "epoch": 989} {"train_loss": -20.99808120727539, "global_step": 82165, "epoch": 989} {"train_loss": -21.159561157226562, "global_step": 82166, "epoch": 989} {"train_loss": -21.20502281188965, "global_step": 82167, "epoch": 989} {"train_loss": -21.465559005737305, "global_step": 82168, "epoch": 989} {"train_loss": -21.24483676129077, "global_step": 82169, "epoch": 989, "val_loss": 5982236.5} {"train_loss": -21.505794525146484, "global_step": 82170, "epoch": 990} {"train_loss": -21.180606842041016, "global_step": 82171, "epoch": 990} {"train_loss": -21.445810317993164, "global_step": 82172, "epoch": 990} {"train_loss": -20.88404655456543, "global_step": 82173, "epoch": 990} {"train_loss": -21.36634635925293, "global_step": 82174, "epoch": 990} {"train_loss": -21.019067764282227, "global_step": 82175, "epoch": 990} {"train_loss": -21.045963287353516, "global_step": 82176, "epoch": 990} {"train_loss": -21.381351470947266, "global_step": 82177, "epoch": 990} {"train_loss": -21.058130264282227, "global_step": 82178, "epoch": 990} {"train_loss": -20.753278732299805, "global_step": 82179, "epoch": 990} {"train_loss": -20.95599365234375, "global_step": 82180, "epoch": 990} {"train_loss": -21.36085319519043, "global_step": 82181, "epoch": 990} {"train_loss": -21.33601188659668, "global_step": 82182, "epoch": 990} {"train_loss": -21.402240753173828, "global_step": 82183, "epoch": 990} {"train_loss": -21.321361541748047, "global_step": 82184, "epoch": 990} {"train_loss": -21.34467887878418, "global_step": 82185, "epoch": 990} {"train_loss": -21.448795318603516, "global_step": 82186, "epoch": 990} {"train_loss": -21.202238082885742, "global_step": 82187, "epoch": 990} {"train_loss": -21.359222412109375, "global_step": 82188, "epoch": 990} {"train_loss": -20.792591094970703, "global_step": 82189, "epoch": 990} {"train_loss": -21.591920852661133, "global_step": 82190, "epoch": 990} {"train_loss": -21.131519317626953, "global_step": 82191, "epoch": 990} {"train_loss": -21.681272506713867, "global_step": 82192, "epoch": 990} {"train_loss": -20.77534294128418, "global_step": 82193, "epoch": 990} {"train_loss": -21.531570434570312, "global_step": 82194, "epoch": 990} {"train_loss": -20.855375289916992, "global_step": 82195, "epoch": 990} {"train_loss": -21.238052368164062, "global_step": 82196, "epoch": 990} {"train_loss": -21.612228393554688, "global_step": 82197, "epoch": 990} {"train_loss": -21.137296676635742, "global_step": 82198, "epoch": 990} {"train_loss": -21.380231857299805, "global_step": 82199, "epoch": 990} {"train_loss": -21.500883102416992, "global_step": 82200, "epoch": 990} {"train_loss": -21.266239166259766, "global_step": 82201, "epoch": 990} {"train_loss": -21.31882667541504, "global_step": 82202, "epoch": 990} {"train_loss": -21.48636817932129, "global_step": 82203, "epoch": 990} {"train_loss": -21.160518646240234, "global_step": 82204, "epoch": 990} {"train_loss": -21.502544403076172, "global_step": 82205, "epoch": 990} {"train_loss": -21.198049545288086, "global_step": 82206, "epoch": 990} {"train_loss": -21.35645294189453, "global_step": 82207, "epoch": 990} {"train_loss": -20.955657958984375, "global_step": 82208, "epoch": 990} {"train_loss": -21.21866798400879, "global_step": 82209, "epoch": 990} {"train_loss": -21.316757202148438, "global_step": 82210, "epoch": 990} {"train_loss": -21.332685470581055, "global_step": 82211, "epoch": 990} {"train_loss": -21.4051570892334, "global_step": 82212, "epoch": 990} {"train_loss": -21.16314697265625, "global_step": 82213, "epoch": 990} {"train_loss": -21.522808074951172, "global_step": 82214, "epoch": 990} {"train_loss": -21.23634147644043, "global_step": 82215, "epoch": 990} {"train_loss": -21.082929611206055, "global_step": 82216, "epoch": 990} {"train_loss": -20.978036880493164, "global_step": 82217, "epoch": 990} {"train_loss": -21.080686569213867, "global_step": 82218, "epoch": 990} {"train_loss": -21.372529983520508, "global_step": 82219, "epoch": 990} {"train_loss": -21.33978843688965, "global_step": 82220, "epoch": 990} {"train_loss": -21.16208839416504, "global_step": 82221, "epoch": 990} {"train_loss": -21.436603546142578, "global_step": 82222, "epoch": 990} {"train_loss": -21.481674194335938, "global_step": 82223, "epoch": 990} {"train_loss": -21.443592071533203, "global_step": 82224, "epoch": 990} {"train_loss": -21.579565048217773, "global_step": 82225, "epoch": 990} {"train_loss": -21.26151466369629, "global_step": 82226, "epoch": 990} {"train_loss": -21.31593132019043, "global_step": 82227, "epoch": 990} {"train_loss": -21.260847091674805, "global_step": 82228, "epoch": 990} {"train_loss": -21.391386032104492, "global_step": 82229, "epoch": 990} {"train_loss": -21.177404403686523, "global_step": 82230, "epoch": 990} {"train_loss": -21.017459869384766, "global_step": 82231, "epoch": 990} {"train_loss": -21.630842208862305, "global_step": 82232, "epoch": 990} {"train_loss": -21.302658081054688, "global_step": 82233, "epoch": 990} {"train_loss": -21.074983596801758, "global_step": 82234, "epoch": 990} {"train_loss": -20.920289993286133, "global_step": 82235, "epoch": 990} {"train_loss": -21.35173225402832, "global_step": 82236, "epoch": 990} {"train_loss": -21.387495040893555, "global_step": 82237, "epoch": 990} {"train_loss": -21.256546020507812, "global_step": 82238, "epoch": 990} {"train_loss": -21.237689971923828, "global_step": 82239, "epoch": 990} {"train_loss": -21.772563934326172, "global_step": 82240, "epoch": 990} {"train_loss": -21.24723243713379, "global_step": 82241, "epoch": 990} {"train_loss": -21.447675704956055, "global_step": 82242, "epoch": 990} {"train_loss": -21.341093063354492, "global_step": 82243, "epoch": 990} {"train_loss": -21.14299964904785, "global_step": 82244, "epoch": 990} {"train_loss": -21.138198852539062, "global_step": 82245, "epoch": 990} {"train_loss": -21.481122970581055, "global_step": 82246, "epoch": 990} {"train_loss": -21.375293731689453, "global_step": 82247, "epoch": 990} {"train_loss": -21.07435417175293, "global_step": 82248, "epoch": 990} {"train_loss": -21.423532485961914, "global_step": 82249, "epoch": 990} {"train_loss": -21.58548355102539, "global_step": 82250, "epoch": 990} {"train_loss": -21.527891159057617, "global_step": 82251, "epoch": 990} {"train_loss": -21.2748903021755, "global_step": 82252, "epoch": 990, "val_loss": 6156396.0} {"train_loss": -21.172016143798828, "global_step": 82253, "epoch": 991} {"train_loss": -20.905317306518555, "global_step": 82254, "epoch": 991} {"train_loss": -21.198026657104492, "global_step": 82255, "epoch": 991} {"train_loss": -21.377368927001953, "global_step": 82256, "epoch": 991} {"train_loss": -21.12296485900879, "global_step": 82257, "epoch": 991} {"train_loss": -21.16945457458496, "global_step": 82258, "epoch": 991} {"train_loss": -21.316125869750977, "global_step": 82259, "epoch": 991} {"train_loss": -21.3707332611084, "global_step": 82260, "epoch": 991} {"train_loss": -20.65289306640625, "global_step": 82261, "epoch": 991} {"train_loss": -21.31709098815918, "global_step": 82262, "epoch": 991} {"train_loss": -21.39262580871582, "global_step": 82263, "epoch": 991} {"train_loss": -21.110986709594727, "global_step": 82264, "epoch": 991} {"train_loss": -21.131818771362305, "global_step": 82265, "epoch": 991} {"train_loss": -20.767990112304688, "global_step": 82266, "epoch": 991} {"train_loss": -21.409055709838867, "global_step": 82267, "epoch": 991} {"train_loss": -20.8369083404541, "global_step": 82268, "epoch": 991} {"train_loss": -21.02520751953125, "global_step": 82269, "epoch": 991} {"train_loss": -21.320981979370117, "global_step": 82270, "epoch": 991} {"train_loss": -21.037967681884766, "global_step": 82271, "epoch": 991} {"train_loss": -21.075897216796875, "global_step": 82272, "epoch": 991} {"train_loss": -21.233991622924805, "global_step": 82273, "epoch": 991} {"train_loss": -21.067480087280273, "global_step": 82274, "epoch": 991} {"train_loss": -21.094715118408203, "global_step": 82275, "epoch": 991} {"train_loss": -21.15091323852539, "global_step": 82276, "epoch": 991} {"train_loss": -21.372949600219727, "global_step": 82277, "epoch": 991} {"train_loss": -21.607568740844727, "global_step": 82278, "epoch": 991} {"train_loss": -21.162233352661133, "global_step": 82279, "epoch": 991} {"train_loss": -21.170068740844727, "global_step": 82280, "epoch": 991} {"train_loss": -21.276390075683594, "global_step": 82281, "epoch": 991} {"train_loss": -21.406883239746094, "global_step": 82282, "epoch": 991} {"train_loss": -21.857622146606445, "global_step": 82283, "epoch": 991} {"train_loss": -21.374704360961914, "global_step": 82284, "epoch": 991} {"train_loss": -21.534936904907227, "global_step": 82285, "epoch": 991} {"train_loss": -21.260093688964844, "global_step": 82286, "epoch": 991} {"train_loss": -21.48825454711914, "global_step": 82287, "epoch": 991} {"train_loss": -21.185672760009766, "global_step": 82288, "epoch": 991} {"train_loss": -21.18022918701172, "global_step": 82289, "epoch": 991} {"train_loss": -21.518272399902344, "global_step": 82290, "epoch": 991} {"train_loss": -21.032398223876953, "global_step": 82291, "epoch": 991} {"train_loss": -21.165138244628906, "global_step": 82292, "epoch": 991} {"train_loss": -20.899471282958984, "global_step": 82293, "epoch": 991} {"train_loss": -21.363828659057617, "global_step": 82294, "epoch": 991} {"train_loss": -21.267925262451172, "global_step": 82295, "epoch": 991} {"train_loss": -21.265703201293945, "global_step": 82296, "epoch": 991} {"train_loss": -21.573572158813477, "global_step": 82297, "epoch": 991} {"train_loss": -21.197843551635742, "global_step": 82298, "epoch": 991} {"train_loss": -21.45591163635254, "global_step": 82299, "epoch": 991} {"train_loss": -21.231122970581055, "global_step": 82300, "epoch": 991} {"train_loss": -21.24235725402832, "global_step": 82301, "epoch": 991} {"train_loss": -21.322181701660156, "global_step": 82302, "epoch": 991} {"train_loss": -21.6330509185791, "global_step": 82303, "epoch": 991} {"train_loss": -21.217639923095703, "global_step": 82304, "epoch": 991} {"train_loss": -21.341690063476562, "global_step": 82305, "epoch": 991} {"train_loss": -21.545740127563477, "global_step": 82306, "epoch": 991} {"train_loss": -21.385135650634766, "global_step": 82307, "epoch": 991} {"train_loss": -21.81917381286621, "global_step": 82308, "epoch": 991} {"train_loss": -21.806821823120117, "global_step": 82309, "epoch": 991} {"train_loss": -21.105056762695312, "global_step": 82310, "epoch": 991} {"train_loss": -21.08146095275879, "global_step": 82311, "epoch": 991} {"train_loss": -21.386762619018555, "global_step": 82312, "epoch": 991} {"train_loss": -21.308216094970703, "global_step": 82313, "epoch": 991} {"train_loss": -21.008243560791016, "global_step": 82314, "epoch": 991} {"train_loss": -21.22330093383789, "global_step": 82315, "epoch": 991} {"train_loss": -21.37735366821289, "global_step": 82316, "epoch": 991} {"train_loss": -21.711162567138672, "global_step": 82317, "epoch": 991} {"train_loss": -21.253080368041992, "global_step": 82318, "epoch": 991} {"train_loss": -21.137897491455078, "global_step": 82319, "epoch": 991} {"train_loss": -21.314224243164062, "global_step": 82320, "epoch": 991} {"train_loss": -21.583751678466797, "global_step": 82321, "epoch": 991} {"train_loss": -21.34222984313965, "global_step": 82322, "epoch": 991} {"train_loss": -21.158462524414062, "global_step": 82323, "epoch": 991} {"train_loss": -21.384170532226562, "global_step": 82324, "epoch": 991} {"train_loss": -21.3026180267334, "global_step": 82325, "epoch": 991} {"train_loss": -21.24738121032715, "global_step": 82326, "epoch": 991} {"train_loss": -21.16581153869629, "global_step": 82327, "epoch": 991} {"train_loss": -21.541181564331055, "global_step": 82328, "epoch": 991} {"train_loss": -21.332054138183594, "global_step": 82329, "epoch": 991} {"train_loss": -21.285062789916992, "global_step": 82330, "epoch": 991} {"train_loss": -21.398595809936523, "global_step": 82331, "epoch": 991} {"train_loss": -21.478239059448242, "global_step": 82332, "epoch": 991} {"train_loss": -21.437902450561523, "global_step": 82333, "epoch": 991} {"train_loss": -21.14887046813965, "global_step": 82334, "epoch": 991} {"train_loss": -21.26836997342397, "global_step": 82335, "epoch": 991, "val_loss": 6043176.5} {"train_loss": -19.917936325073242, "global_step": 82336, "epoch": 992} {"train_loss": -19.714466094970703, "global_step": 82337, "epoch": 992} {"train_loss": -20.32538604736328, "global_step": 82338, "epoch": 992} {"train_loss": -21.023365020751953, "global_step": 82339, "epoch": 992} {"train_loss": -20.198537826538086, "global_step": 82340, "epoch": 992} {"train_loss": -20.887592315673828, "global_step": 82341, "epoch": 992} {"train_loss": -20.815282821655273, "global_step": 82342, "epoch": 992} {"train_loss": -20.990840911865234, "global_step": 82343, "epoch": 992} {"train_loss": -20.721092224121094, "global_step": 82344, "epoch": 992} {"train_loss": -20.490402221679688, "global_step": 82345, "epoch": 992} {"train_loss": -20.897708892822266, "global_step": 82346, "epoch": 992} {"train_loss": -20.8430233001709, "global_step": 82347, "epoch": 992} {"train_loss": -20.634241104125977, "global_step": 82348, "epoch": 992} {"train_loss": -21.033401489257812, "global_step": 82349, "epoch": 992} {"train_loss": -21.1186580657959, "global_step": 82350, "epoch": 992} {"train_loss": -20.854461669921875, "global_step": 82351, "epoch": 992} {"train_loss": -20.69131851196289, "global_step": 82352, "epoch": 992} {"train_loss": -21.038654327392578, "global_step": 82353, "epoch": 992} {"train_loss": -20.96525001525879, "global_step": 82354, "epoch": 992} {"train_loss": -20.733163833618164, "global_step": 82355, "epoch": 992} {"train_loss": -20.980072021484375, "global_step": 82356, "epoch": 992} {"train_loss": -20.93580436706543, "global_step": 82357, "epoch": 992} {"train_loss": -21.13802146911621, "global_step": 82358, "epoch": 992} {"train_loss": -21.194181442260742, "global_step": 82359, "epoch": 992} {"train_loss": -20.87343406677246, "global_step": 82360, "epoch": 992} {"train_loss": -21.579833984375, "global_step": 82361, "epoch": 992} {"train_loss": -20.94374656677246, "global_step": 82362, "epoch": 992} {"train_loss": -20.920791625976562, "global_step": 82363, "epoch": 992} {"train_loss": -21.239852905273438, "global_step": 82364, "epoch": 992} {"train_loss": -21.157455444335938, "global_step": 82365, "epoch": 992} {"train_loss": -21.740585327148438, "global_step": 82366, "epoch": 992} {"train_loss": -21.171010971069336, "global_step": 82367, "epoch": 992} {"train_loss": -20.99160385131836, "global_step": 82368, "epoch": 992} {"train_loss": -20.876996994018555, "global_step": 82369, "epoch": 992} {"train_loss": -21.632186889648438, "global_step": 82370, "epoch": 992} {"train_loss": -21.18123435974121, "global_step": 82371, "epoch": 992} {"train_loss": -21.34113883972168, "global_step": 82372, "epoch": 992} {"train_loss": -20.96394920349121, "global_step": 82373, "epoch": 992} {"train_loss": -21.19350242614746, "global_step": 82374, "epoch": 992} {"train_loss": -21.30023765563965, "global_step": 82375, "epoch": 992} {"train_loss": -21.12579345703125, "global_step": 82376, "epoch": 992} {"train_loss": -21.212507247924805, "global_step": 82377, "epoch": 992} {"train_loss": -21.444616317749023, "global_step": 82378, "epoch": 992} {"train_loss": -21.248615264892578, "global_step": 82379, "epoch": 992} {"train_loss": -21.22309684753418, "global_step": 82380, "epoch": 992} {"train_loss": -21.106618881225586, "global_step": 82381, "epoch": 992} {"train_loss": -21.303638458251953, "global_step": 82382, "epoch": 992} {"train_loss": -21.551176071166992, "global_step": 82383, "epoch": 992} {"train_loss": -21.002214431762695, "global_step": 82384, "epoch": 992} {"train_loss": -21.462514877319336, "global_step": 82385, "epoch": 992} {"train_loss": -21.331787109375, "global_step": 82386, "epoch": 992} {"train_loss": -21.058300018310547, "global_step": 82387, "epoch": 992} {"train_loss": -21.37060546875, "global_step": 82388, "epoch": 992} {"train_loss": -21.135889053344727, "global_step": 82389, "epoch": 992} {"train_loss": -21.31962013244629, "global_step": 82390, "epoch": 992} {"train_loss": -21.05658531188965, "global_step": 82391, "epoch": 992} {"train_loss": -21.28769874572754, "global_step": 82392, "epoch": 992} {"train_loss": -21.32093620300293, "global_step": 82393, "epoch": 992} {"train_loss": -21.410675048828125, "global_step": 82394, "epoch": 992} {"train_loss": -21.16904640197754, "global_step": 82395, "epoch": 992} {"train_loss": -21.28963279724121, "global_step": 82396, "epoch": 992} {"train_loss": -21.262287139892578, "global_step": 82397, "epoch": 992} {"train_loss": -21.43208885192871, "global_step": 82398, "epoch": 992} {"train_loss": -21.445682525634766, "global_step": 82399, "epoch": 992} {"train_loss": -21.40973663330078, "global_step": 82400, "epoch": 992} {"train_loss": -21.236469268798828, "global_step": 82401, "epoch": 992} {"train_loss": -21.32040786743164, "global_step": 82402, "epoch": 992} {"train_loss": -21.35405921936035, "global_step": 82403, "epoch": 992} {"train_loss": -21.585857391357422, "global_step": 82404, "epoch": 992} {"train_loss": -21.222488403320312, "global_step": 82405, "epoch": 992} {"train_loss": -21.368223190307617, "global_step": 82406, "epoch": 992} {"train_loss": -21.235509872436523, "global_step": 82407, "epoch": 992} {"train_loss": -21.50147819519043, "global_step": 82408, "epoch": 992} {"train_loss": -21.317808151245117, "global_step": 82409, "epoch": 992} {"train_loss": -21.023420333862305, "global_step": 82410, "epoch": 992} {"train_loss": -21.56458854675293, "global_step": 82411, "epoch": 992} {"train_loss": -21.006315231323242, "global_step": 82412, "epoch": 992} {"train_loss": -21.559926986694336, "global_step": 82413, "epoch": 992} {"train_loss": -21.411508560180664, "global_step": 82414, "epoch": 992} {"train_loss": -21.438655853271484, "global_step": 82415, "epoch": 992} {"train_loss": -21.292993545532227, "global_step": 82416, "epoch": 992} {"train_loss": -21.554136276245117, "global_step": 82417, "epoch": 992} {"train_loss": -21.13085466407868, "global_step": 82418, "epoch": 992, "val_loss": 6010001.5} {"train_loss": -20.82527732849121, "global_step": 82419, "epoch": 993} {"train_loss": -21.121946334838867, "global_step": 82420, "epoch": 993} {"train_loss": -20.807126998901367, "global_step": 82421, "epoch": 993} {"train_loss": -21.355077743530273, "global_step": 82422, "epoch": 993} {"train_loss": -20.803556442260742, "global_step": 82423, "epoch": 993} {"train_loss": -20.976232528686523, "global_step": 82424, "epoch": 993} {"train_loss": -20.995309829711914, "global_step": 82425, "epoch": 993} {"train_loss": -21.097745895385742, "global_step": 82426, "epoch": 993} {"train_loss": -21.487295150756836, "global_step": 82427, "epoch": 993} {"train_loss": -20.731250762939453, "global_step": 82428, "epoch": 993} {"train_loss": -21.192914962768555, "global_step": 82429, "epoch": 993} {"train_loss": -21.38838768005371, "global_step": 82430, "epoch": 993} {"train_loss": -21.16916275024414, "global_step": 82431, "epoch": 993} {"train_loss": -21.433618545532227, "global_step": 82432, "epoch": 993} {"train_loss": -21.211042404174805, "global_step": 82433, "epoch": 993} {"train_loss": -21.23124122619629, "global_step": 82434, "epoch": 993} {"train_loss": -21.21286392211914, "global_step": 82435, "epoch": 993} {"train_loss": -21.664316177368164, "global_step": 82436, "epoch": 993} {"train_loss": -21.213651657104492, "global_step": 82437, "epoch": 993} {"train_loss": -21.35883903503418, "global_step": 82438, "epoch": 993} {"train_loss": -21.514524459838867, "global_step": 82439, "epoch": 993} {"train_loss": -21.110031127929688, "global_step": 82440, "epoch": 993} {"train_loss": -21.311826705932617, "global_step": 82441, "epoch": 993} {"train_loss": -21.393157958984375, "global_step": 82442, "epoch": 993} {"train_loss": -21.320714950561523, "global_step": 82443, "epoch": 993} {"train_loss": -21.326732635498047, "global_step": 82444, "epoch": 993} {"train_loss": -21.129438400268555, "global_step": 82445, "epoch": 993} {"train_loss": -21.634431838989258, "global_step": 82446, "epoch": 993} {"train_loss": -21.03592872619629, "global_step": 82447, "epoch": 993} {"train_loss": -21.2592830657959, "global_step": 82448, "epoch": 993} {"train_loss": -21.34117317199707, "global_step": 82449, "epoch": 993} {"train_loss": -21.039209365844727, "global_step": 82450, "epoch": 993} {"train_loss": -21.394376754760742, "global_step": 82451, "epoch": 993} {"train_loss": -21.657514572143555, "global_step": 82452, "epoch": 993} {"train_loss": -21.040212631225586, "global_step": 82453, "epoch": 993} {"train_loss": -21.161916732788086, "global_step": 82454, "epoch": 993} {"train_loss": -21.50503158569336, "global_step": 82455, "epoch": 993} {"train_loss": -21.353912353515625, "global_step": 82456, "epoch": 993} {"train_loss": -21.621334075927734, "global_step": 82457, "epoch": 993} {"train_loss": -21.553375244140625, "global_step": 82458, "epoch": 993} {"train_loss": -21.236154556274414, "global_step": 82459, "epoch": 993} {"train_loss": -21.27361297607422, "global_step": 82460, "epoch": 993} {"train_loss": -21.010141372680664, "global_step": 82461, "epoch": 993} {"train_loss": -21.51534080505371, "global_step": 82462, "epoch": 993} {"train_loss": -21.185949325561523, "global_step": 82463, "epoch": 993} {"train_loss": -21.405981063842773, "global_step": 82464, "epoch": 993} {"train_loss": -21.004121780395508, "global_step": 82465, "epoch": 993} {"train_loss": -21.272397994995117, "global_step": 82466, "epoch": 993} {"train_loss": -21.20415687561035, "global_step": 82467, "epoch": 993} {"train_loss": -21.250934600830078, "global_step": 82468, "epoch": 993} {"train_loss": -21.20601463317871, "global_step": 82469, "epoch": 993} {"train_loss": -20.98842430114746, "global_step": 82470, "epoch": 993} {"train_loss": -21.50611114501953, "global_step": 82471, "epoch": 993} {"train_loss": -21.182016372680664, "global_step": 82472, "epoch": 993} {"train_loss": -20.954004287719727, "global_step": 82473, "epoch": 993} {"train_loss": -21.58552360534668, "global_step": 82474, "epoch": 993} {"train_loss": -21.25592041015625, "global_step": 82475, "epoch": 993} {"train_loss": -20.925466537475586, "global_step": 82476, "epoch": 993} {"train_loss": -21.4630069732666, "global_step": 82477, "epoch": 993} {"train_loss": -21.358671188354492, "global_step": 82478, "epoch": 993} {"train_loss": -20.943655014038086, "global_step": 82479, "epoch": 993} {"train_loss": -21.4420223236084, "global_step": 82480, "epoch": 993} {"train_loss": -21.481454849243164, "global_step": 82481, "epoch": 993} {"train_loss": -21.329431533813477, "global_step": 82482, "epoch": 993} {"train_loss": -21.318246841430664, "global_step": 82483, "epoch": 993} {"train_loss": -21.796512603759766, "global_step": 82484, "epoch": 993} {"train_loss": -21.50015640258789, "global_step": 82485, "epoch": 993} {"train_loss": -21.13453483581543, "global_step": 82486, "epoch": 993} {"train_loss": -21.560056686401367, "global_step": 82487, "epoch": 993} {"train_loss": -21.141555786132812, "global_step": 82488, "epoch": 993} {"train_loss": -21.703306198120117, "global_step": 82489, "epoch": 993} {"train_loss": -21.344152450561523, "global_step": 82490, "epoch": 993} {"train_loss": -21.559804916381836, "global_step": 82491, "epoch": 993} {"train_loss": -21.69733238220215, "global_step": 82492, "epoch": 993} {"train_loss": -21.379281997680664, "global_step": 82493, "epoch": 993} {"train_loss": -21.463979721069336, "global_step": 82494, "epoch": 993} {"train_loss": -21.289636611938477, "global_step": 82495, "epoch": 993} {"train_loss": -21.483854293823242, "global_step": 82496, "epoch": 993} {"train_loss": -21.41895866394043, "global_step": 82497, "epoch": 993} {"train_loss": -21.048978805541992, "global_step": 82498, "epoch": 993} {"train_loss": -21.11501693725586, "global_step": 82499, "epoch": 993} {"train_loss": -21.325712203979492, "global_step": 82500, "epoch": 993} {"train_loss": -21.274809664990528, "global_step": 82501, "epoch": 993, "val_loss": 6004190.5} {"train_loss": -21.39159393310547, "global_step": 82502, "epoch": 994} {"train_loss": -20.923744201660156, "global_step": 82503, "epoch": 994} {"train_loss": -21.25367546081543, "global_step": 82504, "epoch": 994} {"train_loss": -21.371566772460938, "global_step": 82505, "epoch": 994} {"train_loss": -21.19382095336914, "global_step": 82506, "epoch": 994} {"train_loss": -21.15193748474121, "global_step": 82507, "epoch": 994} {"train_loss": -21.417722702026367, "global_step": 82508, "epoch": 994} {"train_loss": -21.366552352905273, "global_step": 82509, "epoch": 994} {"train_loss": -21.388721466064453, "global_step": 82510, "epoch": 994} {"train_loss": -21.344770431518555, "global_step": 82511, "epoch": 994} {"train_loss": -21.181610107421875, "global_step": 82512, "epoch": 994} {"train_loss": -21.007978439331055, "global_step": 82513, "epoch": 994} {"train_loss": -21.076871871948242, "global_step": 82514, "epoch": 994} {"train_loss": -21.201038360595703, "global_step": 82515, "epoch": 994} {"train_loss": -21.56052589416504, "global_step": 82516, "epoch": 994} {"train_loss": -21.23447036743164, "global_step": 82517, "epoch": 994} {"train_loss": -21.56194305419922, "global_step": 82518, "epoch": 994} {"train_loss": -21.358068466186523, "global_step": 82519, "epoch": 994} {"train_loss": -21.36046600341797, "global_step": 82520, "epoch": 994} {"train_loss": -21.2026309967041, "global_step": 82521, "epoch": 994} {"train_loss": -21.269041061401367, "global_step": 82522, "epoch": 994} {"train_loss": -21.301488876342773, "global_step": 82523, "epoch": 994} {"train_loss": -21.258020401000977, "global_step": 82524, "epoch": 994} {"train_loss": -21.36970329284668, "global_step": 82525, "epoch": 994} {"train_loss": -21.159778594970703, "global_step": 82526, "epoch": 994} {"train_loss": -21.7605037689209, "global_step": 82527, "epoch": 994} {"train_loss": -21.126798629760742, "global_step": 82528, "epoch": 994} {"train_loss": -21.41744041442871, "global_step": 82529, "epoch": 994} {"train_loss": -21.271034240722656, "global_step": 82530, "epoch": 994} {"train_loss": -21.147830963134766, "global_step": 82531, "epoch": 994} {"train_loss": -21.109811782836914, "global_step": 82532, "epoch": 994} {"train_loss": -20.94455337524414, "global_step": 82533, "epoch": 994} {"train_loss": -20.899829864501953, "global_step": 82534, "epoch": 994} {"train_loss": -21.212223052978516, "global_step": 82535, "epoch": 994} {"train_loss": -21.46756935119629, "global_step": 82536, "epoch": 994} {"train_loss": -21.3034610748291, "global_step": 82537, "epoch": 994} {"train_loss": -21.577817916870117, "global_step": 82538, "epoch": 994} {"train_loss": -21.716533660888672, "global_step": 82539, "epoch": 994} {"train_loss": -21.20380210876465, "global_step": 82540, "epoch": 994} {"train_loss": -21.289270401000977, "global_step": 82541, "epoch": 994} {"train_loss": -21.133956909179688, "global_step": 82542, "epoch": 994} {"train_loss": -21.408666610717773, "global_step": 82543, "epoch": 994} {"train_loss": -21.248762130737305, "global_step": 82544, "epoch": 994} {"train_loss": -21.88045310974121, "global_step": 82545, "epoch": 994} {"train_loss": -21.421934127807617, "global_step": 82546, "epoch": 994} {"train_loss": -21.201250076293945, "global_step": 82547, "epoch": 994} {"train_loss": -21.477914810180664, "global_step": 82548, "epoch": 994} {"train_loss": -21.526920318603516, "global_step": 82549, "epoch": 994} {"train_loss": -21.269800186157227, "global_step": 82550, "epoch": 994} {"train_loss": -21.45249366760254, "global_step": 82551, "epoch": 994} {"train_loss": -21.666866302490234, "global_step": 82552, "epoch": 994} {"train_loss": -21.27133560180664, "global_step": 82553, "epoch": 994} {"train_loss": -21.52130699157715, "global_step": 82554, "epoch": 994} {"train_loss": -20.971464157104492, "global_step": 82555, "epoch": 994} {"train_loss": -21.51203727722168, "global_step": 82556, "epoch": 994} {"train_loss": -21.555469512939453, "global_step": 82557, "epoch": 994} {"train_loss": -21.217355728149414, "global_step": 82558, "epoch": 994} {"train_loss": -21.244253158569336, "global_step": 82559, "epoch": 994} {"train_loss": -21.573719024658203, "global_step": 82560, "epoch": 994} {"train_loss": -21.267780303955078, "global_step": 82561, "epoch": 994} {"train_loss": -21.44100570678711, "global_step": 82562, "epoch": 994} {"train_loss": -21.253755569458008, "global_step": 82563, "epoch": 994} {"train_loss": -21.158843994140625, "global_step": 82564, "epoch": 994} {"train_loss": -21.087644577026367, "global_step": 82565, "epoch": 994} {"train_loss": -21.22943115234375, "global_step": 82566, "epoch": 994} {"train_loss": -21.64154052734375, "global_step": 82567, "epoch": 994} {"train_loss": -21.085439682006836, "global_step": 82568, "epoch": 994} {"train_loss": -20.766374588012695, "global_step": 82569, "epoch": 994} {"train_loss": -21.132949829101562, "global_step": 82570, "epoch": 994} {"train_loss": -21.323774337768555, "global_step": 82571, "epoch": 994} {"train_loss": -21.2155704498291, "global_step": 82572, "epoch": 994} {"train_loss": -21.38620376586914, "global_step": 82573, "epoch": 994} {"train_loss": -21.3610782623291, "global_step": 82574, "epoch": 994} {"train_loss": -21.58657455444336, "global_step": 82575, "epoch": 994} {"train_loss": -21.17609214782715, "global_step": 82576, "epoch": 994} {"train_loss": -21.541427612304688, "global_step": 82577, "epoch": 994} {"train_loss": -21.19637107849121, "global_step": 82578, "epoch": 994} {"train_loss": -21.401168823242188, "global_step": 82579, "epoch": 994} {"train_loss": -21.682159423828125, "global_step": 82580, "epoch": 994} {"train_loss": -21.189701080322266, "global_step": 82581, "epoch": 994} {"train_loss": -21.301542282104492, "global_step": 82582, "epoch": 994} {"train_loss": -21.329193115234375, "global_step": 82583, "epoch": 994} {"train_loss": -21.311211298747235, "global_step": 82584, "epoch": 994, "val_loss": 6118029.5} {"train_loss": -21.196043014526367, "global_step": 82585, "epoch": 995} {"train_loss": -20.703519821166992, "global_step": 82586, "epoch": 995} {"train_loss": -20.973989486694336, "global_step": 82587, "epoch": 995} {"train_loss": -21.055862426757812, "global_step": 82588, "epoch": 995} {"train_loss": -21.029050827026367, "global_step": 82589, "epoch": 995} {"train_loss": -21.051982879638672, "global_step": 82590, "epoch": 995} {"train_loss": -21.392871856689453, "global_step": 82591, "epoch": 995} {"train_loss": -21.003393173217773, "global_step": 82592, "epoch": 995} {"train_loss": -21.035144805908203, "global_step": 82593, "epoch": 995} {"train_loss": -21.328384399414062, "global_step": 82594, "epoch": 995} {"train_loss": -20.843643188476562, "global_step": 82595, "epoch": 995} {"train_loss": -21.018766403198242, "global_step": 82596, "epoch": 995} {"train_loss": -21.48638916015625, "global_step": 82597, "epoch": 995} {"train_loss": -21.339059829711914, "global_step": 82598, "epoch": 995} {"train_loss": -21.60812759399414, "global_step": 82599, "epoch": 995} {"train_loss": -21.396343231201172, "global_step": 82600, "epoch": 995} {"train_loss": -21.720823287963867, "global_step": 82601, "epoch": 995} {"train_loss": -21.58255386352539, "global_step": 82602, "epoch": 995} {"train_loss": -21.353065490722656, "global_step": 82603, "epoch": 995} {"train_loss": -21.24102210998535, "global_step": 82604, "epoch": 995} {"train_loss": -21.058408737182617, "global_step": 82605, "epoch": 995} {"train_loss": -21.13406753540039, "global_step": 82606, "epoch": 995} {"train_loss": -21.495878219604492, "global_step": 82607, "epoch": 995} {"train_loss": -21.252758026123047, "global_step": 82608, "epoch": 995} {"train_loss": -21.272136688232422, "global_step": 82609, "epoch": 995} {"train_loss": -21.335552215576172, "global_step": 82610, "epoch": 995} {"train_loss": -21.35072898864746, "global_step": 82611, "epoch": 995} {"train_loss": -21.29243278503418, "global_step": 82612, "epoch": 995} {"train_loss": -21.392698287963867, "global_step": 82613, "epoch": 995} {"train_loss": -21.457061767578125, "global_step": 82614, "epoch": 995} {"train_loss": -21.26093101501465, "global_step": 82615, "epoch": 995} {"train_loss": -21.355695724487305, "global_step": 82616, "epoch": 995} {"train_loss": -21.38162612915039, "global_step": 82617, "epoch": 995} {"train_loss": -21.177976608276367, "global_step": 82618, "epoch": 995} {"train_loss": -21.3681697845459, "global_step": 82619, "epoch": 995} {"train_loss": -21.071063995361328, "global_step": 82620, "epoch": 995} {"train_loss": -21.321393966674805, "global_step": 82621, "epoch": 995} {"train_loss": -21.599924087524414, "global_step": 82622, "epoch": 995} {"train_loss": -21.341629028320312, "global_step": 82623, "epoch": 995} {"train_loss": -21.058109283447266, "global_step": 82624, "epoch": 995} {"train_loss": -21.248085021972656, "global_step": 82625, "epoch": 995} {"train_loss": -21.065580368041992, "global_step": 82626, "epoch": 995} {"train_loss": -21.44106101989746, "global_step": 82627, "epoch": 995} {"train_loss": -20.945220947265625, "global_step": 82628, "epoch": 995} {"train_loss": -21.422588348388672, "global_step": 82629, "epoch": 995} {"train_loss": -21.24857521057129, "global_step": 82630, "epoch": 995} {"train_loss": -20.952960968017578, "global_step": 82631, "epoch": 995} {"train_loss": -20.9339542388916, "global_step": 82632, "epoch": 995} {"train_loss": -21.315122604370117, "global_step": 82633, "epoch": 995} {"train_loss": -21.30354881286621, "global_step": 82634, "epoch": 995} {"train_loss": -21.03573989868164, "global_step": 82635, "epoch": 995} {"train_loss": -21.188030242919922, "global_step": 82636, "epoch": 995} {"train_loss": -20.980743408203125, "global_step": 82637, "epoch": 995} {"train_loss": -21.44612693786621, "global_step": 82638, "epoch": 995} {"train_loss": -21.100690841674805, "global_step": 82639, "epoch": 995} {"train_loss": -20.914011001586914, "global_step": 82640, "epoch": 995} {"train_loss": -21.36882209777832, "global_step": 82641, "epoch": 995} {"train_loss": -21.2386531829834, "global_step": 82642, "epoch": 995} {"train_loss": -21.436176300048828, "global_step": 82643, "epoch": 995} {"train_loss": -21.150842666625977, "global_step": 82644, "epoch": 995} {"train_loss": -21.468042373657227, "global_step": 82645, "epoch": 995} {"train_loss": -21.3729305267334, "global_step": 82646, "epoch": 995} {"train_loss": -21.578292846679688, "global_step": 82647, "epoch": 995} {"train_loss": -21.497156143188477, "global_step": 82648, "epoch": 995} {"train_loss": -21.180456161499023, "global_step": 82649, "epoch": 995} {"train_loss": -21.445518493652344, "global_step": 82650, "epoch": 995} {"train_loss": -21.239734649658203, "global_step": 82651, "epoch": 995} {"train_loss": -21.366586685180664, "global_step": 82652, "epoch": 995} {"train_loss": -21.671356201171875, "global_step": 82653, "epoch": 995} {"train_loss": -21.416105270385742, "global_step": 82654, "epoch": 995} {"train_loss": -21.48647117614746, "global_step": 82655, "epoch": 995} {"train_loss": -21.638347625732422, "global_step": 82656, "epoch": 995} {"train_loss": -21.145217895507812, "global_step": 82657, "epoch": 995} {"train_loss": -21.52353286743164, "global_step": 82658, "epoch": 995} {"train_loss": -21.34870719909668, "global_step": 82659, "epoch": 995} {"train_loss": -21.580726623535156, "global_step": 82660, "epoch": 995} {"train_loss": -21.177183151245117, "global_step": 82661, "epoch": 995} {"train_loss": -21.372608184814453, "global_step": 82662, "epoch": 995} {"train_loss": -21.461759567260742, "global_step": 82663, "epoch": 995} {"train_loss": -21.781309127807617, "global_step": 82664, "epoch": 995} {"train_loss": -21.221220016479492, "global_step": 82665, "epoch": 995} {"train_loss": -21.59337043762207, "global_step": 82666, "epoch": 995} {"train_loss": -21.30511720496488, "global_step": 82667, "epoch": 995, "val_loss": 6081738.0} {"train_loss": -21.214265823364258, "global_step": 82668, "epoch": 996} {"train_loss": -21.485706329345703, "global_step": 82669, "epoch": 996} {"train_loss": -21.180997848510742, "global_step": 82670, "epoch": 996} {"train_loss": -20.9179744720459, "global_step": 82671, "epoch": 996} {"train_loss": -21.13479995727539, "global_step": 82672, "epoch": 996} {"train_loss": -21.102792739868164, "global_step": 82673, "epoch": 996} {"train_loss": -21.527633666992188, "global_step": 82674, "epoch": 996} {"train_loss": -21.24597930908203, "global_step": 82675, "epoch": 996} {"train_loss": -21.115419387817383, "global_step": 82676, "epoch": 996} {"train_loss": -21.319868087768555, "global_step": 82677, "epoch": 996} {"train_loss": -21.370389938354492, "global_step": 82678, "epoch": 996} {"train_loss": -21.386322021484375, "global_step": 82679, "epoch": 996} {"train_loss": -21.275592803955078, "global_step": 82680, "epoch": 996} {"train_loss": -21.266881942749023, "global_step": 82681, "epoch": 996} {"train_loss": -21.1057071685791, "global_step": 82682, "epoch": 996} {"train_loss": -21.344646453857422, "global_step": 82683, "epoch": 996} {"train_loss": -21.374990463256836, "global_step": 82684, "epoch": 996} {"train_loss": -21.057458877563477, "global_step": 82685, "epoch": 996} {"train_loss": -20.88590431213379, "global_step": 82686, "epoch": 996} {"train_loss": -21.484333038330078, "global_step": 82687, "epoch": 996} {"train_loss": -21.26804542541504, "global_step": 82688, "epoch": 996} {"train_loss": -21.600784301757812, "global_step": 82689, "epoch": 996} {"train_loss": -21.095783233642578, "global_step": 82690, "epoch": 996} {"train_loss": -21.17811393737793, "global_step": 82691, "epoch": 996} {"train_loss": -21.404937744140625, "global_step": 82692, "epoch": 996} {"train_loss": -21.323741912841797, "global_step": 82693, "epoch": 996} {"train_loss": -21.345111846923828, "global_step": 82694, "epoch": 996} {"train_loss": -21.43296241760254, "global_step": 82695, "epoch": 996} {"train_loss": -21.45503044128418, "global_step": 82696, "epoch": 996} {"train_loss": -21.339757919311523, "global_step": 82697, "epoch": 996} {"train_loss": -21.512781143188477, "global_step": 82698, "epoch": 996} {"train_loss": -21.07733917236328, "global_step": 82699, "epoch": 996} {"train_loss": -21.613454818725586, "global_step": 82700, "epoch": 996} {"train_loss": -21.121320724487305, "global_step": 82701, "epoch": 996} {"train_loss": -21.387052536010742, "global_step": 82702, "epoch": 996} {"train_loss": -21.098947525024414, "global_step": 82703, "epoch": 996} {"train_loss": -21.408905029296875, "global_step": 82704, "epoch": 996} {"train_loss": -21.317834854125977, "global_step": 82705, "epoch": 996} {"train_loss": -21.341629028320312, "global_step": 82706, "epoch": 996} {"train_loss": -21.404428482055664, "global_step": 82707, "epoch": 996} {"train_loss": -21.390899658203125, "global_step": 82708, "epoch": 996} {"train_loss": -21.28657341003418, "global_step": 82709, "epoch": 996} {"train_loss": -21.42808723449707, "global_step": 82710, "epoch": 996} {"train_loss": -21.12102699279785, "global_step": 82711, "epoch": 996} {"train_loss": -21.71661949157715, "global_step": 82712, "epoch": 996} {"train_loss": -21.27955436706543, "global_step": 82713, "epoch": 996} {"train_loss": -21.701053619384766, "global_step": 82714, "epoch": 996} {"train_loss": -21.278650283813477, "global_step": 82715, "epoch": 996} {"train_loss": -21.200929641723633, "global_step": 82716, "epoch": 996} {"train_loss": -21.749237060546875, "global_step": 82717, "epoch": 996} {"train_loss": -21.04728126525879, "global_step": 82718, "epoch": 996} {"train_loss": -21.247705459594727, "global_step": 82719, "epoch": 996} {"train_loss": -21.39893913269043, "global_step": 82720, "epoch": 996} {"train_loss": -21.319631576538086, "global_step": 82721, "epoch": 996} {"train_loss": -21.204923629760742, "global_step": 82722, "epoch": 996} {"train_loss": -21.343887329101562, "global_step": 82723, "epoch": 996} {"train_loss": -21.219804763793945, "global_step": 82724, "epoch": 996} {"train_loss": -21.631528854370117, "global_step": 82725, "epoch": 996} {"train_loss": -21.337739944458008, "global_step": 82726, "epoch": 996} {"train_loss": -21.209163665771484, "global_step": 82727, "epoch": 996} {"train_loss": -20.91750144958496, "global_step": 82728, "epoch": 996} {"train_loss": -20.908536911010742, "global_step": 82729, "epoch": 996} {"train_loss": -20.983768463134766, "global_step": 82730, "epoch": 996} {"train_loss": -21.10109519958496, "global_step": 82731, "epoch": 996} {"train_loss": -21.40119743347168, "global_step": 82732, "epoch": 996} {"train_loss": -21.325862884521484, "global_step": 82733, "epoch": 996} {"train_loss": -21.148839950561523, "global_step": 82734, "epoch": 996} {"train_loss": -21.21304702758789, "global_step": 82735, "epoch": 996} {"train_loss": -21.464603424072266, "global_step": 82736, "epoch": 996} {"train_loss": -21.120746612548828, "global_step": 82737, "epoch": 996} {"train_loss": -21.195981979370117, "global_step": 82738, "epoch": 996} {"train_loss": -21.077096939086914, "global_step": 82739, "epoch": 996} {"train_loss": -21.187755584716797, "global_step": 82740, "epoch": 996} {"train_loss": -21.033109664916992, "global_step": 82741, "epoch": 996} {"train_loss": -21.532058715820312, "global_step": 82742, "epoch": 996} {"train_loss": -21.106708526611328, "global_step": 82743, "epoch": 996} {"train_loss": -21.183820724487305, "global_step": 82744, "epoch": 996} {"train_loss": -21.305570602416992, "global_step": 82745, "epoch": 996} {"train_loss": -20.942174911499023, "global_step": 82746, "epoch": 996} {"train_loss": -21.351760864257812, "global_step": 82747, "epoch": 996} {"train_loss": -21.4874267578125, "global_step": 82748, "epoch": 996} {"train_loss": -20.99071502685547, "global_step": 82749, "epoch": 996} {"train_loss": -21.300238023321313, "global_step": 82750, "epoch": 996, "val_loss": 5872948.0} {"train_loss": -20.36042022705078, "global_step": 82751, "epoch": 997} {"train_loss": -20.62074851989746, "global_step": 82752, "epoch": 997} {"train_loss": -20.73383140563965, "global_step": 82753, "epoch": 997} {"train_loss": -20.48468017578125, "global_step": 82754, "epoch": 997} {"train_loss": -20.909746170043945, "global_step": 82755, "epoch": 997} {"train_loss": -20.71248435974121, "global_step": 82756, "epoch": 997} {"train_loss": -21.1835880279541, "global_step": 82757, "epoch": 997} {"train_loss": -21.07939910888672, "global_step": 82758, "epoch": 997} {"train_loss": -20.727949142456055, "global_step": 82759, "epoch": 997} {"train_loss": -20.56982421875, "global_step": 82760, "epoch": 997} {"train_loss": -21.094100952148438, "global_step": 82761, "epoch": 997} {"train_loss": -20.775150299072266, "global_step": 82762, "epoch": 997} {"train_loss": -20.733266830444336, "global_step": 82763, "epoch": 997} {"train_loss": -20.795963287353516, "global_step": 82764, "epoch": 997} {"train_loss": -21.023046493530273, "global_step": 82765, "epoch": 997} {"train_loss": -21.262353897094727, "global_step": 82766, "epoch": 997} {"train_loss": -21.01376724243164, "global_step": 82767, "epoch": 997} {"train_loss": -21.00157356262207, "global_step": 82768, "epoch": 997} {"train_loss": -21.21587562561035, "global_step": 82769, "epoch": 997} {"train_loss": -21.307039260864258, "global_step": 82770, "epoch": 997} {"train_loss": -21.10822105407715, "global_step": 82771, "epoch": 997} {"train_loss": -21.31148338317871, "global_step": 82772, "epoch": 997} {"train_loss": -21.258764266967773, "global_step": 82773, "epoch": 997} {"train_loss": -21.156423568725586, "global_step": 82774, "epoch": 997} {"train_loss": -21.47369956970215, "global_step": 82775, "epoch": 997} {"train_loss": -21.176589965820312, "global_step": 82776, "epoch": 997} {"train_loss": -21.077363967895508, "global_step": 82777, "epoch": 997} {"train_loss": -20.99637794494629, "global_step": 82778, "epoch": 997} {"train_loss": -21.598163604736328, "global_step": 82779, "epoch": 997} {"train_loss": -21.535146713256836, "global_step": 82780, "epoch": 997} {"train_loss": -21.20112419128418, "global_step": 82781, "epoch": 997} {"train_loss": -21.263914108276367, "global_step": 82782, "epoch": 997} {"train_loss": -21.057138442993164, "global_step": 82783, "epoch": 997} {"train_loss": -21.550556182861328, "global_step": 82784, "epoch": 997} {"train_loss": -21.300491333007812, "global_step": 82785, "epoch": 997} {"train_loss": -21.35750389099121, "global_step": 82786, "epoch": 997} {"train_loss": -21.20172691345215, "global_step": 82787, "epoch": 997} {"train_loss": -21.352069854736328, "global_step": 82788, "epoch": 997} {"train_loss": -21.463781356811523, "global_step": 82789, "epoch": 997} {"train_loss": -21.74152183532715, "global_step": 82790, "epoch": 997} {"train_loss": -21.580015182495117, "global_step": 82791, "epoch": 997} {"train_loss": -21.13246726989746, "global_step": 82792, "epoch": 997} {"train_loss": -21.463232040405273, "global_step": 82793, "epoch": 997} {"train_loss": -21.313024520874023, "global_step": 82794, "epoch": 997} {"train_loss": -20.93279457092285, "global_step": 82795, "epoch": 997} {"train_loss": -21.454273223876953, "global_step": 82796, "epoch": 997} {"train_loss": -20.941904067993164, "global_step": 82797, "epoch": 997} {"train_loss": -21.322813034057617, "global_step": 82798, "epoch": 997} {"train_loss": -21.406198501586914, "global_step": 82799, "epoch": 997} {"train_loss": -21.399024963378906, "global_step": 82800, "epoch": 997} {"train_loss": -21.44327163696289, "global_step": 82801, "epoch": 997} {"train_loss": -21.288860321044922, "global_step": 82802, "epoch": 997} {"train_loss": -21.32111167907715, "global_step": 82803, "epoch": 997} {"train_loss": -21.104284286499023, "global_step": 82804, "epoch": 997} {"train_loss": -21.08320426940918, "global_step": 82805, "epoch": 997} {"train_loss": -21.52076530456543, "global_step": 82806, "epoch": 997} {"train_loss": -21.412145614624023, "global_step": 82807, "epoch": 997} {"train_loss": -21.353696823120117, "global_step": 82808, "epoch": 997} {"train_loss": -21.514680862426758, "global_step": 82809, "epoch": 997} {"train_loss": -21.386438369750977, "global_step": 82810, "epoch": 997} {"train_loss": -21.43963623046875, "global_step": 82811, "epoch": 997} {"train_loss": -21.332935333251953, "global_step": 82812, "epoch": 997} {"train_loss": -21.581775665283203, "global_step": 82813, "epoch": 997} {"train_loss": -21.407367706298828, "global_step": 82814, "epoch": 997} {"train_loss": -21.74616050720215, "global_step": 82815, "epoch": 997} {"train_loss": -21.576528549194336, "global_step": 82816, "epoch": 997} {"train_loss": -21.18816375732422, "global_step": 82817, "epoch": 997} {"train_loss": -21.331436157226562, "global_step": 82818, "epoch": 997} {"train_loss": -21.676572799682617, "global_step": 82819, "epoch": 997} {"train_loss": -21.248428344726562, "global_step": 82820, "epoch": 997} {"train_loss": -21.54128074645996, "global_step": 82821, "epoch": 997} {"train_loss": -21.38702392578125, "global_step": 82822, "epoch": 997} {"train_loss": -21.39133644104004, "global_step": 82823, "epoch": 997} {"train_loss": -21.479537963867188, "global_step": 82824, "epoch": 997} {"train_loss": -21.320743560791016, "global_step": 82825, "epoch": 997} {"train_loss": -21.54510498046875, "global_step": 82826, "epoch": 997} {"train_loss": -21.31892204284668, "global_step": 82827, "epoch": 997} {"train_loss": -21.35487174987793, "global_step": 82828, "epoch": 997} {"train_loss": -21.368772506713867, "global_step": 82829, "epoch": 997} {"train_loss": -21.729978561401367, "global_step": 82830, "epoch": 997} {"train_loss": -20.957618713378906, "global_step": 82831, "epoch": 997} {"train_loss": -21.38674545288086, "global_step": 82832, "epoch": 997} {"train_loss": -21.24812617933894, "global_step": 82833, "epoch": 997, "val_loss": 5998141.5} {"train_loss": -20.57819175720215, "global_step": 82834, "epoch": 998} {"train_loss": -20.981746673583984, "global_step": 82835, "epoch": 998} {"train_loss": -20.480100631713867, "global_step": 82836, "epoch": 998} {"train_loss": -21.0177001953125, "global_step": 82837, "epoch": 998} {"train_loss": -20.55328941345215, "global_step": 82838, "epoch": 998} {"train_loss": -20.726930618286133, "global_step": 82839, "epoch": 998} {"train_loss": -21.145788192749023, "global_step": 82840, "epoch": 998} {"train_loss": -20.979589462280273, "global_step": 82841, "epoch": 998} {"train_loss": -20.837827682495117, "global_step": 82842, "epoch": 998} {"train_loss": -20.775638580322266, "global_step": 82843, "epoch": 998} {"train_loss": -21.348148345947266, "global_step": 82844, "epoch": 998} {"train_loss": -20.956846237182617, "global_step": 82845, "epoch": 998} {"train_loss": -21.08035659790039, "global_step": 82846, "epoch": 998} {"train_loss": -21.215513229370117, "global_step": 82847, "epoch": 998} {"train_loss": -21.07550621032715, "global_step": 82848, "epoch": 998} {"train_loss": -21.37491226196289, "global_step": 82849, "epoch": 998} {"train_loss": -21.482990264892578, "global_step": 82850, "epoch": 998} {"train_loss": -20.98063087463379, "global_step": 82851, "epoch": 998} {"train_loss": -21.240436553955078, "global_step": 82852, "epoch": 998} {"train_loss": -21.006439208984375, "global_step": 82853, "epoch": 998} {"train_loss": -21.356746673583984, "global_step": 82854, "epoch": 998} {"train_loss": -21.53681182861328, "global_step": 82855, "epoch": 998} {"train_loss": -21.491483688354492, "global_step": 82856, "epoch": 998} {"train_loss": -21.094362258911133, "global_step": 82857, "epoch": 998} {"train_loss": -21.190401077270508, "global_step": 82858, "epoch": 998} {"train_loss": -21.320419311523438, "global_step": 82859, "epoch": 998} {"train_loss": -21.46705436706543, "global_step": 82860, "epoch": 998} {"train_loss": -21.172630310058594, "global_step": 82861, "epoch": 998} {"train_loss": -21.378019332885742, "global_step": 82862, "epoch": 998} {"train_loss": -21.303762435913086, "global_step": 82863, "epoch": 998} {"train_loss": -21.490659713745117, "global_step": 82864, "epoch": 998} {"train_loss": -21.39820098876953, "global_step": 82865, "epoch": 998} {"train_loss": -21.153472900390625, "global_step": 82866, "epoch": 998} {"train_loss": -21.29779624938965, "global_step": 82867, "epoch": 998} {"train_loss": -21.415267944335938, "global_step": 82868, "epoch": 998} {"train_loss": -21.484357833862305, "global_step": 82869, "epoch": 998} {"train_loss": -21.55229377746582, "global_step": 82870, "epoch": 998} {"train_loss": -21.278257369995117, "global_step": 82871, "epoch": 998} {"train_loss": -21.231069564819336, "global_step": 82872, "epoch": 998} {"train_loss": -20.90378189086914, "global_step": 82873, "epoch": 998} {"train_loss": -21.004070281982422, "global_step": 82874, "epoch": 998} {"train_loss": -21.693992614746094, "global_step": 82875, "epoch": 998} {"train_loss": -21.00711441040039, "global_step": 82876, "epoch": 998} {"train_loss": -21.091428756713867, "global_step": 82877, "epoch": 998} {"train_loss": -21.443283081054688, "global_step": 82878, "epoch": 998} {"train_loss": -20.998260498046875, "global_step": 82879, "epoch": 998} {"train_loss": -21.42591094970703, "global_step": 82880, "epoch": 998} {"train_loss": -21.343036651611328, "global_step": 82881, "epoch": 998} {"train_loss": -21.199926376342773, "global_step": 82882, "epoch": 998} {"train_loss": -21.340368270874023, "global_step": 82883, "epoch": 998} {"train_loss": -21.397653579711914, "global_step": 82884, "epoch": 998} {"train_loss": -21.625507354736328, "global_step": 82885, "epoch": 998} {"train_loss": -21.10219383239746, "global_step": 82886, "epoch": 998} {"train_loss": -21.34392738342285, "global_step": 82887, "epoch": 998} {"train_loss": -21.019487380981445, "global_step": 82888, "epoch": 998} {"train_loss": -21.251440048217773, "global_step": 82889, "epoch": 998} {"train_loss": -20.980857849121094, "global_step": 82890, "epoch": 998} {"train_loss": -21.485700607299805, "global_step": 82891, "epoch": 998} {"train_loss": -21.045581817626953, "global_step": 82892, "epoch": 998} {"train_loss": -21.284778594970703, "global_step": 82893, "epoch": 998} {"train_loss": -21.496309280395508, "global_step": 82894, "epoch": 998} {"train_loss": -21.613662719726562, "global_step": 82895, "epoch": 998} {"train_loss": -21.316038131713867, "global_step": 82896, "epoch": 998} {"train_loss": -21.740949630737305, "global_step": 82897, "epoch": 998} {"train_loss": -21.266036987304688, "global_step": 82898, "epoch": 998} {"train_loss": -21.36762809753418, "global_step": 82899, "epoch": 998} {"train_loss": -21.202470779418945, "global_step": 82900, "epoch": 998} {"train_loss": -21.323453903198242, "global_step": 82901, "epoch": 998} {"train_loss": -21.6928768157959, "global_step": 82902, "epoch": 998} {"train_loss": -21.172290802001953, "global_step": 82903, "epoch": 998} {"train_loss": -21.55237579345703, "global_step": 82904, "epoch": 998} {"train_loss": -21.08672523498535, "global_step": 82905, "epoch": 998} {"train_loss": -21.533653259277344, "global_step": 82906, "epoch": 998} {"train_loss": -20.95881462097168, "global_step": 82907, "epoch": 998} {"train_loss": -21.239253997802734, "global_step": 82908, "epoch": 998} {"train_loss": -21.286252975463867, "global_step": 82909, "epoch": 998} {"train_loss": -20.690719604492188, "global_step": 82910, "epoch": 998} {"train_loss": -21.2926025390625, "global_step": 82911, "epoch": 998} {"train_loss": -21.541494369506836, "global_step": 82912, "epoch": 998} {"train_loss": -21.444921493530273, "global_step": 82913, "epoch": 998} {"train_loss": -21.07734489440918, "global_step": 82914, "epoch": 998} {"train_loss": -21.0029354095459, "global_step": 82915, "epoch": 998} {"train_loss": -21.2272570966238, "global_step": 82916, "epoch": 998, "val_loss": 6161042.0} {"train_loss": -21.007816314697266, "global_step": 82917, "epoch": 999} {"train_loss": -21.239973068237305, "global_step": 82918, "epoch": 999} {"train_loss": -20.92169189453125, "global_step": 82919, "epoch": 999} {"train_loss": -20.995325088500977, "global_step": 82920, "epoch": 999} {"train_loss": -21.57126235961914, "global_step": 82921, "epoch": 999} {"train_loss": -20.989973068237305, "global_step": 82922, "epoch": 999} {"train_loss": -20.887176513671875, "global_step": 82923, "epoch": 999} {"train_loss": -21.07355308532715, "global_step": 82924, "epoch": 999} {"train_loss": -20.95989227294922, "global_step": 82925, "epoch": 999} {"train_loss": -21.251340866088867, "global_step": 82926, "epoch": 999} {"train_loss": -21.566682815551758, "global_step": 82927, "epoch": 999} {"train_loss": -21.281084060668945, "global_step": 82928, "epoch": 999} {"train_loss": -21.1489315032959, "global_step": 82929, "epoch": 999} {"train_loss": -20.990896224975586, "global_step": 82930, "epoch": 999} {"train_loss": -21.104995727539062, "global_step": 82931, "epoch": 999} {"train_loss": -20.701095581054688, "global_step": 82932, "epoch": 999} {"train_loss": -21.317245483398438, "global_step": 82933, "epoch": 999} {"train_loss": -21.61366081237793, "global_step": 82934, "epoch": 999} {"train_loss": -21.04071617126465, "global_step": 82935, "epoch": 999} {"train_loss": -21.214275360107422, "global_step": 82936, "epoch": 999} {"train_loss": -21.699874877929688, "global_step": 82937, "epoch": 999} {"train_loss": -21.058490753173828, "global_step": 82938, "epoch": 999} {"train_loss": -21.399213790893555, "global_step": 82939, "epoch": 999} {"train_loss": -21.334518432617188, "global_step": 82940, "epoch": 999} {"train_loss": -21.435165405273438, "global_step": 82941, "epoch": 999} {"train_loss": -21.209278106689453, "global_step": 82942, "epoch": 999} {"train_loss": -21.033782958984375, "global_step": 82943, "epoch": 999} {"train_loss": -21.276697158813477, "global_step": 82944, "epoch": 999} {"train_loss": -21.54376792907715, "global_step": 82945, "epoch": 999} {"train_loss": -21.133337020874023, "global_step": 82946, "epoch": 999} {"train_loss": -21.361570358276367, "global_step": 82947, "epoch": 999} {"train_loss": -21.3648681640625, "global_step": 82948, "epoch": 999} {"train_loss": -21.358577728271484, "global_step": 82949, "epoch": 999} {"train_loss": -21.4199275970459, "global_step": 82950, "epoch": 999} {"train_loss": -21.22559928894043, "global_step": 82951, "epoch": 999} {"train_loss": -21.342321395874023, "global_step": 82952, "epoch": 999} {"train_loss": -21.4119873046875, "global_step": 82953, "epoch": 999} {"train_loss": -21.476652145385742, "global_step": 82954, "epoch": 999} {"train_loss": -21.610597610473633, "global_step": 82955, "epoch": 999} {"train_loss": -21.298297882080078, "global_step": 82956, "epoch": 999} {"train_loss": -21.41364860534668, "global_step": 82957, "epoch": 999} {"train_loss": -21.342121124267578, "global_step": 82958, "epoch": 999} {"train_loss": -21.659597396850586, "global_step": 82959, "epoch": 999} {"train_loss": -21.15109634399414, "global_step": 82960, "epoch": 999} {"train_loss": -20.826536178588867, "global_step": 82961, "epoch": 999} {"train_loss": -21.209341049194336, "global_step": 82962, "epoch": 999} {"train_loss": -21.245588302612305, "global_step": 82963, "epoch": 999} {"train_loss": -21.53537940979004, "global_step": 82964, "epoch": 999} {"train_loss": -21.27465057373047, "global_step": 82965, "epoch": 999} {"train_loss": -21.345212936401367, "global_step": 82966, "epoch": 999} {"train_loss": -21.234697341918945, "global_step": 82967, "epoch": 999} {"train_loss": -21.455244064331055, "global_step": 82968, "epoch": 999} {"train_loss": -21.642194747924805, "global_step": 82969, "epoch": 999} {"train_loss": -21.74997901916504, "global_step": 82970, "epoch": 999} {"train_loss": -21.533769607543945, "global_step": 82971, "epoch": 999} {"train_loss": -20.952346801757812, "global_step": 82972, "epoch": 999} {"train_loss": -21.495481491088867, "global_step": 82973, "epoch": 999} {"train_loss": -21.20423698425293, "global_step": 82974, "epoch": 999} {"train_loss": -21.341873168945312, "global_step": 82975, "epoch": 999} {"train_loss": -21.446949005126953, "global_step": 82976, "epoch": 999} {"train_loss": -21.3831844329834, "global_step": 82977, "epoch": 999} {"train_loss": -21.501497268676758, "global_step": 82978, "epoch": 999} {"train_loss": -21.485584259033203, "global_step": 82979, "epoch": 999} {"train_loss": -21.342071533203125, "global_step": 82980, "epoch": 999} {"train_loss": -21.240659713745117, "global_step": 82981, "epoch": 999} {"train_loss": -21.431928634643555, "global_step": 82982, "epoch": 999} {"train_loss": -21.518526077270508, "global_step": 82983, "epoch": 999} {"train_loss": -21.13962745666504, "global_step": 82984, "epoch": 999} {"train_loss": -20.75381851196289, "global_step": 82985, "epoch": 999} {"train_loss": -21.23974609375, "global_step": 82986, "epoch": 999} {"train_loss": -21.598129272460938, "global_step": 82987, "epoch": 999} {"train_loss": -21.545000076293945, "global_step": 82988, "epoch": 999} {"train_loss": -21.55517578125, "global_step": 82989, "epoch": 999} {"train_loss": -21.344038009643555, "global_step": 82990, "epoch": 999} {"train_loss": -21.48341178894043, "global_step": 82991, "epoch": 999} {"train_loss": -21.25799560546875, "global_step": 82992, "epoch": 999} {"train_loss": -21.192781448364258, "global_step": 82993, "epoch": 999} {"train_loss": -21.231603622436523, "global_step": 82994, "epoch": 999} {"train_loss": -21.130924224853516, "global_step": 82995, "epoch": 999} {"train_loss": -21.12531089782715, "global_step": 82996, "epoch": 999} {"train_loss": -21.12812614440918, "global_step": 82997, "epoch": 999} {"train_loss": -21.370595932006836, "global_step": 82998, "epoch": 999} {"train_loss": -21.29754077957337, "global_step": 82999, "epoch": 999, "val_loss": 5926293.5} {"train_loss": -20.788728713989258, "global_step": 83000, "epoch": 1000} {"train_loss": -21.0272274017334, "global_step": 83001, "epoch": 1000} {"train_loss": -20.927112579345703, "global_step": 83002, "epoch": 1000} {"train_loss": -21.0233097076416, "global_step": 83003, "epoch": 1000} {"train_loss": -21.332992553710938, "global_step": 83004, "epoch": 1000} {"train_loss": -21.286142349243164, "global_step": 83005, "epoch": 1000} {"train_loss": -21.174776077270508, "global_step": 83006, "epoch": 1000} {"train_loss": -21.37911033630371, "global_step": 83007, "epoch": 1000} {"train_loss": -21.090362548828125, "global_step": 83008, "epoch": 1000} {"train_loss": -20.89045524597168, "global_step": 83009, "epoch": 1000} {"train_loss": -21.272218704223633, "global_step": 83010, "epoch": 1000} {"train_loss": -21.187641143798828, "global_step": 83011, "epoch": 1000} {"train_loss": -21.03726577758789, "global_step": 83012, "epoch": 1000} {"train_loss": -21.36297607421875, "global_step": 83013, "epoch": 1000} {"train_loss": -21.206504821777344, "global_step": 83014, "epoch": 1000} {"train_loss": -21.519018173217773, "global_step": 83015, "epoch": 1000} {"train_loss": -21.031919479370117, "global_step": 83016, "epoch": 1000} {"train_loss": -21.21604347229004, "global_step": 83017, "epoch": 1000} {"train_loss": -21.07124137878418, "global_step": 83018, "epoch": 1000} {"train_loss": -21.806718826293945, "global_step": 83019, "epoch": 1000} {"train_loss": -21.176177978515625, "global_step": 83020, "epoch": 1000} {"train_loss": -21.075571060180664, "global_step": 83021, "epoch": 1000} {"train_loss": -21.21430015563965, "global_step": 83022, "epoch": 1000} {"train_loss": -21.216190338134766, "global_step": 83023, "epoch": 1000} {"train_loss": -21.092859268188477, "global_step": 83024, "epoch": 1000} {"train_loss": -21.293386459350586, "global_step": 83025, "epoch": 1000} {"train_loss": -21.714059829711914, "global_step": 83026, "epoch": 1000} {"train_loss": -21.17645835876465, "global_step": 83027, "epoch": 1000} {"train_loss": -21.508909225463867, "global_step": 83028, "epoch": 1000} {"train_loss": -21.33551025390625, "global_step": 83029, "epoch": 1000} {"train_loss": -21.064062118530273, "global_step": 83030, "epoch": 1000} {"train_loss": -21.36707305908203, "global_step": 83031, "epoch": 1000} {"train_loss": -21.54762077331543, "global_step": 83032, "epoch": 1000} {"train_loss": -21.274303436279297, "global_step": 83033, "epoch": 1000} {"train_loss": -21.43565559387207, "global_step": 83034, "epoch": 1000} {"train_loss": -21.298460006713867, "global_step": 83035, "epoch": 1000} {"train_loss": -21.25788688659668, "global_step": 83036, "epoch": 1000} {"train_loss": -21.542306900024414, "global_step": 83037, "epoch": 1000} {"train_loss": -21.514108657836914, "global_step": 83038, "epoch": 1000} {"train_loss": -21.76520347595215, "global_step": 83039, "epoch": 1000} {"train_loss": -21.432825088500977, "global_step": 83040, "epoch": 1000} {"train_loss": -21.601669311523438, "global_step": 83041, "epoch": 1000} {"train_loss": -21.181659698486328, "global_step": 83042, "epoch": 1000} {"train_loss": -21.481048583984375, "global_step": 83043, "epoch": 1000} {"train_loss": -21.47921371459961, "global_step": 83044, "epoch": 1000} {"train_loss": -21.40114402770996, "global_step": 83045, "epoch": 1000} {"train_loss": -21.04233169555664, "global_step": 83046, "epoch": 1000} {"train_loss": -21.428203582763672, "global_step": 83047, "epoch": 1000} {"train_loss": -21.253103256225586, "global_step": 83048, "epoch": 1000} {"train_loss": -21.492849349975586, "global_step": 83049, "epoch": 1000} {"train_loss": -21.366758346557617, "global_step": 83050, "epoch": 1000} {"train_loss": -21.334177017211914, "global_step": 83051, "epoch": 1000} {"train_loss": -21.724821090698242, "global_step": 83052, "epoch": 1000} {"train_loss": -20.76907730102539, "global_step": 83053, "epoch": 1000} {"train_loss": -21.508649826049805, "global_step": 83054, "epoch": 1000} {"train_loss": -21.415678024291992, "global_step": 83055, "epoch": 1000} {"train_loss": -21.754423141479492, "global_step": 83056, "epoch": 1000} {"train_loss": -21.226943969726562, "global_step": 83057, "epoch": 1000} {"train_loss": -21.349369049072266, "global_step": 83058, "epoch": 1000} {"train_loss": -21.26946449279785, "global_step": 83059, "epoch": 1000} {"train_loss": -21.549543380737305, "global_step": 83060, "epoch": 1000} {"train_loss": -21.240705490112305, "global_step": 83061, "epoch": 1000} {"train_loss": -21.628934860229492, "global_step": 83062, "epoch": 1000} {"train_loss": -21.205677032470703, "global_step": 83063, "epoch": 1000} {"train_loss": -21.127349853515625, "global_step": 83064, "epoch": 1000} {"train_loss": -21.5671443939209, "global_step": 83065, "epoch": 1000} {"train_loss": -21.475996017456055, "global_step": 83066, "epoch": 1000} {"train_loss": -21.451549530029297, "global_step": 83067, "epoch": 1000} {"train_loss": -21.678579330444336, "global_step": 83068, "epoch": 1000} {"train_loss": -21.679933547973633, "global_step": 83069, "epoch": 1000} {"train_loss": -21.824081420898438, "global_step": 83070, "epoch": 1000} {"train_loss": -21.58374786376953, "global_step": 83071, "epoch": 1000} {"train_loss": -21.544485092163086, "global_step": 83072, "epoch": 1000} {"train_loss": -21.463499069213867, "global_step": 83073, "epoch": 1000} {"train_loss": -21.91314125061035, "global_step": 83074, "epoch": 1000} {"train_loss": -21.216625213623047, "global_step": 83075, "epoch": 1000} {"train_loss": -21.23396873474121, "global_step": 83076, "epoch": 1000} {"train_loss": -21.310148239135742, "global_step": 83077, "epoch": 1000} {"train_loss": -21.351533889770508, "global_step": 83078, "epoch": 1000} {"train_loss": -21.005474090576172, "global_step": 83079, "epoch": 1000} {"train_loss": -20.64974594116211, "global_step": 83080, "epoch": 1000} {"train_loss": -21.359148025512695, "global_step": 83081, "epoch": 1000} {"train_loss": -21.346651582832795, "global_step": 83082, "epoch": 1000, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 5983882.5} {"train_loss": -21.308637619018555, "global_step": 83083, "epoch": 1001} {"train_loss": -20.369522094726562, "global_step": 83084, "epoch": 1001} {"train_loss": -21.20981788635254, "global_step": 83085, "epoch": 1001} {"train_loss": -21.0553035736084, "global_step": 83086, "epoch": 1001} {"train_loss": -21.30344009399414, "global_step": 83087, "epoch": 1001} {"train_loss": -20.92913246154785, "global_step": 83088, "epoch": 1001} {"train_loss": -20.852489471435547, "global_step": 83089, "epoch": 1001} {"train_loss": -21.335920333862305, "global_step": 83090, "epoch": 1001} {"train_loss": -20.97313690185547, "global_step": 83091, "epoch": 1001} {"train_loss": -20.904584884643555, "global_step": 83092, "epoch": 1001} {"train_loss": -21.235498428344727, "global_step": 83093, "epoch": 1001} {"train_loss": -20.927722930908203, "global_step": 83094, "epoch": 1001} {"train_loss": -21.33368492126465, "global_step": 83095, "epoch": 1001} {"train_loss": -21.104734420776367, "global_step": 83096, "epoch": 1001} {"train_loss": -21.192075729370117, "global_step": 83097, "epoch": 1001} {"train_loss": -21.31403923034668, "global_step": 83098, "epoch": 1001} {"train_loss": -21.15065574645996, "global_step": 83099, "epoch": 1001} {"train_loss": -21.595951080322266, "global_step": 83100, "epoch": 1001} {"train_loss": -21.13778305053711, "global_step": 83101, "epoch": 1001} {"train_loss": -21.177959442138672, "global_step": 83102, "epoch": 1001} {"train_loss": -21.310230255126953, "global_step": 83103, "epoch": 1001} {"train_loss": -21.649282455444336, "global_step": 83104, "epoch": 1001} {"train_loss": -21.140291213989258, "global_step": 83105, "epoch": 1001} {"train_loss": -21.09547996520996, "global_step": 83106, "epoch": 1001} {"train_loss": -21.552490234375, "global_step": 83107, "epoch": 1001} {"train_loss": -21.321744918823242, "global_step": 83108, "epoch": 1001} {"train_loss": -21.498188018798828, "global_step": 83109, "epoch": 1001} {"train_loss": -21.25072479248047, "global_step": 83110, "epoch": 1001} {"train_loss": -21.07958984375, "global_step": 83111, "epoch": 1001} {"train_loss": -21.367525100708008, "global_step": 83112, "epoch": 1001} {"train_loss": -21.553281784057617, "global_step": 83113, "epoch": 1001} {"train_loss": -21.203874588012695, "global_step": 83114, "epoch": 1001} {"train_loss": -21.24837875366211, "global_step": 83115, "epoch": 1001} {"train_loss": -21.504301071166992, "global_step": 83116, "epoch": 1001} {"train_loss": -21.035751342773438, "global_step": 83117, "epoch": 1001} {"train_loss": -21.410202026367188, "global_step": 83118, "epoch": 1001} {"train_loss": -21.25978660583496, "global_step": 83119, "epoch": 1001} {"train_loss": -21.5366268157959, "global_step": 83120, "epoch": 1001} {"train_loss": -21.721330642700195, "global_step": 83121, "epoch": 1001} {"train_loss": -21.27439308166504, "global_step": 83122, "epoch": 1001} {"train_loss": -21.56675148010254, "global_step": 83123, "epoch": 1001} {"train_loss": -21.23151397705078, "global_step": 83124, "epoch": 1001} {"train_loss": -21.920705795288086, "global_step": 83125, "epoch": 1001} {"train_loss": -21.6668758392334, "global_step": 83126, "epoch": 1001} {"train_loss": -21.382431030273438, "global_step": 83127, "epoch": 1001} {"train_loss": -21.43275260925293, "global_step": 83128, "epoch": 1001} {"train_loss": -21.574270248413086, "global_step": 83129, "epoch": 1001} {"train_loss": -21.288862228393555, "global_step": 83130, "epoch": 1001} {"train_loss": -21.5844783782959, "global_step": 83131, "epoch": 1001} {"train_loss": -21.5688533782959, "global_step": 83132, "epoch": 1001} {"train_loss": -21.29789924621582, "global_step": 83133, "epoch": 1001} {"train_loss": -21.33538055419922, "global_step": 83134, "epoch": 1001} {"train_loss": -21.289562225341797, "global_step": 83135, "epoch": 1001} {"train_loss": -21.505844116210938, "global_step": 83136, "epoch": 1001} {"train_loss": -21.215600967407227, "global_step": 83137, "epoch": 1001} {"train_loss": -21.208087921142578, "global_step": 83138, "epoch": 1001} {"train_loss": -21.547273635864258, "global_step": 83139, "epoch": 1001} {"train_loss": -21.20123863220215, "global_step": 83140, "epoch": 1001} {"train_loss": -21.563318252563477, "global_step": 83141, "epoch": 1001} {"train_loss": -21.520389556884766, "global_step": 83142, "epoch": 1001} {"train_loss": -21.95972442626953, "global_step": 83143, "epoch": 1001} {"train_loss": -21.725982666015625, "global_step": 83144, "epoch": 1001} {"train_loss": -21.094881057739258, "global_step": 83145, "epoch": 1001} {"train_loss": -21.573244094848633, "global_step": 83146, "epoch": 1001} {"train_loss": -20.958118438720703, "global_step": 83147, "epoch": 1001} {"train_loss": -21.374677658081055, "global_step": 83148, "epoch": 1001} {"train_loss": -21.33133888244629, "global_step": 83149, "epoch": 1001} {"train_loss": -21.58549690246582, "global_step": 83150, "epoch": 1001} {"train_loss": -21.252912521362305, "global_step": 83151, "epoch": 1001} {"train_loss": -21.16867446899414, "global_step": 83152, "epoch": 1001} {"train_loss": -21.363664627075195, "global_step": 83153, "epoch": 1001} {"train_loss": -21.483016967773438, "global_step": 83154, "epoch": 1001} {"train_loss": -21.44391632080078, "global_step": 83155, "epoch": 1001} {"train_loss": -21.45465660095215, "global_step": 83156, "epoch": 1001} {"train_loss": -21.279861450195312, "global_step": 83157, "epoch": 1001} {"train_loss": -21.252443313598633, "global_step": 83158, "epoch": 1001} {"train_loss": -21.245864868164062, "global_step": 83159, "epoch": 1001} {"train_loss": -21.666582107543945, "global_step": 83160, "epoch": 1001} {"train_loss": -21.302091598510742, "global_step": 83161, "epoch": 1001} {"train_loss": -21.122394561767578, "global_step": 83162, "epoch": 1001} {"train_loss": -21.293474197387695, "global_step": 83163, "epoch": 1001} {"train_loss": -21.34674835205078, "global_step": 83164, "epoch": 1001} {"train_loss": -21.312518315142896, "global_step": 83165, "epoch": 1001, "val_loss": 6014110.5} {"train_loss": -21.098751068115234, "global_step": 83166, "epoch": 1002} {"train_loss": -21.118749618530273, "global_step": 83167, "epoch": 1002} {"train_loss": -21.434524536132812, "global_step": 83168, "epoch": 1002} {"train_loss": -21.094655990600586, "global_step": 83169, "epoch": 1002} {"train_loss": -21.203876495361328, "global_step": 83170, "epoch": 1002} {"train_loss": -20.85394287109375, "global_step": 83171, "epoch": 1002} {"train_loss": -21.19148826599121, "global_step": 83172, "epoch": 1002} {"train_loss": -21.142744064331055, "global_step": 83173, "epoch": 1002} {"train_loss": -21.038963317871094, "global_step": 83174, "epoch": 1002} {"train_loss": -21.043060302734375, "global_step": 83175, "epoch": 1002} {"train_loss": -21.2362003326416, "global_step": 83176, "epoch": 1002} {"train_loss": -21.247358322143555, "global_step": 83177, "epoch": 1002} {"train_loss": -21.100250244140625, "global_step": 83178, "epoch": 1002} {"train_loss": -21.322500228881836, "global_step": 83179, "epoch": 1002} {"train_loss": -21.095373153686523, "global_step": 83180, "epoch": 1002} {"train_loss": -21.0887393951416, "global_step": 83181, "epoch": 1002} {"train_loss": -21.358810424804688, "global_step": 83182, "epoch": 1002} {"train_loss": -21.287307739257812, "global_step": 83183, "epoch": 1002} {"train_loss": -21.012760162353516, "global_step": 83184, "epoch": 1002} {"train_loss": -21.22365379333496, "global_step": 83185, "epoch": 1002} {"train_loss": -21.119972229003906, "global_step": 83186, "epoch": 1002} {"train_loss": -21.33369255065918, "global_step": 83187, "epoch": 1002} {"train_loss": -20.958311080932617, "global_step": 83188, "epoch": 1002} {"train_loss": -20.795072555541992, "global_step": 83189, "epoch": 1002} {"train_loss": -21.244792938232422, "global_step": 83190, "epoch": 1002} {"train_loss": -21.529016494750977, "global_step": 83191, "epoch": 1002} {"train_loss": -21.627511978149414, "global_step": 83192, "epoch": 1002} {"train_loss": -21.80082130432129, "global_step": 83193, "epoch": 1002} {"train_loss": -21.769153594970703, "global_step": 83194, "epoch": 1002} {"train_loss": -20.784156799316406, "global_step": 83195, "epoch": 1002} {"train_loss": -21.430620193481445, "global_step": 83196, "epoch": 1002} {"train_loss": -21.351028442382812, "global_step": 83197, "epoch": 1002} {"train_loss": -21.10079002380371, "global_step": 83198, "epoch": 1002} {"train_loss": -21.052276611328125, "global_step": 83199, "epoch": 1002} {"train_loss": -20.726652145385742, "global_step": 83200, "epoch": 1002} {"train_loss": -21.27886199951172, "global_step": 83201, "epoch": 1002} {"train_loss": -21.148557662963867, "global_step": 83202, "epoch": 1002} {"train_loss": -21.06648063659668, "global_step": 83203, "epoch": 1002} {"train_loss": -21.66745948791504, "global_step": 83204, "epoch": 1002} {"train_loss": -21.44062042236328, "global_step": 83205, "epoch": 1002} {"train_loss": -21.216327667236328, "global_step": 83206, "epoch": 1002} {"train_loss": -21.25465202331543, "global_step": 83207, "epoch": 1002} {"train_loss": -21.382131576538086, "global_step": 83208, "epoch": 1002} {"train_loss": -21.085819244384766, "global_step": 83209, "epoch": 1002} {"train_loss": -20.888263702392578, "global_step": 83210, "epoch": 1002} {"train_loss": -21.392332077026367, "global_step": 83211, "epoch": 1002} {"train_loss": -21.42012596130371, "global_step": 83212, "epoch": 1002} {"train_loss": -21.143125534057617, "global_step": 83213, "epoch": 1002} {"train_loss": -21.536331176757812, "global_step": 83214, "epoch": 1002} {"train_loss": -20.987897872924805, "global_step": 83215, "epoch": 1002} {"train_loss": -21.034679412841797, "global_step": 83216, "epoch": 1002} {"train_loss": -21.238229751586914, "global_step": 83217, "epoch": 1002} {"train_loss": -20.87619972229004, "global_step": 83218, "epoch": 1002} {"train_loss": -21.00265121459961, "global_step": 83219, "epoch": 1002} {"train_loss": -21.182207107543945, "global_step": 83220, "epoch": 1002} {"train_loss": -21.209856033325195, "global_step": 83221, "epoch": 1002} {"train_loss": -21.293930053710938, "global_step": 83222, "epoch": 1002} {"train_loss": -21.589826583862305, "global_step": 83223, "epoch": 1002} {"train_loss": -21.378982543945312, "global_step": 83224, "epoch": 1002} {"train_loss": -21.7120418548584, "global_step": 83225, "epoch": 1002} {"train_loss": -21.281085968017578, "global_step": 83226, "epoch": 1002} {"train_loss": -21.427291870117188, "global_step": 83227, "epoch": 1002} {"train_loss": -21.166412353515625, "global_step": 83228, "epoch": 1002} {"train_loss": -21.278871536254883, "global_step": 83229, "epoch": 1002} {"train_loss": -21.17573356628418, "global_step": 83230, "epoch": 1002} {"train_loss": -21.359817504882812, "global_step": 83231, "epoch": 1002} {"train_loss": -21.45790672302246, "global_step": 83232, "epoch": 1002} {"train_loss": -21.361557006835938, "global_step": 83233, "epoch": 1002} {"train_loss": -21.44594955444336, "global_step": 83234, "epoch": 1002} {"train_loss": -21.46553611755371, "global_step": 83235, "epoch": 1002} {"train_loss": -21.446456909179688, "global_step": 83236, "epoch": 1002} {"train_loss": -21.253080368041992, "global_step": 83237, "epoch": 1002} {"train_loss": -21.224559783935547, "global_step": 83238, "epoch": 1002} {"train_loss": -21.483983993530273, "global_step": 83239, "epoch": 1002} {"train_loss": -21.359760284423828, "global_step": 83240, "epoch": 1002} {"train_loss": -21.497020721435547, "global_step": 83241, "epoch": 1002} {"train_loss": -21.260419845581055, "global_step": 83242, "epoch": 1002} {"train_loss": -21.47418785095215, "global_step": 83243, "epoch": 1002} {"train_loss": -21.3750057220459, "global_step": 83244, "epoch": 1002} {"train_loss": -21.607574462890625, "global_step": 83245, "epoch": 1002} {"train_loss": -21.319744110107422, "global_step": 83246, "epoch": 1002} {"train_loss": -21.574752807617188, "global_step": 83247, "epoch": 1002} {"train_loss": -21.257930296013154, "global_step": 83248, "epoch": 1002, "val_loss": 6013498.5} {"train_loss": -21.402233123779297, "global_step": 83249, "epoch": 1003} {"train_loss": -21.159448623657227, "global_step": 83250, "epoch": 1003} {"train_loss": -21.207611083984375, "global_step": 83251, "epoch": 1003} {"train_loss": -21.54633140563965, "global_step": 83252, "epoch": 1003} {"train_loss": -21.31243324279785, "global_step": 83253, "epoch": 1003} {"train_loss": -21.187397003173828, "global_step": 83254, "epoch": 1003} {"train_loss": -21.24104881286621, "global_step": 83255, "epoch": 1003} {"train_loss": -21.369861602783203, "global_step": 83256, "epoch": 1003} {"train_loss": -21.247102737426758, "global_step": 83257, "epoch": 1003} {"train_loss": -21.294431686401367, "global_step": 83258, "epoch": 1003} {"train_loss": -21.171234130859375, "global_step": 83259, "epoch": 1003} {"train_loss": -21.226402282714844, "global_step": 83260, "epoch": 1003} {"train_loss": -21.519451141357422, "global_step": 83261, "epoch": 1003} {"train_loss": -20.939762115478516, "global_step": 83262, "epoch": 1003} {"train_loss": -21.27911376953125, "global_step": 83263, "epoch": 1003} {"train_loss": -21.294666290283203, "global_step": 83264, "epoch": 1003} {"train_loss": -20.632959365844727, "global_step": 83265, "epoch": 1003} {"train_loss": -20.875247955322266, "global_step": 83266, "epoch": 1003} {"train_loss": -21.137832641601562, "global_step": 83267, "epoch": 1003} {"train_loss": -21.207717895507812, "global_step": 83268, "epoch": 1003} {"train_loss": -21.24924087524414, "global_step": 83269, "epoch": 1003} {"train_loss": -21.561120986938477, "global_step": 83270, "epoch": 1003} {"train_loss": -21.294179916381836, "global_step": 83271, "epoch": 1003} {"train_loss": -21.17013168334961, "global_step": 83272, "epoch": 1003} {"train_loss": -21.343122482299805, "global_step": 83273, "epoch": 1003} {"train_loss": -21.325637817382812, "global_step": 83274, "epoch": 1003} {"train_loss": -21.428489685058594, "global_step": 83275, "epoch": 1003} {"train_loss": -21.22870635986328, "global_step": 83276, "epoch": 1003} {"train_loss": -21.0262508392334, "global_step": 83277, "epoch": 1003} {"train_loss": -21.62786293029785, "global_step": 83278, "epoch": 1003} {"train_loss": -21.18292808532715, "global_step": 83279, "epoch": 1003} {"train_loss": -21.42896842956543, "global_step": 83280, "epoch": 1003} {"train_loss": -21.37701988220215, "global_step": 83281, "epoch": 1003} {"train_loss": -21.272214889526367, "global_step": 83282, "epoch": 1003} {"train_loss": -21.121944427490234, "global_step": 83283, "epoch": 1003} {"train_loss": -21.789884567260742, "global_step": 83284, "epoch": 1003} {"train_loss": -21.23880958557129, "global_step": 83285, "epoch": 1003} {"train_loss": -21.382160186767578, "global_step": 83286, "epoch": 1003} {"train_loss": -21.36332893371582, "global_step": 83287, "epoch": 1003} {"train_loss": -21.101181030273438, "global_step": 83288, "epoch": 1003} {"train_loss": -21.263593673706055, "global_step": 83289, "epoch": 1003} {"train_loss": -21.64594078063965, "global_step": 83290, "epoch": 1003} {"train_loss": -21.621023178100586, "global_step": 83291, "epoch": 1003} {"train_loss": -21.211339950561523, "global_step": 83292, "epoch": 1003} {"train_loss": -21.186084747314453, "global_step": 83293, "epoch": 1003} {"train_loss": -21.75870704650879, "global_step": 83294, "epoch": 1003} {"train_loss": -21.07830238342285, "global_step": 83295, "epoch": 1003} {"train_loss": -21.232202529907227, "global_step": 83296, "epoch": 1003} {"train_loss": -21.489986419677734, "global_step": 83297, "epoch": 1003} {"train_loss": -21.375368118286133, "global_step": 83298, "epoch": 1003} {"train_loss": -21.364606857299805, "global_step": 83299, "epoch": 1003} {"train_loss": -21.327489852905273, "global_step": 83300, "epoch": 1003} {"train_loss": -21.27030372619629, "global_step": 83301, "epoch": 1003} {"train_loss": -21.203542709350586, "global_step": 83302, "epoch": 1003} {"train_loss": -21.506818771362305, "global_step": 83303, "epoch": 1003} {"train_loss": -21.405696868896484, "global_step": 83304, "epoch": 1003} {"train_loss": -21.43070411682129, "global_step": 83305, "epoch": 1003} {"train_loss": -21.166662216186523, "global_step": 83306, "epoch": 1003} {"train_loss": -21.307767868041992, "global_step": 83307, "epoch": 1003} {"train_loss": -21.34738540649414, "global_step": 83308, "epoch": 1003} {"train_loss": -21.259206771850586, "global_step": 83309, "epoch": 1003} {"train_loss": -21.415504455566406, "global_step": 83310, "epoch": 1003} {"train_loss": -21.662628173828125, "global_step": 83311, "epoch": 1003} {"train_loss": -21.440357208251953, "global_step": 83312, "epoch": 1003} {"train_loss": -21.166717529296875, "global_step": 83313, "epoch": 1003} {"train_loss": -21.43378257751465, "global_step": 83314, "epoch": 1003} {"train_loss": -21.10761070251465, "global_step": 83315, "epoch": 1003} {"train_loss": -21.4876708984375, "global_step": 83316, "epoch": 1003} {"train_loss": -21.500289916992188, "global_step": 83317, "epoch": 1003} {"train_loss": -21.303258895874023, "global_step": 83318, "epoch": 1003} {"train_loss": -21.69417381286621, "global_step": 83319, "epoch": 1003} {"train_loss": -21.37781524658203, "global_step": 83320, "epoch": 1003} {"train_loss": -21.07356071472168, "global_step": 83321, "epoch": 1003} {"train_loss": -21.3583984375, "global_step": 83322, "epoch": 1003} {"train_loss": -21.114660263061523, "global_step": 83323, "epoch": 1003} {"train_loss": -20.91667938232422, "global_step": 83324, "epoch": 1003} {"train_loss": -21.146411895751953, "global_step": 83325, "epoch": 1003} {"train_loss": -21.535411834716797, "global_step": 83326, "epoch": 1003} {"train_loss": -21.35877799987793, "global_step": 83327, "epoch": 1003} {"train_loss": -21.33367919921875, "global_step": 83328, "epoch": 1003} {"train_loss": -21.311838150024414, "global_step": 83329, "epoch": 1003} {"train_loss": -21.235212326049805, "global_step": 83330, "epoch": 1003} {"train_loss": -21.285013221832642, "global_step": 83331, "epoch": 1003, "val_loss": 6044205.0} {"train_loss": -21.250280380249023, "global_step": 83332, "epoch": 1004} {"train_loss": -21.118894577026367, "global_step": 83333, "epoch": 1004} {"train_loss": -21.51078224182129, "global_step": 83334, "epoch": 1004} {"train_loss": -21.144514083862305, "global_step": 83335, "epoch": 1004} {"train_loss": -21.128082275390625, "global_step": 83336, "epoch": 1004} {"train_loss": -21.258914947509766, "global_step": 83337, "epoch": 1004} {"train_loss": -21.198156356811523, "global_step": 83338, "epoch": 1004} {"train_loss": -20.81267738342285, "global_step": 83339, "epoch": 1004} {"train_loss": -20.9523983001709, "global_step": 83340, "epoch": 1004} {"train_loss": -21.097463607788086, "global_step": 83341, "epoch": 1004} {"train_loss": -21.27467918395996, "global_step": 83342, "epoch": 1004} {"train_loss": -21.139751434326172, "global_step": 83343, "epoch": 1004} {"train_loss": -21.434492111206055, "global_step": 83344, "epoch": 1004} {"train_loss": -21.359695434570312, "global_step": 83345, "epoch": 1004} {"train_loss": -21.4301700592041, "global_step": 83346, "epoch": 1004} {"train_loss": -21.400426864624023, "global_step": 83347, "epoch": 1004} {"train_loss": -21.131582260131836, "global_step": 83348, "epoch": 1004} {"train_loss": -21.204315185546875, "global_step": 83349, "epoch": 1004} {"train_loss": -21.43680191040039, "global_step": 83350, "epoch": 1004} {"train_loss": -21.189685821533203, "global_step": 83351, "epoch": 1004} {"train_loss": -21.50267791748047, "global_step": 83352, "epoch": 1004} {"train_loss": -21.006103515625, "global_step": 83353, "epoch": 1004} {"train_loss": -21.480098724365234, "global_step": 83354, "epoch": 1004} {"train_loss": -21.073152542114258, "global_step": 83355, "epoch": 1004} {"train_loss": -21.44137954711914, "global_step": 83356, "epoch": 1004} {"train_loss": -21.41547203063965, "global_step": 83357, "epoch": 1004} {"train_loss": -21.481237411499023, "global_step": 83358, "epoch": 1004} {"train_loss": -21.430503845214844, "global_step": 83359, "epoch": 1004} {"train_loss": -21.027196884155273, "global_step": 83360, "epoch": 1004} {"train_loss": -21.342443466186523, "global_step": 83361, "epoch": 1004} {"train_loss": -21.31869888305664, "global_step": 83362, "epoch": 1004} {"train_loss": -21.554492950439453, "global_step": 83363, "epoch": 1004} {"train_loss": -21.16236686706543, "global_step": 83364, "epoch": 1004} {"train_loss": -21.473859786987305, "global_step": 83365, "epoch": 1004} {"train_loss": -21.514753341674805, "global_step": 83366, "epoch": 1004} {"train_loss": -21.769399642944336, "global_step": 83367, "epoch": 1004} {"train_loss": -21.368778228759766, "global_step": 83368, "epoch": 1004} {"train_loss": -21.67807388305664, "global_step": 83369, "epoch": 1004} {"train_loss": -21.339319229125977, "global_step": 83370, "epoch": 1004} {"train_loss": -21.45590591430664, "global_step": 83371, "epoch": 1004} {"train_loss": -21.091657638549805, "global_step": 83372, "epoch": 1004} {"train_loss": -21.291706085205078, "global_step": 83373, "epoch": 1004} {"train_loss": -21.5104923248291, "global_step": 83374, "epoch": 1004} {"train_loss": -21.243581771850586, "global_step": 83375, "epoch": 1004} {"train_loss": -21.436368942260742, "global_step": 83376, "epoch": 1004} {"train_loss": -21.342260360717773, "global_step": 83377, "epoch": 1004} {"train_loss": -21.56745719909668, "global_step": 83378, "epoch": 1004} {"train_loss": -21.57046127319336, "global_step": 83379, "epoch": 1004} {"train_loss": -21.155513763427734, "global_step": 83380, "epoch": 1004} {"train_loss": -21.15829849243164, "global_step": 83381, "epoch": 1004} {"train_loss": -21.4603328704834, "global_step": 83382, "epoch": 1004} {"train_loss": -21.09088134765625, "global_step": 83383, "epoch": 1004} {"train_loss": -21.338342666625977, "global_step": 83384, "epoch": 1004} {"train_loss": -21.23136329650879, "global_step": 83385, "epoch": 1004} {"train_loss": -21.30341911315918, "global_step": 83386, "epoch": 1004} {"train_loss": -21.587982177734375, "global_step": 83387, "epoch": 1004} {"train_loss": -21.012985229492188, "global_step": 83388, "epoch": 1004} {"train_loss": -21.208961486816406, "global_step": 83389, "epoch": 1004} {"train_loss": -21.235546112060547, "global_step": 83390, "epoch": 1004} {"train_loss": -21.680923461914062, "global_step": 83391, "epoch": 1004} {"train_loss": -21.239301681518555, "global_step": 83392, "epoch": 1004} {"train_loss": -21.611989974975586, "global_step": 83393, "epoch": 1004} {"train_loss": -21.2436580657959, "global_step": 83394, "epoch": 1004} {"train_loss": -21.494121551513672, "global_step": 83395, "epoch": 1004} {"train_loss": -21.07541275024414, "global_step": 83396, "epoch": 1004} {"train_loss": -21.381732940673828, "global_step": 83397, "epoch": 1004} {"train_loss": -21.182769775390625, "global_step": 83398, "epoch": 1004} {"train_loss": -21.104440689086914, "global_step": 83399, "epoch": 1004} {"train_loss": -21.245777130126953, "global_step": 83400, "epoch": 1004} {"train_loss": -21.30998420715332, "global_step": 83401, "epoch": 1004} {"train_loss": -21.609195709228516, "global_step": 83402, "epoch": 1004} {"train_loss": -21.211362838745117, "global_step": 83403, "epoch": 1004} {"train_loss": -21.02137565612793, "global_step": 83404, "epoch": 1004} {"train_loss": -21.387815475463867, "global_step": 83405, "epoch": 1004} {"train_loss": -21.564176559448242, "global_step": 83406, "epoch": 1004} {"train_loss": -21.435895919799805, "global_step": 83407, "epoch": 1004} {"train_loss": -21.286924362182617, "global_step": 83408, "epoch": 1004} {"train_loss": -21.02119255065918, "global_step": 83409, "epoch": 1004} {"train_loss": -21.301542282104492, "global_step": 83410, "epoch": 1004} {"train_loss": -21.36732292175293, "global_step": 83411, "epoch": 1004} {"train_loss": -21.669965744018555, "global_step": 83412, "epoch": 1004} {"train_loss": -21.27875328063965, "global_step": 83413, "epoch": 1004} {"train_loss": -21.32234088484063, "global_step": 83414, "epoch": 1004, "val_loss": 6015351.5} {"train_loss": -20.574548721313477, "global_step": 83415, "epoch": 1005} {"train_loss": -20.979490280151367, "global_step": 83416, "epoch": 1005} {"train_loss": -20.91762351989746, "global_step": 83417, "epoch": 1005} {"train_loss": -20.6761474609375, "global_step": 83418, "epoch": 1005} {"train_loss": -21.530780792236328, "global_step": 83419, "epoch": 1005} {"train_loss": -21.075963973999023, "global_step": 83420, "epoch": 1005} {"train_loss": -21.510507583618164, "global_step": 83421, "epoch": 1005} {"train_loss": -21.19404411315918, "global_step": 83422, "epoch": 1005} {"train_loss": -21.326108932495117, "global_step": 83423, "epoch": 1005} {"train_loss": -21.263565063476562, "global_step": 83424, "epoch": 1005} {"train_loss": -21.049917221069336, "global_step": 83425, "epoch": 1005} {"train_loss": -21.0322208404541, "global_step": 83426, "epoch": 1005} {"train_loss": -20.940515518188477, "global_step": 83427, "epoch": 1005} {"train_loss": -20.94191551208496, "global_step": 83428, "epoch": 1005} {"train_loss": -21.449501037597656, "global_step": 83429, "epoch": 1005} {"train_loss": -21.35304832458496, "global_step": 83430, "epoch": 1005} {"train_loss": -21.391454696655273, "global_step": 83431, "epoch": 1005} {"train_loss": -21.362539291381836, "global_step": 83432, "epoch": 1005} {"train_loss": -21.306440353393555, "global_step": 83433, "epoch": 1005} {"train_loss": -21.28398323059082, "global_step": 83434, "epoch": 1005} {"train_loss": -20.88459587097168, "global_step": 83435, "epoch": 1005} {"train_loss": -21.594331741333008, "global_step": 83436, "epoch": 1005} {"train_loss": -21.16056251525879, "global_step": 83437, "epoch": 1005} {"train_loss": -21.190595626831055, "global_step": 83438, "epoch": 1005} {"train_loss": -21.488611221313477, "global_step": 83439, "epoch": 1005} {"train_loss": -21.46101188659668, "global_step": 83440, "epoch": 1005} {"train_loss": -21.66217613220215, "global_step": 83441, "epoch": 1005} {"train_loss": -21.54267692565918, "global_step": 83442, "epoch": 1005} {"train_loss": -21.232587814331055, "global_step": 83443, "epoch": 1005} {"train_loss": -21.431928634643555, "global_step": 83444, "epoch": 1005} {"train_loss": -21.79258155822754, "global_step": 83445, "epoch": 1005} {"train_loss": -21.386014938354492, "global_step": 83446, "epoch": 1005} {"train_loss": -21.58174705505371, "global_step": 83447, "epoch": 1005} {"train_loss": -21.327775955200195, "global_step": 83448, "epoch": 1005} {"train_loss": -21.486913681030273, "global_step": 83449, "epoch": 1005} {"train_loss": -21.4049129486084, "global_step": 83450, "epoch": 1005} {"train_loss": -21.303678512573242, "global_step": 83451, "epoch": 1005} {"train_loss": -21.232776641845703, "global_step": 83452, "epoch": 1005} {"train_loss": -21.22810173034668, "global_step": 83453, "epoch": 1005} {"train_loss": -21.41107749938965, "global_step": 83454, "epoch": 1005} {"train_loss": -21.269702911376953, "global_step": 83455, "epoch": 1005} {"train_loss": -21.317447662353516, "global_step": 83456, "epoch": 1005} {"train_loss": -21.19290542602539, "global_step": 83457, "epoch": 1005} {"train_loss": -21.376426696777344, "global_step": 83458, "epoch": 1005} {"train_loss": -21.78932762145996, "global_step": 83459, "epoch": 1005} {"train_loss": -21.60697364807129, "global_step": 83460, "epoch": 1005} {"train_loss": -21.231672286987305, "global_step": 83461, "epoch": 1005} {"train_loss": -21.379636764526367, "global_step": 83462, "epoch": 1005} {"train_loss": -20.79117774963379, "global_step": 83463, "epoch": 1005} {"train_loss": -21.15285873413086, "global_step": 83464, "epoch": 1005} {"train_loss": -21.364194869995117, "global_step": 83465, "epoch": 1005} {"train_loss": -21.255603790283203, "global_step": 83466, "epoch": 1005} {"train_loss": -21.426769256591797, "global_step": 83467, "epoch": 1005} {"train_loss": -21.244586944580078, "global_step": 83468, "epoch": 1005} {"train_loss": -21.778348922729492, "global_step": 83469, "epoch": 1005} {"train_loss": -21.1834774017334, "global_step": 83470, "epoch": 1005} {"train_loss": -21.325063705444336, "global_step": 83471, "epoch": 1005} {"train_loss": -21.5504093170166, "global_step": 83472, "epoch": 1005} {"train_loss": -21.502897262573242, "global_step": 83473, "epoch": 1005} {"train_loss": -21.714021682739258, "global_step": 83474, "epoch": 1005} {"train_loss": -21.535734176635742, "global_step": 83475, "epoch": 1005} {"train_loss": -21.133996963500977, "global_step": 83476, "epoch": 1005} {"train_loss": -21.20475196838379, "global_step": 83477, "epoch": 1005} {"train_loss": -21.368555068969727, "global_step": 83478, "epoch": 1005} {"train_loss": -21.405719757080078, "global_step": 83479, "epoch": 1005} {"train_loss": -20.859344482421875, "global_step": 83480, "epoch": 1005} {"train_loss": -21.391820907592773, "global_step": 83481, "epoch": 1005} {"train_loss": -21.416095733642578, "global_step": 83482, "epoch": 1005} {"train_loss": -21.06515884399414, "global_step": 83483, "epoch": 1005} {"train_loss": -21.07989501953125, "global_step": 83484, "epoch": 1005} {"train_loss": -21.07879066467285, "global_step": 83485, "epoch": 1005} {"train_loss": -21.32754898071289, "global_step": 83486, "epoch": 1005} {"train_loss": -21.548051834106445, "global_step": 83487, "epoch": 1005} {"train_loss": -21.532928466796875, "global_step": 83488, "epoch": 1005} {"train_loss": -21.237621307373047, "global_step": 83489, "epoch": 1005} {"train_loss": -21.408985137939453, "global_step": 83490, "epoch": 1005} {"train_loss": -21.447345733642578, "global_step": 83491, "epoch": 1005} {"train_loss": -21.686677932739258, "global_step": 83492, "epoch": 1005} {"train_loss": -21.29669761657715, "global_step": 83493, "epoch": 1005} {"train_loss": -21.569290161132812, "global_step": 83494, "epoch": 1005} {"train_loss": -21.6867618560791, "global_step": 83495, "epoch": 1005} {"train_loss": -21.389904022216797, "global_step": 83496, "epoch": 1005} {"train_loss": -21.33022570322795, "global_step": 83497, "epoch": 1005, "val_loss": 6276061.0} {"train_loss": -20.77004051208496, "global_step": 83498, "epoch": 1006} {"train_loss": -20.972702026367188, "global_step": 83499, "epoch": 1006} {"train_loss": -20.902400970458984, "global_step": 83500, "epoch": 1006} {"train_loss": -20.823871612548828, "global_step": 83501, "epoch": 1006} {"train_loss": -21.075836181640625, "global_step": 83502, "epoch": 1006} {"train_loss": -20.873376846313477, "global_step": 83503, "epoch": 1006} {"train_loss": -21.009145736694336, "global_step": 83504, "epoch": 1006} {"train_loss": -21.246862411499023, "global_step": 83505, "epoch": 1006} {"train_loss": -21.43500328063965, "global_step": 83506, "epoch": 1006} {"train_loss": -21.24195671081543, "global_step": 83507, "epoch": 1006} {"train_loss": -21.127622604370117, "global_step": 83508, "epoch": 1006} {"train_loss": -21.149417877197266, "global_step": 83509, "epoch": 1006} {"train_loss": -21.13776206970215, "global_step": 83510, "epoch": 1006} {"train_loss": -21.01826286315918, "global_step": 83511, "epoch": 1006} {"train_loss": -21.25987434387207, "global_step": 83512, "epoch": 1006} {"train_loss": -21.448820114135742, "global_step": 83513, "epoch": 1006} {"train_loss": -21.220165252685547, "global_step": 83514, "epoch": 1006} {"train_loss": -21.382705688476562, "global_step": 83515, "epoch": 1006} {"train_loss": -21.146991729736328, "global_step": 83516, "epoch": 1006} {"train_loss": -21.076642990112305, "global_step": 83517, "epoch": 1006} {"train_loss": -21.28493309020996, "global_step": 83518, "epoch": 1006} {"train_loss": -21.18454933166504, "global_step": 83519, "epoch": 1006} {"train_loss": -21.35154914855957, "global_step": 83520, "epoch": 1006} {"train_loss": -21.087278366088867, "global_step": 83521, "epoch": 1006} {"train_loss": -21.244796752929688, "global_step": 83522, "epoch": 1006} {"train_loss": -21.289962768554688, "global_step": 83523, "epoch": 1006} {"train_loss": -21.01650047302246, "global_step": 83524, "epoch": 1006} {"train_loss": -21.022855758666992, "global_step": 83525, "epoch": 1006} {"train_loss": -21.533702850341797, "global_step": 83526, "epoch": 1006} {"train_loss": -21.30475616455078, "global_step": 83527, "epoch": 1006} {"train_loss": -21.229307174682617, "global_step": 83528, "epoch": 1006} {"train_loss": -21.641345977783203, "global_step": 83529, "epoch": 1006} {"train_loss": -21.519718170166016, "global_step": 83530, "epoch": 1006} {"train_loss": -21.95145606994629, "global_step": 83531, "epoch": 1006} {"train_loss": -21.148319244384766, "global_step": 83532, "epoch": 1006} {"train_loss": -21.62051773071289, "global_step": 83533, "epoch": 1006} {"train_loss": -21.239721298217773, "global_step": 83534, "epoch": 1006} {"train_loss": -21.32992935180664, "global_step": 83535, "epoch": 1006} {"train_loss": -21.12689208984375, "global_step": 83536, "epoch": 1006} {"train_loss": -21.158466339111328, "global_step": 83537, "epoch": 1006} {"train_loss": -21.235782623291016, "global_step": 83538, "epoch": 1006} {"train_loss": -21.4147891998291, "global_step": 83539, "epoch": 1006} {"train_loss": -21.173736572265625, "global_step": 83540, "epoch": 1006} {"train_loss": -21.560415267944336, "global_step": 83541, "epoch": 1006} {"train_loss": -20.89628791809082, "global_step": 83542, "epoch": 1006} {"train_loss": -21.33538055419922, "global_step": 83543, "epoch": 1006} {"train_loss": -21.27992820739746, "global_step": 83544, "epoch": 1006} {"train_loss": -21.244543075561523, "global_step": 83545, "epoch": 1006} {"train_loss": -21.070894241333008, "global_step": 83546, "epoch": 1006} {"train_loss": -21.3760929107666, "global_step": 83547, "epoch": 1006} {"train_loss": -21.160112380981445, "global_step": 83548, "epoch": 1006} {"train_loss": -21.589431762695312, "global_step": 83549, "epoch": 1006} {"train_loss": -21.1611270904541, "global_step": 83550, "epoch": 1006} {"train_loss": -21.12718963623047, "global_step": 83551, "epoch": 1006} {"train_loss": -21.21625328063965, "global_step": 83552, "epoch": 1006} {"train_loss": -21.072250366210938, "global_step": 83553, "epoch": 1006} {"train_loss": -21.53891944885254, "global_step": 83554, "epoch": 1006} {"train_loss": -21.402393341064453, "global_step": 83555, "epoch": 1006} {"train_loss": -21.29591178894043, "global_step": 83556, "epoch": 1006} {"train_loss": -21.347436904907227, "global_step": 83557, "epoch": 1006} {"train_loss": -21.55365753173828, "global_step": 83558, "epoch": 1006} {"train_loss": -21.1796932220459, "global_step": 83559, "epoch": 1006} {"train_loss": -21.635610580444336, "global_step": 83560, "epoch": 1006} {"train_loss": -21.333799362182617, "global_step": 83561, "epoch": 1006} {"train_loss": -21.340871810913086, "global_step": 83562, "epoch": 1006} {"train_loss": -21.275287628173828, "global_step": 83563, "epoch": 1006} {"train_loss": -21.231840133666992, "global_step": 83564, "epoch": 1006} {"train_loss": -21.362043380737305, "global_step": 83565, "epoch": 1006} {"train_loss": -21.45192527770996, "global_step": 83566, "epoch": 1006} {"train_loss": -21.180646896362305, "global_step": 83567, "epoch": 1006} {"train_loss": -21.359100341796875, "global_step": 83568, "epoch": 1006} {"train_loss": -21.31317710876465, "global_step": 83569, "epoch": 1006} {"train_loss": -21.328990936279297, "global_step": 83570, "epoch": 1006} {"train_loss": -21.49237632751465, "global_step": 83571, "epoch": 1006} {"train_loss": -21.6710262298584, "global_step": 83572, "epoch": 1006} {"train_loss": -21.31070327758789, "global_step": 83573, "epoch": 1006} {"train_loss": -21.440580368041992, "global_step": 83574, "epoch": 1006} {"train_loss": -21.314651489257812, "global_step": 83575, "epoch": 1006} {"train_loss": -21.778079986572266, "global_step": 83576, "epoch": 1006} {"train_loss": -21.61444854736328, "global_step": 83577, "epoch": 1006} {"train_loss": -21.445327758789062, "global_step": 83578, "epoch": 1006} {"train_loss": -21.688817977905273, "global_step": 83579, "epoch": 1006} {"train_loss": -21.29398474635848, "global_step": 83580, "epoch": 1006, "val_loss": 5928373.0} {"train_loss": -21.128765106201172, "global_step": 83581, "epoch": 1007} {"train_loss": -21.4337100982666, "global_step": 83582, "epoch": 1007} {"train_loss": -21.300050735473633, "global_step": 83583, "epoch": 1007} {"train_loss": -21.09981346130371, "global_step": 83584, "epoch": 1007} {"train_loss": -21.133466720581055, "global_step": 83585, "epoch": 1007} {"train_loss": -20.769458770751953, "global_step": 83586, "epoch": 1007} {"train_loss": -21.331327438354492, "global_step": 83587, "epoch": 1007} {"train_loss": -21.299793243408203, "global_step": 83588, "epoch": 1007} {"train_loss": -21.053516387939453, "global_step": 83589, "epoch": 1007} {"train_loss": -21.00826072692871, "global_step": 83590, "epoch": 1007} {"train_loss": -21.205759048461914, "global_step": 83591, "epoch": 1007} {"train_loss": -21.258329391479492, "global_step": 83592, "epoch": 1007} {"train_loss": -21.068098068237305, "global_step": 83593, "epoch": 1007} {"train_loss": -20.836685180664062, "global_step": 83594, "epoch": 1007} {"train_loss": -21.363914489746094, "global_step": 83595, "epoch": 1007} {"train_loss": -21.401607513427734, "global_step": 83596, "epoch": 1007} {"train_loss": -21.08767318725586, "global_step": 83597, "epoch": 1007} {"train_loss": -21.323991775512695, "global_step": 83598, "epoch": 1007} {"train_loss": -21.399185180664062, "global_step": 83599, "epoch": 1007} {"train_loss": -21.442665100097656, "global_step": 83600, "epoch": 1007} {"train_loss": -21.580331802368164, "global_step": 83601, "epoch": 1007} {"train_loss": -21.324893951416016, "global_step": 83602, "epoch": 1007} {"train_loss": -21.35662841796875, "global_step": 83603, "epoch": 1007} {"train_loss": -21.275636672973633, "global_step": 83604, "epoch": 1007} {"train_loss": -21.16132926940918, "global_step": 83605, "epoch": 1007} {"train_loss": -21.687400817871094, "global_step": 83606, "epoch": 1007} {"train_loss": -21.443252563476562, "global_step": 83607, "epoch": 1007} {"train_loss": -21.206741333007812, "global_step": 83608, "epoch": 1007} {"train_loss": -21.468313217163086, "global_step": 83609, "epoch": 1007} {"train_loss": -21.205732345581055, "global_step": 83610, "epoch": 1007} {"train_loss": -21.451492309570312, "global_step": 83611, "epoch": 1007} {"train_loss": -21.2467098236084, "global_step": 83612, "epoch": 1007} {"train_loss": -21.28328514099121, "global_step": 83613, "epoch": 1007} {"train_loss": -21.511741638183594, "global_step": 83614, "epoch": 1007} {"train_loss": -21.189212799072266, "global_step": 83615, "epoch": 1007} {"train_loss": -21.218246459960938, "global_step": 83616, "epoch": 1007} {"train_loss": -21.27705192565918, "global_step": 83617, "epoch": 1007} {"train_loss": -21.20331382751465, "global_step": 83618, "epoch": 1007} {"train_loss": -21.8183650970459, "global_step": 83619, "epoch": 1007} {"train_loss": -21.106184005737305, "global_step": 83620, "epoch": 1007} {"train_loss": -21.303007125854492, "global_step": 83621, "epoch": 1007} {"train_loss": -21.422916412353516, "global_step": 83622, "epoch": 1007} {"train_loss": -21.67494773864746, "global_step": 83623, "epoch": 1007} {"train_loss": -21.12099266052246, "global_step": 83624, "epoch": 1007} {"train_loss": -21.319562911987305, "global_step": 83625, "epoch": 1007} {"train_loss": -21.415515899658203, "global_step": 83626, "epoch": 1007} {"train_loss": -21.22004508972168, "global_step": 83627, "epoch": 1007} {"train_loss": -21.03559112548828, "global_step": 83628, "epoch": 1007} {"train_loss": -21.42255401611328, "global_step": 83629, "epoch": 1007} {"train_loss": -21.198278427124023, "global_step": 83630, "epoch": 1007} {"train_loss": -20.898773193359375, "global_step": 83631, "epoch": 1007} {"train_loss": -21.107006072998047, "global_step": 83632, "epoch": 1007} {"train_loss": -20.995275497436523, "global_step": 83633, "epoch": 1007} {"train_loss": -21.08191680908203, "global_step": 83634, "epoch": 1007} {"train_loss": -21.239582061767578, "global_step": 83635, "epoch": 1007} {"train_loss": -21.303573608398438, "global_step": 83636, "epoch": 1007} {"train_loss": -21.308687210083008, "global_step": 83637, "epoch": 1007} {"train_loss": -21.45144271850586, "global_step": 83638, "epoch": 1007} {"train_loss": -21.580520629882812, "global_step": 83639, "epoch": 1007} {"train_loss": -20.972007751464844, "global_step": 83640, "epoch": 1007} {"train_loss": -21.30491828918457, "global_step": 83641, "epoch": 1007} {"train_loss": -21.245386123657227, "global_step": 83642, "epoch": 1007} {"train_loss": -21.161334991455078, "global_step": 83643, "epoch": 1007} {"train_loss": -21.40525245666504, "global_step": 83644, "epoch": 1007} {"train_loss": -21.107181549072266, "global_step": 83645, "epoch": 1007} {"train_loss": -21.463356018066406, "global_step": 83646, "epoch": 1007} {"train_loss": -21.192703247070312, "global_step": 83647, "epoch": 1007} {"train_loss": -21.547590255737305, "global_step": 83648, "epoch": 1007} {"train_loss": -21.611713409423828, "global_step": 83649, "epoch": 1007} {"train_loss": -21.41305923461914, "global_step": 83650, "epoch": 1007} {"train_loss": -21.286609649658203, "global_step": 83651, "epoch": 1007} {"train_loss": -20.998462677001953, "global_step": 83652, "epoch": 1007} {"train_loss": -21.33338737487793, "global_step": 83653, "epoch": 1007} {"train_loss": -21.29024314880371, "global_step": 83654, "epoch": 1007} {"train_loss": -21.389371871948242, "global_step": 83655, "epoch": 1007} {"train_loss": -21.597776412963867, "global_step": 83656, "epoch": 1007} {"train_loss": -21.271343231201172, "global_step": 83657, "epoch": 1007} {"train_loss": -21.784208297729492, "global_step": 83658, "epoch": 1007} {"train_loss": -21.204254150390625, "global_step": 83659, "epoch": 1007} {"train_loss": -21.44122886657715, "global_step": 83660, "epoch": 1007} {"train_loss": -21.180131912231445, "global_step": 83661, "epoch": 1007} {"train_loss": -21.228382110595703, "global_step": 83662, "epoch": 1007} {"train_loss": -21.309606138482152, "global_step": 83663, "epoch": 1007, "val_loss": 6074633.0} {"train_loss": -21.186641693115234, "global_step": 83664, "epoch": 1008} {"train_loss": -21.148469924926758, "global_step": 83665, "epoch": 1008} {"train_loss": -20.998762130737305, "global_step": 83666, "epoch": 1008} {"train_loss": -21.204212188720703, "global_step": 83667, "epoch": 1008} {"train_loss": -20.820819854736328, "global_step": 83668, "epoch": 1008} {"train_loss": -21.09976577758789, "global_step": 83669, "epoch": 1008} {"train_loss": -21.369375228881836, "global_step": 83670, "epoch": 1008} {"train_loss": -21.022192001342773, "global_step": 83671, "epoch": 1008} {"train_loss": -21.07144546508789, "global_step": 83672, "epoch": 1008} {"train_loss": -21.201263427734375, "global_step": 83673, "epoch": 1008} {"train_loss": -21.06617546081543, "global_step": 83674, "epoch": 1008} {"train_loss": -21.013456344604492, "global_step": 83675, "epoch": 1008} {"train_loss": -21.10944175720215, "global_step": 83676, "epoch": 1008} {"train_loss": -21.142459869384766, "global_step": 83677, "epoch": 1008} {"train_loss": -21.78309440612793, "global_step": 83678, "epoch": 1008} {"train_loss": -21.183868408203125, "global_step": 83679, "epoch": 1008} {"train_loss": -21.411767959594727, "global_step": 83680, "epoch": 1008} {"train_loss": -21.423490524291992, "global_step": 83681, "epoch": 1008} {"train_loss": -21.124250411987305, "global_step": 83682, "epoch": 1008} {"train_loss": -21.278217315673828, "global_step": 83683, "epoch": 1008} {"train_loss": -21.120542526245117, "global_step": 83684, "epoch": 1008} {"train_loss": -21.379138946533203, "global_step": 83685, "epoch": 1008} {"train_loss": -21.451339721679688, "global_step": 83686, "epoch": 1008} {"train_loss": -21.78937339782715, "global_step": 83687, "epoch": 1008} {"train_loss": -21.311038970947266, "global_step": 83688, "epoch": 1008} {"train_loss": -21.30385398864746, "global_step": 83689, "epoch": 1008} {"train_loss": -21.237192153930664, "global_step": 83690, "epoch": 1008} {"train_loss": -21.30582046508789, "global_step": 83691, "epoch": 1008} {"train_loss": -21.42816734313965, "global_step": 83692, "epoch": 1008} {"train_loss": -21.413379669189453, "global_step": 83693, "epoch": 1008} {"train_loss": -21.208349227905273, "global_step": 83694, "epoch": 1008} {"train_loss": -21.479816436767578, "global_step": 83695, "epoch": 1008} {"train_loss": -21.267316818237305, "global_step": 83696, "epoch": 1008} {"train_loss": -21.434476852416992, "global_step": 83697, "epoch": 1008} {"train_loss": -21.39581871032715, "global_step": 83698, "epoch": 1008} {"train_loss": -21.293792724609375, "global_step": 83699, "epoch": 1008} {"train_loss": -21.264219284057617, "global_step": 83700, "epoch": 1008} {"train_loss": -21.527055740356445, "global_step": 83701, "epoch": 1008} {"train_loss": -21.360933303833008, "global_step": 83702, "epoch": 1008} {"train_loss": -21.35776138305664, "global_step": 83703, "epoch": 1008} {"train_loss": -21.330846786499023, "global_step": 83704, "epoch": 1008} {"train_loss": -21.61993408203125, "global_step": 83705, "epoch": 1008} {"train_loss": -21.262868881225586, "global_step": 83706, "epoch": 1008} {"train_loss": -21.516448974609375, "global_step": 83707, "epoch": 1008} {"train_loss": -21.26047706604004, "global_step": 83708, "epoch": 1008} {"train_loss": -21.769235610961914, "global_step": 83709, "epoch": 1008} {"train_loss": -20.89800453186035, "global_step": 83710, "epoch": 1008} {"train_loss": -21.38983726501465, "global_step": 83711, "epoch": 1008} {"train_loss": -21.72059440612793, "global_step": 83712, "epoch": 1008} {"train_loss": -21.328489303588867, "global_step": 83713, "epoch": 1008} {"train_loss": -21.270864486694336, "global_step": 83714, "epoch": 1008} {"train_loss": -21.038633346557617, "global_step": 83715, "epoch": 1008} {"train_loss": -21.33260154724121, "global_step": 83716, "epoch": 1008} {"train_loss": -21.256444931030273, "global_step": 83717, "epoch": 1008} {"train_loss": -21.73133087158203, "global_step": 83718, "epoch": 1008} {"train_loss": -21.390274047851562, "global_step": 83719, "epoch": 1008} {"train_loss": -21.80415916442871, "global_step": 83720, "epoch": 1008} {"train_loss": -21.436872482299805, "global_step": 83721, "epoch": 1008} {"train_loss": -21.15546226501465, "global_step": 83722, "epoch": 1008} {"train_loss": -21.191402435302734, "global_step": 83723, "epoch": 1008} {"train_loss": -21.329498291015625, "global_step": 83724, "epoch": 1008} {"train_loss": -21.359390258789062, "global_step": 83725, "epoch": 1008} {"train_loss": -21.037673950195312, "global_step": 83726, "epoch": 1008} {"train_loss": -21.47163200378418, "global_step": 83727, "epoch": 1008} {"train_loss": -21.42856788635254, "global_step": 83728, "epoch": 1008} {"train_loss": -21.519861221313477, "global_step": 83729, "epoch": 1008} {"train_loss": -21.20130729675293, "global_step": 83730, "epoch": 1008} {"train_loss": -21.567245483398438, "global_step": 83731, "epoch": 1008} {"train_loss": -21.566999435424805, "global_step": 83732, "epoch": 1008} {"train_loss": -21.30807876586914, "global_step": 83733, "epoch": 1008} {"train_loss": -21.463285446166992, "global_step": 83734, "epoch": 1008} {"train_loss": -21.248580932617188, "global_step": 83735, "epoch": 1008} {"train_loss": -21.39265251159668, "global_step": 83736, "epoch": 1008} {"train_loss": -21.362207412719727, "global_step": 83737, "epoch": 1008} {"train_loss": -21.578744888305664, "global_step": 83738, "epoch": 1008} {"train_loss": -21.267704010009766, "global_step": 83739, "epoch": 1008} {"train_loss": -21.379531860351562, "global_step": 83740, "epoch": 1008} {"train_loss": -21.379924774169922, "global_step": 83741, "epoch": 1008} {"train_loss": -21.168546676635742, "global_step": 83742, "epoch": 1008} {"train_loss": -21.272478103637695, "global_step": 83743, "epoch": 1008} {"train_loss": -21.498563766479492, "global_step": 83744, "epoch": 1008} {"train_loss": -21.0289363861084, "global_step": 83745, "epoch": 1008} {"train_loss": -21.337365368762647, "global_step": 83746, "epoch": 1008, "val_loss": 6021429.5} {"train_loss": -20.70774269104004, "global_step": 83747, "epoch": 1009} {"train_loss": -20.937116622924805, "global_step": 83748, "epoch": 1009} {"train_loss": -21.04461097717285, "global_step": 83749, "epoch": 1009} {"train_loss": -21.12845230102539, "global_step": 83750, "epoch": 1009} {"train_loss": -21.188739776611328, "global_step": 83751, "epoch": 1009} {"train_loss": -21.039392471313477, "global_step": 83752, "epoch": 1009} {"train_loss": -21.183130264282227, "global_step": 83753, "epoch": 1009} {"train_loss": -21.388212203979492, "global_step": 83754, "epoch": 1009} {"train_loss": -21.364652633666992, "global_step": 83755, "epoch": 1009} {"train_loss": -21.166807174682617, "global_step": 83756, "epoch": 1009} {"train_loss": -21.24845314025879, "global_step": 83757, "epoch": 1009} {"train_loss": -21.27088737487793, "global_step": 83758, "epoch": 1009} {"train_loss": -21.27811622619629, "global_step": 83759, "epoch": 1009} {"train_loss": -21.36036491394043, "global_step": 83760, "epoch": 1009} {"train_loss": -21.13199806213379, "global_step": 83761, "epoch": 1009} {"train_loss": -21.136159896850586, "global_step": 83762, "epoch": 1009} {"train_loss": -21.237043380737305, "global_step": 83763, "epoch": 1009} {"train_loss": -21.18805503845215, "global_step": 83764, "epoch": 1009} {"train_loss": -21.215274810791016, "global_step": 83765, "epoch": 1009} {"train_loss": -21.342920303344727, "global_step": 83766, "epoch": 1009} {"train_loss": -21.13945960998535, "global_step": 83767, "epoch": 1009} {"train_loss": -21.304800033569336, "global_step": 83768, "epoch": 1009} {"train_loss": -21.288843154907227, "global_step": 83769, "epoch": 1009} {"train_loss": -21.32331657409668, "global_step": 83770, "epoch": 1009} {"train_loss": -21.31455421447754, "global_step": 83771, "epoch": 1009} {"train_loss": -20.961183547973633, "global_step": 83772, "epoch": 1009} {"train_loss": -21.33945083618164, "global_step": 83773, "epoch": 1009} {"train_loss": -21.45073890686035, "global_step": 83774, "epoch": 1009} {"train_loss": -21.262109756469727, "global_step": 83775, "epoch": 1009} {"train_loss": -21.003652572631836, "global_step": 83776, "epoch": 1009} {"train_loss": -21.403156280517578, "global_step": 83777, "epoch": 1009} {"train_loss": -21.200727462768555, "global_step": 83778, "epoch": 1009} {"train_loss": -21.399951934814453, "global_step": 83779, "epoch": 1009} {"train_loss": -21.36557388305664, "global_step": 83780, "epoch": 1009} {"train_loss": -21.6241397857666, "global_step": 83781, "epoch": 1009} {"train_loss": -21.637632369995117, "global_step": 83782, "epoch": 1009} {"train_loss": -21.29894256591797, "global_step": 83783, "epoch": 1009} {"train_loss": -21.550073623657227, "global_step": 83784, "epoch": 1009} {"train_loss": -21.125164031982422, "global_step": 83785, "epoch": 1009} {"train_loss": -21.57416343688965, "global_step": 83786, "epoch": 1009} {"train_loss": -21.350271224975586, "global_step": 83787, "epoch": 1009} {"train_loss": -21.49603271484375, "global_step": 83788, "epoch": 1009} {"train_loss": -21.52176284790039, "global_step": 83789, "epoch": 1009} {"train_loss": -21.29170036315918, "global_step": 83790, "epoch": 1009} {"train_loss": -21.631729125976562, "global_step": 83791, "epoch": 1009} {"train_loss": -21.393814086914062, "global_step": 83792, "epoch": 1009} {"train_loss": -21.239826202392578, "global_step": 83793, "epoch": 1009} {"train_loss": -21.595111846923828, "global_step": 83794, "epoch": 1009} {"train_loss": -21.098526000976562, "global_step": 83795, "epoch": 1009} {"train_loss": -20.993513107299805, "global_step": 83796, "epoch": 1009} {"train_loss": -21.28303337097168, "global_step": 83797, "epoch": 1009} {"train_loss": -21.316274642944336, "global_step": 83798, "epoch": 1009} {"train_loss": -21.324691772460938, "global_step": 83799, "epoch": 1009} {"train_loss": -21.947603225708008, "global_step": 83800, "epoch": 1009} {"train_loss": -21.216449737548828, "global_step": 83801, "epoch": 1009} {"train_loss": -21.034746170043945, "global_step": 83802, "epoch": 1009} {"train_loss": -21.55426025390625, "global_step": 83803, "epoch": 1009} {"train_loss": -21.490591049194336, "global_step": 83804, "epoch": 1009} {"train_loss": -21.379276275634766, "global_step": 83805, "epoch": 1009} {"train_loss": -21.376480102539062, "global_step": 83806, "epoch": 1009} {"train_loss": -21.4427433013916, "global_step": 83807, "epoch": 1009} {"train_loss": -21.082321166992188, "global_step": 83808, "epoch": 1009} {"train_loss": -21.432546615600586, "global_step": 83809, "epoch": 1009} {"train_loss": -21.24121856689453, "global_step": 83810, "epoch": 1009} {"train_loss": -21.466527938842773, "global_step": 83811, "epoch": 1009} {"train_loss": -21.600317001342773, "global_step": 83812, "epoch": 1009} {"train_loss": -21.456653594970703, "global_step": 83813, "epoch": 1009} {"train_loss": -21.88237190246582, "global_step": 83814, "epoch": 1009} {"train_loss": -21.655677795410156, "global_step": 83815, "epoch": 1009} {"train_loss": -21.38822364807129, "global_step": 83816, "epoch": 1009} {"train_loss": -21.60597801208496, "global_step": 83817, "epoch": 1009} {"train_loss": -21.335670471191406, "global_step": 83818, "epoch": 1009} {"train_loss": -21.466909408569336, "global_step": 83819, "epoch": 1009} {"train_loss": -20.916351318359375, "global_step": 83820, "epoch": 1009} {"train_loss": -21.596532821655273, "global_step": 83821, "epoch": 1009} {"train_loss": -21.41611671447754, "global_step": 83822, "epoch": 1009} {"train_loss": -21.294647216796875, "global_step": 83823, "epoch": 1009} {"train_loss": -21.74234390258789, "global_step": 83824, "epoch": 1009} {"train_loss": -21.30110740661621, "global_step": 83825, "epoch": 1009} {"train_loss": -21.443252563476562, "global_step": 83826, "epoch": 1009} {"train_loss": -21.349674224853516, "global_step": 83827, "epoch": 1009} {"train_loss": -21.3541202545166, "global_step": 83828, "epoch": 1009} {"train_loss": -21.33176539317671, "global_step": 83829, "epoch": 1009, "val_loss": 6016778.0} {"train_loss": -20.856962203979492, "global_step": 83830, "epoch": 1010} {"train_loss": -21.21194839477539, "global_step": 83831, "epoch": 1010} {"train_loss": -21.356704711914062, "global_step": 83832, "epoch": 1010} {"train_loss": -21.130779266357422, "global_step": 83833, "epoch": 1010} {"train_loss": -21.070663452148438, "global_step": 83834, "epoch": 1010} {"train_loss": -21.055158615112305, "global_step": 83835, "epoch": 1010} {"train_loss": -20.94548225402832, "global_step": 83836, "epoch": 1010} {"train_loss": -21.138526916503906, "global_step": 83837, "epoch": 1010} {"train_loss": -21.290311813354492, "global_step": 83838, "epoch": 1010} {"train_loss": -21.316986083984375, "global_step": 83839, "epoch": 1010} {"train_loss": -20.640344619750977, "global_step": 83840, "epoch": 1010} {"train_loss": -21.033857345581055, "global_step": 83841, "epoch": 1010} {"train_loss": -21.1828556060791, "global_step": 83842, "epoch": 1010} {"train_loss": -21.081796646118164, "global_step": 83843, "epoch": 1010} {"train_loss": -21.2450008392334, "global_step": 83844, "epoch": 1010} {"train_loss": -21.73786735534668, "global_step": 83845, "epoch": 1010} {"train_loss": -21.3023738861084, "global_step": 83846, "epoch": 1010} {"train_loss": -21.697675704956055, "global_step": 83847, "epoch": 1010} {"train_loss": -21.278888702392578, "global_step": 83848, "epoch": 1010} {"train_loss": -21.272266387939453, "global_step": 83849, "epoch": 1010} {"train_loss": -21.40057945251465, "global_step": 83850, "epoch": 1010} {"train_loss": -21.439207077026367, "global_step": 83851, "epoch": 1010} {"train_loss": -21.0975399017334, "global_step": 83852, "epoch": 1010} {"train_loss": -21.404207229614258, "global_step": 83853, "epoch": 1010} {"train_loss": -21.5376033782959, "global_step": 83854, "epoch": 1010} {"train_loss": -21.1473331451416, "global_step": 83855, "epoch": 1010} {"train_loss": -21.550559997558594, "global_step": 83856, "epoch": 1010} {"train_loss": -21.4580135345459, "global_step": 83857, "epoch": 1010} {"train_loss": -21.502660751342773, "global_step": 83858, "epoch": 1010} {"train_loss": -21.406492233276367, "global_step": 83859, "epoch": 1010} {"train_loss": -21.24830436706543, "global_step": 83860, "epoch": 1010} {"train_loss": -21.06794548034668, "global_step": 83861, "epoch": 1010} {"train_loss": -21.049097061157227, "global_step": 83862, "epoch": 1010} {"train_loss": -21.499845504760742, "global_step": 83863, "epoch": 1010} {"train_loss": -21.58856201171875, "global_step": 83864, "epoch": 1010} {"train_loss": -21.62095069885254, "global_step": 83865, "epoch": 1010} {"train_loss": -21.64042091369629, "global_step": 83866, "epoch": 1010} {"train_loss": -21.427175521850586, "global_step": 83867, "epoch": 1010} {"train_loss": -21.273975372314453, "global_step": 83868, "epoch": 1010} {"train_loss": -21.610870361328125, "global_step": 83869, "epoch": 1010} {"train_loss": -21.24545669555664, "global_step": 83870, "epoch": 1010} {"train_loss": -21.5865421295166, "global_step": 83871, "epoch": 1010} {"train_loss": -21.819822311401367, "global_step": 83872, "epoch": 1010} {"train_loss": -21.22068214416504, "global_step": 83873, "epoch": 1010} {"train_loss": -21.437467575073242, "global_step": 83874, "epoch": 1010} {"train_loss": -21.302465438842773, "global_step": 83875, "epoch": 1010} {"train_loss": -21.200485229492188, "global_step": 83876, "epoch": 1010} {"train_loss": -21.239992141723633, "global_step": 83877, "epoch": 1010} {"train_loss": -21.517837524414062, "global_step": 83878, "epoch": 1010} {"train_loss": -21.151338577270508, "global_step": 83879, "epoch": 1010} {"train_loss": -21.40923309326172, "global_step": 83880, "epoch": 1010} {"train_loss": -21.508121490478516, "global_step": 83881, "epoch": 1010} {"train_loss": -21.428030014038086, "global_step": 83882, "epoch": 1010} {"train_loss": -21.70863151550293, "global_step": 83883, "epoch": 1010} {"train_loss": -21.714946746826172, "global_step": 83884, "epoch": 1010} {"train_loss": -21.616262435913086, "global_step": 83885, "epoch": 1010} {"train_loss": -21.25164794921875, "global_step": 83886, "epoch": 1010} {"train_loss": -21.149282455444336, "global_step": 83887, "epoch": 1010} {"train_loss": -21.52406883239746, "global_step": 83888, "epoch": 1010} {"train_loss": -21.31880760192871, "global_step": 83889, "epoch": 1010} {"train_loss": -21.31877899169922, "global_step": 83890, "epoch": 1010} {"train_loss": -21.192821502685547, "global_step": 83891, "epoch": 1010} {"train_loss": -21.552471160888672, "global_step": 83892, "epoch": 1010} {"train_loss": -21.529203414916992, "global_step": 83893, "epoch": 1010} {"train_loss": -21.115432739257812, "global_step": 83894, "epoch": 1010} {"train_loss": -21.50144386291504, "global_step": 83895, "epoch": 1010} {"train_loss": -21.3370418548584, "global_step": 83896, "epoch": 1010} {"train_loss": -21.362058639526367, "global_step": 83897, "epoch": 1010} {"train_loss": -21.065265655517578, "global_step": 83898, "epoch": 1010} {"train_loss": -21.525922775268555, "global_step": 83899, "epoch": 1010} {"train_loss": -21.368927001953125, "global_step": 83900, "epoch": 1010} {"train_loss": -21.59433364868164, "global_step": 83901, "epoch": 1010} {"train_loss": -21.142576217651367, "global_step": 83902, "epoch": 1010} {"train_loss": -21.814498901367188, "global_step": 83903, "epoch": 1010} {"train_loss": -21.126920700073242, "global_step": 83904, "epoch": 1010} {"train_loss": -20.884443283081055, "global_step": 83905, "epoch": 1010} {"train_loss": -21.66713523864746, "global_step": 83906, "epoch": 1010} {"train_loss": -21.218463897705078, "global_step": 83907, "epoch": 1010} {"train_loss": -21.234960556030273, "global_step": 83908, "epoch": 1010} {"train_loss": -21.543439865112305, "global_step": 83909, "epoch": 1010} {"train_loss": -21.198379516601562, "global_step": 83910, "epoch": 1010} {"train_loss": -21.118694305419922, "global_step": 83911, "epoch": 1010} {"train_loss": -21.326659650687713, "global_step": 83912, "epoch": 1010, "val_loss": 6136145.0} {"train_loss": -20.25419044494629, "global_step": 83913, "epoch": 1011} {"train_loss": -20.734617233276367, "global_step": 83914, "epoch": 1011} {"train_loss": -20.75006675720215, "global_step": 83915, "epoch": 1011} {"train_loss": -20.97884750366211, "global_step": 83916, "epoch": 1011} {"train_loss": -21.344562530517578, "global_step": 83917, "epoch": 1011} {"train_loss": -20.940048217773438, "global_step": 83918, "epoch": 1011} {"train_loss": -20.656970977783203, "global_step": 83919, "epoch": 1011} {"train_loss": -21.076196670532227, "global_step": 83920, "epoch": 1011} {"train_loss": -21.243013381958008, "global_step": 83921, "epoch": 1011} {"train_loss": -21.201505661010742, "global_step": 83922, "epoch": 1011} {"train_loss": -20.982084274291992, "global_step": 83923, "epoch": 1011} {"train_loss": -21.232650756835938, "global_step": 83924, "epoch": 1011} {"train_loss": -21.334875106811523, "global_step": 83925, "epoch": 1011} {"train_loss": -20.930057525634766, "global_step": 83926, "epoch": 1011} {"train_loss": -21.04583740234375, "global_step": 83927, "epoch": 1011} {"train_loss": -21.152097702026367, "global_step": 83928, "epoch": 1011} {"train_loss": -21.357091903686523, "global_step": 83929, "epoch": 1011} {"train_loss": -21.346044540405273, "global_step": 83930, "epoch": 1011} {"train_loss": -21.398025512695312, "global_step": 83931, "epoch": 1011} {"train_loss": -21.459508895874023, "global_step": 83932, "epoch": 1011} {"train_loss": -20.9411563873291, "global_step": 83933, "epoch": 1011} {"train_loss": -21.410247802734375, "global_step": 83934, "epoch": 1011} {"train_loss": -21.175933837890625, "global_step": 83935, "epoch": 1011} {"train_loss": -21.165863037109375, "global_step": 83936, "epoch": 1011} {"train_loss": -21.35196304321289, "global_step": 83937, "epoch": 1011} {"train_loss": -21.158029556274414, "global_step": 83938, "epoch": 1011} {"train_loss": -21.37360191345215, "global_step": 83939, "epoch": 1011} {"train_loss": -21.438894271850586, "global_step": 83940, "epoch": 1011} {"train_loss": -20.88934326171875, "global_step": 83941, "epoch": 1011} {"train_loss": -21.50960922241211, "global_step": 83942, "epoch": 1011} {"train_loss": -21.282766342163086, "global_step": 83943, "epoch": 1011} {"train_loss": -21.194122314453125, "global_step": 83944, "epoch": 1011} {"train_loss": -21.178974151611328, "global_step": 83945, "epoch": 1011} {"train_loss": -21.5157470703125, "global_step": 83946, "epoch": 1011} {"train_loss": -21.411779403686523, "global_step": 83947, "epoch": 1011} {"train_loss": -21.189453125, "global_step": 83948, "epoch": 1011} {"train_loss": -21.472366333007812, "global_step": 83949, "epoch": 1011} {"train_loss": -21.472553253173828, "global_step": 83950, "epoch": 1011} {"train_loss": -21.843656539916992, "global_step": 83951, "epoch": 1011} {"train_loss": -21.492704391479492, "global_step": 83952, "epoch": 1011} {"train_loss": -21.620283126831055, "global_step": 83953, "epoch": 1011} {"train_loss": -21.587350845336914, "global_step": 83954, "epoch": 1011} {"train_loss": -21.61648941040039, "global_step": 83955, "epoch": 1011} {"train_loss": -21.485973358154297, "global_step": 83956, "epoch": 1011} {"train_loss": -21.249624252319336, "global_step": 83957, "epoch": 1011} {"train_loss": -21.195802688598633, "global_step": 83958, "epoch": 1011} {"train_loss": -21.391510009765625, "global_step": 83959, "epoch": 1011} {"train_loss": -21.119741439819336, "global_step": 83960, "epoch": 1011} {"train_loss": -21.540042877197266, "global_step": 83961, "epoch": 1011} {"train_loss": -21.37861442565918, "global_step": 83962, "epoch": 1011} {"train_loss": -21.2145938873291, "global_step": 83963, "epoch": 1011} {"train_loss": -21.52945327758789, "global_step": 83964, "epoch": 1011} {"train_loss": -21.288928985595703, "global_step": 83965, "epoch": 1011} {"train_loss": -21.528650283813477, "global_step": 83966, "epoch": 1011} {"train_loss": -21.293066024780273, "global_step": 83967, "epoch": 1011} {"train_loss": -21.350383758544922, "global_step": 83968, "epoch": 1011} {"train_loss": -21.223798751831055, "global_step": 83969, "epoch": 1011} {"train_loss": -21.747648239135742, "global_step": 83970, "epoch": 1011} {"train_loss": -21.35889434814453, "global_step": 83971, "epoch": 1011} {"train_loss": -21.70102310180664, "global_step": 83972, "epoch": 1011} {"train_loss": -21.54153823852539, "global_step": 83973, "epoch": 1011} {"train_loss": -21.7264461517334, "global_step": 83974, "epoch": 1011} {"train_loss": -21.375783920288086, "global_step": 83975, "epoch": 1011} {"train_loss": -21.488853454589844, "global_step": 83976, "epoch": 1011} {"train_loss": -21.21148109436035, "global_step": 83977, "epoch": 1011} {"train_loss": -21.487520217895508, "global_step": 83978, "epoch": 1011} {"train_loss": -21.440229415893555, "global_step": 83979, "epoch": 1011} {"train_loss": -21.50118064880371, "global_step": 83980, "epoch": 1011} {"train_loss": -21.436830520629883, "global_step": 83981, "epoch": 1011} {"train_loss": -21.666828155517578, "global_step": 83982, "epoch": 1011} {"train_loss": -21.399030685424805, "global_step": 83983, "epoch": 1011} {"train_loss": -21.49696159362793, "global_step": 83984, "epoch": 1011} {"train_loss": -21.633520126342773, "global_step": 83985, "epoch": 1011} {"train_loss": -21.54323387145996, "global_step": 83986, "epoch": 1011} {"train_loss": -21.469005584716797, "global_step": 83987, "epoch": 1011} {"train_loss": -21.23191261291504, "global_step": 83988, "epoch": 1011} {"train_loss": -21.3917179107666, "global_step": 83989, "epoch": 1011} {"train_loss": -21.262893676757812, "global_step": 83990, "epoch": 1011} {"train_loss": -21.3693790435791, "global_step": 83991, "epoch": 1011} {"train_loss": -21.12102699279785, "global_step": 83992, "epoch": 1011} {"train_loss": -21.380319595336914, "global_step": 83993, "epoch": 1011} {"train_loss": -21.29581642150879, "global_step": 83994, "epoch": 1011} {"train_loss": -21.312636662678546, "global_step": 83995, "epoch": 1011, "val_loss": 6161833.0} {"train_loss": -21.09290885925293, "global_step": 83996, "epoch": 1012} {"train_loss": -21.458498001098633, "global_step": 83997, "epoch": 1012} {"train_loss": -20.916522979736328, "global_step": 83998, "epoch": 1012} {"train_loss": -21.37904167175293, "global_step": 83999, "epoch": 1012} {"train_loss": -21.033954620361328, "global_step": 84000, "epoch": 1012} {"train_loss": -20.699575424194336, "global_step": 84001, "epoch": 1012} {"train_loss": -21.306549072265625, "global_step": 84002, "epoch": 1012} {"train_loss": -21.02398681640625, "global_step": 84003, "epoch": 1012} {"train_loss": -21.114782333374023, "global_step": 84004, "epoch": 1012} {"train_loss": -21.193593978881836, "global_step": 84005, "epoch": 1012} {"train_loss": -21.715015411376953, "global_step": 84006, "epoch": 1012} {"train_loss": -20.848487854003906, "global_step": 84007, "epoch": 1012} {"train_loss": -20.944196701049805, "global_step": 84008, "epoch": 1012} {"train_loss": -20.854827880859375, "global_step": 84009, "epoch": 1012} {"train_loss": -21.324283599853516, "global_step": 84010, "epoch": 1012} {"train_loss": -21.052846908569336, "global_step": 84011, "epoch": 1012} {"train_loss": -21.221149444580078, "global_step": 84012, "epoch": 1012} {"train_loss": -21.385345458984375, "global_step": 84013, "epoch": 1012} {"train_loss": -21.401355743408203, "global_step": 84014, "epoch": 1012} {"train_loss": -21.10609245300293, "global_step": 84015, "epoch": 1012} {"train_loss": -21.631284713745117, "global_step": 84016, "epoch": 1012} {"train_loss": -21.042591094970703, "global_step": 84017, "epoch": 1012} {"train_loss": -21.04118537902832, "global_step": 84018, "epoch": 1012} {"train_loss": -21.566442489624023, "global_step": 84019, "epoch": 1012} {"train_loss": -21.38092803955078, "global_step": 84020, "epoch": 1012} {"train_loss": -21.540441513061523, "global_step": 84021, "epoch": 1012} {"train_loss": -21.562225341796875, "global_step": 84022, "epoch": 1012} {"train_loss": -21.065210342407227, "global_step": 84023, "epoch": 1012} {"train_loss": -21.38995933532715, "global_step": 84024, "epoch": 1012} {"train_loss": -21.481149673461914, "global_step": 84025, "epoch": 1012} {"train_loss": -21.454879760742188, "global_step": 84026, "epoch": 1012} {"train_loss": -21.277551651000977, "global_step": 84027, "epoch": 1012} {"train_loss": -21.068632125854492, "global_step": 84028, "epoch": 1012} {"train_loss": -21.351224899291992, "global_step": 84029, "epoch": 1012} {"train_loss": -21.277297973632812, "global_step": 84030, "epoch": 1012} {"train_loss": -21.255661010742188, "global_step": 84031, "epoch": 1012} {"train_loss": -21.1787166595459, "global_step": 84032, "epoch": 1012} {"train_loss": -21.03425407409668, "global_step": 84033, "epoch": 1012} {"train_loss": -21.718603134155273, "global_step": 84034, "epoch": 1012} {"train_loss": -21.21982765197754, "global_step": 84035, "epoch": 1012} {"train_loss": -21.06561851501465, "global_step": 84036, "epoch": 1012} {"train_loss": -21.295576095581055, "global_step": 84037, "epoch": 1012} {"train_loss": -21.52704620361328, "global_step": 84038, "epoch": 1012} {"train_loss": -21.502731323242188, "global_step": 84039, "epoch": 1012} {"train_loss": -21.178638458251953, "global_step": 84040, "epoch": 1012} {"train_loss": -21.169021606445312, "global_step": 84041, "epoch": 1012} {"train_loss": -21.24380874633789, "global_step": 84042, "epoch": 1012} {"train_loss": -21.262468338012695, "global_step": 84043, "epoch": 1012} {"train_loss": -20.912748336791992, "global_step": 84044, "epoch": 1012} {"train_loss": -21.69386100769043, "global_step": 84045, "epoch": 1012} {"train_loss": -21.41810417175293, "global_step": 84046, "epoch": 1012} {"train_loss": -21.465017318725586, "global_step": 84047, "epoch": 1012} {"train_loss": -21.316404342651367, "global_step": 84048, "epoch": 1012} {"train_loss": -21.353469848632812, "global_step": 84049, "epoch": 1012} {"train_loss": -21.401376724243164, "global_step": 84050, "epoch": 1012} {"train_loss": -21.472871780395508, "global_step": 84051, "epoch": 1012} {"train_loss": -21.10879898071289, "global_step": 84052, "epoch": 1012} {"train_loss": -21.29568862915039, "global_step": 84053, "epoch": 1012} {"train_loss": -21.451181411743164, "global_step": 84054, "epoch": 1012} {"train_loss": -21.403932571411133, "global_step": 84055, "epoch": 1012} {"train_loss": -21.15189552307129, "global_step": 84056, "epoch": 1012} {"train_loss": -21.3875675201416, "global_step": 84057, "epoch": 1012} {"train_loss": -21.502931594848633, "global_step": 84058, "epoch": 1012} {"train_loss": -21.29608726501465, "global_step": 84059, "epoch": 1012} {"train_loss": -21.259613037109375, "global_step": 84060, "epoch": 1012} {"train_loss": -21.38288688659668, "global_step": 84061, "epoch": 1012} {"train_loss": -21.250261306762695, "global_step": 84062, "epoch": 1012} {"train_loss": -21.340879440307617, "global_step": 84063, "epoch": 1012} {"train_loss": -21.441389083862305, "global_step": 84064, "epoch": 1012} {"train_loss": -21.89004135131836, "global_step": 84065, "epoch": 1012} {"train_loss": -21.480140686035156, "global_step": 84066, "epoch": 1012} {"train_loss": -21.676809310913086, "global_step": 84067, "epoch": 1012} {"train_loss": -21.90614128112793, "global_step": 84068, "epoch": 1012} {"train_loss": -21.581274032592773, "global_step": 84069, "epoch": 1012} {"train_loss": -21.438358306884766, "global_step": 84070, "epoch": 1012} {"train_loss": -21.436609268188477, "global_step": 84071, "epoch": 1012} {"train_loss": -21.22614288330078, "global_step": 84072, "epoch": 1012} {"train_loss": -21.626699447631836, "global_step": 84073, "epoch": 1012} {"train_loss": -21.684335708618164, "global_step": 84074, "epoch": 1012} {"train_loss": -21.464210510253906, "global_step": 84075, "epoch": 1012} {"train_loss": -21.296796798706055, "global_step": 84076, "epoch": 1012} {"train_loss": -21.332765579223633, "global_step": 84077, "epoch": 1012} {"train_loss": -21.32539951370423, "global_step": 84078, "epoch": 1012, "val_loss": 6193974.0} {"train_loss": -21.03860092163086, "global_step": 84079, "epoch": 1013} {"train_loss": -21.05379867553711, "global_step": 84080, "epoch": 1013} {"train_loss": -21.2806339263916, "global_step": 84081, "epoch": 1013} {"train_loss": -20.8769588470459, "global_step": 84082, "epoch": 1013} {"train_loss": -21.01667594909668, "global_step": 84083, "epoch": 1013} {"train_loss": -20.847707748413086, "global_step": 84084, "epoch": 1013} {"train_loss": -21.343046188354492, "global_step": 84085, "epoch": 1013} {"train_loss": -20.668537139892578, "global_step": 84086, "epoch": 1013} {"train_loss": -20.997802734375, "global_step": 84087, "epoch": 1013} {"train_loss": -21.35895347595215, "global_step": 84088, "epoch": 1013} {"train_loss": -21.66597557067871, "global_step": 84089, "epoch": 1013} {"train_loss": -21.278278350830078, "global_step": 84090, "epoch": 1013} {"train_loss": -21.40684700012207, "global_step": 84091, "epoch": 1013} {"train_loss": -21.768835067749023, "global_step": 84092, "epoch": 1013} {"train_loss": -21.360876083374023, "global_step": 84093, "epoch": 1013} {"train_loss": -21.065649032592773, "global_step": 84094, "epoch": 1013} {"train_loss": -21.1182861328125, "global_step": 84095, "epoch": 1013} {"train_loss": -21.37159538269043, "global_step": 84096, "epoch": 1013} {"train_loss": -21.053646087646484, "global_step": 84097, "epoch": 1013} {"train_loss": -21.468461990356445, "global_step": 84098, "epoch": 1013} {"train_loss": -21.587560653686523, "global_step": 84099, "epoch": 1013} {"train_loss": -21.38910484313965, "global_step": 84100, "epoch": 1013} {"train_loss": -21.597936630249023, "global_step": 84101, "epoch": 1013} {"train_loss": -21.393545150756836, "global_step": 84102, "epoch": 1013} {"train_loss": -21.585309982299805, "global_step": 84103, "epoch": 1013} {"train_loss": -21.347394943237305, "global_step": 84104, "epoch": 1013} {"train_loss": -21.078411102294922, "global_step": 84105, "epoch": 1013} {"train_loss": -21.405750274658203, "global_step": 84106, "epoch": 1013} {"train_loss": -21.0853271484375, "global_step": 84107, "epoch": 1013} {"train_loss": -21.333023071289062, "global_step": 84108, "epoch": 1013} {"train_loss": -21.484819412231445, "global_step": 84109, "epoch": 1013} {"train_loss": -21.315956115722656, "global_step": 84110, "epoch": 1013} {"train_loss": -20.957468032836914, "global_step": 84111, "epoch": 1013} {"train_loss": -21.561185836791992, "global_step": 84112, "epoch": 1013} {"train_loss": -21.386550903320312, "global_step": 84113, "epoch": 1013} {"train_loss": -20.9875545501709, "global_step": 84114, "epoch": 1013} {"train_loss": -20.870450973510742, "global_step": 84115, "epoch": 1013} {"train_loss": -20.83308982849121, "global_step": 84116, "epoch": 1013} {"train_loss": -21.44246482849121, "global_step": 84117, "epoch": 1013} {"train_loss": -21.263662338256836, "global_step": 84118, "epoch": 1013} {"train_loss": -21.62083625793457, "global_step": 84119, "epoch": 1013} {"train_loss": -21.24525260925293, "global_step": 84120, "epoch": 1013} {"train_loss": -21.16592788696289, "global_step": 84121, "epoch": 1013} {"train_loss": -21.611726760864258, "global_step": 84122, "epoch": 1013} {"train_loss": -21.222929000854492, "global_step": 84123, "epoch": 1013} {"train_loss": -21.09013557434082, "global_step": 84124, "epoch": 1013} {"train_loss": -21.16007423400879, "global_step": 84125, "epoch": 1013} {"train_loss": -21.52707290649414, "global_step": 84126, "epoch": 1013} {"train_loss": -21.429122924804688, "global_step": 84127, "epoch": 1013} {"train_loss": -21.377538681030273, "global_step": 84128, "epoch": 1013} {"train_loss": -21.206735610961914, "global_step": 84129, "epoch": 1013} {"train_loss": -21.040109634399414, "global_step": 84130, "epoch": 1013} {"train_loss": -22.007144927978516, "global_step": 84131, "epoch": 1013} {"train_loss": -21.197980880737305, "global_step": 84132, "epoch": 1013} {"train_loss": -21.75585174560547, "global_step": 84133, "epoch": 1013} {"train_loss": -20.98756980895996, "global_step": 84134, "epoch": 1013} {"train_loss": -21.664636611938477, "global_step": 84135, "epoch": 1013} {"train_loss": -21.208942413330078, "global_step": 84136, "epoch": 1013} {"train_loss": -21.43318748474121, "global_step": 84137, "epoch": 1013} {"train_loss": -21.62220001220703, "global_step": 84138, "epoch": 1013} {"train_loss": -21.378252029418945, "global_step": 84139, "epoch": 1013} {"train_loss": -21.208600997924805, "global_step": 84140, "epoch": 1013} {"train_loss": -21.04346466064453, "global_step": 84141, "epoch": 1013} {"train_loss": -21.49434471130371, "global_step": 84142, "epoch": 1013} {"train_loss": -21.781692504882812, "global_step": 84143, "epoch": 1013} {"train_loss": -21.380674362182617, "global_step": 84144, "epoch": 1013} {"train_loss": -21.200340270996094, "global_step": 84145, "epoch": 1013} {"train_loss": -21.348844528198242, "global_step": 84146, "epoch": 1013} {"train_loss": -21.59212303161621, "global_step": 84147, "epoch": 1013} {"train_loss": -21.925996780395508, "global_step": 84148, "epoch": 1013} {"train_loss": -21.04990577697754, "global_step": 84149, "epoch": 1013} {"train_loss": -21.60308265686035, "global_step": 84150, "epoch": 1013} {"train_loss": -21.614654541015625, "global_step": 84151, "epoch": 1013} {"train_loss": -21.263050079345703, "global_step": 84152, "epoch": 1013} {"train_loss": -21.676319122314453, "global_step": 84153, "epoch": 1013} {"train_loss": -20.88930320739746, "global_step": 84154, "epoch": 1013} {"train_loss": -21.446521759033203, "global_step": 84155, "epoch": 1013} {"train_loss": -21.691129684448242, "global_step": 84156, "epoch": 1013} {"train_loss": -21.818050384521484, "global_step": 84157, "epoch": 1013} {"train_loss": -21.048093795776367, "global_step": 84158, "epoch": 1013} {"train_loss": -21.222471237182617, "global_step": 84159, "epoch": 1013} {"train_loss": -21.231647491455078, "global_step": 84160, "epoch": 1013} {"train_loss": -21.318397521972656, "global_step": 84161, "epoch": 1013, "val_loss": 6194920.0} {"train_loss": -21.08150863647461, "global_step": 84162, "epoch": 1014} {"train_loss": -21.02846336364746, "global_step": 84163, "epoch": 1014} {"train_loss": -20.7156982421875, "global_step": 84164, "epoch": 1014} {"train_loss": -21.443342208862305, "global_step": 84165, "epoch": 1014} {"train_loss": -20.814563751220703, "global_step": 84166, "epoch": 1014} {"train_loss": -21.2264461517334, "global_step": 84167, "epoch": 1014} {"train_loss": -21.12776756286621, "global_step": 84168, "epoch": 1014} {"train_loss": -21.30955696105957, "global_step": 84169, "epoch": 1014} {"train_loss": -21.263460159301758, "global_step": 84170, "epoch": 1014} {"train_loss": -20.947572708129883, "global_step": 84171, "epoch": 1014} {"train_loss": -20.944433212280273, "global_step": 84172, "epoch": 1014} {"train_loss": -20.926950454711914, "global_step": 84173, "epoch": 1014} {"train_loss": -21.103473663330078, "global_step": 84174, "epoch": 1014} {"train_loss": -21.2984619140625, "global_step": 84175, "epoch": 1014} {"train_loss": -21.401575088500977, "global_step": 84176, "epoch": 1014} {"train_loss": -21.016653060913086, "global_step": 84177, "epoch": 1014} {"train_loss": -21.502817153930664, "global_step": 84178, "epoch": 1014} {"train_loss": -21.383913040161133, "global_step": 84179, "epoch": 1014} {"train_loss": -20.856138229370117, "global_step": 84180, "epoch": 1014} {"train_loss": -21.42329216003418, "global_step": 84181, "epoch": 1014} {"train_loss": -20.7018985748291, "global_step": 84182, "epoch": 1014} {"train_loss": -21.055452346801758, "global_step": 84183, "epoch": 1014} {"train_loss": -21.387676239013672, "global_step": 84184, "epoch": 1014} {"train_loss": -21.039648056030273, "global_step": 84185, "epoch": 1014} {"train_loss": -21.5526180267334, "global_step": 84186, "epoch": 1014} {"train_loss": -21.201242446899414, "global_step": 84187, "epoch": 1014} {"train_loss": -20.638689041137695, "global_step": 84188, "epoch": 1014} {"train_loss": -21.4525089263916, "global_step": 84189, "epoch": 1014} {"train_loss": -20.906333923339844, "global_step": 84190, "epoch": 1014} {"train_loss": -21.473806381225586, "global_step": 84191, "epoch": 1014} {"train_loss": -21.5568790435791, "global_step": 84192, "epoch": 1014} {"train_loss": -21.54584312438965, "global_step": 84193, "epoch": 1014} {"train_loss": -21.45705795288086, "global_step": 84194, "epoch": 1014} {"train_loss": -21.395055770874023, "global_step": 84195, "epoch": 1014} {"train_loss": -21.572166442871094, "global_step": 84196, "epoch": 1014} {"train_loss": -21.261388778686523, "global_step": 84197, "epoch": 1014} {"train_loss": -21.232921600341797, "global_step": 84198, "epoch": 1014} {"train_loss": -21.320140838623047, "global_step": 84199, "epoch": 1014} {"train_loss": -21.81641387939453, "global_step": 84200, "epoch": 1014} {"train_loss": -21.60219383239746, "global_step": 84201, "epoch": 1014} {"train_loss": -21.233755111694336, "global_step": 84202, "epoch": 1014} {"train_loss": -21.766321182250977, "global_step": 84203, "epoch": 1014} {"train_loss": -21.639820098876953, "global_step": 84204, "epoch": 1014} {"train_loss": -21.296031951904297, "global_step": 84205, "epoch": 1014} {"train_loss": -21.42758560180664, "global_step": 84206, "epoch": 1014} {"train_loss": -21.301298141479492, "global_step": 84207, "epoch": 1014} {"train_loss": -20.9822940826416, "global_step": 84208, "epoch": 1014} {"train_loss": -21.415678024291992, "global_step": 84209, "epoch": 1014} {"train_loss": -21.259172439575195, "global_step": 84210, "epoch": 1014} {"train_loss": -21.131153106689453, "global_step": 84211, "epoch": 1014} {"train_loss": -21.41659927368164, "global_step": 84212, "epoch": 1014} {"train_loss": -21.744876861572266, "global_step": 84213, "epoch": 1014} {"train_loss": -21.18912696838379, "global_step": 84214, "epoch": 1014} {"train_loss": -21.51490592956543, "global_step": 84215, "epoch": 1014} {"train_loss": -21.256967544555664, "global_step": 84216, "epoch": 1014} {"train_loss": -21.289175033569336, "global_step": 84217, "epoch": 1014} {"train_loss": -21.272573471069336, "global_step": 84218, "epoch": 1014} {"train_loss": -21.48141860961914, "global_step": 84219, "epoch": 1014} {"train_loss": -21.263656616210938, "global_step": 84220, "epoch": 1014} {"train_loss": -21.691959381103516, "global_step": 84221, "epoch": 1014} {"train_loss": -21.34601593017578, "global_step": 84222, "epoch": 1014} {"train_loss": -21.38332176208496, "global_step": 84223, "epoch": 1014} {"train_loss": -21.513334274291992, "global_step": 84224, "epoch": 1014} {"train_loss": -21.704015731811523, "global_step": 84225, "epoch": 1014} {"train_loss": -21.419387817382812, "global_step": 84226, "epoch": 1014} {"train_loss": -21.567651748657227, "global_step": 84227, "epoch": 1014} {"train_loss": -21.436399459838867, "global_step": 84228, "epoch": 1014} {"train_loss": -21.42500114440918, "global_step": 84229, "epoch": 1014} {"train_loss": -20.9517765045166, "global_step": 84230, "epoch": 1014} {"train_loss": -21.542116165161133, "global_step": 84231, "epoch": 1014} {"train_loss": -21.332897186279297, "global_step": 84232, "epoch": 1014} {"train_loss": -21.35078239440918, "global_step": 84233, "epoch": 1014} {"train_loss": -20.99951171875, "global_step": 84234, "epoch": 1014} {"train_loss": -21.27614974975586, "global_step": 84235, "epoch": 1014} {"train_loss": -21.07879066467285, "global_step": 84236, "epoch": 1014} {"train_loss": -21.180952072143555, "global_step": 84237, "epoch": 1014} {"train_loss": -21.66330909729004, "global_step": 84238, "epoch": 1014} {"train_loss": -21.162174224853516, "global_step": 84239, "epoch": 1014} {"train_loss": -21.47088623046875, "global_step": 84240, "epoch": 1014} {"train_loss": -21.2877197265625, "global_step": 84241, "epoch": 1014} {"train_loss": -21.391971588134766, "global_step": 84242, "epoch": 1014} {"train_loss": -21.55060386657715, "global_step": 84243, "epoch": 1014} {"train_loss": -21.286446490919733, "global_step": 84244, "epoch": 1014, "val_loss": 6074727.0} {"train_loss": -20.587453842163086, "global_step": 84245, "epoch": 1015} {"train_loss": -20.392303466796875, "global_step": 84246, "epoch": 1015} {"train_loss": -19.58629035949707, "global_step": 84247, "epoch": 1015} {"train_loss": -20.978988647460938, "global_step": 84248, "epoch": 1015} {"train_loss": -20.89394187927246, "global_step": 84249, "epoch": 1015} {"train_loss": -20.931894302368164, "global_step": 84250, "epoch": 1015} {"train_loss": -20.763731002807617, "global_step": 84251, "epoch": 1015} {"train_loss": -20.77960205078125, "global_step": 84252, "epoch": 1015} {"train_loss": -20.77337074279785, "global_step": 84253, "epoch": 1015} {"train_loss": -20.682785034179688, "global_step": 84254, "epoch": 1015} {"train_loss": -20.780466079711914, "global_step": 84255, "epoch": 1015} {"train_loss": -20.704294204711914, "global_step": 84256, "epoch": 1015} {"train_loss": -21.217239379882812, "global_step": 84257, "epoch": 1015} {"train_loss": -20.600223541259766, "global_step": 84258, "epoch": 1015} {"train_loss": -21.13509178161621, "global_step": 84259, "epoch": 1015} {"train_loss": -20.95439338684082, "global_step": 84260, "epoch": 1015} {"train_loss": -20.92840576171875, "global_step": 84261, "epoch": 1015} {"train_loss": -21.176605224609375, "global_step": 84262, "epoch": 1015} {"train_loss": -21.137908935546875, "global_step": 84263, "epoch": 1015} {"train_loss": -21.38936424255371, "global_step": 84264, "epoch": 1015} {"train_loss": -20.71364402770996, "global_step": 84265, "epoch": 1015} {"train_loss": -21.293210983276367, "global_step": 84266, "epoch": 1015} {"train_loss": -21.077056884765625, "global_step": 84267, "epoch": 1015} {"train_loss": -21.241952896118164, "global_step": 84268, "epoch": 1015} {"train_loss": -21.391407012939453, "global_step": 84269, "epoch": 1015} {"train_loss": -21.147308349609375, "global_step": 84270, "epoch": 1015} {"train_loss": -21.338579177856445, "global_step": 84271, "epoch": 1015} {"train_loss": -21.301773071289062, "global_step": 84272, "epoch": 1015} {"train_loss": -21.791589736938477, "global_step": 84273, "epoch": 1015} {"train_loss": -21.29510498046875, "global_step": 84274, "epoch": 1015} {"train_loss": -21.42876625061035, "global_step": 84275, "epoch": 1015} {"train_loss": -21.182453155517578, "global_step": 84276, "epoch": 1015} {"train_loss": -21.264358520507812, "global_step": 84277, "epoch": 1015} {"train_loss": -21.748367309570312, "global_step": 84278, "epoch": 1015} {"train_loss": -21.24456024169922, "global_step": 84279, "epoch": 1015} {"train_loss": -21.371265411376953, "global_step": 84280, "epoch": 1015} {"train_loss": -21.15682029724121, "global_step": 84281, "epoch": 1015} {"train_loss": -21.69175148010254, "global_step": 84282, "epoch": 1015} {"train_loss": -21.365272521972656, "global_step": 84283, "epoch": 1015} {"train_loss": -21.41781234741211, "global_step": 84284, "epoch": 1015} {"train_loss": -21.408414840698242, "global_step": 84285, "epoch": 1015} {"train_loss": -21.33558464050293, "global_step": 84286, "epoch": 1015} {"train_loss": -21.106281280517578, "global_step": 84287, "epoch": 1015} {"train_loss": -21.4014835357666, "global_step": 84288, "epoch": 1015} {"train_loss": -21.422393798828125, "global_step": 84289, "epoch": 1015} {"train_loss": -21.108661651611328, "global_step": 84290, "epoch": 1015} {"train_loss": -21.489608764648438, "global_step": 84291, "epoch": 1015} {"train_loss": -21.122314453125, "global_step": 84292, "epoch": 1015} {"train_loss": -21.504751205444336, "global_step": 84293, "epoch": 1015} {"train_loss": -21.472827911376953, "global_step": 84294, "epoch": 1015} {"train_loss": -21.628517150878906, "global_step": 84295, "epoch": 1015} {"train_loss": -21.62204933166504, "global_step": 84296, "epoch": 1015} {"train_loss": -21.32876968383789, "global_step": 84297, "epoch": 1015} {"train_loss": -21.461950302124023, "global_step": 84298, "epoch": 1015} {"train_loss": -21.3774471282959, "global_step": 84299, "epoch": 1015} {"train_loss": -21.46478271484375, "global_step": 84300, "epoch": 1015} {"train_loss": -21.319107055664062, "global_step": 84301, "epoch": 1015} {"train_loss": -21.61907958984375, "global_step": 84302, "epoch": 1015} {"train_loss": -21.657121658325195, "global_step": 84303, "epoch": 1015} {"train_loss": -21.366971969604492, "global_step": 84304, "epoch": 1015} {"train_loss": -21.396589279174805, "global_step": 84305, "epoch": 1015} {"train_loss": -21.332944869995117, "global_step": 84306, "epoch": 1015} {"train_loss": -21.20306968688965, "global_step": 84307, "epoch": 1015} {"train_loss": -21.613983154296875, "global_step": 84308, "epoch": 1015} {"train_loss": -21.468652725219727, "global_step": 84309, "epoch": 1015} {"train_loss": -21.67936897277832, "global_step": 84310, "epoch": 1015} {"train_loss": -21.562314987182617, "global_step": 84311, "epoch": 1015} {"train_loss": -21.666091918945312, "global_step": 84312, "epoch": 1015} {"train_loss": -21.702651977539062, "global_step": 84313, "epoch": 1015} {"train_loss": -21.354021072387695, "global_step": 84314, "epoch": 1015} {"train_loss": -21.31598472595215, "global_step": 84315, "epoch": 1015} {"train_loss": -21.258344650268555, "global_step": 84316, "epoch": 1015} {"train_loss": -20.99997901916504, "global_step": 84317, "epoch": 1015} {"train_loss": -21.226911544799805, "global_step": 84318, "epoch": 1015} {"train_loss": -20.900806427001953, "global_step": 84319, "epoch": 1015} {"train_loss": -21.14413833618164, "global_step": 84320, "epoch": 1015} {"train_loss": -20.798799514770508, "global_step": 84321, "epoch": 1015} {"train_loss": -20.94626235961914, "global_step": 84322, "epoch": 1015} {"train_loss": -20.954130172729492, "global_step": 84323, "epoch": 1015} {"train_loss": -21.490060806274414, "global_step": 84324, "epoch": 1015} {"train_loss": -21.358570098876953, "global_step": 84325, "epoch": 1015} {"train_loss": -21.377399444580078, "global_step": 84326, "epoch": 1015} {"train_loss": -21.23126781417663, "global_step": 84327, "epoch": 1015, "val_loss": 6056979.5} {"train_loss": -21.19439697265625, "global_step": 84328, "epoch": 1016} {"train_loss": -21.588642120361328, "global_step": 84329, "epoch": 1016} {"train_loss": -21.362150192260742, "global_step": 84330, "epoch": 1016} {"train_loss": -21.268566131591797, "global_step": 84331, "epoch": 1016} {"train_loss": -21.65961265563965, "global_step": 84332, "epoch": 1016} {"train_loss": -21.111860275268555, "global_step": 84333, "epoch": 1016} {"train_loss": -21.286426544189453, "global_step": 84334, "epoch": 1016} {"train_loss": -21.070951461791992, "global_step": 84335, "epoch": 1016} {"train_loss": -21.087814331054688, "global_step": 84336, "epoch": 1016} {"train_loss": -20.897735595703125, "global_step": 84337, "epoch": 1016} {"train_loss": -21.119598388671875, "global_step": 84338, "epoch": 1016} {"train_loss": -21.629674911499023, "global_step": 84339, "epoch": 1016} {"train_loss": -21.24678611755371, "global_step": 84340, "epoch": 1016} {"train_loss": -21.010028839111328, "global_step": 84341, "epoch": 1016} {"train_loss": -21.429983139038086, "global_step": 84342, "epoch": 1016} {"train_loss": -21.308591842651367, "global_step": 84343, "epoch": 1016} {"train_loss": -21.324974060058594, "global_step": 84344, "epoch": 1016} {"train_loss": -21.497501373291016, "global_step": 84345, "epoch": 1016} {"train_loss": -21.590641021728516, "global_step": 84346, "epoch": 1016} {"train_loss": -21.34145736694336, "global_step": 84347, "epoch": 1016} {"train_loss": -21.277883529663086, "global_step": 84348, "epoch": 1016} {"train_loss": -21.285036087036133, "global_step": 84349, "epoch": 1016} {"train_loss": -21.099742889404297, "global_step": 84350, "epoch": 1016} {"train_loss": -21.10367774963379, "global_step": 84351, "epoch": 1016} {"train_loss": -21.517192840576172, "global_step": 84352, "epoch": 1016} {"train_loss": -21.23316764831543, "global_step": 84353, "epoch": 1016} {"train_loss": -21.37325668334961, "global_step": 84354, "epoch": 1016} {"train_loss": -21.583669662475586, "global_step": 84355, "epoch": 1016} {"train_loss": -21.578771591186523, "global_step": 84356, "epoch": 1016} {"train_loss": -21.118696212768555, "global_step": 84357, "epoch": 1016} {"train_loss": -21.3367862701416, "global_step": 84358, "epoch": 1016} {"train_loss": -21.641742706298828, "global_step": 84359, "epoch": 1016} {"train_loss": -21.235584259033203, "global_step": 84360, "epoch": 1016} {"train_loss": -21.64176368713379, "global_step": 84361, "epoch": 1016} {"train_loss": -21.652690887451172, "global_step": 84362, "epoch": 1016} {"train_loss": -21.6766357421875, "global_step": 84363, "epoch": 1016} {"train_loss": -21.49624252319336, "global_step": 84364, "epoch": 1016} {"train_loss": -21.431947708129883, "global_step": 84365, "epoch": 1016} {"train_loss": -21.055179595947266, "global_step": 84366, "epoch": 1016} {"train_loss": -20.906484603881836, "global_step": 84367, "epoch": 1016} {"train_loss": -21.534687042236328, "global_step": 84368, "epoch": 1016} {"train_loss": -21.119413375854492, "global_step": 84369, "epoch": 1016} {"train_loss": -21.48946762084961, "global_step": 84370, "epoch": 1016} {"train_loss": -21.4088077545166, "global_step": 84371, "epoch": 1016} {"train_loss": -20.944913864135742, "global_step": 84372, "epoch": 1016} {"train_loss": -21.676753997802734, "global_step": 84373, "epoch": 1016} {"train_loss": -21.163284301757812, "global_step": 84374, "epoch": 1016} {"train_loss": -21.50457191467285, "global_step": 84375, "epoch": 1016} {"train_loss": -21.113597869873047, "global_step": 84376, "epoch": 1016} {"train_loss": -21.494678497314453, "global_step": 84377, "epoch": 1016} {"train_loss": -21.265792846679688, "global_step": 84378, "epoch": 1016} {"train_loss": -21.379499435424805, "global_step": 84379, "epoch": 1016} {"train_loss": -21.295087814331055, "global_step": 84380, "epoch": 1016} {"train_loss": -21.61638832092285, "global_step": 84381, "epoch": 1016} {"train_loss": -21.311389923095703, "global_step": 84382, "epoch": 1016} {"train_loss": -21.56955337524414, "global_step": 84383, "epoch": 1016} {"train_loss": -21.34305763244629, "global_step": 84384, "epoch": 1016} {"train_loss": -21.986858367919922, "global_step": 84385, "epoch": 1016} {"train_loss": -21.501203536987305, "global_step": 84386, "epoch": 1016} {"train_loss": -21.671506881713867, "global_step": 84387, "epoch": 1016} {"train_loss": -21.083341598510742, "global_step": 84388, "epoch": 1016} {"train_loss": -21.194868087768555, "global_step": 84389, "epoch": 1016} {"train_loss": -21.37323570251465, "global_step": 84390, "epoch": 1016} {"train_loss": -21.596406936645508, "global_step": 84391, "epoch": 1016} {"train_loss": -21.524181365966797, "global_step": 84392, "epoch": 1016} {"train_loss": -21.575586318969727, "global_step": 84393, "epoch": 1016} {"train_loss": -21.516767501831055, "global_step": 84394, "epoch": 1016} {"train_loss": -21.202373504638672, "global_step": 84395, "epoch": 1016} {"train_loss": -21.481332778930664, "global_step": 84396, "epoch": 1016} {"train_loss": -21.18648338317871, "global_step": 84397, "epoch": 1016} {"train_loss": -21.330463409423828, "global_step": 84398, "epoch": 1016} {"train_loss": -21.508211135864258, "global_step": 84399, "epoch": 1016} {"train_loss": -21.229068756103516, "global_step": 84400, "epoch": 1016} {"train_loss": -21.93849754333496, "global_step": 84401, "epoch": 1016} {"train_loss": -21.534393310546875, "global_step": 84402, "epoch": 1016} {"train_loss": -21.390771865844727, "global_step": 84403, "epoch": 1016} {"train_loss": -21.43793296813965, "global_step": 84404, "epoch": 1016} {"train_loss": -21.22569465637207, "global_step": 84405, "epoch": 1016} {"train_loss": -21.1925048828125, "global_step": 84406, "epoch": 1016} {"train_loss": -21.553152084350586, "global_step": 84407, "epoch": 1016} {"train_loss": -21.554349899291992, "global_step": 84408, "epoch": 1016} {"train_loss": -21.161081314086914, "global_step": 84409, "epoch": 1016} {"train_loss": -21.376932534826807, "global_step": 84410, "epoch": 1016, "val_loss": 6137582.5} {"train_loss": -20.893064498901367, "global_step": 84411, "epoch": 1017} {"train_loss": -21.409021377563477, "global_step": 84412, "epoch": 1017} {"train_loss": -20.82943344116211, "global_step": 84413, "epoch": 1017} {"train_loss": -21.012283325195312, "global_step": 84414, "epoch": 1017} {"train_loss": -21.10931968688965, "global_step": 84415, "epoch": 1017} {"train_loss": -21.137929916381836, "global_step": 84416, "epoch": 1017} {"train_loss": -20.8698787689209, "global_step": 84417, "epoch": 1017} {"train_loss": -21.504180908203125, "global_step": 84418, "epoch": 1017} {"train_loss": -21.18625831604004, "global_step": 84419, "epoch": 1017} {"train_loss": -21.2121639251709, "global_step": 84420, "epoch": 1017} {"train_loss": -21.475332260131836, "global_step": 84421, "epoch": 1017} {"train_loss": -21.462677001953125, "global_step": 84422, "epoch": 1017} {"train_loss": -21.31727409362793, "global_step": 84423, "epoch": 1017} {"train_loss": -21.463712692260742, "global_step": 84424, "epoch": 1017} {"train_loss": -20.994586944580078, "global_step": 84425, "epoch": 1017} {"train_loss": -21.325258255004883, "global_step": 84426, "epoch": 1017} {"train_loss": -21.294347763061523, "global_step": 84427, "epoch": 1017} {"train_loss": -21.681249618530273, "global_step": 84428, "epoch": 1017} {"train_loss": -21.38017463684082, "global_step": 84429, "epoch": 1017} {"train_loss": -21.4449520111084, "global_step": 84430, "epoch": 1017} {"train_loss": -21.303112030029297, "global_step": 84431, "epoch": 1017} {"train_loss": -21.2486515045166, "global_step": 84432, "epoch": 1017} {"train_loss": -21.418363571166992, "global_step": 84433, "epoch": 1017} {"train_loss": -21.13770866394043, "global_step": 84434, "epoch": 1017} {"train_loss": -21.322521209716797, "global_step": 84435, "epoch": 1017} {"train_loss": -21.61875343322754, "global_step": 84436, "epoch": 1017} {"train_loss": -21.53427505493164, "global_step": 84437, "epoch": 1017} {"train_loss": -21.3548583984375, "global_step": 84438, "epoch": 1017} {"train_loss": -21.365863800048828, "global_step": 84439, "epoch": 1017} {"train_loss": -21.144184112548828, "global_step": 84440, "epoch": 1017} {"train_loss": -21.182950973510742, "global_step": 84441, "epoch": 1017} {"train_loss": -21.7956600189209, "global_step": 84442, "epoch": 1017} {"train_loss": -21.23082733154297, "global_step": 84443, "epoch": 1017} {"train_loss": -21.510679244995117, "global_step": 84444, "epoch": 1017} {"train_loss": -20.623455047607422, "global_step": 84445, "epoch": 1017} {"train_loss": -21.40694236755371, "global_step": 84446, "epoch": 1017} {"train_loss": -21.61728286743164, "global_step": 84447, "epoch": 1017} {"train_loss": -21.55789566040039, "global_step": 84448, "epoch": 1017} {"train_loss": -21.404747009277344, "global_step": 84449, "epoch": 1017} {"train_loss": -21.52302360534668, "global_step": 84450, "epoch": 1017} {"train_loss": -21.486988067626953, "global_step": 84451, "epoch": 1017} {"train_loss": -20.775693893432617, "global_step": 84452, "epoch": 1017} {"train_loss": -21.24543571472168, "global_step": 84453, "epoch": 1017} {"train_loss": -21.754867553710938, "global_step": 84454, "epoch": 1017} {"train_loss": -21.147857666015625, "global_step": 84455, "epoch": 1017} {"train_loss": -21.111286163330078, "global_step": 84456, "epoch": 1017} {"train_loss": -21.247257232666016, "global_step": 84457, "epoch": 1017} {"train_loss": -21.60589599609375, "global_step": 84458, "epoch": 1017} {"train_loss": -21.66840171813965, "global_step": 84459, "epoch": 1017} {"train_loss": -21.44223976135254, "global_step": 84460, "epoch": 1017} {"train_loss": -21.240747451782227, "global_step": 84461, "epoch": 1017} {"train_loss": -21.339468002319336, "global_step": 84462, "epoch": 1017} {"train_loss": -21.28250503540039, "global_step": 84463, "epoch": 1017} {"train_loss": -21.215173721313477, "global_step": 84464, "epoch": 1017} {"train_loss": -21.412418365478516, "global_step": 84465, "epoch": 1017} {"train_loss": -21.337461471557617, "global_step": 84466, "epoch": 1017} {"train_loss": -21.42326545715332, "global_step": 84467, "epoch": 1017} {"train_loss": -21.239662170410156, "global_step": 84468, "epoch": 1017} {"train_loss": -21.46876335144043, "global_step": 84469, "epoch": 1017} {"train_loss": -21.583110809326172, "global_step": 84470, "epoch": 1017} {"train_loss": -21.335163116455078, "global_step": 84471, "epoch": 1017} {"train_loss": -21.33154296875, "global_step": 84472, "epoch": 1017} {"train_loss": -21.08245277404785, "global_step": 84473, "epoch": 1017} {"train_loss": -21.480091094970703, "global_step": 84474, "epoch": 1017} {"train_loss": -21.43795394897461, "global_step": 84475, "epoch": 1017} {"train_loss": -21.319019317626953, "global_step": 84476, "epoch": 1017} {"train_loss": -21.367597579956055, "global_step": 84477, "epoch": 1017} {"train_loss": -21.03177833557129, "global_step": 84478, "epoch": 1017} {"train_loss": -21.55990219116211, "global_step": 84479, "epoch": 1017} {"train_loss": -21.465667724609375, "global_step": 84480, "epoch": 1017} {"train_loss": -21.35066795349121, "global_step": 84481, "epoch": 1017} {"train_loss": -21.227415084838867, "global_step": 84482, "epoch": 1017} {"train_loss": -21.415830612182617, "global_step": 84483, "epoch": 1017} {"train_loss": -21.30044174194336, "global_step": 84484, "epoch": 1017} {"train_loss": -21.348596572875977, "global_step": 84485, "epoch": 1017} {"train_loss": -21.387195587158203, "global_step": 84486, "epoch": 1017} {"train_loss": -21.50739097595215, "global_step": 84487, "epoch": 1017} {"train_loss": -21.264503479003906, "global_step": 84488, "epoch": 1017} {"train_loss": -21.07404136657715, "global_step": 84489, "epoch": 1017} {"train_loss": -21.97435760498047, "global_step": 84490, "epoch": 1017} {"train_loss": -21.509008407592773, "global_step": 84491, "epoch": 1017} {"train_loss": -21.540225982666016, "global_step": 84492, "epoch": 1017} {"train_loss": -21.345571793705584, "global_step": 84493, "epoch": 1017, "val_loss": 5960243.0} {"train_loss": -20.869300842285156, "global_step": 84494, "epoch": 1018} {"train_loss": -20.96982765197754, "global_step": 84495, "epoch": 1018} {"train_loss": -20.614490509033203, "global_step": 84496, "epoch": 1018} {"train_loss": -21.064908981323242, "global_step": 84497, "epoch": 1018} {"train_loss": -20.825178146362305, "global_step": 84498, "epoch": 1018} {"train_loss": -21.12761878967285, "global_step": 84499, "epoch": 1018} {"train_loss": -21.2219295501709, "global_step": 84500, "epoch": 1018} {"train_loss": -20.94901466369629, "global_step": 84501, "epoch": 1018} {"train_loss": -21.06044578552246, "global_step": 84502, "epoch": 1018} {"train_loss": -21.677900314331055, "global_step": 84503, "epoch": 1018} {"train_loss": -20.855375289916992, "global_step": 84504, "epoch": 1018} {"train_loss": -21.42753028869629, "global_step": 84505, "epoch": 1018} {"train_loss": -21.16727066040039, "global_step": 84506, "epoch": 1018} {"train_loss": -21.036718368530273, "global_step": 84507, "epoch": 1018} {"train_loss": -21.054126739501953, "global_step": 84508, "epoch": 1018} {"train_loss": -20.877079010009766, "global_step": 84509, "epoch": 1018} {"train_loss": -21.34803581237793, "global_step": 84510, "epoch": 1018} {"train_loss": -21.263158798217773, "global_step": 84511, "epoch": 1018} {"train_loss": -21.424087524414062, "global_step": 84512, "epoch": 1018} {"train_loss": -21.214157104492188, "global_step": 84513, "epoch": 1018} {"train_loss": -21.297378540039062, "global_step": 84514, "epoch": 1018} {"train_loss": -21.253698348999023, "global_step": 84515, "epoch": 1018} {"train_loss": -21.43918800354004, "global_step": 84516, "epoch": 1018} {"train_loss": -21.08662223815918, "global_step": 84517, "epoch": 1018} {"train_loss": -21.145349502563477, "global_step": 84518, "epoch": 1018} {"train_loss": -21.24277114868164, "global_step": 84519, "epoch": 1018} {"train_loss": -21.288034439086914, "global_step": 84520, "epoch": 1018} {"train_loss": -21.47707176208496, "global_step": 84521, "epoch": 1018} {"train_loss": -21.604480743408203, "global_step": 84522, "epoch": 1018} {"train_loss": -21.312305450439453, "global_step": 84523, "epoch": 1018} {"train_loss": -21.45918846130371, "global_step": 84524, "epoch": 1018} {"train_loss": -21.549713134765625, "global_step": 84525, "epoch": 1018} {"train_loss": -21.50623321533203, "global_step": 84526, "epoch": 1018} {"train_loss": -21.28368377685547, "global_step": 84527, "epoch": 1018} {"train_loss": -21.14157485961914, "global_step": 84528, "epoch": 1018} {"train_loss": -21.363393783569336, "global_step": 84529, "epoch": 1018} {"train_loss": -21.398221969604492, "global_step": 84530, "epoch": 1018} {"train_loss": -21.18879508972168, "global_step": 84531, "epoch": 1018} {"train_loss": -21.299535751342773, "global_step": 84532, "epoch": 1018} {"train_loss": -21.31145668029785, "global_step": 84533, "epoch": 1018} {"train_loss": -21.21537208557129, "global_step": 84534, "epoch": 1018} {"train_loss": -21.315937042236328, "global_step": 84535, "epoch": 1018} {"train_loss": -21.044843673706055, "global_step": 84536, "epoch": 1018} {"train_loss": -21.40797233581543, "global_step": 84537, "epoch": 1018} {"train_loss": -20.954313278198242, "global_step": 84538, "epoch": 1018} {"train_loss": -21.29901885986328, "global_step": 84539, "epoch": 1018} {"train_loss": -21.55805778503418, "global_step": 84540, "epoch": 1018} {"train_loss": -21.637805938720703, "global_step": 84541, "epoch": 1018} {"train_loss": -21.04949951171875, "global_step": 84542, "epoch": 1018} {"train_loss": -21.73029899597168, "global_step": 84543, "epoch": 1018} {"train_loss": -21.52399444580078, "global_step": 84544, "epoch": 1018} {"train_loss": -21.550823211669922, "global_step": 84545, "epoch": 1018} {"train_loss": -21.122669219970703, "global_step": 84546, "epoch": 1018} {"train_loss": -21.358678817749023, "global_step": 84547, "epoch": 1018} {"train_loss": -21.46138572692871, "global_step": 84548, "epoch": 1018} {"train_loss": -21.124225616455078, "global_step": 84549, "epoch": 1018} {"train_loss": -21.382862091064453, "global_step": 84550, "epoch": 1018} {"train_loss": -21.465362548828125, "global_step": 84551, "epoch": 1018} {"train_loss": -21.635358810424805, "global_step": 84552, "epoch": 1018} {"train_loss": -21.225839614868164, "global_step": 84553, "epoch": 1018} {"train_loss": -21.535078048706055, "global_step": 84554, "epoch": 1018} {"train_loss": -20.908472061157227, "global_step": 84555, "epoch": 1018} {"train_loss": -21.41366958618164, "global_step": 84556, "epoch": 1018} {"train_loss": -21.287738800048828, "global_step": 84557, "epoch": 1018} {"train_loss": -21.56654167175293, "global_step": 84558, "epoch": 1018} {"train_loss": -21.087331771850586, "global_step": 84559, "epoch": 1018} {"train_loss": -21.02910804748535, "global_step": 84560, "epoch": 1018} {"train_loss": -21.033349990844727, "global_step": 84561, "epoch": 1018} {"train_loss": -21.70030975341797, "global_step": 84562, "epoch": 1018} {"train_loss": -21.258024215698242, "global_step": 84563, "epoch": 1018} {"train_loss": -21.462636947631836, "global_step": 84564, "epoch": 1018} {"train_loss": -21.73504066467285, "global_step": 84565, "epoch": 1018} {"train_loss": -21.333984375, "global_step": 84566, "epoch": 1018} {"train_loss": -21.927780151367188, "global_step": 84567, "epoch": 1018} {"train_loss": -21.38044548034668, "global_step": 84568, "epoch": 1018} {"train_loss": -21.499771118164062, "global_step": 84569, "epoch": 1018} {"train_loss": -21.30019187927246, "global_step": 84570, "epoch": 1018} {"train_loss": -21.6143798828125, "global_step": 84571, "epoch": 1018} {"train_loss": -21.218605041503906, "global_step": 84572, "epoch": 1018} {"train_loss": -21.762409210205078, "global_step": 84573, "epoch": 1018} {"train_loss": -21.55497169494629, "global_step": 84574, "epoch": 1018} {"train_loss": -21.563064575195312, "global_step": 84575, "epoch": 1018} {"train_loss": -21.295880972620953, "global_step": 84576, "epoch": 1018, "val_loss": 6101271.0} {"train_loss": -21.02231788635254, "global_step": 84577, "epoch": 1019} {"train_loss": -21.28818702697754, "global_step": 84578, "epoch": 1019} {"train_loss": -21.145767211914062, "global_step": 84579, "epoch": 1019} {"train_loss": -21.161115646362305, "global_step": 84580, "epoch": 1019} {"train_loss": -21.38495445251465, "global_step": 84581, "epoch": 1019} {"train_loss": -20.968664169311523, "global_step": 84582, "epoch": 1019} {"train_loss": -21.034156799316406, "global_step": 84583, "epoch": 1019} {"train_loss": -21.442615509033203, "global_step": 84584, "epoch": 1019} {"train_loss": -21.189786911010742, "global_step": 84585, "epoch": 1019} {"train_loss": -21.280515670776367, "global_step": 84586, "epoch": 1019} {"train_loss": -21.30595588684082, "global_step": 84587, "epoch": 1019} {"train_loss": -21.398969650268555, "global_step": 84588, "epoch": 1019} {"train_loss": -21.806598663330078, "global_step": 84589, "epoch": 1019} {"train_loss": -21.743370056152344, "global_step": 84590, "epoch": 1019} {"train_loss": -21.203657150268555, "global_step": 84591, "epoch": 1019} {"train_loss": -21.31641387939453, "global_step": 84592, "epoch": 1019} {"train_loss": -21.27738380432129, "global_step": 84593, "epoch": 1019} {"train_loss": -21.6373348236084, "global_step": 84594, "epoch": 1019} {"train_loss": -21.480667114257812, "global_step": 84595, "epoch": 1019} {"train_loss": -21.661989212036133, "global_step": 84596, "epoch": 1019} {"train_loss": -21.492856979370117, "global_step": 84597, "epoch": 1019} {"train_loss": -21.186946868896484, "global_step": 84598, "epoch": 1019} {"train_loss": -21.24895668029785, "global_step": 84599, "epoch": 1019} {"train_loss": -21.554454803466797, "global_step": 84600, "epoch": 1019} {"train_loss": -21.43666648864746, "global_step": 84601, "epoch": 1019} {"train_loss": -21.773183822631836, "global_step": 84602, "epoch": 1019} {"train_loss": -21.363927841186523, "global_step": 84603, "epoch": 1019} {"train_loss": -21.384021759033203, "global_step": 84604, "epoch": 1019} {"train_loss": -21.19646644592285, "global_step": 84605, "epoch": 1019} {"train_loss": -21.71478843688965, "global_step": 84606, "epoch": 1019} {"train_loss": -21.510717391967773, "global_step": 84607, "epoch": 1019} {"train_loss": -21.83513641357422, "global_step": 84608, "epoch": 1019} {"train_loss": -21.566390991210938, "global_step": 84609, "epoch": 1019} {"train_loss": -21.502016067504883, "global_step": 84610, "epoch": 1019} {"train_loss": -21.6085147857666, "global_step": 84611, "epoch": 1019} {"train_loss": -21.616422653198242, "global_step": 84612, "epoch": 1019} {"train_loss": -21.4942626953125, "global_step": 84613, "epoch": 1019} {"train_loss": -21.395858764648438, "global_step": 84614, "epoch": 1019} {"train_loss": -21.49860191345215, "global_step": 84615, "epoch": 1019} {"train_loss": -21.68166732788086, "global_step": 84616, "epoch": 1019} {"train_loss": -21.313678741455078, "global_step": 84617, "epoch": 1019} {"train_loss": -21.507719039916992, "global_step": 84618, "epoch": 1019} {"train_loss": -20.9503173828125, "global_step": 84619, "epoch": 1019} {"train_loss": -21.15081214904785, "global_step": 84620, "epoch": 1019} {"train_loss": -21.216379165649414, "global_step": 84621, "epoch": 1019} {"train_loss": -21.117462158203125, "global_step": 84622, "epoch": 1019} {"train_loss": -21.54231834411621, "global_step": 84623, "epoch": 1019} {"train_loss": -21.281339645385742, "global_step": 84624, "epoch": 1019} {"train_loss": -21.184368133544922, "global_step": 84625, "epoch": 1019} {"train_loss": -21.18512535095215, "global_step": 84626, "epoch": 1019} {"train_loss": -21.04851722717285, "global_step": 84627, "epoch": 1019} {"train_loss": -21.252607345581055, "global_step": 84628, "epoch": 1019} {"train_loss": -21.416709899902344, "global_step": 84629, "epoch": 1019} {"train_loss": -21.017873764038086, "global_step": 84630, "epoch": 1019} {"train_loss": -21.361722946166992, "global_step": 84631, "epoch": 1019} {"train_loss": -21.1855525970459, "global_step": 84632, "epoch": 1019} {"train_loss": -21.522262573242188, "global_step": 84633, "epoch": 1019} {"train_loss": -21.437908172607422, "global_step": 84634, "epoch": 1019} {"train_loss": -21.517087936401367, "global_step": 84635, "epoch": 1019} {"train_loss": -21.252836227416992, "global_step": 84636, "epoch": 1019} {"train_loss": -21.214033126831055, "global_step": 84637, "epoch": 1019} {"train_loss": -21.656469345092773, "global_step": 84638, "epoch": 1019} {"train_loss": -21.183340072631836, "global_step": 84639, "epoch": 1019} {"train_loss": -21.360336303710938, "global_step": 84640, "epoch": 1019} {"train_loss": -21.055938720703125, "global_step": 84641, "epoch": 1019} {"train_loss": -20.884435653686523, "global_step": 84642, "epoch": 1019} {"train_loss": -21.591594696044922, "global_step": 84643, "epoch": 1019} {"train_loss": -21.305978775024414, "global_step": 84644, "epoch": 1019} {"train_loss": -21.386390686035156, "global_step": 84645, "epoch": 1019} {"train_loss": -21.327802658081055, "global_step": 84646, "epoch": 1019} {"train_loss": -21.39345359802246, "global_step": 84647, "epoch": 1019} {"train_loss": -21.20847511291504, "global_step": 84648, "epoch": 1019} {"train_loss": -21.30710220336914, "global_step": 84649, "epoch": 1019} {"train_loss": -21.528955459594727, "global_step": 84650, "epoch": 1019} {"train_loss": -21.15366554260254, "global_step": 84651, "epoch": 1019} {"train_loss": -21.339277267456055, "global_step": 84652, "epoch": 1019} {"train_loss": -21.404678344726562, "global_step": 84653, "epoch": 1019} {"train_loss": -21.798900604248047, "global_step": 84654, "epoch": 1019} {"train_loss": -21.31914710998535, "global_step": 84655, "epoch": 1019} {"train_loss": -21.327423095703125, "global_step": 84656, "epoch": 1019} {"train_loss": -21.54607582092285, "global_step": 84657, "epoch": 1019} {"train_loss": -21.35768699645996, "global_step": 84658, "epoch": 1019} {"train_loss": -21.353659158729645, "global_step": 84659, "epoch": 1019, "val_loss": 6086665.5} {"train_loss": -21.02345848083496, "global_step": 84660, "epoch": 1020} {"train_loss": -21.214576721191406, "global_step": 84661, "epoch": 1020} {"train_loss": -21.059856414794922, "global_step": 84662, "epoch": 1020} {"train_loss": -20.924657821655273, "global_step": 84663, "epoch": 1020} {"train_loss": -21.140390396118164, "global_step": 84664, "epoch": 1020} {"train_loss": -21.61092185974121, "global_step": 84665, "epoch": 1020} {"train_loss": -21.02455711364746, "global_step": 84666, "epoch": 1020} {"train_loss": -21.353567123413086, "global_step": 84667, "epoch": 1020} {"train_loss": -21.684694290161133, "global_step": 84668, "epoch": 1020} {"train_loss": -20.777664184570312, "global_step": 84669, "epoch": 1020} {"train_loss": -21.246631622314453, "global_step": 84670, "epoch": 1020} {"train_loss": -21.671850204467773, "global_step": 84671, "epoch": 1020} {"train_loss": -20.79770278930664, "global_step": 84672, "epoch": 1020} {"train_loss": -21.4733943939209, "global_step": 84673, "epoch": 1020} {"train_loss": -21.345251083374023, "global_step": 84674, "epoch": 1020} {"train_loss": -21.089231491088867, "global_step": 84675, "epoch": 1020} {"train_loss": -21.3442440032959, "global_step": 84676, "epoch": 1020} {"train_loss": -21.2910213470459, "global_step": 84677, "epoch": 1020} {"train_loss": -21.406909942626953, "global_step": 84678, "epoch": 1020} {"train_loss": -21.363155364990234, "global_step": 84679, "epoch": 1020} {"train_loss": -21.243587493896484, "global_step": 84680, "epoch": 1020} {"train_loss": -21.336166381835938, "global_step": 84681, "epoch": 1020} {"train_loss": -21.429662704467773, "global_step": 84682, "epoch": 1020} {"train_loss": -21.318735122680664, "global_step": 84683, "epoch": 1020} {"train_loss": -21.4968318939209, "global_step": 84684, "epoch": 1020} {"train_loss": -21.551916122436523, "global_step": 84685, "epoch": 1020} {"train_loss": -21.581787109375, "global_step": 84686, "epoch": 1020} {"train_loss": -21.277570724487305, "global_step": 84687, "epoch": 1020} {"train_loss": -21.37650489807129, "global_step": 84688, "epoch": 1020} {"train_loss": -21.412036895751953, "global_step": 84689, "epoch": 1020} {"train_loss": -21.691387176513672, "global_step": 84690, "epoch": 1020} {"train_loss": -21.168439865112305, "global_step": 84691, "epoch": 1020} {"train_loss": -21.426198959350586, "global_step": 84692, "epoch": 1020} {"train_loss": -21.68339729309082, "global_step": 84693, "epoch": 1020} {"train_loss": -21.745716094970703, "global_step": 84694, "epoch": 1020} {"train_loss": -21.45597267150879, "global_step": 84695, "epoch": 1020} {"train_loss": -21.43845558166504, "global_step": 84696, "epoch": 1020} {"train_loss": -21.577688217163086, "global_step": 84697, "epoch": 1020} {"train_loss": -21.448118209838867, "global_step": 84698, "epoch": 1020} {"train_loss": -21.459442138671875, "global_step": 84699, "epoch": 1020} {"train_loss": -21.654645919799805, "global_step": 84700, "epoch": 1020} {"train_loss": -21.420284271240234, "global_step": 84701, "epoch": 1020} {"train_loss": -21.565580368041992, "global_step": 84702, "epoch": 1020} {"train_loss": -21.45720863342285, "global_step": 84703, "epoch": 1020} {"train_loss": -21.70364761352539, "global_step": 84704, "epoch": 1020} {"train_loss": -21.212718963623047, "global_step": 84705, "epoch": 1020} {"train_loss": -21.262075424194336, "global_step": 84706, "epoch": 1020} {"train_loss": -21.315031051635742, "global_step": 84707, "epoch": 1020} {"train_loss": -21.381635665893555, "global_step": 84708, "epoch": 1020} {"train_loss": -21.22940444946289, "global_step": 84709, "epoch": 1020} {"train_loss": -21.20021629333496, "global_step": 84710, "epoch": 1020} {"train_loss": -21.399585723876953, "global_step": 84711, "epoch": 1020} {"train_loss": -21.02203941345215, "global_step": 84712, "epoch": 1020} {"train_loss": -21.25841522216797, "global_step": 84713, "epoch": 1020} {"train_loss": -21.701446533203125, "global_step": 84714, "epoch": 1020} {"train_loss": -21.569284439086914, "global_step": 84715, "epoch": 1020} {"train_loss": -22.006933212280273, "global_step": 84716, "epoch": 1020} {"train_loss": -21.588041305541992, "global_step": 84717, "epoch": 1020} {"train_loss": -21.58577537536621, "global_step": 84718, "epoch": 1020} {"train_loss": -21.261734008789062, "global_step": 84719, "epoch": 1020} {"train_loss": -21.504314422607422, "global_step": 84720, "epoch": 1020} {"train_loss": -21.676542282104492, "global_step": 84721, "epoch": 1020} {"train_loss": -21.374309539794922, "global_step": 84722, "epoch": 1020} {"train_loss": -20.949636459350586, "global_step": 84723, "epoch": 1020} {"train_loss": -21.444801330566406, "global_step": 84724, "epoch": 1020} {"train_loss": -21.337339401245117, "global_step": 84725, "epoch": 1020} {"train_loss": -21.660140991210938, "global_step": 84726, "epoch": 1020} {"train_loss": -21.47658920288086, "global_step": 84727, "epoch": 1020} {"train_loss": -21.753847122192383, "global_step": 84728, "epoch": 1020} {"train_loss": -21.406234741210938, "global_step": 84729, "epoch": 1020} {"train_loss": -21.40309715270996, "global_step": 84730, "epoch": 1020} {"train_loss": -21.361225128173828, "global_step": 84731, "epoch": 1020} {"train_loss": -21.692716598510742, "global_step": 84732, "epoch": 1020} {"train_loss": -21.86244773864746, "global_step": 84733, "epoch": 1020} {"train_loss": -21.505197525024414, "global_step": 84734, "epoch": 1020} {"train_loss": -21.5023193359375, "global_step": 84735, "epoch": 1020} {"train_loss": -21.046998977661133, "global_step": 84736, "epoch": 1020} {"train_loss": -21.717756271362305, "global_step": 84737, "epoch": 1020} {"train_loss": -21.108549118041992, "global_step": 84738, "epoch": 1020} {"train_loss": -21.71445655822754, "global_step": 84739, "epoch": 1020} {"train_loss": -21.41322898864746, "global_step": 84740, "epoch": 1020} {"train_loss": -21.221403121948242, "global_step": 84741, "epoch": 1020} {"train_loss": -21.40623995769455, "global_step": 84742, "epoch": 1020, "val_loss": 6055474.0} {"train_loss": -20.377639770507812, "global_step": 84743, "epoch": 1021} {"train_loss": -21.02568244934082, "global_step": 84744, "epoch": 1021} {"train_loss": -20.757062911987305, "global_step": 84745, "epoch": 1021} {"train_loss": -20.947179794311523, "global_step": 84746, "epoch": 1021} {"train_loss": -20.79070472717285, "global_step": 84747, "epoch": 1021} {"train_loss": -20.245166778564453, "global_step": 84748, "epoch": 1021} {"train_loss": -20.838123321533203, "global_step": 84749, "epoch": 1021} {"train_loss": -20.4864559173584, "global_step": 84750, "epoch": 1021} {"train_loss": -20.72650718688965, "global_step": 84751, "epoch": 1021} {"train_loss": -21.044631958007812, "global_step": 84752, "epoch": 1021} {"train_loss": -20.8231143951416, "global_step": 84753, "epoch": 1021} {"train_loss": -21.221921920776367, "global_step": 84754, "epoch": 1021} {"train_loss": -21.480998992919922, "global_step": 84755, "epoch": 1021} {"train_loss": -20.99493980407715, "global_step": 84756, "epoch": 1021} {"train_loss": -21.212926864624023, "global_step": 84757, "epoch": 1021} {"train_loss": -21.324750900268555, "global_step": 84758, "epoch": 1021} {"train_loss": -21.492767333984375, "global_step": 84759, "epoch": 1021} {"train_loss": -21.117263793945312, "global_step": 84760, "epoch": 1021} {"train_loss": -20.984973907470703, "global_step": 84761, "epoch": 1021} {"train_loss": -21.35256004333496, "global_step": 84762, "epoch": 1021} {"train_loss": -20.855928421020508, "global_step": 84763, "epoch": 1021} {"train_loss": -21.41756248474121, "global_step": 84764, "epoch": 1021} {"train_loss": -21.1563720703125, "global_step": 84765, "epoch": 1021} {"train_loss": -21.29485511779785, "global_step": 84766, "epoch": 1021} {"train_loss": -21.425785064697266, "global_step": 84767, "epoch": 1021} {"train_loss": -21.236677169799805, "global_step": 84768, "epoch": 1021} {"train_loss": -20.900222778320312, "global_step": 84769, "epoch": 1021} {"train_loss": -21.184112548828125, "global_step": 84770, "epoch": 1021} {"train_loss": -21.724502563476562, "global_step": 84771, "epoch": 1021} {"train_loss": -21.405540466308594, "global_step": 84772, "epoch": 1021} {"train_loss": -21.85076904296875, "global_step": 84773, "epoch": 1021} {"train_loss": -21.350847244262695, "global_step": 84774, "epoch": 1021} {"train_loss": -21.398725509643555, "global_step": 84775, "epoch": 1021} {"train_loss": -21.23458480834961, "global_step": 84776, "epoch": 1021} {"train_loss": -21.351850509643555, "global_step": 84777, "epoch": 1021} {"train_loss": -21.686935424804688, "global_step": 84778, "epoch": 1021} {"train_loss": -21.46012306213379, "global_step": 84779, "epoch": 1021} {"train_loss": -21.78769874572754, "global_step": 84780, "epoch": 1021} {"train_loss": -21.801990509033203, "global_step": 84781, "epoch": 1021} {"train_loss": -21.651559829711914, "global_step": 84782, "epoch": 1021} {"train_loss": -21.651294708251953, "global_step": 84783, "epoch": 1021} {"train_loss": -21.341943740844727, "global_step": 84784, "epoch": 1021} {"train_loss": -21.761829376220703, "global_step": 84785, "epoch": 1021} {"train_loss": -21.507421493530273, "global_step": 84786, "epoch": 1021} {"train_loss": -21.18511199951172, "global_step": 84787, "epoch": 1021} {"train_loss": -21.4705753326416, "global_step": 84788, "epoch": 1021} {"train_loss": -21.87459945678711, "global_step": 84789, "epoch": 1021} {"train_loss": -21.14676284790039, "global_step": 84790, "epoch": 1021} {"train_loss": -21.617328643798828, "global_step": 84791, "epoch": 1021} {"train_loss": -21.290931701660156, "global_step": 84792, "epoch": 1021} {"train_loss": -21.439783096313477, "global_step": 84793, "epoch": 1021} {"train_loss": -21.178997039794922, "global_step": 84794, "epoch": 1021} {"train_loss": -21.178476333618164, "global_step": 84795, "epoch": 1021} {"train_loss": -21.609525680541992, "global_step": 84796, "epoch": 1021} {"train_loss": -21.481958389282227, "global_step": 84797, "epoch": 1021} {"train_loss": -21.191116333007812, "global_step": 84798, "epoch": 1021} {"train_loss": -21.261510848999023, "global_step": 84799, "epoch": 1021} {"train_loss": -20.933744430541992, "global_step": 84800, "epoch": 1021} {"train_loss": -21.388452529907227, "global_step": 84801, "epoch": 1021} {"train_loss": -21.36952018737793, "global_step": 84802, "epoch": 1021} {"train_loss": -21.404903411865234, "global_step": 84803, "epoch": 1021} {"train_loss": -21.211156845092773, "global_step": 84804, "epoch": 1021} {"train_loss": -21.549671173095703, "global_step": 84805, "epoch": 1021} {"train_loss": -21.41916275024414, "global_step": 84806, "epoch": 1021} {"train_loss": -21.185110092163086, "global_step": 84807, "epoch": 1021} {"train_loss": -21.015899658203125, "global_step": 84808, "epoch": 1021} {"train_loss": -21.648366928100586, "global_step": 84809, "epoch": 1021} {"train_loss": -21.266193389892578, "global_step": 84810, "epoch": 1021} {"train_loss": -21.3106689453125, "global_step": 84811, "epoch": 1021} {"train_loss": -21.52226448059082, "global_step": 84812, "epoch": 1021} {"train_loss": -21.238510131835938, "global_step": 84813, "epoch": 1021} {"train_loss": -21.518325805664062, "global_step": 84814, "epoch": 1021} {"train_loss": -21.449766159057617, "global_step": 84815, "epoch": 1021} {"train_loss": -21.49408531188965, "global_step": 84816, "epoch": 1021} {"train_loss": -21.680795669555664, "global_step": 84817, "epoch": 1021} {"train_loss": -21.494237899780273, "global_step": 84818, "epoch": 1021} {"train_loss": -21.497774124145508, "global_step": 84819, "epoch": 1021} {"train_loss": -21.377798080444336, "global_step": 84820, "epoch": 1021} {"train_loss": -21.18326759338379, "global_step": 84821, "epoch": 1021} {"train_loss": -21.430130004882812, "global_step": 84822, "epoch": 1021} {"train_loss": -21.070154190063477, "global_step": 84823, "epoch": 1021} {"train_loss": -21.57358169555664, "global_step": 84824, "epoch": 1021} {"train_loss": -21.27548564773008, "global_step": 84825, "epoch": 1021, "val_loss": 6173623.5} {"train_loss": -20.553434371948242, "global_step": 84826, "epoch": 1022} {"train_loss": -20.821205139160156, "global_step": 84827, "epoch": 1022} {"train_loss": -21.211978912353516, "global_step": 84828, "epoch": 1022} {"train_loss": -21.232587814331055, "global_step": 84829, "epoch": 1022} {"train_loss": -20.803756713867188, "global_step": 84830, "epoch": 1022} {"train_loss": -20.88736343383789, "global_step": 84831, "epoch": 1022} {"train_loss": -21.09871482849121, "global_step": 84832, "epoch": 1022} {"train_loss": -21.072128295898438, "global_step": 84833, "epoch": 1022} {"train_loss": -21.107044219970703, "global_step": 84834, "epoch": 1022} {"train_loss": -20.869043350219727, "global_step": 84835, "epoch": 1022} {"train_loss": -20.916584014892578, "global_step": 84836, "epoch": 1022} {"train_loss": -21.046710968017578, "global_step": 84837, "epoch": 1022} {"train_loss": -21.342416763305664, "global_step": 84838, "epoch": 1022} {"train_loss": -21.34242820739746, "global_step": 84839, "epoch": 1022} {"train_loss": -21.23927116394043, "global_step": 84840, "epoch": 1022} {"train_loss": -21.405912399291992, "global_step": 84841, "epoch": 1022} {"train_loss": -20.978721618652344, "global_step": 84842, "epoch": 1022} {"train_loss": -21.182798385620117, "global_step": 84843, "epoch": 1022} {"train_loss": -21.253177642822266, "global_step": 84844, "epoch": 1022} {"train_loss": -21.683130264282227, "global_step": 84845, "epoch": 1022} {"train_loss": -21.019563674926758, "global_step": 84846, "epoch": 1022} {"train_loss": -21.142620086669922, "global_step": 84847, "epoch": 1022} {"train_loss": -21.47110366821289, "global_step": 84848, "epoch": 1022} {"train_loss": -21.08266258239746, "global_step": 84849, "epoch": 1022} {"train_loss": -21.66872787475586, "global_step": 84850, "epoch": 1022} {"train_loss": -21.30025863647461, "global_step": 84851, "epoch": 1022} {"train_loss": -21.288686752319336, "global_step": 84852, "epoch": 1022} {"train_loss": -21.73334312438965, "global_step": 84853, "epoch": 1022} {"train_loss": -21.550888061523438, "global_step": 84854, "epoch": 1022} {"train_loss": -21.42316436767578, "global_step": 84855, "epoch": 1022} {"train_loss": -21.408884048461914, "global_step": 84856, "epoch": 1022} {"train_loss": -21.602800369262695, "global_step": 84857, "epoch": 1022} {"train_loss": -21.030364990234375, "global_step": 84858, "epoch": 1022} {"train_loss": -21.387754440307617, "global_step": 84859, "epoch": 1022} {"train_loss": -21.42680549621582, "global_step": 84860, "epoch": 1022} {"train_loss": -21.725204467773438, "global_step": 84861, "epoch": 1022} {"train_loss": -21.512582778930664, "global_step": 84862, "epoch": 1022} {"train_loss": -21.39511489868164, "global_step": 84863, "epoch": 1022} {"train_loss": -21.334796905517578, "global_step": 84864, "epoch": 1022} {"train_loss": -21.595687866210938, "global_step": 84865, "epoch": 1022} {"train_loss": -21.692365646362305, "global_step": 84866, "epoch": 1022} {"train_loss": -21.0788516998291, "global_step": 84867, "epoch": 1022} {"train_loss": -21.579702377319336, "global_step": 84868, "epoch": 1022} {"train_loss": -21.00326919555664, "global_step": 84869, "epoch": 1022} {"train_loss": -21.409345626831055, "global_step": 84870, "epoch": 1022} {"train_loss": -21.588764190673828, "global_step": 84871, "epoch": 1022} {"train_loss": -21.210926055908203, "global_step": 84872, "epoch": 1022} {"train_loss": -21.33358383178711, "global_step": 84873, "epoch": 1022} {"train_loss": -21.03182029724121, "global_step": 84874, "epoch": 1022} {"train_loss": -21.300846099853516, "global_step": 84875, "epoch": 1022} {"train_loss": -21.114002227783203, "global_step": 84876, "epoch": 1022} {"train_loss": -21.370542526245117, "global_step": 84877, "epoch": 1022} {"train_loss": -21.334774017333984, "global_step": 84878, "epoch": 1022} {"train_loss": -21.4176025390625, "global_step": 84879, "epoch": 1022} {"train_loss": -21.615209579467773, "global_step": 84880, "epoch": 1022} {"train_loss": -21.746103286743164, "global_step": 84881, "epoch": 1022} {"train_loss": -21.460355758666992, "global_step": 84882, "epoch": 1022} {"train_loss": -21.692672729492188, "global_step": 84883, "epoch": 1022} {"train_loss": -21.522687911987305, "global_step": 84884, "epoch": 1022} {"train_loss": -21.415878295898438, "global_step": 84885, "epoch": 1022} {"train_loss": -21.195556640625, "global_step": 84886, "epoch": 1022} {"train_loss": -21.66181755065918, "global_step": 84887, "epoch": 1022} {"train_loss": -21.635547637939453, "global_step": 84888, "epoch": 1022} {"train_loss": -21.47373390197754, "global_step": 84889, "epoch": 1022} {"train_loss": -21.314924240112305, "global_step": 84890, "epoch": 1022} {"train_loss": -21.315338134765625, "global_step": 84891, "epoch": 1022} {"train_loss": -21.535409927368164, "global_step": 84892, "epoch": 1022} {"train_loss": -21.269699096679688, "global_step": 84893, "epoch": 1022} {"train_loss": -21.602807998657227, "global_step": 84894, "epoch": 1022} {"train_loss": -21.272964477539062, "global_step": 84895, "epoch": 1022} {"train_loss": -21.507837295532227, "global_step": 84896, "epoch": 1022} {"train_loss": -21.459949493408203, "global_step": 84897, "epoch": 1022} {"train_loss": -21.73770523071289, "global_step": 84898, "epoch": 1022} {"train_loss": -21.36111831665039, "global_step": 84899, "epoch": 1022} {"train_loss": -21.632299423217773, "global_step": 84900, "epoch": 1022} {"train_loss": -21.275081634521484, "global_step": 84901, "epoch": 1022} {"train_loss": -21.42500114440918, "global_step": 84902, "epoch": 1022} {"train_loss": -21.18538475036621, "global_step": 84903, "epoch": 1022} {"train_loss": -21.569820404052734, "global_step": 84904, "epoch": 1022} {"train_loss": -21.579736709594727, "global_step": 84905, "epoch": 1022} {"train_loss": -21.06524085998535, "global_step": 84906, "epoch": 1022} {"train_loss": -21.667200088500977, "global_step": 84907, "epoch": 1022} {"train_loss": -21.357999939516365, "global_step": 84908, "epoch": 1022, "val_loss": 6021644.0} {"train_loss": -21.029584884643555, "global_step": 84909, "epoch": 1023} {"train_loss": -20.716880798339844, "global_step": 84910, "epoch": 1023} {"train_loss": -21.283863067626953, "global_step": 84911, "epoch": 1023} {"train_loss": -21.230506896972656, "global_step": 84912, "epoch": 1023} {"train_loss": -21.549463272094727, "global_step": 84913, "epoch": 1023} {"train_loss": -21.504323959350586, "global_step": 84914, "epoch": 1023} {"train_loss": -21.725605010986328, "global_step": 84915, "epoch": 1023} {"train_loss": -21.403167724609375, "global_step": 84916, "epoch": 1023} {"train_loss": -21.142436981201172, "global_step": 84917, "epoch": 1023} {"train_loss": -21.073883056640625, "global_step": 84918, "epoch": 1023} {"train_loss": -21.17196273803711, "global_step": 84919, "epoch": 1023} {"train_loss": -21.16162872314453, "global_step": 84920, "epoch": 1023} {"train_loss": -21.412322998046875, "global_step": 84921, "epoch": 1023} {"train_loss": -21.512117385864258, "global_step": 84922, "epoch": 1023} {"train_loss": -21.32464599609375, "global_step": 84923, "epoch": 1023} {"train_loss": -21.116867065429688, "global_step": 84924, "epoch": 1023} {"train_loss": -21.620023727416992, "global_step": 84925, "epoch": 1023} {"train_loss": -21.405927658081055, "global_step": 84926, "epoch": 1023} {"train_loss": -21.406660079956055, "global_step": 84927, "epoch": 1023} {"train_loss": -21.36025047302246, "global_step": 84928, "epoch": 1023} {"train_loss": -21.771387100219727, "global_step": 84929, "epoch": 1023} {"train_loss": -21.163002014160156, "global_step": 84930, "epoch": 1023} {"train_loss": -21.331024169921875, "global_step": 84931, "epoch": 1023} {"train_loss": -21.55903434753418, "global_step": 84932, "epoch": 1023} {"train_loss": -21.357675552368164, "global_step": 84933, "epoch": 1023} {"train_loss": -21.388463973999023, "global_step": 84934, "epoch": 1023} {"train_loss": -21.492218017578125, "global_step": 84935, "epoch": 1023} {"train_loss": -21.332992553710938, "global_step": 84936, "epoch": 1023} {"train_loss": -21.414642333984375, "global_step": 84937, "epoch": 1023} {"train_loss": -21.83316993713379, "global_step": 84938, "epoch": 1023} {"train_loss": -21.541309356689453, "global_step": 84939, "epoch": 1023} {"train_loss": -21.481704711914062, "global_step": 84940, "epoch": 1023} {"train_loss": -21.452259063720703, "global_step": 84941, "epoch": 1023} {"train_loss": -21.390607833862305, "global_step": 84942, "epoch": 1023} {"train_loss": -21.38789176940918, "global_step": 84943, "epoch": 1023} {"train_loss": -21.260700225830078, "global_step": 84944, "epoch": 1023} {"train_loss": -21.581144332885742, "global_step": 84945, "epoch": 1023} {"train_loss": -21.18746566772461, "global_step": 84946, "epoch": 1023} {"train_loss": -21.2323055267334, "global_step": 84947, "epoch": 1023} {"train_loss": -21.494312286376953, "global_step": 84948, "epoch": 1023} {"train_loss": -21.156707763671875, "global_step": 84949, "epoch": 1023} {"train_loss": -21.287199020385742, "global_step": 84950, "epoch": 1023} {"train_loss": -21.519807815551758, "global_step": 84951, "epoch": 1023} {"train_loss": -21.250045776367188, "global_step": 84952, "epoch": 1023} {"train_loss": -21.150714874267578, "global_step": 84953, "epoch": 1023} {"train_loss": -21.569089889526367, "global_step": 84954, "epoch": 1023} {"train_loss": -21.52947425842285, "global_step": 84955, "epoch": 1023} {"train_loss": -21.205495834350586, "global_step": 84956, "epoch": 1023} {"train_loss": -21.579038619995117, "global_step": 84957, "epoch": 1023} {"train_loss": -21.64491844177246, "global_step": 84958, "epoch": 1023} {"train_loss": -21.105010986328125, "global_step": 84959, "epoch": 1023} {"train_loss": -21.72955322265625, "global_step": 84960, "epoch": 1023} {"train_loss": -21.091379165649414, "global_step": 84961, "epoch": 1023} {"train_loss": -20.97246742248535, "global_step": 84962, "epoch": 1023} {"train_loss": -21.460418701171875, "global_step": 84963, "epoch": 1023} {"train_loss": -21.49663734436035, "global_step": 84964, "epoch": 1023} {"train_loss": -21.207395553588867, "global_step": 84965, "epoch": 1023} {"train_loss": -21.1861629486084, "global_step": 84966, "epoch": 1023} {"train_loss": -21.168357849121094, "global_step": 84967, "epoch": 1023} {"train_loss": -21.250370025634766, "global_step": 84968, "epoch": 1023} {"train_loss": -21.271711349487305, "global_step": 84969, "epoch": 1023} {"train_loss": -20.94964027404785, "global_step": 84970, "epoch": 1023} {"train_loss": -21.332063674926758, "global_step": 84971, "epoch": 1023} {"train_loss": -21.15607261657715, "global_step": 84972, "epoch": 1023} {"train_loss": -21.103300094604492, "global_step": 84973, "epoch": 1023} {"train_loss": -21.59092140197754, "global_step": 84974, "epoch": 1023} {"train_loss": -20.890592575073242, "global_step": 84975, "epoch": 1023} {"train_loss": -21.290563583374023, "global_step": 84976, "epoch": 1023} {"train_loss": -21.201955795288086, "global_step": 84977, "epoch": 1023} {"train_loss": -21.356054306030273, "global_step": 84978, "epoch": 1023} {"train_loss": -21.581745147705078, "global_step": 84979, "epoch": 1023} {"train_loss": -21.516164779663086, "global_step": 84980, "epoch": 1023} {"train_loss": -21.626468658447266, "global_step": 84981, "epoch": 1023} {"train_loss": -21.69788360595703, "global_step": 84982, "epoch": 1023} {"train_loss": -21.2583065032959, "global_step": 84983, "epoch": 1023} {"train_loss": -21.32317543029785, "global_step": 84984, "epoch": 1023} {"train_loss": -21.737686157226562, "global_step": 84985, "epoch": 1023} {"train_loss": -21.50617218017578, "global_step": 84986, "epoch": 1023} {"train_loss": -21.38251304626465, "global_step": 84987, "epoch": 1023} {"train_loss": -21.366682052612305, "global_step": 84988, "epoch": 1023} {"train_loss": -20.923925399780273, "global_step": 84989, "epoch": 1023} {"train_loss": -21.521411895751953, "global_step": 84990, "epoch": 1023} {"train_loss": -21.362255900739186, "global_step": 84991, "epoch": 1023, "val_loss": 6023155.5} {"train_loss": -20.780027389526367, "global_step": 84992, "epoch": 1024} {"train_loss": -20.695547103881836, "global_step": 84993, "epoch": 1024} {"train_loss": -21.08040428161621, "global_step": 84994, "epoch": 1024} {"train_loss": -21.352256774902344, "global_step": 84995, "epoch": 1024} {"train_loss": -20.696218490600586, "global_step": 84996, "epoch": 1024} {"train_loss": -20.953672409057617, "global_step": 84997, "epoch": 1024} {"train_loss": -21.295608520507812, "global_step": 84998, "epoch": 1024} {"train_loss": -20.806610107421875, "global_step": 84999, "epoch": 1024} {"train_loss": -21.094358444213867, "global_step": 85000, "epoch": 1024} {"train_loss": -21.232404708862305, "global_step": 85001, "epoch": 1024} {"train_loss": -21.483901977539062, "global_step": 85002, "epoch": 1024} {"train_loss": -21.327497482299805, "global_step": 85003, "epoch": 1024} {"train_loss": -21.209646224975586, "global_step": 85004, "epoch": 1024} {"train_loss": -21.320920944213867, "global_step": 85005, "epoch": 1024} {"train_loss": -21.362518310546875, "global_step": 85006, "epoch": 1024} {"train_loss": -21.481998443603516, "global_step": 85007, "epoch": 1024} {"train_loss": -21.420673370361328, "global_step": 85008, "epoch": 1024} {"train_loss": -21.52669906616211, "global_step": 85009, "epoch": 1024} {"train_loss": -21.434104919433594, "global_step": 85010, "epoch": 1024} {"train_loss": -21.698455810546875, "global_step": 85011, "epoch": 1024} {"train_loss": -21.313074111938477, "global_step": 85012, "epoch": 1024} {"train_loss": -21.524707794189453, "global_step": 85013, "epoch": 1024} {"train_loss": -21.495681762695312, "global_step": 85014, "epoch": 1024} {"train_loss": -21.18929672241211, "global_step": 85015, "epoch": 1024} {"train_loss": -21.370037078857422, "global_step": 85016, "epoch": 1024} {"train_loss": -21.14431381225586, "global_step": 85017, "epoch": 1024} {"train_loss": -21.235265731811523, "global_step": 85018, "epoch": 1024} {"train_loss": -21.312271118164062, "global_step": 85019, "epoch": 1024} {"train_loss": -21.444700241088867, "global_step": 85020, "epoch": 1024} {"train_loss": -21.742908477783203, "global_step": 85021, "epoch": 1024} {"train_loss": -21.42627716064453, "global_step": 85022, "epoch": 1024} {"train_loss": -21.750707626342773, "global_step": 85023, "epoch": 1024} {"train_loss": -21.668869018554688, "global_step": 85024, "epoch": 1024} {"train_loss": -21.398717880249023, "global_step": 85025, "epoch": 1024} {"train_loss": -21.575469970703125, "global_step": 85026, "epoch": 1024} {"train_loss": -21.291427612304688, "global_step": 85027, "epoch": 1024} {"train_loss": -21.84040641784668, "global_step": 85028, "epoch": 1024} {"train_loss": -21.479900360107422, "global_step": 85029, "epoch": 1024} {"train_loss": -21.140724182128906, "global_step": 85030, "epoch": 1024} {"train_loss": -21.18404197692871, "global_step": 85031, "epoch": 1024} {"train_loss": -21.51517105102539, "global_step": 85032, "epoch": 1024} {"train_loss": -21.51338005065918, "global_step": 85033, "epoch": 1024} {"train_loss": -21.63783073425293, "global_step": 85034, "epoch": 1024} {"train_loss": -21.431949615478516, "global_step": 85035, "epoch": 1024} {"train_loss": -21.328201293945312, "global_step": 85036, "epoch": 1024} {"train_loss": -21.84858512878418, "global_step": 85037, "epoch": 1024} {"train_loss": -21.408710479736328, "global_step": 85038, "epoch": 1024} {"train_loss": -20.962696075439453, "global_step": 85039, "epoch": 1024} {"train_loss": -21.38593864440918, "global_step": 85040, "epoch": 1024} {"train_loss": -21.424978256225586, "global_step": 85041, "epoch": 1024} {"train_loss": -21.5737361907959, "global_step": 85042, "epoch": 1024} {"train_loss": -21.554128646850586, "global_step": 85043, "epoch": 1024} {"train_loss": -21.24354362487793, "global_step": 85044, "epoch": 1024} {"train_loss": -21.60906410217285, "global_step": 85045, "epoch": 1024} {"train_loss": -21.269346237182617, "global_step": 85046, "epoch": 1024} {"train_loss": -21.30878448486328, "global_step": 85047, "epoch": 1024} {"train_loss": -21.871023178100586, "global_step": 85048, "epoch": 1024} {"train_loss": -21.561492919921875, "global_step": 85049, "epoch": 1024} {"train_loss": -21.61079978942871, "global_step": 85050, "epoch": 1024} {"train_loss": -21.612518310546875, "global_step": 85051, "epoch": 1024} {"train_loss": -21.355066299438477, "global_step": 85052, "epoch": 1024} {"train_loss": -21.4807186126709, "global_step": 85053, "epoch": 1024} {"train_loss": -21.53554344177246, "global_step": 85054, "epoch": 1024} {"train_loss": -21.627836227416992, "global_step": 85055, "epoch": 1024} {"train_loss": -21.69944190979004, "global_step": 85056, "epoch": 1024} {"train_loss": -20.866809844970703, "global_step": 85057, "epoch": 1024} {"train_loss": -21.274564743041992, "global_step": 85058, "epoch": 1024} {"train_loss": -21.315458297729492, "global_step": 85059, "epoch": 1024} {"train_loss": -21.539472579956055, "global_step": 85060, "epoch": 1024} {"train_loss": -21.56821632385254, "global_step": 85061, "epoch": 1024} {"train_loss": -21.23190689086914, "global_step": 85062, "epoch": 1024} {"train_loss": -21.552907943725586, "global_step": 85063, "epoch": 1024} {"train_loss": -21.3148250579834, "global_step": 85064, "epoch": 1024} {"train_loss": -21.435731887817383, "global_step": 85065, "epoch": 1024} {"train_loss": -21.47307777404785, "global_step": 85066, "epoch": 1024} {"train_loss": -21.7728271484375, "global_step": 85067, "epoch": 1024} {"train_loss": -21.44581413269043, "global_step": 85068, "epoch": 1024} {"train_loss": -21.589345932006836, "global_step": 85069, "epoch": 1024} {"train_loss": -21.400020599365234, "global_step": 85070, "epoch": 1024} {"train_loss": -21.35765838623047, "global_step": 85071, "epoch": 1024} {"train_loss": -21.204116821289062, "global_step": 85072, "epoch": 1024} {"train_loss": -21.01144790649414, "global_step": 85073, "epoch": 1024} {"train_loss": -21.379109486039862, "global_step": 85074, "epoch": 1024, "val_loss": 6208711.5} {"train_loss": -20.3426456451416, "global_step": 85075, "epoch": 1025} {"train_loss": -20.995689392089844, "global_step": 85076, "epoch": 1025} {"train_loss": -20.777311325073242, "global_step": 85077, "epoch": 1025} {"train_loss": -21.089475631713867, "global_step": 85078, "epoch": 1025} {"train_loss": -21.105228424072266, "global_step": 85079, "epoch": 1025} {"train_loss": -21.144987106323242, "global_step": 85080, "epoch": 1025} {"train_loss": -21.087888717651367, "global_step": 85081, "epoch": 1025} {"train_loss": -21.05234146118164, "global_step": 85082, "epoch": 1025} {"train_loss": -21.18937110900879, "global_step": 85083, "epoch": 1025} {"train_loss": -20.966609954833984, "global_step": 85084, "epoch": 1025} {"train_loss": -21.2846736907959, "global_step": 85085, "epoch": 1025} {"train_loss": -20.98648452758789, "global_step": 85086, "epoch": 1025} {"train_loss": -21.35268783569336, "global_step": 85087, "epoch": 1025} {"train_loss": -21.29375648498535, "global_step": 85088, "epoch": 1025} {"train_loss": -21.113882064819336, "global_step": 85089, "epoch": 1025} {"train_loss": -21.065521240234375, "global_step": 85090, "epoch": 1025} {"train_loss": -21.023710250854492, "global_step": 85091, "epoch": 1025} {"train_loss": -21.494661331176758, "global_step": 85092, "epoch": 1025} {"train_loss": -21.313480377197266, "global_step": 85093, "epoch": 1025} {"train_loss": -21.212568283081055, "global_step": 85094, "epoch": 1025} {"train_loss": -21.362060546875, "global_step": 85095, "epoch": 1025} {"train_loss": -21.150598526000977, "global_step": 85096, "epoch": 1025} {"train_loss": -21.559614181518555, "global_step": 85097, "epoch": 1025} {"train_loss": -21.287580490112305, "global_step": 85098, "epoch": 1025} {"train_loss": -21.354084014892578, "global_step": 85099, "epoch": 1025} {"train_loss": -21.39689064025879, "global_step": 85100, "epoch": 1025} {"train_loss": -21.1997127532959, "global_step": 85101, "epoch": 1025} {"train_loss": -21.306730270385742, "global_step": 85102, "epoch": 1025} {"train_loss": -21.34249496459961, "global_step": 85103, "epoch": 1025} {"train_loss": -21.53632354736328, "global_step": 85104, "epoch": 1025} {"train_loss": -21.4542293548584, "global_step": 85105, "epoch": 1025} {"train_loss": -21.407562255859375, "global_step": 85106, "epoch": 1025} {"train_loss": -21.422515869140625, "global_step": 85107, "epoch": 1025} {"train_loss": -21.19500160217285, "global_step": 85108, "epoch": 1025} {"train_loss": -21.46015739440918, "global_step": 85109, "epoch": 1025} {"train_loss": -21.337881088256836, "global_step": 85110, "epoch": 1025} {"train_loss": -21.31831169128418, "global_step": 85111, "epoch": 1025} {"train_loss": -21.520761489868164, "global_step": 85112, "epoch": 1025} {"train_loss": -21.451704025268555, "global_step": 85113, "epoch": 1025} {"train_loss": -21.399311065673828, "global_step": 85114, "epoch": 1025} {"train_loss": -21.874876022338867, "global_step": 85115, "epoch": 1025} {"train_loss": -21.693376541137695, "global_step": 85116, "epoch": 1025} {"train_loss": -21.46732521057129, "global_step": 85117, "epoch": 1025} {"train_loss": -21.296852111816406, "global_step": 85118, "epoch": 1025} {"train_loss": -21.32791519165039, "global_step": 85119, "epoch": 1025} {"train_loss": -21.3404598236084, "global_step": 85120, "epoch": 1025} {"train_loss": -21.32938575744629, "global_step": 85121, "epoch": 1025} {"train_loss": -21.403705596923828, "global_step": 85122, "epoch": 1025} {"train_loss": -21.23386573791504, "global_step": 85123, "epoch": 1025} {"train_loss": -21.575969696044922, "global_step": 85124, "epoch": 1025} {"train_loss": -21.2379207611084, "global_step": 85125, "epoch": 1025} {"train_loss": -21.5604305267334, "global_step": 85126, "epoch": 1025} {"train_loss": -21.575145721435547, "global_step": 85127, "epoch": 1025} {"train_loss": -21.552837371826172, "global_step": 85128, "epoch": 1025} {"train_loss": -21.51701545715332, "global_step": 85129, "epoch": 1025} {"train_loss": -20.83717918395996, "global_step": 85130, "epoch": 1025} {"train_loss": -21.989126205444336, "global_step": 85131, "epoch": 1025} {"train_loss": -21.5860538482666, "global_step": 85132, "epoch": 1025} {"train_loss": -21.34166717529297, "global_step": 85133, "epoch": 1025} {"train_loss": -21.317712783813477, "global_step": 85134, "epoch": 1025} {"train_loss": -21.215137481689453, "global_step": 85135, "epoch": 1025} {"train_loss": -21.605628967285156, "global_step": 85136, "epoch": 1025} {"train_loss": -21.403366088867188, "global_step": 85137, "epoch": 1025} {"train_loss": -21.43342399597168, "global_step": 85138, "epoch": 1025} {"train_loss": -21.454444885253906, "global_step": 85139, "epoch": 1025} {"train_loss": -21.577964782714844, "global_step": 85140, "epoch": 1025} {"train_loss": -21.375446319580078, "global_step": 85141, "epoch": 1025} {"train_loss": -21.64410400390625, "global_step": 85142, "epoch": 1025} {"train_loss": -21.328369140625, "global_step": 85143, "epoch": 1025} {"train_loss": -21.48459815979004, "global_step": 85144, "epoch": 1025} {"train_loss": -21.445234298706055, "global_step": 85145, "epoch": 1025} {"train_loss": -21.36244773864746, "global_step": 85146, "epoch": 1025} {"train_loss": -21.444700241088867, "global_step": 85147, "epoch": 1025} {"train_loss": -21.204418182373047, "global_step": 85148, "epoch": 1025} {"train_loss": -22.103378295898438, "global_step": 85149, "epoch": 1025} {"train_loss": -21.55348014831543, "global_step": 85150, "epoch": 1025} {"train_loss": -21.208698272705078, "global_step": 85151, "epoch": 1025} {"train_loss": -21.562864303588867, "global_step": 85152, "epoch": 1025} {"train_loss": -21.3294734954834, "global_step": 85153, "epoch": 1025} {"train_loss": -21.677034378051758, "global_step": 85154, "epoch": 1025} {"train_loss": -21.507675170898438, "global_step": 85155, "epoch": 1025} {"train_loss": -21.244199752807617, "global_step": 85156, "epoch": 1025} {"train_loss": -21.358260901577502, "global_step": 85157, "epoch": 1025, "val_loss": 5964352.5} {"train_loss": -20.94888687133789, "global_step": 85158, "epoch": 1026} {"train_loss": -21.349512100219727, "global_step": 85159, "epoch": 1026} {"train_loss": -21.475988388061523, "global_step": 85160, "epoch": 1026} {"train_loss": -21.038053512573242, "global_step": 85161, "epoch": 1026} {"train_loss": -21.067615509033203, "global_step": 85162, "epoch": 1026} {"train_loss": -21.09173011779785, "global_step": 85163, "epoch": 1026} {"train_loss": -20.69632911682129, "global_step": 85164, "epoch": 1026} {"train_loss": -21.37636375427246, "global_step": 85165, "epoch": 1026} {"train_loss": -20.750173568725586, "global_step": 85166, "epoch": 1026} {"train_loss": -21.18342399597168, "global_step": 85167, "epoch": 1026} {"train_loss": -20.88775634765625, "global_step": 85168, "epoch": 1026} {"train_loss": -21.740663528442383, "global_step": 85169, "epoch": 1026} {"train_loss": -20.99295425415039, "global_step": 85170, "epoch": 1026} {"train_loss": -21.404369354248047, "global_step": 85171, "epoch": 1026} {"train_loss": -21.456811904907227, "global_step": 85172, "epoch": 1026} {"train_loss": -21.139541625976562, "global_step": 85173, "epoch": 1026} {"train_loss": -21.099695205688477, "global_step": 85174, "epoch": 1026} {"train_loss": -21.388273239135742, "global_step": 85175, "epoch": 1026} {"train_loss": -21.082347869873047, "global_step": 85176, "epoch": 1026} {"train_loss": -21.173620223999023, "global_step": 85177, "epoch": 1026} {"train_loss": -21.57257080078125, "global_step": 85178, "epoch": 1026} {"train_loss": -21.233463287353516, "global_step": 85179, "epoch": 1026} {"train_loss": -21.565176010131836, "global_step": 85180, "epoch": 1026} {"train_loss": -21.46274757385254, "global_step": 85181, "epoch": 1026} {"train_loss": -21.16974639892578, "global_step": 85182, "epoch": 1026} {"train_loss": -21.490934371948242, "global_step": 85183, "epoch": 1026} {"train_loss": -20.9898624420166, "global_step": 85184, "epoch": 1026} {"train_loss": -21.23189926147461, "global_step": 85185, "epoch": 1026} {"train_loss": -21.5600643157959, "global_step": 85186, "epoch": 1026} {"train_loss": -21.41273307800293, "global_step": 85187, "epoch": 1026} {"train_loss": -21.382246017456055, "global_step": 85188, "epoch": 1026} {"train_loss": -21.2518253326416, "global_step": 85189, "epoch": 1026} {"train_loss": -21.116117477416992, "global_step": 85190, "epoch": 1026} {"train_loss": -21.742063522338867, "global_step": 85191, "epoch": 1026} {"train_loss": -21.19732093811035, "global_step": 85192, "epoch": 1026} {"train_loss": -21.258028030395508, "global_step": 85193, "epoch": 1026} {"train_loss": -21.2927303314209, "global_step": 85194, "epoch": 1026} {"train_loss": -21.218616485595703, "global_step": 85195, "epoch": 1026} {"train_loss": -21.447702407836914, "global_step": 85196, "epoch": 1026} {"train_loss": -21.381216049194336, "global_step": 85197, "epoch": 1026} {"train_loss": -21.540952682495117, "global_step": 85198, "epoch": 1026} {"train_loss": -21.518543243408203, "global_step": 85199, "epoch": 1026} {"train_loss": -21.705097198486328, "global_step": 85200, "epoch": 1026} {"train_loss": -21.06797218322754, "global_step": 85201, "epoch": 1026} {"train_loss": -21.50503921508789, "global_step": 85202, "epoch": 1026} {"train_loss": -21.194753646850586, "global_step": 85203, "epoch": 1026} {"train_loss": -20.879419326782227, "global_step": 85204, "epoch": 1026} {"train_loss": -21.393827438354492, "global_step": 85205, "epoch": 1026} {"train_loss": -21.1431884765625, "global_step": 85206, "epoch": 1026} {"train_loss": -21.514514923095703, "global_step": 85207, "epoch": 1026} {"train_loss": -21.252304077148438, "global_step": 85208, "epoch": 1026} {"train_loss": -21.334362030029297, "global_step": 85209, "epoch": 1026} {"train_loss": -21.615886688232422, "global_step": 85210, "epoch": 1026} {"train_loss": -21.474374771118164, "global_step": 85211, "epoch": 1026} {"train_loss": -21.328956604003906, "global_step": 85212, "epoch": 1026} {"train_loss": -21.457887649536133, "global_step": 85213, "epoch": 1026} {"train_loss": -21.328506469726562, "global_step": 85214, "epoch": 1026} {"train_loss": -21.212081909179688, "global_step": 85215, "epoch": 1026} {"train_loss": -21.527929306030273, "global_step": 85216, "epoch": 1026} {"train_loss": -21.113813400268555, "global_step": 85217, "epoch": 1026} {"train_loss": -21.605098724365234, "global_step": 85218, "epoch": 1026} {"train_loss": -21.479351043701172, "global_step": 85219, "epoch": 1026} {"train_loss": -21.317441940307617, "global_step": 85220, "epoch": 1026} {"train_loss": -21.66814613342285, "global_step": 85221, "epoch": 1026} {"train_loss": -20.916553497314453, "global_step": 85222, "epoch": 1026} {"train_loss": -21.778409957885742, "global_step": 85223, "epoch": 1026} {"train_loss": -21.519254684448242, "global_step": 85224, "epoch": 1026} {"train_loss": -21.265989303588867, "global_step": 85225, "epoch": 1026} {"train_loss": -21.360801696777344, "global_step": 85226, "epoch": 1026} {"train_loss": -21.478702545166016, "global_step": 85227, "epoch": 1026} {"train_loss": -21.464479446411133, "global_step": 85228, "epoch": 1026} {"train_loss": -21.16876792907715, "global_step": 85229, "epoch": 1026} {"train_loss": -21.56113052368164, "global_step": 85230, "epoch": 1026} {"train_loss": -21.64070701599121, "global_step": 85231, "epoch": 1026} {"train_loss": -21.31678009033203, "global_step": 85232, "epoch": 1026} {"train_loss": -21.34749412536621, "global_step": 85233, "epoch": 1026} {"train_loss": -21.398014068603516, "global_step": 85234, "epoch": 1026} {"train_loss": -21.635746002197266, "global_step": 85235, "epoch": 1026} {"train_loss": -21.450355529785156, "global_step": 85236, "epoch": 1026} {"train_loss": -21.261272430419922, "global_step": 85237, "epoch": 1026} {"train_loss": -21.32065200805664, "global_step": 85238, "epoch": 1026} {"train_loss": -21.403610229492188, "global_step": 85239, "epoch": 1026} {"train_loss": -21.343242966985127, "global_step": 85240, "epoch": 1026, "val_loss": 6057248.5} {"train_loss": -21.145095825195312, "global_step": 85241, "epoch": 1027} {"train_loss": -20.940378189086914, "global_step": 85242, "epoch": 1027} {"train_loss": -21.121732711791992, "global_step": 85243, "epoch": 1027} {"train_loss": -21.065542221069336, "global_step": 85244, "epoch": 1027} {"train_loss": -21.35438346862793, "global_step": 85245, "epoch": 1027} {"train_loss": -21.28575325012207, "global_step": 85246, "epoch": 1027} {"train_loss": -21.106664657592773, "global_step": 85247, "epoch": 1027} {"train_loss": -21.385051727294922, "global_step": 85248, "epoch": 1027} {"train_loss": -21.23404312133789, "global_step": 85249, "epoch": 1027} {"train_loss": -21.126073837280273, "global_step": 85250, "epoch": 1027} {"train_loss": -21.154512405395508, "global_step": 85251, "epoch": 1027} {"train_loss": -21.398405075073242, "global_step": 85252, "epoch": 1027} {"train_loss": -21.47649383544922, "global_step": 85253, "epoch": 1027} {"train_loss": -21.157175064086914, "global_step": 85254, "epoch": 1027} {"train_loss": -21.312963485717773, "global_step": 85255, "epoch": 1027} {"train_loss": -21.443418502807617, "global_step": 85256, "epoch": 1027} {"train_loss": -21.29663848876953, "global_step": 85257, "epoch": 1027} {"train_loss": -21.14862060546875, "global_step": 85258, "epoch": 1027} {"train_loss": -21.383832931518555, "global_step": 85259, "epoch": 1027} {"train_loss": -21.26258087158203, "global_step": 85260, "epoch": 1027} {"train_loss": -21.375064849853516, "global_step": 85261, "epoch": 1027} {"train_loss": -21.260578155517578, "global_step": 85262, "epoch": 1027} {"train_loss": -21.13782501220703, "global_step": 85263, "epoch": 1027} {"train_loss": -21.459888458251953, "global_step": 85264, "epoch": 1027} {"train_loss": -21.28704261779785, "global_step": 85265, "epoch": 1027} {"train_loss": -21.32823944091797, "global_step": 85266, "epoch": 1027} {"train_loss": -21.34119987487793, "global_step": 85267, "epoch": 1027} {"train_loss": -21.6234188079834, "global_step": 85268, "epoch": 1027} {"train_loss": -21.140348434448242, "global_step": 85269, "epoch": 1027} {"train_loss": -21.100505828857422, "global_step": 85270, "epoch": 1027} {"train_loss": -21.70500373840332, "global_step": 85271, "epoch": 1027} {"train_loss": -21.041419982910156, "global_step": 85272, "epoch": 1027} {"train_loss": -20.88676643371582, "global_step": 85273, "epoch": 1027} {"train_loss": -21.154300689697266, "global_step": 85274, "epoch": 1027} {"train_loss": -21.220428466796875, "global_step": 85275, "epoch": 1027} {"train_loss": -21.884862899780273, "global_step": 85276, "epoch": 1027} {"train_loss": -21.1243839263916, "global_step": 85277, "epoch": 1027} {"train_loss": -21.26019859313965, "global_step": 85278, "epoch": 1027} {"train_loss": -21.347471237182617, "global_step": 85279, "epoch": 1027} {"train_loss": -21.257474899291992, "global_step": 85280, "epoch": 1027} {"train_loss": -21.119863510131836, "global_step": 85281, "epoch": 1027} {"train_loss": -21.010610580444336, "global_step": 85282, "epoch": 1027} {"train_loss": -21.0085391998291, "global_step": 85283, "epoch": 1027} {"train_loss": -21.2683162689209, "global_step": 85284, "epoch": 1027} {"train_loss": -21.34730339050293, "global_step": 85285, "epoch": 1027} {"train_loss": -21.452028274536133, "global_step": 85286, "epoch": 1027} {"train_loss": -21.47612953186035, "global_step": 85287, "epoch": 1027} {"train_loss": -21.265790939331055, "global_step": 85288, "epoch": 1027} {"train_loss": -21.19314956665039, "global_step": 85289, "epoch": 1027} {"train_loss": -21.027313232421875, "global_step": 85290, "epoch": 1027} {"train_loss": -21.407663345336914, "global_step": 85291, "epoch": 1027} {"train_loss": -21.82378578186035, "global_step": 85292, "epoch": 1027} {"train_loss": -21.628238677978516, "global_step": 85293, "epoch": 1027} {"train_loss": -21.628299713134766, "global_step": 85294, "epoch": 1027} {"train_loss": -21.301328659057617, "global_step": 85295, "epoch": 1027} {"train_loss": -21.529653549194336, "global_step": 85296, "epoch": 1027} {"train_loss": -21.351179122924805, "global_step": 85297, "epoch": 1027} {"train_loss": -21.58491325378418, "global_step": 85298, "epoch": 1027} {"train_loss": -21.634733200073242, "global_step": 85299, "epoch": 1027} {"train_loss": -21.23868751525879, "global_step": 85300, "epoch": 1027} {"train_loss": -21.298583984375, "global_step": 85301, "epoch": 1027} {"train_loss": -21.442363739013672, "global_step": 85302, "epoch": 1027} {"train_loss": -21.660797119140625, "global_step": 85303, "epoch": 1027} {"train_loss": -21.29844093322754, "global_step": 85304, "epoch": 1027} {"train_loss": -21.63154411315918, "global_step": 85305, "epoch": 1027} {"train_loss": -21.60272789001465, "global_step": 85306, "epoch": 1027} {"train_loss": -21.21685218811035, "global_step": 85307, "epoch": 1027} {"train_loss": -21.46381187438965, "global_step": 85308, "epoch": 1027} {"train_loss": -21.41555404663086, "global_step": 85309, "epoch": 1027} {"train_loss": -21.65464210510254, "global_step": 85310, "epoch": 1027} {"train_loss": -21.760395050048828, "global_step": 85311, "epoch": 1027} {"train_loss": -21.839094161987305, "global_step": 85312, "epoch": 1027} {"train_loss": -21.503767013549805, "global_step": 85313, "epoch": 1027} {"train_loss": -21.43525505065918, "global_step": 85314, "epoch": 1027} {"train_loss": -21.15996742248535, "global_step": 85315, "epoch": 1027} {"train_loss": -21.51934814453125, "global_step": 85316, "epoch": 1027} {"train_loss": -21.162199020385742, "global_step": 85317, "epoch": 1027} {"train_loss": -21.429691314697266, "global_step": 85318, "epoch": 1027} {"train_loss": -21.341495513916016, "global_step": 85319, "epoch": 1027} {"train_loss": -21.357702255249023, "global_step": 85320, "epoch": 1027} {"train_loss": -21.291793823242188, "global_step": 85321, "epoch": 1027} {"train_loss": -21.464099884033203, "global_step": 85322, "epoch": 1027} {"train_loss": -21.332369425210608, "global_step": 85323, "epoch": 1027, "val_loss": 6119300.0} {"train_loss": -21.210113525390625, "global_step": 85324, "epoch": 1028} {"train_loss": -20.966943740844727, "global_step": 85325, "epoch": 1028} {"train_loss": -21.05864906311035, "global_step": 85326, "epoch": 1028} {"train_loss": -21.474355697631836, "global_step": 85327, "epoch": 1028} {"train_loss": -20.9628963470459, "global_step": 85328, "epoch": 1028} {"train_loss": -21.287160873413086, "global_step": 85329, "epoch": 1028} {"train_loss": -21.12932586669922, "global_step": 85330, "epoch": 1028} {"train_loss": -21.103483200073242, "global_step": 85331, "epoch": 1028} {"train_loss": -21.28166961669922, "global_step": 85332, "epoch": 1028} {"train_loss": -21.003883361816406, "global_step": 85333, "epoch": 1028} {"train_loss": -21.521575927734375, "global_step": 85334, "epoch": 1028} {"train_loss": -20.759923934936523, "global_step": 85335, "epoch": 1028} {"train_loss": -21.19037437438965, "global_step": 85336, "epoch": 1028} {"train_loss": -21.013511657714844, "global_step": 85337, "epoch": 1028} {"train_loss": -21.26275634765625, "global_step": 85338, "epoch": 1028} {"train_loss": -21.34199333190918, "global_step": 85339, "epoch": 1028} {"train_loss": -21.733762741088867, "global_step": 85340, "epoch": 1028} {"train_loss": -21.41779136657715, "global_step": 85341, "epoch": 1028} {"train_loss": -21.3343505859375, "global_step": 85342, "epoch": 1028} {"train_loss": -21.408498764038086, "global_step": 85343, "epoch": 1028} {"train_loss": -21.42893409729004, "global_step": 85344, "epoch": 1028} {"train_loss": -21.431970596313477, "global_step": 85345, "epoch": 1028} {"train_loss": -21.205366134643555, "global_step": 85346, "epoch": 1028} {"train_loss": -21.358510971069336, "global_step": 85347, "epoch": 1028} {"train_loss": -21.655046463012695, "global_step": 85348, "epoch": 1028} {"train_loss": -21.335952758789062, "global_step": 85349, "epoch": 1028} {"train_loss": -21.52111053466797, "global_step": 85350, "epoch": 1028} {"train_loss": -21.958852767944336, "global_step": 85351, "epoch": 1028} {"train_loss": -21.498395919799805, "global_step": 85352, "epoch": 1028} {"train_loss": -21.530744552612305, "global_step": 85353, "epoch": 1028} {"train_loss": -21.60003662109375, "global_step": 85354, "epoch": 1028} {"train_loss": -21.602445602416992, "global_step": 85355, "epoch": 1028} {"train_loss": -21.26328468322754, "global_step": 85356, "epoch": 1028} {"train_loss": -21.670124053955078, "global_step": 85357, "epoch": 1028} {"train_loss": -21.530752182006836, "global_step": 85358, "epoch": 1028} {"train_loss": -21.636089324951172, "global_step": 85359, "epoch": 1028} {"train_loss": -21.179487228393555, "global_step": 85360, "epoch": 1028} {"train_loss": -21.12663459777832, "global_step": 85361, "epoch": 1028} {"train_loss": -21.390695571899414, "global_step": 85362, "epoch": 1028} {"train_loss": -21.607105255126953, "global_step": 85363, "epoch": 1028} {"train_loss": -20.95332145690918, "global_step": 85364, "epoch": 1028} {"train_loss": -21.368478775024414, "global_step": 85365, "epoch": 1028} {"train_loss": -21.810741424560547, "global_step": 85366, "epoch": 1028} {"train_loss": -21.224414825439453, "global_step": 85367, "epoch": 1028} {"train_loss": -21.572463989257812, "global_step": 85368, "epoch": 1028} {"train_loss": -21.66423225402832, "global_step": 85369, "epoch": 1028} {"train_loss": -21.59820556640625, "global_step": 85370, "epoch": 1028} {"train_loss": -21.651220321655273, "global_step": 85371, "epoch": 1028} {"train_loss": -21.648969650268555, "global_step": 85372, "epoch": 1028} {"train_loss": -21.321828842163086, "global_step": 85373, "epoch": 1028} {"train_loss": -21.7484130859375, "global_step": 85374, "epoch": 1028} {"train_loss": -21.286670684814453, "global_step": 85375, "epoch": 1028} {"train_loss": -21.56442642211914, "global_step": 85376, "epoch": 1028} {"train_loss": -21.136009216308594, "global_step": 85377, "epoch": 1028} {"train_loss": -21.442520141601562, "global_step": 85378, "epoch": 1028} {"train_loss": -21.57133674621582, "global_step": 85379, "epoch": 1028} {"train_loss": -21.27379608154297, "global_step": 85380, "epoch": 1028} {"train_loss": -21.813438415527344, "global_step": 85381, "epoch": 1028} {"train_loss": -21.257421493530273, "global_step": 85382, "epoch": 1028} {"train_loss": -21.69748878479004, "global_step": 85383, "epoch": 1028} {"train_loss": -21.741012573242188, "global_step": 85384, "epoch": 1028} {"train_loss": -21.09769630432129, "global_step": 85385, "epoch": 1028} {"train_loss": -21.797439575195312, "global_step": 85386, "epoch": 1028} {"train_loss": -21.35565757751465, "global_step": 85387, "epoch": 1028} {"train_loss": -21.255859375, "global_step": 85388, "epoch": 1028} {"train_loss": -21.366653442382812, "global_step": 85389, "epoch": 1028} {"train_loss": -21.801706314086914, "global_step": 85390, "epoch": 1028} {"train_loss": -21.285511016845703, "global_step": 85391, "epoch": 1028} {"train_loss": -21.250783920288086, "global_step": 85392, "epoch": 1028} {"train_loss": -21.466814041137695, "global_step": 85393, "epoch": 1028} {"train_loss": -21.467071533203125, "global_step": 85394, "epoch": 1028} {"train_loss": -21.546274185180664, "global_step": 85395, "epoch": 1028} {"train_loss": -21.469928741455078, "global_step": 85396, "epoch": 1028} {"train_loss": -21.431472778320312, "global_step": 85397, "epoch": 1028} {"train_loss": -21.062393188476562, "global_step": 85398, "epoch": 1028} {"train_loss": -21.60968780517578, "global_step": 85399, "epoch": 1028} {"train_loss": -21.27685546875, "global_step": 85400, "epoch": 1028} {"train_loss": -21.49349021911621, "global_step": 85401, "epoch": 1028} {"train_loss": -21.52735710144043, "global_step": 85402, "epoch": 1028} {"train_loss": -21.554136276245117, "global_step": 85403, "epoch": 1028} {"train_loss": -21.676305770874023, "global_step": 85404, "epoch": 1028} {"train_loss": -21.629980087280273, "global_step": 85405, "epoch": 1028} {"train_loss": -21.38831685537315, "global_step": 85406, "epoch": 1028, "val_loss": 6090201.0} {"train_loss": -20.93361473083496, "global_step": 85407, "epoch": 1029} {"train_loss": -21.413921356201172, "global_step": 85408, "epoch": 1029} {"train_loss": -21.416107177734375, "global_step": 85409, "epoch": 1029} {"train_loss": -21.35325050354004, "global_step": 85410, "epoch": 1029} {"train_loss": -21.165517807006836, "global_step": 85411, "epoch": 1029} {"train_loss": -21.298553466796875, "global_step": 85412, "epoch": 1029} {"train_loss": -21.40988540649414, "global_step": 85413, "epoch": 1029} {"train_loss": -21.447690963745117, "global_step": 85414, "epoch": 1029} {"train_loss": -20.968198776245117, "global_step": 85415, "epoch": 1029} {"train_loss": -21.752805709838867, "global_step": 85416, "epoch": 1029} {"train_loss": -21.223461151123047, "global_step": 85417, "epoch": 1029} {"train_loss": -21.18781089782715, "global_step": 85418, "epoch": 1029} {"train_loss": -21.281574249267578, "global_step": 85419, "epoch": 1029} {"train_loss": -21.37446403503418, "global_step": 85420, "epoch": 1029} {"train_loss": -21.39472198486328, "global_step": 85421, "epoch": 1029} {"train_loss": -21.408681869506836, "global_step": 85422, "epoch": 1029} {"train_loss": -21.209409713745117, "global_step": 85423, "epoch": 1029} {"train_loss": -21.471046447753906, "global_step": 85424, "epoch": 1029} {"train_loss": -21.472530364990234, "global_step": 85425, "epoch": 1029} {"train_loss": -21.265897750854492, "global_step": 85426, "epoch": 1029} {"train_loss": -21.370487213134766, "global_step": 85427, "epoch": 1029} {"train_loss": -21.27005386352539, "global_step": 85428, "epoch": 1029} {"train_loss": -21.61861228942871, "global_step": 85429, "epoch": 1029} {"train_loss": -21.420394897460938, "global_step": 85430, "epoch": 1029} {"train_loss": -20.810379028320312, "global_step": 85431, "epoch": 1029} {"train_loss": -21.23480796813965, "global_step": 85432, "epoch": 1029} {"train_loss": -21.454885482788086, "global_step": 85433, "epoch": 1029} {"train_loss": -21.593780517578125, "global_step": 85434, "epoch": 1029} {"train_loss": -21.371532440185547, "global_step": 85435, "epoch": 1029} {"train_loss": -21.289113998413086, "global_step": 85436, "epoch": 1029} {"train_loss": -21.512298583984375, "global_step": 85437, "epoch": 1029} {"train_loss": -21.919782638549805, "global_step": 85438, "epoch": 1029} {"train_loss": -21.338581085205078, "global_step": 85439, "epoch": 1029} {"train_loss": -21.320798873901367, "global_step": 85440, "epoch": 1029} {"train_loss": -21.159460067749023, "global_step": 85441, "epoch": 1029} {"train_loss": -21.072494506835938, "global_step": 85442, "epoch": 1029} {"train_loss": -21.342662811279297, "global_step": 85443, "epoch": 1029} {"train_loss": -21.217588424682617, "global_step": 85444, "epoch": 1029} {"train_loss": -21.594511032104492, "global_step": 85445, "epoch": 1029} {"train_loss": -21.46540641784668, "global_step": 85446, "epoch": 1029} {"train_loss": -21.45564079284668, "global_step": 85447, "epoch": 1029} {"train_loss": -21.64352798461914, "global_step": 85448, "epoch": 1029} {"train_loss": -21.672428131103516, "global_step": 85449, "epoch": 1029} {"train_loss": -20.773563385009766, "global_step": 85450, "epoch": 1029} {"train_loss": -21.436012268066406, "global_step": 85451, "epoch": 1029} {"train_loss": -21.470006942749023, "global_step": 85452, "epoch": 1029} {"train_loss": -21.45588493347168, "global_step": 85453, "epoch": 1029} {"train_loss": -21.372514724731445, "global_step": 85454, "epoch": 1029} {"train_loss": -21.25153923034668, "global_step": 85455, "epoch": 1029} {"train_loss": -21.473621368408203, "global_step": 85456, "epoch": 1029} {"train_loss": -21.76569175720215, "global_step": 85457, "epoch": 1029} {"train_loss": -21.50672721862793, "global_step": 85458, "epoch": 1029} {"train_loss": -21.90785026550293, "global_step": 85459, "epoch": 1029} {"train_loss": -21.613317489624023, "global_step": 85460, "epoch": 1029} {"train_loss": -21.39137077331543, "global_step": 85461, "epoch": 1029} {"train_loss": -21.272336959838867, "global_step": 85462, "epoch": 1029} {"train_loss": -21.233736038208008, "global_step": 85463, "epoch": 1029} {"train_loss": -21.30832290649414, "global_step": 85464, "epoch": 1029} {"train_loss": -21.10096549987793, "global_step": 85465, "epoch": 1029} {"train_loss": -21.605457305908203, "global_step": 85466, "epoch": 1029} {"train_loss": -21.63232421875, "global_step": 85467, "epoch": 1029} {"train_loss": -21.569427490234375, "global_step": 85468, "epoch": 1029} {"train_loss": -21.181299209594727, "global_step": 85469, "epoch": 1029} {"train_loss": -21.494409561157227, "global_step": 85470, "epoch": 1029} {"train_loss": -21.543975830078125, "global_step": 85471, "epoch": 1029} {"train_loss": -20.76797866821289, "global_step": 85472, "epoch": 1029} {"train_loss": -21.440887451171875, "global_step": 85473, "epoch": 1029} {"train_loss": -21.572874069213867, "global_step": 85474, "epoch": 1029} {"train_loss": -21.193723678588867, "global_step": 85475, "epoch": 1029} {"train_loss": -21.247831344604492, "global_step": 85476, "epoch": 1029} {"train_loss": -21.531564712524414, "global_step": 85477, "epoch": 1029} {"train_loss": -21.2861385345459, "global_step": 85478, "epoch": 1029} {"train_loss": -21.45813751220703, "global_step": 85479, "epoch": 1029} {"train_loss": -21.018909454345703, "global_step": 85480, "epoch": 1029} {"train_loss": -21.298114776611328, "global_step": 85481, "epoch": 1029} {"train_loss": -21.133033752441406, "global_step": 85482, "epoch": 1029} {"train_loss": -21.01049041748047, "global_step": 85483, "epoch": 1029} {"train_loss": -21.66810417175293, "global_step": 85484, "epoch": 1029} {"train_loss": -21.56061363220215, "global_step": 85485, "epoch": 1029} {"train_loss": -21.45523452758789, "global_step": 85486, "epoch": 1029} {"train_loss": -21.266111373901367, "global_step": 85487, "epoch": 1029} {"train_loss": -21.462583541870117, "global_step": 85488, "epoch": 1029} {"train_loss": -21.360818081591503, "global_step": 85489, "epoch": 1029, "val_loss": 6044597.0} {"train_loss": -20.630971908569336, "global_step": 85490, "epoch": 1030} {"train_loss": -20.695165634155273, "global_step": 85491, "epoch": 1030} {"train_loss": -20.996845245361328, "global_step": 85492, "epoch": 1030} {"train_loss": -20.794370651245117, "global_step": 85493, "epoch": 1030} {"train_loss": -21.228849411010742, "global_step": 85494, "epoch": 1030} {"train_loss": -20.948400497436523, "global_step": 85495, "epoch": 1030} {"train_loss": -21.132715225219727, "global_step": 85496, "epoch": 1030} {"train_loss": -21.2224178314209, "global_step": 85497, "epoch": 1030} {"train_loss": -20.758941650390625, "global_step": 85498, "epoch": 1030} {"train_loss": -21.143909454345703, "global_step": 85499, "epoch": 1030} {"train_loss": -21.060094833374023, "global_step": 85500, "epoch": 1030} {"train_loss": -21.063838958740234, "global_step": 85501, "epoch": 1030} {"train_loss": -21.10675621032715, "global_step": 85502, "epoch": 1030} {"train_loss": -21.282869338989258, "global_step": 85503, "epoch": 1030} {"train_loss": -21.33180809020996, "global_step": 85504, "epoch": 1030} {"train_loss": -21.043094635009766, "global_step": 85505, "epoch": 1030} {"train_loss": -21.432178497314453, "global_step": 85506, "epoch": 1030} {"train_loss": -21.601673126220703, "global_step": 85507, "epoch": 1030} {"train_loss": -21.578828811645508, "global_step": 85508, "epoch": 1030} {"train_loss": -21.586307525634766, "global_step": 85509, "epoch": 1030} {"train_loss": -21.003095626831055, "global_step": 85510, "epoch": 1030} {"train_loss": -21.519086837768555, "global_step": 85511, "epoch": 1030} {"train_loss": -21.500761032104492, "global_step": 85512, "epoch": 1030} {"train_loss": -21.516695022583008, "global_step": 85513, "epoch": 1030} {"train_loss": -21.250228881835938, "global_step": 85514, "epoch": 1030} {"train_loss": -21.367576599121094, "global_step": 85515, "epoch": 1030} {"train_loss": -21.572519302368164, "global_step": 85516, "epoch": 1030} {"train_loss": -21.32593536376953, "global_step": 85517, "epoch": 1030} {"train_loss": -21.381664276123047, "global_step": 85518, "epoch": 1030} {"train_loss": -21.4351749420166, "global_step": 85519, "epoch": 1030} {"train_loss": -21.401901245117188, "global_step": 85520, "epoch": 1030} {"train_loss": -21.370807647705078, "global_step": 85521, "epoch": 1030} {"train_loss": -21.480117797851562, "global_step": 85522, "epoch": 1030} {"train_loss": -21.0766658782959, "global_step": 85523, "epoch": 1030} {"train_loss": -21.45177459716797, "global_step": 85524, "epoch": 1030} {"train_loss": -21.245882034301758, "global_step": 85525, "epoch": 1030} {"train_loss": -21.553510665893555, "global_step": 85526, "epoch": 1030} {"train_loss": -21.53523063659668, "global_step": 85527, "epoch": 1030} {"train_loss": -20.964908599853516, "global_step": 85528, "epoch": 1030} {"train_loss": -21.372716903686523, "global_step": 85529, "epoch": 1030} {"train_loss": -21.55219078063965, "global_step": 85530, "epoch": 1030} {"train_loss": -21.4873046875, "global_step": 85531, "epoch": 1030} {"train_loss": -21.315824508666992, "global_step": 85532, "epoch": 1030} {"train_loss": -21.198440551757812, "global_step": 85533, "epoch": 1030} {"train_loss": -21.290754318237305, "global_step": 85534, "epoch": 1030} {"train_loss": -21.41672706604004, "global_step": 85535, "epoch": 1030} {"train_loss": -21.535884857177734, "global_step": 85536, "epoch": 1030} {"train_loss": -21.73865509033203, "global_step": 85537, "epoch": 1030} {"train_loss": -21.54286766052246, "global_step": 85538, "epoch": 1030} {"train_loss": -21.2833309173584, "global_step": 85539, "epoch": 1030} {"train_loss": -21.092273712158203, "global_step": 85540, "epoch": 1030} {"train_loss": -21.65769386291504, "global_step": 85541, "epoch": 1030} {"train_loss": -21.62678337097168, "global_step": 85542, "epoch": 1030} {"train_loss": -21.302831649780273, "global_step": 85543, "epoch": 1030} {"train_loss": -21.101150512695312, "global_step": 85544, "epoch": 1030} {"train_loss": -21.77876853942871, "global_step": 85545, "epoch": 1030} {"train_loss": -21.692218780517578, "global_step": 85546, "epoch": 1030} {"train_loss": -21.878360748291016, "global_step": 85547, "epoch": 1030} {"train_loss": -21.559738159179688, "global_step": 85548, "epoch": 1030} {"train_loss": -21.202268600463867, "global_step": 85549, "epoch": 1030} {"train_loss": -21.923622131347656, "global_step": 85550, "epoch": 1030} {"train_loss": -21.576284408569336, "global_step": 85551, "epoch": 1030} {"train_loss": -21.257848739624023, "global_step": 85552, "epoch": 1030} {"train_loss": -21.783727645874023, "global_step": 85553, "epoch": 1030} {"train_loss": -21.833084106445312, "global_step": 85554, "epoch": 1030} {"train_loss": -21.298187255859375, "global_step": 85555, "epoch": 1030} {"train_loss": -21.752321243286133, "global_step": 85556, "epoch": 1030} {"train_loss": -21.499738693237305, "global_step": 85557, "epoch": 1030} {"train_loss": -21.30548667907715, "global_step": 85558, "epoch": 1030} {"train_loss": -21.472116470336914, "global_step": 85559, "epoch": 1030} {"train_loss": -21.705408096313477, "global_step": 85560, "epoch": 1030} {"train_loss": -21.46670913696289, "global_step": 85561, "epoch": 1030} {"train_loss": -21.126602172851562, "global_step": 85562, "epoch": 1030} {"train_loss": -21.803861618041992, "global_step": 85563, "epoch": 1030} {"train_loss": -21.35573387145996, "global_step": 85564, "epoch": 1030} {"train_loss": -21.93547248840332, "global_step": 85565, "epoch": 1030} {"train_loss": -21.68120002746582, "global_step": 85566, "epoch": 1030} {"train_loss": -21.778995513916016, "global_step": 85567, "epoch": 1030} {"train_loss": -21.361799240112305, "global_step": 85568, "epoch": 1030} {"train_loss": -21.443716049194336, "global_step": 85569, "epoch": 1030} {"train_loss": -20.956315994262695, "global_step": 85570, "epoch": 1030} {"train_loss": -21.28367042541504, "global_step": 85571, "epoch": 1030} {"train_loss": -21.384012199309936, "global_step": 85572, "epoch": 1030, "val_loss": 6176393.0} {"train_loss": -21.435026168823242, "global_step": 85573, "epoch": 1031} {"train_loss": -21.582639694213867, "global_step": 85574, "epoch": 1031} {"train_loss": -21.21336555480957, "global_step": 85575, "epoch": 1031} {"train_loss": -21.60609245300293, "global_step": 85576, "epoch": 1031} {"train_loss": -20.878944396972656, "global_step": 85577, "epoch": 1031} {"train_loss": -21.418912887573242, "global_step": 85578, "epoch": 1031} {"train_loss": -21.289968490600586, "global_step": 85579, "epoch": 1031} {"train_loss": -20.87408447265625, "global_step": 85580, "epoch": 1031} {"train_loss": -21.074615478515625, "global_step": 85581, "epoch": 1031} {"train_loss": -21.270906448364258, "global_step": 85582, "epoch": 1031} {"train_loss": -21.544111251831055, "global_step": 85583, "epoch": 1031} {"train_loss": -21.277700424194336, "global_step": 85584, "epoch": 1031} {"train_loss": -21.63776969909668, "global_step": 85585, "epoch": 1031} {"train_loss": -20.90264129638672, "global_step": 85586, "epoch": 1031} {"train_loss": -21.501117706298828, "global_step": 85587, "epoch": 1031} {"train_loss": -21.051910400390625, "global_step": 85588, "epoch": 1031} {"train_loss": -21.279386520385742, "global_step": 85589, "epoch": 1031} {"train_loss": -21.63348388671875, "global_step": 85590, "epoch": 1031} {"train_loss": -21.43273162841797, "global_step": 85591, "epoch": 1031} {"train_loss": -21.10395050048828, "global_step": 85592, "epoch": 1031} {"train_loss": -21.362268447875977, "global_step": 85593, "epoch": 1031} {"train_loss": -21.861404418945312, "global_step": 85594, "epoch": 1031} {"train_loss": -21.361499786376953, "global_step": 85595, "epoch": 1031} {"train_loss": -21.388967514038086, "global_step": 85596, "epoch": 1031} {"train_loss": -21.16583824157715, "global_step": 85597, "epoch": 1031} {"train_loss": -21.480087280273438, "global_step": 85598, "epoch": 1031} {"train_loss": -21.31993293762207, "global_step": 85599, "epoch": 1031} {"train_loss": -21.5094051361084, "global_step": 85600, "epoch": 1031} {"train_loss": -21.526397705078125, "global_step": 85601, "epoch": 1031} {"train_loss": -21.54193687438965, "global_step": 85602, "epoch": 1031} {"train_loss": -21.287504196166992, "global_step": 85603, "epoch": 1031} {"train_loss": -21.28611183166504, "global_step": 85604, "epoch": 1031} {"train_loss": -21.138334274291992, "global_step": 85605, "epoch": 1031} {"train_loss": -21.050830841064453, "global_step": 85606, "epoch": 1031} {"train_loss": -21.559396743774414, "global_step": 85607, "epoch": 1031} {"train_loss": -21.252525329589844, "global_step": 85608, "epoch": 1031} {"train_loss": -21.85321617126465, "global_step": 85609, "epoch": 1031} {"train_loss": -20.988534927368164, "global_step": 85610, "epoch": 1031} {"train_loss": -21.343551635742188, "global_step": 85611, "epoch": 1031} {"train_loss": -21.561674118041992, "global_step": 85612, "epoch": 1031} {"train_loss": -21.555103302001953, "global_step": 85613, "epoch": 1031} {"train_loss": -21.59016990661621, "global_step": 85614, "epoch": 1031} {"train_loss": -21.4761905670166, "global_step": 85615, "epoch": 1031} {"train_loss": -21.562213897705078, "global_step": 85616, "epoch": 1031} {"train_loss": -21.432308197021484, "global_step": 85617, "epoch": 1031} {"train_loss": -21.44999122619629, "global_step": 85618, "epoch": 1031} {"train_loss": -21.895830154418945, "global_step": 85619, "epoch": 1031} {"train_loss": -21.410266876220703, "global_step": 85620, "epoch": 1031} {"train_loss": -21.469684600830078, "global_step": 85621, "epoch": 1031} {"train_loss": -21.34343910217285, "global_step": 85622, "epoch": 1031} {"train_loss": -21.663352966308594, "global_step": 85623, "epoch": 1031} {"train_loss": -21.381351470947266, "global_step": 85624, "epoch": 1031} {"train_loss": -21.55028533935547, "global_step": 85625, "epoch": 1031} {"train_loss": -21.62066650390625, "global_step": 85626, "epoch": 1031} {"train_loss": -21.547744750976562, "global_step": 85627, "epoch": 1031} {"train_loss": -21.106435775756836, "global_step": 85628, "epoch": 1031} {"train_loss": -21.330459594726562, "global_step": 85629, "epoch": 1031} {"train_loss": -21.266294479370117, "global_step": 85630, "epoch": 1031} {"train_loss": -21.47822380065918, "global_step": 85631, "epoch": 1031} {"train_loss": -21.739871978759766, "global_step": 85632, "epoch": 1031} {"train_loss": -21.268991470336914, "global_step": 85633, "epoch": 1031} {"train_loss": -21.606576919555664, "global_step": 85634, "epoch": 1031} {"train_loss": -21.294170379638672, "global_step": 85635, "epoch": 1031} {"train_loss": -21.341468811035156, "global_step": 85636, "epoch": 1031} {"train_loss": -20.993215560913086, "global_step": 85637, "epoch": 1031} {"train_loss": -21.519405364990234, "global_step": 85638, "epoch": 1031} {"train_loss": -21.087589263916016, "global_step": 85639, "epoch": 1031} {"train_loss": -20.98164939880371, "global_step": 85640, "epoch": 1031} {"train_loss": -21.339380264282227, "global_step": 85641, "epoch": 1031} {"train_loss": -21.597265243530273, "global_step": 85642, "epoch": 1031} {"train_loss": -21.356382369995117, "global_step": 85643, "epoch": 1031} {"train_loss": -21.441635131835938, "global_step": 85644, "epoch": 1031} {"train_loss": -21.45583724975586, "global_step": 85645, "epoch": 1031} {"train_loss": -20.934534072875977, "global_step": 85646, "epoch": 1031} {"train_loss": -21.301563262939453, "global_step": 85647, "epoch": 1031} {"train_loss": -21.500158309936523, "global_step": 85648, "epoch": 1031} {"train_loss": -21.772741317749023, "global_step": 85649, "epoch": 1031} {"train_loss": -21.692472457885742, "global_step": 85650, "epoch": 1031} {"train_loss": -21.5479736328125, "global_step": 85651, "epoch": 1031} {"train_loss": -21.142820358276367, "global_step": 85652, "epoch": 1031} {"train_loss": -21.595956802368164, "global_step": 85653, "epoch": 1031} {"train_loss": -21.1765193939209, "global_step": 85654, "epoch": 1031} {"train_loss": -21.39024778159268, "global_step": 85655, "epoch": 1031, "val_loss": 6021582.0} {"train_loss": -20.515422821044922, "global_step": 85656, "epoch": 1032} {"train_loss": -21.059354782104492, "global_step": 85657, "epoch": 1032} {"train_loss": -20.88051414489746, "global_step": 85658, "epoch": 1032} {"train_loss": -20.849790573120117, "global_step": 85659, "epoch": 1032} {"train_loss": -20.86244010925293, "global_step": 85660, "epoch": 1032} {"train_loss": -20.884431838989258, "global_step": 85661, "epoch": 1032} {"train_loss": -21.08291244506836, "global_step": 85662, "epoch": 1032} {"train_loss": -20.925098419189453, "global_step": 85663, "epoch": 1032} {"train_loss": -21.051801681518555, "global_step": 85664, "epoch": 1032} {"train_loss": -21.07747459411621, "global_step": 85665, "epoch": 1032} {"train_loss": -20.73232650756836, "global_step": 85666, "epoch": 1032} {"train_loss": -21.20249366760254, "global_step": 85667, "epoch": 1032} {"train_loss": -20.709516525268555, "global_step": 85668, "epoch": 1032} {"train_loss": -21.108787536621094, "global_step": 85669, "epoch": 1032} {"train_loss": -21.227415084838867, "global_step": 85670, "epoch": 1032} {"train_loss": -21.27034568786621, "global_step": 85671, "epoch": 1032} {"train_loss": -21.375680923461914, "global_step": 85672, "epoch": 1032} {"train_loss": -21.423660278320312, "global_step": 85673, "epoch": 1032} {"train_loss": -21.273244857788086, "global_step": 85674, "epoch": 1032} {"train_loss": -21.393503189086914, "global_step": 85675, "epoch": 1032} {"train_loss": -21.240854263305664, "global_step": 85676, "epoch": 1032} {"train_loss": -21.668136596679688, "global_step": 85677, "epoch": 1032} {"train_loss": -21.40958023071289, "global_step": 85678, "epoch": 1032} {"train_loss": -21.763879776000977, "global_step": 85679, "epoch": 1032} {"train_loss": -21.49108123779297, "global_step": 85680, "epoch": 1032} {"train_loss": -21.58228302001953, "global_step": 85681, "epoch": 1032} {"train_loss": -21.509199142456055, "global_step": 85682, "epoch": 1032} {"train_loss": -21.22892189025879, "global_step": 85683, "epoch": 1032} {"train_loss": -21.118972778320312, "global_step": 85684, "epoch": 1032} {"train_loss": -21.000701904296875, "global_step": 85685, "epoch": 1032} {"train_loss": -21.19502830505371, "global_step": 85686, "epoch": 1032} {"train_loss": -21.527021408081055, "global_step": 85687, "epoch": 1032} {"train_loss": -21.51222801208496, "global_step": 85688, "epoch": 1032} {"train_loss": -21.833995819091797, "global_step": 85689, "epoch": 1032} {"train_loss": -21.4856014251709, "global_step": 85690, "epoch": 1032} {"train_loss": -21.486452102661133, "global_step": 85691, "epoch": 1032} {"train_loss": -21.085302352905273, "global_step": 85692, "epoch": 1032} {"train_loss": -21.386764526367188, "global_step": 85693, "epoch": 1032} {"train_loss": -21.266530990600586, "global_step": 85694, "epoch": 1032} {"train_loss": -21.114845275878906, "global_step": 85695, "epoch": 1032} {"train_loss": -21.628896713256836, "global_step": 85696, "epoch": 1032} {"train_loss": -21.493444442749023, "global_step": 85697, "epoch": 1032} {"train_loss": -21.390172958374023, "global_step": 85698, "epoch": 1032} {"train_loss": -21.4765682220459, "global_step": 85699, "epoch": 1032} {"train_loss": -21.339670181274414, "global_step": 85700, "epoch": 1032} {"train_loss": -21.63852310180664, "global_step": 85701, "epoch": 1032} {"train_loss": -21.460092544555664, "global_step": 85702, "epoch": 1032} {"train_loss": -21.591411590576172, "global_step": 85703, "epoch": 1032} {"train_loss": -21.2642879486084, "global_step": 85704, "epoch": 1032} {"train_loss": -21.681913375854492, "global_step": 85705, "epoch": 1032} {"train_loss": -21.484758377075195, "global_step": 85706, "epoch": 1032} {"train_loss": -21.312528610229492, "global_step": 85707, "epoch": 1032} {"train_loss": -21.416217803955078, "global_step": 85708, "epoch": 1032} {"train_loss": -21.458236694335938, "global_step": 85709, "epoch": 1032} {"train_loss": -21.520496368408203, "global_step": 85710, "epoch": 1032} {"train_loss": -21.426172256469727, "global_step": 85711, "epoch": 1032} {"train_loss": -21.56426429748535, "global_step": 85712, "epoch": 1032} {"train_loss": -21.3823184967041, "global_step": 85713, "epoch": 1032} {"train_loss": -21.509790420532227, "global_step": 85714, "epoch": 1032} {"train_loss": -21.424772262573242, "global_step": 85715, "epoch": 1032} {"train_loss": -21.394941329956055, "global_step": 85716, "epoch": 1032} {"train_loss": -21.336042404174805, "global_step": 85717, "epoch": 1032} {"train_loss": -21.2495059967041, "global_step": 85718, "epoch": 1032} {"train_loss": -21.535659790039062, "global_step": 85719, "epoch": 1032} {"train_loss": -21.2007999420166, "global_step": 85720, "epoch": 1032} {"train_loss": -21.723928451538086, "global_step": 85721, "epoch": 1032} {"train_loss": -21.853282928466797, "global_step": 85722, "epoch": 1032} {"train_loss": -21.718732833862305, "global_step": 85723, "epoch": 1032} {"train_loss": -21.669946670532227, "global_step": 85724, "epoch": 1032} {"train_loss": -21.49445152282715, "global_step": 85725, "epoch": 1032} {"train_loss": -21.52292251586914, "global_step": 85726, "epoch": 1032} {"train_loss": -21.64532470703125, "global_step": 85727, "epoch": 1032} {"train_loss": -21.626962661743164, "global_step": 85728, "epoch": 1032} {"train_loss": -21.36746597290039, "global_step": 85729, "epoch": 1032} {"train_loss": -21.691877365112305, "global_step": 85730, "epoch": 1032} {"train_loss": -21.50473976135254, "global_step": 85731, "epoch": 1032} {"train_loss": -21.383609771728516, "global_step": 85732, "epoch": 1032} {"train_loss": -21.299163818359375, "global_step": 85733, "epoch": 1032} {"train_loss": -21.201810836791992, "global_step": 85734, "epoch": 1032} {"train_loss": -21.56850242614746, "global_step": 85735, "epoch": 1032} {"train_loss": -21.26753807067871, "global_step": 85736, "epoch": 1032} {"train_loss": -21.54636573791504, "global_step": 85737, "epoch": 1032} {"train_loss": -21.352709299110504, "global_step": 85738, "epoch": 1032, "val_loss": 5964827.0} {"train_loss": -20.36958122253418, "global_step": 85739, "epoch": 1033} {"train_loss": -20.854887008666992, "global_step": 85740, "epoch": 1033} {"train_loss": -20.847593307495117, "global_step": 85741, "epoch": 1033} {"train_loss": -20.53889274597168, "global_step": 85742, "epoch": 1033} {"train_loss": -20.206552505493164, "global_step": 85743, "epoch": 1033} {"train_loss": -20.781705856323242, "global_step": 85744, "epoch": 1033} {"train_loss": -20.859619140625, "global_step": 85745, "epoch": 1033} {"train_loss": -20.74983787536621, "global_step": 85746, "epoch": 1033} {"train_loss": -21.324756622314453, "global_step": 85747, "epoch": 1033} {"train_loss": -21.008514404296875, "global_step": 85748, "epoch": 1033} {"train_loss": -20.979408264160156, "global_step": 85749, "epoch": 1033} {"train_loss": -20.81956672668457, "global_step": 85750, "epoch": 1033} {"train_loss": -21.003238677978516, "global_step": 85751, "epoch": 1033} {"train_loss": -20.8825740814209, "global_step": 85752, "epoch": 1033} {"train_loss": -21.162460327148438, "global_step": 85753, "epoch": 1033} {"train_loss": -21.148298263549805, "global_step": 85754, "epoch": 1033} {"train_loss": -21.241609573364258, "global_step": 85755, "epoch": 1033} {"train_loss": -21.07411766052246, "global_step": 85756, "epoch": 1033} {"train_loss": -21.265256881713867, "global_step": 85757, "epoch": 1033} {"train_loss": -21.136005401611328, "global_step": 85758, "epoch": 1033} {"train_loss": -21.451766967773438, "global_step": 85759, "epoch": 1033} {"train_loss": -21.11683464050293, "global_step": 85760, "epoch": 1033} {"train_loss": -20.99028968811035, "global_step": 85761, "epoch": 1033} {"train_loss": -21.020734786987305, "global_step": 85762, "epoch": 1033} {"train_loss": -21.59480094909668, "global_step": 85763, "epoch": 1033} {"train_loss": -21.27724266052246, "global_step": 85764, "epoch": 1033} {"train_loss": -21.4601993560791, "global_step": 85765, "epoch": 1033} {"train_loss": -21.330846786499023, "global_step": 85766, "epoch": 1033} {"train_loss": -21.465681076049805, "global_step": 85767, "epoch": 1033} {"train_loss": -21.304706573486328, "global_step": 85768, "epoch": 1033} {"train_loss": -20.935636520385742, "global_step": 85769, "epoch": 1033} {"train_loss": -21.353485107421875, "global_step": 85770, "epoch": 1033} {"train_loss": -21.233381271362305, "global_step": 85771, "epoch": 1033} {"train_loss": -21.46620750427246, "global_step": 85772, "epoch": 1033} {"train_loss": -21.367021560668945, "global_step": 85773, "epoch": 1033} {"train_loss": -21.926855087280273, "global_step": 85774, "epoch": 1033} {"train_loss": -21.341176986694336, "global_step": 85775, "epoch": 1033} {"train_loss": -21.114988327026367, "global_step": 85776, "epoch": 1033} {"train_loss": -21.372568130493164, "global_step": 85777, "epoch": 1033} {"train_loss": -21.648365020751953, "global_step": 85778, "epoch": 1033} {"train_loss": -21.28443717956543, "global_step": 85779, "epoch": 1033} {"train_loss": -21.35820198059082, "global_step": 85780, "epoch": 1033} {"train_loss": -21.417003631591797, "global_step": 85781, "epoch": 1033} {"train_loss": -21.7778263092041, "global_step": 85782, "epoch": 1033} {"train_loss": -21.522069931030273, "global_step": 85783, "epoch": 1033} {"train_loss": -21.479448318481445, "global_step": 85784, "epoch": 1033} {"train_loss": -21.497838973999023, "global_step": 85785, "epoch": 1033} {"train_loss": -21.59977149963379, "global_step": 85786, "epoch": 1033} {"train_loss": -21.543193817138672, "global_step": 85787, "epoch": 1033} {"train_loss": -21.474185943603516, "global_step": 85788, "epoch": 1033} {"train_loss": -21.37421989440918, "global_step": 85789, "epoch": 1033} {"train_loss": -21.453279495239258, "global_step": 85790, "epoch": 1033} {"train_loss": -21.19846534729004, "global_step": 85791, "epoch": 1033} {"train_loss": -21.68459129333496, "global_step": 85792, "epoch": 1033} {"train_loss": -21.490493774414062, "global_step": 85793, "epoch": 1033} {"train_loss": -21.635183334350586, "global_step": 85794, "epoch": 1033} {"train_loss": -21.627111434936523, "global_step": 85795, "epoch": 1033} {"train_loss": -21.503599166870117, "global_step": 85796, "epoch": 1033} {"train_loss": -21.384775161743164, "global_step": 85797, "epoch": 1033} {"train_loss": -21.308027267456055, "global_step": 85798, "epoch": 1033} {"train_loss": -21.505828857421875, "global_step": 85799, "epoch": 1033} {"train_loss": -21.346088409423828, "global_step": 85800, "epoch": 1033} {"train_loss": -21.45670509338379, "global_step": 85801, "epoch": 1033} {"train_loss": -21.492979049682617, "global_step": 85802, "epoch": 1033} {"train_loss": -21.012466430664062, "global_step": 85803, "epoch": 1033} {"train_loss": -21.318164825439453, "global_step": 85804, "epoch": 1033} {"train_loss": -21.308025360107422, "global_step": 85805, "epoch": 1033} {"train_loss": -21.463830947875977, "global_step": 85806, "epoch": 1033} {"train_loss": -21.299448013305664, "global_step": 85807, "epoch": 1033} {"train_loss": -21.197317123413086, "global_step": 85808, "epoch": 1033} {"train_loss": -21.488561630249023, "global_step": 85809, "epoch": 1033} {"train_loss": -21.481908798217773, "global_step": 85810, "epoch": 1033} {"train_loss": -21.536863327026367, "global_step": 85811, "epoch": 1033} {"train_loss": -21.32498550415039, "global_step": 85812, "epoch": 1033} {"train_loss": -21.437047958374023, "global_step": 85813, "epoch": 1033} {"train_loss": -21.466222763061523, "global_step": 85814, "epoch": 1033} {"train_loss": -21.39274787902832, "global_step": 85815, "epoch": 1033} {"train_loss": -21.47286033630371, "global_step": 85816, "epoch": 1033} {"train_loss": -21.606849670410156, "global_step": 85817, "epoch": 1033} {"train_loss": -21.117759704589844, "global_step": 85818, "epoch": 1033} {"train_loss": -21.512462615966797, "global_step": 85819, "epoch": 1033} {"train_loss": -21.687170028686523, "global_step": 85820, "epoch": 1033} {"train_loss": -21.291410216365954, "global_step": 85821, "epoch": 1033, "val_loss": 6106358.0} {"train_loss": -20.45815658569336, "global_step": 85822, "epoch": 1034} {"train_loss": -21.158573150634766, "global_step": 85823, "epoch": 1034} {"train_loss": -20.541168212890625, "global_step": 85824, "epoch": 1034} {"train_loss": -21.22271156311035, "global_step": 85825, "epoch": 1034} {"train_loss": -20.50797462463379, "global_step": 85826, "epoch": 1034} {"train_loss": -21.313032150268555, "global_step": 85827, "epoch": 1034} {"train_loss": -21.228666305541992, "global_step": 85828, "epoch": 1034} {"train_loss": -20.968326568603516, "global_step": 85829, "epoch": 1034} {"train_loss": -21.012937545776367, "global_step": 85830, "epoch": 1034} {"train_loss": -21.07132339477539, "global_step": 85831, "epoch": 1034} {"train_loss": -21.00520133972168, "global_step": 85832, "epoch": 1034} {"train_loss": -21.357120513916016, "global_step": 85833, "epoch": 1034} {"train_loss": -21.032041549682617, "global_step": 85834, "epoch": 1034} {"train_loss": -21.537811279296875, "global_step": 85835, "epoch": 1034} {"train_loss": -21.403966903686523, "global_step": 85836, "epoch": 1034} {"train_loss": -21.34259033203125, "global_step": 85837, "epoch": 1034} {"train_loss": -21.595226287841797, "global_step": 85838, "epoch": 1034} {"train_loss": -21.004486083984375, "global_step": 85839, "epoch": 1034} {"train_loss": -21.33942985534668, "global_step": 85840, "epoch": 1034} {"train_loss": -21.239086151123047, "global_step": 85841, "epoch": 1034} {"train_loss": -21.3299503326416, "global_step": 85842, "epoch": 1034} {"train_loss": -21.53580665588379, "global_step": 85843, "epoch": 1034} {"train_loss": -21.306427001953125, "global_step": 85844, "epoch": 1034} {"train_loss": -21.122495651245117, "global_step": 85845, "epoch": 1034} {"train_loss": -21.315065383911133, "global_step": 85846, "epoch": 1034} {"train_loss": -21.208786010742188, "global_step": 85847, "epoch": 1034} {"train_loss": -21.59056854248047, "global_step": 85848, "epoch": 1034} {"train_loss": -21.08144187927246, "global_step": 85849, "epoch": 1034} {"train_loss": -21.250247955322266, "global_step": 85850, "epoch": 1034} {"train_loss": -21.49831771850586, "global_step": 85851, "epoch": 1034} {"train_loss": -21.253681182861328, "global_step": 85852, "epoch": 1034} {"train_loss": -21.190664291381836, "global_step": 85853, "epoch": 1034} {"train_loss": -21.179317474365234, "global_step": 85854, "epoch": 1034} {"train_loss": -20.881147384643555, "global_step": 85855, "epoch": 1034} {"train_loss": -21.39497184753418, "global_step": 85856, "epoch": 1034} {"train_loss": -21.245698928833008, "global_step": 85857, "epoch": 1034} {"train_loss": -21.16169548034668, "global_step": 85858, "epoch": 1034} {"train_loss": -21.478017807006836, "global_step": 85859, "epoch": 1034} {"train_loss": -21.045080184936523, "global_step": 85860, "epoch": 1034} {"train_loss": -21.337146759033203, "global_step": 85861, "epoch": 1034} {"train_loss": -21.353832244873047, "global_step": 85862, "epoch": 1034} {"train_loss": -21.221750259399414, "global_step": 85863, "epoch": 1034} {"train_loss": -21.679655075073242, "global_step": 85864, "epoch": 1034} {"train_loss": -21.368650436401367, "global_step": 85865, "epoch": 1034} {"train_loss": -21.326889038085938, "global_step": 85866, "epoch": 1034} {"train_loss": -21.140974044799805, "global_step": 85867, "epoch": 1034} {"train_loss": -21.64219093322754, "global_step": 85868, "epoch": 1034} {"train_loss": -21.833288192749023, "global_step": 85869, "epoch": 1034} {"train_loss": -21.570730209350586, "global_step": 85870, "epoch": 1034} {"train_loss": -21.399551391601562, "global_step": 85871, "epoch": 1034} {"train_loss": -21.160062789916992, "global_step": 85872, "epoch": 1034} {"train_loss": -21.26250648498535, "global_step": 85873, "epoch": 1034} {"train_loss": -21.65153694152832, "global_step": 85874, "epoch": 1034} {"train_loss": -21.023771286010742, "global_step": 85875, "epoch": 1034} {"train_loss": -21.260528564453125, "global_step": 85876, "epoch": 1034} {"train_loss": -21.524993896484375, "global_step": 85877, "epoch": 1034} {"train_loss": -21.445768356323242, "global_step": 85878, "epoch": 1034} {"train_loss": -21.516183853149414, "global_step": 85879, "epoch": 1034} {"train_loss": -21.689842224121094, "global_step": 85880, "epoch": 1034} {"train_loss": -21.167875289916992, "global_step": 85881, "epoch": 1034} {"train_loss": -21.345457077026367, "global_step": 85882, "epoch": 1034} {"train_loss": -21.675853729248047, "global_step": 85883, "epoch": 1034} {"train_loss": -20.57489013671875, "global_step": 85884, "epoch": 1034} {"train_loss": -21.503469467163086, "global_step": 85885, "epoch": 1034} {"train_loss": -21.067394256591797, "global_step": 85886, "epoch": 1034} {"train_loss": -21.253681182861328, "global_step": 85887, "epoch": 1034} {"train_loss": -21.54737663269043, "global_step": 85888, "epoch": 1034} {"train_loss": -21.253950119018555, "global_step": 85889, "epoch": 1034} {"train_loss": -21.35927391052246, "global_step": 85890, "epoch": 1034} {"train_loss": -21.000144958496094, "global_step": 85891, "epoch": 1034} {"train_loss": -21.415771484375, "global_step": 85892, "epoch": 1034} {"train_loss": -21.5256290435791, "global_step": 85893, "epoch": 1034} {"train_loss": -21.476049423217773, "global_step": 85894, "epoch": 1034} {"train_loss": -21.43470573425293, "global_step": 85895, "epoch": 1034} {"train_loss": -21.209508895874023, "global_step": 85896, "epoch": 1034} {"train_loss": -21.502286911010742, "global_step": 85897, "epoch": 1034} {"train_loss": -21.81622886657715, "global_step": 85898, "epoch": 1034} {"train_loss": -21.48933219909668, "global_step": 85899, "epoch": 1034} {"train_loss": -21.41250991821289, "global_step": 85900, "epoch": 1034} {"train_loss": -21.61594009399414, "global_step": 85901, "epoch": 1034} {"train_loss": -21.52964973449707, "global_step": 85902, "epoch": 1034} {"train_loss": -21.3160343170166, "global_step": 85903, "epoch": 1034} {"train_loss": -21.301696685423334, "global_step": 85904, "epoch": 1034, "val_loss": 6090537.5} {"train_loss": -20.925046920776367, "global_step": 85905, "epoch": 1035} {"train_loss": -20.74812126159668, "global_step": 85906, "epoch": 1035} {"train_loss": -21.19002342224121, "global_step": 85907, "epoch": 1035} {"train_loss": -21.180500030517578, "global_step": 85908, "epoch": 1035} {"train_loss": -21.54230499267578, "global_step": 85909, "epoch": 1035} {"train_loss": -21.174137115478516, "global_step": 85910, "epoch": 1035} {"train_loss": -21.33713150024414, "global_step": 85911, "epoch": 1035} {"train_loss": -21.174488067626953, "global_step": 85912, "epoch": 1035} {"train_loss": -21.485456466674805, "global_step": 85913, "epoch": 1035} {"train_loss": -21.740365982055664, "global_step": 85914, "epoch": 1035} {"train_loss": -21.4002628326416, "global_step": 85915, "epoch": 1035} {"train_loss": -21.677942276000977, "global_step": 85916, "epoch": 1035} {"train_loss": -21.522550582885742, "global_step": 85917, "epoch": 1035} {"train_loss": -21.516983032226562, "global_step": 85918, "epoch": 1035} {"train_loss": -21.173538208007812, "global_step": 85919, "epoch": 1035} {"train_loss": -21.541357040405273, "global_step": 85920, "epoch": 1035} {"train_loss": -21.381784439086914, "global_step": 85921, "epoch": 1035} {"train_loss": -20.935224533081055, "global_step": 85922, "epoch": 1035} {"train_loss": -21.241065979003906, "global_step": 85923, "epoch": 1035} {"train_loss": -21.377416610717773, "global_step": 85924, "epoch": 1035} {"train_loss": -21.349672317504883, "global_step": 85925, "epoch": 1035} {"train_loss": -21.533926010131836, "global_step": 85926, "epoch": 1035} {"train_loss": -21.93434715270996, "global_step": 85927, "epoch": 1035} {"train_loss": -21.373655319213867, "global_step": 85928, "epoch": 1035} {"train_loss": -21.22800636291504, "global_step": 85929, "epoch": 1035} {"train_loss": -21.42474365234375, "global_step": 85930, "epoch": 1035} {"train_loss": -21.491567611694336, "global_step": 85931, "epoch": 1035} {"train_loss": -21.367935180664062, "global_step": 85932, "epoch": 1035} {"train_loss": -21.87173843383789, "global_step": 85933, "epoch": 1035} {"train_loss": -21.409812927246094, "global_step": 85934, "epoch": 1035} {"train_loss": -21.627317428588867, "global_step": 85935, "epoch": 1035} {"train_loss": -21.728130340576172, "global_step": 85936, "epoch": 1035} {"train_loss": -21.372196197509766, "global_step": 85937, "epoch": 1035} {"train_loss": -21.625242233276367, "global_step": 85938, "epoch": 1035} {"train_loss": -21.2086238861084, "global_step": 85939, "epoch": 1035} {"train_loss": -21.842456817626953, "global_step": 85940, "epoch": 1035} {"train_loss": -21.255735397338867, "global_step": 85941, "epoch": 1035} {"train_loss": -21.502744674682617, "global_step": 85942, "epoch": 1035} {"train_loss": -21.480300903320312, "global_step": 85943, "epoch": 1035} {"train_loss": -21.404661178588867, "global_step": 85944, "epoch": 1035} {"train_loss": -21.580297470092773, "global_step": 85945, "epoch": 1035} {"train_loss": -21.357440948486328, "global_step": 85946, "epoch": 1035} {"train_loss": -21.680631637573242, "global_step": 85947, "epoch": 1035} {"train_loss": -21.76729965209961, "global_step": 85948, "epoch": 1035} {"train_loss": -21.167922973632812, "global_step": 85949, "epoch": 1035} {"train_loss": -21.518978118896484, "global_step": 85950, "epoch": 1035} {"train_loss": -21.404052734375, "global_step": 85951, "epoch": 1035} {"train_loss": -21.110843658447266, "global_step": 85952, "epoch": 1035} {"train_loss": -21.57366371154785, "global_step": 85953, "epoch": 1035} {"train_loss": -21.454797744750977, "global_step": 85954, "epoch": 1035} {"train_loss": -21.592758178710938, "global_step": 85955, "epoch": 1035} {"train_loss": -21.785581588745117, "global_step": 85956, "epoch": 1035} {"train_loss": -21.473373413085938, "global_step": 85957, "epoch": 1035} {"train_loss": -21.56827163696289, "global_step": 85958, "epoch": 1035} {"train_loss": -21.456716537475586, "global_step": 85959, "epoch": 1035} {"train_loss": -21.235862731933594, "global_step": 85960, "epoch": 1035} {"train_loss": -21.555585861206055, "global_step": 85961, "epoch": 1035} {"train_loss": -21.91501235961914, "global_step": 85962, "epoch": 1035} {"train_loss": -21.82337760925293, "global_step": 85963, "epoch": 1035} {"train_loss": -21.434568405151367, "global_step": 85964, "epoch": 1035} {"train_loss": -21.82961082458496, "global_step": 85965, "epoch": 1035} {"train_loss": -21.086942672729492, "global_step": 85966, "epoch": 1035} {"train_loss": -21.980558395385742, "global_step": 85967, "epoch": 1035} {"train_loss": -21.659692764282227, "global_step": 85968, "epoch": 1035} {"train_loss": -21.58087921142578, "global_step": 85969, "epoch": 1035} {"train_loss": -21.479246139526367, "global_step": 85970, "epoch": 1035} {"train_loss": -21.504135131835938, "global_step": 85971, "epoch": 1035} {"train_loss": -21.237577438354492, "global_step": 85972, "epoch": 1035} {"train_loss": -21.29503059387207, "global_step": 85973, "epoch": 1035} {"train_loss": -21.394779205322266, "global_step": 85974, "epoch": 1035} {"train_loss": -21.03811264038086, "global_step": 85975, "epoch": 1035} {"train_loss": -21.26677894592285, "global_step": 85976, "epoch": 1035} {"train_loss": -21.611438751220703, "global_step": 85977, "epoch": 1035} {"train_loss": -21.477338790893555, "global_step": 85978, "epoch": 1035} {"train_loss": -21.422754287719727, "global_step": 85979, "epoch": 1035} {"train_loss": -21.73876953125, "global_step": 85980, "epoch": 1035} {"train_loss": -21.170944213867188, "global_step": 85981, "epoch": 1035} {"train_loss": -21.171960830688477, "global_step": 85982, "epoch": 1035} {"train_loss": -21.5025691986084, "global_step": 85983, "epoch": 1035} {"train_loss": -21.33785057067871, "global_step": 85984, "epoch": 1035} {"train_loss": -21.45966148376465, "global_step": 85985, "epoch": 1035} {"train_loss": -21.424585342407227, "global_step": 85986, "epoch": 1035} {"train_loss": -21.4624883123191, "global_step": 85987, "epoch": 1035, "val_loss": 5963563.0} {"train_loss": -21.122283935546875, "global_step": 85988, "epoch": 1036} {"train_loss": -21.06235694885254, "global_step": 85989, "epoch": 1036} {"train_loss": -21.007436752319336, "global_step": 85990, "epoch": 1036} {"train_loss": -20.690088272094727, "global_step": 85991, "epoch": 1036} {"train_loss": -21.436038970947266, "global_step": 85992, "epoch": 1036} {"train_loss": -21.096012115478516, "global_step": 85993, "epoch": 1036} {"train_loss": -21.120840072631836, "global_step": 85994, "epoch": 1036} {"train_loss": -21.26252555847168, "global_step": 85995, "epoch": 1036} {"train_loss": -21.472511291503906, "global_step": 85996, "epoch": 1036} {"train_loss": -21.17485809326172, "global_step": 85997, "epoch": 1036} {"train_loss": -21.310596466064453, "global_step": 85998, "epoch": 1036} {"train_loss": -21.162099838256836, "global_step": 85999, "epoch": 1036} {"train_loss": -21.25453758239746, "global_step": 86000, "epoch": 1036} {"train_loss": -21.117570877075195, "global_step": 86001, "epoch": 1036} {"train_loss": -21.74977684020996, "global_step": 86002, "epoch": 1036} {"train_loss": -20.930326461791992, "global_step": 86003, "epoch": 1036} {"train_loss": -20.961061477661133, "global_step": 86004, "epoch": 1036} {"train_loss": -21.485944747924805, "global_step": 86005, "epoch": 1036} {"train_loss": -21.327987670898438, "global_step": 86006, "epoch": 1036} {"train_loss": -21.172597885131836, "global_step": 86007, "epoch": 1036} {"train_loss": -21.37249183654785, "global_step": 86008, "epoch": 1036} {"train_loss": -21.52008628845215, "global_step": 86009, "epoch": 1036} {"train_loss": -21.35500144958496, "global_step": 86010, "epoch": 1036} {"train_loss": -21.40128517150879, "global_step": 86011, "epoch": 1036} {"train_loss": -21.604249954223633, "global_step": 86012, "epoch": 1036} {"train_loss": -21.181188583374023, "global_step": 86013, "epoch": 1036} {"train_loss": -21.448331832885742, "global_step": 86014, "epoch": 1036} {"train_loss": -21.38092613220215, "global_step": 86015, "epoch": 1036} {"train_loss": -21.145893096923828, "global_step": 86016, "epoch": 1036} {"train_loss": -21.514631271362305, "global_step": 86017, "epoch": 1036} {"train_loss": -21.514162063598633, "global_step": 86018, "epoch": 1036} {"train_loss": -21.7288761138916, "global_step": 86019, "epoch": 1036} {"train_loss": -21.79848289489746, "global_step": 86020, "epoch": 1036} {"train_loss": -21.287389755249023, "global_step": 86021, "epoch": 1036} {"train_loss": -21.13702964782715, "global_step": 86022, "epoch": 1036} {"train_loss": -21.178058624267578, "global_step": 86023, "epoch": 1036} {"train_loss": -21.586265563964844, "global_step": 86024, "epoch": 1036} {"train_loss": -21.507966995239258, "global_step": 86025, "epoch": 1036} {"train_loss": -21.439807891845703, "global_step": 86026, "epoch": 1036} {"train_loss": -21.35188102722168, "global_step": 86027, "epoch": 1036} {"train_loss": -21.570510864257812, "global_step": 86028, "epoch": 1036} {"train_loss": -21.157135009765625, "global_step": 86029, "epoch": 1036} {"train_loss": -21.762861251831055, "global_step": 86030, "epoch": 1036} {"train_loss": -21.54768943786621, "global_step": 86031, "epoch": 1036} {"train_loss": -21.45401954650879, "global_step": 86032, "epoch": 1036} {"train_loss": -21.084157943725586, "global_step": 86033, "epoch": 1036} {"train_loss": -21.555822372436523, "global_step": 86034, "epoch": 1036} {"train_loss": -21.405797958374023, "global_step": 86035, "epoch": 1036} {"train_loss": -21.3216552734375, "global_step": 86036, "epoch": 1036} {"train_loss": -20.966848373413086, "global_step": 86037, "epoch": 1036} {"train_loss": -21.488895416259766, "global_step": 86038, "epoch": 1036} {"train_loss": -21.612567901611328, "global_step": 86039, "epoch": 1036} {"train_loss": -21.450057983398438, "global_step": 86040, "epoch": 1036} {"train_loss": -21.391992568969727, "global_step": 86041, "epoch": 1036} {"train_loss": -21.442974090576172, "global_step": 86042, "epoch": 1036} {"train_loss": -21.185733795166016, "global_step": 86043, "epoch": 1036} {"train_loss": -21.293149948120117, "global_step": 86044, "epoch": 1036} {"train_loss": -21.269515991210938, "global_step": 86045, "epoch": 1036} {"train_loss": -21.43104362487793, "global_step": 86046, "epoch": 1036} {"train_loss": -21.335121154785156, "global_step": 86047, "epoch": 1036} {"train_loss": -21.79770851135254, "global_step": 86048, "epoch": 1036} {"train_loss": -21.36663818359375, "global_step": 86049, "epoch": 1036} {"train_loss": -21.1054630279541, "global_step": 86050, "epoch": 1036} {"train_loss": -21.734676361083984, "global_step": 86051, "epoch": 1036} {"train_loss": -21.281335830688477, "global_step": 86052, "epoch": 1036} {"train_loss": -21.615005493164062, "global_step": 86053, "epoch": 1036} {"train_loss": -21.296688079833984, "global_step": 86054, "epoch": 1036} {"train_loss": -21.214313507080078, "global_step": 86055, "epoch": 1036} {"train_loss": -21.36800193786621, "global_step": 86056, "epoch": 1036} {"train_loss": -21.019407272338867, "global_step": 86057, "epoch": 1036} {"train_loss": -21.78053855895996, "global_step": 86058, "epoch": 1036} {"train_loss": -21.300464630126953, "global_step": 86059, "epoch": 1036} {"train_loss": -21.76180076599121, "global_step": 86060, "epoch": 1036} {"train_loss": -21.653202056884766, "global_step": 86061, "epoch": 1036} {"train_loss": -21.610000610351562, "global_step": 86062, "epoch": 1036} {"train_loss": -21.424842834472656, "global_step": 86063, "epoch": 1036} {"train_loss": -21.763486862182617, "global_step": 86064, "epoch": 1036} {"train_loss": -22.16988182067871, "global_step": 86065, "epoch": 1036} {"train_loss": -21.371885299682617, "global_step": 86066, "epoch": 1036} {"train_loss": -21.184885025024414, "global_step": 86067, "epoch": 1036} {"train_loss": -21.414688110351562, "global_step": 86068, "epoch": 1036} {"train_loss": -21.47666358947754, "global_step": 86069, "epoch": 1036} {"train_loss": -21.368051161249, "global_step": 86070, "epoch": 1036, "val_loss": 5966957.5} {"train_loss": -20.73841094970703, "global_step": 86071, "epoch": 1037} {"train_loss": -21.39044189453125, "global_step": 86072, "epoch": 1037} {"train_loss": -21.20953941345215, "global_step": 86073, "epoch": 1037} {"train_loss": -21.481672286987305, "global_step": 86074, "epoch": 1037} {"train_loss": -21.130590438842773, "global_step": 86075, "epoch": 1037} {"train_loss": -20.94599723815918, "global_step": 86076, "epoch": 1037} {"train_loss": -21.2532958984375, "global_step": 86077, "epoch": 1037} {"train_loss": -21.308820724487305, "global_step": 86078, "epoch": 1037} {"train_loss": -21.278528213500977, "global_step": 86079, "epoch": 1037} {"train_loss": -21.3508358001709, "global_step": 86080, "epoch": 1037} {"train_loss": -21.1738224029541, "global_step": 86081, "epoch": 1037} {"train_loss": -21.5963077545166, "global_step": 86082, "epoch": 1037} {"train_loss": -21.497678756713867, "global_step": 86083, "epoch": 1037} {"train_loss": -21.713380813598633, "global_step": 86084, "epoch": 1037} {"train_loss": -21.27540397644043, "global_step": 86085, "epoch": 1037} {"train_loss": -21.34294319152832, "global_step": 86086, "epoch": 1037} {"train_loss": -21.38274574279785, "global_step": 86087, "epoch": 1037} {"train_loss": -21.18312644958496, "global_step": 86088, "epoch": 1037} {"train_loss": -21.097692489624023, "global_step": 86089, "epoch": 1037} {"train_loss": -21.610149383544922, "global_step": 86090, "epoch": 1037} {"train_loss": -21.456533432006836, "global_step": 86091, "epoch": 1037} {"train_loss": -21.568500518798828, "global_step": 86092, "epoch": 1037} {"train_loss": -21.696979522705078, "global_step": 86093, "epoch": 1037} {"train_loss": -21.701093673706055, "global_step": 86094, "epoch": 1037} {"train_loss": -21.78932762145996, "global_step": 86095, "epoch": 1037} {"train_loss": -21.211824417114258, "global_step": 86096, "epoch": 1037} {"train_loss": -21.673688888549805, "global_step": 86097, "epoch": 1037} {"train_loss": -21.917402267456055, "global_step": 86098, "epoch": 1037} {"train_loss": -21.524309158325195, "global_step": 86099, "epoch": 1037} {"train_loss": -21.4615421295166, "global_step": 86100, "epoch": 1037} {"train_loss": -21.458728790283203, "global_step": 86101, "epoch": 1037} {"train_loss": -21.54715919494629, "global_step": 86102, "epoch": 1037} {"train_loss": -21.667144775390625, "global_step": 86103, "epoch": 1037} {"train_loss": -21.587854385375977, "global_step": 86104, "epoch": 1037} {"train_loss": -21.814437866210938, "global_step": 86105, "epoch": 1037} {"train_loss": -21.573989868164062, "global_step": 86106, "epoch": 1037} {"train_loss": -21.28924560546875, "global_step": 86107, "epoch": 1037} {"train_loss": -21.20991325378418, "global_step": 86108, "epoch": 1037} {"train_loss": -21.397192001342773, "global_step": 86109, "epoch": 1037} {"train_loss": -21.829713821411133, "global_step": 86110, "epoch": 1037} {"train_loss": -21.357282638549805, "global_step": 86111, "epoch": 1037} {"train_loss": -21.353290557861328, "global_step": 86112, "epoch": 1037} {"train_loss": -21.211990356445312, "global_step": 86113, "epoch": 1037} {"train_loss": -21.829866409301758, "global_step": 86114, "epoch": 1037} {"train_loss": -21.571924209594727, "global_step": 86115, "epoch": 1037} {"train_loss": -21.625442504882812, "global_step": 86116, "epoch": 1037} {"train_loss": -20.965951919555664, "global_step": 86117, "epoch": 1037} {"train_loss": -21.63949966430664, "global_step": 86118, "epoch": 1037} {"train_loss": -21.41280174255371, "global_step": 86119, "epoch": 1037} {"train_loss": -21.304828643798828, "global_step": 86120, "epoch": 1037} {"train_loss": -21.465116500854492, "global_step": 86121, "epoch": 1037} {"train_loss": -21.212804794311523, "global_step": 86122, "epoch": 1037} {"train_loss": -21.630203247070312, "global_step": 86123, "epoch": 1037} {"train_loss": -21.5705623626709, "global_step": 86124, "epoch": 1037} {"train_loss": -21.41693878173828, "global_step": 86125, "epoch": 1037} {"train_loss": -21.172637939453125, "global_step": 86126, "epoch": 1037} {"train_loss": -21.480791091918945, "global_step": 86127, "epoch": 1037} {"train_loss": -21.639280319213867, "global_step": 86128, "epoch": 1037} {"train_loss": -21.244794845581055, "global_step": 86129, "epoch": 1037} {"train_loss": -21.46508026123047, "global_step": 86130, "epoch": 1037} {"train_loss": -21.21455955505371, "global_step": 86131, "epoch": 1037} {"train_loss": -21.424970626831055, "global_step": 86132, "epoch": 1037} {"train_loss": -21.55069923400879, "global_step": 86133, "epoch": 1037} {"train_loss": -21.692323684692383, "global_step": 86134, "epoch": 1037} {"train_loss": -21.83245277404785, "global_step": 86135, "epoch": 1037} {"train_loss": -21.69168472290039, "global_step": 86136, "epoch": 1037} {"train_loss": -21.61297607421875, "global_step": 86137, "epoch": 1037} {"train_loss": -21.435178756713867, "global_step": 86138, "epoch": 1037} {"train_loss": -21.257909774780273, "global_step": 86139, "epoch": 1037} {"train_loss": -21.65835189819336, "global_step": 86140, "epoch": 1037} {"train_loss": -21.50798988342285, "global_step": 86141, "epoch": 1037} {"train_loss": -21.559240341186523, "global_step": 86142, "epoch": 1037} {"train_loss": -21.52801513671875, "global_step": 86143, "epoch": 1037} {"train_loss": -21.67947769165039, "global_step": 86144, "epoch": 1037} {"train_loss": -21.43010902404785, "global_step": 86145, "epoch": 1037} {"train_loss": -21.662485122680664, "global_step": 86146, "epoch": 1037} {"train_loss": -21.204572677612305, "global_step": 86147, "epoch": 1037} {"train_loss": -21.50217628479004, "global_step": 86148, "epoch": 1037} {"train_loss": -21.200347900390625, "global_step": 86149, "epoch": 1037} {"train_loss": -21.024913787841797, "global_step": 86150, "epoch": 1037} {"train_loss": -21.382028579711914, "global_step": 86151, "epoch": 1037} {"train_loss": -21.644989013671875, "global_step": 86152, "epoch": 1037} {"train_loss": -21.457074889217516, "global_step": 86153, "epoch": 1037, "val_loss": 6181074.0} {"train_loss": -19.881942749023438, "global_step": 86154, "epoch": 1038} {"train_loss": -20.555387496948242, "global_step": 86155, "epoch": 1038} {"train_loss": -20.935028076171875, "global_step": 86156, "epoch": 1038} {"train_loss": -20.70655632019043, "global_step": 86157, "epoch": 1038} {"train_loss": -20.77552604675293, "global_step": 86158, "epoch": 1038} {"train_loss": -20.74985122680664, "global_step": 86159, "epoch": 1038} {"train_loss": -20.77423667907715, "global_step": 86160, "epoch": 1038} {"train_loss": -20.850950241088867, "global_step": 86161, "epoch": 1038} {"train_loss": -20.838041305541992, "global_step": 86162, "epoch": 1038} {"train_loss": -20.807485580444336, "global_step": 86163, "epoch": 1038} {"train_loss": -21.20112419128418, "global_step": 86164, "epoch": 1038} {"train_loss": -20.975666046142578, "global_step": 86165, "epoch": 1038} {"train_loss": -20.941442489624023, "global_step": 86166, "epoch": 1038} {"train_loss": -20.939781188964844, "global_step": 86167, "epoch": 1038} {"train_loss": -21.37831687927246, "global_step": 86168, "epoch": 1038} {"train_loss": -21.079280853271484, "global_step": 86169, "epoch": 1038} {"train_loss": -21.40657615661621, "global_step": 86170, "epoch": 1038} {"train_loss": -20.97786521911621, "global_step": 86171, "epoch": 1038} {"train_loss": -21.466398239135742, "global_step": 86172, "epoch": 1038} {"train_loss": -21.040922164916992, "global_step": 86173, "epoch": 1038} {"train_loss": -21.499414443969727, "global_step": 86174, "epoch": 1038} {"train_loss": -21.3027400970459, "global_step": 86175, "epoch": 1038} {"train_loss": -21.160795211791992, "global_step": 86176, "epoch": 1038} {"train_loss": -21.44261932373047, "global_step": 86177, "epoch": 1038} {"train_loss": -21.434926986694336, "global_step": 86178, "epoch": 1038} {"train_loss": -21.120695114135742, "global_step": 86179, "epoch": 1038} {"train_loss": -21.372533798217773, "global_step": 86180, "epoch": 1038} {"train_loss": -21.984878540039062, "global_step": 86181, "epoch": 1038} {"train_loss": -21.298297882080078, "global_step": 86182, "epoch": 1038} {"train_loss": -21.248376846313477, "global_step": 86183, "epoch": 1038} {"train_loss": -21.29623794555664, "global_step": 86184, "epoch": 1038} {"train_loss": -21.3182373046875, "global_step": 86185, "epoch": 1038} {"train_loss": -21.333463668823242, "global_step": 86186, "epoch": 1038} {"train_loss": -21.402976989746094, "global_step": 86187, "epoch": 1038} {"train_loss": -20.9748477935791, "global_step": 86188, "epoch": 1038} {"train_loss": -21.174551010131836, "global_step": 86189, "epoch": 1038} {"train_loss": -21.65778923034668, "global_step": 86190, "epoch": 1038} {"train_loss": -21.473186492919922, "global_step": 86191, "epoch": 1038} {"train_loss": -21.18441390991211, "global_step": 86192, "epoch": 1038} {"train_loss": -21.462766647338867, "global_step": 86193, "epoch": 1038} {"train_loss": -21.353363037109375, "global_step": 86194, "epoch": 1038} {"train_loss": -21.145751953125, "global_step": 86195, "epoch": 1038} {"train_loss": -21.17552947998047, "global_step": 86196, "epoch": 1038} {"train_loss": -21.268482208251953, "global_step": 86197, "epoch": 1038} {"train_loss": -21.478137969970703, "global_step": 86198, "epoch": 1038} {"train_loss": -21.48362159729004, "global_step": 86199, "epoch": 1038} {"train_loss": -21.520505905151367, "global_step": 86200, "epoch": 1038} {"train_loss": -21.4930477142334, "global_step": 86201, "epoch": 1038} {"train_loss": -21.42308235168457, "global_step": 86202, "epoch": 1038} {"train_loss": -21.400501251220703, "global_step": 86203, "epoch": 1038} {"train_loss": -21.47023582458496, "global_step": 86204, "epoch": 1038} {"train_loss": -21.376745223999023, "global_step": 86205, "epoch": 1038} {"train_loss": -21.700986862182617, "global_step": 86206, "epoch": 1038} {"train_loss": -21.626113891601562, "global_step": 86207, "epoch": 1038} {"train_loss": -21.301536560058594, "global_step": 86208, "epoch": 1038} {"train_loss": -21.21967124938965, "global_step": 86209, "epoch": 1038} {"train_loss": -21.33967399597168, "global_step": 86210, "epoch": 1038} {"train_loss": -21.16209602355957, "global_step": 86211, "epoch": 1038} {"train_loss": -21.361303329467773, "global_step": 86212, "epoch": 1038} {"train_loss": -21.526657104492188, "global_step": 86213, "epoch": 1038} {"train_loss": -21.45768928527832, "global_step": 86214, "epoch": 1038} {"train_loss": -21.48833465576172, "global_step": 86215, "epoch": 1038} {"train_loss": -21.53558921813965, "global_step": 86216, "epoch": 1038} {"train_loss": -21.441137313842773, "global_step": 86217, "epoch": 1038} {"train_loss": -21.59140396118164, "global_step": 86218, "epoch": 1038} {"train_loss": -21.461679458618164, "global_step": 86219, "epoch": 1038} {"train_loss": -21.810789108276367, "global_step": 86220, "epoch": 1038} {"train_loss": -21.70585823059082, "global_step": 86221, "epoch": 1038} {"train_loss": -21.43985366821289, "global_step": 86222, "epoch": 1038} {"train_loss": -21.15993309020996, "global_step": 86223, "epoch": 1038} {"train_loss": -21.520475387573242, "global_step": 86224, "epoch": 1038} {"train_loss": -21.409032821655273, "global_step": 86225, "epoch": 1038} {"train_loss": -21.184415817260742, "global_step": 86226, "epoch": 1038} {"train_loss": -21.464622497558594, "global_step": 86227, "epoch": 1038} {"train_loss": -21.234161376953125, "global_step": 86228, "epoch": 1038} {"train_loss": -21.858564376831055, "global_step": 86229, "epoch": 1038} {"train_loss": -21.583431243896484, "global_step": 86230, "epoch": 1038} {"train_loss": -21.49642562866211, "global_step": 86231, "epoch": 1038} {"train_loss": -21.559078216552734, "global_step": 86232, "epoch": 1038} {"train_loss": -21.36774253845215, "global_step": 86233, "epoch": 1038} {"train_loss": -21.369529724121094, "global_step": 86234, "epoch": 1038} {"train_loss": -21.4902400970459, "global_step": 86235, "epoch": 1038} {"train_loss": -21.281943815300263, "global_step": 86236, "epoch": 1038, "val_loss": 6082868.5} {"train_loss": -21.315433502197266, "global_step": 86237, "epoch": 1039} {"train_loss": -21.037477493286133, "global_step": 86238, "epoch": 1039} {"train_loss": -21.265106201171875, "global_step": 86239, "epoch": 1039} {"train_loss": -21.38128662109375, "global_step": 86240, "epoch": 1039} {"train_loss": -21.73785400390625, "global_step": 86241, "epoch": 1039} {"train_loss": -21.100671768188477, "global_step": 86242, "epoch": 1039} {"train_loss": -21.520376205444336, "global_step": 86243, "epoch": 1039} {"train_loss": -21.287221908569336, "global_step": 86244, "epoch": 1039} {"train_loss": -21.332616806030273, "global_step": 86245, "epoch": 1039} {"train_loss": -21.4338436126709, "global_step": 86246, "epoch": 1039} {"train_loss": -21.468564987182617, "global_step": 86247, "epoch": 1039} {"train_loss": -21.46363639831543, "global_step": 86248, "epoch": 1039} {"train_loss": -21.48671531677246, "global_step": 86249, "epoch": 1039} {"train_loss": -21.607030868530273, "global_step": 86250, "epoch": 1039} {"train_loss": -21.130409240722656, "global_step": 86251, "epoch": 1039} {"train_loss": -21.44046974182129, "global_step": 86252, "epoch": 1039} {"train_loss": -21.749256134033203, "global_step": 86253, "epoch": 1039} {"train_loss": -21.813383102416992, "global_step": 86254, "epoch": 1039} {"train_loss": -21.400251388549805, "global_step": 86255, "epoch": 1039} {"train_loss": -21.284345626831055, "global_step": 86256, "epoch": 1039} {"train_loss": -20.91805076599121, "global_step": 86257, "epoch": 1039} {"train_loss": -20.91510009765625, "global_step": 86258, "epoch": 1039} {"train_loss": -21.116012573242188, "global_step": 86259, "epoch": 1039} {"train_loss": -21.40938377380371, "global_step": 86260, "epoch": 1039} {"train_loss": -21.715499877929688, "global_step": 86261, "epoch": 1039} {"train_loss": -21.45815086364746, "global_step": 86262, "epoch": 1039} {"train_loss": -21.602859497070312, "global_step": 86263, "epoch": 1039} {"train_loss": -21.443212509155273, "global_step": 86264, "epoch": 1039} {"train_loss": -21.530920028686523, "global_step": 86265, "epoch": 1039} {"train_loss": -21.54046058654785, "global_step": 86266, "epoch": 1039} {"train_loss": -21.560672760009766, "global_step": 86267, "epoch": 1039} {"train_loss": -21.55940055847168, "global_step": 86268, "epoch": 1039} {"train_loss": -21.67892837524414, "global_step": 86269, "epoch": 1039} {"train_loss": -21.42816162109375, "global_step": 86270, "epoch": 1039} {"train_loss": -21.35881233215332, "global_step": 86271, "epoch": 1039} {"train_loss": -21.359106063842773, "global_step": 86272, "epoch": 1039} {"train_loss": -21.45762062072754, "global_step": 86273, "epoch": 1039} {"train_loss": -21.577730178833008, "global_step": 86274, "epoch": 1039} {"train_loss": -21.752622604370117, "global_step": 86275, "epoch": 1039} {"train_loss": -21.125375747680664, "global_step": 86276, "epoch": 1039} {"train_loss": -21.20338249206543, "global_step": 86277, "epoch": 1039} {"train_loss": -21.253141403198242, "global_step": 86278, "epoch": 1039} {"train_loss": -21.2050724029541, "global_step": 86279, "epoch": 1039} {"train_loss": -21.648441314697266, "global_step": 86280, "epoch": 1039} {"train_loss": -21.515993118286133, "global_step": 86281, "epoch": 1039} {"train_loss": -21.436172485351562, "global_step": 86282, "epoch": 1039} {"train_loss": -21.23504066467285, "global_step": 86283, "epoch": 1039} {"train_loss": -21.455059051513672, "global_step": 86284, "epoch": 1039} {"train_loss": -21.513675689697266, "global_step": 86285, "epoch": 1039} {"train_loss": -21.63886260986328, "global_step": 86286, "epoch": 1039} {"train_loss": -21.58689308166504, "global_step": 86287, "epoch": 1039} {"train_loss": -21.435192108154297, "global_step": 86288, "epoch": 1039} {"train_loss": -21.643085479736328, "global_step": 86289, "epoch": 1039} {"train_loss": -21.70863151550293, "global_step": 86290, "epoch": 1039} {"train_loss": -21.341922760009766, "global_step": 86291, "epoch": 1039} {"train_loss": -21.60160255432129, "global_step": 86292, "epoch": 1039} {"train_loss": -21.645816802978516, "global_step": 86293, "epoch": 1039} {"train_loss": -21.6359920501709, "global_step": 86294, "epoch": 1039} {"train_loss": -21.72886848449707, "global_step": 86295, "epoch": 1039} {"train_loss": -21.507827758789062, "global_step": 86296, "epoch": 1039} {"train_loss": -21.512985229492188, "global_step": 86297, "epoch": 1039} {"train_loss": -21.655052185058594, "global_step": 86298, "epoch": 1039} {"train_loss": -21.231542587280273, "global_step": 86299, "epoch": 1039} {"train_loss": -21.42856788635254, "global_step": 86300, "epoch": 1039} {"train_loss": -21.49088478088379, "global_step": 86301, "epoch": 1039} {"train_loss": -21.848020553588867, "global_step": 86302, "epoch": 1039} {"train_loss": -21.211423873901367, "global_step": 86303, "epoch": 1039} {"train_loss": -21.347518920898438, "global_step": 86304, "epoch": 1039} {"train_loss": -21.341703414916992, "global_step": 86305, "epoch": 1039} {"train_loss": -21.406293869018555, "global_step": 86306, "epoch": 1039} {"train_loss": -21.06118392944336, "global_step": 86307, "epoch": 1039} {"train_loss": -21.316408157348633, "global_step": 86308, "epoch": 1039} {"train_loss": -20.995412826538086, "global_step": 86309, "epoch": 1039} {"train_loss": -21.15584373474121, "global_step": 86310, "epoch": 1039} {"train_loss": -21.48958396911621, "global_step": 86311, "epoch": 1039} {"train_loss": -21.266334533691406, "global_step": 86312, "epoch": 1039} {"train_loss": -21.544021606445312, "global_step": 86313, "epoch": 1039} {"train_loss": -21.36588478088379, "global_step": 86314, "epoch": 1039} {"train_loss": -21.277830123901367, "global_step": 86315, "epoch": 1039} {"train_loss": -21.410051345825195, "global_step": 86316, "epoch": 1039} {"train_loss": -21.624189376831055, "global_step": 86317, "epoch": 1039} {"train_loss": -21.587726593017578, "global_step": 86318, "epoch": 1039} {"train_loss": -21.396397533186946, "global_step": 86319, "epoch": 1039, "val_loss": 6013068.5} {"train_loss": -20.954675674438477, "global_step": 86320, "epoch": 1040} {"train_loss": -21.129032135009766, "global_step": 86321, "epoch": 1040} {"train_loss": -20.88182258605957, "global_step": 86322, "epoch": 1040} {"train_loss": -21.28306007385254, "global_step": 86323, "epoch": 1040} {"train_loss": -21.009981155395508, "global_step": 86324, "epoch": 1040} {"train_loss": -21.259613037109375, "global_step": 86325, "epoch": 1040} {"train_loss": -20.993457794189453, "global_step": 86326, "epoch": 1040} {"train_loss": -21.60759735107422, "global_step": 86327, "epoch": 1040} {"train_loss": -21.347646713256836, "global_step": 86328, "epoch": 1040} {"train_loss": -21.20688819885254, "global_step": 86329, "epoch": 1040} {"train_loss": -21.24178123474121, "global_step": 86330, "epoch": 1040} {"train_loss": -21.227148056030273, "global_step": 86331, "epoch": 1040} {"train_loss": -21.189199447631836, "global_step": 86332, "epoch": 1040} {"train_loss": -21.189565658569336, "global_step": 86333, "epoch": 1040} {"train_loss": -21.38104820251465, "global_step": 86334, "epoch": 1040} {"train_loss": -21.406919479370117, "global_step": 86335, "epoch": 1040} {"train_loss": -21.290611267089844, "global_step": 86336, "epoch": 1040} {"train_loss": -21.548755645751953, "global_step": 86337, "epoch": 1040} {"train_loss": -21.63528060913086, "global_step": 86338, "epoch": 1040} {"train_loss": -21.147371292114258, "global_step": 86339, "epoch": 1040} {"train_loss": -21.533727645874023, "global_step": 86340, "epoch": 1040} {"train_loss": -21.885828018188477, "global_step": 86341, "epoch": 1040} {"train_loss": -21.372039794921875, "global_step": 86342, "epoch": 1040} {"train_loss": -21.521621704101562, "global_step": 86343, "epoch": 1040} {"train_loss": -21.861339569091797, "global_step": 86344, "epoch": 1040} {"train_loss": -21.66007423400879, "global_step": 86345, "epoch": 1040} {"train_loss": -21.429325103759766, "global_step": 86346, "epoch": 1040} {"train_loss": -21.274250030517578, "global_step": 86347, "epoch": 1040} {"train_loss": -21.46882438659668, "global_step": 86348, "epoch": 1040} {"train_loss": -21.344236373901367, "global_step": 86349, "epoch": 1040} {"train_loss": -21.162538528442383, "global_step": 86350, "epoch": 1040} {"train_loss": -21.5020809173584, "global_step": 86351, "epoch": 1040} {"train_loss": -21.110685348510742, "global_step": 86352, "epoch": 1040} {"train_loss": -21.091291427612305, "global_step": 86353, "epoch": 1040} {"train_loss": -21.507017135620117, "global_step": 86354, "epoch": 1040} {"train_loss": -21.52073097229004, "global_step": 86355, "epoch": 1040} {"train_loss": -21.34576988220215, "global_step": 86356, "epoch": 1040} {"train_loss": -21.024255752563477, "global_step": 86357, "epoch": 1040} {"train_loss": -21.6682071685791, "global_step": 86358, "epoch": 1040} {"train_loss": -21.71951675415039, "global_step": 86359, "epoch": 1040} {"train_loss": -21.221115112304688, "global_step": 86360, "epoch": 1040} {"train_loss": -21.447708129882812, "global_step": 86361, "epoch": 1040} {"train_loss": -21.241575241088867, "global_step": 86362, "epoch": 1040} {"train_loss": -21.031518936157227, "global_step": 86363, "epoch": 1040} {"train_loss": -20.9974308013916, "global_step": 86364, "epoch": 1040} {"train_loss": -21.2861328125, "global_step": 86365, "epoch": 1040} {"train_loss": -21.32468605041504, "global_step": 86366, "epoch": 1040} {"train_loss": -21.20404052734375, "global_step": 86367, "epoch": 1040} {"train_loss": -21.42158317565918, "global_step": 86368, "epoch": 1040} {"train_loss": -21.63538360595703, "global_step": 86369, "epoch": 1040} {"train_loss": -21.30732536315918, "global_step": 86370, "epoch": 1040} {"train_loss": -21.23380470275879, "global_step": 86371, "epoch": 1040} {"train_loss": -21.905675888061523, "global_step": 86372, "epoch": 1040} {"train_loss": -21.023975372314453, "global_step": 86373, "epoch": 1040} {"train_loss": -21.59087562561035, "global_step": 86374, "epoch": 1040} {"train_loss": -21.56972312927246, "global_step": 86375, "epoch": 1040} {"train_loss": -21.161109924316406, "global_step": 86376, "epoch": 1040} {"train_loss": -21.41522789001465, "global_step": 86377, "epoch": 1040} {"train_loss": -21.248825073242188, "global_step": 86378, "epoch": 1040} {"train_loss": -21.321386337280273, "global_step": 86379, "epoch": 1040} {"train_loss": -22.050630569458008, "global_step": 86380, "epoch": 1040} {"train_loss": -21.441171646118164, "global_step": 86381, "epoch": 1040} {"train_loss": -21.475400924682617, "global_step": 86382, "epoch": 1040} {"train_loss": -21.494665145874023, "global_step": 86383, "epoch": 1040} {"train_loss": -21.581396102905273, "global_step": 86384, "epoch": 1040} {"train_loss": -21.857526779174805, "global_step": 86385, "epoch": 1040} {"train_loss": -21.697561264038086, "global_step": 86386, "epoch": 1040} {"train_loss": -21.459474563598633, "global_step": 86387, "epoch": 1040} {"train_loss": -21.61289405822754, "global_step": 86388, "epoch": 1040} {"train_loss": -21.490270614624023, "global_step": 86389, "epoch": 1040} {"train_loss": -21.36990737915039, "global_step": 86390, "epoch": 1040} {"train_loss": -21.496919631958008, "global_step": 86391, "epoch": 1040} {"train_loss": -21.40409278869629, "global_step": 86392, "epoch": 1040} {"train_loss": -21.402755737304688, "global_step": 86393, "epoch": 1040} {"train_loss": -21.298078536987305, "global_step": 86394, "epoch": 1040} {"train_loss": -21.409778594970703, "global_step": 86395, "epoch": 1040} {"train_loss": -21.65045738220215, "global_step": 86396, "epoch": 1040} {"train_loss": -21.50994300842285, "global_step": 86397, "epoch": 1040} {"train_loss": -21.564022064208984, "global_step": 86398, "epoch": 1040} {"train_loss": -21.61371421813965, "global_step": 86399, "epoch": 1040} {"train_loss": -21.638830184936523, "global_step": 86400, "epoch": 1040} {"train_loss": -21.267728805541992, "global_step": 86401, "epoch": 1040} {"train_loss": -21.413076331816523, "global_step": 86402, "epoch": 1040, "val_loss": 6175611.5} {"train_loss": -21.082365036010742, "global_step": 86403, "epoch": 1041} {"train_loss": -20.8212890625, "global_step": 86404, "epoch": 1041} {"train_loss": -21.243343353271484, "global_step": 86405, "epoch": 1041} {"train_loss": -21.0128116607666, "global_step": 86406, "epoch": 1041} {"train_loss": -20.947525024414062, "global_step": 86407, "epoch": 1041} {"train_loss": -21.157072067260742, "global_step": 86408, "epoch": 1041} {"train_loss": -21.225400924682617, "global_step": 86409, "epoch": 1041} {"train_loss": -21.028396606445312, "global_step": 86410, "epoch": 1041} {"train_loss": -21.02115821838379, "global_step": 86411, "epoch": 1041} {"train_loss": -21.569812774658203, "global_step": 86412, "epoch": 1041} {"train_loss": -21.12317657470703, "global_step": 86413, "epoch": 1041} {"train_loss": -21.027681350708008, "global_step": 86414, "epoch": 1041} {"train_loss": -20.967008590698242, "global_step": 86415, "epoch": 1041} {"train_loss": -21.44127655029297, "global_step": 86416, "epoch": 1041} {"train_loss": -21.20734977722168, "global_step": 86417, "epoch": 1041} {"train_loss": -21.161893844604492, "global_step": 86418, "epoch": 1041} {"train_loss": -21.183143615722656, "global_step": 86419, "epoch": 1041} {"train_loss": -21.380186080932617, "global_step": 86420, "epoch": 1041} {"train_loss": -20.985273361206055, "global_step": 86421, "epoch": 1041} {"train_loss": -21.249027252197266, "global_step": 86422, "epoch": 1041} {"train_loss": -21.421480178833008, "global_step": 86423, "epoch": 1041} {"train_loss": -21.61857795715332, "global_step": 86424, "epoch": 1041} {"train_loss": -21.342815399169922, "global_step": 86425, "epoch": 1041} {"train_loss": -21.325796127319336, "global_step": 86426, "epoch": 1041} {"train_loss": -21.3922176361084, "global_step": 86427, "epoch": 1041} {"train_loss": -21.321561813354492, "global_step": 86428, "epoch": 1041} {"train_loss": -21.108556747436523, "global_step": 86429, "epoch": 1041} {"train_loss": -21.42306137084961, "global_step": 86430, "epoch": 1041} {"train_loss": -21.21083641052246, "global_step": 86431, "epoch": 1041} {"train_loss": -21.5910587310791, "global_step": 86432, "epoch": 1041} {"train_loss": -21.23900032043457, "global_step": 86433, "epoch": 1041} {"train_loss": -21.292173385620117, "global_step": 86434, "epoch": 1041} {"train_loss": -21.342477798461914, "global_step": 86435, "epoch": 1041} {"train_loss": -21.449237823486328, "global_step": 86436, "epoch": 1041} {"train_loss": -21.292997360229492, "global_step": 86437, "epoch": 1041} {"train_loss": -21.376781463623047, "global_step": 86438, "epoch": 1041} {"train_loss": -21.535694122314453, "global_step": 86439, "epoch": 1041} {"train_loss": -21.740461349487305, "global_step": 86440, "epoch": 1041} {"train_loss": -21.73292350769043, "global_step": 86441, "epoch": 1041} {"train_loss": -21.386682510375977, "global_step": 86442, "epoch": 1041} {"train_loss": -21.443073272705078, "global_step": 86443, "epoch": 1041} {"train_loss": -21.35480499267578, "global_step": 86444, "epoch": 1041} {"train_loss": -21.76780128479004, "global_step": 86445, "epoch": 1041} {"train_loss": -21.537321090698242, "global_step": 86446, "epoch": 1041} {"train_loss": -21.48766326904297, "global_step": 86447, "epoch": 1041} {"train_loss": -21.325454711914062, "global_step": 86448, "epoch": 1041} {"train_loss": -21.466110229492188, "global_step": 86449, "epoch": 1041} {"train_loss": -21.875751495361328, "global_step": 86450, "epoch": 1041} {"train_loss": -21.670730590820312, "global_step": 86451, "epoch": 1041} {"train_loss": -21.256481170654297, "global_step": 86452, "epoch": 1041} {"train_loss": -21.908241271972656, "global_step": 86453, "epoch": 1041} {"train_loss": -21.31459617614746, "global_step": 86454, "epoch": 1041} {"train_loss": -21.2283935546875, "global_step": 86455, "epoch": 1041} {"train_loss": -21.7357234954834, "global_step": 86456, "epoch": 1041} {"train_loss": -21.29629898071289, "global_step": 86457, "epoch": 1041} {"train_loss": -21.759180068969727, "global_step": 86458, "epoch": 1041} {"train_loss": -21.622806549072266, "global_step": 86459, "epoch": 1041} {"train_loss": -21.48819351196289, "global_step": 86460, "epoch": 1041} {"train_loss": -21.13527488708496, "global_step": 86461, "epoch": 1041} {"train_loss": -21.196762084960938, "global_step": 86462, "epoch": 1041} {"train_loss": -21.842687606811523, "global_step": 86463, "epoch": 1041} {"train_loss": -21.555377960205078, "global_step": 86464, "epoch": 1041} {"train_loss": -21.276430130004883, "global_step": 86465, "epoch": 1041} {"train_loss": -21.37548828125, "global_step": 86466, "epoch": 1041} {"train_loss": -21.308551788330078, "global_step": 86467, "epoch": 1041} {"train_loss": -21.61944580078125, "global_step": 86468, "epoch": 1041} {"train_loss": -21.279438018798828, "global_step": 86469, "epoch": 1041} {"train_loss": -21.13746452331543, "global_step": 86470, "epoch": 1041} {"train_loss": -21.490829467773438, "global_step": 86471, "epoch": 1041} {"train_loss": -21.405561447143555, "global_step": 86472, "epoch": 1041} {"train_loss": -20.908536911010742, "global_step": 86473, "epoch": 1041} {"train_loss": -21.321475982666016, "global_step": 86474, "epoch": 1041} {"train_loss": -21.15729331970215, "global_step": 86475, "epoch": 1041} {"train_loss": -21.447086334228516, "global_step": 86476, "epoch": 1041} {"train_loss": -20.960233688354492, "global_step": 86477, "epoch": 1041} {"train_loss": -21.36455726623535, "global_step": 86478, "epoch": 1041} {"train_loss": -21.19045066833496, "global_step": 86479, "epoch": 1041} {"train_loss": -21.290245056152344, "global_step": 86480, "epoch": 1041} {"train_loss": -21.232006072998047, "global_step": 86481, "epoch": 1041} {"train_loss": -21.221715927124023, "global_step": 86482, "epoch": 1041} {"train_loss": -20.99177360534668, "global_step": 86483, "epoch": 1041} {"train_loss": -21.59920883178711, "global_step": 86484, "epoch": 1041} {"train_loss": -21.333927591162993, "global_step": 86485, "epoch": 1041, "val_loss": 6038677.0} {"train_loss": -21.32937240600586, "global_step": 86486, "epoch": 1042} {"train_loss": -20.801572799682617, "global_step": 86487, "epoch": 1042} {"train_loss": -20.734920501708984, "global_step": 86488, "epoch": 1042} {"train_loss": -21.377140045166016, "global_step": 86489, "epoch": 1042} {"train_loss": -21.275850296020508, "global_step": 86490, "epoch": 1042} {"train_loss": -20.963998794555664, "global_step": 86491, "epoch": 1042} {"train_loss": -20.876073837280273, "global_step": 86492, "epoch": 1042} {"train_loss": -21.291629791259766, "global_step": 86493, "epoch": 1042} {"train_loss": -21.228126525878906, "global_step": 86494, "epoch": 1042} {"train_loss": -21.26220703125, "global_step": 86495, "epoch": 1042} {"train_loss": -21.490339279174805, "global_step": 86496, "epoch": 1042} {"train_loss": -21.285667419433594, "global_step": 86497, "epoch": 1042} {"train_loss": -21.42241668701172, "global_step": 86498, "epoch": 1042} {"train_loss": -21.333881378173828, "global_step": 86499, "epoch": 1042} {"train_loss": -21.45113754272461, "global_step": 86500, "epoch": 1042} {"train_loss": -21.09847068786621, "global_step": 86501, "epoch": 1042} {"train_loss": -21.529155731201172, "global_step": 86502, "epoch": 1042} {"train_loss": -21.788299560546875, "global_step": 86503, "epoch": 1042} {"train_loss": -21.618392944335938, "global_step": 86504, "epoch": 1042} {"train_loss": -21.34075164794922, "global_step": 86505, "epoch": 1042} {"train_loss": -21.418052673339844, "global_step": 86506, "epoch": 1042} {"train_loss": -21.82164764404297, "global_step": 86507, "epoch": 1042} {"train_loss": -21.73818588256836, "global_step": 86508, "epoch": 1042} {"train_loss": -21.675640106201172, "global_step": 86509, "epoch": 1042} {"train_loss": -21.35181999206543, "global_step": 86510, "epoch": 1042} {"train_loss": -21.582937240600586, "global_step": 86511, "epoch": 1042} {"train_loss": -21.700952529907227, "global_step": 86512, "epoch": 1042} {"train_loss": -21.223854064941406, "global_step": 86513, "epoch": 1042} {"train_loss": -21.319366455078125, "global_step": 86514, "epoch": 1042} {"train_loss": -21.68391990661621, "global_step": 86515, "epoch": 1042} {"train_loss": -20.812427520751953, "global_step": 86516, "epoch": 1042} {"train_loss": -21.478673934936523, "global_step": 86517, "epoch": 1042} {"train_loss": -21.73246955871582, "global_step": 86518, "epoch": 1042} {"train_loss": -21.163166046142578, "global_step": 86519, "epoch": 1042} {"train_loss": -21.76553726196289, "global_step": 86520, "epoch": 1042} {"train_loss": -21.362524032592773, "global_step": 86521, "epoch": 1042} {"train_loss": -21.620624542236328, "global_step": 86522, "epoch": 1042} {"train_loss": -21.0936336517334, "global_step": 86523, "epoch": 1042} {"train_loss": -21.20345115661621, "global_step": 86524, "epoch": 1042} {"train_loss": -21.499300003051758, "global_step": 86525, "epoch": 1042} {"train_loss": -21.253700256347656, "global_step": 86526, "epoch": 1042} {"train_loss": -21.521902084350586, "global_step": 86527, "epoch": 1042} {"train_loss": -21.470426559448242, "global_step": 86528, "epoch": 1042} {"train_loss": -21.405872344970703, "global_step": 86529, "epoch": 1042} {"train_loss": -21.658422470092773, "global_step": 86530, "epoch": 1042} {"train_loss": -21.51161766052246, "global_step": 86531, "epoch": 1042} {"train_loss": -21.650129318237305, "global_step": 86532, "epoch": 1042} {"train_loss": -21.589941024780273, "global_step": 86533, "epoch": 1042} {"train_loss": -21.613182067871094, "global_step": 86534, "epoch": 1042} {"train_loss": -21.2308292388916, "global_step": 86535, "epoch": 1042} {"train_loss": -21.728076934814453, "global_step": 86536, "epoch": 1042} {"train_loss": -21.38187599182129, "global_step": 86537, "epoch": 1042} {"train_loss": -21.625320434570312, "global_step": 86538, "epoch": 1042} {"train_loss": -21.34844398498535, "global_step": 86539, "epoch": 1042} {"train_loss": -21.48748207092285, "global_step": 86540, "epoch": 1042} {"train_loss": -21.508420944213867, "global_step": 86541, "epoch": 1042} {"train_loss": -21.76927375793457, "global_step": 86542, "epoch": 1042} {"train_loss": -21.1927490234375, "global_step": 86543, "epoch": 1042} {"train_loss": -21.71282196044922, "global_step": 86544, "epoch": 1042} {"train_loss": -21.303638458251953, "global_step": 86545, "epoch": 1042} {"train_loss": -21.381444931030273, "global_step": 86546, "epoch": 1042} {"train_loss": -21.556385040283203, "global_step": 86547, "epoch": 1042} {"train_loss": -21.625234603881836, "global_step": 86548, "epoch": 1042} {"train_loss": -21.719690322875977, "global_step": 86549, "epoch": 1042} {"train_loss": -21.39890480041504, "global_step": 86550, "epoch": 1042} {"train_loss": -21.0826416015625, "global_step": 86551, "epoch": 1042} {"train_loss": -21.530302047729492, "global_step": 86552, "epoch": 1042} {"train_loss": -21.235837936401367, "global_step": 86553, "epoch": 1042} {"train_loss": -21.647043228149414, "global_step": 86554, "epoch": 1042} {"train_loss": -21.525331497192383, "global_step": 86555, "epoch": 1042} {"train_loss": -21.687427520751953, "global_step": 86556, "epoch": 1042} {"train_loss": -21.57037925720215, "global_step": 86557, "epoch": 1042} {"train_loss": -21.65966796875, "global_step": 86558, "epoch": 1042} {"train_loss": -21.55802345275879, "global_step": 86559, "epoch": 1042} {"train_loss": -21.664384841918945, "global_step": 86560, "epoch": 1042} {"train_loss": -21.25761604309082, "global_step": 86561, "epoch": 1042} {"train_loss": -21.22983741760254, "global_step": 86562, "epoch": 1042} {"train_loss": -21.5458927154541, "global_step": 86563, "epoch": 1042} {"train_loss": -21.313095092773438, "global_step": 86564, "epoch": 1042} {"train_loss": -21.614707946777344, "global_step": 86565, "epoch": 1042} {"train_loss": -21.430269241333008, "global_step": 86566, "epoch": 1042} {"train_loss": -21.651243209838867, "global_step": 86567, "epoch": 1042} {"train_loss": -21.44631507597774, "global_step": 86568, "epoch": 1042, "val_loss": 5976980.0} {"train_loss": -20.293920516967773, "global_step": 86569, "epoch": 1043} {"train_loss": -20.373706817626953, "global_step": 86570, "epoch": 1043} {"train_loss": -21.00111198425293, "global_step": 86571, "epoch": 1043} {"train_loss": -20.961790084838867, "global_step": 86572, "epoch": 1043} {"train_loss": -20.981496810913086, "global_step": 86573, "epoch": 1043} {"train_loss": -21.180221557617188, "global_step": 86574, "epoch": 1043} {"train_loss": -21.307043075561523, "global_step": 86575, "epoch": 1043} {"train_loss": -20.775217056274414, "global_step": 86576, "epoch": 1043} {"train_loss": -20.964218139648438, "global_step": 86577, "epoch": 1043} {"train_loss": -21.101179122924805, "global_step": 86578, "epoch": 1043} {"train_loss": -21.252912521362305, "global_step": 86579, "epoch": 1043} {"train_loss": -21.375574111938477, "global_step": 86580, "epoch": 1043} {"train_loss": -20.982885360717773, "global_step": 86581, "epoch": 1043} {"train_loss": -21.43104362487793, "global_step": 86582, "epoch": 1043} {"train_loss": -20.95416831970215, "global_step": 86583, "epoch": 1043} {"train_loss": -21.130292892456055, "global_step": 86584, "epoch": 1043} {"train_loss": -20.95712661743164, "global_step": 86585, "epoch": 1043} {"train_loss": -21.217039108276367, "global_step": 86586, "epoch": 1043} {"train_loss": -21.408544540405273, "global_step": 86587, "epoch": 1043} {"train_loss": -21.457183837890625, "global_step": 86588, "epoch": 1043} {"train_loss": -21.04048728942871, "global_step": 86589, "epoch": 1043} {"train_loss": -21.28949546813965, "global_step": 86590, "epoch": 1043} {"train_loss": -21.50857925415039, "global_step": 86591, "epoch": 1043} {"train_loss": -21.183618545532227, "global_step": 86592, "epoch": 1043} {"train_loss": -21.381757736206055, "global_step": 86593, "epoch": 1043} {"train_loss": -21.506389617919922, "global_step": 86594, "epoch": 1043} {"train_loss": -21.434040069580078, "global_step": 86595, "epoch": 1043} {"train_loss": -21.36600112915039, "global_step": 86596, "epoch": 1043} {"train_loss": -21.83734703063965, "global_step": 86597, "epoch": 1043} {"train_loss": -21.4946346282959, "global_step": 86598, "epoch": 1043} {"train_loss": -21.49330711364746, "global_step": 86599, "epoch": 1043} {"train_loss": -21.70100975036621, "global_step": 86600, "epoch": 1043} {"train_loss": -21.58321762084961, "global_step": 86601, "epoch": 1043} {"train_loss": -21.63410758972168, "global_step": 86602, "epoch": 1043} {"train_loss": -21.48740005493164, "global_step": 86603, "epoch": 1043} {"train_loss": -21.310075759887695, "global_step": 86604, "epoch": 1043} {"train_loss": -21.854284286499023, "global_step": 86605, "epoch": 1043} {"train_loss": -21.583389282226562, "global_step": 86606, "epoch": 1043} {"train_loss": -21.600004196166992, "global_step": 86607, "epoch": 1043} {"train_loss": -21.47797203063965, "global_step": 86608, "epoch": 1043} {"train_loss": -21.783700942993164, "global_step": 86609, "epoch": 1043} {"train_loss": -21.466684341430664, "global_step": 86610, "epoch": 1043} {"train_loss": -21.603519439697266, "global_step": 86611, "epoch": 1043} {"train_loss": -21.44293212890625, "global_step": 86612, "epoch": 1043} {"train_loss": -21.4376277923584, "global_step": 86613, "epoch": 1043} {"train_loss": -21.163225173950195, "global_step": 86614, "epoch": 1043} {"train_loss": -21.27412223815918, "global_step": 86615, "epoch": 1043} {"train_loss": -20.87531852722168, "global_step": 86616, "epoch": 1043} {"train_loss": -21.66326332092285, "global_step": 86617, "epoch": 1043} {"train_loss": -21.247087478637695, "global_step": 86618, "epoch": 1043} {"train_loss": -21.749143600463867, "global_step": 86619, "epoch": 1043} {"train_loss": -21.528669357299805, "global_step": 86620, "epoch": 1043} {"train_loss": -21.705692291259766, "global_step": 86621, "epoch": 1043} {"train_loss": -21.57771873474121, "global_step": 86622, "epoch": 1043} {"train_loss": -21.661605834960938, "global_step": 86623, "epoch": 1043} {"train_loss": -21.554182052612305, "global_step": 86624, "epoch": 1043} {"train_loss": -21.443037033081055, "global_step": 86625, "epoch": 1043} {"train_loss": -21.688169479370117, "global_step": 86626, "epoch": 1043} {"train_loss": -21.802631378173828, "global_step": 86627, "epoch": 1043} {"train_loss": -21.702594757080078, "global_step": 86628, "epoch": 1043} {"train_loss": -21.308732986450195, "global_step": 86629, "epoch": 1043} {"train_loss": -21.636621475219727, "global_step": 86630, "epoch": 1043} {"train_loss": -21.343687057495117, "global_step": 86631, "epoch": 1043} {"train_loss": -21.6243839263916, "global_step": 86632, "epoch": 1043} {"train_loss": -21.644351959228516, "global_step": 86633, "epoch": 1043} {"train_loss": -21.67951774597168, "global_step": 86634, "epoch": 1043} {"train_loss": -21.68899154663086, "global_step": 86635, "epoch": 1043} {"train_loss": -21.643381118774414, "global_step": 86636, "epoch": 1043} {"train_loss": -21.795320510864258, "global_step": 86637, "epoch": 1043} {"train_loss": -21.30607032775879, "global_step": 86638, "epoch": 1043} {"train_loss": -21.308698654174805, "global_step": 86639, "epoch": 1043} {"train_loss": -21.676406860351562, "global_step": 86640, "epoch": 1043} {"train_loss": -21.295452117919922, "global_step": 86641, "epoch": 1043} {"train_loss": -21.32107925415039, "global_step": 86642, "epoch": 1043} {"train_loss": -21.636268615722656, "global_step": 86643, "epoch": 1043} {"train_loss": -21.44317626953125, "global_step": 86644, "epoch": 1043} {"train_loss": -21.18771743774414, "global_step": 86645, "epoch": 1043} {"train_loss": -21.378095626831055, "global_step": 86646, "epoch": 1043} {"train_loss": -21.622371673583984, "global_step": 86647, "epoch": 1043} {"train_loss": -21.655513763427734, "global_step": 86648, "epoch": 1043} {"train_loss": -21.383268356323242, "global_step": 86649, "epoch": 1043} {"train_loss": -21.465259552001953, "global_step": 86650, "epoch": 1043} {"train_loss": -21.396831857152733, "global_step": 86651, "epoch": 1043, "val_loss": 6104202.5} {"train_loss": -21.432249069213867, "global_step": 86652, "epoch": 1044} {"train_loss": -21.750656127929688, "global_step": 86653, "epoch": 1044} {"train_loss": -21.613861083984375, "global_step": 86654, "epoch": 1044} {"train_loss": -21.54734230041504, "global_step": 86655, "epoch": 1044} {"train_loss": -21.1502742767334, "global_step": 86656, "epoch": 1044} {"train_loss": -21.297245025634766, "global_step": 86657, "epoch": 1044} {"train_loss": -21.311803817749023, "global_step": 86658, "epoch": 1044} {"train_loss": -21.474720001220703, "global_step": 86659, "epoch": 1044} {"train_loss": -21.10085678100586, "global_step": 86660, "epoch": 1044} {"train_loss": -21.459400177001953, "global_step": 86661, "epoch": 1044} {"train_loss": -21.51381492614746, "global_step": 86662, "epoch": 1044} {"train_loss": -21.112401962280273, "global_step": 86663, "epoch": 1044} {"train_loss": -21.61948585510254, "global_step": 86664, "epoch": 1044} {"train_loss": -21.334848403930664, "global_step": 86665, "epoch": 1044} {"train_loss": -21.444787979125977, "global_step": 86666, "epoch": 1044} {"train_loss": -21.364397048950195, "global_step": 86667, "epoch": 1044} {"train_loss": -21.50636863708496, "global_step": 86668, "epoch": 1044} {"train_loss": -21.35906982421875, "global_step": 86669, "epoch": 1044} {"train_loss": -21.278213500976562, "global_step": 86670, "epoch": 1044} {"train_loss": -21.626890182495117, "global_step": 86671, "epoch": 1044} {"train_loss": -21.18268394470215, "global_step": 86672, "epoch": 1044} {"train_loss": -21.61628532409668, "global_step": 86673, "epoch": 1044} {"train_loss": -21.226917266845703, "global_step": 86674, "epoch": 1044} {"train_loss": -21.340564727783203, "global_step": 86675, "epoch": 1044} {"train_loss": -21.564346313476562, "global_step": 86676, "epoch": 1044} {"train_loss": -20.997045516967773, "global_step": 86677, "epoch": 1044} {"train_loss": -21.299318313598633, "global_step": 86678, "epoch": 1044} {"train_loss": -21.91242218017578, "global_step": 86679, "epoch": 1044} {"train_loss": -21.408119201660156, "global_step": 86680, "epoch": 1044} {"train_loss": -21.602964401245117, "global_step": 86681, "epoch": 1044} {"train_loss": -21.36115837097168, "global_step": 86682, "epoch": 1044} {"train_loss": -21.285062789916992, "global_step": 86683, "epoch": 1044} {"train_loss": -21.6254825592041, "global_step": 86684, "epoch": 1044} {"train_loss": -21.34405517578125, "global_step": 86685, "epoch": 1044} {"train_loss": -21.117130279541016, "global_step": 86686, "epoch": 1044} {"train_loss": -21.453718185424805, "global_step": 86687, "epoch": 1044} {"train_loss": -21.488168716430664, "global_step": 86688, "epoch": 1044} {"train_loss": -21.168893814086914, "global_step": 86689, "epoch": 1044} {"train_loss": -21.58042335510254, "global_step": 86690, "epoch": 1044} {"train_loss": -21.53359031677246, "global_step": 86691, "epoch": 1044} {"train_loss": -21.764957427978516, "global_step": 86692, "epoch": 1044} {"train_loss": -21.152544021606445, "global_step": 86693, "epoch": 1044} {"train_loss": -21.50141716003418, "global_step": 86694, "epoch": 1044} {"train_loss": -21.785947799682617, "global_step": 86695, "epoch": 1044} {"train_loss": -21.473546981811523, "global_step": 86696, "epoch": 1044} {"train_loss": -21.674283981323242, "global_step": 86697, "epoch": 1044} {"train_loss": -21.63059425354004, "global_step": 86698, "epoch": 1044} {"train_loss": -21.483335494995117, "global_step": 86699, "epoch": 1044} {"train_loss": -21.323657989501953, "global_step": 86700, "epoch": 1044} {"train_loss": -21.68903350830078, "global_step": 86701, "epoch": 1044} {"train_loss": -21.508399963378906, "global_step": 86702, "epoch": 1044} {"train_loss": -21.612810134887695, "global_step": 86703, "epoch": 1044} {"train_loss": -21.173086166381836, "global_step": 86704, "epoch": 1044} {"train_loss": -21.69813346862793, "global_step": 86705, "epoch": 1044} {"train_loss": -21.444067001342773, "global_step": 86706, "epoch": 1044} {"train_loss": -21.09132194519043, "global_step": 86707, "epoch": 1044} {"train_loss": -21.45369529724121, "global_step": 86708, "epoch": 1044} {"train_loss": -21.37354850769043, "global_step": 86709, "epoch": 1044} {"train_loss": -21.39959144592285, "global_step": 86710, "epoch": 1044} {"train_loss": -21.199399948120117, "global_step": 86711, "epoch": 1044} {"train_loss": -21.589536666870117, "global_step": 86712, "epoch": 1044} {"train_loss": -21.366140365600586, "global_step": 86713, "epoch": 1044} {"train_loss": -21.551366806030273, "global_step": 86714, "epoch": 1044} {"train_loss": -21.329954147338867, "global_step": 86715, "epoch": 1044} {"train_loss": -21.329296112060547, "global_step": 86716, "epoch": 1044} {"train_loss": -21.175626754760742, "global_step": 86717, "epoch": 1044} {"train_loss": -21.59857749938965, "global_step": 86718, "epoch": 1044} {"train_loss": -21.2982234954834, "global_step": 86719, "epoch": 1044} {"train_loss": -21.692827224731445, "global_step": 86720, "epoch": 1044} {"train_loss": -21.496173858642578, "global_step": 86721, "epoch": 1044} {"train_loss": -21.193466186523438, "global_step": 86722, "epoch": 1044} {"train_loss": -21.594282150268555, "global_step": 86723, "epoch": 1044} {"train_loss": -21.722946166992188, "global_step": 86724, "epoch": 1044} {"train_loss": -21.678314208984375, "global_step": 86725, "epoch": 1044} {"train_loss": -21.732236862182617, "global_step": 86726, "epoch": 1044} {"train_loss": -21.313919067382812, "global_step": 86727, "epoch": 1044} {"train_loss": -21.27931785583496, "global_step": 86728, "epoch": 1044} {"train_loss": -21.468616485595703, "global_step": 86729, "epoch": 1044} {"train_loss": -21.40376853942871, "global_step": 86730, "epoch": 1044} {"train_loss": -21.23672866821289, "global_step": 86731, "epoch": 1044} {"train_loss": -21.58551025390625, "global_step": 86732, "epoch": 1044} {"train_loss": -21.358091354370117, "global_step": 86733, "epoch": 1044} {"train_loss": -21.425120709890344, "global_step": 86734, "epoch": 1044, "val_loss": 6146625.5} {"train_loss": -21.725116729736328, "global_step": 86735, "epoch": 1045} {"train_loss": -21.409921646118164, "global_step": 86736, "epoch": 1045} {"train_loss": -21.20132827758789, "global_step": 86737, "epoch": 1045} {"train_loss": -21.376773834228516, "global_step": 86738, "epoch": 1045} {"train_loss": -21.654455184936523, "global_step": 86739, "epoch": 1045} {"train_loss": -21.309310913085938, "global_step": 86740, "epoch": 1045} {"train_loss": -21.322439193725586, "global_step": 86741, "epoch": 1045} {"train_loss": -21.335113525390625, "global_step": 86742, "epoch": 1045} {"train_loss": -21.334712982177734, "global_step": 86743, "epoch": 1045} {"train_loss": -21.264089584350586, "global_step": 86744, "epoch": 1045} {"train_loss": -20.97026252746582, "global_step": 86745, "epoch": 1045} {"train_loss": -21.57819175720215, "global_step": 86746, "epoch": 1045} {"train_loss": -21.623491287231445, "global_step": 86747, "epoch": 1045} {"train_loss": -21.566953659057617, "global_step": 86748, "epoch": 1045} {"train_loss": -21.349916458129883, "global_step": 86749, "epoch": 1045} {"train_loss": -21.48666763305664, "global_step": 86750, "epoch": 1045} {"train_loss": -21.49903678894043, "global_step": 86751, "epoch": 1045} {"train_loss": -20.916961669921875, "global_step": 86752, "epoch": 1045} {"train_loss": -21.412403106689453, "global_step": 86753, "epoch": 1045} {"train_loss": -21.607328414916992, "global_step": 86754, "epoch": 1045} {"train_loss": -21.091812133789062, "global_step": 86755, "epoch": 1045} {"train_loss": -21.593809127807617, "global_step": 86756, "epoch": 1045} {"train_loss": -21.481637954711914, "global_step": 86757, "epoch": 1045} {"train_loss": -21.048160552978516, "global_step": 86758, "epoch": 1045} {"train_loss": -21.748098373413086, "global_step": 86759, "epoch": 1045} {"train_loss": -21.212343215942383, "global_step": 86760, "epoch": 1045} {"train_loss": -21.573163986206055, "global_step": 86761, "epoch": 1045} {"train_loss": -21.3992919921875, "global_step": 86762, "epoch": 1045} {"train_loss": -21.47877311706543, "global_step": 86763, "epoch": 1045} {"train_loss": -21.444242477416992, "global_step": 86764, "epoch": 1045} {"train_loss": -21.38791275024414, "global_step": 86765, "epoch": 1045} {"train_loss": -21.096355438232422, "global_step": 86766, "epoch": 1045} {"train_loss": -21.427953720092773, "global_step": 86767, "epoch": 1045} {"train_loss": -21.577152252197266, "global_step": 86768, "epoch": 1045} {"train_loss": -21.71481704711914, "global_step": 86769, "epoch": 1045} {"train_loss": -21.40170669555664, "global_step": 86770, "epoch": 1045} {"train_loss": -21.56682586669922, "global_step": 86771, "epoch": 1045} {"train_loss": -21.869285583496094, "global_step": 86772, "epoch": 1045} {"train_loss": -21.294973373413086, "global_step": 86773, "epoch": 1045} {"train_loss": -21.53584861755371, "global_step": 86774, "epoch": 1045} {"train_loss": -21.47652244567871, "global_step": 86775, "epoch": 1045} {"train_loss": -21.64204978942871, "global_step": 86776, "epoch": 1045} {"train_loss": -21.62824058532715, "global_step": 86777, "epoch": 1045} {"train_loss": -21.244482040405273, "global_step": 86778, "epoch": 1045} {"train_loss": -21.324804306030273, "global_step": 86779, "epoch": 1045} {"train_loss": -21.303024291992188, "global_step": 86780, "epoch": 1045} {"train_loss": -21.724369049072266, "global_step": 86781, "epoch": 1045} {"train_loss": -21.792377471923828, "global_step": 86782, "epoch": 1045} {"train_loss": -21.320798873901367, "global_step": 86783, "epoch": 1045} {"train_loss": -21.636381149291992, "global_step": 86784, "epoch": 1045} {"train_loss": -21.751388549804688, "global_step": 86785, "epoch": 1045} {"train_loss": -21.391355514526367, "global_step": 86786, "epoch": 1045} {"train_loss": -21.28193473815918, "global_step": 86787, "epoch": 1045} {"train_loss": -21.402862548828125, "global_step": 86788, "epoch": 1045} {"train_loss": -21.162860870361328, "global_step": 86789, "epoch": 1045} {"train_loss": -21.601041793823242, "global_step": 86790, "epoch": 1045} {"train_loss": -21.528348922729492, "global_step": 86791, "epoch": 1045} {"train_loss": -21.38811683654785, "global_step": 86792, "epoch": 1045} {"train_loss": -21.38356590270996, "global_step": 86793, "epoch": 1045} {"train_loss": -21.412839889526367, "global_step": 86794, "epoch": 1045} {"train_loss": -21.54160499572754, "global_step": 86795, "epoch": 1045} {"train_loss": -21.842832565307617, "global_step": 86796, "epoch": 1045} {"train_loss": -21.261524200439453, "global_step": 86797, "epoch": 1045} {"train_loss": -21.563251495361328, "global_step": 86798, "epoch": 1045} {"train_loss": -21.282499313354492, "global_step": 86799, "epoch": 1045} {"train_loss": -21.587732315063477, "global_step": 86800, "epoch": 1045} {"train_loss": -21.177387237548828, "global_step": 86801, "epoch": 1045} {"train_loss": -21.488794326782227, "global_step": 86802, "epoch": 1045} {"train_loss": -21.200042724609375, "global_step": 86803, "epoch": 1045} {"train_loss": -21.353885650634766, "global_step": 86804, "epoch": 1045} {"train_loss": -21.482851028442383, "global_step": 86805, "epoch": 1045} {"train_loss": -21.62660026550293, "global_step": 86806, "epoch": 1045} {"train_loss": -21.548324584960938, "global_step": 86807, "epoch": 1045} {"train_loss": -21.535175323486328, "global_step": 86808, "epoch": 1045} {"train_loss": -21.41213035583496, "global_step": 86809, "epoch": 1045} {"train_loss": -21.828845977783203, "global_step": 86810, "epoch": 1045} {"train_loss": -21.670045852661133, "global_step": 86811, "epoch": 1045} {"train_loss": -21.389915466308594, "global_step": 86812, "epoch": 1045} {"train_loss": -21.285024642944336, "global_step": 86813, "epoch": 1045} {"train_loss": -21.49835205078125, "global_step": 86814, "epoch": 1045} {"train_loss": -21.847187042236328, "global_step": 86815, "epoch": 1045} {"train_loss": -21.71400260925293, "global_step": 86816, "epoch": 1045} {"train_loss": -21.480631678937428, "global_step": 86817, "epoch": 1045, "val_loss": 6315849.0} {"train_loss": -20.490264892578125, "global_step": 86818, "epoch": 1046} {"train_loss": -20.31393814086914, "global_step": 86819, "epoch": 1046} {"train_loss": -21.075010299682617, "global_step": 86820, "epoch": 1046} {"train_loss": -20.5516300201416, "global_step": 86821, "epoch": 1046} {"train_loss": -20.97665786743164, "global_step": 86822, "epoch": 1046} {"train_loss": -21.121973037719727, "global_step": 86823, "epoch": 1046} {"train_loss": -21.08420753479004, "global_step": 86824, "epoch": 1046} {"train_loss": -20.94135856628418, "global_step": 86825, "epoch": 1046} {"train_loss": -20.92061424255371, "global_step": 86826, "epoch": 1046} {"train_loss": -21.351377487182617, "global_step": 86827, "epoch": 1046} {"train_loss": -20.66109275817871, "global_step": 86828, "epoch": 1046} {"train_loss": -21.412099838256836, "global_step": 86829, "epoch": 1046} {"train_loss": -21.444252014160156, "global_step": 86830, "epoch": 1046} {"train_loss": -21.073789596557617, "global_step": 86831, "epoch": 1046} {"train_loss": -21.180173873901367, "global_step": 86832, "epoch": 1046} {"train_loss": -21.449054718017578, "global_step": 86833, "epoch": 1046} {"train_loss": -21.326265335083008, "global_step": 86834, "epoch": 1046} {"train_loss": -21.379484176635742, "global_step": 86835, "epoch": 1046} {"train_loss": -21.054609298706055, "global_step": 86836, "epoch": 1046} {"train_loss": -21.67566680908203, "global_step": 86837, "epoch": 1046} {"train_loss": -21.219364166259766, "global_step": 86838, "epoch": 1046} {"train_loss": -21.276052474975586, "global_step": 86839, "epoch": 1046} {"train_loss": -21.036664962768555, "global_step": 86840, "epoch": 1046} {"train_loss": -21.576261520385742, "global_step": 86841, "epoch": 1046} {"train_loss": -21.622848510742188, "global_step": 86842, "epoch": 1046} {"train_loss": -21.345657348632812, "global_step": 86843, "epoch": 1046} {"train_loss": -21.134525299072266, "global_step": 86844, "epoch": 1046} {"train_loss": -21.228179931640625, "global_step": 86845, "epoch": 1046} {"train_loss": -21.04041862487793, "global_step": 86846, "epoch": 1046} {"train_loss": -21.233976364135742, "global_step": 86847, "epoch": 1046} {"train_loss": -21.24627685546875, "global_step": 86848, "epoch": 1046} {"train_loss": -21.471220016479492, "global_step": 86849, "epoch": 1046} {"train_loss": -21.75824546813965, "global_step": 86850, "epoch": 1046} {"train_loss": -21.349544525146484, "global_step": 86851, "epoch": 1046} {"train_loss": -21.302682876586914, "global_step": 86852, "epoch": 1046} {"train_loss": -21.462615966796875, "global_step": 86853, "epoch": 1046} {"train_loss": -21.553091049194336, "global_step": 86854, "epoch": 1046} {"train_loss": -21.70818328857422, "global_step": 86855, "epoch": 1046} {"train_loss": -21.31555938720703, "global_step": 86856, "epoch": 1046} {"train_loss": -21.712806701660156, "global_step": 86857, "epoch": 1046} {"train_loss": -21.50360679626465, "global_step": 86858, "epoch": 1046} {"train_loss": -21.195642471313477, "global_step": 86859, "epoch": 1046} {"train_loss": -21.48306655883789, "global_step": 86860, "epoch": 1046} {"train_loss": -21.528671264648438, "global_step": 86861, "epoch": 1046} {"train_loss": -21.651538848876953, "global_step": 86862, "epoch": 1046} {"train_loss": -21.670337677001953, "global_step": 86863, "epoch": 1046} {"train_loss": -21.714248657226562, "global_step": 86864, "epoch": 1046} {"train_loss": -21.490747451782227, "global_step": 86865, "epoch": 1046} {"train_loss": -21.4705810546875, "global_step": 86866, "epoch": 1046} {"train_loss": -21.184011459350586, "global_step": 86867, "epoch": 1046} {"train_loss": -21.5132999420166, "global_step": 86868, "epoch": 1046} {"train_loss": -21.399038314819336, "global_step": 86869, "epoch": 1046} {"train_loss": -21.541269302368164, "global_step": 86870, "epoch": 1046} {"train_loss": -21.577640533447266, "global_step": 86871, "epoch": 1046} {"train_loss": -21.415555953979492, "global_step": 86872, "epoch": 1046} {"train_loss": -21.437711715698242, "global_step": 86873, "epoch": 1046} {"train_loss": -21.592260360717773, "global_step": 86874, "epoch": 1046} {"train_loss": -21.59358024597168, "global_step": 86875, "epoch": 1046} {"train_loss": -21.47021484375, "global_step": 86876, "epoch": 1046} {"train_loss": -21.480972290039062, "global_step": 86877, "epoch": 1046} {"train_loss": -21.400745391845703, "global_step": 86878, "epoch": 1046} {"train_loss": -21.1876220703125, "global_step": 86879, "epoch": 1046} {"train_loss": -21.218191146850586, "global_step": 86880, "epoch": 1046} {"train_loss": -21.546987533569336, "global_step": 86881, "epoch": 1046} {"train_loss": -21.391958236694336, "global_step": 86882, "epoch": 1046} {"train_loss": -21.318588256835938, "global_step": 86883, "epoch": 1046} {"train_loss": -21.120328903198242, "global_step": 86884, "epoch": 1046} {"train_loss": -21.557157516479492, "global_step": 86885, "epoch": 1046} {"train_loss": -21.459623336791992, "global_step": 86886, "epoch": 1046} {"train_loss": -21.25869369506836, "global_step": 86887, "epoch": 1046} {"train_loss": -21.337905883789062, "global_step": 86888, "epoch": 1046} {"train_loss": -21.50269889831543, "global_step": 86889, "epoch": 1046} {"train_loss": -21.7110595703125, "global_step": 86890, "epoch": 1046} {"train_loss": -21.33809471130371, "global_step": 86891, "epoch": 1046} {"train_loss": -21.721555709838867, "global_step": 86892, "epoch": 1046} {"train_loss": -21.530132293701172, "global_step": 86893, "epoch": 1046} {"train_loss": -21.40825080871582, "global_step": 86894, "epoch": 1046} {"train_loss": -21.712291717529297, "global_step": 86895, "epoch": 1046} {"train_loss": -21.1051025390625, "global_step": 86896, "epoch": 1046} {"train_loss": -21.609405517578125, "global_step": 86897, "epoch": 1046} {"train_loss": -21.335317611694336, "global_step": 86898, "epoch": 1046} {"train_loss": -21.172500610351562, "global_step": 86899, "epoch": 1046} {"train_loss": -21.352006475609468, "global_step": 86900, "epoch": 1046, "val_loss": 6114595.5} {"train_loss": -20.735151290893555, "global_step": 86901, "epoch": 1047} {"train_loss": -21.239246368408203, "global_step": 86902, "epoch": 1047} {"train_loss": -21.29828453063965, "global_step": 86903, "epoch": 1047} {"train_loss": -21.38004493713379, "global_step": 86904, "epoch": 1047} {"train_loss": -20.696237564086914, "global_step": 86905, "epoch": 1047} {"train_loss": -21.1106014251709, "global_step": 86906, "epoch": 1047} {"train_loss": -21.05620765686035, "global_step": 86907, "epoch": 1047} {"train_loss": -21.069852828979492, "global_step": 86908, "epoch": 1047} {"train_loss": -21.24653434753418, "global_step": 86909, "epoch": 1047} {"train_loss": -21.105812072753906, "global_step": 86910, "epoch": 1047} {"train_loss": -21.4560604095459, "global_step": 86911, "epoch": 1047} {"train_loss": -21.224994659423828, "global_step": 86912, "epoch": 1047} {"train_loss": -21.373212814331055, "global_step": 86913, "epoch": 1047} {"train_loss": -21.1047420501709, "global_step": 86914, "epoch": 1047} {"train_loss": -21.42423439025879, "global_step": 86915, "epoch": 1047} {"train_loss": -21.249034881591797, "global_step": 86916, "epoch": 1047} {"train_loss": -21.433917999267578, "global_step": 86917, "epoch": 1047} {"train_loss": -21.341922760009766, "global_step": 86918, "epoch": 1047} {"train_loss": -21.59323501586914, "global_step": 86919, "epoch": 1047} {"train_loss": -21.188501358032227, "global_step": 86920, "epoch": 1047} {"train_loss": -21.942808151245117, "global_step": 86921, "epoch": 1047} {"train_loss": -21.4605655670166, "global_step": 86922, "epoch": 1047} {"train_loss": -21.41315460205078, "global_step": 86923, "epoch": 1047} {"train_loss": -21.49541664123535, "global_step": 86924, "epoch": 1047} {"train_loss": -21.115018844604492, "global_step": 86925, "epoch": 1047} {"train_loss": -21.40479850769043, "global_step": 86926, "epoch": 1047} {"train_loss": -21.510141372680664, "global_step": 86927, "epoch": 1047} {"train_loss": -21.462684631347656, "global_step": 86928, "epoch": 1047} {"train_loss": -21.353252410888672, "global_step": 86929, "epoch": 1047} {"train_loss": -21.658294677734375, "global_step": 86930, "epoch": 1047} {"train_loss": -21.647138595581055, "global_step": 86931, "epoch": 1047} {"train_loss": -21.488088607788086, "global_step": 86932, "epoch": 1047} {"train_loss": -21.071914672851562, "global_step": 86933, "epoch": 1047} {"train_loss": -21.186954498291016, "global_step": 86934, "epoch": 1047} {"train_loss": -21.370121002197266, "global_step": 86935, "epoch": 1047} {"train_loss": -21.770421981811523, "global_step": 86936, "epoch": 1047} {"train_loss": -21.40437889099121, "global_step": 86937, "epoch": 1047} {"train_loss": -21.655109405517578, "global_step": 86938, "epoch": 1047} {"train_loss": -21.55010414123535, "global_step": 86939, "epoch": 1047} {"train_loss": -21.604366302490234, "global_step": 86940, "epoch": 1047} {"train_loss": -21.359092712402344, "global_step": 86941, "epoch": 1047} {"train_loss": -21.72500991821289, "global_step": 86942, "epoch": 1047} {"train_loss": -21.399328231811523, "global_step": 86943, "epoch": 1047} {"train_loss": -21.385717391967773, "global_step": 86944, "epoch": 1047} {"train_loss": -21.948455810546875, "global_step": 86945, "epoch": 1047} {"train_loss": -21.88443374633789, "global_step": 86946, "epoch": 1047} {"train_loss": -21.53907585144043, "global_step": 86947, "epoch": 1047} {"train_loss": -21.47560691833496, "global_step": 86948, "epoch": 1047} {"train_loss": -21.564701080322266, "global_step": 86949, "epoch": 1047} {"train_loss": -21.41046905517578, "global_step": 86950, "epoch": 1047} {"train_loss": -21.35358238220215, "global_step": 86951, "epoch": 1047} {"train_loss": -21.824186325073242, "global_step": 86952, "epoch": 1047} {"train_loss": -21.3460693359375, "global_step": 86953, "epoch": 1047} {"train_loss": -21.73516273498535, "global_step": 86954, "epoch": 1047} {"train_loss": -21.3420467376709, "global_step": 86955, "epoch": 1047} {"train_loss": -21.57071304321289, "global_step": 86956, "epoch": 1047} {"train_loss": -21.27665138244629, "global_step": 86957, "epoch": 1047} {"train_loss": -21.55486488342285, "global_step": 86958, "epoch": 1047} {"train_loss": -21.19521141052246, "global_step": 86959, "epoch": 1047} {"train_loss": -21.5745906829834, "global_step": 86960, "epoch": 1047} {"train_loss": -21.596153259277344, "global_step": 86961, "epoch": 1047} {"train_loss": -21.56167984008789, "global_step": 86962, "epoch": 1047} {"train_loss": -21.85184669494629, "global_step": 86963, "epoch": 1047} {"train_loss": -21.51963233947754, "global_step": 86964, "epoch": 1047} {"train_loss": -21.573883056640625, "global_step": 86965, "epoch": 1047} {"train_loss": -21.50246238708496, "global_step": 86966, "epoch": 1047} {"train_loss": -21.927167892456055, "global_step": 86967, "epoch": 1047} {"train_loss": -21.561315536499023, "global_step": 86968, "epoch": 1047} {"train_loss": -21.62969398498535, "global_step": 86969, "epoch": 1047} {"train_loss": -21.331586837768555, "global_step": 86970, "epoch": 1047} {"train_loss": -21.050888061523438, "global_step": 86971, "epoch": 1047} {"train_loss": -21.852785110473633, "global_step": 86972, "epoch": 1047} {"train_loss": -21.515026092529297, "global_step": 86973, "epoch": 1047} {"train_loss": -21.36321449279785, "global_step": 86974, "epoch": 1047} {"train_loss": -21.313793182373047, "global_step": 86975, "epoch": 1047} {"train_loss": -21.24375343322754, "global_step": 86976, "epoch": 1047} {"train_loss": -21.430212020874023, "global_step": 86977, "epoch": 1047} {"train_loss": -21.547744750976562, "global_step": 86978, "epoch": 1047} {"train_loss": -21.49410629272461, "global_step": 86979, "epoch": 1047} {"train_loss": -21.37332534790039, "global_step": 86980, "epoch": 1047} {"train_loss": -21.131423950195312, "global_step": 86981, "epoch": 1047} {"train_loss": -21.479124069213867, "global_step": 86982, "epoch": 1047} {"train_loss": -21.447730834225574, "global_step": 86983, "epoch": 1047, "val_loss": 6198044.5} {"train_loss": -21.089263916015625, "global_step": 86984, "epoch": 1048} {"train_loss": -21.352365493774414, "global_step": 86985, "epoch": 1048} {"train_loss": -21.265552520751953, "global_step": 86986, "epoch": 1048} {"train_loss": -21.48249626159668, "global_step": 86987, "epoch": 1048} {"train_loss": -21.169775009155273, "global_step": 86988, "epoch": 1048} {"train_loss": -21.59208869934082, "global_step": 86989, "epoch": 1048} {"train_loss": -20.982654571533203, "global_step": 86990, "epoch": 1048} {"train_loss": -20.875442504882812, "global_step": 86991, "epoch": 1048} {"train_loss": -21.209814071655273, "global_step": 86992, "epoch": 1048} {"train_loss": -21.455686569213867, "global_step": 86993, "epoch": 1048} {"train_loss": -21.379497528076172, "global_step": 86994, "epoch": 1048} {"train_loss": -21.28684425354004, "global_step": 86995, "epoch": 1048} {"train_loss": -21.28688621520996, "global_step": 86996, "epoch": 1048} {"train_loss": -21.721403121948242, "global_step": 86997, "epoch": 1048} {"train_loss": -21.52410888671875, "global_step": 86998, "epoch": 1048} {"train_loss": -21.476606369018555, "global_step": 86999, "epoch": 1048} {"train_loss": -21.22422218322754, "global_step": 87000, "epoch": 1048} {"train_loss": -21.718963623046875, "global_step": 87001, "epoch": 1048} {"train_loss": -21.36365509033203, "global_step": 87002, "epoch": 1048} {"train_loss": -21.18175506591797, "global_step": 87003, "epoch": 1048} {"train_loss": -21.68402862548828, "global_step": 87004, "epoch": 1048} {"train_loss": -21.380475997924805, "global_step": 87005, "epoch": 1048} {"train_loss": -21.502334594726562, "global_step": 87006, "epoch": 1048} {"train_loss": -21.338571548461914, "global_step": 87007, "epoch": 1048} {"train_loss": -21.426239013671875, "global_step": 87008, "epoch": 1048} {"train_loss": -21.560802459716797, "global_step": 87009, "epoch": 1048} {"train_loss": -21.579519271850586, "global_step": 87010, "epoch": 1048} {"train_loss": -21.44759178161621, "global_step": 87011, "epoch": 1048} {"train_loss": -21.39794921875, "global_step": 87012, "epoch": 1048} {"train_loss": -21.380178451538086, "global_step": 87013, "epoch": 1048} {"train_loss": -21.705907821655273, "global_step": 87014, "epoch": 1048} {"train_loss": -21.541521072387695, "global_step": 87015, "epoch": 1048} {"train_loss": -21.521728515625, "global_step": 87016, "epoch": 1048} {"train_loss": -21.420400619506836, "global_step": 87017, "epoch": 1048} {"train_loss": -21.42828941345215, "global_step": 87018, "epoch": 1048} {"train_loss": -21.63117027282715, "global_step": 87019, "epoch": 1048} {"train_loss": -21.3867130279541, "global_step": 87020, "epoch": 1048} {"train_loss": -21.11897087097168, "global_step": 87021, "epoch": 1048} {"train_loss": -21.69110870361328, "global_step": 87022, "epoch": 1048} {"train_loss": -21.389751434326172, "global_step": 87023, "epoch": 1048} {"train_loss": -22.000194549560547, "global_step": 87024, "epoch": 1048} {"train_loss": -21.32147216796875, "global_step": 87025, "epoch": 1048} {"train_loss": -21.625577926635742, "global_step": 87026, "epoch": 1048} {"train_loss": -21.21120262145996, "global_step": 87027, "epoch": 1048} {"train_loss": -21.222402572631836, "global_step": 87028, "epoch": 1048} {"train_loss": -21.30811882019043, "global_step": 87029, "epoch": 1048} {"train_loss": -21.07880210876465, "global_step": 87030, "epoch": 1048} {"train_loss": -21.522241592407227, "global_step": 87031, "epoch": 1048} {"train_loss": -21.44891357421875, "global_step": 87032, "epoch": 1048} {"train_loss": -21.472455978393555, "global_step": 87033, "epoch": 1048} {"train_loss": -21.712873458862305, "global_step": 87034, "epoch": 1048} {"train_loss": -21.48702049255371, "global_step": 87035, "epoch": 1048} {"train_loss": -21.50676727294922, "global_step": 87036, "epoch": 1048} {"train_loss": -21.755441665649414, "global_step": 87037, "epoch": 1048} {"train_loss": -21.749021530151367, "global_step": 87038, "epoch": 1048} {"train_loss": -21.365964889526367, "global_step": 87039, "epoch": 1048} {"train_loss": -21.410245895385742, "global_step": 87040, "epoch": 1048} {"train_loss": -21.523693084716797, "global_step": 87041, "epoch": 1048} {"train_loss": -21.646596908569336, "global_step": 87042, "epoch": 1048} {"train_loss": -21.339162826538086, "global_step": 87043, "epoch": 1048} {"train_loss": -21.418107986450195, "global_step": 87044, "epoch": 1048} {"train_loss": -21.592023849487305, "global_step": 87045, "epoch": 1048} {"train_loss": -21.329248428344727, "global_step": 87046, "epoch": 1048} {"train_loss": -21.363168716430664, "global_step": 87047, "epoch": 1048} {"train_loss": -21.5977840423584, "global_step": 87048, "epoch": 1048} {"train_loss": -20.98809242248535, "global_step": 87049, "epoch": 1048} {"train_loss": -21.360212326049805, "global_step": 87050, "epoch": 1048} {"train_loss": -21.75172233581543, "global_step": 87051, "epoch": 1048} {"train_loss": -21.376863479614258, "global_step": 87052, "epoch": 1048} {"train_loss": -21.26807975769043, "global_step": 87053, "epoch": 1048} {"train_loss": -21.45095443725586, "global_step": 87054, "epoch": 1048} {"train_loss": -21.492795944213867, "global_step": 87055, "epoch": 1048} {"train_loss": -21.410062789916992, "global_step": 87056, "epoch": 1048} {"train_loss": -21.716747283935547, "global_step": 87057, "epoch": 1048} {"train_loss": -21.724430084228516, "global_step": 87058, "epoch": 1048} {"train_loss": -21.540117263793945, "global_step": 87059, "epoch": 1048} {"train_loss": -21.60976219177246, "global_step": 87060, "epoch": 1048} {"train_loss": -22.0179443359375, "global_step": 87061, "epoch": 1048} {"train_loss": -21.339786529541016, "global_step": 87062, "epoch": 1048} {"train_loss": -21.53450584411621, "global_step": 87063, "epoch": 1048} {"train_loss": -21.3811092376709, "global_step": 87064, "epoch": 1048} {"train_loss": -21.326826095581055, "global_step": 87065, "epoch": 1048} {"train_loss": -21.451555366975715, "global_step": 87066, "epoch": 1048, "val_loss": 6044134.0} {"train_loss": -21.4157772064209, "global_step": 87067, "epoch": 1049} {"train_loss": -21.571304321289062, "global_step": 87068, "epoch": 1049} {"train_loss": -20.99173355102539, "global_step": 87069, "epoch": 1049} {"train_loss": -21.451095581054688, "global_step": 87070, "epoch": 1049} {"train_loss": -21.28925132751465, "global_step": 87071, "epoch": 1049} {"train_loss": -21.42316246032715, "global_step": 87072, "epoch": 1049} {"train_loss": -21.281431198120117, "global_step": 87073, "epoch": 1049} {"train_loss": -21.382587432861328, "global_step": 87074, "epoch": 1049} {"train_loss": -21.075071334838867, "global_step": 87075, "epoch": 1049} {"train_loss": -21.18649673461914, "global_step": 87076, "epoch": 1049} {"train_loss": -21.129318237304688, "global_step": 87077, "epoch": 1049} {"train_loss": -21.308536529541016, "global_step": 87078, "epoch": 1049} {"train_loss": -20.84749412536621, "global_step": 87079, "epoch": 1049} {"train_loss": -21.3858642578125, "global_step": 87080, "epoch": 1049} {"train_loss": -21.160587310791016, "global_step": 87081, "epoch": 1049} {"train_loss": -21.278167724609375, "global_step": 87082, "epoch": 1049} {"train_loss": -21.234609603881836, "global_step": 87083, "epoch": 1049} {"train_loss": -21.57016372680664, "global_step": 87084, "epoch": 1049} {"train_loss": -21.323890686035156, "global_step": 87085, "epoch": 1049} {"train_loss": -21.474943161010742, "global_step": 87086, "epoch": 1049} {"train_loss": -21.490819931030273, "global_step": 87087, "epoch": 1049} {"train_loss": -21.443580627441406, "global_step": 87088, "epoch": 1049} {"train_loss": -21.778945922851562, "global_step": 87089, "epoch": 1049} {"train_loss": -21.396207809448242, "global_step": 87090, "epoch": 1049} {"train_loss": -21.508527755737305, "global_step": 87091, "epoch": 1049} {"train_loss": -21.593307495117188, "global_step": 87092, "epoch": 1049} {"train_loss": -21.22031593322754, "global_step": 87093, "epoch": 1049} {"train_loss": -21.000446319580078, "global_step": 87094, "epoch": 1049} {"train_loss": -21.60114097595215, "global_step": 87095, "epoch": 1049} {"train_loss": -21.270322799682617, "global_step": 87096, "epoch": 1049} {"train_loss": -21.422897338867188, "global_step": 87097, "epoch": 1049} {"train_loss": -21.47298812866211, "global_step": 87098, "epoch": 1049} {"train_loss": -21.095504760742188, "global_step": 87099, "epoch": 1049} {"train_loss": -21.560714721679688, "global_step": 87100, "epoch": 1049} {"train_loss": -21.342557907104492, "global_step": 87101, "epoch": 1049} {"train_loss": -21.341230392456055, "global_step": 87102, "epoch": 1049} {"train_loss": -21.472015380859375, "global_step": 87103, "epoch": 1049} {"train_loss": -21.530691146850586, "global_step": 87104, "epoch": 1049} {"train_loss": -21.45962905883789, "global_step": 87105, "epoch": 1049} {"train_loss": -21.516761779785156, "global_step": 87106, "epoch": 1049} {"train_loss": -21.67099952697754, "global_step": 87107, "epoch": 1049} {"train_loss": -21.442697525024414, "global_step": 87108, "epoch": 1049} {"train_loss": -21.868896484375, "global_step": 87109, "epoch": 1049} {"train_loss": -21.76566505432129, "global_step": 87110, "epoch": 1049} {"train_loss": -21.805932998657227, "global_step": 87111, "epoch": 1049} {"train_loss": -21.488615036010742, "global_step": 87112, "epoch": 1049} {"train_loss": -21.838144302368164, "global_step": 87113, "epoch": 1049} {"train_loss": -21.54071044921875, "global_step": 87114, "epoch": 1049} {"train_loss": -21.820680618286133, "global_step": 87115, "epoch": 1049} {"train_loss": -21.191207885742188, "global_step": 87116, "epoch": 1049} {"train_loss": -21.443580627441406, "global_step": 87117, "epoch": 1049} {"train_loss": -21.34581756591797, "global_step": 87118, "epoch": 1049} {"train_loss": -21.316801071166992, "global_step": 87119, "epoch": 1049} {"train_loss": -21.629724502563477, "global_step": 87120, "epoch": 1049} {"train_loss": -21.299888610839844, "global_step": 87121, "epoch": 1049} {"train_loss": -21.87678337097168, "global_step": 87122, "epoch": 1049} {"train_loss": -21.557584762573242, "global_step": 87123, "epoch": 1049} {"train_loss": -21.642086029052734, "global_step": 87124, "epoch": 1049} {"train_loss": -21.193958282470703, "global_step": 87125, "epoch": 1049} {"train_loss": -21.290332794189453, "global_step": 87126, "epoch": 1049} {"train_loss": -21.818891525268555, "global_step": 87127, "epoch": 1049} {"train_loss": -21.442020416259766, "global_step": 87128, "epoch": 1049} {"train_loss": -21.6164493560791, "global_step": 87129, "epoch": 1049} {"train_loss": -21.60979652404785, "global_step": 87130, "epoch": 1049} {"train_loss": -21.692153930664062, "global_step": 87131, "epoch": 1049} {"train_loss": -21.058685302734375, "global_step": 87132, "epoch": 1049} {"train_loss": -21.20548439025879, "global_step": 87133, "epoch": 1049} {"train_loss": -21.706945419311523, "global_step": 87134, "epoch": 1049} {"train_loss": -21.51832389831543, "global_step": 87135, "epoch": 1049} {"train_loss": -21.433378219604492, "global_step": 87136, "epoch": 1049} {"train_loss": -21.374441146850586, "global_step": 87137, "epoch": 1049} {"train_loss": -21.600915908813477, "global_step": 87138, "epoch": 1049} {"train_loss": -21.52819061279297, "global_step": 87139, "epoch": 1049} {"train_loss": -21.318218231201172, "global_step": 87140, "epoch": 1049} {"train_loss": -21.57756805419922, "global_step": 87141, "epoch": 1049} {"train_loss": -21.081933975219727, "global_step": 87142, "epoch": 1049} {"train_loss": -21.796777725219727, "global_step": 87143, "epoch": 1049} {"train_loss": -21.618865966796875, "global_step": 87144, "epoch": 1049} {"train_loss": -21.602937698364258, "global_step": 87145, "epoch": 1049} {"train_loss": -21.68269920349121, "global_step": 87146, "epoch": 1049} {"train_loss": -21.388460159301758, "global_step": 87147, "epoch": 1049} {"train_loss": -21.445194244384766, "global_step": 87148, "epoch": 1049} {"train_loss": -21.444750613476856, "global_step": 87149, "epoch": 1049, "val_loss": 6088208.0} {"train_loss": -21.3747615814209, "global_step": 87150, "epoch": 1050} {"train_loss": -21.371335983276367, "global_step": 87151, "epoch": 1050} {"train_loss": -21.08113670349121, "global_step": 87152, "epoch": 1050} {"train_loss": -21.5314884185791, "global_step": 87153, "epoch": 1050} {"train_loss": -21.3365535736084, "global_step": 87154, "epoch": 1050} {"train_loss": -21.23102378845215, "global_step": 87155, "epoch": 1050} {"train_loss": -21.19968605041504, "global_step": 87156, "epoch": 1050} {"train_loss": -21.387313842773438, "global_step": 87157, "epoch": 1050} {"train_loss": -21.7851619720459, "global_step": 87158, "epoch": 1050} {"train_loss": -21.401716232299805, "global_step": 87159, "epoch": 1050} {"train_loss": -21.470640182495117, "global_step": 87160, "epoch": 1050} {"train_loss": -21.333290100097656, "global_step": 87161, "epoch": 1050} {"train_loss": -21.221973419189453, "global_step": 87162, "epoch": 1050} {"train_loss": -21.699365615844727, "global_step": 87163, "epoch": 1050} {"train_loss": -21.18125343322754, "global_step": 87164, "epoch": 1050} {"train_loss": -21.4526424407959, "global_step": 87165, "epoch": 1050} {"train_loss": -21.6960506439209, "global_step": 87166, "epoch": 1050} {"train_loss": -21.50855827331543, "global_step": 87167, "epoch": 1050} {"train_loss": -21.222488403320312, "global_step": 87168, "epoch": 1050} {"train_loss": -21.687231063842773, "global_step": 87169, "epoch": 1050} {"train_loss": -21.617633819580078, "global_step": 87170, "epoch": 1050} {"train_loss": -21.543659210205078, "global_step": 87171, "epoch": 1050} {"train_loss": -21.589645385742188, "global_step": 87172, "epoch": 1050} {"train_loss": -21.199142456054688, "global_step": 87173, "epoch": 1050} {"train_loss": -21.592693328857422, "global_step": 87174, "epoch": 1050} {"train_loss": -21.261646270751953, "global_step": 87175, "epoch": 1050} {"train_loss": -21.39127540588379, "global_step": 87176, "epoch": 1050} {"train_loss": -21.65651512145996, "global_step": 87177, "epoch": 1050} {"train_loss": -21.456083297729492, "global_step": 87178, "epoch": 1050} {"train_loss": -21.570865631103516, "global_step": 87179, "epoch": 1050} {"train_loss": -21.549354553222656, "global_step": 87180, "epoch": 1050} {"train_loss": -21.50385856628418, "global_step": 87181, "epoch": 1050} {"train_loss": -21.566802978515625, "global_step": 87182, "epoch": 1050} {"train_loss": -21.391769409179688, "global_step": 87183, "epoch": 1050} {"train_loss": -21.925363540649414, "global_step": 87184, "epoch": 1050} {"train_loss": -21.571218490600586, "global_step": 87185, "epoch": 1050} {"train_loss": -21.536178588867188, "global_step": 87186, "epoch": 1050} {"train_loss": -21.980030059814453, "global_step": 87187, "epoch": 1050} {"train_loss": -21.3633975982666, "global_step": 87188, "epoch": 1050} {"train_loss": -21.459400177001953, "global_step": 87189, "epoch": 1050} {"train_loss": -21.63655662536621, "global_step": 87190, "epoch": 1050} {"train_loss": -21.637252807617188, "global_step": 87191, "epoch": 1050} {"train_loss": -21.30126953125, "global_step": 87192, "epoch": 1050} {"train_loss": -21.35822868347168, "global_step": 87193, "epoch": 1050} {"train_loss": -21.42410659790039, "global_step": 87194, "epoch": 1050} {"train_loss": -21.829151153564453, "global_step": 87195, "epoch": 1050} {"train_loss": -21.287534713745117, "global_step": 87196, "epoch": 1050} {"train_loss": -21.369659423828125, "global_step": 87197, "epoch": 1050} {"train_loss": -21.66388702392578, "global_step": 87198, "epoch": 1050} {"train_loss": -21.135318756103516, "global_step": 87199, "epoch": 1050} {"train_loss": -21.501998901367188, "global_step": 87200, "epoch": 1050} {"train_loss": -21.719409942626953, "global_step": 87201, "epoch": 1050} {"train_loss": -21.49888038635254, "global_step": 87202, "epoch": 1050} {"train_loss": -21.549692153930664, "global_step": 87203, "epoch": 1050} {"train_loss": -21.522705078125, "global_step": 87204, "epoch": 1050} {"train_loss": -21.23356056213379, "global_step": 87205, "epoch": 1050} {"train_loss": -21.671823501586914, "global_step": 87206, "epoch": 1050} {"train_loss": -21.112836837768555, "global_step": 87207, "epoch": 1050} {"train_loss": -22.002466201782227, "global_step": 87208, "epoch": 1050} {"train_loss": -21.527786254882812, "global_step": 87209, "epoch": 1050} {"train_loss": -21.32890510559082, "global_step": 87210, "epoch": 1050} {"train_loss": -21.701627731323242, "global_step": 87211, "epoch": 1050} {"train_loss": -21.418561935424805, "global_step": 87212, "epoch": 1050} {"train_loss": -21.400115966796875, "global_step": 87213, "epoch": 1050} {"train_loss": -21.428634643554688, "global_step": 87214, "epoch": 1050} {"train_loss": -21.813278198242188, "global_step": 87215, "epoch": 1050} {"train_loss": -21.452924728393555, "global_step": 87216, "epoch": 1050} {"train_loss": -21.53874969482422, "global_step": 87217, "epoch": 1050} {"train_loss": -21.441211700439453, "global_step": 87218, "epoch": 1050} {"train_loss": -21.586057662963867, "global_step": 87219, "epoch": 1050} {"train_loss": -21.47858428955078, "global_step": 87220, "epoch": 1050} {"train_loss": -21.649572372436523, "global_step": 87221, "epoch": 1050} {"train_loss": -21.207849502563477, "global_step": 87222, "epoch": 1050} {"train_loss": -21.485580444335938, "global_step": 87223, "epoch": 1050} {"train_loss": -21.559772491455078, "global_step": 87224, "epoch": 1050} {"train_loss": -21.382827758789062, "global_step": 87225, "epoch": 1050} {"train_loss": -21.092937469482422, "global_step": 87226, "epoch": 1050} {"train_loss": -21.50887107849121, "global_step": 87227, "epoch": 1050} {"train_loss": -21.538408279418945, "global_step": 87228, "epoch": 1050} {"train_loss": -21.43873405456543, "global_step": 87229, "epoch": 1050} {"train_loss": -21.202560424804688, "global_step": 87230, "epoch": 1050} {"train_loss": -21.338468551635742, "global_step": 87231, "epoch": 1050} {"train_loss": -21.48058479952525, "global_step": 87232, "epoch": 1050, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 1.0, "val_loss": 6119604.0} {"train_loss": -21.131620407104492, "global_step": 87233, "epoch": 1051} {"train_loss": -21.40464973449707, "global_step": 87234, "epoch": 1051} {"train_loss": -21.55381202697754, "global_step": 87235, "epoch": 1051} {"train_loss": -21.252676010131836, "global_step": 87236, "epoch": 1051} {"train_loss": -21.008548736572266, "global_step": 87237, "epoch": 1051} {"train_loss": -21.448719024658203, "global_step": 87238, "epoch": 1051} {"train_loss": -21.350921630859375, "global_step": 87239, "epoch": 1051} {"train_loss": -21.354812622070312, "global_step": 87240, "epoch": 1051} {"train_loss": -21.211889266967773, "global_step": 87241, "epoch": 1051} {"train_loss": -21.414005279541016, "global_step": 87242, "epoch": 1051} {"train_loss": -21.13062858581543, "global_step": 87243, "epoch": 1051} {"train_loss": -21.62326431274414, "global_step": 87244, "epoch": 1051} {"train_loss": -21.481931686401367, "global_step": 87245, "epoch": 1051} {"train_loss": -21.295944213867188, "global_step": 87246, "epoch": 1051} {"train_loss": -21.16217613220215, "global_step": 87247, "epoch": 1051} {"train_loss": -21.1552677154541, "global_step": 87248, "epoch": 1051} {"train_loss": -21.183835983276367, "global_step": 87249, "epoch": 1051} {"train_loss": -21.260915756225586, "global_step": 87250, "epoch": 1051} {"train_loss": -21.212993621826172, "global_step": 87251, "epoch": 1051} {"train_loss": -21.892845153808594, "global_step": 87252, "epoch": 1051} {"train_loss": -21.252561569213867, "global_step": 87253, "epoch": 1051} {"train_loss": -21.61775779724121, "global_step": 87254, "epoch": 1051} {"train_loss": -21.256277084350586, "global_step": 87255, "epoch": 1051} {"train_loss": -21.312910079956055, "global_step": 87256, "epoch": 1051} {"train_loss": -21.304059982299805, "global_step": 87257, "epoch": 1051} {"train_loss": -21.45988655090332, "global_step": 87258, "epoch": 1051} {"train_loss": -21.810049057006836, "global_step": 87259, "epoch": 1051} {"train_loss": -21.483495712280273, "global_step": 87260, "epoch": 1051} {"train_loss": -21.7266788482666, "global_step": 87261, "epoch": 1051} {"train_loss": -21.173660278320312, "global_step": 87262, "epoch": 1051} {"train_loss": -21.415884017944336, "global_step": 87263, "epoch": 1051} {"train_loss": -21.151355743408203, "global_step": 87264, "epoch": 1051} {"train_loss": -21.636465072631836, "global_step": 87265, "epoch": 1051} {"train_loss": -21.837982177734375, "global_step": 87266, "epoch": 1051} {"train_loss": -21.25324058532715, "global_step": 87267, "epoch": 1051} {"train_loss": -21.482446670532227, "global_step": 87268, "epoch": 1051} {"train_loss": -21.520864486694336, "global_step": 87269, "epoch": 1051} {"train_loss": -21.639572143554688, "global_step": 87270, "epoch": 1051} {"train_loss": -21.1614990234375, "global_step": 87271, "epoch": 1051} {"train_loss": -21.647815704345703, "global_step": 87272, "epoch": 1051} {"train_loss": -21.31409454345703, "global_step": 87273, "epoch": 1051} {"train_loss": -21.39334487915039, "global_step": 87274, "epoch": 1051} {"train_loss": -21.55869483947754, "global_step": 87275, "epoch": 1051} {"train_loss": -22.144750595092773, "global_step": 87276, "epoch": 1051} {"train_loss": -21.49151611328125, "global_step": 87277, "epoch": 1051} {"train_loss": -21.474668502807617, "global_step": 87278, "epoch": 1051} {"train_loss": -21.777341842651367, "global_step": 87279, "epoch": 1051} {"train_loss": -21.657730102539062, "global_step": 87280, "epoch": 1051} {"train_loss": -21.34391975402832, "global_step": 87281, "epoch": 1051} {"train_loss": -21.689361572265625, "global_step": 87282, "epoch": 1051} {"train_loss": -21.542531967163086, "global_step": 87283, "epoch": 1051} {"train_loss": -21.345827102661133, "global_step": 87284, "epoch": 1051} {"train_loss": -21.495708465576172, "global_step": 87285, "epoch": 1051} {"train_loss": -21.983219146728516, "global_step": 87286, "epoch": 1051} {"train_loss": -20.875476837158203, "global_step": 87287, "epoch": 1051} {"train_loss": -21.780296325683594, "global_step": 87288, "epoch": 1051} {"train_loss": -21.537078857421875, "global_step": 87289, "epoch": 1051} {"train_loss": -21.648061752319336, "global_step": 87290, "epoch": 1051} {"train_loss": -21.37468719482422, "global_step": 87291, "epoch": 1051} {"train_loss": -21.587482452392578, "global_step": 87292, "epoch": 1051} {"train_loss": -21.317445755004883, "global_step": 87293, "epoch": 1051} {"train_loss": -21.378135681152344, "global_step": 87294, "epoch": 1051} {"train_loss": -21.247060775756836, "global_step": 87295, "epoch": 1051} {"train_loss": -21.765949249267578, "global_step": 87296, "epoch": 1051} {"train_loss": -21.265588760375977, "global_step": 87297, "epoch": 1051} {"train_loss": -21.5057315826416, "global_step": 87298, "epoch": 1051} {"train_loss": -21.443681716918945, "global_step": 87299, "epoch": 1051} {"train_loss": -21.658599853515625, "global_step": 87300, "epoch": 1051} {"train_loss": -21.701858520507812, "global_step": 87301, "epoch": 1051} {"train_loss": -21.545635223388672, "global_step": 87302, "epoch": 1051} {"train_loss": -21.070295333862305, "global_step": 87303, "epoch": 1051} {"train_loss": -21.499343872070312, "global_step": 87304, "epoch": 1051} {"train_loss": -21.142065048217773, "global_step": 87305, "epoch": 1051} {"train_loss": -21.576147079467773, "global_step": 87306, "epoch": 1051} {"train_loss": -21.658044815063477, "global_step": 87307, "epoch": 1051} {"train_loss": -21.33500862121582, "global_step": 87308, "epoch": 1051} {"train_loss": -21.2804012298584, "global_step": 87309, "epoch": 1051} {"train_loss": -21.438369750976562, "global_step": 87310, "epoch": 1051} {"train_loss": -21.653772354125977, "global_step": 87311, "epoch": 1051} {"train_loss": -21.409860610961914, "global_step": 87312, "epoch": 1051} {"train_loss": -21.83909034729004, "global_step": 87313, "epoch": 1051} {"train_loss": -21.286462783813477, "global_step": 87314, "epoch": 1051} {"train_loss": -21.466206447187677, "global_step": 87315, "epoch": 1051, "val_loss": 6017595.5} {"train_loss": -20.936887741088867, "global_step": 87316, "epoch": 1052} {"train_loss": -20.653364181518555, "global_step": 87317, "epoch": 1052} {"train_loss": -21.375337600708008, "global_step": 87318, "epoch": 1052} {"train_loss": -20.86842918395996, "global_step": 87319, "epoch": 1052} {"train_loss": -21.473051071166992, "global_step": 87320, "epoch": 1052} {"train_loss": -21.349567413330078, "global_step": 87321, "epoch": 1052} {"train_loss": -20.85658073425293, "global_step": 87322, "epoch": 1052} {"train_loss": -21.068288803100586, "global_step": 87323, "epoch": 1052} {"train_loss": -21.040136337280273, "global_step": 87324, "epoch": 1052} {"train_loss": -21.407583236694336, "global_step": 87325, "epoch": 1052} {"train_loss": -21.364233016967773, "global_step": 87326, "epoch": 1052} {"train_loss": -21.52446174621582, "global_step": 87327, "epoch": 1052} {"train_loss": -21.2202091217041, "global_step": 87328, "epoch": 1052} {"train_loss": -21.150999069213867, "global_step": 87329, "epoch": 1052} {"train_loss": -21.307119369506836, "global_step": 87330, "epoch": 1052} {"train_loss": -21.395404815673828, "global_step": 87331, "epoch": 1052} {"train_loss": -21.085113525390625, "global_step": 87332, "epoch": 1052} {"train_loss": -21.577354431152344, "global_step": 87333, "epoch": 1052} {"train_loss": -21.287826538085938, "global_step": 87334, "epoch": 1052} {"train_loss": -21.827369689941406, "global_step": 87335, "epoch": 1052} {"train_loss": -21.155351638793945, "global_step": 87336, "epoch": 1052} {"train_loss": -21.744016647338867, "global_step": 87337, "epoch": 1052} {"train_loss": -21.40011978149414, "global_step": 87338, "epoch": 1052} {"train_loss": -21.71174430847168, "global_step": 87339, "epoch": 1052} {"train_loss": -21.275405883789062, "global_step": 87340, "epoch": 1052} {"train_loss": -21.172330856323242, "global_step": 87341, "epoch": 1052} {"train_loss": -21.659696578979492, "global_step": 87342, "epoch": 1052} {"train_loss": -21.649473190307617, "global_step": 87343, "epoch": 1052} {"train_loss": -21.525226593017578, "global_step": 87344, "epoch": 1052} {"train_loss": -21.410749435424805, "global_step": 87345, "epoch": 1052} {"train_loss": -21.302505493164062, "global_step": 87346, "epoch": 1052} {"train_loss": -21.5501766204834, "global_step": 87347, "epoch": 1052} {"train_loss": -21.07533073425293, "global_step": 87348, "epoch": 1052} {"train_loss": -21.456562042236328, "global_step": 87349, "epoch": 1052} {"train_loss": -21.273818969726562, "global_step": 87350, "epoch": 1052} {"train_loss": -21.269079208374023, "global_step": 87351, "epoch": 1052} {"train_loss": -21.2586727142334, "global_step": 87352, "epoch": 1052} {"train_loss": -21.132644653320312, "global_step": 87353, "epoch": 1052} {"train_loss": -21.68451499938965, "global_step": 87354, "epoch": 1052} {"train_loss": -21.66315269470215, "global_step": 87355, "epoch": 1052} {"train_loss": -21.434232711791992, "global_step": 87356, "epoch": 1052} {"train_loss": -21.866477966308594, "global_step": 87357, "epoch": 1052} {"train_loss": -21.678762435913086, "global_step": 87358, "epoch": 1052} {"train_loss": -21.69537925720215, "global_step": 87359, "epoch": 1052} {"train_loss": -21.274322509765625, "global_step": 87360, "epoch": 1052} {"train_loss": -21.435331344604492, "global_step": 87361, "epoch": 1052} {"train_loss": -21.724651336669922, "global_step": 87362, "epoch": 1052} {"train_loss": -21.44099998474121, "global_step": 87363, "epoch": 1052} {"train_loss": -21.667646408081055, "global_step": 87364, "epoch": 1052} {"train_loss": -21.47718048095703, "global_step": 87365, "epoch": 1052} {"train_loss": -21.41913414001465, "global_step": 87366, "epoch": 1052} {"train_loss": -21.763505935668945, "global_step": 87367, "epoch": 1052} {"train_loss": -21.43660545349121, "global_step": 87368, "epoch": 1052} {"train_loss": -21.171375274658203, "global_step": 87369, "epoch": 1052} {"train_loss": -21.413217544555664, "global_step": 87370, "epoch": 1052} {"train_loss": -21.9821834564209, "global_step": 87371, "epoch": 1052} {"train_loss": -21.295942306518555, "global_step": 87372, "epoch": 1052} {"train_loss": -21.533592224121094, "global_step": 87373, "epoch": 1052} {"train_loss": -21.529298782348633, "global_step": 87374, "epoch": 1052} {"train_loss": -21.845361709594727, "global_step": 87375, "epoch": 1052} {"train_loss": -21.58833122253418, "global_step": 87376, "epoch": 1052} {"train_loss": -21.64265251159668, "global_step": 87377, "epoch": 1052} {"train_loss": -21.46771812438965, "global_step": 87378, "epoch": 1052} {"train_loss": -21.833261489868164, "global_step": 87379, "epoch": 1052} {"train_loss": -21.643545150756836, "global_step": 87380, "epoch": 1052} {"train_loss": -21.862354278564453, "global_step": 87381, "epoch": 1052} {"train_loss": -21.802955627441406, "global_step": 87382, "epoch": 1052} {"train_loss": -21.583059310913086, "global_step": 87383, "epoch": 1052} {"train_loss": -21.233198165893555, "global_step": 87384, "epoch": 1052} {"train_loss": -21.73581886291504, "global_step": 87385, "epoch": 1052} {"train_loss": -20.975162506103516, "global_step": 87386, "epoch": 1052} {"train_loss": -21.38117027282715, "global_step": 87387, "epoch": 1052} {"train_loss": -21.270437240600586, "global_step": 87388, "epoch": 1052} {"train_loss": -21.18739891052246, "global_step": 87389, "epoch": 1052} {"train_loss": -21.68077278137207, "global_step": 87390, "epoch": 1052} {"train_loss": -21.452733993530273, "global_step": 87391, "epoch": 1052} {"train_loss": -21.453765869140625, "global_step": 87392, "epoch": 1052} {"train_loss": -21.610567092895508, "global_step": 87393, "epoch": 1052} {"train_loss": -21.515260696411133, "global_step": 87394, "epoch": 1052} {"train_loss": -21.695722579956055, "global_step": 87395, "epoch": 1052} {"train_loss": -21.589801788330078, "global_step": 87396, "epoch": 1052} {"train_loss": -21.467504501342773, "global_step": 87397, "epoch": 1052} {"train_loss": -21.434400811252825, "global_step": 87398, "epoch": 1052, "val_loss": 6147641.5} {"train_loss": -21.31743049621582, "global_step": 87399, "epoch": 1053} {"train_loss": -20.94756317138672, "global_step": 87400, "epoch": 1053} {"train_loss": -21.59359359741211, "global_step": 87401, "epoch": 1053} {"train_loss": -21.25069236755371, "global_step": 87402, "epoch": 1053} {"train_loss": -21.27424430847168, "global_step": 87403, "epoch": 1053} {"train_loss": -21.282752990722656, "global_step": 87404, "epoch": 1053} {"train_loss": -21.431119918823242, "global_step": 87405, "epoch": 1053} {"train_loss": -21.618831634521484, "global_step": 87406, "epoch": 1053} {"train_loss": -21.32337760925293, "global_step": 87407, "epoch": 1053} {"train_loss": -21.695632934570312, "global_step": 87408, "epoch": 1053} {"train_loss": -21.61728858947754, "global_step": 87409, "epoch": 1053} {"train_loss": -21.2817440032959, "global_step": 87410, "epoch": 1053} {"train_loss": -21.575281143188477, "global_step": 87411, "epoch": 1053} {"train_loss": -21.430112838745117, "global_step": 87412, "epoch": 1053} {"train_loss": -21.548786163330078, "global_step": 87413, "epoch": 1053} {"train_loss": -21.602338790893555, "global_step": 87414, "epoch": 1053} {"train_loss": -21.295392990112305, "global_step": 87415, "epoch": 1053} {"train_loss": -21.465824127197266, "global_step": 87416, "epoch": 1053} {"train_loss": -21.120040893554688, "global_step": 87417, "epoch": 1053} {"train_loss": -21.50593376159668, "global_step": 87418, "epoch": 1053} {"train_loss": -21.461891174316406, "global_step": 87419, "epoch": 1053} {"train_loss": -21.701772689819336, "global_step": 87420, "epoch": 1053} {"train_loss": -21.56194496154785, "global_step": 87421, "epoch": 1053} {"train_loss": -21.501802444458008, "global_step": 87422, "epoch": 1053} {"train_loss": -21.782207489013672, "global_step": 87423, "epoch": 1053} {"train_loss": -21.82331657409668, "global_step": 87424, "epoch": 1053} {"train_loss": -21.389883041381836, "global_step": 87425, "epoch": 1053} {"train_loss": -21.75941276550293, "global_step": 87426, "epoch": 1053} {"train_loss": -21.559720993041992, "global_step": 87427, "epoch": 1053} {"train_loss": -21.4777889251709, "global_step": 87428, "epoch": 1053} {"train_loss": -21.291418075561523, "global_step": 87429, "epoch": 1053} {"train_loss": -21.490392684936523, "global_step": 87430, "epoch": 1053} {"train_loss": -21.357269287109375, "global_step": 87431, "epoch": 1053} {"train_loss": -21.65097427368164, "global_step": 87432, "epoch": 1053} {"train_loss": -21.46905517578125, "global_step": 87433, "epoch": 1053} {"train_loss": -21.95509147644043, "global_step": 87434, "epoch": 1053} {"train_loss": -21.34963035583496, "global_step": 87435, "epoch": 1053} {"train_loss": -21.324270248413086, "global_step": 87436, "epoch": 1053} {"train_loss": -21.24062156677246, "global_step": 87437, "epoch": 1053} {"train_loss": -21.593429565429688, "global_step": 87438, "epoch": 1053} {"train_loss": -21.763540267944336, "global_step": 87439, "epoch": 1053} {"train_loss": -21.669347763061523, "global_step": 87440, "epoch": 1053} {"train_loss": -21.845779418945312, "global_step": 87441, "epoch": 1053} {"train_loss": -21.364843368530273, "global_step": 87442, "epoch": 1053} {"train_loss": -21.433456420898438, "global_step": 87443, "epoch": 1053} {"train_loss": -21.437795639038086, "global_step": 87444, "epoch": 1053} {"train_loss": -21.338666915893555, "global_step": 87445, "epoch": 1053} {"train_loss": -21.790822982788086, "global_step": 87446, "epoch": 1053} {"train_loss": -21.759611129760742, "global_step": 87447, "epoch": 1053} {"train_loss": -21.68275260925293, "global_step": 87448, "epoch": 1053} {"train_loss": -21.387483596801758, "global_step": 87449, "epoch": 1053} {"train_loss": -21.912288665771484, "global_step": 87450, "epoch": 1053} {"train_loss": -21.30226707458496, "global_step": 87451, "epoch": 1053} {"train_loss": -21.594396591186523, "global_step": 87452, "epoch": 1053} {"train_loss": -21.42506217956543, "global_step": 87453, "epoch": 1053} {"train_loss": -21.6983699798584, "global_step": 87454, "epoch": 1053} {"train_loss": -21.571035385131836, "global_step": 87455, "epoch": 1053} {"train_loss": -21.64131736755371, "global_step": 87456, "epoch": 1053} {"train_loss": -21.752099990844727, "global_step": 87457, "epoch": 1053} {"train_loss": -21.493438720703125, "global_step": 87458, "epoch": 1053} {"train_loss": -21.54530143737793, "global_step": 87459, "epoch": 1053} {"train_loss": -21.43946647644043, "global_step": 87460, "epoch": 1053} {"train_loss": -21.75724220275879, "global_step": 87461, "epoch": 1053} {"train_loss": -21.816184997558594, "global_step": 87462, "epoch": 1053} {"train_loss": -21.262487411499023, "global_step": 87463, "epoch": 1053} {"train_loss": -21.784711837768555, "global_step": 87464, "epoch": 1053} {"train_loss": -21.316110610961914, "global_step": 87465, "epoch": 1053} {"train_loss": -21.573375701904297, "global_step": 87466, "epoch": 1053} {"train_loss": -21.57806396484375, "global_step": 87467, "epoch": 1053} {"train_loss": -21.3826904296875, "global_step": 87468, "epoch": 1053} {"train_loss": -21.442474365234375, "global_step": 87469, "epoch": 1053} {"train_loss": -21.26338768005371, "global_step": 87470, "epoch": 1053} {"train_loss": -21.37210464477539, "global_step": 87471, "epoch": 1053} {"train_loss": -21.179412841796875, "global_step": 87472, "epoch": 1053} {"train_loss": -21.248193740844727, "global_step": 87473, "epoch": 1053} {"train_loss": -21.46305274963379, "global_step": 87474, "epoch": 1053} {"train_loss": -21.477035522460938, "global_step": 87475, "epoch": 1053} {"train_loss": -21.30367660522461, "global_step": 87476, "epoch": 1053} {"train_loss": -21.56787872314453, "global_step": 87477, "epoch": 1053} {"train_loss": -21.57917594909668, "global_step": 87478, "epoch": 1053} {"train_loss": -21.62410545349121, "global_step": 87479, "epoch": 1053} {"train_loss": -21.496124267578125, "global_step": 87480, "epoch": 1053} {"train_loss": -21.517006265111718, "global_step": 87481, "epoch": 1053, "val_loss": 6100579.0} {"train_loss": -21.285411834716797, "global_step": 87482, "epoch": 1054} {"train_loss": -21.46756362915039, "global_step": 87483, "epoch": 1054} {"train_loss": -20.96030616760254, "global_step": 87484, "epoch": 1054} {"train_loss": -21.430240631103516, "global_step": 87485, "epoch": 1054} {"train_loss": -21.260250091552734, "global_step": 87486, "epoch": 1054} {"train_loss": -20.68714714050293, "global_step": 87487, "epoch": 1054} {"train_loss": -21.394241333007812, "global_step": 87488, "epoch": 1054} {"train_loss": -20.83055877685547, "global_step": 87489, "epoch": 1054} {"train_loss": -21.716228485107422, "global_step": 87490, "epoch": 1054} {"train_loss": -20.993980407714844, "global_step": 87491, "epoch": 1054} {"train_loss": -21.694387435913086, "global_step": 87492, "epoch": 1054} {"train_loss": -21.0473575592041, "global_step": 87493, "epoch": 1054} {"train_loss": -21.181692123413086, "global_step": 87494, "epoch": 1054} {"train_loss": -21.555713653564453, "global_step": 87495, "epoch": 1054} {"train_loss": -21.172035217285156, "global_step": 87496, "epoch": 1054} {"train_loss": -21.484621047973633, "global_step": 87497, "epoch": 1054} {"train_loss": -21.4072265625, "global_step": 87498, "epoch": 1054} {"train_loss": -21.3892879486084, "global_step": 87499, "epoch": 1054} {"train_loss": -21.202417373657227, "global_step": 87500, "epoch": 1054} {"train_loss": -21.992727279663086, "global_step": 87501, "epoch": 1054} {"train_loss": -21.505552291870117, "global_step": 87502, "epoch": 1054} {"train_loss": -21.3483829498291, "global_step": 87503, "epoch": 1054} {"train_loss": -21.797544479370117, "global_step": 87504, "epoch": 1054} {"train_loss": -21.537878036499023, "global_step": 87505, "epoch": 1054} {"train_loss": -21.481657028198242, "global_step": 87506, "epoch": 1054} {"train_loss": -21.607025146484375, "global_step": 87507, "epoch": 1054} {"train_loss": -21.5897216796875, "global_step": 87508, "epoch": 1054} {"train_loss": -21.9091854095459, "global_step": 87509, "epoch": 1054} {"train_loss": -21.4114990234375, "global_step": 87510, "epoch": 1054} {"train_loss": -21.864500045776367, "global_step": 87511, "epoch": 1054} {"train_loss": -21.770761489868164, "global_step": 87512, "epoch": 1054} {"train_loss": -21.31484031677246, "global_step": 87513, "epoch": 1054} {"train_loss": -21.6259708404541, "global_step": 87514, "epoch": 1054} {"train_loss": -21.472244262695312, "global_step": 87515, "epoch": 1054} {"train_loss": -21.234296798706055, "global_step": 87516, "epoch": 1054} {"train_loss": -21.571699142456055, "global_step": 87517, "epoch": 1054} {"train_loss": -20.9841251373291, "global_step": 87518, "epoch": 1054} {"train_loss": -21.392826080322266, "global_step": 87519, "epoch": 1054} {"train_loss": -21.33620834350586, "global_step": 87520, "epoch": 1054} {"train_loss": -21.150436401367188, "global_step": 87521, "epoch": 1054} {"train_loss": -21.82098388671875, "global_step": 87522, "epoch": 1054} {"train_loss": -21.018299102783203, "global_step": 87523, "epoch": 1054} {"train_loss": -21.33255386352539, "global_step": 87524, "epoch": 1054} {"train_loss": -21.244688034057617, "global_step": 87525, "epoch": 1054} {"train_loss": -21.465261459350586, "global_step": 87526, "epoch": 1054} {"train_loss": -21.265323638916016, "global_step": 87527, "epoch": 1054} {"train_loss": -21.1378173828125, "global_step": 87528, "epoch": 1054} {"train_loss": -21.3847713470459, "global_step": 87529, "epoch": 1054} {"train_loss": -21.664331436157227, "global_step": 87530, "epoch": 1054} {"train_loss": -21.27511215209961, "global_step": 87531, "epoch": 1054} {"train_loss": -21.67416763305664, "global_step": 87532, "epoch": 1054} {"train_loss": -21.445810317993164, "global_step": 87533, "epoch": 1054} {"train_loss": -21.190330505371094, "global_step": 87534, "epoch": 1054} {"train_loss": -21.890079498291016, "global_step": 87535, "epoch": 1054} {"train_loss": -21.64542579650879, "global_step": 87536, "epoch": 1054} {"train_loss": -21.394216537475586, "global_step": 87537, "epoch": 1054} {"train_loss": -21.379194259643555, "global_step": 87538, "epoch": 1054} {"train_loss": -21.591272354125977, "global_step": 87539, "epoch": 1054} {"train_loss": -21.372047424316406, "global_step": 87540, "epoch": 1054} {"train_loss": -21.377050399780273, "global_step": 87541, "epoch": 1054} {"train_loss": -21.737401962280273, "global_step": 87542, "epoch": 1054} {"train_loss": -21.44373893737793, "global_step": 87543, "epoch": 1054} {"train_loss": -20.991641998291016, "global_step": 87544, "epoch": 1054} {"train_loss": -21.320350646972656, "global_step": 87545, "epoch": 1054} {"train_loss": -21.490163803100586, "global_step": 87546, "epoch": 1054} {"train_loss": -21.505800247192383, "global_step": 87547, "epoch": 1054} {"train_loss": -21.550519943237305, "global_step": 87548, "epoch": 1054} {"train_loss": -21.140439987182617, "global_step": 87549, "epoch": 1054} {"train_loss": -21.778120040893555, "global_step": 87550, "epoch": 1054} {"train_loss": -21.21533966064453, "global_step": 87551, "epoch": 1054} {"train_loss": -21.47489356994629, "global_step": 87552, "epoch": 1054} {"train_loss": -21.508350372314453, "global_step": 87553, "epoch": 1054} {"train_loss": -21.392026901245117, "global_step": 87554, "epoch": 1054} {"train_loss": -21.790130615234375, "global_step": 87555, "epoch": 1054} {"train_loss": -21.348987579345703, "global_step": 87556, "epoch": 1054} {"train_loss": -21.442312240600586, "global_step": 87557, "epoch": 1054} {"train_loss": -21.59758758544922, "global_step": 87558, "epoch": 1054} {"train_loss": -21.17526626586914, "global_step": 87559, "epoch": 1054} {"train_loss": -21.573774337768555, "global_step": 87560, "epoch": 1054} {"train_loss": -21.370840072631836, "global_step": 87561, "epoch": 1054} {"train_loss": -21.604825973510742, "global_step": 87562, "epoch": 1054} {"train_loss": -21.498720169067383, "global_step": 87563, "epoch": 1054} {"train_loss": -21.423201756305005, "global_step": 87564, "epoch": 1054, "val_loss": 6058087.0} {"train_loss": -21.521818161010742, "global_step": 87565, "epoch": 1055} {"train_loss": -21.15644073486328, "global_step": 87566, "epoch": 1055} {"train_loss": -21.560827255249023, "global_step": 87567, "epoch": 1055} {"train_loss": -21.181333541870117, "global_step": 87568, "epoch": 1055} {"train_loss": -21.3024959564209, "global_step": 87569, "epoch": 1055} {"train_loss": -21.57016372680664, "global_step": 87570, "epoch": 1055} {"train_loss": -21.474872589111328, "global_step": 87571, "epoch": 1055} {"train_loss": -21.622299194335938, "global_step": 87572, "epoch": 1055} {"train_loss": -21.738122940063477, "global_step": 87573, "epoch": 1055} {"train_loss": -21.034780502319336, "global_step": 87574, "epoch": 1055} {"train_loss": -21.59587860107422, "global_step": 87575, "epoch": 1055} {"train_loss": -20.901512145996094, "global_step": 87576, "epoch": 1055} {"train_loss": -21.407304763793945, "global_step": 87577, "epoch": 1055} {"train_loss": -21.49344825744629, "global_step": 87578, "epoch": 1055} {"train_loss": -21.22500228881836, "global_step": 87579, "epoch": 1055} {"train_loss": -21.28196144104004, "global_step": 87580, "epoch": 1055} {"train_loss": -21.1993408203125, "global_step": 87581, "epoch": 1055} {"train_loss": -21.61188316345215, "global_step": 87582, "epoch": 1055} {"train_loss": -21.881385803222656, "global_step": 87583, "epoch": 1055} {"train_loss": -21.147388458251953, "global_step": 87584, "epoch": 1055} {"train_loss": -21.542619705200195, "global_step": 87585, "epoch": 1055} {"train_loss": -21.89649772644043, "global_step": 87586, "epoch": 1055} {"train_loss": -21.626060485839844, "global_step": 87587, "epoch": 1055} {"train_loss": -21.621143341064453, "global_step": 87588, "epoch": 1055} {"train_loss": -21.1658878326416, "global_step": 87589, "epoch": 1055} {"train_loss": -21.49435806274414, "global_step": 87590, "epoch": 1055} {"train_loss": -21.96120262145996, "global_step": 87591, "epoch": 1055} {"train_loss": -21.308818817138672, "global_step": 87592, "epoch": 1055} {"train_loss": -21.68878173828125, "global_step": 87593, "epoch": 1055} {"train_loss": -21.88645362854004, "global_step": 87594, "epoch": 1055} {"train_loss": -21.91635513305664, "global_step": 87595, "epoch": 1055} {"train_loss": -21.605224609375, "global_step": 87596, "epoch": 1055} {"train_loss": -21.577497482299805, "global_step": 87597, "epoch": 1055} {"train_loss": -21.543088912963867, "global_step": 87598, "epoch": 1055} {"train_loss": -21.3161678314209, "global_step": 87599, "epoch": 1055} {"train_loss": -21.578962326049805, "global_step": 87600, "epoch": 1055} {"train_loss": -21.613344192504883, "global_step": 87601, "epoch": 1055} {"train_loss": -21.603212356567383, "global_step": 87602, "epoch": 1055} {"train_loss": -21.0873966217041, "global_step": 87603, "epoch": 1055} {"train_loss": -21.83997917175293, "global_step": 87604, "epoch": 1055} {"train_loss": -21.82767677307129, "global_step": 87605, "epoch": 1055} {"train_loss": -21.544719696044922, "global_step": 87606, "epoch": 1055} {"train_loss": -21.214797973632812, "global_step": 87607, "epoch": 1055} {"train_loss": -21.6016788482666, "global_step": 87608, "epoch": 1055} {"train_loss": -21.85044288635254, "global_step": 87609, "epoch": 1055} {"train_loss": -21.699182510375977, "global_step": 87610, "epoch": 1055} {"train_loss": -21.699634552001953, "global_step": 87611, "epoch": 1055} {"train_loss": -21.838123321533203, "global_step": 87612, "epoch": 1055} {"train_loss": -21.47127342224121, "global_step": 87613, "epoch": 1055} {"train_loss": -21.521398544311523, "global_step": 87614, "epoch": 1055} {"train_loss": -21.595169067382812, "global_step": 87615, "epoch": 1055} {"train_loss": -21.2139892578125, "global_step": 87616, "epoch": 1055} {"train_loss": -21.531232833862305, "global_step": 87617, "epoch": 1055} {"train_loss": -21.524307250976562, "global_step": 87618, "epoch": 1055} {"train_loss": -21.7996883392334, "global_step": 87619, "epoch": 1055} {"train_loss": -21.216772079467773, "global_step": 87620, "epoch": 1055} {"train_loss": -21.38819122314453, "global_step": 87621, "epoch": 1055} {"train_loss": -21.581357955932617, "global_step": 87622, "epoch": 1055} {"train_loss": -21.35430335998535, "global_step": 87623, "epoch": 1055} {"train_loss": -20.98271369934082, "global_step": 87624, "epoch": 1055} {"train_loss": -21.746841430664062, "global_step": 87625, "epoch": 1055} {"train_loss": -21.312864303588867, "global_step": 87626, "epoch": 1055} {"train_loss": -21.152891159057617, "global_step": 87627, "epoch": 1055} {"train_loss": -21.462976455688477, "global_step": 87628, "epoch": 1055} {"train_loss": -21.335912704467773, "global_step": 87629, "epoch": 1055} {"train_loss": -21.09652328491211, "global_step": 87630, "epoch": 1055} {"train_loss": -21.4688777923584, "global_step": 87631, "epoch": 1055} {"train_loss": -21.76904296875, "global_step": 87632, "epoch": 1055} {"train_loss": -21.54163932800293, "global_step": 87633, "epoch": 1055} {"train_loss": -21.588918685913086, "global_step": 87634, "epoch": 1055} {"train_loss": -21.219078063964844, "global_step": 87635, "epoch": 1055} {"train_loss": -21.604475021362305, "global_step": 87636, "epoch": 1055} {"train_loss": -21.3745174407959, "global_step": 87637, "epoch": 1055} {"train_loss": -21.35896110534668, "global_step": 87638, "epoch": 1055} {"train_loss": -21.5399227142334, "global_step": 87639, "epoch": 1055} {"train_loss": -21.809560775756836, "global_step": 87640, "epoch": 1055} {"train_loss": -21.080251693725586, "global_step": 87641, "epoch": 1055} {"train_loss": -21.412031173706055, "global_step": 87642, "epoch": 1055} {"train_loss": -21.90365219116211, "global_step": 87643, "epoch": 1055} {"train_loss": -21.408254623413086, "global_step": 87644, "epoch": 1055} {"train_loss": -21.411375045776367, "global_step": 87645, "epoch": 1055} {"train_loss": -21.267614364624023, "global_step": 87646, "epoch": 1055} {"train_loss": -21.50475897271949, "global_step": 87647, "epoch": 1055, "val_loss": 6075173.0} {"train_loss": -21.30316734313965, "global_step": 87648, "epoch": 1056} {"train_loss": -21.237945556640625, "global_step": 87649, "epoch": 1056} {"train_loss": -21.201807022094727, "global_step": 87650, "epoch": 1056} {"train_loss": -21.366910934448242, "global_step": 87651, "epoch": 1056} {"train_loss": -21.48042869567871, "global_step": 87652, "epoch": 1056} {"train_loss": -21.176605224609375, "global_step": 87653, "epoch": 1056} {"train_loss": -21.365102767944336, "global_step": 87654, "epoch": 1056} {"train_loss": -21.388111114501953, "global_step": 87655, "epoch": 1056} {"train_loss": -21.182329177856445, "global_step": 87656, "epoch": 1056} {"train_loss": -21.28766441345215, "global_step": 87657, "epoch": 1056} {"train_loss": -21.11223602294922, "global_step": 87658, "epoch": 1056} {"train_loss": -21.611021041870117, "global_step": 87659, "epoch": 1056} {"train_loss": -21.544681549072266, "global_step": 87660, "epoch": 1056} {"train_loss": -21.53879165649414, "global_step": 87661, "epoch": 1056} {"train_loss": -21.47043800354004, "global_step": 87662, "epoch": 1056} {"train_loss": -21.792333602905273, "global_step": 87663, "epoch": 1056} {"train_loss": -21.26711654663086, "global_step": 87664, "epoch": 1056} {"train_loss": -21.392898559570312, "global_step": 87665, "epoch": 1056} {"train_loss": -20.985660552978516, "global_step": 87666, "epoch": 1056} {"train_loss": -21.30995750427246, "global_step": 87667, "epoch": 1056} {"train_loss": -21.6866397857666, "global_step": 87668, "epoch": 1056} {"train_loss": -21.433395385742188, "global_step": 87669, "epoch": 1056} {"train_loss": -21.131919860839844, "global_step": 87670, "epoch": 1056} {"train_loss": -21.440465927124023, "global_step": 87671, "epoch": 1056} {"train_loss": -21.61246681213379, "global_step": 87672, "epoch": 1056} {"train_loss": -21.68707847595215, "global_step": 87673, "epoch": 1056} {"train_loss": -21.987777709960938, "global_step": 87674, "epoch": 1056} {"train_loss": -21.367639541625977, "global_step": 87675, "epoch": 1056} {"train_loss": -21.182453155517578, "global_step": 87676, "epoch": 1056} {"train_loss": -21.472047805786133, "global_step": 87677, "epoch": 1056} {"train_loss": -21.05596923828125, "global_step": 87678, "epoch": 1056} {"train_loss": -21.418397903442383, "global_step": 87679, "epoch": 1056} {"train_loss": -21.547155380249023, "global_step": 87680, "epoch": 1056} {"train_loss": -21.6136417388916, "global_step": 87681, "epoch": 1056} {"train_loss": -21.545639038085938, "global_step": 87682, "epoch": 1056} {"train_loss": -21.372831344604492, "global_step": 87683, "epoch": 1056} {"train_loss": -21.545988082885742, "global_step": 87684, "epoch": 1056} {"train_loss": -21.718952178955078, "global_step": 87685, "epoch": 1056} {"train_loss": -21.7437801361084, "global_step": 87686, "epoch": 1056} {"train_loss": -21.368392944335938, "global_step": 87687, "epoch": 1056} {"train_loss": -21.464628219604492, "global_step": 87688, "epoch": 1056} {"train_loss": -21.581302642822266, "global_step": 87689, "epoch": 1056} {"train_loss": -21.444433212280273, "global_step": 87690, "epoch": 1056} {"train_loss": -21.570825576782227, "global_step": 87691, "epoch": 1056} {"train_loss": -21.771596908569336, "global_step": 87692, "epoch": 1056} {"train_loss": -21.13996696472168, "global_step": 87693, "epoch": 1056} {"train_loss": -21.42793846130371, "global_step": 87694, "epoch": 1056} {"train_loss": -21.904022216796875, "global_step": 87695, "epoch": 1056} {"train_loss": -21.32355308532715, "global_step": 87696, "epoch": 1056} {"train_loss": -21.8642520904541, "global_step": 87697, "epoch": 1056} {"train_loss": -21.907085418701172, "global_step": 87698, "epoch": 1056} {"train_loss": -21.563886642456055, "global_step": 87699, "epoch": 1056} {"train_loss": -21.764469146728516, "global_step": 87700, "epoch": 1056} {"train_loss": -21.25421714782715, "global_step": 87701, "epoch": 1056} {"train_loss": -21.39523696899414, "global_step": 87702, "epoch": 1056} {"train_loss": -21.57077980041504, "global_step": 87703, "epoch": 1056} {"train_loss": -21.637929916381836, "global_step": 87704, "epoch": 1056} {"train_loss": -21.90363121032715, "global_step": 87705, "epoch": 1056} {"train_loss": -21.58163833618164, "global_step": 87706, "epoch": 1056} {"train_loss": -21.538496017456055, "global_step": 87707, "epoch": 1056} {"train_loss": -21.118497848510742, "global_step": 87708, "epoch": 1056} {"train_loss": -21.509553909301758, "global_step": 87709, "epoch": 1056} {"train_loss": -21.533605575561523, "global_step": 87710, "epoch": 1056} {"train_loss": -21.688791275024414, "global_step": 87711, "epoch": 1056} {"train_loss": -21.390281677246094, "global_step": 87712, "epoch": 1056} {"train_loss": -21.579532623291016, "global_step": 87713, "epoch": 1056} {"train_loss": -22.091665267944336, "global_step": 87714, "epoch": 1056} {"train_loss": -21.59809112548828, "global_step": 87715, "epoch": 1056} {"train_loss": -21.420398712158203, "global_step": 87716, "epoch": 1056} {"train_loss": -21.390689849853516, "global_step": 87717, "epoch": 1056} {"train_loss": -21.780763626098633, "global_step": 87718, "epoch": 1056} {"train_loss": -21.643583297729492, "global_step": 87719, "epoch": 1056} {"train_loss": -21.645774841308594, "global_step": 87720, "epoch": 1056} {"train_loss": -21.313373565673828, "global_step": 87721, "epoch": 1056} {"train_loss": -21.66855239868164, "global_step": 87722, "epoch": 1056} {"train_loss": -21.73524284362793, "global_step": 87723, "epoch": 1056} {"train_loss": -21.318395614624023, "global_step": 87724, "epoch": 1056} {"train_loss": -22.065921783447266, "global_step": 87725, "epoch": 1056} {"train_loss": -21.83548355102539, "global_step": 87726, "epoch": 1056} {"train_loss": -21.698421478271484, "global_step": 87727, "epoch": 1056} {"train_loss": -21.746604919433594, "global_step": 87728, "epoch": 1056} {"train_loss": -21.32962417602539, "global_step": 87729, "epoch": 1056} {"train_loss": -21.497860828077936, "global_step": 87730, "epoch": 1056, "val_loss": 6108862.0} {"train_loss": -21.40949821472168, "global_step": 87731, "epoch": 1057} {"train_loss": -21.224454879760742, "global_step": 87732, "epoch": 1057} {"train_loss": -21.333219528198242, "global_step": 87733, "epoch": 1057} {"train_loss": -21.141605377197266, "global_step": 87734, "epoch": 1057} {"train_loss": -21.25935935974121, "global_step": 87735, "epoch": 1057} {"train_loss": -21.20875358581543, "global_step": 87736, "epoch": 1057} {"train_loss": -21.344289779663086, "global_step": 87737, "epoch": 1057} {"train_loss": -21.261037826538086, "global_step": 87738, "epoch": 1057} {"train_loss": -21.412185668945312, "global_step": 87739, "epoch": 1057} {"train_loss": -21.295156478881836, "global_step": 87740, "epoch": 1057} {"train_loss": -21.451725006103516, "global_step": 87741, "epoch": 1057} {"train_loss": -21.424184799194336, "global_step": 87742, "epoch": 1057} {"train_loss": -21.40938949584961, "global_step": 87743, "epoch": 1057} {"train_loss": -21.092533111572266, "global_step": 87744, "epoch": 1057} {"train_loss": -21.45472526550293, "global_step": 87745, "epoch": 1057} {"train_loss": -21.10981559753418, "global_step": 87746, "epoch": 1057} {"train_loss": -21.034929275512695, "global_step": 87747, "epoch": 1057} {"train_loss": -21.48488426208496, "global_step": 87748, "epoch": 1057} {"train_loss": -21.507211685180664, "global_step": 87749, "epoch": 1057} {"train_loss": -21.203083038330078, "global_step": 87750, "epoch": 1057} {"train_loss": -21.627483367919922, "global_step": 87751, "epoch": 1057} {"train_loss": -21.709375381469727, "global_step": 87752, "epoch": 1057} {"train_loss": -21.291141510009766, "global_step": 87753, "epoch": 1057} {"train_loss": -21.44398307800293, "global_step": 87754, "epoch": 1057} {"train_loss": -21.60431480407715, "global_step": 87755, "epoch": 1057} {"train_loss": -21.33528709411621, "global_step": 87756, "epoch": 1057} {"train_loss": -21.291406631469727, "global_step": 87757, "epoch": 1057} {"train_loss": -21.66949462890625, "global_step": 87758, "epoch": 1057} {"train_loss": -21.512989044189453, "global_step": 87759, "epoch": 1057} {"train_loss": -21.58009910583496, "global_step": 87760, "epoch": 1057} {"train_loss": -21.568037033081055, "global_step": 87761, "epoch": 1057} {"train_loss": -21.312150955200195, "global_step": 87762, "epoch": 1057} {"train_loss": -21.789281845092773, "global_step": 87763, "epoch": 1057} {"train_loss": -21.547182083129883, "global_step": 87764, "epoch": 1057} {"train_loss": -21.78057289123535, "global_step": 87765, "epoch": 1057} {"train_loss": -21.379465103149414, "global_step": 87766, "epoch": 1057} {"train_loss": -21.328922271728516, "global_step": 87767, "epoch": 1057} {"train_loss": -21.45636749267578, "global_step": 87768, "epoch": 1057} {"train_loss": -21.664705276489258, "global_step": 87769, "epoch": 1057} {"train_loss": -21.309667587280273, "global_step": 87770, "epoch": 1057} {"train_loss": -21.66716957092285, "global_step": 87771, "epoch": 1057} {"train_loss": -21.305278778076172, "global_step": 87772, "epoch": 1057} {"train_loss": -21.77984046936035, "global_step": 87773, "epoch": 1057} {"train_loss": -21.854162216186523, "global_step": 87774, "epoch": 1057} {"train_loss": -21.0709228515625, "global_step": 87775, "epoch": 1057} {"train_loss": -21.53194808959961, "global_step": 87776, "epoch": 1057} {"train_loss": -21.326080322265625, "global_step": 87777, "epoch": 1057} {"train_loss": -21.41429901123047, "global_step": 87778, "epoch": 1057} {"train_loss": -21.70781898498535, "global_step": 87779, "epoch": 1057} {"train_loss": -21.597700119018555, "global_step": 87780, "epoch": 1057} {"train_loss": -21.7435359954834, "global_step": 87781, "epoch": 1057} {"train_loss": -21.029769897460938, "global_step": 87782, "epoch": 1057} {"train_loss": -21.543869018554688, "global_step": 87783, "epoch": 1057} {"train_loss": -21.39417839050293, "global_step": 87784, "epoch": 1057} {"train_loss": -21.418439865112305, "global_step": 87785, "epoch": 1057} {"train_loss": -21.79532241821289, "global_step": 87786, "epoch": 1057} {"train_loss": -21.395858764648438, "global_step": 87787, "epoch": 1057} {"train_loss": -21.661422729492188, "global_step": 87788, "epoch": 1057} {"train_loss": -21.47535514831543, "global_step": 87789, "epoch": 1057} {"train_loss": -21.85367774963379, "global_step": 87790, "epoch": 1057} {"train_loss": -21.525592803955078, "global_step": 87791, "epoch": 1057} {"train_loss": -21.600238800048828, "global_step": 87792, "epoch": 1057} {"train_loss": -21.69161033630371, "global_step": 87793, "epoch": 1057} {"train_loss": -21.597166061401367, "global_step": 87794, "epoch": 1057} {"train_loss": -21.892562866210938, "global_step": 87795, "epoch": 1057} {"train_loss": -21.798343658447266, "global_step": 87796, "epoch": 1057} {"train_loss": -21.661338806152344, "global_step": 87797, "epoch": 1057} {"train_loss": -21.543989181518555, "global_step": 87798, "epoch": 1057} {"train_loss": -21.605504989624023, "global_step": 87799, "epoch": 1057} {"train_loss": -21.611799240112305, "global_step": 87800, "epoch": 1057} {"train_loss": -21.811798095703125, "global_step": 87801, "epoch": 1057} {"train_loss": -21.710309982299805, "global_step": 87802, "epoch": 1057} {"train_loss": -21.761682510375977, "global_step": 87803, "epoch": 1057} {"train_loss": -21.31315040588379, "global_step": 87804, "epoch": 1057} {"train_loss": -21.256460189819336, "global_step": 87805, "epoch": 1057} {"train_loss": -21.728500366210938, "global_step": 87806, "epoch": 1057} {"train_loss": -21.603857040405273, "global_step": 87807, "epoch": 1057} {"train_loss": -21.597412109375, "global_step": 87808, "epoch": 1057} {"train_loss": -21.62171745300293, "global_step": 87809, "epoch": 1057} {"train_loss": -21.73163414001465, "global_step": 87810, "epoch": 1057} {"train_loss": -21.673795700073242, "global_step": 87811, "epoch": 1057} {"train_loss": -21.30379295349121, "global_step": 87812, "epoch": 1057} {"train_loss": -21.49755567527679, "global_step": 87813, "epoch": 1057, "val_loss": 6158154.0} {"train_loss": -21.142364501953125, "global_step": 87814, "epoch": 1058} {"train_loss": -21.18715476989746, "global_step": 87815, "epoch": 1058} {"train_loss": -21.50050926208496, "global_step": 87816, "epoch": 1058} {"train_loss": -21.09895896911621, "global_step": 87817, "epoch": 1058} {"train_loss": -21.252777099609375, "global_step": 87818, "epoch": 1058} {"train_loss": -21.05184555053711, "global_step": 87819, "epoch": 1058} {"train_loss": -21.46561050415039, "global_step": 87820, "epoch": 1058} {"train_loss": -21.037460327148438, "global_step": 87821, "epoch": 1058} {"train_loss": -21.397756576538086, "global_step": 87822, "epoch": 1058} {"train_loss": -21.067733764648438, "global_step": 87823, "epoch": 1058} {"train_loss": -21.36932945251465, "global_step": 87824, "epoch": 1058} {"train_loss": -21.452444076538086, "global_step": 87825, "epoch": 1058} {"train_loss": -21.124195098876953, "global_step": 87826, "epoch": 1058} {"train_loss": -21.25589942932129, "global_step": 87827, "epoch": 1058} {"train_loss": -20.867399215698242, "global_step": 87828, "epoch": 1058} {"train_loss": -21.151365280151367, "global_step": 87829, "epoch": 1058} {"train_loss": -21.391721725463867, "global_step": 87830, "epoch": 1058} {"train_loss": -20.91297149658203, "global_step": 87831, "epoch": 1058} {"train_loss": -21.778841018676758, "global_step": 87832, "epoch": 1058} {"train_loss": -21.5499210357666, "global_step": 87833, "epoch": 1058} {"train_loss": -21.431840896606445, "global_step": 87834, "epoch": 1058} {"train_loss": -21.31748390197754, "global_step": 87835, "epoch": 1058} {"train_loss": -21.643020629882812, "global_step": 87836, "epoch": 1058} {"train_loss": -21.330764770507812, "global_step": 87837, "epoch": 1058} {"train_loss": -21.25312614440918, "global_step": 87838, "epoch": 1058} {"train_loss": -21.597623825073242, "global_step": 87839, "epoch": 1058} {"train_loss": -21.365596771240234, "global_step": 87840, "epoch": 1058} {"train_loss": -21.489545822143555, "global_step": 87841, "epoch": 1058} {"train_loss": -21.424604415893555, "global_step": 87842, "epoch": 1058} {"train_loss": -21.322969436645508, "global_step": 87843, "epoch": 1058} {"train_loss": -21.567550659179688, "global_step": 87844, "epoch": 1058} {"train_loss": -21.53611183166504, "global_step": 87845, "epoch": 1058} {"train_loss": -21.54511260986328, "global_step": 87846, "epoch": 1058} {"train_loss": -21.73516845703125, "global_step": 87847, "epoch": 1058} {"train_loss": -21.921762466430664, "global_step": 87848, "epoch": 1058} {"train_loss": -21.869646072387695, "global_step": 87849, "epoch": 1058} {"train_loss": -21.525243759155273, "global_step": 87850, "epoch": 1058} {"train_loss": -21.678421020507812, "global_step": 87851, "epoch": 1058} {"train_loss": -21.514841079711914, "global_step": 87852, "epoch": 1058} {"train_loss": -21.3384952545166, "global_step": 87853, "epoch": 1058} {"train_loss": -21.719482421875, "global_step": 87854, "epoch": 1058} {"train_loss": -21.795442581176758, "global_step": 87855, "epoch": 1058} {"train_loss": -21.788084030151367, "global_step": 87856, "epoch": 1058} {"train_loss": -21.552536010742188, "global_step": 87857, "epoch": 1058} {"train_loss": -21.36866569519043, "global_step": 87858, "epoch": 1058} {"train_loss": -21.693098068237305, "global_step": 87859, "epoch": 1058} {"train_loss": -20.9810733795166, "global_step": 87860, "epoch": 1058} {"train_loss": -21.42316436767578, "global_step": 87861, "epoch": 1058} {"train_loss": -21.244237899780273, "global_step": 87862, "epoch": 1058} {"train_loss": -21.241544723510742, "global_step": 87863, "epoch": 1058} {"train_loss": -21.72438621520996, "global_step": 87864, "epoch": 1058} {"train_loss": -21.583789825439453, "global_step": 87865, "epoch": 1058} {"train_loss": -21.6724910736084, "global_step": 87866, "epoch": 1058} {"train_loss": -21.537822723388672, "global_step": 87867, "epoch": 1058} {"train_loss": -21.227895736694336, "global_step": 87868, "epoch": 1058} {"train_loss": -21.231115341186523, "global_step": 87869, "epoch": 1058} {"train_loss": -21.244476318359375, "global_step": 87870, "epoch": 1058} {"train_loss": -21.665327072143555, "global_step": 87871, "epoch": 1058} {"train_loss": -21.68027114868164, "global_step": 87872, "epoch": 1058} {"train_loss": -21.300552368164062, "global_step": 87873, "epoch": 1058} {"train_loss": -21.503042221069336, "global_step": 87874, "epoch": 1058} {"train_loss": -20.957048416137695, "global_step": 87875, "epoch": 1058} {"train_loss": -21.82794761657715, "global_step": 87876, "epoch": 1058} {"train_loss": -21.939529418945312, "global_step": 87877, "epoch": 1058} {"train_loss": -21.56951141357422, "global_step": 87878, "epoch": 1058} {"train_loss": -21.294544219970703, "global_step": 87879, "epoch": 1058} {"train_loss": -21.398685455322266, "global_step": 87880, "epoch": 1058} {"train_loss": -21.681716918945312, "global_step": 87881, "epoch": 1058} {"train_loss": -21.688268661499023, "global_step": 87882, "epoch": 1058} {"train_loss": -21.641525268554688, "global_step": 87883, "epoch": 1058} {"train_loss": -21.618494033813477, "global_step": 87884, "epoch": 1058} {"train_loss": -21.13187026977539, "global_step": 87885, "epoch": 1058} {"train_loss": -21.522558212280273, "global_step": 87886, "epoch": 1058} {"train_loss": -21.156328201293945, "global_step": 87887, "epoch": 1058} {"train_loss": -21.469959259033203, "global_step": 87888, "epoch": 1058} {"train_loss": -21.189706802368164, "global_step": 87889, "epoch": 1058} {"train_loss": -21.28630828857422, "global_step": 87890, "epoch": 1058} {"train_loss": -21.21876335144043, "global_step": 87891, "epoch": 1058} {"train_loss": -21.587779998779297, "global_step": 87892, "epoch": 1058} {"train_loss": -21.508695602416992, "global_step": 87893, "epoch": 1058} {"train_loss": -21.515216827392578, "global_step": 87894, "epoch": 1058} {"train_loss": -21.138412475585938, "global_step": 87895, "epoch": 1058} {"train_loss": -21.436639969607434, "global_step": 87896, "epoch": 1058, "val_loss": 6155767.0} {"train_loss": -20.634321212768555, "global_step": 87897, "epoch": 1059} {"train_loss": -21.487567901611328, "global_step": 87898, "epoch": 1059} {"train_loss": -21.067235946655273, "global_step": 87899, "epoch": 1059} {"train_loss": -21.593687057495117, "global_step": 87900, "epoch": 1059} {"train_loss": -21.264877319335938, "global_step": 87901, "epoch": 1059} {"train_loss": -20.936267852783203, "global_step": 87902, "epoch": 1059} {"train_loss": -20.873981475830078, "global_step": 87903, "epoch": 1059} {"train_loss": -21.097869873046875, "global_step": 87904, "epoch": 1059} {"train_loss": -21.16810417175293, "global_step": 87905, "epoch": 1059} {"train_loss": -21.433948516845703, "global_step": 87906, "epoch": 1059} {"train_loss": -21.182565689086914, "global_step": 87907, "epoch": 1059} {"train_loss": -21.314626693725586, "global_step": 87908, "epoch": 1059} {"train_loss": -21.370319366455078, "global_step": 87909, "epoch": 1059} {"train_loss": -21.332181930541992, "global_step": 87910, "epoch": 1059} {"train_loss": -21.290414810180664, "global_step": 87911, "epoch": 1059} {"train_loss": -21.18486976623535, "global_step": 87912, "epoch": 1059} {"train_loss": -21.566802978515625, "global_step": 87913, "epoch": 1059} {"train_loss": -21.332979202270508, "global_step": 87914, "epoch": 1059} {"train_loss": -21.52579689025879, "global_step": 87915, "epoch": 1059} {"train_loss": -21.33060073852539, "global_step": 87916, "epoch": 1059} {"train_loss": -21.505292892456055, "global_step": 87917, "epoch": 1059} {"train_loss": -21.268423080444336, "global_step": 87918, "epoch": 1059} {"train_loss": -21.578895568847656, "global_step": 87919, "epoch": 1059} {"train_loss": -21.477340698242188, "global_step": 87920, "epoch": 1059} {"train_loss": -21.25200843811035, "global_step": 87921, "epoch": 1059} {"train_loss": -21.84914207458496, "global_step": 87922, "epoch": 1059} {"train_loss": -21.695240020751953, "global_step": 87923, "epoch": 1059} {"train_loss": -21.269018173217773, "global_step": 87924, "epoch": 1059} {"train_loss": -21.300296783447266, "global_step": 87925, "epoch": 1059} {"train_loss": -21.50079917907715, "global_step": 87926, "epoch": 1059} {"train_loss": -21.28583335876465, "global_step": 87927, "epoch": 1059} {"train_loss": -21.32493019104004, "global_step": 87928, "epoch": 1059} {"train_loss": -21.899600982666016, "global_step": 87929, "epoch": 1059} {"train_loss": -21.610626220703125, "global_step": 87930, "epoch": 1059} {"train_loss": -21.163043975830078, "global_step": 87931, "epoch": 1059} {"train_loss": -21.271724700927734, "global_step": 87932, "epoch": 1059} {"train_loss": -21.66196060180664, "global_step": 87933, "epoch": 1059} {"train_loss": -21.203182220458984, "global_step": 87934, "epoch": 1059} {"train_loss": -21.64202308654785, "global_step": 87935, "epoch": 1059} {"train_loss": -21.405088424682617, "global_step": 87936, "epoch": 1059} {"train_loss": -21.452167510986328, "global_step": 87937, "epoch": 1059} {"train_loss": -21.5964298248291, "global_step": 87938, "epoch": 1059} {"train_loss": -21.87350845336914, "global_step": 87939, "epoch": 1059} {"train_loss": -21.68471336364746, "global_step": 87940, "epoch": 1059} {"train_loss": -21.422048568725586, "global_step": 87941, "epoch": 1059} {"train_loss": -21.685007095336914, "global_step": 87942, "epoch": 1059} {"train_loss": -21.327993392944336, "global_step": 87943, "epoch": 1059} {"train_loss": -21.447004318237305, "global_step": 87944, "epoch": 1059} {"train_loss": -21.421974182128906, "global_step": 87945, "epoch": 1059} {"train_loss": -21.483139038085938, "global_step": 87946, "epoch": 1059} {"train_loss": -21.645063400268555, "global_step": 87947, "epoch": 1059} {"train_loss": -21.752248764038086, "global_step": 87948, "epoch": 1059} {"train_loss": -21.480220794677734, "global_step": 87949, "epoch": 1059} {"train_loss": -21.612218856811523, "global_step": 87950, "epoch": 1059} {"train_loss": -21.35470962524414, "global_step": 87951, "epoch": 1059} {"train_loss": -21.606985092163086, "global_step": 87952, "epoch": 1059} {"train_loss": -21.3264217376709, "global_step": 87953, "epoch": 1059} {"train_loss": -21.19308090209961, "global_step": 87954, "epoch": 1059} {"train_loss": -21.323232650756836, "global_step": 87955, "epoch": 1059} {"train_loss": -21.638452529907227, "global_step": 87956, "epoch": 1059} {"train_loss": -21.323331832885742, "global_step": 87957, "epoch": 1059} {"train_loss": -21.551645278930664, "global_step": 87958, "epoch": 1059} {"train_loss": -21.14747428894043, "global_step": 87959, "epoch": 1059} {"train_loss": -21.397947311401367, "global_step": 87960, "epoch": 1059} {"train_loss": -21.730405807495117, "global_step": 87961, "epoch": 1059} {"train_loss": -21.240446090698242, "global_step": 87962, "epoch": 1059} {"train_loss": -21.667516708374023, "global_step": 87963, "epoch": 1059} {"train_loss": -21.53786277770996, "global_step": 87964, "epoch": 1059} {"train_loss": -21.244171142578125, "global_step": 87965, "epoch": 1059} {"train_loss": -21.78621482849121, "global_step": 87966, "epoch": 1059} {"train_loss": -21.293272018432617, "global_step": 87967, "epoch": 1059} {"train_loss": -21.749719619750977, "global_step": 87968, "epoch": 1059} {"train_loss": -21.444580078125, "global_step": 87969, "epoch": 1059} {"train_loss": -21.482030868530273, "global_step": 87970, "epoch": 1059} {"train_loss": -21.71161460876465, "global_step": 87971, "epoch": 1059} {"train_loss": -21.328195571899414, "global_step": 87972, "epoch": 1059} {"train_loss": -21.213083267211914, "global_step": 87973, "epoch": 1059} {"train_loss": -21.702287673950195, "global_step": 87974, "epoch": 1059} {"train_loss": -21.452974319458008, "global_step": 87975, "epoch": 1059} {"train_loss": -21.610794067382812, "global_step": 87976, "epoch": 1059} {"train_loss": -21.222503662109375, "global_step": 87977, "epoch": 1059} {"train_loss": -21.687763214111328, "global_step": 87978, "epoch": 1059} {"train_loss": -21.415044692625482, "global_step": 87979, "epoch": 1059, "val_loss": 6031535.0} {"train_loss": -21.20308494567871, "global_step": 87980, "epoch": 1060} {"train_loss": -21.300601959228516, "global_step": 87981, "epoch": 1060} {"train_loss": -21.010501861572266, "global_step": 87982, "epoch": 1060} {"train_loss": -21.270090103149414, "global_step": 87983, "epoch": 1060} {"train_loss": -21.124656677246094, "global_step": 87984, "epoch": 1060} {"train_loss": -21.501054763793945, "global_step": 87985, "epoch": 1060} {"train_loss": -20.903589248657227, "global_step": 87986, "epoch": 1060} {"train_loss": -21.385229110717773, "global_step": 87987, "epoch": 1060} {"train_loss": -21.136320114135742, "global_step": 87988, "epoch": 1060} {"train_loss": -21.602811813354492, "global_step": 87989, "epoch": 1060} {"train_loss": -21.30143165588379, "global_step": 87990, "epoch": 1060} {"train_loss": -21.555761337280273, "global_step": 87991, "epoch": 1060} {"train_loss": -21.3712158203125, "global_step": 87992, "epoch": 1060} {"train_loss": -21.387311935424805, "global_step": 87993, "epoch": 1060} {"train_loss": -21.274852752685547, "global_step": 87994, "epoch": 1060} {"train_loss": -21.371612548828125, "global_step": 87995, "epoch": 1060} {"train_loss": -21.712158203125, "global_step": 87996, "epoch": 1060} {"train_loss": -21.514427185058594, "global_step": 87997, "epoch": 1060} {"train_loss": -21.534399032592773, "global_step": 87998, "epoch": 1060} {"train_loss": -21.382095336914062, "global_step": 87999, "epoch": 1060} {"train_loss": -21.458953857421875, "global_step": 88000, "epoch": 1060} {"train_loss": -21.6424503326416, "global_step": 88001, "epoch": 1060} {"train_loss": -21.603694915771484, "global_step": 88002, "epoch": 1060} {"train_loss": -21.225202560424805, "global_step": 88003, "epoch": 1060} {"train_loss": -21.414535522460938, "global_step": 88004, "epoch": 1060} {"train_loss": -21.637939453125, "global_step": 88005, "epoch": 1060} {"train_loss": -21.165592193603516, "global_step": 88006, "epoch": 1060} {"train_loss": -21.639949798583984, "global_step": 88007, "epoch": 1060} {"train_loss": -21.310443878173828, "global_step": 88008, "epoch": 1060} {"train_loss": -21.717554092407227, "global_step": 88009, "epoch": 1060} {"train_loss": -21.722742080688477, "global_step": 88010, "epoch": 1060} {"train_loss": -21.726978302001953, "global_step": 88011, "epoch": 1060} {"train_loss": -21.55731773376465, "global_step": 88012, "epoch": 1060} {"train_loss": -21.505558013916016, "global_step": 88013, "epoch": 1060} {"train_loss": -21.424365997314453, "global_step": 88014, "epoch": 1060} {"train_loss": -21.132417678833008, "global_step": 88015, "epoch": 1060} {"train_loss": -21.41867446899414, "global_step": 88016, "epoch": 1060} {"train_loss": -21.439260482788086, "global_step": 88017, "epoch": 1060} {"train_loss": -21.483810424804688, "global_step": 88018, "epoch": 1060} {"train_loss": -21.449495315551758, "global_step": 88019, "epoch": 1060} {"train_loss": -21.49104881286621, "global_step": 88020, "epoch": 1060} {"train_loss": -21.704730987548828, "global_step": 88021, "epoch": 1060} {"train_loss": -21.115447998046875, "global_step": 88022, "epoch": 1060} {"train_loss": -21.520414352416992, "global_step": 88023, "epoch": 1060} {"train_loss": -21.587581634521484, "global_step": 88024, "epoch": 1060} {"train_loss": -21.718942642211914, "global_step": 88025, "epoch": 1060} {"train_loss": -21.64432144165039, "global_step": 88026, "epoch": 1060} {"train_loss": -21.416574478149414, "global_step": 88027, "epoch": 1060} {"train_loss": -21.231624603271484, "global_step": 88028, "epoch": 1060} {"train_loss": -21.210832595825195, "global_step": 88029, "epoch": 1060} {"train_loss": -21.5452823638916, "global_step": 88030, "epoch": 1060} {"train_loss": -21.299570083618164, "global_step": 88031, "epoch": 1060} {"train_loss": -21.342609405517578, "global_step": 88032, "epoch": 1060} {"train_loss": -21.45134925842285, "global_step": 88033, "epoch": 1060} {"train_loss": -21.597238540649414, "global_step": 88034, "epoch": 1060} {"train_loss": -21.12727928161621, "global_step": 88035, "epoch": 1060} {"train_loss": -21.606130599975586, "global_step": 88036, "epoch": 1060} {"train_loss": -21.567729949951172, "global_step": 88037, "epoch": 1060} {"train_loss": -21.61164665222168, "global_step": 88038, "epoch": 1060} {"train_loss": -21.550764083862305, "global_step": 88039, "epoch": 1060} {"train_loss": -21.31911277770996, "global_step": 88040, "epoch": 1060} {"train_loss": -21.628049850463867, "global_step": 88041, "epoch": 1060} {"train_loss": -21.48402214050293, "global_step": 88042, "epoch": 1060} {"train_loss": -21.361188888549805, "global_step": 88043, "epoch": 1060} {"train_loss": -21.56389045715332, "global_step": 88044, "epoch": 1060} {"train_loss": -21.000411987304688, "global_step": 88045, "epoch": 1060} {"train_loss": -21.90128517150879, "global_step": 88046, "epoch": 1060} {"train_loss": -21.677078247070312, "global_step": 88047, "epoch": 1060} {"train_loss": -21.728885650634766, "global_step": 88048, "epoch": 1060} {"train_loss": -21.666873931884766, "global_step": 88049, "epoch": 1060} {"train_loss": -21.290971755981445, "global_step": 88050, "epoch": 1060} {"train_loss": -21.901123046875, "global_step": 88051, "epoch": 1060} {"train_loss": -21.72250747680664, "global_step": 88052, "epoch": 1060} {"train_loss": -21.651247024536133, "global_step": 88053, "epoch": 1060} {"train_loss": -21.392559051513672, "global_step": 88054, "epoch": 1060} {"train_loss": -21.61094856262207, "global_step": 88055, "epoch": 1060} {"train_loss": -21.533414840698242, "global_step": 88056, "epoch": 1060} {"train_loss": -21.376100540161133, "global_step": 88057, "epoch": 1060} {"train_loss": -21.891910552978516, "global_step": 88058, "epoch": 1060} {"train_loss": -21.894210815429688, "global_step": 88059, "epoch": 1060} {"train_loss": -21.695138931274414, "global_step": 88060, "epoch": 1060} {"train_loss": -21.29257583618164, "global_step": 88061, "epoch": 1060} {"train_loss": -21.47395368369229, "global_step": 88062, "epoch": 1060, "val_loss": 6036418.0} {"train_loss": -21.106122970581055, "global_step": 88063, "epoch": 1061} {"train_loss": -21.696998596191406, "global_step": 88064, "epoch": 1061} {"train_loss": -21.427387237548828, "global_step": 88065, "epoch": 1061} {"train_loss": -21.425189971923828, "global_step": 88066, "epoch": 1061} {"train_loss": -21.256607055664062, "global_step": 88067, "epoch": 1061} {"train_loss": -21.439661026000977, "global_step": 88068, "epoch": 1061} {"train_loss": -21.64002227783203, "global_step": 88069, "epoch": 1061} {"train_loss": -21.08112335205078, "global_step": 88070, "epoch": 1061} {"train_loss": -21.426105499267578, "global_step": 88071, "epoch": 1061} {"train_loss": -21.615385055541992, "global_step": 88072, "epoch": 1061} {"train_loss": -21.433937072753906, "global_step": 88073, "epoch": 1061} {"train_loss": -21.326725006103516, "global_step": 88074, "epoch": 1061} {"train_loss": -21.415494918823242, "global_step": 88075, "epoch": 1061} {"train_loss": -21.646339416503906, "global_step": 88076, "epoch": 1061} {"train_loss": -21.433935165405273, "global_step": 88077, "epoch": 1061} {"train_loss": -21.64735221862793, "global_step": 88078, "epoch": 1061} {"train_loss": -21.50431251525879, "global_step": 88079, "epoch": 1061} {"train_loss": -21.49228286743164, "global_step": 88080, "epoch": 1061} {"train_loss": -21.769500732421875, "global_step": 88081, "epoch": 1061} {"train_loss": -21.495325088500977, "global_step": 88082, "epoch": 1061} {"train_loss": -21.340015411376953, "global_step": 88083, "epoch": 1061} {"train_loss": -21.691848754882812, "global_step": 88084, "epoch": 1061} {"train_loss": -21.42130470275879, "global_step": 88085, "epoch": 1061} {"train_loss": -21.251340866088867, "global_step": 88086, "epoch": 1061} {"train_loss": -21.75272560119629, "global_step": 88087, "epoch": 1061} {"train_loss": -21.43214988708496, "global_step": 88088, "epoch": 1061} {"train_loss": -21.54479217529297, "global_step": 88089, "epoch": 1061} {"train_loss": -21.63541603088379, "global_step": 88090, "epoch": 1061} {"train_loss": -21.751829147338867, "global_step": 88091, "epoch": 1061} {"train_loss": -21.641756057739258, "global_step": 88092, "epoch": 1061} {"train_loss": -21.52070426940918, "global_step": 88093, "epoch": 1061} {"train_loss": -21.199796676635742, "global_step": 88094, "epoch": 1061} {"train_loss": -21.3977108001709, "global_step": 88095, "epoch": 1061} {"train_loss": -21.388166427612305, "global_step": 88096, "epoch": 1061} {"train_loss": -21.7827091217041, "global_step": 88097, "epoch": 1061} {"train_loss": -21.552053451538086, "global_step": 88098, "epoch": 1061} {"train_loss": -21.496719360351562, "global_step": 88099, "epoch": 1061} {"train_loss": -21.75592613220215, "global_step": 88100, "epoch": 1061} {"train_loss": -21.64473533630371, "global_step": 88101, "epoch": 1061} {"train_loss": -21.548952102661133, "global_step": 88102, "epoch": 1061} {"train_loss": -21.678482055664062, "global_step": 88103, "epoch": 1061} {"train_loss": -21.74433708190918, "global_step": 88104, "epoch": 1061} {"train_loss": -21.51678466796875, "global_step": 88105, "epoch": 1061} {"train_loss": -21.956125259399414, "global_step": 88106, "epoch": 1061} {"train_loss": -21.467334747314453, "global_step": 88107, "epoch": 1061} {"train_loss": -21.5087833404541, "global_step": 88108, "epoch": 1061} {"train_loss": -21.44475746154785, "global_step": 88109, "epoch": 1061} {"train_loss": -21.46533966064453, "global_step": 88110, "epoch": 1061} {"train_loss": -21.423416137695312, "global_step": 88111, "epoch": 1061} {"train_loss": -21.613874435424805, "global_step": 88112, "epoch": 1061} {"train_loss": -21.766677856445312, "global_step": 88113, "epoch": 1061} {"train_loss": -21.534711837768555, "global_step": 88114, "epoch": 1061} {"train_loss": -21.159610748291016, "global_step": 88115, "epoch": 1061} {"train_loss": -21.614805221557617, "global_step": 88116, "epoch": 1061} {"train_loss": -21.687602996826172, "global_step": 88117, "epoch": 1061} {"train_loss": -21.500402450561523, "global_step": 88118, "epoch": 1061} {"train_loss": -21.329757690429688, "global_step": 88119, "epoch": 1061} {"train_loss": -21.331716537475586, "global_step": 88120, "epoch": 1061} {"train_loss": -21.652156829833984, "global_step": 88121, "epoch": 1061} {"train_loss": -21.588375091552734, "global_step": 88122, "epoch": 1061} {"train_loss": -21.578754425048828, "global_step": 88123, "epoch": 1061} {"train_loss": -21.68745231628418, "global_step": 88124, "epoch": 1061} {"train_loss": -21.50919532775879, "global_step": 88125, "epoch": 1061} {"train_loss": -21.4013729095459, "global_step": 88126, "epoch": 1061} {"train_loss": -21.57564353942871, "global_step": 88127, "epoch": 1061} {"train_loss": -21.619382858276367, "global_step": 88128, "epoch": 1061} {"train_loss": -21.506921768188477, "global_step": 88129, "epoch": 1061} {"train_loss": -21.620447158813477, "global_step": 88130, "epoch": 1061} {"train_loss": -21.594167709350586, "global_step": 88131, "epoch": 1061} {"train_loss": -21.487842559814453, "global_step": 88132, "epoch": 1061} {"train_loss": -21.625165939331055, "global_step": 88133, "epoch": 1061} {"train_loss": -21.36408233642578, "global_step": 88134, "epoch": 1061} {"train_loss": -21.73499870300293, "global_step": 88135, "epoch": 1061} {"train_loss": -21.511817932128906, "global_step": 88136, "epoch": 1061} {"train_loss": -21.52126121520996, "global_step": 88137, "epoch": 1061} {"train_loss": -21.776212692260742, "global_step": 88138, "epoch": 1061} {"train_loss": -21.417221069335938, "global_step": 88139, "epoch": 1061} {"train_loss": -21.60157585144043, "global_step": 88140, "epoch": 1061} {"train_loss": -21.56390380859375, "global_step": 88141, "epoch": 1061} {"train_loss": -21.720548629760742, "global_step": 88142, "epoch": 1061} {"train_loss": -21.51678466796875, "global_step": 88143, "epoch": 1061} {"train_loss": -21.604928970336914, "global_step": 88144, "epoch": 1061} {"train_loss": -21.54015269911433, "global_step": 88145, "epoch": 1061, "val_loss": 6309241.0} {"train_loss": -20.79026222229004, "global_step": 88146, "epoch": 1062} {"train_loss": -21.112741470336914, "global_step": 88147, "epoch": 1062} {"train_loss": -21.798986434936523, "global_step": 88148, "epoch": 1062} {"train_loss": -21.3073673248291, "global_step": 88149, "epoch": 1062} {"train_loss": -21.262577056884766, "global_step": 88150, "epoch": 1062} {"train_loss": -20.83085823059082, "global_step": 88151, "epoch": 1062} {"train_loss": -21.390811920166016, "global_step": 88152, "epoch": 1062} {"train_loss": -21.134166717529297, "global_step": 88153, "epoch": 1062} {"train_loss": -21.399250030517578, "global_step": 88154, "epoch": 1062} {"train_loss": -21.52337646484375, "global_step": 88155, "epoch": 1062} {"train_loss": -21.28116226196289, "global_step": 88156, "epoch": 1062} {"train_loss": -21.463308334350586, "global_step": 88157, "epoch": 1062} {"train_loss": -21.45907211303711, "global_step": 88158, "epoch": 1062} {"train_loss": -21.450674057006836, "global_step": 88159, "epoch": 1062} {"train_loss": -21.19047737121582, "global_step": 88160, "epoch": 1062} {"train_loss": -21.317136764526367, "global_step": 88161, "epoch": 1062} {"train_loss": -21.723012924194336, "global_step": 88162, "epoch": 1062} {"train_loss": -21.382522583007812, "global_step": 88163, "epoch": 1062} {"train_loss": -21.22542381286621, "global_step": 88164, "epoch": 1062} {"train_loss": -21.67893409729004, "global_step": 88165, "epoch": 1062} {"train_loss": -21.77937126159668, "global_step": 88166, "epoch": 1062} {"train_loss": -21.322233200073242, "global_step": 88167, "epoch": 1062} {"train_loss": -21.479124069213867, "global_step": 88168, "epoch": 1062} {"train_loss": -21.665761947631836, "global_step": 88169, "epoch": 1062} {"train_loss": -21.362991333007812, "global_step": 88170, "epoch": 1062} {"train_loss": -21.487552642822266, "global_step": 88171, "epoch": 1062} {"train_loss": -21.66150665283203, "global_step": 88172, "epoch": 1062} {"train_loss": -21.166799545288086, "global_step": 88173, "epoch": 1062} {"train_loss": -21.641042709350586, "global_step": 88174, "epoch": 1062} {"train_loss": -21.304941177368164, "global_step": 88175, "epoch": 1062} {"train_loss": -21.434362411499023, "global_step": 88176, "epoch": 1062} {"train_loss": -21.158742904663086, "global_step": 88177, "epoch": 1062} {"train_loss": -21.313039779663086, "global_step": 88178, "epoch": 1062} {"train_loss": -21.212953567504883, "global_step": 88179, "epoch": 1062} {"train_loss": -21.76641273498535, "global_step": 88180, "epoch": 1062} {"train_loss": -22.056180953979492, "global_step": 88181, "epoch": 1062} {"train_loss": -21.31751823425293, "global_step": 88182, "epoch": 1062} {"train_loss": -21.83019256591797, "global_step": 88183, "epoch": 1062} {"train_loss": -21.215890884399414, "global_step": 88184, "epoch": 1062} {"train_loss": -21.41285514831543, "global_step": 88185, "epoch": 1062} {"train_loss": -21.52083396911621, "global_step": 88186, "epoch": 1062} {"train_loss": -21.594409942626953, "global_step": 88187, "epoch": 1062} {"train_loss": -21.87604331970215, "global_step": 88188, "epoch": 1062} {"train_loss": -21.48247528076172, "global_step": 88189, "epoch": 1062} {"train_loss": -21.6103515625, "global_step": 88190, "epoch": 1062} {"train_loss": -21.284473419189453, "global_step": 88191, "epoch": 1062} {"train_loss": -21.60382652282715, "global_step": 88192, "epoch": 1062} {"train_loss": -21.64839744567871, "global_step": 88193, "epoch": 1062} {"train_loss": -21.563350677490234, "global_step": 88194, "epoch": 1062} {"train_loss": -21.15822410583496, "global_step": 88195, "epoch": 1062} {"train_loss": -20.916488647460938, "global_step": 88196, "epoch": 1062} {"train_loss": -21.479145050048828, "global_step": 88197, "epoch": 1062} {"train_loss": -21.19630241394043, "global_step": 88198, "epoch": 1062} {"train_loss": -21.679533004760742, "global_step": 88199, "epoch": 1062} {"train_loss": -21.594045639038086, "global_step": 88200, "epoch": 1062} {"train_loss": -21.333709716796875, "global_step": 88201, "epoch": 1062} {"train_loss": -21.426115036010742, "global_step": 88202, "epoch": 1062} {"train_loss": -21.36464500427246, "global_step": 88203, "epoch": 1062} {"train_loss": -21.193832397460938, "global_step": 88204, "epoch": 1062} {"train_loss": -21.305994033813477, "global_step": 88205, "epoch": 1062} {"train_loss": -21.794586181640625, "global_step": 88206, "epoch": 1062} {"train_loss": -21.32415199279785, "global_step": 88207, "epoch": 1062} {"train_loss": -21.397281646728516, "global_step": 88208, "epoch": 1062} {"train_loss": -21.578737258911133, "global_step": 88209, "epoch": 1062} {"train_loss": -21.029996871948242, "global_step": 88210, "epoch": 1062} {"train_loss": -21.180583953857422, "global_step": 88211, "epoch": 1062} {"train_loss": -21.892637252807617, "global_step": 88212, "epoch": 1062} {"train_loss": -21.291275024414062, "global_step": 88213, "epoch": 1062} {"train_loss": -21.616390228271484, "global_step": 88214, "epoch": 1062} {"train_loss": -21.344079971313477, "global_step": 88215, "epoch": 1062} {"train_loss": -21.7409610748291, "global_step": 88216, "epoch": 1062} {"train_loss": -21.461685180664062, "global_step": 88217, "epoch": 1062} {"train_loss": -21.492462158203125, "global_step": 88218, "epoch": 1062} {"train_loss": -21.0112361907959, "global_step": 88219, "epoch": 1062} {"train_loss": -21.090681076049805, "global_step": 88220, "epoch": 1062} {"train_loss": -21.620248794555664, "global_step": 88221, "epoch": 1062} {"train_loss": -21.522659301757812, "global_step": 88222, "epoch": 1062} {"train_loss": -21.579648971557617, "global_step": 88223, "epoch": 1062} {"train_loss": -21.58576774597168, "global_step": 88224, "epoch": 1062} {"train_loss": -21.664386749267578, "global_step": 88225, "epoch": 1062} {"train_loss": -21.561960220336914, "global_step": 88226, "epoch": 1062} {"train_loss": -21.60695457458496, "global_step": 88227, "epoch": 1062} {"train_loss": -21.41592862232622, "global_step": 88228, "epoch": 1062, "val_loss": 6018717.5} {"train_loss": -21.598514556884766, "global_step": 88229, "epoch": 1063} {"train_loss": -21.38344383239746, "global_step": 88230, "epoch": 1063} {"train_loss": -21.12272071838379, "global_step": 88231, "epoch": 1063} {"train_loss": -21.102642059326172, "global_step": 88232, "epoch": 1063} {"train_loss": -21.241260528564453, "global_step": 88233, "epoch": 1063} {"train_loss": -20.943662643432617, "global_step": 88234, "epoch": 1063} {"train_loss": -21.06760025024414, "global_step": 88235, "epoch": 1063} {"train_loss": -21.099609375, "global_step": 88236, "epoch": 1063} {"train_loss": -21.357154846191406, "global_step": 88237, "epoch": 1063} {"train_loss": -21.575592041015625, "global_step": 88238, "epoch": 1063} {"train_loss": -21.503875732421875, "global_step": 88239, "epoch": 1063} {"train_loss": -21.423877716064453, "global_step": 88240, "epoch": 1063} {"train_loss": -21.977781295776367, "global_step": 88241, "epoch": 1063} {"train_loss": -21.20120620727539, "global_step": 88242, "epoch": 1063} {"train_loss": -21.17866325378418, "global_step": 88243, "epoch": 1063} {"train_loss": -21.32590675354004, "global_step": 88244, "epoch": 1063} {"train_loss": -21.29806137084961, "global_step": 88245, "epoch": 1063} {"train_loss": -21.522476196289062, "global_step": 88246, "epoch": 1063} {"train_loss": -21.4536190032959, "global_step": 88247, "epoch": 1063} {"train_loss": -21.163822174072266, "global_step": 88248, "epoch": 1063} {"train_loss": -21.20492935180664, "global_step": 88249, "epoch": 1063} {"train_loss": -21.49540138244629, "global_step": 88250, "epoch": 1063} {"train_loss": -21.544178009033203, "global_step": 88251, "epoch": 1063} {"train_loss": -21.364160537719727, "global_step": 88252, "epoch": 1063} {"train_loss": -21.328176498413086, "global_step": 88253, "epoch": 1063} {"train_loss": -21.640466690063477, "global_step": 88254, "epoch": 1063} {"train_loss": -21.15257453918457, "global_step": 88255, "epoch": 1063} {"train_loss": -21.3585205078125, "global_step": 88256, "epoch": 1063} {"train_loss": -21.623029708862305, "global_step": 88257, "epoch": 1063} {"train_loss": -21.420072555541992, "global_step": 88258, "epoch": 1063} {"train_loss": -21.659032821655273, "global_step": 88259, "epoch": 1063} {"train_loss": -21.585039138793945, "global_step": 88260, "epoch": 1063} {"train_loss": -21.522891998291016, "global_step": 88261, "epoch": 1063} {"train_loss": -21.687868118286133, "global_step": 88262, "epoch": 1063} {"train_loss": -21.405323028564453, "global_step": 88263, "epoch": 1063} {"train_loss": -21.686790466308594, "global_step": 88264, "epoch": 1063} {"train_loss": -21.67801284790039, "global_step": 88265, "epoch": 1063} {"train_loss": -21.370189666748047, "global_step": 88266, "epoch": 1063} {"train_loss": -21.975671768188477, "global_step": 88267, "epoch": 1063} {"train_loss": -21.725656509399414, "global_step": 88268, "epoch": 1063} {"train_loss": -21.583810806274414, "global_step": 88269, "epoch": 1063} {"train_loss": -21.356346130371094, "global_step": 88270, "epoch": 1063} {"train_loss": -21.581979751586914, "global_step": 88271, "epoch": 1063} {"train_loss": -21.662521362304688, "global_step": 88272, "epoch": 1063} {"train_loss": -21.821598052978516, "global_step": 88273, "epoch": 1063} {"train_loss": -21.915647506713867, "global_step": 88274, "epoch": 1063} {"train_loss": -21.627683639526367, "global_step": 88275, "epoch": 1063} {"train_loss": -21.639123916625977, "global_step": 88276, "epoch": 1063} {"train_loss": -21.384336471557617, "global_step": 88277, "epoch": 1063} {"train_loss": -21.62095832824707, "global_step": 88278, "epoch": 1063} {"train_loss": -21.396326065063477, "global_step": 88279, "epoch": 1063} {"train_loss": -21.218664169311523, "global_step": 88280, "epoch": 1063} {"train_loss": -21.249305725097656, "global_step": 88281, "epoch": 1063} {"train_loss": -21.382139205932617, "global_step": 88282, "epoch": 1063} {"train_loss": -21.25115203857422, "global_step": 88283, "epoch": 1063} {"train_loss": -21.64692497253418, "global_step": 88284, "epoch": 1063} {"train_loss": -21.173757553100586, "global_step": 88285, "epoch": 1063} {"train_loss": -21.485218048095703, "global_step": 88286, "epoch": 1063} {"train_loss": -21.074893951416016, "global_step": 88287, "epoch": 1063} {"train_loss": -21.736637115478516, "global_step": 88288, "epoch": 1063} {"train_loss": -21.265567779541016, "global_step": 88289, "epoch": 1063} {"train_loss": -21.592622756958008, "global_step": 88290, "epoch": 1063} {"train_loss": -21.22848129272461, "global_step": 88291, "epoch": 1063} {"train_loss": -21.26679801940918, "global_step": 88292, "epoch": 1063} {"train_loss": -21.56821060180664, "global_step": 88293, "epoch": 1063} {"train_loss": -21.594266891479492, "global_step": 88294, "epoch": 1063} {"train_loss": -21.77105140686035, "global_step": 88295, "epoch": 1063} {"train_loss": -21.43494987487793, "global_step": 88296, "epoch": 1063} {"train_loss": -21.265546798706055, "global_step": 88297, "epoch": 1063} {"train_loss": -21.512052536010742, "global_step": 88298, "epoch": 1063} {"train_loss": -21.508909225463867, "global_step": 88299, "epoch": 1063} {"train_loss": -21.66457176208496, "global_step": 88300, "epoch": 1063} {"train_loss": -21.434926986694336, "global_step": 88301, "epoch": 1063} {"train_loss": -21.339200973510742, "global_step": 88302, "epoch": 1063} {"train_loss": -21.815980911254883, "global_step": 88303, "epoch": 1063} {"train_loss": -21.778676986694336, "global_step": 88304, "epoch": 1063} {"train_loss": -21.90704345703125, "global_step": 88305, "epoch": 1063} {"train_loss": -21.856725692749023, "global_step": 88306, "epoch": 1063} {"train_loss": -21.6811580657959, "global_step": 88307, "epoch": 1063} {"train_loss": -21.703805923461914, "global_step": 88308, "epoch": 1063} {"train_loss": -21.448486328125, "global_step": 88309, "epoch": 1063} {"train_loss": -21.963905334472656, "global_step": 88310, "epoch": 1063} {"train_loss": -21.48282515284527, "global_step": 88311, "epoch": 1063, "val_loss": 6220910.0} {"train_loss": -20.809711456298828, "global_step": 88312, "epoch": 1064} {"train_loss": -21.00052833557129, "global_step": 88313, "epoch": 1064} {"train_loss": -20.97942352294922, "global_step": 88314, "epoch": 1064} {"train_loss": -20.7282657623291, "global_step": 88315, "epoch": 1064} {"train_loss": -20.799772262573242, "global_step": 88316, "epoch": 1064} {"train_loss": -21.1010684967041, "global_step": 88317, "epoch": 1064} {"train_loss": -21.083133697509766, "global_step": 88318, "epoch": 1064} {"train_loss": -20.926137924194336, "global_step": 88319, "epoch": 1064} {"train_loss": -21.04587173461914, "global_step": 88320, "epoch": 1064} {"train_loss": -20.977336883544922, "global_step": 88321, "epoch": 1064} {"train_loss": -20.7558650970459, "global_step": 88322, "epoch": 1064} {"train_loss": -20.60198211669922, "global_step": 88323, "epoch": 1064} {"train_loss": -21.324602127075195, "global_step": 88324, "epoch": 1064} {"train_loss": -20.810943603515625, "global_step": 88325, "epoch": 1064} {"train_loss": -21.358789443969727, "global_step": 88326, "epoch": 1064} {"train_loss": -20.659923553466797, "global_step": 88327, "epoch": 1064} {"train_loss": -21.414094924926758, "global_step": 88328, "epoch": 1064} {"train_loss": -21.489160537719727, "global_step": 88329, "epoch": 1064} {"train_loss": -21.244016647338867, "global_step": 88330, "epoch": 1064} {"train_loss": -21.21452522277832, "global_step": 88331, "epoch": 1064} {"train_loss": -21.613195419311523, "global_step": 88332, "epoch": 1064} {"train_loss": -21.54376220703125, "global_step": 88333, "epoch": 1064} {"train_loss": -21.32961654663086, "global_step": 88334, "epoch": 1064} {"train_loss": -21.78383445739746, "global_step": 88335, "epoch": 1064} {"train_loss": -21.496431350708008, "global_step": 88336, "epoch": 1064} {"train_loss": -21.428604125976562, "global_step": 88337, "epoch": 1064} {"train_loss": -21.881011962890625, "global_step": 88338, "epoch": 1064} {"train_loss": -21.231992721557617, "global_step": 88339, "epoch": 1064} {"train_loss": -21.85334587097168, "global_step": 88340, "epoch": 1064} {"train_loss": -21.64149284362793, "global_step": 88341, "epoch": 1064} {"train_loss": -20.999618530273438, "global_step": 88342, "epoch": 1064} {"train_loss": -21.73550796508789, "global_step": 88343, "epoch": 1064} {"train_loss": -21.826547622680664, "global_step": 88344, "epoch": 1064} {"train_loss": -21.458837509155273, "global_step": 88345, "epoch": 1064} {"train_loss": -21.098251342773438, "global_step": 88346, "epoch": 1064} {"train_loss": -21.405866622924805, "global_step": 88347, "epoch": 1064} {"train_loss": -21.257797241210938, "global_step": 88348, "epoch": 1064} {"train_loss": -21.420093536376953, "global_step": 88349, "epoch": 1064} {"train_loss": -21.602880477905273, "global_step": 88350, "epoch": 1064} {"train_loss": -21.459016799926758, "global_step": 88351, "epoch": 1064} {"train_loss": -21.569353103637695, "global_step": 88352, "epoch": 1064} {"train_loss": -21.71173667907715, "global_step": 88353, "epoch": 1064} {"train_loss": -21.50616455078125, "global_step": 88354, "epoch": 1064} {"train_loss": -21.3167781829834, "global_step": 88355, "epoch": 1064} {"train_loss": -21.627336502075195, "global_step": 88356, "epoch": 1064} {"train_loss": -21.802791595458984, "global_step": 88357, "epoch": 1064} {"train_loss": -21.719064712524414, "global_step": 88358, "epoch": 1064} {"train_loss": -21.263473510742188, "global_step": 88359, "epoch": 1064} {"train_loss": -21.504940032958984, "global_step": 88360, "epoch": 1064} {"train_loss": -21.790719985961914, "global_step": 88361, "epoch": 1064} {"train_loss": -21.81914520263672, "global_step": 88362, "epoch": 1064} {"train_loss": -21.232250213623047, "global_step": 88363, "epoch": 1064} {"train_loss": -21.42949676513672, "global_step": 88364, "epoch": 1064} {"train_loss": -21.26334571838379, "global_step": 88365, "epoch": 1064} {"train_loss": -21.626882553100586, "global_step": 88366, "epoch": 1064} {"train_loss": -21.599821090698242, "global_step": 88367, "epoch": 1064} {"train_loss": -21.692150115966797, "global_step": 88368, "epoch": 1064} {"train_loss": -21.60346794128418, "global_step": 88369, "epoch": 1064} {"train_loss": -21.401670455932617, "global_step": 88370, "epoch": 1064} {"train_loss": -21.92133140563965, "global_step": 88371, "epoch": 1064} {"train_loss": -21.46173667907715, "global_step": 88372, "epoch": 1064} {"train_loss": -21.784528732299805, "global_step": 88373, "epoch": 1064} {"train_loss": -21.52168846130371, "global_step": 88374, "epoch": 1064} {"train_loss": -21.46504783630371, "global_step": 88375, "epoch": 1064} {"train_loss": -21.54007339477539, "global_step": 88376, "epoch": 1064} {"train_loss": -21.8030948638916, "global_step": 88377, "epoch": 1064} {"train_loss": -21.511035919189453, "global_step": 88378, "epoch": 1064} {"train_loss": -21.553640365600586, "global_step": 88379, "epoch": 1064} {"train_loss": -21.80124282836914, "global_step": 88380, "epoch": 1064} {"train_loss": -21.66229248046875, "global_step": 88381, "epoch": 1064} {"train_loss": -21.615842819213867, "global_step": 88382, "epoch": 1064} {"train_loss": -21.652883529663086, "global_step": 88383, "epoch": 1064} {"train_loss": -21.653051376342773, "global_step": 88384, "epoch": 1064} {"train_loss": -21.327342987060547, "global_step": 88385, "epoch": 1064} {"train_loss": -21.466796875, "global_step": 88386, "epoch": 1064} {"train_loss": -21.687055587768555, "global_step": 88387, "epoch": 1064} {"train_loss": -21.7203369140625, "global_step": 88388, "epoch": 1064} {"train_loss": -21.611465454101562, "global_step": 88389, "epoch": 1064} {"train_loss": -21.6192684173584, "global_step": 88390, "epoch": 1064} {"train_loss": -21.43265151977539, "global_step": 88391, "epoch": 1064} {"train_loss": -21.617603302001953, "global_step": 88392, "epoch": 1064} {"train_loss": -21.78226661682129, "global_step": 88393, "epoch": 1064} {"train_loss": -21.430413395525463, "global_step": 88394, "epoch": 1064, "val_loss": 6030648.5} {"train_loss": -21.095775604248047, "global_step": 88395, "epoch": 1065} {"train_loss": -21.5125675201416, "global_step": 88396, "epoch": 1065} {"train_loss": -21.651792526245117, "global_step": 88397, "epoch": 1065} {"train_loss": -21.55291748046875, "global_step": 88398, "epoch": 1065} {"train_loss": -21.29576873779297, "global_step": 88399, "epoch": 1065} {"train_loss": -21.184738159179688, "global_step": 88400, "epoch": 1065} {"train_loss": -21.30689811706543, "global_step": 88401, "epoch": 1065} {"train_loss": -20.88974380493164, "global_step": 88402, "epoch": 1065} {"train_loss": -21.425556182861328, "global_step": 88403, "epoch": 1065} {"train_loss": -21.60202980041504, "global_step": 88404, "epoch": 1065} {"train_loss": -21.512727737426758, "global_step": 88405, "epoch": 1065} {"train_loss": -21.084854125976562, "global_step": 88406, "epoch": 1065} {"train_loss": -21.615568161010742, "global_step": 88407, "epoch": 1065} {"train_loss": -21.172372817993164, "global_step": 88408, "epoch": 1065} {"train_loss": -21.26704216003418, "global_step": 88409, "epoch": 1065} {"train_loss": -21.309864044189453, "global_step": 88410, "epoch": 1065} {"train_loss": -21.698856353759766, "global_step": 88411, "epoch": 1065} {"train_loss": -21.399423599243164, "global_step": 88412, "epoch": 1065} {"train_loss": -21.17496109008789, "global_step": 88413, "epoch": 1065} {"train_loss": -21.483905792236328, "global_step": 88414, "epoch": 1065} {"train_loss": -21.583145141601562, "global_step": 88415, "epoch": 1065} {"train_loss": -21.429729461669922, "global_step": 88416, "epoch": 1065} {"train_loss": -21.7687931060791, "global_step": 88417, "epoch": 1065} {"train_loss": -21.520355224609375, "global_step": 88418, "epoch": 1065} {"train_loss": -21.67807960510254, "global_step": 88419, "epoch": 1065} {"train_loss": -21.430347442626953, "global_step": 88420, "epoch": 1065} {"train_loss": -21.509113311767578, "global_step": 88421, "epoch": 1065} {"train_loss": -21.595748901367188, "global_step": 88422, "epoch": 1065} {"train_loss": -21.464406967163086, "global_step": 88423, "epoch": 1065} {"train_loss": -21.589332580566406, "global_step": 88424, "epoch": 1065} {"train_loss": -21.926727294921875, "global_step": 88425, "epoch": 1065} {"train_loss": -21.88155174255371, "global_step": 88426, "epoch": 1065} {"train_loss": -22.014123916625977, "global_step": 88427, "epoch": 1065} {"train_loss": -21.7262020111084, "global_step": 88428, "epoch": 1065} {"train_loss": -21.31667137145996, "global_step": 88429, "epoch": 1065} {"train_loss": -21.431671142578125, "global_step": 88430, "epoch": 1065} {"train_loss": -21.536449432373047, "global_step": 88431, "epoch": 1065} {"train_loss": -21.463050842285156, "global_step": 88432, "epoch": 1065} {"train_loss": -21.23124885559082, "global_step": 88433, "epoch": 1065} {"train_loss": -21.562402725219727, "global_step": 88434, "epoch": 1065} {"train_loss": -21.219045639038086, "global_step": 88435, "epoch": 1065} {"train_loss": -21.621482849121094, "global_step": 88436, "epoch": 1065} {"train_loss": -21.270904541015625, "global_step": 88437, "epoch": 1065} {"train_loss": -21.678518295288086, "global_step": 88438, "epoch": 1065} {"train_loss": -21.337881088256836, "global_step": 88439, "epoch": 1065} {"train_loss": -21.48451805114746, "global_step": 88440, "epoch": 1065} {"train_loss": -21.36068344116211, "global_step": 88441, "epoch": 1065} {"train_loss": -21.28608512878418, "global_step": 88442, "epoch": 1065} {"train_loss": -21.749774932861328, "global_step": 88443, "epoch": 1065} {"train_loss": -21.517608642578125, "global_step": 88444, "epoch": 1065} {"train_loss": -21.07608985900879, "global_step": 88445, "epoch": 1065} {"train_loss": -21.389352798461914, "global_step": 88446, "epoch": 1065} {"train_loss": -21.430835723876953, "global_step": 88447, "epoch": 1065} {"train_loss": -21.235408782958984, "global_step": 88448, "epoch": 1065} {"train_loss": -21.917844772338867, "global_step": 88449, "epoch": 1065} {"train_loss": -21.749332427978516, "global_step": 88450, "epoch": 1065} {"train_loss": -21.563758850097656, "global_step": 88451, "epoch": 1065} {"train_loss": -21.503583908081055, "global_step": 88452, "epoch": 1065} {"train_loss": -21.487966537475586, "global_step": 88453, "epoch": 1065} {"train_loss": -21.204341888427734, "global_step": 88454, "epoch": 1065} {"train_loss": -21.6363468170166, "global_step": 88455, "epoch": 1065} {"train_loss": -21.80059814453125, "global_step": 88456, "epoch": 1065} {"train_loss": -21.443391799926758, "global_step": 88457, "epoch": 1065} {"train_loss": -21.542404174804688, "global_step": 88458, "epoch": 1065} {"train_loss": -21.639087677001953, "global_step": 88459, "epoch": 1065} {"train_loss": -21.603384017944336, "global_step": 88460, "epoch": 1065} {"train_loss": -21.8124942779541, "global_step": 88461, "epoch": 1065} {"train_loss": -21.903228759765625, "global_step": 88462, "epoch": 1065} {"train_loss": -21.586341857910156, "global_step": 88463, "epoch": 1065} {"train_loss": -21.9724178314209, "global_step": 88464, "epoch": 1065} {"train_loss": -21.377676010131836, "global_step": 88465, "epoch": 1065} {"train_loss": -21.591354370117188, "global_step": 88466, "epoch": 1065} {"train_loss": -21.365964889526367, "global_step": 88467, "epoch": 1065} {"train_loss": -21.592248916625977, "global_step": 88468, "epoch": 1065} {"train_loss": -21.845115661621094, "global_step": 88469, "epoch": 1065} {"train_loss": -21.148365020751953, "global_step": 88470, "epoch": 1065} {"train_loss": -21.2912540435791, "global_step": 88471, "epoch": 1065} {"train_loss": -21.17797088623047, "global_step": 88472, "epoch": 1065} {"train_loss": -21.261938095092773, "global_step": 88473, "epoch": 1065} {"train_loss": -21.246736526489258, "global_step": 88474, "epoch": 1065} {"train_loss": -21.84914779663086, "global_step": 88475, "epoch": 1065} {"train_loss": -21.554458618164062, "global_step": 88476, "epoch": 1065} {"train_loss": -21.502131657428052, "global_step": 88477, "epoch": 1065, "val_loss": 6209228.0} {"train_loss": -21.416715621948242, "global_step": 88478, "epoch": 1066} {"train_loss": -20.93783187866211, "global_step": 88479, "epoch": 1066} {"train_loss": -21.283796310424805, "global_step": 88480, "epoch": 1066} {"train_loss": -21.005735397338867, "global_step": 88481, "epoch": 1066} {"train_loss": -21.119604110717773, "global_step": 88482, "epoch": 1066} {"train_loss": -21.145248413085938, "global_step": 88483, "epoch": 1066} {"train_loss": -20.987516403198242, "global_step": 88484, "epoch": 1066} {"train_loss": -21.081684112548828, "global_step": 88485, "epoch": 1066} {"train_loss": -20.890613555908203, "global_step": 88486, "epoch": 1066} {"train_loss": -21.129514694213867, "global_step": 88487, "epoch": 1066} {"train_loss": -21.160287857055664, "global_step": 88488, "epoch": 1066} {"train_loss": -21.50308609008789, "global_step": 88489, "epoch": 1066} {"train_loss": -21.42759895324707, "global_step": 88490, "epoch": 1066} {"train_loss": -21.461349487304688, "global_step": 88491, "epoch": 1066} {"train_loss": -21.586698532104492, "global_step": 88492, "epoch": 1066} {"train_loss": -21.39312171936035, "global_step": 88493, "epoch": 1066} {"train_loss": -21.301259994506836, "global_step": 88494, "epoch": 1066} {"train_loss": -21.127201080322266, "global_step": 88495, "epoch": 1066} {"train_loss": -21.23734474182129, "global_step": 88496, "epoch": 1066} {"train_loss": -21.572786331176758, "global_step": 88497, "epoch": 1066} {"train_loss": -21.380292892456055, "global_step": 88498, "epoch": 1066} {"train_loss": -21.52439308166504, "global_step": 88499, "epoch": 1066} {"train_loss": -21.090864181518555, "global_step": 88500, "epoch": 1066} {"train_loss": -21.834848403930664, "global_step": 88501, "epoch": 1066} {"train_loss": -21.38064193725586, "global_step": 88502, "epoch": 1066} {"train_loss": -21.581518173217773, "global_step": 88503, "epoch": 1066} {"train_loss": -21.660669326782227, "global_step": 88504, "epoch": 1066} {"train_loss": -21.544612884521484, "global_step": 88505, "epoch": 1066} {"train_loss": -21.89422035217285, "global_step": 88506, "epoch": 1066} {"train_loss": -21.617639541625977, "global_step": 88507, "epoch": 1066} {"train_loss": -21.175922393798828, "global_step": 88508, "epoch": 1066} {"train_loss": -21.365055084228516, "global_step": 88509, "epoch": 1066} {"train_loss": -21.48946189880371, "global_step": 88510, "epoch": 1066} {"train_loss": -21.636016845703125, "global_step": 88511, "epoch": 1066} {"train_loss": -21.138940811157227, "global_step": 88512, "epoch": 1066} {"train_loss": -21.78923797607422, "global_step": 88513, "epoch": 1066} {"train_loss": -21.417160034179688, "global_step": 88514, "epoch": 1066} {"train_loss": -21.8109188079834, "global_step": 88515, "epoch": 1066} {"train_loss": -21.44061279296875, "global_step": 88516, "epoch": 1066} {"train_loss": -21.852344512939453, "global_step": 88517, "epoch": 1066} {"train_loss": -21.839740753173828, "global_step": 88518, "epoch": 1066} {"train_loss": -21.60556411743164, "global_step": 88519, "epoch": 1066} {"train_loss": -21.580352783203125, "global_step": 88520, "epoch": 1066} {"train_loss": -21.30095863342285, "global_step": 88521, "epoch": 1066} {"train_loss": -21.624292373657227, "global_step": 88522, "epoch": 1066} {"train_loss": -21.585500717163086, "global_step": 88523, "epoch": 1066} {"train_loss": -21.727863311767578, "global_step": 88524, "epoch": 1066} {"train_loss": -21.826406478881836, "global_step": 88525, "epoch": 1066} {"train_loss": -21.14753532409668, "global_step": 88526, "epoch": 1066} {"train_loss": -21.823102951049805, "global_step": 88527, "epoch": 1066} {"train_loss": -21.35950469970703, "global_step": 88528, "epoch": 1066} {"train_loss": -21.421092987060547, "global_step": 88529, "epoch": 1066} {"train_loss": -21.85727882385254, "global_step": 88530, "epoch": 1066} {"train_loss": -21.855501174926758, "global_step": 88531, "epoch": 1066} {"train_loss": -21.656591415405273, "global_step": 88532, "epoch": 1066} {"train_loss": -21.41868019104004, "global_step": 88533, "epoch": 1066} {"train_loss": -21.227628707885742, "global_step": 88534, "epoch": 1066} {"train_loss": -21.54498291015625, "global_step": 88535, "epoch": 1066} {"train_loss": -21.48232650756836, "global_step": 88536, "epoch": 1066} {"train_loss": -21.672962188720703, "global_step": 88537, "epoch": 1066} {"train_loss": -21.03257942199707, "global_step": 88538, "epoch": 1066} {"train_loss": -21.654796600341797, "global_step": 88539, "epoch": 1066} {"train_loss": -21.320281982421875, "global_step": 88540, "epoch": 1066} {"train_loss": -21.144140243530273, "global_step": 88541, "epoch": 1066} {"train_loss": -21.57246208190918, "global_step": 88542, "epoch": 1066} {"train_loss": -21.331729888916016, "global_step": 88543, "epoch": 1066} {"train_loss": -20.97989273071289, "global_step": 88544, "epoch": 1066} {"train_loss": -21.324491500854492, "global_step": 88545, "epoch": 1066} {"train_loss": -21.392650604248047, "global_step": 88546, "epoch": 1066} {"train_loss": -21.425588607788086, "global_step": 88547, "epoch": 1066} {"train_loss": -21.58210563659668, "global_step": 88548, "epoch": 1066} {"train_loss": -21.324661254882812, "global_step": 88549, "epoch": 1066} {"train_loss": -21.781986236572266, "global_step": 88550, "epoch": 1066} {"train_loss": -21.546483993530273, "global_step": 88551, "epoch": 1066} {"train_loss": -21.4599552154541, "global_step": 88552, "epoch": 1066} {"train_loss": -21.97121238708496, "global_step": 88553, "epoch": 1066} {"train_loss": -21.19866371154785, "global_step": 88554, "epoch": 1066} {"train_loss": -21.4470157623291, "global_step": 88555, "epoch": 1066} {"train_loss": -21.641576766967773, "global_step": 88556, "epoch": 1066} {"train_loss": -21.4676513671875, "global_step": 88557, "epoch": 1066} {"train_loss": -21.86026954650879, "global_step": 88558, "epoch": 1066} {"train_loss": -21.871084213256836, "global_step": 88559, "epoch": 1066} {"train_loss": -21.46963245897408, "global_step": 88560, "epoch": 1066, "val_loss": 6096839.0} {"train_loss": -21.37141990661621, "global_step": 88561, "epoch": 1067} {"train_loss": -20.90348243713379, "global_step": 88562, "epoch": 1067} {"train_loss": -20.932828903198242, "global_step": 88563, "epoch": 1067} {"train_loss": -21.52044677734375, "global_step": 88564, "epoch": 1067} {"train_loss": -21.360631942749023, "global_step": 88565, "epoch": 1067} {"train_loss": -21.56705093383789, "global_step": 88566, "epoch": 1067} {"train_loss": -21.500112533569336, "global_step": 88567, "epoch": 1067} {"train_loss": -21.335525512695312, "global_step": 88568, "epoch": 1067} {"train_loss": -21.318363189697266, "global_step": 88569, "epoch": 1067} {"train_loss": -21.474172592163086, "global_step": 88570, "epoch": 1067} {"train_loss": -21.57269859313965, "global_step": 88571, "epoch": 1067} {"train_loss": -21.28340721130371, "global_step": 88572, "epoch": 1067} {"train_loss": -21.242084503173828, "global_step": 88573, "epoch": 1067} {"train_loss": -21.252302169799805, "global_step": 88574, "epoch": 1067} {"train_loss": -21.8992977142334, "global_step": 88575, "epoch": 1067} {"train_loss": -21.40690040588379, "global_step": 88576, "epoch": 1067} {"train_loss": -21.621387481689453, "global_step": 88577, "epoch": 1067} {"train_loss": -21.79537010192871, "global_step": 88578, "epoch": 1067} {"train_loss": -21.302505493164062, "global_step": 88579, "epoch": 1067} {"train_loss": -21.57270622253418, "global_step": 88580, "epoch": 1067} {"train_loss": -21.17071533203125, "global_step": 88581, "epoch": 1067} {"train_loss": -21.381454467773438, "global_step": 88582, "epoch": 1067} {"train_loss": -21.3736515045166, "global_step": 88583, "epoch": 1067} {"train_loss": -21.0587158203125, "global_step": 88584, "epoch": 1067} {"train_loss": -21.741926193237305, "global_step": 88585, "epoch": 1067} {"train_loss": -21.124433517456055, "global_step": 88586, "epoch": 1067} {"train_loss": -21.263992309570312, "global_step": 88587, "epoch": 1067} {"train_loss": -21.430105209350586, "global_step": 88588, "epoch": 1067} {"train_loss": -21.2319393157959, "global_step": 88589, "epoch": 1067} {"train_loss": -21.577360153198242, "global_step": 88590, "epoch": 1067} {"train_loss": -21.554338455200195, "global_step": 88591, "epoch": 1067} {"train_loss": -21.573436737060547, "global_step": 88592, "epoch": 1067} {"train_loss": -21.391164779663086, "global_step": 88593, "epoch": 1067} {"train_loss": -21.920114517211914, "global_step": 88594, "epoch": 1067} {"train_loss": -21.589736938476562, "global_step": 88595, "epoch": 1067} {"train_loss": -21.335010528564453, "global_step": 88596, "epoch": 1067} {"train_loss": -21.337270736694336, "global_step": 88597, "epoch": 1067} {"train_loss": -21.72420310974121, "global_step": 88598, "epoch": 1067} {"train_loss": -21.631818771362305, "global_step": 88599, "epoch": 1067} {"train_loss": -21.268924713134766, "global_step": 88600, "epoch": 1067} {"train_loss": -21.43635368347168, "global_step": 88601, "epoch": 1067} {"train_loss": -21.525882720947266, "global_step": 88602, "epoch": 1067} {"train_loss": -21.356250762939453, "global_step": 88603, "epoch": 1067} {"train_loss": -21.686080932617188, "global_step": 88604, "epoch": 1067} {"train_loss": -21.495906829833984, "global_step": 88605, "epoch": 1067} {"train_loss": -21.763303756713867, "global_step": 88606, "epoch": 1067} {"train_loss": -21.078393936157227, "global_step": 88607, "epoch": 1067} {"train_loss": -21.515539169311523, "global_step": 88608, "epoch": 1067} {"train_loss": -21.223968505859375, "global_step": 88609, "epoch": 1067} {"train_loss": -21.253509521484375, "global_step": 88610, "epoch": 1067} {"train_loss": -21.76148796081543, "global_step": 88611, "epoch": 1067} {"train_loss": -21.5279541015625, "global_step": 88612, "epoch": 1067} {"train_loss": -21.115036010742188, "global_step": 88613, "epoch": 1067} {"train_loss": -21.274436950683594, "global_step": 88614, "epoch": 1067} {"train_loss": -21.72503662109375, "global_step": 88615, "epoch": 1067} {"train_loss": -21.73487663269043, "global_step": 88616, "epoch": 1067} {"train_loss": -21.53888511657715, "global_step": 88617, "epoch": 1067} {"train_loss": -21.20953941345215, "global_step": 88618, "epoch": 1067} {"train_loss": -21.685251235961914, "global_step": 88619, "epoch": 1067} {"train_loss": -21.5261287689209, "global_step": 88620, "epoch": 1067} {"train_loss": -21.512216567993164, "global_step": 88621, "epoch": 1067} {"train_loss": -21.499948501586914, "global_step": 88622, "epoch": 1067} {"train_loss": -21.70657730102539, "global_step": 88623, "epoch": 1067} {"train_loss": -21.31073570251465, "global_step": 88624, "epoch": 1067} {"train_loss": -21.563650131225586, "global_step": 88625, "epoch": 1067} {"train_loss": -21.460403442382812, "global_step": 88626, "epoch": 1067} {"train_loss": -21.24971580505371, "global_step": 88627, "epoch": 1067} {"train_loss": -21.612171173095703, "global_step": 88628, "epoch": 1067} {"train_loss": -21.79530906677246, "global_step": 88629, "epoch": 1067} {"train_loss": -21.44129180908203, "global_step": 88630, "epoch": 1067} {"train_loss": -21.5601749420166, "global_step": 88631, "epoch": 1067} {"train_loss": -21.52337074279785, "global_step": 88632, "epoch": 1067} {"train_loss": -21.612930297851562, "global_step": 88633, "epoch": 1067} {"train_loss": -21.63602066040039, "global_step": 88634, "epoch": 1067} {"train_loss": -21.25608253479004, "global_step": 88635, "epoch": 1067} {"train_loss": -21.444595336914062, "global_step": 88636, "epoch": 1067} {"train_loss": -21.9802303314209, "global_step": 88637, "epoch": 1067} {"train_loss": -21.47802734375, "global_step": 88638, "epoch": 1067} {"train_loss": -21.581640243530273, "global_step": 88639, "epoch": 1067} {"train_loss": -21.610036849975586, "global_step": 88640, "epoch": 1067} {"train_loss": -21.6561279296875, "global_step": 88641, "epoch": 1067} {"train_loss": -21.569992065429688, "global_step": 88642, "epoch": 1067} {"train_loss": -21.48331658236952, "global_step": 88643, "epoch": 1067, "val_loss": 5991849.0} {"train_loss": -20.92291831970215, "global_step": 88644, "epoch": 1068} {"train_loss": -20.73568344116211, "global_step": 88645, "epoch": 1068} {"train_loss": -21.368282318115234, "global_step": 88646, "epoch": 1068} {"train_loss": -21.42437171936035, "global_step": 88647, "epoch": 1068} {"train_loss": -21.032773971557617, "global_step": 88648, "epoch": 1068} {"train_loss": -21.278728485107422, "global_step": 88649, "epoch": 1068} {"train_loss": -20.995580673217773, "global_step": 88650, "epoch": 1068} {"train_loss": -21.24723243713379, "global_step": 88651, "epoch": 1068} {"train_loss": -21.24301528930664, "global_step": 88652, "epoch": 1068} {"train_loss": -21.4713191986084, "global_step": 88653, "epoch": 1068} {"train_loss": -21.30011558532715, "global_step": 88654, "epoch": 1068} {"train_loss": -21.373676300048828, "global_step": 88655, "epoch": 1068} {"train_loss": -21.225614547729492, "global_step": 88656, "epoch": 1068} {"train_loss": -21.209592819213867, "global_step": 88657, "epoch": 1068} {"train_loss": -21.43691062927246, "global_step": 88658, "epoch": 1068} {"train_loss": -21.639680862426758, "global_step": 88659, "epoch": 1068} {"train_loss": -21.560510635375977, "global_step": 88660, "epoch": 1068} {"train_loss": -21.46013832092285, "global_step": 88661, "epoch": 1068} {"train_loss": -21.54439353942871, "global_step": 88662, "epoch": 1068} {"train_loss": -21.631933212280273, "global_step": 88663, "epoch": 1068} {"train_loss": -21.416685104370117, "global_step": 88664, "epoch": 1068} {"train_loss": -21.336301803588867, "global_step": 88665, "epoch": 1068} {"train_loss": -21.573698043823242, "global_step": 88666, "epoch": 1068} {"train_loss": -21.27787208557129, "global_step": 88667, "epoch": 1068} {"train_loss": -21.904939651489258, "global_step": 88668, "epoch": 1068} {"train_loss": -21.48951530456543, "global_step": 88669, "epoch": 1068} {"train_loss": -21.513376235961914, "global_step": 88670, "epoch": 1068} {"train_loss": -21.242664337158203, "global_step": 88671, "epoch": 1068} {"train_loss": -21.60451316833496, "global_step": 88672, "epoch": 1068} {"train_loss": -21.286378860473633, "global_step": 88673, "epoch": 1068} {"train_loss": -21.802234649658203, "global_step": 88674, "epoch": 1068} {"train_loss": -21.307706832885742, "global_step": 88675, "epoch": 1068} {"train_loss": -21.537992477416992, "global_step": 88676, "epoch": 1068} {"train_loss": -21.81662940979004, "global_step": 88677, "epoch": 1068} {"train_loss": -21.946128845214844, "global_step": 88678, "epoch": 1068} {"train_loss": -21.55118179321289, "global_step": 88679, "epoch": 1068} {"train_loss": -21.589508056640625, "global_step": 88680, "epoch": 1068} {"train_loss": -21.25775718688965, "global_step": 88681, "epoch": 1068} {"train_loss": -21.6011905670166, "global_step": 88682, "epoch": 1068} {"train_loss": -21.4794921875, "global_step": 88683, "epoch": 1068} {"train_loss": -21.864578247070312, "global_step": 88684, "epoch": 1068} {"train_loss": -21.768512725830078, "global_step": 88685, "epoch": 1068} {"train_loss": -21.78987693786621, "global_step": 88686, "epoch": 1068} {"train_loss": -21.914236068725586, "global_step": 88687, "epoch": 1068} {"train_loss": -21.61227035522461, "global_step": 88688, "epoch": 1068} {"train_loss": -21.40677261352539, "global_step": 88689, "epoch": 1068} {"train_loss": -21.614547729492188, "global_step": 88690, "epoch": 1068} {"train_loss": -21.580219268798828, "global_step": 88691, "epoch": 1068} {"train_loss": -21.498899459838867, "global_step": 88692, "epoch": 1068} {"train_loss": -21.399120330810547, "global_step": 88693, "epoch": 1068} {"train_loss": -21.477441787719727, "global_step": 88694, "epoch": 1068} {"train_loss": -21.672517776489258, "global_step": 88695, "epoch": 1068} {"train_loss": -21.591726303100586, "global_step": 88696, "epoch": 1068} {"train_loss": -21.56406593322754, "global_step": 88697, "epoch": 1068} {"train_loss": -21.456418991088867, "global_step": 88698, "epoch": 1068} {"train_loss": -21.371070861816406, "global_step": 88699, "epoch": 1068} {"train_loss": -21.819726943969727, "global_step": 88700, "epoch": 1068} {"train_loss": -21.763065338134766, "global_step": 88701, "epoch": 1068} {"train_loss": -21.864063262939453, "global_step": 88702, "epoch": 1068} {"train_loss": -21.903608322143555, "global_step": 88703, "epoch": 1068} {"train_loss": -21.544431686401367, "global_step": 88704, "epoch": 1068} {"train_loss": -21.76247215270996, "global_step": 88705, "epoch": 1068} {"train_loss": -21.5776309967041, "global_step": 88706, "epoch": 1068} {"train_loss": -21.679943084716797, "global_step": 88707, "epoch": 1068} {"train_loss": -21.60306739807129, "global_step": 88708, "epoch": 1068} {"train_loss": -21.288801193237305, "global_step": 88709, "epoch": 1068} {"train_loss": -21.33938217163086, "global_step": 88710, "epoch": 1068} {"train_loss": -21.900197982788086, "global_step": 88711, "epoch": 1068} {"train_loss": -21.474210739135742, "global_step": 88712, "epoch": 1068} {"train_loss": -21.56691551208496, "global_step": 88713, "epoch": 1068} {"train_loss": -21.835683822631836, "global_step": 88714, "epoch": 1068} {"train_loss": -21.434057235717773, "global_step": 88715, "epoch": 1068} {"train_loss": -21.296043395996094, "global_step": 88716, "epoch": 1068} {"train_loss": -21.170358657836914, "global_step": 88717, "epoch": 1068} {"train_loss": -21.499740600585938, "global_step": 88718, "epoch": 1068} {"train_loss": -21.483203887939453, "global_step": 88719, "epoch": 1068} {"train_loss": -21.122098922729492, "global_step": 88720, "epoch": 1068} {"train_loss": -21.730602264404297, "global_step": 88721, "epoch": 1068} {"train_loss": -21.529085159301758, "global_step": 88722, "epoch": 1068} {"train_loss": -21.909090042114258, "global_step": 88723, "epoch": 1068} {"train_loss": -21.375879287719727, "global_step": 88724, "epoch": 1068} {"train_loss": -21.529748916625977, "global_step": 88725, "epoch": 1068} {"train_loss": -21.490184163472737, "global_step": 88726, "epoch": 1068, "val_loss": 6136597.0} {"train_loss": -20.991743087768555, "global_step": 88727, "epoch": 1069} {"train_loss": -20.6184024810791, "global_step": 88728, "epoch": 1069} {"train_loss": -20.98203468322754, "global_step": 88729, "epoch": 1069} {"train_loss": -21.154211044311523, "global_step": 88730, "epoch": 1069} {"train_loss": -21.05527687072754, "global_step": 88731, "epoch": 1069} {"train_loss": -21.344165802001953, "global_step": 88732, "epoch": 1069} {"train_loss": -21.306522369384766, "global_step": 88733, "epoch": 1069} {"train_loss": -21.117788314819336, "global_step": 88734, "epoch": 1069} {"train_loss": -21.101821899414062, "global_step": 88735, "epoch": 1069} {"train_loss": -21.699995040893555, "global_step": 88736, "epoch": 1069} {"train_loss": -21.07808494567871, "global_step": 88737, "epoch": 1069} {"train_loss": -21.523496627807617, "global_step": 88738, "epoch": 1069} {"train_loss": -21.25110626220703, "global_step": 88739, "epoch": 1069} {"train_loss": -21.255701065063477, "global_step": 88740, "epoch": 1069} {"train_loss": -21.004413604736328, "global_step": 88741, "epoch": 1069} {"train_loss": -20.986433029174805, "global_step": 88742, "epoch": 1069} {"train_loss": -21.417566299438477, "global_step": 88743, "epoch": 1069} {"train_loss": -21.30478286743164, "global_step": 88744, "epoch": 1069} {"train_loss": -21.457670211791992, "global_step": 88745, "epoch": 1069} {"train_loss": -21.66302490234375, "global_step": 88746, "epoch": 1069} {"train_loss": -21.73553466796875, "global_step": 88747, "epoch": 1069} {"train_loss": -21.186803817749023, "global_step": 88748, "epoch": 1069} {"train_loss": -21.195417404174805, "global_step": 88749, "epoch": 1069} {"train_loss": -21.474576950073242, "global_step": 88750, "epoch": 1069} {"train_loss": -21.75255012512207, "global_step": 88751, "epoch": 1069} {"train_loss": -21.68575096130371, "global_step": 88752, "epoch": 1069} {"train_loss": -21.738561630249023, "global_step": 88753, "epoch": 1069} {"train_loss": -21.882041931152344, "global_step": 88754, "epoch": 1069} {"train_loss": -21.41191864013672, "global_step": 88755, "epoch": 1069} {"train_loss": -21.096792221069336, "global_step": 88756, "epoch": 1069} {"train_loss": -21.78651237487793, "global_step": 88757, "epoch": 1069} {"train_loss": -21.525522232055664, "global_step": 88758, "epoch": 1069} {"train_loss": -21.502445220947266, "global_step": 88759, "epoch": 1069} {"train_loss": -21.502538681030273, "global_step": 88760, "epoch": 1069} {"train_loss": -21.67782974243164, "global_step": 88761, "epoch": 1069} {"train_loss": -21.2143611907959, "global_step": 88762, "epoch": 1069} {"train_loss": -21.331588745117188, "global_step": 88763, "epoch": 1069} {"train_loss": -21.541208267211914, "global_step": 88764, "epoch": 1069} {"train_loss": -21.64740562438965, "global_step": 88765, "epoch": 1069} {"train_loss": -21.186513900756836, "global_step": 88766, "epoch": 1069} {"train_loss": -21.508657455444336, "global_step": 88767, "epoch": 1069} {"train_loss": -21.558395385742188, "global_step": 88768, "epoch": 1069} {"train_loss": -21.90983772277832, "global_step": 88769, "epoch": 1069} {"train_loss": -21.515195846557617, "global_step": 88770, "epoch": 1069} {"train_loss": -21.57209587097168, "global_step": 88771, "epoch": 1069} {"train_loss": -21.487205505371094, "global_step": 88772, "epoch": 1069} {"train_loss": -21.33379554748535, "global_step": 88773, "epoch": 1069} {"train_loss": -21.80672264099121, "global_step": 88774, "epoch": 1069} {"train_loss": -21.634824752807617, "global_step": 88775, "epoch": 1069} {"train_loss": -21.753170013427734, "global_step": 88776, "epoch": 1069} {"train_loss": -22.062644958496094, "global_step": 88777, "epoch": 1069} {"train_loss": -21.506311416625977, "global_step": 88778, "epoch": 1069} {"train_loss": -21.9112606048584, "global_step": 88779, "epoch": 1069} {"train_loss": -21.342451095581055, "global_step": 88780, "epoch": 1069} {"train_loss": -21.8968448638916, "global_step": 88781, "epoch": 1069} {"train_loss": -21.607423782348633, "global_step": 88782, "epoch": 1069} {"train_loss": -21.330625534057617, "global_step": 88783, "epoch": 1069} {"train_loss": -21.50596046447754, "global_step": 88784, "epoch": 1069} {"train_loss": -21.50518798828125, "global_step": 88785, "epoch": 1069} {"train_loss": -21.602773666381836, "global_step": 88786, "epoch": 1069} {"train_loss": -21.320642471313477, "global_step": 88787, "epoch": 1069} {"train_loss": -21.507827758789062, "global_step": 88788, "epoch": 1069} {"train_loss": -21.31009864807129, "global_step": 88789, "epoch": 1069} {"train_loss": -20.9067325592041, "global_step": 88790, "epoch": 1069} {"train_loss": -21.47721290588379, "global_step": 88791, "epoch": 1069} {"train_loss": -21.420896530151367, "global_step": 88792, "epoch": 1069} {"train_loss": -21.642568588256836, "global_step": 88793, "epoch": 1069} {"train_loss": -21.427520751953125, "global_step": 88794, "epoch": 1069} {"train_loss": -21.66798210144043, "global_step": 88795, "epoch": 1069} {"train_loss": -21.471149444580078, "global_step": 88796, "epoch": 1069} {"train_loss": -21.8968505859375, "global_step": 88797, "epoch": 1069} {"train_loss": -21.37775993347168, "global_step": 88798, "epoch": 1069} {"train_loss": -21.57159423828125, "global_step": 88799, "epoch": 1069} {"train_loss": -21.580699920654297, "global_step": 88800, "epoch": 1069} {"train_loss": -21.220434188842773, "global_step": 88801, "epoch": 1069} {"train_loss": -21.418935775756836, "global_step": 88802, "epoch": 1069} {"train_loss": -21.487043380737305, "global_step": 88803, "epoch": 1069} {"train_loss": -21.365095138549805, "global_step": 88804, "epoch": 1069} {"train_loss": -21.467697143554688, "global_step": 88805, "epoch": 1069} {"train_loss": -21.865140914916992, "global_step": 88806, "epoch": 1069} {"train_loss": -21.78499412536621, "global_step": 88807, "epoch": 1069} {"train_loss": -21.573469161987305, "global_step": 88808, "epoch": 1069} {"train_loss": -21.45168927204178, "global_step": 88809, "epoch": 1069, "val_loss": 6252329.0} {"train_loss": -21.16359519958496, "global_step": 88810, "epoch": 1070} {"train_loss": -21.676496505737305, "global_step": 88811, "epoch": 1070} {"train_loss": -21.270660400390625, "global_step": 88812, "epoch": 1070} {"train_loss": -21.319974899291992, "global_step": 88813, "epoch": 1070} {"train_loss": -21.431795120239258, "global_step": 88814, "epoch": 1070} {"train_loss": -21.442182540893555, "global_step": 88815, "epoch": 1070} {"train_loss": -21.211753845214844, "global_step": 88816, "epoch": 1070} {"train_loss": -21.60590171813965, "global_step": 88817, "epoch": 1070} {"train_loss": -21.468244552612305, "global_step": 88818, "epoch": 1070} {"train_loss": -21.555522918701172, "global_step": 88819, "epoch": 1070} {"train_loss": -21.464740753173828, "global_step": 88820, "epoch": 1070} {"train_loss": -21.12274742126465, "global_step": 88821, "epoch": 1070} {"train_loss": -21.446651458740234, "global_step": 88822, "epoch": 1070} {"train_loss": -21.313135147094727, "global_step": 88823, "epoch": 1070} {"train_loss": -21.67106819152832, "global_step": 88824, "epoch": 1070} {"train_loss": -21.476594924926758, "global_step": 88825, "epoch": 1070} {"train_loss": -21.059982299804688, "global_step": 88826, "epoch": 1070} {"train_loss": -21.51410484313965, "global_step": 88827, "epoch": 1070} {"train_loss": -21.358001708984375, "global_step": 88828, "epoch": 1070} {"train_loss": -21.175901412963867, "global_step": 88829, "epoch": 1070} {"train_loss": -21.212020874023438, "global_step": 88830, "epoch": 1070} {"train_loss": -21.19266128540039, "global_step": 88831, "epoch": 1070} {"train_loss": -21.27069854736328, "global_step": 88832, "epoch": 1070} {"train_loss": -21.489255905151367, "global_step": 88833, "epoch": 1070} {"train_loss": -21.12375259399414, "global_step": 88834, "epoch": 1070} {"train_loss": -21.553958892822266, "global_step": 88835, "epoch": 1070} {"train_loss": -20.921430587768555, "global_step": 88836, "epoch": 1070} {"train_loss": -21.317962646484375, "global_step": 88837, "epoch": 1070} {"train_loss": -21.54103660583496, "global_step": 88838, "epoch": 1070} {"train_loss": -21.315134048461914, "global_step": 88839, "epoch": 1070} {"train_loss": -21.300668716430664, "global_step": 88840, "epoch": 1070} {"train_loss": -21.082012176513672, "global_step": 88841, "epoch": 1070} {"train_loss": -21.353567123413086, "global_step": 88842, "epoch": 1070} {"train_loss": -21.444074630737305, "global_step": 88843, "epoch": 1070} {"train_loss": -21.718324661254883, "global_step": 88844, "epoch": 1070} {"train_loss": -21.30378532409668, "global_step": 88845, "epoch": 1070} {"train_loss": -21.510480880737305, "global_step": 88846, "epoch": 1070} {"train_loss": -21.58372688293457, "global_step": 88847, "epoch": 1070} {"train_loss": -21.81333351135254, "global_step": 88848, "epoch": 1070} {"train_loss": -21.4859676361084, "global_step": 88849, "epoch": 1070} {"train_loss": -21.755970001220703, "global_step": 88850, "epoch": 1070} {"train_loss": -21.718238830566406, "global_step": 88851, "epoch": 1070} {"train_loss": -21.62705421447754, "global_step": 88852, "epoch": 1070} {"train_loss": -21.354251861572266, "global_step": 88853, "epoch": 1070} {"train_loss": -21.127897262573242, "global_step": 88854, "epoch": 1070} {"train_loss": -21.38777732849121, "global_step": 88855, "epoch": 1070} {"train_loss": -21.106130599975586, "global_step": 88856, "epoch": 1070} {"train_loss": -21.38419532775879, "global_step": 88857, "epoch": 1070} {"train_loss": -21.3807373046875, "global_step": 88858, "epoch": 1070} {"train_loss": -21.460805892944336, "global_step": 88859, "epoch": 1070} {"train_loss": -21.36463165283203, "global_step": 88860, "epoch": 1070} {"train_loss": -21.274124145507812, "global_step": 88861, "epoch": 1070} {"train_loss": -21.522445678710938, "global_step": 88862, "epoch": 1070} {"train_loss": -21.384536743164062, "global_step": 88863, "epoch": 1070} {"train_loss": -22.049304962158203, "global_step": 88864, "epoch": 1070} {"train_loss": -21.214767456054688, "global_step": 88865, "epoch": 1070} {"train_loss": -21.261240005493164, "global_step": 88866, "epoch": 1070} {"train_loss": -21.451040267944336, "global_step": 88867, "epoch": 1070} {"train_loss": -22.033435821533203, "global_step": 88868, "epoch": 1070} {"train_loss": -21.28268051147461, "global_step": 88869, "epoch": 1070} {"train_loss": -21.8583927154541, "global_step": 88870, "epoch": 1070} {"train_loss": -21.35032844543457, "global_step": 88871, "epoch": 1070} {"train_loss": -21.856468200683594, "global_step": 88872, "epoch": 1070} {"train_loss": -21.48445701599121, "global_step": 88873, "epoch": 1070} {"train_loss": -21.833023071289062, "global_step": 88874, "epoch": 1070} {"train_loss": -21.981494903564453, "global_step": 88875, "epoch": 1070} {"train_loss": -21.397504806518555, "global_step": 88876, "epoch": 1070} {"train_loss": -21.624675750732422, "global_step": 88877, "epoch": 1070} {"train_loss": -21.661542892456055, "global_step": 88878, "epoch": 1070} {"train_loss": -21.73236656188965, "global_step": 88879, "epoch": 1070} {"train_loss": -21.70625114440918, "global_step": 88880, "epoch": 1070} {"train_loss": -21.918790817260742, "global_step": 88881, "epoch": 1070} {"train_loss": -21.71046257019043, "global_step": 88882, "epoch": 1070} {"train_loss": -21.36519432067871, "global_step": 88883, "epoch": 1070} {"train_loss": -21.614526748657227, "global_step": 88884, "epoch": 1070} {"train_loss": -21.20290184020996, "global_step": 88885, "epoch": 1070} {"train_loss": -21.473234176635742, "global_step": 88886, "epoch": 1070} {"train_loss": -21.42720603942871, "global_step": 88887, "epoch": 1070} {"train_loss": -21.87253189086914, "global_step": 88888, "epoch": 1070} {"train_loss": -21.581586837768555, "global_step": 88889, "epoch": 1070} {"train_loss": -21.82988166809082, "global_step": 88890, "epoch": 1070} {"train_loss": -21.498937606811523, "global_step": 88891, "epoch": 1070} {"train_loss": -21.471913142376636, "global_step": 88892, "epoch": 1070, "val_loss": 6118960.5} {"train_loss": -21.51840591430664, "global_step": 88893, "epoch": 1071} {"train_loss": -21.487058639526367, "global_step": 88894, "epoch": 1071} {"train_loss": -21.342172622680664, "global_step": 88895, "epoch": 1071} {"train_loss": -20.90756607055664, "global_step": 88896, "epoch": 1071} {"train_loss": -20.98625373840332, "global_step": 88897, "epoch": 1071} {"train_loss": -21.286222457885742, "global_step": 88898, "epoch": 1071} {"train_loss": -21.32062339782715, "global_step": 88899, "epoch": 1071} {"train_loss": -21.316648483276367, "global_step": 88900, "epoch": 1071} {"train_loss": -21.609619140625, "global_step": 88901, "epoch": 1071} {"train_loss": -21.480100631713867, "global_step": 88902, "epoch": 1071} {"train_loss": -21.415754318237305, "global_step": 88903, "epoch": 1071} {"train_loss": -21.364044189453125, "global_step": 88904, "epoch": 1071} {"train_loss": -21.48264503479004, "global_step": 88905, "epoch": 1071} {"train_loss": -21.841962814331055, "global_step": 88906, "epoch": 1071} {"train_loss": -21.545011520385742, "global_step": 88907, "epoch": 1071} {"train_loss": -21.416242599487305, "global_step": 88908, "epoch": 1071} {"train_loss": -21.27280616760254, "global_step": 88909, "epoch": 1071} {"train_loss": -21.37803840637207, "global_step": 88910, "epoch": 1071} {"train_loss": -21.404762268066406, "global_step": 88911, "epoch": 1071} {"train_loss": -21.236061096191406, "global_step": 88912, "epoch": 1071} {"train_loss": -21.49854850769043, "global_step": 88913, "epoch": 1071} {"train_loss": -21.633167266845703, "global_step": 88914, "epoch": 1071} {"train_loss": -21.5095272064209, "global_step": 88915, "epoch": 1071} {"train_loss": -21.221782684326172, "global_step": 88916, "epoch": 1071} {"train_loss": -21.52246856689453, "global_step": 88917, "epoch": 1071} {"train_loss": -21.529705047607422, "global_step": 88918, "epoch": 1071} {"train_loss": -21.348915100097656, "global_step": 88919, "epoch": 1071} {"train_loss": -21.3562068939209, "global_step": 88920, "epoch": 1071} {"train_loss": -21.19647216796875, "global_step": 88921, "epoch": 1071} {"train_loss": -21.417661666870117, "global_step": 88922, "epoch": 1071} {"train_loss": -21.6622314453125, "global_step": 88923, "epoch": 1071} {"train_loss": -21.630075454711914, "global_step": 88924, "epoch": 1071} {"train_loss": -21.78529167175293, "global_step": 88925, "epoch": 1071} {"train_loss": -21.426860809326172, "global_step": 88926, "epoch": 1071} {"train_loss": -21.755271911621094, "global_step": 88927, "epoch": 1071} {"train_loss": -21.693899154663086, "global_step": 88928, "epoch": 1071} {"train_loss": -21.598295211791992, "global_step": 88929, "epoch": 1071} {"train_loss": -21.49249839782715, "global_step": 88930, "epoch": 1071} {"train_loss": -21.777311325073242, "global_step": 88931, "epoch": 1071} {"train_loss": -21.601119995117188, "global_step": 88932, "epoch": 1071} {"train_loss": -21.61225700378418, "global_step": 88933, "epoch": 1071} {"train_loss": -21.96116065979004, "global_step": 88934, "epoch": 1071} {"train_loss": -22.084369659423828, "global_step": 88935, "epoch": 1071} {"train_loss": -21.364572525024414, "global_step": 88936, "epoch": 1071} {"train_loss": -21.312259674072266, "global_step": 88937, "epoch": 1071} {"train_loss": -21.146373748779297, "global_step": 88938, "epoch": 1071} {"train_loss": -21.800352096557617, "global_step": 88939, "epoch": 1071} {"train_loss": -21.699857711791992, "global_step": 88940, "epoch": 1071} {"train_loss": -21.81757164001465, "global_step": 88941, "epoch": 1071} {"train_loss": -21.38438606262207, "global_step": 88942, "epoch": 1071} {"train_loss": -21.612836837768555, "global_step": 88943, "epoch": 1071} {"train_loss": -21.445402145385742, "global_step": 88944, "epoch": 1071} {"train_loss": -21.447980880737305, "global_step": 88945, "epoch": 1071} {"train_loss": -21.70683479309082, "global_step": 88946, "epoch": 1071} {"train_loss": -21.340028762817383, "global_step": 88947, "epoch": 1071} {"train_loss": -21.8836612701416, "global_step": 88948, "epoch": 1071} {"train_loss": -21.711013793945312, "global_step": 88949, "epoch": 1071} {"train_loss": -21.696102142333984, "global_step": 88950, "epoch": 1071} {"train_loss": -21.308454513549805, "global_step": 88951, "epoch": 1071} {"train_loss": -21.742650985717773, "global_step": 88952, "epoch": 1071} {"train_loss": -21.86542320251465, "global_step": 88953, "epoch": 1071} {"train_loss": -21.712011337280273, "global_step": 88954, "epoch": 1071} {"train_loss": -21.755775451660156, "global_step": 88955, "epoch": 1071} {"train_loss": -21.266172409057617, "global_step": 88956, "epoch": 1071} {"train_loss": -21.68084716796875, "global_step": 88957, "epoch": 1071} {"train_loss": -21.6555233001709, "global_step": 88958, "epoch": 1071} {"train_loss": -21.830259323120117, "global_step": 88959, "epoch": 1071} {"train_loss": -21.779706954956055, "global_step": 88960, "epoch": 1071} {"train_loss": -21.77365493774414, "global_step": 88961, "epoch": 1071} {"train_loss": -21.32492446899414, "global_step": 88962, "epoch": 1071} {"train_loss": -21.426483154296875, "global_step": 88963, "epoch": 1071} {"train_loss": -21.35868263244629, "global_step": 88964, "epoch": 1071} {"train_loss": -21.476167678833008, "global_step": 88965, "epoch": 1071} {"train_loss": -21.55095863342285, "global_step": 88966, "epoch": 1071} {"train_loss": -21.652536392211914, "global_step": 88967, "epoch": 1071} {"train_loss": -21.774152755737305, "global_step": 88968, "epoch": 1071} {"train_loss": -21.358022689819336, "global_step": 88969, "epoch": 1071} {"train_loss": -21.74168586730957, "global_step": 88970, "epoch": 1071} {"train_loss": -21.647871017456055, "global_step": 88971, "epoch": 1071} {"train_loss": -21.52150535583496, "global_step": 88972, "epoch": 1071} {"train_loss": -21.556915283203125, "global_step": 88973, "epoch": 1071} {"train_loss": -21.563194274902344, "global_step": 88974, "epoch": 1071} {"train_loss": -21.527306476271296, "global_step": 88975, "epoch": 1071, "val_loss": 6161875.0} {"train_loss": -20.911359786987305, "global_step": 88976, "epoch": 1072} {"train_loss": -21.100828170776367, "global_step": 88977, "epoch": 1072} {"train_loss": -21.343379974365234, "global_step": 88978, "epoch": 1072} {"train_loss": -21.377199172973633, "global_step": 88979, "epoch": 1072} {"train_loss": -21.385303497314453, "global_step": 88980, "epoch": 1072} {"train_loss": -21.507816314697266, "global_step": 88981, "epoch": 1072} {"train_loss": -21.740524291992188, "global_step": 88982, "epoch": 1072} {"train_loss": -21.11554527282715, "global_step": 88983, "epoch": 1072} {"train_loss": -21.307964324951172, "global_step": 88984, "epoch": 1072} {"train_loss": -21.47798728942871, "global_step": 88985, "epoch": 1072} {"train_loss": -21.767297744750977, "global_step": 88986, "epoch": 1072} {"train_loss": -21.213850021362305, "global_step": 88987, "epoch": 1072} {"train_loss": -21.680395126342773, "global_step": 88988, "epoch": 1072} {"train_loss": -20.984024047851562, "global_step": 88989, "epoch": 1072} {"train_loss": -21.43464469909668, "global_step": 88990, "epoch": 1072} {"train_loss": -21.4821834564209, "global_step": 88991, "epoch": 1072} {"train_loss": -21.138343811035156, "global_step": 88992, "epoch": 1072} {"train_loss": -21.832189559936523, "global_step": 88993, "epoch": 1072} {"train_loss": -21.482786178588867, "global_step": 88994, "epoch": 1072} {"train_loss": -21.282154083251953, "global_step": 88995, "epoch": 1072} {"train_loss": -21.509450912475586, "global_step": 88996, "epoch": 1072} {"train_loss": -21.295291900634766, "global_step": 88997, "epoch": 1072} {"train_loss": -21.492944717407227, "global_step": 88998, "epoch": 1072} {"train_loss": -21.422361373901367, "global_step": 88999, "epoch": 1072} {"train_loss": -21.627628326416016, "global_step": 89000, "epoch": 1072} {"train_loss": -21.625253677368164, "global_step": 89001, "epoch": 1072} {"train_loss": -21.58748435974121, "global_step": 89002, "epoch": 1072} {"train_loss": -21.57625389099121, "global_step": 89003, "epoch": 1072} {"train_loss": -21.545820236206055, "global_step": 89004, "epoch": 1072} {"train_loss": -21.378583908081055, "global_step": 89005, "epoch": 1072} {"train_loss": -21.46711540222168, "global_step": 89006, "epoch": 1072} {"train_loss": -21.52950096130371, "global_step": 89007, "epoch": 1072} {"train_loss": -21.454742431640625, "global_step": 89008, "epoch": 1072} {"train_loss": -21.568096160888672, "global_step": 89009, "epoch": 1072} {"train_loss": -21.44693946838379, "global_step": 89010, "epoch": 1072} {"train_loss": -21.397754669189453, "global_step": 89011, "epoch": 1072} {"train_loss": -21.624475479125977, "global_step": 89012, "epoch": 1072} {"train_loss": -21.614572525024414, "global_step": 89013, "epoch": 1072} {"train_loss": -21.392087936401367, "global_step": 89014, "epoch": 1072} {"train_loss": -21.521451950073242, "global_step": 89015, "epoch": 1072} {"train_loss": -21.278669357299805, "global_step": 89016, "epoch": 1072} {"train_loss": -21.45081901550293, "global_step": 89017, "epoch": 1072} {"train_loss": -21.609424591064453, "global_step": 89018, "epoch": 1072} {"train_loss": -21.48963737487793, "global_step": 89019, "epoch": 1072} {"train_loss": -21.333044052124023, "global_step": 89020, "epoch": 1072} {"train_loss": -21.433094024658203, "global_step": 89021, "epoch": 1072} {"train_loss": -21.38947105407715, "global_step": 89022, "epoch": 1072} {"train_loss": -21.281103134155273, "global_step": 89023, "epoch": 1072} {"train_loss": -21.807188034057617, "global_step": 89024, "epoch": 1072} {"train_loss": -21.641416549682617, "global_step": 89025, "epoch": 1072} {"train_loss": -21.744176864624023, "global_step": 89026, "epoch": 1072} {"train_loss": -21.5462703704834, "global_step": 89027, "epoch": 1072} {"train_loss": -21.519033432006836, "global_step": 89028, "epoch": 1072} {"train_loss": -21.505294799804688, "global_step": 89029, "epoch": 1072} {"train_loss": -21.706811904907227, "global_step": 89030, "epoch": 1072} {"train_loss": -21.584444046020508, "global_step": 89031, "epoch": 1072} {"train_loss": -21.47797203063965, "global_step": 89032, "epoch": 1072} {"train_loss": -21.54854393005371, "global_step": 89033, "epoch": 1072} {"train_loss": -21.95978355407715, "global_step": 89034, "epoch": 1072} {"train_loss": -21.705350875854492, "global_step": 89035, "epoch": 1072} {"train_loss": -21.694171905517578, "global_step": 89036, "epoch": 1072} {"train_loss": -21.915746688842773, "global_step": 89037, "epoch": 1072} {"train_loss": -21.71000862121582, "global_step": 89038, "epoch": 1072} {"train_loss": -21.249265670776367, "global_step": 89039, "epoch": 1072} {"train_loss": -21.79575538635254, "global_step": 89040, "epoch": 1072} {"train_loss": -21.21913719177246, "global_step": 89041, "epoch": 1072} {"train_loss": -21.77931022644043, "global_step": 89042, "epoch": 1072} {"train_loss": -21.310949325561523, "global_step": 89043, "epoch": 1072} {"train_loss": -21.45499038696289, "global_step": 89044, "epoch": 1072} {"train_loss": -21.786115646362305, "global_step": 89045, "epoch": 1072} {"train_loss": -21.686826705932617, "global_step": 89046, "epoch": 1072} {"train_loss": -21.352359771728516, "global_step": 89047, "epoch": 1072} {"train_loss": -21.525583267211914, "global_step": 89048, "epoch": 1072} {"train_loss": -21.404077529907227, "global_step": 89049, "epoch": 1072} {"train_loss": -21.157745361328125, "global_step": 89050, "epoch": 1072} {"train_loss": -21.768842697143555, "global_step": 89051, "epoch": 1072} {"train_loss": -21.163015365600586, "global_step": 89052, "epoch": 1072} {"train_loss": -21.07623863220215, "global_step": 89053, "epoch": 1072} {"train_loss": -21.495573043823242, "global_step": 89054, "epoch": 1072} {"train_loss": -21.401765823364258, "global_step": 89055, "epoch": 1072} {"train_loss": -21.594755172729492, "global_step": 89056, "epoch": 1072} {"train_loss": -21.60647201538086, "global_step": 89057, "epoch": 1072} {"train_loss": -21.48475948012019, "global_step": 89058, "epoch": 1072, "val_loss": 6157641.5} {"train_loss": -21.287498474121094, "global_step": 89059, "epoch": 1073} {"train_loss": -21.480670928955078, "global_step": 89060, "epoch": 1073} {"train_loss": -21.503957748413086, "global_step": 89061, "epoch": 1073} {"train_loss": -21.585195541381836, "global_step": 89062, "epoch": 1073} {"train_loss": -20.817495346069336, "global_step": 89063, "epoch": 1073} {"train_loss": -21.4017391204834, "global_step": 89064, "epoch": 1073} {"train_loss": -21.400604248046875, "global_step": 89065, "epoch": 1073} {"train_loss": -21.61467933654785, "global_step": 89066, "epoch": 1073} {"train_loss": -21.551305770874023, "global_step": 89067, "epoch": 1073} {"train_loss": -21.153884887695312, "global_step": 89068, "epoch": 1073} {"train_loss": -21.628036499023438, "global_step": 89069, "epoch": 1073} {"train_loss": -21.305124282836914, "global_step": 89070, "epoch": 1073} {"train_loss": -21.55863380432129, "global_step": 89071, "epoch": 1073} {"train_loss": -21.09120750427246, "global_step": 89072, "epoch": 1073} {"train_loss": -21.70088005065918, "global_step": 89073, "epoch": 1073} {"train_loss": -21.61408805847168, "global_step": 89074, "epoch": 1073} {"train_loss": -21.607559204101562, "global_step": 89075, "epoch": 1073} {"train_loss": -21.450572967529297, "global_step": 89076, "epoch": 1073} {"train_loss": -21.27215003967285, "global_step": 89077, "epoch": 1073} {"train_loss": -21.633785247802734, "global_step": 89078, "epoch": 1073} {"train_loss": -21.454360961914062, "global_step": 89079, "epoch": 1073} {"train_loss": -21.462474822998047, "global_step": 89080, "epoch": 1073} {"train_loss": -21.466934204101562, "global_step": 89081, "epoch": 1073} {"train_loss": -21.46381950378418, "global_step": 89082, "epoch": 1073} {"train_loss": -21.530609130859375, "global_step": 89083, "epoch": 1073} {"train_loss": -21.646543502807617, "global_step": 89084, "epoch": 1073} {"train_loss": -21.464008331298828, "global_step": 89085, "epoch": 1073} {"train_loss": -21.687129974365234, "global_step": 89086, "epoch": 1073} {"train_loss": -21.386014938354492, "global_step": 89087, "epoch": 1073} {"train_loss": -21.561307907104492, "global_step": 89088, "epoch": 1073} {"train_loss": -21.82037925720215, "global_step": 89089, "epoch": 1073} {"train_loss": -21.500267028808594, "global_step": 89090, "epoch": 1073} {"train_loss": -21.765670776367188, "global_step": 89091, "epoch": 1073} {"train_loss": -21.67379379272461, "global_step": 89092, "epoch": 1073} {"train_loss": -21.46962547302246, "global_step": 89093, "epoch": 1073} {"train_loss": -21.754165649414062, "global_step": 89094, "epoch": 1073} {"train_loss": -21.471805572509766, "global_step": 89095, "epoch": 1073} {"train_loss": -21.465396881103516, "global_step": 89096, "epoch": 1073} {"train_loss": -21.518747329711914, "global_step": 89097, "epoch": 1073} {"train_loss": -21.759485244750977, "global_step": 89098, "epoch": 1073} {"train_loss": -21.725624084472656, "global_step": 89099, "epoch": 1073} {"train_loss": -21.71109390258789, "global_step": 89100, "epoch": 1073} {"train_loss": -21.646780014038086, "global_step": 89101, "epoch": 1073} {"train_loss": -21.742677688598633, "global_step": 89102, "epoch": 1073} {"train_loss": -21.42589569091797, "global_step": 89103, "epoch": 1073} {"train_loss": -21.63143539428711, "global_step": 89104, "epoch": 1073} {"train_loss": -21.407432556152344, "global_step": 89105, "epoch": 1073} {"train_loss": -21.748456954956055, "global_step": 89106, "epoch": 1073} {"train_loss": -20.869260787963867, "global_step": 89107, "epoch": 1073} {"train_loss": -21.665573120117188, "global_step": 89108, "epoch": 1073} {"train_loss": -21.48127555847168, "global_step": 89109, "epoch": 1073} {"train_loss": -21.351247787475586, "global_step": 89110, "epoch": 1073} {"train_loss": -21.36421012878418, "global_step": 89111, "epoch": 1073} {"train_loss": -21.63113021850586, "global_step": 89112, "epoch": 1073} {"train_loss": -21.65753936767578, "global_step": 89113, "epoch": 1073} {"train_loss": -21.62698745727539, "global_step": 89114, "epoch": 1073} {"train_loss": -21.615131378173828, "global_step": 89115, "epoch": 1073} {"train_loss": -21.706035614013672, "global_step": 89116, "epoch": 1073} {"train_loss": -21.224578857421875, "global_step": 89117, "epoch": 1073} {"train_loss": -21.580121994018555, "global_step": 89118, "epoch": 1073} {"train_loss": -21.61164665222168, "global_step": 89119, "epoch": 1073} {"train_loss": -21.028791427612305, "global_step": 89120, "epoch": 1073} {"train_loss": -21.561243057250977, "global_step": 89121, "epoch": 1073} {"train_loss": -21.6191349029541, "global_step": 89122, "epoch": 1073} {"train_loss": -21.314157485961914, "global_step": 89123, "epoch": 1073} {"train_loss": -21.776443481445312, "global_step": 89124, "epoch": 1073} {"train_loss": -21.774829864501953, "global_step": 89125, "epoch": 1073} {"train_loss": -21.545608520507812, "global_step": 89126, "epoch": 1073} {"train_loss": -21.473976135253906, "global_step": 89127, "epoch": 1073} {"train_loss": -21.48650550842285, "global_step": 89128, "epoch": 1073} {"train_loss": -21.52725601196289, "global_step": 89129, "epoch": 1073} {"train_loss": -21.475372314453125, "global_step": 89130, "epoch": 1073} {"train_loss": -21.636518478393555, "global_step": 89131, "epoch": 1073} {"train_loss": -21.553367614746094, "global_step": 89132, "epoch": 1073} {"train_loss": -21.77685546875, "global_step": 89133, "epoch": 1073} {"train_loss": -21.90858268737793, "global_step": 89134, "epoch": 1073} {"train_loss": -21.651227951049805, "global_step": 89135, "epoch": 1073} {"train_loss": -21.73468017578125, "global_step": 89136, "epoch": 1073} {"train_loss": -21.645713806152344, "global_step": 89137, "epoch": 1073} {"train_loss": -21.556232452392578, "global_step": 89138, "epoch": 1073} {"train_loss": -21.621387481689453, "global_step": 89139, "epoch": 1073} {"train_loss": -21.453001022338867, "global_step": 89140, "epoch": 1073} {"train_loss": -21.548056636948182, "global_step": 89141, "epoch": 1073, "val_loss": 6190377.0} {"train_loss": -21.039762496948242, "global_step": 89142, "epoch": 1074} {"train_loss": -21.1569766998291, "global_step": 89143, "epoch": 1074} {"train_loss": -21.01519012451172, "global_step": 89144, "epoch": 1074} {"train_loss": -21.199268341064453, "global_step": 89145, "epoch": 1074} {"train_loss": -21.26315689086914, "global_step": 89146, "epoch": 1074} {"train_loss": -21.236284255981445, "global_step": 89147, "epoch": 1074} {"train_loss": -21.123517990112305, "global_step": 89148, "epoch": 1074} {"train_loss": -20.992029190063477, "global_step": 89149, "epoch": 1074} {"train_loss": -21.300708770751953, "global_step": 89150, "epoch": 1074} {"train_loss": -21.209583282470703, "global_step": 89151, "epoch": 1074} {"train_loss": -21.31952476501465, "global_step": 89152, "epoch": 1074} {"train_loss": -21.275461196899414, "global_step": 89153, "epoch": 1074} {"train_loss": -21.370214462280273, "global_step": 89154, "epoch": 1074} {"train_loss": -21.501468658447266, "global_step": 89155, "epoch": 1074} {"train_loss": -21.30263328552246, "global_step": 89156, "epoch": 1074} {"train_loss": -21.624279022216797, "global_step": 89157, "epoch": 1074} {"train_loss": -21.628677368164062, "global_step": 89158, "epoch": 1074} {"train_loss": -21.589208602905273, "global_step": 89159, "epoch": 1074} {"train_loss": -21.277135848999023, "global_step": 89160, "epoch": 1074} {"train_loss": -21.48394775390625, "global_step": 89161, "epoch": 1074} {"train_loss": -21.512746810913086, "global_step": 89162, "epoch": 1074} {"train_loss": -21.712369918823242, "global_step": 89163, "epoch": 1074} {"train_loss": -21.361923217773438, "global_step": 89164, "epoch": 1074} {"train_loss": -21.998525619506836, "global_step": 89165, "epoch": 1074} {"train_loss": -21.087656021118164, "global_step": 89166, "epoch": 1074} {"train_loss": -21.5799503326416, "global_step": 89167, "epoch": 1074} {"train_loss": -21.526546478271484, "global_step": 89168, "epoch": 1074} {"train_loss": -21.2576961517334, "global_step": 89169, "epoch": 1074} {"train_loss": -21.284528732299805, "global_step": 89170, "epoch": 1074} {"train_loss": -21.90561866760254, "global_step": 89171, "epoch": 1074} {"train_loss": -21.178058624267578, "global_step": 89172, "epoch": 1074} {"train_loss": -22.022438049316406, "global_step": 89173, "epoch": 1074} {"train_loss": -21.64455223083496, "global_step": 89174, "epoch": 1074} {"train_loss": -21.49757194519043, "global_step": 89175, "epoch": 1074} {"train_loss": -21.243406295776367, "global_step": 89176, "epoch": 1074} {"train_loss": -21.28595542907715, "global_step": 89177, "epoch": 1074} {"train_loss": -21.444427490234375, "global_step": 89178, "epoch": 1074} {"train_loss": -21.590438842773438, "global_step": 89179, "epoch": 1074} {"train_loss": -21.8573055267334, "global_step": 89180, "epoch": 1074} {"train_loss": -21.520706176757812, "global_step": 89181, "epoch": 1074} {"train_loss": -21.753156661987305, "global_step": 89182, "epoch": 1074} {"train_loss": -22.042057037353516, "global_step": 89183, "epoch": 1074} {"train_loss": -21.523395538330078, "global_step": 89184, "epoch": 1074} {"train_loss": -21.683713912963867, "global_step": 89185, "epoch": 1074} {"train_loss": -21.803714752197266, "global_step": 89186, "epoch": 1074} {"train_loss": -21.57147216796875, "global_step": 89187, "epoch": 1074} {"train_loss": -21.666576385498047, "global_step": 89188, "epoch": 1074} {"train_loss": -21.59256935119629, "global_step": 89189, "epoch": 1074} {"train_loss": -21.927356719970703, "global_step": 89190, "epoch": 1074} {"train_loss": -21.618778228759766, "global_step": 89191, "epoch": 1074} {"train_loss": -21.539295196533203, "global_step": 89192, "epoch": 1074} {"train_loss": -21.584980010986328, "global_step": 89193, "epoch": 1074} {"train_loss": -21.916912078857422, "global_step": 89194, "epoch": 1074} {"train_loss": -21.85145378112793, "global_step": 89195, "epoch": 1074} {"train_loss": -21.553665161132812, "global_step": 89196, "epoch": 1074} {"train_loss": -21.8819637298584, "global_step": 89197, "epoch": 1074} {"train_loss": -21.327268600463867, "global_step": 89198, "epoch": 1074} {"train_loss": -21.084699630737305, "global_step": 89199, "epoch": 1074} {"train_loss": -21.481826782226562, "global_step": 89200, "epoch": 1074} {"train_loss": -21.362194061279297, "global_step": 89201, "epoch": 1074} {"train_loss": -21.379724502563477, "global_step": 89202, "epoch": 1074} {"train_loss": -21.855365753173828, "global_step": 89203, "epoch": 1074} {"train_loss": -21.909645080566406, "global_step": 89204, "epoch": 1074} {"train_loss": -21.70810317993164, "global_step": 89205, "epoch": 1074} {"train_loss": -21.798770904541016, "global_step": 89206, "epoch": 1074} {"train_loss": -21.7596492767334, "global_step": 89207, "epoch": 1074} {"train_loss": -21.57265281677246, "global_step": 89208, "epoch": 1074} {"train_loss": -21.56777000427246, "global_step": 89209, "epoch": 1074} {"train_loss": -21.50307273864746, "global_step": 89210, "epoch": 1074} {"train_loss": -21.4335880279541, "global_step": 89211, "epoch": 1074} {"train_loss": -21.5399169921875, "global_step": 89212, "epoch": 1074} {"train_loss": -21.926830291748047, "global_step": 89213, "epoch": 1074} {"train_loss": -21.237043380737305, "global_step": 89214, "epoch": 1074} {"train_loss": -21.14485740661621, "global_step": 89215, "epoch": 1074} {"train_loss": -21.745641708374023, "global_step": 89216, "epoch": 1074} {"train_loss": -21.220956802368164, "global_step": 89217, "epoch": 1074} {"train_loss": -21.51923942565918, "global_step": 89218, "epoch": 1074} {"train_loss": -21.6695499420166, "global_step": 89219, "epoch": 1074} {"train_loss": -21.2724609375, "global_step": 89220, "epoch": 1074} {"train_loss": -21.44636344909668, "global_step": 89221, "epoch": 1074} {"train_loss": -21.204151153564453, "global_step": 89222, "epoch": 1074} {"train_loss": -21.714982986450195, "global_step": 89223, "epoch": 1074} {"train_loss": -21.514842826199818, "global_step": 89224, "epoch": 1074, "val_loss": 6076183.0} {"train_loss": -20.975351333618164, "global_step": 89225, "epoch": 1075} {"train_loss": -21.338224411010742, "global_step": 89226, "epoch": 1075} {"train_loss": -20.880752563476562, "global_step": 89227, "epoch": 1075} {"train_loss": -21.08484649658203, "global_step": 89228, "epoch": 1075} {"train_loss": -21.146244049072266, "global_step": 89229, "epoch": 1075} {"train_loss": -20.709083557128906, "global_step": 89230, "epoch": 1075} {"train_loss": -21.440570831298828, "global_step": 89231, "epoch": 1075} {"train_loss": -21.067777633666992, "global_step": 89232, "epoch": 1075} {"train_loss": -21.02121925354004, "global_step": 89233, "epoch": 1075} {"train_loss": -21.25050163269043, "global_step": 89234, "epoch": 1075} {"train_loss": -21.037113189697266, "global_step": 89235, "epoch": 1075} {"train_loss": -21.342344284057617, "global_step": 89236, "epoch": 1075} {"train_loss": -21.33110809326172, "global_step": 89237, "epoch": 1075} {"train_loss": -21.36673927307129, "global_step": 89238, "epoch": 1075} {"train_loss": -21.548185348510742, "global_step": 89239, "epoch": 1075} {"train_loss": -21.563335418701172, "global_step": 89240, "epoch": 1075} {"train_loss": -21.352737426757812, "global_step": 89241, "epoch": 1075} {"train_loss": -21.443042755126953, "global_step": 89242, "epoch": 1075} {"train_loss": -21.304296493530273, "global_step": 89243, "epoch": 1075} {"train_loss": -21.608076095581055, "global_step": 89244, "epoch": 1075} {"train_loss": -21.51217269897461, "global_step": 89245, "epoch": 1075} {"train_loss": -21.285736083984375, "global_step": 89246, "epoch": 1075} {"train_loss": -21.629535675048828, "global_step": 89247, "epoch": 1075} {"train_loss": -21.532520294189453, "global_step": 89248, "epoch": 1075} {"train_loss": -21.092975616455078, "global_step": 89249, "epoch": 1075} {"train_loss": -21.63340950012207, "global_step": 89250, "epoch": 1075} {"train_loss": -21.195531845092773, "global_step": 89251, "epoch": 1075} {"train_loss": -21.446901321411133, "global_step": 89252, "epoch": 1075} {"train_loss": -21.64876365661621, "global_step": 89253, "epoch": 1075} {"train_loss": -21.325586318969727, "global_step": 89254, "epoch": 1075} {"train_loss": -21.157913208007812, "global_step": 89255, "epoch": 1075} {"train_loss": -21.574447631835938, "global_step": 89256, "epoch": 1075} {"train_loss": -21.583568572998047, "global_step": 89257, "epoch": 1075} {"train_loss": -21.186182022094727, "global_step": 89258, "epoch": 1075} {"train_loss": -21.547666549682617, "global_step": 89259, "epoch": 1075} {"train_loss": -21.378890991210938, "global_step": 89260, "epoch": 1075} {"train_loss": -21.668886184692383, "global_step": 89261, "epoch": 1075} {"train_loss": -21.619029998779297, "global_step": 89262, "epoch": 1075} {"train_loss": -21.836950302124023, "global_step": 89263, "epoch": 1075} {"train_loss": -21.397796630859375, "global_step": 89264, "epoch": 1075} {"train_loss": -21.88888931274414, "global_step": 89265, "epoch": 1075} {"train_loss": -21.392642974853516, "global_step": 89266, "epoch": 1075} {"train_loss": -21.483261108398438, "global_step": 89267, "epoch": 1075} {"train_loss": -21.69927978515625, "global_step": 89268, "epoch": 1075} {"train_loss": -21.518077850341797, "global_step": 89269, "epoch": 1075} {"train_loss": -21.427698135375977, "global_step": 89270, "epoch": 1075} {"train_loss": -21.708126068115234, "global_step": 89271, "epoch": 1075} {"train_loss": -21.204730987548828, "global_step": 89272, "epoch": 1075} {"train_loss": -21.449928283691406, "global_step": 89273, "epoch": 1075} {"train_loss": -21.72822380065918, "global_step": 89274, "epoch": 1075} {"train_loss": -21.606046676635742, "global_step": 89275, "epoch": 1075} {"train_loss": -21.87270736694336, "global_step": 89276, "epoch": 1075} {"train_loss": -21.377424240112305, "global_step": 89277, "epoch": 1075} {"train_loss": -21.895858764648438, "global_step": 89278, "epoch": 1075} {"train_loss": -21.526884078979492, "global_step": 89279, "epoch": 1075} {"train_loss": -21.6223201751709, "global_step": 89280, "epoch": 1075} {"train_loss": -20.958887100219727, "global_step": 89281, "epoch": 1075} {"train_loss": -21.926319122314453, "global_step": 89282, "epoch": 1075} {"train_loss": -22.0422306060791, "global_step": 89283, "epoch": 1075} {"train_loss": -21.615869522094727, "global_step": 89284, "epoch": 1075} {"train_loss": -21.84152603149414, "global_step": 89285, "epoch": 1075} {"train_loss": -21.740856170654297, "global_step": 89286, "epoch": 1075} {"train_loss": -21.550222396850586, "global_step": 89287, "epoch": 1075} {"train_loss": -21.373218536376953, "global_step": 89288, "epoch": 1075} {"train_loss": -21.184099197387695, "global_step": 89289, "epoch": 1075} {"train_loss": -21.65552520751953, "global_step": 89290, "epoch": 1075} {"train_loss": -21.668813705444336, "global_step": 89291, "epoch": 1075} {"train_loss": -21.7616024017334, "global_step": 89292, "epoch": 1075} {"train_loss": -21.33455467224121, "global_step": 89293, "epoch": 1075} {"train_loss": -21.439573287963867, "global_step": 89294, "epoch": 1075} {"train_loss": -21.739032745361328, "global_step": 89295, "epoch": 1075} {"train_loss": -21.751157760620117, "global_step": 89296, "epoch": 1075} {"train_loss": -21.28564453125, "global_step": 89297, "epoch": 1075} {"train_loss": -21.5521297454834, "global_step": 89298, "epoch": 1075} {"train_loss": -21.753711700439453, "global_step": 89299, "epoch": 1075} {"train_loss": -21.354846954345703, "global_step": 89300, "epoch": 1075} {"train_loss": -21.659086227416992, "global_step": 89301, "epoch": 1075} {"train_loss": -21.635284423828125, "global_step": 89302, "epoch": 1075} {"train_loss": -21.224456787109375, "global_step": 89303, "epoch": 1075} {"train_loss": -21.434432983398438, "global_step": 89304, "epoch": 1075} {"train_loss": -21.466093063354492, "global_step": 89305, "epoch": 1075} {"train_loss": -21.427637100219727, "global_step": 89306, "epoch": 1075} {"train_loss": -21.46040996873235, "global_step": 89307, "epoch": 1075, "val_loss": 6132686.5} {"train_loss": -21.091123580932617, "global_step": 89308, "epoch": 1076} {"train_loss": -21.36983871459961, "global_step": 89309, "epoch": 1076} {"train_loss": -21.380464553833008, "global_step": 89310, "epoch": 1076} {"train_loss": -21.068403244018555, "global_step": 89311, "epoch": 1076} {"train_loss": -21.148176193237305, "global_step": 89312, "epoch": 1076} {"train_loss": -21.572126388549805, "global_step": 89313, "epoch": 1076} {"train_loss": -21.127914428710938, "global_step": 89314, "epoch": 1076} {"train_loss": -21.57195281982422, "global_step": 89315, "epoch": 1076} {"train_loss": -21.49146270751953, "global_step": 89316, "epoch": 1076} {"train_loss": -21.287744522094727, "global_step": 89317, "epoch": 1076} {"train_loss": -21.649595260620117, "global_step": 89318, "epoch": 1076} {"train_loss": -21.163007736206055, "global_step": 89319, "epoch": 1076} {"train_loss": -21.339393615722656, "global_step": 89320, "epoch": 1076} {"train_loss": -21.301599502563477, "global_step": 89321, "epoch": 1076} {"train_loss": -21.47397804260254, "global_step": 89322, "epoch": 1076} {"train_loss": -21.3048095703125, "global_step": 89323, "epoch": 1076} {"train_loss": -21.239788055419922, "global_step": 89324, "epoch": 1076} {"train_loss": -21.51264190673828, "global_step": 89325, "epoch": 1076} {"train_loss": -21.53721809387207, "global_step": 89326, "epoch": 1076} {"train_loss": -21.51386070251465, "global_step": 89327, "epoch": 1076} {"train_loss": -21.402677536010742, "global_step": 89328, "epoch": 1076} {"train_loss": -21.59183120727539, "global_step": 89329, "epoch": 1076} {"train_loss": -21.443830490112305, "global_step": 89330, "epoch": 1076} {"train_loss": -21.708250045776367, "global_step": 89331, "epoch": 1076} {"train_loss": -21.6743106842041, "global_step": 89332, "epoch": 1076} {"train_loss": -21.232595443725586, "global_step": 89333, "epoch": 1076} {"train_loss": -21.4116153717041, "global_step": 89334, "epoch": 1076} {"train_loss": -21.66983413696289, "global_step": 89335, "epoch": 1076} {"train_loss": -21.49820327758789, "global_step": 89336, "epoch": 1076} {"train_loss": -21.497663497924805, "global_step": 89337, "epoch": 1076} {"train_loss": -21.595966339111328, "global_step": 89338, "epoch": 1076} {"train_loss": -21.49407196044922, "global_step": 89339, "epoch": 1076} {"train_loss": -21.42795753479004, "global_step": 89340, "epoch": 1076} {"train_loss": -21.4910945892334, "global_step": 89341, "epoch": 1076} {"train_loss": -21.423933029174805, "global_step": 89342, "epoch": 1076} {"train_loss": -21.40534782409668, "global_step": 89343, "epoch": 1076} {"train_loss": -21.525388717651367, "global_step": 89344, "epoch": 1076} {"train_loss": -21.50910758972168, "global_step": 89345, "epoch": 1076} {"train_loss": -21.64869499206543, "global_step": 89346, "epoch": 1076} {"train_loss": -21.536951065063477, "global_step": 89347, "epoch": 1076} {"train_loss": -21.592071533203125, "global_step": 89348, "epoch": 1076} {"train_loss": -21.890735626220703, "global_step": 89349, "epoch": 1076} {"train_loss": -21.458206176757812, "global_step": 89350, "epoch": 1076} {"train_loss": -21.745407104492188, "global_step": 89351, "epoch": 1076} {"train_loss": -21.5263729095459, "global_step": 89352, "epoch": 1076} {"train_loss": -21.614364624023438, "global_step": 89353, "epoch": 1076} {"train_loss": -21.391477584838867, "global_step": 89354, "epoch": 1076} {"train_loss": -21.15805435180664, "global_step": 89355, "epoch": 1076} {"train_loss": -21.85452651977539, "global_step": 89356, "epoch": 1076} {"train_loss": -21.562410354614258, "global_step": 89357, "epoch": 1076} {"train_loss": -21.468420028686523, "global_step": 89358, "epoch": 1076} {"train_loss": -21.280426025390625, "global_step": 89359, "epoch": 1076} {"train_loss": -21.683246612548828, "global_step": 89360, "epoch": 1076} {"train_loss": -21.39411163330078, "global_step": 89361, "epoch": 1076} {"train_loss": -21.66912841796875, "global_step": 89362, "epoch": 1076} {"train_loss": -21.640409469604492, "global_step": 89363, "epoch": 1076} {"train_loss": -21.427104949951172, "global_step": 89364, "epoch": 1076} {"train_loss": -21.71001625061035, "global_step": 89365, "epoch": 1076} {"train_loss": -21.706348419189453, "global_step": 89366, "epoch": 1076} {"train_loss": -21.39607810974121, "global_step": 89367, "epoch": 1076} {"train_loss": -21.517995834350586, "global_step": 89368, "epoch": 1076} {"train_loss": -21.683523178100586, "global_step": 89369, "epoch": 1076} {"train_loss": -21.203550338745117, "global_step": 89370, "epoch": 1076} {"train_loss": -21.63928985595703, "global_step": 89371, "epoch": 1076} {"train_loss": -21.79764175415039, "global_step": 89372, "epoch": 1076} {"train_loss": -21.80609703063965, "global_step": 89373, "epoch": 1076} {"train_loss": -21.499113082885742, "global_step": 89374, "epoch": 1076} {"train_loss": -21.71877098083496, "global_step": 89375, "epoch": 1076} {"train_loss": -21.517759323120117, "global_step": 89376, "epoch": 1076} {"train_loss": -21.33839225769043, "global_step": 89377, "epoch": 1076} {"train_loss": -21.484024047851562, "global_step": 89378, "epoch": 1076} {"train_loss": -21.640064239501953, "global_step": 89379, "epoch": 1076} {"train_loss": -21.51166343688965, "global_step": 89380, "epoch": 1076} {"train_loss": -21.75459861755371, "global_step": 89381, "epoch": 1076} {"train_loss": -21.306598663330078, "global_step": 89382, "epoch": 1076} {"train_loss": -21.5041561126709, "global_step": 89383, "epoch": 1076} {"train_loss": -21.890348434448242, "global_step": 89384, "epoch": 1076} {"train_loss": -21.757606506347656, "global_step": 89385, "epoch": 1076} {"train_loss": -21.762113571166992, "global_step": 89386, "epoch": 1076} {"train_loss": -21.522329330444336, "global_step": 89387, "epoch": 1076} {"train_loss": -21.94455909729004, "global_step": 89388, "epoch": 1076} {"train_loss": -21.463327407836914, "global_step": 89389, "epoch": 1076} {"train_loss": -21.50080582032721, "global_step": 89390, "epoch": 1076, "val_loss": 6102632.5} {"train_loss": -21.1868953704834, "global_step": 89391, "epoch": 1077} {"train_loss": -21.570981979370117, "global_step": 89392, "epoch": 1077} {"train_loss": -21.619298934936523, "global_step": 89393, "epoch": 1077} {"train_loss": -21.900548934936523, "global_step": 89394, "epoch": 1077} {"train_loss": -21.440458297729492, "global_step": 89395, "epoch": 1077} {"train_loss": -21.340415954589844, "global_step": 89396, "epoch": 1077} {"train_loss": -21.41840934753418, "global_step": 89397, "epoch": 1077} {"train_loss": -21.916547775268555, "global_step": 89398, "epoch": 1077} {"train_loss": -21.339895248413086, "global_step": 89399, "epoch": 1077} {"train_loss": -21.882429122924805, "global_step": 89400, "epoch": 1077} {"train_loss": -21.35213279724121, "global_step": 89401, "epoch": 1077} {"train_loss": -21.249807357788086, "global_step": 89402, "epoch": 1077} {"train_loss": -21.689115524291992, "global_step": 89403, "epoch": 1077} {"train_loss": -21.541379928588867, "global_step": 89404, "epoch": 1077} {"train_loss": -21.64858055114746, "global_step": 89405, "epoch": 1077} {"train_loss": -21.337921142578125, "global_step": 89406, "epoch": 1077} {"train_loss": -21.70206069946289, "global_step": 89407, "epoch": 1077} {"train_loss": -21.68890380859375, "global_step": 89408, "epoch": 1077} {"train_loss": -21.619596481323242, "global_step": 89409, "epoch": 1077} {"train_loss": -21.532323837280273, "global_step": 89410, "epoch": 1077} {"train_loss": -21.30295753479004, "global_step": 89411, "epoch": 1077} {"train_loss": -21.723974227905273, "global_step": 89412, "epoch": 1077} {"train_loss": -21.546899795532227, "global_step": 89413, "epoch": 1077} {"train_loss": -21.434791564941406, "global_step": 89414, "epoch": 1077} {"train_loss": -21.271148681640625, "global_step": 89415, "epoch": 1077} {"train_loss": -21.30225944519043, "global_step": 89416, "epoch": 1077} {"train_loss": -21.558391571044922, "global_step": 89417, "epoch": 1077} {"train_loss": -21.38474464416504, "global_step": 89418, "epoch": 1077} {"train_loss": -21.434125900268555, "global_step": 89419, "epoch": 1077} {"train_loss": -21.75273323059082, "global_step": 89420, "epoch": 1077} {"train_loss": -21.449220657348633, "global_step": 89421, "epoch": 1077} {"train_loss": -21.724149703979492, "global_step": 89422, "epoch": 1077} {"train_loss": -21.1636962890625, "global_step": 89423, "epoch": 1077} {"train_loss": -21.99234962463379, "global_step": 89424, "epoch": 1077} {"train_loss": -21.34689712524414, "global_step": 89425, "epoch": 1077} {"train_loss": -21.291908264160156, "global_step": 89426, "epoch": 1077} {"train_loss": -21.548954010009766, "global_step": 89427, "epoch": 1077} {"train_loss": -21.618947982788086, "global_step": 89428, "epoch": 1077} {"train_loss": -21.745635986328125, "global_step": 89429, "epoch": 1077} {"train_loss": -21.578927993774414, "global_step": 89430, "epoch": 1077} {"train_loss": -21.457178115844727, "global_step": 89431, "epoch": 1077} {"train_loss": -21.183441162109375, "global_step": 89432, "epoch": 1077} {"train_loss": -21.581037521362305, "global_step": 89433, "epoch": 1077} {"train_loss": -22.098098754882812, "global_step": 89434, "epoch": 1077} {"train_loss": -21.564193725585938, "global_step": 89435, "epoch": 1077} {"train_loss": -21.685338973999023, "global_step": 89436, "epoch": 1077} {"train_loss": -21.521499633789062, "global_step": 89437, "epoch": 1077} {"train_loss": -21.3492374420166, "global_step": 89438, "epoch": 1077} {"train_loss": -21.663890838623047, "global_step": 89439, "epoch": 1077} {"train_loss": -21.55195426940918, "global_step": 89440, "epoch": 1077} {"train_loss": -21.589702606201172, "global_step": 89441, "epoch": 1077} {"train_loss": -21.559926986694336, "global_step": 89442, "epoch": 1077} {"train_loss": -21.406728744506836, "global_step": 89443, "epoch": 1077} {"train_loss": -21.944366455078125, "global_step": 89444, "epoch": 1077} {"train_loss": -21.579147338867188, "global_step": 89445, "epoch": 1077} {"train_loss": -21.8201847076416, "global_step": 89446, "epoch": 1077} {"train_loss": -21.636899948120117, "global_step": 89447, "epoch": 1077} {"train_loss": -21.653623580932617, "global_step": 89448, "epoch": 1077} {"train_loss": -21.80216407775879, "global_step": 89449, "epoch": 1077} {"train_loss": -21.41948127746582, "global_step": 89450, "epoch": 1077} {"train_loss": -21.662145614624023, "global_step": 89451, "epoch": 1077} {"train_loss": -21.77467155456543, "global_step": 89452, "epoch": 1077} {"train_loss": -21.743030548095703, "global_step": 89453, "epoch": 1077} {"train_loss": -21.37344741821289, "global_step": 89454, "epoch": 1077} {"train_loss": -21.76192283630371, "global_step": 89455, "epoch": 1077} {"train_loss": -21.560712814331055, "global_step": 89456, "epoch": 1077} {"train_loss": -21.53074073791504, "global_step": 89457, "epoch": 1077} {"train_loss": -21.904003143310547, "global_step": 89458, "epoch": 1077} {"train_loss": -21.266233444213867, "global_step": 89459, "epoch": 1077} {"train_loss": -21.35239028930664, "global_step": 89460, "epoch": 1077} {"train_loss": -21.6323184967041, "global_step": 89461, "epoch": 1077} {"train_loss": -21.45530128479004, "global_step": 89462, "epoch": 1077} {"train_loss": -21.81007957458496, "global_step": 89463, "epoch": 1077} {"train_loss": -21.509714126586914, "global_step": 89464, "epoch": 1077} {"train_loss": -21.679218292236328, "global_step": 89465, "epoch": 1077} {"train_loss": -21.59916114807129, "global_step": 89466, "epoch": 1077} {"train_loss": -21.825185775756836, "global_step": 89467, "epoch": 1077} {"train_loss": -21.747291564941406, "global_step": 89468, "epoch": 1077} {"train_loss": -21.657846450805664, "global_step": 89469, "epoch": 1077} {"train_loss": -21.506174087524414, "global_step": 89470, "epoch": 1077} {"train_loss": -21.934921264648438, "global_step": 89471, "epoch": 1077} {"train_loss": -21.822383880615234, "global_step": 89472, "epoch": 1077} {"train_loss": -21.565470385264202, "global_step": 89473, "epoch": 1077, "val_loss": 6172676.5} {"train_loss": -21.865829467773438, "global_step": 89474, "epoch": 1078} {"train_loss": -21.548215866088867, "global_step": 89475, "epoch": 1078} {"train_loss": -21.407726287841797, "global_step": 89476, "epoch": 1078} {"train_loss": -21.4630184173584, "global_step": 89477, "epoch": 1078} {"train_loss": -21.259824752807617, "global_step": 89478, "epoch": 1078} {"train_loss": -21.75526237487793, "global_step": 89479, "epoch": 1078} {"train_loss": -21.0624942779541, "global_step": 89480, "epoch": 1078} {"train_loss": -21.5711727142334, "global_step": 89481, "epoch": 1078} {"train_loss": -21.118391036987305, "global_step": 89482, "epoch": 1078} {"train_loss": -21.076387405395508, "global_step": 89483, "epoch": 1078} {"train_loss": -21.35091209411621, "global_step": 89484, "epoch": 1078} {"train_loss": -21.42523193359375, "global_step": 89485, "epoch": 1078} {"train_loss": -21.410200119018555, "global_step": 89486, "epoch": 1078} {"train_loss": -20.9024658203125, "global_step": 89487, "epoch": 1078} {"train_loss": -21.38028907775879, "global_step": 89488, "epoch": 1078} {"train_loss": -21.329795837402344, "global_step": 89489, "epoch": 1078} {"train_loss": -21.43948745727539, "global_step": 89490, "epoch": 1078} {"train_loss": -21.54556655883789, "global_step": 89491, "epoch": 1078} {"train_loss": -21.5332088470459, "global_step": 89492, "epoch": 1078} {"train_loss": -21.437335968017578, "global_step": 89493, "epoch": 1078} {"train_loss": -21.475072860717773, "global_step": 89494, "epoch": 1078} {"train_loss": -21.43434715270996, "global_step": 89495, "epoch": 1078} {"train_loss": -21.121810913085938, "global_step": 89496, "epoch": 1078} {"train_loss": -21.815738677978516, "global_step": 89497, "epoch": 1078} {"train_loss": -21.2706356048584, "global_step": 89498, "epoch": 1078} {"train_loss": -21.380130767822266, "global_step": 89499, "epoch": 1078} {"train_loss": -21.551679611206055, "global_step": 89500, "epoch": 1078} {"train_loss": -21.50764274597168, "global_step": 89501, "epoch": 1078} {"train_loss": -21.87911605834961, "global_step": 89502, "epoch": 1078} {"train_loss": -21.42758560180664, "global_step": 89503, "epoch": 1078} {"train_loss": -21.25351905822754, "global_step": 89504, "epoch": 1078} {"train_loss": -22.03515625, "global_step": 89505, "epoch": 1078} {"train_loss": -21.5911922454834, "global_step": 89506, "epoch": 1078} {"train_loss": -21.110549926757812, "global_step": 89507, "epoch": 1078} {"train_loss": -21.369070053100586, "global_step": 89508, "epoch": 1078} {"train_loss": -21.483884811401367, "global_step": 89509, "epoch": 1078} {"train_loss": -21.914981842041016, "global_step": 89510, "epoch": 1078} {"train_loss": -21.566349029541016, "global_step": 89511, "epoch": 1078} {"train_loss": -21.692312240600586, "global_step": 89512, "epoch": 1078} {"train_loss": -21.748228073120117, "global_step": 89513, "epoch": 1078} {"train_loss": -21.49934959411621, "global_step": 89514, "epoch": 1078} {"train_loss": -21.41758155822754, "global_step": 89515, "epoch": 1078} {"train_loss": -21.772140502929688, "global_step": 89516, "epoch": 1078} {"train_loss": -21.56817626953125, "global_step": 89517, "epoch": 1078} {"train_loss": -21.711776733398438, "global_step": 89518, "epoch": 1078} {"train_loss": -21.267724990844727, "global_step": 89519, "epoch": 1078} {"train_loss": -21.608230590820312, "global_step": 89520, "epoch": 1078} {"train_loss": -21.660451889038086, "global_step": 89521, "epoch": 1078} {"train_loss": -21.48439598083496, "global_step": 89522, "epoch": 1078} {"train_loss": -21.49264144897461, "global_step": 89523, "epoch": 1078} {"train_loss": -21.46883773803711, "global_step": 89524, "epoch": 1078} {"train_loss": -21.31380271911621, "global_step": 89525, "epoch": 1078} {"train_loss": -21.206390380859375, "global_step": 89526, "epoch": 1078} {"train_loss": -21.412656784057617, "global_step": 89527, "epoch": 1078} {"train_loss": -21.60579490661621, "global_step": 89528, "epoch": 1078} {"train_loss": -21.86111831665039, "global_step": 89529, "epoch": 1078} {"train_loss": -21.490625381469727, "global_step": 89530, "epoch": 1078} {"train_loss": -21.87645149230957, "global_step": 89531, "epoch": 1078} {"train_loss": -21.786251068115234, "global_step": 89532, "epoch": 1078} {"train_loss": -21.8397274017334, "global_step": 89533, "epoch": 1078} {"train_loss": -21.865907669067383, "global_step": 89534, "epoch": 1078} {"train_loss": -21.655241012573242, "global_step": 89535, "epoch": 1078} {"train_loss": -21.457386016845703, "global_step": 89536, "epoch": 1078} {"train_loss": -21.98628044128418, "global_step": 89537, "epoch": 1078} {"train_loss": -21.3167667388916, "global_step": 89538, "epoch": 1078} {"train_loss": -21.430212020874023, "global_step": 89539, "epoch": 1078} {"train_loss": -21.78420066833496, "global_step": 89540, "epoch": 1078} {"train_loss": -21.736249923706055, "global_step": 89541, "epoch": 1078} {"train_loss": -21.738035202026367, "global_step": 89542, "epoch": 1078} {"train_loss": -21.770471572875977, "global_step": 89543, "epoch": 1078} {"train_loss": -21.617246627807617, "global_step": 89544, "epoch": 1078} {"train_loss": -21.618680953979492, "global_step": 89545, "epoch": 1078} {"train_loss": -21.39088249206543, "global_step": 89546, "epoch": 1078} {"train_loss": -21.391447067260742, "global_step": 89547, "epoch": 1078} {"train_loss": -21.459636688232422, "global_step": 89548, "epoch": 1078} {"train_loss": -22.0070858001709, "global_step": 89549, "epoch": 1078} {"train_loss": -21.57263946533203, "global_step": 89550, "epoch": 1078} {"train_loss": -21.52034568786621, "global_step": 89551, "epoch": 1078} {"train_loss": -21.73777198791504, "global_step": 89552, "epoch": 1078} {"train_loss": -21.637386322021484, "global_step": 89553, "epoch": 1078} {"train_loss": -21.443614959716797, "global_step": 89554, "epoch": 1078} {"train_loss": -21.536788940429688, "global_step": 89555, "epoch": 1078} {"train_loss": -21.53748509970056, "global_step": 89556, "epoch": 1078, "val_loss": 6043309.5} {"train_loss": -20.92807960510254, "global_step": 89557, "epoch": 1079} {"train_loss": -20.94972801208496, "global_step": 89558, "epoch": 1079} {"train_loss": -20.973371505737305, "global_step": 89559, "epoch": 1079} {"train_loss": -20.932941436767578, "global_step": 89560, "epoch": 1079} {"train_loss": -20.870620727539062, "global_step": 89561, "epoch": 1079} {"train_loss": -21.209117889404297, "global_step": 89562, "epoch": 1079} {"train_loss": -20.97317886352539, "global_step": 89563, "epoch": 1079} {"train_loss": -21.20306968688965, "global_step": 89564, "epoch": 1079} {"train_loss": -21.136510848999023, "global_step": 89565, "epoch": 1079} {"train_loss": -21.024581909179688, "global_step": 89566, "epoch": 1079} {"train_loss": -21.25142478942871, "global_step": 89567, "epoch": 1079} {"train_loss": -20.842010498046875, "global_step": 89568, "epoch": 1079} {"train_loss": -21.3731689453125, "global_step": 89569, "epoch": 1079} {"train_loss": -21.25292205810547, "global_step": 89570, "epoch": 1079} {"train_loss": -21.30524253845215, "global_step": 89571, "epoch": 1079} {"train_loss": -21.530902862548828, "global_step": 89572, "epoch": 1079} {"train_loss": -21.218490600585938, "global_step": 89573, "epoch": 1079} {"train_loss": -21.376638412475586, "global_step": 89574, "epoch": 1079} {"train_loss": -21.726789474487305, "global_step": 89575, "epoch": 1079} {"train_loss": -21.21546745300293, "global_step": 89576, "epoch": 1079} {"train_loss": -21.582944869995117, "global_step": 89577, "epoch": 1079} {"train_loss": -21.333724975585938, "global_step": 89578, "epoch": 1079} {"train_loss": -21.475862503051758, "global_step": 89579, "epoch": 1079} {"train_loss": -21.612165451049805, "global_step": 89580, "epoch": 1079} {"train_loss": -21.540904998779297, "global_step": 89581, "epoch": 1079} {"train_loss": -21.570632934570312, "global_step": 89582, "epoch": 1079} {"train_loss": -21.41961097717285, "global_step": 89583, "epoch": 1079} {"train_loss": -21.630456924438477, "global_step": 89584, "epoch": 1079} {"train_loss": -21.388486862182617, "global_step": 89585, "epoch": 1079} {"train_loss": -21.55461883544922, "global_step": 89586, "epoch": 1079} {"train_loss": -21.3234920501709, "global_step": 89587, "epoch": 1079} {"train_loss": -21.886404037475586, "global_step": 89588, "epoch": 1079} {"train_loss": -21.626251220703125, "global_step": 89589, "epoch": 1079} {"train_loss": -21.813121795654297, "global_step": 89590, "epoch": 1079} {"train_loss": -21.635852813720703, "global_step": 89591, "epoch": 1079} {"train_loss": -21.593929290771484, "global_step": 89592, "epoch": 1079} {"train_loss": -21.554319381713867, "global_step": 89593, "epoch": 1079} {"train_loss": -21.53627586364746, "global_step": 89594, "epoch": 1079} {"train_loss": -21.580581665039062, "global_step": 89595, "epoch": 1079} {"train_loss": -21.555240631103516, "global_step": 89596, "epoch": 1079} {"train_loss": -21.493982315063477, "global_step": 89597, "epoch": 1079} {"train_loss": -21.658584594726562, "global_step": 89598, "epoch": 1079} {"train_loss": -21.374771118164062, "global_step": 89599, "epoch": 1079} {"train_loss": -21.644739151000977, "global_step": 89600, "epoch": 1079} {"train_loss": -21.653045654296875, "global_step": 89601, "epoch": 1079} {"train_loss": -21.378271102905273, "global_step": 89602, "epoch": 1079} {"train_loss": -21.767593383789062, "global_step": 89603, "epoch": 1079} {"train_loss": -21.603174209594727, "global_step": 89604, "epoch": 1079} {"train_loss": -21.245264053344727, "global_step": 89605, "epoch": 1079} {"train_loss": -21.551700592041016, "global_step": 89606, "epoch": 1079} {"train_loss": -21.65839958190918, "global_step": 89607, "epoch": 1079} {"train_loss": -21.653995513916016, "global_step": 89608, "epoch": 1079} {"train_loss": -21.873476028442383, "global_step": 89609, "epoch": 1079} {"train_loss": -21.350196838378906, "global_step": 89610, "epoch": 1079} {"train_loss": -21.30335235595703, "global_step": 89611, "epoch": 1079} {"train_loss": -21.370508193969727, "global_step": 89612, "epoch": 1079} {"train_loss": -21.655231475830078, "global_step": 89613, "epoch": 1079} {"train_loss": -21.364852905273438, "global_step": 89614, "epoch": 1079} {"train_loss": -21.27521324157715, "global_step": 89615, "epoch": 1079} {"train_loss": -21.25601577758789, "global_step": 89616, "epoch": 1079} {"train_loss": -21.492551803588867, "global_step": 89617, "epoch": 1079} {"train_loss": -21.16872787475586, "global_step": 89618, "epoch": 1079} {"train_loss": -21.573209762573242, "global_step": 89619, "epoch": 1079} {"train_loss": -21.673166275024414, "global_step": 89620, "epoch": 1079} {"train_loss": -21.752498626708984, "global_step": 89621, "epoch": 1079} {"train_loss": -21.424457550048828, "global_step": 89622, "epoch": 1079} {"train_loss": -21.81572151184082, "global_step": 89623, "epoch": 1079} {"train_loss": -21.735065460205078, "global_step": 89624, "epoch": 1079} {"train_loss": -21.797649383544922, "global_step": 89625, "epoch": 1079} {"train_loss": -21.836206436157227, "global_step": 89626, "epoch": 1079} {"train_loss": -21.70242691040039, "global_step": 89627, "epoch": 1079} {"train_loss": -21.28631591796875, "global_step": 89628, "epoch": 1079} {"train_loss": -21.697874069213867, "global_step": 89629, "epoch": 1079} {"train_loss": -21.5257511138916, "global_step": 89630, "epoch": 1079} {"train_loss": -21.297393798828125, "global_step": 89631, "epoch": 1079} {"train_loss": -21.478605270385742, "global_step": 89632, "epoch": 1079} {"train_loss": -21.878664016723633, "global_step": 89633, "epoch": 1079} {"train_loss": -21.6205997467041, "global_step": 89634, "epoch": 1079} {"train_loss": -21.393964767456055, "global_step": 89635, "epoch": 1079} {"train_loss": -21.21885108947754, "global_step": 89636, "epoch": 1079} {"train_loss": -21.708982467651367, "global_step": 89637, "epoch": 1079} {"train_loss": -21.98543930053711, "global_step": 89638, "epoch": 1079} {"train_loss": -21.440191383821418, "global_step": 89639, "epoch": 1079, "val_loss": 6039504.5} {"train_loss": -20.7092227935791, "global_step": 89640, "epoch": 1080} {"train_loss": -20.905963897705078, "global_step": 89641, "epoch": 1080} {"train_loss": -20.901596069335938, "global_step": 89642, "epoch": 1080} {"train_loss": -20.713159561157227, "global_step": 89643, "epoch": 1080} {"train_loss": -21.182249069213867, "global_step": 89644, "epoch": 1080} {"train_loss": -21.204694747924805, "global_step": 89645, "epoch": 1080} {"train_loss": -21.024213790893555, "global_step": 89646, "epoch": 1080} {"train_loss": -21.422996520996094, "global_step": 89647, "epoch": 1080} {"train_loss": -21.338504791259766, "global_step": 89648, "epoch": 1080} {"train_loss": -21.122947692871094, "global_step": 89649, "epoch": 1080} {"train_loss": -21.089750289916992, "global_step": 89650, "epoch": 1080} {"train_loss": -21.419477462768555, "global_step": 89651, "epoch": 1080} {"train_loss": -21.283798217773438, "global_step": 89652, "epoch": 1080} {"train_loss": -21.084482192993164, "global_step": 89653, "epoch": 1080} {"train_loss": -21.202136993408203, "global_step": 89654, "epoch": 1080} {"train_loss": -21.31002426147461, "global_step": 89655, "epoch": 1080} {"train_loss": -20.90013313293457, "global_step": 89656, "epoch": 1080} {"train_loss": -21.530750274658203, "global_step": 89657, "epoch": 1080} {"train_loss": -21.043746948242188, "global_step": 89658, "epoch": 1080} {"train_loss": -21.608102798461914, "global_step": 89659, "epoch": 1080} {"train_loss": -21.319944381713867, "global_step": 89660, "epoch": 1080} {"train_loss": -21.855052947998047, "global_step": 89661, "epoch": 1080} {"train_loss": -21.418302536010742, "global_step": 89662, "epoch": 1080} {"train_loss": -21.548242568969727, "global_step": 89663, "epoch": 1080} {"train_loss": -21.76499366760254, "global_step": 89664, "epoch": 1080} {"train_loss": -21.208463668823242, "global_step": 89665, "epoch": 1080} {"train_loss": -21.567123413085938, "global_step": 89666, "epoch": 1080} {"train_loss": -21.487382888793945, "global_step": 89667, "epoch": 1080} {"train_loss": -21.06924057006836, "global_step": 89668, "epoch": 1080} {"train_loss": -21.464447021484375, "global_step": 89669, "epoch": 1080} {"train_loss": -21.493698120117188, "global_step": 89670, "epoch": 1080} {"train_loss": -21.35599708557129, "global_step": 89671, "epoch": 1080} {"train_loss": -21.705278396606445, "global_step": 89672, "epoch": 1080} {"train_loss": -21.47134780883789, "global_step": 89673, "epoch": 1080} {"train_loss": -21.508413314819336, "global_step": 89674, "epoch": 1080} {"train_loss": -21.555212020874023, "global_step": 89675, "epoch": 1080} {"train_loss": -21.22968292236328, "global_step": 89676, "epoch": 1080} {"train_loss": -21.667142868041992, "global_step": 89677, "epoch": 1080} {"train_loss": -21.547163009643555, "global_step": 89678, "epoch": 1080} {"train_loss": -21.740707397460938, "global_step": 89679, "epoch": 1080} {"train_loss": -21.62746238708496, "global_step": 89680, "epoch": 1080} {"train_loss": -21.274106979370117, "global_step": 89681, "epoch": 1080} {"train_loss": -21.2248592376709, "global_step": 89682, "epoch": 1080} {"train_loss": -21.637371063232422, "global_step": 89683, "epoch": 1080} {"train_loss": -21.776723861694336, "global_step": 89684, "epoch": 1080} {"train_loss": -21.61808204650879, "global_step": 89685, "epoch": 1080} {"train_loss": -21.747556686401367, "global_step": 89686, "epoch": 1080} {"train_loss": -21.821502685546875, "global_step": 89687, "epoch": 1080} {"train_loss": -22.097570419311523, "global_step": 89688, "epoch": 1080} {"train_loss": -21.527509689331055, "global_step": 89689, "epoch": 1080} {"train_loss": -21.650131225585938, "global_step": 89690, "epoch": 1080} {"train_loss": -21.437957763671875, "global_step": 89691, "epoch": 1080} {"train_loss": -21.362211227416992, "global_step": 89692, "epoch": 1080} {"train_loss": -21.525806427001953, "global_step": 89693, "epoch": 1080} {"train_loss": -21.903181076049805, "global_step": 89694, "epoch": 1080} {"train_loss": -21.541645050048828, "global_step": 89695, "epoch": 1080} {"train_loss": -21.52420425415039, "global_step": 89696, "epoch": 1080} {"train_loss": -21.71428871154785, "global_step": 89697, "epoch": 1080} {"train_loss": -21.426673889160156, "global_step": 89698, "epoch": 1080} {"train_loss": -21.180744171142578, "global_step": 89699, "epoch": 1080} {"train_loss": -21.539716720581055, "global_step": 89700, "epoch": 1080} {"train_loss": -21.522748947143555, "global_step": 89701, "epoch": 1080} {"train_loss": -21.337051391601562, "global_step": 89702, "epoch": 1080} {"train_loss": -21.561511993408203, "global_step": 89703, "epoch": 1080} {"train_loss": -21.74051856994629, "global_step": 89704, "epoch": 1080} {"train_loss": -21.30257225036621, "global_step": 89705, "epoch": 1080} {"train_loss": -21.911067962646484, "global_step": 89706, "epoch": 1080} {"train_loss": -21.488468170166016, "global_step": 89707, "epoch": 1080} {"train_loss": -21.606718063354492, "global_step": 89708, "epoch": 1080} {"train_loss": -21.125112533569336, "global_step": 89709, "epoch": 1080} {"train_loss": -21.835912704467773, "global_step": 89710, "epoch": 1080} {"train_loss": -21.814682006835938, "global_step": 89711, "epoch": 1080} {"train_loss": -21.587732315063477, "global_step": 89712, "epoch": 1080} {"train_loss": -21.554563522338867, "global_step": 89713, "epoch": 1080} {"train_loss": -21.500686645507812, "global_step": 89714, "epoch": 1080} {"train_loss": -21.429546356201172, "global_step": 89715, "epoch": 1080} {"train_loss": -21.71441078186035, "global_step": 89716, "epoch": 1080} {"train_loss": -21.320899963378906, "global_step": 89717, "epoch": 1080} {"train_loss": -21.880477905273438, "global_step": 89718, "epoch": 1080} {"train_loss": -21.82371711730957, "global_step": 89719, "epoch": 1080} {"train_loss": -21.6610164642334, "global_step": 89720, "epoch": 1080} {"train_loss": -21.32974624633789, "global_step": 89721, "epoch": 1080} {"train_loss": -21.4396342311997, "global_step": 89722, "epoch": 1080, "val_loss": 5984048.5} {"train_loss": -21.542882919311523, "global_step": 89723, "epoch": 1081} {"train_loss": -21.408109664916992, "global_step": 89724, "epoch": 1081} {"train_loss": -21.572832107543945, "global_step": 89725, "epoch": 1081} {"train_loss": -21.600942611694336, "global_step": 89726, "epoch": 1081} {"train_loss": -21.33284568786621, "global_step": 89727, "epoch": 1081} {"train_loss": -21.526735305786133, "global_step": 89728, "epoch": 1081} {"train_loss": -21.4868106842041, "global_step": 89729, "epoch": 1081} {"train_loss": -21.248395919799805, "global_step": 89730, "epoch": 1081} {"train_loss": -21.393518447875977, "global_step": 89731, "epoch": 1081} {"train_loss": -21.70125389099121, "global_step": 89732, "epoch": 1081} {"train_loss": -21.433486938476562, "global_step": 89733, "epoch": 1081} {"train_loss": -21.717182159423828, "global_step": 89734, "epoch": 1081} {"train_loss": -21.456628799438477, "global_step": 89735, "epoch": 1081} {"train_loss": -21.39288902282715, "global_step": 89736, "epoch": 1081} {"train_loss": -21.805540084838867, "global_step": 89737, "epoch": 1081} {"train_loss": -21.64115333557129, "global_step": 89738, "epoch": 1081} {"train_loss": -21.95120620727539, "global_step": 89739, "epoch": 1081} {"train_loss": -21.423349380493164, "global_step": 89740, "epoch": 1081} {"train_loss": -21.724700927734375, "global_step": 89741, "epoch": 1081} {"train_loss": -21.886199951171875, "global_step": 89742, "epoch": 1081} {"train_loss": -21.587064743041992, "global_step": 89743, "epoch": 1081} {"train_loss": -21.477920532226562, "global_step": 89744, "epoch": 1081} {"train_loss": -21.61515235900879, "global_step": 89745, "epoch": 1081} {"train_loss": -21.459901809692383, "global_step": 89746, "epoch": 1081} {"train_loss": -21.735790252685547, "global_step": 89747, "epoch": 1081} {"train_loss": -21.933063507080078, "global_step": 89748, "epoch": 1081} {"train_loss": -21.350305557250977, "global_step": 89749, "epoch": 1081} {"train_loss": -21.6859130859375, "global_step": 89750, "epoch": 1081} {"train_loss": -21.569427490234375, "global_step": 89751, "epoch": 1081} {"train_loss": -21.697965621948242, "global_step": 89752, "epoch": 1081} {"train_loss": -21.579486846923828, "global_step": 89753, "epoch": 1081} {"train_loss": -21.69053077697754, "global_step": 89754, "epoch": 1081} {"train_loss": -21.55293846130371, "global_step": 89755, "epoch": 1081} {"train_loss": -21.49110221862793, "global_step": 89756, "epoch": 1081} {"train_loss": -21.655519485473633, "global_step": 89757, "epoch": 1081} {"train_loss": -21.703536987304688, "global_step": 89758, "epoch": 1081} {"train_loss": -21.540653228759766, "global_step": 89759, "epoch": 1081} {"train_loss": -21.573598861694336, "global_step": 89760, "epoch": 1081} {"train_loss": -21.480587005615234, "global_step": 89761, "epoch": 1081} {"train_loss": -21.720136642456055, "global_step": 89762, "epoch": 1081} {"train_loss": -21.549713134765625, "global_step": 89763, "epoch": 1081} {"train_loss": -21.474266052246094, "global_step": 89764, "epoch": 1081} {"train_loss": -21.603740692138672, "global_step": 89765, "epoch": 1081} {"train_loss": -21.408985137939453, "global_step": 89766, "epoch": 1081} {"train_loss": -21.38775062561035, "global_step": 89767, "epoch": 1081} {"train_loss": -21.913965225219727, "global_step": 89768, "epoch": 1081} {"train_loss": -21.887601852416992, "global_step": 89769, "epoch": 1081} {"train_loss": -21.72859001159668, "global_step": 89770, "epoch": 1081} {"train_loss": -21.435781478881836, "global_step": 89771, "epoch": 1081} {"train_loss": -21.590688705444336, "global_step": 89772, "epoch": 1081} {"train_loss": -21.53388786315918, "global_step": 89773, "epoch": 1081} {"train_loss": -21.424671173095703, "global_step": 89774, "epoch": 1081} {"train_loss": -21.54327392578125, "global_step": 89775, "epoch": 1081} {"train_loss": -21.452417373657227, "global_step": 89776, "epoch": 1081} {"train_loss": -21.98090171813965, "global_step": 89777, "epoch": 1081} {"train_loss": -21.541120529174805, "global_step": 89778, "epoch": 1081} {"train_loss": -21.268354415893555, "global_step": 89779, "epoch": 1081} {"train_loss": -21.304401397705078, "global_step": 89780, "epoch": 1081} {"train_loss": -21.57834815979004, "global_step": 89781, "epoch": 1081} {"train_loss": -21.402915954589844, "global_step": 89782, "epoch": 1081} {"train_loss": -21.85634422302246, "global_step": 89783, "epoch": 1081} {"train_loss": -21.50694465637207, "global_step": 89784, "epoch": 1081} {"train_loss": -21.790063858032227, "global_step": 89785, "epoch": 1081} {"train_loss": -22.011465072631836, "global_step": 89786, "epoch": 1081} {"train_loss": -21.36592674255371, "global_step": 89787, "epoch": 1081} {"train_loss": -21.5406436920166, "global_step": 89788, "epoch": 1081} {"train_loss": -21.802059173583984, "global_step": 89789, "epoch": 1081} {"train_loss": -22.073144912719727, "global_step": 89790, "epoch": 1081} {"train_loss": -21.765979766845703, "global_step": 89791, "epoch": 1081} {"train_loss": -21.78801727294922, "global_step": 89792, "epoch": 1081} {"train_loss": -21.6960506439209, "global_step": 89793, "epoch": 1081} {"train_loss": -21.977476119995117, "global_step": 89794, "epoch": 1081} {"train_loss": -21.746313095092773, "global_step": 89795, "epoch": 1081} {"train_loss": -21.95197105407715, "global_step": 89796, "epoch": 1081} {"train_loss": -21.570451736450195, "global_step": 89797, "epoch": 1081} {"train_loss": -21.26548194885254, "global_step": 89798, "epoch": 1081} {"train_loss": -21.472742080688477, "global_step": 89799, "epoch": 1081} {"train_loss": -22.041458129882812, "global_step": 89800, "epoch": 1081} {"train_loss": -21.520618438720703, "global_step": 89801, "epoch": 1081} {"train_loss": -21.428939819335938, "global_step": 89802, "epoch": 1081} {"train_loss": -21.689950942993164, "global_step": 89803, "epoch": 1081} {"train_loss": -21.324228286743164, "global_step": 89804, "epoch": 1081} {"train_loss": -21.607082757605127, "global_step": 89805, "epoch": 1081, "val_loss": 5956691.0} {"train_loss": -20.875490188598633, "global_step": 89806, "epoch": 1082} {"train_loss": -20.721054077148438, "global_step": 89807, "epoch": 1082} {"train_loss": -21.232559204101562, "global_step": 89808, "epoch": 1082} {"train_loss": -20.99351692199707, "global_step": 89809, "epoch": 1082} {"train_loss": -21.121105194091797, "global_step": 89810, "epoch": 1082} {"train_loss": -21.38910484313965, "global_step": 89811, "epoch": 1082} {"train_loss": -21.40180015563965, "global_step": 89812, "epoch": 1082} {"train_loss": -21.401029586791992, "global_step": 89813, "epoch": 1082} {"train_loss": -21.647079467773438, "global_step": 89814, "epoch": 1082} {"train_loss": -21.659099578857422, "global_step": 89815, "epoch": 1082} {"train_loss": -21.6600399017334, "global_step": 89816, "epoch": 1082} {"train_loss": -21.358339309692383, "global_step": 89817, "epoch": 1082} {"train_loss": -21.6981201171875, "global_step": 89818, "epoch": 1082} {"train_loss": -21.896223068237305, "global_step": 89819, "epoch": 1082} {"train_loss": -21.747739791870117, "global_step": 89820, "epoch": 1082} {"train_loss": -21.69044303894043, "global_step": 89821, "epoch": 1082} {"train_loss": -21.335615158081055, "global_step": 89822, "epoch": 1082} {"train_loss": -21.64809226989746, "global_step": 89823, "epoch": 1082} {"train_loss": -21.549022674560547, "global_step": 89824, "epoch": 1082} {"train_loss": -21.336746215820312, "global_step": 89825, "epoch": 1082} {"train_loss": -21.9127254486084, "global_step": 89826, "epoch": 1082} {"train_loss": -21.453882217407227, "global_step": 89827, "epoch": 1082} {"train_loss": -21.320127487182617, "global_step": 89828, "epoch": 1082} {"train_loss": -21.2879638671875, "global_step": 89829, "epoch": 1082} {"train_loss": -21.614004135131836, "global_step": 89830, "epoch": 1082} {"train_loss": -21.847980499267578, "global_step": 89831, "epoch": 1082} {"train_loss": -21.5360050201416, "global_step": 89832, "epoch": 1082} {"train_loss": -21.426166534423828, "global_step": 89833, "epoch": 1082} {"train_loss": -21.803058624267578, "global_step": 89834, "epoch": 1082} {"train_loss": -21.619375228881836, "global_step": 89835, "epoch": 1082} {"train_loss": -21.395492553710938, "global_step": 89836, "epoch": 1082} {"train_loss": -21.592588424682617, "global_step": 89837, "epoch": 1082} {"train_loss": -21.948087692260742, "global_step": 89838, "epoch": 1082} {"train_loss": -21.870681762695312, "global_step": 89839, "epoch": 1082} {"train_loss": -21.459131240844727, "global_step": 89840, "epoch": 1082} {"train_loss": -21.493911743164062, "global_step": 89841, "epoch": 1082} {"train_loss": -21.77318000793457, "global_step": 89842, "epoch": 1082} {"train_loss": -21.586149215698242, "global_step": 89843, "epoch": 1082} {"train_loss": -21.706588745117188, "global_step": 89844, "epoch": 1082} {"train_loss": -21.772306442260742, "global_step": 89845, "epoch": 1082} {"train_loss": -21.58795738220215, "global_step": 89846, "epoch": 1082} {"train_loss": -21.510610580444336, "global_step": 89847, "epoch": 1082} {"train_loss": -22.102706909179688, "global_step": 89848, "epoch": 1082} {"train_loss": -21.297119140625, "global_step": 89849, "epoch": 1082} {"train_loss": -21.237754821777344, "global_step": 89850, "epoch": 1082} {"train_loss": -21.536108016967773, "global_step": 89851, "epoch": 1082} {"train_loss": -21.43754005432129, "global_step": 89852, "epoch": 1082} {"train_loss": -21.317564010620117, "global_step": 89853, "epoch": 1082} {"train_loss": -21.91237449645996, "global_step": 89854, "epoch": 1082} {"train_loss": -21.492401123046875, "global_step": 89855, "epoch": 1082} {"train_loss": -21.52265739440918, "global_step": 89856, "epoch": 1082} {"train_loss": -21.44008445739746, "global_step": 89857, "epoch": 1082} {"train_loss": -21.28763771057129, "global_step": 89858, "epoch": 1082} {"train_loss": -21.498050689697266, "global_step": 89859, "epoch": 1082} {"train_loss": -21.87623405456543, "global_step": 89860, "epoch": 1082} {"train_loss": -21.739858627319336, "global_step": 89861, "epoch": 1082} {"train_loss": -21.303205490112305, "global_step": 89862, "epoch": 1082} {"train_loss": -22.141645431518555, "global_step": 89863, "epoch": 1082} {"train_loss": -21.4365177154541, "global_step": 89864, "epoch": 1082} {"train_loss": -21.352325439453125, "global_step": 89865, "epoch": 1082} {"train_loss": -21.52308464050293, "global_step": 89866, "epoch": 1082} {"train_loss": -21.553386688232422, "global_step": 89867, "epoch": 1082} {"train_loss": -21.408300399780273, "global_step": 89868, "epoch": 1082} {"train_loss": -21.23479652404785, "global_step": 89869, "epoch": 1082} {"train_loss": -21.4249267578125, "global_step": 89870, "epoch": 1082} {"train_loss": -21.341934204101562, "global_step": 89871, "epoch": 1082} {"train_loss": -21.666067123413086, "global_step": 89872, "epoch": 1082} {"train_loss": -21.480716705322266, "global_step": 89873, "epoch": 1082} {"train_loss": -22.02174949645996, "global_step": 89874, "epoch": 1082} {"train_loss": -21.340662002563477, "global_step": 89875, "epoch": 1082} {"train_loss": -21.57744598388672, "global_step": 89876, "epoch": 1082} {"train_loss": -21.747848510742188, "global_step": 89877, "epoch": 1082} {"train_loss": -21.50257682800293, "global_step": 89878, "epoch": 1082} {"train_loss": -21.525007247924805, "global_step": 89879, "epoch": 1082} {"train_loss": -21.21780776977539, "global_step": 89880, "epoch": 1082} {"train_loss": -21.292469024658203, "global_step": 89881, "epoch": 1082} {"train_loss": -21.258153915405273, "global_step": 89882, "epoch": 1082} {"train_loss": -21.331899642944336, "global_step": 89883, "epoch": 1082} {"train_loss": -21.33245849609375, "global_step": 89884, "epoch": 1082} {"train_loss": -21.506826400756836, "global_step": 89885, "epoch": 1082} {"train_loss": -21.754657745361328, "global_step": 89886, "epoch": 1082} {"train_loss": -21.602294921875, "global_step": 89887, "epoch": 1082} {"train_loss": -21.530598996633508, "global_step": 89888, "epoch": 1082, "val_loss": 6040768.0} {"train_loss": -21.392059326171875, "global_step": 89889, "epoch": 1083} {"train_loss": -21.255151748657227, "global_step": 89890, "epoch": 1083} {"train_loss": -21.2634334564209, "global_step": 89891, "epoch": 1083} {"train_loss": -21.46293067932129, "global_step": 89892, "epoch": 1083} {"train_loss": -20.86185073852539, "global_step": 89893, "epoch": 1083} {"train_loss": -20.999217987060547, "global_step": 89894, "epoch": 1083} {"train_loss": -21.31097412109375, "global_step": 89895, "epoch": 1083} {"train_loss": -21.31015396118164, "global_step": 89896, "epoch": 1083} {"train_loss": -21.818517684936523, "global_step": 89897, "epoch": 1083} {"train_loss": -21.299041748046875, "global_step": 89898, "epoch": 1083} {"train_loss": -21.471485137939453, "global_step": 89899, "epoch": 1083} {"train_loss": -21.455224990844727, "global_step": 89900, "epoch": 1083} {"train_loss": -21.857406616210938, "global_step": 89901, "epoch": 1083} {"train_loss": -21.498889923095703, "global_step": 89902, "epoch": 1083} {"train_loss": -21.469388961791992, "global_step": 89903, "epoch": 1083} {"train_loss": -21.386804580688477, "global_step": 89904, "epoch": 1083} {"train_loss": -21.348546981811523, "global_step": 89905, "epoch": 1083} {"train_loss": -21.027170181274414, "global_step": 89906, "epoch": 1083} {"train_loss": -21.413557052612305, "global_step": 89907, "epoch": 1083} {"train_loss": -21.62468910217285, "global_step": 89908, "epoch": 1083} {"train_loss": -21.773601531982422, "global_step": 89909, "epoch": 1083} {"train_loss": -21.661096572875977, "global_step": 89910, "epoch": 1083} {"train_loss": -21.231359481811523, "global_step": 89911, "epoch": 1083} {"train_loss": -21.51543617248535, "global_step": 89912, "epoch": 1083} {"train_loss": -22.034231185913086, "global_step": 89913, "epoch": 1083} {"train_loss": -21.4726619720459, "global_step": 89914, "epoch": 1083} {"train_loss": -21.74934196472168, "global_step": 89915, "epoch": 1083} {"train_loss": -21.36322021484375, "global_step": 89916, "epoch": 1083} {"train_loss": -21.566341400146484, "global_step": 89917, "epoch": 1083} {"train_loss": -21.412521362304688, "global_step": 89918, "epoch": 1083} {"train_loss": -21.823637008666992, "global_step": 89919, "epoch": 1083} {"train_loss": -21.7369327545166, "global_step": 89920, "epoch": 1083} {"train_loss": -22.01447296142578, "global_step": 89921, "epoch": 1083} {"train_loss": -21.512197494506836, "global_step": 89922, "epoch": 1083} {"train_loss": -21.571924209594727, "global_step": 89923, "epoch": 1083} {"train_loss": -21.36750602722168, "global_step": 89924, "epoch": 1083} {"train_loss": -21.62117576599121, "global_step": 89925, "epoch": 1083} {"train_loss": -21.572912216186523, "global_step": 89926, "epoch": 1083} {"train_loss": -21.827383041381836, "global_step": 89927, "epoch": 1083} {"train_loss": -21.368745803833008, "global_step": 89928, "epoch": 1083} {"train_loss": -21.548633575439453, "global_step": 89929, "epoch": 1083} {"train_loss": -21.13572883605957, "global_step": 89930, "epoch": 1083} {"train_loss": -21.62771224975586, "global_step": 89931, "epoch": 1083} {"train_loss": -21.537256240844727, "global_step": 89932, "epoch": 1083} {"train_loss": -21.46058464050293, "global_step": 89933, "epoch": 1083} {"train_loss": -20.921451568603516, "global_step": 89934, "epoch": 1083} {"train_loss": -21.707075119018555, "global_step": 89935, "epoch": 1083} {"train_loss": -21.632492065429688, "global_step": 89936, "epoch": 1083} {"train_loss": -21.612503051757812, "global_step": 89937, "epoch": 1083} {"train_loss": -21.456619262695312, "global_step": 89938, "epoch": 1083} {"train_loss": -21.716388702392578, "global_step": 89939, "epoch": 1083} {"train_loss": -21.96561050415039, "global_step": 89940, "epoch": 1083} {"train_loss": -22.033157348632812, "global_step": 89941, "epoch": 1083} {"train_loss": -21.77996253967285, "global_step": 89942, "epoch": 1083} {"train_loss": -21.290372848510742, "global_step": 89943, "epoch": 1083} {"train_loss": -21.831655502319336, "global_step": 89944, "epoch": 1083} {"train_loss": -21.271299362182617, "global_step": 89945, "epoch": 1083} {"train_loss": -21.843570709228516, "global_step": 89946, "epoch": 1083} {"train_loss": -21.939655303955078, "global_step": 89947, "epoch": 1083} {"train_loss": -21.33974838256836, "global_step": 89948, "epoch": 1083} {"train_loss": -21.792926788330078, "global_step": 89949, "epoch": 1083} {"train_loss": -21.386428833007812, "global_step": 89950, "epoch": 1083} {"train_loss": -21.866910934448242, "global_step": 89951, "epoch": 1083} {"train_loss": -21.874929428100586, "global_step": 89952, "epoch": 1083} {"train_loss": -22.004106521606445, "global_step": 89953, "epoch": 1083} {"train_loss": -21.53446388244629, "global_step": 89954, "epoch": 1083} {"train_loss": -21.589569091796875, "global_step": 89955, "epoch": 1083} {"train_loss": -21.715951919555664, "global_step": 89956, "epoch": 1083} {"train_loss": -21.51940155029297, "global_step": 89957, "epoch": 1083} {"train_loss": -21.830224990844727, "global_step": 89958, "epoch": 1083} {"train_loss": -21.693998336791992, "global_step": 89959, "epoch": 1083} {"train_loss": -21.41303253173828, "global_step": 89960, "epoch": 1083} {"train_loss": -22.156604766845703, "global_step": 89961, "epoch": 1083} {"train_loss": -21.409765243530273, "global_step": 89962, "epoch": 1083} {"train_loss": -21.369564056396484, "global_step": 89963, "epoch": 1083} {"train_loss": -21.305988311767578, "global_step": 89964, "epoch": 1083} {"train_loss": -21.610063552856445, "global_step": 89965, "epoch": 1083} {"train_loss": -21.03923988342285, "global_step": 89966, "epoch": 1083} {"train_loss": -21.382604598999023, "global_step": 89967, "epoch": 1083} {"train_loss": -21.745046615600586, "global_step": 89968, "epoch": 1083} {"train_loss": -21.639795303344727, "global_step": 89969, "epoch": 1083} {"train_loss": -21.223112106323242, "global_step": 89970, "epoch": 1083} {"train_loss": -21.538902880197547, "global_step": 89971, "epoch": 1083, "val_loss": 6076649.0} {"train_loss": -21.061357498168945, "global_step": 89972, "epoch": 1084} {"train_loss": -21.040647506713867, "global_step": 89973, "epoch": 1084} {"train_loss": -20.643644332885742, "global_step": 89974, "epoch": 1084} {"train_loss": -20.528182983398438, "global_step": 89975, "epoch": 1084} {"train_loss": -21.185529708862305, "global_step": 89976, "epoch": 1084} {"train_loss": -21.02595329284668, "global_step": 89977, "epoch": 1084} {"train_loss": -20.97369384765625, "global_step": 89978, "epoch": 1084} {"train_loss": -21.354537963867188, "global_step": 89979, "epoch": 1084} {"train_loss": -21.12183952331543, "global_step": 89980, "epoch": 1084} {"train_loss": -21.43267059326172, "global_step": 89981, "epoch": 1084} {"train_loss": -21.257261276245117, "global_step": 89982, "epoch": 1084} {"train_loss": -21.342876434326172, "global_step": 89983, "epoch": 1084} {"train_loss": -21.376996994018555, "global_step": 89984, "epoch": 1084} {"train_loss": -21.54120445251465, "global_step": 89985, "epoch": 1084} {"train_loss": -21.29913902282715, "global_step": 89986, "epoch": 1084} {"train_loss": -21.47504425048828, "global_step": 89987, "epoch": 1084} {"train_loss": -21.457910537719727, "global_step": 89988, "epoch": 1084} {"train_loss": -21.407522201538086, "global_step": 89989, "epoch": 1084} {"train_loss": -21.310195922851562, "global_step": 89990, "epoch": 1084} {"train_loss": -21.357458114624023, "global_step": 89991, "epoch": 1084} {"train_loss": -21.7014217376709, "global_step": 89992, "epoch": 1084} {"train_loss": -21.438629150390625, "global_step": 89993, "epoch": 1084} {"train_loss": -21.415311813354492, "global_step": 89994, "epoch": 1084} {"train_loss": -21.54656410217285, "global_step": 89995, "epoch": 1084} {"train_loss": -21.635547637939453, "global_step": 89996, "epoch": 1084} {"train_loss": -21.6267147064209, "global_step": 89997, "epoch": 1084} {"train_loss": -21.491743087768555, "global_step": 89998, "epoch": 1084} {"train_loss": -21.495100021362305, "global_step": 89999, "epoch": 1084} {"train_loss": -21.74871253967285, "global_step": 90000, "epoch": 1084} {"train_loss": -21.5769100189209, "global_step": 90001, "epoch": 1084} {"train_loss": -21.766904830932617, "global_step": 90002, "epoch": 1084} {"train_loss": -21.68906021118164, "global_step": 90003, "epoch": 1084} {"train_loss": -22.029388427734375, "global_step": 90004, "epoch": 1084} {"train_loss": -21.370344161987305, "global_step": 90005, "epoch": 1084} {"train_loss": -21.525548934936523, "global_step": 90006, "epoch": 1084} {"train_loss": -21.524927139282227, "global_step": 90007, "epoch": 1084} {"train_loss": -21.312589645385742, "global_step": 90008, "epoch": 1084} {"train_loss": -21.710390090942383, "global_step": 90009, "epoch": 1084} {"train_loss": -21.591886520385742, "global_step": 90010, "epoch": 1084} {"train_loss": -21.921857833862305, "global_step": 90011, "epoch": 1084} {"train_loss": -21.274314880371094, "global_step": 90012, "epoch": 1084} {"train_loss": -21.3612060546875, "global_step": 90013, "epoch": 1084} {"train_loss": -21.55435562133789, "global_step": 90014, "epoch": 1084} {"train_loss": -21.627939224243164, "global_step": 90015, "epoch": 1084} {"train_loss": -21.37229347229004, "global_step": 90016, "epoch": 1084} {"train_loss": -21.508996963500977, "global_step": 90017, "epoch": 1084} {"train_loss": -21.173364639282227, "global_step": 90018, "epoch": 1084} {"train_loss": -21.737401962280273, "global_step": 90019, "epoch": 1084} {"train_loss": -21.415185928344727, "global_step": 90020, "epoch": 1084} {"train_loss": -21.617755889892578, "global_step": 90021, "epoch": 1084} {"train_loss": -21.26764488220215, "global_step": 90022, "epoch": 1084} {"train_loss": -21.514921188354492, "global_step": 90023, "epoch": 1084} {"train_loss": -21.476957321166992, "global_step": 90024, "epoch": 1084} {"train_loss": -21.473840713500977, "global_step": 90025, "epoch": 1084} {"train_loss": -21.64217185974121, "global_step": 90026, "epoch": 1084} {"train_loss": -21.558229446411133, "global_step": 90027, "epoch": 1084} {"train_loss": -21.490320205688477, "global_step": 90028, "epoch": 1084} {"train_loss": -21.353668212890625, "global_step": 90029, "epoch": 1084} {"train_loss": -21.476713180541992, "global_step": 90030, "epoch": 1084} {"train_loss": -21.38337516784668, "global_step": 90031, "epoch": 1084} {"train_loss": -21.210067749023438, "global_step": 90032, "epoch": 1084} {"train_loss": -21.652565002441406, "global_step": 90033, "epoch": 1084} {"train_loss": -21.502796173095703, "global_step": 90034, "epoch": 1084} {"train_loss": -21.415348052978516, "global_step": 90035, "epoch": 1084} {"train_loss": -21.55129051208496, "global_step": 90036, "epoch": 1084} {"train_loss": -21.745641708374023, "global_step": 90037, "epoch": 1084} {"train_loss": -21.620023727416992, "global_step": 90038, "epoch": 1084} {"train_loss": -21.734331130981445, "global_step": 90039, "epoch": 1084} {"train_loss": -21.496545791625977, "global_step": 90040, "epoch": 1084} {"train_loss": -21.758459091186523, "global_step": 90041, "epoch": 1084} {"train_loss": -21.257394790649414, "global_step": 90042, "epoch": 1084} {"train_loss": -21.745418548583984, "global_step": 90043, "epoch": 1084} {"train_loss": -21.642187118530273, "global_step": 90044, "epoch": 1084} {"train_loss": -21.468061447143555, "global_step": 90045, "epoch": 1084} {"train_loss": -21.572582244873047, "global_step": 90046, "epoch": 1084} {"train_loss": -21.53227996826172, "global_step": 90047, "epoch": 1084} {"train_loss": -21.48509407043457, "global_step": 90048, "epoch": 1084} {"train_loss": -21.67292594909668, "global_step": 90049, "epoch": 1084} {"train_loss": -21.723831176757812, "global_step": 90050, "epoch": 1084} {"train_loss": -21.740997314453125, "global_step": 90051, "epoch": 1084} {"train_loss": -21.47747230529785, "global_step": 90052, "epoch": 1084} {"train_loss": -21.402515411376953, "global_step": 90053, "epoch": 1084} {"train_loss": -21.476455022053546, "global_step": 90054, "epoch": 1084, "val_loss": 6141346.0} {"train_loss": -21.338245391845703, "global_step": 90055, "epoch": 1085} {"train_loss": -21.365989685058594, "global_step": 90056, "epoch": 1085} {"train_loss": -21.459436416625977, "global_step": 90057, "epoch": 1085} {"train_loss": -21.718324661254883, "global_step": 90058, "epoch": 1085} {"train_loss": -21.40210723876953, "global_step": 90059, "epoch": 1085} {"train_loss": -21.10407066345215, "global_step": 90060, "epoch": 1085} {"train_loss": -21.439863204956055, "global_step": 90061, "epoch": 1085} {"train_loss": -20.89284324645996, "global_step": 90062, "epoch": 1085} {"train_loss": -21.59092140197754, "global_step": 90063, "epoch": 1085} {"train_loss": -21.257047653198242, "global_step": 90064, "epoch": 1085} {"train_loss": -21.118896484375, "global_step": 90065, "epoch": 1085} {"train_loss": -21.451204299926758, "global_step": 90066, "epoch": 1085} {"train_loss": -21.866779327392578, "global_step": 90067, "epoch": 1085} {"train_loss": -21.3123722076416, "global_step": 90068, "epoch": 1085} {"train_loss": -21.834095001220703, "global_step": 90069, "epoch": 1085} {"train_loss": -21.39097023010254, "global_step": 90070, "epoch": 1085} {"train_loss": -21.435791015625, "global_step": 90071, "epoch": 1085} {"train_loss": -21.80219841003418, "global_step": 90072, "epoch": 1085} {"train_loss": -21.521926879882812, "global_step": 90073, "epoch": 1085} {"train_loss": -21.35504150390625, "global_step": 90074, "epoch": 1085} {"train_loss": -21.67035484313965, "global_step": 90075, "epoch": 1085} {"train_loss": -21.619918823242188, "global_step": 90076, "epoch": 1085} {"train_loss": -21.724451065063477, "global_step": 90077, "epoch": 1085} {"train_loss": -21.146915435791016, "global_step": 90078, "epoch": 1085} {"train_loss": -21.945693969726562, "global_step": 90079, "epoch": 1085} {"train_loss": -21.674907684326172, "global_step": 90080, "epoch": 1085} {"train_loss": -21.47393798828125, "global_step": 90081, "epoch": 1085} {"train_loss": -21.513879776000977, "global_step": 90082, "epoch": 1085} {"train_loss": -21.545217514038086, "global_step": 90083, "epoch": 1085} {"train_loss": -21.76602554321289, "global_step": 90084, "epoch": 1085} {"train_loss": -21.64539909362793, "global_step": 90085, "epoch": 1085} {"train_loss": -21.706966400146484, "global_step": 90086, "epoch": 1085} {"train_loss": -21.957050323486328, "global_step": 90087, "epoch": 1085} {"train_loss": -21.334287643432617, "global_step": 90088, "epoch": 1085} {"train_loss": -21.553495407104492, "global_step": 90089, "epoch": 1085} {"train_loss": -21.661481857299805, "global_step": 90090, "epoch": 1085} {"train_loss": -21.42580795288086, "global_step": 90091, "epoch": 1085} {"train_loss": -21.45844841003418, "global_step": 90092, "epoch": 1085} {"train_loss": -21.19466781616211, "global_step": 90093, "epoch": 1085} {"train_loss": -21.444772720336914, "global_step": 90094, "epoch": 1085} {"train_loss": -21.684635162353516, "global_step": 90095, "epoch": 1085} {"train_loss": -21.8190975189209, "global_step": 90096, "epoch": 1085} {"train_loss": -21.461347579956055, "global_step": 90097, "epoch": 1085} {"train_loss": -21.66599464416504, "global_step": 90098, "epoch": 1085} {"train_loss": -21.503196716308594, "global_step": 90099, "epoch": 1085} {"train_loss": -21.366966247558594, "global_step": 90100, "epoch": 1085} {"train_loss": -21.51620864868164, "global_step": 90101, "epoch": 1085} {"train_loss": -21.58658218383789, "global_step": 90102, "epoch": 1085} {"train_loss": -21.771411895751953, "global_step": 90103, "epoch": 1085} {"train_loss": -21.459623336791992, "global_step": 90104, "epoch": 1085} {"train_loss": -21.370458602905273, "global_step": 90105, "epoch": 1085} {"train_loss": -21.431011199951172, "global_step": 90106, "epoch": 1085} {"train_loss": -21.817474365234375, "global_step": 90107, "epoch": 1085} {"train_loss": -21.47381591796875, "global_step": 90108, "epoch": 1085} {"train_loss": -21.905759811401367, "global_step": 90109, "epoch": 1085} {"train_loss": -21.54158592224121, "global_step": 90110, "epoch": 1085} {"train_loss": -21.45058250427246, "global_step": 90111, "epoch": 1085} {"train_loss": -21.607664108276367, "global_step": 90112, "epoch": 1085} {"train_loss": -21.79728126525879, "global_step": 90113, "epoch": 1085} {"train_loss": -21.403512954711914, "global_step": 90114, "epoch": 1085} {"train_loss": -21.562702178955078, "global_step": 90115, "epoch": 1085} {"train_loss": -21.478254318237305, "global_step": 90116, "epoch": 1085} {"train_loss": -22.02813148498535, "global_step": 90117, "epoch": 1085} {"train_loss": -21.731399536132812, "global_step": 90118, "epoch": 1085} {"train_loss": -21.594270706176758, "global_step": 90119, "epoch": 1085} {"train_loss": -21.96248435974121, "global_step": 90120, "epoch": 1085} {"train_loss": -21.514341354370117, "global_step": 90121, "epoch": 1085} {"train_loss": -21.73531723022461, "global_step": 90122, "epoch": 1085} {"train_loss": -21.77314567565918, "global_step": 90123, "epoch": 1085} {"train_loss": -21.79664421081543, "global_step": 90124, "epoch": 1085} {"train_loss": -22.263975143432617, "global_step": 90125, "epoch": 1085} {"train_loss": -21.77168083190918, "global_step": 90126, "epoch": 1085} {"train_loss": -21.637195587158203, "global_step": 90127, "epoch": 1085} {"train_loss": -21.577564239501953, "global_step": 90128, "epoch": 1085} {"train_loss": -21.46766471862793, "global_step": 90129, "epoch": 1085} {"train_loss": -21.5827693939209, "global_step": 90130, "epoch": 1085} {"train_loss": -21.48061180114746, "global_step": 90131, "epoch": 1085} {"train_loss": -21.4958553314209, "global_step": 90132, "epoch": 1085} {"train_loss": -21.732351303100586, "global_step": 90133, "epoch": 1085} {"train_loss": -21.879850387573242, "global_step": 90134, "epoch": 1085} {"train_loss": -21.893966674804688, "global_step": 90135, "epoch": 1085} {"train_loss": -21.844375610351562, "global_step": 90136, "epoch": 1085} {"train_loss": -21.573592680046357, "global_step": 90137, "epoch": 1085, "val_loss": 6336575.5} {"train_loss": -20.890470504760742, "global_step": 90138, "epoch": 1086} {"train_loss": -20.59708595275879, "global_step": 90139, "epoch": 1086} {"train_loss": -21.01470375061035, "global_step": 90140, "epoch": 1086} {"train_loss": -20.794147491455078, "global_step": 90141, "epoch": 1086} {"train_loss": -21.420286178588867, "global_step": 90142, "epoch": 1086} {"train_loss": -21.310693740844727, "global_step": 90143, "epoch": 1086} {"train_loss": -21.25872230529785, "global_step": 90144, "epoch": 1086} {"train_loss": -21.703596115112305, "global_step": 90145, "epoch": 1086} {"train_loss": -21.096418380737305, "global_step": 90146, "epoch": 1086} {"train_loss": -20.904632568359375, "global_step": 90147, "epoch": 1086} {"train_loss": -21.2308349609375, "global_step": 90148, "epoch": 1086} {"train_loss": -21.171720504760742, "global_step": 90149, "epoch": 1086} {"train_loss": -21.414306640625, "global_step": 90150, "epoch": 1086} {"train_loss": -21.44184684753418, "global_step": 90151, "epoch": 1086} {"train_loss": -21.41926383972168, "global_step": 90152, "epoch": 1086} {"train_loss": -21.872835159301758, "global_step": 90153, "epoch": 1086} {"train_loss": -21.406545639038086, "global_step": 90154, "epoch": 1086} {"train_loss": -21.13042640686035, "global_step": 90155, "epoch": 1086} {"train_loss": -21.362916946411133, "global_step": 90156, "epoch": 1086} {"train_loss": -21.302175521850586, "global_step": 90157, "epoch": 1086} {"train_loss": -21.364410400390625, "global_step": 90158, "epoch": 1086} {"train_loss": -21.552579879760742, "global_step": 90159, "epoch": 1086} {"train_loss": -21.639501571655273, "global_step": 90160, "epoch": 1086} {"train_loss": -21.638961791992188, "global_step": 90161, "epoch": 1086} {"train_loss": -21.629072189331055, "global_step": 90162, "epoch": 1086} {"train_loss": -21.265226364135742, "global_step": 90163, "epoch": 1086} {"train_loss": -21.41253089904785, "global_step": 90164, "epoch": 1086} {"train_loss": -21.699636459350586, "global_step": 90165, "epoch": 1086} {"train_loss": -21.515073776245117, "global_step": 90166, "epoch": 1086} {"train_loss": -21.331335067749023, "global_step": 90167, "epoch": 1086} {"train_loss": -21.805410385131836, "global_step": 90168, "epoch": 1086} {"train_loss": -21.389841079711914, "global_step": 90169, "epoch": 1086} {"train_loss": -21.430490493774414, "global_step": 90170, "epoch": 1086} {"train_loss": -21.416555404663086, "global_step": 90171, "epoch": 1086} {"train_loss": -21.801137924194336, "global_step": 90172, "epoch": 1086} {"train_loss": -22.09584617614746, "global_step": 90173, "epoch": 1086} {"train_loss": -21.594249725341797, "global_step": 90174, "epoch": 1086} {"train_loss": -21.206418991088867, "global_step": 90175, "epoch": 1086} {"train_loss": -21.163909912109375, "global_step": 90176, "epoch": 1086} {"train_loss": -21.66002082824707, "global_step": 90177, "epoch": 1086} {"train_loss": -21.572725296020508, "global_step": 90178, "epoch": 1086} {"train_loss": -21.697011947631836, "global_step": 90179, "epoch": 1086} {"train_loss": -21.670190811157227, "global_step": 90180, "epoch": 1086} {"train_loss": -21.506746292114258, "global_step": 90181, "epoch": 1086} {"train_loss": -21.86187744140625, "global_step": 90182, "epoch": 1086} {"train_loss": -21.383533477783203, "global_step": 90183, "epoch": 1086} {"train_loss": -21.504262924194336, "global_step": 90184, "epoch": 1086} {"train_loss": -21.58493423461914, "global_step": 90185, "epoch": 1086} {"train_loss": -21.4168643951416, "global_step": 90186, "epoch": 1086} {"train_loss": -21.723020553588867, "global_step": 90187, "epoch": 1086} {"train_loss": -21.553955078125, "global_step": 90188, "epoch": 1086} {"train_loss": -21.810747146606445, "global_step": 90189, "epoch": 1086} {"train_loss": -21.69862937927246, "global_step": 90190, "epoch": 1086} {"train_loss": -21.75835609436035, "global_step": 90191, "epoch": 1086} {"train_loss": -21.617515563964844, "global_step": 90192, "epoch": 1086} {"train_loss": -21.554340362548828, "global_step": 90193, "epoch": 1086} {"train_loss": -21.771366119384766, "global_step": 90194, "epoch": 1086} {"train_loss": -21.38419532775879, "global_step": 90195, "epoch": 1086} {"train_loss": -21.595918655395508, "global_step": 90196, "epoch": 1086} {"train_loss": -21.709537506103516, "global_step": 90197, "epoch": 1086} {"train_loss": -21.6385498046875, "global_step": 90198, "epoch": 1086} {"train_loss": -21.585674285888672, "global_step": 90199, "epoch": 1086} {"train_loss": -21.941913604736328, "global_step": 90200, "epoch": 1086} {"train_loss": -21.77059555053711, "global_step": 90201, "epoch": 1086} {"train_loss": -21.386823654174805, "global_step": 90202, "epoch": 1086} {"train_loss": -21.715747833251953, "global_step": 90203, "epoch": 1086} {"train_loss": -21.561445236206055, "global_step": 90204, "epoch": 1086} {"train_loss": -21.9361572265625, "global_step": 90205, "epoch": 1086} {"train_loss": -21.34047508239746, "global_step": 90206, "epoch": 1086} {"train_loss": -21.694059371948242, "global_step": 90207, "epoch": 1086} {"train_loss": -21.475282669067383, "global_step": 90208, "epoch": 1086} {"train_loss": -21.452842712402344, "global_step": 90209, "epoch": 1086} {"train_loss": -21.752634048461914, "global_step": 90210, "epoch": 1086} {"train_loss": -21.67023277282715, "global_step": 90211, "epoch": 1086} {"train_loss": -21.594419479370117, "global_step": 90212, "epoch": 1086} {"train_loss": -21.3909854888916, "global_step": 90213, "epoch": 1086} {"train_loss": -21.158170700073242, "global_step": 90214, "epoch": 1086} {"train_loss": -21.62666893005371, "global_step": 90215, "epoch": 1086} {"train_loss": -21.20187759399414, "global_step": 90216, "epoch": 1086} {"train_loss": -21.585472106933594, "global_step": 90217, "epoch": 1086} {"train_loss": -21.7796630859375, "global_step": 90218, "epoch": 1086} {"train_loss": -21.238954544067383, "global_step": 90219, "epoch": 1086} {"train_loss": -21.492134737681194, "global_step": 90220, "epoch": 1086, "val_loss": 6031405.5} {"train_loss": -21.162372589111328, "global_step": 90221, "epoch": 1087} {"train_loss": -20.530811309814453, "global_step": 90222, "epoch": 1087} {"train_loss": -20.951868057250977, "global_step": 90223, "epoch": 1087} {"train_loss": -20.6528263092041, "global_step": 90224, "epoch": 1087} {"train_loss": -21.269556045532227, "global_step": 90225, "epoch": 1087} {"train_loss": -21.084074020385742, "global_step": 90226, "epoch": 1087} {"train_loss": -21.03065299987793, "global_step": 90227, "epoch": 1087} {"train_loss": -21.592456817626953, "global_step": 90228, "epoch": 1087} {"train_loss": -21.05489158630371, "global_step": 90229, "epoch": 1087} {"train_loss": -21.18403434753418, "global_step": 90230, "epoch": 1087} {"train_loss": -20.873300552368164, "global_step": 90231, "epoch": 1087} {"train_loss": -21.532028198242188, "global_step": 90232, "epoch": 1087} {"train_loss": -21.096052169799805, "global_step": 90233, "epoch": 1087} {"train_loss": -20.914457321166992, "global_step": 90234, "epoch": 1087} {"train_loss": -21.302072525024414, "global_step": 90235, "epoch": 1087} {"train_loss": -21.521059036254883, "global_step": 90236, "epoch": 1087} {"train_loss": -21.585987091064453, "global_step": 90237, "epoch": 1087} {"train_loss": -21.80230712890625, "global_step": 90238, "epoch": 1087} {"train_loss": -21.705982208251953, "global_step": 90239, "epoch": 1087} {"train_loss": -21.67159080505371, "global_step": 90240, "epoch": 1087} {"train_loss": -21.703092575073242, "global_step": 90241, "epoch": 1087} {"train_loss": -21.585514068603516, "global_step": 90242, "epoch": 1087} {"train_loss": -21.670459747314453, "global_step": 90243, "epoch": 1087} {"train_loss": -21.579727172851562, "global_step": 90244, "epoch": 1087} {"train_loss": -21.757863998413086, "global_step": 90245, "epoch": 1087} {"train_loss": -21.622827529907227, "global_step": 90246, "epoch": 1087} {"train_loss": -21.262516021728516, "global_step": 90247, "epoch": 1087} {"train_loss": -21.427953720092773, "global_step": 90248, "epoch": 1087} {"train_loss": -21.49347496032715, "global_step": 90249, "epoch": 1087} {"train_loss": -21.611608505249023, "global_step": 90250, "epoch": 1087} {"train_loss": -21.49329948425293, "global_step": 90251, "epoch": 1087} {"train_loss": -21.243209838867188, "global_step": 90252, "epoch": 1087} {"train_loss": -21.540220260620117, "global_step": 90253, "epoch": 1087} {"train_loss": -21.607301712036133, "global_step": 90254, "epoch": 1087} {"train_loss": -21.839181900024414, "global_step": 90255, "epoch": 1087} {"train_loss": -21.841581344604492, "global_step": 90256, "epoch": 1087} {"train_loss": -21.774356842041016, "global_step": 90257, "epoch": 1087} {"train_loss": -21.724899291992188, "global_step": 90258, "epoch": 1087} {"train_loss": -21.77780532836914, "global_step": 90259, "epoch": 1087} {"train_loss": -21.368635177612305, "global_step": 90260, "epoch": 1087} {"train_loss": -21.28407859802246, "global_step": 90261, "epoch": 1087} {"train_loss": -21.716405868530273, "global_step": 90262, "epoch": 1087} {"train_loss": -21.68668556213379, "global_step": 90263, "epoch": 1087} {"train_loss": -21.65839958190918, "global_step": 90264, "epoch": 1087} {"train_loss": -21.591943740844727, "global_step": 90265, "epoch": 1087} {"train_loss": -21.216856002807617, "global_step": 90266, "epoch": 1087} {"train_loss": -21.591581344604492, "global_step": 90267, "epoch": 1087} {"train_loss": -21.908903121948242, "global_step": 90268, "epoch": 1087} {"train_loss": -21.715253829956055, "global_step": 90269, "epoch": 1087} {"train_loss": -21.631269454956055, "global_step": 90270, "epoch": 1087} {"train_loss": -21.733978271484375, "global_step": 90271, "epoch": 1087} {"train_loss": -21.22003173828125, "global_step": 90272, "epoch": 1087} {"train_loss": -21.656667709350586, "global_step": 90273, "epoch": 1087} {"train_loss": -21.729135513305664, "global_step": 90274, "epoch": 1087} {"train_loss": -21.92962646484375, "global_step": 90275, "epoch": 1087} {"train_loss": -21.722156524658203, "global_step": 90276, "epoch": 1087} {"train_loss": -21.192832946777344, "global_step": 90277, "epoch": 1087} {"train_loss": -21.46772575378418, "global_step": 90278, "epoch": 1087} {"train_loss": -21.491409301757812, "global_step": 90279, "epoch": 1087} {"train_loss": -21.313934326171875, "global_step": 90280, "epoch": 1087} {"train_loss": -21.595558166503906, "global_step": 90281, "epoch": 1087} {"train_loss": -21.759103775024414, "global_step": 90282, "epoch": 1087} {"train_loss": -21.517065048217773, "global_step": 90283, "epoch": 1087} {"train_loss": -21.996152877807617, "global_step": 90284, "epoch": 1087} {"train_loss": -21.428308486938477, "global_step": 90285, "epoch": 1087} {"train_loss": -21.776315689086914, "global_step": 90286, "epoch": 1087} {"train_loss": -21.449827194213867, "global_step": 90287, "epoch": 1087} {"train_loss": -21.629541397094727, "global_step": 90288, "epoch": 1087} {"train_loss": -21.618913650512695, "global_step": 90289, "epoch": 1087} {"train_loss": -21.708463668823242, "global_step": 90290, "epoch": 1087} {"train_loss": -21.739347457885742, "global_step": 90291, "epoch": 1087} {"train_loss": -21.727163314819336, "global_step": 90292, "epoch": 1087} {"train_loss": -21.502410888671875, "global_step": 90293, "epoch": 1087} {"train_loss": -21.50181007385254, "global_step": 90294, "epoch": 1087} {"train_loss": -21.68134117126465, "global_step": 90295, "epoch": 1087} {"train_loss": -22.127681732177734, "global_step": 90296, "epoch": 1087} {"train_loss": -21.37921905517578, "global_step": 90297, "epoch": 1087} {"train_loss": -21.614341735839844, "global_step": 90298, "epoch": 1087} {"train_loss": -21.944425582885742, "global_step": 90299, "epoch": 1087} {"train_loss": -21.6834716796875, "global_step": 90300, "epoch": 1087} {"train_loss": -21.41299819946289, "global_step": 90301, "epoch": 1087} {"train_loss": -21.712514877319336, "global_step": 90302, "epoch": 1087} {"train_loss": -21.514664385692182, "global_step": 90303, "epoch": 1087, "val_loss": 6181578.5} {"train_loss": -20.77228355407715, "global_step": 90304, "epoch": 1088} {"train_loss": -21.05698013305664, "global_step": 90305, "epoch": 1088} {"train_loss": -21.214929580688477, "global_step": 90306, "epoch": 1088} {"train_loss": -21.62611961364746, "global_step": 90307, "epoch": 1088} {"train_loss": -20.99483871459961, "global_step": 90308, "epoch": 1088} {"train_loss": -21.153425216674805, "global_step": 90309, "epoch": 1088} {"train_loss": -21.379980087280273, "global_step": 90310, "epoch": 1088} {"train_loss": -21.566722869873047, "global_step": 90311, "epoch": 1088} {"train_loss": -21.058324813842773, "global_step": 90312, "epoch": 1088} {"train_loss": -21.48723602294922, "global_step": 90313, "epoch": 1088} {"train_loss": -21.30866050720215, "global_step": 90314, "epoch": 1088} {"train_loss": -21.28262710571289, "global_step": 90315, "epoch": 1088} {"train_loss": -21.074684143066406, "global_step": 90316, "epoch": 1088} {"train_loss": -21.309045791625977, "global_step": 90317, "epoch": 1088} {"train_loss": -21.313974380493164, "global_step": 90318, "epoch": 1088} {"train_loss": -21.63852310180664, "global_step": 90319, "epoch": 1088} {"train_loss": -21.601806640625, "global_step": 90320, "epoch": 1088} {"train_loss": -21.58275604248047, "global_step": 90321, "epoch": 1088} {"train_loss": -21.538414001464844, "global_step": 90322, "epoch": 1088} {"train_loss": -21.573688507080078, "global_step": 90323, "epoch": 1088} {"train_loss": -21.52536964416504, "global_step": 90324, "epoch": 1088} {"train_loss": -21.78339958190918, "global_step": 90325, "epoch": 1088} {"train_loss": -21.98768424987793, "global_step": 90326, "epoch": 1088} {"train_loss": -22.060672760009766, "global_step": 90327, "epoch": 1088} {"train_loss": -21.547103881835938, "global_step": 90328, "epoch": 1088} {"train_loss": -21.636594772338867, "global_step": 90329, "epoch": 1088} {"train_loss": -21.671707153320312, "global_step": 90330, "epoch": 1088} {"train_loss": -21.47353172302246, "global_step": 90331, "epoch": 1088} {"train_loss": -21.615867614746094, "global_step": 90332, "epoch": 1088} {"train_loss": -21.669225692749023, "global_step": 90333, "epoch": 1088} {"train_loss": -21.85529136657715, "global_step": 90334, "epoch": 1088} {"train_loss": -21.56517219543457, "global_step": 90335, "epoch": 1088} {"train_loss": -21.577102661132812, "global_step": 90336, "epoch": 1088} {"train_loss": -21.362150192260742, "global_step": 90337, "epoch": 1088} {"train_loss": -21.629514694213867, "global_step": 90338, "epoch": 1088} {"train_loss": -21.56145668029785, "global_step": 90339, "epoch": 1088} {"train_loss": -21.8526611328125, "global_step": 90340, "epoch": 1088} {"train_loss": -21.079374313354492, "global_step": 90341, "epoch": 1088} {"train_loss": -21.576974868774414, "global_step": 90342, "epoch": 1088} {"train_loss": -21.598655700683594, "global_step": 90343, "epoch": 1088} {"train_loss": -21.572195053100586, "global_step": 90344, "epoch": 1088} {"train_loss": -21.393659591674805, "global_step": 90345, "epoch": 1088} {"train_loss": -21.642576217651367, "global_step": 90346, "epoch": 1088} {"train_loss": -21.695608139038086, "global_step": 90347, "epoch": 1088} {"train_loss": -21.46896743774414, "global_step": 90348, "epoch": 1088} {"train_loss": -21.521841049194336, "global_step": 90349, "epoch": 1088} {"train_loss": -21.77070426940918, "global_step": 90350, "epoch": 1088} {"train_loss": -21.788633346557617, "global_step": 90351, "epoch": 1088} {"train_loss": -21.42213249206543, "global_step": 90352, "epoch": 1088} {"train_loss": -21.66448974609375, "global_step": 90353, "epoch": 1088} {"train_loss": -21.61358642578125, "global_step": 90354, "epoch": 1088} {"train_loss": -21.805208206176758, "global_step": 90355, "epoch": 1088} {"train_loss": -21.291479110717773, "global_step": 90356, "epoch": 1088} {"train_loss": -21.628965377807617, "global_step": 90357, "epoch": 1088} {"train_loss": -21.696979522705078, "global_step": 90358, "epoch": 1088} {"train_loss": -21.526777267456055, "global_step": 90359, "epoch": 1088} {"train_loss": -21.45160484313965, "global_step": 90360, "epoch": 1088} {"train_loss": -21.673227310180664, "global_step": 90361, "epoch": 1088} {"train_loss": -21.630538940429688, "global_step": 90362, "epoch": 1088} {"train_loss": -21.547502517700195, "global_step": 90363, "epoch": 1088} {"train_loss": -21.666906356811523, "global_step": 90364, "epoch": 1088} {"train_loss": -21.884952545166016, "global_step": 90365, "epoch": 1088} {"train_loss": -21.527135848999023, "global_step": 90366, "epoch": 1088} {"train_loss": -21.826526641845703, "global_step": 90367, "epoch": 1088} {"train_loss": -21.786087036132812, "global_step": 90368, "epoch": 1088} {"train_loss": -21.70448875427246, "global_step": 90369, "epoch": 1088} {"train_loss": -21.341928482055664, "global_step": 90370, "epoch": 1088} {"train_loss": -21.638965606689453, "global_step": 90371, "epoch": 1088} {"train_loss": -21.520771026611328, "global_step": 90372, "epoch": 1088} {"train_loss": -21.566173553466797, "global_step": 90373, "epoch": 1088} {"train_loss": -21.743825912475586, "global_step": 90374, "epoch": 1088} {"train_loss": -21.446237564086914, "global_step": 90375, "epoch": 1088} {"train_loss": -21.485475540161133, "global_step": 90376, "epoch": 1088} {"train_loss": -21.833227157592773, "global_step": 90377, "epoch": 1088} {"train_loss": -21.532621383666992, "global_step": 90378, "epoch": 1088} {"train_loss": -21.65766716003418, "global_step": 90379, "epoch": 1088} {"train_loss": -21.532567977905273, "global_step": 90380, "epoch": 1088} {"train_loss": -21.937063217163086, "global_step": 90381, "epoch": 1088} {"train_loss": -21.11806297302246, "global_step": 90382, "epoch": 1088} {"train_loss": -21.877405166625977, "global_step": 90383, "epoch": 1088} {"train_loss": -21.648897171020508, "global_step": 90384, "epoch": 1088} {"train_loss": -21.499486923217773, "global_step": 90385, "epoch": 1088} {"train_loss": -21.56028090327619, "global_step": 90386, "epoch": 1088, "val_loss": 6073915.5} {"train_loss": -21.328702926635742, "global_step": 90387, "epoch": 1089} {"train_loss": -21.100929260253906, "global_step": 90388, "epoch": 1089} {"train_loss": -21.364639282226562, "global_step": 90389, "epoch": 1089} {"train_loss": -21.344709396362305, "global_step": 90390, "epoch": 1089} {"train_loss": -21.112403869628906, "global_step": 90391, "epoch": 1089} {"train_loss": -21.160085678100586, "global_step": 90392, "epoch": 1089} {"train_loss": -21.244464874267578, "global_step": 90393, "epoch": 1089} {"train_loss": -21.279279708862305, "global_step": 90394, "epoch": 1089} {"train_loss": -21.498310089111328, "global_step": 90395, "epoch": 1089} {"train_loss": -21.903615951538086, "global_step": 90396, "epoch": 1089} {"train_loss": -21.337677001953125, "global_step": 90397, "epoch": 1089} {"train_loss": -21.273555755615234, "global_step": 90398, "epoch": 1089} {"train_loss": -21.52492904663086, "global_step": 90399, "epoch": 1089} {"train_loss": -21.370161056518555, "global_step": 90400, "epoch": 1089} {"train_loss": -21.294208526611328, "global_step": 90401, "epoch": 1089} {"train_loss": -21.586116790771484, "global_step": 90402, "epoch": 1089} {"train_loss": -21.538076400756836, "global_step": 90403, "epoch": 1089} {"train_loss": -21.783199310302734, "global_step": 90404, "epoch": 1089} {"train_loss": -21.63917350769043, "global_step": 90405, "epoch": 1089} {"train_loss": -21.353788375854492, "global_step": 90406, "epoch": 1089} {"train_loss": -21.60310935974121, "global_step": 90407, "epoch": 1089} {"train_loss": -21.603515625, "global_step": 90408, "epoch": 1089} {"train_loss": -21.434452056884766, "global_step": 90409, "epoch": 1089} {"train_loss": -21.67456817626953, "global_step": 90410, "epoch": 1089} {"train_loss": -21.55980110168457, "global_step": 90411, "epoch": 1089} {"train_loss": -21.541412353515625, "global_step": 90412, "epoch": 1089} {"train_loss": -21.75905990600586, "global_step": 90413, "epoch": 1089} {"train_loss": -21.564369201660156, "global_step": 90414, "epoch": 1089} {"train_loss": -21.399938583374023, "global_step": 90415, "epoch": 1089} {"train_loss": -21.412841796875, "global_step": 90416, "epoch": 1089} {"train_loss": -21.19573402404785, "global_step": 90417, "epoch": 1089} {"train_loss": -21.46009635925293, "global_step": 90418, "epoch": 1089} {"train_loss": -21.125642776489258, "global_step": 90419, "epoch": 1089} {"train_loss": -21.762149810791016, "global_step": 90420, "epoch": 1089} {"train_loss": -21.495121002197266, "global_step": 90421, "epoch": 1089} {"train_loss": -21.52775001525879, "global_step": 90422, "epoch": 1089} {"train_loss": -21.95246696472168, "global_step": 90423, "epoch": 1089} {"train_loss": -21.476200103759766, "global_step": 90424, "epoch": 1089} {"train_loss": -21.801435470581055, "global_step": 90425, "epoch": 1089} {"train_loss": -21.76473045349121, "global_step": 90426, "epoch": 1089} {"train_loss": -21.756513595581055, "global_step": 90427, "epoch": 1089} {"train_loss": -21.329465866088867, "global_step": 90428, "epoch": 1089} {"train_loss": -21.73076820373535, "global_step": 90429, "epoch": 1089} {"train_loss": -21.668668746948242, "global_step": 90430, "epoch": 1089} {"train_loss": -21.43089485168457, "global_step": 90431, "epoch": 1089} {"train_loss": -21.109533309936523, "global_step": 90432, "epoch": 1089} {"train_loss": -21.0327091217041, "global_step": 90433, "epoch": 1089} {"train_loss": -21.764814376831055, "global_step": 90434, "epoch": 1089} {"train_loss": -21.440860748291016, "global_step": 90435, "epoch": 1089} {"train_loss": -21.70768928527832, "global_step": 90436, "epoch": 1089} {"train_loss": -21.693445205688477, "global_step": 90437, "epoch": 1089} {"train_loss": -21.46004295349121, "global_step": 90438, "epoch": 1089} {"train_loss": -21.644094467163086, "global_step": 90439, "epoch": 1089} {"train_loss": -21.367551803588867, "global_step": 90440, "epoch": 1089} {"train_loss": -21.548307418823242, "global_step": 90441, "epoch": 1089} {"train_loss": -21.392953872680664, "global_step": 90442, "epoch": 1089} {"train_loss": -21.80461883544922, "global_step": 90443, "epoch": 1089} {"train_loss": -21.25678062438965, "global_step": 90444, "epoch": 1089} {"train_loss": -22.012802124023438, "global_step": 90445, "epoch": 1089} {"train_loss": -21.38945960998535, "global_step": 90446, "epoch": 1089} {"train_loss": -21.942121505737305, "global_step": 90447, "epoch": 1089} {"train_loss": -21.650754928588867, "global_step": 90448, "epoch": 1089} {"train_loss": -21.589712142944336, "global_step": 90449, "epoch": 1089} {"train_loss": -21.238563537597656, "global_step": 90450, "epoch": 1089} {"train_loss": -21.559659957885742, "global_step": 90451, "epoch": 1089} {"train_loss": -21.299514770507812, "global_step": 90452, "epoch": 1089} {"train_loss": -21.688819885253906, "global_step": 90453, "epoch": 1089} {"train_loss": -21.643003463745117, "global_step": 90454, "epoch": 1089} {"train_loss": -21.512556076049805, "global_step": 90455, "epoch": 1089} {"train_loss": -21.562070846557617, "global_step": 90456, "epoch": 1089} {"train_loss": -21.609163284301758, "global_step": 90457, "epoch": 1089} {"train_loss": -21.505695343017578, "global_step": 90458, "epoch": 1089} {"train_loss": -21.55433464050293, "global_step": 90459, "epoch": 1089} {"train_loss": -21.746414184570312, "global_step": 90460, "epoch": 1089} {"train_loss": -21.7493896484375, "global_step": 90461, "epoch": 1089} {"train_loss": -21.809600830078125, "global_step": 90462, "epoch": 1089} {"train_loss": -21.621320724487305, "global_step": 90463, "epoch": 1089} {"train_loss": -21.57681655883789, "global_step": 90464, "epoch": 1089} {"train_loss": -21.707862854003906, "global_step": 90465, "epoch": 1089} {"train_loss": -21.518218994140625, "global_step": 90466, "epoch": 1089} {"train_loss": -21.640562057495117, "global_step": 90467, "epoch": 1089} {"train_loss": -21.59153175354004, "global_step": 90468, "epoch": 1089} {"train_loss": -21.540134200130602, "global_step": 90469, "epoch": 1089, "val_loss": 6150624.5} {"train_loss": -21.224674224853516, "global_step": 90470, "epoch": 1090} {"train_loss": -21.189105987548828, "global_step": 90471, "epoch": 1090} {"train_loss": -21.16275405883789, "global_step": 90472, "epoch": 1090} {"train_loss": -20.76079750061035, "global_step": 90473, "epoch": 1090} {"train_loss": -21.82167625427246, "global_step": 90474, "epoch": 1090} {"train_loss": -21.089935302734375, "global_step": 90475, "epoch": 1090} {"train_loss": -21.366117477416992, "global_step": 90476, "epoch": 1090} {"train_loss": -21.419099807739258, "global_step": 90477, "epoch": 1090} {"train_loss": -21.1596736907959, "global_step": 90478, "epoch": 1090} {"train_loss": -21.298795700073242, "global_step": 90479, "epoch": 1090} {"train_loss": -21.165884017944336, "global_step": 90480, "epoch": 1090} {"train_loss": -21.39530372619629, "global_step": 90481, "epoch": 1090} {"train_loss": -21.360336303710938, "global_step": 90482, "epoch": 1090} {"train_loss": -21.66877555847168, "global_step": 90483, "epoch": 1090} {"train_loss": -21.39511489868164, "global_step": 90484, "epoch": 1090} {"train_loss": -21.51218032836914, "global_step": 90485, "epoch": 1090} {"train_loss": -21.71318817138672, "global_step": 90486, "epoch": 1090} {"train_loss": -21.048669815063477, "global_step": 90487, "epoch": 1090} {"train_loss": -21.682260513305664, "global_step": 90488, "epoch": 1090} {"train_loss": -21.12593650817871, "global_step": 90489, "epoch": 1090} {"train_loss": -21.215839385986328, "global_step": 90490, "epoch": 1090} {"train_loss": -21.44769859313965, "global_step": 90491, "epoch": 1090} {"train_loss": -21.707496643066406, "global_step": 90492, "epoch": 1090} {"train_loss": -21.516523361206055, "global_step": 90493, "epoch": 1090} {"train_loss": -21.29168128967285, "global_step": 90494, "epoch": 1090} {"train_loss": -21.578832626342773, "global_step": 90495, "epoch": 1090} {"train_loss": -21.690998077392578, "global_step": 90496, "epoch": 1090} {"train_loss": -21.60662841796875, "global_step": 90497, "epoch": 1090} {"train_loss": -21.82014274597168, "global_step": 90498, "epoch": 1090} {"train_loss": -21.29669952392578, "global_step": 90499, "epoch": 1090} {"train_loss": -21.374422073364258, "global_step": 90500, "epoch": 1090} {"train_loss": -21.378175735473633, "global_step": 90501, "epoch": 1090} {"train_loss": -21.766897201538086, "global_step": 90502, "epoch": 1090} {"train_loss": -21.432567596435547, "global_step": 90503, "epoch": 1090} {"train_loss": -21.6281795501709, "global_step": 90504, "epoch": 1090} {"train_loss": -21.581247329711914, "global_step": 90505, "epoch": 1090} {"train_loss": -22.00031852722168, "global_step": 90506, "epoch": 1090} {"train_loss": -21.818227767944336, "global_step": 90507, "epoch": 1090} {"train_loss": -21.96897315979004, "global_step": 90508, "epoch": 1090} {"train_loss": -21.947063446044922, "global_step": 90509, "epoch": 1090} {"train_loss": -21.634855270385742, "global_step": 90510, "epoch": 1090} {"train_loss": -22.166555404663086, "global_step": 90511, "epoch": 1090} {"train_loss": -21.37017822265625, "global_step": 90512, "epoch": 1090} {"train_loss": -21.6107234954834, "global_step": 90513, "epoch": 1090} {"train_loss": -21.430648803710938, "global_step": 90514, "epoch": 1090} {"train_loss": -21.91452407836914, "global_step": 90515, "epoch": 1090} {"train_loss": -21.9378662109375, "global_step": 90516, "epoch": 1090} {"train_loss": -21.650339126586914, "global_step": 90517, "epoch": 1090} {"train_loss": -21.660388946533203, "global_step": 90518, "epoch": 1090} {"train_loss": -21.649394989013672, "global_step": 90519, "epoch": 1090} {"train_loss": -21.243083953857422, "global_step": 90520, "epoch": 1090} {"train_loss": -21.98001480102539, "global_step": 90521, "epoch": 1090} {"train_loss": -22.04146385192871, "global_step": 90522, "epoch": 1090} {"train_loss": -21.602741241455078, "global_step": 90523, "epoch": 1090} {"train_loss": -21.9166316986084, "global_step": 90524, "epoch": 1090} {"train_loss": -21.45846939086914, "global_step": 90525, "epoch": 1090} {"train_loss": -21.54978370666504, "global_step": 90526, "epoch": 1090} {"train_loss": -21.726478576660156, "global_step": 90527, "epoch": 1090} {"train_loss": -21.77491569519043, "global_step": 90528, "epoch": 1090} {"train_loss": -21.358449935913086, "global_step": 90529, "epoch": 1090} {"train_loss": -21.536651611328125, "global_step": 90530, "epoch": 1090} {"train_loss": -21.77015495300293, "global_step": 90531, "epoch": 1090} {"train_loss": -21.546411514282227, "global_step": 90532, "epoch": 1090} {"train_loss": -21.734819412231445, "global_step": 90533, "epoch": 1090} {"train_loss": -21.579687118530273, "global_step": 90534, "epoch": 1090} {"train_loss": -21.72493553161621, "global_step": 90535, "epoch": 1090} {"train_loss": -21.92354393005371, "global_step": 90536, "epoch": 1090} {"train_loss": -22.044260025024414, "global_step": 90537, "epoch": 1090} {"train_loss": -21.40578269958496, "global_step": 90538, "epoch": 1090} {"train_loss": -21.776071548461914, "global_step": 90539, "epoch": 1090} {"train_loss": -21.280643463134766, "global_step": 90540, "epoch": 1090} {"train_loss": -22.056852340698242, "global_step": 90541, "epoch": 1090} {"train_loss": -21.409032821655273, "global_step": 90542, "epoch": 1090} {"train_loss": -21.379318237304688, "global_step": 90543, "epoch": 1090} {"train_loss": -21.81550407409668, "global_step": 90544, "epoch": 1090} {"train_loss": -21.487075805664062, "global_step": 90545, "epoch": 1090} {"train_loss": -21.39109230041504, "global_step": 90546, "epoch": 1090} {"train_loss": -21.4827938079834, "global_step": 90547, "epoch": 1090} {"train_loss": -21.317529678344727, "global_step": 90548, "epoch": 1090} {"train_loss": -21.205923080444336, "global_step": 90549, "epoch": 1090} {"train_loss": -22.10951805114746, "global_step": 90550, "epoch": 1090} {"train_loss": -21.375255584716797, "global_step": 90551, "epoch": 1090} {"train_loss": -21.549420161419604, "global_step": 90552, "epoch": 1090, "val_loss": 6090847.0} {"train_loss": -20.91715431213379, "global_step": 90553, "epoch": 1091} {"train_loss": -21.400121688842773, "global_step": 90554, "epoch": 1091} {"train_loss": -21.089622497558594, "global_step": 90555, "epoch": 1091} {"train_loss": -21.682510375976562, "global_step": 90556, "epoch": 1091} {"train_loss": -21.093557357788086, "global_step": 90557, "epoch": 1091} {"train_loss": -21.29994773864746, "global_step": 90558, "epoch": 1091} {"train_loss": -21.536775588989258, "global_step": 90559, "epoch": 1091} {"train_loss": -21.467288970947266, "global_step": 90560, "epoch": 1091} {"train_loss": -21.359230041503906, "global_step": 90561, "epoch": 1091} {"train_loss": -21.339523315429688, "global_step": 90562, "epoch": 1091} {"train_loss": -21.355680465698242, "global_step": 90563, "epoch": 1091} {"train_loss": -21.3724308013916, "global_step": 90564, "epoch": 1091} {"train_loss": -21.440046310424805, "global_step": 90565, "epoch": 1091} {"train_loss": -21.662939071655273, "global_step": 90566, "epoch": 1091} {"train_loss": -21.594091415405273, "global_step": 90567, "epoch": 1091} {"train_loss": -21.267492294311523, "global_step": 90568, "epoch": 1091} {"train_loss": -21.586759567260742, "global_step": 90569, "epoch": 1091} {"train_loss": -21.998157501220703, "global_step": 90570, "epoch": 1091} {"train_loss": -21.642881393432617, "global_step": 90571, "epoch": 1091} {"train_loss": -21.38399887084961, "global_step": 90572, "epoch": 1091} {"train_loss": -21.7283992767334, "global_step": 90573, "epoch": 1091} {"train_loss": -21.6488037109375, "global_step": 90574, "epoch": 1091} {"train_loss": -21.641754150390625, "global_step": 90575, "epoch": 1091} {"train_loss": -21.463598251342773, "global_step": 90576, "epoch": 1091} {"train_loss": -21.541025161743164, "global_step": 90577, "epoch": 1091} {"train_loss": -21.218305587768555, "global_step": 90578, "epoch": 1091} {"train_loss": -21.309284210205078, "global_step": 90579, "epoch": 1091} {"train_loss": -21.76827049255371, "global_step": 90580, "epoch": 1091} {"train_loss": -21.589096069335938, "global_step": 90581, "epoch": 1091} {"train_loss": -21.790800094604492, "global_step": 90582, "epoch": 1091} {"train_loss": -21.19925880432129, "global_step": 90583, "epoch": 1091} {"train_loss": -21.5577335357666, "global_step": 90584, "epoch": 1091} {"train_loss": -21.76609230041504, "global_step": 90585, "epoch": 1091} {"train_loss": -21.395282745361328, "global_step": 90586, "epoch": 1091} {"train_loss": -21.990718841552734, "global_step": 90587, "epoch": 1091} {"train_loss": -21.480146408081055, "global_step": 90588, "epoch": 1091} {"train_loss": -21.401540756225586, "global_step": 90589, "epoch": 1091} {"train_loss": -21.645490646362305, "global_step": 90590, "epoch": 1091} {"train_loss": -21.842182159423828, "global_step": 90591, "epoch": 1091} {"train_loss": -21.57504653930664, "global_step": 90592, "epoch": 1091} {"train_loss": -21.723648071289062, "global_step": 90593, "epoch": 1091} {"train_loss": -21.543739318847656, "global_step": 90594, "epoch": 1091} {"train_loss": -21.222841262817383, "global_step": 90595, "epoch": 1091} {"train_loss": -21.757184982299805, "global_step": 90596, "epoch": 1091} {"train_loss": -21.889408111572266, "global_step": 90597, "epoch": 1091} {"train_loss": -21.734594345092773, "global_step": 90598, "epoch": 1091} {"train_loss": -21.59589958190918, "global_step": 90599, "epoch": 1091} {"train_loss": -22.06670379638672, "global_step": 90600, "epoch": 1091} {"train_loss": -21.348148345947266, "global_step": 90601, "epoch": 1091} {"train_loss": -21.688993453979492, "global_step": 90602, "epoch": 1091} {"train_loss": -21.46564483642578, "global_step": 90603, "epoch": 1091} {"train_loss": -21.63934326171875, "global_step": 90604, "epoch": 1091} {"train_loss": -21.4010066986084, "global_step": 90605, "epoch": 1091} {"train_loss": -21.440277099609375, "global_step": 90606, "epoch": 1091} {"train_loss": -21.578290939331055, "global_step": 90607, "epoch": 1091} {"train_loss": -21.595979690551758, "global_step": 90608, "epoch": 1091} {"train_loss": -21.64991569519043, "global_step": 90609, "epoch": 1091} {"train_loss": -21.58112907409668, "global_step": 90610, "epoch": 1091} {"train_loss": -21.445682525634766, "global_step": 90611, "epoch": 1091} {"train_loss": -21.546396255493164, "global_step": 90612, "epoch": 1091} {"train_loss": -21.528972625732422, "global_step": 90613, "epoch": 1091} {"train_loss": -21.384708404541016, "global_step": 90614, "epoch": 1091} {"train_loss": -21.90224838256836, "global_step": 90615, "epoch": 1091} {"train_loss": -21.539203643798828, "global_step": 90616, "epoch": 1091} {"train_loss": -21.373580932617188, "global_step": 90617, "epoch": 1091} {"train_loss": -21.536375045776367, "global_step": 90618, "epoch": 1091} {"train_loss": -21.526914596557617, "global_step": 90619, "epoch": 1091} {"train_loss": -21.73267936706543, "global_step": 90620, "epoch": 1091} {"train_loss": -21.686935424804688, "global_step": 90621, "epoch": 1091} {"train_loss": -21.703216552734375, "global_step": 90622, "epoch": 1091} {"train_loss": -21.823659896850586, "global_step": 90623, "epoch": 1091} {"train_loss": -21.727298736572266, "global_step": 90624, "epoch": 1091} {"train_loss": -21.45964813232422, "global_step": 90625, "epoch": 1091} {"train_loss": -21.497709274291992, "global_step": 90626, "epoch": 1091} {"train_loss": -21.355161666870117, "global_step": 90627, "epoch": 1091} {"train_loss": -21.64156150817871, "global_step": 90628, "epoch": 1091} {"train_loss": -21.52143669128418, "global_step": 90629, "epoch": 1091} {"train_loss": -21.22951316833496, "global_step": 90630, "epoch": 1091} {"train_loss": -21.7789249420166, "global_step": 90631, "epoch": 1091} {"train_loss": -21.827796936035156, "global_step": 90632, "epoch": 1091} {"train_loss": -22.057788848876953, "global_step": 90633, "epoch": 1091} {"train_loss": -21.84699058532715, "global_step": 90634, "epoch": 1091} {"train_loss": -21.545892508633166, "global_step": 90635, "epoch": 1091, "val_loss": 5954278.0} {"train_loss": -20.778493881225586, "global_step": 90636, "epoch": 1092} {"train_loss": -20.65826416015625, "global_step": 90637, "epoch": 1092} {"train_loss": -20.963956832885742, "global_step": 90638, "epoch": 1092} {"train_loss": -20.880647659301758, "global_step": 90639, "epoch": 1092} {"train_loss": -20.92886734008789, "global_step": 90640, "epoch": 1092} {"train_loss": -21.02765464782715, "global_step": 90641, "epoch": 1092} {"train_loss": -21.0401611328125, "global_step": 90642, "epoch": 1092} {"train_loss": -21.283287048339844, "global_step": 90643, "epoch": 1092} {"train_loss": -21.244047164916992, "global_step": 90644, "epoch": 1092} {"train_loss": -20.86903953552246, "global_step": 90645, "epoch": 1092} {"train_loss": -21.502408981323242, "global_step": 90646, "epoch": 1092} {"train_loss": -20.949508666992188, "global_step": 90647, "epoch": 1092} {"train_loss": -21.360342025756836, "global_step": 90648, "epoch": 1092} {"train_loss": -21.127721786499023, "global_step": 90649, "epoch": 1092} {"train_loss": -21.344690322875977, "global_step": 90650, "epoch": 1092} {"train_loss": -21.2550106048584, "global_step": 90651, "epoch": 1092} {"train_loss": -21.3721866607666, "global_step": 90652, "epoch": 1092} {"train_loss": -21.317907333374023, "global_step": 90653, "epoch": 1092} {"train_loss": -21.411245346069336, "global_step": 90654, "epoch": 1092} {"train_loss": -21.255735397338867, "global_step": 90655, "epoch": 1092} {"train_loss": -21.416217803955078, "global_step": 90656, "epoch": 1092} {"train_loss": -21.283187866210938, "global_step": 90657, "epoch": 1092} {"train_loss": -21.46921157836914, "global_step": 90658, "epoch": 1092} {"train_loss": -21.58587074279785, "global_step": 90659, "epoch": 1092} {"train_loss": -21.228139877319336, "global_step": 90660, "epoch": 1092} {"train_loss": -21.260650634765625, "global_step": 90661, "epoch": 1092} {"train_loss": -21.681821823120117, "global_step": 90662, "epoch": 1092} {"train_loss": -21.44584846496582, "global_step": 90663, "epoch": 1092} {"train_loss": -21.25803565979004, "global_step": 90664, "epoch": 1092} {"train_loss": -21.505573272705078, "global_step": 90665, "epoch": 1092} {"train_loss": -21.43947410583496, "global_step": 90666, "epoch": 1092} {"train_loss": -21.55423927307129, "global_step": 90667, "epoch": 1092} {"train_loss": -21.452289581298828, "global_step": 90668, "epoch": 1092} {"train_loss": -21.60646629333496, "global_step": 90669, "epoch": 1092} {"train_loss": -21.742887496948242, "global_step": 90670, "epoch": 1092} {"train_loss": -21.548513412475586, "global_step": 90671, "epoch": 1092} {"train_loss": -21.505916595458984, "global_step": 90672, "epoch": 1092} {"train_loss": -21.47010612487793, "global_step": 90673, "epoch": 1092} {"train_loss": -21.77362632751465, "global_step": 90674, "epoch": 1092} {"train_loss": -21.960233688354492, "global_step": 90675, "epoch": 1092} {"train_loss": -22.01861000061035, "global_step": 90676, "epoch": 1092} {"train_loss": -21.389236450195312, "global_step": 90677, "epoch": 1092} {"train_loss": -21.77533721923828, "global_step": 90678, "epoch": 1092} {"train_loss": -21.22024154663086, "global_step": 90679, "epoch": 1092} {"train_loss": -21.852569580078125, "global_step": 90680, "epoch": 1092} {"train_loss": -21.64907455444336, "global_step": 90681, "epoch": 1092} {"train_loss": -21.851743698120117, "global_step": 90682, "epoch": 1092} {"train_loss": -21.667936325073242, "global_step": 90683, "epoch": 1092} {"train_loss": -21.67779541015625, "global_step": 90684, "epoch": 1092} {"train_loss": -21.94025230407715, "global_step": 90685, "epoch": 1092} {"train_loss": -21.735319137573242, "global_step": 90686, "epoch": 1092} {"train_loss": -21.62217903137207, "global_step": 90687, "epoch": 1092} {"train_loss": -21.75362777709961, "global_step": 90688, "epoch": 1092} {"train_loss": -21.757617950439453, "global_step": 90689, "epoch": 1092} {"train_loss": -21.385887145996094, "global_step": 90690, "epoch": 1092} {"train_loss": -21.38955307006836, "global_step": 90691, "epoch": 1092} {"train_loss": -21.768394470214844, "global_step": 90692, "epoch": 1092} {"train_loss": -21.6634521484375, "global_step": 90693, "epoch": 1092} {"train_loss": -21.49567413330078, "global_step": 90694, "epoch": 1092} {"train_loss": -21.70313262939453, "global_step": 90695, "epoch": 1092} {"train_loss": -21.625356674194336, "global_step": 90696, "epoch": 1092} {"train_loss": -21.76106834411621, "global_step": 90697, "epoch": 1092} {"train_loss": -21.667739868164062, "global_step": 90698, "epoch": 1092} {"train_loss": -21.72102928161621, "global_step": 90699, "epoch": 1092} {"train_loss": -21.303869247436523, "global_step": 90700, "epoch": 1092} {"train_loss": -20.987581253051758, "global_step": 90701, "epoch": 1092} {"train_loss": -21.515409469604492, "global_step": 90702, "epoch": 1092} {"train_loss": -21.61857032775879, "global_step": 90703, "epoch": 1092} {"train_loss": -21.690841674804688, "global_step": 90704, "epoch": 1092} {"train_loss": -21.474292755126953, "global_step": 90705, "epoch": 1092} {"train_loss": -21.69985008239746, "global_step": 90706, "epoch": 1092} {"train_loss": -21.6846923828125, "global_step": 90707, "epoch": 1092} {"train_loss": -21.541908264160156, "global_step": 90708, "epoch": 1092} {"train_loss": -21.700057983398438, "global_step": 90709, "epoch": 1092} {"train_loss": -21.82454490661621, "global_step": 90710, "epoch": 1092} {"train_loss": -21.80819320678711, "global_step": 90711, "epoch": 1092} {"train_loss": -21.792470932006836, "global_step": 90712, "epoch": 1092} {"train_loss": -21.31117057800293, "global_step": 90713, "epoch": 1092} {"train_loss": -21.756078720092773, "global_step": 90714, "epoch": 1092} {"train_loss": -21.304494857788086, "global_step": 90715, "epoch": 1092} {"train_loss": -20.995267868041992, "global_step": 90716, "epoch": 1092} {"train_loss": -21.576929092407227, "global_step": 90717, "epoch": 1092} {"train_loss": -21.46452189066324, "global_step": 90718, "epoch": 1092, "val_loss": 6041307.5} {"train_loss": -20.84992027282715, "global_step": 90719, "epoch": 1093} {"train_loss": -21.413366317749023, "global_step": 90720, "epoch": 1093} {"train_loss": -21.392810821533203, "global_step": 90721, "epoch": 1093} {"train_loss": -21.297334671020508, "global_step": 90722, "epoch": 1093} {"train_loss": -20.97478485107422, "global_step": 90723, "epoch": 1093} {"train_loss": -21.654945373535156, "global_step": 90724, "epoch": 1093} {"train_loss": -21.434518814086914, "global_step": 90725, "epoch": 1093} {"train_loss": -21.378463745117188, "global_step": 90726, "epoch": 1093} {"train_loss": -21.576005935668945, "global_step": 90727, "epoch": 1093} {"train_loss": -21.404333114624023, "global_step": 90728, "epoch": 1093} {"train_loss": -21.74401092529297, "global_step": 90729, "epoch": 1093} {"train_loss": -21.40827178955078, "global_step": 90730, "epoch": 1093} {"train_loss": -21.177433013916016, "global_step": 90731, "epoch": 1093} {"train_loss": -21.852306365966797, "global_step": 90732, "epoch": 1093} {"train_loss": -21.697675704956055, "global_step": 90733, "epoch": 1093} {"train_loss": -21.53180503845215, "global_step": 90734, "epoch": 1093} {"train_loss": -21.47056007385254, "global_step": 90735, "epoch": 1093} {"train_loss": -21.226747512817383, "global_step": 90736, "epoch": 1093} {"train_loss": -21.65437889099121, "global_step": 90737, "epoch": 1093} {"train_loss": -21.176061630249023, "global_step": 90738, "epoch": 1093} {"train_loss": -21.958066940307617, "global_step": 90739, "epoch": 1093} {"train_loss": -21.463481903076172, "global_step": 90740, "epoch": 1093} {"train_loss": -21.788471221923828, "global_step": 90741, "epoch": 1093} {"train_loss": -21.3702449798584, "global_step": 90742, "epoch": 1093} {"train_loss": -21.65024757385254, "global_step": 90743, "epoch": 1093} {"train_loss": -21.587385177612305, "global_step": 90744, "epoch": 1093} {"train_loss": -21.739360809326172, "global_step": 90745, "epoch": 1093} {"train_loss": -21.54144859313965, "global_step": 90746, "epoch": 1093} {"train_loss": -21.916059494018555, "global_step": 90747, "epoch": 1093} {"train_loss": -21.91823387145996, "global_step": 90748, "epoch": 1093} {"train_loss": -21.327661514282227, "global_step": 90749, "epoch": 1093} {"train_loss": -21.553937911987305, "global_step": 90750, "epoch": 1093} {"train_loss": -21.426462173461914, "global_step": 90751, "epoch": 1093} {"train_loss": -21.35400390625, "global_step": 90752, "epoch": 1093} {"train_loss": -21.574634552001953, "global_step": 90753, "epoch": 1093} {"train_loss": -21.791324615478516, "global_step": 90754, "epoch": 1093} {"train_loss": -21.775226593017578, "global_step": 90755, "epoch": 1093} {"train_loss": -21.66077995300293, "global_step": 90756, "epoch": 1093} {"train_loss": -21.748849868774414, "global_step": 90757, "epoch": 1093} {"train_loss": -21.87550163269043, "global_step": 90758, "epoch": 1093} {"train_loss": -22.237314224243164, "global_step": 90759, "epoch": 1093} {"train_loss": -21.894699096679688, "global_step": 90760, "epoch": 1093} {"train_loss": -21.473432540893555, "global_step": 90761, "epoch": 1093} {"train_loss": -21.777713775634766, "global_step": 90762, "epoch": 1093} {"train_loss": -21.937042236328125, "global_step": 90763, "epoch": 1093} {"train_loss": -22.106061935424805, "global_step": 90764, "epoch": 1093} {"train_loss": -21.666711807250977, "global_step": 90765, "epoch": 1093} {"train_loss": -21.60332679748535, "global_step": 90766, "epoch": 1093} {"train_loss": -21.87624168395996, "global_step": 90767, "epoch": 1093} {"train_loss": -21.576696395874023, "global_step": 90768, "epoch": 1093} {"train_loss": -21.596715927124023, "global_step": 90769, "epoch": 1093} {"train_loss": -21.44757652282715, "global_step": 90770, "epoch": 1093} {"train_loss": -21.607145309448242, "global_step": 90771, "epoch": 1093} {"train_loss": -21.80075454711914, "global_step": 90772, "epoch": 1093} {"train_loss": -21.823352813720703, "global_step": 90773, "epoch": 1093} {"train_loss": -21.88796043395996, "global_step": 90774, "epoch": 1093} {"train_loss": -21.541471481323242, "global_step": 90775, "epoch": 1093} {"train_loss": -21.698381423950195, "global_step": 90776, "epoch": 1093} {"train_loss": -21.79164695739746, "global_step": 90777, "epoch": 1093} {"train_loss": -21.616363525390625, "global_step": 90778, "epoch": 1093} {"train_loss": -21.901472091674805, "global_step": 90779, "epoch": 1093} {"train_loss": -21.527565002441406, "global_step": 90780, "epoch": 1093} {"train_loss": -21.69121551513672, "global_step": 90781, "epoch": 1093} {"train_loss": -21.744857788085938, "global_step": 90782, "epoch": 1093} {"train_loss": -21.4217529296875, "global_step": 90783, "epoch": 1093} {"train_loss": -21.88950538635254, "global_step": 90784, "epoch": 1093} {"train_loss": -21.58052635192871, "global_step": 90785, "epoch": 1093} {"train_loss": -21.615102767944336, "global_step": 90786, "epoch": 1093} {"train_loss": -21.10150718688965, "global_step": 90787, "epoch": 1093} {"train_loss": -21.743928909301758, "global_step": 90788, "epoch": 1093} {"train_loss": -21.488075256347656, "global_step": 90789, "epoch": 1093} {"train_loss": -21.698760986328125, "global_step": 90790, "epoch": 1093} {"train_loss": -21.756248474121094, "global_step": 90791, "epoch": 1093} {"train_loss": -21.650693893432617, "global_step": 90792, "epoch": 1093} {"train_loss": -21.87216567993164, "global_step": 90793, "epoch": 1093} {"train_loss": -21.60857582092285, "global_step": 90794, "epoch": 1093} {"train_loss": -21.284517288208008, "global_step": 90795, "epoch": 1093} {"train_loss": -21.556686401367188, "global_step": 90796, "epoch": 1093} {"train_loss": -21.776540756225586, "global_step": 90797, "epoch": 1093} {"train_loss": -21.646390914916992, "global_step": 90798, "epoch": 1093} {"train_loss": -21.27924346923828, "global_step": 90799, "epoch": 1093} {"train_loss": -21.616239547729492, "global_step": 90800, "epoch": 1093} {"train_loss": -21.592038212052312, "global_step": 90801, "epoch": 1093, "val_loss": 5997232.5} {"train_loss": -21.215152740478516, "global_step": 90802, "epoch": 1094} {"train_loss": -21.70425033569336, "global_step": 90803, "epoch": 1094} {"train_loss": -21.506851196289062, "global_step": 90804, "epoch": 1094} {"train_loss": -21.577512741088867, "global_step": 90805, "epoch": 1094} {"train_loss": -21.95199203491211, "global_step": 90806, "epoch": 1094} {"train_loss": -21.282045364379883, "global_step": 90807, "epoch": 1094} {"train_loss": -21.3719425201416, "global_step": 90808, "epoch": 1094} {"train_loss": -21.9511661529541, "global_step": 90809, "epoch": 1094} {"train_loss": -21.548398971557617, "global_step": 90810, "epoch": 1094} {"train_loss": -21.583053588867188, "global_step": 90811, "epoch": 1094} {"train_loss": -21.843557357788086, "global_step": 90812, "epoch": 1094} {"train_loss": -21.693647384643555, "global_step": 90813, "epoch": 1094} {"train_loss": -21.734098434448242, "global_step": 90814, "epoch": 1094} {"train_loss": -21.500097274780273, "global_step": 90815, "epoch": 1094} {"train_loss": -21.503629684448242, "global_step": 90816, "epoch": 1094} {"train_loss": -21.66790199279785, "global_step": 90817, "epoch": 1094} {"train_loss": -21.228757858276367, "global_step": 90818, "epoch": 1094} {"train_loss": -21.661983489990234, "global_step": 90819, "epoch": 1094} {"train_loss": -21.430509567260742, "global_step": 90820, "epoch": 1094} {"train_loss": -21.422077178955078, "global_step": 90821, "epoch": 1094} {"train_loss": -21.498762130737305, "global_step": 90822, "epoch": 1094} {"train_loss": -21.69828224182129, "global_step": 90823, "epoch": 1094} {"train_loss": -21.279253005981445, "global_step": 90824, "epoch": 1094} {"train_loss": -21.701297760009766, "global_step": 90825, "epoch": 1094} {"train_loss": -21.190387725830078, "global_step": 90826, "epoch": 1094} {"train_loss": -21.67088508605957, "global_step": 90827, "epoch": 1094} {"train_loss": -21.854719161987305, "global_step": 90828, "epoch": 1094} {"train_loss": -21.769472122192383, "global_step": 90829, "epoch": 1094} {"train_loss": -21.002761840820312, "global_step": 90830, "epoch": 1094} {"train_loss": -22.039775848388672, "global_step": 90831, "epoch": 1094} {"train_loss": -21.654983520507812, "global_step": 90832, "epoch": 1094} {"train_loss": -21.395105361938477, "global_step": 90833, "epoch": 1094} {"train_loss": -21.360904693603516, "global_step": 90834, "epoch": 1094} {"train_loss": -21.462064743041992, "global_step": 90835, "epoch": 1094} {"train_loss": -21.67877769470215, "global_step": 90836, "epoch": 1094} {"train_loss": -21.707517623901367, "global_step": 90837, "epoch": 1094} {"train_loss": -21.338565826416016, "global_step": 90838, "epoch": 1094} {"train_loss": -21.870988845825195, "global_step": 90839, "epoch": 1094} {"train_loss": -21.361770629882812, "global_step": 90840, "epoch": 1094} {"train_loss": -21.493000030517578, "global_step": 90841, "epoch": 1094} {"train_loss": -21.683040618896484, "global_step": 90842, "epoch": 1094} {"train_loss": -21.817825317382812, "global_step": 90843, "epoch": 1094} {"train_loss": -21.55258560180664, "global_step": 90844, "epoch": 1094} {"train_loss": -21.733312606811523, "global_step": 90845, "epoch": 1094} {"train_loss": -21.66419792175293, "global_step": 90846, "epoch": 1094} {"train_loss": -21.844493865966797, "global_step": 90847, "epoch": 1094} {"train_loss": -21.457136154174805, "global_step": 90848, "epoch": 1094} {"train_loss": -21.599868774414062, "global_step": 90849, "epoch": 1094} {"train_loss": -21.924257278442383, "global_step": 90850, "epoch": 1094} {"train_loss": -21.773426055908203, "global_step": 90851, "epoch": 1094} {"train_loss": -21.70782470703125, "global_step": 90852, "epoch": 1094} {"train_loss": -22.089326858520508, "global_step": 90853, "epoch": 1094} {"train_loss": -22.009727478027344, "global_step": 90854, "epoch": 1094} {"train_loss": -21.635053634643555, "global_step": 90855, "epoch": 1094} {"train_loss": -21.578781127929688, "global_step": 90856, "epoch": 1094} {"train_loss": -21.66451072692871, "global_step": 90857, "epoch": 1094} {"train_loss": -21.285913467407227, "global_step": 90858, "epoch": 1094} {"train_loss": -21.54027557373047, "global_step": 90859, "epoch": 1094} {"train_loss": -21.529775619506836, "global_step": 90860, "epoch": 1094} {"train_loss": -21.476499557495117, "global_step": 90861, "epoch": 1094} {"train_loss": -21.959665298461914, "global_step": 90862, "epoch": 1094} {"train_loss": -21.796979904174805, "global_step": 90863, "epoch": 1094} {"train_loss": -21.58761978149414, "global_step": 90864, "epoch": 1094} {"train_loss": -21.648998260498047, "global_step": 90865, "epoch": 1094} {"train_loss": -21.7900333404541, "global_step": 90866, "epoch": 1094} {"train_loss": -21.747289657592773, "global_step": 90867, "epoch": 1094} {"train_loss": -22.04233741760254, "global_step": 90868, "epoch": 1094} {"train_loss": -21.69577980041504, "global_step": 90869, "epoch": 1094} {"train_loss": -21.939348220825195, "global_step": 90870, "epoch": 1094} {"train_loss": -21.74216079711914, "global_step": 90871, "epoch": 1094} {"train_loss": -21.697494506835938, "global_step": 90872, "epoch": 1094} {"train_loss": -21.88314437866211, "global_step": 90873, "epoch": 1094} {"train_loss": -21.63191032409668, "global_step": 90874, "epoch": 1094} {"train_loss": -21.54134178161621, "global_step": 90875, "epoch": 1094} {"train_loss": -21.747379302978516, "global_step": 90876, "epoch": 1094} {"train_loss": -21.5897274017334, "global_step": 90877, "epoch": 1094} {"train_loss": -21.644107818603516, "global_step": 90878, "epoch": 1094} {"train_loss": -21.656888961791992, "global_step": 90879, "epoch": 1094} {"train_loss": -21.51988983154297, "global_step": 90880, "epoch": 1094} {"train_loss": -21.73341178894043, "global_step": 90881, "epoch": 1094} {"train_loss": -21.947538375854492, "global_step": 90882, "epoch": 1094} {"train_loss": -21.45197105407715, "global_step": 90883, "epoch": 1094} {"train_loss": -21.628695016883942, "global_step": 90884, "epoch": 1094, "val_loss": 6208148.0} {"train_loss": -21.509885787963867, "global_step": 90885, "epoch": 1095} {"train_loss": -21.588666915893555, "global_step": 90886, "epoch": 1095} {"train_loss": -21.509685516357422, "global_step": 90887, "epoch": 1095} {"train_loss": -21.441469192504883, "global_step": 90888, "epoch": 1095} {"train_loss": -21.6820011138916, "global_step": 90889, "epoch": 1095} {"train_loss": -21.602346420288086, "global_step": 90890, "epoch": 1095} {"train_loss": -21.395322799682617, "global_step": 90891, "epoch": 1095} {"train_loss": -21.23151206970215, "global_step": 90892, "epoch": 1095} {"train_loss": -21.767194747924805, "global_step": 90893, "epoch": 1095} {"train_loss": -21.48862648010254, "global_step": 90894, "epoch": 1095} {"train_loss": -21.520179748535156, "global_step": 90895, "epoch": 1095} {"train_loss": -21.60605812072754, "global_step": 90896, "epoch": 1095} {"train_loss": -21.630966186523438, "global_step": 90897, "epoch": 1095} {"train_loss": -21.434743881225586, "global_step": 90898, "epoch": 1095} {"train_loss": -21.56477165222168, "global_step": 90899, "epoch": 1095} {"train_loss": -21.38606834411621, "global_step": 90900, "epoch": 1095} {"train_loss": -21.544666290283203, "global_step": 90901, "epoch": 1095} {"train_loss": -21.751684188842773, "global_step": 90902, "epoch": 1095} {"train_loss": -21.491315841674805, "global_step": 90903, "epoch": 1095} {"train_loss": -21.554414749145508, "global_step": 90904, "epoch": 1095} {"train_loss": -21.47560691833496, "global_step": 90905, "epoch": 1095} {"train_loss": -21.698843002319336, "global_step": 90906, "epoch": 1095} {"train_loss": -21.7803955078125, "global_step": 90907, "epoch": 1095} {"train_loss": -21.560075759887695, "global_step": 90908, "epoch": 1095} {"train_loss": -21.480606079101562, "global_step": 90909, "epoch": 1095} {"train_loss": -21.744688034057617, "global_step": 90910, "epoch": 1095} {"train_loss": -22.032323837280273, "global_step": 90911, "epoch": 1095} {"train_loss": -21.668180465698242, "global_step": 90912, "epoch": 1095} {"train_loss": -21.43350601196289, "global_step": 90913, "epoch": 1095} {"train_loss": -21.719715118408203, "global_step": 90914, "epoch": 1095} {"train_loss": -21.509531021118164, "global_step": 90915, "epoch": 1095} {"train_loss": -21.62872886657715, "global_step": 90916, "epoch": 1095} {"train_loss": -21.29941749572754, "global_step": 90917, "epoch": 1095} {"train_loss": -21.852401733398438, "global_step": 90918, "epoch": 1095} {"train_loss": -21.296789169311523, "global_step": 90919, "epoch": 1095} {"train_loss": -21.60353660583496, "global_step": 90920, "epoch": 1095} {"train_loss": -21.762836456298828, "global_step": 90921, "epoch": 1095} {"train_loss": -21.58724021911621, "global_step": 90922, "epoch": 1095} {"train_loss": -21.696744918823242, "global_step": 90923, "epoch": 1095} {"train_loss": -21.95490837097168, "global_step": 90924, "epoch": 1095} {"train_loss": -21.54867172241211, "global_step": 90925, "epoch": 1095} {"train_loss": -21.585203170776367, "global_step": 90926, "epoch": 1095} {"train_loss": -22.1004581451416, "global_step": 90927, "epoch": 1095} {"train_loss": -21.6020565032959, "global_step": 90928, "epoch": 1095} {"train_loss": -21.546159744262695, "global_step": 90929, "epoch": 1095} {"train_loss": -21.653661727905273, "global_step": 90930, "epoch": 1095} {"train_loss": -21.50287437438965, "global_step": 90931, "epoch": 1095} {"train_loss": -21.619592666625977, "global_step": 90932, "epoch": 1095} {"train_loss": -21.15273666381836, "global_step": 90933, "epoch": 1095} {"train_loss": -22.028579711914062, "global_step": 90934, "epoch": 1095} {"train_loss": -21.307165145874023, "global_step": 90935, "epoch": 1095} {"train_loss": -21.655248641967773, "global_step": 90936, "epoch": 1095} {"train_loss": -21.647354125976562, "global_step": 90937, "epoch": 1095} {"train_loss": -21.551206588745117, "global_step": 90938, "epoch": 1095} {"train_loss": -21.4682559967041, "global_step": 90939, "epoch": 1095} {"train_loss": -21.571308135986328, "global_step": 90940, "epoch": 1095} {"train_loss": -21.52825164794922, "global_step": 90941, "epoch": 1095} {"train_loss": -21.465192794799805, "global_step": 90942, "epoch": 1095} {"train_loss": -21.776952743530273, "global_step": 90943, "epoch": 1095} {"train_loss": -21.317472457885742, "global_step": 90944, "epoch": 1095} {"train_loss": -21.512910842895508, "global_step": 90945, "epoch": 1095} {"train_loss": -21.72434425354004, "global_step": 90946, "epoch": 1095} {"train_loss": -21.85100746154785, "global_step": 90947, "epoch": 1095} {"train_loss": -21.58656883239746, "global_step": 90948, "epoch": 1095} {"train_loss": -21.330358505249023, "global_step": 90949, "epoch": 1095} {"train_loss": -21.350980758666992, "global_step": 90950, "epoch": 1095} {"train_loss": -21.649293899536133, "global_step": 90951, "epoch": 1095} {"train_loss": -21.53645896911621, "global_step": 90952, "epoch": 1095} {"train_loss": -21.707862854003906, "global_step": 90953, "epoch": 1095} {"train_loss": -21.44074821472168, "global_step": 90954, "epoch": 1095} {"train_loss": -21.61704444885254, "global_step": 90955, "epoch": 1095} {"train_loss": -21.845279693603516, "global_step": 90956, "epoch": 1095} {"train_loss": -21.324100494384766, "global_step": 90957, "epoch": 1095} {"train_loss": -21.411197662353516, "global_step": 90958, "epoch": 1095} {"train_loss": -22.08452606201172, "global_step": 90959, "epoch": 1095} {"train_loss": -21.247411727905273, "global_step": 90960, "epoch": 1095} {"train_loss": -21.47854995727539, "global_step": 90961, "epoch": 1095} {"train_loss": -21.844423294067383, "global_step": 90962, "epoch": 1095} {"train_loss": -21.52322006225586, "global_step": 90963, "epoch": 1095} {"train_loss": -21.465721130371094, "global_step": 90964, "epoch": 1095} {"train_loss": -21.553945541381836, "global_step": 90965, "epoch": 1095} {"train_loss": -21.517086029052734, "global_step": 90966, "epoch": 1095} {"train_loss": -21.57756931810494, "global_step": 90967, "epoch": 1095, "val_loss": 6153282.5} {"train_loss": -20.798534393310547, "global_step": 90968, "epoch": 1096} {"train_loss": -21.5669002532959, "global_step": 90969, "epoch": 1096} {"train_loss": -20.798242568969727, "global_step": 90970, "epoch": 1096} {"train_loss": -21.131006240844727, "global_step": 90971, "epoch": 1096} {"train_loss": -21.43279266357422, "global_step": 90972, "epoch": 1096} {"train_loss": -21.506633758544922, "global_step": 90973, "epoch": 1096} {"train_loss": -21.27083969116211, "global_step": 90974, "epoch": 1096} {"train_loss": -21.308029174804688, "global_step": 90975, "epoch": 1096} {"train_loss": -21.23176383972168, "global_step": 90976, "epoch": 1096} {"train_loss": -21.40396499633789, "global_step": 90977, "epoch": 1096} {"train_loss": -21.31609535217285, "global_step": 90978, "epoch": 1096} {"train_loss": -21.432727813720703, "global_step": 90979, "epoch": 1096} {"train_loss": -21.76386833190918, "global_step": 90980, "epoch": 1096} {"train_loss": -21.46392250061035, "global_step": 90981, "epoch": 1096} {"train_loss": -21.445341110229492, "global_step": 90982, "epoch": 1096} {"train_loss": -21.51773452758789, "global_step": 90983, "epoch": 1096} {"train_loss": -21.497474670410156, "global_step": 90984, "epoch": 1096} {"train_loss": -21.664228439331055, "global_step": 90985, "epoch": 1096} {"train_loss": -21.40313720703125, "global_step": 90986, "epoch": 1096} {"train_loss": -21.714492797851562, "global_step": 90987, "epoch": 1096} {"train_loss": -21.77608299255371, "global_step": 90988, "epoch": 1096} {"train_loss": -21.003910064697266, "global_step": 90989, "epoch": 1096} {"train_loss": -21.708738327026367, "global_step": 90990, "epoch": 1096} {"train_loss": -21.039987564086914, "global_step": 90991, "epoch": 1096} {"train_loss": -21.04042625427246, "global_step": 90992, "epoch": 1096} {"train_loss": -21.441150665283203, "global_step": 90993, "epoch": 1096} {"train_loss": -21.498258590698242, "global_step": 90994, "epoch": 1096} {"train_loss": -21.77015495300293, "global_step": 90995, "epoch": 1096} {"train_loss": -21.565311431884766, "global_step": 90996, "epoch": 1096} {"train_loss": -21.546781539916992, "global_step": 90997, "epoch": 1096} {"train_loss": -21.340164184570312, "global_step": 90998, "epoch": 1096} {"train_loss": -21.205244064331055, "global_step": 90999, "epoch": 1096} {"train_loss": -21.684057235717773, "global_step": 91000, "epoch": 1096} {"train_loss": -21.72126007080078, "global_step": 91001, "epoch": 1096} {"train_loss": -21.52289581298828, "global_step": 91002, "epoch": 1096} {"train_loss": -21.712902069091797, "global_step": 91003, "epoch": 1096} {"train_loss": -21.82893180847168, "global_step": 91004, "epoch": 1096} {"train_loss": -21.344011306762695, "global_step": 91005, "epoch": 1096} {"train_loss": -21.575580596923828, "global_step": 91006, "epoch": 1096} {"train_loss": -21.60455894470215, "global_step": 91007, "epoch": 1096} {"train_loss": -21.657941818237305, "global_step": 91008, "epoch": 1096} {"train_loss": -22.002668380737305, "global_step": 91009, "epoch": 1096} {"train_loss": -21.688100814819336, "global_step": 91010, "epoch": 1096} {"train_loss": -21.419897079467773, "global_step": 91011, "epoch": 1096} {"train_loss": -21.824310302734375, "global_step": 91012, "epoch": 1096} {"train_loss": -21.694334030151367, "global_step": 91013, "epoch": 1096} {"train_loss": -21.471603393554688, "global_step": 91014, "epoch": 1096} {"train_loss": -21.7283992767334, "global_step": 91015, "epoch": 1096} {"train_loss": -21.748197555541992, "global_step": 91016, "epoch": 1096} {"train_loss": -21.574026107788086, "global_step": 91017, "epoch": 1096} {"train_loss": -21.710424423217773, "global_step": 91018, "epoch": 1096} {"train_loss": -21.591903686523438, "global_step": 91019, "epoch": 1096} {"train_loss": -21.77284812927246, "global_step": 91020, "epoch": 1096} {"train_loss": -21.66664695739746, "global_step": 91021, "epoch": 1096} {"train_loss": -21.696914672851562, "global_step": 91022, "epoch": 1096} {"train_loss": -21.566255569458008, "global_step": 91023, "epoch": 1096} {"train_loss": -21.88228988647461, "global_step": 91024, "epoch": 1096} {"train_loss": -21.50710105895996, "global_step": 91025, "epoch": 1096} {"train_loss": -21.519033432006836, "global_step": 91026, "epoch": 1096} {"train_loss": -22.009809494018555, "global_step": 91027, "epoch": 1096} {"train_loss": -21.502782821655273, "global_step": 91028, "epoch": 1096} {"train_loss": -21.549062728881836, "global_step": 91029, "epoch": 1096} {"train_loss": -21.95699119567871, "global_step": 91030, "epoch": 1096} {"train_loss": -21.934860229492188, "global_step": 91031, "epoch": 1096} {"train_loss": -21.691068649291992, "global_step": 91032, "epoch": 1096} {"train_loss": -21.29207420349121, "global_step": 91033, "epoch": 1096} {"train_loss": -21.47255516052246, "global_step": 91034, "epoch": 1096} {"train_loss": -21.53691864013672, "global_step": 91035, "epoch": 1096} {"train_loss": -21.49249839782715, "global_step": 91036, "epoch": 1096} {"train_loss": -21.40478515625, "global_step": 91037, "epoch": 1096} {"train_loss": -21.665388107299805, "global_step": 91038, "epoch": 1096} {"train_loss": -21.5986328125, "global_step": 91039, "epoch": 1096} {"train_loss": -21.46710968017578, "global_step": 91040, "epoch": 1096} {"train_loss": -21.85817527770996, "global_step": 91041, "epoch": 1096} {"train_loss": -21.574308395385742, "global_step": 91042, "epoch": 1096} {"train_loss": -22.02047348022461, "global_step": 91043, "epoch": 1096} {"train_loss": -21.571414947509766, "global_step": 91044, "epoch": 1096} {"train_loss": -21.681852340698242, "global_step": 91045, "epoch": 1096} {"train_loss": -21.567319869995117, "global_step": 91046, "epoch": 1096} {"train_loss": -21.335546493530273, "global_step": 91047, "epoch": 1096} {"train_loss": -21.602476119995117, "global_step": 91048, "epoch": 1096} {"train_loss": -21.6602840423584, "global_step": 91049, "epoch": 1096} {"train_loss": -21.539397641836878, "global_step": 91050, "epoch": 1096, "val_loss": 6275042.0} {"train_loss": -21.224328994750977, "global_step": 91051, "epoch": 1097} {"train_loss": -21.4937744140625, "global_step": 91052, "epoch": 1097} {"train_loss": -21.265701293945312, "global_step": 91053, "epoch": 1097} {"train_loss": -21.113876342773438, "global_step": 91054, "epoch": 1097} {"train_loss": -21.07874870300293, "global_step": 91055, "epoch": 1097} {"train_loss": -21.275907516479492, "global_step": 91056, "epoch": 1097} {"train_loss": -21.09274673461914, "global_step": 91057, "epoch": 1097} {"train_loss": -21.425579071044922, "global_step": 91058, "epoch": 1097} {"train_loss": -21.64310073852539, "global_step": 91059, "epoch": 1097} {"train_loss": -21.707275390625, "global_step": 91060, "epoch": 1097} {"train_loss": -21.523523330688477, "global_step": 91061, "epoch": 1097} {"train_loss": -21.37528419494629, "global_step": 91062, "epoch": 1097} {"train_loss": -21.2742977142334, "global_step": 91063, "epoch": 1097} {"train_loss": -21.75452423095703, "global_step": 91064, "epoch": 1097} {"train_loss": -21.400318145751953, "global_step": 91065, "epoch": 1097} {"train_loss": -21.654293060302734, "global_step": 91066, "epoch": 1097} {"train_loss": -21.58201026916504, "global_step": 91067, "epoch": 1097} {"train_loss": -21.860641479492188, "global_step": 91068, "epoch": 1097} {"train_loss": -21.710155487060547, "global_step": 91069, "epoch": 1097} {"train_loss": -21.553516387939453, "global_step": 91070, "epoch": 1097} {"train_loss": -21.4191951751709, "global_step": 91071, "epoch": 1097} {"train_loss": -21.457304000854492, "global_step": 91072, "epoch": 1097} {"train_loss": -21.39559555053711, "global_step": 91073, "epoch": 1097} {"train_loss": -21.61990737915039, "global_step": 91074, "epoch": 1097} {"train_loss": -21.393646240234375, "global_step": 91075, "epoch": 1097} {"train_loss": -21.144824981689453, "global_step": 91076, "epoch": 1097} {"train_loss": -21.428354263305664, "global_step": 91077, "epoch": 1097} {"train_loss": -21.336029052734375, "global_step": 91078, "epoch": 1097} {"train_loss": -22.017309188842773, "global_step": 91079, "epoch": 1097} {"train_loss": -21.252864837646484, "global_step": 91080, "epoch": 1097} {"train_loss": -21.383499145507812, "global_step": 91081, "epoch": 1097} {"train_loss": -21.46370506286621, "global_step": 91082, "epoch": 1097} {"train_loss": -21.881669998168945, "global_step": 91083, "epoch": 1097} {"train_loss": -21.423816680908203, "global_step": 91084, "epoch": 1097} {"train_loss": -21.63228416442871, "global_step": 91085, "epoch": 1097} {"train_loss": -21.4989070892334, "global_step": 91086, "epoch": 1097} {"train_loss": -21.453405380249023, "global_step": 91087, "epoch": 1097} {"train_loss": -21.90346336364746, "global_step": 91088, "epoch": 1097} {"train_loss": -21.556238174438477, "global_step": 91089, "epoch": 1097} {"train_loss": -21.547069549560547, "global_step": 91090, "epoch": 1097} {"train_loss": -21.625015258789062, "global_step": 91091, "epoch": 1097} {"train_loss": -21.46384620666504, "global_step": 91092, "epoch": 1097} {"train_loss": -21.472339630126953, "global_step": 91093, "epoch": 1097} {"train_loss": -21.681812286376953, "global_step": 91094, "epoch": 1097} {"train_loss": -21.485652923583984, "global_step": 91095, "epoch": 1097} {"train_loss": -21.41714859008789, "global_step": 91096, "epoch": 1097} {"train_loss": -21.78508186340332, "global_step": 91097, "epoch": 1097} {"train_loss": -21.315465927124023, "global_step": 91098, "epoch": 1097} {"train_loss": -21.585302352905273, "global_step": 91099, "epoch": 1097} {"train_loss": -21.652462005615234, "global_step": 91100, "epoch": 1097} {"train_loss": -21.713886260986328, "global_step": 91101, "epoch": 1097} {"train_loss": -21.953351974487305, "global_step": 91102, "epoch": 1097} {"train_loss": -21.4267520904541, "global_step": 91103, "epoch": 1097} {"train_loss": -21.79547691345215, "global_step": 91104, "epoch": 1097} {"train_loss": -21.909997940063477, "global_step": 91105, "epoch": 1097} {"train_loss": -21.836341857910156, "global_step": 91106, "epoch": 1097} {"train_loss": -21.96295738220215, "global_step": 91107, "epoch": 1097} {"train_loss": -21.684995651245117, "global_step": 91108, "epoch": 1097} {"train_loss": -21.40892791748047, "global_step": 91109, "epoch": 1097} {"train_loss": -21.715675354003906, "global_step": 91110, "epoch": 1097} {"train_loss": -22.03749656677246, "global_step": 91111, "epoch": 1097} {"train_loss": -21.559215545654297, "global_step": 91112, "epoch": 1097} {"train_loss": -21.81769371032715, "global_step": 91113, "epoch": 1097} {"train_loss": -21.718669891357422, "global_step": 91114, "epoch": 1097} {"train_loss": -21.80514144897461, "global_step": 91115, "epoch": 1097} {"train_loss": -21.509723663330078, "global_step": 91116, "epoch": 1097} {"train_loss": -21.722110748291016, "global_step": 91117, "epoch": 1097} {"train_loss": -21.551801681518555, "global_step": 91118, "epoch": 1097} {"train_loss": -21.700607299804688, "global_step": 91119, "epoch": 1097} {"train_loss": -21.64301872253418, "global_step": 91120, "epoch": 1097} {"train_loss": -21.854970932006836, "global_step": 91121, "epoch": 1097} {"train_loss": -21.907743453979492, "global_step": 91122, "epoch": 1097} {"train_loss": -21.900405883789062, "global_step": 91123, "epoch": 1097} {"train_loss": -21.810474395751953, "global_step": 91124, "epoch": 1097} {"train_loss": -22.004968643188477, "global_step": 91125, "epoch": 1097} {"train_loss": -21.665464401245117, "global_step": 91126, "epoch": 1097} {"train_loss": -21.732227325439453, "global_step": 91127, "epoch": 1097} {"train_loss": -21.669605255126953, "global_step": 91128, "epoch": 1097} {"train_loss": -21.584136962890625, "global_step": 91129, "epoch": 1097} {"train_loss": -21.853107452392578, "global_step": 91130, "epoch": 1097} {"train_loss": -21.824857711791992, "global_step": 91131, "epoch": 1097} {"train_loss": -21.75978660583496, "global_step": 91132, "epoch": 1097} {"train_loss": -21.620426614600493, "global_step": 91133, "epoch": 1097, "val_loss": 6098111.0} {"train_loss": -20.781003952026367, "global_step": 91134, "epoch": 1098} {"train_loss": -21.928298950195312, "global_step": 91135, "epoch": 1098} {"train_loss": -20.63054084777832, "global_step": 91136, "epoch": 1098} {"train_loss": -21.24496841430664, "global_step": 91137, "epoch": 1098} {"train_loss": -21.193607330322266, "global_step": 91138, "epoch": 1098} {"train_loss": -21.541078567504883, "global_step": 91139, "epoch": 1098} {"train_loss": -20.849197387695312, "global_step": 91140, "epoch": 1098} {"train_loss": -21.260435104370117, "global_step": 91141, "epoch": 1098} {"train_loss": -21.59200096130371, "global_step": 91142, "epoch": 1098} {"train_loss": -21.342344284057617, "global_step": 91143, "epoch": 1098} {"train_loss": -21.364564895629883, "global_step": 91144, "epoch": 1098} {"train_loss": -21.51265525817871, "global_step": 91145, "epoch": 1098} {"train_loss": -21.129003524780273, "global_step": 91146, "epoch": 1098} {"train_loss": -21.301055908203125, "global_step": 91147, "epoch": 1098} {"train_loss": -21.54048728942871, "global_step": 91148, "epoch": 1098} {"train_loss": -21.396039962768555, "global_step": 91149, "epoch": 1098} {"train_loss": -21.187955856323242, "global_step": 91150, "epoch": 1098} {"train_loss": -21.43548583984375, "global_step": 91151, "epoch": 1098} {"train_loss": -21.838895797729492, "global_step": 91152, "epoch": 1098} {"train_loss": -21.582386016845703, "global_step": 91153, "epoch": 1098} {"train_loss": -21.642148971557617, "global_step": 91154, "epoch": 1098} {"train_loss": -21.389286041259766, "global_step": 91155, "epoch": 1098} {"train_loss": -21.471790313720703, "global_step": 91156, "epoch": 1098} {"train_loss": -21.6070499420166, "global_step": 91157, "epoch": 1098} {"train_loss": -21.720144271850586, "global_step": 91158, "epoch": 1098} {"train_loss": -21.169715881347656, "global_step": 91159, "epoch": 1098} {"train_loss": -21.62929344177246, "global_step": 91160, "epoch": 1098} {"train_loss": -21.65804100036621, "global_step": 91161, "epoch": 1098} {"train_loss": -21.351951599121094, "global_step": 91162, "epoch": 1098} {"train_loss": -21.482318878173828, "global_step": 91163, "epoch": 1098} {"train_loss": -21.5842342376709, "global_step": 91164, "epoch": 1098} {"train_loss": -21.549938201904297, "global_step": 91165, "epoch": 1098} {"train_loss": -21.47501564025879, "global_step": 91166, "epoch": 1098} {"train_loss": -21.74241065979004, "global_step": 91167, "epoch": 1098} {"train_loss": -21.356199264526367, "global_step": 91168, "epoch": 1098} {"train_loss": -21.694211959838867, "global_step": 91169, "epoch": 1098} {"train_loss": -21.37991714477539, "global_step": 91170, "epoch": 1098} {"train_loss": -21.22344207763672, "global_step": 91171, "epoch": 1098} {"train_loss": -21.589141845703125, "global_step": 91172, "epoch": 1098} {"train_loss": -21.321020126342773, "global_step": 91173, "epoch": 1098} {"train_loss": -21.730777740478516, "global_step": 91174, "epoch": 1098} {"train_loss": -21.442493438720703, "global_step": 91175, "epoch": 1098} {"train_loss": -21.429149627685547, "global_step": 91176, "epoch": 1098} {"train_loss": -21.91391372680664, "global_step": 91177, "epoch": 1098} {"train_loss": -21.564756393432617, "global_step": 91178, "epoch": 1098} {"train_loss": -21.11321449279785, "global_step": 91179, "epoch": 1098} {"train_loss": -21.37282371520996, "global_step": 91180, "epoch": 1098} {"train_loss": -21.534177780151367, "global_step": 91181, "epoch": 1098} {"train_loss": -21.521268844604492, "global_step": 91182, "epoch": 1098} {"train_loss": -21.73565101623535, "global_step": 91183, "epoch": 1098} {"train_loss": -21.972349166870117, "global_step": 91184, "epoch": 1098} {"train_loss": -21.39764976501465, "global_step": 91185, "epoch": 1098} {"train_loss": -21.549081802368164, "global_step": 91186, "epoch": 1098} {"train_loss": -21.719301223754883, "global_step": 91187, "epoch": 1098} {"train_loss": -21.871301651000977, "global_step": 91188, "epoch": 1098} {"train_loss": -21.75850486755371, "global_step": 91189, "epoch": 1098} {"train_loss": -21.68378448486328, "global_step": 91190, "epoch": 1098} {"train_loss": -21.544919967651367, "global_step": 91191, "epoch": 1098} {"train_loss": -21.26698875427246, "global_step": 91192, "epoch": 1098} {"train_loss": -21.74770164489746, "global_step": 91193, "epoch": 1098} {"train_loss": -21.608312606811523, "global_step": 91194, "epoch": 1098} {"train_loss": -21.982568740844727, "global_step": 91195, "epoch": 1098} {"train_loss": -21.771392822265625, "global_step": 91196, "epoch": 1098} {"train_loss": -21.524572372436523, "global_step": 91197, "epoch": 1098} {"train_loss": -21.477441787719727, "global_step": 91198, "epoch": 1098} {"train_loss": -22.133275985717773, "global_step": 91199, "epoch": 1098} {"train_loss": -21.806241989135742, "global_step": 91200, "epoch": 1098} {"train_loss": -21.902578353881836, "global_step": 91201, "epoch": 1098} {"train_loss": -21.768707275390625, "global_step": 91202, "epoch": 1098} {"train_loss": -21.747146606445312, "global_step": 91203, "epoch": 1098} {"train_loss": -21.599185943603516, "global_step": 91204, "epoch": 1098} {"train_loss": -21.972370147705078, "global_step": 91205, "epoch": 1098} {"train_loss": -21.2762393951416, "global_step": 91206, "epoch": 1098} {"train_loss": -21.45302391052246, "global_step": 91207, "epoch": 1098} {"train_loss": -21.568836212158203, "global_step": 91208, "epoch": 1098} {"train_loss": -21.61591339111328, "global_step": 91209, "epoch": 1098} {"train_loss": -21.707529067993164, "global_step": 91210, "epoch": 1098} {"train_loss": -21.131004333496094, "global_step": 91211, "epoch": 1098} {"train_loss": -21.220930099487305, "global_step": 91212, "epoch": 1098} {"train_loss": -21.769384384155273, "global_step": 91213, "epoch": 1098} {"train_loss": -21.135498046875, "global_step": 91214, "epoch": 1098} {"train_loss": -21.491506576538086, "global_step": 91215, "epoch": 1098} {"train_loss": -21.511852425265026, "global_step": 91216, "epoch": 1098, "val_loss": 6014222.0} {"train_loss": -19.624380111694336, "global_step": 91217, "epoch": 1099} {"train_loss": -20.926862716674805, "global_step": 91218, "epoch": 1099} {"train_loss": -20.46791648864746, "global_step": 91219, "epoch": 1099} {"train_loss": -20.61124038696289, "global_step": 91220, "epoch": 1099} {"train_loss": -20.464136123657227, "global_step": 91221, "epoch": 1099} {"train_loss": -20.57790184020996, "global_step": 91222, "epoch": 1099} {"train_loss": -20.71626091003418, "global_step": 91223, "epoch": 1099} {"train_loss": -20.705121994018555, "global_step": 91224, "epoch": 1099} {"train_loss": -20.704843521118164, "global_step": 91225, "epoch": 1099} {"train_loss": -20.826513290405273, "global_step": 91226, "epoch": 1099} {"train_loss": -20.802566528320312, "global_step": 91227, "epoch": 1099} {"train_loss": -21.30351448059082, "global_step": 91228, "epoch": 1099} {"train_loss": -20.62310791015625, "global_step": 91229, "epoch": 1099} {"train_loss": -20.8339900970459, "global_step": 91230, "epoch": 1099} {"train_loss": -21.067033767700195, "global_step": 91231, "epoch": 1099} {"train_loss": -21.80735969543457, "global_step": 91232, "epoch": 1099} {"train_loss": -20.90639305114746, "global_step": 91233, "epoch": 1099} {"train_loss": -21.380807876586914, "global_step": 91234, "epoch": 1099} {"train_loss": -21.177534103393555, "global_step": 91235, "epoch": 1099} {"train_loss": -20.919544219970703, "global_step": 91236, "epoch": 1099} {"train_loss": -21.37579917907715, "global_step": 91237, "epoch": 1099} {"train_loss": -21.302310943603516, "global_step": 91238, "epoch": 1099} {"train_loss": -20.942373275756836, "global_step": 91239, "epoch": 1099} {"train_loss": -21.37900733947754, "global_step": 91240, "epoch": 1099} {"train_loss": -21.30607032775879, "global_step": 91241, "epoch": 1099} {"train_loss": -21.169050216674805, "global_step": 91242, "epoch": 1099} {"train_loss": -21.511062622070312, "global_step": 91243, "epoch": 1099} {"train_loss": -21.269834518432617, "global_step": 91244, "epoch": 1099} {"train_loss": -21.43535041809082, "global_step": 91245, "epoch": 1099} {"train_loss": -21.63359260559082, "global_step": 91246, "epoch": 1099} {"train_loss": -21.613906860351562, "global_step": 91247, "epoch": 1099} {"train_loss": -21.484832763671875, "global_step": 91248, "epoch": 1099} {"train_loss": -21.4805908203125, "global_step": 91249, "epoch": 1099} {"train_loss": -21.816267013549805, "global_step": 91250, "epoch": 1099} {"train_loss": -21.64613151550293, "global_step": 91251, "epoch": 1099} {"train_loss": -21.503883361816406, "global_step": 91252, "epoch": 1099} {"train_loss": -21.31905746459961, "global_step": 91253, "epoch": 1099} {"train_loss": -21.679439544677734, "global_step": 91254, "epoch": 1099} {"train_loss": -21.6870174407959, "global_step": 91255, "epoch": 1099} {"train_loss": -21.596792221069336, "global_step": 91256, "epoch": 1099} {"train_loss": -21.51753807067871, "global_step": 91257, "epoch": 1099} {"train_loss": -21.3504638671875, "global_step": 91258, "epoch": 1099} {"train_loss": -21.630184173583984, "global_step": 91259, "epoch": 1099} {"train_loss": -21.505537033081055, "global_step": 91260, "epoch": 1099} {"train_loss": -21.911569595336914, "global_step": 91261, "epoch": 1099} {"train_loss": -21.92081642150879, "global_step": 91262, "epoch": 1099} {"train_loss": -21.939380645751953, "global_step": 91263, "epoch": 1099} {"train_loss": -21.879911422729492, "global_step": 91264, "epoch": 1099} {"train_loss": -21.67180824279785, "global_step": 91265, "epoch": 1099} {"train_loss": -21.924863815307617, "global_step": 91266, "epoch": 1099} {"train_loss": -21.63031005859375, "global_step": 91267, "epoch": 1099} {"train_loss": -21.174131393432617, "global_step": 91268, "epoch": 1099} {"train_loss": -22.054920196533203, "global_step": 91269, "epoch": 1099} {"train_loss": -21.854190826416016, "global_step": 91270, "epoch": 1099} {"train_loss": -21.41971206665039, "global_step": 91271, "epoch": 1099} {"train_loss": -21.670236587524414, "global_step": 91272, "epoch": 1099} {"train_loss": -21.98189926147461, "global_step": 91273, "epoch": 1099} {"train_loss": -21.407669067382812, "global_step": 91274, "epoch": 1099} {"train_loss": -21.77489471435547, "global_step": 91275, "epoch": 1099} {"train_loss": -21.573747634887695, "global_step": 91276, "epoch": 1099} {"train_loss": -21.50653076171875, "global_step": 91277, "epoch": 1099} {"train_loss": -21.383670806884766, "global_step": 91278, "epoch": 1099} {"train_loss": -21.712446212768555, "global_step": 91279, "epoch": 1099} {"train_loss": -21.957021713256836, "global_step": 91280, "epoch": 1099} {"train_loss": -21.651906967163086, "global_step": 91281, "epoch": 1099} {"train_loss": -21.904775619506836, "global_step": 91282, "epoch": 1099} {"train_loss": -21.495635986328125, "global_step": 91283, "epoch": 1099} {"train_loss": -21.730539321899414, "global_step": 91284, "epoch": 1099} {"train_loss": -21.71790885925293, "global_step": 91285, "epoch": 1099} {"train_loss": -21.2272891998291, "global_step": 91286, "epoch": 1099} {"train_loss": -21.602664947509766, "global_step": 91287, "epoch": 1099} {"train_loss": -21.608503341674805, "global_step": 91288, "epoch": 1099} {"train_loss": -21.776395797729492, "global_step": 91289, "epoch": 1099} {"train_loss": -21.329999923706055, "global_step": 91290, "epoch": 1099} {"train_loss": -21.753864288330078, "global_step": 91291, "epoch": 1099} {"train_loss": -21.4383602142334, "global_step": 91292, "epoch": 1099} {"train_loss": -21.172496795654297, "global_step": 91293, "epoch": 1099} {"train_loss": -21.503849029541016, "global_step": 91294, "epoch": 1099} {"train_loss": -21.544782638549805, "global_step": 91295, "epoch": 1099} {"train_loss": -21.72293472290039, "global_step": 91296, "epoch": 1099} {"train_loss": -21.44202995300293, "global_step": 91297, "epoch": 1099} {"train_loss": -21.27479362487793, "global_step": 91298, "epoch": 1099} {"train_loss": -21.39344017764172, "global_step": 91299, "epoch": 1099, "val_loss": 6134512.0} {"train_loss": -21.01852798461914, "global_step": 91300, "epoch": 1100} {"train_loss": -21.40275764465332, "global_step": 91301, "epoch": 1100} {"train_loss": -21.33880615234375, "global_step": 91302, "epoch": 1100} {"train_loss": -20.90642738342285, "global_step": 91303, "epoch": 1100} {"train_loss": -21.04964256286621, "global_step": 91304, "epoch": 1100} {"train_loss": -21.352277755737305, "global_step": 91305, "epoch": 1100} {"train_loss": -21.327228546142578, "global_step": 91306, "epoch": 1100} {"train_loss": -21.54660415649414, "global_step": 91307, "epoch": 1100} {"train_loss": -21.492347717285156, "global_step": 91308, "epoch": 1100} {"train_loss": -21.28834342956543, "global_step": 91309, "epoch": 1100} {"train_loss": -21.306528091430664, "global_step": 91310, "epoch": 1100} {"train_loss": -21.905370712280273, "global_step": 91311, "epoch": 1100} {"train_loss": -21.63528823852539, "global_step": 91312, "epoch": 1100} {"train_loss": -21.55584716796875, "global_step": 91313, "epoch": 1100} {"train_loss": -21.26801872253418, "global_step": 91314, "epoch": 1100} {"train_loss": -21.575048446655273, "global_step": 91315, "epoch": 1100} {"train_loss": -21.425281524658203, "global_step": 91316, "epoch": 1100} {"train_loss": -21.4842529296875, "global_step": 91317, "epoch": 1100} {"train_loss": -21.242460250854492, "global_step": 91318, "epoch": 1100} {"train_loss": -21.244138717651367, "global_step": 91319, "epoch": 1100} {"train_loss": -21.89811897277832, "global_step": 91320, "epoch": 1100} {"train_loss": -21.440820693969727, "global_step": 91321, "epoch": 1100} {"train_loss": -21.413667678833008, "global_step": 91322, "epoch": 1100} {"train_loss": -21.419126510620117, "global_step": 91323, "epoch": 1100} {"train_loss": -21.664167404174805, "global_step": 91324, "epoch": 1100} {"train_loss": -21.420385360717773, "global_step": 91325, "epoch": 1100} {"train_loss": -21.63411521911621, "global_step": 91326, "epoch": 1100} {"train_loss": -21.905841827392578, "global_step": 91327, "epoch": 1100} {"train_loss": -21.61008071899414, "global_step": 91328, "epoch": 1100} {"train_loss": -21.292701721191406, "global_step": 91329, "epoch": 1100} {"train_loss": -21.992219924926758, "global_step": 91330, "epoch": 1100} {"train_loss": -21.399106979370117, "global_step": 91331, "epoch": 1100} {"train_loss": -21.636859893798828, "global_step": 91332, "epoch": 1100} {"train_loss": -21.501195907592773, "global_step": 91333, "epoch": 1100} {"train_loss": -21.610641479492188, "global_step": 91334, "epoch": 1100} {"train_loss": -21.515111923217773, "global_step": 91335, "epoch": 1100} {"train_loss": -21.733322143554688, "global_step": 91336, "epoch": 1100} {"train_loss": -21.47235679626465, "global_step": 91337, "epoch": 1100} {"train_loss": -21.731821060180664, "global_step": 91338, "epoch": 1100} {"train_loss": -21.646345138549805, "global_step": 91339, "epoch": 1100} {"train_loss": -21.81048011779785, "global_step": 91340, "epoch": 1100} {"train_loss": -21.71518898010254, "global_step": 91341, "epoch": 1100} {"train_loss": -21.345834732055664, "global_step": 91342, "epoch": 1100} {"train_loss": -21.73291015625, "global_step": 91343, "epoch": 1100} {"train_loss": -21.34174919128418, "global_step": 91344, "epoch": 1100} {"train_loss": -21.983789443969727, "global_step": 91345, "epoch": 1100} {"train_loss": -21.738189697265625, "global_step": 91346, "epoch": 1100} {"train_loss": -21.911758422851562, "global_step": 91347, "epoch": 1100} {"train_loss": -21.625974655151367, "global_step": 91348, "epoch": 1100} {"train_loss": -22.034170150756836, "global_step": 91349, "epoch": 1100} {"train_loss": -21.63075065612793, "global_step": 91350, "epoch": 1100} {"train_loss": -21.527984619140625, "global_step": 91351, "epoch": 1100} {"train_loss": -21.53447151184082, "global_step": 91352, "epoch": 1100} {"train_loss": -21.502588272094727, "global_step": 91353, "epoch": 1100} {"train_loss": -21.75439453125, "global_step": 91354, "epoch": 1100} {"train_loss": -21.680627822875977, "global_step": 91355, "epoch": 1100} {"train_loss": -21.468263626098633, "global_step": 91356, "epoch": 1100} {"train_loss": -22.116376876831055, "global_step": 91357, "epoch": 1100} {"train_loss": -21.741010665893555, "global_step": 91358, "epoch": 1100} {"train_loss": -21.671268463134766, "global_step": 91359, "epoch": 1100} {"train_loss": -21.860729217529297, "global_step": 91360, "epoch": 1100} {"train_loss": -21.62858772277832, "global_step": 91361, "epoch": 1100} {"train_loss": -21.80141258239746, "global_step": 91362, "epoch": 1100} {"train_loss": -21.773893356323242, "global_step": 91363, "epoch": 1100} {"train_loss": -22.003936767578125, "global_step": 91364, "epoch": 1100} {"train_loss": -21.407367706298828, "global_step": 91365, "epoch": 1100} {"train_loss": -21.66438865661621, "global_step": 91366, "epoch": 1100} {"train_loss": -21.67293357849121, "global_step": 91367, "epoch": 1100} {"train_loss": -21.21596336364746, "global_step": 91368, "epoch": 1100} {"train_loss": -21.76798439025879, "global_step": 91369, "epoch": 1100} {"train_loss": -21.714447021484375, "global_step": 91370, "epoch": 1100} {"train_loss": -21.563955307006836, "global_step": 91371, "epoch": 1100} {"train_loss": -21.778478622436523, "global_step": 91372, "epoch": 1100} {"train_loss": -21.768985748291016, "global_step": 91373, "epoch": 1100} {"train_loss": -21.664915084838867, "global_step": 91374, "epoch": 1100} {"train_loss": -21.568056106567383, "global_step": 91375, "epoch": 1100} {"train_loss": -21.84871482849121, "global_step": 91376, "epoch": 1100} {"train_loss": -21.74957847595215, "global_step": 91377, "epoch": 1100} {"train_loss": -21.823959350585938, "global_step": 91378, "epoch": 1100} {"train_loss": -21.86306381225586, "global_step": 91379, "epoch": 1100} {"train_loss": -21.503965377807617, "global_step": 91380, "epoch": 1100} {"train_loss": -21.673063278198242, "global_step": 91381, "epoch": 1100} {"train_loss": -21.59333994302405, "global_step": 91382, "epoch": 1100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6492215.0} {"train_loss": -21.039138793945312, "global_step": 91383, "epoch": 1101} {"train_loss": -21.165658950805664, "global_step": 91384, "epoch": 1101} {"train_loss": -21.56056022644043, "global_step": 91385, "epoch": 1101} {"train_loss": -21.585193634033203, "global_step": 91386, "epoch": 1101} {"train_loss": -21.16288948059082, "global_step": 91387, "epoch": 1101} {"train_loss": -21.47524070739746, "global_step": 91388, "epoch": 1101} {"train_loss": -21.444238662719727, "global_step": 91389, "epoch": 1101} {"train_loss": -21.567840576171875, "global_step": 91390, "epoch": 1101} {"train_loss": -21.37244415283203, "global_step": 91391, "epoch": 1101} {"train_loss": -21.160724639892578, "global_step": 91392, "epoch": 1101} {"train_loss": -21.659372329711914, "global_step": 91393, "epoch": 1101} {"train_loss": -21.46832847595215, "global_step": 91394, "epoch": 1101} {"train_loss": -21.39994239807129, "global_step": 91395, "epoch": 1101} {"train_loss": -21.342679977416992, "global_step": 91396, "epoch": 1101} {"train_loss": -21.39607810974121, "global_step": 91397, "epoch": 1101} {"train_loss": -21.47083854675293, "global_step": 91398, "epoch": 1101} {"train_loss": -21.5305233001709, "global_step": 91399, "epoch": 1101} {"train_loss": -21.513748168945312, "global_step": 91400, "epoch": 1101} {"train_loss": -21.538183212280273, "global_step": 91401, "epoch": 1101} {"train_loss": -21.24624252319336, "global_step": 91402, "epoch": 1101} {"train_loss": -21.331899642944336, "global_step": 91403, "epoch": 1101} {"train_loss": -21.708465576171875, "global_step": 91404, "epoch": 1101} {"train_loss": -21.507652282714844, "global_step": 91405, "epoch": 1101} {"train_loss": -21.052488327026367, "global_step": 91406, "epoch": 1101} {"train_loss": -21.591293334960938, "global_step": 91407, "epoch": 1101} {"train_loss": -21.240137100219727, "global_step": 91408, "epoch": 1101} {"train_loss": -21.720443725585938, "global_step": 91409, "epoch": 1101} {"train_loss": -22.064960479736328, "global_step": 91410, "epoch": 1101} {"train_loss": -21.60166358947754, "global_step": 91411, "epoch": 1101} {"train_loss": -21.589994430541992, "global_step": 91412, "epoch": 1101} {"train_loss": -21.763723373413086, "global_step": 91413, "epoch": 1101} {"train_loss": -21.54170799255371, "global_step": 91414, "epoch": 1101} {"train_loss": -21.965280532836914, "global_step": 91415, "epoch": 1101} {"train_loss": -21.59560775756836, "global_step": 91416, "epoch": 1101} {"train_loss": -21.6062068939209, "global_step": 91417, "epoch": 1101} {"train_loss": -21.559171676635742, "global_step": 91418, "epoch": 1101} {"train_loss": -21.599544525146484, "global_step": 91419, "epoch": 1101} {"train_loss": -21.574663162231445, "global_step": 91420, "epoch": 1101} {"train_loss": -21.930492401123047, "global_step": 91421, "epoch": 1101} {"train_loss": -21.29933738708496, "global_step": 91422, "epoch": 1101} {"train_loss": -21.322744369506836, "global_step": 91423, "epoch": 1101} {"train_loss": -21.67213249206543, "global_step": 91424, "epoch": 1101} {"train_loss": -21.59463882446289, "global_step": 91425, "epoch": 1101} {"train_loss": -21.641494750976562, "global_step": 91426, "epoch": 1101} {"train_loss": -21.520376205444336, "global_step": 91427, "epoch": 1101} {"train_loss": -21.802419662475586, "global_step": 91428, "epoch": 1101} {"train_loss": -21.720630645751953, "global_step": 91429, "epoch": 1101} {"train_loss": -22.022216796875, "global_step": 91430, "epoch": 1101} {"train_loss": -21.29405975341797, "global_step": 91431, "epoch": 1101} {"train_loss": -21.52103042602539, "global_step": 91432, "epoch": 1101} {"train_loss": -21.43732261657715, "global_step": 91433, "epoch": 1101} {"train_loss": -21.438444137573242, "global_step": 91434, "epoch": 1101} {"train_loss": -21.91295051574707, "global_step": 91435, "epoch": 1101} {"train_loss": -21.70634651184082, "global_step": 91436, "epoch": 1101} {"train_loss": -21.89580726623535, "global_step": 91437, "epoch": 1101} {"train_loss": -21.562419891357422, "global_step": 91438, "epoch": 1101} {"train_loss": -21.631195068359375, "global_step": 91439, "epoch": 1101} {"train_loss": -21.943021774291992, "global_step": 91440, "epoch": 1101} {"train_loss": -21.598196029663086, "global_step": 91441, "epoch": 1101} {"train_loss": -21.75726318359375, "global_step": 91442, "epoch": 1101} {"train_loss": -21.815414428710938, "global_step": 91443, "epoch": 1101} {"train_loss": -21.718460083007812, "global_step": 91444, "epoch": 1101} {"train_loss": -21.689149856567383, "global_step": 91445, "epoch": 1101} {"train_loss": -21.598857879638672, "global_step": 91446, "epoch": 1101} {"train_loss": -21.393470764160156, "global_step": 91447, "epoch": 1101} {"train_loss": -21.3204402923584, "global_step": 91448, "epoch": 1101} {"train_loss": -21.533288955688477, "global_step": 91449, "epoch": 1101} {"train_loss": -21.592639923095703, "global_step": 91450, "epoch": 1101} {"train_loss": -21.780078887939453, "global_step": 91451, "epoch": 1101} {"train_loss": -21.61756134033203, "global_step": 91452, "epoch": 1101} {"train_loss": -21.856840133666992, "global_step": 91453, "epoch": 1101} {"train_loss": -21.670455932617188, "global_step": 91454, "epoch": 1101} {"train_loss": -22.048526763916016, "global_step": 91455, "epoch": 1101} {"train_loss": -21.93354606628418, "global_step": 91456, "epoch": 1101} {"train_loss": -21.993066787719727, "global_step": 91457, "epoch": 1101} {"train_loss": -21.4897518157959, "global_step": 91458, "epoch": 1101} {"train_loss": -21.874967575073242, "global_step": 91459, "epoch": 1101} {"train_loss": -21.65955924987793, "global_step": 91460, "epoch": 1101} {"train_loss": -21.9545955657959, "global_step": 91461, "epoch": 1101} {"train_loss": -21.797704696655273, "global_step": 91462, "epoch": 1101} {"train_loss": -21.63327980041504, "global_step": 91463, "epoch": 1101} {"train_loss": -21.565811157226562, "global_step": 91464, "epoch": 1101} {"train_loss": -21.5929986654994, "global_step": 91465, "epoch": 1101, "val_loss": 6100781.5} {"train_loss": -21.16033363342285, "global_step": 91466, "epoch": 1102} {"train_loss": -21.641855239868164, "global_step": 91467, "epoch": 1102} {"train_loss": -20.999221801757812, "global_step": 91468, "epoch": 1102} {"train_loss": -21.334680557250977, "global_step": 91469, "epoch": 1102} {"train_loss": -21.27569580078125, "global_step": 91470, "epoch": 1102} {"train_loss": -21.50836181640625, "global_step": 91471, "epoch": 1102} {"train_loss": -21.601903915405273, "global_step": 91472, "epoch": 1102} {"train_loss": -21.2587947845459, "global_step": 91473, "epoch": 1102} {"train_loss": -21.217390060424805, "global_step": 91474, "epoch": 1102} {"train_loss": -21.520233154296875, "global_step": 91475, "epoch": 1102} {"train_loss": -21.680173873901367, "global_step": 91476, "epoch": 1102} {"train_loss": -21.448278427124023, "global_step": 91477, "epoch": 1102} {"train_loss": -21.432849884033203, "global_step": 91478, "epoch": 1102} {"train_loss": -21.60393714904785, "global_step": 91479, "epoch": 1102} {"train_loss": -21.678956985473633, "global_step": 91480, "epoch": 1102} {"train_loss": -21.40398406982422, "global_step": 91481, "epoch": 1102} {"train_loss": -21.607505798339844, "global_step": 91482, "epoch": 1102} {"train_loss": -21.39192008972168, "global_step": 91483, "epoch": 1102} {"train_loss": -21.55219841003418, "global_step": 91484, "epoch": 1102} {"train_loss": -21.716001510620117, "global_step": 91485, "epoch": 1102} {"train_loss": -21.5745849609375, "global_step": 91486, "epoch": 1102} {"train_loss": -21.39719581604004, "global_step": 91487, "epoch": 1102} {"train_loss": -21.674449920654297, "global_step": 91488, "epoch": 1102} {"train_loss": -21.625980377197266, "global_step": 91489, "epoch": 1102} {"train_loss": -21.62891960144043, "global_step": 91490, "epoch": 1102} {"train_loss": -21.906665802001953, "global_step": 91491, "epoch": 1102} {"train_loss": -21.507871627807617, "global_step": 91492, "epoch": 1102} {"train_loss": -21.533926010131836, "global_step": 91493, "epoch": 1102} {"train_loss": -21.806732177734375, "global_step": 91494, "epoch": 1102} {"train_loss": -21.851964950561523, "global_step": 91495, "epoch": 1102} {"train_loss": -21.866220474243164, "global_step": 91496, "epoch": 1102} {"train_loss": -21.565671920776367, "global_step": 91497, "epoch": 1102} {"train_loss": -21.5932559967041, "global_step": 91498, "epoch": 1102} {"train_loss": -21.671003341674805, "global_step": 91499, "epoch": 1102} {"train_loss": -21.599328994750977, "global_step": 91500, "epoch": 1102} {"train_loss": -21.220169067382812, "global_step": 91501, "epoch": 1102} {"train_loss": -21.442346572875977, "global_step": 91502, "epoch": 1102} {"train_loss": -21.72916030883789, "global_step": 91503, "epoch": 1102} {"train_loss": -21.92405128479004, "global_step": 91504, "epoch": 1102} {"train_loss": -21.576169967651367, "global_step": 91505, "epoch": 1102} {"train_loss": -21.656827926635742, "global_step": 91506, "epoch": 1102} {"train_loss": -21.752256393432617, "global_step": 91507, "epoch": 1102} {"train_loss": -21.81294059753418, "global_step": 91508, "epoch": 1102} {"train_loss": -21.560911178588867, "global_step": 91509, "epoch": 1102} {"train_loss": -21.582965850830078, "global_step": 91510, "epoch": 1102} {"train_loss": -21.697265625, "global_step": 91511, "epoch": 1102} {"train_loss": -21.882253646850586, "global_step": 91512, "epoch": 1102} {"train_loss": -21.542936325073242, "global_step": 91513, "epoch": 1102} {"train_loss": -21.302021026611328, "global_step": 91514, "epoch": 1102} {"train_loss": -21.38294219970703, "global_step": 91515, "epoch": 1102} {"train_loss": -21.699695587158203, "global_step": 91516, "epoch": 1102} {"train_loss": -21.530845642089844, "global_step": 91517, "epoch": 1102} {"train_loss": -21.791250228881836, "global_step": 91518, "epoch": 1102} {"train_loss": -21.536579132080078, "global_step": 91519, "epoch": 1102} {"train_loss": -21.50546646118164, "global_step": 91520, "epoch": 1102} {"train_loss": -21.8170166015625, "global_step": 91521, "epoch": 1102} {"train_loss": -21.771230697631836, "global_step": 91522, "epoch": 1102} {"train_loss": -21.502702713012695, "global_step": 91523, "epoch": 1102} {"train_loss": -21.794368743896484, "global_step": 91524, "epoch": 1102} {"train_loss": -21.519086837768555, "global_step": 91525, "epoch": 1102} {"train_loss": -21.92054557800293, "global_step": 91526, "epoch": 1102} {"train_loss": -21.259965896606445, "global_step": 91527, "epoch": 1102} {"train_loss": -21.703588485717773, "global_step": 91528, "epoch": 1102} {"train_loss": -21.72796630859375, "global_step": 91529, "epoch": 1102} {"train_loss": -21.52837562561035, "global_step": 91530, "epoch": 1102} {"train_loss": -21.881406784057617, "global_step": 91531, "epoch": 1102} {"train_loss": -21.26597023010254, "global_step": 91532, "epoch": 1102} {"train_loss": -21.601072311401367, "global_step": 91533, "epoch": 1102} {"train_loss": -21.617368698120117, "global_step": 91534, "epoch": 1102} {"train_loss": -21.676742553710938, "global_step": 91535, "epoch": 1102} {"train_loss": -21.35227394104004, "global_step": 91536, "epoch": 1102} {"train_loss": -21.83746910095215, "global_step": 91537, "epoch": 1102} {"train_loss": -21.325281143188477, "global_step": 91538, "epoch": 1102} {"train_loss": -21.505216598510742, "global_step": 91539, "epoch": 1102} {"train_loss": -21.628095626831055, "global_step": 91540, "epoch": 1102} {"train_loss": -21.660261154174805, "global_step": 91541, "epoch": 1102} {"train_loss": -21.588912963867188, "global_step": 91542, "epoch": 1102} {"train_loss": -21.429561614990234, "global_step": 91543, "epoch": 1102} {"train_loss": -21.287525177001953, "global_step": 91544, "epoch": 1102} {"train_loss": -21.675395965576172, "global_step": 91545, "epoch": 1102} {"train_loss": -21.696279525756836, "global_step": 91546, "epoch": 1102} {"train_loss": -21.50324249267578, "global_step": 91547, "epoch": 1102} {"train_loss": -21.583698272705078, "global_step": 91548, "epoch": 1102, "val_loss": 6062325.0} {"train_loss": -21.308963775634766, "global_step": 91549, "epoch": 1103} {"train_loss": -21.26946449279785, "global_step": 91550, "epoch": 1103} {"train_loss": -21.5648250579834, "global_step": 91551, "epoch": 1103} {"train_loss": -21.54376220703125, "global_step": 91552, "epoch": 1103} {"train_loss": -21.045576095581055, "global_step": 91553, "epoch": 1103} {"train_loss": -21.341115951538086, "global_step": 91554, "epoch": 1103} {"train_loss": -21.386465072631836, "global_step": 91555, "epoch": 1103} {"train_loss": -20.9887638092041, "global_step": 91556, "epoch": 1103} {"train_loss": -21.08439064025879, "global_step": 91557, "epoch": 1103} {"train_loss": -21.40257453918457, "global_step": 91558, "epoch": 1103} {"train_loss": -21.832799911499023, "global_step": 91559, "epoch": 1103} {"train_loss": -21.50568199157715, "global_step": 91560, "epoch": 1103} {"train_loss": -21.552459716796875, "global_step": 91561, "epoch": 1103} {"train_loss": -21.64082908630371, "global_step": 91562, "epoch": 1103} {"train_loss": -21.414785385131836, "global_step": 91563, "epoch": 1103} {"train_loss": -21.732423782348633, "global_step": 91564, "epoch": 1103} {"train_loss": -21.376062393188477, "global_step": 91565, "epoch": 1103} {"train_loss": -21.469717025756836, "global_step": 91566, "epoch": 1103} {"train_loss": -21.5048828125, "global_step": 91567, "epoch": 1103} {"train_loss": -21.449542999267578, "global_step": 91568, "epoch": 1103} {"train_loss": -21.659452438354492, "global_step": 91569, "epoch": 1103} {"train_loss": -21.16813087463379, "global_step": 91570, "epoch": 1103} {"train_loss": -21.70097541809082, "global_step": 91571, "epoch": 1103} {"train_loss": -21.629121780395508, "global_step": 91572, "epoch": 1103} {"train_loss": -21.887653350830078, "global_step": 91573, "epoch": 1103} {"train_loss": -21.56106948852539, "global_step": 91574, "epoch": 1103} {"train_loss": -21.405254364013672, "global_step": 91575, "epoch": 1103} {"train_loss": -21.392578125, "global_step": 91576, "epoch": 1103} {"train_loss": -21.933088302612305, "global_step": 91577, "epoch": 1103} {"train_loss": -21.370641708374023, "global_step": 91578, "epoch": 1103} {"train_loss": -21.739194869995117, "global_step": 91579, "epoch": 1103} {"train_loss": -21.556190490722656, "global_step": 91580, "epoch": 1103} {"train_loss": -21.630578994750977, "global_step": 91581, "epoch": 1103} {"train_loss": -21.451154708862305, "global_step": 91582, "epoch": 1103} {"train_loss": -21.920454025268555, "global_step": 91583, "epoch": 1103} {"train_loss": -21.976863861083984, "global_step": 91584, "epoch": 1103} {"train_loss": -21.633142471313477, "global_step": 91585, "epoch": 1103} {"train_loss": -21.24208641052246, "global_step": 91586, "epoch": 1103} {"train_loss": -21.667667388916016, "global_step": 91587, "epoch": 1103} {"train_loss": -21.51527214050293, "global_step": 91588, "epoch": 1103} {"train_loss": -21.57990074157715, "global_step": 91589, "epoch": 1103} {"train_loss": -21.398862838745117, "global_step": 91590, "epoch": 1103} {"train_loss": -22.165990829467773, "global_step": 91591, "epoch": 1103} {"train_loss": -21.547779083251953, "global_step": 91592, "epoch": 1103} {"train_loss": -21.38642692565918, "global_step": 91593, "epoch": 1103} {"train_loss": -21.713871002197266, "global_step": 91594, "epoch": 1103} {"train_loss": -21.785154342651367, "global_step": 91595, "epoch": 1103} {"train_loss": -22.170576095581055, "global_step": 91596, "epoch": 1103} {"train_loss": -21.796539306640625, "global_step": 91597, "epoch": 1103} {"train_loss": -21.476972579956055, "global_step": 91598, "epoch": 1103} {"train_loss": -21.381187438964844, "global_step": 91599, "epoch": 1103} {"train_loss": -21.978515625, "global_step": 91600, "epoch": 1103} {"train_loss": -21.918317794799805, "global_step": 91601, "epoch": 1103} {"train_loss": -22.15803337097168, "global_step": 91602, "epoch": 1103} {"train_loss": -21.95469093322754, "global_step": 91603, "epoch": 1103} {"train_loss": -21.320966720581055, "global_step": 91604, "epoch": 1103} {"train_loss": -21.781723022460938, "global_step": 91605, "epoch": 1103} {"train_loss": -21.8312931060791, "global_step": 91606, "epoch": 1103} {"train_loss": -21.763486862182617, "global_step": 91607, "epoch": 1103} {"train_loss": -21.515409469604492, "global_step": 91608, "epoch": 1103} {"train_loss": -21.549619674682617, "global_step": 91609, "epoch": 1103} {"train_loss": -21.894433975219727, "global_step": 91610, "epoch": 1103} {"train_loss": -21.89851188659668, "global_step": 91611, "epoch": 1103} {"train_loss": -21.5477237701416, "global_step": 91612, "epoch": 1103} {"train_loss": -21.83036231994629, "global_step": 91613, "epoch": 1103} {"train_loss": -21.49262046813965, "global_step": 91614, "epoch": 1103} {"train_loss": -21.783384323120117, "global_step": 91615, "epoch": 1103} {"train_loss": -21.472383499145508, "global_step": 91616, "epoch": 1103} {"train_loss": -21.539167404174805, "global_step": 91617, "epoch": 1103} {"train_loss": -21.662755966186523, "global_step": 91618, "epoch": 1103} {"train_loss": -21.912616729736328, "global_step": 91619, "epoch": 1103} {"train_loss": -21.645305633544922, "global_step": 91620, "epoch": 1103} {"train_loss": -21.060834884643555, "global_step": 91621, "epoch": 1103} {"train_loss": -21.375295639038086, "global_step": 91622, "epoch": 1103} {"train_loss": -21.538190841674805, "global_step": 91623, "epoch": 1103} {"train_loss": -21.730960845947266, "global_step": 91624, "epoch": 1103} {"train_loss": -21.651748657226562, "global_step": 91625, "epoch": 1103} {"train_loss": -21.67278480529785, "global_step": 91626, "epoch": 1103} {"train_loss": -21.521596908569336, "global_step": 91627, "epoch": 1103} {"train_loss": -21.509185791015625, "global_step": 91628, "epoch": 1103} {"train_loss": -21.80303382873535, "global_step": 91629, "epoch": 1103} {"train_loss": -21.934354782104492, "global_step": 91630, "epoch": 1103} {"train_loss": -21.597905928830066, "global_step": 91631, "epoch": 1103, "val_loss": 5989106.0} {"train_loss": -21.120315551757812, "global_step": 91632, "epoch": 1104} {"train_loss": -21.534231185913086, "global_step": 91633, "epoch": 1104} {"train_loss": -21.59674644470215, "global_step": 91634, "epoch": 1104} {"train_loss": -21.004575729370117, "global_step": 91635, "epoch": 1104} {"train_loss": -21.511489868164062, "global_step": 91636, "epoch": 1104} {"train_loss": -21.50347900390625, "global_step": 91637, "epoch": 1104} {"train_loss": -21.64886474609375, "global_step": 91638, "epoch": 1104} {"train_loss": -21.577177047729492, "global_step": 91639, "epoch": 1104} {"train_loss": -21.68403434753418, "global_step": 91640, "epoch": 1104} {"train_loss": -21.608951568603516, "global_step": 91641, "epoch": 1104} {"train_loss": -21.513715744018555, "global_step": 91642, "epoch": 1104} {"train_loss": -21.674131393432617, "global_step": 91643, "epoch": 1104} {"train_loss": -21.895160675048828, "global_step": 91644, "epoch": 1104} {"train_loss": -21.792675018310547, "global_step": 91645, "epoch": 1104} {"train_loss": -21.73267936706543, "global_step": 91646, "epoch": 1104} {"train_loss": -21.899030685424805, "global_step": 91647, "epoch": 1104} {"train_loss": -21.87295913696289, "global_step": 91648, "epoch": 1104} {"train_loss": -21.554197311401367, "global_step": 91649, "epoch": 1104} {"train_loss": -21.26708984375, "global_step": 91650, "epoch": 1104} {"train_loss": -21.162260055541992, "global_step": 91651, "epoch": 1104} {"train_loss": -21.47977638244629, "global_step": 91652, "epoch": 1104} {"train_loss": -21.70167350769043, "global_step": 91653, "epoch": 1104} {"train_loss": -21.76372718811035, "global_step": 91654, "epoch": 1104} {"train_loss": -21.614561080932617, "global_step": 91655, "epoch": 1104} {"train_loss": -21.796537399291992, "global_step": 91656, "epoch": 1104} {"train_loss": -21.441654205322266, "global_step": 91657, "epoch": 1104} {"train_loss": -22.016088485717773, "global_step": 91658, "epoch": 1104} {"train_loss": -21.484189987182617, "global_step": 91659, "epoch": 1104} {"train_loss": -21.69392967224121, "global_step": 91660, "epoch": 1104} {"train_loss": -21.537220001220703, "global_step": 91661, "epoch": 1104} {"train_loss": -21.43439292907715, "global_step": 91662, "epoch": 1104} {"train_loss": -21.71158218383789, "global_step": 91663, "epoch": 1104} {"train_loss": -21.845996856689453, "global_step": 91664, "epoch": 1104} {"train_loss": -21.88230323791504, "global_step": 91665, "epoch": 1104} {"train_loss": -21.772724151611328, "global_step": 91666, "epoch": 1104} {"train_loss": -21.64988136291504, "global_step": 91667, "epoch": 1104} {"train_loss": -22.105825424194336, "global_step": 91668, "epoch": 1104} {"train_loss": -21.62200164794922, "global_step": 91669, "epoch": 1104} {"train_loss": -21.821048736572266, "global_step": 91670, "epoch": 1104} {"train_loss": -21.783966064453125, "global_step": 91671, "epoch": 1104} {"train_loss": -21.534740447998047, "global_step": 91672, "epoch": 1104} {"train_loss": -21.83571434020996, "global_step": 91673, "epoch": 1104} {"train_loss": -21.97836685180664, "global_step": 91674, "epoch": 1104} {"train_loss": -21.846454620361328, "global_step": 91675, "epoch": 1104} {"train_loss": -21.950408935546875, "global_step": 91676, "epoch": 1104} {"train_loss": -21.58095359802246, "global_step": 91677, "epoch": 1104} {"train_loss": -21.397775650024414, "global_step": 91678, "epoch": 1104} {"train_loss": -21.620527267456055, "global_step": 91679, "epoch": 1104} {"train_loss": -21.572412490844727, "global_step": 91680, "epoch": 1104} {"train_loss": -21.64560317993164, "global_step": 91681, "epoch": 1104} {"train_loss": -21.73060417175293, "global_step": 91682, "epoch": 1104} {"train_loss": -21.775907516479492, "global_step": 91683, "epoch": 1104} {"train_loss": -22.023242950439453, "global_step": 91684, "epoch": 1104} {"train_loss": -21.43662452697754, "global_step": 91685, "epoch": 1104} {"train_loss": -22.041391372680664, "global_step": 91686, "epoch": 1104} {"train_loss": -22.13132095336914, "global_step": 91687, "epoch": 1104} {"train_loss": -21.931745529174805, "global_step": 91688, "epoch": 1104} {"train_loss": -21.28219985961914, "global_step": 91689, "epoch": 1104} {"train_loss": -21.54890251159668, "global_step": 91690, "epoch": 1104} {"train_loss": -21.63750648498535, "global_step": 91691, "epoch": 1104} {"train_loss": -21.75776481628418, "global_step": 91692, "epoch": 1104} {"train_loss": -21.853849411010742, "global_step": 91693, "epoch": 1104} {"train_loss": -21.725387573242188, "global_step": 91694, "epoch": 1104} {"train_loss": -21.876220703125, "global_step": 91695, "epoch": 1104} {"train_loss": -21.548473358154297, "global_step": 91696, "epoch": 1104} {"train_loss": -21.59940528869629, "global_step": 91697, "epoch": 1104} {"train_loss": -21.471466064453125, "global_step": 91698, "epoch": 1104} {"train_loss": -21.76405143737793, "global_step": 91699, "epoch": 1104} {"train_loss": -21.37184715270996, "global_step": 91700, "epoch": 1104} {"train_loss": -21.509931564331055, "global_step": 91701, "epoch": 1104} {"train_loss": -22.103050231933594, "global_step": 91702, "epoch": 1104} {"train_loss": -21.57172203063965, "global_step": 91703, "epoch": 1104} {"train_loss": -21.3508358001709, "global_step": 91704, "epoch": 1104} {"train_loss": -21.858190536499023, "global_step": 91705, "epoch": 1104} {"train_loss": -21.1966609954834, "global_step": 91706, "epoch": 1104} {"train_loss": -21.877607345581055, "global_step": 91707, "epoch": 1104} {"train_loss": -21.274259567260742, "global_step": 91708, "epoch": 1104} {"train_loss": -21.27473258972168, "global_step": 91709, "epoch": 1104} {"train_loss": -21.921947479248047, "global_step": 91710, "epoch": 1104} {"train_loss": -21.395719528198242, "global_step": 91711, "epoch": 1104} {"train_loss": -21.581087112426758, "global_step": 91712, "epoch": 1104} {"train_loss": -21.100210189819336, "global_step": 91713, "epoch": 1104} {"train_loss": -21.62862593869129, "global_step": 91714, "epoch": 1104, "val_loss": 6131633.0} {"train_loss": -21.35603141784668, "global_step": 91715, "epoch": 1105} {"train_loss": -21.27495765686035, "global_step": 91716, "epoch": 1105} {"train_loss": -21.722822189331055, "global_step": 91717, "epoch": 1105} {"train_loss": -21.207351684570312, "global_step": 91718, "epoch": 1105} {"train_loss": -21.411487579345703, "global_step": 91719, "epoch": 1105} {"train_loss": -21.58125877380371, "global_step": 91720, "epoch": 1105} {"train_loss": -21.43239402770996, "global_step": 91721, "epoch": 1105} {"train_loss": -21.72168731689453, "global_step": 91722, "epoch": 1105} {"train_loss": -21.478134155273438, "global_step": 91723, "epoch": 1105} {"train_loss": -21.905109405517578, "global_step": 91724, "epoch": 1105} {"train_loss": -21.48438835144043, "global_step": 91725, "epoch": 1105} {"train_loss": -21.739221572875977, "global_step": 91726, "epoch": 1105} {"train_loss": -21.669950485229492, "global_step": 91727, "epoch": 1105} {"train_loss": -21.182458877563477, "global_step": 91728, "epoch": 1105} {"train_loss": -21.702194213867188, "global_step": 91729, "epoch": 1105} {"train_loss": -21.169858932495117, "global_step": 91730, "epoch": 1105} {"train_loss": -21.50010108947754, "global_step": 91731, "epoch": 1105} {"train_loss": -21.970699310302734, "global_step": 91732, "epoch": 1105} {"train_loss": -21.695886611938477, "global_step": 91733, "epoch": 1105} {"train_loss": -21.80780792236328, "global_step": 91734, "epoch": 1105} {"train_loss": -21.605316162109375, "global_step": 91735, "epoch": 1105} {"train_loss": -21.61078643798828, "global_step": 91736, "epoch": 1105} {"train_loss": -21.664167404174805, "global_step": 91737, "epoch": 1105} {"train_loss": -21.518537521362305, "global_step": 91738, "epoch": 1105} {"train_loss": -21.857349395751953, "global_step": 91739, "epoch": 1105} {"train_loss": -21.70377540588379, "global_step": 91740, "epoch": 1105} {"train_loss": -21.76875114440918, "global_step": 91741, "epoch": 1105} {"train_loss": -21.613969802856445, "global_step": 91742, "epoch": 1105} {"train_loss": -21.79193115234375, "global_step": 91743, "epoch": 1105} {"train_loss": -21.708053588867188, "global_step": 91744, "epoch": 1105} {"train_loss": -21.542652130126953, "global_step": 91745, "epoch": 1105} {"train_loss": -21.93743896484375, "global_step": 91746, "epoch": 1105} {"train_loss": -21.611190795898438, "global_step": 91747, "epoch": 1105} {"train_loss": -21.69846534729004, "global_step": 91748, "epoch": 1105} {"train_loss": -21.474279403686523, "global_step": 91749, "epoch": 1105} {"train_loss": -21.42806053161621, "global_step": 91750, "epoch": 1105} {"train_loss": -21.566150665283203, "global_step": 91751, "epoch": 1105} {"train_loss": -21.659223556518555, "global_step": 91752, "epoch": 1105} {"train_loss": -21.627119064331055, "global_step": 91753, "epoch": 1105} {"train_loss": -21.812997817993164, "global_step": 91754, "epoch": 1105} {"train_loss": -21.903226852416992, "global_step": 91755, "epoch": 1105} {"train_loss": -21.783681869506836, "global_step": 91756, "epoch": 1105} {"train_loss": -21.533842086791992, "global_step": 91757, "epoch": 1105} {"train_loss": -21.69832420349121, "global_step": 91758, "epoch": 1105} {"train_loss": -21.873865127563477, "global_step": 91759, "epoch": 1105} {"train_loss": -21.755840301513672, "global_step": 91760, "epoch": 1105} {"train_loss": -21.551219940185547, "global_step": 91761, "epoch": 1105} {"train_loss": -21.821680068969727, "global_step": 91762, "epoch": 1105} {"train_loss": -21.673959732055664, "global_step": 91763, "epoch": 1105} {"train_loss": -21.697336196899414, "global_step": 91764, "epoch": 1105} {"train_loss": -21.358238220214844, "global_step": 91765, "epoch": 1105} {"train_loss": -21.85085105895996, "global_step": 91766, "epoch": 1105} {"train_loss": -21.629526138305664, "global_step": 91767, "epoch": 1105} {"train_loss": -21.62628746032715, "global_step": 91768, "epoch": 1105} {"train_loss": -21.587295532226562, "global_step": 91769, "epoch": 1105} {"train_loss": -21.42319679260254, "global_step": 91770, "epoch": 1105} {"train_loss": -21.517789840698242, "global_step": 91771, "epoch": 1105} {"train_loss": -21.41641616821289, "global_step": 91772, "epoch": 1105} {"train_loss": -21.16208267211914, "global_step": 91773, "epoch": 1105} {"train_loss": -21.63961410522461, "global_step": 91774, "epoch": 1105} {"train_loss": -21.930713653564453, "global_step": 91775, "epoch": 1105} {"train_loss": -21.30929183959961, "global_step": 91776, "epoch": 1105} {"train_loss": -21.72574234008789, "global_step": 91777, "epoch": 1105} {"train_loss": -21.475427627563477, "global_step": 91778, "epoch": 1105} {"train_loss": -21.374217987060547, "global_step": 91779, "epoch": 1105} {"train_loss": -22.032611846923828, "global_step": 91780, "epoch": 1105} {"train_loss": -21.688461303710938, "global_step": 91781, "epoch": 1105} {"train_loss": -21.719507217407227, "global_step": 91782, "epoch": 1105} {"train_loss": -21.845762252807617, "global_step": 91783, "epoch": 1105} {"train_loss": -21.423906326293945, "global_step": 91784, "epoch": 1105} {"train_loss": -21.739835739135742, "global_step": 91785, "epoch": 1105} {"train_loss": -21.71023941040039, "global_step": 91786, "epoch": 1105} {"train_loss": -22.02826690673828, "global_step": 91787, "epoch": 1105} {"train_loss": -21.459623336791992, "global_step": 91788, "epoch": 1105} {"train_loss": -21.81623649597168, "global_step": 91789, "epoch": 1105} {"train_loss": -21.690799713134766, "global_step": 91790, "epoch": 1105} {"train_loss": -21.71024513244629, "global_step": 91791, "epoch": 1105} {"train_loss": -21.60874366760254, "global_step": 91792, "epoch": 1105} {"train_loss": -21.551239013671875, "global_step": 91793, "epoch": 1105} {"train_loss": -21.6365909576416, "global_step": 91794, "epoch": 1105} {"train_loss": -21.362442016601562, "global_step": 91795, "epoch": 1105} {"train_loss": -21.72320556640625, "global_step": 91796, "epoch": 1105} {"train_loss": -21.617635657988398, "global_step": 91797, "epoch": 1105, "val_loss": 6017682.0} {"train_loss": -21.630033493041992, "global_step": 91798, "epoch": 1106} {"train_loss": -21.58722496032715, "global_step": 91799, "epoch": 1106} {"train_loss": -21.544553756713867, "global_step": 91800, "epoch": 1106} {"train_loss": -21.400484085083008, "global_step": 91801, "epoch": 1106} {"train_loss": -21.880184173583984, "global_step": 91802, "epoch": 1106} {"train_loss": -21.773771286010742, "global_step": 91803, "epoch": 1106} {"train_loss": -21.166147232055664, "global_step": 91804, "epoch": 1106} {"train_loss": -21.61431121826172, "global_step": 91805, "epoch": 1106} {"train_loss": -21.34744644165039, "global_step": 91806, "epoch": 1106} {"train_loss": -21.489459991455078, "global_step": 91807, "epoch": 1106} {"train_loss": -21.135786056518555, "global_step": 91808, "epoch": 1106} {"train_loss": -21.50693702697754, "global_step": 91809, "epoch": 1106} {"train_loss": -21.609081268310547, "global_step": 91810, "epoch": 1106} {"train_loss": -21.32745933532715, "global_step": 91811, "epoch": 1106} {"train_loss": -21.34036636352539, "global_step": 91812, "epoch": 1106} {"train_loss": -21.78087615966797, "global_step": 91813, "epoch": 1106} {"train_loss": -21.564077377319336, "global_step": 91814, "epoch": 1106} {"train_loss": -21.871078491210938, "global_step": 91815, "epoch": 1106} {"train_loss": -21.43732261657715, "global_step": 91816, "epoch": 1106} {"train_loss": -21.662199020385742, "global_step": 91817, "epoch": 1106} {"train_loss": -21.52243423461914, "global_step": 91818, "epoch": 1106} {"train_loss": -22.0302791595459, "global_step": 91819, "epoch": 1106} {"train_loss": -21.7386531829834, "global_step": 91820, "epoch": 1106} {"train_loss": -21.617250442504883, "global_step": 91821, "epoch": 1106} {"train_loss": -21.711688995361328, "global_step": 91822, "epoch": 1106} {"train_loss": -21.29654312133789, "global_step": 91823, "epoch": 1106} {"train_loss": -21.769245147705078, "global_step": 91824, "epoch": 1106} {"train_loss": -21.786569595336914, "global_step": 91825, "epoch": 1106} {"train_loss": -21.209543228149414, "global_step": 91826, "epoch": 1106} {"train_loss": -21.84076499938965, "global_step": 91827, "epoch": 1106} {"train_loss": -21.303091049194336, "global_step": 91828, "epoch": 1106} {"train_loss": -21.474332809448242, "global_step": 91829, "epoch": 1106} {"train_loss": -21.447284698486328, "global_step": 91830, "epoch": 1106} {"train_loss": -21.073333740234375, "global_step": 91831, "epoch": 1106} {"train_loss": -21.401899337768555, "global_step": 91832, "epoch": 1106} {"train_loss": -21.574045181274414, "global_step": 91833, "epoch": 1106} {"train_loss": -21.82883071899414, "global_step": 91834, "epoch": 1106} {"train_loss": -21.167905807495117, "global_step": 91835, "epoch": 1106} {"train_loss": -21.184850692749023, "global_step": 91836, "epoch": 1106} {"train_loss": -21.532196044921875, "global_step": 91837, "epoch": 1106} {"train_loss": -21.63779067993164, "global_step": 91838, "epoch": 1106} {"train_loss": -21.708585739135742, "global_step": 91839, "epoch": 1106} {"train_loss": -21.13783073425293, "global_step": 91840, "epoch": 1106} {"train_loss": -21.602270126342773, "global_step": 91841, "epoch": 1106} {"train_loss": -21.36992835998535, "global_step": 91842, "epoch": 1106} {"train_loss": -21.75296974182129, "global_step": 91843, "epoch": 1106} {"train_loss": -21.47454071044922, "global_step": 91844, "epoch": 1106} {"train_loss": -21.639507293701172, "global_step": 91845, "epoch": 1106} {"train_loss": -21.746000289916992, "global_step": 91846, "epoch": 1106} {"train_loss": -22.043537139892578, "global_step": 91847, "epoch": 1106} {"train_loss": -22.100811004638672, "global_step": 91848, "epoch": 1106} {"train_loss": -21.60170555114746, "global_step": 91849, "epoch": 1106} {"train_loss": -21.47169303894043, "global_step": 91850, "epoch": 1106} {"train_loss": -21.472640991210938, "global_step": 91851, "epoch": 1106} {"train_loss": -21.792821884155273, "global_step": 91852, "epoch": 1106} {"train_loss": -21.647626876831055, "global_step": 91853, "epoch": 1106} {"train_loss": -21.52130126953125, "global_step": 91854, "epoch": 1106} {"train_loss": -21.65108299255371, "global_step": 91855, "epoch": 1106} {"train_loss": -22.079221725463867, "global_step": 91856, "epoch": 1106} {"train_loss": -21.488271713256836, "global_step": 91857, "epoch": 1106} {"train_loss": -21.585607528686523, "global_step": 91858, "epoch": 1106} {"train_loss": -21.573389053344727, "global_step": 91859, "epoch": 1106} {"train_loss": -21.7598934173584, "global_step": 91860, "epoch": 1106} {"train_loss": -21.86167335510254, "global_step": 91861, "epoch": 1106} {"train_loss": -21.757797241210938, "global_step": 91862, "epoch": 1106} {"train_loss": -21.57569694519043, "global_step": 91863, "epoch": 1106} {"train_loss": -21.36690902709961, "global_step": 91864, "epoch": 1106} {"train_loss": -21.532188415527344, "global_step": 91865, "epoch": 1106} {"train_loss": -21.560739517211914, "global_step": 91866, "epoch": 1106} {"train_loss": -22.175588607788086, "global_step": 91867, "epoch": 1106} {"train_loss": -21.645633697509766, "global_step": 91868, "epoch": 1106} {"train_loss": -21.571382522583008, "global_step": 91869, "epoch": 1106} {"train_loss": -21.55746078491211, "global_step": 91870, "epoch": 1106} {"train_loss": -21.928096771240234, "global_step": 91871, "epoch": 1106} {"train_loss": -21.586217880249023, "global_step": 91872, "epoch": 1106} {"train_loss": -21.930862426757812, "global_step": 91873, "epoch": 1106} {"train_loss": -21.943130493164062, "global_step": 91874, "epoch": 1106} {"train_loss": -21.694223403930664, "global_step": 91875, "epoch": 1106} {"train_loss": -21.879581451416016, "global_step": 91876, "epoch": 1106} {"train_loss": -21.973447799682617, "global_step": 91877, "epoch": 1106} {"train_loss": -21.771472930908203, "global_step": 91878, "epoch": 1106} {"train_loss": -21.582551956176758, "global_step": 91879, "epoch": 1106} {"train_loss": -21.605531830385505, "global_step": 91880, "epoch": 1106, "val_loss": 6164357.0} {"train_loss": -21.418912887573242, "global_step": 91881, "epoch": 1107} {"train_loss": -21.314191818237305, "global_step": 91882, "epoch": 1107} {"train_loss": -21.443811416625977, "global_step": 91883, "epoch": 1107} {"train_loss": -21.033222198486328, "global_step": 91884, "epoch": 1107} {"train_loss": -21.562280654907227, "global_step": 91885, "epoch": 1107} {"train_loss": -21.777069091796875, "global_step": 91886, "epoch": 1107} {"train_loss": -21.498971939086914, "global_step": 91887, "epoch": 1107} {"train_loss": -21.716957092285156, "global_step": 91888, "epoch": 1107} {"train_loss": -21.433116912841797, "global_step": 91889, "epoch": 1107} {"train_loss": -21.254425048828125, "global_step": 91890, "epoch": 1107} {"train_loss": -21.51997947692871, "global_step": 91891, "epoch": 1107} {"train_loss": -20.912527084350586, "global_step": 91892, "epoch": 1107} {"train_loss": -21.638681411743164, "global_step": 91893, "epoch": 1107} {"train_loss": -21.782703399658203, "global_step": 91894, "epoch": 1107} {"train_loss": -21.56850242614746, "global_step": 91895, "epoch": 1107} {"train_loss": -21.86152458190918, "global_step": 91896, "epoch": 1107} {"train_loss": -21.34132194519043, "global_step": 91897, "epoch": 1107} {"train_loss": -21.476886749267578, "global_step": 91898, "epoch": 1107} {"train_loss": -21.687803268432617, "global_step": 91899, "epoch": 1107} {"train_loss": -21.208723068237305, "global_step": 91900, "epoch": 1107} {"train_loss": -21.53767204284668, "global_step": 91901, "epoch": 1107} {"train_loss": -21.139326095581055, "global_step": 91902, "epoch": 1107} {"train_loss": -20.912832260131836, "global_step": 91903, "epoch": 1107} {"train_loss": -21.558361053466797, "global_step": 91904, "epoch": 1107} {"train_loss": -21.57691764831543, "global_step": 91905, "epoch": 1107} {"train_loss": -21.601343154907227, "global_step": 91906, "epoch": 1107} {"train_loss": -21.34871482849121, "global_step": 91907, "epoch": 1107} {"train_loss": -21.752439498901367, "global_step": 91908, "epoch": 1107} {"train_loss": -21.384445190429688, "global_step": 91909, "epoch": 1107} {"train_loss": -21.868030548095703, "global_step": 91910, "epoch": 1107} {"train_loss": -21.519317626953125, "global_step": 91911, "epoch": 1107} {"train_loss": -21.4521427154541, "global_step": 91912, "epoch": 1107} {"train_loss": -21.789560317993164, "global_step": 91913, "epoch": 1107} {"train_loss": -21.801050186157227, "global_step": 91914, "epoch": 1107} {"train_loss": -21.61492919921875, "global_step": 91915, "epoch": 1107} {"train_loss": -21.90843391418457, "global_step": 91916, "epoch": 1107} {"train_loss": -21.127527236938477, "global_step": 91917, "epoch": 1107} {"train_loss": -22.057260513305664, "global_step": 91918, "epoch": 1107} {"train_loss": -21.351057052612305, "global_step": 91919, "epoch": 1107} {"train_loss": -21.9046573638916, "global_step": 91920, "epoch": 1107} {"train_loss": -21.670848846435547, "global_step": 91921, "epoch": 1107} {"train_loss": -21.762908935546875, "global_step": 91922, "epoch": 1107} {"train_loss": -21.560352325439453, "global_step": 91923, "epoch": 1107} {"train_loss": -21.501638412475586, "global_step": 91924, "epoch": 1107} {"train_loss": -22.002714157104492, "global_step": 91925, "epoch": 1107} {"train_loss": -21.441970825195312, "global_step": 91926, "epoch": 1107} {"train_loss": -21.846590042114258, "global_step": 91927, "epoch": 1107} {"train_loss": -21.871795654296875, "global_step": 91928, "epoch": 1107} {"train_loss": -21.665334701538086, "global_step": 91929, "epoch": 1107} {"train_loss": -21.82333755493164, "global_step": 91930, "epoch": 1107} {"train_loss": -21.83441734313965, "global_step": 91931, "epoch": 1107} {"train_loss": -21.40979766845703, "global_step": 91932, "epoch": 1107} {"train_loss": -21.62324333190918, "global_step": 91933, "epoch": 1107} {"train_loss": -21.683691024780273, "global_step": 91934, "epoch": 1107} {"train_loss": -21.781904220581055, "global_step": 91935, "epoch": 1107} {"train_loss": -21.623184204101562, "global_step": 91936, "epoch": 1107} {"train_loss": -21.36329460144043, "global_step": 91937, "epoch": 1107} {"train_loss": -22.017826080322266, "global_step": 91938, "epoch": 1107} {"train_loss": -21.766992568969727, "global_step": 91939, "epoch": 1107} {"train_loss": -21.155439376831055, "global_step": 91940, "epoch": 1107} {"train_loss": -21.711538314819336, "global_step": 91941, "epoch": 1107} {"train_loss": -21.564762115478516, "global_step": 91942, "epoch": 1107} {"train_loss": -21.6384220123291, "global_step": 91943, "epoch": 1107} {"train_loss": -21.57343864440918, "global_step": 91944, "epoch": 1107} {"train_loss": -21.6988468170166, "global_step": 91945, "epoch": 1107} {"train_loss": -21.25078773498535, "global_step": 91946, "epoch": 1107} {"train_loss": -21.78468132019043, "global_step": 91947, "epoch": 1107} {"train_loss": -22.053125381469727, "global_step": 91948, "epoch": 1107} {"train_loss": -21.650089263916016, "global_step": 91949, "epoch": 1107} {"train_loss": -21.552228927612305, "global_step": 91950, "epoch": 1107} {"train_loss": -21.03669548034668, "global_step": 91951, "epoch": 1107} {"train_loss": -21.530681610107422, "global_step": 91952, "epoch": 1107} {"train_loss": -21.62469482421875, "global_step": 91953, "epoch": 1107} {"train_loss": -21.605670928955078, "global_step": 91954, "epoch": 1107} {"train_loss": -21.42656707763672, "global_step": 91955, "epoch": 1107} {"train_loss": -21.65106201171875, "global_step": 91956, "epoch": 1107} {"train_loss": -21.73483657836914, "global_step": 91957, "epoch": 1107} {"train_loss": -21.427352905273438, "global_step": 91958, "epoch": 1107} {"train_loss": -21.946958541870117, "global_step": 91959, "epoch": 1107} {"train_loss": -21.91007423400879, "global_step": 91960, "epoch": 1107} {"train_loss": -21.688772201538086, "global_step": 91961, "epoch": 1107} {"train_loss": -21.636137008666992, "global_step": 91962, "epoch": 1107} {"train_loss": -21.574088062148498, "global_step": 91963, "epoch": 1107, "val_loss": 6063420.5} {"train_loss": -21.639360427856445, "global_step": 91964, "epoch": 1108} {"train_loss": -21.689695358276367, "global_step": 91965, "epoch": 1108} {"train_loss": -21.313596725463867, "global_step": 91966, "epoch": 1108} {"train_loss": -21.178546905517578, "global_step": 91967, "epoch": 1108} {"train_loss": -21.130496978759766, "global_step": 91968, "epoch": 1108} {"train_loss": -21.24928855895996, "global_step": 91969, "epoch": 1108} {"train_loss": -21.427854537963867, "global_step": 91970, "epoch": 1108} {"train_loss": -21.16676139831543, "global_step": 91971, "epoch": 1108} {"train_loss": -21.616384506225586, "global_step": 91972, "epoch": 1108} {"train_loss": -21.16737174987793, "global_step": 91973, "epoch": 1108} {"train_loss": -21.564565658569336, "global_step": 91974, "epoch": 1108} {"train_loss": -21.32774543762207, "global_step": 91975, "epoch": 1108} {"train_loss": -21.612226486206055, "global_step": 91976, "epoch": 1108} {"train_loss": -21.37507438659668, "global_step": 91977, "epoch": 1108} {"train_loss": -21.587305068969727, "global_step": 91978, "epoch": 1108} {"train_loss": -21.66762351989746, "global_step": 91979, "epoch": 1108} {"train_loss": -21.24306869506836, "global_step": 91980, "epoch": 1108} {"train_loss": -21.69964599609375, "global_step": 91981, "epoch": 1108} {"train_loss": -21.253393173217773, "global_step": 91982, "epoch": 1108} {"train_loss": -21.525436401367188, "global_step": 91983, "epoch": 1108} {"train_loss": -20.93149185180664, "global_step": 91984, "epoch": 1108} {"train_loss": -21.531356811523438, "global_step": 91985, "epoch": 1108} {"train_loss": -21.032377243041992, "global_step": 91986, "epoch": 1108} {"train_loss": -21.60513687133789, "global_step": 91987, "epoch": 1108} {"train_loss": -21.53116798400879, "global_step": 91988, "epoch": 1108} {"train_loss": -21.557666778564453, "global_step": 91989, "epoch": 1108} {"train_loss": -21.724594116210938, "global_step": 91990, "epoch": 1108} {"train_loss": -21.75874900817871, "global_step": 91991, "epoch": 1108} {"train_loss": -21.73691749572754, "global_step": 91992, "epoch": 1108} {"train_loss": -21.522367477416992, "global_step": 91993, "epoch": 1108} {"train_loss": -21.774442672729492, "global_step": 91994, "epoch": 1108} {"train_loss": -21.42561149597168, "global_step": 91995, "epoch": 1108} {"train_loss": -21.68857765197754, "global_step": 91996, "epoch": 1108} {"train_loss": -22.11122703552246, "global_step": 91997, "epoch": 1108} {"train_loss": -21.713367462158203, "global_step": 91998, "epoch": 1108} {"train_loss": -21.585758209228516, "global_step": 91999, "epoch": 1108} {"train_loss": -21.965299606323242, "global_step": 92000, "epoch": 1108} {"train_loss": -21.565412521362305, "global_step": 92001, "epoch": 1108} {"train_loss": -21.654041290283203, "global_step": 92002, "epoch": 1108} {"train_loss": -21.656612396240234, "global_step": 92003, "epoch": 1108} {"train_loss": -21.376224517822266, "global_step": 92004, "epoch": 1108} {"train_loss": -21.741640090942383, "global_step": 92005, "epoch": 1108} {"train_loss": -21.41021156311035, "global_step": 92006, "epoch": 1108} {"train_loss": -21.73941421508789, "global_step": 92007, "epoch": 1108} {"train_loss": -21.81070327758789, "global_step": 92008, "epoch": 1108} {"train_loss": -21.673803329467773, "global_step": 92009, "epoch": 1108} {"train_loss": -22.0250186920166, "global_step": 92010, "epoch": 1108} {"train_loss": -21.680234909057617, "global_step": 92011, "epoch": 1108} {"train_loss": -21.524185180664062, "global_step": 92012, "epoch": 1108} {"train_loss": -21.83017349243164, "global_step": 92013, "epoch": 1108} {"train_loss": -21.412981033325195, "global_step": 92014, "epoch": 1108} {"train_loss": -21.514572143554688, "global_step": 92015, "epoch": 1108} {"train_loss": -21.684974670410156, "global_step": 92016, "epoch": 1108} {"train_loss": -21.546661376953125, "global_step": 92017, "epoch": 1108} {"train_loss": -21.5692195892334, "global_step": 92018, "epoch": 1108} {"train_loss": -21.79913330078125, "global_step": 92019, "epoch": 1108} {"train_loss": -21.891380310058594, "global_step": 92020, "epoch": 1108} {"train_loss": -21.826120376586914, "global_step": 92021, "epoch": 1108} {"train_loss": -21.808408737182617, "global_step": 92022, "epoch": 1108} {"train_loss": -21.69141960144043, "global_step": 92023, "epoch": 1108} {"train_loss": -21.671010971069336, "global_step": 92024, "epoch": 1108} {"train_loss": -21.624052047729492, "global_step": 92025, "epoch": 1108} {"train_loss": -21.65107536315918, "global_step": 92026, "epoch": 1108} {"train_loss": -21.594152450561523, "global_step": 92027, "epoch": 1108} {"train_loss": -21.7913818359375, "global_step": 92028, "epoch": 1108} {"train_loss": -21.754501342773438, "global_step": 92029, "epoch": 1108} {"train_loss": -21.776775360107422, "global_step": 92030, "epoch": 1108} {"train_loss": -21.87835121154785, "global_step": 92031, "epoch": 1108} {"train_loss": -21.937957763671875, "global_step": 92032, "epoch": 1108} {"train_loss": -21.919055938720703, "global_step": 92033, "epoch": 1108} {"train_loss": -21.705860137939453, "global_step": 92034, "epoch": 1108} {"train_loss": -21.63467788696289, "global_step": 92035, "epoch": 1108} {"train_loss": -21.73395538330078, "global_step": 92036, "epoch": 1108} {"train_loss": -21.69224739074707, "global_step": 92037, "epoch": 1108} {"train_loss": -21.872482299804688, "global_step": 92038, "epoch": 1108} {"train_loss": -21.397912979125977, "global_step": 92039, "epoch": 1108} {"train_loss": -21.999282836914062, "global_step": 92040, "epoch": 1108} {"train_loss": -21.512083053588867, "global_step": 92041, "epoch": 1108} {"train_loss": -21.300582885742188, "global_step": 92042, "epoch": 1108} {"train_loss": -21.261444091796875, "global_step": 92043, "epoch": 1108} {"train_loss": -21.717023849487305, "global_step": 92044, "epoch": 1108} {"train_loss": -21.36276626586914, "global_step": 92045, "epoch": 1108} {"train_loss": -21.5923132379371, "global_step": 92046, "epoch": 1108, "val_loss": 6015355.5} {"train_loss": -21.04840087890625, "global_step": 92047, "epoch": 1109} {"train_loss": -21.1347599029541, "global_step": 92048, "epoch": 1109} {"train_loss": -21.293933868408203, "global_step": 92049, "epoch": 1109} {"train_loss": -21.511035919189453, "global_step": 92050, "epoch": 1109} {"train_loss": -21.322677612304688, "global_step": 92051, "epoch": 1109} {"train_loss": -21.661563873291016, "global_step": 92052, "epoch": 1109} {"train_loss": -21.482088088989258, "global_step": 92053, "epoch": 1109} {"train_loss": -21.546672821044922, "global_step": 92054, "epoch": 1109} {"train_loss": -21.51962661743164, "global_step": 92055, "epoch": 1109} {"train_loss": -21.708805084228516, "global_step": 92056, "epoch": 1109} {"train_loss": -21.3968563079834, "global_step": 92057, "epoch": 1109} {"train_loss": -21.515583038330078, "global_step": 92058, "epoch": 1109} {"train_loss": -21.523788452148438, "global_step": 92059, "epoch": 1109} {"train_loss": -21.834928512573242, "global_step": 92060, "epoch": 1109} {"train_loss": -21.5587100982666, "global_step": 92061, "epoch": 1109} {"train_loss": -21.647573471069336, "global_step": 92062, "epoch": 1109} {"train_loss": -21.497364044189453, "global_step": 92063, "epoch": 1109} {"train_loss": -21.5345516204834, "global_step": 92064, "epoch": 1109} {"train_loss": -22.110647201538086, "global_step": 92065, "epoch": 1109} {"train_loss": -21.914920806884766, "global_step": 92066, "epoch": 1109} {"train_loss": -21.26077651977539, "global_step": 92067, "epoch": 1109} {"train_loss": -21.35465431213379, "global_step": 92068, "epoch": 1109} {"train_loss": -22.080127716064453, "global_step": 92069, "epoch": 1109} {"train_loss": -21.618370056152344, "global_step": 92070, "epoch": 1109} {"train_loss": -21.516677856445312, "global_step": 92071, "epoch": 1109} {"train_loss": -21.738525390625, "global_step": 92072, "epoch": 1109} {"train_loss": -21.841787338256836, "global_step": 92073, "epoch": 1109} {"train_loss": -21.6412353515625, "global_step": 92074, "epoch": 1109} {"train_loss": -21.701610565185547, "global_step": 92075, "epoch": 1109} {"train_loss": -21.522184371948242, "global_step": 92076, "epoch": 1109} {"train_loss": -21.606943130493164, "global_step": 92077, "epoch": 1109} {"train_loss": -21.738981246948242, "global_step": 92078, "epoch": 1109} {"train_loss": -21.931936264038086, "global_step": 92079, "epoch": 1109} {"train_loss": -21.898508071899414, "global_step": 92080, "epoch": 1109} {"train_loss": -21.524993896484375, "global_step": 92081, "epoch": 1109} {"train_loss": -21.1968936920166, "global_step": 92082, "epoch": 1109} {"train_loss": -21.601242065429688, "global_step": 92083, "epoch": 1109} {"train_loss": -21.758689880371094, "global_step": 92084, "epoch": 1109} {"train_loss": -21.3460636138916, "global_step": 92085, "epoch": 1109} {"train_loss": -21.437589645385742, "global_step": 92086, "epoch": 1109} {"train_loss": -21.50288200378418, "global_step": 92087, "epoch": 1109} {"train_loss": -21.59148597717285, "global_step": 92088, "epoch": 1109} {"train_loss": -21.5955867767334, "global_step": 92089, "epoch": 1109} {"train_loss": -21.707305908203125, "global_step": 92090, "epoch": 1109} {"train_loss": -21.92470359802246, "global_step": 92091, "epoch": 1109} {"train_loss": -21.635940551757812, "global_step": 92092, "epoch": 1109} {"train_loss": -21.602981567382812, "global_step": 92093, "epoch": 1109} {"train_loss": -21.432498931884766, "global_step": 92094, "epoch": 1109} {"train_loss": -21.51761817932129, "global_step": 92095, "epoch": 1109} {"train_loss": -21.135650634765625, "global_step": 92096, "epoch": 1109} {"train_loss": -21.7371883392334, "global_step": 92097, "epoch": 1109} {"train_loss": -21.53700828552246, "global_step": 92098, "epoch": 1109} {"train_loss": -21.929794311523438, "global_step": 92099, "epoch": 1109} {"train_loss": -21.469970703125, "global_step": 92100, "epoch": 1109} {"train_loss": -21.823230743408203, "global_step": 92101, "epoch": 1109} {"train_loss": -21.482303619384766, "global_step": 92102, "epoch": 1109} {"train_loss": -21.74629020690918, "global_step": 92103, "epoch": 1109} {"train_loss": -21.856016159057617, "global_step": 92104, "epoch": 1109} {"train_loss": -21.402790069580078, "global_step": 92105, "epoch": 1109} {"train_loss": -21.58133316040039, "global_step": 92106, "epoch": 1109} {"train_loss": -21.672142028808594, "global_step": 92107, "epoch": 1109} {"train_loss": -21.950315475463867, "global_step": 92108, "epoch": 1109} {"train_loss": -21.894882202148438, "global_step": 92109, "epoch": 1109} {"train_loss": -22.19098472595215, "global_step": 92110, "epoch": 1109} {"train_loss": -21.861801147460938, "global_step": 92111, "epoch": 1109} {"train_loss": -21.516183853149414, "global_step": 92112, "epoch": 1109} {"train_loss": -21.615358352661133, "global_step": 92113, "epoch": 1109} {"train_loss": -21.753755569458008, "global_step": 92114, "epoch": 1109} {"train_loss": -21.894649505615234, "global_step": 92115, "epoch": 1109} {"train_loss": -21.640668869018555, "global_step": 92116, "epoch": 1109} {"train_loss": -21.91194725036621, "global_step": 92117, "epoch": 1109} {"train_loss": -21.571712493896484, "global_step": 92118, "epoch": 1109} {"train_loss": -22.173694610595703, "global_step": 92119, "epoch": 1109} {"train_loss": -21.25543212890625, "global_step": 92120, "epoch": 1109} {"train_loss": -21.415624618530273, "global_step": 92121, "epoch": 1109} {"train_loss": -21.746374130249023, "global_step": 92122, "epoch": 1109} {"train_loss": -21.36918067932129, "global_step": 92123, "epoch": 1109} {"train_loss": -21.352846145629883, "global_step": 92124, "epoch": 1109} {"train_loss": -21.42719841003418, "global_step": 92125, "epoch": 1109} {"train_loss": -21.8621826171875, "global_step": 92126, "epoch": 1109} {"train_loss": -21.468347549438477, "global_step": 92127, "epoch": 1109} {"train_loss": -21.496667861938477, "global_step": 92128, "epoch": 1109} {"train_loss": -21.605699056602386, "global_step": 92129, "epoch": 1109, "val_loss": 6160766.0} {"train_loss": -20.93906021118164, "global_step": 92130, "epoch": 1110} {"train_loss": -21.109819412231445, "global_step": 92131, "epoch": 1110} {"train_loss": -21.679004669189453, "global_step": 92132, "epoch": 1110} {"train_loss": -20.938880920410156, "global_step": 92133, "epoch": 1110} {"train_loss": -21.413671493530273, "global_step": 92134, "epoch": 1110} {"train_loss": -21.434520721435547, "global_step": 92135, "epoch": 1110} {"train_loss": -21.03470230102539, "global_step": 92136, "epoch": 1110} {"train_loss": -21.274551391601562, "global_step": 92137, "epoch": 1110} {"train_loss": -21.161510467529297, "global_step": 92138, "epoch": 1110} {"train_loss": -21.42996597290039, "global_step": 92139, "epoch": 1110} {"train_loss": -21.5679931640625, "global_step": 92140, "epoch": 1110} {"train_loss": -21.551610946655273, "global_step": 92141, "epoch": 1110} {"train_loss": -21.462865829467773, "global_step": 92142, "epoch": 1110} {"train_loss": -21.77142906188965, "global_step": 92143, "epoch": 1110} {"train_loss": -21.748544692993164, "global_step": 92144, "epoch": 1110} {"train_loss": -21.610097885131836, "global_step": 92145, "epoch": 1110} {"train_loss": -21.79953956604004, "global_step": 92146, "epoch": 1110} {"train_loss": -21.69313621520996, "global_step": 92147, "epoch": 1110} {"train_loss": -21.58839988708496, "global_step": 92148, "epoch": 1110} {"train_loss": -21.519285202026367, "global_step": 92149, "epoch": 1110} {"train_loss": -21.537979125976562, "global_step": 92150, "epoch": 1110} {"train_loss": -21.968948364257812, "global_step": 92151, "epoch": 1110} {"train_loss": -21.340850830078125, "global_step": 92152, "epoch": 1110} {"train_loss": -21.751909255981445, "global_step": 92153, "epoch": 1110} {"train_loss": -21.363162994384766, "global_step": 92154, "epoch": 1110} {"train_loss": -21.9884090423584, "global_step": 92155, "epoch": 1110} {"train_loss": -21.758708953857422, "global_step": 92156, "epoch": 1110} {"train_loss": -21.353069305419922, "global_step": 92157, "epoch": 1110} {"train_loss": -21.70404815673828, "global_step": 92158, "epoch": 1110} {"train_loss": -21.86041831970215, "global_step": 92159, "epoch": 1110} {"train_loss": -21.855436325073242, "global_step": 92160, "epoch": 1110} {"train_loss": -21.23907470703125, "global_step": 92161, "epoch": 1110} {"train_loss": -21.531524658203125, "global_step": 92162, "epoch": 1110} {"train_loss": -21.636173248291016, "global_step": 92163, "epoch": 1110} {"train_loss": -22.0422306060791, "global_step": 92164, "epoch": 1110} {"train_loss": -21.3217830657959, "global_step": 92165, "epoch": 1110} {"train_loss": -21.763580322265625, "global_step": 92166, "epoch": 1110} {"train_loss": -21.727453231811523, "global_step": 92167, "epoch": 1110} {"train_loss": -21.56541633605957, "global_step": 92168, "epoch": 1110} {"train_loss": -22.100011825561523, "global_step": 92169, "epoch": 1110} {"train_loss": -22.123889923095703, "global_step": 92170, "epoch": 1110} {"train_loss": -21.82742691040039, "global_step": 92171, "epoch": 1110} {"train_loss": -21.46884536743164, "global_step": 92172, "epoch": 1110} {"train_loss": -21.46758270263672, "global_step": 92173, "epoch": 1110} {"train_loss": -21.440275192260742, "global_step": 92174, "epoch": 1110} {"train_loss": -21.555278778076172, "global_step": 92175, "epoch": 1110} {"train_loss": -21.60210418701172, "global_step": 92176, "epoch": 1110} {"train_loss": -21.903499603271484, "global_step": 92177, "epoch": 1110} {"train_loss": -21.5738468170166, "global_step": 92178, "epoch": 1110} {"train_loss": -21.88698387145996, "global_step": 92179, "epoch": 1110} {"train_loss": -21.71632194519043, "global_step": 92180, "epoch": 1110} {"train_loss": -21.78334617614746, "global_step": 92181, "epoch": 1110} {"train_loss": -21.698875427246094, "global_step": 92182, "epoch": 1110} {"train_loss": -21.659305572509766, "global_step": 92183, "epoch": 1110} {"train_loss": -21.571256637573242, "global_step": 92184, "epoch": 1110} {"train_loss": -21.60491371154785, "global_step": 92185, "epoch": 1110} {"train_loss": -21.617727279663086, "global_step": 92186, "epoch": 1110} {"train_loss": -21.642436981201172, "global_step": 92187, "epoch": 1110} {"train_loss": -21.607685089111328, "global_step": 92188, "epoch": 1110} {"train_loss": -21.533233642578125, "global_step": 92189, "epoch": 1110} {"train_loss": -21.894298553466797, "global_step": 92190, "epoch": 1110} {"train_loss": -21.29701805114746, "global_step": 92191, "epoch": 1110} {"train_loss": -21.458959579467773, "global_step": 92192, "epoch": 1110} {"train_loss": -21.770532608032227, "global_step": 92193, "epoch": 1110} {"train_loss": -21.942813873291016, "global_step": 92194, "epoch": 1110} {"train_loss": -21.182470321655273, "global_step": 92195, "epoch": 1110} {"train_loss": -22.05231285095215, "global_step": 92196, "epoch": 1110} {"train_loss": -21.58990478515625, "global_step": 92197, "epoch": 1110} {"train_loss": -21.40555191040039, "global_step": 92198, "epoch": 1110} {"train_loss": -21.602487564086914, "global_step": 92199, "epoch": 1110} {"train_loss": -21.740171432495117, "global_step": 92200, "epoch": 1110} {"train_loss": -21.800249099731445, "global_step": 92201, "epoch": 1110} {"train_loss": -21.884281158447266, "global_step": 92202, "epoch": 1110} {"train_loss": -21.838722229003906, "global_step": 92203, "epoch": 1110} {"train_loss": -21.594928741455078, "global_step": 92204, "epoch": 1110} {"train_loss": -21.98601722717285, "global_step": 92205, "epoch": 1110} {"train_loss": -21.806947708129883, "global_step": 92206, "epoch": 1110} {"train_loss": -21.702890396118164, "global_step": 92207, "epoch": 1110} {"train_loss": -21.732006072998047, "global_step": 92208, "epoch": 1110} {"train_loss": -21.685537338256836, "global_step": 92209, "epoch": 1110} {"train_loss": -21.71478843688965, "global_step": 92210, "epoch": 1110} {"train_loss": -21.43430519104004, "global_step": 92211, "epoch": 1110} {"train_loss": -21.61101132128612, "global_step": 92212, "epoch": 1110, "val_loss": 5924562.5} {"train_loss": -21.794042587280273, "global_step": 92213, "epoch": 1111} {"train_loss": -21.015111923217773, "global_step": 92214, "epoch": 1111} {"train_loss": -21.590368270874023, "global_step": 92215, "epoch": 1111} {"train_loss": -20.949676513671875, "global_step": 92216, "epoch": 1111} {"train_loss": -21.040952682495117, "global_step": 92217, "epoch": 1111} {"train_loss": -21.19799041748047, "global_step": 92218, "epoch": 1111} {"train_loss": -21.338491439819336, "global_step": 92219, "epoch": 1111} {"train_loss": -21.225675582885742, "global_step": 92220, "epoch": 1111} {"train_loss": -21.27471351623535, "global_step": 92221, "epoch": 1111} {"train_loss": -21.049406051635742, "global_step": 92222, "epoch": 1111} {"train_loss": -21.227157592773438, "global_step": 92223, "epoch": 1111} {"train_loss": -21.30388832092285, "global_step": 92224, "epoch": 1111} {"train_loss": -21.473251342773438, "global_step": 92225, "epoch": 1111} {"train_loss": -21.331201553344727, "global_step": 92226, "epoch": 1111} {"train_loss": -21.012372970581055, "global_step": 92227, "epoch": 1111} {"train_loss": -21.369932174682617, "global_step": 92228, "epoch": 1111} {"train_loss": -21.67914581298828, "global_step": 92229, "epoch": 1111} {"train_loss": -21.472633361816406, "global_step": 92230, "epoch": 1111} {"train_loss": -21.801076889038086, "global_step": 92231, "epoch": 1111} {"train_loss": -21.86187744140625, "global_step": 92232, "epoch": 1111} {"train_loss": -21.542943954467773, "global_step": 92233, "epoch": 1111} {"train_loss": -21.559852600097656, "global_step": 92234, "epoch": 1111} {"train_loss": -21.739727020263672, "global_step": 92235, "epoch": 1111} {"train_loss": -21.3441162109375, "global_step": 92236, "epoch": 1111} {"train_loss": -22.0731143951416, "global_step": 92237, "epoch": 1111} {"train_loss": -21.569704055786133, "global_step": 92238, "epoch": 1111} {"train_loss": -21.483373641967773, "global_step": 92239, "epoch": 1111} {"train_loss": -21.84671974182129, "global_step": 92240, "epoch": 1111} {"train_loss": -21.51712989807129, "global_step": 92241, "epoch": 1111} {"train_loss": -21.49277114868164, "global_step": 92242, "epoch": 1111} {"train_loss": -21.491926193237305, "global_step": 92243, "epoch": 1111} {"train_loss": -21.796018600463867, "global_step": 92244, "epoch": 1111} {"train_loss": -21.459636688232422, "global_step": 92245, "epoch": 1111} {"train_loss": -21.687137603759766, "global_step": 92246, "epoch": 1111} {"train_loss": -21.815959930419922, "global_step": 92247, "epoch": 1111} {"train_loss": -21.825231552124023, "global_step": 92248, "epoch": 1111} {"train_loss": -21.848997116088867, "global_step": 92249, "epoch": 1111} {"train_loss": -21.914518356323242, "global_step": 92250, "epoch": 1111} {"train_loss": -21.894067764282227, "global_step": 92251, "epoch": 1111} {"train_loss": -21.40665054321289, "global_step": 92252, "epoch": 1111} {"train_loss": -21.44716453552246, "global_step": 92253, "epoch": 1111} {"train_loss": -21.571226119995117, "global_step": 92254, "epoch": 1111} {"train_loss": -21.767087936401367, "global_step": 92255, "epoch": 1111} {"train_loss": -21.60750961303711, "global_step": 92256, "epoch": 1111} {"train_loss": -21.740615844726562, "global_step": 92257, "epoch": 1111} {"train_loss": -21.635135650634766, "global_step": 92258, "epoch": 1111} {"train_loss": -21.834762573242188, "global_step": 92259, "epoch": 1111} {"train_loss": -21.71041488647461, "global_step": 92260, "epoch": 1111} {"train_loss": -21.65997314453125, "global_step": 92261, "epoch": 1111} {"train_loss": -21.629318237304688, "global_step": 92262, "epoch": 1111} {"train_loss": -21.548053741455078, "global_step": 92263, "epoch": 1111} {"train_loss": -21.322751998901367, "global_step": 92264, "epoch": 1111} {"train_loss": -21.93405532836914, "global_step": 92265, "epoch": 1111} {"train_loss": -22.105497360229492, "global_step": 92266, "epoch": 1111} {"train_loss": -21.761859893798828, "global_step": 92267, "epoch": 1111} {"train_loss": -21.922273635864258, "global_step": 92268, "epoch": 1111} {"train_loss": -21.782791137695312, "global_step": 92269, "epoch": 1111} {"train_loss": -21.757339477539062, "global_step": 92270, "epoch": 1111} {"train_loss": -21.71531867980957, "global_step": 92271, "epoch": 1111} {"train_loss": -21.838350296020508, "global_step": 92272, "epoch": 1111} {"train_loss": -21.797513961791992, "global_step": 92273, "epoch": 1111} {"train_loss": -21.890483856201172, "global_step": 92274, "epoch": 1111} {"train_loss": -21.7032527923584, "global_step": 92275, "epoch": 1111} {"train_loss": -21.748594284057617, "global_step": 92276, "epoch": 1111} {"train_loss": -21.826568603515625, "global_step": 92277, "epoch": 1111} {"train_loss": -21.797000885009766, "global_step": 92278, "epoch": 1111} {"train_loss": -21.459762573242188, "global_step": 92279, "epoch": 1111} {"train_loss": -21.442230224609375, "global_step": 92280, "epoch": 1111} {"train_loss": -21.556726455688477, "global_step": 92281, "epoch": 1111} {"train_loss": -21.45461082458496, "global_step": 92282, "epoch": 1111} {"train_loss": -21.725967407226562, "global_step": 92283, "epoch": 1111} {"train_loss": -21.366657257080078, "global_step": 92284, "epoch": 1111} {"train_loss": -21.61578941345215, "global_step": 92285, "epoch": 1111} {"train_loss": -21.430801391601562, "global_step": 92286, "epoch": 1111} {"train_loss": -21.501893997192383, "global_step": 92287, "epoch": 1111} {"train_loss": -21.63542938232422, "global_step": 92288, "epoch": 1111} {"train_loss": -21.75851058959961, "global_step": 92289, "epoch": 1111} {"train_loss": -22.155961990356445, "global_step": 92290, "epoch": 1111} {"train_loss": -21.729406356811523, "global_step": 92291, "epoch": 1111} {"train_loss": -21.67483901977539, "global_step": 92292, "epoch": 1111} {"train_loss": -21.65229606628418, "global_step": 92293, "epoch": 1111} {"train_loss": -21.340909957885742, "global_step": 92294, "epoch": 1111} {"train_loss": -21.594156288238892, "global_step": 92295, "epoch": 1111, "val_loss": 6278375.0} {"train_loss": -21.4755859375, "global_step": 92296, "epoch": 1112} {"train_loss": -21.125015258789062, "global_step": 92297, "epoch": 1112} {"train_loss": -21.7832088470459, "global_step": 92298, "epoch": 1112} {"train_loss": -21.265750885009766, "global_step": 92299, "epoch": 1112} {"train_loss": -21.4890193939209, "global_step": 92300, "epoch": 1112} {"train_loss": -21.40010643005371, "global_step": 92301, "epoch": 1112} {"train_loss": -21.73652458190918, "global_step": 92302, "epoch": 1112} {"train_loss": -21.478036880493164, "global_step": 92303, "epoch": 1112} {"train_loss": -21.707378387451172, "global_step": 92304, "epoch": 1112} {"train_loss": -21.383535385131836, "global_step": 92305, "epoch": 1112} {"train_loss": -21.48893165588379, "global_step": 92306, "epoch": 1112} {"train_loss": -21.793798446655273, "global_step": 92307, "epoch": 1112} {"train_loss": -21.59946632385254, "global_step": 92308, "epoch": 1112} {"train_loss": -21.679946899414062, "global_step": 92309, "epoch": 1112} {"train_loss": -21.748640060424805, "global_step": 92310, "epoch": 1112} {"train_loss": -21.69055938720703, "global_step": 92311, "epoch": 1112} {"train_loss": -21.893966674804688, "global_step": 92312, "epoch": 1112} {"train_loss": -21.37891960144043, "global_step": 92313, "epoch": 1112} {"train_loss": -21.50190544128418, "global_step": 92314, "epoch": 1112} {"train_loss": -21.567174911499023, "global_step": 92315, "epoch": 1112} {"train_loss": -21.721336364746094, "global_step": 92316, "epoch": 1112} {"train_loss": -21.8637752532959, "global_step": 92317, "epoch": 1112} {"train_loss": -21.40241813659668, "global_step": 92318, "epoch": 1112} {"train_loss": -22.003005981445312, "global_step": 92319, "epoch": 1112} {"train_loss": -21.732385635375977, "global_step": 92320, "epoch": 1112} {"train_loss": -21.83481788635254, "global_step": 92321, "epoch": 1112} {"train_loss": -21.623151779174805, "global_step": 92322, "epoch": 1112} {"train_loss": -21.73177146911621, "global_step": 92323, "epoch": 1112} {"train_loss": -21.64204216003418, "global_step": 92324, "epoch": 1112} {"train_loss": -21.701757431030273, "global_step": 92325, "epoch": 1112} {"train_loss": -21.900970458984375, "global_step": 92326, "epoch": 1112} {"train_loss": -21.680286407470703, "global_step": 92327, "epoch": 1112} {"train_loss": -21.4532527923584, "global_step": 92328, "epoch": 1112} {"train_loss": -21.474002838134766, "global_step": 92329, "epoch": 1112} {"train_loss": -21.648052215576172, "global_step": 92330, "epoch": 1112} {"train_loss": -21.965164184570312, "global_step": 92331, "epoch": 1112} {"train_loss": -21.213775634765625, "global_step": 92332, "epoch": 1112} {"train_loss": -21.647682189941406, "global_step": 92333, "epoch": 1112} {"train_loss": -21.53165626525879, "global_step": 92334, "epoch": 1112} {"train_loss": -21.49593162536621, "global_step": 92335, "epoch": 1112} {"train_loss": -21.637786865234375, "global_step": 92336, "epoch": 1112} {"train_loss": -21.9759464263916, "global_step": 92337, "epoch": 1112} {"train_loss": -21.59039306640625, "global_step": 92338, "epoch": 1112} {"train_loss": -21.736957550048828, "global_step": 92339, "epoch": 1112} {"train_loss": -21.752761840820312, "global_step": 92340, "epoch": 1112} {"train_loss": -21.589414596557617, "global_step": 92341, "epoch": 1112} {"train_loss": -22.025897979736328, "global_step": 92342, "epoch": 1112} {"train_loss": -22.015104293823242, "global_step": 92343, "epoch": 1112} {"train_loss": -21.816579818725586, "global_step": 92344, "epoch": 1112} {"train_loss": -21.70086097717285, "global_step": 92345, "epoch": 1112} {"train_loss": -21.592138290405273, "global_step": 92346, "epoch": 1112} {"train_loss": -21.876081466674805, "global_step": 92347, "epoch": 1112} {"train_loss": -21.344877243041992, "global_step": 92348, "epoch": 1112} {"train_loss": -21.578107833862305, "global_step": 92349, "epoch": 1112} {"train_loss": -21.836210250854492, "global_step": 92350, "epoch": 1112} {"train_loss": -21.953901290893555, "global_step": 92351, "epoch": 1112} {"train_loss": -21.698991775512695, "global_step": 92352, "epoch": 1112} {"train_loss": -21.846452713012695, "global_step": 92353, "epoch": 1112} {"train_loss": -21.56422996520996, "global_step": 92354, "epoch": 1112} {"train_loss": -21.86294937133789, "global_step": 92355, "epoch": 1112} {"train_loss": -21.568246841430664, "global_step": 92356, "epoch": 1112} {"train_loss": -21.6427059173584, "global_step": 92357, "epoch": 1112} {"train_loss": -21.583784103393555, "global_step": 92358, "epoch": 1112} {"train_loss": -21.813796997070312, "global_step": 92359, "epoch": 1112} {"train_loss": -21.4935245513916, "global_step": 92360, "epoch": 1112} {"train_loss": -21.89290428161621, "global_step": 92361, "epoch": 1112} {"train_loss": -21.428701400756836, "global_step": 92362, "epoch": 1112} {"train_loss": -21.713403701782227, "global_step": 92363, "epoch": 1112} {"train_loss": -21.846487045288086, "global_step": 92364, "epoch": 1112} {"train_loss": -22.02060317993164, "global_step": 92365, "epoch": 1112} {"train_loss": -21.552335739135742, "global_step": 92366, "epoch": 1112} {"train_loss": -21.52739906311035, "global_step": 92367, "epoch": 1112} {"train_loss": -22.050134658813477, "global_step": 92368, "epoch": 1112} {"train_loss": -21.34451675415039, "global_step": 92369, "epoch": 1112} {"train_loss": -21.57706069946289, "global_step": 92370, "epoch": 1112} {"train_loss": -21.69718360900879, "global_step": 92371, "epoch": 1112} {"train_loss": -21.85895538330078, "global_step": 92372, "epoch": 1112} {"train_loss": -21.672029495239258, "global_step": 92373, "epoch": 1112} {"train_loss": -21.4600830078125, "global_step": 92374, "epoch": 1112} {"train_loss": -21.991498947143555, "global_step": 92375, "epoch": 1112} {"train_loss": -21.30903434753418, "global_step": 92376, "epoch": 1112} {"train_loss": -21.853342056274414, "global_step": 92377, "epoch": 1112} {"train_loss": -21.678814279027733, "global_step": 92378, "epoch": 1112, "val_loss": 6184416.5} {"train_loss": -20.775634765625, "global_step": 92379, "epoch": 1113} {"train_loss": -20.424711227416992, "global_step": 92380, "epoch": 1113} {"train_loss": -21.31081771850586, "global_step": 92381, "epoch": 1113} {"train_loss": -20.783681869506836, "global_step": 92382, "epoch": 1113} {"train_loss": -21.331586837768555, "global_step": 92383, "epoch": 1113} {"train_loss": -21.0258731842041, "global_step": 92384, "epoch": 1113} {"train_loss": -21.237699508666992, "global_step": 92385, "epoch": 1113} {"train_loss": -21.194067001342773, "global_step": 92386, "epoch": 1113} {"train_loss": -20.940954208374023, "global_step": 92387, "epoch": 1113} {"train_loss": -21.60397720336914, "global_step": 92388, "epoch": 1113} {"train_loss": -21.324811935424805, "global_step": 92389, "epoch": 1113} {"train_loss": -21.597171783447266, "global_step": 92390, "epoch": 1113} {"train_loss": -21.322555541992188, "global_step": 92391, "epoch": 1113} {"train_loss": -21.35268211364746, "global_step": 92392, "epoch": 1113} {"train_loss": -21.27578353881836, "global_step": 92393, "epoch": 1113} {"train_loss": -21.167484283447266, "global_step": 92394, "epoch": 1113} {"train_loss": -21.608200073242188, "global_step": 92395, "epoch": 1113} {"train_loss": -21.451923370361328, "global_step": 92396, "epoch": 1113} {"train_loss": -21.605159759521484, "global_step": 92397, "epoch": 1113} {"train_loss": -21.63299560546875, "global_step": 92398, "epoch": 1113} {"train_loss": -21.2117862701416, "global_step": 92399, "epoch": 1113} {"train_loss": -21.38026237487793, "global_step": 92400, "epoch": 1113} {"train_loss": -21.378469467163086, "global_step": 92401, "epoch": 1113} {"train_loss": -21.387853622436523, "global_step": 92402, "epoch": 1113} {"train_loss": -21.79474449157715, "global_step": 92403, "epoch": 1113} {"train_loss": -21.51947021484375, "global_step": 92404, "epoch": 1113} {"train_loss": -21.854829788208008, "global_step": 92405, "epoch": 1113} {"train_loss": -21.818618774414062, "global_step": 92406, "epoch": 1113} {"train_loss": -21.783842086791992, "global_step": 92407, "epoch": 1113} {"train_loss": -21.874486923217773, "global_step": 92408, "epoch": 1113} {"train_loss": -21.77089500427246, "global_step": 92409, "epoch": 1113} {"train_loss": -21.34592628479004, "global_step": 92410, "epoch": 1113} {"train_loss": -21.582477569580078, "global_step": 92411, "epoch": 1113} {"train_loss": -21.979434967041016, "global_step": 92412, "epoch": 1113} {"train_loss": -21.58661460876465, "global_step": 92413, "epoch": 1113} {"train_loss": -21.741378784179688, "global_step": 92414, "epoch": 1113} {"train_loss": -22.018604278564453, "global_step": 92415, "epoch": 1113} {"train_loss": -21.390897750854492, "global_step": 92416, "epoch": 1113} {"train_loss": -21.65806007385254, "global_step": 92417, "epoch": 1113} {"train_loss": -21.67068099975586, "global_step": 92418, "epoch": 1113} {"train_loss": -21.246267318725586, "global_step": 92419, "epoch": 1113} {"train_loss": -21.43281364440918, "global_step": 92420, "epoch": 1113} {"train_loss": -21.871623992919922, "global_step": 92421, "epoch": 1113} {"train_loss": -21.809207916259766, "global_step": 92422, "epoch": 1113} {"train_loss": -21.4281005859375, "global_step": 92423, "epoch": 1113} {"train_loss": -21.47456169128418, "global_step": 92424, "epoch": 1113} {"train_loss": -21.561756134033203, "global_step": 92425, "epoch": 1113} {"train_loss": -21.77798843383789, "global_step": 92426, "epoch": 1113} {"train_loss": -21.51236915588379, "global_step": 92427, "epoch": 1113} {"train_loss": -21.522815704345703, "global_step": 92428, "epoch": 1113} {"train_loss": -21.766040802001953, "global_step": 92429, "epoch": 1113} {"train_loss": -21.43015480041504, "global_step": 92430, "epoch": 1113} {"train_loss": -21.466535568237305, "global_step": 92431, "epoch": 1113} {"train_loss": -21.958425521850586, "global_step": 92432, "epoch": 1113} {"train_loss": -21.65485382080078, "global_step": 92433, "epoch": 1113} {"train_loss": -21.875072479248047, "global_step": 92434, "epoch": 1113} {"train_loss": -21.76778221130371, "global_step": 92435, "epoch": 1113} {"train_loss": -22.127899169921875, "global_step": 92436, "epoch": 1113} {"train_loss": -21.442873001098633, "global_step": 92437, "epoch": 1113} {"train_loss": -21.904699325561523, "global_step": 92438, "epoch": 1113} {"train_loss": -21.7281436920166, "global_step": 92439, "epoch": 1113} {"train_loss": -21.79549217224121, "global_step": 92440, "epoch": 1113} {"train_loss": -21.8458194732666, "global_step": 92441, "epoch": 1113} {"train_loss": -21.646860122680664, "global_step": 92442, "epoch": 1113} {"train_loss": -21.673608779907227, "global_step": 92443, "epoch": 1113} {"train_loss": -21.740768432617188, "global_step": 92444, "epoch": 1113} {"train_loss": -21.63570213317871, "global_step": 92445, "epoch": 1113} {"train_loss": -21.296648025512695, "global_step": 92446, "epoch": 1113} {"train_loss": -21.872787475585938, "global_step": 92447, "epoch": 1113} {"train_loss": -21.876344680786133, "global_step": 92448, "epoch": 1113} {"train_loss": -21.378787994384766, "global_step": 92449, "epoch": 1113} {"train_loss": -21.50487518310547, "global_step": 92450, "epoch": 1113} {"train_loss": -21.5540828704834, "global_step": 92451, "epoch": 1113} {"train_loss": -21.138635635375977, "global_step": 92452, "epoch": 1113} {"train_loss": -21.93123435974121, "global_step": 92453, "epoch": 1113} {"train_loss": -21.78372573852539, "global_step": 92454, "epoch": 1113} {"train_loss": -21.59447479248047, "global_step": 92455, "epoch": 1113} {"train_loss": -21.756696701049805, "global_step": 92456, "epoch": 1113} {"train_loss": -21.528074264526367, "global_step": 92457, "epoch": 1113} {"train_loss": -21.246057510375977, "global_step": 92458, "epoch": 1113} {"train_loss": -21.272729873657227, "global_step": 92459, "epoch": 1113} {"train_loss": -21.666757583618164, "global_step": 92460, "epoch": 1113} {"train_loss": -21.540937262845326, "global_step": 92461, "epoch": 1113, "val_loss": 6169261.0} {"train_loss": -21.654020309448242, "global_step": 92462, "epoch": 1114} {"train_loss": -21.413427352905273, "global_step": 92463, "epoch": 1114} {"train_loss": -21.7252254486084, "global_step": 92464, "epoch": 1114} {"train_loss": -21.224592208862305, "global_step": 92465, "epoch": 1114} {"train_loss": -21.28952980041504, "global_step": 92466, "epoch": 1114} {"train_loss": -21.70297622680664, "global_step": 92467, "epoch": 1114} {"train_loss": -21.39275360107422, "global_step": 92468, "epoch": 1114} {"train_loss": -21.649721145629883, "global_step": 92469, "epoch": 1114} {"train_loss": -21.761938095092773, "global_step": 92470, "epoch": 1114} {"train_loss": -22.025421142578125, "global_step": 92471, "epoch": 1114} {"train_loss": -21.555400848388672, "global_step": 92472, "epoch": 1114} {"train_loss": -21.49713134765625, "global_step": 92473, "epoch": 1114} {"train_loss": -21.96675682067871, "global_step": 92474, "epoch": 1114} {"train_loss": -21.711009979248047, "global_step": 92475, "epoch": 1114} {"train_loss": -21.274702072143555, "global_step": 92476, "epoch": 1114} {"train_loss": -21.732595443725586, "global_step": 92477, "epoch": 1114} {"train_loss": -21.75356101989746, "global_step": 92478, "epoch": 1114} {"train_loss": -21.5914249420166, "global_step": 92479, "epoch": 1114} {"train_loss": -21.835981369018555, "global_step": 92480, "epoch": 1114} {"train_loss": -21.70250701904297, "global_step": 92481, "epoch": 1114} {"train_loss": -21.75223731994629, "global_step": 92482, "epoch": 1114} {"train_loss": -21.982358932495117, "global_step": 92483, "epoch": 1114} {"train_loss": -21.213918685913086, "global_step": 92484, "epoch": 1114} {"train_loss": -21.654817581176758, "global_step": 92485, "epoch": 1114} {"train_loss": -21.474712371826172, "global_step": 92486, "epoch": 1114} {"train_loss": -21.88935661315918, "global_step": 92487, "epoch": 1114} {"train_loss": -21.885343551635742, "global_step": 92488, "epoch": 1114} {"train_loss": -21.461380004882812, "global_step": 92489, "epoch": 1114} {"train_loss": -21.725128173828125, "global_step": 92490, "epoch": 1114} {"train_loss": -21.853225708007812, "global_step": 92491, "epoch": 1114} {"train_loss": -21.771909713745117, "global_step": 92492, "epoch": 1114} {"train_loss": -21.941452026367188, "global_step": 92493, "epoch": 1114} {"train_loss": -21.398296356201172, "global_step": 92494, "epoch": 1114} {"train_loss": -21.50884437561035, "global_step": 92495, "epoch": 1114} {"train_loss": -21.945682525634766, "global_step": 92496, "epoch": 1114} {"train_loss": -21.730533599853516, "global_step": 92497, "epoch": 1114} {"train_loss": -21.69584083557129, "global_step": 92498, "epoch": 1114} {"train_loss": -21.705366134643555, "global_step": 92499, "epoch": 1114} {"train_loss": -21.429838180541992, "global_step": 92500, "epoch": 1114} {"train_loss": -21.538053512573242, "global_step": 92501, "epoch": 1114} {"train_loss": -21.830554962158203, "global_step": 92502, "epoch": 1114} {"train_loss": -21.45009422302246, "global_step": 92503, "epoch": 1114} {"train_loss": -21.78641700744629, "global_step": 92504, "epoch": 1114} {"train_loss": -21.755910873413086, "global_step": 92505, "epoch": 1114} {"train_loss": -21.749998092651367, "global_step": 92506, "epoch": 1114} {"train_loss": -21.673961639404297, "global_step": 92507, "epoch": 1114} {"train_loss": -21.78958511352539, "global_step": 92508, "epoch": 1114} {"train_loss": -21.756813049316406, "global_step": 92509, "epoch": 1114} {"train_loss": -21.88763999938965, "global_step": 92510, "epoch": 1114} {"train_loss": -21.621585845947266, "global_step": 92511, "epoch": 1114} {"train_loss": -21.72030258178711, "global_step": 92512, "epoch": 1114} {"train_loss": -21.921377182006836, "global_step": 92513, "epoch": 1114} {"train_loss": -21.729293823242188, "global_step": 92514, "epoch": 1114} {"train_loss": -21.773908615112305, "global_step": 92515, "epoch": 1114} {"train_loss": -21.620222091674805, "global_step": 92516, "epoch": 1114} {"train_loss": -21.601181030273438, "global_step": 92517, "epoch": 1114} {"train_loss": -21.6488094329834, "global_step": 92518, "epoch": 1114} {"train_loss": -21.99360466003418, "global_step": 92519, "epoch": 1114} {"train_loss": -21.888427734375, "global_step": 92520, "epoch": 1114} {"train_loss": -21.77443504333496, "global_step": 92521, "epoch": 1114} {"train_loss": -21.580280303955078, "global_step": 92522, "epoch": 1114} {"train_loss": -21.829030990600586, "global_step": 92523, "epoch": 1114} {"train_loss": -21.60418128967285, "global_step": 92524, "epoch": 1114} {"train_loss": -21.71076774597168, "global_step": 92525, "epoch": 1114} {"train_loss": -22.016529083251953, "global_step": 92526, "epoch": 1114} {"train_loss": -21.599332809448242, "global_step": 92527, "epoch": 1114} {"train_loss": -21.560205459594727, "global_step": 92528, "epoch": 1114} {"train_loss": -21.628000259399414, "global_step": 92529, "epoch": 1114} {"train_loss": -21.963136672973633, "global_step": 92530, "epoch": 1114} {"train_loss": -21.932109832763672, "global_step": 92531, "epoch": 1114} {"train_loss": -21.620004653930664, "global_step": 92532, "epoch": 1114} {"train_loss": -21.94292640686035, "global_step": 92533, "epoch": 1114} {"train_loss": -21.90741729736328, "global_step": 92534, "epoch": 1114} {"train_loss": -21.8577938079834, "global_step": 92535, "epoch": 1114} {"train_loss": -21.748512268066406, "global_step": 92536, "epoch": 1114} {"train_loss": -22.102659225463867, "global_step": 92537, "epoch": 1114} {"train_loss": -21.80849266052246, "global_step": 92538, "epoch": 1114} {"train_loss": -21.251272201538086, "global_step": 92539, "epoch": 1114} {"train_loss": -21.25420570373535, "global_step": 92540, "epoch": 1114} {"train_loss": -21.467086791992188, "global_step": 92541, "epoch": 1114} {"train_loss": -21.857593536376953, "global_step": 92542, "epoch": 1114} {"train_loss": -21.188013076782227, "global_step": 92543, "epoch": 1114} {"train_loss": -21.691070051078338, "global_step": 92544, "epoch": 1114, "val_loss": 5960663.5} {"train_loss": -21.8618106842041, "global_step": 92545, "epoch": 1115} {"train_loss": -21.398900985717773, "global_step": 92546, "epoch": 1115} {"train_loss": -21.53558921813965, "global_step": 92547, "epoch": 1115} {"train_loss": -20.81515121459961, "global_step": 92548, "epoch": 1115} {"train_loss": -21.79217529296875, "global_step": 92549, "epoch": 1115} {"train_loss": -21.560510635375977, "global_step": 92550, "epoch": 1115} {"train_loss": -21.07863426208496, "global_step": 92551, "epoch": 1115} {"train_loss": -21.520055770874023, "global_step": 92552, "epoch": 1115} {"train_loss": -21.56969451904297, "global_step": 92553, "epoch": 1115} {"train_loss": -21.26033592224121, "global_step": 92554, "epoch": 1115} {"train_loss": -21.901891708374023, "global_step": 92555, "epoch": 1115} {"train_loss": -21.482954025268555, "global_step": 92556, "epoch": 1115} {"train_loss": -21.57332992553711, "global_step": 92557, "epoch": 1115} {"train_loss": -21.559621810913086, "global_step": 92558, "epoch": 1115} {"train_loss": -21.404958724975586, "global_step": 92559, "epoch": 1115} {"train_loss": -21.3760986328125, "global_step": 92560, "epoch": 1115} {"train_loss": -21.4563045501709, "global_step": 92561, "epoch": 1115} {"train_loss": -21.659143447875977, "global_step": 92562, "epoch": 1115} {"train_loss": -21.60300636291504, "global_step": 92563, "epoch": 1115} {"train_loss": -21.596601486206055, "global_step": 92564, "epoch": 1115} {"train_loss": -21.814416885375977, "global_step": 92565, "epoch": 1115} {"train_loss": -21.988435745239258, "global_step": 92566, "epoch": 1115} {"train_loss": -21.387372970581055, "global_step": 92567, "epoch": 1115} {"train_loss": -21.24698257446289, "global_step": 92568, "epoch": 1115} {"train_loss": -21.46897315979004, "global_step": 92569, "epoch": 1115} {"train_loss": -21.686172485351562, "global_step": 92570, "epoch": 1115} {"train_loss": -21.891376495361328, "global_step": 92571, "epoch": 1115} {"train_loss": -21.297636032104492, "global_step": 92572, "epoch": 1115} {"train_loss": -21.504423141479492, "global_step": 92573, "epoch": 1115} {"train_loss": -21.5377197265625, "global_step": 92574, "epoch": 1115} {"train_loss": -21.45475196838379, "global_step": 92575, "epoch": 1115} {"train_loss": -22.08073616027832, "global_step": 92576, "epoch": 1115} {"train_loss": -21.491830825805664, "global_step": 92577, "epoch": 1115} {"train_loss": -21.4278507232666, "global_step": 92578, "epoch": 1115} {"train_loss": -22.111621856689453, "global_step": 92579, "epoch": 1115} {"train_loss": -21.388219833374023, "global_step": 92580, "epoch": 1115} {"train_loss": -21.819034576416016, "global_step": 92581, "epoch": 1115} {"train_loss": -21.553466796875, "global_step": 92582, "epoch": 1115} {"train_loss": -21.795276641845703, "global_step": 92583, "epoch": 1115} {"train_loss": -21.806615829467773, "global_step": 92584, "epoch": 1115} {"train_loss": -21.468887329101562, "global_step": 92585, "epoch": 1115} {"train_loss": -22.10451316833496, "global_step": 92586, "epoch": 1115} {"train_loss": -21.574527740478516, "global_step": 92587, "epoch": 1115} {"train_loss": -21.68079948425293, "global_step": 92588, "epoch": 1115} {"train_loss": -21.470460891723633, "global_step": 92589, "epoch": 1115} {"train_loss": -21.62217903137207, "global_step": 92590, "epoch": 1115} {"train_loss": -21.956586837768555, "global_step": 92591, "epoch": 1115} {"train_loss": -21.93738555908203, "global_step": 92592, "epoch": 1115} {"train_loss": -21.295120239257812, "global_step": 92593, "epoch": 1115} {"train_loss": -21.526399612426758, "global_step": 92594, "epoch": 1115} {"train_loss": -21.771930694580078, "global_step": 92595, "epoch": 1115} {"train_loss": -21.293611526489258, "global_step": 92596, "epoch": 1115} {"train_loss": -21.582548141479492, "global_step": 92597, "epoch": 1115} {"train_loss": -21.745174407958984, "global_step": 92598, "epoch": 1115} {"train_loss": -21.534042358398438, "global_step": 92599, "epoch": 1115} {"train_loss": -21.494537353515625, "global_step": 92600, "epoch": 1115} {"train_loss": -21.57774543762207, "global_step": 92601, "epoch": 1115} {"train_loss": -21.33873176574707, "global_step": 92602, "epoch": 1115} {"train_loss": -21.804141998291016, "global_step": 92603, "epoch": 1115} {"train_loss": -21.87748146057129, "global_step": 92604, "epoch": 1115} {"train_loss": -21.632678985595703, "global_step": 92605, "epoch": 1115} {"train_loss": -21.72601318359375, "global_step": 92606, "epoch": 1115} {"train_loss": -21.9190616607666, "global_step": 92607, "epoch": 1115} {"train_loss": -21.716150283813477, "global_step": 92608, "epoch": 1115} {"train_loss": -21.697912216186523, "global_step": 92609, "epoch": 1115} {"train_loss": -21.64695167541504, "global_step": 92610, "epoch": 1115} {"train_loss": -21.767980575561523, "global_step": 92611, "epoch": 1115} {"train_loss": -21.682363510131836, "global_step": 92612, "epoch": 1115} {"train_loss": -21.919408798217773, "global_step": 92613, "epoch": 1115} {"train_loss": -21.734312057495117, "global_step": 92614, "epoch": 1115} {"train_loss": -21.699718475341797, "global_step": 92615, "epoch": 1115} {"train_loss": -21.68020248413086, "global_step": 92616, "epoch": 1115} {"train_loss": -21.85863494873047, "global_step": 92617, "epoch": 1115} {"train_loss": -21.981027603149414, "global_step": 92618, "epoch": 1115} {"train_loss": -21.861238479614258, "global_step": 92619, "epoch": 1115} {"train_loss": -21.725738525390625, "global_step": 92620, "epoch": 1115} {"train_loss": -21.6752986907959, "global_step": 92621, "epoch": 1115} {"train_loss": -21.52147674560547, "global_step": 92622, "epoch": 1115} {"train_loss": -21.778249740600586, "global_step": 92623, "epoch": 1115} {"train_loss": -21.7302303314209, "global_step": 92624, "epoch": 1115} {"train_loss": -21.86240577697754, "global_step": 92625, "epoch": 1115} {"train_loss": -21.642675399780273, "global_step": 92626, "epoch": 1115} {"train_loss": -21.644713712025837, "global_step": 92627, "epoch": 1115, "val_loss": 6171854.0} {"train_loss": -21.356481552124023, "global_step": 92628, "epoch": 1116} {"train_loss": -21.229108810424805, "global_step": 92629, "epoch": 1116} {"train_loss": -21.21034812927246, "global_step": 92630, "epoch": 1116} {"train_loss": -21.055997848510742, "global_step": 92631, "epoch": 1116} {"train_loss": -21.463153839111328, "global_step": 92632, "epoch": 1116} {"train_loss": -21.559537887573242, "global_step": 92633, "epoch": 1116} {"train_loss": -21.183034896850586, "global_step": 92634, "epoch": 1116} {"train_loss": -21.681447982788086, "global_step": 92635, "epoch": 1116} {"train_loss": -21.548349380493164, "global_step": 92636, "epoch": 1116} {"train_loss": -21.514047622680664, "global_step": 92637, "epoch": 1116} {"train_loss": -21.598901748657227, "global_step": 92638, "epoch": 1116} {"train_loss": -21.319490432739258, "global_step": 92639, "epoch": 1116} {"train_loss": -21.587766647338867, "global_step": 92640, "epoch": 1116} {"train_loss": -21.68064308166504, "global_step": 92641, "epoch": 1116} {"train_loss": -21.6683406829834, "global_step": 92642, "epoch": 1116} {"train_loss": -21.46595573425293, "global_step": 92643, "epoch": 1116} {"train_loss": -21.672021865844727, "global_step": 92644, "epoch": 1116} {"train_loss": -21.458953857421875, "global_step": 92645, "epoch": 1116} {"train_loss": -21.51314353942871, "global_step": 92646, "epoch": 1116} {"train_loss": -21.321027755737305, "global_step": 92647, "epoch": 1116} {"train_loss": -21.694067001342773, "global_step": 92648, "epoch": 1116} {"train_loss": -21.478017807006836, "global_step": 92649, "epoch": 1116} {"train_loss": -21.247522354125977, "global_step": 92650, "epoch": 1116} {"train_loss": -21.419702529907227, "global_step": 92651, "epoch": 1116} {"train_loss": -21.310415267944336, "global_step": 92652, "epoch": 1116} {"train_loss": -21.28171157836914, "global_step": 92653, "epoch": 1116} {"train_loss": -21.854459762573242, "global_step": 92654, "epoch": 1116} {"train_loss": -21.69990348815918, "global_step": 92655, "epoch": 1116} {"train_loss": -21.725345611572266, "global_step": 92656, "epoch": 1116} {"train_loss": -21.783950805664062, "global_step": 92657, "epoch": 1116} {"train_loss": -21.784645080566406, "global_step": 92658, "epoch": 1116} {"train_loss": -21.51775360107422, "global_step": 92659, "epoch": 1116} {"train_loss": -21.727890014648438, "global_step": 92660, "epoch": 1116} {"train_loss": -21.550798416137695, "global_step": 92661, "epoch": 1116} {"train_loss": -22.06075096130371, "global_step": 92662, "epoch": 1116} {"train_loss": -21.49555778503418, "global_step": 92663, "epoch": 1116} {"train_loss": -21.75716209411621, "global_step": 92664, "epoch": 1116} {"train_loss": -21.679168701171875, "global_step": 92665, "epoch": 1116} {"train_loss": -21.826908111572266, "global_step": 92666, "epoch": 1116} {"train_loss": -21.685382843017578, "global_step": 92667, "epoch": 1116} {"train_loss": -21.94571304321289, "global_step": 92668, "epoch": 1116} {"train_loss": -21.779342651367188, "global_step": 92669, "epoch": 1116} {"train_loss": -21.302892684936523, "global_step": 92670, "epoch": 1116} {"train_loss": -21.664337158203125, "global_step": 92671, "epoch": 1116} {"train_loss": -21.85691261291504, "global_step": 92672, "epoch": 1116} {"train_loss": -21.7100830078125, "global_step": 92673, "epoch": 1116} {"train_loss": -21.52753257751465, "global_step": 92674, "epoch": 1116} {"train_loss": -21.6823787689209, "global_step": 92675, "epoch": 1116} {"train_loss": -21.753013610839844, "global_step": 92676, "epoch": 1116} {"train_loss": -21.930892944335938, "global_step": 92677, "epoch": 1116} {"train_loss": -21.282129287719727, "global_step": 92678, "epoch": 1116} {"train_loss": -21.71494483947754, "global_step": 92679, "epoch": 1116} {"train_loss": -21.573287963867188, "global_step": 92680, "epoch": 1116} {"train_loss": -21.777482986450195, "global_step": 92681, "epoch": 1116} {"train_loss": -21.60941505432129, "global_step": 92682, "epoch": 1116} {"train_loss": -21.979278564453125, "global_step": 92683, "epoch": 1116} {"train_loss": -21.671438217163086, "global_step": 92684, "epoch": 1116} {"train_loss": -21.674692153930664, "global_step": 92685, "epoch": 1116} {"train_loss": -22.062597274780273, "global_step": 92686, "epoch": 1116} {"train_loss": -21.91534996032715, "global_step": 92687, "epoch": 1116} {"train_loss": -21.71092414855957, "global_step": 92688, "epoch": 1116} {"train_loss": -21.5301513671875, "global_step": 92689, "epoch": 1116} {"train_loss": -21.534059524536133, "global_step": 92690, "epoch": 1116} {"train_loss": -22.073217391967773, "global_step": 92691, "epoch": 1116} {"train_loss": -21.407320022583008, "global_step": 92692, "epoch": 1116} {"train_loss": -22.17734718322754, "global_step": 92693, "epoch": 1116} {"train_loss": -21.82676124572754, "global_step": 92694, "epoch": 1116} {"train_loss": -20.9697265625, "global_step": 92695, "epoch": 1116} {"train_loss": -21.638757705688477, "global_step": 92696, "epoch": 1116} {"train_loss": -21.482864379882812, "global_step": 92697, "epoch": 1116} {"train_loss": -21.53461265563965, "global_step": 92698, "epoch": 1116} {"train_loss": -21.660396575927734, "global_step": 92699, "epoch": 1116} {"train_loss": -21.469924926757812, "global_step": 92700, "epoch": 1116} {"train_loss": -21.799463272094727, "global_step": 92701, "epoch": 1116} {"train_loss": -21.711061477661133, "global_step": 92702, "epoch": 1116} {"train_loss": -21.82054328918457, "global_step": 92703, "epoch": 1116} {"train_loss": -21.638504028320312, "global_step": 92704, "epoch": 1116} {"train_loss": -21.450233459472656, "global_step": 92705, "epoch": 1116} {"train_loss": -21.92078971862793, "global_step": 92706, "epoch": 1116} {"train_loss": -21.81854820251465, "global_step": 92707, "epoch": 1116} {"train_loss": -21.637714385986328, "global_step": 92708, "epoch": 1116} {"train_loss": -21.626005172729492, "global_step": 92709, "epoch": 1116} {"train_loss": -21.624377537922687, "global_step": 92710, "epoch": 1116, "val_loss": 6171324.5} {"train_loss": -21.4810733795166, "global_step": 92711, "epoch": 1117} {"train_loss": -21.09309959411621, "global_step": 92712, "epoch": 1117} {"train_loss": -21.519489288330078, "global_step": 92713, "epoch": 1117} {"train_loss": -21.324459075927734, "global_step": 92714, "epoch": 1117} {"train_loss": -21.158445358276367, "global_step": 92715, "epoch": 1117} {"train_loss": -21.598371505737305, "global_step": 92716, "epoch": 1117} {"train_loss": -21.35645866394043, "global_step": 92717, "epoch": 1117} {"train_loss": -21.371023178100586, "global_step": 92718, "epoch": 1117} {"train_loss": -21.89592742919922, "global_step": 92719, "epoch": 1117} {"train_loss": -21.592145919799805, "global_step": 92720, "epoch": 1117} {"train_loss": -21.21198081970215, "global_step": 92721, "epoch": 1117} {"train_loss": -21.566177368164062, "global_step": 92722, "epoch": 1117} {"train_loss": -21.45172882080078, "global_step": 92723, "epoch": 1117} {"train_loss": -21.74629783630371, "global_step": 92724, "epoch": 1117} {"train_loss": -21.5252742767334, "global_step": 92725, "epoch": 1117} {"train_loss": -21.769914627075195, "global_step": 92726, "epoch": 1117} {"train_loss": -21.087646484375, "global_step": 92727, "epoch": 1117} {"train_loss": -21.596115112304688, "global_step": 92728, "epoch": 1117} {"train_loss": -21.631975173950195, "global_step": 92729, "epoch": 1117} {"train_loss": -21.624393463134766, "global_step": 92730, "epoch": 1117} {"train_loss": -21.260805130004883, "global_step": 92731, "epoch": 1117} {"train_loss": -21.425661087036133, "global_step": 92732, "epoch": 1117} {"train_loss": -21.630102157592773, "global_step": 92733, "epoch": 1117} {"train_loss": -21.6208553314209, "global_step": 92734, "epoch": 1117} {"train_loss": -21.83853530883789, "global_step": 92735, "epoch": 1117} {"train_loss": -21.720062255859375, "global_step": 92736, "epoch": 1117} {"train_loss": -21.68294334411621, "global_step": 92737, "epoch": 1117} {"train_loss": -21.689533233642578, "global_step": 92738, "epoch": 1117} {"train_loss": -21.690195083618164, "global_step": 92739, "epoch": 1117} {"train_loss": -21.389053344726562, "global_step": 92740, "epoch": 1117} {"train_loss": -21.738248825073242, "global_step": 92741, "epoch": 1117} {"train_loss": -21.801977157592773, "global_step": 92742, "epoch": 1117} {"train_loss": -21.699766159057617, "global_step": 92743, "epoch": 1117} {"train_loss": -21.812475204467773, "global_step": 92744, "epoch": 1117} {"train_loss": -21.80559539794922, "global_step": 92745, "epoch": 1117} {"train_loss": -21.81413459777832, "global_step": 92746, "epoch": 1117} {"train_loss": -21.714252471923828, "global_step": 92747, "epoch": 1117} {"train_loss": -21.999303817749023, "global_step": 92748, "epoch": 1117} {"train_loss": -21.865427017211914, "global_step": 92749, "epoch": 1117} {"train_loss": -21.60906982421875, "global_step": 92750, "epoch": 1117} {"train_loss": -21.59126853942871, "global_step": 92751, "epoch": 1117} {"train_loss": -21.434032440185547, "global_step": 92752, "epoch": 1117} {"train_loss": -21.662275314331055, "global_step": 92753, "epoch": 1117} {"train_loss": -22.065567016601562, "global_step": 92754, "epoch": 1117} {"train_loss": -21.485715866088867, "global_step": 92755, "epoch": 1117} {"train_loss": -21.621936798095703, "global_step": 92756, "epoch": 1117} {"train_loss": -21.767683029174805, "global_step": 92757, "epoch": 1117} {"train_loss": -21.610410690307617, "global_step": 92758, "epoch": 1117} {"train_loss": -21.840425491333008, "global_step": 92759, "epoch": 1117} {"train_loss": -21.525835037231445, "global_step": 92760, "epoch": 1117} {"train_loss": -21.787519454956055, "global_step": 92761, "epoch": 1117} {"train_loss": -21.230016708374023, "global_step": 92762, "epoch": 1117} {"train_loss": -21.666528701782227, "global_step": 92763, "epoch": 1117} {"train_loss": -21.644275665283203, "global_step": 92764, "epoch": 1117} {"train_loss": -21.12466812133789, "global_step": 92765, "epoch": 1117} {"train_loss": -21.707929611206055, "global_step": 92766, "epoch": 1117} {"train_loss": -21.71044921875, "global_step": 92767, "epoch": 1117} {"train_loss": -21.281675338745117, "global_step": 92768, "epoch": 1117} {"train_loss": -21.920713424682617, "global_step": 92769, "epoch": 1117} {"train_loss": -21.559825897216797, "global_step": 92770, "epoch": 1117} {"train_loss": -21.425220489501953, "global_step": 92771, "epoch": 1117} {"train_loss": -22.009992599487305, "global_step": 92772, "epoch": 1117} {"train_loss": -21.289546966552734, "global_step": 92773, "epoch": 1117} {"train_loss": -21.66554069519043, "global_step": 92774, "epoch": 1117} {"train_loss": -21.724227905273438, "global_step": 92775, "epoch": 1117} {"train_loss": -21.774168014526367, "global_step": 92776, "epoch": 1117} {"train_loss": -21.394208908081055, "global_step": 92777, "epoch": 1117} {"train_loss": -21.70990562438965, "global_step": 92778, "epoch": 1117} {"train_loss": -21.462879180908203, "global_step": 92779, "epoch": 1117} {"train_loss": -21.568771362304688, "global_step": 92780, "epoch": 1117} {"train_loss": -21.86874771118164, "global_step": 92781, "epoch": 1117} {"train_loss": -21.61131477355957, "global_step": 92782, "epoch": 1117} {"train_loss": -21.790327072143555, "global_step": 92783, "epoch": 1117} {"train_loss": -21.500905990600586, "global_step": 92784, "epoch": 1117} {"train_loss": -21.77908706665039, "global_step": 92785, "epoch": 1117} {"train_loss": -21.470094680786133, "global_step": 92786, "epoch": 1117} {"train_loss": -21.72821617126465, "global_step": 92787, "epoch": 1117} {"train_loss": -21.390867233276367, "global_step": 92788, "epoch": 1117} {"train_loss": -21.84588050842285, "global_step": 92789, "epoch": 1117} {"train_loss": -22.003036499023438, "global_step": 92790, "epoch": 1117} {"train_loss": -21.612716674804688, "global_step": 92791, "epoch": 1117} {"train_loss": -21.583280563354492, "global_step": 92792, "epoch": 1117} {"train_loss": -21.604909161487257, "global_step": 92793, "epoch": 1117, "val_loss": 6200110.5} {"train_loss": -21.683837890625, "global_step": 92794, "epoch": 1118} {"train_loss": -21.411270141601562, "global_step": 92795, "epoch": 1118} {"train_loss": -21.435836791992188, "global_step": 92796, "epoch": 1118} {"train_loss": -21.66545867919922, "global_step": 92797, "epoch": 1118} {"train_loss": -21.434446334838867, "global_step": 92798, "epoch": 1118} {"train_loss": -21.654911041259766, "global_step": 92799, "epoch": 1118} {"train_loss": -21.703325271606445, "global_step": 92800, "epoch": 1118} {"train_loss": -21.340845108032227, "global_step": 92801, "epoch": 1118} {"train_loss": -21.5686092376709, "global_step": 92802, "epoch": 1118} {"train_loss": -21.7735538482666, "global_step": 92803, "epoch": 1118} {"train_loss": -21.858245849609375, "global_step": 92804, "epoch": 1118} {"train_loss": -21.612768173217773, "global_step": 92805, "epoch": 1118} {"train_loss": -21.368194580078125, "global_step": 92806, "epoch": 1118} {"train_loss": -21.856958389282227, "global_step": 92807, "epoch": 1118} {"train_loss": -21.75860595703125, "global_step": 92808, "epoch": 1118} {"train_loss": -21.84731101989746, "global_step": 92809, "epoch": 1118} {"train_loss": -21.484317779541016, "global_step": 92810, "epoch": 1118} {"train_loss": -21.522144317626953, "global_step": 92811, "epoch": 1118} {"train_loss": -21.542057037353516, "global_step": 92812, "epoch": 1118} {"train_loss": -21.680355072021484, "global_step": 92813, "epoch": 1118} {"train_loss": -21.538774490356445, "global_step": 92814, "epoch": 1118} {"train_loss": -21.66058349609375, "global_step": 92815, "epoch": 1118} {"train_loss": -21.695138931274414, "global_step": 92816, "epoch": 1118} {"train_loss": -21.567270278930664, "global_step": 92817, "epoch": 1118} {"train_loss": -22.106409072875977, "global_step": 92818, "epoch": 1118} {"train_loss": -21.50090217590332, "global_step": 92819, "epoch": 1118} {"train_loss": -21.63962745666504, "global_step": 92820, "epoch": 1118} {"train_loss": -21.648672103881836, "global_step": 92821, "epoch": 1118} {"train_loss": -21.541690826416016, "global_step": 92822, "epoch": 1118} {"train_loss": -22.181821823120117, "global_step": 92823, "epoch": 1118} {"train_loss": -21.71942138671875, "global_step": 92824, "epoch": 1118} {"train_loss": -21.683252334594727, "global_step": 92825, "epoch": 1118} {"train_loss": -21.487014770507812, "global_step": 92826, "epoch": 1118} {"train_loss": -21.496292114257812, "global_step": 92827, "epoch": 1118} {"train_loss": -21.600502014160156, "global_step": 92828, "epoch": 1118} {"train_loss": -21.826595306396484, "global_step": 92829, "epoch": 1118} {"train_loss": -21.52471160888672, "global_step": 92830, "epoch": 1118} {"train_loss": -21.758224487304688, "global_step": 92831, "epoch": 1118} {"train_loss": -21.669599533081055, "global_step": 92832, "epoch": 1118} {"train_loss": -22.07155418395996, "global_step": 92833, "epoch": 1118} {"train_loss": -21.507976531982422, "global_step": 92834, "epoch": 1118} {"train_loss": -21.62651824951172, "global_step": 92835, "epoch": 1118} {"train_loss": -21.58173942565918, "global_step": 92836, "epoch": 1118} {"train_loss": -21.812824249267578, "global_step": 92837, "epoch": 1118} {"train_loss": -21.980283737182617, "global_step": 92838, "epoch": 1118} {"train_loss": -21.610795974731445, "global_step": 92839, "epoch": 1118} {"train_loss": -21.84006118774414, "global_step": 92840, "epoch": 1118} {"train_loss": -21.7593936920166, "global_step": 92841, "epoch": 1118} {"train_loss": -21.998498916625977, "global_step": 92842, "epoch": 1118} {"train_loss": -21.940706253051758, "global_step": 92843, "epoch": 1118} {"train_loss": -21.34169578552246, "global_step": 92844, "epoch": 1118} {"train_loss": -21.709491729736328, "global_step": 92845, "epoch": 1118} {"train_loss": -21.785781860351562, "global_step": 92846, "epoch": 1118} {"train_loss": -21.62579917907715, "global_step": 92847, "epoch": 1118} {"train_loss": -21.523406982421875, "global_step": 92848, "epoch": 1118} {"train_loss": -21.894575119018555, "global_step": 92849, "epoch": 1118} {"train_loss": -21.76490592956543, "global_step": 92850, "epoch": 1118} {"train_loss": -21.495203018188477, "global_step": 92851, "epoch": 1118} {"train_loss": -21.73044776916504, "global_step": 92852, "epoch": 1118} {"train_loss": -22.07330322265625, "global_step": 92853, "epoch": 1118} {"train_loss": -21.1877498626709, "global_step": 92854, "epoch": 1118} {"train_loss": -21.672897338867188, "global_step": 92855, "epoch": 1118} {"train_loss": -21.95942497253418, "global_step": 92856, "epoch": 1118} {"train_loss": -21.631244659423828, "global_step": 92857, "epoch": 1118} {"train_loss": -21.482070922851562, "global_step": 92858, "epoch": 1118} {"train_loss": -22.0313720703125, "global_step": 92859, "epoch": 1118} {"train_loss": -21.711109161376953, "global_step": 92860, "epoch": 1118} {"train_loss": -21.594741821289062, "global_step": 92861, "epoch": 1118} {"train_loss": -21.51095962524414, "global_step": 92862, "epoch": 1118} {"train_loss": -21.6552677154541, "global_step": 92863, "epoch": 1118} {"train_loss": -21.739526748657227, "global_step": 92864, "epoch": 1118} {"train_loss": -21.670312881469727, "global_step": 92865, "epoch": 1118} {"train_loss": -21.85870933532715, "global_step": 92866, "epoch": 1118} {"train_loss": -22.259309768676758, "global_step": 92867, "epoch": 1118} {"train_loss": -21.786319732666016, "global_step": 92868, "epoch": 1118} {"train_loss": -21.635501861572266, "global_step": 92869, "epoch": 1118} {"train_loss": -21.711137771606445, "global_step": 92870, "epoch": 1118} {"train_loss": -21.616994857788086, "global_step": 92871, "epoch": 1118} {"train_loss": -21.40843391418457, "global_step": 92872, "epoch": 1118} {"train_loss": -21.887012481689453, "global_step": 92873, "epoch": 1118} {"train_loss": -21.606687545776367, "global_step": 92874, "epoch": 1118} {"train_loss": -21.741775512695312, "global_step": 92875, "epoch": 1118} {"train_loss": -21.662974254194513, "global_step": 92876, "epoch": 1118, "val_loss": 6014955.0} {"train_loss": -21.148061752319336, "global_step": 92877, "epoch": 1119} {"train_loss": -21.785505294799805, "global_step": 92878, "epoch": 1119} {"train_loss": -21.132291793823242, "global_step": 92879, "epoch": 1119} {"train_loss": -20.73940086364746, "global_step": 92880, "epoch": 1119} {"train_loss": -21.144062042236328, "global_step": 92881, "epoch": 1119} {"train_loss": -21.792871475219727, "global_step": 92882, "epoch": 1119} {"train_loss": -20.783594131469727, "global_step": 92883, "epoch": 1119} {"train_loss": -21.58609962463379, "global_step": 92884, "epoch": 1119} {"train_loss": -21.30148696899414, "global_step": 92885, "epoch": 1119} {"train_loss": -21.409948348999023, "global_step": 92886, "epoch": 1119} {"train_loss": -21.463781356811523, "global_step": 92887, "epoch": 1119} {"train_loss": -21.14922523498535, "global_step": 92888, "epoch": 1119} {"train_loss": -21.41788101196289, "global_step": 92889, "epoch": 1119} {"train_loss": -21.29840660095215, "global_step": 92890, "epoch": 1119} {"train_loss": -21.58780288696289, "global_step": 92891, "epoch": 1119} {"train_loss": -21.72463607788086, "global_step": 92892, "epoch": 1119} {"train_loss": -21.26333999633789, "global_step": 92893, "epoch": 1119} {"train_loss": -21.660696029663086, "global_step": 92894, "epoch": 1119} {"train_loss": -21.40846824645996, "global_step": 92895, "epoch": 1119} {"train_loss": -21.32289695739746, "global_step": 92896, "epoch": 1119} {"train_loss": -21.519338607788086, "global_step": 92897, "epoch": 1119} {"train_loss": -21.681650161743164, "global_step": 92898, "epoch": 1119} {"train_loss": -21.685623168945312, "global_step": 92899, "epoch": 1119} {"train_loss": -21.247655868530273, "global_step": 92900, "epoch": 1119} {"train_loss": -21.569549560546875, "global_step": 92901, "epoch": 1119} {"train_loss": -21.426382064819336, "global_step": 92902, "epoch": 1119} {"train_loss": -21.61037254333496, "global_step": 92903, "epoch": 1119} {"train_loss": -21.427932739257812, "global_step": 92904, "epoch": 1119} {"train_loss": -21.506853103637695, "global_step": 92905, "epoch": 1119} {"train_loss": -21.37717056274414, "global_step": 92906, "epoch": 1119} {"train_loss": -21.81584358215332, "global_step": 92907, "epoch": 1119} {"train_loss": -21.574748992919922, "global_step": 92908, "epoch": 1119} {"train_loss": -21.58511734008789, "global_step": 92909, "epoch": 1119} {"train_loss": -21.826461791992188, "global_step": 92910, "epoch": 1119} {"train_loss": -21.49324607849121, "global_step": 92911, "epoch": 1119} {"train_loss": -21.541662216186523, "global_step": 92912, "epoch": 1119} {"train_loss": -21.693979263305664, "global_step": 92913, "epoch": 1119} {"train_loss": -21.601886749267578, "global_step": 92914, "epoch": 1119} {"train_loss": -21.673290252685547, "global_step": 92915, "epoch": 1119} {"train_loss": -21.492399215698242, "global_step": 92916, "epoch": 1119} {"train_loss": -21.818758010864258, "global_step": 92917, "epoch": 1119} {"train_loss": -21.993560791015625, "global_step": 92918, "epoch": 1119} {"train_loss": -21.75087547302246, "global_step": 92919, "epoch": 1119} {"train_loss": -21.424341201782227, "global_step": 92920, "epoch": 1119} {"train_loss": -21.801258087158203, "global_step": 92921, "epoch": 1119} {"train_loss": -21.308879852294922, "global_step": 92922, "epoch": 1119} {"train_loss": -21.596738815307617, "global_step": 92923, "epoch": 1119} {"train_loss": -21.717580795288086, "global_step": 92924, "epoch": 1119} {"train_loss": -21.551340103149414, "global_step": 92925, "epoch": 1119} {"train_loss": -21.89805030822754, "global_step": 92926, "epoch": 1119} {"train_loss": -21.805648803710938, "global_step": 92927, "epoch": 1119} {"train_loss": -21.774686813354492, "global_step": 92928, "epoch": 1119} {"train_loss": -21.47489356994629, "global_step": 92929, "epoch": 1119} {"train_loss": -21.569046020507812, "global_step": 92930, "epoch": 1119} {"train_loss": -21.654390335083008, "global_step": 92931, "epoch": 1119} {"train_loss": -21.688180923461914, "global_step": 92932, "epoch": 1119} {"train_loss": -21.874683380126953, "global_step": 92933, "epoch": 1119} {"train_loss": -21.6640567779541, "global_step": 92934, "epoch": 1119} {"train_loss": -21.830312728881836, "global_step": 92935, "epoch": 1119} {"train_loss": -21.949481964111328, "global_step": 92936, "epoch": 1119} {"train_loss": -21.888797760009766, "global_step": 92937, "epoch": 1119} {"train_loss": -21.626556396484375, "global_step": 92938, "epoch": 1119} {"train_loss": -21.71339225769043, "global_step": 92939, "epoch": 1119} {"train_loss": -21.565021514892578, "global_step": 92940, "epoch": 1119} {"train_loss": -21.910568237304688, "global_step": 92941, "epoch": 1119} {"train_loss": -22.044527053833008, "global_step": 92942, "epoch": 1119} {"train_loss": -22.056928634643555, "global_step": 92943, "epoch": 1119} {"train_loss": -21.696266174316406, "global_step": 92944, "epoch": 1119} {"train_loss": -21.892375946044922, "global_step": 92945, "epoch": 1119} {"train_loss": -21.728689193725586, "global_step": 92946, "epoch": 1119} {"train_loss": -21.490768432617188, "global_step": 92947, "epoch": 1119} {"train_loss": -21.899755477905273, "global_step": 92948, "epoch": 1119} {"train_loss": -21.757572174072266, "global_step": 92949, "epoch": 1119} {"train_loss": -21.354475021362305, "global_step": 92950, "epoch": 1119} {"train_loss": -22.139511108398438, "global_step": 92951, "epoch": 1119} {"train_loss": -21.789674758911133, "global_step": 92952, "epoch": 1119} {"train_loss": -21.414043426513672, "global_step": 92953, "epoch": 1119} {"train_loss": -21.685503005981445, "global_step": 92954, "epoch": 1119} {"train_loss": -21.433996200561523, "global_step": 92955, "epoch": 1119} {"train_loss": -21.45637321472168, "global_step": 92956, "epoch": 1119} {"train_loss": -21.73306655883789, "global_step": 92957, "epoch": 1119} {"train_loss": -21.792469024658203, "global_step": 92958, "epoch": 1119} {"train_loss": -21.606113985360388, "global_step": 92959, "epoch": 1119, "val_loss": 6164998.0} {"train_loss": -21.259262084960938, "global_step": 92960, "epoch": 1120} {"train_loss": -21.174362182617188, "global_step": 92961, "epoch": 1120} {"train_loss": -21.173145294189453, "global_step": 92962, "epoch": 1120} {"train_loss": -20.949750900268555, "global_step": 92963, "epoch": 1120} {"train_loss": -21.578351974487305, "global_step": 92964, "epoch": 1120} {"train_loss": -21.511594772338867, "global_step": 92965, "epoch": 1120} {"train_loss": -21.527982711791992, "global_step": 92966, "epoch": 1120} {"train_loss": -21.621713638305664, "global_step": 92967, "epoch": 1120} {"train_loss": -21.091196060180664, "global_step": 92968, "epoch": 1120} {"train_loss": -21.307226181030273, "global_step": 92969, "epoch": 1120} {"train_loss": -21.48619842529297, "global_step": 92970, "epoch": 1120} {"train_loss": -21.958759307861328, "global_step": 92971, "epoch": 1120} {"train_loss": -21.776819229125977, "global_step": 92972, "epoch": 1120} {"train_loss": -21.60374641418457, "global_step": 92973, "epoch": 1120} {"train_loss": -21.552478790283203, "global_step": 92974, "epoch": 1120} {"train_loss": -21.884174346923828, "global_step": 92975, "epoch": 1120} {"train_loss": -21.418790817260742, "global_step": 92976, "epoch": 1120} {"train_loss": -21.5192928314209, "global_step": 92977, "epoch": 1120} {"train_loss": -21.285388946533203, "global_step": 92978, "epoch": 1120} {"train_loss": -21.478076934814453, "global_step": 92979, "epoch": 1120} {"train_loss": -21.401325225830078, "global_step": 92980, "epoch": 1120} {"train_loss": -21.7266845703125, "global_step": 92981, "epoch": 1120} {"train_loss": -21.62179946899414, "global_step": 92982, "epoch": 1120} {"train_loss": -21.626874923706055, "global_step": 92983, "epoch": 1120} {"train_loss": -21.389062881469727, "global_step": 92984, "epoch": 1120} {"train_loss": -21.926895141601562, "global_step": 92985, "epoch": 1120} {"train_loss": -21.860225677490234, "global_step": 92986, "epoch": 1120} {"train_loss": -21.444791793823242, "global_step": 92987, "epoch": 1120} {"train_loss": -22.069929122924805, "global_step": 92988, "epoch": 1120} {"train_loss": -21.41664695739746, "global_step": 92989, "epoch": 1120} {"train_loss": -21.606210708618164, "global_step": 92990, "epoch": 1120} {"train_loss": -21.56713104248047, "global_step": 92991, "epoch": 1120} {"train_loss": -21.776681900024414, "global_step": 92992, "epoch": 1120} {"train_loss": -21.277204513549805, "global_step": 92993, "epoch": 1120} {"train_loss": -21.442394256591797, "global_step": 92994, "epoch": 1120} {"train_loss": -21.634538650512695, "global_step": 92995, "epoch": 1120} {"train_loss": -21.707550048828125, "global_step": 92996, "epoch": 1120} {"train_loss": -21.62417984008789, "global_step": 92997, "epoch": 1120} {"train_loss": -21.8336181640625, "global_step": 92998, "epoch": 1120} {"train_loss": -21.76680564880371, "global_step": 92999, "epoch": 1120} {"train_loss": -21.883451461791992, "global_step": 93000, "epoch": 1120} {"train_loss": -21.503292083740234, "global_step": 93001, "epoch": 1120} {"train_loss": -21.893781661987305, "global_step": 93002, "epoch": 1120} {"train_loss": -21.467330932617188, "global_step": 93003, "epoch": 1120} {"train_loss": -21.25150489807129, "global_step": 93004, "epoch": 1120} {"train_loss": -21.73138427734375, "global_step": 93005, "epoch": 1120} {"train_loss": -21.774478912353516, "global_step": 93006, "epoch": 1120} {"train_loss": -21.296586990356445, "global_step": 93007, "epoch": 1120} {"train_loss": -21.930585861206055, "global_step": 93008, "epoch": 1120} {"train_loss": -22.00284194946289, "global_step": 93009, "epoch": 1120} {"train_loss": -21.728946685791016, "global_step": 93010, "epoch": 1120} {"train_loss": -21.750877380371094, "global_step": 93011, "epoch": 1120} {"train_loss": -21.772974014282227, "global_step": 93012, "epoch": 1120} {"train_loss": -21.450199127197266, "global_step": 93013, "epoch": 1120} {"train_loss": -21.917795181274414, "global_step": 93014, "epoch": 1120} {"train_loss": -22.126741409301758, "global_step": 93015, "epoch": 1120} {"train_loss": -21.566083908081055, "global_step": 93016, "epoch": 1120} {"train_loss": -21.726015090942383, "global_step": 93017, "epoch": 1120} {"train_loss": -21.921085357666016, "global_step": 93018, "epoch": 1120} {"train_loss": -21.704029083251953, "global_step": 93019, "epoch": 1120} {"train_loss": -21.68815040588379, "global_step": 93020, "epoch": 1120} {"train_loss": -21.470611572265625, "global_step": 93021, "epoch": 1120} {"train_loss": -21.77134132385254, "global_step": 93022, "epoch": 1120} {"train_loss": -21.173147201538086, "global_step": 93023, "epoch": 1120} {"train_loss": -21.69852066040039, "global_step": 93024, "epoch": 1120} {"train_loss": -21.472787857055664, "global_step": 93025, "epoch": 1120} {"train_loss": -21.75440788269043, "global_step": 93026, "epoch": 1120} {"train_loss": -21.922361373901367, "global_step": 93027, "epoch": 1120} {"train_loss": -21.47394371032715, "global_step": 93028, "epoch": 1120} {"train_loss": -21.937667846679688, "global_step": 93029, "epoch": 1120} {"train_loss": -21.878339767456055, "global_step": 93030, "epoch": 1120} {"train_loss": -21.714445114135742, "global_step": 93031, "epoch": 1120} {"train_loss": -21.7678279876709, "global_step": 93032, "epoch": 1120} {"train_loss": -21.69988441467285, "global_step": 93033, "epoch": 1120} {"train_loss": -21.377771377563477, "global_step": 93034, "epoch": 1120} {"train_loss": -21.6007080078125, "global_step": 93035, "epoch": 1120} {"train_loss": -21.37715721130371, "global_step": 93036, "epoch": 1120} {"train_loss": -21.741565704345703, "global_step": 93037, "epoch": 1120} {"train_loss": -21.700244903564453, "global_step": 93038, "epoch": 1120} {"train_loss": -21.532094955444336, "global_step": 93039, "epoch": 1120} {"train_loss": -21.634580612182617, "global_step": 93040, "epoch": 1120} {"train_loss": -21.850988388061523, "global_step": 93041, "epoch": 1120} {"train_loss": -21.598131570471338, "global_step": 93042, "epoch": 1120, "val_loss": 6066082.5} {"train_loss": -21.041181564331055, "global_step": 93043, "epoch": 1121} {"train_loss": -21.83131217956543, "global_step": 93044, "epoch": 1121} {"train_loss": -21.14418601989746, "global_step": 93045, "epoch": 1121} {"train_loss": -21.783838272094727, "global_step": 93046, "epoch": 1121} {"train_loss": -21.464139938354492, "global_step": 93047, "epoch": 1121} {"train_loss": -21.595870971679688, "global_step": 93048, "epoch": 1121} {"train_loss": -21.416860580444336, "global_step": 93049, "epoch": 1121} {"train_loss": -21.159042358398438, "global_step": 93050, "epoch": 1121} {"train_loss": -21.11885643005371, "global_step": 93051, "epoch": 1121} {"train_loss": -21.267471313476562, "global_step": 93052, "epoch": 1121} {"train_loss": -21.184431076049805, "global_step": 93053, "epoch": 1121} {"train_loss": -21.748876571655273, "global_step": 93054, "epoch": 1121} {"train_loss": -21.478017807006836, "global_step": 93055, "epoch": 1121} {"train_loss": -21.61055564880371, "global_step": 93056, "epoch": 1121} {"train_loss": -21.370847702026367, "global_step": 93057, "epoch": 1121} {"train_loss": -21.609371185302734, "global_step": 93058, "epoch": 1121} {"train_loss": -21.51603889465332, "global_step": 93059, "epoch": 1121} {"train_loss": -21.46088981628418, "global_step": 93060, "epoch": 1121} {"train_loss": -21.81146812438965, "global_step": 93061, "epoch": 1121} {"train_loss": -21.2045955657959, "global_step": 93062, "epoch": 1121} {"train_loss": -21.489328384399414, "global_step": 93063, "epoch": 1121} {"train_loss": -21.826257705688477, "global_step": 93064, "epoch": 1121} {"train_loss": -21.468168258666992, "global_step": 93065, "epoch": 1121} {"train_loss": -21.331371307373047, "global_step": 93066, "epoch": 1121} {"train_loss": -21.737163543701172, "global_step": 93067, "epoch": 1121} {"train_loss": -21.721487045288086, "global_step": 93068, "epoch": 1121} {"train_loss": -21.855606079101562, "global_step": 93069, "epoch": 1121} {"train_loss": -21.95538330078125, "global_step": 93070, "epoch": 1121} {"train_loss": -21.716358184814453, "global_step": 93071, "epoch": 1121} {"train_loss": -21.578786849975586, "global_step": 93072, "epoch": 1121} {"train_loss": -21.6335391998291, "global_step": 93073, "epoch": 1121} {"train_loss": -21.662097930908203, "global_step": 93074, "epoch": 1121} {"train_loss": -21.99574851989746, "global_step": 93075, "epoch": 1121} {"train_loss": -21.559316635131836, "global_step": 93076, "epoch": 1121} {"train_loss": -21.853364944458008, "global_step": 93077, "epoch": 1121} {"train_loss": -22.073810577392578, "global_step": 93078, "epoch": 1121} {"train_loss": -21.67621421813965, "global_step": 93079, "epoch": 1121} {"train_loss": -21.76531410217285, "global_step": 93080, "epoch": 1121} {"train_loss": -21.42154884338379, "global_step": 93081, "epoch": 1121} {"train_loss": -21.7817440032959, "global_step": 93082, "epoch": 1121} {"train_loss": -21.735082626342773, "global_step": 93083, "epoch": 1121} {"train_loss": -21.64603614807129, "global_step": 93084, "epoch": 1121} {"train_loss": -21.810653686523438, "global_step": 93085, "epoch": 1121} {"train_loss": -21.89086151123047, "global_step": 93086, "epoch": 1121} {"train_loss": -21.74787712097168, "global_step": 93087, "epoch": 1121} {"train_loss": -21.765594482421875, "global_step": 93088, "epoch": 1121} {"train_loss": -21.573617935180664, "global_step": 93089, "epoch": 1121} {"train_loss": -21.549097061157227, "global_step": 93090, "epoch": 1121} {"train_loss": -21.60231590270996, "global_step": 93091, "epoch": 1121} {"train_loss": -21.539915084838867, "global_step": 93092, "epoch": 1121} {"train_loss": -21.558256149291992, "global_step": 93093, "epoch": 1121} {"train_loss": -22.215221405029297, "global_step": 93094, "epoch": 1121} {"train_loss": -21.841093063354492, "global_step": 93095, "epoch": 1121} {"train_loss": -21.76643180847168, "global_step": 93096, "epoch": 1121} {"train_loss": -21.64154052734375, "global_step": 93097, "epoch": 1121} {"train_loss": -21.88576316833496, "global_step": 93098, "epoch": 1121} {"train_loss": -21.83113670349121, "global_step": 93099, "epoch": 1121} {"train_loss": -21.841747283935547, "global_step": 93100, "epoch": 1121} {"train_loss": -21.72701072692871, "global_step": 93101, "epoch": 1121} {"train_loss": -21.740148544311523, "global_step": 93102, "epoch": 1121} {"train_loss": -21.440271377563477, "global_step": 93103, "epoch": 1121} {"train_loss": -21.71943473815918, "global_step": 93104, "epoch": 1121} {"train_loss": -21.823942184448242, "global_step": 93105, "epoch": 1121} {"train_loss": -22.009624481201172, "global_step": 93106, "epoch": 1121} {"train_loss": -21.748703002929688, "global_step": 93107, "epoch": 1121} {"train_loss": -21.87116050720215, "global_step": 93108, "epoch": 1121} {"train_loss": -21.44919776916504, "global_step": 93109, "epoch": 1121} {"train_loss": -21.743972778320312, "global_step": 93110, "epoch": 1121} {"train_loss": -21.912317276000977, "global_step": 93111, "epoch": 1121} {"train_loss": -21.985809326171875, "global_step": 93112, "epoch": 1121} {"train_loss": -21.732439041137695, "global_step": 93113, "epoch": 1121} {"train_loss": -21.757413864135742, "global_step": 93114, "epoch": 1121} {"train_loss": -21.481054306030273, "global_step": 93115, "epoch": 1121} {"train_loss": -21.46223258972168, "global_step": 93116, "epoch": 1121} {"train_loss": -21.832128524780273, "global_step": 93117, "epoch": 1121} {"train_loss": -21.861494064331055, "global_step": 93118, "epoch": 1121} {"train_loss": -21.95218276977539, "global_step": 93119, "epoch": 1121} {"train_loss": -22.1228084564209, "global_step": 93120, "epoch": 1121} {"train_loss": -21.627042770385742, "global_step": 93121, "epoch": 1121} {"train_loss": -21.869489669799805, "global_step": 93122, "epoch": 1121} {"train_loss": -21.277551651000977, "global_step": 93123, "epoch": 1121} {"train_loss": -21.700773239135742, "global_step": 93124, "epoch": 1121} {"train_loss": -21.636130781058807, "global_step": 93125, "epoch": 1121, "val_loss": 6318572.0} {"train_loss": -20.956222534179688, "global_step": 93126, "epoch": 1122} {"train_loss": -21.463823318481445, "global_step": 93127, "epoch": 1122} {"train_loss": -21.459701538085938, "global_step": 93128, "epoch": 1122} {"train_loss": -21.6602725982666, "global_step": 93129, "epoch": 1122} {"train_loss": -21.322416305541992, "global_step": 93130, "epoch": 1122} {"train_loss": -21.795230865478516, "global_step": 93131, "epoch": 1122} {"train_loss": -21.365467071533203, "global_step": 93132, "epoch": 1122} {"train_loss": -21.21967124938965, "global_step": 93133, "epoch": 1122} {"train_loss": -21.322677612304688, "global_step": 93134, "epoch": 1122} {"train_loss": -21.6560001373291, "global_step": 93135, "epoch": 1122} {"train_loss": -21.331893920898438, "global_step": 93136, "epoch": 1122} {"train_loss": -21.649211883544922, "global_step": 93137, "epoch": 1122} {"train_loss": -21.566869735717773, "global_step": 93138, "epoch": 1122} {"train_loss": -21.665990829467773, "global_step": 93139, "epoch": 1122} {"train_loss": -21.50144386291504, "global_step": 93140, "epoch": 1122} {"train_loss": -21.682605743408203, "global_step": 93141, "epoch": 1122} {"train_loss": -21.32944679260254, "global_step": 93142, "epoch": 1122} {"train_loss": -21.814298629760742, "global_step": 93143, "epoch": 1122} {"train_loss": -21.68416976928711, "global_step": 93144, "epoch": 1122} {"train_loss": -21.327163696289062, "global_step": 93145, "epoch": 1122} {"train_loss": -21.38648796081543, "global_step": 93146, "epoch": 1122} {"train_loss": -21.966318130493164, "global_step": 93147, "epoch": 1122} {"train_loss": -21.436180114746094, "global_step": 93148, "epoch": 1122} {"train_loss": -21.83702850341797, "global_step": 93149, "epoch": 1122} {"train_loss": -21.815446853637695, "global_step": 93150, "epoch": 1122} {"train_loss": -22.01057243347168, "global_step": 93151, "epoch": 1122} {"train_loss": -21.587448120117188, "global_step": 93152, "epoch": 1122} {"train_loss": -21.342466354370117, "global_step": 93153, "epoch": 1122} {"train_loss": -21.74595832824707, "global_step": 93154, "epoch": 1122} {"train_loss": -21.60616111755371, "global_step": 93155, "epoch": 1122} {"train_loss": -21.530109405517578, "global_step": 93156, "epoch": 1122} {"train_loss": -21.696765899658203, "global_step": 93157, "epoch": 1122} {"train_loss": -21.71893310546875, "global_step": 93158, "epoch": 1122} {"train_loss": -21.796443939208984, "global_step": 93159, "epoch": 1122} {"train_loss": -21.668638229370117, "global_step": 93160, "epoch": 1122} {"train_loss": -21.937381744384766, "global_step": 93161, "epoch": 1122} {"train_loss": -21.907358169555664, "global_step": 93162, "epoch": 1122} {"train_loss": -21.358295440673828, "global_step": 93163, "epoch": 1122} {"train_loss": -21.771657943725586, "global_step": 93164, "epoch": 1122} {"train_loss": -21.965234756469727, "global_step": 93165, "epoch": 1122} {"train_loss": -21.755857467651367, "global_step": 93166, "epoch": 1122} {"train_loss": -21.953266143798828, "global_step": 93167, "epoch": 1122} {"train_loss": -21.65260887145996, "global_step": 93168, "epoch": 1122} {"train_loss": -21.5357666015625, "global_step": 93169, "epoch": 1122} {"train_loss": -21.381851196289062, "global_step": 93170, "epoch": 1122} {"train_loss": -21.510854721069336, "global_step": 93171, "epoch": 1122} {"train_loss": -21.52910804748535, "global_step": 93172, "epoch": 1122} {"train_loss": -21.298620223999023, "global_step": 93173, "epoch": 1122} {"train_loss": -21.713912963867188, "global_step": 93174, "epoch": 1122} {"train_loss": -21.6743106842041, "global_step": 93175, "epoch": 1122} {"train_loss": -21.49869728088379, "global_step": 93176, "epoch": 1122} {"train_loss": -21.500024795532227, "global_step": 93177, "epoch": 1122} {"train_loss": -21.942153930664062, "global_step": 93178, "epoch": 1122} {"train_loss": -21.67962646484375, "global_step": 93179, "epoch": 1122} {"train_loss": -22.16278648376465, "global_step": 93180, "epoch": 1122} {"train_loss": -21.717172622680664, "global_step": 93181, "epoch": 1122} {"train_loss": -21.832630157470703, "global_step": 93182, "epoch": 1122} {"train_loss": -21.913467407226562, "global_step": 93183, "epoch": 1122} {"train_loss": -21.960647583007812, "global_step": 93184, "epoch": 1122} {"train_loss": -21.79681968688965, "global_step": 93185, "epoch": 1122} {"train_loss": -21.997005462646484, "global_step": 93186, "epoch": 1122} {"train_loss": -21.66206169128418, "global_step": 93187, "epoch": 1122} {"train_loss": -21.642114639282227, "global_step": 93188, "epoch": 1122} {"train_loss": -21.805784225463867, "global_step": 93189, "epoch": 1122} {"train_loss": -21.37578773498535, "global_step": 93190, "epoch": 1122} {"train_loss": -21.53786277770996, "global_step": 93191, "epoch": 1122} {"train_loss": -21.967479705810547, "global_step": 93192, "epoch": 1122} {"train_loss": -21.83936882019043, "global_step": 93193, "epoch": 1122} {"train_loss": -21.669479370117188, "global_step": 93194, "epoch": 1122} {"train_loss": -21.537479400634766, "global_step": 93195, "epoch": 1122} {"train_loss": -21.792325973510742, "global_step": 93196, "epoch": 1122} {"train_loss": -21.901214599609375, "global_step": 93197, "epoch": 1122} {"train_loss": -21.83648681640625, "global_step": 93198, "epoch": 1122} {"train_loss": -21.85843276977539, "global_step": 93199, "epoch": 1122} {"train_loss": -21.742441177368164, "global_step": 93200, "epoch": 1122} {"train_loss": -21.9022159576416, "global_step": 93201, "epoch": 1122} {"train_loss": -21.702434539794922, "global_step": 93202, "epoch": 1122} {"train_loss": -21.681812286376953, "global_step": 93203, "epoch": 1122} {"train_loss": -21.9610538482666, "global_step": 93204, "epoch": 1122} {"train_loss": -21.787979125976562, "global_step": 93205, "epoch": 1122} {"train_loss": -21.55628776550293, "global_step": 93206, "epoch": 1122} {"train_loss": -21.626920700073242, "global_step": 93207, "epoch": 1122} {"train_loss": -21.67108841401985, "global_step": 93208, "epoch": 1122, "val_loss": 6130252.0} {"train_loss": -21.691370010375977, "global_step": 93209, "epoch": 1123} {"train_loss": -21.327932357788086, "global_step": 93210, "epoch": 1123} {"train_loss": -21.295841217041016, "global_step": 93211, "epoch": 1123} {"train_loss": -21.634069442749023, "global_step": 93212, "epoch": 1123} {"train_loss": -21.541316986083984, "global_step": 93213, "epoch": 1123} {"train_loss": -21.239425659179688, "global_step": 93214, "epoch": 1123} {"train_loss": -21.498722076416016, "global_step": 93215, "epoch": 1123} {"train_loss": -21.583812713623047, "global_step": 93216, "epoch": 1123} {"train_loss": -21.642566680908203, "global_step": 93217, "epoch": 1123} {"train_loss": -21.27345848083496, "global_step": 93218, "epoch": 1123} {"train_loss": -21.4512996673584, "global_step": 93219, "epoch": 1123} {"train_loss": -21.67667007446289, "global_step": 93220, "epoch": 1123} {"train_loss": -21.905956268310547, "global_step": 93221, "epoch": 1123} {"train_loss": -21.52254295349121, "global_step": 93222, "epoch": 1123} {"train_loss": -21.659595489501953, "global_step": 93223, "epoch": 1123} {"train_loss": -21.737476348876953, "global_step": 93224, "epoch": 1123} {"train_loss": -22.01633644104004, "global_step": 93225, "epoch": 1123} {"train_loss": -21.793622970581055, "global_step": 93226, "epoch": 1123} {"train_loss": -21.41632652282715, "global_step": 93227, "epoch": 1123} {"train_loss": -21.5662784576416, "global_step": 93228, "epoch": 1123} {"train_loss": -21.86467170715332, "global_step": 93229, "epoch": 1123} {"train_loss": -21.662012100219727, "global_step": 93230, "epoch": 1123} {"train_loss": -21.735599517822266, "global_step": 93231, "epoch": 1123} {"train_loss": -21.952938079833984, "global_step": 93232, "epoch": 1123} {"train_loss": -21.709985733032227, "global_step": 93233, "epoch": 1123} {"train_loss": -21.767480850219727, "global_step": 93234, "epoch": 1123} {"train_loss": -21.72793960571289, "global_step": 93235, "epoch": 1123} {"train_loss": -21.487668991088867, "global_step": 93236, "epoch": 1123} {"train_loss": -21.539630889892578, "global_step": 93237, "epoch": 1123} {"train_loss": -21.5957088470459, "global_step": 93238, "epoch": 1123} {"train_loss": -21.634193420410156, "global_step": 93239, "epoch": 1123} {"train_loss": -21.652524948120117, "global_step": 93240, "epoch": 1123} {"train_loss": -21.80632209777832, "global_step": 93241, "epoch": 1123} {"train_loss": -21.574676513671875, "global_step": 93242, "epoch": 1123} {"train_loss": -21.851747512817383, "global_step": 93243, "epoch": 1123} {"train_loss": -21.601720809936523, "global_step": 93244, "epoch": 1123} {"train_loss": -21.969648361206055, "global_step": 93245, "epoch": 1123} {"train_loss": -21.784605026245117, "global_step": 93246, "epoch": 1123} {"train_loss": -21.52993392944336, "global_step": 93247, "epoch": 1123} {"train_loss": -21.521066665649414, "global_step": 93248, "epoch": 1123} {"train_loss": -21.460750579833984, "global_step": 93249, "epoch": 1123} {"train_loss": -21.642595291137695, "global_step": 93250, "epoch": 1123} {"train_loss": -21.531766891479492, "global_step": 93251, "epoch": 1123} {"train_loss": -21.840133666992188, "global_step": 93252, "epoch": 1123} {"train_loss": -21.841848373413086, "global_step": 93253, "epoch": 1123} {"train_loss": -21.783954620361328, "global_step": 93254, "epoch": 1123} {"train_loss": -21.864110946655273, "global_step": 93255, "epoch": 1123} {"train_loss": -21.84462547302246, "global_step": 93256, "epoch": 1123} {"train_loss": -21.844614028930664, "global_step": 93257, "epoch": 1123} {"train_loss": -21.86578369140625, "global_step": 93258, "epoch": 1123} {"train_loss": -21.87693214416504, "global_step": 93259, "epoch": 1123} {"train_loss": -21.73493766784668, "global_step": 93260, "epoch": 1123} {"train_loss": -21.692827224731445, "global_step": 93261, "epoch": 1123} {"train_loss": -21.676605224609375, "global_step": 93262, "epoch": 1123} {"train_loss": -21.537595748901367, "global_step": 93263, "epoch": 1123} {"train_loss": -21.9426326751709, "global_step": 93264, "epoch": 1123} {"train_loss": -21.951025009155273, "global_step": 93265, "epoch": 1123} {"train_loss": -21.836383819580078, "global_step": 93266, "epoch": 1123} {"train_loss": -22.066390991210938, "global_step": 93267, "epoch": 1123} {"train_loss": -21.540725708007812, "global_step": 93268, "epoch": 1123} {"train_loss": -21.562015533447266, "global_step": 93269, "epoch": 1123} {"train_loss": -21.75029182434082, "global_step": 93270, "epoch": 1123} {"train_loss": -21.490816116333008, "global_step": 93271, "epoch": 1123} {"train_loss": -21.799728393554688, "global_step": 93272, "epoch": 1123} {"train_loss": -21.695932388305664, "global_step": 93273, "epoch": 1123} {"train_loss": -21.87334632873535, "global_step": 93274, "epoch": 1123} {"train_loss": -21.89034652709961, "global_step": 93275, "epoch": 1123} {"train_loss": -21.713422775268555, "global_step": 93276, "epoch": 1123} {"train_loss": -21.533178329467773, "global_step": 93277, "epoch": 1123} {"train_loss": -21.704477310180664, "global_step": 93278, "epoch": 1123} {"train_loss": -21.533300399780273, "global_step": 93279, "epoch": 1123} {"train_loss": -21.872093200683594, "global_step": 93280, "epoch": 1123} {"train_loss": -21.502490997314453, "global_step": 93281, "epoch": 1123} {"train_loss": -21.64125633239746, "global_step": 93282, "epoch": 1123} {"train_loss": -21.804677963256836, "global_step": 93283, "epoch": 1123} {"train_loss": -21.7357120513916, "global_step": 93284, "epoch": 1123} {"train_loss": -21.692174911499023, "global_step": 93285, "epoch": 1123} {"train_loss": -21.335439682006836, "global_step": 93286, "epoch": 1123} {"train_loss": -21.479888916015625, "global_step": 93287, "epoch": 1123} {"train_loss": -21.444204330444336, "global_step": 93288, "epoch": 1123} {"train_loss": -21.791868209838867, "global_step": 93289, "epoch": 1123} {"train_loss": -21.537832260131836, "global_step": 93290, "epoch": 1123} {"train_loss": -21.677582177771143, "global_step": 93291, "epoch": 1123, "val_loss": 6274943.5} {"train_loss": -21.51800537109375, "global_step": 93292, "epoch": 1124} {"train_loss": -21.375417709350586, "global_step": 93293, "epoch": 1124} {"train_loss": -21.864564895629883, "global_step": 93294, "epoch": 1124} {"train_loss": -21.492910385131836, "global_step": 93295, "epoch": 1124} {"train_loss": -21.2733211517334, "global_step": 93296, "epoch": 1124} {"train_loss": -21.42096519470215, "global_step": 93297, "epoch": 1124} {"train_loss": -21.9167537689209, "global_step": 93298, "epoch": 1124} {"train_loss": -21.847883224487305, "global_step": 93299, "epoch": 1124} {"train_loss": -21.288471221923828, "global_step": 93300, "epoch": 1124} {"train_loss": -21.813152313232422, "global_step": 93301, "epoch": 1124} {"train_loss": -21.548751831054688, "global_step": 93302, "epoch": 1124} {"train_loss": -21.3853702545166, "global_step": 93303, "epoch": 1124} {"train_loss": -21.94032096862793, "global_step": 93304, "epoch": 1124} {"train_loss": -21.790433883666992, "global_step": 93305, "epoch": 1124} {"train_loss": -21.8471622467041, "global_step": 93306, "epoch": 1124} {"train_loss": -21.347915649414062, "global_step": 93307, "epoch": 1124} {"train_loss": -21.477313995361328, "global_step": 93308, "epoch": 1124} {"train_loss": -21.69355010986328, "global_step": 93309, "epoch": 1124} {"train_loss": -21.6810245513916, "global_step": 93310, "epoch": 1124} {"train_loss": -21.62598991394043, "global_step": 93311, "epoch": 1124} {"train_loss": -21.796154022216797, "global_step": 93312, "epoch": 1124} {"train_loss": -21.960535049438477, "global_step": 93313, "epoch": 1124} {"train_loss": -21.811033248901367, "global_step": 93314, "epoch": 1124} {"train_loss": -21.727136611938477, "global_step": 93315, "epoch": 1124} {"train_loss": -21.420045852661133, "global_step": 93316, "epoch": 1124} {"train_loss": -22.129779815673828, "global_step": 93317, "epoch": 1124} {"train_loss": -21.609500885009766, "global_step": 93318, "epoch": 1124} {"train_loss": -21.268726348876953, "global_step": 93319, "epoch": 1124} {"train_loss": -21.586734771728516, "global_step": 93320, "epoch": 1124} {"train_loss": -21.709218978881836, "global_step": 93321, "epoch": 1124} {"train_loss": -21.69621467590332, "global_step": 93322, "epoch": 1124} {"train_loss": -21.73187255859375, "global_step": 93323, "epoch": 1124} {"train_loss": -21.778717041015625, "global_step": 93324, "epoch": 1124} {"train_loss": -21.662893295288086, "global_step": 93325, "epoch": 1124} {"train_loss": -22.111358642578125, "global_step": 93326, "epoch": 1124} {"train_loss": -22.324542999267578, "global_step": 93327, "epoch": 1124} {"train_loss": -21.643577575683594, "global_step": 93328, "epoch": 1124} {"train_loss": -21.469167709350586, "global_step": 93329, "epoch": 1124} {"train_loss": -21.760164260864258, "global_step": 93330, "epoch": 1124} {"train_loss": -21.805051803588867, "global_step": 93331, "epoch": 1124} {"train_loss": -21.840547561645508, "global_step": 93332, "epoch": 1124} {"train_loss": -21.852746963500977, "global_step": 93333, "epoch": 1124} {"train_loss": -21.90755271911621, "global_step": 93334, "epoch": 1124} {"train_loss": -21.670948028564453, "global_step": 93335, "epoch": 1124} {"train_loss": -21.727394104003906, "global_step": 93336, "epoch": 1124} {"train_loss": -21.8607177734375, "global_step": 93337, "epoch": 1124} {"train_loss": -22.16233253479004, "global_step": 93338, "epoch": 1124} {"train_loss": -21.825580596923828, "global_step": 93339, "epoch": 1124} {"train_loss": -21.135046005249023, "global_step": 93340, "epoch": 1124} {"train_loss": -21.583541870117188, "global_step": 93341, "epoch": 1124} {"train_loss": -21.732891082763672, "global_step": 93342, "epoch": 1124} {"train_loss": -22.024856567382812, "global_step": 93343, "epoch": 1124} {"train_loss": -21.462085723876953, "global_step": 93344, "epoch": 1124} {"train_loss": -21.70047950744629, "global_step": 93345, "epoch": 1124} {"train_loss": -21.703128814697266, "global_step": 93346, "epoch": 1124} {"train_loss": -21.758758544921875, "global_step": 93347, "epoch": 1124} {"train_loss": -21.756650924682617, "global_step": 93348, "epoch": 1124} {"train_loss": -21.923612594604492, "global_step": 93349, "epoch": 1124} {"train_loss": -21.517431259155273, "global_step": 93350, "epoch": 1124} {"train_loss": -21.749011993408203, "global_step": 93351, "epoch": 1124} {"train_loss": -21.7795467376709, "global_step": 93352, "epoch": 1124} {"train_loss": -21.94004249572754, "global_step": 93353, "epoch": 1124} {"train_loss": -21.39627456665039, "global_step": 93354, "epoch": 1124} {"train_loss": -21.611221313476562, "global_step": 93355, "epoch": 1124} {"train_loss": -21.810773849487305, "global_step": 93356, "epoch": 1124} {"train_loss": -21.599119186401367, "global_step": 93357, "epoch": 1124} {"train_loss": -21.47119140625, "global_step": 93358, "epoch": 1124} {"train_loss": -21.725955963134766, "global_step": 93359, "epoch": 1124} {"train_loss": -21.543996810913086, "global_step": 93360, "epoch": 1124} {"train_loss": -21.67906379699707, "global_step": 93361, "epoch": 1124} {"train_loss": -21.601337432861328, "global_step": 93362, "epoch": 1124} {"train_loss": -21.73990821838379, "global_step": 93363, "epoch": 1124} {"train_loss": -21.572895050048828, "global_step": 93364, "epoch": 1124} {"train_loss": -21.33941650390625, "global_step": 93365, "epoch": 1124} {"train_loss": -21.584768295288086, "global_step": 93366, "epoch": 1124} {"train_loss": -21.64613151550293, "global_step": 93367, "epoch": 1124} {"train_loss": -21.547090530395508, "global_step": 93368, "epoch": 1124} {"train_loss": -21.834087371826172, "global_step": 93369, "epoch": 1124} {"train_loss": -21.822858810424805, "global_step": 93370, "epoch": 1124} {"train_loss": -22.122770309448242, "global_step": 93371, "epoch": 1124} {"train_loss": -21.72696876525879, "global_step": 93372, "epoch": 1124} {"train_loss": -21.537073135375977, "global_step": 93373, "epoch": 1124} {"train_loss": -21.704385458704937, "global_step": 93374, "epoch": 1124, "val_loss": 6251375.5} {"train_loss": -20.92140007019043, "global_step": 93375, "epoch": 1125} {"train_loss": -20.87312889099121, "global_step": 93376, "epoch": 1125} {"train_loss": -21.345321655273438, "global_step": 93377, "epoch": 1125} {"train_loss": -20.6961727142334, "global_step": 93378, "epoch": 1125} {"train_loss": -21.43514060974121, "global_step": 93379, "epoch": 1125} {"train_loss": -21.36515235900879, "global_step": 93380, "epoch": 1125} {"train_loss": -20.9705867767334, "global_step": 93381, "epoch": 1125} {"train_loss": -21.034597396850586, "global_step": 93382, "epoch": 1125} {"train_loss": -21.24867820739746, "global_step": 93383, "epoch": 1125} {"train_loss": -21.05501365661621, "global_step": 93384, "epoch": 1125} {"train_loss": -21.37767791748047, "global_step": 93385, "epoch": 1125} {"train_loss": -21.19940185546875, "global_step": 93386, "epoch": 1125} {"train_loss": -21.175142288208008, "global_step": 93387, "epoch": 1125} {"train_loss": -21.225543975830078, "global_step": 93388, "epoch": 1125} {"train_loss": -21.2374210357666, "global_step": 93389, "epoch": 1125} {"train_loss": -21.612403869628906, "global_step": 93390, "epoch": 1125} {"train_loss": -21.467164993286133, "global_step": 93391, "epoch": 1125} {"train_loss": -21.237079620361328, "global_step": 93392, "epoch": 1125} {"train_loss": -21.573883056640625, "global_step": 93393, "epoch": 1125} {"train_loss": -21.683576583862305, "global_step": 93394, "epoch": 1125} {"train_loss": -21.50095558166504, "global_step": 93395, "epoch": 1125} {"train_loss": -21.241037368774414, "global_step": 93396, "epoch": 1125} {"train_loss": -21.375295639038086, "global_step": 93397, "epoch": 1125} {"train_loss": -21.40034294128418, "global_step": 93398, "epoch": 1125} {"train_loss": -21.626935958862305, "global_step": 93399, "epoch": 1125} {"train_loss": -21.725465774536133, "global_step": 93400, "epoch": 1125} {"train_loss": -21.919097900390625, "global_step": 93401, "epoch": 1125} {"train_loss": -21.464719772338867, "global_step": 93402, "epoch": 1125} {"train_loss": -21.573728561401367, "global_step": 93403, "epoch": 1125} {"train_loss": -21.679197311401367, "global_step": 93404, "epoch": 1125} {"train_loss": -21.830894470214844, "global_step": 93405, "epoch": 1125} {"train_loss": -21.470367431640625, "global_step": 93406, "epoch": 1125} {"train_loss": -21.625564575195312, "global_step": 93407, "epoch": 1125} {"train_loss": -21.93895149230957, "global_step": 93408, "epoch": 1125} {"train_loss": -21.879318237304688, "global_step": 93409, "epoch": 1125} {"train_loss": -21.55141258239746, "global_step": 93410, "epoch": 1125} {"train_loss": -21.502193450927734, "global_step": 93411, "epoch": 1125} {"train_loss": -22.2462215423584, "global_step": 93412, "epoch": 1125} {"train_loss": -21.64666748046875, "global_step": 93413, "epoch": 1125} {"train_loss": -21.98761749267578, "global_step": 93414, "epoch": 1125} {"train_loss": -21.50038719177246, "global_step": 93415, "epoch": 1125} {"train_loss": -21.706165313720703, "global_step": 93416, "epoch": 1125} {"train_loss": -21.8011474609375, "global_step": 93417, "epoch": 1125} {"train_loss": -21.87146759033203, "global_step": 93418, "epoch": 1125} {"train_loss": -22.006528854370117, "global_step": 93419, "epoch": 1125} {"train_loss": -21.61111831665039, "global_step": 93420, "epoch": 1125} {"train_loss": -21.61767578125, "global_step": 93421, "epoch": 1125} {"train_loss": -21.814077377319336, "global_step": 93422, "epoch": 1125} {"train_loss": -21.56855010986328, "global_step": 93423, "epoch": 1125} {"train_loss": -21.802490234375, "global_step": 93424, "epoch": 1125} {"train_loss": -21.56077003479004, "global_step": 93425, "epoch": 1125} {"train_loss": -21.711416244506836, "global_step": 93426, "epoch": 1125} {"train_loss": -21.720170974731445, "global_step": 93427, "epoch": 1125} {"train_loss": -21.848318099975586, "global_step": 93428, "epoch": 1125} {"train_loss": -21.766942977905273, "global_step": 93429, "epoch": 1125} {"train_loss": -22.102859497070312, "global_step": 93430, "epoch": 1125} {"train_loss": -21.7675838470459, "global_step": 93431, "epoch": 1125} {"train_loss": -21.76921844482422, "global_step": 93432, "epoch": 1125} {"train_loss": -21.46307373046875, "global_step": 93433, "epoch": 1125} {"train_loss": -21.835153579711914, "global_step": 93434, "epoch": 1125} {"train_loss": -21.729948043823242, "global_step": 93435, "epoch": 1125} {"train_loss": -21.87918472290039, "global_step": 93436, "epoch": 1125} {"train_loss": -21.9621639251709, "global_step": 93437, "epoch": 1125} {"train_loss": -21.643579483032227, "global_step": 93438, "epoch": 1125} {"train_loss": -21.769577026367188, "global_step": 93439, "epoch": 1125} {"train_loss": -21.848325729370117, "global_step": 93440, "epoch": 1125} {"train_loss": -21.661474227905273, "global_step": 93441, "epoch": 1125} {"train_loss": -21.870969772338867, "global_step": 93442, "epoch": 1125} {"train_loss": -21.904571533203125, "global_step": 93443, "epoch": 1125} {"train_loss": -21.508405685424805, "global_step": 93444, "epoch": 1125} {"train_loss": -21.817480087280273, "global_step": 93445, "epoch": 1125} {"train_loss": -21.847143173217773, "global_step": 93446, "epoch": 1125} {"train_loss": -21.9306697845459, "global_step": 93447, "epoch": 1125} {"train_loss": -21.746992111206055, "global_step": 93448, "epoch": 1125} {"train_loss": -21.871658325195312, "global_step": 93449, "epoch": 1125} {"train_loss": -21.636472702026367, "global_step": 93450, "epoch": 1125} {"train_loss": -21.669126510620117, "global_step": 93451, "epoch": 1125} {"train_loss": -21.637426376342773, "global_step": 93452, "epoch": 1125} {"train_loss": -21.793912887573242, "global_step": 93453, "epoch": 1125} {"train_loss": -21.767484664916992, "global_step": 93454, "epoch": 1125} {"train_loss": -21.557981491088867, "global_step": 93455, "epoch": 1125} {"train_loss": -21.93886375427246, "global_step": 93456, "epoch": 1125} {"train_loss": -21.607829519065028, "global_step": 93457, "epoch": 1125, "val_loss": 6277342.0} {"train_loss": -20.730024337768555, "global_step": 93458, "epoch": 1126} {"train_loss": -20.593656539916992, "global_step": 93459, "epoch": 1126} {"train_loss": -21.10300064086914, "global_step": 93460, "epoch": 1126} {"train_loss": -20.016592025756836, "global_step": 93461, "epoch": 1126} {"train_loss": -21.17707633972168, "global_step": 93462, "epoch": 1126} {"train_loss": -20.615732192993164, "global_step": 93463, "epoch": 1126} {"train_loss": -21.150146484375, "global_step": 93464, "epoch": 1126} {"train_loss": -21.239561080932617, "global_step": 93465, "epoch": 1126} {"train_loss": -21.349441528320312, "global_step": 93466, "epoch": 1126} {"train_loss": -21.403593063354492, "global_step": 93467, "epoch": 1126} {"train_loss": -20.945425033569336, "global_step": 93468, "epoch": 1126} {"train_loss": -21.322046279907227, "global_step": 93469, "epoch": 1126} {"train_loss": -21.06976890563965, "global_step": 93470, "epoch": 1126} {"train_loss": -21.339569091796875, "global_step": 93471, "epoch": 1126} {"train_loss": -21.174652099609375, "global_step": 93472, "epoch": 1126} {"train_loss": -21.484294891357422, "global_step": 93473, "epoch": 1126} {"train_loss": -21.379528045654297, "global_step": 93474, "epoch": 1126} {"train_loss": -20.937580108642578, "global_step": 93475, "epoch": 1126} {"train_loss": -20.948450088500977, "global_step": 93476, "epoch": 1126} {"train_loss": -21.490127563476562, "global_step": 93477, "epoch": 1126} {"train_loss": -21.295251846313477, "global_step": 93478, "epoch": 1126} {"train_loss": -21.484012603759766, "global_step": 93479, "epoch": 1126} {"train_loss": -21.42989158630371, "global_step": 93480, "epoch": 1126} {"train_loss": -21.615737915039062, "global_step": 93481, "epoch": 1126} {"train_loss": -21.71510887145996, "global_step": 93482, "epoch": 1126} {"train_loss": -21.55763053894043, "global_step": 93483, "epoch": 1126} {"train_loss": -21.593002319335938, "global_step": 93484, "epoch": 1126} {"train_loss": -21.554636001586914, "global_step": 93485, "epoch": 1126} {"train_loss": -21.27654266357422, "global_step": 93486, "epoch": 1126} {"train_loss": -21.770910263061523, "global_step": 93487, "epoch": 1126} {"train_loss": -21.584863662719727, "global_step": 93488, "epoch": 1126} {"train_loss": -21.69550895690918, "global_step": 93489, "epoch": 1126} {"train_loss": -21.8940372467041, "global_step": 93490, "epoch": 1126} {"train_loss": -21.783222198486328, "global_step": 93491, "epoch": 1126} {"train_loss": -21.771085739135742, "global_step": 93492, "epoch": 1126} {"train_loss": -21.57643699645996, "global_step": 93493, "epoch": 1126} {"train_loss": -21.592771530151367, "global_step": 93494, "epoch": 1126} {"train_loss": -21.71140480041504, "global_step": 93495, "epoch": 1126} {"train_loss": -21.69038200378418, "global_step": 93496, "epoch": 1126} {"train_loss": -21.633718490600586, "global_step": 93497, "epoch": 1126} {"train_loss": -21.562685012817383, "global_step": 93498, "epoch": 1126} {"train_loss": -21.714284896850586, "global_step": 93499, "epoch": 1126} {"train_loss": -21.59095001220703, "global_step": 93500, "epoch": 1126} {"train_loss": -21.79609489440918, "global_step": 93501, "epoch": 1126} {"train_loss": -21.909543991088867, "global_step": 93502, "epoch": 1126} {"train_loss": -21.509397506713867, "global_step": 93503, "epoch": 1126} {"train_loss": -21.899511337280273, "global_step": 93504, "epoch": 1126} {"train_loss": -21.703088760375977, "global_step": 93505, "epoch": 1126} {"train_loss": -21.7847957611084, "global_step": 93506, "epoch": 1126} {"train_loss": -21.78804588317871, "global_step": 93507, "epoch": 1126} {"train_loss": -21.412952423095703, "global_step": 93508, "epoch": 1126} {"train_loss": -21.501121520996094, "global_step": 93509, "epoch": 1126} {"train_loss": -21.677513122558594, "global_step": 93510, "epoch": 1126} {"train_loss": -22.12965202331543, "global_step": 93511, "epoch": 1126} {"train_loss": -21.758041381835938, "global_step": 93512, "epoch": 1126} {"train_loss": -21.370031356811523, "global_step": 93513, "epoch": 1126} {"train_loss": -21.70938491821289, "global_step": 93514, "epoch": 1126} {"train_loss": -21.69612693786621, "global_step": 93515, "epoch": 1126} {"train_loss": -21.64661979675293, "global_step": 93516, "epoch": 1126} {"train_loss": -21.671049118041992, "global_step": 93517, "epoch": 1126} {"train_loss": -21.5913143157959, "global_step": 93518, "epoch": 1126} {"train_loss": -21.711698532104492, "global_step": 93519, "epoch": 1126} {"train_loss": -21.69266128540039, "global_step": 93520, "epoch": 1126} {"train_loss": -21.961000442504883, "global_step": 93521, "epoch": 1126} {"train_loss": -21.41103172302246, "global_step": 93522, "epoch": 1126} {"train_loss": -21.557260513305664, "global_step": 93523, "epoch": 1126} {"train_loss": -21.880388259887695, "global_step": 93524, "epoch": 1126} {"train_loss": -21.397275924682617, "global_step": 93525, "epoch": 1126} {"train_loss": -21.764450073242188, "global_step": 93526, "epoch": 1126} {"train_loss": -21.9497013092041, "global_step": 93527, "epoch": 1126} {"train_loss": -21.727750778198242, "global_step": 93528, "epoch": 1126} {"train_loss": -21.487333297729492, "global_step": 93529, "epoch": 1126} {"train_loss": -21.635601043701172, "global_step": 93530, "epoch": 1126} {"train_loss": -21.821157455444336, "global_step": 93531, "epoch": 1126} {"train_loss": -21.529287338256836, "global_step": 93532, "epoch": 1126} {"train_loss": -21.44026756286621, "global_step": 93533, "epoch": 1126} {"train_loss": -21.808277130126953, "global_step": 93534, "epoch": 1126} {"train_loss": -21.92035484313965, "global_step": 93535, "epoch": 1126} {"train_loss": -21.639047622680664, "global_step": 93536, "epoch": 1126} {"train_loss": -21.694713592529297, "global_step": 93537, "epoch": 1126} {"train_loss": -21.746946334838867, "global_step": 93538, "epoch": 1126} {"train_loss": -21.66423988342285, "global_step": 93539, "epoch": 1126} {"train_loss": -21.509653803813887, "global_step": 93540, "epoch": 1126, "val_loss": 6182242.0} {"train_loss": -21.5582275390625, "global_step": 93541, "epoch": 1127} {"train_loss": -21.184158325195312, "global_step": 93542, "epoch": 1127} {"train_loss": -21.278162002563477, "global_step": 93543, "epoch": 1127} {"train_loss": -21.10670280456543, "global_step": 93544, "epoch": 1127} {"train_loss": -21.267650604248047, "global_step": 93545, "epoch": 1127} {"train_loss": -21.51371955871582, "global_step": 93546, "epoch": 1127} {"train_loss": -21.679502487182617, "global_step": 93547, "epoch": 1127} {"train_loss": -21.680320739746094, "global_step": 93548, "epoch": 1127} {"train_loss": -21.803325653076172, "global_step": 93549, "epoch": 1127} {"train_loss": -21.405256271362305, "global_step": 93550, "epoch": 1127} {"train_loss": -21.48192024230957, "global_step": 93551, "epoch": 1127} {"train_loss": -21.21187973022461, "global_step": 93552, "epoch": 1127} {"train_loss": -21.956615447998047, "global_step": 93553, "epoch": 1127} {"train_loss": -21.547948837280273, "global_step": 93554, "epoch": 1127} {"train_loss": -21.884654998779297, "global_step": 93555, "epoch": 1127} {"train_loss": -21.50960922241211, "global_step": 93556, "epoch": 1127} {"train_loss": -21.722166061401367, "global_step": 93557, "epoch": 1127} {"train_loss": -21.678808212280273, "global_step": 93558, "epoch": 1127} {"train_loss": -21.824020385742188, "global_step": 93559, "epoch": 1127} {"train_loss": -21.989728927612305, "global_step": 93560, "epoch": 1127} {"train_loss": -22.08005714416504, "global_step": 93561, "epoch": 1127} {"train_loss": -21.71637535095215, "global_step": 93562, "epoch": 1127} {"train_loss": -21.859649658203125, "global_step": 93563, "epoch": 1127} {"train_loss": -21.334802627563477, "global_step": 93564, "epoch": 1127} {"train_loss": -21.66552734375, "global_step": 93565, "epoch": 1127} {"train_loss": -21.777557373046875, "global_step": 93566, "epoch": 1127} {"train_loss": -21.740955352783203, "global_step": 93567, "epoch": 1127} {"train_loss": -21.531936645507812, "global_step": 93568, "epoch": 1127} {"train_loss": -21.626129150390625, "global_step": 93569, "epoch": 1127} {"train_loss": -22.170684814453125, "global_step": 93570, "epoch": 1127} {"train_loss": -21.82077980041504, "global_step": 93571, "epoch": 1127} {"train_loss": -21.70001220703125, "global_step": 93572, "epoch": 1127} {"train_loss": -22.161216735839844, "global_step": 93573, "epoch": 1127} {"train_loss": -21.484296798706055, "global_step": 93574, "epoch": 1127} {"train_loss": -21.416105270385742, "global_step": 93575, "epoch": 1127} {"train_loss": -21.655963897705078, "global_step": 93576, "epoch": 1127} {"train_loss": -22.002347946166992, "global_step": 93577, "epoch": 1127} {"train_loss": -21.5053768157959, "global_step": 93578, "epoch": 1127} {"train_loss": -21.62015724182129, "global_step": 93579, "epoch": 1127} {"train_loss": -21.60435676574707, "global_step": 93580, "epoch": 1127} {"train_loss": -21.493350982666016, "global_step": 93581, "epoch": 1127} {"train_loss": -21.855573654174805, "global_step": 93582, "epoch": 1127} {"train_loss": -21.561317443847656, "global_step": 93583, "epoch": 1127} {"train_loss": -21.579864501953125, "global_step": 93584, "epoch": 1127} {"train_loss": -21.97833251953125, "global_step": 93585, "epoch": 1127} {"train_loss": -21.534194946289062, "global_step": 93586, "epoch": 1127} {"train_loss": -21.619873046875, "global_step": 93587, "epoch": 1127} {"train_loss": -21.809736251831055, "global_step": 93588, "epoch": 1127} {"train_loss": -21.553932189941406, "global_step": 93589, "epoch": 1127} {"train_loss": -21.828189849853516, "global_step": 93590, "epoch": 1127} {"train_loss": -21.5745849609375, "global_step": 93591, "epoch": 1127} {"train_loss": -20.919485092163086, "global_step": 93592, "epoch": 1127} {"train_loss": -21.59889793395996, "global_step": 93593, "epoch": 1127} {"train_loss": -21.75129508972168, "global_step": 93594, "epoch": 1127} {"train_loss": -21.734895706176758, "global_step": 93595, "epoch": 1127} {"train_loss": -21.872440338134766, "global_step": 93596, "epoch": 1127} {"train_loss": -21.574954986572266, "global_step": 93597, "epoch": 1127} {"train_loss": -21.693572998046875, "global_step": 93598, "epoch": 1127} {"train_loss": -21.64316749572754, "global_step": 93599, "epoch": 1127} {"train_loss": -21.687345504760742, "global_step": 93600, "epoch": 1127} {"train_loss": -21.941526412963867, "global_step": 93601, "epoch": 1127} {"train_loss": -21.858230590820312, "global_step": 93602, "epoch": 1127} {"train_loss": -21.693864822387695, "global_step": 93603, "epoch": 1127} {"train_loss": -21.567123413085938, "global_step": 93604, "epoch": 1127} {"train_loss": -21.838064193725586, "global_step": 93605, "epoch": 1127} {"train_loss": -21.867361068725586, "global_step": 93606, "epoch": 1127} {"train_loss": -21.979703903198242, "global_step": 93607, "epoch": 1127} {"train_loss": -21.94976043701172, "global_step": 93608, "epoch": 1127} {"train_loss": -21.982349395751953, "global_step": 93609, "epoch": 1127} {"train_loss": -22.071069717407227, "global_step": 93610, "epoch": 1127} {"train_loss": -21.717538833618164, "global_step": 93611, "epoch": 1127} {"train_loss": -22.221805572509766, "global_step": 93612, "epoch": 1127} {"train_loss": -21.62093162536621, "global_step": 93613, "epoch": 1127} {"train_loss": -21.67732048034668, "global_step": 93614, "epoch": 1127} {"train_loss": -21.749284744262695, "global_step": 93615, "epoch": 1127} {"train_loss": -22.032817840576172, "global_step": 93616, "epoch": 1127} {"train_loss": -21.854217529296875, "global_step": 93617, "epoch": 1127} {"train_loss": -21.485822677612305, "global_step": 93618, "epoch": 1127} {"train_loss": -21.62013053894043, "global_step": 93619, "epoch": 1127} {"train_loss": -21.63518714904785, "global_step": 93620, "epoch": 1127} {"train_loss": -21.80828857421875, "global_step": 93621, "epoch": 1127} {"train_loss": -21.494586944580078, "global_step": 93622, "epoch": 1127} {"train_loss": -21.709368993000812, "global_step": 93623, "epoch": 1127, "val_loss": 6204536.0} {"train_loss": -21.550743103027344, "global_step": 93624, "epoch": 1128} {"train_loss": -21.309295654296875, "global_step": 93625, "epoch": 1128} {"train_loss": -21.70533561706543, "global_step": 93626, "epoch": 1128} {"train_loss": -21.468544006347656, "global_step": 93627, "epoch": 1128} {"train_loss": -21.18128204345703, "global_step": 93628, "epoch": 1128} {"train_loss": -20.874774932861328, "global_step": 93629, "epoch": 1128} {"train_loss": -21.508764266967773, "global_step": 93630, "epoch": 1128} {"train_loss": -21.425708770751953, "global_step": 93631, "epoch": 1128} {"train_loss": -21.720478057861328, "global_step": 93632, "epoch": 1128} {"train_loss": -21.945594787597656, "global_step": 93633, "epoch": 1128} {"train_loss": -21.255502700805664, "global_step": 93634, "epoch": 1128} {"train_loss": -21.560733795166016, "global_step": 93635, "epoch": 1128} {"train_loss": -21.432449340820312, "global_step": 93636, "epoch": 1128} {"train_loss": -21.79327964782715, "global_step": 93637, "epoch": 1128} {"train_loss": -21.3590030670166, "global_step": 93638, "epoch": 1128} {"train_loss": -21.416555404663086, "global_step": 93639, "epoch": 1128} {"train_loss": -21.7021427154541, "global_step": 93640, "epoch": 1128} {"train_loss": -21.68827247619629, "global_step": 93641, "epoch": 1128} {"train_loss": -21.556015014648438, "global_step": 93642, "epoch": 1128} {"train_loss": -21.3448486328125, "global_step": 93643, "epoch": 1128} {"train_loss": -21.665578842163086, "global_step": 93644, "epoch": 1128} {"train_loss": -21.33645248413086, "global_step": 93645, "epoch": 1128} {"train_loss": -21.364917755126953, "global_step": 93646, "epoch": 1128} {"train_loss": -21.656387329101562, "global_step": 93647, "epoch": 1128} {"train_loss": -21.747039794921875, "global_step": 93648, "epoch": 1128} {"train_loss": -21.733673095703125, "global_step": 93649, "epoch": 1128} {"train_loss": -21.714269638061523, "global_step": 93650, "epoch": 1128} {"train_loss": -21.742231369018555, "global_step": 93651, "epoch": 1128} {"train_loss": -21.747150421142578, "global_step": 93652, "epoch": 1128} {"train_loss": -21.888837814331055, "global_step": 93653, "epoch": 1128} {"train_loss": -21.659345626831055, "global_step": 93654, "epoch": 1128} {"train_loss": -21.786636352539062, "global_step": 93655, "epoch": 1128} {"train_loss": -21.601552963256836, "global_step": 93656, "epoch": 1128} {"train_loss": -21.798542022705078, "global_step": 93657, "epoch": 1128} {"train_loss": -21.50044059753418, "global_step": 93658, "epoch": 1128} {"train_loss": -21.70493507385254, "global_step": 93659, "epoch": 1128} {"train_loss": -21.596755981445312, "global_step": 93660, "epoch": 1128} {"train_loss": -22.01263999938965, "global_step": 93661, "epoch": 1128} {"train_loss": -21.484464645385742, "global_step": 93662, "epoch": 1128} {"train_loss": -22.16509437561035, "global_step": 93663, "epoch": 1128} {"train_loss": -22.08640480041504, "global_step": 93664, "epoch": 1128} {"train_loss": -22.020410537719727, "global_step": 93665, "epoch": 1128} {"train_loss": -22.073232650756836, "global_step": 93666, "epoch": 1128} {"train_loss": -21.702713012695312, "global_step": 93667, "epoch": 1128} {"train_loss": -21.671682357788086, "global_step": 93668, "epoch": 1128} {"train_loss": -21.407926559448242, "global_step": 93669, "epoch": 1128} {"train_loss": -21.838336944580078, "global_step": 93670, "epoch": 1128} {"train_loss": -21.430570602416992, "global_step": 93671, "epoch": 1128} {"train_loss": -21.807401657104492, "global_step": 93672, "epoch": 1128} {"train_loss": -22.038843154907227, "global_step": 93673, "epoch": 1128} {"train_loss": -22.044858932495117, "global_step": 93674, "epoch": 1128} {"train_loss": -21.859949111938477, "global_step": 93675, "epoch": 1128} {"train_loss": -21.904375076293945, "global_step": 93676, "epoch": 1128} {"train_loss": -21.349998474121094, "global_step": 93677, "epoch": 1128} {"train_loss": -21.670251846313477, "global_step": 93678, "epoch": 1128} {"train_loss": -21.92711639404297, "global_step": 93679, "epoch": 1128} {"train_loss": -21.717496871948242, "global_step": 93680, "epoch": 1128} {"train_loss": -22.02667999267578, "global_step": 93681, "epoch": 1128} {"train_loss": -21.821292877197266, "global_step": 93682, "epoch": 1128} {"train_loss": -21.477880477905273, "global_step": 93683, "epoch": 1128} {"train_loss": -21.63702392578125, "global_step": 93684, "epoch": 1128} {"train_loss": -21.65108299255371, "global_step": 93685, "epoch": 1128} {"train_loss": -21.75829315185547, "global_step": 93686, "epoch": 1128} {"train_loss": -21.501571655273438, "global_step": 93687, "epoch": 1128} {"train_loss": -21.576208114624023, "global_step": 93688, "epoch": 1128} {"train_loss": -21.662656784057617, "global_step": 93689, "epoch": 1128} {"train_loss": -21.788076400756836, "global_step": 93690, "epoch": 1128} {"train_loss": -21.696704864501953, "global_step": 93691, "epoch": 1128} {"train_loss": -21.559539794921875, "global_step": 93692, "epoch": 1128} {"train_loss": -21.991968154907227, "global_step": 93693, "epoch": 1128} {"train_loss": -21.988842010498047, "global_step": 93694, "epoch": 1128} {"train_loss": -21.291919708251953, "global_step": 93695, "epoch": 1128} {"train_loss": -21.63149070739746, "global_step": 93696, "epoch": 1128} {"train_loss": -21.99490737915039, "global_step": 93697, "epoch": 1128} {"train_loss": -21.771991729736328, "global_step": 93698, "epoch": 1128} {"train_loss": -21.571535110473633, "global_step": 93699, "epoch": 1128} {"train_loss": -21.9924259185791, "global_step": 93700, "epoch": 1128} {"train_loss": -21.718509674072266, "global_step": 93701, "epoch": 1128} {"train_loss": -21.28811264038086, "global_step": 93702, "epoch": 1128} {"train_loss": -21.68707847595215, "global_step": 93703, "epoch": 1128} {"train_loss": -21.792137145996094, "global_step": 93704, "epoch": 1128} {"train_loss": -21.600988388061523, "global_step": 93705, "epoch": 1128} {"train_loss": -21.65579421261707, "global_step": 93706, "epoch": 1128, "val_loss": 6266219.0} {"train_loss": -21.2790584564209, "global_step": 93707, "epoch": 1129} {"train_loss": -21.355031967163086, "global_step": 93708, "epoch": 1129} {"train_loss": -21.23377227783203, "global_step": 93709, "epoch": 1129} {"train_loss": -21.47218132019043, "global_step": 93710, "epoch": 1129} {"train_loss": -21.243566513061523, "global_step": 93711, "epoch": 1129} {"train_loss": -21.575057983398438, "global_step": 93712, "epoch": 1129} {"train_loss": -21.37042808532715, "global_step": 93713, "epoch": 1129} {"train_loss": -21.389068603515625, "global_step": 93714, "epoch": 1129} {"train_loss": -21.175809860229492, "global_step": 93715, "epoch": 1129} {"train_loss": -21.77899742126465, "global_step": 93716, "epoch": 1129} {"train_loss": -21.201452255249023, "global_step": 93717, "epoch": 1129} {"train_loss": -21.20842933654785, "global_step": 93718, "epoch": 1129} {"train_loss": -21.376453399658203, "global_step": 93719, "epoch": 1129} {"train_loss": -21.555587768554688, "global_step": 93720, "epoch": 1129} {"train_loss": -21.67597198486328, "global_step": 93721, "epoch": 1129} {"train_loss": -21.824005126953125, "global_step": 93722, "epoch": 1129} {"train_loss": -21.846250534057617, "global_step": 93723, "epoch": 1129} {"train_loss": -21.484195709228516, "global_step": 93724, "epoch": 1129} {"train_loss": -21.7603759765625, "global_step": 93725, "epoch": 1129} {"train_loss": -21.86423683166504, "global_step": 93726, "epoch": 1129} {"train_loss": -21.282215118408203, "global_step": 93727, "epoch": 1129} {"train_loss": -21.56089210510254, "global_step": 93728, "epoch": 1129} {"train_loss": -21.84333610534668, "global_step": 93729, "epoch": 1129} {"train_loss": -21.583921432495117, "global_step": 93730, "epoch": 1129} {"train_loss": -21.92243766784668, "global_step": 93731, "epoch": 1129} {"train_loss": -22.2021484375, "global_step": 93732, "epoch": 1129} {"train_loss": -21.941598892211914, "global_step": 93733, "epoch": 1129} {"train_loss": -21.51493263244629, "global_step": 93734, "epoch": 1129} {"train_loss": -21.786909103393555, "global_step": 93735, "epoch": 1129} {"train_loss": -21.831912994384766, "global_step": 93736, "epoch": 1129} {"train_loss": -21.8560733795166, "global_step": 93737, "epoch": 1129} {"train_loss": -21.403440475463867, "global_step": 93738, "epoch": 1129} {"train_loss": -21.412540435791016, "global_step": 93739, "epoch": 1129} {"train_loss": -21.822607040405273, "global_step": 93740, "epoch": 1129} {"train_loss": -21.79792594909668, "global_step": 93741, "epoch": 1129} {"train_loss": -21.50111198425293, "global_step": 93742, "epoch": 1129} {"train_loss": -21.33625030517578, "global_step": 93743, "epoch": 1129} {"train_loss": -21.512311935424805, "global_step": 93744, "epoch": 1129} {"train_loss": -22.032564163208008, "global_step": 93745, "epoch": 1129} {"train_loss": -21.860273361206055, "global_step": 93746, "epoch": 1129} {"train_loss": -21.836124420166016, "global_step": 93747, "epoch": 1129} {"train_loss": -21.617298126220703, "global_step": 93748, "epoch": 1129} {"train_loss": -21.8089656829834, "global_step": 93749, "epoch": 1129} {"train_loss": -22.129568099975586, "global_step": 93750, "epoch": 1129} {"train_loss": -21.527326583862305, "global_step": 93751, "epoch": 1129} {"train_loss": -21.45181655883789, "global_step": 93752, "epoch": 1129} {"train_loss": -21.508838653564453, "global_step": 93753, "epoch": 1129} {"train_loss": -21.596851348876953, "global_step": 93754, "epoch": 1129} {"train_loss": -21.496580123901367, "global_step": 93755, "epoch": 1129} {"train_loss": -21.633743286132812, "global_step": 93756, "epoch": 1129} {"train_loss": -21.468276977539062, "global_step": 93757, "epoch": 1129} {"train_loss": -21.417282104492188, "global_step": 93758, "epoch": 1129} {"train_loss": -21.613204956054688, "global_step": 93759, "epoch": 1129} {"train_loss": -21.30776023864746, "global_step": 93760, "epoch": 1129} {"train_loss": -21.635635375976562, "global_step": 93761, "epoch": 1129} {"train_loss": -21.72100067138672, "global_step": 93762, "epoch": 1129} {"train_loss": -21.728717803955078, "global_step": 93763, "epoch": 1129} {"train_loss": -21.697906494140625, "global_step": 93764, "epoch": 1129} {"train_loss": -21.805715560913086, "global_step": 93765, "epoch": 1129} {"train_loss": -21.856266021728516, "global_step": 93766, "epoch": 1129} {"train_loss": -21.655057907104492, "global_step": 93767, "epoch": 1129} {"train_loss": -22.168210983276367, "global_step": 93768, "epoch": 1129} {"train_loss": -21.908294677734375, "global_step": 93769, "epoch": 1129} {"train_loss": -22.08969497680664, "global_step": 93770, "epoch": 1129} {"train_loss": -21.721372604370117, "global_step": 93771, "epoch": 1129} {"train_loss": -21.33829689025879, "global_step": 93772, "epoch": 1129} {"train_loss": -21.769811630249023, "global_step": 93773, "epoch": 1129} {"train_loss": -21.839984893798828, "global_step": 93774, "epoch": 1129} {"train_loss": -22.03762435913086, "global_step": 93775, "epoch": 1129} {"train_loss": -21.8892879486084, "global_step": 93776, "epoch": 1129} {"train_loss": -22.160266876220703, "global_step": 93777, "epoch": 1129} {"train_loss": -21.929101943969727, "global_step": 93778, "epoch": 1129} {"train_loss": -21.961835861206055, "global_step": 93779, "epoch": 1129} {"train_loss": -21.807165145874023, "global_step": 93780, "epoch": 1129} {"train_loss": -21.475187301635742, "global_step": 93781, "epoch": 1129} {"train_loss": -21.843481063842773, "global_step": 93782, "epoch": 1129} {"train_loss": -21.75556755065918, "global_step": 93783, "epoch": 1129} {"train_loss": -21.758563995361328, "global_step": 93784, "epoch": 1129} {"train_loss": -22.000442504882812, "global_step": 93785, "epoch": 1129} {"train_loss": -21.57026481628418, "global_step": 93786, "epoch": 1129} {"train_loss": -21.751440048217773, "global_step": 93787, "epoch": 1129} {"train_loss": -21.604894638061523, "global_step": 93788, "epoch": 1129} {"train_loss": -21.65530374825719, "global_step": 93789, "epoch": 1129, "val_loss": 6097908.0} {"train_loss": -21.255142211914062, "global_step": 93790, "epoch": 1130} {"train_loss": -21.401376724243164, "global_step": 93791, "epoch": 1130} {"train_loss": -21.044034957885742, "global_step": 93792, "epoch": 1130} {"train_loss": -21.048797607421875, "global_step": 93793, "epoch": 1130} {"train_loss": -21.01871109008789, "global_step": 93794, "epoch": 1130} {"train_loss": -20.68035316467285, "global_step": 93795, "epoch": 1130} {"train_loss": -21.5819091796875, "global_step": 93796, "epoch": 1130} {"train_loss": -21.53072166442871, "global_step": 93797, "epoch": 1130} {"train_loss": -21.17568016052246, "global_step": 93798, "epoch": 1130} {"train_loss": -21.213451385498047, "global_step": 93799, "epoch": 1130} {"train_loss": -21.20537567138672, "global_step": 93800, "epoch": 1130} {"train_loss": -21.414541244506836, "global_step": 93801, "epoch": 1130} {"train_loss": -21.115158081054688, "global_step": 93802, "epoch": 1130} {"train_loss": -21.358871459960938, "global_step": 93803, "epoch": 1130} {"train_loss": -21.501928329467773, "global_step": 93804, "epoch": 1130} {"train_loss": -21.508405685424805, "global_step": 93805, "epoch": 1130} {"train_loss": -21.47516441345215, "global_step": 93806, "epoch": 1130} {"train_loss": -21.731891632080078, "global_step": 93807, "epoch": 1130} {"train_loss": -21.82804298400879, "global_step": 93808, "epoch": 1130} {"train_loss": -21.980405807495117, "global_step": 93809, "epoch": 1130} {"train_loss": -21.63469123840332, "global_step": 93810, "epoch": 1130} {"train_loss": -21.54230308532715, "global_step": 93811, "epoch": 1130} {"train_loss": -21.712465286254883, "global_step": 93812, "epoch": 1130} {"train_loss": -21.612977981567383, "global_step": 93813, "epoch": 1130} {"train_loss": -21.723501205444336, "global_step": 93814, "epoch": 1130} {"train_loss": -21.776453018188477, "global_step": 93815, "epoch": 1130} {"train_loss": -21.7259578704834, "global_step": 93816, "epoch": 1130} {"train_loss": -21.298442840576172, "global_step": 93817, "epoch": 1130} {"train_loss": -21.748987197875977, "global_step": 93818, "epoch": 1130} {"train_loss": -22.083219528198242, "global_step": 93819, "epoch": 1130} {"train_loss": -21.67501449584961, "global_step": 93820, "epoch": 1130} {"train_loss": -21.57761001586914, "global_step": 93821, "epoch": 1130} {"train_loss": -21.630332946777344, "global_step": 93822, "epoch": 1130} {"train_loss": -21.564367294311523, "global_step": 93823, "epoch": 1130} {"train_loss": -21.308643341064453, "global_step": 93824, "epoch": 1130} {"train_loss": -21.84095573425293, "global_step": 93825, "epoch": 1130} {"train_loss": -21.68987464904785, "global_step": 93826, "epoch": 1130} {"train_loss": -22.087635040283203, "global_step": 93827, "epoch": 1130} {"train_loss": -21.837980270385742, "global_step": 93828, "epoch": 1130} {"train_loss": -21.623340606689453, "global_step": 93829, "epoch": 1130} {"train_loss": -21.61449432373047, "global_step": 93830, "epoch": 1130} {"train_loss": -21.69719696044922, "global_step": 93831, "epoch": 1130} {"train_loss": -21.787216186523438, "global_step": 93832, "epoch": 1130} {"train_loss": -21.85906410217285, "global_step": 93833, "epoch": 1130} {"train_loss": -21.689411163330078, "global_step": 93834, "epoch": 1130} {"train_loss": -21.547454833984375, "global_step": 93835, "epoch": 1130} {"train_loss": -21.729156494140625, "global_step": 93836, "epoch": 1130} {"train_loss": -21.371387481689453, "global_step": 93837, "epoch": 1130} {"train_loss": -22.080339431762695, "global_step": 93838, "epoch": 1130} {"train_loss": -21.658945083618164, "global_step": 93839, "epoch": 1130} {"train_loss": -21.893939971923828, "global_step": 93840, "epoch": 1130} {"train_loss": -21.47454261779785, "global_step": 93841, "epoch": 1130} {"train_loss": -21.87203025817871, "global_step": 93842, "epoch": 1130} {"train_loss": -21.82039451599121, "global_step": 93843, "epoch": 1130} {"train_loss": -22.013774871826172, "global_step": 93844, "epoch": 1130} {"train_loss": -21.915258407592773, "global_step": 93845, "epoch": 1130} {"train_loss": -21.83096694946289, "global_step": 93846, "epoch": 1130} {"train_loss": -21.649658203125, "global_step": 93847, "epoch": 1130} {"train_loss": -21.74247169494629, "global_step": 93848, "epoch": 1130} {"train_loss": -21.937467575073242, "global_step": 93849, "epoch": 1130} {"train_loss": -22.09979248046875, "global_step": 93850, "epoch": 1130} {"train_loss": -21.55873680114746, "global_step": 93851, "epoch": 1130} {"train_loss": -21.467309951782227, "global_step": 93852, "epoch": 1130} {"train_loss": -21.441701889038086, "global_step": 93853, "epoch": 1130} {"train_loss": -21.486099243164062, "global_step": 93854, "epoch": 1130} {"train_loss": -21.630075454711914, "global_step": 93855, "epoch": 1130} {"train_loss": -21.64755630493164, "global_step": 93856, "epoch": 1130} {"train_loss": -22.211734771728516, "global_step": 93857, "epoch": 1130} {"train_loss": -21.652158737182617, "global_step": 93858, "epoch": 1130} {"train_loss": -21.999792098999023, "global_step": 93859, "epoch": 1130} {"train_loss": -21.745786666870117, "global_step": 93860, "epoch": 1130} {"train_loss": -21.833513259887695, "global_step": 93861, "epoch": 1130} {"train_loss": -21.706186294555664, "global_step": 93862, "epoch": 1130} {"train_loss": -21.49306297302246, "global_step": 93863, "epoch": 1130} {"train_loss": -22.075910568237305, "global_step": 93864, "epoch": 1130} {"train_loss": -21.834924697875977, "global_step": 93865, "epoch": 1130} {"train_loss": -21.861011505126953, "global_step": 93866, "epoch": 1130} {"train_loss": -21.97369956970215, "global_step": 93867, "epoch": 1130} {"train_loss": -21.92390251159668, "global_step": 93868, "epoch": 1130} {"train_loss": -21.908645629882812, "global_step": 93869, "epoch": 1130} {"train_loss": -21.87648582458496, "global_step": 93870, "epoch": 1130} {"train_loss": -21.623157501220703, "global_step": 93871, "epoch": 1130} {"train_loss": -21.63531356260001, "global_step": 93872, "epoch": 1130, "val_loss": 6147452.0} {"train_loss": -22.081396102905273, "global_step": 93873, "epoch": 1131} {"train_loss": -21.844806671142578, "global_step": 93874, "epoch": 1131} {"train_loss": -21.643278121948242, "global_step": 93875, "epoch": 1131} {"train_loss": -21.66748046875, "global_step": 93876, "epoch": 1131} {"train_loss": -21.53386878967285, "global_step": 93877, "epoch": 1131} {"train_loss": -21.642221450805664, "global_step": 93878, "epoch": 1131} {"train_loss": -21.7128963470459, "global_step": 93879, "epoch": 1131} {"train_loss": -22.122678756713867, "global_step": 93880, "epoch": 1131} {"train_loss": -21.484642028808594, "global_step": 93881, "epoch": 1131} {"train_loss": -21.727073669433594, "global_step": 93882, "epoch": 1131} {"train_loss": -22.018936157226562, "global_step": 93883, "epoch": 1131} {"train_loss": -21.80792999267578, "global_step": 93884, "epoch": 1131} {"train_loss": -21.79680061340332, "global_step": 93885, "epoch": 1131} {"train_loss": -21.830097198486328, "global_step": 93886, "epoch": 1131} {"train_loss": -21.596986770629883, "global_step": 93887, "epoch": 1131} {"train_loss": -21.9686222076416, "global_step": 93888, "epoch": 1131} {"train_loss": -21.464099884033203, "global_step": 93889, "epoch": 1131} {"train_loss": -21.49475860595703, "global_step": 93890, "epoch": 1131} {"train_loss": -21.418502807617188, "global_step": 93891, "epoch": 1131} {"train_loss": -22.061553955078125, "global_step": 93892, "epoch": 1131} {"train_loss": -21.814071655273438, "global_step": 93893, "epoch": 1131} {"train_loss": -21.8006591796875, "global_step": 93894, "epoch": 1131} {"train_loss": -21.565200805664062, "global_step": 93895, "epoch": 1131} {"train_loss": -21.779531478881836, "global_step": 93896, "epoch": 1131} {"train_loss": -21.385456085205078, "global_step": 93897, "epoch": 1131} {"train_loss": -21.731557846069336, "global_step": 93898, "epoch": 1131} {"train_loss": -21.435453414916992, "global_step": 93899, "epoch": 1131} {"train_loss": -21.48733901977539, "global_step": 93900, "epoch": 1131} {"train_loss": -21.758729934692383, "global_step": 93901, "epoch": 1131} {"train_loss": -21.4914608001709, "global_step": 93902, "epoch": 1131} {"train_loss": -21.626569747924805, "global_step": 93903, "epoch": 1131} {"train_loss": -21.455121994018555, "global_step": 93904, "epoch": 1131} {"train_loss": -21.37495231628418, "global_step": 93905, "epoch": 1131} {"train_loss": -21.760915756225586, "global_step": 93906, "epoch": 1131} {"train_loss": -21.699729919433594, "global_step": 93907, "epoch": 1131} {"train_loss": -21.859651565551758, "global_step": 93908, "epoch": 1131} {"train_loss": -21.54676628112793, "global_step": 93909, "epoch": 1131} {"train_loss": -21.604110717773438, "global_step": 93910, "epoch": 1131} {"train_loss": -21.605016708374023, "global_step": 93911, "epoch": 1131} {"train_loss": -21.816499710083008, "global_step": 93912, "epoch": 1131} {"train_loss": -21.608800888061523, "global_step": 93913, "epoch": 1131} {"train_loss": -21.862947463989258, "global_step": 93914, "epoch": 1131} {"train_loss": -21.731298446655273, "global_step": 93915, "epoch": 1131} {"train_loss": -21.304622650146484, "global_step": 93916, "epoch": 1131} {"train_loss": -21.973800659179688, "global_step": 93917, "epoch": 1131} {"train_loss": -21.707862854003906, "global_step": 93918, "epoch": 1131} {"train_loss": -21.839353561401367, "global_step": 93919, "epoch": 1131} {"train_loss": -21.71934700012207, "global_step": 93920, "epoch": 1131} {"train_loss": -21.589872360229492, "global_step": 93921, "epoch": 1131} {"train_loss": -21.463428497314453, "global_step": 93922, "epoch": 1131} {"train_loss": -21.737030029296875, "global_step": 93923, "epoch": 1131} {"train_loss": -21.946043014526367, "global_step": 93924, "epoch": 1131} {"train_loss": -21.534452438354492, "global_step": 93925, "epoch": 1131} {"train_loss": -21.972368240356445, "global_step": 93926, "epoch": 1131} {"train_loss": -21.857894897460938, "global_step": 93927, "epoch": 1131} {"train_loss": -21.825902938842773, "global_step": 93928, "epoch": 1131} {"train_loss": -21.96849250793457, "global_step": 93929, "epoch": 1131} {"train_loss": -21.63530921936035, "global_step": 93930, "epoch": 1131} {"train_loss": -21.81570816040039, "global_step": 93931, "epoch": 1131} {"train_loss": -21.598398208618164, "global_step": 93932, "epoch": 1131} {"train_loss": -21.551877975463867, "global_step": 93933, "epoch": 1131} {"train_loss": -21.57415199279785, "global_step": 93934, "epoch": 1131} {"train_loss": -21.760387420654297, "global_step": 93935, "epoch": 1131} {"train_loss": -21.550764083862305, "global_step": 93936, "epoch": 1131} {"train_loss": -21.512527465820312, "global_step": 93937, "epoch": 1131} {"train_loss": -21.726314544677734, "global_step": 93938, "epoch": 1131} {"train_loss": -22.116058349609375, "global_step": 93939, "epoch": 1131} {"train_loss": -21.593042373657227, "global_step": 93940, "epoch": 1131} {"train_loss": -21.809167861938477, "global_step": 93941, "epoch": 1131} {"train_loss": -21.7689208984375, "global_step": 93942, "epoch": 1131} {"train_loss": -21.721887588500977, "global_step": 93943, "epoch": 1131} {"train_loss": -21.776901245117188, "global_step": 93944, "epoch": 1131} {"train_loss": -21.484540939331055, "global_step": 93945, "epoch": 1131} {"train_loss": -21.779739379882812, "global_step": 93946, "epoch": 1131} {"train_loss": -21.932592391967773, "global_step": 93947, "epoch": 1131} {"train_loss": -22.15203285217285, "global_step": 93948, "epoch": 1131} {"train_loss": -21.75170135498047, "global_step": 93949, "epoch": 1131} {"train_loss": -22.037593841552734, "global_step": 93950, "epoch": 1131} {"train_loss": -22.014911651611328, "global_step": 93951, "epoch": 1131} {"train_loss": -21.67771339416504, "global_step": 93952, "epoch": 1131} {"train_loss": -21.46526527404785, "global_step": 93953, "epoch": 1131} {"train_loss": -22.15367889404297, "global_step": 93954, "epoch": 1131} {"train_loss": -21.73037299190659, "global_step": 93955, "epoch": 1131, "val_loss": 6230916.5} {"train_loss": -20.93446922302246, "global_step": 93956, "epoch": 1132} {"train_loss": -20.93988037109375, "global_step": 93957, "epoch": 1132} {"train_loss": -21.559968948364258, "global_step": 93958, "epoch": 1132} {"train_loss": -21.616846084594727, "global_step": 93959, "epoch": 1132} {"train_loss": -20.797962188720703, "global_step": 93960, "epoch": 1132} {"train_loss": -21.81947135925293, "global_step": 93961, "epoch": 1132} {"train_loss": -21.315292358398438, "global_step": 93962, "epoch": 1132} {"train_loss": -21.024629592895508, "global_step": 93963, "epoch": 1132} {"train_loss": -21.68341064453125, "global_step": 93964, "epoch": 1132} {"train_loss": -21.37411880493164, "global_step": 93965, "epoch": 1132} {"train_loss": -21.651357650756836, "global_step": 93966, "epoch": 1132} {"train_loss": -21.20282554626465, "global_step": 93967, "epoch": 1132} {"train_loss": -21.319250106811523, "global_step": 93968, "epoch": 1132} {"train_loss": -21.366060256958008, "global_step": 93969, "epoch": 1132} {"train_loss": -21.16912078857422, "global_step": 93970, "epoch": 1132} {"train_loss": -21.410018920898438, "global_step": 93971, "epoch": 1132} {"train_loss": -21.497722625732422, "global_step": 93972, "epoch": 1132} {"train_loss": -21.39705467224121, "global_step": 93973, "epoch": 1132} {"train_loss": -21.81987190246582, "global_step": 93974, "epoch": 1132} {"train_loss": -21.37315559387207, "global_step": 93975, "epoch": 1132} {"train_loss": -21.454675674438477, "global_step": 93976, "epoch": 1132} {"train_loss": -21.583282470703125, "global_step": 93977, "epoch": 1132} {"train_loss": -21.51171875, "global_step": 93978, "epoch": 1132} {"train_loss": -21.70892906188965, "global_step": 93979, "epoch": 1132} {"train_loss": -21.8458309173584, "global_step": 93980, "epoch": 1132} {"train_loss": -21.58518409729004, "global_step": 93981, "epoch": 1132} {"train_loss": -21.742565155029297, "global_step": 93982, "epoch": 1132} {"train_loss": -21.690746307373047, "global_step": 93983, "epoch": 1132} {"train_loss": -21.7863826751709, "global_step": 93984, "epoch": 1132} {"train_loss": -21.74796485900879, "global_step": 93985, "epoch": 1132} {"train_loss": -21.835113525390625, "global_step": 93986, "epoch": 1132} {"train_loss": -21.886581420898438, "global_step": 93987, "epoch": 1132} {"train_loss": -21.687917709350586, "global_step": 93988, "epoch": 1132} {"train_loss": -21.713993072509766, "global_step": 93989, "epoch": 1132} {"train_loss": -22.025205612182617, "global_step": 93990, "epoch": 1132} {"train_loss": -22.01765251159668, "global_step": 93991, "epoch": 1132} {"train_loss": -21.66426658630371, "global_step": 93992, "epoch": 1132} {"train_loss": -21.773420333862305, "global_step": 93993, "epoch": 1132} {"train_loss": -21.936908721923828, "global_step": 93994, "epoch": 1132} {"train_loss": -21.393423080444336, "global_step": 93995, "epoch": 1132} {"train_loss": -21.663158416748047, "global_step": 93996, "epoch": 1132} {"train_loss": -21.557205200195312, "global_step": 93997, "epoch": 1132} {"train_loss": -21.788883209228516, "global_step": 93998, "epoch": 1132} {"train_loss": -21.648481369018555, "global_step": 93999, "epoch": 1132} {"train_loss": -22.051054000854492, "global_step": 94000, "epoch": 1132} {"train_loss": -21.81907081604004, "global_step": 94001, "epoch": 1132} {"train_loss": -21.654340744018555, "global_step": 94002, "epoch": 1132} {"train_loss": -21.688480377197266, "global_step": 94003, "epoch": 1132} {"train_loss": -21.593048095703125, "global_step": 94004, "epoch": 1132} {"train_loss": -21.74107551574707, "global_step": 94005, "epoch": 1132} {"train_loss": -22.055233001708984, "global_step": 94006, "epoch": 1132} {"train_loss": -21.6669864654541, "global_step": 94007, "epoch": 1132} {"train_loss": -21.826963424682617, "global_step": 94008, "epoch": 1132} {"train_loss": -21.79669761657715, "global_step": 94009, "epoch": 1132} {"train_loss": -21.78323745727539, "global_step": 94010, "epoch": 1132} {"train_loss": -21.780664443969727, "global_step": 94011, "epoch": 1132} {"train_loss": -21.95020866394043, "global_step": 94012, "epoch": 1132} {"train_loss": -21.754608154296875, "global_step": 94013, "epoch": 1132} {"train_loss": -21.757883071899414, "global_step": 94014, "epoch": 1132} {"train_loss": -22.088106155395508, "global_step": 94015, "epoch": 1132} {"train_loss": -21.62009620666504, "global_step": 94016, "epoch": 1132} {"train_loss": -21.624807357788086, "global_step": 94017, "epoch": 1132} {"train_loss": -21.75600242614746, "global_step": 94018, "epoch": 1132} {"train_loss": -21.745662689208984, "global_step": 94019, "epoch": 1132} {"train_loss": -21.482603073120117, "global_step": 94020, "epoch": 1132} {"train_loss": -21.92573356628418, "global_step": 94021, "epoch": 1132} {"train_loss": -21.556798934936523, "global_step": 94022, "epoch": 1132} {"train_loss": -21.58316421508789, "global_step": 94023, "epoch": 1132} {"train_loss": -21.55817985534668, "global_step": 94024, "epoch": 1132} {"train_loss": -21.93820571899414, "global_step": 94025, "epoch": 1132} {"train_loss": -21.937170028686523, "global_step": 94026, "epoch": 1132} {"train_loss": -21.118988037109375, "global_step": 94027, "epoch": 1132} {"train_loss": -21.77484893798828, "global_step": 94028, "epoch": 1132} {"train_loss": -21.864334106445312, "global_step": 94029, "epoch": 1132} {"train_loss": -21.665424346923828, "global_step": 94030, "epoch": 1132} {"train_loss": -21.776594161987305, "global_step": 94031, "epoch": 1132} {"train_loss": -21.99909019470215, "global_step": 94032, "epoch": 1132} {"train_loss": -21.850894927978516, "global_step": 94033, "epoch": 1132} {"train_loss": -21.80356788635254, "global_step": 94034, "epoch": 1132} {"train_loss": -21.826467514038086, "global_step": 94035, "epoch": 1132} {"train_loss": -21.924270629882812, "global_step": 94036, "epoch": 1132} {"train_loss": -21.840646743774414, "global_step": 94037, "epoch": 1132} {"train_loss": -21.662735858595514, "global_step": 94038, "epoch": 1132, "val_loss": 6355024.0} {"train_loss": -21.427154541015625, "global_step": 94039, "epoch": 1133} {"train_loss": -21.449628829956055, "global_step": 94040, "epoch": 1133} {"train_loss": -21.715309143066406, "global_step": 94041, "epoch": 1133} {"train_loss": -21.64710807800293, "global_step": 94042, "epoch": 1133} {"train_loss": -21.44013023376465, "global_step": 94043, "epoch": 1133} {"train_loss": -21.736282348632812, "global_step": 94044, "epoch": 1133} {"train_loss": -21.658462524414062, "global_step": 94045, "epoch": 1133} {"train_loss": -21.533720016479492, "global_step": 94046, "epoch": 1133} {"train_loss": -21.580482482910156, "global_step": 94047, "epoch": 1133} {"train_loss": -21.386123657226562, "global_step": 94048, "epoch": 1133} {"train_loss": -21.66152000427246, "global_step": 94049, "epoch": 1133} {"train_loss": -21.48944664001465, "global_step": 94050, "epoch": 1133} {"train_loss": -21.782529830932617, "global_step": 94051, "epoch": 1133} {"train_loss": -21.54670524597168, "global_step": 94052, "epoch": 1133} {"train_loss": -21.688161849975586, "global_step": 94053, "epoch": 1133} {"train_loss": -21.754297256469727, "global_step": 94054, "epoch": 1133} {"train_loss": -21.540390014648438, "global_step": 94055, "epoch": 1133} {"train_loss": -21.689496994018555, "global_step": 94056, "epoch": 1133} {"train_loss": -21.698511123657227, "global_step": 94057, "epoch": 1133} {"train_loss": -21.74788475036621, "global_step": 94058, "epoch": 1133} {"train_loss": -21.74916648864746, "global_step": 94059, "epoch": 1133} {"train_loss": -21.691965103149414, "global_step": 94060, "epoch": 1133} {"train_loss": -22.011213302612305, "global_step": 94061, "epoch": 1133} {"train_loss": -21.67526626586914, "global_step": 94062, "epoch": 1133} {"train_loss": -21.779088973999023, "global_step": 94063, "epoch": 1133} {"train_loss": -21.59163475036621, "global_step": 94064, "epoch": 1133} {"train_loss": -21.867053985595703, "global_step": 94065, "epoch": 1133} {"train_loss": -21.734155654907227, "global_step": 94066, "epoch": 1133} {"train_loss": -21.7819766998291, "global_step": 94067, "epoch": 1133} {"train_loss": -21.543315887451172, "global_step": 94068, "epoch": 1133} {"train_loss": -22.0369930267334, "global_step": 94069, "epoch": 1133} {"train_loss": -21.49541664123535, "global_step": 94070, "epoch": 1133} {"train_loss": -21.521774291992188, "global_step": 94071, "epoch": 1133} {"train_loss": -21.571928024291992, "global_step": 94072, "epoch": 1133} {"train_loss": -21.72837257385254, "global_step": 94073, "epoch": 1133} {"train_loss": -21.42742347717285, "global_step": 94074, "epoch": 1133} {"train_loss": -21.932708740234375, "global_step": 94075, "epoch": 1133} {"train_loss": -21.584518432617188, "global_step": 94076, "epoch": 1133} {"train_loss": -22.097631454467773, "global_step": 94077, "epoch": 1133} {"train_loss": -21.582929611206055, "global_step": 94078, "epoch": 1133} {"train_loss": -21.91617202758789, "global_step": 94079, "epoch": 1133} {"train_loss": -21.601469039916992, "global_step": 94080, "epoch": 1133} {"train_loss": -21.511219024658203, "global_step": 94081, "epoch": 1133} {"train_loss": -21.744037628173828, "global_step": 94082, "epoch": 1133} {"train_loss": -21.936120986938477, "global_step": 94083, "epoch": 1133} {"train_loss": -21.764535903930664, "global_step": 94084, "epoch": 1133} {"train_loss": -21.664209365844727, "global_step": 94085, "epoch": 1133} {"train_loss": -21.78095817565918, "global_step": 94086, "epoch": 1133} {"train_loss": -22.04633140563965, "global_step": 94087, "epoch": 1133} {"train_loss": -21.564878463745117, "global_step": 94088, "epoch": 1133} {"train_loss": -21.927284240722656, "global_step": 94089, "epoch": 1133} {"train_loss": -21.8387508392334, "global_step": 94090, "epoch": 1133} {"train_loss": -21.77617835998535, "global_step": 94091, "epoch": 1133} {"train_loss": -21.594118118286133, "global_step": 94092, "epoch": 1133} {"train_loss": -22.164531707763672, "global_step": 94093, "epoch": 1133} {"train_loss": -22.075408935546875, "global_step": 94094, "epoch": 1133} {"train_loss": -21.912532806396484, "global_step": 94095, "epoch": 1133} {"train_loss": -22.078659057617188, "global_step": 94096, "epoch": 1133} {"train_loss": -21.54815673828125, "global_step": 94097, "epoch": 1133} {"train_loss": -21.54029655456543, "global_step": 94098, "epoch": 1133} {"train_loss": -22.141969680786133, "global_step": 94099, "epoch": 1133} {"train_loss": -21.639205932617188, "global_step": 94100, "epoch": 1133} {"train_loss": -21.81709861755371, "global_step": 94101, "epoch": 1133} {"train_loss": -21.84058952331543, "global_step": 94102, "epoch": 1133} {"train_loss": -21.804838180541992, "global_step": 94103, "epoch": 1133} {"train_loss": -21.499107360839844, "global_step": 94104, "epoch": 1133} {"train_loss": -21.54022216796875, "global_step": 94105, "epoch": 1133} {"train_loss": -21.894474029541016, "global_step": 94106, "epoch": 1133} {"train_loss": -21.840709686279297, "global_step": 94107, "epoch": 1133} {"train_loss": -21.51002311706543, "global_step": 94108, "epoch": 1133} {"train_loss": -21.375844955444336, "global_step": 94109, "epoch": 1133} {"train_loss": -21.964569091796875, "global_step": 94110, "epoch": 1133} {"train_loss": -21.84157943725586, "global_step": 94111, "epoch": 1133} {"train_loss": -21.678943634033203, "global_step": 94112, "epoch": 1133} {"train_loss": -21.88309097290039, "global_step": 94113, "epoch": 1133} {"train_loss": -21.413650512695312, "global_step": 94114, "epoch": 1133} {"train_loss": -21.45184326171875, "global_step": 94115, "epoch": 1133} {"train_loss": -21.965574264526367, "global_step": 94116, "epoch": 1133} {"train_loss": -21.739269256591797, "global_step": 94117, "epoch": 1133} {"train_loss": -21.55470085144043, "global_step": 94118, "epoch": 1133} {"train_loss": -21.602140426635742, "global_step": 94119, "epoch": 1133} {"train_loss": -21.931615829467773, "global_step": 94120, "epoch": 1133} {"train_loss": -21.708176555403742, "global_step": 94121, "epoch": 1133, "val_loss": 6151026.5} {"train_loss": -21.15830421447754, "global_step": 94122, "epoch": 1134} {"train_loss": -21.04719352722168, "global_step": 94123, "epoch": 1134} {"train_loss": -21.307193756103516, "global_step": 94124, "epoch": 1134} {"train_loss": -21.54498291015625, "global_step": 94125, "epoch": 1134} {"train_loss": -21.085708618164062, "global_step": 94126, "epoch": 1134} {"train_loss": -21.47018814086914, "global_step": 94127, "epoch": 1134} {"train_loss": -21.377731323242188, "global_step": 94128, "epoch": 1134} {"train_loss": -21.151611328125, "global_step": 94129, "epoch": 1134} {"train_loss": -21.814777374267578, "global_step": 94130, "epoch": 1134} {"train_loss": -21.651086807250977, "global_step": 94131, "epoch": 1134} {"train_loss": -21.634729385375977, "global_step": 94132, "epoch": 1134} {"train_loss": -21.83306312561035, "global_step": 94133, "epoch": 1134} {"train_loss": -22.27931785583496, "global_step": 94134, "epoch": 1134} {"train_loss": -21.277034759521484, "global_step": 94135, "epoch": 1134} {"train_loss": -21.592130661010742, "global_step": 94136, "epoch": 1134} {"train_loss": -21.544401168823242, "global_step": 94137, "epoch": 1134} {"train_loss": -21.679311752319336, "global_step": 94138, "epoch": 1134} {"train_loss": -21.5535888671875, "global_step": 94139, "epoch": 1134} {"train_loss": -21.533544540405273, "global_step": 94140, "epoch": 1134} {"train_loss": -22.0769100189209, "global_step": 94141, "epoch": 1134} {"train_loss": -21.5037841796875, "global_step": 94142, "epoch": 1134} {"train_loss": -21.67271614074707, "global_step": 94143, "epoch": 1134} {"train_loss": -21.98243522644043, "global_step": 94144, "epoch": 1134} {"train_loss": -21.654895782470703, "global_step": 94145, "epoch": 1134} {"train_loss": -21.638044357299805, "global_step": 94146, "epoch": 1134} {"train_loss": -21.844491958618164, "global_step": 94147, "epoch": 1134} {"train_loss": -21.651113510131836, "global_step": 94148, "epoch": 1134} {"train_loss": -21.50152015686035, "global_step": 94149, "epoch": 1134} {"train_loss": -21.550891876220703, "global_step": 94150, "epoch": 1134} {"train_loss": -22.03492546081543, "global_step": 94151, "epoch": 1134} {"train_loss": -21.77622413635254, "global_step": 94152, "epoch": 1134} {"train_loss": -21.700870513916016, "global_step": 94153, "epoch": 1134} {"train_loss": -21.929235458374023, "global_step": 94154, "epoch": 1134} {"train_loss": -21.783666610717773, "global_step": 94155, "epoch": 1134} {"train_loss": -21.689041137695312, "global_step": 94156, "epoch": 1134} {"train_loss": -21.530410766601562, "global_step": 94157, "epoch": 1134} {"train_loss": -21.68623161315918, "global_step": 94158, "epoch": 1134} {"train_loss": -21.77901268005371, "global_step": 94159, "epoch": 1134} {"train_loss": -21.868555068969727, "global_step": 94160, "epoch": 1134} {"train_loss": -21.909873962402344, "global_step": 94161, "epoch": 1134} {"train_loss": -21.923002243041992, "global_step": 94162, "epoch": 1134} {"train_loss": -21.6148681640625, "global_step": 94163, "epoch": 1134} {"train_loss": -21.840423583984375, "global_step": 94164, "epoch": 1134} {"train_loss": -21.614139556884766, "global_step": 94165, "epoch": 1134} {"train_loss": -21.817502975463867, "global_step": 94166, "epoch": 1134} {"train_loss": -22.021366119384766, "global_step": 94167, "epoch": 1134} {"train_loss": -21.292428970336914, "global_step": 94168, "epoch": 1134} {"train_loss": -21.723363876342773, "global_step": 94169, "epoch": 1134} {"train_loss": -21.38040542602539, "global_step": 94170, "epoch": 1134} {"train_loss": -21.888450622558594, "global_step": 94171, "epoch": 1134} {"train_loss": -21.736286163330078, "global_step": 94172, "epoch": 1134} {"train_loss": -22.163908004760742, "global_step": 94173, "epoch": 1134} {"train_loss": -21.60685920715332, "global_step": 94174, "epoch": 1134} {"train_loss": -22.072751998901367, "global_step": 94175, "epoch": 1134} {"train_loss": -21.626754760742188, "global_step": 94176, "epoch": 1134} {"train_loss": -21.603849411010742, "global_step": 94177, "epoch": 1134} {"train_loss": -21.614665985107422, "global_step": 94178, "epoch": 1134} {"train_loss": -21.51563835144043, "global_step": 94179, "epoch": 1134} {"train_loss": -21.940649032592773, "global_step": 94180, "epoch": 1134} {"train_loss": -21.39242935180664, "global_step": 94181, "epoch": 1134} {"train_loss": -21.48184585571289, "global_step": 94182, "epoch": 1134} {"train_loss": -21.751752853393555, "global_step": 94183, "epoch": 1134} {"train_loss": -21.483556747436523, "global_step": 94184, "epoch": 1134} {"train_loss": -21.748565673828125, "global_step": 94185, "epoch": 1134} {"train_loss": -21.6756534576416, "global_step": 94186, "epoch": 1134} {"train_loss": -21.5056095123291, "global_step": 94187, "epoch": 1134} {"train_loss": -21.8630313873291, "global_step": 94188, "epoch": 1134} {"train_loss": -21.643444061279297, "global_step": 94189, "epoch": 1134} {"train_loss": -21.763864517211914, "global_step": 94190, "epoch": 1134} {"train_loss": -21.69233512878418, "global_step": 94191, "epoch": 1134} {"train_loss": -21.610403060913086, "global_step": 94192, "epoch": 1134} {"train_loss": -21.586063385009766, "global_step": 94193, "epoch": 1134} {"train_loss": -21.622467041015625, "global_step": 94194, "epoch": 1134} {"train_loss": -21.985095977783203, "global_step": 94195, "epoch": 1134} {"train_loss": -21.982572555541992, "global_step": 94196, "epoch": 1134} {"train_loss": -21.842802047729492, "global_step": 94197, "epoch": 1134} {"train_loss": -21.476675033569336, "global_step": 94198, "epoch": 1134} {"train_loss": -22.011316299438477, "global_step": 94199, "epoch": 1134} {"train_loss": -21.894622802734375, "global_step": 94200, "epoch": 1134} {"train_loss": -21.591371536254883, "global_step": 94201, "epoch": 1134} {"train_loss": -21.455459594726562, "global_step": 94202, "epoch": 1134} {"train_loss": -21.96025848388672, "global_step": 94203, "epoch": 1134} {"train_loss": -21.674830723957843, "global_step": 94204, "epoch": 1134, "val_loss": 6091645.0} {"train_loss": -21.73019790649414, "global_step": 94205, "epoch": 1135} {"train_loss": -21.198078155517578, "global_step": 94206, "epoch": 1135} {"train_loss": -21.552427291870117, "global_step": 94207, "epoch": 1135} {"train_loss": -21.511777877807617, "global_step": 94208, "epoch": 1135} {"train_loss": -21.361616134643555, "global_step": 94209, "epoch": 1135} {"train_loss": -21.545745849609375, "global_step": 94210, "epoch": 1135} {"train_loss": -21.467683792114258, "global_step": 94211, "epoch": 1135} {"train_loss": -21.449533462524414, "global_step": 94212, "epoch": 1135} {"train_loss": -21.746854782104492, "global_step": 94213, "epoch": 1135} {"train_loss": -21.846179962158203, "global_step": 94214, "epoch": 1135} {"train_loss": -21.568349838256836, "global_step": 94215, "epoch": 1135} {"train_loss": -21.480649948120117, "global_step": 94216, "epoch": 1135} {"train_loss": -21.434980392456055, "global_step": 94217, "epoch": 1135} {"train_loss": -21.203115463256836, "global_step": 94218, "epoch": 1135} {"train_loss": -21.510150909423828, "global_step": 94219, "epoch": 1135} {"train_loss": -21.56648826599121, "global_step": 94220, "epoch": 1135} {"train_loss": -21.677127838134766, "global_step": 94221, "epoch": 1135} {"train_loss": -21.261850357055664, "global_step": 94222, "epoch": 1135} {"train_loss": -21.36236000061035, "global_step": 94223, "epoch": 1135} {"train_loss": -21.754247665405273, "global_step": 94224, "epoch": 1135} {"train_loss": -21.60512351989746, "global_step": 94225, "epoch": 1135} {"train_loss": -21.995569229125977, "global_step": 94226, "epoch": 1135} {"train_loss": -21.71384620666504, "global_step": 94227, "epoch": 1135} {"train_loss": -21.852285385131836, "global_step": 94228, "epoch": 1135} {"train_loss": -21.976308822631836, "global_step": 94229, "epoch": 1135} {"train_loss": -21.511554718017578, "global_step": 94230, "epoch": 1135} {"train_loss": -21.813093185424805, "global_step": 94231, "epoch": 1135} {"train_loss": -22.037744522094727, "global_step": 94232, "epoch": 1135} {"train_loss": -21.61212730407715, "global_step": 94233, "epoch": 1135} {"train_loss": -21.95021629333496, "global_step": 94234, "epoch": 1135} {"train_loss": -21.85409927368164, "global_step": 94235, "epoch": 1135} {"train_loss": -21.69205665588379, "global_step": 94236, "epoch": 1135} {"train_loss": -21.787382125854492, "global_step": 94237, "epoch": 1135} {"train_loss": -21.658374786376953, "global_step": 94238, "epoch": 1135} {"train_loss": -21.84031105041504, "global_step": 94239, "epoch": 1135} {"train_loss": -21.500036239624023, "global_step": 94240, "epoch": 1135} {"train_loss": -21.440732955932617, "global_step": 94241, "epoch": 1135} {"train_loss": -21.780811309814453, "global_step": 94242, "epoch": 1135} {"train_loss": -21.764211654663086, "global_step": 94243, "epoch": 1135} {"train_loss": -21.630847930908203, "global_step": 94244, "epoch": 1135} {"train_loss": -21.903776168823242, "global_step": 94245, "epoch": 1135} {"train_loss": -21.85212516784668, "global_step": 94246, "epoch": 1135} {"train_loss": -21.730085372924805, "global_step": 94247, "epoch": 1135} {"train_loss": -21.674619674682617, "global_step": 94248, "epoch": 1135} {"train_loss": -21.768348693847656, "global_step": 94249, "epoch": 1135} {"train_loss": -22.001575469970703, "global_step": 94250, "epoch": 1135} {"train_loss": -21.7557430267334, "global_step": 94251, "epoch": 1135} {"train_loss": -21.64198112487793, "global_step": 94252, "epoch": 1135} {"train_loss": -21.523096084594727, "global_step": 94253, "epoch": 1135} {"train_loss": -21.57913589477539, "global_step": 94254, "epoch": 1135} {"train_loss": -21.883543014526367, "global_step": 94255, "epoch": 1135} {"train_loss": -22.019899368286133, "global_step": 94256, "epoch": 1135} {"train_loss": -21.495206832885742, "global_step": 94257, "epoch": 1135} {"train_loss": -21.811777114868164, "global_step": 94258, "epoch": 1135} {"train_loss": -21.807485580444336, "global_step": 94259, "epoch": 1135} {"train_loss": -21.523136138916016, "global_step": 94260, "epoch": 1135} {"train_loss": -21.725507736206055, "global_step": 94261, "epoch": 1135} {"train_loss": -21.909204483032227, "global_step": 94262, "epoch": 1135} {"train_loss": -21.62016487121582, "global_step": 94263, "epoch": 1135} {"train_loss": -21.759174346923828, "global_step": 94264, "epoch": 1135} {"train_loss": -21.757572174072266, "global_step": 94265, "epoch": 1135} {"train_loss": -21.526050567626953, "global_step": 94266, "epoch": 1135} {"train_loss": -21.682275772094727, "global_step": 94267, "epoch": 1135} {"train_loss": -21.802045822143555, "global_step": 94268, "epoch": 1135} {"train_loss": -21.79816436767578, "global_step": 94269, "epoch": 1135} {"train_loss": -21.60453224182129, "global_step": 94270, "epoch": 1135} {"train_loss": -21.548704147338867, "global_step": 94271, "epoch": 1135} {"train_loss": -21.7808895111084, "global_step": 94272, "epoch": 1135} {"train_loss": -21.719404220581055, "global_step": 94273, "epoch": 1135} {"train_loss": -21.8060302734375, "global_step": 94274, "epoch": 1135} {"train_loss": -21.981863021850586, "global_step": 94275, "epoch": 1135} {"train_loss": -21.665990829467773, "global_step": 94276, "epoch": 1135} {"train_loss": -21.72368812561035, "global_step": 94277, "epoch": 1135} {"train_loss": -21.526090621948242, "global_step": 94278, "epoch": 1135} {"train_loss": -21.76131248474121, "global_step": 94279, "epoch": 1135} {"train_loss": -21.74995994567871, "global_step": 94280, "epoch": 1135} {"train_loss": -21.751218795776367, "global_step": 94281, "epoch": 1135} {"train_loss": -21.416833877563477, "global_step": 94282, "epoch": 1135} {"train_loss": -21.984785079956055, "global_step": 94283, "epoch": 1135} {"train_loss": -22.07917022705078, "global_step": 94284, "epoch": 1135} {"train_loss": -21.564367294311523, "global_step": 94285, "epoch": 1135} {"train_loss": -22.069719314575195, "global_step": 94286, "epoch": 1135} {"train_loss": -21.680607577404345, "global_step": 94287, "epoch": 1135, "val_loss": 6223077.0} {"train_loss": -21.183063507080078, "global_step": 94288, "epoch": 1136} {"train_loss": -21.32972526550293, "global_step": 94289, "epoch": 1136} {"train_loss": -21.638824462890625, "global_step": 94290, "epoch": 1136} {"train_loss": -21.3464412689209, "global_step": 94291, "epoch": 1136} {"train_loss": -21.105167388916016, "global_step": 94292, "epoch": 1136} {"train_loss": -21.488887786865234, "global_step": 94293, "epoch": 1136} {"train_loss": -21.74752426147461, "global_step": 94294, "epoch": 1136} {"train_loss": -21.4899845123291, "global_step": 94295, "epoch": 1136} {"train_loss": -21.46515464782715, "global_step": 94296, "epoch": 1136} {"train_loss": -21.513595581054688, "global_step": 94297, "epoch": 1136} {"train_loss": -21.27752113342285, "global_step": 94298, "epoch": 1136} {"train_loss": -21.516754150390625, "global_step": 94299, "epoch": 1136} {"train_loss": -21.627077102661133, "global_step": 94300, "epoch": 1136} {"train_loss": -21.16014862060547, "global_step": 94301, "epoch": 1136} {"train_loss": -21.639814376831055, "global_step": 94302, "epoch": 1136} {"train_loss": -21.73053741455078, "global_step": 94303, "epoch": 1136} {"train_loss": -21.50459098815918, "global_step": 94304, "epoch": 1136} {"train_loss": -21.626684188842773, "global_step": 94305, "epoch": 1136} {"train_loss": -21.655302047729492, "global_step": 94306, "epoch": 1136} {"train_loss": -21.553302764892578, "global_step": 94307, "epoch": 1136} {"train_loss": -21.3352108001709, "global_step": 94308, "epoch": 1136} {"train_loss": -21.409887313842773, "global_step": 94309, "epoch": 1136} {"train_loss": -21.785537719726562, "global_step": 94310, "epoch": 1136} {"train_loss": -21.370718002319336, "global_step": 94311, "epoch": 1136} {"train_loss": -21.652420043945312, "global_step": 94312, "epoch": 1136} {"train_loss": -21.71979331970215, "global_step": 94313, "epoch": 1136} {"train_loss": -21.83774757385254, "global_step": 94314, "epoch": 1136} {"train_loss": -21.348346710205078, "global_step": 94315, "epoch": 1136} {"train_loss": -21.6044979095459, "global_step": 94316, "epoch": 1136} {"train_loss": -21.659927368164062, "global_step": 94317, "epoch": 1136} {"train_loss": -21.920602798461914, "global_step": 94318, "epoch": 1136} {"train_loss": -21.76378059387207, "global_step": 94319, "epoch": 1136} {"train_loss": -21.86720848083496, "global_step": 94320, "epoch": 1136} {"train_loss": -21.776636123657227, "global_step": 94321, "epoch": 1136} {"train_loss": -21.829862594604492, "global_step": 94322, "epoch": 1136} {"train_loss": -21.73695182800293, "global_step": 94323, "epoch": 1136} {"train_loss": -22.105093002319336, "global_step": 94324, "epoch": 1136} {"train_loss": -21.74258804321289, "global_step": 94325, "epoch": 1136} {"train_loss": -21.931299209594727, "global_step": 94326, "epoch": 1136} {"train_loss": -21.479698181152344, "global_step": 94327, "epoch": 1136} {"train_loss": -21.375473022460938, "global_step": 94328, "epoch": 1136} {"train_loss": -21.6860408782959, "global_step": 94329, "epoch": 1136} {"train_loss": -21.772480010986328, "global_step": 94330, "epoch": 1136} {"train_loss": -21.645740509033203, "global_step": 94331, "epoch": 1136} {"train_loss": -21.54791259765625, "global_step": 94332, "epoch": 1136} {"train_loss": -21.12325096130371, "global_step": 94333, "epoch": 1136} {"train_loss": -21.830623626708984, "global_step": 94334, "epoch": 1136} {"train_loss": -21.76969337463379, "global_step": 94335, "epoch": 1136} {"train_loss": -21.48358154296875, "global_step": 94336, "epoch": 1136} {"train_loss": -21.825246810913086, "global_step": 94337, "epoch": 1136} {"train_loss": -21.448665618896484, "global_step": 94338, "epoch": 1136} {"train_loss": -21.72608757019043, "global_step": 94339, "epoch": 1136} {"train_loss": -21.9324893951416, "global_step": 94340, "epoch": 1136} {"train_loss": -21.325490951538086, "global_step": 94341, "epoch": 1136} {"train_loss": -21.672256469726562, "global_step": 94342, "epoch": 1136} {"train_loss": -21.505199432373047, "global_step": 94343, "epoch": 1136} {"train_loss": -21.526073455810547, "global_step": 94344, "epoch": 1136} {"train_loss": -21.716833114624023, "global_step": 94345, "epoch": 1136} {"train_loss": -21.934717178344727, "global_step": 94346, "epoch": 1136} {"train_loss": -22.03496742248535, "global_step": 94347, "epoch": 1136} {"train_loss": -21.86311912536621, "global_step": 94348, "epoch": 1136} {"train_loss": -21.79005241394043, "global_step": 94349, "epoch": 1136} {"train_loss": -21.72165298461914, "global_step": 94350, "epoch": 1136} {"train_loss": -21.41725730895996, "global_step": 94351, "epoch": 1136} {"train_loss": -21.540515899658203, "global_step": 94352, "epoch": 1136} {"train_loss": -22.027616500854492, "global_step": 94353, "epoch": 1136} {"train_loss": -21.771947860717773, "global_step": 94354, "epoch": 1136} {"train_loss": -21.910476684570312, "global_step": 94355, "epoch": 1136} {"train_loss": -21.86470603942871, "global_step": 94356, "epoch": 1136} {"train_loss": -21.541339874267578, "global_step": 94357, "epoch": 1136} {"train_loss": -22.01736831665039, "global_step": 94358, "epoch": 1136} {"train_loss": -21.993192672729492, "global_step": 94359, "epoch": 1136} {"train_loss": -21.907140731811523, "global_step": 94360, "epoch": 1136} {"train_loss": -21.863515853881836, "global_step": 94361, "epoch": 1136} {"train_loss": -22.0794620513916, "global_step": 94362, "epoch": 1136} {"train_loss": -21.717864990234375, "global_step": 94363, "epoch": 1136} {"train_loss": -21.807470321655273, "global_step": 94364, "epoch": 1136} {"train_loss": -21.70195960998535, "global_step": 94365, "epoch": 1136} {"train_loss": -21.89662742614746, "global_step": 94366, "epoch": 1136} {"train_loss": -21.778629302978516, "global_step": 94367, "epoch": 1136} {"train_loss": -21.594221115112305, "global_step": 94368, "epoch": 1136} {"train_loss": -22.27750015258789, "global_step": 94369, "epoch": 1136} {"train_loss": -21.660920269518012, "global_step": 94370, "epoch": 1136, "val_loss": 6202318.0} {"train_loss": -19.65181541442871, "global_step": 94371, "epoch": 1137} {"train_loss": -21.008535385131836, "global_step": 94372, "epoch": 1137} {"train_loss": -20.10062026977539, "global_step": 94373, "epoch": 1137} {"train_loss": -20.931398391723633, "global_step": 94374, "epoch": 1137} {"train_loss": -21.228561401367188, "global_step": 94375, "epoch": 1137} {"train_loss": -21.037782669067383, "global_step": 94376, "epoch": 1137} {"train_loss": -20.788066864013672, "global_step": 94377, "epoch": 1137} {"train_loss": -21.073545455932617, "global_step": 94378, "epoch": 1137} {"train_loss": -20.89621353149414, "global_step": 94379, "epoch": 1137} {"train_loss": -20.939884185791016, "global_step": 94380, "epoch": 1137} {"train_loss": -21.11920738220215, "global_step": 94381, "epoch": 1137} {"train_loss": -21.054960250854492, "global_step": 94382, "epoch": 1137} {"train_loss": -21.041515350341797, "global_step": 94383, "epoch": 1137} {"train_loss": -21.319171905517578, "global_step": 94384, "epoch": 1137} {"train_loss": -21.42622184753418, "global_step": 94385, "epoch": 1137} {"train_loss": -21.07010841369629, "global_step": 94386, "epoch": 1137} {"train_loss": -21.165136337280273, "global_step": 94387, "epoch": 1137} {"train_loss": -21.507619857788086, "global_step": 94388, "epoch": 1137} {"train_loss": -21.205028533935547, "global_step": 94389, "epoch": 1137} {"train_loss": -21.31294822692871, "global_step": 94390, "epoch": 1137} {"train_loss": -21.479312896728516, "global_step": 94391, "epoch": 1137} {"train_loss": -21.569677352905273, "global_step": 94392, "epoch": 1137} {"train_loss": -21.265018463134766, "global_step": 94393, "epoch": 1137} {"train_loss": -21.457706451416016, "global_step": 94394, "epoch": 1137} {"train_loss": -21.391071319580078, "global_step": 94395, "epoch": 1137} {"train_loss": -21.517908096313477, "global_step": 94396, "epoch": 1137} {"train_loss": -21.503040313720703, "global_step": 94397, "epoch": 1137} {"train_loss": -21.35688591003418, "global_step": 94398, "epoch": 1137} {"train_loss": -21.221817016601562, "global_step": 94399, "epoch": 1137} {"train_loss": -21.49260902404785, "global_step": 94400, "epoch": 1137} {"train_loss": -21.776029586791992, "global_step": 94401, "epoch": 1137} {"train_loss": -21.18439292907715, "global_step": 94402, "epoch": 1137} {"train_loss": -21.749860763549805, "global_step": 94403, "epoch": 1137} {"train_loss": -21.790029525756836, "global_step": 94404, "epoch": 1137} {"train_loss": -21.556854248046875, "global_step": 94405, "epoch": 1137} {"train_loss": -21.825672149658203, "global_step": 94406, "epoch": 1137} {"train_loss": -21.714496612548828, "global_step": 94407, "epoch": 1137} {"train_loss": -21.22587776184082, "global_step": 94408, "epoch": 1137} {"train_loss": -21.52954864501953, "global_step": 94409, "epoch": 1137} {"train_loss": -21.472196578979492, "global_step": 94410, "epoch": 1137} {"train_loss": -21.86098289489746, "global_step": 94411, "epoch": 1137} {"train_loss": -21.678518295288086, "global_step": 94412, "epoch": 1137} {"train_loss": -21.512218475341797, "global_step": 94413, "epoch": 1137} {"train_loss": -21.6763858795166, "global_step": 94414, "epoch": 1137} {"train_loss": -21.639678955078125, "global_step": 94415, "epoch": 1137} {"train_loss": -21.6980037689209, "global_step": 94416, "epoch": 1137} {"train_loss": -21.40755271911621, "global_step": 94417, "epoch": 1137} {"train_loss": -21.51376724243164, "global_step": 94418, "epoch": 1137} {"train_loss": -21.83925437927246, "global_step": 94419, "epoch": 1137} {"train_loss": -21.606969833374023, "global_step": 94420, "epoch": 1137} {"train_loss": -21.511205673217773, "global_step": 94421, "epoch": 1137} {"train_loss": -21.794931411743164, "global_step": 94422, "epoch": 1137} {"train_loss": -21.535131454467773, "global_step": 94423, "epoch": 1137} {"train_loss": -21.829448699951172, "global_step": 94424, "epoch": 1137} {"train_loss": -21.6464900970459, "global_step": 94425, "epoch": 1137} {"train_loss": -21.513090133666992, "global_step": 94426, "epoch": 1137} {"train_loss": -21.59651756286621, "global_step": 94427, "epoch": 1137} {"train_loss": -21.529285430908203, "global_step": 94428, "epoch": 1137} {"train_loss": -21.91257667541504, "global_step": 94429, "epoch": 1137} {"train_loss": -21.585813522338867, "global_step": 94430, "epoch": 1137} {"train_loss": -21.811506271362305, "global_step": 94431, "epoch": 1137} {"train_loss": -21.727731704711914, "global_step": 94432, "epoch": 1137} {"train_loss": -21.49639320373535, "global_step": 94433, "epoch": 1137} {"train_loss": -21.783979415893555, "global_step": 94434, "epoch": 1137} {"train_loss": -21.49376678466797, "global_step": 94435, "epoch": 1137} {"train_loss": -21.395511627197266, "global_step": 94436, "epoch": 1137} {"train_loss": -21.562732696533203, "global_step": 94437, "epoch": 1137} {"train_loss": -21.862775802612305, "global_step": 94438, "epoch": 1137} {"train_loss": -21.35128402709961, "global_step": 94439, "epoch": 1137} {"train_loss": -21.908735275268555, "global_step": 94440, "epoch": 1137} {"train_loss": -21.336938858032227, "global_step": 94441, "epoch": 1137} {"train_loss": -21.356098175048828, "global_step": 94442, "epoch": 1137} {"train_loss": -21.683698654174805, "global_step": 94443, "epoch": 1137} {"train_loss": -21.56442642211914, "global_step": 94444, "epoch": 1137} {"train_loss": -21.92140769958496, "global_step": 94445, "epoch": 1137} {"train_loss": -21.493574142456055, "global_step": 94446, "epoch": 1137} {"train_loss": -21.735567092895508, "global_step": 94447, "epoch": 1137} {"train_loss": -21.56357765197754, "global_step": 94448, "epoch": 1137} {"train_loss": -21.26410484313965, "global_step": 94449, "epoch": 1137} {"train_loss": -21.275562286376953, "global_step": 94450, "epoch": 1137} {"train_loss": -21.6318416595459, "global_step": 94451, "epoch": 1137} {"train_loss": -21.095373153686523, "global_step": 94452, "epoch": 1137} {"train_loss": -21.433461430561113, "global_step": 94453, "epoch": 1137, "val_loss": 6104683.0} {"train_loss": -21.605966567993164, "global_step": 94454, "epoch": 1138} {"train_loss": -21.472131729125977, "global_step": 94455, "epoch": 1138} {"train_loss": -21.313825607299805, "global_step": 94456, "epoch": 1138} {"train_loss": -21.636877059936523, "global_step": 94457, "epoch": 1138} {"train_loss": -21.770017623901367, "global_step": 94458, "epoch": 1138} {"train_loss": -21.743078231811523, "global_step": 94459, "epoch": 1138} {"train_loss": -21.48023796081543, "global_step": 94460, "epoch": 1138} {"train_loss": -21.6907901763916, "global_step": 94461, "epoch": 1138} {"train_loss": -21.400793075561523, "global_step": 94462, "epoch": 1138} {"train_loss": -21.571823120117188, "global_step": 94463, "epoch": 1138} {"train_loss": -21.691448211669922, "global_step": 94464, "epoch": 1138} {"train_loss": -21.529335021972656, "global_step": 94465, "epoch": 1138} {"train_loss": -21.943805694580078, "global_step": 94466, "epoch": 1138} {"train_loss": -21.503774642944336, "global_step": 94467, "epoch": 1138} {"train_loss": -21.65326499938965, "global_step": 94468, "epoch": 1138} {"train_loss": -21.7264347076416, "global_step": 94469, "epoch": 1138} {"train_loss": -21.25701904296875, "global_step": 94470, "epoch": 1138} {"train_loss": -21.687715530395508, "global_step": 94471, "epoch": 1138} {"train_loss": -21.389802932739258, "global_step": 94472, "epoch": 1138} {"train_loss": -21.366504669189453, "global_step": 94473, "epoch": 1138} {"train_loss": -21.797460556030273, "global_step": 94474, "epoch": 1138} {"train_loss": -21.3655948638916, "global_step": 94475, "epoch": 1138} {"train_loss": -21.96978759765625, "global_step": 94476, "epoch": 1138} {"train_loss": -21.638662338256836, "global_step": 94477, "epoch": 1138} {"train_loss": -21.917142868041992, "global_step": 94478, "epoch": 1138} {"train_loss": -21.872495651245117, "global_step": 94479, "epoch": 1138} {"train_loss": -21.91672706604004, "global_step": 94480, "epoch": 1138} {"train_loss": -21.736425399780273, "global_step": 94481, "epoch": 1138} {"train_loss": -21.8291072845459, "global_step": 94482, "epoch": 1138} {"train_loss": -21.45821189880371, "global_step": 94483, "epoch": 1138} {"train_loss": -21.59296989440918, "global_step": 94484, "epoch": 1138} {"train_loss": -21.905359268188477, "global_step": 94485, "epoch": 1138} {"train_loss": -21.528980255126953, "global_step": 94486, "epoch": 1138} {"train_loss": -21.737085342407227, "global_step": 94487, "epoch": 1138} {"train_loss": -22.198266983032227, "global_step": 94488, "epoch": 1138} {"train_loss": -21.457319259643555, "global_step": 94489, "epoch": 1138} {"train_loss": -21.67254066467285, "global_step": 94490, "epoch": 1138} {"train_loss": -21.71525764465332, "global_step": 94491, "epoch": 1138} {"train_loss": -21.992130279541016, "global_step": 94492, "epoch": 1138} {"train_loss": -21.85508155822754, "global_step": 94493, "epoch": 1138} {"train_loss": -22.28432846069336, "global_step": 94494, "epoch": 1138} {"train_loss": -21.47117042541504, "global_step": 94495, "epoch": 1138} {"train_loss": -21.658960342407227, "global_step": 94496, "epoch": 1138} {"train_loss": -21.726165771484375, "global_step": 94497, "epoch": 1138} {"train_loss": -21.88922691345215, "global_step": 94498, "epoch": 1138} {"train_loss": -21.44468116760254, "global_step": 94499, "epoch": 1138} {"train_loss": -21.756742477416992, "global_step": 94500, "epoch": 1138} {"train_loss": -22.0296573638916, "global_step": 94501, "epoch": 1138} {"train_loss": -21.773340225219727, "global_step": 94502, "epoch": 1138} {"train_loss": -21.819162368774414, "global_step": 94503, "epoch": 1138} {"train_loss": -21.84635353088379, "global_step": 94504, "epoch": 1138} {"train_loss": -21.743337631225586, "global_step": 94505, "epoch": 1138} {"train_loss": -21.873605728149414, "global_step": 94506, "epoch": 1138} {"train_loss": -22.19620704650879, "global_step": 94507, "epoch": 1138} {"train_loss": -21.78179931640625, "global_step": 94508, "epoch": 1138} {"train_loss": -21.438047409057617, "global_step": 94509, "epoch": 1138} {"train_loss": -21.6694393157959, "global_step": 94510, "epoch": 1138} {"train_loss": -21.981708526611328, "global_step": 94511, "epoch": 1138} {"train_loss": -21.809635162353516, "global_step": 94512, "epoch": 1138} {"train_loss": -21.925323486328125, "global_step": 94513, "epoch": 1138} {"train_loss": -22.047502517700195, "global_step": 94514, "epoch": 1138} {"train_loss": -21.631473541259766, "global_step": 94515, "epoch": 1138} {"train_loss": -21.930015563964844, "global_step": 94516, "epoch": 1138} {"train_loss": -21.589107513427734, "global_step": 94517, "epoch": 1138} {"train_loss": -22.02603530883789, "global_step": 94518, "epoch": 1138} {"train_loss": -21.673934936523438, "global_step": 94519, "epoch": 1138} {"train_loss": -21.494489669799805, "global_step": 94520, "epoch": 1138} {"train_loss": -22.192564010620117, "global_step": 94521, "epoch": 1138} {"train_loss": -21.746702194213867, "global_step": 94522, "epoch": 1138} {"train_loss": -21.656261444091797, "global_step": 94523, "epoch": 1138} {"train_loss": -21.356386184692383, "global_step": 94524, "epoch": 1138} {"train_loss": -21.744558334350586, "global_step": 94525, "epoch": 1138} {"train_loss": -21.788389205932617, "global_step": 94526, "epoch": 1138} {"train_loss": -21.358335494995117, "global_step": 94527, "epoch": 1138} {"train_loss": -21.782146453857422, "global_step": 94528, "epoch": 1138} {"train_loss": -21.7916202545166, "global_step": 94529, "epoch": 1138} {"train_loss": -21.569902420043945, "global_step": 94530, "epoch": 1138} {"train_loss": -21.673294067382812, "global_step": 94531, "epoch": 1138} {"train_loss": -21.70790672302246, "global_step": 94532, "epoch": 1138} {"train_loss": -21.68126106262207, "global_step": 94533, "epoch": 1138} {"train_loss": -21.924320220947266, "global_step": 94534, "epoch": 1138} {"train_loss": -21.66956901550293, "global_step": 94535, "epoch": 1138} {"train_loss": -21.695077597376812, "global_step": 94536, "epoch": 1138, "val_loss": 6138317.5} {"train_loss": -21.068021774291992, "global_step": 94537, "epoch": 1139} {"train_loss": -21.369617462158203, "global_step": 94538, "epoch": 1139} {"train_loss": -20.93959617614746, "global_step": 94539, "epoch": 1139} {"train_loss": -21.02743911743164, "global_step": 94540, "epoch": 1139} {"train_loss": -21.274616241455078, "global_step": 94541, "epoch": 1139} {"train_loss": -21.14711570739746, "global_step": 94542, "epoch": 1139} {"train_loss": -21.238088607788086, "global_step": 94543, "epoch": 1139} {"train_loss": -21.64702796936035, "global_step": 94544, "epoch": 1139} {"train_loss": -21.323501586914062, "global_step": 94545, "epoch": 1139} {"train_loss": -21.439186096191406, "global_step": 94546, "epoch": 1139} {"train_loss": -21.576644897460938, "global_step": 94547, "epoch": 1139} {"train_loss": -21.20870018005371, "global_step": 94548, "epoch": 1139} {"train_loss": -21.48471450805664, "global_step": 94549, "epoch": 1139} {"train_loss": -21.545555114746094, "global_step": 94550, "epoch": 1139} {"train_loss": -21.808738708496094, "global_step": 94551, "epoch": 1139} {"train_loss": -21.443815231323242, "global_step": 94552, "epoch": 1139} {"train_loss": -21.72422981262207, "global_step": 94553, "epoch": 1139} {"train_loss": -21.432493209838867, "global_step": 94554, "epoch": 1139} {"train_loss": -22.032997131347656, "global_step": 94555, "epoch": 1139} {"train_loss": -21.74678611755371, "global_step": 94556, "epoch": 1139} {"train_loss": -21.349477767944336, "global_step": 94557, "epoch": 1139} {"train_loss": -21.469478607177734, "global_step": 94558, "epoch": 1139} {"train_loss": -21.203689575195312, "global_step": 94559, "epoch": 1139} {"train_loss": -22.1280574798584, "global_step": 94560, "epoch": 1139} {"train_loss": -21.47759437561035, "global_step": 94561, "epoch": 1139} {"train_loss": -21.932741165161133, "global_step": 94562, "epoch": 1139} {"train_loss": -21.74517822265625, "global_step": 94563, "epoch": 1139} {"train_loss": -21.83717155456543, "global_step": 94564, "epoch": 1139} {"train_loss": -21.229373931884766, "global_step": 94565, "epoch": 1139} {"train_loss": -21.850303649902344, "global_step": 94566, "epoch": 1139} {"train_loss": -21.603010177612305, "global_step": 94567, "epoch": 1139} {"train_loss": -21.45920753479004, "global_step": 94568, "epoch": 1139} {"train_loss": -21.807809829711914, "global_step": 94569, "epoch": 1139} {"train_loss": -21.405057907104492, "global_step": 94570, "epoch": 1139} {"train_loss": -21.527555465698242, "global_step": 94571, "epoch": 1139} {"train_loss": -21.90838050842285, "global_step": 94572, "epoch": 1139} {"train_loss": -21.7930908203125, "global_step": 94573, "epoch": 1139} {"train_loss": -21.356029510498047, "global_step": 94574, "epoch": 1139} {"train_loss": -21.669950485229492, "global_step": 94575, "epoch": 1139} {"train_loss": -21.868335723876953, "global_step": 94576, "epoch": 1139} {"train_loss": -21.896162033081055, "global_step": 94577, "epoch": 1139} {"train_loss": -21.368757247924805, "global_step": 94578, "epoch": 1139} {"train_loss": -21.476511001586914, "global_step": 94579, "epoch": 1139} {"train_loss": -21.614055633544922, "global_step": 94580, "epoch": 1139} {"train_loss": -21.716781616210938, "global_step": 94581, "epoch": 1139} {"train_loss": -21.84571075439453, "global_step": 94582, "epoch": 1139} {"train_loss": -21.841476440429688, "global_step": 94583, "epoch": 1139} {"train_loss": -21.564273834228516, "global_step": 94584, "epoch": 1139} {"train_loss": -21.388599395751953, "global_step": 94585, "epoch": 1139} {"train_loss": -21.5151424407959, "global_step": 94586, "epoch": 1139} {"train_loss": -22.08446502685547, "global_step": 94587, "epoch": 1139} {"train_loss": -21.866239547729492, "global_step": 94588, "epoch": 1139} {"train_loss": -21.756750106811523, "global_step": 94589, "epoch": 1139} {"train_loss": -22.087339401245117, "global_step": 94590, "epoch": 1139} {"train_loss": -21.63504409790039, "global_step": 94591, "epoch": 1139} {"train_loss": -21.515384674072266, "global_step": 94592, "epoch": 1139} {"train_loss": -22.142099380493164, "global_step": 94593, "epoch": 1139} {"train_loss": -21.868091583251953, "global_step": 94594, "epoch": 1139} {"train_loss": -21.776416778564453, "global_step": 94595, "epoch": 1139} {"train_loss": -21.781707763671875, "global_step": 94596, "epoch": 1139} {"train_loss": -21.709672927856445, "global_step": 94597, "epoch": 1139} {"train_loss": -21.887983322143555, "global_step": 94598, "epoch": 1139} {"train_loss": -22.011762619018555, "global_step": 94599, "epoch": 1139} {"train_loss": -21.939634323120117, "global_step": 94600, "epoch": 1139} {"train_loss": -21.948150634765625, "global_step": 94601, "epoch": 1139} {"train_loss": -21.966861724853516, "global_step": 94602, "epoch": 1139} {"train_loss": -21.99518394470215, "global_step": 94603, "epoch": 1139} {"train_loss": -21.75664710998535, "global_step": 94604, "epoch": 1139} {"train_loss": -21.718109130859375, "global_step": 94605, "epoch": 1139} {"train_loss": -21.835941314697266, "global_step": 94606, "epoch": 1139} {"train_loss": -22.02207374572754, "global_step": 94607, "epoch": 1139} {"train_loss": -21.821428298950195, "global_step": 94608, "epoch": 1139} {"train_loss": -21.644241333007812, "global_step": 94609, "epoch": 1139} {"train_loss": -21.93466567993164, "global_step": 94610, "epoch": 1139} {"train_loss": -21.716934204101562, "global_step": 94611, "epoch": 1139} {"train_loss": -21.685346603393555, "global_step": 94612, "epoch": 1139} {"train_loss": -21.720178604125977, "global_step": 94613, "epoch": 1139} {"train_loss": -21.900381088256836, "global_step": 94614, "epoch": 1139} {"train_loss": -21.730051040649414, "global_step": 94615, "epoch": 1139} {"train_loss": -21.959447860717773, "global_step": 94616, "epoch": 1139} {"train_loss": -21.741533279418945, "global_step": 94617, "epoch": 1139} {"train_loss": -21.88028335571289, "global_step": 94618, "epoch": 1139} {"train_loss": -21.662896144820984, "global_step": 94619, "epoch": 1139, "val_loss": 6192904.0} {"train_loss": -21.137495040893555, "global_step": 94620, "epoch": 1140} {"train_loss": -21.402544021606445, "global_step": 94621, "epoch": 1140} {"train_loss": -21.73151969909668, "global_step": 94622, "epoch": 1140} {"train_loss": -21.79726219177246, "global_step": 94623, "epoch": 1140} {"train_loss": -21.476661682128906, "global_step": 94624, "epoch": 1140} {"train_loss": -21.312686920166016, "global_step": 94625, "epoch": 1140} {"train_loss": -21.203540802001953, "global_step": 94626, "epoch": 1140} {"train_loss": -21.488601684570312, "global_step": 94627, "epoch": 1140} {"train_loss": -21.255380630493164, "global_step": 94628, "epoch": 1140} {"train_loss": -20.84991455078125, "global_step": 94629, "epoch": 1140} {"train_loss": -21.370159149169922, "global_step": 94630, "epoch": 1140} {"train_loss": -21.554588317871094, "global_step": 94631, "epoch": 1140} {"train_loss": -21.626127243041992, "global_step": 94632, "epoch": 1140} {"train_loss": -21.608049392700195, "global_step": 94633, "epoch": 1140} {"train_loss": -21.462617874145508, "global_step": 94634, "epoch": 1140} {"train_loss": -21.65888023376465, "global_step": 94635, "epoch": 1140} {"train_loss": -21.704038619995117, "global_step": 94636, "epoch": 1140} {"train_loss": -21.6005859375, "global_step": 94637, "epoch": 1140} {"train_loss": -22.079980850219727, "global_step": 94638, "epoch": 1140} {"train_loss": -21.646642684936523, "global_step": 94639, "epoch": 1140} {"train_loss": -21.842458724975586, "global_step": 94640, "epoch": 1140} {"train_loss": -21.29782485961914, "global_step": 94641, "epoch": 1140} {"train_loss": -21.39569091796875, "global_step": 94642, "epoch": 1140} {"train_loss": -21.863210678100586, "global_step": 94643, "epoch": 1140} {"train_loss": -21.539575576782227, "global_step": 94644, "epoch": 1140} {"train_loss": -21.853483200073242, "global_step": 94645, "epoch": 1140} {"train_loss": -22.229846954345703, "global_step": 94646, "epoch": 1140} {"train_loss": -21.89444351196289, "global_step": 94647, "epoch": 1140} {"train_loss": -21.85993003845215, "global_step": 94648, "epoch": 1140} {"train_loss": -21.512086868286133, "global_step": 94649, "epoch": 1140} {"train_loss": -21.863725662231445, "global_step": 94650, "epoch": 1140} {"train_loss": -21.575714111328125, "global_step": 94651, "epoch": 1140} {"train_loss": -21.8483829498291, "global_step": 94652, "epoch": 1140} {"train_loss": -21.927579879760742, "global_step": 94653, "epoch": 1140} {"train_loss": -22.165273666381836, "global_step": 94654, "epoch": 1140} {"train_loss": -21.627904891967773, "global_step": 94655, "epoch": 1140} {"train_loss": -21.89828872680664, "global_step": 94656, "epoch": 1140} {"train_loss": -21.781301498413086, "global_step": 94657, "epoch": 1140} {"train_loss": -21.609033584594727, "global_step": 94658, "epoch": 1140} {"train_loss": -21.83548355102539, "global_step": 94659, "epoch": 1140} {"train_loss": -22.04652214050293, "global_step": 94660, "epoch": 1140} {"train_loss": -21.752857208251953, "global_step": 94661, "epoch": 1140} {"train_loss": -21.889253616333008, "global_step": 94662, "epoch": 1140} {"train_loss": -21.42290687561035, "global_step": 94663, "epoch": 1140} {"train_loss": -21.4659481048584, "global_step": 94664, "epoch": 1140} {"train_loss": -22.134870529174805, "global_step": 94665, "epoch": 1140} {"train_loss": -21.768325805664062, "global_step": 94666, "epoch": 1140} {"train_loss": -22.049301147460938, "global_step": 94667, "epoch": 1140} {"train_loss": -21.950721740722656, "global_step": 94668, "epoch": 1140} {"train_loss": -21.54530143737793, "global_step": 94669, "epoch": 1140} {"train_loss": -21.477649688720703, "global_step": 94670, "epoch": 1140} {"train_loss": -21.91422462463379, "global_step": 94671, "epoch": 1140} {"train_loss": -22.144771575927734, "global_step": 94672, "epoch": 1140} {"train_loss": -21.948776245117188, "global_step": 94673, "epoch": 1140} {"train_loss": -21.854047775268555, "global_step": 94674, "epoch": 1140} {"train_loss": -21.659931182861328, "global_step": 94675, "epoch": 1140} {"train_loss": -21.939970016479492, "global_step": 94676, "epoch": 1140} {"train_loss": -21.797269821166992, "global_step": 94677, "epoch": 1140} {"train_loss": -21.628746032714844, "global_step": 94678, "epoch": 1140} {"train_loss": -21.906919479370117, "global_step": 94679, "epoch": 1140} {"train_loss": -21.987104415893555, "global_step": 94680, "epoch": 1140} {"train_loss": -21.671066284179688, "global_step": 94681, "epoch": 1140} {"train_loss": -21.418977737426758, "global_step": 94682, "epoch": 1140} {"train_loss": -21.990812301635742, "global_step": 94683, "epoch": 1140} {"train_loss": -21.920366287231445, "global_step": 94684, "epoch": 1140} {"train_loss": -21.954740524291992, "global_step": 94685, "epoch": 1140} {"train_loss": -21.92367935180664, "global_step": 94686, "epoch": 1140} {"train_loss": -22.037752151489258, "global_step": 94687, "epoch": 1140} {"train_loss": -22.032983779907227, "global_step": 94688, "epoch": 1140} {"train_loss": -21.576330184936523, "global_step": 94689, "epoch": 1140} {"train_loss": -22.078725814819336, "global_step": 94690, "epoch": 1140} {"train_loss": -21.695331573486328, "global_step": 94691, "epoch": 1140} {"train_loss": -21.782794952392578, "global_step": 94692, "epoch": 1140} {"train_loss": -22.00703239440918, "global_step": 94693, "epoch": 1140} {"train_loss": -21.83318519592285, "global_step": 94694, "epoch": 1140} {"train_loss": -21.65081214904785, "global_step": 94695, "epoch": 1140} {"train_loss": -21.718406677246094, "global_step": 94696, "epoch": 1140} {"train_loss": -21.655725479125977, "global_step": 94697, "epoch": 1140} {"train_loss": -21.336606979370117, "global_step": 94698, "epoch": 1140} {"train_loss": -22.17801284790039, "global_step": 94699, "epoch": 1140} {"train_loss": -21.7401065826416, "global_step": 94700, "epoch": 1140} {"train_loss": -21.712783813476562, "global_step": 94701, "epoch": 1140} {"train_loss": -21.713816562330866, "global_step": 94702, "epoch": 1140, "val_loss": 6303781.0} {"train_loss": -21.413715362548828, "global_step": 94703, "epoch": 1141} {"train_loss": -21.797931671142578, "global_step": 94704, "epoch": 1141} {"train_loss": -21.687063217163086, "global_step": 94705, "epoch": 1141} {"train_loss": -21.888456344604492, "global_step": 94706, "epoch": 1141} {"train_loss": -22.02733039855957, "global_step": 94707, "epoch": 1141} {"train_loss": -21.349464416503906, "global_step": 94708, "epoch": 1141} {"train_loss": -21.382213592529297, "global_step": 94709, "epoch": 1141} {"train_loss": -21.730337142944336, "global_step": 94710, "epoch": 1141} {"train_loss": -21.41847038269043, "global_step": 94711, "epoch": 1141} {"train_loss": -21.31692886352539, "global_step": 94712, "epoch": 1141} {"train_loss": -21.819013595581055, "global_step": 94713, "epoch": 1141} {"train_loss": -21.925785064697266, "global_step": 94714, "epoch": 1141} {"train_loss": -21.81804847717285, "global_step": 94715, "epoch": 1141} {"train_loss": -22.056852340698242, "global_step": 94716, "epoch": 1141} {"train_loss": -21.612634658813477, "global_step": 94717, "epoch": 1141} {"train_loss": -21.732358932495117, "global_step": 94718, "epoch": 1141} {"train_loss": -22.17257308959961, "global_step": 94719, "epoch": 1141} {"train_loss": -21.564760208129883, "global_step": 94720, "epoch": 1141} {"train_loss": -21.5443172454834, "global_step": 94721, "epoch": 1141} {"train_loss": -21.851675033569336, "global_step": 94722, "epoch": 1141} {"train_loss": -21.328092575073242, "global_step": 94723, "epoch": 1141} {"train_loss": -21.374963760375977, "global_step": 94724, "epoch": 1141} {"train_loss": -21.52496910095215, "global_step": 94725, "epoch": 1141} {"train_loss": -21.58846664428711, "global_step": 94726, "epoch": 1141} {"train_loss": -21.568103790283203, "global_step": 94727, "epoch": 1141} {"train_loss": -21.73658561706543, "global_step": 94728, "epoch": 1141} {"train_loss": -21.837682723999023, "global_step": 94729, "epoch": 1141} {"train_loss": -21.560976028442383, "global_step": 94730, "epoch": 1141} {"train_loss": -21.77142906188965, "global_step": 94731, "epoch": 1141} {"train_loss": -22.14109230041504, "global_step": 94732, "epoch": 1141} {"train_loss": -21.61083984375, "global_step": 94733, "epoch": 1141} {"train_loss": -21.92340660095215, "global_step": 94734, "epoch": 1141} {"train_loss": -21.80049705505371, "global_step": 94735, "epoch": 1141} {"train_loss": -21.807180404663086, "global_step": 94736, "epoch": 1141} {"train_loss": -21.814794540405273, "global_step": 94737, "epoch": 1141} {"train_loss": -21.68195152282715, "global_step": 94738, "epoch": 1141} {"train_loss": -21.70268440246582, "global_step": 94739, "epoch": 1141} {"train_loss": -21.801267623901367, "global_step": 94740, "epoch": 1141} {"train_loss": -21.576581954956055, "global_step": 94741, "epoch": 1141} {"train_loss": -21.82206153869629, "global_step": 94742, "epoch": 1141} {"train_loss": -21.589954376220703, "global_step": 94743, "epoch": 1141} {"train_loss": -21.805015563964844, "global_step": 94744, "epoch": 1141} {"train_loss": -21.488723754882812, "global_step": 94745, "epoch": 1141} {"train_loss": -21.406219482421875, "global_step": 94746, "epoch": 1141} {"train_loss": -21.663259506225586, "global_step": 94747, "epoch": 1141} {"train_loss": -21.215322494506836, "global_step": 94748, "epoch": 1141} {"train_loss": -21.138444900512695, "global_step": 94749, "epoch": 1141} {"train_loss": -21.521207809448242, "global_step": 94750, "epoch": 1141} {"train_loss": -21.141193389892578, "global_step": 94751, "epoch": 1141} {"train_loss": -22.010202407836914, "global_step": 94752, "epoch": 1141} {"train_loss": -21.481494903564453, "global_step": 94753, "epoch": 1141} {"train_loss": -21.740041732788086, "global_step": 94754, "epoch": 1141} {"train_loss": -21.17975425720215, "global_step": 94755, "epoch": 1141} {"train_loss": -21.686771392822266, "global_step": 94756, "epoch": 1141} {"train_loss": -21.59212303161621, "global_step": 94757, "epoch": 1141} {"train_loss": -21.58882713317871, "global_step": 94758, "epoch": 1141} {"train_loss": -21.999067306518555, "global_step": 94759, "epoch": 1141} {"train_loss": -21.649322509765625, "global_step": 94760, "epoch": 1141} {"train_loss": -21.802227020263672, "global_step": 94761, "epoch": 1141} {"train_loss": -21.230792999267578, "global_step": 94762, "epoch": 1141} {"train_loss": -21.4945011138916, "global_step": 94763, "epoch": 1141} {"train_loss": -21.738037109375, "global_step": 94764, "epoch": 1141} {"train_loss": -21.840368270874023, "global_step": 94765, "epoch": 1141} {"train_loss": -21.54080581665039, "global_step": 94766, "epoch": 1141} {"train_loss": -21.77528953552246, "global_step": 94767, "epoch": 1141} {"train_loss": -21.902572631835938, "global_step": 94768, "epoch": 1141} {"train_loss": -21.82622718811035, "global_step": 94769, "epoch": 1141} {"train_loss": -21.38147735595703, "global_step": 94770, "epoch": 1141} {"train_loss": -21.524723052978516, "global_step": 94771, "epoch": 1141} {"train_loss": -21.9458065032959, "global_step": 94772, "epoch": 1141} {"train_loss": -21.613609313964844, "global_step": 94773, "epoch": 1141} {"train_loss": -21.69744300842285, "global_step": 94774, "epoch": 1141} {"train_loss": -21.597248077392578, "global_step": 94775, "epoch": 1141} {"train_loss": -21.70160484313965, "global_step": 94776, "epoch": 1141} {"train_loss": -21.971742630004883, "global_step": 94777, "epoch": 1141} {"train_loss": -21.641653060913086, "global_step": 94778, "epoch": 1141} {"train_loss": -22.062646865844727, "global_step": 94779, "epoch": 1141} {"train_loss": -21.619747161865234, "global_step": 94780, "epoch": 1141} {"train_loss": -21.984973907470703, "global_step": 94781, "epoch": 1141} {"train_loss": -21.546560287475586, "global_step": 94782, "epoch": 1141} {"train_loss": -21.8747615814209, "global_step": 94783, "epoch": 1141} {"train_loss": -21.951955795288086, "global_step": 94784, "epoch": 1141} {"train_loss": -21.700345786221057, "global_step": 94785, "epoch": 1141, "val_loss": 6252704.5} {"train_loss": -20.8782958984375, "global_step": 94786, "epoch": 1142} {"train_loss": -21.78158950805664, "global_step": 94787, "epoch": 1142} {"train_loss": -21.003149032592773, "global_step": 94788, "epoch": 1142} {"train_loss": -21.361806869506836, "global_step": 94789, "epoch": 1142} {"train_loss": -21.389057159423828, "global_step": 94790, "epoch": 1142} {"train_loss": -21.295591354370117, "global_step": 94791, "epoch": 1142} {"train_loss": -20.982255935668945, "global_step": 94792, "epoch": 1142} {"train_loss": -20.986461639404297, "global_step": 94793, "epoch": 1142} {"train_loss": -21.35861587524414, "global_step": 94794, "epoch": 1142} {"train_loss": -21.476186752319336, "global_step": 94795, "epoch": 1142} {"train_loss": -21.408784866333008, "global_step": 94796, "epoch": 1142} {"train_loss": -21.475250244140625, "global_step": 94797, "epoch": 1142} {"train_loss": -21.36228370666504, "global_step": 94798, "epoch": 1142} {"train_loss": -21.539695739746094, "global_step": 94799, "epoch": 1142} {"train_loss": -21.0897274017334, "global_step": 94800, "epoch": 1142} {"train_loss": -21.756803512573242, "global_step": 94801, "epoch": 1142} {"train_loss": -21.40920066833496, "global_step": 94802, "epoch": 1142} {"train_loss": -21.5709228515625, "global_step": 94803, "epoch": 1142} {"train_loss": -21.173755645751953, "global_step": 94804, "epoch": 1142} {"train_loss": -21.617856979370117, "global_step": 94805, "epoch": 1142} {"train_loss": -21.907901763916016, "global_step": 94806, "epoch": 1142} {"train_loss": -21.697961807250977, "global_step": 94807, "epoch": 1142} {"train_loss": -21.728967666625977, "global_step": 94808, "epoch": 1142} {"train_loss": -21.577049255371094, "global_step": 94809, "epoch": 1142} {"train_loss": -21.22344970703125, "global_step": 94810, "epoch": 1142} {"train_loss": -21.64319610595703, "global_step": 94811, "epoch": 1142} {"train_loss": -21.7965030670166, "global_step": 94812, "epoch": 1142} {"train_loss": -21.795835494995117, "global_step": 94813, "epoch": 1142} {"train_loss": -22.146221160888672, "global_step": 94814, "epoch": 1142} {"train_loss": -21.646726608276367, "global_step": 94815, "epoch": 1142} {"train_loss": -21.933746337890625, "global_step": 94816, "epoch": 1142} {"train_loss": -21.76301383972168, "global_step": 94817, "epoch": 1142} {"train_loss": -21.984960556030273, "global_step": 94818, "epoch": 1142} {"train_loss": -21.741748809814453, "global_step": 94819, "epoch": 1142} {"train_loss": -21.778499603271484, "global_step": 94820, "epoch": 1142} {"train_loss": -21.733671188354492, "global_step": 94821, "epoch": 1142} {"train_loss": -21.991682052612305, "global_step": 94822, "epoch": 1142} {"train_loss": -21.953039169311523, "global_step": 94823, "epoch": 1142} {"train_loss": -21.552724838256836, "global_step": 94824, "epoch": 1142} {"train_loss": -21.656757354736328, "global_step": 94825, "epoch": 1142} {"train_loss": -22.201948165893555, "global_step": 94826, "epoch": 1142} {"train_loss": -22.042354583740234, "global_step": 94827, "epoch": 1142} {"train_loss": -21.7602596282959, "global_step": 94828, "epoch": 1142} {"train_loss": -22.0776424407959, "global_step": 94829, "epoch": 1142} {"train_loss": -21.42282485961914, "global_step": 94830, "epoch": 1142} {"train_loss": -21.704532623291016, "global_step": 94831, "epoch": 1142} {"train_loss": -21.835763931274414, "global_step": 94832, "epoch": 1142} {"train_loss": -21.95246124267578, "global_step": 94833, "epoch": 1142} {"train_loss": -21.556365966796875, "global_step": 94834, "epoch": 1142} {"train_loss": -22.0069637298584, "global_step": 94835, "epoch": 1142} {"train_loss": -22.188993453979492, "global_step": 94836, "epoch": 1142} {"train_loss": -21.881704330444336, "global_step": 94837, "epoch": 1142} {"train_loss": -21.486419677734375, "global_step": 94838, "epoch": 1142} {"train_loss": -21.650653839111328, "global_step": 94839, "epoch": 1142} {"train_loss": -21.504066467285156, "global_step": 94840, "epoch": 1142} {"train_loss": -21.452375411987305, "global_step": 94841, "epoch": 1142} {"train_loss": -21.573137283325195, "global_step": 94842, "epoch": 1142} {"train_loss": -21.74744987487793, "global_step": 94843, "epoch": 1142} {"train_loss": -21.67085838317871, "global_step": 94844, "epoch": 1142} {"train_loss": -21.50621795654297, "global_step": 94845, "epoch": 1142} {"train_loss": -21.687902450561523, "global_step": 94846, "epoch": 1142} {"train_loss": -21.674959182739258, "global_step": 94847, "epoch": 1142} {"train_loss": -21.805326461791992, "global_step": 94848, "epoch": 1142} {"train_loss": -21.673614501953125, "global_step": 94849, "epoch": 1142} {"train_loss": -21.855661392211914, "global_step": 94850, "epoch": 1142} {"train_loss": -21.736328125, "global_step": 94851, "epoch": 1142} {"train_loss": -21.79010581970215, "global_step": 94852, "epoch": 1142} {"train_loss": -21.921955108642578, "global_step": 94853, "epoch": 1142} {"train_loss": -21.774015426635742, "global_step": 94854, "epoch": 1142} {"train_loss": -21.42622184753418, "global_step": 94855, "epoch": 1142} {"train_loss": -22.10233497619629, "global_step": 94856, "epoch": 1142} {"train_loss": -21.658483505249023, "global_step": 94857, "epoch": 1142} {"train_loss": -21.892667770385742, "global_step": 94858, "epoch": 1142} {"train_loss": -22.001562118530273, "global_step": 94859, "epoch": 1142} {"train_loss": -21.856861114501953, "global_step": 94860, "epoch": 1142} {"train_loss": -21.639902114868164, "global_step": 94861, "epoch": 1142} {"train_loss": -21.727584838867188, "global_step": 94862, "epoch": 1142} {"train_loss": -21.705556869506836, "global_step": 94863, "epoch": 1142} {"train_loss": -21.617895126342773, "global_step": 94864, "epoch": 1142} {"train_loss": -21.42063331604004, "global_step": 94865, "epoch": 1142} {"train_loss": -21.88787269592285, "global_step": 94866, "epoch": 1142} {"train_loss": -21.800451278686523, "global_step": 94867, "epoch": 1142} {"train_loss": -21.66494633778032, "global_step": 94868, "epoch": 1142, "val_loss": 6079233.0} {"train_loss": -21.525232315063477, "global_step": 94869, "epoch": 1143} {"train_loss": -21.313232421875, "global_step": 94870, "epoch": 1143} {"train_loss": -21.3077449798584, "global_step": 94871, "epoch": 1143} {"train_loss": -21.61703872680664, "global_step": 94872, "epoch": 1143} {"train_loss": -21.57147789001465, "global_step": 94873, "epoch": 1143} {"train_loss": -21.72814178466797, "global_step": 94874, "epoch": 1143} {"train_loss": -21.669437408447266, "global_step": 94875, "epoch": 1143} {"train_loss": -21.915790557861328, "global_step": 94876, "epoch": 1143} {"train_loss": -21.629730224609375, "global_step": 94877, "epoch": 1143} {"train_loss": -21.43146324157715, "global_step": 94878, "epoch": 1143} {"train_loss": -21.55441665649414, "global_step": 94879, "epoch": 1143} {"train_loss": -21.77008628845215, "global_step": 94880, "epoch": 1143} {"train_loss": -21.321937561035156, "global_step": 94881, "epoch": 1143} {"train_loss": -21.872114181518555, "global_step": 94882, "epoch": 1143} {"train_loss": -21.417194366455078, "global_step": 94883, "epoch": 1143} {"train_loss": -21.550601959228516, "global_step": 94884, "epoch": 1143} {"train_loss": -21.576210021972656, "global_step": 94885, "epoch": 1143} {"train_loss": -21.502653121948242, "global_step": 94886, "epoch": 1143} {"train_loss": -21.88825225830078, "global_step": 94887, "epoch": 1143} {"train_loss": -21.30389404296875, "global_step": 94888, "epoch": 1143} {"train_loss": -21.74272918701172, "global_step": 94889, "epoch": 1143} {"train_loss": -21.56039810180664, "global_step": 94890, "epoch": 1143} {"train_loss": -21.85443687438965, "global_step": 94891, "epoch": 1143} {"train_loss": -21.684009552001953, "global_step": 94892, "epoch": 1143} {"train_loss": -21.140316009521484, "global_step": 94893, "epoch": 1143} {"train_loss": -21.503904342651367, "global_step": 94894, "epoch": 1143} {"train_loss": -21.736196517944336, "global_step": 94895, "epoch": 1143} {"train_loss": -22.010839462280273, "global_step": 94896, "epoch": 1143} {"train_loss": -21.708341598510742, "global_step": 94897, "epoch": 1143} {"train_loss": -21.541929244995117, "global_step": 94898, "epoch": 1143} {"train_loss": -21.90407943725586, "global_step": 94899, "epoch": 1143} {"train_loss": -21.585050582885742, "global_step": 94900, "epoch": 1143} {"train_loss": -21.951719284057617, "global_step": 94901, "epoch": 1143} {"train_loss": -21.856801986694336, "global_step": 94902, "epoch": 1143} {"train_loss": -21.57000732421875, "global_step": 94903, "epoch": 1143} {"train_loss": -21.797483444213867, "global_step": 94904, "epoch": 1143} {"train_loss": -21.76161766052246, "global_step": 94905, "epoch": 1143} {"train_loss": -21.65877342224121, "global_step": 94906, "epoch": 1143} {"train_loss": -22.10040855407715, "global_step": 94907, "epoch": 1143} {"train_loss": -21.61172866821289, "global_step": 94908, "epoch": 1143} {"train_loss": -21.71578025817871, "global_step": 94909, "epoch": 1143} {"train_loss": -21.910730361938477, "global_step": 94910, "epoch": 1143} {"train_loss": -21.735485076904297, "global_step": 94911, "epoch": 1143} {"train_loss": -21.9439754486084, "global_step": 94912, "epoch": 1143} {"train_loss": -22.02391815185547, "global_step": 94913, "epoch": 1143} {"train_loss": -21.164148330688477, "global_step": 94914, "epoch": 1143} {"train_loss": -22.100971221923828, "global_step": 94915, "epoch": 1143} {"train_loss": -21.92119598388672, "global_step": 94916, "epoch": 1143} {"train_loss": -21.673187255859375, "global_step": 94917, "epoch": 1143} {"train_loss": -21.32594108581543, "global_step": 94918, "epoch": 1143} {"train_loss": -21.780920028686523, "global_step": 94919, "epoch": 1143} {"train_loss": -21.7801513671875, "global_step": 94920, "epoch": 1143} {"train_loss": -21.8700008392334, "global_step": 94921, "epoch": 1143} {"train_loss": -21.963134765625, "global_step": 94922, "epoch": 1143} {"train_loss": -21.916168212890625, "global_step": 94923, "epoch": 1143} {"train_loss": -21.538375854492188, "global_step": 94924, "epoch": 1143} {"train_loss": -21.611791610717773, "global_step": 94925, "epoch": 1143} {"train_loss": -21.390512466430664, "global_step": 94926, "epoch": 1143} {"train_loss": -21.66668701171875, "global_step": 94927, "epoch": 1143} {"train_loss": -21.889951705932617, "global_step": 94928, "epoch": 1143} {"train_loss": -21.373584747314453, "global_step": 94929, "epoch": 1143} {"train_loss": -21.54977798461914, "global_step": 94930, "epoch": 1143} {"train_loss": -21.866790771484375, "global_step": 94931, "epoch": 1143} {"train_loss": -21.53276252746582, "global_step": 94932, "epoch": 1143} {"train_loss": -21.49207878112793, "global_step": 94933, "epoch": 1143} {"train_loss": -21.56727409362793, "global_step": 94934, "epoch": 1143} {"train_loss": -21.94964027404785, "global_step": 94935, "epoch": 1143} {"train_loss": -21.930017471313477, "global_step": 94936, "epoch": 1143} {"train_loss": -21.97525978088379, "global_step": 94937, "epoch": 1143} {"train_loss": -21.89679527282715, "global_step": 94938, "epoch": 1143} {"train_loss": -21.727659225463867, "global_step": 94939, "epoch": 1143} {"train_loss": -21.928218841552734, "global_step": 94940, "epoch": 1143} {"train_loss": -21.705814361572266, "global_step": 94941, "epoch": 1143} {"train_loss": -22.09612464904785, "global_step": 94942, "epoch": 1143} {"train_loss": -22.0600528717041, "global_step": 94943, "epoch": 1143} {"train_loss": -21.694353103637695, "global_step": 94944, "epoch": 1143} {"train_loss": -21.898008346557617, "global_step": 94945, "epoch": 1143} {"train_loss": -22.032163619995117, "global_step": 94946, "epoch": 1143} {"train_loss": -21.9844970703125, "global_step": 94947, "epoch": 1143} {"train_loss": -21.754980087280273, "global_step": 94948, "epoch": 1143} {"train_loss": -21.91407585144043, "global_step": 94949, "epoch": 1143} {"train_loss": -21.87989616394043, "global_step": 94950, "epoch": 1143} {"train_loss": -21.716276950146778, "global_step": 94951, "epoch": 1143, "val_loss": 6136470.0} {"train_loss": -20.74139976501465, "global_step": 94952, "epoch": 1144} {"train_loss": -20.952871322631836, "global_step": 94953, "epoch": 1144} {"train_loss": -21.17287254333496, "global_step": 94954, "epoch": 1144} {"train_loss": -21.031522750854492, "global_step": 94955, "epoch": 1144} {"train_loss": -20.929901123046875, "global_step": 94956, "epoch": 1144} {"train_loss": -21.66892433166504, "global_step": 94957, "epoch": 1144} {"train_loss": -21.012617111206055, "global_step": 94958, "epoch": 1144} {"train_loss": -21.1171932220459, "global_step": 94959, "epoch": 1144} {"train_loss": -21.271474838256836, "global_step": 94960, "epoch": 1144} {"train_loss": -21.657621383666992, "global_step": 94961, "epoch": 1144} {"train_loss": -21.310565948486328, "global_step": 94962, "epoch": 1144} {"train_loss": -21.343881607055664, "global_step": 94963, "epoch": 1144} {"train_loss": -21.24108123779297, "global_step": 94964, "epoch": 1144} {"train_loss": -21.406009674072266, "global_step": 94965, "epoch": 1144} {"train_loss": -21.69516372680664, "global_step": 94966, "epoch": 1144} {"train_loss": -21.769702911376953, "global_step": 94967, "epoch": 1144} {"train_loss": -21.773252487182617, "global_step": 94968, "epoch": 1144} {"train_loss": -21.668466567993164, "global_step": 94969, "epoch": 1144} {"train_loss": -21.633726119995117, "global_step": 94970, "epoch": 1144} {"train_loss": -21.690412521362305, "global_step": 94971, "epoch": 1144} {"train_loss": -21.367586135864258, "global_step": 94972, "epoch": 1144} {"train_loss": -21.585590362548828, "global_step": 94973, "epoch": 1144} {"train_loss": -21.617172241210938, "global_step": 94974, "epoch": 1144} {"train_loss": -21.89736557006836, "global_step": 94975, "epoch": 1144} {"train_loss": -21.799951553344727, "global_step": 94976, "epoch": 1144} {"train_loss": -21.655134201049805, "global_step": 94977, "epoch": 1144} {"train_loss": -21.885766983032227, "global_step": 94978, "epoch": 1144} {"train_loss": -21.58603858947754, "global_step": 94979, "epoch": 1144} {"train_loss": -21.88283348083496, "global_step": 94980, "epoch": 1144} {"train_loss": -21.862960815429688, "global_step": 94981, "epoch": 1144} {"train_loss": -21.908926010131836, "global_step": 94982, "epoch": 1144} {"train_loss": -21.675451278686523, "global_step": 94983, "epoch": 1144} {"train_loss": -21.510778427124023, "global_step": 94984, "epoch": 1144} {"train_loss": -21.699586868286133, "global_step": 94985, "epoch": 1144} {"train_loss": -21.5563907623291, "global_step": 94986, "epoch": 1144} {"train_loss": -22.21450424194336, "global_step": 94987, "epoch": 1144} {"train_loss": -21.555456161499023, "global_step": 94988, "epoch": 1144} {"train_loss": -21.636865615844727, "global_step": 94989, "epoch": 1144} {"train_loss": -21.91950798034668, "global_step": 94990, "epoch": 1144} {"train_loss": -21.320966720581055, "global_step": 94991, "epoch": 1144} {"train_loss": -21.77791404724121, "global_step": 94992, "epoch": 1144} {"train_loss": -21.776567459106445, "global_step": 94993, "epoch": 1144} {"train_loss": -21.903982162475586, "global_step": 94994, "epoch": 1144} {"train_loss": -21.712223052978516, "global_step": 94995, "epoch": 1144} {"train_loss": -21.508413314819336, "global_step": 94996, "epoch": 1144} {"train_loss": -21.8186092376709, "global_step": 94997, "epoch": 1144} {"train_loss": -21.55071449279785, "global_step": 94998, "epoch": 1144} {"train_loss": -21.83547019958496, "global_step": 94999, "epoch": 1144} {"train_loss": -21.801877975463867, "global_step": 95000, "epoch": 1144} {"train_loss": -21.7004337310791, "global_step": 95001, "epoch": 1144} {"train_loss": -21.666418075561523, "global_step": 95002, "epoch": 1144} {"train_loss": -21.74555778503418, "global_step": 95003, "epoch": 1144} {"train_loss": -22.00254249572754, "global_step": 95004, "epoch": 1144} {"train_loss": -21.523544311523438, "global_step": 95005, "epoch": 1144} {"train_loss": -21.785322189331055, "global_step": 95006, "epoch": 1144} {"train_loss": -21.6523380279541, "global_step": 95007, "epoch": 1144} {"train_loss": -21.879186630249023, "global_step": 95008, "epoch": 1144} {"train_loss": -21.71327781677246, "global_step": 95009, "epoch": 1144} {"train_loss": -21.716833114624023, "global_step": 95010, "epoch": 1144} {"train_loss": -21.51094627380371, "global_step": 95011, "epoch": 1144} {"train_loss": -21.904945373535156, "global_step": 95012, "epoch": 1144} {"train_loss": -21.494962692260742, "global_step": 95013, "epoch": 1144} {"train_loss": -21.66231346130371, "global_step": 95014, "epoch": 1144} {"train_loss": -21.69624900817871, "global_step": 95015, "epoch": 1144} {"train_loss": -21.82796287536621, "global_step": 95016, "epoch": 1144} {"train_loss": -21.741493225097656, "global_step": 95017, "epoch": 1144} {"train_loss": -21.7152156829834, "global_step": 95018, "epoch": 1144} {"train_loss": -21.741458892822266, "global_step": 95019, "epoch": 1144} {"train_loss": -21.937543869018555, "global_step": 95020, "epoch": 1144} {"train_loss": -21.94820213317871, "global_step": 95021, "epoch": 1144} {"train_loss": -21.921646118164062, "global_step": 95022, "epoch": 1144} {"train_loss": -22.136404037475586, "global_step": 95023, "epoch": 1144} {"train_loss": -21.71055793762207, "global_step": 95024, "epoch": 1144} {"train_loss": -22.026004791259766, "global_step": 95025, "epoch": 1144} {"train_loss": -21.692096710205078, "global_step": 95026, "epoch": 1144} {"train_loss": -21.921777725219727, "global_step": 95027, "epoch": 1144} {"train_loss": -21.48229217529297, "global_step": 95028, "epoch": 1144} {"train_loss": -22.064054489135742, "global_step": 95029, "epoch": 1144} {"train_loss": -21.787458419799805, "global_step": 95030, "epoch": 1144} {"train_loss": -22.017868041992188, "global_step": 95031, "epoch": 1144} {"train_loss": -21.744462966918945, "global_step": 95032, "epoch": 1144} {"train_loss": -21.368942260742188, "global_step": 95033, "epoch": 1144} {"train_loss": -21.667096218430853, "global_step": 95034, "epoch": 1144, "val_loss": 5986309.0} {"train_loss": -21.61604881286621, "global_step": 95035, "epoch": 1145} {"train_loss": -21.62598991394043, "global_step": 95036, "epoch": 1145} {"train_loss": -21.440723419189453, "global_step": 95037, "epoch": 1145} {"train_loss": -21.436920166015625, "global_step": 95038, "epoch": 1145} {"train_loss": -21.614505767822266, "global_step": 95039, "epoch": 1145} {"train_loss": -21.520559310913086, "global_step": 95040, "epoch": 1145} {"train_loss": -21.662181854248047, "global_step": 95041, "epoch": 1145} {"train_loss": -21.074636459350586, "global_step": 95042, "epoch": 1145} {"train_loss": -21.580001831054688, "global_step": 95043, "epoch": 1145} {"train_loss": -21.70120620727539, "global_step": 95044, "epoch": 1145} {"train_loss": -21.725725173950195, "global_step": 95045, "epoch": 1145} {"train_loss": -21.501201629638672, "global_step": 95046, "epoch": 1145} {"train_loss": -21.60939598083496, "global_step": 95047, "epoch": 1145} {"train_loss": -21.71048927307129, "global_step": 95048, "epoch": 1145} {"train_loss": -21.79523277282715, "global_step": 95049, "epoch": 1145} {"train_loss": -21.475006103515625, "global_step": 95050, "epoch": 1145} {"train_loss": -21.494741439819336, "global_step": 95051, "epoch": 1145} {"train_loss": -21.39667510986328, "global_step": 95052, "epoch": 1145} {"train_loss": -21.748428344726562, "global_step": 95053, "epoch": 1145} {"train_loss": -21.576969146728516, "global_step": 95054, "epoch": 1145} {"train_loss": -21.86620330810547, "global_step": 95055, "epoch": 1145} {"train_loss": -21.791536331176758, "global_step": 95056, "epoch": 1145} {"train_loss": -21.626859664916992, "global_step": 95057, "epoch": 1145} {"train_loss": -21.59991455078125, "global_step": 95058, "epoch": 1145} {"train_loss": -21.51837921142578, "global_step": 95059, "epoch": 1145} {"train_loss": -21.691747665405273, "global_step": 95060, "epoch": 1145} {"train_loss": -21.75660514831543, "global_step": 95061, "epoch": 1145} {"train_loss": -21.886384963989258, "global_step": 95062, "epoch": 1145} {"train_loss": -21.711074829101562, "global_step": 95063, "epoch": 1145} {"train_loss": -21.652708053588867, "global_step": 95064, "epoch": 1145} {"train_loss": -21.646909713745117, "global_step": 95065, "epoch": 1145} {"train_loss": -21.73792266845703, "global_step": 95066, "epoch": 1145} {"train_loss": -21.779993057250977, "global_step": 95067, "epoch": 1145} {"train_loss": -21.50299835205078, "global_step": 95068, "epoch": 1145} {"train_loss": -21.635730743408203, "global_step": 95069, "epoch": 1145} {"train_loss": -21.237890243530273, "global_step": 95070, "epoch": 1145} {"train_loss": -21.76759910583496, "global_step": 95071, "epoch": 1145} {"train_loss": -21.843854904174805, "global_step": 95072, "epoch": 1145} {"train_loss": -21.743364334106445, "global_step": 95073, "epoch": 1145} {"train_loss": -22.13616943359375, "global_step": 95074, "epoch": 1145} {"train_loss": -21.819555282592773, "global_step": 95075, "epoch": 1145} {"train_loss": -21.735578536987305, "global_step": 95076, "epoch": 1145} {"train_loss": -22.248517990112305, "global_step": 95077, "epoch": 1145} {"train_loss": -21.665374755859375, "global_step": 95078, "epoch": 1145} {"train_loss": -21.727041244506836, "global_step": 95079, "epoch": 1145} {"train_loss": -22.084115982055664, "global_step": 95080, "epoch": 1145} {"train_loss": -21.879396438598633, "global_step": 95081, "epoch": 1145} {"train_loss": -21.689424514770508, "global_step": 95082, "epoch": 1145} {"train_loss": -21.785837173461914, "global_step": 95083, "epoch": 1145} {"train_loss": -21.920656204223633, "global_step": 95084, "epoch": 1145} {"train_loss": -21.8933162689209, "global_step": 95085, "epoch": 1145} {"train_loss": -21.571321487426758, "global_step": 95086, "epoch": 1145} {"train_loss": -21.899879455566406, "global_step": 95087, "epoch": 1145} {"train_loss": -21.585540771484375, "global_step": 95088, "epoch": 1145} {"train_loss": -21.617958068847656, "global_step": 95089, "epoch": 1145} {"train_loss": -21.565046310424805, "global_step": 95090, "epoch": 1145} {"train_loss": -21.644521713256836, "global_step": 95091, "epoch": 1145} {"train_loss": -21.812305450439453, "global_step": 95092, "epoch": 1145} {"train_loss": -21.912004470825195, "global_step": 95093, "epoch": 1145} {"train_loss": -21.583927154541016, "global_step": 95094, "epoch": 1145} {"train_loss": -21.418777465820312, "global_step": 95095, "epoch": 1145} {"train_loss": -21.504972457885742, "global_step": 95096, "epoch": 1145} {"train_loss": -21.82706642150879, "global_step": 95097, "epoch": 1145} {"train_loss": -21.944549560546875, "global_step": 95098, "epoch": 1145} {"train_loss": -21.956573486328125, "global_step": 95099, "epoch": 1145} {"train_loss": -21.616071701049805, "global_step": 95100, "epoch": 1145} {"train_loss": -21.141008377075195, "global_step": 95101, "epoch": 1145} {"train_loss": -22.007593154907227, "global_step": 95102, "epoch": 1145} {"train_loss": -21.849197387695312, "global_step": 95103, "epoch": 1145} {"train_loss": -21.684650421142578, "global_step": 95104, "epoch": 1145} {"train_loss": -21.76472282409668, "global_step": 95105, "epoch": 1145} {"train_loss": -22.044416427612305, "global_step": 95106, "epoch": 1145} {"train_loss": -21.86028480529785, "global_step": 95107, "epoch": 1145} {"train_loss": -21.83564567565918, "global_step": 95108, "epoch": 1145} {"train_loss": -21.7961483001709, "global_step": 95109, "epoch": 1145} {"train_loss": -21.933151245117188, "global_step": 95110, "epoch": 1145} {"train_loss": -22.069236755371094, "global_step": 95111, "epoch": 1145} {"train_loss": -21.709697723388672, "global_step": 95112, "epoch": 1145} {"train_loss": -21.692384719848633, "global_step": 95113, "epoch": 1145} {"train_loss": -21.760501861572266, "global_step": 95114, "epoch": 1145} {"train_loss": -21.88161849975586, "global_step": 95115, "epoch": 1145} {"train_loss": -21.93984603881836, "global_step": 95116, "epoch": 1145} {"train_loss": -21.718445697462702, "global_step": 95117, "epoch": 1145, "val_loss": 6279574.0} {"train_loss": -20.971946716308594, "global_step": 95118, "epoch": 1146} {"train_loss": -21.70187759399414, "global_step": 95119, "epoch": 1146} {"train_loss": -21.258691787719727, "global_step": 95120, "epoch": 1146} {"train_loss": -21.47821807861328, "global_step": 95121, "epoch": 1146} {"train_loss": -21.4945068359375, "global_step": 95122, "epoch": 1146} {"train_loss": -21.217195510864258, "global_step": 95123, "epoch": 1146} {"train_loss": -21.523767471313477, "global_step": 95124, "epoch": 1146} {"train_loss": -21.308212280273438, "global_step": 95125, "epoch": 1146} {"train_loss": -21.255672454833984, "global_step": 95126, "epoch": 1146} {"train_loss": -21.70692253112793, "global_step": 95127, "epoch": 1146} {"train_loss": -21.279035568237305, "global_step": 95128, "epoch": 1146} {"train_loss": -21.54286003112793, "global_step": 95129, "epoch": 1146} {"train_loss": -21.50180435180664, "global_step": 95130, "epoch": 1146} {"train_loss": -21.618589401245117, "global_step": 95131, "epoch": 1146} {"train_loss": -21.525466918945312, "global_step": 95132, "epoch": 1146} {"train_loss": -21.566999435424805, "global_step": 95133, "epoch": 1146} {"train_loss": -21.727067947387695, "global_step": 95134, "epoch": 1146} {"train_loss": -21.645523071289062, "global_step": 95135, "epoch": 1146} {"train_loss": -21.6029109954834, "global_step": 95136, "epoch": 1146} {"train_loss": -21.874862670898438, "global_step": 95137, "epoch": 1146} {"train_loss": -22.033918380737305, "global_step": 95138, "epoch": 1146} {"train_loss": -21.801006317138672, "global_step": 95139, "epoch": 1146} {"train_loss": -21.404333114624023, "global_step": 95140, "epoch": 1146} {"train_loss": -21.85028076171875, "global_step": 95141, "epoch": 1146} {"train_loss": -21.34014892578125, "global_step": 95142, "epoch": 1146} {"train_loss": -21.59638786315918, "global_step": 95143, "epoch": 1146} {"train_loss": -21.783580780029297, "global_step": 95144, "epoch": 1146} {"train_loss": -21.50371742248535, "global_step": 95145, "epoch": 1146} {"train_loss": -21.512516021728516, "global_step": 95146, "epoch": 1146} {"train_loss": -21.995542526245117, "global_step": 95147, "epoch": 1146} {"train_loss": -21.397781372070312, "global_step": 95148, "epoch": 1146} {"train_loss": -21.59918785095215, "global_step": 95149, "epoch": 1146} {"train_loss": -21.363256454467773, "global_step": 95150, "epoch": 1146} {"train_loss": -21.746726989746094, "global_step": 95151, "epoch": 1146} {"train_loss": -21.394285202026367, "global_step": 95152, "epoch": 1146} {"train_loss": -21.389142990112305, "global_step": 95153, "epoch": 1146} {"train_loss": -21.871868133544922, "global_step": 95154, "epoch": 1146} {"train_loss": -21.54572105407715, "global_step": 95155, "epoch": 1146} {"train_loss": -21.640697479248047, "global_step": 95156, "epoch": 1146} {"train_loss": -21.399967193603516, "global_step": 95157, "epoch": 1146} {"train_loss": -21.448633193969727, "global_step": 95158, "epoch": 1146} {"train_loss": -22.079435348510742, "global_step": 95159, "epoch": 1146} {"train_loss": -21.56991195678711, "global_step": 95160, "epoch": 1146} {"train_loss": -22.260862350463867, "global_step": 95161, "epoch": 1146} {"train_loss": -21.930227279663086, "global_step": 95162, "epoch": 1146} {"train_loss": -21.699312210083008, "global_step": 95163, "epoch": 1146} {"train_loss": -21.64984703063965, "global_step": 95164, "epoch": 1146} {"train_loss": -22.124053955078125, "global_step": 95165, "epoch": 1146} {"train_loss": -22.117290496826172, "global_step": 95166, "epoch": 1146} {"train_loss": -21.703088760375977, "global_step": 95167, "epoch": 1146} {"train_loss": -22.175092697143555, "global_step": 95168, "epoch": 1146} {"train_loss": -22.0408992767334, "global_step": 95169, "epoch": 1146} {"train_loss": -21.543001174926758, "global_step": 95170, "epoch": 1146} {"train_loss": -21.6446533203125, "global_step": 95171, "epoch": 1146} {"train_loss": -21.732254028320312, "global_step": 95172, "epoch": 1146} {"train_loss": -21.705184936523438, "global_step": 95173, "epoch": 1146} {"train_loss": -21.689712524414062, "global_step": 95174, "epoch": 1146} {"train_loss": -21.550565719604492, "global_step": 95175, "epoch": 1146} {"train_loss": -21.564067840576172, "global_step": 95176, "epoch": 1146} {"train_loss": -21.75949478149414, "global_step": 95177, "epoch": 1146} {"train_loss": -22.015626907348633, "global_step": 95178, "epoch": 1146} {"train_loss": -21.83834457397461, "global_step": 95179, "epoch": 1146} {"train_loss": -21.46978187561035, "global_step": 95180, "epoch": 1146} {"train_loss": -21.653215408325195, "global_step": 95181, "epoch": 1146} {"train_loss": -21.6578311920166, "global_step": 95182, "epoch": 1146} {"train_loss": -22.184904098510742, "global_step": 95183, "epoch": 1146} {"train_loss": -21.88209342956543, "global_step": 95184, "epoch": 1146} {"train_loss": -21.6239013671875, "global_step": 95185, "epoch": 1146} {"train_loss": -21.335729598999023, "global_step": 95186, "epoch": 1146} {"train_loss": -21.882125854492188, "global_step": 95187, "epoch": 1146} {"train_loss": -22.018659591674805, "global_step": 95188, "epoch": 1146} {"train_loss": -21.73992919921875, "global_step": 95189, "epoch": 1146} {"train_loss": -21.821624755859375, "global_step": 95190, "epoch": 1146} {"train_loss": -21.298131942749023, "global_step": 95191, "epoch": 1146} {"train_loss": -21.804458618164062, "global_step": 95192, "epoch": 1146} {"train_loss": -21.5732364654541, "global_step": 95193, "epoch": 1146} {"train_loss": -21.870447158813477, "global_step": 95194, "epoch": 1146} {"train_loss": -21.593713760375977, "global_step": 95195, "epoch": 1146} {"train_loss": -21.832319259643555, "global_step": 95196, "epoch": 1146} {"train_loss": -21.803163528442383, "global_step": 95197, "epoch": 1146} {"train_loss": -21.86031150817871, "global_step": 95198, "epoch": 1146} {"train_loss": -22.03475570678711, "global_step": 95199, "epoch": 1146} {"train_loss": -21.691740909254694, "global_step": 95200, "epoch": 1146, "val_loss": 6053491.5} {"train_loss": -21.045265197753906, "global_step": 95201, "epoch": 1147} {"train_loss": -21.035078048706055, "global_step": 95202, "epoch": 1147} {"train_loss": -21.232126235961914, "global_step": 95203, "epoch": 1147} {"train_loss": -21.267423629760742, "global_step": 95204, "epoch": 1147} {"train_loss": -21.74172019958496, "global_step": 95205, "epoch": 1147} {"train_loss": -21.486867904663086, "global_step": 95206, "epoch": 1147} {"train_loss": -21.57827377319336, "global_step": 95207, "epoch": 1147} {"train_loss": -21.439119338989258, "global_step": 95208, "epoch": 1147} {"train_loss": -21.346391677856445, "global_step": 95209, "epoch": 1147} {"train_loss": -21.376413345336914, "global_step": 95210, "epoch": 1147} {"train_loss": -21.629405975341797, "global_step": 95211, "epoch": 1147} {"train_loss": -21.37642478942871, "global_step": 95212, "epoch": 1147} {"train_loss": -21.734827041625977, "global_step": 95213, "epoch": 1147} {"train_loss": -21.67144203186035, "global_step": 95214, "epoch": 1147} {"train_loss": -21.419485092163086, "global_step": 95215, "epoch": 1147} {"train_loss": -21.367115020751953, "global_step": 95216, "epoch": 1147} {"train_loss": -21.661014556884766, "global_step": 95217, "epoch": 1147} {"train_loss": -21.578115463256836, "global_step": 95218, "epoch": 1147} {"train_loss": -21.638511657714844, "global_step": 95219, "epoch": 1147} {"train_loss": -21.713842391967773, "global_step": 95220, "epoch": 1147} {"train_loss": -21.891027450561523, "global_step": 95221, "epoch": 1147} {"train_loss": -21.95020866394043, "global_step": 95222, "epoch": 1147} {"train_loss": -21.833742141723633, "global_step": 95223, "epoch": 1147} {"train_loss": -22.260549545288086, "global_step": 95224, "epoch": 1147} {"train_loss": -21.870786666870117, "global_step": 95225, "epoch": 1147} {"train_loss": -21.879819869995117, "global_step": 95226, "epoch": 1147} {"train_loss": -21.657194137573242, "global_step": 95227, "epoch": 1147} {"train_loss": -22.20949363708496, "global_step": 95228, "epoch": 1147} {"train_loss": -21.5445613861084, "global_step": 95229, "epoch": 1147} {"train_loss": -21.80367088317871, "global_step": 95230, "epoch": 1147} {"train_loss": -21.9874267578125, "global_step": 95231, "epoch": 1147} {"train_loss": -21.58818244934082, "global_step": 95232, "epoch": 1147} {"train_loss": -21.704193115234375, "global_step": 95233, "epoch": 1147} {"train_loss": -21.608060836791992, "global_step": 95234, "epoch": 1147} {"train_loss": -21.17992401123047, "global_step": 95235, "epoch": 1147} {"train_loss": -21.43087387084961, "global_step": 95236, "epoch": 1147} {"train_loss": -21.934354782104492, "global_step": 95237, "epoch": 1147} {"train_loss": -21.652435302734375, "global_step": 95238, "epoch": 1147} {"train_loss": -22.031681060791016, "global_step": 95239, "epoch": 1147} {"train_loss": -21.74667739868164, "global_step": 95240, "epoch": 1147} {"train_loss": -22.138151168823242, "global_step": 95241, "epoch": 1147} {"train_loss": -21.738859176635742, "global_step": 95242, "epoch": 1147} {"train_loss": -21.898155212402344, "global_step": 95243, "epoch": 1147} {"train_loss": -21.5681095123291, "global_step": 95244, "epoch": 1147} {"train_loss": -21.794635772705078, "global_step": 95245, "epoch": 1147} {"train_loss": -21.645780563354492, "global_step": 95246, "epoch": 1147} {"train_loss": -21.49460220336914, "global_step": 95247, "epoch": 1147} {"train_loss": -21.90587615966797, "global_step": 95248, "epoch": 1147} {"train_loss": -21.50969886779785, "global_step": 95249, "epoch": 1147} {"train_loss": -21.505104064941406, "global_step": 95250, "epoch": 1147} {"train_loss": -21.98408317565918, "global_step": 95251, "epoch": 1147} {"train_loss": -21.67465591430664, "global_step": 95252, "epoch": 1147} {"train_loss": -21.635435104370117, "global_step": 95253, "epoch": 1147} {"train_loss": -21.890172958374023, "global_step": 95254, "epoch": 1147} {"train_loss": -21.810087203979492, "global_step": 95255, "epoch": 1147} {"train_loss": -21.873153686523438, "global_step": 95256, "epoch": 1147} {"train_loss": -22.098155975341797, "global_step": 95257, "epoch": 1147} {"train_loss": -21.746692657470703, "global_step": 95258, "epoch": 1147} {"train_loss": -22.160106658935547, "global_step": 95259, "epoch": 1147} {"train_loss": -22.204998016357422, "global_step": 95260, "epoch": 1147} {"train_loss": -21.39013671875, "global_step": 95261, "epoch": 1147} {"train_loss": -21.611417770385742, "global_step": 95262, "epoch": 1147} {"train_loss": -22.219724655151367, "global_step": 95263, "epoch": 1147} {"train_loss": -22.0615177154541, "global_step": 95264, "epoch": 1147} {"train_loss": -21.93534278869629, "global_step": 95265, "epoch": 1147} {"train_loss": -21.77773094177246, "global_step": 95266, "epoch": 1147} {"train_loss": -21.589941024780273, "global_step": 95267, "epoch": 1147} {"train_loss": -21.80054473876953, "global_step": 95268, "epoch": 1147} {"train_loss": -21.621814727783203, "global_step": 95269, "epoch": 1147} {"train_loss": -21.626388549804688, "global_step": 95270, "epoch": 1147} {"train_loss": -22.087112426757812, "global_step": 95271, "epoch": 1147} {"train_loss": -21.953250885009766, "global_step": 95272, "epoch": 1147} {"train_loss": -21.69884490966797, "global_step": 95273, "epoch": 1147} {"train_loss": -21.81270980834961, "global_step": 95274, "epoch": 1147} {"train_loss": -22.010324478149414, "global_step": 95275, "epoch": 1147} {"train_loss": -21.730398178100586, "global_step": 95276, "epoch": 1147} {"train_loss": -21.582626342773438, "global_step": 95277, "epoch": 1147} {"train_loss": -21.7309627532959, "global_step": 95278, "epoch": 1147} {"train_loss": -21.997861862182617, "global_step": 95279, "epoch": 1147} {"train_loss": -21.414794921875, "global_step": 95280, "epoch": 1147} {"train_loss": -21.826099395751953, "global_step": 95281, "epoch": 1147} {"train_loss": -21.60321044921875, "global_step": 95282, "epoch": 1147} {"train_loss": -21.70601605794516, "global_step": 95283, "epoch": 1147, "val_loss": 6153185.0} {"train_loss": -20.580541610717773, "global_step": 95284, "epoch": 1148} {"train_loss": -20.524694442749023, "global_step": 95285, "epoch": 1148} {"train_loss": -21.209074020385742, "global_step": 95286, "epoch": 1148} {"train_loss": -21.21754264831543, "global_step": 95287, "epoch": 1148} {"train_loss": -21.080041885375977, "global_step": 95288, "epoch": 1148} {"train_loss": -21.449241638183594, "global_step": 95289, "epoch": 1148} {"train_loss": -21.352575302124023, "global_step": 95290, "epoch": 1148} {"train_loss": -21.148311614990234, "global_step": 95291, "epoch": 1148} {"train_loss": -21.39881134033203, "global_step": 95292, "epoch": 1148} {"train_loss": -21.70145606994629, "global_step": 95293, "epoch": 1148} {"train_loss": -21.565536499023438, "global_step": 95294, "epoch": 1148} {"train_loss": -21.622018814086914, "global_step": 95295, "epoch": 1148} {"train_loss": -21.586463928222656, "global_step": 95296, "epoch": 1148} {"train_loss": -21.537790298461914, "global_step": 95297, "epoch": 1148} {"train_loss": -21.435504913330078, "global_step": 95298, "epoch": 1148} {"train_loss": -21.428997039794922, "global_step": 95299, "epoch": 1148} {"train_loss": -21.68707847595215, "global_step": 95300, "epoch": 1148} {"train_loss": -21.13080406188965, "global_step": 95301, "epoch": 1148} {"train_loss": -21.600507736206055, "global_step": 95302, "epoch": 1148} {"train_loss": -21.416990280151367, "global_step": 95303, "epoch": 1148} {"train_loss": -21.715986251831055, "global_step": 95304, "epoch": 1148} {"train_loss": -21.698471069335938, "global_step": 95305, "epoch": 1148} {"train_loss": -21.785995483398438, "global_step": 95306, "epoch": 1148} {"train_loss": -21.661792755126953, "global_step": 95307, "epoch": 1148} {"train_loss": -21.753122329711914, "global_step": 95308, "epoch": 1148} {"train_loss": -21.665363311767578, "global_step": 95309, "epoch": 1148} {"train_loss": -22.056394577026367, "global_step": 95310, "epoch": 1148} {"train_loss": -21.531869888305664, "global_step": 95311, "epoch": 1148} {"train_loss": -21.999134063720703, "global_step": 95312, "epoch": 1148} {"train_loss": -21.752105712890625, "global_step": 95313, "epoch": 1148} {"train_loss": -22.032873153686523, "global_step": 95314, "epoch": 1148} {"train_loss": -21.56304359436035, "global_step": 95315, "epoch": 1148} {"train_loss": -21.735910415649414, "global_step": 95316, "epoch": 1148} {"train_loss": -21.976531982421875, "global_step": 95317, "epoch": 1148} {"train_loss": -21.816381454467773, "global_step": 95318, "epoch": 1148} {"train_loss": -22.126760482788086, "global_step": 95319, "epoch": 1148} {"train_loss": -21.755813598632812, "global_step": 95320, "epoch": 1148} {"train_loss": -22.19270896911621, "global_step": 95321, "epoch": 1148} {"train_loss": -21.833364486694336, "global_step": 95322, "epoch": 1148} {"train_loss": -21.583036422729492, "global_step": 95323, "epoch": 1148} {"train_loss": -21.755910873413086, "global_step": 95324, "epoch": 1148} {"train_loss": -21.830307006835938, "global_step": 95325, "epoch": 1148} {"train_loss": -21.496074676513672, "global_step": 95326, "epoch": 1148} {"train_loss": -21.440462112426758, "global_step": 95327, "epoch": 1148} {"train_loss": -21.706464767456055, "global_step": 95328, "epoch": 1148} {"train_loss": -21.642709732055664, "global_step": 95329, "epoch": 1148} {"train_loss": -21.80582046508789, "global_step": 95330, "epoch": 1148} {"train_loss": -21.84537696838379, "global_step": 95331, "epoch": 1148} {"train_loss": -21.613576889038086, "global_step": 95332, "epoch": 1148} {"train_loss": -21.33249282836914, "global_step": 95333, "epoch": 1148} {"train_loss": -21.490589141845703, "global_step": 95334, "epoch": 1148} {"train_loss": -21.917888641357422, "global_step": 95335, "epoch": 1148} {"train_loss": -21.623947143554688, "global_step": 95336, "epoch": 1148} {"train_loss": -22.0821590423584, "global_step": 95337, "epoch": 1148} {"train_loss": -21.90216064453125, "global_step": 95338, "epoch": 1148} {"train_loss": -22.247928619384766, "global_step": 95339, "epoch": 1148} {"train_loss": -21.73906898498535, "global_step": 95340, "epoch": 1148} {"train_loss": -21.793912887573242, "global_step": 95341, "epoch": 1148} {"train_loss": -22.00949478149414, "global_step": 95342, "epoch": 1148} {"train_loss": -21.95659828186035, "global_step": 95343, "epoch": 1148} {"train_loss": -22.250614166259766, "global_step": 95344, "epoch": 1148} {"train_loss": -21.83866310119629, "global_step": 95345, "epoch": 1148} {"train_loss": -21.571659088134766, "global_step": 95346, "epoch": 1148} {"train_loss": -21.810758590698242, "global_step": 95347, "epoch": 1148} {"train_loss": -21.74416160583496, "global_step": 95348, "epoch": 1148} {"train_loss": -21.497509002685547, "global_step": 95349, "epoch": 1148} {"train_loss": -21.59041976928711, "global_step": 95350, "epoch": 1148} {"train_loss": -22.045394897460938, "global_step": 95351, "epoch": 1148} {"train_loss": -21.920549392700195, "global_step": 95352, "epoch": 1148} {"train_loss": -21.864288330078125, "global_step": 95353, "epoch": 1148} {"train_loss": -21.95590591430664, "global_step": 95354, "epoch": 1148} {"train_loss": -21.600719451904297, "global_step": 95355, "epoch": 1148} {"train_loss": -21.670682907104492, "global_step": 95356, "epoch": 1148} {"train_loss": -21.68560791015625, "global_step": 95357, "epoch": 1148} {"train_loss": -21.437292098999023, "global_step": 95358, "epoch": 1148} {"train_loss": -21.829936981201172, "global_step": 95359, "epoch": 1148} {"train_loss": -21.33341407775879, "global_step": 95360, "epoch": 1148} {"train_loss": -21.749120712280273, "global_step": 95361, "epoch": 1148} {"train_loss": -21.974760055541992, "global_step": 95362, "epoch": 1148} {"train_loss": -21.824926376342773, "global_step": 95363, "epoch": 1148} {"train_loss": -21.3767147064209, "global_step": 95364, "epoch": 1148} {"train_loss": -21.92682456970215, "global_step": 95365, "epoch": 1148} {"train_loss": -21.688712154526307, "global_step": 95366, "epoch": 1148, "val_loss": 6091323.5} {"train_loss": -20.918180465698242, "global_step": 95367, "epoch": 1149} {"train_loss": -21.441574096679688, "global_step": 95368, "epoch": 1149} {"train_loss": -21.577138900756836, "global_step": 95369, "epoch": 1149} {"train_loss": -21.473703384399414, "global_step": 95370, "epoch": 1149} {"train_loss": -20.907485961914062, "global_step": 95371, "epoch": 1149} {"train_loss": -21.812814712524414, "global_step": 95372, "epoch": 1149} {"train_loss": -21.567445755004883, "global_step": 95373, "epoch": 1149} {"train_loss": -21.63384246826172, "global_step": 95374, "epoch": 1149} {"train_loss": -21.8801326751709, "global_step": 95375, "epoch": 1149} {"train_loss": -21.409589767456055, "global_step": 95376, "epoch": 1149} {"train_loss": -21.618003845214844, "global_step": 95377, "epoch": 1149} {"train_loss": -21.653554916381836, "global_step": 95378, "epoch": 1149} {"train_loss": -21.594511032104492, "global_step": 95379, "epoch": 1149} {"train_loss": -21.3173885345459, "global_step": 95380, "epoch": 1149} {"train_loss": -21.672809600830078, "global_step": 95381, "epoch": 1149} {"train_loss": -21.4371337890625, "global_step": 95382, "epoch": 1149} {"train_loss": -21.99165916442871, "global_step": 95383, "epoch": 1149} {"train_loss": -21.67781639099121, "global_step": 95384, "epoch": 1149} {"train_loss": -21.59322166442871, "global_step": 95385, "epoch": 1149} {"train_loss": -21.874530792236328, "global_step": 95386, "epoch": 1149} {"train_loss": -21.715749740600586, "global_step": 95387, "epoch": 1149} {"train_loss": -21.723569869995117, "global_step": 95388, "epoch": 1149} {"train_loss": -21.794178009033203, "global_step": 95389, "epoch": 1149} {"train_loss": -21.9321346282959, "global_step": 95390, "epoch": 1149} {"train_loss": -21.608726501464844, "global_step": 95391, "epoch": 1149} {"train_loss": -21.72316551208496, "global_step": 95392, "epoch": 1149} {"train_loss": -21.770200729370117, "global_step": 95393, "epoch": 1149} {"train_loss": -21.68134880065918, "global_step": 95394, "epoch": 1149} {"train_loss": -21.7318172454834, "global_step": 95395, "epoch": 1149} {"train_loss": -21.812347412109375, "global_step": 95396, "epoch": 1149} {"train_loss": -21.67642593383789, "global_step": 95397, "epoch": 1149} {"train_loss": -21.55841636657715, "global_step": 95398, "epoch": 1149} {"train_loss": -21.71303367614746, "global_step": 95399, "epoch": 1149} {"train_loss": -21.71382713317871, "global_step": 95400, "epoch": 1149} {"train_loss": -21.92911148071289, "global_step": 95401, "epoch": 1149} {"train_loss": -21.814416885375977, "global_step": 95402, "epoch": 1149} {"train_loss": -21.670461654663086, "global_step": 95403, "epoch": 1149} {"train_loss": -21.649394989013672, "global_step": 95404, "epoch": 1149} {"train_loss": -21.416532516479492, "global_step": 95405, "epoch": 1149} {"train_loss": -21.91489028930664, "global_step": 95406, "epoch": 1149} {"train_loss": -21.723276138305664, "global_step": 95407, "epoch": 1149} {"train_loss": -21.766677856445312, "global_step": 95408, "epoch": 1149} {"train_loss": -21.815017700195312, "global_step": 95409, "epoch": 1149} {"train_loss": -21.87653350830078, "global_step": 95410, "epoch": 1149} {"train_loss": -22.183853149414062, "global_step": 95411, "epoch": 1149} {"train_loss": -21.9188232421875, "global_step": 95412, "epoch": 1149} {"train_loss": -21.934972763061523, "global_step": 95413, "epoch": 1149} {"train_loss": -21.62880516052246, "global_step": 95414, "epoch": 1149} {"train_loss": -21.242883682250977, "global_step": 95415, "epoch": 1149} {"train_loss": -21.74916648864746, "global_step": 95416, "epoch": 1149} {"train_loss": -21.633665084838867, "global_step": 95417, "epoch": 1149} {"train_loss": -22.05253028869629, "global_step": 95418, "epoch": 1149} {"train_loss": -22.06198501586914, "global_step": 95419, "epoch": 1149} {"train_loss": -22.046539306640625, "global_step": 95420, "epoch": 1149} {"train_loss": -22.050125122070312, "global_step": 95421, "epoch": 1149} {"train_loss": -21.605422973632812, "global_step": 95422, "epoch": 1149} {"train_loss": -22.39688491821289, "global_step": 95423, "epoch": 1149} {"train_loss": -21.53464126586914, "global_step": 95424, "epoch": 1149} {"train_loss": -21.45261573791504, "global_step": 95425, "epoch": 1149} {"train_loss": -22.06959342956543, "global_step": 95426, "epoch": 1149} {"train_loss": -22.016828536987305, "global_step": 95427, "epoch": 1149} {"train_loss": -21.784372329711914, "global_step": 95428, "epoch": 1149} {"train_loss": -21.763219833374023, "global_step": 95429, "epoch": 1149} {"train_loss": -21.8321533203125, "global_step": 95430, "epoch": 1149} {"train_loss": -21.544031143188477, "global_step": 95431, "epoch": 1149} {"train_loss": -21.542654037475586, "global_step": 95432, "epoch": 1149} {"train_loss": -22.249408721923828, "global_step": 95433, "epoch": 1149} {"train_loss": -21.6219482421875, "global_step": 95434, "epoch": 1149} {"train_loss": -22.17549705505371, "global_step": 95435, "epoch": 1149} {"train_loss": -21.987947463989258, "global_step": 95436, "epoch": 1149} {"train_loss": -21.560911178588867, "global_step": 95437, "epoch": 1149} {"train_loss": -21.82612419128418, "global_step": 95438, "epoch": 1149} {"train_loss": -21.700275421142578, "global_step": 95439, "epoch": 1149} {"train_loss": -21.538875579833984, "global_step": 95440, "epoch": 1149} {"train_loss": -21.73219108581543, "global_step": 95441, "epoch": 1149} {"train_loss": -21.83700942993164, "global_step": 95442, "epoch": 1149} {"train_loss": -21.81184196472168, "global_step": 95443, "epoch": 1149} {"train_loss": -21.987043380737305, "global_step": 95444, "epoch": 1149} {"train_loss": -21.994535446166992, "global_step": 95445, "epoch": 1149} {"train_loss": -21.671796798706055, "global_step": 95446, "epoch": 1149} {"train_loss": -21.754423141479492, "global_step": 95447, "epoch": 1149} {"train_loss": -21.803909301757812, "global_step": 95448, "epoch": 1149} {"train_loss": -21.733911606202643, "global_step": 95449, "epoch": 1149, "val_loss": 6050797.5} {"train_loss": -21.52882957458496, "global_step": 95450, "epoch": 1150} {"train_loss": -21.22022247314453, "global_step": 95451, "epoch": 1150} {"train_loss": -21.87569236755371, "global_step": 95452, "epoch": 1150} {"train_loss": -21.133386611938477, "global_step": 95453, "epoch": 1150} {"train_loss": -21.361661911010742, "global_step": 95454, "epoch": 1150} {"train_loss": -21.469953536987305, "global_step": 95455, "epoch": 1150} {"train_loss": -21.328161239624023, "global_step": 95456, "epoch": 1150} {"train_loss": -21.745359420776367, "global_step": 95457, "epoch": 1150} {"train_loss": -21.267955780029297, "global_step": 95458, "epoch": 1150} {"train_loss": -21.28700828552246, "global_step": 95459, "epoch": 1150} {"train_loss": -21.610794067382812, "global_step": 95460, "epoch": 1150} {"train_loss": -21.518291473388672, "global_step": 95461, "epoch": 1150} {"train_loss": -21.106698989868164, "global_step": 95462, "epoch": 1150} {"train_loss": -21.421693801879883, "global_step": 95463, "epoch": 1150} {"train_loss": -21.12921142578125, "global_step": 95464, "epoch": 1150} {"train_loss": -21.58515739440918, "global_step": 95465, "epoch": 1150} {"train_loss": -21.648983001708984, "global_step": 95466, "epoch": 1150} {"train_loss": -21.577165603637695, "global_step": 95467, "epoch": 1150} {"train_loss": -21.510637283325195, "global_step": 95468, "epoch": 1150} {"train_loss": -21.64809226989746, "global_step": 95469, "epoch": 1150} {"train_loss": -21.67780876159668, "global_step": 95470, "epoch": 1150} {"train_loss": -21.386474609375, "global_step": 95471, "epoch": 1150} {"train_loss": -21.680130004882812, "global_step": 95472, "epoch": 1150} {"train_loss": -21.096174240112305, "global_step": 95473, "epoch": 1150} {"train_loss": -21.89702033996582, "global_step": 95474, "epoch": 1150} {"train_loss": -21.705204010009766, "global_step": 95475, "epoch": 1150} {"train_loss": -21.18107032775879, "global_step": 95476, "epoch": 1150} {"train_loss": -21.821096420288086, "global_step": 95477, "epoch": 1150} {"train_loss": -21.84556770324707, "global_step": 95478, "epoch": 1150} {"train_loss": -21.94108772277832, "global_step": 95479, "epoch": 1150} {"train_loss": -21.619462966918945, "global_step": 95480, "epoch": 1150} {"train_loss": -21.842575073242188, "global_step": 95481, "epoch": 1150} {"train_loss": -21.71339988708496, "global_step": 95482, "epoch": 1150} {"train_loss": -21.760889053344727, "global_step": 95483, "epoch": 1150} {"train_loss": -21.91594696044922, "global_step": 95484, "epoch": 1150} {"train_loss": -21.99227523803711, "global_step": 95485, "epoch": 1150} {"train_loss": -21.403913497924805, "global_step": 95486, "epoch": 1150} {"train_loss": -21.85888671875, "global_step": 95487, "epoch": 1150} {"train_loss": -21.68524742126465, "global_step": 95488, "epoch": 1150} {"train_loss": -21.769195556640625, "global_step": 95489, "epoch": 1150} {"train_loss": -21.712411880493164, "global_step": 95490, "epoch": 1150} {"train_loss": -22.029891967773438, "global_step": 95491, "epoch": 1150} {"train_loss": -21.442922592163086, "global_step": 95492, "epoch": 1150} {"train_loss": -22.2541561126709, "global_step": 95493, "epoch": 1150} {"train_loss": -21.8198184967041, "global_step": 95494, "epoch": 1150} {"train_loss": -21.80165672302246, "global_step": 95495, "epoch": 1150} {"train_loss": -21.318927764892578, "global_step": 95496, "epoch": 1150} {"train_loss": -21.99705696105957, "global_step": 95497, "epoch": 1150} {"train_loss": -21.455434799194336, "global_step": 95498, "epoch": 1150} {"train_loss": -21.956195831298828, "global_step": 95499, "epoch": 1150} {"train_loss": -21.630126953125, "global_step": 95500, "epoch": 1150} {"train_loss": -21.81797981262207, "global_step": 95501, "epoch": 1150} {"train_loss": -22.028911590576172, "global_step": 95502, "epoch": 1150} {"train_loss": -21.66470718383789, "global_step": 95503, "epoch": 1150} {"train_loss": -21.851531982421875, "global_step": 95504, "epoch": 1150} {"train_loss": -21.556068420410156, "global_step": 95505, "epoch": 1150} {"train_loss": -21.74005126953125, "global_step": 95506, "epoch": 1150} {"train_loss": -21.48390769958496, "global_step": 95507, "epoch": 1150} {"train_loss": -21.90194320678711, "global_step": 95508, "epoch": 1150} {"train_loss": -22.04117774963379, "global_step": 95509, "epoch": 1150} {"train_loss": -21.903396606445312, "global_step": 95510, "epoch": 1150} {"train_loss": -21.433441162109375, "global_step": 95511, "epoch": 1150} {"train_loss": -21.924697875976562, "global_step": 95512, "epoch": 1150} {"train_loss": -21.97490882873535, "global_step": 95513, "epoch": 1150} {"train_loss": -21.670364379882812, "global_step": 95514, "epoch": 1150} {"train_loss": -21.87122917175293, "global_step": 95515, "epoch": 1150} {"train_loss": -21.550607681274414, "global_step": 95516, "epoch": 1150} {"train_loss": -21.928720474243164, "global_step": 95517, "epoch": 1150} {"train_loss": -21.991601943969727, "global_step": 95518, "epoch": 1150} {"train_loss": -21.5156192779541, "global_step": 95519, "epoch": 1150} {"train_loss": -21.68292808532715, "global_step": 95520, "epoch": 1150} {"train_loss": -21.837820053100586, "global_step": 95521, "epoch": 1150} {"train_loss": -22.28057861328125, "global_step": 95522, "epoch": 1150} {"train_loss": -21.65280532836914, "global_step": 95523, "epoch": 1150} {"train_loss": -22.1463680267334, "global_step": 95524, "epoch": 1150} {"train_loss": -21.773330688476562, "global_step": 95525, "epoch": 1150} {"train_loss": -21.94185447692871, "global_step": 95526, "epoch": 1150} {"train_loss": -21.797435760498047, "global_step": 95527, "epoch": 1150} {"train_loss": -22.02866554260254, "global_step": 95528, "epoch": 1150} {"train_loss": -22.12862205505371, "global_step": 95529, "epoch": 1150} {"train_loss": -21.9100341796875, "global_step": 95530, "epoch": 1150} {"train_loss": -21.817901611328125, "global_step": 95531, "epoch": 1150} {"train_loss": -21.69295092663133, "global_step": 95532, "epoch": 1150, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6003769.0} {"train_loss": -21.932130813598633, "global_step": 95533, "epoch": 1151} {"train_loss": -21.69419288635254, "global_step": 95534, "epoch": 1151} {"train_loss": -21.886133193969727, "global_step": 95535, "epoch": 1151} {"train_loss": -21.665237426757812, "global_step": 95536, "epoch": 1151} {"train_loss": -22.014774322509766, "global_step": 95537, "epoch": 1151} {"train_loss": -21.649017333984375, "global_step": 95538, "epoch": 1151} {"train_loss": -21.9112606048584, "global_step": 95539, "epoch": 1151} {"train_loss": -21.8443660736084, "global_step": 95540, "epoch": 1151} {"train_loss": -21.759002685546875, "global_step": 95541, "epoch": 1151} {"train_loss": -21.569547653198242, "global_step": 95542, "epoch": 1151} {"train_loss": -21.786319732666016, "global_step": 95543, "epoch": 1151} {"train_loss": -21.957427978515625, "global_step": 95544, "epoch": 1151} {"train_loss": -21.485698699951172, "global_step": 95545, "epoch": 1151} {"train_loss": -21.446813583374023, "global_step": 95546, "epoch": 1151} {"train_loss": -21.66278648376465, "global_step": 95547, "epoch": 1151} {"train_loss": -22.129899978637695, "global_step": 95548, "epoch": 1151} {"train_loss": -21.718942642211914, "global_step": 95549, "epoch": 1151} {"train_loss": -21.640565872192383, "global_step": 95550, "epoch": 1151} {"train_loss": -22.261920928955078, "global_step": 95551, "epoch": 1151} {"train_loss": -21.611770629882812, "global_step": 95552, "epoch": 1151} {"train_loss": -21.9773006439209, "global_step": 95553, "epoch": 1151} {"train_loss": -21.833566665649414, "global_step": 95554, "epoch": 1151} {"train_loss": -21.402347564697266, "global_step": 95555, "epoch": 1151} {"train_loss": -21.67100715637207, "global_step": 95556, "epoch": 1151} {"train_loss": -22.035490036010742, "global_step": 95557, "epoch": 1151} {"train_loss": -21.68281364440918, "global_step": 95558, "epoch": 1151} {"train_loss": -21.497756958007812, "global_step": 95559, "epoch": 1151} {"train_loss": -21.511154174804688, "global_step": 95560, "epoch": 1151} {"train_loss": -21.199308395385742, "global_step": 95561, "epoch": 1151} {"train_loss": -21.580615997314453, "global_step": 95562, "epoch": 1151} {"train_loss": -21.969480514526367, "global_step": 95563, "epoch": 1151} {"train_loss": -21.990446090698242, "global_step": 95564, "epoch": 1151} {"train_loss": -22.06662940979004, "global_step": 95565, "epoch": 1151} {"train_loss": -21.974916458129883, "global_step": 95566, "epoch": 1151} {"train_loss": -21.766759872436523, "global_step": 95567, "epoch": 1151} {"train_loss": -22.207937240600586, "global_step": 95568, "epoch": 1151} {"train_loss": -21.93086051940918, "global_step": 95569, "epoch": 1151} {"train_loss": -21.994218826293945, "global_step": 95570, "epoch": 1151} {"train_loss": -22.03212547302246, "global_step": 95571, "epoch": 1151} {"train_loss": -21.668241500854492, "global_step": 95572, "epoch": 1151} {"train_loss": -21.70254135131836, "global_step": 95573, "epoch": 1151} {"train_loss": -22.022647857666016, "global_step": 95574, "epoch": 1151} {"train_loss": -21.922948837280273, "global_step": 95575, "epoch": 1151} {"train_loss": -21.774404525756836, "global_step": 95576, "epoch": 1151} {"train_loss": -21.88471794128418, "global_step": 95577, "epoch": 1151} {"train_loss": -21.911352157592773, "global_step": 95578, "epoch": 1151} {"train_loss": -21.743864059448242, "global_step": 95579, "epoch": 1151} {"train_loss": -21.842863082885742, "global_step": 95580, "epoch": 1151} {"train_loss": -21.972265243530273, "global_step": 95581, "epoch": 1151} {"train_loss": -21.522905349731445, "global_step": 95582, "epoch": 1151} {"train_loss": -21.809839248657227, "global_step": 95583, "epoch": 1151} {"train_loss": -21.869739532470703, "global_step": 95584, "epoch": 1151} {"train_loss": -21.77644157409668, "global_step": 95585, "epoch": 1151} {"train_loss": -21.89432144165039, "global_step": 95586, "epoch": 1151} {"train_loss": -21.85503387451172, "global_step": 95587, "epoch": 1151} {"train_loss": -22.167997360229492, "global_step": 95588, "epoch": 1151} {"train_loss": -22.006397247314453, "global_step": 95589, "epoch": 1151} {"train_loss": -22.16901969909668, "global_step": 95590, "epoch": 1151} {"train_loss": -21.71803092956543, "global_step": 95591, "epoch": 1151} {"train_loss": -22.155033111572266, "global_step": 95592, "epoch": 1151} {"train_loss": -22.01764488220215, "global_step": 95593, "epoch": 1151} {"train_loss": -21.717199325561523, "global_step": 95594, "epoch": 1151} {"train_loss": -22.059110641479492, "global_step": 95595, "epoch": 1151} {"train_loss": -21.587980270385742, "global_step": 95596, "epoch": 1151} {"train_loss": -21.66570281982422, "global_step": 95597, "epoch": 1151} {"train_loss": -21.486572265625, "global_step": 95598, "epoch": 1151} {"train_loss": -21.769229888916016, "global_step": 95599, "epoch": 1151} {"train_loss": -21.628957748413086, "global_step": 95600, "epoch": 1151} {"train_loss": -21.791757583618164, "global_step": 95601, "epoch": 1151} {"train_loss": -21.72646141052246, "global_step": 95602, "epoch": 1151} {"train_loss": -21.594532012939453, "global_step": 95603, "epoch": 1151} {"train_loss": -22.15607261657715, "global_step": 95604, "epoch": 1151} {"train_loss": -22.02992057800293, "global_step": 95605, "epoch": 1151} {"train_loss": -21.72433090209961, "global_step": 95606, "epoch": 1151} {"train_loss": -21.651094436645508, "global_step": 95607, "epoch": 1151} {"train_loss": -21.773351669311523, "global_step": 95608, "epoch": 1151} {"train_loss": -21.927865982055664, "global_step": 95609, "epoch": 1151} {"train_loss": -21.823068618774414, "global_step": 95610, "epoch": 1151} {"train_loss": -22.167102813720703, "global_step": 95611, "epoch": 1151} {"train_loss": -21.592792510986328, "global_step": 95612, "epoch": 1151} {"train_loss": -21.65595054626465, "global_step": 95613, "epoch": 1151} {"train_loss": -21.665958404541016, "global_step": 95614, "epoch": 1151} {"train_loss": -21.80945706654744, "global_step": 95615, "epoch": 1151, "val_loss": 6161602.5} {"train_loss": -21.77429962158203, "global_step": 95616, "epoch": 1152} {"train_loss": -22.0275936126709, "global_step": 95617, "epoch": 1152} {"train_loss": -21.286611557006836, "global_step": 95618, "epoch": 1152} {"train_loss": -21.485727310180664, "global_step": 95619, "epoch": 1152} {"train_loss": -21.88143539428711, "global_step": 95620, "epoch": 1152} {"train_loss": -21.46759033203125, "global_step": 95621, "epoch": 1152} {"train_loss": -21.79779052734375, "global_step": 95622, "epoch": 1152} {"train_loss": -21.601802825927734, "global_step": 95623, "epoch": 1152} {"train_loss": -21.73285484313965, "global_step": 95624, "epoch": 1152} {"train_loss": -21.63735008239746, "global_step": 95625, "epoch": 1152} {"train_loss": -21.823339462280273, "global_step": 95626, "epoch": 1152} {"train_loss": -22.160724639892578, "global_step": 95627, "epoch": 1152} {"train_loss": -21.844144821166992, "global_step": 95628, "epoch": 1152} {"train_loss": -21.717458724975586, "global_step": 95629, "epoch": 1152} {"train_loss": -21.707063674926758, "global_step": 95630, "epoch": 1152} {"train_loss": -21.88150978088379, "global_step": 95631, "epoch": 1152} {"train_loss": -21.610517501831055, "global_step": 95632, "epoch": 1152} {"train_loss": -21.93134307861328, "global_step": 95633, "epoch": 1152} {"train_loss": -21.960189819335938, "global_step": 95634, "epoch": 1152} {"train_loss": -21.45355796813965, "global_step": 95635, "epoch": 1152} {"train_loss": -21.700660705566406, "global_step": 95636, "epoch": 1152} {"train_loss": -21.465824127197266, "global_step": 95637, "epoch": 1152} {"train_loss": -21.734098434448242, "global_step": 95638, "epoch": 1152} {"train_loss": -21.813703536987305, "global_step": 95639, "epoch": 1152} {"train_loss": -21.832509994506836, "global_step": 95640, "epoch": 1152} {"train_loss": -21.649911880493164, "global_step": 95641, "epoch": 1152} {"train_loss": -21.900501251220703, "global_step": 95642, "epoch": 1152} {"train_loss": -21.9924373626709, "global_step": 95643, "epoch": 1152} {"train_loss": -21.619604110717773, "global_step": 95644, "epoch": 1152} {"train_loss": -22.00589370727539, "global_step": 95645, "epoch": 1152} {"train_loss": -21.893936157226562, "global_step": 95646, "epoch": 1152} {"train_loss": -21.213415145874023, "global_step": 95647, "epoch": 1152} {"train_loss": -21.974977493286133, "global_step": 95648, "epoch": 1152} {"train_loss": -21.38449478149414, "global_step": 95649, "epoch": 1152} {"train_loss": -21.683582305908203, "global_step": 95650, "epoch": 1152} {"train_loss": -21.92597770690918, "global_step": 95651, "epoch": 1152} {"train_loss": -21.643583297729492, "global_step": 95652, "epoch": 1152} {"train_loss": -21.986509323120117, "global_step": 95653, "epoch": 1152} {"train_loss": -21.54239273071289, "global_step": 95654, "epoch": 1152} {"train_loss": -21.75339126586914, "global_step": 95655, "epoch": 1152} {"train_loss": -21.707006454467773, "global_step": 95656, "epoch": 1152} {"train_loss": -21.523670196533203, "global_step": 95657, "epoch": 1152} {"train_loss": -21.490915298461914, "global_step": 95658, "epoch": 1152} {"train_loss": -21.827672958374023, "global_step": 95659, "epoch": 1152} {"train_loss": -21.878089904785156, "global_step": 95660, "epoch": 1152} {"train_loss": -21.98072624206543, "global_step": 95661, "epoch": 1152} {"train_loss": -21.7440242767334, "global_step": 95662, "epoch": 1152} {"train_loss": -22.179706573486328, "global_step": 95663, "epoch": 1152} {"train_loss": -21.553909301757812, "global_step": 95664, "epoch": 1152} {"train_loss": -21.8336238861084, "global_step": 95665, "epoch": 1152} {"train_loss": -22.019804000854492, "global_step": 95666, "epoch": 1152} {"train_loss": -21.859594345092773, "global_step": 95667, "epoch": 1152} {"train_loss": -21.926965713500977, "global_step": 95668, "epoch": 1152} {"train_loss": -21.75599479675293, "global_step": 95669, "epoch": 1152} {"train_loss": -21.77928352355957, "global_step": 95670, "epoch": 1152} {"train_loss": -21.677001953125, "global_step": 95671, "epoch": 1152} {"train_loss": -21.463363647460938, "global_step": 95672, "epoch": 1152} {"train_loss": -21.899444580078125, "global_step": 95673, "epoch": 1152} {"train_loss": -21.558334350585938, "global_step": 95674, "epoch": 1152} {"train_loss": -21.544986724853516, "global_step": 95675, "epoch": 1152} {"train_loss": -21.940401077270508, "global_step": 95676, "epoch": 1152} {"train_loss": -21.874784469604492, "global_step": 95677, "epoch": 1152} {"train_loss": -22.17278289794922, "global_step": 95678, "epoch": 1152} {"train_loss": -21.711231231689453, "global_step": 95679, "epoch": 1152} {"train_loss": -21.654081344604492, "global_step": 95680, "epoch": 1152} {"train_loss": -21.820486068725586, "global_step": 95681, "epoch": 1152} {"train_loss": -21.815221786499023, "global_step": 95682, "epoch": 1152} {"train_loss": -21.808317184448242, "global_step": 95683, "epoch": 1152} {"train_loss": -22.038742065429688, "global_step": 95684, "epoch": 1152} {"train_loss": -21.743112564086914, "global_step": 95685, "epoch": 1152} {"train_loss": -22.039777755737305, "global_step": 95686, "epoch": 1152} {"train_loss": -21.61260986328125, "global_step": 95687, "epoch": 1152} {"train_loss": -22.228086471557617, "global_step": 95688, "epoch": 1152} {"train_loss": -21.6304931640625, "global_step": 95689, "epoch": 1152} {"train_loss": -21.627099990844727, "global_step": 95690, "epoch": 1152} {"train_loss": -21.83638572692871, "global_step": 95691, "epoch": 1152} {"train_loss": -21.436504364013672, "global_step": 95692, "epoch": 1152} {"train_loss": -21.911155700683594, "global_step": 95693, "epoch": 1152} {"train_loss": -21.9606876373291, "global_step": 95694, "epoch": 1152} {"train_loss": -21.7686710357666, "global_step": 95695, "epoch": 1152} {"train_loss": -21.81233024597168, "global_step": 95696, "epoch": 1152} {"train_loss": -21.800338745117188, "global_step": 95697, "epoch": 1152} {"train_loss": -21.756906118737646, "global_step": 95698, "epoch": 1152, "val_loss": 6173016.0} {"train_loss": -21.775583267211914, "global_step": 95699, "epoch": 1153} {"train_loss": -21.223440170288086, "global_step": 95700, "epoch": 1153} {"train_loss": -21.374658584594727, "global_step": 95701, "epoch": 1153} {"train_loss": -21.617307662963867, "global_step": 95702, "epoch": 1153} {"train_loss": -21.2471981048584, "global_step": 95703, "epoch": 1153} {"train_loss": -21.07830238342285, "global_step": 95704, "epoch": 1153} {"train_loss": -21.12687110900879, "global_step": 95705, "epoch": 1153} {"train_loss": -21.13935661315918, "global_step": 95706, "epoch": 1153} {"train_loss": -21.008275985717773, "global_step": 95707, "epoch": 1153} {"train_loss": -21.44154930114746, "global_step": 95708, "epoch": 1153} {"train_loss": -21.570341110229492, "global_step": 95709, "epoch": 1153} {"train_loss": -21.423696517944336, "global_step": 95710, "epoch": 1153} {"train_loss": -21.886444091796875, "global_step": 95711, "epoch": 1153} {"train_loss": -21.450605392456055, "global_step": 95712, "epoch": 1153} {"train_loss": -21.74151611328125, "global_step": 95713, "epoch": 1153} {"train_loss": -21.494478225708008, "global_step": 95714, "epoch": 1153} {"train_loss": -21.7875919342041, "global_step": 95715, "epoch": 1153} {"train_loss": -21.758934020996094, "global_step": 95716, "epoch": 1153} {"train_loss": -21.70585823059082, "global_step": 95717, "epoch": 1153} {"train_loss": -21.719449996948242, "global_step": 95718, "epoch": 1153} {"train_loss": -21.9598445892334, "global_step": 95719, "epoch": 1153} {"train_loss": -21.632917404174805, "global_step": 95720, "epoch": 1153} {"train_loss": -21.99924087524414, "global_step": 95721, "epoch": 1153} {"train_loss": -21.87689781188965, "global_step": 95722, "epoch": 1153} {"train_loss": -21.904159545898438, "global_step": 95723, "epoch": 1153} {"train_loss": -21.911684036254883, "global_step": 95724, "epoch": 1153} {"train_loss": -21.675954818725586, "global_step": 95725, "epoch": 1153} {"train_loss": -22.13591957092285, "global_step": 95726, "epoch": 1153} {"train_loss": -22.026975631713867, "global_step": 95727, "epoch": 1153} {"train_loss": -21.475866317749023, "global_step": 95728, "epoch": 1153} {"train_loss": -21.970972061157227, "global_step": 95729, "epoch": 1153} {"train_loss": -21.612937927246094, "global_step": 95730, "epoch": 1153} {"train_loss": -21.741254806518555, "global_step": 95731, "epoch": 1153} {"train_loss": -22.03148651123047, "global_step": 95732, "epoch": 1153} {"train_loss": -21.882740020751953, "global_step": 95733, "epoch": 1153} {"train_loss": -22.08509635925293, "global_step": 95734, "epoch": 1153} {"train_loss": -22.0794734954834, "global_step": 95735, "epoch": 1153} {"train_loss": -22.007665634155273, "global_step": 95736, "epoch": 1153} {"train_loss": -21.97377586364746, "global_step": 95737, "epoch": 1153} {"train_loss": -21.4306697845459, "global_step": 95738, "epoch": 1153} {"train_loss": -21.955976486206055, "global_step": 95739, "epoch": 1153} {"train_loss": -21.997182846069336, "global_step": 95740, "epoch": 1153} {"train_loss": -21.557254791259766, "global_step": 95741, "epoch": 1153} {"train_loss": -22.012147903442383, "global_step": 95742, "epoch": 1153} {"train_loss": -21.578445434570312, "global_step": 95743, "epoch": 1153} {"train_loss": -21.85854721069336, "global_step": 95744, "epoch": 1153} {"train_loss": -21.765989303588867, "global_step": 95745, "epoch": 1153} {"train_loss": -22.205928802490234, "global_step": 95746, "epoch": 1153} {"train_loss": -22.13919448852539, "global_step": 95747, "epoch": 1153} {"train_loss": -21.692949295043945, "global_step": 95748, "epoch": 1153} {"train_loss": -22.16292381286621, "global_step": 95749, "epoch": 1153} {"train_loss": -21.930992126464844, "global_step": 95750, "epoch": 1153} {"train_loss": -21.908628463745117, "global_step": 95751, "epoch": 1153} {"train_loss": -21.900089263916016, "global_step": 95752, "epoch": 1153} {"train_loss": -21.755878448486328, "global_step": 95753, "epoch": 1153} {"train_loss": -21.933691024780273, "global_step": 95754, "epoch": 1153} {"train_loss": -21.880163192749023, "global_step": 95755, "epoch": 1153} {"train_loss": -21.51891326904297, "global_step": 95756, "epoch": 1153} {"train_loss": -21.8313045501709, "global_step": 95757, "epoch": 1153} {"train_loss": -22.26036834716797, "global_step": 95758, "epoch": 1153} {"train_loss": -21.83145523071289, "global_step": 95759, "epoch": 1153} {"train_loss": -21.75288963317871, "global_step": 95760, "epoch": 1153} {"train_loss": -21.40195083618164, "global_step": 95761, "epoch": 1153} {"train_loss": -21.8006534576416, "global_step": 95762, "epoch": 1153} {"train_loss": -21.78126335144043, "global_step": 95763, "epoch": 1153} {"train_loss": -21.6547794342041, "global_step": 95764, "epoch": 1153} {"train_loss": -21.71406364440918, "global_step": 95765, "epoch": 1153} {"train_loss": -21.548192977905273, "global_step": 95766, "epoch": 1153} {"train_loss": -21.60474395751953, "global_step": 95767, "epoch": 1153} {"train_loss": -21.937393188476562, "global_step": 95768, "epoch": 1153} {"train_loss": -21.6687068939209, "global_step": 95769, "epoch": 1153} {"train_loss": -22.004409790039062, "global_step": 95770, "epoch": 1153} {"train_loss": -21.571308135986328, "global_step": 95771, "epoch": 1153} {"train_loss": -21.76230812072754, "global_step": 95772, "epoch": 1153} {"train_loss": -21.73866844177246, "global_step": 95773, "epoch": 1153} {"train_loss": -21.45337677001953, "global_step": 95774, "epoch": 1153} {"train_loss": -21.950851440429688, "global_step": 95775, "epoch": 1153} {"train_loss": -21.539915084838867, "global_step": 95776, "epoch": 1153} {"train_loss": -21.99921989440918, "global_step": 95777, "epoch": 1153} {"train_loss": -21.9058895111084, "global_step": 95778, "epoch": 1153} {"train_loss": -21.722095489501953, "global_step": 95779, "epoch": 1153} {"train_loss": -21.562074661254883, "global_step": 95780, "epoch": 1153} {"train_loss": -21.76946791683335, "global_step": 95781, "epoch": 1153, "val_loss": 6137041.0} {"train_loss": -20.933393478393555, "global_step": 95782, "epoch": 1154} {"train_loss": -20.413673400878906, "global_step": 95783, "epoch": 1154} {"train_loss": -21.98029136657715, "global_step": 95784, "epoch": 1154} {"train_loss": -20.786855697631836, "global_step": 95785, "epoch": 1154} {"train_loss": -20.8143310546875, "global_step": 95786, "epoch": 1154} {"train_loss": -21.732248306274414, "global_step": 95787, "epoch": 1154} {"train_loss": -21.17543601989746, "global_step": 95788, "epoch": 1154} {"train_loss": -21.33025550842285, "global_step": 95789, "epoch": 1154} {"train_loss": -21.38346290588379, "global_step": 95790, "epoch": 1154} {"train_loss": -20.959482192993164, "global_step": 95791, "epoch": 1154} {"train_loss": -21.1320858001709, "global_step": 95792, "epoch": 1154} {"train_loss": -21.138540267944336, "global_step": 95793, "epoch": 1154} {"train_loss": -21.684446334838867, "global_step": 95794, "epoch": 1154} {"train_loss": -21.28727149963379, "global_step": 95795, "epoch": 1154} {"train_loss": -21.518798828125, "global_step": 95796, "epoch": 1154} {"train_loss": -21.401580810546875, "global_step": 95797, "epoch": 1154} {"train_loss": -21.80491828918457, "global_step": 95798, "epoch": 1154} {"train_loss": -21.61823081970215, "global_step": 95799, "epoch": 1154} {"train_loss": -21.48465347290039, "global_step": 95800, "epoch": 1154} {"train_loss": -21.817039489746094, "global_step": 95801, "epoch": 1154} {"train_loss": -21.638446807861328, "global_step": 95802, "epoch": 1154} {"train_loss": -21.38238525390625, "global_step": 95803, "epoch": 1154} {"train_loss": -21.499488830566406, "global_step": 95804, "epoch": 1154} {"train_loss": -21.821842193603516, "global_step": 95805, "epoch": 1154} {"train_loss": -21.677642822265625, "global_step": 95806, "epoch": 1154} {"train_loss": -21.676828384399414, "global_step": 95807, "epoch": 1154} {"train_loss": -21.9107723236084, "global_step": 95808, "epoch": 1154} {"train_loss": -21.967613220214844, "global_step": 95809, "epoch": 1154} {"train_loss": -21.557241439819336, "global_step": 95810, "epoch": 1154} {"train_loss": -21.85959243774414, "global_step": 95811, "epoch": 1154} {"train_loss": -21.727218627929688, "global_step": 95812, "epoch": 1154} {"train_loss": -21.868024826049805, "global_step": 95813, "epoch": 1154} {"train_loss": -22.024932861328125, "global_step": 95814, "epoch": 1154} {"train_loss": -21.550216674804688, "global_step": 95815, "epoch": 1154} {"train_loss": -21.979726791381836, "global_step": 95816, "epoch": 1154} {"train_loss": -21.63984489440918, "global_step": 95817, "epoch": 1154} {"train_loss": -21.729520797729492, "global_step": 95818, "epoch": 1154} {"train_loss": -22.044452667236328, "global_step": 95819, "epoch": 1154} {"train_loss": -21.833526611328125, "global_step": 95820, "epoch": 1154} {"train_loss": -21.592008590698242, "global_step": 95821, "epoch": 1154} {"train_loss": -21.574861526489258, "global_step": 95822, "epoch": 1154} {"train_loss": -21.847532272338867, "global_step": 95823, "epoch": 1154} {"train_loss": -22.105443954467773, "global_step": 95824, "epoch": 1154} {"train_loss": -22.050331115722656, "global_step": 95825, "epoch": 1154} {"train_loss": -21.505783081054688, "global_step": 95826, "epoch": 1154} {"train_loss": -22.07071304321289, "global_step": 95827, "epoch": 1154} {"train_loss": -21.533048629760742, "global_step": 95828, "epoch": 1154} {"train_loss": -22.19996452331543, "global_step": 95829, "epoch": 1154} {"train_loss": -21.795591354370117, "global_step": 95830, "epoch": 1154} {"train_loss": -22.17595100402832, "global_step": 95831, "epoch": 1154} {"train_loss": -21.608375549316406, "global_step": 95832, "epoch": 1154} {"train_loss": -21.8486385345459, "global_step": 95833, "epoch": 1154} {"train_loss": -21.72698211669922, "global_step": 95834, "epoch": 1154} {"train_loss": -22.076974868774414, "global_step": 95835, "epoch": 1154} {"train_loss": -22.182437896728516, "global_step": 95836, "epoch": 1154} {"train_loss": -21.61075210571289, "global_step": 95837, "epoch": 1154} {"train_loss": -22.009235382080078, "global_step": 95838, "epoch": 1154} {"train_loss": -21.99800682067871, "global_step": 95839, "epoch": 1154} {"train_loss": -21.74611473083496, "global_step": 95840, "epoch": 1154} {"train_loss": -22.054485321044922, "global_step": 95841, "epoch": 1154} {"train_loss": -21.704364776611328, "global_step": 95842, "epoch": 1154} {"train_loss": -22.0548152923584, "global_step": 95843, "epoch": 1154} {"train_loss": -21.720754623413086, "global_step": 95844, "epoch": 1154} {"train_loss": -21.977413177490234, "global_step": 95845, "epoch": 1154} {"train_loss": -21.64255142211914, "global_step": 95846, "epoch": 1154} {"train_loss": -21.6595401763916, "global_step": 95847, "epoch": 1154} {"train_loss": -21.907339096069336, "global_step": 95848, "epoch": 1154} {"train_loss": -21.9990291595459, "global_step": 95849, "epoch": 1154} {"train_loss": -21.630870819091797, "global_step": 95850, "epoch": 1154} {"train_loss": -21.98551368713379, "global_step": 95851, "epoch": 1154} {"train_loss": -21.656631469726562, "global_step": 95852, "epoch": 1154} {"train_loss": -22.056615829467773, "global_step": 95853, "epoch": 1154} {"train_loss": -22.13678550720215, "global_step": 95854, "epoch": 1154} {"train_loss": -21.76773452758789, "global_step": 95855, "epoch": 1154} {"train_loss": -21.135339736938477, "global_step": 95856, "epoch": 1154} {"train_loss": -21.436445236206055, "global_step": 95857, "epoch": 1154} {"train_loss": -21.833871841430664, "global_step": 95858, "epoch": 1154} {"train_loss": -21.560789108276367, "global_step": 95859, "epoch": 1154} {"train_loss": -21.99214744567871, "global_step": 95860, "epoch": 1154} {"train_loss": -21.56197166442871, "global_step": 95861, "epoch": 1154} {"train_loss": -21.860801696777344, "global_step": 95862, "epoch": 1154} {"train_loss": -21.886926651000977, "global_step": 95863, "epoch": 1154} {"train_loss": -21.686584495636353, "global_step": 95864, "epoch": 1154, "val_loss": 6158777.0} {"train_loss": -21.217113494873047, "global_step": 95865, "epoch": 1155} {"train_loss": -21.52665138244629, "global_step": 95866, "epoch": 1155} {"train_loss": -21.442569732666016, "global_step": 95867, "epoch": 1155} {"train_loss": -21.51263999938965, "global_step": 95868, "epoch": 1155} {"train_loss": -21.494874954223633, "global_step": 95869, "epoch": 1155} {"train_loss": -21.67638397216797, "global_step": 95870, "epoch": 1155} {"train_loss": -21.46626853942871, "global_step": 95871, "epoch": 1155} {"train_loss": -21.585973739624023, "global_step": 95872, "epoch": 1155} {"train_loss": -21.435510635375977, "global_step": 95873, "epoch": 1155} {"train_loss": -21.645376205444336, "global_step": 95874, "epoch": 1155} {"train_loss": -21.86493492126465, "global_step": 95875, "epoch": 1155} {"train_loss": -21.840614318847656, "global_step": 95876, "epoch": 1155} {"train_loss": -21.647598266601562, "global_step": 95877, "epoch": 1155} {"train_loss": -21.208112716674805, "global_step": 95878, "epoch": 1155} {"train_loss": -21.835824966430664, "global_step": 95879, "epoch": 1155} {"train_loss": -21.9190731048584, "global_step": 95880, "epoch": 1155} {"train_loss": -21.19874382019043, "global_step": 95881, "epoch": 1155} {"train_loss": -21.6916561126709, "global_step": 95882, "epoch": 1155} {"train_loss": -21.71817398071289, "global_step": 95883, "epoch": 1155} {"train_loss": -21.702722549438477, "global_step": 95884, "epoch": 1155} {"train_loss": -21.985082626342773, "global_step": 95885, "epoch": 1155} {"train_loss": -22.02544593811035, "global_step": 95886, "epoch": 1155} {"train_loss": -21.603870391845703, "global_step": 95887, "epoch": 1155} {"train_loss": -22.00030517578125, "global_step": 95888, "epoch": 1155} {"train_loss": -21.86998748779297, "global_step": 95889, "epoch": 1155} {"train_loss": -21.54096794128418, "global_step": 95890, "epoch": 1155} {"train_loss": -21.73550796508789, "global_step": 95891, "epoch": 1155} {"train_loss": -21.97734260559082, "global_step": 95892, "epoch": 1155} {"train_loss": -21.912702560424805, "global_step": 95893, "epoch": 1155} {"train_loss": -21.704153060913086, "global_step": 95894, "epoch": 1155} {"train_loss": -21.696657180786133, "global_step": 95895, "epoch": 1155} {"train_loss": -21.364036560058594, "global_step": 95896, "epoch": 1155} {"train_loss": -21.961204528808594, "global_step": 95897, "epoch": 1155} {"train_loss": -21.857542037963867, "global_step": 95898, "epoch": 1155} {"train_loss": -21.523725509643555, "global_step": 95899, "epoch": 1155} {"train_loss": -21.656105041503906, "global_step": 95900, "epoch": 1155} {"train_loss": -21.835439682006836, "global_step": 95901, "epoch": 1155} {"train_loss": -21.873550415039062, "global_step": 95902, "epoch": 1155} {"train_loss": -21.947891235351562, "global_step": 95903, "epoch": 1155} {"train_loss": -21.49256706237793, "global_step": 95904, "epoch": 1155} {"train_loss": -22.182086944580078, "global_step": 95905, "epoch": 1155} {"train_loss": -21.927677154541016, "global_step": 95906, "epoch": 1155} {"train_loss": -22.072946548461914, "global_step": 95907, "epoch": 1155} {"train_loss": -21.706350326538086, "global_step": 95908, "epoch": 1155} {"train_loss": -21.892385482788086, "global_step": 95909, "epoch": 1155} {"train_loss": -22.13738441467285, "global_step": 95910, "epoch": 1155} {"train_loss": -21.603286743164062, "global_step": 95911, "epoch": 1155} {"train_loss": -21.800378799438477, "global_step": 95912, "epoch": 1155} {"train_loss": -21.54201889038086, "global_step": 95913, "epoch": 1155} {"train_loss": -21.744674682617188, "global_step": 95914, "epoch": 1155} {"train_loss": -22.1735782623291, "global_step": 95915, "epoch": 1155} {"train_loss": -21.782455444335938, "global_step": 95916, "epoch": 1155} {"train_loss": -21.935405731201172, "global_step": 95917, "epoch": 1155} {"train_loss": -21.939685821533203, "global_step": 95918, "epoch": 1155} {"train_loss": -21.44941520690918, "global_step": 95919, "epoch": 1155} {"train_loss": -21.757688522338867, "global_step": 95920, "epoch": 1155} {"train_loss": -21.959062576293945, "global_step": 95921, "epoch": 1155} {"train_loss": -21.70454216003418, "global_step": 95922, "epoch": 1155} {"train_loss": -21.354415893554688, "global_step": 95923, "epoch": 1155} {"train_loss": -21.481016159057617, "global_step": 95924, "epoch": 1155} {"train_loss": -21.859529495239258, "global_step": 95925, "epoch": 1155} {"train_loss": -21.420337677001953, "global_step": 95926, "epoch": 1155} {"train_loss": -21.77695655822754, "global_step": 95927, "epoch": 1155} {"train_loss": -21.515668869018555, "global_step": 95928, "epoch": 1155} {"train_loss": -21.56647300720215, "global_step": 95929, "epoch": 1155} {"train_loss": -21.539348602294922, "global_step": 95930, "epoch": 1155} {"train_loss": -21.7554988861084, "global_step": 95931, "epoch": 1155} {"train_loss": -21.677671432495117, "global_step": 95932, "epoch": 1155} {"train_loss": -21.95832061767578, "global_step": 95933, "epoch": 1155} {"train_loss": -21.408079147338867, "global_step": 95934, "epoch": 1155} {"train_loss": -21.282453536987305, "global_step": 95935, "epoch": 1155} {"train_loss": -21.923280715942383, "global_step": 95936, "epoch": 1155} {"train_loss": -21.352161407470703, "global_step": 95937, "epoch": 1155} {"train_loss": -21.634504318237305, "global_step": 95938, "epoch": 1155} {"train_loss": -21.562641143798828, "global_step": 95939, "epoch": 1155} {"train_loss": -21.64727210998535, "global_step": 95940, "epoch": 1155} {"train_loss": -21.89295768737793, "global_step": 95941, "epoch": 1155} {"train_loss": -21.919906616210938, "global_step": 95942, "epoch": 1155} {"train_loss": -21.797948837280273, "global_step": 95943, "epoch": 1155} {"train_loss": -22.04860496520996, "global_step": 95944, "epoch": 1155} {"train_loss": -21.875883102416992, "global_step": 95945, "epoch": 1155} {"train_loss": -21.558948516845703, "global_step": 95946, "epoch": 1155} {"train_loss": -21.71054732081402, "global_step": 95947, "epoch": 1155, "val_loss": 6166505.0} {"train_loss": -21.12141227722168, "global_step": 95948, "epoch": 1156} {"train_loss": -21.46272087097168, "global_step": 95949, "epoch": 1156} {"train_loss": -21.665746688842773, "global_step": 95950, "epoch": 1156} {"train_loss": -21.355663299560547, "global_step": 95951, "epoch": 1156} {"train_loss": -21.704181671142578, "global_step": 95952, "epoch": 1156} {"train_loss": -21.175657272338867, "global_step": 95953, "epoch": 1156} {"train_loss": -21.63428497314453, "global_step": 95954, "epoch": 1156} {"train_loss": -21.8292236328125, "global_step": 95955, "epoch": 1156} {"train_loss": -21.438922882080078, "global_step": 95956, "epoch": 1156} {"train_loss": -21.966907501220703, "global_step": 95957, "epoch": 1156} {"train_loss": -21.796436309814453, "global_step": 95958, "epoch": 1156} {"train_loss": -21.866559982299805, "global_step": 95959, "epoch": 1156} {"train_loss": -21.63873863220215, "global_step": 95960, "epoch": 1156} {"train_loss": -21.595386505126953, "global_step": 95961, "epoch": 1156} {"train_loss": -21.753753662109375, "global_step": 95962, "epoch": 1156} {"train_loss": -21.774938583374023, "global_step": 95963, "epoch": 1156} {"train_loss": -21.822919845581055, "global_step": 95964, "epoch": 1156} {"train_loss": -21.490907669067383, "global_step": 95965, "epoch": 1156} {"train_loss": -21.693883895874023, "global_step": 95966, "epoch": 1156} {"train_loss": -21.765399932861328, "global_step": 95967, "epoch": 1156} {"train_loss": -21.651065826416016, "global_step": 95968, "epoch": 1156} {"train_loss": -21.862089157104492, "global_step": 95969, "epoch": 1156} {"train_loss": -21.922277450561523, "global_step": 95970, "epoch": 1156} {"train_loss": -21.974308013916016, "global_step": 95971, "epoch": 1156} {"train_loss": -21.775508880615234, "global_step": 95972, "epoch": 1156} {"train_loss": -21.683103561401367, "global_step": 95973, "epoch": 1156} {"train_loss": -22.002920150756836, "global_step": 95974, "epoch": 1156} {"train_loss": -21.691608428955078, "global_step": 95975, "epoch": 1156} {"train_loss": -21.6298828125, "global_step": 95976, "epoch": 1156} {"train_loss": -21.983877182006836, "global_step": 95977, "epoch": 1156} {"train_loss": -21.863571166992188, "global_step": 95978, "epoch": 1156} {"train_loss": -21.459110260009766, "global_step": 95979, "epoch": 1156} {"train_loss": -22.112192153930664, "global_step": 95980, "epoch": 1156} {"train_loss": -21.86578369140625, "global_step": 95981, "epoch": 1156} {"train_loss": -22.01860809326172, "global_step": 95982, "epoch": 1156} {"train_loss": -22.09022331237793, "global_step": 95983, "epoch": 1156} {"train_loss": -21.91921615600586, "global_step": 95984, "epoch": 1156} {"train_loss": -21.57796859741211, "global_step": 95985, "epoch": 1156} {"train_loss": -22.05428123474121, "global_step": 95986, "epoch": 1156} {"train_loss": -21.77618980407715, "global_step": 95987, "epoch": 1156} {"train_loss": -22.098190307617188, "global_step": 95988, "epoch": 1156} {"train_loss": -21.71100425720215, "global_step": 95989, "epoch": 1156} {"train_loss": -21.979515075683594, "global_step": 95990, "epoch": 1156} {"train_loss": -21.852197647094727, "global_step": 95991, "epoch": 1156} {"train_loss": -21.965763092041016, "global_step": 95992, "epoch": 1156} {"train_loss": -22.01039695739746, "global_step": 95993, "epoch": 1156} {"train_loss": -21.903409957885742, "global_step": 95994, "epoch": 1156} {"train_loss": -21.66349220275879, "global_step": 95995, "epoch": 1156} {"train_loss": -21.67583656311035, "global_step": 95996, "epoch": 1156} {"train_loss": -21.653366088867188, "global_step": 95997, "epoch": 1156} {"train_loss": -21.90135955810547, "global_step": 95998, "epoch": 1156} {"train_loss": -21.867393493652344, "global_step": 95999, "epoch": 1156} {"train_loss": -21.429723739624023, "global_step": 96000, "epoch": 1156} {"train_loss": -22.028165817260742, "global_step": 96001, "epoch": 1156} {"train_loss": -21.281814575195312, "global_step": 96002, "epoch": 1156} {"train_loss": -21.849689483642578, "global_step": 96003, "epoch": 1156} {"train_loss": -21.617511749267578, "global_step": 96004, "epoch": 1156} {"train_loss": -21.55748748779297, "global_step": 96005, "epoch": 1156} {"train_loss": -21.539281845092773, "global_step": 96006, "epoch": 1156} {"train_loss": -21.584125518798828, "global_step": 96007, "epoch": 1156} {"train_loss": -21.51264762878418, "global_step": 96008, "epoch": 1156} {"train_loss": -21.923227310180664, "global_step": 96009, "epoch": 1156} {"train_loss": -21.3498477935791, "global_step": 96010, "epoch": 1156} {"train_loss": -21.597448348999023, "global_step": 96011, "epoch": 1156} {"train_loss": -21.79816246032715, "global_step": 96012, "epoch": 1156} {"train_loss": -21.813922882080078, "global_step": 96013, "epoch": 1156} {"train_loss": -21.51478385925293, "global_step": 96014, "epoch": 1156} {"train_loss": -21.643924713134766, "global_step": 96015, "epoch": 1156} {"train_loss": -21.662595748901367, "global_step": 96016, "epoch": 1156} {"train_loss": -21.496273040771484, "global_step": 96017, "epoch": 1156} {"train_loss": -22.009153366088867, "global_step": 96018, "epoch": 1156} {"train_loss": -21.721389770507812, "global_step": 96019, "epoch": 1156} {"train_loss": -21.94923210144043, "global_step": 96020, "epoch": 1156} {"train_loss": -21.603612899780273, "global_step": 96021, "epoch": 1156} {"train_loss": -21.759029388427734, "global_step": 96022, "epoch": 1156} {"train_loss": -21.87529754638672, "global_step": 96023, "epoch": 1156} {"train_loss": -22.06844711303711, "global_step": 96024, "epoch": 1156} {"train_loss": -21.50091552734375, "global_step": 96025, "epoch": 1156} {"train_loss": -21.766895294189453, "global_step": 96026, "epoch": 1156} {"train_loss": -22.34788703918457, "global_step": 96027, "epoch": 1156} {"train_loss": -21.81863784790039, "global_step": 96028, "epoch": 1156} {"train_loss": -21.998260498046875, "global_step": 96029, "epoch": 1156} {"train_loss": -21.743302908288427, "global_step": 96030, "epoch": 1156, "val_loss": 6142521.0} {"train_loss": -21.356595993041992, "global_step": 96031, "epoch": 1157} {"train_loss": -21.561481475830078, "global_step": 96032, "epoch": 1157} {"train_loss": -21.321348190307617, "global_step": 96033, "epoch": 1157} {"train_loss": -21.232755661010742, "global_step": 96034, "epoch": 1157} {"train_loss": -21.48468017578125, "global_step": 96035, "epoch": 1157} {"train_loss": -21.057157516479492, "global_step": 96036, "epoch": 1157} {"train_loss": -21.652538299560547, "global_step": 96037, "epoch": 1157} {"train_loss": -21.762311935424805, "global_step": 96038, "epoch": 1157} {"train_loss": -21.062345504760742, "global_step": 96039, "epoch": 1157} {"train_loss": -21.153366088867188, "global_step": 96040, "epoch": 1157} {"train_loss": -21.488845825195312, "global_step": 96041, "epoch": 1157} {"train_loss": -21.404685974121094, "global_step": 96042, "epoch": 1157} {"train_loss": -21.7565860748291, "global_step": 96043, "epoch": 1157} {"train_loss": -21.600072860717773, "global_step": 96044, "epoch": 1157} {"train_loss": -21.6290283203125, "global_step": 96045, "epoch": 1157} {"train_loss": -21.570600509643555, "global_step": 96046, "epoch": 1157} {"train_loss": -21.453414916992188, "global_step": 96047, "epoch": 1157} {"train_loss": -21.66364097595215, "global_step": 96048, "epoch": 1157} {"train_loss": -21.21712303161621, "global_step": 96049, "epoch": 1157} {"train_loss": -21.696136474609375, "global_step": 96050, "epoch": 1157} {"train_loss": -21.621875762939453, "global_step": 96051, "epoch": 1157} {"train_loss": -21.82171630859375, "global_step": 96052, "epoch": 1157} {"train_loss": -21.990339279174805, "global_step": 96053, "epoch": 1157} {"train_loss": -21.688669204711914, "global_step": 96054, "epoch": 1157} {"train_loss": -21.455663681030273, "global_step": 96055, "epoch": 1157} {"train_loss": -21.782678604125977, "global_step": 96056, "epoch": 1157} {"train_loss": -21.696414947509766, "global_step": 96057, "epoch": 1157} {"train_loss": -21.76352882385254, "global_step": 96058, "epoch": 1157} {"train_loss": -21.6398868560791, "global_step": 96059, "epoch": 1157} {"train_loss": -21.667987823486328, "global_step": 96060, "epoch": 1157} {"train_loss": -21.567378997802734, "global_step": 96061, "epoch": 1157} {"train_loss": -21.826007843017578, "global_step": 96062, "epoch": 1157} {"train_loss": -21.53627586364746, "global_step": 96063, "epoch": 1157} {"train_loss": -21.715805053710938, "global_step": 96064, "epoch": 1157} {"train_loss": -21.85195541381836, "global_step": 96065, "epoch": 1157} {"train_loss": -22.076257705688477, "global_step": 96066, "epoch": 1157} {"train_loss": -21.628759384155273, "global_step": 96067, "epoch": 1157} {"train_loss": -21.86317253112793, "global_step": 96068, "epoch": 1157} {"train_loss": -21.834339141845703, "global_step": 96069, "epoch": 1157} {"train_loss": -21.949939727783203, "global_step": 96070, "epoch": 1157} {"train_loss": -21.752729415893555, "global_step": 96071, "epoch": 1157} {"train_loss": -21.900924682617188, "global_step": 96072, "epoch": 1157} {"train_loss": -21.407838821411133, "global_step": 96073, "epoch": 1157} {"train_loss": -22.073673248291016, "global_step": 96074, "epoch": 1157} {"train_loss": -21.88953399658203, "global_step": 96075, "epoch": 1157} {"train_loss": -21.45708656311035, "global_step": 96076, "epoch": 1157} {"train_loss": -22.06658935546875, "global_step": 96077, "epoch": 1157} {"train_loss": -21.841781616210938, "global_step": 96078, "epoch": 1157} {"train_loss": -21.711225509643555, "global_step": 96079, "epoch": 1157} {"train_loss": -21.741430282592773, "global_step": 96080, "epoch": 1157} {"train_loss": -21.54374122619629, "global_step": 96081, "epoch": 1157} {"train_loss": -21.91766357421875, "global_step": 96082, "epoch": 1157} {"train_loss": -21.859987258911133, "global_step": 96083, "epoch": 1157} {"train_loss": -21.862089157104492, "global_step": 96084, "epoch": 1157} {"train_loss": -21.861961364746094, "global_step": 96085, "epoch": 1157} {"train_loss": -21.80405044555664, "global_step": 96086, "epoch": 1157} {"train_loss": -21.54608154296875, "global_step": 96087, "epoch": 1157} {"train_loss": -21.377870559692383, "global_step": 96088, "epoch": 1157} {"train_loss": -21.919387817382812, "global_step": 96089, "epoch": 1157} {"train_loss": -21.873205184936523, "global_step": 96090, "epoch": 1157} {"train_loss": -21.58927345275879, "global_step": 96091, "epoch": 1157} {"train_loss": -22.00971031188965, "global_step": 96092, "epoch": 1157} {"train_loss": -21.946142196655273, "global_step": 96093, "epoch": 1157} {"train_loss": -21.45509910583496, "global_step": 96094, "epoch": 1157} {"train_loss": -22.079269409179688, "global_step": 96095, "epoch": 1157} {"train_loss": -21.678083419799805, "global_step": 96096, "epoch": 1157} {"train_loss": -22.046354293823242, "global_step": 96097, "epoch": 1157} {"train_loss": -21.763809204101562, "global_step": 96098, "epoch": 1157} {"train_loss": -21.815279006958008, "global_step": 96099, "epoch": 1157} {"train_loss": -21.831850051879883, "global_step": 96100, "epoch": 1157} {"train_loss": -21.808574676513672, "global_step": 96101, "epoch": 1157} {"train_loss": -21.340497970581055, "global_step": 96102, "epoch": 1157} {"train_loss": -22.04974937438965, "global_step": 96103, "epoch": 1157} {"train_loss": -21.771987915039062, "global_step": 96104, "epoch": 1157} {"train_loss": -21.861921310424805, "global_step": 96105, "epoch": 1157} {"train_loss": -21.935922622680664, "global_step": 96106, "epoch": 1157} {"train_loss": -21.346899032592773, "global_step": 96107, "epoch": 1157} {"train_loss": -21.546422958374023, "global_step": 96108, "epoch": 1157} {"train_loss": -21.907251358032227, "global_step": 96109, "epoch": 1157} {"train_loss": -22.03604507446289, "global_step": 96110, "epoch": 1157} {"train_loss": -21.740659713745117, "global_step": 96111, "epoch": 1157} {"train_loss": -22.058313369750977, "global_step": 96112, "epoch": 1157} {"train_loss": -21.690753362264978, "global_step": 96113, "epoch": 1157, "val_loss": 6047883.5} {"train_loss": -21.30251121520996, "global_step": 96114, "epoch": 1158} {"train_loss": -21.31336784362793, "global_step": 96115, "epoch": 1158} {"train_loss": -21.030532836914062, "global_step": 96116, "epoch": 1158} {"train_loss": -21.631057739257812, "global_step": 96117, "epoch": 1158} {"train_loss": -21.157350540161133, "global_step": 96118, "epoch": 1158} {"train_loss": -21.501401901245117, "global_step": 96119, "epoch": 1158} {"train_loss": -21.83091926574707, "global_step": 96120, "epoch": 1158} {"train_loss": -21.755224227905273, "global_step": 96121, "epoch": 1158} {"train_loss": -21.35556983947754, "global_step": 96122, "epoch": 1158} {"train_loss": -22.131574630737305, "global_step": 96123, "epoch": 1158} {"train_loss": -21.732206344604492, "global_step": 96124, "epoch": 1158} {"train_loss": -21.501422882080078, "global_step": 96125, "epoch": 1158} {"train_loss": -21.264760971069336, "global_step": 96126, "epoch": 1158} {"train_loss": -21.520238876342773, "global_step": 96127, "epoch": 1158} {"train_loss": -22.20594596862793, "global_step": 96128, "epoch": 1158} {"train_loss": -21.73065757751465, "global_step": 96129, "epoch": 1158} {"train_loss": -21.599096298217773, "global_step": 96130, "epoch": 1158} {"train_loss": -22.030109405517578, "global_step": 96131, "epoch": 1158} {"train_loss": -21.930490493774414, "global_step": 96132, "epoch": 1158} {"train_loss": -21.905460357666016, "global_step": 96133, "epoch": 1158} {"train_loss": -21.804763793945312, "global_step": 96134, "epoch": 1158} {"train_loss": -22.08265495300293, "global_step": 96135, "epoch": 1158} {"train_loss": -21.70893669128418, "global_step": 96136, "epoch": 1158} {"train_loss": -21.977893829345703, "global_step": 96137, "epoch": 1158} {"train_loss": -21.56711196899414, "global_step": 96138, "epoch": 1158} {"train_loss": -21.450876235961914, "global_step": 96139, "epoch": 1158} {"train_loss": -21.856060028076172, "global_step": 96140, "epoch": 1158} {"train_loss": -21.703102111816406, "global_step": 96141, "epoch": 1158} {"train_loss": -21.547086715698242, "global_step": 96142, "epoch": 1158} {"train_loss": -21.79914665222168, "global_step": 96143, "epoch": 1158} {"train_loss": -21.721363067626953, "global_step": 96144, "epoch": 1158} {"train_loss": -21.818191528320312, "global_step": 96145, "epoch": 1158} {"train_loss": -21.716032028198242, "global_step": 96146, "epoch": 1158} {"train_loss": -21.611671447753906, "global_step": 96147, "epoch": 1158} {"train_loss": -22.133825302124023, "global_step": 96148, "epoch": 1158} {"train_loss": -21.718921661376953, "global_step": 96149, "epoch": 1158} {"train_loss": -21.5408992767334, "global_step": 96150, "epoch": 1158} {"train_loss": -21.691404342651367, "global_step": 96151, "epoch": 1158} {"train_loss": -21.82387351989746, "global_step": 96152, "epoch": 1158} {"train_loss": -21.935253143310547, "global_step": 96153, "epoch": 1158} {"train_loss": -21.540433883666992, "global_step": 96154, "epoch": 1158} {"train_loss": -21.88199234008789, "global_step": 96155, "epoch": 1158} {"train_loss": -21.432897567749023, "global_step": 96156, "epoch": 1158} {"train_loss": -21.381322860717773, "global_step": 96157, "epoch": 1158} {"train_loss": -21.99126625061035, "global_step": 96158, "epoch": 1158} {"train_loss": -21.506092071533203, "global_step": 96159, "epoch": 1158} {"train_loss": -21.840011596679688, "global_step": 96160, "epoch": 1158} {"train_loss": -21.560209274291992, "global_step": 96161, "epoch": 1158} {"train_loss": -21.745113372802734, "global_step": 96162, "epoch": 1158} {"train_loss": -21.511180877685547, "global_step": 96163, "epoch": 1158} {"train_loss": -21.9649658203125, "global_step": 96164, "epoch": 1158} {"train_loss": -21.8365421295166, "global_step": 96165, "epoch": 1158} {"train_loss": -21.776212692260742, "global_step": 96166, "epoch": 1158} {"train_loss": -21.92875862121582, "global_step": 96167, "epoch": 1158} {"train_loss": -21.18912124633789, "global_step": 96168, "epoch": 1158} {"train_loss": -21.900318145751953, "global_step": 96169, "epoch": 1158} {"train_loss": -21.99589729309082, "global_step": 96170, "epoch": 1158} {"train_loss": -21.510540008544922, "global_step": 96171, "epoch": 1158} {"train_loss": -21.873476028442383, "global_step": 96172, "epoch": 1158} {"train_loss": -21.4260196685791, "global_step": 96173, "epoch": 1158} {"train_loss": -21.710264205932617, "global_step": 96174, "epoch": 1158} {"train_loss": -21.85129737854004, "global_step": 96175, "epoch": 1158} {"train_loss": -21.876188278198242, "global_step": 96176, "epoch": 1158} {"train_loss": -22.002212524414062, "global_step": 96177, "epoch": 1158} {"train_loss": -21.23361587524414, "global_step": 96178, "epoch": 1158} {"train_loss": -21.9361629486084, "global_step": 96179, "epoch": 1158} {"train_loss": -21.709165573120117, "global_step": 96180, "epoch": 1158} {"train_loss": -21.701169967651367, "global_step": 96181, "epoch": 1158} {"train_loss": -22.038665771484375, "global_step": 96182, "epoch": 1158} {"train_loss": -21.77117347717285, "global_step": 96183, "epoch": 1158} {"train_loss": -21.7917537689209, "global_step": 96184, "epoch": 1158} {"train_loss": -21.780012130737305, "global_step": 96185, "epoch": 1158} {"train_loss": -21.675729751586914, "global_step": 96186, "epoch": 1158} {"train_loss": -21.82126235961914, "global_step": 96187, "epoch": 1158} {"train_loss": -22.069135665893555, "global_step": 96188, "epoch": 1158} {"train_loss": -21.983686447143555, "global_step": 96189, "epoch": 1158} {"train_loss": -21.571426391601562, "global_step": 96190, "epoch": 1158} {"train_loss": -21.716657638549805, "global_step": 96191, "epoch": 1158} {"train_loss": -22.137243270874023, "global_step": 96192, "epoch": 1158} {"train_loss": -21.71571159362793, "global_step": 96193, "epoch": 1158} {"train_loss": -22.277172088623047, "global_step": 96194, "epoch": 1158} {"train_loss": -21.575729370117188, "global_step": 96195, "epoch": 1158} {"train_loss": -21.715673354734857, "global_step": 96196, "epoch": 1158, "val_loss": 6067502.0} {"train_loss": -21.296972274780273, "global_step": 96197, "epoch": 1159} {"train_loss": -21.763891220092773, "global_step": 96198, "epoch": 1159} {"train_loss": -21.03929328918457, "global_step": 96199, "epoch": 1159} {"train_loss": -21.57036018371582, "global_step": 96200, "epoch": 1159} {"train_loss": -21.679960250854492, "global_step": 96201, "epoch": 1159} {"train_loss": -21.365161895751953, "global_step": 96202, "epoch": 1159} {"train_loss": -21.561697006225586, "global_step": 96203, "epoch": 1159} {"train_loss": -21.33579444885254, "global_step": 96204, "epoch": 1159} {"train_loss": -21.445743560791016, "global_step": 96205, "epoch": 1159} {"train_loss": -21.564714431762695, "global_step": 96206, "epoch": 1159} {"train_loss": -21.739334106445312, "global_step": 96207, "epoch": 1159} {"train_loss": -21.490097045898438, "global_step": 96208, "epoch": 1159} {"train_loss": -21.5540828704834, "global_step": 96209, "epoch": 1159} {"train_loss": -21.83551597595215, "global_step": 96210, "epoch": 1159} {"train_loss": -21.58649253845215, "global_step": 96211, "epoch": 1159} {"train_loss": -21.339441299438477, "global_step": 96212, "epoch": 1159} {"train_loss": -21.372669219970703, "global_step": 96213, "epoch": 1159} {"train_loss": -21.790632247924805, "global_step": 96214, "epoch": 1159} {"train_loss": -21.604650497436523, "global_step": 96215, "epoch": 1159} {"train_loss": -21.443578720092773, "global_step": 96216, "epoch": 1159} {"train_loss": -21.766555786132812, "global_step": 96217, "epoch": 1159} {"train_loss": -21.535411834716797, "global_step": 96218, "epoch": 1159} {"train_loss": -21.59992027282715, "global_step": 96219, "epoch": 1159} {"train_loss": -21.872201919555664, "global_step": 96220, "epoch": 1159} {"train_loss": -21.854984283447266, "global_step": 96221, "epoch": 1159} {"train_loss": -21.850753784179688, "global_step": 96222, "epoch": 1159} {"train_loss": -21.658857345581055, "global_step": 96223, "epoch": 1159} {"train_loss": -22.11739158630371, "global_step": 96224, "epoch": 1159} {"train_loss": -22.22585678100586, "global_step": 96225, "epoch": 1159} {"train_loss": -22.07711410522461, "global_step": 96226, "epoch": 1159} {"train_loss": -21.57822608947754, "global_step": 96227, "epoch": 1159} {"train_loss": -21.52981948852539, "global_step": 96228, "epoch": 1159} {"train_loss": -21.76309585571289, "global_step": 96229, "epoch": 1159} {"train_loss": -22.11311912536621, "global_step": 96230, "epoch": 1159} {"train_loss": -21.91694450378418, "global_step": 96231, "epoch": 1159} {"train_loss": -21.772262573242188, "global_step": 96232, "epoch": 1159} {"train_loss": -21.753713607788086, "global_step": 96233, "epoch": 1159} {"train_loss": -21.65707778930664, "global_step": 96234, "epoch": 1159} {"train_loss": -21.95208740234375, "global_step": 96235, "epoch": 1159} {"train_loss": -21.91025161743164, "global_step": 96236, "epoch": 1159} {"train_loss": -21.54444694519043, "global_step": 96237, "epoch": 1159} {"train_loss": -21.746240615844727, "global_step": 96238, "epoch": 1159} {"train_loss": -21.85338020324707, "global_step": 96239, "epoch": 1159} {"train_loss": -22.019804000854492, "global_step": 96240, "epoch": 1159} {"train_loss": -21.785402297973633, "global_step": 96241, "epoch": 1159} {"train_loss": -21.8091983795166, "global_step": 96242, "epoch": 1159} {"train_loss": -21.549856185913086, "global_step": 96243, "epoch": 1159} {"train_loss": -22.20452308654785, "global_step": 96244, "epoch": 1159} {"train_loss": -21.9056339263916, "global_step": 96245, "epoch": 1159} {"train_loss": -21.602706909179688, "global_step": 96246, "epoch": 1159} {"train_loss": -21.611005783081055, "global_step": 96247, "epoch": 1159} {"train_loss": -21.575895309448242, "global_step": 96248, "epoch": 1159} {"train_loss": -21.8848819732666, "global_step": 96249, "epoch": 1159} {"train_loss": -21.779541015625, "global_step": 96250, "epoch": 1159} {"train_loss": -21.940515518188477, "global_step": 96251, "epoch": 1159} {"train_loss": -22.203107833862305, "global_step": 96252, "epoch": 1159} {"train_loss": -21.890758514404297, "global_step": 96253, "epoch": 1159} {"train_loss": -21.973310470581055, "global_step": 96254, "epoch": 1159} {"train_loss": -22.302364349365234, "global_step": 96255, "epoch": 1159} {"train_loss": -22.0761775970459, "global_step": 96256, "epoch": 1159} {"train_loss": -22.25908851623535, "global_step": 96257, "epoch": 1159} {"train_loss": -21.90085792541504, "global_step": 96258, "epoch": 1159} {"train_loss": -22.02804946899414, "global_step": 96259, "epoch": 1159} {"train_loss": -21.606964111328125, "global_step": 96260, "epoch": 1159} {"train_loss": -21.907224655151367, "global_step": 96261, "epoch": 1159} {"train_loss": -22.250728607177734, "global_step": 96262, "epoch": 1159} {"train_loss": -21.89548683166504, "global_step": 96263, "epoch": 1159} {"train_loss": -21.97216796875, "global_step": 96264, "epoch": 1159} {"train_loss": -21.890661239624023, "global_step": 96265, "epoch": 1159} {"train_loss": -22.26311683654785, "global_step": 96266, "epoch": 1159} {"train_loss": -21.870758056640625, "global_step": 96267, "epoch": 1159} {"train_loss": -21.664098739624023, "global_step": 96268, "epoch": 1159} {"train_loss": -22.14769744873047, "global_step": 96269, "epoch": 1159} {"train_loss": -21.751134872436523, "global_step": 96270, "epoch": 1159} {"train_loss": -21.962427139282227, "global_step": 96271, "epoch": 1159} {"train_loss": -22.095495223999023, "global_step": 96272, "epoch": 1159} {"train_loss": -21.68450927734375, "global_step": 96273, "epoch": 1159} {"train_loss": -21.553266525268555, "global_step": 96274, "epoch": 1159} {"train_loss": -21.979013442993164, "global_step": 96275, "epoch": 1159} {"train_loss": -21.79960060119629, "global_step": 96276, "epoch": 1159} {"train_loss": -22.078935623168945, "global_step": 96277, "epoch": 1159} {"train_loss": -22.266706466674805, "global_step": 96278, "epoch": 1159} {"train_loss": -21.790218973734294, "global_step": 96279, "epoch": 1159, "val_loss": 6266058.0} {"train_loss": -21.848020553588867, "global_step": 96280, "epoch": 1160} {"train_loss": -21.655651092529297, "global_step": 96281, "epoch": 1160} {"train_loss": -21.766448974609375, "global_step": 96282, "epoch": 1160} {"train_loss": -21.431310653686523, "global_step": 96283, "epoch": 1160} {"train_loss": -21.745737075805664, "global_step": 96284, "epoch": 1160} {"train_loss": -21.591201782226562, "global_step": 96285, "epoch": 1160} {"train_loss": -21.755542755126953, "global_step": 96286, "epoch": 1160} {"train_loss": -21.538496017456055, "global_step": 96287, "epoch": 1160} {"train_loss": -21.75091552734375, "global_step": 96288, "epoch": 1160} {"train_loss": -22.014806747436523, "global_step": 96289, "epoch": 1160} {"train_loss": -21.803701400756836, "global_step": 96290, "epoch": 1160} {"train_loss": -21.628965377807617, "global_step": 96291, "epoch": 1160} {"train_loss": -21.73947525024414, "global_step": 96292, "epoch": 1160} {"train_loss": -21.776947021484375, "global_step": 96293, "epoch": 1160} {"train_loss": -21.956979751586914, "global_step": 96294, "epoch": 1160} {"train_loss": -21.619964599609375, "global_step": 96295, "epoch": 1160} {"train_loss": -21.733646392822266, "global_step": 96296, "epoch": 1160} {"train_loss": -21.89376449584961, "global_step": 96297, "epoch": 1160} {"train_loss": -21.876611709594727, "global_step": 96298, "epoch": 1160} {"train_loss": -22.209760665893555, "global_step": 96299, "epoch": 1160} {"train_loss": -21.859107971191406, "global_step": 96300, "epoch": 1160} {"train_loss": -21.74994659423828, "global_step": 96301, "epoch": 1160} {"train_loss": -21.858720779418945, "global_step": 96302, "epoch": 1160} {"train_loss": -21.924314498901367, "global_step": 96303, "epoch": 1160} {"train_loss": -22.02313804626465, "global_step": 96304, "epoch": 1160} {"train_loss": -21.776174545288086, "global_step": 96305, "epoch": 1160} {"train_loss": -22.012479782104492, "global_step": 96306, "epoch": 1160} {"train_loss": -21.949481964111328, "global_step": 96307, "epoch": 1160} {"train_loss": -21.914997100830078, "global_step": 96308, "epoch": 1160} {"train_loss": -21.654970169067383, "global_step": 96309, "epoch": 1160} {"train_loss": -21.966693878173828, "global_step": 96310, "epoch": 1160} {"train_loss": -21.868515014648438, "global_step": 96311, "epoch": 1160} {"train_loss": -21.915210723876953, "global_step": 96312, "epoch": 1160} {"train_loss": -21.87578582763672, "global_step": 96313, "epoch": 1160} {"train_loss": -22.194461822509766, "global_step": 96314, "epoch": 1160} {"train_loss": -22.015029907226562, "global_step": 96315, "epoch": 1160} {"train_loss": -21.939056396484375, "global_step": 96316, "epoch": 1160} {"train_loss": -21.71172523498535, "global_step": 96317, "epoch": 1160} {"train_loss": -21.483015060424805, "global_step": 96318, "epoch": 1160} {"train_loss": -21.770307540893555, "global_step": 96319, "epoch": 1160} {"train_loss": -22.04400062561035, "global_step": 96320, "epoch": 1160} {"train_loss": -22.142850875854492, "global_step": 96321, "epoch": 1160} {"train_loss": -21.844942092895508, "global_step": 96322, "epoch": 1160} {"train_loss": -22.004568099975586, "global_step": 96323, "epoch": 1160} {"train_loss": -21.872522354125977, "global_step": 96324, "epoch": 1160} {"train_loss": -21.25528907775879, "global_step": 96325, "epoch": 1160} {"train_loss": -21.670663833618164, "global_step": 96326, "epoch": 1160} {"train_loss": -21.597999572753906, "global_step": 96327, "epoch": 1160} {"train_loss": -21.70052146911621, "global_step": 96328, "epoch": 1160} {"train_loss": -21.22848892211914, "global_step": 96329, "epoch": 1160} {"train_loss": -22.096256256103516, "global_step": 96330, "epoch": 1160} {"train_loss": -21.719213485717773, "global_step": 96331, "epoch": 1160} {"train_loss": -21.587024688720703, "global_step": 96332, "epoch": 1160} {"train_loss": -22.004240036010742, "global_step": 96333, "epoch": 1160} {"train_loss": -21.690696716308594, "global_step": 96334, "epoch": 1160} {"train_loss": -21.970205307006836, "global_step": 96335, "epoch": 1160} {"train_loss": -21.84197425842285, "global_step": 96336, "epoch": 1160} {"train_loss": -21.90669059753418, "global_step": 96337, "epoch": 1160} {"train_loss": -22.20186424255371, "global_step": 96338, "epoch": 1160} {"train_loss": -22.00508689880371, "global_step": 96339, "epoch": 1160} {"train_loss": -21.9119930267334, "global_step": 96340, "epoch": 1160} {"train_loss": -21.483285903930664, "global_step": 96341, "epoch": 1160} {"train_loss": -22.056825637817383, "global_step": 96342, "epoch": 1160} {"train_loss": -21.29462242126465, "global_step": 96343, "epoch": 1160} {"train_loss": -21.329425811767578, "global_step": 96344, "epoch": 1160} {"train_loss": -21.215490341186523, "global_step": 96345, "epoch": 1160} {"train_loss": -21.720624923706055, "global_step": 96346, "epoch": 1160} {"train_loss": -21.69975471496582, "global_step": 96347, "epoch": 1160} {"train_loss": -21.38804054260254, "global_step": 96348, "epoch": 1160} {"train_loss": -21.824453353881836, "global_step": 96349, "epoch": 1160} {"train_loss": -21.912878036499023, "global_step": 96350, "epoch": 1160} {"train_loss": -21.94281005859375, "global_step": 96351, "epoch": 1160} {"train_loss": -22.145233154296875, "global_step": 96352, "epoch": 1160} {"train_loss": -21.87391471862793, "global_step": 96353, "epoch": 1160} {"train_loss": -21.731794357299805, "global_step": 96354, "epoch": 1160} {"train_loss": -21.81688690185547, "global_step": 96355, "epoch": 1160} {"train_loss": -21.951749801635742, "global_step": 96356, "epoch": 1160} {"train_loss": -21.6768798828125, "global_step": 96357, "epoch": 1160} {"train_loss": -21.59840202331543, "global_step": 96358, "epoch": 1160} {"train_loss": -22.20858383178711, "global_step": 96359, "epoch": 1160} {"train_loss": -22.091466903686523, "global_step": 96360, "epoch": 1160} {"train_loss": -22.16755485534668, "global_step": 96361, "epoch": 1160} {"train_loss": -21.779176022633013, "global_step": 96362, "epoch": 1160, "val_loss": 6170985.0} {"train_loss": -21.402833938598633, "global_step": 96363, "epoch": 1161} {"train_loss": -21.540063858032227, "global_step": 96364, "epoch": 1161} {"train_loss": -21.649030685424805, "global_step": 96365, "epoch": 1161} {"train_loss": -21.56964683532715, "global_step": 96366, "epoch": 1161} {"train_loss": -21.789596557617188, "global_step": 96367, "epoch": 1161} {"train_loss": -21.157651901245117, "global_step": 96368, "epoch": 1161} {"train_loss": -21.714832305908203, "global_step": 96369, "epoch": 1161} {"train_loss": -21.652667999267578, "global_step": 96370, "epoch": 1161} {"train_loss": -21.668174743652344, "global_step": 96371, "epoch": 1161} {"train_loss": -21.656707763671875, "global_step": 96372, "epoch": 1161} {"train_loss": -21.62580108642578, "global_step": 96373, "epoch": 1161} {"train_loss": -21.51346778869629, "global_step": 96374, "epoch": 1161} {"train_loss": -21.60837173461914, "global_step": 96375, "epoch": 1161} {"train_loss": -21.924028396606445, "global_step": 96376, "epoch": 1161} {"train_loss": -21.99924659729004, "global_step": 96377, "epoch": 1161} {"train_loss": -21.675016403198242, "global_step": 96378, "epoch": 1161} {"train_loss": -21.68587303161621, "global_step": 96379, "epoch": 1161} {"train_loss": -21.388914108276367, "global_step": 96380, "epoch": 1161} {"train_loss": -21.912094116210938, "global_step": 96381, "epoch": 1161} {"train_loss": -21.8212947845459, "global_step": 96382, "epoch": 1161} {"train_loss": -21.364957809448242, "global_step": 96383, "epoch": 1161} {"train_loss": -21.844030380249023, "global_step": 96384, "epoch": 1161} {"train_loss": -21.63517189025879, "global_step": 96385, "epoch": 1161} {"train_loss": -21.73931884765625, "global_step": 96386, "epoch": 1161} {"train_loss": -22.213987350463867, "global_step": 96387, "epoch": 1161} {"train_loss": -21.941396713256836, "global_step": 96388, "epoch": 1161} {"train_loss": -21.881866455078125, "global_step": 96389, "epoch": 1161} {"train_loss": -21.952558517456055, "global_step": 96390, "epoch": 1161} {"train_loss": -21.953481674194336, "global_step": 96391, "epoch": 1161} {"train_loss": -21.691530227661133, "global_step": 96392, "epoch": 1161} {"train_loss": -21.64516258239746, "global_step": 96393, "epoch": 1161} {"train_loss": -21.98834800720215, "global_step": 96394, "epoch": 1161} {"train_loss": -21.790390014648438, "global_step": 96395, "epoch": 1161} {"train_loss": -21.83673858642578, "global_step": 96396, "epoch": 1161} {"train_loss": -21.596101760864258, "global_step": 96397, "epoch": 1161} {"train_loss": -21.552122116088867, "global_step": 96398, "epoch": 1161} {"train_loss": -21.718427658081055, "global_step": 96399, "epoch": 1161} {"train_loss": -21.67068099975586, "global_step": 96400, "epoch": 1161} {"train_loss": -22.008682250976562, "global_step": 96401, "epoch": 1161} {"train_loss": -21.734970092773438, "global_step": 96402, "epoch": 1161} {"train_loss": -21.663267135620117, "global_step": 96403, "epoch": 1161} {"train_loss": -21.607200622558594, "global_step": 96404, "epoch": 1161} {"train_loss": -21.882312774658203, "global_step": 96405, "epoch": 1161} {"train_loss": -21.931745529174805, "global_step": 96406, "epoch": 1161} {"train_loss": -21.911848068237305, "global_step": 96407, "epoch": 1161} {"train_loss": -21.624216079711914, "global_step": 96408, "epoch": 1161} {"train_loss": -22.18207359313965, "global_step": 96409, "epoch": 1161} {"train_loss": -22.14122200012207, "global_step": 96410, "epoch": 1161} {"train_loss": -21.850854873657227, "global_step": 96411, "epoch": 1161} {"train_loss": -22.11436653137207, "global_step": 96412, "epoch": 1161} {"train_loss": -21.674795150756836, "global_step": 96413, "epoch": 1161} {"train_loss": -21.726001739501953, "global_step": 96414, "epoch": 1161} {"train_loss": -21.80769157409668, "global_step": 96415, "epoch": 1161} {"train_loss": -21.779890060424805, "global_step": 96416, "epoch": 1161} {"train_loss": -21.82673454284668, "global_step": 96417, "epoch": 1161} {"train_loss": -22.233755111694336, "global_step": 96418, "epoch": 1161} {"train_loss": -21.734699249267578, "global_step": 96419, "epoch": 1161} {"train_loss": -22.05240821838379, "global_step": 96420, "epoch": 1161} {"train_loss": -21.722747802734375, "global_step": 96421, "epoch": 1161} {"train_loss": -22.06977653503418, "global_step": 96422, "epoch": 1161} {"train_loss": -21.957223892211914, "global_step": 96423, "epoch": 1161} {"train_loss": -21.747617721557617, "global_step": 96424, "epoch": 1161} {"train_loss": -21.665029525756836, "global_step": 96425, "epoch": 1161} {"train_loss": -21.989072799682617, "global_step": 96426, "epoch": 1161} {"train_loss": -21.748188018798828, "global_step": 96427, "epoch": 1161} {"train_loss": -21.562931060791016, "global_step": 96428, "epoch": 1161} {"train_loss": -21.657087326049805, "global_step": 96429, "epoch": 1161} {"train_loss": -21.332569122314453, "global_step": 96430, "epoch": 1161} {"train_loss": -21.965505599975586, "global_step": 96431, "epoch": 1161} {"train_loss": -21.914091110229492, "global_step": 96432, "epoch": 1161} {"train_loss": -21.450551986694336, "global_step": 96433, "epoch": 1161} {"train_loss": -21.12642478942871, "global_step": 96434, "epoch": 1161} {"train_loss": -21.792163848876953, "global_step": 96435, "epoch": 1161} {"train_loss": -21.296098709106445, "global_step": 96436, "epoch": 1161} {"train_loss": -21.92824363708496, "global_step": 96437, "epoch": 1161} {"train_loss": -21.926828384399414, "global_step": 96438, "epoch": 1161} {"train_loss": -21.48577308654785, "global_step": 96439, "epoch": 1161} {"train_loss": -22.024917602539062, "global_step": 96440, "epoch": 1161} {"train_loss": -21.50644302368164, "global_step": 96441, "epoch": 1161} {"train_loss": -21.631193161010742, "global_step": 96442, "epoch": 1161} {"train_loss": -21.663434982299805, "global_step": 96443, "epoch": 1161} {"train_loss": -21.684799194335938, "global_step": 96444, "epoch": 1161} {"train_loss": -21.73551954706031, "global_step": 96445, "epoch": 1161, "val_loss": 5990456.0} {"train_loss": -21.095537185668945, "global_step": 96446, "epoch": 1162} {"train_loss": -21.619474411010742, "global_step": 96447, "epoch": 1162} {"train_loss": -21.442617416381836, "global_step": 96448, "epoch": 1162} {"train_loss": -21.359525680541992, "global_step": 96449, "epoch": 1162} {"train_loss": -21.827136993408203, "global_step": 96450, "epoch": 1162} {"train_loss": -21.29803466796875, "global_step": 96451, "epoch": 1162} {"train_loss": -21.257421493530273, "global_step": 96452, "epoch": 1162} {"train_loss": -21.676410675048828, "global_step": 96453, "epoch": 1162} {"train_loss": -21.726703643798828, "global_step": 96454, "epoch": 1162} {"train_loss": -21.461162567138672, "global_step": 96455, "epoch": 1162} {"train_loss": -21.65964698791504, "global_step": 96456, "epoch": 1162} {"train_loss": -20.8217716217041, "global_step": 96457, "epoch": 1162} {"train_loss": -21.885238647460938, "global_step": 96458, "epoch": 1162} {"train_loss": -21.521930694580078, "global_step": 96459, "epoch": 1162} {"train_loss": -21.636869430541992, "global_step": 96460, "epoch": 1162} {"train_loss": -21.898481369018555, "global_step": 96461, "epoch": 1162} {"train_loss": -21.806642532348633, "global_step": 96462, "epoch": 1162} {"train_loss": -21.758106231689453, "global_step": 96463, "epoch": 1162} {"train_loss": -21.537382125854492, "global_step": 96464, "epoch": 1162} {"train_loss": -21.5191593170166, "global_step": 96465, "epoch": 1162} {"train_loss": -21.522356033325195, "global_step": 96466, "epoch": 1162} {"train_loss": -21.776866912841797, "global_step": 96467, "epoch": 1162} {"train_loss": -21.35129165649414, "global_step": 96468, "epoch": 1162} {"train_loss": -21.52667808532715, "global_step": 96469, "epoch": 1162} {"train_loss": -21.74837303161621, "global_step": 96470, "epoch": 1162} {"train_loss": -21.28559112548828, "global_step": 96471, "epoch": 1162} {"train_loss": -21.926258087158203, "global_step": 96472, "epoch": 1162} {"train_loss": -22.02715492248535, "global_step": 96473, "epoch": 1162} {"train_loss": -21.55854606628418, "global_step": 96474, "epoch": 1162} {"train_loss": -22.149267196655273, "global_step": 96475, "epoch": 1162} {"train_loss": -21.504117965698242, "global_step": 96476, "epoch": 1162} {"train_loss": -22.015195846557617, "global_step": 96477, "epoch": 1162} {"train_loss": -21.92888832092285, "global_step": 96478, "epoch": 1162} {"train_loss": -21.66737174987793, "global_step": 96479, "epoch": 1162} {"train_loss": -21.742799758911133, "global_step": 96480, "epoch": 1162} {"train_loss": -21.693082809448242, "global_step": 96481, "epoch": 1162} {"train_loss": -22.182083129882812, "global_step": 96482, "epoch": 1162} {"train_loss": -21.837146759033203, "global_step": 96483, "epoch": 1162} {"train_loss": -21.915515899658203, "global_step": 96484, "epoch": 1162} {"train_loss": -21.5296630859375, "global_step": 96485, "epoch": 1162} {"train_loss": -21.800058364868164, "global_step": 96486, "epoch": 1162} {"train_loss": -21.87037467956543, "global_step": 96487, "epoch": 1162} {"train_loss": -21.919300079345703, "global_step": 96488, "epoch": 1162} {"train_loss": -21.802509307861328, "global_step": 96489, "epoch": 1162} {"train_loss": -21.622467041015625, "global_step": 96490, "epoch": 1162} {"train_loss": -22.266300201416016, "global_step": 96491, "epoch": 1162} {"train_loss": -21.632261276245117, "global_step": 96492, "epoch": 1162} {"train_loss": -21.632787704467773, "global_step": 96493, "epoch": 1162} {"train_loss": -21.965171813964844, "global_step": 96494, "epoch": 1162} {"train_loss": -21.58487319946289, "global_step": 96495, "epoch": 1162} {"train_loss": -21.46159553527832, "global_step": 96496, "epoch": 1162} {"train_loss": -21.65743064880371, "global_step": 96497, "epoch": 1162} {"train_loss": -22.25811004638672, "global_step": 96498, "epoch": 1162} {"train_loss": -22.050790786743164, "global_step": 96499, "epoch": 1162} {"train_loss": -21.88546371459961, "global_step": 96500, "epoch": 1162} {"train_loss": -21.69056510925293, "global_step": 96501, "epoch": 1162} {"train_loss": -21.970935821533203, "global_step": 96502, "epoch": 1162} {"train_loss": -22.0301513671875, "global_step": 96503, "epoch": 1162} {"train_loss": -21.834705352783203, "global_step": 96504, "epoch": 1162} {"train_loss": -21.926694869995117, "global_step": 96505, "epoch": 1162} {"train_loss": -21.884275436401367, "global_step": 96506, "epoch": 1162} {"train_loss": -21.68743324279785, "global_step": 96507, "epoch": 1162} {"train_loss": -21.473291397094727, "global_step": 96508, "epoch": 1162} {"train_loss": -21.8059139251709, "global_step": 96509, "epoch": 1162} {"train_loss": -21.520483016967773, "global_step": 96510, "epoch": 1162} {"train_loss": -21.811735153198242, "global_step": 96511, "epoch": 1162} {"train_loss": -21.964141845703125, "global_step": 96512, "epoch": 1162} {"train_loss": -22.0977840423584, "global_step": 96513, "epoch": 1162} {"train_loss": -21.62409782409668, "global_step": 96514, "epoch": 1162} {"train_loss": -21.794950485229492, "global_step": 96515, "epoch": 1162} {"train_loss": -22.04401206970215, "global_step": 96516, "epoch": 1162} {"train_loss": -21.66329574584961, "global_step": 96517, "epoch": 1162} {"train_loss": -21.81536865234375, "global_step": 96518, "epoch": 1162} {"train_loss": -22.112709045410156, "global_step": 96519, "epoch": 1162} {"train_loss": -21.709739685058594, "global_step": 96520, "epoch": 1162} {"train_loss": -21.54080581665039, "global_step": 96521, "epoch": 1162} {"train_loss": -21.765716552734375, "global_step": 96522, "epoch": 1162} {"train_loss": -21.754728317260742, "global_step": 96523, "epoch": 1162} {"train_loss": -21.659170150756836, "global_step": 96524, "epoch": 1162} {"train_loss": -21.417430877685547, "global_step": 96525, "epoch": 1162} {"train_loss": -21.528106689453125, "global_step": 96526, "epoch": 1162} {"train_loss": -21.949691772460938, "global_step": 96527, "epoch": 1162} {"train_loss": -21.728245861559028, "global_step": 96528, "epoch": 1162, "val_loss": 6069755.5} {"train_loss": -21.06656265258789, "global_step": 96529, "epoch": 1163} {"train_loss": -21.050222396850586, "global_step": 96530, "epoch": 1163} {"train_loss": -21.904157638549805, "global_step": 96531, "epoch": 1163} {"train_loss": -21.184600830078125, "global_step": 96532, "epoch": 1163} {"train_loss": -21.390790939331055, "global_step": 96533, "epoch": 1163} {"train_loss": -20.756093978881836, "global_step": 96534, "epoch": 1163} {"train_loss": -21.186843872070312, "global_step": 96535, "epoch": 1163} {"train_loss": -21.64468765258789, "global_step": 96536, "epoch": 1163} {"train_loss": -21.706579208374023, "global_step": 96537, "epoch": 1163} {"train_loss": -21.60414695739746, "global_step": 96538, "epoch": 1163} {"train_loss": -21.727773666381836, "global_step": 96539, "epoch": 1163} {"train_loss": -21.654775619506836, "global_step": 96540, "epoch": 1163} {"train_loss": -21.667173385620117, "global_step": 96541, "epoch": 1163} {"train_loss": -21.62501335144043, "global_step": 96542, "epoch": 1163} {"train_loss": -21.473173141479492, "global_step": 96543, "epoch": 1163} {"train_loss": -21.701284408569336, "global_step": 96544, "epoch": 1163} {"train_loss": -21.655534744262695, "global_step": 96545, "epoch": 1163} {"train_loss": -21.848234176635742, "global_step": 96546, "epoch": 1163} {"train_loss": -21.66449546813965, "global_step": 96547, "epoch": 1163} {"train_loss": -21.851856231689453, "global_step": 96548, "epoch": 1163} {"train_loss": -21.871557235717773, "global_step": 96549, "epoch": 1163} {"train_loss": -21.63907814025879, "global_step": 96550, "epoch": 1163} {"train_loss": -21.927993774414062, "global_step": 96551, "epoch": 1163} {"train_loss": -21.808080673217773, "global_step": 96552, "epoch": 1163} {"train_loss": -21.577913284301758, "global_step": 96553, "epoch": 1163} {"train_loss": -21.64973258972168, "global_step": 96554, "epoch": 1163} {"train_loss": -21.988597869873047, "global_step": 96555, "epoch": 1163} {"train_loss": -21.652801513671875, "global_step": 96556, "epoch": 1163} {"train_loss": -21.65443992614746, "global_step": 96557, "epoch": 1163} {"train_loss": -21.67939567565918, "global_step": 96558, "epoch": 1163} {"train_loss": -22.19596290588379, "global_step": 96559, "epoch": 1163} {"train_loss": -21.90288734436035, "global_step": 96560, "epoch": 1163} {"train_loss": -21.74724769592285, "global_step": 96561, "epoch": 1163} {"train_loss": -21.512653350830078, "global_step": 96562, "epoch": 1163} {"train_loss": -21.890256881713867, "global_step": 96563, "epoch": 1163} {"train_loss": -21.855806350708008, "global_step": 96564, "epoch": 1163} {"train_loss": -21.903120040893555, "global_step": 96565, "epoch": 1163} {"train_loss": -22.171911239624023, "global_step": 96566, "epoch": 1163} {"train_loss": -21.860551834106445, "global_step": 96567, "epoch": 1163} {"train_loss": -22.18613052368164, "global_step": 96568, "epoch": 1163} {"train_loss": -21.79408836364746, "global_step": 96569, "epoch": 1163} {"train_loss": -21.673599243164062, "global_step": 96570, "epoch": 1163} {"train_loss": -21.818815231323242, "global_step": 96571, "epoch": 1163} {"train_loss": -21.86554527282715, "global_step": 96572, "epoch": 1163} {"train_loss": -21.742971420288086, "global_step": 96573, "epoch": 1163} {"train_loss": -21.773954391479492, "global_step": 96574, "epoch": 1163} {"train_loss": -21.905996322631836, "global_step": 96575, "epoch": 1163} {"train_loss": -21.559762954711914, "global_step": 96576, "epoch": 1163} {"train_loss": -21.698562622070312, "global_step": 96577, "epoch": 1163} {"train_loss": -21.89699935913086, "global_step": 96578, "epoch": 1163} {"train_loss": -21.500694274902344, "global_step": 96579, "epoch": 1163} {"train_loss": -21.84589958190918, "global_step": 96580, "epoch": 1163} {"train_loss": -22.002012252807617, "global_step": 96581, "epoch": 1163} {"train_loss": -21.821664810180664, "global_step": 96582, "epoch": 1163} {"train_loss": -21.972021102905273, "global_step": 96583, "epoch": 1163} {"train_loss": -21.360610961914062, "global_step": 96584, "epoch": 1163} {"train_loss": -21.612462997436523, "global_step": 96585, "epoch": 1163} {"train_loss": -21.91823387145996, "global_step": 96586, "epoch": 1163} {"train_loss": -21.6362247467041, "global_step": 96587, "epoch": 1163} {"train_loss": -21.8144588470459, "global_step": 96588, "epoch": 1163} {"train_loss": -21.6281795501709, "global_step": 96589, "epoch": 1163} {"train_loss": -21.64255142211914, "global_step": 96590, "epoch": 1163} {"train_loss": -22.055322647094727, "global_step": 96591, "epoch": 1163} {"train_loss": -21.752960205078125, "global_step": 96592, "epoch": 1163} {"train_loss": -22.367664337158203, "global_step": 96593, "epoch": 1163} {"train_loss": -21.670148849487305, "global_step": 96594, "epoch": 1163} {"train_loss": -22.01673126220703, "global_step": 96595, "epoch": 1163} {"train_loss": -21.534528732299805, "global_step": 96596, "epoch": 1163} {"train_loss": -21.783517837524414, "global_step": 96597, "epoch": 1163} {"train_loss": -21.554828643798828, "global_step": 96598, "epoch": 1163} {"train_loss": -21.797916412353516, "global_step": 96599, "epoch": 1163} {"train_loss": -21.649368286132812, "global_step": 96600, "epoch": 1163} {"train_loss": -21.928525924682617, "global_step": 96601, "epoch": 1163} {"train_loss": -21.759830474853516, "global_step": 96602, "epoch": 1163} {"train_loss": -21.883785247802734, "global_step": 96603, "epoch": 1163} {"train_loss": -21.3762149810791, "global_step": 96604, "epoch": 1163} {"train_loss": -21.635072708129883, "global_step": 96605, "epoch": 1163} {"train_loss": -21.74196434020996, "global_step": 96606, "epoch": 1163} {"train_loss": -22.13922691345215, "global_step": 96607, "epoch": 1163} {"train_loss": -21.734350204467773, "global_step": 96608, "epoch": 1163} {"train_loss": -21.965646743774414, "global_step": 96609, "epoch": 1163} {"train_loss": -21.891508102416992, "global_step": 96610, "epoch": 1163} {"train_loss": -21.72937315056123, "global_step": 96611, "epoch": 1163, "val_loss": 6117026.5} {"train_loss": -21.407291412353516, "global_step": 96612, "epoch": 1164} {"train_loss": -21.702199935913086, "global_step": 96613, "epoch": 1164} {"train_loss": -21.730871200561523, "global_step": 96614, "epoch": 1164} {"train_loss": -21.557714462280273, "global_step": 96615, "epoch": 1164} {"train_loss": -21.965524673461914, "global_step": 96616, "epoch": 1164} {"train_loss": -21.82746696472168, "global_step": 96617, "epoch": 1164} {"train_loss": -21.527578353881836, "global_step": 96618, "epoch": 1164} {"train_loss": -21.742189407348633, "global_step": 96619, "epoch": 1164} {"train_loss": -21.694021224975586, "global_step": 96620, "epoch": 1164} {"train_loss": -21.174789428710938, "global_step": 96621, "epoch": 1164} {"train_loss": -21.60567283630371, "global_step": 96622, "epoch": 1164} {"train_loss": -21.658140182495117, "global_step": 96623, "epoch": 1164} {"train_loss": -21.502700805664062, "global_step": 96624, "epoch": 1164} {"train_loss": -21.840171813964844, "global_step": 96625, "epoch": 1164} {"train_loss": -21.929555892944336, "global_step": 96626, "epoch": 1164} {"train_loss": -21.660846710205078, "global_step": 96627, "epoch": 1164} {"train_loss": -22.046789169311523, "global_step": 96628, "epoch": 1164} {"train_loss": -21.38058853149414, "global_step": 96629, "epoch": 1164} {"train_loss": -21.750913619995117, "global_step": 96630, "epoch": 1164} {"train_loss": -22.024688720703125, "global_step": 96631, "epoch": 1164} {"train_loss": -21.682607650756836, "global_step": 96632, "epoch": 1164} {"train_loss": -21.894285202026367, "global_step": 96633, "epoch": 1164} {"train_loss": -21.80376625061035, "global_step": 96634, "epoch": 1164} {"train_loss": -21.99410057067871, "global_step": 96635, "epoch": 1164} {"train_loss": -21.686737060546875, "global_step": 96636, "epoch": 1164} {"train_loss": -21.654539108276367, "global_step": 96637, "epoch": 1164} {"train_loss": -21.44841766357422, "global_step": 96638, "epoch": 1164} {"train_loss": -21.333240509033203, "global_step": 96639, "epoch": 1164} {"train_loss": -21.716114044189453, "global_step": 96640, "epoch": 1164} {"train_loss": -21.815956115722656, "global_step": 96641, "epoch": 1164} {"train_loss": -21.990034103393555, "global_step": 96642, "epoch": 1164} {"train_loss": -21.75396156311035, "global_step": 96643, "epoch": 1164} {"train_loss": -22.02235984802246, "global_step": 96644, "epoch": 1164} {"train_loss": -21.566564559936523, "global_step": 96645, "epoch": 1164} {"train_loss": -21.54383087158203, "global_step": 96646, "epoch": 1164} {"train_loss": -21.507246017456055, "global_step": 96647, "epoch": 1164} {"train_loss": -21.860010147094727, "global_step": 96648, "epoch": 1164} {"train_loss": -22.01708984375, "global_step": 96649, "epoch": 1164} {"train_loss": -22.085996627807617, "global_step": 96650, "epoch": 1164} {"train_loss": -21.966859817504883, "global_step": 96651, "epoch": 1164} {"train_loss": -22.160110473632812, "global_step": 96652, "epoch": 1164} {"train_loss": -21.801719665527344, "global_step": 96653, "epoch": 1164} {"train_loss": -21.692720413208008, "global_step": 96654, "epoch": 1164} {"train_loss": -21.796926498413086, "global_step": 96655, "epoch": 1164} {"train_loss": -21.45612144470215, "global_step": 96656, "epoch": 1164} {"train_loss": -21.697769165039062, "global_step": 96657, "epoch": 1164} {"train_loss": -21.821069717407227, "global_step": 96658, "epoch": 1164} {"train_loss": -21.70041847229004, "global_step": 96659, "epoch": 1164} {"train_loss": -21.777658462524414, "global_step": 96660, "epoch": 1164} {"train_loss": -21.738117218017578, "global_step": 96661, "epoch": 1164} {"train_loss": -21.904870986938477, "global_step": 96662, "epoch": 1164} {"train_loss": -21.60554313659668, "global_step": 96663, "epoch": 1164} {"train_loss": -21.66010284423828, "global_step": 96664, "epoch": 1164} {"train_loss": -21.934093475341797, "global_step": 96665, "epoch": 1164} {"train_loss": -21.69845962524414, "global_step": 96666, "epoch": 1164} {"train_loss": -21.96632194519043, "global_step": 96667, "epoch": 1164} {"train_loss": -21.845855712890625, "global_step": 96668, "epoch": 1164} {"train_loss": -21.690397262573242, "global_step": 96669, "epoch": 1164} {"train_loss": -21.82138442993164, "global_step": 96670, "epoch": 1164} {"train_loss": -21.785886764526367, "global_step": 96671, "epoch": 1164} {"train_loss": -21.66140365600586, "global_step": 96672, "epoch": 1164} {"train_loss": -21.831939697265625, "global_step": 96673, "epoch": 1164} {"train_loss": -21.922178268432617, "global_step": 96674, "epoch": 1164} {"train_loss": -21.630680084228516, "global_step": 96675, "epoch": 1164} {"train_loss": -22.104267120361328, "global_step": 96676, "epoch": 1164} {"train_loss": -21.389427185058594, "global_step": 96677, "epoch": 1164} {"train_loss": -21.770557403564453, "global_step": 96678, "epoch": 1164} {"train_loss": -21.707487106323242, "global_step": 96679, "epoch": 1164} {"train_loss": -21.934133529663086, "global_step": 96680, "epoch": 1164} {"train_loss": -21.911785125732422, "global_step": 96681, "epoch": 1164} {"train_loss": -21.573923110961914, "global_step": 96682, "epoch": 1164} {"train_loss": -22.005361557006836, "global_step": 96683, "epoch": 1164} {"train_loss": -21.27817153930664, "global_step": 96684, "epoch": 1164} {"train_loss": -21.623380661010742, "global_step": 96685, "epoch": 1164} {"train_loss": -21.8375244140625, "global_step": 96686, "epoch": 1164} {"train_loss": -21.841310501098633, "global_step": 96687, "epoch": 1164} {"train_loss": -21.834836959838867, "global_step": 96688, "epoch": 1164} {"train_loss": -21.54071617126465, "global_step": 96689, "epoch": 1164} {"train_loss": -21.70621681213379, "global_step": 96690, "epoch": 1164} {"train_loss": -21.77878189086914, "global_step": 96691, "epoch": 1164} {"train_loss": -21.438138961791992, "global_step": 96692, "epoch": 1164} {"train_loss": -21.804166793823242, "global_step": 96693, "epoch": 1164} {"train_loss": -21.749029894909228, "global_step": 96694, "epoch": 1164, "val_loss": 6047542.5} {"train_loss": -21.48577117919922, "global_step": 96695, "epoch": 1165} {"train_loss": -21.725387573242188, "global_step": 96696, "epoch": 1165} {"train_loss": -21.370803833007812, "global_step": 96697, "epoch": 1165} {"train_loss": -21.680082321166992, "global_step": 96698, "epoch": 1165} {"train_loss": -21.957571029663086, "global_step": 96699, "epoch": 1165} {"train_loss": -21.446456909179688, "global_step": 96700, "epoch": 1165} {"train_loss": -21.376176834106445, "global_step": 96701, "epoch": 1165} {"train_loss": -21.662158966064453, "global_step": 96702, "epoch": 1165} {"train_loss": -21.467336654663086, "global_step": 96703, "epoch": 1165} {"train_loss": -21.673643112182617, "global_step": 96704, "epoch": 1165} {"train_loss": -21.77707862854004, "global_step": 96705, "epoch": 1165} {"train_loss": -21.721364974975586, "global_step": 96706, "epoch": 1165} {"train_loss": -21.419010162353516, "global_step": 96707, "epoch": 1165} {"train_loss": -21.85567283630371, "global_step": 96708, "epoch": 1165} {"train_loss": -21.936365127563477, "global_step": 96709, "epoch": 1165} {"train_loss": -21.760190963745117, "global_step": 96710, "epoch": 1165} {"train_loss": -22.137971878051758, "global_step": 96711, "epoch": 1165} {"train_loss": -21.514129638671875, "global_step": 96712, "epoch": 1165} {"train_loss": -21.983243942260742, "global_step": 96713, "epoch": 1165} {"train_loss": -21.63374900817871, "global_step": 96714, "epoch": 1165} {"train_loss": -21.60726547241211, "global_step": 96715, "epoch": 1165} {"train_loss": -21.67713737487793, "global_step": 96716, "epoch": 1165} {"train_loss": -21.64960289001465, "global_step": 96717, "epoch": 1165} {"train_loss": -21.908119201660156, "global_step": 96718, "epoch": 1165} {"train_loss": -21.96664810180664, "global_step": 96719, "epoch": 1165} {"train_loss": -21.829214096069336, "global_step": 96720, "epoch": 1165} {"train_loss": -21.91985511779785, "global_step": 96721, "epoch": 1165} {"train_loss": -21.43956184387207, "global_step": 96722, "epoch": 1165} {"train_loss": -21.553001403808594, "global_step": 96723, "epoch": 1165} {"train_loss": -22.084218978881836, "global_step": 96724, "epoch": 1165} {"train_loss": -21.91291618347168, "global_step": 96725, "epoch": 1165} {"train_loss": -21.86905288696289, "global_step": 96726, "epoch": 1165} {"train_loss": -22.08566665649414, "global_step": 96727, "epoch": 1165} {"train_loss": -21.751022338867188, "global_step": 96728, "epoch": 1165} {"train_loss": -21.71090316772461, "global_step": 96729, "epoch": 1165} {"train_loss": -21.575136184692383, "global_step": 96730, "epoch": 1165} {"train_loss": -21.575481414794922, "global_step": 96731, "epoch": 1165} {"train_loss": -21.97054100036621, "global_step": 96732, "epoch": 1165} {"train_loss": -21.74427604675293, "global_step": 96733, "epoch": 1165} {"train_loss": -21.819425582885742, "global_step": 96734, "epoch": 1165} {"train_loss": -21.93505859375, "global_step": 96735, "epoch": 1165} {"train_loss": -21.62965965270996, "global_step": 96736, "epoch": 1165} {"train_loss": -21.779218673706055, "global_step": 96737, "epoch": 1165} {"train_loss": -21.732458114624023, "global_step": 96738, "epoch": 1165} {"train_loss": -21.847227096557617, "global_step": 96739, "epoch": 1165} {"train_loss": -21.482019424438477, "global_step": 96740, "epoch": 1165} {"train_loss": -22.175966262817383, "global_step": 96741, "epoch": 1165} {"train_loss": -21.671056747436523, "global_step": 96742, "epoch": 1165} {"train_loss": -21.470367431640625, "global_step": 96743, "epoch": 1165} {"train_loss": -22.269315719604492, "global_step": 96744, "epoch": 1165} {"train_loss": -21.866830825805664, "global_step": 96745, "epoch": 1165} {"train_loss": -21.76837730407715, "global_step": 96746, "epoch": 1165} {"train_loss": -22.01678466796875, "global_step": 96747, "epoch": 1165} {"train_loss": -22.01995277404785, "global_step": 96748, "epoch": 1165} {"train_loss": -21.84259605407715, "global_step": 96749, "epoch": 1165} {"train_loss": -21.850706100463867, "global_step": 96750, "epoch": 1165} {"train_loss": -21.856769561767578, "global_step": 96751, "epoch": 1165} {"train_loss": -22.061548233032227, "global_step": 96752, "epoch": 1165} {"train_loss": -21.57368278503418, "global_step": 96753, "epoch": 1165} {"train_loss": -22.015506744384766, "global_step": 96754, "epoch": 1165} {"train_loss": -22.278762817382812, "global_step": 96755, "epoch": 1165} {"train_loss": -21.86551284790039, "global_step": 96756, "epoch": 1165} {"train_loss": -21.86246109008789, "global_step": 96757, "epoch": 1165} {"train_loss": -21.941665649414062, "global_step": 96758, "epoch": 1165} {"train_loss": -21.659103393554688, "global_step": 96759, "epoch": 1165} {"train_loss": -22.075565338134766, "global_step": 96760, "epoch": 1165} {"train_loss": -22.217330932617188, "global_step": 96761, "epoch": 1165} {"train_loss": -21.734647750854492, "global_step": 96762, "epoch": 1165} {"train_loss": -22.072248458862305, "global_step": 96763, "epoch": 1165} {"train_loss": -21.808828353881836, "global_step": 96764, "epoch": 1165} {"train_loss": -21.826383590698242, "global_step": 96765, "epoch": 1165} {"train_loss": -21.61467933654785, "global_step": 96766, "epoch": 1165} {"train_loss": -22.080320358276367, "global_step": 96767, "epoch": 1165} {"train_loss": -21.9468936920166, "global_step": 96768, "epoch": 1165} {"train_loss": -21.791015625, "global_step": 96769, "epoch": 1165} {"train_loss": -21.990449905395508, "global_step": 96770, "epoch": 1165} {"train_loss": -21.669031143188477, "global_step": 96771, "epoch": 1165} {"train_loss": -21.903060913085938, "global_step": 96772, "epoch": 1165} {"train_loss": -21.960790634155273, "global_step": 96773, "epoch": 1165} {"train_loss": -21.877758026123047, "global_step": 96774, "epoch": 1165} {"train_loss": -22.062744140625, "global_step": 96775, "epoch": 1165} {"train_loss": -22.1334285736084, "global_step": 96776, "epoch": 1165} {"train_loss": -21.807060103818596, "global_step": 96777, "epoch": 1165, "val_loss": 6032785.0} {"train_loss": -21.715042114257812, "global_step": 96778, "epoch": 1166} {"train_loss": -21.71744155883789, "global_step": 96779, "epoch": 1166} {"train_loss": -21.810216903686523, "global_step": 96780, "epoch": 1166} {"train_loss": -21.613529205322266, "global_step": 96781, "epoch": 1166} {"train_loss": -21.316879272460938, "global_step": 96782, "epoch": 1166} {"train_loss": -21.349811553955078, "global_step": 96783, "epoch": 1166} {"train_loss": -21.52655601501465, "global_step": 96784, "epoch": 1166} {"train_loss": -21.8673038482666, "global_step": 96785, "epoch": 1166} {"train_loss": -21.935575485229492, "global_step": 96786, "epoch": 1166} {"train_loss": -21.569765090942383, "global_step": 96787, "epoch": 1166} {"train_loss": -22.127647399902344, "global_step": 96788, "epoch": 1166} {"train_loss": -22.141590118408203, "global_step": 96789, "epoch": 1166} {"train_loss": -21.79862403869629, "global_step": 96790, "epoch": 1166} {"train_loss": -21.925260543823242, "global_step": 96791, "epoch": 1166} {"train_loss": -21.703622817993164, "global_step": 96792, "epoch": 1166} {"train_loss": -22.283756256103516, "global_step": 96793, "epoch": 1166} {"train_loss": -21.798826217651367, "global_step": 96794, "epoch": 1166} {"train_loss": -22.101425170898438, "global_step": 96795, "epoch": 1166} {"train_loss": -22.105411529541016, "global_step": 96796, "epoch": 1166} {"train_loss": -21.649587631225586, "global_step": 96797, "epoch": 1166} {"train_loss": -21.475929260253906, "global_step": 96798, "epoch": 1166} {"train_loss": -21.70071792602539, "global_step": 96799, "epoch": 1166} {"train_loss": -22.042936325073242, "global_step": 96800, "epoch": 1166} {"train_loss": -21.954648971557617, "global_step": 96801, "epoch": 1166} {"train_loss": -21.857454299926758, "global_step": 96802, "epoch": 1166} {"train_loss": -21.533246994018555, "global_step": 96803, "epoch": 1166} {"train_loss": -21.72730827331543, "global_step": 96804, "epoch": 1166} {"train_loss": -21.651203155517578, "global_step": 96805, "epoch": 1166} {"train_loss": -21.785306930541992, "global_step": 96806, "epoch": 1166} {"train_loss": -22.024497985839844, "global_step": 96807, "epoch": 1166} {"train_loss": -21.887325286865234, "global_step": 96808, "epoch": 1166} {"train_loss": -21.952909469604492, "global_step": 96809, "epoch": 1166} {"train_loss": -21.801084518432617, "global_step": 96810, "epoch": 1166} {"train_loss": -22.008527755737305, "global_step": 96811, "epoch": 1166} {"train_loss": -21.800273895263672, "global_step": 96812, "epoch": 1166} {"train_loss": -21.945783615112305, "global_step": 96813, "epoch": 1166} {"train_loss": -21.965368270874023, "global_step": 96814, "epoch": 1166} {"train_loss": -21.9879207611084, "global_step": 96815, "epoch": 1166} {"train_loss": -21.947193145751953, "global_step": 96816, "epoch": 1166} {"train_loss": -21.90262222290039, "global_step": 96817, "epoch": 1166} {"train_loss": -22.100933074951172, "global_step": 96818, "epoch": 1166} {"train_loss": -22.07399559020996, "global_step": 96819, "epoch": 1166} {"train_loss": -22.011842727661133, "global_step": 96820, "epoch": 1166} {"train_loss": -21.674890518188477, "global_step": 96821, "epoch": 1166} {"train_loss": -21.99355697631836, "global_step": 96822, "epoch": 1166} {"train_loss": -21.883983612060547, "global_step": 96823, "epoch": 1166} {"train_loss": -21.64006233215332, "global_step": 96824, "epoch": 1166} {"train_loss": -22.05084800720215, "global_step": 96825, "epoch": 1166} {"train_loss": -21.875946044921875, "global_step": 96826, "epoch": 1166} {"train_loss": -21.80457878112793, "global_step": 96827, "epoch": 1166} {"train_loss": -21.651084899902344, "global_step": 96828, "epoch": 1166} {"train_loss": -21.68085289001465, "global_step": 96829, "epoch": 1166} {"train_loss": -21.753128051757812, "global_step": 96830, "epoch": 1166} {"train_loss": -21.878921508789062, "global_step": 96831, "epoch": 1166} {"train_loss": -21.533823013305664, "global_step": 96832, "epoch": 1166} {"train_loss": -21.69538116455078, "global_step": 96833, "epoch": 1166} {"train_loss": -21.95829200744629, "global_step": 96834, "epoch": 1166} {"train_loss": -21.560758590698242, "global_step": 96835, "epoch": 1166} {"train_loss": -21.828022003173828, "global_step": 96836, "epoch": 1166} {"train_loss": -21.551551818847656, "global_step": 96837, "epoch": 1166} {"train_loss": -21.848251342773438, "global_step": 96838, "epoch": 1166} {"train_loss": -21.818880081176758, "global_step": 96839, "epoch": 1166} {"train_loss": -21.30963897705078, "global_step": 96840, "epoch": 1166} {"train_loss": -21.6722469329834, "global_step": 96841, "epoch": 1166} {"train_loss": -21.716428756713867, "global_step": 96842, "epoch": 1166} {"train_loss": -21.1726016998291, "global_step": 96843, "epoch": 1166} {"train_loss": -22.04523277282715, "global_step": 96844, "epoch": 1166} {"train_loss": -21.766117095947266, "global_step": 96845, "epoch": 1166} {"train_loss": -21.55149269104004, "global_step": 96846, "epoch": 1166} {"train_loss": -21.923385620117188, "global_step": 96847, "epoch": 1166} {"train_loss": -21.662731170654297, "global_step": 96848, "epoch": 1166} {"train_loss": -21.6256103515625, "global_step": 96849, "epoch": 1166} {"train_loss": -21.75116539001465, "global_step": 96850, "epoch": 1166} {"train_loss": -21.58498191833496, "global_step": 96851, "epoch": 1166} {"train_loss": -21.490354537963867, "global_step": 96852, "epoch": 1166} {"train_loss": -21.867666244506836, "global_step": 96853, "epoch": 1166} {"train_loss": -21.62943458557129, "global_step": 96854, "epoch": 1166} {"train_loss": -21.6575927734375, "global_step": 96855, "epoch": 1166} {"train_loss": -21.819610595703125, "global_step": 96856, "epoch": 1166} {"train_loss": -21.768571853637695, "global_step": 96857, "epoch": 1166} {"train_loss": -21.55472183227539, "global_step": 96858, "epoch": 1166} {"train_loss": -21.483524322509766, "global_step": 96859, "epoch": 1166} {"train_loss": -21.799628682883387, "global_step": 96860, "epoch": 1166, "val_loss": 6090145.5} {"train_loss": -21.38665008544922, "global_step": 96861, "epoch": 1167} {"train_loss": -21.483564376831055, "global_step": 96862, "epoch": 1167} {"train_loss": -21.008586883544922, "global_step": 96863, "epoch": 1167} {"train_loss": -21.351282119750977, "global_step": 96864, "epoch": 1167} {"train_loss": -21.575481414794922, "global_step": 96865, "epoch": 1167} {"train_loss": -21.19745445251465, "global_step": 96866, "epoch": 1167} {"train_loss": -22.132184982299805, "global_step": 96867, "epoch": 1167} {"train_loss": -21.7462215423584, "global_step": 96868, "epoch": 1167} {"train_loss": -22.0237979888916, "global_step": 96869, "epoch": 1167} {"train_loss": -21.661405563354492, "global_step": 96870, "epoch": 1167} {"train_loss": -21.44902992248535, "global_step": 96871, "epoch": 1167} {"train_loss": -21.480581283569336, "global_step": 96872, "epoch": 1167} {"train_loss": -21.571392059326172, "global_step": 96873, "epoch": 1167} {"train_loss": -21.71287727355957, "global_step": 96874, "epoch": 1167} {"train_loss": -21.695058822631836, "global_step": 96875, "epoch": 1167} {"train_loss": -21.8522891998291, "global_step": 96876, "epoch": 1167} {"train_loss": -21.398216247558594, "global_step": 96877, "epoch": 1167} {"train_loss": -21.88179588317871, "global_step": 96878, "epoch": 1167} {"train_loss": -21.659961700439453, "global_step": 96879, "epoch": 1167} {"train_loss": -21.63614845275879, "global_step": 96880, "epoch": 1167} {"train_loss": -22.030118942260742, "global_step": 96881, "epoch": 1167} {"train_loss": -21.707603454589844, "global_step": 96882, "epoch": 1167} {"train_loss": -22.064512252807617, "global_step": 96883, "epoch": 1167} {"train_loss": -21.833173751831055, "global_step": 96884, "epoch": 1167} {"train_loss": -22.04851531982422, "global_step": 96885, "epoch": 1167} {"train_loss": -21.73211669921875, "global_step": 96886, "epoch": 1167} {"train_loss": -21.791269302368164, "global_step": 96887, "epoch": 1167} {"train_loss": -21.79416275024414, "global_step": 96888, "epoch": 1167} {"train_loss": -21.75461196899414, "global_step": 96889, "epoch": 1167} {"train_loss": -22.065946578979492, "global_step": 96890, "epoch": 1167} {"train_loss": -21.70938491821289, "global_step": 96891, "epoch": 1167} {"train_loss": -21.633726119995117, "global_step": 96892, "epoch": 1167} {"train_loss": -21.742277145385742, "global_step": 96893, "epoch": 1167} {"train_loss": -21.96702003479004, "global_step": 96894, "epoch": 1167} {"train_loss": -21.876384735107422, "global_step": 96895, "epoch": 1167} {"train_loss": -21.995166778564453, "global_step": 96896, "epoch": 1167} {"train_loss": -21.989721298217773, "global_step": 96897, "epoch": 1167} {"train_loss": -21.591238021850586, "global_step": 96898, "epoch": 1167} {"train_loss": -21.791837692260742, "global_step": 96899, "epoch": 1167} {"train_loss": -21.82037925720215, "global_step": 96900, "epoch": 1167} {"train_loss": -21.908605575561523, "global_step": 96901, "epoch": 1167} {"train_loss": -21.53455924987793, "global_step": 96902, "epoch": 1167} {"train_loss": -21.80439567565918, "global_step": 96903, "epoch": 1167} {"train_loss": -21.938886642456055, "global_step": 96904, "epoch": 1167} {"train_loss": -21.8012752532959, "global_step": 96905, "epoch": 1167} {"train_loss": -21.722488403320312, "global_step": 96906, "epoch": 1167} {"train_loss": -21.602767944335938, "global_step": 96907, "epoch": 1167} {"train_loss": -21.882230758666992, "global_step": 96908, "epoch": 1167} {"train_loss": -21.994617462158203, "global_step": 96909, "epoch": 1167} {"train_loss": -21.798023223876953, "global_step": 96910, "epoch": 1167} {"train_loss": -21.973440170288086, "global_step": 96911, "epoch": 1167} {"train_loss": -21.905729293823242, "global_step": 96912, "epoch": 1167} {"train_loss": -21.712055206298828, "global_step": 96913, "epoch": 1167} {"train_loss": -21.8419189453125, "global_step": 96914, "epoch": 1167} {"train_loss": -22.00539207458496, "global_step": 96915, "epoch": 1167} {"train_loss": -21.562618255615234, "global_step": 96916, "epoch": 1167} {"train_loss": -21.77435302734375, "global_step": 96917, "epoch": 1167} {"train_loss": -21.9034366607666, "global_step": 96918, "epoch": 1167} {"train_loss": -21.97211265563965, "global_step": 96919, "epoch": 1167} {"train_loss": -21.92158317565918, "global_step": 96920, "epoch": 1167} {"train_loss": -22.025775909423828, "global_step": 96921, "epoch": 1167} {"train_loss": -21.989337921142578, "global_step": 96922, "epoch": 1167} {"train_loss": -21.919775009155273, "global_step": 96923, "epoch": 1167} {"train_loss": -21.780319213867188, "global_step": 96924, "epoch": 1167} {"train_loss": -22.125442504882812, "global_step": 96925, "epoch": 1167} {"train_loss": -21.691259384155273, "global_step": 96926, "epoch": 1167} {"train_loss": -22.217628479003906, "global_step": 96927, "epoch": 1167} {"train_loss": -21.908367156982422, "global_step": 96928, "epoch": 1167} {"train_loss": -21.458023071289062, "global_step": 96929, "epoch": 1167} {"train_loss": -21.905298233032227, "global_step": 96930, "epoch": 1167} {"train_loss": -21.692384719848633, "global_step": 96931, "epoch": 1167} {"train_loss": -21.7249813079834, "global_step": 96932, "epoch": 1167} {"train_loss": -21.85964584350586, "global_step": 96933, "epoch": 1167} {"train_loss": -21.660152435302734, "global_step": 96934, "epoch": 1167} {"train_loss": -22.110885620117188, "global_step": 96935, "epoch": 1167} {"train_loss": -22.254301071166992, "global_step": 96936, "epoch": 1167} {"train_loss": -21.762592315673828, "global_step": 96937, "epoch": 1167} {"train_loss": -21.61733055114746, "global_step": 96938, "epoch": 1167} {"train_loss": -21.915067672729492, "global_step": 96939, "epoch": 1167} {"train_loss": -21.69221305847168, "global_step": 96940, "epoch": 1167} {"train_loss": -21.73746109008789, "global_step": 96941, "epoch": 1167} {"train_loss": -21.653446197509766, "global_step": 96942, "epoch": 1167} {"train_loss": -21.780981914106622, "global_step": 96943, "epoch": 1167, "val_loss": 6040307.0} {"train_loss": -21.773441314697266, "global_step": 96944, "epoch": 1168} {"train_loss": -21.56253433227539, "global_step": 96945, "epoch": 1168} {"train_loss": -21.193283081054688, "global_step": 96946, "epoch": 1168} {"train_loss": -21.75208854675293, "global_step": 96947, "epoch": 1168} {"train_loss": -21.5889835357666, "global_step": 96948, "epoch": 1168} {"train_loss": -21.373971939086914, "global_step": 96949, "epoch": 1168} {"train_loss": -21.190153121948242, "global_step": 96950, "epoch": 1168} {"train_loss": -21.186460494995117, "global_step": 96951, "epoch": 1168} {"train_loss": -21.532150268554688, "global_step": 96952, "epoch": 1168} {"train_loss": -21.293766021728516, "global_step": 96953, "epoch": 1168} {"train_loss": -21.476694107055664, "global_step": 96954, "epoch": 1168} {"train_loss": -21.419662475585938, "global_step": 96955, "epoch": 1168} {"train_loss": -21.602140426635742, "global_step": 96956, "epoch": 1168} {"train_loss": -21.672834396362305, "global_step": 96957, "epoch": 1168} {"train_loss": -21.456995010375977, "global_step": 96958, "epoch": 1168} {"train_loss": -22.05282211303711, "global_step": 96959, "epoch": 1168} {"train_loss": -21.6407527923584, "global_step": 96960, "epoch": 1168} {"train_loss": -21.924062728881836, "global_step": 96961, "epoch": 1168} {"train_loss": -21.752695083618164, "global_step": 96962, "epoch": 1168} {"train_loss": -21.711271286010742, "global_step": 96963, "epoch": 1168} {"train_loss": -21.825193405151367, "global_step": 96964, "epoch": 1168} {"train_loss": -21.819400787353516, "global_step": 96965, "epoch": 1168} {"train_loss": -21.62598991394043, "global_step": 96966, "epoch": 1168} {"train_loss": -21.888046264648438, "global_step": 96967, "epoch": 1168} {"train_loss": -22.01338005065918, "global_step": 96968, "epoch": 1168} {"train_loss": -21.849956512451172, "global_step": 96969, "epoch": 1168} {"train_loss": -21.791873931884766, "global_step": 96970, "epoch": 1168} {"train_loss": -22.12264060974121, "global_step": 96971, "epoch": 1168} {"train_loss": -21.62636375427246, "global_step": 96972, "epoch": 1168} {"train_loss": -21.45615005493164, "global_step": 96973, "epoch": 1168} {"train_loss": -22.125205993652344, "global_step": 96974, "epoch": 1168} {"train_loss": -21.78960609436035, "global_step": 96975, "epoch": 1168} {"train_loss": -21.469797134399414, "global_step": 96976, "epoch": 1168} {"train_loss": -21.87417221069336, "global_step": 96977, "epoch": 1168} {"train_loss": -22.159862518310547, "global_step": 96978, "epoch": 1168} {"train_loss": -21.73590087890625, "global_step": 96979, "epoch": 1168} {"train_loss": -21.680044174194336, "global_step": 96980, "epoch": 1168} {"train_loss": -21.864553451538086, "global_step": 96981, "epoch": 1168} {"train_loss": -21.82309913635254, "global_step": 96982, "epoch": 1168} {"train_loss": -21.440221786499023, "global_step": 96983, "epoch": 1168} {"train_loss": -21.97319984436035, "global_step": 96984, "epoch": 1168} {"train_loss": -22.092992782592773, "global_step": 96985, "epoch": 1168} {"train_loss": -21.995649337768555, "global_step": 96986, "epoch": 1168} {"train_loss": -21.92598533630371, "global_step": 96987, "epoch": 1168} {"train_loss": -21.9476375579834, "global_step": 96988, "epoch": 1168} {"train_loss": -21.906557083129883, "global_step": 96989, "epoch": 1168} {"train_loss": -21.514596939086914, "global_step": 96990, "epoch": 1168} {"train_loss": -21.784528732299805, "global_step": 96991, "epoch": 1168} {"train_loss": -21.922359466552734, "global_step": 96992, "epoch": 1168} {"train_loss": -21.898366928100586, "global_step": 96993, "epoch": 1168} {"train_loss": -21.964200973510742, "global_step": 96994, "epoch": 1168} {"train_loss": -21.862520217895508, "global_step": 96995, "epoch": 1168} {"train_loss": -21.860233306884766, "global_step": 96996, "epoch": 1168} {"train_loss": -22.22705078125, "global_step": 96997, "epoch": 1168} {"train_loss": -21.851226806640625, "global_step": 96998, "epoch": 1168} {"train_loss": -22.067358016967773, "global_step": 96999, "epoch": 1168} {"train_loss": -21.9494686126709, "global_step": 97000, "epoch": 1168} {"train_loss": -21.959903717041016, "global_step": 97001, "epoch": 1168} {"train_loss": -22.17268943786621, "global_step": 97002, "epoch": 1168} {"train_loss": -21.8203182220459, "global_step": 97003, "epoch": 1168} {"train_loss": -22.072824478149414, "global_step": 97004, "epoch": 1168} {"train_loss": -21.96670150756836, "global_step": 97005, "epoch": 1168} {"train_loss": -21.858640670776367, "global_step": 97006, "epoch": 1168} {"train_loss": -21.822660446166992, "global_step": 97007, "epoch": 1168} {"train_loss": -22.195714950561523, "global_step": 97008, "epoch": 1168} {"train_loss": -21.844043731689453, "global_step": 97009, "epoch": 1168} {"train_loss": -21.782323837280273, "global_step": 97010, "epoch": 1168} {"train_loss": -21.620471954345703, "global_step": 97011, "epoch": 1168} {"train_loss": -21.671663284301758, "global_step": 97012, "epoch": 1168} {"train_loss": -21.962783813476562, "global_step": 97013, "epoch": 1168} {"train_loss": -21.824655532836914, "global_step": 97014, "epoch": 1168} {"train_loss": -21.623132705688477, "global_step": 97015, "epoch": 1168} {"train_loss": -22.056520462036133, "global_step": 97016, "epoch": 1168} {"train_loss": -22.114652633666992, "global_step": 97017, "epoch": 1168} {"train_loss": -21.686561584472656, "global_step": 97018, "epoch": 1168} {"train_loss": -21.979223251342773, "global_step": 97019, "epoch": 1168} {"train_loss": -21.8933048248291, "global_step": 97020, "epoch": 1168} {"train_loss": -21.71101188659668, "global_step": 97021, "epoch": 1168} {"train_loss": -21.782194137573242, "global_step": 97022, "epoch": 1168} {"train_loss": -22.004852294921875, "global_step": 97023, "epoch": 1168} {"train_loss": -22.009170532226562, "global_step": 97024, "epoch": 1168} {"train_loss": -21.781248092651367, "global_step": 97025, "epoch": 1168} {"train_loss": -21.81444487514266, "global_step": 97026, "epoch": 1168, "val_loss": 6021623.0} {"train_loss": -21.32950782775879, "global_step": 97027, "epoch": 1169} {"train_loss": -21.448484420776367, "global_step": 97028, "epoch": 1169} {"train_loss": -21.6361083984375, "global_step": 97029, "epoch": 1169} {"train_loss": -21.94399642944336, "global_step": 97030, "epoch": 1169} {"train_loss": -21.58657455444336, "global_step": 97031, "epoch": 1169} {"train_loss": -21.73842430114746, "global_step": 97032, "epoch": 1169} {"train_loss": -21.630788803100586, "global_step": 97033, "epoch": 1169} {"train_loss": -21.710298538208008, "global_step": 97034, "epoch": 1169} {"train_loss": -21.767236709594727, "global_step": 97035, "epoch": 1169} {"train_loss": -21.95759391784668, "global_step": 97036, "epoch": 1169} {"train_loss": -21.51393699645996, "global_step": 97037, "epoch": 1169} {"train_loss": -21.68716812133789, "global_step": 97038, "epoch": 1169} {"train_loss": -21.921884536743164, "global_step": 97039, "epoch": 1169} {"train_loss": -21.756948471069336, "global_step": 97040, "epoch": 1169} {"train_loss": -21.898160934448242, "global_step": 97041, "epoch": 1169} {"train_loss": -21.9033203125, "global_step": 97042, "epoch": 1169} {"train_loss": -21.498517990112305, "global_step": 97043, "epoch": 1169} {"train_loss": -21.900543212890625, "global_step": 97044, "epoch": 1169} {"train_loss": -21.224130630493164, "global_step": 97045, "epoch": 1169} {"train_loss": -21.779905319213867, "global_step": 97046, "epoch": 1169} {"train_loss": -21.692533493041992, "global_step": 97047, "epoch": 1169} {"train_loss": -21.47892189025879, "global_step": 97048, "epoch": 1169} {"train_loss": -21.68129539489746, "global_step": 97049, "epoch": 1169} {"train_loss": -21.87977409362793, "global_step": 97050, "epoch": 1169} {"train_loss": -21.65447425842285, "global_step": 97051, "epoch": 1169} {"train_loss": -21.672527313232422, "global_step": 97052, "epoch": 1169} {"train_loss": -21.70625114440918, "global_step": 97053, "epoch": 1169} {"train_loss": -21.730627059936523, "global_step": 97054, "epoch": 1169} {"train_loss": -21.807523727416992, "global_step": 97055, "epoch": 1169} {"train_loss": -21.927013397216797, "global_step": 97056, "epoch": 1169} {"train_loss": -22.0600528717041, "global_step": 97057, "epoch": 1169} {"train_loss": -21.702157974243164, "global_step": 97058, "epoch": 1169} {"train_loss": -21.911701202392578, "global_step": 97059, "epoch": 1169} {"train_loss": -22.135377883911133, "global_step": 97060, "epoch": 1169} {"train_loss": -21.842512130737305, "global_step": 97061, "epoch": 1169} {"train_loss": -21.540151596069336, "global_step": 97062, "epoch": 1169} {"train_loss": -21.525110244750977, "global_step": 97063, "epoch": 1169} {"train_loss": -21.819358825683594, "global_step": 97064, "epoch": 1169} {"train_loss": -21.851125717163086, "global_step": 97065, "epoch": 1169} {"train_loss": -21.640287399291992, "global_step": 97066, "epoch": 1169} {"train_loss": -22.00645637512207, "global_step": 97067, "epoch": 1169} {"train_loss": -22.109760284423828, "global_step": 97068, "epoch": 1169} {"train_loss": -22.044635772705078, "global_step": 97069, "epoch": 1169} {"train_loss": -21.926761627197266, "global_step": 97070, "epoch": 1169} {"train_loss": -21.602346420288086, "global_step": 97071, "epoch": 1169} {"train_loss": -21.808073043823242, "global_step": 97072, "epoch": 1169} {"train_loss": -22.02992057800293, "global_step": 97073, "epoch": 1169} {"train_loss": -21.628299713134766, "global_step": 97074, "epoch": 1169} {"train_loss": -22.098926544189453, "global_step": 97075, "epoch": 1169} {"train_loss": -22.39850616455078, "global_step": 97076, "epoch": 1169} {"train_loss": -21.61635398864746, "global_step": 97077, "epoch": 1169} {"train_loss": -21.60670280456543, "global_step": 97078, "epoch": 1169} {"train_loss": -21.62307357788086, "global_step": 97079, "epoch": 1169} {"train_loss": -21.90184783935547, "global_step": 97080, "epoch": 1169} {"train_loss": -22.000391006469727, "global_step": 97081, "epoch": 1169} {"train_loss": -21.877986907958984, "global_step": 97082, "epoch": 1169} {"train_loss": -21.97361946105957, "global_step": 97083, "epoch": 1169} {"train_loss": -22.057586669921875, "global_step": 97084, "epoch": 1169} {"train_loss": -21.597116470336914, "global_step": 97085, "epoch": 1169} {"train_loss": -21.67264175415039, "global_step": 97086, "epoch": 1169} {"train_loss": -21.83376121520996, "global_step": 97087, "epoch": 1169} {"train_loss": -21.792062759399414, "global_step": 97088, "epoch": 1169} {"train_loss": -22.13980484008789, "global_step": 97089, "epoch": 1169} {"train_loss": -21.644590377807617, "global_step": 97090, "epoch": 1169} {"train_loss": -22.092435836791992, "global_step": 97091, "epoch": 1169} {"train_loss": -21.841388702392578, "global_step": 97092, "epoch": 1169} {"train_loss": -22.1975040435791, "global_step": 97093, "epoch": 1169} {"train_loss": -21.990131378173828, "global_step": 97094, "epoch": 1169} {"train_loss": -21.933420181274414, "global_step": 97095, "epoch": 1169} {"train_loss": -21.472597122192383, "global_step": 97096, "epoch": 1169} {"train_loss": -22.086111068725586, "global_step": 97097, "epoch": 1169} {"train_loss": -22.101917266845703, "global_step": 97098, "epoch": 1169} {"train_loss": -22.008190155029297, "global_step": 97099, "epoch": 1169} {"train_loss": -21.67082405090332, "global_step": 97100, "epoch": 1169} {"train_loss": -21.854053497314453, "global_step": 97101, "epoch": 1169} {"train_loss": -22.117156982421875, "global_step": 97102, "epoch": 1169} {"train_loss": -22.053142547607422, "global_step": 97103, "epoch": 1169} {"train_loss": -21.69655418395996, "global_step": 97104, "epoch": 1169} {"train_loss": -21.9986572265625, "global_step": 97105, "epoch": 1169} {"train_loss": -22.0723876953125, "global_step": 97106, "epoch": 1169} {"train_loss": -22.089752197265625, "global_step": 97107, "epoch": 1169} {"train_loss": -21.57999610900879, "global_step": 97108, "epoch": 1169} {"train_loss": -21.814741755106365, "global_step": 97109, "epoch": 1169, "val_loss": 6126649.5} {"train_loss": -21.16947364807129, "global_step": 97110, "epoch": 1170} {"train_loss": -21.049959182739258, "global_step": 97111, "epoch": 1170} {"train_loss": -21.35313606262207, "global_step": 97112, "epoch": 1170} {"train_loss": -21.581602096557617, "global_step": 97113, "epoch": 1170} {"train_loss": -21.269323348999023, "global_step": 97114, "epoch": 1170} {"train_loss": -21.216135025024414, "global_step": 97115, "epoch": 1170} {"train_loss": -21.697647094726562, "global_step": 97116, "epoch": 1170} {"train_loss": -21.4362850189209, "global_step": 97117, "epoch": 1170} {"train_loss": -21.633729934692383, "global_step": 97118, "epoch": 1170} {"train_loss": -21.30014419555664, "global_step": 97119, "epoch": 1170} {"train_loss": -21.53072166442871, "global_step": 97120, "epoch": 1170} {"train_loss": -21.69629669189453, "global_step": 97121, "epoch": 1170} {"train_loss": -21.7085018157959, "global_step": 97122, "epoch": 1170} {"train_loss": -21.459415435791016, "global_step": 97123, "epoch": 1170} {"train_loss": -21.937841415405273, "global_step": 97124, "epoch": 1170} {"train_loss": -21.867277145385742, "global_step": 97125, "epoch": 1170} {"train_loss": -21.520431518554688, "global_step": 97126, "epoch": 1170} {"train_loss": -21.632047653198242, "global_step": 97127, "epoch": 1170} {"train_loss": -21.579299926757812, "global_step": 97128, "epoch": 1170} {"train_loss": -21.977325439453125, "global_step": 97129, "epoch": 1170} {"train_loss": -21.898151397705078, "global_step": 97130, "epoch": 1170} {"train_loss": -21.972515106201172, "global_step": 97131, "epoch": 1170} {"train_loss": -21.415929794311523, "global_step": 97132, "epoch": 1170} {"train_loss": -21.900503158569336, "global_step": 97133, "epoch": 1170} {"train_loss": -21.98673439025879, "global_step": 97134, "epoch": 1170} {"train_loss": -21.378597259521484, "global_step": 97135, "epoch": 1170} {"train_loss": -21.669240951538086, "global_step": 97136, "epoch": 1170} {"train_loss": -21.771589279174805, "global_step": 97137, "epoch": 1170} {"train_loss": -22.176284790039062, "global_step": 97138, "epoch": 1170} {"train_loss": -21.942541122436523, "global_step": 97139, "epoch": 1170} {"train_loss": -22.109317779541016, "global_step": 97140, "epoch": 1170} {"train_loss": -22.029815673828125, "global_step": 97141, "epoch": 1170} {"train_loss": -21.995983123779297, "global_step": 97142, "epoch": 1170} {"train_loss": -22.249975204467773, "global_step": 97143, "epoch": 1170} {"train_loss": -21.90947914123535, "global_step": 97144, "epoch": 1170} {"train_loss": -21.82266616821289, "global_step": 97145, "epoch": 1170} {"train_loss": -22.015304565429688, "global_step": 97146, "epoch": 1170} {"train_loss": -21.923376083374023, "global_step": 97147, "epoch": 1170} {"train_loss": -22.13200569152832, "global_step": 97148, "epoch": 1170} {"train_loss": -22.190608978271484, "global_step": 97149, "epoch": 1170} {"train_loss": -21.526981353759766, "global_step": 97150, "epoch": 1170} {"train_loss": -21.94660186767578, "global_step": 97151, "epoch": 1170} {"train_loss": -21.655715942382812, "global_step": 97152, "epoch": 1170} {"train_loss": -21.847965240478516, "global_step": 97153, "epoch": 1170} {"train_loss": -22.28976821899414, "global_step": 97154, "epoch": 1170} {"train_loss": -21.94379234313965, "global_step": 97155, "epoch": 1170} {"train_loss": -22.214353561401367, "global_step": 97156, "epoch": 1170} {"train_loss": -21.989648818969727, "global_step": 97157, "epoch": 1170} {"train_loss": -21.878488540649414, "global_step": 97158, "epoch": 1170} {"train_loss": -21.92054557800293, "global_step": 97159, "epoch": 1170} {"train_loss": -21.658010482788086, "global_step": 97160, "epoch": 1170} {"train_loss": -21.89745330810547, "global_step": 97161, "epoch": 1170} {"train_loss": -21.581777572631836, "global_step": 97162, "epoch": 1170} {"train_loss": -21.408185958862305, "global_step": 97163, "epoch": 1170} {"train_loss": -21.913074493408203, "global_step": 97164, "epoch": 1170} {"train_loss": -21.53274917602539, "global_step": 97165, "epoch": 1170} {"train_loss": -21.517093658447266, "global_step": 97166, "epoch": 1170} {"train_loss": -21.84498405456543, "global_step": 97167, "epoch": 1170} {"train_loss": -21.493513107299805, "global_step": 97168, "epoch": 1170} {"train_loss": -21.897512435913086, "global_step": 97169, "epoch": 1170} {"train_loss": -21.75941276550293, "global_step": 97170, "epoch": 1170} {"train_loss": -21.977407455444336, "global_step": 97171, "epoch": 1170} {"train_loss": -22.034832000732422, "global_step": 97172, "epoch": 1170} {"train_loss": -21.831363677978516, "global_step": 97173, "epoch": 1170} {"train_loss": -21.582965850830078, "global_step": 97174, "epoch": 1170} {"train_loss": -21.80378532409668, "global_step": 97175, "epoch": 1170} {"train_loss": -21.155683517456055, "global_step": 97176, "epoch": 1170} {"train_loss": -21.5145263671875, "global_step": 97177, "epoch": 1170} {"train_loss": -21.915876388549805, "global_step": 97178, "epoch": 1170} {"train_loss": -21.777809143066406, "global_step": 97179, "epoch": 1170} {"train_loss": -21.64533805847168, "global_step": 97180, "epoch": 1170} {"train_loss": -22.04738426208496, "global_step": 97181, "epoch": 1170} {"train_loss": -21.71526336669922, "global_step": 97182, "epoch": 1170} {"train_loss": -21.748342514038086, "global_step": 97183, "epoch": 1170} {"train_loss": -21.771215438842773, "global_step": 97184, "epoch": 1170} {"train_loss": -21.894704818725586, "global_step": 97185, "epoch": 1170} {"train_loss": -21.776769638061523, "global_step": 97186, "epoch": 1170} {"train_loss": -21.890958786010742, "global_step": 97187, "epoch": 1170} {"train_loss": -21.908550262451172, "global_step": 97188, "epoch": 1170} {"train_loss": -21.871618270874023, "global_step": 97189, "epoch": 1170} {"train_loss": -22.0446834564209, "global_step": 97190, "epoch": 1170} {"train_loss": -21.953380584716797, "global_step": 97191, "epoch": 1170} {"train_loss": -21.760466150490636, "global_step": 97192, "epoch": 1170, "val_loss": 5992013.0} {"train_loss": -21.239965438842773, "global_step": 97193, "epoch": 1171} {"train_loss": -20.909244537353516, "global_step": 97194, "epoch": 1171} {"train_loss": -21.26211166381836, "global_step": 97195, "epoch": 1171} {"train_loss": -21.0335636138916, "global_step": 97196, "epoch": 1171} {"train_loss": -21.510433197021484, "global_step": 97197, "epoch": 1171} {"train_loss": -21.244094848632812, "global_step": 97198, "epoch": 1171} {"train_loss": -21.174427032470703, "global_step": 97199, "epoch": 1171} {"train_loss": -21.47356414794922, "global_step": 97200, "epoch": 1171} {"train_loss": -21.221546173095703, "global_step": 97201, "epoch": 1171} {"train_loss": -21.2268123626709, "global_step": 97202, "epoch": 1171} {"train_loss": -21.25282859802246, "global_step": 97203, "epoch": 1171} {"train_loss": -21.771488189697266, "global_step": 97204, "epoch": 1171} {"train_loss": -21.805261611938477, "global_step": 97205, "epoch": 1171} {"train_loss": -21.797008514404297, "global_step": 97206, "epoch": 1171} {"train_loss": -21.620512008666992, "global_step": 97207, "epoch": 1171} {"train_loss": -21.7695369720459, "global_step": 97208, "epoch": 1171} {"train_loss": -21.440885543823242, "global_step": 97209, "epoch": 1171} {"train_loss": -21.66082191467285, "global_step": 97210, "epoch": 1171} {"train_loss": -21.794452667236328, "global_step": 97211, "epoch": 1171} {"train_loss": -21.296598434448242, "global_step": 97212, "epoch": 1171} {"train_loss": -21.232345581054688, "global_step": 97213, "epoch": 1171} {"train_loss": -22.01812744140625, "global_step": 97214, "epoch": 1171} {"train_loss": -21.720104217529297, "global_step": 97215, "epoch": 1171} {"train_loss": -21.542129516601562, "global_step": 97216, "epoch": 1171} {"train_loss": -21.84287452697754, "global_step": 97217, "epoch": 1171} {"train_loss": -21.641128540039062, "global_step": 97218, "epoch": 1171} {"train_loss": -21.697294235229492, "global_step": 97219, "epoch": 1171} {"train_loss": -22.03276252746582, "global_step": 97220, "epoch": 1171} {"train_loss": -22.074121475219727, "global_step": 97221, "epoch": 1171} {"train_loss": -21.701236724853516, "global_step": 97222, "epoch": 1171} {"train_loss": -21.688339233398438, "global_step": 97223, "epoch": 1171} {"train_loss": -21.803190231323242, "global_step": 97224, "epoch": 1171} {"train_loss": -21.840299606323242, "global_step": 97225, "epoch": 1171} {"train_loss": -21.641460418701172, "global_step": 97226, "epoch": 1171} {"train_loss": -21.58828353881836, "global_step": 97227, "epoch": 1171} {"train_loss": -22.066974639892578, "global_step": 97228, "epoch": 1171} {"train_loss": -21.81012535095215, "global_step": 97229, "epoch": 1171} {"train_loss": -21.69028663635254, "global_step": 97230, "epoch": 1171} {"train_loss": -22.047008514404297, "global_step": 97231, "epoch": 1171} {"train_loss": -21.837162017822266, "global_step": 97232, "epoch": 1171} {"train_loss": -21.51027488708496, "global_step": 97233, "epoch": 1171} {"train_loss": -22.295686721801758, "global_step": 97234, "epoch": 1171} {"train_loss": -21.904338836669922, "global_step": 97235, "epoch": 1171} {"train_loss": -21.666025161743164, "global_step": 97236, "epoch": 1171} {"train_loss": -21.802824020385742, "global_step": 97237, "epoch": 1171} {"train_loss": -22.11264419555664, "global_step": 97238, "epoch": 1171} {"train_loss": -21.96921730041504, "global_step": 97239, "epoch": 1171} {"train_loss": -21.947532653808594, "global_step": 97240, "epoch": 1171} {"train_loss": -21.67817497253418, "global_step": 97241, "epoch": 1171} {"train_loss": -21.833843231201172, "global_step": 97242, "epoch": 1171} {"train_loss": -22.08307456970215, "global_step": 97243, "epoch": 1171} {"train_loss": -21.926328659057617, "global_step": 97244, "epoch": 1171} {"train_loss": -21.970895767211914, "global_step": 97245, "epoch": 1171} {"train_loss": -21.84742546081543, "global_step": 97246, "epoch": 1171} {"train_loss": -21.6263427734375, "global_step": 97247, "epoch": 1171} {"train_loss": -21.81917381286621, "global_step": 97248, "epoch": 1171} {"train_loss": -21.862831115722656, "global_step": 97249, "epoch": 1171} {"train_loss": -21.743682861328125, "global_step": 97250, "epoch": 1171} {"train_loss": -22.123397827148438, "global_step": 97251, "epoch": 1171} {"train_loss": -21.63469886779785, "global_step": 97252, "epoch": 1171} {"train_loss": -22.151920318603516, "global_step": 97253, "epoch": 1171} {"train_loss": -22.04000473022461, "global_step": 97254, "epoch": 1171} {"train_loss": -21.69838523864746, "global_step": 97255, "epoch": 1171} {"train_loss": -21.69904136657715, "global_step": 97256, "epoch": 1171} {"train_loss": -22.1519775390625, "global_step": 97257, "epoch": 1171} {"train_loss": -21.881704330444336, "global_step": 97258, "epoch": 1171} {"train_loss": -21.79730224609375, "global_step": 97259, "epoch": 1171} {"train_loss": -21.891111373901367, "global_step": 97260, "epoch": 1171} {"train_loss": -21.871482849121094, "global_step": 97261, "epoch": 1171} {"train_loss": -21.776142120361328, "global_step": 97262, "epoch": 1171} {"train_loss": -22.062641143798828, "global_step": 97263, "epoch": 1171} {"train_loss": -22.0710391998291, "global_step": 97264, "epoch": 1171} {"train_loss": -21.864452362060547, "global_step": 97265, "epoch": 1171} {"train_loss": -21.930824279785156, "global_step": 97266, "epoch": 1171} {"train_loss": -21.788654327392578, "global_step": 97267, "epoch": 1171} {"train_loss": -21.787891387939453, "global_step": 97268, "epoch": 1171} {"train_loss": -22.2272891998291, "global_step": 97269, "epoch": 1171} {"train_loss": -21.976755142211914, "global_step": 97270, "epoch": 1171} {"train_loss": -21.88433265686035, "global_step": 97271, "epoch": 1171} {"train_loss": -22.140470504760742, "global_step": 97272, "epoch": 1171} {"train_loss": -21.929553985595703, "global_step": 97273, "epoch": 1171} {"train_loss": -21.851686477661133, "global_step": 97274, "epoch": 1171} {"train_loss": -21.760948525853905, "global_step": 97275, "epoch": 1171, "val_loss": 6188275.0} {"train_loss": -21.200592041015625, "global_step": 97276, "epoch": 1172} {"train_loss": -21.14373016357422, "global_step": 97277, "epoch": 1172} {"train_loss": -21.37700080871582, "global_step": 97278, "epoch": 1172} {"train_loss": -21.335346221923828, "global_step": 97279, "epoch": 1172} {"train_loss": -21.86391830444336, "global_step": 97280, "epoch": 1172} {"train_loss": -21.40760040283203, "global_step": 97281, "epoch": 1172} {"train_loss": -21.868942260742188, "global_step": 97282, "epoch": 1172} {"train_loss": -21.690378189086914, "global_step": 97283, "epoch": 1172} {"train_loss": -21.35426902770996, "global_step": 97284, "epoch": 1172} {"train_loss": -21.758024215698242, "global_step": 97285, "epoch": 1172} {"train_loss": -21.517009735107422, "global_step": 97286, "epoch": 1172} {"train_loss": -21.545347213745117, "global_step": 97287, "epoch": 1172} {"train_loss": -21.8275089263916, "global_step": 97288, "epoch": 1172} {"train_loss": -21.549585342407227, "global_step": 97289, "epoch": 1172} {"train_loss": -21.846899032592773, "global_step": 97290, "epoch": 1172} {"train_loss": -22.05156135559082, "global_step": 97291, "epoch": 1172} {"train_loss": -21.398855209350586, "global_step": 97292, "epoch": 1172} {"train_loss": -22.074295043945312, "global_step": 97293, "epoch": 1172} {"train_loss": -21.777271270751953, "global_step": 97294, "epoch": 1172} {"train_loss": -21.784914016723633, "global_step": 97295, "epoch": 1172} {"train_loss": -21.746124267578125, "global_step": 97296, "epoch": 1172} {"train_loss": -21.652677536010742, "global_step": 97297, "epoch": 1172} {"train_loss": -21.51224136352539, "global_step": 97298, "epoch": 1172} {"train_loss": -21.505970001220703, "global_step": 97299, "epoch": 1172} {"train_loss": -21.929044723510742, "global_step": 97300, "epoch": 1172} {"train_loss": -21.91849708557129, "global_step": 97301, "epoch": 1172} {"train_loss": -22.1180362701416, "global_step": 97302, "epoch": 1172} {"train_loss": -21.77099609375, "global_step": 97303, "epoch": 1172} {"train_loss": -21.720487594604492, "global_step": 97304, "epoch": 1172} {"train_loss": -21.79376792907715, "global_step": 97305, "epoch": 1172} {"train_loss": -21.301374435424805, "global_step": 97306, "epoch": 1172} {"train_loss": -21.999799728393555, "global_step": 97307, "epoch": 1172} {"train_loss": -21.750150680541992, "global_step": 97308, "epoch": 1172} {"train_loss": -21.699228286743164, "global_step": 97309, "epoch": 1172} {"train_loss": -22.0064754486084, "global_step": 97310, "epoch": 1172} {"train_loss": -21.441917419433594, "global_step": 97311, "epoch": 1172} {"train_loss": -21.958139419555664, "global_step": 97312, "epoch": 1172} {"train_loss": -21.6655216217041, "global_step": 97313, "epoch": 1172} {"train_loss": -21.816543579101562, "global_step": 97314, "epoch": 1172} {"train_loss": -22.30716323852539, "global_step": 97315, "epoch": 1172} {"train_loss": -21.502351760864258, "global_step": 97316, "epoch": 1172} {"train_loss": -22.12034797668457, "global_step": 97317, "epoch": 1172} {"train_loss": -21.5534725189209, "global_step": 97318, "epoch": 1172} {"train_loss": -21.435253143310547, "global_step": 97319, "epoch": 1172} {"train_loss": -21.250577926635742, "global_step": 97320, "epoch": 1172} {"train_loss": -21.575223922729492, "global_step": 97321, "epoch": 1172} {"train_loss": -22.030385971069336, "global_step": 97322, "epoch": 1172} {"train_loss": -21.636350631713867, "global_step": 97323, "epoch": 1172} {"train_loss": -21.625675201416016, "global_step": 97324, "epoch": 1172} {"train_loss": -22.127920150756836, "global_step": 97325, "epoch": 1172} {"train_loss": -21.9194278717041, "global_step": 97326, "epoch": 1172} {"train_loss": -21.852603912353516, "global_step": 97327, "epoch": 1172} {"train_loss": -21.944875717163086, "global_step": 97328, "epoch": 1172} {"train_loss": -21.764497756958008, "global_step": 97329, "epoch": 1172} {"train_loss": -21.975446701049805, "global_step": 97330, "epoch": 1172} {"train_loss": -21.628070831298828, "global_step": 97331, "epoch": 1172} {"train_loss": -22.018526077270508, "global_step": 97332, "epoch": 1172} {"train_loss": -21.81230926513672, "global_step": 97333, "epoch": 1172} {"train_loss": -21.780439376831055, "global_step": 97334, "epoch": 1172} {"train_loss": -21.879100799560547, "global_step": 97335, "epoch": 1172} {"train_loss": -22.07299041748047, "global_step": 97336, "epoch": 1172} {"train_loss": -22.011611938476562, "global_step": 97337, "epoch": 1172} {"train_loss": -21.759891510009766, "global_step": 97338, "epoch": 1172} {"train_loss": -22.035308837890625, "global_step": 97339, "epoch": 1172} {"train_loss": -22.002851486206055, "global_step": 97340, "epoch": 1172} {"train_loss": -21.782068252563477, "global_step": 97341, "epoch": 1172} {"train_loss": -21.770401000976562, "global_step": 97342, "epoch": 1172} {"train_loss": -21.46040916442871, "global_step": 97343, "epoch": 1172} {"train_loss": -21.951623916625977, "global_step": 97344, "epoch": 1172} {"train_loss": -21.75819206237793, "global_step": 97345, "epoch": 1172} {"train_loss": -21.94129753112793, "global_step": 97346, "epoch": 1172} {"train_loss": -21.876239776611328, "global_step": 97347, "epoch": 1172} {"train_loss": -21.93245506286621, "global_step": 97348, "epoch": 1172} {"train_loss": -21.80805206298828, "global_step": 97349, "epoch": 1172} {"train_loss": -21.75208854675293, "global_step": 97350, "epoch": 1172} {"train_loss": -21.7614688873291, "global_step": 97351, "epoch": 1172} {"train_loss": -22.014169692993164, "global_step": 97352, "epoch": 1172} {"train_loss": -21.885520935058594, "global_step": 97353, "epoch": 1172} {"train_loss": -21.741724014282227, "global_step": 97354, "epoch": 1172} {"train_loss": -22.10654640197754, "global_step": 97355, "epoch": 1172} {"train_loss": -21.738309860229492, "global_step": 97356, "epoch": 1172} {"train_loss": -21.960437774658203, "global_step": 97357, "epoch": 1172} {"train_loss": -21.767242086939063, "global_step": 97358, "epoch": 1172, "val_loss": 6183630.0} {"train_loss": -21.47587013244629, "global_step": 97359, "epoch": 1173} {"train_loss": -21.355947494506836, "global_step": 97360, "epoch": 1173} {"train_loss": -21.555496215820312, "global_step": 97361, "epoch": 1173} {"train_loss": -21.486125946044922, "global_step": 97362, "epoch": 1173} {"train_loss": -21.916906356811523, "global_step": 97363, "epoch": 1173} {"train_loss": -21.24282455444336, "global_step": 97364, "epoch": 1173} {"train_loss": -21.64347267150879, "global_step": 97365, "epoch": 1173} {"train_loss": -21.72214126586914, "global_step": 97366, "epoch": 1173} {"train_loss": -21.90479850769043, "global_step": 97367, "epoch": 1173} {"train_loss": -21.364831924438477, "global_step": 97368, "epoch": 1173} {"train_loss": -21.666580200195312, "global_step": 97369, "epoch": 1173} {"train_loss": -21.632741928100586, "global_step": 97370, "epoch": 1173} {"train_loss": -21.698476791381836, "global_step": 97371, "epoch": 1173} {"train_loss": -21.620532989501953, "global_step": 97372, "epoch": 1173} {"train_loss": -21.55619239807129, "global_step": 97373, "epoch": 1173} {"train_loss": -21.496593475341797, "global_step": 97374, "epoch": 1173} {"train_loss": -21.443870544433594, "global_step": 97375, "epoch": 1173} {"train_loss": -21.836902618408203, "global_step": 97376, "epoch": 1173} {"train_loss": -21.82210922241211, "global_step": 97377, "epoch": 1173} {"train_loss": -21.4555721282959, "global_step": 97378, "epoch": 1173} {"train_loss": -22.032169342041016, "global_step": 97379, "epoch": 1173} {"train_loss": -21.953718185424805, "global_step": 97380, "epoch": 1173} {"train_loss": -21.58353042602539, "global_step": 97381, "epoch": 1173} {"train_loss": -21.80860710144043, "global_step": 97382, "epoch": 1173} {"train_loss": -22.13837242126465, "global_step": 97383, "epoch": 1173} {"train_loss": -21.808671951293945, "global_step": 97384, "epoch": 1173} {"train_loss": -21.789813995361328, "global_step": 97385, "epoch": 1173} {"train_loss": -21.810239791870117, "global_step": 97386, "epoch": 1173} {"train_loss": -22.156450271606445, "global_step": 97387, "epoch": 1173} {"train_loss": -21.740747451782227, "global_step": 97388, "epoch": 1173} {"train_loss": -22.156286239624023, "global_step": 97389, "epoch": 1173} {"train_loss": -21.46237564086914, "global_step": 97390, "epoch": 1173} {"train_loss": -21.99452018737793, "global_step": 97391, "epoch": 1173} {"train_loss": -21.610916137695312, "global_step": 97392, "epoch": 1173} {"train_loss": -21.93321418762207, "global_step": 97393, "epoch": 1173} {"train_loss": -22.093276977539062, "global_step": 97394, "epoch": 1173} {"train_loss": -21.840909957885742, "global_step": 97395, "epoch": 1173} {"train_loss": -21.584671020507812, "global_step": 97396, "epoch": 1173} {"train_loss": -21.533294677734375, "global_step": 97397, "epoch": 1173} {"train_loss": -21.952518463134766, "global_step": 97398, "epoch": 1173} {"train_loss": -21.85342788696289, "global_step": 97399, "epoch": 1173} {"train_loss": -21.701292037963867, "global_step": 97400, "epoch": 1173} {"train_loss": -21.935850143432617, "global_step": 97401, "epoch": 1173} {"train_loss": -22.165800094604492, "global_step": 97402, "epoch": 1173} {"train_loss": -22.089923858642578, "global_step": 97403, "epoch": 1173} {"train_loss": -21.9639949798584, "global_step": 97404, "epoch": 1173} {"train_loss": -21.83582878112793, "global_step": 97405, "epoch": 1173} {"train_loss": -22.060468673706055, "global_step": 97406, "epoch": 1173} {"train_loss": -21.37517547607422, "global_step": 97407, "epoch": 1173} {"train_loss": -21.793588638305664, "global_step": 97408, "epoch": 1173} {"train_loss": -22.180307388305664, "global_step": 97409, "epoch": 1173} {"train_loss": -22.097997665405273, "global_step": 97410, "epoch": 1173} {"train_loss": -21.640090942382812, "global_step": 97411, "epoch": 1173} {"train_loss": -21.70102310180664, "global_step": 97412, "epoch": 1173} {"train_loss": -21.521215438842773, "global_step": 97413, "epoch": 1173} {"train_loss": -21.850372314453125, "global_step": 97414, "epoch": 1173} {"train_loss": -21.38258934020996, "global_step": 97415, "epoch": 1173} {"train_loss": -21.791807174682617, "global_step": 97416, "epoch": 1173} {"train_loss": -21.894121170043945, "global_step": 97417, "epoch": 1173} {"train_loss": -21.94608497619629, "global_step": 97418, "epoch": 1173} {"train_loss": -22.29802894592285, "global_step": 97419, "epoch": 1173} {"train_loss": -21.854026794433594, "global_step": 97420, "epoch": 1173} {"train_loss": -22.00876808166504, "global_step": 97421, "epoch": 1173} {"train_loss": -21.891433715820312, "global_step": 97422, "epoch": 1173} {"train_loss": -21.955158233642578, "global_step": 97423, "epoch": 1173} {"train_loss": -22.023725509643555, "global_step": 97424, "epoch": 1173} {"train_loss": -22.14957618713379, "global_step": 97425, "epoch": 1173} {"train_loss": -21.788679122924805, "global_step": 97426, "epoch": 1173} {"train_loss": -21.806699752807617, "global_step": 97427, "epoch": 1173} {"train_loss": -21.757184982299805, "global_step": 97428, "epoch": 1173} {"train_loss": -21.660097122192383, "global_step": 97429, "epoch": 1173} {"train_loss": -21.81341552734375, "global_step": 97430, "epoch": 1173} {"train_loss": -21.645740509033203, "global_step": 97431, "epoch": 1173} {"train_loss": -22.098876953125, "global_step": 97432, "epoch": 1173} {"train_loss": -21.874914169311523, "global_step": 97433, "epoch": 1173} {"train_loss": -21.785808563232422, "global_step": 97434, "epoch": 1173} {"train_loss": -22.23990821838379, "global_step": 97435, "epoch": 1173} {"train_loss": -21.581697463989258, "global_step": 97436, "epoch": 1173} {"train_loss": -21.903453826904297, "global_step": 97437, "epoch": 1173} {"train_loss": -21.92296028137207, "global_step": 97438, "epoch": 1173} {"train_loss": -21.915393829345703, "global_step": 97439, "epoch": 1173} {"train_loss": -22.174896240234375, "global_step": 97440, "epoch": 1173} {"train_loss": -21.801253514117505, "global_step": 97441, "epoch": 1173, "val_loss": 6211693.5} {"train_loss": -22.099628448486328, "global_step": 97442, "epoch": 1174} {"train_loss": -21.723556518554688, "global_step": 97443, "epoch": 1174} {"train_loss": -22.199460983276367, "global_step": 97444, "epoch": 1174} {"train_loss": -21.82167625427246, "global_step": 97445, "epoch": 1174} {"train_loss": -21.8713321685791, "global_step": 97446, "epoch": 1174} {"train_loss": -21.588088989257812, "global_step": 97447, "epoch": 1174} {"train_loss": -21.816530227661133, "global_step": 97448, "epoch": 1174} {"train_loss": -21.443939208984375, "global_step": 97449, "epoch": 1174} {"train_loss": -21.51736831665039, "global_step": 97450, "epoch": 1174} {"train_loss": -21.958141326904297, "global_step": 97451, "epoch": 1174} {"train_loss": -21.69023895263672, "global_step": 97452, "epoch": 1174} {"train_loss": -21.755361557006836, "global_step": 97453, "epoch": 1174} {"train_loss": -21.169828414916992, "global_step": 97454, "epoch": 1174} {"train_loss": -22.14052391052246, "global_step": 97455, "epoch": 1174} {"train_loss": -22.201475143432617, "global_step": 97456, "epoch": 1174} {"train_loss": -21.685747146606445, "global_step": 97457, "epoch": 1174} {"train_loss": -21.753931045532227, "global_step": 97458, "epoch": 1174} {"train_loss": -21.752792358398438, "global_step": 97459, "epoch": 1174} {"train_loss": -21.498289108276367, "global_step": 97460, "epoch": 1174} {"train_loss": -21.770063400268555, "global_step": 97461, "epoch": 1174} {"train_loss": -22.277877807617188, "global_step": 97462, "epoch": 1174} {"train_loss": -21.902997970581055, "global_step": 97463, "epoch": 1174} {"train_loss": -21.612607955932617, "global_step": 97464, "epoch": 1174} {"train_loss": -21.755361557006836, "global_step": 97465, "epoch": 1174} {"train_loss": -21.96964454650879, "global_step": 97466, "epoch": 1174} {"train_loss": -22.15266990661621, "global_step": 97467, "epoch": 1174} {"train_loss": -22.103994369506836, "global_step": 97468, "epoch": 1174} {"train_loss": -21.919021606445312, "global_step": 97469, "epoch": 1174} {"train_loss": -21.90496253967285, "global_step": 97470, "epoch": 1174} {"train_loss": -21.56217384338379, "global_step": 97471, "epoch": 1174} {"train_loss": -21.99124526977539, "global_step": 97472, "epoch": 1174} {"train_loss": -21.872976303100586, "global_step": 97473, "epoch": 1174} {"train_loss": -21.918516159057617, "global_step": 97474, "epoch": 1174} {"train_loss": -21.74029541015625, "global_step": 97475, "epoch": 1174} {"train_loss": -21.880651473999023, "global_step": 97476, "epoch": 1174} {"train_loss": -21.704641342163086, "global_step": 97477, "epoch": 1174} {"train_loss": -22.036651611328125, "global_step": 97478, "epoch": 1174} {"train_loss": -21.94774055480957, "global_step": 97479, "epoch": 1174} {"train_loss": -21.77130699157715, "global_step": 97480, "epoch": 1174} {"train_loss": -22.085208892822266, "global_step": 97481, "epoch": 1174} {"train_loss": -21.686796188354492, "global_step": 97482, "epoch": 1174} {"train_loss": -22.102445602416992, "global_step": 97483, "epoch": 1174} {"train_loss": -21.877483367919922, "global_step": 97484, "epoch": 1174} {"train_loss": -21.37476348876953, "global_step": 97485, "epoch": 1174} {"train_loss": -21.7547550201416, "global_step": 97486, "epoch": 1174} {"train_loss": -21.86981773376465, "global_step": 97487, "epoch": 1174} {"train_loss": -21.506031036376953, "global_step": 97488, "epoch": 1174} {"train_loss": -22.257728576660156, "global_step": 97489, "epoch": 1174} {"train_loss": -21.700565338134766, "global_step": 97490, "epoch": 1174} {"train_loss": -21.700031280517578, "global_step": 97491, "epoch": 1174} {"train_loss": -22.112808227539062, "global_step": 97492, "epoch": 1174} {"train_loss": -22.043622970581055, "global_step": 97493, "epoch": 1174} {"train_loss": -22.10491180419922, "global_step": 97494, "epoch": 1174} {"train_loss": -21.549131393432617, "global_step": 97495, "epoch": 1174} {"train_loss": -21.727903366088867, "global_step": 97496, "epoch": 1174} {"train_loss": -21.828866958618164, "global_step": 97497, "epoch": 1174} {"train_loss": -21.752845764160156, "global_step": 97498, "epoch": 1174} {"train_loss": -21.87129020690918, "global_step": 97499, "epoch": 1174} {"train_loss": -21.894611358642578, "global_step": 97500, "epoch": 1174} {"train_loss": -21.865020751953125, "global_step": 97501, "epoch": 1174} {"train_loss": -21.756153106689453, "global_step": 97502, "epoch": 1174} {"train_loss": -22.29115867614746, "global_step": 97503, "epoch": 1174} {"train_loss": -21.960304260253906, "global_step": 97504, "epoch": 1174} {"train_loss": -22.063871383666992, "global_step": 97505, "epoch": 1174} {"train_loss": -21.851015090942383, "global_step": 97506, "epoch": 1174} {"train_loss": -22.067411422729492, "global_step": 97507, "epoch": 1174} {"train_loss": -21.702823638916016, "global_step": 97508, "epoch": 1174} {"train_loss": -21.620746612548828, "global_step": 97509, "epoch": 1174} {"train_loss": -21.809873580932617, "global_step": 97510, "epoch": 1174} {"train_loss": -21.834014892578125, "global_step": 97511, "epoch": 1174} {"train_loss": -22.058744430541992, "global_step": 97512, "epoch": 1174} {"train_loss": -21.764867782592773, "global_step": 97513, "epoch": 1174} {"train_loss": -21.95073127746582, "global_step": 97514, "epoch": 1174} {"train_loss": -21.94676971435547, "global_step": 97515, "epoch": 1174} {"train_loss": -22.056554794311523, "global_step": 97516, "epoch": 1174} {"train_loss": -21.9473819732666, "global_step": 97517, "epoch": 1174} {"train_loss": -21.98957633972168, "global_step": 97518, "epoch": 1174} {"train_loss": -22.071842193603516, "global_step": 97519, "epoch": 1174} {"train_loss": -21.733078002929688, "global_step": 97520, "epoch": 1174} {"train_loss": -21.743179321289062, "global_step": 97521, "epoch": 1174} {"train_loss": -21.55799674987793, "global_step": 97522, "epoch": 1174} {"train_loss": -22.213293075561523, "global_step": 97523, "epoch": 1174} {"train_loss": -21.85869141084602, "global_step": 97524, "epoch": 1174, "val_loss": 6025802.0} {"train_loss": -21.2106990814209, "global_step": 97525, "epoch": 1175} {"train_loss": -21.104394912719727, "global_step": 97526, "epoch": 1175} {"train_loss": -21.399921417236328, "global_step": 97527, "epoch": 1175} {"train_loss": -20.812910079956055, "global_step": 97528, "epoch": 1175} {"train_loss": -21.470186233520508, "global_step": 97529, "epoch": 1175} {"train_loss": -21.45705223083496, "global_step": 97530, "epoch": 1175} {"train_loss": -21.5649471282959, "global_step": 97531, "epoch": 1175} {"train_loss": -21.67110252380371, "global_step": 97532, "epoch": 1175} {"train_loss": -21.375131607055664, "global_step": 97533, "epoch": 1175} {"train_loss": -21.677522659301758, "global_step": 97534, "epoch": 1175} {"train_loss": -21.524274826049805, "global_step": 97535, "epoch": 1175} {"train_loss": -21.745412826538086, "global_step": 97536, "epoch": 1175} {"train_loss": -21.897876739501953, "global_step": 97537, "epoch": 1175} {"train_loss": -21.57649040222168, "global_step": 97538, "epoch": 1175} {"train_loss": -21.66749382019043, "global_step": 97539, "epoch": 1175} {"train_loss": -21.43881607055664, "global_step": 97540, "epoch": 1175} {"train_loss": -22.04257583618164, "global_step": 97541, "epoch": 1175} {"train_loss": -21.580495834350586, "global_step": 97542, "epoch": 1175} {"train_loss": -21.829919815063477, "global_step": 97543, "epoch": 1175} {"train_loss": -22.021713256835938, "global_step": 97544, "epoch": 1175} {"train_loss": -21.294422149658203, "global_step": 97545, "epoch": 1175} {"train_loss": -21.66221046447754, "global_step": 97546, "epoch": 1175} {"train_loss": -21.528329849243164, "global_step": 97547, "epoch": 1175} {"train_loss": -21.7905216217041, "global_step": 97548, "epoch": 1175} {"train_loss": -21.70186424255371, "global_step": 97549, "epoch": 1175} {"train_loss": -21.76462745666504, "global_step": 97550, "epoch": 1175} {"train_loss": -21.717893600463867, "global_step": 97551, "epoch": 1175} {"train_loss": -21.678699493408203, "global_step": 97552, "epoch": 1175} {"train_loss": -21.80580711364746, "global_step": 97553, "epoch": 1175} {"train_loss": -21.872825622558594, "global_step": 97554, "epoch": 1175} {"train_loss": -21.553041458129883, "global_step": 97555, "epoch": 1175} {"train_loss": -22.006834030151367, "global_step": 97556, "epoch": 1175} {"train_loss": -21.72393035888672, "global_step": 97557, "epoch": 1175} {"train_loss": -21.937681198120117, "global_step": 97558, "epoch": 1175} {"train_loss": -22.1700496673584, "global_step": 97559, "epoch": 1175} {"train_loss": -21.860965728759766, "global_step": 97560, "epoch": 1175} {"train_loss": -21.692331314086914, "global_step": 97561, "epoch": 1175} {"train_loss": -22.142946243286133, "global_step": 97562, "epoch": 1175} {"train_loss": -21.78352928161621, "global_step": 97563, "epoch": 1175} {"train_loss": -21.94628143310547, "global_step": 97564, "epoch": 1175} {"train_loss": -21.99551010131836, "global_step": 97565, "epoch": 1175} {"train_loss": -21.656206130981445, "global_step": 97566, "epoch": 1175} {"train_loss": -21.81187629699707, "global_step": 97567, "epoch": 1175} {"train_loss": -21.777475357055664, "global_step": 97568, "epoch": 1175} {"train_loss": -21.754789352416992, "global_step": 97569, "epoch": 1175} {"train_loss": -21.886220932006836, "global_step": 97570, "epoch": 1175} {"train_loss": -21.817129135131836, "global_step": 97571, "epoch": 1175} {"train_loss": -22.0781307220459, "global_step": 97572, "epoch": 1175} {"train_loss": -21.856948852539062, "global_step": 97573, "epoch": 1175} {"train_loss": -22.037473678588867, "global_step": 97574, "epoch": 1175} {"train_loss": -21.940641403198242, "global_step": 97575, "epoch": 1175} {"train_loss": -22.215818405151367, "global_step": 97576, "epoch": 1175} {"train_loss": -21.628646850585938, "global_step": 97577, "epoch": 1175} {"train_loss": -21.977094650268555, "global_step": 97578, "epoch": 1175} {"train_loss": -21.97928237915039, "global_step": 97579, "epoch": 1175} {"train_loss": -22.074909210205078, "global_step": 97580, "epoch": 1175} {"train_loss": -21.899250030517578, "global_step": 97581, "epoch": 1175} {"train_loss": -22.219999313354492, "global_step": 97582, "epoch": 1175} {"train_loss": -21.73176383972168, "global_step": 97583, "epoch": 1175} {"train_loss": -22.091970443725586, "global_step": 97584, "epoch": 1175} {"train_loss": -22.16185188293457, "global_step": 97585, "epoch": 1175} {"train_loss": -22.110759735107422, "global_step": 97586, "epoch": 1175} {"train_loss": -21.9778995513916, "global_step": 97587, "epoch": 1175} {"train_loss": -21.868499755859375, "global_step": 97588, "epoch": 1175} {"train_loss": -22.19685173034668, "global_step": 97589, "epoch": 1175} {"train_loss": -22.446395874023438, "global_step": 97590, "epoch": 1175} {"train_loss": -21.904911041259766, "global_step": 97591, "epoch": 1175} {"train_loss": -21.953210830688477, "global_step": 97592, "epoch": 1175} {"train_loss": -21.888839721679688, "global_step": 97593, "epoch": 1175} {"train_loss": -21.779043197631836, "global_step": 97594, "epoch": 1175} {"train_loss": -21.674732208251953, "global_step": 97595, "epoch": 1175} {"train_loss": -21.807191848754883, "global_step": 97596, "epoch": 1175} {"train_loss": -21.915740966796875, "global_step": 97597, "epoch": 1175} {"train_loss": -22.09773063659668, "global_step": 97598, "epoch": 1175} {"train_loss": -21.55615234375, "global_step": 97599, "epoch": 1175} {"train_loss": -21.755252838134766, "global_step": 97600, "epoch": 1175} {"train_loss": -21.961166381835938, "global_step": 97601, "epoch": 1175} {"train_loss": -21.619749069213867, "global_step": 97602, "epoch": 1175} {"train_loss": -21.808422088623047, "global_step": 97603, "epoch": 1175} {"train_loss": -21.926868438720703, "global_step": 97604, "epoch": 1175} {"train_loss": -22.212451934814453, "global_step": 97605, "epoch": 1175} {"train_loss": -22.064666748046875, "global_step": 97606, "epoch": 1175} {"train_loss": -21.79096713698054, "global_step": 97607, "epoch": 1175, "val_loss": 6141508.5} {"train_loss": -21.1970272064209, "global_step": 97608, "epoch": 1176} {"train_loss": -21.637258529663086, "global_step": 97609, "epoch": 1176} {"train_loss": -21.729440689086914, "global_step": 97610, "epoch": 1176} {"train_loss": -20.975875854492188, "global_step": 97611, "epoch": 1176} {"train_loss": -21.7000732421875, "global_step": 97612, "epoch": 1176} {"train_loss": -21.996551513671875, "global_step": 97613, "epoch": 1176} {"train_loss": -21.9161376953125, "global_step": 97614, "epoch": 1176} {"train_loss": -22.098594665527344, "global_step": 97615, "epoch": 1176} {"train_loss": -21.80244255065918, "global_step": 97616, "epoch": 1176} {"train_loss": -21.639629364013672, "global_step": 97617, "epoch": 1176} {"train_loss": -21.748600006103516, "global_step": 97618, "epoch": 1176} {"train_loss": -21.7991943359375, "global_step": 97619, "epoch": 1176} {"train_loss": -21.982959747314453, "global_step": 97620, "epoch": 1176} {"train_loss": -21.83794593811035, "global_step": 97621, "epoch": 1176} {"train_loss": -22.012042999267578, "global_step": 97622, "epoch": 1176} {"train_loss": -22.17072105407715, "global_step": 97623, "epoch": 1176} {"train_loss": -21.68846321105957, "global_step": 97624, "epoch": 1176} {"train_loss": -21.943517684936523, "global_step": 97625, "epoch": 1176} {"train_loss": -21.74033546447754, "global_step": 97626, "epoch": 1176} {"train_loss": -21.620620727539062, "global_step": 97627, "epoch": 1176} {"train_loss": -21.876083374023438, "global_step": 97628, "epoch": 1176} {"train_loss": -21.700519561767578, "global_step": 97629, "epoch": 1176} {"train_loss": -22.091217041015625, "global_step": 97630, "epoch": 1176} {"train_loss": -21.727941513061523, "global_step": 97631, "epoch": 1176} {"train_loss": -21.876602172851562, "global_step": 97632, "epoch": 1176} {"train_loss": -21.588504791259766, "global_step": 97633, "epoch": 1176} {"train_loss": -21.68354606628418, "global_step": 97634, "epoch": 1176} {"train_loss": -22.293344497680664, "global_step": 97635, "epoch": 1176} {"train_loss": -21.476200103759766, "global_step": 97636, "epoch": 1176} {"train_loss": -21.781230926513672, "global_step": 97637, "epoch": 1176} {"train_loss": -22.15052032470703, "global_step": 97638, "epoch": 1176} {"train_loss": -21.79432487487793, "global_step": 97639, "epoch": 1176} {"train_loss": -22.10039710998535, "global_step": 97640, "epoch": 1176} {"train_loss": -21.84445571899414, "global_step": 97641, "epoch": 1176} {"train_loss": -21.638364791870117, "global_step": 97642, "epoch": 1176} {"train_loss": -21.854679107666016, "global_step": 97643, "epoch": 1176} {"train_loss": -22.069765090942383, "global_step": 97644, "epoch": 1176} {"train_loss": -22.01741600036621, "global_step": 97645, "epoch": 1176} {"train_loss": -22.345285415649414, "global_step": 97646, "epoch": 1176} {"train_loss": -21.694982528686523, "global_step": 97647, "epoch": 1176} {"train_loss": -21.714984893798828, "global_step": 97648, "epoch": 1176} {"train_loss": -21.98955535888672, "global_step": 97649, "epoch": 1176} {"train_loss": -21.677499771118164, "global_step": 97650, "epoch": 1176} {"train_loss": -21.755512237548828, "global_step": 97651, "epoch": 1176} {"train_loss": -21.906057357788086, "global_step": 97652, "epoch": 1176} {"train_loss": -21.865615844726562, "global_step": 97653, "epoch": 1176} {"train_loss": -21.817777633666992, "global_step": 97654, "epoch": 1176} {"train_loss": -21.88265609741211, "global_step": 97655, "epoch": 1176} {"train_loss": -21.683258056640625, "global_step": 97656, "epoch": 1176} {"train_loss": -21.812131881713867, "global_step": 97657, "epoch": 1176} {"train_loss": -22.129779815673828, "global_step": 97658, "epoch": 1176} {"train_loss": -21.603164672851562, "global_step": 97659, "epoch": 1176} {"train_loss": -21.873422622680664, "global_step": 97660, "epoch": 1176} {"train_loss": -21.847427368164062, "global_step": 97661, "epoch": 1176} {"train_loss": -21.858829498291016, "global_step": 97662, "epoch": 1176} {"train_loss": -22.03594207763672, "global_step": 97663, "epoch": 1176} {"train_loss": -21.7929744720459, "global_step": 97664, "epoch": 1176} {"train_loss": -21.749088287353516, "global_step": 97665, "epoch": 1176} {"train_loss": -22.007902145385742, "global_step": 97666, "epoch": 1176} {"train_loss": -21.63764762878418, "global_step": 97667, "epoch": 1176} {"train_loss": -21.753889083862305, "global_step": 97668, "epoch": 1176} {"train_loss": -21.8741397857666, "global_step": 97669, "epoch": 1176} {"train_loss": -21.898151397705078, "global_step": 97670, "epoch": 1176} {"train_loss": -21.795392990112305, "global_step": 97671, "epoch": 1176} {"train_loss": -22.223440170288086, "global_step": 97672, "epoch": 1176} {"train_loss": -22.182743072509766, "global_step": 97673, "epoch": 1176} {"train_loss": -21.75812339782715, "global_step": 97674, "epoch": 1176} {"train_loss": -21.564165115356445, "global_step": 97675, "epoch": 1176} {"train_loss": -21.874027252197266, "global_step": 97676, "epoch": 1176} {"train_loss": -21.72989273071289, "global_step": 97677, "epoch": 1176} {"train_loss": -21.267520904541016, "global_step": 97678, "epoch": 1176} {"train_loss": -22.136722564697266, "global_step": 97679, "epoch": 1176} {"train_loss": -21.54807472229004, "global_step": 97680, "epoch": 1176} {"train_loss": -22.078899383544922, "global_step": 97681, "epoch": 1176} {"train_loss": -21.512540817260742, "global_step": 97682, "epoch": 1176} {"train_loss": -21.75748634338379, "global_step": 97683, "epoch": 1176} {"train_loss": -22.013662338256836, "global_step": 97684, "epoch": 1176} {"train_loss": -22.049936294555664, "global_step": 97685, "epoch": 1176} {"train_loss": -21.748945236206055, "global_step": 97686, "epoch": 1176} {"train_loss": -21.48256492614746, "global_step": 97687, "epoch": 1176} {"train_loss": -21.713151931762695, "global_step": 97688, "epoch": 1176} {"train_loss": -21.92136573791504, "global_step": 97689, "epoch": 1176} {"train_loss": -21.82457997425493, "global_step": 97690, "epoch": 1176, "val_loss": 6158723.0} {"train_loss": -21.639402389526367, "global_step": 97691, "epoch": 1177} {"train_loss": -21.662626266479492, "global_step": 97692, "epoch": 1177} {"train_loss": -21.617549896240234, "global_step": 97693, "epoch": 1177} {"train_loss": -22.132339477539062, "global_step": 97694, "epoch": 1177} {"train_loss": -21.901527404785156, "global_step": 97695, "epoch": 1177} {"train_loss": -21.969894409179688, "global_step": 97696, "epoch": 1177} {"train_loss": -21.83314323425293, "global_step": 97697, "epoch": 1177} {"train_loss": -21.832788467407227, "global_step": 97698, "epoch": 1177} {"train_loss": -21.46804428100586, "global_step": 97699, "epoch": 1177} {"train_loss": -21.68988609313965, "global_step": 97700, "epoch": 1177} {"train_loss": -21.8624324798584, "global_step": 97701, "epoch": 1177} {"train_loss": -21.66977310180664, "global_step": 97702, "epoch": 1177} {"train_loss": -21.865530014038086, "global_step": 97703, "epoch": 1177} {"train_loss": -21.903270721435547, "global_step": 97704, "epoch": 1177} {"train_loss": -21.571365356445312, "global_step": 97705, "epoch": 1177} {"train_loss": -21.865570068359375, "global_step": 97706, "epoch": 1177} {"train_loss": -22.037870407104492, "global_step": 97707, "epoch": 1177} {"train_loss": -21.61847686767578, "global_step": 97708, "epoch": 1177} {"train_loss": -21.668901443481445, "global_step": 97709, "epoch": 1177} {"train_loss": -21.85230255126953, "global_step": 97710, "epoch": 1177} {"train_loss": -21.930631637573242, "global_step": 97711, "epoch": 1177} {"train_loss": -21.974599838256836, "global_step": 97712, "epoch": 1177} {"train_loss": -21.963119506835938, "global_step": 97713, "epoch": 1177} {"train_loss": -21.717138290405273, "global_step": 97714, "epoch": 1177} {"train_loss": -22.040788650512695, "global_step": 97715, "epoch": 1177} {"train_loss": -22.306554794311523, "global_step": 97716, "epoch": 1177} {"train_loss": -21.785505294799805, "global_step": 97717, "epoch": 1177} {"train_loss": -21.781673431396484, "global_step": 97718, "epoch": 1177} {"train_loss": -21.948129653930664, "global_step": 97719, "epoch": 1177} {"train_loss": -21.511707305908203, "global_step": 97720, "epoch": 1177} {"train_loss": -21.90672492980957, "global_step": 97721, "epoch": 1177} {"train_loss": -21.828275680541992, "global_step": 97722, "epoch": 1177} {"train_loss": -21.29439353942871, "global_step": 97723, "epoch": 1177} {"train_loss": -21.77370262145996, "global_step": 97724, "epoch": 1177} {"train_loss": -21.80044937133789, "global_step": 97725, "epoch": 1177} {"train_loss": -21.790924072265625, "global_step": 97726, "epoch": 1177} {"train_loss": -22.040586471557617, "global_step": 97727, "epoch": 1177} {"train_loss": -21.541841506958008, "global_step": 97728, "epoch": 1177} {"train_loss": -21.763652801513672, "global_step": 97729, "epoch": 1177} {"train_loss": -21.41239356994629, "global_step": 97730, "epoch": 1177} {"train_loss": -21.836904525756836, "global_step": 97731, "epoch": 1177} {"train_loss": -21.52176856994629, "global_step": 97732, "epoch": 1177} {"train_loss": -21.55278968811035, "global_step": 97733, "epoch": 1177} {"train_loss": -21.922481536865234, "global_step": 97734, "epoch": 1177} {"train_loss": -21.929723739624023, "global_step": 97735, "epoch": 1177} {"train_loss": -21.906240463256836, "global_step": 97736, "epoch": 1177} {"train_loss": -21.871665954589844, "global_step": 97737, "epoch": 1177} {"train_loss": -22.013919830322266, "global_step": 97738, "epoch": 1177} {"train_loss": -21.752628326416016, "global_step": 97739, "epoch": 1177} {"train_loss": -21.809720993041992, "global_step": 97740, "epoch": 1177} {"train_loss": -21.985370635986328, "global_step": 97741, "epoch": 1177} {"train_loss": -21.626317977905273, "global_step": 97742, "epoch": 1177} {"train_loss": -21.941232681274414, "global_step": 97743, "epoch": 1177} {"train_loss": -21.913818359375, "global_step": 97744, "epoch": 1177} {"train_loss": -21.658233642578125, "global_step": 97745, "epoch": 1177} {"train_loss": -21.7656307220459, "global_step": 97746, "epoch": 1177} {"train_loss": -21.87774658203125, "global_step": 97747, "epoch": 1177} {"train_loss": -22.09504508972168, "global_step": 97748, "epoch": 1177} {"train_loss": -22.063005447387695, "global_step": 97749, "epoch": 1177} {"train_loss": -22.395614624023438, "global_step": 97750, "epoch": 1177} {"train_loss": -22.045804977416992, "global_step": 97751, "epoch": 1177} {"train_loss": -22.00032615661621, "global_step": 97752, "epoch": 1177} {"train_loss": -21.67911148071289, "global_step": 97753, "epoch": 1177} {"train_loss": -22.454666137695312, "global_step": 97754, "epoch": 1177} {"train_loss": -22.38163948059082, "global_step": 97755, "epoch": 1177} {"train_loss": -21.776418685913086, "global_step": 97756, "epoch": 1177} {"train_loss": -21.9836368560791, "global_step": 97757, "epoch": 1177} {"train_loss": -21.6992130279541, "global_step": 97758, "epoch": 1177} {"train_loss": -21.845033645629883, "global_step": 97759, "epoch": 1177} {"train_loss": -22.078031539916992, "global_step": 97760, "epoch": 1177} {"train_loss": -21.87811851501465, "global_step": 97761, "epoch": 1177} {"train_loss": -21.505603790283203, "global_step": 97762, "epoch": 1177} {"train_loss": -22.034698486328125, "global_step": 97763, "epoch": 1177} {"train_loss": -22.2094783782959, "global_step": 97764, "epoch": 1177} {"train_loss": -21.614152908325195, "global_step": 97765, "epoch": 1177} {"train_loss": -21.70577049255371, "global_step": 97766, "epoch": 1177} {"train_loss": -21.84619903564453, "global_step": 97767, "epoch": 1177} {"train_loss": -21.769733428955078, "global_step": 97768, "epoch": 1177} {"train_loss": -21.8488826751709, "global_step": 97769, "epoch": 1177} {"train_loss": -21.849349975585938, "global_step": 97770, "epoch": 1177} {"train_loss": -21.804664611816406, "global_step": 97771, "epoch": 1177} {"train_loss": -22.081579208374023, "global_step": 97772, "epoch": 1177} {"train_loss": -21.836742079401592, "global_step": 97773, "epoch": 1177, "val_loss": 6082038.5} {"train_loss": -21.578645706176758, "global_step": 97774, "epoch": 1178} {"train_loss": -21.323362350463867, "global_step": 97775, "epoch": 1178} {"train_loss": -21.405637741088867, "global_step": 97776, "epoch": 1178} {"train_loss": -20.941286087036133, "global_step": 97777, "epoch": 1178} {"train_loss": -21.28644371032715, "global_step": 97778, "epoch": 1178} {"train_loss": -21.282583236694336, "global_step": 97779, "epoch": 1178} {"train_loss": -21.548582077026367, "global_step": 97780, "epoch": 1178} {"train_loss": -21.641942977905273, "global_step": 97781, "epoch": 1178} {"train_loss": -21.248371124267578, "global_step": 97782, "epoch": 1178} {"train_loss": -21.71345329284668, "global_step": 97783, "epoch": 1178} {"train_loss": -21.242895126342773, "global_step": 97784, "epoch": 1178} {"train_loss": -21.681156158447266, "global_step": 97785, "epoch": 1178} {"train_loss": -21.417478561401367, "global_step": 97786, "epoch": 1178} {"train_loss": -21.41763687133789, "global_step": 97787, "epoch": 1178} {"train_loss": -21.92023277282715, "global_step": 97788, "epoch": 1178} {"train_loss": -21.482946395874023, "global_step": 97789, "epoch": 1178} {"train_loss": -21.490053176879883, "global_step": 97790, "epoch": 1178} {"train_loss": -21.90390396118164, "global_step": 97791, "epoch": 1178} {"train_loss": -21.234338760375977, "global_step": 97792, "epoch": 1178} {"train_loss": -21.61629295349121, "global_step": 97793, "epoch": 1178} {"train_loss": -21.792430877685547, "global_step": 97794, "epoch": 1178} {"train_loss": -21.767868041992188, "global_step": 97795, "epoch": 1178} {"train_loss": -21.70639419555664, "global_step": 97796, "epoch": 1178} {"train_loss": -21.924854278564453, "global_step": 97797, "epoch": 1178} {"train_loss": -21.57561492919922, "global_step": 97798, "epoch": 1178} {"train_loss": -21.60237693786621, "global_step": 97799, "epoch": 1178} {"train_loss": -21.420974731445312, "global_step": 97800, "epoch": 1178} {"train_loss": -21.386144638061523, "global_step": 97801, "epoch": 1178} {"train_loss": -21.725229263305664, "global_step": 97802, "epoch": 1178} {"train_loss": -21.636032104492188, "global_step": 97803, "epoch": 1178} {"train_loss": -21.703659057617188, "global_step": 97804, "epoch": 1178} {"train_loss": -21.625717163085938, "global_step": 97805, "epoch": 1178} {"train_loss": -22.086265563964844, "global_step": 97806, "epoch": 1178} {"train_loss": -21.523500442504883, "global_step": 97807, "epoch": 1178} {"train_loss": -21.870372772216797, "global_step": 97808, "epoch": 1178} {"train_loss": -22.0880069732666, "global_step": 97809, "epoch": 1178} {"train_loss": -21.54188346862793, "global_step": 97810, "epoch": 1178} {"train_loss": -21.872833251953125, "global_step": 97811, "epoch": 1178} {"train_loss": -21.81776237487793, "global_step": 97812, "epoch": 1178} {"train_loss": -21.661090850830078, "global_step": 97813, "epoch": 1178} {"train_loss": -22.394428253173828, "global_step": 97814, "epoch": 1178} {"train_loss": -21.91145133972168, "global_step": 97815, "epoch": 1178} {"train_loss": -22.039203643798828, "global_step": 97816, "epoch": 1178} {"train_loss": -21.588394165039062, "global_step": 97817, "epoch": 1178} {"train_loss": -21.732744216918945, "global_step": 97818, "epoch": 1178} {"train_loss": -21.9421329498291, "global_step": 97819, "epoch": 1178} {"train_loss": -21.686254501342773, "global_step": 97820, "epoch": 1178} {"train_loss": -21.491397857666016, "global_step": 97821, "epoch": 1178} {"train_loss": -22.049169540405273, "global_step": 97822, "epoch": 1178} {"train_loss": -21.974620819091797, "global_step": 97823, "epoch": 1178} {"train_loss": -22.27975845336914, "global_step": 97824, "epoch": 1178} {"train_loss": -21.422494888305664, "global_step": 97825, "epoch": 1178} {"train_loss": -21.802690505981445, "global_step": 97826, "epoch": 1178} {"train_loss": -21.949445724487305, "global_step": 97827, "epoch": 1178} {"train_loss": -22.010498046875, "global_step": 97828, "epoch": 1178} {"train_loss": -21.64266014099121, "global_step": 97829, "epoch": 1178} {"train_loss": -22.114107131958008, "global_step": 97830, "epoch": 1178} {"train_loss": -21.579092025756836, "global_step": 97831, "epoch": 1178} {"train_loss": -22.155288696289062, "global_step": 97832, "epoch": 1178} {"train_loss": -21.94355010986328, "global_step": 97833, "epoch": 1178} {"train_loss": -21.80000114440918, "global_step": 97834, "epoch": 1178} {"train_loss": -21.578744888305664, "global_step": 97835, "epoch": 1178} {"train_loss": -21.616552352905273, "global_step": 97836, "epoch": 1178} {"train_loss": -22.0875186920166, "global_step": 97837, "epoch": 1178} {"train_loss": -21.776029586791992, "global_step": 97838, "epoch": 1178} {"train_loss": -22.14313507080078, "global_step": 97839, "epoch": 1178} {"train_loss": -21.9372615814209, "global_step": 97840, "epoch": 1178} {"train_loss": -21.574987411499023, "global_step": 97841, "epoch": 1178} {"train_loss": -21.39838981628418, "global_step": 97842, "epoch": 1178} {"train_loss": -21.638202667236328, "global_step": 97843, "epoch": 1178} {"train_loss": -21.503236770629883, "global_step": 97844, "epoch": 1178} {"train_loss": -21.703739166259766, "global_step": 97845, "epoch": 1178} {"train_loss": -21.9788761138916, "global_step": 97846, "epoch": 1178} {"train_loss": -21.867042541503906, "global_step": 97847, "epoch": 1178} {"train_loss": -21.785167694091797, "global_step": 97848, "epoch": 1178} {"train_loss": -22.179458618164062, "global_step": 97849, "epoch": 1178} {"train_loss": -21.959693908691406, "global_step": 97850, "epoch": 1178} {"train_loss": -22.1103458404541, "global_step": 97851, "epoch": 1178} {"train_loss": -21.729251861572266, "global_step": 97852, "epoch": 1178} {"train_loss": -22.059173583984375, "global_step": 97853, "epoch": 1178} {"train_loss": -21.922910690307617, "global_step": 97854, "epoch": 1178} {"train_loss": -21.709625244140625, "global_step": 97855, "epoch": 1178} {"train_loss": -21.73351002888507, "global_step": 97856, "epoch": 1178, "val_loss": 6079257.0} {"train_loss": -21.466594696044922, "global_step": 97857, "epoch": 1179} {"train_loss": -21.354293823242188, "global_step": 97858, "epoch": 1179} {"train_loss": -21.657928466796875, "global_step": 97859, "epoch": 1179} {"train_loss": -21.721084594726562, "global_step": 97860, "epoch": 1179} {"train_loss": -21.9245548248291, "global_step": 97861, "epoch": 1179} {"train_loss": -21.548288345336914, "global_step": 97862, "epoch": 1179} {"train_loss": -21.797582626342773, "global_step": 97863, "epoch": 1179} {"train_loss": -21.526742935180664, "global_step": 97864, "epoch": 1179} {"train_loss": -22.146371841430664, "global_step": 97865, "epoch": 1179} {"train_loss": -21.5284366607666, "global_step": 97866, "epoch": 1179} {"train_loss": -21.624530792236328, "global_step": 97867, "epoch": 1179} {"train_loss": -21.72772216796875, "global_step": 97868, "epoch": 1179} {"train_loss": -21.713699340820312, "global_step": 97869, "epoch": 1179} {"train_loss": -21.813501358032227, "global_step": 97870, "epoch": 1179} {"train_loss": -21.692970275878906, "global_step": 97871, "epoch": 1179} {"train_loss": -21.60420799255371, "global_step": 97872, "epoch": 1179} {"train_loss": -21.525333404541016, "global_step": 97873, "epoch": 1179} {"train_loss": -21.562618255615234, "global_step": 97874, "epoch": 1179} {"train_loss": -21.64711570739746, "global_step": 97875, "epoch": 1179} {"train_loss": -21.675745010375977, "global_step": 97876, "epoch": 1179} {"train_loss": -21.879179000854492, "global_step": 97877, "epoch": 1179} {"train_loss": -21.516836166381836, "global_step": 97878, "epoch": 1179} {"train_loss": -21.74184799194336, "global_step": 97879, "epoch": 1179} {"train_loss": -21.90890884399414, "global_step": 97880, "epoch": 1179} {"train_loss": -21.773048400878906, "global_step": 97881, "epoch": 1179} {"train_loss": -22.05280303955078, "global_step": 97882, "epoch": 1179} {"train_loss": -22.124723434448242, "global_step": 97883, "epoch": 1179} {"train_loss": -21.937820434570312, "global_step": 97884, "epoch": 1179} {"train_loss": -21.637100219726562, "global_step": 97885, "epoch": 1179} {"train_loss": -21.44593620300293, "global_step": 97886, "epoch": 1179} {"train_loss": -22.038806915283203, "global_step": 97887, "epoch": 1179} {"train_loss": -21.73457145690918, "global_step": 97888, "epoch": 1179} {"train_loss": -21.721500396728516, "global_step": 97889, "epoch": 1179} {"train_loss": -21.712799072265625, "global_step": 97890, "epoch": 1179} {"train_loss": -21.586328506469727, "global_step": 97891, "epoch": 1179} {"train_loss": -22.143491744995117, "global_step": 97892, "epoch": 1179} {"train_loss": -21.491554260253906, "global_step": 97893, "epoch": 1179} {"train_loss": -22.002925872802734, "global_step": 97894, "epoch": 1179} {"train_loss": -21.844356536865234, "global_step": 97895, "epoch": 1179} {"train_loss": -21.811594009399414, "global_step": 97896, "epoch": 1179} {"train_loss": -21.481855392456055, "global_step": 97897, "epoch": 1179} {"train_loss": -21.898117065429688, "global_step": 97898, "epoch": 1179} {"train_loss": -21.737560272216797, "global_step": 97899, "epoch": 1179} {"train_loss": -22.143064498901367, "global_step": 97900, "epoch": 1179} {"train_loss": -21.873258590698242, "global_step": 97901, "epoch": 1179} {"train_loss": -21.88270378112793, "global_step": 97902, "epoch": 1179} {"train_loss": -21.907150268554688, "global_step": 97903, "epoch": 1179} {"train_loss": -22.030454635620117, "global_step": 97904, "epoch": 1179} {"train_loss": -21.774288177490234, "global_step": 97905, "epoch": 1179} {"train_loss": -21.863422393798828, "global_step": 97906, "epoch": 1179} {"train_loss": -22.231033325195312, "global_step": 97907, "epoch": 1179} {"train_loss": -21.911376953125, "global_step": 97908, "epoch": 1179} {"train_loss": -21.021162033081055, "global_step": 97909, "epoch": 1179} {"train_loss": -21.669815063476562, "global_step": 97910, "epoch": 1179} {"train_loss": -21.700483322143555, "global_step": 97911, "epoch": 1179} {"train_loss": -21.79315757751465, "global_step": 97912, "epoch": 1179} {"train_loss": -21.788227081298828, "global_step": 97913, "epoch": 1179} {"train_loss": -21.854984283447266, "global_step": 97914, "epoch": 1179} {"train_loss": -21.7738094329834, "global_step": 97915, "epoch": 1179} {"train_loss": -21.818883895874023, "global_step": 97916, "epoch": 1179} {"train_loss": -21.858762741088867, "global_step": 97917, "epoch": 1179} {"train_loss": -21.66410255432129, "global_step": 97918, "epoch": 1179} {"train_loss": -21.453027725219727, "global_step": 97919, "epoch": 1179} {"train_loss": -21.760833740234375, "global_step": 97920, "epoch": 1179} {"train_loss": -21.559431076049805, "global_step": 97921, "epoch": 1179} {"train_loss": -21.868215560913086, "global_step": 97922, "epoch": 1179} {"train_loss": -21.764917373657227, "global_step": 97923, "epoch": 1179} {"train_loss": -21.703737258911133, "global_step": 97924, "epoch": 1179} {"train_loss": -22.181781768798828, "global_step": 97925, "epoch": 1179} {"train_loss": -21.718595504760742, "global_step": 97926, "epoch": 1179} {"train_loss": -22.30886459350586, "global_step": 97927, "epoch": 1179} {"train_loss": -21.885135650634766, "global_step": 97928, "epoch": 1179} {"train_loss": -22.05170249938965, "global_step": 97929, "epoch": 1179} {"train_loss": -21.87672996520996, "global_step": 97930, "epoch": 1179} {"train_loss": -21.717575073242188, "global_step": 97931, "epoch": 1179} {"train_loss": -21.656803131103516, "global_step": 97932, "epoch": 1179} {"train_loss": -22.470537185668945, "global_step": 97933, "epoch": 1179} {"train_loss": -21.84480094909668, "global_step": 97934, "epoch": 1179} {"train_loss": -21.876420974731445, "global_step": 97935, "epoch": 1179} {"train_loss": -21.54457664489746, "global_step": 97936, "epoch": 1179} {"train_loss": -22.230321884155273, "global_step": 97937, "epoch": 1179} {"train_loss": -21.885696411132812, "global_step": 97938, "epoch": 1179} {"train_loss": -21.786356339971704, "global_step": 97939, "epoch": 1179, "val_loss": 6285058.0} {"train_loss": -21.303958892822266, "global_step": 97940, "epoch": 1180} {"train_loss": -21.825176239013672, "global_step": 97941, "epoch": 1180} {"train_loss": -21.42116355895996, "global_step": 97942, "epoch": 1180} {"train_loss": -21.507549285888672, "global_step": 97943, "epoch": 1180} {"train_loss": -21.479393005371094, "global_step": 97944, "epoch": 1180} {"train_loss": -21.502254486083984, "global_step": 97945, "epoch": 1180} {"train_loss": -21.49234390258789, "global_step": 97946, "epoch": 1180} {"train_loss": -21.65384292602539, "global_step": 97947, "epoch": 1180} {"train_loss": -21.3521728515625, "global_step": 97948, "epoch": 1180} {"train_loss": -21.61502456665039, "global_step": 97949, "epoch": 1180} {"train_loss": -21.50143051147461, "global_step": 97950, "epoch": 1180} {"train_loss": -21.19380760192871, "global_step": 97951, "epoch": 1180} {"train_loss": -21.611547470092773, "global_step": 97952, "epoch": 1180} {"train_loss": -21.650232315063477, "global_step": 97953, "epoch": 1180} {"train_loss": -21.186420440673828, "global_step": 97954, "epoch": 1180} {"train_loss": -21.63566017150879, "global_step": 97955, "epoch": 1180} {"train_loss": -21.500221252441406, "global_step": 97956, "epoch": 1180} {"train_loss": -21.999826431274414, "global_step": 97957, "epoch": 1180} {"train_loss": -21.342208862304688, "global_step": 97958, "epoch": 1180} {"train_loss": -21.830007553100586, "global_step": 97959, "epoch": 1180} {"train_loss": -22.264570236206055, "global_step": 97960, "epoch": 1180} {"train_loss": -21.490873336791992, "global_step": 97961, "epoch": 1180} {"train_loss": -21.75632095336914, "global_step": 97962, "epoch": 1180} {"train_loss": -21.625747680664062, "global_step": 97963, "epoch": 1180} {"train_loss": -21.63138198852539, "global_step": 97964, "epoch": 1180} {"train_loss": -22.119840621948242, "global_step": 97965, "epoch": 1180} {"train_loss": -21.74374771118164, "global_step": 97966, "epoch": 1180} {"train_loss": -22.103830337524414, "global_step": 97967, "epoch": 1180} {"train_loss": -22.25777244567871, "global_step": 97968, "epoch": 1180} {"train_loss": -21.873260498046875, "global_step": 97969, "epoch": 1180} {"train_loss": -22.16883659362793, "global_step": 97970, "epoch": 1180} {"train_loss": -21.948728561401367, "global_step": 97971, "epoch": 1180} {"train_loss": -22.057886123657227, "global_step": 97972, "epoch": 1180} {"train_loss": -21.85240936279297, "global_step": 97973, "epoch": 1180} {"train_loss": -21.754608154296875, "global_step": 97974, "epoch": 1180} {"train_loss": -21.9334716796875, "global_step": 97975, "epoch": 1180} {"train_loss": -21.788820266723633, "global_step": 97976, "epoch": 1180} {"train_loss": -21.83490562438965, "global_step": 97977, "epoch": 1180} {"train_loss": -22.097253799438477, "global_step": 97978, "epoch": 1180} {"train_loss": -21.873865127563477, "global_step": 97979, "epoch": 1180} {"train_loss": -21.95867347717285, "global_step": 97980, "epoch": 1180} {"train_loss": -21.697153091430664, "global_step": 97981, "epoch": 1180} {"train_loss": -21.87677764892578, "global_step": 97982, "epoch": 1180} {"train_loss": -22.15866470336914, "global_step": 97983, "epoch": 1180} {"train_loss": -22.0726318359375, "global_step": 97984, "epoch": 1180} {"train_loss": -21.546098709106445, "global_step": 97985, "epoch": 1180} {"train_loss": -21.974750518798828, "global_step": 97986, "epoch": 1180} {"train_loss": -21.672977447509766, "global_step": 97987, "epoch": 1180} {"train_loss": -21.527114868164062, "global_step": 97988, "epoch": 1180} {"train_loss": -21.926651000976562, "global_step": 97989, "epoch": 1180} {"train_loss": -21.705045700073242, "global_step": 97990, "epoch": 1180} {"train_loss": -21.951698303222656, "global_step": 97991, "epoch": 1180} {"train_loss": -21.44624900817871, "global_step": 97992, "epoch": 1180} {"train_loss": -21.539201736450195, "global_step": 97993, "epoch": 1180} {"train_loss": -21.72071647644043, "global_step": 97994, "epoch": 1180} {"train_loss": -21.746225357055664, "global_step": 97995, "epoch": 1180} {"train_loss": -22.273563385009766, "global_step": 97996, "epoch": 1180} {"train_loss": -21.626333236694336, "global_step": 97997, "epoch": 1180} {"train_loss": -21.888105392456055, "global_step": 97998, "epoch": 1180} {"train_loss": -21.691850662231445, "global_step": 97999, "epoch": 1180} {"train_loss": -21.849599838256836, "global_step": 98000, "epoch": 1180} {"train_loss": -22.061405181884766, "global_step": 98001, "epoch": 1180} {"train_loss": -22.20045280456543, "global_step": 98002, "epoch": 1180} {"train_loss": -21.54622459411621, "global_step": 98003, "epoch": 1180} {"train_loss": -22.110876083374023, "global_step": 98004, "epoch": 1180} {"train_loss": -21.850011825561523, "global_step": 98005, "epoch": 1180} {"train_loss": -21.917503356933594, "global_step": 98006, "epoch": 1180} {"train_loss": -21.60906410217285, "global_step": 98007, "epoch": 1180} {"train_loss": -21.388654708862305, "global_step": 98008, "epoch": 1180} {"train_loss": -22.03169059753418, "global_step": 98009, "epoch": 1180} {"train_loss": -21.85784339904785, "global_step": 98010, "epoch": 1180} {"train_loss": -21.793066024780273, "global_step": 98011, "epoch": 1180} {"train_loss": -21.98587417602539, "global_step": 98012, "epoch": 1180} {"train_loss": -21.850128173828125, "global_step": 98013, "epoch": 1180} {"train_loss": -21.67826271057129, "global_step": 98014, "epoch": 1180} {"train_loss": -22.1038875579834, "global_step": 98015, "epoch": 1180} {"train_loss": -21.897905349731445, "global_step": 98016, "epoch": 1180} {"train_loss": -21.911725997924805, "global_step": 98017, "epoch": 1180} {"train_loss": -21.778573989868164, "global_step": 98018, "epoch": 1180} {"train_loss": -22.032699584960938, "global_step": 98019, "epoch": 1180} {"train_loss": -21.93805503845215, "global_step": 98020, "epoch": 1180} {"train_loss": -22.044330596923828, "global_step": 98021, "epoch": 1180} {"train_loss": -21.794580896216704, "global_step": 98022, "epoch": 1180, "val_loss": 5973390.5} {"train_loss": -21.365800857543945, "global_step": 98023, "epoch": 1181} {"train_loss": -21.75989532470703, "global_step": 98024, "epoch": 1181} {"train_loss": -21.794450759887695, "global_step": 98025, "epoch": 1181} {"train_loss": -21.528478622436523, "global_step": 98026, "epoch": 1181} {"train_loss": -21.515380859375, "global_step": 98027, "epoch": 1181} {"train_loss": -21.362579345703125, "global_step": 98028, "epoch": 1181} {"train_loss": -21.9298095703125, "global_step": 98029, "epoch": 1181} {"train_loss": -21.649240493774414, "global_step": 98030, "epoch": 1181} {"train_loss": -21.878101348876953, "global_step": 98031, "epoch": 1181} {"train_loss": -21.749258041381836, "global_step": 98032, "epoch": 1181} {"train_loss": -21.573183059692383, "global_step": 98033, "epoch": 1181} {"train_loss": -21.545745849609375, "global_step": 98034, "epoch": 1181} {"train_loss": -21.912446975708008, "global_step": 98035, "epoch": 1181} {"train_loss": -21.655691146850586, "global_step": 98036, "epoch": 1181} {"train_loss": -22.018787384033203, "global_step": 98037, "epoch": 1181} {"train_loss": -21.595434188842773, "global_step": 98038, "epoch": 1181} {"train_loss": -21.799665451049805, "global_step": 98039, "epoch": 1181} {"train_loss": -21.801301956176758, "global_step": 98040, "epoch": 1181} {"train_loss": -21.638532638549805, "global_step": 98041, "epoch": 1181} {"train_loss": -21.780410766601562, "global_step": 98042, "epoch": 1181} {"train_loss": -22.04607391357422, "global_step": 98043, "epoch": 1181} {"train_loss": -21.941884994506836, "global_step": 98044, "epoch": 1181} {"train_loss": -21.838977813720703, "global_step": 98045, "epoch": 1181} {"train_loss": -21.92958641052246, "global_step": 98046, "epoch": 1181} {"train_loss": -21.3875789642334, "global_step": 98047, "epoch": 1181} {"train_loss": -21.73023796081543, "global_step": 98048, "epoch": 1181} {"train_loss": -21.928546905517578, "global_step": 98049, "epoch": 1181} {"train_loss": -21.395254135131836, "global_step": 98050, "epoch": 1181} {"train_loss": -21.90301513671875, "global_step": 98051, "epoch": 1181} {"train_loss": -21.475391387939453, "global_step": 98052, "epoch": 1181} {"train_loss": -21.765623092651367, "global_step": 98053, "epoch": 1181} {"train_loss": -21.65758514404297, "global_step": 98054, "epoch": 1181} {"train_loss": -21.630990982055664, "global_step": 98055, "epoch": 1181} {"train_loss": -21.729154586791992, "global_step": 98056, "epoch": 1181} {"train_loss": -21.787445068359375, "global_step": 98057, "epoch": 1181} {"train_loss": -22.11301040649414, "global_step": 98058, "epoch": 1181} {"train_loss": -21.51905632019043, "global_step": 98059, "epoch": 1181} {"train_loss": -21.909765243530273, "global_step": 98060, "epoch": 1181} {"train_loss": -21.865781784057617, "global_step": 98061, "epoch": 1181} {"train_loss": -21.700927734375, "global_step": 98062, "epoch": 1181} {"train_loss": -21.37978744506836, "global_step": 98063, "epoch": 1181} {"train_loss": -21.699052810668945, "global_step": 98064, "epoch": 1181} {"train_loss": -22.151466369628906, "global_step": 98065, "epoch": 1181} {"train_loss": -22.116031646728516, "global_step": 98066, "epoch": 1181} {"train_loss": -21.638275146484375, "global_step": 98067, "epoch": 1181} {"train_loss": -21.487869262695312, "global_step": 98068, "epoch": 1181} {"train_loss": -21.77541732788086, "global_step": 98069, "epoch": 1181} {"train_loss": -21.951007843017578, "global_step": 98070, "epoch": 1181} {"train_loss": -21.93360710144043, "global_step": 98071, "epoch": 1181} {"train_loss": -22.013792037963867, "global_step": 98072, "epoch": 1181} {"train_loss": -22.13937759399414, "global_step": 98073, "epoch": 1181} {"train_loss": -21.839616775512695, "global_step": 98074, "epoch": 1181} {"train_loss": -21.8223819732666, "global_step": 98075, "epoch": 1181} {"train_loss": -21.451961517333984, "global_step": 98076, "epoch": 1181} {"train_loss": -21.729463577270508, "global_step": 98077, "epoch": 1181} {"train_loss": -22.036060333251953, "global_step": 98078, "epoch": 1181} {"train_loss": -21.682043075561523, "global_step": 98079, "epoch": 1181} {"train_loss": -22.082822799682617, "global_step": 98080, "epoch": 1181} {"train_loss": -21.794389724731445, "global_step": 98081, "epoch": 1181} {"train_loss": -21.657217025756836, "global_step": 98082, "epoch": 1181} {"train_loss": -21.991300582885742, "global_step": 98083, "epoch": 1181} {"train_loss": -21.92042350769043, "global_step": 98084, "epoch": 1181} {"train_loss": -22.250192642211914, "global_step": 98085, "epoch": 1181} {"train_loss": -21.932058334350586, "global_step": 98086, "epoch": 1181} {"train_loss": -21.844282150268555, "global_step": 98087, "epoch": 1181} {"train_loss": -22.003612518310547, "global_step": 98088, "epoch": 1181} {"train_loss": -21.68307876586914, "global_step": 98089, "epoch": 1181} {"train_loss": -22.025455474853516, "global_step": 98090, "epoch": 1181} {"train_loss": -21.4730224609375, "global_step": 98091, "epoch": 1181} {"train_loss": -21.733596801757812, "global_step": 98092, "epoch": 1181} {"train_loss": -22.333234786987305, "global_step": 98093, "epoch": 1181} {"train_loss": -22.018217086791992, "global_step": 98094, "epoch": 1181} {"train_loss": -22.161725997924805, "global_step": 98095, "epoch": 1181} {"train_loss": -22.02341079711914, "global_step": 98096, "epoch": 1181} {"train_loss": -21.85483169555664, "global_step": 98097, "epoch": 1181} {"train_loss": -21.826534271240234, "global_step": 98098, "epoch": 1181} {"train_loss": -21.715070724487305, "global_step": 98099, "epoch": 1181} {"train_loss": -21.881689071655273, "global_step": 98100, "epoch": 1181} {"train_loss": -21.72885513305664, "global_step": 98101, "epoch": 1181} {"train_loss": -21.854290008544922, "global_step": 98102, "epoch": 1181} {"train_loss": -21.872730255126953, "global_step": 98103, "epoch": 1181} {"train_loss": -22.001083374023438, "global_step": 98104, "epoch": 1181} {"train_loss": -21.823621726897827, "global_step": 98105, "epoch": 1181, "val_loss": 6082165.5} {"train_loss": -20.76265525817871, "global_step": 98106, "epoch": 1182} {"train_loss": -21.72623062133789, "global_step": 98107, "epoch": 1182} {"train_loss": -21.58906364440918, "global_step": 98108, "epoch": 1182} {"train_loss": -21.43570327758789, "global_step": 98109, "epoch": 1182} {"train_loss": -21.415754318237305, "global_step": 98110, "epoch": 1182} {"train_loss": -21.892850875854492, "global_step": 98111, "epoch": 1182} {"train_loss": -20.883283615112305, "global_step": 98112, "epoch": 1182} {"train_loss": -21.66698455810547, "global_step": 98113, "epoch": 1182} {"train_loss": -21.644453048706055, "global_step": 98114, "epoch": 1182} {"train_loss": -21.672651290893555, "global_step": 98115, "epoch": 1182} {"train_loss": -21.292633056640625, "global_step": 98116, "epoch": 1182} {"train_loss": -21.760656356811523, "global_step": 98117, "epoch": 1182} {"train_loss": -21.27255630493164, "global_step": 98118, "epoch": 1182} {"train_loss": -21.448522567749023, "global_step": 98119, "epoch": 1182} {"train_loss": -21.707763671875, "global_step": 98120, "epoch": 1182} {"train_loss": -21.30562973022461, "global_step": 98121, "epoch": 1182} {"train_loss": -21.593473434448242, "global_step": 98122, "epoch": 1182} {"train_loss": -21.903776168823242, "global_step": 98123, "epoch": 1182} {"train_loss": -21.658248901367188, "global_step": 98124, "epoch": 1182} {"train_loss": -21.56864356994629, "global_step": 98125, "epoch": 1182} {"train_loss": -21.748279571533203, "global_step": 98126, "epoch": 1182} {"train_loss": -21.875097274780273, "global_step": 98127, "epoch": 1182} {"train_loss": -22.040470123291016, "global_step": 98128, "epoch": 1182} {"train_loss": -21.72252082824707, "global_step": 98129, "epoch": 1182} {"train_loss": -21.574838638305664, "global_step": 98130, "epoch": 1182} {"train_loss": -21.376665115356445, "global_step": 98131, "epoch": 1182} {"train_loss": -22.031373977661133, "global_step": 98132, "epoch": 1182} {"train_loss": -22.140270233154297, "global_step": 98133, "epoch": 1182} {"train_loss": -22.05963134765625, "global_step": 98134, "epoch": 1182} {"train_loss": -21.621082305908203, "global_step": 98135, "epoch": 1182} {"train_loss": -21.932065963745117, "global_step": 98136, "epoch": 1182} {"train_loss": -21.75344467163086, "global_step": 98137, "epoch": 1182} {"train_loss": -21.914384841918945, "global_step": 98138, "epoch": 1182} {"train_loss": -21.61916160583496, "global_step": 98139, "epoch": 1182} {"train_loss": -22.314165115356445, "global_step": 98140, "epoch": 1182} {"train_loss": -22.16084098815918, "global_step": 98141, "epoch": 1182} {"train_loss": -21.914817810058594, "global_step": 98142, "epoch": 1182} {"train_loss": -21.948453903198242, "global_step": 98143, "epoch": 1182} {"train_loss": -21.85799789428711, "global_step": 98144, "epoch": 1182} {"train_loss": -21.58258628845215, "global_step": 98145, "epoch": 1182} {"train_loss": -21.66350555419922, "global_step": 98146, "epoch": 1182} {"train_loss": -21.490537643432617, "global_step": 98147, "epoch": 1182} {"train_loss": -21.81778335571289, "global_step": 98148, "epoch": 1182} {"train_loss": -21.972064971923828, "global_step": 98149, "epoch": 1182} {"train_loss": -21.7338809967041, "global_step": 98150, "epoch": 1182} {"train_loss": -21.670419692993164, "global_step": 98151, "epoch": 1182} {"train_loss": -21.731952667236328, "global_step": 98152, "epoch": 1182} {"train_loss": -21.761215209960938, "global_step": 98153, "epoch": 1182} {"train_loss": -22.10691261291504, "global_step": 98154, "epoch": 1182} {"train_loss": -21.941181182861328, "global_step": 98155, "epoch": 1182} {"train_loss": -21.71534538269043, "global_step": 98156, "epoch": 1182} {"train_loss": -21.61078453063965, "global_step": 98157, "epoch": 1182} {"train_loss": -21.73862075805664, "global_step": 98158, "epoch": 1182} {"train_loss": -21.9068660736084, "global_step": 98159, "epoch": 1182} {"train_loss": -21.83820915222168, "global_step": 98160, "epoch": 1182} {"train_loss": -21.762205123901367, "global_step": 98161, "epoch": 1182} {"train_loss": -21.899017333984375, "global_step": 98162, "epoch": 1182} {"train_loss": -21.89764976501465, "global_step": 98163, "epoch": 1182} {"train_loss": -21.891651153564453, "global_step": 98164, "epoch": 1182} {"train_loss": -21.703176498413086, "global_step": 98165, "epoch": 1182} {"train_loss": -21.90724754333496, "global_step": 98166, "epoch": 1182} {"train_loss": -22.019264221191406, "global_step": 98167, "epoch": 1182} {"train_loss": -21.90719985961914, "global_step": 98168, "epoch": 1182} {"train_loss": -21.782968521118164, "global_step": 98169, "epoch": 1182} {"train_loss": -22.302780151367188, "global_step": 98170, "epoch": 1182} {"train_loss": -21.587095260620117, "global_step": 98171, "epoch": 1182} {"train_loss": -21.520187377929688, "global_step": 98172, "epoch": 1182} {"train_loss": -22.011980056762695, "global_step": 98173, "epoch": 1182} {"train_loss": -22.314908981323242, "global_step": 98174, "epoch": 1182} {"train_loss": -21.917987823486328, "global_step": 98175, "epoch": 1182} {"train_loss": -22.383869171142578, "global_step": 98176, "epoch": 1182} {"train_loss": -22.065296173095703, "global_step": 98177, "epoch": 1182} {"train_loss": -22.064701080322266, "global_step": 98178, "epoch": 1182} {"train_loss": -21.74736213684082, "global_step": 98179, "epoch": 1182} {"train_loss": -22.082416534423828, "global_step": 98180, "epoch": 1182} {"train_loss": -22.26122283935547, "global_step": 98181, "epoch": 1182} {"train_loss": -22.01386833190918, "global_step": 98182, "epoch": 1182} {"train_loss": -21.937108993530273, "global_step": 98183, "epoch": 1182} {"train_loss": -21.86524772644043, "global_step": 98184, "epoch": 1182} {"train_loss": -22.102216720581055, "global_step": 98185, "epoch": 1182} {"train_loss": -21.423906326293945, "global_step": 98186, "epoch": 1182} {"train_loss": -21.58022117614746, "global_step": 98187, "epoch": 1182} {"train_loss": -21.794190395309265, "global_step": 98188, "epoch": 1182, "val_loss": 6035517.0} {"train_loss": -21.182355880737305, "global_step": 98189, "epoch": 1183} {"train_loss": -19.897153854370117, "global_step": 98190, "epoch": 1183} {"train_loss": -21.038894653320312, "global_step": 98191, "epoch": 1183} {"train_loss": -20.845211029052734, "global_step": 98192, "epoch": 1183} {"train_loss": -20.617406845092773, "global_step": 98193, "epoch": 1183} {"train_loss": -21.308841705322266, "global_step": 98194, "epoch": 1183} {"train_loss": -21.100492477416992, "global_step": 98195, "epoch": 1183} {"train_loss": -21.397520065307617, "global_step": 98196, "epoch": 1183} {"train_loss": -21.07415771484375, "global_step": 98197, "epoch": 1183} {"train_loss": -21.10092544555664, "global_step": 98198, "epoch": 1183} {"train_loss": -21.400527954101562, "global_step": 98199, "epoch": 1183} {"train_loss": -21.341781616210938, "global_step": 98200, "epoch": 1183} {"train_loss": -21.198715209960938, "global_step": 98201, "epoch": 1183} {"train_loss": -21.359657287597656, "global_step": 98202, "epoch": 1183} {"train_loss": -21.601491928100586, "global_step": 98203, "epoch": 1183} {"train_loss": -21.813331604003906, "global_step": 98204, "epoch": 1183} {"train_loss": -21.376937866210938, "global_step": 98205, "epoch": 1183} {"train_loss": -21.610065460205078, "global_step": 98206, "epoch": 1183} {"train_loss": -21.55306053161621, "global_step": 98207, "epoch": 1183} {"train_loss": -21.554901123046875, "global_step": 98208, "epoch": 1183} {"train_loss": -21.3468074798584, "global_step": 98209, "epoch": 1183} {"train_loss": -21.363611221313477, "global_step": 98210, "epoch": 1183} {"train_loss": -21.526073455810547, "global_step": 98211, "epoch": 1183} {"train_loss": -21.523923873901367, "global_step": 98212, "epoch": 1183} {"train_loss": -21.582172393798828, "global_step": 98213, "epoch": 1183} {"train_loss": -21.332889556884766, "global_step": 98214, "epoch": 1183} {"train_loss": -21.882627487182617, "global_step": 98215, "epoch": 1183} {"train_loss": -21.686941146850586, "global_step": 98216, "epoch": 1183} {"train_loss": -21.623388290405273, "global_step": 98217, "epoch": 1183} {"train_loss": -21.93556785583496, "global_step": 98218, "epoch": 1183} {"train_loss": -21.82843017578125, "global_step": 98219, "epoch": 1183} {"train_loss": -21.607952117919922, "global_step": 98220, "epoch": 1183} {"train_loss": -21.914907455444336, "global_step": 98221, "epoch": 1183} {"train_loss": -21.46099090576172, "global_step": 98222, "epoch": 1183} {"train_loss": -21.589216232299805, "global_step": 98223, "epoch": 1183} {"train_loss": -21.77181053161621, "global_step": 98224, "epoch": 1183} {"train_loss": -21.60392189025879, "global_step": 98225, "epoch": 1183} {"train_loss": -22.014484405517578, "global_step": 98226, "epoch": 1183} {"train_loss": -22.04001808166504, "global_step": 98227, "epoch": 1183} {"train_loss": -22.00736427307129, "global_step": 98228, "epoch": 1183} {"train_loss": -21.867643356323242, "global_step": 98229, "epoch": 1183} {"train_loss": -21.813520431518555, "global_step": 98230, "epoch": 1183} {"train_loss": -21.776582717895508, "global_step": 98231, "epoch": 1183} {"train_loss": -21.696304321289062, "global_step": 98232, "epoch": 1183} {"train_loss": -21.543659210205078, "global_step": 98233, "epoch": 1183} {"train_loss": -21.820466995239258, "global_step": 98234, "epoch": 1183} {"train_loss": -21.79554557800293, "global_step": 98235, "epoch": 1183} {"train_loss": -21.977819442749023, "global_step": 98236, "epoch": 1183} {"train_loss": -21.836584091186523, "global_step": 98237, "epoch": 1183} {"train_loss": -22.07978630065918, "global_step": 98238, "epoch": 1183} {"train_loss": -21.6384334564209, "global_step": 98239, "epoch": 1183} {"train_loss": -21.57608985900879, "global_step": 98240, "epoch": 1183} {"train_loss": -22.05740737915039, "global_step": 98241, "epoch": 1183} {"train_loss": -21.829517364501953, "global_step": 98242, "epoch": 1183} {"train_loss": -21.535314559936523, "global_step": 98243, "epoch": 1183} {"train_loss": -21.932493209838867, "global_step": 98244, "epoch": 1183} {"train_loss": -21.99073028564453, "global_step": 98245, "epoch": 1183} {"train_loss": -22.162057876586914, "global_step": 98246, "epoch": 1183} {"train_loss": -21.822223663330078, "global_step": 98247, "epoch": 1183} {"train_loss": -22.039594650268555, "global_step": 98248, "epoch": 1183} {"train_loss": -21.920034408569336, "global_step": 98249, "epoch": 1183} {"train_loss": -21.97078514099121, "global_step": 98250, "epoch": 1183} {"train_loss": -21.795391082763672, "global_step": 98251, "epoch": 1183} {"train_loss": -21.981786727905273, "global_step": 98252, "epoch": 1183} {"train_loss": -21.783872604370117, "global_step": 98253, "epoch": 1183} {"train_loss": -21.84682273864746, "global_step": 98254, "epoch": 1183} {"train_loss": -22.018274307250977, "global_step": 98255, "epoch": 1183} {"train_loss": -21.60041618347168, "global_step": 98256, "epoch": 1183} {"train_loss": -21.84799575805664, "global_step": 98257, "epoch": 1183} {"train_loss": -21.811017990112305, "global_step": 98258, "epoch": 1183} {"train_loss": -21.792552947998047, "global_step": 98259, "epoch": 1183} {"train_loss": -22.066261291503906, "global_step": 98260, "epoch": 1183} {"train_loss": -21.923856735229492, "global_step": 98261, "epoch": 1183} {"train_loss": -22.137563705444336, "global_step": 98262, "epoch": 1183} {"train_loss": -22.05954933166504, "global_step": 98263, "epoch": 1183} {"train_loss": -21.9471492767334, "global_step": 98264, "epoch": 1183} {"train_loss": -21.787918090820312, "global_step": 98265, "epoch": 1183} {"train_loss": -21.80225944519043, "global_step": 98266, "epoch": 1183} {"train_loss": -21.73369598388672, "global_step": 98267, "epoch": 1183} {"train_loss": -22.097333908081055, "global_step": 98268, "epoch": 1183} {"train_loss": -21.74356460571289, "global_step": 98269, "epoch": 1183} {"train_loss": -21.970788955688477, "global_step": 98270, "epoch": 1183} {"train_loss": -21.668485021016682, "global_step": 98271, "epoch": 1183, "val_loss": 6196104.5} {"train_loss": -21.715700149536133, "global_step": 98272, "epoch": 1184} {"train_loss": -21.67435646057129, "global_step": 98273, "epoch": 1184} {"train_loss": -21.31551170349121, "global_step": 98274, "epoch": 1184} {"train_loss": -21.822677612304688, "global_step": 98275, "epoch": 1184} {"train_loss": -21.678443908691406, "global_step": 98276, "epoch": 1184} {"train_loss": -21.52029800415039, "global_step": 98277, "epoch": 1184} {"train_loss": -21.900177001953125, "global_step": 98278, "epoch": 1184} {"train_loss": -21.795480728149414, "global_step": 98279, "epoch": 1184} {"train_loss": -21.688032150268555, "global_step": 98280, "epoch": 1184} {"train_loss": -21.874414443969727, "global_step": 98281, "epoch": 1184} {"train_loss": -21.681718826293945, "global_step": 98282, "epoch": 1184} {"train_loss": -21.83454704284668, "global_step": 98283, "epoch": 1184} {"train_loss": -21.86466407775879, "global_step": 98284, "epoch": 1184} {"train_loss": -22.071985244750977, "global_step": 98285, "epoch": 1184} {"train_loss": -21.659225463867188, "global_step": 98286, "epoch": 1184} {"train_loss": -21.995162963867188, "global_step": 98287, "epoch": 1184} {"train_loss": -22.029813766479492, "global_step": 98288, "epoch": 1184} {"train_loss": -22.088598251342773, "global_step": 98289, "epoch": 1184} {"train_loss": -21.403318405151367, "global_step": 98290, "epoch": 1184} {"train_loss": -21.619047164916992, "global_step": 98291, "epoch": 1184} {"train_loss": -21.937637329101562, "global_step": 98292, "epoch": 1184} {"train_loss": -21.737232208251953, "global_step": 98293, "epoch": 1184} {"train_loss": -22.15912437438965, "global_step": 98294, "epoch": 1184} {"train_loss": -22.19158935546875, "global_step": 98295, "epoch": 1184} {"train_loss": -21.91023826599121, "global_step": 98296, "epoch": 1184} {"train_loss": -21.802160263061523, "global_step": 98297, "epoch": 1184} {"train_loss": -21.99530792236328, "global_step": 98298, "epoch": 1184} {"train_loss": -22.041616439819336, "global_step": 98299, "epoch": 1184} {"train_loss": -21.466663360595703, "global_step": 98300, "epoch": 1184} {"train_loss": -21.731754302978516, "global_step": 98301, "epoch": 1184} {"train_loss": -22.02802848815918, "global_step": 98302, "epoch": 1184} {"train_loss": -21.64104652404785, "global_step": 98303, "epoch": 1184} {"train_loss": -22.042570114135742, "global_step": 98304, "epoch": 1184} {"train_loss": -22.115949630737305, "global_step": 98305, "epoch": 1184} {"train_loss": -21.796464920043945, "global_step": 98306, "epoch": 1184} {"train_loss": -22.138954162597656, "global_step": 98307, "epoch": 1184} {"train_loss": -21.62163734436035, "global_step": 98308, "epoch": 1184} {"train_loss": -21.540937423706055, "global_step": 98309, "epoch": 1184} {"train_loss": -21.55246925354004, "global_step": 98310, "epoch": 1184} {"train_loss": -21.888412475585938, "global_step": 98311, "epoch": 1184} {"train_loss": -22.074750900268555, "global_step": 98312, "epoch": 1184} {"train_loss": -21.71156120300293, "global_step": 98313, "epoch": 1184} {"train_loss": -21.26648712158203, "global_step": 98314, "epoch": 1184} {"train_loss": -21.95119857788086, "global_step": 98315, "epoch": 1184} {"train_loss": -21.659717559814453, "global_step": 98316, "epoch": 1184} {"train_loss": -21.878034591674805, "global_step": 98317, "epoch": 1184} {"train_loss": -21.7333927154541, "global_step": 98318, "epoch": 1184} {"train_loss": -21.857746124267578, "global_step": 98319, "epoch": 1184} {"train_loss": -21.831480026245117, "global_step": 98320, "epoch": 1184} {"train_loss": -21.85190773010254, "global_step": 98321, "epoch": 1184} {"train_loss": -21.883081436157227, "global_step": 98322, "epoch": 1184} {"train_loss": -21.859615325927734, "global_step": 98323, "epoch": 1184} {"train_loss": -21.793638229370117, "global_step": 98324, "epoch": 1184} {"train_loss": -21.70753288269043, "global_step": 98325, "epoch": 1184} {"train_loss": -21.97173500061035, "global_step": 98326, "epoch": 1184} {"train_loss": -21.949743270874023, "global_step": 98327, "epoch": 1184} {"train_loss": -21.968647003173828, "global_step": 98328, "epoch": 1184} {"train_loss": -21.90802001953125, "global_step": 98329, "epoch": 1184} {"train_loss": -21.83224868774414, "global_step": 98330, "epoch": 1184} {"train_loss": -21.63691520690918, "global_step": 98331, "epoch": 1184} {"train_loss": -21.806427001953125, "global_step": 98332, "epoch": 1184} {"train_loss": -21.640493392944336, "global_step": 98333, "epoch": 1184} {"train_loss": -22.022232055664062, "global_step": 98334, "epoch": 1184} {"train_loss": -21.893564224243164, "global_step": 98335, "epoch": 1184} {"train_loss": -21.6742000579834, "global_step": 98336, "epoch": 1184} {"train_loss": -22.05464744567871, "global_step": 98337, "epoch": 1184} {"train_loss": -22.03940773010254, "global_step": 98338, "epoch": 1184} {"train_loss": -21.835378646850586, "global_step": 98339, "epoch": 1184} {"train_loss": -21.772079467773438, "global_step": 98340, "epoch": 1184} {"train_loss": -22.21072769165039, "global_step": 98341, "epoch": 1184} {"train_loss": -21.96368980407715, "global_step": 98342, "epoch": 1184} {"train_loss": -21.97292137145996, "global_step": 98343, "epoch": 1184} {"train_loss": -21.961048126220703, "global_step": 98344, "epoch": 1184} {"train_loss": -21.864564895629883, "global_step": 98345, "epoch": 1184} {"train_loss": -21.955835342407227, "global_step": 98346, "epoch": 1184} {"train_loss": -21.81504249572754, "global_step": 98347, "epoch": 1184} {"train_loss": -21.93970489501953, "global_step": 98348, "epoch": 1184} {"train_loss": -22.500722885131836, "global_step": 98349, "epoch": 1184} {"train_loss": -21.900375366210938, "global_step": 98350, "epoch": 1184} {"train_loss": -22.209081649780273, "global_step": 98351, "epoch": 1184} {"train_loss": -21.783533096313477, "global_step": 98352, "epoch": 1184} {"train_loss": -21.561546325683594, "global_step": 98353, "epoch": 1184} {"train_loss": -21.846348107579242, "global_step": 98354, "epoch": 1184, "val_loss": 6024304.5} {"train_loss": -21.44205093383789, "global_step": 98355, "epoch": 1185} {"train_loss": -21.372291564941406, "global_step": 98356, "epoch": 1185} {"train_loss": -21.687559127807617, "global_step": 98357, "epoch": 1185} {"train_loss": -21.552541732788086, "global_step": 98358, "epoch": 1185} {"train_loss": -21.48007583618164, "global_step": 98359, "epoch": 1185} {"train_loss": -22.0195255279541, "global_step": 98360, "epoch": 1185} {"train_loss": -21.32932472229004, "global_step": 98361, "epoch": 1185} {"train_loss": -21.69386100769043, "global_step": 98362, "epoch": 1185} {"train_loss": -21.59316062927246, "global_step": 98363, "epoch": 1185} {"train_loss": -21.527414321899414, "global_step": 98364, "epoch": 1185} {"train_loss": -21.655057907104492, "global_step": 98365, "epoch": 1185} {"train_loss": -21.96238136291504, "global_step": 98366, "epoch": 1185} {"train_loss": -21.696582794189453, "global_step": 98367, "epoch": 1185} {"train_loss": -21.912322998046875, "global_step": 98368, "epoch": 1185} {"train_loss": -21.640140533447266, "global_step": 98369, "epoch": 1185} {"train_loss": -21.85213279724121, "global_step": 98370, "epoch": 1185} {"train_loss": -21.976749420166016, "global_step": 98371, "epoch": 1185} {"train_loss": -21.775381088256836, "global_step": 98372, "epoch": 1185} {"train_loss": -21.485422134399414, "global_step": 98373, "epoch": 1185} {"train_loss": -21.736560821533203, "global_step": 98374, "epoch": 1185} {"train_loss": -21.932296752929688, "global_step": 98375, "epoch": 1185} {"train_loss": -21.709171295166016, "global_step": 98376, "epoch": 1185} {"train_loss": -21.908836364746094, "global_step": 98377, "epoch": 1185} {"train_loss": -21.731382369995117, "global_step": 98378, "epoch": 1185} {"train_loss": -21.891998291015625, "global_step": 98379, "epoch": 1185} {"train_loss": -21.84952735900879, "global_step": 98380, "epoch": 1185} {"train_loss": -21.545473098754883, "global_step": 98381, "epoch": 1185} {"train_loss": -21.804792404174805, "global_step": 98382, "epoch": 1185} {"train_loss": -21.8768367767334, "global_step": 98383, "epoch": 1185} {"train_loss": -22.087913513183594, "global_step": 98384, "epoch": 1185} {"train_loss": -21.8963680267334, "global_step": 98385, "epoch": 1185} {"train_loss": -21.89639663696289, "global_step": 98386, "epoch": 1185} {"train_loss": -21.790761947631836, "global_step": 98387, "epoch": 1185} {"train_loss": -22.155118942260742, "global_step": 98388, "epoch": 1185} {"train_loss": -21.60688591003418, "global_step": 98389, "epoch": 1185} {"train_loss": -21.83504295349121, "global_step": 98390, "epoch": 1185} {"train_loss": -21.74854850769043, "global_step": 98391, "epoch": 1185} {"train_loss": -22.00382423400879, "global_step": 98392, "epoch": 1185} {"train_loss": -21.786239624023438, "global_step": 98393, "epoch": 1185} {"train_loss": -21.80182456970215, "global_step": 98394, "epoch": 1185} {"train_loss": -21.90302085876465, "global_step": 98395, "epoch": 1185} {"train_loss": -21.83068084716797, "global_step": 98396, "epoch": 1185} {"train_loss": -22.018798828125, "global_step": 98397, "epoch": 1185} {"train_loss": -22.17237091064453, "global_step": 98398, "epoch": 1185} {"train_loss": -21.635177612304688, "global_step": 98399, "epoch": 1185} {"train_loss": -22.1235294342041, "global_step": 98400, "epoch": 1185} {"train_loss": -21.674802780151367, "global_step": 98401, "epoch": 1185} {"train_loss": -21.770517349243164, "global_step": 98402, "epoch": 1185} {"train_loss": -21.667633056640625, "global_step": 98403, "epoch": 1185} {"train_loss": -21.51563835144043, "global_step": 98404, "epoch": 1185} {"train_loss": -22.262338638305664, "global_step": 98405, "epoch": 1185} {"train_loss": -21.975934982299805, "global_step": 98406, "epoch": 1185} {"train_loss": -22.053836822509766, "global_step": 98407, "epoch": 1185} {"train_loss": -22.036884307861328, "global_step": 98408, "epoch": 1185} {"train_loss": -22.066394805908203, "global_step": 98409, "epoch": 1185} {"train_loss": -21.893571853637695, "global_step": 98410, "epoch": 1185} {"train_loss": -21.739377975463867, "global_step": 98411, "epoch": 1185} {"train_loss": -21.969482421875, "global_step": 98412, "epoch": 1185} {"train_loss": -21.647199630737305, "global_step": 98413, "epoch": 1185} {"train_loss": -21.634166717529297, "global_step": 98414, "epoch": 1185} {"train_loss": -21.495712280273438, "global_step": 98415, "epoch": 1185} {"train_loss": -21.815671920776367, "global_step": 98416, "epoch": 1185} {"train_loss": -22.058195114135742, "global_step": 98417, "epoch": 1185} {"train_loss": -21.989227294921875, "global_step": 98418, "epoch": 1185} {"train_loss": -21.867733001708984, "global_step": 98419, "epoch": 1185} {"train_loss": -21.675085067749023, "global_step": 98420, "epoch": 1185} {"train_loss": -21.846479415893555, "global_step": 98421, "epoch": 1185} {"train_loss": -21.92024040222168, "global_step": 98422, "epoch": 1185} {"train_loss": -21.826889038085938, "global_step": 98423, "epoch": 1185} {"train_loss": -22.1257266998291, "global_step": 98424, "epoch": 1185} {"train_loss": -21.64411735534668, "global_step": 98425, "epoch": 1185} {"train_loss": -21.86366844177246, "global_step": 98426, "epoch": 1185} {"train_loss": -21.798383712768555, "global_step": 98427, "epoch": 1185} {"train_loss": -21.651575088500977, "global_step": 98428, "epoch": 1185} {"train_loss": -22.061614990234375, "global_step": 98429, "epoch": 1185} {"train_loss": -22.131391525268555, "global_step": 98430, "epoch": 1185} {"train_loss": -22.070301055908203, "global_step": 98431, "epoch": 1185} {"train_loss": -22.066944122314453, "global_step": 98432, "epoch": 1185} {"train_loss": -21.92091178894043, "global_step": 98433, "epoch": 1185} {"train_loss": -21.657194137573242, "global_step": 98434, "epoch": 1185} {"train_loss": -21.81947898864746, "global_step": 98435, "epoch": 1185} {"train_loss": -21.937965393066406, "global_step": 98436, "epoch": 1185} {"train_loss": -21.814970269260638, "global_step": 98437, "epoch": 1185, "val_loss": 6090419.0} {"train_loss": -20.791025161743164, "global_step": 98438, "epoch": 1186} {"train_loss": -21.187833786010742, "global_step": 98439, "epoch": 1186} {"train_loss": -20.926477432250977, "global_step": 98440, "epoch": 1186} {"train_loss": -21.410940170288086, "global_step": 98441, "epoch": 1186} {"train_loss": -20.84840202331543, "global_step": 98442, "epoch": 1186} {"train_loss": -21.49611473083496, "global_step": 98443, "epoch": 1186} {"train_loss": -21.201467514038086, "global_step": 98444, "epoch": 1186} {"train_loss": -21.628183364868164, "global_step": 98445, "epoch": 1186} {"train_loss": -21.67079734802246, "global_step": 98446, "epoch": 1186} {"train_loss": -21.64092254638672, "global_step": 98447, "epoch": 1186} {"train_loss": -21.560590744018555, "global_step": 98448, "epoch": 1186} {"train_loss": -21.66956329345703, "global_step": 98449, "epoch": 1186} {"train_loss": -21.35236167907715, "global_step": 98450, "epoch": 1186} {"train_loss": -21.61138153076172, "global_step": 98451, "epoch": 1186} {"train_loss": -21.847387313842773, "global_step": 98452, "epoch": 1186} {"train_loss": -21.521474838256836, "global_step": 98453, "epoch": 1186} {"train_loss": -21.66731071472168, "global_step": 98454, "epoch": 1186} {"train_loss": -21.929798126220703, "global_step": 98455, "epoch": 1186} {"train_loss": -21.442485809326172, "global_step": 98456, "epoch": 1186} {"train_loss": -21.80266571044922, "global_step": 98457, "epoch": 1186} {"train_loss": -21.540882110595703, "global_step": 98458, "epoch": 1186} {"train_loss": -21.85709571838379, "global_step": 98459, "epoch": 1186} {"train_loss": -21.59415626525879, "global_step": 98460, "epoch": 1186} {"train_loss": -21.975263595581055, "global_step": 98461, "epoch": 1186} {"train_loss": -22.119688034057617, "global_step": 98462, "epoch": 1186} {"train_loss": -21.655454635620117, "global_step": 98463, "epoch": 1186} {"train_loss": -21.99226188659668, "global_step": 98464, "epoch": 1186} {"train_loss": -21.63800048828125, "global_step": 98465, "epoch": 1186} {"train_loss": -21.89266586303711, "global_step": 98466, "epoch": 1186} {"train_loss": -21.498565673828125, "global_step": 98467, "epoch": 1186} {"train_loss": -21.719160079956055, "global_step": 98468, "epoch": 1186} {"train_loss": -21.92537498474121, "global_step": 98469, "epoch": 1186} {"train_loss": -21.998355865478516, "global_step": 98470, "epoch": 1186} {"train_loss": -21.925119400024414, "global_step": 98471, "epoch": 1186} {"train_loss": -21.91645622253418, "global_step": 98472, "epoch": 1186} {"train_loss": -21.8629093170166, "global_step": 98473, "epoch": 1186} {"train_loss": -21.795894622802734, "global_step": 98474, "epoch": 1186} {"train_loss": -21.79476547241211, "global_step": 98475, "epoch": 1186} {"train_loss": -21.94293212890625, "global_step": 98476, "epoch": 1186} {"train_loss": -21.674081802368164, "global_step": 98477, "epoch": 1186} {"train_loss": -21.937898635864258, "global_step": 98478, "epoch": 1186} {"train_loss": -21.859363555908203, "global_step": 98479, "epoch": 1186} {"train_loss": -21.961294174194336, "global_step": 98480, "epoch": 1186} {"train_loss": -21.965909957885742, "global_step": 98481, "epoch": 1186} {"train_loss": -21.921384811401367, "global_step": 98482, "epoch": 1186} {"train_loss": -21.747894287109375, "global_step": 98483, "epoch": 1186} {"train_loss": -22.26996421813965, "global_step": 98484, "epoch": 1186} {"train_loss": -21.800079345703125, "global_step": 98485, "epoch": 1186} {"train_loss": -21.768096923828125, "global_step": 98486, "epoch": 1186} {"train_loss": -21.961217880249023, "global_step": 98487, "epoch": 1186} {"train_loss": -22.051118850708008, "global_step": 98488, "epoch": 1186} {"train_loss": -21.773107528686523, "global_step": 98489, "epoch": 1186} {"train_loss": -21.829483032226562, "global_step": 98490, "epoch": 1186} {"train_loss": -21.77968978881836, "global_step": 98491, "epoch": 1186} {"train_loss": -21.87112045288086, "global_step": 98492, "epoch": 1186} {"train_loss": -21.886388778686523, "global_step": 98493, "epoch": 1186} {"train_loss": -21.3701114654541, "global_step": 98494, "epoch": 1186} {"train_loss": -21.88957405090332, "global_step": 98495, "epoch": 1186} {"train_loss": -21.73786163330078, "global_step": 98496, "epoch": 1186} {"train_loss": -22.18580436706543, "global_step": 98497, "epoch": 1186} {"train_loss": -21.891794204711914, "global_step": 98498, "epoch": 1186} {"train_loss": -21.96858024597168, "global_step": 98499, "epoch": 1186} {"train_loss": -22.050790786743164, "global_step": 98500, "epoch": 1186} {"train_loss": -21.71208953857422, "global_step": 98501, "epoch": 1186} {"train_loss": -21.9671688079834, "global_step": 98502, "epoch": 1186} {"train_loss": -21.496976852416992, "global_step": 98503, "epoch": 1186} {"train_loss": -22.155807495117188, "global_step": 98504, "epoch": 1186} {"train_loss": -21.89520835876465, "global_step": 98505, "epoch": 1186} {"train_loss": -21.601654052734375, "global_step": 98506, "epoch": 1186} {"train_loss": -22.02294921875, "global_step": 98507, "epoch": 1186} {"train_loss": -21.88210105895996, "global_step": 98508, "epoch": 1186} {"train_loss": -22.25522232055664, "global_step": 98509, "epoch": 1186} {"train_loss": -21.997798919677734, "global_step": 98510, "epoch": 1186} {"train_loss": -21.67961883544922, "global_step": 98511, "epoch": 1186} {"train_loss": -21.764572143554688, "global_step": 98512, "epoch": 1186} {"train_loss": -22.207626342773438, "global_step": 98513, "epoch": 1186} {"train_loss": -22.109725952148438, "global_step": 98514, "epoch": 1186} {"train_loss": -21.660663604736328, "global_step": 98515, "epoch": 1186} {"train_loss": -21.820396423339844, "global_step": 98516, "epoch": 1186} {"train_loss": -21.975393295288086, "global_step": 98517, "epoch": 1186} {"train_loss": -22.17402458190918, "global_step": 98518, "epoch": 1186} {"train_loss": -22.22768211364746, "global_step": 98519, "epoch": 1186} {"train_loss": -21.773557088461267, "global_step": 98520, "epoch": 1186, "val_loss": 6093112.5} {"train_loss": -22.367162704467773, "global_step": 98521, "epoch": 1187} {"train_loss": -21.883792877197266, "global_step": 98522, "epoch": 1187} {"train_loss": -21.86368179321289, "global_step": 98523, "epoch": 1187} {"train_loss": -22.140430450439453, "global_step": 98524, "epoch": 1187} {"train_loss": -22.07137107849121, "global_step": 98525, "epoch": 1187} {"train_loss": -21.71046257019043, "global_step": 98526, "epoch": 1187} {"train_loss": -21.967803955078125, "global_step": 98527, "epoch": 1187} {"train_loss": -22.273086547851562, "global_step": 98528, "epoch": 1187} {"train_loss": -22.17180061340332, "global_step": 98529, "epoch": 1187} {"train_loss": -21.693220138549805, "global_step": 98530, "epoch": 1187} {"train_loss": -21.895709991455078, "global_step": 98531, "epoch": 1187} {"train_loss": -21.91663932800293, "global_step": 98532, "epoch": 1187} {"train_loss": -21.775232315063477, "global_step": 98533, "epoch": 1187} {"train_loss": -21.843536376953125, "global_step": 98534, "epoch": 1187} {"train_loss": -21.975040435791016, "global_step": 98535, "epoch": 1187} {"train_loss": -21.90456199645996, "global_step": 98536, "epoch": 1187} {"train_loss": -21.985794067382812, "global_step": 98537, "epoch": 1187} {"train_loss": -21.97994041442871, "global_step": 98538, "epoch": 1187} {"train_loss": -22.00932502746582, "global_step": 98539, "epoch": 1187} {"train_loss": -21.834426879882812, "global_step": 98540, "epoch": 1187} {"train_loss": -21.688344955444336, "global_step": 98541, "epoch": 1187} {"train_loss": -21.9082088470459, "global_step": 98542, "epoch": 1187} {"train_loss": -21.692514419555664, "global_step": 98543, "epoch": 1187} {"train_loss": -21.877899169921875, "global_step": 98544, "epoch": 1187} {"train_loss": -21.988431930541992, "global_step": 98545, "epoch": 1187} {"train_loss": -21.827346801757812, "global_step": 98546, "epoch": 1187} {"train_loss": -22.208507537841797, "global_step": 98547, "epoch": 1187} {"train_loss": -22.019927978515625, "global_step": 98548, "epoch": 1187} {"train_loss": -21.8150691986084, "global_step": 98549, "epoch": 1187} {"train_loss": -22.06914710998535, "global_step": 98550, "epoch": 1187} {"train_loss": -22.092243194580078, "global_step": 98551, "epoch": 1187} {"train_loss": -21.428804397583008, "global_step": 98552, "epoch": 1187} {"train_loss": -22.18958854675293, "global_step": 98553, "epoch": 1187} {"train_loss": -22.223371505737305, "global_step": 98554, "epoch": 1187} {"train_loss": -21.668790817260742, "global_step": 98555, "epoch": 1187} {"train_loss": -21.979978561401367, "global_step": 98556, "epoch": 1187} {"train_loss": -22.309446334838867, "global_step": 98557, "epoch": 1187} {"train_loss": -21.836933135986328, "global_step": 98558, "epoch": 1187} {"train_loss": -21.898582458496094, "global_step": 98559, "epoch": 1187} {"train_loss": -22.34852409362793, "global_step": 98560, "epoch": 1187} {"train_loss": -22.16971778869629, "global_step": 98561, "epoch": 1187} {"train_loss": -21.753454208374023, "global_step": 98562, "epoch": 1187} {"train_loss": -21.95961570739746, "global_step": 98563, "epoch": 1187} {"train_loss": -21.943096160888672, "global_step": 98564, "epoch": 1187} {"train_loss": -21.50836944580078, "global_step": 98565, "epoch": 1187} {"train_loss": -21.865434646606445, "global_step": 98566, "epoch": 1187} {"train_loss": -22.048669815063477, "global_step": 98567, "epoch": 1187} {"train_loss": -21.735837936401367, "global_step": 98568, "epoch": 1187} {"train_loss": -21.941848754882812, "global_step": 98569, "epoch": 1187} {"train_loss": -21.855817794799805, "global_step": 98570, "epoch": 1187} {"train_loss": -21.762611389160156, "global_step": 98571, "epoch": 1187} {"train_loss": -21.65984535217285, "global_step": 98572, "epoch": 1187} {"train_loss": -21.91706657409668, "global_step": 98573, "epoch": 1187} {"train_loss": -22.4346981048584, "global_step": 98574, "epoch": 1187} {"train_loss": -21.77714729309082, "global_step": 98575, "epoch": 1187} {"train_loss": -21.992618560791016, "global_step": 98576, "epoch": 1187} {"train_loss": -22.202011108398438, "global_step": 98577, "epoch": 1187} {"train_loss": -21.597578048706055, "global_step": 98578, "epoch": 1187} {"train_loss": -22.054962158203125, "global_step": 98579, "epoch": 1187} {"train_loss": -21.812864303588867, "global_step": 98580, "epoch": 1187} {"train_loss": -22.027523040771484, "global_step": 98581, "epoch": 1187} {"train_loss": -21.818735122680664, "global_step": 98582, "epoch": 1187} {"train_loss": -22.008190155029297, "global_step": 98583, "epoch": 1187} {"train_loss": -21.57162857055664, "global_step": 98584, "epoch": 1187} {"train_loss": -21.998300552368164, "global_step": 98585, "epoch": 1187} {"train_loss": -21.886693954467773, "global_step": 98586, "epoch": 1187} {"train_loss": -22.0684871673584, "global_step": 98587, "epoch": 1187} {"train_loss": -21.46455192565918, "global_step": 98588, "epoch": 1187} {"train_loss": -21.699066162109375, "global_step": 98589, "epoch": 1187} {"train_loss": -22.135517120361328, "global_step": 98590, "epoch": 1187} {"train_loss": -21.90227699279785, "global_step": 98591, "epoch": 1187} {"train_loss": -21.931333541870117, "global_step": 98592, "epoch": 1187} {"train_loss": -21.84507179260254, "global_step": 98593, "epoch": 1187} {"train_loss": -21.973276138305664, "global_step": 98594, "epoch": 1187} {"train_loss": -22.124574661254883, "global_step": 98595, "epoch": 1187} {"train_loss": -22.165206909179688, "global_step": 98596, "epoch": 1187} {"train_loss": -22.037818908691406, "global_step": 98597, "epoch": 1187} {"train_loss": -21.639251708984375, "global_step": 98598, "epoch": 1187} {"train_loss": -22.135986328125, "global_step": 98599, "epoch": 1187} {"train_loss": -21.918668746948242, "global_step": 98600, "epoch": 1187} {"train_loss": -22.041378021240234, "global_step": 98601, "epoch": 1187} {"train_loss": -21.986587524414062, "global_step": 98602, "epoch": 1187} {"train_loss": -21.934395709669733, "global_step": 98603, "epoch": 1187, "val_loss": 6141506.0} {"train_loss": -21.747777938842773, "global_step": 98604, "epoch": 1188} {"train_loss": -21.264707565307617, "global_step": 98605, "epoch": 1188} {"train_loss": -21.7294979095459, "global_step": 98606, "epoch": 1188} {"train_loss": -22.055988311767578, "global_step": 98607, "epoch": 1188} {"train_loss": -21.70516014099121, "global_step": 98608, "epoch": 1188} {"train_loss": -21.38394546508789, "global_step": 98609, "epoch": 1188} {"train_loss": -22.028202056884766, "global_step": 98610, "epoch": 1188} {"train_loss": -21.733488082885742, "global_step": 98611, "epoch": 1188} {"train_loss": -21.66546630859375, "global_step": 98612, "epoch": 1188} {"train_loss": -21.787084579467773, "global_step": 98613, "epoch": 1188} {"train_loss": -21.671781539916992, "global_step": 98614, "epoch": 1188} {"train_loss": -21.641860961914062, "global_step": 98615, "epoch": 1188} {"train_loss": -21.609272003173828, "global_step": 98616, "epoch": 1188} {"train_loss": -21.97475242614746, "global_step": 98617, "epoch": 1188} {"train_loss": -21.471067428588867, "global_step": 98618, "epoch": 1188} {"train_loss": -21.809799194335938, "global_step": 98619, "epoch": 1188} {"train_loss": -21.69222068786621, "global_step": 98620, "epoch": 1188} {"train_loss": -21.714706420898438, "global_step": 98621, "epoch": 1188} {"train_loss": -21.888416290283203, "global_step": 98622, "epoch": 1188} {"train_loss": -21.991886138916016, "global_step": 98623, "epoch": 1188} {"train_loss": -21.952436447143555, "global_step": 98624, "epoch": 1188} {"train_loss": -21.675399780273438, "global_step": 98625, "epoch": 1188} {"train_loss": -21.883625030517578, "global_step": 98626, "epoch": 1188} {"train_loss": -21.69009017944336, "global_step": 98627, "epoch": 1188} {"train_loss": -22.445446014404297, "global_step": 98628, "epoch": 1188} {"train_loss": -21.813657760620117, "global_step": 98629, "epoch": 1188} {"train_loss": -21.741905212402344, "global_step": 98630, "epoch": 1188} {"train_loss": -21.981536865234375, "global_step": 98631, "epoch": 1188} {"train_loss": -21.78857421875, "global_step": 98632, "epoch": 1188} {"train_loss": -22.242124557495117, "global_step": 98633, "epoch": 1188} {"train_loss": -21.7735595703125, "global_step": 98634, "epoch": 1188} {"train_loss": -21.88755989074707, "global_step": 98635, "epoch": 1188} {"train_loss": -21.861358642578125, "global_step": 98636, "epoch": 1188} {"train_loss": -22.209646224975586, "global_step": 98637, "epoch": 1188} {"train_loss": -21.74586296081543, "global_step": 98638, "epoch": 1188} {"train_loss": -21.747631072998047, "global_step": 98639, "epoch": 1188} {"train_loss": -22.02410316467285, "global_step": 98640, "epoch": 1188} {"train_loss": -21.41351318359375, "global_step": 98641, "epoch": 1188} {"train_loss": -21.993221282958984, "global_step": 98642, "epoch": 1188} {"train_loss": -21.925352096557617, "global_step": 98643, "epoch": 1188} {"train_loss": -21.586776733398438, "global_step": 98644, "epoch": 1188} {"train_loss": -21.77243423461914, "global_step": 98645, "epoch": 1188} {"train_loss": -21.862646102905273, "global_step": 98646, "epoch": 1188} {"train_loss": -21.90057945251465, "global_step": 98647, "epoch": 1188} {"train_loss": -21.92203712463379, "global_step": 98648, "epoch": 1188} {"train_loss": -21.918725967407227, "global_step": 98649, "epoch": 1188} {"train_loss": -21.96519660949707, "global_step": 98650, "epoch": 1188} {"train_loss": -22.09235954284668, "global_step": 98651, "epoch": 1188} {"train_loss": -21.744348526000977, "global_step": 98652, "epoch": 1188} {"train_loss": -21.208635330200195, "global_step": 98653, "epoch": 1188} {"train_loss": -21.876022338867188, "global_step": 98654, "epoch": 1188} {"train_loss": -21.41338539123535, "global_step": 98655, "epoch": 1188} {"train_loss": -21.497905731201172, "global_step": 98656, "epoch": 1188} {"train_loss": -22.0178279876709, "global_step": 98657, "epoch": 1188} {"train_loss": -22.083242416381836, "global_step": 98658, "epoch": 1188} {"train_loss": -21.966501235961914, "global_step": 98659, "epoch": 1188} {"train_loss": -21.783021926879883, "global_step": 98660, "epoch": 1188} {"train_loss": -21.813024520874023, "global_step": 98661, "epoch": 1188} {"train_loss": -21.699186325073242, "global_step": 98662, "epoch": 1188} {"train_loss": -21.783533096313477, "global_step": 98663, "epoch": 1188} {"train_loss": -21.782211303710938, "global_step": 98664, "epoch": 1188} {"train_loss": -21.729482650756836, "global_step": 98665, "epoch": 1188} {"train_loss": -22.019804000854492, "global_step": 98666, "epoch": 1188} {"train_loss": -21.903757095336914, "global_step": 98667, "epoch": 1188} {"train_loss": -21.977811813354492, "global_step": 98668, "epoch": 1188} {"train_loss": -21.963048934936523, "global_step": 98669, "epoch": 1188} {"train_loss": -21.6568660736084, "global_step": 98670, "epoch": 1188} {"train_loss": -21.790842056274414, "global_step": 98671, "epoch": 1188} {"train_loss": -21.79926109313965, "global_step": 98672, "epoch": 1188} {"train_loss": -21.878219604492188, "global_step": 98673, "epoch": 1188} {"train_loss": -21.972089767456055, "global_step": 98674, "epoch": 1188} {"train_loss": -22.037996292114258, "global_step": 98675, "epoch": 1188} {"train_loss": -21.738967895507812, "global_step": 98676, "epoch": 1188} {"train_loss": -21.81593894958496, "global_step": 98677, "epoch": 1188} {"train_loss": -21.929574966430664, "global_step": 98678, "epoch": 1188} {"train_loss": -22.092891693115234, "global_step": 98679, "epoch": 1188} {"train_loss": -21.765869140625, "global_step": 98680, "epoch": 1188} {"train_loss": -21.90351676940918, "global_step": 98681, "epoch": 1188} {"train_loss": -21.860626220703125, "global_step": 98682, "epoch": 1188} {"train_loss": -21.433086395263672, "global_step": 98683, "epoch": 1188} {"train_loss": -22.11604881286621, "global_step": 98684, "epoch": 1188} {"train_loss": -21.81243896484375, "global_step": 98685, "epoch": 1188} {"train_loss": -21.82567658481828, "global_step": 98686, "epoch": 1188, "val_loss": 5973031.0} {"train_loss": -21.350440979003906, "global_step": 98687, "epoch": 1189} {"train_loss": -21.671485900878906, "global_step": 98688, "epoch": 1189} {"train_loss": -21.359943389892578, "global_step": 98689, "epoch": 1189} {"train_loss": -21.783695220947266, "global_step": 98690, "epoch": 1189} {"train_loss": -21.468097686767578, "global_step": 98691, "epoch": 1189} {"train_loss": -21.51893424987793, "global_step": 98692, "epoch": 1189} {"train_loss": -21.498519897460938, "global_step": 98693, "epoch": 1189} {"train_loss": -21.724077224731445, "global_step": 98694, "epoch": 1189} {"train_loss": -21.5861759185791, "global_step": 98695, "epoch": 1189} {"train_loss": -21.326696395874023, "global_step": 98696, "epoch": 1189} {"train_loss": -21.712060928344727, "global_step": 98697, "epoch": 1189} {"train_loss": -21.73528289794922, "global_step": 98698, "epoch": 1189} {"train_loss": -22.042110443115234, "global_step": 98699, "epoch": 1189} {"train_loss": -21.99765396118164, "global_step": 98700, "epoch": 1189} {"train_loss": -21.4776611328125, "global_step": 98701, "epoch": 1189} {"train_loss": -21.725521087646484, "global_step": 98702, "epoch": 1189} {"train_loss": -21.354724884033203, "global_step": 98703, "epoch": 1189} {"train_loss": -21.945175170898438, "global_step": 98704, "epoch": 1189} {"train_loss": -22.135648727416992, "global_step": 98705, "epoch": 1189} {"train_loss": -21.299781799316406, "global_step": 98706, "epoch": 1189} {"train_loss": -21.94594383239746, "global_step": 98707, "epoch": 1189} {"train_loss": -21.686553955078125, "global_step": 98708, "epoch": 1189} {"train_loss": -21.64558982849121, "global_step": 98709, "epoch": 1189} {"train_loss": -21.833526611328125, "global_step": 98710, "epoch": 1189} {"train_loss": -21.61423683166504, "global_step": 98711, "epoch": 1189} {"train_loss": -21.56827163696289, "global_step": 98712, "epoch": 1189} {"train_loss": -21.906919479370117, "global_step": 98713, "epoch": 1189} {"train_loss": -22.02597999572754, "global_step": 98714, "epoch": 1189} {"train_loss": -21.7877254486084, "global_step": 98715, "epoch": 1189} {"train_loss": -21.858747482299805, "global_step": 98716, "epoch": 1189} {"train_loss": -21.778736114501953, "global_step": 98717, "epoch": 1189} {"train_loss": -21.790494918823242, "global_step": 98718, "epoch": 1189} {"train_loss": -22.068178176879883, "global_step": 98719, "epoch": 1189} {"train_loss": -21.63888931274414, "global_step": 98720, "epoch": 1189} {"train_loss": -22.06508445739746, "global_step": 98721, "epoch": 1189} {"train_loss": -21.557973861694336, "global_step": 98722, "epoch": 1189} {"train_loss": -21.86176109313965, "global_step": 98723, "epoch": 1189} {"train_loss": -22.0245418548584, "global_step": 98724, "epoch": 1189} {"train_loss": -21.756103515625, "global_step": 98725, "epoch": 1189} {"train_loss": -21.524137496948242, "global_step": 98726, "epoch": 1189} {"train_loss": -21.540632247924805, "global_step": 98727, "epoch": 1189} {"train_loss": -21.41242027282715, "global_step": 98728, "epoch": 1189} {"train_loss": -22.04570960998535, "global_step": 98729, "epoch": 1189} {"train_loss": -21.75324249267578, "global_step": 98730, "epoch": 1189} {"train_loss": -21.913711547851562, "global_step": 98731, "epoch": 1189} {"train_loss": -21.786457061767578, "global_step": 98732, "epoch": 1189} {"train_loss": -21.963106155395508, "global_step": 98733, "epoch": 1189} {"train_loss": -21.907424926757812, "global_step": 98734, "epoch": 1189} {"train_loss": -22.048276901245117, "global_step": 98735, "epoch": 1189} {"train_loss": -21.632179260253906, "global_step": 98736, "epoch": 1189} {"train_loss": -22.082210540771484, "global_step": 98737, "epoch": 1189} {"train_loss": -21.820371627807617, "global_step": 98738, "epoch": 1189} {"train_loss": -22.051668167114258, "global_step": 98739, "epoch": 1189} {"train_loss": -22.400466918945312, "global_step": 98740, "epoch": 1189} {"train_loss": -21.977590560913086, "global_step": 98741, "epoch": 1189} {"train_loss": -21.59964942932129, "global_step": 98742, "epoch": 1189} {"train_loss": -22.08998680114746, "global_step": 98743, "epoch": 1189} {"train_loss": -21.623088836669922, "global_step": 98744, "epoch": 1189} {"train_loss": -21.78290367126465, "global_step": 98745, "epoch": 1189} {"train_loss": -21.665189743041992, "global_step": 98746, "epoch": 1189} {"train_loss": -22.01655387878418, "global_step": 98747, "epoch": 1189} {"train_loss": -21.560443878173828, "global_step": 98748, "epoch": 1189} {"train_loss": -21.978796005249023, "global_step": 98749, "epoch": 1189} {"train_loss": -21.92780876159668, "global_step": 98750, "epoch": 1189} {"train_loss": -21.95404624938965, "global_step": 98751, "epoch": 1189} {"train_loss": -21.820554733276367, "global_step": 98752, "epoch": 1189} {"train_loss": -22.07477569580078, "global_step": 98753, "epoch": 1189} {"train_loss": -21.91971206665039, "global_step": 98754, "epoch": 1189} {"train_loss": -21.951385498046875, "global_step": 98755, "epoch": 1189} {"train_loss": -22.139188766479492, "global_step": 98756, "epoch": 1189} {"train_loss": -21.728281021118164, "global_step": 98757, "epoch": 1189} {"train_loss": -21.975980758666992, "global_step": 98758, "epoch": 1189} {"train_loss": -22.09096336364746, "global_step": 98759, "epoch": 1189} {"train_loss": -22.064481735229492, "global_step": 98760, "epoch": 1189} {"train_loss": -22.13910484313965, "global_step": 98761, "epoch": 1189} {"train_loss": -22.052505493164062, "global_step": 98762, "epoch": 1189} {"train_loss": -22.033859252929688, "global_step": 98763, "epoch": 1189} {"train_loss": -21.850509643554688, "global_step": 98764, "epoch": 1189} {"train_loss": -21.559022903442383, "global_step": 98765, "epoch": 1189} {"train_loss": -22.13585090637207, "global_step": 98766, "epoch": 1189} {"train_loss": -22.105825424194336, "global_step": 98767, "epoch": 1189} {"train_loss": -21.617870330810547, "global_step": 98768, "epoch": 1189} {"train_loss": -21.786906920283673, "global_step": 98769, "epoch": 1189, "val_loss": 6217238.0} {"train_loss": -21.730690002441406, "global_step": 98770, "epoch": 1190} {"train_loss": -21.77562141418457, "global_step": 98771, "epoch": 1190} {"train_loss": -21.84932518005371, "global_step": 98772, "epoch": 1190} {"train_loss": -21.6505184173584, "global_step": 98773, "epoch": 1190} {"train_loss": -21.640674591064453, "global_step": 98774, "epoch": 1190} {"train_loss": -21.744190216064453, "global_step": 98775, "epoch": 1190} {"train_loss": -21.627490997314453, "global_step": 98776, "epoch": 1190} {"train_loss": -21.475088119506836, "global_step": 98777, "epoch": 1190} {"train_loss": -21.903446197509766, "global_step": 98778, "epoch": 1190} {"train_loss": -21.588388442993164, "global_step": 98779, "epoch": 1190} {"train_loss": -21.519987106323242, "global_step": 98780, "epoch": 1190} {"train_loss": -21.643903732299805, "global_step": 98781, "epoch": 1190} {"train_loss": -21.728052139282227, "global_step": 98782, "epoch": 1190} {"train_loss": -22.019058227539062, "global_step": 98783, "epoch": 1190} {"train_loss": -21.8076229095459, "global_step": 98784, "epoch": 1190} {"train_loss": -21.761947631835938, "global_step": 98785, "epoch": 1190} {"train_loss": -21.985668182373047, "global_step": 98786, "epoch": 1190} {"train_loss": -22.393659591674805, "global_step": 98787, "epoch": 1190} {"train_loss": -22.01816177368164, "global_step": 98788, "epoch": 1190} {"train_loss": -21.871557235717773, "global_step": 98789, "epoch": 1190} {"train_loss": -22.042749404907227, "global_step": 98790, "epoch": 1190} {"train_loss": -21.86813735961914, "global_step": 98791, "epoch": 1190} {"train_loss": -21.90516471862793, "global_step": 98792, "epoch": 1190} {"train_loss": -21.848249435424805, "global_step": 98793, "epoch": 1190} {"train_loss": -21.945371627807617, "global_step": 98794, "epoch": 1190} {"train_loss": -21.956560134887695, "global_step": 98795, "epoch": 1190} {"train_loss": -22.00628089904785, "global_step": 98796, "epoch": 1190} {"train_loss": -21.88448715209961, "global_step": 98797, "epoch": 1190} {"train_loss": -21.96738052368164, "global_step": 98798, "epoch": 1190} {"train_loss": -22.12308692932129, "global_step": 98799, "epoch": 1190} {"train_loss": -22.063016891479492, "global_step": 98800, "epoch": 1190} {"train_loss": -21.964948654174805, "global_step": 98801, "epoch": 1190} {"train_loss": -22.08674430847168, "global_step": 98802, "epoch": 1190} {"train_loss": -21.8095645904541, "global_step": 98803, "epoch": 1190} {"train_loss": -21.992170333862305, "global_step": 98804, "epoch": 1190} {"train_loss": -22.11958885192871, "global_step": 98805, "epoch": 1190} {"train_loss": -21.871158599853516, "global_step": 98806, "epoch": 1190} {"train_loss": -22.3234920501709, "global_step": 98807, "epoch": 1190} {"train_loss": -22.28043556213379, "global_step": 98808, "epoch": 1190} {"train_loss": -22.13783073425293, "global_step": 98809, "epoch": 1190} {"train_loss": -22.10138702392578, "global_step": 98810, "epoch": 1190} {"train_loss": -21.76791763305664, "global_step": 98811, "epoch": 1190} {"train_loss": -21.692235946655273, "global_step": 98812, "epoch": 1190} {"train_loss": -21.48847007751465, "global_step": 98813, "epoch": 1190} {"train_loss": -21.519184112548828, "global_step": 98814, "epoch": 1190} {"train_loss": -21.7919864654541, "global_step": 98815, "epoch": 1190} {"train_loss": -22.046903610229492, "global_step": 98816, "epoch": 1190} {"train_loss": -21.794429779052734, "global_step": 98817, "epoch": 1190} {"train_loss": -21.19960594177246, "global_step": 98818, "epoch": 1190} {"train_loss": -21.92830467224121, "global_step": 98819, "epoch": 1190} {"train_loss": -21.593698501586914, "global_step": 98820, "epoch": 1190} {"train_loss": -21.664627075195312, "global_step": 98821, "epoch": 1190} {"train_loss": -22.002634048461914, "global_step": 98822, "epoch": 1190} {"train_loss": -22.00299644470215, "global_step": 98823, "epoch": 1190} {"train_loss": -22.09710693359375, "global_step": 98824, "epoch": 1190} {"train_loss": -22.4068660736084, "global_step": 98825, "epoch": 1190} {"train_loss": -22.081344604492188, "global_step": 98826, "epoch": 1190} {"train_loss": -21.62013816833496, "global_step": 98827, "epoch": 1190} {"train_loss": -22.0568904876709, "global_step": 98828, "epoch": 1190} {"train_loss": -21.9713191986084, "global_step": 98829, "epoch": 1190} {"train_loss": -21.734622955322266, "global_step": 98830, "epoch": 1190} {"train_loss": -21.925386428833008, "global_step": 98831, "epoch": 1190} {"train_loss": -21.756528854370117, "global_step": 98832, "epoch": 1190} {"train_loss": -22.091262817382812, "global_step": 98833, "epoch": 1190} {"train_loss": -22.147005081176758, "global_step": 98834, "epoch": 1190} {"train_loss": -22.115694046020508, "global_step": 98835, "epoch": 1190} {"train_loss": -22.23603630065918, "global_step": 98836, "epoch": 1190} {"train_loss": -22.215274810791016, "global_step": 98837, "epoch": 1190} {"train_loss": -21.94167709350586, "global_step": 98838, "epoch": 1190} {"train_loss": -21.871004104614258, "global_step": 98839, "epoch": 1190} {"train_loss": -21.740955352783203, "global_step": 98840, "epoch": 1190} {"train_loss": -22.015954971313477, "global_step": 98841, "epoch": 1190} {"train_loss": -21.680158615112305, "global_step": 98842, "epoch": 1190} {"train_loss": -22.10854148864746, "global_step": 98843, "epoch": 1190} {"train_loss": -22.008989334106445, "global_step": 98844, "epoch": 1190} {"train_loss": -21.962173461914062, "global_step": 98845, "epoch": 1190} {"train_loss": -21.929275512695312, "global_step": 98846, "epoch": 1190} {"train_loss": -22.084400177001953, "global_step": 98847, "epoch": 1190} {"train_loss": -21.980281829833984, "global_step": 98848, "epoch": 1190} {"train_loss": -21.68653678894043, "global_step": 98849, "epoch": 1190} {"train_loss": -22.000417709350586, "global_step": 98850, "epoch": 1190} {"train_loss": -22.08514976501465, "global_step": 98851, "epoch": 1190} {"train_loss": -21.88207908998053, "global_step": 98852, "epoch": 1190, "val_loss": 6153791.5} {"train_loss": -22.015792846679688, "global_step": 98853, "epoch": 1191} {"train_loss": -21.530963897705078, "global_step": 98854, "epoch": 1191} {"train_loss": -21.85746955871582, "global_step": 98855, "epoch": 1191} {"train_loss": -21.17243194580078, "global_step": 98856, "epoch": 1191} {"train_loss": -21.742856979370117, "global_step": 98857, "epoch": 1191} {"train_loss": -21.286457061767578, "global_step": 98858, "epoch": 1191} {"train_loss": -21.711483001708984, "global_step": 98859, "epoch": 1191} {"train_loss": -21.92366600036621, "global_step": 98860, "epoch": 1191} {"train_loss": -21.291156768798828, "global_step": 98861, "epoch": 1191} {"train_loss": -21.741905212402344, "global_step": 98862, "epoch": 1191} {"train_loss": -21.69041633605957, "global_step": 98863, "epoch": 1191} {"train_loss": -21.702411651611328, "global_step": 98864, "epoch": 1191} {"train_loss": -21.549713134765625, "global_step": 98865, "epoch": 1191} {"train_loss": -21.979663848876953, "global_step": 98866, "epoch": 1191} {"train_loss": -21.690458297729492, "global_step": 98867, "epoch": 1191} {"train_loss": -21.693937301635742, "global_step": 98868, "epoch": 1191} {"train_loss": -21.886075973510742, "global_step": 98869, "epoch": 1191} {"train_loss": -21.88878631591797, "global_step": 98870, "epoch": 1191} {"train_loss": -21.98334312438965, "global_step": 98871, "epoch": 1191} {"train_loss": -21.590383529663086, "global_step": 98872, "epoch": 1191} {"train_loss": -21.55634117126465, "global_step": 98873, "epoch": 1191} {"train_loss": -21.690759658813477, "global_step": 98874, "epoch": 1191} {"train_loss": -21.950178146362305, "global_step": 98875, "epoch": 1191} {"train_loss": -22.11418342590332, "global_step": 98876, "epoch": 1191} {"train_loss": -21.642507553100586, "global_step": 98877, "epoch": 1191} {"train_loss": -21.68715476989746, "global_step": 98878, "epoch": 1191} {"train_loss": -21.86390495300293, "global_step": 98879, "epoch": 1191} {"train_loss": -21.677879333496094, "global_step": 98880, "epoch": 1191} {"train_loss": -22.116960525512695, "global_step": 98881, "epoch": 1191} {"train_loss": -21.51770782470703, "global_step": 98882, "epoch": 1191} {"train_loss": -22.06770896911621, "global_step": 98883, "epoch": 1191} {"train_loss": -21.911405563354492, "global_step": 98884, "epoch": 1191} {"train_loss": -21.951601028442383, "global_step": 98885, "epoch": 1191} {"train_loss": -21.403539657592773, "global_step": 98886, "epoch": 1191} {"train_loss": -21.970508575439453, "global_step": 98887, "epoch": 1191} {"train_loss": -21.599489212036133, "global_step": 98888, "epoch": 1191} {"train_loss": -21.821626663208008, "global_step": 98889, "epoch": 1191} {"train_loss": -22.092233657836914, "global_step": 98890, "epoch": 1191} {"train_loss": -21.94866371154785, "global_step": 98891, "epoch": 1191} {"train_loss": -22.138118743896484, "global_step": 98892, "epoch": 1191} {"train_loss": -22.114757537841797, "global_step": 98893, "epoch": 1191} {"train_loss": -21.725543975830078, "global_step": 98894, "epoch": 1191} {"train_loss": -21.8874454498291, "global_step": 98895, "epoch": 1191} {"train_loss": -22.1901912689209, "global_step": 98896, "epoch": 1191} {"train_loss": -22.156604766845703, "global_step": 98897, "epoch": 1191} {"train_loss": -22.220563888549805, "global_step": 98898, "epoch": 1191} {"train_loss": -21.549482345581055, "global_step": 98899, "epoch": 1191} {"train_loss": -21.93553352355957, "global_step": 98900, "epoch": 1191} {"train_loss": -22.06430435180664, "global_step": 98901, "epoch": 1191} {"train_loss": -22.334583282470703, "global_step": 98902, "epoch": 1191} {"train_loss": -21.505910873413086, "global_step": 98903, "epoch": 1191} {"train_loss": -22.175399780273438, "global_step": 98904, "epoch": 1191} {"train_loss": -21.785940170288086, "global_step": 98905, "epoch": 1191} {"train_loss": -21.961580276489258, "global_step": 98906, "epoch": 1191} {"train_loss": -21.5891170501709, "global_step": 98907, "epoch": 1191} {"train_loss": -21.7167911529541, "global_step": 98908, "epoch": 1191} {"train_loss": -22.151098251342773, "global_step": 98909, "epoch": 1191} {"train_loss": -21.774600982666016, "global_step": 98910, "epoch": 1191} {"train_loss": -21.771562576293945, "global_step": 98911, "epoch": 1191} {"train_loss": -21.58578872680664, "global_step": 98912, "epoch": 1191} {"train_loss": -21.67814826965332, "global_step": 98913, "epoch": 1191} {"train_loss": -21.90662384033203, "global_step": 98914, "epoch": 1191} {"train_loss": -22.165605545043945, "global_step": 98915, "epoch": 1191} {"train_loss": -22.012531280517578, "global_step": 98916, "epoch": 1191} {"train_loss": -21.563047409057617, "global_step": 98917, "epoch": 1191} {"train_loss": -21.533832550048828, "global_step": 98918, "epoch": 1191} {"train_loss": -21.97884178161621, "global_step": 98919, "epoch": 1191} {"train_loss": -22.155149459838867, "global_step": 98920, "epoch": 1191} {"train_loss": -21.809656143188477, "global_step": 98921, "epoch": 1191} {"train_loss": -22.277002334594727, "global_step": 98922, "epoch": 1191} {"train_loss": -21.668643951416016, "global_step": 98923, "epoch": 1191} {"train_loss": -22.307504653930664, "global_step": 98924, "epoch": 1191} {"train_loss": -21.84275245666504, "global_step": 98925, "epoch": 1191} {"train_loss": -22.271886825561523, "global_step": 98926, "epoch": 1191} {"train_loss": -22.064725875854492, "global_step": 98927, "epoch": 1191} {"train_loss": -21.919355392456055, "global_step": 98928, "epoch": 1191} {"train_loss": -21.813718795776367, "global_step": 98929, "epoch": 1191} {"train_loss": -21.92841911315918, "global_step": 98930, "epoch": 1191} {"train_loss": -22.19830894470215, "global_step": 98931, "epoch": 1191} {"train_loss": -21.976160049438477, "global_step": 98932, "epoch": 1191} {"train_loss": -22.049142837524414, "global_step": 98933, "epoch": 1191} {"train_loss": -22.034440994262695, "global_step": 98934, "epoch": 1191} {"train_loss": -21.85020798372935, "global_step": 98935, "epoch": 1191, "val_loss": 6099036.0} {"train_loss": -20.862430572509766, "global_step": 98936, "epoch": 1192} {"train_loss": -21.304018020629883, "global_step": 98937, "epoch": 1192} {"train_loss": -21.3425350189209, "global_step": 98938, "epoch": 1192} {"train_loss": -21.351978302001953, "global_step": 98939, "epoch": 1192} {"train_loss": -21.604293823242188, "global_step": 98940, "epoch": 1192} {"train_loss": -21.539533615112305, "global_step": 98941, "epoch": 1192} {"train_loss": -21.926788330078125, "global_step": 98942, "epoch": 1192} {"train_loss": -21.46687126159668, "global_step": 98943, "epoch": 1192} {"train_loss": -21.480350494384766, "global_step": 98944, "epoch": 1192} {"train_loss": -21.726703643798828, "global_step": 98945, "epoch": 1192} {"train_loss": -21.18885040283203, "global_step": 98946, "epoch": 1192} {"train_loss": -21.34340476989746, "global_step": 98947, "epoch": 1192} {"train_loss": -21.591650009155273, "global_step": 98948, "epoch": 1192} {"train_loss": -21.178022384643555, "global_step": 98949, "epoch": 1192} {"train_loss": -21.326885223388672, "global_step": 98950, "epoch": 1192} {"train_loss": -21.874197006225586, "global_step": 98951, "epoch": 1192} {"train_loss": -21.413747787475586, "global_step": 98952, "epoch": 1192} {"train_loss": -21.702451705932617, "global_step": 98953, "epoch": 1192} {"train_loss": -22.10648536682129, "global_step": 98954, "epoch": 1192} {"train_loss": -21.714492797851562, "global_step": 98955, "epoch": 1192} {"train_loss": -22.132572174072266, "global_step": 98956, "epoch": 1192} {"train_loss": -21.846311569213867, "global_step": 98957, "epoch": 1192} {"train_loss": -21.83233070373535, "global_step": 98958, "epoch": 1192} {"train_loss": -21.85558319091797, "global_step": 98959, "epoch": 1192} {"train_loss": -22.112892150878906, "global_step": 98960, "epoch": 1192} {"train_loss": -22.2268009185791, "global_step": 98961, "epoch": 1192} {"train_loss": -21.54067039489746, "global_step": 98962, "epoch": 1192} {"train_loss": -21.996755599975586, "global_step": 98963, "epoch": 1192} {"train_loss": -21.938718795776367, "global_step": 98964, "epoch": 1192} {"train_loss": -21.862714767456055, "global_step": 98965, "epoch": 1192} {"train_loss": -22.035924911499023, "global_step": 98966, "epoch": 1192} {"train_loss": -21.941205978393555, "global_step": 98967, "epoch": 1192} {"train_loss": -21.776914596557617, "global_step": 98968, "epoch": 1192} {"train_loss": -22.17006492614746, "global_step": 98969, "epoch": 1192} {"train_loss": -22.15481185913086, "global_step": 98970, "epoch": 1192} {"train_loss": -22.245769500732422, "global_step": 98971, "epoch": 1192} {"train_loss": -21.782209396362305, "global_step": 98972, "epoch": 1192} {"train_loss": -21.58528709411621, "global_step": 98973, "epoch": 1192} {"train_loss": -21.49575424194336, "global_step": 98974, "epoch": 1192} {"train_loss": -21.959903717041016, "global_step": 98975, "epoch": 1192} {"train_loss": -21.733545303344727, "global_step": 98976, "epoch": 1192} {"train_loss": -21.896207809448242, "global_step": 98977, "epoch": 1192} {"train_loss": -21.851877212524414, "global_step": 98978, "epoch": 1192} {"train_loss": -21.993581771850586, "global_step": 98979, "epoch": 1192} {"train_loss": -21.921072006225586, "global_step": 98980, "epoch": 1192} {"train_loss": -21.762962341308594, "global_step": 98981, "epoch": 1192} {"train_loss": -21.930143356323242, "global_step": 98982, "epoch": 1192} {"train_loss": -21.861783981323242, "global_step": 98983, "epoch": 1192} {"train_loss": -22.01503562927246, "global_step": 98984, "epoch": 1192} {"train_loss": -21.70442771911621, "global_step": 98985, "epoch": 1192} {"train_loss": -21.95102882385254, "global_step": 98986, "epoch": 1192} {"train_loss": -21.55976676940918, "global_step": 98987, "epoch": 1192} {"train_loss": -22.21829605102539, "global_step": 98988, "epoch": 1192} {"train_loss": -21.679141998291016, "global_step": 98989, "epoch": 1192} {"train_loss": -21.892332077026367, "global_step": 98990, "epoch": 1192} {"train_loss": -21.802331924438477, "global_step": 98991, "epoch": 1192} {"train_loss": -21.894102096557617, "global_step": 98992, "epoch": 1192} {"train_loss": -21.73282814025879, "global_step": 98993, "epoch": 1192} {"train_loss": -21.847393035888672, "global_step": 98994, "epoch": 1192} {"train_loss": -22.101348876953125, "global_step": 98995, "epoch": 1192} {"train_loss": -21.998308181762695, "global_step": 98996, "epoch": 1192} {"train_loss": -22.167728424072266, "global_step": 98997, "epoch": 1192} {"train_loss": -22.027067184448242, "global_step": 98998, "epoch": 1192} {"train_loss": -21.841764450073242, "global_step": 98999, "epoch": 1192} {"train_loss": -21.782026290893555, "global_step": 99000, "epoch": 1192} {"train_loss": -21.912540435791016, "global_step": 99001, "epoch": 1192} {"train_loss": -21.75718116760254, "global_step": 99002, "epoch": 1192} {"train_loss": -21.724319458007812, "global_step": 99003, "epoch": 1192} {"train_loss": -21.776559829711914, "global_step": 99004, "epoch": 1192} {"train_loss": -21.994293212890625, "global_step": 99005, "epoch": 1192} {"train_loss": -22.01980972290039, "global_step": 99006, "epoch": 1192} {"train_loss": -22.08380126953125, "global_step": 99007, "epoch": 1192} {"train_loss": -22.022993087768555, "global_step": 99008, "epoch": 1192} {"train_loss": -22.143728256225586, "global_step": 99009, "epoch": 1192} {"train_loss": -22.076618194580078, "global_step": 99010, "epoch": 1192} {"train_loss": -21.979129791259766, "global_step": 99011, "epoch": 1192} {"train_loss": -21.83098793029785, "global_step": 99012, "epoch": 1192} {"train_loss": -21.973134994506836, "global_step": 99013, "epoch": 1192} {"train_loss": -22.061416625976562, "global_step": 99014, "epoch": 1192} {"train_loss": -21.95599365234375, "global_step": 99015, "epoch": 1192} {"train_loss": -22.261371612548828, "global_step": 99016, "epoch": 1192} {"train_loss": -22.074769973754883, "global_step": 99017, "epoch": 1192} {"train_loss": -21.825994928199126, "global_step": 99018, "epoch": 1192, "val_loss": 6016393.0} {"train_loss": -21.486011505126953, "global_step": 99019, "epoch": 1193} {"train_loss": -21.05958366394043, "global_step": 99020, "epoch": 1193} {"train_loss": -21.347951889038086, "global_step": 99021, "epoch": 1193} {"train_loss": -21.76294708251953, "global_step": 99022, "epoch": 1193} {"train_loss": -21.700040817260742, "global_step": 99023, "epoch": 1193} {"train_loss": -21.9853515625, "global_step": 99024, "epoch": 1193} {"train_loss": -21.811100006103516, "global_step": 99025, "epoch": 1193} {"train_loss": -21.474044799804688, "global_step": 99026, "epoch": 1193} {"train_loss": -21.717655181884766, "global_step": 99027, "epoch": 1193} {"train_loss": -21.778818130493164, "global_step": 99028, "epoch": 1193} {"train_loss": -21.87075424194336, "global_step": 99029, "epoch": 1193} {"train_loss": -21.783740997314453, "global_step": 99030, "epoch": 1193} {"train_loss": -21.93168067932129, "global_step": 99031, "epoch": 1193} {"train_loss": -21.835285186767578, "global_step": 99032, "epoch": 1193} {"train_loss": -21.8010196685791, "global_step": 99033, "epoch": 1193} {"train_loss": -21.523488998413086, "global_step": 99034, "epoch": 1193} {"train_loss": -21.848316192626953, "global_step": 99035, "epoch": 1193} {"train_loss": -21.831012725830078, "global_step": 99036, "epoch": 1193} {"train_loss": -21.945568084716797, "global_step": 99037, "epoch": 1193} {"train_loss": -21.60957145690918, "global_step": 99038, "epoch": 1193} {"train_loss": -21.700485229492188, "global_step": 99039, "epoch": 1193} {"train_loss": -21.727575302124023, "global_step": 99040, "epoch": 1193} {"train_loss": -21.929794311523438, "global_step": 99041, "epoch": 1193} {"train_loss": -21.84870147705078, "global_step": 99042, "epoch": 1193} {"train_loss": -21.778671264648438, "global_step": 99043, "epoch": 1193} {"train_loss": -21.47116470336914, "global_step": 99044, "epoch": 1193} {"train_loss": -21.81736183166504, "global_step": 99045, "epoch": 1193} {"train_loss": -21.611974716186523, "global_step": 99046, "epoch": 1193} {"train_loss": -21.909826278686523, "global_step": 99047, "epoch": 1193} {"train_loss": -22.294485092163086, "global_step": 99048, "epoch": 1193} {"train_loss": -21.82648468017578, "global_step": 99049, "epoch": 1193} {"train_loss": -21.927490234375, "global_step": 99050, "epoch": 1193} {"train_loss": -21.88751792907715, "global_step": 99051, "epoch": 1193} {"train_loss": -21.711780548095703, "global_step": 99052, "epoch": 1193} {"train_loss": -22.045095443725586, "global_step": 99053, "epoch": 1193} {"train_loss": -22.031818389892578, "global_step": 99054, "epoch": 1193} {"train_loss": -21.850244522094727, "global_step": 99055, "epoch": 1193} {"train_loss": -21.459775924682617, "global_step": 99056, "epoch": 1193} {"train_loss": -21.96059226989746, "global_step": 99057, "epoch": 1193} {"train_loss": -22.083942413330078, "global_step": 99058, "epoch": 1193} {"train_loss": -21.851110458374023, "global_step": 99059, "epoch": 1193} {"train_loss": -22.04474639892578, "global_step": 99060, "epoch": 1193} {"train_loss": -21.813182830810547, "global_step": 99061, "epoch": 1193} {"train_loss": -21.94695281982422, "global_step": 99062, "epoch": 1193} {"train_loss": -22.05255889892578, "global_step": 99063, "epoch": 1193} {"train_loss": -21.380277633666992, "global_step": 99064, "epoch": 1193} {"train_loss": -21.9919376373291, "global_step": 99065, "epoch": 1193} {"train_loss": -22.067676544189453, "global_step": 99066, "epoch": 1193} {"train_loss": -21.8299503326416, "global_step": 99067, "epoch": 1193} {"train_loss": -22.113101959228516, "global_step": 99068, "epoch": 1193} {"train_loss": -21.829145431518555, "global_step": 99069, "epoch": 1193} {"train_loss": -21.80594825744629, "global_step": 99070, "epoch": 1193} {"train_loss": -22.235885620117188, "global_step": 99071, "epoch": 1193} {"train_loss": -21.583484649658203, "global_step": 99072, "epoch": 1193} {"train_loss": -22.21167755126953, "global_step": 99073, "epoch": 1193} {"train_loss": -22.020002365112305, "global_step": 99074, "epoch": 1193} {"train_loss": -21.6303653717041, "global_step": 99075, "epoch": 1193} {"train_loss": -21.636730194091797, "global_step": 99076, "epoch": 1193} {"train_loss": -21.881515502929688, "global_step": 99077, "epoch": 1193} {"train_loss": -21.489286422729492, "global_step": 99078, "epoch": 1193} {"train_loss": -21.829587936401367, "global_step": 99079, "epoch": 1193} {"train_loss": -22.149127960205078, "global_step": 99080, "epoch": 1193} {"train_loss": -21.791868209838867, "global_step": 99081, "epoch": 1193} {"train_loss": -21.93317985534668, "global_step": 99082, "epoch": 1193} {"train_loss": -21.676645278930664, "global_step": 99083, "epoch": 1193} {"train_loss": -21.95844078063965, "global_step": 99084, "epoch": 1193} {"train_loss": -21.717397689819336, "global_step": 99085, "epoch": 1193} {"train_loss": -21.467870712280273, "global_step": 99086, "epoch": 1193} {"train_loss": -21.937524795532227, "global_step": 99087, "epoch": 1193} {"train_loss": -22.080238342285156, "global_step": 99088, "epoch": 1193} {"train_loss": -21.584266662597656, "global_step": 99089, "epoch": 1193} {"train_loss": -22.080123901367188, "global_step": 99090, "epoch": 1193} {"train_loss": -22.043964385986328, "global_step": 99091, "epoch": 1193} {"train_loss": -21.91680908203125, "global_step": 99092, "epoch": 1193} {"train_loss": -21.85248374938965, "global_step": 99093, "epoch": 1193} {"train_loss": -21.686519622802734, "global_step": 99094, "epoch": 1193} {"train_loss": -21.889158248901367, "global_step": 99095, "epoch": 1193} {"train_loss": -22.024402618408203, "global_step": 99096, "epoch": 1193} {"train_loss": -21.74440574645996, "global_step": 99097, "epoch": 1193} {"train_loss": -21.76936912536621, "global_step": 99098, "epoch": 1193} {"train_loss": -21.887022018432617, "global_step": 99099, "epoch": 1193} {"train_loss": -22.087499618530273, "global_step": 99100, "epoch": 1193} {"train_loss": -21.818827502698785, "global_step": 99101, "epoch": 1193, "val_loss": 6220317.0} {"train_loss": -21.453397750854492, "global_step": 99102, "epoch": 1194} {"train_loss": -21.884592056274414, "global_step": 99103, "epoch": 1194} {"train_loss": -21.412982940673828, "global_step": 99104, "epoch": 1194} {"train_loss": -21.936349868774414, "global_step": 99105, "epoch": 1194} {"train_loss": -21.361955642700195, "global_step": 99106, "epoch": 1194} {"train_loss": -21.860700607299805, "global_step": 99107, "epoch": 1194} {"train_loss": -21.521892547607422, "global_step": 99108, "epoch": 1194} {"train_loss": -22.042802810668945, "global_step": 99109, "epoch": 1194} {"train_loss": -21.949106216430664, "global_step": 99110, "epoch": 1194} {"train_loss": -22.213293075561523, "global_step": 99111, "epoch": 1194} {"train_loss": -21.699979782104492, "global_step": 99112, "epoch": 1194} {"train_loss": -21.86380958557129, "global_step": 99113, "epoch": 1194} {"train_loss": -21.017732620239258, "global_step": 99114, "epoch": 1194} {"train_loss": -21.526111602783203, "global_step": 99115, "epoch": 1194} {"train_loss": -21.676313400268555, "global_step": 99116, "epoch": 1194} {"train_loss": -21.771686553955078, "global_step": 99117, "epoch": 1194} {"train_loss": -21.669086456298828, "global_step": 99118, "epoch": 1194} {"train_loss": -21.928550720214844, "global_step": 99119, "epoch": 1194} {"train_loss": -21.689420700073242, "global_step": 99120, "epoch": 1194} {"train_loss": -21.634496688842773, "global_step": 99121, "epoch": 1194} {"train_loss": -22.11909294128418, "global_step": 99122, "epoch": 1194} {"train_loss": -22.03782081604004, "global_step": 99123, "epoch": 1194} {"train_loss": -22.001876831054688, "global_step": 99124, "epoch": 1194} {"train_loss": -22.129602432250977, "global_step": 99125, "epoch": 1194} {"train_loss": -21.90555763244629, "global_step": 99126, "epoch": 1194} {"train_loss": -21.97041130065918, "global_step": 99127, "epoch": 1194} {"train_loss": -22.03084945678711, "global_step": 99128, "epoch": 1194} {"train_loss": -22.148550033569336, "global_step": 99129, "epoch": 1194} {"train_loss": -21.82752799987793, "global_step": 99130, "epoch": 1194} {"train_loss": -21.968591690063477, "global_step": 99131, "epoch": 1194} {"train_loss": -22.140060424804688, "global_step": 99132, "epoch": 1194} {"train_loss": -21.65172576904297, "global_step": 99133, "epoch": 1194} {"train_loss": -21.990705490112305, "global_step": 99134, "epoch": 1194} {"train_loss": -22.035139083862305, "global_step": 99135, "epoch": 1194} {"train_loss": -21.767810821533203, "global_step": 99136, "epoch": 1194} {"train_loss": -21.787519454956055, "global_step": 99137, "epoch": 1194} {"train_loss": -21.62169075012207, "global_step": 99138, "epoch": 1194} {"train_loss": -21.94072723388672, "global_step": 99139, "epoch": 1194} {"train_loss": -21.897607803344727, "global_step": 99140, "epoch": 1194} {"train_loss": -21.659849166870117, "global_step": 99141, "epoch": 1194} {"train_loss": -21.87775993347168, "global_step": 99142, "epoch": 1194} {"train_loss": -21.945274353027344, "global_step": 99143, "epoch": 1194} {"train_loss": -21.931705474853516, "global_step": 99144, "epoch": 1194} {"train_loss": -21.866846084594727, "global_step": 99145, "epoch": 1194} {"train_loss": -21.851675033569336, "global_step": 99146, "epoch": 1194} {"train_loss": -21.598007202148438, "global_step": 99147, "epoch": 1194} {"train_loss": -22.361021041870117, "global_step": 99148, "epoch": 1194} {"train_loss": -22.063573837280273, "global_step": 99149, "epoch": 1194} {"train_loss": -21.958566665649414, "global_step": 99150, "epoch": 1194} {"train_loss": -21.894472122192383, "global_step": 99151, "epoch": 1194} {"train_loss": -21.204177856445312, "global_step": 99152, "epoch": 1194} {"train_loss": -21.95731544494629, "global_step": 99153, "epoch": 1194} {"train_loss": -21.791255950927734, "global_step": 99154, "epoch": 1194} {"train_loss": -21.885955810546875, "global_step": 99155, "epoch": 1194} {"train_loss": -21.388208389282227, "global_step": 99156, "epoch": 1194} {"train_loss": -22.024391174316406, "global_step": 99157, "epoch": 1194} {"train_loss": -21.500141143798828, "global_step": 99158, "epoch": 1194} {"train_loss": -22.05472755432129, "global_step": 99159, "epoch": 1194} {"train_loss": -21.435596466064453, "global_step": 99160, "epoch": 1194} {"train_loss": -22.325109481811523, "global_step": 99161, "epoch": 1194} {"train_loss": -21.719131469726562, "global_step": 99162, "epoch": 1194} {"train_loss": -21.672903060913086, "global_step": 99163, "epoch": 1194} {"train_loss": -21.954927444458008, "global_step": 99164, "epoch": 1194} {"train_loss": -21.762006759643555, "global_step": 99165, "epoch": 1194} {"train_loss": -21.995731353759766, "global_step": 99166, "epoch": 1194} {"train_loss": -22.147436141967773, "global_step": 99167, "epoch": 1194} {"train_loss": -21.839826583862305, "global_step": 99168, "epoch": 1194} {"train_loss": -22.199445724487305, "global_step": 99169, "epoch": 1194} {"train_loss": -21.896162033081055, "global_step": 99170, "epoch": 1194} {"train_loss": -22.113128662109375, "global_step": 99171, "epoch": 1194} {"train_loss": -21.8295955657959, "global_step": 99172, "epoch": 1194} {"train_loss": -21.865842819213867, "global_step": 99173, "epoch": 1194} {"train_loss": -21.855941772460938, "global_step": 99174, "epoch": 1194} {"train_loss": -21.80673599243164, "global_step": 99175, "epoch": 1194} {"train_loss": -21.931640625, "global_step": 99176, "epoch": 1194} {"train_loss": -21.96986961364746, "global_step": 99177, "epoch": 1194} {"train_loss": -21.94878387451172, "global_step": 99178, "epoch": 1194} {"train_loss": -21.92873191833496, "global_step": 99179, "epoch": 1194} {"train_loss": -21.988027572631836, "global_step": 99180, "epoch": 1194} {"train_loss": -21.90021324157715, "global_step": 99181, "epoch": 1194} {"train_loss": -22.279678344726562, "global_step": 99182, "epoch": 1194} {"train_loss": -22.038455963134766, "global_step": 99183, "epoch": 1194} {"train_loss": -21.853475915380272, "global_step": 99184, "epoch": 1194, "val_loss": 6067646.0} {"train_loss": -21.454633712768555, "global_step": 99185, "epoch": 1195} {"train_loss": -21.872543334960938, "global_step": 99186, "epoch": 1195} {"train_loss": -21.751218795776367, "global_step": 99187, "epoch": 1195} {"train_loss": -21.4859619140625, "global_step": 99188, "epoch": 1195} {"train_loss": -21.83942985534668, "global_step": 99189, "epoch": 1195} {"train_loss": -21.565235137939453, "global_step": 99190, "epoch": 1195} {"train_loss": -21.953100204467773, "global_step": 99191, "epoch": 1195} {"train_loss": -22.28271484375, "global_step": 99192, "epoch": 1195} {"train_loss": -22.010046005249023, "global_step": 99193, "epoch": 1195} {"train_loss": -21.809200286865234, "global_step": 99194, "epoch": 1195} {"train_loss": -21.63178825378418, "global_step": 99195, "epoch": 1195} {"train_loss": -21.638145446777344, "global_step": 99196, "epoch": 1195} {"train_loss": -21.836332321166992, "global_step": 99197, "epoch": 1195} {"train_loss": -22.270231246948242, "global_step": 99198, "epoch": 1195} {"train_loss": -21.679441452026367, "global_step": 99199, "epoch": 1195} {"train_loss": -22.020963668823242, "global_step": 99200, "epoch": 1195} {"train_loss": -21.80282211303711, "global_step": 99201, "epoch": 1195} {"train_loss": -21.894468307495117, "global_step": 99202, "epoch": 1195} {"train_loss": -21.787630081176758, "global_step": 99203, "epoch": 1195} {"train_loss": -22.14436149597168, "global_step": 99204, "epoch": 1195} {"train_loss": -21.736448287963867, "global_step": 99205, "epoch": 1195} {"train_loss": -21.908361434936523, "global_step": 99206, "epoch": 1195} {"train_loss": -21.44993782043457, "global_step": 99207, "epoch": 1195} {"train_loss": -21.58255386352539, "global_step": 99208, "epoch": 1195} {"train_loss": -21.719038009643555, "global_step": 99209, "epoch": 1195} {"train_loss": -21.686880111694336, "global_step": 99210, "epoch": 1195} {"train_loss": -21.88838768005371, "global_step": 99211, "epoch": 1195} {"train_loss": -21.77924156188965, "global_step": 99212, "epoch": 1195} {"train_loss": -21.606298446655273, "global_step": 99213, "epoch": 1195} {"train_loss": -21.368072509765625, "global_step": 99214, "epoch": 1195} {"train_loss": -21.85231590270996, "global_step": 99215, "epoch": 1195} {"train_loss": -21.80021858215332, "global_step": 99216, "epoch": 1195} {"train_loss": -21.5859432220459, "global_step": 99217, "epoch": 1195} {"train_loss": -21.669260025024414, "global_step": 99218, "epoch": 1195} {"train_loss": -21.659757614135742, "global_step": 99219, "epoch": 1195} {"train_loss": -21.98375701904297, "global_step": 99220, "epoch": 1195} {"train_loss": -21.669981002807617, "global_step": 99221, "epoch": 1195} {"train_loss": -21.537145614624023, "global_step": 99222, "epoch": 1195} {"train_loss": -21.97894287109375, "global_step": 99223, "epoch": 1195} {"train_loss": -21.97354507446289, "global_step": 99224, "epoch": 1195} {"train_loss": -21.789554595947266, "global_step": 99225, "epoch": 1195} {"train_loss": -22.22694206237793, "global_step": 99226, "epoch": 1195} {"train_loss": -21.6777400970459, "global_step": 99227, "epoch": 1195} {"train_loss": -21.72798728942871, "global_step": 99228, "epoch": 1195} {"train_loss": -21.958860397338867, "global_step": 99229, "epoch": 1195} {"train_loss": -22.076595306396484, "global_step": 99230, "epoch": 1195} {"train_loss": -22.0384578704834, "global_step": 99231, "epoch": 1195} {"train_loss": -21.972700119018555, "global_step": 99232, "epoch": 1195} {"train_loss": -21.533689498901367, "global_step": 99233, "epoch": 1195} {"train_loss": -21.725101470947266, "global_step": 99234, "epoch": 1195} {"train_loss": -21.920562744140625, "global_step": 99235, "epoch": 1195} {"train_loss": -21.858121871948242, "global_step": 99236, "epoch": 1195} {"train_loss": -21.87112045288086, "global_step": 99237, "epoch": 1195} {"train_loss": -21.974838256835938, "global_step": 99238, "epoch": 1195} {"train_loss": -21.831233978271484, "global_step": 99239, "epoch": 1195} {"train_loss": -22.098112106323242, "global_step": 99240, "epoch": 1195} {"train_loss": -21.87190055847168, "global_step": 99241, "epoch": 1195} {"train_loss": -22.130359649658203, "global_step": 99242, "epoch": 1195} {"train_loss": -21.701017379760742, "global_step": 99243, "epoch": 1195} {"train_loss": -22.104219436645508, "global_step": 99244, "epoch": 1195} {"train_loss": -21.81780242919922, "global_step": 99245, "epoch": 1195} {"train_loss": -21.784818649291992, "global_step": 99246, "epoch": 1195} {"train_loss": -22.42060661315918, "global_step": 99247, "epoch": 1195} {"train_loss": -21.863296508789062, "global_step": 99248, "epoch": 1195} {"train_loss": -21.627187728881836, "global_step": 99249, "epoch": 1195} {"train_loss": -21.988636016845703, "global_step": 99250, "epoch": 1195} {"train_loss": -21.902433395385742, "global_step": 99251, "epoch": 1195} {"train_loss": -22.115049362182617, "global_step": 99252, "epoch": 1195} {"train_loss": -22.11745262145996, "global_step": 99253, "epoch": 1195} {"train_loss": -21.884122848510742, "global_step": 99254, "epoch": 1195} {"train_loss": -21.579273223876953, "global_step": 99255, "epoch": 1195} {"train_loss": -21.662546157836914, "global_step": 99256, "epoch": 1195} {"train_loss": -21.97088050842285, "global_step": 99257, "epoch": 1195} {"train_loss": -21.94508171081543, "global_step": 99258, "epoch": 1195} {"train_loss": -21.646100997924805, "global_step": 99259, "epoch": 1195} {"train_loss": -21.791257858276367, "global_step": 99260, "epoch": 1195} {"train_loss": -22.098602294921875, "global_step": 99261, "epoch": 1195} {"train_loss": -21.748998641967773, "global_step": 99262, "epoch": 1195} {"train_loss": -21.80085563659668, "global_step": 99263, "epoch": 1195} {"train_loss": -22.033376693725586, "global_step": 99264, "epoch": 1195} {"train_loss": -21.918378829956055, "global_step": 99265, "epoch": 1195} {"train_loss": -21.536203384399414, "global_step": 99266, "epoch": 1195} {"train_loss": -21.818632424595844, "global_step": 99267, "epoch": 1195, "val_loss": 6119854.0} {"train_loss": -19.50309181213379, "global_step": 99268, "epoch": 1196} {"train_loss": -21.1118221282959, "global_step": 99269, "epoch": 1196} {"train_loss": -20.30545425415039, "global_step": 99270, "epoch": 1196} {"train_loss": -21.393457412719727, "global_step": 99271, "epoch": 1196} {"train_loss": -20.871929168701172, "global_step": 99272, "epoch": 1196} {"train_loss": -21.029634475708008, "global_step": 99273, "epoch": 1196} {"train_loss": -21.200393676757812, "global_step": 99274, "epoch": 1196} {"train_loss": -21.16780662536621, "global_step": 99275, "epoch": 1196} {"train_loss": -20.971540451049805, "global_step": 99276, "epoch": 1196} {"train_loss": -21.505905151367188, "global_step": 99277, "epoch": 1196} {"train_loss": -20.912147521972656, "global_step": 99278, "epoch": 1196} {"train_loss": -21.304800033569336, "global_step": 99279, "epoch": 1196} {"train_loss": -20.96369743347168, "global_step": 99280, "epoch": 1196} {"train_loss": -21.519485473632812, "global_step": 99281, "epoch": 1196} {"train_loss": -21.306703567504883, "global_step": 99282, "epoch": 1196} {"train_loss": -21.315549850463867, "global_step": 99283, "epoch": 1196} {"train_loss": -21.40604591369629, "global_step": 99284, "epoch": 1196} {"train_loss": -21.400888442993164, "global_step": 99285, "epoch": 1196} {"train_loss": -21.756378173828125, "global_step": 99286, "epoch": 1196} {"train_loss": -21.65671730041504, "global_step": 99287, "epoch": 1196} {"train_loss": -21.727811813354492, "global_step": 99288, "epoch": 1196} {"train_loss": -21.7314395904541, "global_step": 99289, "epoch": 1196} {"train_loss": -21.53619956970215, "global_step": 99290, "epoch": 1196} {"train_loss": -22.102672576904297, "global_step": 99291, "epoch": 1196} {"train_loss": -21.696115493774414, "global_step": 99292, "epoch": 1196} {"train_loss": -21.821765899658203, "global_step": 99293, "epoch": 1196} {"train_loss": -21.40163803100586, "global_step": 99294, "epoch": 1196} {"train_loss": -21.634119033813477, "global_step": 99295, "epoch": 1196} {"train_loss": -22.008596420288086, "global_step": 99296, "epoch": 1196} {"train_loss": -21.811004638671875, "global_step": 99297, "epoch": 1196} {"train_loss": -21.921762466430664, "global_step": 99298, "epoch": 1196} {"train_loss": -21.8546085357666, "global_step": 99299, "epoch": 1196} {"train_loss": -22.00843620300293, "global_step": 99300, "epoch": 1196} {"train_loss": -21.74056053161621, "global_step": 99301, "epoch": 1196} {"train_loss": -21.891416549682617, "global_step": 99302, "epoch": 1196} {"train_loss": -21.81307029724121, "global_step": 99303, "epoch": 1196} {"train_loss": -21.611392974853516, "global_step": 99304, "epoch": 1196} {"train_loss": -21.741676330566406, "global_step": 99305, "epoch": 1196} {"train_loss": -21.847675323486328, "global_step": 99306, "epoch": 1196} {"train_loss": -21.617647171020508, "global_step": 99307, "epoch": 1196} {"train_loss": -22.09299087524414, "global_step": 99308, "epoch": 1196} {"train_loss": -21.78541374206543, "global_step": 99309, "epoch": 1196} {"train_loss": -22.272314071655273, "global_step": 99310, "epoch": 1196} {"train_loss": -21.565580368041992, "global_step": 99311, "epoch": 1196} {"train_loss": -21.91498374938965, "global_step": 99312, "epoch": 1196} {"train_loss": -22.068506240844727, "global_step": 99313, "epoch": 1196} {"train_loss": -22.251779556274414, "global_step": 99314, "epoch": 1196} {"train_loss": -21.817447662353516, "global_step": 99315, "epoch": 1196} {"train_loss": -22.02863121032715, "global_step": 99316, "epoch": 1196} {"train_loss": -21.629831314086914, "global_step": 99317, "epoch": 1196} {"train_loss": -21.607501983642578, "global_step": 99318, "epoch": 1196} {"train_loss": -22.224912643432617, "global_step": 99319, "epoch": 1196} {"train_loss": -21.748891830444336, "global_step": 99320, "epoch": 1196} {"train_loss": -22.077207565307617, "global_step": 99321, "epoch": 1196} {"train_loss": -21.737430572509766, "global_step": 99322, "epoch": 1196} {"train_loss": -21.625699996948242, "global_step": 99323, "epoch": 1196} {"train_loss": -21.68861198425293, "global_step": 99324, "epoch": 1196} {"train_loss": -21.970947265625, "global_step": 99325, "epoch": 1196} {"train_loss": -21.913511276245117, "global_step": 99326, "epoch": 1196} {"train_loss": -21.637630462646484, "global_step": 99327, "epoch": 1196} {"train_loss": -21.79221534729004, "global_step": 99328, "epoch": 1196} {"train_loss": -22.114091873168945, "global_step": 99329, "epoch": 1196} {"train_loss": -21.828838348388672, "global_step": 99330, "epoch": 1196} {"train_loss": -22.016706466674805, "global_step": 99331, "epoch": 1196} {"train_loss": -21.9189395904541, "global_step": 99332, "epoch": 1196} {"train_loss": -21.996801376342773, "global_step": 99333, "epoch": 1196} {"train_loss": -22.129270553588867, "global_step": 99334, "epoch": 1196} {"train_loss": -21.916589736938477, "global_step": 99335, "epoch": 1196} {"train_loss": -21.811059951782227, "global_step": 99336, "epoch": 1196} {"train_loss": -21.832128524780273, "global_step": 99337, "epoch": 1196} {"train_loss": -21.778263092041016, "global_step": 99338, "epoch": 1196} {"train_loss": -22.105514526367188, "global_step": 99339, "epoch": 1196} {"train_loss": -21.86556053161621, "global_step": 99340, "epoch": 1196} {"train_loss": -21.939849853515625, "global_step": 99341, "epoch": 1196} {"train_loss": -21.857709884643555, "global_step": 99342, "epoch": 1196} {"train_loss": -21.79508399963379, "global_step": 99343, "epoch": 1196} {"train_loss": -22.248228073120117, "global_step": 99344, "epoch": 1196} {"train_loss": -21.60646629333496, "global_step": 99345, "epoch": 1196} {"train_loss": -21.8190975189209, "global_step": 99346, "epoch": 1196} {"train_loss": -21.72772979736328, "global_step": 99347, "epoch": 1196} {"train_loss": -22.275222778320312, "global_step": 99348, "epoch": 1196} {"train_loss": -22.210729598999023, "global_step": 99349, "epoch": 1196} {"train_loss": -21.690151283539922, "global_step": 99350, "epoch": 1196, "val_loss": 6177962.0} {"train_loss": -21.068567276000977, "global_step": 99351, "epoch": 1197} {"train_loss": -21.442951202392578, "global_step": 99352, "epoch": 1197} {"train_loss": -21.749656677246094, "global_step": 99353, "epoch": 1197} {"train_loss": -21.34398651123047, "global_step": 99354, "epoch": 1197} {"train_loss": -21.179336547851562, "global_step": 99355, "epoch": 1197} {"train_loss": -21.46766471862793, "global_step": 99356, "epoch": 1197} {"train_loss": -21.462352752685547, "global_step": 99357, "epoch": 1197} {"train_loss": -21.547622680664062, "global_step": 99358, "epoch": 1197} {"train_loss": -21.911426544189453, "global_step": 99359, "epoch": 1197} {"train_loss": -21.5268497467041, "global_step": 99360, "epoch": 1197} {"train_loss": -21.66385269165039, "global_step": 99361, "epoch": 1197} {"train_loss": -21.622098922729492, "global_step": 99362, "epoch": 1197} {"train_loss": -21.752803802490234, "global_step": 99363, "epoch": 1197} {"train_loss": -21.606319427490234, "global_step": 99364, "epoch": 1197} {"train_loss": -21.691574096679688, "global_step": 99365, "epoch": 1197} {"train_loss": -21.79608726501465, "global_step": 99366, "epoch": 1197} {"train_loss": -21.99188232421875, "global_step": 99367, "epoch": 1197} {"train_loss": -21.45648765563965, "global_step": 99368, "epoch": 1197} {"train_loss": -21.47364616394043, "global_step": 99369, "epoch": 1197} {"train_loss": -21.741256713867188, "global_step": 99370, "epoch": 1197} {"train_loss": -21.987092971801758, "global_step": 99371, "epoch": 1197} {"train_loss": -21.49466323852539, "global_step": 99372, "epoch": 1197} {"train_loss": -21.904834747314453, "global_step": 99373, "epoch": 1197} {"train_loss": -22.21415138244629, "global_step": 99374, "epoch": 1197} {"train_loss": -21.962345123291016, "global_step": 99375, "epoch": 1197} {"train_loss": -21.45029640197754, "global_step": 99376, "epoch": 1197} {"train_loss": -21.77309799194336, "global_step": 99377, "epoch": 1197} {"train_loss": -22.277830123901367, "global_step": 99378, "epoch": 1197} {"train_loss": -21.921466827392578, "global_step": 99379, "epoch": 1197} {"train_loss": -22.032636642456055, "global_step": 99380, "epoch": 1197} {"train_loss": -21.914777755737305, "global_step": 99381, "epoch": 1197} {"train_loss": -22.0936336517334, "global_step": 99382, "epoch": 1197} {"train_loss": -21.67573356628418, "global_step": 99383, "epoch": 1197} {"train_loss": -21.879417419433594, "global_step": 99384, "epoch": 1197} {"train_loss": -21.61579704284668, "global_step": 99385, "epoch": 1197} {"train_loss": -22.247297286987305, "global_step": 99386, "epoch": 1197} {"train_loss": -22.018888473510742, "global_step": 99387, "epoch": 1197} {"train_loss": -21.891468048095703, "global_step": 99388, "epoch": 1197} {"train_loss": -21.799772262573242, "global_step": 99389, "epoch": 1197} {"train_loss": -21.95613670349121, "global_step": 99390, "epoch": 1197} {"train_loss": -21.61626625061035, "global_step": 99391, "epoch": 1197} {"train_loss": -21.55086898803711, "global_step": 99392, "epoch": 1197} {"train_loss": -21.993139266967773, "global_step": 99393, "epoch": 1197} {"train_loss": -21.93036460876465, "global_step": 99394, "epoch": 1197} {"train_loss": -21.995695114135742, "global_step": 99395, "epoch": 1197} {"train_loss": -21.753995895385742, "global_step": 99396, "epoch": 1197} {"train_loss": -21.850690841674805, "global_step": 99397, "epoch": 1197} {"train_loss": -21.924856185913086, "global_step": 99398, "epoch": 1197} {"train_loss": -21.54047203063965, "global_step": 99399, "epoch": 1197} {"train_loss": -21.685693740844727, "global_step": 99400, "epoch": 1197} {"train_loss": -21.724210739135742, "global_step": 99401, "epoch": 1197} {"train_loss": -21.951496124267578, "global_step": 99402, "epoch": 1197} {"train_loss": -21.918235778808594, "global_step": 99403, "epoch": 1197} {"train_loss": -21.83591079711914, "global_step": 99404, "epoch": 1197} {"train_loss": -21.7432804107666, "global_step": 99405, "epoch": 1197} {"train_loss": -21.776243209838867, "global_step": 99406, "epoch": 1197} {"train_loss": -21.964967727661133, "global_step": 99407, "epoch": 1197} {"train_loss": -21.616926193237305, "global_step": 99408, "epoch": 1197} {"train_loss": -22.111967086791992, "global_step": 99409, "epoch": 1197} {"train_loss": -21.759923934936523, "global_step": 99410, "epoch": 1197} {"train_loss": -22.047439575195312, "global_step": 99411, "epoch": 1197} {"train_loss": -22.096080780029297, "global_step": 99412, "epoch": 1197} {"train_loss": -21.808584213256836, "global_step": 99413, "epoch": 1197} {"train_loss": -21.6923885345459, "global_step": 99414, "epoch": 1197} {"train_loss": -21.953079223632812, "global_step": 99415, "epoch": 1197} {"train_loss": -21.68083953857422, "global_step": 99416, "epoch": 1197} {"train_loss": -21.812191009521484, "global_step": 99417, "epoch": 1197} {"train_loss": -21.649826049804688, "global_step": 99418, "epoch": 1197} {"train_loss": -21.90689468383789, "global_step": 99419, "epoch": 1197} {"train_loss": -22.254901885986328, "global_step": 99420, "epoch": 1197} {"train_loss": -21.887643814086914, "global_step": 99421, "epoch": 1197} {"train_loss": -21.8734073638916, "global_step": 99422, "epoch": 1197} {"train_loss": -22.08926773071289, "global_step": 99423, "epoch": 1197} {"train_loss": -22.34309959411621, "global_step": 99424, "epoch": 1197} {"train_loss": -21.95193862915039, "global_step": 99425, "epoch": 1197} {"train_loss": -21.93172264099121, "global_step": 99426, "epoch": 1197} {"train_loss": -21.6774845123291, "global_step": 99427, "epoch": 1197} {"train_loss": -22.064565658569336, "global_step": 99428, "epoch": 1197} {"train_loss": -21.96713638305664, "global_step": 99429, "epoch": 1197} {"train_loss": -21.817153930664062, "global_step": 99430, "epoch": 1197} {"train_loss": -21.964069366455078, "global_step": 99431, "epoch": 1197} {"train_loss": -22.127017974853516, "global_step": 99432, "epoch": 1197} {"train_loss": -21.815084227596422, "global_step": 99433, "epoch": 1197, "val_loss": 5985022.5} {"train_loss": -21.9228458404541, "global_step": 99434, "epoch": 1198} {"train_loss": -21.862064361572266, "global_step": 99435, "epoch": 1198} {"train_loss": -21.8405704498291, "global_step": 99436, "epoch": 1198} {"train_loss": -21.928152084350586, "global_step": 99437, "epoch": 1198} {"train_loss": -21.899707794189453, "global_step": 99438, "epoch": 1198} {"train_loss": -21.644197463989258, "global_step": 99439, "epoch": 1198} {"train_loss": -22.089197158813477, "global_step": 99440, "epoch": 1198} {"train_loss": -21.787710189819336, "global_step": 99441, "epoch": 1198} {"train_loss": -21.746198654174805, "global_step": 99442, "epoch": 1198} {"train_loss": -21.5726375579834, "global_step": 99443, "epoch": 1198} {"train_loss": -21.832412719726562, "global_step": 99444, "epoch": 1198} {"train_loss": -21.78114891052246, "global_step": 99445, "epoch": 1198} {"train_loss": -21.830236434936523, "global_step": 99446, "epoch": 1198} {"train_loss": -21.746700286865234, "global_step": 99447, "epoch": 1198} {"train_loss": -22.09110450744629, "global_step": 99448, "epoch": 1198} {"train_loss": -21.567729949951172, "global_step": 99449, "epoch": 1198} {"train_loss": -21.891443252563477, "global_step": 99450, "epoch": 1198} {"train_loss": -22.074888229370117, "global_step": 99451, "epoch": 1198} {"train_loss": -21.5694637298584, "global_step": 99452, "epoch": 1198} {"train_loss": -21.901777267456055, "global_step": 99453, "epoch": 1198} {"train_loss": -22.037240982055664, "global_step": 99454, "epoch": 1198} {"train_loss": -21.77687644958496, "global_step": 99455, "epoch": 1198} {"train_loss": -21.8099365234375, "global_step": 99456, "epoch": 1198} {"train_loss": -21.901126861572266, "global_step": 99457, "epoch": 1198} {"train_loss": -21.617097854614258, "global_step": 99458, "epoch": 1198} {"train_loss": -21.838319778442383, "global_step": 99459, "epoch": 1198} {"train_loss": -21.82600212097168, "global_step": 99460, "epoch": 1198} {"train_loss": -21.95699119567871, "global_step": 99461, "epoch": 1198} {"train_loss": -21.90304946899414, "global_step": 99462, "epoch": 1198} {"train_loss": -21.522132873535156, "global_step": 99463, "epoch": 1198} {"train_loss": -21.92388916015625, "global_step": 99464, "epoch": 1198} {"train_loss": -22.13948631286621, "global_step": 99465, "epoch": 1198} {"train_loss": -21.674936294555664, "global_step": 99466, "epoch": 1198} {"train_loss": -21.718551635742188, "global_step": 99467, "epoch": 1198} {"train_loss": -21.61655044555664, "global_step": 99468, "epoch": 1198} {"train_loss": -21.85112953186035, "global_step": 99469, "epoch": 1198} {"train_loss": -21.815183639526367, "global_step": 99470, "epoch": 1198} {"train_loss": -21.865652084350586, "global_step": 99471, "epoch": 1198} {"train_loss": -21.781347274780273, "global_step": 99472, "epoch": 1198} {"train_loss": -21.818710327148438, "global_step": 99473, "epoch": 1198} {"train_loss": -21.91098403930664, "global_step": 99474, "epoch": 1198} {"train_loss": -21.920143127441406, "global_step": 99475, "epoch": 1198} {"train_loss": -21.5853328704834, "global_step": 99476, "epoch": 1198} {"train_loss": -21.589162826538086, "global_step": 99477, "epoch": 1198} {"train_loss": -21.75347328186035, "global_step": 99478, "epoch": 1198} {"train_loss": -21.807111740112305, "global_step": 99479, "epoch": 1198} {"train_loss": -21.5196533203125, "global_step": 99480, "epoch": 1198} {"train_loss": -21.703720092773438, "global_step": 99481, "epoch": 1198} {"train_loss": -22.107770919799805, "global_step": 99482, "epoch": 1198} {"train_loss": -22.145160675048828, "global_step": 99483, "epoch": 1198} {"train_loss": -22.12653160095215, "global_step": 99484, "epoch": 1198} {"train_loss": -21.794309616088867, "global_step": 99485, "epoch": 1198} {"train_loss": -22.14151954650879, "global_step": 99486, "epoch": 1198} {"train_loss": -21.54643440246582, "global_step": 99487, "epoch": 1198} {"train_loss": -21.835102081298828, "global_step": 99488, "epoch": 1198} {"train_loss": -22.05087661743164, "global_step": 99489, "epoch": 1198} {"train_loss": -22.11168098449707, "global_step": 99490, "epoch": 1198} {"train_loss": -21.770404815673828, "global_step": 99491, "epoch": 1198} {"train_loss": -21.80746841430664, "global_step": 99492, "epoch": 1198} {"train_loss": -22.0240478515625, "global_step": 99493, "epoch": 1198} {"train_loss": -22.584768295288086, "global_step": 99494, "epoch": 1198} {"train_loss": -22.01296043395996, "global_step": 99495, "epoch": 1198} {"train_loss": -21.57942008972168, "global_step": 99496, "epoch": 1198} {"train_loss": -21.75857925415039, "global_step": 99497, "epoch": 1198} {"train_loss": -22.27020263671875, "global_step": 99498, "epoch": 1198} {"train_loss": -21.55824851989746, "global_step": 99499, "epoch": 1198} {"train_loss": -21.717456817626953, "global_step": 99500, "epoch": 1198} {"train_loss": -22.0116024017334, "global_step": 99501, "epoch": 1198} {"train_loss": -21.928150177001953, "global_step": 99502, "epoch": 1198} {"train_loss": -22.202787399291992, "global_step": 99503, "epoch": 1198} {"train_loss": -22.120361328125, "global_step": 99504, "epoch": 1198} {"train_loss": -21.65623664855957, "global_step": 99505, "epoch": 1198} {"train_loss": -22.0046443939209, "global_step": 99506, "epoch": 1198} {"train_loss": -21.729825973510742, "global_step": 99507, "epoch": 1198} {"train_loss": -21.943559646606445, "global_step": 99508, "epoch": 1198} {"train_loss": -22.111740112304688, "global_step": 99509, "epoch": 1198} {"train_loss": -22.207487106323242, "global_step": 99510, "epoch": 1198} {"train_loss": -21.99667739868164, "global_step": 99511, "epoch": 1198} {"train_loss": -22.067441940307617, "global_step": 99512, "epoch": 1198} {"train_loss": -21.644718170166016, "global_step": 99513, "epoch": 1198} {"train_loss": -21.527109146118164, "global_step": 99514, "epoch": 1198} {"train_loss": -22.263748168945312, "global_step": 99515, "epoch": 1198} {"train_loss": -21.873967182205384, "global_step": 99516, "epoch": 1198, "val_loss": 6133649.0} {"train_loss": -21.494850158691406, "global_step": 99517, "epoch": 1199} {"train_loss": -21.70200538635254, "global_step": 99518, "epoch": 1199} {"train_loss": -21.75498390197754, "global_step": 99519, "epoch": 1199} {"train_loss": -21.573698043823242, "global_step": 99520, "epoch": 1199} {"train_loss": -21.815475463867188, "global_step": 99521, "epoch": 1199} {"train_loss": -21.73785972595215, "global_step": 99522, "epoch": 1199} {"train_loss": -21.698625564575195, "global_step": 99523, "epoch": 1199} {"train_loss": -21.645727157592773, "global_step": 99524, "epoch": 1199} {"train_loss": -21.642057418823242, "global_step": 99525, "epoch": 1199} {"train_loss": -21.866426467895508, "global_step": 99526, "epoch": 1199} {"train_loss": -22.174875259399414, "global_step": 99527, "epoch": 1199} {"train_loss": -21.754791259765625, "global_step": 99528, "epoch": 1199} {"train_loss": -21.74306297302246, "global_step": 99529, "epoch": 1199} {"train_loss": -22.35617446899414, "global_step": 99530, "epoch": 1199} {"train_loss": -21.583335876464844, "global_step": 99531, "epoch": 1199} {"train_loss": -21.541536331176758, "global_step": 99532, "epoch": 1199} {"train_loss": -21.7474308013916, "global_step": 99533, "epoch": 1199} {"train_loss": -21.753625869750977, "global_step": 99534, "epoch": 1199} {"train_loss": -22.061811447143555, "global_step": 99535, "epoch": 1199} {"train_loss": -21.716766357421875, "global_step": 99536, "epoch": 1199} {"train_loss": -21.798662185668945, "global_step": 99537, "epoch": 1199} {"train_loss": -22.1833553314209, "global_step": 99538, "epoch": 1199} {"train_loss": -22.036916732788086, "global_step": 99539, "epoch": 1199} {"train_loss": -21.76409149169922, "global_step": 99540, "epoch": 1199} {"train_loss": -21.942655563354492, "global_step": 99541, "epoch": 1199} {"train_loss": -22.106855392456055, "global_step": 99542, "epoch": 1199} {"train_loss": -21.91861915588379, "global_step": 99543, "epoch": 1199} {"train_loss": -21.815526962280273, "global_step": 99544, "epoch": 1199} {"train_loss": -22.18710708618164, "global_step": 99545, "epoch": 1199} {"train_loss": -22.11433219909668, "global_step": 99546, "epoch": 1199} {"train_loss": -21.81020164489746, "global_step": 99547, "epoch": 1199} {"train_loss": -22.057903289794922, "global_step": 99548, "epoch": 1199} {"train_loss": -21.58596420288086, "global_step": 99549, "epoch": 1199} {"train_loss": -22.08269691467285, "global_step": 99550, "epoch": 1199} {"train_loss": -21.721710205078125, "global_step": 99551, "epoch": 1199} {"train_loss": -21.45863914489746, "global_step": 99552, "epoch": 1199} {"train_loss": -22.189489364624023, "global_step": 99553, "epoch": 1199} {"train_loss": -21.98245620727539, "global_step": 99554, "epoch": 1199} {"train_loss": -21.848432540893555, "global_step": 99555, "epoch": 1199} {"train_loss": -21.71782875061035, "global_step": 99556, "epoch": 1199} {"train_loss": -21.940916061401367, "global_step": 99557, "epoch": 1199} {"train_loss": -21.643701553344727, "global_step": 99558, "epoch": 1199} {"train_loss": -21.63947105407715, "global_step": 99559, "epoch": 1199} {"train_loss": -21.809268951416016, "global_step": 99560, "epoch": 1199} {"train_loss": -21.545650482177734, "global_step": 99561, "epoch": 1199} {"train_loss": -21.695768356323242, "global_step": 99562, "epoch": 1199} {"train_loss": -21.80344009399414, "global_step": 99563, "epoch": 1199} {"train_loss": -22.000654220581055, "global_step": 99564, "epoch": 1199} {"train_loss": -21.7523250579834, "global_step": 99565, "epoch": 1199} {"train_loss": -21.732328414916992, "global_step": 99566, "epoch": 1199} {"train_loss": -21.885013580322266, "global_step": 99567, "epoch": 1199} {"train_loss": -21.77028465270996, "global_step": 99568, "epoch": 1199} {"train_loss": -21.664609909057617, "global_step": 99569, "epoch": 1199} {"train_loss": -22.06439781188965, "global_step": 99570, "epoch": 1199} {"train_loss": -22.03765106201172, "global_step": 99571, "epoch": 1199} {"train_loss": -21.835561752319336, "global_step": 99572, "epoch": 1199} {"train_loss": -22.099647521972656, "global_step": 99573, "epoch": 1199} {"train_loss": -21.73833656311035, "global_step": 99574, "epoch": 1199} {"train_loss": -22.144994735717773, "global_step": 99575, "epoch": 1199} {"train_loss": -21.553512573242188, "global_step": 99576, "epoch": 1199} {"train_loss": -21.972219467163086, "global_step": 99577, "epoch": 1199} {"train_loss": -21.86544418334961, "global_step": 99578, "epoch": 1199} {"train_loss": -22.03969383239746, "global_step": 99579, "epoch": 1199} {"train_loss": -21.782934188842773, "global_step": 99580, "epoch": 1199} {"train_loss": -21.89216423034668, "global_step": 99581, "epoch": 1199} {"train_loss": -22.04659080505371, "global_step": 99582, "epoch": 1199} {"train_loss": -22.181116104125977, "global_step": 99583, "epoch": 1199} {"train_loss": -21.9488468170166, "global_step": 99584, "epoch": 1199} {"train_loss": -22.106708526611328, "global_step": 99585, "epoch": 1199} {"train_loss": -22.28684425354004, "global_step": 99586, "epoch": 1199} {"train_loss": -22.12653923034668, "global_step": 99587, "epoch": 1199} {"train_loss": -22.016183853149414, "global_step": 99588, "epoch": 1199} {"train_loss": -21.850133895874023, "global_step": 99589, "epoch": 1199} {"train_loss": -22.15492820739746, "global_step": 99590, "epoch": 1199} {"train_loss": -21.8973388671875, "global_step": 99591, "epoch": 1199} {"train_loss": -22.399532318115234, "global_step": 99592, "epoch": 1199} {"train_loss": -22.110260009765625, "global_step": 99593, "epoch": 1199} {"train_loss": -22.135116577148438, "global_step": 99594, "epoch": 1199} {"train_loss": -21.667442321777344, "global_step": 99595, "epoch": 1199} {"train_loss": -22.120153427124023, "global_step": 99596, "epoch": 1199} {"train_loss": -21.653406143188477, "global_step": 99597, "epoch": 1199} {"train_loss": -22.060800552368164, "global_step": 99598, "epoch": 1199} {"train_loss": -21.881945989218103, "global_step": 99599, "epoch": 1199, "val_loss": 6097763.5} {"train_loss": -21.304763793945312, "global_step": 99600, "epoch": 1200} {"train_loss": -21.729665756225586, "global_step": 99601, "epoch": 1200} {"train_loss": -21.55665397644043, "global_step": 99602, "epoch": 1200} {"train_loss": -21.337162017822266, "global_step": 99603, "epoch": 1200} {"train_loss": -21.664932250976562, "global_step": 99604, "epoch": 1200} {"train_loss": -21.3756160736084, "global_step": 99605, "epoch": 1200} {"train_loss": -21.580928802490234, "global_step": 99606, "epoch": 1200} {"train_loss": -21.3608455657959, "global_step": 99607, "epoch": 1200} {"train_loss": -21.840381622314453, "global_step": 99608, "epoch": 1200} {"train_loss": -21.591001510620117, "global_step": 99609, "epoch": 1200} {"train_loss": -21.474519729614258, "global_step": 99610, "epoch": 1200} {"train_loss": -22.10224151611328, "global_step": 99611, "epoch": 1200} {"train_loss": -21.905059814453125, "global_step": 99612, "epoch": 1200} {"train_loss": -21.68707847595215, "global_step": 99613, "epoch": 1200} {"train_loss": -21.601821899414062, "global_step": 99614, "epoch": 1200} {"train_loss": -21.693143844604492, "global_step": 99615, "epoch": 1200} {"train_loss": -21.597614288330078, "global_step": 99616, "epoch": 1200} {"train_loss": -21.862058639526367, "global_step": 99617, "epoch": 1200} {"train_loss": -22.030942916870117, "global_step": 99618, "epoch": 1200} {"train_loss": -22.019399642944336, "global_step": 99619, "epoch": 1200} {"train_loss": -21.967056274414062, "global_step": 99620, "epoch": 1200} {"train_loss": -21.84383201599121, "global_step": 99621, "epoch": 1200} {"train_loss": -21.851165771484375, "global_step": 99622, "epoch": 1200} {"train_loss": -21.80232048034668, "global_step": 99623, "epoch": 1200} {"train_loss": -21.96658706665039, "global_step": 99624, "epoch": 1200} {"train_loss": -21.90567970275879, "global_step": 99625, "epoch": 1200} {"train_loss": -21.770652770996094, "global_step": 99626, "epoch": 1200} {"train_loss": -21.86150550842285, "global_step": 99627, "epoch": 1200} {"train_loss": -21.801712036132812, "global_step": 99628, "epoch": 1200} {"train_loss": -21.9559383392334, "global_step": 99629, "epoch": 1200} {"train_loss": -21.908447265625, "global_step": 99630, "epoch": 1200} {"train_loss": -21.571252822875977, "global_step": 99631, "epoch": 1200} {"train_loss": -22.19591522216797, "global_step": 99632, "epoch": 1200} {"train_loss": -22.046239852905273, "global_step": 99633, "epoch": 1200} {"train_loss": -21.672666549682617, "global_step": 99634, "epoch": 1200} {"train_loss": -21.915958404541016, "global_step": 99635, "epoch": 1200} {"train_loss": -22.083005905151367, "global_step": 99636, "epoch": 1200} {"train_loss": -21.87173843383789, "global_step": 99637, "epoch": 1200} {"train_loss": -22.037010192871094, "global_step": 99638, "epoch": 1200} {"train_loss": -22.03347396850586, "global_step": 99639, "epoch": 1200} {"train_loss": -21.852354049682617, "global_step": 99640, "epoch": 1200} {"train_loss": -22.110517501831055, "global_step": 99641, "epoch": 1200} {"train_loss": -22.38484001159668, "global_step": 99642, "epoch": 1200} {"train_loss": -22.01576042175293, "global_step": 99643, "epoch": 1200} {"train_loss": -21.729604721069336, "global_step": 99644, "epoch": 1200} {"train_loss": -21.804088592529297, "global_step": 99645, "epoch": 1200} {"train_loss": -21.82929039001465, "global_step": 99646, "epoch": 1200} {"train_loss": -22.164859771728516, "global_step": 99647, "epoch": 1200} {"train_loss": -22.012121200561523, "global_step": 99648, "epoch": 1200} {"train_loss": -21.986526489257812, "global_step": 99649, "epoch": 1200} {"train_loss": -21.953014373779297, "global_step": 99650, "epoch": 1200} {"train_loss": -21.99072265625, "global_step": 99651, "epoch": 1200} {"train_loss": -22.341590881347656, "global_step": 99652, "epoch": 1200} {"train_loss": -22.145883560180664, "global_step": 99653, "epoch": 1200} {"train_loss": -22.07193946838379, "global_step": 99654, "epoch": 1200} {"train_loss": -22.010047912597656, "global_step": 99655, "epoch": 1200} {"train_loss": -21.82539939880371, "global_step": 99656, "epoch": 1200} {"train_loss": -22.110498428344727, "global_step": 99657, "epoch": 1200} {"train_loss": -22.2518310546875, "global_step": 99658, "epoch": 1200} {"train_loss": -22.227670669555664, "global_step": 99659, "epoch": 1200} {"train_loss": -21.999374389648438, "global_step": 99660, "epoch": 1200} {"train_loss": -21.847766876220703, "global_step": 99661, "epoch": 1200} {"train_loss": -22.01764488220215, "global_step": 99662, "epoch": 1200} {"train_loss": -22.249788284301758, "global_step": 99663, "epoch": 1200} {"train_loss": -22.022275924682617, "global_step": 99664, "epoch": 1200} {"train_loss": -22.019039154052734, "global_step": 99665, "epoch": 1200} {"train_loss": -21.800827026367188, "global_step": 99666, "epoch": 1200} {"train_loss": -22.07213020324707, "global_step": 99667, "epoch": 1200} {"train_loss": -22.129491806030273, "global_step": 99668, "epoch": 1200} {"train_loss": -21.775192260742188, "global_step": 99669, "epoch": 1200} {"train_loss": -22.021217346191406, "global_step": 99670, "epoch": 1200} {"train_loss": -22.132389068603516, "global_step": 99671, "epoch": 1200} {"train_loss": -21.770971298217773, "global_step": 99672, "epoch": 1200} {"train_loss": -21.530967712402344, "global_step": 99673, "epoch": 1200} {"train_loss": -22.206708908081055, "global_step": 99674, "epoch": 1200} {"train_loss": -21.834623336791992, "global_step": 99675, "epoch": 1200} {"train_loss": -22.134353637695312, "global_step": 99676, "epoch": 1200} {"train_loss": -21.6882381439209, "global_step": 99677, "epoch": 1200} {"train_loss": -21.927658081054688, "global_step": 99678, "epoch": 1200} {"train_loss": -21.97549819946289, "global_step": 99679, "epoch": 1200} {"train_loss": -21.993959426879883, "global_step": 99680, "epoch": 1200} {"train_loss": -22.096155166625977, "global_step": 99681, "epoch": 1200} {"train_loss": -21.909483806196466, "global_step": 99682, "epoch": 1200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6071896.0} {"train_loss": -19.294189453125, "global_step": 99683, "epoch": 1201} {"train_loss": -20.87957000732422, "global_step": 99684, "epoch": 1201} {"train_loss": -20.871999740600586, "global_step": 99685, "epoch": 1201} {"train_loss": -20.748634338378906, "global_step": 99686, "epoch": 1201} {"train_loss": -20.85098648071289, "global_step": 99687, "epoch": 1201} {"train_loss": -20.920888900756836, "global_step": 99688, "epoch": 1201} {"train_loss": -21.212993621826172, "global_step": 99689, "epoch": 1201} {"train_loss": -21.212526321411133, "global_step": 99690, "epoch": 1201} {"train_loss": -21.115814208984375, "global_step": 99691, "epoch": 1201} {"train_loss": -20.872718811035156, "global_step": 99692, "epoch": 1201} {"train_loss": -21.250349044799805, "global_step": 99693, "epoch": 1201} {"train_loss": -20.9553165435791, "global_step": 99694, "epoch": 1201} {"train_loss": -21.03778648376465, "global_step": 99695, "epoch": 1201} {"train_loss": -21.255897521972656, "global_step": 99696, "epoch": 1201} {"train_loss": -20.99489974975586, "global_step": 99697, "epoch": 1201} {"train_loss": -20.99759292602539, "global_step": 99698, "epoch": 1201} {"train_loss": -21.47083854675293, "global_step": 99699, "epoch": 1201} {"train_loss": -21.49488639831543, "global_step": 99700, "epoch": 1201} {"train_loss": -21.193729400634766, "global_step": 99701, "epoch": 1201} {"train_loss": -21.243295669555664, "global_step": 99702, "epoch": 1201} {"train_loss": -21.747922897338867, "global_step": 99703, "epoch": 1201} {"train_loss": -21.3692684173584, "global_step": 99704, "epoch": 1201} {"train_loss": -21.812204360961914, "global_step": 99705, "epoch": 1201} {"train_loss": -21.67609214782715, "global_step": 99706, "epoch": 1201} {"train_loss": -21.44319725036621, "global_step": 99707, "epoch": 1201} {"train_loss": -21.421260833740234, "global_step": 99708, "epoch": 1201} {"train_loss": -21.4532527923584, "global_step": 99709, "epoch": 1201} {"train_loss": -21.531770706176758, "global_step": 99710, "epoch": 1201} {"train_loss": -21.2995548248291, "global_step": 99711, "epoch": 1201} {"train_loss": -21.77471923828125, "global_step": 99712, "epoch": 1201} {"train_loss": -21.879047393798828, "global_step": 99713, "epoch": 1201} {"train_loss": -21.909021377563477, "global_step": 99714, "epoch": 1201} {"train_loss": -21.64468765258789, "global_step": 99715, "epoch": 1201} {"train_loss": -21.677043914794922, "global_step": 99716, "epoch": 1201} {"train_loss": -21.734237670898438, "global_step": 99717, "epoch": 1201} {"train_loss": -21.712467193603516, "global_step": 99718, "epoch": 1201} {"train_loss": -21.46809196472168, "global_step": 99719, "epoch": 1201} {"train_loss": -22.220062255859375, "global_step": 99720, "epoch": 1201} {"train_loss": -22.012910842895508, "global_step": 99721, "epoch": 1201} {"train_loss": -21.750242233276367, "global_step": 99722, "epoch": 1201} {"train_loss": -21.71748161315918, "global_step": 99723, "epoch": 1201} {"train_loss": -21.892393112182617, "global_step": 99724, "epoch": 1201} {"train_loss": -21.919754028320312, "global_step": 99725, "epoch": 1201} {"train_loss": -21.91225242614746, "global_step": 99726, "epoch": 1201} {"train_loss": -22.119495391845703, "global_step": 99727, "epoch": 1201} {"train_loss": -21.90371322631836, "global_step": 99728, "epoch": 1201} {"train_loss": -21.648242950439453, "global_step": 99729, "epoch": 1201} {"train_loss": -22.050521850585938, "global_step": 99730, "epoch": 1201} {"train_loss": -21.404855728149414, "global_step": 99731, "epoch": 1201} {"train_loss": -21.640666961669922, "global_step": 99732, "epoch": 1201} {"train_loss": -22.338821411132812, "global_step": 99733, "epoch": 1201} {"train_loss": -21.91988182067871, "global_step": 99734, "epoch": 1201} {"train_loss": -22.48516273498535, "global_step": 99735, "epoch": 1201} {"train_loss": -22.011865615844727, "global_step": 99736, "epoch": 1201} {"train_loss": -21.826074600219727, "global_step": 99737, "epoch": 1201} {"train_loss": -21.6535587310791, "global_step": 99738, "epoch": 1201} {"train_loss": -22.017393112182617, "global_step": 99739, "epoch": 1201} {"train_loss": -21.909942626953125, "global_step": 99740, "epoch": 1201} {"train_loss": -22.260324478149414, "global_step": 99741, "epoch": 1201} {"train_loss": -21.67827796936035, "global_step": 99742, "epoch": 1201} {"train_loss": -21.326292037963867, "global_step": 99743, "epoch": 1201} {"train_loss": -21.6912841796875, "global_step": 99744, "epoch": 1201} {"train_loss": -21.523706436157227, "global_step": 99745, "epoch": 1201} {"train_loss": -21.76546287536621, "global_step": 99746, "epoch": 1201} {"train_loss": -22.12029266357422, "global_step": 99747, "epoch": 1201} {"train_loss": -22.112958908081055, "global_step": 99748, "epoch": 1201} {"train_loss": -21.788724899291992, "global_step": 99749, "epoch": 1201} {"train_loss": -21.878942489624023, "global_step": 99750, "epoch": 1201} {"train_loss": -22.021778106689453, "global_step": 99751, "epoch": 1201} {"train_loss": -21.671499252319336, "global_step": 99752, "epoch": 1201} {"train_loss": -21.438339233398438, "global_step": 99753, "epoch": 1201} {"train_loss": -21.733415603637695, "global_step": 99754, "epoch": 1201} {"train_loss": -22.16587257385254, "global_step": 99755, "epoch": 1201} {"train_loss": -21.997501373291016, "global_step": 99756, "epoch": 1201} {"train_loss": -21.82615089416504, "global_step": 99757, "epoch": 1201} {"train_loss": -21.687314987182617, "global_step": 99758, "epoch": 1201} {"train_loss": -21.73230743408203, "global_step": 99759, "epoch": 1201} {"train_loss": -21.54157066345215, "global_step": 99760, "epoch": 1201} {"train_loss": -21.924182891845703, "global_step": 99761, "epoch": 1201} {"train_loss": -21.95254135131836, "global_step": 99762, "epoch": 1201} {"train_loss": -22.306560516357422, "global_step": 99763, "epoch": 1201} {"train_loss": -22.03150749206543, "global_step": 99764, "epoch": 1201} {"train_loss": -21.623698705650238, "global_step": 99765, "epoch": 1201, "val_loss": 6423200.0} {"train_loss": -21.017210006713867, "global_step": 99766, "epoch": 1202} {"train_loss": -21.062402725219727, "global_step": 99767, "epoch": 1202} {"train_loss": -21.361740112304688, "global_step": 99768, "epoch": 1202} {"train_loss": -21.2056827545166, "global_step": 99769, "epoch": 1202} {"train_loss": -20.70482635498047, "global_step": 99770, "epoch": 1202} {"train_loss": -20.85395050048828, "global_step": 99771, "epoch": 1202} {"train_loss": -21.697996139526367, "global_step": 99772, "epoch": 1202} {"train_loss": -21.15195655822754, "global_step": 99773, "epoch": 1202} {"train_loss": -21.189983367919922, "global_step": 99774, "epoch": 1202} {"train_loss": -21.341148376464844, "global_step": 99775, "epoch": 1202} {"train_loss": -21.454448699951172, "global_step": 99776, "epoch": 1202} {"train_loss": -21.349767684936523, "global_step": 99777, "epoch": 1202} {"train_loss": -21.20216178894043, "global_step": 99778, "epoch": 1202} {"train_loss": -21.64251708984375, "global_step": 99779, "epoch": 1202} {"train_loss": -21.274091720581055, "global_step": 99780, "epoch": 1202} {"train_loss": -21.50077247619629, "global_step": 99781, "epoch": 1202} {"train_loss": -21.587844848632812, "global_step": 99782, "epoch": 1202} {"train_loss": -21.039121627807617, "global_step": 99783, "epoch": 1202} {"train_loss": -21.732439041137695, "global_step": 99784, "epoch": 1202} {"train_loss": -21.79157829284668, "global_step": 99785, "epoch": 1202} {"train_loss": -21.236249923706055, "global_step": 99786, "epoch": 1202} {"train_loss": -21.738330841064453, "global_step": 99787, "epoch": 1202} {"train_loss": -21.622129440307617, "global_step": 99788, "epoch": 1202} {"train_loss": -21.586036682128906, "global_step": 99789, "epoch": 1202} {"train_loss": -21.78914451599121, "global_step": 99790, "epoch": 1202} {"train_loss": -22.017343521118164, "global_step": 99791, "epoch": 1202} {"train_loss": -21.764652252197266, "global_step": 99792, "epoch": 1202} {"train_loss": -21.341365814208984, "global_step": 99793, "epoch": 1202} {"train_loss": -21.963703155517578, "global_step": 99794, "epoch": 1202} {"train_loss": -21.826297760009766, "global_step": 99795, "epoch": 1202} {"train_loss": -21.680410385131836, "global_step": 99796, "epoch": 1202} {"train_loss": -21.690244674682617, "global_step": 99797, "epoch": 1202} {"train_loss": -21.824440002441406, "global_step": 99798, "epoch": 1202} {"train_loss": -21.911191940307617, "global_step": 99799, "epoch": 1202} {"train_loss": -21.983463287353516, "global_step": 99800, "epoch": 1202} {"train_loss": -21.770044326782227, "global_step": 99801, "epoch": 1202} {"train_loss": -21.886877059936523, "global_step": 99802, "epoch": 1202} {"train_loss": -21.837976455688477, "global_step": 99803, "epoch": 1202} {"train_loss": -21.77880096435547, "global_step": 99804, "epoch": 1202} {"train_loss": -21.686492919921875, "global_step": 99805, "epoch": 1202} {"train_loss": -22.084768295288086, "global_step": 99806, "epoch": 1202} {"train_loss": -21.649703979492188, "global_step": 99807, "epoch": 1202} {"train_loss": -21.966970443725586, "global_step": 99808, "epoch": 1202} {"train_loss": -21.9942569732666, "global_step": 99809, "epoch": 1202} {"train_loss": -21.86578369140625, "global_step": 99810, "epoch": 1202} {"train_loss": -22.033960342407227, "global_step": 99811, "epoch": 1202} {"train_loss": -21.93890953063965, "global_step": 99812, "epoch": 1202} {"train_loss": -22.00992774963379, "global_step": 99813, "epoch": 1202} {"train_loss": -22.00369644165039, "global_step": 99814, "epoch": 1202} {"train_loss": -21.52341651916504, "global_step": 99815, "epoch": 1202} {"train_loss": -22.051809310913086, "global_step": 99816, "epoch": 1202} {"train_loss": -21.80422019958496, "global_step": 99817, "epoch": 1202} {"train_loss": -21.705001831054688, "global_step": 99818, "epoch": 1202} {"train_loss": -21.80976676940918, "global_step": 99819, "epoch": 1202} {"train_loss": -21.71503257751465, "global_step": 99820, "epoch": 1202} {"train_loss": -22.323795318603516, "global_step": 99821, "epoch": 1202} {"train_loss": -21.727415084838867, "global_step": 99822, "epoch": 1202} {"train_loss": -21.71744155883789, "global_step": 99823, "epoch": 1202} {"train_loss": -22.048006057739258, "global_step": 99824, "epoch": 1202} {"train_loss": -21.71965980529785, "global_step": 99825, "epoch": 1202} {"train_loss": -21.858844757080078, "global_step": 99826, "epoch": 1202} {"train_loss": -21.85275650024414, "global_step": 99827, "epoch": 1202} {"train_loss": -21.778263092041016, "global_step": 99828, "epoch": 1202} {"train_loss": -22.067129135131836, "global_step": 99829, "epoch": 1202} {"train_loss": -22.260475158691406, "global_step": 99830, "epoch": 1202} {"train_loss": -22.030948638916016, "global_step": 99831, "epoch": 1202} {"train_loss": -22.19571304321289, "global_step": 99832, "epoch": 1202} {"train_loss": -21.840322494506836, "global_step": 99833, "epoch": 1202} {"train_loss": -22.074705123901367, "global_step": 99834, "epoch": 1202} {"train_loss": -22.17817497253418, "global_step": 99835, "epoch": 1202} {"train_loss": -21.929807662963867, "global_step": 99836, "epoch": 1202} {"train_loss": -22.05483055114746, "global_step": 99837, "epoch": 1202} {"train_loss": -21.889572143554688, "global_step": 99838, "epoch": 1202} {"train_loss": -21.820451736450195, "global_step": 99839, "epoch": 1202} {"train_loss": -22.126827239990234, "global_step": 99840, "epoch": 1202} {"train_loss": -21.900476455688477, "global_step": 99841, "epoch": 1202} {"train_loss": -22.006507873535156, "global_step": 99842, "epoch": 1202} {"train_loss": -21.95633316040039, "global_step": 99843, "epoch": 1202} {"train_loss": -22.20074462890625, "global_step": 99844, "epoch": 1202} {"train_loss": -21.962289810180664, "global_step": 99845, "epoch": 1202} {"train_loss": -21.832590103149414, "global_step": 99846, "epoch": 1202} {"train_loss": -21.714801788330078, "global_step": 99847, "epoch": 1202} {"train_loss": -21.729391465704126, "global_step": 99848, "epoch": 1202, "val_loss": 6189114.5} {"train_loss": -21.56477165222168, "global_step": 99849, "epoch": 1203} {"train_loss": -21.32980728149414, "global_step": 99850, "epoch": 1203} {"train_loss": -21.833654403686523, "global_step": 99851, "epoch": 1203} {"train_loss": -21.713848114013672, "global_step": 99852, "epoch": 1203} {"train_loss": -21.811716079711914, "global_step": 99853, "epoch": 1203} {"train_loss": -21.67952537536621, "global_step": 99854, "epoch": 1203} {"train_loss": -21.68124771118164, "global_step": 99855, "epoch": 1203} {"train_loss": -21.854642868041992, "global_step": 99856, "epoch": 1203} {"train_loss": -22.010929107666016, "global_step": 99857, "epoch": 1203} {"train_loss": -21.756620407104492, "global_step": 99858, "epoch": 1203} {"train_loss": -21.59783363342285, "global_step": 99859, "epoch": 1203} {"train_loss": -21.84148406982422, "global_step": 99860, "epoch": 1203} {"train_loss": -21.808917999267578, "global_step": 99861, "epoch": 1203} {"train_loss": -22.149171829223633, "global_step": 99862, "epoch": 1203} {"train_loss": -22.19205093383789, "global_step": 99863, "epoch": 1203} {"train_loss": -22.28766441345215, "global_step": 99864, "epoch": 1203} {"train_loss": -21.983152389526367, "global_step": 99865, "epoch": 1203} {"train_loss": -22.469669342041016, "global_step": 99866, "epoch": 1203} {"train_loss": -21.9134464263916, "global_step": 99867, "epoch": 1203} {"train_loss": -21.885433197021484, "global_step": 99868, "epoch": 1203} {"train_loss": -21.91724967956543, "global_step": 99869, "epoch": 1203} {"train_loss": -22.362314224243164, "global_step": 99870, "epoch": 1203} {"train_loss": -21.9553279876709, "global_step": 99871, "epoch": 1203} {"train_loss": -21.730125427246094, "global_step": 99872, "epoch": 1203} {"train_loss": -22.113147735595703, "global_step": 99873, "epoch": 1203} {"train_loss": -22.23869514465332, "global_step": 99874, "epoch": 1203} {"train_loss": -21.808929443359375, "global_step": 99875, "epoch": 1203} {"train_loss": -22.137136459350586, "global_step": 99876, "epoch": 1203} {"train_loss": -21.820289611816406, "global_step": 99877, "epoch": 1203} {"train_loss": -21.729787826538086, "global_step": 99878, "epoch": 1203} {"train_loss": -22.24500846862793, "global_step": 99879, "epoch": 1203} {"train_loss": -22.09320068359375, "global_step": 99880, "epoch": 1203} {"train_loss": -22.014562606811523, "global_step": 99881, "epoch": 1203} {"train_loss": -21.78969383239746, "global_step": 99882, "epoch": 1203} {"train_loss": -22.361074447631836, "global_step": 99883, "epoch": 1203} {"train_loss": -21.881237030029297, "global_step": 99884, "epoch": 1203} {"train_loss": -21.811185836791992, "global_step": 99885, "epoch": 1203} {"train_loss": -22.021682739257812, "global_step": 99886, "epoch": 1203} {"train_loss": -21.952829360961914, "global_step": 99887, "epoch": 1203} {"train_loss": -22.161529541015625, "global_step": 99888, "epoch": 1203} {"train_loss": -22.20082664489746, "global_step": 99889, "epoch": 1203} {"train_loss": -21.967880249023438, "global_step": 99890, "epoch": 1203} {"train_loss": -22.08973503112793, "global_step": 99891, "epoch": 1203} {"train_loss": -21.689857482910156, "global_step": 99892, "epoch": 1203} {"train_loss": -21.712949752807617, "global_step": 99893, "epoch": 1203} {"train_loss": -22.050939559936523, "global_step": 99894, "epoch": 1203} {"train_loss": -21.89747428894043, "global_step": 99895, "epoch": 1203} {"train_loss": -21.984262466430664, "global_step": 99896, "epoch": 1203} {"train_loss": -22.276226043701172, "global_step": 99897, "epoch": 1203} {"train_loss": -21.853551864624023, "global_step": 99898, "epoch": 1203} {"train_loss": -22.28760528564453, "global_step": 99899, "epoch": 1203} {"train_loss": -21.969440460205078, "global_step": 99900, "epoch": 1203} {"train_loss": -22.114267349243164, "global_step": 99901, "epoch": 1203} {"train_loss": -21.772808074951172, "global_step": 99902, "epoch": 1203} {"train_loss": -21.802793502807617, "global_step": 99903, "epoch": 1203} {"train_loss": -22.22405242919922, "global_step": 99904, "epoch": 1203} {"train_loss": -22.061500549316406, "global_step": 99905, "epoch": 1203} {"train_loss": -22.099346160888672, "global_step": 99906, "epoch": 1203} {"train_loss": -22.020864486694336, "global_step": 99907, "epoch": 1203} {"train_loss": -21.659746170043945, "global_step": 99908, "epoch": 1203} {"train_loss": -21.99051856994629, "global_step": 99909, "epoch": 1203} {"train_loss": -21.832735061645508, "global_step": 99910, "epoch": 1203} {"train_loss": -21.778139114379883, "global_step": 99911, "epoch": 1203} {"train_loss": -21.760282516479492, "global_step": 99912, "epoch": 1203} {"train_loss": -21.818639755249023, "global_step": 99913, "epoch": 1203} {"train_loss": -21.964710235595703, "global_step": 99914, "epoch": 1203} {"train_loss": -21.899242401123047, "global_step": 99915, "epoch": 1203} {"train_loss": -22.259057998657227, "global_step": 99916, "epoch": 1203} {"train_loss": -21.876386642456055, "global_step": 99917, "epoch": 1203} {"train_loss": -22.05415153503418, "global_step": 99918, "epoch": 1203} {"train_loss": -22.482486724853516, "global_step": 99919, "epoch": 1203} {"train_loss": -22.12833595275879, "global_step": 99920, "epoch": 1203} {"train_loss": -21.887380599975586, "global_step": 99921, "epoch": 1203} {"train_loss": -22.33515739440918, "global_step": 99922, "epoch": 1203} {"train_loss": -22.04640007019043, "global_step": 99923, "epoch": 1203} {"train_loss": -21.687299728393555, "global_step": 99924, "epoch": 1203} {"train_loss": -22.126073837280273, "global_step": 99925, "epoch": 1203} {"train_loss": -22.197067260742188, "global_step": 99926, "epoch": 1203} {"train_loss": -21.761301040649414, "global_step": 99927, "epoch": 1203} {"train_loss": -21.67008399963379, "global_step": 99928, "epoch": 1203} {"train_loss": -21.90922737121582, "global_step": 99929, "epoch": 1203} {"train_loss": -22.454700469970703, "global_step": 99930, "epoch": 1203} {"train_loss": -21.955117306077337, "global_step": 99931, "epoch": 1203, "val_loss": 6099597.0} {"train_loss": -22.17173957824707, "global_step": 99932, "epoch": 1204} {"train_loss": -21.624114990234375, "global_step": 99933, "epoch": 1204} {"train_loss": -21.838912963867188, "global_step": 99934, "epoch": 1204} {"train_loss": -21.8535099029541, "global_step": 99935, "epoch": 1204} {"train_loss": -21.525230407714844, "global_step": 99936, "epoch": 1204} {"train_loss": -21.940309524536133, "global_step": 99937, "epoch": 1204} {"train_loss": -21.95207405090332, "global_step": 99938, "epoch": 1204} {"train_loss": -22.00227928161621, "global_step": 99939, "epoch": 1204} {"train_loss": -22.317398071289062, "global_step": 99940, "epoch": 1204} {"train_loss": -22.128332138061523, "global_step": 99941, "epoch": 1204} {"train_loss": -21.776947021484375, "global_step": 99942, "epoch": 1204} {"train_loss": -22.11615562438965, "global_step": 99943, "epoch": 1204} {"train_loss": -22.075504302978516, "global_step": 99944, "epoch": 1204} {"train_loss": -21.7513370513916, "global_step": 99945, "epoch": 1204} {"train_loss": -22.0831241607666, "global_step": 99946, "epoch": 1204} {"train_loss": -21.777944564819336, "global_step": 99947, "epoch": 1204} {"train_loss": -22.028440475463867, "global_step": 99948, "epoch": 1204} {"train_loss": -22.139724731445312, "global_step": 99949, "epoch": 1204} {"train_loss": -22.175697326660156, "global_step": 99950, "epoch": 1204} {"train_loss": -21.935068130493164, "global_step": 99951, "epoch": 1204} {"train_loss": -22.1547908782959, "global_step": 99952, "epoch": 1204} {"train_loss": -22.21657371520996, "global_step": 99953, "epoch": 1204} {"train_loss": -22.081308364868164, "global_step": 99954, "epoch": 1204} {"train_loss": -21.912275314331055, "global_step": 99955, "epoch": 1204} {"train_loss": -22.188133239746094, "global_step": 99956, "epoch": 1204} {"train_loss": -22.17632484436035, "global_step": 99957, "epoch": 1204} {"train_loss": -21.582971572875977, "global_step": 99958, "epoch": 1204} {"train_loss": -22.034536361694336, "global_step": 99959, "epoch": 1204} {"train_loss": -21.608800888061523, "global_step": 99960, "epoch": 1204} {"train_loss": -21.750137329101562, "global_step": 99961, "epoch": 1204} {"train_loss": -22.106807708740234, "global_step": 99962, "epoch": 1204} {"train_loss": -21.745325088500977, "global_step": 99963, "epoch": 1204} {"train_loss": -21.800334930419922, "global_step": 99964, "epoch": 1204} {"train_loss": -21.861637115478516, "global_step": 99965, "epoch": 1204} {"train_loss": -21.67840576171875, "global_step": 99966, "epoch": 1204} {"train_loss": -21.577314376831055, "global_step": 99967, "epoch": 1204} {"train_loss": -21.621320724487305, "global_step": 99968, "epoch": 1204} {"train_loss": -21.583850860595703, "global_step": 99969, "epoch": 1204} {"train_loss": -21.71339988708496, "global_step": 99970, "epoch": 1204} {"train_loss": -21.763439178466797, "global_step": 99971, "epoch": 1204} {"train_loss": -21.657155990600586, "global_step": 99972, "epoch": 1204} {"train_loss": -21.984052658081055, "global_step": 99973, "epoch": 1204} {"train_loss": -21.23687171936035, "global_step": 99974, "epoch": 1204} {"train_loss": -22.118703842163086, "global_step": 99975, "epoch": 1204} {"train_loss": -22.078720092773438, "global_step": 99976, "epoch": 1204} {"train_loss": -21.90425682067871, "global_step": 99977, "epoch": 1204} {"train_loss": -22.08864402770996, "global_step": 99978, "epoch": 1204} {"train_loss": -21.687780380249023, "global_step": 99979, "epoch": 1204} {"train_loss": -21.920495986938477, "global_step": 99980, "epoch": 1204} {"train_loss": -22.09322166442871, "global_step": 99981, "epoch": 1204} {"train_loss": -21.850013732910156, "global_step": 99982, "epoch": 1204} {"train_loss": -21.803380966186523, "global_step": 99983, "epoch": 1204} {"train_loss": -22.011316299438477, "global_step": 99984, "epoch": 1204} {"train_loss": -21.87492561340332, "global_step": 99985, "epoch": 1204} {"train_loss": -21.829740524291992, "global_step": 99986, "epoch": 1204} {"train_loss": -21.59278678894043, "global_step": 99987, "epoch": 1204} {"train_loss": -21.844724655151367, "global_step": 99988, "epoch": 1204} {"train_loss": -22.326034545898438, "global_step": 99989, "epoch": 1204} {"train_loss": -21.887107849121094, "global_step": 99990, "epoch": 1204} {"train_loss": -22.163522720336914, "global_step": 99991, "epoch": 1204} {"train_loss": -22.09614372253418, "global_step": 99992, "epoch": 1204} {"train_loss": -21.822813034057617, "global_step": 99993, "epoch": 1204} {"train_loss": -21.591489791870117, "global_step": 99994, "epoch": 1204} {"train_loss": -21.68522071838379, "global_step": 99995, "epoch": 1204} {"train_loss": -22.286619186401367, "global_step": 99996, "epoch": 1204} {"train_loss": -21.757850646972656, "global_step": 99997, "epoch": 1204} {"train_loss": -21.77565574645996, "global_step": 99998, "epoch": 1204} {"train_loss": -21.747474670410156, "global_step": 99999, "epoch": 1204} {"train_loss": -21.90779685974121, "global_step": 100000, "epoch": 1204} {"train_loss": -21.76327896118164, "global_step": 100001, "epoch": 1204} {"train_loss": -21.797800064086914, "global_step": 100002, "epoch": 1204} {"train_loss": -21.875587463378906, "global_step": 100003, "epoch": 1204} {"train_loss": -22.150413513183594, "global_step": 100004, "epoch": 1204} {"train_loss": -22.054922103881836, "global_step": 100005, "epoch": 1204} {"train_loss": -21.986446380615234, "global_step": 100006, "epoch": 1204} {"train_loss": -22.10481071472168, "global_step": 100007, "epoch": 1204} {"train_loss": -22.150964736938477, "global_step": 100008, "epoch": 1204} {"train_loss": -21.53377342224121, "global_step": 100009, "epoch": 1204} {"train_loss": -22.133764266967773, "global_step": 100010, "epoch": 1204} {"train_loss": -22.125816345214844, "global_step": 100011, "epoch": 1204} {"train_loss": -21.999866485595703, "global_step": 100012, "epoch": 1204} {"train_loss": -22.158971786499023, "global_step": 100013, "epoch": 1204} {"train_loss": -21.912749485797193, "global_step": 100014, "epoch": 1204, "val_loss": 6066158.5} {"train_loss": -21.39875602722168, "global_step": 100015, "epoch": 1205} {"train_loss": -21.464603424072266, "global_step": 100016, "epoch": 1205} {"train_loss": -21.6581974029541, "global_step": 100017, "epoch": 1205} {"train_loss": -21.769996643066406, "global_step": 100018, "epoch": 1205} {"train_loss": -21.579837799072266, "global_step": 100019, "epoch": 1205} {"train_loss": -21.3060359954834, "global_step": 100020, "epoch": 1205} {"train_loss": -21.630985260009766, "global_step": 100021, "epoch": 1205} {"train_loss": -21.9135799407959, "global_step": 100022, "epoch": 1205} {"train_loss": -21.539968490600586, "global_step": 100023, "epoch": 1205} {"train_loss": -21.47871971130371, "global_step": 100024, "epoch": 1205} {"train_loss": -21.451656341552734, "global_step": 100025, "epoch": 1205} {"train_loss": -21.799915313720703, "global_step": 100026, "epoch": 1205} {"train_loss": -21.855892181396484, "global_step": 100027, "epoch": 1205} {"train_loss": -21.62932777404785, "global_step": 100028, "epoch": 1205} {"train_loss": -21.821168899536133, "global_step": 100029, "epoch": 1205} {"train_loss": -21.8131046295166, "global_step": 100030, "epoch": 1205} {"train_loss": -21.948644638061523, "global_step": 100031, "epoch": 1205} {"train_loss": -21.905956268310547, "global_step": 100032, "epoch": 1205} {"train_loss": -22.070947647094727, "global_step": 100033, "epoch": 1205} {"train_loss": -21.874927520751953, "global_step": 100034, "epoch": 1205} {"train_loss": -21.788034439086914, "global_step": 100035, "epoch": 1205} {"train_loss": -21.955507278442383, "global_step": 100036, "epoch": 1205} {"train_loss": -22.09551429748535, "global_step": 100037, "epoch": 1205} {"train_loss": -21.812091827392578, "global_step": 100038, "epoch": 1205} {"train_loss": -21.8586483001709, "global_step": 100039, "epoch": 1205} {"train_loss": -22.053600311279297, "global_step": 100040, "epoch": 1205} {"train_loss": -21.715951919555664, "global_step": 100041, "epoch": 1205} {"train_loss": -21.91806983947754, "global_step": 100042, "epoch": 1205} {"train_loss": -22.257246017456055, "global_step": 100043, "epoch": 1205} {"train_loss": -22.004453659057617, "global_step": 100044, "epoch": 1205} {"train_loss": -21.9621524810791, "global_step": 100045, "epoch": 1205} {"train_loss": -21.741979598999023, "global_step": 100046, "epoch": 1205} {"train_loss": -22.32964515686035, "global_step": 100047, "epoch": 1205} {"train_loss": -22.180315017700195, "global_step": 100048, "epoch": 1205} {"train_loss": -22.304458618164062, "global_step": 100049, "epoch": 1205} {"train_loss": -22.130277633666992, "global_step": 100050, "epoch": 1205} {"train_loss": -21.743881225585938, "global_step": 100051, "epoch": 1205} {"train_loss": -21.815624237060547, "global_step": 100052, "epoch": 1205} {"train_loss": -22.339269638061523, "global_step": 100053, "epoch": 1205} {"train_loss": -21.870155334472656, "global_step": 100054, "epoch": 1205} {"train_loss": -22.164342880249023, "global_step": 100055, "epoch": 1205} {"train_loss": -21.655399322509766, "global_step": 100056, "epoch": 1205} {"train_loss": -22.348621368408203, "global_step": 100057, "epoch": 1205} {"train_loss": -22.025720596313477, "global_step": 100058, "epoch": 1205} {"train_loss": -22.18223762512207, "global_step": 100059, "epoch": 1205} {"train_loss": -21.720884323120117, "global_step": 100060, "epoch": 1205} {"train_loss": -21.899471282958984, "global_step": 100061, "epoch": 1205} {"train_loss": -21.667797088623047, "global_step": 100062, "epoch": 1205} {"train_loss": -21.89705467224121, "global_step": 100063, "epoch": 1205} {"train_loss": -21.82979393005371, "global_step": 100064, "epoch": 1205} {"train_loss": -22.09513282775879, "global_step": 100065, "epoch": 1205} {"train_loss": -22.30678939819336, "global_step": 100066, "epoch": 1205} {"train_loss": -22.046762466430664, "global_step": 100067, "epoch": 1205} {"train_loss": -22.178813934326172, "global_step": 100068, "epoch": 1205} {"train_loss": -21.752826690673828, "global_step": 100069, "epoch": 1205} {"train_loss": -21.997295379638672, "global_step": 100070, "epoch": 1205} {"train_loss": -21.69573211669922, "global_step": 100071, "epoch": 1205} {"train_loss": -21.817720413208008, "global_step": 100072, "epoch": 1205} {"train_loss": -22.021366119384766, "global_step": 100073, "epoch": 1205} {"train_loss": -22.020797729492188, "global_step": 100074, "epoch": 1205} {"train_loss": -21.6673526763916, "global_step": 100075, "epoch": 1205} {"train_loss": -21.897287368774414, "global_step": 100076, "epoch": 1205} {"train_loss": -21.745885848999023, "global_step": 100077, "epoch": 1205} {"train_loss": -21.9130859375, "global_step": 100078, "epoch": 1205} {"train_loss": -21.9632511138916, "global_step": 100079, "epoch": 1205} {"train_loss": -21.690143585205078, "global_step": 100080, "epoch": 1205} {"train_loss": -22.62332534790039, "global_step": 100081, "epoch": 1205} {"train_loss": -21.549678802490234, "global_step": 100082, "epoch": 1205} {"train_loss": -21.415395736694336, "global_step": 100083, "epoch": 1205} {"train_loss": -21.862178802490234, "global_step": 100084, "epoch": 1205} {"train_loss": -21.875137329101562, "global_step": 100085, "epoch": 1205} {"train_loss": -22.086017608642578, "global_step": 100086, "epoch": 1205} {"train_loss": -21.432079315185547, "global_step": 100087, "epoch": 1205} {"train_loss": -22.23000144958496, "global_step": 100088, "epoch": 1205} {"train_loss": -21.975513458251953, "global_step": 100089, "epoch": 1205} {"train_loss": -21.946653366088867, "global_step": 100090, "epoch": 1205} {"train_loss": -21.940143585205078, "global_step": 100091, "epoch": 1205} {"train_loss": -22.0985164642334, "global_step": 100092, "epoch": 1205} {"train_loss": -21.947240829467773, "global_step": 100093, "epoch": 1205} {"train_loss": -22.08953285217285, "global_step": 100094, "epoch": 1205} {"train_loss": -21.70865249633789, "global_step": 100095, "epoch": 1205} {"train_loss": -21.926162719726562, "global_step": 100096, "epoch": 1205} {"train_loss": -21.872076310307147, "global_step": 100097, "epoch": 1205, "val_loss": 6271398.0} {"train_loss": -21.52411460876465, "global_step": 100098, "epoch": 1206} {"train_loss": -21.80079460144043, "global_step": 100099, "epoch": 1206} {"train_loss": -21.61922264099121, "global_step": 100100, "epoch": 1206} {"train_loss": -21.048648834228516, "global_step": 100101, "epoch": 1206} {"train_loss": -21.84421730041504, "global_step": 100102, "epoch": 1206} {"train_loss": -21.684337615966797, "global_step": 100103, "epoch": 1206} {"train_loss": -21.354337692260742, "global_step": 100104, "epoch": 1206} {"train_loss": -21.902141571044922, "global_step": 100105, "epoch": 1206} {"train_loss": -21.68726921081543, "global_step": 100106, "epoch": 1206} {"train_loss": -21.796384811401367, "global_step": 100107, "epoch": 1206} {"train_loss": -21.68890380859375, "global_step": 100108, "epoch": 1206} {"train_loss": -21.8586483001709, "global_step": 100109, "epoch": 1206} {"train_loss": -21.80156898498535, "global_step": 100110, "epoch": 1206} {"train_loss": -21.758703231811523, "global_step": 100111, "epoch": 1206} {"train_loss": -21.83050537109375, "global_step": 100112, "epoch": 1206} {"train_loss": -21.824356079101562, "global_step": 100113, "epoch": 1206} {"train_loss": -22.141315460205078, "global_step": 100114, "epoch": 1206} {"train_loss": -21.741592407226562, "global_step": 100115, "epoch": 1206} {"train_loss": -21.731874465942383, "global_step": 100116, "epoch": 1206} {"train_loss": -21.98109245300293, "global_step": 100117, "epoch": 1206} {"train_loss": -21.75943946838379, "global_step": 100118, "epoch": 1206} {"train_loss": -22.163877487182617, "global_step": 100119, "epoch": 1206} {"train_loss": -22.433349609375, "global_step": 100120, "epoch": 1206} {"train_loss": -22.217409133911133, "global_step": 100121, "epoch": 1206} {"train_loss": -21.95090103149414, "global_step": 100122, "epoch": 1206} {"train_loss": -21.707576751708984, "global_step": 100123, "epoch": 1206} {"train_loss": -22.173633575439453, "global_step": 100124, "epoch": 1206} {"train_loss": -21.531513214111328, "global_step": 100125, "epoch": 1206} {"train_loss": -21.733922958374023, "global_step": 100126, "epoch": 1206} {"train_loss": -21.69921875, "global_step": 100127, "epoch": 1206} {"train_loss": -21.77663803100586, "global_step": 100128, "epoch": 1206} {"train_loss": -22.023908615112305, "global_step": 100129, "epoch": 1206} {"train_loss": -21.596355438232422, "global_step": 100130, "epoch": 1206} {"train_loss": -21.909317016601562, "global_step": 100131, "epoch": 1206} {"train_loss": -22.06443977355957, "global_step": 100132, "epoch": 1206} {"train_loss": -21.950651168823242, "global_step": 100133, "epoch": 1206} {"train_loss": -21.740447998046875, "global_step": 100134, "epoch": 1206} {"train_loss": -22.232229232788086, "global_step": 100135, "epoch": 1206} {"train_loss": -21.914472579956055, "global_step": 100136, "epoch": 1206} {"train_loss": -21.80470085144043, "global_step": 100137, "epoch": 1206} {"train_loss": -22.256933212280273, "global_step": 100138, "epoch": 1206} {"train_loss": -21.974761962890625, "global_step": 100139, "epoch": 1206} {"train_loss": -22.29412841796875, "global_step": 100140, "epoch": 1206} {"train_loss": -21.877944946289062, "global_step": 100141, "epoch": 1206} {"train_loss": -21.862791061401367, "global_step": 100142, "epoch": 1206} {"train_loss": -21.883031845092773, "global_step": 100143, "epoch": 1206} {"train_loss": -22.25494384765625, "global_step": 100144, "epoch": 1206} {"train_loss": -21.9492244720459, "global_step": 100145, "epoch": 1206} {"train_loss": -21.852758407592773, "global_step": 100146, "epoch": 1206} {"train_loss": -22.142831802368164, "global_step": 100147, "epoch": 1206} {"train_loss": -22.042905807495117, "global_step": 100148, "epoch": 1206} {"train_loss": -21.716468811035156, "global_step": 100149, "epoch": 1206} {"train_loss": -21.58746910095215, "global_step": 100150, "epoch": 1206} {"train_loss": -21.915098190307617, "global_step": 100151, "epoch": 1206} {"train_loss": -22.032983779907227, "global_step": 100152, "epoch": 1206} {"train_loss": -22.04370880126953, "global_step": 100153, "epoch": 1206} {"train_loss": -21.536495208740234, "global_step": 100154, "epoch": 1206} {"train_loss": -21.80668067932129, "global_step": 100155, "epoch": 1206} {"train_loss": -21.451704025268555, "global_step": 100156, "epoch": 1206} {"train_loss": -22.14566421508789, "global_step": 100157, "epoch": 1206} {"train_loss": -22.03413200378418, "global_step": 100158, "epoch": 1206} {"train_loss": -22.029422760009766, "global_step": 100159, "epoch": 1206} {"train_loss": -21.536102294921875, "global_step": 100160, "epoch": 1206} {"train_loss": -22.07158851623535, "global_step": 100161, "epoch": 1206} {"train_loss": -21.9987850189209, "global_step": 100162, "epoch": 1206} {"train_loss": -21.562822341918945, "global_step": 100163, "epoch": 1206} {"train_loss": -21.715757369995117, "global_step": 100164, "epoch": 1206} {"train_loss": -21.96919059753418, "global_step": 100165, "epoch": 1206} {"train_loss": -21.859073638916016, "global_step": 100166, "epoch": 1206} {"train_loss": -21.949426651000977, "global_step": 100167, "epoch": 1206} {"train_loss": -21.761625289916992, "global_step": 100168, "epoch": 1206} {"train_loss": -21.67702293395996, "global_step": 100169, "epoch": 1206} {"train_loss": -21.975309371948242, "global_step": 100170, "epoch": 1206} {"train_loss": -22.17658042907715, "global_step": 100171, "epoch": 1206} {"train_loss": -21.85291862487793, "global_step": 100172, "epoch": 1206} {"train_loss": -21.933496475219727, "global_step": 100173, "epoch": 1206} {"train_loss": -21.94995880126953, "global_step": 100174, "epoch": 1206} {"train_loss": -22.234140396118164, "global_step": 100175, "epoch": 1206} {"train_loss": -21.651351928710938, "global_step": 100176, "epoch": 1206} {"train_loss": -21.831777572631836, "global_step": 100177, "epoch": 1206} {"train_loss": -22.153881072998047, "global_step": 100178, "epoch": 1206} {"train_loss": -22.04098892211914, "global_step": 100179, "epoch": 1206} {"train_loss": -21.856906362326747, "global_step": 100180, "epoch": 1206, "val_loss": 6091740.0} {"train_loss": -21.497804641723633, "global_step": 100181, "epoch": 1207} {"train_loss": -21.559823989868164, "global_step": 100182, "epoch": 1207} {"train_loss": -21.73818016052246, "global_step": 100183, "epoch": 1207} {"train_loss": -21.83408546447754, "global_step": 100184, "epoch": 1207} {"train_loss": -21.6308650970459, "global_step": 100185, "epoch": 1207} {"train_loss": -22.026018142700195, "global_step": 100186, "epoch": 1207} {"train_loss": -21.841581344604492, "global_step": 100187, "epoch": 1207} {"train_loss": -21.87179946899414, "global_step": 100188, "epoch": 1207} {"train_loss": -21.690292358398438, "global_step": 100189, "epoch": 1207} {"train_loss": -21.945199966430664, "global_step": 100190, "epoch": 1207} {"train_loss": -21.71588706970215, "global_step": 100191, "epoch": 1207} {"train_loss": -21.938520431518555, "global_step": 100192, "epoch": 1207} {"train_loss": -21.976892471313477, "global_step": 100193, "epoch": 1207} {"train_loss": -21.926311492919922, "global_step": 100194, "epoch": 1207} {"train_loss": -21.70440673828125, "global_step": 100195, "epoch": 1207} {"train_loss": -21.82879638671875, "global_step": 100196, "epoch": 1207} {"train_loss": -22.221487045288086, "global_step": 100197, "epoch": 1207} {"train_loss": -21.930191040039062, "global_step": 100198, "epoch": 1207} {"train_loss": -22.04509735107422, "global_step": 100199, "epoch": 1207} {"train_loss": -21.70956039428711, "global_step": 100200, "epoch": 1207} {"train_loss": -22.133602142333984, "global_step": 100201, "epoch": 1207} {"train_loss": -21.999326705932617, "global_step": 100202, "epoch": 1207} {"train_loss": -22.341672897338867, "global_step": 100203, "epoch": 1207} {"train_loss": -22.04324722290039, "global_step": 100204, "epoch": 1207} {"train_loss": -21.770891189575195, "global_step": 100205, "epoch": 1207} {"train_loss": -21.935636520385742, "global_step": 100206, "epoch": 1207} {"train_loss": -22.17734718322754, "global_step": 100207, "epoch": 1207} {"train_loss": -21.73179054260254, "global_step": 100208, "epoch": 1207} {"train_loss": -21.919954299926758, "global_step": 100209, "epoch": 1207} {"train_loss": -21.967451095581055, "global_step": 100210, "epoch": 1207} {"train_loss": -22.158597946166992, "global_step": 100211, "epoch": 1207} {"train_loss": -21.908464431762695, "global_step": 100212, "epoch": 1207} {"train_loss": -21.630878448486328, "global_step": 100213, "epoch": 1207} {"train_loss": -21.990201950073242, "global_step": 100214, "epoch": 1207} {"train_loss": -22.052268981933594, "global_step": 100215, "epoch": 1207} {"train_loss": -21.759775161743164, "global_step": 100216, "epoch": 1207} {"train_loss": -21.88472557067871, "global_step": 100217, "epoch": 1207} {"train_loss": -22.039777755737305, "global_step": 100218, "epoch": 1207} {"train_loss": -21.893362045288086, "global_step": 100219, "epoch": 1207} {"train_loss": -21.681976318359375, "global_step": 100220, "epoch": 1207} {"train_loss": -21.5696964263916, "global_step": 100221, "epoch": 1207} {"train_loss": -21.886083602905273, "global_step": 100222, "epoch": 1207} {"train_loss": -21.827007293701172, "global_step": 100223, "epoch": 1207} {"train_loss": -22.154645919799805, "global_step": 100224, "epoch": 1207} {"train_loss": -21.47245979309082, "global_step": 100225, "epoch": 1207} {"train_loss": -22.084136962890625, "global_step": 100226, "epoch": 1207} {"train_loss": -22.17112159729004, "global_step": 100227, "epoch": 1207} {"train_loss": -22.016332626342773, "global_step": 100228, "epoch": 1207} {"train_loss": -21.62740135192871, "global_step": 100229, "epoch": 1207} {"train_loss": -21.872238159179688, "global_step": 100230, "epoch": 1207} {"train_loss": -22.16483497619629, "global_step": 100231, "epoch": 1207} {"train_loss": -21.87661361694336, "global_step": 100232, "epoch": 1207} {"train_loss": -21.859769821166992, "global_step": 100233, "epoch": 1207} {"train_loss": -21.9891414642334, "global_step": 100234, "epoch": 1207} {"train_loss": -21.981401443481445, "global_step": 100235, "epoch": 1207} {"train_loss": -22.050918579101562, "global_step": 100236, "epoch": 1207} {"train_loss": -21.743370056152344, "global_step": 100237, "epoch": 1207} {"train_loss": -21.93581199645996, "global_step": 100238, "epoch": 1207} {"train_loss": -21.97732925415039, "global_step": 100239, "epoch": 1207} {"train_loss": -21.79768180847168, "global_step": 100240, "epoch": 1207} {"train_loss": -21.919281005859375, "global_step": 100241, "epoch": 1207} {"train_loss": -22.2327938079834, "global_step": 100242, "epoch": 1207} {"train_loss": -22.35725975036621, "global_step": 100243, "epoch": 1207} {"train_loss": -21.490476608276367, "global_step": 100244, "epoch": 1207} {"train_loss": -21.654516220092773, "global_step": 100245, "epoch": 1207} {"train_loss": -22.373680114746094, "global_step": 100246, "epoch": 1207} {"train_loss": -21.824859619140625, "global_step": 100247, "epoch": 1207} {"train_loss": -21.37953758239746, "global_step": 100248, "epoch": 1207} {"train_loss": -22.04145050048828, "global_step": 100249, "epoch": 1207} {"train_loss": -22.013656616210938, "global_step": 100250, "epoch": 1207} {"train_loss": -22.09357261657715, "global_step": 100251, "epoch": 1207} {"train_loss": -21.911752700805664, "global_step": 100252, "epoch": 1207} {"train_loss": -22.437274932861328, "global_step": 100253, "epoch": 1207} {"train_loss": -21.816940307617188, "global_step": 100254, "epoch": 1207} {"train_loss": -21.817066192626953, "global_step": 100255, "epoch": 1207} {"train_loss": -21.948244094848633, "global_step": 100256, "epoch": 1207} {"train_loss": -22.19764518737793, "global_step": 100257, "epoch": 1207} {"train_loss": -22.033668518066406, "global_step": 100258, "epoch": 1207} {"train_loss": -21.811656951904297, "global_step": 100259, "epoch": 1207} {"train_loss": -22.413909912109375, "global_step": 100260, "epoch": 1207} {"train_loss": -22.153318405151367, "global_step": 100261, "epoch": 1207} {"train_loss": -21.680450439453125, "global_step": 100262, "epoch": 1207} {"train_loss": -21.9191029100533, "global_step": 100263, "epoch": 1207, "val_loss": 6146595.0} {"train_loss": -21.38840675354004, "global_step": 100264, "epoch": 1208} {"train_loss": -21.30165672302246, "global_step": 100265, "epoch": 1208} {"train_loss": -21.888347625732422, "global_step": 100266, "epoch": 1208} {"train_loss": -21.305133819580078, "global_step": 100267, "epoch": 1208} {"train_loss": -21.66727066040039, "global_step": 100268, "epoch": 1208} {"train_loss": -21.93582534790039, "global_step": 100269, "epoch": 1208} {"train_loss": -21.44881248474121, "global_step": 100270, "epoch": 1208} {"train_loss": -21.957921981811523, "global_step": 100271, "epoch": 1208} {"train_loss": -21.785009384155273, "global_step": 100272, "epoch": 1208} {"train_loss": -21.359024047851562, "global_step": 100273, "epoch": 1208} {"train_loss": -21.866262435913086, "global_step": 100274, "epoch": 1208} {"train_loss": -21.94759178161621, "global_step": 100275, "epoch": 1208} {"train_loss": -21.564788818359375, "global_step": 100276, "epoch": 1208} {"train_loss": -21.880359649658203, "global_step": 100277, "epoch": 1208} {"train_loss": -21.51507568359375, "global_step": 100278, "epoch": 1208} {"train_loss": -22.18233299255371, "global_step": 100279, "epoch": 1208} {"train_loss": -21.723068237304688, "global_step": 100280, "epoch": 1208} {"train_loss": -21.552753448486328, "global_step": 100281, "epoch": 1208} {"train_loss": -21.835878372192383, "global_step": 100282, "epoch": 1208} {"train_loss": -21.87649917602539, "global_step": 100283, "epoch": 1208} {"train_loss": -22.0810546875, "global_step": 100284, "epoch": 1208} {"train_loss": -21.67011833190918, "global_step": 100285, "epoch": 1208} {"train_loss": -21.962848663330078, "global_step": 100286, "epoch": 1208} {"train_loss": -21.628067016601562, "global_step": 100287, "epoch": 1208} {"train_loss": -21.623998641967773, "global_step": 100288, "epoch": 1208} {"train_loss": -21.819080352783203, "global_step": 100289, "epoch": 1208} {"train_loss": -21.682514190673828, "global_step": 100290, "epoch": 1208} {"train_loss": -21.881723403930664, "global_step": 100291, "epoch": 1208} {"train_loss": -21.70184898376465, "global_step": 100292, "epoch": 1208} {"train_loss": -21.78859519958496, "global_step": 100293, "epoch": 1208} {"train_loss": -21.894882202148438, "global_step": 100294, "epoch": 1208} {"train_loss": -22.190032958984375, "global_step": 100295, "epoch": 1208} {"train_loss": -22.15712547302246, "global_step": 100296, "epoch": 1208} {"train_loss": -22.016685485839844, "global_step": 100297, "epoch": 1208} {"train_loss": -21.90397071838379, "global_step": 100298, "epoch": 1208} {"train_loss": -21.915180206298828, "global_step": 100299, "epoch": 1208} {"train_loss": -21.943805694580078, "global_step": 100300, "epoch": 1208} {"train_loss": -22.19745445251465, "global_step": 100301, "epoch": 1208} {"train_loss": -21.846647262573242, "global_step": 100302, "epoch": 1208} {"train_loss": -22.095869064331055, "global_step": 100303, "epoch": 1208} {"train_loss": -22.247011184692383, "global_step": 100304, "epoch": 1208} {"train_loss": -21.912540435791016, "global_step": 100305, "epoch": 1208} {"train_loss": -22.104284286499023, "global_step": 100306, "epoch": 1208} {"train_loss": -21.779159545898438, "global_step": 100307, "epoch": 1208} {"train_loss": -21.658103942871094, "global_step": 100308, "epoch": 1208} {"train_loss": -21.463592529296875, "global_step": 100309, "epoch": 1208} {"train_loss": -21.98457145690918, "global_step": 100310, "epoch": 1208} {"train_loss": -22.062780380249023, "global_step": 100311, "epoch": 1208} {"train_loss": -22.023962020874023, "global_step": 100312, "epoch": 1208} {"train_loss": -21.76736831665039, "global_step": 100313, "epoch": 1208} {"train_loss": -22.070514678955078, "global_step": 100314, "epoch": 1208} {"train_loss": -22.138904571533203, "global_step": 100315, "epoch": 1208} {"train_loss": -21.80181884765625, "global_step": 100316, "epoch": 1208} {"train_loss": -22.051315307617188, "global_step": 100317, "epoch": 1208} {"train_loss": -21.978403091430664, "global_step": 100318, "epoch": 1208} {"train_loss": -21.720335006713867, "global_step": 100319, "epoch": 1208} {"train_loss": -21.8613224029541, "global_step": 100320, "epoch": 1208} {"train_loss": -22.221214294433594, "global_step": 100321, "epoch": 1208} {"train_loss": -22.100784301757812, "global_step": 100322, "epoch": 1208} {"train_loss": -21.708057403564453, "global_step": 100323, "epoch": 1208} {"train_loss": -22.44916343688965, "global_step": 100324, "epoch": 1208} {"train_loss": -22.036991119384766, "global_step": 100325, "epoch": 1208} {"train_loss": -22.072601318359375, "global_step": 100326, "epoch": 1208} {"train_loss": -22.13852310180664, "global_step": 100327, "epoch": 1208} {"train_loss": -21.886734008789062, "global_step": 100328, "epoch": 1208} {"train_loss": -21.88068199157715, "global_step": 100329, "epoch": 1208} {"train_loss": -21.92038917541504, "global_step": 100330, "epoch": 1208} {"train_loss": -22.093591690063477, "global_step": 100331, "epoch": 1208} {"train_loss": -22.192548751831055, "global_step": 100332, "epoch": 1208} {"train_loss": -22.107351303100586, "global_step": 100333, "epoch": 1208} {"train_loss": -22.063230514526367, "global_step": 100334, "epoch": 1208} {"train_loss": -21.669391632080078, "global_step": 100335, "epoch": 1208} {"train_loss": -21.589487075805664, "global_step": 100336, "epoch": 1208} {"train_loss": -22.137847900390625, "global_step": 100337, "epoch": 1208} {"train_loss": -22.124967575073242, "global_step": 100338, "epoch": 1208} {"train_loss": -21.513702392578125, "global_step": 100339, "epoch": 1208} {"train_loss": -22.01300621032715, "global_step": 100340, "epoch": 1208} {"train_loss": -22.035688400268555, "global_step": 100341, "epoch": 1208} {"train_loss": -21.657590866088867, "global_step": 100342, "epoch": 1208} {"train_loss": -21.753175735473633, "global_step": 100343, "epoch": 1208} {"train_loss": -22.12134552001953, "global_step": 100344, "epoch": 1208} {"train_loss": -21.881765365600586, "global_step": 100345, "epoch": 1208} {"train_loss": -21.886037343955902, "global_step": 100346, "epoch": 1208, "val_loss": 6277387.0} {"train_loss": -21.263517379760742, "global_step": 100347, "epoch": 1209} {"train_loss": -21.270183563232422, "global_step": 100348, "epoch": 1209} {"train_loss": -21.331348419189453, "global_step": 100349, "epoch": 1209} {"train_loss": -21.312833786010742, "global_step": 100350, "epoch": 1209} {"train_loss": -21.410024642944336, "global_step": 100351, "epoch": 1209} {"train_loss": -21.245214462280273, "global_step": 100352, "epoch": 1209} {"train_loss": -22.098588943481445, "global_step": 100353, "epoch": 1209} {"train_loss": -21.644134521484375, "global_step": 100354, "epoch": 1209} {"train_loss": -21.803030014038086, "global_step": 100355, "epoch": 1209} {"train_loss": -22.04293441772461, "global_step": 100356, "epoch": 1209} {"train_loss": -21.88296890258789, "global_step": 100357, "epoch": 1209} {"train_loss": -21.657392501831055, "global_step": 100358, "epoch": 1209} {"train_loss": -21.8139705657959, "global_step": 100359, "epoch": 1209} {"train_loss": -21.83289337158203, "global_step": 100360, "epoch": 1209} {"train_loss": -21.72440528869629, "global_step": 100361, "epoch": 1209} {"train_loss": -22.04847526550293, "global_step": 100362, "epoch": 1209} {"train_loss": -22.204744338989258, "global_step": 100363, "epoch": 1209} {"train_loss": -21.779226303100586, "global_step": 100364, "epoch": 1209} {"train_loss": -21.76605796813965, "global_step": 100365, "epoch": 1209} {"train_loss": -21.74518394470215, "global_step": 100366, "epoch": 1209} {"train_loss": -22.15682029724121, "global_step": 100367, "epoch": 1209} {"train_loss": -21.984207153320312, "global_step": 100368, "epoch": 1209} {"train_loss": -21.93671989440918, "global_step": 100369, "epoch": 1209} {"train_loss": -21.865510940551758, "global_step": 100370, "epoch": 1209} {"train_loss": -22.241363525390625, "global_step": 100371, "epoch": 1209} {"train_loss": -21.832366943359375, "global_step": 100372, "epoch": 1209} {"train_loss": -21.821264266967773, "global_step": 100373, "epoch": 1209} {"train_loss": -21.85706901550293, "global_step": 100374, "epoch": 1209} {"train_loss": -21.9741153717041, "global_step": 100375, "epoch": 1209} {"train_loss": -21.85302734375, "global_step": 100376, "epoch": 1209} {"train_loss": -21.751678466796875, "global_step": 100377, "epoch": 1209} {"train_loss": -22.050687789916992, "global_step": 100378, "epoch": 1209} {"train_loss": -21.77756690979004, "global_step": 100379, "epoch": 1209} {"train_loss": -21.907697677612305, "global_step": 100380, "epoch": 1209} {"train_loss": -22.15455436706543, "global_step": 100381, "epoch": 1209} {"train_loss": -21.883216857910156, "global_step": 100382, "epoch": 1209} {"train_loss": -22.022186279296875, "global_step": 100383, "epoch": 1209} {"train_loss": -22.005456924438477, "global_step": 100384, "epoch": 1209} {"train_loss": -21.600095748901367, "global_step": 100385, "epoch": 1209} {"train_loss": -21.714086532592773, "global_step": 100386, "epoch": 1209} {"train_loss": -21.89462661743164, "global_step": 100387, "epoch": 1209} {"train_loss": -21.9067440032959, "global_step": 100388, "epoch": 1209} {"train_loss": -22.041696548461914, "global_step": 100389, "epoch": 1209} {"train_loss": -22.033000946044922, "global_step": 100390, "epoch": 1209} {"train_loss": -21.51883316040039, "global_step": 100391, "epoch": 1209} {"train_loss": -22.03680419921875, "global_step": 100392, "epoch": 1209} {"train_loss": -21.783090591430664, "global_step": 100393, "epoch": 1209} {"train_loss": -22.10224723815918, "global_step": 100394, "epoch": 1209} {"train_loss": -21.8781681060791, "global_step": 100395, "epoch": 1209} {"train_loss": -21.837085723876953, "global_step": 100396, "epoch": 1209} {"train_loss": -22.131025314331055, "global_step": 100397, "epoch": 1209} {"train_loss": -21.88350486755371, "global_step": 100398, "epoch": 1209} {"train_loss": -22.149961471557617, "global_step": 100399, "epoch": 1209} {"train_loss": -21.864164352416992, "global_step": 100400, "epoch": 1209} {"train_loss": -21.837018966674805, "global_step": 100401, "epoch": 1209} {"train_loss": -21.476974487304688, "global_step": 100402, "epoch": 1209} {"train_loss": -21.9411678314209, "global_step": 100403, "epoch": 1209} {"train_loss": -22.081926345825195, "global_step": 100404, "epoch": 1209} {"train_loss": -21.90471649169922, "global_step": 100405, "epoch": 1209} {"train_loss": -22.221492767333984, "global_step": 100406, "epoch": 1209} {"train_loss": -22.53519058227539, "global_step": 100407, "epoch": 1209} {"train_loss": -22.059539794921875, "global_step": 100408, "epoch": 1209} {"train_loss": -21.789215087890625, "global_step": 100409, "epoch": 1209} {"train_loss": -22.074613571166992, "global_step": 100410, "epoch": 1209} {"train_loss": -21.759353637695312, "global_step": 100411, "epoch": 1209} {"train_loss": -22.082454681396484, "global_step": 100412, "epoch": 1209} {"train_loss": -21.996967315673828, "global_step": 100413, "epoch": 1209} {"train_loss": -22.142553329467773, "global_step": 100414, "epoch": 1209} {"train_loss": -22.0642032623291, "global_step": 100415, "epoch": 1209} {"train_loss": -22.21189308166504, "global_step": 100416, "epoch": 1209} {"train_loss": -21.78645896911621, "global_step": 100417, "epoch": 1209} {"train_loss": -22.199039459228516, "global_step": 100418, "epoch": 1209} {"train_loss": -22.373167037963867, "global_step": 100419, "epoch": 1209} {"train_loss": -21.878742218017578, "global_step": 100420, "epoch": 1209} {"train_loss": -22.196386337280273, "global_step": 100421, "epoch": 1209} {"train_loss": -22.18219566345215, "global_step": 100422, "epoch": 1209} {"train_loss": -21.926849365234375, "global_step": 100423, "epoch": 1209} {"train_loss": -21.87613296508789, "global_step": 100424, "epoch": 1209} {"train_loss": -22.12222671508789, "global_step": 100425, "epoch": 1209} {"train_loss": -22.24078941345215, "global_step": 100426, "epoch": 1209} {"train_loss": -22.22707176208496, "global_step": 100427, "epoch": 1209} {"train_loss": -21.946544647216797, "global_step": 100428, "epoch": 1209} {"train_loss": -21.89389005913792, "global_step": 100429, "epoch": 1209, "val_loss": 6247190.0} {"train_loss": -20.558731079101562, "global_step": 100430, "epoch": 1210} {"train_loss": -21.297290802001953, "global_step": 100431, "epoch": 1210} {"train_loss": -21.28244972229004, "global_step": 100432, "epoch": 1210} {"train_loss": -21.628416061401367, "global_step": 100433, "epoch": 1210} {"train_loss": -21.2054386138916, "global_step": 100434, "epoch": 1210} {"train_loss": -21.4393367767334, "global_step": 100435, "epoch": 1210} {"train_loss": -21.36260414123535, "global_step": 100436, "epoch": 1210} {"train_loss": -21.599374771118164, "global_step": 100437, "epoch": 1210} {"train_loss": -21.780744552612305, "global_step": 100438, "epoch": 1210} {"train_loss": -21.76506233215332, "global_step": 100439, "epoch": 1210} {"train_loss": -21.5914249420166, "global_step": 100440, "epoch": 1210} {"train_loss": -21.869243621826172, "global_step": 100441, "epoch": 1210} {"train_loss": -22.045774459838867, "global_step": 100442, "epoch": 1210} {"train_loss": -21.705093383789062, "global_step": 100443, "epoch": 1210} {"train_loss": -21.722339630126953, "global_step": 100444, "epoch": 1210} {"train_loss": -21.93385124206543, "global_step": 100445, "epoch": 1210} {"train_loss": -21.78614616394043, "global_step": 100446, "epoch": 1210} {"train_loss": -22.012271881103516, "global_step": 100447, "epoch": 1210} {"train_loss": -22.032005310058594, "global_step": 100448, "epoch": 1210} {"train_loss": -21.52216911315918, "global_step": 100449, "epoch": 1210} {"train_loss": -21.470983505249023, "global_step": 100450, "epoch": 1210} {"train_loss": -21.340734481811523, "global_step": 100451, "epoch": 1210} {"train_loss": -22.102155685424805, "global_step": 100452, "epoch": 1210} {"train_loss": -22.2388973236084, "global_step": 100453, "epoch": 1210} {"train_loss": -21.804994583129883, "global_step": 100454, "epoch": 1210} {"train_loss": -21.894027709960938, "global_step": 100455, "epoch": 1210} {"train_loss": -21.6143856048584, "global_step": 100456, "epoch": 1210} {"train_loss": -21.5920467376709, "global_step": 100457, "epoch": 1210} {"train_loss": -22.093524932861328, "global_step": 100458, "epoch": 1210} {"train_loss": -22.216205596923828, "global_step": 100459, "epoch": 1210} {"train_loss": -21.6278133392334, "global_step": 100460, "epoch": 1210} {"train_loss": -21.835065841674805, "global_step": 100461, "epoch": 1210} {"train_loss": -21.399295806884766, "global_step": 100462, "epoch": 1210} {"train_loss": -21.886011123657227, "global_step": 100463, "epoch": 1210} {"train_loss": -21.882932662963867, "global_step": 100464, "epoch": 1210} {"train_loss": -21.577802658081055, "global_step": 100465, "epoch": 1210} {"train_loss": -21.994457244873047, "global_step": 100466, "epoch": 1210} {"train_loss": -21.87725067138672, "global_step": 100467, "epoch": 1210} {"train_loss": -21.999183654785156, "global_step": 100468, "epoch": 1210} {"train_loss": -21.571218490600586, "global_step": 100469, "epoch": 1210} {"train_loss": -21.776124954223633, "global_step": 100470, "epoch": 1210} {"train_loss": -21.707138061523438, "global_step": 100471, "epoch": 1210} {"train_loss": -21.491044998168945, "global_step": 100472, "epoch": 1210} {"train_loss": -22.22470474243164, "global_step": 100473, "epoch": 1210} {"train_loss": -22.09980583190918, "global_step": 100474, "epoch": 1210} {"train_loss": -22.0499324798584, "global_step": 100475, "epoch": 1210} {"train_loss": -21.936235427856445, "global_step": 100476, "epoch": 1210} {"train_loss": -21.786710739135742, "global_step": 100477, "epoch": 1210} {"train_loss": -21.92767333984375, "global_step": 100478, "epoch": 1210} {"train_loss": -21.858152389526367, "global_step": 100479, "epoch": 1210} {"train_loss": -22.328279495239258, "global_step": 100480, "epoch": 1210} {"train_loss": -22.141820907592773, "global_step": 100481, "epoch": 1210} {"train_loss": -21.651975631713867, "global_step": 100482, "epoch": 1210} {"train_loss": -21.896635055541992, "global_step": 100483, "epoch": 1210} {"train_loss": -22.109628677368164, "global_step": 100484, "epoch": 1210} {"train_loss": -22.290407180786133, "global_step": 100485, "epoch": 1210} {"train_loss": -21.90791130065918, "global_step": 100486, "epoch": 1210} {"train_loss": -21.892187118530273, "global_step": 100487, "epoch": 1210} {"train_loss": -21.856908798217773, "global_step": 100488, "epoch": 1210} {"train_loss": -21.48884391784668, "global_step": 100489, "epoch": 1210} {"train_loss": -21.706235885620117, "global_step": 100490, "epoch": 1210} {"train_loss": -21.810890197753906, "global_step": 100491, "epoch": 1210} {"train_loss": -22.081754684448242, "global_step": 100492, "epoch": 1210} {"train_loss": -21.7508487701416, "global_step": 100493, "epoch": 1210} {"train_loss": -21.73074722290039, "global_step": 100494, "epoch": 1210} {"train_loss": -22.242130279541016, "global_step": 100495, "epoch": 1210} {"train_loss": -22.083267211914062, "global_step": 100496, "epoch": 1210} {"train_loss": -21.913301467895508, "global_step": 100497, "epoch": 1210} {"train_loss": -21.897504806518555, "global_step": 100498, "epoch": 1210} {"train_loss": -21.82513999938965, "global_step": 100499, "epoch": 1210} {"train_loss": -21.99907684326172, "global_step": 100500, "epoch": 1210} {"train_loss": -21.943639755249023, "global_step": 100501, "epoch": 1210} {"train_loss": -21.950225830078125, "global_step": 100502, "epoch": 1210} {"train_loss": -22.002439498901367, "global_step": 100503, "epoch": 1210} {"train_loss": -21.77957534790039, "global_step": 100504, "epoch": 1210} {"train_loss": -21.819143295288086, "global_step": 100505, "epoch": 1210} {"train_loss": -21.79328727722168, "global_step": 100506, "epoch": 1210} {"train_loss": -22.125072479248047, "global_step": 100507, "epoch": 1210} {"train_loss": -21.72482681274414, "global_step": 100508, "epoch": 1210} {"train_loss": -21.887847900390625, "global_step": 100509, "epoch": 1210} {"train_loss": -21.704696655273438, "global_step": 100510, "epoch": 1210} {"train_loss": -21.771080017089844, "global_step": 100511, "epoch": 1210} {"train_loss": -21.819267755531403, "global_step": 100512, "epoch": 1210, "val_loss": 6186926.0} {"train_loss": -21.259550094604492, "global_step": 100513, "epoch": 1211} {"train_loss": -21.798582077026367, "global_step": 100514, "epoch": 1211} {"train_loss": -22.124414443969727, "global_step": 100515, "epoch": 1211} {"train_loss": -21.67279624938965, "global_step": 100516, "epoch": 1211} {"train_loss": -21.89255142211914, "global_step": 100517, "epoch": 1211} {"train_loss": -21.74686050415039, "global_step": 100518, "epoch": 1211} {"train_loss": -21.51203155517578, "global_step": 100519, "epoch": 1211} {"train_loss": -21.94454002380371, "global_step": 100520, "epoch": 1211} {"train_loss": -21.34339141845703, "global_step": 100521, "epoch": 1211} {"train_loss": -21.275205612182617, "global_step": 100522, "epoch": 1211} {"train_loss": -21.673856735229492, "global_step": 100523, "epoch": 1211} {"train_loss": -22.06553077697754, "global_step": 100524, "epoch": 1211} {"train_loss": -21.940095901489258, "global_step": 100525, "epoch": 1211} {"train_loss": -21.61871337890625, "global_step": 100526, "epoch": 1211} {"train_loss": -21.683897018432617, "global_step": 100527, "epoch": 1211} {"train_loss": -22.10672378540039, "global_step": 100528, "epoch": 1211} {"train_loss": -21.508867263793945, "global_step": 100529, "epoch": 1211} {"train_loss": -21.789331436157227, "global_step": 100530, "epoch": 1211} {"train_loss": -21.728357315063477, "global_step": 100531, "epoch": 1211} {"train_loss": -21.727323532104492, "global_step": 100532, "epoch": 1211} {"train_loss": -21.952360153198242, "global_step": 100533, "epoch": 1211} {"train_loss": -22.100446701049805, "global_step": 100534, "epoch": 1211} {"train_loss": -22.06816291809082, "global_step": 100535, "epoch": 1211} {"train_loss": -22.410120010375977, "global_step": 100536, "epoch": 1211} {"train_loss": -22.040668487548828, "global_step": 100537, "epoch": 1211} {"train_loss": -22.002887725830078, "global_step": 100538, "epoch": 1211} {"train_loss": -21.916051864624023, "global_step": 100539, "epoch": 1211} {"train_loss": -22.282392501831055, "global_step": 100540, "epoch": 1211} {"train_loss": -21.6563777923584, "global_step": 100541, "epoch": 1211} {"train_loss": -21.414636611938477, "global_step": 100542, "epoch": 1211} {"train_loss": -21.865375518798828, "global_step": 100543, "epoch": 1211} {"train_loss": -21.87681007385254, "global_step": 100544, "epoch": 1211} {"train_loss": -21.96811866760254, "global_step": 100545, "epoch": 1211} {"train_loss": -22.124937057495117, "global_step": 100546, "epoch": 1211} {"train_loss": -21.811338424682617, "global_step": 100547, "epoch": 1211} {"train_loss": -21.29245376586914, "global_step": 100548, "epoch": 1211} {"train_loss": -21.75328254699707, "global_step": 100549, "epoch": 1211} {"train_loss": -22.131322860717773, "global_step": 100550, "epoch": 1211} {"train_loss": -21.93744468688965, "global_step": 100551, "epoch": 1211} {"train_loss": -21.98064422607422, "global_step": 100552, "epoch": 1211} {"train_loss": -21.99622917175293, "global_step": 100553, "epoch": 1211} {"train_loss": -21.799367904663086, "global_step": 100554, "epoch": 1211} {"train_loss": -21.967498779296875, "global_step": 100555, "epoch": 1211} {"train_loss": -21.538700103759766, "global_step": 100556, "epoch": 1211} {"train_loss": -21.990488052368164, "global_step": 100557, "epoch": 1211} {"train_loss": -21.908235549926758, "global_step": 100558, "epoch": 1211} {"train_loss": -21.74907875061035, "global_step": 100559, "epoch": 1211} {"train_loss": -21.832181930541992, "global_step": 100560, "epoch": 1211} {"train_loss": -21.697723388671875, "global_step": 100561, "epoch": 1211} {"train_loss": -21.74302101135254, "global_step": 100562, "epoch": 1211} {"train_loss": -22.08258628845215, "global_step": 100563, "epoch": 1211} {"train_loss": -22.021848678588867, "global_step": 100564, "epoch": 1211} {"train_loss": -21.757062911987305, "global_step": 100565, "epoch": 1211} {"train_loss": -22.285062789916992, "global_step": 100566, "epoch": 1211} {"train_loss": -21.881071090698242, "global_step": 100567, "epoch": 1211} {"train_loss": -22.06190299987793, "global_step": 100568, "epoch": 1211} {"train_loss": -21.739177703857422, "global_step": 100569, "epoch": 1211} {"train_loss": -21.978647232055664, "global_step": 100570, "epoch": 1211} {"train_loss": -22.08711051940918, "global_step": 100571, "epoch": 1211} {"train_loss": -21.8985595703125, "global_step": 100572, "epoch": 1211} {"train_loss": -21.831560134887695, "global_step": 100573, "epoch": 1211} {"train_loss": -22.126102447509766, "global_step": 100574, "epoch": 1211} {"train_loss": -21.875564575195312, "global_step": 100575, "epoch": 1211} {"train_loss": -22.12033462524414, "global_step": 100576, "epoch": 1211} {"train_loss": -21.801725387573242, "global_step": 100577, "epoch": 1211} {"train_loss": -21.775772094726562, "global_step": 100578, "epoch": 1211} {"train_loss": -22.132246017456055, "global_step": 100579, "epoch": 1211} {"train_loss": -21.889917373657227, "global_step": 100580, "epoch": 1211} {"train_loss": -22.043930053710938, "global_step": 100581, "epoch": 1211} {"train_loss": -22.351076126098633, "global_step": 100582, "epoch": 1211} {"train_loss": -22.332990646362305, "global_step": 100583, "epoch": 1211} {"train_loss": -21.811159133911133, "global_step": 100584, "epoch": 1211} {"train_loss": -21.93157386779785, "global_step": 100585, "epoch": 1211} {"train_loss": -21.849008560180664, "global_step": 100586, "epoch": 1211} {"train_loss": -22.118467330932617, "global_step": 100587, "epoch": 1211} {"train_loss": -21.36586570739746, "global_step": 100588, "epoch": 1211} {"train_loss": -21.800569534301758, "global_step": 100589, "epoch": 1211} {"train_loss": -21.88237953186035, "global_step": 100590, "epoch": 1211} {"train_loss": -22.059560775756836, "global_step": 100591, "epoch": 1211} {"train_loss": -22.30022621154785, "global_step": 100592, "epoch": 1211} {"train_loss": -21.876087188720703, "global_step": 100593, "epoch": 1211} {"train_loss": -22.020782470703125, "global_step": 100594, "epoch": 1211} {"train_loss": -21.88485811991864, "global_step": 100595, "epoch": 1211, "val_loss": 6155477.5} {"train_loss": -21.94282341003418, "global_step": 100596, "epoch": 1212} {"train_loss": -21.754491806030273, "global_step": 100597, "epoch": 1212} {"train_loss": -21.38345718383789, "global_step": 100598, "epoch": 1212} {"train_loss": -21.466224670410156, "global_step": 100599, "epoch": 1212} {"train_loss": -21.533042907714844, "global_step": 100600, "epoch": 1212} {"train_loss": -21.382999420166016, "global_step": 100601, "epoch": 1212} {"train_loss": -21.339378356933594, "global_step": 100602, "epoch": 1212} {"train_loss": -21.734590530395508, "global_step": 100603, "epoch": 1212} {"train_loss": -21.811277389526367, "global_step": 100604, "epoch": 1212} {"train_loss": -21.853601455688477, "global_step": 100605, "epoch": 1212} {"train_loss": -21.716676712036133, "global_step": 100606, "epoch": 1212} {"train_loss": -21.69309425354004, "global_step": 100607, "epoch": 1212} {"train_loss": -21.939926147460938, "global_step": 100608, "epoch": 1212} {"train_loss": -21.653345108032227, "global_step": 100609, "epoch": 1212} {"train_loss": -21.681814193725586, "global_step": 100610, "epoch": 1212} {"train_loss": -21.676877975463867, "global_step": 100611, "epoch": 1212} {"train_loss": -21.6898136138916, "global_step": 100612, "epoch": 1212} {"train_loss": -21.84581756591797, "global_step": 100613, "epoch": 1212} {"train_loss": -21.85115623474121, "global_step": 100614, "epoch": 1212} {"train_loss": -21.77677345275879, "global_step": 100615, "epoch": 1212} {"train_loss": -21.92588996887207, "global_step": 100616, "epoch": 1212} {"train_loss": -21.84427833557129, "global_step": 100617, "epoch": 1212} {"train_loss": -21.87664794921875, "global_step": 100618, "epoch": 1212} {"train_loss": -21.831209182739258, "global_step": 100619, "epoch": 1212} {"train_loss": -21.664993286132812, "global_step": 100620, "epoch": 1212} {"train_loss": -21.777938842773438, "global_step": 100621, "epoch": 1212} {"train_loss": -22.384262084960938, "global_step": 100622, "epoch": 1212} {"train_loss": -21.914382934570312, "global_step": 100623, "epoch": 1212} {"train_loss": -21.536605834960938, "global_step": 100624, "epoch": 1212} {"train_loss": -22.060100555419922, "global_step": 100625, "epoch": 1212} {"train_loss": -21.766788482666016, "global_step": 100626, "epoch": 1212} {"train_loss": -22.021413803100586, "global_step": 100627, "epoch": 1212} {"train_loss": -21.757028579711914, "global_step": 100628, "epoch": 1212} {"train_loss": -22.273473739624023, "global_step": 100629, "epoch": 1212} {"train_loss": -22.003070831298828, "global_step": 100630, "epoch": 1212} {"train_loss": -21.874372482299805, "global_step": 100631, "epoch": 1212} {"train_loss": -21.87191390991211, "global_step": 100632, "epoch": 1212} {"train_loss": -21.86890983581543, "global_step": 100633, "epoch": 1212} {"train_loss": -22.285202026367188, "global_step": 100634, "epoch": 1212} {"train_loss": -21.574586868286133, "global_step": 100635, "epoch": 1212} {"train_loss": -22.026304244995117, "global_step": 100636, "epoch": 1212} {"train_loss": -22.006540298461914, "global_step": 100637, "epoch": 1212} {"train_loss": -21.905656814575195, "global_step": 100638, "epoch": 1212} {"train_loss": -21.98908042907715, "global_step": 100639, "epoch": 1212} {"train_loss": -21.662839889526367, "global_step": 100640, "epoch": 1212} {"train_loss": -22.087514877319336, "global_step": 100641, "epoch": 1212} {"train_loss": -21.563983917236328, "global_step": 100642, "epoch": 1212} {"train_loss": -21.607336044311523, "global_step": 100643, "epoch": 1212} {"train_loss": -21.91737174987793, "global_step": 100644, "epoch": 1212} {"train_loss": -21.838552474975586, "global_step": 100645, "epoch": 1212} {"train_loss": -21.732833862304688, "global_step": 100646, "epoch": 1212} {"train_loss": -21.798267364501953, "global_step": 100647, "epoch": 1212} {"train_loss": -21.53957176208496, "global_step": 100648, "epoch": 1212} {"train_loss": -21.76116943359375, "global_step": 100649, "epoch": 1212} {"train_loss": -22.2202091217041, "global_step": 100650, "epoch": 1212} {"train_loss": -21.794538497924805, "global_step": 100651, "epoch": 1212} {"train_loss": -21.96092414855957, "global_step": 100652, "epoch": 1212} {"train_loss": -21.656126022338867, "global_step": 100653, "epoch": 1212} {"train_loss": -21.636301040649414, "global_step": 100654, "epoch": 1212} {"train_loss": -21.589231491088867, "global_step": 100655, "epoch": 1212} {"train_loss": -22.29773712158203, "global_step": 100656, "epoch": 1212} {"train_loss": -22.12469482421875, "global_step": 100657, "epoch": 1212} {"train_loss": -21.74566650390625, "global_step": 100658, "epoch": 1212} {"train_loss": -22.090492248535156, "global_step": 100659, "epoch": 1212} {"train_loss": -21.706466674804688, "global_step": 100660, "epoch": 1212} {"train_loss": -21.713943481445312, "global_step": 100661, "epoch": 1212} {"train_loss": -21.39326286315918, "global_step": 100662, "epoch": 1212} {"train_loss": -21.84462547302246, "global_step": 100663, "epoch": 1212} {"train_loss": -22.480609893798828, "global_step": 100664, "epoch": 1212} {"train_loss": -21.971923828125, "global_step": 100665, "epoch": 1212} {"train_loss": -21.448200225830078, "global_step": 100666, "epoch": 1212} {"train_loss": -21.88433265686035, "global_step": 100667, "epoch": 1212} {"train_loss": -22.024539947509766, "global_step": 100668, "epoch": 1212} {"train_loss": -21.927143096923828, "global_step": 100669, "epoch": 1212} {"train_loss": -21.700096130371094, "global_step": 100670, "epoch": 1212} {"train_loss": -22.140954971313477, "global_step": 100671, "epoch": 1212} {"train_loss": -21.849925994873047, "global_step": 100672, "epoch": 1212} {"train_loss": -21.740314483642578, "global_step": 100673, "epoch": 1212} {"train_loss": -22.17230987548828, "global_step": 100674, "epoch": 1212} {"train_loss": -21.935867309570312, "global_step": 100675, "epoch": 1212} {"train_loss": -22.282148361206055, "global_step": 100676, "epoch": 1212} {"train_loss": -22.004301071166992, "global_step": 100677, "epoch": 1212} {"train_loss": -21.83682917399579, "global_step": 100678, "epoch": 1212, "val_loss": 6044355.0} {"train_loss": -21.336149215698242, "global_step": 100679, "epoch": 1213} {"train_loss": -21.838211059570312, "global_step": 100680, "epoch": 1213} {"train_loss": -21.342275619506836, "global_step": 100681, "epoch": 1213} {"train_loss": -21.307231903076172, "global_step": 100682, "epoch": 1213} {"train_loss": -21.219572067260742, "global_step": 100683, "epoch": 1213} {"train_loss": -21.550703048706055, "global_step": 100684, "epoch": 1213} {"train_loss": -21.878376007080078, "global_step": 100685, "epoch": 1213} {"train_loss": -21.773366928100586, "global_step": 100686, "epoch": 1213} {"train_loss": -21.506423950195312, "global_step": 100687, "epoch": 1213} {"train_loss": -21.64566421508789, "global_step": 100688, "epoch": 1213} {"train_loss": -21.56318473815918, "global_step": 100689, "epoch": 1213} {"train_loss": -21.2480411529541, "global_step": 100690, "epoch": 1213} {"train_loss": -21.90187644958496, "global_step": 100691, "epoch": 1213} {"train_loss": -21.60015869140625, "global_step": 100692, "epoch": 1213} {"train_loss": -21.860916137695312, "global_step": 100693, "epoch": 1213} {"train_loss": -21.967741012573242, "global_step": 100694, "epoch": 1213} {"train_loss": -21.776277542114258, "global_step": 100695, "epoch": 1213} {"train_loss": -21.58231544494629, "global_step": 100696, "epoch": 1213} {"train_loss": -21.84366798400879, "global_step": 100697, "epoch": 1213} {"train_loss": -21.821014404296875, "global_step": 100698, "epoch": 1213} {"train_loss": -22.163772583007812, "global_step": 100699, "epoch": 1213} {"train_loss": -21.50987434387207, "global_step": 100700, "epoch": 1213} {"train_loss": -21.819265365600586, "global_step": 100701, "epoch": 1213} {"train_loss": -21.97537612915039, "global_step": 100702, "epoch": 1213} {"train_loss": -22.113019943237305, "global_step": 100703, "epoch": 1213} {"train_loss": -21.80389976501465, "global_step": 100704, "epoch": 1213} {"train_loss": -22.074207305908203, "global_step": 100705, "epoch": 1213} {"train_loss": -21.873685836791992, "global_step": 100706, "epoch": 1213} {"train_loss": -21.878129959106445, "global_step": 100707, "epoch": 1213} {"train_loss": -21.498254776000977, "global_step": 100708, "epoch": 1213} {"train_loss": -21.970930099487305, "global_step": 100709, "epoch": 1213} {"train_loss": -22.183156967163086, "global_step": 100710, "epoch": 1213} {"train_loss": -21.544973373413086, "global_step": 100711, "epoch": 1213} {"train_loss": -21.9022216796875, "global_step": 100712, "epoch": 1213} {"train_loss": -22.02145767211914, "global_step": 100713, "epoch": 1213} {"train_loss": -21.93697166442871, "global_step": 100714, "epoch": 1213} {"train_loss": -21.519489288330078, "global_step": 100715, "epoch": 1213} {"train_loss": -21.859397888183594, "global_step": 100716, "epoch": 1213} {"train_loss": -22.229537963867188, "global_step": 100717, "epoch": 1213} {"train_loss": -21.866697311401367, "global_step": 100718, "epoch": 1213} {"train_loss": -21.44587516784668, "global_step": 100719, "epoch": 1213} {"train_loss": -21.9989070892334, "global_step": 100720, "epoch": 1213} {"train_loss": -21.848285675048828, "global_step": 100721, "epoch": 1213} {"train_loss": -21.842744827270508, "global_step": 100722, "epoch": 1213} {"train_loss": -21.819984436035156, "global_step": 100723, "epoch": 1213} {"train_loss": -22.02578353881836, "global_step": 100724, "epoch": 1213} {"train_loss": -21.867919921875, "global_step": 100725, "epoch": 1213} {"train_loss": -22.002531051635742, "global_step": 100726, "epoch": 1213} {"train_loss": -21.737327575683594, "global_step": 100727, "epoch": 1213} {"train_loss": -21.80975341796875, "global_step": 100728, "epoch": 1213} {"train_loss": -21.924747467041016, "global_step": 100729, "epoch": 1213} {"train_loss": -22.014572143554688, "global_step": 100730, "epoch": 1213} {"train_loss": -21.662931442260742, "global_step": 100731, "epoch": 1213} {"train_loss": -22.06796646118164, "global_step": 100732, "epoch": 1213} {"train_loss": -21.940401077270508, "global_step": 100733, "epoch": 1213} {"train_loss": -21.44974708557129, "global_step": 100734, "epoch": 1213} {"train_loss": -21.8148193359375, "global_step": 100735, "epoch": 1213} {"train_loss": -21.57392692565918, "global_step": 100736, "epoch": 1213} {"train_loss": -21.880552291870117, "global_step": 100737, "epoch": 1213} {"train_loss": -21.45784568786621, "global_step": 100738, "epoch": 1213} {"train_loss": -21.82826042175293, "global_step": 100739, "epoch": 1213} {"train_loss": -22.08617401123047, "global_step": 100740, "epoch": 1213} {"train_loss": -21.898202896118164, "global_step": 100741, "epoch": 1213} {"train_loss": -21.836410522460938, "global_step": 100742, "epoch": 1213} {"train_loss": -21.79664421081543, "global_step": 100743, "epoch": 1213} {"train_loss": -21.760963439941406, "global_step": 100744, "epoch": 1213} {"train_loss": -22.318044662475586, "global_step": 100745, "epoch": 1213} {"train_loss": -21.719104766845703, "global_step": 100746, "epoch": 1213} {"train_loss": -21.721521377563477, "global_step": 100747, "epoch": 1213} {"train_loss": -21.89459800720215, "global_step": 100748, "epoch": 1213} {"train_loss": -21.616872787475586, "global_step": 100749, "epoch": 1213} {"train_loss": -21.852413177490234, "global_step": 100750, "epoch": 1213} {"train_loss": -22.071897506713867, "global_step": 100751, "epoch": 1213} {"train_loss": -21.74985694885254, "global_step": 100752, "epoch": 1213} {"train_loss": -21.861547470092773, "global_step": 100753, "epoch": 1213} {"train_loss": -21.924575805664062, "global_step": 100754, "epoch": 1213} {"train_loss": -22.032339096069336, "global_step": 100755, "epoch": 1213} {"train_loss": -22.09601402282715, "global_step": 100756, "epoch": 1213} {"train_loss": -22.04855728149414, "global_step": 100757, "epoch": 1213} {"train_loss": -22.048187255859375, "global_step": 100758, "epoch": 1213} {"train_loss": -22.009960174560547, "global_step": 100759, "epoch": 1213} {"train_loss": -22.262500762939453, "global_step": 100760, "epoch": 1213} {"train_loss": -21.81326130786574, "global_step": 100761, "epoch": 1213, "val_loss": 6036903.0} {"train_loss": -21.61504364013672, "global_step": 100762, "epoch": 1214} {"train_loss": -21.87616539001465, "global_step": 100763, "epoch": 1214} {"train_loss": -21.467769622802734, "global_step": 100764, "epoch": 1214} {"train_loss": -21.615354537963867, "global_step": 100765, "epoch": 1214} {"train_loss": -21.775344848632812, "global_step": 100766, "epoch": 1214} {"train_loss": -21.666044235229492, "global_step": 100767, "epoch": 1214} {"train_loss": -21.883344650268555, "global_step": 100768, "epoch": 1214} {"train_loss": -21.841161727905273, "global_step": 100769, "epoch": 1214} {"train_loss": -21.607696533203125, "global_step": 100770, "epoch": 1214} {"train_loss": -21.811939239501953, "global_step": 100771, "epoch": 1214} {"train_loss": -21.820539474487305, "global_step": 100772, "epoch": 1214} {"train_loss": -21.92411231994629, "global_step": 100773, "epoch": 1214} {"train_loss": -21.89388084411621, "global_step": 100774, "epoch": 1214} {"train_loss": -22.03352928161621, "global_step": 100775, "epoch": 1214} {"train_loss": -22.0711727142334, "global_step": 100776, "epoch": 1214} {"train_loss": -22.076732635498047, "global_step": 100777, "epoch": 1214} {"train_loss": -21.72610855102539, "global_step": 100778, "epoch": 1214} {"train_loss": -21.78238296508789, "global_step": 100779, "epoch": 1214} {"train_loss": -21.42698097229004, "global_step": 100780, "epoch": 1214} {"train_loss": -21.4656982421875, "global_step": 100781, "epoch": 1214} {"train_loss": -21.760971069335938, "global_step": 100782, "epoch": 1214} {"train_loss": -21.932371139526367, "global_step": 100783, "epoch": 1214} {"train_loss": -21.884519577026367, "global_step": 100784, "epoch": 1214} {"train_loss": -22.043933868408203, "global_step": 100785, "epoch": 1214} {"train_loss": -21.86809539794922, "global_step": 100786, "epoch": 1214} {"train_loss": -22.31986427307129, "global_step": 100787, "epoch": 1214} {"train_loss": -22.004404067993164, "global_step": 100788, "epoch": 1214} {"train_loss": -21.873567581176758, "global_step": 100789, "epoch": 1214} {"train_loss": -21.912233352661133, "global_step": 100790, "epoch": 1214} {"train_loss": -21.92449951171875, "global_step": 100791, "epoch": 1214} {"train_loss": -21.97406578063965, "global_step": 100792, "epoch": 1214} {"train_loss": -21.938634872436523, "global_step": 100793, "epoch": 1214} {"train_loss": -21.84137725830078, "global_step": 100794, "epoch": 1214} {"train_loss": -21.988235473632812, "global_step": 100795, "epoch": 1214} {"train_loss": -21.916133880615234, "global_step": 100796, "epoch": 1214} {"train_loss": -21.47881507873535, "global_step": 100797, "epoch": 1214} {"train_loss": -21.801010131835938, "global_step": 100798, "epoch": 1214} {"train_loss": -21.373493194580078, "global_step": 100799, "epoch": 1214} {"train_loss": -21.758501052856445, "global_step": 100800, "epoch": 1214} {"train_loss": -22.2470703125, "global_step": 100801, "epoch": 1214} {"train_loss": -21.974407196044922, "global_step": 100802, "epoch": 1214} {"train_loss": -21.830659866333008, "global_step": 100803, "epoch": 1214} {"train_loss": -22.23099136352539, "global_step": 100804, "epoch": 1214} {"train_loss": -21.715429306030273, "global_step": 100805, "epoch": 1214} {"train_loss": -21.911396026611328, "global_step": 100806, "epoch": 1214} {"train_loss": -22.10894203186035, "global_step": 100807, "epoch": 1214} {"train_loss": -22.064697265625, "global_step": 100808, "epoch": 1214} {"train_loss": -21.98048973083496, "global_step": 100809, "epoch": 1214} {"train_loss": -22.051687240600586, "global_step": 100810, "epoch": 1214} {"train_loss": -21.958532333374023, "global_step": 100811, "epoch": 1214} {"train_loss": -21.972936630249023, "global_step": 100812, "epoch": 1214} {"train_loss": -22.099828720092773, "global_step": 100813, "epoch": 1214} {"train_loss": -22.018863677978516, "global_step": 100814, "epoch": 1214} {"train_loss": -21.831161499023438, "global_step": 100815, "epoch": 1214} {"train_loss": -22.140047073364258, "global_step": 100816, "epoch": 1214} {"train_loss": -22.190492630004883, "global_step": 100817, "epoch": 1214} {"train_loss": -21.79609489440918, "global_step": 100818, "epoch": 1214} {"train_loss": -21.9200439453125, "global_step": 100819, "epoch": 1214} {"train_loss": -22.02797508239746, "global_step": 100820, "epoch": 1214} {"train_loss": -22.113691329956055, "global_step": 100821, "epoch": 1214} {"train_loss": -21.657276153564453, "global_step": 100822, "epoch": 1214} {"train_loss": -21.97022247314453, "global_step": 100823, "epoch": 1214} {"train_loss": -21.93234634399414, "global_step": 100824, "epoch": 1214} {"train_loss": -22.01873207092285, "global_step": 100825, "epoch": 1214} {"train_loss": -21.946319580078125, "global_step": 100826, "epoch": 1214} {"train_loss": -22.060945510864258, "global_step": 100827, "epoch": 1214} {"train_loss": -22.020483016967773, "global_step": 100828, "epoch": 1214} {"train_loss": -22.319259643554688, "global_step": 100829, "epoch": 1214} {"train_loss": -22.214466094970703, "global_step": 100830, "epoch": 1214} {"train_loss": -21.818246841430664, "global_step": 100831, "epoch": 1214} {"train_loss": -22.07022476196289, "global_step": 100832, "epoch": 1214} {"train_loss": -21.901472091674805, "global_step": 100833, "epoch": 1214} {"train_loss": -21.76360511779785, "global_step": 100834, "epoch": 1214} {"train_loss": -22.065702438354492, "global_step": 100835, "epoch": 1214} {"train_loss": -22.251319885253906, "global_step": 100836, "epoch": 1214} {"train_loss": -21.569021224975586, "global_step": 100837, "epoch": 1214} {"train_loss": -22.04484748840332, "global_step": 100838, "epoch": 1214} {"train_loss": -21.874862670898438, "global_step": 100839, "epoch": 1214} {"train_loss": -21.920654296875, "global_step": 100840, "epoch": 1214} {"train_loss": -21.615829467773438, "global_step": 100841, "epoch": 1214} {"train_loss": -22.259510040283203, "global_step": 100842, "epoch": 1214} {"train_loss": -21.698598861694336, "global_step": 100843, "epoch": 1214} {"train_loss": -21.90318530438894, "global_step": 100844, "epoch": 1214, "val_loss": 6284707.0} {"train_loss": -21.794540405273438, "global_step": 100845, "epoch": 1215} {"train_loss": -21.9588623046875, "global_step": 100846, "epoch": 1215} {"train_loss": -21.178388595581055, "global_step": 100847, "epoch": 1215} {"train_loss": -21.83449935913086, "global_step": 100848, "epoch": 1215} {"train_loss": -21.39129066467285, "global_step": 100849, "epoch": 1215} {"train_loss": -21.57734489440918, "global_step": 100850, "epoch": 1215} {"train_loss": -21.974056243896484, "global_step": 100851, "epoch": 1215} {"train_loss": -21.568252563476562, "global_step": 100852, "epoch": 1215} {"train_loss": -21.644052505493164, "global_step": 100853, "epoch": 1215} {"train_loss": -21.974191665649414, "global_step": 100854, "epoch": 1215} {"train_loss": -21.46246910095215, "global_step": 100855, "epoch": 1215} {"train_loss": -22.21375846862793, "global_step": 100856, "epoch": 1215} {"train_loss": -21.49640464782715, "global_step": 100857, "epoch": 1215} {"train_loss": -21.775039672851562, "global_step": 100858, "epoch": 1215} {"train_loss": -21.807464599609375, "global_step": 100859, "epoch": 1215} {"train_loss": -21.68291664123535, "global_step": 100860, "epoch": 1215} {"train_loss": -21.82919692993164, "global_step": 100861, "epoch": 1215} {"train_loss": -22.080692291259766, "global_step": 100862, "epoch": 1215} {"train_loss": -22.001785278320312, "global_step": 100863, "epoch": 1215} {"train_loss": -22.11268424987793, "global_step": 100864, "epoch": 1215} {"train_loss": -21.666318893432617, "global_step": 100865, "epoch": 1215} {"train_loss": -21.893537521362305, "global_step": 100866, "epoch": 1215} {"train_loss": -21.83538246154785, "global_step": 100867, "epoch": 1215} {"train_loss": -22.189056396484375, "global_step": 100868, "epoch": 1215} {"train_loss": -22.097976684570312, "global_step": 100869, "epoch": 1215} {"train_loss": -22.434921264648438, "global_step": 100870, "epoch": 1215} {"train_loss": -22.15188980102539, "global_step": 100871, "epoch": 1215} {"train_loss": -21.74990463256836, "global_step": 100872, "epoch": 1215} {"train_loss": -22.297632217407227, "global_step": 100873, "epoch": 1215} {"train_loss": -21.69277000427246, "global_step": 100874, "epoch": 1215} {"train_loss": -21.95414924621582, "global_step": 100875, "epoch": 1215} {"train_loss": -22.389375686645508, "global_step": 100876, "epoch": 1215} {"train_loss": -22.032194137573242, "global_step": 100877, "epoch": 1215} {"train_loss": -22.2930850982666, "global_step": 100878, "epoch": 1215} {"train_loss": -22.11903190612793, "global_step": 100879, "epoch": 1215} {"train_loss": -21.52274513244629, "global_step": 100880, "epoch": 1215} {"train_loss": -21.59832763671875, "global_step": 100881, "epoch": 1215} {"train_loss": -22.15155029296875, "global_step": 100882, "epoch": 1215} {"train_loss": -22.050689697265625, "global_step": 100883, "epoch": 1215} {"train_loss": -21.6444091796875, "global_step": 100884, "epoch": 1215} {"train_loss": -21.629749298095703, "global_step": 100885, "epoch": 1215} {"train_loss": -22.28126335144043, "global_step": 100886, "epoch": 1215} {"train_loss": -21.718265533447266, "global_step": 100887, "epoch": 1215} {"train_loss": -22.34671401977539, "global_step": 100888, "epoch": 1215} {"train_loss": -21.883399963378906, "global_step": 100889, "epoch": 1215} {"train_loss": -22.189298629760742, "global_step": 100890, "epoch": 1215} {"train_loss": -22.041763305664062, "global_step": 100891, "epoch": 1215} {"train_loss": -21.591934204101562, "global_step": 100892, "epoch": 1215} {"train_loss": -21.546560287475586, "global_step": 100893, "epoch": 1215} {"train_loss": -21.658557891845703, "global_step": 100894, "epoch": 1215} {"train_loss": -22.18938636779785, "global_step": 100895, "epoch": 1215} {"train_loss": -21.874317169189453, "global_step": 100896, "epoch": 1215} {"train_loss": -22.129215240478516, "global_step": 100897, "epoch": 1215} {"train_loss": -21.72266960144043, "global_step": 100898, "epoch": 1215} {"train_loss": -21.790237426757812, "global_step": 100899, "epoch": 1215} {"train_loss": -22.52408218383789, "global_step": 100900, "epoch": 1215} {"train_loss": -21.99167251586914, "global_step": 100901, "epoch": 1215} {"train_loss": -22.20450210571289, "global_step": 100902, "epoch": 1215} {"train_loss": -21.775535583496094, "global_step": 100903, "epoch": 1215} {"train_loss": -22.157419204711914, "global_step": 100904, "epoch": 1215} {"train_loss": -21.974851608276367, "global_step": 100905, "epoch": 1215} {"train_loss": -22.1281681060791, "global_step": 100906, "epoch": 1215} {"train_loss": -21.982084274291992, "global_step": 100907, "epoch": 1215} {"train_loss": -22.092939376831055, "global_step": 100908, "epoch": 1215} {"train_loss": -21.978652954101562, "global_step": 100909, "epoch": 1215} {"train_loss": -22.504873275756836, "global_step": 100910, "epoch": 1215} {"train_loss": -22.075407028198242, "global_step": 100911, "epoch": 1215} {"train_loss": -21.55342674255371, "global_step": 100912, "epoch": 1215} {"train_loss": -21.88966941833496, "global_step": 100913, "epoch": 1215} {"train_loss": -21.963869094848633, "global_step": 100914, "epoch": 1215} {"train_loss": -21.892751693725586, "global_step": 100915, "epoch": 1215} {"train_loss": -22.271074295043945, "global_step": 100916, "epoch": 1215} {"train_loss": -21.708402633666992, "global_step": 100917, "epoch": 1215} {"train_loss": -21.95840835571289, "global_step": 100918, "epoch": 1215} {"train_loss": -22.20890998840332, "global_step": 100919, "epoch": 1215} {"train_loss": -21.723526000976562, "global_step": 100920, "epoch": 1215} {"train_loss": -22.090173721313477, "global_step": 100921, "epoch": 1215} {"train_loss": -21.892353057861328, "global_step": 100922, "epoch": 1215} {"train_loss": -22.014297485351562, "global_step": 100923, "epoch": 1215} {"train_loss": -21.93268394470215, "global_step": 100924, "epoch": 1215} {"train_loss": -21.932575225830078, "global_step": 100925, "epoch": 1215} {"train_loss": -21.664106369018555, "global_step": 100926, "epoch": 1215} {"train_loss": -21.92060465985034, "global_step": 100927, "epoch": 1215, "val_loss": 6178726.0} {"train_loss": -21.270883560180664, "global_step": 100928, "epoch": 1216} {"train_loss": -21.731191635131836, "global_step": 100929, "epoch": 1216} {"train_loss": -21.618722915649414, "global_step": 100930, "epoch": 1216} {"train_loss": -21.738685607910156, "global_step": 100931, "epoch": 1216} {"train_loss": -21.749568939208984, "global_step": 100932, "epoch": 1216} {"train_loss": -21.82624626159668, "global_step": 100933, "epoch": 1216} {"train_loss": -21.827810287475586, "global_step": 100934, "epoch": 1216} {"train_loss": -21.675649642944336, "global_step": 100935, "epoch": 1216} {"train_loss": -21.888269424438477, "global_step": 100936, "epoch": 1216} {"train_loss": -21.93739891052246, "global_step": 100937, "epoch": 1216} {"train_loss": -22.124897003173828, "global_step": 100938, "epoch": 1216} {"train_loss": -21.881933212280273, "global_step": 100939, "epoch": 1216} {"train_loss": -21.84182357788086, "global_step": 100940, "epoch": 1216} {"train_loss": -21.72524642944336, "global_step": 100941, "epoch": 1216} {"train_loss": -21.748010635375977, "global_step": 100942, "epoch": 1216} {"train_loss": -21.833463668823242, "global_step": 100943, "epoch": 1216} {"train_loss": -21.863718032836914, "global_step": 100944, "epoch": 1216} {"train_loss": -21.582101821899414, "global_step": 100945, "epoch": 1216} {"train_loss": -21.95650291442871, "global_step": 100946, "epoch": 1216} {"train_loss": -21.77613639831543, "global_step": 100947, "epoch": 1216} {"train_loss": -21.731414794921875, "global_step": 100948, "epoch": 1216} {"train_loss": -22.102466583251953, "global_step": 100949, "epoch": 1216} {"train_loss": -21.69525718688965, "global_step": 100950, "epoch": 1216} {"train_loss": -22.266952514648438, "global_step": 100951, "epoch": 1216} {"train_loss": -21.820974349975586, "global_step": 100952, "epoch": 1216} {"train_loss": -22.027271270751953, "global_step": 100953, "epoch": 1216} {"train_loss": -21.915206909179688, "global_step": 100954, "epoch": 1216} {"train_loss": -22.110008239746094, "global_step": 100955, "epoch": 1216} {"train_loss": -22.004337310791016, "global_step": 100956, "epoch": 1216} {"train_loss": -21.884159088134766, "global_step": 100957, "epoch": 1216} {"train_loss": -22.13277244567871, "global_step": 100958, "epoch": 1216} {"train_loss": -22.07688331604004, "global_step": 100959, "epoch": 1216} {"train_loss": -21.826343536376953, "global_step": 100960, "epoch": 1216} {"train_loss": -21.751134872436523, "global_step": 100961, "epoch": 1216} {"train_loss": -21.847761154174805, "global_step": 100962, "epoch": 1216} {"train_loss": -22.177358627319336, "global_step": 100963, "epoch": 1216} {"train_loss": -21.793380737304688, "global_step": 100964, "epoch": 1216} {"train_loss": -21.616647720336914, "global_step": 100965, "epoch": 1216} {"train_loss": -21.87140655517578, "global_step": 100966, "epoch": 1216} {"train_loss": -21.57708740234375, "global_step": 100967, "epoch": 1216} {"train_loss": -22.16254234313965, "global_step": 100968, "epoch": 1216} {"train_loss": -21.79525375366211, "global_step": 100969, "epoch": 1216} {"train_loss": -21.669376373291016, "global_step": 100970, "epoch": 1216} {"train_loss": -21.860029220581055, "global_step": 100971, "epoch": 1216} {"train_loss": -21.86309051513672, "global_step": 100972, "epoch": 1216} {"train_loss": -22.258657455444336, "global_step": 100973, "epoch": 1216} {"train_loss": -21.741992950439453, "global_step": 100974, "epoch": 1216} {"train_loss": -21.912107467651367, "global_step": 100975, "epoch": 1216} {"train_loss": -21.770429611206055, "global_step": 100976, "epoch": 1216} {"train_loss": -21.781606674194336, "global_step": 100977, "epoch": 1216} {"train_loss": -22.17255210876465, "global_step": 100978, "epoch": 1216} {"train_loss": -21.926279067993164, "global_step": 100979, "epoch": 1216} {"train_loss": -21.749475479125977, "global_step": 100980, "epoch": 1216} {"train_loss": -21.836009979248047, "global_step": 100981, "epoch": 1216} {"train_loss": -22.247411727905273, "global_step": 100982, "epoch": 1216} {"train_loss": -21.924047470092773, "global_step": 100983, "epoch": 1216} {"train_loss": -21.363117218017578, "global_step": 100984, "epoch": 1216} {"train_loss": -21.703588485717773, "global_step": 100985, "epoch": 1216} {"train_loss": -21.942808151245117, "global_step": 100986, "epoch": 1216} {"train_loss": -22.068971633911133, "global_step": 100987, "epoch": 1216} {"train_loss": -21.796201705932617, "global_step": 100988, "epoch": 1216} {"train_loss": -22.190229415893555, "global_step": 100989, "epoch": 1216} {"train_loss": -21.999971389770508, "global_step": 100990, "epoch": 1216} {"train_loss": -21.93663215637207, "global_step": 100991, "epoch": 1216} {"train_loss": -22.334585189819336, "global_step": 100992, "epoch": 1216} {"train_loss": -21.805532455444336, "global_step": 100993, "epoch": 1216} {"train_loss": -22.260305404663086, "global_step": 100994, "epoch": 1216} {"train_loss": -22.147602081298828, "global_step": 100995, "epoch": 1216} {"train_loss": -22.294647216796875, "global_step": 100996, "epoch": 1216} {"train_loss": -21.9407958984375, "global_step": 100997, "epoch": 1216} {"train_loss": -22.427322387695312, "global_step": 100998, "epoch": 1216} {"train_loss": -22.22797203063965, "global_step": 100999, "epoch": 1216} {"train_loss": -21.636106491088867, "global_step": 101000, "epoch": 1216} {"train_loss": -21.814250946044922, "global_step": 101001, "epoch": 1216} {"train_loss": -22.053571701049805, "global_step": 101002, "epoch": 1216} {"train_loss": -21.98158836364746, "global_step": 101003, "epoch": 1216} {"train_loss": -21.9918270111084, "global_step": 101004, "epoch": 1216} {"train_loss": -21.714553833007812, "global_step": 101005, "epoch": 1216} {"train_loss": -22.292272567749023, "global_step": 101006, "epoch": 1216} {"train_loss": -22.110319137573242, "global_step": 101007, "epoch": 1216} {"train_loss": -21.995473861694336, "global_step": 101008, "epoch": 1216} {"train_loss": -22.131772994995117, "global_step": 101009, "epoch": 1216} {"train_loss": -21.91078140074948, "global_step": 101010, "epoch": 1216, "val_loss": 6192116.0} {"train_loss": -21.900272369384766, "global_step": 101011, "epoch": 1217} {"train_loss": -21.64955711364746, "global_step": 101012, "epoch": 1217} {"train_loss": -21.571563720703125, "global_step": 101013, "epoch": 1217} {"train_loss": -22.00082778930664, "global_step": 101014, "epoch": 1217} {"train_loss": -22.077505111694336, "global_step": 101015, "epoch": 1217} {"train_loss": -22.045093536376953, "global_step": 101016, "epoch": 1217} {"train_loss": -21.812707901000977, "global_step": 101017, "epoch": 1217} {"train_loss": -22.060026168823242, "global_step": 101018, "epoch": 1217} {"train_loss": -21.961082458496094, "global_step": 101019, "epoch": 1217} {"train_loss": -21.64236831665039, "global_step": 101020, "epoch": 1217} {"train_loss": -21.79608726501465, "global_step": 101021, "epoch": 1217} {"train_loss": -22.0335750579834, "global_step": 101022, "epoch": 1217} {"train_loss": -21.873056411743164, "global_step": 101023, "epoch": 1217} {"train_loss": -21.840864181518555, "global_step": 101024, "epoch": 1217} {"train_loss": -21.8121337890625, "global_step": 101025, "epoch": 1217} {"train_loss": -21.644298553466797, "global_step": 101026, "epoch": 1217} {"train_loss": -22.374643325805664, "global_step": 101027, "epoch": 1217} {"train_loss": -21.814661026000977, "global_step": 101028, "epoch": 1217} {"train_loss": -22.160123825073242, "global_step": 101029, "epoch": 1217} {"train_loss": -22.038923263549805, "global_step": 101030, "epoch": 1217} {"train_loss": -22.088958740234375, "global_step": 101031, "epoch": 1217} {"train_loss": -22.211132049560547, "global_step": 101032, "epoch": 1217} {"train_loss": -22.032894134521484, "global_step": 101033, "epoch": 1217} {"train_loss": -22.03564453125, "global_step": 101034, "epoch": 1217} {"train_loss": -22.151466369628906, "global_step": 101035, "epoch": 1217} {"train_loss": -21.821828842163086, "global_step": 101036, "epoch": 1217} {"train_loss": -21.727331161499023, "global_step": 101037, "epoch": 1217} {"train_loss": -22.099002838134766, "global_step": 101038, "epoch": 1217} {"train_loss": -21.76629066467285, "global_step": 101039, "epoch": 1217} {"train_loss": -21.51963996887207, "global_step": 101040, "epoch": 1217} {"train_loss": -21.834869384765625, "global_step": 101041, "epoch": 1217} {"train_loss": -21.6201171875, "global_step": 101042, "epoch": 1217} {"train_loss": -22.25574493408203, "global_step": 101043, "epoch": 1217} {"train_loss": -21.745975494384766, "global_step": 101044, "epoch": 1217} {"train_loss": -21.952537536621094, "global_step": 101045, "epoch": 1217} {"train_loss": -22.019304275512695, "global_step": 101046, "epoch": 1217} {"train_loss": -21.813919067382812, "global_step": 101047, "epoch": 1217} {"train_loss": -21.781522750854492, "global_step": 101048, "epoch": 1217} {"train_loss": -22.019744873046875, "global_step": 101049, "epoch": 1217} {"train_loss": -22.128210067749023, "global_step": 101050, "epoch": 1217} {"train_loss": -21.846952438354492, "global_step": 101051, "epoch": 1217} {"train_loss": -22.185827255249023, "global_step": 101052, "epoch": 1217} {"train_loss": -22.107263565063477, "global_step": 101053, "epoch": 1217} {"train_loss": -22.04121971130371, "global_step": 101054, "epoch": 1217} {"train_loss": -21.80555534362793, "global_step": 101055, "epoch": 1217} {"train_loss": -21.61163330078125, "global_step": 101056, "epoch": 1217} {"train_loss": -21.760791778564453, "global_step": 101057, "epoch": 1217} {"train_loss": -22.160741806030273, "global_step": 101058, "epoch": 1217} {"train_loss": -21.816190719604492, "global_step": 101059, "epoch": 1217} {"train_loss": -21.93623161315918, "global_step": 101060, "epoch": 1217} {"train_loss": -22.10406494140625, "global_step": 101061, "epoch": 1217} {"train_loss": -21.712434768676758, "global_step": 101062, "epoch": 1217} {"train_loss": -22.436227798461914, "global_step": 101063, "epoch": 1217} {"train_loss": -22.14173698425293, "global_step": 101064, "epoch": 1217} {"train_loss": -22.43916130065918, "global_step": 101065, "epoch": 1217} {"train_loss": -22.20077896118164, "global_step": 101066, "epoch": 1217} {"train_loss": -22.144500732421875, "global_step": 101067, "epoch": 1217} {"train_loss": -21.950214385986328, "global_step": 101068, "epoch": 1217} {"train_loss": -21.66056251525879, "global_step": 101069, "epoch": 1217} {"train_loss": -22.229137420654297, "global_step": 101070, "epoch": 1217} {"train_loss": -21.950971603393555, "global_step": 101071, "epoch": 1217} {"train_loss": -22.004980087280273, "global_step": 101072, "epoch": 1217} {"train_loss": -22.05006980895996, "global_step": 101073, "epoch": 1217} {"train_loss": -22.090850830078125, "global_step": 101074, "epoch": 1217} {"train_loss": -22.11655044555664, "global_step": 101075, "epoch": 1217} {"train_loss": -22.182764053344727, "global_step": 101076, "epoch": 1217} {"train_loss": -22.195209503173828, "global_step": 101077, "epoch": 1217} {"train_loss": -21.906211853027344, "global_step": 101078, "epoch": 1217} {"train_loss": -22.312307357788086, "global_step": 101079, "epoch": 1217} {"train_loss": -22.000926971435547, "global_step": 101080, "epoch": 1217} {"train_loss": -21.56099510192871, "global_step": 101081, "epoch": 1217} {"train_loss": -22.0220890045166, "global_step": 101082, "epoch": 1217} {"train_loss": -21.79636573791504, "global_step": 101083, "epoch": 1217} {"train_loss": -21.658843994140625, "global_step": 101084, "epoch": 1217} {"train_loss": -22.410552978515625, "global_step": 101085, "epoch": 1217} {"train_loss": -21.88237190246582, "global_step": 101086, "epoch": 1217} {"train_loss": -22.129531860351562, "global_step": 101087, "epoch": 1217} {"train_loss": -21.839324951171875, "global_step": 101088, "epoch": 1217} {"train_loss": -22.058744430541992, "global_step": 101089, "epoch": 1217} {"train_loss": -21.70755958557129, "global_step": 101090, "epoch": 1217} {"train_loss": -21.69973373413086, "global_step": 101091, "epoch": 1217} {"train_loss": -22.12992286682129, "global_step": 101092, "epoch": 1217} {"train_loss": -21.964159264621966, "global_step": 101093, "epoch": 1217, "val_loss": 6129683.5} {"train_loss": -21.743459701538086, "global_step": 101094, "epoch": 1218} {"train_loss": -21.785079956054688, "global_step": 101095, "epoch": 1218} {"train_loss": -21.472448348999023, "global_step": 101096, "epoch": 1218} {"train_loss": -21.51268196105957, "global_step": 101097, "epoch": 1218} {"train_loss": -21.134023666381836, "global_step": 101098, "epoch": 1218} {"train_loss": -21.838031768798828, "global_step": 101099, "epoch": 1218} {"train_loss": -21.510854721069336, "global_step": 101100, "epoch": 1218} {"train_loss": -21.54371452331543, "global_step": 101101, "epoch": 1218} {"train_loss": -21.486310958862305, "global_step": 101102, "epoch": 1218} {"train_loss": -22.11320686340332, "global_step": 101103, "epoch": 1218} {"train_loss": -21.731111526489258, "global_step": 101104, "epoch": 1218} {"train_loss": -22.024259567260742, "global_step": 101105, "epoch": 1218} {"train_loss": -21.370763778686523, "global_step": 101106, "epoch": 1218} {"train_loss": -21.898038864135742, "global_step": 101107, "epoch": 1218} {"train_loss": -21.63080406188965, "global_step": 101108, "epoch": 1218} {"train_loss": -21.58743667602539, "global_step": 101109, "epoch": 1218} {"train_loss": -21.967517852783203, "global_step": 101110, "epoch": 1218} {"train_loss": -21.5949764251709, "global_step": 101111, "epoch": 1218} {"train_loss": -21.981603622436523, "global_step": 101112, "epoch": 1218} {"train_loss": -21.74503517150879, "global_step": 101113, "epoch": 1218} {"train_loss": -21.99089241027832, "global_step": 101114, "epoch": 1218} {"train_loss": -21.88169288635254, "global_step": 101115, "epoch": 1218} {"train_loss": -21.84465217590332, "global_step": 101116, "epoch": 1218} {"train_loss": -21.927675247192383, "global_step": 101117, "epoch": 1218} {"train_loss": -21.97452735900879, "global_step": 101118, "epoch": 1218} {"train_loss": -21.706317901611328, "global_step": 101119, "epoch": 1218} {"train_loss": -22.06117057800293, "global_step": 101120, "epoch": 1218} {"train_loss": -22.098201751708984, "global_step": 101121, "epoch": 1218} {"train_loss": -22.196176528930664, "global_step": 101122, "epoch": 1218} {"train_loss": -22.22867774963379, "global_step": 101123, "epoch": 1218} {"train_loss": -21.933032989501953, "global_step": 101124, "epoch": 1218} {"train_loss": -21.740468978881836, "global_step": 101125, "epoch": 1218} {"train_loss": -22.058744430541992, "global_step": 101126, "epoch": 1218} {"train_loss": -22.17087745666504, "global_step": 101127, "epoch": 1218} {"train_loss": -21.994421005249023, "global_step": 101128, "epoch": 1218} {"train_loss": -21.89454460144043, "global_step": 101129, "epoch": 1218} {"train_loss": -21.718069076538086, "global_step": 101130, "epoch": 1218} {"train_loss": -21.70071792602539, "global_step": 101131, "epoch": 1218} {"train_loss": -21.64168357849121, "global_step": 101132, "epoch": 1218} {"train_loss": -21.805435180664062, "global_step": 101133, "epoch": 1218} {"train_loss": -21.772546768188477, "global_step": 101134, "epoch": 1218} {"train_loss": -21.714067459106445, "global_step": 101135, "epoch": 1218} {"train_loss": -22.22214126586914, "global_step": 101136, "epoch": 1218} {"train_loss": -21.63643455505371, "global_step": 101137, "epoch": 1218} {"train_loss": -21.764673233032227, "global_step": 101138, "epoch": 1218} {"train_loss": -21.89464569091797, "global_step": 101139, "epoch": 1218} {"train_loss": -22.29820442199707, "global_step": 101140, "epoch": 1218} {"train_loss": -22.07548713684082, "global_step": 101141, "epoch": 1218} {"train_loss": -22.185226440429688, "global_step": 101142, "epoch": 1218} {"train_loss": -22.199827194213867, "global_step": 101143, "epoch": 1218} {"train_loss": -21.993085861206055, "global_step": 101144, "epoch": 1218} {"train_loss": -21.925247192382812, "global_step": 101145, "epoch": 1218} {"train_loss": -22.02076530456543, "global_step": 101146, "epoch": 1218} {"train_loss": -21.893720626831055, "global_step": 101147, "epoch": 1218} {"train_loss": -22.151342391967773, "global_step": 101148, "epoch": 1218} {"train_loss": -21.715009689331055, "global_step": 101149, "epoch": 1218} {"train_loss": -22.371030807495117, "global_step": 101150, "epoch": 1218} {"train_loss": -22.016246795654297, "global_step": 101151, "epoch": 1218} {"train_loss": -21.716108322143555, "global_step": 101152, "epoch": 1218} {"train_loss": -21.8720703125, "global_step": 101153, "epoch": 1218} {"train_loss": -21.650358200073242, "global_step": 101154, "epoch": 1218} {"train_loss": -22.034460067749023, "global_step": 101155, "epoch": 1218} {"train_loss": -21.72163963317871, "global_step": 101156, "epoch": 1218} {"train_loss": -22.062414169311523, "global_step": 101157, "epoch": 1218} {"train_loss": -21.912342071533203, "global_step": 101158, "epoch": 1218} {"train_loss": -22.16688346862793, "global_step": 101159, "epoch": 1218} {"train_loss": -22.14118003845215, "global_step": 101160, "epoch": 1218} {"train_loss": -22.385183334350586, "global_step": 101161, "epoch": 1218} {"train_loss": -21.848743438720703, "global_step": 101162, "epoch": 1218} {"train_loss": -22.142723083496094, "global_step": 101163, "epoch": 1218} {"train_loss": -22.2025146484375, "global_step": 101164, "epoch": 1218} {"train_loss": -22.327322006225586, "global_step": 101165, "epoch": 1218} {"train_loss": -21.96441078186035, "global_step": 101166, "epoch": 1218} {"train_loss": -22.01409912109375, "global_step": 101167, "epoch": 1218} {"train_loss": -21.995534896850586, "global_step": 101168, "epoch": 1218} {"train_loss": -21.608564376831055, "global_step": 101169, "epoch": 1218} {"train_loss": -21.670700073242188, "global_step": 101170, "epoch": 1218} {"train_loss": -21.719579696655273, "global_step": 101171, "epoch": 1218} {"train_loss": -21.661970138549805, "global_step": 101172, "epoch": 1218} {"train_loss": -21.637632369995117, "global_step": 101173, "epoch": 1218} {"train_loss": -22.02638053894043, "global_step": 101174, "epoch": 1218} {"train_loss": -21.498626708984375, "global_step": 101175, "epoch": 1218} {"train_loss": -21.88056853880365, "global_step": 101176, "epoch": 1218, "val_loss": 6153673.0} {"train_loss": -21.42922592163086, "global_step": 101177, "epoch": 1219} {"train_loss": -21.900623321533203, "global_step": 101178, "epoch": 1219} {"train_loss": -21.416112899780273, "global_step": 101179, "epoch": 1219} {"train_loss": -21.315635681152344, "global_step": 101180, "epoch": 1219} {"train_loss": -21.8206844329834, "global_step": 101181, "epoch": 1219} {"train_loss": -21.627059936523438, "global_step": 101182, "epoch": 1219} {"train_loss": -21.800626754760742, "global_step": 101183, "epoch": 1219} {"train_loss": -21.914274215698242, "global_step": 101184, "epoch": 1219} {"train_loss": -21.54148292541504, "global_step": 101185, "epoch": 1219} {"train_loss": -21.592580795288086, "global_step": 101186, "epoch": 1219} {"train_loss": -21.698843002319336, "global_step": 101187, "epoch": 1219} {"train_loss": -21.393373489379883, "global_step": 101188, "epoch": 1219} {"train_loss": -21.897062301635742, "global_step": 101189, "epoch": 1219} {"train_loss": -21.678346633911133, "global_step": 101190, "epoch": 1219} {"train_loss": -21.870594024658203, "global_step": 101191, "epoch": 1219} {"train_loss": -21.572607040405273, "global_step": 101192, "epoch": 1219} {"train_loss": -21.684234619140625, "global_step": 101193, "epoch": 1219} {"train_loss": -21.464344024658203, "global_step": 101194, "epoch": 1219} {"train_loss": -21.506818771362305, "global_step": 101195, "epoch": 1219} {"train_loss": -21.67158317565918, "global_step": 101196, "epoch": 1219} {"train_loss": -22.00537109375, "global_step": 101197, "epoch": 1219} {"train_loss": -21.939889907836914, "global_step": 101198, "epoch": 1219} {"train_loss": -21.82533836364746, "global_step": 101199, "epoch": 1219} {"train_loss": -21.805076599121094, "global_step": 101200, "epoch": 1219} {"train_loss": -21.36863136291504, "global_step": 101201, "epoch": 1219} {"train_loss": -21.96108055114746, "global_step": 101202, "epoch": 1219} {"train_loss": -22.152427673339844, "global_step": 101203, "epoch": 1219} {"train_loss": -21.76717758178711, "global_step": 101204, "epoch": 1219} {"train_loss": -22.004688262939453, "global_step": 101205, "epoch": 1219} {"train_loss": -22.013639450073242, "global_step": 101206, "epoch": 1219} {"train_loss": -21.693809509277344, "global_step": 101207, "epoch": 1219} {"train_loss": -21.975372314453125, "global_step": 101208, "epoch": 1219} {"train_loss": -22.126218795776367, "global_step": 101209, "epoch": 1219} {"train_loss": -21.791122436523438, "global_step": 101210, "epoch": 1219} {"train_loss": -21.965970993041992, "global_step": 101211, "epoch": 1219} {"train_loss": -21.93788719177246, "global_step": 101212, "epoch": 1219} {"train_loss": -21.78074073791504, "global_step": 101213, "epoch": 1219} {"train_loss": -22.51563262939453, "global_step": 101214, "epoch": 1219} {"train_loss": -21.891019821166992, "global_step": 101215, "epoch": 1219} {"train_loss": -22.219778060913086, "global_step": 101216, "epoch": 1219} {"train_loss": -21.838027954101562, "global_step": 101217, "epoch": 1219} {"train_loss": -22.183393478393555, "global_step": 101218, "epoch": 1219} {"train_loss": -21.9801082611084, "global_step": 101219, "epoch": 1219} {"train_loss": -21.99987030029297, "global_step": 101220, "epoch": 1219} {"train_loss": -22.231412887573242, "global_step": 101221, "epoch": 1219} {"train_loss": -21.981107711791992, "global_step": 101222, "epoch": 1219} {"train_loss": -22.315114974975586, "global_step": 101223, "epoch": 1219} {"train_loss": -21.91080093383789, "global_step": 101224, "epoch": 1219} {"train_loss": -21.83326530456543, "global_step": 101225, "epoch": 1219} {"train_loss": -22.029531478881836, "global_step": 101226, "epoch": 1219} {"train_loss": -21.848846435546875, "global_step": 101227, "epoch": 1219} {"train_loss": -22.041767120361328, "global_step": 101228, "epoch": 1219} {"train_loss": -22.1663761138916, "global_step": 101229, "epoch": 1219} {"train_loss": -22.010116577148438, "global_step": 101230, "epoch": 1219} {"train_loss": -21.950428009033203, "global_step": 101231, "epoch": 1219} {"train_loss": -22.145008087158203, "global_step": 101232, "epoch": 1219} {"train_loss": -22.194673538208008, "global_step": 101233, "epoch": 1219} {"train_loss": -21.855342864990234, "global_step": 101234, "epoch": 1219} {"train_loss": -22.050994873046875, "global_step": 101235, "epoch": 1219} {"train_loss": -22.423982620239258, "global_step": 101236, "epoch": 1219} {"train_loss": -22.211210250854492, "global_step": 101237, "epoch": 1219} {"train_loss": -21.741104125976562, "global_step": 101238, "epoch": 1219} {"train_loss": -21.85273551940918, "global_step": 101239, "epoch": 1219} {"train_loss": -21.937944412231445, "global_step": 101240, "epoch": 1219} {"train_loss": -22.130529403686523, "global_step": 101241, "epoch": 1219} {"train_loss": -21.84694480895996, "global_step": 101242, "epoch": 1219} {"train_loss": -21.79356575012207, "global_step": 101243, "epoch": 1219} {"train_loss": -22.21693992614746, "global_step": 101244, "epoch": 1219} {"train_loss": -22.147436141967773, "global_step": 101245, "epoch": 1219} {"train_loss": -22.13926124572754, "global_step": 101246, "epoch": 1219} {"train_loss": -22.106643676757812, "global_step": 101247, "epoch": 1219} {"train_loss": -22.040184020996094, "global_step": 101248, "epoch": 1219} {"train_loss": -22.459264755249023, "global_step": 101249, "epoch": 1219} {"train_loss": -22.49889373779297, "global_step": 101250, "epoch": 1219} {"train_loss": -21.997690200805664, "global_step": 101251, "epoch": 1219} {"train_loss": -22.1518611907959, "global_step": 101252, "epoch": 1219} {"train_loss": -22.302902221679688, "global_step": 101253, "epoch": 1219} {"train_loss": -21.964630126953125, "global_step": 101254, "epoch": 1219} {"train_loss": -21.874353408813477, "global_step": 101255, "epoch": 1219} {"train_loss": -22.17378807067871, "global_step": 101256, "epoch": 1219} {"train_loss": -21.85079002380371, "global_step": 101257, "epoch": 1219} {"train_loss": -21.71355628967285, "global_step": 101258, "epoch": 1219} {"train_loss": -21.920466618365552, "global_step": 101259, "epoch": 1219, "val_loss": 6073894.0} {"train_loss": -21.662113189697266, "global_step": 101260, "epoch": 1220} {"train_loss": -21.911176681518555, "global_step": 101261, "epoch": 1220} {"train_loss": -21.880115509033203, "global_step": 101262, "epoch": 1220} {"train_loss": -21.70237922668457, "global_step": 101263, "epoch": 1220} {"train_loss": -21.799217224121094, "global_step": 101264, "epoch": 1220} {"train_loss": -21.712263107299805, "global_step": 101265, "epoch": 1220} {"train_loss": -21.414859771728516, "global_step": 101266, "epoch": 1220} {"train_loss": -21.922378540039062, "global_step": 101267, "epoch": 1220} {"train_loss": -22.12668228149414, "global_step": 101268, "epoch": 1220} {"train_loss": -21.949735641479492, "global_step": 101269, "epoch": 1220} {"train_loss": -21.9044189453125, "global_step": 101270, "epoch": 1220} {"train_loss": -21.77569580078125, "global_step": 101271, "epoch": 1220} {"train_loss": -22.13592529296875, "global_step": 101272, "epoch": 1220} {"train_loss": -21.773969650268555, "global_step": 101273, "epoch": 1220} {"train_loss": -22.172473907470703, "global_step": 101274, "epoch": 1220} {"train_loss": -21.988859176635742, "global_step": 101275, "epoch": 1220} {"train_loss": -21.73343276977539, "global_step": 101276, "epoch": 1220} {"train_loss": -22.103967666625977, "global_step": 101277, "epoch": 1220} {"train_loss": -21.7004337310791, "global_step": 101278, "epoch": 1220} {"train_loss": -21.871097564697266, "global_step": 101279, "epoch": 1220} {"train_loss": -21.851070404052734, "global_step": 101280, "epoch": 1220} {"train_loss": -22.08648681640625, "global_step": 101281, "epoch": 1220} {"train_loss": -22.310636520385742, "global_step": 101282, "epoch": 1220} {"train_loss": -22.112638473510742, "global_step": 101283, "epoch": 1220} {"train_loss": -21.76617431640625, "global_step": 101284, "epoch": 1220} {"train_loss": -21.631834030151367, "global_step": 101285, "epoch": 1220} {"train_loss": -21.911157608032227, "global_step": 101286, "epoch": 1220} {"train_loss": -21.794710159301758, "global_step": 101287, "epoch": 1220} {"train_loss": -21.75250244140625, "global_step": 101288, "epoch": 1220} {"train_loss": -21.88392448425293, "global_step": 101289, "epoch": 1220} {"train_loss": -21.720983505249023, "global_step": 101290, "epoch": 1220} {"train_loss": -22.028417587280273, "global_step": 101291, "epoch": 1220} {"train_loss": -22.086641311645508, "global_step": 101292, "epoch": 1220} {"train_loss": -21.640165328979492, "global_step": 101293, "epoch": 1220} {"train_loss": -21.98093605041504, "global_step": 101294, "epoch": 1220} {"train_loss": -21.642635345458984, "global_step": 101295, "epoch": 1220} {"train_loss": -21.97214698791504, "global_step": 101296, "epoch": 1220} {"train_loss": -21.96379852294922, "global_step": 101297, "epoch": 1220} {"train_loss": -21.958105087280273, "global_step": 101298, "epoch": 1220} {"train_loss": -21.96132469177246, "global_step": 101299, "epoch": 1220} {"train_loss": -21.988677978515625, "global_step": 101300, "epoch": 1220} {"train_loss": -22.236881256103516, "global_step": 101301, "epoch": 1220} {"train_loss": -22.0766544342041, "global_step": 101302, "epoch": 1220} {"train_loss": -21.763105392456055, "global_step": 101303, "epoch": 1220} {"train_loss": -21.94478416442871, "global_step": 101304, "epoch": 1220} {"train_loss": -21.94182777404785, "global_step": 101305, "epoch": 1220} {"train_loss": -22.133106231689453, "global_step": 101306, "epoch": 1220} {"train_loss": -22.191625595092773, "global_step": 101307, "epoch": 1220} {"train_loss": -22.174678802490234, "global_step": 101308, "epoch": 1220} {"train_loss": -21.779048919677734, "global_step": 101309, "epoch": 1220} {"train_loss": -21.75046157836914, "global_step": 101310, "epoch": 1220} {"train_loss": -22.140993118286133, "global_step": 101311, "epoch": 1220} {"train_loss": -22.292240142822266, "global_step": 101312, "epoch": 1220} {"train_loss": -21.714094161987305, "global_step": 101313, "epoch": 1220} {"train_loss": -22.0745792388916, "global_step": 101314, "epoch": 1220} {"train_loss": -21.78034019470215, "global_step": 101315, "epoch": 1220} {"train_loss": -22.079145431518555, "global_step": 101316, "epoch": 1220} {"train_loss": -21.7761173248291, "global_step": 101317, "epoch": 1220} {"train_loss": -21.88167381286621, "global_step": 101318, "epoch": 1220} {"train_loss": -21.785892486572266, "global_step": 101319, "epoch": 1220} {"train_loss": -21.699100494384766, "global_step": 101320, "epoch": 1220} {"train_loss": -22.027624130249023, "global_step": 101321, "epoch": 1220} {"train_loss": -22.12696647644043, "global_step": 101322, "epoch": 1220} {"train_loss": -21.82976722717285, "global_step": 101323, "epoch": 1220} {"train_loss": -21.861032485961914, "global_step": 101324, "epoch": 1220} {"train_loss": -22.202733993530273, "global_step": 101325, "epoch": 1220} {"train_loss": -22.349838256835938, "global_step": 101326, "epoch": 1220} {"train_loss": -21.917346954345703, "global_step": 101327, "epoch": 1220} {"train_loss": -22.246501922607422, "global_step": 101328, "epoch": 1220} {"train_loss": -22.02499771118164, "global_step": 101329, "epoch": 1220} {"train_loss": -22.14270782470703, "global_step": 101330, "epoch": 1220} {"train_loss": -22.16530418395996, "global_step": 101331, "epoch": 1220} {"train_loss": -22.28706932067871, "global_step": 101332, "epoch": 1220} {"train_loss": -21.905080795288086, "global_step": 101333, "epoch": 1220} {"train_loss": -21.891462326049805, "global_step": 101334, "epoch": 1220} {"train_loss": -21.95881462097168, "global_step": 101335, "epoch": 1220} {"train_loss": -22.313720703125, "global_step": 101336, "epoch": 1220} {"train_loss": -22.0241641998291, "global_step": 101337, "epoch": 1220} {"train_loss": -21.868528366088867, "global_step": 101338, "epoch": 1220} {"train_loss": -22.00052261352539, "global_step": 101339, "epoch": 1220} {"train_loss": -21.831533432006836, "global_step": 101340, "epoch": 1220} {"train_loss": -22.046255111694336, "global_step": 101341, "epoch": 1220} {"train_loss": -21.950178996626153, "global_step": 101342, "epoch": 1220, "val_loss": 6149151.0} {"train_loss": -22.12167739868164, "global_step": 101343, "epoch": 1221} {"train_loss": -21.912763595581055, "global_step": 101344, "epoch": 1221} {"train_loss": -21.615354537963867, "global_step": 101345, "epoch": 1221} {"train_loss": -21.57717514038086, "global_step": 101346, "epoch": 1221} {"train_loss": -21.684568405151367, "global_step": 101347, "epoch": 1221} {"train_loss": -21.930927276611328, "global_step": 101348, "epoch": 1221} {"train_loss": -21.357824325561523, "global_step": 101349, "epoch": 1221} {"train_loss": -21.586166381835938, "global_step": 101350, "epoch": 1221} {"train_loss": -21.624032974243164, "global_step": 101351, "epoch": 1221} {"train_loss": -21.792606353759766, "global_step": 101352, "epoch": 1221} {"train_loss": -21.658710479736328, "global_step": 101353, "epoch": 1221} {"train_loss": -21.200029373168945, "global_step": 101354, "epoch": 1221} {"train_loss": -21.62245750427246, "global_step": 101355, "epoch": 1221} {"train_loss": -21.32805633544922, "global_step": 101356, "epoch": 1221} {"train_loss": -21.428220748901367, "global_step": 101357, "epoch": 1221} {"train_loss": -21.716230392456055, "global_step": 101358, "epoch": 1221} {"train_loss": -21.30508804321289, "global_step": 101359, "epoch": 1221} {"train_loss": -21.775829315185547, "global_step": 101360, "epoch": 1221} {"train_loss": -21.205297470092773, "global_step": 101361, "epoch": 1221} {"train_loss": -21.757944107055664, "global_step": 101362, "epoch": 1221} {"train_loss": -21.611631393432617, "global_step": 101363, "epoch": 1221} {"train_loss": -21.841012954711914, "global_step": 101364, "epoch": 1221} {"train_loss": -21.675573348999023, "global_step": 101365, "epoch": 1221} {"train_loss": -22.17367172241211, "global_step": 101366, "epoch": 1221} {"train_loss": -21.68514060974121, "global_step": 101367, "epoch": 1221} {"train_loss": -21.61332893371582, "global_step": 101368, "epoch": 1221} {"train_loss": -21.76531219482422, "global_step": 101369, "epoch": 1221} {"train_loss": -21.65096092224121, "global_step": 101370, "epoch": 1221} {"train_loss": -21.97559928894043, "global_step": 101371, "epoch": 1221} {"train_loss": -21.835494995117188, "global_step": 101372, "epoch": 1221} {"train_loss": -21.705448150634766, "global_step": 101373, "epoch": 1221} {"train_loss": -21.821027755737305, "global_step": 101374, "epoch": 1221} {"train_loss": -21.797821044921875, "global_step": 101375, "epoch": 1221} {"train_loss": -22.0022029876709, "global_step": 101376, "epoch": 1221} {"train_loss": -22.166812896728516, "global_step": 101377, "epoch": 1221} {"train_loss": -21.9849853515625, "global_step": 101378, "epoch": 1221} {"train_loss": -22.159780502319336, "global_step": 101379, "epoch": 1221} {"train_loss": -21.960180282592773, "global_step": 101380, "epoch": 1221} {"train_loss": -21.68267250061035, "global_step": 101381, "epoch": 1221} {"train_loss": -22.072772979736328, "global_step": 101382, "epoch": 1221} {"train_loss": -21.79909896850586, "global_step": 101383, "epoch": 1221} {"train_loss": -22.31495475769043, "global_step": 101384, "epoch": 1221} {"train_loss": -21.95172119140625, "global_step": 101385, "epoch": 1221} {"train_loss": -21.823806762695312, "global_step": 101386, "epoch": 1221} {"train_loss": -22.047901153564453, "global_step": 101387, "epoch": 1221} {"train_loss": -22.093833923339844, "global_step": 101388, "epoch": 1221} {"train_loss": -22.02809715270996, "global_step": 101389, "epoch": 1221} {"train_loss": -22.07948112487793, "global_step": 101390, "epoch": 1221} {"train_loss": -21.991270065307617, "global_step": 101391, "epoch": 1221} {"train_loss": -21.918495178222656, "global_step": 101392, "epoch": 1221} {"train_loss": -22.1397762298584, "global_step": 101393, "epoch": 1221} {"train_loss": -21.987096786499023, "global_step": 101394, "epoch": 1221} {"train_loss": -22.0227108001709, "global_step": 101395, "epoch": 1221} {"train_loss": -21.531230926513672, "global_step": 101396, "epoch": 1221} {"train_loss": -21.786298751831055, "global_step": 101397, "epoch": 1221} {"train_loss": -22.098892211914062, "global_step": 101398, "epoch": 1221} {"train_loss": -22.216638565063477, "global_step": 101399, "epoch": 1221} {"train_loss": -21.789453506469727, "global_step": 101400, "epoch": 1221} {"train_loss": -22.278806686401367, "global_step": 101401, "epoch": 1221} {"train_loss": -22.358182907104492, "global_step": 101402, "epoch": 1221} {"train_loss": -21.903898239135742, "global_step": 101403, "epoch": 1221} {"train_loss": -22.393476486206055, "global_step": 101404, "epoch": 1221} {"train_loss": -21.905521392822266, "global_step": 101405, "epoch": 1221} {"train_loss": -22.23487091064453, "global_step": 101406, "epoch": 1221} {"train_loss": -22.092313766479492, "global_step": 101407, "epoch": 1221} {"train_loss": -21.983566284179688, "global_step": 101408, "epoch": 1221} {"train_loss": -22.153074264526367, "global_step": 101409, "epoch": 1221} {"train_loss": -22.086669921875, "global_step": 101410, "epoch": 1221} {"train_loss": -21.996559143066406, "global_step": 101411, "epoch": 1221} {"train_loss": -21.968847274780273, "global_step": 101412, "epoch": 1221} {"train_loss": -21.96742820739746, "global_step": 101413, "epoch": 1221} {"train_loss": -22.105670928955078, "global_step": 101414, "epoch": 1221} {"train_loss": -21.84548568725586, "global_step": 101415, "epoch": 1221} {"train_loss": -22.123239517211914, "global_step": 101416, "epoch": 1221} {"train_loss": -22.213897705078125, "global_step": 101417, "epoch": 1221} {"train_loss": -22.05118751525879, "global_step": 101418, "epoch": 1221} {"train_loss": -21.613309860229492, "global_step": 101419, "epoch": 1221} {"train_loss": -21.81174659729004, "global_step": 101420, "epoch": 1221} {"train_loss": -22.075847625732422, "global_step": 101421, "epoch": 1221} {"train_loss": -21.88834571838379, "global_step": 101422, "epoch": 1221} {"train_loss": -22.138395309448242, "global_step": 101423, "epoch": 1221} {"train_loss": -22.129701614379883, "global_step": 101424, "epoch": 1221} {"train_loss": -21.871788162782966, "global_step": 101425, "epoch": 1221, "val_loss": 6470210.0} {"train_loss": -20.672956466674805, "global_step": 101426, "epoch": 1222} {"train_loss": -21.512874603271484, "global_step": 101427, "epoch": 1222} {"train_loss": -21.196775436401367, "global_step": 101428, "epoch": 1222} {"train_loss": -21.364967346191406, "global_step": 101429, "epoch": 1222} {"train_loss": -20.630491256713867, "global_step": 101430, "epoch": 1222} {"train_loss": -21.561065673828125, "global_step": 101431, "epoch": 1222} {"train_loss": -21.010250091552734, "global_step": 101432, "epoch": 1222} {"train_loss": -21.458751678466797, "global_step": 101433, "epoch": 1222} {"train_loss": -21.57796287536621, "global_step": 101434, "epoch": 1222} {"train_loss": -21.57828140258789, "global_step": 101435, "epoch": 1222} {"train_loss": -21.27309226989746, "global_step": 101436, "epoch": 1222} {"train_loss": -21.630155563354492, "global_step": 101437, "epoch": 1222} {"train_loss": -21.47593879699707, "global_step": 101438, "epoch": 1222} {"train_loss": -21.704757690429688, "global_step": 101439, "epoch": 1222} {"train_loss": -21.863492965698242, "global_step": 101440, "epoch": 1222} {"train_loss": -21.460519790649414, "global_step": 101441, "epoch": 1222} {"train_loss": -21.88711929321289, "global_step": 101442, "epoch": 1222} {"train_loss": -21.62641716003418, "global_step": 101443, "epoch": 1222} {"train_loss": -21.464122772216797, "global_step": 101444, "epoch": 1222} {"train_loss": -21.624618530273438, "global_step": 101445, "epoch": 1222} {"train_loss": -21.754127502441406, "global_step": 101446, "epoch": 1222} {"train_loss": -21.82183837890625, "global_step": 101447, "epoch": 1222} {"train_loss": -21.831497192382812, "global_step": 101448, "epoch": 1222} {"train_loss": -21.856962203979492, "global_step": 101449, "epoch": 1222} {"train_loss": -21.52392578125, "global_step": 101450, "epoch": 1222} {"train_loss": -22.04537582397461, "global_step": 101451, "epoch": 1222} {"train_loss": -21.830406188964844, "global_step": 101452, "epoch": 1222} {"train_loss": -21.684951782226562, "global_step": 101453, "epoch": 1222} {"train_loss": -22.22673988342285, "global_step": 101454, "epoch": 1222} {"train_loss": -22.117826461791992, "global_step": 101455, "epoch": 1222} {"train_loss": -22.1926212310791, "global_step": 101456, "epoch": 1222} {"train_loss": -21.827905654907227, "global_step": 101457, "epoch": 1222} {"train_loss": -22.2159481048584, "global_step": 101458, "epoch": 1222} {"train_loss": -21.97538948059082, "global_step": 101459, "epoch": 1222} {"train_loss": -22.105182647705078, "global_step": 101460, "epoch": 1222} {"train_loss": -21.698530197143555, "global_step": 101461, "epoch": 1222} {"train_loss": -21.30607032775879, "global_step": 101462, "epoch": 1222} {"train_loss": -22.174577713012695, "global_step": 101463, "epoch": 1222} {"train_loss": -21.93453025817871, "global_step": 101464, "epoch": 1222} {"train_loss": -22.103364944458008, "global_step": 101465, "epoch": 1222} {"train_loss": -22.298444747924805, "global_step": 101466, "epoch": 1222} {"train_loss": -21.719697952270508, "global_step": 101467, "epoch": 1222} {"train_loss": -22.112119674682617, "global_step": 101468, "epoch": 1222} {"train_loss": -21.755216598510742, "global_step": 101469, "epoch": 1222} {"train_loss": -21.96363067626953, "global_step": 101470, "epoch": 1222} {"train_loss": -21.86354637145996, "global_step": 101471, "epoch": 1222} {"train_loss": -21.899368286132812, "global_step": 101472, "epoch": 1222} {"train_loss": -21.74868392944336, "global_step": 101473, "epoch": 1222} {"train_loss": -21.983699798583984, "global_step": 101474, "epoch": 1222} {"train_loss": -21.824630737304688, "global_step": 101475, "epoch": 1222} {"train_loss": -21.793264389038086, "global_step": 101476, "epoch": 1222} {"train_loss": -21.91097068786621, "global_step": 101477, "epoch": 1222} {"train_loss": -21.81658363342285, "global_step": 101478, "epoch": 1222} {"train_loss": -22.219099044799805, "global_step": 101479, "epoch": 1222} {"train_loss": -21.48992919921875, "global_step": 101480, "epoch": 1222} {"train_loss": -21.935909271240234, "global_step": 101481, "epoch": 1222} {"train_loss": -22.091289520263672, "global_step": 101482, "epoch": 1222} {"train_loss": -21.90053367614746, "global_step": 101483, "epoch": 1222} {"train_loss": -22.184370040893555, "global_step": 101484, "epoch": 1222} {"train_loss": -22.070119857788086, "global_step": 101485, "epoch": 1222} {"train_loss": -22.038227081298828, "global_step": 101486, "epoch": 1222} {"train_loss": -22.18037223815918, "global_step": 101487, "epoch": 1222} {"train_loss": -22.115198135375977, "global_step": 101488, "epoch": 1222} {"train_loss": -22.017236709594727, "global_step": 101489, "epoch": 1222} {"train_loss": -22.174217224121094, "global_step": 101490, "epoch": 1222} {"train_loss": -21.76160430908203, "global_step": 101491, "epoch": 1222} {"train_loss": -22.315519332885742, "global_step": 101492, "epoch": 1222} {"train_loss": -21.96892738342285, "global_step": 101493, "epoch": 1222} {"train_loss": -22.26218605041504, "global_step": 101494, "epoch": 1222} {"train_loss": -21.968557357788086, "global_step": 101495, "epoch": 1222} {"train_loss": -22.12758445739746, "global_step": 101496, "epoch": 1222} {"train_loss": -22.011856079101562, "global_step": 101497, "epoch": 1222} {"train_loss": -22.19693946838379, "global_step": 101498, "epoch": 1222} {"train_loss": -21.789443969726562, "global_step": 101499, "epoch": 1222} {"train_loss": -22.166120529174805, "global_step": 101500, "epoch": 1222} {"train_loss": -21.769193649291992, "global_step": 101501, "epoch": 1222} {"train_loss": -21.862430572509766, "global_step": 101502, "epoch": 1222} {"train_loss": -22.166019439697266, "global_step": 101503, "epoch": 1222} {"train_loss": -22.06102752685547, "global_step": 101504, "epoch": 1222} {"train_loss": -22.14754295349121, "global_step": 101505, "epoch": 1222} {"train_loss": -22.103290557861328, "global_step": 101506, "epoch": 1222} {"train_loss": -21.91794204711914, "global_step": 101507, "epoch": 1222} {"train_loss": -21.833637789071325, "global_step": 101508, "epoch": 1222, "val_loss": 6208096.0} {"train_loss": -21.394208908081055, "global_step": 101509, "epoch": 1223} {"train_loss": -21.41607093811035, "global_step": 101510, "epoch": 1223} {"train_loss": -21.633018493652344, "global_step": 101511, "epoch": 1223} {"train_loss": -21.461965560913086, "global_step": 101512, "epoch": 1223} {"train_loss": -21.643774032592773, "global_step": 101513, "epoch": 1223} {"train_loss": -21.645645141601562, "global_step": 101514, "epoch": 1223} {"train_loss": -21.699934005737305, "global_step": 101515, "epoch": 1223} {"train_loss": -21.51466178894043, "global_step": 101516, "epoch": 1223} {"train_loss": -21.657812118530273, "global_step": 101517, "epoch": 1223} {"train_loss": -21.95231819152832, "global_step": 101518, "epoch": 1223} {"train_loss": -21.509931564331055, "global_step": 101519, "epoch": 1223} {"train_loss": -21.53511619567871, "global_step": 101520, "epoch": 1223} {"train_loss": -22.012487411499023, "global_step": 101521, "epoch": 1223} {"train_loss": -21.997970581054688, "global_step": 101522, "epoch": 1223} {"train_loss": -21.6557674407959, "global_step": 101523, "epoch": 1223} {"train_loss": -21.762189865112305, "global_step": 101524, "epoch": 1223} {"train_loss": -21.564132690429688, "global_step": 101525, "epoch": 1223} {"train_loss": -21.86860466003418, "global_step": 101526, "epoch": 1223} {"train_loss": -21.80474853515625, "global_step": 101527, "epoch": 1223} {"train_loss": -22.080324172973633, "global_step": 101528, "epoch": 1223} {"train_loss": -21.929920196533203, "global_step": 101529, "epoch": 1223} {"train_loss": -22.087968826293945, "global_step": 101530, "epoch": 1223} {"train_loss": -21.633392333984375, "global_step": 101531, "epoch": 1223} {"train_loss": -21.92679214477539, "global_step": 101532, "epoch": 1223} {"train_loss": -21.56682777404785, "global_step": 101533, "epoch": 1223} {"train_loss": -22.116357803344727, "global_step": 101534, "epoch": 1223} {"train_loss": -21.939647674560547, "global_step": 101535, "epoch": 1223} {"train_loss": -21.92305564880371, "global_step": 101536, "epoch": 1223} {"train_loss": -21.8907470703125, "global_step": 101537, "epoch": 1223} {"train_loss": -22.335933685302734, "global_step": 101538, "epoch": 1223} {"train_loss": -22.07244300842285, "global_step": 101539, "epoch": 1223} {"train_loss": -22.131439208984375, "global_step": 101540, "epoch": 1223} {"train_loss": -21.833602905273438, "global_step": 101541, "epoch": 1223} {"train_loss": -21.912622451782227, "global_step": 101542, "epoch": 1223} {"train_loss": -22.108854293823242, "global_step": 101543, "epoch": 1223} {"train_loss": -22.08647346496582, "global_step": 101544, "epoch": 1223} {"train_loss": -22.082162857055664, "global_step": 101545, "epoch": 1223} {"train_loss": -21.85146141052246, "global_step": 101546, "epoch": 1223} {"train_loss": -22.120716094970703, "global_step": 101547, "epoch": 1223} {"train_loss": -21.814651489257812, "global_step": 101548, "epoch": 1223} {"train_loss": -21.72331428527832, "global_step": 101549, "epoch": 1223} {"train_loss": -21.773672103881836, "global_step": 101550, "epoch": 1223} {"train_loss": -22.307531356811523, "global_step": 101551, "epoch": 1223} {"train_loss": -22.163257598876953, "global_step": 101552, "epoch": 1223} {"train_loss": -22.022510528564453, "global_step": 101553, "epoch": 1223} {"train_loss": -22.14590835571289, "global_step": 101554, "epoch": 1223} {"train_loss": -21.832162857055664, "global_step": 101555, "epoch": 1223} {"train_loss": -21.973655700683594, "global_step": 101556, "epoch": 1223} {"train_loss": -21.82095718383789, "global_step": 101557, "epoch": 1223} {"train_loss": -21.781232833862305, "global_step": 101558, "epoch": 1223} {"train_loss": -21.71170997619629, "global_step": 101559, "epoch": 1223} {"train_loss": -21.7623291015625, "global_step": 101560, "epoch": 1223} {"train_loss": -21.95122528076172, "global_step": 101561, "epoch": 1223} {"train_loss": -21.953367233276367, "global_step": 101562, "epoch": 1223} {"train_loss": -21.93548011779785, "global_step": 101563, "epoch": 1223} {"train_loss": -21.900596618652344, "global_step": 101564, "epoch": 1223} {"train_loss": -21.595521926879883, "global_step": 101565, "epoch": 1223} {"train_loss": -21.811567306518555, "global_step": 101566, "epoch": 1223} {"train_loss": -21.499563217163086, "global_step": 101567, "epoch": 1223} {"train_loss": -22.180593490600586, "global_step": 101568, "epoch": 1223} {"train_loss": -21.896520614624023, "global_step": 101569, "epoch": 1223} {"train_loss": -22.424985885620117, "global_step": 101570, "epoch": 1223} {"train_loss": -21.993717193603516, "global_step": 101571, "epoch": 1223} {"train_loss": -22.114397048950195, "global_step": 101572, "epoch": 1223} {"train_loss": -21.94742202758789, "global_step": 101573, "epoch": 1223} {"train_loss": -22.45902442932129, "global_step": 101574, "epoch": 1223} {"train_loss": -21.86229705810547, "global_step": 101575, "epoch": 1223} {"train_loss": -21.83757781982422, "global_step": 101576, "epoch": 1223} {"train_loss": -21.786779403686523, "global_step": 101577, "epoch": 1223} {"train_loss": -21.889535903930664, "global_step": 101578, "epoch": 1223} {"train_loss": -22.264541625976562, "global_step": 101579, "epoch": 1223} {"train_loss": -21.69001579284668, "global_step": 101580, "epoch": 1223} {"train_loss": -21.982421875, "global_step": 101581, "epoch": 1223} {"train_loss": -22.236295700073242, "global_step": 101582, "epoch": 1223} {"train_loss": -21.36944007873535, "global_step": 101583, "epoch": 1223} {"train_loss": -22.218591690063477, "global_step": 101584, "epoch": 1223} {"train_loss": -21.959091186523438, "global_step": 101585, "epoch": 1223} {"train_loss": -22.26038932800293, "global_step": 101586, "epoch": 1223} {"train_loss": -22.291156768798828, "global_step": 101587, "epoch": 1223} {"train_loss": -22.043048858642578, "global_step": 101588, "epoch": 1223} {"train_loss": -21.921722412109375, "global_step": 101589, "epoch": 1223} {"train_loss": -21.85064125061035, "global_step": 101590, "epoch": 1223} {"train_loss": -21.905260591621857, "global_step": 101591, "epoch": 1223, "val_loss": 6044911.0} {"train_loss": -21.686290740966797, "global_step": 101592, "epoch": 1224} {"train_loss": -21.79302406311035, "global_step": 101593, "epoch": 1224} {"train_loss": -21.471586227416992, "global_step": 101594, "epoch": 1224} {"train_loss": -21.422788619995117, "global_step": 101595, "epoch": 1224} {"train_loss": -21.894826889038086, "global_step": 101596, "epoch": 1224} {"train_loss": -21.505596160888672, "global_step": 101597, "epoch": 1224} {"train_loss": -21.608253479003906, "global_step": 101598, "epoch": 1224} {"train_loss": -21.94626235961914, "global_step": 101599, "epoch": 1224} {"train_loss": -21.728057861328125, "global_step": 101600, "epoch": 1224} {"train_loss": -21.864164352416992, "global_step": 101601, "epoch": 1224} {"train_loss": -21.8829402923584, "global_step": 101602, "epoch": 1224} {"train_loss": -22.262413024902344, "global_step": 101603, "epoch": 1224} {"train_loss": -22.027664184570312, "global_step": 101604, "epoch": 1224} {"train_loss": -21.663022994995117, "global_step": 101605, "epoch": 1224} {"train_loss": -21.800065994262695, "global_step": 101606, "epoch": 1224} {"train_loss": -22.106489181518555, "global_step": 101607, "epoch": 1224} {"train_loss": -21.95163345336914, "global_step": 101608, "epoch": 1224} {"train_loss": -22.08070945739746, "global_step": 101609, "epoch": 1224} {"train_loss": -21.904447555541992, "global_step": 101610, "epoch": 1224} {"train_loss": -22.038869857788086, "global_step": 101611, "epoch": 1224} {"train_loss": -21.88970375061035, "global_step": 101612, "epoch": 1224} {"train_loss": -22.255340576171875, "global_step": 101613, "epoch": 1224} {"train_loss": -22.155710220336914, "global_step": 101614, "epoch": 1224} {"train_loss": -21.88873291015625, "global_step": 101615, "epoch": 1224} {"train_loss": -22.24814224243164, "global_step": 101616, "epoch": 1224} {"train_loss": -22.13093376159668, "global_step": 101617, "epoch": 1224} {"train_loss": -22.648351669311523, "global_step": 101618, "epoch": 1224} {"train_loss": -22.2535400390625, "global_step": 101619, "epoch": 1224} {"train_loss": -22.093442916870117, "global_step": 101620, "epoch": 1224} {"train_loss": -22.0765323638916, "global_step": 101621, "epoch": 1224} {"train_loss": -22.27484130859375, "global_step": 101622, "epoch": 1224} {"train_loss": -21.763059616088867, "global_step": 101623, "epoch": 1224} {"train_loss": -22.017749786376953, "global_step": 101624, "epoch": 1224} {"train_loss": -22.14048194885254, "global_step": 101625, "epoch": 1224} {"train_loss": -21.972747802734375, "global_step": 101626, "epoch": 1224} {"train_loss": -22.017333984375, "global_step": 101627, "epoch": 1224} {"train_loss": -22.23208999633789, "global_step": 101628, "epoch": 1224} {"train_loss": -22.37460708618164, "global_step": 101629, "epoch": 1224} {"train_loss": -22.021564483642578, "global_step": 101630, "epoch": 1224} {"train_loss": -22.413564682006836, "global_step": 101631, "epoch": 1224} {"train_loss": -22.14454460144043, "global_step": 101632, "epoch": 1224} {"train_loss": -22.03768539428711, "global_step": 101633, "epoch": 1224} {"train_loss": -21.77724266052246, "global_step": 101634, "epoch": 1224} {"train_loss": -22.142471313476562, "global_step": 101635, "epoch": 1224} {"train_loss": -22.428844451904297, "global_step": 101636, "epoch": 1224} {"train_loss": -22.32150650024414, "global_step": 101637, "epoch": 1224} {"train_loss": -22.11455535888672, "global_step": 101638, "epoch": 1224} {"train_loss": -21.999526977539062, "global_step": 101639, "epoch": 1224} {"train_loss": -21.706235885620117, "global_step": 101640, "epoch": 1224} {"train_loss": -21.75080680847168, "global_step": 101641, "epoch": 1224} {"train_loss": -21.768512725830078, "global_step": 101642, "epoch": 1224} {"train_loss": -21.8923397064209, "global_step": 101643, "epoch": 1224} {"train_loss": -21.97700309753418, "global_step": 101644, "epoch": 1224} {"train_loss": -22.052593231201172, "global_step": 101645, "epoch": 1224} {"train_loss": -21.858278274536133, "global_step": 101646, "epoch": 1224} {"train_loss": -21.75581169128418, "global_step": 101647, "epoch": 1224} {"train_loss": -21.900970458984375, "global_step": 101648, "epoch": 1224} {"train_loss": -22.108415603637695, "global_step": 101649, "epoch": 1224} {"train_loss": -21.98979949951172, "global_step": 101650, "epoch": 1224} {"train_loss": -21.860639572143555, "global_step": 101651, "epoch": 1224} {"train_loss": -21.944730758666992, "global_step": 101652, "epoch": 1224} {"train_loss": -22.081125259399414, "global_step": 101653, "epoch": 1224} {"train_loss": -22.196218490600586, "global_step": 101654, "epoch": 1224} {"train_loss": -21.661603927612305, "global_step": 101655, "epoch": 1224} {"train_loss": -22.23231315612793, "global_step": 101656, "epoch": 1224} {"train_loss": -22.095321655273438, "global_step": 101657, "epoch": 1224} {"train_loss": -21.850317001342773, "global_step": 101658, "epoch": 1224} {"train_loss": -22.58613395690918, "global_step": 101659, "epoch": 1224} {"train_loss": -21.689701080322266, "global_step": 101660, "epoch": 1224} {"train_loss": -21.97743797302246, "global_step": 101661, "epoch": 1224} {"train_loss": -22.07545280456543, "global_step": 101662, "epoch": 1224} {"train_loss": -22.241825103759766, "global_step": 101663, "epoch": 1224} {"train_loss": -22.013864517211914, "global_step": 101664, "epoch": 1224} {"train_loss": -21.898305892944336, "global_step": 101665, "epoch": 1224} {"train_loss": -21.9773006439209, "global_step": 101666, "epoch": 1224} {"train_loss": -21.802478790283203, "global_step": 101667, "epoch": 1224} {"train_loss": -22.160648345947266, "global_step": 101668, "epoch": 1224} {"train_loss": -21.672372817993164, "global_step": 101669, "epoch": 1224} {"train_loss": -21.58493423461914, "global_step": 101670, "epoch": 1224} {"train_loss": -21.915119171142578, "global_step": 101671, "epoch": 1224} {"train_loss": -22.199426651000977, "global_step": 101672, "epoch": 1224} {"train_loss": -21.98128890991211, "global_step": 101673, "epoch": 1224} {"train_loss": -21.98988742138966, "global_step": 101674, "epoch": 1224, "val_loss": 6019502.0} {"train_loss": -20.725357055664062, "global_step": 101675, "epoch": 1225} {"train_loss": -21.666635513305664, "global_step": 101676, "epoch": 1225} {"train_loss": -20.975418090820312, "global_step": 101677, "epoch": 1225} {"train_loss": -21.76626968383789, "global_step": 101678, "epoch": 1225} {"train_loss": -21.562719345092773, "global_step": 101679, "epoch": 1225} {"train_loss": -21.798358917236328, "global_step": 101680, "epoch": 1225} {"train_loss": -21.40827751159668, "global_step": 101681, "epoch": 1225} {"train_loss": -21.242645263671875, "global_step": 101682, "epoch": 1225} {"train_loss": -21.522573471069336, "global_step": 101683, "epoch": 1225} {"train_loss": -21.78910255432129, "global_step": 101684, "epoch": 1225} {"train_loss": -21.545915603637695, "global_step": 101685, "epoch": 1225} {"train_loss": -21.281579971313477, "global_step": 101686, "epoch": 1225} {"train_loss": -21.587446212768555, "global_step": 101687, "epoch": 1225} {"train_loss": -21.45075798034668, "global_step": 101688, "epoch": 1225} {"train_loss": -21.725833892822266, "global_step": 101689, "epoch": 1225} {"train_loss": -21.617353439331055, "global_step": 101690, "epoch": 1225} {"train_loss": -21.307294845581055, "global_step": 101691, "epoch": 1225} {"train_loss": -22.02056312561035, "global_step": 101692, "epoch": 1225} {"train_loss": -21.57254981994629, "global_step": 101693, "epoch": 1225} {"train_loss": -21.85833168029785, "global_step": 101694, "epoch": 1225} {"train_loss": -21.6147518157959, "global_step": 101695, "epoch": 1225} {"train_loss": -21.331151962280273, "global_step": 101696, "epoch": 1225} {"train_loss": -21.674314498901367, "global_step": 101697, "epoch": 1225} {"train_loss": -21.55881690979004, "global_step": 101698, "epoch": 1225} {"train_loss": -21.70555305480957, "global_step": 101699, "epoch": 1225} {"train_loss": -21.9307861328125, "global_step": 101700, "epoch": 1225} {"train_loss": -21.614477157592773, "global_step": 101701, "epoch": 1225} {"train_loss": -22.012351989746094, "global_step": 101702, "epoch": 1225} {"train_loss": -21.9007625579834, "global_step": 101703, "epoch": 1225} {"train_loss": -22.03166961669922, "global_step": 101704, "epoch": 1225} {"train_loss": -21.85310173034668, "global_step": 101705, "epoch": 1225} {"train_loss": -21.953514099121094, "global_step": 101706, "epoch": 1225} {"train_loss": -21.999252319335938, "global_step": 101707, "epoch": 1225} {"train_loss": -22.04793357849121, "global_step": 101708, "epoch": 1225} {"train_loss": -22.05133056640625, "global_step": 101709, "epoch": 1225} {"train_loss": -21.812915802001953, "global_step": 101710, "epoch": 1225} {"train_loss": -21.97665023803711, "global_step": 101711, "epoch": 1225} {"train_loss": -22.111915588378906, "global_step": 101712, "epoch": 1225} {"train_loss": -21.969167709350586, "global_step": 101713, "epoch": 1225} {"train_loss": -22.22317886352539, "global_step": 101714, "epoch": 1225} {"train_loss": -22.147165298461914, "global_step": 101715, "epoch": 1225} {"train_loss": -22.07309913635254, "global_step": 101716, "epoch": 1225} {"train_loss": -22.000717163085938, "global_step": 101717, "epoch": 1225} {"train_loss": -21.58700942993164, "global_step": 101718, "epoch": 1225} {"train_loss": -22.23638153076172, "global_step": 101719, "epoch": 1225} {"train_loss": -22.14736557006836, "global_step": 101720, "epoch": 1225} {"train_loss": -22.252220153808594, "global_step": 101721, "epoch": 1225} {"train_loss": -22.22321891784668, "global_step": 101722, "epoch": 1225} {"train_loss": -21.827733993530273, "global_step": 101723, "epoch": 1225} {"train_loss": -22.01787567138672, "global_step": 101724, "epoch": 1225} {"train_loss": -21.90424919128418, "global_step": 101725, "epoch": 1225} {"train_loss": -21.751934051513672, "global_step": 101726, "epoch": 1225} {"train_loss": -21.730854034423828, "global_step": 101727, "epoch": 1225} {"train_loss": -21.912948608398438, "global_step": 101728, "epoch": 1225} {"train_loss": -22.339126586914062, "global_step": 101729, "epoch": 1225} {"train_loss": -21.953933715820312, "global_step": 101730, "epoch": 1225} {"train_loss": -21.630897521972656, "global_step": 101731, "epoch": 1225} {"train_loss": -21.895004272460938, "global_step": 101732, "epoch": 1225} {"train_loss": -21.429458618164062, "global_step": 101733, "epoch": 1225} {"train_loss": -21.97038459777832, "global_step": 101734, "epoch": 1225} {"train_loss": -21.804927825927734, "global_step": 101735, "epoch": 1225} {"train_loss": -21.608200073242188, "global_step": 101736, "epoch": 1225} {"train_loss": -21.604827880859375, "global_step": 101737, "epoch": 1225} {"train_loss": -21.674213409423828, "global_step": 101738, "epoch": 1225} {"train_loss": -22.00847816467285, "global_step": 101739, "epoch": 1225} {"train_loss": -22.08757972717285, "global_step": 101740, "epoch": 1225} {"train_loss": -22.008304595947266, "global_step": 101741, "epoch": 1225} {"train_loss": -22.292573928833008, "global_step": 101742, "epoch": 1225} {"train_loss": -21.87554931640625, "global_step": 101743, "epoch": 1225} {"train_loss": -22.0301570892334, "global_step": 101744, "epoch": 1225} {"train_loss": -21.909706115722656, "global_step": 101745, "epoch": 1225} {"train_loss": -22.136241912841797, "global_step": 101746, "epoch": 1225} {"train_loss": -21.862060546875, "global_step": 101747, "epoch": 1225} {"train_loss": -21.9934024810791, "global_step": 101748, "epoch": 1225} {"train_loss": -21.721778869628906, "global_step": 101749, "epoch": 1225} {"train_loss": -22.16521453857422, "global_step": 101750, "epoch": 1225} {"train_loss": -22.06859016418457, "global_step": 101751, "epoch": 1225} {"train_loss": -21.907758712768555, "global_step": 101752, "epoch": 1225} {"train_loss": -21.96482276916504, "global_step": 101753, "epoch": 1225} {"train_loss": -22.19553565979004, "global_step": 101754, "epoch": 1225} {"train_loss": -21.933414459228516, "global_step": 101755, "epoch": 1225} {"train_loss": -22.375659942626953, "global_step": 101756, "epoch": 1225} {"train_loss": -21.83790712471468, "global_step": 101757, "epoch": 1225, "val_loss": 6127646.0} {"train_loss": -21.912296295166016, "global_step": 101758, "epoch": 1226} {"train_loss": -21.554061889648438, "global_step": 101759, "epoch": 1226} {"train_loss": -21.573810577392578, "global_step": 101760, "epoch": 1226} {"train_loss": -21.90838623046875, "global_step": 101761, "epoch": 1226} {"train_loss": -21.820911407470703, "global_step": 101762, "epoch": 1226} {"train_loss": -21.71563720703125, "global_step": 101763, "epoch": 1226} {"train_loss": -21.51862907409668, "global_step": 101764, "epoch": 1226} {"train_loss": -21.7850341796875, "global_step": 101765, "epoch": 1226} {"train_loss": -22.31235694885254, "global_step": 101766, "epoch": 1226} {"train_loss": -21.648792266845703, "global_step": 101767, "epoch": 1226} {"train_loss": -21.884063720703125, "global_step": 101768, "epoch": 1226} {"train_loss": -22.070987701416016, "global_step": 101769, "epoch": 1226} {"train_loss": -21.943981170654297, "global_step": 101770, "epoch": 1226} {"train_loss": -21.704116821289062, "global_step": 101771, "epoch": 1226} {"train_loss": -21.784194946289062, "global_step": 101772, "epoch": 1226} {"train_loss": -22.00027847290039, "global_step": 101773, "epoch": 1226} {"train_loss": -21.88041114807129, "global_step": 101774, "epoch": 1226} {"train_loss": -21.929946899414062, "global_step": 101775, "epoch": 1226} {"train_loss": -21.71869468688965, "global_step": 101776, "epoch": 1226} {"train_loss": -22.15669059753418, "global_step": 101777, "epoch": 1226} {"train_loss": -21.979385375976562, "global_step": 101778, "epoch": 1226} {"train_loss": -22.000940322875977, "global_step": 101779, "epoch": 1226} {"train_loss": -22.049219131469727, "global_step": 101780, "epoch": 1226} {"train_loss": -21.69392204284668, "global_step": 101781, "epoch": 1226} {"train_loss": -22.324277877807617, "global_step": 101782, "epoch": 1226} {"train_loss": -21.92536735534668, "global_step": 101783, "epoch": 1226} {"train_loss": -21.844091415405273, "global_step": 101784, "epoch": 1226} {"train_loss": -21.937509536743164, "global_step": 101785, "epoch": 1226} {"train_loss": -21.857961654663086, "global_step": 101786, "epoch": 1226} {"train_loss": -22.29648780822754, "global_step": 101787, "epoch": 1226} {"train_loss": -21.6822452545166, "global_step": 101788, "epoch": 1226} {"train_loss": -21.94664764404297, "global_step": 101789, "epoch": 1226} {"train_loss": -22.0543212890625, "global_step": 101790, "epoch": 1226} {"train_loss": -21.91120719909668, "global_step": 101791, "epoch": 1226} {"train_loss": -22.204538345336914, "global_step": 101792, "epoch": 1226} {"train_loss": -22.023855209350586, "global_step": 101793, "epoch": 1226} {"train_loss": -22.338132858276367, "global_step": 101794, "epoch": 1226} {"train_loss": -22.085081100463867, "global_step": 101795, "epoch": 1226} {"train_loss": -22.143091201782227, "global_step": 101796, "epoch": 1226} {"train_loss": -22.06861686706543, "global_step": 101797, "epoch": 1226} {"train_loss": -21.953289031982422, "global_step": 101798, "epoch": 1226} {"train_loss": -22.211538314819336, "global_step": 101799, "epoch": 1226} {"train_loss": -21.94137191772461, "global_step": 101800, "epoch": 1226} {"train_loss": -22.034772872924805, "global_step": 101801, "epoch": 1226} {"train_loss": -21.840267181396484, "global_step": 101802, "epoch": 1226} {"train_loss": -21.474515914916992, "global_step": 101803, "epoch": 1226} {"train_loss": -21.62736701965332, "global_step": 101804, "epoch": 1226} {"train_loss": -22.123891830444336, "global_step": 101805, "epoch": 1226} {"train_loss": -22.322296142578125, "global_step": 101806, "epoch": 1226} {"train_loss": -21.749914169311523, "global_step": 101807, "epoch": 1226} {"train_loss": -22.28678321838379, "global_step": 101808, "epoch": 1226} {"train_loss": -22.455135345458984, "global_step": 101809, "epoch": 1226} {"train_loss": -21.961688995361328, "global_step": 101810, "epoch": 1226} {"train_loss": -22.41820526123047, "global_step": 101811, "epoch": 1226} {"train_loss": -21.832595825195312, "global_step": 101812, "epoch": 1226} {"train_loss": -21.262521743774414, "global_step": 101813, "epoch": 1226} {"train_loss": -21.88321304321289, "global_step": 101814, "epoch": 1226} {"train_loss": -22.20018768310547, "global_step": 101815, "epoch": 1226} {"train_loss": -21.66828727722168, "global_step": 101816, "epoch": 1226} {"train_loss": -22.2091007232666, "global_step": 101817, "epoch": 1226} {"train_loss": -21.96668815612793, "global_step": 101818, "epoch": 1226} {"train_loss": -22.172719955444336, "global_step": 101819, "epoch": 1226} {"train_loss": -21.612506866455078, "global_step": 101820, "epoch": 1226} {"train_loss": -21.924091339111328, "global_step": 101821, "epoch": 1226} {"train_loss": -21.96784782409668, "global_step": 101822, "epoch": 1226} {"train_loss": -21.8376407623291, "global_step": 101823, "epoch": 1226} {"train_loss": -21.617414474487305, "global_step": 101824, "epoch": 1226} {"train_loss": -22.142784118652344, "global_step": 101825, "epoch": 1226} {"train_loss": -21.93198013305664, "global_step": 101826, "epoch": 1226} {"train_loss": -21.701631546020508, "global_step": 101827, "epoch": 1226} {"train_loss": -22.159460067749023, "global_step": 101828, "epoch": 1226} {"train_loss": -22.063032150268555, "global_step": 101829, "epoch": 1226} {"train_loss": -22.279600143432617, "global_step": 101830, "epoch": 1226} {"train_loss": -21.870899200439453, "global_step": 101831, "epoch": 1226} {"train_loss": -21.862207412719727, "global_step": 101832, "epoch": 1226} {"train_loss": -22.002439498901367, "global_step": 101833, "epoch": 1226} {"train_loss": -22.167613983154297, "global_step": 101834, "epoch": 1226} {"train_loss": -22.150150299072266, "global_step": 101835, "epoch": 1226} {"train_loss": -22.2153377532959, "global_step": 101836, "epoch": 1226} {"train_loss": -21.983800888061523, "global_step": 101837, "epoch": 1226} {"train_loss": -22.4151611328125, "global_step": 101838, "epoch": 1226} {"train_loss": -22.36367416381836, "global_step": 101839, "epoch": 1226} {"train_loss": -21.96162745464279, "global_step": 101840, "epoch": 1226, "val_loss": 6105123.0} {"train_loss": -21.652711868286133, "global_step": 101841, "epoch": 1227} {"train_loss": -21.53748893737793, "global_step": 101842, "epoch": 1227} {"train_loss": -21.286270141601562, "global_step": 101843, "epoch": 1227} {"train_loss": -22.047548294067383, "global_step": 101844, "epoch": 1227} {"train_loss": -21.602750778198242, "global_step": 101845, "epoch": 1227} {"train_loss": -21.46375846862793, "global_step": 101846, "epoch": 1227} {"train_loss": -22.082006454467773, "global_step": 101847, "epoch": 1227} {"train_loss": -21.944543838500977, "global_step": 101848, "epoch": 1227} {"train_loss": -21.768203735351562, "global_step": 101849, "epoch": 1227} {"train_loss": -22.017152786254883, "global_step": 101850, "epoch": 1227} {"train_loss": -22.24769401550293, "global_step": 101851, "epoch": 1227} {"train_loss": -22.130056381225586, "global_step": 101852, "epoch": 1227} {"train_loss": -22.041946411132812, "global_step": 101853, "epoch": 1227} {"train_loss": -21.831235885620117, "global_step": 101854, "epoch": 1227} {"train_loss": -21.992475509643555, "global_step": 101855, "epoch": 1227} {"train_loss": -21.924636840820312, "global_step": 101856, "epoch": 1227} {"train_loss": -22.09903907775879, "global_step": 101857, "epoch": 1227} {"train_loss": -21.881681442260742, "global_step": 101858, "epoch": 1227} {"train_loss": -21.9937801361084, "global_step": 101859, "epoch": 1227} {"train_loss": -22.061513900756836, "global_step": 101860, "epoch": 1227} {"train_loss": -22.06867790222168, "global_step": 101861, "epoch": 1227} {"train_loss": -21.849756240844727, "global_step": 101862, "epoch": 1227} {"train_loss": -22.022253036499023, "global_step": 101863, "epoch": 1227} {"train_loss": -21.852933883666992, "global_step": 101864, "epoch": 1227} {"train_loss": -21.87102699279785, "global_step": 101865, "epoch": 1227} {"train_loss": -21.950040817260742, "global_step": 101866, "epoch": 1227} {"train_loss": -22.08469581604004, "global_step": 101867, "epoch": 1227} {"train_loss": -21.84620475769043, "global_step": 101868, "epoch": 1227} {"train_loss": -21.993764877319336, "global_step": 101869, "epoch": 1227} {"train_loss": -22.129053115844727, "global_step": 101870, "epoch": 1227} {"train_loss": -22.441904067993164, "global_step": 101871, "epoch": 1227} {"train_loss": -22.216947555541992, "global_step": 101872, "epoch": 1227} {"train_loss": -22.118270874023438, "global_step": 101873, "epoch": 1227} {"train_loss": -21.74466896057129, "global_step": 101874, "epoch": 1227} {"train_loss": -21.782169342041016, "global_step": 101875, "epoch": 1227} {"train_loss": -21.849695205688477, "global_step": 101876, "epoch": 1227} {"train_loss": -22.061737060546875, "global_step": 101877, "epoch": 1227} {"train_loss": -21.969303131103516, "global_step": 101878, "epoch": 1227} {"train_loss": -21.947378158569336, "global_step": 101879, "epoch": 1227} {"train_loss": -21.62544059753418, "global_step": 101880, "epoch": 1227} {"train_loss": -22.37108039855957, "global_step": 101881, "epoch": 1227} {"train_loss": -22.02406120300293, "global_step": 101882, "epoch": 1227} {"train_loss": -22.08466911315918, "global_step": 101883, "epoch": 1227} {"train_loss": -21.804332733154297, "global_step": 101884, "epoch": 1227} {"train_loss": -22.089069366455078, "global_step": 101885, "epoch": 1227} {"train_loss": -22.02103614807129, "global_step": 101886, "epoch": 1227} {"train_loss": -22.11231803894043, "global_step": 101887, "epoch": 1227} {"train_loss": -21.944293975830078, "global_step": 101888, "epoch": 1227} {"train_loss": -21.883005142211914, "global_step": 101889, "epoch": 1227} {"train_loss": -22.16621208190918, "global_step": 101890, "epoch": 1227} {"train_loss": -21.985904693603516, "global_step": 101891, "epoch": 1227} {"train_loss": -21.912954330444336, "global_step": 101892, "epoch": 1227} {"train_loss": -21.985300064086914, "global_step": 101893, "epoch": 1227} {"train_loss": -22.57391929626465, "global_step": 101894, "epoch": 1227} {"train_loss": -22.010303497314453, "global_step": 101895, "epoch": 1227} {"train_loss": -21.643566131591797, "global_step": 101896, "epoch": 1227} {"train_loss": -21.802892684936523, "global_step": 101897, "epoch": 1227} {"train_loss": -21.929433822631836, "global_step": 101898, "epoch": 1227} {"train_loss": -21.968305587768555, "global_step": 101899, "epoch": 1227} {"train_loss": -22.270084381103516, "global_step": 101900, "epoch": 1227} {"train_loss": -21.94472312927246, "global_step": 101901, "epoch": 1227} {"train_loss": -22.253543853759766, "global_step": 101902, "epoch": 1227} {"train_loss": -22.011014938354492, "global_step": 101903, "epoch": 1227} {"train_loss": -22.09556007385254, "global_step": 101904, "epoch": 1227} {"train_loss": -22.20130729675293, "global_step": 101905, "epoch": 1227} {"train_loss": -22.237024307250977, "global_step": 101906, "epoch": 1227} {"train_loss": -21.917890548706055, "global_step": 101907, "epoch": 1227} {"train_loss": -22.036558151245117, "global_step": 101908, "epoch": 1227} {"train_loss": -22.190052032470703, "global_step": 101909, "epoch": 1227} {"train_loss": -22.182050704956055, "global_step": 101910, "epoch": 1227} {"train_loss": -22.437631607055664, "global_step": 101911, "epoch": 1227} {"train_loss": -22.135677337646484, "global_step": 101912, "epoch": 1227} {"train_loss": -22.228830337524414, "global_step": 101913, "epoch": 1227} {"train_loss": -21.840360641479492, "global_step": 101914, "epoch": 1227} {"train_loss": -21.7805233001709, "global_step": 101915, "epoch": 1227} {"train_loss": -22.05368995666504, "global_step": 101916, "epoch": 1227} {"train_loss": -21.864948272705078, "global_step": 101917, "epoch": 1227} {"train_loss": -22.103729248046875, "global_step": 101918, "epoch": 1227} {"train_loss": -22.01380729675293, "global_step": 101919, "epoch": 1227} {"train_loss": -21.67426109313965, "global_step": 101920, "epoch": 1227} {"train_loss": -22.169174194335938, "global_step": 101921, "epoch": 1227} {"train_loss": -22.022489547729492, "global_step": 101922, "epoch": 1227} {"train_loss": -21.9774215882083, "global_step": 101923, "epoch": 1227, "val_loss": 6153083.0} {"train_loss": -21.764455795288086, "global_step": 101924, "epoch": 1228} {"train_loss": -21.910551071166992, "global_step": 101925, "epoch": 1228} {"train_loss": -21.217548370361328, "global_step": 101926, "epoch": 1228} {"train_loss": -21.398460388183594, "global_step": 101927, "epoch": 1228} {"train_loss": -21.595945358276367, "global_step": 101928, "epoch": 1228} {"train_loss": -21.708955764770508, "global_step": 101929, "epoch": 1228} {"train_loss": -21.58551025390625, "global_step": 101930, "epoch": 1228} {"train_loss": -21.67535972595215, "global_step": 101931, "epoch": 1228} {"train_loss": -21.931257247924805, "global_step": 101932, "epoch": 1228} {"train_loss": -21.842941284179688, "global_step": 101933, "epoch": 1228} {"train_loss": -21.915372848510742, "global_step": 101934, "epoch": 1228} {"train_loss": -21.88382339477539, "global_step": 101935, "epoch": 1228} {"train_loss": -21.668094635009766, "global_step": 101936, "epoch": 1228} {"train_loss": -21.834674835205078, "global_step": 101937, "epoch": 1228} {"train_loss": -22.19041633605957, "global_step": 101938, "epoch": 1228} {"train_loss": -21.931976318359375, "global_step": 101939, "epoch": 1228} {"train_loss": -21.795291900634766, "global_step": 101940, "epoch": 1228} {"train_loss": -21.795339584350586, "global_step": 101941, "epoch": 1228} {"train_loss": -22.005924224853516, "global_step": 101942, "epoch": 1228} {"train_loss": -21.99053382873535, "global_step": 101943, "epoch": 1228} {"train_loss": -21.708908081054688, "global_step": 101944, "epoch": 1228} {"train_loss": -22.615198135375977, "global_step": 101945, "epoch": 1228} {"train_loss": -22.066469192504883, "global_step": 101946, "epoch": 1228} {"train_loss": -22.02832794189453, "global_step": 101947, "epoch": 1228} {"train_loss": -21.84564208984375, "global_step": 101948, "epoch": 1228} {"train_loss": -21.927127838134766, "global_step": 101949, "epoch": 1228} {"train_loss": -21.913999557495117, "global_step": 101950, "epoch": 1228} {"train_loss": -21.949310302734375, "global_step": 101951, "epoch": 1228} {"train_loss": -22.056325912475586, "global_step": 101952, "epoch": 1228} {"train_loss": -21.283655166625977, "global_step": 101953, "epoch": 1228} {"train_loss": -21.56590461730957, "global_step": 101954, "epoch": 1228} {"train_loss": -21.974044799804688, "global_step": 101955, "epoch": 1228} {"train_loss": -21.86127281188965, "global_step": 101956, "epoch": 1228} {"train_loss": -21.89082145690918, "global_step": 101957, "epoch": 1228} {"train_loss": -21.812246322631836, "global_step": 101958, "epoch": 1228} {"train_loss": -21.750680923461914, "global_step": 101959, "epoch": 1228} {"train_loss": -21.92433738708496, "global_step": 101960, "epoch": 1228} {"train_loss": -21.408510208129883, "global_step": 101961, "epoch": 1228} {"train_loss": -21.75201988220215, "global_step": 101962, "epoch": 1228} {"train_loss": -21.40973472595215, "global_step": 101963, "epoch": 1228} {"train_loss": -21.84699058532715, "global_step": 101964, "epoch": 1228} {"train_loss": -21.7633113861084, "global_step": 101965, "epoch": 1228} {"train_loss": -21.855819702148438, "global_step": 101966, "epoch": 1228} {"train_loss": -22.23761749267578, "global_step": 101967, "epoch": 1228} {"train_loss": -22.22955322265625, "global_step": 101968, "epoch": 1228} {"train_loss": -21.815269470214844, "global_step": 101969, "epoch": 1228} {"train_loss": -21.822450637817383, "global_step": 101970, "epoch": 1228} {"train_loss": -21.88549041748047, "global_step": 101971, "epoch": 1228} {"train_loss": -22.075435638427734, "global_step": 101972, "epoch": 1228} {"train_loss": -22.04481315612793, "global_step": 101973, "epoch": 1228} {"train_loss": -21.948501586914062, "global_step": 101974, "epoch": 1228} {"train_loss": -22.33903694152832, "global_step": 101975, "epoch": 1228} {"train_loss": -22.019819259643555, "global_step": 101976, "epoch": 1228} {"train_loss": -21.926166534423828, "global_step": 101977, "epoch": 1228} {"train_loss": -21.830244064331055, "global_step": 101978, "epoch": 1228} {"train_loss": -21.799612045288086, "global_step": 101979, "epoch": 1228} {"train_loss": -22.071210861206055, "global_step": 101980, "epoch": 1228} {"train_loss": -22.009902954101562, "global_step": 101981, "epoch": 1228} {"train_loss": -21.956899642944336, "global_step": 101982, "epoch": 1228} {"train_loss": -22.063093185424805, "global_step": 101983, "epoch": 1228} {"train_loss": -22.04421043395996, "global_step": 101984, "epoch": 1228} {"train_loss": -21.893657684326172, "global_step": 101985, "epoch": 1228} {"train_loss": -21.901601791381836, "global_step": 101986, "epoch": 1228} {"train_loss": -22.09000015258789, "global_step": 101987, "epoch": 1228} {"train_loss": -22.040897369384766, "global_step": 101988, "epoch": 1228} {"train_loss": -21.82099151611328, "global_step": 101989, "epoch": 1228} {"train_loss": -22.03958511352539, "global_step": 101990, "epoch": 1228} {"train_loss": -21.70697593688965, "global_step": 101991, "epoch": 1228} {"train_loss": -21.92067527770996, "global_step": 101992, "epoch": 1228} {"train_loss": -21.752368927001953, "global_step": 101993, "epoch": 1228} {"train_loss": -22.155771255493164, "global_step": 101994, "epoch": 1228} {"train_loss": -21.923259735107422, "global_step": 101995, "epoch": 1228} {"train_loss": -22.365339279174805, "global_step": 101996, "epoch": 1228} {"train_loss": -22.153749465942383, "global_step": 101997, "epoch": 1228} {"train_loss": -21.955909729003906, "global_step": 101998, "epoch": 1228} {"train_loss": -22.135774612426758, "global_step": 101999, "epoch": 1228} {"train_loss": -22.06444549560547, "global_step": 102000, "epoch": 1228} {"train_loss": -22.075828552246094, "global_step": 102001, "epoch": 1228} {"train_loss": -21.701894760131836, "global_step": 102002, "epoch": 1228} {"train_loss": -21.668920516967773, "global_step": 102003, "epoch": 1228} {"train_loss": -22.143800735473633, "global_step": 102004, "epoch": 1228} {"train_loss": -21.935522079467773, "global_step": 102005, "epoch": 1228} {"train_loss": -21.90305679964732, "global_step": 102006, "epoch": 1228, "val_loss": 6098704.0} {"train_loss": -21.680923461914062, "global_step": 102007, "epoch": 1229} {"train_loss": -21.936920166015625, "global_step": 102008, "epoch": 1229} {"train_loss": -21.747671127319336, "global_step": 102009, "epoch": 1229} {"train_loss": -21.84596824645996, "global_step": 102010, "epoch": 1229} {"train_loss": -21.852432250976562, "global_step": 102011, "epoch": 1229} {"train_loss": -21.9819393157959, "global_step": 102012, "epoch": 1229} {"train_loss": -21.90595817565918, "global_step": 102013, "epoch": 1229} {"train_loss": -21.22518539428711, "global_step": 102014, "epoch": 1229} {"train_loss": -22.044431686401367, "global_step": 102015, "epoch": 1229} {"train_loss": -21.751413345336914, "global_step": 102016, "epoch": 1229} {"train_loss": -21.986875534057617, "global_step": 102017, "epoch": 1229} {"train_loss": -21.632482528686523, "global_step": 102018, "epoch": 1229} {"train_loss": -22.304624557495117, "global_step": 102019, "epoch": 1229} {"train_loss": -21.81525993347168, "global_step": 102020, "epoch": 1229} {"train_loss": -21.958932876586914, "global_step": 102021, "epoch": 1229} {"train_loss": -21.707807540893555, "global_step": 102022, "epoch": 1229} {"train_loss": -22.109663009643555, "global_step": 102023, "epoch": 1229} {"train_loss": -22.104902267456055, "global_step": 102024, "epoch": 1229} {"train_loss": -22.283340454101562, "global_step": 102025, "epoch": 1229} {"train_loss": -21.454334259033203, "global_step": 102026, "epoch": 1229} {"train_loss": -22.053937911987305, "global_step": 102027, "epoch": 1229} {"train_loss": -22.119619369506836, "global_step": 102028, "epoch": 1229} {"train_loss": -22.00031852722168, "global_step": 102029, "epoch": 1229} {"train_loss": -22.24355125427246, "global_step": 102030, "epoch": 1229} {"train_loss": -21.8713321685791, "global_step": 102031, "epoch": 1229} {"train_loss": -22.027667999267578, "global_step": 102032, "epoch": 1229} {"train_loss": -22.222530364990234, "global_step": 102033, "epoch": 1229} {"train_loss": -21.7525691986084, "global_step": 102034, "epoch": 1229} {"train_loss": -22.19583511352539, "global_step": 102035, "epoch": 1229} {"train_loss": -21.93174171447754, "global_step": 102036, "epoch": 1229} {"train_loss": -22.024946212768555, "global_step": 102037, "epoch": 1229} {"train_loss": -21.901811599731445, "global_step": 102038, "epoch": 1229} {"train_loss": -22.132299423217773, "global_step": 102039, "epoch": 1229} {"train_loss": -21.847753524780273, "global_step": 102040, "epoch": 1229} {"train_loss": -22.157590866088867, "global_step": 102041, "epoch": 1229} {"train_loss": -22.293514251708984, "global_step": 102042, "epoch": 1229} {"train_loss": -22.075836181640625, "global_step": 102043, "epoch": 1229} {"train_loss": -21.936851501464844, "global_step": 102044, "epoch": 1229} {"train_loss": -21.749923706054688, "global_step": 102045, "epoch": 1229} {"train_loss": -22.12204360961914, "global_step": 102046, "epoch": 1229} {"train_loss": -22.081079483032227, "global_step": 102047, "epoch": 1229} {"train_loss": -22.00575828552246, "global_step": 102048, "epoch": 1229} {"train_loss": -21.817472457885742, "global_step": 102049, "epoch": 1229} {"train_loss": -22.3330135345459, "global_step": 102050, "epoch": 1229} {"train_loss": -21.952978134155273, "global_step": 102051, "epoch": 1229} {"train_loss": -21.501407623291016, "global_step": 102052, "epoch": 1229} {"train_loss": -22.22014617919922, "global_step": 102053, "epoch": 1229} {"train_loss": -22.053205490112305, "global_step": 102054, "epoch": 1229} {"train_loss": -21.668033599853516, "global_step": 102055, "epoch": 1229} {"train_loss": -22.24614143371582, "global_step": 102056, "epoch": 1229} {"train_loss": -22.290143966674805, "global_step": 102057, "epoch": 1229} {"train_loss": -22.027647018432617, "global_step": 102058, "epoch": 1229} {"train_loss": -21.971643447875977, "global_step": 102059, "epoch": 1229} {"train_loss": -21.901653289794922, "global_step": 102060, "epoch": 1229} {"train_loss": -22.313919067382812, "global_step": 102061, "epoch": 1229} {"train_loss": -21.766767501831055, "global_step": 102062, "epoch": 1229} {"train_loss": -21.87540054321289, "global_step": 102063, "epoch": 1229} {"train_loss": -21.76987648010254, "global_step": 102064, "epoch": 1229} {"train_loss": -22.236234664916992, "global_step": 102065, "epoch": 1229} {"train_loss": -21.99440574645996, "global_step": 102066, "epoch": 1229} {"train_loss": -22.214454650878906, "global_step": 102067, "epoch": 1229} {"train_loss": -22.0509033203125, "global_step": 102068, "epoch": 1229} {"train_loss": -22.11200523376465, "global_step": 102069, "epoch": 1229} {"train_loss": -22.2014102935791, "global_step": 102070, "epoch": 1229} {"train_loss": -21.934804916381836, "global_step": 102071, "epoch": 1229} {"train_loss": -21.87959861755371, "global_step": 102072, "epoch": 1229} {"train_loss": -22.16067886352539, "global_step": 102073, "epoch": 1229} {"train_loss": -22.016836166381836, "global_step": 102074, "epoch": 1229} {"train_loss": -21.785037994384766, "global_step": 102075, "epoch": 1229} {"train_loss": -21.901357650756836, "global_step": 102076, "epoch": 1229} {"train_loss": -21.946374893188477, "global_step": 102077, "epoch": 1229} {"train_loss": -21.957521438598633, "global_step": 102078, "epoch": 1229} {"train_loss": -22.11891746520996, "global_step": 102079, "epoch": 1229} {"train_loss": -22.19740104675293, "global_step": 102080, "epoch": 1229} {"train_loss": -22.01498794555664, "global_step": 102081, "epoch": 1229} {"train_loss": -22.15760612487793, "global_step": 102082, "epoch": 1229} {"train_loss": -22.18977928161621, "global_step": 102083, "epoch": 1229} {"train_loss": -22.106521606445312, "global_step": 102084, "epoch": 1229} {"train_loss": -21.832426071166992, "global_step": 102085, "epoch": 1229} {"train_loss": -22.116483688354492, "global_step": 102086, "epoch": 1229} {"train_loss": -21.858036041259766, "global_step": 102087, "epoch": 1229} {"train_loss": -22.032724380493164, "global_step": 102088, "epoch": 1229} {"train_loss": -21.952221789992, "global_step": 102089, "epoch": 1229, "val_loss": 6159397.0} {"train_loss": -20.566390991210938, "global_step": 102090, "epoch": 1230} {"train_loss": -20.324054718017578, "global_step": 102091, "epoch": 1230} {"train_loss": -21.03851890563965, "global_step": 102092, "epoch": 1230} {"train_loss": -21.325307846069336, "global_step": 102093, "epoch": 1230} {"train_loss": -20.574247360229492, "global_step": 102094, "epoch": 1230} {"train_loss": -21.51531410217285, "global_step": 102095, "epoch": 1230} {"train_loss": -20.823463439941406, "global_step": 102096, "epoch": 1230} {"train_loss": -21.173513412475586, "global_step": 102097, "epoch": 1230} {"train_loss": -20.911426544189453, "global_step": 102098, "epoch": 1230} {"train_loss": -21.586389541625977, "global_step": 102099, "epoch": 1230} {"train_loss": -21.647354125976562, "global_step": 102100, "epoch": 1230} {"train_loss": -21.466611862182617, "global_step": 102101, "epoch": 1230} {"train_loss": -21.442129135131836, "global_step": 102102, "epoch": 1230} {"train_loss": -21.575376510620117, "global_step": 102103, "epoch": 1230} {"train_loss": -21.42828941345215, "global_step": 102104, "epoch": 1230} {"train_loss": -21.747257232666016, "global_step": 102105, "epoch": 1230} {"train_loss": -21.403085708618164, "global_step": 102106, "epoch": 1230} {"train_loss": -21.670547485351562, "global_step": 102107, "epoch": 1230} {"train_loss": -21.623201370239258, "global_step": 102108, "epoch": 1230} {"train_loss": -21.465497970581055, "global_step": 102109, "epoch": 1230} {"train_loss": -21.86305809020996, "global_step": 102110, "epoch": 1230} {"train_loss": -22.056058883666992, "global_step": 102111, "epoch": 1230} {"train_loss": -21.806791305541992, "global_step": 102112, "epoch": 1230} {"train_loss": -22.05624008178711, "global_step": 102113, "epoch": 1230} {"train_loss": -21.846097946166992, "global_step": 102114, "epoch": 1230} {"train_loss": -21.79806900024414, "global_step": 102115, "epoch": 1230} {"train_loss": -21.88680076599121, "global_step": 102116, "epoch": 1230} {"train_loss": -21.72471046447754, "global_step": 102117, "epoch": 1230} {"train_loss": -22.141706466674805, "global_step": 102118, "epoch": 1230} {"train_loss": -22.138656616210938, "global_step": 102119, "epoch": 1230} {"train_loss": -22.22688865661621, "global_step": 102120, "epoch": 1230} {"train_loss": -21.819122314453125, "global_step": 102121, "epoch": 1230} {"train_loss": -22.236101150512695, "global_step": 102122, "epoch": 1230} {"train_loss": -22.09415626525879, "global_step": 102123, "epoch": 1230} {"train_loss": -22.08405113220215, "global_step": 102124, "epoch": 1230} {"train_loss": -22.096227645874023, "global_step": 102125, "epoch": 1230} {"train_loss": -21.760574340820312, "global_step": 102126, "epoch": 1230} {"train_loss": -22.096364974975586, "global_step": 102127, "epoch": 1230} {"train_loss": -22.1829891204834, "global_step": 102128, "epoch": 1230} {"train_loss": -21.977237701416016, "global_step": 102129, "epoch": 1230} {"train_loss": -21.952619552612305, "global_step": 102130, "epoch": 1230} {"train_loss": -22.273035049438477, "global_step": 102131, "epoch": 1230} {"train_loss": -21.7940673828125, "global_step": 102132, "epoch": 1230} {"train_loss": -22.189512252807617, "global_step": 102133, "epoch": 1230} {"train_loss": -21.776548385620117, "global_step": 102134, "epoch": 1230} {"train_loss": -22.24506950378418, "global_step": 102135, "epoch": 1230} {"train_loss": -21.846290588378906, "global_step": 102136, "epoch": 1230} {"train_loss": -22.284122467041016, "global_step": 102137, "epoch": 1230} {"train_loss": -22.257490158081055, "global_step": 102138, "epoch": 1230} {"train_loss": -21.87622833251953, "global_step": 102139, "epoch": 1230} {"train_loss": -22.31083106994629, "global_step": 102140, "epoch": 1230} {"train_loss": -21.935394287109375, "global_step": 102141, "epoch": 1230} {"train_loss": -21.64692497253418, "global_step": 102142, "epoch": 1230} {"train_loss": -21.77631950378418, "global_step": 102143, "epoch": 1230} {"train_loss": -22.10029411315918, "global_step": 102144, "epoch": 1230} {"train_loss": -22.167104721069336, "global_step": 102145, "epoch": 1230} {"train_loss": -21.636459350585938, "global_step": 102146, "epoch": 1230} {"train_loss": -21.949230194091797, "global_step": 102147, "epoch": 1230} {"train_loss": -22.025360107421875, "global_step": 102148, "epoch": 1230} {"train_loss": -21.81415367126465, "global_step": 102149, "epoch": 1230} {"train_loss": -21.60063934326172, "global_step": 102150, "epoch": 1230} {"train_loss": -22.081985473632812, "global_step": 102151, "epoch": 1230} {"train_loss": -21.718046188354492, "global_step": 102152, "epoch": 1230} {"train_loss": -21.38971519470215, "global_step": 102153, "epoch": 1230} {"train_loss": -21.522428512573242, "global_step": 102154, "epoch": 1230} {"train_loss": -21.85872459411621, "global_step": 102155, "epoch": 1230} {"train_loss": -22.27935791015625, "global_step": 102156, "epoch": 1230} {"train_loss": -21.83719253540039, "global_step": 102157, "epoch": 1230} {"train_loss": -22.020172119140625, "global_step": 102158, "epoch": 1230} {"train_loss": -21.86810302734375, "global_step": 102159, "epoch": 1230} {"train_loss": -22.121826171875, "global_step": 102160, "epoch": 1230} {"train_loss": -21.58917808532715, "global_step": 102161, "epoch": 1230} {"train_loss": -22.036483764648438, "global_step": 102162, "epoch": 1230} {"train_loss": -21.91423797607422, "global_step": 102163, "epoch": 1230} {"train_loss": -22.13431167602539, "global_step": 102164, "epoch": 1230} {"train_loss": -21.917667388916016, "global_step": 102165, "epoch": 1230} {"train_loss": -21.6600399017334, "global_step": 102166, "epoch": 1230} {"train_loss": -21.79073143005371, "global_step": 102167, "epoch": 1230} {"train_loss": -21.828651428222656, "global_step": 102168, "epoch": 1230} {"train_loss": -22.009145736694336, "global_step": 102169, "epoch": 1230} {"train_loss": -21.638338088989258, "global_step": 102170, "epoch": 1230} {"train_loss": -22.073617935180664, "global_step": 102171, "epoch": 1230} {"train_loss": -21.766396924673792, "global_step": 102172, "epoch": 1230, "val_loss": 6194125.5} {"train_loss": -21.765640258789062, "global_step": 102173, "epoch": 1231} {"train_loss": -22.205524444580078, "global_step": 102174, "epoch": 1231} {"train_loss": -21.79469871520996, "global_step": 102175, "epoch": 1231} {"train_loss": -21.94373893737793, "global_step": 102176, "epoch": 1231} {"train_loss": -21.8072452545166, "global_step": 102177, "epoch": 1231} {"train_loss": -21.816617965698242, "global_step": 102178, "epoch": 1231} {"train_loss": -22.180295944213867, "global_step": 102179, "epoch": 1231} {"train_loss": -22.2872257232666, "global_step": 102180, "epoch": 1231} {"train_loss": -21.79795265197754, "global_step": 102181, "epoch": 1231} {"train_loss": -22.11530113220215, "global_step": 102182, "epoch": 1231} {"train_loss": -21.653074264526367, "global_step": 102183, "epoch": 1231} {"train_loss": -21.9932861328125, "global_step": 102184, "epoch": 1231} {"train_loss": -22.509546279907227, "global_step": 102185, "epoch": 1231} {"train_loss": -21.5531063079834, "global_step": 102186, "epoch": 1231} {"train_loss": -22.098773956298828, "global_step": 102187, "epoch": 1231} {"train_loss": -22.183521270751953, "global_step": 102188, "epoch": 1231} {"train_loss": -21.818822860717773, "global_step": 102189, "epoch": 1231} {"train_loss": -21.87327003479004, "global_step": 102190, "epoch": 1231} {"train_loss": -21.678829193115234, "global_step": 102191, "epoch": 1231} {"train_loss": -22.015947341918945, "global_step": 102192, "epoch": 1231} {"train_loss": -21.893238067626953, "global_step": 102193, "epoch": 1231} {"train_loss": -22.09747886657715, "global_step": 102194, "epoch": 1231} {"train_loss": -21.971357345581055, "global_step": 102195, "epoch": 1231} {"train_loss": -22.050487518310547, "global_step": 102196, "epoch": 1231} {"train_loss": -22.086654663085938, "global_step": 102197, "epoch": 1231} {"train_loss": -21.935108184814453, "global_step": 102198, "epoch": 1231} {"train_loss": -21.873075485229492, "global_step": 102199, "epoch": 1231} {"train_loss": -22.014785766601562, "global_step": 102200, "epoch": 1231} {"train_loss": -22.071935653686523, "global_step": 102201, "epoch": 1231} {"train_loss": -22.115026473999023, "global_step": 102202, "epoch": 1231} {"train_loss": -22.083993911743164, "global_step": 102203, "epoch": 1231} {"train_loss": -22.19623374938965, "global_step": 102204, "epoch": 1231} {"train_loss": -22.07069969177246, "global_step": 102205, "epoch": 1231} {"train_loss": -22.13387107849121, "global_step": 102206, "epoch": 1231} {"train_loss": -21.87750816345215, "global_step": 102207, "epoch": 1231} {"train_loss": -21.952342987060547, "global_step": 102208, "epoch": 1231} {"train_loss": -22.086231231689453, "global_step": 102209, "epoch": 1231} {"train_loss": -21.78512954711914, "global_step": 102210, "epoch": 1231} {"train_loss": -21.828577041625977, "global_step": 102211, "epoch": 1231} {"train_loss": -22.02753257751465, "global_step": 102212, "epoch": 1231} {"train_loss": -21.961286544799805, "global_step": 102213, "epoch": 1231} {"train_loss": -22.322078704833984, "global_step": 102214, "epoch": 1231} {"train_loss": -22.18208122253418, "global_step": 102215, "epoch": 1231} {"train_loss": -22.03193473815918, "global_step": 102216, "epoch": 1231} {"train_loss": -22.351158142089844, "global_step": 102217, "epoch": 1231} {"train_loss": -22.118595123291016, "global_step": 102218, "epoch": 1231} {"train_loss": -21.727725982666016, "global_step": 102219, "epoch": 1231} {"train_loss": -22.0726375579834, "global_step": 102220, "epoch": 1231} {"train_loss": -22.235315322875977, "global_step": 102221, "epoch": 1231} {"train_loss": -21.861125946044922, "global_step": 102222, "epoch": 1231} {"train_loss": -22.056079864501953, "global_step": 102223, "epoch": 1231} {"train_loss": -22.418888092041016, "global_step": 102224, "epoch": 1231} {"train_loss": -21.62018394470215, "global_step": 102225, "epoch": 1231} {"train_loss": -22.206867218017578, "global_step": 102226, "epoch": 1231} {"train_loss": -21.700742721557617, "global_step": 102227, "epoch": 1231} {"train_loss": -22.369022369384766, "global_step": 102228, "epoch": 1231} {"train_loss": -21.66011619567871, "global_step": 102229, "epoch": 1231} {"train_loss": -21.945974349975586, "global_step": 102230, "epoch": 1231} {"train_loss": -22.0581111907959, "global_step": 102231, "epoch": 1231} {"train_loss": -22.271963119506836, "global_step": 102232, "epoch": 1231} {"train_loss": -21.607473373413086, "global_step": 102233, "epoch": 1231} {"train_loss": -21.780441284179688, "global_step": 102234, "epoch": 1231} {"train_loss": -22.17722511291504, "global_step": 102235, "epoch": 1231} {"train_loss": -22.007291793823242, "global_step": 102236, "epoch": 1231} {"train_loss": -21.769336700439453, "global_step": 102237, "epoch": 1231} {"train_loss": -22.18316078186035, "global_step": 102238, "epoch": 1231} {"train_loss": -22.132892608642578, "global_step": 102239, "epoch": 1231} {"train_loss": -21.791175842285156, "global_step": 102240, "epoch": 1231} {"train_loss": -21.964130401611328, "global_step": 102241, "epoch": 1231} {"train_loss": -22.11106300354004, "global_step": 102242, "epoch": 1231} {"train_loss": -22.09379005432129, "global_step": 102243, "epoch": 1231} {"train_loss": -21.986785888671875, "global_step": 102244, "epoch": 1231} {"train_loss": -22.14694595336914, "global_step": 102245, "epoch": 1231} {"train_loss": -21.698469161987305, "global_step": 102246, "epoch": 1231} {"train_loss": -22.09490966796875, "global_step": 102247, "epoch": 1231} {"train_loss": -21.775236129760742, "global_step": 102248, "epoch": 1231} {"train_loss": -21.848249435424805, "global_step": 102249, "epoch": 1231} {"train_loss": -22.218229293823242, "global_step": 102250, "epoch": 1231} {"train_loss": -21.928457260131836, "global_step": 102251, "epoch": 1231} {"train_loss": -22.21868896484375, "global_step": 102252, "epoch": 1231} {"train_loss": -22.344648361206055, "global_step": 102253, "epoch": 1231} {"train_loss": -22.03389549255371, "global_step": 102254, "epoch": 1231} {"train_loss": -22.015103351638977, "global_step": 102255, "epoch": 1231, "val_loss": 6130168.0} {"train_loss": -21.392276763916016, "global_step": 102256, "epoch": 1232} {"train_loss": -20.610639572143555, "global_step": 102257, "epoch": 1232} {"train_loss": -21.961593627929688, "global_step": 102258, "epoch": 1232} {"train_loss": -21.316537857055664, "global_step": 102259, "epoch": 1232} {"train_loss": -21.366127014160156, "global_step": 102260, "epoch": 1232} {"train_loss": -21.915019989013672, "global_step": 102261, "epoch": 1232} {"train_loss": -21.70625114440918, "global_step": 102262, "epoch": 1232} {"train_loss": -21.892621994018555, "global_step": 102263, "epoch": 1232} {"train_loss": -21.855422973632812, "global_step": 102264, "epoch": 1232} {"train_loss": -22.092880249023438, "global_step": 102265, "epoch": 1232} {"train_loss": -21.77147102355957, "global_step": 102266, "epoch": 1232} {"train_loss": -21.73531150817871, "global_step": 102267, "epoch": 1232} {"train_loss": -21.360929489135742, "global_step": 102268, "epoch": 1232} {"train_loss": -21.781665802001953, "global_step": 102269, "epoch": 1232} {"train_loss": -21.835968017578125, "global_step": 102270, "epoch": 1232} {"train_loss": -21.584150314331055, "global_step": 102271, "epoch": 1232} {"train_loss": -21.870920181274414, "global_step": 102272, "epoch": 1232} {"train_loss": -21.985366821289062, "global_step": 102273, "epoch": 1232} {"train_loss": -22.13227653503418, "global_step": 102274, "epoch": 1232} {"train_loss": -21.716506958007812, "global_step": 102275, "epoch": 1232} {"train_loss": -21.730178833007812, "global_step": 102276, "epoch": 1232} {"train_loss": -21.907421112060547, "global_step": 102277, "epoch": 1232} {"train_loss": -21.811681747436523, "global_step": 102278, "epoch": 1232} {"train_loss": -22.3167781829834, "global_step": 102279, "epoch": 1232} {"train_loss": -21.98237419128418, "global_step": 102280, "epoch": 1232} {"train_loss": -21.794660568237305, "global_step": 102281, "epoch": 1232} {"train_loss": -21.85865020751953, "global_step": 102282, "epoch": 1232} {"train_loss": -21.741830825805664, "global_step": 102283, "epoch": 1232} {"train_loss": -22.104509353637695, "global_step": 102284, "epoch": 1232} {"train_loss": -21.525814056396484, "global_step": 102285, "epoch": 1232} {"train_loss": -22.03609275817871, "global_step": 102286, "epoch": 1232} {"train_loss": -21.779953002929688, "global_step": 102287, "epoch": 1232} {"train_loss": -22.433147430419922, "global_step": 102288, "epoch": 1232} {"train_loss": -22.022430419921875, "global_step": 102289, "epoch": 1232} {"train_loss": -21.685636520385742, "global_step": 102290, "epoch": 1232} {"train_loss": -22.18086814880371, "global_step": 102291, "epoch": 1232} {"train_loss": -22.18292999267578, "global_step": 102292, "epoch": 1232} {"train_loss": -21.97995948791504, "global_step": 102293, "epoch": 1232} {"train_loss": -22.053482055664062, "global_step": 102294, "epoch": 1232} {"train_loss": -22.1981201171875, "global_step": 102295, "epoch": 1232} {"train_loss": -21.7929630279541, "global_step": 102296, "epoch": 1232} {"train_loss": -21.707075119018555, "global_step": 102297, "epoch": 1232} {"train_loss": -22.092382431030273, "global_step": 102298, "epoch": 1232} {"train_loss": -22.106815338134766, "global_step": 102299, "epoch": 1232} {"train_loss": -22.10188865661621, "global_step": 102300, "epoch": 1232} {"train_loss": -21.957693099975586, "global_step": 102301, "epoch": 1232} {"train_loss": -22.024477005004883, "global_step": 102302, "epoch": 1232} {"train_loss": -21.825809478759766, "global_step": 102303, "epoch": 1232} {"train_loss": -21.865833282470703, "global_step": 102304, "epoch": 1232} {"train_loss": -22.31549644470215, "global_step": 102305, "epoch": 1232} {"train_loss": -22.230619430541992, "global_step": 102306, "epoch": 1232} {"train_loss": -22.35772705078125, "global_step": 102307, "epoch": 1232} {"train_loss": -21.96539878845215, "global_step": 102308, "epoch": 1232} {"train_loss": -22.294591903686523, "global_step": 102309, "epoch": 1232} {"train_loss": -21.90650749206543, "global_step": 102310, "epoch": 1232} {"train_loss": -21.991003036499023, "global_step": 102311, "epoch": 1232} {"train_loss": -22.05177116394043, "global_step": 102312, "epoch": 1232} {"train_loss": -21.9732608795166, "global_step": 102313, "epoch": 1232} {"train_loss": -22.131900787353516, "global_step": 102314, "epoch": 1232} {"train_loss": -22.137781143188477, "global_step": 102315, "epoch": 1232} {"train_loss": -22.09996223449707, "global_step": 102316, "epoch": 1232} {"train_loss": -22.09071159362793, "global_step": 102317, "epoch": 1232} {"train_loss": -21.86778450012207, "global_step": 102318, "epoch": 1232} {"train_loss": -21.75054168701172, "global_step": 102319, "epoch": 1232} {"train_loss": -21.751953125, "global_step": 102320, "epoch": 1232} {"train_loss": -22.311769485473633, "global_step": 102321, "epoch": 1232} {"train_loss": -22.02312660217285, "global_step": 102322, "epoch": 1232} {"train_loss": -21.889726638793945, "global_step": 102323, "epoch": 1232} {"train_loss": -21.800809860229492, "global_step": 102324, "epoch": 1232} {"train_loss": -21.866777420043945, "global_step": 102325, "epoch": 1232} {"train_loss": -21.60921287536621, "global_step": 102326, "epoch": 1232} {"train_loss": -22.033994674682617, "global_step": 102327, "epoch": 1232} {"train_loss": -21.88408660888672, "global_step": 102328, "epoch": 1232} {"train_loss": -21.976654052734375, "global_step": 102329, "epoch": 1232} {"train_loss": -21.474714279174805, "global_step": 102330, "epoch": 1232} {"train_loss": -22.01767921447754, "global_step": 102331, "epoch": 1232} {"train_loss": -21.53017234802246, "global_step": 102332, "epoch": 1232} {"train_loss": -21.77271842956543, "global_step": 102333, "epoch": 1232} {"train_loss": -21.774473190307617, "global_step": 102334, "epoch": 1232} {"train_loss": -21.869604110717773, "global_step": 102335, "epoch": 1232} {"train_loss": -21.838064193725586, "global_step": 102336, "epoch": 1232} {"train_loss": -22.102888107299805, "global_step": 102337, "epoch": 1232} {"train_loss": -21.90879352983222, "global_step": 102338, "epoch": 1232, "val_loss": 6180605.0} {"train_loss": -21.895015716552734, "global_step": 102339, "epoch": 1233} {"train_loss": -21.918048858642578, "global_step": 102340, "epoch": 1233} {"train_loss": -21.713346481323242, "global_step": 102341, "epoch": 1233} {"train_loss": -21.858428955078125, "global_step": 102342, "epoch": 1233} {"train_loss": -21.241910934448242, "global_step": 102343, "epoch": 1233} {"train_loss": -21.99802589416504, "global_step": 102344, "epoch": 1233} {"train_loss": -22.03055191040039, "global_step": 102345, "epoch": 1233} {"train_loss": -21.99965476989746, "global_step": 102346, "epoch": 1233} {"train_loss": -22.024028778076172, "global_step": 102347, "epoch": 1233} {"train_loss": -21.834901809692383, "global_step": 102348, "epoch": 1233} {"train_loss": -21.989484786987305, "global_step": 102349, "epoch": 1233} {"train_loss": -21.875404357910156, "global_step": 102350, "epoch": 1233} {"train_loss": -21.791122436523438, "global_step": 102351, "epoch": 1233} {"train_loss": -21.87369155883789, "global_step": 102352, "epoch": 1233} {"train_loss": -22.236251831054688, "global_step": 102353, "epoch": 1233} {"train_loss": -22.03805923461914, "global_step": 102354, "epoch": 1233} {"train_loss": -21.949832916259766, "global_step": 102355, "epoch": 1233} {"train_loss": -22.454099655151367, "global_step": 102356, "epoch": 1233} {"train_loss": -22.057636260986328, "global_step": 102357, "epoch": 1233} {"train_loss": -22.264318466186523, "global_step": 102358, "epoch": 1233} {"train_loss": -21.951597213745117, "global_step": 102359, "epoch": 1233} {"train_loss": -22.01689910888672, "global_step": 102360, "epoch": 1233} {"train_loss": -22.11351203918457, "global_step": 102361, "epoch": 1233} {"train_loss": -22.266456604003906, "global_step": 102362, "epoch": 1233} {"train_loss": -21.9923038482666, "global_step": 102363, "epoch": 1233} {"train_loss": -21.854711532592773, "global_step": 102364, "epoch": 1233} {"train_loss": -22.225332260131836, "global_step": 102365, "epoch": 1233} {"train_loss": -21.863849639892578, "global_step": 102366, "epoch": 1233} {"train_loss": -21.931859970092773, "global_step": 102367, "epoch": 1233} {"train_loss": -21.953327178955078, "global_step": 102368, "epoch": 1233} {"train_loss": -22.006866455078125, "global_step": 102369, "epoch": 1233} {"train_loss": -22.1518497467041, "global_step": 102370, "epoch": 1233} {"train_loss": -22.11060905456543, "global_step": 102371, "epoch": 1233} {"train_loss": -22.37872314453125, "global_step": 102372, "epoch": 1233} {"train_loss": -22.281604766845703, "global_step": 102373, "epoch": 1233} {"train_loss": -21.978614807128906, "global_step": 102374, "epoch": 1233} {"train_loss": -21.685955047607422, "global_step": 102375, "epoch": 1233} {"train_loss": -21.737274169921875, "global_step": 102376, "epoch": 1233} {"train_loss": -22.085176467895508, "global_step": 102377, "epoch": 1233} {"train_loss": -21.95722770690918, "global_step": 102378, "epoch": 1233} {"train_loss": -21.766284942626953, "global_step": 102379, "epoch": 1233} {"train_loss": -22.1556453704834, "global_step": 102380, "epoch": 1233} {"train_loss": -21.920499801635742, "global_step": 102381, "epoch": 1233} {"train_loss": -22.149065017700195, "global_step": 102382, "epoch": 1233} {"train_loss": -22.328655242919922, "global_step": 102383, "epoch": 1233} {"train_loss": -21.830032348632812, "global_step": 102384, "epoch": 1233} {"train_loss": -21.797574996948242, "global_step": 102385, "epoch": 1233} {"train_loss": -21.594205856323242, "global_step": 102386, "epoch": 1233} {"train_loss": -21.87211036682129, "global_step": 102387, "epoch": 1233} {"train_loss": -21.921300888061523, "global_step": 102388, "epoch": 1233} {"train_loss": -22.09623146057129, "global_step": 102389, "epoch": 1233} {"train_loss": -21.86146354675293, "global_step": 102390, "epoch": 1233} {"train_loss": -22.217714309692383, "global_step": 102391, "epoch": 1233} {"train_loss": -22.348791122436523, "global_step": 102392, "epoch": 1233} {"train_loss": -21.94072914123535, "global_step": 102393, "epoch": 1233} {"train_loss": -22.36598014831543, "global_step": 102394, "epoch": 1233} {"train_loss": -21.90276527404785, "global_step": 102395, "epoch": 1233} {"train_loss": -21.99509620666504, "global_step": 102396, "epoch": 1233} {"train_loss": -22.13910484313965, "global_step": 102397, "epoch": 1233} {"train_loss": -22.25153923034668, "global_step": 102398, "epoch": 1233} {"train_loss": -22.26973533630371, "global_step": 102399, "epoch": 1233} {"train_loss": -21.846418380737305, "global_step": 102400, "epoch": 1233} {"train_loss": -21.79852867126465, "global_step": 102401, "epoch": 1233} {"train_loss": -22.18364715576172, "global_step": 102402, "epoch": 1233} {"train_loss": -22.042808532714844, "global_step": 102403, "epoch": 1233} {"train_loss": -22.25416374206543, "global_step": 102404, "epoch": 1233} {"train_loss": -21.750381469726562, "global_step": 102405, "epoch": 1233} {"train_loss": -21.94831657409668, "global_step": 102406, "epoch": 1233} {"train_loss": -22.184547424316406, "global_step": 102407, "epoch": 1233} {"train_loss": -22.16676902770996, "global_step": 102408, "epoch": 1233} {"train_loss": -22.074798583984375, "global_step": 102409, "epoch": 1233} {"train_loss": -22.039424896240234, "global_step": 102410, "epoch": 1233} {"train_loss": -21.736351013183594, "global_step": 102411, "epoch": 1233} {"train_loss": -21.78230094909668, "global_step": 102412, "epoch": 1233} {"train_loss": -21.642303466796875, "global_step": 102413, "epoch": 1233} {"train_loss": -22.046472549438477, "global_step": 102414, "epoch": 1233} {"train_loss": -21.944387435913086, "global_step": 102415, "epoch": 1233} {"train_loss": -22.18438720703125, "global_step": 102416, "epoch": 1233} {"train_loss": -21.99605369567871, "global_step": 102417, "epoch": 1233} {"train_loss": -22.049375534057617, "global_step": 102418, "epoch": 1233} {"train_loss": -21.47712516784668, "global_step": 102419, "epoch": 1233} {"train_loss": -21.89430809020996, "global_step": 102420, "epoch": 1233} {"train_loss": -21.99266516444195, "global_step": 102421, "epoch": 1233, "val_loss": 6071637.0} {"train_loss": -21.3704891204834, "global_step": 102422, "epoch": 1234} {"train_loss": -21.32411003112793, "global_step": 102423, "epoch": 1234} {"train_loss": -21.34781837463379, "global_step": 102424, "epoch": 1234} {"train_loss": -21.772424697875977, "global_step": 102425, "epoch": 1234} {"train_loss": -22.138010025024414, "global_step": 102426, "epoch": 1234} {"train_loss": -22.012868881225586, "global_step": 102427, "epoch": 1234} {"train_loss": -21.879962921142578, "global_step": 102428, "epoch": 1234} {"train_loss": -21.618513107299805, "global_step": 102429, "epoch": 1234} {"train_loss": -21.614276885986328, "global_step": 102430, "epoch": 1234} {"train_loss": -22.037893295288086, "global_step": 102431, "epoch": 1234} {"train_loss": -22.040454864501953, "global_step": 102432, "epoch": 1234} {"train_loss": -21.966354370117188, "global_step": 102433, "epoch": 1234} {"train_loss": -21.803319931030273, "global_step": 102434, "epoch": 1234} {"train_loss": -22.17705726623535, "global_step": 102435, "epoch": 1234} {"train_loss": -22.085317611694336, "global_step": 102436, "epoch": 1234} {"train_loss": -21.94789695739746, "global_step": 102437, "epoch": 1234} {"train_loss": -21.825870513916016, "global_step": 102438, "epoch": 1234} {"train_loss": -22.033355712890625, "global_step": 102439, "epoch": 1234} {"train_loss": -21.688613891601562, "global_step": 102440, "epoch": 1234} {"train_loss": -22.04878044128418, "global_step": 102441, "epoch": 1234} {"train_loss": -21.964643478393555, "global_step": 102442, "epoch": 1234} {"train_loss": -22.02610969543457, "global_step": 102443, "epoch": 1234} {"train_loss": -22.152318954467773, "global_step": 102444, "epoch": 1234} {"train_loss": -21.98683738708496, "global_step": 102445, "epoch": 1234} {"train_loss": -22.2535457611084, "global_step": 102446, "epoch": 1234} {"train_loss": -22.322874069213867, "global_step": 102447, "epoch": 1234} {"train_loss": -21.933027267456055, "global_step": 102448, "epoch": 1234} {"train_loss": -22.05154800415039, "global_step": 102449, "epoch": 1234} {"train_loss": -21.915929794311523, "global_step": 102450, "epoch": 1234} {"train_loss": -21.895803451538086, "global_step": 102451, "epoch": 1234} {"train_loss": -22.057592391967773, "global_step": 102452, "epoch": 1234} {"train_loss": -22.6258487701416, "global_step": 102453, "epoch": 1234} {"train_loss": -21.934972763061523, "global_step": 102454, "epoch": 1234} {"train_loss": -22.013734817504883, "global_step": 102455, "epoch": 1234} {"train_loss": -21.741621017456055, "global_step": 102456, "epoch": 1234} {"train_loss": -21.940961837768555, "global_step": 102457, "epoch": 1234} {"train_loss": -21.961597442626953, "global_step": 102458, "epoch": 1234} {"train_loss": -21.724706649780273, "global_step": 102459, "epoch": 1234} {"train_loss": -21.713287353515625, "global_step": 102460, "epoch": 1234} {"train_loss": -21.538667678833008, "global_step": 102461, "epoch": 1234} {"train_loss": -21.814977645874023, "global_step": 102462, "epoch": 1234} {"train_loss": -22.305591583251953, "global_step": 102463, "epoch": 1234} {"train_loss": -22.230026245117188, "global_step": 102464, "epoch": 1234} {"train_loss": -21.8490047454834, "global_step": 102465, "epoch": 1234} {"train_loss": -21.84366798400879, "global_step": 102466, "epoch": 1234} {"train_loss": -21.902563095092773, "global_step": 102467, "epoch": 1234} {"train_loss": -21.91937828063965, "global_step": 102468, "epoch": 1234} {"train_loss": -21.60115623474121, "global_step": 102469, "epoch": 1234} {"train_loss": -22.353527069091797, "global_step": 102470, "epoch": 1234} {"train_loss": -21.81290054321289, "global_step": 102471, "epoch": 1234} {"train_loss": -22.485292434692383, "global_step": 102472, "epoch": 1234} {"train_loss": -21.853506088256836, "global_step": 102473, "epoch": 1234} {"train_loss": -22.278623580932617, "global_step": 102474, "epoch": 1234} {"train_loss": -22.0062313079834, "global_step": 102475, "epoch": 1234} {"train_loss": -22.395362854003906, "global_step": 102476, "epoch": 1234} {"train_loss": -22.258785247802734, "global_step": 102477, "epoch": 1234} {"train_loss": -21.95957374572754, "global_step": 102478, "epoch": 1234} {"train_loss": -22.29511833190918, "global_step": 102479, "epoch": 1234} {"train_loss": -21.85392951965332, "global_step": 102480, "epoch": 1234} {"train_loss": -22.49308204650879, "global_step": 102481, "epoch": 1234} {"train_loss": -21.995525360107422, "global_step": 102482, "epoch": 1234} {"train_loss": -22.03693962097168, "global_step": 102483, "epoch": 1234} {"train_loss": -22.029897689819336, "global_step": 102484, "epoch": 1234} {"train_loss": -22.515546798706055, "global_step": 102485, "epoch": 1234} {"train_loss": -21.776966094970703, "global_step": 102486, "epoch": 1234} {"train_loss": -21.672666549682617, "global_step": 102487, "epoch": 1234} {"train_loss": -22.086740493774414, "global_step": 102488, "epoch": 1234} {"train_loss": -22.147602081298828, "global_step": 102489, "epoch": 1234} {"train_loss": -21.965808868408203, "global_step": 102490, "epoch": 1234} {"train_loss": -22.102590560913086, "global_step": 102491, "epoch": 1234} {"train_loss": -21.9562931060791, "global_step": 102492, "epoch": 1234} {"train_loss": -21.543766021728516, "global_step": 102493, "epoch": 1234} {"train_loss": -21.476001739501953, "global_step": 102494, "epoch": 1234} {"train_loss": -22.29432487487793, "global_step": 102495, "epoch": 1234} {"train_loss": -21.947750091552734, "global_step": 102496, "epoch": 1234} {"train_loss": -21.950050354003906, "global_step": 102497, "epoch": 1234} {"train_loss": -21.86913299560547, "global_step": 102498, "epoch": 1234} {"train_loss": -21.96036148071289, "global_step": 102499, "epoch": 1234} {"train_loss": -22.024169921875, "global_step": 102500, "epoch": 1234} {"train_loss": -22.044620513916016, "global_step": 102501, "epoch": 1234} {"train_loss": -21.9544620513916, "global_step": 102502, "epoch": 1234} {"train_loss": -22.32497787475586, "global_step": 102503, "epoch": 1234} {"train_loss": -21.97412355262113, "global_step": 102504, "epoch": 1234, "val_loss": 6128204.5} {"train_loss": -21.691102981567383, "global_step": 102505, "epoch": 1235} {"train_loss": -21.695051193237305, "global_step": 102506, "epoch": 1235} {"train_loss": -21.981304168701172, "global_step": 102507, "epoch": 1235} {"train_loss": -22.03063201904297, "global_step": 102508, "epoch": 1235} {"train_loss": -21.36160659790039, "global_step": 102509, "epoch": 1235} {"train_loss": -21.81810760498047, "global_step": 102510, "epoch": 1235} {"train_loss": -21.5281982421875, "global_step": 102511, "epoch": 1235} {"train_loss": -21.82681655883789, "global_step": 102512, "epoch": 1235} {"train_loss": -21.925230026245117, "global_step": 102513, "epoch": 1235} {"train_loss": -21.92675018310547, "global_step": 102514, "epoch": 1235} {"train_loss": -21.884721755981445, "global_step": 102515, "epoch": 1235} {"train_loss": -21.71653938293457, "global_step": 102516, "epoch": 1235} {"train_loss": -21.66434669494629, "global_step": 102517, "epoch": 1235} {"train_loss": -21.92236328125, "global_step": 102518, "epoch": 1235} {"train_loss": -21.740692138671875, "global_step": 102519, "epoch": 1235} {"train_loss": -21.66253662109375, "global_step": 102520, "epoch": 1235} {"train_loss": -21.98683738708496, "global_step": 102521, "epoch": 1235} {"train_loss": -21.709623336791992, "global_step": 102522, "epoch": 1235} {"train_loss": -21.647968292236328, "global_step": 102523, "epoch": 1235} {"train_loss": -22.140995025634766, "global_step": 102524, "epoch": 1235} {"train_loss": -21.58414077758789, "global_step": 102525, "epoch": 1235} {"train_loss": -21.90940284729004, "global_step": 102526, "epoch": 1235} {"train_loss": -21.922475814819336, "global_step": 102527, "epoch": 1235} {"train_loss": -22.076826095581055, "global_step": 102528, "epoch": 1235} {"train_loss": -22.107370376586914, "global_step": 102529, "epoch": 1235} {"train_loss": -21.752445220947266, "global_step": 102530, "epoch": 1235} {"train_loss": -22.22751235961914, "global_step": 102531, "epoch": 1235} {"train_loss": -22.259492874145508, "global_step": 102532, "epoch": 1235} {"train_loss": -22.145076751708984, "global_step": 102533, "epoch": 1235} {"train_loss": -22.08011817932129, "global_step": 102534, "epoch": 1235} {"train_loss": -21.9924373626709, "global_step": 102535, "epoch": 1235} {"train_loss": -21.857376098632812, "global_step": 102536, "epoch": 1235} {"train_loss": -22.169994354248047, "global_step": 102537, "epoch": 1235} {"train_loss": -21.912857055664062, "global_step": 102538, "epoch": 1235} {"train_loss": -22.255489349365234, "global_step": 102539, "epoch": 1235} {"train_loss": -22.273191452026367, "global_step": 102540, "epoch": 1235} {"train_loss": -21.870407104492188, "global_step": 102541, "epoch": 1235} {"train_loss": -21.907978057861328, "global_step": 102542, "epoch": 1235} {"train_loss": -22.25716209411621, "global_step": 102543, "epoch": 1235} {"train_loss": -21.961305618286133, "global_step": 102544, "epoch": 1235} {"train_loss": -22.057769775390625, "global_step": 102545, "epoch": 1235} {"train_loss": -22.20562171936035, "global_step": 102546, "epoch": 1235} {"train_loss": -22.20063591003418, "global_step": 102547, "epoch": 1235} {"train_loss": -21.92477035522461, "global_step": 102548, "epoch": 1235} {"train_loss": -21.97100257873535, "global_step": 102549, "epoch": 1235} {"train_loss": -21.868911743164062, "global_step": 102550, "epoch": 1235} {"train_loss": -21.98160743713379, "global_step": 102551, "epoch": 1235} {"train_loss": -21.859886169433594, "global_step": 102552, "epoch": 1235} {"train_loss": -21.970144271850586, "global_step": 102553, "epoch": 1235} {"train_loss": -22.05618667602539, "global_step": 102554, "epoch": 1235} {"train_loss": -22.075010299682617, "global_step": 102555, "epoch": 1235} {"train_loss": -22.084671020507812, "global_step": 102556, "epoch": 1235} {"train_loss": -21.88690185546875, "global_step": 102557, "epoch": 1235} {"train_loss": -22.47055435180664, "global_step": 102558, "epoch": 1235} {"train_loss": -22.18153953552246, "global_step": 102559, "epoch": 1235} {"train_loss": -22.214038848876953, "global_step": 102560, "epoch": 1235} {"train_loss": -22.06051254272461, "global_step": 102561, "epoch": 1235} {"train_loss": -22.077255249023438, "global_step": 102562, "epoch": 1235} {"train_loss": -21.857826232910156, "global_step": 102563, "epoch": 1235} {"train_loss": -22.02065086364746, "global_step": 102564, "epoch": 1235} {"train_loss": -21.58783531188965, "global_step": 102565, "epoch": 1235} {"train_loss": -21.918582916259766, "global_step": 102566, "epoch": 1235} {"train_loss": -22.071195602416992, "global_step": 102567, "epoch": 1235} {"train_loss": -21.712867736816406, "global_step": 102568, "epoch": 1235} {"train_loss": -22.11372947692871, "global_step": 102569, "epoch": 1235} {"train_loss": -22.02628517150879, "global_step": 102570, "epoch": 1235} {"train_loss": -22.076486587524414, "global_step": 102571, "epoch": 1235} {"train_loss": -22.070585250854492, "global_step": 102572, "epoch": 1235} {"train_loss": -21.81260108947754, "global_step": 102573, "epoch": 1235} {"train_loss": -21.860538482666016, "global_step": 102574, "epoch": 1235} {"train_loss": -22.164554595947266, "global_step": 102575, "epoch": 1235} {"train_loss": -22.19318199157715, "global_step": 102576, "epoch": 1235} {"train_loss": -22.412748336791992, "global_step": 102577, "epoch": 1235} {"train_loss": -22.15082359313965, "global_step": 102578, "epoch": 1235} {"train_loss": -22.297344207763672, "global_step": 102579, "epoch": 1235} {"train_loss": -22.347972869873047, "global_step": 102580, "epoch": 1235} {"train_loss": -22.386249542236328, "global_step": 102581, "epoch": 1235} {"train_loss": -21.98744010925293, "global_step": 102582, "epoch": 1235} {"train_loss": -21.648609161376953, "global_step": 102583, "epoch": 1235} {"train_loss": -22.14700698852539, "global_step": 102584, "epoch": 1235} {"train_loss": -22.235918045043945, "global_step": 102585, "epoch": 1235} {"train_loss": -22.183818817138672, "global_step": 102586, "epoch": 1235} {"train_loss": -21.98393801034215, "global_step": 102587, "epoch": 1235, "val_loss": 6107509.5} {"train_loss": -21.820632934570312, "global_step": 102588, "epoch": 1236} {"train_loss": -21.701873779296875, "global_step": 102589, "epoch": 1236} {"train_loss": -21.789403915405273, "global_step": 102590, "epoch": 1236} {"train_loss": -21.66411590576172, "global_step": 102591, "epoch": 1236} {"train_loss": -21.94804573059082, "global_step": 102592, "epoch": 1236} {"train_loss": -21.670255661010742, "global_step": 102593, "epoch": 1236} {"train_loss": -21.84086036682129, "global_step": 102594, "epoch": 1236} {"train_loss": -21.6840763092041, "global_step": 102595, "epoch": 1236} {"train_loss": -22.129608154296875, "global_step": 102596, "epoch": 1236} {"train_loss": -21.99139976501465, "global_step": 102597, "epoch": 1236} {"train_loss": -22.042186737060547, "global_step": 102598, "epoch": 1236} {"train_loss": -22.163591384887695, "global_step": 102599, "epoch": 1236} {"train_loss": -22.012968063354492, "global_step": 102600, "epoch": 1236} {"train_loss": -22.10003662109375, "global_step": 102601, "epoch": 1236} {"train_loss": -21.882251739501953, "global_step": 102602, "epoch": 1236} {"train_loss": -21.890663146972656, "global_step": 102603, "epoch": 1236} {"train_loss": -21.76851463317871, "global_step": 102604, "epoch": 1236} {"train_loss": -22.17164421081543, "global_step": 102605, "epoch": 1236} {"train_loss": -21.97688102722168, "global_step": 102606, "epoch": 1236} {"train_loss": -21.598724365234375, "global_step": 102607, "epoch": 1236} {"train_loss": -21.962345123291016, "global_step": 102608, "epoch": 1236} {"train_loss": -21.8856201171875, "global_step": 102609, "epoch": 1236} {"train_loss": -21.741016387939453, "global_step": 102610, "epoch": 1236} {"train_loss": -21.605146408081055, "global_step": 102611, "epoch": 1236} {"train_loss": -22.007436752319336, "global_step": 102612, "epoch": 1236} {"train_loss": -22.199235916137695, "global_step": 102613, "epoch": 1236} {"train_loss": -21.84406280517578, "global_step": 102614, "epoch": 1236} {"train_loss": -21.959081649780273, "global_step": 102615, "epoch": 1236} {"train_loss": -21.743579864501953, "global_step": 102616, "epoch": 1236} {"train_loss": -21.885286331176758, "global_step": 102617, "epoch": 1236} {"train_loss": -21.846166610717773, "global_step": 102618, "epoch": 1236} {"train_loss": -21.6735897064209, "global_step": 102619, "epoch": 1236} {"train_loss": -22.20794105529785, "global_step": 102620, "epoch": 1236} {"train_loss": -21.846261978149414, "global_step": 102621, "epoch": 1236} {"train_loss": -21.895702362060547, "global_step": 102622, "epoch": 1236} {"train_loss": -22.003049850463867, "global_step": 102623, "epoch": 1236} {"train_loss": -21.923871994018555, "global_step": 102624, "epoch": 1236} {"train_loss": -22.15281867980957, "global_step": 102625, "epoch": 1236} {"train_loss": -22.023651123046875, "global_step": 102626, "epoch": 1236} {"train_loss": -22.256553649902344, "global_step": 102627, "epoch": 1236} {"train_loss": -21.713659286499023, "global_step": 102628, "epoch": 1236} {"train_loss": -22.066221237182617, "global_step": 102629, "epoch": 1236} {"train_loss": -22.219999313354492, "global_step": 102630, "epoch": 1236} {"train_loss": -22.19223976135254, "global_step": 102631, "epoch": 1236} {"train_loss": -22.137908935546875, "global_step": 102632, "epoch": 1236} {"train_loss": -21.844831466674805, "global_step": 102633, "epoch": 1236} {"train_loss": -22.054330825805664, "global_step": 102634, "epoch": 1236} {"train_loss": -22.022613525390625, "global_step": 102635, "epoch": 1236} {"train_loss": -21.880220413208008, "global_step": 102636, "epoch": 1236} {"train_loss": -22.112701416015625, "global_step": 102637, "epoch": 1236} {"train_loss": -22.403894424438477, "global_step": 102638, "epoch": 1236} {"train_loss": -22.080337524414062, "global_step": 102639, "epoch": 1236} {"train_loss": -21.850805282592773, "global_step": 102640, "epoch": 1236} {"train_loss": -21.767885208129883, "global_step": 102641, "epoch": 1236} {"train_loss": -22.108896255493164, "global_step": 102642, "epoch": 1236} {"train_loss": -21.96455955505371, "global_step": 102643, "epoch": 1236} {"train_loss": -22.197542190551758, "global_step": 102644, "epoch": 1236} {"train_loss": -22.143402099609375, "global_step": 102645, "epoch": 1236} {"train_loss": -22.367156982421875, "global_step": 102646, "epoch": 1236} {"train_loss": -22.008344650268555, "global_step": 102647, "epoch": 1236} {"train_loss": -22.2194881439209, "global_step": 102648, "epoch": 1236} {"train_loss": -21.9608097076416, "global_step": 102649, "epoch": 1236} {"train_loss": -22.097564697265625, "global_step": 102650, "epoch": 1236} {"train_loss": -22.02833366394043, "global_step": 102651, "epoch": 1236} {"train_loss": -21.632221221923828, "global_step": 102652, "epoch": 1236} {"train_loss": -22.042951583862305, "global_step": 102653, "epoch": 1236} {"train_loss": -22.147611618041992, "global_step": 102654, "epoch": 1236} {"train_loss": -21.64414405822754, "global_step": 102655, "epoch": 1236} {"train_loss": -22.063617706298828, "global_step": 102656, "epoch": 1236} {"train_loss": -22.31876564025879, "global_step": 102657, "epoch": 1236} {"train_loss": -22.1392879486084, "global_step": 102658, "epoch": 1236} {"train_loss": -21.487916946411133, "global_step": 102659, "epoch": 1236} {"train_loss": -21.895383834838867, "global_step": 102660, "epoch": 1236} {"train_loss": -22.09830093383789, "global_step": 102661, "epoch": 1236} {"train_loss": -21.774402618408203, "global_step": 102662, "epoch": 1236} {"train_loss": -21.90675926208496, "global_step": 102663, "epoch": 1236} {"train_loss": -22.16539764404297, "global_step": 102664, "epoch": 1236} {"train_loss": -21.637451171875, "global_step": 102665, "epoch": 1236} {"train_loss": -21.95719337463379, "global_step": 102666, "epoch": 1236} {"train_loss": -21.980356216430664, "global_step": 102667, "epoch": 1236} {"train_loss": -21.943286895751953, "global_step": 102668, "epoch": 1236} {"train_loss": -22.02950096130371, "global_step": 102669, "epoch": 1236} {"train_loss": -21.95159241090338, "global_step": 102670, "epoch": 1236, "val_loss": 6017901.0} {"train_loss": -21.60846710205078, "global_step": 102671, "epoch": 1237} {"train_loss": -21.842405319213867, "global_step": 102672, "epoch": 1237} {"train_loss": -21.867517471313477, "global_step": 102673, "epoch": 1237} {"train_loss": -21.85548973083496, "global_step": 102674, "epoch": 1237} {"train_loss": -21.615272521972656, "global_step": 102675, "epoch": 1237} {"train_loss": -21.701244354248047, "global_step": 102676, "epoch": 1237} {"train_loss": -21.75318717956543, "global_step": 102677, "epoch": 1237} {"train_loss": -21.641080856323242, "global_step": 102678, "epoch": 1237} {"train_loss": -21.98749351501465, "global_step": 102679, "epoch": 1237} {"train_loss": -21.801218032836914, "global_step": 102680, "epoch": 1237} {"train_loss": -21.96619987487793, "global_step": 102681, "epoch": 1237} {"train_loss": -21.836088180541992, "global_step": 102682, "epoch": 1237} {"train_loss": -21.896543502807617, "global_step": 102683, "epoch": 1237} {"train_loss": -22.156356811523438, "global_step": 102684, "epoch": 1237} {"train_loss": -22.00482749938965, "global_step": 102685, "epoch": 1237} {"train_loss": -21.857419967651367, "global_step": 102686, "epoch": 1237} {"train_loss": -21.840219497680664, "global_step": 102687, "epoch": 1237} {"train_loss": -22.011920928955078, "global_step": 102688, "epoch": 1237} {"train_loss": -21.883834838867188, "global_step": 102689, "epoch": 1237} {"train_loss": -21.9996280670166, "global_step": 102690, "epoch": 1237} {"train_loss": -21.917898178100586, "global_step": 102691, "epoch": 1237} {"train_loss": -21.793325424194336, "global_step": 102692, "epoch": 1237} {"train_loss": -21.77950096130371, "global_step": 102693, "epoch": 1237} {"train_loss": -22.109296798706055, "global_step": 102694, "epoch": 1237} {"train_loss": -21.815404891967773, "global_step": 102695, "epoch": 1237} {"train_loss": -22.328750610351562, "global_step": 102696, "epoch": 1237} {"train_loss": -21.90882110595703, "global_step": 102697, "epoch": 1237} {"train_loss": -21.978452682495117, "global_step": 102698, "epoch": 1237} {"train_loss": -22.092180252075195, "global_step": 102699, "epoch": 1237} {"train_loss": -21.991880416870117, "global_step": 102700, "epoch": 1237} {"train_loss": -21.98768424987793, "global_step": 102701, "epoch": 1237} {"train_loss": -21.972993850708008, "global_step": 102702, "epoch": 1237} {"train_loss": -21.602277755737305, "global_step": 102703, "epoch": 1237} {"train_loss": -21.802227020263672, "global_step": 102704, "epoch": 1237} {"train_loss": -22.036457061767578, "global_step": 102705, "epoch": 1237} {"train_loss": -21.947973251342773, "global_step": 102706, "epoch": 1237} {"train_loss": -22.24192237854004, "global_step": 102707, "epoch": 1237} {"train_loss": -22.05730628967285, "global_step": 102708, "epoch": 1237} {"train_loss": -22.20760154724121, "global_step": 102709, "epoch": 1237} {"train_loss": -22.185428619384766, "global_step": 102710, "epoch": 1237} {"train_loss": -22.406261444091797, "global_step": 102711, "epoch": 1237} {"train_loss": -21.956954956054688, "global_step": 102712, "epoch": 1237} {"train_loss": -22.412015914916992, "global_step": 102713, "epoch": 1237} {"train_loss": -21.94537353515625, "global_step": 102714, "epoch": 1237} {"train_loss": -21.952861785888672, "global_step": 102715, "epoch": 1237} {"train_loss": -22.169729232788086, "global_step": 102716, "epoch": 1237} {"train_loss": -22.06269645690918, "global_step": 102717, "epoch": 1237} {"train_loss": -22.03369140625, "global_step": 102718, "epoch": 1237} {"train_loss": -22.2300968170166, "global_step": 102719, "epoch": 1237} {"train_loss": -22.262582778930664, "global_step": 102720, "epoch": 1237} {"train_loss": -22.265947341918945, "global_step": 102721, "epoch": 1237} {"train_loss": -22.1224422454834, "global_step": 102722, "epoch": 1237} {"train_loss": -22.021677017211914, "global_step": 102723, "epoch": 1237} {"train_loss": -21.954286575317383, "global_step": 102724, "epoch": 1237} {"train_loss": -21.87814712524414, "global_step": 102725, "epoch": 1237} {"train_loss": -21.949844360351562, "global_step": 102726, "epoch": 1237} {"train_loss": -22.190914154052734, "global_step": 102727, "epoch": 1237} {"train_loss": -21.4859561920166, "global_step": 102728, "epoch": 1237} {"train_loss": -22.142990112304688, "global_step": 102729, "epoch": 1237} {"train_loss": -22.231657028198242, "global_step": 102730, "epoch": 1237} {"train_loss": -22.41603660583496, "global_step": 102731, "epoch": 1237} {"train_loss": -22.102466583251953, "global_step": 102732, "epoch": 1237} {"train_loss": -21.721467971801758, "global_step": 102733, "epoch": 1237} {"train_loss": -22.049184799194336, "global_step": 102734, "epoch": 1237} {"train_loss": -22.359655380249023, "global_step": 102735, "epoch": 1237} {"train_loss": -21.972583770751953, "global_step": 102736, "epoch": 1237} {"train_loss": -22.165124893188477, "global_step": 102737, "epoch": 1237} {"train_loss": -22.208091735839844, "global_step": 102738, "epoch": 1237} {"train_loss": -22.190336227416992, "global_step": 102739, "epoch": 1237} {"train_loss": -21.608888626098633, "global_step": 102740, "epoch": 1237} {"train_loss": -22.101099014282227, "global_step": 102741, "epoch": 1237} {"train_loss": -22.130563735961914, "global_step": 102742, "epoch": 1237} {"train_loss": -21.866235733032227, "global_step": 102743, "epoch": 1237} {"train_loss": -21.987682342529297, "global_step": 102744, "epoch": 1237} {"train_loss": -22.162508010864258, "global_step": 102745, "epoch": 1237} {"train_loss": -22.053468704223633, "global_step": 102746, "epoch": 1237} {"train_loss": -22.01566505432129, "global_step": 102747, "epoch": 1237} {"train_loss": -22.302194595336914, "global_step": 102748, "epoch": 1237} {"train_loss": -21.910871505737305, "global_step": 102749, "epoch": 1237} {"train_loss": -21.706968307495117, "global_step": 102750, "epoch": 1237} {"train_loss": -22.236127853393555, "global_step": 102751, "epoch": 1237} {"train_loss": -22.142724990844727, "global_step": 102752, "epoch": 1237} {"train_loss": -21.998659662453527, "global_step": 102753, "epoch": 1237, "val_loss": 6174450.0} {"train_loss": -21.57970428466797, "global_step": 102754, "epoch": 1238} {"train_loss": -21.049850463867188, "global_step": 102755, "epoch": 1238} {"train_loss": -21.616796493530273, "global_step": 102756, "epoch": 1238} {"train_loss": -21.372488021850586, "global_step": 102757, "epoch": 1238} {"train_loss": -21.932416915893555, "global_step": 102758, "epoch": 1238} {"train_loss": -21.12636375427246, "global_step": 102759, "epoch": 1238} {"train_loss": -21.60992431640625, "global_step": 102760, "epoch": 1238} {"train_loss": -21.890079498291016, "global_step": 102761, "epoch": 1238} {"train_loss": -21.522884368896484, "global_step": 102762, "epoch": 1238} {"train_loss": -21.74428367614746, "global_step": 102763, "epoch": 1238} {"train_loss": -21.722166061401367, "global_step": 102764, "epoch": 1238} {"train_loss": -21.535181045532227, "global_step": 102765, "epoch": 1238} {"train_loss": -21.616811752319336, "global_step": 102766, "epoch": 1238} {"train_loss": -21.542945861816406, "global_step": 102767, "epoch": 1238} {"train_loss": -21.5318660736084, "global_step": 102768, "epoch": 1238} {"train_loss": -21.482864379882812, "global_step": 102769, "epoch": 1238} {"train_loss": -21.609519958496094, "global_step": 102770, "epoch": 1238} {"train_loss": -21.44865608215332, "global_step": 102771, "epoch": 1238} {"train_loss": -21.9323787689209, "global_step": 102772, "epoch": 1238} {"train_loss": -21.673566818237305, "global_step": 102773, "epoch": 1238} {"train_loss": -21.719282150268555, "global_step": 102774, "epoch": 1238} {"train_loss": -21.414113998413086, "global_step": 102775, "epoch": 1238} {"train_loss": -21.559953689575195, "global_step": 102776, "epoch": 1238} {"train_loss": -21.853172302246094, "global_step": 102777, "epoch": 1238} {"train_loss": -21.928180694580078, "global_step": 102778, "epoch": 1238} {"train_loss": -21.580402374267578, "global_step": 102779, "epoch": 1238} {"train_loss": -21.90903091430664, "global_step": 102780, "epoch": 1238} {"train_loss": -21.929931640625, "global_step": 102781, "epoch": 1238} {"train_loss": -21.75495147705078, "global_step": 102782, "epoch": 1238} {"train_loss": -22.39889144897461, "global_step": 102783, "epoch": 1238} {"train_loss": -21.848529815673828, "global_step": 102784, "epoch": 1238} {"train_loss": -22.42871856689453, "global_step": 102785, "epoch": 1238} {"train_loss": -21.53523063659668, "global_step": 102786, "epoch": 1238} {"train_loss": -21.798439025878906, "global_step": 102787, "epoch": 1238} {"train_loss": -21.38760757446289, "global_step": 102788, "epoch": 1238} {"train_loss": -21.850252151489258, "global_step": 102789, "epoch": 1238} {"train_loss": -22.170154571533203, "global_step": 102790, "epoch": 1238} {"train_loss": -22.05384635925293, "global_step": 102791, "epoch": 1238} {"train_loss": -22.190961837768555, "global_step": 102792, "epoch": 1238} {"train_loss": -22.24318504333496, "global_step": 102793, "epoch": 1238} {"train_loss": -21.94425392150879, "global_step": 102794, "epoch": 1238} {"train_loss": -21.666749954223633, "global_step": 102795, "epoch": 1238} {"train_loss": -22.09456443786621, "global_step": 102796, "epoch": 1238} {"train_loss": -21.934322357177734, "global_step": 102797, "epoch": 1238} {"train_loss": -22.2905216217041, "global_step": 102798, "epoch": 1238} {"train_loss": -22.013198852539062, "global_step": 102799, "epoch": 1238} {"train_loss": -22.2293758392334, "global_step": 102800, "epoch": 1238} {"train_loss": -22.07345962524414, "global_step": 102801, "epoch": 1238} {"train_loss": -21.978784561157227, "global_step": 102802, "epoch": 1238} {"train_loss": -22.026275634765625, "global_step": 102803, "epoch": 1238} {"train_loss": -21.966093063354492, "global_step": 102804, "epoch": 1238} {"train_loss": -22.21896743774414, "global_step": 102805, "epoch": 1238} {"train_loss": -21.76201057434082, "global_step": 102806, "epoch": 1238} {"train_loss": -22.07929229736328, "global_step": 102807, "epoch": 1238} {"train_loss": -22.165128707885742, "global_step": 102808, "epoch": 1238} {"train_loss": -22.05428123474121, "global_step": 102809, "epoch": 1238} {"train_loss": -22.27382469177246, "global_step": 102810, "epoch": 1238} {"train_loss": -22.542184829711914, "global_step": 102811, "epoch": 1238} {"train_loss": -22.237974166870117, "global_step": 102812, "epoch": 1238} {"train_loss": -21.797565460205078, "global_step": 102813, "epoch": 1238} {"train_loss": -21.77915382385254, "global_step": 102814, "epoch": 1238} {"train_loss": -22.215497970581055, "global_step": 102815, "epoch": 1238} {"train_loss": -21.5304012298584, "global_step": 102816, "epoch": 1238} {"train_loss": -22.143789291381836, "global_step": 102817, "epoch": 1238} {"train_loss": -21.773841857910156, "global_step": 102818, "epoch": 1238} {"train_loss": -22.16070556640625, "global_step": 102819, "epoch": 1238} {"train_loss": -22.123464584350586, "global_step": 102820, "epoch": 1238} {"train_loss": -22.04289436340332, "global_step": 102821, "epoch": 1238} {"train_loss": -22.114286422729492, "global_step": 102822, "epoch": 1238} {"train_loss": -21.837072372436523, "global_step": 102823, "epoch": 1238} {"train_loss": -22.266931533813477, "global_step": 102824, "epoch": 1238} {"train_loss": -22.129302978515625, "global_step": 102825, "epoch": 1238} {"train_loss": -22.194231033325195, "global_step": 102826, "epoch": 1238} {"train_loss": -22.264699935913086, "global_step": 102827, "epoch": 1238} {"train_loss": -22.542028427124023, "global_step": 102828, "epoch": 1238} {"train_loss": -21.691747665405273, "global_step": 102829, "epoch": 1238} {"train_loss": -21.83032989501953, "global_step": 102830, "epoch": 1238} {"train_loss": -21.9499454498291, "global_step": 102831, "epoch": 1238} {"train_loss": -22.136667251586914, "global_step": 102832, "epoch": 1238} {"train_loss": -22.156770706176758, "global_step": 102833, "epoch": 1238} {"train_loss": -22.517438888549805, "global_step": 102834, "epoch": 1238} {"train_loss": -21.958234786987305, "global_step": 102835, "epoch": 1238} {"train_loss": -21.8874718080084, "global_step": 102836, "epoch": 1238, "val_loss": 6156474.5} {"train_loss": -21.822998046875, "global_step": 102837, "epoch": 1239} {"train_loss": -21.702686309814453, "global_step": 102838, "epoch": 1239} {"train_loss": -21.579904556274414, "global_step": 102839, "epoch": 1239} {"train_loss": -21.533620834350586, "global_step": 102840, "epoch": 1239} {"train_loss": -21.947629928588867, "global_step": 102841, "epoch": 1239} {"train_loss": -21.422748565673828, "global_step": 102842, "epoch": 1239} {"train_loss": -21.675825119018555, "global_step": 102843, "epoch": 1239} {"train_loss": -22.1007022857666, "global_step": 102844, "epoch": 1239} {"train_loss": -21.58875846862793, "global_step": 102845, "epoch": 1239} {"train_loss": -21.467283248901367, "global_step": 102846, "epoch": 1239} {"train_loss": -21.605884552001953, "global_step": 102847, "epoch": 1239} {"train_loss": -21.818252563476562, "global_step": 102848, "epoch": 1239} {"train_loss": -21.722665786743164, "global_step": 102849, "epoch": 1239} {"train_loss": -22.05817985534668, "global_step": 102850, "epoch": 1239} {"train_loss": -22.10894775390625, "global_step": 102851, "epoch": 1239} {"train_loss": -21.735971450805664, "global_step": 102852, "epoch": 1239} {"train_loss": -21.918731689453125, "global_step": 102853, "epoch": 1239} {"train_loss": -22.2332820892334, "global_step": 102854, "epoch": 1239} {"train_loss": -22.275928497314453, "global_step": 102855, "epoch": 1239} {"train_loss": -21.476093292236328, "global_step": 102856, "epoch": 1239} {"train_loss": -21.9787540435791, "global_step": 102857, "epoch": 1239} {"train_loss": -22.032546997070312, "global_step": 102858, "epoch": 1239} {"train_loss": -21.869171142578125, "global_step": 102859, "epoch": 1239} {"train_loss": -22.077150344848633, "global_step": 102860, "epoch": 1239} {"train_loss": -21.770355224609375, "global_step": 102861, "epoch": 1239} {"train_loss": -22.239124298095703, "global_step": 102862, "epoch": 1239} {"train_loss": -21.699813842773438, "global_step": 102863, "epoch": 1239} {"train_loss": -22.21592140197754, "global_step": 102864, "epoch": 1239} {"train_loss": -22.117530822753906, "global_step": 102865, "epoch": 1239} {"train_loss": -22.090557098388672, "global_step": 102866, "epoch": 1239} {"train_loss": -21.888952255249023, "global_step": 102867, "epoch": 1239} {"train_loss": -22.033864974975586, "global_step": 102868, "epoch": 1239} {"train_loss": -22.081573486328125, "global_step": 102869, "epoch": 1239} {"train_loss": -22.09222412109375, "global_step": 102870, "epoch": 1239} {"train_loss": -21.872121810913086, "global_step": 102871, "epoch": 1239} {"train_loss": -22.035940170288086, "global_step": 102872, "epoch": 1239} {"train_loss": -22.5130615234375, "global_step": 102873, "epoch": 1239} {"train_loss": -21.973648071289062, "global_step": 102874, "epoch": 1239} {"train_loss": -21.9333553314209, "global_step": 102875, "epoch": 1239} {"train_loss": -22.079252243041992, "global_step": 102876, "epoch": 1239} {"train_loss": -21.995817184448242, "global_step": 102877, "epoch": 1239} {"train_loss": -22.021041870117188, "global_step": 102878, "epoch": 1239} {"train_loss": -21.923263549804688, "global_step": 102879, "epoch": 1239} {"train_loss": -22.30780601501465, "global_step": 102880, "epoch": 1239} {"train_loss": -21.97566795349121, "global_step": 102881, "epoch": 1239} {"train_loss": -22.08686637878418, "global_step": 102882, "epoch": 1239} {"train_loss": -22.221830368041992, "global_step": 102883, "epoch": 1239} {"train_loss": -21.954957962036133, "global_step": 102884, "epoch": 1239} {"train_loss": -22.111495971679688, "global_step": 102885, "epoch": 1239} {"train_loss": -21.99989891052246, "global_step": 102886, "epoch": 1239} {"train_loss": -21.692752838134766, "global_step": 102887, "epoch": 1239} {"train_loss": -21.78272819519043, "global_step": 102888, "epoch": 1239} {"train_loss": -22.00626564025879, "global_step": 102889, "epoch": 1239} {"train_loss": -21.9162654876709, "global_step": 102890, "epoch": 1239} {"train_loss": -22.2069034576416, "global_step": 102891, "epoch": 1239} {"train_loss": -22.208133697509766, "global_step": 102892, "epoch": 1239} {"train_loss": -22.02101707458496, "global_step": 102893, "epoch": 1239} {"train_loss": -22.043874740600586, "global_step": 102894, "epoch": 1239} {"train_loss": -22.156600952148438, "global_step": 102895, "epoch": 1239} {"train_loss": -22.070920944213867, "global_step": 102896, "epoch": 1239} {"train_loss": -22.173185348510742, "global_step": 102897, "epoch": 1239} {"train_loss": -22.05609130859375, "global_step": 102898, "epoch": 1239} {"train_loss": -22.293704986572266, "global_step": 102899, "epoch": 1239} {"train_loss": -22.10389518737793, "global_step": 102900, "epoch": 1239} {"train_loss": -22.237340927124023, "global_step": 102901, "epoch": 1239} {"train_loss": -22.272153854370117, "global_step": 102902, "epoch": 1239} {"train_loss": -21.89161491394043, "global_step": 102903, "epoch": 1239} {"train_loss": -22.19573974609375, "global_step": 102904, "epoch": 1239} {"train_loss": -21.9959659576416, "global_step": 102905, "epoch": 1239} {"train_loss": -22.318002700805664, "global_step": 102906, "epoch": 1239} {"train_loss": -22.02737808227539, "global_step": 102907, "epoch": 1239} {"train_loss": -22.087369918823242, "global_step": 102908, "epoch": 1239} {"train_loss": -22.230758666992188, "global_step": 102909, "epoch": 1239} {"train_loss": -22.43107032775879, "global_step": 102910, "epoch": 1239} {"train_loss": -22.106708526611328, "global_step": 102911, "epoch": 1239} {"train_loss": -22.207914352416992, "global_step": 102912, "epoch": 1239} {"train_loss": -22.37462043762207, "global_step": 102913, "epoch": 1239} {"train_loss": -22.214115142822266, "global_step": 102914, "epoch": 1239} {"train_loss": -22.185178756713867, "global_step": 102915, "epoch": 1239} {"train_loss": -22.132068634033203, "global_step": 102916, "epoch": 1239} {"train_loss": -21.774778366088867, "global_step": 102917, "epoch": 1239} {"train_loss": -22.273588180541992, "global_step": 102918, "epoch": 1239} {"train_loss": -22.00694116339626, "global_step": 102919, "epoch": 1239, "val_loss": 6078226.0} {"train_loss": -22.050861358642578, "global_step": 102920, "epoch": 1240} {"train_loss": -21.78072166442871, "global_step": 102921, "epoch": 1240} {"train_loss": -21.460866928100586, "global_step": 102922, "epoch": 1240} {"train_loss": -21.556516647338867, "global_step": 102923, "epoch": 1240} {"train_loss": -22.06264305114746, "global_step": 102924, "epoch": 1240} {"train_loss": -21.57480239868164, "global_step": 102925, "epoch": 1240} {"train_loss": -21.730236053466797, "global_step": 102926, "epoch": 1240} {"train_loss": -21.82491111755371, "global_step": 102927, "epoch": 1240} {"train_loss": -21.885778427124023, "global_step": 102928, "epoch": 1240} {"train_loss": -22.03232192993164, "global_step": 102929, "epoch": 1240} {"train_loss": -21.932828903198242, "global_step": 102930, "epoch": 1240} {"train_loss": -21.627166748046875, "global_step": 102931, "epoch": 1240} {"train_loss": -21.908432006835938, "global_step": 102932, "epoch": 1240} {"train_loss": -22.136274337768555, "global_step": 102933, "epoch": 1240} {"train_loss": -21.823501586914062, "global_step": 102934, "epoch": 1240} {"train_loss": -21.89033317565918, "global_step": 102935, "epoch": 1240} {"train_loss": -21.8978214263916, "global_step": 102936, "epoch": 1240} {"train_loss": -22.004974365234375, "global_step": 102937, "epoch": 1240} {"train_loss": -22.07132339477539, "global_step": 102938, "epoch": 1240} {"train_loss": -21.980497360229492, "global_step": 102939, "epoch": 1240} {"train_loss": -21.9639949798584, "global_step": 102940, "epoch": 1240} {"train_loss": -21.868356704711914, "global_step": 102941, "epoch": 1240} {"train_loss": -21.802724838256836, "global_step": 102942, "epoch": 1240} {"train_loss": -22.174781799316406, "global_step": 102943, "epoch": 1240} {"train_loss": -21.849740982055664, "global_step": 102944, "epoch": 1240} {"train_loss": -22.074129104614258, "global_step": 102945, "epoch": 1240} {"train_loss": -22.00030517578125, "global_step": 102946, "epoch": 1240} {"train_loss": -22.09058380126953, "global_step": 102947, "epoch": 1240} {"train_loss": -21.693206787109375, "global_step": 102948, "epoch": 1240} {"train_loss": -22.050752639770508, "global_step": 102949, "epoch": 1240} {"train_loss": -21.443370819091797, "global_step": 102950, "epoch": 1240} {"train_loss": -22.09937286376953, "global_step": 102951, "epoch": 1240} {"train_loss": -22.166223526000977, "global_step": 102952, "epoch": 1240} {"train_loss": -22.2235050201416, "global_step": 102953, "epoch": 1240} {"train_loss": -22.058683395385742, "global_step": 102954, "epoch": 1240} {"train_loss": -21.956830978393555, "global_step": 102955, "epoch": 1240} {"train_loss": -21.97835350036621, "global_step": 102956, "epoch": 1240} {"train_loss": -22.34738540649414, "global_step": 102957, "epoch": 1240} {"train_loss": -22.463153839111328, "global_step": 102958, "epoch": 1240} {"train_loss": -22.07449722290039, "global_step": 102959, "epoch": 1240} {"train_loss": -22.23960304260254, "global_step": 102960, "epoch": 1240} {"train_loss": -21.899362564086914, "global_step": 102961, "epoch": 1240} {"train_loss": -22.232324600219727, "global_step": 102962, "epoch": 1240} {"train_loss": -22.15924644470215, "global_step": 102963, "epoch": 1240} {"train_loss": -21.780332565307617, "global_step": 102964, "epoch": 1240} {"train_loss": -22.243738174438477, "global_step": 102965, "epoch": 1240} {"train_loss": -22.071212768554688, "global_step": 102966, "epoch": 1240} {"train_loss": -22.08247184753418, "global_step": 102967, "epoch": 1240} {"train_loss": -22.0688533782959, "global_step": 102968, "epoch": 1240} {"train_loss": -22.102569580078125, "global_step": 102969, "epoch": 1240} {"train_loss": -21.80949592590332, "global_step": 102970, "epoch": 1240} {"train_loss": -21.99265480041504, "global_step": 102971, "epoch": 1240} {"train_loss": -22.066858291625977, "global_step": 102972, "epoch": 1240} {"train_loss": -22.08328628540039, "global_step": 102973, "epoch": 1240} {"train_loss": -21.756393432617188, "global_step": 102974, "epoch": 1240} {"train_loss": -22.04069709777832, "global_step": 102975, "epoch": 1240} {"train_loss": -21.980403900146484, "global_step": 102976, "epoch": 1240} {"train_loss": -22.101858139038086, "global_step": 102977, "epoch": 1240} {"train_loss": -21.981794357299805, "global_step": 102978, "epoch": 1240} {"train_loss": -22.087202072143555, "global_step": 102979, "epoch": 1240} {"train_loss": -22.393779754638672, "global_step": 102980, "epoch": 1240} {"train_loss": -21.908071517944336, "global_step": 102981, "epoch": 1240} {"train_loss": -21.94187355041504, "global_step": 102982, "epoch": 1240} {"train_loss": -22.1925106048584, "global_step": 102983, "epoch": 1240} {"train_loss": -22.146215438842773, "global_step": 102984, "epoch": 1240} {"train_loss": -22.049976348876953, "global_step": 102985, "epoch": 1240} {"train_loss": -22.049131393432617, "global_step": 102986, "epoch": 1240} {"train_loss": -22.308164596557617, "global_step": 102987, "epoch": 1240} {"train_loss": -21.99115562438965, "global_step": 102988, "epoch": 1240} {"train_loss": -21.82887077331543, "global_step": 102989, "epoch": 1240} {"train_loss": -21.658109664916992, "global_step": 102990, "epoch": 1240} {"train_loss": -21.847614288330078, "global_step": 102991, "epoch": 1240} {"train_loss": -22.28424644470215, "global_step": 102992, "epoch": 1240} {"train_loss": -21.8577938079834, "global_step": 102993, "epoch": 1240} {"train_loss": -21.969446182250977, "global_step": 102994, "epoch": 1240} {"train_loss": -22.235036849975586, "global_step": 102995, "epoch": 1240} {"train_loss": -21.694599151611328, "global_step": 102996, "epoch": 1240} {"train_loss": -21.62849998474121, "global_step": 102997, "epoch": 1240} {"train_loss": -21.90220069885254, "global_step": 102998, "epoch": 1240} {"train_loss": -22.006105422973633, "global_step": 102999, "epoch": 1240} {"train_loss": -22.075170516967773, "global_step": 103000, "epoch": 1240} {"train_loss": -22.53700828552246, "global_step": 103001, "epoch": 1240} {"train_loss": -21.987499283020753, "global_step": 103002, "epoch": 1240, "val_loss": 6081826.5} {"train_loss": -21.606826782226562, "global_step": 103003, "epoch": 1241} {"train_loss": -22.16437339782715, "global_step": 103004, "epoch": 1241} {"train_loss": -22.0654354095459, "global_step": 103005, "epoch": 1241} {"train_loss": -21.446155548095703, "global_step": 103006, "epoch": 1241} {"train_loss": -22.156232833862305, "global_step": 103007, "epoch": 1241} {"train_loss": -21.892841339111328, "global_step": 103008, "epoch": 1241} {"train_loss": -21.82757568359375, "global_step": 103009, "epoch": 1241} {"train_loss": -21.667577743530273, "global_step": 103010, "epoch": 1241} {"train_loss": -22.11960792541504, "global_step": 103011, "epoch": 1241} {"train_loss": -21.95383644104004, "global_step": 103012, "epoch": 1241} {"train_loss": -22.09854507446289, "global_step": 103013, "epoch": 1241} {"train_loss": -21.866697311401367, "global_step": 103014, "epoch": 1241} {"train_loss": -22.0643253326416, "global_step": 103015, "epoch": 1241} {"train_loss": -22.26727294921875, "global_step": 103016, "epoch": 1241} {"train_loss": -21.83949851989746, "global_step": 103017, "epoch": 1241} {"train_loss": -22.106918334960938, "global_step": 103018, "epoch": 1241} {"train_loss": -21.862674713134766, "global_step": 103019, "epoch": 1241} {"train_loss": -21.94738006591797, "global_step": 103020, "epoch": 1241} {"train_loss": -22.033828735351562, "global_step": 103021, "epoch": 1241} {"train_loss": -21.67900848388672, "global_step": 103022, "epoch": 1241} {"train_loss": -22.114492416381836, "global_step": 103023, "epoch": 1241} {"train_loss": -21.989673614501953, "global_step": 103024, "epoch": 1241} {"train_loss": -22.291776657104492, "global_step": 103025, "epoch": 1241} {"train_loss": -22.044530868530273, "global_step": 103026, "epoch": 1241} {"train_loss": -22.150636672973633, "global_step": 103027, "epoch": 1241} {"train_loss": -22.081960678100586, "global_step": 103028, "epoch": 1241} {"train_loss": -22.200246810913086, "global_step": 103029, "epoch": 1241} {"train_loss": -21.887733459472656, "global_step": 103030, "epoch": 1241} {"train_loss": -22.355497360229492, "global_step": 103031, "epoch": 1241} {"train_loss": -22.341251373291016, "global_step": 103032, "epoch": 1241} {"train_loss": -22.11238670349121, "global_step": 103033, "epoch": 1241} {"train_loss": -21.853796005249023, "global_step": 103034, "epoch": 1241} {"train_loss": -21.91042137145996, "global_step": 103035, "epoch": 1241} {"train_loss": -22.331588745117188, "global_step": 103036, "epoch": 1241} {"train_loss": -21.801008224487305, "global_step": 103037, "epoch": 1241} {"train_loss": -22.220449447631836, "global_step": 103038, "epoch": 1241} {"train_loss": -22.209068298339844, "global_step": 103039, "epoch": 1241} {"train_loss": -22.01453399658203, "global_step": 103040, "epoch": 1241} {"train_loss": -22.12955665588379, "global_step": 103041, "epoch": 1241} {"train_loss": -21.667203903198242, "global_step": 103042, "epoch": 1241} {"train_loss": -22.276060104370117, "global_step": 103043, "epoch": 1241} {"train_loss": -21.97974967956543, "global_step": 103044, "epoch": 1241} {"train_loss": -22.127822875976562, "global_step": 103045, "epoch": 1241} {"train_loss": -22.05809783935547, "global_step": 103046, "epoch": 1241} {"train_loss": -22.135513305664062, "global_step": 103047, "epoch": 1241} {"train_loss": -22.332059860229492, "global_step": 103048, "epoch": 1241} {"train_loss": -21.85463523864746, "global_step": 103049, "epoch": 1241} {"train_loss": -21.885480880737305, "global_step": 103050, "epoch": 1241} {"train_loss": -21.86643409729004, "global_step": 103051, "epoch": 1241} {"train_loss": -21.464303970336914, "global_step": 103052, "epoch": 1241} {"train_loss": -21.79311752319336, "global_step": 103053, "epoch": 1241} {"train_loss": -21.90229034423828, "global_step": 103054, "epoch": 1241} {"train_loss": -21.534622192382812, "global_step": 103055, "epoch": 1241} {"train_loss": -21.6669921875, "global_step": 103056, "epoch": 1241} {"train_loss": -22.1689453125, "global_step": 103057, "epoch": 1241} {"train_loss": -22.357770919799805, "global_step": 103058, "epoch": 1241} {"train_loss": -22.154882431030273, "global_step": 103059, "epoch": 1241} {"train_loss": -21.845523834228516, "global_step": 103060, "epoch": 1241} {"train_loss": -21.90260124206543, "global_step": 103061, "epoch": 1241} {"train_loss": -22.3385066986084, "global_step": 103062, "epoch": 1241} {"train_loss": -22.084043502807617, "global_step": 103063, "epoch": 1241} {"train_loss": -21.791532516479492, "global_step": 103064, "epoch": 1241} {"train_loss": -22.13376808166504, "global_step": 103065, "epoch": 1241} {"train_loss": -22.008895874023438, "global_step": 103066, "epoch": 1241} {"train_loss": -21.79646873474121, "global_step": 103067, "epoch": 1241} {"train_loss": -22.155771255493164, "global_step": 103068, "epoch": 1241} {"train_loss": -21.956594467163086, "global_step": 103069, "epoch": 1241} {"train_loss": -21.983057022094727, "global_step": 103070, "epoch": 1241} {"train_loss": -22.265714645385742, "global_step": 103071, "epoch": 1241} {"train_loss": -22.103994369506836, "global_step": 103072, "epoch": 1241} {"train_loss": -21.98143196105957, "global_step": 103073, "epoch": 1241} {"train_loss": -22.247344970703125, "global_step": 103074, "epoch": 1241} {"train_loss": -21.711685180664062, "global_step": 103075, "epoch": 1241} {"train_loss": -21.96745491027832, "global_step": 103076, "epoch": 1241} {"train_loss": -22.137863159179688, "global_step": 103077, "epoch": 1241} {"train_loss": -22.519210815429688, "global_step": 103078, "epoch": 1241} {"train_loss": -22.062345504760742, "global_step": 103079, "epoch": 1241} {"train_loss": -22.195493698120117, "global_step": 103080, "epoch": 1241} {"train_loss": -22.21305274963379, "global_step": 103081, "epoch": 1241} {"train_loss": -21.922588348388672, "global_step": 103082, "epoch": 1241} {"train_loss": -21.843168258666992, "global_step": 103083, "epoch": 1241} {"train_loss": -21.92325782775879, "global_step": 103084, "epoch": 1241} {"train_loss": -22.025842023183063, "global_step": 103085, "epoch": 1241, "val_loss": 6123793.0} {"train_loss": -20.657638549804688, "global_step": 103086, "epoch": 1242} {"train_loss": -21.32370948791504, "global_step": 103087, "epoch": 1242} {"train_loss": -21.467056274414062, "global_step": 103088, "epoch": 1242} {"train_loss": -21.082242965698242, "global_step": 103089, "epoch": 1242} {"train_loss": -21.924985885620117, "global_step": 103090, "epoch": 1242} {"train_loss": -21.462814331054688, "global_step": 103091, "epoch": 1242} {"train_loss": -21.596433639526367, "global_step": 103092, "epoch": 1242} {"train_loss": -21.282041549682617, "global_step": 103093, "epoch": 1242} {"train_loss": -21.661741256713867, "global_step": 103094, "epoch": 1242} {"train_loss": -21.610960006713867, "global_step": 103095, "epoch": 1242} {"train_loss": -21.476835250854492, "global_step": 103096, "epoch": 1242} {"train_loss": -21.848907470703125, "global_step": 103097, "epoch": 1242} {"train_loss": -21.545495986938477, "global_step": 103098, "epoch": 1242} {"train_loss": -21.66351318359375, "global_step": 103099, "epoch": 1242} {"train_loss": -21.4406681060791, "global_step": 103100, "epoch": 1242} {"train_loss": -21.197420120239258, "global_step": 103101, "epoch": 1242} {"train_loss": -21.622900009155273, "global_step": 103102, "epoch": 1242} {"train_loss": -21.66175651550293, "global_step": 103103, "epoch": 1242} {"train_loss": -21.780319213867188, "global_step": 103104, "epoch": 1242} {"train_loss": -21.76190757751465, "global_step": 103105, "epoch": 1242} {"train_loss": -21.57658576965332, "global_step": 103106, "epoch": 1242} {"train_loss": -21.7330265045166, "global_step": 103107, "epoch": 1242} {"train_loss": -21.739484786987305, "global_step": 103108, "epoch": 1242} {"train_loss": -21.71019744873047, "global_step": 103109, "epoch": 1242} {"train_loss": -21.853424072265625, "global_step": 103110, "epoch": 1242} {"train_loss": -22.053264617919922, "global_step": 103111, "epoch": 1242} {"train_loss": -21.8427791595459, "global_step": 103112, "epoch": 1242} {"train_loss": -21.731956481933594, "global_step": 103113, "epoch": 1242} {"train_loss": -21.938322067260742, "global_step": 103114, "epoch": 1242} {"train_loss": -21.8166446685791, "global_step": 103115, "epoch": 1242} {"train_loss": -22.000757217407227, "global_step": 103116, "epoch": 1242} {"train_loss": -21.595321655273438, "global_step": 103117, "epoch": 1242} {"train_loss": -22.07144546508789, "global_step": 103118, "epoch": 1242} {"train_loss": -22.0307559967041, "global_step": 103119, "epoch": 1242} {"train_loss": -21.85445213317871, "global_step": 103120, "epoch": 1242} {"train_loss": -21.85658836364746, "global_step": 103121, "epoch": 1242} {"train_loss": -21.978776931762695, "global_step": 103122, "epoch": 1242} {"train_loss": -22.097036361694336, "global_step": 103123, "epoch": 1242} {"train_loss": -21.703645706176758, "global_step": 103124, "epoch": 1242} {"train_loss": -21.806264877319336, "global_step": 103125, "epoch": 1242} {"train_loss": -22.456005096435547, "global_step": 103126, "epoch": 1242} {"train_loss": -22.03370475769043, "global_step": 103127, "epoch": 1242} {"train_loss": -21.910627365112305, "global_step": 103128, "epoch": 1242} {"train_loss": -21.787647247314453, "global_step": 103129, "epoch": 1242} {"train_loss": -22.437402725219727, "global_step": 103130, "epoch": 1242} {"train_loss": -22.167236328125, "global_step": 103131, "epoch": 1242} {"train_loss": -22.31231689453125, "global_step": 103132, "epoch": 1242} {"train_loss": -21.88027000427246, "global_step": 103133, "epoch": 1242} {"train_loss": -22.080326080322266, "global_step": 103134, "epoch": 1242} {"train_loss": -22.03977394104004, "global_step": 103135, "epoch": 1242} {"train_loss": -22.059131622314453, "global_step": 103136, "epoch": 1242} {"train_loss": -22.216337203979492, "global_step": 103137, "epoch": 1242} {"train_loss": -22.416135787963867, "global_step": 103138, "epoch": 1242} {"train_loss": -22.033334732055664, "global_step": 103139, "epoch": 1242} {"train_loss": -22.31900978088379, "global_step": 103140, "epoch": 1242} {"train_loss": -22.010501861572266, "global_step": 103141, "epoch": 1242} {"train_loss": -22.166492462158203, "global_step": 103142, "epoch": 1242} {"train_loss": -22.03441619873047, "global_step": 103143, "epoch": 1242} {"train_loss": -22.203216552734375, "global_step": 103144, "epoch": 1242} {"train_loss": -22.52850341796875, "global_step": 103145, "epoch": 1242} {"train_loss": -22.10713005065918, "global_step": 103146, "epoch": 1242} {"train_loss": -21.784833908081055, "global_step": 103147, "epoch": 1242} {"train_loss": -21.70547866821289, "global_step": 103148, "epoch": 1242} {"train_loss": -22.122285842895508, "global_step": 103149, "epoch": 1242} {"train_loss": -22.391759872436523, "global_step": 103150, "epoch": 1242} {"train_loss": -21.931631088256836, "global_step": 103151, "epoch": 1242} {"train_loss": -22.01198387145996, "global_step": 103152, "epoch": 1242} {"train_loss": -21.860254287719727, "global_step": 103153, "epoch": 1242} {"train_loss": -22.036352157592773, "global_step": 103154, "epoch": 1242} {"train_loss": -22.192411422729492, "global_step": 103155, "epoch": 1242} {"train_loss": -21.833845138549805, "global_step": 103156, "epoch": 1242} {"train_loss": -21.885786056518555, "global_step": 103157, "epoch": 1242} {"train_loss": -21.977941513061523, "global_step": 103158, "epoch": 1242} {"train_loss": -22.0784912109375, "global_step": 103159, "epoch": 1242} {"train_loss": -21.860685348510742, "global_step": 103160, "epoch": 1242} {"train_loss": -21.946279525756836, "global_step": 103161, "epoch": 1242} {"train_loss": -21.77911376953125, "global_step": 103162, "epoch": 1242} {"train_loss": -21.775714874267578, "global_step": 103163, "epoch": 1242} {"train_loss": -22.045303344726562, "global_step": 103164, "epoch": 1242} {"train_loss": -22.3275203704834, "global_step": 103165, "epoch": 1242} {"train_loss": -22.23278045654297, "global_step": 103166, "epoch": 1242} {"train_loss": -22.276288986206055, "global_step": 103167, "epoch": 1242} {"train_loss": -21.89937669685088, "global_step": 103168, "epoch": 1242, "val_loss": 6091921.0} {"train_loss": -22.000553131103516, "global_step": 103169, "epoch": 1243} {"train_loss": -21.480756759643555, "global_step": 103170, "epoch": 1243} {"train_loss": -21.560077667236328, "global_step": 103171, "epoch": 1243} {"train_loss": -21.505836486816406, "global_step": 103172, "epoch": 1243} {"train_loss": -21.369020462036133, "global_step": 103173, "epoch": 1243} {"train_loss": -21.82026481628418, "global_step": 103174, "epoch": 1243} {"train_loss": -21.503808975219727, "global_step": 103175, "epoch": 1243} {"train_loss": -22.132963180541992, "global_step": 103176, "epoch": 1243} {"train_loss": -21.975311279296875, "global_step": 103177, "epoch": 1243} {"train_loss": -21.524627685546875, "global_step": 103178, "epoch": 1243} {"train_loss": -21.725011825561523, "global_step": 103179, "epoch": 1243} {"train_loss": -21.72420310974121, "global_step": 103180, "epoch": 1243} {"train_loss": -21.81329917907715, "global_step": 103181, "epoch": 1243} {"train_loss": -22.035375595092773, "global_step": 103182, "epoch": 1243} {"train_loss": -21.60382652282715, "global_step": 103183, "epoch": 1243} {"train_loss": -22.087263107299805, "global_step": 103184, "epoch": 1243} {"train_loss": -21.96143341064453, "global_step": 103185, "epoch": 1243} {"train_loss": -21.843826293945312, "global_step": 103186, "epoch": 1243} {"train_loss": -21.63626480102539, "global_step": 103187, "epoch": 1243} {"train_loss": -22.048355102539062, "global_step": 103188, "epoch": 1243} {"train_loss": -21.940673828125, "global_step": 103189, "epoch": 1243} {"train_loss": -21.652511596679688, "global_step": 103190, "epoch": 1243} {"train_loss": -21.907155990600586, "global_step": 103191, "epoch": 1243} {"train_loss": -22.4583740234375, "global_step": 103192, "epoch": 1243} {"train_loss": -21.986555099487305, "global_step": 103193, "epoch": 1243} {"train_loss": -22.12493896484375, "global_step": 103194, "epoch": 1243} {"train_loss": -21.931320190429688, "global_step": 103195, "epoch": 1243} {"train_loss": -21.937162399291992, "global_step": 103196, "epoch": 1243} {"train_loss": -22.0986385345459, "global_step": 103197, "epoch": 1243} {"train_loss": -21.639806747436523, "global_step": 103198, "epoch": 1243} {"train_loss": -22.036991119384766, "global_step": 103199, "epoch": 1243} {"train_loss": -22.1569766998291, "global_step": 103200, "epoch": 1243} {"train_loss": -21.837976455688477, "global_step": 103201, "epoch": 1243} {"train_loss": -22.28334617614746, "global_step": 103202, "epoch": 1243} {"train_loss": -22.0792293548584, "global_step": 103203, "epoch": 1243} {"train_loss": -22.041467666625977, "global_step": 103204, "epoch": 1243} {"train_loss": -21.73090171813965, "global_step": 103205, "epoch": 1243} {"train_loss": -21.820419311523438, "global_step": 103206, "epoch": 1243} {"train_loss": -21.858844757080078, "global_step": 103207, "epoch": 1243} {"train_loss": -22.31024742126465, "global_step": 103208, "epoch": 1243} {"train_loss": -22.306886672973633, "global_step": 103209, "epoch": 1243} {"train_loss": -22.26080322265625, "global_step": 103210, "epoch": 1243} {"train_loss": -21.79117774963379, "global_step": 103211, "epoch": 1243} {"train_loss": -21.91737174987793, "global_step": 103212, "epoch": 1243} {"train_loss": -21.84450340270996, "global_step": 103213, "epoch": 1243} {"train_loss": -21.824918746948242, "global_step": 103214, "epoch": 1243} {"train_loss": -22.32450294494629, "global_step": 103215, "epoch": 1243} {"train_loss": -21.981786727905273, "global_step": 103216, "epoch": 1243} {"train_loss": -22.19557762145996, "global_step": 103217, "epoch": 1243} {"train_loss": -22.417926788330078, "global_step": 103218, "epoch": 1243} {"train_loss": -22.193540573120117, "global_step": 103219, "epoch": 1243} {"train_loss": -22.00006103515625, "global_step": 103220, "epoch": 1243} {"train_loss": -21.998950958251953, "global_step": 103221, "epoch": 1243} {"train_loss": -22.140499114990234, "global_step": 103222, "epoch": 1243} {"train_loss": -22.495304107666016, "global_step": 103223, "epoch": 1243} {"train_loss": -22.108535766601562, "global_step": 103224, "epoch": 1243} {"train_loss": -21.900545120239258, "global_step": 103225, "epoch": 1243} {"train_loss": -21.793357849121094, "global_step": 103226, "epoch": 1243} {"train_loss": -21.90297508239746, "global_step": 103227, "epoch": 1243} {"train_loss": -22.390689849853516, "global_step": 103228, "epoch": 1243} {"train_loss": -22.131547927856445, "global_step": 103229, "epoch": 1243} {"train_loss": -22.2271785736084, "global_step": 103230, "epoch": 1243} {"train_loss": -21.907167434692383, "global_step": 103231, "epoch": 1243} {"train_loss": -22.102903366088867, "global_step": 103232, "epoch": 1243} {"train_loss": -21.89608383178711, "global_step": 103233, "epoch": 1243} {"train_loss": -22.07204246520996, "global_step": 103234, "epoch": 1243} {"train_loss": -21.697782516479492, "global_step": 103235, "epoch": 1243} {"train_loss": -22.234342575073242, "global_step": 103236, "epoch": 1243} {"train_loss": -22.118640899658203, "global_step": 103237, "epoch": 1243} {"train_loss": -21.952407836914062, "global_step": 103238, "epoch": 1243} {"train_loss": -21.779956817626953, "global_step": 103239, "epoch": 1243} {"train_loss": -22.12133026123047, "global_step": 103240, "epoch": 1243} {"train_loss": -21.95233154296875, "global_step": 103241, "epoch": 1243} {"train_loss": -22.189401626586914, "global_step": 103242, "epoch": 1243} {"train_loss": -22.137134552001953, "global_step": 103243, "epoch": 1243} {"train_loss": -22.408369064331055, "global_step": 103244, "epoch": 1243} {"train_loss": -21.905393600463867, "global_step": 103245, "epoch": 1243} {"train_loss": -21.980823516845703, "global_step": 103246, "epoch": 1243} {"train_loss": -22.086715698242188, "global_step": 103247, "epoch": 1243} {"train_loss": -22.34922981262207, "global_step": 103248, "epoch": 1243} {"train_loss": -22.017772674560547, "global_step": 103249, "epoch": 1243} {"train_loss": -22.10738182067871, "global_step": 103250, "epoch": 1243} {"train_loss": -21.983161282826618, "global_step": 103251, "epoch": 1243, "val_loss": 6127950.0} {"train_loss": -21.75372886657715, "global_step": 103252, "epoch": 1244} {"train_loss": -21.90040397644043, "global_step": 103253, "epoch": 1244} {"train_loss": -21.3699951171875, "global_step": 103254, "epoch": 1244} {"train_loss": -21.314966201782227, "global_step": 103255, "epoch": 1244} {"train_loss": -21.81165885925293, "global_step": 103256, "epoch": 1244} {"train_loss": -21.73801612854004, "global_step": 103257, "epoch": 1244} {"train_loss": -21.949419021606445, "global_step": 103258, "epoch": 1244} {"train_loss": -21.67659568786621, "global_step": 103259, "epoch": 1244} {"train_loss": -21.827163696289062, "global_step": 103260, "epoch": 1244} {"train_loss": -21.509140014648438, "global_step": 103261, "epoch": 1244} {"train_loss": -22.231021881103516, "global_step": 103262, "epoch": 1244} {"train_loss": -21.75077247619629, "global_step": 103263, "epoch": 1244} {"train_loss": -22.015626907348633, "global_step": 103264, "epoch": 1244} {"train_loss": -21.970523834228516, "global_step": 103265, "epoch": 1244} {"train_loss": -21.87423324584961, "global_step": 103266, "epoch": 1244} {"train_loss": -21.92128562927246, "global_step": 103267, "epoch": 1244} {"train_loss": -22.06058692932129, "global_step": 103268, "epoch": 1244} {"train_loss": -22.049453735351562, "global_step": 103269, "epoch": 1244} {"train_loss": -21.995746612548828, "global_step": 103270, "epoch": 1244} {"train_loss": -21.86128807067871, "global_step": 103271, "epoch": 1244} {"train_loss": -21.914161682128906, "global_step": 103272, "epoch": 1244} {"train_loss": -21.63165283203125, "global_step": 103273, "epoch": 1244} {"train_loss": -21.694875717163086, "global_step": 103274, "epoch": 1244} {"train_loss": -22.10253143310547, "global_step": 103275, "epoch": 1244} {"train_loss": -21.6350040435791, "global_step": 103276, "epoch": 1244} {"train_loss": -22.086652755737305, "global_step": 103277, "epoch": 1244} {"train_loss": -21.766220092773438, "global_step": 103278, "epoch": 1244} {"train_loss": -22.15481185913086, "global_step": 103279, "epoch": 1244} {"train_loss": -21.606948852539062, "global_step": 103280, "epoch": 1244} {"train_loss": -21.917837142944336, "global_step": 103281, "epoch": 1244} {"train_loss": -22.323152542114258, "global_step": 103282, "epoch": 1244} {"train_loss": -21.996679306030273, "global_step": 103283, "epoch": 1244} {"train_loss": -22.102725982666016, "global_step": 103284, "epoch": 1244} {"train_loss": -22.325231552124023, "global_step": 103285, "epoch": 1244} {"train_loss": -21.92532730102539, "global_step": 103286, "epoch": 1244} {"train_loss": -22.17005729675293, "global_step": 103287, "epoch": 1244} {"train_loss": -22.231964111328125, "global_step": 103288, "epoch": 1244} {"train_loss": -22.048748016357422, "global_step": 103289, "epoch": 1244} {"train_loss": -22.19732093811035, "global_step": 103290, "epoch": 1244} {"train_loss": -22.009891510009766, "global_step": 103291, "epoch": 1244} {"train_loss": -21.68252182006836, "global_step": 103292, "epoch": 1244} {"train_loss": -22.162647247314453, "global_step": 103293, "epoch": 1244} {"train_loss": -22.05889892578125, "global_step": 103294, "epoch": 1244} {"train_loss": -22.24420166015625, "global_step": 103295, "epoch": 1244} {"train_loss": -21.868799209594727, "global_step": 103296, "epoch": 1244} {"train_loss": -22.246633529663086, "global_step": 103297, "epoch": 1244} {"train_loss": -21.892738342285156, "global_step": 103298, "epoch": 1244} {"train_loss": -21.756196975708008, "global_step": 103299, "epoch": 1244} {"train_loss": -22.0743465423584, "global_step": 103300, "epoch": 1244} {"train_loss": -22.09124183654785, "global_step": 103301, "epoch": 1244} {"train_loss": -22.19990348815918, "global_step": 103302, "epoch": 1244} {"train_loss": -22.137866973876953, "global_step": 103303, "epoch": 1244} {"train_loss": -21.665660858154297, "global_step": 103304, "epoch": 1244} {"train_loss": -22.225522994995117, "global_step": 103305, "epoch": 1244} {"train_loss": -22.01494026184082, "global_step": 103306, "epoch": 1244} {"train_loss": -22.355640411376953, "global_step": 103307, "epoch": 1244} {"train_loss": -22.072900772094727, "global_step": 103308, "epoch": 1244} {"train_loss": -22.23797035217285, "global_step": 103309, "epoch": 1244} {"train_loss": -22.484012603759766, "global_step": 103310, "epoch": 1244} {"train_loss": -21.99245262145996, "global_step": 103311, "epoch": 1244} {"train_loss": -21.647907257080078, "global_step": 103312, "epoch": 1244} {"train_loss": -21.793142318725586, "global_step": 103313, "epoch": 1244} {"train_loss": -21.82889175415039, "global_step": 103314, "epoch": 1244} {"train_loss": -22.171955108642578, "global_step": 103315, "epoch": 1244} {"train_loss": -22.070344924926758, "global_step": 103316, "epoch": 1244} {"train_loss": -22.060073852539062, "global_step": 103317, "epoch": 1244} {"train_loss": -21.85872459411621, "global_step": 103318, "epoch": 1244} {"train_loss": -22.261693954467773, "global_step": 103319, "epoch": 1244} {"train_loss": -21.983083724975586, "global_step": 103320, "epoch": 1244} {"train_loss": -22.252344131469727, "global_step": 103321, "epoch": 1244} {"train_loss": -22.206266403198242, "global_step": 103322, "epoch": 1244} {"train_loss": -21.834436416625977, "global_step": 103323, "epoch": 1244} {"train_loss": -21.96933364868164, "global_step": 103324, "epoch": 1244} {"train_loss": -21.98691177368164, "global_step": 103325, "epoch": 1244} {"train_loss": -21.856914520263672, "global_step": 103326, "epoch": 1244} {"train_loss": -21.700397491455078, "global_step": 103327, "epoch": 1244} {"train_loss": -21.775793075561523, "global_step": 103328, "epoch": 1244} {"train_loss": -21.873403549194336, "global_step": 103329, "epoch": 1244} {"train_loss": -22.20327377319336, "global_step": 103330, "epoch": 1244} {"train_loss": -21.891630172729492, "global_step": 103331, "epoch": 1244} {"train_loss": -22.166532516479492, "global_step": 103332, "epoch": 1244} {"train_loss": -21.914993286132812, "global_step": 103333, "epoch": 1244} {"train_loss": -21.967973548245716, "global_step": 103334, "epoch": 1244, "val_loss": 6155042.0} {"train_loss": -21.644428253173828, "global_step": 103335, "epoch": 1245} {"train_loss": -21.638357162475586, "global_step": 103336, "epoch": 1245} {"train_loss": -21.867908477783203, "global_step": 103337, "epoch": 1245} {"train_loss": -21.81817626953125, "global_step": 103338, "epoch": 1245} {"train_loss": -21.84681510925293, "global_step": 103339, "epoch": 1245} {"train_loss": -21.9691104888916, "global_step": 103340, "epoch": 1245} {"train_loss": -21.870092391967773, "global_step": 103341, "epoch": 1245} {"train_loss": -21.766393661499023, "global_step": 103342, "epoch": 1245} {"train_loss": -22.07032585144043, "global_step": 103343, "epoch": 1245} {"train_loss": -21.488218307495117, "global_step": 103344, "epoch": 1245} {"train_loss": -21.82418441772461, "global_step": 103345, "epoch": 1245} {"train_loss": -21.889442443847656, "global_step": 103346, "epoch": 1245} {"train_loss": -21.93182373046875, "global_step": 103347, "epoch": 1245} {"train_loss": -22.002058029174805, "global_step": 103348, "epoch": 1245} {"train_loss": -22.02170181274414, "global_step": 103349, "epoch": 1245} {"train_loss": -21.693368911743164, "global_step": 103350, "epoch": 1245} {"train_loss": -22.132450103759766, "global_step": 103351, "epoch": 1245} {"train_loss": -22.03424072265625, "global_step": 103352, "epoch": 1245} {"train_loss": -21.475751876831055, "global_step": 103353, "epoch": 1245} {"train_loss": -22.176740646362305, "global_step": 103354, "epoch": 1245} {"train_loss": -22.277877807617188, "global_step": 103355, "epoch": 1245} {"train_loss": -22.178739547729492, "global_step": 103356, "epoch": 1245} {"train_loss": -22.16031837463379, "global_step": 103357, "epoch": 1245} {"train_loss": -22.021268844604492, "global_step": 103358, "epoch": 1245} {"train_loss": -22.525493621826172, "global_step": 103359, "epoch": 1245} {"train_loss": -22.066328048706055, "global_step": 103360, "epoch": 1245} {"train_loss": -21.874181747436523, "global_step": 103361, "epoch": 1245} {"train_loss": -21.93793296813965, "global_step": 103362, "epoch": 1245} {"train_loss": -22.162200927734375, "global_step": 103363, "epoch": 1245} {"train_loss": -22.060508728027344, "global_step": 103364, "epoch": 1245} {"train_loss": -22.124481201171875, "global_step": 103365, "epoch": 1245} {"train_loss": -22.39699363708496, "global_step": 103366, "epoch": 1245} {"train_loss": -21.9887752532959, "global_step": 103367, "epoch": 1245} {"train_loss": -21.722190856933594, "global_step": 103368, "epoch": 1245} {"train_loss": -22.423492431640625, "global_step": 103369, "epoch": 1245} {"train_loss": -22.155899047851562, "global_step": 103370, "epoch": 1245} {"train_loss": -22.420040130615234, "global_step": 103371, "epoch": 1245} {"train_loss": -22.041797637939453, "global_step": 103372, "epoch": 1245} {"train_loss": -22.245351791381836, "global_step": 103373, "epoch": 1245} {"train_loss": -22.429569244384766, "global_step": 103374, "epoch": 1245} {"train_loss": -22.229284286499023, "global_step": 103375, "epoch": 1245} {"train_loss": -22.187101364135742, "global_step": 103376, "epoch": 1245} {"train_loss": -22.124998092651367, "global_step": 103377, "epoch": 1245} {"train_loss": -21.97479820251465, "global_step": 103378, "epoch": 1245} {"train_loss": -21.941848754882812, "global_step": 103379, "epoch": 1245} {"train_loss": -22.432432174682617, "global_step": 103380, "epoch": 1245} {"train_loss": -21.817516326904297, "global_step": 103381, "epoch": 1245} {"train_loss": -21.99803352355957, "global_step": 103382, "epoch": 1245} {"train_loss": -22.38263511657715, "global_step": 103383, "epoch": 1245} {"train_loss": -21.95271110534668, "global_step": 103384, "epoch": 1245} {"train_loss": -21.633853912353516, "global_step": 103385, "epoch": 1245} {"train_loss": -22.339216232299805, "global_step": 103386, "epoch": 1245} {"train_loss": -22.06434440612793, "global_step": 103387, "epoch": 1245} {"train_loss": -21.975576400756836, "global_step": 103388, "epoch": 1245} {"train_loss": -22.17486572265625, "global_step": 103389, "epoch": 1245} {"train_loss": -22.220157623291016, "global_step": 103390, "epoch": 1245} {"train_loss": -22.048954010009766, "global_step": 103391, "epoch": 1245} {"train_loss": -21.934452056884766, "global_step": 103392, "epoch": 1245} {"train_loss": -22.286848068237305, "global_step": 103393, "epoch": 1245} {"train_loss": -21.753332138061523, "global_step": 103394, "epoch": 1245} {"train_loss": -21.276880264282227, "global_step": 103395, "epoch": 1245} {"train_loss": -21.710477828979492, "global_step": 103396, "epoch": 1245} {"train_loss": -22.191165924072266, "global_step": 103397, "epoch": 1245} {"train_loss": -21.687047958374023, "global_step": 103398, "epoch": 1245} {"train_loss": -21.86789894104004, "global_step": 103399, "epoch": 1245} {"train_loss": -21.99220848083496, "global_step": 103400, "epoch": 1245} {"train_loss": -22.132822036743164, "global_step": 103401, "epoch": 1245} {"train_loss": -21.610715866088867, "global_step": 103402, "epoch": 1245} {"train_loss": -21.60109519958496, "global_step": 103403, "epoch": 1245} {"train_loss": -21.7437686920166, "global_step": 103404, "epoch": 1245} {"train_loss": -22.077590942382812, "global_step": 103405, "epoch": 1245} {"train_loss": -22.54952621459961, "global_step": 103406, "epoch": 1245} {"train_loss": -21.892929077148438, "global_step": 103407, "epoch": 1245} {"train_loss": -22.312116622924805, "global_step": 103408, "epoch": 1245} {"train_loss": -21.810068130493164, "global_step": 103409, "epoch": 1245} {"train_loss": -21.7384090423584, "global_step": 103410, "epoch": 1245} {"train_loss": -21.56325340270996, "global_step": 103411, "epoch": 1245} {"train_loss": -21.596296310424805, "global_step": 103412, "epoch": 1245} {"train_loss": -21.849538803100586, "global_step": 103413, "epoch": 1245} {"train_loss": -21.655277252197266, "global_step": 103414, "epoch": 1245} {"train_loss": -22.026853561401367, "global_step": 103415, "epoch": 1245} {"train_loss": -21.963964462280273, "global_step": 103416, "epoch": 1245} {"train_loss": -21.95577129685735, "global_step": 103417, "epoch": 1245, "val_loss": 6223921.0} {"train_loss": -21.51416015625, "global_step": 103418, "epoch": 1246} {"train_loss": -21.259023666381836, "global_step": 103419, "epoch": 1246} {"train_loss": -21.763736724853516, "global_step": 103420, "epoch": 1246} {"train_loss": -21.87156105041504, "global_step": 103421, "epoch": 1246} {"train_loss": -21.92230796813965, "global_step": 103422, "epoch": 1246} {"train_loss": -21.7138614654541, "global_step": 103423, "epoch": 1246} {"train_loss": -21.662944793701172, "global_step": 103424, "epoch": 1246} {"train_loss": -21.691787719726562, "global_step": 103425, "epoch": 1246} {"train_loss": -21.8941650390625, "global_step": 103426, "epoch": 1246} {"train_loss": -21.764997482299805, "global_step": 103427, "epoch": 1246} {"train_loss": -22.133974075317383, "global_step": 103428, "epoch": 1246} {"train_loss": -21.864166259765625, "global_step": 103429, "epoch": 1246} {"train_loss": -21.91036033630371, "global_step": 103430, "epoch": 1246} {"train_loss": -21.62721824645996, "global_step": 103431, "epoch": 1246} {"train_loss": -21.722009658813477, "global_step": 103432, "epoch": 1246} {"train_loss": -22.230466842651367, "global_step": 103433, "epoch": 1246} {"train_loss": -21.92253875732422, "global_step": 103434, "epoch": 1246} {"train_loss": -22.3445987701416, "global_step": 103435, "epoch": 1246} {"train_loss": -21.961156845092773, "global_step": 103436, "epoch": 1246} {"train_loss": -22.063661575317383, "global_step": 103437, "epoch": 1246} {"train_loss": -21.796955108642578, "global_step": 103438, "epoch": 1246} {"train_loss": -22.463998794555664, "global_step": 103439, "epoch": 1246} {"train_loss": -22.064300537109375, "global_step": 103440, "epoch": 1246} {"train_loss": -21.839765548706055, "global_step": 103441, "epoch": 1246} {"train_loss": -22.021263122558594, "global_step": 103442, "epoch": 1246} {"train_loss": -22.272403717041016, "global_step": 103443, "epoch": 1246} {"train_loss": -21.92806053161621, "global_step": 103444, "epoch": 1246} {"train_loss": -22.02113151550293, "global_step": 103445, "epoch": 1246} {"train_loss": -22.131938934326172, "global_step": 103446, "epoch": 1246} {"train_loss": -22.2457332611084, "global_step": 103447, "epoch": 1246} {"train_loss": -22.218164443969727, "global_step": 103448, "epoch": 1246} {"train_loss": -21.905393600463867, "global_step": 103449, "epoch": 1246} {"train_loss": -21.98853874206543, "global_step": 103450, "epoch": 1246} {"train_loss": -22.07331657409668, "global_step": 103451, "epoch": 1246} {"train_loss": -22.16375160217285, "global_step": 103452, "epoch": 1246} {"train_loss": -22.004592895507812, "global_step": 103453, "epoch": 1246} {"train_loss": -22.07423973083496, "global_step": 103454, "epoch": 1246} {"train_loss": -22.113584518432617, "global_step": 103455, "epoch": 1246} {"train_loss": -21.83921241760254, "global_step": 103456, "epoch": 1246} {"train_loss": -21.91664695739746, "global_step": 103457, "epoch": 1246} {"train_loss": -22.172861099243164, "global_step": 103458, "epoch": 1246} {"train_loss": -22.267690658569336, "global_step": 103459, "epoch": 1246} {"train_loss": -22.149396896362305, "global_step": 103460, "epoch": 1246} {"train_loss": -21.936878204345703, "global_step": 103461, "epoch": 1246} {"train_loss": -21.892484664916992, "global_step": 103462, "epoch": 1246} {"train_loss": -22.32693862915039, "global_step": 103463, "epoch": 1246} {"train_loss": -22.091251373291016, "global_step": 103464, "epoch": 1246} {"train_loss": -21.944751739501953, "global_step": 103465, "epoch": 1246} {"train_loss": -22.07784080505371, "global_step": 103466, "epoch": 1246} {"train_loss": -21.851945877075195, "global_step": 103467, "epoch": 1246} {"train_loss": -21.716169357299805, "global_step": 103468, "epoch": 1246} {"train_loss": -22.10690689086914, "global_step": 103469, "epoch": 1246} {"train_loss": -21.844806671142578, "global_step": 103470, "epoch": 1246} {"train_loss": -21.99839210510254, "global_step": 103471, "epoch": 1246} {"train_loss": -21.976598739624023, "global_step": 103472, "epoch": 1246} {"train_loss": -22.26222038269043, "global_step": 103473, "epoch": 1246} {"train_loss": -22.288501739501953, "global_step": 103474, "epoch": 1246} {"train_loss": -21.5960750579834, "global_step": 103475, "epoch": 1246} {"train_loss": -22.301727294921875, "global_step": 103476, "epoch": 1246} {"train_loss": -22.233272552490234, "global_step": 103477, "epoch": 1246} {"train_loss": -21.999258041381836, "global_step": 103478, "epoch": 1246} {"train_loss": -22.142637252807617, "global_step": 103479, "epoch": 1246} {"train_loss": -21.934816360473633, "global_step": 103480, "epoch": 1246} {"train_loss": -22.03182601928711, "global_step": 103481, "epoch": 1246} {"train_loss": -21.95453453063965, "global_step": 103482, "epoch": 1246} {"train_loss": -22.063695907592773, "global_step": 103483, "epoch": 1246} {"train_loss": -21.75728416442871, "global_step": 103484, "epoch": 1246} {"train_loss": -22.047224044799805, "global_step": 103485, "epoch": 1246} {"train_loss": -22.415267944335938, "global_step": 103486, "epoch": 1246} {"train_loss": -22.10835075378418, "global_step": 103487, "epoch": 1246} {"train_loss": -22.448596954345703, "global_step": 103488, "epoch": 1246} {"train_loss": -22.05013084411621, "global_step": 103489, "epoch": 1246} {"train_loss": -21.820316314697266, "global_step": 103490, "epoch": 1246} {"train_loss": -21.999025344848633, "global_step": 103491, "epoch": 1246} {"train_loss": -22.14581298828125, "global_step": 103492, "epoch": 1246} {"train_loss": -21.69937515258789, "global_step": 103493, "epoch": 1246} {"train_loss": -22.218664169311523, "global_step": 103494, "epoch": 1246} {"train_loss": -21.924238204956055, "global_step": 103495, "epoch": 1246} {"train_loss": -22.18963623046875, "global_step": 103496, "epoch": 1246} {"train_loss": -21.942724227905273, "global_step": 103497, "epoch": 1246} {"train_loss": -22.119220733642578, "global_step": 103498, "epoch": 1246} {"train_loss": -21.533334732055664, "global_step": 103499, "epoch": 1246} {"train_loss": -21.98518410648208, "global_step": 103500, "epoch": 1246, "val_loss": 5979859.5} {"train_loss": -21.642332077026367, "global_step": 103501, "epoch": 1247} {"train_loss": -21.80453872680664, "global_step": 103502, "epoch": 1247} {"train_loss": -22.050601959228516, "global_step": 103503, "epoch": 1247} {"train_loss": -21.673593521118164, "global_step": 103504, "epoch": 1247} {"train_loss": -21.62324333190918, "global_step": 103505, "epoch": 1247} {"train_loss": -21.492877960205078, "global_step": 103506, "epoch": 1247} {"train_loss": -21.580190658569336, "global_step": 103507, "epoch": 1247} {"train_loss": -21.876461029052734, "global_step": 103508, "epoch": 1247} {"train_loss": -21.424602508544922, "global_step": 103509, "epoch": 1247} {"train_loss": -21.88993263244629, "global_step": 103510, "epoch": 1247} {"train_loss": -22.04227638244629, "global_step": 103511, "epoch": 1247} {"train_loss": -21.777935028076172, "global_step": 103512, "epoch": 1247} {"train_loss": -22.063438415527344, "global_step": 103513, "epoch": 1247} {"train_loss": -21.657962799072266, "global_step": 103514, "epoch": 1247} {"train_loss": -21.887847900390625, "global_step": 103515, "epoch": 1247} {"train_loss": -21.951881408691406, "global_step": 103516, "epoch": 1247} {"train_loss": -22.21686363220215, "global_step": 103517, "epoch": 1247} {"train_loss": -21.901588439941406, "global_step": 103518, "epoch": 1247} {"train_loss": -21.843875885009766, "global_step": 103519, "epoch": 1247} {"train_loss": -21.972036361694336, "global_step": 103520, "epoch": 1247} {"train_loss": -22.02330207824707, "global_step": 103521, "epoch": 1247} {"train_loss": -22.47193145751953, "global_step": 103522, "epoch": 1247} {"train_loss": -22.028934478759766, "global_step": 103523, "epoch": 1247} {"train_loss": -22.04482078552246, "global_step": 103524, "epoch": 1247} {"train_loss": -21.599342346191406, "global_step": 103525, "epoch": 1247} {"train_loss": -22.245847702026367, "global_step": 103526, "epoch": 1247} {"train_loss": -22.012577056884766, "global_step": 103527, "epoch": 1247} {"train_loss": -22.103891372680664, "global_step": 103528, "epoch": 1247} {"train_loss": -22.1048583984375, "global_step": 103529, "epoch": 1247} {"train_loss": -21.928903579711914, "global_step": 103530, "epoch": 1247} {"train_loss": -22.30901336669922, "global_step": 103531, "epoch": 1247} {"train_loss": -21.786609649658203, "global_step": 103532, "epoch": 1247} {"train_loss": -22.146472930908203, "global_step": 103533, "epoch": 1247} {"train_loss": -21.885610580444336, "global_step": 103534, "epoch": 1247} {"train_loss": -22.197988510131836, "global_step": 103535, "epoch": 1247} {"train_loss": -22.083776473999023, "global_step": 103536, "epoch": 1247} {"train_loss": -22.087583541870117, "global_step": 103537, "epoch": 1247} {"train_loss": -22.23872184753418, "global_step": 103538, "epoch": 1247} {"train_loss": -22.2241153717041, "global_step": 103539, "epoch": 1247} {"train_loss": -22.046308517456055, "global_step": 103540, "epoch": 1247} {"train_loss": -22.236059188842773, "global_step": 103541, "epoch": 1247} {"train_loss": -22.074634552001953, "global_step": 103542, "epoch": 1247} {"train_loss": -22.353971481323242, "global_step": 103543, "epoch": 1247} {"train_loss": -21.805526733398438, "global_step": 103544, "epoch": 1247} {"train_loss": -22.269357681274414, "global_step": 103545, "epoch": 1247} {"train_loss": -22.618444442749023, "global_step": 103546, "epoch": 1247} {"train_loss": -22.059680938720703, "global_step": 103547, "epoch": 1247} {"train_loss": -21.94474220275879, "global_step": 103548, "epoch": 1247} {"train_loss": -21.712940216064453, "global_step": 103549, "epoch": 1247} {"train_loss": -21.880523681640625, "global_step": 103550, "epoch": 1247} {"train_loss": -21.743207931518555, "global_step": 103551, "epoch": 1247} {"train_loss": -21.921348571777344, "global_step": 103552, "epoch": 1247} {"train_loss": -21.953840255737305, "global_step": 103553, "epoch": 1247} {"train_loss": -22.128507614135742, "global_step": 103554, "epoch": 1247} {"train_loss": -22.409997940063477, "global_step": 103555, "epoch": 1247} {"train_loss": -22.141271591186523, "global_step": 103556, "epoch": 1247} {"train_loss": -22.013710021972656, "global_step": 103557, "epoch": 1247} {"train_loss": -22.18007469177246, "global_step": 103558, "epoch": 1247} {"train_loss": -22.25763511657715, "global_step": 103559, "epoch": 1247} {"train_loss": -22.057226181030273, "global_step": 103560, "epoch": 1247} {"train_loss": -22.200639724731445, "global_step": 103561, "epoch": 1247} {"train_loss": -21.90484619140625, "global_step": 103562, "epoch": 1247} {"train_loss": -22.173959732055664, "global_step": 103563, "epoch": 1247} {"train_loss": -21.862539291381836, "global_step": 103564, "epoch": 1247} {"train_loss": -21.818721771240234, "global_step": 103565, "epoch": 1247} {"train_loss": -22.378421783447266, "global_step": 103566, "epoch": 1247} {"train_loss": -22.218433380126953, "global_step": 103567, "epoch": 1247} {"train_loss": -22.027694702148438, "global_step": 103568, "epoch": 1247} {"train_loss": -21.990550994873047, "global_step": 103569, "epoch": 1247} {"train_loss": -22.08222007751465, "global_step": 103570, "epoch": 1247} {"train_loss": -21.980085372924805, "global_step": 103571, "epoch": 1247} {"train_loss": -22.161014556884766, "global_step": 103572, "epoch": 1247} {"train_loss": -22.558155059814453, "global_step": 103573, "epoch": 1247} {"train_loss": -22.206567764282227, "global_step": 103574, "epoch": 1247} {"train_loss": -22.127981185913086, "global_step": 103575, "epoch": 1247} {"train_loss": -22.054241180419922, "global_step": 103576, "epoch": 1247} {"train_loss": -21.925731658935547, "global_step": 103577, "epoch": 1247} {"train_loss": -21.828386306762695, "global_step": 103578, "epoch": 1247} {"train_loss": -22.391870498657227, "global_step": 103579, "epoch": 1247} {"train_loss": -21.93711280822754, "global_step": 103580, "epoch": 1247} {"train_loss": -22.100305557250977, "global_step": 103581, "epoch": 1247} {"train_loss": -22.175046920776367, "global_step": 103582, "epoch": 1247} {"train_loss": -22.024967814066326, "global_step": 103583, "epoch": 1247, "val_loss": 6184167.5} {"train_loss": -21.563356399536133, "global_step": 103584, "epoch": 1248} {"train_loss": -22.079164505004883, "global_step": 103585, "epoch": 1248} {"train_loss": -21.462438583374023, "global_step": 103586, "epoch": 1248} {"train_loss": -21.814176559448242, "global_step": 103587, "epoch": 1248} {"train_loss": -21.485876083374023, "global_step": 103588, "epoch": 1248} {"train_loss": -21.43242835998535, "global_step": 103589, "epoch": 1248} {"train_loss": -21.984777450561523, "global_step": 103590, "epoch": 1248} {"train_loss": -21.481382369995117, "global_step": 103591, "epoch": 1248} {"train_loss": -21.669713973999023, "global_step": 103592, "epoch": 1248} {"train_loss": -22.009008407592773, "global_step": 103593, "epoch": 1248} {"train_loss": -21.922842025756836, "global_step": 103594, "epoch": 1248} {"train_loss": -21.774696350097656, "global_step": 103595, "epoch": 1248} {"train_loss": -21.873991012573242, "global_step": 103596, "epoch": 1248} {"train_loss": -21.58720588684082, "global_step": 103597, "epoch": 1248} {"train_loss": -21.70354652404785, "global_step": 103598, "epoch": 1248} {"train_loss": -22.168685913085938, "global_step": 103599, "epoch": 1248} {"train_loss": -21.610198974609375, "global_step": 103600, "epoch": 1248} {"train_loss": -22.034353256225586, "global_step": 103601, "epoch": 1248} {"train_loss": -22.042373657226562, "global_step": 103602, "epoch": 1248} {"train_loss": -21.856321334838867, "global_step": 103603, "epoch": 1248} {"train_loss": -21.9261417388916, "global_step": 103604, "epoch": 1248} {"train_loss": -21.9344539642334, "global_step": 103605, "epoch": 1248} {"train_loss": -21.781068801879883, "global_step": 103606, "epoch": 1248} {"train_loss": -22.031652450561523, "global_step": 103607, "epoch": 1248} {"train_loss": -22.134092330932617, "global_step": 103608, "epoch": 1248} {"train_loss": -22.065204620361328, "global_step": 103609, "epoch": 1248} {"train_loss": -21.83665657043457, "global_step": 103610, "epoch": 1248} {"train_loss": -21.97269058227539, "global_step": 103611, "epoch": 1248} {"train_loss": -22.13029670715332, "global_step": 103612, "epoch": 1248} {"train_loss": -21.922780990600586, "global_step": 103613, "epoch": 1248} {"train_loss": -22.293128967285156, "global_step": 103614, "epoch": 1248} {"train_loss": -22.11441993713379, "global_step": 103615, "epoch": 1248} {"train_loss": -22.099475860595703, "global_step": 103616, "epoch": 1248} {"train_loss": -22.065305709838867, "global_step": 103617, "epoch": 1248} {"train_loss": -21.78762435913086, "global_step": 103618, "epoch": 1248} {"train_loss": -21.984546661376953, "global_step": 103619, "epoch": 1248} {"train_loss": -22.337324142456055, "global_step": 103620, "epoch": 1248} {"train_loss": -22.0516357421875, "global_step": 103621, "epoch": 1248} {"train_loss": -22.00505256652832, "global_step": 103622, "epoch": 1248} {"train_loss": -22.081594467163086, "global_step": 103623, "epoch": 1248} {"train_loss": -22.07682228088379, "global_step": 103624, "epoch": 1248} {"train_loss": -21.9968318939209, "global_step": 103625, "epoch": 1248} {"train_loss": -21.86644172668457, "global_step": 103626, "epoch": 1248} {"train_loss": -22.039350509643555, "global_step": 103627, "epoch": 1248} {"train_loss": -21.96544075012207, "global_step": 103628, "epoch": 1248} {"train_loss": -22.091876983642578, "global_step": 103629, "epoch": 1248} {"train_loss": -22.02347755432129, "global_step": 103630, "epoch": 1248} {"train_loss": -21.982730865478516, "global_step": 103631, "epoch": 1248} {"train_loss": -22.179067611694336, "global_step": 103632, "epoch": 1248} {"train_loss": -22.036651611328125, "global_step": 103633, "epoch": 1248} {"train_loss": -22.03809356689453, "global_step": 103634, "epoch": 1248} {"train_loss": -21.916940689086914, "global_step": 103635, "epoch": 1248} {"train_loss": -21.927108764648438, "global_step": 103636, "epoch": 1248} {"train_loss": -22.169174194335938, "global_step": 103637, "epoch": 1248} {"train_loss": -22.269323348999023, "global_step": 103638, "epoch": 1248} {"train_loss": -22.060522079467773, "global_step": 103639, "epoch": 1248} {"train_loss": -22.279653549194336, "global_step": 103640, "epoch": 1248} {"train_loss": -22.156347274780273, "global_step": 103641, "epoch": 1248} {"train_loss": -22.058202743530273, "global_step": 103642, "epoch": 1248} {"train_loss": -22.51312255859375, "global_step": 103643, "epoch": 1248} {"train_loss": -21.969778060913086, "global_step": 103644, "epoch": 1248} {"train_loss": -22.4194278717041, "global_step": 103645, "epoch": 1248} {"train_loss": -22.304956436157227, "global_step": 103646, "epoch": 1248} {"train_loss": -22.090740203857422, "global_step": 103647, "epoch": 1248} {"train_loss": -22.044973373413086, "global_step": 103648, "epoch": 1248} {"train_loss": -22.443531036376953, "global_step": 103649, "epoch": 1248} {"train_loss": -22.14420509338379, "global_step": 103650, "epoch": 1248} {"train_loss": -22.012205123901367, "global_step": 103651, "epoch": 1248} {"train_loss": -22.22908592224121, "global_step": 103652, "epoch": 1248} {"train_loss": -21.834590911865234, "global_step": 103653, "epoch": 1248} {"train_loss": -22.238805770874023, "global_step": 103654, "epoch": 1248} {"train_loss": -22.081787109375, "global_step": 103655, "epoch": 1248} {"train_loss": -22.19209098815918, "global_step": 103656, "epoch": 1248} {"train_loss": -21.951889038085938, "global_step": 103657, "epoch": 1248} {"train_loss": -22.078229904174805, "global_step": 103658, "epoch": 1248} {"train_loss": -22.197128295898438, "global_step": 103659, "epoch": 1248} {"train_loss": -21.71453857421875, "global_step": 103660, "epoch": 1248} {"train_loss": -22.087491989135742, "global_step": 103661, "epoch": 1248} {"train_loss": -22.408418655395508, "global_step": 103662, "epoch": 1248} {"train_loss": -21.99026870727539, "global_step": 103663, "epoch": 1248} {"train_loss": -21.73915672302246, "global_step": 103664, "epoch": 1248} {"train_loss": -22.152936935424805, "global_step": 103665, "epoch": 1248} {"train_loss": -22.012685936617565, "global_step": 103666, "epoch": 1248, "val_loss": 6086655.0} {"train_loss": -21.922773361206055, "global_step": 103667, "epoch": 1249} {"train_loss": -21.64287757873535, "global_step": 103668, "epoch": 1249} {"train_loss": -21.529422760009766, "global_step": 103669, "epoch": 1249} {"train_loss": -21.725505828857422, "global_step": 103670, "epoch": 1249} {"train_loss": -21.777772903442383, "global_step": 103671, "epoch": 1249} {"train_loss": -21.663543701171875, "global_step": 103672, "epoch": 1249} {"train_loss": -21.864459991455078, "global_step": 103673, "epoch": 1249} {"train_loss": -21.927419662475586, "global_step": 103674, "epoch": 1249} {"train_loss": -21.800031661987305, "global_step": 103675, "epoch": 1249} {"train_loss": -21.940343856811523, "global_step": 103676, "epoch": 1249} {"train_loss": -21.80224609375, "global_step": 103677, "epoch": 1249} {"train_loss": -21.999422073364258, "global_step": 103678, "epoch": 1249} {"train_loss": -21.976036071777344, "global_step": 103679, "epoch": 1249} {"train_loss": -21.915273666381836, "global_step": 103680, "epoch": 1249} {"train_loss": -21.74029541015625, "global_step": 103681, "epoch": 1249} {"train_loss": -21.838546752929688, "global_step": 103682, "epoch": 1249} {"train_loss": -22.35752296447754, "global_step": 103683, "epoch": 1249} {"train_loss": -21.697607040405273, "global_step": 103684, "epoch": 1249} {"train_loss": -22.11655616760254, "global_step": 103685, "epoch": 1249} {"train_loss": -21.965272903442383, "global_step": 103686, "epoch": 1249} {"train_loss": -21.73554801940918, "global_step": 103687, "epoch": 1249} {"train_loss": -22.06443214416504, "global_step": 103688, "epoch": 1249} {"train_loss": -22.086111068725586, "global_step": 103689, "epoch": 1249} {"train_loss": -21.974958419799805, "global_step": 103690, "epoch": 1249} {"train_loss": -22.213783264160156, "global_step": 103691, "epoch": 1249} {"train_loss": -21.870128631591797, "global_step": 103692, "epoch": 1249} {"train_loss": -22.218265533447266, "global_step": 103693, "epoch": 1249} {"train_loss": -22.018749237060547, "global_step": 103694, "epoch": 1249} {"train_loss": -22.5313777923584, "global_step": 103695, "epoch": 1249} {"train_loss": -22.118581771850586, "global_step": 103696, "epoch": 1249} {"train_loss": -21.903167724609375, "global_step": 103697, "epoch": 1249} {"train_loss": -22.237804412841797, "global_step": 103698, "epoch": 1249} {"train_loss": -22.006103515625, "global_step": 103699, "epoch": 1249} {"train_loss": -22.131641387939453, "global_step": 103700, "epoch": 1249} {"train_loss": -22.0918025970459, "global_step": 103701, "epoch": 1249} {"train_loss": -22.10297966003418, "global_step": 103702, "epoch": 1249} {"train_loss": -22.307119369506836, "global_step": 103703, "epoch": 1249} {"train_loss": -22.205997467041016, "global_step": 103704, "epoch": 1249} {"train_loss": -22.24542808532715, "global_step": 103705, "epoch": 1249} {"train_loss": -22.061246871948242, "global_step": 103706, "epoch": 1249} {"train_loss": -21.70539665222168, "global_step": 103707, "epoch": 1249} {"train_loss": -22.32927894592285, "global_step": 103708, "epoch": 1249} {"train_loss": -21.763486862182617, "global_step": 103709, "epoch": 1249} {"train_loss": -22.266925811767578, "global_step": 103710, "epoch": 1249} {"train_loss": -21.820661544799805, "global_step": 103711, "epoch": 1249} {"train_loss": -21.975988388061523, "global_step": 103712, "epoch": 1249} {"train_loss": -22.14945411682129, "global_step": 103713, "epoch": 1249} {"train_loss": -22.29490089416504, "global_step": 103714, "epoch": 1249} {"train_loss": -22.31422996520996, "global_step": 103715, "epoch": 1249} {"train_loss": -22.3212947845459, "global_step": 103716, "epoch": 1249} {"train_loss": -22.506519317626953, "global_step": 103717, "epoch": 1249} {"train_loss": -21.760648727416992, "global_step": 103718, "epoch": 1249} {"train_loss": -21.676912307739258, "global_step": 103719, "epoch": 1249} {"train_loss": -22.35284996032715, "global_step": 103720, "epoch": 1249} {"train_loss": -21.869977951049805, "global_step": 103721, "epoch": 1249} {"train_loss": -22.49214744567871, "global_step": 103722, "epoch": 1249} {"train_loss": -22.056079864501953, "global_step": 103723, "epoch": 1249} {"train_loss": -21.633481979370117, "global_step": 103724, "epoch": 1249} {"train_loss": -21.692768096923828, "global_step": 103725, "epoch": 1249} {"train_loss": -21.828012466430664, "global_step": 103726, "epoch": 1249} {"train_loss": -22.128780364990234, "global_step": 103727, "epoch": 1249} {"train_loss": -22.51920509338379, "global_step": 103728, "epoch": 1249} {"train_loss": -21.899953842163086, "global_step": 103729, "epoch": 1249} {"train_loss": -22.25680160522461, "global_step": 103730, "epoch": 1249} {"train_loss": -22.273099899291992, "global_step": 103731, "epoch": 1249} {"train_loss": -22.068700790405273, "global_step": 103732, "epoch": 1249} {"train_loss": -21.970762252807617, "global_step": 103733, "epoch": 1249} {"train_loss": -21.937456130981445, "global_step": 103734, "epoch": 1249} {"train_loss": -21.992212295532227, "global_step": 103735, "epoch": 1249} {"train_loss": -21.87647247314453, "global_step": 103736, "epoch": 1249} {"train_loss": -22.183807373046875, "global_step": 103737, "epoch": 1249} {"train_loss": -22.065486907958984, "global_step": 103738, "epoch": 1249} {"train_loss": -21.784013748168945, "global_step": 103739, "epoch": 1249} {"train_loss": -22.00740623474121, "global_step": 103740, "epoch": 1249} {"train_loss": -22.202890396118164, "global_step": 103741, "epoch": 1249} {"train_loss": -22.062484741210938, "global_step": 103742, "epoch": 1249} {"train_loss": -22.393207550048828, "global_step": 103743, "epoch": 1249} {"train_loss": -21.83822250366211, "global_step": 103744, "epoch": 1249} {"train_loss": -22.29569435119629, "global_step": 103745, "epoch": 1249} {"train_loss": -21.731664657592773, "global_step": 103746, "epoch": 1249} {"train_loss": -22.083114624023438, "global_step": 103747, "epoch": 1249} {"train_loss": -21.971176147460938, "global_step": 103748, "epoch": 1249} {"train_loss": -22.03088105443012, "global_step": 103749, "epoch": 1249, "val_loss": 5995771.0} {"train_loss": -21.38346290588379, "global_step": 103750, "epoch": 1250} {"train_loss": -21.023605346679688, "global_step": 103751, "epoch": 1250} {"train_loss": -21.162006378173828, "global_step": 103752, "epoch": 1250} {"train_loss": -21.85450553894043, "global_step": 103753, "epoch": 1250} {"train_loss": -21.211421966552734, "global_step": 103754, "epoch": 1250} {"train_loss": -21.04359245300293, "global_step": 103755, "epoch": 1250} {"train_loss": -21.800573348999023, "global_step": 103756, "epoch": 1250} {"train_loss": -21.38956069946289, "global_step": 103757, "epoch": 1250} {"train_loss": -21.7797794342041, "global_step": 103758, "epoch": 1250} {"train_loss": -21.617813110351562, "global_step": 103759, "epoch": 1250} {"train_loss": -21.786386489868164, "global_step": 103760, "epoch": 1250} {"train_loss": -22.11197280883789, "global_step": 103761, "epoch": 1250} {"train_loss": -21.426191329956055, "global_step": 103762, "epoch": 1250} {"train_loss": -21.91619873046875, "global_step": 103763, "epoch": 1250} {"train_loss": -21.746971130371094, "global_step": 103764, "epoch": 1250} {"train_loss": -21.6473331451416, "global_step": 103765, "epoch": 1250} {"train_loss": -22.081941604614258, "global_step": 103766, "epoch": 1250} {"train_loss": -21.72757339477539, "global_step": 103767, "epoch": 1250} {"train_loss": -21.858108520507812, "global_step": 103768, "epoch": 1250} {"train_loss": -21.518688201904297, "global_step": 103769, "epoch": 1250} {"train_loss": -21.95234489440918, "global_step": 103770, "epoch": 1250} {"train_loss": -22.16644859313965, "global_step": 103771, "epoch": 1250} {"train_loss": -21.84134864807129, "global_step": 103772, "epoch": 1250} {"train_loss": -21.8112735748291, "global_step": 103773, "epoch": 1250} {"train_loss": -21.899822235107422, "global_step": 103774, "epoch": 1250} {"train_loss": -21.853368759155273, "global_step": 103775, "epoch": 1250} {"train_loss": -21.914329528808594, "global_step": 103776, "epoch": 1250} {"train_loss": -21.7094783782959, "global_step": 103777, "epoch": 1250} {"train_loss": -22.268320083618164, "global_step": 103778, "epoch": 1250} {"train_loss": -22.388639450073242, "global_step": 103779, "epoch": 1250} {"train_loss": -21.953039169311523, "global_step": 103780, "epoch": 1250} {"train_loss": -22.03912925720215, "global_step": 103781, "epoch": 1250} {"train_loss": -21.961864471435547, "global_step": 103782, "epoch": 1250} {"train_loss": -21.829933166503906, "global_step": 103783, "epoch": 1250} {"train_loss": -21.966880798339844, "global_step": 103784, "epoch": 1250} {"train_loss": -21.89801025390625, "global_step": 103785, "epoch": 1250} {"train_loss": -22.450653076171875, "global_step": 103786, "epoch": 1250} {"train_loss": -22.099639892578125, "global_step": 103787, "epoch": 1250} {"train_loss": -22.249099731445312, "global_step": 103788, "epoch": 1250} {"train_loss": -22.170604705810547, "global_step": 103789, "epoch": 1250} {"train_loss": -22.219478607177734, "global_step": 103790, "epoch": 1250} {"train_loss": -21.65834617614746, "global_step": 103791, "epoch": 1250} {"train_loss": -22.04296112060547, "global_step": 103792, "epoch": 1250} {"train_loss": -22.120567321777344, "global_step": 103793, "epoch": 1250} {"train_loss": -21.78919792175293, "global_step": 103794, "epoch": 1250} {"train_loss": -21.783119201660156, "global_step": 103795, "epoch": 1250} {"train_loss": -22.388486862182617, "global_step": 103796, "epoch": 1250} {"train_loss": -21.85208511352539, "global_step": 103797, "epoch": 1250} {"train_loss": -22.126482009887695, "global_step": 103798, "epoch": 1250} {"train_loss": -21.56402587890625, "global_step": 103799, "epoch": 1250} {"train_loss": -22.009979248046875, "global_step": 103800, "epoch": 1250} {"train_loss": -22.05415153503418, "global_step": 103801, "epoch": 1250} {"train_loss": -21.796945571899414, "global_step": 103802, "epoch": 1250} {"train_loss": -22.128543853759766, "global_step": 103803, "epoch": 1250} {"train_loss": -22.063343048095703, "global_step": 103804, "epoch": 1250} {"train_loss": -22.10251235961914, "global_step": 103805, "epoch": 1250} {"train_loss": -22.116451263427734, "global_step": 103806, "epoch": 1250} {"train_loss": -22.30476188659668, "global_step": 103807, "epoch": 1250} {"train_loss": -22.061071395874023, "global_step": 103808, "epoch": 1250} {"train_loss": -22.245412826538086, "global_step": 103809, "epoch": 1250} {"train_loss": -22.16259002685547, "global_step": 103810, "epoch": 1250} {"train_loss": -22.0483341217041, "global_step": 103811, "epoch": 1250} {"train_loss": -22.001066207885742, "global_step": 103812, "epoch": 1250} {"train_loss": -21.856796264648438, "global_step": 103813, "epoch": 1250} {"train_loss": -22.215953826904297, "global_step": 103814, "epoch": 1250} {"train_loss": -22.147321701049805, "global_step": 103815, "epoch": 1250} {"train_loss": -22.511756896972656, "global_step": 103816, "epoch": 1250} {"train_loss": -21.87044906616211, "global_step": 103817, "epoch": 1250} {"train_loss": -21.89566421508789, "global_step": 103818, "epoch": 1250} {"train_loss": -21.725444793701172, "global_step": 103819, "epoch": 1250} {"train_loss": -21.93181800842285, "global_step": 103820, "epoch": 1250} {"train_loss": -21.97637939453125, "global_step": 103821, "epoch": 1250} {"train_loss": -22.282941818237305, "global_step": 103822, "epoch": 1250} {"train_loss": -22.132190704345703, "global_step": 103823, "epoch": 1250} {"train_loss": -21.85854721069336, "global_step": 103824, "epoch": 1250} {"train_loss": -21.93645477294922, "global_step": 103825, "epoch": 1250} {"train_loss": -22.142911911010742, "global_step": 103826, "epoch": 1250} {"train_loss": -21.852949142456055, "global_step": 103827, "epoch": 1250} {"train_loss": -21.850812911987305, "global_step": 103828, "epoch": 1250} {"train_loss": -21.976062774658203, "global_step": 103829, "epoch": 1250} {"train_loss": -21.96715545654297, "global_step": 103830, "epoch": 1250} {"train_loss": -22.113956451416016, "global_step": 103831, "epoch": 1250} {"train_loss": -21.91536188700113, "global_step": 103832, "epoch": 1250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6103503.5} {"train_loss": -22.346227645874023, "global_step": 103833, "epoch": 1251} {"train_loss": -21.796863555908203, "global_step": 103834, "epoch": 1251} {"train_loss": -22.0153865814209, "global_step": 103835, "epoch": 1251} {"train_loss": -21.328128814697266, "global_step": 103836, "epoch": 1251} {"train_loss": -21.771486282348633, "global_step": 103837, "epoch": 1251} {"train_loss": -21.89471435546875, "global_step": 103838, "epoch": 1251} {"train_loss": -22.198476791381836, "global_step": 103839, "epoch": 1251} {"train_loss": -22.00753402709961, "global_step": 103840, "epoch": 1251} {"train_loss": -21.89958381652832, "global_step": 103841, "epoch": 1251} {"train_loss": -21.456497192382812, "global_step": 103842, "epoch": 1251} {"train_loss": -21.785018920898438, "global_step": 103843, "epoch": 1251} {"train_loss": -21.79737663269043, "global_step": 103844, "epoch": 1251} {"train_loss": -22.150787353515625, "global_step": 103845, "epoch": 1251} {"train_loss": -22.11153221130371, "global_step": 103846, "epoch": 1251} {"train_loss": -21.863567352294922, "global_step": 103847, "epoch": 1251} {"train_loss": -21.5743350982666, "global_step": 103848, "epoch": 1251} {"train_loss": -22.020023345947266, "global_step": 103849, "epoch": 1251} {"train_loss": -21.78553581237793, "global_step": 103850, "epoch": 1251} {"train_loss": -22.24166488647461, "global_step": 103851, "epoch": 1251} {"train_loss": -22.174692153930664, "global_step": 103852, "epoch": 1251} {"train_loss": -21.814762115478516, "global_step": 103853, "epoch": 1251} {"train_loss": -22.096601486206055, "global_step": 103854, "epoch": 1251} {"train_loss": -21.997922897338867, "global_step": 103855, "epoch": 1251} {"train_loss": -22.054859161376953, "global_step": 103856, "epoch": 1251} {"train_loss": -22.119672775268555, "global_step": 103857, "epoch": 1251} {"train_loss": -22.0738582611084, "global_step": 103858, "epoch": 1251} {"train_loss": -22.29652214050293, "global_step": 103859, "epoch": 1251} {"train_loss": -21.8978271484375, "global_step": 103860, "epoch": 1251} {"train_loss": -22.052274703979492, "global_step": 103861, "epoch": 1251} {"train_loss": -22.2252254486084, "global_step": 103862, "epoch": 1251} {"train_loss": -22.008893966674805, "global_step": 103863, "epoch": 1251} {"train_loss": -22.32782554626465, "global_step": 103864, "epoch": 1251} {"train_loss": -22.4089412689209, "global_step": 103865, "epoch": 1251} {"train_loss": -22.503576278686523, "global_step": 103866, "epoch": 1251} {"train_loss": -21.912504196166992, "global_step": 103867, "epoch": 1251} {"train_loss": -22.10572624206543, "global_step": 103868, "epoch": 1251} {"train_loss": -22.155324935913086, "global_step": 103869, "epoch": 1251} {"train_loss": -22.04798698425293, "global_step": 103870, "epoch": 1251} {"train_loss": -21.827428817749023, "global_step": 103871, "epoch": 1251} {"train_loss": -21.95212173461914, "global_step": 103872, "epoch": 1251} {"train_loss": -21.91462516784668, "global_step": 103873, "epoch": 1251} {"train_loss": -21.594648361206055, "global_step": 103874, "epoch": 1251} {"train_loss": -22.003923416137695, "global_step": 103875, "epoch": 1251} {"train_loss": -22.23720932006836, "global_step": 103876, "epoch": 1251} {"train_loss": -22.621484756469727, "global_step": 103877, "epoch": 1251} {"train_loss": -22.246658325195312, "global_step": 103878, "epoch": 1251} {"train_loss": -22.207027435302734, "global_step": 103879, "epoch": 1251} {"train_loss": -22.210041046142578, "global_step": 103880, "epoch": 1251} {"train_loss": -21.882282257080078, "global_step": 103881, "epoch": 1251} {"train_loss": -21.930694580078125, "global_step": 103882, "epoch": 1251} {"train_loss": -21.72376823425293, "global_step": 103883, "epoch": 1251} {"train_loss": -22.015491485595703, "global_step": 103884, "epoch": 1251} {"train_loss": -21.812414169311523, "global_step": 103885, "epoch": 1251} {"train_loss": -22.205989837646484, "global_step": 103886, "epoch": 1251} {"train_loss": -22.25054931640625, "global_step": 103887, "epoch": 1251} {"train_loss": -22.3132381439209, "global_step": 103888, "epoch": 1251} {"train_loss": -22.127521514892578, "global_step": 103889, "epoch": 1251} {"train_loss": -21.904584884643555, "global_step": 103890, "epoch": 1251} {"train_loss": -21.90644645690918, "global_step": 103891, "epoch": 1251} {"train_loss": -22.186304092407227, "global_step": 103892, "epoch": 1251} {"train_loss": -22.048723220825195, "global_step": 103893, "epoch": 1251} {"train_loss": -21.828262329101562, "global_step": 103894, "epoch": 1251} {"train_loss": -21.9404354095459, "global_step": 103895, "epoch": 1251} {"train_loss": -22.21046257019043, "global_step": 103896, "epoch": 1251} {"train_loss": -22.011625289916992, "global_step": 103897, "epoch": 1251} {"train_loss": -22.33416175842285, "global_step": 103898, "epoch": 1251} {"train_loss": -22.254011154174805, "global_step": 103899, "epoch": 1251} {"train_loss": -21.915836334228516, "global_step": 103900, "epoch": 1251} {"train_loss": -21.8454532623291, "global_step": 103901, "epoch": 1251} {"train_loss": -22.697072982788086, "global_step": 103902, "epoch": 1251} {"train_loss": -22.59100914001465, "global_step": 103903, "epoch": 1251} {"train_loss": -21.762683868408203, "global_step": 103904, "epoch": 1251} {"train_loss": -22.063901901245117, "global_step": 103905, "epoch": 1251} {"train_loss": -21.814847946166992, "global_step": 103906, "epoch": 1251} {"train_loss": -22.112035751342773, "global_step": 103907, "epoch": 1251} {"train_loss": -21.944364547729492, "global_step": 103908, "epoch": 1251} {"train_loss": -22.010141372680664, "global_step": 103909, "epoch": 1251} {"train_loss": -22.178842544555664, "global_step": 103910, "epoch": 1251} {"train_loss": -22.40114402770996, "global_step": 103911, "epoch": 1251} {"train_loss": -22.37839698791504, "global_step": 103912, "epoch": 1251} {"train_loss": -22.158300399780273, "global_step": 103913, "epoch": 1251} {"train_loss": -22.141921997070312, "global_step": 103914, "epoch": 1251} {"train_loss": -22.040407548467797, "global_step": 103915, "epoch": 1251, "val_loss": 6241220.5} {"train_loss": -21.53908348083496, "global_step": 103916, "epoch": 1252} {"train_loss": -21.572830200195312, "global_step": 103917, "epoch": 1252} {"train_loss": -21.050437927246094, "global_step": 103918, "epoch": 1252} {"train_loss": -21.77964210510254, "global_step": 103919, "epoch": 1252} {"train_loss": -21.821142196655273, "global_step": 103920, "epoch": 1252} {"train_loss": -21.198200225830078, "global_step": 103921, "epoch": 1252} {"train_loss": -21.988656997680664, "global_step": 103922, "epoch": 1252} {"train_loss": -21.533302307128906, "global_step": 103923, "epoch": 1252} {"train_loss": -21.6104793548584, "global_step": 103924, "epoch": 1252} {"train_loss": -21.68290138244629, "global_step": 103925, "epoch": 1252} {"train_loss": -21.526874542236328, "global_step": 103926, "epoch": 1252} {"train_loss": -21.48145866394043, "global_step": 103927, "epoch": 1252} {"train_loss": -21.77296257019043, "global_step": 103928, "epoch": 1252} {"train_loss": -21.556249618530273, "global_step": 103929, "epoch": 1252} {"train_loss": -22.023794174194336, "global_step": 103930, "epoch": 1252} {"train_loss": -21.886734008789062, "global_step": 103931, "epoch": 1252} {"train_loss": -21.88300895690918, "global_step": 103932, "epoch": 1252} {"train_loss": -21.81365394592285, "global_step": 103933, "epoch": 1252} {"train_loss": -21.839468002319336, "global_step": 103934, "epoch": 1252} {"train_loss": -21.84705924987793, "global_step": 103935, "epoch": 1252} {"train_loss": -21.54703140258789, "global_step": 103936, "epoch": 1252} {"train_loss": -22.122182846069336, "global_step": 103937, "epoch": 1252} {"train_loss": -21.578996658325195, "global_step": 103938, "epoch": 1252} {"train_loss": -21.827905654907227, "global_step": 103939, "epoch": 1252} {"train_loss": -21.838224411010742, "global_step": 103940, "epoch": 1252} {"train_loss": -21.784242630004883, "global_step": 103941, "epoch": 1252} {"train_loss": -22.192380905151367, "global_step": 103942, "epoch": 1252} {"train_loss": -22.202268600463867, "global_step": 103943, "epoch": 1252} {"train_loss": -21.93714141845703, "global_step": 103944, "epoch": 1252} {"train_loss": -22.237836837768555, "global_step": 103945, "epoch": 1252} {"train_loss": -22.303709030151367, "global_step": 103946, "epoch": 1252} {"train_loss": -21.80939292907715, "global_step": 103947, "epoch": 1252} {"train_loss": -21.995052337646484, "global_step": 103948, "epoch": 1252} {"train_loss": -22.247066497802734, "global_step": 103949, "epoch": 1252} {"train_loss": -22.066242218017578, "global_step": 103950, "epoch": 1252} {"train_loss": -22.367826461791992, "global_step": 103951, "epoch": 1252} {"train_loss": -21.855224609375, "global_step": 103952, "epoch": 1252} {"train_loss": -22.01466178894043, "global_step": 103953, "epoch": 1252} {"train_loss": -22.33475685119629, "global_step": 103954, "epoch": 1252} {"train_loss": -22.03500747680664, "global_step": 103955, "epoch": 1252} {"train_loss": -21.915842056274414, "global_step": 103956, "epoch": 1252} {"train_loss": -22.02743911743164, "global_step": 103957, "epoch": 1252} {"train_loss": -21.97705078125, "global_step": 103958, "epoch": 1252} {"train_loss": -21.636306762695312, "global_step": 103959, "epoch": 1252} {"train_loss": -22.087743759155273, "global_step": 103960, "epoch": 1252} {"train_loss": -22.080615997314453, "global_step": 103961, "epoch": 1252} {"train_loss": -21.97173500061035, "global_step": 103962, "epoch": 1252} {"train_loss": -22.00346565246582, "global_step": 103963, "epoch": 1252} {"train_loss": -22.243268966674805, "global_step": 103964, "epoch": 1252} {"train_loss": -22.241891860961914, "global_step": 103965, "epoch": 1252} {"train_loss": -21.95956039428711, "global_step": 103966, "epoch": 1252} {"train_loss": -21.795007705688477, "global_step": 103967, "epoch": 1252} {"train_loss": -22.132776260375977, "global_step": 103968, "epoch": 1252} {"train_loss": -22.141328811645508, "global_step": 103969, "epoch": 1252} {"train_loss": -21.57330322265625, "global_step": 103970, "epoch": 1252} {"train_loss": -22.210041046142578, "global_step": 103971, "epoch": 1252} {"train_loss": -21.952056884765625, "global_step": 103972, "epoch": 1252} {"train_loss": -22.026132583618164, "global_step": 103973, "epoch": 1252} {"train_loss": -22.329763412475586, "global_step": 103974, "epoch": 1252} {"train_loss": -22.0585994720459, "global_step": 103975, "epoch": 1252} {"train_loss": -22.00150489807129, "global_step": 103976, "epoch": 1252} {"train_loss": -22.307050704956055, "global_step": 103977, "epoch": 1252} {"train_loss": -21.831541061401367, "global_step": 103978, "epoch": 1252} {"train_loss": -22.164875030517578, "global_step": 103979, "epoch": 1252} {"train_loss": -21.971317291259766, "global_step": 103980, "epoch": 1252} {"train_loss": -22.11957359313965, "global_step": 103981, "epoch": 1252} {"train_loss": -22.195009231567383, "global_step": 103982, "epoch": 1252} {"train_loss": -22.25496482849121, "global_step": 103983, "epoch": 1252} {"train_loss": -22.410551071166992, "global_step": 103984, "epoch": 1252} {"train_loss": -21.881103515625, "global_step": 103985, "epoch": 1252} {"train_loss": -21.69354820251465, "global_step": 103986, "epoch": 1252} {"train_loss": -21.95718765258789, "global_step": 103987, "epoch": 1252} {"train_loss": -22.19491958618164, "global_step": 103988, "epoch": 1252} {"train_loss": -22.087726593017578, "global_step": 103989, "epoch": 1252} {"train_loss": -21.96366310119629, "global_step": 103990, "epoch": 1252} {"train_loss": -22.051706314086914, "global_step": 103991, "epoch": 1252} {"train_loss": -22.098501205444336, "global_step": 103992, "epoch": 1252} {"train_loss": -21.81922721862793, "global_step": 103993, "epoch": 1252} {"train_loss": -22.157926559448242, "global_step": 103994, "epoch": 1252} {"train_loss": -22.207294464111328, "global_step": 103995, "epoch": 1252} {"train_loss": -21.986270904541016, "global_step": 103996, "epoch": 1252} {"train_loss": -22.284072875976562, "global_step": 103997, "epoch": 1252} {"train_loss": -21.944994409400298, "global_step": 103998, "epoch": 1252, "val_loss": 6325607.0} {"train_loss": -21.934017181396484, "global_step": 103999, "epoch": 1253} {"train_loss": -21.76750373840332, "global_step": 104000, "epoch": 1253} {"train_loss": -21.818740844726562, "global_step": 104001, "epoch": 1253} {"train_loss": -21.56621742248535, "global_step": 104002, "epoch": 1253} {"train_loss": -21.679893493652344, "global_step": 104003, "epoch": 1253} {"train_loss": -21.512081146240234, "global_step": 104004, "epoch": 1253} {"train_loss": -21.94905662536621, "global_step": 104005, "epoch": 1253} {"train_loss": -21.73802947998047, "global_step": 104006, "epoch": 1253} {"train_loss": -21.686941146850586, "global_step": 104007, "epoch": 1253} {"train_loss": -22.23287010192871, "global_step": 104008, "epoch": 1253} {"train_loss": -21.778640747070312, "global_step": 104009, "epoch": 1253} {"train_loss": -21.93888282775879, "global_step": 104010, "epoch": 1253} {"train_loss": -21.90771484375, "global_step": 104011, "epoch": 1253} {"train_loss": -21.71763801574707, "global_step": 104012, "epoch": 1253} {"train_loss": -22.198755264282227, "global_step": 104013, "epoch": 1253} {"train_loss": -21.905363082885742, "global_step": 104014, "epoch": 1253} {"train_loss": -21.576377868652344, "global_step": 104015, "epoch": 1253} {"train_loss": -21.926218032836914, "global_step": 104016, "epoch": 1253} {"train_loss": -21.933313369750977, "global_step": 104017, "epoch": 1253} {"train_loss": -22.214536666870117, "global_step": 104018, "epoch": 1253} {"train_loss": -21.94514274597168, "global_step": 104019, "epoch": 1253} {"train_loss": -22.110883712768555, "global_step": 104020, "epoch": 1253} {"train_loss": -21.992305755615234, "global_step": 104021, "epoch": 1253} {"train_loss": -21.985788345336914, "global_step": 104022, "epoch": 1253} {"train_loss": -21.80556297302246, "global_step": 104023, "epoch": 1253} {"train_loss": -22.06952476501465, "global_step": 104024, "epoch": 1253} {"train_loss": -22.281675338745117, "global_step": 104025, "epoch": 1253} {"train_loss": -22.020549774169922, "global_step": 104026, "epoch": 1253} {"train_loss": -22.136215209960938, "global_step": 104027, "epoch": 1253} {"train_loss": -22.517608642578125, "global_step": 104028, "epoch": 1253} {"train_loss": -22.37674903869629, "global_step": 104029, "epoch": 1253} {"train_loss": -21.95197868347168, "global_step": 104030, "epoch": 1253} {"train_loss": -22.295133590698242, "global_step": 104031, "epoch": 1253} {"train_loss": -21.938440322875977, "global_step": 104032, "epoch": 1253} {"train_loss": -22.0255069732666, "global_step": 104033, "epoch": 1253} {"train_loss": -22.174123764038086, "global_step": 104034, "epoch": 1253} {"train_loss": -21.90692901611328, "global_step": 104035, "epoch": 1253} {"train_loss": -22.03074836730957, "global_step": 104036, "epoch": 1253} {"train_loss": -22.20132827758789, "global_step": 104037, "epoch": 1253} {"train_loss": -21.933475494384766, "global_step": 104038, "epoch": 1253} {"train_loss": -21.887487411499023, "global_step": 104039, "epoch": 1253} {"train_loss": -22.111539840698242, "global_step": 104040, "epoch": 1253} {"train_loss": -22.00994110107422, "global_step": 104041, "epoch": 1253} {"train_loss": -22.410964965820312, "global_step": 104042, "epoch": 1253} {"train_loss": -22.30550193786621, "global_step": 104043, "epoch": 1253} {"train_loss": -22.229238510131836, "global_step": 104044, "epoch": 1253} {"train_loss": -22.721097946166992, "global_step": 104045, "epoch": 1253} {"train_loss": -22.15996742248535, "global_step": 104046, "epoch": 1253} {"train_loss": -21.943159103393555, "global_step": 104047, "epoch": 1253} {"train_loss": -22.05086326599121, "global_step": 104048, "epoch": 1253} {"train_loss": -21.947650909423828, "global_step": 104049, "epoch": 1253} {"train_loss": -21.916406631469727, "global_step": 104050, "epoch": 1253} {"train_loss": -22.2125186920166, "global_step": 104051, "epoch": 1253} {"train_loss": -21.863672256469727, "global_step": 104052, "epoch": 1253} {"train_loss": -22.250883102416992, "global_step": 104053, "epoch": 1253} {"train_loss": -21.86356544494629, "global_step": 104054, "epoch": 1253} {"train_loss": -22.09357452392578, "global_step": 104055, "epoch": 1253} {"train_loss": -22.185659408569336, "global_step": 104056, "epoch": 1253} {"train_loss": -21.916650772094727, "global_step": 104057, "epoch": 1253} {"train_loss": -22.070703506469727, "global_step": 104058, "epoch": 1253} {"train_loss": -22.0687313079834, "global_step": 104059, "epoch": 1253} {"train_loss": -22.483707427978516, "global_step": 104060, "epoch": 1253} {"train_loss": -22.006122589111328, "global_step": 104061, "epoch": 1253} {"train_loss": -22.398019790649414, "global_step": 104062, "epoch": 1253} {"train_loss": -21.976579666137695, "global_step": 104063, "epoch": 1253} {"train_loss": -22.012372970581055, "global_step": 104064, "epoch": 1253} {"train_loss": -21.703123092651367, "global_step": 104065, "epoch": 1253} {"train_loss": -22.312978744506836, "global_step": 104066, "epoch": 1253} {"train_loss": -22.23079490661621, "global_step": 104067, "epoch": 1253} {"train_loss": -22.186445236206055, "global_step": 104068, "epoch": 1253} {"train_loss": -22.302518844604492, "global_step": 104069, "epoch": 1253} {"train_loss": -21.87604331970215, "global_step": 104070, "epoch": 1253} {"train_loss": -22.09571647644043, "global_step": 104071, "epoch": 1253} {"train_loss": -22.136526107788086, "global_step": 104072, "epoch": 1253} {"train_loss": -22.22067642211914, "global_step": 104073, "epoch": 1253} {"train_loss": -21.976444244384766, "global_step": 104074, "epoch": 1253} {"train_loss": -21.85955810546875, "global_step": 104075, "epoch": 1253} {"train_loss": -22.07477378845215, "global_step": 104076, "epoch": 1253} {"train_loss": -22.279218673706055, "global_step": 104077, "epoch": 1253} {"train_loss": -21.922916412353516, "global_step": 104078, "epoch": 1253} {"train_loss": -21.90334129333496, "global_step": 104079, "epoch": 1253} {"train_loss": -21.512815475463867, "global_step": 104080, "epoch": 1253} {"train_loss": -22.044565844248577, "global_step": 104081, "epoch": 1253, "val_loss": 6303432.0} {"train_loss": -19.06476402282715, "global_step": 104082, "epoch": 1254} {"train_loss": -21.137584686279297, "global_step": 104083, "epoch": 1254} {"train_loss": -19.64702796936035, "global_step": 104084, "epoch": 1254} {"train_loss": -20.829397201538086, "global_step": 104085, "epoch": 1254} {"train_loss": -20.161205291748047, "global_step": 104086, "epoch": 1254} {"train_loss": -20.927597045898438, "global_step": 104087, "epoch": 1254} {"train_loss": -20.737316131591797, "global_step": 104088, "epoch": 1254} {"train_loss": -20.952594757080078, "global_step": 104089, "epoch": 1254} {"train_loss": -21.137277603149414, "global_step": 104090, "epoch": 1254} {"train_loss": -21.0395565032959, "global_step": 104091, "epoch": 1254} {"train_loss": -21.081987380981445, "global_step": 104092, "epoch": 1254} {"train_loss": -21.040996551513672, "global_step": 104093, "epoch": 1254} {"train_loss": -21.0650691986084, "global_step": 104094, "epoch": 1254} {"train_loss": -20.992252349853516, "global_step": 104095, "epoch": 1254} {"train_loss": -21.39666748046875, "global_step": 104096, "epoch": 1254} {"train_loss": -21.559446334838867, "global_step": 104097, "epoch": 1254} {"train_loss": -21.282907485961914, "global_step": 104098, "epoch": 1254} {"train_loss": -21.191913604736328, "global_step": 104099, "epoch": 1254} {"train_loss": -21.670358657836914, "global_step": 104100, "epoch": 1254} {"train_loss": -21.42744255065918, "global_step": 104101, "epoch": 1254} {"train_loss": -21.268573760986328, "global_step": 104102, "epoch": 1254} {"train_loss": -21.54188346862793, "global_step": 104103, "epoch": 1254} {"train_loss": -21.64869499206543, "global_step": 104104, "epoch": 1254} {"train_loss": -21.876548767089844, "global_step": 104105, "epoch": 1254} {"train_loss": -21.90447998046875, "global_step": 104106, "epoch": 1254} {"train_loss": -21.486923217773438, "global_step": 104107, "epoch": 1254} {"train_loss": -21.589353561401367, "global_step": 104108, "epoch": 1254} {"train_loss": -21.532428741455078, "global_step": 104109, "epoch": 1254} {"train_loss": -21.940176010131836, "global_step": 104110, "epoch": 1254} {"train_loss": -21.50071907043457, "global_step": 104111, "epoch": 1254} {"train_loss": -21.647380828857422, "global_step": 104112, "epoch": 1254} {"train_loss": -21.3773136138916, "global_step": 104113, "epoch": 1254} {"train_loss": -21.82415771484375, "global_step": 104114, "epoch": 1254} {"train_loss": -21.304319381713867, "global_step": 104115, "epoch": 1254} {"train_loss": -21.78795623779297, "global_step": 104116, "epoch": 1254} {"train_loss": -21.5526180267334, "global_step": 104117, "epoch": 1254} {"train_loss": -21.36919403076172, "global_step": 104118, "epoch": 1254} {"train_loss": -21.85782814025879, "global_step": 104119, "epoch": 1254} {"train_loss": -21.98581314086914, "global_step": 104120, "epoch": 1254} {"train_loss": -21.779895782470703, "global_step": 104121, "epoch": 1254} {"train_loss": -22.3023738861084, "global_step": 104122, "epoch": 1254} {"train_loss": -21.850229263305664, "global_step": 104123, "epoch": 1254} {"train_loss": -21.8920841217041, "global_step": 104124, "epoch": 1254} {"train_loss": -21.895137786865234, "global_step": 104125, "epoch": 1254} {"train_loss": -21.769742965698242, "global_step": 104126, "epoch": 1254} {"train_loss": -22.0755672454834, "global_step": 104127, "epoch": 1254} {"train_loss": -21.800945281982422, "global_step": 104128, "epoch": 1254} {"train_loss": -22.053815841674805, "global_step": 104129, "epoch": 1254} {"train_loss": -21.921396255493164, "global_step": 104130, "epoch": 1254} {"train_loss": -21.705089569091797, "global_step": 104131, "epoch": 1254} {"train_loss": -21.659093856811523, "global_step": 104132, "epoch": 1254} {"train_loss": -21.724262237548828, "global_step": 104133, "epoch": 1254} {"train_loss": -21.795957565307617, "global_step": 104134, "epoch": 1254} {"train_loss": -22.194334030151367, "global_step": 104135, "epoch": 1254} {"train_loss": -22.020771026611328, "global_step": 104136, "epoch": 1254} {"train_loss": -22.01498031616211, "global_step": 104137, "epoch": 1254} {"train_loss": -22.43305778503418, "global_step": 104138, "epoch": 1254} {"train_loss": -22.03059959411621, "global_step": 104139, "epoch": 1254} {"train_loss": -22.109756469726562, "global_step": 104140, "epoch": 1254} {"train_loss": -22.071073532104492, "global_step": 104141, "epoch": 1254} {"train_loss": -22.113935470581055, "global_step": 104142, "epoch": 1254} {"train_loss": -21.521560668945312, "global_step": 104143, "epoch": 1254} {"train_loss": -22.330209732055664, "global_step": 104144, "epoch": 1254} {"train_loss": -22.185138702392578, "global_step": 104145, "epoch": 1254} {"train_loss": -22.10451889038086, "global_step": 104146, "epoch": 1254} {"train_loss": -21.883390426635742, "global_step": 104147, "epoch": 1254} {"train_loss": -22.068340301513672, "global_step": 104148, "epoch": 1254} {"train_loss": -21.899873733520508, "global_step": 104149, "epoch": 1254} {"train_loss": -21.908185958862305, "global_step": 104150, "epoch": 1254} {"train_loss": -22.403305053710938, "global_step": 104151, "epoch": 1254} {"train_loss": -22.120807647705078, "global_step": 104152, "epoch": 1254} {"train_loss": -21.978038787841797, "global_step": 104153, "epoch": 1254} {"train_loss": -22.436931610107422, "global_step": 104154, "epoch": 1254} {"train_loss": -21.961835861206055, "global_step": 104155, "epoch": 1254} {"train_loss": -22.15468978881836, "global_step": 104156, "epoch": 1254} {"train_loss": -22.085983276367188, "global_step": 104157, "epoch": 1254} {"train_loss": -22.101198196411133, "global_step": 104158, "epoch": 1254} {"train_loss": -22.04055404663086, "global_step": 104159, "epoch": 1254} {"train_loss": -21.905447006225586, "global_step": 104160, "epoch": 1254} {"train_loss": -21.963638305664062, "global_step": 104161, "epoch": 1254} {"train_loss": -22.1387939453125, "global_step": 104162, "epoch": 1254} {"train_loss": -22.251962661743164, "global_step": 104163, "epoch": 1254} {"train_loss": -21.67820339892284, "global_step": 104164, "epoch": 1254, "val_loss": 6044595.0} {"train_loss": -21.53959083557129, "global_step": 104165, "epoch": 1255} {"train_loss": -22.06252670288086, "global_step": 104166, "epoch": 1255} {"train_loss": -21.533445358276367, "global_step": 104167, "epoch": 1255} {"train_loss": -21.727664947509766, "global_step": 104168, "epoch": 1255} {"train_loss": -21.18511390686035, "global_step": 104169, "epoch": 1255} {"train_loss": -21.508432388305664, "global_step": 104170, "epoch": 1255} {"train_loss": -21.605854034423828, "global_step": 104171, "epoch": 1255} {"train_loss": -21.94463539123535, "global_step": 104172, "epoch": 1255} {"train_loss": -21.821720123291016, "global_step": 104173, "epoch": 1255} {"train_loss": -21.7447566986084, "global_step": 104174, "epoch": 1255} {"train_loss": -21.750024795532227, "global_step": 104175, "epoch": 1255} {"train_loss": -21.75446891784668, "global_step": 104176, "epoch": 1255} {"train_loss": -21.37354278564453, "global_step": 104177, "epoch": 1255} {"train_loss": -21.519624710083008, "global_step": 104178, "epoch": 1255} {"train_loss": -21.553701400756836, "global_step": 104179, "epoch": 1255} {"train_loss": -21.67690658569336, "global_step": 104180, "epoch": 1255} {"train_loss": -21.777454376220703, "global_step": 104181, "epoch": 1255} {"train_loss": -21.77040672302246, "global_step": 104182, "epoch": 1255} {"train_loss": -21.811424255371094, "global_step": 104183, "epoch": 1255} {"train_loss": -21.800262451171875, "global_step": 104184, "epoch": 1255} {"train_loss": -21.689697265625, "global_step": 104185, "epoch": 1255} {"train_loss": -22.13113021850586, "global_step": 104186, "epoch": 1255} {"train_loss": -21.75522804260254, "global_step": 104187, "epoch": 1255} {"train_loss": -22.267160415649414, "global_step": 104188, "epoch": 1255} {"train_loss": -22.54975700378418, "global_step": 104189, "epoch": 1255} {"train_loss": -21.793315887451172, "global_step": 104190, "epoch": 1255} {"train_loss": -22.08100128173828, "global_step": 104191, "epoch": 1255} {"train_loss": -21.31766128540039, "global_step": 104192, "epoch": 1255} {"train_loss": -22.346141815185547, "global_step": 104193, "epoch": 1255} {"train_loss": -21.98851776123047, "global_step": 104194, "epoch": 1255} {"train_loss": -21.828428268432617, "global_step": 104195, "epoch": 1255} {"train_loss": -22.029333114624023, "global_step": 104196, "epoch": 1255} {"train_loss": -21.839134216308594, "global_step": 104197, "epoch": 1255} {"train_loss": -22.106531143188477, "global_step": 104198, "epoch": 1255} {"train_loss": -21.875646591186523, "global_step": 104199, "epoch": 1255} {"train_loss": -22.217756271362305, "global_step": 104200, "epoch": 1255} {"train_loss": -21.764297485351562, "global_step": 104201, "epoch": 1255} {"train_loss": -22.05784034729004, "global_step": 104202, "epoch": 1255} {"train_loss": -21.650379180908203, "global_step": 104203, "epoch": 1255} {"train_loss": -22.274459838867188, "global_step": 104204, "epoch": 1255} {"train_loss": -22.498611450195312, "global_step": 104205, "epoch": 1255} {"train_loss": -22.279407501220703, "global_step": 104206, "epoch": 1255} {"train_loss": -21.92996597290039, "global_step": 104207, "epoch": 1255} {"train_loss": -22.178544998168945, "global_step": 104208, "epoch": 1255} {"train_loss": -22.410409927368164, "global_step": 104209, "epoch": 1255} {"train_loss": -21.863189697265625, "global_step": 104210, "epoch": 1255} {"train_loss": -22.00722312927246, "global_step": 104211, "epoch": 1255} {"train_loss": -21.986913681030273, "global_step": 104212, "epoch": 1255} {"train_loss": -21.951824188232422, "global_step": 104213, "epoch": 1255} {"train_loss": -21.96459197998047, "global_step": 104214, "epoch": 1255} {"train_loss": -22.411664962768555, "global_step": 104215, "epoch": 1255} {"train_loss": -21.983196258544922, "global_step": 104216, "epoch": 1255} {"train_loss": -21.9725399017334, "global_step": 104217, "epoch": 1255} {"train_loss": -21.701379776000977, "global_step": 104218, "epoch": 1255} {"train_loss": -22.04876708984375, "global_step": 104219, "epoch": 1255} {"train_loss": -21.99922752380371, "global_step": 104220, "epoch": 1255} {"train_loss": -22.21823501586914, "global_step": 104221, "epoch": 1255} {"train_loss": -21.9920597076416, "global_step": 104222, "epoch": 1255} {"train_loss": -22.460205078125, "global_step": 104223, "epoch": 1255} {"train_loss": -22.604551315307617, "global_step": 104224, "epoch": 1255} {"train_loss": -22.2493896484375, "global_step": 104225, "epoch": 1255} {"train_loss": -21.810667037963867, "global_step": 104226, "epoch": 1255} {"train_loss": -21.9682674407959, "global_step": 104227, "epoch": 1255} {"train_loss": -22.260330200195312, "global_step": 104228, "epoch": 1255} {"train_loss": -22.11811065673828, "global_step": 104229, "epoch": 1255} {"train_loss": -22.209203720092773, "global_step": 104230, "epoch": 1255} {"train_loss": -22.355985641479492, "global_step": 104231, "epoch": 1255} {"train_loss": -22.10868263244629, "global_step": 104232, "epoch": 1255} {"train_loss": -21.902956008911133, "global_step": 104233, "epoch": 1255} {"train_loss": -22.622766494750977, "global_step": 104234, "epoch": 1255} {"train_loss": -21.690887451171875, "global_step": 104235, "epoch": 1255} {"train_loss": -22.24277114868164, "global_step": 104236, "epoch": 1255} {"train_loss": -21.39919090270996, "global_step": 104237, "epoch": 1255} {"train_loss": -22.253849029541016, "global_step": 104238, "epoch": 1255} {"train_loss": -21.75679588317871, "global_step": 104239, "epoch": 1255} {"train_loss": -21.858707427978516, "global_step": 104240, "epoch": 1255} {"train_loss": -21.897714614868164, "global_step": 104241, "epoch": 1255} {"train_loss": -22.14154624938965, "global_step": 104242, "epoch": 1255} {"train_loss": -21.867380142211914, "global_step": 104243, "epoch": 1255} {"train_loss": -21.88617706298828, "global_step": 104244, "epoch": 1255} {"train_loss": -21.85888671875, "global_step": 104245, "epoch": 1255} {"train_loss": -21.990461349487305, "global_step": 104246, "epoch": 1255} {"train_loss": -21.953908506646215, "global_step": 104247, "epoch": 1255, "val_loss": 6215451.5} {"train_loss": -21.320341110229492, "global_step": 104248, "epoch": 1256} {"train_loss": -20.83320426940918, "global_step": 104249, "epoch": 1256} {"train_loss": -21.801420211791992, "global_step": 104250, "epoch": 1256} {"train_loss": -20.773908615112305, "global_step": 104251, "epoch": 1256} {"train_loss": -21.27907371520996, "global_step": 104252, "epoch": 1256} {"train_loss": -21.36421012878418, "global_step": 104253, "epoch": 1256} {"train_loss": -21.16526222229004, "global_step": 104254, "epoch": 1256} {"train_loss": -21.702865600585938, "global_step": 104255, "epoch": 1256} {"train_loss": -21.434412002563477, "global_step": 104256, "epoch": 1256} {"train_loss": -21.4813289642334, "global_step": 104257, "epoch": 1256} {"train_loss": -21.425357818603516, "global_step": 104258, "epoch": 1256} {"train_loss": -21.761133193969727, "global_step": 104259, "epoch": 1256} {"train_loss": -21.884714126586914, "global_step": 104260, "epoch": 1256} {"train_loss": -21.65543556213379, "global_step": 104261, "epoch": 1256} {"train_loss": -21.89911460876465, "global_step": 104262, "epoch": 1256} {"train_loss": -21.614139556884766, "global_step": 104263, "epoch": 1256} {"train_loss": -22.073341369628906, "global_step": 104264, "epoch": 1256} {"train_loss": -21.612255096435547, "global_step": 104265, "epoch": 1256} {"train_loss": -21.5345458984375, "global_step": 104266, "epoch": 1256} {"train_loss": -21.677207946777344, "global_step": 104267, "epoch": 1256} {"train_loss": -22.009353637695312, "global_step": 104268, "epoch": 1256} {"train_loss": -21.71626853942871, "global_step": 104269, "epoch": 1256} {"train_loss": -21.608348846435547, "global_step": 104270, "epoch": 1256} {"train_loss": -21.821714401245117, "global_step": 104271, "epoch": 1256} {"train_loss": -21.763547897338867, "global_step": 104272, "epoch": 1256} {"train_loss": -21.864028930664062, "global_step": 104273, "epoch": 1256} {"train_loss": -21.973535537719727, "global_step": 104274, "epoch": 1256} {"train_loss": -21.638883590698242, "global_step": 104275, "epoch": 1256} {"train_loss": -22.057374954223633, "global_step": 104276, "epoch": 1256} {"train_loss": -21.95789909362793, "global_step": 104277, "epoch": 1256} {"train_loss": -21.932828903198242, "global_step": 104278, "epoch": 1256} {"train_loss": -22.005136489868164, "global_step": 104279, "epoch": 1256} {"train_loss": -22.661054611206055, "global_step": 104280, "epoch": 1256} {"train_loss": -22.26266860961914, "global_step": 104281, "epoch": 1256} {"train_loss": -22.482681274414062, "global_step": 104282, "epoch": 1256} {"train_loss": -22.02602767944336, "global_step": 104283, "epoch": 1256} {"train_loss": -22.128177642822266, "global_step": 104284, "epoch": 1256} {"train_loss": -22.46431541442871, "global_step": 104285, "epoch": 1256} {"train_loss": -22.288496017456055, "global_step": 104286, "epoch": 1256} {"train_loss": -21.907642364501953, "global_step": 104287, "epoch": 1256} {"train_loss": -21.896726608276367, "global_step": 104288, "epoch": 1256} {"train_loss": -22.149917602539062, "global_step": 104289, "epoch": 1256} {"train_loss": -22.268726348876953, "global_step": 104290, "epoch": 1256} {"train_loss": -22.718385696411133, "global_step": 104291, "epoch": 1256} {"train_loss": -21.884469985961914, "global_step": 104292, "epoch": 1256} {"train_loss": -22.062692642211914, "global_step": 104293, "epoch": 1256} {"train_loss": -22.131614685058594, "global_step": 104294, "epoch": 1256} {"train_loss": -22.140121459960938, "global_step": 104295, "epoch": 1256} {"train_loss": -21.871252059936523, "global_step": 104296, "epoch": 1256} {"train_loss": -21.854175567626953, "global_step": 104297, "epoch": 1256} {"train_loss": -22.14926528930664, "global_step": 104298, "epoch": 1256} {"train_loss": -21.99907875061035, "global_step": 104299, "epoch": 1256} {"train_loss": -22.340133666992188, "global_step": 104300, "epoch": 1256} {"train_loss": -21.869993209838867, "global_step": 104301, "epoch": 1256} {"train_loss": -22.163206100463867, "global_step": 104302, "epoch": 1256} {"train_loss": -22.15382957458496, "global_step": 104303, "epoch": 1256} {"train_loss": -21.976743698120117, "global_step": 104304, "epoch": 1256} {"train_loss": -22.180139541625977, "global_step": 104305, "epoch": 1256} {"train_loss": -22.339359283447266, "global_step": 104306, "epoch": 1256} {"train_loss": -21.86635971069336, "global_step": 104307, "epoch": 1256} {"train_loss": -21.97119140625, "global_step": 104308, "epoch": 1256} {"train_loss": -21.68767547607422, "global_step": 104309, "epoch": 1256} {"train_loss": -22.20163345336914, "global_step": 104310, "epoch": 1256} {"train_loss": -22.182180404663086, "global_step": 104311, "epoch": 1256} {"train_loss": -22.42605972290039, "global_step": 104312, "epoch": 1256} {"train_loss": -22.10357093811035, "global_step": 104313, "epoch": 1256} {"train_loss": -22.001571655273438, "global_step": 104314, "epoch": 1256} {"train_loss": -21.969173431396484, "global_step": 104315, "epoch": 1256} {"train_loss": -21.6818904876709, "global_step": 104316, "epoch": 1256} {"train_loss": -22.01187515258789, "global_step": 104317, "epoch": 1256} {"train_loss": -21.983762741088867, "global_step": 104318, "epoch": 1256} {"train_loss": -22.189977645874023, "global_step": 104319, "epoch": 1256} {"train_loss": -21.910573959350586, "global_step": 104320, "epoch": 1256} {"train_loss": -22.062702178955078, "global_step": 104321, "epoch": 1256} {"train_loss": -21.762319564819336, "global_step": 104322, "epoch": 1256} {"train_loss": -22.2853946685791, "global_step": 104323, "epoch": 1256} {"train_loss": -22.137086868286133, "global_step": 104324, "epoch": 1256} {"train_loss": -22.15193748474121, "global_step": 104325, "epoch": 1256} {"train_loss": -22.2458438873291, "global_step": 104326, "epoch": 1256} {"train_loss": -22.418201446533203, "global_step": 104327, "epoch": 1256} {"train_loss": -21.8905086517334, "global_step": 104328, "epoch": 1256} {"train_loss": -22.080463409423828, "global_step": 104329, "epoch": 1256} {"train_loss": -21.923763183226068, "global_step": 104330, "epoch": 1256, "val_loss": 6097150.0} {"train_loss": -22.071584701538086, "global_step": 104331, "epoch": 1257} {"train_loss": -22.42486000061035, "global_step": 104332, "epoch": 1257} {"train_loss": -21.7220401763916, "global_step": 104333, "epoch": 1257} {"train_loss": -21.97736167907715, "global_step": 104334, "epoch": 1257} {"train_loss": -22.16291618347168, "global_step": 104335, "epoch": 1257} {"train_loss": -21.996999740600586, "global_step": 104336, "epoch": 1257} {"train_loss": -22.178333282470703, "global_step": 104337, "epoch": 1257} {"train_loss": -21.96953582763672, "global_step": 104338, "epoch": 1257} {"train_loss": -22.344575881958008, "global_step": 104339, "epoch": 1257} {"train_loss": -22.167539596557617, "global_step": 104340, "epoch": 1257} {"train_loss": -22.081464767456055, "global_step": 104341, "epoch": 1257} {"train_loss": -22.02793312072754, "global_step": 104342, "epoch": 1257} {"train_loss": -21.933486938476562, "global_step": 104343, "epoch": 1257} {"train_loss": -21.938861846923828, "global_step": 104344, "epoch": 1257} {"train_loss": -21.90218162536621, "global_step": 104345, "epoch": 1257} {"train_loss": -22.348007202148438, "global_step": 104346, "epoch": 1257} {"train_loss": -22.049930572509766, "global_step": 104347, "epoch": 1257} {"train_loss": -22.25018882751465, "global_step": 104348, "epoch": 1257} {"train_loss": -22.347549438476562, "global_step": 104349, "epoch": 1257} {"train_loss": -22.024002075195312, "global_step": 104350, "epoch": 1257} {"train_loss": -22.023685455322266, "global_step": 104351, "epoch": 1257} {"train_loss": -22.021224975585938, "global_step": 104352, "epoch": 1257} {"train_loss": -22.197912216186523, "global_step": 104353, "epoch": 1257} {"train_loss": -21.858854293823242, "global_step": 104354, "epoch": 1257} {"train_loss": -21.809919357299805, "global_step": 104355, "epoch": 1257} {"train_loss": -21.73421287536621, "global_step": 104356, "epoch": 1257} {"train_loss": -21.880075454711914, "global_step": 104357, "epoch": 1257} {"train_loss": -21.457273483276367, "global_step": 104358, "epoch": 1257} {"train_loss": -22.32148551940918, "global_step": 104359, "epoch": 1257} {"train_loss": -21.93619728088379, "global_step": 104360, "epoch": 1257} {"train_loss": -22.201026916503906, "global_step": 104361, "epoch": 1257} {"train_loss": -21.86446189880371, "global_step": 104362, "epoch": 1257} {"train_loss": -22.396774291992188, "global_step": 104363, "epoch": 1257} {"train_loss": -21.834623336791992, "global_step": 104364, "epoch": 1257} {"train_loss": -21.787410736083984, "global_step": 104365, "epoch": 1257} {"train_loss": -22.1008243560791, "global_step": 104366, "epoch": 1257} {"train_loss": -21.60570526123047, "global_step": 104367, "epoch": 1257} {"train_loss": -22.059951782226562, "global_step": 104368, "epoch": 1257} {"train_loss": -22.313695907592773, "global_step": 104369, "epoch": 1257} {"train_loss": -22.34324836730957, "global_step": 104370, "epoch": 1257} {"train_loss": -21.877124786376953, "global_step": 104371, "epoch": 1257} {"train_loss": -22.164234161376953, "global_step": 104372, "epoch": 1257} {"train_loss": -21.862911224365234, "global_step": 104373, "epoch": 1257} {"train_loss": -21.952390670776367, "global_step": 104374, "epoch": 1257} {"train_loss": -22.124479293823242, "global_step": 104375, "epoch": 1257} {"train_loss": -22.212726593017578, "global_step": 104376, "epoch": 1257} {"train_loss": -22.114356994628906, "global_step": 104377, "epoch": 1257} {"train_loss": -22.003219604492188, "global_step": 104378, "epoch": 1257} {"train_loss": -22.071208953857422, "global_step": 104379, "epoch": 1257} {"train_loss": -22.063886642456055, "global_step": 104380, "epoch": 1257} {"train_loss": -21.96543312072754, "global_step": 104381, "epoch": 1257} {"train_loss": -21.579870223999023, "global_step": 104382, "epoch": 1257} {"train_loss": -21.880544662475586, "global_step": 104383, "epoch": 1257} {"train_loss": -22.089599609375, "global_step": 104384, "epoch": 1257} {"train_loss": -21.89499282836914, "global_step": 104385, "epoch": 1257} {"train_loss": -21.440204620361328, "global_step": 104386, "epoch": 1257} {"train_loss": -22.02322769165039, "global_step": 104387, "epoch": 1257} {"train_loss": -22.091083526611328, "global_step": 104388, "epoch": 1257} {"train_loss": -21.79384422302246, "global_step": 104389, "epoch": 1257} {"train_loss": -21.832143783569336, "global_step": 104390, "epoch": 1257} {"train_loss": -22.003273010253906, "global_step": 104391, "epoch": 1257} {"train_loss": -21.772336959838867, "global_step": 104392, "epoch": 1257} {"train_loss": -22.201644897460938, "global_step": 104393, "epoch": 1257} {"train_loss": -21.9342098236084, "global_step": 104394, "epoch": 1257} {"train_loss": -21.843236923217773, "global_step": 104395, "epoch": 1257} {"train_loss": -21.853235244750977, "global_step": 104396, "epoch": 1257} {"train_loss": -22.372472763061523, "global_step": 104397, "epoch": 1257} {"train_loss": -21.732160568237305, "global_step": 104398, "epoch": 1257} {"train_loss": -22.072572708129883, "global_step": 104399, "epoch": 1257} {"train_loss": -22.2570858001709, "global_step": 104400, "epoch": 1257} {"train_loss": -21.897737503051758, "global_step": 104401, "epoch": 1257} {"train_loss": -22.43241310119629, "global_step": 104402, "epoch": 1257} {"train_loss": -22.05249786376953, "global_step": 104403, "epoch": 1257} {"train_loss": -22.404279708862305, "global_step": 104404, "epoch": 1257} {"train_loss": -21.86653709411621, "global_step": 104405, "epoch": 1257} {"train_loss": -22.04970932006836, "global_step": 104406, "epoch": 1257} {"train_loss": -22.065523147583008, "global_step": 104407, "epoch": 1257} {"train_loss": -22.276287078857422, "global_step": 104408, "epoch": 1257} {"train_loss": -22.245174407958984, "global_step": 104409, "epoch": 1257} {"train_loss": -22.18805503845215, "global_step": 104410, "epoch": 1257} {"train_loss": -21.952194213867188, "global_step": 104411, "epoch": 1257} {"train_loss": -21.989856719970703, "global_step": 104412, "epoch": 1257} {"train_loss": -22.03071674668645, "global_step": 104413, "epoch": 1257, "val_loss": 6170071.5} {"train_loss": -21.376609802246094, "global_step": 104414, "epoch": 1258} {"train_loss": -21.253376007080078, "global_step": 104415, "epoch": 1258} {"train_loss": -21.319807052612305, "global_step": 104416, "epoch": 1258} {"train_loss": -21.80923843383789, "global_step": 104417, "epoch": 1258} {"train_loss": -21.718381881713867, "global_step": 104418, "epoch": 1258} {"train_loss": -21.740299224853516, "global_step": 104419, "epoch": 1258} {"train_loss": -21.730012893676758, "global_step": 104420, "epoch": 1258} {"train_loss": -21.637052536010742, "global_step": 104421, "epoch": 1258} {"train_loss": -21.88702964782715, "global_step": 104422, "epoch": 1258} {"train_loss": -22.026811599731445, "global_step": 104423, "epoch": 1258} {"train_loss": -21.652883529663086, "global_step": 104424, "epoch": 1258} {"train_loss": -22.004276275634766, "global_step": 104425, "epoch": 1258} {"train_loss": -21.79619789123535, "global_step": 104426, "epoch": 1258} {"train_loss": -21.95099449157715, "global_step": 104427, "epoch": 1258} {"train_loss": -21.89251136779785, "global_step": 104428, "epoch": 1258} {"train_loss": -21.9743709564209, "global_step": 104429, "epoch": 1258} {"train_loss": -22.032791137695312, "global_step": 104430, "epoch": 1258} {"train_loss": -22.45344352722168, "global_step": 104431, "epoch": 1258} {"train_loss": -21.92057228088379, "global_step": 104432, "epoch": 1258} {"train_loss": -22.117712020874023, "global_step": 104433, "epoch": 1258} {"train_loss": -22.402908325195312, "global_step": 104434, "epoch": 1258} {"train_loss": -22.613039016723633, "global_step": 104435, "epoch": 1258} {"train_loss": -22.000110626220703, "global_step": 104436, "epoch": 1258} {"train_loss": -22.1403865814209, "global_step": 104437, "epoch": 1258} {"train_loss": -21.837303161621094, "global_step": 104438, "epoch": 1258} {"train_loss": -22.023563385009766, "global_step": 104439, "epoch": 1258} {"train_loss": -22.158967971801758, "global_step": 104440, "epoch": 1258} {"train_loss": -22.054887771606445, "global_step": 104441, "epoch": 1258} {"train_loss": -22.031126022338867, "global_step": 104442, "epoch": 1258} {"train_loss": -22.124013900756836, "global_step": 104443, "epoch": 1258} {"train_loss": -21.95013999938965, "global_step": 104444, "epoch": 1258} {"train_loss": -22.169849395751953, "global_step": 104445, "epoch": 1258} {"train_loss": -21.995298385620117, "global_step": 104446, "epoch": 1258} {"train_loss": -22.4749755859375, "global_step": 104447, "epoch": 1258} {"train_loss": -21.620410919189453, "global_step": 104448, "epoch": 1258} {"train_loss": -21.696720123291016, "global_step": 104449, "epoch": 1258} {"train_loss": -21.81793975830078, "global_step": 104450, "epoch": 1258} {"train_loss": -21.77960777282715, "global_step": 104451, "epoch": 1258} {"train_loss": -21.75418472290039, "global_step": 104452, "epoch": 1258} {"train_loss": -22.25974464416504, "global_step": 104453, "epoch": 1258} {"train_loss": -22.41744041442871, "global_step": 104454, "epoch": 1258} {"train_loss": -22.11466407775879, "global_step": 104455, "epoch": 1258} {"train_loss": -22.415847778320312, "global_step": 104456, "epoch": 1258} {"train_loss": -21.565080642700195, "global_step": 104457, "epoch": 1258} {"train_loss": -22.159137725830078, "global_step": 104458, "epoch": 1258} {"train_loss": -22.105627059936523, "global_step": 104459, "epoch": 1258} {"train_loss": -22.23236656188965, "global_step": 104460, "epoch": 1258} {"train_loss": -22.46844482421875, "global_step": 104461, "epoch": 1258} {"train_loss": -22.383047103881836, "global_step": 104462, "epoch": 1258} {"train_loss": -22.147953033447266, "global_step": 104463, "epoch": 1258} {"train_loss": -21.973501205444336, "global_step": 104464, "epoch": 1258} {"train_loss": -22.28876304626465, "global_step": 104465, "epoch": 1258} {"train_loss": -22.102916717529297, "global_step": 104466, "epoch": 1258} {"train_loss": -22.32212257385254, "global_step": 104467, "epoch": 1258} {"train_loss": -21.886062622070312, "global_step": 104468, "epoch": 1258} {"train_loss": -22.276601791381836, "global_step": 104469, "epoch": 1258} {"train_loss": -21.83778953552246, "global_step": 104470, "epoch": 1258} {"train_loss": -21.909738540649414, "global_step": 104471, "epoch": 1258} {"train_loss": -22.028736114501953, "global_step": 104472, "epoch": 1258} {"train_loss": -22.050466537475586, "global_step": 104473, "epoch": 1258} {"train_loss": -22.156904220581055, "global_step": 104474, "epoch": 1258} {"train_loss": -21.95958709716797, "global_step": 104475, "epoch": 1258} {"train_loss": -22.011281967163086, "global_step": 104476, "epoch": 1258} {"train_loss": -21.862401962280273, "global_step": 104477, "epoch": 1258} {"train_loss": -22.079334259033203, "global_step": 104478, "epoch": 1258} {"train_loss": -22.44670295715332, "global_step": 104479, "epoch": 1258} {"train_loss": -22.005008697509766, "global_step": 104480, "epoch": 1258} {"train_loss": -22.106191635131836, "global_step": 104481, "epoch": 1258} {"train_loss": -21.785249710083008, "global_step": 104482, "epoch": 1258} {"train_loss": -22.04904556274414, "global_step": 104483, "epoch": 1258} {"train_loss": -22.0930233001709, "global_step": 104484, "epoch": 1258} {"train_loss": -21.984771728515625, "global_step": 104485, "epoch": 1258} {"train_loss": -21.98910140991211, "global_step": 104486, "epoch": 1258} {"train_loss": -22.079816818237305, "global_step": 104487, "epoch": 1258} {"train_loss": -21.724515914916992, "global_step": 104488, "epoch": 1258} {"train_loss": -21.79249382019043, "global_step": 104489, "epoch": 1258} {"train_loss": -22.04741859436035, "global_step": 104490, "epoch": 1258} {"train_loss": -22.013090133666992, "global_step": 104491, "epoch": 1258} {"train_loss": -21.73896598815918, "global_step": 104492, "epoch": 1258} {"train_loss": -21.98209571838379, "global_step": 104493, "epoch": 1258} {"train_loss": -22.02290153503418, "global_step": 104494, "epoch": 1258} {"train_loss": -21.872486114501953, "global_step": 104495, "epoch": 1258} {"train_loss": -22.00258795037327, "global_step": 104496, "epoch": 1258, "val_loss": 6112920.0} {"train_loss": -22.293222427368164, "global_step": 104497, "epoch": 1259} {"train_loss": -21.8062686920166, "global_step": 104498, "epoch": 1259} {"train_loss": -22.317951202392578, "global_step": 104499, "epoch": 1259} {"train_loss": -22.121932983398438, "global_step": 104500, "epoch": 1259} {"train_loss": -21.889577865600586, "global_step": 104501, "epoch": 1259} {"train_loss": -21.965238571166992, "global_step": 104502, "epoch": 1259} {"train_loss": -21.923646926879883, "global_step": 104503, "epoch": 1259} {"train_loss": -22.145980834960938, "global_step": 104504, "epoch": 1259} {"train_loss": -22.02540397644043, "global_step": 104505, "epoch": 1259} {"train_loss": -21.56498908996582, "global_step": 104506, "epoch": 1259} {"train_loss": -21.83814811706543, "global_step": 104507, "epoch": 1259} {"train_loss": -21.95343780517578, "global_step": 104508, "epoch": 1259} {"train_loss": -21.734060287475586, "global_step": 104509, "epoch": 1259} {"train_loss": -22.043458938598633, "global_step": 104510, "epoch": 1259} {"train_loss": -21.918352127075195, "global_step": 104511, "epoch": 1259} {"train_loss": -21.644485473632812, "global_step": 104512, "epoch": 1259} {"train_loss": -21.800506591796875, "global_step": 104513, "epoch": 1259} {"train_loss": -21.97478675842285, "global_step": 104514, "epoch": 1259} {"train_loss": -21.968856811523438, "global_step": 104515, "epoch": 1259} {"train_loss": -22.262924194335938, "global_step": 104516, "epoch": 1259} {"train_loss": -21.87420082092285, "global_step": 104517, "epoch": 1259} {"train_loss": -22.101587295532227, "global_step": 104518, "epoch": 1259} {"train_loss": -22.08906364440918, "global_step": 104519, "epoch": 1259} {"train_loss": -22.000492095947266, "global_step": 104520, "epoch": 1259} {"train_loss": -21.887287139892578, "global_step": 104521, "epoch": 1259} {"train_loss": -22.274580001831055, "global_step": 104522, "epoch": 1259} {"train_loss": -22.39128875732422, "global_step": 104523, "epoch": 1259} {"train_loss": -22.062652587890625, "global_step": 104524, "epoch": 1259} {"train_loss": -22.218069076538086, "global_step": 104525, "epoch": 1259} {"train_loss": -22.412216186523438, "global_step": 104526, "epoch": 1259} {"train_loss": -22.292699813842773, "global_step": 104527, "epoch": 1259} {"train_loss": -22.148330688476562, "global_step": 104528, "epoch": 1259} {"train_loss": -22.01051902770996, "global_step": 104529, "epoch": 1259} {"train_loss": -22.27237319946289, "global_step": 104530, "epoch": 1259} {"train_loss": -21.952417373657227, "global_step": 104531, "epoch": 1259} {"train_loss": -22.325176239013672, "global_step": 104532, "epoch": 1259} {"train_loss": -22.016401290893555, "global_step": 104533, "epoch": 1259} {"train_loss": -22.4857234954834, "global_step": 104534, "epoch": 1259} {"train_loss": -22.394500732421875, "global_step": 104535, "epoch": 1259} {"train_loss": -22.120019912719727, "global_step": 104536, "epoch": 1259} {"train_loss": -21.94632339477539, "global_step": 104537, "epoch": 1259} {"train_loss": -21.73920249938965, "global_step": 104538, "epoch": 1259} {"train_loss": -21.78778648376465, "global_step": 104539, "epoch": 1259} {"train_loss": -22.278593063354492, "global_step": 104540, "epoch": 1259} {"train_loss": -21.989511489868164, "global_step": 104541, "epoch": 1259} {"train_loss": -22.40790557861328, "global_step": 104542, "epoch": 1259} {"train_loss": -21.98288345336914, "global_step": 104543, "epoch": 1259} {"train_loss": -21.809162139892578, "global_step": 104544, "epoch": 1259} {"train_loss": -22.321210861206055, "global_step": 104545, "epoch": 1259} {"train_loss": -22.18222999572754, "global_step": 104546, "epoch": 1259} {"train_loss": -22.19496726989746, "global_step": 104547, "epoch": 1259} {"train_loss": -22.045438766479492, "global_step": 104548, "epoch": 1259} {"train_loss": -21.994054794311523, "global_step": 104549, "epoch": 1259} {"train_loss": -22.381471633911133, "global_step": 104550, "epoch": 1259} {"train_loss": -22.209341049194336, "global_step": 104551, "epoch": 1259} {"train_loss": -22.007131576538086, "global_step": 104552, "epoch": 1259} {"train_loss": -22.11389923095703, "global_step": 104553, "epoch": 1259} {"train_loss": -21.973115921020508, "global_step": 104554, "epoch": 1259} {"train_loss": -21.77535057067871, "global_step": 104555, "epoch": 1259} {"train_loss": -22.011167526245117, "global_step": 104556, "epoch": 1259} {"train_loss": -22.076650619506836, "global_step": 104557, "epoch": 1259} {"train_loss": -21.886362075805664, "global_step": 104558, "epoch": 1259} {"train_loss": -22.412546157836914, "global_step": 104559, "epoch": 1259} {"train_loss": -21.960948944091797, "global_step": 104560, "epoch": 1259} {"train_loss": -21.903635025024414, "global_step": 104561, "epoch": 1259} {"train_loss": -22.13818359375, "global_step": 104562, "epoch": 1259} {"train_loss": -22.145795822143555, "global_step": 104563, "epoch": 1259} {"train_loss": -22.429248809814453, "global_step": 104564, "epoch": 1259} {"train_loss": -21.88442039489746, "global_step": 104565, "epoch": 1259} {"train_loss": -22.35239028930664, "global_step": 104566, "epoch": 1259} {"train_loss": -22.34783935546875, "global_step": 104567, "epoch": 1259} {"train_loss": -21.925739288330078, "global_step": 104568, "epoch": 1259} {"train_loss": -21.953149795532227, "global_step": 104569, "epoch": 1259} {"train_loss": -21.925058364868164, "global_step": 104570, "epoch": 1259} {"train_loss": -22.445707321166992, "global_step": 104571, "epoch": 1259} {"train_loss": -22.074996948242188, "global_step": 104572, "epoch": 1259} {"train_loss": -21.960447311401367, "global_step": 104573, "epoch": 1259} {"train_loss": -21.821596145629883, "global_step": 104574, "epoch": 1259} {"train_loss": -21.97469139099121, "global_step": 104575, "epoch": 1259} {"train_loss": -22.278934478759766, "global_step": 104576, "epoch": 1259} {"train_loss": -22.118139266967773, "global_step": 104577, "epoch": 1259} {"train_loss": -21.99847984313965, "global_step": 104578, "epoch": 1259} {"train_loss": -22.078518878982727, "global_step": 104579, "epoch": 1259, "val_loss": 6012527.0} {"train_loss": -21.261962890625, "global_step": 104580, "epoch": 1260} {"train_loss": -21.405920028686523, "global_step": 104581, "epoch": 1260} {"train_loss": -20.972881317138672, "global_step": 104582, "epoch": 1260} {"train_loss": -21.65549087524414, "global_step": 104583, "epoch": 1260} {"train_loss": -21.699331283569336, "global_step": 104584, "epoch": 1260} {"train_loss": -21.23087501525879, "global_step": 104585, "epoch": 1260} {"train_loss": -21.740055084228516, "global_step": 104586, "epoch": 1260} {"train_loss": -21.61005973815918, "global_step": 104587, "epoch": 1260} {"train_loss": -21.46607780456543, "global_step": 104588, "epoch": 1260} {"train_loss": -21.819570541381836, "global_step": 104589, "epoch": 1260} {"train_loss": -21.721298217773438, "global_step": 104590, "epoch": 1260} {"train_loss": -21.487443923950195, "global_step": 104591, "epoch": 1260} {"train_loss": -21.897916793823242, "global_step": 104592, "epoch": 1260} {"train_loss": -21.569686889648438, "global_step": 104593, "epoch": 1260} {"train_loss": -21.81427001953125, "global_step": 104594, "epoch": 1260} {"train_loss": -22.048078536987305, "global_step": 104595, "epoch": 1260} {"train_loss": -21.877531051635742, "global_step": 104596, "epoch": 1260} {"train_loss": -21.818233489990234, "global_step": 104597, "epoch": 1260} {"train_loss": -21.56422233581543, "global_step": 104598, "epoch": 1260} {"train_loss": -21.682292938232422, "global_step": 104599, "epoch": 1260} {"train_loss": -21.943878173828125, "global_step": 104600, "epoch": 1260} {"train_loss": -22.137218475341797, "global_step": 104601, "epoch": 1260} {"train_loss": -21.990942001342773, "global_step": 104602, "epoch": 1260} {"train_loss": -21.739084243774414, "global_step": 104603, "epoch": 1260} {"train_loss": -22.279306411743164, "global_step": 104604, "epoch": 1260} {"train_loss": -21.875930786132812, "global_step": 104605, "epoch": 1260} {"train_loss": -22.456884384155273, "global_step": 104606, "epoch": 1260} {"train_loss": -21.90223503112793, "global_step": 104607, "epoch": 1260} {"train_loss": -22.38093376159668, "global_step": 104608, "epoch": 1260} {"train_loss": -21.978300094604492, "global_step": 104609, "epoch": 1260} {"train_loss": -21.787220001220703, "global_step": 104610, "epoch": 1260} {"train_loss": -22.197736740112305, "global_step": 104611, "epoch": 1260} {"train_loss": -21.927915573120117, "global_step": 104612, "epoch": 1260} {"train_loss": -22.499731063842773, "global_step": 104613, "epoch": 1260} {"train_loss": -21.936172485351562, "global_step": 104614, "epoch": 1260} {"train_loss": -22.292200088500977, "global_step": 104615, "epoch": 1260} {"train_loss": -22.007909774780273, "global_step": 104616, "epoch": 1260} {"train_loss": -22.020282745361328, "global_step": 104617, "epoch": 1260} {"train_loss": -22.028207778930664, "global_step": 104618, "epoch": 1260} {"train_loss": -22.106426239013672, "global_step": 104619, "epoch": 1260} {"train_loss": -21.777969360351562, "global_step": 104620, "epoch": 1260} {"train_loss": -21.81792640686035, "global_step": 104621, "epoch": 1260} {"train_loss": -21.957212448120117, "global_step": 104622, "epoch": 1260} {"train_loss": -21.953771591186523, "global_step": 104623, "epoch": 1260} {"train_loss": -22.113544464111328, "global_step": 104624, "epoch": 1260} {"train_loss": -22.130680084228516, "global_step": 104625, "epoch": 1260} {"train_loss": -22.156463623046875, "global_step": 104626, "epoch": 1260} {"train_loss": -22.118701934814453, "global_step": 104627, "epoch": 1260} {"train_loss": -22.027223587036133, "global_step": 104628, "epoch": 1260} {"train_loss": -22.14127540588379, "global_step": 104629, "epoch": 1260} {"train_loss": -22.098926544189453, "global_step": 104630, "epoch": 1260} {"train_loss": -22.220943450927734, "global_step": 104631, "epoch": 1260} {"train_loss": -22.014842987060547, "global_step": 104632, "epoch": 1260} {"train_loss": -22.46893310546875, "global_step": 104633, "epoch": 1260} {"train_loss": -21.81988525390625, "global_step": 104634, "epoch": 1260} {"train_loss": -22.42483901977539, "global_step": 104635, "epoch": 1260} {"train_loss": -21.810632705688477, "global_step": 104636, "epoch": 1260} {"train_loss": -22.14171600341797, "global_step": 104637, "epoch": 1260} {"train_loss": -21.88703727722168, "global_step": 104638, "epoch": 1260} {"train_loss": -22.03632926940918, "global_step": 104639, "epoch": 1260} {"train_loss": -21.816091537475586, "global_step": 104640, "epoch": 1260} {"train_loss": -21.78788185119629, "global_step": 104641, "epoch": 1260} {"train_loss": -21.869844436645508, "global_step": 104642, "epoch": 1260} {"train_loss": -22.133106231689453, "global_step": 104643, "epoch": 1260} {"train_loss": -21.94466781616211, "global_step": 104644, "epoch": 1260} {"train_loss": -22.050609588623047, "global_step": 104645, "epoch": 1260} {"train_loss": -21.991796493530273, "global_step": 104646, "epoch": 1260} {"train_loss": -21.958066940307617, "global_step": 104647, "epoch": 1260} {"train_loss": -22.303077697753906, "global_step": 104648, "epoch": 1260} {"train_loss": -22.050634384155273, "global_step": 104649, "epoch": 1260} {"train_loss": -21.955617904663086, "global_step": 104650, "epoch": 1260} {"train_loss": -21.588611602783203, "global_step": 104651, "epoch": 1260} {"train_loss": -22.056211471557617, "global_step": 104652, "epoch": 1260} {"train_loss": -21.677474975585938, "global_step": 104653, "epoch": 1260} {"train_loss": -22.514223098754883, "global_step": 104654, "epoch": 1260} {"train_loss": -22.18104362487793, "global_step": 104655, "epoch": 1260} {"train_loss": -22.293941497802734, "global_step": 104656, "epoch": 1260} {"train_loss": -22.392166137695312, "global_step": 104657, "epoch": 1260} {"train_loss": -21.724363327026367, "global_step": 104658, "epoch": 1260} {"train_loss": -21.984268188476562, "global_step": 104659, "epoch": 1260} {"train_loss": -21.981393814086914, "global_step": 104660, "epoch": 1260} {"train_loss": -22.07633399963379, "global_step": 104661, "epoch": 1260} {"train_loss": -21.949400108980846, "global_step": 104662, "epoch": 1260, "val_loss": 6229293.0} {"train_loss": -20.727807998657227, "global_step": 104663, "epoch": 1261} {"train_loss": -20.853775024414062, "global_step": 104664, "epoch": 1261} {"train_loss": -21.272541046142578, "global_step": 104665, "epoch": 1261} {"train_loss": -20.822349548339844, "global_step": 104666, "epoch": 1261} {"train_loss": -21.730985641479492, "global_step": 104667, "epoch": 1261} {"train_loss": -20.93912124633789, "global_step": 104668, "epoch": 1261} {"train_loss": -21.418516159057617, "global_step": 104669, "epoch": 1261} {"train_loss": -21.398639678955078, "global_step": 104670, "epoch": 1261} {"train_loss": -21.485212326049805, "global_step": 104671, "epoch": 1261} {"train_loss": -21.5820255279541, "global_step": 104672, "epoch": 1261} {"train_loss": -21.4949893951416, "global_step": 104673, "epoch": 1261} {"train_loss": -21.64381980895996, "global_step": 104674, "epoch": 1261} {"train_loss": -21.480173110961914, "global_step": 104675, "epoch": 1261} {"train_loss": -21.567365646362305, "global_step": 104676, "epoch": 1261} {"train_loss": -21.532224655151367, "global_step": 104677, "epoch": 1261} {"train_loss": -21.401334762573242, "global_step": 104678, "epoch": 1261} {"train_loss": -21.69106674194336, "global_step": 104679, "epoch": 1261} {"train_loss": -21.634328842163086, "global_step": 104680, "epoch": 1261} {"train_loss": -21.699953079223633, "global_step": 104681, "epoch": 1261} {"train_loss": -21.58188247680664, "global_step": 104682, "epoch": 1261} {"train_loss": -21.872838973999023, "global_step": 104683, "epoch": 1261} {"train_loss": -22.037893295288086, "global_step": 104684, "epoch": 1261} {"train_loss": -21.8806209564209, "global_step": 104685, "epoch": 1261} {"train_loss": -21.6414852142334, "global_step": 104686, "epoch": 1261} {"train_loss": -21.659067153930664, "global_step": 104687, "epoch": 1261} {"train_loss": -21.595232009887695, "global_step": 104688, "epoch": 1261} {"train_loss": -21.76742172241211, "global_step": 104689, "epoch": 1261} {"train_loss": -21.864099502563477, "global_step": 104690, "epoch": 1261} {"train_loss": -22.343475341796875, "global_step": 104691, "epoch": 1261} {"train_loss": -22.08376121520996, "global_step": 104692, "epoch": 1261} {"train_loss": -22.124738693237305, "global_step": 104693, "epoch": 1261} {"train_loss": -21.976001739501953, "global_step": 104694, "epoch": 1261} {"train_loss": -22.075294494628906, "global_step": 104695, "epoch": 1261} {"train_loss": -22.433029174804688, "global_step": 104696, "epoch": 1261} {"train_loss": -21.868762969970703, "global_step": 104697, "epoch": 1261} {"train_loss": -22.190092086791992, "global_step": 104698, "epoch": 1261} {"train_loss": -21.98780632019043, "global_step": 104699, "epoch": 1261} {"train_loss": -22.3615665435791, "global_step": 104700, "epoch": 1261} {"train_loss": -22.1660213470459, "global_step": 104701, "epoch": 1261} {"train_loss": -22.173751831054688, "global_step": 104702, "epoch": 1261} {"train_loss": -22.11200523376465, "global_step": 104703, "epoch": 1261} {"train_loss": -22.253210067749023, "global_step": 104704, "epoch": 1261} {"train_loss": -22.213632583618164, "global_step": 104705, "epoch": 1261} {"train_loss": -21.870534896850586, "global_step": 104706, "epoch": 1261} {"train_loss": -22.43341636657715, "global_step": 104707, "epoch": 1261} {"train_loss": -22.169862747192383, "global_step": 104708, "epoch": 1261} {"train_loss": -22.003110885620117, "global_step": 104709, "epoch": 1261} {"train_loss": -21.99151039123535, "global_step": 104710, "epoch": 1261} {"train_loss": -22.1599063873291, "global_step": 104711, "epoch": 1261} {"train_loss": -21.962942123413086, "global_step": 104712, "epoch": 1261} {"train_loss": -21.877548217773438, "global_step": 104713, "epoch": 1261} {"train_loss": -22.209035873413086, "global_step": 104714, "epoch": 1261} {"train_loss": -22.249069213867188, "global_step": 104715, "epoch": 1261} {"train_loss": -22.320144653320312, "global_step": 104716, "epoch": 1261} {"train_loss": -21.807302474975586, "global_step": 104717, "epoch": 1261} {"train_loss": -22.260570526123047, "global_step": 104718, "epoch": 1261} {"train_loss": -22.23516273498535, "global_step": 104719, "epoch": 1261} {"train_loss": -22.284942626953125, "global_step": 104720, "epoch": 1261} {"train_loss": -22.1286678314209, "global_step": 104721, "epoch": 1261} {"train_loss": -21.809371948242188, "global_step": 104722, "epoch": 1261} {"train_loss": -21.92734718322754, "global_step": 104723, "epoch": 1261} {"train_loss": -22.211750030517578, "global_step": 104724, "epoch": 1261} {"train_loss": -22.04587745666504, "global_step": 104725, "epoch": 1261} {"train_loss": -22.048696517944336, "global_step": 104726, "epoch": 1261} {"train_loss": -22.2940673828125, "global_step": 104727, "epoch": 1261} {"train_loss": -21.950363159179688, "global_step": 104728, "epoch": 1261} {"train_loss": -21.649005889892578, "global_step": 104729, "epoch": 1261} {"train_loss": -22.068723678588867, "global_step": 104730, "epoch": 1261} {"train_loss": -22.30826759338379, "global_step": 104731, "epoch": 1261} {"train_loss": -21.794504165649414, "global_step": 104732, "epoch": 1261} {"train_loss": -21.938091278076172, "global_step": 104733, "epoch": 1261} {"train_loss": -21.8470516204834, "global_step": 104734, "epoch": 1261} {"train_loss": -21.88686752319336, "global_step": 104735, "epoch": 1261} {"train_loss": -21.89813232421875, "global_step": 104736, "epoch": 1261} {"train_loss": -21.673398971557617, "global_step": 104737, "epoch": 1261} {"train_loss": -22.445188522338867, "global_step": 104738, "epoch": 1261} {"train_loss": -22.345458984375, "global_step": 104739, "epoch": 1261} {"train_loss": -21.84050941467285, "global_step": 104740, "epoch": 1261} {"train_loss": -21.858959197998047, "global_step": 104741, "epoch": 1261} {"train_loss": -21.700960159301758, "global_step": 104742, "epoch": 1261} {"train_loss": -22.058874130249023, "global_step": 104743, "epoch": 1261} {"train_loss": -21.896577835083008, "global_step": 104744, "epoch": 1261} {"train_loss": -21.883917291480376, "global_step": 104745, "epoch": 1261, "val_loss": 6249891.0} {"train_loss": -21.71511459350586, "global_step": 104746, "epoch": 1262} {"train_loss": -21.719480514526367, "global_step": 104747, "epoch": 1262} {"train_loss": -21.470840454101562, "global_step": 104748, "epoch": 1262} {"train_loss": -21.236494064331055, "global_step": 104749, "epoch": 1262} {"train_loss": -21.87546157836914, "global_step": 104750, "epoch": 1262} {"train_loss": -21.703527450561523, "global_step": 104751, "epoch": 1262} {"train_loss": -21.845691680908203, "global_step": 104752, "epoch": 1262} {"train_loss": -21.908248901367188, "global_step": 104753, "epoch": 1262} {"train_loss": -21.91948890686035, "global_step": 104754, "epoch": 1262} {"train_loss": -21.589567184448242, "global_step": 104755, "epoch": 1262} {"train_loss": -21.354324340820312, "global_step": 104756, "epoch": 1262} {"train_loss": -22.07324981689453, "global_step": 104757, "epoch": 1262} {"train_loss": -21.939559936523438, "global_step": 104758, "epoch": 1262} {"train_loss": -21.762781143188477, "global_step": 104759, "epoch": 1262} {"train_loss": -21.828231811523438, "global_step": 104760, "epoch": 1262} {"train_loss": -22.013090133666992, "global_step": 104761, "epoch": 1262} {"train_loss": -21.67972755432129, "global_step": 104762, "epoch": 1262} {"train_loss": -21.688688278198242, "global_step": 104763, "epoch": 1262} {"train_loss": -21.358604431152344, "global_step": 104764, "epoch": 1262} {"train_loss": -21.468229293823242, "global_step": 104765, "epoch": 1262} {"train_loss": -21.680387496948242, "global_step": 104766, "epoch": 1262} {"train_loss": -21.75516700744629, "global_step": 104767, "epoch": 1262} {"train_loss": -21.85880470275879, "global_step": 104768, "epoch": 1262} {"train_loss": -21.481016159057617, "global_step": 104769, "epoch": 1262} {"train_loss": -21.966623306274414, "global_step": 104770, "epoch": 1262} {"train_loss": -22.277212142944336, "global_step": 104771, "epoch": 1262} {"train_loss": -22.10873031616211, "global_step": 104772, "epoch": 1262} {"train_loss": -21.822416305541992, "global_step": 104773, "epoch": 1262} {"train_loss": -22.163562774658203, "global_step": 104774, "epoch": 1262} {"train_loss": -22.04559326171875, "global_step": 104775, "epoch": 1262} {"train_loss": -22.02071189880371, "global_step": 104776, "epoch": 1262} {"train_loss": -21.90250015258789, "global_step": 104777, "epoch": 1262} {"train_loss": -22.02721405029297, "global_step": 104778, "epoch": 1262} {"train_loss": -22.081274032592773, "global_step": 104779, "epoch": 1262} {"train_loss": -22.283727645874023, "global_step": 104780, "epoch": 1262} {"train_loss": -21.86174774169922, "global_step": 104781, "epoch": 1262} {"train_loss": -22.177030563354492, "global_step": 104782, "epoch": 1262} {"train_loss": -21.866384506225586, "global_step": 104783, "epoch": 1262} {"train_loss": -22.38532257080078, "global_step": 104784, "epoch": 1262} {"train_loss": -22.295541763305664, "global_step": 104785, "epoch": 1262} {"train_loss": -22.456939697265625, "global_step": 104786, "epoch": 1262} {"train_loss": -22.07533073425293, "global_step": 104787, "epoch": 1262} {"train_loss": -21.96790885925293, "global_step": 104788, "epoch": 1262} {"train_loss": -22.120811462402344, "global_step": 104789, "epoch": 1262} {"train_loss": -22.25370216369629, "global_step": 104790, "epoch": 1262} {"train_loss": -21.979963302612305, "global_step": 104791, "epoch": 1262} {"train_loss": -22.36195182800293, "global_step": 104792, "epoch": 1262} {"train_loss": -22.103899002075195, "global_step": 104793, "epoch": 1262} {"train_loss": -22.1646785736084, "global_step": 104794, "epoch": 1262} {"train_loss": -22.1416072845459, "global_step": 104795, "epoch": 1262} {"train_loss": -22.08243179321289, "global_step": 104796, "epoch": 1262} {"train_loss": -21.880483627319336, "global_step": 104797, "epoch": 1262} {"train_loss": -21.788681030273438, "global_step": 104798, "epoch": 1262} {"train_loss": -22.45404624938965, "global_step": 104799, "epoch": 1262} {"train_loss": -22.248159408569336, "global_step": 104800, "epoch": 1262} {"train_loss": -22.084897994995117, "global_step": 104801, "epoch": 1262} {"train_loss": -22.379240036010742, "global_step": 104802, "epoch": 1262} {"train_loss": -22.255842208862305, "global_step": 104803, "epoch": 1262} {"train_loss": -21.89165687561035, "global_step": 104804, "epoch": 1262} {"train_loss": -21.69887351989746, "global_step": 104805, "epoch": 1262} {"train_loss": -22.287107467651367, "global_step": 104806, "epoch": 1262} {"train_loss": -21.931163787841797, "global_step": 104807, "epoch": 1262} {"train_loss": -22.020849227905273, "global_step": 104808, "epoch": 1262} {"train_loss": -22.063562393188477, "global_step": 104809, "epoch": 1262} {"train_loss": -21.896162033081055, "global_step": 104810, "epoch": 1262} {"train_loss": -21.82122802734375, "global_step": 104811, "epoch": 1262} {"train_loss": -22.224111557006836, "global_step": 104812, "epoch": 1262} {"train_loss": -21.76356315612793, "global_step": 104813, "epoch": 1262} {"train_loss": -21.791492462158203, "global_step": 104814, "epoch": 1262} {"train_loss": -22.184194564819336, "global_step": 104815, "epoch": 1262} {"train_loss": -22.28817367553711, "global_step": 104816, "epoch": 1262} {"train_loss": -22.29627799987793, "global_step": 104817, "epoch": 1262} {"train_loss": -22.238595962524414, "global_step": 104818, "epoch": 1262} {"train_loss": -22.13309097290039, "global_step": 104819, "epoch": 1262} {"train_loss": -22.131601333618164, "global_step": 104820, "epoch": 1262} {"train_loss": -22.022958755493164, "global_step": 104821, "epoch": 1262} {"train_loss": -22.118839263916016, "global_step": 104822, "epoch": 1262} {"train_loss": -21.933712005615234, "global_step": 104823, "epoch": 1262} {"train_loss": -21.865873336791992, "global_step": 104824, "epoch": 1262} {"train_loss": -21.8489990234375, "global_step": 104825, "epoch": 1262} {"train_loss": -22.167356491088867, "global_step": 104826, "epoch": 1262} {"train_loss": -21.710041046142578, "global_step": 104827, "epoch": 1262} {"train_loss": -21.977608715195252, "global_step": 104828, "epoch": 1262, "val_loss": 6141216.0} {"train_loss": -21.884830474853516, "global_step": 104829, "epoch": 1263} {"train_loss": -21.70680809020996, "global_step": 104830, "epoch": 1263} {"train_loss": -21.600921630859375, "global_step": 104831, "epoch": 1263} {"train_loss": -21.58491325378418, "global_step": 104832, "epoch": 1263} {"train_loss": -21.660751342773438, "global_step": 104833, "epoch": 1263} {"train_loss": -21.83893585205078, "global_step": 104834, "epoch": 1263} {"train_loss": -22.444686889648438, "global_step": 104835, "epoch": 1263} {"train_loss": -21.840869903564453, "global_step": 104836, "epoch": 1263} {"train_loss": -21.699010848999023, "global_step": 104837, "epoch": 1263} {"train_loss": -21.68983268737793, "global_step": 104838, "epoch": 1263} {"train_loss": -21.782535552978516, "global_step": 104839, "epoch": 1263} {"train_loss": -21.957622528076172, "global_step": 104840, "epoch": 1263} {"train_loss": -21.901025772094727, "global_step": 104841, "epoch": 1263} {"train_loss": -22.00653076171875, "global_step": 104842, "epoch": 1263} {"train_loss": -22.288251876831055, "global_step": 104843, "epoch": 1263} {"train_loss": -21.885854721069336, "global_step": 104844, "epoch": 1263} {"train_loss": -21.928237915039062, "global_step": 104845, "epoch": 1263} {"train_loss": -21.939496994018555, "global_step": 104846, "epoch": 1263} {"train_loss": -21.67098617553711, "global_step": 104847, "epoch": 1263} {"train_loss": -22.03731346130371, "global_step": 104848, "epoch": 1263} {"train_loss": -22.090133666992188, "global_step": 104849, "epoch": 1263} {"train_loss": -21.782047271728516, "global_step": 104850, "epoch": 1263} {"train_loss": -22.002607345581055, "global_step": 104851, "epoch": 1263} {"train_loss": -21.859643936157227, "global_step": 104852, "epoch": 1263} {"train_loss": -21.668516159057617, "global_step": 104853, "epoch": 1263} {"train_loss": -22.15810203552246, "global_step": 104854, "epoch": 1263} {"train_loss": -22.013675689697266, "global_step": 104855, "epoch": 1263} {"train_loss": -21.947233200073242, "global_step": 104856, "epoch": 1263} {"train_loss": -22.049951553344727, "global_step": 104857, "epoch": 1263} {"train_loss": -22.18426513671875, "global_step": 104858, "epoch": 1263} {"train_loss": -21.680063247680664, "global_step": 104859, "epoch": 1263} {"train_loss": -22.063013076782227, "global_step": 104860, "epoch": 1263} {"train_loss": -22.100698471069336, "global_step": 104861, "epoch": 1263} {"train_loss": -22.097410202026367, "global_step": 104862, "epoch": 1263} {"train_loss": -22.181751251220703, "global_step": 104863, "epoch": 1263} {"train_loss": -22.320653915405273, "global_step": 104864, "epoch": 1263} {"train_loss": -21.92687225341797, "global_step": 104865, "epoch": 1263} {"train_loss": -22.064960479736328, "global_step": 104866, "epoch": 1263} {"train_loss": -22.40302085876465, "global_step": 104867, "epoch": 1263} {"train_loss": -21.725326538085938, "global_step": 104868, "epoch": 1263} {"train_loss": -22.216276168823242, "global_step": 104869, "epoch": 1263} {"train_loss": -21.940784454345703, "global_step": 104870, "epoch": 1263} {"train_loss": -22.055173873901367, "global_step": 104871, "epoch": 1263} {"train_loss": -22.12047004699707, "global_step": 104872, "epoch": 1263} {"train_loss": -22.013259887695312, "global_step": 104873, "epoch": 1263} {"train_loss": -22.033639907836914, "global_step": 104874, "epoch": 1263} {"train_loss": -22.121845245361328, "global_step": 104875, "epoch": 1263} {"train_loss": -21.98408317565918, "global_step": 104876, "epoch": 1263} {"train_loss": -22.216663360595703, "global_step": 104877, "epoch": 1263} {"train_loss": -22.369550704956055, "global_step": 104878, "epoch": 1263} {"train_loss": -22.354145050048828, "global_step": 104879, "epoch": 1263} {"train_loss": -22.33908462524414, "global_step": 104880, "epoch": 1263} {"train_loss": -22.096372604370117, "global_step": 104881, "epoch": 1263} {"train_loss": -22.46601676940918, "global_step": 104882, "epoch": 1263} {"train_loss": -22.03362464904785, "global_step": 104883, "epoch": 1263} {"train_loss": -22.254484176635742, "global_step": 104884, "epoch": 1263} {"train_loss": -21.77012062072754, "global_step": 104885, "epoch": 1263} {"train_loss": -22.431791305541992, "global_step": 104886, "epoch": 1263} {"train_loss": -22.019107818603516, "global_step": 104887, "epoch": 1263} {"train_loss": -22.008926391601562, "global_step": 104888, "epoch": 1263} {"train_loss": -22.243558883666992, "global_step": 104889, "epoch": 1263} {"train_loss": -22.121084213256836, "global_step": 104890, "epoch": 1263} {"train_loss": -21.87932777404785, "global_step": 104891, "epoch": 1263} {"train_loss": -21.934505462646484, "global_step": 104892, "epoch": 1263} {"train_loss": -21.824377059936523, "global_step": 104893, "epoch": 1263} {"train_loss": -22.43179702758789, "global_step": 104894, "epoch": 1263} {"train_loss": -21.958580017089844, "global_step": 104895, "epoch": 1263} {"train_loss": -22.357187271118164, "global_step": 104896, "epoch": 1263} {"train_loss": -22.53804588317871, "global_step": 104897, "epoch": 1263} {"train_loss": -22.11215591430664, "global_step": 104898, "epoch": 1263} {"train_loss": -22.012659072875977, "global_step": 104899, "epoch": 1263} {"train_loss": -22.229482650756836, "global_step": 104900, "epoch": 1263} {"train_loss": -22.34987449645996, "global_step": 104901, "epoch": 1263} {"train_loss": -21.85878562927246, "global_step": 104902, "epoch": 1263} {"train_loss": -21.88296890258789, "global_step": 104903, "epoch": 1263} {"train_loss": -22.240827560424805, "global_step": 104904, "epoch": 1263} {"train_loss": -22.389755249023438, "global_step": 104905, "epoch": 1263} {"train_loss": -21.95118522644043, "global_step": 104906, "epoch": 1263} {"train_loss": -21.853090286254883, "global_step": 104907, "epoch": 1263} {"train_loss": -21.94708824157715, "global_step": 104908, "epoch": 1263} {"train_loss": -22.10035514831543, "global_step": 104909, "epoch": 1263} {"train_loss": -21.830224990844727, "global_step": 104910, "epoch": 1263} {"train_loss": -22.019190110355975, "global_step": 104911, "epoch": 1263, "val_loss": 6121598.5} {"train_loss": -21.396575927734375, "global_step": 104912, "epoch": 1264} {"train_loss": -21.533462524414062, "global_step": 104913, "epoch": 1264} {"train_loss": -21.764944076538086, "global_step": 104914, "epoch": 1264} {"train_loss": -21.59248161315918, "global_step": 104915, "epoch": 1264} {"train_loss": -21.538848876953125, "global_step": 104916, "epoch": 1264} {"train_loss": -21.776561737060547, "global_step": 104917, "epoch": 1264} {"train_loss": -21.420394897460938, "global_step": 104918, "epoch": 1264} {"train_loss": -21.961597442626953, "global_step": 104919, "epoch": 1264} {"train_loss": -21.655841827392578, "global_step": 104920, "epoch": 1264} {"train_loss": -21.879959106445312, "global_step": 104921, "epoch": 1264} {"train_loss": -21.892736434936523, "global_step": 104922, "epoch": 1264} {"train_loss": -21.715782165527344, "global_step": 104923, "epoch": 1264} {"train_loss": -21.855545043945312, "global_step": 104924, "epoch": 1264} {"train_loss": -21.536096572875977, "global_step": 104925, "epoch": 1264} {"train_loss": -21.53095817565918, "global_step": 104926, "epoch": 1264} {"train_loss": -21.79865264892578, "global_step": 104927, "epoch": 1264} {"train_loss": -21.982160568237305, "global_step": 104928, "epoch": 1264} {"train_loss": -21.767597198486328, "global_step": 104929, "epoch": 1264} {"train_loss": -21.89115333557129, "global_step": 104930, "epoch": 1264} {"train_loss": -21.90423011779785, "global_step": 104931, "epoch": 1264} {"train_loss": -21.97773551940918, "global_step": 104932, "epoch": 1264} {"train_loss": -21.68820571899414, "global_step": 104933, "epoch": 1264} {"train_loss": -21.777551651000977, "global_step": 104934, "epoch": 1264} {"train_loss": -21.881505966186523, "global_step": 104935, "epoch": 1264} {"train_loss": -21.915985107421875, "global_step": 104936, "epoch": 1264} {"train_loss": -21.813745498657227, "global_step": 104937, "epoch": 1264} {"train_loss": -22.18678092956543, "global_step": 104938, "epoch": 1264} {"train_loss": -22.134510040283203, "global_step": 104939, "epoch": 1264} {"train_loss": -21.96329116821289, "global_step": 104940, "epoch": 1264} {"train_loss": -22.42622947692871, "global_step": 104941, "epoch": 1264} {"train_loss": -21.979333877563477, "global_step": 104942, "epoch": 1264} {"train_loss": -22.209762573242188, "global_step": 104943, "epoch": 1264} {"train_loss": -22.1651554107666, "global_step": 104944, "epoch": 1264} {"train_loss": -21.961261749267578, "global_step": 104945, "epoch": 1264} {"train_loss": -22.045591354370117, "global_step": 104946, "epoch": 1264} {"train_loss": -21.95948600769043, "global_step": 104947, "epoch": 1264} {"train_loss": -21.818899154663086, "global_step": 104948, "epoch": 1264} {"train_loss": -21.851667404174805, "global_step": 104949, "epoch": 1264} {"train_loss": -22.229856491088867, "global_step": 104950, "epoch": 1264} {"train_loss": -22.062162399291992, "global_step": 104951, "epoch": 1264} {"train_loss": -21.739791870117188, "global_step": 104952, "epoch": 1264} {"train_loss": -22.1502685546875, "global_step": 104953, "epoch": 1264} {"train_loss": -22.389936447143555, "global_step": 104954, "epoch": 1264} {"train_loss": -22.096511840820312, "global_step": 104955, "epoch": 1264} {"train_loss": -22.512104034423828, "global_step": 104956, "epoch": 1264} {"train_loss": -21.83082389831543, "global_step": 104957, "epoch": 1264} {"train_loss": -22.149736404418945, "global_step": 104958, "epoch": 1264} {"train_loss": -21.97772789001465, "global_step": 104959, "epoch": 1264} {"train_loss": -21.77469825744629, "global_step": 104960, "epoch": 1264} {"train_loss": -21.891630172729492, "global_step": 104961, "epoch": 1264} {"train_loss": -21.905303955078125, "global_step": 104962, "epoch": 1264} {"train_loss": -22.143545150756836, "global_step": 104963, "epoch": 1264} {"train_loss": -22.384756088256836, "global_step": 104964, "epoch": 1264} {"train_loss": -21.87959098815918, "global_step": 104965, "epoch": 1264} {"train_loss": -22.19253921508789, "global_step": 104966, "epoch": 1264} {"train_loss": -22.028858184814453, "global_step": 104967, "epoch": 1264} {"train_loss": -21.97202491760254, "global_step": 104968, "epoch": 1264} {"train_loss": -22.41339111328125, "global_step": 104969, "epoch": 1264} {"train_loss": -21.994626998901367, "global_step": 104970, "epoch": 1264} {"train_loss": -22.609729766845703, "global_step": 104971, "epoch": 1264} {"train_loss": -22.2000732421875, "global_step": 104972, "epoch": 1264} {"train_loss": -22.39954376220703, "global_step": 104973, "epoch": 1264} {"train_loss": -22.1693115234375, "global_step": 104974, "epoch": 1264} {"train_loss": -22.26513671875, "global_step": 104975, "epoch": 1264} {"train_loss": -22.263553619384766, "global_step": 104976, "epoch": 1264} {"train_loss": -22.31694793701172, "global_step": 104977, "epoch": 1264} {"train_loss": -22.23711585998535, "global_step": 104978, "epoch": 1264} {"train_loss": -22.21278953552246, "global_step": 104979, "epoch": 1264} {"train_loss": -22.05055809020996, "global_step": 104980, "epoch": 1264} {"train_loss": -22.143362045288086, "global_step": 104981, "epoch": 1264} {"train_loss": -21.837244033813477, "global_step": 104982, "epoch": 1264} {"train_loss": -22.289005279541016, "global_step": 104983, "epoch": 1264} {"train_loss": -21.6975040435791, "global_step": 104984, "epoch": 1264} {"train_loss": -22.135602951049805, "global_step": 104985, "epoch": 1264} {"train_loss": -22.41020393371582, "global_step": 104986, "epoch": 1264} {"train_loss": -21.984830856323242, "global_step": 104987, "epoch": 1264} {"train_loss": -21.933053970336914, "global_step": 104988, "epoch": 1264} {"train_loss": -21.906530380249023, "global_step": 104989, "epoch": 1264} {"train_loss": -22.44011878967285, "global_step": 104990, "epoch": 1264} {"train_loss": -22.133527755737305, "global_step": 104991, "epoch": 1264} {"train_loss": -21.92644691467285, "global_step": 104992, "epoch": 1264} {"train_loss": -22.184200286865234, "global_step": 104993, "epoch": 1264} {"train_loss": -22.01111568313047, "global_step": 104994, "epoch": 1264, "val_loss": 6011363.0} {"train_loss": -21.749191284179688, "global_step": 104995, "epoch": 1265} {"train_loss": -20.94245147705078, "global_step": 104996, "epoch": 1265} {"train_loss": -21.597686767578125, "global_step": 104997, "epoch": 1265} {"train_loss": -20.42732810974121, "global_step": 104998, "epoch": 1265} {"train_loss": -21.139699935913086, "global_step": 104999, "epoch": 1265} {"train_loss": -21.948209762573242, "global_step": 105000, "epoch": 1265} {"train_loss": -21.10419273376465, "global_step": 105001, "epoch": 1265} {"train_loss": -21.738107681274414, "global_step": 105002, "epoch": 1265} {"train_loss": -21.43233299255371, "global_step": 105003, "epoch": 1265} {"train_loss": -21.35767936706543, "global_step": 105004, "epoch": 1265} {"train_loss": -21.604116439819336, "global_step": 105005, "epoch": 1265} {"train_loss": -21.677227020263672, "global_step": 105006, "epoch": 1265} {"train_loss": -21.781238555908203, "global_step": 105007, "epoch": 1265} {"train_loss": -22.04095458984375, "global_step": 105008, "epoch": 1265} {"train_loss": -21.537250518798828, "global_step": 105009, "epoch": 1265} {"train_loss": -21.665494918823242, "global_step": 105010, "epoch": 1265} {"train_loss": -21.47027015686035, "global_step": 105011, "epoch": 1265} {"train_loss": -21.75611686706543, "global_step": 105012, "epoch": 1265} {"train_loss": -21.725210189819336, "global_step": 105013, "epoch": 1265} {"train_loss": -21.871671676635742, "global_step": 105014, "epoch": 1265} {"train_loss": -21.831167221069336, "global_step": 105015, "epoch": 1265} {"train_loss": -21.840301513671875, "global_step": 105016, "epoch": 1265} {"train_loss": -22.109119415283203, "global_step": 105017, "epoch": 1265} {"train_loss": -21.974355697631836, "global_step": 105018, "epoch": 1265} {"train_loss": -21.868408203125, "global_step": 105019, "epoch": 1265} {"train_loss": -21.93550682067871, "global_step": 105020, "epoch": 1265} {"train_loss": -22.046499252319336, "global_step": 105021, "epoch": 1265} {"train_loss": -22.031118392944336, "global_step": 105022, "epoch": 1265} {"train_loss": -21.944021224975586, "global_step": 105023, "epoch": 1265} {"train_loss": -22.4312686920166, "global_step": 105024, "epoch": 1265} {"train_loss": -22.431882858276367, "global_step": 105025, "epoch": 1265} {"train_loss": -22.250732421875, "global_step": 105026, "epoch": 1265} {"train_loss": -22.10445213317871, "global_step": 105027, "epoch": 1265} {"train_loss": -22.323232650756836, "global_step": 105028, "epoch": 1265} {"train_loss": -21.999197006225586, "global_step": 105029, "epoch": 1265} {"train_loss": -21.995471954345703, "global_step": 105030, "epoch": 1265} {"train_loss": -22.12285614013672, "global_step": 105031, "epoch": 1265} {"train_loss": -22.008468627929688, "global_step": 105032, "epoch": 1265} {"train_loss": -22.075971603393555, "global_step": 105033, "epoch": 1265} {"train_loss": -22.4158935546875, "global_step": 105034, "epoch": 1265} {"train_loss": -21.749996185302734, "global_step": 105035, "epoch": 1265} {"train_loss": -22.488235473632812, "global_step": 105036, "epoch": 1265} {"train_loss": -22.18617820739746, "global_step": 105037, "epoch": 1265} {"train_loss": -22.15113639831543, "global_step": 105038, "epoch": 1265} {"train_loss": -21.798521041870117, "global_step": 105039, "epoch": 1265} {"train_loss": -22.14994239807129, "global_step": 105040, "epoch": 1265} {"train_loss": -22.175405502319336, "global_step": 105041, "epoch": 1265} {"train_loss": -22.528593063354492, "global_step": 105042, "epoch": 1265} {"train_loss": -22.2202091217041, "global_step": 105043, "epoch": 1265} {"train_loss": -21.899494171142578, "global_step": 105044, "epoch": 1265} {"train_loss": -22.218856811523438, "global_step": 105045, "epoch": 1265} {"train_loss": -22.341026306152344, "global_step": 105046, "epoch": 1265} {"train_loss": -22.074522018432617, "global_step": 105047, "epoch": 1265} {"train_loss": -21.81744956970215, "global_step": 105048, "epoch": 1265} {"train_loss": -22.267393112182617, "global_step": 105049, "epoch": 1265} {"train_loss": -22.082286834716797, "global_step": 105050, "epoch": 1265} {"train_loss": -22.021223068237305, "global_step": 105051, "epoch": 1265} {"train_loss": -22.47446060180664, "global_step": 105052, "epoch": 1265} {"train_loss": -21.92137908935547, "global_step": 105053, "epoch": 1265} {"train_loss": -22.24220848083496, "global_step": 105054, "epoch": 1265} {"train_loss": -22.1589298248291, "global_step": 105055, "epoch": 1265} {"train_loss": -21.804580688476562, "global_step": 105056, "epoch": 1265} {"train_loss": -22.004772186279297, "global_step": 105057, "epoch": 1265} {"train_loss": -22.272754669189453, "global_step": 105058, "epoch": 1265} {"train_loss": -22.52016830444336, "global_step": 105059, "epoch": 1265} {"train_loss": -22.402578353881836, "global_step": 105060, "epoch": 1265} {"train_loss": -22.000137329101562, "global_step": 105061, "epoch": 1265} {"train_loss": -21.898006439208984, "global_step": 105062, "epoch": 1265} {"train_loss": -22.14735221862793, "global_step": 105063, "epoch": 1265} {"train_loss": -22.127532958984375, "global_step": 105064, "epoch": 1265} {"train_loss": -22.06351661682129, "global_step": 105065, "epoch": 1265} {"train_loss": -21.861858367919922, "global_step": 105066, "epoch": 1265} {"train_loss": -21.92096519470215, "global_step": 105067, "epoch": 1265} {"train_loss": -22.144250869750977, "global_step": 105068, "epoch": 1265} {"train_loss": -22.172998428344727, "global_step": 105069, "epoch": 1265} {"train_loss": -21.587514877319336, "global_step": 105070, "epoch": 1265} {"train_loss": -22.111581802368164, "global_step": 105071, "epoch": 1265} {"train_loss": -22.10769271850586, "global_step": 105072, "epoch": 1265} {"train_loss": -21.989553451538086, "global_step": 105073, "epoch": 1265} {"train_loss": -22.062726974487305, "global_step": 105074, "epoch": 1265} {"train_loss": -22.093297958374023, "global_step": 105075, "epoch": 1265} {"train_loss": -22.042097091674805, "global_step": 105076, "epoch": 1265} {"train_loss": -21.97781151461314, "global_step": 105077, "epoch": 1265, "val_loss": 6175349.0} {"train_loss": -21.0731258392334, "global_step": 105078, "epoch": 1266} {"train_loss": -21.64768409729004, "global_step": 105079, "epoch": 1266} {"train_loss": -21.3941707611084, "global_step": 105080, "epoch": 1266} {"train_loss": -21.550695419311523, "global_step": 105081, "epoch": 1266} {"train_loss": -22.074970245361328, "global_step": 105082, "epoch": 1266} {"train_loss": -21.76513671875, "global_step": 105083, "epoch": 1266} {"train_loss": -21.660381317138672, "global_step": 105084, "epoch": 1266} {"train_loss": -21.944185256958008, "global_step": 105085, "epoch": 1266} {"train_loss": -21.42282485961914, "global_step": 105086, "epoch": 1266} {"train_loss": -21.83659553527832, "global_step": 105087, "epoch": 1266} {"train_loss": -21.805334091186523, "global_step": 105088, "epoch": 1266} {"train_loss": -21.82167625427246, "global_step": 105089, "epoch": 1266} {"train_loss": -21.884660720825195, "global_step": 105090, "epoch": 1266} {"train_loss": -22.0504093170166, "global_step": 105091, "epoch": 1266} {"train_loss": -22.1863956451416, "global_step": 105092, "epoch": 1266} {"train_loss": -22.027084350585938, "global_step": 105093, "epoch": 1266} {"train_loss": -21.9061336517334, "global_step": 105094, "epoch": 1266} {"train_loss": -21.83028793334961, "global_step": 105095, "epoch": 1266} {"train_loss": -21.802783966064453, "global_step": 105096, "epoch": 1266} {"train_loss": -22.0313777923584, "global_step": 105097, "epoch": 1266} {"train_loss": -21.764057159423828, "global_step": 105098, "epoch": 1266} {"train_loss": -22.085111618041992, "global_step": 105099, "epoch": 1266} {"train_loss": -22.21343994140625, "global_step": 105100, "epoch": 1266} {"train_loss": -22.021329879760742, "global_step": 105101, "epoch": 1266} {"train_loss": -22.022672653198242, "global_step": 105102, "epoch": 1266} {"train_loss": -21.915700912475586, "global_step": 105103, "epoch": 1266} {"train_loss": -22.132266998291016, "global_step": 105104, "epoch": 1266} {"train_loss": -21.89552116394043, "global_step": 105105, "epoch": 1266} {"train_loss": -21.995115280151367, "global_step": 105106, "epoch": 1266} {"train_loss": -22.256546020507812, "global_step": 105107, "epoch": 1266} {"train_loss": -22.045801162719727, "global_step": 105108, "epoch": 1266} {"train_loss": -21.841060638427734, "global_step": 105109, "epoch": 1266} {"train_loss": -22.11932373046875, "global_step": 105110, "epoch": 1266} {"train_loss": -21.98828125, "global_step": 105111, "epoch": 1266} {"train_loss": -21.95086097717285, "global_step": 105112, "epoch": 1266} {"train_loss": -21.94630241394043, "global_step": 105113, "epoch": 1266} {"train_loss": -21.9129581451416, "global_step": 105114, "epoch": 1266} {"train_loss": -22.201154708862305, "global_step": 105115, "epoch": 1266} {"train_loss": -22.078266143798828, "global_step": 105116, "epoch": 1266} {"train_loss": -22.296890258789062, "global_step": 105117, "epoch": 1266} {"train_loss": -22.080488204956055, "global_step": 105118, "epoch": 1266} {"train_loss": -22.261022567749023, "global_step": 105119, "epoch": 1266} {"train_loss": -22.024703979492188, "global_step": 105120, "epoch": 1266} {"train_loss": -22.24562644958496, "global_step": 105121, "epoch": 1266} {"train_loss": -22.20022964477539, "global_step": 105122, "epoch": 1266} {"train_loss": -22.28866958618164, "global_step": 105123, "epoch": 1266} {"train_loss": -22.402090072631836, "global_step": 105124, "epoch": 1266} {"train_loss": -21.97001838684082, "global_step": 105125, "epoch": 1266} {"train_loss": -21.983152389526367, "global_step": 105126, "epoch": 1266} {"train_loss": -21.900564193725586, "global_step": 105127, "epoch": 1266} {"train_loss": -22.273130416870117, "global_step": 105128, "epoch": 1266} {"train_loss": -22.03870391845703, "global_step": 105129, "epoch": 1266} {"train_loss": -21.91908836364746, "global_step": 105130, "epoch": 1266} {"train_loss": -21.56669044494629, "global_step": 105131, "epoch": 1266} {"train_loss": -21.991682052612305, "global_step": 105132, "epoch": 1266} {"train_loss": -21.518762588500977, "global_step": 105133, "epoch": 1266} {"train_loss": -21.75362205505371, "global_step": 105134, "epoch": 1266} {"train_loss": -22.061115264892578, "global_step": 105135, "epoch": 1266} {"train_loss": -21.616924285888672, "global_step": 105136, "epoch": 1266} {"train_loss": -22.170156478881836, "global_step": 105137, "epoch": 1266} {"train_loss": -21.872854232788086, "global_step": 105138, "epoch": 1266} {"train_loss": -22.095563888549805, "global_step": 105139, "epoch": 1266} {"train_loss": -21.998239517211914, "global_step": 105140, "epoch": 1266} {"train_loss": -22.106338500976562, "global_step": 105141, "epoch": 1266} {"train_loss": -22.141454696655273, "global_step": 105142, "epoch": 1266} {"train_loss": -21.933317184448242, "global_step": 105143, "epoch": 1266} {"train_loss": -22.2629451751709, "global_step": 105144, "epoch": 1266} {"train_loss": -22.225040435791016, "global_step": 105145, "epoch": 1266} {"train_loss": -21.768001556396484, "global_step": 105146, "epoch": 1266} {"train_loss": -21.92643928527832, "global_step": 105147, "epoch": 1266} {"train_loss": -21.84368133544922, "global_step": 105148, "epoch": 1266} {"train_loss": -22.103893280029297, "global_step": 105149, "epoch": 1266} {"train_loss": -21.64644432067871, "global_step": 105150, "epoch": 1266} {"train_loss": -22.173311233520508, "global_step": 105151, "epoch": 1266} {"train_loss": -22.198190689086914, "global_step": 105152, "epoch": 1266} {"train_loss": -22.0139102935791, "global_step": 105153, "epoch": 1266} {"train_loss": -21.789461135864258, "global_step": 105154, "epoch": 1266} {"train_loss": -21.752897262573242, "global_step": 105155, "epoch": 1266} {"train_loss": -21.888395309448242, "global_step": 105156, "epoch": 1266} {"train_loss": -21.705698013305664, "global_step": 105157, "epoch": 1266} {"train_loss": -22.179656982421875, "global_step": 105158, "epoch": 1266} {"train_loss": -22.210830688476562, "global_step": 105159, "epoch": 1266} {"train_loss": -21.97456210492605, "global_step": 105160, "epoch": 1266, "val_loss": 6196825.0} {"train_loss": -21.525442123413086, "global_step": 105161, "epoch": 1267} {"train_loss": -22.00642204284668, "global_step": 105162, "epoch": 1267} {"train_loss": -21.57450294494629, "global_step": 105163, "epoch": 1267} {"train_loss": -21.605161666870117, "global_step": 105164, "epoch": 1267} {"train_loss": -21.64166831970215, "global_step": 105165, "epoch": 1267} {"train_loss": -21.676807403564453, "global_step": 105166, "epoch": 1267} {"train_loss": -22.005996704101562, "global_step": 105167, "epoch": 1267} {"train_loss": -21.750877380371094, "global_step": 105168, "epoch": 1267} {"train_loss": -21.1981258392334, "global_step": 105169, "epoch": 1267} {"train_loss": -21.952804565429688, "global_step": 105170, "epoch": 1267} {"train_loss": -22.256742477416992, "global_step": 105171, "epoch": 1267} {"train_loss": -21.81813621520996, "global_step": 105172, "epoch": 1267} {"train_loss": -22.150386810302734, "global_step": 105173, "epoch": 1267} {"train_loss": -21.992002487182617, "global_step": 105174, "epoch": 1267} {"train_loss": -21.700883865356445, "global_step": 105175, "epoch": 1267} {"train_loss": -21.659870147705078, "global_step": 105176, "epoch": 1267} {"train_loss": -21.88237953186035, "global_step": 105177, "epoch": 1267} {"train_loss": -22.067075729370117, "global_step": 105178, "epoch": 1267} {"train_loss": -22.197620391845703, "global_step": 105179, "epoch": 1267} {"train_loss": -22.236013412475586, "global_step": 105180, "epoch": 1267} {"train_loss": -22.067602157592773, "global_step": 105181, "epoch": 1267} {"train_loss": -22.257282257080078, "global_step": 105182, "epoch": 1267} {"train_loss": -22.34901237487793, "global_step": 105183, "epoch": 1267} {"train_loss": -21.774213790893555, "global_step": 105184, "epoch": 1267} {"train_loss": -22.082639694213867, "global_step": 105185, "epoch": 1267} {"train_loss": -21.76838493347168, "global_step": 105186, "epoch": 1267} {"train_loss": -22.421396255493164, "global_step": 105187, "epoch": 1267} {"train_loss": -22.01185417175293, "global_step": 105188, "epoch": 1267} {"train_loss": -22.041053771972656, "global_step": 105189, "epoch": 1267} {"train_loss": -22.012033462524414, "global_step": 105190, "epoch": 1267} {"train_loss": -22.29896354675293, "global_step": 105191, "epoch": 1267} {"train_loss": -22.366558074951172, "global_step": 105192, "epoch": 1267} {"train_loss": -22.11785125732422, "global_step": 105193, "epoch": 1267} {"train_loss": -22.21010398864746, "global_step": 105194, "epoch": 1267} {"train_loss": -22.211017608642578, "global_step": 105195, "epoch": 1267} {"train_loss": -21.862747192382812, "global_step": 105196, "epoch": 1267} {"train_loss": -22.095489501953125, "global_step": 105197, "epoch": 1267} {"train_loss": -21.812183380126953, "global_step": 105198, "epoch": 1267} {"train_loss": -22.307077407836914, "global_step": 105199, "epoch": 1267} {"train_loss": -22.213647842407227, "global_step": 105200, "epoch": 1267} {"train_loss": -22.253551483154297, "global_step": 105201, "epoch": 1267} {"train_loss": -22.0493221282959, "global_step": 105202, "epoch": 1267} {"train_loss": -22.55455207824707, "global_step": 105203, "epoch": 1267} {"train_loss": -22.482709884643555, "global_step": 105204, "epoch": 1267} {"train_loss": -21.98210906982422, "global_step": 105205, "epoch": 1267} {"train_loss": -21.902236938476562, "global_step": 105206, "epoch": 1267} {"train_loss": -21.959575653076172, "global_step": 105207, "epoch": 1267} {"train_loss": -21.81144905090332, "global_step": 105208, "epoch": 1267} {"train_loss": -22.306013107299805, "global_step": 105209, "epoch": 1267} {"train_loss": -22.126867294311523, "global_step": 105210, "epoch": 1267} {"train_loss": -21.850168228149414, "global_step": 105211, "epoch": 1267} {"train_loss": -22.249792098999023, "global_step": 105212, "epoch": 1267} {"train_loss": -22.199399948120117, "global_step": 105213, "epoch": 1267} {"train_loss": -22.347896575927734, "global_step": 105214, "epoch": 1267} {"train_loss": -22.03484344482422, "global_step": 105215, "epoch": 1267} {"train_loss": -22.446115493774414, "global_step": 105216, "epoch": 1267} {"train_loss": -22.15164566040039, "global_step": 105217, "epoch": 1267} {"train_loss": -22.375701904296875, "global_step": 105218, "epoch": 1267} {"train_loss": -22.15180778503418, "global_step": 105219, "epoch": 1267} {"train_loss": -21.91653060913086, "global_step": 105220, "epoch": 1267} {"train_loss": -21.877212524414062, "global_step": 105221, "epoch": 1267} {"train_loss": -22.023653030395508, "global_step": 105222, "epoch": 1267} {"train_loss": -22.291301727294922, "global_step": 105223, "epoch": 1267} {"train_loss": -22.04606056213379, "global_step": 105224, "epoch": 1267} {"train_loss": -22.03594970703125, "global_step": 105225, "epoch": 1267} {"train_loss": -22.3056583404541, "global_step": 105226, "epoch": 1267} {"train_loss": -21.82561683654785, "global_step": 105227, "epoch": 1267} {"train_loss": -22.301132202148438, "global_step": 105228, "epoch": 1267} {"train_loss": -21.961292266845703, "global_step": 105229, "epoch": 1267} {"train_loss": -21.961240768432617, "global_step": 105230, "epoch": 1267} {"train_loss": -22.2636775970459, "global_step": 105231, "epoch": 1267} {"train_loss": -22.246728897094727, "global_step": 105232, "epoch": 1267} {"train_loss": -22.066511154174805, "global_step": 105233, "epoch": 1267} {"train_loss": -22.074018478393555, "global_step": 105234, "epoch": 1267} {"train_loss": -22.253931045532227, "global_step": 105235, "epoch": 1267} {"train_loss": -21.95589256286621, "global_step": 105236, "epoch": 1267} {"train_loss": -21.656957626342773, "global_step": 105237, "epoch": 1267} {"train_loss": -22.029064178466797, "global_step": 105238, "epoch": 1267} {"train_loss": -22.23103141784668, "global_step": 105239, "epoch": 1267} {"train_loss": -22.10845375061035, "global_step": 105240, "epoch": 1267} {"train_loss": -21.687593460083008, "global_step": 105241, "epoch": 1267} {"train_loss": -22.054786682128906, "global_step": 105242, "epoch": 1267} {"train_loss": -22.051275643957666, "global_step": 105243, "epoch": 1267, "val_loss": 6125486.0} {"train_loss": -21.651508331298828, "global_step": 105244, "epoch": 1268} {"train_loss": -21.301151275634766, "global_step": 105245, "epoch": 1268} {"train_loss": -21.54732894897461, "global_step": 105246, "epoch": 1268} {"train_loss": -21.38720703125, "global_step": 105247, "epoch": 1268} {"train_loss": -21.341922760009766, "global_step": 105248, "epoch": 1268} {"train_loss": -21.632892608642578, "global_step": 105249, "epoch": 1268} {"train_loss": -22.014606475830078, "global_step": 105250, "epoch": 1268} {"train_loss": -21.782766342163086, "global_step": 105251, "epoch": 1268} {"train_loss": -21.927650451660156, "global_step": 105252, "epoch": 1268} {"train_loss": -21.580785751342773, "global_step": 105253, "epoch": 1268} {"train_loss": -21.76865005493164, "global_step": 105254, "epoch": 1268} {"train_loss": -22.027002334594727, "global_step": 105255, "epoch": 1268} {"train_loss": -21.749067306518555, "global_step": 105256, "epoch": 1268} {"train_loss": -21.72463607788086, "global_step": 105257, "epoch": 1268} {"train_loss": -22.005918502807617, "global_step": 105258, "epoch": 1268} {"train_loss": -21.98832130432129, "global_step": 105259, "epoch": 1268} {"train_loss": -21.807844161987305, "global_step": 105260, "epoch": 1268} {"train_loss": -22.066509246826172, "global_step": 105261, "epoch": 1268} {"train_loss": -21.64021873474121, "global_step": 105262, "epoch": 1268} {"train_loss": -22.110136032104492, "global_step": 105263, "epoch": 1268} {"train_loss": -22.157827377319336, "global_step": 105264, "epoch": 1268} {"train_loss": -22.03464126586914, "global_step": 105265, "epoch": 1268} {"train_loss": -22.34976577758789, "global_step": 105266, "epoch": 1268} {"train_loss": -22.06293487548828, "global_step": 105267, "epoch": 1268} {"train_loss": -22.22113037109375, "global_step": 105268, "epoch": 1268} {"train_loss": -21.932682037353516, "global_step": 105269, "epoch": 1268} {"train_loss": -22.184171676635742, "global_step": 105270, "epoch": 1268} {"train_loss": -21.983234405517578, "global_step": 105271, "epoch": 1268} {"train_loss": -22.064855575561523, "global_step": 105272, "epoch": 1268} {"train_loss": -21.501604080200195, "global_step": 105273, "epoch": 1268} {"train_loss": -22.236818313598633, "global_step": 105274, "epoch": 1268} {"train_loss": -22.062177658081055, "global_step": 105275, "epoch": 1268} {"train_loss": -21.930627822875977, "global_step": 105276, "epoch": 1268} {"train_loss": -22.1932373046875, "global_step": 105277, "epoch": 1268} {"train_loss": -22.329092025756836, "global_step": 105278, "epoch": 1268} {"train_loss": -22.057729721069336, "global_step": 105279, "epoch": 1268} {"train_loss": -22.302444458007812, "global_step": 105280, "epoch": 1268} {"train_loss": -22.29718780517578, "global_step": 105281, "epoch": 1268} {"train_loss": -21.757104873657227, "global_step": 105282, "epoch": 1268} {"train_loss": -22.40848731994629, "global_step": 105283, "epoch": 1268} {"train_loss": -22.271570205688477, "global_step": 105284, "epoch": 1268} {"train_loss": -22.155292510986328, "global_step": 105285, "epoch": 1268} {"train_loss": -22.31696891784668, "global_step": 105286, "epoch": 1268} {"train_loss": -22.32558250427246, "global_step": 105287, "epoch": 1268} {"train_loss": -21.79486656188965, "global_step": 105288, "epoch": 1268} {"train_loss": -22.009769439697266, "global_step": 105289, "epoch": 1268} {"train_loss": -22.237232208251953, "global_step": 105290, "epoch": 1268} {"train_loss": -22.288551330566406, "global_step": 105291, "epoch": 1268} {"train_loss": -22.582962036132812, "global_step": 105292, "epoch": 1268} {"train_loss": -22.07086753845215, "global_step": 105293, "epoch": 1268} {"train_loss": -21.500844955444336, "global_step": 105294, "epoch": 1268} {"train_loss": -22.405963897705078, "global_step": 105295, "epoch": 1268} {"train_loss": -22.602874755859375, "global_step": 105296, "epoch": 1268} {"train_loss": -22.263042449951172, "global_step": 105297, "epoch": 1268} {"train_loss": -22.41727066040039, "global_step": 105298, "epoch": 1268} {"train_loss": -22.297916412353516, "global_step": 105299, "epoch": 1268} {"train_loss": -21.967790603637695, "global_step": 105300, "epoch": 1268} {"train_loss": -22.015417098999023, "global_step": 105301, "epoch": 1268} {"train_loss": -22.059736251831055, "global_step": 105302, "epoch": 1268} {"train_loss": -22.065837860107422, "global_step": 105303, "epoch": 1268} {"train_loss": -22.0621280670166, "global_step": 105304, "epoch": 1268} {"train_loss": -22.43978500366211, "global_step": 105305, "epoch": 1268} {"train_loss": -22.374235153198242, "global_step": 105306, "epoch": 1268} {"train_loss": -22.068883895874023, "global_step": 105307, "epoch": 1268} {"train_loss": -22.240407943725586, "global_step": 105308, "epoch": 1268} {"train_loss": -22.44717788696289, "global_step": 105309, "epoch": 1268} {"train_loss": -22.196979522705078, "global_step": 105310, "epoch": 1268} {"train_loss": -21.810880661010742, "global_step": 105311, "epoch": 1268} {"train_loss": -22.126474380493164, "global_step": 105312, "epoch": 1268} {"train_loss": -22.21717643737793, "global_step": 105313, "epoch": 1268} {"train_loss": -22.199209213256836, "global_step": 105314, "epoch": 1268} {"train_loss": -21.68834114074707, "global_step": 105315, "epoch": 1268} {"train_loss": -21.830320358276367, "global_step": 105316, "epoch": 1268} {"train_loss": -21.98774528503418, "global_step": 105317, "epoch": 1268} {"train_loss": -22.076568603515625, "global_step": 105318, "epoch": 1268} {"train_loss": -21.82769012451172, "global_step": 105319, "epoch": 1268} {"train_loss": -22.30495262145996, "global_step": 105320, "epoch": 1268} {"train_loss": -21.841262817382812, "global_step": 105321, "epoch": 1268} {"train_loss": -21.52545166015625, "global_step": 105322, "epoch": 1268} {"train_loss": -21.901329040527344, "global_step": 105323, "epoch": 1268} {"train_loss": -21.85468292236328, "global_step": 105324, "epoch": 1268} {"train_loss": -21.794876098632812, "global_step": 105325, "epoch": 1268} {"train_loss": -22.022229803613868, "global_step": 105326, "epoch": 1268, "val_loss": 6120164.0} {"train_loss": -21.117515563964844, "global_step": 105327, "epoch": 1269} {"train_loss": -21.713159561157227, "global_step": 105328, "epoch": 1269} {"train_loss": -21.49759864807129, "global_step": 105329, "epoch": 1269} {"train_loss": -21.624662399291992, "global_step": 105330, "epoch": 1269} {"train_loss": -21.347925186157227, "global_step": 105331, "epoch": 1269} {"train_loss": -21.930648803710938, "global_step": 105332, "epoch": 1269} {"train_loss": -21.526357650756836, "global_step": 105333, "epoch": 1269} {"train_loss": -21.959903717041016, "global_step": 105334, "epoch": 1269} {"train_loss": -21.978172302246094, "global_step": 105335, "epoch": 1269} {"train_loss": -21.867599487304688, "global_step": 105336, "epoch": 1269} {"train_loss": -22.0093936920166, "global_step": 105337, "epoch": 1269} {"train_loss": -21.778675079345703, "global_step": 105338, "epoch": 1269} {"train_loss": -21.766769409179688, "global_step": 105339, "epoch": 1269} {"train_loss": -22.156614303588867, "global_step": 105340, "epoch": 1269} {"train_loss": -21.664037704467773, "global_step": 105341, "epoch": 1269} {"train_loss": -21.719802856445312, "global_step": 105342, "epoch": 1269} {"train_loss": -22.160717010498047, "global_step": 105343, "epoch": 1269} {"train_loss": -22.029088973999023, "global_step": 105344, "epoch": 1269} {"train_loss": -22.168418884277344, "global_step": 105345, "epoch": 1269} {"train_loss": -22.40787696838379, "global_step": 105346, "epoch": 1269} {"train_loss": -22.093467712402344, "global_step": 105347, "epoch": 1269} {"train_loss": -21.986692428588867, "global_step": 105348, "epoch": 1269} {"train_loss": -22.2348690032959, "global_step": 105349, "epoch": 1269} {"train_loss": -22.04990005493164, "global_step": 105350, "epoch": 1269} {"train_loss": -22.216224670410156, "global_step": 105351, "epoch": 1269} {"train_loss": -21.849868774414062, "global_step": 105352, "epoch": 1269} {"train_loss": -21.85024070739746, "global_step": 105353, "epoch": 1269} {"train_loss": -22.17023277282715, "global_step": 105354, "epoch": 1269} {"train_loss": -22.110443115234375, "global_step": 105355, "epoch": 1269} {"train_loss": -22.333921432495117, "global_step": 105356, "epoch": 1269} {"train_loss": -22.07435417175293, "global_step": 105357, "epoch": 1269} {"train_loss": -22.16571044921875, "global_step": 105358, "epoch": 1269} {"train_loss": -22.458005905151367, "global_step": 105359, "epoch": 1269} {"train_loss": -21.818910598754883, "global_step": 105360, "epoch": 1269} {"train_loss": -22.1368408203125, "global_step": 105361, "epoch": 1269} {"train_loss": -22.123641967773438, "global_step": 105362, "epoch": 1269} {"train_loss": -22.032052993774414, "global_step": 105363, "epoch": 1269} {"train_loss": -22.119840621948242, "global_step": 105364, "epoch": 1269} {"train_loss": -21.96687889099121, "global_step": 105365, "epoch": 1269} {"train_loss": -22.036422729492188, "global_step": 105366, "epoch": 1269} {"train_loss": -22.535694122314453, "global_step": 105367, "epoch": 1269} {"train_loss": -22.443204879760742, "global_step": 105368, "epoch": 1269} {"train_loss": -22.264074325561523, "global_step": 105369, "epoch": 1269} {"train_loss": -21.998727798461914, "global_step": 105370, "epoch": 1269} {"train_loss": -22.08847427368164, "global_step": 105371, "epoch": 1269} {"train_loss": -22.16720962524414, "global_step": 105372, "epoch": 1269} {"train_loss": -22.5495662689209, "global_step": 105373, "epoch": 1269} {"train_loss": -22.135446548461914, "global_step": 105374, "epoch": 1269} {"train_loss": -22.22853660583496, "global_step": 105375, "epoch": 1269} {"train_loss": -21.71854019165039, "global_step": 105376, "epoch": 1269} {"train_loss": -22.079212188720703, "global_step": 105377, "epoch": 1269} {"train_loss": -22.054946899414062, "global_step": 105378, "epoch": 1269} {"train_loss": -21.9658145904541, "global_step": 105379, "epoch": 1269} {"train_loss": -22.23300552368164, "global_step": 105380, "epoch": 1269} {"train_loss": -22.25820541381836, "global_step": 105381, "epoch": 1269} {"train_loss": -22.21847152709961, "global_step": 105382, "epoch": 1269} {"train_loss": -21.695011138916016, "global_step": 105383, "epoch": 1269} {"train_loss": -21.864702224731445, "global_step": 105384, "epoch": 1269} {"train_loss": -22.297605514526367, "global_step": 105385, "epoch": 1269} {"train_loss": -22.023391723632812, "global_step": 105386, "epoch": 1269} {"train_loss": -22.040868759155273, "global_step": 105387, "epoch": 1269} {"train_loss": -21.779151916503906, "global_step": 105388, "epoch": 1269} {"train_loss": -22.028966903686523, "global_step": 105389, "epoch": 1269} {"train_loss": -22.110044479370117, "global_step": 105390, "epoch": 1269} {"train_loss": -22.48381805419922, "global_step": 105391, "epoch": 1269} {"train_loss": -21.874114990234375, "global_step": 105392, "epoch": 1269} {"train_loss": -22.040454864501953, "global_step": 105393, "epoch": 1269} {"train_loss": -22.279333114624023, "global_step": 105394, "epoch": 1269} {"train_loss": -21.9887752532959, "global_step": 105395, "epoch": 1269} {"train_loss": -22.199512481689453, "global_step": 105396, "epoch": 1269} {"train_loss": -22.069326400756836, "global_step": 105397, "epoch": 1269} {"train_loss": -22.166624069213867, "global_step": 105398, "epoch": 1269} {"train_loss": -22.062332153320312, "global_step": 105399, "epoch": 1269} {"train_loss": -22.1621150970459, "global_step": 105400, "epoch": 1269} {"train_loss": -21.93499755859375, "global_step": 105401, "epoch": 1269} {"train_loss": -22.13224220275879, "global_step": 105402, "epoch": 1269} {"train_loss": -22.0756778717041, "global_step": 105403, "epoch": 1269} {"train_loss": -21.826507568359375, "global_step": 105404, "epoch": 1269} {"train_loss": -22.126834869384766, "global_step": 105405, "epoch": 1269} {"train_loss": -22.052658081054688, "global_step": 105406, "epoch": 1269} {"train_loss": -22.3162784576416, "global_step": 105407, "epoch": 1269} {"train_loss": -22.095518112182617, "global_step": 105408, "epoch": 1269} {"train_loss": -22.0166090080537, "global_step": 105409, "epoch": 1269, "val_loss": 6137696.5} {"train_loss": -22.325088500976562, "global_step": 105410, "epoch": 1270} {"train_loss": -21.73459243774414, "global_step": 105411, "epoch": 1270} {"train_loss": -21.948209762573242, "global_step": 105412, "epoch": 1270} {"train_loss": -21.95792007446289, "global_step": 105413, "epoch": 1270} {"train_loss": -22.250219345092773, "global_step": 105414, "epoch": 1270} {"train_loss": -21.71498680114746, "global_step": 105415, "epoch": 1270} {"train_loss": -21.958303451538086, "global_step": 105416, "epoch": 1270} {"train_loss": -22.194055557250977, "global_step": 105417, "epoch": 1270} {"train_loss": -21.581090927124023, "global_step": 105418, "epoch": 1270} {"train_loss": -21.87054443359375, "global_step": 105419, "epoch": 1270} {"train_loss": -21.55927848815918, "global_step": 105420, "epoch": 1270} {"train_loss": -21.978729248046875, "global_step": 105421, "epoch": 1270} {"train_loss": -21.68903350830078, "global_step": 105422, "epoch": 1270} {"train_loss": -22.223373413085938, "global_step": 105423, "epoch": 1270} {"train_loss": -21.70879554748535, "global_step": 105424, "epoch": 1270} {"train_loss": -21.89293670654297, "global_step": 105425, "epoch": 1270} {"train_loss": -21.957345962524414, "global_step": 105426, "epoch": 1270} {"train_loss": -22.16788673400879, "global_step": 105427, "epoch": 1270} {"train_loss": -21.692459106445312, "global_step": 105428, "epoch": 1270} {"train_loss": -21.92171287536621, "global_step": 105429, "epoch": 1270} {"train_loss": -22.303964614868164, "global_step": 105430, "epoch": 1270} {"train_loss": -22.047807693481445, "global_step": 105431, "epoch": 1270} {"train_loss": -21.836349487304688, "global_step": 105432, "epoch": 1270} {"train_loss": -21.92193031311035, "global_step": 105433, "epoch": 1270} {"train_loss": -22.077072143554688, "global_step": 105434, "epoch": 1270} {"train_loss": -22.048730850219727, "global_step": 105435, "epoch": 1270} {"train_loss": -22.045658111572266, "global_step": 105436, "epoch": 1270} {"train_loss": -22.192901611328125, "global_step": 105437, "epoch": 1270} {"train_loss": -22.145971298217773, "global_step": 105438, "epoch": 1270} {"train_loss": -21.946842193603516, "global_step": 105439, "epoch": 1270} {"train_loss": -22.382633209228516, "global_step": 105440, "epoch": 1270} {"train_loss": -22.196985244750977, "global_step": 105441, "epoch": 1270} {"train_loss": -22.2033748626709, "global_step": 105442, "epoch": 1270} {"train_loss": -22.288881301879883, "global_step": 105443, "epoch": 1270} {"train_loss": -21.815216064453125, "global_step": 105444, "epoch": 1270} {"train_loss": -22.115272521972656, "global_step": 105445, "epoch": 1270} {"train_loss": -22.19231605529785, "global_step": 105446, "epoch": 1270} {"train_loss": -22.41255760192871, "global_step": 105447, "epoch": 1270} {"train_loss": -21.864538192749023, "global_step": 105448, "epoch": 1270} {"train_loss": -22.027984619140625, "global_step": 105449, "epoch": 1270} {"train_loss": -22.166318893432617, "global_step": 105450, "epoch": 1270} {"train_loss": -22.171337127685547, "global_step": 105451, "epoch": 1270} {"train_loss": -22.232553482055664, "global_step": 105452, "epoch": 1270} {"train_loss": -22.147022247314453, "global_step": 105453, "epoch": 1270} {"train_loss": -22.023033142089844, "global_step": 105454, "epoch": 1270} {"train_loss": -22.40943717956543, "global_step": 105455, "epoch": 1270} {"train_loss": -21.999414443969727, "global_step": 105456, "epoch": 1270} {"train_loss": -22.693567276000977, "global_step": 105457, "epoch": 1270} {"train_loss": -22.035659790039062, "global_step": 105458, "epoch": 1270} {"train_loss": -22.247495651245117, "global_step": 105459, "epoch": 1270} {"train_loss": -21.92612648010254, "global_step": 105460, "epoch": 1270} {"train_loss": -22.130125045776367, "global_step": 105461, "epoch": 1270} {"train_loss": -21.83698081970215, "global_step": 105462, "epoch": 1270} {"train_loss": -22.24268341064453, "global_step": 105463, "epoch": 1270} {"train_loss": -21.989633560180664, "global_step": 105464, "epoch": 1270} {"train_loss": -22.379858016967773, "global_step": 105465, "epoch": 1270} {"train_loss": -22.301183700561523, "global_step": 105466, "epoch": 1270} {"train_loss": -22.594074249267578, "global_step": 105467, "epoch": 1270} {"train_loss": -22.267616271972656, "global_step": 105468, "epoch": 1270} {"train_loss": -22.145898818969727, "global_step": 105469, "epoch": 1270} {"train_loss": -22.402231216430664, "global_step": 105470, "epoch": 1270} {"train_loss": -22.243366241455078, "global_step": 105471, "epoch": 1270} {"train_loss": -22.01296043395996, "global_step": 105472, "epoch": 1270} {"train_loss": -22.477598190307617, "global_step": 105473, "epoch": 1270} {"train_loss": -21.933298110961914, "global_step": 105474, "epoch": 1270} {"train_loss": -22.569984436035156, "global_step": 105475, "epoch": 1270} {"train_loss": -21.95556640625, "global_step": 105476, "epoch": 1270} {"train_loss": -21.97372817993164, "global_step": 105477, "epoch": 1270} {"train_loss": -22.15390396118164, "global_step": 105478, "epoch": 1270} {"train_loss": -21.777469635009766, "global_step": 105479, "epoch": 1270} {"train_loss": -22.028928756713867, "global_step": 105480, "epoch": 1270} {"train_loss": -21.965839385986328, "global_step": 105481, "epoch": 1270} {"train_loss": -22.410903930664062, "global_step": 105482, "epoch": 1270} {"train_loss": -22.077760696411133, "global_step": 105483, "epoch": 1270} {"train_loss": -22.006732940673828, "global_step": 105484, "epoch": 1270} {"train_loss": -21.748180389404297, "global_step": 105485, "epoch": 1270} {"train_loss": -21.881940841674805, "global_step": 105486, "epoch": 1270} {"train_loss": -22.045028686523438, "global_step": 105487, "epoch": 1270} {"train_loss": -22.310394287109375, "global_step": 105488, "epoch": 1270} {"train_loss": -21.81260108947754, "global_step": 105489, "epoch": 1270} {"train_loss": -21.82369041442871, "global_step": 105490, "epoch": 1270} {"train_loss": -22.246076583862305, "global_step": 105491, "epoch": 1270} {"train_loss": -22.08420204254518, "global_step": 105492, "epoch": 1270, "val_loss": 6253075.5} {"train_loss": -21.67289161682129, "global_step": 105493, "epoch": 1271} {"train_loss": -22.130130767822266, "global_step": 105494, "epoch": 1271} {"train_loss": -22.008291244506836, "global_step": 105495, "epoch": 1271} {"train_loss": -22.184778213500977, "global_step": 105496, "epoch": 1271} {"train_loss": -21.82005500793457, "global_step": 105497, "epoch": 1271} {"train_loss": -22.022323608398438, "global_step": 105498, "epoch": 1271} {"train_loss": -21.61635398864746, "global_step": 105499, "epoch": 1271} {"train_loss": -21.34442710876465, "global_step": 105500, "epoch": 1271} {"train_loss": -22.076139450073242, "global_step": 105501, "epoch": 1271} {"train_loss": -21.919544219970703, "global_step": 105502, "epoch": 1271} {"train_loss": -22.206125259399414, "global_step": 105503, "epoch": 1271} {"train_loss": -21.79448699951172, "global_step": 105504, "epoch": 1271} {"train_loss": -21.770084381103516, "global_step": 105505, "epoch": 1271} {"train_loss": -22.066726684570312, "global_step": 105506, "epoch": 1271} {"train_loss": -21.9381160736084, "global_step": 105507, "epoch": 1271} {"train_loss": -21.792821884155273, "global_step": 105508, "epoch": 1271} {"train_loss": -21.86400032043457, "global_step": 105509, "epoch": 1271} {"train_loss": -22.14678382873535, "global_step": 105510, "epoch": 1271} {"train_loss": -22.154523849487305, "global_step": 105511, "epoch": 1271} {"train_loss": -22.2299861907959, "global_step": 105512, "epoch": 1271} {"train_loss": -22.03771209716797, "global_step": 105513, "epoch": 1271} {"train_loss": -22.19392204284668, "global_step": 105514, "epoch": 1271} {"train_loss": -22.23185157775879, "global_step": 105515, "epoch": 1271} {"train_loss": -22.02408218383789, "global_step": 105516, "epoch": 1271} {"train_loss": -21.755247116088867, "global_step": 105517, "epoch": 1271} {"train_loss": -22.016050338745117, "global_step": 105518, "epoch": 1271} {"train_loss": -22.29867935180664, "global_step": 105519, "epoch": 1271} {"train_loss": -22.564266204833984, "global_step": 105520, "epoch": 1271} {"train_loss": -21.85732650756836, "global_step": 105521, "epoch": 1271} {"train_loss": -22.372312545776367, "global_step": 105522, "epoch": 1271} {"train_loss": -22.105337142944336, "global_step": 105523, "epoch": 1271} {"train_loss": -22.062515258789062, "global_step": 105524, "epoch": 1271} {"train_loss": -21.81695556640625, "global_step": 105525, "epoch": 1271} {"train_loss": -21.995264053344727, "global_step": 105526, "epoch": 1271} {"train_loss": -21.942819595336914, "global_step": 105527, "epoch": 1271} {"train_loss": -22.31734848022461, "global_step": 105528, "epoch": 1271} {"train_loss": -21.672945022583008, "global_step": 105529, "epoch": 1271} {"train_loss": -21.849435806274414, "global_step": 105530, "epoch": 1271} {"train_loss": -22.184595108032227, "global_step": 105531, "epoch": 1271} {"train_loss": -21.74686050415039, "global_step": 105532, "epoch": 1271} {"train_loss": -21.728303909301758, "global_step": 105533, "epoch": 1271} {"train_loss": -22.084197998046875, "global_step": 105534, "epoch": 1271} {"train_loss": -22.25830078125, "global_step": 105535, "epoch": 1271} {"train_loss": -21.794559478759766, "global_step": 105536, "epoch": 1271} {"train_loss": -21.97188377380371, "global_step": 105537, "epoch": 1271} {"train_loss": -22.153596878051758, "global_step": 105538, "epoch": 1271} {"train_loss": -22.170373916625977, "global_step": 105539, "epoch": 1271} {"train_loss": -21.895751953125, "global_step": 105540, "epoch": 1271} {"train_loss": -22.40028190612793, "global_step": 105541, "epoch": 1271} {"train_loss": -22.21380043029785, "global_step": 105542, "epoch": 1271} {"train_loss": -21.845346450805664, "global_step": 105543, "epoch": 1271} {"train_loss": -21.830801010131836, "global_step": 105544, "epoch": 1271} {"train_loss": -22.260433197021484, "global_step": 105545, "epoch": 1271} {"train_loss": -22.001901626586914, "global_step": 105546, "epoch": 1271} {"train_loss": -22.256820678710938, "global_step": 105547, "epoch": 1271} {"train_loss": -22.003650665283203, "global_step": 105548, "epoch": 1271} {"train_loss": -22.026123046875, "global_step": 105549, "epoch": 1271} {"train_loss": -22.11773681640625, "global_step": 105550, "epoch": 1271} {"train_loss": -22.1315860748291, "global_step": 105551, "epoch": 1271} {"train_loss": -22.177165985107422, "global_step": 105552, "epoch": 1271} {"train_loss": -22.2180233001709, "global_step": 105553, "epoch": 1271} {"train_loss": -21.95808219909668, "global_step": 105554, "epoch": 1271} {"train_loss": -22.466629028320312, "global_step": 105555, "epoch": 1271} {"train_loss": -21.85414695739746, "global_step": 105556, "epoch": 1271} {"train_loss": -22.28989028930664, "global_step": 105557, "epoch": 1271} {"train_loss": -21.78114128112793, "global_step": 105558, "epoch": 1271} {"train_loss": -21.98818588256836, "global_step": 105559, "epoch": 1271} {"train_loss": -22.286527633666992, "global_step": 105560, "epoch": 1271} {"train_loss": -22.23910140991211, "global_step": 105561, "epoch": 1271} {"train_loss": -22.260955810546875, "global_step": 105562, "epoch": 1271} {"train_loss": -22.29109764099121, "global_step": 105563, "epoch": 1271} {"train_loss": -22.184246063232422, "global_step": 105564, "epoch": 1271} {"train_loss": -22.312654495239258, "global_step": 105565, "epoch": 1271} {"train_loss": -21.591703414916992, "global_step": 105566, "epoch": 1271} {"train_loss": -21.937231063842773, "global_step": 105567, "epoch": 1271} {"train_loss": -21.983633041381836, "global_step": 105568, "epoch": 1271} {"train_loss": -21.949726104736328, "global_step": 105569, "epoch": 1271} {"train_loss": -22.024124145507812, "global_step": 105570, "epoch": 1271} {"train_loss": -22.43609619140625, "global_step": 105571, "epoch": 1271} {"train_loss": -22.18274688720703, "global_step": 105572, "epoch": 1271} {"train_loss": -21.800432205200195, "global_step": 105573, "epoch": 1271} {"train_loss": -22.364826202392578, "global_step": 105574, "epoch": 1271} {"train_loss": -22.056399494768627, "global_step": 105575, "epoch": 1271, "val_loss": 5978169.0} {"train_loss": -21.48142433166504, "global_step": 105576, "epoch": 1272} {"train_loss": -21.988239288330078, "global_step": 105577, "epoch": 1272} {"train_loss": -21.69868278503418, "global_step": 105578, "epoch": 1272} {"train_loss": -21.690771102905273, "global_step": 105579, "epoch": 1272} {"train_loss": -22.051633834838867, "global_step": 105580, "epoch": 1272} {"train_loss": -21.814916610717773, "global_step": 105581, "epoch": 1272} {"train_loss": -21.467782974243164, "global_step": 105582, "epoch": 1272} {"train_loss": -21.670059204101562, "global_step": 105583, "epoch": 1272} {"train_loss": -21.71232032775879, "global_step": 105584, "epoch": 1272} {"train_loss": -21.832355499267578, "global_step": 105585, "epoch": 1272} {"train_loss": -21.985097885131836, "global_step": 105586, "epoch": 1272} {"train_loss": -22.001501083374023, "global_step": 105587, "epoch": 1272} {"train_loss": -22.044652938842773, "global_step": 105588, "epoch": 1272} {"train_loss": -22.319324493408203, "global_step": 105589, "epoch": 1272} {"train_loss": -21.917510986328125, "global_step": 105590, "epoch": 1272} {"train_loss": -22.139850616455078, "global_step": 105591, "epoch": 1272} {"train_loss": -21.901119232177734, "global_step": 105592, "epoch": 1272} {"train_loss": -22.1136474609375, "global_step": 105593, "epoch": 1272} {"train_loss": -22.03717803955078, "global_step": 105594, "epoch": 1272} {"train_loss": -22.039880752563477, "global_step": 105595, "epoch": 1272} {"train_loss": -21.752960205078125, "global_step": 105596, "epoch": 1272} {"train_loss": -21.9260311126709, "global_step": 105597, "epoch": 1272} {"train_loss": -21.910959243774414, "global_step": 105598, "epoch": 1272} {"train_loss": -22.0433349609375, "global_step": 105599, "epoch": 1272} {"train_loss": -22.147884368896484, "global_step": 105600, "epoch": 1272} {"train_loss": -22.303869247436523, "global_step": 105601, "epoch": 1272} {"train_loss": -22.21564292907715, "global_step": 105602, "epoch": 1272} {"train_loss": -22.139263153076172, "global_step": 105603, "epoch": 1272} {"train_loss": -21.913686752319336, "global_step": 105604, "epoch": 1272} {"train_loss": -22.289398193359375, "global_step": 105605, "epoch": 1272} {"train_loss": -21.895505905151367, "global_step": 105606, "epoch": 1272} {"train_loss": -21.782957077026367, "global_step": 105607, "epoch": 1272} {"train_loss": -21.90435791015625, "global_step": 105608, "epoch": 1272} {"train_loss": -21.989545822143555, "global_step": 105609, "epoch": 1272} {"train_loss": -22.150903701782227, "global_step": 105610, "epoch": 1272} {"train_loss": -22.308691024780273, "global_step": 105611, "epoch": 1272} {"train_loss": -22.235504150390625, "global_step": 105612, "epoch": 1272} {"train_loss": -22.26017189025879, "global_step": 105613, "epoch": 1272} {"train_loss": -22.062952041625977, "global_step": 105614, "epoch": 1272} {"train_loss": -21.854854583740234, "global_step": 105615, "epoch": 1272} {"train_loss": -22.52165985107422, "global_step": 105616, "epoch": 1272} {"train_loss": -22.054838180541992, "global_step": 105617, "epoch": 1272} {"train_loss": -22.163297653198242, "global_step": 105618, "epoch": 1272} {"train_loss": -22.096181869506836, "global_step": 105619, "epoch": 1272} {"train_loss": -22.213876724243164, "global_step": 105620, "epoch": 1272} {"train_loss": -21.993179321289062, "global_step": 105621, "epoch": 1272} {"train_loss": -22.5640869140625, "global_step": 105622, "epoch": 1272} {"train_loss": -21.921138763427734, "global_step": 105623, "epoch": 1272} {"train_loss": -22.284570693969727, "global_step": 105624, "epoch": 1272} {"train_loss": -22.218490600585938, "global_step": 105625, "epoch": 1272} {"train_loss": -22.027698516845703, "global_step": 105626, "epoch": 1272} {"train_loss": -21.974876403808594, "global_step": 105627, "epoch": 1272} {"train_loss": -22.304183959960938, "global_step": 105628, "epoch": 1272} {"train_loss": -22.34462547302246, "global_step": 105629, "epoch": 1272} {"train_loss": -21.83536148071289, "global_step": 105630, "epoch": 1272} {"train_loss": -22.120079040527344, "global_step": 105631, "epoch": 1272} {"train_loss": -22.005422592163086, "global_step": 105632, "epoch": 1272} {"train_loss": -22.022537231445312, "global_step": 105633, "epoch": 1272} {"train_loss": -21.885366439819336, "global_step": 105634, "epoch": 1272} {"train_loss": -21.927072525024414, "global_step": 105635, "epoch": 1272} {"train_loss": -21.973600387573242, "global_step": 105636, "epoch": 1272} {"train_loss": -22.051008224487305, "global_step": 105637, "epoch": 1272} {"train_loss": -22.124847412109375, "global_step": 105638, "epoch": 1272} {"train_loss": -22.302032470703125, "global_step": 105639, "epoch": 1272} {"train_loss": -22.511550903320312, "global_step": 105640, "epoch": 1272} {"train_loss": -22.202030181884766, "global_step": 105641, "epoch": 1272} {"train_loss": -22.137737274169922, "global_step": 105642, "epoch": 1272} {"train_loss": -21.7691707611084, "global_step": 105643, "epoch": 1272} {"train_loss": -22.093198776245117, "global_step": 105644, "epoch": 1272} {"train_loss": -21.96831512451172, "global_step": 105645, "epoch": 1272} {"train_loss": -22.415695190429688, "global_step": 105646, "epoch": 1272} {"train_loss": -22.259904861450195, "global_step": 105647, "epoch": 1272} {"train_loss": -22.22893524169922, "global_step": 105648, "epoch": 1272} {"train_loss": -22.423288345336914, "global_step": 105649, "epoch": 1272} {"train_loss": -22.091751098632812, "global_step": 105650, "epoch": 1272} {"train_loss": -22.556875228881836, "global_step": 105651, "epoch": 1272} {"train_loss": -21.655630111694336, "global_step": 105652, "epoch": 1272} {"train_loss": -22.30023193359375, "global_step": 105653, "epoch": 1272} {"train_loss": -22.09572982788086, "global_step": 105654, "epoch": 1272} {"train_loss": -22.133026123046875, "global_step": 105655, "epoch": 1272} {"train_loss": -22.681310653686523, "global_step": 105656, "epoch": 1272} {"train_loss": -22.42388916015625, "global_step": 105657, "epoch": 1272} {"train_loss": -22.0618942444583, "global_step": 105658, "epoch": 1272, "val_loss": 6108780.0} {"train_loss": -21.826492309570312, "global_step": 105659, "epoch": 1273} {"train_loss": -22.076292037963867, "global_step": 105660, "epoch": 1273} {"train_loss": -21.799362182617188, "global_step": 105661, "epoch": 1273} {"train_loss": -21.735021591186523, "global_step": 105662, "epoch": 1273} {"train_loss": -22.006290435791016, "global_step": 105663, "epoch": 1273} {"train_loss": -22.206960678100586, "global_step": 105664, "epoch": 1273} {"train_loss": -22.112394332885742, "global_step": 105665, "epoch": 1273} {"train_loss": -22.188344955444336, "global_step": 105666, "epoch": 1273} {"train_loss": -22.21354103088379, "global_step": 105667, "epoch": 1273} {"train_loss": -21.63558006286621, "global_step": 105668, "epoch": 1273} {"train_loss": -22.063711166381836, "global_step": 105669, "epoch": 1273} {"train_loss": -21.668073654174805, "global_step": 105670, "epoch": 1273} {"train_loss": -22.47365379333496, "global_step": 105671, "epoch": 1273} {"train_loss": -22.16934585571289, "global_step": 105672, "epoch": 1273} {"train_loss": -21.9332218170166, "global_step": 105673, "epoch": 1273} {"train_loss": -21.879413604736328, "global_step": 105674, "epoch": 1273} {"train_loss": -22.129423141479492, "global_step": 105675, "epoch": 1273} {"train_loss": -21.934263229370117, "global_step": 105676, "epoch": 1273} {"train_loss": -22.41109275817871, "global_step": 105677, "epoch": 1273} {"train_loss": -22.228347778320312, "global_step": 105678, "epoch": 1273} {"train_loss": -21.798368453979492, "global_step": 105679, "epoch": 1273} {"train_loss": -22.36477279663086, "global_step": 105680, "epoch": 1273} {"train_loss": -22.002042770385742, "global_step": 105681, "epoch": 1273} {"train_loss": -22.171669006347656, "global_step": 105682, "epoch": 1273} {"train_loss": -22.476211547851562, "global_step": 105683, "epoch": 1273} {"train_loss": -21.877344131469727, "global_step": 105684, "epoch": 1273} {"train_loss": -22.35707664489746, "global_step": 105685, "epoch": 1273} {"train_loss": -22.076704025268555, "global_step": 105686, "epoch": 1273} {"train_loss": -22.453153610229492, "global_step": 105687, "epoch": 1273} {"train_loss": -22.51667594909668, "global_step": 105688, "epoch": 1273} {"train_loss": -21.705087661743164, "global_step": 105689, "epoch": 1273} {"train_loss": -22.071622848510742, "global_step": 105690, "epoch": 1273} {"train_loss": -22.17909049987793, "global_step": 105691, "epoch": 1273} {"train_loss": -21.724760055541992, "global_step": 105692, "epoch": 1273} {"train_loss": -21.710418701171875, "global_step": 105693, "epoch": 1273} {"train_loss": -22.12689781188965, "global_step": 105694, "epoch": 1273} {"train_loss": -22.20478630065918, "global_step": 105695, "epoch": 1273} {"train_loss": -22.506208419799805, "global_step": 105696, "epoch": 1273} {"train_loss": -22.176847457885742, "global_step": 105697, "epoch": 1273} {"train_loss": -22.259302139282227, "global_step": 105698, "epoch": 1273} {"train_loss": -22.320024490356445, "global_step": 105699, "epoch": 1273} {"train_loss": -22.179840087890625, "global_step": 105700, "epoch": 1273} {"train_loss": -22.548282623291016, "global_step": 105701, "epoch": 1273} {"train_loss": -22.00191307067871, "global_step": 105702, "epoch": 1273} {"train_loss": -22.420751571655273, "global_step": 105703, "epoch": 1273} {"train_loss": -22.260223388671875, "global_step": 105704, "epoch": 1273} {"train_loss": -22.1957950592041, "global_step": 105705, "epoch": 1273} {"train_loss": -22.012205123901367, "global_step": 105706, "epoch": 1273} {"train_loss": -22.314834594726562, "global_step": 105707, "epoch": 1273} {"train_loss": -22.43892478942871, "global_step": 105708, "epoch": 1273} {"train_loss": -22.11191749572754, "global_step": 105709, "epoch": 1273} {"train_loss": -22.010019302368164, "global_step": 105710, "epoch": 1273} {"train_loss": -21.8775577545166, "global_step": 105711, "epoch": 1273} {"train_loss": -22.12145233154297, "global_step": 105712, "epoch": 1273} {"train_loss": -22.390514373779297, "global_step": 105713, "epoch": 1273} {"train_loss": -22.037580490112305, "global_step": 105714, "epoch": 1273} {"train_loss": -22.456525802612305, "global_step": 105715, "epoch": 1273} {"train_loss": -22.188419342041016, "global_step": 105716, "epoch": 1273} {"train_loss": -22.625539779663086, "global_step": 105717, "epoch": 1273} {"train_loss": -22.306655883789062, "global_step": 105718, "epoch": 1273} {"train_loss": -22.17359733581543, "global_step": 105719, "epoch": 1273} {"train_loss": -22.04583168029785, "global_step": 105720, "epoch": 1273} {"train_loss": -22.162097930908203, "global_step": 105721, "epoch": 1273} {"train_loss": -22.09440040588379, "global_step": 105722, "epoch": 1273} {"train_loss": -22.15526008605957, "global_step": 105723, "epoch": 1273} {"train_loss": -22.06577491760254, "global_step": 105724, "epoch": 1273} {"train_loss": -21.797962188720703, "global_step": 105725, "epoch": 1273} {"train_loss": -22.066741943359375, "global_step": 105726, "epoch": 1273} {"train_loss": -21.702945709228516, "global_step": 105727, "epoch": 1273} {"train_loss": -22.17267417907715, "global_step": 105728, "epoch": 1273} {"train_loss": -22.05685043334961, "global_step": 105729, "epoch": 1273} {"train_loss": -22.08929443359375, "global_step": 105730, "epoch": 1273} {"train_loss": -22.25896644592285, "global_step": 105731, "epoch": 1273} {"train_loss": -22.30900001525879, "global_step": 105732, "epoch": 1273} {"train_loss": -22.150482177734375, "global_step": 105733, "epoch": 1273} {"train_loss": -22.172544479370117, "global_step": 105734, "epoch": 1273} {"train_loss": -21.939990997314453, "global_step": 105735, "epoch": 1273} {"train_loss": -22.12592887878418, "global_step": 105736, "epoch": 1273} {"train_loss": -22.058326721191406, "global_step": 105737, "epoch": 1273} {"train_loss": -22.18113136291504, "global_step": 105738, "epoch": 1273} {"train_loss": -22.073518753051758, "global_step": 105739, "epoch": 1273} {"train_loss": -22.197696685791016, "global_step": 105740, "epoch": 1273} {"train_loss": -22.1225121739399, "global_step": 105741, "epoch": 1273, "val_loss": 6133453.0} {"train_loss": -21.690732955932617, "global_step": 105742, "epoch": 1274} {"train_loss": -21.7674617767334, "global_step": 105743, "epoch": 1274} {"train_loss": -21.994430541992188, "global_step": 105744, "epoch": 1274} {"train_loss": -22.0396728515625, "global_step": 105745, "epoch": 1274} {"train_loss": -22.07097053527832, "global_step": 105746, "epoch": 1274} {"train_loss": -21.856918334960938, "global_step": 105747, "epoch": 1274} {"train_loss": -21.77252197265625, "global_step": 105748, "epoch": 1274} {"train_loss": -21.988208770751953, "global_step": 105749, "epoch": 1274} {"train_loss": -22.236400604248047, "global_step": 105750, "epoch": 1274} {"train_loss": -21.65716552734375, "global_step": 105751, "epoch": 1274} {"train_loss": -22.094654083251953, "global_step": 105752, "epoch": 1274} {"train_loss": -22.02655029296875, "global_step": 105753, "epoch": 1274} {"train_loss": -22.044967651367188, "global_step": 105754, "epoch": 1274} {"train_loss": -22.091062545776367, "global_step": 105755, "epoch": 1274} {"train_loss": -22.223766326904297, "global_step": 105756, "epoch": 1274} {"train_loss": -21.934751510620117, "global_step": 105757, "epoch": 1274} {"train_loss": -21.550445556640625, "global_step": 105758, "epoch": 1274} {"train_loss": -21.36329460144043, "global_step": 105759, "epoch": 1274} {"train_loss": -21.99878692626953, "global_step": 105760, "epoch": 1274} {"train_loss": -22.085355758666992, "global_step": 105761, "epoch": 1274} {"train_loss": -21.917346954345703, "global_step": 105762, "epoch": 1274} {"train_loss": -22.34647560119629, "global_step": 105763, "epoch": 1274} {"train_loss": -22.001327514648438, "global_step": 105764, "epoch": 1274} {"train_loss": -22.070287704467773, "global_step": 105765, "epoch": 1274} {"train_loss": -21.803558349609375, "global_step": 105766, "epoch": 1274} {"train_loss": -22.270456314086914, "global_step": 105767, "epoch": 1274} {"train_loss": -22.00787353515625, "global_step": 105768, "epoch": 1274} {"train_loss": -21.905502319335938, "global_step": 105769, "epoch": 1274} {"train_loss": -21.66385269165039, "global_step": 105770, "epoch": 1274} {"train_loss": -21.778308868408203, "global_step": 105771, "epoch": 1274} {"train_loss": -21.736108779907227, "global_step": 105772, "epoch": 1274} {"train_loss": -21.97818946838379, "global_step": 105773, "epoch": 1274} {"train_loss": -21.687231063842773, "global_step": 105774, "epoch": 1274} {"train_loss": -22.12135887145996, "global_step": 105775, "epoch": 1274} {"train_loss": -22.082111358642578, "global_step": 105776, "epoch": 1274} {"train_loss": -21.942426681518555, "global_step": 105777, "epoch": 1274} {"train_loss": -21.64361000061035, "global_step": 105778, "epoch": 1274} {"train_loss": -21.803308486938477, "global_step": 105779, "epoch": 1274} {"train_loss": -22.33447265625, "global_step": 105780, "epoch": 1274} {"train_loss": -21.982786178588867, "global_step": 105781, "epoch": 1274} {"train_loss": -21.609962463378906, "global_step": 105782, "epoch": 1274} {"train_loss": -21.968778610229492, "global_step": 105783, "epoch": 1274} {"train_loss": -22.007652282714844, "global_step": 105784, "epoch": 1274} {"train_loss": -21.93336296081543, "global_step": 105785, "epoch": 1274} {"train_loss": -22.037673950195312, "global_step": 105786, "epoch": 1274} {"train_loss": -22.513473510742188, "global_step": 105787, "epoch": 1274} {"train_loss": -21.998634338378906, "global_step": 105788, "epoch": 1274} {"train_loss": -22.26093864440918, "global_step": 105789, "epoch": 1274} {"train_loss": -21.973066329956055, "global_step": 105790, "epoch": 1274} {"train_loss": -22.13348960876465, "global_step": 105791, "epoch": 1274} {"train_loss": -22.211091995239258, "global_step": 105792, "epoch": 1274} {"train_loss": -22.196687698364258, "global_step": 105793, "epoch": 1274} {"train_loss": -22.41913604736328, "global_step": 105794, "epoch": 1274} {"train_loss": -22.145580291748047, "global_step": 105795, "epoch": 1274} {"train_loss": -22.35682487487793, "global_step": 105796, "epoch": 1274} {"train_loss": -22.14311981201172, "global_step": 105797, "epoch": 1274} {"train_loss": -21.95341682434082, "global_step": 105798, "epoch": 1274} {"train_loss": -22.57974624633789, "global_step": 105799, "epoch": 1274} {"train_loss": -22.420652389526367, "global_step": 105800, "epoch": 1274} {"train_loss": -22.003812789916992, "global_step": 105801, "epoch": 1274} {"train_loss": -22.5089111328125, "global_step": 105802, "epoch": 1274} {"train_loss": -22.086029052734375, "global_step": 105803, "epoch": 1274} {"train_loss": -22.003904342651367, "global_step": 105804, "epoch": 1274} {"train_loss": -21.949045181274414, "global_step": 105805, "epoch": 1274} {"train_loss": -22.24536895751953, "global_step": 105806, "epoch": 1274} {"train_loss": -22.228614807128906, "global_step": 105807, "epoch": 1274} {"train_loss": -22.248672485351562, "global_step": 105808, "epoch": 1274} {"train_loss": -22.064388275146484, "global_step": 105809, "epoch": 1274} {"train_loss": -21.877424240112305, "global_step": 105810, "epoch": 1274} {"train_loss": -21.61541175842285, "global_step": 105811, "epoch": 1274} {"train_loss": -22.29705810546875, "global_step": 105812, "epoch": 1274} {"train_loss": -21.975543975830078, "global_step": 105813, "epoch": 1274} {"train_loss": -21.82951545715332, "global_step": 105814, "epoch": 1274} {"train_loss": -21.941083908081055, "global_step": 105815, "epoch": 1274} {"train_loss": -22.26986312866211, "global_step": 105816, "epoch": 1274} {"train_loss": -21.82138442993164, "global_step": 105817, "epoch": 1274} {"train_loss": -22.082040786743164, "global_step": 105818, "epoch": 1274} {"train_loss": -22.13641929626465, "global_step": 105819, "epoch": 1274} {"train_loss": -22.03828239440918, "global_step": 105820, "epoch": 1274} {"train_loss": -21.920034408569336, "global_step": 105821, "epoch": 1274} {"train_loss": -22.218276977539062, "global_step": 105822, "epoch": 1274} {"train_loss": -22.165220260620117, "global_step": 105823, "epoch": 1274} {"train_loss": -22.021804120167193, "global_step": 105824, "epoch": 1274, "val_loss": 6141334.0} {"train_loss": -21.74164390563965, "global_step": 105825, "epoch": 1275} {"train_loss": -21.475751876831055, "global_step": 105826, "epoch": 1275} {"train_loss": -21.87923240661621, "global_step": 105827, "epoch": 1275} {"train_loss": -21.628507614135742, "global_step": 105828, "epoch": 1275} {"train_loss": -21.817968368530273, "global_step": 105829, "epoch": 1275} {"train_loss": -21.760120391845703, "global_step": 105830, "epoch": 1275} {"train_loss": -21.958295822143555, "global_step": 105831, "epoch": 1275} {"train_loss": -21.769725799560547, "global_step": 105832, "epoch": 1275} {"train_loss": -21.919130325317383, "global_step": 105833, "epoch": 1275} {"train_loss": -21.936111450195312, "global_step": 105834, "epoch": 1275} {"train_loss": -22.216665267944336, "global_step": 105835, "epoch": 1275} {"train_loss": -21.9033145904541, "global_step": 105836, "epoch": 1275} {"train_loss": -21.910749435424805, "global_step": 105837, "epoch": 1275} {"train_loss": -21.73725700378418, "global_step": 105838, "epoch": 1275} {"train_loss": -21.701513290405273, "global_step": 105839, "epoch": 1275} {"train_loss": -21.90848159790039, "global_step": 105840, "epoch": 1275} {"train_loss": -21.870038986206055, "global_step": 105841, "epoch": 1275} {"train_loss": -22.188983917236328, "global_step": 105842, "epoch": 1275} {"train_loss": -21.744274139404297, "global_step": 105843, "epoch": 1275} {"train_loss": -22.15526008605957, "global_step": 105844, "epoch": 1275} {"train_loss": -21.79927635192871, "global_step": 105845, "epoch": 1275} {"train_loss": -21.938791275024414, "global_step": 105846, "epoch": 1275} {"train_loss": -21.868741989135742, "global_step": 105847, "epoch": 1275} {"train_loss": -21.805212020874023, "global_step": 105848, "epoch": 1275} {"train_loss": -22.047849655151367, "global_step": 105849, "epoch": 1275} {"train_loss": -22.071165084838867, "global_step": 105850, "epoch": 1275} {"train_loss": -21.994457244873047, "global_step": 105851, "epoch": 1275} {"train_loss": -22.180692672729492, "global_step": 105852, "epoch": 1275} {"train_loss": -22.32407569885254, "global_step": 105853, "epoch": 1275} {"train_loss": -21.852718353271484, "global_step": 105854, "epoch": 1275} {"train_loss": -22.407089233398438, "global_step": 105855, "epoch": 1275} {"train_loss": -22.002613067626953, "global_step": 105856, "epoch": 1275} {"train_loss": -22.338058471679688, "global_step": 105857, "epoch": 1275} {"train_loss": -22.177778244018555, "global_step": 105858, "epoch": 1275} {"train_loss": -21.92430305480957, "global_step": 105859, "epoch": 1275} {"train_loss": -21.858747482299805, "global_step": 105860, "epoch": 1275} {"train_loss": -22.58582878112793, "global_step": 105861, "epoch": 1275} {"train_loss": -22.319337844848633, "global_step": 105862, "epoch": 1275} {"train_loss": -22.187808990478516, "global_step": 105863, "epoch": 1275} {"train_loss": -22.23162269592285, "global_step": 105864, "epoch": 1275} {"train_loss": -22.112340927124023, "global_step": 105865, "epoch": 1275} {"train_loss": -22.09145164489746, "global_step": 105866, "epoch": 1275} {"train_loss": -21.63641929626465, "global_step": 105867, "epoch": 1275} {"train_loss": -22.434131622314453, "global_step": 105868, "epoch": 1275} {"train_loss": -21.923233032226562, "global_step": 105869, "epoch": 1275} {"train_loss": -22.25153160095215, "global_step": 105870, "epoch": 1275} {"train_loss": -22.282262802124023, "global_step": 105871, "epoch": 1275} {"train_loss": -22.186288833618164, "global_step": 105872, "epoch": 1275} {"train_loss": -22.259521484375, "global_step": 105873, "epoch": 1275} {"train_loss": -21.957494735717773, "global_step": 105874, "epoch": 1275} {"train_loss": -22.249156951904297, "global_step": 105875, "epoch": 1275} {"train_loss": -22.6125431060791, "global_step": 105876, "epoch": 1275} {"train_loss": -22.1335391998291, "global_step": 105877, "epoch": 1275} {"train_loss": -22.05084800720215, "global_step": 105878, "epoch": 1275} {"train_loss": -22.381559371948242, "global_step": 105879, "epoch": 1275} {"train_loss": -21.82343864440918, "global_step": 105880, "epoch": 1275} {"train_loss": -21.938583374023438, "global_step": 105881, "epoch": 1275} {"train_loss": -22.09820556640625, "global_step": 105882, "epoch": 1275} {"train_loss": -21.948017120361328, "global_step": 105883, "epoch": 1275} {"train_loss": -22.323232650756836, "global_step": 105884, "epoch": 1275} {"train_loss": -22.309757232666016, "global_step": 105885, "epoch": 1275} {"train_loss": -21.950796127319336, "global_step": 105886, "epoch": 1275} {"train_loss": -22.0512752532959, "global_step": 105887, "epoch": 1275} {"train_loss": -22.373592376708984, "global_step": 105888, "epoch": 1275} {"train_loss": -22.012365341186523, "global_step": 105889, "epoch": 1275} {"train_loss": -21.889001846313477, "global_step": 105890, "epoch": 1275} {"train_loss": -21.9198055267334, "global_step": 105891, "epoch": 1275} {"train_loss": -22.32599639892578, "global_step": 105892, "epoch": 1275} {"train_loss": -21.962528228759766, "global_step": 105893, "epoch": 1275} {"train_loss": -21.878406524658203, "global_step": 105894, "epoch": 1275} {"train_loss": -22.289024353027344, "global_step": 105895, "epoch": 1275} {"train_loss": -22.647199630737305, "global_step": 105896, "epoch": 1275} {"train_loss": -22.014068603515625, "global_step": 105897, "epoch": 1275} {"train_loss": -22.5325870513916, "global_step": 105898, "epoch": 1275} {"train_loss": -21.97368049621582, "global_step": 105899, "epoch": 1275} {"train_loss": -21.642032623291016, "global_step": 105900, "epoch": 1275} {"train_loss": -22.069459915161133, "global_step": 105901, "epoch": 1275} {"train_loss": -22.248058319091797, "global_step": 105902, "epoch": 1275} {"train_loss": -22.12420654296875, "global_step": 105903, "epoch": 1275} {"train_loss": -21.948108673095703, "global_step": 105904, "epoch": 1275} {"train_loss": -22.043725967407227, "global_step": 105905, "epoch": 1275} {"train_loss": -21.958770751953125, "global_step": 105906, "epoch": 1275} {"train_loss": -22.068800868758235, "global_step": 105907, "epoch": 1275, "val_loss": 6064092.0} {"train_loss": -21.23641014099121, "global_step": 105908, "epoch": 1276} {"train_loss": -21.78645133972168, "global_step": 105909, "epoch": 1276} {"train_loss": -21.43320655822754, "global_step": 105910, "epoch": 1276} {"train_loss": -21.39569091796875, "global_step": 105911, "epoch": 1276} {"train_loss": -21.50811767578125, "global_step": 105912, "epoch": 1276} {"train_loss": -21.51213836669922, "global_step": 105913, "epoch": 1276} {"train_loss": -21.596858978271484, "global_step": 105914, "epoch": 1276} {"train_loss": -21.672739028930664, "global_step": 105915, "epoch": 1276} {"train_loss": -21.722082138061523, "global_step": 105916, "epoch": 1276} {"train_loss": -21.607654571533203, "global_step": 105917, "epoch": 1276} {"train_loss": -21.561330795288086, "global_step": 105918, "epoch": 1276} {"train_loss": -21.818681716918945, "global_step": 105919, "epoch": 1276} {"train_loss": -21.70290184020996, "global_step": 105920, "epoch": 1276} {"train_loss": -21.729063034057617, "global_step": 105921, "epoch": 1276} {"train_loss": -22.059179306030273, "global_step": 105922, "epoch": 1276} {"train_loss": -22.09085464477539, "global_step": 105923, "epoch": 1276} {"train_loss": -21.904346466064453, "global_step": 105924, "epoch": 1276} {"train_loss": -21.676589965820312, "global_step": 105925, "epoch": 1276} {"train_loss": -21.71672248840332, "global_step": 105926, "epoch": 1276} {"train_loss": -21.922277450561523, "global_step": 105927, "epoch": 1276} {"train_loss": -22.07394790649414, "global_step": 105928, "epoch": 1276} {"train_loss": -21.949499130249023, "global_step": 105929, "epoch": 1276} {"train_loss": -21.981800079345703, "global_step": 105930, "epoch": 1276} {"train_loss": -21.872713088989258, "global_step": 105931, "epoch": 1276} {"train_loss": -22.195823669433594, "global_step": 105932, "epoch": 1276} {"train_loss": -21.852869033813477, "global_step": 105933, "epoch": 1276} {"train_loss": -22.291208267211914, "global_step": 105934, "epoch": 1276} {"train_loss": -21.73975944519043, "global_step": 105935, "epoch": 1276} {"train_loss": -22.033170700073242, "global_step": 105936, "epoch": 1276} {"train_loss": -22.10227394104004, "global_step": 105937, "epoch": 1276} {"train_loss": -22.029972076416016, "global_step": 105938, "epoch": 1276} {"train_loss": -21.845212936401367, "global_step": 105939, "epoch": 1276} {"train_loss": -21.91233253479004, "global_step": 105940, "epoch": 1276} {"train_loss": -22.550979614257812, "global_step": 105941, "epoch": 1276} {"train_loss": -22.05762481689453, "global_step": 105942, "epoch": 1276} {"train_loss": -21.95751953125, "global_step": 105943, "epoch": 1276} {"train_loss": -22.213272094726562, "global_step": 105944, "epoch": 1276} {"train_loss": -22.182525634765625, "global_step": 105945, "epoch": 1276} {"train_loss": -22.4263916015625, "global_step": 105946, "epoch": 1276} {"train_loss": -22.186613082885742, "global_step": 105947, "epoch": 1276} {"train_loss": -22.19399070739746, "global_step": 105948, "epoch": 1276} {"train_loss": -22.281814575195312, "global_step": 105949, "epoch": 1276} {"train_loss": -21.627639770507812, "global_step": 105950, "epoch": 1276} {"train_loss": -22.403867721557617, "global_step": 105951, "epoch": 1276} {"train_loss": -22.0864315032959, "global_step": 105952, "epoch": 1276} {"train_loss": -22.10835075378418, "global_step": 105953, "epoch": 1276} {"train_loss": -22.032390594482422, "global_step": 105954, "epoch": 1276} {"train_loss": -22.15443229675293, "global_step": 105955, "epoch": 1276} {"train_loss": -22.20102882385254, "global_step": 105956, "epoch": 1276} {"train_loss": -22.383609771728516, "global_step": 105957, "epoch": 1276} {"train_loss": -21.938892364501953, "global_step": 105958, "epoch": 1276} {"train_loss": -22.119733810424805, "global_step": 105959, "epoch": 1276} {"train_loss": -22.01462173461914, "global_step": 105960, "epoch": 1276} {"train_loss": -21.92774772644043, "global_step": 105961, "epoch": 1276} {"train_loss": -22.15486717224121, "global_step": 105962, "epoch": 1276} {"train_loss": -22.383975982666016, "global_step": 105963, "epoch": 1276} {"train_loss": -22.164655685424805, "global_step": 105964, "epoch": 1276} {"train_loss": -22.232038497924805, "global_step": 105965, "epoch": 1276} {"train_loss": -21.828907012939453, "global_step": 105966, "epoch": 1276} {"train_loss": -22.313547134399414, "global_step": 105967, "epoch": 1276} {"train_loss": -22.502538681030273, "global_step": 105968, "epoch": 1276} {"train_loss": -21.955915451049805, "global_step": 105969, "epoch": 1276} {"train_loss": -21.85697364807129, "global_step": 105970, "epoch": 1276} {"train_loss": -22.26637840270996, "global_step": 105971, "epoch": 1276} {"train_loss": -22.157468795776367, "global_step": 105972, "epoch": 1276} {"train_loss": -21.668115615844727, "global_step": 105973, "epoch": 1276} {"train_loss": -22.103437423706055, "global_step": 105974, "epoch": 1276} {"train_loss": -22.165348052978516, "global_step": 105975, "epoch": 1276} {"train_loss": -22.151233673095703, "global_step": 105976, "epoch": 1276} {"train_loss": -22.40562629699707, "global_step": 105977, "epoch": 1276} {"train_loss": -22.34397315979004, "global_step": 105978, "epoch": 1276} {"train_loss": -21.947839736938477, "global_step": 105979, "epoch": 1276} {"train_loss": -22.144105911254883, "global_step": 105980, "epoch": 1276} {"train_loss": -21.792287826538086, "global_step": 105981, "epoch": 1276} {"train_loss": -22.034143447875977, "global_step": 105982, "epoch": 1276} {"train_loss": -21.66935920715332, "global_step": 105983, "epoch": 1276} {"train_loss": -21.58766746520996, "global_step": 105984, "epoch": 1276} {"train_loss": -21.68781089782715, "global_step": 105985, "epoch": 1276} {"train_loss": -21.965879440307617, "global_step": 105986, "epoch": 1276} {"train_loss": -22.17217445373535, "global_step": 105987, "epoch": 1276} {"train_loss": -22.01592445373535, "global_step": 105988, "epoch": 1276} {"train_loss": -22.43613052368164, "global_step": 105989, "epoch": 1276} {"train_loss": -21.992938076157166, "global_step": 105990, "epoch": 1276, "val_loss": 6195090.5} {"train_loss": -21.62525177001953, "global_step": 105991, "epoch": 1277} {"train_loss": -22.023990631103516, "global_step": 105992, "epoch": 1277} {"train_loss": -21.67734718322754, "global_step": 105993, "epoch": 1277} {"train_loss": -21.79010009765625, "global_step": 105994, "epoch": 1277} {"train_loss": -21.97540855407715, "global_step": 105995, "epoch": 1277} {"train_loss": -22.175439834594727, "global_step": 105996, "epoch": 1277} {"train_loss": -21.68256950378418, "global_step": 105997, "epoch": 1277} {"train_loss": -22.116348266601562, "global_step": 105998, "epoch": 1277} {"train_loss": -22.287433624267578, "global_step": 105999, "epoch": 1277} {"train_loss": -22.10557746887207, "global_step": 106000, "epoch": 1277} {"train_loss": -22.345121383666992, "global_step": 106001, "epoch": 1277} {"train_loss": -21.749364852905273, "global_step": 106002, "epoch": 1277} {"train_loss": -22.264408111572266, "global_step": 106003, "epoch": 1277} {"train_loss": -21.968515396118164, "global_step": 106004, "epoch": 1277} {"train_loss": -22.13771629333496, "global_step": 106005, "epoch": 1277} {"train_loss": -22.157733917236328, "global_step": 106006, "epoch": 1277} {"train_loss": -22.184675216674805, "global_step": 106007, "epoch": 1277} {"train_loss": -22.13574981689453, "global_step": 106008, "epoch": 1277} {"train_loss": -22.182355880737305, "global_step": 106009, "epoch": 1277} {"train_loss": -22.144718170166016, "global_step": 106010, "epoch": 1277} {"train_loss": -22.188947677612305, "global_step": 106011, "epoch": 1277} {"train_loss": -21.76589012145996, "global_step": 106012, "epoch": 1277} {"train_loss": -22.16571044921875, "global_step": 106013, "epoch": 1277} {"train_loss": -21.976348876953125, "global_step": 106014, "epoch": 1277} {"train_loss": -22.23508644104004, "global_step": 106015, "epoch": 1277} {"train_loss": -21.8483943939209, "global_step": 106016, "epoch": 1277} {"train_loss": -21.995681762695312, "global_step": 106017, "epoch": 1277} {"train_loss": -22.082782745361328, "global_step": 106018, "epoch": 1277} {"train_loss": -22.373960494995117, "global_step": 106019, "epoch": 1277} {"train_loss": -22.19314956665039, "global_step": 106020, "epoch": 1277} {"train_loss": -22.134384155273438, "global_step": 106021, "epoch": 1277} {"train_loss": -22.092897415161133, "global_step": 106022, "epoch": 1277} {"train_loss": -22.370229721069336, "global_step": 106023, "epoch": 1277} {"train_loss": -22.082426071166992, "global_step": 106024, "epoch": 1277} {"train_loss": -22.003755569458008, "global_step": 106025, "epoch": 1277} {"train_loss": -22.004064559936523, "global_step": 106026, "epoch": 1277} {"train_loss": -22.635746002197266, "global_step": 106027, "epoch": 1277} {"train_loss": -21.77414321899414, "global_step": 106028, "epoch": 1277} {"train_loss": -21.867918014526367, "global_step": 106029, "epoch": 1277} {"train_loss": -22.408361434936523, "global_step": 106030, "epoch": 1277} {"train_loss": -22.0609188079834, "global_step": 106031, "epoch": 1277} {"train_loss": -22.328868865966797, "global_step": 106032, "epoch": 1277} {"train_loss": -21.927175521850586, "global_step": 106033, "epoch": 1277} {"train_loss": -22.22012710571289, "global_step": 106034, "epoch": 1277} {"train_loss": -22.04498863220215, "global_step": 106035, "epoch": 1277} {"train_loss": -22.117469787597656, "global_step": 106036, "epoch": 1277} {"train_loss": -21.735870361328125, "global_step": 106037, "epoch": 1277} {"train_loss": -21.991355895996094, "global_step": 106038, "epoch": 1277} {"train_loss": -21.946630477905273, "global_step": 106039, "epoch": 1277} {"train_loss": -22.286733627319336, "global_step": 106040, "epoch": 1277} {"train_loss": -22.031835556030273, "global_step": 106041, "epoch": 1277} {"train_loss": -21.805988311767578, "global_step": 106042, "epoch": 1277} {"train_loss": -21.99818229675293, "global_step": 106043, "epoch": 1277} {"train_loss": -22.35940933227539, "global_step": 106044, "epoch": 1277} {"train_loss": -22.11539077758789, "global_step": 106045, "epoch": 1277} {"train_loss": -22.0872802734375, "global_step": 106046, "epoch": 1277} {"train_loss": -22.05674934387207, "global_step": 106047, "epoch": 1277} {"train_loss": -21.97995948791504, "global_step": 106048, "epoch": 1277} {"train_loss": -22.188339233398438, "global_step": 106049, "epoch": 1277} {"train_loss": -21.988012313842773, "global_step": 106050, "epoch": 1277} {"train_loss": -21.98701286315918, "global_step": 106051, "epoch": 1277} {"train_loss": -22.17247200012207, "global_step": 106052, "epoch": 1277} {"train_loss": -22.080501556396484, "global_step": 106053, "epoch": 1277} {"train_loss": -22.313400268554688, "global_step": 106054, "epoch": 1277} {"train_loss": -22.147855758666992, "global_step": 106055, "epoch": 1277} {"train_loss": -22.122949600219727, "global_step": 106056, "epoch": 1277} {"train_loss": -22.366430282592773, "global_step": 106057, "epoch": 1277} {"train_loss": -22.085851669311523, "global_step": 106058, "epoch": 1277} {"train_loss": -22.166330337524414, "global_step": 106059, "epoch": 1277} {"train_loss": -21.87253761291504, "global_step": 106060, "epoch": 1277} {"train_loss": -21.90338706970215, "global_step": 106061, "epoch": 1277} {"train_loss": -22.305212020874023, "global_step": 106062, "epoch": 1277} {"train_loss": -22.385900497436523, "global_step": 106063, "epoch": 1277} {"train_loss": -22.485204696655273, "global_step": 106064, "epoch": 1277} {"train_loss": -22.0167293548584, "global_step": 106065, "epoch": 1277} {"train_loss": -22.661508560180664, "global_step": 106066, "epoch": 1277} {"train_loss": -22.35400390625, "global_step": 106067, "epoch": 1277} {"train_loss": -22.107486724853516, "global_step": 106068, "epoch": 1277} {"train_loss": -21.89425277709961, "global_step": 106069, "epoch": 1277} {"train_loss": -21.95476531982422, "global_step": 106070, "epoch": 1277} {"train_loss": -22.439464569091797, "global_step": 106071, "epoch": 1277} {"train_loss": -21.8475341796875, "global_step": 106072, "epoch": 1277} {"train_loss": -22.083166857799853, "global_step": 106073, "epoch": 1277, "val_loss": 6250017.0} {"train_loss": -21.672121047973633, "global_step": 106074, "epoch": 1278} {"train_loss": -21.423507690429688, "global_step": 106075, "epoch": 1278} {"train_loss": -21.379657745361328, "global_step": 106076, "epoch": 1278} {"train_loss": -21.269575119018555, "global_step": 106077, "epoch": 1278} {"train_loss": -21.892715454101562, "global_step": 106078, "epoch": 1278} {"train_loss": -21.46420669555664, "global_step": 106079, "epoch": 1278} {"train_loss": -21.839420318603516, "global_step": 106080, "epoch": 1278} {"train_loss": -21.18536376953125, "global_step": 106081, "epoch": 1278} {"train_loss": -21.63671112060547, "global_step": 106082, "epoch": 1278} {"train_loss": -21.823049545288086, "global_step": 106083, "epoch": 1278} {"train_loss": -22.017724990844727, "global_step": 106084, "epoch": 1278} {"train_loss": -21.774396896362305, "global_step": 106085, "epoch": 1278} {"train_loss": -22.223005294799805, "global_step": 106086, "epoch": 1278} {"train_loss": -21.479633331298828, "global_step": 106087, "epoch": 1278} {"train_loss": -21.81733512878418, "global_step": 106088, "epoch": 1278} {"train_loss": -21.83590316772461, "global_step": 106089, "epoch": 1278} {"train_loss": -22.059804916381836, "global_step": 106090, "epoch": 1278} {"train_loss": -22.009258270263672, "global_step": 106091, "epoch": 1278} {"train_loss": -21.69083595275879, "global_step": 106092, "epoch": 1278} {"train_loss": -22.248016357421875, "global_step": 106093, "epoch": 1278} {"train_loss": -21.89761734008789, "global_step": 106094, "epoch": 1278} {"train_loss": -22.03590202331543, "global_step": 106095, "epoch": 1278} {"train_loss": -21.844491958618164, "global_step": 106096, "epoch": 1278} {"train_loss": -22.129241943359375, "global_step": 106097, "epoch": 1278} {"train_loss": -22.31572914123535, "global_step": 106098, "epoch": 1278} {"train_loss": -22.01885986328125, "global_step": 106099, "epoch": 1278} {"train_loss": -22.018325805664062, "global_step": 106100, "epoch": 1278} {"train_loss": -22.035350799560547, "global_step": 106101, "epoch": 1278} {"train_loss": -22.369338989257812, "global_step": 106102, "epoch": 1278} {"train_loss": -21.91583824157715, "global_step": 106103, "epoch": 1278} {"train_loss": -22.032201766967773, "global_step": 106104, "epoch": 1278} {"train_loss": -22.059925079345703, "global_step": 106105, "epoch": 1278} {"train_loss": -22.431257247924805, "global_step": 106106, "epoch": 1278} {"train_loss": -22.142004013061523, "global_step": 106107, "epoch": 1278} {"train_loss": -22.306360244750977, "global_step": 106108, "epoch": 1278} {"train_loss": -22.34910011291504, "global_step": 106109, "epoch": 1278} {"train_loss": -22.127979278564453, "global_step": 106110, "epoch": 1278} {"train_loss": -22.205230712890625, "global_step": 106111, "epoch": 1278} {"train_loss": -22.028549194335938, "global_step": 106112, "epoch": 1278} {"train_loss": -22.02809715270996, "global_step": 106113, "epoch": 1278} {"train_loss": -22.152555465698242, "global_step": 106114, "epoch": 1278} {"train_loss": -22.19312858581543, "global_step": 106115, "epoch": 1278} {"train_loss": -22.088403701782227, "global_step": 106116, "epoch": 1278} {"train_loss": -22.33586311340332, "global_step": 106117, "epoch": 1278} {"train_loss": -21.915502548217773, "global_step": 106118, "epoch": 1278} {"train_loss": -22.02788543701172, "global_step": 106119, "epoch": 1278} {"train_loss": -22.154468536376953, "global_step": 106120, "epoch": 1278} {"train_loss": -22.436756134033203, "global_step": 106121, "epoch": 1278} {"train_loss": -21.66206932067871, "global_step": 106122, "epoch": 1278} {"train_loss": -22.03885269165039, "global_step": 106123, "epoch": 1278} {"train_loss": -22.276792526245117, "global_step": 106124, "epoch": 1278} {"train_loss": -21.881811141967773, "global_step": 106125, "epoch": 1278} {"train_loss": -22.443225860595703, "global_step": 106126, "epoch": 1278} {"train_loss": -22.260557174682617, "global_step": 106127, "epoch": 1278} {"train_loss": -22.19624900817871, "global_step": 106128, "epoch": 1278} {"train_loss": -21.878530502319336, "global_step": 106129, "epoch": 1278} {"train_loss": -22.226900100708008, "global_step": 106130, "epoch": 1278} {"train_loss": -22.25211524963379, "global_step": 106131, "epoch": 1278} {"train_loss": -22.04266929626465, "global_step": 106132, "epoch": 1278} {"train_loss": -22.223777770996094, "global_step": 106133, "epoch": 1278} {"train_loss": -22.041929244995117, "global_step": 106134, "epoch": 1278} {"train_loss": -21.884756088256836, "global_step": 106135, "epoch": 1278} {"train_loss": -22.0191650390625, "global_step": 106136, "epoch": 1278} {"train_loss": -22.052053451538086, "global_step": 106137, "epoch": 1278} {"train_loss": -22.016653060913086, "global_step": 106138, "epoch": 1278} {"train_loss": -22.200252532958984, "global_step": 106139, "epoch": 1278} {"train_loss": -22.07464599609375, "global_step": 106140, "epoch": 1278} {"train_loss": -22.27728843688965, "global_step": 106141, "epoch": 1278} {"train_loss": -22.072851181030273, "global_step": 106142, "epoch": 1278} {"train_loss": -21.769977569580078, "global_step": 106143, "epoch": 1278} {"train_loss": -22.003877639770508, "global_step": 106144, "epoch": 1278} {"train_loss": -22.309478759765625, "global_step": 106145, "epoch": 1278} {"train_loss": -22.128524780273438, "global_step": 106146, "epoch": 1278} {"train_loss": -22.216970443725586, "global_step": 106147, "epoch": 1278} {"train_loss": -22.07505989074707, "global_step": 106148, "epoch": 1278} {"train_loss": -21.909902572631836, "global_step": 106149, "epoch": 1278} {"train_loss": -22.26612663269043, "global_step": 106150, "epoch": 1278} {"train_loss": -22.078142166137695, "global_step": 106151, "epoch": 1278} {"train_loss": -22.5600643157959, "global_step": 106152, "epoch": 1278} {"train_loss": -22.033554077148438, "global_step": 106153, "epoch": 1278} {"train_loss": -22.01266860961914, "global_step": 106154, "epoch": 1278} {"train_loss": -22.151430130004883, "global_step": 106155, "epoch": 1278} {"train_loss": -22.01326864311494, "global_step": 106156, "epoch": 1278, "val_loss": 6257951.0} {"train_loss": -21.683250427246094, "global_step": 106157, "epoch": 1279} {"train_loss": -21.287353515625, "global_step": 106158, "epoch": 1279} {"train_loss": -21.5433406829834, "global_step": 106159, "epoch": 1279} {"train_loss": -21.973087310791016, "global_step": 106160, "epoch": 1279} {"train_loss": -21.820083618164062, "global_step": 106161, "epoch": 1279} {"train_loss": -21.81379508972168, "global_step": 106162, "epoch": 1279} {"train_loss": -21.95193862915039, "global_step": 106163, "epoch": 1279} {"train_loss": -21.86459732055664, "global_step": 106164, "epoch": 1279} {"train_loss": -22.08758544921875, "global_step": 106165, "epoch": 1279} {"train_loss": -21.76370620727539, "global_step": 106166, "epoch": 1279} {"train_loss": -21.729583740234375, "global_step": 106167, "epoch": 1279} {"train_loss": -22.012609481811523, "global_step": 106168, "epoch": 1279} {"train_loss": -21.91860580444336, "global_step": 106169, "epoch": 1279} {"train_loss": -22.1370849609375, "global_step": 106170, "epoch": 1279} {"train_loss": -21.936655044555664, "global_step": 106171, "epoch": 1279} {"train_loss": -22.10972023010254, "global_step": 106172, "epoch": 1279} {"train_loss": -21.981897354125977, "global_step": 106173, "epoch": 1279} {"train_loss": -22.31911277770996, "global_step": 106174, "epoch": 1279} {"train_loss": -22.01430320739746, "global_step": 106175, "epoch": 1279} {"train_loss": -22.031349182128906, "global_step": 106176, "epoch": 1279} {"train_loss": -22.332387924194336, "global_step": 106177, "epoch": 1279} {"train_loss": -22.206907272338867, "global_step": 106178, "epoch": 1279} {"train_loss": -22.298248291015625, "global_step": 106179, "epoch": 1279} {"train_loss": -22.32659339904785, "global_step": 106180, "epoch": 1279} {"train_loss": -22.108121871948242, "global_step": 106181, "epoch": 1279} {"train_loss": -22.086233139038086, "global_step": 106182, "epoch": 1279} {"train_loss": -22.145299911499023, "global_step": 106183, "epoch": 1279} {"train_loss": -22.138412475585938, "global_step": 106184, "epoch": 1279} {"train_loss": -22.22639274597168, "global_step": 106185, "epoch": 1279} {"train_loss": -22.23990249633789, "global_step": 106186, "epoch": 1279} {"train_loss": -21.910993576049805, "global_step": 106187, "epoch": 1279} {"train_loss": -21.97345542907715, "global_step": 106188, "epoch": 1279} {"train_loss": -22.115413665771484, "global_step": 106189, "epoch": 1279} {"train_loss": -21.6370849609375, "global_step": 106190, "epoch": 1279} {"train_loss": -22.507360458374023, "global_step": 106191, "epoch": 1279} {"train_loss": -22.078935623168945, "global_step": 106192, "epoch": 1279} {"train_loss": -22.301956176757812, "global_step": 106193, "epoch": 1279} {"train_loss": -22.379072189331055, "global_step": 106194, "epoch": 1279} {"train_loss": -22.169445037841797, "global_step": 106195, "epoch": 1279} {"train_loss": -21.8902645111084, "global_step": 106196, "epoch": 1279} {"train_loss": -22.175615310668945, "global_step": 106197, "epoch": 1279} {"train_loss": -21.75043487548828, "global_step": 106198, "epoch": 1279} {"train_loss": -21.625158309936523, "global_step": 106199, "epoch": 1279} {"train_loss": -22.26851463317871, "global_step": 106200, "epoch": 1279} {"train_loss": -22.06717300415039, "global_step": 106201, "epoch": 1279} {"train_loss": -22.03409767150879, "global_step": 106202, "epoch": 1279} {"train_loss": -21.801420211791992, "global_step": 106203, "epoch": 1279} {"train_loss": -21.992612838745117, "global_step": 106204, "epoch": 1279} {"train_loss": -21.502574920654297, "global_step": 106205, "epoch": 1279} {"train_loss": -22.092878341674805, "global_step": 106206, "epoch": 1279} {"train_loss": -21.63632583618164, "global_step": 106207, "epoch": 1279} {"train_loss": -22.08163070678711, "global_step": 106208, "epoch": 1279} {"train_loss": -22.005096435546875, "global_step": 106209, "epoch": 1279} {"train_loss": -21.564640045166016, "global_step": 106210, "epoch": 1279} {"train_loss": -21.911907196044922, "global_step": 106211, "epoch": 1279} {"train_loss": -21.976083755493164, "global_step": 106212, "epoch": 1279} {"train_loss": -22.24380874633789, "global_step": 106213, "epoch": 1279} {"train_loss": -22.06107521057129, "global_step": 106214, "epoch": 1279} {"train_loss": -22.29903221130371, "global_step": 106215, "epoch": 1279} {"train_loss": -21.982585906982422, "global_step": 106216, "epoch": 1279} {"train_loss": -21.760498046875, "global_step": 106217, "epoch": 1279} {"train_loss": -22.199810028076172, "global_step": 106218, "epoch": 1279} {"train_loss": -21.991546630859375, "global_step": 106219, "epoch": 1279} {"train_loss": -21.764678955078125, "global_step": 106220, "epoch": 1279} {"train_loss": -22.45343589782715, "global_step": 106221, "epoch": 1279} {"train_loss": -22.275632858276367, "global_step": 106222, "epoch": 1279} {"train_loss": -21.77423667907715, "global_step": 106223, "epoch": 1279} {"train_loss": -22.09905242919922, "global_step": 106224, "epoch": 1279} {"train_loss": -21.698354721069336, "global_step": 106225, "epoch": 1279} {"train_loss": -22.202411651611328, "global_step": 106226, "epoch": 1279} {"train_loss": -22.219928741455078, "global_step": 106227, "epoch": 1279} {"train_loss": -22.217824935913086, "global_step": 106228, "epoch": 1279} {"train_loss": -21.89448356628418, "global_step": 106229, "epoch": 1279} {"train_loss": -21.92911720275879, "global_step": 106230, "epoch": 1279} {"train_loss": -22.455183029174805, "global_step": 106231, "epoch": 1279} {"train_loss": -22.2202205657959, "global_step": 106232, "epoch": 1279} {"train_loss": -22.01841163635254, "global_step": 106233, "epoch": 1279} {"train_loss": -21.715917587280273, "global_step": 106234, "epoch": 1279} {"train_loss": -22.128019332885742, "global_step": 106235, "epoch": 1279} {"train_loss": -22.042991638183594, "global_step": 106236, "epoch": 1279} {"train_loss": -22.080703735351562, "global_step": 106237, "epoch": 1279} {"train_loss": -21.93946647644043, "global_step": 106238, "epoch": 1279} {"train_loss": -22.011026819068267, "global_step": 106239, "epoch": 1279, "val_loss": 6180253.0} {"train_loss": -21.856298446655273, "global_step": 106240, "epoch": 1280} {"train_loss": -22.26124382019043, "global_step": 106241, "epoch": 1280} {"train_loss": -22.10788917541504, "global_step": 106242, "epoch": 1280} {"train_loss": -21.949064254760742, "global_step": 106243, "epoch": 1280} {"train_loss": -21.968576431274414, "global_step": 106244, "epoch": 1280} {"train_loss": -21.966970443725586, "global_step": 106245, "epoch": 1280} {"train_loss": -22.317981719970703, "global_step": 106246, "epoch": 1280} {"train_loss": -22.04561424255371, "global_step": 106247, "epoch": 1280} {"train_loss": -21.986328125, "global_step": 106248, "epoch": 1280} {"train_loss": -22.431425094604492, "global_step": 106249, "epoch": 1280} {"train_loss": -22.01495933532715, "global_step": 106250, "epoch": 1280} {"train_loss": -21.82423973083496, "global_step": 106251, "epoch": 1280} {"train_loss": -22.06549644470215, "global_step": 106252, "epoch": 1280} {"train_loss": -22.22300148010254, "global_step": 106253, "epoch": 1280} {"train_loss": -22.01222038269043, "global_step": 106254, "epoch": 1280} {"train_loss": -21.935047149658203, "global_step": 106255, "epoch": 1280} {"train_loss": -21.762954711914062, "global_step": 106256, "epoch": 1280} {"train_loss": -22.070077896118164, "global_step": 106257, "epoch": 1280} {"train_loss": -21.8436336517334, "global_step": 106258, "epoch": 1280} {"train_loss": -22.191694259643555, "global_step": 106259, "epoch": 1280} {"train_loss": -21.895498275756836, "global_step": 106260, "epoch": 1280} {"train_loss": -21.67641258239746, "global_step": 106261, "epoch": 1280} {"train_loss": -22.128990173339844, "global_step": 106262, "epoch": 1280} {"train_loss": -21.929922103881836, "global_step": 106263, "epoch": 1280} {"train_loss": -22.187284469604492, "global_step": 106264, "epoch": 1280} {"train_loss": -22.264841079711914, "global_step": 106265, "epoch": 1280} {"train_loss": -22.01283836364746, "global_step": 106266, "epoch": 1280} {"train_loss": -22.048551559448242, "global_step": 106267, "epoch": 1280} {"train_loss": -22.196130752563477, "global_step": 106268, "epoch": 1280} {"train_loss": -22.07220458984375, "global_step": 106269, "epoch": 1280} {"train_loss": -22.300168991088867, "global_step": 106270, "epoch": 1280} {"train_loss": -22.116071701049805, "global_step": 106271, "epoch": 1280} {"train_loss": -21.92534828186035, "global_step": 106272, "epoch": 1280} {"train_loss": -22.16552734375, "global_step": 106273, "epoch": 1280} {"train_loss": -21.970949172973633, "global_step": 106274, "epoch": 1280} {"train_loss": -22.252111434936523, "global_step": 106275, "epoch": 1280} {"train_loss": -22.128036499023438, "global_step": 106276, "epoch": 1280} {"train_loss": -22.41312599182129, "global_step": 106277, "epoch": 1280} {"train_loss": -21.697790145874023, "global_step": 106278, "epoch": 1280} {"train_loss": -22.21581268310547, "global_step": 106279, "epoch": 1280} {"train_loss": -21.970136642456055, "global_step": 106280, "epoch": 1280} {"train_loss": -22.2963809967041, "global_step": 106281, "epoch": 1280} {"train_loss": -22.047361373901367, "global_step": 106282, "epoch": 1280} {"train_loss": -22.29656982421875, "global_step": 106283, "epoch": 1280} {"train_loss": -22.182743072509766, "global_step": 106284, "epoch": 1280} {"train_loss": -22.271636962890625, "global_step": 106285, "epoch": 1280} {"train_loss": -21.939537048339844, "global_step": 106286, "epoch": 1280} {"train_loss": -22.34482192993164, "global_step": 106287, "epoch": 1280} {"train_loss": -21.825714111328125, "global_step": 106288, "epoch": 1280} {"train_loss": -22.371416091918945, "global_step": 106289, "epoch": 1280} {"train_loss": -22.398523330688477, "global_step": 106290, "epoch": 1280} {"train_loss": -22.252004623413086, "global_step": 106291, "epoch": 1280} {"train_loss": -21.471853256225586, "global_step": 106292, "epoch": 1280} {"train_loss": -22.149030685424805, "global_step": 106293, "epoch": 1280} {"train_loss": -22.070659637451172, "global_step": 106294, "epoch": 1280} {"train_loss": -22.383493423461914, "global_step": 106295, "epoch": 1280} {"train_loss": -22.129087448120117, "global_step": 106296, "epoch": 1280} {"train_loss": -22.406539916992188, "global_step": 106297, "epoch": 1280} {"train_loss": -22.734424591064453, "global_step": 106298, "epoch": 1280} {"train_loss": -22.135929107666016, "global_step": 106299, "epoch": 1280} {"train_loss": -22.05368995666504, "global_step": 106300, "epoch": 1280} {"train_loss": -22.59453582763672, "global_step": 106301, "epoch": 1280} {"train_loss": -22.255279541015625, "global_step": 106302, "epoch": 1280} {"train_loss": -22.15696907043457, "global_step": 106303, "epoch": 1280} {"train_loss": -22.146718978881836, "global_step": 106304, "epoch": 1280} {"train_loss": -22.492746353149414, "global_step": 106305, "epoch": 1280} {"train_loss": -22.22426986694336, "global_step": 106306, "epoch": 1280} {"train_loss": -21.912189483642578, "global_step": 106307, "epoch": 1280} {"train_loss": -22.210447311401367, "global_step": 106308, "epoch": 1280} {"train_loss": -22.225004196166992, "global_step": 106309, "epoch": 1280} {"train_loss": -22.33363151550293, "global_step": 106310, "epoch": 1280} {"train_loss": -22.090444564819336, "global_step": 106311, "epoch": 1280} {"train_loss": -21.958847045898438, "global_step": 106312, "epoch": 1280} {"train_loss": -22.27862548828125, "global_step": 106313, "epoch": 1280} {"train_loss": -22.34639549255371, "global_step": 106314, "epoch": 1280} {"train_loss": -22.09043312072754, "global_step": 106315, "epoch": 1280} {"train_loss": -22.051952362060547, "global_step": 106316, "epoch": 1280} {"train_loss": -22.812650680541992, "global_step": 106317, "epoch": 1280} {"train_loss": -22.0588321685791, "global_step": 106318, "epoch": 1280} {"train_loss": -22.377639770507812, "global_step": 106319, "epoch": 1280} {"train_loss": -21.946094512939453, "global_step": 106320, "epoch": 1280} {"train_loss": -22.154207229614258, "global_step": 106321, "epoch": 1280} {"train_loss": -22.10058205386242, "global_step": 106322, "epoch": 1280, "val_loss": 6204022.0} {"train_loss": -22.184274673461914, "global_step": 106323, "epoch": 1281} {"train_loss": -21.95599937438965, "global_step": 106324, "epoch": 1281} {"train_loss": -21.994855880737305, "global_step": 106325, "epoch": 1281} {"train_loss": -21.869600296020508, "global_step": 106326, "epoch": 1281} {"train_loss": -22.165861129760742, "global_step": 106327, "epoch": 1281} {"train_loss": -22.024946212768555, "global_step": 106328, "epoch": 1281} {"train_loss": -22.183042526245117, "global_step": 106329, "epoch": 1281} {"train_loss": -22.138090133666992, "global_step": 106330, "epoch": 1281} {"train_loss": -22.169631958007812, "global_step": 106331, "epoch": 1281} {"train_loss": -21.649616241455078, "global_step": 106332, "epoch": 1281} {"train_loss": -22.08479118347168, "global_step": 106333, "epoch": 1281} {"train_loss": -22.182693481445312, "global_step": 106334, "epoch": 1281} {"train_loss": -22.230100631713867, "global_step": 106335, "epoch": 1281} {"train_loss": -22.1433048248291, "global_step": 106336, "epoch": 1281} {"train_loss": -21.83397102355957, "global_step": 106337, "epoch": 1281} {"train_loss": -22.25058364868164, "global_step": 106338, "epoch": 1281} {"train_loss": -22.15308952331543, "global_step": 106339, "epoch": 1281} {"train_loss": -21.996692657470703, "global_step": 106340, "epoch": 1281} {"train_loss": -22.203659057617188, "global_step": 106341, "epoch": 1281} {"train_loss": -22.28986930847168, "global_step": 106342, "epoch": 1281} {"train_loss": -22.182409286499023, "global_step": 106343, "epoch": 1281} {"train_loss": -22.087064743041992, "global_step": 106344, "epoch": 1281} {"train_loss": -21.59055519104004, "global_step": 106345, "epoch": 1281} {"train_loss": -22.06385040283203, "global_step": 106346, "epoch": 1281} {"train_loss": -21.997608184814453, "global_step": 106347, "epoch": 1281} {"train_loss": -21.98615074157715, "global_step": 106348, "epoch": 1281} {"train_loss": -22.47144889831543, "global_step": 106349, "epoch": 1281} {"train_loss": -21.772083282470703, "global_step": 106350, "epoch": 1281} {"train_loss": -22.08335304260254, "global_step": 106351, "epoch": 1281} {"train_loss": -22.0165958404541, "global_step": 106352, "epoch": 1281} {"train_loss": -22.26841163635254, "global_step": 106353, "epoch": 1281} {"train_loss": -22.040258407592773, "global_step": 106354, "epoch": 1281} {"train_loss": -22.447864532470703, "global_step": 106355, "epoch": 1281} {"train_loss": -22.313434600830078, "global_step": 106356, "epoch": 1281} {"train_loss": -22.185335159301758, "global_step": 106357, "epoch": 1281} {"train_loss": -22.131357192993164, "global_step": 106358, "epoch": 1281} {"train_loss": -22.15125846862793, "global_step": 106359, "epoch": 1281} {"train_loss": -22.26418113708496, "global_step": 106360, "epoch": 1281} {"train_loss": -22.113866806030273, "global_step": 106361, "epoch": 1281} {"train_loss": -22.178903579711914, "global_step": 106362, "epoch": 1281} {"train_loss": -22.31711196899414, "global_step": 106363, "epoch": 1281} {"train_loss": -22.078977584838867, "global_step": 106364, "epoch": 1281} {"train_loss": -21.9609432220459, "global_step": 106365, "epoch": 1281} {"train_loss": -22.148099899291992, "global_step": 106366, "epoch": 1281} {"train_loss": -22.389394760131836, "global_step": 106367, "epoch": 1281} {"train_loss": -21.91255760192871, "global_step": 106368, "epoch": 1281} {"train_loss": -22.026119232177734, "global_step": 106369, "epoch": 1281} {"train_loss": -22.178396224975586, "global_step": 106370, "epoch": 1281} {"train_loss": -22.176029205322266, "global_step": 106371, "epoch": 1281} {"train_loss": -22.094533920288086, "global_step": 106372, "epoch": 1281} {"train_loss": -22.239059448242188, "global_step": 106373, "epoch": 1281} {"train_loss": -22.30929946899414, "global_step": 106374, "epoch": 1281} {"train_loss": -22.030826568603516, "global_step": 106375, "epoch": 1281} {"train_loss": -22.182897567749023, "global_step": 106376, "epoch": 1281} {"train_loss": -22.375389099121094, "global_step": 106377, "epoch": 1281} {"train_loss": -22.08902931213379, "global_step": 106378, "epoch": 1281} {"train_loss": -22.070341110229492, "global_step": 106379, "epoch": 1281} {"train_loss": -22.11298370361328, "global_step": 106380, "epoch": 1281} {"train_loss": -21.922698974609375, "global_step": 106381, "epoch": 1281} {"train_loss": -22.218473434448242, "global_step": 106382, "epoch": 1281} {"train_loss": -21.872373580932617, "global_step": 106383, "epoch": 1281} {"train_loss": -22.461034774780273, "global_step": 106384, "epoch": 1281} {"train_loss": -22.173093795776367, "global_step": 106385, "epoch": 1281} {"train_loss": -21.96219253540039, "global_step": 106386, "epoch": 1281} {"train_loss": -21.092763900756836, "global_step": 106387, "epoch": 1281} {"train_loss": -22.00665855407715, "global_step": 106388, "epoch": 1281} {"train_loss": -21.893474578857422, "global_step": 106389, "epoch": 1281} {"train_loss": -22.11030387878418, "global_step": 106390, "epoch": 1281} {"train_loss": -22.058298110961914, "global_step": 106391, "epoch": 1281} {"train_loss": -21.97344970703125, "global_step": 106392, "epoch": 1281} {"train_loss": -22.158676147460938, "global_step": 106393, "epoch": 1281} {"train_loss": -22.13092613220215, "global_step": 106394, "epoch": 1281} {"train_loss": -22.167264938354492, "global_step": 106395, "epoch": 1281} {"train_loss": -22.342248916625977, "global_step": 106396, "epoch": 1281} {"train_loss": -22.160306930541992, "global_step": 106397, "epoch": 1281} {"train_loss": -22.072891235351562, "global_step": 106398, "epoch": 1281} {"train_loss": -22.34751319885254, "global_step": 106399, "epoch": 1281} {"train_loss": -22.135549545288086, "global_step": 106400, "epoch": 1281} {"train_loss": -22.16518211364746, "global_step": 106401, "epoch": 1281} {"train_loss": -22.352203369140625, "global_step": 106402, "epoch": 1281} {"train_loss": -21.919525146484375, "global_step": 106403, "epoch": 1281} {"train_loss": -22.165761947631836, "global_step": 106404, "epoch": 1281} {"train_loss": -22.113560205482575, "global_step": 106405, "epoch": 1281, "val_loss": 6166187.5} {"train_loss": -22.18922996520996, "global_step": 106406, "epoch": 1282} {"train_loss": -21.80103874206543, "global_step": 106407, "epoch": 1282} {"train_loss": -22.061187744140625, "global_step": 106408, "epoch": 1282} {"train_loss": -22.36542510986328, "global_step": 106409, "epoch": 1282} {"train_loss": -22.333383560180664, "global_step": 106410, "epoch": 1282} {"train_loss": -22.392288208007812, "global_step": 106411, "epoch": 1282} {"train_loss": -22.094167709350586, "global_step": 106412, "epoch": 1282} {"train_loss": -22.262752532958984, "global_step": 106413, "epoch": 1282} {"train_loss": -22.394567489624023, "global_step": 106414, "epoch": 1282} {"train_loss": -22.139387130737305, "global_step": 106415, "epoch": 1282} {"train_loss": -22.013208389282227, "global_step": 106416, "epoch": 1282} {"train_loss": -22.201671600341797, "global_step": 106417, "epoch": 1282} {"train_loss": -22.203716278076172, "global_step": 106418, "epoch": 1282} {"train_loss": -22.009572982788086, "global_step": 106419, "epoch": 1282} {"train_loss": -21.332433700561523, "global_step": 106420, "epoch": 1282} {"train_loss": -21.98933982849121, "global_step": 106421, "epoch": 1282} {"train_loss": -22.18276596069336, "global_step": 106422, "epoch": 1282} {"train_loss": -22.271400451660156, "global_step": 106423, "epoch": 1282} {"train_loss": -21.94382667541504, "global_step": 106424, "epoch": 1282} {"train_loss": -22.39318084716797, "global_step": 106425, "epoch": 1282} {"train_loss": -22.13642692565918, "global_step": 106426, "epoch": 1282} {"train_loss": -21.83955192565918, "global_step": 106427, "epoch": 1282} {"train_loss": -21.903427124023438, "global_step": 106428, "epoch": 1282} {"train_loss": -21.973176956176758, "global_step": 106429, "epoch": 1282} {"train_loss": -22.231061935424805, "global_step": 106430, "epoch": 1282} {"train_loss": -22.188793182373047, "global_step": 106431, "epoch": 1282} {"train_loss": -22.287372589111328, "global_step": 106432, "epoch": 1282} {"train_loss": -21.972793579101562, "global_step": 106433, "epoch": 1282} {"train_loss": -22.098602294921875, "global_step": 106434, "epoch": 1282} {"train_loss": -22.18720817565918, "global_step": 106435, "epoch": 1282} {"train_loss": -21.816835403442383, "global_step": 106436, "epoch": 1282} {"train_loss": -21.828994750976562, "global_step": 106437, "epoch": 1282} {"train_loss": -22.13434410095215, "global_step": 106438, "epoch": 1282} {"train_loss": -21.87509536743164, "global_step": 106439, "epoch": 1282} {"train_loss": -22.489553451538086, "global_step": 106440, "epoch": 1282} {"train_loss": -22.138959884643555, "global_step": 106441, "epoch": 1282} {"train_loss": -22.04831886291504, "global_step": 106442, "epoch": 1282} {"train_loss": -22.195539474487305, "global_step": 106443, "epoch": 1282} {"train_loss": -22.18153190612793, "global_step": 106444, "epoch": 1282} {"train_loss": -21.99850845336914, "global_step": 106445, "epoch": 1282} {"train_loss": -21.97321891784668, "global_step": 106446, "epoch": 1282} {"train_loss": -22.297901153564453, "global_step": 106447, "epoch": 1282} {"train_loss": -22.10379409790039, "global_step": 106448, "epoch": 1282} {"train_loss": -22.005069732666016, "global_step": 106449, "epoch": 1282} {"train_loss": -21.863245010375977, "global_step": 106450, "epoch": 1282} {"train_loss": -22.282995223999023, "global_step": 106451, "epoch": 1282} {"train_loss": -22.339841842651367, "global_step": 106452, "epoch": 1282} {"train_loss": -22.00233268737793, "global_step": 106453, "epoch": 1282} {"train_loss": -21.984182357788086, "global_step": 106454, "epoch": 1282} {"train_loss": -21.95631217956543, "global_step": 106455, "epoch": 1282} {"train_loss": -21.923051834106445, "global_step": 106456, "epoch": 1282} {"train_loss": -22.366613388061523, "global_step": 106457, "epoch": 1282} {"train_loss": -22.209775924682617, "global_step": 106458, "epoch": 1282} {"train_loss": -21.77678680419922, "global_step": 106459, "epoch": 1282} {"train_loss": -22.127897262573242, "global_step": 106460, "epoch": 1282} {"train_loss": -21.99423599243164, "global_step": 106461, "epoch": 1282} {"train_loss": -21.94010353088379, "global_step": 106462, "epoch": 1282} {"train_loss": -22.414342880249023, "global_step": 106463, "epoch": 1282} {"train_loss": -22.687646865844727, "global_step": 106464, "epoch": 1282} {"train_loss": -22.09638786315918, "global_step": 106465, "epoch": 1282} {"train_loss": -22.234371185302734, "global_step": 106466, "epoch": 1282} {"train_loss": -22.293067932128906, "global_step": 106467, "epoch": 1282} {"train_loss": -22.246503829956055, "global_step": 106468, "epoch": 1282} {"train_loss": -22.094533920288086, "global_step": 106469, "epoch": 1282} {"train_loss": -22.298076629638672, "global_step": 106470, "epoch": 1282} {"train_loss": -22.486927032470703, "global_step": 106471, "epoch": 1282} {"train_loss": -21.881893157958984, "global_step": 106472, "epoch": 1282} {"train_loss": -21.931394577026367, "global_step": 106473, "epoch": 1282} {"train_loss": -22.464147567749023, "global_step": 106474, "epoch": 1282} {"train_loss": -22.108259201049805, "global_step": 106475, "epoch": 1282} {"train_loss": -22.029401779174805, "global_step": 106476, "epoch": 1282} {"train_loss": -22.212915420532227, "global_step": 106477, "epoch": 1282} {"train_loss": -22.13434410095215, "global_step": 106478, "epoch": 1282} {"train_loss": -22.376426696777344, "global_step": 106479, "epoch": 1282} {"train_loss": -21.990707397460938, "global_step": 106480, "epoch": 1282} {"train_loss": -22.093530654907227, "global_step": 106481, "epoch": 1282} {"train_loss": -22.352529525756836, "global_step": 106482, "epoch": 1282} {"train_loss": -22.001972198486328, "global_step": 106483, "epoch": 1282} {"train_loss": -22.212926864624023, "global_step": 106484, "epoch": 1282} {"train_loss": -22.075803756713867, "global_step": 106485, "epoch": 1282} {"train_loss": -22.188098907470703, "global_step": 106486, "epoch": 1282} {"train_loss": -21.922813415527344, "global_step": 106487, "epoch": 1282} {"train_loss": -22.120998658329608, "global_step": 106488, "epoch": 1282, "val_loss": 6083973.0} {"train_loss": -22.07820701599121, "global_step": 106489, "epoch": 1283} {"train_loss": -21.968975067138672, "global_step": 106490, "epoch": 1283} {"train_loss": -21.933935165405273, "global_step": 106491, "epoch": 1283} {"train_loss": -22.09244728088379, "global_step": 106492, "epoch": 1283} {"train_loss": -22.022991180419922, "global_step": 106493, "epoch": 1283} {"train_loss": -21.65308380126953, "global_step": 106494, "epoch": 1283} {"train_loss": -21.75160026550293, "global_step": 106495, "epoch": 1283} {"train_loss": -22.199703216552734, "global_step": 106496, "epoch": 1283} {"train_loss": -21.747495651245117, "global_step": 106497, "epoch": 1283} {"train_loss": -21.863821029663086, "global_step": 106498, "epoch": 1283} {"train_loss": -22.092439651489258, "global_step": 106499, "epoch": 1283} {"train_loss": -21.791370391845703, "global_step": 106500, "epoch": 1283} {"train_loss": -21.903255462646484, "global_step": 106501, "epoch": 1283} {"train_loss": -22.221464157104492, "global_step": 106502, "epoch": 1283} {"train_loss": -22.33062744140625, "global_step": 106503, "epoch": 1283} {"train_loss": -22.021183013916016, "global_step": 106504, "epoch": 1283} {"train_loss": -21.938465118408203, "global_step": 106505, "epoch": 1283} {"train_loss": -21.87546157836914, "global_step": 106506, "epoch": 1283} {"train_loss": -22.05780601501465, "global_step": 106507, "epoch": 1283} {"train_loss": -21.985326766967773, "global_step": 106508, "epoch": 1283} {"train_loss": -22.24744987487793, "global_step": 106509, "epoch": 1283} {"train_loss": -22.089487075805664, "global_step": 106510, "epoch": 1283} {"train_loss": -22.2515811920166, "global_step": 106511, "epoch": 1283} {"train_loss": -22.312862396240234, "global_step": 106512, "epoch": 1283} {"train_loss": -22.041276931762695, "global_step": 106513, "epoch": 1283} {"train_loss": -21.799671173095703, "global_step": 106514, "epoch": 1283} {"train_loss": -22.08004379272461, "global_step": 106515, "epoch": 1283} {"train_loss": -22.35789680480957, "global_step": 106516, "epoch": 1283} {"train_loss": -22.23155403137207, "global_step": 106517, "epoch": 1283} {"train_loss": -22.293298721313477, "global_step": 106518, "epoch": 1283} {"train_loss": -21.79652214050293, "global_step": 106519, "epoch": 1283} {"train_loss": -22.1942195892334, "global_step": 106520, "epoch": 1283} {"train_loss": -22.065017700195312, "global_step": 106521, "epoch": 1283} {"train_loss": -22.408493041992188, "global_step": 106522, "epoch": 1283} {"train_loss": -22.359607696533203, "global_step": 106523, "epoch": 1283} {"train_loss": -22.346878051757812, "global_step": 106524, "epoch": 1283} {"train_loss": -21.654708862304688, "global_step": 106525, "epoch": 1283} {"train_loss": -22.104093551635742, "global_step": 106526, "epoch": 1283} {"train_loss": -21.6818904876709, "global_step": 106527, "epoch": 1283} {"train_loss": -21.97389030456543, "global_step": 106528, "epoch": 1283} {"train_loss": -22.452438354492188, "global_step": 106529, "epoch": 1283} {"train_loss": -21.84392547607422, "global_step": 106530, "epoch": 1283} {"train_loss": -22.24360466003418, "global_step": 106531, "epoch": 1283} {"train_loss": -22.303747177124023, "global_step": 106532, "epoch": 1283} {"train_loss": -22.416563034057617, "global_step": 106533, "epoch": 1283} {"train_loss": -22.409467697143555, "global_step": 106534, "epoch": 1283} {"train_loss": -22.103469848632812, "global_step": 106535, "epoch": 1283} {"train_loss": -22.203123092651367, "global_step": 106536, "epoch": 1283} {"train_loss": -22.108280181884766, "global_step": 106537, "epoch": 1283} {"train_loss": -22.40212059020996, "global_step": 106538, "epoch": 1283} {"train_loss": -22.388084411621094, "global_step": 106539, "epoch": 1283} {"train_loss": -22.264270782470703, "global_step": 106540, "epoch": 1283} {"train_loss": -21.905681610107422, "global_step": 106541, "epoch": 1283} {"train_loss": -22.209014892578125, "global_step": 106542, "epoch": 1283} {"train_loss": -22.431303024291992, "global_step": 106543, "epoch": 1283} {"train_loss": -22.417251586914062, "global_step": 106544, "epoch": 1283} {"train_loss": -22.414546966552734, "global_step": 106545, "epoch": 1283} {"train_loss": -21.864789962768555, "global_step": 106546, "epoch": 1283} {"train_loss": -22.075300216674805, "global_step": 106547, "epoch": 1283} {"train_loss": -22.088825225830078, "global_step": 106548, "epoch": 1283} {"train_loss": -22.12924575805664, "global_step": 106549, "epoch": 1283} {"train_loss": -22.06535530090332, "global_step": 106550, "epoch": 1283} {"train_loss": -22.163846969604492, "global_step": 106551, "epoch": 1283} {"train_loss": -21.860754013061523, "global_step": 106552, "epoch": 1283} {"train_loss": -22.08367347717285, "global_step": 106553, "epoch": 1283} {"train_loss": -22.195951461791992, "global_step": 106554, "epoch": 1283} {"train_loss": -22.054895401000977, "global_step": 106555, "epoch": 1283} {"train_loss": -21.97174072265625, "global_step": 106556, "epoch": 1283} {"train_loss": -21.888471603393555, "global_step": 106557, "epoch": 1283} {"train_loss": -22.523046493530273, "global_step": 106558, "epoch": 1283} {"train_loss": -22.330055236816406, "global_step": 106559, "epoch": 1283} {"train_loss": -22.666053771972656, "global_step": 106560, "epoch": 1283} {"train_loss": -22.15822410583496, "global_step": 106561, "epoch": 1283} {"train_loss": -22.268651962280273, "global_step": 106562, "epoch": 1283} {"train_loss": -22.5518856048584, "global_step": 106563, "epoch": 1283} {"train_loss": -22.08738899230957, "global_step": 106564, "epoch": 1283} {"train_loss": -22.142492294311523, "global_step": 106565, "epoch": 1283} {"train_loss": -22.189231872558594, "global_step": 106566, "epoch": 1283} {"train_loss": -21.991849899291992, "global_step": 106567, "epoch": 1283} {"train_loss": -22.2053165435791, "global_step": 106568, "epoch": 1283} {"train_loss": -22.141769409179688, "global_step": 106569, "epoch": 1283} {"train_loss": -22.22328758239746, "global_step": 106570, "epoch": 1283} {"train_loss": -22.130766535379802, "global_step": 106571, "epoch": 1283, "val_loss": 6221825.0} {"train_loss": -21.59174346923828, "global_step": 106572, "epoch": 1284} {"train_loss": -21.346817016601562, "global_step": 106573, "epoch": 1284} {"train_loss": -21.878385543823242, "global_step": 106574, "epoch": 1284} {"train_loss": -21.735692977905273, "global_step": 106575, "epoch": 1284} {"train_loss": -21.424619674682617, "global_step": 106576, "epoch": 1284} {"train_loss": -22.195545196533203, "global_step": 106577, "epoch": 1284} {"train_loss": -21.924978256225586, "global_step": 106578, "epoch": 1284} {"train_loss": -21.515117645263672, "global_step": 106579, "epoch": 1284} {"train_loss": -22.102811813354492, "global_step": 106580, "epoch": 1284} {"train_loss": -22.226531982421875, "global_step": 106581, "epoch": 1284} {"train_loss": -22.149038314819336, "global_step": 106582, "epoch": 1284} {"train_loss": -21.58562660217285, "global_step": 106583, "epoch": 1284} {"train_loss": -22.078577041625977, "global_step": 106584, "epoch": 1284} {"train_loss": -21.86005401611328, "global_step": 106585, "epoch": 1284} {"train_loss": -22.00395965576172, "global_step": 106586, "epoch": 1284} {"train_loss": -21.418102264404297, "global_step": 106587, "epoch": 1284} {"train_loss": -21.812902450561523, "global_step": 106588, "epoch": 1284} {"train_loss": -21.730924606323242, "global_step": 106589, "epoch": 1284} {"train_loss": -21.78980827331543, "global_step": 106590, "epoch": 1284} {"train_loss": -22.06875991821289, "global_step": 106591, "epoch": 1284} {"train_loss": -21.766843795776367, "global_step": 106592, "epoch": 1284} {"train_loss": -21.945415496826172, "global_step": 106593, "epoch": 1284} {"train_loss": -21.65175437927246, "global_step": 106594, "epoch": 1284} {"train_loss": -21.956619262695312, "global_step": 106595, "epoch": 1284} {"train_loss": -22.162487030029297, "global_step": 106596, "epoch": 1284} {"train_loss": -22.3686466217041, "global_step": 106597, "epoch": 1284} {"train_loss": -21.899539947509766, "global_step": 106598, "epoch": 1284} {"train_loss": -22.23902702331543, "global_step": 106599, "epoch": 1284} {"train_loss": -22.15492820739746, "global_step": 106600, "epoch": 1284} {"train_loss": -22.238866806030273, "global_step": 106601, "epoch": 1284} {"train_loss": -22.04999542236328, "global_step": 106602, "epoch": 1284} {"train_loss": -22.18963623046875, "global_step": 106603, "epoch": 1284} {"train_loss": -22.551786422729492, "global_step": 106604, "epoch": 1284} {"train_loss": -22.204736709594727, "global_step": 106605, "epoch": 1284} {"train_loss": -22.62094497680664, "global_step": 106606, "epoch": 1284} {"train_loss": -22.143171310424805, "global_step": 106607, "epoch": 1284} {"train_loss": -22.4708309173584, "global_step": 106608, "epoch": 1284} {"train_loss": -22.280715942382812, "global_step": 106609, "epoch": 1284} {"train_loss": -22.241361618041992, "global_step": 106610, "epoch": 1284} {"train_loss": -22.313257217407227, "global_step": 106611, "epoch": 1284} {"train_loss": -22.078760147094727, "global_step": 106612, "epoch": 1284} {"train_loss": -22.293577194213867, "global_step": 106613, "epoch": 1284} {"train_loss": -21.98603630065918, "global_step": 106614, "epoch": 1284} {"train_loss": -22.24747657775879, "global_step": 106615, "epoch": 1284} {"train_loss": -21.837196350097656, "global_step": 106616, "epoch": 1284} {"train_loss": -22.15725326538086, "global_step": 106617, "epoch": 1284} {"train_loss": -21.560945510864258, "global_step": 106618, "epoch": 1284} {"train_loss": -21.93059730529785, "global_step": 106619, "epoch": 1284} {"train_loss": -21.85467529296875, "global_step": 106620, "epoch": 1284} {"train_loss": -21.855859756469727, "global_step": 106621, "epoch": 1284} {"train_loss": -21.675565719604492, "global_step": 106622, "epoch": 1284} {"train_loss": -21.941587448120117, "global_step": 106623, "epoch": 1284} {"train_loss": -21.9829158782959, "global_step": 106624, "epoch": 1284} {"train_loss": -21.9090633392334, "global_step": 106625, "epoch": 1284} {"train_loss": -22.131017684936523, "global_step": 106626, "epoch": 1284} {"train_loss": -22.06717872619629, "global_step": 106627, "epoch": 1284} {"train_loss": -22.053197860717773, "global_step": 106628, "epoch": 1284} {"train_loss": -21.996244430541992, "global_step": 106629, "epoch": 1284} {"train_loss": -22.19312286376953, "global_step": 106630, "epoch": 1284} {"train_loss": -21.9158992767334, "global_step": 106631, "epoch": 1284} {"train_loss": -21.947050094604492, "global_step": 106632, "epoch": 1284} {"train_loss": -21.84558868408203, "global_step": 106633, "epoch": 1284} {"train_loss": -21.958433151245117, "global_step": 106634, "epoch": 1284} {"train_loss": -22.255041122436523, "global_step": 106635, "epoch": 1284} {"train_loss": -22.33145523071289, "global_step": 106636, "epoch": 1284} {"train_loss": -22.258071899414062, "global_step": 106637, "epoch": 1284} {"train_loss": -21.89231300354004, "global_step": 106638, "epoch": 1284} {"train_loss": -22.170429229736328, "global_step": 106639, "epoch": 1284} {"train_loss": -22.296598434448242, "global_step": 106640, "epoch": 1284} {"train_loss": -22.11348533630371, "global_step": 106641, "epoch": 1284} {"train_loss": -22.296504974365234, "global_step": 106642, "epoch": 1284} {"train_loss": -22.248929977416992, "global_step": 106643, "epoch": 1284} {"train_loss": -21.943090438842773, "global_step": 106644, "epoch": 1284} {"train_loss": -21.99966812133789, "global_step": 106645, "epoch": 1284} {"train_loss": -22.38467788696289, "global_step": 106646, "epoch": 1284} {"train_loss": -22.13680076599121, "global_step": 106647, "epoch": 1284} {"train_loss": -22.18461799621582, "global_step": 106648, "epoch": 1284} {"train_loss": -22.58881950378418, "global_step": 106649, "epoch": 1284} {"train_loss": -21.91318130493164, "global_step": 106650, "epoch": 1284} {"train_loss": -22.047508239746094, "global_step": 106651, "epoch": 1284} {"train_loss": -22.36480140686035, "global_step": 106652, "epoch": 1284} {"train_loss": -22.059667587280273, "global_step": 106653, "epoch": 1284} {"train_loss": -22.01338039536074, "global_step": 106654, "epoch": 1284, "val_loss": 6144162.0} {"train_loss": -21.54853630065918, "global_step": 106655, "epoch": 1285} {"train_loss": -21.587596893310547, "global_step": 106656, "epoch": 1285} {"train_loss": -21.966724395751953, "global_step": 106657, "epoch": 1285} {"train_loss": -21.92119598388672, "global_step": 106658, "epoch": 1285} {"train_loss": -21.520200729370117, "global_step": 106659, "epoch": 1285} {"train_loss": -22.294265747070312, "global_step": 106660, "epoch": 1285} {"train_loss": -21.784521102905273, "global_step": 106661, "epoch": 1285} {"train_loss": -21.956815719604492, "global_step": 106662, "epoch": 1285} {"train_loss": -22.077707290649414, "global_step": 106663, "epoch": 1285} {"train_loss": -22.106107711791992, "global_step": 106664, "epoch": 1285} {"train_loss": -21.9858341217041, "global_step": 106665, "epoch": 1285} {"train_loss": -21.89111328125, "global_step": 106666, "epoch": 1285} {"train_loss": -21.972293853759766, "global_step": 106667, "epoch": 1285} {"train_loss": -22.030710220336914, "global_step": 106668, "epoch": 1285} {"train_loss": -21.828832626342773, "global_step": 106669, "epoch": 1285} {"train_loss": -22.02172088623047, "global_step": 106670, "epoch": 1285} {"train_loss": -21.982769012451172, "global_step": 106671, "epoch": 1285} {"train_loss": -21.892263412475586, "global_step": 106672, "epoch": 1285} {"train_loss": -22.245132446289062, "global_step": 106673, "epoch": 1285} {"train_loss": -22.60345458984375, "global_step": 106674, "epoch": 1285} {"train_loss": -21.97763442993164, "global_step": 106675, "epoch": 1285} {"train_loss": -22.154083251953125, "global_step": 106676, "epoch": 1285} {"train_loss": -22.12259292602539, "global_step": 106677, "epoch": 1285} {"train_loss": -22.18404197692871, "global_step": 106678, "epoch": 1285} {"train_loss": -22.10629653930664, "global_step": 106679, "epoch": 1285} {"train_loss": -22.12396812438965, "global_step": 106680, "epoch": 1285} {"train_loss": -22.04279136657715, "global_step": 106681, "epoch": 1285} {"train_loss": -22.190237045288086, "global_step": 106682, "epoch": 1285} {"train_loss": -22.1075439453125, "global_step": 106683, "epoch": 1285} {"train_loss": -22.043989181518555, "global_step": 106684, "epoch": 1285} {"train_loss": -22.006383895874023, "global_step": 106685, "epoch": 1285} {"train_loss": -21.84332847595215, "global_step": 106686, "epoch": 1285} {"train_loss": -21.945945739746094, "global_step": 106687, "epoch": 1285} {"train_loss": -21.888004302978516, "global_step": 106688, "epoch": 1285} {"train_loss": -22.383121490478516, "global_step": 106689, "epoch": 1285} {"train_loss": -21.848127365112305, "global_step": 106690, "epoch": 1285} {"train_loss": -21.961624145507812, "global_step": 106691, "epoch": 1285} {"train_loss": -22.459009170532227, "global_step": 106692, "epoch": 1285} {"train_loss": -22.371191024780273, "global_step": 106693, "epoch": 1285} {"train_loss": -22.319189071655273, "global_step": 106694, "epoch": 1285} {"train_loss": -22.216970443725586, "global_step": 106695, "epoch": 1285} {"train_loss": -22.40403175354004, "global_step": 106696, "epoch": 1285} {"train_loss": -22.02115249633789, "global_step": 106697, "epoch": 1285} {"train_loss": -22.399328231811523, "global_step": 106698, "epoch": 1285} {"train_loss": -22.36408805847168, "global_step": 106699, "epoch": 1285} {"train_loss": -22.28079605102539, "global_step": 106700, "epoch": 1285} {"train_loss": -21.858951568603516, "global_step": 106701, "epoch": 1285} {"train_loss": -21.91866111755371, "global_step": 106702, "epoch": 1285} {"train_loss": -22.204137802124023, "global_step": 106703, "epoch": 1285} {"train_loss": -22.140546798706055, "global_step": 106704, "epoch": 1285} {"train_loss": -21.578577041625977, "global_step": 106705, "epoch": 1285} {"train_loss": -21.890243530273438, "global_step": 106706, "epoch": 1285} {"train_loss": -22.307193756103516, "global_step": 106707, "epoch": 1285} {"train_loss": -22.507970809936523, "global_step": 106708, "epoch": 1285} {"train_loss": -22.22014808654785, "global_step": 106709, "epoch": 1285} {"train_loss": -22.044231414794922, "global_step": 106710, "epoch": 1285} {"train_loss": -22.075178146362305, "global_step": 106711, "epoch": 1285} {"train_loss": -21.93305015563965, "global_step": 106712, "epoch": 1285} {"train_loss": -21.86014747619629, "global_step": 106713, "epoch": 1285} {"train_loss": -22.24264144897461, "global_step": 106714, "epoch": 1285} {"train_loss": -22.1759033203125, "global_step": 106715, "epoch": 1285} {"train_loss": -22.165246963500977, "global_step": 106716, "epoch": 1285} {"train_loss": -22.313840866088867, "global_step": 106717, "epoch": 1285} {"train_loss": -22.093400955200195, "global_step": 106718, "epoch": 1285} {"train_loss": -22.301929473876953, "global_step": 106719, "epoch": 1285} {"train_loss": -22.331464767456055, "global_step": 106720, "epoch": 1285} {"train_loss": -22.158206939697266, "global_step": 106721, "epoch": 1285} {"train_loss": -22.086246490478516, "global_step": 106722, "epoch": 1285} {"train_loss": -22.306488037109375, "global_step": 106723, "epoch": 1285} {"train_loss": -22.040571212768555, "global_step": 106724, "epoch": 1285} {"train_loss": -22.389799118041992, "global_step": 106725, "epoch": 1285} {"train_loss": -22.16000747680664, "global_step": 106726, "epoch": 1285} {"train_loss": -22.50650978088379, "global_step": 106727, "epoch": 1285} {"train_loss": -22.236656188964844, "global_step": 106728, "epoch": 1285} {"train_loss": -22.565078735351562, "global_step": 106729, "epoch": 1285} {"train_loss": -22.3575439453125, "global_step": 106730, "epoch": 1285} {"train_loss": -22.321897506713867, "global_step": 106731, "epoch": 1285} {"train_loss": -21.955198287963867, "global_step": 106732, "epoch": 1285} {"train_loss": -21.925708770751953, "global_step": 106733, "epoch": 1285} {"train_loss": -22.096332550048828, "global_step": 106734, "epoch": 1285} {"train_loss": -22.045194625854492, "global_step": 106735, "epoch": 1285} {"train_loss": -22.366073608398438, "global_step": 106736, "epoch": 1285} {"train_loss": -22.097001592796968, "global_step": 106737, "epoch": 1285, "val_loss": 6229842.5} {"train_loss": -21.11237907409668, "global_step": 106738, "epoch": 1286} {"train_loss": -21.809499740600586, "global_step": 106739, "epoch": 1286} {"train_loss": -21.48770523071289, "global_step": 106740, "epoch": 1286} {"train_loss": -21.406936645507812, "global_step": 106741, "epoch": 1286} {"train_loss": -21.748064041137695, "global_step": 106742, "epoch": 1286} {"train_loss": -21.70961570739746, "global_step": 106743, "epoch": 1286} {"train_loss": -21.613773345947266, "global_step": 106744, "epoch": 1286} {"train_loss": -21.920175552368164, "global_step": 106745, "epoch": 1286} {"train_loss": -21.366363525390625, "global_step": 106746, "epoch": 1286} {"train_loss": -21.849294662475586, "global_step": 106747, "epoch": 1286} {"train_loss": -21.661727905273438, "global_step": 106748, "epoch": 1286} {"train_loss": -22.0483455657959, "global_step": 106749, "epoch": 1286} {"train_loss": -21.85749053955078, "global_step": 106750, "epoch": 1286} {"train_loss": -21.490877151489258, "global_step": 106751, "epoch": 1286} {"train_loss": -21.83087730407715, "global_step": 106752, "epoch": 1286} {"train_loss": -22.322460174560547, "global_step": 106753, "epoch": 1286} {"train_loss": -21.856313705444336, "global_step": 106754, "epoch": 1286} {"train_loss": -22.003660202026367, "global_step": 106755, "epoch": 1286} {"train_loss": -21.585599899291992, "global_step": 106756, "epoch": 1286} {"train_loss": -21.71239471435547, "global_step": 106757, "epoch": 1286} {"train_loss": -21.683141708374023, "global_step": 106758, "epoch": 1286} {"train_loss": -21.829355239868164, "global_step": 106759, "epoch": 1286} {"train_loss": -21.795766830444336, "global_step": 106760, "epoch": 1286} {"train_loss": -22.01202392578125, "global_step": 106761, "epoch": 1286} {"train_loss": -21.60400390625, "global_step": 106762, "epoch": 1286} {"train_loss": -22.283855438232422, "global_step": 106763, "epoch": 1286} {"train_loss": -22.4322452545166, "global_step": 106764, "epoch": 1286} {"train_loss": -22.106395721435547, "global_step": 106765, "epoch": 1286} {"train_loss": -21.54128074645996, "global_step": 106766, "epoch": 1286} {"train_loss": -22.399612426757812, "global_step": 106767, "epoch": 1286} {"train_loss": -22.289220809936523, "global_step": 106768, "epoch": 1286} {"train_loss": -22.469453811645508, "global_step": 106769, "epoch": 1286} {"train_loss": -22.145139694213867, "global_step": 106770, "epoch": 1286} {"train_loss": -22.475433349609375, "global_step": 106771, "epoch": 1286} {"train_loss": -22.46432876586914, "global_step": 106772, "epoch": 1286} {"train_loss": -22.542112350463867, "global_step": 106773, "epoch": 1286} {"train_loss": -22.05657386779785, "global_step": 106774, "epoch": 1286} {"train_loss": -21.871519088745117, "global_step": 106775, "epoch": 1286} {"train_loss": -21.761991500854492, "global_step": 106776, "epoch": 1286} {"train_loss": -22.3712100982666, "global_step": 106777, "epoch": 1286} {"train_loss": -21.696836471557617, "global_step": 106778, "epoch": 1286} {"train_loss": -22.1361141204834, "global_step": 106779, "epoch": 1286} {"train_loss": -22.275362014770508, "global_step": 106780, "epoch": 1286} {"train_loss": -21.84347152709961, "global_step": 106781, "epoch": 1286} {"train_loss": -22.451597213745117, "global_step": 106782, "epoch": 1286} {"train_loss": -21.769811630249023, "global_step": 106783, "epoch": 1286} {"train_loss": -22.018478393554688, "global_step": 106784, "epoch": 1286} {"train_loss": -22.273347854614258, "global_step": 106785, "epoch": 1286} {"train_loss": -21.890539169311523, "global_step": 106786, "epoch": 1286} {"train_loss": -22.042875289916992, "global_step": 106787, "epoch": 1286} {"train_loss": -22.327112197875977, "global_step": 106788, "epoch": 1286} {"train_loss": -22.14588165283203, "global_step": 106789, "epoch": 1286} {"train_loss": -22.314706802368164, "global_step": 106790, "epoch": 1286} {"train_loss": -21.980627059936523, "global_step": 106791, "epoch": 1286} {"train_loss": -22.106077194213867, "global_step": 106792, "epoch": 1286} {"train_loss": -22.25684928894043, "global_step": 106793, "epoch": 1286} {"train_loss": -22.252134323120117, "global_step": 106794, "epoch": 1286} {"train_loss": -21.94906997680664, "global_step": 106795, "epoch": 1286} {"train_loss": -21.827707290649414, "global_step": 106796, "epoch": 1286} {"train_loss": -22.035146713256836, "global_step": 106797, "epoch": 1286} {"train_loss": -22.22873878479004, "global_step": 106798, "epoch": 1286} {"train_loss": -21.664514541625977, "global_step": 106799, "epoch": 1286} {"train_loss": -22.187326431274414, "global_step": 106800, "epoch": 1286} {"train_loss": -21.947864532470703, "global_step": 106801, "epoch": 1286} {"train_loss": -22.3623104095459, "global_step": 106802, "epoch": 1286} {"train_loss": -22.446826934814453, "global_step": 106803, "epoch": 1286} {"train_loss": -22.038461685180664, "global_step": 106804, "epoch": 1286} {"train_loss": -22.082965850830078, "global_step": 106805, "epoch": 1286} {"train_loss": -22.538877487182617, "global_step": 106806, "epoch": 1286} {"train_loss": -22.025054931640625, "global_step": 106807, "epoch": 1286} {"train_loss": -22.10611915588379, "global_step": 106808, "epoch": 1286} {"train_loss": -22.309003829956055, "global_step": 106809, "epoch": 1286} {"train_loss": -22.317913055419922, "global_step": 106810, "epoch": 1286} {"train_loss": -22.16001319885254, "global_step": 106811, "epoch": 1286} {"train_loss": -21.8541259765625, "global_step": 106812, "epoch": 1286} {"train_loss": -22.1533260345459, "global_step": 106813, "epoch": 1286} {"train_loss": -22.334171295166016, "global_step": 106814, "epoch": 1286} {"train_loss": -22.268224716186523, "global_step": 106815, "epoch": 1286} {"train_loss": -22.08225440979004, "global_step": 106816, "epoch": 1286} {"train_loss": -22.412546157836914, "global_step": 106817, "epoch": 1286} {"train_loss": -22.117252349853516, "global_step": 106818, "epoch": 1286} {"train_loss": -22.468923568725586, "global_step": 106819, "epoch": 1286} {"train_loss": -22.025896348148944, "global_step": 106820, "epoch": 1286, "val_loss": 6089339.0} {"train_loss": -21.43324851989746, "global_step": 106821, "epoch": 1287} {"train_loss": -22.107484817504883, "global_step": 106822, "epoch": 1287} {"train_loss": -21.9669132232666, "global_step": 106823, "epoch": 1287} {"train_loss": -21.765653610229492, "global_step": 106824, "epoch": 1287} {"train_loss": -21.703857421875, "global_step": 106825, "epoch": 1287} {"train_loss": -21.8165340423584, "global_step": 106826, "epoch": 1287} {"train_loss": -22.269773483276367, "global_step": 106827, "epoch": 1287} {"train_loss": -22.139490127563477, "global_step": 106828, "epoch": 1287} {"train_loss": -22.018598556518555, "global_step": 106829, "epoch": 1287} {"train_loss": -22.211339950561523, "global_step": 106830, "epoch": 1287} {"train_loss": -21.8134708404541, "global_step": 106831, "epoch": 1287} {"train_loss": -21.536069869995117, "global_step": 106832, "epoch": 1287} {"train_loss": -22.028003692626953, "global_step": 106833, "epoch": 1287} {"train_loss": -22.230451583862305, "global_step": 106834, "epoch": 1287} {"train_loss": -22.274700164794922, "global_step": 106835, "epoch": 1287} {"train_loss": -22.306718826293945, "global_step": 106836, "epoch": 1287} {"train_loss": -22.481033325195312, "global_step": 106837, "epoch": 1287} {"train_loss": -22.315393447875977, "global_step": 106838, "epoch": 1287} {"train_loss": -21.802030563354492, "global_step": 106839, "epoch": 1287} {"train_loss": -22.054956436157227, "global_step": 106840, "epoch": 1287} {"train_loss": -22.03726577758789, "global_step": 106841, "epoch": 1287} {"train_loss": -21.777421951293945, "global_step": 106842, "epoch": 1287} {"train_loss": -22.442630767822266, "global_step": 106843, "epoch": 1287} {"train_loss": -21.949966430664062, "global_step": 106844, "epoch": 1287} {"train_loss": -22.091440200805664, "global_step": 106845, "epoch": 1287} {"train_loss": -22.178983688354492, "global_step": 106846, "epoch": 1287} {"train_loss": -22.350061416625977, "global_step": 106847, "epoch": 1287} {"train_loss": -22.32820701599121, "global_step": 106848, "epoch": 1287} {"train_loss": -22.562061309814453, "global_step": 106849, "epoch": 1287} {"train_loss": -22.513072967529297, "global_step": 106850, "epoch": 1287} {"train_loss": -22.09964370727539, "global_step": 106851, "epoch": 1287} {"train_loss": -22.369380950927734, "global_step": 106852, "epoch": 1287} {"train_loss": -22.26393699645996, "global_step": 106853, "epoch": 1287} {"train_loss": -21.997451782226562, "global_step": 106854, "epoch": 1287} {"train_loss": -22.00011444091797, "global_step": 106855, "epoch": 1287} {"train_loss": -22.169179916381836, "global_step": 106856, "epoch": 1287} {"train_loss": -22.341886520385742, "global_step": 106857, "epoch": 1287} {"train_loss": -22.194005966186523, "global_step": 106858, "epoch": 1287} {"train_loss": -22.248106002807617, "global_step": 106859, "epoch": 1287} {"train_loss": -21.926076889038086, "global_step": 106860, "epoch": 1287} {"train_loss": -22.242116928100586, "global_step": 106861, "epoch": 1287} {"train_loss": -22.13031005859375, "global_step": 106862, "epoch": 1287} {"train_loss": -22.30767822265625, "global_step": 106863, "epoch": 1287} {"train_loss": -22.25052833557129, "global_step": 106864, "epoch": 1287} {"train_loss": -22.142454147338867, "global_step": 106865, "epoch": 1287} {"train_loss": -22.19400405883789, "global_step": 106866, "epoch": 1287} {"train_loss": -22.289907455444336, "global_step": 106867, "epoch": 1287} {"train_loss": -22.101398468017578, "global_step": 106868, "epoch": 1287} {"train_loss": -22.526355743408203, "global_step": 106869, "epoch": 1287} {"train_loss": -22.184396743774414, "global_step": 106870, "epoch": 1287} {"train_loss": -21.91023826599121, "global_step": 106871, "epoch": 1287} {"train_loss": -22.26983642578125, "global_step": 106872, "epoch": 1287} {"train_loss": -22.156265258789062, "global_step": 106873, "epoch": 1287} {"train_loss": -22.470144271850586, "global_step": 106874, "epoch": 1287} {"train_loss": -22.166898727416992, "global_step": 106875, "epoch": 1287} {"train_loss": -22.14794921875, "global_step": 106876, "epoch": 1287} {"train_loss": -21.971071243286133, "global_step": 106877, "epoch": 1287} {"train_loss": -21.781234741210938, "global_step": 106878, "epoch": 1287} {"train_loss": -21.933320999145508, "global_step": 106879, "epoch": 1287} {"train_loss": -22.267898559570312, "global_step": 106880, "epoch": 1287} {"train_loss": -22.160818099975586, "global_step": 106881, "epoch": 1287} {"train_loss": -21.818815231323242, "global_step": 106882, "epoch": 1287} {"train_loss": -22.075407028198242, "global_step": 106883, "epoch": 1287} {"train_loss": -22.18686866760254, "global_step": 106884, "epoch": 1287} {"train_loss": -22.328214645385742, "global_step": 106885, "epoch": 1287} {"train_loss": -22.23124122619629, "global_step": 106886, "epoch": 1287} {"train_loss": -22.1763973236084, "global_step": 106887, "epoch": 1287} {"train_loss": -22.39893341064453, "global_step": 106888, "epoch": 1287} {"train_loss": -22.53554344177246, "global_step": 106889, "epoch": 1287} {"train_loss": -22.36555290222168, "global_step": 106890, "epoch": 1287} {"train_loss": -22.02488136291504, "global_step": 106891, "epoch": 1287} {"train_loss": -21.99822998046875, "global_step": 106892, "epoch": 1287} {"train_loss": -22.043212890625, "global_step": 106893, "epoch": 1287} {"train_loss": -22.27094841003418, "global_step": 106894, "epoch": 1287} {"train_loss": -22.267370223999023, "global_step": 106895, "epoch": 1287} {"train_loss": -21.985071182250977, "global_step": 106896, "epoch": 1287} {"train_loss": -21.9454288482666, "global_step": 106897, "epoch": 1287} {"train_loss": -22.222848892211914, "global_step": 106898, "epoch": 1287} {"train_loss": -22.150041580200195, "global_step": 106899, "epoch": 1287} {"train_loss": -21.95092010498047, "global_step": 106900, "epoch": 1287} {"train_loss": -21.855743408203125, "global_step": 106901, "epoch": 1287} {"train_loss": -21.792728424072266, "global_step": 106902, "epoch": 1287} {"train_loss": -22.141236224806452, "global_step": 106903, "epoch": 1287, "val_loss": 6242184.0} {"train_loss": -21.769145965576172, "global_step": 106904, "epoch": 1288} {"train_loss": -21.86702537536621, "global_step": 106905, "epoch": 1288} {"train_loss": -21.628524780273438, "global_step": 106906, "epoch": 1288} {"train_loss": -22.18552589416504, "global_step": 106907, "epoch": 1288} {"train_loss": -21.40899658203125, "global_step": 106908, "epoch": 1288} {"train_loss": -21.32611656188965, "global_step": 106909, "epoch": 1288} {"train_loss": -21.721017837524414, "global_step": 106910, "epoch": 1288} {"train_loss": -21.448217391967773, "global_step": 106911, "epoch": 1288} {"train_loss": -21.460886001586914, "global_step": 106912, "epoch": 1288} {"train_loss": -21.679288864135742, "global_step": 106913, "epoch": 1288} {"train_loss": -21.88699722290039, "global_step": 106914, "epoch": 1288} {"train_loss": -22.033952713012695, "global_step": 106915, "epoch": 1288} {"train_loss": -22.124271392822266, "global_step": 106916, "epoch": 1288} {"train_loss": -22.139921188354492, "global_step": 106917, "epoch": 1288} {"train_loss": -21.94110679626465, "global_step": 106918, "epoch": 1288} {"train_loss": -21.85617446899414, "global_step": 106919, "epoch": 1288} {"train_loss": -21.838016510009766, "global_step": 106920, "epoch": 1288} {"train_loss": -21.761459350585938, "global_step": 106921, "epoch": 1288} {"train_loss": -21.61891746520996, "global_step": 106922, "epoch": 1288} {"train_loss": -21.685585021972656, "global_step": 106923, "epoch": 1288} {"train_loss": -22.074277877807617, "global_step": 106924, "epoch": 1288} {"train_loss": -21.88580894470215, "global_step": 106925, "epoch": 1288} {"train_loss": -21.93951416015625, "global_step": 106926, "epoch": 1288} {"train_loss": -22.03140640258789, "global_step": 106927, "epoch": 1288} {"train_loss": -22.20460319519043, "global_step": 106928, "epoch": 1288} {"train_loss": -22.037982940673828, "global_step": 106929, "epoch": 1288} {"train_loss": -21.97078514099121, "global_step": 106930, "epoch": 1288} {"train_loss": -21.982290267944336, "global_step": 106931, "epoch": 1288} {"train_loss": -22.356237411499023, "global_step": 106932, "epoch": 1288} {"train_loss": -22.227535247802734, "global_step": 106933, "epoch": 1288} {"train_loss": -22.01873207092285, "global_step": 106934, "epoch": 1288} {"train_loss": -22.48589515686035, "global_step": 106935, "epoch": 1288} {"train_loss": -22.2844295501709, "global_step": 106936, "epoch": 1288} {"train_loss": -22.15345573425293, "global_step": 106937, "epoch": 1288} {"train_loss": -22.294057846069336, "global_step": 106938, "epoch": 1288} {"train_loss": -22.14072036743164, "global_step": 106939, "epoch": 1288} {"train_loss": -22.228790283203125, "global_step": 106940, "epoch": 1288} {"train_loss": -22.367597579956055, "global_step": 106941, "epoch": 1288} {"train_loss": -22.062957763671875, "global_step": 106942, "epoch": 1288} {"train_loss": -22.226669311523438, "global_step": 106943, "epoch": 1288} {"train_loss": -21.90492057800293, "global_step": 106944, "epoch": 1288} {"train_loss": -22.65640640258789, "global_step": 106945, "epoch": 1288} {"train_loss": -21.709199905395508, "global_step": 106946, "epoch": 1288} {"train_loss": -22.20660972595215, "global_step": 106947, "epoch": 1288} {"train_loss": -22.062320709228516, "global_step": 106948, "epoch": 1288} {"train_loss": -22.426191329956055, "global_step": 106949, "epoch": 1288} {"train_loss": -22.144399642944336, "global_step": 106950, "epoch": 1288} {"train_loss": -21.874332427978516, "global_step": 106951, "epoch": 1288} {"train_loss": -22.085737228393555, "global_step": 106952, "epoch": 1288} {"train_loss": -22.400606155395508, "global_step": 106953, "epoch": 1288} {"train_loss": -22.48068618774414, "global_step": 106954, "epoch": 1288} {"train_loss": -22.467880249023438, "global_step": 106955, "epoch": 1288} {"train_loss": -22.334091186523438, "global_step": 106956, "epoch": 1288} {"train_loss": -22.203664779663086, "global_step": 106957, "epoch": 1288} {"train_loss": -22.217330932617188, "global_step": 106958, "epoch": 1288} {"train_loss": -22.49799156188965, "global_step": 106959, "epoch": 1288} {"train_loss": -21.86224365234375, "global_step": 106960, "epoch": 1288} {"train_loss": -22.250564575195312, "global_step": 106961, "epoch": 1288} {"train_loss": -22.253232955932617, "global_step": 106962, "epoch": 1288} {"train_loss": -22.327829360961914, "global_step": 106963, "epoch": 1288} {"train_loss": -22.232318878173828, "global_step": 106964, "epoch": 1288} {"train_loss": -22.533267974853516, "global_step": 106965, "epoch": 1288} {"train_loss": -22.181079864501953, "global_step": 106966, "epoch": 1288} {"train_loss": -22.212080001831055, "global_step": 106967, "epoch": 1288} {"train_loss": -22.098148345947266, "global_step": 106968, "epoch": 1288} {"train_loss": -22.358577728271484, "global_step": 106969, "epoch": 1288} {"train_loss": -22.383834838867188, "global_step": 106970, "epoch": 1288} {"train_loss": -21.98896598815918, "global_step": 106971, "epoch": 1288} {"train_loss": -21.82893180847168, "global_step": 106972, "epoch": 1288} {"train_loss": -21.95344352722168, "global_step": 106973, "epoch": 1288} {"train_loss": -21.970355987548828, "global_step": 106974, "epoch": 1288} {"train_loss": -22.163768768310547, "global_step": 106975, "epoch": 1288} {"train_loss": -22.100177764892578, "global_step": 106976, "epoch": 1288} {"train_loss": -22.03989028930664, "global_step": 106977, "epoch": 1288} {"train_loss": -22.427799224853516, "global_step": 106978, "epoch": 1288} {"train_loss": -22.307392120361328, "global_step": 106979, "epoch": 1288} {"train_loss": -22.250194549560547, "global_step": 106980, "epoch": 1288} {"train_loss": -22.017044067382812, "global_step": 106981, "epoch": 1288} {"train_loss": -21.97833251953125, "global_step": 106982, "epoch": 1288} {"train_loss": -22.209095001220703, "global_step": 106983, "epoch": 1288} {"train_loss": -21.824216842651367, "global_step": 106984, "epoch": 1288} {"train_loss": -22.380958557128906, "global_step": 106985, "epoch": 1288} {"train_loss": -22.069380518901777, "global_step": 106986, "epoch": 1288, "val_loss": 6122136.5} {"train_loss": -21.91794204711914, "global_step": 106987, "epoch": 1289} {"train_loss": -21.235275268554688, "global_step": 106988, "epoch": 1289} {"train_loss": -21.258445739746094, "global_step": 106989, "epoch": 1289} {"train_loss": -21.624692916870117, "global_step": 106990, "epoch": 1289} {"train_loss": -21.75484275817871, "global_step": 106991, "epoch": 1289} {"train_loss": -21.639516830444336, "global_step": 106992, "epoch": 1289} {"train_loss": -21.723783493041992, "global_step": 106993, "epoch": 1289} {"train_loss": -21.684608459472656, "global_step": 106994, "epoch": 1289} {"train_loss": -21.822818756103516, "global_step": 106995, "epoch": 1289} {"train_loss": -21.31888771057129, "global_step": 106996, "epoch": 1289} {"train_loss": -21.349592208862305, "global_step": 106997, "epoch": 1289} {"train_loss": -21.249923706054688, "global_step": 106998, "epoch": 1289} {"train_loss": -21.80739402770996, "global_step": 106999, "epoch": 1289} {"train_loss": -21.9617862701416, "global_step": 107000, "epoch": 1289} {"train_loss": -21.95684814453125, "global_step": 107001, "epoch": 1289} {"train_loss": -21.643518447875977, "global_step": 107002, "epoch": 1289} {"train_loss": -21.769922256469727, "global_step": 107003, "epoch": 1289} {"train_loss": -21.594301223754883, "global_step": 107004, "epoch": 1289} {"train_loss": -21.644704818725586, "global_step": 107005, "epoch": 1289} {"train_loss": -21.468198776245117, "global_step": 107006, "epoch": 1289} {"train_loss": -21.74652671813965, "global_step": 107007, "epoch": 1289} {"train_loss": -22.012351989746094, "global_step": 107008, "epoch": 1289} {"train_loss": -22.200719833374023, "global_step": 107009, "epoch": 1289} {"train_loss": -21.95774269104004, "global_step": 107010, "epoch": 1289} {"train_loss": -21.846452713012695, "global_step": 107011, "epoch": 1289} {"train_loss": -22.2147274017334, "global_step": 107012, "epoch": 1289} {"train_loss": -21.829191207885742, "global_step": 107013, "epoch": 1289} {"train_loss": -21.744733810424805, "global_step": 107014, "epoch": 1289} {"train_loss": -22.135595321655273, "global_step": 107015, "epoch": 1289} {"train_loss": -22.316625595092773, "global_step": 107016, "epoch": 1289} {"train_loss": -21.661087036132812, "global_step": 107017, "epoch": 1289} {"train_loss": -22.310636520385742, "global_step": 107018, "epoch": 1289} {"train_loss": -22.16437530517578, "global_step": 107019, "epoch": 1289} {"train_loss": -22.01740074157715, "global_step": 107020, "epoch": 1289} {"train_loss": -21.9072322845459, "global_step": 107021, "epoch": 1289} {"train_loss": -22.199827194213867, "global_step": 107022, "epoch": 1289} {"train_loss": -21.915693283081055, "global_step": 107023, "epoch": 1289} {"train_loss": -22.315574645996094, "global_step": 107024, "epoch": 1289} {"train_loss": -22.386798858642578, "global_step": 107025, "epoch": 1289} {"train_loss": -22.45842933654785, "global_step": 107026, "epoch": 1289} {"train_loss": -22.116819381713867, "global_step": 107027, "epoch": 1289} {"train_loss": -22.069578170776367, "global_step": 107028, "epoch": 1289} {"train_loss": -22.391368865966797, "global_step": 107029, "epoch": 1289} {"train_loss": -22.285526275634766, "global_step": 107030, "epoch": 1289} {"train_loss": -22.177671432495117, "global_step": 107031, "epoch": 1289} {"train_loss": -22.087722778320312, "global_step": 107032, "epoch": 1289} {"train_loss": -22.248262405395508, "global_step": 107033, "epoch": 1289} {"train_loss": -22.06659507751465, "global_step": 107034, "epoch": 1289} {"train_loss": -22.3113956451416, "global_step": 107035, "epoch": 1289} {"train_loss": -22.41267204284668, "global_step": 107036, "epoch": 1289} {"train_loss": -22.311195373535156, "global_step": 107037, "epoch": 1289} {"train_loss": -22.25558853149414, "global_step": 107038, "epoch": 1289} {"train_loss": -22.219741821289062, "global_step": 107039, "epoch": 1289} {"train_loss": -22.434858322143555, "global_step": 107040, "epoch": 1289} {"train_loss": -22.402097702026367, "global_step": 107041, "epoch": 1289} {"train_loss": -22.087757110595703, "global_step": 107042, "epoch": 1289} {"train_loss": -22.12708854675293, "global_step": 107043, "epoch": 1289} {"train_loss": -22.262165069580078, "global_step": 107044, "epoch": 1289} {"train_loss": -22.50203514099121, "global_step": 107045, "epoch": 1289} {"train_loss": -22.342527389526367, "global_step": 107046, "epoch": 1289} {"train_loss": -22.273197174072266, "global_step": 107047, "epoch": 1289} {"train_loss": -22.536527633666992, "global_step": 107048, "epoch": 1289} {"train_loss": -21.979511260986328, "global_step": 107049, "epoch": 1289} {"train_loss": -21.97109031677246, "global_step": 107050, "epoch": 1289} {"train_loss": -21.91318702697754, "global_step": 107051, "epoch": 1289} {"train_loss": -22.40656852722168, "global_step": 107052, "epoch": 1289} {"train_loss": -22.088010787963867, "global_step": 107053, "epoch": 1289} {"train_loss": -22.308813095092773, "global_step": 107054, "epoch": 1289} {"train_loss": -22.241708755493164, "global_step": 107055, "epoch": 1289} {"train_loss": -22.27127456665039, "global_step": 107056, "epoch": 1289} {"train_loss": -22.33867073059082, "global_step": 107057, "epoch": 1289} {"train_loss": -22.23646354675293, "global_step": 107058, "epoch": 1289} {"train_loss": -22.470422744750977, "global_step": 107059, "epoch": 1289} {"train_loss": -22.3633975982666, "global_step": 107060, "epoch": 1289} {"train_loss": -22.15036964416504, "global_step": 107061, "epoch": 1289} {"train_loss": -22.20833396911621, "global_step": 107062, "epoch": 1289} {"train_loss": -22.603591918945312, "global_step": 107063, "epoch": 1289} {"train_loss": -22.039276123046875, "global_step": 107064, "epoch": 1289} {"train_loss": -22.32911491394043, "global_step": 107065, "epoch": 1289} {"train_loss": -22.277002334594727, "global_step": 107066, "epoch": 1289} {"train_loss": -22.401622772216797, "global_step": 107067, "epoch": 1289} {"train_loss": -22.10511589050293, "global_step": 107068, "epoch": 1289} {"train_loss": -22.06970529671175, "global_step": 107069, "epoch": 1289, "val_loss": 6124091.5} {"train_loss": -21.717113494873047, "global_step": 107070, "epoch": 1290} {"train_loss": -21.733966827392578, "global_step": 107071, "epoch": 1290} {"train_loss": -21.656829833984375, "global_step": 107072, "epoch": 1290} {"train_loss": -21.707616806030273, "global_step": 107073, "epoch": 1290} {"train_loss": -22.058826446533203, "global_step": 107074, "epoch": 1290} {"train_loss": -21.917203903198242, "global_step": 107075, "epoch": 1290} {"train_loss": -22.02644157409668, "global_step": 107076, "epoch": 1290} {"train_loss": -22.08351707458496, "global_step": 107077, "epoch": 1290} {"train_loss": -22.631954193115234, "global_step": 107078, "epoch": 1290} {"train_loss": -21.81056022644043, "global_step": 107079, "epoch": 1290} {"train_loss": -21.7138729095459, "global_step": 107080, "epoch": 1290} {"train_loss": -22.06732177734375, "global_step": 107081, "epoch": 1290} {"train_loss": -22.430532455444336, "global_step": 107082, "epoch": 1290} {"train_loss": -22.31283950805664, "global_step": 107083, "epoch": 1290} {"train_loss": -22.38610076904297, "global_step": 107084, "epoch": 1290} {"train_loss": -21.652633666992188, "global_step": 107085, "epoch": 1290} {"train_loss": -21.732349395751953, "global_step": 107086, "epoch": 1290} {"train_loss": -21.952533721923828, "global_step": 107087, "epoch": 1290} {"train_loss": -22.175861358642578, "global_step": 107088, "epoch": 1290} {"train_loss": -21.948270797729492, "global_step": 107089, "epoch": 1290} {"train_loss": -22.24359703063965, "global_step": 107090, "epoch": 1290} {"train_loss": -22.008968353271484, "global_step": 107091, "epoch": 1290} {"train_loss": -22.086515426635742, "global_step": 107092, "epoch": 1290} {"train_loss": -22.07322883605957, "global_step": 107093, "epoch": 1290} {"train_loss": -22.030746459960938, "global_step": 107094, "epoch": 1290} {"train_loss": -22.255615234375, "global_step": 107095, "epoch": 1290} {"train_loss": -22.167430877685547, "global_step": 107096, "epoch": 1290} {"train_loss": -21.792316436767578, "global_step": 107097, "epoch": 1290} {"train_loss": -22.163787841796875, "global_step": 107098, "epoch": 1290} {"train_loss": -22.413536071777344, "global_step": 107099, "epoch": 1290} {"train_loss": -22.1026668548584, "global_step": 107100, "epoch": 1290} {"train_loss": -22.16330909729004, "global_step": 107101, "epoch": 1290} {"train_loss": -21.9702091217041, "global_step": 107102, "epoch": 1290} {"train_loss": -21.778345108032227, "global_step": 107103, "epoch": 1290} {"train_loss": -22.302297592163086, "global_step": 107104, "epoch": 1290} {"train_loss": -22.205060958862305, "global_step": 107105, "epoch": 1290} {"train_loss": -22.119230270385742, "global_step": 107106, "epoch": 1290} {"train_loss": -22.37067222595215, "global_step": 107107, "epoch": 1290} {"train_loss": -22.233814239501953, "global_step": 107108, "epoch": 1290} {"train_loss": -22.317190170288086, "global_step": 107109, "epoch": 1290} {"train_loss": -22.136281967163086, "global_step": 107110, "epoch": 1290} {"train_loss": -21.805952072143555, "global_step": 107111, "epoch": 1290} {"train_loss": -21.98344612121582, "global_step": 107112, "epoch": 1290} {"train_loss": -22.23807716369629, "global_step": 107113, "epoch": 1290} {"train_loss": -21.927034378051758, "global_step": 107114, "epoch": 1290} {"train_loss": -22.051029205322266, "global_step": 107115, "epoch": 1290} {"train_loss": -22.105527877807617, "global_step": 107116, "epoch": 1290} {"train_loss": -22.273880004882812, "global_step": 107117, "epoch": 1290} {"train_loss": -22.448017120361328, "global_step": 107118, "epoch": 1290} {"train_loss": -22.206872940063477, "global_step": 107119, "epoch": 1290} {"train_loss": -22.355947494506836, "global_step": 107120, "epoch": 1290} {"train_loss": -22.33136558532715, "global_step": 107121, "epoch": 1290} {"train_loss": -22.443735122680664, "global_step": 107122, "epoch": 1290} {"train_loss": -22.0294189453125, "global_step": 107123, "epoch": 1290} {"train_loss": -22.01030921936035, "global_step": 107124, "epoch": 1290} {"train_loss": -22.50284767150879, "global_step": 107125, "epoch": 1290} {"train_loss": -21.897825241088867, "global_step": 107126, "epoch": 1290} {"train_loss": -22.17960548400879, "global_step": 107127, "epoch": 1290} {"train_loss": -22.503253936767578, "global_step": 107128, "epoch": 1290} {"train_loss": -22.1398983001709, "global_step": 107129, "epoch": 1290} {"train_loss": -22.538564682006836, "global_step": 107130, "epoch": 1290} {"train_loss": -22.28838539123535, "global_step": 107131, "epoch": 1290} {"train_loss": -22.12176513671875, "global_step": 107132, "epoch": 1290} {"train_loss": -22.34565544128418, "global_step": 107133, "epoch": 1290} {"train_loss": -22.01719093322754, "global_step": 107134, "epoch": 1290} {"train_loss": -22.543628692626953, "global_step": 107135, "epoch": 1290} {"train_loss": -22.33644676208496, "global_step": 107136, "epoch": 1290} {"train_loss": -22.02498435974121, "global_step": 107137, "epoch": 1290} {"train_loss": -21.81074333190918, "global_step": 107138, "epoch": 1290} {"train_loss": -22.048444747924805, "global_step": 107139, "epoch": 1290} {"train_loss": -21.840341567993164, "global_step": 107140, "epoch": 1290} {"train_loss": -22.44951820373535, "global_step": 107141, "epoch": 1290} {"train_loss": -22.470726013183594, "global_step": 107142, "epoch": 1290} {"train_loss": -22.18269920349121, "global_step": 107143, "epoch": 1290} {"train_loss": -22.368648529052734, "global_step": 107144, "epoch": 1290} {"train_loss": -21.998836517333984, "global_step": 107145, "epoch": 1290} {"train_loss": -22.310483932495117, "global_step": 107146, "epoch": 1290} {"train_loss": -21.901620864868164, "global_step": 107147, "epoch": 1290} {"train_loss": -22.304203033447266, "global_step": 107148, "epoch": 1290} {"train_loss": -22.230276107788086, "global_step": 107149, "epoch": 1290} {"train_loss": -22.058698654174805, "global_step": 107150, "epoch": 1290} {"train_loss": -22.532804489135742, "global_step": 107151, "epoch": 1290} {"train_loss": -22.13379885202431, "global_step": 107152, "epoch": 1290, "val_loss": 6114934.0} {"train_loss": -21.89980697631836, "global_step": 107153, "epoch": 1291} {"train_loss": -21.83632469177246, "global_step": 107154, "epoch": 1291} {"train_loss": -21.936689376831055, "global_step": 107155, "epoch": 1291} {"train_loss": -21.84823989868164, "global_step": 107156, "epoch": 1291} {"train_loss": -21.984098434448242, "global_step": 107157, "epoch": 1291} {"train_loss": -21.42693519592285, "global_step": 107158, "epoch": 1291} {"train_loss": -21.763334274291992, "global_step": 107159, "epoch": 1291} {"train_loss": -21.774845123291016, "global_step": 107160, "epoch": 1291} {"train_loss": -21.87766456604004, "global_step": 107161, "epoch": 1291} {"train_loss": -21.48679542541504, "global_step": 107162, "epoch": 1291} {"train_loss": -21.869197845458984, "global_step": 107163, "epoch": 1291} {"train_loss": -21.924270629882812, "global_step": 107164, "epoch": 1291} {"train_loss": -22.071537017822266, "global_step": 107165, "epoch": 1291} {"train_loss": -21.392826080322266, "global_step": 107166, "epoch": 1291} {"train_loss": -22.332483291625977, "global_step": 107167, "epoch": 1291} {"train_loss": -21.923053741455078, "global_step": 107168, "epoch": 1291} {"train_loss": -22.03087615966797, "global_step": 107169, "epoch": 1291} {"train_loss": -21.759963989257812, "global_step": 107170, "epoch": 1291} {"train_loss": -21.834989547729492, "global_step": 107171, "epoch": 1291} {"train_loss": -22.165891647338867, "global_step": 107172, "epoch": 1291} {"train_loss": -21.80548095703125, "global_step": 107173, "epoch": 1291} {"train_loss": -22.07386589050293, "global_step": 107174, "epoch": 1291} {"train_loss": -22.05953598022461, "global_step": 107175, "epoch": 1291} {"train_loss": -22.0213623046875, "global_step": 107176, "epoch": 1291} {"train_loss": -22.018402099609375, "global_step": 107177, "epoch": 1291} {"train_loss": -21.692981719970703, "global_step": 107178, "epoch": 1291} {"train_loss": -21.61939811706543, "global_step": 107179, "epoch": 1291} {"train_loss": -22.090478897094727, "global_step": 107180, "epoch": 1291} {"train_loss": -22.158248901367188, "global_step": 107181, "epoch": 1291} {"train_loss": -22.30598258972168, "global_step": 107182, "epoch": 1291} {"train_loss": -22.60615348815918, "global_step": 107183, "epoch": 1291} {"train_loss": -22.40577507019043, "global_step": 107184, "epoch": 1291} {"train_loss": -22.06268882751465, "global_step": 107185, "epoch": 1291} {"train_loss": -22.099899291992188, "global_step": 107186, "epoch": 1291} {"train_loss": -21.90260887145996, "global_step": 107187, "epoch": 1291} {"train_loss": -22.479736328125, "global_step": 107188, "epoch": 1291} {"train_loss": -22.556583404541016, "global_step": 107189, "epoch": 1291} {"train_loss": -22.357559204101562, "global_step": 107190, "epoch": 1291} {"train_loss": -22.01653480529785, "global_step": 107191, "epoch": 1291} {"train_loss": -22.280874252319336, "global_step": 107192, "epoch": 1291} {"train_loss": -21.9702091217041, "global_step": 107193, "epoch": 1291} {"train_loss": -21.988285064697266, "global_step": 107194, "epoch": 1291} {"train_loss": -22.305891036987305, "global_step": 107195, "epoch": 1291} {"train_loss": -22.37806510925293, "global_step": 107196, "epoch": 1291} {"train_loss": -21.97499656677246, "global_step": 107197, "epoch": 1291} {"train_loss": -22.07839584350586, "global_step": 107198, "epoch": 1291} {"train_loss": -22.361995697021484, "global_step": 107199, "epoch": 1291} {"train_loss": -22.156230926513672, "global_step": 107200, "epoch": 1291} {"train_loss": -22.34524917602539, "global_step": 107201, "epoch": 1291} {"train_loss": -22.017868041992188, "global_step": 107202, "epoch": 1291} {"train_loss": -22.4226016998291, "global_step": 107203, "epoch": 1291} {"train_loss": -22.572010040283203, "global_step": 107204, "epoch": 1291} {"train_loss": -22.4561767578125, "global_step": 107205, "epoch": 1291} {"train_loss": -21.8533878326416, "global_step": 107206, "epoch": 1291} {"train_loss": -21.83258819580078, "global_step": 107207, "epoch": 1291} {"train_loss": -21.997854232788086, "global_step": 107208, "epoch": 1291} {"train_loss": -21.951887130737305, "global_step": 107209, "epoch": 1291} {"train_loss": -21.954010009765625, "global_step": 107210, "epoch": 1291} {"train_loss": -22.152469635009766, "global_step": 107211, "epoch": 1291} {"train_loss": -22.13335609436035, "global_step": 107212, "epoch": 1291} {"train_loss": -22.030550003051758, "global_step": 107213, "epoch": 1291} {"train_loss": -22.13533592224121, "global_step": 107214, "epoch": 1291} {"train_loss": -22.35654640197754, "global_step": 107215, "epoch": 1291} {"train_loss": -22.53908348083496, "global_step": 107216, "epoch": 1291} {"train_loss": -22.551794052124023, "global_step": 107217, "epoch": 1291} {"train_loss": -22.41641616821289, "global_step": 107218, "epoch": 1291} {"train_loss": -22.03389549255371, "global_step": 107219, "epoch": 1291} {"train_loss": -21.989282608032227, "global_step": 107220, "epoch": 1291} {"train_loss": -21.849651336669922, "global_step": 107221, "epoch": 1291} {"train_loss": -22.30367088317871, "global_step": 107222, "epoch": 1291} {"train_loss": -22.067291259765625, "global_step": 107223, "epoch": 1291} {"train_loss": -22.148845672607422, "global_step": 107224, "epoch": 1291} {"train_loss": -22.109867095947266, "global_step": 107225, "epoch": 1291} {"train_loss": -22.617494583129883, "global_step": 107226, "epoch": 1291} {"train_loss": -22.217365264892578, "global_step": 107227, "epoch": 1291} {"train_loss": -22.3792724609375, "global_step": 107228, "epoch": 1291} {"train_loss": -21.9505558013916, "global_step": 107229, "epoch": 1291} {"train_loss": -22.105600357055664, "global_step": 107230, "epoch": 1291} {"train_loss": -22.136146545410156, "global_step": 107231, "epoch": 1291} {"train_loss": -22.2871036529541, "global_step": 107232, "epoch": 1291} {"train_loss": -22.013729095458984, "global_step": 107233, "epoch": 1291} {"train_loss": -22.240936279296875, "global_step": 107234, "epoch": 1291} {"train_loss": -22.095721440142896, "global_step": 107235, "epoch": 1291, "val_loss": 6126658.0} {"train_loss": -21.594745635986328, "global_step": 107236, "epoch": 1292} {"train_loss": -21.844100952148438, "global_step": 107237, "epoch": 1292} {"train_loss": -21.341087341308594, "global_step": 107238, "epoch": 1292} {"train_loss": -21.618839263916016, "global_step": 107239, "epoch": 1292} {"train_loss": -21.733413696289062, "global_step": 107240, "epoch": 1292} {"train_loss": -21.956466674804688, "global_step": 107241, "epoch": 1292} {"train_loss": -21.73373794555664, "global_step": 107242, "epoch": 1292} {"train_loss": -22.08514976501465, "global_step": 107243, "epoch": 1292} {"train_loss": -22.27431297302246, "global_step": 107244, "epoch": 1292} {"train_loss": -21.96849250793457, "global_step": 107245, "epoch": 1292} {"train_loss": -22.263376235961914, "global_step": 107246, "epoch": 1292} {"train_loss": -22.18426513671875, "global_step": 107247, "epoch": 1292} {"train_loss": -22.181272506713867, "global_step": 107248, "epoch": 1292} {"train_loss": -21.96071434020996, "global_step": 107249, "epoch": 1292} {"train_loss": -22.12691879272461, "global_step": 107250, "epoch": 1292} {"train_loss": -22.043447494506836, "global_step": 107251, "epoch": 1292} {"train_loss": -22.053089141845703, "global_step": 107252, "epoch": 1292} {"train_loss": -22.242212295532227, "global_step": 107253, "epoch": 1292} {"train_loss": -22.02204704284668, "global_step": 107254, "epoch": 1292} {"train_loss": -21.868642807006836, "global_step": 107255, "epoch": 1292} {"train_loss": -21.979337692260742, "global_step": 107256, "epoch": 1292} {"train_loss": -21.922292709350586, "global_step": 107257, "epoch": 1292} {"train_loss": -22.092309951782227, "global_step": 107258, "epoch": 1292} {"train_loss": -22.380599975585938, "global_step": 107259, "epoch": 1292} {"train_loss": -22.245330810546875, "global_step": 107260, "epoch": 1292} {"train_loss": -22.194189071655273, "global_step": 107261, "epoch": 1292} {"train_loss": -22.18674659729004, "global_step": 107262, "epoch": 1292} {"train_loss": -21.998355865478516, "global_step": 107263, "epoch": 1292} {"train_loss": -22.47930335998535, "global_step": 107264, "epoch": 1292} {"train_loss": -22.19281578063965, "global_step": 107265, "epoch": 1292} {"train_loss": -22.550519943237305, "global_step": 107266, "epoch": 1292} {"train_loss": -22.216068267822266, "global_step": 107267, "epoch": 1292} {"train_loss": -22.336118698120117, "global_step": 107268, "epoch": 1292} {"train_loss": -22.027841567993164, "global_step": 107269, "epoch": 1292} {"train_loss": -22.36823081970215, "global_step": 107270, "epoch": 1292} {"train_loss": -22.32415771484375, "global_step": 107271, "epoch": 1292} {"train_loss": -22.504819869995117, "global_step": 107272, "epoch": 1292} {"train_loss": -22.152559280395508, "global_step": 107273, "epoch": 1292} {"train_loss": -21.95625877380371, "global_step": 107274, "epoch": 1292} {"train_loss": -22.000226974487305, "global_step": 107275, "epoch": 1292} {"train_loss": -22.184188842773438, "global_step": 107276, "epoch": 1292} {"train_loss": -21.930566787719727, "global_step": 107277, "epoch": 1292} {"train_loss": -22.249631881713867, "global_step": 107278, "epoch": 1292} {"train_loss": -22.234891891479492, "global_step": 107279, "epoch": 1292} {"train_loss": -22.142108917236328, "global_step": 107280, "epoch": 1292} {"train_loss": -22.451303482055664, "global_step": 107281, "epoch": 1292} {"train_loss": -22.157913208007812, "global_step": 107282, "epoch": 1292} {"train_loss": -22.255891799926758, "global_step": 107283, "epoch": 1292} {"train_loss": -21.90682029724121, "global_step": 107284, "epoch": 1292} {"train_loss": -22.183612823486328, "global_step": 107285, "epoch": 1292} {"train_loss": -22.418689727783203, "global_step": 107286, "epoch": 1292} {"train_loss": -22.218643188476562, "global_step": 107287, "epoch": 1292} {"train_loss": -22.444087982177734, "global_step": 107288, "epoch": 1292} {"train_loss": -22.13588523864746, "global_step": 107289, "epoch": 1292} {"train_loss": -22.170095443725586, "global_step": 107290, "epoch": 1292} {"train_loss": -22.30255889892578, "global_step": 107291, "epoch": 1292} {"train_loss": -22.15883445739746, "global_step": 107292, "epoch": 1292} {"train_loss": -22.08758544921875, "global_step": 107293, "epoch": 1292} {"train_loss": -22.44049835205078, "global_step": 107294, "epoch": 1292} {"train_loss": -21.657485961914062, "global_step": 107295, "epoch": 1292} {"train_loss": -22.22210693359375, "global_step": 107296, "epoch": 1292} {"train_loss": -22.087675094604492, "global_step": 107297, "epoch": 1292} {"train_loss": -21.913501739501953, "global_step": 107298, "epoch": 1292} {"train_loss": -22.236663818359375, "global_step": 107299, "epoch": 1292} {"train_loss": -22.17762565612793, "global_step": 107300, "epoch": 1292} {"train_loss": -22.19775390625, "global_step": 107301, "epoch": 1292} {"train_loss": -22.178653717041016, "global_step": 107302, "epoch": 1292} {"train_loss": -21.92677116394043, "global_step": 107303, "epoch": 1292} {"train_loss": -22.05280876159668, "global_step": 107304, "epoch": 1292} {"train_loss": -22.172718048095703, "global_step": 107305, "epoch": 1292} {"train_loss": -21.88466453552246, "global_step": 107306, "epoch": 1292} {"train_loss": -22.200963973999023, "global_step": 107307, "epoch": 1292} {"train_loss": -22.180387496948242, "global_step": 107308, "epoch": 1292} {"train_loss": -22.11454200744629, "global_step": 107309, "epoch": 1292} {"train_loss": -21.868741989135742, "global_step": 107310, "epoch": 1292} {"train_loss": -22.041086196899414, "global_step": 107311, "epoch": 1292} {"train_loss": -21.877851486206055, "global_step": 107312, "epoch": 1292} {"train_loss": -22.324750900268555, "global_step": 107313, "epoch": 1292} {"train_loss": -22.310871124267578, "global_step": 107314, "epoch": 1292} {"train_loss": -22.484785079956055, "global_step": 107315, "epoch": 1292} {"train_loss": -22.11638069152832, "global_step": 107316, "epoch": 1292} {"train_loss": -22.172794342041016, "global_step": 107317, "epoch": 1292} {"train_loss": -22.106507289840515, "global_step": 107318, "epoch": 1292, "val_loss": 5971125.5} {"train_loss": -22.3664608001709, "global_step": 107319, "epoch": 1293} {"train_loss": -22.07282829284668, "global_step": 107320, "epoch": 1293} {"train_loss": -21.929410934448242, "global_step": 107321, "epoch": 1293} {"train_loss": -22.0112361907959, "global_step": 107322, "epoch": 1293} {"train_loss": -21.72017478942871, "global_step": 107323, "epoch": 1293} {"train_loss": -21.858428955078125, "global_step": 107324, "epoch": 1293} {"train_loss": -22.31625747680664, "global_step": 107325, "epoch": 1293} {"train_loss": -22.25155258178711, "global_step": 107326, "epoch": 1293} {"train_loss": -22.10438346862793, "global_step": 107327, "epoch": 1293} {"train_loss": -22.355249404907227, "global_step": 107328, "epoch": 1293} {"train_loss": -21.757709503173828, "global_step": 107329, "epoch": 1293} {"train_loss": -22.161226272583008, "global_step": 107330, "epoch": 1293} {"train_loss": -22.090219497680664, "global_step": 107331, "epoch": 1293} {"train_loss": -22.32244300842285, "global_step": 107332, "epoch": 1293} {"train_loss": -22.023069381713867, "global_step": 107333, "epoch": 1293} {"train_loss": -22.11997413635254, "global_step": 107334, "epoch": 1293} {"train_loss": -22.286270141601562, "global_step": 107335, "epoch": 1293} {"train_loss": -22.108251571655273, "global_step": 107336, "epoch": 1293} {"train_loss": -22.150421142578125, "global_step": 107337, "epoch": 1293} {"train_loss": -22.18292999267578, "global_step": 107338, "epoch": 1293} {"train_loss": -22.602619171142578, "global_step": 107339, "epoch": 1293} {"train_loss": -22.30317497253418, "global_step": 107340, "epoch": 1293} {"train_loss": -21.970102310180664, "global_step": 107341, "epoch": 1293} {"train_loss": -22.12914276123047, "global_step": 107342, "epoch": 1293} {"train_loss": -22.27435302734375, "global_step": 107343, "epoch": 1293} {"train_loss": -22.405181884765625, "global_step": 107344, "epoch": 1293} {"train_loss": -22.07513427734375, "global_step": 107345, "epoch": 1293} {"train_loss": -22.14980125427246, "global_step": 107346, "epoch": 1293} {"train_loss": -22.289630889892578, "global_step": 107347, "epoch": 1293} {"train_loss": -22.806241989135742, "global_step": 107348, "epoch": 1293} {"train_loss": -22.298587799072266, "global_step": 107349, "epoch": 1293} {"train_loss": -22.093725204467773, "global_step": 107350, "epoch": 1293} {"train_loss": -22.187885284423828, "global_step": 107351, "epoch": 1293} {"train_loss": -22.405563354492188, "global_step": 107352, "epoch": 1293} {"train_loss": -22.056381225585938, "global_step": 107353, "epoch": 1293} {"train_loss": -22.148099899291992, "global_step": 107354, "epoch": 1293} {"train_loss": -22.323698043823242, "global_step": 107355, "epoch": 1293} {"train_loss": -22.193058013916016, "global_step": 107356, "epoch": 1293} {"train_loss": -22.192630767822266, "global_step": 107357, "epoch": 1293} {"train_loss": -22.153162002563477, "global_step": 107358, "epoch": 1293} {"train_loss": -22.54794692993164, "global_step": 107359, "epoch": 1293} {"train_loss": -22.343698501586914, "global_step": 107360, "epoch": 1293} {"train_loss": -22.19929313659668, "global_step": 107361, "epoch": 1293} {"train_loss": -22.385940551757812, "global_step": 107362, "epoch": 1293} {"train_loss": -21.81288719177246, "global_step": 107363, "epoch": 1293} {"train_loss": -22.153156280517578, "global_step": 107364, "epoch": 1293} {"train_loss": -22.088624954223633, "global_step": 107365, "epoch": 1293} {"train_loss": -22.011533737182617, "global_step": 107366, "epoch": 1293} {"train_loss": -22.206865310668945, "global_step": 107367, "epoch": 1293} {"train_loss": -21.929441452026367, "global_step": 107368, "epoch": 1293} {"train_loss": -21.774370193481445, "global_step": 107369, "epoch": 1293} {"train_loss": -22.292129516601562, "global_step": 107370, "epoch": 1293} {"train_loss": -22.156354904174805, "global_step": 107371, "epoch": 1293} {"train_loss": -22.08809471130371, "global_step": 107372, "epoch": 1293} {"train_loss": -22.284666061401367, "global_step": 107373, "epoch": 1293} {"train_loss": -22.227005004882812, "global_step": 107374, "epoch": 1293} {"train_loss": -22.107473373413086, "global_step": 107375, "epoch": 1293} {"train_loss": -21.984027862548828, "global_step": 107376, "epoch": 1293} {"train_loss": -22.100126266479492, "global_step": 107377, "epoch": 1293} {"train_loss": -22.209714889526367, "global_step": 107378, "epoch": 1293} {"train_loss": -22.373397827148438, "global_step": 107379, "epoch": 1293} {"train_loss": -21.96779441833496, "global_step": 107380, "epoch": 1293} {"train_loss": -21.859952926635742, "global_step": 107381, "epoch": 1293} {"train_loss": -22.223047256469727, "global_step": 107382, "epoch": 1293} {"train_loss": -22.098539352416992, "global_step": 107383, "epoch": 1293} {"train_loss": -22.077533721923828, "global_step": 107384, "epoch": 1293} {"train_loss": -21.998239517211914, "global_step": 107385, "epoch": 1293} {"train_loss": -22.004173278808594, "global_step": 107386, "epoch": 1293} {"train_loss": -21.9549617767334, "global_step": 107387, "epoch": 1293} {"train_loss": -21.964536666870117, "global_step": 107388, "epoch": 1293} {"train_loss": -22.037878036499023, "global_step": 107389, "epoch": 1293} {"train_loss": -22.045780181884766, "global_step": 107390, "epoch": 1293} {"train_loss": -21.881086349487305, "global_step": 107391, "epoch": 1293} {"train_loss": -22.007781982421875, "global_step": 107392, "epoch": 1293} {"train_loss": -22.10578727722168, "global_step": 107393, "epoch": 1293} {"train_loss": -22.00459861755371, "global_step": 107394, "epoch": 1293} {"train_loss": -22.3474178314209, "global_step": 107395, "epoch": 1293} {"train_loss": -22.42234230041504, "global_step": 107396, "epoch": 1293} {"train_loss": -22.315832138061523, "global_step": 107397, "epoch": 1293} {"train_loss": -22.083005905151367, "global_step": 107398, "epoch": 1293} {"train_loss": -22.160932540893555, "global_step": 107399, "epoch": 1293} {"train_loss": -22.1938533782959, "global_step": 107400, "epoch": 1293} {"train_loss": -22.169042380459338, "global_step": 107401, "epoch": 1293, "val_loss": 6139361.0} {"train_loss": -21.369869232177734, "global_step": 107402, "epoch": 1294} {"train_loss": -21.4172420501709, "global_step": 107403, "epoch": 1294} {"train_loss": -21.571027755737305, "global_step": 107404, "epoch": 1294} {"train_loss": -21.948776245117188, "global_step": 107405, "epoch": 1294} {"train_loss": -21.493568420410156, "global_step": 107406, "epoch": 1294} {"train_loss": -21.936786651611328, "global_step": 107407, "epoch": 1294} {"train_loss": -22.55018424987793, "global_step": 107408, "epoch": 1294} {"train_loss": -21.89288902282715, "global_step": 107409, "epoch": 1294} {"train_loss": -22.120712280273438, "global_step": 107410, "epoch": 1294} {"train_loss": -21.767349243164062, "global_step": 107411, "epoch": 1294} {"train_loss": -21.812036514282227, "global_step": 107412, "epoch": 1294} {"train_loss": -22.297178268432617, "global_step": 107413, "epoch": 1294} {"train_loss": -21.838254928588867, "global_step": 107414, "epoch": 1294} {"train_loss": -22.481603622436523, "global_step": 107415, "epoch": 1294} {"train_loss": -21.83315086364746, "global_step": 107416, "epoch": 1294} {"train_loss": -22.372121810913086, "global_step": 107417, "epoch": 1294} {"train_loss": -22.019529342651367, "global_step": 107418, "epoch": 1294} {"train_loss": -22.390361785888672, "global_step": 107419, "epoch": 1294} {"train_loss": -21.695220947265625, "global_step": 107420, "epoch": 1294} {"train_loss": -22.501081466674805, "global_step": 107421, "epoch": 1294} {"train_loss": -21.7898006439209, "global_step": 107422, "epoch": 1294} {"train_loss": -22.215280532836914, "global_step": 107423, "epoch": 1294} {"train_loss": -21.992082595825195, "global_step": 107424, "epoch": 1294} {"train_loss": -21.97561264038086, "global_step": 107425, "epoch": 1294} {"train_loss": -22.326597213745117, "global_step": 107426, "epoch": 1294} {"train_loss": -22.26480484008789, "global_step": 107427, "epoch": 1294} {"train_loss": -22.279361724853516, "global_step": 107428, "epoch": 1294} {"train_loss": -22.49625587463379, "global_step": 107429, "epoch": 1294} {"train_loss": -21.933837890625, "global_step": 107430, "epoch": 1294} {"train_loss": -22.091934204101562, "global_step": 107431, "epoch": 1294} {"train_loss": -22.22356414794922, "global_step": 107432, "epoch": 1294} {"train_loss": -21.924448013305664, "global_step": 107433, "epoch": 1294} {"train_loss": -22.156015396118164, "global_step": 107434, "epoch": 1294} {"train_loss": -22.06935691833496, "global_step": 107435, "epoch": 1294} {"train_loss": -22.158954620361328, "global_step": 107436, "epoch": 1294} {"train_loss": -22.220233917236328, "global_step": 107437, "epoch": 1294} {"train_loss": -22.150012969970703, "global_step": 107438, "epoch": 1294} {"train_loss": -22.351303100585938, "global_step": 107439, "epoch": 1294} {"train_loss": -22.18793296813965, "global_step": 107440, "epoch": 1294} {"train_loss": -22.426401138305664, "global_step": 107441, "epoch": 1294} {"train_loss": -22.3349666595459, "global_step": 107442, "epoch": 1294} {"train_loss": -22.10986328125, "global_step": 107443, "epoch": 1294} {"train_loss": -22.21233367919922, "global_step": 107444, "epoch": 1294} {"train_loss": -22.221948623657227, "global_step": 107445, "epoch": 1294} {"train_loss": -22.231597900390625, "global_step": 107446, "epoch": 1294} {"train_loss": -22.34654998779297, "global_step": 107447, "epoch": 1294} {"train_loss": -21.806901931762695, "global_step": 107448, "epoch": 1294} {"train_loss": -22.157209396362305, "global_step": 107449, "epoch": 1294} {"train_loss": -22.387514114379883, "global_step": 107450, "epoch": 1294} {"train_loss": -22.187101364135742, "global_step": 107451, "epoch": 1294} {"train_loss": -22.28645896911621, "global_step": 107452, "epoch": 1294} {"train_loss": -22.119932174682617, "global_step": 107453, "epoch": 1294} {"train_loss": -22.045862197875977, "global_step": 107454, "epoch": 1294} {"train_loss": -21.898160934448242, "global_step": 107455, "epoch": 1294} {"train_loss": -22.032127380371094, "global_step": 107456, "epoch": 1294} {"train_loss": -22.38979148864746, "global_step": 107457, "epoch": 1294} {"train_loss": -22.10542106628418, "global_step": 107458, "epoch": 1294} {"train_loss": -22.353275299072266, "global_step": 107459, "epoch": 1294} {"train_loss": -21.874605178833008, "global_step": 107460, "epoch": 1294} {"train_loss": -21.80679702758789, "global_step": 107461, "epoch": 1294} {"train_loss": -22.439476013183594, "global_step": 107462, "epoch": 1294} {"train_loss": -22.25897216796875, "global_step": 107463, "epoch": 1294} {"train_loss": -22.34750747680664, "global_step": 107464, "epoch": 1294} {"train_loss": -21.95264434814453, "global_step": 107465, "epoch": 1294} {"train_loss": -22.329328536987305, "global_step": 107466, "epoch": 1294} {"train_loss": -22.006378173828125, "global_step": 107467, "epoch": 1294} {"train_loss": -22.375722885131836, "global_step": 107468, "epoch": 1294} {"train_loss": -22.00135040283203, "global_step": 107469, "epoch": 1294} {"train_loss": -22.447832107543945, "global_step": 107470, "epoch": 1294} {"train_loss": -22.016584396362305, "global_step": 107471, "epoch": 1294} {"train_loss": -22.123003005981445, "global_step": 107472, "epoch": 1294} {"train_loss": -22.4208984375, "global_step": 107473, "epoch": 1294} {"train_loss": -21.837100982666016, "global_step": 107474, "epoch": 1294} {"train_loss": -22.221803665161133, "global_step": 107475, "epoch": 1294} {"train_loss": -22.053537368774414, "global_step": 107476, "epoch": 1294} {"train_loss": -22.237119674682617, "global_step": 107477, "epoch": 1294} {"train_loss": -21.996444702148438, "global_step": 107478, "epoch": 1294} {"train_loss": -21.90478515625, "global_step": 107479, "epoch": 1294} {"train_loss": -22.620515823364258, "global_step": 107480, "epoch": 1294} {"train_loss": -22.014446258544922, "global_step": 107481, "epoch": 1294} {"train_loss": -22.307126998901367, "global_step": 107482, "epoch": 1294} {"train_loss": -22.178985595703125, "global_step": 107483, "epoch": 1294} {"train_loss": -22.125538814498718, "global_step": 107484, "epoch": 1294, "val_loss": 6351074.5} {"train_loss": -21.724790573120117, "global_step": 107485, "epoch": 1295} {"train_loss": -21.334392547607422, "global_step": 107486, "epoch": 1295} {"train_loss": -21.027843475341797, "global_step": 107487, "epoch": 1295} {"train_loss": -22.031457901000977, "global_step": 107488, "epoch": 1295} {"train_loss": -21.98357391357422, "global_step": 107489, "epoch": 1295} {"train_loss": -21.39594841003418, "global_step": 107490, "epoch": 1295} {"train_loss": -21.95700454711914, "global_step": 107491, "epoch": 1295} {"train_loss": -21.616836547851562, "global_step": 107492, "epoch": 1295} {"train_loss": -21.528074264526367, "global_step": 107493, "epoch": 1295} {"train_loss": -21.939258575439453, "global_step": 107494, "epoch": 1295} {"train_loss": -22.151691436767578, "global_step": 107495, "epoch": 1295} {"train_loss": -22.287487030029297, "global_step": 107496, "epoch": 1295} {"train_loss": -21.8790340423584, "global_step": 107497, "epoch": 1295} {"train_loss": -21.832778930664062, "global_step": 107498, "epoch": 1295} {"train_loss": -22.343860626220703, "global_step": 107499, "epoch": 1295} {"train_loss": -22.24306869506836, "global_step": 107500, "epoch": 1295} {"train_loss": -21.717016220092773, "global_step": 107501, "epoch": 1295} {"train_loss": -22.384775161743164, "global_step": 107502, "epoch": 1295} {"train_loss": -21.993999481201172, "global_step": 107503, "epoch": 1295} {"train_loss": -22.255422592163086, "global_step": 107504, "epoch": 1295} {"train_loss": -21.9283390045166, "global_step": 107505, "epoch": 1295} {"train_loss": -22.24628257751465, "global_step": 107506, "epoch": 1295} {"train_loss": -21.6351375579834, "global_step": 107507, "epoch": 1295} {"train_loss": -22.23233413696289, "global_step": 107508, "epoch": 1295} {"train_loss": -21.98487663269043, "global_step": 107509, "epoch": 1295} {"train_loss": -22.31230354309082, "global_step": 107510, "epoch": 1295} {"train_loss": -22.284034729003906, "global_step": 107511, "epoch": 1295} {"train_loss": -22.032386779785156, "global_step": 107512, "epoch": 1295} {"train_loss": -22.380006790161133, "global_step": 107513, "epoch": 1295} {"train_loss": -21.538679122924805, "global_step": 107514, "epoch": 1295} {"train_loss": -21.841894149780273, "global_step": 107515, "epoch": 1295} {"train_loss": -22.334369659423828, "global_step": 107516, "epoch": 1295} {"train_loss": -22.235565185546875, "global_step": 107517, "epoch": 1295} {"train_loss": -22.100709915161133, "global_step": 107518, "epoch": 1295} {"train_loss": -22.12208366394043, "global_step": 107519, "epoch": 1295} {"train_loss": -22.309921264648438, "global_step": 107520, "epoch": 1295} {"train_loss": -21.893465042114258, "global_step": 107521, "epoch": 1295} {"train_loss": -22.125019073486328, "global_step": 107522, "epoch": 1295} {"train_loss": -21.977563858032227, "global_step": 107523, "epoch": 1295} {"train_loss": -22.408140182495117, "global_step": 107524, "epoch": 1295} {"train_loss": -22.10163688659668, "global_step": 107525, "epoch": 1295} {"train_loss": -22.539033889770508, "global_step": 107526, "epoch": 1295} {"train_loss": -22.183053970336914, "global_step": 107527, "epoch": 1295} {"train_loss": -22.163381576538086, "global_step": 107528, "epoch": 1295} {"train_loss": -21.94293212890625, "global_step": 107529, "epoch": 1295} {"train_loss": -22.627500534057617, "global_step": 107530, "epoch": 1295} {"train_loss": -22.197311401367188, "global_step": 107531, "epoch": 1295} {"train_loss": -22.307161331176758, "global_step": 107532, "epoch": 1295} {"train_loss": -22.195974349975586, "global_step": 107533, "epoch": 1295} {"train_loss": -22.149784088134766, "global_step": 107534, "epoch": 1295} {"train_loss": -22.382104873657227, "global_step": 107535, "epoch": 1295} {"train_loss": -22.41751480102539, "global_step": 107536, "epoch": 1295} {"train_loss": -21.97509002685547, "global_step": 107537, "epoch": 1295} {"train_loss": -22.467594146728516, "global_step": 107538, "epoch": 1295} {"train_loss": -22.234708786010742, "global_step": 107539, "epoch": 1295} {"train_loss": -22.18558120727539, "global_step": 107540, "epoch": 1295} {"train_loss": -21.89345359802246, "global_step": 107541, "epoch": 1295} {"train_loss": -22.31325340270996, "global_step": 107542, "epoch": 1295} {"train_loss": -22.3345890045166, "global_step": 107543, "epoch": 1295} {"train_loss": -22.36074447631836, "global_step": 107544, "epoch": 1295} {"train_loss": -22.19955062866211, "global_step": 107545, "epoch": 1295} {"train_loss": -22.293394088745117, "global_step": 107546, "epoch": 1295} {"train_loss": -22.231992721557617, "global_step": 107547, "epoch": 1295} {"train_loss": -22.16359519958496, "global_step": 107548, "epoch": 1295} {"train_loss": -22.31781005859375, "global_step": 107549, "epoch": 1295} {"train_loss": -22.407262802124023, "global_step": 107550, "epoch": 1295} {"train_loss": -22.088088989257812, "global_step": 107551, "epoch": 1295} {"train_loss": -22.086820602416992, "global_step": 107552, "epoch": 1295} {"train_loss": -22.337326049804688, "global_step": 107553, "epoch": 1295} {"train_loss": -22.14360237121582, "global_step": 107554, "epoch": 1295} {"train_loss": -22.186498641967773, "global_step": 107555, "epoch": 1295} {"train_loss": -22.195772171020508, "global_step": 107556, "epoch": 1295} {"train_loss": -22.302566528320312, "global_step": 107557, "epoch": 1295} {"train_loss": -22.064224243164062, "global_step": 107558, "epoch": 1295} {"train_loss": -22.34309959411621, "global_step": 107559, "epoch": 1295} {"train_loss": -22.092527389526367, "global_step": 107560, "epoch": 1295} {"train_loss": -21.85517692565918, "global_step": 107561, "epoch": 1295} {"train_loss": -22.053787231445312, "global_step": 107562, "epoch": 1295} {"train_loss": -22.216825485229492, "global_step": 107563, "epoch": 1295} {"train_loss": -22.09333610534668, "global_step": 107564, "epoch": 1295} {"train_loss": -21.804813385009766, "global_step": 107565, "epoch": 1295} {"train_loss": -22.30535125732422, "global_step": 107566, "epoch": 1295} {"train_loss": -22.11583601710308, "global_step": 107567, "epoch": 1295, "val_loss": 6124313.5} {"train_loss": -21.772459030151367, "global_step": 107568, "epoch": 1296} {"train_loss": -21.82927131652832, "global_step": 107569, "epoch": 1296} {"train_loss": -22.21976661682129, "global_step": 107570, "epoch": 1296} {"train_loss": -21.78653335571289, "global_step": 107571, "epoch": 1296} {"train_loss": -22.03435707092285, "global_step": 107572, "epoch": 1296} {"train_loss": -21.816518783569336, "global_step": 107573, "epoch": 1296} {"train_loss": -21.833267211914062, "global_step": 107574, "epoch": 1296} {"train_loss": -21.885053634643555, "global_step": 107575, "epoch": 1296} {"train_loss": -22.160852432250977, "global_step": 107576, "epoch": 1296} {"train_loss": -21.947378158569336, "global_step": 107577, "epoch": 1296} {"train_loss": -21.962432861328125, "global_step": 107578, "epoch": 1296} {"train_loss": -22.24372673034668, "global_step": 107579, "epoch": 1296} {"train_loss": -22.30158805847168, "global_step": 107580, "epoch": 1296} {"train_loss": -22.11818504333496, "global_step": 107581, "epoch": 1296} {"train_loss": -21.782855987548828, "global_step": 107582, "epoch": 1296} {"train_loss": -22.129100799560547, "global_step": 107583, "epoch": 1296} {"train_loss": -22.19471549987793, "global_step": 107584, "epoch": 1296} {"train_loss": -22.101755142211914, "global_step": 107585, "epoch": 1296} {"train_loss": -21.9116153717041, "global_step": 107586, "epoch": 1296} {"train_loss": -22.263517379760742, "global_step": 107587, "epoch": 1296} {"train_loss": -21.98968505859375, "global_step": 107588, "epoch": 1296} {"train_loss": -21.601680755615234, "global_step": 107589, "epoch": 1296} {"train_loss": -21.827255249023438, "global_step": 107590, "epoch": 1296} {"train_loss": -21.991979598999023, "global_step": 107591, "epoch": 1296} {"train_loss": -21.8784236907959, "global_step": 107592, "epoch": 1296} {"train_loss": -21.923702239990234, "global_step": 107593, "epoch": 1296} {"train_loss": -22.092151641845703, "global_step": 107594, "epoch": 1296} {"train_loss": -22.454435348510742, "global_step": 107595, "epoch": 1296} {"train_loss": -22.234342575073242, "global_step": 107596, "epoch": 1296} {"train_loss": -22.043216705322266, "global_step": 107597, "epoch": 1296} {"train_loss": -21.894941329956055, "global_step": 107598, "epoch": 1296} {"train_loss": -22.102174758911133, "global_step": 107599, "epoch": 1296} {"train_loss": -21.95052146911621, "global_step": 107600, "epoch": 1296} {"train_loss": -22.33575439453125, "global_step": 107601, "epoch": 1296} {"train_loss": -22.1097469329834, "global_step": 107602, "epoch": 1296} {"train_loss": -22.340770721435547, "global_step": 107603, "epoch": 1296} {"train_loss": -21.96084213256836, "global_step": 107604, "epoch": 1296} {"train_loss": -21.943513870239258, "global_step": 107605, "epoch": 1296} {"train_loss": -22.384347915649414, "global_step": 107606, "epoch": 1296} {"train_loss": -22.339548110961914, "global_step": 107607, "epoch": 1296} {"train_loss": -22.06351661682129, "global_step": 107608, "epoch": 1296} {"train_loss": -21.678449630737305, "global_step": 107609, "epoch": 1296} {"train_loss": -22.392744064331055, "global_step": 107610, "epoch": 1296} {"train_loss": -21.97930908203125, "global_step": 107611, "epoch": 1296} {"train_loss": -22.0249080657959, "global_step": 107612, "epoch": 1296} {"train_loss": -22.448461532592773, "global_step": 107613, "epoch": 1296} {"train_loss": -22.109176635742188, "global_step": 107614, "epoch": 1296} {"train_loss": -22.115327835083008, "global_step": 107615, "epoch": 1296} {"train_loss": -21.980504989624023, "global_step": 107616, "epoch": 1296} {"train_loss": -22.014413833618164, "global_step": 107617, "epoch": 1296} {"train_loss": -22.157939910888672, "global_step": 107618, "epoch": 1296} {"train_loss": -22.483381271362305, "global_step": 107619, "epoch": 1296} {"train_loss": -22.287220001220703, "global_step": 107620, "epoch": 1296} {"train_loss": -21.897451400756836, "global_step": 107621, "epoch": 1296} {"train_loss": -21.979005813598633, "global_step": 107622, "epoch": 1296} {"train_loss": -22.37055778503418, "global_step": 107623, "epoch": 1296} {"train_loss": -21.875471115112305, "global_step": 107624, "epoch": 1296} {"train_loss": -22.451261520385742, "global_step": 107625, "epoch": 1296} {"train_loss": -22.249839782714844, "global_step": 107626, "epoch": 1296} {"train_loss": -21.943220138549805, "global_step": 107627, "epoch": 1296} {"train_loss": -22.03876304626465, "global_step": 107628, "epoch": 1296} {"train_loss": -21.950977325439453, "global_step": 107629, "epoch": 1296} {"train_loss": -21.96575927734375, "global_step": 107630, "epoch": 1296} {"train_loss": -22.673999786376953, "global_step": 107631, "epoch": 1296} {"train_loss": -21.967662811279297, "global_step": 107632, "epoch": 1296} {"train_loss": -22.2808895111084, "global_step": 107633, "epoch": 1296} {"train_loss": -22.128437042236328, "global_step": 107634, "epoch": 1296} {"train_loss": -22.32444190979004, "global_step": 107635, "epoch": 1296} {"train_loss": -22.280487060546875, "global_step": 107636, "epoch": 1296} {"train_loss": -22.4499568939209, "global_step": 107637, "epoch": 1296} {"train_loss": -22.385421752929688, "global_step": 107638, "epoch": 1296} {"train_loss": -22.428829193115234, "global_step": 107639, "epoch": 1296} {"train_loss": -22.57773208618164, "global_step": 107640, "epoch": 1296} {"train_loss": -22.099599838256836, "global_step": 107641, "epoch": 1296} {"train_loss": -22.417531967163086, "global_step": 107642, "epoch": 1296} {"train_loss": -21.893047332763672, "global_step": 107643, "epoch": 1296} {"train_loss": -22.3878173828125, "global_step": 107644, "epoch": 1296} {"train_loss": -22.229473114013672, "global_step": 107645, "epoch": 1296} {"train_loss": -21.891639709472656, "global_step": 107646, "epoch": 1296} {"train_loss": -22.10235595703125, "global_step": 107647, "epoch": 1296} {"train_loss": -22.166662216186523, "global_step": 107648, "epoch": 1296} {"train_loss": -22.64925193786621, "global_step": 107649, "epoch": 1296} {"train_loss": -22.110899247318866, "global_step": 107650, "epoch": 1296, "val_loss": 6071395.5} {"train_loss": -21.999204635620117, "global_step": 107651, "epoch": 1297} {"train_loss": -21.4619140625, "global_step": 107652, "epoch": 1297} {"train_loss": -21.473203659057617, "global_step": 107653, "epoch": 1297} {"train_loss": -21.8424072265625, "global_step": 107654, "epoch": 1297} {"train_loss": -21.427839279174805, "global_step": 107655, "epoch": 1297} {"train_loss": -21.67542266845703, "global_step": 107656, "epoch": 1297} {"train_loss": -21.71603775024414, "global_step": 107657, "epoch": 1297} {"train_loss": -21.816579818725586, "global_step": 107658, "epoch": 1297} {"train_loss": -21.82399559020996, "global_step": 107659, "epoch": 1297} {"train_loss": -22.176471710205078, "global_step": 107660, "epoch": 1297} {"train_loss": -21.626163482666016, "global_step": 107661, "epoch": 1297} {"train_loss": -21.863113403320312, "global_step": 107662, "epoch": 1297} {"train_loss": -22.056432723999023, "global_step": 107663, "epoch": 1297} {"train_loss": -21.707794189453125, "global_step": 107664, "epoch": 1297} {"train_loss": -22.371994018554688, "global_step": 107665, "epoch": 1297} {"train_loss": -21.894868850708008, "global_step": 107666, "epoch": 1297} {"train_loss": -21.947263717651367, "global_step": 107667, "epoch": 1297} {"train_loss": -21.68215560913086, "global_step": 107668, "epoch": 1297} {"train_loss": -22.042387008666992, "global_step": 107669, "epoch": 1297} {"train_loss": -21.831323623657227, "global_step": 107670, "epoch": 1297} {"train_loss": -22.1532039642334, "global_step": 107671, "epoch": 1297} {"train_loss": -21.94639015197754, "global_step": 107672, "epoch": 1297} {"train_loss": -21.79395866394043, "global_step": 107673, "epoch": 1297} {"train_loss": -22.289127349853516, "global_step": 107674, "epoch": 1297} {"train_loss": -21.94900894165039, "global_step": 107675, "epoch": 1297} {"train_loss": -22.016881942749023, "global_step": 107676, "epoch": 1297} {"train_loss": -22.240327835083008, "global_step": 107677, "epoch": 1297} {"train_loss": -22.001773834228516, "global_step": 107678, "epoch": 1297} {"train_loss": -22.036331176757812, "global_step": 107679, "epoch": 1297} {"train_loss": -21.95264434814453, "global_step": 107680, "epoch": 1297} {"train_loss": -21.83632469177246, "global_step": 107681, "epoch": 1297} {"train_loss": -22.263517379760742, "global_step": 107682, "epoch": 1297} {"train_loss": -22.49338150024414, "global_step": 107683, "epoch": 1297} {"train_loss": -22.788938522338867, "global_step": 107684, "epoch": 1297} {"train_loss": -21.67448616027832, "global_step": 107685, "epoch": 1297} {"train_loss": -22.45688819885254, "global_step": 107686, "epoch": 1297} {"train_loss": -22.224084854125977, "global_step": 107687, "epoch": 1297} {"train_loss": -22.206647872924805, "global_step": 107688, "epoch": 1297} {"train_loss": -21.601285934448242, "global_step": 107689, "epoch": 1297} {"train_loss": -21.949838638305664, "global_step": 107690, "epoch": 1297} {"train_loss": -21.93950080871582, "global_step": 107691, "epoch": 1297} {"train_loss": -22.089365005493164, "global_step": 107692, "epoch": 1297} {"train_loss": -22.196012496948242, "global_step": 107693, "epoch": 1297} {"train_loss": -21.701351165771484, "global_step": 107694, "epoch": 1297} {"train_loss": -21.673526763916016, "global_step": 107695, "epoch": 1297} {"train_loss": -21.95509910583496, "global_step": 107696, "epoch": 1297} {"train_loss": -21.983068466186523, "global_step": 107697, "epoch": 1297} {"train_loss": -21.894445419311523, "global_step": 107698, "epoch": 1297} {"train_loss": -21.838716506958008, "global_step": 107699, "epoch": 1297} {"train_loss": -22.310535430908203, "global_step": 107700, "epoch": 1297} {"train_loss": -21.966705322265625, "global_step": 107701, "epoch": 1297} {"train_loss": -22.1146240234375, "global_step": 107702, "epoch": 1297} {"train_loss": -22.52722930908203, "global_step": 107703, "epoch": 1297} {"train_loss": -22.043807983398438, "global_step": 107704, "epoch": 1297} {"train_loss": -21.91900062561035, "global_step": 107705, "epoch": 1297} {"train_loss": -22.06663703918457, "global_step": 107706, "epoch": 1297} {"train_loss": -22.040563583374023, "global_step": 107707, "epoch": 1297} {"train_loss": -22.147558212280273, "global_step": 107708, "epoch": 1297} {"train_loss": -22.025541305541992, "global_step": 107709, "epoch": 1297} {"train_loss": -22.002513885498047, "global_step": 107710, "epoch": 1297} {"train_loss": -21.969257354736328, "global_step": 107711, "epoch": 1297} {"train_loss": -22.268117904663086, "global_step": 107712, "epoch": 1297} {"train_loss": -21.730289459228516, "global_step": 107713, "epoch": 1297} {"train_loss": -21.963520050048828, "global_step": 107714, "epoch": 1297} {"train_loss": -22.207502365112305, "global_step": 107715, "epoch": 1297} {"train_loss": -22.00052833557129, "global_step": 107716, "epoch": 1297} {"train_loss": -22.217945098876953, "global_step": 107717, "epoch": 1297} {"train_loss": -22.170825958251953, "global_step": 107718, "epoch": 1297} {"train_loss": -22.04432487487793, "global_step": 107719, "epoch": 1297} {"train_loss": -21.876577377319336, "global_step": 107720, "epoch": 1297} {"train_loss": -21.97650718688965, "global_step": 107721, "epoch": 1297} {"train_loss": -22.042865753173828, "global_step": 107722, "epoch": 1297} {"train_loss": -22.23316764831543, "global_step": 107723, "epoch": 1297} {"train_loss": -22.553192138671875, "global_step": 107724, "epoch": 1297} {"train_loss": -21.913253784179688, "global_step": 107725, "epoch": 1297} {"train_loss": -22.18840980529785, "global_step": 107726, "epoch": 1297} {"train_loss": -22.580429077148438, "global_step": 107727, "epoch": 1297} {"train_loss": -22.323286056518555, "global_step": 107728, "epoch": 1297} {"train_loss": -22.341848373413086, "global_step": 107729, "epoch": 1297} {"train_loss": -22.228315353393555, "global_step": 107730, "epoch": 1297} {"train_loss": -22.0888729095459, "global_step": 107731, "epoch": 1297} {"train_loss": -22.148571014404297, "global_step": 107732, "epoch": 1297} {"train_loss": -22.018184432064196, "global_step": 107733, "epoch": 1297, "val_loss": 6182275.5} {"train_loss": -21.646804809570312, "global_step": 107734, "epoch": 1298} {"train_loss": -21.914098739624023, "global_step": 107735, "epoch": 1298} {"train_loss": -22.028766632080078, "global_step": 107736, "epoch": 1298} {"train_loss": -21.967605590820312, "global_step": 107737, "epoch": 1298} {"train_loss": -21.838397979736328, "global_step": 107738, "epoch": 1298} {"train_loss": -22.034650802612305, "global_step": 107739, "epoch": 1298} {"train_loss": -22.07636070251465, "global_step": 107740, "epoch": 1298} {"train_loss": -21.475753784179688, "global_step": 107741, "epoch": 1298} {"train_loss": -22.05517578125, "global_step": 107742, "epoch": 1298} {"train_loss": -22.204408645629883, "global_step": 107743, "epoch": 1298} {"train_loss": -21.6986141204834, "global_step": 107744, "epoch": 1298} {"train_loss": -22.149213790893555, "global_step": 107745, "epoch": 1298} {"train_loss": -22.139841079711914, "global_step": 107746, "epoch": 1298} {"train_loss": -21.90362548828125, "global_step": 107747, "epoch": 1298} {"train_loss": -21.573415756225586, "global_step": 107748, "epoch": 1298} {"train_loss": -22.045686721801758, "global_step": 107749, "epoch": 1298} {"train_loss": -22.051633834838867, "global_step": 107750, "epoch": 1298} {"train_loss": -21.8873348236084, "global_step": 107751, "epoch": 1298} {"train_loss": -22.047842025756836, "global_step": 107752, "epoch": 1298} {"train_loss": -22.077880859375, "global_step": 107753, "epoch": 1298} {"train_loss": -21.877222061157227, "global_step": 107754, "epoch": 1298} {"train_loss": -22.097105026245117, "global_step": 107755, "epoch": 1298} {"train_loss": -22.02158546447754, "global_step": 107756, "epoch": 1298} {"train_loss": -21.691913604736328, "global_step": 107757, "epoch": 1298} {"train_loss": -22.076690673828125, "global_step": 107758, "epoch": 1298} {"train_loss": -22.09442710876465, "global_step": 107759, "epoch": 1298} {"train_loss": -22.159950256347656, "global_step": 107760, "epoch": 1298} {"train_loss": -22.3179988861084, "global_step": 107761, "epoch": 1298} {"train_loss": -22.15607261657715, "global_step": 107762, "epoch": 1298} {"train_loss": -21.994159698486328, "global_step": 107763, "epoch": 1298} {"train_loss": -22.567834854125977, "global_step": 107764, "epoch": 1298} {"train_loss": -22.157743453979492, "global_step": 107765, "epoch": 1298} {"train_loss": -22.392560958862305, "global_step": 107766, "epoch": 1298} {"train_loss": -22.341793060302734, "global_step": 107767, "epoch": 1298} {"train_loss": -22.05242347717285, "global_step": 107768, "epoch": 1298} {"train_loss": -22.153982162475586, "global_step": 107769, "epoch": 1298} {"train_loss": -21.949792861938477, "global_step": 107770, "epoch": 1298} {"train_loss": -22.0982608795166, "global_step": 107771, "epoch": 1298} {"train_loss": -22.197673797607422, "global_step": 107772, "epoch": 1298} {"train_loss": -22.298477172851562, "global_step": 107773, "epoch": 1298} {"train_loss": -22.365320205688477, "global_step": 107774, "epoch": 1298} {"train_loss": -22.087182998657227, "global_step": 107775, "epoch": 1298} {"train_loss": -22.23200798034668, "global_step": 107776, "epoch": 1298} {"train_loss": -22.47225570678711, "global_step": 107777, "epoch": 1298} {"train_loss": -22.21278953552246, "global_step": 107778, "epoch": 1298} {"train_loss": -21.89451026916504, "global_step": 107779, "epoch": 1298} {"train_loss": -21.98988914489746, "global_step": 107780, "epoch": 1298} {"train_loss": -22.359886169433594, "global_step": 107781, "epoch": 1298} {"train_loss": -22.238798141479492, "global_step": 107782, "epoch": 1298} {"train_loss": -22.22336769104004, "global_step": 107783, "epoch": 1298} {"train_loss": -22.006608963012695, "global_step": 107784, "epoch": 1298} {"train_loss": -22.617055892944336, "global_step": 107785, "epoch": 1298} {"train_loss": -21.85706901550293, "global_step": 107786, "epoch": 1298} {"train_loss": -22.062868118286133, "global_step": 107787, "epoch": 1298} {"train_loss": -22.50020408630371, "global_step": 107788, "epoch": 1298} {"train_loss": -21.681005477905273, "global_step": 107789, "epoch": 1298} {"train_loss": -22.087875366210938, "global_step": 107790, "epoch": 1298} {"train_loss": -22.672407150268555, "global_step": 107791, "epoch": 1298} {"train_loss": -22.288894653320312, "global_step": 107792, "epoch": 1298} {"train_loss": -21.454015731811523, "global_step": 107793, "epoch": 1298} {"train_loss": -21.837635040283203, "global_step": 107794, "epoch": 1298} {"train_loss": -21.95222282409668, "global_step": 107795, "epoch": 1298} {"train_loss": -22.008438110351562, "global_step": 107796, "epoch": 1298} {"train_loss": -22.135787963867188, "global_step": 107797, "epoch": 1298} {"train_loss": -22.024179458618164, "global_step": 107798, "epoch": 1298} {"train_loss": -21.671751022338867, "global_step": 107799, "epoch": 1298} {"train_loss": -21.799264907836914, "global_step": 107800, "epoch": 1298} {"train_loss": -22.32813835144043, "global_step": 107801, "epoch": 1298} {"train_loss": -22.162662506103516, "global_step": 107802, "epoch": 1298} {"train_loss": -21.860715866088867, "global_step": 107803, "epoch": 1298} {"train_loss": -21.91596031188965, "global_step": 107804, "epoch": 1298} {"train_loss": -22.16615867614746, "global_step": 107805, "epoch": 1298} {"train_loss": -22.20254898071289, "global_step": 107806, "epoch": 1298} {"train_loss": -22.19989585876465, "global_step": 107807, "epoch": 1298} {"train_loss": -22.379657745361328, "global_step": 107808, "epoch": 1298} {"train_loss": -21.836130142211914, "global_step": 107809, "epoch": 1298} {"train_loss": -22.586776733398438, "global_step": 107810, "epoch": 1298} {"train_loss": -21.7069034576416, "global_step": 107811, "epoch": 1298} {"train_loss": -22.15928077697754, "global_step": 107812, "epoch": 1298} {"train_loss": -22.18242835998535, "global_step": 107813, "epoch": 1298} {"train_loss": -22.0819034576416, "global_step": 107814, "epoch": 1298} {"train_loss": -22.052661895751953, "global_step": 107815, "epoch": 1298} {"train_loss": -22.088277839752564, "global_step": 107816, "epoch": 1298, "val_loss": 6110951.0} {"train_loss": -21.418476104736328, "global_step": 107817, "epoch": 1299} {"train_loss": -21.697803497314453, "global_step": 107818, "epoch": 1299} {"train_loss": -22.013629913330078, "global_step": 107819, "epoch": 1299} {"train_loss": -22.059167861938477, "global_step": 107820, "epoch": 1299} {"train_loss": -21.76357650756836, "global_step": 107821, "epoch": 1299} {"train_loss": -21.83559799194336, "global_step": 107822, "epoch": 1299} {"train_loss": -22.266965866088867, "global_step": 107823, "epoch": 1299} {"train_loss": -21.86326026916504, "global_step": 107824, "epoch": 1299} {"train_loss": -22.07069969177246, "global_step": 107825, "epoch": 1299} {"train_loss": -21.79302978515625, "global_step": 107826, "epoch": 1299} {"train_loss": -21.61469268798828, "global_step": 107827, "epoch": 1299} {"train_loss": -21.921817779541016, "global_step": 107828, "epoch": 1299} {"train_loss": -21.98823356628418, "global_step": 107829, "epoch": 1299} {"train_loss": -21.751577377319336, "global_step": 107830, "epoch": 1299} {"train_loss": -21.898101806640625, "global_step": 107831, "epoch": 1299} {"train_loss": -22.17452049255371, "global_step": 107832, "epoch": 1299} {"train_loss": -21.69367027282715, "global_step": 107833, "epoch": 1299} {"train_loss": -22.140249252319336, "global_step": 107834, "epoch": 1299} {"train_loss": -21.8795223236084, "global_step": 107835, "epoch": 1299} {"train_loss": -22.429615020751953, "global_step": 107836, "epoch": 1299} {"train_loss": -22.134201049804688, "global_step": 107837, "epoch": 1299} {"train_loss": -22.099538803100586, "global_step": 107838, "epoch": 1299} {"train_loss": -22.052457809448242, "global_step": 107839, "epoch": 1299} {"train_loss": -22.094724655151367, "global_step": 107840, "epoch": 1299} {"train_loss": -21.86773681640625, "global_step": 107841, "epoch": 1299} {"train_loss": -22.290760040283203, "global_step": 107842, "epoch": 1299} {"train_loss": -21.77105712890625, "global_step": 107843, "epoch": 1299} {"train_loss": -21.795690536499023, "global_step": 107844, "epoch": 1299} {"train_loss": -22.247726440429688, "global_step": 107845, "epoch": 1299} {"train_loss": -22.123855590820312, "global_step": 107846, "epoch": 1299} {"train_loss": -22.273670196533203, "global_step": 107847, "epoch": 1299} {"train_loss": -21.92681884765625, "global_step": 107848, "epoch": 1299} {"train_loss": -22.046842575073242, "global_step": 107849, "epoch": 1299} {"train_loss": -22.305103302001953, "global_step": 107850, "epoch": 1299} {"train_loss": -22.189550399780273, "global_step": 107851, "epoch": 1299} {"train_loss": -22.159719467163086, "global_step": 107852, "epoch": 1299} {"train_loss": -21.981172561645508, "global_step": 107853, "epoch": 1299} {"train_loss": -22.211977005004883, "global_step": 107854, "epoch": 1299} {"train_loss": -22.1506290435791, "global_step": 107855, "epoch": 1299} {"train_loss": -22.377897262573242, "global_step": 107856, "epoch": 1299} {"train_loss": -22.2077693939209, "global_step": 107857, "epoch": 1299} {"train_loss": -22.1860294342041, "global_step": 107858, "epoch": 1299} {"train_loss": -21.983049392700195, "global_step": 107859, "epoch": 1299} {"train_loss": -22.19049835205078, "global_step": 107860, "epoch": 1299} {"train_loss": -22.315114974975586, "global_step": 107861, "epoch": 1299} {"train_loss": -21.840282440185547, "global_step": 107862, "epoch": 1299} {"train_loss": -22.04974937438965, "global_step": 107863, "epoch": 1299} {"train_loss": -22.44535255432129, "global_step": 107864, "epoch": 1299} {"train_loss": -21.984819412231445, "global_step": 107865, "epoch": 1299} {"train_loss": -22.090673446655273, "global_step": 107866, "epoch": 1299} {"train_loss": -22.09073257446289, "global_step": 107867, "epoch": 1299} {"train_loss": -22.067707061767578, "global_step": 107868, "epoch": 1299} {"train_loss": -22.386417388916016, "global_step": 107869, "epoch": 1299} {"train_loss": -22.132383346557617, "global_step": 107870, "epoch": 1299} {"train_loss": -21.860523223876953, "global_step": 107871, "epoch": 1299} {"train_loss": -21.91573715209961, "global_step": 107872, "epoch": 1299} {"train_loss": -22.537256240844727, "global_step": 107873, "epoch": 1299} {"train_loss": -22.02528953552246, "global_step": 107874, "epoch": 1299} {"train_loss": -22.11154556274414, "global_step": 107875, "epoch": 1299} {"train_loss": -22.080629348754883, "global_step": 107876, "epoch": 1299} {"train_loss": -22.097030639648438, "global_step": 107877, "epoch": 1299} {"train_loss": -22.50221061706543, "global_step": 107878, "epoch": 1299} {"train_loss": -22.031057357788086, "global_step": 107879, "epoch": 1299} {"train_loss": -22.16517448425293, "global_step": 107880, "epoch": 1299} {"train_loss": -22.245248794555664, "global_step": 107881, "epoch": 1299} {"train_loss": -22.66660499572754, "global_step": 107882, "epoch": 1299} {"train_loss": -21.988361358642578, "global_step": 107883, "epoch": 1299} {"train_loss": -22.086896896362305, "global_step": 107884, "epoch": 1299} {"train_loss": -22.281164169311523, "global_step": 107885, "epoch": 1299} {"train_loss": -22.50791358947754, "global_step": 107886, "epoch": 1299} {"train_loss": -22.463830947875977, "global_step": 107887, "epoch": 1299} {"train_loss": -22.17156982421875, "global_step": 107888, "epoch": 1299} {"train_loss": -21.811460494995117, "global_step": 107889, "epoch": 1299} {"train_loss": -22.314897537231445, "global_step": 107890, "epoch": 1299} {"train_loss": -22.104129791259766, "global_step": 107891, "epoch": 1299} {"train_loss": -21.95120620727539, "global_step": 107892, "epoch": 1299} {"train_loss": -22.03719139099121, "global_step": 107893, "epoch": 1299} {"train_loss": -22.20211410522461, "global_step": 107894, "epoch": 1299} {"train_loss": -22.10327911376953, "global_step": 107895, "epoch": 1299} {"train_loss": -22.083629608154297, "global_step": 107896, "epoch": 1299} {"train_loss": -21.929386138916016, "global_step": 107897, "epoch": 1299} {"train_loss": -22.021482467651367, "global_step": 107898, "epoch": 1299} {"train_loss": -22.076535856867412, "global_step": 107899, "epoch": 1299, "val_loss": 6082566.0} {"train_loss": -21.519132614135742, "global_step": 107900, "epoch": 1300} {"train_loss": -22.354501724243164, "global_step": 107901, "epoch": 1300} {"train_loss": -21.716949462890625, "global_step": 107902, "epoch": 1300} {"train_loss": -21.942052841186523, "global_step": 107903, "epoch": 1300} {"train_loss": -21.878726959228516, "global_step": 107904, "epoch": 1300} {"train_loss": -21.92777442932129, "global_step": 107905, "epoch": 1300} {"train_loss": -21.82765007019043, "global_step": 107906, "epoch": 1300} {"train_loss": -22.331756591796875, "global_step": 107907, "epoch": 1300} {"train_loss": -21.911928176879883, "global_step": 107908, "epoch": 1300} {"train_loss": -22.359716415405273, "global_step": 107909, "epoch": 1300} {"train_loss": -22.840761184692383, "global_step": 107910, "epoch": 1300} {"train_loss": -22.442312240600586, "global_step": 107911, "epoch": 1300} {"train_loss": -22.234777450561523, "global_step": 107912, "epoch": 1300} {"train_loss": -22.564239501953125, "global_step": 107913, "epoch": 1300} {"train_loss": -21.880203247070312, "global_step": 107914, "epoch": 1300} {"train_loss": -22.23178482055664, "global_step": 107915, "epoch": 1300} {"train_loss": -22.301769256591797, "global_step": 107916, "epoch": 1300} {"train_loss": -22.323928833007812, "global_step": 107917, "epoch": 1300} {"train_loss": -22.08934783935547, "global_step": 107918, "epoch": 1300} {"train_loss": -22.527610778808594, "global_step": 107919, "epoch": 1300} {"train_loss": -22.232664108276367, "global_step": 107920, "epoch": 1300} {"train_loss": -21.716445922851562, "global_step": 107921, "epoch": 1300} {"train_loss": -22.165367126464844, "global_step": 107922, "epoch": 1300} {"train_loss": -21.717330932617188, "global_step": 107923, "epoch": 1300} {"train_loss": -22.12824821472168, "global_step": 107924, "epoch": 1300} {"train_loss": -22.200986862182617, "global_step": 107925, "epoch": 1300} {"train_loss": -22.19521141052246, "global_step": 107926, "epoch": 1300} {"train_loss": -22.283376693725586, "global_step": 107927, "epoch": 1300} {"train_loss": -22.296924591064453, "global_step": 107928, "epoch": 1300} {"train_loss": -21.9636173248291, "global_step": 107929, "epoch": 1300} {"train_loss": -22.133832931518555, "global_step": 107930, "epoch": 1300} {"train_loss": -22.08043670654297, "global_step": 107931, "epoch": 1300} {"train_loss": -21.94842529296875, "global_step": 107932, "epoch": 1300} {"train_loss": -22.607572555541992, "global_step": 107933, "epoch": 1300} {"train_loss": -21.942129135131836, "global_step": 107934, "epoch": 1300} {"train_loss": -22.62929916381836, "global_step": 107935, "epoch": 1300} {"train_loss": -22.033971786499023, "global_step": 107936, "epoch": 1300} {"train_loss": -22.29537582397461, "global_step": 107937, "epoch": 1300} {"train_loss": -22.494508743286133, "global_step": 107938, "epoch": 1300} {"train_loss": -22.583301544189453, "global_step": 107939, "epoch": 1300} {"train_loss": -22.022680282592773, "global_step": 107940, "epoch": 1300} {"train_loss": -22.262907028198242, "global_step": 107941, "epoch": 1300} {"train_loss": -22.5851993560791, "global_step": 107942, "epoch": 1300} {"train_loss": -22.02328109741211, "global_step": 107943, "epoch": 1300} {"train_loss": -23.04353141784668, "global_step": 107944, "epoch": 1300} {"train_loss": -22.14373779296875, "global_step": 107945, "epoch": 1300} {"train_loss": -22.282411575317383, "global_step": 107946, "epoch": 1300} {"train_loss": -22.327899932861328, "global_step": 107947, "epoch": 1300} {"train_loss": -21.66823387145996, "global_step": 107948, "epoch": 1300} {"train_loss": -22.151639938354492, "global_step": 107949, "epoch": 1300} {"train_loss": -22.273719787597656, "global_step": 107950, "epoch": 1300} {"train_loss": -22.250263214111328, "global_step": 107951, "epoch": 1300} {"train_loss": -22.325485229492188, "global_step": 107952, "epoch": 1300} {"train_loss": -22.334293365478516, "global_step": 107953, "epoch": 1300} {"train_loss": -22.22074317932129, "global_step": 107954, "epoch": 1300} {"train_loss": -22.378164291381836, "global_step": 107955, "epoch": 1300} {"train_loss": -22.2244930267334, "global_step": 107956, "epoch": 1300} {"train_loss": -22.2951602935791, "global_step": 107957, "epoch": 1300} {"train_loss": -22.24202537536621, "global_step": 107958, "epoch": 1300} {"train_loss": -22.286949157714844, "global_step": 107959, "epoch": 1300} {"train_loss": -22.17120361328125, "global_step": 107960, "epoch": 1300} {"train_loss": -22.01392936706543, "global_step": 107961, "epoch": 1300} {"train_loss": -22.532230377197266, "global_step": 107962, "epoch": 1300} {"train_loss": -22.17667579650879, "global_step": 107963, "epoch": 1300} {"train_loss": -22.240026473999023, "global_step": 107964, "epoch": 1300} {"train_loss": -22.052988052368164, "global_step": 107965, "epoch": 1300} {"train_loss": -22.052932739257812, "global_step": 107966, "epoch": 1300} {"train_loss": -22.14734649658203, "global_step": 107967, "epoch": 1300} {"train_loss": -22.154560089111328, "global_step": 107968, "epoch": 1300} {"train_loss": -21.967390060424805, "global_step": 107969, "epoch": 1300} {"train_loss": -21.885740280151367, "global_step": 107970, "epoch": 1300} {"train_loss": -22.269460678100586, "global_step": 107971, "epoch": 1300} {"train_loss": -22.47489356994629, "global_step": 107972, "epoch": 1300} {"train_loss": -21.988693237304688, "global_step": 107973, "epoch": 1300} {"train_loss": -22.164844512939453, "global_step": 107974, "epoch": 1300} {"train_loss": -22.484392166137695, "global_step": 107975, "epoch": 1300} {"train_loss": -22.47488021850586, "global_step": 107976, "epoch": 1300} {"train_loss": -22.356739044189453, "global_step": 107977, "epoch": 1300} {"train_loss": -22.176664352416992, "global_step": 107978, "epoch": 1300} {"train_loss": -22.477294921875, "global_step": 107979, "epoch": 1300} {"train_loss": -22.075435638427734, "global_step": 107980, "epoch": 1300} {"train_loss": -22.197782516479492, "global_step": 107981, "epoch": 1300} {"train_loss": -22.220372073621636, "global_step": 107982, "epoch": 1300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6119555.5} {"train_loss": -22.071517944335938, "global_step": 107983, "epoch": 1301} {"train_loss": -22.02235221862793, "global_step": 107984, "epoch": 1301} {"train_loss": -22.33125877380371, "global_step": 107985, "epoch": 1301} {"train_loss": -22.093164443969727, "global_step": 107986, "epoch": 1301} {"train_loss": -21.983060836791992, "global_step": 107987, "epoch": 1301} {"train_loss": -22.662290573120117, "global_step": 107988, "epoch": 1301} {"train_loss": -22.0334529876709, "global_step": 107989, "epoch": 1301} {"train_loss": -22.101917266845703, "global_step": 107990, "epoch": 1301} {"train_loss": -22.16985321044922, "global_step": 107991, "epoch": 1301} {"train_loss": -21.94903564453125, "global_step": 107992, "epoch": 1301} {"train_loss": -21.827926635742188, "global_step": 107993, "epoch": 1301} {"train_loss": -22.008955001831055, "global_step": 107994, "epoch": 1301} {"train_loss": -22.276113510131836, "global_step": 107995, "epoch": 1301} {"train_loss": -22.054595947265625, "global_step": 107996, "epoch": 1301} {"train_loss": -22.2894229888916, "global_step": 107997, "epoch": 1301} {"train_loss": -22.21083641052246, "global_step": 107998, "epoch": 1301} {"train_loss": -21.979717254638672, "global_step": 107999, "epoch": 1301} {"train_loss": -21.95013999938965, "global_step": 108000, "epoch": 1301} {"train_loss": -22.45113754272461, "global_step": 108001, "epoch": 1301} {"train_loss": -21.977712631225586, "global_step": 108002, "epoch": 1301} {"train_loss": -21.64668846130371, "global_step": 108003, "epoch": 1301} {"train_loss": -22.184823989868164, "global_step": 108004, "epoch": 1301} {"train_loss": -22.16328239440918, "global_step": 108005, "epoch": 1301} {"train_loss": -22.023420333862305, "global_step": 108006, "epoch": 1301} {"train_loss": -22.137739181518555, "global_step": 108007, "epoch": 1301} {"train_loss": -22.258827209472656, "global_step": 108008, "epoch": 1301} {"train_loss": -22.16266441345215, "global_step": 108009, "epoch": 1301} {"train_loss": -22.176071166992188, "global_step": 108010, "epoch": 1301} {"train_loss": -22.25631332397461, "global_step": 108011, "epoch": 1301} {"train_loss": -21.840734481811523, "global_step": 108012, "epoch": 1301} {"train_loss": -22.106597900390625, "global_step": 108013, "epoch": 1301} {"train_loss": -22.054622650146484, "global_step": 108014, "epoch": 1301} {"train_loss": -22.072147369384766, "global_step": 108015, "epoch": 1301} {"train_loss": -22.319869995117188, "global_step": 108016, "epoch": 1301} {"train_loss": -21.96646499633789, "global_step": 108017, "epoch": 1301} {"train_loss": -22.100528717041016, "global_step": 108018, "epoch": 1301} {"train_loss": -22.325098037719727, "global_step": 108019, "epoch": 1301} {"train_loss": -22.027294158935547, "global_step": 108020, "epoch": 1301} {"train_loss": -22.919830322265625, "global_step": 108021, "epoch": 1301} {"train_loss": -22.381546020507812, "global_step": 108022, "epoch": 1301} {"train_loss": -22.234174728393555, "global_step": 108023, "epoch": 1301} {"train_loss": -22.3187313079834, "global_step": 108024, "epoch": 1301} {"train_loss": -22.255517959594727, "global_step": 108025, "epoch": 1301} {"train_loss": -21.89841651916504, "global_step": 108026, "epoch": 1301} {"train_loss": -22.079143524169922, "global_step": 108027, "epoch": 1301} {"train_loss": -22.19037437438965, "global_step": 108028, "epoch": 1301} {"train_loss": -22.255603790283203, "global_step": 108029, "epoch": 1301} {"train_loss": -22.597232818603516, "global_step": 108030, "epoch": 1301} {"train_loss": -22.46589469909668, "global_step": 108031, "epoch": 1301} {"train_loss": -22.494277954101562, "global_step": 108032, "epoch": 1301} {"train_loss": -21.998823165893555, "global_step": 108033, "epoch": 1301} {"train_loss": -22.264062881469727, "global_step": 108034, "epoch": 1301} {"train_loss": -22.164966583251953, "global_step": 108035, "epoch": 1301} {"train_loss": -22.725414276123047, "global_step": 108036, "epoch": 1301} {"train_loss": -22.116683959960938, "global_step": 108037, "epoch": 1301} {"train_loss": -22.098264694213867, "global_step": 108038, "epoch": 1301} {"train_loss": -22.25404167175293, "global_step": 108039, "epoch": 1301} {"train_loss": -22.2093505859375, "global_step": 108040, "epoch": 1301} {"train_loss": -22.387359619140625, "global_step": 108041, "epoch": 1301} {"train_loss": -22.218896865844727, "global_step": 108042, "epoch": 1301} {"train_loss": -22.0123233795166, "global_step": 108043, "epoch": 1301} {"train_loss": -22.01030158996582, "global_step": 108044, "epoch": 1301} {"train_loss": -22.221641540527344, "global_step": 108045, "epoch": 1301} {"train_loss": -22.429845809936523, "global_step": 108046, "epoch": 1301} {"train_loss": -21.822107315063477, "global_step": 108047, "epoch": 1301} {"train_loss": -22.068710327148438, "global_step": 108048, "epoch": 1301} {"train_loss": -22.112775802612305, "global_step": 108049, "epoch": 1301} {"train_loss": -21.970090866088867, "global_step": 108050, "epoch": 1301} {"train_loss": -22.394248962402344, "global_step": 108051, "epoch": 1301} {"train_loss": -22.050941467285156, "global_step": 108052, "epoch": 1301} {"train_loss": -22.201539993286133, "global_step": 108053, "epoch": 1301} {"train_loss": -22.426862716674805, "global_step": 108054, "epoch": 1301} {"train_loss": -22.19339942932129, "global_step": 108055, "epoch": 1301} {"train_loss": -22.440948486328125, "global_step": 108056, "epoch": 1301} {"train_loss": -22.456541061401367, "global_step": 108057, "epoch": 1301} {"train_loss": -22.09212875366211, "global_step": 108058, "epoch": 1301} {"train_loss": -22.006803512573242, "global_step": 108059, "epoch": 1301} {"train_loss": -22.46833038330078, "global_step": 108060, "epoch": 1301} {"train_loss": -22.370634078979492, "global_step": 108061, "epoch": 1301} {"train_loss": -22.3729305267334, "global_step": 108062, "epoch": 1301} {"train_loss": -22.325626373291016, "global_step": 108063, "epoch": 1301} {"train_loss": -22.126279830932617, "global_step": 108064, "epoch": 1301} {"train_loss": -22.191103349249047, "global_step": 108065, "epoch": 1301, "val_loss": 6165505.5} {"train_loss": -20.491195678710938, "global_step": 108066, "epoch": 1302} {"train_loss": -20.626449584960938, "global_step": 108067, "epoch": 1302} {"train_loss": -21.18433952331543, "global_step": 108068, "epoch": 1302} {"train_loss": -21.26959228515625, "global_step": 108069, "epoch": 1302} {"train_loss": -21.090179443359375, "global_step": 108070, "epoch": 1302} {"train_loss": -21.460599899291992, "global_step": 108071, "epoch": 1302} {"train_loss": -20.94807243347168, "global_step": 108072, "epoch": 1302} {"train_loss": -21.706127166748047, "global_step": 108073, "epoch": 1302} {"train_loss": -21.060529708862305, "global_step": 108074, "epoch": 1302} {"train_loss": -21.915489196777344, "global_step": 108075, "epoch": 1302} {"train_loss": -21.77536392211914, "global_step": 108076, "epoch": 1302} {"train_loss": -21.740009307861328, "global_step": 108077, "epoch": 1302} {"train_loss": -21.594528198242188, "global_step": 108078, "epoch": 1302} {"train_loss": -21.71515464782715, "global_step": 108079, "epoch": 1302} {"train_loss": -21.718381881713867, "global_step": 108080, "epoch": 1302} {"train_loss": -21.604658126831055, "global_step": 108081, "epoch": 1302} {"train_loss": -21.955581665039062, "global_step": 108082, "epoch": 1302} {"train_loss": -21.750751495361328, "global_step": 108083, "epoch": 1302} {"train_loss": -21.88595962524414, "global_step": 108084, "epoch": 1302} {"train_loss": -21.643352508544922, "global_step": 108085, "epoch": 1302} {"train_loss": -21.964582443237305, "global_step": 108086, "epoch": 1302} {"train_loss": -22.029226303100586, "global_step": 108087, "epoch": 1302} {"train_loss": -22.229721069335938, "global_step": 108088, "epoch": 1302} {"train_loss": -21.84872817993164, "global_step": 108089, "epoch": 1302} {"train_loss": -22.18671226501465, "global_step": 108090, "epoch": 1302} {"train_loss": -21.9198055267334, "global_step": 108091, "epoch": 1302} {"train_loss": -21.99820899963379, "global_step": 108092, "epoch": 1302} {"train_loss": -21.681549072265625, "global_step": 108093, "epoch": 1302} {"train_loss": -22.54248046875, "global_step": 108094, "epoch": 1302} {"train_loss": -22.12122917175293, "global_step": 108095, "epoch": 1302} {"train_loss": -21.976760864257812, "global_step": 108096, "epoch": 1302} {"train_loss": -21.750097274780273, "global_step": 108097, "epoch": 1302} {"train_loss": -21.866559982299805, "global_step": 108098, "epoch": 1302} {"train_loss": -22.193429946899414, "global_step": 108099, "epoch": 1302} {"train_loss": -22.06158447265625, "global_step": 108100, "epoch": 1302} {"train_loss": -22.506877899169922, "global_step": 108101, "epoch": 1302} {"train_loss": -22.02898597717285, "global_step": 108102, "epoch": 1302} {"train_loss": -22.02425765991211, "global_step": 108103, "epoch": 1302} {"train_loss": -22.604141235351562, "global_step": 108104, "epoch": 1302} {"train_loss": -22.213483810424805, "global_step": 108105, "epoch": 1302} {"train_loss": -22.722623825073242, "global_step": 108106, "epoch": 1302} {"train_loss": -21.955778121948242, "global_step": 108107, "epoch": 1302} {"train_loss": -22.35662269592285, "global_step": 108108, "epoch": 1302} {"train_loss": -22.099069595336914, "global_step": 108109, "epoch": 1302} {"train_loss": -22.06877326965332, "global_step": 108110, "epoch": 1302} {"train_loss": -21.894027709960938, "global_step": 108111, "epoch": 1302} {"train_loss": -22.478862762451172, "global_step": 108112, "epoch": 1302} {"train_loss": -22.41004753112793, "global_step": 108113, "epoch": 1302} {"train_loss": -22.250385284423828, "global_step": 108114, "epoch": 1302} {"train_loss": -22.228042602539062, "global_step": 108115, "epoch": 1302} {"train_loss": -22.329076766967773, "global_step": 108116, "epoch": 1302} {"train_loss": -22.304080963134766, "global_step": 108117, "epoch": 1302} {"train_loss": -22.307313919067383, "global_step": 108118, "epoch": 1302} {"train_loss": -22.28973960876465, "global_step": 108119, "epoch": 1302} {"train_loss": -21.833683013916016, "global_step": 108120, "epoch": 1302} {"train_loss": -22.5253963470459, "global_step": 108121, "epoch": 1302} {"train_loss": -21.672380447387695, "global_step": 108122, "epoch": 1302} {"train_loss": -22.291318893432617, "global_step": 108123, "epoch": 1302} {"train_loss": -22.418004989624023, "global_step": 108124, "epoch": 1302} {"train_loss": -22.43173599243164, "global_step": 108125, "epoch": 1302} {"train_loss": -22.32425880432129, "global_step": 108126, "epoch": 1302} {"train_loss": -22.21187400817871, "global_step": 108127, "epoch": 1302} {"train_loss": -22.037378311157227, "global_step": 108128, "epoch": 1302} {"train_loss": -22.585063934326172, "global_step": 108129, "epoch": 1302} {"train_loss": -22.36318016052246, "global_step": 108130, "epoch": 1302} {"train_loss": -21.993106842041016, "global_step": 108131, "epoch": 1302} {"train_loss": -22.149627685546875, "global_step": 108132, "epoch": 1302} {"train_loss": -22.140195846557617, "global_step": 108133, "epoch": 1302} {"train_loss": -22.373640060424805, "global_step": 108134, "epoch": 1302} {"train_loss": -22.405445098876953, "global_step": 108135, "epoch": 1302} {"train_loss": -22.420085906982422, "global_step": 108136, "epoch": 1302} {"train_loss": -21.937240600585938, "global_step": 108137, "epoch": 1302} {"train_loss": -22.20911979675293, "global_step": 108138, "epoch": 1302} {"train_loss": -22.060333251953125, "global_step": 108139, "epoch": 1302} {"train_loss": -22.73538589477539, "global_step": 108140, "epoch": 1302} {"train_loss": -22.58877944946289, "global_step": 108141, "epoch": 1302} {"train_loss": -21.99260902404785, "global_step": 108142, "epoch": 1302} {"train_loss": -22.1749324798584, "global_step": 108143, "epoch": 1302} {"train_loss": -22.23653793334961, "global_step": 108144, "epoch": 1302} {"train_loss": -22.136539459228516, "global_step": 108145, "epoch": 1302} {"train_loss": -22.43184471130371, "global_step": 108146, "epoch": 1302} {"train_loss": -22.428579330444336, "global_step": 108147, "epoch": 1302} {"train_loss": -22.019847869873047, "global_step": 108148, "epoch": 1302, "val_loss": 6179233.0} {"train_loss": -19.811147689819336, "global_step": 108149, "epoch": 1303} {"train_loss": -21.267349243164062, "global_step": 108150, "epoch": 1303} {"train_loss": -21.303842544555664, "global_step": 108151, "epoch": 1303} {"train_loss": -21.437257766723633, "global_step": 108152, "epoch": 1303} {"train_loss": -21.331937789916992, "global_step": 108153, "epoch": 1303} {"train_loss": -21.454755783081055, "global_step": 108154, "epoch": 1303} {"train_loss": -21.389446258544922, "global_step": 108155, "epoch": 1303} {"train_loss": -21.351350784301758, "global_step": 108156, "epoch": 1303} {"train_loss": -21.734394073486328, "global_step": 108157, "epoch": 1303} {"train_loss": -21.13679313659668, "global_step": 108158, "epoch": 1303} {"train_loss": -21.982860565185547, "global_step": 108159, "epoch": 1303} {"train_loss": -21.6717586517334, "global_step": 108160, "epoch": 1303} {"train_loss": -21.829004287719727, "global_step": 108161, "epoch": 1303} {"train_loss": -21.597217559814453, "global_step": 108162, "epoch": 1303} {"train_loss": -21.682626724243164, "global_step": 108163, "epoch": 1303} {"train_loss": -21.686405181884766, "global_step": 108164, "epoch": 1303} {"train_loss": -22.06102752685547, "global_step": 108165, "epoch": 1303} {"train_loss": -21.60013771057129, "global_step": 108166, "epoch": 1303} {"train_loss": -21.551464080810547, "global_step": 108167, "epoch": 1303} {"train_loss": -21.6134090423584, "global_step": 108168, "epoch": 1303} {"train_loss": -21.914274215698242, "global_step": 108169, "epoch": 1303} {"train_loss": -22.363039016723633, "global_step": 108170, "epoch": 1303} {"train_loss": -21.814329147338867, "global_step": 108171, "epoch": 1303} {"train_loss": -22.1885929107666, "global_step": 108172, "epoch": 1303} {"train_loss": -22.18729591369629, "global_step": 108173, "epoch": 1303} {"train_loss": -21.70368194580078, "global_step": 108174, "epoch": 1303} {"train_loss": -21.94268798828125, "global_step": 108175, "epoch": 1303} {"train_loss": -22.004520416259766, "global_step": 108176, "epoch": 1303} {"train_loss": -21.86285400390625, "global_step": 108177, "epoch": 1303} {"train_loss": -22.230499267578125, "global_step": 108178, "epoch": 1303} {"train_loss": -22.406850814819336, "global_step": 108179, "epoch": 1303} {"train_loss": -22.188446044921875, "global_step": 108180, "epoch": 1303} {"train_loss": -21.862165451049805, "global_step": 108181, "epoch": 1303} {"train_loss": -22.588048934936523, "global_step": 108182, "epoch": 1303} {"train_loss": -22.173538208007812, "global_step": 108183, "epoch": 1303} {"train_loss": -22.4935302734375, "global_step": 108184, "epoch": 1303} {"train_loss": -21.896739959716797, "global_step": 108185, "epoch": 1303} {"train_loss": -22.1152286529541, "global_step": 108186, "epoch": 1303} {"train_loss": -22.37477684020996, "global_step": 108187, "epoch": 1303} {"train_loss": -22.250831604003906, "global_step": 108188, "epoch": 1303} {"train_loss": -22.009387969970703, "global_step": 108189, "epoch": 1303} {"train_loss": -21.8714542388916, "global_step": 108190, "epoch": 1303} {"train_loss": -21.969728469848633, "global_step": 108191, "epoch": 1303} {"train_loss": -22.117963790893555, "global_step": 108192, "epoch": 1303} {"train_loss": -22.15512466430664, "global_step": 108193, "epoch": 1303} {"train_loss": -21.973066329956055, "global_step": 108194, "epoch": 1303} {"train_loss": -22.304962158203125, "global_step": 108195, "epoch": 1303} {"train_loss": -22.216867446899414, "global_step": 108196, "epoch": 1303} {"train_loss": -22.202476501464844, "global_step": 108197, "epoch": 1303} {"train_loss": -22.177541732788086, "global_step": 108198, "epoch": 1303} {"train_loss": -22.235849380493164, "global_step": 108199, "epoch": 1303} {"train_loss": -22.105295181274414, "global_step": 108200, "epoch": 1303} {"train_loss": -21.92274284362793, "global_step": 108201, "epoch": 1303} {"train_loss": -22.13521385192871, "global_step": 108202, "epoch": 1303} {"train_loss": -22.145160675048828, "global_step": 108203, "epoch": 1303} {"train_loss": -22.186767578125, "global_step": 108204, "epoch": 1303} {"train_loss": -22.292036056518555, "global_step": 108205, "epoch": 1303} {"train_loss": -22.293725967407227, "global_step": 108206, "epoch": 1303} {"train_loss": -22.077926635742188, "global_step": 108207, "epoch": 1303} {"train_loss": -22.361257553100586, "global_step": 108208, "epoch": 1303} {"train_loss": -22.137893676757812, "global_step": 108209, "epoch": 1303} {"train_loss": -22.21014404296875, "global_step": 108210, "epoch": 1303} {"train_loss": -22.353099822998047, "global_step": 108211, "epoch": 1303} {"train_loss": -22.33954429626465, "global_step": 108212, "epoch": 1303} {"train_loss": -22.20961570739746, "global_step": 108213, "epoch": 1303} {"train_loss": -22.35323715209961, "global_step": 108214, "epoch": 1303} {"train_loss": -21.965417861938477, "global_step": 108215, "epoch": 1303} {"train_loss": -21.88275146484375, "global_step": 108216, "epoch": 1303} {"train_loss": -22.044715881347656, "global_step": 108217, "epoch": 1303} {"train_loss": -22.333702087402344, "global_step": 108218, "epoch": 1303} {"train_loss": -22.082473754882812, "global_step": 108219, "epoch": 1303} {"train_loss": -21.884231567382812, "global_step": 108220, "epoch": 1303} {"train_loss": -22.23036003112793, "global_step": 108221, "epoch": 1303} {"train_loss": -22.461576461791992, "global_step": 108222, "epoch": 1303} {"train_loss": -22.259632110595703, "global_step": 108223, "epoch": 1303} {"train_loss": -22.18313980102539, "global_step": 108224, "epoch": 1303} {"train_loss": -22.20752716064453, "global_step": 108225, "epoch": 1303} {"train_loss": -22.326139450073242, "global_step": 108226, "epoch": 1303} {"train_loss": -22.100645065307617, "global_step": 108227, "epoch": 1303} {"train_loss": -22.231290817260742, "global_step": 108228, "epoch": 1303} {"train_loss": -22.25244140625, "global_step": 108229, "epoch": 1303} {"train_loss": -22.021963119506836, "global_step": 108230, "epoch": 1303} {"train_loss": -22.014148781098516, "global_step": 108231, "epoch": 1303, "val_loss": 6194854.0} {"train_loss": -21.412263870239258, "global_step": 108232, "epoch": 1304} {"train_loss": -22.24243927001953, "global_step": 108233, "epoch": 1304} {"train_loss": -21.34473419189453, "global_step": 108234, "epoch": 1304} {"train_loss": -21.523256301879883, "global_step": 108235, "epoch": 1304} {"train_loss": -21.836261749267578, "global_step": 108236, "epoch": 1304} {"train_loss": -21.885318756103516, "global_step": 108237, "epoch": 1304} {"train_loss": -22.083925247192383, "global_step": 108238, "epoch": 1304} {"train_loss": -21.73915672302246, "global_step": 108239, "epoch": 1304} {"train_loss": -21.6898136138916, "global_step": 108240, "epoch": 1304} {"train_loss": -22.089214324951172, "global_step": 108241, "epoch": 1304} {"train_loss": -21.9823055267334, "global_step": 108242, "epoch": 1304} {"train_loss": -21.922109603881836, "global_step": 108243, "epoch": 1304} {"train_loss": -22.226716995239258, "global_step": 108244, "epoch": 1304} {"train_loss": -21.830425262451172, "global_step": 108245, "epoch": 1304} {"train_loss": -22.179452896118164, "global_step": 108246, "epoch": 1304} {"train_loss": -21.878742218017578, "global_step": 108247, "epoch": 1304} {"train_loss": -22.04066276550293, "global_step": 108248, "epoch": 1304} {"train_loss": -22.058462142944336, "global_step": 108249, "epoch": 1304} {"train_loss": -22.099943161010742, "global_step": 108250, "epoch": 1304} {"train_loss": -22.018354415893555, "global_step": 108251, "epoch": 1304} {"train_loss": -22.37183952331543, "global_step": 108252, "epoch": 1304} {"train_loss": -21.612098693847656, "global_step": 108253, "epoch": 1304} {"train_loss": -22.19087791442871, "global_step": 108254, "epoch": 1304} {"train_loss": -22.143537521362305, "global_step": 108255, "epoch": 1304} {"train_loss": -21.81198501586914, "global_step": 108256, "epoch": 1304} {"train_loss": -22.157285690307617, "global_step": 108257, "epoch": 1304} {"train_loss": -22.16374969482422, "global_step": 108258, "epoch": 1304} {"train_loss": -22.524930953979492, "global_step": 108259, "epoch": 1304} {"train_loss": -22.395498275756836, "global_step": 108260, "epoch": 1304} {"train_loss": -22.388904571533203, "global_step": 108261, "epoch": 1304} {"train_loss": -21.915573120117188, "global_step": 108262, "epoch": 1304} {"train_loss": -21.89619255065918, "global_step": 108263, "epoch": 1304} {"train_loss": -22.366132736206055, "global_step": 108264, "epoch": 1304} {"train_loss": -22.220661163330078, "global_step": 108265, "epoch": 1304} {"train_loss": -22.339740753173828, "global_step": 108266, "epoch": 1304} {"train_loss": -21.968992233276367, "global_step": 108267, "epoch": 1304} {"train_loss": -21.972110748291016, "global_step": 108268, "epoch": 1304} {"train_loss": -22.034931182861328, "global_step": 108269, "epoch": 1304} {"train_loss": -22.446928024291992, "global_step": 108270, "epoch": 1304} {"train_loss": -22.31941032409668, "global_step": 108271, "epoch": 1304} {"train_loss": -22.30495262145996, "global_step": 108272, "epoch": 1304} {"train_loss": -22.2242431640625, "global_step": 108273, "epoch": 1304} {"train_loss": -22.312034606933594, "global_step": 108274, "epoch": 1304} {"train_loss": -22.036428451538086, "global_step": 108275, "epoch": 1304} {"train_loss": -22.1894474029541, "global_step": 108276, "epoch": 1304} {"train_loss": -21.94775390625, "global_step": 108277, "epoch": 1304} {"train_loss": -22.408987045288086, "global_step": 108278, "epoch": 1304} {"train_loss": -22.21744728088379, "global_step": 108279, "epoch": 1304} {"train_loss": -22.006242752075195, "global_step": 108280, "epoch": 1304} {"train_loss": -22.10883140563965, "global_step": 108281, "epoch": 1304} {"train_loss": -22.28891372680664, "global_step": 108282, "epoch": 1304} {"train_loss": -22.059616088867188, "global_step": 108283, "epoch": 1304} {"train_loss": -22.330801010131836, "global_step": 108284, "epoch": 1304} {"train_loss": -22.146831512451172, "global_step": 108285, "epoch": 1304} {"train_loss": -22.211050033569336, "global_step": 108286, "epoch": 1304} {"train_loss": -21.9962215423584, "global_step": 108287, "epoch": 1304} {"train_loss": -22.137521743774414, "global_step": 108288, "epoch": 1304} {"train_loss": -22.314250946044922, "global_step": 108289, "epoch": 1304} {"train_loss": -22.236923217773438, "global_step": 108290, "epoch": 1304} {"train_loss": -22.1535701751709, "global_step": 108291, "epoch": 1304} {"train_loss": -22.29997444152832, "global_step": 108292, "epoch": 1304} {"train_loss": -22.391355514526367, "global_step": 108293, "epoch": 1304} {"train_loss": -22.55571174621582, "global_step": 108294, "epoch": 1304} {"train_loss": -22.353666305541992, "global_step": 108295, "epoch": 1304} {"train_loss": -22.356271743774414, "global_step": 108296, "epoch": 1304} {"train_loss": -22.121164321899414, "global_step": 108297, "epoch": 1304} {"train_loss": -22.58534049987793, "global_step": 108298, "epoch": 1304} {"train_loss": -22.305681228637695, "global_step": 108299, "epoch": 1304} {"train_loss": -22.276473999023438, "global_step": 108300, "epoch": 1304} {"train_loss": -22.426849365234375, "global_step": 108301, "epoch": 1304} {"train_loss": -22.14949607849121, "global_step": 108302, "epoch": 1304} {"train_loss": -22.10121726989746, "global_step": 108303, "epoch": 1304} {"train_loss": -22.068866729736328, "global_step": 108304, "epoch": 1304} {"train_loss": -22.123037338256836, "global_step": 108305, "epoch": 1304} {"train_loss": -21.807193756103516, "global_step": 108306, "epoch": 1304} {"train_loss": -22.144763946533203, "global_step": 108307, "epoch": 1304} {"train_loss": -22.351167678833008, "global_step": 108308, "epoch": 1304} {"train_loss": -22.185876846313477, "global_step": 108309, "epoch": 1304} {"train_loss": -22.325531005859375, "global_step": 108310, "epoch": 1304} {"train_loss": -22.39570426940918, "global_step": 108311, "epoch": 1304} {"train_loss": -22.09868812561035, "global_step": 108312, "epoch": 1304} {"train_loss": -21.86665916442871, "global_step": 108313, "epoch": 1304} {"train_loss": -22.11707145047475, "global_step": 108314, "epoch": 1304, "val_loss": 6138629.0} {"train_loss": -21.165555953979492, "global_step": 108315, "epoch": 1305} {"train_loss": -21.77659797668457, "global_step": 108316, "epoch": 1305} {"train_loss": -21.300098419189453, "global_step": 108317, "epoch": 1305} {"train_loss": -21.95974349975586, "global_step": 108318, "epoch": 1305} {"train_loss": -21.35995864868164, "global_step": 108319, "epoch": 1305} {"train_loss": -21.839807510375977, "global_step": 108320, "epoch": 1305} {"train_loss": -21.875524520874023, "global_step": 108321, "epoch": 1305} {"train_loss": -21.825769424438477, "global_step": 108322, "epoch": 1305} {"train_loss": -21.827865600585938, "global_step": 108323, "epoch": 1305} {"train_loss": -21.691831588745117, "global_step": 108324, "epoch": 1305} {"train_loss": -21.571165084838867, "global_step": 108325, "epoch": 1305} {"train_loss": -22.041601181030273, "global_step": 108326, "epoch": 1305} {"train_loss": -22.06954002380371, "global_step": 108327, "epoch": 1305} {"train_loss": -22.09539222717285, "global_step": 108328, "epoch": 1305} {"train_loss": -21.883506774902344, "global_step": 108329, "epoch": 1305} {"train_loss": -22.16941261291504, "global_step": 108330, "epoch": 1305} {"train_loss": -21.908109664916992, "global_step": 108331, "epoch": 1305} {"train_loss": -21.75360107421875, "global_step": 108332, "epoch": 1305} {"train_loss": -22.099672317504883, "global_step": 108333, "epoch": 1305} {"train_loss": -22.00233268737793, "global_step": 108334, "epoch": 1305} {"train_loss": -21.892080307006836, "global_step": 108335, "epoch": 1305} {"train_loss": -22.346744537353516, "global_step": 108336, "epoch": 1305} {"train_loss": -22.252519607543945, "global_step": 108337, "epoch": 1305} {"train_loss": -22.133955001831055, "global_step": 108338, "epoch": 1305} {"train_loss": -22.17522621154785, "global_step": 108339, "epoch": 1305} {"train_loss": -22.035959243774414, "global_step": 108340, "epoch": 1305} {"train_loss": -22.070655822753906, "global_step": 108341, "epoch": 1305} {"train_loss": -22.0771427154541, "global_step": 108342, "epoch": 1305} {"train_loss": -22.296924591064453, "global_step": 108343, "epoch": 1305} {"train_loss": -22.442235946655273, "global_step": 108344, "epoch": 1305} {"train_loss": -22.24991798400879, "global_step": 108345, "epoch": 1305} {"train_loss": -21.982145309448242, "global_step": 108346, "epoch": 1305} {"train_loss": -22.118284225463867, "global_step": 108347, "epoch": 1305} {"train_loss": -22.3295955657959, "global_step": 108348, "epoch": 1305} {"train_loss": -21.925378799438477, "global_step": 108349, "epoch": 1305} {"train_loss": -22.42366600036621, "global_step": 108350, "epoch": 1305} {"train_loss": -22.366106033325195, "global_step": 108351, "epoch": 1305} {"train_loss": -21.68751335144043, "global_step": 108352, "epoch": 1305} {"train_loss": -22.03493881225586, "global_step": 108353, "epoch": 1305} {"train_loss": -22.389827728271484, "global_step": 108354, "epoch": 1305} {"train_loss": -22.307443618774414, "global_step": 108355, "epoch": 1305} {"train_loss": -22.424026489257812, "global_step": 108356, "epoch": 1305} {"train_loss": -22.110885620117188, "global_step": 108357, "epoch": 1305} {"train_loss": -22.272048950195312, "global_step": 108358, "epoch": 1305} {"train_loss": -22.184711456298828, "global_step": 108359, "epoch": 1305} {"train_loss": -21.953962326049805, "global_step": 108360, "epoch": 1305} {"train_loss": -21.9516658782959, "global_step": 108361, "epoch": 1305} {"train_loss": -21.98558235168457, "global_step": 108362, "epoch": 1305} {"train_loss": -22.19095802307129, "global_step": 108363, "epoch": 1305} {"train_loss": -22.332176208496094, "global_step": 108364, "epoch": 1305} {"train_loss": -21.882482528686523, "global_step": 108365, "epoch": 1305} {"train_loss": -22.266586303710938, "global_step": 108366, "epoch": 1305} {"train_loss": -22.444616317749023, "global_step": 108367, "epoch": 1305} {"train_loss": -22.246694564819336, "global_step": 108368, "epoch": 1305} {"train_loss": -21.995349884033203, "global_step": 108369, "epoch": 1305} {"train_loss": -22.355512619018555, "global_step": 108370, "epoch": 1305} {"train_loss": -22.111364364624023, "global_step": 108371, "epoch": 1305} {"train_loss": -21.7513427734375, "global_step": 108372, "epoch": 1305} {"train_loss": -22.268735885620117, "global_step": 108373, "epoch": 1305} {"train_loss": -22.533084869384766, "global_step": 108374, "epoch": 1305} {"train_loss": -21.931041717529297, "global_step": 108375, "epoch": 1305} {"train_loss": -22.26349449157715, "global_step": 108376, "epoch": 1305} {"train_loss": -22.571304321289062, "global_step": 108377, "epoch": 1305} {"train_loss": -21.940092086791992, "global_step": 108378, "epoch": 1305} {"train_loss": -21.908187866210938, "global_step": 108379, "epoch": 1305} {"train_loss": -22.443344116210938, "global_step": 108380, "epoch": 1305} {"train_loss": -21.833972930908203, "global_step": 108381, "epoch": 1305} {"train_loss": -22.352596282958984, "global_step": 108382, "epoch": 1305} {"train_loss": -22.025251388549805, "global_step": 108383, "epoch": 1305} {"train_loss": -22.179975509643555, "global_step": 108384, "epoch": 1305} {"train_loss": -22.73127555847168, "global_step": 108385, "epoch": 1305} {"train_loss": -22.118762969970703, "global_step": 108386, "epoch": 1305} {"train_loss": -22.364564895629883, "global_step": 108387, "epoch": 1305} {"train_loss": -22.009122848510742, "global_step": 108388, "epoch": 1305} {"train_loss": -22.116933822631836, "global_step": 108389, "epoch": 1305} {"train_loss": -22.386512756347656, "global_step": 108390, "epoch": 1305} {"train_loss": -22.251800537109375, "global_step": 108391, "epoch": 1305} {"train_loss": -22.26422691345215, "global_step": 108392, "epoch": 1305} {"train_loss": -22.391443252563477, "global_step": 108393, "epoch": 1305} {"train_loss": -22.289405822753906, "global_step": 108394, "epoch": 1305} {"train_loss": -22.199247360229492, "global_step": 108395, "epoch": 1305} {"train_loss": -22.034475326538086, "global_step": 108396, "epoch": 1305} {"train_loss": -22.11683280209461, "global_step": 108397, "epoch": 1305, "val_loss": 6067269.0} {"train_loss": -21.686216354370117, "global_step": 108398, "epoch": 1306} {"train_loss": -20.262401580810547, "global_step": 108399, "epoch": 1306} {"train_loss": -21.471542358398438, "global_step": 108400, "epoch": 1306} {"train_loss": -21.088693618774414, "global_step": 108401, "epoch": 1306} {"train_loss": -21.670791625976562, "global_step": 108402, "epoch": 1306} {"train_loss": -21.214380264282227, "global_step": 108403, "epoch": 1306} {"train_loss": -21.585411071777344, "global_step": 108404, "epoch": 1306} {"train_loss": -21.35247802734375, "global_step": 108405, "epoch": 1306} {"train_loss": -21.7992000579834, "global_step": 108406, "epoch": 1306} {"train_loss": -21.737890243530273, "global_step": 108407, "epoch": 1306} {"train_loss": -21.924299240112305, "global_step": 108408, "epoch": 1306} {"train_loss": -21.498144149780273, "global_step": 108409, "epoch": 1306} {"train_loss": -21.843320846557617, "global_step": 108410, "epoch": 1306} {"train_loss": -22.010583877563477, "global_step": 108411, "epoch": 1306} {"train_loss": -21.643495559692383, "global_step": 108412, "epoch": 1306} {"train_loss": -22.08219337463379, "global_step": 108413, "epoch": 1306} {"train_loss": -21.529613494873047, "global_step": 108414, "epoch": 1306} {"train_loss": -21.8378963470459, "global_step": 108415, "epoch": 1306} {"train_loss": -21.957616806030273, "global_step": 108416, "epoch": 1306} {"train_loss": -21.540910720825195, "global_step": 108417, "epoch": 1306} {"train_loss": -22.235509872436523, "global_step": 108418, "epoch": 1306} {"train_loss": -21.663400650024414, "global_step": 108419, "epoch": 1306} {"train_loss": -22.059932708740234, "global_step": 108420, "epoch": 1306} {"train_loss": -21.987979888916016, "global_step": 108421, "epoch": 1306} {"train_loss": -22.485624313354492, "global_step": 108422, "epoch": 1306} {"train_loss": -22.217926025390625, "global_step": 108423, "epoch": 1306} {"train_loss": -22.129770278930664, "global_step": 108424, "epoch": 1306} {"train_loss": -22.092777252197266, "global_step": 108425, "epoch": 1306} {"train_loss": -22.02327537536621, "global_step": 108426, "epoch": 1306} {"train_loss": -22.334653854370117, "global_step": 108427, "epoch": 1306} {"train_loss": -22.17140007019043, "global_step": 108428, "epoch": 1306} {"train_loss": -22.361501693725586, "global_step": 108429, "epoch": 1306} {"train_loss": -22.15462303161621, "global_step": 108430, "epoch": 1306} {"train_loss": -21.810333251953125, "global_step": 108431, "epoch": 1306} {"train_loss": -22.046131134033203, "global_step": 108432, "epoch": 1306} {"train_loss": -22.2910099029541, "global_step": 108433, "epoch": 1306} {"train_loss": -22.03668785095215, "global_step": 108434, "epoch": 1306} {"train_loss": -22.17554473876953, "global_step": 108435, "epoch": 1306} {"train_loss": -22.518266677856445, "global_step": 108436, "epoch": 1306} {"train_loss": -22.09059715270996, "global_step": 108437, "epoch": 1306} {"train_loss": -22.31215476989746, "global_step": 108438, "epoch": 1306} {"train_loss": -22.083984375, "global_step": 108439, "epoch": 1306} {"train_loss": -22.42561912536621, "global_step": 108440, "epoch": 1306} {"train_loss": -22.487377166748047, "global_step": 108441, "epoch": 1306} {"train_loss": -21.95499038696289, "global_step": 108442, "epoch": 1306} {"train_loss": -22.3966064453125, "global_step": 108443, "epoch": 1306} {"train_loss": -22.167524337768555, "global_step": 108444, "epoch": 1306} {"train_loss": -22.337970733642578, "global_step": 108445, "epoch": 1306} {"train_loss": -21.8089656829834, "global_step": 108446, "epoch": 1306} {"train_loss": -22.276273727416992, "global_step": 108447, "epoch": 1306} {"train_loss": -22.008127212524414, "global_step": 108448, "epoch": 1306} {"train_loss": -22.1899471282959, "global_step": 108449, "epoch": 1306} {"train_loss": -22.444934844970703, "global_step": 108450, "epoch": 1306} {"train_loss": -22.319272994995117, "global_step": 108451, "epoch": 1306} {"train_loss": -22.34462547302246, "global_step": 108452, "epoch": 1306} {"train_loss": -21.98932456970215, "global_step": 108453, "epoch": 1306} {"train_loss": -21.814151763916016, "global_step": 108454, "epoch": 1306} {"train_loss": -22.9614200592041, "global_step": 108455, "epoch": 1306} {"train_loss": -22.364971160888672, "global_step": 108456, "epoch": 1306} {"train_loss": -22.44065284729004, "global_step": 108457, "epoch": 1306} {"train_loss": -22.44151496887207, "global_step": 108458, "epoch": 1306} {"train_loss": -22.466459274291992, "global_step": 108459, "epoch": 1306} {"train_loss": -22.264251708984375, "global_step": 108460, "epoch": 1306} {"train_loss": -22.04024314880371, "global_step": 108461, "epoch": 1306} {"train_loss": -22.16610336303711, "global_step": 108462, "epoch": 1306} {"train_loss": -22.2065372467041, "global_step": 108463, "epoch": 1306} {"train_loss": -22.36368751525879, "global_step": 108464, "epoch": 1306} {"train_loss": -22.140674591064453, "global_step": 108465, "epoch": 1306} {"train_loss": -22.05689239501953, "global_step": 108466, "epoch": 1306} {"train_loss": -22.100696563720703, "global_step": 108467, "epoch": 1306} {"train_loss": -22.4011287689209, "global_step": 108468, "epoch": 1306} {"train_loss": -22.350067138671875, "global_step": 108469, "epoch": 1306} {"train_loss": -22.27359962463379, "global_step": 108470, "epoch": 1306} {"train_loss": -22.680824279785156, "global_step": 108471, "epoch": 1306} {"train_loss": -22.017845153808594, "global_step": 108472, "epoch": 1306} {"train_loss": -22.13929557800293, "global_step": 108473, "epoch": 1306} {"train_loss": -22.083066940307617, "global_step": 108474, "epoch": 1306} {"train_loss": -22.206809997558594, "global_step": 108475, "epoch": 1306} {"train_loss": -22.143600463867188, "global_step": 108476, "epoch": 1306} {"train_loss": -22.07659912109375, "global_step": 108477, "epoch": 1306} {"train_loss": -21.832571029663086, "global_step": 108478, "epoch": 1306} {"train_loss": -22.341955184936523, "global_step": 108479, "epoch": 1306} {"train_loss": -22.069673745028943, "global_step": 108480, "epoch": 1306, "val_loss": 6230555.5} {"train_loss": -21.770854949951172, "global_step": 108481, "epoch": 1307} {"train_loss": -21.388019561767578, "global_step": 108482, "epoch": 1307} {"train_loss": -21.3571834564209, "global_step": 108483, "epoch": 1307} {"train_loss": -21.72525405883789, "global_step": 108484, "epoch": 1307} {"train_loss": -21.663373947143555, "global_step": 108485, "epoch": 1307} {"train_loss": -22.233091354370117, "global_step": 108486, "epoch": 1307} {"train_loss": -21.70030975341797, "global_step": 108487, "epoch": 1307} {"train_loss": -21.66988754272461, "global_step": 108488, "epoch": 1307} {"train_loss": -22.01383399963379, "global_step": 108489, "epoch": 1307} {"train_loss": -21.757572174072266, "global_step": 108490, "epoch": 1307} {"train_loss": -21.956144332885742, "global_step": 108491, "epoch": 1307} {"train_loss": -21.93404769897461, "global_step": 108492, "epoch": 1307} {"train_loss": -21.698627471923828, "global_step": 108493, "epoch": 1307} {"train_loss": -22.1041202545166, "global_step": 108494, "epoch": 1307} {"train_loss": -21.85004997253418, "global_step": 108495, "epoch": 1307} {"train_loss": -21.657222747802734, "global_step": 108496, "epoch": 1307} {"train_loss": -22.037586212158203, "global_step": 108497, "epoch": 1307} {"train_loss": -22.1125545501709, "global_step": 108498, "epoch": 1307} {"train_loss": -22.465038299560547, "global_step": 108499, "epoch": 1307} {"train_loss": -22.058399200439453, "global_step": 108500, "epoch": 1307} {"train_loss": -21.844572067260742, "global_step": 108501, "epoch": 1307} {"train_loss": -22.01407814025879, "global_step": 108502, "epoch": 1307} {"train_loss": -22.223709106445312, "global_step": 108503, "epoch": 1307} {"train_loss": -22.31045913696289, "global_step": 108504, "epoch": 1307} {"train_loss": -22.42055320739746, "global_step": 108505, "epoch": 1307} {"train_loss": -22.409605026245117, "global_step": 108506, "epoch": 1307} {"train_loss": -22.182228088378906, "global_step": 108507, "epoch": 1307} {"train_loss": -22.357908248901367, "global_step": 108508, "epoch": 1307} {"train_loss": -22.38844871520996, "global_step": 108509, "epoch": 1307} {"train_loss": -22.2215518951416, "global_step": 108510, "epoch": 1307} {"train_loss": -22.469213485717773, "global_step": 108511, "epoch": 1307} {"train_loss": -22.20001220703125, "global_step": 108512, "epoch": 1307} {"train_loss": -22.307138442993164, "global_step": 108513, "epoch": 1307} {"train_loss": -22.39053726196289, "global_step": 108514, "epoch": 1307} {"train_loss": -22.066560745239258, "global_step": 108515, "epoch": 1307} {"train_loss": -21.934968948364258, "global_step": 108516, "epoch": 1307} {"train_loss": -22.353055953979492, "global_step": 108517, "epoch": 1307} {"train_loss": -22.311809539794922, "global_step": 108518, "epoch": 1307} {"train_loss": -22.12222671508789, "global_step": 108519, "epoch": 1307} {"train_loss": -22.19571876525879, "global_step": 108520, "epoch": 1307} {"train_loss": -22.388229370117188, "global_step": 108521, "epoch": 1307} {"train_loss": -22.4084529876709, "global_step": 108522, "epoch": 1307} {"train_loss": -21.90618896484375, "global_step": 108523, "epoch": 1307} {"train_loss": -21.983936309814453, "global_step": 108524, "epoch": 1307} {"train_loss": -22.189844131469727, "global_step": 108525, "epoch": 1307} {"train_loss": -22.349000930786133, "global_step": 108526, "epoch": 1307} {"train_loss": -22.198514938354492, "global_step": 108527, "epoch": 1307} {"train_loss": -22.777463912963867, "global_step": 108528, "epoch": 1307} {"train_loss": -22.491636276245117, "global_step": 108529, "epoch": 1307} {"train_loss": -22.31524085998535, "global_step": 108530, "epoch": 1307} {"train_loss": -22.145959854125977, "global_step": 108531, "epoch": 1307} {"train_loss": -22.356521606445312, "global_step": 108532, "epoch": 1307} {"train_loss": -22.380176544189453, "global_step": 108533, "epoch": 1307} {"train_loss": -22.4769344329834, "global_step": 108534, "epoch": 1307} {"train_loss": -22.53156852722168, "global_step": 108535, "epoch": 1307} {"train_loss": -22.261070251464844, "global_step": 108536, "epoch": 1307} {"train_loss": -22.40350914001465, "global_step": 108537, "epoch": 1307} {"train_loss": -22.540603637695312, "global_step": 108538, "epoch": 1307} {"train_loss": -22.284616470336914, "global_step": 108539, "epoch": 1307} {"train_loss": -22.224836349487305, "global_step": 108540, "epoch": 1307} {"train_loss": -21.954639434814453, "global_step": 108541, "epoch": 1307} {"train_loss": -22.060382843017578, "global_step": 108542, "epoch": 1307} {"train_loss": -22.585952758789062, "global_step": 108543, "epoch": 1307} {"train_loss": -22.435285568237305, "global_step": 108544, "epoch": 1307} {"train_loss": -21.919279098510742, "global_step": 108545, "epoch": 1307} {"train_loss": -22.381120681762695, "global_step": 108546, "epoch": 1307} {"train_loss": -22.578678131103516, "global_step": 108547, "epoch": 1307} {"train_loss": -22.055097579956055, "global_step": 108548, "epoch": 1307} {"train_loss": -22.466684341430664, "global_step": 108549, "epoch": 1307} {"train_loss": -22.464954376220703, "global_step": 108550, "epoch": 1307} {"train_loss": -22.091182708740234, "global_step": 108551, "epoch": 1307} {"train_loss": -22.35422134399414, "global_step": 108552, "epoch": 1307} {"train_loss": -22.171735763549805, "global_step": 108553, "epoch": 1307} {"train_loss": -22.08150291442871, "global_step": 108554, "epoch": 1307} {"train_loss": -21.89696502685547, "global_step": 108555, "epoch": 1307} {"train_loss": -22.121782302856445, "global_step": 108556, "epoch": 1307} {"train_loss": -22.479581832885742, "global_step": 108557, "epoch": 1307} {"train_loss": -22.283573150634766, "global_step": 108558, "epoch": 1307} {"train_loss": -22.112035751342773, "global_step": 108559, "epoch": 1307} {"train_loss": -22.07392692565918, "global_step": 108560, "epoch": 1307} {"train_loss": -22.026838302612305, "global_step": 108561, "epoch": 1307} {"train_loss": -22.292980194091797, "global_step": 108562, "epoch": 1307} {"train_loss": -22.1572334335511, "global_step": 108563, "epoch": 1307, "val_loss": 6207654.0} {"train_loss": -21.72954750061035, "global_step": 108564, "epoch": 1308} {"train_loss": -21.725364685058594, "global_step": 108565, "epoch": 1308} {"train_loss": -22.053625106811523, "global_step": 108566, "epoch": 1308} {"train_loss": -21.618642807006836, "global_step": 108567, "epoch": 1308} {"train_loss": -21.766477584838867, "global_step": 108568, "epoch": 1308} {"train_loss": -21.486860275268555, "global_step": 108569, "epoch": 1308} {"train_loss": -21.818960189819336, "global_step": 108570, "epoch": 1308} {"train_loss": -21.34137535095215, "global_step": 108571, "epoch": 1308} {"train_loss": -21.82421875, "global_step": 108572, "epoch": 1308} {"train_loss": -21.767797470092773, "global_step": 108573, "epoch": 1308} {"train_loss": -22.00490379333496, "global_step": 108574, "epoch": 1308} {"train_loss": -21.89833641052246, "global_step": 108575, "epoch": 1308} {"train_loss": -21.815492630004883, "global_step": 108576, "epoch": 1308} {"train_loss": -22.134010314941406, "global_step": 108577, "epoch": 1308} {"train_loss": -21.922903060913086, "global_step": 108578, "epoch": 1308} {"train_loss": -21.801366806030273, "global_step": 108579, "epoch": 1308} {"train_loss": -21.933908462524414, "global_step": 108580, "epoch": 1308} {"train_loss": -21.859058380126953, "global_step": 108581, "epoch": 1308} {"train_loss": -21.600688934326172, "global_step": 108582, "epoch": 1308} {"train_loss": -21.806594848632812, "global_step": 108583, "epoch": 1308} {"train_loss": -21.834274291992188, "global_step": 108584, "epoch": 1308} {"train_loss": -22.003503799438477, "global_step": 108585, "epoch": 1308} {"train_loss": -22.248991012573242, "global_step": 108586, "epoch": 1308} {"train_loss": -22.12967300415039, "global_step": 108587, "epoch": 1308} {"train_loss": -22.038684844970703, "global_step": 108588, "epoch": 1308} {"train_loss": -22.263080596923828, "global_step": 108589, "epoch": 1308} {"train_loss": -22.283721923828125, "global_step": 108590, "epoch": 1308} {"train_loss": -21.976011276245117, "global_step": 108591, "epoch": 1308} {"train_loss": -22.225568771362305, "global_step": 108592, "epoch": 1308} {"train_loss": -22.054363250732422, "global_step": 108593, "epoch": 1308} {"train_loss": -22.050689697265625, "global_step": 108594, "epoch": 1308} {"train_loss": -22.013469696044922, "global_step": 108595, "epoch": 1308} {"train_loss": -22.434219360351562, "global_step": 108596, "epoch": 1308} {"train_loss": -22.258525848388672, "global_step": 108597, "epoch": 1308} {"train_loss": -22.03348159790039, "global_step": 108598, "epoch": 1308} {"train_loss": -22.170312881469727, "global_step": 108599, "epoch": 1308} {"train_loss": -22.25421142578125, "global_step": 108600, "epoch": 1308} {"train_loss": -22.10127067565918, "global_step": 108601, "epoch": 1308} {"train_loss": -22.067049026489258, "global_step": 108602, "epoch": 1308} {"train_loss": -21.662832260131836, "global_step": 108603, "epoch": 1308} {"train_loss": -22.154325485229492, "global_step": 108604, "epoch": 1308} {"train_loss": -22.281518936157227, "global_step": 108605, "epoch": 1308} {"train_loss": -21.911502838134766, "global_step": 108606, "epoch": 1308} {"train_loss": -21.941818237304688, "global_step": 108607, "epoch": 1308} {"train_loss": -21.820363998413086, "global_step": 108608, "epoch": 1308} {"train_loss": -22.103296279907227, "global_step": 108609, "epoch": 1308} {"train_loss": -21.782012939453125, "global_step": 108610, "epoch": 1308} {"train_loss": -22.166629791259766, "global_step": 108611, "epoch": 1308} {"train_loss": -22.1391658782959, "global_step": 108612, "epoch": 1308} {"train_loss": -21.954055786132812, "global_step": 108613, "epoch": 1308} {"train_loss": -22.24812889099121, "global_step": 108614, "epoch": 1308} {"train_loss": -21.885360717773438, "global_step": 108615, "epoch": 1308} {"train_loss": -22.19474220275879, "global_step": 108616, "epoch": 1308} {"train_loss": -22.50556182861328, "global_step": 108617, "epoch": 1308} {"train_loss": -22.44639015197754, "global_step": 108618, "epoch": 1308} {"train_loss": -22.365243911743164, "global_step": 108619, "epoch": 1308} {"train_loss": -22.501001358032227, "global_step": 108620, "epoch": 1308} {"train_loss": -21.99196434020996, "global_step": 108621, "epoch": 1308} {"train_loss": -21.779998779296875, "global_step": 108622, "epoch": 1308} {"train_loss": -22.191497802734375, "global_step": 108623, "epoch": 1308} {"train_loss": -21.850238800048828, "global_step": 108624, "epoch": 1308} {"train_loss": -22.421873092651367, "global_step": 108625, "epoch": 1308} {"train_loss": -22.2465877532959, "global_step": 108626, "epoch": 1308} {"train_loss": -22.231164932250977, "global_step": 108627, "epoch": 1308} {"train_loss": -21.876724243164062, "global_step": 108628, "epoch": 1308} {"train_loss": -22.475406646728516, "global_step": 108629, "epoch": 1308} {"train_loss": -22.074289321899414, "global_step": 108630, "epoch": 1308} {"train_loss": -22.45633888244629, "global_step": 108631, "epoch": 1308} {"train_loss": -22.30738639831543, "global_step": 108632, "epoch": 1308} {"train_loss": -22.0186824798584, "global_step": 108633, "epoch": 1308} {"train_loss": -22.322446823120117, "global_step": 108634, "epoch": 1308} {"train_loss": -22.378278732299805, "global_step": 108635, "epoch": 1308} {"train_loss": -21.88942527770996, "global_step": 108636, "epoch": 1308} {"train_loss": -22.582904815673828, "global_step": 108637, "epoch": 1308} {"train_loss": -22.373252868652344, "global_step": 108638, "epoch": 1308} {"train_loss": -22.435094833374023, "global_step": 108639, "epoch": 1308} {"train_loss": -22.010604858398438, "global_step": 108640, "epoch": 1308} {"train_loss": -21.847938537597656, "global_step": 108641, "epoch": 1308} {"train_loss": -22.277746200561523, "global_step": 108642, "epoch": 1308} {"train_loss": -21.856977462768555, "global_step": 108643, "epoch": 1308} {"train_loss": -22.6386661529541, "global_step": 108644, "epoch": 1308} {"train_loss": -21.839338302612305, "global_step": 108645, "epoch": 1308} {"train_loss": -22.05874819927905, "global_step": 108646, "epoch": 1308, "val_loss": 6224263.0} {"train_loss": -21.632755279541016, "global_step": 108647, "epoch": 1309} {"train_loss": -21.728315353393555, "global_step": 108648, "epoch": 1309} {"train_loss": -21.99979019165039, "global_step": 108649, "epoch": 1309} {"train_loss": -21.62640953063965, "global_step": 108650, "epoch": 1309} {"train_loss": -22.06146240234375, "global_step": 108651, "epoch": 1309} {"train_loss": -22.239212036132812, "global_step": 108652, "epoch": 1309} {"train_loss": -22.128936767578125, "global_step": 108653, "epoch": 1309} {"train_loss": -22.02449607849121, "global_step": 108654, "epoch": 1309} {"train_loss": -22.00662612915039, "global_step": 108655, "epoch": 1309} {"train_loss": -21.808738708496094, "global_step": 108656, "epoch": 1309} {"train_loss": -22.128917694091797, "global_step": 108657, "epoch": 1309} {"train_loss": -22.01240348815918, "global_step": 108658, "epoch": 1309} {"train_loss": -22.226896286010742, "global_step": 108659, "epoch": 1309} {"train_loss": -21.9404296875, "global_step": 108660, "epoch": 1309} {"train_loss": -21.860212326049805, "global_step": 108661, "epoch": 1309} {"train_loss": -21.951570510864258, "global_step": 108662, "epoch": 1309} {"train_loss": -22.1395206451416, "global_step": 108663, "epoch": 1309} {"train_loss": -21.901641845703125, "global_step": 108664, "epoch": 1309} {"train_loss": -22.0406436920166, "global_step": 108665, "epoch": 1309} {"train_loss": -21.979806900024414, "global_step": 108666, "epoch": 1309} {"train_loss": -22.054784774780273, "global_step": 108667, "epoch": 1309} {"train_loss": -22.18850326538086, "global_step": 108668, "epoch": 1309} {"train_loss": -22.175703048706055, "global_step": 108669, "epoch": 1309} {"train_loss": -22.210739135742188, "global_step": 108670, "epoch": 1309} {"train_loss": -22.175291061401367, "global_step": 108671, "epoch": 1309} {"train_loss": -22.05342674255371, "global_step": 108672, "epoch": 1309} {"train_loss": -22.401748657226562, "global_step": 108673, "epoch": 1309} {"train_loss": -22.197107315063477, "global_step": 108674, "epoch": 1309} {"train_loss": -22.091840744018555, "global_step": 108675, "epoch": 1309} {"train_loss": -22.41798210144043, "global_step": 108676, "epoch": 1309} {"train_loss": -22.14125633239746, "global_step": 108677, "epoch": 1309} {"train_loss": -22.0916748046875, "global_step": 108678, "epoch": 1309} {"train_loss": -22.201093673706055, "global_step": 108679, "epoch": 1309} {"train_loss": -22.450193405151367, "global_step": 108680, "epoch": 1309} {"train_loss": -22.200971603393555, "global_step": 108681, "epoch": 1309} {"train_loss": -21.851964950561523, "global_step": 108682, "epoch": 1309} {"train_loss": -22.322370529174805, "global_step": 108683, "epoch": 1309} {"train_loss": -22.446622848510742, "global_step": 108684, "epoch": 1309} {"train_loss": -22.209836959838867, "global_step": 108685, "epoch": 1309} {"train_loss": -22.21591567993164, "global_step": 108686, "epoch": 1309} {"train_loss": -22.402219772338867, "global_step": 108687, "epoch": 1309} {"train_loss": -22.20734214782715, "global_step": 108688, "epoch": 1309} {"train_loss": -22.44717788696289, "global_step": 108689, "epoch": 1309} {"train_loss": -22.3070011138916, "global_step": 108690, "epoch": 1309} {"train_loss": -22.53415298461914, "global_step": 108691, "epoch": 1309} {"train_loss": -22.458677291870117, "global_step": 108692, "epoch": 1309} {"train_loss": -22.266056060791016, "global_step": 108693, "epoch": 1309} {"train_loss": -22.530881881713867, "global_step": 108694, "epoch": 1309} {"train_loss": -22.274490356445312, "global_step": 108695, "epoch": 1309} {"train_loss": -22.19637107849121, "global_step": 108696, "epoch": 1309} {"train_loss": -22.157161712646484, "global_step": 108697, "epoch": 1309} {"train_loss": -22.481027603149414, "global_step": 108698, "epoch": 1309} {"train_loss": -22.20442008972168, "global_step": 108699, "epoch": 1309} {"train_loss": -22.140094757080078, "global_step": 108700, "epoch": 1309} {"train_loss": -22.204833984375, "global_step": 108701, "epoch": 1309} {"train_loss": -22.383031845092773, "global_step": 108702, "epoch": 1309} {"train_loss": -22.50486183166504, "global_step": 108703, "epoch": 1309} {"train_loss": -21.714189529418945, "global_step": 108704, "epoch": 1309} {"train_loss": -22.352628707885742, "global_step": 108705, "epoch": 1309} {"train_loss": -22.031631469726562, "global_step": 108706, "epoch": 1309} {"train_loss": -22.274526596069336, "global_step": 108707, "epoch": 1309} {"train_loss": -22.369529724121094, "global_step": 108708, "epoch": 1309} {"train_loss": -22.451011657714844, "global_step": 108709, "epoch": 1309} {"train_loss": -22.35709571838379, "global_step": 108710, "epoch": 1309} {"train_loss": -22.515621185302734, "global_step": 108711, "epoch": 1309} {"train_loss": -22.090423583984375, "global_step": 108712, "epoch": 1309} {"train_loss": -22.348392486572266, "global_step": 108713, "epoch": 1309} {"train_loss": -22.65511703491211, "global_step": 108714, "epoch": 1309} {"train_loss": -22.136478424072266, "global_step": 108715, "epoch": 1309} {"train_loss": -22.104074478149414, "global_step": 108716, "epoch": 1309} {"train_loss": -22.026182174682617, "global_step": 108717, "epoch": 1309} {"train_loss": -22.166791915893555, "global_step": 108718, "epoch": 1309} {"train_loss": -22.073150634765625, "global_step": 108719, "epoch": 1309} {"train_loss": -22.526212692260742, "global_step": 108720, "epoch": 1309} {"train_loss": -22.48590087890625, "global_step": 108721, "epoch": 1309} {"train_loss": -21.795042037963867, "global_step": 108722, "epoch": 1309} {"train_loss": -22.111534118652344, "global_step": 108723, "epoch": 1309} {"train_loss": -21.812204360961914, "global_step": 108724, "epoch": 1309} {"train_loss": -22.048948287963867, "global_step": 108725, "epoch": 1309} {"train_loss": -22.314722061157227, "global_step": 108726, "epoch": 1309} {"train_loss": -21.828893661499023, "global_step": 108727, "epoch": 1309} {"train_loss": -22.140111923217773, "global_step": 108728, "epoch": 1309} {"train_loss": -22.17571506730045, "global_step": 108729, "epoch": 1309, "val_loss": 6242001.0} {"train_loss": -21.86750602722168, "global_step": 108730, "epoch": 1310} {"train_loss": -21.342731475830078, "global_step": 108731, "epoch": 1310} {"train_loss": -21.77054214477539, "global_step": 108732, "epoch": 1310} {"train_loss": -22.086267471313477, "global_step": 108733, "epoch": 1310} {"train_loss": -21.659082412719727, "global_step": 108734, "epoch": 1310} {"train_loss": -21.69044303894043, "global_step": 108735, "epoch": 1310} {"train_loss": -22.088117599487305, "global_step": 108736, "epoch": 1310} {"train_loss": -21.89605712890625, "global_step": 108737, "epoch": 1310} {"train_loss": -22.045007705688477, "global_step": 108738, "epoch": 1310} {"train_loss": -22.24920082092285, "global_step": 108739, "epoch": 1310} {"train_loss": -22.05555534362793, "global_step": 108740, "epoch": 1310} {"train_loss": -21.793798446655273, "global_step": 108741, "epoch": 1310} {"train_loss": -22.31936264038086, "global_step": 108742, "epoch": 1310} {"train_loss": -21.958276748657227, "global_step": 108743, "epoch": 1310} {"train_loss": -22.29471206665039, "global_step": 108744, "epoch": 1310} {"train_loss": -22.306055068969727, "global_step": 108745, "epoch": 1310} {"train_loss": -21.900339126586914, "global_step": 108746, "epoch": 1310} {"train_loss": -22.0081844329834, "global_step": 108747, "epoch": 1310} {"train_loss": -22.120792388916016, "global_step": 108748, "epoch": 1310} {"train_loss": -21.97313690185547, "global_step": 108749, "epoch": 1310} {"train_loss": -22.19403076171875, "global_step": 108750, "epoch": 1310} {"train_loss": -22.11773109436035, "global_step": 108751, "epoch": 1310} {"train_loss": -22.165115356445312, "global_step": 108752, "epoch": 1310} {"train_loss": -22.204029083251953, "global_step": 108753, "epoch": 1310} {"train_loss": -22.17518424987793, "global_step": 108754, "epoch": 1310} {"train_loss": -22.00844383239746, "global_step": 108755, "epoch": 1310} {"train_loss": -21.895788192749023, "global_step": 108756, "epoch": 1310} {"train_loss": -21.883604049682617, "global_step": 108757, "epoch": 1310} {"train_loss": -22.44338035583496, "global_step": 108758, "epoch": 1310} {"train_loss": -22.1654109954834, "global_step": 108759, "epoch": 1310} {"train_loss": -22.234577178955078, "global_step": 108760, "epoch": 1310} {"train_loss": -22.15204429626465, "global_step": 108761, "epoch": 1310} {"train_loss": -22.111766815185547, "global_step": 108762, "epoch": 1310} {"train_loss": -22.273651123046875, "global_step": 108763, "epoch": 1310} {"train_loss": -22.465055465698242, "global_step": 108764, "epoch": 1310} {"train_loss": -22.094459533691406, "global_step": 108765, "epoch": 1310} {"train_loss": -22.2373104095459, "global_step": 108766, "epoch": 1310} {"train_loss": -21.955215454101562, "global_step": 108767, "epoch": 1310} {"train_loss": -22.41822624206543, "global_step": 108768, "epoch": 1310} {"train_loss": -22.546445846557617, "global_step": 108769, "epoch": 1310} {"train_loss": -21.96343994140625, "global_step": 108770, "epoch": 1310} {"train_loss": -22.050050735473633, "global_step": 108771, "epoch": 1310} {"train_loss": -22.561798095703125, "global_step": 108772, "epoch": 1310} {"train_loss": -22.22903823852539, "global_step": 108773, "epoch": 1310} {"train_loss": -22.574787139892578, "global_step": 108774, "epoch": 1310} {"train_loss": -22.23431968688965, "global_step": 108775, "epoch": 1310} {"train_loss": -22.334501266479492, "global_step": 108776, "epoch": 1310} {"train_loss": -22.289609909057617, "global_step": 108777, "epoch": 1310} {"train_loss": -22.431406021118164, "global_step": 108778, "epoch": 1310} {"train_loss": -22.135217666625977, "global_step": 108779, "epoch": 1310} {"train_loss": -22.098865509033203, "global_step": 108780, "epoch": 1310} {"train_loss": -22.158859252929688, "global_step": 108781, "epoch": 1310} {"train_loss": -22.20438003540039, "global_step": 108782, "epoch": 1310} {"train_loss": -22.2738094329834, "global_step": 108783, "epoch": 1310} {"train_loss": -22.06964683532715, "global_step": 108784, "epoch": 1310} {"train_loss": -22.051042556762695, "global_step": 108785, "epoch": 1310} {"train_loss": -22.435070037841797, "global_step": 108786, "epoch": 1310} {"train_loss": -22.19539451599121, "global_step": 108787, "epoch": 1310} {"train_loss": -22.299518585205078, "global_step": 108788, "epoch": 1310} {"train_loss": -22.342424392700195, "global_step": 108789, "epoch": 1310} {"train_loss": -22.640443801879883, "global_step": 108790, "epoch": 1310} {"train_loss": -22.31438636779785, "global_step": 108791, "epoch": 1310} {"train_loss": -22.5068359375, "global_step": 108792, "epoch": 1310} {"train_loss": -22.195371627807617, "global_step": 108793, "epoch": 1310} {"train_loss": -22.56087875366211, "global_step": 108794, "epoch": 1310} {"train_loss": -22.257492065429688, "global_step": 108795, "epoch": 1310} {"train_loss": -22.711109161376953, "global_step": 108796, "epoch": 1310} {"train_loss": -21.92854881286621, "global_step": 108797, "epoch": 1310} {"train_loss": -22.438777923583984, "global_step": 108798, "epoch": 1310} {"train_loss": -21.899412155151367, "global_step": 108799, "epoch": 1310} {"train_loss": -21.96792221069336, "global_step": 108800, "epoch": 1310} {"train_loss": -22.071121215820312, "global_step": 108801, "epoch": 1310} {"train_loss": -22.186206817626953, "global_step": 108802, "epoch": 1310} {"train_loss": -22.24517250061035, "global_step": 108803, "epoch": 1310} {"train_loss": -22.097942352294922, "global_step": 108804, "epoch": 1310} {"train_loss": -21.866384506225586, "global_step": 108805, "epoch": 1310} {"train_loss": -22.390369415283203, "global_step": 108806, "epoch": 1310} {"train_loss": -22.073627471923828, "global_step": 108807, "epoch": 1310} {"train_loss": -22.04120445251465, "global_step": 108808, "epoch": 1310} {"train_loss": -22.037893295288086, "global_step": 108809, "epoch": 1310} {"train_loss": -22.054027557373047, "global_step": 108810, "epoch": 1310} {"train_loss": -22.131025314331055, "global_step": 108811, "epoch": 1310} {"train_loss": -22.15221239572548, "global_step": 108812, "epoch": 1310, "val_loss": 6237104.0} {"train_loss": -21.89847755432129, "global_step": 108813, "epoch": 1311} {"train_loss": -21.954004287719727, "global_step": 108814, "epoch": 1311} {"train_loss": -21.899887084960938, "global_step": 108815, "epoch": 1311} {"train_loss": -21.94089698791504, "global_step": 108816, "epoch": 1311} {"train_loss": -22.011259078979492, "global_step": 108817, "epoch": 1311} {"train_loss": -21.335477828979492, "global_step": 108818, "epoch": 1311} {"train_loss": -21.960643768310547, "global_step": 108819, "epoch": 1311} {"train_loss": -21.84864616394043, "global_step": 108820, "epoch": 1311} {"train_loss": -21.915639877319336, "global_step": 108821, "epoch": 1311} {"train_loss": -22.323871612548828, "global_step": 108822, "epoch": 1311} {"train_loss": -21.945316314697266, "global_step": 108823, "epoch": 1311} {"train_loss": -22.375885009765625, "global_step": 108824, "epoch": 1311} {"train_loss": -22.004316329956055, "global_step": 108825, "epoch": 1311} {"train_loss": -21.866130828857422, "global_step": 108826, "epoch": 1311} {"train_loss": -22.650474548339844, "global_step": 108827, "epoch": 1311} {"train_loss": -22.228559494018555, "global_step": 108828, "epoch": 1311} {"train_loss": -21.95692253112793, "global_step": 108829, "epoch": 1311} {"train_loss": -22.377180099487305, "global_step": 108830, "epoch": 1311} {"train_loss": -22.415878295898438, "global_step": 108831, "epoch": 1311} {"train_loss": -22.2108154296875, "global_step": 108832, "epoch": 1311} {"train_loss": -22.163665771484375, "global_step": 108833, "epoch": 1311} {"train_loss": -22.004362106323242, "global_step": 108834, "epoch": 1311} {"train_loss": -22.371938705444336, "global_step": 108835, "epoch": 1311} {"train_loss": -22.150833129882812, "global_step": 108836, "epoch": 1311} {"train_loss": -22.360654830932617, "global_step": 108837, "epoch": 1311} {"train_loss": -22.07176399230957, "global_step": 108838, "epoch": 1311} {"train_loss": -22.231908798217773, "global_step": 108839, "epoch": 1311} {"train_loss": -22.225313186645508, "global_step": 108840, "epoch": 1311} {"train_loss": -22.549657821655273, "global_step": 108841, "epoch": 1311} {"train_loss": -22.04412841796875, "global_step": 108842, "epoch": 1311} {"train_loss": -22.35284996032715, "global_step": 108843, "epoch": 1311} {"train_loss": -22.364849090576172, "global_step": 108844, "epoch": 1311} {"train_loss": -22.230897903442383, "global_step": 108845, "epoch": 1311} {"train_loss": -22.017894744873047, "global_step": 108846, "epoch": 1311} {"train_loss": -22.517471313476562, "global_step": 108847, "epoch": 1311} {"train_loss": -22.238859176635742, "global_step": 108848, "epoch": 1311} {"train_loss": -22.036048889160156, "global_step": 108849, "epoch": 1311} {"train_loss": -22.462568283081055, "global_step": 108850, "epoch": 1311} {"train_loss": -21.946683883666992, "global_step": 108851, "epoch": 1311} {"train_loss": -22.049560546875, "global_step": 108852, "epoch": 1311} {"train_loss": -22.537134170532227, "global_step": 108853, "epoch": 1311} {"train_loss": -22.518030166625977, "global_step": 108854, "epoch": 1311} {"train_loss": -22.01180648803711, "global_step": 108855, "epoch": 1311} {"train_loss": -21.917932510375977, "global_step": 108856, "epoch": 1311} {"train_loss": -22.103408813476562, "global_step": 108857, "epoch": 1311} {"train_loss": -22.48121452331543, "global_step": 108858, "epoch": 1311} {"train_loss": -22.032161712646484, "global_step": 108859, "epoch": 1311} {"train_loss": -22.05348014831543, "global_step": 108860, "epoch": 1311} {"train_loss": -21.99509048461914, "global_step": 108861, "epoch": 1311} {"train_loss": -22.085187911987305, "global_step": 108862, "epoch": 1311} {"train_loss": -22.322254180908203, "global_step": 108863, "epoch": 1311} {"train_loss": -22.30323600769043, "global_step": 108864, "epoch": 1311} {"train_loss": -21.968280792236328, "global_step": 108865, "epoch": 1311} {"train_loss": -22.404659271240234, "global_step": 108866, "epoch": 1311} {"train_loss": -22.131084442138672, "global_step": 108867, "epoch": 1311} {"train_loss": -22.204984664916992, "global_step": 108868, "epoch": 1311} {"train_loss": -22.154142379760742, "global_step": 108869, "epoch": 1311} {"train_loss": -22.659046173095703, "global_step": 108870, "epoch": 1311} {"train_loss": -22.178939819335938, "global_step": 108871, "epoch": 1311} {"train_loss": -21.905752182006836, "global_step": 108872, "epoch": 1311} {"train_loss": -22.26650047302246, "global_step": 108873, "epoch": 1311} {"train_loss": -22.16167640686035, "global_step": 108874, "epoch": 1311} {"train_loss": -22.4139404296875, "global_step": 108875, "epoch": 1311} {"train_loss": -22.2860164642334, "global_step": 108876, "epoch": 1311} {"train_loss": -21.940603256225586, "global_step": 108877, "epoch": 1311} {"train_loss": -22.272092819213867, "global_step": 108878, "epoch": 1311} {"train_loss": -22.075654983520508, "global_step": 108879, "epoch": 1311} {"train_loss": -22.12721824645996, "global_step": 108880, "epoch": 1311} {"train_loss": -22.250614166259766, "global_step": 108881, "epoch": 1311} {"train_loss": -22.136423110961914, "global_step": 108882, "epoch": 1311} {"train_loss": -22.20918083190918, "global_step": 108883, "epoch": 1311} {"train_loss": -22.33310317993164, "global_step": 108884, "epoch": 1311} {"train_loss": -22.53070068359375, "global_step": 108885, "epoch": 1311} {"train_loss": -22.091856002807617, "global_step": 108886, "epoch": 1311} {"train_loss": -21.958593368530273, "global_step": 108887, "epoch": 1311} {"train_loss": -22.202167510986328, "global_step": 108888, "epoch": 1311} {"train_loss": -21.94879722595215, "global_step": 108889, "epoch": 1311} {"train_loss": -22.162145614624023, "global_step": 108890, "epoch": 1311} {"train_loss": -22.51411247253418, "global_step": 108891, "epoch": 1311} {"train_loss": -22.327362060546875, "global_step": 108892, "epoch": 1311} {"train_loss": -22.249530792236328, "global_step": 108893, "epoch": 1311} {"train_loss": -22.208662033081055, "global_step": 108894, "epoch": 1311} {"train_loss": -22.177453535148896, "global_step": 108895, "epoch": 1311, "val_loss": 6196715.5} {"train_loss": -21.14801597595215, "global_step": 108896, "epoch": 1312} {"train_loss": -21.790878295898438, "global_step": 108897, "epoch": 1312} {"train_loss": -21.980926513671875, "global_step": 108898, "epoch": 1312} {"train_loss": -22.121206283569336, "global_step": 108899, "epoch": 1312} {"train_loss": -21.74846839904785, "global_step": 108900, "epoch": 1312} {"train_loss": -21.6846923828125, "global_step": 108901, "epoch": 1312} {"train_loss": -22.27751350402832, "global_step": 108902, "epoch": 1312} {"train_loss": -22.327756881713867, "global_step": 108903, "epoch": 1312} {"train_loss": -21.928281784057617, "global_step": 108904, "epoch": 1312} {"train_loss": -22.029691696166992, "global_step": 108905, "epoch": 1312} {"train_loss": -22.159719467163086, "global_step": 108906, "epoch": 1312} {"train_loss": -22.08102798461914, "global_step": 108907, "epoch": 1312} {"train_loss": -22.18137550354004, "global_step": 108908, "epoch": 1312} {"train_loss": -22.366064071655273, "global_step": 108909, "epoch": 1312} {"train_loss": -21.986406326293945, "global_step": 108910, "epoch": 1312} {"train_loss": -22.29541015625, "global_step": 108911, "epoch": 1312} {"train_loss": -21.982818603515625, "global_step": 108912, "epoch": 1312} {"train_loss": -22.065393447875977, "global_step": 108913, "epoch": 1312} {"train_loss": -22.20341682434082, "global_step": 108914, "epoch": 1312} {"train_loss": -21.830509185791016, "global_step": 108915, "epoch": 1312} {"train_loss": -21.911182403564453, "global_step": 108916, "epoch": 1312} {"train_loss": -22.0450496673584, "global_step": 108917, "epoch": 1312} {"train_loss": -21.937002182006836, "global_step": 108918, "epoch": 1312} {"train_loss": -22.316741943359375, "global_step": 108919, "epoch": 1312} {"train_loss": -22.24676513671875, "global_step": 108920, "epoch": 1312} {"train_loss": -21.93277359008789, "global_step": 108921, "epoch": 1312} {"train_loss": -21.875795364379883, "global_step": 108922, "epoch": 1312} {"train_loss": -22.141725540161133, "global_step": 108923, "epoch": 1312} {"train_loss": -21.9403018951416, "global_step": 108924, "epoch": 1312} {"train_loss": -22.15623664855957, "global_step": 108925, "epoch": 1312} {"train_loss": -22.06467628479004, "global_step": 108926, "epoch": 1312} {"train_loss": -22.31900978088379, "global_step": 108927, "epoch": 1312} {"train_loss": -22.130386352539062, "global_step": 108928, "epoch": 1312} {"train_loss": -22.036977767944336, "global_step": 108929, "epoch": 1312} {"train_loss": -22.12882423400879, "global_step": 108930, "epoch": 1312} {"train_loss": -22.12618064880371, "global_step": 108931, "epoch": 1312} {"train_loss": -21.9549617767334, "global_step": 108932, "epoch": 1312} {"train_loss": -22.114709854125977, "global_step": 108933, "epoch": 1312} {"train_loss": -21.59053611755371, "global_step": 108934, "epoch": 1312} {"train_loss": -22.286794662475586, "global_step": 108935, "epoch": 1312} {"train_loss": -22.619041442871094, "global_step": 108936, "epoch": 1312} {"train_loss": -22.242177963256836, "global_step": 108937, "epoch": 1312} {"train_loss": -22.026948928833008, "global_step": 108938, "epoch": 1312} {"train_loss": -22.04660987854004, "global_step": 108939, "epoch": 1312} {"train_loss": -21.83058738708496, "global_step": 108940, "epoch": 1312} {"train_loss": -22.166833877563477, "global_step": 108941, "epoch": 1312} {"train_loss": -21.82044792175293, "global_step": 108942, "epoch": 1312} {"train_loss": -22.56275749206543, "global_step": 108943, "epoch": 1312} {"train_loss": -22.431509017944336, "global_step": 108944, "epoch": 1312} {"train_loss": -22.302358627319336, "global_step": 108945, "epoch": 1312} {"train_loss": -22.638029098510742, "global_step": 108946, "epoch": 1312} {"train_loss": -22.260921478271484, "global_step": 108947, "epoch": 1312} {"train_loss": -22.556669235229492, "global_step": 108948, "epoch": 1312} {"train_loss": -22.398542404174805, "global_step": 108949, "epoch": 1312} {"train_loss": -22.337665557861328, "global_step": 108950, "epoch": 1312} {"train_loss": -22.236921310424805, "global_step": 108951, "epoch": 1312} {"train_loss": -21.985036849975586, "global_step": 108952, "epoch": 1312} {"train_loss": -21.89004135131836, "global_step": 108953, "epoch": 1312} {"train_loss": -22.00240135192871, "global_step": 108954, "epoch": 1312} {"train_loss": -22.158918380737305, "global_step": 108955, "epoch": 1312} {"train_loss": -22.064510345458984, "global_step": 108956, "epoch": 1312} {"train_loss": -22.497150421142578, "global_step": 108957, "epoch": 1312} {"train_loss": -22.253284454345703, "global_step": 108958, "epoch": 1312} {"train_loss": -22.732349395751953, "global_step": 108959, "epoch": 1312} {"train_loss": -22.441015243530273, "global_step": 108960, "epoch": 1312} {"train_loss": -22.05343246459961, "global_step": 108961, "epoch": 1312} {"train_loss": -22.104299545288086, "global_step": 108962, "epoch": 1312} {"train_loss": -22.192716598510742, "global_step": 108963, "epoch": 1312} {"train_loss": -22.69910430908203, "global_step": 108964, "epoch": 1312} {"train_loss": -22.46555519104004, "global_step": 108965, "epoch": 1312} {"train_loss": -22.414039611816406, "global_step": 108966, "epoch": 1312} {"train_loss": -22.249736785888672, "global_step": 108967, "epoch": 1312} {"train_loss": -22.429718017578125, "global_step": 108968, "epoch": 1312} {"train_loss": -22.037466049194336, "global_step": 108969, "epoch": 1312} {"train_loss": -22.276123046875, "global_step": 108970, "epoch": 1312} {"train_loss": -22.15761375427246, "global_step": 108971, "epoch": 1312} {"train_loss": -22.208282470703125, "global_step": 108972, "epoch": 1312} {"train_loss": -22.3740291595459, "global_step": 108973, "epoch": 1312} {"train_loss": -22.51788902282715, "global_step": 108974, "epoch": 1312} {"train_loss": -22.244001388549805, "global_step": 108975, "epoch": 1312} {"train_loss": -22.259384155273438, "global_step": 108976, "epoch": 1312} {"train_loss": -22.45131492614746, "global_step": 108977, "epoch": 1312} {"train_loss": -22.16724161354892, "global_step": 108978, "epoch": 1312, "val_loss": 6059492.0} {"train_loss": -21.860321044921875, "global_step": 108979, "epoch": 1313} {"train_loss": -21.295377731323242, "global_step": 108980, "epoch": 1313} {"train_loss": -21.443313598632812, "global_step": 108981, "epoch": 1313} {"train_loss": -22.319046020507812, "global_step": 108982, "epoch": 1313} {"train_loss": -22.152271270751953, "global_step": 108983, "epoch": 1313} {"train_loss": -21.70246124267578, "global_step": 108984, "epoch": 1313} {"train_loss": -21.97944450378418, "global_step": 108985, "epoch": 1313} {"train_loss": -21.5355224609375, "global_step": 108986, "epoch": 1313} {"train_loss": -21.858678817749023, "global_step": 108987, "epoch": 1313} {"train_loss": -22.198713302612305, "global_step": 108988, "epoch": 1313} {"train_loss": -22.264938354492188, "global_step": 108989, "epoch": 1313} {"train_loss": -22.266698837280273, "global_step": 108990, "epoch": 1313} {"train_loss": -22.243396759033203, "global_step": 108991, "epoch": 1313} {"train_loss": -22.162763595581055, "global_step": 108992, "epoch": 1313} {"train_loss": -22.25492286682129, "global_step": 108993, "epoch": 1313} {"train_loss": -22.169307708740234, "global_step": 108994, "epoch": 1313} {"train_loss": -22.243616104125977, "global_step": 108995, "epoch": 1313} {"train_loss": -22.063602447509766, "global_step": 108996, "epoch": 1313} {"train_loss": -22.265857696533203, "global_step": 108997, "epoch": 1313} {"train_loss": -21.976795196533203, "global_step": 108998, "epoch": 1313} {"train_loss": -22.45015525817871, "global_step": 108999, "epoch": 1313} {"train_loss": -22.297199249267578, "global_step": 109000, "epoch": 1313} {"train_loss": -22.212419509887695, "global_step": 109001, "epoch": 1313} {"train_loss": -22.354938507080078, "global_step": 109002, "epoch": 1313} {"train_loss": -22.113874435424805, "global_step": 109003, "epoch": 1313} {"train_loss": -22.478565216064453, "global_step": 109004, "epoch": 1313} {"train_loss": -22.042272567749023, "global_step": 109005, "epoch": 1313} {"train_loss": -22.274057388305664, "global_step": 109006, "epoch": 1313} {"train_loss": -22.41597557067871, "global_step": 109007, "epoch": 1313} {"train_loss": -21.841373443603516, "global_step": 109008, "epoch": 1313} {"train_loss": -22.142953872680664, "global_step": 109009, "epoch": 1313} {"train_loss": -22.07478141784668, "global_step": 109010, "epoch": 1313} {"train_loss": -22.342992782592773, "global_step": 109011, "epoch": 1313} {"train_loss": -22.49493408203125, "global_step": 109012, "epoch": 1313} {"train_loss": -22.205142974853516, "global_step": 109013, "epoch": 1313} {"train_loss": -22.413599014282227, "global_step": 109014, "epoch": 1313} {"train_loss": -22.135290145874023, "global_step": 109015, "epoch": 1313} {"train_loss": -22.262842178344727, "global_step": 109016, "epoch": 1313} {"train_loss": -22.5452823638916, "global_step": 109017, "epoch": 1313} {"train_loss": -22.231473922729492, "global_step": 109018, "epoch": 1313} {"train_loss": -22.206953048706055, "global_step": 109019, "epoch": 1313} {"train_loss": -22.24150276184082, "global_step": 109020, "epoch": 1313} {"train_loss": -22.19252586364746, "global_step": 109021, "epoch": 1313} {"train_loss": -22.49074935913086, "global_step": 109022, "epoch": 1313} {"train_loss": -22.28602409362793, "global_step": 109023, "epoch": 1313} {"train_loss": -21.882123947143555, "global_step": 109024, "epoch": 1313} {"train_loss": -22.152572631835938, "global_step": 109025, "epoch": 1313} {"train_loss": -22.108963012695312, "global_step": 109026, "epoch": 1313} {"train_loss": -22.285551071166992, "global_step": 109027, "epoch": 1313} {"train_loss": -22.297697067260742, "global_step": 109028, "epoch": 1313} {"train_loss": -22.15789222717285, "global_step": 109029, "epoch": 1313} {"train_loss": -21.93562126159668, "global_step": 109030, "epoch": 1313} {"train_loss": -22.28839111328125, "global_step": 109031, "epoch": 1313} {"train_loss": -22.419029235839844, "global_step": 109032, "epoch": 1313} {"train_loss": -22.109357833862305, "global_step": 109033, "epoch": 1313} {"train_loss": -22.20949363708496, "global_step": 109034, "epoch": 1313} {"train_loss": -22.34465980529785, "global_step": 109035, "epoch": 1313} {"train_loss": -22.13521385192871, "global_step": 109036, "epoch": 1313} {"train_loss": -22.294523239135742, "global_step": 109037, "epoch": 1313} {"train_loss": -22.184446334838867, "global_step": 109038, "epoch": 1313} {"train_loss": -22.311725616455078, "global_step": 109039, "epoch": 1313} {"train_loss": -21.94045066833496, "global_step": 109040, "epoch": 1313} {"train_loss": -21.951492309570312, "global_step": 109041, "epoch": 1313} {"train_loss": -22.019872665405273, "global_step": 109042, "epoch": 1313} {"train_loss": -22.40070915222168, "global_step": 109043, "epoch": 1313} {"train_loss": -22.114055633544922, "global_step": 109044, "epoch": 1313} {"train_loss": -21.802412033081055, "global_step": 109045, "epoch": 1313} {"train_loss": -21.8162841796875, "global_step": 109046, "epoch": 1313} {"train_loss": -22.0072078704834, "global_step": 109047, "epoch": 1313} {"train_loss": -22.437992095947266, "global_step": 109048, "epoch": 1313} {"train_loss": -22.201778411865234, "global_step": 109049, "epoch": 1313} {"train_loss": -22.186185836791992, "global_step": 109050, "epoch": 1313} {"train_loss": -22.126684188842773, "global_step": 109051, "epoch": 1313} {"train_loss": -22.38213348388672, "global_step": 109052, "epoch": 1313} {"train_loss": -22.36862564086914, "global_step": 109053, "epoch": 1313} {"train_loss": -21.9518985748291, "global_step": 109054, "epoch": 1313} {"train_loss": -21.698774337768555, "global_step": 109055, "epoch": 1313} {"train_loss": -22.33061981201172, "global_step": 109056, "epoch": 1313} {"train_loss": -21.7916202545166, "global_step": 109057, "epoch": 1313} {"train_loss": -22.4417781829834, "global_step": 109058, "epoch": 1313} {"train_loss": -22.599334716796875, "global_step": 109059, "epoch": 1313} {"train_loss": -22.30032730102539, "global_step": 109060, "epoch": 1313} {"train_loss": -22.15088469723621, "global_step": 109061, "epoch": 1313, "val_loss": 6252223.0} {"train_loss": -21.078710556030273, "global_step": 109062, "epoch": 1314} {"train_loss": -21.401723861694336, "global_step": 109063, "epoch": 1314} {"train_loss": -21.78383445739746, "global_step": 109064, "epoch": 1314} {"train_loss": -21.91436767578125, "global_step": 109065, "epoch": 1314} {"train_loss": -21.445770263671875, "global_step": 109066, "epoch": 1314} {"train_loss": -21.745010375976562, "global_step": 109067, "epoch": 1314} {"train_loss": -21.751678466796875, "global_step": 109068, "epoch": 1314} {"train_loss": -21.993207931518555, "global_step": 109069, "epoch": 1314} {"train_loss": -21.87350082397461, "global_step": 109070, "epoch": 1314} {"train_loss": -22.27682876586914, "global_step": 109071, "epoch": 1314} {"train_loss": -22.182355880737305, "global_step": 109072, "epoch": 1314} {"train_loss": -22.069995880126953, "global_step": 109073, "epoch": 1314} {"train_loss": -22.101533889770508, "global_step": 109074, "epoch": 1314} {"train_loss": -22.217884063720703, "global_step": 109075, "epoch": 1314} {"train_loss": -21.87194061279297, "global_step": 109076, "epoch": 1314} {"train_loss": -22.139606475830078, "global_step": 109077, "epoch": 1314} {"train_loss": -21.883607864379883, "global_step": 109078, "epoch": 1314} {"train_loss": -22.43181610107422, "global_step": 109079, "epoch": 1314} {"train_loss": -22.284259796142578, "global_step": 109080, "epoch": 1314} {"train_loss": -22.192928314208984, "global_step": 109081, "epoch": 1314} {"train_loss": -21.811201095581055, "global_step": 109082, "epoch": 1314} {"train_loss": -22.042417526245117, "global_step": 109083, "epoch": 1314} {"train_loss": -21.931310653686523, "global_step": 109084, "epoch": 1314} {"train_loss": -21.92901611328125, "global_step": 109085, "epoch": 1314} {"train_loss": -22.076684951782227, "global_step": 109086, "epoch": 1314} {"train_loss": -22.289247512817383, "global_step": 109087, "epoch": 1314} {"train_loss": -21.98348045349121, "global_step": 109088, "epoch": 1314} {"train_loss": -22.170888900756836, "global_step": 109089, "epoch": 1314} {"train_loss": -21.96413803100586, "global_step": 109090, "epoch": 1314} {"train_loss": -22.167146682739258, "global_step": 109091, "epoch": 1314} {"train_loss": -22.28534507751465, "global_step": 109092, "epoch": 1314} {"train_loss": -22.03705406188965, "global_step": 109093, "epoch": 1314} {"train_loss": -22.21507453918457, "global_step": 109094, "epoch": 1314} {"train_loss": -22.31076431274414, "global_step": 109095, "epoch": 1314} {"train_loss": -22.055423736572266, "global_step": 109096, "epoch": 1314} {"train_loss": -22.26919937133789, "global_step": 109097, "epoch": 1314} {"train_loss": -22.205114364624023, "global_step": 109098, "epoch": 1314} {"train_loss": -22.424543380737305, "global_step": 109099, "epoch": 1314} {"train_loss": -22.069660186767578, "global_step": 109100, "epoch": 1314} {"train_loss": -22.07349967956543, "global_step": 109101, "epoch": 1314} {"train_loss": -22.58415985107422, "global_step": 109102, "epoch": 1314} {"train_loss": -21.986215591430664, "global_step": 109103, "epoch": 1314} {"train_loss": -22.088315963745117, "global_step": 109104, "epoch": 1314} {"train_loss": -22.306886672973633, "global_step": 109105, "epoch": 1314} {"train_loss": -22.259836196899414, "global_step": 109106, "epoch": 1314} {"train_loss": -22.200105667114258, "global_step": 109107, "epoch": 1314} {"train_loss": -22.271873474121094, "global_step": 109108, "epoch": 1314} {"train_loss": -22.258893966674805, "global_step": 109109, "epoch": 1314} {"train_loss": -22.45619773864746, "global_step": 109110, "epoch": 1314} {"train_loss": -22.322574615478516, "global_step": 109111, "epoch": 1314} {"train_loss": -22.374183654785156, "global_step": 109112, "epoch": 1314} {"train_loss": -22.529891967773438, "global_step": 109113, "epoch": 1314} {"train_loss": -22.791635513305664, "global_step": 109114, "epoch": 1314} {"train_loss": -22.329504013061523, "global_step": 109115, "epoch": 1314} {"train_loss": -22.410785675048828, "global_step": 109116, "epoch": 1314} {"train_loss": -22.2843074798584, "global_step": 109117, "epoch": 1314} {"train_loss": -22.190387725830078, "global_step": 109118, "epoch": 1314} {"train_loss": -22.732519149780273, "global_step": 109119, "epoch": 1314} {"train_loss": -22.479110717773438, "global_step": 109120, "epoch": 1314} {"train_loss": -22.13677215576172, "global_step": 109121, "epoch": 1314} {"train_loss": -22.168119430541992, "global_step": 109122, "epoch": 1314} {"train_loss": -22.42534065246582, "global_step": 109123, "epoch": 1314} {"train_loss": -22.307981491088867, "global_step": 109124, "epoch": 1314} {"train_loss": -22.02509880065918, "global_step": 109125, "epoch": 1314} {"train_loss": -22.43115997314453, "global_step": 109126, "epoch": 1314} {"train_loss": -22.282827377319336, "global_step": 109127, "epoch": 1314} {"train_loss": -22.544530868530273, "global_step": 109128, "epoch": 1314} {"train_loss": -22.235883712768555, "global_step": 109129, "epoch": 1314} {"train_loss": -22.07732582092285, "global_step": 109130, "epoch": 1314} {"train_loss": -22.342864990234375, "global_step": 109131, "epoch": 1314} {"train_loss": -22.567609786987305, "global_step": 109132, "epoch": 1314} {"train_loss": -22.136865615844727, "global_step": 109133, "epoch": 1314} {"train_loss": -21.7376651763916, "global_step": 109134, "epoch": 1314} {"train_loss": -22.323606491088867, "global_step": 109135, "epoch": 1314} {"train_loss": -22.14683723449707, "global_step": 109136, "epoch": 1314} {"train_loss": -22.041189193725586, "global_step": 109137, "epoch": 1314} {"train_loss": -22.489418029785156, "global_step": 109138, "epoch": 1314} {"train_loss": -22.487716674804688, "global_step": 109139, "epoch": 1314} {"train_loss": -22.34992218017578, "global_step": 109140, "epoch": 1314} {"train_loss": -22.26313591003418, "global_step": 109141, "epoch": 1314} {"train_loss": -22.36362075805664, "global_step": 109142, "epoch": 1314} {"train_loss": -22.4034481048584, "global_step": 109143, "epoch": 1314} {"train_loss": -22.154611472623895, "global_step": 109144, "epoch": 1314, "val_loss": 6124942.0} {"train_loss": -22.000818252563477, "global_step": 109145, "epoch": 1315} {"train_loss": -21.86165428161621, "global_step": 109146, "epoch": 1315} {"train_loss": -21.803926467895508, "global_step": 109147, "epoch": 1315} {"train_loss": -22.54359245300293, "global_step": 109148, "epoch": 1315} {"train_loss": -21.564044952392578, "global_step": 109149, "epoch": 1315} {"train_loss": -22.14305877685547, "global_step": 109150, "epoch": 1315} {"train_loss": -22.00843048095703, "global_step": 109151, "epoch": 1315} {"train_loss": -21.814558029174805, "global_step": 109152, "epoch": 1315} {"train_loss": -22.078540802001953, "global_step": 109153, "epoch": 1315} {"train_loss": -21.846176147460938, "global_step": 109154, "epoch": 1315} {"train_loss": -22.245769500732422, "global_step": 109155, "epoch": 1315} {"train_loss": -22.46082878112793, "global_step": 109156, "epoch": 1315} {"train_loss": -22.280248641967773, "global_step": 109157, "epoch": 1315} {"train_loss": -22.155216217041016, "global_step": 109158, "epoch": 1315} {"train_loss": -22.192956924438477, "global_step": 109159, "epoch": 1315} {"train_loss": -22.106876373291016, "global_step": 109160, "epoch": 1315} {"train_loss": -21.79114532470703, "global_step": 109161, "epoch": 1315} {"train_loss": -22.51013946533203, "global_step": 109162, "epoch": 1315} {"train_loss": -22.152568817138672, "global_step": 109163, "epoch": 1315} {"train_loss": -22.601408004760742, "global_step": 109164, "epoch": 1315} {"train_loss": -22.276138305664062, "global_step": 109165, "epoch": 1315} {"train_loss": -22.691415786743164, "global_step": 109166, "epoch": 1315} {"train_loss": -22.15509605407715, "global_step": 109167, "epoch": 1315} {"train_loss": -22.5112247467041, "global_step": 109168, "epoch": 1315} {"train_loss": -22.066572189331055, "global_step": 109169, "epoch": 1315} {"train_loss": -22.1380615234375, "global_step": 109170, "epoch": 1315} {"train_loss": -22.50855827331543, "global_step": 109171, "epoch": 1315} {"train_loss": -22.301273345947266, "global_step": 109172, "epoch": 1315} {"train_loss": -21.985916137695312, "global_step": 109173, "epoch": 1315} {"train_loss": -22.508737564086914, "global_step": 109174, "epoch": 1315} {"train_loss": -22.39760398864746, "global_step": 109175, "epoch": 1315} {"train_loss": -22.444124221801758, "global_step": 109176, "epoch": 1315} {"train_loss": -22.089630126953125, "global_step": 109177, "epoch": 1315} {"train_loss": -22.377817153930664, "global_step": 109178, "epoch": 1315} {"train_loss": -22.253604888916016, "global_step": 109179, "epoch": 1315} {"train_loss": -21.98662757873535, "global_step": 109180, "epoch": 1315} {"train_loss": -22.219985961914062, "global_step": 109181, "epoch": 1315} {"train_loss": -22.300689697265625, "global_step": 109182, "epoch": 1315} {"train_loss": -22.0577449798584, "global_step": 109183, "epoch": 1315} {"train_loss": -22.161680221557617, "global_step": 109184, "epoch": 1315} {"train_loss": -22.49799919128418, "global_step": 109185, "epoch": 1315} {"train_loss": -22.226409912109375, "global_step": 109186, "epoch": 1315} {"train_loss": -22.01197624206543, "global_step": 109187, "epoch": 1315} {"train_loss": -22.118955612182617, "global_step": 109188, "epoch": 1315} {"train_loss": -22.394113540649414, "global_step": 109189, "epoch": 1315} {"train_loss": -22.2810115814209, "global_step": 109190, "epoch": 1315} {"train_loss": -22.19502067565918, "global_step": 109191, "epoch": 1315} {"train_loss": -21.695484161376953, "global_step": 109192, "epoch": 1315} {"train_loss": -22.690603256225586, "global_step": 109193, "epoch": 1315} {"train_loss": -22.673091888427734, "global_step": 109194, "epoch": 1315} {"train_loss": -22.17945671081543, "global_step": 109195, "epoch": 1315} {"train_loss": -21.990325927734375, "global_step": 109196, "epoch": 1315} {"train_loss": -22.12062644958496, "global_step": 109197, "epoch": 1315} {"train_loss": -22.161174774169922, "global_step": 109198, "epoch": 1315} {"train_loss": -22.175765991210938, "global_step": 109199, "epoch": 1315} {"train_loss": -21.82334327697754, "global_step": 109200, "epoch": 1315} {"train_loss": -22.306119918823242, "global_step": 109201, "epoch": 1315} {"train_loss": -22.355859756469727, "global_step": 109202, "epoch": 1315} {"train_loss": -22.36008071899414, "global_step": 109203, "epoch": 1315} {"train_loss": -22.23615837097168, "global_step": 109204, "epoch": 1315} {"train_loss": -22.048755645751953, "global_step": 109205, "epoch": 1315} {"train_loss": -22.275114059448242, "global_step": 109206, "epoch": 1315} {"train_loss": -21.9454288482666, "global_step": 109207, "epoch": 1315} {"train_loss": -22.286035537719727, "global_step": 109208, "epoch": 1315} {"train_loss": -22.294275283813477, "global_step": 109209, "epoch": 1315} {"train_loss": -22.275291442871094, "global_step": 109210, "epoch": 1315} {"train_loss": -22.92361831665039, "global_step": 109211, "epoch": 1315} {"train_loss": -22.613916397094727, "global_step": 109212, "epoch": 1315} {"train_loss": -22.091291427612305, "global_step": 109213, "epoch": 1315} {"train_loss": -22.199485778808594, "global_step": 109214, "epoch": 1315} {"train_loss": -22.41602897644043, "global_step": 109215, "epoch": 1315} {"train_loss": -22.01234245300293, "global_step": 109216, "epoch": 1315} {"train_loss": -21.566434860229492, "global_step": 109217, "epoch": 1315} {"train_loss": -22.087961196899414, "global_step": 109218, "epoch": 1315} {"train_loss": -22.34885597229004, "global_step": 109219, "epoch": 1315} {"train_loss": -22.107351303100586, "global_step": 109220, "epoch": 1315} {"train_loss": -22.161996841430664, "global_step": 109221, "epoch": 1315} {"train_loss": -21.719701766967773, "global_step": 109222, "epoch": 1315} {"train_loss": -22.042776107788086, "global_step": 109223, "epoch": 1315} {"train_loss": -22.06015396118164, "global_step": 109224, "epoch": 1315} {"train_loss": -21.756601333618164, "global_step": 109225, "epoch": 1315} {"train_loss": -21.950170516967773, "global_step": 109226, "epoch": 1315} {"train_loss": -22.198629976755164, "global_step": 109227, "epoch": 1315, "val_loss": 6245254.0} {"train_loss": -21.813983917236328, "global_step": 109228, "epoch": 1316} {"train_loss": -21.793476104736328, "global_step": 109229, "epoch": 1316} {"train_loss": -21.962900161743164, "global_step": 109230, "epoch": 1316} {"train_loss": -21.829164505004883, "global_step": 109231, "epoch": 1316} {"train_loss": -21.715795516967773, "global_step": 109232, "epoch": 1316} {"train_loss": -21.916593551635742, "global_step": 109233, "epoch": 1316} {"train_loss": -21.429533004760742, "global_step": 109234, "epoch": 1316} {"train_loss": -22.408714294433594, "global_step": 109235, "epoch": 1316} {"train_loss": -21.761167526245117, "global_step": 109236, "epoch": 1316} {"train_loss": -21.86421012878418, "global_step": 109237, "epoch": 1316} {"train_loss": -22.22481346130371, "global_step": 109238, "epoch": 1316} {"train_loss": -22.093475341796875, "global_step": 109239, "epoch": 1316} {"train_loss": -22.190183639526367, "global_step": 109240, "epoch": 1316} {"train_loss": -21.958288192749023, "global_step": 109241, "epoch": 1316} {"train_loss": -22.202070236206055, "global_step": 109242, "epoch": 1316} {"train_loss": -22.17190933227539, "global_step": 109243, "epoch": 1316} {"train_loss": -22.111007690429688, "global_step": 109244, "epoch": 1316} {"train_loss": -22.247913360595703, "global_step": 109245, "epoch": 1316} {"train_loss": -22.396390914916992, "global_step": 109246, "epoch": 1316} {"train_loss": -21.81600570678711, "global_step": 109247, "epoch": 1316} {"train_loss": -21.869285583496094, "global_step": 109248, "epoch": 1316} {"train_loss": -22.41501808166504, "global_step": 109249, "epoch": 1316} {"train_loss": -22.22235679626465, "global_step": 109250, "epoch": 1316} {"train_loss": -22.02863883972168, "global_step": 109251, "epoch": 1316} {"train_loss": -22.017393112182617, "global_step": 109252, "epoch": 1316} {"train_loss": -22.20956802368164, "global_step": 109253, "epoch": 1316} {"train_loss": -22.591928482055664, "global_step": 109254, "epoch": 1316} {"train_loss": -22.184446334838867, "global_step": 109255, "epoch": 1316} {"train_loss": -22.358999252319336, "global_step": 109256, "epoch": 1316} {"train_loss": -22.073444366455078, "global_step": 109257, "epoch": 1316} {"train_loss": -22.013751983642578, "global_step": 109258, "epoch": 1316} {"train_loss": -22.47401237487793, "global_step": 109259, "epoch": 1316} {"train_loss": -22.15656852722168, "global_step": 109260, "epoch": 1316} {"train_loss": -22.470705032348633, "global_step": 109261, "epoch": 1316} {"train_loss": -21.99970817565918, "global_step": 109262, "epoch": 1316} {"train_loss": -22.415664672851562, "global_step": 109263, "epoch": 1316} {"train_loss": -22.112585067749023, "global_step": 109264, "epoch": 1316} {"train_loss": -22.483762741088867, "global_step": 109265, "epoch": 1316} {"train_loss": -22.034969329833984, "global_step": 109266, "epoch": 1316} {"train_loss": -22.18513298034668, "global_step": 109267, "epoch": 1316} {"train_loss": -21.756322860717773, "global_step": 109268, "epoch": 1316} {"train_loss": -22.23111343383789, "global_step": 109269, "epoch": 1316} {"train_loss": -22.49481773376465, "global_step": 109270, "epoch": 1316} {"train_loss": -22.289886474609375, "global_step": 109271, "epoch": 1316} {"train_loss": -22.384939193725586, "global_step": 109272, "epoch": 1316} {"train_loss": -22.39320945739746, "global_step": 109273, "epoch": 1316} {"train_loss": -22.263099670410156, "global_step": 109274, "epoch": 1316} {"train_loss": -22.27546501159668, "global_step": 109275, "epoch": 1316} {"train_loss": -22.371707916259766, "global_step": 109276, "epoch": 1316} {"train_loss": -22.167661666870117, "global_step": 109277, "epoch": 1316} {"train_loss": -22.371408462524414, "global_step": 109278, "epoch": 1316} {"train_loss": -22.412736892700195, "global_step": 109279, "epoch": 1316} {"train_loss": -22.42036247253418, "global_step": 109280, "epoch": 1316} {"train_loss": -22.15907859802246, "global_step": 109281, "epoch": 1316} {"train_loss": -22.748966217041016, "global_step": 109282, "epoch": 1316} {"train_loss": -21.97531509399414, "global_step": 109283, "epoch": 1316} {"train_loss": -22.190523147583008, "global_step": 109284, "epoch": 1316} {"train_loss": -22.41105079650879, "global_step": 109285, "epoch": 1316} {"train_loss": -22.117095947265625, "global_step": 109286, "epoch": 1316} {"train_loss": -22.55146026611328, "global_step": 109287, "epoch": 1316} {"train_loss": -22.239295959472656, "global_step": 109288, "epoch": 1316} {"train_loss": -22.02271842956543, "global_step": 109289, "epoch": 1316} {"train_loss": -22.51168441772461, "global_step": 109290, "epoch": 1316} {"train_loss": -21.905351638793945, "global_step": 109291, "epoch": 1316} {"train_loss": -22.27260971069336, "global_step": 109292, "epoch": 1316} {"train_loss": -22.38484001159668, "global_step": 109293, "epoch": 1316} {"train_loss": -22.368955612182617, "global_step": 109294, "epoch": 1316} {"train_loss": -22.539594650268555, "global_step": 109295, "epoch": 1316} {"train_loss": -21.9815616607666, "global_step": 109296, "epoch": 1316} {"train_loss": -22.321874618530273, "global_step": 109297, "epoch": 1316} {"train_loss": -22.311954498291016, "global_step": 109298, "epoch": 1316} {"train_loss": -22.05341148376465, "global_step": 109299, "epoch": 1316} {"train_loss": -22.604089736938477, "global_step": 109300, "epoch": 1316} {"train_loss": -22.321659088134766, "global_step": 109301, "epoch": 1316} {"train_loss": -22.039281845092773, "global_step": 109302, "epoch": 1316} {"train_loss": -21.83613395690918, "global_step": 109303, "epoch": 1316} {"train_loss": -21.477357864379883, "global_step": 109304, "epoch": 1316} {"train_loss": -22.053077697753906, "global_step": 109305, "epoch": 1316} {"train_loss": -22.185941696166992, "global_step": 109306, "epoch": 1316} {"train_loss": -22.062816619873047, "global_step": 109307, "epoch": 1316} {"train_loss": -22.002988815307617, "global_step": 109308, "epoch": 1316} {"train_loss": -21.886192321777344, "global_step": 109309, "epoch": 1316} {"train_loss": -22.16330808616546, "global_step": 109310, "epoch": 1316, "val_loss": 6154677.0} {"train_loss": -21.599485397338867, "global_step": 109311, "epoch": 1317} {"train_loss": -21.740617752075195, "global_step": 109312, "epoch": 1317} {"train_loss": -21.765047073364258, "global_step": 109313, "epoch": 1317} {"train_loss": -21.81662940979004, "global_step": 109314, "epoch": 1317} {"train_loss": -21.67793083190918, "global_step": 109315, "epoch": 1317} {"train_loss": -21.790090560913086, "global_step": 109316, "epoch": 1317} {"train_loss": -21.668249130249023, "global_step": 109317, "epoch": 1317} {"train_loss": -21.72020721435547, "global_step": 109318, "epoch": 1317} {"train_loss": -21.833251953125, "global_step": 109319, "epoch": 1317} {"train_loss": -21.779157638549805, "global_step": 109320, "epoch": 1317} {"train_loss": -21.40846824645996, "global_step": 109321, "epoch": 1317} {"train_loss": -21.804244995117188, "global_step": 109322, "epoch": 1317} {"train_loss": -22.223669052124023, "global_step": 109323, "epoch": 1317} {"train_loss": -21.827102661132812, "global_step": 109324, "epoch": 1317} {"train_loss": -21.905820846557617, "global_step": 109325, "epoch": 1317} {"train_loss": -22.586219787597656, "global_step": 109326, "epoch": 1317} {"train_loss": -21.913869857788086, "global_step": 109327, "epoch": 1317} {"train_loss": -22.09214210510254, "global_step": 109328, "epoch": 1317} {"train_loss": -22.176536560058594, "global_step": 109329, "epoch": 1317} {"train_loss": -21.887781143188477, "global_step": 109330, "epoch": 1317} {"train_loss": -22.18391990661621, "global_step": 109331, "epoch": 1317} {"train_loss": -22.08518409729004, "global_step": 109332, "epoch": 1317} {"train_loss": -22.135709762573242, "global_step": 109333, "epoch": 1317} {"train_loss": -22.35302734375, "global_step": 109334, "epoch": 1317} {"train_loss": -22.465011596679688, "global_step": 109335, "epoch": 1317} {"train_loss": -22.023469924926758, "global_step": 109336, "epoch": 1317} {"train_loss": -22.121435165405273, "global_step": 109337, "epoch": 1317} {"train_loss": -22.28213119506836, "global_step": 109338, "epoch": 1317} {"train_loss": -22.40460205078125, "global_step": 109339, "epoch": 1317} {"train_loss": -22.186059951782227, "global_step": 109340, "epoch": 1317} {"train_loss": -22.015335083007812, "global_step": 109341, "epoch": 1317} {"train_loss": -21.948556900024414, "global_step": 109342, "epoch": 1317} {"train_loss": -22.487415313720703, "global_step": 109343, "epoch": 1317} {"train_loss": -22.128454208374023, "global_step": 109344, "epoch": 1317} {"train_loss": -22.485570907592773, "global_step": 109345, "epoch": 1317} {"train_loss": -22.068384170532227, "global_step": 109346, "epoch": 1317} {"train_loss": -22.14198112487793, "global_step": 109347, "epoch": 1317} {"train_loss": -22.092666625976562, "global_step": 109348, "epoch": 1317} {"train_loss": -22.295316696166992, "global_step": 109349, "epoch": 1317} {"train_loss": -22.359994888305664, "global_step": 109350, "epoch": 1317} {"train_loss": -22.20499038696289, "global_step": 109351, "epoch": 1317} {"train_loss": -22.069337844848633, "global_step": 109352, "epoch": 1317} {"train_loss": -22.40900230407715, "global_step": 109353, "epoch": 1317} {"train_loss": -22.285429000854492, "global_step": 109354, "epoch": 1317} {"train_loss": -22.153518676757812, "global_step": 109355, "epoch": 1317} {"train_loss": -21.78585433959961, "global_step": 109356, "epoch": 1317} {"train_loss": -22.502471923828125, "global_step": 109357, "epoch": 1317} {"train_loss": -21.856416702270508, "global_step": 109358, "epoch": 1317} {"train_loss": -22.141210556030273, "global_step": 109359, "epoch": 1317} {"train_loss": -22.182926177978516, "global_step": 109360, "epoch": 1317} {"train_loss": -22.700345993041992, "global_step": 109361, "epoch": 1317} {"train_loss": -22.08342742919922, "global_step": 109362, "epoch": 1317} {"train_loss": -22.498361587524414, "global_step": 109363, "epoch": 1317} {"train_loss": -21.941944122314453, "global_step": 109364, "epoch": 1317} {"train_loss": -22.174943923950195, "global_step": 109365, "epoch": 1317} {"train_loss": -22.195180892944336, "global_step": 109366, "epoch": 1317} {"train_loss": -22.530771255493164, "global_step": 109367, "epoch": 1317} {"train_loss": -22.306379318237305, "global_step": 109368, "epoch": 1317} {"train_loss": -22.313749313354492, "global_step": 109369, "epoch": 1317} {"train_loss": -22.446313858032227, "global_step": 109370, "epoch": 1317} {"train_loss": -22.4642276763916, "global_step": 109371, "epoch": 1317} {"train_loss": -22.252843856811523, "global_step": 109372, "epoch": 1317} {"train_loss": -22.389808654785156, "global_step": 109373, "epoch": 1317} {"train_loss": -22.50873374938965, "global_step": 109374, "epoch": 1317} {"train_loss": -22.589679718017578, "global_step": 109375, "epoch": 1317} {"train_loss": -22.190837860107422, "global_step": 109376, "epoch": 1317} {"train_loss": -22.158857345581055, "global_step": 109377, "epoch": 1317} {"train_loss": -22.116466522216797, "global_step": 109378, "epoch": 1317} {"train_loss": -22.314563751220703, "global_step": 109379, "epoch": 1317} {"train_loss": -22.50440788269043, "global_step": 109380, "epoch": 1317} {"train_loss": -22.354215621948242, "global_step": 109381, "epoch": 1317} {"train_loss": -22.201847076416016, "global_step": 109382, "epoch": 1317} {"train_loss": -22.507246017456055, "global_step": 109383, "epoch": 1317} {"train_loss": -21.997114181518555, "global_step": 109384, "epoch": 1317} {"train_loss": -22.489089965820312, "global_step": 109385, "epoch": 1317} {"train_loss": -22.053159713745117, "global_step": 109386, "epoch": 1317} {"train_loss": -22.33553123474121, "global_step": 109387, "epoch": 1317} {"train_loss": -22.44720458984375, "global_step": 109388, "epoch": 1317} {"train_loss": -21.992752075195312, "global_step": 109389, "epoch": 1317} {"train_loss": -22.142118453979492, "global_step": 109390, "epoch": 1317} {"train_loss": -22.180007934570312, "global_step": 109391, "epoch": 1317} {"train_loss": -22.45686149597168, "global_step": 109392, "epoch": 1317} {"train_loss": -22.15728173772973, "global_step": 109393, "epoch": 1317, "val_loss": 6304685.0} {"train_loss": -20.680612564086914, "global_step": 109394, "epoch": 1318} {"train_loss": -21.55388069152832, "global_step": 109395, "epoch": 1318} {"train_loss": -21.11246681213379, "global_step": 109396, "epoch": 1318} {"train_loss": -21.439786911010742, "global_step": 109397, "epoch": 1318} {"train_loss": -21.54817771911621, "global_step": 109398, "epoch": 1318} {"train_loss": -21.591779708862305, "global_step": 109399, "epoch": 1318} {"train_loss": -21.71449089050293, "global_step": 109400, "epoch": 1318} {"train_loss": -22.061254501342773, "global_step": 109401, "epoch": 1318} {"train_loss": -21.45833396911621, "global_step": 109402, "epoch": 1318} {"train_loss": -21.263797760009766, "global_step": 109403, "epoch": 1318} {"train_loss": -21.910715103149414, "global_step": 109404, "epoch": 1318} {"train_loss": -21.647192001342773, "global_step": 109405, "epoch": 1318} {"train_loss": -22.008394241333008, "global_step": 109406, "epoch": 1318} {"train_loss": -21.84112548828125, "global_step": 109407, "epoch": 1318} {"train_loss": -21.78815460205078, "global_step": 109408, "epoch": 1318} {"train_loss": -21.83387565612793, "global_step": 109409, "epoch": 1318} {"train_loss": -21.823591232299805, "global_step": 109410, "epoch": 1318} {"train_loss": -21.799509048461914, "global_step": 109411, "epoch": 1318} {"train_loss": -21.70866584777832, "global_step": 109412, "epoch": 1318} {"train_loss": -21.964317321777344, "global_step": 109413, "epoch": 1318} {"train_loss": -21.89694595336914, "global_step": 109414, "epoch": 1318} {"train_loss": -22.215497970581055, "global_step": 109415, "epoch": 1318} {"train_loss": -21.893457412719727, "global_step": 109416, "epoch": 1318} {"train_loss": -21.939441680908203, "global_step": 109417, "epoch": 1318} {"train_loss": -21.727914810180664, "global_step": 109418, "epoch": 1318} {"train_loss": -22.133695602416992, "global_step": 109419, "epoch": 1318} {"train_loss": -22.436853408813477, "global_step": 109420, "epoch": 1318} {"train_loss": -22.225656509399414, "global_step": 109421, "epoch": 1318} {"train_loss": -21.96160125732422, "global_step": 109422, "epoch": 1318} {"train_loss": -22.180160522460938, "global_step": 109423, "epoch": 1318} {"train_loss": -22.106876373291016, "global_step": 109424, "epoch": 1318} {"train_loss": -22.13957405090332, "global_step": 109425, "epoch": 1318} {"train_loss": -22.35972785949707, "global_step": 109426, "epoch": 1318} {"train_loss": -22.235076904296875, "global_step": 109427, "epoch": 1318} {"train_loss": -22.691638946533203, "global_step": 109428, "epoch": 1318} {"train_loss": -22.580245971679688, "global_step": 109429, "epoch": 1318} {"train_loss": -22.15985107421875, "global_step": 109430, "epoch": 1318} {"train_loss": -22.54265785217285, "global_step": 109431, "epoch": 1318} {"train_loss": -22.690961837768555, "global_step": 109432, "epoch": 1318} {"train_loss": -22.19174575805664, "global_step": 109433, "epoch": 1318} {"train_loss": -22.350788116455078, "global_step": 109434, "epoch": 1318} {"train_loss": -22.325620651245117, "global_step": 109435, "epoch": 1318} {"train_loss": -22.69514274597168, "global_step": 109436, "epoch": 1318} {"train_loss": -22.3525447845459, "global_step": 109437, "epoch": 1318} {"train_loss": -22.408618927001953, "global_step": 109438, "epoch": 1318} {"train_loss": -22.826505661010742, "global_step": 109439, "epoch": 1318} {"train_loss": -22.100311279296875, "global_step": 109440, "epoch": 1318} {"train_loss": -22.42618751525879, "global_step": 109441, "epoch": 1318} {"train_loss": -22.452102661132812, "global_step": 109442, "epoch": 1318} {"train_loss": -22.517858505249023, "global_step": 109443, "epoch": 1318} {"train_loss": -22.65622329711914, "global_step": 109444, "epoch": 1318} {"train_loss": -22.456735610961914, "global_step": 109445, "epoch": 1318} {"train_loss": -22.22938346862793, "global_step": 109446, "epoch": 1318} {"train_loss": -21.919816970825195, "global_step": 109447, "epoch": 1318} {"train_loss": -21.928115844726562, "global_step": 109448, "epoch": 1318} {"train_loss": -22.774372100830078, "global_step": 109449, "epoch": 1318} {"train_loss": -22.450960159301758, "global_step": 109450, "epoch": 1318} {"train_loss": -22.31376075744629, "global_step": 109451, "epoch": 1318} {"train_loss": -22.270736694335938, "global_step": 109452, "epoch": 1318} {"train_loss": -22.333681106567383, "global_step": 109453, "epoch": 1318} {"train_loss": -22.133987426757812, "global_step": 109454, "epoch": 1318} {"train_loss": -22.023344039916992, "global_step": 109455, "epoch": 1318} {"train_loss": -22.366546630859375, "global_step": 109456, "epoch": 1318} {"train_loss": -22.305356979370117, "global_step": 109457, "epoch": 1318} {"train_loss": -22.42436408996582, "global_step": 109458, "epoch": 1318} {"train_loss": -22.43961524963379, "global_step": 109459, "epoch": 1318} {"train_loss": -22.058103561401367, "global_step": 109460, "epoch": 1318} {"train_loss": -22.53521728515625, "global_step": 109461, "epoch": 1318} {"train_loss": -22.188560485839844, "global_step": 109462, "epoch": 1318} {"train_loss": -22.36625099182129, "global_step": 109463, "epoch": 1318} {"train_loss": -22.13483238220215, "global_step": 109464, "epoch": 1318} {"train_loss": -22.119287490844727, "global_step": 109465, "epoch": 1318} {"train_loss": -21.912282943725586, "global_step": 109466, "epoch": 1318} {"train_loss": -21.889158248901367, "global_step": 109467, "epoch": 1318} {"train_loss": -22.513477325439453, "global_step": 109468, "epoch": 1318} {"train_loss": -22.292951583862305, "global_step": 109469, "epoch": 1318} {"train_loss": -22.294057846069336, "global_step": 109470, "epoch": 1318} {"train_loss": -22.061107635498047, "global_step": 109471, "epoch": 1318} {"train_loss": -22.096330642700195, "global_step": 109472, "epoch": 1318} {"train_loss": -22.149213790893555, "global_step": 109473, "epoch": 1318} {"train_loss": -22.036304473876953, "global_step": 109474, "epoch": 1318} {"train_loss": -22.38397789001465, "global_step": 109475, "epoch": 1318} {"train_loss": -22.10397943243923, "global_step": 109476, "epoch": 1318, "val_loss": 6135353.5} {"train_loss": -22.037839889526367, "global_step": 109477, "epoch": 1319} {"train_loss": -21.685958862304688, "global_step": 109478, "epoch": 1319} {"train_loss": -22.02279281616211, "global_step": 109479, "epoch": 1319} {"train_loss": -21.719816207885742, "global_step": 109480, "epoch": 1319} {"train_loss": -22.032636642456055, "global_step": 109481, "epoch": 1319} {"train_loss": -21.812604904174805, "global_step": 109482, "epoch": 1319} {"train_loss": -22.184757232666016, "global_step": 109483, "epoch": 1319} {"train_loss": -21.636445999145508, "global_step": 109484, "epoch": 1319} {"train_loss": -22.25018310546875, "global_step": 109485, "epoch": 1319} {"train_loss": -22.044565200805664, "global_step": 109486, "epoch": 1319} {"train_loss": -22.37587547302246, "global_step": 109487, "epoch": 1319} {"train_loss": -21.847139358520508, "global_step": 109488, "epoch": 1319} {"train_loss": -22.216060638427734, "global_step": 109489, "epoch": 1319} {"train_loss": -21.846662521362305, "global_step": 109490, "epoch": 1319} {"train_loss": -22.024442672729492, "global_step": 109491, "epoch": 1319} {"train_loss": -21.940702438354492, "global_step": 109492, "epoch": 1319} {"train_loss": -21.980268478393555, "global_step": 109493, "epoch": 1319} {"train_loss": -22.2331600189209, "global_step": 109494, "epoch": 1319} {"train_loss": -22.065855026245117, "global_step": 109495, "epoch": 1319} {"train_loss": -21.914730072021484, "global_step": 109496, "epoch": 1319} {"train_loss": -22.322431564331055, "global_step": 109497, "epoch": 1319} {"train_loss": -22.3242130279541, "global_step": 109498, "epoch": 1319} {"train_loss": -22.11675453186035, "global_step": 109499, "epoch": 1319} {"train_loss": -22.39581871032715, "global_step": 109500, "epoch": 1319} {"train_loss": -22.53776741027832, "global_step": 109501, "epoch": 1319} {"train_loss": -22.00680923461914, "global_step": 109502, "epoch": 1319} {"train_loss": -22.58509635925293, "global_step": 109503, "epoch": 1319} {"train_loss": -22.424192428588867, "global_step": 109504, "epoch": 1319} {"train_loss": -22.361234664916992, "global_step": 109505, "epoch": 1319} {"train_loss": -22.18317222595215, "global_step": 109506, "epoch": 1319} {"train_loss": -22.18863296508789, "global_step": 109507, "epoch": 1319} {"train_loss": -22.088176727294922, "global_step": 109508, "epoch": 1319} {"train_loss": -22.17926025390625, "global_step": 109509, "epoch": 1319} {"train_loss": -22.069807052612305, "global_step": 109510, "epoch": 1319} {"train_loss": -22.2349796295166, "global_step": 109511, "epoch": 1319} {"train_loss": -22.058996200561523, "global_step": 109512, "epoch": 1319} {"train_loss": -22.138858795166016, "global_step": 109513, "epoch": 1319} {"train_loss": -21.786418914794922, "global_step": 109514, "epoch": 1319} {"train_loss": -21.82823371887207, "global_step": 109515, "epoch": 1319} {"train_loss": -21.980112075805664, "global_step": 109516, "epoch": 1319} {"train_loss": -22.266098022460938, "global_step": 109517, "epoch": 1319} {"train_loss": -21.959867477416992, "global_step": 109518, "epoch": 1319} {"train_loss": -22.05533790588379, "global_step": 109519, "epoch": 1319} {"train_loss": -21.862838745117188, "global_step": 109520, "epoch": 1319} {"train_loss": -22.054542541503906, "global_step": 109521, "epoch": 1319} {"train_loss": -22.036779403686523, "global_step": 109522, "epoch": 1319} {"train_loss": -22.131759643554688, "global_step": 109523, "epoch": 1319} {"train_loss": -21.988346099853516, "global_step": 109524, "epoch": 1319} {"train_loss": -22.385637283325195, "global_step": 109525, "epoch": 1319} {"train_loss": -22.09360694885254, "global_step": 109526, "epoch": 1319} {"train_loss": -21.882160186767578, "global_step": 109527, "epoch": 1319} {"train_loss": -22.39803123474121, "global_step": 109528, "epoch": 1319} {"train_loss": -21.7260684967041, "global_step": 109529, "epoch": 1319} {"train_loss": -22.522607803344727, "global_step": 109530, "epoch": 1319} {"train_loss": -22.240407943725586, "global_step": 109531, "epoch": 1319} {"train_loss": -21.880659103393555, "global_step": 109532, "epoch": 1319} {"train_loss": -22.323486328125, "global_step": 109533, "epoch": 1319} {"train_loss": -22.850019454956055, "global_step": 109534, "epoch": 1319} {"train_loss": -22.397565841674805, "global_step": 109535, "epoch": 1319} {"train_loss": -22.299619674682617, "global_step": 109536, "epoch": 1319} {"train_loss": -22.436147689819336, "global_step": 109537, "epoch": 1319} {"train_loss": -22.43573570251465, "global_step": 109538, "epoch": 1319} {"train_loss": -22.14893341064453, "global_step": 109539, "epoch": 1319} {"train_loss": -22.684112548828125, "global_step": 109540, "epoch": 1319} {"train_loss": -22.017690658569336, "global_step": 109541, "epoch": 1319} {"train_loss": -22.070356369018555, "global_step": 109542, "epoch": 1319} {"train_loss": -22.271316528320312, "global_step": 109543, "epoch": 1319} {"train_loss": -22.0647029876709, "global_step": 109544, "epoch": 1319} {"train_loss": -22.1905517578125, "global_step": 109545, "epoch": 1319} {"train_loss": -21.979888916015625, "global_step": 109546, "epoch": 1319} {"train_loss": -22.413829803466797, "global_step": 109547, "epoch": 1319} {"train_loss": -22.335481643676758, "global_step": 109548, "epoch": 1319} {"train_loss": -22.200307846069336, "global_step": 109549, "epoch": 1319} {"train_loss": -22.248315811157227, "global_step": 109550, "epoch": 1319} {"train_loss": -22.11875343322754, "global_step": 109551, "epoch": 1319} {"train_loss": -22.34872817993164, "global_step": 109552, "epoch": 1319} {"train_loss": -21.93539810180664, "global_step": 109553, "epoch": 1319} {"train_loss": -22.00436782836914, "global_step": 109554, "epoch": 1319} {"train_loss": -22.14278221130371, "global_step": 109555, "epoch": 1319} {"train_loss": -22.466054916381836, "global_step": 109556, "epoch": 1319} {"train_loss": -22.148046493530273, "global_step": 109557, "epoch": 1319} {"train_loss": -21.899246215820312, "global_step": 109558, "epoch": 1319} {"train_loss": -22.14127869203866, "global_step": 109559, "epoch": 1319, "val_loss": 6140687.5} {"train_loss": -21.92763328552246, "global_step": 109560, "epoch": 1320} {"train_loss": -21.384918212890625, "global_step": 109561, "epoch": 1320} {"train_loss": -21.487394332885742, "global_step": 109562, "epoch": 1320} {"train_loss": -22.380847930908203, "global_step": 109563, "epoch": 1320} {"train_loss": -21.797313690185547, "global_step": 109564, "epoch": 1320} {"train_loss": -22.292043685913086, "global_step": 109565, "epoch": 1320} {"train_loss": -21.86482810974121, "global_step": 109566, "epoch": 1320} {"train_loss": -22.013534545898438, "global_step": 109567, "epoch": 1320} {"train_loss": -21.976781845092773, "global_step": 109568, "epoch": 1320} {"train_loss": -21.69709587097168, "global_step": 109569, "epoch": 1320} {"train_loss": -22.050018310546875, "global_step": 109570, "epoch": 1320} {"train_loss": -21.813772201538086, "global_step": 109571, "epoch": 1320} {"train_loss": -21.766284942626953, "global_step": 109572, "epoch": 1320} {"train_loss": -21.81683921813965, "global_step": 109573, "epoch": 1320} {"train_loss": -22.330366134643555, "global_step": 109574, "epoch": 1320} {"train_loss": -22.326814651489258, "global_step": 109575, "epoch": 1320} {"train_loss": -22.044300079345703, "global_step": 109576, "epoch": 1320} {"train_loss": -22.279571533203125, "global_step": 109577, "epoch": 1320} {"train_loss": -22.398208618164062, "global_step": 109578, "epoch": 1320} {"train_loss": -22.169004440307617, "global_step": 109579, "epoch": 1320} {"train_loss": -22.249971389770508, "global_step": 109580, "epoch": 1320} {"train_loss": -22.200170516967773, "global_step": 109581, "epoch": 1320} {"train_loss": -22.185672760009766, "global_step": 109582, "epoch": 1320} {"train_loss": -22.45816993713379, "global_step": 109583, "epoch": 1320} {"train_loss": -22.368375778198242, "global_step": 109584, "epoch": 1320} {"train_loss": -22.252628326416016, "global_step": 109585, "epoch": 1320} {"train_loss": -21.81764030456543, "global_step": 109586, "epoch": 1320} {"train_loss": -21.989835739135742, "global_step": 109587, "epoch": 1320} {"train_loss": -22.29831314086914, "global_step": 109588, "epoch": 1320} {"train_loss": -22.11250114440918, "global_step": 109589, "epoch": 1320} {"train_loss": -22.04901123046875, "global_step": 109590, "epoch": 1320} {"train_loss": -22.444181442260742, "global_step": 109591, "epoch": 1320} {"train_loss": -21.697813034057617, "global_step": 109592, "epoch": 1320} {"train_loss": -21.932207107543945, "global_step": 109593, "epoch": 1320} {"train_loss": -21.755142211914062, "global_step": 109594, "epoch": 1320} {"train_loss": -21.864233016967773, "global_step": 109595, "epoch": 1320} {"train_loss": -22.015859603881836, "global_step": 109596, "epoch": 1320} {"train_loss": -22.17363166809082, "global_step": 109597, "epoch": 1320} {"train_loss": -22.082468032836914, "global_step": 109598, "epoch": 1320} {"train_loss": -22.114913940429688, "global_step": 109599, "epoch": 1320} {"train_loss": -21.90462303161621, "global_step": 109600, "epoch": 1320} {"train_loss": -22.424842834472656, "global_step": 109601, "epoch": 1320} {"train_loss": -22.01756477355957, "global_step": 109602, "epoch": 1320} {"train_loss": -22.145376205444336, "global_step": 109603, "epoch": 1320} {"train_loss": -22.470291137695312, "global_step": 109604, "epoch": 1320} {"train_loss": -21.993270874023438, "global_step": 109605, "epoch": 1320} {"train_loss": -22.462692260742188, "global_step": 109606, "epoch": 1320} {"train_loss": -22.262008666992188, "global_step": 109607, "epoch": 1320} {"train_loss": -22.164077758789062, "global_step": 109608, "epoch": 1320} {"train_loss": -22.13201332092285, "global_step": 109609, "epoch": 1320} {"train_loss": -21.875625610351562, "global_step": 109610, "epoch": 1320} {"train_loss": -22.460126876831055, "global_step": 109611, "epoch": 1320} {"train_loss": -22.46722984313965, "global_step": 109612, "epoch": 1320} {"train_loss": -22.414718627929688, "global_step": 109613, "epoch": 1320} {"train_loss": -21.96835708618164, "global_step": 109614, "epoch": 1320} {"train_loss": -22.192792892456055, "global_step": 109615, "epoch": 1320} {"train_loss": -22.380352020263672, "global_step": 109616, "epoch": 1320} {"train_loss": -22.649274826049805, "global_step": 109617, "epoch": 1320} {"train_loss": -22.065061569213867, "global_step": 109618, "epoch": 1320} {"train_loss": -22.135244369506836, "global_step": 109619, "epoch": 1320} {"train_loss": -22.04768943786621, "global_step": 109620, "epoch": 1320} {"train_loss": -22.522907257080078, "global_step": 109621, "epoch": 1320} {"train_loss": -22.30787467956543, "global_step": 109622, "epoch": 1320} {"train_loss": -22.250089645385742, "global_step": 109623, "epoch": 1320} {"train_loss": -22.33485984802246, "global_step": 109624, "epoch": 1320} {"train_loss": -22.194869995117188, "global_step": 109625, "epoch": 1320} {"train_loss": -22.251413345336914, "global_step": 109626, "epoch": 1320} {"train_loss": -21.838897705078125, "global_step": 109627, "epoch": 1320} {"train_loss": -22.05264663696289, "global_step": 109628, "epoch": 1320} {"train_loss": -21.991907119750977, "global_step": 109629, "epoch": 1320} {"train_loss": -22.488004684448242, "global_step": 109630, "epoch": 1320} {"train_loss": -22.193830490112305, "global_step": 109631, "epoch": 1320} {"train_loss": -22.1270809173584, "global_step": 109632, "epoch": 1320} {"train_loss": -22.07105827331543, "global_step": 109633, "epoch": 1320} {"train_loss": -22.218421936035156, "global_step": 109634, "epoch": 1320} {"train_loss": -22.55389976501465, "global_step": 109635, "epoch": 1320} {"train_loss": -22.355649948120117, "global_step": 109636, "epoch": 1320} {"train_loss": -22.58173179626465, "global_step": 109637, "epoch": 1320} {"train_loss": -22.23792839050293, "global_step": 109638, "epoch": 1320} {"train_loss": -22.635953903198242, "global_step": 109639, "epoch": 1320} {"train_loss": -22.485193252563477, "global_step": 109640, "epoch": 1320} {"train_loss": -22.734399795532227, "global_step": 109641, "epoch": 1320} {"train_loss": -22.154767185808666, "global_step": 109642, "epoch": 1320, "val_loss": 6277107.0} {"train_loss": -21.646608352661133, "global_step": 109643, "epoch": 1321} {"train_loss": -22.078031539916992, "global_step": 109644, "epoch": 1321} {"train_loss": -21.743532180786133, "global_step": 109645, "epoch": 1321} {"train_loss": -21.65553092956543, "global_step": 109646, "epoch": 1321} {"train_loss": -21.7705135345459, "global_step": 109647, "epoch": 1321} {"train_loss": -22.146881103515625, "global_step": 109648, "epoch": 1321} {"train_loss": -21.946426391601562, "global_step": 109649, "epoch": 1321} {"train_loss": -21.599611282348633, "global_step": 109650, "epoch": 1321} {"train_loss": -21.893510818481445, "global_step": 109651, "epoch": 1321} {"train_loss": -21.90152359008789, "global_step": 109652, "epoch": 1321} {"train_loss": -22.156789779663086, "global_step": 109653, "epoch": 1321} {"train_loss": -21.963665008544922, "global_step": 109654, "epoch": 1321} {"train_loss": -21.978635787963867, "global_step": 109655, "epoch": 1321} {"train_loss": -22.228195190429688, "global_step": 109656, "epoch": 1321} {"train_loss": -22.30223846435547, "global_step": 109657, "epoch": 1321} {"train_loss": -22.118581771850586, "global_step": 109658, "epoch": 1321} {"train_loss": -22.32575798034668, "global_step": 109659, "epoch": 1321} {"train_loss": -22.11528968811035, "global_step": 109660, "epoch": 1321} {"train_loss": -22.164600372314453, "global_step": 109661, "epoch": 1321} {"train_loss": -22.219858169555664, "global_step": 109662, "epoch": 1321} {"train_loss": -22.17377281188965, "global_step": 109663, "epoch": 1321} {"train_loss": -22.231353759765625, "global_step": 109664, "epoch": 1321} {"train_loss": -22.201074600219727, "global_step": 109665, "epoch": 1321} {"train_loss": -22.205060958862305, "global_step": 109666, "epoch": 1321} {"train_loss": -22.032512664794922, "global_step": 109667, "epoch": 1321} {"train_loss": -22.049238204956055, "global_step": 109668, "epoch": 1321} {"train_loss": -22.129066467285156, "global_step": 109669, "epoch": 1321} {"train_loss": -22.447229385375977, "global_step": 109670, "epoch": 1321} {"train_loss": -22.180973052978516, "global_step": 109671, "epoch": 1321} {"train_loss": -22.462310791015625, "global_step": 109672, "epoch": 1321} {"train_loss": -22.41407585144043, "global_step": 109673, "epoch": 1321} {"train_loss": -22.332059860229492, "global_step": 109674, "epoch": 1321} {"train_loss": -22.28048324584961, "global_step": 109675, "epoch": 1321} {"train_loss": -22.305208206176758, "global_step": 109676, "epoch": 1321} {"train_loss": -22.2338924407959, "global_step": 109677, "epoch": 1321} {"train_loss": -22.527219772338867, "global_step": 109678, "epoch": 1321} {"train_loss": -22.387903213500977, "global_step": 109679, "epoch": 1321} {"train_loss": -22.535505294799805, "global_step": 109680, "epoch": 1321} {"train_loss": -22.079151153564453, "global_step": 109681, "epoch": 1321} {"train_loss": -22.248193740844727, "global_step": 109682, "epoch": 1321} {"train_loss": -22.423397064208984, "global_step": 109683, "epoch": 1321} {"train_loss": -22.141698837280273, "global_step": 109684, "epoch": 1321} {"train_loss": -22.82118034362793, "global_step": 109685, "epoch": 1321} {"train_loss": -22.2002010345459, "global_step": 109686, "epoch": 1321} {"train_loss": -22.331409454345703, "global_step": 109687, "epoch": 1321} {"train_loss": -22.344999313354492, "global_step": 109688, "epoch": 1321} {"train_loss": -22.619945526123047, "global_step": 109689, "epoch": 1321} {"train_loss": -21.732065200805664, "global_step": 109690, "epoch": 1321} {"train_loss": -22.272764205932617, "global_step": 109691, "epoch": 1321} {"train_loss": -22.136720657348633, "global_step": 109692, "epoch": 1321} {"train_loss": -22.403350830078125, "global_step": 109693, "epoch": 1321} {"train_loss": -22.14784812927246, "global_step": 109694, "epoch": 1321} {"train_loss": -22.413305282592773, "global_step": 109695, "epoch": 1321} {"train_loss": -22.310083389282227, "global_step": 109696, "epoch": 1321} {"train_loss": -22.213796615600586, "global_step": 109697, "epoch": 1321} {"train_loss": -22.059341430664062, "global_step": 109698, "epoch": 1321} {"train_loss": -22.17154312133789, "global_step": 109699, "epoch": 1321} {"train_loss": -22.409910202026367, "global_step": 109700, "epoch": 1321} {"train_loss": -22.083810806274414, "global_step": 109701, "epoch": 1321} {"train_loss": -22.2716064453125, "global_step": 109702, "epoch": 1321} {"train_loss": -22.05333137512207, "global_step": 109703, "epoch": 1321} {"train_loss": -22.239397048950195, "global_step": 109704, "epoch": 1321} {"train_loss": -22.329219818115234, "global_step": 109705, "epoch": 1321} {"train_loss": -22.369388580322266, "global_step": 109706, "epoch": 1321} {"train_loss": -22.296459197998047, "global_step": 109707, "epoch": 1321} {"train_loss": -22.124393463134766, "global_step": 109708, "epoch": 1321} {"train_loss": -22.410104751586914, "global_step": 109709, "epoch": 1321} {"train_loss": -21.929609298706055, "global_step": 109710, "epoch": 1321} {"train_loss": -22.233469009399414, "global_step": 109711, "epoch": 1321} {"train_loss": -21.94182586669922, "global_step": 109712, "epoch": 1321} {"train_loss": -22.010135650634766, "global_step": 109713, "epoch": 1321} {"train_loss": -22.021404266357422, "global_step": 109714, "epoch": 1321} {"train_loss": -22.15163230895996, "global_step": 109715, "epoch": 1321} {"train_loss": -22.155065536499023, "global_step": 109716, "epoch": 1321} {"train_loss": -22.046894073486328, "global_step": 109717, "epoch": 1321} {"train_loss": -22.216856002807617, "global_step": 109718, "epoch": 1321} {"train_loss": -22.316823959350586, "global_step": 109719, "epoch": 1321} {"train_loss": -21.98177719116211, "global_step": 109720, "epoch": 1321} {"train_loss": -22.191633224487305, "global_step": 109721, "epoch": 1321} {"train_loss": -22.231931686401367, "global_step": 109722, "epoch": 1321} {"train_loss": -21.898649215698242, "global_step": 109723, "epoch": 1321} {"train_loss": -22.0797176361084, "global_step": 109724, "epoch": 1321} {"train_loss": -22.198467323578985, "global_step": 109725, "epoch": 1321, "val_loss": 6065514.0} {"train_loss": -22.43901252746582, "global_step": 109726, "epoch": 1322} {"train_loss": -21.94508934020996, "global_step": 109727, "epoch": 1322} {"train_loss": -22.181278228759766, "global_step": 109728, "epoch": 1322} {"train_loss": -21.80051040649414, "global_step": 109729, "epoch": 1322} {"train_loss": -21.867237091064453, "global_step": 109730, "epoch": 1322} {"train_loss": -21.881940841674805, "global_step": 109731, "epoch": 1322} {"train_loss": -21.851337432861328, "global_step": 109732, "epoch": 1322} {"train_loss": -22.361652374267578, "global_step": 109733, "epoch": 1322} {"train_loss": -22.02248764038086, "global_step": 109734, "epoch": 1322} {"train_loss": -22.511186599731445, "global_step": 109735, "epoch": 1322} {"train_loss": -22.325101852416992, "global_step": 109736, "epoch": 1322} {"train_loss": -22.03301429748535, "global_step": 109737, "epoch": 1322} {"train_loss": -22.147432327270508, "global_step": 109738, "epoch": 1322} {"train_loss": -21.75809097290039, "global_step": 109739, "epoch": 1322} {"train_loss": -22.20916748046875, "global_step": 109740, "epoch": 1322} {"train_loss": -22.25212287902832, "global_step": 109741, "epoch": 1322} {"train_loss": -22.377883911132812, "global_step": 109742, "epoch": 1322} {"train_loss": -21.94550132751465, "global_step": 109743, "epoch": 1322} {"train_loss": -22.505022048950195, "global_step": 109744, "epoch": 1322} {"train_loss": -22.318653106689453, "global_step": 109745, "epoch": 1322} {"train_loss": -22.35519790649414, "global_step": 109746, "epoch": 1322} {"train_loss": -22.26978302001953, "global_step": 109747, "epoch": 1322} {"train_loss": -22.319644927978516, "global_step": 109748, "epoch": 1322} {"train_loss": -22.093076705932617, "global_step": 109749, "epoch": 1322} {"train_loss": -22.41316032409668, "global_step": 109750, "epoch": 1322} {"train_loss": -22.031396865844727, "global_step": 109751, "epoch": 1322} {"train_loss": -22.178503036499023, "global_step": 109752, "epoch": 1322} {"train_loss": -22.092172622680664, "global_step": 109753, "epoch": 1322} {"train_loss": -22.145734786987305, "global_step": 109754, "epoch": 1322} {"train_loss": -22.162433624267578, "global_step": 109755, "epoch": 1322} {"train_loss": -22.386756896972656, "global_step": 109756, "epoch": 1322} {"train_loss": -22.379776000976562, "global_step": 109757, "epoch": 1322} {"train_loss": -22.52271842956543, "global_step": 109758, "epoch": 1322} {"train_loss": -21.976186752319336, "global_step": 109759, "epoch": 1322} {"train_loss": -22.174779891967773, "global_step": 109760, "epoch": 1322} {"train_loss": -22.312253952026367, "global_step": 109761, "epoch": 1322} {"train_loss": -22.181072235107422, "global_step": 109762, "epoch": 1322} {"train_loss": -22.28087043762207, "global_step": 109763, "epoch": 1322} {"train_loss": -22.406789779663086, "global_step": 109764, "epoch": 1322} {"train_loss": -22.210134506225586, "global_step": 109765, "epoch": 1322} {"train_loss": -22.39162254333496, "global_step": 109766, "epoch": 1322} {"train_loss": -22.009862899780273, "global_step": 109767, "epoch": 1322} {"train_loss": -22.61283302307129, "global_step": 109768, "epoch": 1322} {"train_loss": -22.346708297729492, "global_step": 109769, "epoch": 1322} {"train_loss": -21.959516525268555, "global_step": 109770, "epoch": 1322} {"train_loss": -22.351579666137695, "global_step": 109771, "epoch": 1322} {"train_loss": -21.92061424255371, "global_step": 109772, "epoch": 1322} {"train_loss": -22.102773666381836, "global_step": 109773, "epoch": 1322} {"train_loss": -22.470075607299805, "global_step": 109774, "epoch": 1322} {"train_loss": -22.196081161499023, "global_step": 109775, "epoch": 1322} {"train_loss": -22.417768478393555, "global_step": 109776, "epoch": 1322} {"train_loss": -22.319835662841797, "global_step": 109777, "epoch": 1322} {"train_loss": -22.067276000976562, "global_step": 109778, "epoch": 1322} {"train_loss": -22.121023178100586, "global_step": 109779, "epoch": 1322} {"train_loss": -21.9968318939209, "global_step": 109780, "epoch": 1322} {"train_loss": -22.08660888671875, "global_step": 109781, "epoch": 1322} {"train_loss": -21.691848754882812, "global_step": 109782, "epoch": 1322} {"train_loss": -22.01151466369629, "global_step": 109783, "epoch": 1322} {"train_loss": -22.085046768188477, "global_step": 109784, "epoch": 1322} {"train_loss": -22.117727279663086, "global_step": 109785, "epoch": 1322} {"train_loss": -22.181848526000977, "global_step": 109786, "epoch": 1322} {"train_loss": -22.121320724487305, "global_step": 109787, "epoch": 1322} {"train_loss": -22.174543380737305, "global_step": 109788, "epoch": 1322} {"train_loss": -22.0355224609375, "global_step": 109789, "epoch": 1322} {"train_loss": -22.32391357421875, "global_step": 109790, "epoch": 1322} {"train_loss": -21.741125106811523, "global_step": 109791, "epoch": 1322} {"train_loss": -22.139982223510742, "global_step": 109792, "epoch": 1322} {"train_loss": -21.97553062438965, "global_step": 109793, "epoch": 1322} {"train_loss": -22.30828857421875, "global_step": 109794, "epoch": 1322} {"train_loss": -22.30689811706543, "global_step": 109795, "epoch": 1322} {"train_loss": -22.344566345214844, "global_step": 109796, "epoch": 1322} {"train_loss": -22.008018493652344, "global_step": 109797, "epoch": 1322} {"train_loss": -21.996301651000977, "global_step": 109798, "epoch": 1322} {"train_loss": -22.53188133239746, "global_step": 109799, "epoch": 1322} {"train_loss": -22.26703453063965, "global_step": 109800, "epoch": 1322} {"train_loss": -22.421249389648438, "global_step": 109801, "epoch": 1322} {"train_loss": -22.363204956054688, "global_step": 109802, "epoch": 1322} {"train_loss": -22.026023864746094, "global_step": 109803, "epoch": 1322} {"train_loss": -22.283105850219727, "global_step": 109804, "epoch": 1322} {"train_loss": -22.297840118408203, "global_step": 109805, "epoch": 1322} {"train_loss": -22.38336181640625, "global_step": 109806, "epoch": 1322} {"train_loss": -22.43851661682129, "global_step": 109807, "epoch": 1322} {"train_loss": -22.190391701388073, "global_step": 109808, "epoch": 1322, "val_loss": 6202276.5} {"train_loss": -21.993993759155273, "global_step": 109809, "epoch": 1323} {"train_loss": -21.157920837402344, "global_step": 109810, "epoch": 1323} {"train_loss": -21.720426559448242, "global_step": 109811, "epoch": 1323} {"train_loss": -22.084060668945312, "global_step": 109812, "epoch": 1323} {"train_loss": -21.859378814697266, "global_step": 109813, "epoch": 1323} {"train_loss": -22.222137451171875, "global_step": 109814, "epoch": 1323} {"train_loss": -22.183500289916992, "global_step": 109815, "epoch": 1323} {"train_loss": -21.95514488220215, "global_step": 109816, "epoch": 1323} {"train_loss": -22.12034797668457, "global_step": 109817, "epoch": 1323} {"train_loss": -22.132829666137695, "global_step": 109818, "epoch": 1323} {"train_loss": -22.025741577148438, "global_step": 109819, "epoch": 1323} {"train_loss": -21.956987380981445, "global_step": 109820, "epoch": 1323} {"train_loss": -22.155494689941406, "global_step": 109821, "epoch": 1323} {"train_loss": -22.00200080871582, "global_step": 109822, "epoch": 1323} {"train_loss": -22.199350357055664, "global_step": 109823, "epoch": 1323} {"train_loss": -21.726404190063477, "global_step": 109824, "epoch": 1323} {"train_loss": -22.333309173583984, "global_step": 109825, "epoch": 1323} {"train_loss": -22.18132209777832, "global_step": 109826, "epoch": 1323} {"train_loss": -22.33576011657715, "global_step": 109827, "epoch": 1323} {"train_loss": -21.967309951782227, "global_step": 109828, "epoch": 1323} {"train_loss": -21.877744674682617, "global_step": 109829, "epoch": 1323} {"train_loss": -22.275373458862305, "global_step": 109830, "epoch": 1323} {"train_loss": -22.205350875854492, "global_step": 109831, "epoch": 1323} {"train_loss": -22.352201461791992, "global_step": 109832, "epoch": 1323} {"train_loss": -22.5223388671875, "global_step": 109833, "epoch": 1323} {"train_loss": -21.805479049682617, "global_step": 109834, "epoch": 1323} {"train_loss": -22.25461196899414, "global_step": 109835, "epoch": 1323} {"train_loss": -22.489267349243164, "global_step": 109836, "epoch": 1323} {"train_loss": -22.193965911865234, "global_step": 109837, "epoch": 1323} {"train_loss": -22.344507217407227, "global_step": 109838, "epoch": 1323} {"train_loss": -22.139453887939453, "global_step": 109839, "epoch": 1323} {"train_loss": -22.294179916381836, "global_step": 109840, "epoch": 1323} {"train_loss": -22.430280685424805, "global_step": 109841, "epoch": 1323} {"train_loss": -22.476634979248047, "global_step": 109842, "epoch": 1323} {"train_loss": -22.05023956298828, "global_step": 109843, "epoch": 1323} {"train_loss": -22.383853912353516, "global_step": 109844, "epoch": 1323} {"train_loss": -22.429237365722656, "global_step": 109845, "epoch": 1323} {"train_loss": -22.177404403686523, "global_step": 109846, "epoch": 1323} {"train_loss": -22.09664535522461, "global_step": 109847, "epoch": 1323} {"train_loss": -22.123661041259766, "global_step": 109848, "epoch": 1323} {"train_loss": -22.09334373474121, "global_step": 109849, "epoch": 1323} {"train_loss": -22.209228515625, "global_step": 109850, "epoch": 1323} {"train_loss": -21.863927841186523, "global_step": 109851, "epoch": 1323} {"train_loss": -22.047245025634766, "global_step": 109852, "epoch": 1323} {"train_loss": -22.281789779663086, "global_step": 109853, "epoch": 1323} {"train_loss": -22.0051326751709, "global_step": 109854, "epoch": 1323} {"train_loss": -22.026248931884766, "global_step": 109855, "epoch": 1323} {"train_loss": -22.18327522277832, "global_step": 109856, "epoch": 1323} {"train_loss": -22.020261764526367, "global_step": 109857, "epoch": 1323} {"train_loss": -22.400806427001953, "global_step": 109858, "epoch": 1323} {"train_loss": -21.937185287475586, "global_step": 109859, "epoch": 1323} {"train_loss": -22.230663299560547, "global_step": 109860, "epoch": 1323} {"train_loss": -22.094409942626953, "global_step": 109861, "epoch": 1323} {"train_loss": -21.641132354736328, "global_step": 109862, "epoch": 1323} {"train_loss": -22.012800216674805, "global_step": 109863, "epoch": 1323} {"train_loss": -22.16643714904785, "global_step": 109864, "epoch": 1323} {"train_loss": -21.917762756347656, "global_step": 109865, "epoch": 1323} {"train_loss": -21.980382919311523, "global_step": 109866, "epoch": 1323} {"train_loss": -22.562597274780273, "global_step": 109867, "epoch": 1323} {"train_loss": -22.170164108276367, "global_step": 109868, "epoch": 1323} {"train_loss": -22.1628475189209, "global_step": 109869, "epoch": 1323} {"train_loss": -22.52451515197754, "global_step": 109870, "epoch": 1323} {"train_loss": -22.117496490478516, "global_step": 109871, "epoch": 1323} {"train_loss": -22.25448989868164, "global_step": 109872, "epoch": 1323} {"train_loss": -22.08919334411621, "global_step": 109873, "epoch": 1323} {"train_loss": -22.25714111328125, "global_step": 109874, "epoch": 1323} {"train_loss": -22.519075393676758, "global_step": 109875, "epoch": 1323} {"train_loss": -22.071203231811523, "global_step": 109876, "epoch": 1323} {"train_loss": -22.4005069732666, "global_step": 109877, "epoch": 1323} {"train_loss": -22.219785690307617, "global_step": 109878, "epoch": 1323} {"train_loss": -22.00908851623535, "global_step": 109879, "epoch": 1323} {"train_loss": -22.305326461791992, "global_step": 109880, "epoch": 1323} {"train_loss": -22.185941696166992, "global_step": 109881, "epoch": 1323} {"train_loss": -22.003875732421875, "global_step": 109882, "epoch": 1323} {"train_loss": -21.997678756713867, "global_step": 109883, "epoch": 1323} {"train_loss": -22.506790161132812, "global_step": 109884, "epoch": 1323} {"train_loss": -22.332624435424805, "global_step": 109885, "epoch": 1323} {"train_loss": -22.35341453552246, "global_step": 109886, "epoch": 1323} {"train_loss": -22.58237648010254, "global_step": 109887, "epoch": 1323} {"train_loss": -22.183597564697266, "global_step": 109888, "epoch": 1323} {"train_loss": -22.114286422729492, "global_step": 109889, "epoch": 1323} {"train_loss": -22.606630325317383, "global_step": 109890, "epoch": 1323} {"train_loss": -22.16159553987434, "global_step": 109891, "epoch": 1323, "val_loss": 6332127.5} {"train_loss": -21.745635986328125, "global_step": 109892, "epoch": 1324} {"train_loss": -21.58733558654785, "global_step": 109893, "epoch": 1324} {"train_loss": -21.768207550048828, "global_step": 109894, "epoch": 1324} {"train_loss": -21.77800750732422, "global_step": 109895, "epoch": 1324} {"train_loss": -21.933908462524414, "global_step": 109896, "epoch": 1324} {"train_loss": -21.947372436523438, "global_step": 109897, "epoch": 1324} {"train_loss": -21.94610023498535, "global_step": 109898, "epoch": 1324} {"train_loss": -22.31795310974121, "global_step": 109899, "epoch": 1324} {"train_loss": -22.00188636779785, "global_step": 109900, "epoch": 1324} {"train_loss": -21.852453231811523, "global_step": 109901, "epoch": 1324} {"train_loss": -22.037649154663086, "global_step": 109902, "epoch": 1324} {"train_loss": -22.203502655029297, "global_step": 109903, "epoch": 1324} {"train_loss": -22.33521842956543, "global_step": 109904, "epoch": 1324} {"train_loss": -21.94151496887207, "global_step": 109905, "epoch": 1324} {"train_loss": -21.74274444580078, "global_step": 109906, "epoch": 1324} {"train_loss": -22.24938201904297, "global_step": 109907, "epoch": 1324} {"train_loss": -21.987058639526367, "global_step": 109908, "epoch": 1324} {"train_loss": -22.32179069519043, "global_step": 109909, "epoch": 1324} {"train_loss": -22.411481857299805, "global_step": 109910, "epoch": 1324} {"train_loss": -22.259675979614258, "global_step": 109911, "epoch": 1324} {"train_loss": -22.292953491210938, "global_step": 109912, "epoch": 1324} {"train_loss": -21.879104614257812, "global_step": 109913, "epoch": 1324} {"train_loss": -22.4370059967041, "global_step": 109914, "epoch": 1324} {"train_loss": -22.193906784057617, "global_step": 109915, "epoch": 1324} {"train_loss": -21.837116241455078, "global_step": 109916, "epoch": 1324} {"train_loss": -22.216001510620117, "global_step": 109917, "epoch": 1324} {"train_loss": -22.141386032104492, "global_step": 109918, "epoch": 1324} {"train_loss": -22.7915096282959, "global_step": 109919, "epoch": 1324} {"train_loss": -22.509281158447266, "global_step": 109920, "epoch": 1324} {"train_loss": -22.23012351989746, "global_step": 109921, "epoch": 1324} {"train_loss": -22.34634780883789, "global_step": 109922, "epoch": 1324} {"train_loss": -22.41101837158203, "global_step": 109923, "epoch": 1324} {"train_loss": -22.079238891601562, "global_step": 109924, "epoch": 1324} {"train_loss": -22.364288330078125, "global_step": 109925, "epoch": 1324} {"train_loss": -22.49020004272461, "global_step": 109926, "epoch": 1324} {"train_loss": -22.035337448120117, "global_step": 109927, "epoch": 1324} {"train_loss": -22.451162338256836, "global_step": 109928, "epoch": 1324} {"train_loss": -22.091873168945312, "global_step": 109929, "epoch": 1324} {"train_loss": -22.02796745300293, "global_step": 109930, "epoch": 1324} {"train_loss": -22.398448944091797, "global_step": 109931, "epoch": 1324} {"train_loss": -22.2816219329834, "global_step": 109932, "epoch": 1324} {"train_loss": -21.84268569946289, "global_step": 109933, "epoch": 1324} {"train_loss": -21.98809242248535, "global_step": 109934, "epoch": 1324} {"train_loss": -22.08089256286621, "global_step": 109935, "epoch": 1324} {"train_loss": -22.147993087768555, "global_step": 109936, "epoch": 1324} {"train_loss": -22.0156192779541, "global_step": 109937, "epoch": 1324} {"train_loss": -22.131895065307617, "global_step": 109938, "epoch": 1324} {"train_loss": -22.29947853088379, "global_step": 109939, "epoch": 1324} {"train_loss": -22.27834129333496, "global_step": 109940, "epoch": 1324} {"train_loss": -22.402286529541016, "global_step": 109941, "epoch": 1324} {"train_loss": -22.007587432861328, "global_step": 109942, "epoch": 1324} {"train_loss": -22.4305419921875, "global_step": 109943, "epoch": 1324} {"train_loss": -22.215747833251953, "global_step": 109944, "epoch": 1324} {"train_loss": -22.083093643188477, "global_step": 109945, "epoch": 1324} {"train_loss": -21.902999877929688, "global_step": 109946, "epoch": 1324} {"train_loss": -22.199005126953125, "global_step": 109947, "epoch": 1324} {"train_loss": -22.02219581604004, "global_step": 109948, "epoch": 1324} {"train_loss": -22.46925926208496, "global_step": 109949, "epoch": 1324} {"train_loss": -22.069589614868164, "global_step": 109950, "epoch": 1324} {"train_loss": -22.38347816467285, "global_step": 109951, "epoch": 1324} {"train_loss": -22.410005569458008, "global_step": 109952, "epoch": 1324} {"train_loss": -22.31544303894043, "global_step": 109953, "epoch": 1324} {"train_loss": -21.953649520874023, "global_step": 109954, "epoch": 1324} {"train_loss": -22.379098892211914, "global_step": 109955, "epoch": 1324} {"train_loss": -22.518558502197266, "global_step": 109956, "epoch": 1324} {"train_loss": -22.35035514831543, "global_step": 109957, "epoch": 1324} {"train_loss": -22.313730239868164, "global_step": 109958, "epoch": 1324} {"train_loss": -22.026334762573242, "global_step": 109959, "epoch": 1324} {"train_loss": -22.55699920654297, "global_step": 109960, "epoch": 1324} {"train_loss": -22.019672393798828, "global_step": 109961, "epoch": 1324} {"train_loss": -22.390310287475586, "global_step": 109962, "epoch": 1324} {"train_loss": -22.117813110351562, "global_step": 109963, "epoch": 1324} {"train_loss": -22.26410675048828, "global_step": 109964, "epoch": 1324} {"train_loss": -22.556318283081055, "global_step": 109965, "epoch": 1324} {"train_loss": -22.124908447265625, "global_step": 109966, "epoch": 1324} {"train_loss": -22.45918083190918, "global_step": 109967, "epoch": 1324} {"train_loss": -21.844839096069336, "global_step": 109968, "epoch": 1324} {"train_loss": -22.37312889099121, "global_step": 109969, "epoch": 1324} {"train_loss": -22.220962524414062, "global_step": 109970, "epoch": 1324} {"train_loss": -21.938974380493164, "global_step": 109971, "epoch": 1324} {"train_loss": -22.319171905517578, "global_step": 109972, "epoch": 1324} {"train_loss": -22.193939208984375, "global_step": 109973, "epoch": 1324} {"train_loss": -22.17507955252406, "global_step": 109974, "epoch": 1324, "val_loss": 6212427.5} {"train_loss": -21.477697372436523, "global_step": 109975, "epoch": 1325} {"train_loss": -21.680776596069336, "global_step": 109976, "epoch": 1325} {"train_loss": -21.82343864440918, "global_step": 109977, "epoch": 1325} {"train_loss": -22.049142837524414, "global_step": 109978, "epoch": 1325} {"train_loss": -22.09914207458496, "global_step": 109979, "epoch": 1325} {"train_loss": -22.122940063476562, "global_step": 109980, "epoch": 1325} {"train_loss": -22.026243209838867, "global_step": 109981, "epoch": 1325} {"train_loss": -21.738037109375, "global_step": 109982, "epoch": 1325} {"train_loss": -22.023910522460938, "global_step": 109983, "epoch": 1325} {"train_loss": -21.58262062072754, "global_step": 109984, "epoch": 1325} {"train_loss": -21.987258911132812, "global_step": 109985, "epoch": 1325} {"train_loss": -22.111133575439453, "global_step": 109986, "epoch": 1325} {"train_loss": -22.464014053344727, "global_step": 109987, "epoch": 1325} {"train_loss": -22.095556259155273, "global_step": 109988, "epoch": 1325} {"train_loss": -22.351194381713867, "global_step": 109989, "epoch": 1325} {"train_loss": -22.162139892578125, "global_step": 109990, "epoch": 1325} {"train_loss": -22.1005916595459, "global_step": 109991, "epoch": 1325} {"train_loss": -22.165769577026367, "global_step": 109992, "epoch": 1325} {"train_loss": -22.195478439331055, "global_step": 109993, "epoch": 1325} {"train_loss": -22.271764755249023, "global_step": 109994, "epoch": 1325} {"train_loss": -22.3962459564209, "global_step": 109995, "epoch": 1325} {"train_loss": -22.447786331176758, "global_step": 109996, "epoch": 1325} {"train_loss": -22.355268478393555, "global_step": 109997, "epoch": 1325} {"train_loss": -22.39637565612793, "global_step": 109998, "epoch": 1325} {"train_loss": -22.067840576171875, "global_step": 109999, "epoch": 1325} {"train_loss": -22.611005783081055, "global_step": 110000, "epoch": 1325} {"train_loss": -22.467451095581055, "global_step": 110001, "epoch": 1325} {"train_loss": -22.43414306640625, "global_step": 110002, "epoch": 1325} {"train_loss": -22.448637008666992, "global_step": 110003, "epoch": 1325} {"train_loss": -22.328683853149414, "global_step": 110004, "epoch": 1325} {"train_loss": -22.323137283325195, "global_step": 110005, "epoch": 1325} {"train_loss": -22.24942970275879, "global_step": 110006, "epoch": 1325} {"train_loss": -22.360065460205078, "global_step": 110007, "epoch": 1325} {"train_loss": -22.290122985839844, "global_step": 110008, "epoch": 1325} {"train_loss": -22.410829544067383, "global_step": 110009, "epoch": 1325} {"train_loss": -22.174890518188477, "global_step": 110010, "epoch": 1325} {"train_loss": -22.18006706237793, "global_step": 110011, "epoch": 1325} {"train_loss": -22.418807983398438, "global_step": 110012, "epoch": 1325} {"train_loss": -22.364774703979492, "global_step": 110013, "epoch": 1325} {"train_loss": -22.33955192565918, "global_step": 110014, "epoch": 1325} {"train_loss": -22.453237533569336, "global_step": 110015, "epoch": 1325} {"train_loss": -22.232900619506836, "global_step": 110016, "epoch": 1325} {"train_loss": -22.172595977783203, "global_step": 110017, "epoch": 1325} {"train_loss": -22.152790069580078, "global_step": 110018, "epoch": 1325} {"train_loss": -21.988651275634766, "global_step": 110019, "epoch": 1325} {"train_loss": -22.057722091674805, "global_step": 110020, "epoch": 1325} {"train_loss": -22.289417266845703, "global_step": 110021, "epoch": 1325} {"train_loss": -22.132434844970703, "global_step": 110022, "epoch": 1325} {"train_loss": -22.34650993347168, "global_step": 110023, "epoch": 1325} {"train_loss": -22.277690887451172, "global_step": 110024, "epoch": 1325} {"train_loss": -22.13931655883789, "global_step": 110025, "epoch": 1325} {"train_loss": -22.552045822143555, "global_step": 110026, "epoch": 1325} {"train_loss": -22.12692642211914, "global_step": 110027, "epoch": 1325} {"train_loss": -22.101743698120117, "global_step": 110028, "epoch": 1325} {"train_loss": -22.220312118530273, "global_step": 110029, "epoch": 1325} {"train_loss": -22.632904052734375, "global_step": 110030, "epoch": 1325} {"train_loss": -22.333070755004883, "global_step": 110031, "epoch": 1325} {"train_loss": -22.240816116333008, "global_step": 110032, "epoch": 1325} {"train_loss": -22.301605224609375, "global_step": 110033, "epoch": 1325} {"train_loss": -22.231582641601562, "global_step": 110034, "epoch": 1325} {"train_loss": -22.32136344909668, "global_step": 110035, "epoch": 1325} {"train_loss": -22.5654296875, "global_step": 110036, "epoch": 1325} {"train_loss": -22.198406219482422, "global_step": 110037, "epoch": 1325} {"train_loss": -22.36820411682129, "global_step": 110038, "epoch": 1325} {"train_loss": -22.28441047668457, "global_step": 110039, "epoch": 1325} {"train_loss": -22.449052810668945, "global_step": 110040, "epoch": 1325} {"train_loss": -22.667800903320312, "global_step": 110041, "epoch": 1325} {"train_loss": -22.083921432495117, "global_step": 110042, "epoch": 1325} {"train_loss": -22.481164932250977, "global_step": 110043, "epoch": 1325} {"train_loss": -22.24249839782715, "global_step": 110044, "epoch": 1325} {"train_loss": -22.472848892211914, "global_step": 110045, "epoch": 1325} {"train_loss": -21.970346450805664, "global_step": 110046, "epoch": 1325} {"train_loss": -22.050771713256836, "global_step": 110047, "epoch": 1325} {"train_loss": -22.12972068786621, "global_step": 110048, "epoch": 1325} {"train_loss": -22.256399154663086, "global_step": 110049, "epoch": 1325} {"train_loss": -22.338848114013672, "global_step": 110050, "epoch": 1325} {"train_loss": -22.54501724243164, "global_step": 110051, "epoch": 1325} {"train_loss": -22.051969528198242, "global_step": 110052, "epoch": 1325} {"train_loss": -22.300561904907227, "global_step": 110053, "epoch": 1325} {"train_loss": -22.256305694580078, "global_step": 110054, "epoch": 1325} {"train_loss": -22.575624465942383, "global_step": 110055, "epoch": 1325} {"train_loss": -22.0953369140625, "global_step": 110056, "epoch": 1325} {"train_loss": -22.26075696370688, "global_step": 110057, "epoch": 1325, "val_loss": 6167092.0} {"train_loss": -22.144954681396484, "global_step": 110058, "epoch": 1326} {"train_loss": -22.400999069213867, "global_step": 110059, "epoch": 1326} {"train_loss": -22.10992431640625, "global_step": 110060, "epoch": 1326} {"train_loss": -21.932897567749023, "global_step": 110061, "epoch": 1326} {"train_loss": -22.318241119384766, "global_step": 110062, "epoch": 1326} {"train_loss": -22.040674209594727, "global_step": 110063, "epoch": 1326} {"train_loss": -22.227766036987305, "global_step": 110064, "epoch": 1326} {"train_loss": -21.75935173034668, "global_step": 110065, "epoch": 1326} {"train_loss": -22.058547973632812, "global_step": 110066, "epoch": 1326} {"train_loss": -22.02913475036621, "global_step": 110067, "epoch": 1326} {"train_loss": -21.98026466369629, "global_step": 110068, "epoch": 1326} {"train_loss": -22.19068717956543, "global_step": 110069, "epoch": 1326} {"train_loss": -21.95832633972168, "global_step": 110070, "epoch": 1326} {"train_loss": -22.81937599182129, "global_step": 110071, "epoch": 1326} {"train_loss": -22.21254539489746, "global_step": 110072, "epoch": 1326} {"train_loss": -22.233219146728516, "global_step": 110073, "epoch": 1326} {"train_loss": -22.027311325073242, "global_step": 110074, "epoch": 1326} {"train_loss": -22.614856719970703, "global_step": 110075, "epoch": 1326} {"train_loss": -22.3076171875, "global_step": 110076, "epoch": 1326} {"train_loss": -22.44593048095703, "global_step": 110077, "epoch": 1326} {"train_loss": -21.889209747314453, "global_step": 110078, "epoch": 1326} {"train_loss": -21.89542579650879, "global_step": 110079, "epoch": 1326} {"train_loss": -22.394102096557617, "global_step": 110080, "epoch": 1326} {"train_loss": -22.2696590423584, "global_step": 110081, "epoch": 1326} {"train_loss": -21.767616271972656, "global_step": 110082, "epoch": 1326} {"train_loss": -22.219343185424805, "global_step": 110083, "epoch": 1326} {"train_loss": -21.904525756835938, "global_step": 110084, "epoch": 1326} {"train_loss": -22.526819229125977, "global_step": 110085, "epoch": 1326} {"train_loss": -22.225061416625977, "global_step": 110086, "epoch": 1326} {"train_loss": -21.9805965423584, "global_step": 110087, "epoch": 1326} {"train_loss": -22.136938095092773, "global_step": 110088, "epoch": 1326} {"train_loss": -22.2243709564209, "global_step": 110089, "epoch": 1326} {"train_loss": -22.340967178344727, "global_step": 110090, "epoch": 1326} {"train_loss": -22.035511016845703, "global_step": 110091, "epoch": 1326} {"train_loss": -21.918575286865234, "global_step": 110092, "epoch": 1326} {"train_loss": -22.20011329650879, "global_step": 110093, "epoch": 1326} {"train_loss": -21.963464736938477, "global_step": 110094, "epoch": 1326} {"train_loss": -21.963138580322266, "global_step": 110095, "epoch": 1326} {"train_loss": -22.24342918395996, "global_step": 110096, "epoch": 1326} {"train_loss": -21.957799911499023, "global_step": 110097, "epoch": 1326} {"train_loss": -22.27651023864746, "global_step": 110098, "epoch": 1326} {"train_loss": -22.135786056518555, "global_step": 110099, "epoch": 1326} {"train_loss": -22.18238639831543, "global_step": 110100, "epoch": 1326} {"train_loss": -22.4258975982666, "global_step": 110101, "epoch": 1326} {"train_loss": -22.39556121826172, "global_step": 110102, "epoch": 1326} {"train_loss": -22.206701278686523, "global_step": 110103, "epoch": 1326} {"train_loss": -22.293249130249023, "global_step": 110104, "epoch": 1326} {"train_loss": -22.52590560913086, "global_step": 110105, "epoch": 1326} {"train_loss": -21.77582550048828, "global_step": 110106, "epoch": 1326} {"train_loss": -22.11152458190918, "global_step": 110107, "epoch": 1326} {"train_loss": -22.02284049987793, "global_step": 110108, "epoch": 1326} {"train_loss": -22.109405517578125, "global_step": 110109, "epoch": 1326} {"train_loss": -21.943374633789062, "global_step": 110110, "epoch": 1326} {"train_loss": -22.20832061767578, "global_step": 110111, "epoch": 1326} {"train_loss": -22.161128997802734, "global_step": 110112, "epoch": 1326} {"train_loss": -22.79513168334961, "global_step": 110113, "epoch": 1326} {"train_loss": -22.27872657775879, "global_step": 110114, "epoch": 1326} {"train_loss": -22.312055587768555, "global_step": 110115, "epoch": 1326} {"train_loss": -21.980398178100586, "global_step": 110116, "epoch": 1326} {"train_loss": -22.6738224029541, "global_step": 110117, "epoch": 1326} {"train_loss": -22.551559448242188, "global_step": 110118, "epoch": 1326} {"train_loss": -22.49028968811035, "global_step": 110119, "epoch": 1326} {"train_loss": -22.145103454589844, "global_step": 110120, "epoch": 1326} {"train_loss": -22.338733673095703, "global_step": 110121, "epoch": 1326} {"train_loss": -22.17301368713379, "global_step": 110122, "epoch": 1326} {"train_loss": -22.347644805908203, "global_step": 110123, "epoch": 1326} {"train_loss": -22.19594383239746, "global_step": 110124, "epoch": 1326} {"train_loss": -22.354644775390625, "global_step": 110125, "epoch": 1326} {"train_loss": -22.38752555847168, "global_step": 110126, "epoch": 1326} {"train_loss": -22.36734962463379, "global_step": 110127, "epoch": 1326} {"train_loss": -22.259716033935547, "global_step": 110128, "epoch": 1326} {"train_loss": -22.296445846557617, "global_step": 110129, "epoch": 1326} {"train_loss": -22.419479370117188, "global_step": 110130, "epoch": 1326} {"train_loss": -22.390501022338867, "global_step": 110131, "epoch": 1326} {"train_loss": -22.36493682861328, "global_step": 110132, "epoch": 1326} {"train_loss": -22.62375831604004, "global_step": 110133, "epoch": 1326} {"train_loss": -22.150392532348633, "global_step": 110134, "epoch": 1326} {"train_loss": -22.353559494018555, "global_step": 110135, "epoch": 1326} {"train_loss": -22.18885612487793, "global_step": 110136, "epoch": 1326} {"train_loss": -22.48046875, "global_step": 110137, "epoch": 1326} {"train_loss": -22.143192291259766, "global_step": 110138, "epoch": 1326} {"train_loss": -22.407499313354492, "global_step": 110139, "epoch": 1326} {"train_loss": -22.216038255806428, "global_step": 110140, "epoch": 1326, "val_loss": 6175521.0} {"train_loss": -21.78374671936035, "global_step": 110141, "epoch": 1327} {"train_loss": -21.392065048217773, "global_step": 110142, "epoch": 1327} {"train_loss": -22.132286071777344, "global_step": 110143, "epoch": 1327} {"train_loss": -21.742828369140625, "global_step": 110144, "epoch": 1327} {"train_loss": -21.998876571655273, "global_step": 110145, "epoch": 1327} {"train_loss": -22.18935775756836, "global_step": 110146, "epoch": 1327} {"train_loss": -21.877765655517578, "global_step": 110147, "epoch": 1327} {"train_loss": -21.785324096679688, "global_step": 110148, "epoch": 1327} {"train_loss": -21.736108779907227, "global_step": 110149, "epoch": 1327} {"train_loss": -21.84528160095215, "global_step": 110150, "epoch": 1327} {"train_loss": -22.2006893157959, "global_step": 110151, "epoch": 1327} {"train_loss": -22.046384811401367, "global_step": 110152, "epoch": 1327} {"train_loss": -21.832006454467773, "global_step": 110153, "epoch": 1327} {"train_loss": -22.1439151763916, "global_step": 110154, "epoch": 1327} {"train_loss": -21.897817611694336, "global_step": 110155, "epoch": 1327} {"train_loss": -21.982580184936523, "global_step": 110156, "epoch": 1327} {"train_loss": -22.120512008666992, "global_step": 110157, "epoch": 1327} {"train_loss": -22.11717414855957, "global_step": 110158, "epoch": 1327} {"train_loss": -22.092618942260742, "global_step": 110159, "epoch": 1327} {"train_loss": -22.048166275024414, "global_step": 110160, "epoch": 1327} {"train_loss": -22.258041381835938, "global_step": 110161, "epoch": 1327} {"train_loss": -22.59625816345215, "global_step": 110162, "epoch": 1327} {"train_loss": -22.188459396362305, "global_step": 110163, "epoch": 1327} {"train_loss": -22.09168243408203, "global_step": 110164, "epoch": 1327} {"train_loss": -22.539093017578125, "global_step": 110165, "epoch": 1327} {"train_loss": -22.130979537963867, "global_step": 110166, "epoch": 1327} {"train_loss": -22.479246139526367, "global_step": 110167, "epoch": 1327} {"train_loss": -22.391189575195312, "global_step": 110168, "epoch": 1327} {"train_loss": -21.973661422729492, "global_step": 110169, "epoch": 1327} {"train_loss": -22.184423446655273, "global_step": 110170, "epoch": 1327} {"train_loss": -22.639484405517578, "global_step": 110171, "epoch": 1327} {"train_loss": -22.388898849487305, "global_step": 110172, "epoch": 1327} {"train_loss": -21.872148513793945, "global_step": 110173, "epoch": 1327} {"train_loss": -22.34625816345215, "global_step": 110174, "epoch": 1327} {"train_loss": -22.311630249023438, "global_step": 110175, "epoch": 1327} {"train_loss": -22.375350952148438, "global_step": 110176, "epoch": 1327} {"train_loss": -22.296329498291016, "global_step": 110177, "epoch": 1327} {"train_loss": -22.007537841796875, "global_step": 110178, "epoch": 1327} {"train_loss": -22.362314224243164, "global_step": 110179, "epoch": 1327} {"train_loss": -22.222867965698242, "global_step": 110180, "epoch": 1327} {"train_loss": -22.04670524597168, "global_step": 110181, "epoch": 1327} {"train_loss": -22.697998046875, "global_step": 110182, "epoch": 1327} {"train_loss": -22.39738655090332, "global_step": 110183, "epoch": 1327} {"train_loss": -22.12911033630371, "global_step": 110184, "epoch": 1327} {"train_loss": -22.474374771118164, "global_step": 110185, "epoch": 1327} {"train_loss": -22.26869010925293, "global_step": 110186, "epoch": 1327} {"train_loss": -21.936277389526367, "global_step": 110187, "epoch": 1327} {"train_loss": -22.178476333618164, "global_step": 110188, "epoch": 1327} {"train_loss": -22.273521423339844, "global_step": 110189, "epoch": 1327} {"train_loss": -22.453439712524414, "global_step": 110190, "epoch": 1327} {"train_loss": -22.620206832885742, "global_step": 110191, "epoch": 1327} {"train_loss": -22.544967651367188, "global_step": 110192, "epoch": 1327} {"train_loss": -22.455808639526367, "global_step": 110193, "epoch": 1327} {"train_loss": -22.326107025146484, "global_step": 110194, "epoch": 1327} {"train_loss": -21.917470932006836, "global_step": 110195, "epoch": 1327} {"train_loss": -22.220823287963867, "global_step": 110196, "epoch": 1327} {"train_loss": -22.328168869018555, "global_step": 110197, "epoch": 1327} {"train_loss": -22.430871963500977, "global_step": 110198, "epoch": 1327} {"train_loss": -22.230432510375977, "global_step": 110199, "epoch": 1327} {"train_loss": -22.17871856689453, "global_step": 110200, "epoch": 1327} {"train_loss": -22.1800479888916, "global_step": 110201, "epoch": 1327} {"train_loss": -22.46107292175293, "global_step": 110202, "epoch": 1327} {"train_loss": -22.57393455505371, "global_step": 110203, "epoch": 1327} {"train_loss": -22.197404861450195, "global_step": 110204, "epoch": 1327} {"train_loss": -22.141244888305664, "global_step": 110205, "epoch": 1327} {"train_loss": -22.247060775756836, "global_step": 110206, "epoch": 1327} {"train_loss": -22.11627769470215, "global_step": 110207, "epoch": 1327} {"train_loss": -22.082612991333008, "global_step": 110208, "epoch": 1327} {"train_loss": -22.3018856048584, "global_step": 110209, "epoch": 1327} {"train_loss": -22.255722045898438, "global_step": 110210, "epoch": 1327} {"train_loss": -21.8405818939209, "global_step": 110211, "epoch": 1327} {"train_loss": -22.24163818359375, "global_step": 110212, "epoch": 1327} {"train_loss": -22.160959243774414, "global_step": 110213, "epoch": 1327} {"train_loss": -22.39215660095215, "global_step": 110214, "epoch": 1327} {"train_loss": -22.334877014160156, "global_step": 110215, "epoch": 1327} {"train_loss": -22.069366455078125, "global_step": 110216, "epoch": 1327} {"train_loss": -22.3554630279541, "global_step": 110217, "epoch": 1327} {"train_loss": -21.817750930786133, "global_step": 110218, "epoch": 1327} {"train_loss": -22.711225509643555, "global_step": 110219, "epoch": 1327} {"train_loss": -21.925588607788086, "global_step": 110220, "epoch": 1327} {"train_loss": -21.933313369750977, "global_step": 110221, "epoch": 1327} {"train_loss": -22.25491714477539, "global_step": 110222, "epoch": 1327} {"train_loss": -22.183845497039428, "global_step": 110223, "epoch": 1327, "val_loss": 6038081.0} {"train_loss": -21.886877059936523, "global_step": 110224, "epoch": 1328} {"train_loss": -22.226703643798828, "global_step": 110225, "epoch": 1328} {"train_loss": -22.299732208251953, "global_step": 110226, "epoch": 1328} {"train_loss": -21.848297119140625, "global_step": 110227, "epoch": 1328} {"train_loss": -21.74623680114746, "global_step": 110228, "epoch": 1328} {"train_loss": -21.515100479125977, "global_step": 110229, "epoch": 1328} {"train_loss": -21.96027946472168, "global_step": 110230, "epoch": 1328} {"train_loss": -22.073835372924805, "global_step": 110231, "epoch": 1328} {"train_loss": -22.176462173461914, "global_step": 110232, "epoch": 1328} {"train_loss": -22.40193748474121, "global_step": 110233, "epoch": 1328} {"train_loss": -22.210803985595703, "global_step": 110234, "epoch": 1328} {"train_loss": -22.17714500427246, "global_step": 110235, "epoch": 1328} {"train_loss": -22.457948684692383, "global_step": 110236, "epoch": 1328} {"train_loss": -21.962034225463867, "global_step": 110237, "epoch": 1328} {"train_loss": -22.174266815185547, "global_step": 110238, "epoch": 1328} {"train_loss": -21.78604507446289, "global_step": 110239, "epoch": 1328} {"train_loss": -21.91883087158203, "global_step": 110240, "epoch": 1328} {"train_loss": -22.122085571289062, "global_step": 110241, "epoch": 1328} {"train_loss": -22.324613571166992, "global_step": 110242, "epoch": 1328} {"train_loss": -22.183181762695312, "global_step": 110243, "epoch": 1328} {"train_loss": -22.410009384155273, "global_step": 110244, "epoch": 1328} {"train_loss": -22.11354637145996, "global_step": 110245, "epoch": 1328} {"train_loss": -22.41904067993164, "global_step": 110246, "epoch": 1328} {"train_loss": -22.623950958251953, "global_step": 110247, "epoch": 1328} {"train_loss": -22.069534301757812, "global_step": 110248, "epoch": 1328} {"train_loss": -22.138416290283203, "global_step": 110249, "epoch": 1328} {"train_loss": -22.203577041625977, "global_step": 110250, "epoch": 1328} {"train_loss": -22.261415481567383, "global_step": 110251, "epoch": 1328} {"train_loss": -22.31912612915039, "global_step": 110252, "epoch": 1328} {"train_loss": -22.577672958374023, "global_step": 110253, "epoch": 1328} {"train_loss": -22.046131134033203, "global_step": 110254, "epoch": 1328} {"train_loss": -22.724306106567383, "global_step": 110255, "epoch": 1328} {"train_loss": -22.095413208007812, "global_step": 110256, "epoch": 1328} {"train_loss": -22.09075355529785, "global_step": 110257, "epoch": 1328} {"train_loss": -22.14996337890625, "global_step": 110258, "epoch": 1328} {"train_loss": -21.918598175048828, "global_step": 110259, "epoch": 1328} {"train_loss": -21.940048217773438, "global_step": 110260, "epoch": 1328} {"train_loss": -22.307294845581055, "global_step": 110261, "epoch": 1328} {"train_loss": -22.130863189697266, "global_step": 110262, "epoch": 1328} {"train_loss": -22.304059982299805, "global_step": 110263, "epoch": 1328} {"train_loss": -22.123218536376953, "global_step": 110264, "epoch": 1328} {"train_loss": -22.3712215423584, "global_step": 110265, "epoch": 1328} {"train_loss": -21.777063369750977, "global_step": 110266, "epoch": 1328} {"train_loss": -22.06830596923828, "global_step": 110267, "epoch": 1328} {"train_loss": -21.920642852783203, "global_step": 110268, "epoch": 1328} {"train_loss": -22.121397018432617, "global_step": 110269, "epoch": 1328} {"train_loss": -22.25861930847168, "global_step": 110270, "epoch": 1328} {"train_loss": -22.36801528930664, "global_step": 110271, "epoch": 1328} {"train_loss": -22.178808212280273, "global_step": 110272, "epoch": 1328} {"train_loss": -22.303770065307617, "global_step": 110273, "epoch": 1328} {"train_loss": -22.24068260192871, "global_step": 110274, "epoch": 1328} {"train_loss": -22.102094650268555, "global_step": 110275, "epoch": 1328} {"train_loss": -22.21793556213379, "global_step": 110276, "epoch": 1328} {"train_loss": -21.820785522460938, "global_step": 110277, "epoch": 1328} {"train_loss": -21.929765701293945, "global_step": 110278, "epoch": 1328} {"train_loss": -22.458118438720703, "global_step": 110279, "epoch": 1328} {"train_loss": -22.349958419799805, "global_step": 110280, "epoch": 1328} {"train_loss": -22.50126075744629, "global_step": 110281, "epoch": 1328} {"train_loss": -21.984350204467773, "global_step": 110282, "epoch": 1328} {"train_loss": -22.340646743774414, "global_step": 110283, "epoch": 1328} {"train_loss": -22.16847801208496, "global_step": 110284, "epoch": 1328} {"train_loss": -22.123262405395508, "global_step": 110285, "epoch": 1328} {"train_loss": -22.008758544921875, "global_step": 110286, "epoch": 1328} {"train_loss": -22.14944839477539, "global_step": 110287, "epoch": 1328} {"train_loss": -22.285425186157227, "global_step": 110288, "epoch": 1328} {"train_loss": -22.248823165893555, "global_step": 110289, "epoch": 1328} {"train_loss": -22.296072006225586, "global_step": 110290, "epoch": 1328} {"train_loss": -22.330196380615234, "global_step": 110291, "epoch": 1328} {"train_loss": -22.235950469970703, "global_step": 110292, "epoch": 1328} {"train_loss": -22.044832229614258, "global_step": 110293, "epoch": 1328} {"train_loss": -22.146360397338867, "global_step": 110294, "epoch": 1328} {"train_loss": -22.40346336364746, "global_step": 110295, "epoch": 1328} {"train_loss": -22.33138084411621, "global_step": 110296, "epoch": 1328} {"train_loss": -22.210285186767578, "global_step": 110297, "epoch": 1328} {"train_loss": -22.480005264282227, "global_step": 110298, "epoch": 1328} {"train_loss": -22.11307144165039, "global_step": 110299, "epoch": 1328} {"train_loss": -21.9215145111084, "global_step": 110300, "epoch": 1328} {"train_loss": -22.408506393432617, "global_step": 110301, "epoch": 1328} {"train_loss": -22.170785903930664, "global_step": 110302, "epoch": 1328} {"train_loss": -22.18428611755371, "global_step": 110303, "epoch": 1328} {"train_loss": -22.171117782592773, "global_step": 110304, "epoch": 1328} {"train_loss": -22.105823516845703, "global_step": 110305, "epoch": 1328} {"train_loss": -22.177238625216198, "global_step": 110306, "epoch": 1328, "val_loss": 6067726.0} {"train_loss": -21.72934913635254, "global_step": 110307, "epoch": 1329} {"train_loss": -21.888879776000977, "global_step": 110308, "epoch": 1329} {"train_loss": -22.084224700927734, "global_step": 110309, "epoch": 1329} {"train_loss": -22.020231246948242, "global_step": 110310, "epoch": 1329} {"train_loss": -22.06659507751465, "global_step": 110311, "epoch": 1329} {"train_loss": -22.28264808654785, "global_step": 110312, "epoch": 1329} {"train_loss": -22.318151473999023, "global_step": 110313, "epoch": 1329} {"train_loss": -22.178327560424805, "global_step": 110314, "epoch": 1329} {"train_loss": -21.987733840942383, "global_step": 110315, "epoch": 1329} {"train_loss": -22.19032096862793, "global_step": 110316, "epoch": 1329} {"train_loss": -22.078855514526367, "global_step": 110317, "epoch": 1329} {"train_loss": -21.814992904663086, "global_step": 110318, "epoch": 1329} {"train_loss": -22.071796417236328, "global_step": 110319, "epoch": 1329} {"train_loss": -21.984193801879883, "global_step": 110320, "epoch": 1329} {"train_loss": -22.03586769104004, "global_step": 110321, "epoch": 1329} {"train_loss": -22.11604881286621, "global_step": 110322, "epoch": 1329} {"train_loss": -22.168384552001953, "global_step": 110323, "epoch": 1329} {"train_loss": -22.691268920898438, "global_step": 110324, "epoch": 1329} {"train_loss": -22.153152465820312, "global_step": 110325, "epoch": 1329} {"train_loss": -22.51944351196289, "global_step": 110326, "epoch": 1329} {"train_loss": -22.177383422851562, "global_step": 110327, "epoch": 1329} {"train_loss": -22.32244110107422, "global_step": 110328, "epoch": 1329} {"train_loss": -22.2591609954834, "global_step": 110329, "epoch": 1329} {"train_loss": -22.30771255493164, "global_step": 110330, "epoch": 1329} {"train_loss": -21.83064079284668, "global_step": 110331, "epoch": 1329} {"train_loss": -22.530256271362305, "global_step": 110332, "epoch": 1329} {"train_loss": -22.140228271484375, "global_step": 110333, "epoch": 1329} {"train_loss": -22.252628326416016, "global_step": 110334, "epoch": 1329} {"train_loss": -22.341129302978516, "global_step": 110335, "epoch": 1329} {"train_loss": -22.03980255126953, "global_step": 110336, "epoch": 1329} {"train_loss": -22.329835891723633, "global_step": 110337, "epoch": 1329} {"train_loss": -22.026290893554688, "global_step": 110338, "epoch": 1329} {"train_loss": -22.15853500366211, "global_step": 110339, "epoch": 1329} {"train_loss": -22.547388076782227, "global_step": 110340, "epoch": 1329} {"train_loss": -22.643573760986328, "global_step": 110341, "epoch": 1329} {"train_loss": -22.132644653320312, "global_step": 110342, "epoch": 1329} {"train_loss": -22.460840225219727, "global_step": 110343, "epoch": 1329} {"train_loss": -22.388229370117188, "global_step": 110344, "epoch": 1329} {"train_loss": -22.37106704711914, "global_step": 110345, "epoch": 1329} {"train_loss": -22.58406639099121, "global_step": 110346, "epoch": 1329} {"train_loss": -22.207332611083984, "global_step": 110347, "epoch": 1329} {"train_loss": -22.155118942260742, "global_step": 110348, "epoch": 1329} {"train_loss": -22.434616088867188, "global_step": 110349, "epoch": 1329} {"train_loss": -22.42232322692871, "global_step": 110350, "epoch": 1329} {"train_loss": -22.1878719329834, "global_step": 110351, "epoch": 1329} {"train_loss": -21.992721557617188, "global_step": 110352, "epoch": 1329} {"train_loss": -22.538185119628906, "global_step": 110353, "epoch": 1329} {"train_loss": -22.518184661865234, "global_step": 110354, "epoch": 1329} {"train_loss": -22.104219436645508, "global_step": 110355, "epoch": 1329} {"train_loss": -22.78375816345215, "global_step": 110356, "epoch": 1329} {"train_loss": -22.065584182739258, "global_step": 110357, "epoch": 1329} {"train_loss": -22.266477584838867, "global_step": 110358, "epoch": 1329} {"train_loss": -22.194141387939453, "global_step": 110359, "epoch": 1329} {"train_loss": -22.3995418548584, "global_step": 110360, "epoch": 1329} {"train_loss": -22.367380142211914, "global_step": 110361, "epoch": 1329} {"train_loss": -22.502140045166016, "global_step": 110362, "epoch": 1329} {"train_loss": -22.106077194213867, "global_step": 110363, "epoch": 1329} {"train_loss": -22.571998596191406, "global_step": 110364, "epoch": 1329} {"train_loss": -22.340505599975586, "global_step": 110365, "epoch": 1329} {"train_loss": -22.720129013061523, "global_step": 110366, "epoch": 1329} {"train_loss": -22.455524444580078, "global_step": 110367, "epoch": 1329} {"train_loss": -21.94527816772461, "global_step": 110368, "epoch": 1329} {"train_loss": -22.68266487121582, "global_step": 110369, "epoch": 1329} {"train_loss": -22.407730102539062, "global_step": 110370, "epoch": 1329} {"train_loss": -22.292089462280273, "global_step": 110371, "epoch": 1329} {"train_loss": -22.2477970123291, "global_step": 110372, "epoch": 1329} {"train_loss": -22.305124282836914, "global_step": 110373, "epoch": 1329} {"train_loss": -22.2779541015625, "global_step": 110374, "epoch": 1329} {"train_loss": -22.4411678314209, "global_step": 110375, "epoch": 1329} {"train_loss": -22.385770797729492, "global_step": 110376, "epoch": 1329} {"train_loss": -22.446298599243164, "global_step": 110377, "epoch": 1329} {"train_loss": -22.121191024780273, "global_step": 110378, "epoch": 1329} {"train_loss": -22.216209411621094, "global_step": 110379, "epoch": 1329} {"train_loss": -22.5019474029541, "global_step": 110380, "epoch": 1329} {"train_loss": -22.032970428466797, "global_step": 110381, "epoch": 1329} {"train_loss": -22.78012466430664, "global_step": 110382, "epoch": 1329} {"train_loss": -22.269229888916016, "global_step": 110383, "epoch": 1329} {"train_loss": -22.06610679626465, "global_step": 110384, "epoch": 1329} {"train_loss": -22.355615615844727, "global_step": 110385, "epoch": 1329} {"train_loss": -22.341175079345703, "global_step": 110386, "epoch": 1329} {"train_loss": -21.804433822631836, "global_step": 110387, "epoch": 1329} {"train_loss": -21.950420379638672, "global_step": 110388, "epoch": 1329} {"train_loss": -22.259426645485753, "global_step": 110389, "epoch": 1329, "val_loss": 6191579.0} {"train_loss": -21.990631103515625, "global_step": 110390, "epoch": 1330} {"train_loss": -22.281213760375977, "global_step": 110391, "epoch": 1330} {"train_loss": -21.966632843017578, "global_step": 110392, "epoch": 1330} {"train_loss": -22.29660415649414, "global_step": 110393, "epoch": 1330} {"train_loss": -22.15829849243164, "global_step": 110394, "epoch": 1330} {"train_loss": -22.081003189086914, "global_step": 110395, "epoch": 1330} {"train_loss": -22.10672378540039, "global_step": 110396, "epoch": 1330} {"train_loss": -21.76215934753418, "global_step": 110397, "epoch": 1330} {"train_loss": -22.162290573120117, "global_step": 110398, "epoch": 1330} {"train_loss": -21.882259368896484, "global_step": 110399, "epoch": 1330} {"train_loss": -21.82771873474121, "global_step": 110400, "epoch": 1330} {"train_loss": -21.983585357666016, "global_step": 110401, "epoch": 1330} {"train_loss": -22.02826499938965, "global_step": 110402, "epoch": 1330} {"train_loss": -22.003589630126953, "global_step": 110403, "epoch": 1330} {"train_loss": -21.83512306213379, "global_step": 110404, "epoch": 1330} {"train_loss": -22.421735763549805, "global_step": 110405, "epoch": 1330} {"train_loss": -22.150297164916992, "global_step": 110406, "epoch": 1330} {"train_loss": -22.317691802978516, "global_step": 110407, "epoch": 1330} {"train_loss": -22.070032119750977, "global_step": 110408, "epoch": 1330} {"train_loss": -22.412527084350586, "global_step": 110409, "epoch": 1330} {"train_loss": -22.020246505737305, "global_step": 110410, "epoch": 1330} {"train_loss": -22.512475967407227, "global_step": 110411, "epoch": 1330} {"train_loss": -21.961267471313477, "global_step": 110412, "epoch": 1330} {"train_loss": -22.340112686157227, "global_step": 110413, "epoch": 1330} {"train_loss": -22.046382904052734, "global_step": 110414, "epoch": 1330} {"train_loss": -22.039173126220703, "global_step": 110415, "epoch": 1330} {"train_loss": -21.634798049926758, "global_step": 110416, "epoch": 1330} {"train_loss": -22.036273956298828, "global_step": 110417, "epoch": 1330} {"train_loss": -22.328954696655273, "global_step": 110418, "epoch": 1330} {"train_loss": -22.478803634643555, "global_step": 110419, "epoch": 1330} {"train_loss": -22.125425338745117, "global_step": 110420, "epoch": 1330} {"train_loss": -21.73941421508789, "global_step": 110421, "epoch": 1330} {"train_loss": -22.136396408081055, "global_step": 110422, "epoch": 1330} {"train_loss": -22.119678497314453, "global_step": 110423, "epoch": 1330} {"train_loss": -22.135007858276367, "global_step": 110424, "epoch": 1330} {"train_loss": -22.128625869750977, "global_step": 110425, "epoch": 1330} {"train_loss": -22.226659774780273, "global_step": 110426, "epoch": 1330} {"train_loss": -22.088132858276367, "global_step": 110427, "epoch": 1330} {"train_loss": -22.767976760864258, "global_step": 110428, "epoch": 1330} {"train_loss": -21.682987213134766, "global_step": 110429, "epoch": 1330} {"train_loss": -22.594839096069336, "global_step": 110430, "epoch": 1330} {"train_loss": -22.559629440307617, "global_step": 110431, "epoch": 1330} {"train_loss": -22.07158088684082, "global_step": 110432, "epoch": 1330} {"train_loss": -22.345849990844727, "global_step": 110433, "epoch": 1330} {"train_loss": -22.34259605407715, "global_step": 110434, "epoch": 1330} {"train_loss": -22.1142520904541, "global_step": 110435, "epoch": 1330} {"train_loss": -22.20503807067871, "global_step": 110436, "epoch": 1330} {"train_loss": -22.257118225097656, "global_step": 110437, "epoch": 1330} {"train_loss": -22.493024826049805, "global_step": 110438, "epoch": 1330} {"train_loss": -22.294233322143555, "global_step": 110439, "epoch": 1330} {"train_loss": -22.010339736938477, "global_step": 110440, "epoch": 1330} {"train_loss": -22.272491455078125, "global_step": 110441, "epoch": 1330} {"train_loss": -22.315750122070312, "global_step": 110442, "epoch": 1330} {"train_loss": -22.170560836791992, "global_step": 110443, "epoch": 1330} {"train_loss": -22.443090438842773, "global_step": 110444, "epoch": 1330} {"train_loss": -22.419965744018555, "global_step": 110445, "epoch": 1330} {"train_loss": -22.5221004486084, "global_step": 110446, "epoch": 1330} {"train_loss": -22.445249557495117, "global_step": 110447, "epoch": 1330} {"train_loss": -22.45172691345215, "global_step": 110448, "epoch": 1330} {"train_loss": -22.444833755493164, "global_step": 110449, "epoch": 1330} {"train_loss": -22.508228302001953, "global_step": 110450, "epoch": 1330} {"train_loss": -22.417461395263672, "global_step": 110451, "epoch": 1330} {"train_loss": -22.28325653076172, "global_step": 110452, "epoch": 1330} {"train_loss": -22.41291046142578, "global_step": 110453, "epoch": 1330} {"train_loss": -22.501083374023438, "global_step": 110454, "epoch": 1330} {"train_loss": -22.54576873779297, "global_step": 110455, "epoch": 1330} {"train_loss": -22.229278564453125, "global_step": 110456, "epoch": 1330} {"train_loss": -22.193958282470703, "global_step": 110457, "epoch": 1330} {"train_loss": -22.686107635498047, "global_step": 110458, "epoch": 1330} {"train_loss": -22.018085479736328, "global_step": 110459, "epoch": 1330} {"train_loss": -22.094144821166992, "global_step": 110460, "epoch": 1330} {"train_loss": -22.018625259399414, "global_step": 110461, "epoch": 1330} {"train_loss": -22.147743225097656, "global_step": 110462, "epoch": 1330} {"train_loss": -21.938016891479492, "global_step": 110463, "epoch": 1330} {"train_loss": -21.80323028564453, "global_step": 110464, "epoch": 1330} {"train_loss": -21.941287994384766, "global_step": 110465, "epoch": 1330} {"train_loss": -21.853622436523438, "global_step": 110466, "epoch": 1330} {"train_loss": -22.21617889404297, "global_step": 110467, "epoch": 1330} {"train_loss": -22.241174697875977, "global_step": 110468, "epoch": 1330} {"train_loss": -22.01488494873047, "global_step": 110469, "epoch": 1330} {"train_loss": -22.33780288696289, "global_step": 110470, "epoch": 1330} {"train_loss": -22.1835880279541, "global_step": 110471, "epoch": 1330} {"train_loss": -22.199211051665156, "global_step": 110472, "epoch": 1330, "val_loss": 6098484.0} {"train_loss": -21.364322662353516, "global_step": 110473, "epoch": 1331} {"train_loss": -21.773252487182617, "global_step": 110474, "epoch": 1331} {"train_loss": -21.51930046081543, "global_step": 110475, "epoch": 1331} {"train_loss": -21.350980758666992, "global_step": 110476, "epoch": 1331} {"train_loss": -21.587141036987305, "global_step": 110477, "epoch": 1331} {"train_loss": -22.098876953125, "global_step": 110478, "epoch": 1331} {"train_loss": -21.47942543029785, "global_step": 110479, "epoch": 1331} {"train_loss": -22.003433227539062, "global_step": 110480, "epoch": 1331} {"train_loss": -21.826536178588867, "global_step": 110481, "epoch": 1331} {"train_loss": -21.927444458007812, "global_step": 110482, "epoch": 1331} {"train_loss": -21.852468490600586, "global_step": 110483, "epoch": 1331} {"train_loss": -21.824045181274414, "global_step": 110484, "epoch": 1331} {"train_loss": -21.808292388916016, "global_step": 110485, "epoch": 1331} {"train_loss": -21.400009155273438, "global_step": 110486, "epoch": 1331} {"train_loss": -21.69239616394043, "global_step": 110487, "epoch": 1331} {"train_loss": -22.075536727905273, "global_step": 110488, "epoch": 1331} {"train_loss": -22.428848266601562, "global_step": 110489, "epoch": 1331} {"train_loss": -21.635696411132812, "global_step": 110490, "epoch": 1331} {"train_loss": -21.984556198120117, "global_step": 110491, "epoch": 1331} {"train_loss": -22.00516128540039, "global_step": 110492, "epoch": 1331} {"train_loss": -22.255847930908203, "global_step": 110493, "epoch": 1331} {"train_loss": -22.057336807250977, "global_step": 110494, "epoch": 1331} {"train_loss": -22.127527236938477, "global_step": 110495, "epoch": 1331} {"train_loss": -22.30223846435547, "global_step": 110496, "epoch": 1331} {"train_loss": -22.18745994567871, "global_step": 110497, "epoch": 1331} {"train_loss": -22.10390281677246, "global_step": 110498, "epoch": 1331} {"train_loss": -22.28313446044922, "global_step": 110499, "epoch": 1331} {"train_loss": -22.3701229095459, "global_step": 110500, "epoch": 1331} {"train_loss": -21.99946403503418, "global_step": 110501, "epoch": 1331} {"train_loss": -21.87785530090332, "global_step": 110502, "epoch": 1331} {"train_loss": -22.03281021118164, "global_step": 110503, "epoch": 1331} {"train_loss": -22.326433181762695, "global_step": 110504, "epoch": 1331} {"train_loss": -22.07221794128418, "global_step": 110505, "epoch": 1331} {"train_loss": -22.2181453704834, "global_step": 110506, "epoch": 1331} {"train_loss": -22.52547264099121, "global_step": 110507, "epoch": 1331} {"train_loss": -22.327922821044922, "global_step": 110508, "epoch": 1331} {"train_loss": -21.956815719604492, "global_step": 110509, "epoch": 1331} {"train_loss": -22.37840461730957, "global_step": 110510, "epoch": 1331} {"train_loss": -22.307348251342773, "global_step": 110511, "epoch": 1331} {"train_loss": -22.631103515625, "global_step": 110512, "epoch": 1331} {"train_loss": -22.062179565429688, "global_step": 110513, "epoch": 1331} {"train_loss": -22.211965560913086, "global_step": 110514, "epoch": 1331} {"train_loss": -22.024477005004883, "global_step": 110515, "epoch": 1331} {"train_loss": -22.613630294799805, "global_step": 110516, "epoch": 1331} {"train_loss": -21.93438720703125, "global_step": 110517, "epoch": 1331} {"train_loss": -22.383821487426758, "global_step": 110518, "epoch": 1331} {"train_loss": -22.157821655273438, "global_step": 110519, "epoch": 1331} {"train_loss": -22.402353286743164, "global_step": 110520, "epoch": 1331} {"train_loss": -22.362323760986328, "global_step": 110521, "epoch": 1331} {"train_loss": -22.17669677734375, "global_step": 110522, "epoch": 1331} {"train_loss": -21.90865135192871, "global_step": 110523, "epoch": 1331} {"train_loss": -21.99819564819336, "global_step": 110524, "epoch": 1331} {"train_loss": -21.952268600463867, "global_step": 110525, "epoch": 1331} {"train_loss": -22.065107345581055, "global_step": 110526, "epoch": 1331} {"train_loss": -22.139240264892578, "global_step": 110527, "epoch": 1331} {"train_loss": -22.233205795288086, "global_step": 110528, "epoch": 1331} {"train_loss": -22.037372589111328, "global_step": 110529, "epoch": 1331} {"train_loss": -22.53223991394043, "global_step": 110530, "epoch": 1331} {"train_loss": -22.214628219604492, "global_step": 110531, "epoch": 1331} {"train_loss": -22.122663497924805, "global_step": 110532, "epoch": 1331} {"train_loss": -21.911392211914062, "global_step": 110533, "epoch": 1331} {"train_loss": -22.206857681274414, "global_step": 110534, "epoch": 1331} {"train_loss": -22.315767288208008, "global_step": 110535, "epoch": 1331} {"train_loss": -22.50941276550293, "global_step": 110536, "epoch": 1331} {"train_loss": -22.267297744750977, "global_step": 110537, "epoch": 1331} {"train_loss": -22.25065040588379, "global_step": 110538, "epoch": 1331} {"train_loss": -22.20494842529297, "global_step": 110539, "epoch": 1331} {"train_loss": -22.26546287536621, "global_step": 110540, "epoch": 1331} {"train_loss": -22.201461791992188, "global_step": 110541, "epoch": 1331} {"train_loss": -21.897939682006836, "global_step": 110542, "epoch": 1331} {"train_loss": -22.50691032409668, "global_step": 110543, "epoch": 1331} {"train_loss": -22.23708152770996, "global_step": 110544, "epoch": 1331} {"train_loss": -22.418289184570312, "global_step": 110545, "epoch": 1331} {"train_loss": -22.27520179748535, "global_step": 110546, "epoch": 1331} {"train_loss": -22.119659423828125, "global_step": 110547, "epoch": 1331} {"train_loss": -22.09222984313965, "global_step": 110548, "epoch": 1331} {"train_loss": -22.1127872467041, "global_step": 110549, "epoch": 1331} {"train_loss": -21.849355697631836, "global_step": 110550, "epoch": 1331} {"train_loss": -22.14126968383789, "global_step": 110551, "epoch": 1331} {"train_loss": -22.34028434753418, "global_step": 110552, "epoch": 1331} {"train_loss": -22.18521499633789, "global_step": 110553, "epoch": 1331} {"train_loss": -22.275785446166992, "global_step": 110554, "epoch": 1331} {"train_loss": -22.080583756228528, "global_step": 110555, "epoch": 1331, "val_loss": 6165294.5} {"train_loss": -22.231868743896484, "global_step": 110556, "epoch": 1332} {"train_loss": -21.727142333984375, "global_step": 110557, "epoch": 1332} {"train_loss": -22.35359001159668, "global_step": 110558, "epoch": 1332} {"train_loss": -22.390716552734375, "global_step": 110559, "epoch": 1332} {"train_loss": -22.109312057495117, "global_step": 110560, "epoch": 1332} {"train_loss": -22.159536361694336, "global_step": 110561, "epoch": 1332} {"train_loss": -22.28016471862793, "global_step": 110562, "epoch": 1332} {"train_loss": -22.476478576660156, "global_step": 110563, "epoch": 1332} {"train_loss": -22.53736686706543, "global_step": 110564, "epoch": 1332} {"train_loss": -22.60268211364746, "global_step": 110565, "epoch": 1332} {"train_loss": -22.20429801940918, "global_step": 110566, "epoch": 1332} {"train_loss": -22.190860748291016, "global_step": 110567, "epoch": 1332} {"train_loss": -22.33381462097168, "global_step": 110568, "epoch": 1332} {"train_loss": -22.64627456665039, "global_step": 110569, "epoch": 1332} {"train_loss": -22.469030380249023, "global_step": 110570, "epoch": 1332} {"train_loss": -22.174942016601562, "global_step": 110571, "epoch": 1332} {"train_loss": -22.387821197509766, "global_step": 110572, "epoch": 1332} {"train_loss": -22.039077758789062, "global_step": 110573, "epoch": 1332} {"train_loss": -22.436704635620117, "global_step": 110574, "epoch": 1332} {"train_loss": -22.250253677368164, "global_step": 110575, "epoch": 1332} {"train_loss": -22.216516494750977, "global_step": 110576, "epoch": 1332} {"train_loss": -22.323762893676758, "global_step": 110577, "epoch": 1332} {"train_loss": -21.991392135620117, "global_step": 110578, "epoch": 1332} {"train_loss": -22.034748077392578, "global_step": 110579, "epoch": 1332} {"train_loss": -21.896154403686523, "global_step": 110580, "epoch": 1332} {"train_loss": -22.447980880737305, "global_step": 110581, "epoch": 1332} {"train_loss": -22.02879524230957, "global_step": 110582, "epoch": 1332} {"train_loss": -21.98615074157715, "global_step": 110583, "epoch": 1332} {"train_loss": -22.266098022460938, "global_step": 110584, "epoch": 1332} {"train_loss": -22.051923751831055, "global_step": 110585, "epoch": 1332} {"train_loss": -22.48114585876465, "global_step": 110586, "epoch": 1332} {"train_loss": -21.829580307006836, "global_step": 110587, "epoch": 1332} {"train_loss": -22.599477767944336, "global_step": 110588, "epoch": 1332} {"train_loss": -22.482458114624023, "global_step": 110589, "epoch": 1332} {"train_loss": -22.06114387512207, "global_step": 110590, "epoch": 1332} {"train_loss": -22.397817611694336, "global_step": 110591, "epoch": 1332} {"train_loss": -22.271406173706055, "global_step": 110592, "epoch": 1332} {"train_loss": -22.094100952148438, "global_step": 110593, "epoch": 1332} {"train_loss": -22.569711685180664, "global_step": 110594, "epoch": 1332} {"train_loss": -22.529926300048828, "global_step": 110595, "epoch": 1332} {"train_loss": -22.770565032958984, "global_step": 110596, "epoch": 1332} {"train_loss": -22.521581649780273, "global_step": 110597, "epoch": 1332} {"train_loss": -22.327802658081055, "global_step": 110598, "epoch": 1332} {"train_loss": -22.336973190307617, "global_step": 110599, "epoch": 1332} {"train_loss": -21.98945426940918, "global_step": 110600, "epoch": 1332} {"train_loss": -22.209522247314453, "global_step": 110601, "epoch": 1332} {"train_loss": -22.355125427246094, "global_step": 110602, "epoch": 1332} {"train_loss": -22.191791534423828, "global_step": 110603, "epoch": 1332} {"train_loss": -22.297569274902344, "global_step": 110604, "epoch": 1332} {"train_loss": -22.235754013061523, "global_step": 110605, "epoch": 1332} {"train_loss": -22.361181259155273, "global_step": 110606, "epoch": 1332} {"train_loss": -22.103286743164062, "global_step": 110607, "epoch": 1332} {"train_loss": -22.571752548217773, "global_step": 110608, "epoch": 1332} {"train_loss": -22.002866744995117, "global_step": 110609, "epoch": 1332} {"train_loss": -22.30694580078125, "global_step": 110610, "epoch": 1332} {"train_loss": -22.622711181640625, "global_step": 110611, "epoch": 1332} {"train_loss": -22.260208129882812, "global_step": 110612, "epoch": 1332} {"train_loss": -22.498205184936523, "global_step": 110613, "epoch": 1332} {"train_loss": -21.998689651489258, "global_step": 110614, "epoch": 1332} {"train_loss": -22.290891647338867, "global_step": 110615, "epoch": 1332} {"train_loss": -22.33910369873047, "global_step": 110616, "epoch": 1332} {"train_loss": -22.041522979736328, "global_step": 110617, "epoch": 1332} {"train_loss": -22.465497970581055, "global_step": 110618, "epoch": 1332} {"train_loss": -22.46869468688965, "global_step": 110619, "epoch": 1332} {"train_loss": -22.032764434814453, "global_step": 110620, "epoch": 1332} {"train_loss": -22.4039249420166, "global_step": 110621, "epoch": 1332} {"train_loss": -22.258665084838867, "global_step": 110622, "epoch": 1332} {"train_loss": -22.260061264038086, "global_step": 110623, "epoch": 1332} {"train_loss": -22.40397071838379, "global_step": 110624, "epoch": 1332} {"train_loss": -22.483970642089844, "global_step": 110625, "epoch": 1332} {"train_loss": -22.1531982421875, "global_step": 110626, "epoch": 1332} {"train_loss": -22.121225357055664, "global_step": 110627, "epoch": 1332} {"train_loss": -22.19764518737793, "global_step": 110628, "epoch": 1332} {"train_loss": -22.18714714050293, "global_step": 110629, "epoch": 1332} {"train_loss": -21.911529541015625, "global_step": 110630, "epoch": 1332} {"train_loss": -22.201269149780273, "global_step": 110631, "epoch": 1332} {"train_loss": -22.476865768432617, "global_step": 110632, "epoch": 1332} {"train_loss": -22.407594680786133, "global_step": 110633, "epoch": 1332} {"train_loss": -22.190143585205078, "global_step": 110634, "epoch": 1332} {"train_loss": -22.274499893188477, "global_step": 110635, "epoch": 1332} {"train_loss": -22.350406646728516, "global_step": 110636, "epoch": 1332} {"train_loss": -22.173709869384766, "global_step": 110637, "epoch": 1332} {"train_loss": -22.284848109785333, "global_step": 110638, "epoch": 1332, "val_loss": 6243728.5} {"train_loss": -21.394651412963867, "global_step": 110639, "epoch": 1333} {"train_loss": -22.259998321533203, "global_step": 110640, "epoch": 1333} {"train_loss": -21.951980590820312, "global_step": 110641, "epoch": 1333} {"train_loss": -21.808807373046875, "global_step": 110642, "epoch": 1333} {"train_loss": -21.894012451171875, "global_step": 110643, "epoch": 1333} {"train_loss": -21.74897575378418, "global_step": 110644, "epoch": 1333} {"train_loss": -22.05801010131836, "global_step": 110645, "epoch": 1333} {"train_loss": -21.98626136779785, "global_step": 110646, "epoch": 1333} {"train_loss": -22.12025260925293, "global_step": 110647, "epoch": 1333} {"train_loss": -22.089202880859375, "global_step": 110648, "epoch": 1333} {"train_loss": -21.83611488342285, "global_step": 110649, "epoch": 1333} {"train_loss": -22.440942764282227, "global_step": 110650, "epoch": 1333} {"train_loss": -22.06390380859375, "global_step": 110651, "epoch": 1333} {"train_loss": -21.91613006591797, "global_step": 110652, "epoch": 1333} {"train_loss": -21.952407836914062, "global_step": 110653, "epoch": 1333} {"train_loss": -22.3944091796875, "global_step": 110654, "epoch": 1333} {"train_loss": -22.456344604492188, "global_step": 110655, "epoch": 1333} {"train_loss": -22.228193283081055, "global_step": 110656, "epoch": 1333} {"train_loss": -22.266286849975586, "global_step": 110657, "epoch": 1333} {"train_loss": -22.251001358032227, "global_step": 110658, "epoch": 1333} {"train_loss": -22.508352279663086, "global_step": 110659, "epoch": 1333} {"train_loss": -22.35982322692871, "global_step": 110660, "epoch": 1333} {"train_loss": -22.160049438476562, "global_step": 110661, "epoch": 1333} {"train_loss": -22.222721099853516, "global_step": 110662, "epoch": 1333} {"train_loss": -22.4671630859375, "global_step": 110663, "epoch": 1333} {"train_loss": -22.462949752807617, "global_step": 110664, "epoch": 1333} {"train_loss": -22.14164161682129, "global_step": 110665, "epoch": 1333} {"train_loss": -22.340850830078125, "global_step": 110666, "epoch": 1333} {"train_loss": -22.215776443481445, "global_step": 110667, "epoch": 1333} {"train_loss": -22.307966232299805, "global_step": 110668, "epoch": 1333} {"train_loss": -22.17746353149414, "global_step": 110669, "epoch": 1333} {"train_loss": -22.63497543334961, "global_step": 110670, "epoch": 1333} {"train_loss": -22.645307540893555, "global_step": 110671, "epoch": 1333} {"train_loss": -21.91847038269043, "global_step": 110672, "epoch": 1333} {"train_loss": -22.162504196166992, "global_step": 110673, "epoch": 1333} {"train_loss": -22.184009552001953, "global_step": 110674, "epoch": 1333} {"train_loss": -22.445789337158203, "global_step": 110675, "epoch": 1333} {"train_loss": -21.985626220703125, "global_step": 110676, "epoch": 1333} {"train_loss": -21.974929809570312, "global_step": 110677, "epoch": 1333} {"train_loss": -22.310611724853516, "global_step": 110678, "epoch": 1333} {"train_loss": -22.384571075439453, "global_step": 110679, "epoch": 1333} {"train_loss": -22.227636337280273, "global_step": 110680, "epoch": 1333} {"train_loss": -22.103857040405273, "global_step": 110681, "epoch": 1333} {"train_loss": -22.30901527404785, "global_step": 110682, "epoch": 1333} {"train_loss": -22.1625919342041, "global_step": 110683, "epoch": 1333} {"train_loss": -22.290470123291016, "global_step": 110684, "epoch": 1333} {"train_loss": -22.171661376953125, "global_step": 110685, "epoch": 1333} {"train_loss": -22.205900192260742, "global_step": 110686, "epoch": 1333} {"train_loss": -22.418861389160156, "global_step": 110687, "epoch": 1333} {"train_loss": -22.26628875732422, "global_step": 110688, "epoch": 1333} {"train_loss": -22.307565689086914, "global_step": 110689, "epoch": 1333} {"train_loss": -22.465330123901367, "global_step": 110690, "epoch": 1333} {"train_loss": -22.424551010131836, "global_step": 110691, "epoch": 1333} {"train_loss": -22.526660919189453, "global_step": 110692, "epoch": 1333} {"train_loss": -22.034513473510742, "global_step": 110693, "epoch": 1333} {"train_loss": -22.312088012695312, "global_step": 110694, "epoch": 1333} {"train_loss": -22.098365783691406, "global_step": 110695, "epoch": 1333} {"train_loss": -22.404953002929688, "global_step": 110696, "epoch": 1333} {"train_loss": -22.197505950927734, "global_step": 110697, "epoch": 1333} {"train_loss": -22.4255313873291, "global_step": 110698, "epoch": 1333} {"train_loss": -22.42239761352539, "global_step": 110699, "epoch": 1333} {"train_loss": -22.522314071655273, "global_step": 110700, "epoch": 1333} {"train_loss": -22.535995483398438, "global_step": 110701, "epoch": 1333} {"train_loss": -22.324146270751953, "global_step": 110702, "epoch": 1333} {"train_loss": -22.330524444580078, "global_step": 110703, "epoch": 1333} {"train_loss": -22.296798706054688, "global_step": 110704, "epoch": 1333} {"train_loss": -22.359182357788086, "global_step": 110705, "epoch": 1333} {"train_loss": -22.312923431396484, "global_step": 110706, "epoch": 1333} {"train_loss": -22.35120964050293, "global_step": 110707, "epoch": 1333} {"train_loss": -22.382551193237305, "global_step": 110708, "epoch": 1333} {"train_loss": -22.514169692993164, "global_step": 110709, "epoch": 1333} {"train_loss": -22.176868438720703, "global_step": 110710, "epoch": 1333} {"train_loss": -22.045438766479492, "global_step": 110711, "epoch": 1333} {"train_loss": -22.45485496520996, "global_step": 110712, "epoch": 1333} {"train_loss": -22.289756774902344, "global_step": 110713, "epoch": 1333} {"train_loss": -22.397626876831055, "global_step": 110714, "epoch": 1333} {"train_loss": -22.316267013549805, "global_step": 110715, "epoch": 1333} {"train_loss": -22.21600341796875, "global_step": 110716, "epoch": 1333} {"train_loss": -22.267057418823242, "global_step": 110717, "epoch": 1333} {"train_loss": -22.131452560424805, "global_step": 110718, "epoch": 1333} {"train_loss": -22.389692306518555, "global_step": 110719, "epoch": 1333} {"train_loss": -21.97059440612793, "global_step": 110720, "epoch": 1333} {"train_loss": -22.23054559546781, "global_step": 110721, "epoch": 1333, "val_loss": 6112578.0} {"train_loss": -20.8216495513916, "global_step": 110722, "epoch": 1334} {"train_loss": -21.777780532836914, "global_step": 110723, "epoch": 1334} {"train_loss": -21.400283813476562, "global_step": 110724, "epoch": 1334} {"train_loss": -21.543594360351562, "global_step": 110725, "epoch": 1334} {"train_loss": -21.307449340820312, "global_step": 110726, "epoch": 1334} {"train_loss": -21.08173942565918, "global_step": 110727, "epoch": 1334} {"train_loss": -21.27045249938965, "global_step": 110728, "epoch": 1334} {"train_loss": -21.673765182495117, "global_step": 110729, "epoch": 1334} {"train_loss": -21.643529891967773, "global_step": 110730, "epoch": 1334} {"train_loss": -21.523900985717773, "global_step": 110731, "epoch": 1334} {"train_loss": -21.775836944580078, "global_step": 110732, "epoch": 1334} {"train_loss": -21.815948486328125, "global_step": 110733, "epoch": 1334} {"train_loss": -21.440549850463867, "global_step": 110734, "epoch": 1334} {"train_loss": -21.92784881591797, "global_step": 110735, "epoch": 1334} {"train_loss": -21.716581344604492, "global_step": 110736, "epoch": 1334} {"train_loss": -21.589252471923828, "global_step": 110737, "epoch": 1334} {"train_loss": -21.861433029174805, "global_step": 110738, "epoch": 1334} {"train_loss": -21.756118774414062, "global_step": 110739, "epoch": 1334} {"train_loss": -21.8707332611084, "global_step": 110740, "epoch": 1334} {"train_loss": -22.038604736328125, "global_step": 110741, "epoch": 1334} {"train_loss": -21.662519454956055, "global_step": 110742, "epoch": 1334} {"train_loss": -21.94980812072754, "global_step": 110743, "epoch": 1334} {"train_loss": -21.83197593688965, "global_step": 110744, "epoch": 1334} {"train_loss": -22.025726318359375, "global_step": 110745, "epoch": 1334} {"train_loss": -22.05487060546875, "global_step": 110746, "epoch": 1334} {"train_loss": -22.041990280151367, "global_step": 110747, "epoch": 1334} {"train_loss": -21.831228256225586, "global_step": 110748, "epoch": 1334} {"train_loss": -21.88360023498535, "global_step": 110749, "epoch": 1334} {"train_loss": -21.81793212890625, "global_step": 110750, "epoch": 1334} {"train_loss": -22.182409286499023, "global_step": 110751, "epoch": 1334} {"train_loss": -21.88239097595215, "global_step": 110752, "epoch": 1334} {"train_loss": -22.0773868560791, "global_step": 110753, "epoch": 1334} {"train_loss": -21.927093505859375, "global_step": 110754, "epoch": 1334} {"train_loss": -22.295284271240234, "global_step": 110755, "epoch": 1334} {"train_loss": -21.955331802368164, "global_step": 110756, "epoch": 1334} {"train_loss": -21.85824966430664, "global_step": 110757, "epoch": 1334} {"train_loss": -22.06464195251465, "global_step": 110758, "epoch": 1334} {"train_loss": -22.141918182373047, "global_step": 110759, "epoch": 1334} {"train_loss": -21.935787200927734, "global_step": 110760, "epoch": 1334} {"train_loss": -22.32882308959961, "global_step": 110761, "epoch": 1334} {"train_loss": -22.549116134643555, "global_step": 110762, "epoch": 1334} {"train_loss": -22.339000701904297, "global_step": 110763, "epoch": 1334} {"train_loss": -22.194034576416016, "global_step": 110764, "epoch": 1334} {"train_loss": -22.05018424987793, "global_step": 110765, "epoch": 1334} {"train_loss": -22.417814254760742, "global_step": 110766, "epoch": 1334} {"train_loss": -21.982635498046875, "global_step": 110767, "epoch": 1334} {"train_loss": -21.89029884338379, "global_step": 110768, "epoch": 1334} {"train_loss": -22.568256378173828, "global_step": 110769, "epoch": 1334} {"train_loss": -21.70159912109375, "global_step": 110770, "epoch": 1334} {"train_loss": -21.65203285217285, "global_step": 110771, "epoch": 1334} {"train_loss": -22.12788963317871, "global_step": 110772, "epoch": 1334} {"train_loss": -22.512893676757812, "global_step": 110773, "epoch": 1334} {"train_loss": -22.382387161254883, "global_step": 110774, "epoch": 1334} {"train_loss": -22.32529067993164, "global_step": 110775, "epoch": 1334} {"train_loss": -21.739009857177734, "global_step": 110776, "epoch": 1334} {"train_loss": -21.97919464111328, "global_step": 110777, "epoch": 1334} {"train_loss": -22.28278923034668, "global_step": 110778, "epoch": 1334} {"train_loss": -21.9392147064209, "global_step": 110779, "epoch": 1334} {"train_loss": -22.287357330322266, "global_step": 110780, "epoch": 1334} {"train_loss": -22.359283447265625, "global_step": 110781, "epoch": 1334} {"train_loss": -22.143726348876953, "global_step": 110782, "epoch": 1334} {"train_loss": -22.19581413269043, "global_step": 110783, "epoch": 1334} {"train_loss": -22.184919357299805, "global_step": 110784, "epoch": 1334} {"train_loss": -22.070072174072266, "global_step": 110785, "epoch": 1334} {"train_loss": -22.040611267089844, "global_step": 110786, "epoch": 1334} {"train_loss": -22.401655197143555, "global_step": 110787, "epoch": 1334} {"train_loss": -22.121814727783203, "global_step": 110788, "epoch": 1334} {"train_loss": -22.415958404541016, "global_step": 110789, "epoch": 1334} {"train_loss": -22.271825790405273, "global_step": 110790, "epoch": 1334} {"train_loss": -22.290699005126953, "global_step": 110791, "epoch": 1334} {"train_loss": -22.517879486083984, "global_step": 110792, "epoch": 1334} {"train_loss": -22.415592193603516, "global_step": 110793, "epoch": 1334} {"train_loss": -22.26555061340332, "global_step": 110794, "epoch": 1334} {"train_loss": -22.278913497924805, "global_step": 110795, "epoch": 1334} {"train_loss": -22.0048770904541, "global_step": 110796, "epoch": 1334} {"train_loss": -21.921865463256836, "global_step": 110797, "epoch": 1334} {"train_loss": -22.522350311279297, "global_step": 110798, "epoch": 1334} {"train_loss": -21.9713191986084, "global_step": 110799, "epoch": 1334} {"train_loss": -21.547077178955078, "global_step": 110800, "epoch": 1334} {"train_loss": -22.28240394592285, "global_step": 110801, "epoch": 1334} {"train_loss": -22.126623153686523, "global_step": 110802, "epoch": 1334} {"train_loss": -22.165931701660156, "global_step": 110803, "epoch": 1334} {"train_loss": -21.991786014602845, "global_step": 110804, "epoch": 1334, "val_loss": 6210932.5} {"train_loss": -22.17081069946289, "global_step": 110805, "epoch": 1335} {"train_loss": -21.727977752685547, "global_step": 110806, "epoch": 1335} {"train_loss": -22.114500045776367, "global_step": 110807, "epoch": 1335} {"train_loss": -21.789657592773438, "global_step": 110808, "epoch": 1335} {"train_loss": -21.55691909790039, "global_step": 110809, "epoch": 1335} {"train_loss": -22.01199722290039, "global_step": 110810, "epoch": 1335} {"train_loss": -22.38010597229004, "global_step": 110811, "epoch": 1335} {"train_loss": -21.781963348388672, "global_step": 110812, "epoch": 1335} {"train_loss": -21.82297134399414, "global_step": 110813, "epoch": 1335} {"train_loss": -21.857519149780273, "global_step": 110814, "epoch": 1335} {"train_loss": -22.3365535736084, "global_step": 110815, "epoch": 1335} {"train_loss": -22.073740005493164, "global_step": 110816, "epoch": 1335} {"train_loss": -22.097972869873047, "global_step": 110817, "epoch": 1335} {"train_loss": -22.197595596313477, "global_step": 110818, "epoch": 1335} {"train_loss": -21.928319931030273, "global_step": 110819, "epoch": 1335} {"train_loss": -22.246158599853516, "global_step": 110820, "epoch": 1335} {"train_loss": -21.866811752319336, "global_step": 110821, "epoch": 1335} {"train_loss": -22.184873580932617, "global_step": 110822, "epoch": 1335} {"train_loss": -22.366029739379883, "global_step": 110823, "epoch": 1335} {"train_loss": -22.245285034179688, "global_step": 110824, "epoch": 1335} {"train_loss": -22.230836868286133, "global_step": 110825, "epoch": 1335} {"train_loss": -22.194595336914062, "global_step": 110826, "epoch": 1335} {"train_loss": -22.269420623779297, "global_step": 110827, "epoch": 1335} {"train_loss": -22.384586334228516, "global_step": 110828, "epoch": 1335} {"train_loss": -22.308691024780273, "global_step": 110829, "epoch": 1335} {"train_loss": -22.276548385620117, "global_step": 110830, "epoch": 1335} {"train_loss": -22.58064079284668, "global_step": 110831, "epoch": 1335} {"train_loss": -22.267560958862305, "global_step": 110832, "epoch": 1335} {"train_loss": -22.739532470703125, "global_step": 110833, "epoch": 1335} {"train_loss": -22.23285484313965, "global_step": 110834, "epoch": 1335} {"train_loss": -22.050207138061523, "global_step": 110835, "epoch": 1335} {"train_loss": -22.202299118041992, "global_step": 110836, "epoch": 1335} {"train_loss": -22.315256118774414, "global_step": 110837, "epoch": 1335} {"train_loss": -22.142534255981445, "global_step": 110838, "epoch": 1335} {"train_loss": -22.32245445251465, "global_step": 110839, "epoch": 1335} {"train_loss": -22.390090942382812, "global_step": 110840, "epoch": 1335} {"train_loss": -21.853221893310547, "global_step": 110841, "epoch": 1335} {"train_loss": -22.079008102416992, "global_step": 110842, "epoch": 1335} {"train_loss": -21.913976669311523, "global_step": 110843, "epoch": 1335} {"train_loss": -22.371042251586914, "global_step": 110844, "epoch": 1335} {"train_loss": -22.183515548706055, "global_step": 110845, "epoch": 1335} {"train_loss": -22.221548080444336, "global_step": 110846, "epoch": 1335} {"train_loss": -22.508825302124023, "global_step": 110847, "epoch": 1335} {"train_loss": -22.131938934326172, "global_step": 110848, "epoch": 1335} {"train_loss": -22.204355239868164, "global_step": 110849, "epoch": 1335} {"train_loss": -21.598024368286133, "global_step": 110850, "epoch": 1335} {"train_loss": -22.29750633239746, "global_step": 110851, "epoch": 1335} {"train_loss": -21.80633544921875, "global_step": 110852, "epoch": 1335} {"train_loss": -22.267486572265625, "global_step": 110853, "epoch": 1335} {"train_loss": -22.359548568725586, "global_step": 110854, "epoch": 1335} {"train_loss": -22.185699462890625, "global_step": 110855, "epoch": 1335} {"train_loss": -22.44124412536621, "global_step": 110856, "epoch": 1335} {"train_loss": -22.158184051513672, "global_step": 110857, "epoch": 1335} {"train_loss": -22.1904296875, "global_step": 110858, "epoch": 1335} {"train_loss": -22.54267692565918, "global_step": 110859, "epoch": 1335} {"train_loss": -21.944364547729492, "global_step": 110860, "epoch": 1335} {"train_loss": -22.086654663085938, "global_step": 110861, "epoch": 1335} {"train_loss": -22.424701690673828, "global_step": 110862, "epoch": 1335} {"train_loss": -21.982946395874023, "global_step": 110863, "epoch": 1335} {"train_loss": -22.391651153564453, "global_step": 110864, "epoch": 1335} {"train_loss": -22.1928768157959, "global_step": 110865, "epoch": 1335} {"train_loss": -22.470895767211914, "global_step": 110866, "epoch": 1335} {"train_loss": -22.303009033203125, "global_step": 110867, "epoch": 1335} {"train_loss": -22.226734161376953, "global_step": 110868, "epoch": 1335} {"train_loss": -22.524412155151367, "global_step": 110869, "epoch": 1335} {"train_loss": -22.101884841918945, "global_step": 110870, "epoch": 1335} {"train_loss": -22.56974983215332, "global_step": 110871, "epoch": 1335} {"train_loss": -21.72426414489746, "global_step": 110872, "epoch": 1335} {"train_loss": -22.315759658813477, "global_step": 110873, "epoch": 1335} {"train_loss": -22.049413681030273, "global_step": 110874, "epoch": 1335} {"train_loss": -22.771169662475586, "global_step": 110875, "epoch": 1335} {"train_loss": -22.131114959716797, "global_step": 110876, "epoch": 1335} {"train_loss": -22.149160385131836, "global_step": 110877, "epoch": 1335} {"train_loss": -22.22086524963379, "global_step": 110878, "epoch": 1335} {"train_loss": -22.162504196166992, "global_step": 110879, "epoch": 1335} {"train_loss": -22.419879913330078, "global_step": 110880, "epoch": 1335} {"train_loss": -22.33260154724121, "global_step": 110881, "epoch": 1335} {"train_loss": -22.153676986694336, "global_step": 110882, "epoch": 1335} {"train_loss": -22.347816467285156, "global_step": 110883, "epoch": 1335} {"train_loss": -22.42214012145996, "global_step": 110884, "epoch": 1335} {"train_loss": -22.198522567749023, "global_step": 110885, "epoch": 1335} {"train_loss": -22.2200984954834, "global_step": 110886, "epoch": 1335} {"train_loss": -22.18595251979598, "global_step": 110887, "epoch": 1335, "val_loss": 6141099.0} {"train_loss": -21.63824462890625, "global_step": 110888, "epoch": 1336} {"train_loss": -22.225723266601562, "global_step": 110889, "epoch": 1336} {"train_loss": -21.723508834838867, "global_step": 110890, "epoch": 1336} {"train_loss": -22.21953582763672, "global_step": 110891, "epoch": 1336} {"train_loss": -21.909652709960938, "global_step": 110892, "epoch": 1336} {"train_loss": -21.966066360473633, "global_step": 110893, "epoch": 1336} {"train_loss": -22.33782386779785, "global_step": 110894, "epoch": 1336} {"train_loss": -21.557388305664062, "global_step": 110895, "epoch": 1336} {"train_loss": -22.04783058166504, "global_step": 110896, "epoch": 1336} {"train_loss": -22.202293395996094, "global_step": 110897, "epoch": 1336} {"train_loss": -22.103384017944336, "global_step": 110898, "epoch": 1336} {"train_loss": -22.21299171447754, "global_step": 110899, "epoch": 1336} {"train_loss": -22.256898880004883, "global_step": 110900, "epoch": 1336} {"train_loss": -21.51975440979004, "global_step": 110901, "epoch": 1336} {"train_loss": -21.9910888671875, "global_step": 110902, "epoch": 1336} {"train_loss": -21.991374969482422, "global_step": 110903, "epoch": 1336} {"train_loss": -22.089879989624023, "global_step": 110904, "epoch": 1336} {"train_loss": -21.940441131591797, "global_step": 110905, "epoch": 1336} {"train_loss": -22.13709831237793, "global_step": 110906, "epoch": 1336} {"train_loss": -22.450878143310547, "global_step": 110907, "epoch": 1336} {"train_loss": -22.18126678466797, "global_step": 110908, "epoch": 1336} {"train_loss": -22.22885513305664, "global_step": 110909, "epoch": 1336} {"train_loss": -22.141592025756836, "global_step": 110910, "epoch": 1336} {"train_loss": -22.107603073120117, "global_step": 110911, "epoch": 1336} {"train_loss": -22.153867721557617, "global_step": 110912, "epoch": 1336} {"train_loss": -22.036157608032227, "global_step": 110913, "epoch": 1336} {"train_loss": -21.923654556274414, "global_step": 110914, "epoch": 1336} {"train_loss": -22.075345993041992, "global_step": 110915, "epoch": 1336} {"train_loss": -22.39691162109375, "global_step": 110916, "epoch": 1336} {"train_loss": -22.00239372253418, "global_step": 110917, "epoch": 1336} {"train_loss": -22.259286880493164, "global_step": 110918, "epoch": 1336} {"train_loss": -22.423620223999023, "global_step": 110919, "epoch": 1336} {"train_loss": -22.0738582611084, "global_step": 110920, "epoch": 1336} {"train_loss": -22.40289306640625, "global_step": 110921, "epoch": 1336} {"train_loss": -22.374032974243164, "global_step": 110922, "epoch": 1336} {"train_loss": -22.09573745727539, "global_step": 110923, "epoch": 1336} {"train_loss": -22.58426856994629, "global_step": 110924, "epoch": 1336} {"train_loss": -22.25920295715332, "global_step": 110925, "epoch": 1336} {"train_loss": -21.999107360839844, "global_step": 110926, "epoch": 1336} {"train_loss": -22.13454246520996, "global_step": 110927, "epoch": 1336} {"train_loss": -22.091798782348633, "global_step": 110928, "epoch": 1336} {"train_loss": -22.357385635375977, "global_step": 110929, "epoch": 1336} {"train_loss": -22.916709899902344, "global_step": 110930, "epoch": 1336} {"train_loss": -22.457212448120117, "global_step": 110931, "epoch": 1336} {"train_loss": -22.440078735351562, "global_step": 110932, "epoch": 1336} {"train_loss": -21.934661865234375, "global_step": 110933, "epoch": 1336} {"train_loss": -22.088546752929688, "global_step": 110934, "epoch": 1336} {"train_loss": -22.444156646728516, "global_step": 110935, "epoch": 1336} {"train_loss": -22.55340003967285, "global_step": 110936, "epoch": 1336} {"train_loss": -22.272132873535156, "global_step": 110937, "epoch": 1336} {"train_loss": -22.267898559570312, "global_step": 110938, "epoch": 1336} {"train_loss": -22.423917770385742, "global_step": 110939, "epoch": 1336} {"train_loss": -22.196876525878906, "global_step": 110940, "epoch": 1336} {"train_loss": -22.386987686157227, "global_step": 110941, "epoch": 1336} {"train_loss": -22.24357032775879, "global_step": 110942, "epoch": 1336} {"train_loss": -22.274587631225586, "global_step": 110943, "epoch": 1336} {"train_loss": -22.451932907104492, "global_step": 110944, "epoch": 1336} {"train_loss": -22.333284378051758, "global_step": 110945, "epoch": 1336} {"train_loss": -22.109893798828125, "global_step": 110946, "epoch": 1336} {"train_loss": -22.053922653198242, "global_step": 110947, "epoch": 1336} {"train_loss": -22.415969848632812, "global_step": 110948, "epoch": 1336} {"train_loss": -21.97823143005371, "global_step": 110949, "epoch": 1336} {"train_loss": -22.09002685546875, "global_step": 110950, "epoch": 1336} {"train_loss": -22.074560165405273, "global_step": 110951, "epoch": 1336} {"train_loss": -22.4023494720459, "global_step": 110952, "epoch": 1336} {"train_loss": -22.211942672729492, "global_step": 110953, "epoch": 1336} {"train_loss": -22.371967315673828, "global_step": 110954, "epoch": 1336} {"train_loss": -22.4657039642334, "global_step": 110955, "epoch": 1336} {"train_loss": -22.057401657104492, "global_step": 110956, "epoch": 1336} {"train_loss": -22.330026626586914, "global_step": 110957, "epoch": 1336} {"train_loss": -22.18922233581543, "global_step": 110958, "epoch": 1336} {"train_loss": -22.53248405456543, "global_step": 110959, "epoch": 1336} {"train_loss": -22.438945770263672, "global_step": 110960, "epoch": 1336} {"train_loss": -22.6878662109375, "global_step": 110961, "epoch": 1336} {"train_loss": -22.5476131439209, "global_step": 110962, "epoch": 1336} {"train_loss": -22.502880096435547, "global_step": 110963, "epoch": 1336} {"train_loss": -22.771202087402344, "global_step": 110964, "epoch": 1336} {"train_loss": -22.005924224853516, "global_step": 110965, "epoch": 1336} {"train_loss": -22.0526180267334, "global_step": 110966, "epoch": 1336} {"train_loss": -22.384069442749023, "global_step": 110967, "epoch": 1336} {"train_loss": -22.44474220275879, "global_step": 110968, "epoch": 1336} {"train_loss": -22.512582778930664, "global_step": 110969, "epoch": 1336} {"train_loss": -22.22492560421128, "global_step": 110970, "epoch": 1336, "val_loss": 6198943.5} {"train_loss": -21.77398109436035, "global_step": 110971, "epoch": 1337} {"train_loss": -20.818044662475586, "global_step": 110972, "epoch": 1337} {"train_loss": -21.541112899780273, "global_step": 110973, "epoch": 1337} {"train_loss": -21.990568161010742, "global_step": 110974, "epoch": 1337} {"train_loss": -21.65810203552246, "global_step": 110975, "epoch": 1337} {"train_loss": -21.7545166015625, "global_step": 110976, "epoch": 1337} {"train_loss": -21.771434783935547, "global_step": 110977, "epoch": 1337} {"train_loss": -21.920000076293945, "global_step": 110978, "epoch": 1337} {"train_loss": -21.91059112548828, "global_step": 110979, "epoch": 1337} {"train_loss": -21.831085205078125, "global_step": 110980, "epoch": 1337} {"train_loss": -22.0194149017334, "global_step": 110981, "epoch": 1337} {"train_loss": -22.10854148864746, "global_step": 110982, "epoch": 1337} {"train_loss": -21.935209274291992, "global_step": 110983, "epoch": 1337} {"train_loss": -22.134437561035156, "global_step": 110984, "epoch": 1337} {"train_loss": -21.957792282104492, "global_step": 110985, "epoch": 1337} {"train_loss": -21.745691299438477, "global_step": 110986, "epoch": 1337} {"train_loss": -22.217435836791992, "global_step": 110987, "epoch": 1337} {"train_loss": -22.364545822143555, "global_step": 110988, "epoch": 1337} {"train_loss": -21.86774253845215, "global_step": 110989, "epoch": 1337} {"train_loss": -22.015872955322266, "global_step": 110990, "epoch": 1337} {"train_loss": -21.924253463745117, "global_step": 110991, "epoch": 1337} {"train_loss": -21.95185089111328, "global_step": 110992, "epoch": 1337} {"train_loss": -22.063814163208008, "global_step": 110993, "epoch": 1337} {"train_loss": -22.317142486572266, "global_step": 110994, "epoch": 1337} {"train_loss": -22.033935546875, "global_step": 110995, "epoch": 1337} {"train_loss": -22.37623405456543, "global_step": 110996, "epoch": 1337} {"train_loss": -22.479408264160156, "global_step": 110997, "epoch": 1337} {"train_loss": -22.258136749267578, "global_step": 110998, "epoch": 1337} {"train_loss": -22.251697540283203, "global_step": 110999, "epoch": 1337} {"train_loss": -21.59065055847168, "global_step": 111000, "epoch": 1337} {"train_loss": -22.347867965698242, "global_step": 111001, "epoch": 1337} {"train_loss": -22.05377769470215, "global_step": 111002, "epoch": 1337} {"train_loss": -22.29478645324707, "global_step": 111003, "epoch": 1337} {"train_loss": -22.414451599121094, "global_step": 111004, "epoch": 1337} {"train_loss": -21.872404098510742, "global_step": 111005, "epoch": 1337} {"train_loss": -22.205129623413086, "global_step": 111006, "epoch": 1337} {"train_loss": -22.410232543945312, "global_step": 111007, "epoch": 1337} {"train_loss": -22.415311813354492, "global_step": 111008, "epoch": 1337} {"train_loss": -22.47188949584961, "global_step": 111009, "epoch": 1337} {"train_loss": -22.676639556884766, "global_step": 111010, "epoch": 1337} {"train_loss": -22.483163833618164, "global_step": 111011, "epoch": 1337} {"train_loss": -21.77420425415039, "global_step": 111012, "epoch": 1337} {"train_loss": -22.480512619018555, "global_step": 111013, "epoch": 1337} {"train_loss": -22.248275756835938, "global_step": 111014, "epoch": 1337} {"train_loss": -21.947290420532227, "global_step": 111015, "epoch": 1337} {"train_loss": -22.63741111755371, "global_step": 111016, "epoch": 1337} {"train_loss": -22.153608322143555, "global_step": 111017, "epoch": 1337} {"train_loss": -22.17603874206543, "global_step": 111018, "epoch": 1337} {"train_loss": -21.80451202392578, "global_step": 111019, "epoch": 1337} {"train_loss": -22.454975128173828, "global_step": 111020, "epoch": 1337} {"train_loss": -22.435693740844727, "global_step": 111021, "epoch": 1337} {"train_loss": -22.146530151367188, "global_step": 111022, "epoch": 1337} {"train_loss": -22.196500778198242, "global_step": 111023, "epoch": 1337} {"train_loss": -21.913461685180664, "global_step": 111024, "epoch": 1337} {"train_loss": -22.14962387084961, "global_step": 111025, "epoch": 1337} {"train_loss": -22.270023345947266, "global_step": 111026, "epoch": 1337} {"train_loss": -21.871417999267578, "global_step": 111027, "epoch": 1337} {"train_loss": -22.2199649810791, "global_step": 111028, "epoch": 1337} {"train_loss": -22.31952476501465, "global_step": 111029, "epoch": 1337} {"train_loss": -21.84381675720215, "global_step": 111030, "epoch": 1337} {"train_loss": -22.36709976196289, "global_step": 111031, "epoch": 1337} {"train_loss": -22.179636001586914, "global_step": 111032, "epoch": 1337} {"train_loss": -22.32996940612793, "global_step": 111033, "epoch": 1337} {"train_loss": -22.536670684814453, "global_step": 111034, "epoch": 1337} {"train_loss": -21.756160736083984, "global_step": 111035, "epoch": 1337} {"train_loss": -22.303192138671875, "global_step": 111036, "epoch": 1337} {"train_loss": -22.655790328979492, "global_step": 111037, "epoch": 1337} {"train_loss": -22.25048828125, "global_step": 111038, "epoch": 1337} {"train_loss": -21.99022674560547, "global_step": 111039, "epoch": 1337} {"train_loss": -22.41773796081543, "global_step": 111040, "epoch": 1337} {"train_loss": -22.072250366210938, "global_step": 111041, "epoch": 1337} {"train_loss": -21.95339584350586, "global_step": 111042, "epoch": 1337} {"train_loss": -21.966745376586914, "global_step": 111043, "epoch": 1337} {"train_loss": -22.438940048217773, "global_step": 111044, "epoch": 1337} {"train_loss": -22.23624038696289, "global_step": 111045, "epoch": 1337} {"train_loss": -22.012752532958984, "global_step": 111046, "epoch": 1337} {"train_loss": -22.597091674804688, "global_step": 111047, "epoch": 1337} {"train_loss": -22.321496963500977, "global_step": 111048, "epoch": 1337} {"train_loss": -22.480587005615234, "global_step": 111049, "epoch": 1337} {"train_loss": -21.91688346862793, "global_step": 111050, "epoch": 1337} {"train_loss": -22.18717384338379, "global_step": 111051, "epoch": 1337} {"train_loss": -22.507314682006836, "global_step": 111052, "epoch": 1337} {"train_loss": -22.139988818800592, "global_step": 111053, "epoch": 1337, "val_loss": 6217817.5} {"train_loss": -21.620262145996094, "global_step": 111054, "epoch": 1338} {"train_loss": -21.743595123291016, "global_step": 111055, "epoch": 1338} {"train_loss": -21.725154876708984, "global_step": 111056, "epoch": 1338} {"train_loss": -22.00449562072754, "global_step": 111057, "epoch": 1338} {"train_loss": -21.650781631469727, "global_step": 111058, "epoch": 1338} {"train_loss": -21.64111328125, "global_step": 111059, "epoch": 1338} {"train_loss": -22.096113204956055, "global_step": 111060, "epoch": 1338} {"train_loss": -22.11154556274414, "global_step": 111061, "epoch": 1338} {"train_loss": -21.935405731201172, "global_step": 111062, "epoch": 1338} {"train_loss": -21.86683464050293, "global_step": 111063, "epoch": 1338} {"train_loss": -22.111242294311523, "global_step": 111064, "epoch": 1338} {"train_loss": -22.078144073486328, "global_step": 111065, "epoch": 1338} {"train_loss": -21.961050033569336, "global_step": 111066, "epoch": 1338} {"train_loss": -22.214927673339844, "global_step": 111067, "epoch": 1338} {"train_loss": -22.04991340637207, "global_step": 111068, "epoch": 1338} {"train_loss": -22.02530288696289, "global_step": 111069, "epoch": 1338} {"train_loss": -21.85761070251465, "global_step": 111070, "epoch": 1338} {"train_loss": -21.971113204956055, "global_step": 111071, "epoch": 1338} {"train_loss": -22.32283592224121, "global_step": 111072, "epoch": 1338} {"train_loss": -21.87436866760254, "global_step": 111073, "epoch": 1338} {"train_loss": -21.764432907104492, "global_step": 111074, "epoch": 1338} {"train_loss": -22.15134048461914, "global_step": 111075, "epoch": 1338} {"train_loss": -21.715335845947266, "global_step": 111076, "epoch": 1338} {"train_loss": -21.969419479370117, "global_step": 111077, "epoch": 1338} {"train_loss": -22.187042236328125, "global_step": 111078, "epoch": 1338} {"train_loss": -22.565763473510742, "global_step": 111079, "epoch": 1338} {"train_loss": -22.049840927124023, "global_step": 111080, "epoch": 1338} {"train_loss": -22.451292037963867, "global_step": 111081, "epoch": 1338} {"train_loss": -22.498414993286133, "global_step": 111082, "epoch": 1338} {"train_loss": -22.041873931884766, "global_step": 111083, "epoch": 1338} {"train_loss": -22.42214584350586, "global_step": 111084, "epoch": 1338} {"train_loss": -22.530094146728516, "global_step": 111085, "epoch": 1338} {"train_loss": -22.343210220336914, "global_step": 111086, "epoch": 1338} {"train_loss": -22.47881507873535, "global_step": 111087, "epoch": 1338} {"train_loss": -22.113157272338867, "global_step": 111088, "epoch": 1338} {"train_loss": -22.320602416992188, "global_step": 111089, "epoch": 1338} {"train_loss": -22.15279197692871, "global_step": 111090, "epoch": 1338} {"train_loss": -22.477825164794922, "global_step": 111091, "epoch": 1338} {"train_loss": -22.295682907104492, "global_step": 111092, "epoch": 1338} {"train_loss": -21.727100372314453, "global_step": 111093, "epoch": 1338} {"train_loss": -22.493444442749023, "global_step": 111094, "epoch": 1338} {"train_loss": -22.44822120666504, "global_step": 111095, "epoch": 1338} {"train_loss": -22.406620025634766, "global_step": 111096, "epoch": 1338} {"train_loss": -22.374343872070312, "global_step": 111097, "epoch": 1338} {"train_loss": -22.215534210205078, "global_step": 111098, "epoch": 1338} {"train_loss": -22.085447311401367, "global_step": 111099, "epoch": 1338} {"train_loss": -22.574974060058594, "global_step": 111100, "epoch": 1338} {"train_loss": -22.330326080322266, "global_step": 111101, "epoch": 1338} {"train_loss": -22.576892852783203, "global_step": 111102, "epoch": 1338} {"train_loss": -22.51739501953125, "global_step": 111103, "epoch": 1338} {"train_loss": -22.37653350830078, "global_step": 111104, "epoch": 1338} {"train_loss": -22.15984535217285, "global_step": 111105, "epoch": 1338} {"train_loss": -22.258472442626953, "global_step": 111106, "epoch": 1338} {"train_loss": -22.375526428222656, "global_step": 111107, "epoch": 1338} {"train_loss": -22.254030227661133, "global_step": 111108, "epoch": 1338} {"train_loss": -22.465925216674805, "global_step": 111109, "epoch": 1338} {"train_loss": -22.129535675048828, "global_step": 111110, "epoch": 1338} {"train_loss": -22.072315216064453, "global_step": 111111, "epoch": 1338} {"train_loss": -22.534351348876953, "global_step": 111112, "epoch": 1338} {"train_loss": -22.38405418395996, "global_step": 111113, "epoch": 1338} {"train_loss": -22.03070640563965, "global_step": 111114, "epoch": 1338} {"train_loss": -22.22899627685547, "global_step": 111115, "epoch": 1338} {"train_loss": -22.026527404785156, "global_step": 111116, "epoch": 1338} {"train_loss": -22.382192611694336, "global_step": 111117, "epoch": 1338} {"train_loss": -22.361637115478516, "global_step": 111118, "epoch": 1338} {"train_loss": -22.22825050354004, "global_step": 111119, "epoch": 1338} {"train_loss": -22.27231788635254, "global_step": 111120, "epoch": 1338} {"train_loss": -22.314130783081055, "global_step": 111121, "epoch": 1338} {"train_loss": -22.248537063598633, "global_step": 111122, "epoch": 1338} {"train_loss": -21.658313751220703, "global_step": 111123, "epoch": 1338} {"train_loss": -22.146804809570312, "global_step": 111124, "epoch": 1338} {"train_loss": -22.199451446533203, "global_step": 111125, "epoch": 1338} {"train_loss": -21.833728790283203, "global_step": 111126, "epoch": 1338} {"train_loss": -21.823057174682617, "global_step": 111127, "epoch": 1338} {"train_loss": -22.27008628845215, "global_step": 111128, "epoch": 1338} {"train_loss": -22.090213775634766, "global_step": 111129, "epoch": 1338} {"train_loss": -22.24867057800293, "global_step": 111130, "epoch": 1338} {"train_loss": -22.317407608032227, "global_step": 111131, "epoch": 1338} {"train_loss": -21.582443237304688, "global_step": 111132, "epoch": 1338} {"train_loss": -22.198720932006836, "global_step": 111133, "epoch": 1338} {"train_loss": -21.636760711669922, "global_step": 111134, "epoch": 1338} {"train_loss": -21.819522857666016, "global_step": 111135, "epoch": 1338} {"train_loss": -22.149079058543744, "global_step": 111136, "epoch": 1338, "val_loss": 6154951.0} {"train_loss": -21.48223304748535, "global_step": 111137, "epoch": 1339} {"train_loss": -22.22344970703125, "global_step": 111138, "epoch": 1339} {"train_loss": -21.829008102416992, "global_step": 111139, "epoch": 1339} {"train_loss": -21.88558006286621, "global_step": 111140, "epoch": 1339} {"train_loss": -21.92535400390625, "global_step": 111141, "epoch": 1339} {"train_loss": -22.10475730895996, "global_step": 111142, "epoch": 1339} {"train_loss": -22.244415283203125, "global_step": 111143, "epoch": 1339} {"train_loss": -22.151498794555664, "global_step": 111144, "epoch": 1339} {"train_loss": -22.207672119140625, "global_step": 111145, "epoch": 1339} {"train_loss": -22.29889488220215, "global_step": 111146, "epoch": 1339} {"train_loss": -22.2878475189209, "global_step": 111147, "epoch": 1339} {"train_loss": -21.876813888549805, "global_step": 111148, "epoch": 1339} {"train_loss": -22.315710067749023, "global_step": 111149, "epoch": 1339} {"train_loss": -22.209341049194336, "global_step": 111150, "epoch": 1339} {"train_loss": -22.650373458862305, "global_step": 111151, "epoch": 1339} {"train_loss": -22.10700798034668, "global_step": 111152, "epoch": 1339} {"train_loss": -22.094745635986328, "global_step": 111153, "epoch": 1339} {"train_loss": -22.35972023010254, "global_step": 111154, "epoch": 1339} {"train_loss": -22.105344772338867, "global_step": 111155, "epoch": 1339} {"train_loss": -22.169034957885742, "global_step": 111156, "epoch": 1339} {"train_loss": -22.372873306274414, "global_step": 111157, "epoch": 1339} {"train_loss": -22.418466567993164, "global_step": 111158, "epoch": 1339} {"train_loss": -22.33761978149414, "global_step": 111159, "epoch": 1339} {"train_loss": -22.220077514648438, "global_step": 111160, "epoch": 1339} {"train_loss": -22.144256591796875, "global_step": 111161, "epoch": 1339} {"train_loss": -22.175884246826172, "global_step": 111162, "epoch": 1339} {"train_loss": -22.365131378173828, "global_step": 111163, "epoch": 1339} {"train_loss": -22.317893981933594, "global_step": 111164, "epoch": 1339} {"train_loss": -22.39923667907715, "global_step": 111165, "epoch": 1339} {"train_loss": -22.168813705444336, "global_step": 111166, "epoch": 1339} {"train_loss": -22.117095947265625, "global_step": 111167, "epoch": 1339} {"train_loss": -22.082481384277344, "global_step": 111168, "epoch": 1339} {"train_loss": -22.233436584472656, "global_step": 111169, "epoch": 1339} {"train_loss": -22.404104232788086, "global_step": 111170, "epoch": 1339} {"train_loss": -22.152118682861328, "global_step": 111171, "epoch": 1339} {"train_loss": -22.28342628479004, "global_step": 111172, "epoch": 1339} {"train_loss": -22.391366958618164, "global_step": 111173, "epoch": 1339} {"train_loss": -22.35487174987793, "global_step": 111174, "epoch": 1339} {"train_loss": -22.17852210998535, "global_step": 111175, "epoch": 1339} {"train_loss": -22.30926513671875, "global_step": 111176, "epoch": 1339} {"train_loss": -22.038782119750977, "global_step": 111177, "epoch": 1339} {"train_loss": -22.41412353515625, "global_step": 111178, "epoch": 1339} {"train_loss": -22.461044311523438, "global_step": 111179, "epoch": 1339} {"train_loss": -22.107351303100586, "global_step": 111180, "epoch": 1339} {"train_loss": -21.943241119384766, "global_step": 111181, "epoch": 1339} {"train_loss": -22.28803253173828, "global_step": 111182, "epoch": 1339} {"train_loss": -22.080381393432617, "global_step": 111183, "epoch": 1339} {"train_loss": -22.541311264038086, "global_step": 111184, "epoch": 1339} {"train_loss": -22.26320457458496, "global_step": 111185, "epoch": 1339} {"train_loss": -22.397104263305664, "global_step": 111186, "epoch": 1339} {"train_loss": -22.012786865234375, "global_step": 111187, "epoch": 1339} {"train_loss": -22.333873748779297, "global_step": 111188, "epoch": 1339} {"train_loss": -22.41608428955078, "global_step": 111189, "epoch": 1339} {"train_loss": -22.528064727783203, "global_step": 111190, "epoch": 1339} {"train_loss": -22.214189529418945, "global_step": 111191, "epoch": 1339} {"train_loss": -22.874149322509766, "global_step": 111192, "epoch": 1339} {"train_loss": -22.576335906982422, "global_step": 111193, "epoch": 1339} {"train_loss": -22.382585525512695, "global_step": 111194, "epoch": 1339} {"train_loss": -22.339298248291016, "global_step": 111195, "epoch": 1339} {"train_loss": -22.827810287475586, "global_step": 111196, "epoch": 1339} {"train_loss": -22.289051055908203, "global_step": 111197, "epoch": 1339} {"train_loss": -22.31572914123535, "global_step": 111198, "epoch": 1339} {"train_loss": -22.413497924804688, "global_step": 111199, "epoch": 1339} {"train_loss": -22.2744197845459, "global_step": 111200, "epoch": 1339} {"train_loss": -22.237747192382812, "global_step": 111201, "epoch": 1339} {"train_loss": -22.464670181274414, "global_step": 111202, "epoch": 1339} {"train_loss": -22.53699493408203, "global_step": 111203, "epoch": 1339} {"train_loss": -22.2601261138916, "global_step": 111204, "epoch": 1339} {"train_loss": -21.860679626464844, "global_step": 111205, "epoch": 1339} {"train_loss": -22.265918731689453, "global_step": 111206, "epoch": 1339} {"train_loss": -22.538589477539062, "global_step": 111207, "epoch": 1339} {"train_loss": -22.506391525268555, "global_step": 111208, "epoch": 1339} {"train_loss": -22.779678344726562, "global_step": 111209, "epoch": 1339} {"train_loss": -22.740171432495117, "global_step": 111210, "epoch": 1339} {"train_loss": -22.57948112487793, "global_step": 111211, "epoch": 1339} {"train_loss": -22.196760177612305, "global_step": 111212, "epoch": 1339} {"train_loss": -22.16595458984375, "global_step": 111213, "epoch": 1339} {"train_loss": -22.26423454284668, "global_step": 111214, "epoch": 1339} {"train_loss": -21.906126022338867, "global_step": 111215, "epoch": 1339} {"train_loss": -21.839462280273438, "global_step": 111216, "epoch": 1339} {"train_loss": -22.376272201538086, "global_step": 111217, "epoch": 1339} {"train_loss": -21.914106369018555, "global_step": 111218, "epoch": 1339} {"train_loss": -22.26507235147867, "global_step": 111219, "epoch": 1339, "val_loss": 6194938.0} {"train_loss": -21.389999389648438, "global_step": 111220, "epoch": 1340} {"train_loss": -21.7193546295166, "global_step": 111221, "epoch": 1340} {"train_loss": -21.616147994995117, "global_step": 111222, "epoch": 1340} {"train_loss": -22.432655334472656, "global_step": 111223, "epoch": 1340} {"train_loss": -21.789804458618164, "global_step": 111224, "epoch": 1340} {"train_loss": -22.282337188720703, "global_step": 111225, "epoch": 1340} {"train_loss": -21.80552101135254, "global_step": 111226, "epoch": 1340} {"train_loss": -22.111051559448242, "global_step": 111227, "epoch": 1340} {"train_loss": -22.066665649414062, "global_step": 111228, "epoch": 1340} {"train_loss": -21.923812866210938, "global_step": 111229, "epoch": 1340} {"train_loss": -21.924659729003906, "global_step": 111230, "epoch": 1340} {"train_loss": -22.126989364624023, "global_step": 111231, "epoch": 1340} {"train_loss": -22.334360122680664, "global_step": 111232, "epoch": 1340} {"train_loss": -22.16873550415039, "global_step": 111233, "epoch": 1340} {"train_loss": -21.996423721313477, "global_step": 111234, "epoch": 1340} {"train_loss": -22.34000015258789, "global_step": 111235, "epoch": 1340} {"train_loss": -22.196760177612305, "global_step": 111236, "epoch": 1340} {"train_loss": -22.0512752532959, "global_step": 111237, "epoch": 1340} {"train_loss": -22.326276779174805, "global_step": 111238, "epoch": 1340} {"train_loss": -22.11557960510254, "global_step": 111239, "epoch": 1340} {"train_loss": -22.05917739868164, "global_step": 111240, "epoch": 1340} {"train_loss": -21.93715476989746, "global_step": 111241, "epoch": 1340} {"train_loss": -22.21048355102539, "global_step": 111242, "epoch": 1340} {"train_loss": -21.99149513244629, "global_step": 111243, "epoch": 1340} {"train_loss": -22.324565887451172, "global_step": 111244, "epoch": 1340} {"train_loss": -22.3579158782959, "global_step": 111245, "epoch": 1340} {"train_loss": -22.236783981323242, "global_step": 111246, "epoch": 1340} {"train_loss": -22.166181564331055, "global_step": 111247, "epoch": 1340} {"train_loss": -22.38789176940918, "global_step": 111248, "epoch": 1340} {"train_loss": -22.524259567260742, "global_step": 111249, "epoch": 1340} {"train_loss": -22.29624366760254, "global_step": 111250, "epoch": 1340} {"train_loss": -22.53632164001465, "global_step": 111251, "epoch": 1340} {"train_loss": -21.938291549682617, "global_step": 111252, "epoch": 1340} {"train_loss": -22.061079025268555, "global_step": 111253, "epoch": 1340} {"train_loss": -22.29952049255371, "global_step": 111254, "epoch": 1340} {"train_loss": -22.238901138305664, "global_step": 111255, "epoch": 1340} {"train_loss": -22.293445587158203, "global_step": 111256, "epoch": 1340} {"train_loss": -21.996938705444336, "global_step": 111257, "epoch": 1340} {"train_loss": -22.521713256835938, "global_step": 111258, "epoch": 1340} {"train_loss": -22.519628524780273, "global_step": 111259, "epoch": 1340} {"train_loss": -22.20442771911621, "global_step": 111260, "epoch": 1340} {"train_loss": -22.146738052368164, "global_step": 111261, "epoch": 1340} {"train_loss": -22.6262264251709, "global_step": 111262, "epoch": 1340} {"train_loss": -22.066171646118164, "global_step": 111263, "epoch": 1340} {"train_loss": -22.375675201416016, "global_step": 111264, "epoch": 1340} {"train_loss": -22.424970626831055, "global_step": 111265, "epoch": 1340} {"train_loss": -22.257047653198242, "global_step": 111266, "epoch": 1340} {"train_loss": -22.254592895507812, "global_step": 111267, "epoch": 1340} {"train_loss": -22.25970458984375, "global_step": 111268, "epoch": 1340} {"train_loss": -22.583417892456055, "global_step": 111269, "epoch": 1340} {"train_loss": -22.107513427734375, "global_step": 111270, "epoch": 1340} {"train_loss": -22.108617782592773, "global_step": 111271, "epoch": 1340} {"train_loss": -22.321468353271484, "global_step": 111272, "epoch": 1340} {"train_loss": -22.33066177368164, "global_step": 111273, "epoch": 1340} {"train_loss": -22.40040397644043, "global_step": 111274, "epoch": 1340} {"train_loss": -22.09357261657715, "global_step": 111275, "epoch": 1340} {"train_loss": -22.3720645904541, "global_step": 111276, "epoch": 1340} {"train_loss": -21.964092254638672, "global_step": 111277, "epoch": 1340} {"train_loss": -22.2132511138916, "global_step": 111278, "epoch": 1340} {"train_loss": -22.08277130126953, "global_step": 111279, "epoch": 1340} {"train_loss": -22.33635139465332, "global_step": 111280, "epoch": 1340} {"train_loss": -22.30721092224121, "global_step": 111281, "epoch": 1340} {"train_loss": -22.14400291442871, "global_step": 111282, "epoch": 1340} {"train_loss": -22.526382446289062, "global_step": 111283, "epoch": 1340} {"train_loss": -22.33722496032715, "global_step": 111284, "epoch": 1340} {"train_loss": -22.547208786010742, "global_step": 111285, "epoch": 1340} {"train_loss": -22.153059005737305, "global_step": 111286, "epoch": 1340} {"train_loss": -22.557153701782227, "global_step": 111287, "epoch": 1340} {"train_loss": -22.4853458404541, "global_step": 111288, "epoch": 1340} {"train_loss": -22.38472557067871, "global_step": 111289, "epoch": 1340} {"train_loss": -22.241161346435547, "global_step": 111290, "epoch": 1340} {"train_loss": -22.126544952392578, "global_step": 111291, "epoch": 1340} {"train_loss": -22.538909912109375, "global_step": 111292, "epoch": 1340} {"train_loss": -22.05426597595215, "global_step": 111293, "epoch": 1340} {"train_loss": -22.227453231811523, "global_step": 111294, "epoch": 1340} {"train_loss": -22.108057022094727, "global_step": 111295, "epoch": 1340} {"train_loss": -22.353185653686523, "global_step": 111296, "epoch": 1340} {"train_loss": -22.83944320678711, "global_step": 111297, "epoch": 1340} {"train_loss": -22.3169002532959, "global_step": 111298, "epoch": 1340} {"train_loss": -22.27638816833496, "global_step": 111299, "epoch": 1340} {"train_loss": -22.392026901245117, "global_step": 111300, "epoch": 1340} {"train_loss": -22.328458786010742, "global_step": 111301, "epoch": 1340} {"train_loss": -22.21343617266919, "global_step": 111302, "epoch": 1340, "val_loss": 5902468.0} {"train_loss": -21.050670623779297, "global_step": 111303, "epoch": 1341} {"train_loss": -21.9564266204834, "global_step": 111304, "epoch": 1341} {"train_loss": -21.809412002563477, "global_step": 111305, "epoch": 1341} {"train_loss": -21.6784725189209, "global_step": 111306, "epoch": 1341} {"train_loss": -21.764509201049805, "global_step": 111307, "epoch": 1341} {"train_loss": -21.941455841064453, "global_step": 111308, "epoch": 1341} {"train_loss": -21.611064910888672, "global_step": 111309, "epoch": 1341} {"train_loss": -21.646438598632812, "global_step": 111310, "epoch": 1341} {"train_loss": -21.812742233276367, "global_step": 111311, "epoch": 1341} {"train_loss": -22.00208282470703, "global_step": 111312, "epoch": 1341} {"train_loss": -22.151033401489258, "global_step": 111313, "epoch": 1341} {"train_loss": -22.04623794555664, "global_step": 111314, "epoch": 1341} {"train_loss": -22.134811401367188, "global_step": 111315, "epoch": 1341} {"train_loss": -22.091537475585938, "global_step": 111316, "epoch": 1341} {"train_loss": -21.95454978942871, "global_step": 111317, "epoch": 1341} {"train_loss": -22.124282836914062, "global_step": 111318, "epoch": 1341} {"train_loss": -22.346912384033203, "global_step": 111319, "epoch": 1341} {"train_loss": -22.113889694213867, "global_step": 111320, "epoch": 1341} {"train_loss": -21.77613639831543, "global_step": 111321, "epoch": 1341} {"train_loss": -22.123878479003906, "global_step": 111322, "epoch": 1341} {"train_loss": -21.93277359008789, "global_step": 111323, "epoch": 1341} {"train_loss": -22.05535316467285, "global_step": 111324, "epoch": 1341} {"train_loss": -22.333274841308594, "global_step": 111325, "epoch": 1341} {"train_loss": -22.209671020507812, "global_step": 111326, "epoch": 1341} {"train_loss": -22.183446884155273, "global_step": 111327, "epoch": 1341} {"train_loss": -22.055662155151367, "global_step": 111328, "epoch": 1341} {"train_loss": -22.26665687561035, "global_step": 111329, "epoch": 1341} {"train_loss": -22.02164649963379, "global_step": 111330, "epoch": 1341} {"train_loss": -22.178176879882812, "global_step": 111331, "epoch": 1341} {"train_loss": -22.32023048400879, "global_step": 111332, "epoch": 1341} {"train_loss": -22.053062438964844, "global_step": 111333, "epoch": 1341} {"train_loss": -22.323043823242188, "global_step": 111334, "epoch": 1341} {"train_loss": -22.416860580444336, "global_step": 111335, "epoch": 1341} {"train_loss": -22.58830451965332, "global_step": 111336, "epoch": 1341} {"train_loss": -22.342844009399414, "global_step": 111337, "epoch": 1341} {"train_loss": -22.15177345275879, "global_step": 111338, "epoch": 1341} {"train_loss": -22.58002281188965, "global_step": 111339, "epoch": 1341} {"train_loss": -22.389005661010742, "global_step": 111340, "epoch": 1341} {"train_loss": -22.75682830810547, "global_step": 111341, "epoch": 1341} {"train_loss": -22.284027099609375, "global_step": 111342, "epoch": 1341} {"train_loss": -22.382638931274414, "global_step": 111343, "epoch": 1341} {"train_loss": -22.27688217163086, "global_step": 111344, "epoch": 1341} {"train_loss": -22.300064086914062, "global_step": 111345, "epoch": 1341} {"train_loss": -22.33221435546875, "global_step": 111346, "epoch": 1341} {"train_loss": -22.216541290283203, "global_step": 111347, "epoch": 1341} {"train_loss": -22.501239776611328, "global_step": 111348, "epoch": 1341} {"train_loss": -22.341129302978516, "global_step": 111349, "epoch": 1341} {"train_loss": -22.232046127319336, "global_step": 111350, "epoch": 1341} {"train_loss": -22.162540435791016, "global_step": 111351, "epoch": 1341} {"train_loss": -22.257505416870117, "global_step": 111352, "epoch": 1341} {"train_loss": -21.946630477905273, "global_step": 111353, "epoch": 1341} {"train_loss": -22.25843048095703, "global_step": 111354, "epoch": 1341} {"train_loss": -22.305524826049805, "global_step": 111355, "epoch": 1341} {"train_loss": -22.130292892456055, "global_step": 111356, "epoch": 1341} {"train_loss": -22.329435348510742, "global_step": 111357, "epoch": 1341} {"train_loss": -22.554052352905273, "global_step": 111358, "epoch": 1341} {"train_loss": -22.298368453979492, "global_step": 111359, "epoch": 1341} {"train_loss": -21.985891342163086, "global_step": 111360, "epoch": 1341} {"train_loss": -22.62210464477539, "global_step": 111361, "epoch": 1341} {"train_loss": -21.978940963745117, "global_step": 111362, "epoch": 1341} {"train_loss": -22.504459381103516, "global_step": 111363, "epoch": 1341} {"train_loss": -22.530611038208008, "global_step": 111364, "epoch": 1341} {"train_loss": -22.30491065979004, "global_step": 111365, "epoch": 1341} {"train_loss": -22.540746688842773, "global_step": 111366, "epoch": 1341} {"train_loss": -22.210294723510742, "global_step": 111367, "epoch": 1341} {"train_loss": -22.229955673217773, "global_step": 111368, "epoch": 1341} {"train_loss": -22.41382598876953, "global_step": 111369, "epoch": 1341} {"train_loss": -22.69951820373535, "global_step": 111370, "epoch": 1341} {"train_loss": -22.292911529541016, "global_step": 111371, "epoch": 1341} {"train_loss": -22.400054931640625, "global_step": 111372, "epoch": 1341} {"train_loss": -22.45896339416504, "global_step": 111373, "epoch": 1341} {"train_loss": -22.47067642211914, "global_step": 111374, "epoch": 1341} {"train_loss": -22.641773223876953, "global_step": 111375, "epoch": 1341} {"train_loss": -22.40570640563965, "global_step": 111376, "epoch": 1341} {"train_loss": -22.306928634643555, "global_step": 111377, "epoch": 1341} {"train_loss": -22.391151428222656, "global_step": 111378, "epoch": 1341} {"train_loss": -22.4205265045166, "global_step": 111379, "epoch": 1341} {"train_loss": -22.23093032836914, "global_step": 111380, "epoch": 1341} {"train_loss": -22.557987213134766, "global_step": 111381, "epoch": 1341} {"train_loss": -22.149105072021484, "global_step": 111382, "epoch": 1341} {"train_loss": -22.40858268737793, "global_step": 111383, "epoch": 1341} {"train_loss": -21.933679580688477, "global_step": 111384, "epoch": 1341} {"train_loss": -22.210955998983728, "global_step": 111385, "epoch": 1341, "val_loss": 6194736.0} {"train_loss": -22.156442642211914, "global_step": 111386, "epoch": 1342} {"train_loss": -21.910825729370117, "global_step": 111387, "epoch": 1342} {"train_loss": -21.691877365112305, "global_step": 111388, "epoch": 1342} {"train_loss": -22.10202980041504, "global_step": 111389, "epoch": 1342} {"train_loss": -21.819459915161133, "global_step": 111390, "epoch": 1342} {"train_loss": -22.131147384643555, "global_step": 111391, "epoch": 1342} {"train_loss": -21.885541915893555, "global_step": 111392, "epoch": 1342} {"train_loss": -21.820072174072266, "global_step": 111393, "epoch": 1342} {"train_loss": -21.995025634765625, "global_step": 111394, "epoch": 1342} {"train_loss": -22.192276000976562, "global_step": 111395, "epoch": 1342} {"train_loss": -22.252958297729492, "global_step": 111396, "epoch": 1342} {"train_loss": -22.111730575561523, "global_step": 111397, "epoch": 1342} {"train_loss": -21.95798683166504, "global_step": 111398, "epoch": 1342} {"train_loss": -22.213239669799805, "global_step": 111399, "epoch": 1342} {"train_loss": -22.000659942626953, "global_step": 111400, "epoch": 1342} {"train_loss": -22.29800033569336, "global_step": 111401, "epoch": 1342} {"train_loss": -22.307714462280273, "global_step": 111402, "epoch": 1342} {"train_loss": -22.206453323364258, "global_step": 111403, "epoch": 1342} {"train_loss": -21.970640182495117, "global_step": 111404, "epoch": 1342} {"train_loss": -22.27068519592285, "global_step": 111405, "epoch": 1342} {"train_loss": -22.087268829345703, "global_step": 111406, "epoch": 1342} {"train_loss": -22.227039337158203, "global_step": 111407, "epoch": 1342} {"train_loss": -22.28593635559082, "global_step": 111408, "epoch": 1342} {"train_loss": -22.160314559936523, "global_step": 111409, "epoch": 1342} {"train_loss": -22.12306785583496, "global_step": 111410, "epoch": 1342} {"train_loss": -22.22019386291504, "global_step": 111411, "epoch": 1342} {"train_loss": -22.264493942260742, "global_step": 111412, "epoch": 1342} {"train_loss": -22.231124877929688, "global_step": 111413, "epoch": 1342} {"train_loss": -22.330472946166992, "global_step": 111414, "epoch": 1342} {"train_loss": -22.17340660095215, "global_step": 111415, "epoch": 1342} {"train_loss": -22.35145378112793, "global_step": 111416, "epoch": 1342} {"train_loss": -22.438186645507812, "global_step": 111417, "epoch": 1342} {"train_loss": -22.258880615234375, "global_step": 111418, "epoch": 1342} {"train_loss": -22.086196899414062, "global_step": 111419, "epoch": 1342} {"train_loss": -22.159788131713867, "global_step": 111420, "epoch": 1342} {"train_loss": -22.24568748474121, "global_step": 111421, "epoch": 1342} {"train_loss": -22.05788230895996, "global_step": 111422, "epoch": 1342} {"train_loss": -22.561397552490234, "global_step": 111423, "epoch": 1342} {"train_loss": -22.270944595336914, "global_step": 111424, "epoch": 1342} {"train_loss": -22.146650314331055, "global_step": 111425, "epoch": 1342} {"train_loss": -22.36868667602539, "global_step": 111426, "epoch": 1342} {"train_loss": -22.090805053710938, "global_step": 111427, "epoch": 1342} {"train_loss": -22.22638511657715, "global_step": 111428, "epoch": 1342} {"train_loss": -22.115623474121094, "global_step": 111429, "epoch": 1342} {"train_loss": -22.395517349243164, "global_step": 111430, "epoch": 1342} {"train_loss": -22.179630279541016, "global_step": 111431, "epoch": 1342} {"train_loss": -22.48410415649414, "global_step": 111432, "epoch": 1342} {"train_loss": -22.410634994506836, "global_step": 111433, "epoch": 1342} {"train_loss": -22.42718505859375, "global_step": 111434, "epoch": 1342} {"train_loss": -22.354063034057617, "global_step": 111435, "epoch": 1342} {"train_loss": -22.33562660217285, "global_step": 111436, "epoch": 1342} {"train_loss": -22.177839279174805, "global_step": 111437, "epoch": 1342} {"train_loss": -22.409276962280273, "global_step": 111438, "epoch": 1342} {"train_loss": -22.345972061157227, "global_step": 111439, "epoch": 1342} {"train_loss": -22.381057739257812, "global_step": 111440, "epoch": 1342} {"train_loss": -22.46885108947754, "global_step": 111441, "epoch": 1342} {"train_loss": -22.57883644104004, "global_step": 111442, "epoch": 1342} {"train_loss": -22.329198837280273, "global_step": 111443, "epoch": 1342} {"train_loss": -22.394882202148438, "global_step": 111444, "epoch": 1342} {"train_loss": -22.058713912963867, "global_step": 111445, "epoch": 1342} {"train_loss": -22.224763870239258, "global_step": 111446, "epoch": 1342} {"train_loss": -22.21503257751465, "global_step": 111447, "epoch": 1342} {"train_loss": -22.452545166015625, "global_step": 111448, "epoch": 1342} {"train_loss": -22.266935348510742, "global_step": 111449, "epoch": 1342} {"train_loss": -22.255897521972656, "global_step": 111450, "epoch": 1342} {"train_loss": -22.230974197387695, "global_step": 111451, "epoch": 1342} {"train_loss": -22.650388717651367, "global_step": 111452, "epoch": 1342} {"train_loss": -22.36756706237793, "global_step": 111453, "epoch": 1342} {"train_loss": -22.134611129760742, "global_step": 111454, "epoch": 1342} {"train_loss": -22.324674606323242, "global_step": 111455, "epoch": 1342} {"train_loss": -22.689756393432617, "global_step": 111456, "epoch": 1342} {"train_loss": -22.024431228637695, "global_step": 111457, "epoch": 1342} {"train_loss": -21.989288330078125, "global_step": 111458, "epoch": 1342} {"train_loss": -22.58686637878418, "global_step": 111459, "epoch": 1342} {"train_loss": -22.344390869140625, "global_step": 111460, "epoch": 1342} {"train_loss": -22.30877685546875, "global_step": 111461, "epoch": 1342} {"train_loss": -22.229516983032227, "global_step": 111462, "epoch": 1342} {"train_loss": -22.00014305114746, "global_step": 111463, "epoch": 1342} {"train_loss": -22.493215560913086, "global_step": 111464, "epoch": 1342} {"train_loss": -22.425121307373047, "global_step": 111465, "epoch": 1342} {"train_loss": -22.33258628845215, "global_step": 111466, "epoch": 1342} {"train_loss": -21.76349449157715, "global_step": 111467, "epoch": 1342} {"train_loss": -22.23510213645108, "global_step": 111468, "epoch": 1342, "val_loss": 6220830.5} {"train_loss": -22.092164993286133, "global_step": 111469, "epoch": 1343} {"train_loss": -21.748249053955078, "global_step": 111470, "epoch": 1343} {"train_loss": -21.736337661743164, "global_step": 111471, "epoch": 1343} {"train_loss": -22.055538177490234, "global_step": 111472, "epoch": 1343} {"train_loss": -21.713499069213867, "global_step": 111473, "epoch": 1343} {"train_loss": -22.09027099609375, "global_step": 111474, "epoch": 1343} {"train_loss": -21.98896598815918, "global_step": 111475, "epoch": 1343} {"train_loss": -22.14696502685547, "global_step": 111476, "epoch": 1343} {"train_loss": -22.406606674194336, "global_step": 111477, "epoch": 1343} {"train_loss": -21.8596248626709, "global_step": 111478, "epoch": 1343} {"train_loss": -22.090383529663086, "global_step": 111479, "epoch": 1343} {"train_loss": -22.105499267578125, "global_step": 111480, "epoch": 1343} {"train_loss": -22.038711547851562, "global_step": 111481, "epoch": 1343} {"train_loss": -22.391355514526367, "global_step": 111482, "epoch": 1343} {"train_loss": -22.305614471435547, "global_step": 111483, "epoch": 1343} {"train_loss": -22.197689056396484, "global_step": 111484, "epoch": 1343} {"train_loss": -22.29938507080078, "global_step": 111485, "epoch": 1343} {"train_loss": -22.25693130493164, "global_step": 111486, "epoch": 1343} {"train_loss": -22.309417724609375, "global_step": 111487, "epoch": 1343} {"train_loss": -22.027128219604492, "global_step": 111488, "epoch": 1343} {"train_loss": -22.162582397460938, "global_step": 111489, "epoch": 1343} {"train_loss": -22.40096092224121, "global_step": 111490, "epoch": 1343} {"train_loss": -22.35671615600586, "global_step": 111491, "epoch": 1343} {"train_loss": -22.27510643005371, "global_step": 111492, "epoch": 1343} {"train_loss": -22.218263626098633, "global_step": 111493, "epoch": 1343} {"train_loss": -22.16143798828125, "global_step": 111494, "epoch": 1343} {"train_loss": -21.879047393798828, "global_step": 111495, "epoch": 1343} {"train_loss": -22.628053665161133, "global_step": 111496, "epoch": 1343} {"train_loss": -22.148012161254883, "global_step": 111497, "epoch": 1343} {"train_loss": -22.34990692138672, "global_step": 111498, "epoch": 1343} {"train_loss": -22.10135841369629, "global_step": 111499, "epoch": 1343} {"train_loss": -22.195791244506836, "global_step": 111500, "epoch": 1343} {"train_loss": -22.619678497314453, "global_step": 111501, "epoch": 1343} {"train_loss": -22.627286911010742, "global_step": 111502, "epoch": 1343} {"train_loss": -22.26072120666504, "global_step": 111503, "epoch": 1343} {"train_loss": -22.312341690063477, "global_step": 111504, "epoch": 1343} {"train_loss": -22.165685653686523, "global_step": 111505, "epoch": 1343} {"train_loss": -21.973358154296875, "global_step": 111506, "epoch": 1343} {"train_loss": -22.1892147064209, "global_step": 111507, "epoch": 1343} {"train_loss": -22.10794448852539, "global_step": 111508, "epoch": 1343} {"train_loss": -21.91455078125, "global_step": 111509, "epoch": 1343} {"train_loss": -22.562942504882812, "global_step": 111510, "epoch": 1343} {"train_loss": -22.404329299926758, "global_step": 111511, "epoch": 1343} {"train_loss": -22.17418670654297, "global_step": 111512, "epoch": 1343} {"train_loss": -22.26027488708496, "global_step": 111513, "epoch": 1343} {"train_loss": -22.212011337280273, "global_step": 111514, "epoch": 1343} {"train_loss": -22.441650390625, "global_step": 111515, "epoch": 1343} {"train_loss": -22.577198028564453, "global_step": 111516, "epoch": 1343} {"train_loss": -22.1510066986084, "global_step": 111517, "epoch": 1343} {"train_loss": -22.51276969909668, "global_step": 111518, "epoch": 1343} {"train_loss": -22.350936889648438, "global_step": 111519, "epoch": 1343} {"train_loss": -22.3155574798584, "global_step": 111520, "epoch": 1343} {"train_loss": -22.37701416015625, "global_step": 111521, "epoch": 1343} {"train_loss": -22.425853729248047, "global_step": 111522, "epoch": 1343} {"train_loss": -22.411367416381836, "global_step": 111523, "epoch": 1343} {"train_loss": -22.20720672607422, "global_step": 111524, "epoch": 1343} {"train_loss": -22.142099380493164, "global_step": 111525, "epoch": 1343} {"train_loss": -22.646005630493164, "global_step": 111526, "epoch": 1343} {"train_loss": -22.16337013244629, "global_step": 111527, "epoch": 1343} {"train_loss": -22.113536834716797, "global_step": 111528, "epoch": 1343} {"train_loss": -22.260412216186523, "global_step": 111529, "epoch": 1343} {"train_loss": -22.59026527404785, "global_step": 111530, "epoch": 1343} {"train_loss": -22.531661987304688, "global_step": 111531, "epoch": 1343} {"train_loss": -22.055740356445312, "global_step": 111532, "epoch": 1343} {"train_loss": -22.21473503112793, "global_step": 111533, "epoch": 1343} {"train_loss": -22.200098037719727, "global_step": 111534, "epoch": 1343} {"train_loss": -21.93278694152832, "global_step": 111535, "epoch": 1343} {"train_loss": -22.24607276916504, "global_step": 111536, "epoch": 1343} {"train_loss": -22.106842041015625, "global_step": 111537, "epoch": 1343} {"train_loss": -22.240386962890625, "global_step": 111538, "epoch": 1343} {"train_loss": -22.208219528198242, "global_step": 111539, "epoch": 1343} {"train_loss": -22.728933334350586, "global_step": 111540, "epoch": 1343} {"train_loss": -22.260160446166992, "global_step": 111541, "epoch": 1343} {"train_loss": -22.418582916259766, "global_step": 111542, "epoch": 1343} {"train_loss": -21.968469619750977, "global_step": 111543, "epoch": 1343} {"train_loss": -22.58186912536621, "global_step": 111544, "epoch": 1343} {"train_loss": -22.807762145996094, "global_step": 111545, "epoch": 1343} {"train_loss": -22.222003936767578, "global_step": 111546, "epoch": 1343} {"train_loss": -21.982452392578125, "global_step": 111547, "epoch": 1343} {"train_loss": -22.134613037109375, "global_step": 111548, "epoch": 1343} {"train_loss": -22.326995849609375, "global_step": 111549, "epoch": 1343} {"train_loss": -22.1107234954834, "global_step": 111550, "epoch": 1343} {"train_loss": -22.2407851161727, "global_step": 111551, "epoch": 1343, "val_loss": 6166299.5} {"train_loss": -21.787952423095703, "global_step": 111552, "epoch": 1344} {"train_loss": -21.80076026916504, "global_step": 111553, "epoch": 1344} {"train_loss": -22.061187744140625, "global_step": 111554, "epoch": 1344} {"train_loss": -21.74683952331543, "global_step": 111555, "epoch": 1344} {"train_loss": -21.84270668029785, "global_step": 111556, "epoch": 1344} {"train_loss": -21.994272232055664, "global_step": 111557, "epoch": 1344} {"train_loss": -21.643125534057617, "global_step": 111558, "epoch": 1344} {"train_loss": -22.01820182800293, "global_step": 111559, "epoch": 1344} {"train_loss": -21.52605628967285, "global_step": 111560, "epoch": 1344} {"train_loss": -21.48814582824707, "global_step": 111561, "epoch": 1344} {"train_loss": -22.011259078979492, "global_step": 111562, "epoch": 1344} {"train_loss": -21.88112449645996, "global_step": 111563, "epoch": 1344} {"train_loss": -22.301237106323242, "global_step": 111564, "epoch": 1344} {"train_loss": -22.183820724487305, "global_step": 111565, "epoch": 1344} {"train_loss": -22.185474395751953, "global_step": 111566, "epoch": 1344} {"train_loss": -22.12602424621582, "global_step": 111567, "epoch": 1344} {"train_loss": -21.584354400634766, "global_step": 111568, "epoch": 1344} {"train_loss": -22.14853858947754, "global_step": 111569, "epoch": 1344} {"train_loss": -22.015995025634766, "global_step": 111570, "epoch": 1344} {"train_loss": -22.1317195892334, "global_step": 111571, "epoch": 1344} {"train_loss": -22.032390594482422, "global_step": 111572, "epoch": 1344} {"train_loss": -21.89993667602539, "global_step": 111573, "epoch": 1344} {"train_loss": -22.001249313354492, "global_step": 111574, "epoch": 1344} {"train_loss": -21.940977096557617, "global_step": 111575, "epoch": 1344} {"train_loss": -22.27396583557129, "global_step": 111576, "epoch": 1344} {"train_loss": -22.539560317993164, "global_step": 111577, "epoch": 1344} {"train_loss": -22.246850967407227, "global_step": 111578, "epoch": 1344} {"train_loss": -22.5947208404541, "global_step": 111579, "epoch": 1344} {"train_loss": -22.466798782348633, "global_step": 111580, "epoch": 1344} {"train_loss": -22.325510025024414, "global_step": 111581, "epoch": 1344} {"train_loss": -22.09244155883789, "global_step": 111582, "epoch": 1344} {"train_loss": -22.258024215698242, "global_step": 111583, "epoch": 1344} {"train_loss": -22.794200897216797, "global_step": 111584, "epoch": 1344} {"train_loss": -22.200429916381836, "global_step": 111585, "epoch": 1344} {"train_loss": -22.20253562927246, "global_step": 111586, "epoch": 1344} {"train_loss": -22.523635864257812, "global_step": 111587, "epoch": 1344} {"train_loss": -22.22914695739746, "global_step": 111588, "epoch": 1344} {"train_loss": -22.53806495666504, "global_step": 111589, "epoch": 1344} {"train_loss": -22.372243881225586, "global_step": 111590, "epoch": 1344} {"train_loss": -22.02124786376953, "global_step": 111591, "epoch": 1344} {"train_loss": -22.005773544311523, "global_step": 111592, "epoch": 1344} {"train_loss": -22.3310604095459, "global_step": 111593, "epoch": 1344} {"train_loss": -22.2783203125, "global_step": 111594, "epoch": 1344} {"train_loss": -22.249235153198242, "global_step": 111595, "epoch": 1344} {"train_loss": -22.037446975708008, "global_step": 111596, "epoch": 1344} {"train_loss": -22.049551010131836, "global_step": 111597, "epoch": 1344} {"train_loss": -22.199369430541992, "global_step": 111598, "epoch": 1344} {"train_loss": -22.623056411743164, "global_step": 111599, "epoch": 1344} {"train_loss": -21.980636596679688, "global_step": 111600, "epoch": 1344} {"train_loss": -22.35313606262207, "global_step": 111601, "epoch": 1344} {"train_loss": -22.29566764831543, "global_step": 111602, "epoch": 1344} {"train_loss": -22.20272445678711, "global_step": 111603, "epoch": 1344} {"train_loss": -22.400291442871094, "global_step": 111604, "epoch": 1344} {"train_loss": -22.653423309326172, "global_step": 111605, "epoch": 1344} {"train_loss": -22.459970474243164, "global_step": 111606, "epoch": 1344} {"train_loss": -22.36388397216797, "global_step": 111607, "epoch": 1344} {"train_loss": -22.09364128112793, "global_step": 111608, "epoch": 1344} {"train_loss": -22.21611976623535, "global_step": 111609, "epoch": 1344} {"train_loss": -22.204160690307617, "global_step": 111610, "epoch": 1344} {"train_loss": -22.17014503479004, "global_step": 111611, "epoch": 1344} {"train_loss": -22.297086715698242, "global_step": 111612, "epoch": 1344} {"train_loss": -22.66619110107422, "global_step": 111613, "epoch": 1344} {"train_loss": -22.626632690429688, "global_step": 111614, "epoch": 1344} {"train_loss": -22.22930145263672, "global_step": 111615, "epoch": 1344} {"train_loss": -22.50447654724121, "global_step": 111616, "epoch": 1344} {"train_loss": -22.274076461791992, "global_step": 111617, "epoch": 1344} {"train_loss": -22.336477279663086, "global_step": 111618, "epoch": 1344} {"train_loss": -22.62030029296875, "global_step": 111619, "epoch": 1344} {"train_loss": -21.999032974243164, "global_step": 111620, "epoch": 1344} {"train_loss": -22.61804962158203, "global_step": 111621, "epoch": 1344} {"train_loss": -22.728097915649414, "global_step": 111622, "epoch": 1344} {"train_loss": -22.195783615112305, "global_step": 111623, "epoch": 1344} {"train_loss": -22.123798370361328, "global_step": 111624, "epoch": 1344} {"train_loss": -22.278064727783203, "global_step": 111625, "epoch": 1344} {"train_loss": -22.534709930419922, "global_step": 111626, "epoch": 1344} {"train_loss": -22.22058868408203, "global_step": 111627, "epoch": 1344} {"train_loss": -22.15291404724121, "global_step": 111628, "epoch": 1344} {"train_loss": -22.4044246673584, "global_step": 111629, "epoch": 1344} {"train_loss": -22.489377975463867, "global_step": 111630, "epoch": 1344} {"train_loss": -22.26873779296875, "global_step": 111631, "epoch": 1344} {"train_loss": -22.365800857543945, "global_step": 111632, "epoch": 1344} {"train_loss": -22.266122817993164, "global_step": 111633, "epoch": 1344} {"train_loss": -22.212287236409015, "global_step": 111634, "epoch": 1344, "val_loss": 6259625.0} {"train_loss": -21.83233642578125, "global_step": 111635, "epoch": 1345} {"train_loss": -21.561355590820312, "global_step": 111636, "epoch": 1345} {"train_loss": -22.14762306213379, "global_step": 111637, "epoch": 1345} {"train_loss": -21.73320770263672, "global_step": 111638, "epoch": 1345} {"train_loss": -21.772924423217773, "global_step": 111639, "epoch": 1345} {"train_loss": -21.7071590423584, "global_step": 111640, "epoch": 1345} {"train_loss": -21.923831939697266, "global_step": 111641, "epoch": 1345} {"train_loss": -21.94780921936035, "global_step": 111642, "epoch": 1345} {"train_loss": -21.95241355895996, "global_step": 111643, "epoch": 1345} {"train_loss": -21.415515899658203, "global_step": 111644, "epoch": 1345} {"train_loss": -21.908674240112305, "global_step": 111645, "epoch": 1345} {"train_loss": -21.874540328979492, "global_step": 111646, "epoch": 1345} {"train_loss": -22.433359146118164, "global_step": 111647, "epoch": 1345} {"train_loss": -22.231212615966797, "global_step": 111648, "epoch": 1345} {"train_loss": -21.496091842651367, "global_step": 111649, "epoch": 1345} {"train_loss": -21.992477416992188, "global_step": 111650, "epoch": 1345} {"train_loss": -21.62244987487793, "global_step": 111651, "epoch": 1345} {"train_loss": -22.317590713500977, "global_step": 111652, "epoch": 1345} {"train_loss": -22.157360076904297, "global_step": 111653, "epoch": 1345} {"train_loss": -22.25069236755371, "global_step": 111654, "epoch": 1345} {"train_loss": -22.043745040893555, "global_step": 111655, "epoch": 1345} {"train_loss": -22.041532516479492, "global_step": 111656, "epoch": 1345} {"train_loss": -22.53550148010254, "global_step": 111657, "epoch": 1345} {"train_loss": -21.830541610717773, "global_step": 111658, "epoch": 1345} {"train_loss": -22.513858795166016, "global_step": 111659, "epoch": 1345} {"train_loss": -22.46807861328125, "global_step": 111660, "epoch": 1345} {"train_loss": -22.02240753173828, "global_step": 111661, "epoch": 1345} {"train_loss": -22.159008026123047, "global_step": 111662, "epoch": 1345} {"train_loss": -22.439979553222656, "global_step": 111663, "epoch": 1345} {"train_loss": -22.20680046081543, "global_step": 111664, "epoch": 1345} {"train_loss": -22.503332138061523, "global_step": 111665, "epoch": 1345} {"train_loss": -22.124685287475586, "global_step": 111666, "epoch": 1345} {"train_loss": -22.2312068939209, "global_step": 111667, "epoch": 1345} {"train_loss": -22.665205001831055, "global_step": 111668, "epoch": 1345} {"train_loss": -22.289384841918945, "global_step": 111669, "epoch": 1345} {"train_loss": -22.340587615966797, "global_step": 111670, "epoch": 1345} {"train_loss": -22.271026611328125, "global_step": 111671, "epoch": 1345} {"train_loss": -22.3414363861084, "global_step": 111672, "epoch": 1345} {"train_loss": -22.235376358032227, "global_step": 111673, "epoch": 1345} {"train_loss": -22.16145133972168, "global_step": 111674, "epoch": 1345} {"train_loss": -22.362197875976562, "global_step": 111675, "epoch": 1345} {"train_loss": -22.261747360229492, "global_step": 111676, "epoch": 1345} {"train_loss": -22.350271224975586, "global_step": 111677, "epoch": 1345} {"train_loss": -22.262901306152344, "global_step": 111678, "epoch": 1345} {"train_loss": -22.35701560974121, "global_step": 111679, "epoch": 1345} {"train_loss": -22.279300689697266, "global_step": 111680, "epoch": 1345} {"train_loss": -22.123273849487305, "global_step": 111681, "epoch": 1345} {"train_loss": -22.657155990600586, "global_step": 111682, "epoch": 1345} {"train_loss": -22.228055953979492, "global_step": 111683, "epoch": 1345} {"train_loss": -22.14389991760254, "global_step": 111684, "epoch": 1345} {"train_loss": -22.486295700073242, "global_step": 111685, "epoch": 1345} {"train_loss": -22.35275650024414, "global_step": 111686, "epoch": 1345} {"train_loss": -22.11177635192871, "global_step": 111687, "epoch": 1345} {"train_loss": -22.0513858795166, "global_step": 111688, "epoch": 1345} {"train_loss": -21.812379837036133, "global_step": 111689, "epoch": 1345} {"train_loss": -22.33673858642578, "global_step": 111690, "epoch": 1345} {"train_loss": -22.439434051513672, "global_step": 111691, "epoch": 1345} {"train_loss": -22.610536575317383, "global_step": 111692, "epoch": 1345} {"train_loss": -22.466405868530273, "global_step": 111693, "epoch": 1345} {"train_loss": -22.539892196655273, "global_step": 111694, "epoch": 1345} {"train_loss": -22.15471839904785, "global_step": 111695, "epoch": 1345} {"train_loss": -22.25920295715332, "global_step": 111696, "epoch": 1345} {"train_loss": -22.43172264099121, "global_step": 111697, "epoch": 1345} {"train_loss": -22.37946128845215, "global_step": 111698, "epoch": 1345} {"train_loss": -22.35435676574707, "global_step": 111699, "epoch": 1345} {"train_loss": -22.230398178100586, "global_step": 111700, "epoch": 1345} {"train_loss": -22.24568748474121, "global_step": 111701, "epoch": 1345} {"train_loss": -22.195138931274414, "global_step": 111702, "epoch": 1345} {"train_loss": -22.416854858398438, "global_step": 111703, "epoch": 1345} {"train_loss": -21.865909576416016, "global_step": 111704, "epoch": 1345} {"train_loss": -22.055740356445312, "global_step": 111705, "epoch": 1345} {"train_loss": -22.2878360748291, "global_step": 111706, "epoch": 1345} {"train_loss": -21.772418975830078, "global_step": 111707, "epoch": 1345} {"train_loss": -21.788475036621094, "global_step": 111708, "epoch": 1345} {"train_loss": -21.90243911743164, "global_step": 111709, "epoch": 1345} {"train_loss": -22.246854782104492, "global_step": 111710, "epoch": 1345} {"train_loss": -21.92896270751953, "global_step": 111711, "epoch": 1345} {"train_loss": -21.86109733581543, "global_step": 111712, "epoch": 1345} {"train_loss": -22.343355178833008, "global_step": 111713, "epoch": 1345} {"train_loss": -22.328908920288086, "global_step": 111714, "epoch": 1345} {"train_loss": -22.6828556060791, "global_step": 111715, "epoch": 1345} {"train_loss": -22.41031265258789, "global_step": 111716, "epoch": 1345} {"train_loss": -22.17078572008983, "global_step": 111717, "epoch": 1345, "val_loss": 6071874.0} {"train_loss": -21.94377899169922, "global_step": 111718, "epoch": 1346} {"train_loss": -21.706253051757812, "global_step": 111719, "epoch": 1346} {"train_loss": -22.225833892822266, "global_step": 111720, "epoch": 1346} {"train_loss": -21.7093505859375, "global_step": 111721, "epoch": 1346} {"train_loss": -21.999738693237305, "global_step": 111722, "epoch": 1346} {"train_loss": -22.152057647705078, "global_step": 111723, "epoch": 1346} {"train_loss": -21.97657585144043, "global_step": 111724, "epoch": 1346} {"train_loss": -21.996702194213867, "global_step": 111725, "epoch": 1346} {"train_loss": -21.488256454467773, "global_step": 111726, "epoch": 1346} {"train_loss": -21.99433708190918, "global_step": 111727, "epoch": 1346} {"train_loss": -21.954151153564453, "global_step": 111728, "epoch": 1346} {"train_loss": -21.865598678588867, "global_step": 111729, "epoch": 1346} {"train_loss": -21.771276473999023, "global_step": 111730, "epoch": 1346} {"train_loss": -22.274608612060547, "global_step": 111731, "epoch": 1346} {"train_loss": -22.1672306060791, "global_step": 111732, "epoch": 1346} {"train_loss": -21.918045043945312, "global_step": 111733, "epoch": 1346} {"train_loss": -22.26495361328125, "global_step": 111734, "epoch": 1346} {"train_loss": -21.80723762512207, "global_step": 111735, "epoch": 1346} {"train_loss": -22.59956169128418, "global_step": 111736, "epoch": 1346} {"train_loss": -22.30582046508789, "global_step": 111737, "epoch": 1346} {"train_loss": -21.76719093322754, "global_step": 111738, "epoch": 1346} {"train_loss": -21.946378707885742, "global_step": 111739, "epoch": 1346} {"train_loss": -22.175561904907227, "global_step": 111740, "epoch": 1346} {"train_loss": -22.691360473632812, "global_step": 111741, "epoch": 1346} {"train_loss": -22.20704460144043, "global_step": 111742, "epoch": 1346} {"train_loss": -21.889432907104492, "global_step": 111743, "epoch": 1346} {"train_loss": -22.237232208251953, "global_step": 111744, "epoch": 1346} {"train_loss": -22.583559036254883, "global_step": 111745, "epoch": 1346} {"train_loss": -22.30610466003418, "global_step": 111746, "epoch": 1346} {"train_loss": -22.045503616333008, "global_step": 111747, "epoch": 1346} {"train_loss": -22.159849166870117, "global_step": 111748, "epoch": 1346} {"train_loss": -22.40015983581543, "global_step": 111749, "epoch": 1346} {"train_loss": -22.070026397705078, "global_step": 111750, "epoch": 1346} {"train_loss": -22.081079483032227, "global_step": 111751, "epoch": 1346} {"train_loss": -22.518888473510742, "global_step": 111752, "epoch": 1346} {"train_loss": -22.146865844726562, "global_step": 111753, "epoch": 1346} {"train_loss": -22.22377586364746, "global_step": 111754, "epoch": 1346} {"train_loss": -22.18988609313965, "global_step": 111755, "epoch": 1346} {"train_loss": -22.294038772583008, "global_step": 111756, "epoch": 1346} {"train_loss": -22.459449768066406, "global_step": 111757, "epoch": 1346} {"train_loss": -22.507671356201172, "global_step": 111758, "epoch": 1346} {"train_loss": -22.5502986907959, "global_step": 111759, "epoch": 1346} {"train_loss": -22.577411651611328, "global_step": 111760, "epoch": 1346} {"train_loss": -22.52849578857422, "global_step": 111761, "epoch": 1346} {"train_loss": -22.50870132446289, "global_step": 111762, "epoch": 1346} {"train_loss": -22.202468872070312, "global_step": 111763, "epoch": 1346} {"train_loss": -22.940921783447266, "global_step": 111764, "epoch": 1346} {"train_loss": -22.113737106323242, "global_step": 111765, "epoch": 1346} {"train_loss": -22.242490768432617, "global_step": 111766, "epoch": 1346} {"train_loss": -22.239789962768555, "global_step": 111767, "epoch": 1346} {"train_loss": -22.669960021972656, "global_step": 111768, "epoch": 1346} {"train_loss": -22.467329025268555, "global_step": 111769, "epoch": 1346} {"train_loss": -22.424386978149414, "global_step": 111770, "epoch": 1346} {"train_loss": -22.387475967407227, "global_step": 111771, "epoch": 1346} {"train_loss": -22.41046142578125, "global_step": 111772, "epoch": 1346} {"train_loss": -22.219348907470703, "global_step": 111773, "epoch": 1346} {"train_loss": -22.331893920898438, "global_step": 111774, "epoch": 1346} {"train_loss": -22.20345687866211, "global_step": 111775, "epoch": 1346} {"train_loss": -21.93294334411621, "global_step": 111776, "epoch": 1346} {"train_loss": -21.95100975036621, "global_step": 111777, "epoch": 1346} {"train_loss": -21.92938232421875, "global_step": 111778, "epoch": 1346} {"train_loss": -22.721126556396484, "global_step": 111779, "epoch": 1346} {"train_loss": -22.26845359802246, "global_step": 111780, "epoch": 1346} {"train_loss": -22.41577911376953, "global_step": 111781, "epoch": 1346} {"train_loss": -21.98954200744629, "global_step": 111782, "epoch": 1346} {"train_loss": -22.0941162109375, "global_step": 111783, "epoch": 1346} {"train_loss": -22.258764266967773, "global_step": 111784, "epoch": 1346} {"train_loss": -22.103412628173828, "global_step": 111785, "epoch": 1346} {"train_loss": -22.32736587524414, "global_step": 111786, "epoch": 1346} {"train_loss": -21.957075119018555, "global_step": 111787, "epoch": 1346} {"train_loss": -22.38039779663086, "global_step": 111788, "epoch": 1346} {"train_loss": -22.498178482055664, "global_step": 111789, "epoch": 1346} {"train_loss": -22.46062469482422, "global_step": 111790, "epoch": 1346} {"train_loss": -22.37909507751465, "global_step": 111791, "epoch": 1346} {"train_loss": -22.364301681518555, "global_step": 111792, "epoch": 1346} {"train_loss": -22.37264060974121, "global_step": 111793, "epoch": 1346} {"train_loss": -22.105619430541992, "global_step": 111794, "epoch": 1346} {"train_loss": -22.490665435791016, "global_step": 111795, "epoch": 1346} {"train_loss": -22.176198959350586, "global_step": 111796, "epoch": 1346} {"train_loss": -22.44059181213379, "global_step": 111797, "epoch": 1346} {"train_loss": -22.533334732055664, "global_step": 111798, "epoch": 1346} {"train_loss": -22.165727615356445, "global_step": 111799, "epoch": 1346} {"train_loss": -22.241189474082855, "global_step": 111800, "epoch": 1346, "val_loss": 6069552.5} {"train_loss": -22.032331466674805, "global_step": 111801, "epoch": 1347} {"train_loss": -21.70515251159668, "global_step": 111802, "epoch": 1347} {"train_loss": -22.011613845825195, "global_step": 111803, "epoch": 1347} {"train_loss": -21.880138397216797, "global_step": 111804, "epoch": 1347} {"train_loss": -22.49784278869629, "global_step": 111805, "epoch": 1347} {"train_loss": -21.93455696105957, "global_step": 111806, "epoch": 1347} {"train_loss": -22.08742904663086, "global_step": 111807, "epoch": 1347} {"train_loss": -22.49812889099121, "global_step": 111808, "epoch": 1347} {"train_loss": -22.0755672454834, "global_step": 111809, "epoch": 1347} {"train_loss": -22.32008171081543, "global_step": 111810, "epoch": 1347} {"train_loss": -22.158977508544922, "global_step": 111811, "epoch": 1347} {"train_loss": -22.273191452026367, "global_step": 111812, "epoch": 1347} {"train_loss": -22.297527313232422, "global_step": 111813, "epoch": 1347} {"train_loss": -22.3240909576416, "global_step": 111814, "epoch": 1347} {"train_loss": -22.456701278686523, "global_step": 111815, "epoch": 1347} {"train_loss": -22.11097526550293, "global_step": 111816, "epoch": 1347} {"train_loss": -22.543493270874023, "global_step": 111817, "epoch": 1347} {"train_loss": -22.244796752929688, "global_step": 111818, "epoch": 1347} {"train_loss": -22.351638793945312, "global_step": 111819, "epoch": 1347} {"train_loss": -22.174665451049805, "global_step": 111820, "epoch": 1347} {"train_loss": -21.998991012573242, "global_step": 111821, "epoch": 1347} {"train_loss": -22.308134078979492, "global_step": 111822, "epoch": 1347} {"train_loss": -22.518877029418945, "global_step": 111823, "epoch": 1347} {"train_loss": -22.41078758239746, "global_step": 111824, "epoch": 1347} {"train_loss": -22.133346557617188, "global_step": 111825, "epoch": 1347} {"train_loss": -22.301706314086914, "global_step": 111826, "epoch": 1347} {"train_loss": -22.24822998046875, "global_step": 111827, "epoch": 1347} {"train_loss": -22.25692367553711, "global_step": 111828, "epoch": 1347} {"train_loss": -22.438642501831055, "global_step": 111829, "epoch": 1347} {"train_loss": -22.649581909179688, "global_step": 111830, "epoch": 1347} {"train_loss": -22.414243698120117, "global_step": 111831, "epoch": 1347} {"train_loss": -22.14703941345215, "global_step": 111832, "epoch": 1347} {"train_loss": -22.03118133544922, "global_step": 111833, "epoch": 1347} {"train_loss": -22.16102409362793, "global_step": 111834, "epoch": 1347} {"train_loss": -22.487628936767578, "global_step": 111835, "epoch": 1347} {"train_loss": -21.92721939086914, "global_step": 111836, "epoch": 1347} {"train_loss": -22.288700103759766, "global_step": 111837, "epoch": 1347} {"train_loss": -22.09609603881836, "global_step": 111838, "epoch": 1347} {"train_loss": -22.562314987182617, "global_step": 111839, "epoch": 1347} {"train_loss": -22.481842041015625, "global_step": 111840, "epoch": 1347} {"train_loss": -22.098377227783203, "global_step": 111841, "epoch": 1347} {"train_loss": -22.10859489440918, "global_step": 111842, "epoch": 1347} {"train_loss": -22.388303756713867, "global_step": 111843, "epoch": 1347} {"train_loss": -22.011119842529297, "global_step": 111844, "epoch": 1347} {"train_loss": -21.928457260131836, "global_step": 111845, "epoch": 1347} {"train_loss": -22.264978408813477, "global_step": 111846, "epoch": 1347} {"train_loss": -22.23164939880371, "global_step": 111847, "epoch": 1347} {"train_loss": -21.9842472076416, "global_step": 111848, "epoch": 1347} {"train_loss": -22.49090003967285, "global_step": 111849, "epoch": 1347} {"train_loss": -22.12607765197754, "global_step": 111850, "epoch": 1347} {"train_loss": -22.17671775817871, "global_step": 111851, "epoch": 1347} {"train_loss": -22.69278335571289, "global_step": 111852, "epoch": 1347} {"train_loss": -22.172386169433594, "global_step": 111853, "epoch": 1347} {"train_loss": -22.445363998413086, "global_step": 111854, "epoch": 1347} {"train_loss": -22.310083389282227, "global_step": 111855, "epoch": 1347} {"train_loss": -22.304670333862305, "global_step": 111856, "epoch": 1347} {"train_loss": -22.375226974487305, "global_step": 111857, "epoch": 1347} {"train_loss": -22.594587326049805, "global_step": 111858, "epoch": 1347} {"train_loss": -22.399864196777344, "global_step": 111859, "epoch": 1347} {"train_loss": -22.290754318237305, "global_step": 111860, "epoch": 1347} {"train_loss": -21.896190643310547, "global_step": 111861, "epoch": 1347} {"train_loss": -22.137792587280273, "global_step": 111862, "epoch": 1347} {"train_loss": -22.285425186157227, "global_step": 111863, "epoch": 1347} {"train_loss": -22.730226516723633, "global_step": 111864, "epoch": 1347} {"train_loss": -22.278884887695312, "global_step": 111865, "epoch": 1347} {"train_loss": -22.499910354614258, "global_step": 111866, "epoch": 1347} {"train_loss": -22.07642936706543, "global_step": 111867, "epoch": 1347} {"train_loss": -22.28554344177246, "global_step": 111868, "epoch": 1347} {"train_loss": -22.30649185180664, "global_step": 111869, "epoch": 1347} {"train_loss": -21.19734764099121, "global_step": 111870, "epoch": 1347} {"train_loss": -21.483356475830078, "global_step": 111871, "epoch": 1347} {"train_loss": -22.18438148498535, "global_step": 111872, "epoch": 1347} {"train_loss": -22.277833938598633, "global_step": 111873, "epoch": 1347} {"train_loss": -22.12835693359375, "global_step": 111874, "epoch": 1347} {"train_loss": -22.523263931274414, "global_step": 111875, "epoch": 1347} {"train_loss": -22.04830551147461, "global_step": 111876, "epoch": 1347} {"train_loss": -22.31882667541504, "global_step": 111877, "epoch": 1347} {"train_loss": -22.027374267578125, "global_step": 111878, "epoch": 1347} {"train_loss": -22.38256072998047, "global_step": 111879, "epoch": 1347} {"train_loss": -22.262022018432617, "global_step": 111880, "epoch": 1347} {"train_loss": -21.74567985534668, "global_step": 111881, "epoch": 1347} {"train_loss": -22.483068466186523, "global_step": 111882, "epoch": 1347} {"train_loss": -22.225164689213397, "global_step": 111883, "epoch": 1347, "val_loss": 6136868.0} {"train_loss": -21.761966705322266, "global_step": 111884, "epoch": 1348} {"train_loss": -21.753448486328125, "global_step": 111885, "epoch": 1348} {"train_loss": -21.739545822143555, "global_step": 111886, "epoch": 1348} {"train_loss": -21.489858627319336, "global_step": 111887, "epoch": 1348} {"train_loss": -21.491559982299805, "global_step": 111888, "epoch": 1348} {"train_loss": -21.6382999420166, "global_step": 111889, "epoch": 1348} {"train_loss": -22.285511016845703, "global_step": 111890, "epoch": 1348} {"train_loss": -22.00745964050293, "global_step": 111891, "epoch": 1348} {"train_loss": -22.2000675201416, "global_step": 111892, "epoch": 1348} {"train_loss": -21.864500045776367, "global_step": 111893, "epoch": 1348} {"train_loss": -22.484277725219727, "global_step": 111894, "epoch": 1348} {"train_loss": -22.173694610595703, "global_step": 111895, "epoch": 1348} {"train_loss": -21.97060203552246, "global_step": 111896, "epoch": 1348} {"train_loss": -22.121723175048828, "global_step": 111897, "epoch": 1348} {"train_loss": -22.202533721923828, "global_step": 111898, "epoch": 1348} {"train_loss": -22.048654556274414, "global_step": 111899, "epoch": 1348} {"train_loss": -21.964603424072266, "global_step": 111900, "epoch": 1348} {"train_loss": -22.06218147277832, "global_step": 111901, "epoch": 1348} {"train_loss": -22.414474487304688, "global_step": 111902, "epoch": 1348} {"train_loss": -21.892505645751953, "global_step": 111903, "epoch": 1348} {"train_loss": -21.97481346130371, "global_step": 111904, "epoch": 1348} {"train_loss": -22.503488540649414, "global_step": 111905, "epoch": 1348} {"train_loss": -22.135099411010742, "global_step": 111906, "epoch": 1348} {"train_loss": -22.4455623626709, "global_step": 111907, "epoch": 1348} {"train_loss": -21.90164566040039, "global_step": 111908, "epoch": 1348} {"train_loss": -22.332265853881836, "global_step": 111909, "epoch": 1348} {"train_loss": -22.12143898010254, "global_step": 111910, "epoch": 1348} {"train_loss": -22.04791259765625, "global_step": 111911, "epoch": 1348} {"train_loss": -22.399131774902344, "global_step": 111912, "epoch": 1348} {"train_loss": -22.2724666595459, "global_step": 111913, "epoch": 1348} {"train_loss": -22.51565933227539, "global_step": 111914, "epoch": 1348} {"train_loss": -21.952634811401367, "global_step": 111915, "epoch": 1348} {"train_loss": -22.60801124572754, "global_step": 111916, "epoch": 1348} {"train_loss": -22.180761337280273, "global_step": 111917, "epoch": 1348} {"train_loss": -22.494157791137695, "global_step": 111918, "epoch": 1348} {"train_loss": -22.30401611328125, "global_step": 111919, "epoch": 1348} {"train_loss": -22.223554611206055, "global_step": 111920, "epoch": 1348} {"train_loss": -22.362655639648438, "global_step": 111921, "epoch": 1348} {"train_loss": -22.19359588623047, "global_step": 111922, "epoch": 1348} {"train_loss": -22.208702087402344, "global_step": 111923, "epoch": 1348} {"train_loss": -22.19788360595703, "global_step": 111924, "epoch": 1348} {"train_loss": -22.564937591552734, "global_step": 111925, "epoch": 1348} {"train_loss": -22.692333221435547, "global_step": 111926, "epoch": 1348} {"train_loss": -22.273221969604492, "global_step": 111927, "epoch": 1348} {"train_loss": -22.56314468383789, "global_step": 111928, "epoch": 1348} {"train_loss": -22.379169464111328, "global_step": 111929, "epoch": 1348} {"train_loss": -22.30058479309082, "global_step": 111930, "epoch": 1348} {"train_loss": -22.68233299255371, "global_step": 111931, "epoch": 1348} {"train_loss": -22.61409568786621, "global_step": 111932, "epoch": 1348} {"train_loss": -22.376296997070312, "global_step": 111933, "epoch": 1348} {"train_loss": -22.175586700439453, "global_step": 111934, "epoch": 1348} {"train_loss": -22.18204689025879, "global_step": 111935, "epoch": 1348} {"train_loss": -22.290416717529297, "global_step": 111936, "epoch": 1348} {"train_loss": -22.092954635620117, "global_step": 111937, "epoch": 1348} {"train_loss": -21.97224998474121, "global_step": 111938, "epoch": 1348} {"train_loss": -22.33912467956543, "global_step": 111939, "epoch": 1348} {"train_loss": -22.286691665649414, "global_step": 111940, "epoch": 1348} {"train_loss": -22.37993812561035, "global_step": 111941, "epoch": 1348} {"train_loss": -22.24190330505371, "global_step": 111942, "epoch": 1348} {"train_loss": -22.168254852294922, "global_step": 111943, "epoch": 1348} {"train_loss": -22.374189376831055, "global_step": 111944, "epoch": 1348} {"train_loss": -22.33057975769043, "global_step": 111945, "epoch": 1348} {"train_loss": -22.725276947021484, "global_step": 111946, "epoch": 1348} {"train_loss": -21.961833953857422, "global_step": 111947, "epoch": 1348} {"train_loss": -22.032075881958008, "global_step": 111948, "epoch": 1348} {"train_loss": -22.231616973876953, "global_step": 111949, "epoch": 1348} {"train_loss": -22.1076717376709, "global_step": 111950, "epoch": 1348} {"train_loss": -22.174423217773438, "global_step": 111951, "epoch": 1348} {"train_loss": -22.42128562927246, "global_step": 111952, "epoch": 1348} {"train_loss": -22.635501861572266, "global_step": 111953, "epoch": 1348} {"train_loss": -22.439252853393555, "global_step": 111954, "epoch": 1348} {"train_loss": -22.204896926879883, "global_step": 111955, "epoch": 1348} {"train_loss": -22.20842933654785, "global_step": 111956, "epoch": 1348} {"train_loss": -22.132736206054688, "global_step": 111957, "epoch": 1348} {"train_loss": -22.578393936157227, "global_step": 111958, "epoch": 1348} {"train_loss": -22.06893539428711, "global_step": 111959, "epoch": 1348} {"train_loss": -22.206146240234375, "global_step": 111960, "epoch": 1348} {"train_loss": -22.24944496154785, "global_step": 111961, "epoch": 1348} {"train_loss": -22.46065330505371, "global_step": 111962, "epoch": 1348} {"train_loss": -22.186115264892578, "global_step": 111963, "epoch": 1348} {"train_loss": -21.82465171813965, "global_step": 111964, "epoch": 1348} {"train_loss": -21.96730613708496, "global_step": 111965, "epoch": 1348} {"train_loss": -22.19827279699854, "global_step": 111966, "epoch": 1348, "val_loss": 6155679.0} {"train_loss": -21.779346466064453, "global_step": 111967, "epoch": 1349} {"train_loss": -22.266159057617188, "global_step": 111968, "epoch": 1349} {"train_loss": -22.094558715820312, "global_step": 111969, "epoch": 1349} {"train_loss": -22.002363204956055, "global_step": 111970, "epoch": 1349} {"train_loss": -21.786258697509766, "global_step": 111971, "epoch": 1349} {"train_loss": -21.629976272583008, "global_step": 111972, "epoch": 1349} {"train_loss": -21.604740142822266, "global_step": 111973, "epoch": 1349} {"train_loss": -22.064701080322266, "global_step": 111974, "epoch": 1349} {"train_loss": -22.097782135009766, "global_step": 111975, "epoch": 1349} {"train_loss": -22.47308349609375, "global_step": 111976, "epoch": 1349} {"train_loss": -21.816476821899414, "global_step": 111977, "epoch": 1349} {"train_loss": -22.086118698120117, "global_step": 111978, "epoch": 1349} {"train_loss": -21.610410690307617, "global_step": 111979, "epoch": 1349} {"train_loss": -22.13234519958496, "global_step": 111980, "epoch": 1349} {"train_loss": -22.276561737060547, "global_step": 111981, "epoch": 1349} {"train_loss": -21.992313385009766, "global_step": 111982, "epoch": 1349} {"train_loss": -22.0624942779541, "global_step": 111983, "epoch": 1349} {"train_loss": -21.968786239624023, "global_step": 111984, "epoch": 1349} {"train_loss": -22.455244064331055, "global_step": 111985, "epoch": 1349} {"train_loss": -22.065153121948242, "global_step": 111986, "epoch": 1349} {"train_loss": -22.042980194091797, "global_step": 111987, "epoch": 1349} {"train_loss": -21.92154312133789, "global_step": 111988, "epoch": 1349} {"train_loss": -22.0579891204834, "global_step": 111989, "epoch": 1349} {"train_loss": -22.369705200195312, "global_step": 111990, "epoch": 1349} {"train_loss": -22.18800163269043, "global_step": 111991, "epoch": 1349} {"train_loss": -22.42050552368164, "global_step": 111992, "epoch": 1349} {"train_loss": -22.254308700561523, "global_step": 111993, "epoch": 1349} {"train_loss": -22.054519653320312, "global_step": 111994, "epoch": 1349} {"train_loss": -22.1992244720459, "global_step": 111995, "epoch": 1349} {"train_loss": -22.21344757080078, "global_step": 111996, "epoch": 1349} {"train_loss": -22.127059936523438, "global_step": 111997, "epoch": 1349} {"train_loss": -22.58212661743164, "global_step": 111998, "epoch": 1349} {"train_loss": -22.200300216674805, "global_step": 111999, "epoch": 1349} {"train_loss": -22.32077980041504, "global_step": 112000, "epoch": 1349} {"train_loss": -22.176513671875, "global_step": 112001, "epoch": 1349} {"train_loss": -22.226852416992188, "global_step": 112002, "epoch": 1349} {"train_loss": -22.37994384765625, "global_step": 112003, "epoch": 1349} {"train_loss": -22.440717697143555, "global_step": 112004, "epoch": 1349} {"train_loss": -22.531932830810547, "global_step": 112005, "epoch": 1349} {"train_loss": -22.488515853881836, "global_step": 112006, "epoch": 1349} {"train_loss": -22.28360939025879, "global_step": 112007, "epoch": 1349} {"train_loss": -22.740859985351562, "global_step": 112008, "epoch": 1349} {"train_loss": -22.140460968017578, "global_step": 112009, "epoch": 1349} {"train_loss": -22.44205093383789, "global_step": 112010, "epoch": 1349} {"train_loss": -22.52950096130371, "global_step": 112011, "epoch": 1349} {"train_loss": -22.222558975219727, "global_step": 112012, "epoch": 1349} {"train_loss": -22.53012466430664, "global_step": 112013, "epoch": 1349} {"train_loss": -22.57001304626465, "global_step": 112014, "epoch": 1349} {"train_loss": -22.24960708618164, "global_step": 112015, "epoch": 1349} {"train_loss": -22.41510009765625, "global_step": 112016, "epoch": 1349} {"train_loss": -22.339183807373047, "global_step": 112017, "epoch": 1349} {"train_loss": -22.449005126953125, "global_step": 112018, "epoch": 1349} {"train_loss": -22.197437286376953, "global_step": 112019, "epoch": 1349} {"train_loss": -22.833608627319336, "global_step": 112020, "epoch": 1349} {"train_loss": -22.403762817382812, "global_step": 112021, "epoch": 1349} {"train_loss": -22.571866989135742, "global_step": 112022, "epoch": 1349} {"train_loss": -22.068405151367188, "global_step": 112023, "epoch": 1349} {"train_loss": -22.619909286499023, "global_step": 112024, "epoch": 1349} {"train_loss": -22.368322372436523, "global_step": 112025, "epoch": 1349} {"train_loss": -22.16611671447754, "global_step": 112026, "epoch": 1349} {"train_loss": -22.538427352905273, "global_step": 112027, "epoch": 1349} {"train_loss": -22.125829696655273, "global_step": 112028, "epoch": 1349} {"train_loss": -22.34822654724121, "global_step": 112029, "epoch": 1349} {"train_loss": -22.183914184570312, "global_step": 112030, "epoch": 1349} {"train_loss": -22.213134765625, "global_step": 112031, "epoch": 1349} {"train_loss": -22.305904388427734, "global_step": 112032, "epoch": 1349} {"train_loss": -22.507261276245117, "global_step": 112033, "epoch": 1349} {"train_loss": -22.245800018310547, "global_step": 112034, "epoch": 1349} {"train_loss": -22.10245132446289, "global_step": 112035, "epoch": 1349} {"train_loss": -22.424375534057617, "global_step": 112036, "epoch": 1349} {"train_loss": -22.41030502319336, "global_step": 112037, "epoch": 1349} {"train_loss": -22.077880859375, "global_step": 112038, "epoch": 1349} {"train_loss": -22.371458053588867, "global_step": 112039, "epoch": 1349} {"train_loss": -22.636899948120117, "global_step": 112040, "epoch": 1349} {"train_loss": -22.264862060546875, "global_step": 112041, "epoch": 1349} {"train_loss": -22.238317489624023, "global_step": 112042, "epoch": 1349} {"train_loss": -22.399555206298828, "global_step": 112043, "epoch": 1349} {"train_loss": -22.064922332763672, "global_step": 112044, "epoch": 1349} {"train_loss": -22.147851943969727, "global_step": 112045, "epoch": 1349} {"train_loss": -22.314821243286133, "global_step": 112046, "epoch": 1349} {"train_loss": -22.192588806152344, "global_step": 112047, "epoch": 1349} {"train_loss": -22.26854705810547, "global_step": 112048, "epoch": 1349} {"train_loss": -22.225382678480035, "global_step": 112049, "epoch": 1349, "val_loss": 6358028.0} {"train_loss": -21.437349319458008, "global_step": 112050, "epoch": 1350} {"train_loss": -21.377065658569336, "global_step": 112051, "epoch": 1350} {"train_loss": -21.72690200805664, "global_step": 112052, "epoch": 1350} {"train_loss": -21.459569931030273, "global_step": 112053, "epoch": 1350} {"train_loss": -21.644643783569336, "global_step": 112054, "epoch": 1350} {"train_loss": -21.822202682495117, "global_step": 112055, "epoch": 1350} {"train_loss": -21.91328239440918, "global_step": 112056, "epoch": 1350} {"train_loss": -21.914175033569336, "global_step": 112057, "epoch": 1350} {"train_loss": -21.691864013671875, "global_step": 112058, "epoch": 1350} {"train_loss": -21.999183654785156, "global_step": 112059, "epoch": 1350} {"train_loss": -22.08316421508789, "global_step": 112060, "epoch": 1350} {"train_loss": -21.644969940185547, "global_step": 112061, "epoch": 1350} {"train_loss": -21.98824691772461, "global_step": 112062, "epoch": 1350} {"train_loss": -21.88262939453125, "global_step": 112063, "epoch": 1350} {"train_loss": -21.867734909057617, "global_step": 112064, "epoch": 1350} {"train_loss": -22.0640811920166, "global_step": 112065, "epoch": 1350} {"train_loss": -21.90863037109375, "global_step": 112066, "epoch": 1350} {"train_loss": -22.063682556152344, "global_step": 112067, "epoch": 1350} {"train_loss": -22.2327938079834, "global_step": 112068, "epoch": 1350} {"train_loss": -21.82427406311035, "global_step": 112069, "epoch": 1350} {"train_loss": -21.993188858032227, "global_step": 112070, "epoch": 1350} {"train_loss": -22.34395408630371, "global_step": 112071, "epoch": 1350} {"train_loss": -22.537006378173828, "global_step": 112072, "epoch": 1350} {"train_loss": -22.073883056640625, "global_step": 112073, "epoch": 1350} {"train_loss": -22.34430503845215, "global_step": 112074, "epoch": 1350} {"train_loss": -22.158716201782227, "global_step": 112075, "epoch": 1350} {"train_loss": -22.174488067626953, "global_step": 112076, "epoch": 1350} {"train_loss": -22.314298629760742, "global_step": 112077, "epoch": 1350} {"train_loss": -22.28818702697754, "global_step": 112078, "epoch": 1350} {"train_loss": -22.059249877929688, "global_step": 112079, "epoch": 1350} {"train_loss": -22.70029067993164, "global_step": 112080, "epoch": 1350} {"train_loss": -22.13924217224121, "global_step": 112081, "epoch": 1350} {"train_loss": -22.50031089782715, "global_step": 112082, "epoch": 1350} {"train_loss": -22.72503662109375, "global_step": 112083, "epoch": 1350} {"train_loss": -21.9169864654541, "global_step": 112084, "epoch": 1350} {"train_loss": -22.224802017211914, "global_step": 112085, "epoch": 1350} {"train_loss": -22.438833236694336, "global_step": 112086, "epoch": 1350} {"train_loss": -22.167768478393555, "global_step": 112087, "epoch": 1350} {"train_loss": -22.016687393188477, "global_step": 112088, "epoch": 1350} {"train_loss": -22.534826278686523, "global_step": 112089, "epoch": 1350} {"train_loss": -22.377267837524414, "global_step": 112090, "epoch": 1350} {"train_loss": -22.20258140563965, "global_step": 112091, "epoch": 1350} {"train_loss": -22.438796997070312, "global_step": 112092, "epoch": 1350} {"train_loss": -22.377042770385742, "global_step": 112093, "epoch": 1350} {"train_loss": -22.453752517700195, "global_step": 112094, "epoch": 1350} {"train_loss": -22.51531219482422, "global_step": 112095, "epoch": 1350} {"train_loss": -22.004484176635742, "global_step": 112096, "epoch": 1350} {"train_loss": -22.022043228149414, "global_step": 112097, "epoch": 1350} {"train_loss": -22.102785110473633, "global_step": 112098, "epoch": 1350} {"train_loss": -22.4390811920166, "global_step": 112099, "epoch": 1350} {"train_loss": -22.08037757873535, "global_step": 112100, "epoch": 1350} {"train_loss": -22.124975204467773, "global_step": 112101, "epoch": 1350} {"train_loss": -22.1351375579834, "global_step": 112102, "epoch": 1350} {"train_loss": -22.508148193359375, "global_step": 112103, "epoch": 1350} {"train_loss": -22.013948440551758, "global_step": 112104, "epoch": 1350} {"train_loss": -22.44516944885254, "global_step": 112105, "epoch": 1350} {"train_loss": -22.102134704589844, "global_step": 112106, "epoch": 1350} {"train_loss": -21.96943473815918, "global_step": 112107, "epoch": 1350} {"train_loss": -22.22861671447754, "global_step": 112108, "epoch": 1350} {"train_loss": -22.309049606323242, "global_step": 112109, "epoch": 1350} {"train_loss": -22.37590980529785, "global_step": 112110, "epoch": 1350} {"train_loss": -22.243167877197266, "global_step": 112111, "epoch": 1350} {"train_loss": -22.268844604492188, "global_step": 112112, "epoch": 1350} {"train_loss": -22.209239959716797, "global_step": 112113, "epoch": 1350} {"train_loss": -22.68292236328125, "global_step": 112114, "epoch": 1350} {"train_loss": -22.61678123474121, "global_step": 112115, "epoch": 1350} {"train_loss": -22.214101791381836, "global_step": 112116, "epoch": 1350} {"train_loss": -22.355329513549805, "global_step": 112117, "epoch": 1350} {"train_loss": -22.316499710083008, "global_step": 112118, "epoch": 1350} {"train_loss": -22.319257736206055, "global_step": 112119, "epoch": 1350} {"train_loss": -22.41396141052246, "global_step": 112120, "epoch": 1350} {"train_loss": -22.178686141967773, "global_step": 112121, "epoch": 1350} {"train_loss": -22.578672409057617, "global_step": 112122, "epoch": 1350} {"train_loss": -22.360807418823242, "global_step": 112123, "epoch": 1350} {"train_loss": -22.330060958862305, "global_step": 112124, "epoch": 1350} {"train_loss": -22.0900936126709, "global_step": 112125, "epoch": 1350} {"train_loss": -22.53070068359375, "global_step": 112126, "epoch": 1350} {"train_loss": -22.611446380615234, "global_step": 112127, "epoch": 1350} {"train_loss": -22.269865036010742, "global_step": 112128, "epoch": 1350} {"train_loss": -22.38808822631836, "global_step": 112129, "epoch": 1350} {"train_loss": -22.507413864135742, "global_step": 112130, "epoch": 1350} {"train_loss": -22.32261085510254, "global_step": 112131, "epoch": 1350} {"train_loss": -22.18393854348056, "global_step": 112132, "epoch": 1350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6287222.0} {"train_loss": -22.149682998657227, "global_step": 112133, "epoch": 1351} {"train_loss": -22.11635398864746, "global_step": 112134, "epoch": 1351} {"train_loss": -22.504053115844727, "global_step": 112135, "epoch": 1351} {"train_loss": -21.661691665649414, "global_step": 112136, "epoch": 1351} {"train_loss": -22.17007064819336, "global_step": 112137, "epoch": 1351} {"train_loss": -22.325849533081055, "global_step": 112138, "epoch": 1351} {"train_loss": -22.366865158081055, "global_step": 112139, "epoch": 1351} {"train_loss": -22.173505783081055, "global_step": 112140, "epoch": 1351} {"train_loss": -22.08701515197754, "global_step": 112141, "epoch": 1351} {"train_loss": -22.3001766204834, "global_step": 112142, "epoch": 1351} {"train_loss": -21.868139266967773, "global_step": 112143, "epoch": 1351} {"train_loss": -21.98521614074707, "global_step": 112144, "epoch": 1351} {"train_loss": -22.415578842163086, "global_step": 112145, "epoch": 1351} {"train_loss": -22.51915168762207, "global_step": 112146, "epoch": 1351} {"train_loss": -22.223196029663086, "global_step": 112147, "epoch": 1351} {"train_loss": -21.982263565063477, "global_step": 112148, "epoch": 1351} {"train_loss": -22.094541549682617, "global_step": 112149, "epoch": 1351} {"train_loss": -22.441770553588867, "global_step": 112150, "epoch": 1351} {"train_loss": -22.509479522705078, "global_step": 112151, "epoch": 1351} {"train_loss": -22.31571388244629, "global_step": 112152, "epoch": 1351} {"train_loss": -22.567842483520508, "global_step": 112153, "epoch": 1351} {"train_loss": -22.484922409057617, "global_step": 112154, "epoch": 1351} {"train_loss": -22.39788055419922, "global_step": 112155, "epoch": 1351} {"train_loss": -22.45170021057129, "global_step": 112156, "epoch": 1351} {"train_loss": -22.592050552368164, "global_step": 112157, "epoch": 1351} {"train_loss": -22.237468719482422, "global_step": 112158, "epoch": 1351} {"train_loss": -22.520526885986328, "global_step": 112159, "epoch": 1351} {"train_loss": -22.2710018157959, "global_step": 112160, "epoch": 1351} {"train_loss": -22.334339141845703, "global_step": 112161, "epoch": 1351} {"train_loss": -22.367534637451172, "global_step": 112162, "epoch": 1351} {"train_loss": -22.61229133605957, "global_step": 112163, "epoch": 1351} {"train_loss": -22.230688095092773, "global_step": 112164, "epoch": 1351} {"train_loss": -22.210540771484375, "global_step": 112165, "epoch": 1351} {"train_loss": -22.041248321533203, "global_step": 112166, "epoch": 1351} {"train_loss": -22.265457153320312, "global_step": 112167, "epoch": 1351} {"train_loss": -22.230728149414062, "global_step": 112168, "epoch": 1351} {"train_loss": -22.001718521118164, "global_step": 112169, "epoch": 1351} {"train_loss": -22.428247451782227, "global_step": 112170, "epoch": 1351} {"train_loss": -22.40227699279785, "global_step": 112171, "epoch": 1351} {"train_loss": -22.37921905517578, "global_step": 112172, "epoch": 1351} {"train_loss": -22.244997024536133, "global_step": 112173, "epoch": 1351} {"train_loss": -22.408544540405273, "global_step": 112174, "epoch": 1351} {"train_loss": -22.108783721923828, "global_step": 112175, "epoch": 1351} {"train_loss": -22.32184410095215, "global_step": 112176, "epoch": 1351} {"train_loss": -22.3603458404541, "global_step": 112177, "epoch": 1351} {"train_loss": -22.548681259155273, "global_step": 112178, "epoch": 1351} {"train_loss": -22.39020347595215, "global_step": 112179, "epoch": 1351} {"train_loss": -21.96169662475586, "global_step": 112180, "epoch": 1351} {"train_loss": -22.269227981567383, "global_step": 112181, "epoch": 1351} {"train_loss": -22.193967819213867, "global_step": 112182, "epoch": 1351} {"train_loss": -22.235227584838867, "global_step": 112183, "epoch": 1351} {"train_loss": -22.42635154724121, "global_step": 112184, "epoch": 1351} {"train_loss": -22.111478805541992, "global_step": 112185, "epoch": 1351} {"train_loss": -22.359373092651367, "global_step": 112186, "epoch": 1351} {"train_loss": -22.20543098449707, "global_step": 112187, "epoch": 1351} {"train_loss": -22.237302780151367, "global_step": 112188, "epoch": 1351} {"train_loss": -22.189985275268555, "global_step": 112189, "epoch": 1351} {"train_loss": -22.135696411132812, "global_step": 112190, "epoch": 1351} {"train_loss": -22.040809631347656, "global_step": 112191, "epoch": 1351} {"train_loss": -22.427642822265625, "global_step": 112192, "epoch": 1351} {"train_loss": -21.719274520874023, "global_step": 112193, "epoch": 1351} {"train_loss": -22.255386352539062, "global_step": 112194, "epoch": 1351} {"train_loss": -21.890085220336914, "global_step": 112195, "epoch": 1351} {"train_loss": -22.355588912963867, "global_step": 112196, "epoch": 1351} {"train_loss": -22.4127254486084, "global_step": 112197, "epoch": 1351} {"train_loss": -22.0280818939209, "global_step": 112198, "epoch": 1351} {"train_loss": -22.382497787475586, "global_step": 112199, "epoch": 1351} {"train_loss": -22.198368072509766, "global_step": 112200, "epoch": 1351} {"train_loss": -22.59541130065918, "global_step": 112201, "epoch": 1351} {"train_loss": -22.270627975463867, "global_step": 112202, "epoch": 1351} {"train_loss": -22.270917892456055, "global_step": 112203, "epoch": 1351} {"train_loss": -22.154356002807617, "global_step": 112204, "epoch": 1351} {"train_loss": -22.53244972229004, "global_step": 112205, "epoch": 1351} {"train_loss": -22.0457820892334, "global_step": 112206, "epoch": 1351} {"train_loss": -22.5175838470459, "global_step": 112207, "epoch": 1351} {"train_loss": -22.219377517700195, "global_step": 112208, "epoch": 1351} {"train_loss": -22.443628311157227, "global_step": 112209, "epoch": 1351} {"train_loss": -22.36789894104004, "global_step": 112210, "epoch": 1351} {"train_loss": -22.21303939819336, "global_step": 112211, "epoch": 1351} {"train_loss": -22.27756118774414, "global_step": 112212, "epoch": 1351} {"train_loss": -22.316221237182617, "global_step": 112213, "epoch": 1351} {"train_loss": -21.85652732849121, "global_step": 112214, "epoch": 1351} {"train_loss": -22.241802813058875, "global_step": 112215, "epoch": 1351, "val_loss": 6281816.0} {"train_loss": -22.07063865661621, "global_step": 112216, "epoch": 1352} {"train_loss": -22.202503204345703, "global_step": 112217, "epoch": 1352} {"train_loss": -22.105098724365234, "global_step": 112218, "epoch": 1352} {"train_loss": -22.11248779296875, "global_step": 112219, "epoch": 1352} {"train_loss": -22.22684097290039, "global_step": 112220, "epoch": 1352} {"train_loss": -22.18048095703125, "global_step": 112221, "epoch": 1352} {"train_loss": -22.175477981567383, "global_step": 112222, "epoch": 1352} {"train_loss": -22.14765739440918, "global_step": 112223, "epoch": 1352} {"train_loss": -22.06492805480957, "global_step": 112224, "epoch": 1352} {"train_loss": -22.125112533569336, "global_step": 112225, "epoch": 1352} {"train_loss": -22.646026611328125, "global_step": 112226, "epoch": 1352} {"train_loss": -22.283634185791016, "global_step": 112227, "epoch": 1352} {"train_loss": -22.576099395751953, "global_step": 112228, "epoch": 1352} {"train_loss": -22.22035026550293, "global_step": 112229, "epoch": 1352} {"train_loss": -22.16190528869629, "global_step": 112230, "epoch": 1352} {"train_loss": -22.333120346069336, "global_step": 112231, "epoch": 1352} {"train_loss": -22.36762046813965, "global_step": 112232, "epoch": 1352} {"train_loss": -22.184146881103516, "global_step": 112233, "epoch": 1352} {"train_loss": -22.110214233398438, "global_step": 112234, "epoch": 1352} {"train_loss": -22.325164794921875, "global_step": 112235, "epoch": 1352} {"train_loss": -22.03727149963379, "global_step": 112236, "epoch": 1352} {"train_loss": -22.329496383666992, "global_step": 112237, "epoch": 1352} {"train_loss": -22.677305221557617, "global_step": 112238, "epoch": 1352} {"train_loss": -22.232324600219727, "global_step": 112239, "epoch": 1352} {"train_loss": -22.310422897338867, "global_step": 112240, "epoch": 1352} {"train_loss": -22.629770278930664, "global_step": 112241, "epoch": 1352} {"train_loss": -22.248313903808594, "global_step": 112242, "epoch": 1352} {"train_loss": -22.431371688842773, "global_step": 112243, "epoch": 1352} {"train_loss": -22.46168327331543, "global_step": 112244, "epoch": 1352} {"train_loss": -22.00421905517578, "global_step": 112245, "epoch": 1352} {"train_loss": -22.277156829833984, "global_step": 112246, "epoch": 1352} {"train_loss": -22.367889404296875, "global_step": 112247, "epoch": 1352} {"train_loss": -22.54230308532715, "global_step": 112248, "epoch": 1352} {"train_loss": -22.255395889282227, "global_step": 112249, "epoch": 1352} {"train_loss": -22.276395797729492, "global_step": 112250, "epoch": 1352} {"train_loss": -22.410024642944336, "global_step": 112251, "epoch": 1352} {"train_loss": -22.469327926635742, "global_step": 112252, "epoch": 1352} {"train_loss": -22.22920036315918, "global_step": 112253, "epoch": 1352} {"train_loss": -22.395610809326172, "global_step": 112254, "epoch": 1352} {"train_loss": -22.02685546875, "global_step": 112255, "epoch": 1352} {"train_loss": -22.496274948120117, "global_step": 112256, "epoch": 1352} {"train_loss": -22.21235466003418, "global_step": 112257, "epoch": 1352} {"train_loss": -22.020971298217773, "global_step": 112258, "epoch": 1352} {"train_loss": -22.322111129760742, "global_step": 112259, "epoch": 1352} {"train_loss": -22.299619674682617, "global_step": 112260, "epoch": 1352} {"train_loss": -22.348798751831055, "global_step": 112261, "epoch": 1352} {"train_loss": -22.367446899414062, "global_step": 112262, "epoch": 1352} {"train_loss": -21.76599884033203, "global_step": 112263, "epoch": 1352} {"train_loss": -22.152650833129883, "global_step": 112264, "epoch": 1352} {"train_loss": -22.203794479370117, "global_step": 112265, "epoch": 1352} {"train_loss": -21.8713436126709, "global_step": 112266, "epoch": 1352} {"train_loss": -21.926734924316406, "global_step": 112267, "epoch": 1352} {"train_loss": -22.434850692749023, "global_step": 112268, "epoch": 1352} {"train_loss": -22.44720458984375, "global_step": 112269, "epoch": 1352} {"train_loss": -22.375131607055664, "global_step": 112270, "epoch": 1352} {"train_loss": -22.066776275634766, "global_step": 112271, "epoch": 1352} {"train_loss": -22.32623863220215, "global_step": 112272, "epoch": 1352} {"train_loss": -22.176868438720703, "global_step": 112273, "epoch": 1352} {"train_loss": -22.18608283996582, "global_step": 112274, "epoch": 1352} {"train_loss": -22.277013778686523, "global_step": 112275, "epoch": 1352} {"train_loss": -22.687963485717773, "global_step": 112276, "epoch": 1352} {"train_loss": -22.443805694580078, "global_step": 112277, "epoch": 1352} {"train_loss": -22.14056396484375, "global_step": 112278, "epoch": 1352} {"train_loss": -22.480152130126953, "global_step": 112279, "epoch": 1352} {"train_loss": -22.08595085144043, "global_step": 112280, "epoch": 1352} {"train_loss": -22.297433853149414, "global_step": 112281, "epoch": 1352} {"train_loss": -22.571359634399414, "global_step": 112282, "epoch": 1352} {"train_loss": -22.694477081298828, "global_step": 112283, "epoch": 1352} {"train_loss": -22.08230972290039, "global_step": 112284, "epoch": 1352} {"train_loss": -22.38079071044922, "global_step": 112285, "epoch": 1352} {"train_loss": -22.315366744995117, "global_step": 112286, "epoch": 1352} {"train_loss": -22.5467472076416, "global_step": 112287, "epoch": 1352} {"train_loss": -22.27025032043457, "global_step": 112288, "epoch": 1352} {"train_loss": -21.682491302490234, "global_step": 112289, "epoch": 1352} {"train_loss": -22.351415634155273, "global_step": 112290, "epoch": 1352} {"train_loss": -22.095197677612305, "global_step": 112291, "epoch": 1352} {"train_loss": -22.273883819580078, "global_step": 112292, "epoch": 1352} {"train_loss": -22.67231559753418, "global_step": 112293, "epoch": 1352} {"train_loss": -22.02219009399414, "global_step": 112294, "epoch": 1352} {"train_loss": -22.335983276367188, "global_step": 112295, "epoch": 1352} {"train_loss": -22.16419792175293, "global_step": 112296, "epoch": 1352} {"train_loss": -22.371789932250977, "global_step": 112297, "epoch": 1352} {"train_loss": -22.246339981814465, "global_step": 112298, "epoch": 1352, "val_loss": 6114195.0} {"train_loss": -21.813322067260742, "global_step": 112299, "epoch": 1353} {"train_loss": -21.5306453704834, "global_step": 112300, "epoch": 1353} {"train_loss": -21.50459861755371, "global_step": 112301, "epoch": 1353} {"train_loss": -22.096635818481445, "global_step": 112302, "epoch": 1353} {"train_loss": -21.952009201049805, "global_step": 112303, "epoch": 1353} {"train_loss": -21.65233612060547, "global_step": 112304, "epoch": 1353} {"train_loss": -22.263391494750977, "global_step": 112305, "epoch": 1353} {"train_loss": -21.896377563476562, "global_step": 112306, "epoch": 1353} {"train_loss": -22.01526641845703, "global_step": 112307, "epoch": 1353} {"train_loss": -21.87055015563965, "global_step": 112308, "epoch": 1353} {"train_loss": -22.21333122253418, "global_step": 112309, "epoch": 1353} {"train_loss": -22.520374298095703, "global_step": 112310, "epoch": 1353} {"train_loss": -22.625059127807617, "global_step": 112311, "epoch": 1353} {"train_loss": -21.90555763244629, "global_step": 112312, "epoch": 1353} {"train_loss": -21.836843490600586, "global_step": 112313, "epoch": 1353} {"train_loss": -22.176162719726562, "global_step": 112314, "epoch": 1353} {"train_loss": -22.050683975219727, "global_step": 112315, "epoch": 1353} {"train_loss": -22.001724243164062, "global_step": 112316, "epoch": 1353} {"train_loss": -22.112897872924805, "global_step": 112317, "epoch": 1353} {"train_loss": -21.946514129638672, "global_step": 112318, "epoch": 1353} {"train_loss": -21.9205265045166, "global_step": 112319, "epoch": 1353} {"train_loss": -22.141315460205078, "global_step": 112320, "epoch": 1353} {"train_loss": -22.32857322692871, "global_step": 112321, "epoch": 1353} {"train_loss": -22.353429794311523, "global_step": 112322, "epoch": 1353} {"train_loss": -22.432661056518555, "global_step": 112323, "epoch": 1353} {"train_loss": -22.308786392211914, "global_step": 112324, "epoch": 1353} {"train_loss": -22.220346450805664, "global_step": 112325, "epoch": 1353} {"train_loss": -22.40220069885254, "global_step": 112326, "epoch": 1353} {"train_loss": -22.456989288330078, "global_step": 112327, "epoch": 1353} {"train_loss": -22.343597412109375, "global_step": 112328, "epoch": 1353} {"train_loss": -22.640422821044922, "global_step": 112329, "epoch": 1353} {"train_loss": -22.049047470092773, "global_step": 112330, "epoch": 1353} {"train_loss": -22.16594886779785, "global_step": 112331, "epoch": 1353} {"train_loss": -22.358753204345703, "global_step": 112332, "epoch": 1353} {"train_loss": -22.42071533203125, "global_step": 112333, "epoch": 1353} {"train_loss": -22.43338966369629, "global_step": 112334, "epoch": 1353} {"train_loss": -22.407596588134766, "global_step": 112335, "epoch": 1353} {"train_loss": -22.17494010925293, "global_step": 112336, "epoch": 1353} {"train_loss": -22.544315338134766, "global_step": 112337, "epoch": 1353} {"train_loss": -22.171972274780273, "global_step": 112338, "epoch": 1353} {"train_loss": -22.547739028930664, "global_step": 112339, "epoch": 1353} {"train_loss": -22.29261016845703, "global_step": 112340, "epoch": 1353} {"train_loss": -22.244075775146484, "global_step": 112341, "epoch": 1353} {"train_loss": -22.495248794555664, "global_step": 112342, "epoch": 1353} {"train_loss": -22.1889705657959, "global_step": 112343, "epoch": 1353} {"train_loss": -22.706172943115234, "global_step": 112344, "epoch": 1353} {"train_loss": -22.462677001953125, "global_step": 112345, "epoch": 1353} {"train_loss": -22.3514404296875, "global_step": 112346, "epoch": 1353} {"train_loss": -22.150632858276367, "global_step": 112347, "epoch": 1353} {"train_loss": -22.580965042114258, "global_step": 112348, "epoch": 1353} {"train_loss": -22.2523250579834, "global_step": 112349, "epoch": 1353} {"train_loss": -22.269550323486328, "global_step": 112350, "epoch": 1353} {"train_loss": -22.201221466064453, "global_step": 112351, "epoch": 1353} {"train_loss": -22.39501953125, "global_step": 112352, "epoch": 1353} {"train_loss": -22.562206268310547, "global_step": 112353, "epoch": 1353} {"train_loss": -22.376134872436523, "global_step": 112354, "epoch": 1353} {"train_loss": -22.279945373535156, "global_step": 112355, "epoch": 1353} {"train_loss": -22.266845703125, "global_step": 112356, "epoch": 1353} {"train_loss": -21.856563568115234, "global_step": 112357, "epoch": 1353} {"train_loss": -22.300373077392578, "global_step": 112358, "epoch": 1353} {"train_loss": -22.478139877319336, "global_step": 112359, "epoch": 1353} {"train_loss": -22.278013229370117, "global_step": 112360, "epoch": 1353} {"train_loss": -22.2246036529541, "global_step": 112361, "epoch": 1353} {"train_loss": -22.410022735595703, "global_step": 112362, "epoch": 1353} {"train_loss": -22.314102172851562, "global_step": 112363, "epoch": 1353} {"train_loss": -22.1179256439209, "global_step": 112364, "epoch": 1353} {"train_loss": -22.346498489379883, "global_step": 112365, "epoch": 1353} {"train_loss": -22.28533935546875, "global_step": 112366, "epoch": 1353} {"train_loss": -22.028690338134766, "global_step": 112367, "epoch": 1353} {"train_loss": -21.9227352142334, "global_step": 112368, "epoch": 1353} {"train_loss": -22.2504940032959, "global_step": 112369, "epoch": 1353} {"train_loss": -22.112667083740234, "global_step": 112370, "epoch": 1353} {"train_loss": -22.01666259765625, "global_step": 112371, "epoch": 1353} {"train_loss": -22.173198699951172, "global_step": 112372, "epoch": 1353} {"train_loss": -22.297998428344727, "global_step": 112373, "epoch": 1353} {"train_loss": -22.724964141845703, "global_step": 112374, "epoch": 1353} {"train_loss": -22.285511016845703, "global_step": 112375, "epoch": 1353} {"train_loss": -22.347105026245117, "global_step": 112376, "epoch": 1353} {"train_loss": -21.88858985900879, "global_step": 112377, "epoch": 1353} {"train_loss": -22.19722557067871, "global_step": 112378, "epoch": 1353} {"train_loss": -22.520767211914062, "global_step": 112379, "epoch": 1353} {"train_loss": -22.32179832458496, "global_step": 112380, "epoch": 1353} {"train_loss": -22.229609018348786, "global_step": 112381, "epoch": 1353, "val_loss": 6183980.0} {"train_loss": -21.320022583007812, "global_step": 112382, "epoch": 1354} {"train_loss": -21.654447555541992, "global_step": 112383, "epoch": 1354} {"train_loss": -21.784330368041992, "global_step": 112384, "epoch": 1354} {"train_loss": -21.352418899536133, "global_step": 112385, "epoch": 1354} {"train_loss": -21.5914363861084, "global_step": 112386, "epoch": 1354} {"train_loss": -21.859121322631836, "global_step": 112387, "epoch": 1354} {"train_loss": -21.46358299255371, "global_step": 112388, "epoch": 1354} {"train_loss": -21.766197204589844, "global_step": 112389, "epoch": 1354} {"train_loss": -21.774555206298828, "global_step": 112390, "epoch": 1354} {"train_loss": -22.041730880737305, "global_step": 112391, "epoch": 1354} {"train_loss": -21.647199630737305, "global_step": 112392, "epoch": 1354} {"train_loss": -21.791484832763672, "global_step": 112393, "epoch": 1354} {"train_loss": -21.62772560119629, "global_step": 112394, "epoch": 1354} {"train_loss": -21.711074829101562, "global_step": 112395, "epoch": 1354} {"train_loss": -21.882537841796875, "global_step": 112396, "epoch": 1354} {"train_loss": -21.92540168762207, "global_step": 112397, "epoch": 1354} {"train_loss": -22.0260009765625, "global_step": 112398, "epoch": 1354} {"train_loss": -22.300642013549805, "global_step": 112399, "epoch": 1354} {"train_loss": -22.067991256713867, "global_step": 112400, "epoch": 1354} {"train_loss": -21.999404907226562, "global_step": 112401, "epoch": 1354} {"train_loss": -22.049108505249023, "global_step": 112402, "epoch": 1354} {"train_loss": -21.88994026184082, "global_step": 112403, "epoch": 1354} {"train_loss": -22.09896469116211, "global_step": 112404, "epoch": 1354} {"train_loss": -22.458267211914062, "global_step": 112405, "epoch": 1354} {"train_loss": -22.147842407226562, "global_step": 112406, "epoch": 1354} {"train_loss": -21.892187118530273, "global_step": 112407, "epoch": 1354} {"train_loss": -22.25607681274414, "global_step": 112408, "epoch": 1354} {"train_loss": -22.544939041137695, "global_step": 112409, "epoch": 1354} {"train_loss": -22.120046615600586, "global_step": 112410, "epoch": 1354} {"train_loss": -22.571971893310547, "global_step": 112411, "epoch": 1354} {"train_loss": -22.385690689086914, "global_step": 112412, "epoch": 1354} {"train_loss": -22.40164566040039, "global_step": 112413, "epoch": 1354} {"train_loss": -22.174402236938477, "global_step": 112414, "epoch": 1354} {"train_loss": -22.550512313842773, "global_step": 112415, "epoch": 1354} {"train_loss": -22.517057418823242, "global_step": 112416, "epoch": 1354} {"train_loss": -22.40225601196289, "global_step": 112417, "epoch": 1354} {"train_loss": -22.607576370239258, "global_step": 112418, "epoch": 1354} {"train_loss": -22.468839645385742, "global_step": 112419, "epoch": 1354} {"train_loss": -22.347143173217773, "global_step": 112420, "epoch": 1354} {"train_loss": -22.530179977416992, "global_step": 112421, "epoch": 1354} {"train_loss": -22.208152770996094, "global_step": 112422, "epoch": 1354} {"train_loss": -22.549306869506836, "global_step": 112423, "epoch": 1354} {"train_loss": -22.682653427124023, "global_step": 112424, "epoch": 1354} {"train_loss": -22.60348892211914, "global_step": 112425, "epoch": 1354} {"train_loss": -22.244314193725586, "global_step": 112426, "epoch": 1354} {"train_loss": -22.416296005249023, "global_step": 112427, "epoch": 1354} {"train_loss": -22.235782623291016, "global_step": 112428, "epoch": 1354} {"train_loss": -21.998849868774414, "global_step": 112429, "epoch": 1354} {"train_loss": -22.481578826904297, "global_step": 112430, "epoch": 1354} {"train_loss": -22.20071029663086, "global_step": 112431, "epoch": 1354} {"train_loss": -22.52402114868164, "global_step": 112432, "epoch": 1354} {"train_loss": -22.079248428344727, "global_step": 112433, "epoch": 1354} {"train_loss": -22.498075485229492, "global_step": 112434, "epoch": 1354} {"train_loss": -22.687124252319336, "global_step": 112435, "epoch": 1354} {"train_loss": -22.584115982055664, "global_step": 112436, "epoch": 1354} {"train_loss": -22.08066177368164, "global_step": 112437, "epoch": 1354} {"train_loss": -22.212926864624023, "global_step": 112438, "epoch": 1354} {"train_loss": -22.116117477416992, "global_step": 112439, "epoch": 1354} {"train_loss": -22.472869873046875, "global_step": 112440, "epoch": 1354} {"train_loss": -22.357501983642578, "global_step": 112441, "epoch": 1354} {"train_loss": -22.40472412109375, "global_step": 112442, "epoch": 1354} {"train_loss": -22.461950302124023, "global_step": 112443, "epoch": 1354} {"train_loss": -22.000516891479492, "global_step": 112444, "epoch": 1354} {"train_loss": -22.420948028564453, "global_step": 112445, "epoch": 1354} {"train_loss": -22.940322875976562, "global_step": 112446, "epoch": 1354} {"train_loss": -22.368934631347656, "global_step": 112447, "epoch": 1354} {"train_loss": -21.93505859375, "global_step": 112448, "epoch": 1354} {"train_loss": -22.50800132751465, "global_step": 112449, "epoch": 1354} {"train_loss": -22.224029541015625, "global_step": 112450, "epoch": 1354} {"train_loss": -22.010059356689453, "global_step": 112451, "epoch": 1354} {"train_loss": -22.326391220092773, "global_step": 112452, "epoch": 1354} {"train_loss": -22.57894515991211, "global_step": 112453, "epoch": 1354} {"train_loss": -22.001264572143555, "global_step": 112454, "epoch": 1354} {"train_loss": -22.645280838012695, "global_step": 112455, "epoch": 1354} {"train_loss": -22.200355529785156, "global_step": 112456, "epoch": 1354} {"train_loss": -21.892778396606445, "global_step": 112457, "epoch": 1354} {"train_loss": -22.478479385375977, "global_step": 112458, "epoch": 1354} {"train_loss": -22.073333740234375, "global_step": 112459, "epoch": 1354} {"train_loss": -22.390661239624023, "global_step": 112460, "epoch": 1354} {"train_loss": -22.308300018310547, "global_step": 112461, "epoch": 1354} {"train_loss": -22.187936782836914, "global_step": 112462, "epoch": 1354} {"train_loss": -22.542221069335938, "global_step": 112463, "epoch": 1354} {"train_loss": -22.217667407300098, "global_step": 112464, "epoch": 1354, "val_loss": 6281934.0} {"train_loss": -21.016159057617188, "global_step": 112465, "epoch": 1355} {"train_loss": -21.517446517944336, "global_step": 112466, "epoch": 1355} {"train_loss": -21.849958419799805, "global_step": 112467, "epoch": 1355} {"train_loss": -21.941482543945312, "global_step": 112468, "epoch": 1355} {"train_loss": -21.533456802368164, "global_step": 112469, "epoch": 1355} {"train_loss": -22.019451141357422, "global_step": 112470, "epoch": 1355} {"train_loss": -22.171951293945312, "global_step": 112471, "epoch": 1355} {"train_loss": -21.60109519958496, "global_step": 112472, "epoch": 1355} {"train_loss": -22.13163185119629, "global_step": 112473, "epoch": 1355} {"train_loss": -21.841266632080078, "global_step": 112474, "epoch": 1355} {"train_loss": -21.994796752929688, "global_step": 112475, "epoch": 1355} {"train_loss": -22.079069137573242, "global_step": 112476, "epoch": 1355} {"train_loss": -22.068225860595703, "global_step": 112477, "epoch": 1355} {"train_loss": -21.864492416381836, "global_step": 112478, "epoch": 1355} {"train_loss": -22.010190963745117, "global_step": 112479, "epoch": 1355} {"train_loss": -22.170827865600586, "global_step": 112480, "epoch": 1355} {"train_loss": -22.064640045166016, "global_step": 112481, "epoch": 1355} {"train_loss": -21.875354766845703, "global_step": 112482, "epoch": 1355} {"train_loss": -22.041221618652344, "global_step": 112483, "epoch": 1355} {"train_loss": -22.14069938659668, "global_step": 112484, "epoch": 1355} {"train_loss": -21.95867347717285, "global_step": 112485, "epoch": 1355} {"train_loss": -22.09394645690918, "global_step": 112486, "epoch": 1355} {"train_loss": -22.122787475585938, "global_step": 112487, "epoch": 1355} {"train_loss": -22.296222686767578, "global_step": 112488, "epoch": 1355} {"train_loss": -22.435989379882812, "global_step": 112489, "epoch": 1355} {"train_loss": -22.334272384643555, "global_step": 112490, "epoch": 1355} {"train_loss": -22.43588638305664, "global_step": 112491, "epoch": 1355} {"train_loss": -22.301095962524414, "global_step": 112492, "epoch": 1355} {"train_loss": -22.393007278442383, "global_step": 112493, "epoch": 1355} {"train_loss": -22.221269607543945, "global_step": 112494, "epoch": 1355} {"train_loss": -22.494897842407227, "global_step": 112495, "epoch": 1355} {"train_loss": -22.279268264770508, "global_step": 112496, "epoch": 1355} {"train_loss": -22.61884117126465, "global_step": 112497, "epoch": 1355} {"train_loss": -22.49159049987793, "global_step": 112498, "epoch": 1355} {"train_loss": -22.1365966796875, "global_step": 112499, "epoch": 1355} {"train_loss": -22.627225875854492, "global_step": 112500, "epoch": 1355} {"train_loss": -22.377796173095703, "global_step": 112501, "epoch": 1355} {"train_loss": -22.170352935791016, "global_step": 112502, "epoch": 1355} {"train_loss": -22.331541061401367, "global_step": 112503, "epoch": 1355} {"train_loss": -22.113340377807617, "global_step": 112504, "epoch": 1355} {"train_loss": -22.448514938354492, "global_step": 112505, "epoch": 1355} {"train_loss": -22.50459861755371, "global_step": 112506, "epoch": 1355} {"train_loss": -22.40313720703125, "global_step": 112507, "epoch": 1355} {"train_loss": -21.956220626831055, "global_step": 112508, "epoch": 1355} {"train_loss": -22.653982162475586, "global_step": 112509, "epoch": 1355} {"train_loss": -22.19900131225586, "global_step": 112510, "epoch": 1355} {"train_loss": -22.22623634338379, "global_step": 112511, "epoch": 1355} {"train_loss": -21.936960220336914, "global_step": 112512, "epoch": 1355} {"train_loss": -22.12052345275879, "global_step": 112513, "epoch": 1355} {"train_loss": -22.39065933227539, "global_step": 112514, "epoch": 1355} {"train_loss": -22.241910934448242, "global_step": 112515, "epoch": 1355} {"train_loss": -22.269166946411133, "global_step": 112516, "epoch": 1355} {"train_loss": -22.69541358947754, "global_step": 112517, "epoch": 1355} {"train_loss": -22.298227310180664, "global_step": 112518, "epoch": 1355} {"train_loss": -22.42279624938965, "global_step": 112519, "epoch": 1355} {"train_loss": -22.299793243408203, "global_step": 112520, "epoch": 1355} {"train_loss": -22.561574935913086, "global_step": 112521, "epoch": 1355} {"train_loss": -22.721363067626953, "global_step": 112522, "epoch": 1355} {"train_loss": -22.349512100219727, "global_step": 112523, "epoch": 1355} {"train_loss": -22.48013687133789, "global_step": 112524, "epoch": 1355} {"train_loss": -22.203479766845703, "global_step": 112525, "epoch": 1355} {"train_loss": -22.41092872619629, "global_step": 112526, "epoch": 1355} {"train_loss": -22.25775909423828, "global_step": 112527, "epoch": 1355} {"train_loss": -22.588741302490234, "global_step": 112528, "epoch": 1355} {"train_loss": -22.511632919311523, "global_step": 112529, "epoch": 1355} {"train_loss": -22.728851318359375, "global_step": 112530, "epoch": 1355} {"train_loss": -22.510923385620117, "global_step": 112531, "epoch": 1355} {"train_loss": -22.425077438354492, "global_step": 112532, "epoch": 1355} {"train_loss": -22.769882202148438, "global_step": 112533, "epoch": 1355} {"train_loss": -22.171329498291016, "global_step": 112534, "epoch": 1355} {"train_loss": -22.231494903564453, "global_step": 112535, "epoch": 1355} {"train_loss": -22.231168746948242, "global_step": 112536, "epoch": 1355} {"train_loss": -22.234060287475586, "global_step": 112537, "epoch": 1355} {"train_loss": -22.44085693359375, "global_step": 112538, "epoch": 1355} {"train_loss": -22.256916046142578, "global_step": 112539, "epoch": 1355} {"train_loss": -22.014324188232422, "global_step": 112540, "epoch": 1355} {"train_loss": -22.23369789123535, "global_step": 112541, "epoch": 1355} {"train_loss": -22.166095733642578, "global_step": 112542, "epoch": 1355} {"train_loss": -22.096965789794922, "global_step": 112543, "epoch": 1355} {"train_loss": -22.343000411987305, "global_step": 112544, "epoch": 1355} {"train_loss": -22.38591957092285, "global_step": 112545, "epoch": 1355} {"train_loss": -22.521581649780273, "global_step": 112546, "epoch": 1355} {"train_loss": -22.255250609064678, "global_step": 112547, "epoch": 1355, "val_loss": 6321563.0} {"train_loss": -21.399625778198242, "global_step": 112548, "epoch": 1356} {"train_loss": -21.182830810546875, "global_step": 112549, "epoch": 1356} {"train_loss": -21.942777633666992, "global_step": 112550, "epoch": 1356} {"train_loss": -21.415637969970703, "global_step": 112551, "epoch": 1356} {"train_loss": -21.605514526367188, "global_step": 112552, "epoch": 1356} {"train_loss": -22.023168563842773, "global_step": 112553, "epoch": 1356} {"train_loss": -21.31195640563965, "global_step": 112554, "epoch": 1356} {"train_loss": -21.698564529418945, "global_step": 112555, "epoch": 1356} {"train_loss": -21.824644088745117, "global_step": 112556, "epoch": 1356} {"train_loss": -21.797773361206055, "global_step": 112557, "epoch": 1356} {"train_loss": -21.784521102905273, "global_step": 112558, "epoch": 1356} {"train_loss": -22.018354415893555, "global_step": 112559, "epoch": 1356} {"train_loss": -21.76799201965332, "global_step": 112560, "epoch": 1356} {"train_loss": -22.13786506652832, "global_step": 112561, "epoch": 1356} {"train_loss": -21.739879608154297, "global_step": 112562, "epoch": 1356} {"train_loss": -21.90577507019043, "global_step": 112563, "epoch": 1356} {"train_loss": -22.380491256713867, "global_step": 112564, "epoch": 1356} {"train_loss": -21.751493453979492, "global_step": 112565, "epoch": 1356} {"train_loss": -21.76914405822754, "global_step": 112566, "epoch": 1356} {"train_loss": -22.4776611328125, "global_step": 112567, "epoch": 1356} {"train_loss": -21.902721405029297, "global_step": 112568, "epoch": 1356} {"train_loss": -22.242145538330078, "global_step": 112569, "epoch": 1356} {"train_loss": -22.605627059936523, "global_step": 112570, "epoch": 1356} {"train_loss": -22.495595932006836, "global_step": 112571, "epoch": 1356} {"train_loss": -22.308168411254883, "global_step": 112572, "epoch": 1356} {"train_loss": -22.3612060546875, "global_step": 112573, "epoch": 1356} {"train_loss": -22.470022201538086, "global_step": 112574, "epoch": 1356} {"train_loss": -21.888620376586914, "global_step": 112575, "epoch": 1356} {"train_loss": -22.410762786865234, "global_step": 112576, "epoch": 1356} {"train_loss": -22.343626022338867, "global_step": 112577, "epoch": 1356} {"train_loss": -22.52251434326172, "global_step": 112578, "epoch": 1356} {"train_loss": -22.266403198242188, "global_step": 112579, "epoch": 1356} {"train_loss": -22.401166915893555, "global_step": 112580, "epoch": 1356} {"train_loss": -22.250240325927734, "global_step": 112581, "epoch": 1356} {"train_loss": -21.93068504333496, "global_step": 112582, "epoch": 1356} {"train_loss": -22.60861587524414, "global_step": 112583, "epoch": 1356} {"train_loss": -22.6088924407959, "global_step": 112584, "epoch": 1356} {"train_loss": -22.096532821655273, "global_step": 112585, "epoch": 1356} {"train_loss": -22.52931785583496, "global_step": 112586, "epoch": 1356} {"train_loss": -22.294998168945312, "global_step": 112587, "epoch": 1356} {"train_loss": -22.28708267211914, "global_step": 112588, "epoch": 1356} {"train_loss": -22.092205047607422, "global_step": 112589, "epoch": 1356} {"train_loss": -22.502622604370117, "global_step": 112590, "epoch": 1356} {"train_loss": -22.033424377441406, "global_step": 112591, "epoch": 1356} {"train_loss": -21.962696075439453, "global_step": 112592, "epoch": 1356} {"train_loss": -22.627592086791992, "global_step": 112593, "epoch": 1356} {"train_loss": -22.483850479125977, "global_step": 112594, "epoch": 1356} {"train_loss": -22.464506149291992, "global_step": 112595, "epoch": 1356} {"train_loss": -22.11496353149414, "global_step": 112596, "epoch": 1356} {"train_loss": -22.369827270507812, "global_step": 112597, "epoch": 1356} {"train_loss": -22.178762435913086, "global_step": 112598, "epoch": 1356} {"train_loss": -22.4139461517334, "global_step": 112599, "epoch": 1356} {"train_loss": -22.573522567749023, "global_step": 112600, "epoch": 1356} {"train_loss": -22.524442672729492, "global_step": 112601, "epoch": 1356} {"train_loss": -22.515310287475586, "global_step": 112602, "epoch": 1356} {"train_loss": -22.50772476196289, "global_step": 112603, "epoch": 1356} {"train_loss": -21.97031021118164, "global_step": 112604, "epoch": 1356} {"train_loss": -21.939725875854492, "global_step": 112605, "epoch": 1356} {"train_loss": -22.147974014282227, "global_step": 112606, "epoch": 1356} {"train_loss": -22.269916534423828, "global_step": 112607, "epoch": 1356} {"train_loss": -22.113697052001953, "global_step": 112608, "epoch": 1356} {"train_loss": -22.39898109436035, "global_step": 112609, "epoch": 1356} {"train_loss": -22.346759796142578, "global_step": 112610, "epoch": 1356} {"train_loss": -22.069555282592773, "global_step": 112611, "epoch": 1356} {"train_loss": -22.27913475036621, "global_step": 112612, "epoch": 1356} {"train_loss": -22.00282096862793, "global_step": 112613, "epoch": 1356} {"train_loss": -22.277420043945312, "global_step": 112614, "epoch": 1356} {"train_loss": -21.931520462036133, "global_step": 112615, "epoch": 1356} {"train_loss": -22.592863082885742, "global_step": 112616, "epoch": 1356} {"train_loss": -22.18115234375, "global_step": 112617, "epoch": 1356} {"train_loss": -22.224506378173828, "global_step": 112618, "epoch": 1356} {"train_loss": -22.122739791870117, "global_step": 112619, "epoch": 1356} {"train_loss": -22.648466110229492, "global_step": 112620, "epoch": 1356} {"train_loss": -22.08139419555664, "global_step": 112621, "epoch": 1356} {"train_loss": -22.080917358398438, "global_step": 112622, "epoch": 1356} {"train_loss": -22.165212631225586, "global_step": 112623, "epoch": 1356} {"train_loss": -22.003326416015625, "global_step": 112624, "epoch": 1356} {"train_loss": -22.509326934814453, "global_step": 112625, "epoch": 1356} {"train_loss": -22.236604690551758, "global_step": 112626, "epoch": 1356} {"train_loss": -22.30156898498535, "global_step": 112627, "epoch": 1356} {"train_loss": -22.319578170776367, "global_step": 112628, "epoch": 1356} {"train_loss": -22.068090438842773, "global_step": 112629, "epoch": 1356} {"train_loss": -22.16096597694489, "global_step": 112630, "epoch": 1356, "val_loss": 6293893.5} {"train_loss": -21.711624145507812, "global_step": 112631, "epoch": 1357} {"train_loss": -22.105039596557617, "global_step": 112632, "epoch": 1357} {"train_loss": -22.147079467773438, "global_step": 112633, "epoch": 1357} {"train_loss": -22.32832145690918, "global_step": 112634, "epoch": 1357} {"train_loss": -21.911169052124023, "global_step": 112635, "epoch": 1357} {"train_loss": -22.567365646362305, "global_step": 112636, "epoch": 1357} {"train_loss": -22.03946304321289, "global_step": 112637, "epoch": 1357} {"train_loss": -22.05931854248047, "global_step": 112638, "epoch": 1357} {"train_loss": -21.974292755126953, "global_step": 112639, "epoch": 1357} {"train_loss": -22.117143630981445, "global_step": 112640, "epoch": 1357} {"train_loss": -21.651716232299805, "global_step": 112641, "epoch": 1357} {"train_loss": -22.6206111907959, "global_step": 112642, "epoch": 1357} {"train_loss": -22.211156845092773, "global_step": 112643, "epoch": 1357} {"train_loss": -22.373640060424805, "global_step": 112644, "epoch": 1357} {"train_loss": -22.597984313964844, "global_step": 112645, "epoch": 1357} {"train_loss": -22.006927490234375, "global_step": 112646, "epoch": 1357} {"train_loss": -22.10772132873535, "global_step": 112647, "epoch": 1357} {"train_loss": -22.437776565551758, "global_step": 112648, "epoch": 1357} {"train_loss": -22.361074447631836, "global_step": 112649, "epoch": 1357} {"train_loss": -21.766098022460938, "global_step": 112650, "epoch": 1357} {"train_loss": -22.25600814819336, "global_step": 112651, "epoch": 1357} {"train_loss": -22.11379051208496, "global_step": 112652, "epoch": 1357} {"train_loss": -22.060352325439453, "global_step": 112653, "epoch": 1357} {"train_loss": -22.396530151367188, "global_step": 112654, "epoch": 1357} {"train_loss": -22.340566635131836, "global_step": 112655, "epoch": 1357} {"train_loss": -22.553237915039062, "global_step": 112656, "epoch": 1357} {"train_loss": -22.005720138549805, "global_step": 112657, "epoch": 1357} {"train_loss": -22.451732635498047, "global_step": 112658, "epoch": 1357} {"train_loss": -22.398019790649414, "global_step": 112659, "epoch": 1357} {"train_loss": -22.20285415649414, "global_step": 112660, "epoch": 1357} {"train_loss": -22.45965576171875, "global_step": 112661, "epoch": 1357} {"train_loss": -22.492319107055664, "global_step": 112662, "epoch": 1357} {"train_loss": -22.179319381713867, "global_step": 112663, "epoch": 1357} {"train_loss": -22.463937759399414, "global_step": 112664, "epoch": 1357} {"train_loss": -22.430795669555664, "global_step": 112665, "epoch": 1357} {"train_loss": -22.42671012878418, "global_step": 112666, "epoch": 1357} {"train_loss": -22.534107208251953, "global_step": 112667, "epoch": 1357} {"train_loss": -22.398326873779297, "global_step": 112668, "epoch": 1357} {"train_loss": -22.25333023071289, "global_step": 112669, "epoch": 1357} {"train_loss": -22.356231689453125, "global_step": 112670, "epoch": 1357} {"train_loss": -22.21645164489746, "global_step": 112671, "epoch": 1357} {"train_loss": -22.254776000976562, "global_step": 112672, "epoch": 1357} {"train_loss": -22.15511131286621, "global_step": 112673, "epoch": 1357} {"train_loss": -22.078550338745117, "global_step": 112674, "epoch": 1357} {"train_loss": -22.416006088256836, "global_step": 112675, "epoch": 1357} {"train_loss": -22.82046890258789, "global_step": 112676, "epoch": 1357} {"train_loss": -22.328079223632812, "global_step": 112677, "epoch": 1357} {"train_loss": -22.103113174438477, "global_step": 112678, "epoch": 1357} {"train_loss": -22.267169952392578, "global_step": 112679, "epoch": 1357} {"train_loss": -22.407678604125977, "global_step": 112680, "epoch": 1357} {"train_loss": -22.814376831054688, "global_step": 112681, "epoch": 1357} {"train_loss": -22.553674697875977, "global_step": 112682, "epoch": 1357} {"train_loss": -21.7109317779541, "global_step": 112683, "epoch": 1357} {"train_loss": -22.398073196411133, "global_step": 112684, "epoch": 1357} {"train_loss": -22.45241355895996, "global_step": 112685, "epoch": 1357} {"train_loss": -22.428464889526367, "global_step": 112686, "epoch": 1357} {"train_loss": -22.295795440673828, "global_step": 112687, "epoch": 1357} {"train_loss": -22.423202514648438, "global_step": 112688, "epoch": 1357} {"train_loss": -21.735374450683594, "global_step": 112689, "epoch": 1357} {"train_loss": -22.064956665039062, "global_step": 112690, "epoch": 1357} {"train_loss": -22.160829544067383, "global_step": 112691, "epoch": 1357} {"train_loss": -22.143630981445312, "global_step": 112692, "epoch": 1357} {"train_loss": -22.513463973999023, "global_step": 112693, "epoch": 1357} {"train_loss": -21.86014747619629, "global_step": 112694, "epoch": 1357} {"train_loss": -21.99310874938965, "global_step": 112695, "epoch": 1357} {"train_loss": -22.00990104675293, "global_step": 112696, "epoch": 1357} {"train_loss": -22.26638412475586, "global_step": 112697, "epoch": 1357} {"train_loss": -21.9586181640625, "global_step": 112698, "epoch": 1357} {"train_loss": -22.544540405273438, "global_step": 112699, "epoch": 1357} {"train_loss": -21.96501350402832, "global_step": 112700, "epoch": 1357} {"train_loss": -22.28130340576172, "global_step": 112701, "epoch": 1357} {"train_loss": -22.175039291381836, "global_step": 112702, "epoch": 1357} {"train_loss": -22.670190811157227, "global_step": 112703, "epoch": 1357} {"train_loss": -22.408130645751953, "global_step": 112704, "epoch": 1357} {"train_loss": -22.276134490966797, "global_step": 112705, "epoch": 1357} {"train_loss": -22.244613647460938, "global_step": 112706, "epoch": 1357} {"train_loss": -22.341093063354492, "global_step": 112707, "epoch": 1357} {"train_loss": -22.406269073486328, "global_step": 112708, "epoch": 1357} {"train_loss": -22.080739974975586, "global_step": 112709, "epoch": 1357} {"train_loss": -22.38454246520996, "global_step": 112710, "epoch": 1357} {"train_loss": -22.34869956970215, "global_step": 112711, "epoch": 1357} {"train_loss": -22.397354125976562, "global_step": 112712, "epoch": 1357} {"train_loss": -22.268793312900037, "global_step": 112713, "epoch": 1357, "val_loss": 6339797.0} {"train_loss": -22.02034568786621, "global_step": 112714, "epoch": 1358} {"train_loss": -22.00716209411621, "global_step": 112715, "epoch": 1358} {"train_loss": -21.817548751831055, "global_step": 112716, "epoch": 1358} {"train_loss": -21.60823631286621, "global_step": 112717, "epoch": 1358} {"train_loss": -21.898168563842773, "global_step": 112718, "epoch": 1358} {"train_loss": -21.830350875854492, "global_step": 112719, "epoch": 1358} {"train_loss": -21.663833618164062, "global_step": 112720, "epoch": 1358} {"train_loss": -21.95853042602539, "global_step": 112721, "epoch": 1358} {"train_loss": -22.046947479248047, "global_step": 112722, "epoch": 1358} {"train_loss": -22.061878204345703, "global_step": 112723, "epoch": 1358} {"train_loss": -22.434186935424805, "global_step": 112724, "epoch": 1358} {"train_loss": -21.98761558532715, "global_step": 112725, "epoch": 1358} {"train_loss": -22.002288818359375, "global_step": 112726, "epoch": 1358} {"train_loss": -22.115198135375977, "global_step": 112727, "epoch": 1358} {"train_loss": -22.23555564880371, "global_step": 112728, "epoch": 1358} {"train_loss": -21.964052200317383, "global_step": 112729, "epoch": 1358} {"train_loss": -21.99675941467285, "global_step": 112730, "epoch": 1358} {"train_loss": -22.206327438354492, "global_step": 112731, "epoch": 1358} {"train_loss": -22.28709602355957, "global_step": 112732, "epoch": 1358} {"train_loss": -22.034738540649414, "global_step": 112733, "epoch": 1358} {"train_loss": -22.2751522064209, "global_step": 112734, "epoch": 1358} {"train_loss": -22.283828735351562, "global_step": 112735, "epoch": 1358} {"train_loss": -21.990568161010742, "global_step": 112736, "epoch": 1358} {"train_loss": -22.19879722595215, "global_step": 112737, "epoch": 1358} {"train_loss": -21.90641212463379, "global_step": 112738, "epoch": 1358} {"train_loss": -22.295623779296875, "global_step": 112739, "epoch": 1358} {"train_loss": -22.441558837890625, "global_step": 112740, "epoch": 1358} {"train_loss": -22.27019691467285, "global_step": 112741, "epoch": 1358} {"train_loss": -22.33770179748535, "global_step": 112742, "epoch": 1358} {"train_loss": -22.493377685546875, "global_step": 112743, "epoch": 1358} {"train_loss": -22.619958877563477, "global_step": 112744, "epoch": 1358} {"train_loss": -22.282550811767578, "global_step": 112745, "epoch": 1358} {"train_loss": -22.359479904174805, "global_step": 112746, "epoch": 1358} {"train_loss": -22.109073638916016, "global_step": 112747, "epoch": 1358} {"train_loss": -22.300195693969727, "global_step": 112748, "epoch": 1358} {"train_loss": -22.12186050415039, "global_step": 112749, "epoch": 1358} {"train_loss": -22.569107055664062, "global_step": 112750, "epoch": 1358} {"train_loss": -22.494020462036133, "global_step": 112751, "epoch": 1358} {"train_loss": -22.387968063354492, "global_step": 112752, "epoch": 1358} {"train_loss": -22.49195671081543, "global_step": 112753, "epoch": 1358} {"train_loss": -22.091825485229492, "global_step": 112754, "epoch": 1358} {"train_loss": -22.40346336364746, "global_step": 112755, "epoch": 1358} {"train_loss": -22.13378143310547, "global_step": 112756, "epoch": 1358} {"train_loss": -22.11212730407715, "global_step": 112757, "epoch": 1358} {"train_loss": -22.579273223876953, "global_step": 112758, "epoch": 1358} {"train_loss": -22.508405685424805, "global_step": 112759, "epoch": 1358} {"train_loss": -22.447763442993164, "global_step": 112760, "epoch": 1358} {"train_loss": -22.37330436706543, "global_step": 112761, "epoch": 1358} {"train_loss": -22.14155387878418, "global_step": 112762, "epoch": 1358} {"train_loss": -22.572927474975586, "global_step": 112763, "epoch": 1358} {"train_loss": -22.507295608520508, "global_step": 112764, "epoch": 1358} {"train_loss": -21.906309127807617, "global_step": 112765, "epoch": 1358} {"train_loss": -22.408559799194336, "global_step": 112766, "epoch": 1358} {"train_loss": -22.0419864654541, "global_step": 112767, "epoch": 1358} {"train_loss": -22.430143356323242, "global_step": 112768, "epoch": 1358} {"train_loss": -22.187152862548828, "global_step": 112769, "epoch": 1358} {"train_loss": -22.212871551513672, "global_step": 112770, "epoch": 1358} {"train_loss": -22.275226593017578, "global_step": 112771, "epoch": 1358} {"train_loss": -22.228548049926758, "global_step": 112772, "epoch": 1358} {"train_loss": -22.221715927124023, "global_step": 112773, "epoch": 1358} {"train_loss": -22.317773818969727, "global_step": 112774, "epoch": 1358} {"train_loss": -22.5047550201416, "global_step": 112775, "epoch": 1358} {"train_loss": -22.42658042907715, "global_step": 112776, "epoch": 1358} {"train_loss": -22.63735008239746, "global_step": 112777, "epoch": 1358} {"train_loss": -22.394750595092773, "global_step": 112778, "epoch": 1358} {"train_loss": -22.783283233642578, "global_step": 112779, "epoch": 1358} {"train_loss": -22.43045425415039, "global_step": 112780, "epoch": 1358} {"train_loss": -22.54159927368164, "global_step": 112781, "epoch": 1358} {"train_loss": -22.36354637145996, "global_step": 112782, "epoch": 1358} {"train_loss": -22.218944549560547, "global_step": 112783, "epoch": 1358} {"train_loss": -22.391687393188477, "global_step": 112784, "epoch": 1358} {"train_loss": -22.014760971069336, "global_step": 112785, "epoch": 1358} {"train_loss": -22.226804733276367, "global_step": 112786, "epoch": 1358} {"train_loss": -22.59330177307129, "global_step": 112787, "epoch": 1358} {"train_loss": -22.3446102142334, "global_step": 112788, "epoch": 1358} {"train_loss": -22.014883041381836, "global_step": 112789, "epoch": 1358} {"train_loss": -22.433393478393555, "global_step": 112790, "epoch": 1358} {"train_loss": -22.5797061920166, "global_step": 112791, "epoch": 1358} {"train_loss": -22.38875961303711, "global_step": 112792, "epoch": 1358} {"train_loss": -22.464679718017578, "global_step": 112793, "epoch": 1358} {"train_loss": -22.267688751220703, "global_step": 112794, "epoch": 1358} {"train_loss": -22.310222625732422, "global_step": 112795, "epoch": 1358} {"train_loss": -22.264456438731, "global_step": 112796, "epoch": 1358, "val_loss": 6435801.0} {"train_loss": -21.830900192260742, "global_step": 112797, "epoch": 1359} {"train_loss": -22.076904296875, "global_step": 112798, "epoch": 1359} {"train_loss": -22.10398292541504, "global_step": 112799, "epoch": 1359} {"train_loss": -21.7879638671875, "global_step": 112800, "epoch": 1359} {"train_loss": -21.849246978759766, "global_step": 112801, "epoch": 1359} {"train_loss": -22.118694305419922, "global_step": 112802, "epoch": 1359} {"train_loss": -22.04066276550293, "global_step": 112803, "epoch": 1359} {"train_loss": -22.074087142944336, "global_step": 112804, "epoch": 1359} {"train_loss": -22.163496017456055, "global_step": 112805, "epoch": 1359} {"train_loss": -21.783100128173828, "global_step": 112806, "epoch": 1359} {"train_loss": -22.158605575561523, "global_step": 112807, "epoch": 1359} {"train_loss": -21.860782623291016, "global_step": 112808, "epoch": 1359} {"train_loss": -21.870859146118164, "global_step": 112809, "epoch": 1359} {"train_loss": -21.97121238708496, "global_step": 112810, "epoch": 1359} {"train_loss": -22.01771354675293, "global_step": 112811, "epoch": 1359} {"train_loss": -22.403671264648438, "global_step": 112812, "epoch": 1359} {"train_loss": -21.992481231689453, "global_step": 112813, "epoch": 1359} {"train_loss": -22.637596130371094, "global_step": 112814, "epoch": 1359} {"train_loss": -21.920974731445312, "global_step": 112815, "epoch": 1359} {"train_loss": -21.930036544799805, "global_step": 112816, "epoch": 1359} {"train_loss": -22.09432601928711, "global_step": 112817, "epoch": 1359} {"train_loss": -22.333768844604492, "global_step": 112818, "epoch": 1359} {"train_loss": -21.989572525024414, "global_step": 112819, "epoch": 1359} {"train_loss": -21.92728614807129, "global_step": 112820, "epoch": 1359} {"train_loss": -22.3644962310791, "global_step": 112821, "epoch": 1359} {"train_loss": -22.306751251220703, "global_step": 112822, "epoch": 1359} {"train_loss": -22.337682723999023, "global_step": 112823, "epoch": 1359} {"train_loss": -21.95481300354004, "global_step": 112824, "epoch": 1359} {"train_loss": -22.4982967376709, "global_step": 112825, "epoch": 1359} {"train_loss": -22.522708892822266, "global_step": 112826, "epoch": 1359} {"train_loss": -22.423940658569336, "global_step": 112827, "epoch": 1359} {"train_loss": -22.022554397583008, "global_step": 112828, "epoch": 1359} {"train_loss": -22.121585845947266, "global_step": 112829, "epoch": 1359} {"train_loss": -22.22705078125, "global_step": 112830, "epoch": 1359} {"train_loss": -22.44495964050293, "global_step": 112831, "epoch": 1359} {"train_loss": -22.12588119506836, "global_step": 112832, "epoch": 1359} {"train_loss": -22.18279266357422, "global_step": 112833, "epoch": 1359} {"train_loss": -22.500925064086914, "global_step": 112834, "epoch": 1359} {"train_loss": -22.371267318725586, "global_step": 112835, "epoch": 1359} {"train_loss": -22.24679946899414, "global_step": 112836, "epoch": 1359} {"train_loss": -22.200733184814453, "global_step": 112837, "epoch": 1359} {"train_loss": -22.524763107299805, "global_step": 112838, "epoch": 1359} {"train_loss": -22.20725440979004, "global_step": 112839, "epoch": 1359} {"train_loss": -22.056081771850586, "global_step": 112840, "epoch": 1359} {"train_loss": -22.387216567993164, "global_step": 112841, "epoch": 1359} {"train_loss": -22.495819091796875, "global_step": 112842, "epoch": 1359} {"train_loss": -22.151657104492188, "global_step": 112843, "epoch": 1359} {"train_loss": -22.531660079956055, "global_step": 112844, "epoch": 1359} {"train_loss": -22.43474769592285, "global_step": 112845, "epoch": 1359} {"train_loss": -22.266324996948242, "global_step": 112846, "epoch": 1359} {"train_loss": -22.36104393005371, "global_step": 112847, "epoch": 1359} {"train_loss": -22.287267684936523, "global_step": 112848, "epoch": 1359} {"train_loss": -22.265979766845703, "global_step": 112849, "epoch": 1359} {"train_loss": -22.39296531677246, "global_step": 112850, "epoch": 1359} {"train_loss": -22.464933395385742, "global_step": 112851, "epoch": 1359} {"train_loss": -22.557401657104492, "global_step": 112852, "epoch": 1359} {"train_loss": -22.221601486206055, "global_step": 112853, "epoch": 1359} {"train_loss": -22.302892684936523, "global_step": 112854, "epoch": 1359} {"train_loss": -22.517297744750977, "global_step": 112855, "epoch": 1359} {"train_loss": -22.171489715576172, "global_step": 112856, "epoch": 1359} {"train_loss": -22.4290828704834, "global_step": 112857, "epoch": 1359} {"train_loss": -22.30318832397461, "global_step": 112858, "epoch": 1359} {"train_loss": -22.35037612915039, "global_step": 112859, "epoch": 1359} {"train_loss": -22.20684242248535, "global_step": 112860, "epoch": 1359} {"train_loss": -22.312129974365234, "global_step": 112861, "epoch": 1359} {"train_loss": -21.856901168823242, "global_step": 112862, "epoch": 1359} {"train_loss": -22.317066192626953, "global_step": 112863, "epoch": 1359} {"train_loss": -22.635879516601562, "global_step": 112864, "epoch": 1359} {"train_loss": -22.300649642944336, "global_step": 112865, "epoch": 1359} {"train_loss": -22.195566177368164, "global_step": 112866, "epoch": 1359} {"train_loss": -22.350202560424805, "global_step": 112867, "epoch": 1359} {"train_loss": -22.416715621948242, "global_step": 112868, "epoch": 1359} {"train_loss": -22.359161376953125, "global_step": 112869, "epoch": 1359} {"train_loss": -22.093408584594727, "global_step": 112870, "epoch": 1359} {"train_loss": -22.230960845947266, "global_step": 112871, "epoch": 1359} {"train_loss": -22.381546020507812, "global_step": 112872, "epoch": 1359} {"train_loss": -22.0821533203125, "global_step": 112873, "epoch": 1359} {"train_loss": -22.008790969848633, "global_step": 112874, "epoch": 1359} {"train_loss": -21.8826904296875, "global_step": 112875, "epoch": 1359} {"train_loss": -22.442975997924805, "global_step": 112876, "epoch": 1359} {"train_loss": -22.567129135131836, "global_step": 112877, "epoch": 1359} {"train_loss": -22.37952423095703, "global_step": 112878, "epoch": 1359} {"train_loss": -22.213218757905157, "global_step": 112879, "epoch": 1359, "val_loss": 6166204.0} {"train_loss": -22.26097297668457, "global_step": 112880, "epoch": 1360} {"train_loss": -22.275117874145508, "global_step": 112881, "epoch": 1360} {"train_loss": -21.839725494384766, "global_step": 112882, "epoch": 1360} {"train_loss": -22.473758697509766, "global_step": 112883, "epoch": 1360} {"train_loss": -22.325956344604492, "global_step": 112884, "epoch": 1360} {"train_loss": -21.945165634155273, "global_step": 112885, "epoch": 1360} {"train_loss": -21.964561462402344, "global_step": 112886, "epoch": 1360} {"train_loss": -22.00528907775879, "global_step": 112887, "epoch": 1360} {"train_loss": -22.152118682861328, "global_step": 112888, "epoch": 1360} {"train_loss": -22.518110275268555, "global_step": 112889, "epoch": 1360} {"train_loss": -22.521854400634766, "global_step": 112890, "epoch": 1360} {"train_loss": -22.3226261138916, "global_step": 112891, "epoch": 1360} {"train_loss": -22.292234420776367, "global_step": 112892, "epoch": 1360} {"train_loss": -22.12531089782715, "global_step": 112893, "epoch": 1360} {"train_loss": -22.15144920349121, "global_step": 112894, "epoch": 1360} {"train_loss": -22.52737045288086, "global_step": 112895, "epoch": 1360} {"train_loss": -22.194345474243164, "global_step": 112896, "epoch": 1360} {"train_loss": -22.347023010253906, "global_step": 112897, "epoch": 1360} {"train_loss": -22.257665634155273, "global_step": 112898, "epoch": 1360} {"train_loss": -21.98512840270996, "global_step": 112899, "epoch": 1360} {"train_loss": -22.409650802612305, "global_step": 112900, "epoch": 1360} {"train_loss": -22.290632247924805, "global_step": 112901, "epoch": 1360} {"train_loss": -22.468952178955078, "global_step": 112902, "epoch": 1360} {"train_loss": -22.157917022705078, "global_step": 112903, "epoch": 1360} {"train_loss": -22.289899826049805, "global_step": 112904, "epoch": 1360} {"train_loss": -22.035139083862305, "global_step": 112905, "epoch": 1360} {"train_loss": -22.53403091430664, "global_step": 112906, "epoch": 1360} {"train_loss": -21.996469497680664, "global_step": 112907, "epoch": 1360} {"train_loss": -22.211353302001953, "global_step": 112908, "epoch": 1360} {"train_loss": -22.037946701049805, "global_step": 112909, "epoch": 1360} {"train_loss": -22.78742027282715, "global_step": 112910, "epoch": 1360} {"train_loss": -22.324857711791992, "global_step": 112911, "epoch": 1360} {"train_loss": -22.21474266052246, "global_step": 112912, "epoch": 1360} {"train_loss": -22.73784065246582, "global_step": 112913, "epoch": 1360} {"train_loss": -22.12137794494629, "global_step": 112914, "epoch": 1360} {"train_loss": -22.368473052978516, "global_step": 112915, "epoch": 1360} {"train_loss": -22.29001235961914, "global_step": 112916, "epoch": 1360} {"train_loss": -22.03580665588379, "global_step": 112917, "epoch": 1360} {"train_loss": -22.2716121673584, "global_step": 112918, "epoch": 1360} {"train_loss": -22.601865768432617, "global_step": 112919, "epoch": 1360} {"train_loss": -22.483259201049805, "global_step": 112920, "epoch": 1360} {"train_loss": -22.274024963378906, "global_step": 112921, "epoch": 1360} {"train_loss": -22.608980178833008, "global_step": 112922, "epoch": 1360} {"train_loss": -22.392133712768555, "global_step": 112923, "epoch": 1360} {"train_loss": -22.701343536376953, "global_step": 112924, "epoch": 1360} {"train_loss": -22.580419540405273, "global_step": 112925, "epoch": 1360} {"train_loss": -22.310819625854492, "global_step": 112926, "epoch": 1360} {"train_loss": -22.525955200195312, "global_step": 112927, "epoch": 1360} {"train_loss": -22.343921661376953, "global_step": 112928, "epoch": 1360} {"train_loss": -22.856401443481445, "global_step": 112929, "epoch": 1360} {"train_loss": -22.283071517944336, "global_step": 112930, "epoch": 1360} {"train_loss": -22.50497817993164, "global_step": 112931, "epoch": 1360} {"train_loss": -22.785755157470703, "global_step": 112932, "epoch": 1360} {"train_loss": -22.262928009033203, "global_step": 112933, "epoch": 1360} {"train_loss": -22.435443878173828, "global_step": 112934, "epoch": 1360} {"train_loss": -22.66100311279297, "global_step": 112935, "epoch": 1360} {"train_loss": -22.480010986328125, "global_step": 112936, "epoch": 1360} {"train_loss": -22.264768600463867, "global_step": 112937, "epoch": 1360} {"train_loss": -22.506261825561523, "global_step": 112938, "epoch": 1360} {"train_loss": -22.39896011352539, "global_step": 112939, "epoch": 1360} {"train_loss": -22.207508087158203, "global_step": 112940, "epoch": 1360} {"train_loss": -22.622156143188477, "global_step": 112941, "epoch": 1360} {"train_loss": -22.246353149414062, "global_step": 112942, "epoch": 1360} {"train_loss": -22.17306137084961, "global_step": 112943, "epoch": 1360} {"train_loss": -22.706586837768555, "global_step": 112944, "epoch": 1360} {"train_loss": -22.179601669311523, "global_step": 112945, "epoch": 1360} {"train_loss": -22.513141632080078, "global_step": 112946, "epoch": 1360} {"train_loss": -22.118558883666992, "global_step": 112947, "epoch": 1360} {"train_loss": -22.71009635925293, "global_step": 112948, "epoch": 1360} {"train_loss": -22.694425582885742, "global_step": 112949, "epoch": 1360} {"train_loss": -22.39126968383789, "global_step": 112950, "epoch": 1360} {"train_loss": -22.086145401000977, "global_step": 112951, "epoch": 1360} {"train_loss": -21.98481559753418, "global_step": 112952, "epoch": 1360} {"train_loss": -22.243284225463867, "global_step": 112953, "epoch": 1360} {"train_loss": -22.28973960876465, "global_step": 112954, "epoch": 1360} {"train_loss": -22.45896339416504, "global_step": 112955, "epoch": 1360} {"train_loss": -22.24814224243164, "global_step": 112956, "epoch": 1360} {"train_loss": -22.286327362060547, "global_step": 112957, "epoch": 1360} {"train_loss": -22.57541847229004, "global_step": 112958, "epoch": 1360} {"train_loss": -22.253625869750977, "global_step": 112959, "epoch": 1360} {"train_loss": -22.490407943725586, "global_step": 112960, "epoch": 1360} {"train_loss": -22.30951499938965, "global_step": 112961, "epoch": 1360} {"train_loss": -22.349309254841632, "global_step": 112962, "epoch": 1360, "val_loss": 6132028.5} {"train_loss": -22.01969337463379, "global_step": 112963, "epoch": 1361} {"train_loss": -22.16509246826172, "global_step": 112964, "epoch": 1361} {"train_loss": -22.275672912597656, "global_step": 112965, "epoch": 1361} {"train_loss": -21.58057403564453, "global_step": 112966, "epoch": 1361} {"train_loss": -22.01689338684082, "global_step": 112967, "epoch": 1361} {"train_loss": -22.766361236572266, "global_step": 112968, "epoch": 1361} {"train_loss": -22.4835147857666, "global_step": 112969, "epoch": 1361} {"train_loss": -22.197507858276367, "global_step": 112970, "epoch": 1361} {"train_loss": -22.185728073120117, "global_step": 112971, "epoch": 1361} {"train_loss": -21.818777084350586, "global_step": 112972, "epoch": 1361} {"train_loss": -22.18596839904785, "global_step": 112973, "epoch": 1361} {"train_loss": -22.199798583984375, "global_step": 112974, "epoch": 1361} {"train_loss": -22.493005752563477, "global_step": 112975, "epoch": 1361} {"train_loss": -22.348098754882812, "global_step": 112976, "epoch": 1361} {"train_loss": -22.35392189025879, "global_step": 112977, "epoch": 1361} {"train_loss": -21.93914222717285, "global_step": 112978, "epoch": 1361} {"train_loss": -22.18451690673828, "global_step": 112979, "epoch": 1361} {"train_loss": -22.3182373046875, "global_step": 112980, "epoch": 1361} {"train_loss": -22.135971069335938, "global_step": 112981, "epoch": 1361} {"train_loss": -22.66328239440918, "global_step": 112982, "epoch": 1361} {"train_loss": -22.45275115966797, "global_step": 112983, "epoch": 1361} {"train_loss": -22.527828216552734, "global_step": 112984, "epoch": 1361} {"train_loss": -22.334238052368164, "global_step": 112985, "epoch": 1361} {"train_loss": -22.305194854736328, "global_step": 112986, "epoch": 1361} {"train_loss": -22.46036720275879, "global_step": 112987, "epoch": 1361} {"train_loss": -22.448766708374023, "global_step": 112988, "epoch": 1361} {"train_loss": -22.101545333862305, "global_step": 112989, "epoch": 1361} {"train_loss": -22.35943603515625, "global_step": 112990, "epoch": 1361} {"train_loss": -22.119571685791016, "global_step": 112991, "epoch": 1361} {"train_loss": -22.043807983398438, "global_step": 112992, "epoch": 1361} {"train_loss": -22.4778995513916, "global_step": 112993, "epoch": 1361} {"train_loss": -22.204870223999023, "global_step": 112994, "epoch": 1361} {"train_loss": -22.010360717773438, "global_step": 112995, "epoch": 1361} {"train_loss": -22.40004539489746, "global_step": 112996, "epoch": 1361} {"train_loss": -22.11964988708496, "global_step": 112997, "epoch": 1361} {"train_loss": -22.21154022216797, "global_step": 112998, "epoch": 1361} {"train_loss": -21.919431686401367, "global_step": 112999, "epoch": 1361} {"train_loss": -21.991641998291016, "global_step": 113000, "epoch": 1361} {"train_loss": -22.23213768005371, "global_step": 113001, "epoch": 1361} {"train_loss": -22.290075302124023, "global_step": 113002, "epoch": 1361} {"train_loss": -21.994537353515625, "global_step": 113003, "epoch": 1361} {"train_loss": -22.493871688842773, "global_step": 113004, "epoch": 1361} {"train_loss": -22.154932022094727, "global_step": 113005, "epoch": 1361} {"train_loss": -22.392602920532227, "global_step": 113006, "epoch": 1361} {"train_loss": -22.15144920349121, "global_step": 113007, "epoch": 1361} {"train_loss": -22.47957420349121, "global_step": 113008, "epoch": 1361} {"train_loss": -22.21491813659668, "global_step": 113009, "epoch": 1361} {"train_loss": -22.438785552978516, "global_step": 113010, "epoch": 1361} {"train_loss": -22.665700912475586, "global_step": 113011, "epoch": 1361} {"train_loss": -22.386594772338867, "global_step": 113012, "epoch": 1361} {"train_loss": -22.409530639648438, "global_step": 113013, "epoch": 1361} {"train_loss": -22.103456497192383, "global_step": 113014, "epoch": 1361} {"train_loss": -22.520191192626953, "global_step": 113015, "epoch": 1361} {"train_loss": -22.507858276367188, "global_step": 113016, "epoch": 1361} {"train_loss": -22.271995544433594, "global_step": 113017, "epoch": 1361} {"train_loss": -22.134763717651367, "global_step": 113018, "epoch": 1361} {"train_loss": -22.120161056518555, "global_step": 113019, "epoch": 1361} {"train_loss": -22.0927677154541, "global_step": 113020, "epoch": 1361} {"train_loss": -22.107019424438477, "global_step": 113021, "epoch": 1361} {"train_loss": -22.064838409423828, "global_step": 113022, "epoch": 1361} {"train_loss": -22.334110260009766, "global_step": 113023, "epoch": 1361} {"train_loss": -22.444244384765625, "global_step": 113024, "epoch": 1361} {"train_loss": -22.909347534179688, "global_step": 113025, "epoch": 1361} {"train_loss": -22.289165496826172, "global_step": 113026, "epoch": 1361} {"train_loss": -22.06390953063965, "global_step": 113027, "epoch": 1361} {"train_loss": -22.3122615814209, "global_step": 113028, "epoch": 1361} {"train_loss": -22.81978416442871, "global_step": 113029, "epoch": 1361} {"train_loss": -22.590702056884766, "global_step": 113030, "epoch": 1361} {"train_loss": -22.009973526000977, "global_step": 113031, "epoch": 1361} {"train_loss": -22.41510581970215, "global_step": 113032, "epoch": 1361} {"train_loss": -22.37545394897461, "global_step": 113033, "epoch": 1361} {"train_loss": -22.466299057006836, "global_step": 113034, "epoch": 1361} {"train_loss": -22.3897705078125, "global_step": 113035, "epoch": 1361} {"train_loss": -22.531591415405273, "global_step": 113036, "epoch": 1361} {"train_loss": -22.396413803100586, "global_step": 113037, "epoch": 1361} {"train_loss": -22.554101943969727, "global_step": 113038, "epoch": 1361} {"train_loss": -22.334829330444336, "global_step": 113039, "epoch": 1361} {"train_loss": -22.38309097290039, "global_step": 113040, "epoch": 1361} {"train_loss": -22.182077407836914, "global_step": 113041, "epoch": 1361} {"train_loss": -22.38266944885254, "global_step": 113042, "epoch": 1361} {"train_loss": -22.256938934326172, "global_step": 113043, "epoch": 1361} {"train_loss": -22.22890281677246, "global_step": 113044, "epoch": 1361} {"train_loss": -22.301774220294263, "global_step": 113045, "epoch": 1361, "val_loss": 6179954.0} {"train_loss": -21.112991333007812, "global_step": 113046, "epoch": 1362} {"train_loss": -20.099050521850586, "global_step": 113047, "epoch": 1362} {"train_loss": -21.07942771911621, "global_step": 113048, "epoch": 1362} {"train_loss": -21.808399200439453, "global_step": 113049, "epoch": 1362} {"train_loss": -21.20616340637207, "global_step": 113050, "epoch": 1362} {"train_loss": -22.101566314697266, "global_step": 113051, "epoch": 1362} {"train_loss": -21.5851993560791, "global_step": 113052, "epoch": 1362} {"train_loss": -21.97049903869629, "global_step": 113053, "epoch": 1362} {"train_loss": -21.56777000427246, "global_step": 113054, "epoch": 1362} {"train_loss": -22.05396842956543, "global_step": 113055, "epoch": 1362} {"train_loss": -21.697341918945312, "global_step": 113056, "epoch": 1362} {"train_loss": -21.78470230102539, "global_step": 113057, "epoch": 1362} {"train_loss": -22.187992095947266, "global_step": 113058, "epoch": 1362} {"train_loss": -21.835542678833008, "global_step": 113059, "epoch": 1362} {"train_loss": -22.09572410583496, "global_step": 113060, "epoch": 1362} {"train_loss": -21.8166446685791, "global_step": 113061, "epoch": 1362} {"train_loss": -22.090728759765625, "global_step": 113062, "epoch": 1362} {"train_loss": -21.997060775756836, "global_step": 113063, "epoch": 1362} {"train_loss": -22.178123474121094, "global_step": 113064, "epoch": 1362} {"train_loss": -22.043920516967773, "global_step": 113065, "epoch": 1362} {"train_loss": -22.031057357788086, "global_step": 113066, "epoch": 1362} {"train_loss": -22.090578079223633, "global_step": 113067, "epoch": 1362} {"train_loss": -22.000350952148438, "global_step": 113068, "epoch": 1362} {"train_loss": -22.1364803314209, "global_step": 113069, "epoch": 1362} {"train_loss": -22.288000106811523, "global_step": 113070, "epoch": 1362} {"train_loss": -22.27423667907715, "global_step": 113071, "epoch": 1362} {"train_loss": -22.283483505249023, "global_step": 113072, "epoch": 1362} {"train_loss": -22.045698165893555, "global_step": 113073, "epoch": 1362} {"train_loss": -22.2900390625, "global_step": 113074, "epoch": 1362} {"train_loss": -22.22395896911621, "global_step": 113075, "epoch": 1362} {"train_loss": -22.054227828979492, "global_step": 113076, "epoch": 1362} {"train_loss": -22.09879493713379, "global_step": 113077, "epoch": 1362} {"train_loss": -22.0482120513916, "global_step": 113078, "epoch": 1362} {"train_loss": -22.42148780822754, "global_step": 113079, "epoch": 1362} {"train_loss": -22.575712203979492, "global_step": 113080, "epoch": 1362} {"train_loss": -22.216520309448242, "global_step": 113081, "epoch": 1362} {"train_loss": -22.443641662597656, "global_step": 113082, "epoch": 1362} {"train_loss": -22.52412986755371, "global_step": 113083, "epoch": 1362} {"train_loss": -22.486467361450195, "global_step": 113084, "epoch": 1362} {"train_loss": -22.377275466918945, "global_step": 113085, "epoch": 1362} {"train_loss": -22.17556381225586, "global_step": 113086, "epoch": 1362} {"train_loss": -22.187610626220703, "global_step": 113087, "epoch": 1362} {"train_loss": -22.5402774810791, "global_step": 113088, "epoch": 1362} {"train_loss": -22.312637329101562, "global_step": 113089, "epoch": 1362} {"train_loss": -22.773681640625, "global_step": 113090, "epoch": 1362} {"train_loss": -22.269943237304688, "global_step": 113091, "epoch": 1362} {"train_loss": -22.336172103881836, "global_step": 113092, "epoch": 1362} {"train_loss": -22.24710464477539, "global_step": 113093, "epoch": 1362} {"train_loss": -22.364990234375, "global_step": 113094, "epoch": 1362} {"train_loss": -22.381269454956055, "global_step": 113095, "epoch": 1362} {"train_loss": -22.642187118530273, "global_step": 113096, "epoch": 1362} {"train_loss": -22.268957138061523, "global_step": 113097, "epoch": 1362} {"train_loss": -22.290576934814453, "global_step": 113098, "epoch": 1362} {"train_loss": -22.42728042602539, "global_step": 113099, "epoch": 1362} {"train_loss": -22.53608512878418, "global_step": 113100, "epoch": 1362} {"train_loss": -22.15671157836914, "global_step": 113101, "epoch": 1362} {"train_loss": -21.946496963500977, "global_step": 113102, "epoch": 1362} {"train_loss": -22.181894302368164, "global_step": 113103, "epoch": 1362} {"train_loss": -22.32441520690918, "global_step": 113104, "epoch": 1362} {"train_loss": -22.433948516845703, "global_step": 113105, "epoch": 1362} {"train_loss": -22.557552337646484, "global_step": 113106, "epoch": 1362} {"train_loss": -22.376802444458008, "global_step": 113107, "epoch": 1362} {"train_loss": -22.463605880737305, "global_step": 113108, "epoch": 1362} {"train_loss": -22.82579803466797, "global_step": 113109, "epoch": 1362} {"train_loss": -22.287399291992188, "global_step": 113110, "epoch": 1362} {"train_loss": -22.311147689819336, "global_step": 113111, "epoch": 1362} {"train_loss": -22.2890567779541, "global_step": 113112, "epoch": 1362} {"train_loss": -22.080848693847656, "global_step": 113113, "epoch": 1362} {"train_loss": -22.351490020751953, "global_step": 113114, "epoch": 1362} {"train_loss": -22.584341049194336, "global_step": 113115, "epoch": 1362} {"train_loss": -22.220916748046875, "global_step": 113116, "epoch": 1362} {"train_loss": -22.37577247619629, "global_step": 113117, "epoch": 1362} {"train_loss": -22.061933517456055, "global_step": 113118, "epoch": 1362} {"train_loss": -22.05116081237793, "global_step": 113119, "epoch": 1362} {"train_loss": -22.325220108032227, "global_step": 113120, "epoch": 1362} {"train_loss": -22.09256935119629, "global_step": 113121, "epoch": 1362} {"train_loss": -22.332927703857422, "global_step": 113122, "epoch": 1362} {"train_loss": -22.2769832611084, "global_step": 113123, "epoch": 1362} {"train_loss": -22.349445343017578, "global_step": 113124, "epoch": 1362} {"train_loss": -22.54780387878418, "global_step": 113125, "epoch": 1362} {"train_loss": -22.625858306884766, "global_step": 113126, "epoch": 1362} {"train_loss": -22.197479248046875, "global_step": 113127, "epoch": 1362} {"train_loss": -22.17924226048481, "global_step": 113128, "epoch": 1362, "val_loss": 6178015.0} {"train_loss": -22.014829635620117, "global_step": 113129, "epoch": 1363} {"train_loss": -22.3104305267334, "global_step": 113130, "epoch": 1363} {"train_loss": -22.131107330322266, "global_step": 113131, "epoch": 1363} {"train_loss": -22.113262176513672, "global_step": 113132, "epoch": 1363} {"train_loss": -22.216154098510742, "global_step": 113133, "epoch": 1363} {"train_loss": -21.85384178161621, "global_step": 113134, "epoch": 1363} {"train_loss": -22.578556060791016, "global_step": 113135, "epoch": 1363} {"train_loss": -22.363693237304688, "global_step": 113136, "epoch": 1363} {"train_loss": -22.49778938293457, "global_step": 113137, "epoch": 1363} {"train_loss": -22.38935661315918, "global_step": 113138, "epoch": 1363} {"train_loss": -22.133216857910156, "global_step": 113139, "epoch": 1363} {"train_loss": -22.413541793823242, "global_step": 113140, "epoch": 1363} {"train_loss": -22.231130599975586, "global_step": 113141, "epoch": 1363} {"train_loss": -22.260839462280273, "global_step": 113142, "epoch": 1363} {"train_loss": -21.95115852355957, "global_step": 113143, "epoch": 1363} {"train_loss": -21.58384895324707, "global_step": 113144, "epoch": 1363} {"train_loss": -22.538654327392578, "global_step": 113145, "epoch": 1363} {"train_loss": -22.431116104125977, "global_step": 113146, "epoch": 1363} {"train_loss": -22.3687686920166, "global_step": 113147, "epoch": 1363} {"train_loss": -22.35762596130371, "global_step": 113148, "epoch": 1363} {"train_loss": -22.2981014251709, "global_step": 113149, "epoch": 1363} {"train_loss": -22.62905502319336, "global_step": 113150, "epoch": 1363} {"train_loss": -22.23133659362793, "global_step": 113151, "epoch": 1363} {"train_loss": -22.455371856689453, "global_step": 113152, "epoch": 1363} {"train_loss": -22.276493072509766, "global_step": 113153, "epoch": 1363} {"train_loss": -22.336402893066406, "global_step": 113154, "epoch": 1363} {"train_loss": -22.165061950683594, "global_step": 113155, "epoch": 1363} {"train_loss": -22.563257217407227, "global_step": 113156, "epoch": 1363} {"train_loss": -21.88819694519043, "global_step": 113157, "epoch": 1363} {"train_loss": -21.808347702026367, "global_step": 113158, "epoch": 1363} {"train_loss": -22.232484817504883, "global_step": 113159, "epoch": 1363} {"train_loss": -22.446725845336914, "global_step": 113160, "epoch": 1363} {"train_loss": -22.710813522338867, "global_step": 113161, "epoch": 1363} {"train_loss": -22.600004196166992, "global_step": 113162, "epoch": 1363} {"train_loss": -22.288131713867188, "global_step": 113163, "epoch": 1363} {"train_loss": -22.350576400756836, "global_step": 113164, "epoch": 1363} {"train_loss": -22.002792358398438, "global_step": 113165, "epoch": 1363} {"train_loss": -22.172929763793945, "global_step": 113166, "epoch": 1363} {"train_loss": -22.54234504699707, "global_step": 113167, "epoch": 1363} {"train_loss": -22.21930694580078, "global_step": 113168, "epoch": 1363} {"train_loss": -22.22268295288086, "global_step": 113169, "epoch": 1363} {"train_loss": -22.173307418823242, "global_step": 113170, "epoch": 1363} {"train_loss": -22.336389541625977, "global_step": 113171, "epoch": 1363} {"train_loss": -22.040246963500977, "global_step": 113172, "epoch": 1363} {"train_loss": -22.22401237487793, "global_step": 113173, "epoch": 1363} {"train_loss": -22.457233428955078, "global_step": 113174, "epoch": 1363} {"train_loss": -22.4130916595459, "global_step": 113175, "epoch": 1363} {"train_loss": -21.928585052490234, "global_step": 113176, "epoch": 1363} {"train_loss": -22.302810668945312, "global_step": 113177, "epoch": 1363} {"train_loss": -22.112686157226562, "global_step": 113178, "epoch": 1363} {"train_loss": -22.306180953979492, "global_step": 113179, "epoch": 1363} {"train_loss": -22.29131507873535, "global_step": 113180, "epoch": 1363} {"train_loss": -22.16335105895996, "global_step": 113181, "epoch": 1363} {"train_loss": -22.20670509338379, "global_step": 113182, "epoch": 1363} {"train_loss": -21.79127311706543, "global_step": 113183, "epoch": 1363} {"train_loss": -22.4241886138916, "global_step": 113184, "epoch": 1363} {"train_loss": -22.7717227935791, "global_step": 113185, "epoch": 1363} {"train_loss": -22.143369674682617, "global_step": 113186, "epoch": 1363} {"train_loss": -22.22942543029785, "global_step": 113187, "epoch": 1363} {"train_loss": -22.457361221313477, "global_step": 113188, "epoch": 1363} {"train_loss": -22.669050216674805, "global_step": 113189, "epoch": 1363} {"train_loss": -22.147380828857422, "global_step": 113190, "epoch": 1363} {"train_loss": -22.181570053100586, "global_step": 113191, "epoch": 1363} {"train_loss": -22.433948516845703, "global_step": 113192, "epoch": 1363} {"train_loss": -22.20857048034668, "global_step": 113193, "epoch": 1363} {"train_loss": -22.386947631835938, "global_step": 113194, "epoch": 1363} {"train_loss": -22.376596450805664, "global_step": 113195, "epoch": 1363} {"train_loss": -22.293991088867188, "global_step": 113196, "epoch": 1363} {"train_loss": -22.48238182067871, "global_step": 113197, "epoch": 1363} {"train_loss": -22.320661544799805, "global_step": 113198, "epoch": 1363} {"train_loss": -22.68094825744629, "global_step": 113199, "epoch": 1363} {"train_loss": -22.488149642944336, "global_step": 113200, "epoch": 1363} {"train_loss": -22.586023330688477, "global_step": 113201, "epoch": 1363} {"train_loss": -22.135923385620117, "global_step": 113202, "epoch": 1363} {"train_loss": -22.372522354125977, "global_step": 113203, "epoch": 1363} {"train_loss": -22.355749130249023, "global_step": 113204, "epoch": 1363} {"train_loss": -22.515594482421875, "global_step": 113205, "epoch": 1363} {"train_loss": -22.52095603942871, "global_step": 113206, "epoch": 1363} {"train_loss": -22.14611053466797, "global_step": 113207, "epoch": 1363} {"train_loss": -22.64768409729004, "global_step": 113208, "epoch": 1363} {"train_loss": -22.14164161682129, "global_step": 113209, "epoch": 1363} {"train_loss": -22.27320671081543, "global_step": 113210, "epoch": 1363} {"train_loss": -22.314870076007153, "global_step": 113211, "epoch": 1363, "val_loss": 6177102.5} {"train_loss": -21.715503692626953, "global_step": 113212, "epoch": 1364} {"train_loss": -21.830984115600586, "global_step": 113213, "epoch": 1364} {"train_loss": -21.731456756591797, "global_step": 113214, "epoch": 1364} {"train_loss": -21.893224716186523, "global_step": 113215, "epoch": 1364} {"train_loss": -22.173431396484375, "global_step": 113216, "epoch": 1364} {"train_loss": -21.463504791259766, "global_step": 113217, "epoch": 1364} {"train_loss": -22.041412353515625, "global_step": 113218, "epoch": 1364} {"train_loss": -21.522384643554688, "global_step": 113219, "epoch": 1364} {"train_loss": -21.91573143005371, "global_step": 113220, "epoch": 1364} {"train_loss": -21.716266632080078, "global_step": 113221, "epoch": 1364} {"train_loss": -22.02174949645996, "global_step": 113222, "epoch": 1364} {"train_loss": -21.686819076538086, "global_step": 113223, "epoch": 1364} {"train_loss": -21.922109603881836, "global_step": 113224, "epoch": 1364} {"train_loss": -21.932554244995117, "global_step": 113225, "epoch": 1364} {"train_loss": -21.698972702026367, "global_step": 113226, "epoch": 1364} {"train_loss": -21.69068717956543, "global_step": 113227, "epoch": 1364} {"train_loss": -22.25684928894043, "global_step": 113228, "epoch": 1364} {"train_loss": -22.006772994995117, "global_step": 113229, "epoch": 1364} {"train_loss": -22.28974723815918, "global_step": 113230, "epoch": 1364} {"train_loss": -22.012601852416992, "global_step": 113231, "epoch": 1364} {"train_loss": -22.447994232177734, "global_step": 113232, "epoch": 1364} {"train_loss": -22.10789680480957, "global_step": 113233, "epoch": 1364} {"train_loss": -22.064441680908203, "global_step": 113234, "epoch": 1364} {"train_loss": -22.166790008544922, "global_step": 113235, "epoch": 1364} {"train_loss": -22.194828033447266, "global_step": 113236, "epoch": 1364} {"train_loss": -22.303091049194336, "global_step": 113237, "epoch": 1364} {"train_loss": -22.24207878112793, "global_step": 113238, "epoch": 1364} {"train_loss": -21.713117599487305, "global_step": 113239, "epoch": 1364} {"train_loss": -22.209056854248047, "global_step": 113240, "epoch": 1364} {"train_loss": -22.175607681274414, "global_step": 113241, "epoch": 1364} {"train_loss": -22.196514129638672, "global_step": 113242, "epoch": 1364} {"train_loss": -22.177106857299805, "global_step": 113243, "epoch": 1364} {"train_loss": -22.087234497070312, "global_step": 113244, "epoch": 1364} {"train_loss": -22.39052391052246, "global_step": 113245, "epoch": 1364} {"train_loss": -22.614938735961914, "global_step": 113246, "epoch": 1364} {"train_loss": -22.28520393371582, "global_step": 113247, "epoch": 1364} {"train_loss": -22.179412841796875, "global_step": 113248, "epoch": 1364} {"train_loss": -22.562440872192383, "global_step": 113249, "epoch": 1364} {"train_loss": -22.61115837097168, "global_step": 113250, "epoch": 1364} {"train_loss": -22.584346771240234, "global_step": 113251, "epoch": 1364} {"train_loss": -22.7138729095459, "global_step": 113252, "epoch": 1364} {"train_loss": -22.317466735839844, "global_step": 113253, "epoch": 1364} {"train_loss": -22.398723602294922, "global_step": 113254, "epoch": 1364} {"train_loss": -22.521020889282227, "global_step": 113255, "epoch": 1364} {"train_loss": -22.204975128173828, "global_step": 113256, "epoch": 1364} {"train_loss": -22.163724899291992, "global_step": 113257, "epoch": 1364} {"train_loss": -22.20985221862793, "global_step": 113258, "epoch": 1364} {"train_loss": -22.260984420776367, "global_step": 113259, "epoch": 1364} {"train_loss": -22.1428279876709, "global_step": 113260, "epoch": 1364} {"train_loss": -22.27156639099121, "global_step": 113261, "epoch": 1364} {"train_loss": -22.536041259765625, "global_step": 113262, "epoch": 1364} {"train_loss": -22.324996948242188, "global_step": 113263, "epoch": 1364} {"train_loss": -22.505430221557617, "global_step": 113264, "epoch": 1364} {"train_loss": -22.25450325012207, "global_step": 113265, "epoch": 1364} {"train_loss": -22.265655517578125, "global_step": 113266, "epoch": 1364} {"train_loss": -22.117490768432617, "global_step": 113267, "epoch": 1364} {"train_loss": -22.36786460876465, "global_step": 113268, "epoch": 1364} {"train_loss": -22.294736862182617, "global_step": 113269, "epoch": 1364} {"train_loss": -22.359525680541992, "global_step": 113270, "epoch": 1364} {"train_loss": -22.222702026367188, "global_step": 113271, "epoch": 1364} {"train_loss": -22.215045928955078, "global_step": 113272, "epoch": 1364} {"train_loss": -22.536977767944336, "global_step": 113273, "epoch": 1364} {"train_loss": -22.432706832885742, "global_step": 113274, "epoch": 1364} {"train_loss": -22.19182777404785, "global_step": 113275, "epoch": 1364} {"train_loss": -22.35069465637207, "global_step": 113276, "epoch": 1364} {"train_loss": -22.18012809753418, "global_step": 113277, "epoch": 1364} {"train_loss": -22.199186325073242, "global_step": 113278, "epoch": 1364} {"train_loss": -22.6136531829834, "global_step": 113279, "epoch": 1364} {"train_loss": -22.246288299560547, "global_step": 113280, "epoch": 1364} {"train_loss": -22.427305221557617, "global_step": 113281, "epoch": 1364} {"train_loss": -22.6656494140625, "global_step": 113282, "epoch": 1364} {"train_loss": -22.600046157836914, "global_step": 113283, "epoch": 1364} {"train_loss": -21.88007926940918, "global_step": 113284, "epoch": 1364} {"train_loss": -22.31406021118164, "global_step": 113285, "epoch": 1364} {"train_loss": -22.285215377807617, "global_step": 113286, "epoch": 1364} {"train_loss": -22.25411033630371, "global_step": 113287, "epoch": 1364} {"train_loss": -22.460895538330078, "global_step": 113288, "epoch": 1364} {"train_loss": -22.540494918823242, "global_step": 113289, "epoch": 1364} {"train_loss": -22.409038543701172, "global_step": 113290, "epoch": 1364} {"train_loss": -22.130786895751953, "global_step": 113291, "epoch": 1364} {"train_loss": -22.945453643798828, "global_step": 113292, "epoch": 1364} {"train_loss": -22.499723434448242, "global_step": 113293, "epoch": 1364} {"train_loss": -22.215272099138744, "global_step": 113294, "epoch": 1364, "val_loss": 6061929.0} {"train_loss": -22.056421279907227, "global_step": 113295, "epoch": 1365} {"train_loss": -21.730072021484375, "global_step": 113296, "epoch": 1365} {"train_loss": -21.833520889282227, "global_step": 113297, "epoch": 1365} {"train_loss": -22.308279037475586, "global_step": 113298, "epoch": 1365} {"train_loss": -21.324039459228516, "global_step": 113299, "epoch": 1365} {"train_loss": -22.0164737701416, "global_step": 113300, "epoch": 1365} {"train_loss": -22.28327751159668, "global_step": 113301, "epoch": 1365} {"train_loss": -22.212039947509766, "global_step": 113302, "epoch": 1365} {"train_loss": -22.19289207458496, "global_step": 113303, "epoch": 1365} {"train_loss": -21.86598014831543, "global_step": 113304, "epoch": 1365} {"train_loss": -22.231538772583008, "global_step": 113305, "epoch": 1365} {"train_loss": -22.302114486694336, "global_step": 113306, "epoch": 1365} {"train_loss": -22.28822135925293, "global_step": 113307, "epoch": 1365} {"train_loss": -21.988506317138672, "global_step": 113308, "epoch": 1365} {"train_loss": -22.01249122619629, "global_step": 113309, "epoch": 1365} {"train_loss": -22.05169105529785, "global_step": 113310, "epoch": 1365} {"train_loss": -22.115631103515625, "global_step": 113311, "epoch": 1365} {"train_loss": -22.29436683654785, "global_step": 113312, "epoch": 1365} {"train_loss": -21.956762313842773, "global_step": 113313, "epoch": 1365} {"train_loss": -22.19868278503418, "global_step": 113314, "epoch": 1365} {"train_loss": -22.341169357299805, "global_step": 113315, "epoch": 1365} {"train_loss": -21.585721969604492, "global_step": 113316, "epoch": 1365} {"train_loss": -22.32315444946289, "global_step": 113317, "epoch": 1365} {"train_loss": -22.491567611694336, "global_step": 113318, "epoch": 1365} {"train_loss": -22.252355575561523, "global_step": 113319, "epoch": 1365} {"train_loss": -22.377029418945312, "global_step": 113320, "epoch": 1365} {"train_loss": -22.097381591796875, "global_step": 113321, "epoch": 1365} {"train_loss": -22.370956420898438, "global_step": 113322, "epoch": 1365} {"train_loss": -22.64145851135254, "global_step": 113323, "epoch": 1365} {"train_loss": -22.464521408081055, "global_step": 113324, "epoch": 1365} {"train_loss": -22.453237533569336, "global_step": 113325, "epoch": 1365} {"train_loss": -22.639902114868164, "global_step": 113326, "epoch": 1365} {"train_loss": -22.382102966308594, "global_step": 113327, "epoch": 1365} {"train_loss": -22.26543617248535, "global_step": 113328, "epoch": 1365} {"train_loss": -22.555837631225586, "global_step": 113329, "epoch": 1365} {"train_loss": -22.462146759033203, "global_step": 113330, "epoch": 1365} {"train_loss": -22.29386329650879, "global_step": 113331, "epoch": 1365} {"train_loss": -22.267786026000977, "global_step": 113332, "epoch": 1365} {"train_loss": -22.233692169189453, "global_step": 113333, "epoch": 1365} {"train_loss": -21.981037139892578, "global_step": 113334, "epoch": 1365} {"train_loss": -22.567974090576172, "global_step": 113335, "epoch": 1365} {"train_loss": -22.40632438659668, "global_step": 113336, "epoch": 1365} {"train_loss": -22.087390899658203, "global_step": 113337, "epoch": 1365} {"train_loss": -22.422311782836914, "global_step": 113338, "epoch": 1365} {"train_loss": -22.49355697631836, "global_step": 113339, "epoch": 1365} {"train_loss": -22.613357543945312, "global_step": 113340, "epoch": 1365} {"train_loss": -22.587644577026367, "global_step": 113341, "epoch": 1365} {"train_loss": -21.977252960205078, "global_step": 113342, "epoch": 1365} {"train_loss": -22.38376235961914, "global_step": 113343, "epoch": 1365} {"train_loss": -22.13807487487793, "global_step": 113344, "epoch": 1365} {"train_loss": -22.451404571533203, "global_step": 113345, "epoch": 1365} {"train_loss": -22.312047958374023, "global_step": 113346, "epoch": 1365} {"train_loss": -22.123790740966797, "global_step": 113347, "epoch": 1365} {"train_loss": -22.262014389038086, "global_step": 113348, "epoch": 1365} {"train_loss": -22.19070816040039, "global_step": 113349, "epoch": 1365} {"train_loss": -22.258512496948242, "global_step": 113350, "epoch": 1365} {"train_loss": -22.196210861206055, "global_step": 113351, "epoch": 1365} {"train_loss": -22.1851806640625, "global_step": 113352, "epoch": 1365} {"train_loss": -22.078020095825195, "global_step": 113353, "epoch": 1365} {"train_loss": -22.343637466430664, "global_step": 113354, "epoch": 1365} {"train_loss": -22.29427719116211, "global_step": 113355, "epoch": 1365} {"train_loss": -21.762683868408203, "global_step": 113356, "epoch": 1365} {"train_loss": -21.96847915649414, "global_step": 113357, "epoch": 1365} {"train_loss": -22.10580062866211, "global_step": 113358, "epoch": 1365} {"train_loss": -22.070850372314453, "global_step": 113359, "epoch": 1365} {"train_loss": -22.48590850830078, "global_step": 113360, "epoch": 1365} {"train_loss": -22.53061294555664, "global_step": 113361, "epoch": 1365} {"train_loss": -22.09653663635254, "global_step": 113362, "epoch": 1365} {"train_loss": -22.181427001953125, "global_step": 113363, "epoch": 1365} {"train_loss": -22.109403610229492, "global_step": 113364, "epoch": 1365} {"train_loss": -22.439987182617188, "global_step": 113365, "epoch": 1365} {"train_loss": -22.24995994567871, "global_step": 113366, "epoch": 1365} {"train_loss": -22.348419189453125, "global_step": 113367, "epoch": 1365} {"train_loss": -22.134262084960938, "global_step": 113368, "epoch": 1365} {"train_loss": -22.484132766723633, "global_step": 113369, "epoch": 1365} {"train_loss": -22.438291549682617, "global_step": 113370, "epoch": 1365} {"train_loss": -21.92094612121582, "global_step": 113371, "epoch": 1365} {"train_loss": -22.103900909423828, "global_step": 113372, "epoch": 1365} {"train_loss": -22.341367721557617, "global_step": 113373, "epoch": 1365} {"train_loss": -22.38288688659668, "global_step": 113374, "epoch": 1365} {"train_loss": -22.097333908081055, "global_step": 113375, "epoch": 1365} {"train_loss": -22.386302947998047, "global_step": 113376, "epoch": 1365} {"train_loss": -22.23046256835202, "global_step": 113377, "epoch": 1365, "val_loss": 6205160.0} {"train_loss": -22.059980392456055, "global_step": 113378, "epoch": 1366} {"train_loss": -22.54652976989746, "global_step": 113379, "epoch": 1366} {"train_loss": -22.07078742980957, "global_step": 113380, "epoch": 1366} {"train_loss": -22.219228744506836, "global_step": 113381, "epoch": 1366} {"train_loss": -22.193979263305664, "global_step": 113382, "epoch": 1366} {"train_loss": -22.438804626464844, "global_step": 113383, "epoch": 1366} {"train_loss": -22.46097183227539, "global_step": 113384, "epoch": 1366} {"train_loss": -22.21475601196289, "global_step": 113385, "epoch": 1366} {"train_loss": -22.079893112182617, "global_step": 113386, "epoch": 1366} {"train_loss": -22.112024307250977, "global_step": 113387, "epoch": 1366} {"train_loss": -22.48018455505371, "global_step": 113388, "epoch": 1366} {"train_loss": -22.041473388671875, "global_step": 113389, "epoch": 1366} {"train_loss": -22.204578399658203, "global_step": 113390, "epoch": 1366} {"train_loss": -22.119400024414062, "global_step": 113391, "epoch": 1366} {"train_loss": -22.375696182250977, "global_step": 113392, "epoch": 1366} {"train_loss": -22.258737564086914, "global_step": 113393, "epoch": 1366} {"train_loss": -22.205419540405273, "global_step": 113394, "epoch": 1366} {"train_loss": -22.348737716674805, "global_step": 113395, "epoch": 1366} {"train_loss": -22.323280334472656, "global_step": 113396, "epoch": 1366} {"train_loss": -22.104284286499023, "global_step": 113397, "epoch": 1366} {"train_loss": -22.186779022216797, "global_step": 113398, "epoch": 1366} {"train_loss": -22.14444923400879, "global_step": 113399, "epoch": 1366} {"train_loss": -22.526168823242188, "global_step": 113400, "epoch": 1366} {"train_loss": -22.2786922454834, "global_step": 113401, "epoch": 1366} {"train_loss": -22.581405639648438, "global_step": 113402, "epoch": 1366} {"train_loss": -22.5811710357666, "global_step": 113403, "epoch": 1366} {"train_loss": -22.491968154907227, "global_step": 113404, "epoch": 1366} {"train_loss": -22.72684097290039, "global_step": 113405, "epoch": 1366} {"train_loss": -22.052648544311523, "global_step": 113406, "epoch": 1366} {"train_loss": -22.18310546875, "global_step": 113407, "epoch": 1366} {"train_loss": -22.103622436523438, "global_step": 113408, "epoch": 1366} {"train_loss": -22.387174606323242, "global_step": 113409, "epoch": 1366} {"train_loss": -22.50618553161621, "global_step": 113410, "epoch": 1366} {"train_loss": -22.37999725341797, "global_step": 113411, "epoch": 1366} {"train_loss": -22.309743881225586, "global_step": 113412, "epoch": 1366} {"train_loss": -22.490121841430664, "global_step": 113413, "epoch": 1366} {"train_loss": -22.604650497436523, "global_step": 113414, "epoch": 1366} {"train_loss": -22.246641159057617, "global_step": 113415, "epoch": 1366} {"train_loss": -22.647260665893555, "global_step": 113416, "epoch": 1366} {"train_loss": -22.192411422729492, "global_step": 113417, "epoch": 1366} {"train_loss": -22.327749252319336, "global_step": 113418, "epoch": 1366} {"train_loss": -22.351749420166016, "global_step": 113419, "epoch": 1366} {"train_loss": -22.54408073425293, "global_step": 113420, "epoch": 1366} {"train_loss": -22.457178115844727, "global_step": 113421, "epoch": 1366} {"train_loss": -22.477670669555664, "global_step": 113422, "epoch": 1366} {"train_loss": -22.08819580078125, "global_step": 113423, "epoch": 1366} {"train_loss": -22.317371368408203, "global_step": 113424, "epoch": 1366} {"train_loss": -22.489225387573242, "global_step": 113425, "epoch": 1366} {"train_loss": -22.293813705444336, "global_step": 113426, "epoch": 1366} {"train_loss": -22.03790855407715, "global_step": 113427, "epoch": 1366} {"train_loss": -22.44075584411621, "global_step": 113428, "epoch": 1366} {"train_loss": -22.1796817779541, "global_step": 113429, "epoch": 1366} {"train_loss": -22.1931095123291, "global_step": 113430, "epoch": 1366} {"train_loss": -22.099016189575195, "global_step": 113431, "epoch": 1366} {"train_loss": -22.538244247436523, "global_step": 113432, "epoch": 1366} {"train_loss": -22.376083374023438, "global_step": 113433, "epoch": 1366} {"train_loss": -21.821975708007812, "global_step": 113434, "epoch": 1366} {"train_loss": -22.3317928314209, "global_step": 113435, "epoch": 1366} {"train_loss": -22.368030548095703, "global_step": 113436, "epoch": 1366} {"train_loss": -22.12230110168457, "global_step": 113437, "epoch": 1366} {"train_loss": -22.38179588317871, "global_step": 113438, "epoch": 1366} {"train_loss": -22.040807723999023, "global_step": 113439, "epoch": 1366} {"train_loss": -22.746551513671875, "global_step": 113440, "epoch": 1366} {"train_loss": -22.61347770690918, "global_step": 113441, "epoch": 1366} {"train_loss": -22.573335647583008, "global_step": 113442, "epoch": 1366} {"train_loss": -22.65896987915039, "global_step": 113443, "epoch": 1366} {"train_loss": -22.461645126342773, "global_step": 113444, "epoch": 1366} {"train_loss": -22.671253204345703, "global_step": 113445, "epoch": 1366} {"train_loss": -22.608457565307617, "global_step": 113446, "epoch": 1366} {"train_loss": -22.499845504760742, "global_step": 113447, "epoch": 1366} {"train_loss": -22.377750396728516, "global_step": 113448, "epoch": 1366} {"train_loss": -22.29950714111328, "global_step": 113449, "epoch": 1366} {"train_loss": -22.632444381713867, "global_step": 113450, "epoch": 1366} {"train_loss": -22.298383712768555, "global_step": 113451, "epoch": 1366} {"train_loss": -22.200305938720703, "global_step": 113452, "epoch": 1366} {"train_loss": -22.22825050354004, "global_step": 113453, "epoch": 1366} {"train_loss": -22.101421356201172, "global_step": 113454, "epoch": 1366} {"train_loss": -22.529905319213867, "global_step": 113455, "epoch": 1366} {"train_loss": -22.418569564819336, "global_step": 113456, "epoch": 1366} {"train_loss": -22.25312614440918, "global_step": 113457, "epoch": 1366} {"train_loss": -22.31917381286621, "global_step": 113458, "epoch": 1366} {"train_loss": -22.53829002380371, "global_step": 113459, "epoch": 1366} {"train_loss": -22.34503104887813, "global_step": 113460, "epoch": 1366, "val_loss": 6160610.5} {"train_loss": -22.13651466369629, "global_step": 113461, "epoch": 1367} {"train_loss": -21.736896514892578, "global_step": 113462, "epoch": 1367} {"train_loss": -21.943984985351562, "global_step": 113463, "epoch": 1367} {"train_loss": -21.504972457885742, "global_step": 113464, "epoch": 1367} {"train_loss": -22.10562515258789, "global_step": 113465, "epoch": 1367} {"train_loss": -21.706212997436523, "global_step": 113466, "epoch": 1367} {"train_loss": -22.29227638244629, "global_step": 113467, "epoch": 1367} {"train_loss": -21.561933517456055, "global_step": 113468, "epoch": 1367} {"train_loss": -22.231061935424805, "global_step": 113469, "epoch": 1367} {"train_loss": -21.713159561157227, "global_step": 113470, "epoch": 1367} {"train_loss": -21.975088119506836, "global_step": 113471, "epoch": 1367} {"train_loss": -22.002538681030273, "global_step": 113472, "epoch": 1367} {"train_loss": -22.08417320251465, "global_step": 113473, "epoch": 1367} {"train_loss": -22.217580795288086, "global_step": 113474, "epoch": 1367} {"train_loss": -22.081554412841797, "global_step": 113475, "epoch": 1367} {"train_loss": -22.086393356323242, "global_step": 113476, "epoch": 1367} {"train_loss": -22.10738754272461, "global_step": 113477, "epoch": 1367} {"train_loss": -22.375898361206055, "global_step": 113478, "epoch": 1367} {"train_loss": -21.796123504638672, "global_step": 113479, "epoch": 1367} {"train_loss": -22.216367721557617, "global_step": 113480, "epoch": 1367} {"train_loss": -22.2874813079834, "global_step": 113481, "epoch": 1367} {"train_loss": -22.320865631103516, "global_step": 113482, "epoch": 1367} {"train_loss": -22.244083404541016, "global_step": 113483, "epoch": 1367} {"train_loss": -22.384824752807617, "global_step": 113484, "epoch": 1367} {"train_loss": -22.044050216674805, "global_step": 113485, "epoch": 1367} {"train_loss": -22.2508487701416, "global_step": 113486, "epoch": 1367} {"train_loss": -22.531583786010742, "global_step": 113487, "epoch": 1367} {"train_loss": -22.525636672973633, "global_step": 113488, "epoch": 1367} {"train_loss": -22.55404281616211, "global_step": 113489, "epoch": 1367} {"train_loss": -22.563093185424805, "global_step": 113490, "epoch": 1367} {"train_loss": -21.85615348815918, "global_step": 113491, "epoch": 1367} {"train_loss": -22.494901657104492, "global_step": 113492, "epoch": 1367} {"train_loss": -22.411287307739258, "global_step": 113493, "epoch": 1367} {"train_loss": -22.228790283203125, "global_step": 113494, "epoch": 1367} {"train_loss": -22.4704647064209, "global_step": 113495, "epoch": 1367} {"train_loss": -22.11350440979004, "global_step": 113496, "epoch": 1367} {"train_loss": -22.169767379760742, "global_step": 113497, "epoch": 1367} {"train_loss": -22.05306053161621, "global_step": 113498, "epoch": 1367} {"train_loss": -22.273788452148438, "global_step": 113499, "epoch": 1367} {"train_loss": -22.291624069213867, "global_step": 113500, "epoch": 1367} {"train_loss": -22.257184982299805, "global_step": 113501, "epoch": 1367} {"train_loss": -22.04193115234375, "global_step": 113502, "epoch": 1367} {"train_loss": -22.193510055541992, "global_step": 113503, "epoch": 1367} {"train_loss": -22.333986282348633, "global_step": 113504, "epoch": 1367} {"train_loss": -22.235370635986328, "global_step": 113505, "epoch": 1367} {"train_loss": -22.784748077392578, "global_step": 113506, "epoch": 1367} {"train_loss": -22.530637741088867, "global_step": 113507, "epoch": 1367} {"train_loss": -22.354028701782227, "global_step": 113508, "epoch": 1367} {"train_loss": -22.360471725463867, "global_step": 113509, "epoch": 1367} {"train_loss": -22.707624435424805, "global_step": 113510, "epoch": 1367} {"train_loss": -22.266050338745117, "global_step": 113511, "epoch": 1367} {"train_loss": -22.380395889282227, "global_step": 113512, "epoch": 1367} {"train_loss": -22.649911880493164, "global_step": 113513, "epoch": 1367} {"train_loss": -22.520889282226562, "global_step": 113514, "epoch": 1367} {"train_loss": -22.682525634765625, "global_step": 113515, "epoch": 1367} {"train_loss": -22.77652931213379, "global_step": 113516, "epoch": 1367} {"train_loss": -22.56992530822754, "global_step": 113517, "epoch": 1367} {"train_loss": -22.508310317993164, "global_step": 113518, "epoch": 1367} {"train_loss": -22.048480987548828, "global_step": 113519, "epoch": 1367} {"train_loss": -22.26559066772461, "global_step": 113520, "epoch": 1367} {"train_loss": -22.125944137573242, "global_step": 113521, "epoch": 1367} {"train_loss": -22.153398513793945, "global_step": 113522, "epoch": 1367} {"train_loss": -22.276748657226562, "global_step": 113523, "epoch": 1367} {"train_loss": -22.587135314941406, "global_step": 113524, "epoch": 1367} {"train_loss": -22.577054977416992, "global_step": 113525, "epoch": 1367} {"train_loss": -22.321691513061523, "global_step": 113526, "epoch": 1367} {"train_loss": -22.31313133239746, "global_step": 113527, "epoch": 1367} {"train_loss": -22.262149810791016, "global_step": 113528, "epoch": 1367} {"train_loss": -22.60398292541504, "global_step": 113529, "epoch": 1367} {"train_loss": -22.505910873413086, "global_step": 113530, "epoch": 1367} {"train_loss": -22.460857391357422, "global_step": 113531, "epoch": 1367} {"train_loss": -22.660551071166992, "global_step": 113532, "epoch": 1367} {"train_loss": -22.365446090698242, "global_step": 113533, "epoch": 1367} {"train_loss": -21.928890228271484, "global_step": 113534, "epoch": 1367} {"train_loss": -22.241666793823242, "global_step": 113535, "epoch": 1367} {"train_loss": -22.251953125, "global_step": 113536, "epoch": 1367} {"train_loss": -22.45452880859375, "global_step": 113537, "epoch": 1367} {"train_loss": -22.642974853515625, "global_step": 113538, "epoch": 1367} {"train_loss": -22.545738220214844, "global_step": 113539, "epoch": 1367} {"train_loss": -22.373807907104492, "global_step": 113540, "epoch": 1367} {"train_loss": -22.38396644592285, "global_step": 113541, "epoch": 1367} {"train_loss": -22.24267578125, "global_step": 113542, "epoch": 1367} {"train_loss": -22.263421001204524, "global_step": 113543, "epoch": 1367, "val_loss": 6261426.5} {"train_loss": -22.066190719604492, "global_step": 113544, "epoch": 1368} {"train_loss": -22.271427154541016, "global_step": 113545, "epoch": 1368} {"train_loss": -21.58741569519043, "global_step": 113546, "epoch": 1368} {"train_loss": -22.258956909179688, "global_step": 113547, "epoch": 1368} {"train_loss": -21.6538028717041, "global_step": 113548, "epoch": 1368} {"train_loss": -22.140737533569336, "global_step": 113549, "epoch": 1368} {"train_loss": -22.21283531188965, "global_step": 113550, "epoch": 1368} {"train_loss": -22.14841651916504, "global_step": 113551, "epoch": 1368} {"train_loss": -22.214170455932617, "global_step": 113552, "epoch": 1368} {"train_loss": -22.267236709594727, "global_step": 113553, "epoch": 1368} {"train_loss": -22.328731536865234, "global_step": 113554, "epoch": 1368} {"train_loss": -21.471057891845703, "global_step": 113555, "epoch": 1368} {"train_loss": -22.162893295288086, "global_step": 113556, "epoch": 1368} {"train_loss": -21.942890167236328, "global_step": 113557, "epoch": 1368} {"train_loss": -22.018280029296875, "global_step": 113558, "epoch": 1368} {"train_loss": -22.27623176574707, "global_step": 113559, "epoch": 1368} {"train_loss": -22.39190673828125, "global_step": 113560, "epoch": 1368} {"train_loss": -22.19891929626465, "global_step": 113561, "epoch": 1368} {"train_loss": -22.0061092376709, "global_step": 113562, "epoch": 1368} {"train_loss": -22.462635040283203, "global_step": 113563, "epoch": 1368} {"train_loss": -22.152957916259766, "global_step": 113564, "epoch": 1368} {"train_loss": -22.284128189086914, "global_step": 113565, "epoch": 1368} {"train_loss": -22.4229736328125, "global_step": 113566, "epoch": 1368} {"train_loss": -22.500629425048828, "global_step": 113567, "epoch": 1368} {"train_loss": -22.557077407836914, "global_step": 113568, "epoch": 1368} {"train_loss": -22.35268211364746, "global_step": 113569, "epoch": 1368} {"train_loss": -22.157960891723633, "global_step": 113570, "epoch": 1368} {"train_loss": -22.291654586791992, "global_step": 113571, "epoch": 1368} {"train_loss": -22.65141487121582, "global_step": 113572, "epoch": 1368} {"train_loss": -22.50813865661621, "global_step": 113573, "epoch": 1368} {"train_loss": -22.461416244506836, "global_step": 113574, "epoch": 1368} {"train_loss": -22.119115829467773, "global_step": 113575, "epoch": 1368} {"train_loss": -22.544443130493164, "global_step": 113576, "epoch": 1368} {"train_loss": -22.121688842773438, "global_step": 113577, "epoch": 1368} {"train_loss": -22.216196060180664, "global_step": 113578, "epoch": 1368} {"train_loss": -22.639097213745117, "global_step": 113579, "epoch": 1368} {"train_loss": -22.017797470092773, "global_step": 113580, "epoch": 1368} {"train_loss": -22.311893463134766, "global_step": 113581, "epoch": 1368} {"train_loss": -22.345579147338867, "global_step": 113582, "epoch": 1368} {"train_loss": -22.379501342773438, "global_step": 113583, "epoch": 1368} {"train_loss": -22.404748916625977, "global_step": 113584, "epoch": 1368} {"train_loss": -22.340808868408203, "global_step": 113585, "epoch": 1368} {"train_loss": -22.321964263916016, "global_step": 113586, "epoch": 1368} {"train_loss": -22.073104858398438, "global_step": 113587, "epoch": 1368} {"train_loss": -22.209348678588867, "global_step": 113588, "epoch": 1368} {"train_loss": -22.5654354095459, "global_step": 113589, "epoch": 1368} {"train_loss": -22.384735107421875, "global_step": 113590, "epoch": 1368} {"train_loss": -21.98561668395996, "global_step": 113591, "epoch": 1368} {"train_loss": -22.085302352905273, "global_step": 113592, "epoch": 1368} {"train_loss": -22.061857223510742, "global_step": 113593, "epoch": 1368} {"train_loss": -22.349557876586914, "global_step": 113594, "epoch": 1368} {"train_loss": -22.368497848510742, "global_step": 113595, "epoch": 1368} {"train_loss": -22.576169967651367, "global_step": 113596, "epoch": 1368} {"train_loss": -22.560861587524414, "global_step": 113597, "epoch": 1368} {"train_loss": -22.513593673706055, "global_step": 113598, "epoch": 1368} {"train_loss": -22.21709632873535, "global_step": 113599, "epoch": 1368} {"train_loss": -22.50844955444336, "global_step": 113600, "epoch": 1368} {"train_loss": -22.587284088134766, "global_step": 113601, "epoch": 1368} {"train_loss": -22.34834861755371, "global_step": 113602, "epoch": 1368} {"train_loss": -22.70932388305664, "global_step": 113603, "epoch": 1368} {"train_loss": -22.620473861694336, "global_step": 113604, "epoch": 1368} {"train_loss": -22.53708839416504, "global_step": 113605, "epoch": 1368} {"train_loss": -22.126047134399414, "global_step": 113606, "epoch": 1368} {"train_loss": -22.921363830566406, "global_step": 113607, "epoch": 1368} {"train_loss": -22.264509201049805, "global_step": 113608, "epoch": 1368} {"train_loss": -22.442724227905273, "global_step": 113609, "epoch": 1368} {"train_loss": -22.7321834564209, "global_step": 113610, "epoch": 1368} {"train_loss": -22.450021743774414, "global_step": 113611, "epoch": 1368} {"train_loss": -22.145620346069336, "global_step": 113612, "epoch": 1368} {"train_loss": -22.29271697998047, "global_step": 113613, "epoch": 1368} {"train_loss": -22.48415184020996, "global_step": 113614, "epoch": 1368} {"train_loss": -22.723209381103516, "global_step": 113615, "epoch": 1368} {"train_loss": -22.279495239257812, "global_step": 113616, "epoch": 1368} {"train_loss": -22.517187118530273, "global_step": 113617, "epoch": 1368} {"train_loss": -22.779401779174805, "global_step": 113618, "epoch": 1368} {"train_loss": -22.74628257751465, "global_step": 113619, "epoch": 1368} {"train_loss": -22.542560577392578, "global_step": 113620, "epoch": 1368} {"train_loss": -22.52461051940918, "global_step": 113621, "epoch": 1368} {"train_loss": -22.12727165222168, "global_step": 113622, "epoch": 1368} {"train_loss": -22.28201675415039, "global_step": 113623, "epoch": 1368} {"train_loss": -22.26883888244629, "global_step": 113624, "epoch": 1368} {"train_loss": -22.458526611328125, "global_step": 113625, "epoch": 1368} {"train_loss": -22.328370266650097, "global_step": 113626, "epoch": 1368, "val_loss": 6088295.0} {"train_loss": -21.90108871459961, "global_step": 113627, "epoch": 1369} {"train_loss": -22.256675720214844, "global_step": 113628, "epoch": 1369} {"train_loss": -21.497756958007812, "global_step": 113629, "epoch": 1369} {"train_loss": -21.616329193115234, "global_step": 113630, "epoch": 1369} {"train_loss": -21.71531105041504, "global_step": 113631, "epoch": 1369} {"train_loss": -22.289291381835938, "global_step": 113632, "epoch": 1369} {"train_loss": -21.831785202026367, "global_step": 113633, "epoch": 1369} {"train_loss": -22.104087829589844, "global_step": 113634, "epoch": 1369} {"train_loss": -22.034770965576172, "global_step": 113635, "epoch": 1369} {"train_loss": -21.93634796142578, "global_step": 113636, "epoch": 1369} {"train_loss": -22.290672302246094, "global_step": 113637, "epoch": 1369} {"train_loss": -22.358694076538086, "global_step": 113638, "epoch": 1369} {"train_loss": -22.008752822875977, "global_step": 113639, "epoch": 1369} {"train_loss": -22.29172134399414, "global_step": 113640, "epoch": 1369} {"train_loss": -22.43877601623535, "global_step": 113641, "epoch": 1369} {"train_loss": -22.117704391479492, "global_step": 113642, "epoch": 1369} {"train_loss": -22.183570861816406, "global_step": 113643, "epoch": 1369} {"train_loss": -22.401926040649414, "global_step": 113644, "epoch": 1369} {"train_loss": -22.489803314208984, "global_step": 113645, "epoch": 1369} {"train_loss": -22.480859756469727, "global_step": 113646, "epoch": 1369} {"train_loss": -22.475025177001953, "global_step": 113647, "epoch": 1369} {"train_loss": -22.074411392211914, "global_step": 113648, "epoch": 1369} {"train_loss": -22.235048294067383, "global_step": 113649, "epoch": 1369} {"train_loss": -22.45330238342285, "global_step": 113650, "epoch": 1369} {"train_loss": -22.38515853881836, "global_step": 113651, "epoch": 1369} {"train_loss": -22.371402740478516, "global_step": 113652, "epoch": 1369} {"train_loss": -22.50864601135254, "global_step": 113653, "epoch": 1369} {"train_loss": -22.22248649597168, "global_step": 113654, "epoch": 1369} {"train_loss": -22.16143226623535, "global_step": 113655, "epoch": 1369} {"train_loss": -21.817729949951172, "global_step": 113656, "epoch": 1369} {"train_loss": -21.979551315307617, "global_step": 113657, "epoch": 1369} {"train_loss": -22.124919891357422, "global_step": 113658, "epoch": 1369} {"train_loss": -22.273086547851562, "global_step": 113659, "epoch": 1369} {"train_loss": -22.085607528686523, "global_step": 113660, "epoch": 1369} {"train_loss": -22.371828079223633, "global_step": 113661, "epoch": 1369} {"train_loss": -22.37554931640625, "global_step": 113662, "epoch": 1369} {"train_loss": -22.386810302734375, "global_step": 113663, "epoch": 1369} {"train_loss": -21.819217681884766, "global_step": 113664, "epoch": 1369} {"train_loss": -22.560928344726562, "global_step": 113665, "epoch": 1369} {"train_loss": -22.13248062133789, "global_step": 113666, "epoch": 1369} {"train_loss": -22.22962760925293, "global_step": 113667, "epoch": 1369} {"train_loss": -22.579959869384766, "global_step": 113668, "epoch": 1369} {"train_loss": -22.160053253173828, "global_step": 113669, "epoch": 1369} {"train_loss": -22.302194595336914, "global_step": 113670, "epoch": 1369} {"train_loss": -21.979782104492188, "global_step": 113671, "epoch": 1369} {"train_loss": -22.1945858001709, "global_step": 113672, "epoch": 1369} {"train_loss": -21.98912239074707, "global_step": 113673, "epoch": 1369} {"train_loss": -22.416217803955078, "global_step": 113674, "epoch": 1369} {"train_loss": -22.48529052734375, "global_step": 113675, "epoch": 1369} {"train_loss": -22.255434036254883, "global_step": 113676, "epoch": 1369} {"train_loss": -22.391197204589844, "global_step": 113677, "epoch": 1369} {"train_loss": -22.36964225769043, "global_step": 113678, "epoch": 1369} {"train_loss": -22.642797470092773, "global_step": 113679, "epoch": 1369} {"train_loss": -22.70656394958496, "global_step": 113680, "epoch": 1369} {"train_loss": -22.074722290039062, "global_step": 113681, "epoch": 1369} {"train_loss": -21.997028350830078, "global_step": 113682, "epoch": 1369} {"train_loss": -22.662891387939453, "global_step": 113683, "epoch": 1369} {"train_loss": -22.54546546936035, "global_step": 113684, "epoch": 1369} {"train_loss": -21.9974422454834, "global_step": 113685, "epoch": 1369} {"train_loss": -22.500181198120117, "global_step": 113686, "epoch": 1369} {"train_loss": -22.436214447021484, "global_step": 113687, "epoch": 1369} {"train_loss": -22.16568946838379, "global_step": 113688, "epoch": 1369} {"train_loss": -22.377328872680664, "global_step": 113689, "epoch": 1369} {"train_loss": -22.33696174621582, "global_step": 113690, "epoch": 1369} {"train_loss": -22.13466453552246, "global_step": 113691, "epoch": 1369} {"train_loss": -22.402294158935547, "global_step": 113692, "epoch": 1369} {"train_loss": -22.23834800720215, "global_step": 113693, "epoch": 1369} {"train_loss": -22.434789657592773, "global_step": 113694, "epoch": 1369} {"train_loss": -22.118680953979492, "global_step": 113695, "epoch": 1369} {"train_loss": -22.516294479370117, "global_step": 113696, "epoch": 1369} {"train_loss": -22.188447952270508, "global_step": 113697, "epoch": 1369} {"train_loss": -22.487722396850586, "global_step": 113698, "epoch": 1369} {"train_loss": -22.401105880737305, "global_step": 113699, "epoch": 1369} {"train_loss": -22.699739456176758, "global_step": 113700, "epoch": 1369} {"train_loss": -22.148548126220703, "global_step": 113701, "epoch": 1369} {"train_loss": -21.992874145507812, "global_step": 113702, "epoch": 1369} {"train_loss": -22.251697540283203, "global_step": 113703, "epoch": 1369} {"train_loss": -22.222627639770508, "global_step": 113704, "epoch": 1369} {"train_loss": -22.4490909576416, "global_step": 113705, "epoch": 1369} {"train_loss": -22.516103744506836, "global_step": 113706, "epoch": 1369} {"train_loss": -22.287755966186523, "global_step": 113707, "epoch": 1369} {"train_loss": -22.27314567565918, "global_step": 113708, "epoch": 1369} {"train_loss": -22.243173369442125, "global_step": 113709, "epoch": 1369, "val_loss": 6268675.0} {"train_loss": -21.804767608642578, "global_step": 113710, "epoch": 1370} {"train_loss": -20.561731338500977, "global_step": 113711, "epoch": 1370} {"train_loss": -21.77532386779785, "global_step": 113712, "epoch": 1370} {"train_loss": -21.306079864501953, "global_step": 113713, "epoch": 1370} {"train_loss": -21.819015502929688, "global_step": 113714, "epoch": 1370} {"train_loss": -21.377317428588867, "global_step": 113715, "epoch": 1370} {"train_loss": -21.692251205444336, "global_step": 113716, "epoch": 1370} {"train_loss": -21.613737106323242, "global_step": 113717, "epoch": 1370} {"train_loss": -21.710796356201172, "global_step": 113718, "epoch": 1370} {"train_loss": -21.57440757751465, "global_step": 113719, "epoch": 1370} {"train_loss": -21.848669052124023, "global_step": 113720, "epoch": 1370} {"train_loss": -21.557323455810547, "global_step": 113721, "epoch": 1370} {"train_loss": -22.115957260131836, "global_step": 113722, "epoch": 1370} {"train_loss": -22.102527618408203, "global_step": 113723, "epoch": 1370} {"train_loss": -22.056232452392578, "global_step": 113724, "epoch": 1370} {"train_loss": -21.938413619995117, "global_step": 113725, "epoch": 1370} {"train_loss": -22.081697463989258, "global_step": 113726, "epoch": 1370} {"train_loss": -22.134166717529297, "global_step": 113727, "epoch": 1370} {"train_loss": -22.2927303314209, "global_step": 113728, "epoch": 1370} {"train_loss": -21.990285873413086, "global_step": 113729, "epoch": 1370} {"train_loss": -22.282957077026367, "global_step": 113730, "epoch": 1370} {"train_loss": -22.280187606811523, "global_step": 113731, "epoch": 1370} {"train_loss": -22.061288833618164, "global_step": 113732, "epoch": 1370} {"train_loss": -22.441688537597656, "global_step": 113733, "epoch": 1370} {"train_loss": -22.370559692382812, "global_step": 113734, "epoch": 1370} {"train_loss": -22.237478256225586, "global_step": 113735, "epoch": 1370} {"train_loss": -22.624364852905273, "global_step": 113736, "epoch": 1370} {"train_loss": -22.23526382446289, "global_step": 113737, "epoch": 1370} {"train_loss": -22.403669357299805, "global_step": 113738, "epoch": 1370} {"train_loss": -22.468616485595703, "global_step": 113739, "epoch": 1370} {"train_loss": -21.877309799194336, "global_step": 113740, "epoch": 1370} {"train_loss": -22.477373123168945, "global_step": 113741, "epoch": 1370} {"train_loss": -22.353437423706055, "global_step": 113742, "epoch": 1370} {"train_loss": -22.04747772216797, "global_step": 113743, "epoch": 1370} {"train_loss": -22.039289474487305, "global_step": 113744, "epoch": 1370} {"train_loss": -22.55950355529785, "global_step": 113745, "epoch": 1370} {"train_loss": -22.54215431213379, "global_step": 113746, "epoch": 1370} {"train_loss": -22.359954833984375, "global_step": 113747, "epoch": 1370} {"train_loss": -22.317777633666992, "global_step": 113748, "epoch": 1370} {"train_loss": -22.71763038635254, "global_step": 113749, "epoch": 1370} {"train_loss": -22.52389907836914, "global_step": 113750, "epoch": 1370} {"train_loss": -22.2814884185791, "global_step": 113751, "epoch": 1370} {"train_loss": -22.34331703186035, "global_step": 113752, "epoch": 1370} {"train_loss": -22.321964263916016, "global_step": 113753, "epoch": 1370} {"train_loss": -22.281253814697266, "global_step": 113754, "epoch": 1370} {"train_loss": -22.18684196472168, "global_step": 113755, "epoch": 1370} {"train_loss": -22.688642501831055, "global_step": 113756, "epoch": 1370} {"train_loss": -22.532033920288086, "global_step": 113757, "epoch": 1370} {"train_loss": -22.475887298583984, "global_step": 113758, "epoch": 1370} {"train_loss": -22.568302154541016, "global_step": 113759, "epoch": 1370} {"train_loss": -22.469589233398438, "global_step": 113760, "epoch": 1370} {"train_loss": -22.413888931274414, "global_step": 113761, "epoch": 1370} {"train_loss": -22.360904693603516, "global_step": 113762, "epoch": 1370} {"train_loss": -22.411489486694336, "global_step": 113763, "epoch": 1370} {"train_loss": -22.26728630065918, "global_step": 113764, "epoch": 1370} {"train_loss": -22.418964385986328, "global_step": 113765, "epoch": 1370} {"train_loss": -22.63052749633789, "global_step": 113766, "epoch": 1370} {"train_loss": -22.333236694335938, "global_step": 113767, "epoch": 1370} {"train_loss": -22.366666793823242, "global_step": 113768, "epoch": 1370} {"train_loss": -22.447559356689453, "global_step": 113769, "epoch": 1370} {"train_loss": -22.56694984436035, "global_step": 113770, "epoch": 1370} {"train_loss": -22.26904296875, "global_step": 113771, "epoch": 1370} {"train_loss": -22.67494773864746, "global_step": 113772, "epoch": 1370} {"train_loss": -22.257064819335938, "global_step": 113773, "epoch": 1370} {"train_loss": -22.396276473999023, "global_step": 113774, "epoch": 1370} {"train_loss": -22.25111961364746, "global_step": 113775, "epoch": 1370} {"train_loss": -22.39053726196289, "global_step": 113776, "epoch": 1370} {"train_loss": -21.985685348510742, "global_step": 113777, "epoch": 1370} {"train_loss": -22.397567749023438, "global_step": 113778, "epoch": 1370} {"train_loss": -22.3414249420166, "global_step": 113779, "epoch": 1370} {"train_loss": -21.963909149169922, "global_step": 113780, "epoch": 1370} {"train_loss": -22.53228759765625, "global_step": 113781, "epoch": 1370} {"train_loss": -22.0628662109375, "global_step": 113782, "epoch": 1370} {"train_loss": -22.324649810791016, "global_step": 113783, "epoch": 1370} {"train_loss": -22.254150390625, "global_step": 113784, "epoch": 1370} {"train_loss": -22.043241500854492, "global_step": 113785, "epoch": 1370} {"train_loss": -22.596525192260742, "global_step": 113786, "epoch": 1370} {"train_loss": -22.2333984375, "global_step": 113787, "epoch": 1370} {"train_loss": -21.781890869140625, "global_step": 113788, "epoch": 1370} {"train_loss": -22.787656784057617, "global_step": 113789, "epoch": 1370} {"train_loss": -22.12055778503418, "global_step": 113790, "epoch": 1370} {"train_loss": -22.350448608398438, "global_step": 113791, "epoch": 1370} {"train_loss": -22.2011913621282, "global_step": 113792, "epoch": 1370, "val_loss": 6103915.5} {"train_loss": -22.39084243774414, "global_step": 113793, "epoch": 1371} {"train_loss": -22.105802536010742, "global_step": 113794, "epoch": 1371} {"train_loss": -22.216524124145508, "global_step": 113795, "epoch": 1371} {"train_loss": -22.54817008972168, "global_step": 113796, "epoch": 1371} {"train_loss": -22.24057960510254, "global_step": 113797, "epoch": 1371} {"train_loss": -22.323755264282227, "global_step": 113798, "epoch": 1371} {"train_loss": -22.375293731689453, "global_step": 113799, "epoch": 1371} {"train_loss": -22.177021026611328, "global_step": 113800, "epoch": 1371} {"train_loss": -22.360937118530273, "global_step": 113801, "epoch": 1371} {"train_loss": -22.607343673706055, "global_step": 113802, "epoch": 1371} {"train_loss": -22.35784149169922, "global_step": 113803, "epoch": 1371} {"train_loss": -22.199806213378906, "global_step": 113804, "epoch": 1371} {"train_loss": -22.473358154296875, "global_step": 113805, "epoch": 1371} {"train_loss": -22.01666831970215, "global_step": 113806, "epoch": 1371} {"train_loss": -22.31958770751953, "global_step": 113807, "epoch": 1371} {"train_loss": -22.501039505004883, "global_step": 113808, "epoch": 1371} {"train_loss": -22.515451431274414, "global_step": 113809, "epoch": 1371} {"train_loss": -21.924854278564453, "global_step": 113810, "epoch": 1371} {"train_loss": -22.27033042907715, "global_step": 113811, "epoch": 1371} {"train_loss": -22.456083297729492, "global_step": 113812, "epoch": 1371} {"train_loss": -21.996007919311523, "global_step": 113813, "epoch": 1371} {"train_loss": -22.163806915283203, "global_step": 113814, "epoch": 1371} {"train_loss": -22.37774085998535, "global_step": 113815, "epoch": 1371} {"train_loss": -22.48746681213379, "global_step": 113816, "epoch": 1371} {"train_loss": -22.22944450378418, "global_step": 113817, "epoch": 1371} {"train_loss": -22.393522262573242, "global_step": 113818, "epoch": 1371} {"train_loss": -22.508752822875977, "global_step": 113819, "epoch": 1371} {"train_loss": -22.231563568115234, "global_step": 113820, "epoch": 1371} {"train_loss": -22.418678283691406, "global_step": 113821, "epoch": 1371} {"train_loss": -22.371112823486328, "global_step": 113822, "epoch": 1371} {"train_loss": -21.96932029724121, "global_step": 113823, "epoch": 1371} {"train_loss": -22.306577682495117, "global_step": 113824, "epoch": 1371} {"train_loss": -22.230426788330078, "global_step": 113825, "epoch": 1371} {"train_loss": -22.356311798095703, "global_step": 113826, "epoch": 1371} {"train_loss": -22.063955307006836, "global_step": 113827, "epoch": 1371} {"train_loss": -22.549131393432617, "global_step": 113828, "epoch": 1371} {"train_loss": -21.750341415405273, "global_step": 113829, "epoch": 1371} {"train_loss": -22.198644638061523, "global_step": 113830, "epoch": 1371} {"train_loss": -22.665573120117188, "global_step": 113831, "epoch": 1371} {"train_loss": -22.297626495361328, "global_step": 113832, "epoch": 1371} {"train_loss": -22.711463928222656, "global_step": 113833, "epoch": 1371} {"train_loss": -22.47486686706543, "global_step": 113834, "epoch": 1371} {"train_loss": -22.592802047729492, "global_step": 113835, "epoch": 1371} {"train_loss": -22.66261863708496, "global_step": 113836, "epoch": 1371} {"train_loss": -22.360698699951172, "global_step": 113837, "epoch": 1371} {"train_loss": -22.362272262573242, "global_step": 113838, "epoch": 1371} {"train_loss": -22.528371810913086, "global_step": 113839, "epoch": 1371} {"train_loss": -22.264434814453125, "global_step": 113840, "epoch": 1371} {"train_loss": -22.221710205078125, "global_step": 113841, "epoch": 1371} {"train_loss": -22.545400619506836, "global_step": 113842, "epoch": 1371} {"train_loss": -22.142112731933594, "global_step": 113843, "epoch": 1371} {"train_loss": -22.418264389038086, "global_step": 113844, "epoch": 1371} {"train_loss": -22.54714012145996, "global_step": 113845, "epoch": 1371} {"train_loss": -22.55498695373535, "global_step": 113846, "epoch": 1371} {"train_loss": -22.52454948425293, "global_step": 113847, "epoch": 1371} {"train_loss": -22.610219955444336, "global_step": 113848, "epoch": 1371} {"train_loss": -22.20339012145996, "global_step": 113849, "epoch": 1371} {"train_loss": -22.587142944335938, "global_step": 113850, "epoch": 1371} {"train_loss": -22.290742874145508, "global_step": 113851, "epoch": 1371} {"train_loss": -22.537809371948242, "global_step": 113852, "epoch": 1371} {"train_loss": -22.478078842163086, "global_step": 113853, "epoch": 1371} {"train_loss": -22.34351921081543, "global_step": 113854, "epoch": 1371} {"train_loss": -22.140716552734375, "global_step": 113855, "epoch": 1371} {"train_loss": -22.290292739868164, "global_step": 113856, "epoch": 1371} {"train_loss": -22.376211166381836, "global_step": 113857, "epoch": 1371} {"train_loss": -22.417993545532227, "global_step": 113858, "epoch": 1371} {"train_loss": -22.331342697143555, "global_step": 113859, "epoch": 1371} {"train_loss": -22.456344604492188, "global_step": 113860, "epoch": 1371} {"train_loss": -22.200843811035156, "global_step": 113861, "epoch": 1371} {"train_loss": -22.282791137695312, "global_step": 113862, "epoch": 1371} {"train_loss": -22.32587242126465, "global_step": 113863, "epoch": 1371} {"train_loss": -22.308917999267578, "global_step": 113864, "epoch": 1371} {"train_loss": -22.039045333862305, "global_step": 113865, "epoch": 1371} {"train_loss": -22.50595474243164, "global_step": 113866, "epoch": 1371} {"train_loss": -22.323074340820312, "global_step": 113867, "epoch": 1371} {"train_loss": -22.918893814086914, "global_step": 113868, "epoch": 1371} {"train_loss": -22.33917236328125, "global_step": 113869, "epoch": 1371} {"train_loss": -22.028268814086914, "global_step": 113870, "epoch": 1371} {"train_loss": -22.531597137451172, "global_step": 113871, "epoch": 1371} {"train_loss": -22.089689254760742, "global_step": 113872, "epoch": 1371} {"train_loss": -22.159940719604492, "global_step": 113873, "epoch": 1371} {"train_loss": -22.61536979675293, "global_step": 113874, "epoch": 1371} {"train_loss": -22.356707538466857, "global_step": 113875, "epoch": 1371, "val_loss": 6037558.0} {"train_loss": -21.795654296875, "global_step": 113876, "epoch": 1372} {"train_loss": -21.533279418945312, "global_step": 113877, "epoch": 1372} {"train_loss": -21.991125106811523, "global_step": 113878, "epoch": 1372} {"train_loss": -21.643709182739258, "global_step": 113879, "epoch": 1372} {"train_loss": -21.55893898010254, "global_step": 113880, "epoch": 1372} {"train_loss": -22.236997604370117, "global_step": 113881, "epoch": 1372} {"train_loss": -21.61030387878418, "global_step": 113882, "epoch": 1372} {"train_loss": -21.5019588470459, "global_step": 113883, "epoch": 1372} {"train_loss": -21.875045776367188, "global_step": 113884, "epoch": 1372} {"train_loss": -21.484195709228516, "global_step": 113885, "epoch": 1372} {"train_loss": -22.16621208190918, "global_step": 113886, "epoch": 1372} {"train_loss": -21.92152976989746, "global_step": 113887, "epoch": 1372} {"train_loss": -22.122053146362305, "global_step": 113888, "epoch": 1372} {"train_loss": -21.662771224975586, "global_step": 113889, "epoch": 1372} {"train_loss": -22.033666610717773, "global_step": 113890, "epoch": 1372} {"train_loss": -22.038846969604492, "global_step": 113891, "epoch": 1372} {"train_loss": -22.040447235107422, "global_step": 113892, "epoch": 1372} {"train_loss": -21.93735694885254, "global_step": 113893, "epoch": 1372} {"train_loss": -22.200515747070312, "global_step": 113894, "epoch": 1372} {"train_loss": -21.9216365814209, "global_step": 113895, "epoch": 1372} {"train_loss": -22.3529109954834, "global_step": 113896, "epoch": 1372} {"train_loss": -21.9796199798584, "global_step": 113897, "epoch": 1372} {"train_loss": -22.671756744384766, "global_step": 113898, "epoch": 1372} {"train_loss": -22.206130981445312, "global_step": 113899, "epoch": 1372} {"train_loss": -22.179677963256836, "global_step": 113900, "epoch": 1372} {"train_loss": -22.238235473632812, "global_step": 113901, "epoch": 1372} {"train_loss": -22.1553955078125, "global_step": 113902, "epoch": 1372} {"train_loss": -22.19099235534668, "global_step": 113903, "epoch": 1372} {"train_loss": -22.362478256225586, "global_step": 113904, "epoch": 1372} {"train_loss": -22.480850219726562, "global_step": 113905, "epoch": 1372} {"train_loss": -22.418954849243164, "global_step": 113906, "epoch": 1372} {"train_loss": -22.50136375427246, "global_step": 113907, "epoch": 1372} {"train_loss": -22.643888473510742, "global_step": 113908, "epoch": 1372} {"train_loss": -22.254425048828125, "global_step": 113909, "epoch": 1372} {"train_loss": -22.377927780151367, "global_step": 113910, "epoch": 1372} {"train_loss": -22.232603073120117, "global_step": 113911, "epoch": 1372} {"train_loss": -22.354278564453125, "global_step": 113912, "epoch": 1372} {"train_loss": -22.27602195739746, "global_step": 113913, "epoch": 1372} {"train_loss": -22.2286434173584, "global_step": 113914, "epoch": 1372} {"train_loss": -22.300094604492188, "global_step": 113915, "epoch": 1372} {"train_loss": -22.136402130126953, "global_step": 113916, "epoch": 1372} {"train_loss": -22.14185905456543, "global_step": 113917, "epoch": 1372} {"train_loss": -22.06340980529785, "global_step": 113918, "epoch": 1372} {"train_loss": -22.507080078125, "global_step": 113919, "epoch": 1372} {"train_loss": -22.008352279663086, "global_step": 113920, "epoch": 1372} {"train_loss": -22.105792999267578, "global_step": 113921, "epoch": 1372} {"train_loss": -22.126699447631836, "global_step": 113922, "epoch": 1372} {"train_loss": -22.378889083862305, "global_step": 113923, "epoch": 1372} {"train_loss": -22.366792678833008, "global_step": 113924, "epoch": 1372} {"train_loss": -22.080814361572266, "global_step": 113925, "epoch": 1372} {"train_loss": -22.126739501953125, "global_step": 113926, "epoch": 1372} {"train_loss": -21.83016014099121, "global_step": 113927, "epoch": 1372} {"train_loss": -22.06012725830078, "global_step": 113928, "epoch": 1372} {"train_loss": -22.6743106842041, "global_step": 113929, "epoch": 1372} {"train_loss": -22.336029052734375, "global_step": 113930, "epoch": 1372} {"train_loss": -22.6429500579834, "global_step": 113931, "epoch": 1372} {"train_loss": -22.315975189208984, "global_step": 113932, "epoch": 1372} {"train_loss": -22.486249923706055, "global_step": 113933, "epoch": 1372} {"train_loss": -22.397523880004883, "global_step": 113934, "epoch": 1372} {"train_loss": -22.468984603881836, "global_step": 113935, "epoch": 1372} {"train_loss": -22.168500900268555, "global_step": 113936, "epoch": 1372} {"train_loss": -22.696043014526367, "global_step": 113937, "epoch": 1372} {"train_loss": -22.695159912109375, "global_step": 113938, "epoch": 1372} {"train_loss": -22.153377532958984, "global_step": 113939, "epoch": 1372} {"train_loss": -22.339426040649414, "global_step": 113940, "epoch": 1372} {"train_loss": -22.486406326293945, "global_step": 113941, "epoch": 1372} {"train_loss": -22.352214813232422, "global_step": 113942, "epoch": 1372} {"train_loss": -22.47648048400879, "global_step": 113943, "epoch": 1372} {"train_loss": -22.196542739868164, "global_step": 113944, "epoch": 1372} {"train_loss": -22.30414390563965, "global_step": 113945, "epoch": 1372} {"train_loss": -22.407878875732422, "global_step": 113946, "epoch": 1372} {"train_loss": -22.434934616088867, "global_step": 113947, "epoch": 1372} {"train_loss": -22.23708152770996, "global_step": 113948, "epoch": 1372} {"train_loss": -22.575523376464844, "global_step": 113949, "epoch": 1372} {"train_loss": -22.187246322631836, "global_step": 113950, "epoch": 1372} {"train_loss": -22.39815330505371, "global_step": 113951, "epoch": 1372} {"train_loss": -22.4365291595459, "global_step": 113952, "epoch": 1372} {"train_loss": -22.607608795166016, "global_step": 113953, "epoch": 1372} {"train_loss": -22.4329891204834, "global_step": 113954, "epoch": 1372} {"train_loss": -22.41912269592285, "global_step": 113955, "epoch": 1372} {"train_loss": -22.4575252532959, "global_step": 113956, "epoch": 1372} {"train_loss": -22.431364059448242, "global_step": 113957, "epoch": 1372} {"train_loss": -22.211791601525732, "global_step": 113958, "epoch": 1372, "val_loss": 6306795.0} {"train_loss": -22.094482421875, "global_step": 113959, "epoch": 1373} {"train_loss": -21.496952056884766, "global_step": 113960, "epoch": 1373} {"train_loss": -21.754867553710938, "global_step": 113961, "epoch": 1373} {"train_loss": -22.016159057617188, "global_step": 113962, "epoch": 1373} {"train_loss": -21.840681076049805, "global_step": 113963, "epoch": 1373} {"train_loss": -21.711576461791992, "global_step": 113964, "epoch": 1373} {"train_loss": -21.820032119750977, "global_step": 113965, "epoch": 1373} {"train_loss": -22.05860710144043, "global_step": 113966, "epoch": 1373} {"train_loss": -22.264846801757812, "global_step": 113967, "epoch": 1373} {"train_loss": -21.655611038208008, "global_step": 113968, "epoch": 1373} {"train_loss": -21.89254379272461, "global_step": 113969, "epoch": 1373} {"train_loss": -21.874235153198242, "global_step": 113970, "epoch": 1373} {"train_loss": -21.7982120513916, "global_step": 113971, "epoch": 1373} {"train_loss": -22.226959228515625, "global_step": 113972, "epoch": 1373} {"train_loss": -21.760116577148438, "global_step": 113973, "epoch": 1373} {"train_loss": -22.0218505859375, "global_step": 113974, "epoch": 1373} {"train_loss": -22.04559898376465, "global_step": 113975, "epoch": 1373} {"train_loss": -21.65581703186035, "global_step": 113976, "epoch": 1373} {"train_loss": -22.08340835571289, "global_step": 113977, "epoch": 1373} {"train_loss": -22.291685104370117, "global_step": 113978, "epoch": 1373} {"train_loss": -22.179492950439453, "global_step": 113979, "epoch": 1373} {"train_loss": -22.16134262084961, "global_step": 113980, "epoch": 1373} {"train_loss": -21.99436378479004, "global_step": 113981, "epoch": 1373} {"train_loss": -21.998226165771484, "global_step": 113982, "epoch": 1373} {"train_loss": -21.950403213500977, "global_step": 113983, "epoch": 1373} {"train_loss": -22.403427124023438, "global_step": 113984, "epoch": 1373} {"train_loss": -22.23509407043457, "global_step": 113985, "epoch": 1373} {"train_loss": -21.832996368408203, "global_step": 113986, "epoch": 1373} {"train_loss": -22.468847274780273, "global_step": 113987, "epoch": 1373} {"train_loss": -22.2656192779541, "global_step": 113988, "epoch": 1373} {"train_loss": -22.626840591430664, "global_step": 113989, "epoch": 1373} {"train_loss": -22.021732330322266, "global_step": 113990, "epoch": 1373} {"train_loss": -21.922285079956055, "global_step": 113991, "epoch": 1373} {"train_loss": -21.75434684753418, "global_step": 113992, "epoch": 1373} {"train_loss": -22.4410457611084, "global_step": 113993, "epoch": 1373} {"train_loss": -22.631622314453125, "global_step": 113994, "epoch": 1373} {"train_loss": -22.26108169555664, "global_step": 113995, "epoch": 1373} {"train_loss": -22.3311767578125, "global_step": 113996, "epoch": 1373} {"train_loss": -22.468320846557617, "global_step": 113997, "epoch": 1373} {"train_loss": -22.393869400024414, "global_step": 113998, "epoch": 1373} {"train_loss": -22.22865104675293, "global_step": 113999, "epoch": 1373} {"train_loss": -22.041181564331055, "global_step": 114000, "epoch": 1373} {"train_loss": -22.156936645507812, "global_step": 114001, "epoch": 1373} {"train_loss": -22.19781494140625, "global_step": 114002, "epoch": 1373} {"train_loss": -22.361255645751953, "global_step": 114003, "epoch": 1373} {"train_loss": -22.44573402404785, "global_step": 114004, "epoch": 1373} {"train_loss": -22.49629020690918, "global_step": 114005, "epoch": 1373} {"train_loss": -22.401594161987305, "global_step": 114006, "epoch": 1373} {"train_loss": -22.559083938598633, "global_step": 114007, "epoch": 1373} {"train_loss": -22.703723907470703, "global_step": 114008, "epoch": 1373} {"train_loss": -22.62163734436035, "global_step": 114009, "epoch": 1373} {"train_loss": -22.480798721313477, "global_step": 114010, "epoch": 1373} {"train_loss": -22.41269874572754, "global_step": 114011, "epoch": 1373} {"train_loss": -22.253149032592773, "global_step": 114012, "epoch": 1373} {"train_loss": -22.418888092041016, "global_step": 114013, "epoch": 1373} {"train_loss": -22.56500816345215, "global_step": 114014, "epoch": 1373} {"train_loss": -22.625389099121094, "global_step": 114015, "epoch": 1373} {"train_loss": -22.49280548095703, "global_step": 114016, "epoch": 1373} {"train_loss": -22.243932723999023, "global_step": 114017, "epoch": 1373} {"train_loss": -22.140094757080078, "global_step": 114018, "epoch": 1373} {"train_loss": -22.340591430664062, "global_step": 114019, "epoch": 1373} {"train_loss": -22.33491325378418, "global_step": 114020, "epoch": 1373} {"train_loss": -22.384855270385742, "global_step": 114021, "epoch": 1373} {"train_loss": -22.931289672851562, "global_step": 114022, "epoch": 1373} {"train_loss": -22.09605598449707, "global_step": 114023, "epoch": 1373} {"train_loss": -21.97856903076172, "global_step": 114024, "epoch": 1373} {"train_loss": -22.371496200561523, "global_step": 114025, "epoch": 1373} {"train_loss": -22.78973960876465, "global_step": 114026, "epoch": 1373} {"train_loss": -22.128047943115234, "global_step": 114027, "epoch": 1373} {"train_loss": -22.019472122192383, "global_step": 114028, "epoch": 1373} {"train_loss": -22.198532104492188, "global_step": 114029, "epoch": 1373} {"train_loss": -22.375532150268555, "global_step": 114030, "epoch": 1373} {"train_loss": -22.5391845703125, "global_step": 114031, "epoch": 1373} {"train_loss": -21.713510513305664, "global_step": 114032, "epoch": 1373} {"train_loss": -22.613157272338867, "global_step": 114033, "epoch": 1373} {"train_loss": -22.45870018005371, "global_step": 114034, "epoch": 1373} {"train_loss": -22.05152702331543, "global_step": 114035, "epoch": 1373} {"train_loss": -22.19409942626953, "global_step": 114036, "epoch": 1373} {"train_loss": -22.489728927612305, "global_step": 114037, "epoch": 1373} {"train_loss": -22.540821075439453, "global_step": 114038, "epoch": 1373} {"train_loss": -22.285367965698242, "global_step": 114039, "epoch": 1373} {"train_loss": -22.59751319885254, "global_step": 114040, "epoch": 1373} {"train_loss": -22.213164662740315, "global_step": 114041, "epoch": 1373, "val_loss": 6201240.0} {"train_loss": -22.251148223876953, "global_step": 114042, "epoch": 1374} {"train_loss": -22.205835342407227, "global_step": 114043, "epoch": 1374} {"train_loss": -22.470808029174805, "global_step": 114044, "epoch": 1374} {"train_loss": -22.091047286987305, "global_step": 114045, "epoch": 1374} {"train_loss": -22.3909912109375, "global_step": 114046, "epoch": 1374} {"train_loss": -21.876331329345703, "global_step": 114047, "epoch": 1374} {"train_loss": -22.157583236694336, "global_step": 114048, "epoch": 1374} {"train_loss": -22.356796264648438, "global_step": 114049, "epoch": 1374} {"train_loss": -22.61552619934082, "global_step": 114050, "epoch": 1374} {"train_loss": -22.345373153686523, "global_step": 114051, "epoch": 1374} {"train_loss": -22.417875289916992, "global_step": 114052, "epoch": 1374} {"train_loss": -22.637174606323242, "global_step": 114053, "epoch": 1374} {"train_loss": -22.202375411987305, "global_step": 114054, "epoch": 1374} {"train_loss": -22.32400894165039, "global_step": 114055, "epoch": 1374} {"train_loss": -22.46335792541504, "global_step": 114056, "epoch": 1374} {"train_loss": -22.334308624267578, "global_step": 114057, "epoch": 1374} {"train_loss": -22.081947326660156, "global_step": 114058, "epoch": 1374} {"train_loss": -22.3631534576416, "global_step": 114059, "epoch": 1374} {"train_loss": -22.271461486816406, "global_step": 114060, "epoch": 1374} {"train_loss": -22.5805606842041, "global_step": 114061, "epoch": 1374} {"train_loss": -22.5155029296875, "global_step": 114062, "epoch": 1374} {"train_loss": -22.4097900390625, "global_step": 114063, "epoch": 1374} {"train_loss": -22.273916244506836, "global_step": 114064, "epoch": 1374} {"train_loss": -22.07295036315918, "global_step": 114065, "epoch": 1374} {"train_loss": -22.067161560058594, "global_step": 114066, "epoch": 1374} {"train_loss": -22.092676162719727, "global_step": 114067, "epoch": 1374} {"train_loss": -22.040685653686523, "global_step": 114068, "epoch": 1374} {"train_loss": -22.519615173339844, "global_step": 114069, "epoch": 1374} {"train_loss": -22.59250831604004, "global_step": 114070, "epoch": 1374} {"train_loss": -22.608816146850586, "global_step": 114071, "epoch": 1374} {"train_loss": -22.234987258911133, "global_step": 114072, "epoch": 1374} {"train_loss": -22.467512130737305, "global_step": 114073, "epoch": 1374} {"train_loss": -22.21695899963379, "global_step": 114074, "epoch": 1374} {"train_loss": -22.160871505737305, "global_step": 114075, "epoch": 1374} {"train_loss": -21.792495727539062, "global_step": 114076, "epoch": 1374} {"train_loss": -22.584470748901367, "global_step": 114077, "epoch": 1374} {"train_loss": -22.329004287719727, "global_step": 114078, "epoch": 1374} {"train_loss": -22.527685165405273, "global_step": 114079, "epoch": 1374} {"train_loss": -22.5771484375, "global_step": 114080, "epoch": 1374} {"train_loss": -22.23012351989746, "global_step": 114081, "epoch": 1374} {"train_loss": -22.234750747680664, "global_step": 114082, "epoch": 1374} {"train_loss": -22.148571014404297, "global_step": 114083, "epoch": 1374} {"train_loss": -22.60382080078125, "global_step": 114084, "epoch": 1374} {"train_loss": -22.285364151000977, "global_step": 114085, "epoch": 1374} {"train_loss": -22.459692001342773, "global_step": 114086, "epoch": 1374} {"train_loss": -22.26885414123535, "global_step": 114087, "epoch": 1374} {"train_loss": -22.107547760009766, "global_step": 114088, "epoch": 1374} {"train_loss": -22.487564086914062, "global_step": 114089, "epoch": 1374} {"train_loss": -22.383459091186523, "global_step": 114090, "epoch": 1374} {"train_loss": -22.22157096862793, "global_step": 114091, "epoch": 1374} {"train_loss": -22.46979331970215, "global_step": 114092, "epoch": 1374} {"train_loss": -22.607921600341797, "global_step": 114093, "epoch": 1374} {"train_loss": -22.370880126953125, "global_step": 114094, "epoch": 1374} {"train_loss": -22.658443450927734, "global_step": 114095, "epoch": 1374} {"train_loss": -22.09488296508789, "global_step": 114096, "epoch": 1374} {"train_loss": -22.277273178100586, "global_step": 114097, "epoch": 1374} {"train_loss": -22.319997787475586, "global_step": 114098, "epoch": 1374} {"train_loss": -22.407468795776367, "global_step": 114099, "epoch": 1374} {"train_loss": -22.401601791381836, "global_step": 114100, "epoch": 1374} {"train_loss": -22.60857582092285, "global_step": 114101, "epoch": 1374} {"train_loss": -22.348867416381836, "global_step": 114102, "epoch": 1374} {"train_loss": -22.094892501831055, "global_step": 114103, "epoch": 1374} {"train_loss": -22.576526641845703, "global_step": 114104, "epoch": 1374} {"train_loss": -22.571142196655273, "global_step": 114105, "epoch": 1374} {"train_loss": -22.484844207763672, "global_step": 114106, "epoch": 1374} {"train_loss": -22.220413208007812, "global_step": 114107, "epoch": 1374} {"train_loss": -22.38874626159668, "global_step": 114108, "epoch": 1374} {"train_loss": -22.298940658569336, "global_step": 114109, "epoch": 1374} {"train_loss": -22.67743492126465, "global_step": 114110, "epoch": 1374} {"train_loss": -22.50371742248535, "global_step": 114111, "epoch": 1374} {"train_loss": -22.1868896484375, "global_step": 114112, "epoch": 1374} {"train_loss": -22.215120315551758, "global_step": 114113, "epoch": 1374} {"train_loss": -22.378170013427734, "global_step": 114114, "epoch": 1374} {"train_loss": -22.462299346923828, "global_step": 114115, "epoch": 1374} {"train_loss": -22.09419822692871, "global_step": 114116, "epoch": 1374} {"train_loss": -22.51875877380371, "global_step": 114117, "epoch": 1374} {"train_loss": -22.569137573242188, "global_step": 114118, "epoch": 1374} {"train_loss": -22.20103645324707, "global_step": 114119, "epoch": 1374} {"train_loss": -22.17958641052246, "global_step": 114120, "epoch": 1374} {"train_loss": -22.415510177612305, "global_step": 114121, "epoch": 1374} {"train_loss": -22.345815658569336, "global_step": 114122, "epoch": 1374} {"train_loss": -22.60595703125, "global_step": 114123, "epoch": 1374} {"train_loss": -22.32966360988387, "global_step": 114124, "epoch": 1374, "val_loss": 6189435.0} {"train_loss": -22.00736427307129, "global_step": 114125, "epoch": 1375} {"train_loss": -22.252538681030273, "global_step": 114126, "epoch": 1375} {"train_loss": -21.811477661132812, "global_step": 114127, "epoch": 1375} {"train_loss": -22.121326446533203, "global_step": 114128, "epoch": 1375} {"train_loss": -22.323129653930664, "global_step": 114129, "epoch": 1375} {"train_loss": -22.637954711914062, "global_step": 114130, "epoch": 1375} {"train_loss": -22.125553131103516, "global_step": 114131, "epoch": 1375} {"train_loss": -22.442115783691406, "global_step": 114132, "epoch": 1375} {"train_loss": -22.36270523071289, "global_step": 114133, "epoch": 1375} {"train_loss": -22.39377784729004, "global_step": 114134, "epoch": 1375} {"train_loss": -22.510202407836914, "global_step": 114135, "epoch": 1375} {"train_loss": -22.265649795532227, "global_step": 114136, "epoch": 1375} {"train_loss": -22.704557418823242, "global_step": 114137, "epoch": 1375} {"train_loss": -22.169071197509766, "global_step": 114138, "epoch": 1375} {"train_loss": -22.271015167236328, "global_step": 114139, "epoch": 1375} {"train_loss": -22.463058471679688, "global_step": 114140, "epoch": 1375} {"train_loss": -22.25978660583496, "global_step": 114141, "epoch": 1375} {"train_loss": -22.66111946105957, "global_step": 114142, "epoch": 1375} {"train_loss": -21.926511764526367, "global_step": 114143, "epoch": 1375} {"train_loss": -22.154325485229492, "global_step": 114144, "epoch": 1375} {"train_loss": -22.21748924255371, "global_step": 114145, "epoch": 1375} {"train_loss": -22.04868507385254, "global_step": 114146, "epoch": 1375} {"train_loss": -22.676136016845703, "global_step": 114147, "epoch": 1375} {"train_loss": -22.281057357788086, "global_step": 114148, "epoch": 1375} {"train_loss": -22.333436965942383, "global_step": 114149, "epoch": 1375} {"train_loss": -22.622873306274414, "global_step": 114150, "epoch": 1375} {"train_loss": -21.848543167114258, "global_step": 114151, "epoch": 1375} {"train_loss": -22.366697311401367, "global_step": 114152, "epoch": 1375} {"train_loss": -22.39373779296875, "global_step": 114153, "epoch": 1375} {"train_loss": -21.91029930114746, "global_step": 114154, "epoch": 1375} {"train_loss": -22.116670608520508, "global_step": 114155, "epoch": 1375} {"train_loss": -22.936166763305664, "global_step": 114156, "epoch": 1375} {"train_loss": -22.50160026550293, "global_step": 114157, "epoch": 1375} {"train_loss": -22.5665225982666, "global_step": 114158, "epoch": 1375} {"train_loss": -22.83060646057129, "global_step": 114159, "epoch": 1375} {"train_loss": -22.232454299926758, "global_step": 114160, "epoch": 1375} {"train_loss": -22.528099060058594, "global_step": 114161, "epoch": 1375} {"train_loss": -22.463918685913086, "global_step": 114162, "epoch": 1375} {"train_loss": -22.611862182617188, "global_step": 114163, "epoch": 1375} {"train_loss": -22.220121383666992, "global_step": 114164, "epoch": 1375} {"train_loss": -22.41846466064453, "global_step": 114165, "epoch": 1375} {"train_loss": -22.47307777404785, "global_step": 114166, "epoch": 1375} {"train_loss": -22.239643096923828, "global_step": 114167, "epoch": 1375} {"train_loss": -22.204111099243164, "global_step": 114168, "epoch": 1375} {"train_loss": -21.982715606689453, "global_step": 114169, "epoch": 1375} {"train_loss": -22.3469295501709, "global_step": 114170, "epoch": 1375} {"train_loss": -22.531789779663086, "global_step": 114171, "epoch": 1375} {"train_loss": -22.41334342956543, "global_step": 114172, "epoch": 1375} {"train_loss": -22.491140365600586, "global_step": 114173, "epoch": 1375} {"train_loss": -22.15549659729004, "global_step": 114174, "epoch": 1375} {"train_loss": -22.141918182373047, "global_step": 114175, "epoch": 1375} {"train_loss": -22.02352523803711, "global_step": 114176, "epoch": 1375} {"train_loss": -22.34879493713379, "global_step": 114177, "epoch": 1375} {"train_loss": -22.474498748779297, "global_step": 114178, "epoch": 1375} {"train_loss": -22.120771408081055, "global_step": 114179, "epoch": 1375} {"train_loss": -22.312082290649414, "global_step": 114180, "epoch": 1375} {"train_loss": -22.393150329589844, "global_step": 114181, "epoch": 1375} {"train_loss": -22.2142391204834, "global_step": 114182, "epoch": 1375} {"train_loss": -22.310720443725586, "global_step": 114183, "epoch": 1375} {"train_loss": -22.219322204589844, "global_step": 114184, "epoch": 1375} {"train_loss": -22.032485961914062, "global_step": 114185, "epoch": 1375} {"train_loss": -22.47981834411621, "global_step": 114186, "epoch": 1375} {"train_loss": -22.14012908935547, "global_step": 114187, "epoch": 1375} {"train_loss": -22.208654403686523, "global_step": 114188, "epoch": 1375} {"train_loss": -22.540746688842773, "global_step": 114189, "epoch": 1375} {"train_loss": -22.236427307128906, "global_step": 114190, "epoch": 1375} {"train_loss": -22.232595443725586, "global_step": 114191, "epoch": 1375} {"train_loss": -22.298309326171875, "global_step": 114192, "epoch": 1375} {"train_loss": -22.232685089111328, "global_step": 114193, "epoch": 1375} {"train_loss": -22.202558517456055, "global_step": 114194, "epoch": 1375} {"train_loss": -22.071121215820312, "global_step": 114195, "epoch": 1375} {"train_loss": -22.255447387695312, "global_step": 114196, "epoch": 1375} {"train_loss": -22.148481369018555, "global_step": 114197, "epoch": 1375} {"train_loss": -22.70485496520996, "global_step": 114198, "epoch": 1375} {"train_loss": -22.065839767456055, "global_step": 114199, "epoch": 1375} {"train_loss": -22.2887020111084, "global_step": 114200, "epoch": 1375} {"train_loss": -22.174999237060547, "global_step": 114201, "epoch": 1375} {"train_loss": -22.312049865722656, "global_step": 114202, "epoch": 1375} {"train_loss": -22.259267807006836, "global_step": 114203, "epoch": 1375} {"train_loss": -22.373207092285156, "global_step": 114204, "epoch": 1375} {"train_loss": -22.473840713500977, "global_step": 114205, "epoch": 1375} {"train_loss": -22.497234344482422, "global_step": 114206, "epoch": 1375} {"train_loss": -22.31441794246076, "global_step": 114207, "epoch": 1375, "val_loss": 6140211.5} {"train_loss": -21.190937042236328, "global_step": 114208, "epoch": 1376} {"train_loss": -21.79136848449707, "global_step": 114209, "epoch": 1376} {"train_loss": -21.82537269592285, "global_step": 114210, "epoch": 1376} {"train_loss": -20.988792419433594, "global_step": 114211, "epoch": 1376} {"train_loss": -21.779674530029297, "global_step": 114212, "epoch": 1376} {"train_loss": -21.286869049072266, "global_step": 114213, "epoch": 1376} {"train_loss": -21.567184448242188, "global_step": 114214, "epoch": 1376} {"train_loss": -21.74827766418457, "global_step": 114215, "epoch": 1376} {"train_loss": -21.668176651000977, "global_step": 114216, "epoch": 1376} {"train_loss": -22.046560287475586, "global_step": 114217, "epoch": 1376} {"train_loss": -21.962934494018555, "global_step": 114218, "epoch": 1376} {"train_loss": -21.98325538635254, "global_step": 114219, "epoch": 1376} {"train_loss": -21.8950252532959, "global_step": 114220, "epoch": 1376} {"train_loss": -21.940677642822266, "global_step": 114221, "epoch": 1376} {"train_loss": -21.93543815612793, "global_step": 114222, "epoch": 1376} {"train_loss": -22.124521255493164, "global_step": 114223, "epoch": 1376} {"train_loss": -22.227622985839844, "global_step": 114224, "epoch": 1376} {"train_loss": -22.04206657409668, "global_step": 114225, "epoch": 1376} {"train_loss": -21.943937301635742, "global_step": 114226, "epoch": 1376} {"train_loss": -22.281370162963867, "global_step": 114227, "epoch": 1376} {"train_loss": -22.17417335510254, "global_step": 114228, "epoch": 1376} {"train_loss": -21.876007080078125, "global_step": 114229, "epoch": 1376} {"train_loss": -22.25432014465332, "global_step": 114230, "epoch": 1376} {"train_loss": -22.136709213256836, "global_step": 114231, "epoch": 1376} {"train_loss": -22.529996871948242, "global_step": 114232, "epoch": 1376} {"train_loss": -22.158422470092773, "global_step": 114233, "epoch": 1376} {"train_loss": -22.11182975769043, "global_step": 114234, "epoch": 1376} {"train_loss": -22.362295150756836, "global_step": 114235, "epoch": 1376} {"train_loss": -22.40297508239746, "global_step": 114236, "epoch": 1376} {"train_loss": -22.68060874938965, "global_step": 114237, "epoch": 1376} {"train_loss": -21.970579147338867, "global_step": 114238, "epoch": 1376} {"train_loss": -22.273191452026367, "global_step": 114239, "epoch": 1376} {"train_loss": -21.99531364440918, "global_step": 114240, "epoch": 1376} {"train_loss": -22.25784683227539, "global_step": 114241, "epoch": 1376} {"train_loss": -22.16335105895996, "global_step": 114242, "epoch": 1376} {"train_loss": -22.011728286743164, "global_step": 114243, "epoch": 1376} {"train_loss": -22.827533721923828, "global_step": 114244, "epoch": 1376} {"train_loss": -22.38663101196289, "global_step": 114245, "epoch": 1376} {"train_loss": -22.31717872619629, "global_step": 114246, "epoch": 1376} {"train_loss": -22.21932029724121, "global_step": 114247, "epoch": 1376} {"train_loss": -22.292707443237305, "global_step": 114248, "epoch": 1376} {"train_loss": -22.07081413269043, "global_step": 114249, "epoch": 1376} {"train_loss": -22.347143173217773, "global_step": 114250, "epoch": 1376} {"train_loss": -22.335912704467773, "global_step": 114251, "epoch": 1376} {"train_loss": -21.96750831604004, "global_step": 114252, "epoch": 1376} {"train_loss": -21.690250396728516, "global_step": 114253, "epoch": 1376} {"train_loss": -22.566513061523438, "global_step": 114254, "epoch": 1376} {"train_loss": -22.202762603759766, "global_step": 114255, "epoch": 1376} {"train_loss": -22.606773376464844, "global_step": 114256, "epoch": 1376} {"train_loss": -22.272130966186523, "global_step": 114257, "epoch": 1376} {"train_loss": -22.29288101196289, "global_step": 114258, "epoch": 1376} {"train_loss": -22.175676345825195, "global_step": 114259, "epoch": 1376} {"train_loss": -22.336627960205078, "global_step": 114260, "epoch": 1376} {"train_loss": -22.355939865112305, "global_step": 114261, "epoch": 1376} {"train_loss": -22.253787994384766, "global_step": 114262, "epoch": 1376} {"train_loss": -22.279773712158203, "global_step": 114263, "epoch": 1376} {"train_loss": -22.61949920654297, "global_step": 114264, "epoch": 1376} {"train_loss": -22.648090362548828, "global_step": 114265, "epoch": 1376} {"train_loss": -22.19599723815918, "global_step": 114266, "epoch": 1376} {"train_loss": -22.123384475708008, "global_step": 114267, "epoch": 1376} {"train_loss": -22.304798126220703, "global_step": 114268, "epoch": 1376} {"train_loss": -22.47049331665039, "global_step": 114269, "epoch": 1376} {"train_loss": -22.402502059936523, "global_step": 114270, "epoch": 1376} {"train_loss": -22.404037475585938, "global_step": 114271, "epoch": 1376} {"train_loss": -22.178131103515625, "global_step": 114272, "epoch": 1376} {"train_loss": -22.391698837280273, "global_step": 114273, "epoch": 1376} {"train_loss": -22.445249557495117, "global_step": 114274, "epoch": 1376} {"train_loss": -22.52383804321289, "global_step": 114275, "epoch": 1376} {"train_loss": -22.802379608154297, "global_step": 114276, "epoch": 1376} {"train_loss": -22.511289596557617, "global_step": 114277, "epoch": 1376} {"train_loss": -22.436908721923828, "global_step": 114278, "epoch": 1376} {"train_loss": -22.160404205322266, "global_step": 114279, "epoch": 1376} {"train_loss": -22.26497459411621, "global_step": 114280, "epoch": 1376} {"train_loss": -22.113248825073242, "global_step": 114281, "epoch": 1376} {"train_loss": -22.435909271240234, "global_step": 114282, "epoch": 1376} {"train_loss": -22.69972038269043, "global_step": 114283, "epoch": 1376} {"train_loss": -22.15052604675293, "global_step": 114284, "epoch": 1376} {"train_loss": -22.617883682250977, "global_step": 114285, "epoch": 1376} {"train_loss": -22.747222900390625, "global_step": 114286, "epoch": 1376} {"train_loss": -22.737075805664062, "global_step": 114287, "epoch": 1376} {"train_loss": -22.272375106811523, "global_step": 114288, "epoch": 1376} {"train_loss": -22.563156127929688, "global_step": 114289, "epoch": 1376} {"train_loss": -22.198210543896778, "global_step": 114290, "epoch": 1376, "val_loss": 6228174.0} {"train_loss": -22.213424682617188, "global_step": 114291, "epoch": 1377} {"train_loss": -22.176660537719727, "global_step": 114292, "epoch": 1377} {"train_loss": -21.906755447387695, "global_step": 114293, "epoch": 1377} {"train_loss": -22.353879928588867, "global_step": 114294, "epoch": 1377} {"train_loss": -22.303939819335938, "global_step": 114295, "epoch": 1377} {"train_loss": -21.897939682006836, "global_step": 114296, "epoch": 1377} {"train_loss": -22.333051681518555, "global_step": 114297, "epoch": 1377} {"train_loss": -22.18051528930664, "global_step": 114298, "epoch": 1377} {"train_loss": -22.277374267578125, "global_step": 114299, "epoch": 1377} {"train_loss": -22.491071701049805, "global_step": 114300, "epoch": 1377} {"train_loss": -22.48215675354004, "global_step": 114301, "epoch": 1377} {"train_loss": -22.106069564819336, "global_step": 114302, "epoch": 1377} {"train_loss": -22.447357177734375, "global_step": 114303, "epoch": 1377} {"train_loss": -22.01068115234375, "global_step": 114304, "epoch": 1377} {"train_loss": -22.233835220336914, "global_step": 114305, "epoch": 1377} {"train_loss": -22.054574966430664, "global_step": 114306, "epoch": 1377} {"train_loss": -22.160045623779297, "global_step": 114307, "epoch": 1377} {"train_loss": -22.430606842041016, "global_step": 114308, "epoch": 1377} {"train_loss": -22.41107177734375, "global_step": 114309, "epoch": 1377} {"train_loss": -22.21042823791504, "global_step": 114310, "epoch": 1377} {"train_loss": -21.779991149902344, "global_step": 114311, "epoch": 1377} {"train_loss": -22.32285499572754, "global_step": 114312, "epoch": 1377} {"train_loss": -21.766910552978516, "global_step": 114313, "epoch": 1377} {"train_loss": -22.134252548217773, "global_step": 114314, "epoch": 1377} {"train_loss": -22.258636474609375, "global_step": 114315, "epoch": 1377} {"train_loss": -22.25432014465332, "global_step": 114316, "epoch": 1377} {"train_loss": -22.334115982055664, "global_step": 114317, "epoch": 1377} {"train_loss": -22.36655616760254, "global_step": 114318, "epoch": 1377} {"train_loss": -22.409395217895508, "global_step": 114319, "epoch": 1377} {"train_loss": -22.14089012145996, "global_step": 114320, "epoch": 1377} {"train_loss": -22.38907241821289, "global_step": 114321, "epoch": 1377} {"train_loss": -22.749746322631836, "global_step": 114322, "epoch": 1377} {"train_loss": -22.349750518798828, "global_step": 114323, "epoch": 1377} {"train_loss": -22.40157127380371, "global_step": 114324, "epoch": 1377} {"train_loss": -22.38730239868164, "global_step": 114325, "epoch": 1377} {"train_loss": -22.346328735351562, "global_step": 114326, "epoch": 1377} {"train_loss": -22.643964767456055, "global_step": 114327, "epoch": 1377} {"train_loss": -22.32131004333496, "global_step": 114328, "epoch": 1377} {"train_loss": -22.609189987182617, "global_step": 114329, "epoch": 1377} {"train_loss": -22.636825561523438, "global_step": 114330, "epoch": 1377} {"train_loss": -22.637521743774414, "global_step": 114331, "epoch": 1377} {"train_loss": -22.3723087310791, "global_step": 114332, "epoch": 1377} {"train_loss": -22.472640991210938, "global_step": 114333, "epoch": 1377} {"train_loss": -22.424875259399414, "global_step": 114334, "epoch": 1377} {"train_loss": -22.507715225219727, "global_step": 114335, "epoch": 1377} {"train_loss": -22.16071891784668, "global_step": 114336, "epoch": 1377} {"train_loss": -22.38972282409668, "global_step": 114337, "epoch": 1377} {"train_loss": -22.338863372802734, "global_step": 114338, "epoch": 1377} {"train_loss": -22.48670768737793, "global_step": 114339, "epoch": 1377} {"train_loss": -22.400293350219727, "global_step": 114340, "epoch": 1377} {"train_loss": -22.484949111938477, "global_step": 114341, "epoch": 1377} {"train_loss": -22.641569137573242, "global_step": 114342, "epoch": 1377} {"train_loss": -22.216110229492188, "global_step": 114343, "epoch": 1377} {"train_loss": -22.406736373901367, "global_step": 114344, "epoch": 1377} {"train_loss": -22.943655014038086, "global_step": 114345, "epoch": 1377} {"train_loss": -22.634191513061523, "global_step": 114346, "epoch": 1377} {"train_loss": -22.316452026367188, "global_step": 114347, "epoch": 1377} {"train_loss": -22.21544075012207, "global_step": 114348, "epoch": 1377} {"train_loss": -22.44731330871582, "global_step": 114349, "epoch": 1377} {"train_loss": -22.530942916870117, "global_step": 114350, "epoch": 1377} {"train_loss": -22.471349716186523, "global_step": 114351, "epoch": 1377} {"train_loss": -21.987241744995117, "global_step": 114352, "epoch": 1377} {"train_loss": -22.658493041992188, "global_step": 114353, "epoch": 1377} {"train_loss": -22.545917510986328, "global_step": 114354, "epoch": 1377} {"train_loss": -22.702939987182617, "global_step": 114355, "epoch": 1377} {"train_loss": -22.45587730407715, "global_step": 114356, "epoch": 1377} {"train_loss": -22.37322425842285, "global_step": 114357, "epoch": 1377} {"train_loss": -22.282773971557617, "global_step": 114358, "epoch": 1377} {"train_loss": -22.26480484008789, "global_step": 114359, "epoch": 1377} {"train_loss": -22.533733367919922, "global_step": 114360, "epoch": 1377} {"train_loss": -22.043563842773438, "global_step": 114361, "epoch": 1377} {"train_loss": -21.977201461791992, "global_step": 114362, "epoch": 1377} {"train_loss": -22.594568252563477, "global_step": 114363, "epoch": 1377} {"train_loss": -22.33224868774414, "global_step": 114364, "epoch": 1377} {"train_loss": -22.519071578979492, "global_step": 114365, "epoch": 1377} {"train_loss": -22.386966705322266, "global_step": 114366, "epoch": 1377} {"train_loss": -22.471670150756836, "global_step": 114367, "epoch": 1377} {"train_loss": -22.441465377807617, "global_step": 114368, "epoch": 1377} {"train_loss": -22.649145126342773, "global_step": 114369, "epoch": 1377} {"train_loss": -22.29621696472168, "global_step": 114370, "epoch": 1377} {"train_loss": -22.500272750854492, "global_step": 114371, "epoch": 1377} {"train_loss": -22.299924850463867, "global_step": 114372, "epoch": 1377} {"train_loss": -22.345463189734033, "global_step": 114373, "epoch": 1377, "val_loss": 6223526.0} {"train_loss": -22.337858200073242, "global_step": 114374, "epoch": 1378} {"train_loss": -21.902523040771484, "global_step": 114375, "epoch": 1378} {"train_loss": -22.175642013549805, "global_step": 114376, "epoch": 1378} {"train_loss": -22.42701530456543, "global_step": 114377, "epoch": 1378} {"train_loss": -22.41704750061035, "global_step": 114378, "epoch": 1378} {"train_loss": -22.62417984008789, "global_step": 114379, "epoch": 1378} {"train_loss": -22.281217575073242, "global_step": 114380, "epoch": 1378} {"train_loss": -22.342214584350586, "global_step": 114381, "epoch": 1378} {"train_loss": -21.908979415893555, "global_step": 114382, "epoch": 1378} {"train_loss": -22.544973373413086, "global_step": 114383, "epoch": 1378} {"train_loss": -22.29265785217285, "global_step": 114384, "epoch": 1378} {"train_loss": -22.11184310913086, "global_step": 114385, "epoch": 1378} {"train_loss": -22.140592575073242, "global_step": 114386, "epoch": 1378} {"train_loss": -22.223852157592773, "global_step": 114387, "epoch": 1378} {"train_loss": -22.20111083984375, "global_step": 114388, "epoch": 1378} {"train_loss": -22.374265670776367, "global_step": 114389, "epoch": 1378} {"train_loss": -22.252843856811523, "global_step": 114390, "epoch": 1378} {"train_loss": -22.251306533813477, "global_step": 114391, "epoch": 1378} {"train_loss": -22.174762725830078, "global_step": 114392, "epoch": 1378} {"train_loss": -22.637418746948242, "global_step": 114393, "epoch": 1378} {"train_loss": -22.091079711914062, "global_step": 114394, "epoch": 1378} {"train_loss": -22.36347770690918, "global_step": 114395, "epoch": 1378} {"train_loss": -22.47834587097168, "global_step": 114396, "epoch": 1378} {"train_loss": -22.337560653686523, "global_step": 114397, "epoch": 1378} {"train_loss": -22.4123592376709, "global_step": 114398, "epoch": 1378} {"train_loss": -22.453428268432617, "global_step": 114399, "epoch": 1378} {"train_loss": -22.37702751159668, "global_step": 114400, "epoch": 1378} {"train_loss": -21.939382553100586, "global_step": 114401, "epoch": 1378} {"train_loss": -22.36515235900879, "global_step": 114402, "epoch": 1378} {"train_loss": -22.240262985229492, "global_step": 114403, "epoch": 1378} {"train_loss": -22.353418350219727, "global_step": 114404, "epoch": 1378} {"train_loss": -22.391399383544922, "global_step": 114405, "epoch": 1378} {"train_loss": -22.219669342041016, "global_step": 114406, "epoch": 1378} {"train_loss": -22.444761276245117, "global_step": 114407, "epoch": 1378} {"train_loss": -22.328519821166992, "global_step": 114408, "epoch": 1378} {"train_loss": -22.517053604125977, "global_step": 114409, "epoch": 1378} {"train_loss": -22.681365966796875, "global_step": 114410, "epoch": 1378} {"train_loss": -22.24086570739746, "global_step": 114411, "epoch": 1378} {"train_loss": -22.5394287109375, "global_step": 114412, "epoch": 1378} {"train_loss": -22.17388916015625, "global_step": 114413, "epoch": 1378} {"train_loss": -22.857107162475586, "global_step": 114414, "epoch": 1378} {"train_loss": -22.666671752929688, "global_step": 114415, "epoch": 1378} {"train_loss": -22.084020614624023, "global_step": 114416, "epoch": 1378} {"train_loss": -22.551111221313477, "global_step": 114417, "epoch": 1378} {"train_loss": -22.271154403686523, "global_step": 114418, "epoch": 1378} {"train_loss": -22.52902603149414, "global_step": 114419, "epoch": 1378} {"train_loss": -22.216909408569336, "global_step": 114420, "epoch": 1378} {"train_loss": -22.621164321899414, "global_step": 114421, "epoch": 1378} {"train_loss": -22.368091583251953, "global_step": 114422, "epoch": 1378} {"train_loss": -22.44122886657715, "global_step": 114423, "epoch": 1378} {"train_loss": -21.97538185119629, "global_step": 114424, "epoch": 1378} {"train_loss": -22.351577758789062, "global_step": 114425, "epoch": 1378} {"train_loss": -22.27056121826172, "global_step": 114426, "epoch": 1378} {"train_loss": -22.260690689086914, "global_step": 114427, "epoch": 1378} {"train_loss": -22.0539493560791, "global_step": 114428, "epoch": 1378} {"train_loss": -22.191726684570312, "global_step": 114429, "epoch": 1378} {"train_loss": -22.666778564453125, "global_step": 114430, "epoch": 1378} {"train_loss": -22.2853946685791, "global_step": 114431, "epoch": 1378} {"train_loss": -21.80173683166504, "global_step": 114432, "epoch": 1378} {"train_loss": -22.115732192993164, "global_step": 114433, "epoch": 1378} {"train_loss": -22.25654411315918, "global_step": 114434, "epoch": 1378} {"train_loss": -22.211339950561523, "global_step": 114435, "epoch": 1378} {"train_loss": -22.297988891601562, "global_step": 114436, "epoch": 1378} {"train_loss": -22.054994583129883, "global_step": 114437, "epoch": 1378} {"train_loss": -22.76852798461914, "global_step": 114438, "epoch": 1378} {"train_loss": -22.478946685791016, "global_step": 114439, "epoch": 1378} {"train_loss": -21.933032989501953, "global_step": 114440, "epoch": 1378} {"train_loss": -22.080699920654297, "global_step": 114441, "epoch": 1378} {"train_loss": -21.915922164916992, "global_step": 114442, "epoch": 1378} {"train_loss": -22.201501846313477, "global_step": 114443, "epoch": 1378} {"train_loss": -22.45033073425293, "global_step": 114444, "epoch": 1378} {"train_loss": -22.747020721435547, "global_step": 114445, "epoch": 1378} {"train_loss": -22.3609561920166, "global_step": 114446, "epoch": 1378} {"train_loss": -22.303529739379883, "global_step": 114447, "epoch": 1378} {"train_loss": -22.526611328125, "global_step": 114448, "epoch": 1378} {"train_loss": -22.299373626708984, "global_step": 114449, "epoch": 1378} {"train_loss": -22.00278091430664, "global_step": 114450, "epoch": 1378} {"train_loss": -21.737932205200195, "global_step": 114451, "epoch": 1378} {"train_loss": -22.22149658203125, "global_step": 114452, "epoch": 1378} {"train_loss": -22.500707626342773, "global_step": 114453, "epoch": 1378} {"train_loss": -22.3624324798584, "global_step": 114454, "epoch": 1378} {"train_loss": -22.277080535888672, "global_step": 114455, "epoch": 1378} {"train_loss": -22.311446201370423, "global_step": 114456, "epoch": 1378, "val_loss": 6201999.5} {"train_loss": -21.487045288085938, "global_step": 114457, "epoch": 1379} {"train_loss": -22.204225540161133, "global_step": 114458, "epoch": 1379} {"train_loss": -21.98541831970215, "global_step": 114459, "epoch": 1379} {"train_loss": -21.67911720275879, "global_step": 114460, "epoch": 1379} {"train_loss": -22.024229049682617, "global_step": 114461, "epoch": 1379} {"train_loss": -21.93208885192871, "global_step": 114462, "epoch": 1379} {"train_loss": -22.209928512573242, "global_step": 114463, "epoch": 1379} {"train_loss": -22.225435256958008, "global_step": 114464, "epoch": 1379} {"train_loss": -22.42083740234375, "global_step": 114465, "epoch": 1379} {"train_loss": -22.264968872070312, "global_step": 114466, "epoch": 1379} {"train_loss": -21.78656578063965, "global_step": 114467, "epoch": 1379} {"train_loss": -22.10577392578125, "global_step": 114468, "epoch": 1379} {"train_loss": -22.071435928344727, "global_step": 114469, "epoch": 1379} {"train_loss": -22.35609245300293, "global_step": 114470, "epoch": 1379} {"train_loss": -21.749677658081055, "global_step": 114471, "epoch": 1379} {"train_loss": -22.231658935546875, "global_step": 114472, "epoch": 1379} {"train_loss": -22.299970626831055, "global_step": 114473, "epoch": 1379} {"train_loss": -22.079439163208008, "global_step": 114474, "epoch": 1379} {"train_loss": -22.51189422607422, "global_step": 114475, "epoch": 1379} {"train_loss": -22.103605270385742, "global_step": 114476, "epoch": 1379} {"train_loss": -22.590778350830078, "global_step": 114477, "epoch": 1379} {"train_loss": -21.88838768005371, "global_step": 114478, "epoch": 1379} {"train_loss": -22.34842300415039, "global_step": 114479, "epoch": 1379} {"train_loss": -22.553804397583008, "global_step": 114480, "epoch": 1379} {"train_loss": -22.464380264282227, "global_step": 114481, "epoch": 1379} {"train_loss": -22.482885360717773, "global_step": 114482, "epoch": 1379} {"train_loss": -22.744997024536133, "global_step": 114483, "epoch": 1379} {"train_loss": -22.157384872436523, "global_step": 114484, "epoch": 1379} {"train_loss": -22.57745933532715, "global_step": 114485, "epoch": 1379} {"train_loss": -22.328275680541992, "global_step": 114486, "epoch": 1379} {"train_loss": -22.362899780273438, "global_step": 114487, "epoch": 1379} {"train_loss": -21.819135665893555, "global_step": 114488, "epoch": 1379} {"train_loss": -22.354412078857422, "global_step": 114489, "epoch": 1379} {"train_loss": -22.093576431274414, "global_step": 114490, "epoch": 1379} {"train_loss": -22.21723747253418, "global_step": 114491, "epoch": 1379} {"train_loss": -22.34372329711914, "global_step": 114492, "epoch": 1379} {"train_loss": -22.489471435546875, "global_step": 114493, "epoch": 1379} {"train_loss": -22.218494415283203, "global_step": 114494, "epoch": 1379} {"train_loss": -22.34133529663086, "global_step": 114495, "epoch": 1379} {"train_loss": -22.236242294311523, "global_step": 114496, "epoch": 1379} {"train_loss": -22.148462295532227, "global_step": 114497, "epoch": 1379} {"train_loss": -22.079866409301758, "global_step": 114498, "epoch": 1379} {"train_loss": -22.270116806030273, "global_step": 114499, "epoch": 1379} {"train_loss": -22.560707092285156, "global_step": 114500, "epoch": 1379} {"train_loss": -22.538312911987305, "global_step": 114501, "epoch": 1379} {"train_loss": -22.48443603515625, "global_step": 114502, "epoch": 1379} {"train_loss": -22.294586181640625, "global_step": 114503, "epoch": 1379} {"train_loss": -22.403724670410156, "global_step": 114504, "epoch": 1379} {"train_loss": -22.347517013549805, "global_step": 114505, "epoch": 1379} {"train_loss": -22.452558517456055, "global_step": 114506, "epoch": 1379} {"train_loss": -22.172021865844727, "global_step": 114507, "epoch": 1379} {"train_loss": -22.18317413330078, "global_step": 114508, "epoch": 1379} {"train_loss": -22.508712768554688, "global_step": 114509, "epoch": 1379} {"train_loss": -22.36317253112793, "global_step": 114510, "epoch": 1379} {"train_loss": -22.577136993408203, "global_step": 114511, "epoch": 1379} {"train_loss": -22.23701286315918, "global_step": 114512, "epoch": 1379} {"train_loss": -22.172353744506836, "global_step": 114513, "epoch": 1379} {"train_loss": -22.36954116821289, "global_step": 114514, "epoch": 1379} {"train_loss": -22.427366256713867, "global_step": 114515, "epoch": 1379} {"train_loss": -22.279102325439453, "global_step": 114516, "epoch": 1379} {"train_loss": -22.304203033447266, "global_step": 114517, "epoch": 1379} {"train_loss": -22.37689971923828, "global_step": 114518, "epoch": 1379} {"train_loss": -22.25726890563965, "global_step": 114519, "epoch": 1379} {"train_loss": -22.60048484802246, "global_step": 114520, "epoch": 1379} {"train_loss": -22.234325408935547, "global_step": 114521, "epoch": 1379} {"train_loss": -22.656835556030273, "global_step": 114522, "epoch": 1379} {"train_loss": -22.334312438964844, "global_step": 114523, "epoch": 1379} {"train_loss": -22.519058227539062, "global_step": 114524, "epoch": 1379} {"train_loss": -22.271583557128906, "global_step": 114525, "epoch": 1379} {"train_loss": -21.933927536010742, "global_step": 114526, "epoch": 1379} {"train_loss": -22.403154373168945, "global_step": 114527, "epoch": 1379} {"train_loss": -22.508291244506836, "global_step": 114528, "epoch": 1379} {"train_loss": -22.376859664916992, "global_step": 114529, "epoch": 1379} {"train_loss": -22.231552124023438, "global_step": 114530, "epoch": 1379} {"train_loss": -22.550312042236328, "global_step": 114531, "epoch": 1379} {"train_loss": -22.750202178955078, "global_step": 114532, "epoch": 1379} {"train_loss": -22.223255157470703, "global_step": 114533, "epoch": 1379} {"train_loss": -22.188867568969727, "global_step": 114534, "epoch": 1379} {"train_loss": -22.200836181640625, "global_step": 114535, "epoch": 1379} {"train_loss": -22.380077362060547, "global_step": 114536, "epoch": 1379} {"train_loss": -22.533740997314453, "global_step": 114537, "epoch": 1379} {"train_loss": -22.277578353881836, "global_step": 114538, "epoch": 1379} {"train_loss": -22.280275988291546, "global_step": 114539, "epoch": 1379, "val_loss": 6171454.5} {"train_loss": -22.31793212890625, "global_step": 114540, "epoch": 1380} {"train_loss": -21.919998168945312, "global_step": 114541, "epoch": 1380} {"train_loss": -22.383609771728516, "global_step": 114542, "epoch": 1380} {"train_loss": -22.34299659729004, "global_step": 114543, "epoch": 1380} {"train_loss": -22.262592315673828, "global_step": 114544, "epoch": 1380} {"train_loss": -22.036008834838867, "global_step": 114545, "epoch": 1380} {"train_loss": -22.65251922607422, "global_step": 114546, "epoch": 1380} {"train_loss": -22.615983963012695, "global_step": 114547, "epoch": 1380} {"train_loss": -22.57878303527832, "global_step": 114548, "epoch": 1380} {"train_loss": -22.37563133239746, "global_step": 114549, "epoch": 1380} {"train_loss": -22.354352951049805, "global_step": 114550, "epoch": 1380} {"train_loss": -22.218244552612305, "global_step": 114551, "epoch": 1380} {"train_loss": -22.12598991394043, "global_step": 114552, "epoch": 1380} {"train_loss": -22.380481719970703, "global_step": 114553, "epoch": 1380} {"train_loss": -22.40191078186035, "global_step": 114554, "epoch": 1380} {"train_loss": -22.089252471923828, "global_step": 114555, "epoch": 1380} {"train_loss": -22.20184898376465, "global_step": 114556, "epoch": 1380} {"train_loss": -22.378602981567383, "global_step": 114557, "epoch": 1380} {"train_loss": -22.494497299194336, "global_step": 114558, "epoch": 1380} {"train_loss": -22.100204467773438, "global_step": 114559, "epoch": 1380} {"train_loss": -22.58342933654785, "global_step": 114560, "epoch": 1380} {"train_loss": -22.224679946899414, "global_step": 114561, "epoch": 1380} {"train_loss": -22.4830265045166, "global_step": 114562, "epoch": 1380} {"train_loss": -22.093063354492188, "global_step": 114563, "epoch": 1380} {"train_loss": -22.501543045043945, "global_step": 114564, "epoch": 1380} {"train_loss": -22.566572189331055, "global_step": 114565, "epoch": 1380} {"train_loss": -22.27159881591797, "global_step": 114566, "epoch": 1380} {"train_loss": -22.291351318359375, "global_step": 114567, "epoch": 1380} {"train_loss": -22.175870895385742, "global_step": 114568, "epoch": 1380} {"train_loss": -22.417638778686523, "global_step": 114569, "epoch": 1380} {"train_loss": -22.4237117767334, "global_step": 114570, "epoch": 1380} {"train_loss": -22.102781295776367, "global_step": 114571, "epoch": 1380} {"train_loss": -22.328325271606445, "global_step": 114572, "epoch": 1380} {"train_loss": -22.215682983398438, "global_step": 114573, "epoch": 1380} {"train_loss": -22.532804489135742, "global_step": 114574, "epoch": 1380} {"train_loss": -22.4874267578125, "global_step": 114575, "epoch": 1380} {"train_loss": -22.07736587524414, "global_step": 114576, "epoch": 1380} {"train_loss": -22.24827766418457, "global_step": 114577, "epoch": 1380} {"train_loss": -22.368051528930664, "global_step": 114578, "epoch": 1380} {"train_loss": -22.677820205688477, "global_step": 114579, "epoch": 1380} {"train_loss": -22.621564865112305, "global_step": 114580, "epoch": 1380} {"train_loss": -22.479469299316406, "global_step": 114581, "epoch": 1380} {"train_loss": -22.438278198242188, "global_step": 114582, "epoch": 1380} {"train_loss": -22.60365104675293, "global_step": 114583, "epoch": 1380} {"train_loss": -22.818899154663086, "global_step": 114584, "epoch": 1380} {"train_loss": -22.204191207885742, "global_step": 114585, "epoch": 1380} {"train_loss": -22.45966911315918, "global_step": 114586, "epoch": 1380} {"train_loss": -22.544340133666992, "global_step": 114587, "epoch": 1380} {"train_loss": -22.849679946899414, "global_step": 114588, "epoch": 1380} {"train_loss": -22.331079483032227, "global_step": 114589, "epoch": 1380} {"train_loss": -22.50830078125, "global_step": 114590, "epoch": 1380} {"train_loss": -22.840606689453125, "global_step": 114591, "epoch": 1380} {"train_loss": -22.462329864501953, "global_step": 114592, "epoch": 1380} {"train_loss": -22.58477210998535, "global_step": 114593, "epoch": 1380} {"train_loss": -22.409902572631836, "global_step": 114594, "epoch": 1380} {"train_loss": -22.35711669921875, "global_step": 114595, "epoch": 1380} {"train_loss": -21.919519424438477, "global_step": 114596, "epoch": 1380} {"train_loss": -22.56320571899414, "global_step": 114597, "epoch": 1380} {"train_loss": -22.1569881439209, "global_step": 114598, "epoch": 1380} {"train_loss": -21.95009422302246, "global_step": 114599, "epoch": 1380} {"train_loss": -21.757314682006836, "global_step": 114600, "epoch": 1380} {"train_loss": -21.969532012939453, "global_step": 114601, "epoch": 1380} {"train_loss": -22.232540130615234, "global_step": 114602, "epoch": 1380} {"train_loss": -22.369935989379883, "global_step": 114603, "epoch": 1380} {"train_loss": -22.10622215270996, "global_step": 114604, "epoch": 1380} {"train_loss": -22.604284286499023, "global_step": 114605, "epoch": 1380} {"train_loss": -21.9969425201416, "global_step": 114606, "epoch": 1380} {"train_loss": -22.271160125732422, "global_step": 114607, "epoch": 1380} {"train_loss": -22.4334659576416, "global_step": 114608, "epoch": 1380} {"train_loss": -22.568601608276367, "global_step": 114609, "epoch": 1380} {"train_loss": -22.355863571166992, "global_step": 114610, "epoch": 1380} {"train_loss": -22.020559310913086, "global_step": 114611, "epoch": 1380} {"train_loss": -22.491657257080078, "global_step": 114612, "epoch": 1380} {"train_loss": -22.59710693359375, "global_step": 114613, "epoch": 1380} {"train_loss": -22.40542221069336, "global_step": 114614, "epoch": 1380} {"train_loss": -22.78868865966797, "global_step": 114615, "epoch": 1380} {"train_loss": -22.249929428100586, "global_step": 114616, "epoch": 1380} {"train_loss": -22.74273109436035, "global_step": 114617, "epoch": 1380} {"train_loss": -22.521608352661133, "global_step": 114618, "epoch": 1380} {"train_loss": -22.020523071289062, "global_step": 114619, "epoch": 1380} {"train_loss": -22.65285301208496, "global_step": 114620, "epoch": 1380} {"train_loss": -22.580801010131836, "global_step": 114621, "epoch": 1380} {"train_loss": -22.375686990209374, "global_step": 114622, "epoch": 1380, "val_loss": 6077087.0} {"train_loss": -22.193716049194336, "global_step": 114623, "epoch": 1381} {"train_loss": -22.06593132019043, "global_step": 114624, "epoch": 1381} {"train_loss": -22.490737915039062, "global_step": 114625, "epoch": 1381} {"train_loss": -22.315750122070312, "global_step": 114626, "epoch": 1381} {"train_loss": -22.3464298248291, "global_step": 114627, "epoch": 1381} {"train_loss": -22.369373321533203, "global_step": 114628, "epoch": 1381} {"train_loss": -22.337757110595703, "global_step": 114629, "epoch": 1381} {"train_loss": -22.095458984375, "global_step": 114630, "epoch": 1381} {"train_loss": -22.668838500976562, "global_step": 114631, "epoch": 1381} {"train_loss": -22.245149612426758, "global_step": 114632, "epoch": 1381} {"train_loss": -22.673139572143555, "global_step": 114633, "epoch": 1381} {"train_loss": -21.980091094970703, "global_step": 114634, "epoch": 1381} {"train_loss": -22.390899658203125, "global_step": 114635, "epoch": 1381} {"train_loss": -22.182844161987305, "global_step": 114636, "epoch": 1381} {"train_loss": -22.139692306518555, "global_step": 114637, "epoch": 1381} {"train_loss": -22.40150260925293, "global_step": 114638, "epoch": 1381} {"train_loss": -22.291929244995117, "global_step": 114639, "epoch": 1381} {"train_loss": -22.351346969604492, "global_step": 114640, "epoch": 1381} {"train_loss": -21.99053382873535, "global_step": 114641, "epoch": 1381} {"train_loss": -22.233169555664062, "global_step": 114642, "epoch": 1381} {"train_loss": -22.31900405883789, "global_step": 114643, "epoch": 1381} {"train_loss": -22.445737838745117, "global_step": 114644, "epoch": 1381} {"train_loss": -22.39413833618164, "global_step": 114645, "epoch": 1381} {"train_loss": -22.39830780029297, "global_step": 114646, "epoch": 1381} {"train_loss": -22.47090721130371, "global_step": 114647, "epoch": 1381} {"train_loss": -22.58620834350586, "global_step": 114648, "epoch": 1381} {"train_loss": -22.5592098236084, "global_step": 114649, "epoch": 1381} {"train_loss": -22.467355728149414, "global_step": 114650, "epoch": 1381} {"train_loss": -22.3846435546875, "global_step": 114651, "epoch": 1381} {"train_loss": -22.34918212890625, "global_step": 114652, "epoch": 1381} {"train_loss": -22.678556442260742, "global_step": 114653, "epoch": 1381} {"train_loss": -22.441612243652344, "global_step": 114654, "epoch": 1381} {"train_loss": -22.17998504638672, "global_step": 114655, "epoch": 1381} {"train_loss": -22.478429794311523, "global_step": 114656, "epoch": 1381} {"train_loss": -22.397380828857422, "global_step": 114657, "epoch": 1381} {"train_loss": -22.510650634765625, "global_step": 114658, "epoch": 1381} {"train_loss": -22.19635581970215, "global_step": 114659, "epoch": 1381} {"train_loss": -22.459991455078125, "global_step": 114660, "epoch": 1381} {"train_loss": -22.376771926879883, "global_step": 114661, "epoch": 1381} {"train_loss": -22.410572052001953, "global_step": 114662, "epoch": 1381} {"train_loss": -22.27284049987793, "global_step": 114663, "epoch": 1381} {"train_loss": -22.82840347290039, "global_step": 114664, "epoch": 1381} {"train_loss": -22.27393913269043, "global_step": 114665, "epoch": 1381} {"train_loss": -22.086294174194336, "global_step": 114666, "epoch": 1381} {"train_loss": -21.897357940673828, "global_step": 114667, "epoch": 1381} {"train_loss": -22.380842208862305, "global_step": 114668, "epoch": 1381} {"train_loss": -22.325592041015625, "global_step": 114669, "epoch": 1381} {"train_loss": -22.36336326599121, "global_step": 114670, "epoch": 1381} {"train_loss": -22.409305572509766, "global_step": 114671, "epoch": 1381} {"train_loss": -22.932392120361328, "global_step": 114672, "epoch": 1381} {"train_loss": -22.28182029724121, "global_step": 114673, "epoch": 1381} {"train_loss": -22.155200958251953, "global_step": 114674, "epoch": 1381} {"train_loss": -22.444808959960938, "global_step": 114675, "epoch": 1381} {"train_loss": -22.51905632019043, "global_step": 114676, "epoch": 1381} {"train_loss": -22.272085189819336, "global_step": 114677, "epoch": 1381} {"train_loss": -22.258453369140625, "global_step": 114678, "epoch": 1381} {"train_loss": -22.75058364868164, "global_step": 114679, "epoch": 1381} {"train_loss": -22.39112091064453, "global_step": 114680, "epoch": 1381} {"train_loss": -22.520788192749023, "global_step": 114681, "epoch": 1381} {"train_loss": -22.762929916381836, "global_step": 114682, "epoch": 1381} {"train_loss": -22.20271110534668, "global_step": 114683, "epoch": 1381} {"train_loss": -21.860361099243164, "global_step": 114684, "epoch": 1381} {"train_loss": -22.26978874206543, "global_step": 114685, "epoch": 1381} {"train_loss": -22.341434478759766, "global_step": 114686, "epoch": 1381} {"train_loss": -22.00874900817871, "global_step": 114687, "epoch": 1381} {"train_loss": -22.133182525634766, "global_step": 114688, "epoch": 1381} {"train_loss": -22.235605239868164, "global_step": 114689, "epoch": 1381} {"train_loss": -22.227540969848633, "global_step": 114690, "epoch": 1381} {"train_loss": -22.79780387878418, "global_step": 114691, "epoch": 1381} {"train_loss": -22.475278854370117, "global_step": 114692, "epoch": 1381} {"train_loss": -22.496578216552734, "global_step": 114693, "epoch": 1381} {"train_loss": -22.447343826293945, "global_step": 114694, "epoch": 1381} {"train_loss": -22.280166625976562, "global_step": 114695, "epoch": 1381} {"train_loss": -22.707691192626953, "global_step": 114696, "epoch": 1381} {"train_loss": -22.037885665893555, "global_step": 114697, "epoch": 1381} {"train_loss": -22.620765686035156, "global_step": 114698, "epoch": 1381} {"train_loss": -22.114999771118164, "global_step": 114699, "epoch": 1381} {"train_loss": -22.5048885345459, "global_step": 114700, "epoch": 1381} {"train_loss": -22.15724754333496, "global_step": 114701, "epoch": 1381} {"train_loss": -22.148136138916016, "global_step": 114702, "epoch": 1381} {"train_loss": -22.186017990112305, "global_step": 114703, "epoch": 1381} {"train_loss": -22.547170639038086, "global_step": 114704, "epoch": 1381} {"train_loss": -22.361579090715892, "global_step": 114705, "epoch": 1381, "val_loss": 6214625.0} {"train_loss": -22.088306427001953, "global_step": 114706, "epoch": 1382} {"train_loss": -21.944812774658203, "global_step": 114707, "epoch": 1382} {"train_loss": -22.200658798217773, "global_step": 114708, "epoch": 1382} {"train_loss": -22.136051177978516, "global_step": 114709, "epoch": 1382} {"train_loss": -22.494665145874023, "global_step": 114710, "epoch": 1382} {"train_loss": -22.10647964477539, "global_step": 114711, "epoch": 1382} {"train_loss": -22.037500381469727, "global_step": 114712, "epoch": 1382} {"train_loss": -22.206541061401367, "global_step": 114713, "epoch": 1382} {"train_loss": -21.97361183166504, "global_step": 114714, "epoch": 1382} {"train_loss": -22.412668228149414, "global_step": 114715, "epoch": 1382} {"train_loss": -22.926294326782227, "global_step": 114716, "epoch": 1382} {"train_loss": -22.40900993347168, "global_step": 114717, "epoch": 1382} {"train_loss": -22.49216651916504, "global_step": 114718, "epoch": 1382} {"train_loss": -22.060564041137695, "global_step": 114719, "epoch": 1382} {"train_loss": -22.223852157592773, "global_step": 114720, "epoch": 1382} {"train_loss": -22.001352310180664, "global_step": 114721, "epoch": 1382} {"train_loss": -22.174604415893555, "global_step": 114722, "epoch": 1382} {"train_loss": -21.93994903564453, "global_step": 114723, "epoch": 1382} {"train_loss": -22.6856746673584, "global_step": 114724, "epoch": 1382} {"train_loss": -22.585193634033203, "global_step": 114725, "epoch": 1382} {"train_loss": -22.258777618408203, "global_step": 114726, "epoch": 1382} {"train_loss": -22.547866821289062, "global_step": 114727, "epoch": 1382} {"train_loss": -22.45465087890625, "global_step": 114728, "epoch": 1382} {"train_loss": -22.44563102722168, "global_step": 114729, "epoch": 1382} {"train_loss": -22.42140769958496, "global_step": 114730, "epoch": 1382} {"train_loss": -22.120304107666016, "global_step": 114731, "epoch": 1382} {"train_loss": -22.160573959350586, "global_step": 114732, "epoch": 1382} {"train_loss": -22.572704315185547, "global_step": 114733, "epoch": 1382} {"train_loss": -22.500497817993164, "global_step": 114734, "epoch": 1382} {"train_loss": -22.377517700195312, "global_step": 114735, "epoch": 1382} {"train_loss": -22.17868423461914, "global_step": 114736, "epoch": 1382} {"train_loss": -22.36507225036621, "global_step": 114737, "epoch": 1382} {"train_loss": -22.29678726196289, "global_step": 114738, "epoch": 1382} {"train_loss": -22.230716705322266, "global_step": 114739, "epoch": 1382} {"train_loss": -22.557907104492188, "global_step": 114740, "epoch": 1382} {"train_loss": -22.08979034423828, "global_step": 114741, "epoch": 1382} {"train_loss": -22.29254722595215, "global_step": 114742, "epoch": 1382} {"train_loss": -22.373823165893555, "global_step": 114743, "epoch": 1382} {"train_loss": -22.52260971069336, "global_step": 114744, "epoch": 1382} {"train_loss": -22.40974235534668, "global_step": 114745, "epoch": 1382} {"train_loss": -22.472087860107422, "global_step": 114746, "epoch": 1382} {"train_loss": -22.495845794677734, "global_step": 114747, "epoch": 1382} {"train_loss": -22.616626739501953, "global_step": 114748, "epoch": 1382} {"train_loss": -22.36334800720215, "global_step": 114749, "epoch": 1382} {"train_loss": -22.577367782592773, "global_step": 114750, "epoch": 1382} {"train_loss": -22.549304962158203, "global_step": 114751, "epoch": 1382} {"train_loss": -22.542226791381836, "global_step": 114752, "epoch": 1382} {"train_loss": -22.110509872436523, "global_step": 114753, "epoch": 1382} {"train_loss": -22.950002670288086, "global_step": 114754, "epoch": 1382} {"train_loss": -22.61700439453125, "global_step": 114755, "epoch": 1382} {"train_loss": -22.53510284423828, "global_step": 114756, "epoch": 1382} {"train_loss": -22.832632064819336, "global_step": 114757, "epoch": 1382} {"train_loss": -22.56026840209961, "global_step": 114758, "epoch": 1382} {"train_loss": -22.52272605895996, "global_step": 114759, "epoch": 1382} {"train_loss": -22.71047019958496, "global_step": 114760, "epoch": 1382} {"train_loss": -22.570363998413086, "global_step": 114761, "epoch": 1382} {"train_loss": -22.44031524658203, "global_step": 114762, "epoch": 1382} {"train_loss": -22.382658004760742, "global_step": 114763, "epoch": 1382} {"train_loss": -22.65301513671875, "global_step": 114764, "epoch": 1382} {"train_loss": -22.414274215698242, "global_step": 114765, "epoch": 1382} {"train_loss": -22.33610725402832, "global_step": 114766, "epoch": 1382} {"train_loss": -22.44241714477539, "global_step": 114767, "epoch": 1382} {"train_loss": -22.151416778564453, "global_step": 114768, "epoch": 1382} {"train_loss": -22.66506004333496, "global_step": 114769, "epoch": 1382} {"train_loss": -22.31330680847168, "global_step": 114770, "epoch": 1382} {"train_loss": -22.2404727935791, "global_step": 114771, "epoch": 1382} {"train_loss": -22.528532028198242, "global_step": 114772, "epoch": 1382} {"train_loss": -22.084081649780273, "global_step": 114773, "epoch": 1382} {"train_loss": -22.484149932861328, "global_step": 114774, "epoch": 1382} {"train_loss": -22.39263916015625, "global_step": 114775, "epoch": 1382} {"train_loss": -22.533109664916992, "global_step": 114776, "epoch": 1382} {"train_loss": -22.209810256958008, "global_step": 114777, "epoch": 1382} {"train_loss": -22.193429946899414, "global_step": 114778, "epoch": 1382} {"train_loss": -22.133573532104492, "global_step": 114779, "epoch": 1382} {"train_loss": -22.16253089904785, "global_step": 114780, "epoch": 1382} {"train_loss": -22.727691650390625, "global_step": 114781, "epoch": 1382} {"train_loss": -22.473474502563477, "global_step": 114782, "epoch": 1382} {"train_loss": -22.179197311401367, "global_step": 114783, "epoch": 1382} {"train_loss": -22.272628784179688, "global_step": 114784, "epoch": 1382} {"train_loss": -22.3040714263916, "global_step": 114785, "epoch": 1382} {"train_loss": -22.48862075805664, "global_step": 114786, "epoch": 1382} {"train_loss": -22.112567901611328, "global_step": 114787, "epoch": 1382} {"train_loss": -22.36679853875953, "global_step": 114788, "epoch": 1382, "val_loss": 6081097.0} {"train_loss": -22.18097496032715, "global_step": 114789, "epoch": 1383} {"train_loss": -22.10983657836914, "global_step": 114790, "epoch": 1383} {"train_loss": -21.878589630126953, "global_step": 114791, "epoch": 1383} {"train_loss": -22.304325103759766, "global_step": 114792, "epoch": 1383} {"train_loss": -22.202903747558594, "global_step": 114793, "epoch": 1383} {"train_loss": -22.15811538696289, "global_step": 114794, "epoch": 1383} {"train_loss": -22.235143661499023, "global_step": 114795, "epoch": 1383} {"train_loss": -22.4450626373291, "global_step": 114796, "epoch": 1383} {"train_loss": -22.554166793823242, "global_step": 114797, "epoch": 1383} {"train_loss": -22.447973251342773, "global_step": 114798, "epoch": 1383} {"train_loss": -22.68068504333496, "global_step": 114799, "epoch": 1383} {"train_loss": -22.45410919189453, "global_step": 114800, "epoch": 1383} {"train_loss": -22.649106979370117, "global_step": 114801, "epoch": 1383} {"train_loss": -22.2349910736084, "global_step": 114802, "epoch": 1383} {"train_loss": -22.314722061157227, "global_step": 114803, "epoch": 1383} {"train_loss": -22.193845748901367, "global_step": 114804, "epoch": 1383} {"train_loss": -22.63222885131836, "global_step": 114805, "epoch": 1383} {"train_loss": -22.51405906677246, "global_step": 114806, "epoch": 1383} {"train_loss": -22.203664779663086, "global_step": 114807, "epoch": 1383} {"train_loss": -22.337228775024414, "global_step": 114808, "epoch": 1383} {"train_loss": -22.369375228881836, "global_step": 114809, "epoch": 1383} {"train_loss": -22.418609619140625, "global_step": 114810, "epoch": 1383} {"train_loss": -22.49350357055664, "global_step": 114811, "epoch": 1383} {"train_loss": -22.386686325073242, "global_step": 114812, "epoch": 1383} {"train_loss": -22.524105072021484, "global_step": 114813, "epoch": 1383} {"train_loss": -22.87192726135254, "global_step": 114814, "epoch": 1383} {"train_loss": -22.62442398071289, "global_step": 114815, "epoch": 1383} {"train_loss": -22.245149612426758, "global_step": 114816, "epoch": 1383} {"train_loss": -22.281827926635742, "global_step": 114817, "epoch": 1383} {"train_loss": -22.110502243041992, "global_step": 114818, "epoch": 1383} {"train_loss": -22.19684410095215, "global_step": 114819, "epoch": 1383} {"train_loss": -22.606046676635742, "global_step": 114820, "epoch": 1383} {"train_loss": -22.057104110717773, "global_step": 114821, "epoch": 1383} {"train_loss": -22.523757934570312, "global_step": 114822, "epoch": 1383} {"train_loss": -22.6951961517334, "global_step": 114823, "epoch": 1383} {"train_loss": -22.218521118164062, "global_step": 114824, "epoch": 1383} {"train_loss": -22.43189811706543, "global_step": 114825, "epoch": 1383} {"train_loss": -22.535242080688477, "global_step": 114826, "epoch": 1383} {"train_loss": -22.690954208374023, "global_step": 114827, "epoch": 1383} {"train_loss": -22.498188018798828, "global_step": 114828, "epoch": 1383} {"train_loss": -22.211353302001953, "global_step": 114829, "epoch": 1383} {"train_loss": -22.4943904876709, "global_step": 114830, "epoch": 1383} {"train_loss": -22.05702018737793, "global_step": 114831, "epoch": 1383} {"train_loss": -22.760547637939453, "global_step": 114832, "epoch": 1383} {"train_loss": -22.22820472717285, "global_step": 114833, "epoch": 1383} {"train_loss": -22.318510055541992, "global_step": 114834, "epoch": 1383} {"train_loss": -22.35235023498535, "global_step": 114835, "epoch": 1383} {"train_loss": -22.14824104309082, "global_step": 114836, "epoch": 1383} {"train_loss": -22.574848175048828, "global_step": 114837, "epoch": 1383} {"train_loss": -22.460357666015625, "global_step": 114838, "epoch": 1383} {"train_loss": -22.369733810424805, "global_step": 114839, "epoch": 1383} {"train_loss": -22.09795570373535, "global_step": 114840, "epoch": 1383} {"train_loss": -22.225971221923828, "global_step": 114841, "epoch": 1383} {"train_loss": -21.857925415039062, "global_step": 114842, "epoch": 1383} {"train_loss": -22.25241470336914, "global_step": 114843, "epoch": 1383} {"train_loss": -22.296964645385742, "global_step": 114844, "epoch": 1383} {"train_loss": -22.280109405517578, "global_step": 114845, "epoch": 1383} {"train_loss": -22.322153091430664, "global_step": 114846, "epoch": 1383} {"train_loss": -22.471975326538086, "global_step": 114847, "epoch": 1383} {"train_loss": -22.30816650390625, "global_step": 114848, "epoch": 1383} {"train_loss": -22.495588302612305, "global_step": 114849, "epoch": 1383} {"train_loss": -22.14391326904297, "global_step": 114850, "epoch": 1383} {"train_loss": -22.36342430114746, "global_step": 114851, "epoch": 1383} {"train_loss": -22.045217514038086, "global_step": 114852, "epoch": 1383} {"train_loss": -22.355070114135742, "global_step": 114853, "epoch": 1383} {"train_loss": -22.30142593383789, "global_step": 114854, "epoch": 1383} {"train_loss": -22.44576072692871, "global_step": 114855, "epoch": 1383} {"train_loss": -22.60206413269043, "global_step": 114856, "epoch": 1383} {"train_loss": -21.943498611450195, "global_step": 114857, "epoch": 1383} {"train_loss": -22.415416717529297, "global_step": 114858, "epoch": 1383} {"train_loss": -22.478851318359375, "global_step": 114859, "epoch": 1383} {"train_loss": -22.69840431213379, "global_step": 114860, "epoch": 1383} {"train_loss": -22.482009887695312, "global_step": 114861, "epoch": 1383} {"train_loss": -22.886648178100586, "global_step": 114862, "epoch": 1383} {"train_loss": -22.55727195739746, "global_step": 114863, "epoch": 1383} {"train_loss": -22.588529586791992, "global_step": 114864, "epoch": 1383} {"train_loss": -22.60138702392578, "global_step": 114865, "epoch": 1383} {"train_loss": -22.55154037475586, "global_step": 114866, "epoch": 1383} {"train_loss": -22.571096420288086, "global_step": 114867, "epoch": 1383} {"train_loss": -22.106691360473633, "global_step": 114868, "epoch": 1383} {"train_loss": -22.08995819091797, "global_step": 114869, "epoch": 1383} {"train_loss": -22.24846649169922, "global_step": 114870, "epoch": 1383} {"train_loss": -22.365773051618092, "global_step": 114871, "epoch": 1383, "val_loss": 6141774.0} {"train_loss": -22.26357650756836, "global_step": 114872, "epoch": 1384} {"train_loss": -21.999399185180664, "global_step": 114873, "epoch": 1384} {"train_loss": -22.36629295349121, "global_step": 114874, "epoch": 1384} {"train_loss": -22.387060165405273, "global_step": 114875, "epoch": 1384} {"train_loss": -22.215091705322266, "global_step": 114876, "epoch": 1384} {"train_loss": -22.51396369934082, "global_step": 114877, "epoch": 1384} {"train_loss": -22.71454429626465, "global_step": 114878, "epoch": 1384} {"train_loss": -22.255603790283203, "global_step": 114879, "epoch": 1384} {"train_loss": -22.118694305419922, "global_step": 114880, "epoch": 1384} {"train_loss": -22.561233520507812, "global_step": 114881, "epoch": 1384} {"train_loss": -21.944772720336914, "global_step": 114882, "epoch": 1384} {"train_loss": -22.29349136352539, "global_step": 114883, "epoch": 1384} {"train_loss": -22.066953659057617, "global_step": 114884, "epoch": 1384} {"train_loss": -22.069677352905273, "global_step": 114885, "epoch": 1384} {"train_loss": -22.254194259643555, "global_step": 114886, "epoch": 1384} {"train_loss": -22.29058265686035, "global_step": 114887, "epoch": 1384} {"train_loss": -22.20230484008789, "global_step": 114888, "epoch": 1384} {"train_loss": -21.935068130493164, "global_step": 114889, "epoch": 1384} {"train_loss": -22.138654708862305, "global_step": 114890, "epoch": 1384} {"train_loss": -22.076383590698242, "global_step": 114891, "epoch": 1384} {"train_loss": -22.01004981994629, "global_step": 114892, "epoch": 1384} {"train_loss": -22.411327362060547, "global_step": 114893, "epoch": 1384} {"train_loss": -22.315078735351562, "global_step": 114894, "epoch": 1384} {"train_loss": -22.62209701538086, "global_step": 114895, "epoch": 1384} {"train_loss": -22.314117431640625, "global_step": 114896, "epoch": 1384} {"train_loss": -22.666181564331055, "global_step": 114897, "epoch": 1384} {"train_loss": -22.108278274536133, "global_step": 114898, "epoch": 1384} {"train_loss": -22.555831909179688, "global_step": 114899, "epoch": 1384} {"train_loss": -22.475431442260742, "global_step": 114900, "epoch": 1384} {"train_loss": -22.398744583129883, "global_step": 114901, "epoch": 1384} {"train_loss": -22.4539737701416, "global_step": 114902, "epoch": 1384} {"train_loss": -22.585966110229492, "global_step": 114903, "epoch": 1384} {"train_loss": -22.185285568237305, "global_step": 114904, "epoch": 1384} {"train_loss": -22.32098388671875, "global_step": 114905, "epoch": 1384} {"train_loss": -22.577722549438477, "global_step": 114906, "epoch": 1384} {"train_loss": -22.339597702026367, "global_step": 114907, "epoch": 1384} {"train_loss": -22.334829330444336, "global_step": 114908, "epoch": 1384} {"train_loss": -22.50440788269043, "global_step": 114909, "epoch": 1384} {"train_loss": -22.352872848510742, "global_step": 114910, "epoch": 1384} {"train_loss": -22.31702995300293, "global_step": 114911, "epoch": 1384} {"train_loss": -22.343793869018555, "global_step": 114912, "epoch": 1384} {"train_loss": -22.334842681884766, "global_step": 114913, "epoch": 1384} {"train_loss": -22.28780174255371, "global_step": 114914, "epoch": 1384} {"train_loss": -22.078994750976562, "global_step": 114915, "epoch": 1384} {"train_loss": -22.558652877807617, "global_step": 114916, "epoch": 1384} {"train_loss": -22.3126163482666, "global_step": 114917, "epoch": 1384} {"train_loss": -22.318592071533203, "global_step": 114918, "epoch": 1384} {"train_loss": -22.2574405670166, "global_step": 114919, "epoch": 1384} {"train_loss": -22.049951553344727, "global_step": 114920, "epoch": 1384} {"train_loss": -22.4216365814209, "global_step": 114921, "epoch": 1384} {"train_loss": -22.55787467956543, "global_step": 114922, "epoch": 1384} {"train_loss": -22.31331443786621, "global_step": 114923, "epoch": 1384} {"train_loss": -22.399417877197266, "global_step": 114924, "epoch": 1384} {"train_loss": -22.44599723815918, "global_step": 114925, "epoch": 1384} {"train_loss": -22.329870223999023, "global_step": 114926, "epoch": 1384} {"train_loss": -22.406431198120117, "global_step": 114927, "epoch": 1384} {"train_loss": -22.327299118041992, "global_step": 114928, "epoch": 1384} {"train_loss": -22.51979637145996, "global_step": 114929, "epoch": 1384} {"train_loss": -22.17256736755371, "global_step": 114930, "epoch": 1384} {"train_loss": -22.494657516479492, "global_step": 114931, "epoch": 1384} {"train_loss": -22.177915573120117, "global_step": 114932, "epoch": 1384} {"train_loss": -22.612211227416992, "global_step": 114933, "epoch": 1384} {"train_loss": -22.56340980529785, "global_step": 114934, "epoch": 1384} {"train_loss": -22.29033851623535, "global_step": 114935, "epoch": 1384} {"train_loss": -22.166303634643555, "global_step": 114936, "epoch": 1384} {"train_loss": -22.62568473815918, "global_step": 114937, "epoch": 1384} {"train_loss": -22.48321533203125, "global_step": 114938, "epoch": 1384} {"train_loss": -21.849210739135742, "global_step": 114939, "epoch": 1384} {"train_loss": -22.168628692626953, "global_step": 114940, "epoch": 1384} {"train_loss": -22.519859313964844, "global_step": 114941, "epoch": 1384} {"train_loss": -22.129728317260742, "global_step": 114942, "epoch": 1384} {"train_loss": -22.03060531616211, "global_step": 114943, "epoch": 1384} {"train_loss": -22.45947265625, "global_step": 114944, "epoch": 1384} {"train_loss": -22.559972763061523, "global_step": 114945, "epoch": 1384} {"train_loss": -22.50982666015625, "global_step": 114946, "epoch": 1384} {"train_loss": -22.397489547729492, "global_step": 114947, "epoch": 1384} {"train_loss": -21.91535186767578, "global_step": 114948, "epoch": 1384} {"train_loss": -22.554183959960938, "global_step": 114949, "epoch": 1384} {"train_loss": -22.482009887695312, "global_step": 114950, "epoch": 1384} {"train_loss": -22.218273162841797, "global_step": 114951, "epoch": 1384} {"train_loss": -22.81971549987793, "global_step": 114952, "epoch": 1384} {"train_loss": -22.347461700439453, "global_step": 114953, "epoch": 1384} {"train_loss": -22.30900684034968, "global_step": 114954, "epoch": 1384, "val_loss": 6205506.0} {"train_loss": -22.55327033996582, "global_step": 114955, "epoch": 1385} {"train_loss": -21.564504623413086, "global_step": 114956, "epoch": 1385} {"train_loss": -21.85287857055664, "global_step": 114957, "epoch": 1385} {"train_loss": -22.048908233642578, "global_step": 114958, "epoch": 1385} {"train_loss": -21.641468048095703, "global_step": 114959, "epoch": 1385} {"train_loss": -22.029226303100586, "global_step": 114960, "epoch": 1385} {"train_loss": -21.83938980102539, "global_step": 114961, "epoch": 1385} {"train_loss": -22.27703857421875, "global_step": 114962, "epoch": 1385} {"train_loss": -22.380117416381836, "global_step": 114963, "epoch": 1385} {"train_loss": -21.938589096069336, "global_step": 114964, "epoch": 1385} {"train_loss": -22.28216552734375, "global_step": 114965, "epoch": 1385} {"train_loss": -22.314950942993164, "global_step": 114966, "epoch": 1385} {"train_loss": -21.876495361328125, "global_step": 114967, "epoch": 1385} {"train_loss": -21.887516021728516, "global_step": 114968, "epoch": 1385} {"train_loss": -22.22408103942871, "global_step": 114969, "epoch": 1385} {"train_loss": -22.14069175720215, "global_step": 114970, "epoch": 1385} {"train_loss": -22.47029685974121, "global_step": 114971, "epoch": 1385} {"train_loss": -22.506650924682617, "global_step": 114972, "epoch": 1385} {"train_loss": -22.169363021850586, "global_step": 114973, "epoch": 1385} {"train_loss": -22.399988174438477, "global_step": 114974, "epoch": 1385} {"train_loss": -22.228347778320312, "global_step": 114975, "epoch": 1385} {"train_loss": -22.103696823120117, "global_step": 114976, "epoch": 1385} {"train_loss": -22.26784896850586, "global_step": 114977, "epoch": 1385} {"train_loss": -22.612276077270508, "global_step": 114978, "epoch": 1385} {"train_loss": -22.391632080078125, "global_step": 114979, "epoch": 1385} {"train_loss": -22.250150680541992, "global_step": 114980, "epoch": 1385} {"train_loss": -22.556379318237305, "global_step": 114981, "epoch": 1385} {"train_loss": -22.572214126586914, "global_step": 114982, "epoch": 1385} {"train_loss": -22.216760635375977, "global_step": 114983, "epoch": 1385} {"train_loss": -22.22882080078125, "global_step": 114984, "epoch": 1385} {"train_loss": -22.26021385192871, "global_step": 114985, "epoch": 1385} {"train_loss": -22.303565979003906, "global_step": 114986, "epoch": 1385} {"train_loss": -22.619123458862305, "global_step": 114987, "epoch": 1385} {"train_loss": -22.797033309936523, "global_step": 114988, "epoch": 1385} {"train_loss": -22.268428802490234, "global_step": 114989, "epoch": 1385} {"train_loss": -22.533721923828125, "global_step": 114990, "epoch": 1385} {"train_loss": -21.96856117248535, "global_step": 114991, "epoch": 1385} {"train_loss": -22.097518920898438, "global_step": 114992, "epoch": 1385} {"train_loss": -22.27784538269043, "global_step": 114993, "epoch": 1385} {"train_loss": -22.41455078125, "global_step": 114994, "epoch": 1385} {"train_loss": -22.508209228515625, "global_step": 114995, "epoch": 1385} {"train_loss": -22.494983673095703, "global_step": 114996, "epoch": 1385} {"train_loss": -22.724876403808594, "global_step": 114997, "epoch": 1385} {"train_loss": -22.187593460083008, "global_step": 114998, "epoch": 1385} {"train_loss": -22.814258575439453, "global_step": 114999, "epoch": 1385} {"train_loss": -22.46882438659668, "global_step": 115000, "epoch": 1385} {"train_loss": -22.787870407104492, "global_step": 115001, "epoch": 1385} {"train_loss": -22.15702247619629, "global_step": 115002, "epoch": 1385} {"train_loss": -22.429447174072266, "global_step": 115003, "epoch": 1385} {"train_loss": -22.507389068603516, "global_step": 115004, "epoch": 1385} {"train_loss": -22.26942253112793, "global_step": 115005, "epoch": 1385} {"train_loss": -22.398466110229492, "global_step": 115006, "epoch": 1385} {"train_loss": -22.557891845703125, "global_step": 115007, "epoch": 1385} {"train_loss": -22.591354370117188, "global_step": 115008, "epoch": 1385} {"train_loss": -22.179563522338867, "global_step": 115009, "epoch": 1385} {"train_loss": -22.258777618408203, "global_step": 115010, "epoch": 1385} {"train_loss": -22.17481803894043, "global_step": 115011, "epoch": 1385} {"train_loss": -22.14517593383789, "global_step": 115012, "epoch": 1385} {"train_loss": -22.392568588256836, "global_step": 115013, "epoch": 1385} {"train_loss": -22.4418888092041, "global_step": 115014, "epoch": 1385} {"train_loss": -22.374841690063477, "global_step": 115015, "epoch": 1385} {"train_loss": -22.269180297851562, "global_step": 115016, "epoch": 1385} {"train_loss": -22.500669479370117, "global_step": 115017, "epoch": 1385} {"train_loss": -22.247331619262695, "global_step": 115018, "epoch": 1385} {"train_loss": -22.419240951538086, "global_step": 115019, "epoch": 1385} {"train_loss": -22.51975440979004, "global_step": 115020, "epoch": 1385} {"train_loss": -22.767759323120117, "global_step": 115021, "epoch": 1385} {"train_loss": -22.647418975830078, "global_step": 115022, "epoch": 1385} {"train_loss": -22.581968307495117, "global_step": 115023, "epoch": 1385} {"train_loss": -22.079147338867188, "global_step": 115024, "epoch": 1385} {"train_loss": -22.1280460357666, "global_step": 115025, "epoch": 1385} {"train_loss": -22.206945419311523, "global_step": 115026, "epoch": 1385} {"train_loss": -22.242338180541992, "global_step": 115027, "epoch": 1385} {"train_loss": -22.354843139648438, "global_step": 115028, "epoch": 1385} {"train_loss": -22.63011932373047, "global_step": 115029, "epoch": 1385} {"train_loss": -22.293018341064453, "global_step": 115030, "epoch": 1385} {"train_loss": -22.24787712097168, "global_step": 115031, "epoch": 1385} {"train_loss": -22.464262008666992, "global_step": 115032, "epoch": 1385} {"train_loss": -22.921594619750977, "global_step": 115033, "epoch": 1385} {"train_loss": -22.633182525634766, "global_step": 115034, "epoch": 1385} {"train_loss": -22.295331954956055, "global_step": 115035, "epoch": 1385} {"train_loss": -22.23834800720215, "global_step": 115036, "epoch": 1385} {"train_loss": -22.31616256897708, "global_step": 115037, "epoch": 1385, "val_loss": 6181179.5} {"train_loss": -21.89279556274414, "global_step": 115038, "epoch": 1386} {"train_loss": -21.95747947692871, "global_step": 115039, "epoch": 1386} {"train_loss": -22.15028953552246, "global_step": 115040, "epoch": 1386} {"train_loss": -22.15985107421875, "global_step": 115041, "epoch": 1386} {"train_loss": -22.204742431640625, "global_step": 115042, "epoch": 1386} {"train_loss": -21.740291595458984, "global_step": 115043, "epoch": 1386} {"train_loss": -22.36932373046875, "global_step": 115044, "epoch": 1386} {"train_loss": -21.97981071472168, "global_step": 115045, "epoch": 1386} {"train_loss": -22.32294464111328, "global_step": 115046, "epoch": 1386} {"train_loss": -22.179397583007812, "global_step": 115047, "epoch": 1386} {"train_loss": -21.88454246520996, "global_step": 115048, "epoch": 1386} {"train_loss": -22.300701141357422, "global_step": 115049, "epoch": 1386} {"train_loss": -22.61726188659668, "global_step": 115050, "epoch": 1386} {"train_loss": -21.946924209594727, "global_step": 115051, "epoch": 1386} {"train_loss": -22.226327896118164, "global_step": 115052, "epoch": 1386} {"train_loss": -22.340627670288086, "global_step": 115053, "epoch": 1386} {"train_loss": -22.45406150817871, "global_step": 115054, "epoch": 1386} {"train_loss": -21.965330123901367, "global_step": 115055, "epoch": 1386} {"train_loss": -22.310546875, "global_step": 115056, "epoch": 1386} {"train_loss": -22.552248001098633, "global_step": 115057, "epoch": 1386} {"train_loss": -22.32497215270996, "global_step": 115058, "epoch": 1386} {"train_loss": -22.43502426147461, "global_step": 115059, "epoch": 1386} {"train_loss": -22.78691864013672, "global_step": 115060, "epoch": 1386} {"train_loss": -22.27927589416504, "global_step": 115061, "epoch": 1386} {"train_loss": -22.247602462768555, "global_step": 115062, "epoch": 1386} {"train_loss": -22.032657623291016, "global_step": 115063, "epoch": 1386} {"train_loss": -22.160011291503906, "global_step": 115064, "epoch": 1386} {"train_loss": -22.233768463134766, "global_step": 115065, "epoch": 1386} {"train_loss": -22.266780853271484, "global_step": 115066, "epoch": 1386} {"train_loss": -22.492603302001953, "global_step": 115067, "epoch": 1386} {"train_loss": -22.807615280151367, "global_step": 115068, "epoch": 1386} {"train_loss": -22.246091842651367, "global_step": 115069, "epoch": 1386} {"train_loss": -22.653156280517578, "global_step": 115070, "epoch": 1386} {"train_loss": -22.615278244018555, "global_step": 115071, "epoch": 1386} {"train_loss": -22.773847579956055, "global_step": 115072, "epoch": 1386} {"train_loss": -22.48879051208496, "global_step": 115073, "epoch": 1386} {"train_loss": -22.502824783325195, "global_step": 115074, "epoch": 1386} {"train_loss": -22.279508590698242, "global_step": 115075, "epoch": 1386} {"train_loss": -22.756330490112305, "global_step": 115076, "epoch": 1386} {"train_loss": -22.54608726501465, "global_step": 115077, "epoch": 1386} {"train_loss": -22.116825103759766, "global_step": 115078, "epoch": 1386} {"train_loss": -22.56136703491211, "global_step": 115079, "epoch": 1386} {"train_loss": -22.54417610168457, "global_step": 115080, "epoch": 1386} {"train_loss": -21.95550537109375, "global_step": 115081, "epoch": 1386} {"train_loss": -22.247861862182617, "global_step": 115082, "epoch": 1386} {"train_loss": -22.054304122924805, "global_step": 115083, "epoch": 1386} {"train_loss": -21.636091232299805, "global_step": 115084, "epoch": 1386} {"train_loss": -22.131362915039062, "global_step": 115085, "epoch": 1386} {"train_loss": -22.306116104125977, "global_step": 115086, "epoch": 1386} {"train_loss": -22.11832046508789, "global_step": 115087, "epoch": 1386} {"train_loss": -22.16207504272461, "global_step": 115088, "epoch": 1386} {"train_loss": -22.695966720581055, "global_step": 115089, "epoch": 1386} {"train_loss": -21.845844268798828, "global_step": 115090, "epoch": 1386} {"train_loss": -22.213300704956055, "global_step": 115091, "epoch": 1386} {"train_loss": -22.03419303894043, "global_step": 115092, "epoch": 1386} {"train_loss": -22.430007934570312, "global_step": 115093, "epoch": 1386} {"train_loss": -22.197982788085938, "global_step": 115094, "epoch": 1386} {"train_loss": -22.263858795166016, "global_step": 115095, "epoch": 1386} {"train_loss": -22.17911720275879, "global_step": 115096, "epoch": 1386} {"train_loss": -21.897703170776367, "global_step": 115097, "epoch": 1386} {"train_loss": -22.424091339111328, "global_step": 115098, "epoch": 1386} {"train_loss": -22.183095932006836, "global_step": 115099, "epoch": 1386} {"train_loss": -22.061248779296875, "global_step": 115100, "epoch": 1386} {"train_loss": -22.414167404174805, "global_step": 115101, "epoch": 1386} {"train_loss": -21.896574020385742, "global_step": 115102, "epoch": 1386} {"train_loss": -22.67285919189453, "global_step": 115103, "epoch": 1386} {"train_loss": -22.055179595947266, "global_step": 115104, "epoch": 1386} {"train_loss": -22.42828369140625, "global_step": 115105, "epoch": 1386} {"train_loss": -22.015361785888672, "global_step": 115106, "epoch": 1386} {"train_loss": -22.035568237304688, "global_step": 115107, "epoch": 1386} {"train_loss": -22.10282325744629, "global_step": 115108, "epoch": 1386} {"train_loss": -22.197118759155273, "global_step": 115109, "epoch": 1386} {"train_loss": -22.24399185180664, "global_step": 115110, "epoch": 1386} {"train_loss": -22.046873092651367, "global_step": 115111, "epoch": 1386} {"train_loss": -22.52511215209961, "global_step": 115112, "epoch": 1386} {"train_loss": -22.35793113708496, "global_step": 115113, "epoch": 1386} {"train_loss": -22.420137405395508, "global_step": 115114, "epoch": 1386} {"train_loss": -22.52003288269043, "global_step": 115115, "epoch": 1386} {"train_loss": -22.5364990234375, "global_step": 115116, "epoch": 1386} {"train_loss": -22.200307846069336, "global_step": 115117, "epoch": 1386} {"train_loss": -22.24098777770996, "global_step": 115118, "epoch": 1386} {"train_loss": -22.607696533203125, "global_step": 115119, "epoch": 1386} {"train_loss": -22.284550632338927, "global_step": 115120, "epoch": 1386, "val_loss": 6154012.5} {"train_loss": -22.358951568603516, "global_step": 115121, "epoch": 1387} {"train_loss": -22.084684371948242, "global_step": 115122, "epoch": 1387} {"train_loss": -22.209613800048828, "global_step": 115123, "epoch": 1387} {"train_loss": -22.00877571105957, "global_step": 115124, "epoch": 1387} {"train_loss": -22.461193084716797, "global_step": 115125, "epoch": 1387} {"train_loss": -22.412809371948242, "global_step": 115126, "epoch": 1387} {"train_loss": -22.238990783691406, "global_step": 115127, "epoch": 1387} {"train_loss": -22.41712188720703, "global_step": 115128, "epoch": 1387} {"train_loss": -22.363431930541992, "global_step": 115129, "epoch": 1387} {"train_loss": -22.27010154724121, "global_step": 115130, "epoch": 1387} {"train_loss": -22.605335235595703, "global_step": 115131, "epoch": 1387} {"train_loss": -22.749204635620117, "global_step": 115132, "epoch": 1387} {"train_loss": -22.56764030456543, "global_step": 115133, "epoch": 1387} {"train_loss": -22.743093490600586, "global_step": 115134, "epoch": 1387} {"train_loss": -22.68071937561035, "global_step": 115135, "epoch": 1387} {"train_loss": -22.3525333404541, "global_step": 115136, "epoch": 1387} {"train_loss": -22.460901260375977, "global_step": 115137, "epoch": 1387} {"train_loss": -22.38568878173828, "global_step": 115138, "epoch": 1387} {"train_loss": -22.264312744140625, "global_step": 115139, "epoch": 1387} {"train_loss": -22.210487365722656, "global_step": 115140, "epoch": 1387} {"train_loss": -22.541929244995117, "global_step": 115141, "epoch": 1387} {"train_loss": -22.60993003845215, "global_step": 115142, "epoch": 1387} {"train_loss": -22.604578018188477, "global_step": 115143, "epoch": 1387} {"train_loss": -22.31648826599121, "global_step": 115144, "epoch": 1387} {"train_loss": -22.472238540649414, "global_step": 115145, "epoch": 1387} {"train_loss": -22.432138442993164, "global_step": 115146, "epoch": 1387} {"train_loss": -22.465368270874023, "global_step": 115147, "epoch": 1387} {"train_loss": -22.57011604309082, "global_step": 115148, "epoch": 1387} {"train_loss": -22.109472274780273, "global_step": 115149, "epoch": 1387} {"train_loss": -22.520694732666016, "global_step": 115150, "epoch": 1387} {"train_loss": -22.686832427978516, "global_step": 115151, "epoch": 1387} {"train_loss": -22.26026725769043, "global_step": 115152, "epoch": 1387} {"train_loss": -22.067773818969727, "global_step": 115153, "epoch": 1387} {"train_loss": -22.234363555908203, "global_step": 115154, "epoch": 1387} {"train_loss": -22.368696212768555, "global_step": 115155, "epoch": 1387} {"train_loss": -22.342802047729492, "global_step": 115156, "epoch": 1387} {"train_loss": -22.599348068237305, "global_step": 115157, "epoch": 1387} {"train_loss": -22.51596450805664, "global_step": 115158, "epoch": 1387} {"train_loss": -22.422975540161133, "global_step": 115159, "epoch": 1387} {"train_loss": -22.179073333740234, "global_step": 115160, "epoch": 1387} {"train_loss": -22.210500717163086, "global_step": 115161, "epoch": 1387} {"train_loss": -22.596004486083984, "global_step": 115162, "epoch": 1387} {"train_loss": -22.80417251586914, "global_step": 115163, "epoch": 1387} {"train_loss": -22.848796844482422, "global_step": 115164, "epoch": 1387} {"train_loss": -22.604455947875977, "global_step": 115165, "epoch": 1387} {"train_loss": -22.472768783569336, "global_step": 115166, "epoch": 1387} {"train_loss": -22.522119522094727, "global_step": 115167, "epoch": 1387} {"train_loss": -22.519025802612305, "global_step": 115168, "epoch": 1387} {"train_loss": -22.32344627380371, "global_step": 115169, "epoch": 1387} {"train_loss": -22.143232345581055, "global_step": 115170, "epoch": 1387} {"train_loss": -22.641693115234375, "global_step": 115171, "epoch": 1387} {"train_loss": -22.3249454498291, "global_step": 115172, "epoch": 1387} {"train_loss": -22.270902633666992, "global_step": 115173, "epoch": 1387} {"train_loss": -21.994094848632812, "global_step": 115174, "epoch": 1387} {"train_loss": -22.167325973510742, "global_step": 115175, "epoch": 1387} {"train_loss": -22.497135162353516, "global_step": 115176, "epoch": 1387} {"train_loss": -22.36972427368164, "global_step": 115177, "epoch": 1387} {"train_loss": -22.495824813842773, "global_step": 115178, "epoch": 1387} {"train_loss": -22.325525283813477, "global_step": 115179, "epoch": 1387} {"train_loss": -22.24949073791504, "global_step": 115180, "epoch": 1387} {"train_loss": -22.36993980407715, "global_step": 115181, "epoch": 1387} {"train_loss": -22.39625358581543, "global_step": 115182, "epoch": 1387} {"train_loss": -22.46590232849121, "global_step": 115183, "epoch": 1387} {"train_loss": -22.541461944580078, "global_step": 115184, "epoch": 1387} {"train_loss": -22.140520095825195, "global_step": 115185, "epoch": 1387} {"train_loss": -22.49408721923828, "global_step": 115186, "epoch": 1387} {"train_loss": -22.104719161987305, "global_step": 115187, "epoch": 1387} {"train_loss": -21.98587417602539, "global_step": 115188, "epoch": 1387} {"train_loss": -22.570634841918945, "global_step": 115189, "epoch": 1387} {"train_loss": -22.51397705078125, "global_step": 115190, "epoch": 1387} {"train_loss": -22.324193954467773, "global_step": 115191, "epoch": 1387} {"train_loss": -22.19324493408203, "global_step": 115192, "epoch": 1387} {"train_loss": -22.256576538085938, "global_step": 115193, "epoch": 1387} {"train_loss": -22.488990783691406, "global_step": 115194, "epoch": 1387} {"train_loss": -22.428178787231445, "global_step": 115195, "epoch": 1387} {"train_loss": -22.43061065673828, "global_step": 115196, "epoch": 1387} {"train_loss": -22.545867919921875, "global_step": 115197, "epoch": 1387} {"train_loss": -22.53309440612793, "global_step": 115198, "epoch": 1387} {"train_loss": -22.42208480834961, "global_step": 115199, "epoch": 1387} {"train_loss": -22.457931518554688, "global_step": 115200, "epoch": 1387} {"train_loss": -22.615543365478516, "global_step": 115201, "epoch": 1387} {"train_loss": -22.343252182006836, "global_step": 115202, "epoch": 1387} {"train_loss": -22.416185447968633, "global_step": 115203, "epoch": 1387, "val_loss": 6147430.0} {"train_loss": -21.89444351196289, "global_step": 115204, "epoch": 1388} {"train_loss": -22.011350631713867, "global_step": 115205, "epoch": 1388} {"train_loss": -22.271596908569336, "global_step": 115206, "epoch": 1388} {"train_loss": -22.501094818115234, "global_step": 115207, "epoch": 1388} {"train_loss": -22.190032958984375, "global_step": 115208, "epoch": 1388} {"train_loss": -21.567096710205078, "global_step": 115209, "epoch": 1388} {"train_loss": -22.266536712646484, "global_step": 115210, "epoch": 1388} {"train_loss": -22.232807159423828, "global_step": 115211, "epoch": 1388} {"train_loss": -22.024749755859375, "global_step": 115212, "epoch": 1388} {"train_loss": -22.05489158630371, "global_step": 115213, "epoch": 1388} {"train_loss": -22.17525291442871, "global_step": 115214, "epoch": 1388} {"train_loss": -21.973764419555664, "global_step": 115215, "epoch": 1388} {"train_loss": -21.822460174560547, "global_step": 115216, "epoch": 1388} {"train_loss": -22.137327194213867, "global_step": 115217, "epoch": 1388} {"train_loss": -22.45098876953125, "global_step": 115218, "epoch": 1388} {"train_loss": -22.386280059814453, "global_step": 115219, "epoch": 1388} {"train_loss": -22.768720626831055, "global_step": 115220, "epoch": 1388} {"train_loss": -22.12248420715332, "global_step": 115221, "epoch": 1388} {"train_loss": -22.36794090270996, "global_step": 115222, "epoch": 1388} {"train_loss": -22.569517135620117, "global_step": 115223, "epoch": 1388} {"train_loss": -22.286802291870117, "global_step": 115224, "epoch": 1388} {"train_loss": -22.409439086914062, "global_step": 115225, "epoch": 1388} {"train_loss": -22.29921531677246, "global_step": 115226, "epoch": 1388} {"train_loss": -21.921585083007812, "global_step": 115227, "epoch": 1388} {"train_loss": -22.11474609375, "global_step": 115228, "epoch": 1388} {"train_loss": -21.869489669799805, "global_step": 115229, "epoch": 1388} {"train_loss": -21.8459529876709, "global_step": 115230, "epoch": 1388} {"train_loss": -22.187246322631836, "global_step": 115231, "epoch": 1388} {"train_loss": -22.557130813598633, "global_step": 115232, "epoch": 1388} {"train_loss": -22.22589683532715, "global_step": 115233, "epoch": 1388} {"train_loss": -22.344606399536133, "global_step": 115234, "epoch": 1388} {"train_loss": -22.3751220703125, "global_step": 115235, "epoch": 1388} {"train_loss": -22.407276153564453, "global_step": 115236, "epoch": 1388} {"train_loss": -22.331899642944336, "global_step": 115237, "epoch": 1388} {"train_loss": -22.075925827026367, "global_step": 115238, "epoch": 1388} {"train_loss": -22.432226181030273, "global_step": 115239, "epoch": 1388} {"train_loss": -22.2640438079834, "global_step": 115240, "epoch": 1388} {"train_loss": -22.50313377380371, "global_step": 115241, "epoch": 1388} {"train_loss": -22.122373580932617, "global_step": 115242, "epoch": 1388} {"train_loss": -22.39240074157715, "global_step": 115243, "epoch": 1388} {"train_loss": -22.369970321655273, "global_step": 115244, "epoch": 1388} {"train_loss": -22.176538467407227, "global_step": 115245, "epoch": 1388} {"train_loss": -22.39598274230957, "global_step": 115246, "epoch": 1388} {"train_loss": -22.384868621826172, "global_step": 115247, "epoch": 1388} {"train_loss": -22.681997299194336, "global_step": 115248, "epoch": 1388} {"train_loss": -22.335477828979492, "global_step": 115249, "epoch": 1388} {"train_loss": -22.173093795776367, "global_step": 115250, "epoch": 1388} {"train_loss": -22.34076690673828, "global_step": 115251, "epoch": 1388} {"train_loss": -22.745031356811523, "global_step": 115252, "epoch": 1388} {"train_loss": -22.533498764038086, "global_step": 115253, "epoch": 1388} {"train_loss": -22.45478630065918, "global_step": 115254, "epoch": 1388} {"train_loss": -22.586095809936523, "global_step": 115255, "epoch": 1388} {"train_loss": -22.675994873046875, "global_step": 115256, "epoch": 1388} {"train_loss": -22.128530502319336, "global_step": 115257, "epoch": 1388} {"train_loss": -22.450864791870117, "global_step": 115258, "epoch": 1388} {"train_loss": -22.39048957824707, "global_step": 115259, "epoch": 1388} {"train_loss": -22.530433654785156, "global_step": 115260, "epoch": 1388} {"train_loss": -22.38304328918457, "global_step": 115261, "epoch": 1388} {"train_loss": -22.404067993164062, "global_step": 115262, "epoch": 1388} {"train_loss": -22.478225708007812, "global_step": 115263, "epoch": 1388} {"train_loss": -22.61244773864746, "global_step": 115264, "epoch": 1388} {"train_loss": -22.812368392944336, "global_step": 115265, "epoch": 1388} {"train_loss": -22.537796020507812, "global_step": 115266, "epoch": 1388} {"train_loss": -22.471710205078125, "global_step": 115267, "epoch": 1388} {"train_loss": -22.304851531982422, "global_step": 115268, "epoch": 1388} {"train_loss": -22.340614318847656, "global_step": 115269, "epoch": 1388} {"train_loss": -22.302288055419922, "global_step": 115270, "epoch": 1388} {"train_loss": -22.034656524658203, "global_step": 115271, "epoch": 1388} {"train_loss": -22.467893600463867, "global_step": 115272, "epoch": 1388} {"train_loss": -22.515522003173828, "global_step": 115273, "epoch": 1388} {"train_loss": -22.607559204101562, "global_step": 115274, "epoch": 1388} {"train_loss": -22.750329971313477, "global_step": 115275, "epoch": 1388} {"train_loss": -22.027599334716797, "global_step": 115276, "epoch": 1388} {"train_loss": -22.279741287231445, "global_step": 115277, "epoch": 1388} {"train_loss": -21.97100257873535, "global_step": 115278, "epoch": 1388} {"train_loss": -22.395309448242188, "global_step": 115279, "epoch": 1388} {"train_loss": -22.603900909423828, "global_step": 115280, "epoch": 1388} {"train_loss": -22.289480209350586, "global_step": 115281, "epoch": 1388} {"train_loss": -22.479490280151367, "global_step": 115282, "epoch": 1388} {"train_loss": -22.02679443359375, "global_step": 115283, "epoch": 1388} {"train_loss": -22.51909828186035, "global_step": 115284, "epoch": 1388} {"train_loss": -22.274818420410156, "global_step": 115285, "epoch": 1388} {"train_loss": -22.33473187182323, "global_step": 115286, "epoch": 1388, "val_loss": 6203244.5} {"train_loss": -21.72090721130371, "global_step": 115287, "epoch": 1389} {"train_loss": -21.367788314819336, "global_step": 115288, "epoch": 1389} {"train_loss": -22.23505973815918, "global_step": 115289, "epoch": 1389} {"train_loss": -21.625503540039062, "global_step": 115290, "epoch": 1389} {"train_loss": -21.961761474609375, "global_step": 115291, "epoch": 1389} {"train_loss": -21.798633575439453, "global_step": 115292, "epoch": 1389} {"train_loss": -21.7968692779541, "global_step": 115293, "epoch": 1389} {"train_loss": -21.55508804321289, "global_step": 115294, "epoch": 1389} {"train_loss": -21.781341552734375, "global_step": 115295, "epoch": 1389} {"train_loss": -21.82634162902832, "global_step": 115296, "epoch": 1389} {"train_loss": -21.82263946533203, "global_step": 115297, "epoch": 1389} {"train_loss": -21.985986709594727, "global_step": 115298, "epoch": 1389} {"train_loss": -22.50126075744629, "global_step": 115299, "epoch": 1389} {"train_loss": -21.966962814331055, "global_step": 115300, "epoch": 1389} {"train_loss": -21.88839340209961, "global_step": 115301, "epoch": 1389} {"train_loss": -21.861879348754883, "global_step": 115302, "epoch": 1389} {"train_loss": -22.235599517822266, "global_step": 115303, "epoch": 1389} {"train_loss": -22.086063385009766, "global_step": 115304, "epoch": 1389} {"train_loss": -22.195907592773438, "global_step": 115305, "epoch": 1389} {"train_loss": -21.95458984375, "global_step": 115306, "epoch": 1389} {"train_loss": -22.053531646728516, "global_step": 115307, "epoch": 1389} {"train_loss": -22.066036224365234, "global_step": 115308, "epoch": 1389} {"train_loss": -22.280380249023438, "global_step": 115309, "epoch": 1389} {"train_loss": -22.207763671875, "global_step": 115310, "epoch": 1389} {"train_loss": -22.33064079284668, "global_step": 115311, "epoch": 1389} {"train_loss": -21.81621742248535, "global_step": 115312, "epoch": 1389} {"train_loss": -22.33233642578125, "global_step": 115313, "epoch": 1389} {"train_loss": -22.472251892089844, "global_step": 115314, "epoch": 1389} {"train_loss": -22.520557403564453, "global_step": 115315, "epoch": 1389} {"train_loss": -22.172378540039062, "global_step": 115316, "epoch": 1389} {"train_loss": -22.667499542236328, "global_step": 115317, "epoch": 1389} {"train_loss": -22.036130905151367, "global_step": 115318, "epoch": 1389} {"train_loss": -21.957761764526367, "global_step": 115319, "epoch": 1389} {"train_loss": -22.005949020385742, "global_step": 115320, "epoch": 1389} {"train_loss": -22.326616287231445, "global_step": 115321, "epoch": 1389} {"train_loss": -22.35526466369629, "global_step": 115322, "epoch": 1389} {"train_loss": -22.408491134643555, "global_step": 115323, "epoch": 1389} {"train_loss": -22.29963493347168, "global_step": 115324, "epoch": 1389} {"train_loss": -22.59124183654785, "global_step": 115325, "epoch": 1389} {"train_loss": -22.3138370513916, "global_step": 115326, "epoch": 1389} {"train_loss": -22.381710052490234, "global_step": 115327, "epoch": 1389} {"train_loss": -22.090938568115234, "global_step": 115328, "epoch": 1389} {"train_loss": -22.453136444091797, "global_step": 115329, "epoch": 1389} {"train_loss": -22.510225296020508, "global_step": 115330, "epoch": 1389} {"train_loss": -22.533817291259766, "global_step": 115331, "epoch": 1389} {"train_loss": -22.56087303161621, "global_step": 115332, "epoch": 1389} {"train_loss": -22.547399520874023, "global_step": 115333, "epoch": 1389} {"train_loss": -22.43548011779785, "global_step": 115334, "epoch": 1389} {"train_loss": -22.35116195678711, "global_step": 115335, "epoch": 1389} {"train_loss": -22.624746322631836, "global_step": 115336, "epoch": 1389} {"train_loss": -22.530664443969727, "global_step": 115337, "epoch": 1389} {"train_loss": -22.694547653198242, "global_step": 115338, "epoch": 1389} {"train_loss": -22.39325523376465, "global_step": 115339, "epoch": 1389} {"train_loss": -22.907421112060547, "global_step": 115340, "epoch": 1389} {"train_loss": -22.36195182800293, "global_step": 115341, "epoch": 1389} {"train_loss": -22.407506942749023, "global_step": 115342, "epoch": 1389} {"train_loss": -22.452213287353516, "global_step": 115343, "epoch": 1389} {"train_loss": -22.426477432250977, "global_step": 115344, "epoch": 1389} {"train_loss": -22.594924926757812, "global_step": 115345, "epoch": 1389} {"train_loss": -22.337453842163086, "global_step": 115346, "epoch": 1389} {"train_loss": -22.527454376220703, "global_step": 115347, "epoch": 1389} {"train_loss": -22.270139694213867, "global_step": 115348, "epoch": 1389} {"train_loss": -22.397720336914062, "global_step": 115349, "epoch": 1389} {"train_loss": -22.041179656982422, "global_step": 115350, "epoch": 1389} {"train_loss": -22.564659118652344, "global_step": 115351, "epoch": 1389} {"train_loss": -22.737289428710938, "global_step": 115352, "epoch": 1389} {"train_loss": -22.634502410888672, "global_step": 115353, "epoch": 1389} {"train_loss": -22.60219955444336, "global_step": 115354, "epoch": 1389} {"train_loss": -22.67696189880371, "global_step": 115355, "epoch": 1389} {"train_loss": -22.578174591064453, "global_step": 115356, "epoch": 1389} {"train_loss": -22.40370750427246, "global_step": 115357, "epoch": 1389} {"train_loss": -22.646732330322266, "global_step": 115358, "epoch": 1389} {"train_loss": -22.51543426513672, "global_step": 115359, "epoch": 1389} {"train_loss": -22.16533660888672, "global_step": 115360, "epoch": 1389} {"train_loss": -22.69141960144043, "global_step": 115361, "epoch": 1389} {"train_loss": -22.110916137695312, "global_step": 115362, "epoch": 1389} {"train_loss": -22.7388973236084, "global_step": 115363, "epoch": 1389} {"train_loss": -22.458572387695312, "global_step": 115364, "epoch": 1389} {"train_loss": -22.261869430541992, "global_step": 115365, "epoch": 1389} {"train_loss": -22.076993942260742, "global_step": 115366, "epoch": 1389} {"train_loss": -21.70546531677246, "global_step": 115367, "epoch": 1389} {"train_loss": -21.79896354675293, "global_step": 115368, "epoch": 1389} {"train_loss": -22.251972244446534, "global_step": 115369, "epoch": 1389, "val_loss": 6173684.0} {"train_loss": -21.978450775146484, "global_step": 115370, "epoch": 1390} {"train_loss": -21.798492431640625, "global_step": 115371, "epoch": 1390} {"train_loss": -21.8983097076416, "global_step": 115372, "epoch": 1390} {"train_loss": -22.08860206604004, "global_step": 115373, "epoch": 1390} {"train_loss": -21.896324157714844, "global_step": 115374, "epoch": 1390} {"train_loss": -21.822282791137695, "global_step": 115375, "epoch": 1390} {"train_loss": -22.17959976196289, "global_step": 115376, "epoch": 1390} {"train_loss": -21.876813888549805, "global_step": 115377, "epoch": 1390} {"train_loss": -21.77780532836914, "global_step": 115378, "epoch": 1390} {"train_loss": -21.939050674438477, "global_step": 115379, "epoch": 1390} {"train_loss": -21.636274337768555, "global_step": 115380, "epoch": 1390} {"train_loss": -22.194080352783203, "global_step": 115381, "epoch": 1390} {"train_loss": -22.29928970336914, "global_step": 115382, "epoch": 1390} {"train_loss": -22.275711059570312, "global_step": 115383, "epoch": 1390} {"train_loss": -21.991025924682617, "global_step": 115384, "epoch": 1390} {"train_loss": -21.89371109008789, "global_step": 115385, "epoch": 1390} {"train_loss": -21.941125869750977, "global_step": 115386, "epoch": 1390} {"train_loss": -21.999868392944336, "global_step": 115387, "epoch": 1390} {"train_loss": -21.894058227539062, "global_step": 115388, "epoch": 1390} {"train_loss": -22.426132202148438, "global_step": 115389, "epoch": 1390} {"train_loss": -22.31207847595215, "global_step": 115390, "epoch": 1390} {"train_loss": -21.79206657409668, "global_step": 115391, "epoch": 1390} {"train_loss": -22.275243759155273, "global_step": 115392, "epoch": 1390} {"train_loss": -22.150196075439453, "global_step": 115393, "epoch": 1390} {"train_loss": -22.0245361328125, "global_step": 115394, "epoch": 1390} {"train_loss": -22.385648727416992, "global_step": 115395, "epoch": 1390} {"train_loss": -22.335718154907227, "global_step": 115396, "epoch": 1390} {"train_loss": -22.549652099609375, "global_step": 115397, "epoch": 1390} {"train_loss": -22.493371963500977, "global_step": 115398, "epoch": 1390} {"train_loss": -22.465579986572266, "global_step": 115399, "epoch": 1390} {"train_loss": -22.33095359802246, "global_step": 115400, "epoch": 1390} {"train_loss": -22.67899513244629, "global_step": 115401, "epoch": 1390} {"train_loss": -22.16067886352539, "global_step": 115402, "epoch": 1390} {"train_loss": -22.147308349609375, "global_step": 115403, "epoch": 1390} {"train_loss": -22.467451095581055, "global_step": 115404, "epoch": 1390} {"train_loss": -22.602155685424805, "global_step": 115405, "epoch": 1390} {"train_loss": -22.467866897583008, "global_step": 115406, "epoch": 1390} {"train_loss": -22.410873413085938, "global_step": 115407, "epoch": 1390} {"train_loss": -22.37929916381836, "global_step": 115408, "epoch": 1390} {"train_loss": -22.330123901367188, "global_step": 115409, "epoch": 1390} {"train_loss": -22.262441635131836, "global_step": 115410, "epoch": 1390} {"train_loss": -21.90926170349121, "global_step": 115411, "epoch": 1390} {"train_loss": -22.63050079345703, "global_step": 115412, "epoch": 1390} {"train_loss": -22.098875045776367, "global_step": 115413, "epoch": 1390} {"train_loss": -22.293441772460938, "global_step": 115414, "epoch": 1390} {"train_loss": -22.44215202331543, "global_step": 115415, "epoch": 1390} {"train_loss": -22.210132598876953, "global_step": 115416, "epoch": 1390} {"train_loss": -22.123558044433594, "global_step": 115417, "epoch": 1390} {"train_loss": -22.11223602294922, "global_step": 115418, "epoch": 1390} {"train_loss": -22.36092185974121, "global_step": 115419, "epoch": 1390} {"train_loss": -22.42282485961914, "global_step": 115420, "epoch": 1390} {"train_loss": -22.004926681518555, "global_step": 115421, "epoch": 1390} {"train_loss": -21.900815963745117, "global_step": 115422, "epoch": 1390} {"train_loss": -22.15894317626953, "global_step": 115423, "epoch": 1390} {"train_loss": -22.71742820739746, "global_step": 115424, "epoch": 1390} {"train_loss": -21.845455169677734, "global_step": 115425, "epoch": 1390} {"train_loss": -22.02534294128418, "global_step": 115426, "epoch": 1390} {"train_loss": -22.256296157836914, "global_step": 115427, "epoch": 1390} {"train_loss": -22.057355880737305, "global_step": 115428, "epoch": 1390} {"train_loss": -22.64095687866211, "global_step": 115429, "epoch": 1390} {"train_loss": -22.183292388916016, "global_step": 115430, "epoch": 1390} {"train_loss": -22.273670196533203, "global_step": 115431, "epoch": 1390} {"train_loss": -22.324588775634766, "global_step": 115432, "epoch": 1390} {"train_loss": -22.29157066345215, "global_step": 115433, "epoch": 1390} {"train_loss": -22.45113754272461, "global_step": 115434, "epoch": 1390} {"train_loss": -22.308761596679688, "global_step": 115435, "epoch": 1390} {"train_loss": -22.590147018432617, "global_step": 115436, "epoch": 1390} {"train_loss": -22.235782623291016, "global_step": 115437, "epoch": 1390} {"train_loss": -22.83436393737793, "global_step": 115438, "epoch": 1390} {"train_loss": -22.378376007080078, "global_step": 115439, "epoch": 1390} {"train_loss": -22.309772491455078, "global_step": 115440, "epoch": 1390} {"train_loss": -22.44122886657715, "global_step": 115441, "epoch": 1390} {"train_loss": -22.0756893157959, "global_step": 115442, "epoch": 1390} {"train_loss": -22.087303161621094, "global_step": 115443, "epoch": 1390} {"train_loss": -22.545076370239258, "global_step": 115444, "epoch": 1390} {"train_loss": -22.269535064697266, "global_step": 115445, "epoch": 1390} {"train_loss": -22.318933486938477, "global_step": 115446, "epoch": 1390} {"train_loss": -22.085010528564453, "global_step": 115447, "epoch": 1390} {"train_loss": -21.962499618530273, "global_step": 115448, "epoch": 1390} {"train_loss": -22.105161666870117, "global_step": 115449, "epoch": 1390} {"train_loss": -22.129186630249023, "global_step": 115450, "epoch": 1390} {"train_loss": -22.303909301757812, "global_step": 115451, "epoch": 1390} {"train_loss": -22.20640582348927, "global_step": 115452, "epoch": 1390, "val_loss": 6207114.0} {"train_loss": -21.690933227539062, "global_step": 115453, "epoch": 1391} {"train_loss": -22.058866500854492, "global_step": 115454, "epoch": 1391} {"train_loss": -22.0670223236084, "global_step": 115455, "epoch": 1391} {"train_loss": -21.885066986083984, "global_step": 115456, "epoch": 1391} {"train_loss": -21.601659774780273, "global_step": 115457, "epoch": 1391} {"train_loss": -21.846267700195312, "global_step": 115458, "epoch": 1391} {"train_loss": -22.044736862182617, "global_step": 115459, "epoch": 1391} {"train_loss": -22.002445220947266, "global_step": 115460, "epoch": 1391} {"train_loss": -21.95713996887207, "global_step": 115461, "epoch": 1391} {"train_loss": -22.400922775268555, "global_step": 115462, "epoch": 1391} {"train_loss": -21.909194946289062, "global_step": 115463, "epoch": 1391} {"train_loss": -22.164796829223633, "global_step": 115464, "epoch": 1391} {"train_loss": -21.75580406188965, "global_step": 115465, "epoch": 1391} {"train_loss": -22.06928825378418, "global_step": 115466, "epoch": 1391} {"train_loss": -22.54563331604004, "global_step": 115467, "epoch": 1391} {"train_loss": -22.194847106933594, "global_step": 115468, "epoch": 1391} {"train_loss": -22.26227378845215, "global_step": 115469, "epoch": 1391} {"train_loss": -22.132055282592773, "global_step": 115470, "epoch": 1391} {"train_loss": -22.43257713317871, "global_step": 115471, "epoch": 1391} {"train_loss": -22.149442672729492, "global_step": 115472, "epoch": 1391} {"train_loss": -22.362716674804688, "global_step": 115473, "epoch": 1391} {"train_loss": -22.19373893737793, "global_step": 115474, "epoch": 1391} {"train_loss": -22.2596492767334, "global_step": 115475, "epoch": 1391} {"train_loss": -22.39284324645996, "global_step": 115476, "epoch": 1391} {"train_loss": -22.46872329711914, "global_step": 115477, "epoch": 1391} {"train_loss": -22.410146713256836, "global_step": 115478, "epoch": 1391} {"train_loss": -22.23945426940918, "global_step": 115479, "epoch": 1391} {"train_loss": -22.454328536987305, "global_step": 115480, "epoch": 1391} {"train_loss": -22.22285270690918, "global_step": 115481, "epoch": 1391} {"train_loss": -22.410850524902344, "global_step": 115482, "epoch": 1391} {"train_loss": -22.148916244506836, "global_step": 115483, "epoch": 1391} {"train_loss": -22.395429611206055, "global_step": 115484, "epoch": 1391} {"train_loss": -22.25274085998535, "global_step": 115485, "epoch": 1391} {"train_loss": -22.476253509521484, "global_step": 115486, "epoch": 1391} {"train_loss": -22.280134201049805, "global_step": 115487, "epoch": 1391} {"train_loss": -22.189361572265625, "global_step": 115488, "epoch": 1391} {"train_loss": -22.264310836791992, "global_step": 115489, "epoch": 1391} {"train_loss": -22.131132125854492, "global_step": 115490, "epoch": 1391} {"train_loss": -22.20105743408203, "global_step": 115491, "epoch": 1391} {"train_loss": -22.343896865844727, "global_step": 115492, "epoch": 1391} {"train_loss": -22.43402671813965, "global_step": 115493, "epoch": 1391} {"train_loss": -22.477392196655273, "global_step": 115494, "epoch": 1391} {"train_loss": -22.48842430114746, "global_step": 115495, "epoch": 1391} {"train_loss": -22.23305320739746, "global_step": 115496, "epoch": 1391} {"train_loss": -22.0916690826416, "global_step": 115497, "epoch": 1391} {"train_loss": -22.27802085876465, "global_step": 115498, "epoch": 1391} {"train_loss": -22.372663497924805, "global_step": 115499, "epoch": 1391} {"train_loss": -22.36244773864746, "global_step": 115500, "epoch": 1391} {"train_loss": -22.659658432006836, "global_step": 115501, "epoch": 1391} {"train_loss": -22.012964248657227, "global_step": 115502, "epoch": 1391} {"train_loss": -21.95387077331543, "global_step": 115503, "epoch": 1391} {"train_loss": -22.102569580078125, "global_step": 115504, "epoch": 1391} {"train_loss": -22.383193969726562, "global_step": 115505, "epoch": 1391} {"train_loss": -22.37508201599121, "global_step": 115506, "epoch": 1391} {"train_loss": -22.101699829101562, "global_step": 115507, "epoch": 1391} {"train_loss": -22.710786819458008, "global_step": 115508, "epoch": 1391} {"train_loss": -22.553396224975586, "global_step": 115509, "epoch": 1391} {"train_loss": -22.437053680419922, "global_step": 115510, "epoch": 1391} {"train_loss": -22.321393966674805, "global_step": 115511, "epoch": 1391} {"train_loss": -22.34157371520996, "global_step": 115512, "epoch": 1391} {"train_loss": -22.743667602539062, "global_step": 115513, "epoch": 1391} {"train_loss": -22.483732223510742, "global_step": 115514, "epoch": 1391} {"train_loss": -22.507726669311523, "global_step": 115515, "epoch": 1391} {"train_loss": -22.368017196655273, "global_step": 115516, "epoch": 1391} {"train_loss": -22.312864303588867, "global_step": 115517, "epoch": 1391} {"train_loss": -22.49930763244629, "global_step": 115518, "epoch": 1391} {"train_loss": -22.937807083129883, "global_step": 115519, "epoch": 1391} {"train_loss": -22.624052047729492, "global_step": 115520, "epoch": 1391} {"train_loss": -22.28291130065918, "global_step": 115521, "epoch": 1391} {"train_loss": -22.5683536529541, "global_step": 115522, "epoch": 1391} {"train_loss": -22.54606056213379, "global_step": 115523, "epoch": 1391} {"train_loss": -22.401294708251953, "global_step": 115524, "epoch": 1391} {"train_loss": -22.491331100463867, "global_step": 115525, "epoch": 1391} {"train_loss": -22.476362228393555, "global_step": 115526, "epoch": 1391} {"train_loss": -22.58321189880371, "global_step": 115527, "epoch": 1391} {"train_loss": -22.588581085205078, "global_step": 115528, "epoch": 1391} {"train_loss": -22.245885848999023, "global_step": 115529, "epoch": 1391} {"train_loss": -22.360855102539062, "global_step": 115530, "epoch": 1391} {"train_loss": -22.36813735961914, "global_step": 115531, "epoch": 1391} {"train_loss": -22.294519424438477, "global_step": 115532, "epoch": 1391} {"train_loss": -22.36606788635254, "global_step": 115533, "epoch": 1391} {"train_loss": -22.318452835083008, "global_step": 115534, "epoch": 1391} {"train_loss": -22.294348521404956, "global_step": 115535, "epoch": 1391, "val_loss": 6334107.0} {"train_loss": -22.456674575805664, "global_step": 115536, "epoch": 1392} {"train_loss": -21.787988662719727, "global_step": 115537, "epoch": 1392} {"train_loss": -21.969608306884766, "global_step": 115538, "epoch": 1392} {"train_loss": -22.096220016479492, "global_step": 115539, "epoch": 1392} {"train_loss": -21.984609603881836, "global_step": 115540, "epoch": 1392} {"train_loss": -22.18308448791504, "global_step": 115541, "epoch": 1392} {"train_loss": -21.865528106689453, "global_step": 115542, "epoch": 1392} {"train_loss": -22.057348251342773, "global_step": 115543, "epoch": 1392} {"train_loss": -22.250625610351562, "global_step": 115544, "epoch": 1392} {"train_loss": -22.043699264526367, "global_step": 115545, "epoch": 1392} {"train_loss": -22.70895767211914, "global_step": 115546, "epoch": 1392} {"train_loss": -22.25312614440918, "global_step": 115547, "epoch": 1392} {"train_loss": -22.088973999023438, "global_step": 115548, "epoch": 1392} {"train_loss": -22.168231964111328, "global_step": 115549, "epoch": 1392} {"train_loss": -22.37849998474121, "global_step": 115550, "epoch": 1392} {"train_loss": -22.246854782104492, "global_step": 115551, "epoch": 1392} {"train_loss": -22.283416748046875, "global_step": 115552, "epoch": 1392} {"train_loss": -22.33860206604004, "global_step": 115553, "epoch": 1392} {"train_loss": -22.435468673706055, "global_step": 115554, "epoch": 1392} {"train_loss": -22.739246368408203, "global_step": 115555, "epoch": 1392} {"train_loss": -22.28076171875, "global_step": 115556, "epoch": 1392} {"train_loss": -22.321521759033203, "global_step": 115557, "epoch": 1392} {"train_loss": -21.977079391479492, "global_step": 115558, "epoch": 1392} {"train_loss": -22.295228958129883, "global_step": 115559, "epoch": 1392} {"train_loss": -22.542224884033203, "global_step": 115560, "epoch": 1392} {"train_loss": -22.493122100830078, "global_step": 115561, "epoch": 1392} {"train_loss": -22.099817276000977, "global_step": 115562, "epoch": 1392} {"train_loss": -22.42826271057129, "global_step": 115563, "epoch": 1392} {"train_loss": -22.312726974487305, "global_step": 115564, "epoch": 1392} {"train_loss": -22.502674102783203, "global_step": 115565, "epoch": 1392} {"train_loss": -22.21603775024414, "global_step": 115566, "epoch": 1392} {"train_loss": -22.615707397460938, "global_step": 115567, "epoch": 1392} {"train_loss": -22.40382957458496, "global_step": 115568, "epoch": 1392} {"train_loss": -22.64094352722168, "global_step": 115569, "epoch": 1392} {"train_loss": -22.47559928894043, "global_step": 115570, "epoch": 1392} {"train_loss": -22.2283935546875, "global_step": 115571, "epoch": 1392} {"train_loss": -22.526559829711914, "global_step": 115572, "epoch": 1392} {"train_loss": -22.388038635253906, "global_step": 115573, "epoch": 1392} {"train_loss": -22.84689712524414, "global_step": 115574, "epoch": 1392} {"train_loss": -22.51925277709961, "global_step": 115575, "epoch": 1392} {"train_loss": -22.234006881713867, "global_step": 115576, "epoch": 1392} {"train_loss": -22.530630111694336, "global_step": 115577, "epoch": 1392} {"train_loss": -22.261037826538086, "global_step": 115578, "epoch": 1392} {"train_loss": -22.531904220581055, "global_step": 115579, "epoch": 1392} {"train_loss": -22.638864517211914, "global_step": 115580, "epoch": 1392} {"train_loss": -22.48883628845215, "global_step": 115581, "epoch": 1392} {"train_loss": -22.238014221191406, "global_step": 115582, "epoch": 1392} {"train_loss": -22.429813385009766, "global_step": 115583, "epoch": 1392} {"train_loss": -22.384098052978516, "global_step": 115584, "epoch": 1392} {"train_loss": -22.129085540771484, "global_step": 115585, "epoch": 1392} {"train_loss": -22.68747901916504, "global_step": 115586, "epoch": 1392} {"train_loss": -22.630617141723633, "global_step": 115587, "epoch": 1392} {"train_loss": -22.875354766845703, "global_step": 115588, "epoch": 1392} {"train_loss": -22.732952117919922, "global_step": 115589, "epoch": 1392} {"train_loss": -22.510150909423828, "global_step": 115590, "epoch": 1392} {"train_loss": -22.475393295288086, "global_step": 115591, "epoch": 1392} {"train_loss": -22.385465621948242, "global_step": 115592, "epoch": 1392} {"train_loss": -22.4717960357666, "global_step": 115593, "epoch": 1392} {"train_loss": -22.48579978942871, "global_step": 115594, "epoch": 1392} {"train_loss": -22.410612106323242, "global_step": 115595, "epoch": 1392} {"train_loss": -22.45070457458496, "global_step": 115596, "epoch": 1392} {"train_loss": -22.220252990722656, "global_step": 115597, "epoch": 1392} {"train_loss": -22.530912399291992, "global_step": 115598, "epoch": 1392} {"train_loss": -22.69528579711914, "global_step": 115599, "epoch": 1392} {"train_loss": -22.436424255371094, "global_step": 115600, "epoch": 1392} {"train_loss": -22.553730010986328, "global_step": 115601, "epoch": 1392} {"train_loss": -22.248523712158203, "global_step": 115602, "epoch": 1392} {"train_loss": -22.344482421875, "global_step": 115603, "epoch": 1392} {"train_loss": -22.1924991607666, "global_step": 115604, "epoch": 1392} {"train_loss": -22.31927490234375, "global_step": 115605, "epoch": 1392} {"train_loss": -22.618528366088867, "global_step": 115606, "epoch": 1392} {"train_loss": -22.462799072265625, "global_step": 115607, "epoch": 1392} {"train_loss": -22.657611846923828, "global_step": 115608, "epoch": 1392} {"train_loss": -22.22681999206543, "global_step": 115609, "epoch": 1392} {"train_loss": -22.05128288269043, "global_step": 115610, "epoch": 1392} {"train_loss": -22.283384323120117, "global_step": 115611, "epoch": 1392} {"train_loss": -22.44525909423828, "global_step": 115612, "epoch": 1392} {"train_loss": -22.41193962097168, "global_step": 115613, "epoch": 1392} {"train_loss": -22.236515045166016, "global_step": 115614, "epoch": 1392} {"train_loss": -22.45601463317871, "global_step": 115615, "epoch": 1392} {"train_loss": -22.541778564453125, "global_step": 115616, "epoch": 1392} {"train_loss": -22.433788299560547, "global_step": 115617, "epoch": 1392} {"train_loss": -22.38795981349715, "global_step": 115618, "epoch": 1392, "val_loss": 6121297.5} {"train_loss": -21.55299186706543, "global_step": 115619, "epoch": 1393} {"train_loss": -21.705036163330078, "global_step": 115620, "epoch": 1393} {"train_loss": -21.843740463256836, "global_step": 115621, "epoch": 1393} {"train_loss": -21.675687789916992, "global_step": 115622, "epoch": 1393} {"train_loss": -21.711639404296875, "global_step": 115623, "epoch": 1393} {"train_loss": -22.217060089111328, "global_step": 115624, "epoch": 1393} {"train_loss": -22.106595993041992, "global_step": 115625, "epoch": 1393} {"train_loss": -21.60362434387207, "global_step": 115626, "epoch": 1393} {"train_loss": -22.45832633972168, "global_step": 115627, "epoch": 1393} {"train_loss": -22.181562423706055, "global_step": 115628, "epoch": 1393} {"train_loss": -22.3074951171875, "global_step": 115629, "epoch": 1393} {"train_loss": -22.073169708251953, "global_step": 115630, "epoch": 1393} {"train_loss": -22.171533584594727, "global_step": 115631, "epoch": 1393} {"train_loss": -22.397825241088867, "global_step": 115632, "epoch": 1393} {"train_loss": -22.29092788696289, "global_step": 115633, "epoch": 1393} {"train_loss": -21.987085342407227, "global_step": 115634, "epoch": 1393} {"train_loss": -22.14242935180664, "global_step": 115635, "epoch": 1393} {"train_loss": -22.162601470947266, "global_step": 115636, "epoch": 1393} {"train_loss": -22.212202072143555, "global_step": 115637, "epoch": 1393} {"train_loss": -22.095233917236328, "global_step": 115638, "epoch": 1393} {"train_loss": -22.42439842224121, "global_step": 115639, "epoch": 1393} {"train_loss": -22.473434448242188, "global_step": 115640, "epoch": 1393} {"train_loss": -22.178443908691406, "global_step": 115641, "epoch": 1393} {"train_loss": -22.152334213256836, "global_step": 115642, "epoch": 1393} {"train_loss": -22.4427433013916, "global_step": 115643, "epoch": 1393} {"train_loss": -22.4846134185791, "global_step": 115644, "epoch": 1393} {"train_loss": -22.442401885986328, "global_step": 115645, "epoch": 1393} {"train_loss": -22.459001541137695, "global_step": 115646, "epoch": 1393} {"train_loss": -22.62355613708496, "global_step": 115647, "epoch": 1393} {"train_loss": -22.833845138549805, "global_step": 115648, "epoch": 1393} {"train_loss": -22.29239273071289, "global_step": 115649, "epoch": 1393} {"train_loss": -22.11272430419922, "global_step": 115650, "epoch": 1393} {"train_loss": -22.045520782470703, "global_step": 115651, "epoch": 1393} {"train_loss": -22.591495513916016, "global_step": 115652, "epoch": 1393} {"train_loss": -22.634897232055664, "global_step": 115653, "epoch": 1393} {"train_loss": -21.900592803955078, "global_step": 115654, "epoch": 1393} {"train_loss": -21.60501480102539, "global_step": 115655, "epoch": 1393} {"train_loss": -22.645601272583008, "global_step": 115656, "epoch": 1393} {"train_loss": -22.35214614868164, "global_step": 115657, "epoch": 1393} {"train_loss": -22.003583908081055, "global_step": 115658, "epoch": 1393} {"train_loss": -22.384321212768555, "global_step": 115659, "epoch": 1393} {"train_loss": -22.290597915649414, "global_step": 115660, "epoch": 1393} {"train_loss": -22.230375289916992, "global_step": 115661, "epoch": 1393} {"train_loss": -22.20762062072754, "global_step": 115662, "epoch": 1393} {"train_loss": -22.274206161499023, "global_step": 115663, "epoch": 1393} {"train_loss": -22.149444580078125, "global_step": 115664, "epoch": 1393} {"train_loss": -22.110105514526367, "global_step": 115665, "epoch": 1393} {"train_loss": -22.414094924926758, "global_step": 115666, "epoch": 1393} {"train_loss": -22.564054489135742, "global_step": 115667, "epoch": 1393} {"train_loss": -22.432453155517578, "global_step": 115668, "epoch": 1393} {"train_loss": -22.1361083984375, "global_step": 115669, "epoch": 1393} {"train_loss": -22.323623657226562, "global_step": 115670, "epoch": 1393} {"train_loss": -22.1478214263916, "global_step": 115671, "epoch": 1393} {"train_loss": -22.432819366455078, "global_step": 115672, "epoch": 1393} {"train_loss": -22.205135345458984, "global_step": 115673, "epoch": 1393} {"train_loss": -22.268661499023438, "global_step": 115674, "epoch": 1393} {"train_loss": -22.62367057800293, "global_step": 115675, "epoch": 1393} {"train_loss": -22.09248924255371, "global_step": 115676, "epoch": 1393} {"train_loss": -22.291797637939453, "global_step": 115677, "epoch": 1393} {"train_loss": -22.553861618041992, "global_step": 115678, "epoch": 1393} {"train_loss": -22.976903915405273, "global_step": 115679, "epoch": 1393} {"train_loss": -21.900615692138672, "global_step": 115680, "epoch": 1393} {"train_loss": -22.252777099609375, "global_step": 115681, "epoch": 1393} {"train_loss": -22.38285255432129, "global_step": 115682, "epoch": 1393} {"train_loss": -22.422182083129883, "global_step": 115683, "epoch": 1393} {"train_loss": -22.189680099487305, "global_step": 115684, "epoch": 1393} {"train_loss": -22.873863220214844, "global_step": 115685, "epoch": 1393} {"train_loss": -22.402984619140625, "global_step": 115686, "epoch": 1393} {"train_loss": -22.926172256469727, "global_step": 115687, "epoch": 1393} {"train_loss": -22.419267654418945, "global_step": 115688, "epoch": 1393} {"train_loss": -22.455881118774414, "global_step": 115689, "epoch": 1393} {"train_loss": -22.725088119506836, "global_step": 115690, "epoch": 1393} {"train_loss": -22.296022415161133, "global_step": 115691, "epoch": 1393} {"train_loss": -22.29467010498047, "global_step": 115692, "epoch": 1393} {"train_loss": -22.75380516052246, "global_step": 115693, "epoch": 1393} {"train_loss": -22.43316078186035, "global_step": 115694, "epoch": 1393} {"train_loss": -22.20889663696289, "global_step": 115695, "epoch": 1393} {"train_loss": -22.320297241210938, "global_step": 115696, "epoch": 1393} {"train_loss": -22.175167083740234, "global_step": 115697, "epoch": 1393} {"train_loss": -22.36212730407715, "global_step": 115698, "epoch": 1393} {"train_loss": -22.533557891845703, "global_step": 115699, "epoch": 1393} {"train_loss": -22.26630210876465, "global_step": 115700, "epoch": 1393} {"train_loss": -22.28830218027873, "global_step": 115701, "epoch": 1393, "val_loss": 6174603.0} {"train_loss": -21.84078598022461, "global_step": 115702, "epoch": 1394} {"train_loss": -21.351741790771484, "global_step": 115703, "epoch": 1394} {"train_loss": -22.117273330688477, "global_step": 115704, "epoch": 1394} {"train_loss": -22.314319610595703, "global_step": 115705, "epoch": 1394} {"train_loss": -21.55806541442871, "global_step": 115706, "epoch": 1394} {"train_loss": -21.912948608398438, "global_step": 115707, "epoch": 1394} {"train_loss": -21.778444290161133, "global_step": 115708, "epoch": 1394} {"train_loss": -22.279245376586914, "global_step": 115709, "epoch": 1394} {"train_loss": -22.159452438354492, "global_step": 115710, "epoch": 1394} {"train_loss": -22.039209365844727, "global_step": 115711, "epoch": 1394} {"train_loss": -22.258134841918945, "global_step": 115712, "epoch": 1394} {"train_loss": -22.098644256591797, "global_step": 115713, "epoch": 1394} {"train_loss": -22.182682037353516, "global_step": 115714, "epoch": 1394} {"train_loss": -21.9688777923584, "global_step": 115715, "epoch": 1394} {"train_loss": -21.887916564941406, "global_step": 115716, "epoch": 1394} {"train_loss": -22.50239372253418, "global_step": 115717, "epoch": 1394} {"train_loss": -22.462560653686523, "global_step": 115718, "epoch": 1394} {"train_loss": -22.135568618774414, "global_step": 115719, "epoch": 1394} {"train_loss": -22.381267547607422, "global_step": 115720, "epoch": 1394} {"train_loss": -22.438459396362305, "global_step": 115721, "epoch": 1394} {"train_loss": -22.518831253051758, "global_step": 115722, "epoch": 1394} {"train_loss": -22.41652488708496, "global_step": 115723, "epoch": 1394} {"train_loss": -22.234601974487305, "global_step": 115724, "epoch": 1394} {"train_loss": -22.139148712158203, "global_step": 115725, "epoch": 1394} {"train_loss": -22.726961135864258, "global_step": 115726, "epoch": 1394} {"train_loss": -22.32904624938965, "global_step": 115727, "epoch": 1394} {"train_loss": -22.325414657592773, "global_step": 115728, "epoch": 1394} {"train_loss": -22.221006393432617, "global_step": 115729, "epoch": 1394} {"train_loss": -22.50564193725586, "global_step": 115730, "epoch": 1394} {"train_loss": -22.275959014892578, "global_step": 115731, "epoch": 1394} {"train_loss": -22.533079147338867, "global_step": 115732, "epoch": 1394} {"train_loss": -22.54676628112793, "global_step": 115733, "epoch": 1394} {"train_loss": -22.281471252441406, "global_step": 115734, "epoch": 1394} {"train_loss": -22.756742477416992, "global_step": 115735, "epoch": 1394} {"train_loss": -22.474843978881836, "global_step": 115736, "epoch": 1394} {"train_loss": -22.68703269958496, "global_step": 115737, "epoch": 1394} {"train_loss": -22.265274047851562, "global_step": 115738, "epoch": 1394} {"train_loss": -22.493106842041016, "global_step": 115739, "epoch": 1394} {"train_loss": -22.561237335205078, "global_step": 115740, "epoch": 1394} {"train_loss": -22.524253845214844, "global_step": 115741, "epoch": 1394} {"train_loss": -22.388883590698242, "global_step": 115742, "epoch": 1394} {"train_loss": -22.57852554321289, "global_step": 115743, "epoch": 1394} {"train_loss": -22.700117111206055, "global_step": 115744, "epoch": 1394} {"train_loss": -22.345102310180664, "global_step": 115745, "epoch": 1394} {"train_loss": -22.561628341674805, "global_step": 115746, "epoch": 1394} {"train_loss": -22.1792049407959, "global_step": 115747, "epoch": 1394} {"train_loss": -22.637113571166992, "global_step": 115748, "epoch": 1394} {"train_loss": -22.661291122436523, "global_step": 115749, "epoch": 1394} {"train_loss": -22.126615524291992, "global_step": 115750, "epoch": 1394} {"train_loss": -22.634183883666992, "global_step": 115751, "epoch": 1394} {"train_loss": -22.446897506713867, "global_step": 115752, "epoch": 1394} {"train_loss": -22.342571258544922, "global_step": 115753, "epoch": 1394} {"train_loss": -22.265703201293945, "global_step": 115754, "epoch": 1394} {"train_loss": -22.395111083984375, "global_step": 115755, "epoch": 1394} {"train_loss": -22.490047454833984, "global_step": 115756, "epoch": 1394} {"train_loss": -22.673566818237305, "global_step": 115757, "epoch": 1394} {"train_loss": -22.280426025390625, "global_step": 115758, "epoch": 1394} {"train_loss": -22.42256736755371, "global_step": 115759, "epoch": 1394} {"train_loss": -22.337900161743164, "global_step": 115760, "epoch": 1394} {"train_loss": -22.5714168548584, "global_step": 115761, "epoch": 1394} {"train_loss": -22.7376766204834, "global_step": 115762, "epoch": 1394} {"train_loss": -22.328353881835938, "global_step": 115763, "epoch": 1394} {"train_loss": -22.768407821655273, "global_step": 115764, "epoch": 1394} {"train_loss": -23.041311264038086, "global_step": 115765, "epoch": 1394} {"train_loss": -22.6350154876709, "global_step": 115766, "epoch": 1394} {"train_loss": -22.349573135375977, "global_step": 115767, "epoch": 1394} {"train_loss": -22.44838523864746, "global_step": 115768, "epoch": 1394} {"train_loss": -22.519229888916016, "global_step": 115769, "epoch": 1394} {"train_loss": -22.469892501831055, "global_step": 115770, "epoch": 1394} {"train_loss": -22.253080368041992, "global_step": 115771, "epoch": 1394} {"train_loss": -22.117630004882812, "global_step": 115772, "epoch": 1394} {"train_loss": -22.79463005065918, "global_step": 115773, "epoch": 1394} {"train_loss": -22.567119598388672, "global_step": 115774, "epoch": 1394} {"train_loss": -22.736183166503906, "global_step": 115775, "epoch": 1394} {"train_loss": -22.414579391479492, "global_step": 115776, "epoch": 1394} {"train_loss": -22.31812858581543, "global_step": 115777, "epoch": 1394} {"train_loss": -22.325918197631836, "global_step": 115778, "epoch": 1394} {"train_loss": -22.142221450805664, "global_step": 115779, "epoch": 1394} {"train_loss": -22.699222564697266, "global_step": 115780, "epoch": 1394} {"train_loss": -22.481088638305664, "global_step": 115781, "epoch": 1394} {"train_loss": -22.04066276550293, "global_step": 115782, "epoch": 1394} {"train_loss": -22.1925106048584, "global_step": 115783, "epoch": 1394} {"train_loss": -22.3598443686244, "global_step": 115784, "epoch": 1394, "val_loss": 6205297.5} {"train_loss": -22.052886962890625, "global_step": 115785, "epoch": 1395} {"train_loss": -21.238197326660156, "global_step": 115786, "epoch": 1395} {"train_loss": -21.800901412963867, "global_step": 115787, "epoch": 1395} {"train_loss": -21.8065185546875, "global_step": 115788, "epoch": 1395} {"train_loss": -22.23573875427246, "global_step": 115789, "epoch": 1395} {"train_loss": -21.876861572265625, "global_step": 115790, "epoch": 1395} {"train_loss": -22.089340209960938, "global_step": 115791, "epoch": 1395} {"train_loss": -22.17085838317871, "global_step": 115792, "epoch": 1395} {"train_loss": -22.306577682495117, "global_step": 115793, "epoch": 1395} {"train_loss": -21.917264938354492, "global_step": 115794, "epoch": 1395} {"train_loss": -22.118057250976562, "global_step": 115795, "epoch": 1395} {"train_loss": -22.12178611755371, "global_step": 115796, "epoch": 1395} {"train_loss": -22.1004695892334, "global_step": 115797, "epoch": 1395} {"train_loss": -22.1380558013916, "global_step": 115798, "epoch": 1395} {"train_loss": -22.010751724243164, "global_step": 115799, "epoch": 1395} {"train_loss": -22.34231948852539, "global_step": 115800, "epoch": 1395} {"train_loss": -22.30031967163086, "global_step": 115801, "epoch": 1395} {"train_loss": -22.029165267944336, "global_step": 115802, "epoch": 1395} {"train_loss": -22.09355354309082, "global_step": 115803, "epoch": 1395} {"train_loss": -22.127012252807617, "global_step": 115804, "epoch": 1395} {"train_loss": -22.19476318359375, "global_step": 115805, "epoch": 1395} {"train_loss": -22.340866088867188, "global_step": 115806, "epoch": 1395} {"train_loss": -22.17008399963379, "global_step": 115807, "epoch": 1395} {"train_loss": -22.217041015625, "global_step": 115808, "epoch": 1395} {"train_loss": -22.352121353149414, "global_step": 115809, "epoch": 1395} {"train_loss": -22.322011947631836, "global_step": 115810, "epoch": 1395} {"train_loss": -22.214677810668945, "global_step": 115811, "epoch": 1395} {"train_loss": -22.25999641418457, "global_step": 115812, "epoch": 1395} {"train_loss": -22.335296630859375, "global_step": 115813, "epoch": 1395} {"train_loss": -22.576078414916992, "global_step": 115814, "epoch": 1395} {"train_loss": -22.514892578125, "global_step": 115815, "epoch": 1395} {"train_loss": -22.097667694091797, "global_step": 115816, "epoch": 1395} {"train_loss": -22.39304542541504, "global_step": 115817, "epoch": 1395} {"train_loss": -22.538419723510742, "global_step": 115818, "epoch": 1395} {"train_loss": -22.39410972595215, "global_step": 115819, "epoch": 1395} {"train_loss": -22.5212459564209, "global_step": 115820, "epoch": 1395} {"train_loss": -22.774290084838867, "global_step": 115821, "epoch": 1395} {"train_loss": -22.121152877807617, "global_step": 115822, "epoch": 1395} {"train_loss": -22.397171020507812, "global_step": 115823, "epoch": 1395} {"train_loss": -22.614439010620117, "global_step": 115824, "epoch": 1395} {"train_loss": -22.281478881835938, "global_step": 115825, "epoch": 1395} {"train_loss": -22.274412155151367, "global_step": 115826, "epoch": 1395} {"train_loss": -22.325725555419922, "global_step": 115827, "epoch": 1395} {"train_loss": -22.277326583862305, "global_step": 115828, "epoch": 1395} {"train_loss": -22.05118179321289, "global_step": 115829, "epoch": 1395} {"train_loss": -22.33748435974121, "global_step": 115830, "epoch": 1395} {"train_loss": -22.199277877807617, "global_step": 115831, "epoch": 1395} {"train_loss": -22.509199142456055, "global_step": 115832, "epoch": 1395} {"train_loss": -22.69159507751465, "global_step": 115833, "epoch": 1395} {"train_loss": -21.967844009399414, "global_step": 115834, "epoch": 1395} {"train_loss": -22.50665283203125, "global_step": 115835, "epoch": 1395} {"train_loss": -22.530967712402344, "global_step": 115836, "epoch": 1395} {"train_loss": -22.313159942626953, "global_step": 115837, "epoch": 1395} {"train_loss": -22.26544761657715, "global_step": 115838, "epoch": 1395} {"train_loss": -22.347122192382812, "global_step": 115839, "epoch": 1395} {"train_loss": -22.341642379760742, "global_step": 115840, "epoch": 1395} {"train_loss": -22.49348258972168, "global_step": 115841, "epoch": 1395} {"train_loss": -22.279525756835938, "global_step": 115842, "epoch": 1395} {"train_loss": -22.900497436523438, "global_step": 115843, "epoch": 1395} {"train_loss": -22.249296188354492, "global_step": 115844, "epoch": 1395} {"train_loss": -22.69257926940918, "global_step": 115845, "epoch": 1395} {"train_loss": -22.676559448242188, "global_step": 115846, "epoch": 1395} {"train_loss": -22.10242462158203, "global_step": 115847, "epoch": 1395} {"train_loss": -22.382369995117188, "global_step": 115848, "epoch": 1395} {"train_loss": -22.432601928710938, "global_step": 115849, "epoch": 1395} {"train_loss": -22.34351921081543, "global_step": 115850, "epoch": 1395} {"train_loss": -22.338926315307617, "global_step": 115851, "epoch": 1395} {"train_loss": -22.445066452026367, "global_step": 115852, "epoch": 1395} {"train_loss": -22.72464942932129, "global_step": 115853, "epoch": 1395} {"train_loss": -22.504182815551758, "global_step": 115854, "epoch": 1395} {"train_loss": -23.11268424987793, "global_step": 115855, "epoch": 1395} {"train_loss": -22.595779418945312, "global_step": 115856, "epoch": 1395} {"train_loss": -22.567106246948242, "global_step": 115857, "epoch": 1395} {"train_loss": -22.78851318359375, "global_step": 115858, "epoch": 1395} {"train_loss": -22.483232498168945, "global_step": 115859, "epoch": 1395} {"train_loss": -22.871936798095703, "global_step": 115860, "epoch": 1395} {"train_loss": -22.333473205566406, "global_step": 115861, "epoch": 1395} {"train_loss": -22.532123565673828, "global_step": 115862, "epoch": 1395} {"train_loss": -22.310894012451172, "global_step": 115863, "epoch": 1395} {"train_loss": -22.590822219848633, "global_step": 115864, "epoch": 1395} {"train_loss": -22.33855628967285, "global_step": 115865, "epoch": 1395} {"train_loss": -22.46500587463379, "global_step": 115866, "epoch": 1395} {"train_loss": -22.33312972195177, "global_step": 115867, "epoch": 1395, "val_loss": 6126132.0} {"train_loss": -22.07611083984375, "global_step": 115868, "epoch": 1396} {"train_loss": -22.2274227142334, "global_step": 115869, "epoch": 1396} {"train_loss": -21.75203514099121, "global_step": 115870, "epoch": 1396} {"train_loss": -22.025732040405273, "global_step": 115871, "epoch": 1396} {"train_loss": -22.643712997436523, "global_step": 115872, "epoch": 1396} {"train_loss": -22.515914916992188, "global_step": 115873, "epoch": 1396} {"train_loss": -22.479345321655273, "global_step": 115874, "epoch": 1396} {"train_loss": -22.119529724121094, "global_step": 115875, "epoch": 1396} {"train_loss": -22.47565269470215, "global_step": 115876, "epoch": 1396} {"train_loss": -22.383403778076172, "global_step": 115877, "epoch": 1396} {"train_loss": -22.400718688964844, "global_step": 115878, "epoch": 1396} {"train_loss": -22.336654663085938, "global_step": 115879, "epoch": 1396} {"train_loss": -22.268573760986328, "global_step": 115880, "epoch": 1396} {"train_loss": -22.35485076904297, "global_step": 115881, "epoch": 1396} {"train_loss": -22.639219284057617, "global_step": 115882, "epoch": 1396} {"train_loss": -22.44599723815918, "global_step": 115883, "epoch": 1396} {"train_loss": -22.277509689331055, "global_step": 115884, "epoch": 1396} {"train_loss": -22.559419631958008, "global_step": 115885, "epoch": 1396} {"train_loss": -22.352115631103516, "global_step": 115886, "epoch": 1396} {"train_loss": -22.760520935058594, "global_step": 115887, "epoch": 1396} {"train_loss": -22.181215286254883, "global_step": 115888, "epoch": 1396} {"train_loss": -22.26173210144043, "global_step": 115889, "epoch": 1396} {"train_loss": -22.379283905029297, "global_step": 115890, "epoch": 1396} {"train_loss": -22.084274291992188, "global_step": 115891, "epoch": 1396} {"train_loss": -22.855382919311523, "global_step": 115892, "epoch": 1396} {"train_loss": -21.972375869750977, "global_step": 115893, "epoch": 1396} {"train_loss": -22.450777053833008, "global_step": 115894, "epoch": 1396} {"train_loss": -22.306615829467773, "global_step": 115895, "epoch": 1396} {"train_loss": -22.056365966796875, "global_step": 115896, "epoch": 1396} {"train_loss": -21.962064743041992, "global_step": 115897, "epoch": 1396} {"train_loss": -22.69289207458496, "global_step": 115898, "epoch": 1396} {"train_loss": -22.30500030517578, "global_step": 115899, "epoch": 1396} {"train_loss": -22.461563110351562, "global_step": 115900, "epoch": 1396} {"train_loss": -22.186548233032227, "global_step": 115901, "epoch": 1396} {"train_loss": -22.128149032592773, "global_step": 115902, "epoch": 1396} {"train_loss": -22.520496368408203, "global_step": 115903, "epoch": 1396} {"train_loss": -22.64432716369629, "global_step": 115904, "epoch": 1396} {"train_loss": -22.662586212158203, "global_step": 115905, "epoch": 1396} {"train_loss": -22.21390724182129, "global_step": 115906, "epoch": 1396} {"train_loss": -22.762937545776367, "global_step": 115907, "epoch": 1396} {"train_loss": -22.178354263305664, "global_step": 115908, "epoch": 1396} {"train_loss": -22.467437744140625, "global_step": 115909, "epoch": 1396} {"train_loss": -22.321989059448242, "global_step": 115910, "epoch": 1396} {"train_loss": -22.481365203857422, "global_step": 115911, "epoch": 1396} {"train_loss": -22.754119873046875, "global_step": 115912, "epoch": 1396} {"train_loss": -22.595327377319336, "global_step": 115913, "epoch": 1396} {"train_loss": -22.61773681640625, "global_step": 115914, "epoch": 1396} {"train_loss": -22.578847885131836, "global_step": 115915, "epoch": 1396} {"train_loss": -22.448856353759766, "global_step": 115916, "epoch": 1396} {"train_loss": -22.662626266479492, "global_step": 115917, "epoch": 1396} {"train_loss": -22.578540802001953, "global_step": 115918, "epoch": 1396} {"train_loss": -22.390268325805664, "global_step": 115919, "epoch": 1396} {"train_loss": -22.392982482910156, "global_step": 115920, "epoch": 1396} {"train_loss": -22.51637840270996, "global_step": 115921, "epoch": 1396} {"train_loss": -22.400861740112305, "global_step": 115922, "epoch": 1396} {"train_loss": -22.198020935058594, "global_step": 115923, "epoch": 1396} {"train_loss": -22.385421752929688, "global_step": 115924, "epoch": 1396} {"train_loss": -22.48579216003418, "global_step": 115925, "epoch": 1396} {"train_loss": -22.493778228759766, "global_step": 115926, "epoch": 1396} {"train_loss": -22.017818450927734, "global_step": 115927, "epoch": 1396} {"train_loss": -22.611265182495117, "global_step": 115928, "epoch": 1396} {"train_loss": -22.41474723815918, "global_step": 115929, "epoch": 1396} {"train_loss": -22.5819091796875, "global_step": 115930, "epoch": 1396} {"train_loss": -22.61954689025879, "global_step": 115931, "epoch": 1396} {"train_loss": -22.65869903564453, "global_step": 115932, "epoch": 1396} {"train_loss": -21.95037269592285, "global_step": 115933, "epoch": 1396} {"train_loss": -22.354089736938477, "global_step": 115934, "epoch": 1396} {"train_loss": -22.259475708007812, "global_step": 115935, "epoch": 1396} {"train_loss": -22.221410751342773, "global_step": 115936, "epoch": 1396} {"train_loss": -22.834928512573242, "global_step": 115937, "epoch": 1396} {"train_loss": -22.42864418029785, "global_step": 115938, "epoch": 1396} {"train_loss": -22.487415313720703, "global_step": 115939, "epoch": 1396} {"train_loss": -22.787643432617188, "global_step": 115940, "epoch": 1396} {"train_loss": -22.368898391723633, "global_step": 115941, "epoch": 1396} {"train_loss": -22.529088973999023, "global_step": 115942, "epoch": 1396} {"train_loss": -22.45778465270996, "global_step": 115943, "epoch": 1396} {"train_loss": -22.552127838134766, "global_step": 115944, "epoch": 1396} {"train_loss": -22.492422103881836, "global_step": 115945, "epoch": 1396} {"train_loss": -22.573972702026367, "global_step": 115946, "epoch": 1396} {"train_loss": -22.397489547729492, "global_step": 115947, "epoch": 1396} {"train_loss": -22.148895263671875, "global_step": 115948, "epoch": 1396} {"train_loss": -22.1661434173584, "global_step": 115949, "epoch": 1396} {"train_loss": -22.407358858958784, "global_step": 115950, "epoch": 1396, "val_loss": 6267531.0} {"train_loss": -22.059898376464844, "global_step": 115951, "epoch": 1397} {"train_loss": -22.08188247680664, "global_step": 115952, "epoch": 1397} {"train_loss": -21.8586483001709, "global_step": 115953, "epoch": 1397} {"train_loss": -21.77852439880371, "global_step": 115954, "epoch": 1397} {"train_loss": -22.106351852416992, "global_step": 115955, "epoch": 1397} {"train_loss": -22.068689346313477, "global_step": 115956, "epoch": 1397} {"train_loss": -21.967863082885742, "global_step": 115957, "epoch": 1397} {"train_loss": -22.077688217163086, "global_step": 115958, "epoch": 1397} {"train_loss": -22.231307983398438, "global_step": 115959, "epoch": 1397} {"train_loss": -22.11464500427246, "global_step": 115960, "epoch": 1397} {"train_loss": -22.301244735717773, "global_step": 115961, "epoch": 1397} {"train_loss": -22.095914840698242, "global_step": 115962, "epoch": 1397} {"train_loss": -21.7994384765625, "global_step": 115963, "epoch": 1397} {"train_loss": -22.23158073425293, "global_step": 115964, "epoch": 1397} {"train_loss": -22.097946166992188, "global_step": 115965, "epoch": 1397} {"train_loss": -22.035173416137695, "global_step": 115966, "epoch": 1397} {"train_loss": -22.37087631225586, "global_step": 115967, "epoch": 1397} {"train_loss": -22.42305564880371, "global_step": 115968, "epoch": 1397} {"train_loss": -22.209030151367188, "global_step": 115969, "epoch": 1397} {"train_loss": -22.1032772064209, "global_step": 115970, "epoch": 1397} {"train_loss": -22.2216739654541, "global_step": 115971, "epoch": 1397} {"train_loss": -22.441967010498047, "global_step": 115972, "epoch": 1397} {"train_loss": -22.383481979370117, "global_step": 115973, "epoch": 1397} {"train_loss": -22.51399040222168, "global_step": 115974, "epoch": 1397} {"train_loss": -22.270145416259766, "global_step": 115975, "epoch": 1397} {"train_loss": -22.202835083007812, "global_step": 115976, "epoch": 1397} {"train_loss": -22.645599365234375, "global_step": 115977, "epoch": 1397} {"train_loss": -22.642126083374023, "global_step": 115978, "epoch": 1397} {"train_loss": -22.5500545501709, "global_step": 115979, "epoch": 1397} {"train_loss": -22.591981887817383, "global_step": 115980, "epoch": 1397} {"train_loss": -22.757543563842773, "global_step": 115981, "epoch": 1397} {"train_loss": -22.10321044921875, "global_step": 115982, "epoch": 1397} {"train_loss": -22.471288681030273, "global_step": 115983, "epoch": 1397} {"train_loss": -22.98601722717285, "global_step": 115984, "epoch": 1397} {"train_loss": -22.567214965820312, "global_step": 115985, "epoch": 1397} {"train_loss": -22.35536003112793, "global_step": 115986, "epoch": 1397} {"train_loss": -22.334388732910156, "global_step": 115987, "epoch": 1397} {"train_loss": -22.294803619384766, "global_step": 115988, "epoch": 1397} {"train_loss": -22.160400390625, "global_step": 115989, "epoch": 1397} {"train_loss": -22.380216598510742, "global_step": 115990, "epoch": 1397} {"train_loss": -22.233652114868164, "global_step": 115991, "epoch": 1397} {"train_loss": -22.255306243896484, "global_step": 115992, "epoch": 1397} {"train_loss": -22.276809692382812, "global_step": 115993, "epoch": 1397} {"train_loss": -22.629493713378906, "global_step": 115994, "epoch": 1397} {"train_loss": -22.563987731933594, "global_step": 115995, "epoch": 1397} {"train_loss": -22.376522064208984, "global_step": 115996, "epoch": 1397} {"train_loss": -22.712202072143555, "global_step": 115997, "epoch": 1397} {"train_loss": -22.113798141479492, "global_step": 115998, "epoch": 1397} {"train_loss": -22.58133888244629, "global_step": 115999, "epoch": 1397} {"train_loss": -22.57600212097168, "global_step": 116000, "epoch": 1397} {"train_loss": -22.430578231811523, "global_step": 116001, "epoch": 1397} {"train_loss": -22.56726837158203, "global_step": 116002, "epoch": 1397} {"train_loss": -22.350189208984375, "global_step": 116003, "epoch": 1397} {"train_loss": -22.682416915893555, "global_step": 116004, "epoch": 1397} {"train_loss": -22.687536239624023, "global_step": 116005, "epoch": 1397} {"train_loss": -22.524463653564453, "global_step": 116006, "epoch": 1397} {"train_loss": -22.78011131286621, "global_step": 116007, "epoch": 1397} {"train_loss": -22.870206832885742, "global_step": 116008, "epoch": 1397} {"train_loss": -22.448421478271484, "global_step": 116009, "epoch": 1397} {"train_loss": -22.24337387084961, "global_step": 116010, "epoch": 1397} {"train_loss": -22.595579147338867, "global_step": 116011, "epoch": 1397} {"train_loss": -22.68306541442871, "global_step": 116012, "epoch": 1397} {"train_loss": -22.348201751708984, "global_step": 116013, "epoch": 1397} {"train_loss": -22.441211700439453, "global_step": 116014, "epoch": 1397} {"train_loss": -22.68419647216797, "global_step": 116015, "epoch": 1397} {"train_loss": -22.688190460205078, "global_step": 116016, "epoch": 1397} {"train_loss": -22.277835845947266, "global_step": 116017, "epoch": 1397} {"train_loss": -22.709619522094727, "global_step": 116018, "epoch": 1397} {"train_loss": -22.28778076171875, "global_step": 116019, "epoch": 1397} {"train_loss": -22.346708297729492, "global_step": 116020, "epoch": 1397} {"train_loss": -22.620304107666016, "global_step": 116021, "epoch": 1397} {"train_loss": -22.582660675048828, "global_step": 116022, "epoch": 1397} {"train_loss": -22.413232803344727, "global_step": 116023, "epoch": 1397} {"train_loss": -22.32858657836914, "global_step": 116024, "epoch": 1397} {"train_loss": -22.260480880737305, "global_step": 116025, "epoch": 1397} {"train_loss": -22.140295028686523, "global_step": 116026, "epoch": 1397} {"train_loss": -22.47549819946289, "global_step": 116027, "epoch": 1397} {"train_loss": -22.3577880859375, "global_step": 116028, "epoch": 1397} {"train_loss": -22.21864891052246, "global_step": 116029, "epoch": 1397} {"train_loss": -22.421960830688477, "global_step": 116030, "epoch": 1397} {"train_loss": -22.3940372467041, "global_step": 116031, "epoch": 1397} {"train_loss": -22.286901473999023, "global_step": 116032, "epoch": 1397} {"train_loss": -22.372383186616094, "global_step": 116033, "epoch": 1397, "val_loss": 6196142.5} {"train_loss": -22.543609619140625, "global_step": 116034, "epoch": 1398} {"train_loss": -22.06342887878418, "global_step": 116035, "epoch": 1398} {"train_loss": -21.879037857055664, "global_step": 116036, "epoch": 1398} {"train_loss": -21.8363094329834, "global_step": 116037, "epoch": 1398} {"train_loss": -22.157129287719727, "global_step": 116038, "epoch": 1398} {"train_loss": -22.248716354370117, "global_step": 116039, "epoch": 1398} {"train_loss": -22.06129264831543, "global_step": 116040, "epoch": 1398} {"train_loss": -22.624326705932617, "global_step": 116041, "epoch": 1398} {"train_loss": -22.267454147338867, "global_step": 116042, "epoch": 1398} {"train_loss": -22.337846755981445, "global_step": 116043, "epoch": 1398} {"train_loss": -22.16850471496582, "global_step": 116044, "epoch": 1398} {"train_loss": -22.377546310424805, "global_step": 116045, "epoch": 1398} {"train_loss": -22.172155380249023, "global_step": 116046, "epoch": 1398} {"train_loss": -22.817556381225586, "global_step": 116047, "epoch": 1398} {"train_loss": -22.21084976196289, "global_step": 116048, "epoch": 1398} {"train_loss": -22.480939865112305, "global_step": 116049, "epoch": 1398} {"train_loss": -22.253646850585938, "global_step": 116050, "epoch": 1398} {"train_loss": -22.515369415283203, "global_step": 116051, "epoch": 1398} {"train_loss": -22.31540870666504, "global_step": 116052, "epoch": 1398} {"train_loss": -22.749013900756836, "global_step": 116053, "epoch": 1398} {"train_loss": -22.342885971069336, "global_step": 116054, "epoch": 1398} {"train_loss": -22.306421279907227, "global_step": 116055, "epoch": 1398} {"train_loss": -22.258756637573242, "global_step": 116056, "epoch": 1398} {"train_loss": -22.707271575927734, "global_step": 116057, "epoch": 1398} {"train_loss": -22.17481231689453, "global_step": 116058, "epoch": 1398} {"train_loss": -22.532407760620117, "global_step": 116059, "epoch": 1398} {"train_loss": -22.556333541870117, "global_step": 116060, "epoch": 1398} {"train_loss": -22.65692710876465, "global_step": 116061, "epoch": 1398} {"train_loss": -21.88148307800293, "global_step": 116062, "epoch": 1398} {"train_loss": -22.32440757751465, "global_step": 116063, "epoch": 1398} {"train_loss": -22.418699264526367, "global_step": 116064, "epoch": 1398} {"train_loss": -22.3658447265625, "global_step": 116065, "epoch": 1398} {"train_loss": -22.077016830444336, "global_step": 116066, "epoch": 1398} {"train_loss": -22.544452667236328, "global_step": 116067, "epoch": 1398} {"train_loss": -22.45704460144043, "global_step": 116068, "epoch": 1398} {"train_loss": -22.484081268310547, "global_step": 116069, "epoch": 1398} {"train_loss": -22.175735473632812, "global_step": 116070, "epoch": 1398} {"train_loss": -22.49979591369629, "global_step": 116071, "epoch": 1398} {"train_loss": -22.493560791015625, "global_step": 116072, "epoch": 1398} {"train_loss": -22.347902297973633, "global_step": 116073, "epoch": 1398} {"train_loss": -22.615020751953125, "global_step": 116074, "epoch": 1398} {"train_loss": -22.74832534790039, "global_step": 116075, "epoch": 1398} {"train_loss": -22.458160400390625, "global_step": 116076, "epoch": 1398} {"train_loss": -22.72492027282715, "global_step": 116077, "epoch": 1398} {"train_loss": -22.402860641479492, "global_step": 116078, "epoch": 1398} {"train_loss": -22.242843627929688, "global_step": 116079, "epoch": 1398} {"train_loss": -22.54156494140625, "global_step": 116080, "epoch": 1398} {"train_loss": -22.887365341186523, "global_step": 116081, "epoch": 1398} {"train_loss": -22.6187686920166, "global_step": 116082, "epoch": 1398} {"train_loss": -22.07710075378418, "global_step": 116083, "epoch": 1398} {"train_loss": -22.609039306640625, "global_step": 116084, "epoch": 1398} {"train_loss": -22.31842041015625, "global_step": 116085, "epoch": 1398} {"train_loss": -22.31597328186035, "global_step": 116086, "epoch": 1398} {"train_loss": -22.136688232421875, "global_step": 116087, "epoch": 1398} {"train_loss": -23.05365753173828, "global_step": 116088, "epoch": 1398} {"train_loss": -22.602426528930664, "global_step": 116089, "epoch": 1398} {"train_loss": -22.62129783630371, "global_step": 116090, "epoch": 1398} {"train_loss": -22.601537704467773, "global_step": 116091, "epoch": 1398} {"train_loss": -22.289899826049805, "global_step": 116092, "epoch": 1398} {"train_loss": -22.34801483154297, "global_step": 116093, "epoch": 1398} {"train_loss": -22.3914852142334, "global_step": 116094, "epoch": 1398} {"train_loss": -22.65041160583496, "global_step": 116095, "epoch": 1398} {"train_loss": -22.304336547851562, "global_step": 116096, "epoch": 1398} {"train_loss": -22.50516700744629, "global_step": 116097, "epoch": 1398} {"train_loss": -22.37431526184082, "global_step": 116098, "epoch": 1398} {"train_loss": -22.145639419555664, "global_step": 116099, "epoch": 1398} {"train_loss": -22.550338745117188, "global_step": 116100, "epoch": 1398} {"train_loss": -22.302600860595703, "global_step": 116101, "epoch": 1398} {"train_loss": -22.342893600463867, "global_step": 116102, "epoch": 1398} {"train_loss": -22.568260192871094, "global_step": 116103, "epoch": 1398} {"train_loss": -22.47579002380371, "global_step": 116104, "epoch": 1398} {"train_loss": -22.027620315551758, "global_step": 116105, "epoch": 1398} {"train_loss": -22.419652938842773, "global_step": 116106, "epoch": 1398} {"train_loss": -22.81892204284668, "global_step": 116107, "epoch": 1398} {"train_loss": -22.165067672729492, "global_step": 116108, "epoch": 1398} {"train_loss": -22.43938636779785, "global_step": 116109, "epoch": 1398} {"train_loss": -22.411701202392578, "global_step": 116110, "epoch": 1398} {"train_loss": -22.3560848236084, "global_step": 116111, "epoch": 1398} {"train_loss": -22.728307723999023, "global_step": 116112, "epoch": 1398} {"train_loss": -22.452634811401367, "global_step": 116113, "epoch": 1398} {"train_loss": -22.22670555114746, "global_step": 116114, "epoch": 1398} {"train_loss": -22.51787567138672, "global_step": 116115, "epoch": 1398} {"train_loss": -22.401483673647224, "global_step": 116116, "epoch": 1398, "val_loss": 6160849.0} {"train_loss": -22.21337890625, "global_step": 116117, "epoch": 1399} {"train_loss": -21.506223678588867, "global_step": 116118, "epoch": 1399} {"train_loss": -22.590017318725586, "global_step": 116119, "epoch": 1399} {"train_loss": -22.166929244995117, "global_step": 116120, "epoch": 1399} {"train_loss": -22.332664489746094, "global_step": 116121, "epoch": 1399} {"train_loss": -22.287839889526367, "global_step": 116122, "epoch": 1399} {"train_loss": -22.17726707458496, "global_step": 116123, "epoch": 1399} {"train_loss": -22.690332412719727, "global_step": 116124, "epoch": 1399} {"train_loss": -22.117935180664062, "global_step": 116125, "epoch": 1399} {"train_loss": -22.00107192993164, "global_step": 116126, "epoch": 1399} {"train_loss": -22.39483070373535, "global_step": 116127, "epoch": 1399} {"train_loss": -22.69477653503418, "global_step": 116128, "epoch": 1399} {"train_loss": -22.24495506286621, "global_step": 116129, "epoch": 1399} {"train_loss": -22.288583755493164, "global_step": 116130, "epoch": 1399} {"train_loss": -22.37325668334961, "global_step": 116131, "epoch": 1399} {"train_loss": -22.597280502319336, "global_step": 116132, "epoch": 1399} {"train_loss": -22.399677276611328, "global_step": 116133, "epoch": 1399} {"train_loss": -22.59678077697754, "global_step": 116134, "epoch": 1399} {"train_loss": -22.59939193725586, "global_step": 116135, "epoch": 1399} {"train_loss": -22.471179962158203, "global_step": 116136, "epoch": 1399} {"train_loss": -22.474084854125977, "global_step": 116137, "epoch": 1399} {"train_loss": -22.603681564331055, "global_step": 116138, "epoch": 1399} {"train_loss": -22.74837875366211, "global_step": 116139, "epoch": 1399} {"train_loss": -22.741140365600586, "global_step": 116140, "epoch": 1399} {"train_loss": -22.601886749267578, "global_step": 116141, "epoch": 1399} {"train_loss": -22.034446716308594, "global_step": 116142, "epoch": 1399} {"train_loss": -21.98577880859375, "global_step": 116143, "epoch": 1399} {"train_loss": -22.423877716064453, "global_step": 116144, "epoch": 1399} {"train_loss": -22.465145111083984, "global_step": 116145, "epoch": 1399} {"train_loss": -22.396289825439453, "global_step": 116146, "epoch": 1399} {"train_loss": -22.243886947631836, "global_step": 116147, "epoch": 1399} {"train_loss": -22.458791732788086, "global_step": 116148, "epoch": 1399} {"train_loss": -22.947025299072266, "global_step": 116149, "epoch": 1399} {"train_loss": -22.58511734008789, "global_step": 116150, "epoch": 1399} {"train_loss": -22.58751678466797, "global_step": 116151, "epoch": 1399} {"train_loss": -22.287250518798828, "global_step": 116152, "epoch": 1399} {"train_loss": -22.31263542175293, "global_step": 116153, "epoch": 1399} {"train_loss": -22.312789916992188, "global_step": 116154, "epoch": 1399} {"train_loss": -22.15907859802246, "global_step": 116155, "epoch": 1399} {"train_loss": -22.293264389038086, "global_step": 116156, "epoch": 1399} {"train_loss": -22.519983291625977, "global_step": 116157, "epoch": 1399} {"train_loss": -22.3322811126709, "global_step": 116158, "epoch": 1399} {"train_loss": -22.228605270385742, "global_step": 116159, "epoch": 1399} {"train_loss": -22.17152214050293, "global_step": 116160, "epoch": 1399} {"train_loss": -21.883045196533203, "global_step": 116161, "epoch": 1399} {"train_loss": -22.510812759399414, "global_step": 116162, "epoch": 1399} {"train_loss": -22.516210556030273, "global_step": 116163, "epoch": 1399} {"train_loss": -22.354368209838867, "global_step": 116164, "epoch": 1399} {"train_loss": -22.555339813232422, "global_step": 116165, "epoch": 1399} {"train_loss": -22.315916061401367, "global_step": 116166, "epoch": 1399} {"train_loss": -22.257848739624023, "global_step": 116167, "epoch": 1399} {"train_loss": -22.367883682250977, "global_step": 116168, "epoch": 1399} {"train_loss": -22.323623657226562, "global_step": 116169, "epoch": 1399} {"train_loss": -22.444419860839844, "global_step": 116170, "epoch": 1399} {"train_loss": -22.390140533447266, "global_step": 116171, "epoch": 1399} {"train_loss": -22.228635787963867, "global_step": 116172, "epoch": 1399} {"train_loss": -22.009763717651367, "global_step": 116173, "epoch": 1399} {"train_loss": -22.36030387878418, "global_step": 116174, "epoch": 1399} {"train_loss": -22.40313148498535, "global_step": 116175, "epoch": 1399} {"train_loss": -22.447904586791992, "global_step": 116176, "epoch": 1399} {"train_loss": -22.601877212524414, "global_step": 116177, "epoch": 1399} {"train_loss": -22.762651443481445, "global_step": 116178, "epoch": 1399} {"train_loss": -22.548768997192383, "global_step": 116179, "epoch": 1399} {"train_loss": -22.545276641845703, "global_step": 116180, "epoch": 1399} {"train_loss": -22.31270408630371, "global_step": 116181, "epoch": 1399} {"train_loss": -22.270294189453125, "global_step": 116182, "epoch": 1399} {"train_loss": -22.4849796295166, "global_step": 116183, "epoch": 1399} {"train_loss": -22.096572875976562, "global_step": 116184, "epoch": 1399} {"train_loss": -22.322010040283203, "global_step": 116185, "epoch": 1399} {"train_loss": -22.930335998535156, "global_step": 116186, "epoch": 1399} {"train_loss": -22.67938804626465, "global_step": 116187, "epoch": 1399} {"train_loss": -22.386381149291992, "global_step": 116188, "epoch": 1399} {"train_loss": -22.536611557006836, "global_step": 116189, "epoch": 1399} {"train_loss": -22.464033126831055, "global_step": 116190, "epoch": 1399} {"train_loss": -22.61187171936035, "global_step": 116191, "epoch": 1399} {"train_loss": -22.483118057250977, "global_step": 116192, "epoch": 1399} {"train_loss": -22.969318389892578, "global_step": 116193, "epoch": 1399} {"train_loss": -22.659482955932617, "global_step": 116194, "epoch": 1399} {"train_loss": -22.383922576904297, "global_step": 116195, "epoch": 1399} {"train_loss": -22.50905418395996, "global_step": 116196, "epoch": 1399} {"train_loss": -22.42738914489746, "global_step": 116197, "epoch": 1399} {"train_loss": -22.315725326538086, "global_step": 116198, "epoch": 1399} {"train_loss": -22.414746410875434, "global_step": 116199, "epoch": 1399, "val_loss": 6163805.0} {"train_loss": -21.730119705200195, "global_step": 116200, "epoch": 1400} {"train_loss": -22.32512855529785, "global_step": 116201, "epoch": 1400} {"train_loss": -22.02442169189453, "global_step": 116202, "epoch": 1400} {"train_loss": -21.598234176635742, "global_step": 116203, "epoch": 1400} {"train_loss": -22.183942794799805, "global_step": 116204, "epoch": 1400} {"train_loss": -21.546133041381836, "global_step": 116205, "epoch": 1400} {"train_loss": -21.756277084350586, "global_step": 116206, "epoch": 1400} {"train_loss": -21.733549118041992, "global_step": 116207, "epoch": 1400} {"train_loss": -22.15147590637207, "global_step": 116208, "epoch": 1400} {"train_loss": -22.215967178344727, "global_step": 116209, "epoch": 1400} {"train_loss": -22.5025634765625, "global_step": 116210, "epoch": 1400} {"train_loss": -22.291767120361328, "global_step": 116211, "epoch": 1400} {"train_loss": -22.267480850219727, "global_step": 116212, "epoch": 1400} {"train_loss": -22.012378692626953, "global_step": 116213, "epoch": 1400} {"train_loss": -22.0701847076416, "global_step": 116214, "epoch": 1400} {"train_loss": -22.367443084716797, "global_step": 116215, "epoch": 1400} {"train_loss": -21.990327835083008, "global_step": 116216, "epoch": 1400} {"train_loss": -22.46877670288086, "global_step": 116217, "epoch": 1400} {"train_loss": -22.155826568603516, "global_step": 116218, "epoch": 1400} {"train_loss": -22.148818969726562, "global_step": 116219, "epoch": 1400} {"train_loss": -21.61130714416504, "global_step": 116220, "epoch": 1400} {"train_loss": -22.68453025817871, "global_step": 116221, "epoch": 1400} {"train_loss": -22.184370040893555, "global_step": 116222, "epoch": 1400} {"train_loss": -22.251182556152344, "global_step": 116223, "epoch": 1400} {"train_loss": -22.122928619384766, "global_step": 116224, "epoch": 1400} {"train_loss": -22.51874351501465, "global_step": 116225, "epoch": 1400} {"train_loss": -22.818038940429688, "global_step": 116226, "epoch": 1400} {"train_loss": -22.345731735229492, "global_step": 116227, "epoch": 1400} {"train_loss": -22.09166717529297, "global_step": 116228, "epoch": 1400} {"train_loss": -22.410465240478516, "global_step": 116229, "epoch": 1400} {"train_loss": -22.37690544128418, "global_step": 116230, "epoch": 1400} {"train_loss": -22.40252113342285, "global_step": 116231, "epoch": 1400} {"train_loss": -22.529775619506836, "global_step": 116232, "epoch": 1400} {"train_loss": -22.357223510742188, "global_step": 116233, "epoch": 1400} {"train_loss": -22.42439079284668, "global_step": 116234, "epoch": 1400} {"train_loss": -22.73337745666504, "global_step": 116235, "epoch": 1400} {"train_loss": -22.784040451049805, "global_step": 116236, "epoch": 1400} {"train_loss": -22.474029541015625, "global_step": 116237, "epoch": 1400} {"train_loss": -22.497509002685547, "global_step": 116238, "epoch": 1400} {"train_loss": -22.48677635192871, "global_step": 116239, "epoch": 1400} {"train_loss": -21.92237091064453, "global_step": 116240, "epoch": 1400} {"train_loss": -22.182252883911133, "global_step": 116241, "epoch": 1400} {"train_loss": -22.306135177612305, "global_step": 116242, "epoch": 1400} {"train_loss": -22.422697067260742, "global_step": 116243, "epoch": 1400} {"train_loss": -22.442975997924805, "global_step": 116244, "epoch": 1400} {"train_loss": -22.5155029296875, "global_step": 116245, "epoch": 1400} {"train_loss": -22.000133514404297, "global_step": 116246, "epoch": 1400} {"train_loss": -22.216405868530273, "global_step": 116247, "epoch": 1400} {"train_loss": -22.110586166381836, "global_step": 116248, "epoch": 1400} {"train_loss": -22.254087448120117, "global_step": 116249, "epoch": 1400} {"train_loss": -22.418149948120117, "global_step": 116250, "epoch": 1400} {"train_loss": -22.239530563354492, "global_step": 116251, "epoch": 1400} {"train_loss": -22.070341110229492, "global_step": 116252, "epoch": 1400} {"train_loss": -22.50118064880371, "global_step": 116253, "epoch": 1400} {"train_loss": -22.470094680786133, "global_step": 116254, "epoch": 1400} {"train_loss": -22.359275817871094, "global_step": 116255, "epoch": 1400} {"train_loss": -22.384824752807617, "global_step": 116256, "epoch": 1400} {"train_loss": -22.103437423706055, "global_step": 116257, "epoch": 1400} {"train_loss": -22.308822631835938, "global_step": 116258, "epoch": 1400} {"train_loss": -22.45322608947754, "global_step": 116259, "epoch": 1400} {"train_loss": -22.268081665039062, "global_step": 116260, "epoch": 1400} {"train_loss": -22.175867080688477, "global_step": 116261, "epoch": 1400} {"train_loss": -22.23784637451172, "global_step": 116262, "epoch": 1400} {"train_loss": -22.113380432128906, "global_step": 116263, "epoch": 1400} {"train_loss": -22.345096588134766, "global_step": 116264, "epoch": 1400} {"train_loss": -22.522600173950195, "global_step": 116265, "epoch": 1400} {"train_loss": -22.457210540771484, "global_step": 116266, "epoch": 1400} {"train_loss": -22.195348739624023, "global_step": 116267, "epoch": 1400} {"train_loss": -22.103376388549805, "global_step": 116268, "epoch": 1400} {"train_loss": -22.2244815826416, "global_step": 116269, "epoch": 1400} {"train_loss": -22.13355827331543, "global_step": 116270, "epoch": 1400} {"train_loss": -22.443464279174805, "global_step": 116271, "epoch": 1400} {"train_loss": -22.397747039794922, "global_step": 116272, "epoch": 1400} {"train_loss": -22.29547119140625, "global_step": 116273, "epoch": 1400} {"train_loss": -22.228872299194336, "global_step": 116274, "epoch": 1400} {"train_loss": -22.751110076904297, "global_step": 116275, "epoch": 1400} {"train_loss": -22.57710838317871, "global_step": 116276, "epoch": 1400} {"train_loss": -22.601320266723633, "global_step": 116277, "epoch": 1400} {"train_loss": -22.13793182373047, "global_step": 116278, "epoch": 1400} {"train_loss": -22.511899948120117, "global_step": 116279, "epoch": 1400} {"train_loss": -22.295856475830078, "global_step": 116280, "epoch": 1400} {"train_loss": -22.6602725982666, "global_step": 116281, "epoch": 1400} {"train_loss": -22.274935550000293, "global_step": 116282, "epoch": 1400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6328569.0} {"train_loss": -21.191009521484375, "global_step": 116283, "epoch": 1401} {"train_loss": -21.83982276916504, "global_step": 116284, "epoch": 1401} {"train_loss": -21.471044540405273, "global_step": 116285, "epoch": 1401} {"train_loss": -21.83146858215332, "global_step": 116286, "epoch": 1401} {"train_loss": -21.50921058654785, "global_step": 116287, "epoch": 1401} {"train_loss": -21.67766571044922, "global_step": 116288, "epoch": 1401} {"train_loss": -22.0858211517334, "global_step": 116289, "epoch": 1401} {"train_loss": -21.9953556060791, "global_step": 116290, "epoch": 1401} {"train_loss": -22.292593002319336, "global_step": 116291, "epoch": 1401} {"train_loss": -21.857709884643555, "global_step": 116292, "epoch": 1401} {"train_loss": -21.999839782714844, "global_step": 116293, "epoch": 1401} {"train_loss": -21.931806564331055, "global_step": 116294, "epoch": 1401} {"train_loss": -21.76677894592285, "global_step": 116295, "epoch": 1401} {"train_loss": -21.96346092224121, "global_step": 116296, "epoch": 1401} {"train_loss": -21.912508010864258, "global_step": 116297, "epoch": 1401} {"train_loss": -21.966941833496094, "global_step": 116298, "epoch": 1401} {"train_loss": -22.16459846496582, "global_step": 116299, "epoch": 1401} {"train_loss": -22.098947525024414, "global_step": 116300, "epoch": 1401} {"train_loss": -22.027217864990234, "global_step": 116301, "epoch": 1401} {"train_loss": -21.691638946533203, "global_step": 116302, "epoch": 1401} {"train_loss": -22.200170516967773, "global_step": 116303, "epoch": 1401} {"train_loss": -22.447439193725586, "global_step": 116304, "epoch": 1401} {"train_loss": -22.23012924194336, "global_step": 116305, "epoch": 1401} {"train_loss": -22.20343017578125, "global_step": 116306, "epoch": 1401} {"train_loss": -22.287092208862305, "global_step": 116307, "epoch": 1401} {"train_loss": -22.657194137573242, "global_step": 116308, "epoch": 1401} {"train_loss": -22.162687301635742, "global_step": 116309, "epoch": 1401} {"train_loss": -22.472248077392578, "global_step": 116310, "epoch": 1401} {"train_loss": -22.422168731689453, "global_step": 116311, "epoch": 1401} {"train_loss": -22.611677169799805, "global_step": 116312, "epoch": 1401} {"train_loss": -22.220151901245117, "global_step": 116313, "epoch": 1401} {"train_loss": -22.5693359375, "global_step": 116314, "epoch": 1401} {"train_loss": -22.528934478759766, "global_step": 116315, "epoch": 1401} {"train_loss": -22.077957153320312, "global_step": 116316, "epoch": 1401} {"train_loss": -22.563400268554688, "global_step": 116317, "epoch": 1401} {"train_loss": -22.32986831665039, "global_step": 116318, "epoch": 1401} {"train_loss": -22.528425216674805, "global_step": 116319, "epoch": 1401} {"train_loss": -22.408578872680664, "global_step": 116320, "epoch": 1401} {"train_loss": -22.399118423461914, "global_step": 116321, "epoch": 1401} {"train_loss": -22.396387100219727, "global_step": 116322, "epoch": 1401} {"train_loss": -22.30918312072754, "global_step": 116323, "epoch": 1401} {"train_loss": -22.791778564453125, "global_step": 116324, "epoch": 1401} {"train_loss": -22.247257232666016, "global_step": 116325, "epoch": 1401} {"train_loss": -22.678096771240234, "global_step": 116326, "epoch": 1401} {"train_loss": -22.216495513916016, "global_step": 116327, "epoch": 1401} {"train_loss": -22.05924415588379, "global_step": 116328, "epoch": 1401} {"train_loss": -22.118139266967773, "global_step": 116329, "epoch": 1401} {"train_loss": -22.619991302490234, "global_step": 116330, "epoch": 1401} {"train_loss": -22.420751571655273, "global_step": 116331, "epoch": 1401} {"train_loss": -22.820722579956055, "global_step": 116332, "epoch": 1401} {"train_loss": -22.491622924804688, "global_step": 116333, "epoch": 1401} {"train_loss": -22.20050048828125, "global_step": 116334, "epoch": 1401} {"train_loss": -22.321517944335938, "global_step": 116335, "epoch": 1401} {"train_loss": -22.432842254638672, "global_step": 116336, "epoch": 1401} {"train_loss": -22.108678817749023, "global_step": 116337, "epoch": 1401} {"train_loss": -22.507017135620117, "global_step": 116338, "epoch": 1401} {"train_loss": -22.40240478515625, "global_step": 116339, "epoch": 1401} {"train_loss": -22.054874420166016, "global_step": 116340, "epoch": 1401} {"train_loss": -22.183303833007812, "global_step": 116341, "epoch": 1401} {"train_loss": -22.23505973815918, "global_step": 116342, "epoch": 1401} {"train_loss": -22.519800186157227, "global_step": 116343, "epoch": 1401} {"train_loss": -22.07868194580078, "global_step": 116344, "epoch": 1401} {"train_loss": -22.25830078125, "global_step": 116345, "epoch": 1401} {"train_loss": -22.010507583618164, "global_step": 116346, "epoch": 1401} {"train_loss": -22.48756980895996, "global_step": 116347, "epoch": 1401} {"train_loss": -22.142963409423828, "global_step": 116348, "epoch": 1401} {"train_loss": -22.12960433959961, "global_step": 116349, "epoch": 1401} {"train_loss": -22.328765869140625, "global_step": 116350, "epoch": 1401} {"train_loss": -22.573469161987305, "global_step": 116351, "epoch": 1401} {"train_loss": -22.087888717651367, "global_step": 116352, "epoch": 1401} {"train_loss": -22.47290802001953, "global_step": 116353, "epoch": 1401} {"train_loss": -22.30740737915039, "global_step": 116354, "epoch": 1401} {"train_loss": -22.588293075561523, "global_step": 116355, "epoch": 1401} {"train_loss": -22.5804443359375, "global_step": 116356, "epoch": 1401} {"train_loss": -22.029123306274414, "global_step": 116357, "epoch": 1401} {"train_loss": -22.65453338623047, "global_step": 116358, "epoch": 1401} {"train_loss": -22.250953674316406, "global_step": 116359, "epoch": 1401} {"train_loss": -22.62257194519043, "global_step": 116360, "epoch": 1401} {"train_loss": -22.477964401245117, "global_step": 116361, "epoch": 1401} {"train_loss": -22.54974365234375, "global_step": 116362, "epoch": 1401} {"train_loss": -22.061309814453125, "global_step": 116363, "epoch": 1401} {"train_loss": -22.082529067993164, "global_step": 116364, "epoch": 1401} {"train_loss": -22.246297284781214, "global_step": 116365, "epoch": 1401, "val_loss": 6243090.0} {"train_loss": -22.266050338745117, "global_step": 116366, "epoch": 1402} {"train_loss": -22.375656127929688, "global_step": 116367, "epoch": 1402} {"train_loss": -22.17875862121582, "global_step": 116368, "epoch": 1402} {"train_loss": -22.09246826171875, "global_step": 116369, "epoch": 1402} {"train_loss": -22.157819747924805, "global_step": 116370, "epoch": 1402} {"train_loss": -22.146135330200195, "global_step": 116371, "epoch": 1402} {"train_loss": -22.390830993652344, "global_step": 116372, "epoch": 1402} {"train_loss": -22.065828323364258, "global_step": 116373, "epoch": 1402} {"train_loss": -22.071592330932617, "global_step": 116374, "epoch": 1402} {"train_loss": -22.491418838500977, "global_step": 116375, "epoch": 1402} {"train_loss": -22.32881736755371, "global_step": 116376, "epoch": 1402} {"train_loss": -22.388992309570312, "global_step": 116377, "epoch": 1402} {"train_loss": -22.53860855102539, "global_step": 116378, "epoch": 1402} {"train_loss": -21.812007904052734, "global_step": 116379, "epoch": 1402} {"train_loss": -22.548553466796875, "global_step": 116380, "epoch": 1402} {"train_loss": -22.649799346923828, "global_step": 116381, "epoch": 1402} {"train_loss": -22.176782608032227, "global_step": 116382, "epoch": 1402} {"train_loss": -22.506437301635742, "global_step": 116383, "epoch": 1402} {"train_loss": -22.36728286743164, "global_step": 116384, "epoch": 1402} {"train_loss": -22.47732162475586, "global_step": 116385, "epoch": 1402} {"train_loss": -22.566831588745117, "global_step": 116386, "epoch": 1402} {"train_loss": -22.195817947387695, "global_step": 116387, "epoch": 1402} {"train_loss": -22.3558406829834, "global_step": 116388, "epoch": 1402} {"train_loss": -22.885942459106445, "global_step": 116389, "epoch": 1402} {"train_loss": -22.555707931518555, "global_step": 116390, "epoch": 1402} {"train_loss": -22.098281860351562, "global_step": 116391, "epoch": 1402} {"train_loss": -22.830095291137695, "global_step": 116392, "epoch": 1402} {"train_loss": -22.786544799804688, "global_step": 116393, "epoch": 1402} {"train_loss": -22.745779037475586, "global_step": 116394, "epoch": 1402} {"train_loss": -23.033666610717773, "global_step": 116395, "epoch": 1402} {"train_loss": -22.320547103881836, "global_step": 116396, "epoch": 1402} {"train_loss": -22.50217628479004, "global_step": 116397, "epoch": 1402} {"train_loss": -22.285037994384766, "global_step": 116398, "epoch": 1402} {"train_loss": -22.218765258789062, "global_step": 116399, "epoch": 1402} {"train_loss": -22.2838077545166, "global_step": 116400, "epoch": 1402} {"train_loss": -22.488218307495117, "global_step": 116401, "epoch": 1402} {"train_loss": -22.455896377563477, "global_step": 116402, "epoch": 1402} {"train_loss": -22.260385513305664, "global_step": 116403, "epoch": 1402} {"train_loss": -22.529277801513672, "global_step": 116404, "epoch": 1402} {"train_loss": -22.35125160217285, "global_step": 116405, "epoch": 1402} {"train_loss": -22.75912094116211, "global_step": 116406, "epoch": 1402} {"train_loss": -22.66226577758789, "global_step": 116407, "epoch": 1402} {"train_loss": -22.283109664916992, "global_step": 116408, "epoch": 1402} {"train_loss": -22.275068283081055, "global_step": 116409, "epoch": 1402} {"train_loss": -22.159574508666992, "global_step": 116410, "epoch": 1402} {"train_loss": -22.13019371032715, "global_step": 116411, "epoch": 1402} {"train_loss": -22.808643341064453, "global_step": 116412, "epoch": 1402} {"train_loss": -21.97487449645996, "global_step": 116413, "epoch": 1402} {"train_loss": -22.76296043395996, "global_step": 116414, "epoch": 1402} {"train_loss": -22.2576847076416, "global_step": 116415, "epoch": 1402} {"train_loss": -22.382200241088867, "global_step": 116416, "epoch": 1402} {"train_loss": -22.2740535736084, "global_step": 116417, "epoch": 1402} {"train_loss": -22.680418014526367, "global_step": 116418, "epoch": 1402} {"train_loss": -22.695606231689453, "global_step": 116419, "epoch": 1402} {"train_loss": -22.802522659301758, "global_step": 116420, "epoch": 1402} {"train_loss": -22.502832412719727, "global_step": 116421, "epoch": 1402} {"train_loss": -22.56599235534668, "global_step": 116422, "epoch": 1402} {"train_loss": -22.4239501953125, "global_step": 116423, "epoch": 1402} {"train_loss": -22.372713088989258, "global_step": 116424, "epoch": 1402} {"train_loss": -21.898029327392578, "global_step": 116425, "epoch": 1402} {"train_loss": -22.632400512695312, "global_step": 116426, "epoch": 1402} {"train_loss": -22.580486297607422, "global_step": 116427, "epoch": 1402} {"train_loss": -22.326231002807617, "global_step": 116428, "epoch": 1402} {"train_loss": -22.326862335205078, "global_step": 116429, "epoch": 1402} {"train_loss": -22.177717208862305, "global_step": 116430, "epoch": 1402} {"train_loss": -22.787872314453125, "global_step": 116431, "epoch": 1402} {"train_loss": -22.6163330078125, "global_step": 116432, "epoch": 1402} {"train_loss": -22.362096786499023, "global_step": 116433, "epoch": 1402} {"train_loss": -21.989622116088867, "global_step": 116434, "epoch": 1402} {"train_loss": -22.650760650634766, "global_step": 116435, "epoch": 1402} {"train_loss": -22.327896118164062, "global_step": 116436, "epoch": 1402} {"train_loss": -22.645904541015625, "global_step": 116437, "epoch": 1402} {"train_loss": -21.931676864624023, "global_step": 116438, "epoch": 1402} {"train_loss": -22.05533218383789, "global_step": 116439, "epoch": 1402} {"train_loss": -22.43208885192871, "global_step": 116440, "epoch": 1402} {"train_loss": -22.60658836364746, "global_step": 116441, "epoch": 1402} {"train_loss": -22.33791160583496, "global_step": 116442, "epoch": 1402} {"train_loss": -22.28949737548828, "global_step": 116443, "epoch": 1402} {"train_loss": -22.23661994934082, "global_step": 116444, "epoch": 1402} {"train_loss": -22.356082916259766, "global_step": 116445, "epoch": 1402} {"train_loss": -22.567914962768555, "global_step": 116446, "epoch": 1402} {"train_loss": -22.164731979370117, "global_step": 116447, "epoch": 1402} {"train_loss": -22.403558914919934, "global_step": 116448, "epoch": 1402, "val_loss": 6208282.0} {"train_loss": -21.736072540283203, "global_step": 116449, "epoch": 1403} {"train_loss": -21.74861717224121, "global_step": 116450, "epoch": 1403} {"train_loss": -21.702707290649414, "global_step": 116451, "epoch": 1403} {"train_loss": -21.986379623413086, "global_step": 116452, "epoch": 1403} {"train_loss": -21.928205490112305, "global_step": 116453, "epoch": 1403} {"train_loss": -21.835180282592773, "global_step": 116454, "epoch": 1403} {"train_loss": -22.16812515258789, "global_step": 116455, "epoch": 1403} {"train_loss": -21.8575439453125, "global_step": 116456, "epoch": 1403} {"train_loss": -22.03009796142578, "global_step": 116457, "epoch": 1403} {"train_loss": -22.24738883972168, "global_step": 116458, "epoch": 1403} {"train_loss": -22.37190818786621, "global_step": 116459, "epoch": 1403} {"train_loss": -22.049936294555664, "global_step": 116460, "epoch": 1403} {"train_loss": -21.98127555847168, "global_step": 116461, "epoch": 1403} {"train_loss": -21.82061195373535, "global_step": 116462, "epoch": 1403} {"train_loss": -21.746551513671875, "global_step": 116463, "epoch": 1403} {"train_loss": -22.14250373840332, "global_step": 116464, "epoch": 1403} {"train_loss": -22.330646514892578, "global_step": 116465, "epoch": 1403} {"train_loss": -22.251480102539062, "global_step": 116466, "epoch": 1403} {"train_loss": -22.15365982055664, "global_step": 116467, "epoch": 1403} {"train_loss": -22.226581573486328, "global_step": 116468, "epoch": 1403} {"train_loss": -22.43421745300293, "global_step": 116469, "epoch": 1403} {"train_loss": -22.356857299804688, "global_step": 116470, "epoch": 1403} {"train_loss": -22.095182418823242, "global_step": 116471, "epoch": 1403} {"train_loss": -22.477935791015625, "global_step": 116472, "epoch": 1403} {"train_loss": -22.3900089263916, "global_step": 116473, "epoch": 1403} {"train_loss": -22.464336395263672, "global_step": 116474, "epoch": 1403} {"train_loss": -22.371740341186523, "global_step": 116475, "epoch": 1403} {"train_loss": -22.339895248413086, "global_step": 116476, "epoch": 1403} {"train_loss": -22.585432052612305, "global_step": 116477, "epoch": 1403} {"train_loss": -22.352649688720703, "global_step": 116478, "epoch": 1403} {"train_loss": -22.654502868652344, "global_step": 116479, "epoch": 1403} {"train_loss": -22.34186363220215, "global_step": 116480, "epoch": 1403} {"train_loss": -22.410730361938477, "global_step": 116481, "epoch": 1403} {"train_loss": -22.399999618530273, "global_step": 116482, "epoch": 1403} {"train_loss": -22.195859909057617, "global_step": 116483, "epoch": 1403} {"train_loss": -22.35374641418457, "global_step": 116484, "epoch": 1403} {"train_loss": -22.53423309326172, "global_step": 116485, "epoch": 1403} {"train_loss": -22.409372329711914, "global_step": 116486, "epoch": 1403} {"train_loss": -22.20878028869629, "global_step": 116487, "epoch": 1403} {"train_loss": -22.135826110839844, "global_step": 116488, "epoch": 1403} {"train_loss": -22.15180778503418, "global_step": 116489, "epoch": 1403} {"train_loss": -22.45833396911621, "global_step": 116490, "epoch": 1403} {"train_loss": -22.479528427124023, "global_step": 116491, "epoch": 1403} {"train_loss": -22.781295776367188, "global_step": 116492, "epoch": 1403} {"train_loss": -22.901594161987305, "global_step": 116493, "epoch": 1403} {"train_loss": -22.271047592163086, "global_step": 116494, "epoch": 1403} {"train_loss": -22.632863998413086, "global_step": 116495, "epoch": 1403} {"train_loss": -22.748065948486328, "global_step": 116496, "epoch": 1403} {"train_loss": -22.502111434936523, "global_step": 116497, "epoch": 1403} {"train_loss": -22.298376083374023, "global_step": 116498, "epoch": 1403} {"train_loss": -22.47994041442871, "global_step": 116499, "epoch": 1403} {"train_loss": -22.158849716186523, "global_step": 116500, "epoch": 1403} {"train_loss": -22.611915588378906, "global_step": 116501, "epoch": 1403} {"train_loss": -22.56070899963379, "global_step": 116502, "epoch": 1403} {"train_loss": -22.505979537963867, "global_step": 116503, "epoch": 1403} {"train_loss": -22.294696807861328, "global_step": 116504, "epoch": 1403} {"train_loss": -22.48036766052246, "global_step": 116505, "epoch": 1403} {"train_loss": -22.69258689880371, "global_step": 116506, "epoch": 1403} {"train_loss": -22.363304138183594, "global_step": 116507, "epoch": 1403} {"train_loss": -21.959455490112305, "global_step": 116508, "epoch": 1403} {"train_loss": -22.483976364135742, "global_step": 116509, "epoch": 1403} {"train_loss": -22.39645767211914, "global_step": 116510, "epoch": 1403} {"train_loss": -22.263717651367188, "global_step": 116511, "epoch": 1403} {"train_loss": -22.536897659301758, "global_step": 116512, "epoch": 1403} {"train_loss": -22.524717330932617, "global_step": 116513, "epoch": 1403} {"train_loss": -22.53883171081543, "global_step": 116514, "epoch": 1403} {"train_loss": -22.545141220092773, "global_step": 116515, "epoch": 1403} {"train_loss": -22.277042388916016, "global_step": 116516, "epoch": 1403} {"train_loss": -22.121536254882812, "global_step": 116517, "epoch": 1403} {"train_loss": -22.831449508666992, "global_step": 116518, "epoch": 1403} {"train_loss": -22.252479553222656, "global_step": 116519, "epoch": 1403} {"train_loss": -22.56608772277832, "global_step": 116520, "epoch": 1403} {"train_loss": -22.597570419311523, "global_step": 116521, "epoch": 1403} {"train_loss": -22.042957305908203, "global_step": 116522, "epoch": 1403} {"train_loss": -22.50173568725586, "global_step": 116523, "epoch": 1403} {"train_loss": -22.30399513244629, "global_step": 116524, "epoch": 1403} {"train_loss": -22.771833419799805, "global_step": 116525, "epoch": 1403} {"train_loss": -22.473403930664062, "global_step": 116526, "epoch": 1403} {"train_loss": -22.544889450073242, "global_step": 116527, "epoch": 1403} {"train_loss": -22.3839111328125, "global_step": 116528, "epoch": 1403} {"train_loss": -22.681241989135742, "global_step": 116529, "epoch": 1403} {"train_loss": -22.427534103393555, "global_step": 116530, "epoch": 1403} {"train_loss": -22.332284421805877, "global_step": 116531, "epoch": 1403, "val_loss": 6156682.0} {"train_loss": -22.042692184448242, "global_step": 116532, "epoch": 1404} {"train_loss": -22.343948364257812, "global_step": 116533, "epoch": 1404} {"train_loss": -22.5057373046875, "global_step": 116534, "epoch": 1404} {"train_loss": -22.360464096069336, "global_step": 116535, "epoch": 1404} {"train_loss": -22.583356857299805, "global_step": 116536, "epoch": 1404} {"train_loss": -22.20649528503418, "global_step": 116537, "epoch": 1404} {"train_loss": -22.398263931274414, "global_step": 116538, "epoch": 1404} {"train_loss": -22.595478057861328, "global_step": 116539, "epoch": 1404} {"train_loss": -22.14361000061035, "global_step": 116540, "epoch": 1404} {"train_loss": -22.433908462524414, "global_step": 116541, "epoch": 1404} {"train_loss": -22.64154624938965, "global_step": 116542, "epoch": 1404} {"train_loss": -22.068906784057617, "global_step": 116543, "epoch": 1404} {"train_loss": -22.365686416625977, "global_step": 116544, "epoch": 1404} {"train_loss": -22.379682540893555, "global_step": 116545, "epoch": 1404} {"train_loss": -22.546049118041992, "global_step": 116546, "epoch": 1404} {"train_loss": -22.059419631958008, "global_step": 116547, "epoch": 1404} {"train_loss": -22.398603439331055, "global_step": 116548, "epoch": 1404} {"train_loss": -22.345966339111328, "global_step": 116549, "epoch": 1404} {"train_loss": -22.540388107299805, "global_step": 116550, "epoch": 1404} {"train_loss": -22.056272506713867, "global_step": 116551, "epoch": 1404} {"train_loss": -22.343841552734375, "global_step": 116552, "epoch": 1404} {"train_loss": -22.765626907348633, "global_step": 116553, "epoch": 1404} {"train_loss": -22.116933822631836, "global_step": 116554, "epoch": 1404} {"train_loss": -22.446365356445312, "global_step": 116555, "epoch": 1404} {"train_loss": -22.007549285888672, "global_step": 116556, "epoch": 1404} {"train_loss": -22.478591918945312, "global_step": 116557, "epoch": 1404} {"train_loss": -22.53167152404785, "global_step": 116558, "epoch": 1404} {"train_loss": -22.292905807495117, "global_step": 116559, "epoch": 1404} {"train_loss": -22.682422637939453, "global_step": 116560, "epoch": 1404} {"train_loss": -22.431182861328125, "global_step": 116561, "epoch": 1404} {"train_loss": -22.832460403442383, "global_step": 116562, "epoch": 1404} {"train_loss": -22.450408935546875, "global_step": 116563, "epoch": 1404} {"train_loss": -22.67051124572754, "global_step": 116564, "epoch": 1404} {"train_loss": -22.484272003173828, "global_step": 116565, "epoch": 1404} {"train_loss": -22.27439308166504, "global_step": 116566, "epoch": 1404} {"train_loss": -22.271453857421875, "global_step": 116567, "epoch": 1404} {"train_loss": -21.786178588867188, "global_step": 116568, "epoch": 1404} {"train_loss": -22.54927635192871, "global_step": 116569, "epoch": 1404} {"train_loss": -22.363269805908203, "global_step": 116570, "epoch": 1404} {"train_loss": -22.335058212280273, "global_step": 116571, "epoch": 1404} {"train_loss": -22.085763931274414, "global_step": 116572, "epoch": 1404} {"train_loss": -22.32318687438965, "global_step": 116573, "epoch": 1404} {"train_loss": -22.623153686523438, "global_step": 116574, "epoch": 1404} {"train_loss": -22.45002555847168, "global_step": 116575, "epoch": 1404} {"train_loss": -22.326454162597656, "global_step": 116576, "epoch": 1404} {"train_loss": -22.2805233001709, "global_step": 116577, "epoch": 1404} {"train_loss": -22.103479385375977, "global_step": 116578, "epoch": 1404} {"train_loss": -22.26613426208496, "global_step": 116579, "epoch": 1404} {"train_loss": -22.280567169189453, "global_step": 116580, "epoch": 1404} {"train_loss": -22.153501510620117, "global_step": 116581, "epoch": 1404} {"train_loss": -22.520559310913086, "global_step": 116582, "epoch": 1404} {"train_loss": -22.695425033569336, "global_step": 116583, "epoch": 1404} {"train_loss": -22.536558151245117, "global_step": 116584, "epoch": 1404} {"train_loss": -22.416452407836914, "global_step": 116585, "epoch": 1404} {"train_loss": -22.738676071166992, "global_step": 116586, "epoch": 1404} {"train_loss": -22.390283584594727, "global_step": 116587, "epoch": 1404} {"train_loss": -22.57639503479004, "global_step": 116588, "epoch": 1404} {"train_loss": -22.828584671020508, "global_step": 116589, "epoch": 1404} {"train_loss": -22.20289421081543, "global_step": 116590, "epoch": 1404} {"train_loss": -22.66034507751465, "global_step": 116591, "epoch": 1404} {"train_loss": -22.40680694580078, "global_step": 116592, "epoch": 1404} {"train_loss": -22.482818603515625, "global_step": 116593, "epoch": 1404} {"train_loss": -22.64894676208496, "global_step": 116594, "epoch": 1404} {"train_loss": -22.82373809814453, "global_step": 116595, "epoch": 1404} {"train_loss": -22.459239959716797, "global_step": 116596, "epoch": 1404} {"train_loss": -22.176809310913086, "global_step": 116597, "epoch": 1404} {"train_loss": -22.482181549072266, "global_step": 116598, "epoch": 1404} {"train_loss": -22.329425811767578, "global_step": 116599, "epoch": 1404} {"train_loss": -22.483976364135742, "global_step": 116600, "epoch": 1404} {"train_loss": -22.883771896362305, "global_step": 116601, "epoch": 1404} {"train_loss": -22.49072265625, "global_step": 116602, "epoch": 1404} {"train_loss": -22.387714385986328, "global_step": 116603, "epoch": 1404} {"train_loss": -22.11164665222168, "global_step": 116604, "epoch": 1404} {"train_loss": -22.404020309448242, "global_step": 116605, "epoch": 1404} {"train_loss": -22.845733642578125, "global_step": 116606, "epoch": 1404} {"train_loss": -22.292219161987305, "global_step": 116607, "epoch": 1404} {"train_loss": -22.085447311401367, "global_step": 116608, "epoch": 1404} {"train_loss": -22.356740951538086, "global_step": 116609, "epoch": 1404} {"train_loss": -22.833660125732422, "global_step": 116610, "epoch": 1404} {"train_loss": -22.410259246826172, "global_step": 116611, "epoch": 1404} {"train_loss": -22.648651123046875, "global_step": 116612, "epoch": 1404} {"train_loss": -22.129308700561523, "global_step": 116613, "epoch": 1404} {"train_loss": -22.426466194980115, "global_step": 116614, "epoch": 1404, "val_loss": 6204842.0} {"train_loss": -21.81181526184082, "global_step": 116615, "epoch": 1405} {"train_loss": -21.704790115356445, "global_step": 116616, "epoch": 1405} {"train_loss": -21.647336959838867, "global_step": 116617, "epoch": 1405} {"train_loss": -22.01970863342285, "global_step": 116618, "epoch": 1405} {"train_loss": -22.0387020111084, "global_step": 116619, "epoch": 1405} {"train_loss": -22.033056259155273, "global_step": 116620, "epoch": 1405} {"train_loss": -22.113880157470703, "global_step": 116621, "epoch": 1405} {"train_loss": -21.919416427612305, "global_step": 116622, "epoch": 1405} {"train_loss": -22.36417579650879, "global_step": 116623, "epoch": 1405} {"train_loss": -21.97305679321289, "global_step": 116624, "epoch": 1405} {"train_loss": -22.23818016052246, "global_step": 116625, "epoch": 1405} {"train_loss": -21.92957878112793, "global_step": 116626, "epoch": 1405} {"train_loss": -21.66571617126465, "global_step": 116627, "epoch": 1405} {"train_loss": -22.108182907104492, "global_step": 116628, "epoch": 1405} {"train_loss": -22.038631439208984, "global_step": 116629, "epoch": 1405} {"train_loss": -22.06727409362793, "global_step": 116630, "epoch": 1405} {"train_loss": -22.286787033081055, "global_step": 116631, "epoch": 1405} {"train_loss": -21.976926803588867, "global_step": 116632, "epoch": 1405} {"train_loss": -22.3510684967041, "global_step": 116633, "epoch": 1405} {"train_loss": -22.216896057128906, "global_step": 116634, "epoch": 1405} {"train_loss": -22.329063415527344, "global_step": 116635, "epoch": 1405} {"train_loss": -22.751407623291016, "global_step": 116636, "epoch": 1405} {"train_loss": -22.352596282958984, "global_step": 116637, "epoch": 1405} {"train_loss": -22.546247482299805, "global_step": 116638, "epoch": 1405} {"train_loss": -22.450273513793945, "global_step": 116639, "epoch": 1405} {"train_loss": -22.19306182861328, "global_step": 116640, "epoch": 1405} {"train_loss": -22.46232032775879, "global_step": 116641, "epoch": 1405} {"train_loss": -22.020483016967773, "global_step": 116642, "epoch": 1405} {"train_loss": -22.76688575744629, "global_step": 116643, "epoch": 1405} {"train_loss": -22.27123260498047, "global_step": 116644, "epoch": 1405} {"train_loss": -22.620792388916016, "global_step": 116645, "epoch": 1405} {"train_loss": -22.329833984375, "global_step": 116646, "epoch": 1405} {"train_loss": -22.094371795654297, "global_step": 116647, "epoch": 1405} {"train_loss": -22.6524715423584, "global_step": 116648, "epoch": 1405} {"train_loss": -22.823596954345703, "global_step": 116649, "epoch": 1405} {"train_loss": -22.434375762939453, "global_step": 116650, "epoch": 1405} {"train_loss": -22.42166519165039, "global_step": 116651, "epoch": 1405} {"train_loss": -22.2469482421875, "global_step": 116652, "epoch": 1405} {"train_loss": -22.25210952758789, "global_step": 116653, "epoch": 1405} {"train_loss": -22.701805114746094, "global_step": 116654, "epoch": 1405} {"train_loss": -22.349977493286133, "global_step": 116655, "epoch": 1405} {"train_loss": -22.639009475708008, "global_step": 116656, "epoch": 1405} {"train_loss": -22.458393096923828, "global_step": 116657, "epoch": 1405} {"train_loss": -22.41878318786621, "global_step": 116658, "epoch": 1405} {"train_loss": -22.603681564331055, "global_step": 116659, "epoch": 1405} {"train_loss": -22.435089111328125, "global_step": 116660, "epoch": 1405} {"train_loss": -22.38556480407715, "global_step": 116661, "epoch": 1405} {"train_loss": -22.457983016967773, "global_step": 116662, "epoch": 1405} {"train_loss": -22.21394157409668, "global_step": 116663, "epoch": 1405} {"train_loss": -22.5401611328125, "global_step": 116664, "epoch": 1405} {"train_loss": -22.38160514831543, "global_step": 116665, "epoch": 1405} {"train_loss": -22.45775032043457, "global_step": 116666, "epoch": 1405} {"train_loss": -22.3250789642334, "global_step": 116667, "epoch": 1405} {"train_loss": -22.35378074645996, "global_step": 116668, "epoch": 1405} {"train_loss": -22.67816162109375, "global_step": 116669, "epoch": 1405} {"train_loss": -22.866275787353516, "global_step": 116670, "epoch": 1405} {"train_loss": -22.34969711303711, "global_step": 116671, "epoch": 1405} {"train_loss": -22.636091232299805, "global_step": 116672, "epoch": 1405} {"train_loss": -22.463855743408203, "global_step": 116673, "epoch": 1405} {"train_loss": -22.67746353149414, "global_step": 116674, "epoch": 1405} {"train_loss": -22.295705795288086, "global_step": 116675, "epoch": 1405} {"train_loss": -22.421491622924805, "global_step": 116676, "epoch": 1405} {"train_loss": -22.360641479492188, "global_step": 116677, "epoch": 1405} {"train_loss": -22.411170959472656, "global_step": 116678, "epoch": 1405} {"train_loss": -22.151166915893555, "global_step": 116679, "epoch": 1405} {"train_loss": -22.21129608154297, "global_step": 116680, "epoch": 1405} {"train_loss": -22.561538696289062, "global_step": 116681, "epoch": 1405} {"train_loss": -22.726318359375, "global_step": 116682, "epoch": 1405} {"train_loss": -22.304668426513672, "global_step": 116683, "epoch": 1405} {"train_loss": -22.49407958984375, "global_step": 116684, "epoch": 1405} {"train_loss": -22.72884178161621, "global_step": 116685, "epoch": 1405} {"train_loss": -22.59696388244629, "global_step": 116686, "epoch": 1405} {"train_loss": -22.413877487182617, "global_step": 116687, "epoch": 1405} {"train_loss": -22.9605712890625, "global_step": 116688, "epoch": 1405} {"train_loss": -22.872024536132812, "global_step": 116689, "epoch": 1405} {"train_loss": -22.431161880493164, "global_step": 116690, "epoch": 1405} {"train_loss": -22.389554977416992, "global_step": 116691, "epoch": 1405} {"train_loss": -22.662616729736328, "global_step": 116692, "epoch": 1405} {"train_loss": -22.69251823425293, "global_step": 116693, "epoch": 1405} {"train_loss": -22.213308334350586, "global_step": 116694, "epoch": 1405} {"train_loss": -22.516923904418945, "global_step": 116695, "epoch": 1405} {"train_loss": -22.606897354125977, "global_step": 116696, "epoch": 1405} {"train_loss": -22.35916964979057, "global_step": 116697, "epoch": 1405, "val_loss": 6211948.0} {"train_loss": -22.41248893737793, "global_step": 116698, "epoch": 1406} {"train_loss": -22.222482681274414, "global_step": 116699, "epoch": 1406} {"train_loss": -22.558107376098633, "global_step": 116700, "epoch": 1406} {"train_loss": -22.072153091430664, "global_step": 116701, "epoch": 1406} {"train_loss": -22.628110885620117, "global_step": 116702, "epoch": 1406} {"train_loss": -21.974822998046875, "global_step": 116703, "epoch": 1406} {"train_loss": -22.391956329345703, "global_step": 116704, "epoch": 1406} {"train_loss": -22.07447624206543, "global_step": 116705, "epoch": 1406} {"train_loss": -22.00639533996582, "global_step": 116706, "epoch": 1406} {"train_loss": -22.817203521728516, "global_step": 116707, "epoch": 1406} {"train_loss": -22.246910095214844, "global_step": 116708, "epoch": 1406} {"train_loss": -22.202232360839844, "global_step": 116709, "epoch": 1406} {"train_loss": -22.2946834564209, "global_step": 116710, "epoch": 1406} {"train_loss": -22.347997665405273, "global_step": 116711, "epoch": 1406} {"train_loss": -22.48876953125, "global_step": 116712, "epoch": 1406} {"train_loss": -22.2005615234375, "global_step": 116713, "epoch": 1406} {"train_loss": -22.449716567993164, "global_step": 116714, "epoch": 1406} {"train_loss": -22.439428329467773, "global_step": 116715, "epoch": 1406} {"train_loss": -22.31800079345703, "global_step": 116716, "epoch": 1406} {"train_loss": -22.223745346069336, "global_step": 116717, "epoch": 1406} {"train_loss": -22.3341121673584, "global_step": 116718, "epoch": 1406} {"train_loss": -22.7215576171875, "global_step": 116719, "epoch": 1406} {"train_loss": -22.378625869750977, "global_step": 116720, "epoch": 1406} {"train_loss": -22.31392478942871, "global_step": 116721, "epoch": 1406} {"train_loss": -22.45578956604004, "global_step": 116722, "epoch": 1406} {"train_loss": -22.55355453491211, "global_step": 116723, "epoch": 1406} {"train_loss": -22.305822372436523, "global_step": 116724, "epoch": 1406} {"train_loss": -22.495729446411133, "global_step": 116725, "epoch": 1406} {"train_loss": -22.46282196044922, "global_step": 116726, "epoch": 1406} {"train_loss": -22.39187240600586, "global_step": 116727, "epoch": 1406} {"train_loss": -22.339704513549805, "global_step": 116728, "epoch": 1406} {"train_loss": -21.945100784301758, "global_step": 116729, "epoch": 1406} {"train_loss": -22.52826499938965, "global_step": 116730, "epoch": 1406} {"train_loss": -22.707538604736328, "global_step": 116731, "epoch": 1406} {"train_loss": -22.50181770324707, "global_step": 116732, "epoch": 1406} {"train_loss": -22.444503784179688, "global_step": 116733, "epoch": 1406} {"train_loss": -22.5429630279541, "global_step": 116734, "epoch": 1406} {"train_loss": -22.3560791015625, "global_step": 116735, "epoch": 1406} {"train_loss": -22.623136520385742, "global_step": 116736, "epoch": 1406} {"train_loss": -22.343856811523438, "global_step": 116737, "epoch": 1406} {"train_loss": -22.314483642578125, "global_step": 116738, "epoch": 1406} {"train_loss": -22.969919204711914, "global_step": 116739, "epoch": 1406} {"train_loss": -22.56061363220215, "global_step": 116740, "epoch": 1406} {"train_loss": -22.756742477416992, "global_step": 116741, "epoch": 1406} {"train_loss": -21.765661239624023, "global_step": 116742, "epoch": 1406} {"train_loss": -22.539396286010742, "global_step": 116743, "epoch": 1406} {"train_loss": -22.433218002319336, "global_step": 116744, "epoch": 1406} {"train_loss": -22.953826904296875, "global_step": 116745, "epoch": 1406} {"train_loss": -22.31537628173828, "global_step": 116746, "epoch": 1406} {"train_loss": -22.699752807617188, "global_step": 116747, "epoch": 1406} {"train_loss": -22.27073860168457, "global_step": 116748, "epoch": 1406} {"train_loss": -22.220230102539062, "global_step": 116749, "epoch": 1406} {"train_loss": -22.36263084411621, "global_step": 116750, "epoch": 1406} {"train_loss": -22.291715621948242, "global_step": 116751, "epoch": 1406} {"train_loss": -22.39242172241211, "global_step": 116752, "epoch": 1406} {"train_loss": -22.51409339904785, "global_step": 116753, "epoch": 1406} {"train_loss": -22.176374435424805, "global_step": 116754, "epoch": 1406} {"train_loss": -22.502639770507812, "global_step": 116755, "epoch": 1406} {"train_loss": -22.702985763549805, "global_step": 116756, "epoch": 1406} {"train_loss": -22.083356857299805, "global_step": 116757, "epoch": 1406} {"train_loss": -22.270597457885742, "global_step": 116758, "epoch": 1406} {"train_loss": -22.153120040893555, "global_step": 116759, "epoch": 1406} {"train_loss": -22.188201904296875, "global_step": 116760, "epoch": 1406} {"train_loss": -22.106351852416992, "global_step": 116761, "epoch": 1406} {"train_loss": -22.362043380737305, "global_step": 116762, "epoch": 1406} {"train_loss": -22.45490074157715, "global_step": 116763, "epoch": 1406} {"train_loss": -22.155075073242188, "global_step": 116764, "epoch": 1406} {"train_loss": -22.378948211669922, "global_step": 116765, "epoch": 1406} {"train_loss": -22.5264949798584, "global_step": 116766, "epoch": 1406} {"train_loss": -22.45680046081543, "global_step": 116767, "epoch": 1406} {"train_loss": -22.517061233520508, "global_step": 116768, "epoch": 1406} {"train_loss": -22.415000915527344, "global_step": 116769, "epoch": 1406} {"train_loss": -22.579442977905273, "global_step": 116770, "epoch": 1406} {"train_loss": -22.450422286987305, "global_step": 116771, "epoch": 1406} {"train_loss": -22.59087371826172, "global_step": 116772, "epoch": 1406} {"train_loss": -22.46540641784668, "global_step": 116773, "epoch": 1406} {"train_loss": -22.583343505859375, "global_step": 116774, "epoch": 1406} {"train_loss": -22.31851577758789, "global_step": 116775, "epoch": 1406} {"train_loss": -22.709993362426758, "global_step": 116776, "epoch": 1406} {"train_loss": -22.624073028564453, "global_step": 116777, "epoch": 1406} {"train_loss": -22.425867080688477, "global_step": 116778, "epoch": 1406} {"train_loss": -22.516029357910156, "global_step": 116779, "epoch": 1406} {"train_loss": -22.41649271493935, "global_step": 116780, "epoch": 1406, "val_loss": 6411342.0} {"train_loss": -20.709156036376953, "global_step": 116781, "epoch": 1407} {"train_loss": -21.80259132385254, "global_step": 116782, "epoch": 1407} {"train_loss": -21.348388671875, "global_step": 116783, "epoch": 1407} {"train_loss": -21.690946578979492, "global_step": 116784, "epoch": 1407} {"train_loss": -21.667726516723633, "global_step": 116785, "epoch": 1407} {"train_loss": -21.52984046936035, "global_step": 116786, "epoch": 1407} {"train_loss": -21.82107925415039, "global_step": 116787, "epoch": 1407} {"train_loss": -22.233129501342773, "global_step": 116788, "epoch": 1407} {"train_loss": -21.959218978881836, "global_step": 116789, "epoch": 1407} {"train_loss": -22.21209144592285, "global_step": 116790, "epoch": 1407} {"train_loss": -22.014585494995117, "global_step": 116791, "epoch": 1407} {"train_loss": -22.12777328491211, "global_step": 116792, "epoch": 1407} {"train_loss": -21.67758560180664, "global_step": 116793, "epoch": 1407} {"train_loss": -22.070310592651367, "global_step": 116794, "epoch": 1407} {"train_loss": -22.121810913085938, "global_step": 116795, "epoch": 1407} {"train_loss": -22.04397964477539, "global_step": 116796, "epoch": 1407} {"train_loss": -22.086923599243164, "global_step": 116797, "epoch": 1407} {"train_loss": -22.074987411499023, "global_step": 116798, "epoch": 1407} {"train_loss": -22.26074981689453, "global_step": 116799, "epoch": 1407} {"train_loss": -22.114553451538086, "global_step": 116800, "epoch": 1407} {"train_loss": -22.433088302612305, "global_step": 116801, "epoch": 1407} {"train_loss": -22.392271041870117, "global_step": 116802, "epoch": 1407} {"train_loss": -22.24161720275879, "global_step": 116803, "epoch": 1407} {"train_loss": -22.08306312561035, "global_step": 116804, "epoch": 1407} {"train_loss": -22.31574821472168, "global_step": 116805, "epoch": 1407} {"train_loss": -22.44788932800293, "global_step": 116806, "epoch": 1407} {"train_loss": -22.35472297668457, "global_step": 116807, "epoch": 1407} {"train_loss": -22.1263427734375, "global_step": 116808, "epoch": 1407} {"train_loss": -22.59375, "global_step": 116809, "epoch": 1407} {"train_loss": -22.390186309814453, "global_step": 116810, "epoch": 1407} {"train_loss": -22.54503059387207, "global_step": 116811, "epoch": 1407} {"train_loss": -22.168455123901367, "global_step": 116812, "epoch": 1407} {"train_loss": -22.361759185791016, "global_step": 116813, "epoch": 1407} {"train_loss": -22.376428604125977, "global_step": 116814, "epoch": 1407} {"train_loss": -22.218875885009766, "global_step": 116815, "epoch": 1407} {"train_loss": -22.145910263061523, "global_step": 116816, "epoch": 1407} {"train_loss": -22.3836727142334, "global_step": 116817, "epoch": 1407} {"train_loss": -22.556821823120117, "global_step": 116818, "epoch": 1407} {"train_loss": -22.501707077026367, "global_step": 116819, "epoch": 1407} {"train_loss": -22.25324249267578, "global_step": 116820, "epoch": 1407} {"train_loss": -22.153972625732422, "global_step": 116821, "epoch": 1407} {"train_loss": -22.5931396484375, "global_step": 116822, "epoch": 1407} {"train_loss": -22.35137939453125, "global_step": 116823, "epoch": 1407} {"train_loss": -22.164518356323242, "global_step": 116824, "epoch": 1407} {"train_loss": -22.222501754760742, "global_step": 116825, "epoch": 1407} {"train_loss": -22.46099853515625, "global_step": 116826, "epoch": 1407} {"train_loss": -22.08339500427246, "global_step": 116827, "epoch": 1407} {"train_loss": -22.34979820251465, "global_step": 116828, "epoch": 1407} {"train_loss": -22.09510612487793, "global_step": 116829, "epoch": 1407} {"train_loss": -21.822845458984375, "global_step": 116830, "epoch": 1407} {"train_loss": -22.36294937133789, "global_step": 116831, "epoch": 1407} {"train_loss": -22.527502059936523, "global_step": 116832, "epoch": 1407} {"train_loss": -22.576597213745117, "global_step": 116833, "epoch": 1407} {"train_loss": -22.044605255126953, "global_step": 116834, "epoch": 1407} {"train_loss": -22.221031188964844, "global_step": 116835, "epoch": 1407} {"train_loss": -22.340036392211914, "global_step": 116836, "epoch": 1407} {"train_loss": -22.35956382751465, "global_step": 116837, "epoch": 1407} {"train_loss": -22.2832088470459, "global_step": 116838, "epoch": 1407} {"train_loss": -22.7070255279541, "global_step": 116839, "epoch": 1407} {"train_loss": -22.581960678100586, "global_step": 116840, "epoch": 1407} {"train_loss": -22.481889724731445, "global_step": 116841, "epoch": 1407} {"train_loss": -22.512510299682617, "global_step": 116842, "epoch": 1407} {"train_loss": -22.36279296875, "global_step": 116843, "epoch": 1407} {"train_loss": -22.67665672302246, "global_step": 116844, "epoch": 1407} {"train_loss": -22.451156616210938, "global_step": 116845, "epoch": 1407} {"train_loss": -22.434057235717773, "global_step": 116846, "epoch": 1407} {"train_loss": -22.70777702331543, "global_step": 116847, "epoch": 1407} {"train_loss": -22.914052963256836, "global_step": 116848, "epoch": 1407} {"train_loss": -22.56110382080078, "global_step": 116849, "epoch": 1407} {"train_loss": -22.578338623046875, "global_step": 116850, "epoch": 1407} {"train_loss": -22.667116165161133, "global_step": 116851, "epoch": 1407} {"train_loss": -22.727243423461914, "global_step": 116852, "epoch": 1407} {"train_loss": -22.355154037475586, "global_step": 116853, "epoch": 1407} {"train_loss": -22.135530471801758, "global_step": 116854, "epoch": 1407} {"train_loss": -22.63648796081543, "global_step": 116855, "epoch": 1407} {"train_loss": -22.746047973632812, "global_step": 116856, "epoch": 1407} {"train_loss": -22.263792037963867, "global_step": 116857, "epoch": 1407} {"train_loss": -22.462100982666016, "global_step": 116858, "epoch": 1407} {"train_loss": -22.60304069519043, "global_step": 116859, "epoch": 1407} {"train_loss": -22.536588668823242, "global_step": 116860, "epoch": 1407} {"train_loss": -22.66868019104004, "global_step": 116861, "epoch": 1407} {"train_loss": -22.565488815307617, "global_step": 116862, "epoch": 1407} {"train_loss": -22.284732680722893, "global_step": 116863, "epoch": 1407, "val_loss": 6191018.5} {"train_loss": -21.93902587890625, "global_step": 116864, "epoch": 1408} {"train_loss": -22.344385147094727, "global_step": 116865, "epoch": 1408} {"train_loss": -22.08381462097168, "global_step": 116866, "epoch": 1408} {"train_loss": -22.015478134155273, "global_step": 116867, "epoch": 1408} {"train_loss": -22.048263549804688, "global_step": 116868, "epoch": 1408} {"train_loss": -21.81184959411621, "global_step": 116869, "epoch": 1408} {"train_loss": -22.00485610961914, "global_step": 116870, "epoch": 1408} {"train_loss": -22.477142333984375, "global_step": 116871, "epoch": 1408} {"train_loss": -22.517948150634766, "global_step": 116872, "epoch": 1408} {"train_loss": -22.226865768432617, "global_step": 116873, "epoch": 1408} {"train_loss": -22.334762573242188, "global_step": 116874, "epoch": 1408} {"train_loss": -22.125253677368164, "global_step": 116875, "epoch": 1408} {"train_loss": -22.291257858276367, "global_step": 116876, "epoch": 1408} {"train_loss": -22.12293815612793, "global_step": 116877, "epoch": 1408} {"train_loss": -22.196735382080078, "global_step": 116878, "epoch": 1408} {"train_loss": -22.47234344482422, "global_step": 116879, "epoch": 1408} {"train_loss": -22.05133056640625, "global_step": 116880, "epoch": 1408} {"train_loss": -22.55860710144043, "global_step": 116881, "epoch": 1408} {"train_loss": -22.33729362487793, "global_step": 116882, "epoch": 1408} {"train_loss": -22.72804832458496, "global_step": 116883, "epoch": 1408} {"train_loss": -22.560869216918945, "global_step": 116884, "epoch": 1408} {"train_loss": -22.336978912353516, "global_step": 116885, "epoch": 1408} {"train_loss": -22.749465942382812, "global_step": 116886, "epoch": 1408} {"train_loss": -22.16535758972168, "global_step": 116887, "epoch": 1408} {"train_loss": -22.749954223632812, "global_step": 116888, "epoch": 1408} {"train_loss": -22.55135154724121, "global_step": 116889, "epoch": 1408} {"train_loss": -22.23402976989746, "global_step": 116890, "epoch": 1408} {"train_loss": -22.564990997314453, "global_step": 116891, "epoch": 1408} {"train_loss": -22.66168785095215, "global_step": 116892, "epoch": 1408} {"train_loss": -22.25796890258789, "global_step": 116893, "epoch": 1408} {"train_loss": -22.669843673706055, "global_step": 116894, "epoch": 1408} {"train_loss": -22.39358901977539, "global_step": 116895, "epoch": 1408} {"train_loss": -21.978361129760742, "global_step": 116896, "epoch": 1408} {"train_loss": -22.296140670776367, "global_step": 116897, "epoch": 1408} {"train_loss": -22.583995819091797, "global_step": 116898, "epoch": 1408} {"train_loss": -22.269702911376953, "global_step": 116899, "epoch": 1408} {"train_loss": -22.7022647857666, "global_step": 116900, "epoch": 1408} {"train_loss": -22.489551544189453, "global_step": 116901, "epoch": 1408} {"train_loss": -22.849702835083008, "global_step": 116902, "epoch": 1408} {"train_loss": -22.805702209472656, "global_step": 116903, "epoch": 1408} {"train_loss": -22.26388168334961, "global_step": 116904, "epoch": 1408} {"train_loss": -22.60409164428711, "global_step": 116905, "epoch": 1408} {"train_loss": -22.58493995666504, "global_step": 116906, "epoch": 1408} {"train_loss": -22.280990600585938, "global_step": 116907, "epoch": 1408} {"train_loss": -22.495452880859375, "global_step": 116908, "epoch": 1408} {"train_loss": -22.418228149414062, "global_step": 116909, "epoch": 1408} {"train_loss": -22.581586837768555, "global_step": 116910, "epoch": 1408} {"train_loss": -22.34482765197754, "global_step": 116911, "epoch": 1408} {"train_loss": -22.660491943359375, "global_step": 116912, "epoch": 1408} {"train_loss": -22.517786026000977, "global_step": 116913, "epoch": 1408} {"train_loss": -22.53631019592285, "global_step": 116914, "epoch": 1408} {"train_loss": -22.060394287109375, "global_step": 116915, "epoch": 1408} {"train_loss": -22.446653366088867, "global_step": 116916, "epoch": 1408} {"train_loss": -22.427509307861328, "global_step": 116917, "epoch": 1408} {"train_loss": -22.297657012939453, "global_step": 116918, "epoch": 1408} {"train_loss": -22.722970962524414, "global_step": 116919, "epoch": 1408} {"train_loss": -22.505273818969727, "global_step": 116920, "epoch": 1408} {"train_loss": -22.4449405670166, "global_step": 116921, "epoch": 1408} {"train_loss": -22.00275993347168, "global_step": 116922, "epoch": 1408} {"train_loss": -22.470563888549805, "global_step": 116923, "epoch": 1408} {"train_loss": -22.165630340576172, "global_step": 116924, "epoch": 1408} {"train_loss": -22.14253044128418, "global_step": 116925, "epoch": 1408} {"train_loss": -22.513620376586914, "global_step": 116926, "epoch": 1408} {"train_loss": -22.40595817565918, "global_step": 116927, "epoch": 1408} {"train_loss": -22.50836753845215, "global_step": 116928, "epoch": 1408} {"train_loss": -22.314008712768555, "global_step": 116929, "epoch": 1408} {"train_loss": -22.39569091796875, "global_step": 116930, "epoch": 1408} {"train_loss": -22.54969024658203, "global_step": 116931, "epoch": 1408} {"train_loss": -22.456790924072266, "global_step": 116932, "epoch": 1408} {"train_loss": -22.49504852294922, "global_step": 116933, "epoch": 1408} {"train_loss": -22.31537628173828, "global_step": 116934, "epoch": 1408} {"train_loss": -22.383209228515625, "global_step": 116935, "epoch": 1408} {"train_loss": -22.687618255615234, "global_step": 116936, "epoch": 1408} {"train_loss": -22.46092987060547, "global_step": 116937, "epoch": 1408} {"train_loss": -22.475849151611328, "global_step": 116938, "epoch": 1408} {"train_loss": -22.455604553222656, "global_step": 116939, "epoch": 1408} {"train_loss": -22.672897338867188, "global_step": 116940, "epoch": 1408} {"train_loss": -22.51567840576172, "global_step": 116941, "epoch": 1408} {"train_loss": -22.410776138305664, "global_step": 116942, "epoch": 1408} {"train_loss": -22.720014572143555, "global_step": 116943, "epoch": 1408} {"train_loss": -22.580305099487305, "global_step": 116944, "epoch": 1408} {"train_loss": -22.406919479370117, "global_step": 116945, "epoch": 1408} {"train_loss": -22.401244014142506, "global_step": 116946, "epoch": 1408, "val_loss": 6102962.5} {"train_loss": -20.974254608154297, "global_step": 116947, "epoch": 1409} {"train_loss": -21.448745727539062, "global_step": 116948, "epoch": 1409} {"train_loss": -21.825162887573242, "global_step": 116949, "epoch": 1409} {"train_loss": -22.085128784179688, "global_step": 116950, "epoch": 1409} {"train_loss": -22.019948959350586, "global_step": 116951, "epoch": 1409} {"train_loss": -22.02947998046875, "global_step": 116952, "epoch": 1409} {"train_loss": -22.376367568969727, "global_step": 116953, "epoch": 1409} {"train_loss": -21.64275550842285, "global_step": 116954, "epoch": 1409} {"train_loss": -22.2355899810791, "global_step": 116955, "epoch": 1409} {"train_loss": -22.154829025268555, "global_step": 116956, "epoch": 1409} {"train_loss": -22.0885009765625, "global_step": 116957, "epoch": 1409} {"train_loss": -22.102924346923828, "global_step": 116958, "epoch": 1409} {"train_loss": -21.849645614624023, "global_step": 116959, "epoch": 1409} {"train_loss": -21.992040634155273, "global_step": 116960, "epoch": 1409} {"train_loss": -22.443140029907227, "global_step": 116961, "epoch": 1409} {"train_loss": -22.381362915039062, "global_step": 116962, "epoch": 1409} {"train_loss": -22.510478973388672, "global_step": 116963, "epoch": 1409} {"train_loss": -22.26302146911621, "global_step": 116964, "epoch": 1409} {"train_loss": -22.01032829284668, "global_step": 116965, "epoch": 1409} {"train_loss": -22.393295288085938, "global_step": 116966, "epoch": 1409} {"train_loss": -22.413223266601562, "global_step": 116967, "epoch": 1409} {"train_loss": -22.5069580078125, "global_step": 116968, "epoch": 1409} {"train_loss": -21.73396873474121, "global_step": 116969, "epoch": 1409} {"train_loss": -22.670766830444336, "global_step": 116970, "epoch": 1409} {"train_loss": -22.48004150390625, "global_step": 116971, "epoch": 1409} {"train_loss": -22.25200080871582, "global_step": 116972, "epoch": 1409} {"train_loss": -22.193471908569336, "global_step": 116973, "epoch": 1409} {"train_loss": -22.41416358947754, "global_step": 116974, "epoch": 1409} {"train_loss": -22.471820831298828, "global_step": 116975, "epoch": 1409} {"train_loss": -22.262231826782227, "global_step": 116976, "epoch": 1409} {"train_loss": -22.27663230895996, "global_step": 116977, "epoch": 1409} {"train_loss": -22.27311134338379, "global_step": 116978, "epoch": 1409} {"train_loss": -22.477434158325195, "global_step": 116979, "epoch": 1409} {"train_loss": -22.35123062133789, "global_step": 116980, "epoch": 1409} {"train_loss": -22.040800094604492, "global_step": 116981, "epoch": 1409} {"train_loss": -22.189512252807617, "global_step": 116982, "epoch": 1409} {"train_loss": -22.490201950073242, "global_step": 116983, "epoch": 1409} {"train_loss": -22.43737030029297, "global_step": 116984, "epoch": 1409} {"train_loss": -22.269607543945312, "global_step": 116985, "epoch": 1409} {"train_loss": -22.363632202148438, "global_step": 116986, "epoch": 1409} {"train_loss": -22.432674407958984, "global_step": 116987, "epoch": 1409} {"train_loss": -22.755857467651367, "global_step": 116988, "epoch": 1409} {"train_loss": -22.253387451171875, "global_step": 116989, "epoch": 1409} {"train_loss": -22.489282608032227, "global_step": 116990, "epoch": 1409} {"train_loss": -22.433147430419922, "global_step": 116991, "epoch": 1409} {"train_loss": -22.790695190429688, "global_step": 116992, "epoch": 1409} {"train_loss": -22.515460968017578, "global_step": 116993, "epoch": 1409} {"train_loss": -22.68460464477539, "global_step": 116994, "epoch": 1409} {"train_loss": -22.055522918701172, "global_step": 116995, "epoch": 1409} {"train_loss": -21.81172752380371, "global_step": 116996, "epoch": 1409} {"train_loss": -22.36517333984375, "global_step": 116997, "epoch": 1409} {"train_loss": -22.746734619140625, "global_step": 116998, "epoch": 1409} {"train_loss": -22.380836486816406, "global_step": 116999, "epoch": 1409} {"train_loss": -22.12016487121582, "global_step": 117000, "epoch": 1409} {"train_loss": -22.563268661499023, "global_step": 117001, "epoch": 1409} {"train_loss": -21.98727798461914, "global_step": 117002, "epoch": 1409} {"train_loss": -22.47750473022461, "global_step": 117003, "epoch": 1409} {"train_loss": -22.95686149597168, "global_step": 117004, "epoch": 1409} {"train_loss": -22.76497459411621, "global_step": 117005, "epoch": 1409} {"train_loss": -22.648054122924805, "global_step": 117006, "epoch": 1409} {"train_loss": -22.44244956970215, "global_step": 117007, "epoch": 1409} {"train_loss": -22.508182525634766, "global_step": 117008, "epoch": 1409} {"train_loss": -22.65655517578125, "global_step": 117009, "epoch": 1409} {"train_loss": -22.667301177978516, "global_step": 117010, "epoch": 1409} {"train_loss": -22.151107788085938, "global_step": 117011, "epoch": 1409} {"train_loss": -22.099395751953125, "global_step": 117012, "epoch": 1409} {"train_loss": -22.994232177734375, "global_step": 117013, "epoch": 1409} {"train_loss": -22.961002349853516, "global_step": 117014, "epoch": 1409} {"train_loss": -22.261154174804688, "global_step": 117015, "epoch": 1409} {"train_loss": -22.55870819091797, "global_step": 117016, "epoch": 1409} {"train_loss": -22.69603157043457, "global_step": 117017, "epoch": 1409} {"train_loss": -22.52132225036621, "global_step": 117018, "epoch": 1409} {"train_loss": -22.839033126831055, "global_step": 117019, "epoch": 1409} {"train_loss": -22.21539306640625, "global_step": 117020, "epoch": 1409} {"train_loss": -22.54128074645996, "global_step": 117021, "epoch": 1409} {"train_loss": -22.949010848999023, "global_step": 117022, "epoch": 1409} {"train_loss": -22.464618682861328, "global_step": 117023, "epoch": 1409} {"train_loss": -22.558425903320312, "global_step": 117024, "epoch": 1409} {"train_loss": -22.783313751220703, "global_step": 117025, "epoch": 1409} {"train_loss": -22.98095703125, "global_step": 117026, "epoch": 1409} {"train_loss": -22.228652954101562, "global_step": 117027, "epoch": 1409} {"train_loss": -22.0922908782959, "global_step": 117028, "epoch": 1409} {"train_loss": -22.343073350837432, "global_step": 117029, "epoch": 1409, "val_loss": 6154724.0} {"train_loss": -21.657331466674805, "global_step": 117030, "epoch": 1410} {"train_loss": -20.998458862304688, "global_step": 117031, "epoch": 1410} {"train_loss": -21.48931121826172, "global_step": 117032, "epoch": 1410} {"train_loss": -21.671781539916992, "global_step": 117033, "epoch": 1410} {"train_loss": -21.57493019104004, "global_step": 117034, "epoch": 1410} {"train_loss": -21.529102325439453, "global_step": 117035, "epoch": 1410} {"train_loss": -21.865644454956055, "global_step": 117036, "epoch": 1410} {"train_loss": -22.141172409057617, "global_step": 117037, "epoch": 1410} {"train_loss": -21.905227661132812, "global_step": 117038, "epoch": 1410} {"train_loss": -21.937711715698242, "global_step": 117039, "epoch": 1410} {"train_loss": -21.88044548034668, "global_step": 117040, "epoch": 1410} {"train_loss": -21.841665267944336, "global_step": 117041, "epoch": 1410} {"train_loss": -22.08064079284668, "global_step": 117042, "epoch": 1410} {"train_loss": -21.837430953979492, "global_step": 117043, "epoch": 1410} {"train_loss": -21.80150032043457, "global_step": 117044, "epoch": 1410} {"train_loss": -22.179113388061523, "global_step": 117045, "epoch": 1410} {"train_loss": -21.830108642578125, "global_step": 117046, "epoch": 1410} {"train_loss": -21.88974952697754, "global_step": 117047, "epoch": 1410} {"train_loss": -22.317386627197266, "global_step": 117048, "epoch": 1410} {"train_loss": -21.92303466796875, "global_step": 117049, "epoch": 1410} {"train_loss": -22.39534568786621, "global_step": 117050, "epoch": 1410} {"train_loss": -22.199201583862305, "global_step": 117051, "epoch": 1410} {"train_loss": -22.365293502807617, "global_step": 117052, "epoch": 1410} {"train_loss": -22.571874618530273, "global_step": 117053, "epoch": 1410} {"train_loss": -22.2325496673584, "global_step": 117054, "epoch": 1410} {"train_loss": -21.982263565063477, "global_step": 117055, "epoch": 1410} {"train_loss": -21.728403091430664, "global_step": 117056, "epoch": 1410} {"train_loss": -22.25555992126465, "global_step": 117057, "epoch": 1410} {"train_loss": -22.470815658569336, "global_step": 117058, "epoch": 1410} {"train_loss": -22.231462478637695, "global_step": 117059, "epoch": 1410} {"train_loss": -22.363676071166992, "global_step": 117060, "epoch": 1410} {"train_loss": -22.122060775756836, "global_step": 117061, "epoch": 1410} {"train_loss": -22.769582748413086, "global_step": 117062, "epoch": 1410} {"train_loss": -22.40296745300293, "global_step": 117063, "epoch": 1410} {"train_loss": -22.273874282836914, "global_step": 117064, "epoch": 1410} {"train_loss": -22.510534286499023, "global_step": 117065, "epoch": 1410} {"train_loss": -22.2701358795166, "global_step": 117066, "epoch": 1410} {"train_loss": -22.46512794494629, "global_step": 117067, "epoch": 1410} {"train_loss": -22.642623901367188, "global_step": 117068, "epoch": 1410} {"train_loss": -22.49597930908203, "global_step": 117069, "epoch": 1410} {"train_loss": -22.651260375976562, "global_step": 117070, "epoch": 1410} {"train_loss": -22.74321937561035, "global_step": 117071, "epoch": 1410} {"train_loss": -22.780057907104492, "global_step": 117072, "epoch": 1410} {"train_loss": -22.69839096069336, "global_step": 117073, "epoch": 1410} {"train_loss": -22.404020309448242, "global_step": 117074, "epoch": 1410} {"train_loss": -22.347305297851562, "global_step": 117075, "epoch": 1410} {"train_loss": -22.350011825561523, "global_step": 117076, "epoch": 1410} {"train_loss": -22.323251724243164, "global_step": 117077, "epoch": 1410} {"train_loss": -22.27533721923828, "global_step": 117078, "epoch": 1410} {"train_loss": -22.773767471313477, "global_step": 117079, "epoch": 1410} {"train_loss": -22.73320960998535, "global_step": 117080, "epoch": 1410} {"train_loss": -22.485349655151367, "global_step": 117081, "epoch": 1410} {"train_loss": -22.371946334838867, "global_step": 117082, "epoch": 1410} {"train_loss": -22.51190185546875, "global_step": 117083, "epoch": 1410} {"train_loss": -22.565824508666992, "global_step": 117084, "epoch": 1410} {"train_loss": -22.24408531188965, "global_step": 117085, "epoch": 1410} {"train_loss": -22.275571823120117, "global_step": 117086, "epoch": 1410} {"train_loss": -22.4669132232666, "global_step": 117087, "epoch": 1410} {"train_loss": -22.159650802612305, "global_step": 117088, "epoch": 1410} {"train_loss": -22.51988983154297, "global_step": 117089, "epoch": 1410} {"train_loss": -22.746078491210938, "global_step": 117090, "epoch": 1410} {"train_loss": -22.720657348632812, "global_step": 117091, "epoch": 1410} {"train_loss": -22.474838256835938, "global_step": 117092, "epoch": 1410} {"train_loss": -22.355571746826172, "global_step": 117093, "epoch": 1410} {"train_loss": -22.383466720581055, "global_step": 117094, "epoch": 1410} {"train_loss": -22.1956729888916, "global_step": 117095, "epoch": 1410} {"train_loss": -22.787023544311523, "global_step": 117096, "epoch": 1410} {"train_loss": -22.220335006713867, "global_step": 117097, "epoch": 1410} {"train_loss": -22.55482292175293, "global_step": 117098, "epoch": 1410} {"train_loss": -22.678476333618164, "global_step": 117099, "epoch": 1410} {"train_loss": -22.845462799072266, "global_step": 117100, "epoch": 1410} {"train_loss": -22.663143157958984, "global_step": 117101, "epoch": 1410} {"train_loss": -22.822330474853516, "global_step": 117102, "epoch": 1410} {"train_loss": -22.471220016479492, "global_step": 117103, "epoch": 1410} {"train_loss": -22.506330490112305, "global_step": 117104, "epoch": 1410} {"train_loss": -22.15398406982422, "global_step": 117105, "epoch": 1410} {"train_loss": -22.304574966430664, "global_step": 117106, "epoch": 1410} {"train_loss": -22.500263214111328, "global_step": 117107, "epoch": 1410} {"train_loss": -22.481660842895508, "global_step": 117108, "epoch": 1410} {"train_loss": -22.872234344482422, "global_step": 117109, "epoch": 1410} {"train_loss": -22.178024291992188, "global_step": 117110, "epoch": 1410} {"train_loss": -21.829395294189453, "global_step": 117111, "epoch": 1410} {"train_loss": -22.28311166418604, "global_step": 117112, "epoch": 1410, "val_loss": 6255679.0} {"train_loss": -21.736108779907227, "global_step": 117113, "epoch": 1411} {"train_loss": -21.214141845703125, "global_step": 117114, "epoch": 1411} {"train_loss": -21.690387725830078, "global_step": 117115, "epoch": 1411} {"train_loss": -21.710712432861328, "global_step": 117116, "epoch": 1411} {"train_loss": -21.656713485717773, "global_step": 117117, "epoch": 1411} {"train_loss": -21.846717834472656, "global_step": 117118, "epoch": 1411} {"train_loss": -21.74308204650879, "global_step": 117119, "epoch": 1411} {"train_loss": -21.911401748657227, "global_step": 117120, "epoch": 1411} {"train_loss": -22.398300170898438, "global_step": 117121, "epoch": 1411} {"train_loss": -21.952800750732422, "global_step": 117122, "epoch": 1411} {"train_loss": -22.12262535095215, "global_step": 117123, "epoch": 1411} {"train_loss": -22.418325424194336, "global_step": 117124, "epoch": 1411} {"train_loss": -22.299571990966797, "global_step": 117125, "epoch": 1411} {"train_loss": -21.615554809570312, "global_step": 117126, "epoch": 1411} {"train_loss": -22.112388610839844, "global_step": 117127, "epoch": 1411} {"train_loss": -22.201963424682617, "global_step": 117128, "epoch": 1411} {"train_loss": -22.07624626159668, "global_step": 117129, "epoch": 1411} {"train_loss": -22.23368263244629, "global_step": 117130, "epoch": 1411} {"train_loss": -22.283740997314453, "global_step": 117131, "epoch": 1411} {"train_loss": -22.052698135375977, "global_step": 117132, "epoch": 1411} {"train_loss": -22.194244384765625, "global_step": 117133, "epoch": 1411} {"train_loss": -22.438322067260742, "global_step": 117134, "epoch": 1411} {"train_loss": -22.28160285949707, "global_step": 117135, "epoch": 1411} {"train_loss": -22.184486389160156, "global_step": 117136, "epoch": 1411} {"train_loss": -22.485260009765625, "global_step": 117137, "epoch": 1411} {"train_loss": -22.282306671142578, "global_step": 117138, "epoch": 1411} {"train_loss": -22.218847274780273, "global_step": 117139, "epoch": 1411} {"train_loss": -22.956878662109375, "global_step": 117140, "epoch": 1411} {"train_loss": -22.35552978515625, "global_step": 117141, "epoch": 1411} {"train_loss": -22.385913848876953, "global_step": 117142, "epoch": 1411} {"train_loss": -22.734609603881836, "global_step": 117143, "epoch": 1411} {"train_loss": -22.500532150268555, "global_step": 117144, "epoch": 1411} {"train_loss": -22.215633392333984, "global_step": 117145, "epoch": 1411} {"train_loss": -22.20991325378418, "global_step": 117146, "epoch": 1411} {"train_loss": -22.19301986694336, "global_step": 117147, "epoch": 1411} {"train_loss": -22.514692306518555, "global_step": 117148, "epoch": 1411} {"train_loss": -22.358762741088867, "global_step": 117149, "epoch": 1411} {"train_loss": -22.59073829650879, "global_step": 117150, "epoch": 1411} {"train_loss": -22.4678955078125, "global_step": 117151, "epoch": 1411} {"train_loss": -22.809003829956055, "global_step": 117152, "epoch": 1411} {"train_loss": -22.190549850463867, "global_step": 117153, "epoch": 1411} {"train_loss": -22.66464614868164, "global_step": 117154, "epoch": 1411} {"train_loss": -22.869277954101562, "global_step": 117155, "epoch": 1411} {"train_loss": -22.717548370361328, "global_step": 117156, "epoch": 1411} {"train_loss": -22.415292739868164, "global_step": 117157, "epoch": 1411} {"train_loss": -22.591651916503906, "global_step": 117158, "epoch": 1411} {"train_loss": -22.460363388061523, "global_step": 117159, "epoch": 1411} {"train_loss": -23.03203773498535, "global_step": 117160, "epoch": 1411} {"train_loss": -22.318653106689453, "global_step": 117161, "epoch": 1411} {"train_loss": -22.50650978088379, "global_step": 117162, "epoch": 1411} {"train_loss": -22.55402183532715, "global_step": 117163, "epoch": 1411} {"train_loss": -22.374216079711914, "global_step": 117164, "epoch": 1411} {"train_loss": -22.286230087280273, "global_step": 117165, "epoch": 1411} {"train_loss": -22.318674087524414, "global_step": 117166, "epoch": 1411} {"train_loss": -22.080440521240234, "global_step": 117167, "epoch": 1411} {"train_loss": -22.593564987182617, "global_step": 117168, "epoch": 1411} {"train_loss": -22.659818649291992, "global_step": 117169, "epoch": 1411} {"train_loss": -22.24538803100586, "global_step": 117170, "epoch": 1411} {"train_loss": -22.18623161315918, "global_step": 117171, "epoch": 1411} {"train_loss": -22.067001342773438, "global_step": 117172, "epoch": 1411} {"train_loss": -21.91279411315918, "global_step": 117173, "epoch": 1411} {"train_loss": -22.516918182373047, "global_step": 117174, "epoch": 1411} {"train_loss": -22.499755859375, "global_step": 117175, "epoch": 1411} {"train_loss": -22.61065673828125, "global_step": 117176, "epoch": 1411} {"train_loss": -22.197528839111328, "global_step": 117177, "epoch": 1411} {"train_loss": -22.535293579101562, "global_step": 117178, "epoch": 1411} {"train_loss": -22.02448081970215, "global_step": 117179, "epoch": 1411} {"train_loss": -22.520437240600586, "global_step": 117180, "epoch": 1411} {"train_loss": -22.125104904174805, "global_step": 117181, "epoch": 1411} {"train_loss": -22.593320846557617, "global_step": 117182, "epoch": 1411} {"train_loss": -22.311298370361328, "global_step": 117183, "epoch": 1411} {"train_loss": -22.677000045776367, "global_step": 117184, "epoch": 1411} {"train_loss": -22.53070831298828, "global_step": 117185, "epoch": 1411} {"train_loss": -22.427082061767578, "global_step": 117186, "epoch": 1411} {"train_loss": -22.498859405517578, "global_step": 117187, "epoch": 1411} {"train_loss": -22.351573944091797, "global_step": 117188, "epoch": 1411} {"train_loss": -22.28118324279785, "global_step": 117189, "epoch": 1411} {"train_loss": -22.566638946533203, "global_step": 117190, "epoch": 1411} {"train_loss": -22.390621185302734, "global_step": 117191, "epoch": 1411} {"train_loss": -22.5147647857666, "global_step": 117192, "epoch": 1411} {"train_loss": -22.405256271362305, "global_step": 117193, "epoch": 1411} {"train_loss": -22.60883903503418, "global_step": 117194, "epoch": 1411} {"train_loss": -22.317002813500093, "global_step": 117195, "epoch": 1411, "val_loss": 6277456.0} {"train_loss": -22.15448570251465, "global_step": 117196, "epoch": 1412} {"train_loss": -22.025758743286133, "global_step": 117197, "epoch": 1412} {"train_loss": -22.282398223876953, "global_step": 117198, "epoch": 1412} {"train_loss": -22.13799476623535, "global_step": 117199, "epoch": 1412} {"train_loss": -22.33987808227539, "global_step": 117200, "epoch": 1412} {"train_loss": -22.240894317626953, "global_step": 117201, "epoch": 1412} {"train_loss": -22.082666397094727, "global_step": 117202, "epoch": 1412} {"train_loss": -22.49629783630371, "global_step": 117203, "epoch": 1412} {"train_loss": -21.91973304748535, "global_step": 117204, "epoch": 1412} {"train_loss": -21.9146785736084, "global_step": 117205, "epoch": 1412} {"train_loss": -22.12504005432129, "global_step": 117206, "epoch": 1412} {"train_loss": -22.51085662841797, "global_step": 117207, "epoch": 1412} {"train_loss": -22.714902877807617, "global_step": 117208, "epoch": 1412} {"train_loss": -22.204227447509766, "global_step": 117209, "epoch": 1412} {"train_loss": -22.337589263916016, "global_step": 117210, "epoch": 1412} {"train_loss": -22.595401763916016, "global_step": 117211, "epoch": 1412} {"train_loss": -22.622716903686523, "global_step": 117212, "epoch": 1412} {"train_loss": -22.362850189208984, "global_step": 117213, "epoch": 1412} {"train_loss": -22.809398651123047, "global_step": 117214, "epoch": 1412} {"train_loss": -22.25504493713379, "global_step": 117215, "epoch": 1412} {"train_loss": -22.136816024780273, "global_step": 117216, "epoch": 1412} {"train_loss": -22.572778701782227, "global_step": 117217, "epoch": 1412} {"train_loss": -22.5831356048584, "global_step": 117218, "epoch": 1412} {"train_loss": -22.45623016357422, "global_step": 117219, "epoch": 1412} {"train_loss": -22.251615524291992, "global_step": 117220, "epoch": 1412} {"train_loss": -22.56805419921875, "global_step": 117221, "epoch": 1412} {"train_loss": -22.39686393737793, "global_step": 117222, "epoch": 1412} {"train_loss": -22.291881561279297, "global_step": 117223, "epoch": 1412} {"train_loss": -22.21030044555664, "global_step": 117224, "epoch": 1412} {"train_loss": -22.28376007080078, "global_step": 117225, "epoch": 1412} {"train_loss": -22.417285919189453, "global_step": 117226, "epoch": 1412} {"train_loss": -22.919984817504883, "global_step": 117227, "epoch": 1412} {"train_loss": -22.410978317260742, "global_step": 117228, "epoch": 1412} {"train_loss": -22.555133819580078, "global_step": 117229, "epoch": 1412} {"train_loss": -22.00956916809082, "global_step": 117230, "epoch": 1412} {"train_loss": -22.607866287231445, "global_step": 117231, "epoch": 1412} {"train_loss": -22.717529296875, "global_step": 117232, "epoch": 1412} {"train_loss": -22.606163024902344, "global_step": 117233, "epoch": 1412} {"train_loss": -22.753122329711914, "global_step": 117234, "epoch": 1412} {"train_loss": -22.769628524780273, "global_step": 117235, "epoch": 1412} {"train_loss": -22.66448974609375, "global_step": 117236, "epoch": 1412} {"train_loss": -22.4320011138916, "global_step": 117237, "epoch": 1412} {"train_loss": -22.5363826751709, "global_step": 117238, "epoch": 1412} {"train_loss": -22.841711044311523, "global_step": 117239, "epoch": 1412} {"train_loss": -22.665485382080078, "global_step": 117240, "epoch": 1412} {"train_loss": -22.425413131713867, "global_step": 117241, "epoch": 1412} {"train_loss": -22.83669090270996, "global_step": 117242, "epoch": 1412} {"train_loss": -22.410877227783203, "global_step": 117243, "epoch": 1412} {"train_loss": -22.645294189453125, "global_step": 117244, "epoch": 1412} {"train_loss": -22.412206649780273, "global_step": 117245, "epoch": 1412} {"train_loss": -22.491865158081055, "global_step": 117246, "epoch": 1412} {"train_loss": -22.647781372070312, "global_step": 117247, "epoch": 1412} {"train_loss": -22.409143447875977, "global_step": 117248, "epoch": 1412} {"train_loss": -22.533401489257812, "global_step": 117249, "epoch": 1412} {"train_loss": -22.445955276489258, "global_step": 117250, "epoch": 1412} {"train_loss": -22.838123321533203, "global_step": 117251, "epoch": 1412} {"train_loss": -22.43549919128418, "global_step": 117252, "epoch": 1412} {"train_loss": -22.493824005126953, "global_step": 117253, "epoch": 1412} {"train_loss": -22.31658363342285, "global_step": 117254, "epoch": 1412} {"train_loss": -22.55434226989746, "global_step": 117255, "epoch": 1412} {"train_loss": -22.932199478149414, "global_step": 117256, "epoch": 1412} {"train_loss": -22.13768768310547, "global_step": 117257, "epoch": 1412} {"train_loss": -22.43986701965332, "global_step": 117258, "epoch": 1412} {"train_loss": -22.851566314697266, "global_step": 117259, "epoch": 1412} {"train_loss": -22.137208938598633, "global_step": 117260, "epoch": 1412} {"train_loss": -22.484298706054688, "global_step": 117261, "epoch": 1412} {"train_loss": -22.272756576538086, "global_step": 117262, "epoch": 1412} {"train_loss": -22.606586456298828, "global_step": 117263, "epoch": 1412} {"train_loss": -22.05038833618164, "global_step": 117264, "epoch": 1412} {"train_loss": -22.378969192504883, "global_step": 117265, "epoch": 1412} {"train_loss": -22.332597732543945, "global_step": 117266, "epoch": 1412} {"train_loss": -22.536834716796875, "global_step": 117267, "epoch": 1412} {"train_loss": -22.62765884399414, "global_step": 117268, "epoch": 1412} {"train_loss": -22.515161514282227, "global_step": 117269, "epoch": 1412} {"train_loss": -22.1859188079834, "global_step": 117270, "epoch": 1412} {"train_loss": -22.635528564453125, "global_step": 117271, "epoch": 1412} {"train_loss": -22.325576782226562, "global_step": 117272, "epoch": 1412} {"train_loss": -22.31097984313965, "global_step": 117273, "epoch": 1412} {"train_loss": -22.444120407104492, "global_step": 117274, "epoch": 1412} {"train_loss": -22.232318878173828, "global_step": 117275, "epoch": 1412} {"train_loss": -22.39109230041504, "global_step": 117276, "epoch": 1412} {"train_loss": -22.11966323852539, "global_step": 117277, "epoch": 1412} {"train_loss": -22.420216020331324, "global_step": 117278, "epoch": 1412, "val_loss": 6120123.5} {"train_loss": -22.135122299194336, "global_step": 117279, "epoch": 1413} {"train_loss": -22.39274787902832, "global_step": 117280, "epoch": 1413} {"train_loss": -21.798351287841797, "global_step": 117281, "epoch": 1413} {"train_loss": -22.017601013183594, "global_step": 117282, "epoch": 1413} {"train_loss": -22.297531127929688, "global_step": 117283, "epoch": 1413} {"train_loss": -21.80071449279785, "global_step": 117284, "epoch": 1413} {"train_loss": -21.85968017578125, "global_step": 117285, "epoch": 1413} {"train_loss": -22.17951011657715, "global_step": 117286, "epoch": 1413} {"train_loss": -22.312015533447266, "global_step": 117287, "epoch": 1413} {"train_loss": -22.524564743041992, "global_step": 117288, "epoch": 1413} {"train_loss": -22.19821548461914, "global_step": 117289, "epoch": 1413} {"train_loss": -22.564294815063477, "global_step": 117290, "epoch": 1413} {"train_loss": -22.146535873413086, "global_step": 117291, "epoch": 1413} {"train_loss": -22.270893096923828, "global_step": 117292, "epoch": 1413} {"train_loss": -22.17715835571289, "global_step": 117293, "epoch": 1413} {"train_loss": -22.408233642578125, "global_step": 117294, "epoch": 1413} {"train_loss": -22.116193771362305, "global_step": 117295, "epoch": 1413} {"train_loss": -22.302974700927734, "global_step": 117296, "epoch": 1413} {"train_loss": -22.335004806518555, "global_step": 117297, "epoch": 1413} {"train_loss": -22.25598907470703, "global_step": 117298, "epoch": 1413} {"train_loss": -22.361433029174805, "global_step": 117299, "epoch": 1413} {"train_loss": -21.98871421813965, "global_step": 117300, "epoch": 1413} {"train_loss": -22.143156051635742, "global_step": 117301, "epoch": 1413} {"train_loss": -22.105609893798828, "global_step": 117302, "epoch": 1413} {"train_loss": -21.97397232055664, "global_step": 117303, "epoch": 1413} {"train_loss": -22.582765579223633, "global_step": 117304, "epoch": 1413} {"train_loss": -22.735919952392578, "global_step": 117305, "epoch": 1413} {"train_loss": -22.51106834411621, "global_step": 117306, "epoch": 1413} {"train_loss": -22.37868309020996, "global_step": 117307, "epoch": 1413} {"train_loss": -22.263507843017578, "global_step": 117308, "epoch": 1413} {"train_loss": -22.493432998657227, "global_step": 117309, "epoch": 1413} {"train_loss": -22.113895416259766, "global_step": 117310, "epoch": 1413} {"train_loss": -22.644163131713867, "global_step": 117311, "epoch": 1413} {"train_loss": -22.8704833984375, "global_step": 117312, "epoch": 1413} {"train_loss": -22.50238037109375, "global_step": 117313, "epoch": 1413} {"train_loss": -22.438674926757812, "global_step": 117314, "epoch": 1413} {"train_loss": -22.648000717163086, "global_step": 117315, "epoch": 1413} {"train_loss": -22.610761642456055, "global_step": 117316, "epoch": 1413} {"train_loss": -21.98286247253418, "global_step": 117317, "epoch": 1413} {"train_loss": -22.505102157592773, "global_step": 117318, "epoch": 1413} {"train_loss": -22.52828025817871, "global_step": 117319, "epoch": 1413} {"train_loss": -22.580310821533203, "global_step": 117320, "epoch": 1413} {"train_loss": -22.202665328979492, "global_step": 117321, "epoch": 1413} {"train_loss": -22.751371383666992, "global_step": 117322, "epoch": 1413} {"train_loss": -22.712533950805664, "global_step": 117323, "epoch": 1413} {"train_loss": -22.652334213256836, "global_step": 117324, "epoch": 1413} {"train_loss": -22.434091567993164, "global_step": 117325, "epoch": 1413} {"train_loss": -22.226438522338867, "global_step": 117326, "epoch": 1413} {"train_loss": -22.5678768157959, "global_step": 117327, "epoch": 1413} {"train_loss": -22.47639274597168, "global_step": 117328, "epoch": 1413} {"train_loss": -22.178203582763672, "global_step": 117329, "epoch": 1413} {"train_loss": -22.738691329956055, "global_step": 117330, "epoch": 1413} {"train_loss": -22.043909072875977, "global_step": 117331, "epoch": 1413} {"train_loss": -22.452880859375, "global_step": 117332, "epoch": 1413} {"train_loss": -22.644546508789062, "global_step": 117333, "epoch": 1413} {"train_loss": -22.228845596313477, "global_step": 117334, "epoch": 1413} {"train_loss": -22.675809860229492, "global_step": 117335, "epoch": 1413} {"train_loss": -22.562353134155273, "global_step": 117336, "epoch": 1413} {"train_loss": -22.220794677734375, "global_step": 117337, "epoch": 1413} {"train_loss": -22.412965774536133, "global_step": 117338, "epoch": 1413} {"train_loss": -22.72014617919922, "global_step": 117339, "epoch": 1413} {"train_loss": -22.066062927246094, "global_step": 117340, "epoch": 1413} {"train_loss": -22.366283416748047, "global_step": 117341, "epoch": 1413} {"train_loss": -22.0731201171875, "global_step": 117342, "epoch": 1413} {"train_loss": -22.398773193359375, "global_step": 117343, "epoch": 1413} {"train_loss": -22.152175903320312, "global_step": 117344, "epoch": 1413} {"train_loss": -22.728567123413086, "global_step": 117345, "epoch": 1413} {"train_loss": -22.4514102935791, "global_step": 117346, "epoch": 1413} {"train_loss": -22.454374313354492, "global_step": 117347, "epoch": 1413} {"train_loss": -22.10153579711914, "global_step": 117348, "epoch": 1413} {"train_loss": -22.41704559326172, "global_step": 117349, "epoch": 1413} {"train_loss": -22.10005760192871, "global_step": 117350, "epoch": 1413} {"train_loss": -22.343276977539062, "global_step": 117351, "epoch": 1413} {"train_loss": -22.636356353759766, "global_step": 117352, "epoch": 1413} {"train_loss": -22.532438278198242, "global_step": 117353, "epoch": 1413} {"train_loss": -22.808563232421875, "global_step": 117354, "epoch": 1413} {"train_loss": -22.638071060180664, "global_step": 117355, "epoch": 1413} {"train_loss": -22.4440860748291, "global_step": 117356, "epoch": 1413} {"train_loss": -22.452091217041016, "global_step": 117357, "epoch": 1413} {"train_loss": -22.579944610595703, "global_step": 117358, "epoch": 1413} {"train_loss": -22.852136611938477, "global_step": 117359, "epoch": 1413} {"train_loss": -22.552505493164062, "global_step": 117360, "epoch": 1413} {"train_loss": -22.374907528061463, "global_step": 117361, "epoch": 1413, "val_loss": 6264189.0} {"train_loss": -22.40519142150879, "global_step": 117362, "epoch": 1414} {"train_loss": -21.940847396850586, "global_step": 117363, "epoch": 1414} {"train_loss": -22.123029708862305, "global_step": 117364, "epoch": 1414} {"train_loss": -21.9189395904541, "global_step": 117365, "epoch": 1414} {"train_loss": -22.163698196411133, "global_step": 117366, "epoch": 1414} {"train_loss": -22.238454818725586, "global_step": 117367, "epoch": 1414} {"train_loss": -22.318111419677734, "global_step": 117368, "epoch": 1414} {"train_loss": -22.435571670532227, "global_step": 117369, "epoch": 1414} {"train_loss": -22.14069938659668, "global_step": 117370, "epoch": 1414} {"train_loss": -22.332489013671875, "global_step": 117371, "epoch": 1414} {"train_loss": -22.205007553100586, "global_step": 117372, "epoch": 1414} {"train_loss": -21.968175888061523, "global_step": 117373, "epoch": 1414} {"train_loss": -22.307287216186523, "global_step": 117374, "epoch": 1414} {"train_loss": -22.19624900817871, "global_step": 117375, "epoch": 1414} {"train_loss": -22.420764923095703, "global_step": 117376, "epoch": 1414} {"train_loss": -22.30638313293457, "global_step": 117377, "epoch": 1414} {"train_loss": -22.411535263061523, "global_step": 117378, "epoch": 1414} {"train_loss": -22.385183334350586, "global_step": 117379, "epoch": 1414} {"train_loss": -22.31935691833496, "global_step": 117380, "epoch": 1414} {"train_loss": -22.52811050415039, "global_step": 117381, "epoch": 1414} {"train_loss": -22.30291175842285, "global_step": 117382, "epoch": 1414} {"train_loss": -22.648033142089844, "global_step": 117383, "epoch": 1414} {"train_loss": -22.449941635131836, "global_step": 117384, "epoch": 1414} {"train_loss": -22.713581085205078, "global_step": 117385, "epoch": 1414} {"train_loss": -22.781843185424805, "global_step": 117386, "epoch": 1414} {"train_loss": -22.54151725769043, "global_step": 117387, "epoch": 1414} {"train_loss": -22.37994956970215, "global_step": 117388, "epoch": 1414} {"train_loss": -22.634740829467773, "global_step": 117389, "epoch": 1414} {"train_loss": -22.04498863220215, "global_step": 117390, "epoch": 1414} {"train_loss": -22.6127872467041, "global_step": 117391, "epoch": 1414} {"train_loss": -22.48773765563965, "global_step": 117392, "epoch": 1414} {"train_loss": -22.675161361694336, "global_step": 117393, "epoch": 1414} {"train_loss": -22.77615737915039, "global_step": 117394, "epoch": 1414} {"train_loss": -22.742477416992188, "global_step": 117395, "epoch": 1414} {"train_loss": -22.468257904052734, "global_step": 117396, "epoch": 1414} {"train_loss": -22.24186134338379, "global_step": 117397, "epoch": 1414} {"train_loss": -22.67189598083496, "global_step": 117398, "epoch": 1414} {"train_loss": -22.649633407592773, "global_step": 117399, "epoch": 1414} {"train_loss": -22.25307846069336, "global_step": 117400, "epoch": 1414} {"train_loss": -22.444730758666992, "global_step": 117401, "epoch": 1414} {"train_loss": -22.761594772338867, "global_step": 117402, "epoch": 1414} {"train_loss": -22.683473587036133, "global_step": 117403, "epoch": 1414} {"train_loss": -22.72603416442871, "global_step": 117404, "epoch": 1414} {"train_loss": -22.37148094177246, "global_step": 117405, "epoch": 1414} {"train_loss": -22.566539764404297, "global_step": 117406, "epoch": 1414} {"train_loss": -22.676433563232422, "global_step": 117407, "epoch": 1414} {"train_loss": -22.75737190246582, "global_step": 117408, "epoch": 1414} {"train_loss": -21.916990280151367, "global_step": 117409, "epoch": 1414} {"train_loss": -22.568592071533203, "global_step": 117410, "epoch": 1414} {"train_loss": -22.09689712524414, "global_step": 117411, "epoch": 1414} {"train_loss": -22.3443603515625, "global_step": 117412, "epoch": 1414} {"train_loss": -22.450366973876953, "global_step": 117413, "epoch": 1414} {"train_loss": -22.501134872436523, "global_step": 117414, "epoch": 1414} {"train_loss": -22.775392532348633, "global_step": 117415, "epoch": 1414} {"train_loss": -22.51721954345703, "global_step": 117416, "epoch": 1414} {"train_loss": -22.75522232055664, "global_step": 117417, "epoch": 1414} {"train_loss": -22.542917251586914, "global_step": 117418, "epoch": 1414} {"train_loss": -22.53059196472168, "global_step": 117419, "epoch": 1414} {"train_loss": -22.279788970947266, "global_step": 117420, "epoch": 1414} {"train_loss": -22.60851287841797, "global_step": 117421, "epoch": 1414} {"train_loss": -22.234392166137695, "global_step": 117422, "epoch": 1414} {"train_loss": -22.76721954345703, "global_step": 117423, "epoch": 1414} {"train_loss": -22.14180564880371, "global_step": 117424, "epoch": 1414} {"train_loss": -22.279626846313477, "global_step": 117425, "epoch": 1414} {"train_loss": -22.815860748291016, "global_step": 117426, "epoch": 1414} {"train_loss": -22.539020538330078, "global_step": 117427, "epoch": 1414} {"train_loss": -22.920461654663086, "global_step": 117428, "epoch": 1414} {"train_loss": -22.64468002319336, "global_step": 117429, "epoch": 1414} {"train_loss": -22.664228439331055, "global_step": 117430, "epoch": 1414} {"train_loss": -22.755077362060547, "global_step": 117431, "epoch": 1414} {"train_loss": -22.51227378845215, "global_step": 117432, "epoch": 1414} {"train_loss": -22.02021598815918, "global_step": 117433, "epoch": 1414} {"train_loss": -22.35548210144043, "global_step": 117434, "epoch": 1414} {"train_loss": -22.582643508911133, "global_step": 117435, "epoch": 1414} {"train_loss": -22.11260414123535, "global_step": 117436, "epoch": 1414} {"train_loss": -22.49055290222168, "global_step": 117437, "epoch": 1414} {"train_loss": -22.55458641052246, "global_step": 117438, "epoch": 1414} {"train_loss": -22.329509735107422, "global_step": 117439, "epoch": 1414} {"train_loss": -22.473493576049805, "global_step": 117440, "epoch": 1414} {"train_loss": -22.352828979492188, "global_step": 117441, "epoch": 1414} {"train_loss": -22.300344467163086, "global_step": 117442, "epoch": 1414} {"train_loss": -22.608015060424805, "global_step": 117443, "epoch": 1414} {"train_loss": -22.45522363501859, "global_step": 117444, "epoch": 1414, "val_loss": 6297261.0} {"train_loss": -22.41366195678711, "global_step": 117445, "epoch": 1415} {"train_loss": -22.177505493164062, "global_step": 117446, "epoch": 1415} {"train_loss": -22.37749481201172, "global_step": 117447, "epoch": 1415} {"train_loss": -22.06609535217285, "global_step": 117448, "epoch": 1415} {"train_loss": -22.031328201293945, "global_step": 117449, "epoch": 1415} {"train_loss": -22.297443389892578, "global_step": 117450, "epoch": 1415} {"train_loss": -22.2253360748291, "global_step": 117451, "epoch": 1415} {"train_loss": -22.15655517578125, "global_step": 117452, "epoch": 1415} {"train_loss": -22.129077911376953, "global_step": 117453, "epoch": 1415} {"train_loss": -22.187023162841797, "global_step": 117454, "epoch": 1415} {"train_loss": -22.644622802734375, "global_step": 117455, "epoch": 1415} {"train_loss": -22.131805419921875, "global_step": 117456, "epoch": 1415} {"train_loss": -22.52804946899414, "global_step": 117457, "epoch": 1415} {"train_loss": -22.38331413269043, "global_step": 117458, "epoch": 1415} {"train_loss": -22.50101089477539, "global_step": 117459, "epoch": 1415} {"train_loss": -22.864316940307617, "global_step": 117460, "epoch": 1415} {"train_loss": -22.292545318603516, "global_step": 117461, "epoch": 1415} {"train_loss": -22.17401695251465, "global_step": 117462, "epoch": 1415} {"train_loss": -22.474781036376953, "global_step": 117463, "epoch": 1415} {"train_loss": -22.537805557250977, "global_step": 117464, "epoch": 1415} {"train_loss": -22.56371307373047, "global_step": 117465, "epoch": 1415} {"train_loss": -22.337629318237305, "global_step": 117466, "epoch": 1415} {"train_loss": -22.51155662536621, "global_step": 117467, "epoch": 1415} {"train_loss": -22.459854125976562, "global_step": 117468, "epoch": 1415} {"train_loss": -22.463489532470703, "global_step": 117469, "epoch": 1415} {"train_loss": -21.870521545410156, "global_step": 117470, "epoch": 1415} {"train_loss": -22.547286987304688, "global_step": 117471, "epoch": 1415} {"train_loss": -22.464778900146484, "global_step": 117472, "epoch": 1415} {"train_loss": -22.394962310791016, "global_step": 117473, "epoch": 1415} {"train_loss": -22.38551902770996, "global_step": 117474, "epoch": 1415} {"train_loss": -22.25320816040039, "global_step": 117475, "epoch": 1415} {"train_loss": -22.695053100585938, "global_step": 117476, "epoch": 1415} {"train_loss": -22.3792667388916, "global_step": 117477, "epoch": 1415} {"train_loss": -22.366535186767578, "global_step": 117478, "epoch": 1415} {"train_loss": -22.25787353515625, "global_step": 117479, "epoch": 1415} {"train_loss": -22.117324829101562, "global_step": 117480, "epoch": 1415} {"train_loss": -22.519872665405273, "global_step": 117481, "epoch": 1415} {"train_loss": -22.48931884765625, "global_step": 117482, "epoch": 1415} {"train_loss": -22.456851959228516, "global_step": 117483, "epoch": 1415} {"train_loss": -22.37721824645996, "global_step": 117484, "epoch": 1415} {"train_loss": -22.608667373657227, "global_step": 117485, "epoch": 1415} {"train_loss": -22.224016189575195, "global_step": 117486, "epoch": 1415} {"train_loss": -22.252286911010742, "global_step": 117487, "epoch": 1415} {"train_loss": -22.366262435913086, "global_step": 117488, "epoch": 1415} {"train_loss": -22.29882049560547, "global_step": 117489, "epoch": 1415} {"train_loss": -22.13930892944336, "global_step": 117490, "epoch": 1415} {"train_loss": -21.989505767822266, "global_step": 117491, "epoch": 1415} {"train_loss": -22.29599952697754, "global_step": 117492, "epoch": 1415} {"train_loss": -22.486997604370117, "global_step": 117493, "epoch": 1415} {"train_loss": -22.46179962158203, "global_step": 117494, "epoch": 1415} {"train_loss": -22.191997528076172, "global_step": 117495, "epoch": 1415} {"train_loss": -22.133346557617188, "global_step": 117496, "epoch": 1415} {"train_loss": -22.547348022460938, "global_step": 117497, "epoch": 1415} {"train_loss": -22.051965713500977, "global_step": 117498, "epoch": 1415} {"train_loss": -22.243366241455078, "global_step": 117499, "epoch": 1415} {"train_loss": -22.336957931518555, "global_step": 117500, "epoch": 1415} {"train_loss": -22.374521255493164, "global_step": 117501, "epoch": 1415} {"train_loss": -22.271976470947266, "global_step": 117502, "epoch": 1415} {"train_loss": -22.378957748413086, "global_step": 117503, "epoch": 1415} {"train_loss": -22.587533950805664, "global_step": 117504, "epoch": 1415} {"train_loss": -22.710390090942383, "global_step": 117505, "epoch": 1415} {"train_loss": -22.493953704833984, "global_step": 117506, "epoch": 1415} {"train_loss": -22.145919799804688, "global_step": 117507, "epoch": 1415} {"train_loss": -22.5787353515625, "global_step": 117508, "epoch": 1415} {"train_loss": -22.149906158447266, "global_step": 117509, "epoch": 1415} {"train_loss": -22.235088348388672, "global_step": 117510, "epoch": 1415} {"train_loss": -22.62131690979004, "global_step": 117511, "epoch": 1415} {"train_loss": -22.521371841430664, "global_step": 117512, "epoch": 1415} {"train_loss": -22.663206100463867, "global_step": 117513, "epoch": 1415} {"train_loss": -22.536832809448242, "global_step": 117514, "epoch": 1415} {"train_loss": -22.355812072753906, "global_step": 117515, "epoch": 1415} {"train_loss": -22.427236557006836, "global_step": 117516, "epoch": 1415} {"train_loss": -22.660085678100586, "global_step": 117517, "epoch": 1415} {"train_loss": -22.230854034423828, "global_step": 117518, "epoch": 1415} {"train_loss": -22.906238555908203, "global_step": 117519, "epoch": 1415} {"train_loss": -22.758508682250977, "global_step": 117520, "epoch": 1415} {"train_loss": -22.733304977416992, "global_step": 117521, "epoch": 1415} {"train_loss": -22.738035202026367, "global_step": 117522, "epoch": 1415} {"train_loss": -22.141157150268555, "global_step": 117523, "epoch": 1415} {"train_loss": -22.811967849731445, "global_step": 117524, "epoch": 1415} {"train_loss": -22.711210250854492, "global_step": 117525, "epoch": 1415} {"train_loss": -22.553091049194336, "global_step": 117526, "epoch": 1415} {"train_loss": -22.406139052057842, "global_step": 117527, "epoch": 1415, "val_loss": 6087336.0} {"train_loss": -21.83253288269043, "global_step": 117528, "epoch": 1416} {"train_loss": -22.091739654541016, "global_step": 117529, "epoch": 1416} {"train_loss": -22.140613555908203, "global_step": 117530, "epoch": 1416} {"train_loss": -22.268537521362305, "global_step": 117531, "epoch": 1416} {"train_loss": -22.058231353759766, "global_step": 117532, "epoch": 1416} {"train_loss": -22.48915672302246, "global_step": 117533, "epoch": 1416} {"train_loss": -21.874313354492188, "global_step": 117534, "epoch": 1416} {"train_loss": -21.978939056396484, "global_step": 117535, "epoch": 1416} {"train_loss": -22.179439544677734, "global_step": 117536, "epoch": 1416} {"train_loss": -22.26618003845215, "global_step": 117537, "epoch": 1416} {"train_loss": -22.060474395751953, "global_step": 117538, "epoch": 1416} {"train_loss": -22.74379539489746, "global_step": 117539, "epoch": 1416} {"train_loss": -22.189346313476562, "global_step": 117540, "epoch": 1416} {"train_loss": -22.48837661743164, "global_step": 117541, "epoch": 1416} {"train_loss": -22.40154457092285, "global_step": 117542, "epoch": 1416} {"train_loss": -22.34462547302246, "global_step": 117543, "epoch": 1416} {"train_loss": -22.31142234802246, "global_step": 117544, "epoch": 1416} {"train_loss": -22.600584030151367, "global_step": 117545, "epoch": 1416} {"train_loss": -22.796606063842773, "global_step": 117546, "epoch": 1416} {"train_loss": -22.223661422729492, "global_step": 117547, "epoch": 1416} {"train_loss": -22.652498245239258, "global_step": 117548, "epoch": 1416} {"train_loss": -22.428091049194336, "global_step": 117549, "epoch": 1416} {"train_loss": -22.695207595825195, "global_step": 117550, "epoch": 1416} {"train_loss": -21.91786766052246, "global_step": 117551, "epoch": 1416} {"train_loss": -22.63416290283203, "global_step": 117552, "epoch": 1416} {"train_loss": -22.287363052368164, "global_step": 117553, "epoch": 1416} {"train_loss": -22.45551109313965, "global_step": 117554, "epoch": 1416} {"train_loss": -22.947355270385742, "global_step": 117555, "epoch": 1416} {"train_loss": -22.138225555419922, "global_step": 117556, "epoch": 1416} {"train_loss": -22.304407119750977, "global_step": 117557, "epoch": 1416} {"train_loss": -22.362552642822266, "global_step": 117558, "epoch": 1416} {"train_loss": -22.31854820251465, "global_step": 117559, "epoch": 1416} {"train_loss": -22.394968032836914, "global_step": 117560, "epoch": 1416} {"train_loss": -22.523529052734375, "global_step": 117561, "epoch": 1416} {"train_loss": -22.196516036987305, "global_step": 117562, "epoch": 1416} {"train_loss": -22.712064743041992, "global_step": 117563, "epoch": 1416} {"train_loss": -22.54340934753418, "global_step": 117564, "epoch": 1416} {"train_loss": -22.41587257385254, "global_step": 117565, "epoch": 1416} {"train_loss": -22.14705467224121, "global_step": 117566, "epoch": 1416} {"train_loss": -22.242454528808594, "global_step": 117567, "epoch": 1416} {"train_loss": -22.56802749633789, "global_step": 117568, "epoch": 1416} {"train_loss": -21.922391891479492, "global_step": 117569, "epoch": 1416} {"train_loss": -22.258577346801758, "global_step": 117570, "epoch": 1416} {"train_loss": -22.799657821655273, "global_step": 117571, "epoch": 1416} {"train_loss": -22.448915481567383, "global_step": 117572, "epoch": 1416} {"train_loss": -22.48541831970215, "global_step": 117573, "epoch": 1416} {"train_loss": -22.68459129333496, "global_step": 117574, "epoch": 1416} {"train_loss": -22.45747184753418, "global_step": 117575, "epoch": 1416} {"train_loss": -22.44470977783203, "global_step": 117576, "epoch": 1416} {"train_loss": -22.302295684814453, "global_step": 117577, "epoch": 1416} {"train_loss": -22.51227378845215, "global_step": 117578, "epoch": 1416} {"train_loss": -22.169843673706055, "global_step": 117579, "epoch": 1416} {"train_loss": -22.188064575195312, "global_step": 117580, "epoch": 1416} {"train_loss": -22.748703002929688, "global_step": 117581, "epoch": 1416} {"train_loss": -22.51727867126465, "global_step": 117582, "epoch": 1416} {"train_loss": -22.511001586914062, "global_step": 117583, "epoch": 1416} {"train_loss": -22.27955436706543, "global_step": 117584, "epoch": 1416} {"train_loss": -22.405925750732422, "global_step": 117585, "epoch": 1416} {"train_loss": -22.15972137451172, "global_step": 117586, "epoch": 1416} {"train_loss": -22.536869049072266, "global_step": 117587, "epoch": 1416} {"train_loss": -22.270872116088867, "global_step": 117588, "epoch": 1416} {"train_loss": -22.369043350219727, "global_step": 117589, "epoch": 1416} {"train_loss": -22.46895980834961, "global_step": 117590, "epoch": 1416} {"train_loss": -22.46442985534668, "global_step": 117591, "epoch": 1416} {"train_loss": -22.338682174682617, "global_step": 117592, "epoch": 1416} {"train_loss": -22.49907875061035, "global_step": 117593, "epoch": 1416} {"train_loss": -22.33542251586914, "global_step": 117594, "epoch": 1416} {"train_loss": -22.36469841003418, "global_step": 117595, "epoch": 1416} {"train_loss": -22.358551025390625, "global_step": 117596, "epoch": 1416} {"train_loss": -22.65777587890625, "global_step": 117597, "epoch": 1416} {"train_loss": -22.449710845947266, "global_step": 117598, "epoch": 1416} {"train_loss": -22.549802780151367, "global_step": 117599, "epoch": 1416} {"train_loss": -22.717416763305664, "global_step": 117600, "epoch": 1416} {"train_loss": -22.535581588745117, "global_step": 117601, "epoch": 1416} {"train_loss": -22.073095321655273, "global_step": 117602, "epoch": 1416} {"train_loss": -22.33765411376953, "global_step": 117603, "epoch": 1416} {"train_loss": -22.685026168823242, "global_step": 117604, "epoch": 1416} {"train_loss": -22.553651809692383, "global_step": 117605, "epoch": 1416} {"train_loss": -22.81056022644043, "global_step": 117606, "epoch": 1416} {"train_loss": -22.6584529876709, "global_step": 117607, "epoch": 1416} {"train_loss": -22.786029815673828, "global_step": 117608, "epoch": 1416} {"train_loss": -22.57434844970703, "global_step": 117609, "epoch": 1416} {"train_loss": -22.40232318280691, "global_step": 117610, "epoch": 1416, "val_loss": 6145158.0} {"train_loss": -21.614715576171875, "global_step": 117611, "epoch": 1417} {"train_loss": -21.546424865722656, "global_step": 117612, "epoch": 1417} {"train_loss": -21.705490112304688, "global_step": 117613, "epoch": 1417} {"train_loss": -22.161888122558594, "global_step": 117614, "epoch": 1417} {"train_loss": -21.971569061279297, "global_step": 117615, "epoch": 1417} {"train_loss": -22.37863540649414, "global_step": 117616, "epoch": 1417} {"train_loss": -22.49039649963379, "global_step": 117617, "epoch": 1417} {"train_loss": -22.181596755981445, "global_step": 117618, "epoch": 1417} {"train_loss": -21.85273551940918, "global_step": 117619, "epoch": 1417} {"train_loss": -22.36724853515625, "global_step": 117620, "epoch": 1417} {"train_loss": -22.005346298217773, "global_step": 117621, "epoch": 1417} {"train_loss": -22.343542098999023, "global_step": 117622, "epoch": 1417} {"train_loss": -22.205041885375977, "global_step": 117623, "epoch": 1417} {"train_loss": -22.008438110351562, "global_step": 117624, "epoch": 1417} {"train_loss": -22.522008895874023, "global_step": 117625, "epoch": 1417} {"train_loss": -22.405445098876953, "global_step": 117626, "epoch": 1417} {"train_loss": -22.406240463256836, "global_step": 117627, "epoch": 1417} {"train_loss": -22.25115203857422, "global_step": 117628, "epoch": 1417} {"train_loss": -22.134695053100586, "global_step": 117629, "epoch": 1417} {"train_loss": -22.344106674194336, "global_step": 117630, "epoch": 1417} {"train_loss": -22.55729103088379, "global_step": 117631, "epoch": 1417} {"train_loss": -22.281965255737305, "global_step": 117632, "epoch": 1417} {"train_loss": -22.00241470336914, "global_step": 117633, "epoch": 1417} {"train_loss": -22.403156280517578, "global_step": 117634, "epoch": 1417} {"train_loss": -21.98074722290039, "global_step": 117635, "epoch": 1417} {"train_loss": -22.260671615600586, "global_step": 117636, "epoch": 1417} {"train_loss": -22.08949089050293, "global_step": 117637, "epoch": 1417} {"train_loss": -22.2679500579834, "global_step": 117638, "epoch": 1417} {"train_loss": -22.500797271728516, "global_step": 117639, "epoch": 1417} {"train_loss": -22.27861976623535, "global_step": 117640, "epoch": 1417} {"train_loss": -22.305484771728516, "global_step": 117641, "epoch": 1417} {"train_loss": -22.37009620666504, "global_step": 117642, "epoch": 1417} {"train_loss": -22.208600997924805, "global_step": 117643, "epoch": 1417} {"train_loss": -22.19276237487793, "global_step": 117644, "epoch": 1417} {"train_loss": -22.424169540405273, "global_step": 117645, "epoch": 1417} {"train_loss": -22.049833297729492, "global_step": 117646, "epoch": 1417} {"train_loss": -22.190479278564453, "global_step": 117647, "epoch": 1417} {"train_loss": -22.6622257232666, "global_step": 117648, "epoch": 1417} {"train_loss": -22.269559860229492, "global_step": 117649, "epoch": 1417} {"train_loss": -21.981359481811523, "global_step": 117650, "epoch": 1417} {"train_loss": -22.416362762451172, "global_step": 117651, "epoch": 1417} {"train_loss": -22.71550178527832, "global_step": 117652, "epoch": 1417} {"train_loss": -22.596471786499023, "global_step": 117653, "epoch": 1417} {"train_loss": -22.37892723083496, "global_step": 117654, "epoch": 1417} {"train_loss": -22.31821632385254, "global_step": 117655, "epoch": 1417} {"train_loss": -22.142230987548828, "global_step": 117656, "epoch": 1417} {"train_loss": -22.69777488708496, "global_step": 117657, "epoch": 1417} {"train_loss": -22.75809669494629, "global_step": 117658, "epoch": 1417} {"train_loss": -22.309295654296875, "global_step": 117659, "epoch": 1417} {"train_loss": -22.6342830657959, "global_step": 117660, "epoch": 1417} {"train_loss": -22.56129264831543, "global_step": 117661, "epoch": 1417} {"train_loss": -22.683645248413086, "global_step": 117662, "epoch": 1417} {"train_loss": -22.566543579101562, "global_step": 117663, "epoch": 1417} {"train_loss": -22.630325317382812, "global_step": 117664, "epoch": 1417} {"train_loss": -22.5240421295166, "global_step": 117665, "epoch": 1417} {"train_loss": -22.24808120727539, "global_step": 117666, "epoch": 1417} {"train_loss": -22.564640045166016, "global_step": 117667, "epoch": 1417} {"train_loss": -22.211030960083008, "global_step": 117668, "epoch": 1417} {"train_loss": -22.723098754882812, "global_step": 117669, "epoch": 1417} {"train_loss": -22.3590145111084, "global_step": 117670, "epoch": 1417} {"train_loss": -22.66019630432129, "global_step": 117671, "epoch": 1417} {"train_loss": -22.409442901611328, "global_step": 117672, "epoch": 1417} {"train_loss": -22.641021728515625, "global_step": 117673, "epoch": 1417} {"train_loss": -22.649629592895508, "global_step": 117674, "epoch": 1417} {"train_loss": -22.554479598999023, "global_step": 117675, "epoch": 1417} {"train_loss": -22.555652618408203, "global_step": 117676, "epoch": 1417} {"train_loss": -22.780235290527344, "global_step": 117677, "epoch": 1417} {"train_loss": -22.525665283203125, "global_step": 117678, "epoch": 1417} {"train_loss": -22.396203994750977, "global_step": 117679, "epoch": 1417} {"train_loss": -22.57459259033203, "global_step": 117680, "epoch": 1417} {"train_loss": -22.5347957611084, "global_step": 117681, "epoch": 1417} {"train_loss": -22.50946044921875, "global_step": 117682, "epoch": 1417} {"train_loss": -22.363828659057617, "global_step": 117683, "epoch": 1417} {"train_loss": -22.67829132080078, "global_step": 117684, "epoch": 1417} {"train_loss": -22.619796752929688, "global_step": 117685, "epoch": 1417} {"train_loss": -22.630409240722656, "global_step": 117686, "epoch": 1417} {"train_loss": -22.38040542602539, "global_step": 117687, "epoch": 1417} {"train_loss": -22.84589958190918, "global_step": 117688, "epoch": 1417} {"train_loss": -22.38006019592285, "global_step": 117689, "epoch": 1417} {"train_loss": -22.669084548950195, "global_step": 117690, "epoch": 1417} {"train_loss": -22.620834350585938, "global_step": 117691, "epoch": 1417} {"train_loss": -22.047727584838867, "global_step": 117692, "epoch": 1417} {"train_loss": -22.369462622217384, "global_step": 117693, "epoch": 1417, "val_loss": 6259816.0} {"train_loss": -22.120573043823242, "global_step": 117694, "epoch": 1418} {"train_loss": -21.47272300720215, "global_step": 117695, "epoch": 1418} {"train_loss": -22.034215927124023, "global_step": 117696, "epoch": 1418} {"train_loss": -22.022130966186523, "global_step": 117697, "epoch": 1418} {"train_loss": -22.264448165893555, "global_step": 117698, "epoch": 1418} {"train_loss": -22.245704650878906, "global_step": 117699, "epoch": 1418} {"train_loss": -22.258886337280273, "global_step": 117700, "epoch": 1418} {"train_loss": -22.210468292236328, "global_step": 117701, "epoch": 1418} {"train_loss": -21.91143798828125, "global_step": 117702, "epoch": 1418} {"train_loss": -22.38039207458496, "global_step": 117703, "epoch": 1418} {"train_loss": -22.282270431518555, "global_step": 117704, "epoch": 1418} {"train_loss": -22.356647491455078, "global_step": 117705, "epoch": 1418} {"train_loss": -22.296842575073242, "global_step": 117706, "epoch": 1418} {"train_loss": -22.537307739257812, "global_step": 117707, "epoch": 1418} {"train_loss": -22.370588302612305, "global_step": 117708, "epoch": 1418} {"train_loss": -22.139345169067383, "global_step": 117709, "epoch": 1418} {"train_loss": -22.387470245361328, "global_step": 117710, "epoch": 1418} {"train_loss": -22.692180633544922, "global_step": 117711, "epoch": 1418} {"train_loss": -22.305692672729492, "global_step": 117712, "epoch": 1418} {"train_loss": -22.525434494018555, "global_step": 117713, "epoch": 1418} {"train_loss": -22.163532257080078, "global_step": 117714, "epoch": 1418} {"train_loss": -22.414854049682617, "global_step": 117715, "epoch": 1418} {"train_loss": -22.30953598022461, "global_step": 117716, "epoch": 1418} {"train_loss": -22.595367431640625, "global_step": 117717, "epoch": 1418} {"train_loss": -22.392751693725586, "global_step": 117718, "epoch": 1418} {"train_loss": -22.5494327545166, "global_step": 117719, "epoch": 1418} {"train_loss": -22.66959571838379, "global_step": 117720, "epoch": 1418} {"train_loss": -22.50020408630371, "global_step": 117721, "epoch": 1418} {"train_loss": -22.37494659423828, "global_step": 117722, "epoch": 1418} {"train_loss": -22.613269805908203, "global_step": 117723, "epoch": 1418} {"train_loss": -22.290790557861328, "global_step": 117724, "epoch": 1418} {"train_loss": -22.502769470214844, "global_step": 117725, "epoch": 1418} {"train_loss": -22.449344635009766, "global_step": 117726, "epoch": 1418} {"train_loss": -22.581159591674805, "global_step": 117727, "epoch": 1418} {"train_loss": -22.342639923095703, "global_step": 117728, "epoch": 1418} {"train_loss": -22.654172897338867, "global_step": 117729, "epoch": 1418} {"train_loss": -22.501235961914062, "global_step": 117730, "epoch": 1418} {"train_loss": -22.594099044799805, "global_step": 117731, "epoch": 1418} {"train_loss": -22.62086296081543, "global_step": 117732, "epoch": 1418} {"train_loss": -22.691129684448242, "global_step": 117733, "epoch": 1418} {"train_loss": -22.524076461791992, "global_step": 117734, "epoch": 1418} {"train_loss": -22.572946548461914, "global_step": 117735, "epoch": 1418} {"train_loss": -22.216550827026367, "global_step": 117736, "epoch": 1418} {"train_loss": -22.664350509643555, "global_step": 117737, "epoch": 1418} {"train_loss": -22.6071834564209, "global_step": 117738, "epoch": 1418} {"train_loss": -22.30520248413086, "global_step": 117739, "epoch": 1418} {"train_loss": -22.143495559692383, "global_step": 117740, "epoch": 1418} {"train_loss": -22.692537307739258, "global_step": 117741, "epoch": 1418} {"train_loss": -22.616130828857422, "global_step": 117742, "epoch": 1418} {"train_loss": -22.707523345947266, "global_step": 117743, "epoch": 1418} {"train_loss": -22.628936767578125, "global_step": 117744, "epoch": 1418} {"train_loss": -22.341632843017578, "global_step": 117745, "epoch": 1418} {"train_loss": -22.528844833374023, "global_step": 117746, "epoch": 1418} {"train_loss": -22.5808048248291, "global_step": 117747, "epoch": 1418} {"train_loss": -22.642438888549805, "global_step": 117748, "epoch": 1418} {"train_loss": -22.58962059020996, "global_step": 117749, "epoch": 1418} {"train_loss": -22.40802574157715, "global_step": 117750, "epoch": 1418} {"train_loss": -22.194843292236328, "global_step": 117751, "epoch": 1418} {"train_loss": -22.315853118896484, "global_step": 117752, "epoch": 1418} {"train_loss": -22.216184616088867, "global_step": 117753, "epoch": 1418} {"train_loss": -22.344934463500977, "global_step": 117754, "epoch": 1418} {"train_loss": -22.607345581054688, "global_step": 117755, "epoch": 1418} {"train_loss": -22.60486602783203, "global_step": 117756, "epoch": 1418} {"train_loss": -22.249683380126953, "global_step": 117757, "epoch": 1418} {"train_loss": -22.74529457092285, "global_step": 117758, "epoch": 1418} {"train_loss": -22.205707550048828, "global_step": 117759, "epoch": 1418} {"train_loss": -22.420108795166016, "global_step": 117760, "epoch": 1418} {"train_loss": -22.416275024414062, "global_step": 117761, "epoch": 1418} {"train_loss": -22.25257110595703, "global_step": 117762, "epoch": 1418} {"train_loss": -22.25112533569336, "global_step": 117763, "epoch": 1418} {"train_loss": -22.29775047302246, "global_step": 117764, "epoch": 1418} {"train_loss": -22.18138885498047, "global_step": 117765, "epoch": 1418} {"train_loss": -22.379350662231445, "global_step": 117766, "epoch": 1418} {"train_loss": -22.749425888061523, "global_step": 117767, "epoch": 1418} {"train_loss": -22.5841121673584, "global_step": 117768, "epoch": 1418} {"train_loss": -22.665231704711914, "global_step": 117769, "epoch": 1418} {"train_loss": -22.441919326782227, "global_step": 117770, "epoch": 1418} {"train_loss": -22.287094116210938, "global_step": 117771, "epoch": 1418} {"train_loss": -22.40485954284668, "global_step": 117772, "epoch": 1418} {"train_loss": -22.470441818237305, "global_step": 117773, "epoch": 1418} {"train_loss": -22.276840209960938, "global_step": 117774, "epoch": 1418} {"train_loss": -22.319551467895508, "global_step": 117775, "epoch": 1418} {"train_loss": -22.40003937411021, "global_step": 117776, "epoch": 1418, "val_loss": 6183575.0} {"train_loss": -22.106916427612305, "global_step": 117777, "epoch": 1419} {"train_loss": -21.55690574645996, "global_step": 117778, "epoch": 1419} {"train_loss": -22.50998878479004, "global_step": 117779, "epoch": 1419} {"train_loss": -22.031957626342773, "global_step": 117780, "epoch": 1419} {"train_loss": -21.71157455444336, "global_step": 117781, "epoch": 1419} {"train_loss": -22.346311569213867, "global_step": 117782, "epoch": 1419} {"train_loss": -22.049375534057617, "global_step": 117783, "epoch": 1419} {"train_loss": -21.860471725463867, "global_step": 117784, "epoch": 1419} {"train_loss": -22.354013442993164, "global_step": 117785, "epoch": 1419} {"train_loss": -22.23163414001465, "global_step": 117786, "epoch": 1419} {"train_loss": -22.199899673461914, "global_step": 117787, "epoch": 1419} {"train_loss": -21.990110397338867, "global_step": 117788, "epoch": 1419} {"train_loss": -22.064943313598633, "global_step": 117789, "epoch": 1419} {"train_loss": -22.158300399780273, "global_step": 117790, "epoch": 1419} {"train_loss": -21.91446304321289, "global_step": 117791, "epoch": 1419} {"train_loss": -22.404508590698242, "global_step": 117792, "epoch": 1419} {"train_loss": -22.045190811157227, "global_step": 117793, "epoch": 1419} {"train_loss": -22.308326721191406, "global_step": 117794, "epoch": 1419} {"train_loss": -22.21748924255371, "global_step": 117795, "epoch": 1419} {"train_loss": -22.35904312133789, "global_step": 117796, "epoch": 1419} {"train_loss": -22.00213623046875, "global_step": 117797, "epoch": 1419} {"train_loss": -21.967931747436523, "global_step": 117798, "epoch": 1419} {"train_loss": -22.543054580688477, "global_step": 117799, "epoch": 1419} {"train_loss": -22.348806381225586, "global_step": 117800, "epoch": 1419} {"train_loss": -22.02201271057129, "global_step": 117801, "epoch": 1419} {"train_loss": -22.742069244384766, "global_step": 117802, "epoch": 1419} {"train_loss": -21.907907485961914, "global_step": 117803, "epoch": 1419} {"train_loss": -22.439359664916992, "global_step": 117804, "epoch": 1419} {"train_loss": -22.473451614379883, "global_step": 117805, "epoch": 1419} {"train_loss": -22.354467391967773, "global_step": 117806, "epoch": 1419} {"train_loss": -22.370962142944336, "global_step": 117807, "epoch": 1419} {"train_loss": -22.371931076049805, "global_step": 117808, "epoch": 1419} {"train_loss": -22.67911720275879, "global_step": 117809, "epoch": 1419} {"train_loss": -22.46245002746582, "global_step": 117810, "epoch": 1419} {"train_loss": -22.563724517822266, "global_step": 117811, "epoch": 1419} {"train_loss": -22.72210693359375, "global_step": 117812, "epoch": 1419} {"train_loss": -22.396554946899414, "global_step": 117813, "epoch": 1419} {"train_loss": -22.68916130065918, "global_step": 117814, "epoch": 1419} {"train_loss": -22.012975692749023, "global_step": 117815, "epoch": 1419} {"train_loss": -22.270185470581055, "global_step": 117816, "epoch": 1419} {"train_loss": -22.494922637939453, "global_step": 117817, "epoch": 1419} {"train_loss": -22.547475814819336, "global_step": 117818, "epoch": 1419} {"train_loss": -22.538503646850586, "global_step": 117819, "epoch": 1419} {"train_loss": -22.47104263305664, "global_step": 117820, "epoch": 1419} {"train_loss": -22.48227310180664, "global_step": 117821, "epoch": 1419} {"train_loss": -22.34596061706543, "global_step": 117822, "epoch": 1419} {"train_loss": -22.50567626953125, "global_step": 117823, "epoch": 1419} {"train_loss": -22.342748641967773, "global_step": 117824, "epoch": 1419} {"train_loss": -22.962295532226562, "global_step": 117825, "epoch": 1419} {"train_loss": -22.557798385620117, "global_step": 117826, "epoch": 1419} {"train_loss": -22.373266220092773, "global_step": 117827, "epoch": 1419} {"train_loss": -22.251419067382812, "global_step": 117828, "epoch": 1419} {"train_loss": -22.410341262817383, "global_step": 117829, "epoch": 1419} {"train_loss": -22.448959350585938, "global_step": 117830, "epoch": 1419} {"train_loss": -22.5169734954834, "global_step": 117831, "epoch": 1419} {"train_loss": -22.369876861572266, "global_step": 117832, "epoch": 1419} {"train_loss": -22.34609031677246, "global_step": 117833, "epoch": 1419} {"train_loss": -22.811155319213867, "global_step": 117834, "epoch": 1419} {"train_loss": -22.81694984436035, "global_step": 117835, "epoch": 1419} {"train_loss": -22.180524826049805, "global_step": 117836, "epoch": 1419} {"train_loss": -22.555952072143555, "global_step": 117837, "epoch": 1419} {"train_loss": -22.408193588256836, "global_step": 117838, "epoch": 1419} {"train_loss": -22.538002014160156, "global_step": 117839, "epoch": 1419} {"train_loss": -22.66493797302246, "global_step": 117840, "epoch": 1419} {"train_loss": -22.3074951171875, "global_step": 117841, "epoch": 1419} {"train_loss": -22.65043067932129, "global_step": 117842, "epoch": 1419} {"train_loss": -22.3268985748291, "global_step": 117843, "epoch": 1419} {"train_loss": -22.57124137878418, "global_step": 117844, "epoch": 1419} {"train_loss": -22.719371795654297, "global_step": 117845, "epoch": 1419} {"train_loss": -22.510576248168945, "global_step": 117846, "epoch": 1419} {"train_loss": -22.7562313079834, "global_step": 117847, "epoch": 1419} {"train_loss": -22.877988815307617, "global_step": 117848, "epoch": 1419} {"train_loss": -22.7034912109375, "global_step": 117849, "epoch": 1419} {"train_loss": -22.642005920410156, "global_step": 117850, "epoch": 1419} {"train_loss": -22.53431510925293, "global_step": 117851, "epoch": 1419} {"train_loss": -22.29781723022461, "global_step": 117852, "epoch": 1419} {"train_loss": -22.304983139038086, "global_step": 117853, "epoch": 1419} {"train_loss": -22.321388244628906, "global_step": 117854, "epoch": 1419} {"train_loss": -22.525537490844727, "global_step": 117855, "epoch": 1419} {"train_loss": -22.188730239868164, "global_step": 117856, "epoch": 1419} {"train_loss": -22.435997009277344, "global_step": 117857, "epoch": 1419} {"train_loss": -22.377540588378906, "global_step": 117858, "epoch": 1419} {"train_loss": -22.376498969204455, "global_step": 117859, "epoch": 1419, "val_loss": 6451635.0} {"train_loss": -21.842266082763672, "global_step": 117860, "epoch": 1420} {"train_loss": -22.234161376953125, "global_step": 117861, "epoch": 1420} {"train_loss": -22.16639518737793, "global_step": 117862, "epoch": 1420} {"train_loss": -22.392547607421875, "global_step": 117863, "epoch": 1420} {"train_loss": -22.0777645111084, "global_step": 117864, "epoch": 1420} {"train_loss": -22.068864822387695, "global_step": 117865, "epoch": 1420} {"train_loss": -22.32840347290039, "global_step": 117866, "epoch": 1420} {"train_loss": -22.12345314025879, "global_step": 117867, "epoch": 1420} {"train_loss": -22.368083953857422, "global_step": 117868, "epoch": 1420} {"train_loss": -22.051549911499023, "global_step": 117869, "epoch": 1420} {"train_loss": -22.50788688659668, "global_step": 117870, "epoch": 1420} {"train_loss": -21.947433471679688, "global_step": 117871, "epoch": 1420} {"train_loss": -22.47138786315918, "global_step": 117872, "epoch": 1420} {"train_loss": -22.06404685974121, "global_step": 117873, "epoch": 1420} {"train_loss": -22.52838134765625, "global_step": 117874, "epoch": 1420} {"train_loss": -22.104990005493164, "global_step": 117875, "epoch": 1420} {"train_loss": -22.162508010864258, "global_step": 117876, "epoch": 1420} {"train_loss": -22.189199447631836, "global_step": 117877, "epoch": 1420} {"train_loss": -22.22419548034668, "global_step": 117878, "epoch": 1420} {"train_loss": -22.237682342529297, "global_step": 117879, "epoch": 1420} {"train_loss": -22.612722396850586, "global_step": 117880, "epoch": 1420} {"train_loss": -22.145843505859375, "global_step": 117881, "epoch": 1420} {"train_loss": -22.444751739501953, "global_step": 117882, "epoch": 1420} {"train_loss": -22.058725357055664, "global_step": 117883, "epoch": 1420} {"train_loss": -22.460372924804688, "global_step": 117884, "epoch": 1420} {"train_loss": -22.22673988342285, "global_step": 117885, "epoch": 1420} {"train_loss": -22.368528366088867, "global_step": 117886, "epoch": 1420} {"train_loss": -22.422210693359375, "global_step": 117887, "epoch": 1420} {"train_loss": -22.721357345581055, "global_step": 117888, "epoch": 1420} {"train_loss": -22.31380271911621, "global_step": 117889, "epoch": 1420} {"train_loss": -22.77625274658203, "global_step": 117890, "epoch": 1420} {"train_loss": -22.420398712158203, "global_step": 117891, "epoch": 1420} {"train_loss": -22.302091598510742, "global_step": 117892, "epoch": 1420} {"train_loss": -22.57111358642578, "global_step": 117893, "epoch": 1420} {"train_loss": -22.224332809448242, "global_step": 117894, "epoch": 1420} {"train_loss": -22.456342697143555, "global_step": 117895, "epoch": 1420} {"train_loss": -22.818716049194336, "global_step": 117896, "epoch": 1420} {"train_loss": -22.35239601135254, "global_step": 117897, "epoch": 1420} {"train_loss": -22.76479721069336, "global_step": 117898, "epoch": 1420} {"train_loss": -22.320566177368164, "global_step": 117899, "epoch": 1420} {"train_loss": -22.824010848999023, "global_step": 117900, "epoch": 1420} {"train_loss": -22.40505027770996, "global_step": 117901, "epoch": 1420} {"train_loss": -22.33759880065918, "global_step": 117902, "epoch": 1420} {"train_loss": -22.45045280456543, "global_step": 117903, "epoch": 1420} {"train_loss": -22.317228317260742, "global_step": 117904, "epoch": 1420} {"train_loss": -22.693710327148438, "global_step": 117905, "epoch": 1420} {"train_loss": -22.767210006713867, "global_step": 117906, "epoch": 1420} {"train_loss": -22.38408660888672, "global_step": 117907, "epoch": 1420} {"train_loss": -22.53168487548828, "global_step": 117908, "epoch": 1420} {"train_loss": -22.61339569091797, "global_step": 117909, "epoch": 1420} {"train_loss": -22.576574325561523, "global_step": 117910, "epoch": 1420} {"train_loss": -21.967748641967773, "global_step": 117911, "epoch": 1420} {"train_loss": -22.09429931640625, "global_step": 117912, "epoch": 1420} {"train_loss": -22.35602378845215, "global_step": 117913, "epoch": 1420} {"train_loss": -22.214262008666992, "global_step": 117914, "epoch": 1420} {"train_loss": -22.457632064819336, "global_step": 117915, "epoch": 1420} {"train_loss": -22.43485450744629, "global_step": 117916, "epoch": 1420} {"train_loss": -22.296422958374023, "global_step": 117917, "epoch": 1420} {"train_loss": -22.365966796875, "global_step": 117918, "epoch": 1420} {"train_loss": -22.577117919921875, "global_step": 117919, "epoch": 1420} {"train_loss": -22.111095428466797, "global_step": 117920, "epoch": 1420} {"train_loss": -22.509355545043945, "global_step": 117921, "epoch": 1420} {"train_loss": -22.323720932006836, "global_step": 117922, "epoch": 1420} {"train_loss": -22.63920021057129, "global_step": 117923, "epoch": 1420} {"train_loss": -22.327667236328125, "global_step": 117924, "epoch": 1420} {"train_loss": -22.236970901489258, "global_step": 117925, "epoch": 1420} {"train_loss": -22.22538948059082, "global_step": 117926, "epoch": 1420} {"train_loss": -22.327199935913086, "global_step": 117927, "epoch": 1420} {"train_loss": -22.25506591796875, "global_step": 117928, "epoch": 1420} {"train_loss": -22.260770797729492, "global_step": 117929, "epoch": 1420} {"train_loss": -22.750595092773438, "global_step": 117930, "epoch": 1420} {"train_loss": -22.418243408203125, "global_step": 117931, "epoch": 1420} {"train_loss": -21.891584396362305, "global_step": 117932, "epoch": 1420} {"train_loss": -22.633010864257812, "global_step": 117933, "epoch": 1420} {"train_loss": -22.647876739501953, "global_step": 117934, "epoch": 1420} {"train_loss": -22.68726348876953, "global_step": 117935, "epoch": 1420} {"train_loss": -22.37493324279785, "global_step": 117936, "epoch": 1420} {"train_loss": -22.37408447265625, "global_step": 117937, "epoch": 1420} {"train_loss": -22.27748680114746, "global_step": 117938, "epoch": 1420} {"train_loss": -22.44809341430664, "global_step": 117939, "epoch": 1420} {"train_loss": -22.646238327026367, "global_step": 117940, "epoch": 1420} {"train_loss": -22.388286590576172, "global_step": 117941, "epoch": 1420} {"train_loss": -22.38173438842038, "global_step": 117942, "epoch": 1420, "val_loss": 6254151.5} {"train_loss": -22.194005966186523, "global_step": 117943, "epoch": 1421} {"train_loss": -22.01251220703125, "global_step": 117944, "epoch": 1421} {"train_loss": -22.329242706298828, "global_step": 117945, "epoch": 1421} {"train_loss": -22.54006004333496, "global_step": 117946, "epoch": 1421} {"train_loss": -22.334102630615234, "global_step": 117947, "epoch": 1421} {"train_loss": -22.25367546081543, "global_step": 117948, "epoch": 1421} {"train_loss": -22.267566680908203, "global_step": 117949, "epoch": 1421} {"train_loss": -22.590396881103516, "global_step": 117950, "epoch": 1421} {"train_loss": -22.445938110351562, "global_step": 117951, "epoch": 1421} {"train_loss": -22.633176803588867, "global_step": 117952, "epoch": 1421} {"train_loss": -22.34669303894043, "global_step": 117953, "epoch": 1421} {"train_loss": -22.74161148071289, "global_step": 117954, "epoch": 1421} {"train_loss": -22.25458526611328, "global_step": 117955, "epoch": 1421} {"train_loss": -22.451889038085938, "global_step": 117956, "epoch": 1421} {"train_loss": -22.543506622314453, "global_step": 117957, "epoch": 1421} {"train_loss": -22.506650924682617, "global_step": 117958, "epoch": 1421} {"train_loss": -22.628162384033203, "global_step": 117959, "epoch": 1421} {"train_loss": -22.63042640686035, "global_step": 117960, "epoch": 1421} {"train_loss": -22.916444778442383, "global_step": 117961, "epoch": 1421} {"train_loss": -22.5097599029541, "global_step": 117962, "epoch": 1421} {"train_loss": -22.276382446289062, "global_step": 117963, "epoch": 1421} {"train_loss": -22.584400177001953, "global_step": 117964, "epoch": 1421} {"train_loss": -22.690574645996094, "global_step": 117965, "epoch": 1421} {"train_loss": -22.7789249420166, "global_step": 117966, "epoch": 1421} {"train_loss": -22.50005531311035, "global_step": 117967, "epoch": 1421} {"train_loss": -22.296749114990234, "global_step": 117968, "epoch": 1421} {"train_loss": -22.52450180053711, "global_step": 117969, "epoch": 1421} {"train_loss": -22.348011016845703, "global_step": 117970, "epoch": 1421} {"train_loss": -22.12772560119629, "global_step": 117971, "epoch": 1421} {"train_loss": -22.08328628540039, "global_step": 117972, "epoch": 1421} {"train_loss": -22.497098922729492, "global_step": 117973, "epoch": 1421} {"train_loss": -22.525495529174805, "global_step": 117974, "epoch": 1421} {"train_loss": -22.513751983642578, "global_step": 117975, "epoch": 1421} {"train_loss": -22.13251495361328, "global_step": 117976, "epoch": 1421} {"train_loss": -22.281763076782227, "global_step": 117977, "epoch": 1421} {"train_loss": -22.683500289916992, "global_step": 117978, "epoch": 1421} {"train_loss": -22.312978744506836, "global_step": 117979, "epoch": 1421} {"train_loss": -22.482702255249023, "global_step": 117980, "epoch": 1421} {"train_loss": -22.199304580688477, "global_step": 117981, "epoch": 1421} {"train_loss": -22.47221565246582, "global_step": 117982, "epoch": 1421} {"train_loss": -22.539478302001953, "global_step": 117983, "epoch": 1421} {"train_loss": -21.896560668945312, "global_step": 117984, "epoch": 1421} {"train_loss": -22.06692886352539, "global_step": 117985, "epoch": 1421} {"train_loss": -22.358287811279297, "global_step": 117986, "epoch": 1421} {"train_loss": -22.18970489501953, "global_step": 117987, "epoch": 1421} {"train_loss": -22.467885971069336, "global_step": 117988, "epoch": 1421} {"train_loss": -22.645038604736328, "global_step": 117989, "epoch": 1421} {"train_loss": -22.594961166381836, "global_step": 117990, "epoch": 1421} {"train_loss": -22.775392532348633, "global_step": 117991, "epoch": 1421} {"train_loss": -22.537588119506836, "global_step": 117992, "epoch": 1421} {"train_loss": -22.34516716003418, "global_step": 117993, "epoch": 1421} {"train_loss": -22.216873168945312, "global_step": 117994, "epoch": 1421} {"train_loss": -22.615041732788086, "global_step": 117995, "epoch": 1421} {"train_loss": -23.13623046875, "global_step": 117996, "epoch": 1421} {"train_loss": -22.8726863861084, "global_step": 117997, "epoch": 1421} {"train_loss": -22.407352447509766, "global_step": 117998, "epoch": 1421} {"train_loss": -22.496213912963867, "global_step": 117999, "epoch": 1421} {"train_loss": -22.449298858642578, "global_step": 118000, "epoch": 1421} {"train_loss": -22.824756622314453, "global_step": 118001, "epoch": 1421} {"train_loss": -22.603322982788086, "global_step": 118002, "epoch": 1421} {"train_loss": -22.33200454711914, "global_step": 118003, "epoch": 1421} {"train_loss": -22.627355575561523, "global_step": 118004, "epoch": 1421} {"train_loss": -22.82658576965332, "global_step": 118005, "epoch": 1421} {"train_loss": -22.4908504486084, "global_step": 118006, "epoch": 1421} {"train_loss": -22.31501579284668, "global_step": 118007, "epoch": 1421} {"train_loss": -22.652639389038086, "global_step": 118008, "epoch": 1421} {"train_loss": -22.618741989135742, "global_step": 118009, "epoch": 1421} {"train_loss": -22.844192504882812, "global_step": 118010, "epoch": 1421} {"train_loss": -22.786396026611328, "global_step": 118011, "epoch": 1421} {"train_loss": -22.192712783813477, "global_step": 118012, "epoch": 1421} {"train_loss": -22.747861862182617, "global_step": 118013, "epoch": 1421} {"train_loss": -22.446735382080078, "global_step": 118014, "epoch": 1421} {"train_loss": -22.554901123046875, "global_step": 118015, "epoch": 1421} {"train_loss": -22.403255462646484, "global_step": 118016, "epoch": 1421} {"train_loss": -22.2192440032959, "global_step": 118017, "epoch": 1421} {"train_loss": -22.370941162109375, "global_step": 118018, "epoch": 1421} {"train_loss": -21.99973487854004, "global_step": 118019, "epoch": 1421} {"train_loss": -22.439376831054688, "global_step": 118020, "epoch": 1421} {"train_loss": -22.05930519104004, "global_step": 118021, "epoch": 1421} {"train_loss": -22.61520767211914, "global_step": 118022, "epoch": 1421} {"train_loss": -22.479320526123047, "global_step": 118023, "epoch": 1421} {"train_loss": -22.31308937072754, "global_step": 118024, "epoch": 1421} {"train_loss": -22.453719334430005, "global_step": 118025, "epoch": 1421, "val_loss": 6324631.0} {"train_loss": -21.833951950073242, "global_step": 118026, "epoch": 1422} {"train_loss": -22.250703811645508, "global_step": 118027, "epoch": 1422} {"train_loss": -22.22528076171875, "global_step": 118028, "epoch": 1422} {"train_loss": -21.880483627319336, "global_step": 118029, "epoch": 1422} {"train_loss": -22.012319564819336, "global_step": 118030, "epoch": 1422} {"train_loss": -22.385791778564453, "global_step": 118031, "epoch": 1422} {"train_loss": -21.816476821899414, "global_step": 118032, "epoch": 1422} {"train_loss": -21.98650550842285, "global_step": 118033, "epoch": 1422} {"train_loss": -22.34502410888672, "global_step": 118034, "epoch": 1422} {"train_loss": -22.067005157470703, "global_step": 118035, "epoch": 1422} {"train_loss": -22.357328414916992, "global_step": 118036, "epoch": 1422} {"train_loss": -22.042152404785156, "global_step": 118037, "epoch": 1422} {"train_loss": -22.13357925415039, "global_step": 118038, "epoch": 1422} {"train_loss": -22.4649600982666, "global_step": 118039, "epoch": 1422} {"train_loss": -22.111066818237305, "global_step": 118040, "epoch": 1422} {"train_loss": -22.322874069213867, "global_step": 118041, "epoch": 1422} {"train_loss": -22.391773223876953, "global_step": 118042, "epoch": 1422} {"train_loss": -22.535552978515625, "global_step": 118043, "epoch": 1422} {"train_loss": -22.35920524597168, "global_step": 118044, "epoch": 1422} {"train_loss": -22.18647575378418, "global_step": 118045, "epoch": 1422} {"train_loss": -22.297819137573242, "global_step": 118046, "epoch": 1422} {"train_loss": -22.458648681640625, "global_step": 118047, "epoch": 1422} {"train_loss": -22.34097671508789, "global_step": 118048, "epoch": 1422} {"train_loss": -21.87810707092285, "global_step": 118049, "epoch": 1422} {"train_loss": -22.466707229614258, "global_step": 118050, "epoch": 1422} {"train_loss": -22.455642700195312, "global_step": 118051, "epoch": 1422} {"train_loss": -22.780256271362305, "global_step": 118052, "epoch": 1422} {"train_loss": -22.479291915893555, "global_step": 118053, "epoch": 1422} {"train_loss": -22.592519760131836, "global_step": 118054, "epoch": 1422} {"train_loss": -22.4360408782959, "global_step": 118055, "epoch": 1422} {"train_loss": -22.370487213134766, "global_step": 118056, "epoch": 1422} {"train_loss": -22.408750534057617, "global_step": 118057, "epoch": 1422} {"train_loss": -22.51531219482422, "global_step": 118058, "epoch": 1422} {"train_loss": -22.13885498046875, "global_step": 118059, "epoch": 1422} {"train_loss": -22.299388885498047, "global_step": 118060, "epoch": 1422} {"train_loss": -22.522842407226562, "global_step": 118061, "epoch": 1422} {"train_loss": -22.603469848632812, "global_step": 118062, "epoch": 1422} {"train_loss": -22.435754776000977, "global_step": 118063, "epoch": 1422} {"train_loss": -22.611106872558594, "global_step": 118064, "epoch": 1422} {"train_loss": -22.433609008789062, "global_step": 118065, "epoch": 1422} {"train_loss": -22.67421531677246, "global_step": 118066, "epoch": 1422} {"train_loss": -22.559289932250977, "global_step": 118067, "epoch": 1422} {"train_loss": -22.094451904296875, "global_step": 118068, "epoch": 1422} {"train_loss": -22.4207706451416, "global_step": 118069, "epoch": 1422} {"train_loss": -22.602636337280273, "global_step": 118070, "epoch": 1422} {"train_loss": -22.82938003540039, "global_step": 118071, "epoch": 1422} {"train_loss": -22.174901962280273, "global_step": 118072, "epoch": 1422} {"train_loss": -22.832836151123047, "global_step": 118073, "epoch": 1422} {"train_loss": -22.52387046813965, "global_step": 118074, "epoch": 1422} {"train_loss": -22.521320343017578, "global_step": 118075, "epoch": 1422} {"train_loss": -22.367923736572266, "global_step": 118076, "epoch": 1422} {"train_loss": -22.268836975097656, "global_step": 118077, "epoch": 1422} {"train_loss": -22.56724739074707, "global_step": 118078, "epoch": 1422} {"train_loss": -22.621606826782227, "global_step": 118079, "epoch": 1422} {"train_loss": -22.682979583740234, "global_step": 118080, "epoch": 1422} {"train_loss": -22.42536163330078, "global_step": 118081, "epoch": 1422} {"train_loss": -22.352872848510742, "global_step": 118082, "epoch": 1422} {"train_loss": -22.8131103515625, "global_step": 118083, "epoch": 1422} {"train_loss": -22.249053955078125, "global_step": 118084, "epoch": 1422} {"train_loss": -22.566686630249023, "global_step": 118085, "epoch": 1422} {"train_loss": -22.621938705444336, "global_step": 118086, "epoch": 1422} {"train_loss": -22.77976417541504, "global_step": 118087, "epoch": 1422} {"train_loss": -22.722698211669922, "global_step": 118088, "epoch": 1422} {"train_loss": -22.51472282409668, "global_step": 118089, "epoch": 1422} {"train_loss": -22.2943115234375, "global_step": 118090, "epoch": 1422} {"train_loss": -22.662538528442383, "global_step": 118091, "epoch": 1422} {"train_loss": -22.60216522216797, "global_step": 118092, "epoch": 1422} {"train_loss": -22.478925704956055, "global_step": 118093, "epoch": 1422} {"train_loss": -22.408313751220703, "global_step": 118094, "epoch": 1422} {"train_loss": -22.40304183959961, "global_step": 118095, "epoch": 1422} {"train_loss": -22.620361328125, "global_step": 118096, "epoch": 1422} {"train_loss": -22.588842391967773, "global_step": 118097, "epoch": 1422} {"train_loss": -22.22415542602539, "global_step": 118098, "epoch": 1422} {"train_loss": -22.585784912109375, "global_step": 118099, "epoch": 1422} {"train_loss": -22.428247451782227, "global_step": 118100, "epoch": 1422} {"train_loss": -22.71266746520996, "global_step": 118101, "epoch": 1422} {"train_loss": -22.417142868041992, "global_step": 118102, "epoch": 1422} {"train_loss": -23.031665802001953, "global_step": 118103, "epoch": 1422} {"train_loss": -22.45381736755371, "global_step": 118104, "epoch": 1422} {"train_loss": -22.17935562133789, "global_step": 118105, "epoch": 1422} {"train_loss": -22.320798873901367, "global_step": 118106, "epoch": 1422} {"train_loss": -22.477235794067383, "global_step": 118107, "epoch": 1422} {"train_loss": -22.413330790508223, "global_step": 118108, "epoch": 1422, "val_loss": 6192439.0} {"train_loss": -21.313426971435547, "global_step": 118109, "epoch": 1423} {"train_loss": -21.423248291015625, "global_step": 118110, "epoch": 1423} {"train_loss": -21.361040115356445, "global_step": 118111, "epoch": 1423} {"train_loss": -21.529987335205078, "global_step": 118112, "epoch": 1423} {"train_loss": -21.94842529296875, "global_step": 118113, "epoch": 1423} {"train_loss": -21.63338279724121, "global_step": 118114, "epoch": 1423} {"train_loss": -21.611989974975586, "global_step": 118115, "epoch": 1423} {"train_loss": -22.036113739013672, "global_step": 118116, "epoch": 1423} {"train_loss": -22.09760856628418, "global_step": 118117, "epoch": 1423} {"train_loss": -21.855607986450195, "global_step": 118118, "epoch": 1423} {"train_loss": -21.99765396118164, "global_step": 118119, "epoch": 1423} {"train_loss": -21.915088653564453, "global_step": 118120, "epoch": 1423} {"train_loss": -22.00734519958496, "global_step": 118121, "epoch": 1423} {"train_loss": -22.21193504333496, "global_step": 118122, "epoch": 1423} {"train_loss": -22.748666763305664, "global_step": 118123, "epoch": 1423} {"train_loss": -22.007583618164062, "global_step": 118124, "epoch": 1423} {"train_loss": -22.151533126831055, "global_step": 118125, "epoch": 1423} {"train_loss": -22.507822036743164, "global_step": 118126, "epoch": 1423} {"train_loss": -22.09701156616211, "global_step": 118127, "epoch": 1423} {"train_loss": -22.022151947021484, "global_step": 118128, "epoch": 1423} {"train_loss": -22.67573356628418, "global_step": 118129, "epoch": 1423} {"train_loss": -22.07473373413086, "global_step": 118130, "epoch": 1423} {"train_loss": -22.237842559814453, "global_step": 118131, "epoch": 1423} {"train_loss": -22.569087982177734, "global_step": 118132, "epoch": 1423} {"train_loss": -22.44175148010254, "global_step": 118133, "epoch": 1423} {"train_loss": -22.412450790405273, "global_step": 118134, "epoch": 1423} {"train_loss": -22.150609970092773, "global_step": 118135, "epoch": 1423} {"train_loss": -22.270877838134766, "global_step": 118136, "epoch": 1423} {"train_loss": -22.451675415039062, "global_step": 118137, "epoch": 1423} {"train_loss": -22.488157272338867, "global_step": 118138, "epoch": 1423} {"train_loss": -22.946590423583984, "global_step": 118139, "epoch": 1423} {"train_loss": -21.964204788208008, "global_step": 118140, "epoch": 1423} {"train_loss": -22.49115562438965, "global_step": 118141, "epoch": 1423} {"train_loss": -22.51570701599121, "global_step": 118142, "epoch": 1423} {"train_loss": -22.50140953063965, "global_step": 118143, "epoch": 1423} {"train_loss": -22.35457420349121, "global_step": 118144, "epoch": 1423} {"train_loss": -22.50225067138672, "global_step": 118145, "epoch": 1423} {"train_loss": -22.235454559326172, "global_step": 118146, "epoch": 1423} {"train_loss": -22.310718536376953, "global_step": 118147, "epoch": 1423} {"train_loss": -22.163043975830078, "global_step": 118148, "epoch": 1423} {"train_loss": -22.594472885131836, "global_step": 118149, "epoch": 1423} {"train_loss": -22.16585350036621, "global_step": 118150, "epoch": 1423} {"train_loss": -22.51393699645996, "global_step": 118151, "epoch": 1423} {"train_loss": -23.11264991760254, "global_step": 118152, "epoch": 1423} {"train_loss": -22.71772003173828, "global_step": 118153, "epoch": 1423} {"train_loss": -22.492746353149414, "global_step": 118154, "epoch": 1423} {"train_loss": -22.50433349609375, "global_step": 118155, "epoch": 1423} {"train_loss": -22.753787994384766, "global_step": 118156, "epoch": 1423} {"train_loss": -22.56924819946289, "global_step": 118157, "epoch": 1423} {"train_loss": -22.727142333984375, "global_step": 118158, "epoch": 1423} {"train_loss": -22.488025665283203, "global_step": 118159, "epoch": 1423} {"train_loss": -22.57533073425293, "global_step": 118160, "epoch": 1423} {"train_loss": -22.443218231201172, "global_step": 118161, "epoch": 1423} {"train_loss": -22.451425552368164, "global_step": 118162, "epoch": 1423} {"train_loss": -22.455442428588867, "global_step": 118163, "epoch": 1423} {"train_loss": -22.227571487426758, "global_step": 118164, "epoch": 1423} {"train_loss": -22.327878952026367, "global_step": 118165, "epoch": 1423} {"train_loss": -22.528959274291992, "global_step": 118166, "epoch": 1423} {"train_loss": -22.308883666992188, "global_step": 118167, "epoch": 1423} {"train_loss": -22.499279022216797, "global_step": 118168, "epoch": 1423} {"train_loss": -22.700042724609375, "global_step": 118169, "epoch": 1423} {"train_loss": -22.42421531677246, "global_step": 118170, "epoch": 1423} {"train_loss": -22.7486515045166, "global_step": 118171, "epoch": 1423} {"train_loss": -22.419883728027344, "global_step": 118172, "epoch": 1423} {"train_loss": -22.59716033935547, "global_step": 118173, "epoch": 1423} {"train_loss": -22.867698669433594, "global_step": 118174, "epoch": 1423} {"train_loss": -22.926565170288086, "global_step": 118175, "epoch": 1423} {"train_loss": -21.967864990234375, "global_step": 118176, "epoch": 1423} {"train_loss": -22.740568161010742, "global_step": 118177, "epoch": 1423} {"train_loss": -22.513103485107422, "global_step": 118178, "epoch": 1423} {"train_loss": -22.521041870117188, "global_step": 118179, "epoch": 1423} {"train_loss": -22.47125816345215, "global_step": 118180, "epoch": 1423} {"train_loss": -22.376005172729492, "global_step": 118181, "epoch": 1423} {"train_loss": -22.45833396911621, "global_step": 118182, "epoch": 1423} {"train_loss": -22.951152801513672, "global_step": 118183, "epoch": 1423} {"train_loss": -22.541711807250977, "global_step": 118184, "epoch": 1423} {"train_loss": -22.468473434448242, "global_step": 118185, "epoch": 1423} {"train_loss": -22.68024253845215, "global_step": 118186, "epoch": 1423} {"train_loss": -22.381717681884766, "global_step": 118187, "epoch": 1423} {"train_loss": -22.369714736938477, "global_step": 118188, "epoch": 1423} {"train_loss": -22.882421493530273, "global_step": 118189, "epoch": 1423} {"train_loss": -22.2226505279541, "global_step": 118190, "epoch": 1423} {"train_loss": -22.346368973513684, "global_step": 118191, "epoch": 1423, "val_loss": 6171805.0} {"train_loss": -22.235586166381836, "global_step": 118192, "epoch": 1424} {"train_loss": -22.420392990112305, "global_step": 118193, "epoch": 1424} {"train_loss": -22.459716796875, "global_step": 118194, "epoch": 1424} {"train_loss": -22.199970245361328, "global_step": 118195, "epoch": 1424} {"train_loss": -22.1771240234375, "global_step": 118196, "epoch": 1424} {"train_loss": -22.589115142822266, "global_step": 118197, "epoch": 1424} {"train_loss": -22.37715721130371, "global_step": 118198, "epoch": 1424} {"train_loss": -22.697324752807617, "global_step": 118199, "epoch": 1424} {"train_loss": -22.43903350830078, "global_step": 118200, "epoch": 1424} {"train_loss": -22.486553192138672, "global_step": 118201, "epoch": 1424} {"train_loss": -22.258621215820312, "global_step": 118202, "epoch": 1424} {"train_loss": -22.531618118286133, "global_step": 118203, "epoch": 1424} {"train_loss": -22.229278564453125, "global_step": 118204, "epoch": 1424} {"train_loss": -22.50324249267578, "global_step": 118205, "epoch": 1424} {"train_loss": -22.507726669311523, "global_step": 118206, "epoch": 1424} {"train_loss": -22.321334838867188, "global_step": 118207, "epoch": 1424} {"train_loss": -22.291656494140625, "global_step": 118208, "epoch": 1424} {"train_loss": -22.62394142150879, "global_step": 118209, "epoch": 1424} {"train_loss": -22.557296752929688, "global_step": 118210, "epoch": 1424} {"train_loss": -22.203378677368164, "global_step": 118211, "epoch": 1424} {"train_loss": -22.357147216796875, "global_step": 118212, "epoch": 1424} {"train_loss": -22.75032615661621, "global_step": 118213, "epoch": 1424} {"train_loss": -22.55174446105957, "global_step": 118214, "epoch": 1424} {"train_loss": -22.26058006286621, "global_step": 118215, "epoch": 1424} {"train_loss": -22.596973419189453, "global_step": 118216, "epoch": 1424} {"train_loss": -21.766590118408203, "global_step": 118217, "epoch": 1424} {"train_loss": -22.466527938842773, "global_step": 118218, "epoch": 1424} {"train_loss": -22.370914459228516, "global_step": 118219, "epoch": 1424} {"train_loss": -22.743925094604492, "global_step": 118220, "epoch": 1424} {"train_loss": -22.715078353881836, "global_step": 118221, "epoch": 1424} {"train_loss": -22.746824264526367, "global_step": 118222, "epoch": 1424} {"train_loss": -22.163572311401367, "global_step": 118223, "epoch": 1424} {"train_loss": -22.844528198242188, "global_step": 118224, "epoch": 1424} {"train_loss": -22.514450073242188, "global_step": 118225, "epoch": 1424} {"train_loss": -22.520950317382812, "global_step": 118226, "epoch": 1424} {"train_loss": -22.453384399414062, "global_step": 118227, "epoch": 1424} {"train_loss": -22.35561180114746, "global_step": 118228, "epoch": 1424} {"train_loss": -22.20139503479004, "global_step": 118229, "epoch": 1424} {"train_loss": -22.54767608642578, "global_step": 118230, "epoch": 1424} {"train_loss": -22.79425048828125, "global_step": 118231, "epoch": 1424} {"train_loss": -22.61396598815918, "global_step": 118232, "epoch": 1424} {"train_loss": -22.443639755249023, "global_step": 118233, "epoch": 1424} {"train_loss": -22.720609664916992, "global_step": 118234, "epoch": 1424} {"train_loss": -22.42421531677246, "global_step": 118235, "epoch": 1424} {"train_loss": -22.524412155151367, "global_step": 118236, "epoch": 1424} {"train_loss": -22.720550537109375, "global_step": 118237, "epoch": 1424} {"train_loss": -22.37728500366211, "global_step": 118238, "epoch": 1424} {"train_loss": -22.502859115600586, "global_step": 118239, "epoch": 1424} {"train_loss": -22.393293380737305, "global_step": 118240, "epoch": 1424} {"train_loss": -22.7324161529541, "global_step": 118241, "epoch": 1424} {"train_loss": -22.3056583404541, "global_step": 118242, "epoch": 1424} {"train_loss": -22.339147567749023, "global_step": 118243, "epoch": 1424} {"train_loss": -22.50969886779785, "global_step": 118244, "epoch": 1424} {"train_loss": -22.67441177368164, "global_step": 118245, "epoch": 1424} {"train_loss": -22.448726654052734, "global_step": 118246, "epoch": 1424} {"train_loss": -22.616857528686523, "global_step": 118247, "epoch": 1424} {"train_loss": -22.91817283630371, "global_step": 118248, "epoch": 1424} {"train_loss": -22.145170211791992, "global_step": 118249, "epoch": 1424} {"train_loss": -22.378488540649414, "global_step": 118250, "epoch": 1424} {"train_loss": -22.609663009643555, "global_step": 118251, "epoch": 1424} {"train_loss": -22.65449333190918, "global_step": 118252, "epoch": 1424} {"train_loss": -22.518692016601562, "global_step": 118253, "epoch": 1424} {"train_loss": -22.564529418945312, "global_step": 118254, "epoch": 1424} {"train_loss": -22.465444564819336, "global_step": 118255, "epoch": 1424} {"train_loss": -22.87279510498047, "global_step": 118256, "epoch": 1424} {"train_loss": -22.404956817626953, "global_step": 118257, "epoch": 1424} {"train_loss": -22.46443748474121, "global_step": 118258, "epoch": 1424} {"train_loss": -22.35831642150879, "global_step": 118259, "epoch": 1424} {"train_loss": -22.8376522064209, "global_step": 118260, "epoch": 1424} {"train_loss": -22.335119247436523, "global_step": 118261, "epoch": 1424} {"train_loss": -22.561330795288086, "global_step": 118262, "epoch": 1424} {"train_loss": -22.356496810913086, "global_step": 118263, "epoch": 1424} {"train_loss": -22.167150497436523, "global_step": 118264, "epoch": 1424} {"train_loss": -22.618947982788086, "global_step": 118265, "epoch": 1424} {"train_loss": -22.618192672729492, "global_step": 118266, "epoch": 1424} {"train_loss": -22.355497360229492, "global_step": 118267, "epoch": 1424} {"train_loss": -22.260089874267578, "global_step": 118268, "epoch": 1424} {"train_loss": -22.283117294311523, "global_step": 118269, "epoch": 1424} {"train_loss": -22.36997413635254, "global_step": 118270, "epoch": 1424} {"train_loss": -22.35855484008789, "global_step": 118271, "epoch": 1424} {"train_loss": -22.677349090576172, "global_step": 118272, "epoch": 1424} {"train_loss": -22.33832550048828, "global_step": 118273, "epoch": 1424} {"train_loss": -22.472426127238446, "global_step": 118274, "epoch": 1424, "val_loss": 6299118.0} {"train_loss": -22.16409683227539, "global_step": 118275, "epoch": 1425} {"train_loss": -22.069150924682617, "global_step": 118276, "epoch": 1425} {"train_loss": -22.112747192382812, "global_step": 118277, "epoch": 1425} {"train_loss": -22.41042137145996, "global_step": 118278, "epoch": 1425} {"train_loss": -22.178762435913086, "global_step": 118279, "epoch": 1425} {"train_loss": -22.285053253173828, "global_step": 118280, "epoch": 1425} {"train_loss": -22.2749080657959, "global_step": 118281, "epoch": 1425} {"train_loss": -22.205032348632812, "global_step": 118282, "epoch": 1425} {"train_loss": -22.37294578552246, "global_step": 118283, "epoch": 1425} {"train_loss": -22.435909271240234, "global_step": 118284, "epoch": 1425} {"train_loss": -22.12269401550293, "global_step": 118285, "epoch": 1425} {"train_loss": -22.633346557617188, "global_step": 118286, "epoch": 1425} {"train_loss": -22.419469833374023, "global_step": 118287, "epoch": 1425} {"train_loss": -22.78203773498535, "global_step": 118288, "epoch": 1425} {"train_loss": -22.24958610534668, "global_step": 118289, "epoch": 1425} {"train_loss": -22.439626693725586, "global_step": 118290, "epoch": 1425} {"train_loss": -22.37484359741211, "global_step": 118291, "epoch": 1425} {"train_loss": -22.195768356323242, "global_step": 118292, "epoch": 1425} {"train_loss": -22.67867088317871, "global_step": 118293, "epoch": 1425} {"train_loss": -22.29125213623047, "global_step": 118294, "epoch": 1425} {"train_loss": -22.492053985595703, "global_step": 118295, "epoch": 1425} {"train_loss": -22.488569259643555, "global_step": 118296, "epoch": 1425} {"train_loss": -22.440641403198242, "global_step": 118297, "epoch": 1425} {"train_loss": -22.53338623046875, "global_step": 118298, "epoch": 1425} {"train_loss": -22.698984146118164, "global_step": 118299, "epoch": 1425} {"train_loss": -22.511804580688477, "global_step": 118300, "epoch": 1425} {"train_loss": -22.57533836364746, "global_step": 118301, "epoch": 1425} {"train_loss": -22.423629760742188, "global_step": 118302, "epoch": 1425} {"train_loss": -22.58021354675293, "global_step": 118303, "epoch": 1425} {"train_loss": -22.217580795288086, "global_step": 118304, "epoch": 1425} {"train_loss": -22.47847557067871, "global_step": 118305, "epoch": 1425} {"train_loss": -22.162885665893555, "global_step": 118306, "epoch": 1425} {"train_loss": -22.304391860961914, "global_step": 118307, "epoch": 1425} {"train_loss": -22.599340438842773, "global_step": 118308, "epoch": 1425} {"train_loss": -22.954267501831055, "global_step": 118309, "epoch": 1425} {"train_loss": -22.258214950561523, "global_step": 118310, "epoch": 1425} {"train_loss": -22.76163673400879, "global_step": 118311, "epoch": 1425} {"train_loss": -22.17609214782715, "global_step": 118312, "epoch": 1425} {"train_loss": -22.470733642578125, "global_step": 118313, "epoch": 1425} {"train_loss": -22.334707260131836, "global_step": 118314, "epoch": 1425} {"train_loss": -22.571945190429688, "global_step": 118315, "epoch": 1425} {"train_loss": -22.255483627319336, "global_step": 118316, "epoch": 1425} {"train_loss": -22.52288055419922, "global_step": 118317, "epoch": 1425} {"train_loss": -22.150768280029297, "global_step": 118318, "epoch": 1425} {"train_loss": -22.591087341308594, "global_step": 118319, "epoch": 1425} {"train_loss": -22.24505043029785, "global_step": 118320, "epoch": 1425} {"train_loss": -22.690269470214844, "global_step": 118321, "epoch": 1425} {"train_loss": -22.241987228393555, "global_step": 118322, "epoch": 1425} {"train_loss": -22.392759323120117, "global_step": 118323, "epoch": 1425} {"train_loss": -22.624479293823242, "global_step": 118324, "epoch": 1425} {"train_loss": -22.309152603149414, "global_step": 118325, "epoch": 1425} {"train_loss": -22.35162925720215, "global_step": 118326, "epoch": 1425} {"train_loss": -22.353994369506836, "global_step": 118327, "epoch": 1425} {"train_loss": -22.678211212158203, "global_step": 118328, "epoch": 1425} {"train_loss": -22.300682067871094, "global_step": 118329, "epoch": 1425} {"train_loss": -22.513031005859375, "global_step": 118330, "epoch": 1425} {"train_loss": -22.471155166625977, "global_step": 118331, "epoch": 1425} {"train_loss": -22.151155471801758, "global_step": 118332, "epoch": 1425} {"train_loss": -22.078033447265625, "global_step": 118333, "epoch": 1425} {"train_loss": -22.29572296142578, "global_step": 118334, "epoch": 1425} {"train_loss": -22.015777587890625, "global_step": 118335, "epoch": 1425} {"train_loss": -22.79136085510254, "global_step": 118336, "epoch": 1425} {"train_loss": -22.201065063476562, "global_step": 118337, "epoch": 1425} {"train_loss": -22.567102432250977, "global_step": 118338, "epoch": 1425} {"train_loss": -22.551239013671875, "global_step": 118339, "epoch": 1425} {"train_loss": -22.86629295349121, "global_step": 118340, "epoch": 1425} {"train_loss": -22.676549911499023, "global_step": 118341, "epoch": 1425} {"train_loss": -22.24799156188965, "global_step": 118342, "epoch": 1425} {"train_loss": -22.607223510742188, "global_step": 118343, "epoch": 1425} {"train_loss": -22.565093994140625, "global_step": 118344, "epoch": 1425} {"train_loss": -22.459552764892578, "global_step": 118345, "epoch": 1425} {"train_loss": -22.94860076904297, "global_step": 118346, "epoch": 1425} {"train_loss": -22.551177978515625, "global_step": 118347, "epoch": 1425} {"train_loss": -22.55854606628418, "global_step": 118348, "epoch": 1425} {"train_loss": -22.382898330688477, "global_step": 118349, "epoch": 1425} {"train_loss": -22.72523307800293, "global_step": 118350, "epoch": 1425} {"train_loss": -22.91029930114746, "global_step": 118351, "epoch": 1425} {"train_loss": -22.372514724731445, "global_step": 118352, "epoch": 1425} {"train_loss": -22.495548248291016, "global_step": 118353, "epoch": 1425} {"train_loss": -22.39924430847168, "global_step": 118354, "epoch": 1425} {"train_loss": -22.700475692749023, "global_step": 118355, "epoch": 1425} {"train_loss": -22.07906150817871, "global_step": 118356, "epoch": 1425} {"train_loss": -22.457621425031178, "global_step": 118357, "epoch": 1425, "val_loss": 6205161.5} {"train_loss": -22.236093521118164, "global_step": 118358, "epoch": 1426} {"train_loss": -22.31719207763672, "global_step": 118359, "epoch": 1426} {"train_loss": -22.34687614440918, "global_step": 118360, "epoch": 1426} {"train_loss": -22.399127960205078, "global_step": 118361, "epoch": 1426} {"train_loss": -22.286453247070312, "global_step": 118362, "epoch": 1426} {"train_loss": -22.08905601501465, "global_step": 118363, "epoch": 1426} {"train_loss": -22.40582847595215, "global_step": 118364, "epoch": 1426} {"train_loss": -22.177026748657227, "global_step": 118365, "epoch": 1426} {"train_loss": -21.989656448364258, "global_step": 118366, "epoch": 1426} {"train_loss": -22.046192169189453, "global_step": 118367, "epoch": 1426} {"train_loss": -22.200729370117188, "global_step": 118368, "epoch": 1426} {"train_loss": -22.51894187927246, "global_step": 118369, "epoch": 1426} {"train_loss": -22.53333854675293, "global_step": 118370, "epoch": 1426} {"train_loss": -22.629852294921875, "global_step": 118371, "epoch": 1426} {"train_loss": -22.91737174987793, "global_step": 118372, "epoch": 1426} {"train_loss": -22.435806274414062, "global_step": 118373, "epoch": 1426} {"train_loss": -22.43842124938965, "global_step": 118374, "epoch": 1426} {"train_loss": -22.647138595581055, "global_step": 118375, "epoch": 1426} {"train_loss": -22.62360191345215, "global_step": 118376, "epoch": 1426} {"train_loss": -22.411855697631836, "global_step": 118377, "epoch": 1426} {"train_loss": -22.442480087280273, "global_step": 118378, "epoch": 1426} {"train_loss": -22.55280303955078, "global_step": 118379, "epoch": 1426} {"train_loss": -22.402711868286133, "global_step": 118380, "epoch": 1426} {"train_loss": -22.237842559814453, "global_step": 118381, "epoch": 1426} {"train_loss": -22.43903350830078, "global_step": 118382, "epoch": 1426} {"train_loss": -22.23389434814453, "global_step": 118383, "epoch": 1426} {"train_loss": -22.306692123413086, "global_step": 118384, "epoch": 1426} {"train_loss": -22.557836532592773, "global_step": 118385, "epoch": 1426} {"train_loss": -22.29038429260254, "global_step": 118386, "epoch": 1426} {"train_loss": -22.54338264465332, "global_step": 118387, "epoch": 1426} {"train_loss": -22.714262008666992, "global_step": 118388, "epoch": 1426} {"train_loss": -22.416431427001953, "global_step": 118389, "epoch": 1426} {"train_loss": -22.77560806274414, "global_step": 118390, "epoch": 1426} {"train_loss": -22.8648738861084, "global_step": 118391, "epoch": 1426} {"train_loss": -22.269559860229492, "global_step": 118392, "epoch": 1426} {"train_loss": -22.43376350402832, "global_step": 118393, "epoch": 1426} {"train_loss": -22.56696891784668, "global_step": 118394, "epoch": 1426} {"train_loss": -22.507291793823242, "global_step": 118395, "epoch": 1426} {"train_loss": -22.44663429260254, "global_step": 118396, "epoch": 1426} {"train_loss": -22.45155143737793, "global_step": 118397, "epoch": 1426} {"train_loss": -23.06959342956543, "global_step": 118398, "epoch": 1426} {"train_loss": -22.622314453125, "global_step": 118399, "epoch": 1426} {"train_loss": -22.1922664642334, "global_step": 118400, "epoch": 1426} {"train_loss": -22.286710739135742, "global_step": 118401, "epoch": 1426} {"train_loss": -22.1419734954834, "global_step": 118402, "epoch": 1426} {"train_loss": -22.431636810302734, "global_step": 118403, "epoch": 1426} {"train_loss": -22.438785552978516, "global_step": 118404, "epoch": 1426} {"train_loss": -22.12650489807129, "global_step": 118405, "epoch": 1426} {"train_loss": -22.08957290649414, "global_step": 118406, "epoch": 1426} {"train_loss": -22.222644805908203, "global_step": 118407, "epoch": 1426} {"train_loss": -22.293710708618164, "global_step": 118408, "epoch": 1426} {"train_loss": -22.84665870666504, "global_step": 118409, "epoch": 1426} {"train_loss": -22.41224479675293, "global_step": 118410, "epoch": 1426} {"train_loss": -22.22620964050293, "global_step": 118411, "epoch": 1426} {"train_loss": -22.33133888244629, "global_step": 118412, "epoch": 1426} {"train_loss": -22.24186897277832, "global_step": 118413, "epoch": 1426} {"train_loss": -22.83955192565918, "global_step": 118414, "epoch": 1426} {"train_loss": -22.210294723510742, "global_step": 118415, "epoch": 1426} {"train_loss": -22.2911319732666, "global_step": 118416, "epoch": 1426} {"train_loss": -22.60523796081543, "global_step": 118417, "epoch": 1426} {"train_loss": -22.66458511352539, "global_step": 118418, "epoch": 1426} {"train_loss": -22.660018920898438, "global_step": 118419, "epoch": 1426} {"train_loss": -22.459014892578125, "global_step": 118420, "epoch": 1426} {"train_loss": -22.447824478149414, "global_step": 118421, "epoch": 1426} {"train_loss": -22.7766170501709, "global_step": 118422, "epoch": 1426} {"train_loss": -22.46626853942871, "global_step": 118423, "epoch": 1426} {"train_loss": -22.422225952148438, "global_step": 118424, "epoch": 1426} {"train_loss": -22.36600685119629, "global_step": 118425, "epoch": 1426} {"train_loss": -22.817121505737305, "global_step": 118426, "epoch": 1426} {"train_loss": -22.592390060424805, "global_step": 118427, "epoch": 1426} {"train_loss": -22.587020874023438, "global_step": 118428, "epoch": 1426} {"train_loss": -22.49496841430664, "global_step": 118429, "epoch": 1426} {"train_loss": -22.581151962280273, "global_step": 118430, "epoch": 1426} {"train_loss": -22.163806915283203, "global_step": 118431, "epoch": 1426} {"train_loss": -22.466293334960938, "global_step": 118432, "epoch": 1426} {"train_loss": -22.264537811279297, "global_step": 118433, "epoch": 1426} {"train_loss": -21.888338088989258, "global_step": 118434, "epoch": 1426} {"train_loss": -22.713911056518555, "global_step": 118435, "epoch": 1426} {"train_loss": -22.55103874206543, "global_step": 118436, "epoch": 1426} {"train_loss": -22.17093276977539, "global_step": 118437, "epoch": 1426} {"train_loss": -22.4478816986084, "global_step": 118438, "epoch": 1426} {"train_loss": -22.256750106811523, "global_step": 118439, "epoch": 1426} {"train_loss": -22.43499990256436, "global_step": 118440, "epoch": 1426, "val_loss": 6172199.5} {"train_loss": -21.62477684020996, "global_step": 118441, "epoch": 1427} {"train_loss": -21.52799415588379, "global_step": 118442, "epoch": 1427} {"train_loss": -22.149856567382812, "global_step": 118443, "epoch": 1427} {"train_loss": -22.081573486328125, "global_step": 118444, "epoch": 1427} {"train_loss": -22.06764793395996, "global_step": 118445, "epoch": 1427} {"train_loss": -21.97233009338379, "global_step": 118446, "epoch": 1427} {"train_loss": -22.345388412475586, "global_step": 118447, "epoch": 1427} {"train_loss": -21.842580795288086, "global_step": 118448, "epoch": 1427} {"train_loss": -22.392704010009766, "global_step": 118449, "epoch": 1427} {"train_loss": -21.956825256347656, "global_step": 118450, "epoch": 1427} {"train_loss": -22.193140029907227, "global_step": 118451, "epoch": 1427} {"train_loss": -22.49028968811035, "global_step": 118452, "epoch": 1427} {"train_loss": -22.381071090698242, "global_step": 118453, "epoch": 1427} {"train_loss": -22.356840133666992, "global_step": 118454, "epoch": 1427} {"train_loss": -22.33065414428711, "global_step": 118455, "epoch": 1427} {"train_loss": -22.1989688873291, "global_step": 118456, "epoch": 1427} {"train_loss": -22.13266944885254, "global_step": 118457, "epoch": 1427} {"train_loss": -22.634307861328125, "global_step": 118458, "epoch": 1427} {"train_loss": -22.537797927856445, "global_step": 118459, "epoch": 1427} {"train_loss": -22.439943313598633, "global_step": 118460, "epoch": 1427} {"train_loss": -22.542604446411133, "global_step": 118461, "epoch": 1427} {"train_loss": -22.33473777770996, "global_step": 118462, "epoch": 1427} {"train_loss": -22.33391761779785, "global_step": 118463, "epoch": 1427} {"train_loss": -22.2291316986084, "global_step": 118464, "epoch": 1427} {"train_loss": -22.301992416381836, "global_step": 118465, "epoch": 1427} {"train_loss": -22.706687927246094, "global_step": 118466, "epoch": 1427} {"train_loss": -22.2208194732666, "global_step": 118467, "epoch": 1427} {"train_loss": -22.431114196777344, "global_step": 118468, "epoch": 1427} {"train_loss": -22.700469970703125, "global_step": 118469, "epoch": 1427} {"train_loss": -22.352703094482422, "global_step": 118470, "epoch": 1427} {"train_loss": -22.531187057495117, "global_step": 118471, "epoch": 1427} {"train_loss": -22.409595489501953, "global_step": 118472, "epoch": 1427} {"train_loss": -22.302616119384766, "global_step": 118473, "epoch": 1427} {"train_loss": -22.61054039001465, "global_step": 118474, "epoch": 1427} {"train_loss": -22.911603927612305, "global_step": 118475, "epoch": 1427} {"train_loss": -22.092391967773438, "global_step": 118476, "epoch": 1427} {"train_loss": -22.51885986328125, "global_step": 118477, "epoch": 1427} {"train_loss": -22.505752563476562, "global_step": 118478, "epoch": 1427} {"train_loss": -22.500818252563477, "global_step": 118479, "epoch": 1427} {"train_loss": -22.672271728515625, "global_step": 118480, "epoch": 1427} {"train_loss": -22.313297271728516, "global_step": 118481, "epoch": 1427} {"train_loss": -22.56134033203125, "global_step": 118482, "epoch": 1427} {"train_loss": -23.088407516479492, "global_step": 118483, "epoch": 1427} {"train_loss": -22.360448837280273, "global_step": 118484, "epoch": 1427} {"train_loss": -22.45840835571289, "global_step": 118485, "epoch": 1427} {"train_loss": -22.289567947387695, "global_step": 118486, "epoch": 1427} {"train_loss": -22.768136978149414, "global_step": 118487, "epoch": 1427} {"train_loss": -22.907339096069336, "global_step": 118488, "epoch": 1427} {"train_loss": -22.617216110229492, "global_step": 118489, "epoch": 1427} {"train_loss": -22.54867172241211, "global_step": 118490, "epoch": 1427} {"train_loss": -22.68332862854004, "global_step": 118491, "epoch": 1427} {"train_loss": -22.514928817749023, "global_step": 118492, "epoch": 1427} {"train_loss": -22.3966121673584, "global_step": 118493, "epoch": 1427} {"train_loss": -22.01093864440918, "global_step": 118494, "epoch": 1427} {"train_loss": -22.215829849243164, "global_step": 118495, "epoch": 1427} {"train_loss": -22.71260643005371, "global_step": 118496, "epoch": 1427} {"train_loss": -22.391786575317383, "global_step": 118497, "epoch": 1427} {"train_loss": -22.066526412963867, "global_step": 118498, "epoch": 1427} {"train_loss": -22.114561080932617, "global_step": 118499, "epoch": 1427} {"train_loss": -22.435720443725586, "global_step": 118500, "epoch": 1427} {"train_loss": -22.46066665649414, "global_step": 118501, "epoch": 1427} {"train_loss": -22.25539779663086, "global_step": 118502, "epoch": 1427} {"train_loss": -22.16031837463379, "global_step": 118503, "epoch": 1427} {"train_loss": -22.465845108032227, "global_step": 118504, "epoch": 1427} {"train_loss": -22.362895965576172, "global_step": 118505, "epoch": 1427} {"train_loss": -22.50986671447754, "global_step": 118506, "epoch": 1427} {"train_loss": -22.111356735229492, "global_step": 118507, "epoch": 1427} {"train_loss": -22.629291534423828, "global_step": 118508, "epoch": 1427} {"train_loss": -22.14759635925293, "global_step": 118509, "epoch": 1427} {"train_loss": -22.094324111938477, "global_step": 118510, "epoch": 1427} {"train_loss": -22.511228561401367, "global_step": 118511, "epoch": 1427} {"train_loss": -22.48322868347168, "global_step": 118512, "epoch": 1427} {"train_loss": -22.237878799438477, "global_step": 118513, "epoch": 1427} {"train_loss": -22.545034408569336, "global_step": 118514, "epoch": 1427} {"train_loss": -22.526309967041016, "global_step": 118515, "epoch": 1427} {"train_loss": -22.470895767211914, "global_step": 118516, "epoch": 1427} {"train_loss": -22.475412368774414, "global_step": 118517, "epoch": 1427} {"train_loss": -22.3754940032959, "global_step": 118518, "epoch": 1427} {"train_loss": -22.743017196655273, "global_step": 118519, "epoch": 1427} {"train_loss": -22.46110725402832, "global_step": 118520, "epoch": 1427} {"train_loss": -22.484882354736328, "global_step": 118521, "epoch": 1427} {"train_loss": -22.223989486694336, "global_step": 118522, "epoch": 1427} {"train_loss": -22.390039535890143, "global_step": 118523, "epoch": 1427, "val_loss": 6269334.0} {"train_loss": -21.93460464477539, "global_step": 118524, "epoch": 1428} {"train_loss": -22.537582397460938, "global_step": 118525, "epoch": 1428} {"train_loss": -22.197683334350586, "global_step": 118526, "epoch": 1428} {"train_loss": -22.17894744873047, "global_step": 118527, "epoch": 1428} {"train_loss": -22.444366455078125, "global_step": 118528, "epoch": 1428} {"train_loss": -22.138689041137695, "global_step": 118529, "epoch": 1428} {"train_loss": -22.2241153717041, "global_step": 118530, "epoch": 1428} {"train_loss": -22.45660400390625, "global_step": 118531, "epoch": 1428} {"train_loss": -22.125333786010742, "global_step": 118532, "epoch": 1428} {"train_loss": -22.658334732055664, "global_step": 118533, "epoch": 1428} {"train_loss": -22.355417251586914, "global_step": 118534, "epoch": 1428} {"train_loss": -22.398672103881836, "global_step": 118535, "epoch": 1428} {"train_loss": -22.341419219970703, "global_step": 118536, "epoch": 1428} {"train_loss": -22.135833740234375, "global_step": 118537, "epoch": 1428} {"train_loss": -22.5739803314209, "global_step": 118538, "epoch": 1428} {"train_loss": -22.342308044433594, "global_step": 118539, "epoch": 1428} {"train_loss": -22.450366973876953, "global_step": 118540, "epoch": 1428} {"train_loss": -22.542709350585938, "global_step": 118541, "epoch": 1428} {"train_loss": -22.390838623046875, "global_step": 118542, "epoch": 1428} {"train_loss": -22.71717643737793, "global_step": 118543, "epoch": 1428} {"train_loss": -22.54903221130371, "global_step": 118544, "epoch": 1428} {"train_loss": -22.49427604675293, "global_step": 118545, "epoch": 1428} {"train_loss": -22.762371063232422, "global_step": 118546, "epoch": 1428} {"train_loss": -22.430814743041992, "global_step": 118547, "epoch": 1428} {"train_loss": -22.534210205078125, "global_step": 118548, "epoch": 1428} {"train_loss": -22.273956298828125, "global_step": 118549, "epoch": 1428} {"train_loss": -22.5650691986084, "global_step": 118550, "epoch": 1428} {"train_loss": -22.389402389526367, "global_step": 118551, "epoch": 1428} {"train_loss": -22.2182674407959, "global_step": 118552, "epoch": 1428} {"train_loss": -22.654361724853516, "global_step": 118553, "epoch": 1428} {"train_loss": -22.27217674255371, "global_step": 118554, "epoch": 1428} {"train_loss": -22.469541549682617, "global_step": 118555, "epoch": 1428} {"train_loss": -22.323339462280273, "global_step": 118556, "epoch": 1428} {"train_loss": -22.678998947143555, "global_step": 118557, "epoch": 1428} {"train_loss": -22.365049362182617, "global_step": 118558, "epoch": 1428} {"train_loss": -23.043628692626953, "global_step": 118559, "epoch": 1428} {"train_loss": -22.363557815551758, "global_step": 118560, "epoch": 1428} {"train_loss": -22.646677017211914, "global_step": 118561, "epoch": 1428} {"train_loss": -22.37770652770996, "global_step": 118562, "epoch": 1428} {"train_loss": -22.699193954467773, "global_step": 118563, "epoch": 1428} {"train_loss": -21.84165382385254, "global_step": 118564, "epoch": 1428} {"train_loss": -22.614622116088867, "global_step": 118565, "epoch": 1428} {"train_loss": -22.37624168395996, "global_step": 118566, "epoch": 1428} {"train_loss": -22.778915405273438, "global_step": 118567, "epoch": 1428} {"train_loss": -22.051746368408203, "global_step": 118568, "epoch": 1428} {"train_loss": -22.13747215270996, "global_step": 118569, "epoch": 1428} {"train_loss": -22.08528709411621, "global_step": 118570, "epoch": 1428} {"train_loss": -22.724576950073242, "global_step": 118571, "epoch": 1428} {"train_loss": -22.48314094543457, "global_step": 118572, "epoch": 1428} {"train_loss": -22.28948211669922, "global_step": 118573, "epoch": 1428} {"train_loss": -22.749025344848633, "global_step": 118574, "epoch": 1428} {"train_loss": -22.40874671936035, "global_step": 118575, "epoch": 1428} {"train_loss": -22.538740158081055, "global_step": 118576, "epoch": 1428} {"train_loss": -22.421768188476562, "global_step": 118577, "epoch": 1428} {"train_loss": -22.503101348876953, "global_step": 118578, "epoch": 1428} {"train_loss": -22.591392517089844, "global_step": 118579, "epoch": 1428} {"train_loss": -22.585050582885742, "global_step": 118580, "epoch": 1428} {"train_loss": -22.172765731811523, "global_step": 118581, "epoch": 1428} {"train_loss": -22.376710891723633, "global_step": 118582, "epoch": 1428} {"train_loss": -22.759387969970703, "global_step": 118583, "epoch": 1428} {"train_loss": -22.78826332092285, "global_step": 118584, "epoch": 1428} {"train_loss": -23.0334529876709, "global_step": 118585, "epoch": 1428} {"train_loss": -22.835208892822266, "global_step": 118586, "epoch": 1428} {"train_loss": -22.653470993041992, "global_step": 118587, "epoch": 1428} {"train_loss": -22.527381896972656, "global_step": 118588, "epoch": 1428} {"train_loss": -22.76771354675293, "global_step": 118589, "epoch": 1428} {"train_loss": -22.619129180908203, "global_step": 118590, "epoch": 1428} {"train_loss": -23.0152645111084, "global_step": 118591, "epoch": 1428} {"train_loss": -22.737653732299805, "global_step": 118592, "epoch": 1428} {"train_loss": -22.43344497680664, "global_step": 118593, "epoch": 1428} {"train_loss": -22.581207275390625, "global_step": 118594, "epoch": 1428} {"train_loss": -22.394168853759766, "global_step": 118595, "epoch": 1428} {"train_loss": -22.44365119934082, "global_step": 118596, "epoch": 1428} {"train_loss": -22.515216827392578, "global_step": 118597, "epoch": 1428} {"train_loss": -22.472646713256836, "global_step": 118598, "epoch": 1428} {"train_loss": -22.119298934936523, "global_step": 118599, "epoch": 1428} {"train_loss": -22.773880004882812, "global_step": 118600, "epoch": 1428} {"train_loss": -22.9060115814209, "global_step": 118601, "epoch": 1428} {"train_loss": -22.809125900268555, "global_step": 118602, "epoch": 1428} {"train_loss": -22.21806526184082, "global_step": 118603, "epoch": 1428} {"train_loss": -22.400537490844727, "global_step": 118604, "epoch": 1428} {"train_loss": -22.493497848510742, "global_step": 118605, "epoch": 1428} {"train_loss": -22.471535533307545, "global_step": 118606, "epoch": 1428, "val_loss": 6320458.0} {"train_loss": -22.039785385131836, "global_step": 118607, "epoch": 1429} {"train_loss": -21.538604736328125, "global_step": 118608, "epoch": 1429} {"train_loss": -21.7574462890625, "global_step": 118609, "epoch": 1429} {"train_loss": -21.839513778686523, "global_step": 118610, "epoch": 1429} {"train_loss": -22.449766159057617, "global_step": 118611, "epoch": 1429} {"train_loss": -22.052494049072266, "global_step": 118612, "epoch": 1429} {"train_loss": -22.189167022705078, "global_step": 118613, "epoch": 1429} {"train_loss": -21.717924118041992, "global_step": 118614, "epoch": 1429} {"train_loss": -22.127012252807617, "global_step": 118615, "epoch": 1429} {"train_loss": -22.35097885131836, "global_step": 118616, "epoch": 1429} {"train_loss": -22.151660919189453, "global_step": 118617, "epoch": 1429} {"train_loss": -22.25722312927246, "global_step": 118618, "epoch": 1429} {"train_loss": -22.271238327026367, "global_step": 118619, "epoch": 1429} {"train_loss": -22.3521785736084, "global_step": 118620, "epoch": 1429} {"train_loss": -22.48172378540039, "global_step": 118621, "epoch": 1429} {"train_loss": -22.654468536376953, "global_step": 118622, "epoch": 1429} {"train_loss": -22.524822235107422, "global_step": 118623, "epoch": 1429} {"train_loss": -22.48642349243164, "global_step": 118624, "epoch": 1429} {"train_loss": -22.67610740661621, "global_step": 118625, "epoch": 1429} {"train_loss": -22.386497497558594, "global_step": 118626, "epoch": 1429} {"train_loss": -22.294048309326172, "global_step": 118627, "epoch": 1429} {"train_loss": -22.408245086669922, "global_step": 118628, "epoch": 1429} {"train_loss": -22.348411560058594, "global_step": 118629, "epoch": 1429} {"train_loss": -22.75167465209961, "global_step": 118630, "epoch": 1429} {"train_loss": -22.427522659301758, "global_step": 118631, "epoch": 1429} {"train_loss": -22.402559280395508, "global_step": 118632, "epoch": 1429} {"train_loss": -22.30624008178711, "global_step": 118633, "epoch": 1429} {"train_loss": -22.669206619262695, "global_step": 118634, "epoch": 1429} {"train_loss": -22.388011932373047, "global_step": 118635, "epoch": 1429} {"train_loss": -22.51185417175293, "global_step": 118636, "epoch": 1429} {"train_loss": -22.39565086364746, "global_step": 118637, "epoch": 1429} {"train_loss": -22.47941017150879, "global_step": 118638, "epoch": 1429} {"train_loss": -22.64301109313965, "global_step": 118639, "epoch": 1429} {"train_loss": -22.331708908081055, "global_step": 118640, "epoch": 1429} {"train_loss": -22.385007858276367, "global_step": 118641, "epoch": 1429} {"train_loss": -22.596694946289062, "global_step": 118642, "epoch": 1429} {"train_loss": -22.25655174255371, "global_step": 118643, "epoch": 1429} {"train_loss": -22.661479949951172, "global_step": 118644, "epoch": 1429} {"train_loss": -22.618637084960938, "global_step": 118645, "epoch": 1429} {"train_loss": -22.77834129333496, "global_step": 118646, "epoch": 1429} {"train_loss": -22.635360717773438, "global_step": 118647, "epoch": 1429} {"train_loss": -22.35786247253418, "global_step": 118648, "epoch": 1429} {"train_loss": -22.267335891723633, "global_step": 118649, "epoch": 1429} {"train_loss": -22.14716911315918, "global_step": 118650, "epoch": 1429} {"train_loss": -22.371416091918945, "global_step": 118651, "epoch": 1429} {"train_loss": -22.558515548706055, "global_step": 118652, "epoch": 1429} {"train_loss": -22.817533493041992, "global_step": 118653, "epoch": 1429} {"train_loss": -22.022546768188477, "global_step": 118654, "epoch": 1429} {"train_loss": -21.939279556274414, "global_step": 118655, "epoch": 1429} {"train_loss": -22.15338134765625, "global_step": 118656, "epoch": 1429} {"train_loss": -22.668039321899414, "global_step": 118657, "epoch": 1429} {"train_loss": -22.613523483276367, "global_step": 118658, "epoch": 1429} {"train_loss": -22.290380477905273, "global_step": 118659, "epoch": 1429} {"train_loss": -22.392812728881836, "global_step": 118660, "epoch": 1429} {"train_loss": -22.500389099121094, "global_step": 118661, "epoch": 1429} {"train_loss": -22.033981323242188, "global_step": 118662, "epoch": 1429} {"train_loss": -22.31825828552246, "global_step": 118663, "epoch": 1429} {"train_loss": -22.73773193359375, "global_step": 118664, "epoch": 1429} {"train_loss": -22.206499099731445, "global_step": 118665, "epoch": 1429} {"train_loss": -22.8508358001709, "global_step": 118666, "epoch": 1429} {"train_loss": -22.511789321899414, "global_step": 118667, "epoch": 1429} {"train_loss": -22.558013916015625, "global_step": 118668, "epoch": 1429} {"train_loss": -22.471698760986328, "global_step": 118669, "epoch": 1429} {"train_loss": -22.367971420288086, "global_step": 118670, "epoch": 1429} {"train_loss": -22.571544647216797, "global_step": 118671, "epoch": 1429} {"train_loss": -22.184127807617188, "global_step": 118672, "epoch": 1429} {"train_loss": -22.535062789916992, "global_step": 118673, "epoch": 1429} {"train_loss": -22.766395568847656, "global_step": 118674, "epoch": 1429} {"train_loss": -22.568132400512695, "global_step": 118675, "epoch": 1429} {"train_loss": -22.54945182800293, "global_step": 118676, "epoch": 1429} {"train_loss": -22.375192642211914, "global_step": 118677, "epoch": 1429} {"train_loss": -22.466716766357422, "global_step": 118678, "epoch": 1429} {"train_loss": -22.648061752319336, "global_step": 118679, "epoch": 1429} {"train_loss": -22.698617935180664, "global_step": 118680, "epoch": 1429} {"train_loss": -22.509363174438477, "global_step": 118681, "epoch": 1429} {"train_loss": -22.308704376220703, "global_step": 118682, "epoch": 1429} {"train_loss": -22.513355255126953, "global_step": 118683, "epoch": 1429} {"train_loss": -22.778915405273438, "global_step": 118684, "epoch": 1429} {"train_loss": -22.28450584411621, "global_step": 118685, "epoch": 1429} {"train_loss": -22.029088973999023, "global_step": 118686, "epoch": 1429} {"train_loss": -22.4625244140625, "global_step": 118687, "epoch": 1429} {"train_loss": -22.319416046142578, "global_step": 118688, "epoch": 1429} {"train_loss": -22.398939914013965, "global_step": 118689, "epoch": 1429, "val_loss": 6163877.5} {"train_loss": -22.38968849182129, "global_step": 118690, "epoch": 1430} {"train_loss": -22.391338348388672, "global_step": 118691, "epoch": 1430} {"train_loss": -22.405288696289062, "global_step": 118692, "epoch": 1430} {"train_loss": -22.348098754882812, "global_step": 118693, "epoch": 1430} {"train_loss": -22.39859962463379, "global_step": 118694, "epoch": 1430} {"train_loss": -22.49012565612793, "global_step": 118695, "epoch": 1430} {"train_loss": -22.41780662536621, "global_step": 118696, "epoch": 1430} {"train_loss": -22.424646377563477, "global_step": 118697, "epoch": 1430} {"train_loss": -22.185985565185547, "global_step": 118698, "epoch": 1430} {"train_loss": -22.68863868713379, "global_step": 118699, "epoch": 1430} {"train_loss": -22.45517921447754, "global_step": 118700, "epoch": 1430} {"train_loss": -22.452390670776367, "global_step": 118701, "epoch": 1430} {"train_loss": -22.496143341064453, "global_step": 118702, "epoch": 1430} {"train_loss": -22.255859375, "global_step": 118703, "epoch": 1430} {"train_loss": -22.63452911376953, "global_step": 118704, "epoch": 1430} {"train_loss": -22.2756404876709, "global_step": 118705, "epoch": 1430} {"train_loss": -22.71213722229004, "global_step": 118706, "epoch": 1430} {"train_loss": -21.920642852783203, "global_step": 118707, "epoch": 1430} {"train_loss": -22.186859130859375, "global_step": 118708, "epoch": 1430} {"train_loss": -22.365215301513672, "global_step": 118709, "epoch": 1430} {"train_loss": -22.152629852294922, "global_step": 118710, "epoch": 1430} {"train_loss": -22.17597007751465, "global_step": 118711, "epoch": 1430} {"train_loss": -22.59486198425293, "global_step": 118712, "epoch": 1430} {"train_loss": -22.636734008789062, "global_step": 118713, "epoch": 1430} {"train_loss": -22.39319610595703, "global_step": 118714, "epoch": 1430} {"train_loss": -22.13308334350586, "global_step": 118715, "epoch": 1430} {"train_loss": -22.52057456970215, "global_step": 118716, "epoch": 1430} {"train_loss": -22.544919967651367, "global_step": 118717, "epoch": 1430} {"train_loss": -22.599233627319336, "global_step": 118718, "epoch": 1430} {"train_loss": -22.572572708129883, "global_step": 118719, "epoch": 1430} {"train_loss": -22.843910217285156, "global_step": 118720, "epoch": 1430} {"train_loss": -22.333023071289062, "global_step": 118721, "epoch": 1430} {"train_loss": -22.488767623901367, "global_step": 118722, "epoch": 1430} {"train_loss": -22.57452964782715, "global_step": 118723, "epoch": 1430} {"train_loss": -22.511066436767578, "global_step": 118724, "epoch": 1430} {"train_loss": -22.558198928833008, "global_step": 118725, "epoch": 1430} {"train_loss": -22.40713882446289, "global_step": 118726, "epoch": 1430} {"train_loss": -22.165695190429688, "global_step": 118727, "epoch": 1430} {"train_loss": -22.45417022705078, "global_step": 118728, "epoch": 1430} {"train_loss": -22.515836715698242, "global_step": 118729, "epoch": 1430} {"train_loss": -22.15193748474121, "global_step": 118730, "epoch": 1430} {"train_loss": -22.69539451599121, "global_step": 118731, "epoch": 1430} {"train_loss": -22.244115829467773, "global_step": 118732, "epoch": 1430} {"train_loss": -22.81379508972168, "global_step": 118733, "epoch": 1430} {"train_loss": -22.19085693359375, "global_step": 118734, "epoch": 1430} {"train_loss": -22.54501724243164, "global_step": 118735, "epoch": 1430} {"train_loss": -22.419570922851562, "global_step": 118736, "epoch": 1430} {"train_loss": -22.0867862701416, "global_step": 118737, "epoch": 1430} {"train_loss": -22.528385162353516, "global_step": 118738, "epoch": 1430} {"train_loss": -22.51002311706543, "global_step": 118739, "epoch": 1430} {"train_loss": -22.651142120361328, "global_step": 118740, "epoch": 1430} {"train_loss": -22.412168502807617, "global_step": 118741, "epoch": 1430} {"train_loss": -22.280454635620117, "global_step": 118742, "epoch": 1430} {"train_loss": -22.103662490844727, "global_step": 118743, "epoch": 1430} {"train_loss": -22.407337188720703, "global_step": 118744, "epoch": 1430} {"train_loss": -22.579030990600586, "global_step": 118745, "epoch": 1430} {"train_loss": -22.47930145263672, "global_step": 118746, "epoch": 1430} {"train_loss": -22.454870223999023, "global_step": 118747, "epoch": 1430} {"train_loss": -22.789533615112305, "global_step": 118748, "epoch": 1430} {"train_loss": -22.610637664794922, "global_step": 118749, "epoch": 1430} {"train_loss": -22.309730529785156, "global_step": 118750, "epoch": 1430} {"train_loss": -22.592609405517578, "global_step": 118751, "epoch": 1430} {"train_loss": -22.403894424438477, "global_step": 118752, "epoch": 1430} {"train_loss": -22.39025115966797, "global_step": 118753, "epoch": 1430} {"train_loss": -22.449243545532227, "global_step": 118754, "epoch": 1430} {"train_loss": -22.477436065673828, "global_step": 118755, "epoch": 1430} {"train_loss": -22.182861328125, "global_step": 118756, "epoch": 1430} {"train_loss": -22.58894157409668, "global_step": 118757, "epoch": 1430} {"train_loss": -22.833234786987305, "global_step": 118758, "epoch": 1430} {"train_loss": -22.6014461517334, "global_step": 118759, "epoch": 1430} {"train_loss": -22.70577621459961, "global_step": 118760, "epoch": 1430} {"train_loss": -22.283308029174805, "global_step": 118761, "epoch": 1430} {"train_loss": -22.731203079223633, "global_step": 118762, "epoch": 1430} {"train_loss": -22.82172966003418, "global_step": 118763, "epoch": 1430} {"train_loss": -22.600324630737305, "global_step": 118764, "epoch": 1430} {"train_loss": -22.533666610717773, "global_step": 118765, "epoch": 1430} {"train_loss": -22.712387084960938, "global_step": 118766, "epoch": 1430} {"train_loss": -22.3533878326416, "global_step": 118767, "epoch": 1430} {"train_loss": -22.5239315032959, "global_step": 118768, "epoch": 1430} {"train_loss": -22.193132400512695, "global_step": 118769, "epoch": 1430} {"train_loss": -22.71207618713379, "global_step": 118770, "epoch": 1430} {"train_loss": -22.27179527282715, "global_step": 118771, "epoch": 1430} {"train_loss": -22.462856522525648, "global_step": 118772, "epoch": 1430, "val_loss": 6239581.5} {"train_loss": -22.016401290893555, "global_step": 118773, "epoch": 1431} {"train_loss": -22.25503921508789, "global_step": 118774, "epoch": 1431} {"train_loss": -22.131832122802734, "global_step": 118775, "epoch": 1431} {"train_loss": -22.07576560974121, "global_step": 118776, "epoch": 1431} {"train_loss": -22.574480056762695, "global_step": 118777, "epoch": 1431} {"train_loss": -22.456558227539062, "global_step": 118778, "epoch": 1431} {"train_loss": -22.455114364624023, "global_step": 118779, "epoch": 1431} {"train_loss": -22.253965377807617, "global_step": 118780, "epoch": 1431} {"train_loss": -22.410619735717773, "global_step": 118781, "epoch": 1431} {"train_loss": -22.627431869506836, "global_step": 118782, "epoch": 1431} {"train_loss": -22.302490234375, "global_step": 118783, "epoch": 1431} {"train_loss": -22.05825424194336, "global_step": 118784, "epoch": 1431} {"train_loss": -22.370006561279297, "global_step": 118785, "epoch": 1431} {"train_loss": -22.32449722290039, "global_step": 118786, "epoch": 1431} {"train_loss": -22.015287399291992, "global_step": 118787, "epoch": 1431} {"train_loss": -22.319976806640625, "global_step": 118788, "epoch": 1431} {"train_loss": -22.47426986694336, "global_step": 118789, "epoch": 1431} {"train_loss": -22.437808990478516, "global_step": 118790, "epoch": 1431} {"train_loss": -22.506916046142578, "global_step": 118791, "epoch": 1431} {"train_loss": -22.557655334472656, "global_step": 118792, "epoch": 1431} {"train_loss": -22.321989059448242, "global_step": 118793, "epoch": 1431} {"train_loss": -22.43455696105957, "global_step": 118794, "epoch": 1431} {"train_loss": -22.500564575195312, "global_step": 118795, "epoch": 1431} {"train_loss": -22.24526596069336, "global_step": 118796, "epoch": 1431} {"train_loss": -22.761127471923828, "global_step": 118797, "epoch": 1431} {"train_loss": -22.488224029541016, "global_step": 118798, "epoch": 1431} {"train_loss": -22.62055206298828, "global_step": 118799, "epoch": 1431} {"train_loss": -22.710721969604492, "global_step": 118800, "epoch": 1431} {"train_loss": -22.30866050720215, "global_step": 118801, "epoch": 1431} {"train_loss": -22.304805755615234, "global_step": 118802, "epoch": 1431} {"train_loss": -22.75246238708496, "global_step": 118803, "epoch": 1431} {"train_loss": -22.543710708618164, "global_step": 118804, "epoch": 1431} {"train_loss": -22.706745147705078, "global_step": 118805, "epoch": 1431} {"train_loss": -22.428207397460938, "global_step": 118806, "epoch": 1431} {"train_loss": -22.509000778198242, "global_step": 118807, "epoch": 1431} {"train_loss": -22.479612350463867, "global_step": 118808, "epoch": 1431} {"train_loss": -22.32749366760254, "global_step": 118809, "epoch": 1431} {"train_loss": -22.597105026245117, "global_step": 118810, "epoch": 1431} {"train_loss": -22.747665405273438, "global_step": 118811, "epoch": 1431} {"train_loss": -22.843896865844727, "global_step": 118812, "epoch": 1431} {"train_loss": -22.47199821472168, "global_step": 118813, "epoch": 1431} {"train_loss": -22.54030418395996, "global_step": 118814, "epoch": 1431} {"train_loss": -22.424848556518555, "global_step": 118815, "epoch": 1431} {"train_loss": -22.269195556640625, "global_step": 118816, "epoch": 1431} {"train_loss": -22.761476516723633, "global_step": 118817, "epoch": 1431} {"train_loss": -22.35491371154785, "global_step": 118818, "epoch": 1431} {"train_loss": -22.442855834960938, "global_step": 118819, "epoch": 1431} {"train_loss": -22.817415237426758, "global_step": 118820, "epoch": 1431} {"train_loss": -22.331127166748047, "global_step": 118821, "epoch": 1431} {"train_loss": -22.265380859375, "global_step": 118822, "epoch": 1431} {"train_loss": -22.400711059570312, "global_step": 118823, "epoch": 1431} {"train_loss": -22.294696807861328, "global_step": 118824, "epoch": 1431} {"train_loss": -21.952550888061523, "global_step": 118825, "epoch": 1431} {"train_loss": -22.451475143432617, "global_step": 118826, "epoch": 1431} {"train_loss": -22.008773803710938, "global_step": 118827, "epoch": 1431} {"train_loss": -22.200571060180664, "global_step": 118828, "epoch": 1431} {"train_loss": -22.160192489624023, "global_step": 118829, "epoch": 1431} {"train_loss": -22.6971492767334, "global_step": 118830, "epoch": 1431} {"train_loss": -22.665180206298828, "global_step": 118831, "epoch": 1431} {"train_loss": -22.467344284057617, "global_step": 118832, "epoch": 1431} {"train_loss": -22.402002334594727, "global_step": 118833, "epoch": 1431} {"train_loss": -22.097185134887695, "global_step": 118834, "epoch": 1431} {"train_loss": -22.239622116088867, "global_step": 118835, "epoch": 1431} {"train_loss": -22.81583595275879, "global_step": 118836, "epoch": 1431} {"train_loss": -22.25761604309082, "global_step": 118837, "epoch": 1431} {"train_loss": -22.438535690307617, "global_step": 118838, "epoch": 1431} {"train_loss": -22.67458724975586, "global_step": 118839, "epoch": 1431} {"train_loss": -22.33888053894043, "global_step": 118840, "epoch": 1431} {"train_loss": -22.561487197875977, "global_step": 118841, "epoch": 1431} {"train_loss": -22.329866409301758, "global_step": 118842, "epoch": 1431} {"train_loss": -22.362823486328125, "global_step": 118843, "epoch": 1431} {"train_loss": -22.554218292236328, "global_step": 118844, "epoch": 1431} {"train_loss": -22.60135841369629, "global_step": 118845, "epoch": 1431} {"train_loss": -22.58491325378418, "global_step": 118846, "epoch": 1431} {"train_loss": -22.253704071044922, "global_step": 118847, "epoch": 1431} {"train_loss": -22.375091552734375, "global_step": 118848, "epoch": 1431} {"train_loss": -22.375694274902344, "global_step": 118849, "epoch": 1431} {"train_loss": -22.767648696899414, "global_step": 118850, "epoch": 1431} {"train_loss": -22.655431747436523, "global_step": 118851, "epoch": 1431} {"train_loss": -22.548524856567383, "global_step": 118852, "epoch": 1431} {"train_loss": -22.70710563659668, "global_step": 118853, "epoch": 1431} {"train_loss": -23.03744125366211, "global_step": 118854, "epoch": 1431} {"train_loss": -22.46634795866817, "global_step": 118855, "epoch": 1431, "val_loss": 6219991.0} {"train_loss": -22.031309127807617, "global_step": 118856, "epoch": 1432} {"train_loss": -21.844877243041992, "global_step": 118857, "epoch": 1432} {"train_loss": -22.634092330932617, "global_step": 118858, "epoch": 1432} {"train_loss": -22.50103759765625, "global_step": 118859, "epoch": 1432} {"train_loss": -22.10371208190918, "global_step": 118860, "epoch": 1432} {"train_loss": -22.22701072692871, "global_step": 118861, "epoch": 1432} {"train_loss": -22.148595809936523, "global_step": 118862, "epoch": 1432} {"train_loss": -22.38593292236328, "global_step": 118863, "epoch": 1432} {"train_loss": -22.263813018798828, "global_step": 118864, "epoch": 1432} {"train_loss": -22.465009689331055, "global_step": 118865, "epoch": 1432} {"train_loss": -22.303714752197266, "global_step": 118866, "epoch": 1432} {"train_loss": -22.261699676513672, "global_step": 118867, "epoch": 1432} {"train_loss": -22.85594367980957, "global_step": 118868, "epoch": 1432} {"train_loss": -22.915143966674805, "global_step": 118869, "epoch": 1432} {"train_loss": -22.28045082092285, "global_step": 118870, "epoch": 1432} {"train_loss": -22.324514389038086, "global_step": 118871, "epoch": 1432} {"train_loss": -22.45609474182129, "global_step": 118872, "epoch": 1432} {"train_loss": -22.287063598632812, "global_step": 118873, "epoch": 1432} {"train_loss": -22.17963981628418, "global_step": 118874, "epoch": 1432} {"train_loss": -22.21766471862793, "global_step": 118875, "epoch": 1432} {"train_loss": -22.258350372314453, "global_step": 118876, "epoch": 1432} {"train_loss": -22.449939727783203, "global_step": 118877, "epoch": 1432} {"train_loss": -22.31062126159668, "global_step": 118878, "epoch": 1432} {"train_loss": -22.55743408203125, "global_step": 118879, "epoch": 1432} {"train_loss": -21.99468994140625, "global_step": 118880, "epoch": 1432} {"train_loss": -22.526151657104492, "global_step": 118881, "epoch": 1432} {"train_loss": -22.574094772338867, "global_step": 118882, "epoch": 1432} {"train_loss": -22.189453125, "global_step": 118883, "epoch": 1432} {"train_loss": -22.740982055664062, "global_step": 118884, "epoch": 1432} {"train_loss": -22.063108444213867, "global_step": 118885, "epoch": 1432} {"train_loss": -22.291051864624023, "global_step": 118886, "epoch": 1432} {"train_loss": -22.479787826538086, "global_step": 118887, "epoch": 1432} {"train_loss": -22.75592613220215, "global_step": 118888, "epoch": 1432} {"train_loss": -22.656431198120117, "global_step": 118889, "epoch": 1432} {"train_loss": -22.40232276916504, "global_step": 118890, "epoch": 1432} {"train_loss": -22.466686248779297, "global_step": 118891, "epoch": 1432} {"train_loss": -22.67340850830078, "global_step": 118892, "epoch": 1432} {"train_loss": -22.40216636657715, "global_step": 118893, "epoch": 1432} {"train_loss": -22.910390853881836, "global_step": 118894, "epoch": 1432} {"train_loss": -22.983322143554688, "global_step": 118895, "epoch": 1432} {"train_loss": -22.284143447875977, "global_step": 118896, "epoch": 1432} {"train_loss": -22.35233497619629, "global_step": 118897, "epoch": 1432} {"train_loss": -22.445219039916992, "global_step": 118898, "epoch": 1432} {"train_loss": -22.736740112304688, "global_step": 118899, "epoch": 1432} {"train_loss": -22.63763999938965, "global_step": 118900, "epoch": 1432} {"train_loss": -22.931537628173828, "global_step": 118901, "epoch": 1432} {"train_loss": -22.56732177734375, "global_step": 118902, "epoch": 1432} {"train_loss": -22.88253402709961, "global_step": 118903, "epoch": 1432} {"train_loss": -22.693954467773438, "global_step": 118904, "epoch": 1432} {"train_loss": -22.45590591430664, "global_step": 118905, "epoch": 1432} {"train_loss": -22.449914932250977, "global_step": 118906, "epoch": 1432} {"train_loss": -22.490768432617188, "global_step": 118907, "epoch": 1432} {"train_loss": -22.84588623046875, "global_step": 118908, "epoch": 1432} {"train_loss": -22.538101196289062, "global_step": 118909, "epoch": 1432} {"train_loss": -22.3353328704834, "global_step": 118910, "epoch": 1432} {"train_loss": -22.129159927368164, "global_step": 118911, "epoch": 1432} {"train_loss": -22.340646743774414, "global_step": 118912, "epoch": 1432} {"train_loss": -22.4046688079834, "global_step": 118913, "epoch": 1432} {"train_loss": -22.4364070892334, "global_step": 118914, "epoch": 1432} {"train_loss": -22.50008773803711, "global_step": 118915, "epoch": 1432} {"train_loss": -22.324657440185547, "global_step": 118916, "epoch": 1432} {"train_loss": -23.044464111328125, "global_step": 118917, "epoch": 1432} {"train_loss": -22.792217254638672, "global_step": 118918, "epoch": 1432} {"train_loss": -22.54811668395996, "global_step": 118919, "epoch": 1432} {"train_loss": -22.176450729370117, "global_step": 118920, "epoch": 1432} {"train_loss": -22.568723678588867, "global_step": 118921, "epoch": 1432} {"train_loss": -22.51982879638672, "global_step": 118922, "epoch": 1432} {"train_loss": -22.63112449645996, "global_step": 118923, "epoch": 1432} {"train_loss": -22.5507869720459, "global_step": 118924, "epoch": 1432} {"train_loss": -22.84651756286621, "global_step": 118925, "epoch": 1432} {"train_loss": -22.70229148864746, "global_step": 118926, "epoch": 1432} {"train_loss": -22.777923583984375, "global_step": 118927, "epoch": 1432} {"train_loss": -22.482593536376953, "global_step": 118928, "epoch": 1432} {"train_loss": -22.292451858520508, "global_step": 118929, "epoch": 1432} {"train_loss": -22.5841121673584, "global_step": 118930, "epoch": 1432} {"train_loss": -22.99629783630371, "global_step": 118931, "epoch": 1432} {"train_loss": -22.79389762878418, "global_step": 118932, "epoch": 1432} {"train_loss": -22.341161727905273, "global_step": 118933, "epoch": 1432} {"train_loss": -22.680156707763672, "global_step": 118934, "epoch": 1432} {"train_loss": -22.51597023010254, "global_step": 118935, "epoch": 1432} {"train_loss": -22.644664764404297, "global_step": 118936, "epoch": 1432} {"train_loss": -22.44215965270996, "global_step": 118937, "epoch": 1432} {"train_loss": -22.501659508211066, "global_step": 118938, "epoch": 1432, "val_loss": 6226634.0} {"train_loss": -22.117990493774414, "global_step": 118939, "epoch": 1433} {"train_loss": -22.224416732788086, "global_step": 118940, "epoch": 1433} {"train_loss": -22.189233779907227, "global_step": 118941, "epoch": 1433} {"train_loss": -22.20574951171875, "global_step": 118942, "epoch": 1433} {"train_loss": -22.24083137512207, "global_step": 118943, "epoch": 1433} {"train_loss": -22.313718795776367, "global_step": 118944, "epoch": 1433} {"train_loss": -22.614713668823242, "global_step": 118945, "epoch": 1433} {"train_loss": -22.842273712158203, "global_step": 118946, "epoch": 1433} {"train_loss": -22.534772872924805, "global_step": 118947, "epoch": 1433} {"train_loss": -22.293548583984375, "global_step": 118948, "epoch": 1433} {"train_loss": -22.418676376342773, "global_step": 118949, "epoch": 1433} {"train_loss": -22.463218688964844, "global_step": 118950, "epoch": 1433} {"train_loss": -22.564624786376953, "global_step": 118951, "epoch": 1433} {"train_loss": -22.392881393432617, "global_step": 118952, "epoch": 1433} {"train_loss": -22.382932662963867, "global_step": 118953, "epoch": 1433} {"train_loss": -22.5394287109375, "global_step": 118954, "epoch": 1433} {"train_loss": -22.277280807495117, "global_step": 118955, "epoch": 1433} {"train_loss": -22.25083351135254, "global_step": 118956, "epoch": 1433} {"train_loss": -22.39371109008789, "global_step": 118957, "epoch": 1433} {"train_loss": -22.496877670288086, "global_step": 118958, "epoch": 1433} {"train_loss": -22.16969871520996, "global_step": 118959, "epoch": 1433} {"train_loss": -22.45235824584961, "global_step": 118960, "epoch": 1433} {"train_loss": -22.779966354370117, "global_step": 118961, "epoch": 1433} {"train_loss": -22.392271041870117, "global_step": 118962, "epoch": 1433} {"train_loss": -22.941375732421875, "global_step": 118963, "epoch": 1433} {"train_loss": -22.371402740478516, "global_step": 118964, "epoch": 1433} {"train_loss": -22.496662139892578, "global_step": 118965, "epoch": 1433} {"train_loss": -22.808048248291016, "global_step": 118966, "epoch": 1433} {"train_loss": -22.66658592224121, "global_step": 118967, "epoch": 1433} {"train_loss": -22.54755210876465, "global_step": 118968, "epoch": 1433} {"train_loss": -22.058759689331055, "global_step": 118969, "epoch": 1433} {"train_loss": -22.480772018432617, "global_step": 118970, "epoch": 1433} {"train_loss": -22.282245635986328, "global_step": 118971, "epoch": 1433} {"train_loss": -22.52046012878418, "global_step": 118972, "epoch": 1433} {"train_loss": -22.10011863708496, "global_step": 118973, "epoch": 1433} {"train_loss": -22.159358978271484, "global_step": 118974, "epoch": 1433} {"train_loss": -22.442401885986328, "global_step": 118975, "epoch": 1433} {"train_loss": -22.49886703491211, "global_step": 118976, "epoch": 1433} {"train_loss": -22.400318145751953, "global_step": 118977, "epoch": 1433} {"train_loss": -22.342233657836914, "global_step": 118978, "epoch": 1433} {"train_loss": -22.49958610534668, "global_step": 118979, "epoch": 1433} {"train_loss": -22.73252296447754, "global_step": 118980, "epoch": 1433} {"train_loss": -22.566686630249023, "global_step": 118981, "epoch": 1433} {"train_loss": -22.55458641052246, "global_step": 118982, "epoch": 1433} {"train_loss": -22.40089988708496, "global_step": 118983, "epoch": 1433} {"train_loss": -22.50948715209961, "global_step": 118984, "epoch": 1433} {"train_loss": -22.419963836669922, "global_step": 118985, "epoch": 1433} {"train_loss": -22.348453521728516, "global_step": 118986, "epoch": 1433} {"train_loss": -22.347694396972656, "global_step": 118987, "epoch": 1433} {"train_loss": -22.454334259033203, "global_step": 118988, "epoch": 1433} {"train_loss": -22.599435806274414, "global_step": 118989, "epoch": 1433} {"train_loss": -21.816728591918945, "global_step": 118990, "epoch": 1433} {"train_loss": -22.46396827697754, "global_step": 118991, "epoch": 1433} {"train_loss": -22.435739517211914, "global_step": 118992, "epoch": 1433} {"train_loss": -22.462148666381836, "global_step": 118993, "epoch": 1433} {"train_loss": -22.389636993408203, "global_step": 118994, "epoch": 1433} {"train_loss": -21.959163665771484, "global_step": 118995, "epoch": 1433} {"train_loss": -22.80038070678711, "global_step": 118996, "epoch": 1433} {"train_loss": -22.3428897857666, "global_step": 118997, "epoch": 1433} {"train_loss": -22.4122257232666, "global_step": 118998, "epoch": 1433} {"train_loss": -22.52394676208496, "global_step": 118999, "epoch": 1433} {"train_loss": -22.542007446289062, "global_step": 119000, "epoch": 1433} {"train_loss": -22.309682846069336, "global_step": 119001, "epoch": 1433} {"train_loss": -22.404706954956055, "global_step": 119002, "epoch": 1433} {"train_loss": -22.549489974975586, "global_step": 119003, "epoch": 1433} {"train_loss": -22.644840240478516, "global_step": 119004, "epoch": 1433} {"train_loss": -22.39108657836914, "global_step": 119005, "epoch": 1433} {"train_loss": -22.30303955078125, "global_step": 119006, "epoch": 1433} {"train_loss": -22.766664505004883, "global_step": 119007, "epoch": 1433} {"train_loss": -22.376510620117188, "global_step": 119008, "epoch": 1433} {"train_loss": -22.456825256347656, "global_step": 119009, "epoch": 1433} {"train_loss": -22.471240997314453, "global_step": 119010, "epoch": 1433} {"train_loss": -22.26540184020996, "global_step": 119011, "epoch": 1433} {"train_loss": -22.70025062561035, "global_step": 119012, "epoch": 1433} {"train_loss": -22.317047119140625, "global_step": 119013, "epoch": 1433} {"train_loss": -22.377349853515625, "global_step": 119014, "epoch": 1433} {"train_loss": -22.67900848388672, "global_step": 119015, "epoch": 1433} {"train_loss": -22.409704208374023, "global_step": 119016, "epoch": 1433} {"train_loss": -22.599624633789062, "global_step": 119017, "epoch": 1433} {"train_loss": -22.75921630859375, "global_step": 119018, "epoch": 1433} {"train_loss": -22.53468894958496, "global_step": 119019, "epoch": 1433} {"train_loss": -22.491012573242188, "global_step": 119020, "epoch": 1433} {"train_loss": -22.439386046076397, "global_step": 119021, "epoch": 1433, "val_loss": 6104385.0} {"train_loss": -22.182836532592773, "global_step": 119022, "epoch": 1434} {"train_loss": -21.836956024169922, "global_step": 119023, "epoch": 1434} {"train_loss": -22.202009201049805, "global_step": 119024, "epoch": 1434} {"train_loss": -22.05962562561035, "global_step": 119025, "epoch": 1434} {"train_loss": -22.362241744995117, "global_step": 119026, "epoch": 1434} {"train_loss": -22.012161254882812, "global_step": 119027, "epoch": 1434} {"train_loss": -22.363910675048828, "global_step": 119028, "epoch": 1434} {"train_loss": -22.236703872680664, "global_step": 119029, "epoch": 1434} {"train_loss": -21.97501564025879, "global_step": 119030, "epoch": 1434} {"train_loss": -22.182241439819336, "global_step": 119031, "epoch": 1434} {"train_loss": -22.346494674682617, "global_step": 119032, "epoch": 1434} {"train_loss": -22.3610897064209, "global_step": 119033, "epoch": 1434} {"train_loss": -22.24723243713379, "global_step": 119034, "epoch": 1434} {"train_loss": -22.045801162719727, "global_step": 119035, "epoch": 1434} {"train_loss": -22.43940544128418, "global_step": 119036, "epoch": 1434} {"train_loss": -22.191558837890625, "global_step": 119037, "epoch": 1434} {"train_loss": -22.570783615112305, "global_step": 119038, "epoch": 1434} {"train_loss": -22.612869262695312, "global_step": 119039, "epoch": 1434} {"train_loss": -22.599529266357422, "global_step": 119040, "epoch": 1434} {"train_loss": -22.64853858947754, "global_step": 119041, "epoch": 1434} {"train_loss": -22.23710060119629, "global_step": 119042, "epoch": 1434} {"train_loss": -22.41323471069336, "global_step": 119043, "epoch": 1434} {"train_loss": -22.78879165649414, "global_step": 119044, "epoch": 1434} {"train_loss": -22.33921241760254, "global_step": 119045, "epoch": 1434} {"train_loss": -22.58782386779785, "global_step": 119046, "epoch": 1434} {"train_loss": -22.432281494140625, "global_step": 119047, "epoch": 1434} {"train_loss": -22.276124954223633, "global_step": 119048, "epoch": 1434} {"train_loss": -22.1043758392334, "global_step": 119049, "epoch": 1434} {"train_loss": -22.43752098083496, "global_step": 119050, "epoch": 1434} {"train_loss": -22.421661376953125, "global_step": 119051, "epoch": 1434} {"train_loss": -22.66158103942871, "global_step": 119052, "epoch": 1434} {"train_loss": -22.976072311401367, "global_step": 119053, "epoch": 1434} {"train_loss": -22.21746826171875, "global_step": 119054, "epoch": 1434} {"train_loss": -22.351102828979492, "global_step": 119055, "epoch": 1434} {"train_loss": -22.891733169555664, "global_step": 119056, "epoch": 1434} {"train_loss": -22.23836326599121, "global_step": 119057, "epoch": 1434} {"train_loss": -22.457868576049805, "global_step": 119058, "epoch": 1434} {"train_loss": -22.414052963256836, "global_step": 119059, "epoch": 1434} {"train_loss": -22.179346084594727, "global_step": 119060, "epoch": 1434} {"train_loss": -22.5825252532959, "global_step": 119061, "epoch": 1434} {"train_loss": -22.52848243713379, "global_step": 119062, "epoch": 1434} {"train_loss": -22.580541610717773, "global_step": 119063, "epoch": 1434} {"train_loss": -22.498580932617188, "global_step": 119064, "epoch": 1434} {"train_loss": -22.510591506958008, "global_step": 119065, "epoch": 1434} {"train_loss": -22.710792541503906, "global_step": 119066, "epoch": 1434} {"train_loss": -22.584325790405273, "global_step": 119067, "epoch": 1434} {"train_loss": -22.34471321105957, "global_step": 119068, "epoch": 1434} {"train_loss": -22.45244789123535, "global_step": 119069, "epoch": 1434} {"train_loss": -22.58637809753418, "global_step": 119070, "epoch": 1434} {"train_loss": -22.285964965820312, "global_step": 119071, "epoch": 1434} {"train_loss": -22.313549041748047, "global_step": 119072, "epoch": 1434} {"train_loss": -22.46802520751953, "global_step": 119073, "epoch": 1434} {"train_loss": -22.604618072509766, "global_step": 119074, "epoch": 1434} {"train_loss": -22.59590721130371, "global_step": 119075, "epoch": 1434} {"train_loss": -22.58754539489746, "global_step": 119076, "epoch": 1434} {"train_loss": -22.47032928466797, "global_step": 119077, "epoch": 1434} {"train_loss": -22.457895278930664, "global_step": 119078, "epoch": 1434} {"train_loss": -22.916349411010742, "global_step": 119079, "epoch": 1434} {"train_loss": -22.87080192565918, "global_step": 119080, "epoch": 1434} {"train_loss": -22.33517837524414, "global_step": 119081, "epoch": 1434} {"train_loss": -22.21637535095215, "global_step": 119082, "epoch": 1434} {"train_loss": -22.517017364501953, "global_step": 119083, "epoch": 1434} {"train_loss": -22.612003326416016, "global_step": 119084, "epoch": 1434} {"train_loss": -22.447330474853516, "global_step": 119085, "epoch": 1434} {"train_loss": -22.50396156311035, "global_step": 119086, "epoch": 1434} {"train_loss": -22.7475643157959, "global_step": 119087, "epoch": 1434} {"train_loss": -22.39955711364746, "global_step": 119088, "epoch": 1434} {"train_loss": -22.375661849975586, "global_step": 119089, "epoch": 1434} {"train_loss": -22.5465030670166, "global_step": 119090, "epoch": 1434} {"train_loss": -22.673322677612305, "global_step": 119091, "epoch": 1434} {"train_loss": -22.256006240844727, "global_step": 119092, "epoch": 1434} {"train_loss": -22.90936279296875, "global_step": 119093, "epoch": 1434} {"train_loss": -22.23648452758789, "global_step": 119094, "epoch": 1434} {"train_loss": -22.635374069213867, "global_step": 119095, "epoch": 1434} {"train_loss": -22.592416763305664, "global_step": 119096, "epoch": 1434} {"train_loss": -22.152799606323242, "global_step": 119097, "epoch": 1434} {"train_loss": -22.4217586517334, "global_step": 119098, "epoch": 1434} {"train_loss": -22.412519454956055, "global_step": 119099, "epoch": 1434} {"train_loss": -22.021329879760742, "global_step": 119100, "epoch": 1434} {"train_loss": -22.687524795532227, "global_step": 119101, "epoch": 1434} {"train_loss": -22.274566650390625, "global_step": 119102, "epoch": 1434} {"train_loss": -22.174779891967773, "global_step": 119103, "epoch": 1434} {"train_loss": -22.411742681480316, "global_step": 119104, "epoch": 1434, "val_loss": 6162491.0} {"train_loss": -21.9100399017334, "global_step": 119105, "epoch": 1435} {"train_loss": -21.88262367248535, "global_step": 119106, "epoch": 1435} {"train_loss": -21.84396743774414, "global_step": 119107, "epoch": 1435} {"train_loss": -22.19635581970215, "global_step": 119108, "epoch": 1435} {"train_loss": -22.149873733520508, "global_step": 119109, "epoch": 1435} {"train_loss": -21.553844451904297, "global_step": 119110, "epoch": 1435} {"train_loss": -21.585020065307617, "global_step": 119111, "epoch": 1435} {"train_loss": -22.19046974182129, "global_step": 119112, "epoch": 1435} {"train_loss": -21.992637634277344, "global_step": 119113, "epoch": 1435} {"train_loss": -22.33180046081543, "global_step": 119114, "epoch": 1435} {"train_loss": -22.20456314086914, "global_step": 119115, "epoch": 1435} {"train_loss": -22.02288246154785, "global_step": 119116, "epoch": 1435} {"train_loss": -22.269935607910156, "global_step": 119117, "epoch": 1435} {"train_loss": -22.1373291015625, "global_step": 119118, "epoch": 1435} {"train_loss": -22.43556785583496, "global_step": 119119, "epoch": 1435} {"train_loss": -22.74141502380371, "global_step": 119120, "epoch": 1435} {"train_loss": -22.23288917541504, "global_step": 119121, "epoch": 1435} {"train_loss": -22.421194076538086, "global_step": 119122, "epoch": 1435} {"train_loss": -21.88214111328125, "global_step": 119123, "epoch": 1435} {"train_loss": -22.047452926635742, "global_step": 119124, "epoch": 1435} {"train_loss": -22.47914695739746, "global_step": 119125, "epoch": 1435} {"train_loss": -22.51602554321289, "global_step": 119126, "epoch": 1435} {"train_loss": -22.104354858398438, "global_step": 119127, "epoch": 1435} {"train_loss": -22.567358016967773, "global_step": 119128, "epoch": 1435} {"train_loss": -22.7147274017334, "global_step": 119129, "epoch": 1435} {"train_loss": -22.4923152923584, "global_step": 119130, "epoch": 1435} {"train_loss": -22.529449462890625, "global_step": 119131, "epoch": 1435} {"train_loss": -22.662038803100586, "global_step": 119132, "epoch": 1435} {"train_loss": -22.630855560302734, "global_step": 119133, "epoch": 1435} {"train_loss": -23.063886642456055, "global_step": 119134, "epoch": 1435} {"train_loss": -22.601308822631836, "global_step": 119135, "epoch": 1435} {"train_loss": -22.484161376953125, "global_step": 119136, "epoch": 1435} {"train_loss": -22.401121139526367, "global_step": 119137, "epoch": 1435} {"train_loss": -22.348417282104492, "global_step": 119138, "epoch": 1435} {"train_loss": -22.552453994750977, "global_step": 119139, "epoch": 1435} {"train_loss": -22.202884674072266, "global_step": 119140, "epoch": 1435} {"train_loss": -22.064197540283203, "global_step": 119141, "epoch": 1435} {"train_loss": -22.56049156188965, "global_step": 119142, "epoch": 1435} {"train_loss": -22.62203025817871, "global_step": 119143, "epoch": 1435} {"train_loss": -22.52404022216797, "global_step": 119144, "epoch": 1435} {"train_loss": -22.312314987182617, "global_step": 119145, "epoch": 1435} {"train_loss": -22.546131134033203, "global_step": 119146, "epoch": 1435} {"train_loss": -22.474308013916016, "global_step": 119147, "epoch": 1435} {"train_loss": -22.006723403930664, "global_step": 119148, "epoch": 1435} {"train_loss": -22.855955123901367, "global_step": 119149, "epoch": 1435} {"train_loss": -22.350162506103516, "global_step": 119150, "epoch": 1435} {"train_loss": -22.823444366455078, "global_step": 119151, "epoch": 1435} {"train_loss": -22.738279342651367, "global_step": 119152, "epoch": 1435} {"train_loss": -22.60982322692871, "global_step": 119153, "epoch": 1435} {"train_loss": -22.816242218017578, "global_step": 119154, "epoch": 1435} {"train_loss": -22.505428314208984, "global_step": 119155, "epoch": 1435} {"train_loss": -22.706674575805664, "global_step": 119156, "epoch": 1435} {"train_loss": -22.76227378845215, "global_step": 119157, "epoch": 1435} {"train_loss": -22.463109970092773, "global_step": 119158, "epoch": 1435} {"train_loss": -22.44481658935547, "global_step": 119159, "epoch": 1435} {"train_loss": -22.328022003173828, "global_step": 119160, "epoch": 1435} {"train_loss": -22.472431182861328, "global_step": 119161, "epoch": 1435} {"train_loss": -22.25048828125, "global_step": 119162, "epoch": 1435} {"train_loss": -22.788372039794922, "global_step": 119163, "epoch": 1435} {"train_loss": -22.469526290893555, "global_step": 119164, "epoch": 1435} {"train_loss": -22.475847244262695, "global_step": 119165, "epoch": 1435} {"train_loss": -22.574003219604492, "global_step": 119166, "epoch": 1435} {"train_loss": -22.311750411987305, "global_step": 119167, "epoch": 1435} {"train_loss": -22.39641761779785, "global_step": 119168, "epoch": 1435} {"train_loss": -22.42626953125, "global_step": 119169, "epoch": 1435} {"train_loss": -22.500165939331055, "global_step": 119170, "epoch": 1435} {"train_loss": -22.511661529541016, "global_step": 119171, "epoch": 1435} {"train_loss": -22.272991180419922, "global_step": 119172, "epoch": 1435} {"train_loss": -22.439029693603516, "global_step": 119173, "epoch": 1435} {"train_loss": -22.599227905273438, "global_step": 119174, "epoch": 1435} {"train_loss": -22.23594093322754, "global_step": 119175, "epoch": 1435} {"train_loss": -23.14438247680664, "global_step": 119176, "epoch": 1435} {"train_loss": -22.37481689453125, "global_step": 119177, "epoch": 1435} {"train_loss": -22.625965118408203, "global_step": 119178, "epoch": 1435} {"train_loss": -22.452129364013672, "global_step": 119179, "epoch": 1435} {"train_loss": -22.56658935546875, "global_step": 119180, "epoch": 1435} {"train_loss": -22.398733139038086, "global_step": 119181, "epoch": 1435} {"train_loss": -22.52462387084961, "global_step": 119182, "epoch": 1435} {"train_loss": -22.72236442565918, "global_step": 119183, "epoch": 1435} {"train_loss": -22.51598358154297, "global_step": 119184, "epoch": 1435} {"train_loss": -22.54949951171875, "global_step": 119185, "epoch": 1435} {"train_loss": -22.80910301208496, "global_step": 119186, "epoch": 1435} {"train_loss": -22.41776089495923, "global_step": 119187, "epoch": 1435, "val_loss": 6257826.5} {"train_loss": -22.35426902770996, "global_step": 119188, "epoch": 1436} {"train_loss": -21.498058319091797, "global_step": 119189, "epoch": 1436} {"train_loss": -22.55436134338379, "global_step": 119190, "epoch": 1436} {"train_loss": -21.639631271362305, "global_step": 119191, "epoch": 1436} {"train_loss": -22.11552619934082, "global_step": 119192, "epoch": 1436} {"train_loss": -22.344345092773438, "global_step": 119193, "epoch": 1436} {"train_loss": -22.121191024780273, "global_step": 119194, "epoch": 1436} {"train_loss": -21.99091911315918, "global_step": 119195, "epoch": 1436} {"train_loss": -22.420867919921875, "global_step": 119196, "epoch": 1436} {"train_loss": -22.278066635131836, "global_step": 119197, "epoch": 1436} {"train_loss": -21.995304107666016, "global_step": 119198, "epoch": 1436} {"train_loss": -22.414249420166016, "global_step": 119199, "epoch": 1436} {"train_loss": -22.115148544311523, "global_step": 119200, "epoch": 1436} {"train_loss": -22.405588150024414, "global_step": 119201, "epoch": 1436} {"train_loss": -22.145069122314453, "global_step": 119202, "epoch": 1436} {"train_loss": -22.085363388061523, "global_step": 119203, "epoch": 1436} {"train_loss": -21.932022094726562, "global_step": 119204, "epoch": 1436} {"train_loss": -22.265647888183594, "global_step": 119205, "epoch": 1436} {"train_loss": -22.42994499206543, "global_step": 119206, "epoch": 1436} {"train_loss": -22.478057861328125, "global_step": 119207, "epoch": 1436} {"train_loss": -22.7302188873291, "global_step": 119208, "epoch": 1436} {"train_loss": -22.501874923706055, "global_step": 119209, "epoch": 1436} {"train_loss": -22.26563262939453, "global_step": 119210, "epoch": 1436} {"train_loss": -22.384323120117188, "global_step": 119211, "epoch": 1436} {"train_loss": -22.565855026245117, "global_step": 119212, "epoch": 1436} {"train_loss": -22.36219024658203, "global_step": 119213, "epoch": 1436} {"train_loss": -22.40140724182129, "global_step": 119214, "epoch": 1436} {"train_loss": -22.47320556640625, "global_step": 119215, "epoch": 1436} {"train_loss": -22.38278579711914, "global_step": 119216, "epoch": 1436} {"train_loss": -22.55109214782715, "global_step": 119217, "epoch": 1436} {"train_loss": -22.82825469970703, "global_step": 119218, "epoch": 1436} {"train_loss": -22.259727478027344, "global_step": 119219, "epoch": 1436} {"train_loss": -22.480459213256836, "global_step": 119220, "epoch": 1436} {"train_loss": -22.48661994934082, "global_step": 119221, "epoch": 1436} {"train_loss": -22.652790069580078, "global_step": 119222, "epoch": 1436} {"train_loss": -22.197124481201172, "global_step": 119223, "epoch": 1436} {"train_loss": -22.851295471191406, "global_step": 119224, "epoch": 1436} {"train_loss": -22.685583114624023, "global_step": 119225, "epoch": 1436} {"train_loss": -22.186918258666992, "global_step": 119226, "epoch": 1436} {"train_loss": -22.562368392944336, "global_step": 119227, "epoch": 1436} {"train_loss": -22.472579956054688, "global_step": 119228, "epoch": 1436} {"train_loss": -22.392681121826172, "global_step": 119229, "epoch": 1436} {"train_loss": -22.338428497314453, "global_step": 119230, "epoch": 1436} {"train_loss": -22.899885177612305, "global_step": 119231, "epoch": 1436} {"train_loss": -22.463459014892578, "global_step": 119232, "epoch": 1436} {"train_loss": -22.443029403686523, "global_step": 119233, "epoch": 1436} {"train_loss": -22.518415451049805, "global_step": 119234, "epoch": 1436} {"train_loss": -22.22920036315918, "global_step": 119235, "epoch": 1436} {"train_loss": -21.993677139282227, "global_step": 119236, "epoch": 1436} {"train_loss": -22.33975601196289, "global_step": 119237, "epoch": 1436} {"train_loss": -22.780969619750977, "global_step": 119238, "epoch": 1436} {"train_loss": -22.567148208618164, "global_step": 119239, "epoch": 1436} {"train_loss": -22.17949676513672, "global_step": 119240, "epoch": 1436} {"train_loss": -22.619428634643555, "global_step": 119241, "epoch": 1436} {"train_loss": -22.117284774780273, "global_step": 119242, "epoch": 1436} {"train_loss": -22.325687408447266, "global_step": 119243, "epoch": 1436} {"train_loss": -22.316055297851562, "global_step": 119244, "epoch": 1436} {"train_loss": -21.92572021484375, "global_step": 119245, "epoch": 1436} {"train_loss": -22.431476593017578, "global_step": 119246, "epoch": 1436} {"train_loss": -22.160974502563477, "global_step": 119247, "epoch": 1436} {"train_loss": -22.740032196044922, "global_step": 119248, "epoch": 1436} {"train_loss": -21.7771053314209, "global_step": 119249, "epoch": 1436} {"train_loss": -22.427125930786133, "global_step": 119250, "epoch": 1436} {"train_loss": -22.546178817749023, "global_step": 119251, "epoch": 1436} {"train_loss": -22.369977951049805, "global_step": 119252, "epoch": 1436} {"train_loss": -22.301162719726562, "global_step": 119253, "epoch": 1436} {"train_loss": -22.50520133972168, "global_step": 119254, "epoch": 1436} {"train_loss": -22.4619140625, "global_step": 119255, "epoch": 1436} {"train_loss": -22.6502685546875, "global_step": 119256, "epoch": 1436} {"train_loss": -22.716880798339844, "global_step": 119257, "epoch": 1436} {"train_loss": -22.241575241088867, "global_step": 119258, "epoch": 1436} {"train_loss": -22.633398056030273, "global_step": 119259, "epoch": 1436} {"train_loss": -22.908267974853516, "global_step": 119260, "epoch": 1436} {"train_loss": -22.37965202331543, "global_step": 119261, "epoch": 1436} {"train_loss": -22.552621841430664, "global_step": 119262, "epoch": 1436} {"train_loss": -22.662141799926758, "global_step": 119263, "epoch": 1436} {"train_loss": -22.417865753173828, "global_step": 119264, "epoch": 1436} {"train_loss": -22.074058532714844, "global_step": 119265, "epoch": 1436} {"train_loss": -22.299142837524414, "global_step": 119266, "epoch": 1436} {"train_loss": -22.51267433166504, "global_step": 119267, "epoch": 1436} {"train_loss": -22.432392120361328, "global_step": 119268, "epoch": 1436} {"train_loss": -22.34324073791504, "global_step": 119269, "epoch": 1436} {"train_loss": -22.38076975259436, "global_step": 119270, "epoch": 1436, "val_loss": 6287163.5} {"train_loss": -22.352121353149414, "global_step": 119271, "epoch": 1437} {"train_loss": -21.212554931640625, "global_step": 119272, "epoch": 1437} {"train_loss": -21.994306564331055, "global_step": 119273, "epoch": 1437} {"train_loss": -22.50870704650879, "global_step": 119274, "epoch": 1437} {"train_loss": -22.00990867614746, "global_step": 119275, "epoch": 1437} {"train_loss": -22.042617797851562, "global_step": 119276, "epoch": 1437} {"train_loss": -22.002988815307617, "global_step": 119277, "epoch": 1437} {"train_loss": -22.25592613220215, "global_step": 119278, "epoch": 1437} {"train_loss": -22.144678115844727, "global_step": 119279, "epoch": 1437} {"train_loss": -22.103757858276367, "global_step": 119280, "epoch": 1437} {"train_loss": -22.107845306396484, "global_step": 119281, "epoch": 1437} {"train_loss": -22.371061325073242, "global_step": 119282, "epoch": 1437} {"train_loss": -21.694128036499023, "global_step": 119283, "epoch": 1437} {"train_loss": -22.30752182006836, "global_step": 119284, "epoch": 1437} {"train_loss": -22.21997833251953, "global_step": 119285, "epoch": 1437} {"train_loss": -21.990510940551758, "global_step": 119286, "epoch": 1437} {"train_loss": -22.188608169555664, "global_step": 119287, "epoch": 1437} {"train_loss": -22.249805450439453, "global_step": 119288, "epoch": 1437} {"train_loss": -22.025985717773438, "global_step": 119289, "epoch": 1437} {"train_loss": -22.13997459411621, "global_step": 119290, "epoch": 1437} {"train_loss": -22.4833927154541, "global_step": 119291, "epoch": 1437} {"train_loss": -22.094541549682617, "global_step": 119292, "epoch": 1437} {"train_loss": -22.23367691040039, "global_step": 119293, "epoch": 1437} {"train_loss": -22.3717041015625, "global_step": 119294, "epoch": 1437} {"train_loss": -22.479217529296875, "global_step": 119295, "epoch": 1437} {"train_loss": -22.433456420898438, "global_step": 119296, "epoch": 1437} {"train_loss": -22.457183837890625, "global_step": 119297, "epoch": 1437} {"train_loss": -22.239240646362305, "global_step": 119298, "epoch": 1437} {"train_loss": -22.38994789123535, "global_step": 119299, "epoch": 1437} {"train_loss": -22.415109634399414, "global_step": 119300, "epoch": 1437} {"train_loss": -22.363130569458008, "global_step": 119301, "epoch": 1437} {"train_loss": -22.42578887939453, "global_step": 119302, "epoch": 1437} {"train_loss": -22.50666618347168, "global_step": 119303, "epoch": 1437} {"train_loss": -22.609052658081055, "global_step": 119304, "epoch": 1437} {"train_loss": -22.429935455322266, "global_step": 119305, "epoch": 1437} {"train_loss": -22.516237258911133, "global_step": 119306, "epoch": 1437} {"train_loss": -22.08827018737793, "global_step": 119307, "epoch": 1437} {"train_loss": -22.262434005737305, "global_step": 119308, "epoch": 1437} {"train_loss": -22.265047073364258, "global_step": 119309, "epoch": 1437} {"train_loss": -22.671186447143555, "global_step": 119310, "epoch": 1437} {"train_loss": -22.278043746948242, "global_step": 119311, "epoch": 1437} {"train_loss": -22.44693374633789, "global_step": 119312, "epoch": 1437} {"train_loss": -22.15277671813965, "global_step": 119313, "epoch": 1437} {"train_loss": -22.477325439453125, "global_step": 119314, "epoch": 1437} {"train_loss": -22.232633590698242, "global_step": 119315, "epoch": 1437} {"train_loss": -22.484159469604492, "global_step": 119316, "epoch": 1437} {"train_loss": -22.2005672454834, "global_step": 119317, "epoch": 1437} {"train_loss": -22.00371742248535, "global_step": 119318, "epoch": 1437} {"train_loss": -22.567522048950195, "global_step": 119319, "epoch": 1437} {"train_loss": -22.408987045288086, "global_step": 119320, "epoch": 1437} {"train_loss": -22.4464168548584, "global_step": 119321, "epoch": 1437} {"train_loss": -22.61647605895996, "global_step": 119322, "epoch": 1437} {"train_loss": -22.917219161987305, "global_step": 119323, "epoch": 1437} {"train_loss": -22.839696884155273, "global_step": 119324, "epoch": 1437} {"train_loss": -22.476839065551758, "global_step": 119325, "epoch": 1437} {"train_loss": -22.895278930664062, "global_step": 119326, "epoch": 1437} {"train_loss": -22.337312698364258, "global_step": 119327, "epoch": 1437} {"train_loss": -22.81167984008789, "global_step": 119328, "epoch": 1437} {"train_loss": -22.7231388092041, "global_step": 119329, "epoch": 1437} {"train_loss": -22.5638370513916, "global_step": 119330, "epoch": 1437} {"train_loss": -22.596708297729492, "global_step": 119331, "epoch": 1437} {"train_loss": -22.682653427124023, "global_step": 119332, "epoch": 1437} {"train_loss": -22.410093307495117, "global_step": 119333, "epoch": 1437} {"train_loss": -22.599111557006836, "global_step": 119334, "epoch": 1437} {"train_loss": -22.45075798034668, "global_step": 119335, "epoch": 1437} {"train_loss": -22.92561149597168, "global_step": 119336, "epoch": 1437} {"train_loss": -22.253890991210938, "global_step": 119337, "epoch": 1437} {"train_loss": -22.40907096862793, "global_step": 119338, "epoch": 1437} {"train_loss": -22.567060470581055, "global_step": 119339, "epoch": 1437} {"train_loss": -22.6577091217041, "global_step": 119340, "epoch": 1437} {"train_loss": -22.296968460083008, "global_step": 119341, "epoch": 1437} {"train_loss": -22.4215030670166, "global_step": 119342, "epoch": 1437} {"train_loss": -22.705190658569336, "global_step": 119343, "epoch": 1437} {"train_loss": -22.71437644958496, "global_step": 119344, "epoch": 1437} {"train_loss": -22.774520874023438, "global_step": 119345, "epoch": 1437} {"train_loss": -22.555557250976562, "global_step": 119346, "epoch": 1437} {"train_loss": -22.527851104736328, "global_step": 119347, "epoch": 1437} {"train_loss": -22.61665916442871, "global_step": 119348, "epoch": 1437} {"train_loss": -22.588924407958984, "global_step": 119349, "epoch": 1437} {"train_loss": -22.715717315673828, "global_step": 119350, "epoch": 1437} {"train_loss": -22.478321075439453, "global_step": 119351, "epoch": 1437} {"train_loss": -22.662338256835938, "global_step": 119352, "epoch": 1437} {"train_loss": -22.40561701303505, "global_step": 119353, "epoch": 1437, "val_loss": 6131013.0} {"train_loss": -22.51576805114746, "global_step": 119354, "epoch": 1438} {"train_loss": -22.519254684448242, "global_step": 119355, "epoch": 1438} {"train_loss": -22.67573356628418, "global_step": 119356, "epoch": 1438} {"train_loss": -22.452436447143555, "global_step": 119357, "epoch": 1438} {"train_loss": -22.365558624267578, "global_step": 119358, "epoch": 1438} {"train_loss": -22.28862190246582, "global_step": 119359, "epoch": 1438} {"train_loss": -22.40193748474121, "global_step": 119360, "epoch": 1438} {"train_loss": -22.056819915771484, "global_step": 119361, "epoch": 1438} {"train_loss": -22.205989837646484, "global_step": 119362, "epoch": 1438} {"train_loss": -22.30702018737793, "global_step": 119363, "epoch": 1438} {"train_loss": -22.500389099121094, "global_step": 119364, "epoch": 1438} {"train_loss": -22.454416275024414, "global_step": 119365, "epoch": 1438} {"train_loss": -22.6993408203125, "global_step": 119366, "epoch": 1438} {"train_loss": -22.497526168823242, "global_step": 119367, "epoch": 1438} {"train_loss": -22.414888381958008, "global_step": 119368, "epoch": 1438} {"train_loss": -22.292312622070312, "global_step": 119369, "epoch": 1438} {"train_loss": -22.708036422729492, "global_step": 119370, "epoch": 1438} {"train_loss": -22.294355392456055, "global_step": 119371, "epoch": 1438} {"train_loss": -22.446081161499023, "global_step": 119372, "epoch": 1438} {"train_loss": -22.466327667236328, "global_step": 119373, "epoch": 1438} {"train_loss": -23.020456314086914, "global_step": 119374, "epoch": 1438} {"train_loss": -22.488096237182617, "global_step": 119375, "epoch": 1438} {"train_loss": -22.691890716552734, "global_step": 119376, "epoch": 1438} {"train_loss": -22.73923683166504, "global_step": 119377, "epoch": 1438} {"train_loss": -22.36935806274414, "global_step": 119378, "epoch": 1438} {"train_loss": -22.283830642700195, "global_step": 119379, "epoch": 1438} {"train_loss": -22.357669830322266, "global_step": 119380, "epoch": 1438} {"train_loss": -22.471420288085938, "global_step": 119381, "epoch": 1438} {"train_loss": -22.402482986450195, "global_step": 119382, "epoch": 1438} {"train_loss": -22.46973991394043, "global_step": 119383, "epoch": 1438} {"train_loss": -22.767118453979492, "global_step": 119384, "epoch": 1438} {"train_loss": -22.488967895507812, "global_step": 119385, "epoch": 1438} {"train_loss": -22.342947006225586, "global_step": 119386, "epoch": 1438} {"train_loss": -22.596179962158203, "global_step": 119387, "epoch": 1438} {"train_loss": -22.711776733398438, "global_step": 119388, "epoch": 1438} {"train_loss": -22.498342514038086, "global_step": 119389, "epoch": 1438} {"train_loss": -22.860631942749023, "global_step": 119390, "epoch": 1438} {"train_loss": -22.51727294921875, "global_step": 119391, "epoch": 1438} {"train_loss": -22.296968460083008, "global_step": 119392, "epoch": 1438} {"train_loss": -22.739500045776367, "global_step": 119393, "epoch": 1438} {"train_loss": -22.552030563354492, "global_step": 119394, "epoch": 1438} {"train_loss": -22.643285751342773, "global_step": 119395, "epoch": 1438} {"train_loss": -22.457534790039062, "global_step": 119396, "epoch": 1438} {"train_loss": -22.8145694732666, "global_step": 119397, "epoch": 1438} {"train_loss": -22.388017654418945, "global_step": 119398, "epoch": 1438} {"train_loss": -22.66498565673828, "global_step": 119399, "epoch": 1438} {"train_loss": -22.562238693237305, "global_step": 119400, "epoch": 1438} {"train_loss": -22.912824630737305, "global_step": 119401, "epoch": 1438} {"train_loss": -22.487760543823242, "global_step": 119402, "epoch": 1438} {"train_loss": -22.803260803222656, "global_step": 119403, "epoch": 1438} {"train_loss": -22.389774322509766, "global_step": 119404, "epoch": 1438} {"train_loss": -22.663557052612305, "global_step": 119405, "epoch": 1438} {"train_loss": -22.40668296813965, "global_step": 119406, "epoch": 1438} {"train_loss": -22.619077682495117, "global_step": 119407, "epoch": 1438} {"train_loss": -22.569761276245117, "global_step": 119408, "epoch": 1438} {"train_loss": -22.77833366394043, "global_step": 119409, "epoch": 1438} {"train_loss": -22.624698638916016, "global_step": 119410, "epoch": 1438} {"train_loss": -22.708450317382812, "global_step": 119411, "epoch": 1438} {"train_loss": -22.436857223510742, "global_step": 119412, "epoch": 1438} {"train_loss": -22.730897903442383, "global_step": 119413, "epoch": 1438} {"train_loss": -22.54829978942871, "global_step": 119414, "epoch": 1438} {"train_loss": -22.601673126220703, "global_step": 119415, "epoch": 1438} {"train_loss": -22.80307388305664, "global_step": 119416, "epoch": 1438} {"train_loss": -22.996137619018555, "global_step": 119417, "epoch": 1438} {"train_loss": -22.105327606201172, "global_step": 119418, "epoch": 1438} {"train_loss": -22.964414596557617, "global_step": 119419, "epoch": 1438} {"train_loss": -22.74725341796875, "global_step": 119420, "epoch": 1438} {"train_loss": -22.200897216796875, "global_step": 119421, "epoch": 1438} {"train_loss": -22.929208755493164, "global_step": 119422, "epoch": 1438} {"train_loss": -22.453649520874023, "global_step": 119423, "epoch": 1438} {"train_loss": -22.59614372253418, "global_step": 119424, "epoch": 1438} {"train_loss": -22.704463958740234, "global_step": 119425, "epoch": 1438} {"train_loss": -22.533082962036133, "global_step": 119426, "epoch": 1438} {"train_loss": -22.752416610717773, "global_step": 119427, "epoch": 1438} {"train_loss": -22.45452880859375, "global_step": 119428, "epoch": 1438} {"train_loss": -22.6988525390625, "global_step": 119429, "epoch": 1438} {"train_loss": -22.243703842163086, "global_step": 119430, "epoch": 1438} {"train_loss": -22.55095863342285, "global_step": 119431, "epoch": 1438} {"train_loss": -22.71964454650879, "global_step": 119432, "epoch": 1438} {"train_loss": -22.454923629760742, "global_step": 119433, "epoch": 1438} {"train_loss": -22.62301254272461, "global_step": 119434, "epoch": 1438} {"train_loss": -22.702932357788086, "global_step": 119435, "epoch": 1438} {"train_loss": -22.5398063889469, "global_step": 119436, "epoch": 1438, "val_loss": 6280911.0} {"train_loss": -22.331396102905273, "global_step": 119437, "epoch": 1439} {"train_loss": -22.56878089904785, "global_step": 119438, "epoch": 1439} {"train_loss": -22.45075798034668, "global_step": 119439, "epoch": 1439} {"train_loss": -22.293554306030273, "global_step": 119440, "epoch": 1439} {"train_loss": -22.081388473510742, "global_step": 119441, "epoch": 1439} {"train_loss": -22.142881393432617, "global_step": 119442, "epoch": 1439} {"train_loss": -22.299814224243164, "global_step": 119443, "epoch": 1439} {"train_loss": -22.362085342407227, "global_step": 119444, "epoch": 1439} {"train_loss": -22.657609939575195, "global_step": 119445, "epoch": 1439} {"train_loss": -22.59408950805664, "global_step": 119446, "epoch": 1439} {"train_loss": -22.173215866088867, "global_step": 119447, "epoch": 1439} {"train_loss": -22.49360466003418, "global_step": 119448, "epoch": 1439} {"train_loss": -22.33028221130371, "global_step": 119449, "epoch": 1439} {"train_loss": -22.7391300201416, "global_step": 119450, "epoch": 1439} {"train_loss": -22.620437622070312, "global_step": 119451, "epoch": 1439} {"train_loss": -22.32753562927246, "global_step": 119452, "epoch": 1439} {"train_loss": -22.23954200744629, "global_step": 119453, "epoch": 1439} {"train_loss": -22.471405029296875, "global_step": 119454, "epoch": 1439} {"train_loss": -22.566747665405273, "global_step": 119455, "epoch": 1439} {"train_loss": -22.53045654296875, "global_step": 119456, "epoch": 1439} {"train_loss": -22.671804428100586, "global_step": 119457, "epoch": 1439} {"train_loss": -22.264265060424805, "global_step": 119458, "epoch": 1439} {"train_loss": -22.66958999633789, "global_step": 119459, "epoch": 1439} {"train_loss": -22.307540893554688, "global_step": 119460, "epoch": 1439} {"train_loss": -22.644237518310547, "global_step": 119461, "epoch": 1439} {"train_loss": -22.60715103149414, "global_step": 119462, "epoch": 1439} {"train_loss": -22.43345832824707, "global_step": 119463, "epoch": 1439} {"train_loss": -22.494491577148438, "global_step": 119464, "epoch": 1439} {"train_loss": -22.691057205200195, "global_step": 119465, "epoch": 1439} {"train_loss": -22.375473022460938, "global_step": 119466, "epoch": 1439} {"train_loss": -22.422210693359375, "global_step": 119467, "epoch": 1439} {"train_loss": -22.20244026184082, "global_step": 119468, "epoch": 1439} {"train_loss": -22.630002975463867, "global_step": 119469, "epoch": 1439} {"train_loss": -22.833642959594727, "global_step": 119470, "epoch": 1439} {"train_loss": -22.6366024017334, "global_step": 119471, "epoch": 1439} {"train_loss": -22.188215255737305, "global_step": 119472, "epoch": 1439} {"train_loss": -22.38988494873047, "global_step": 119473, "epoch": 1439} {"train_loss": -22.739652633666992, "global_step": 119474, "epoch": 1439} {"train_loss": -22.2952938079834, "global_step": 119475, "epoch": 1439} {"train_loss": -22.884811401367188, "global_step": 119476, "epoch": 1439} {"train_loss": -22.5137939453125, "global_step": 119477, "epoch": 1439} {"train_loss": -21.9378604888916, "global_step": 119478, "epoch": 1439} {"train_loss": -22.775453567504883, "global_step": 119479, "epoch": 1439} {"train_loss": -22.586063385009766, "global_step": 119480, "epoch": 1439} {"train_loss": -22.78706169128418, "global_step": 119481, "epoch": 1439} {"train_loss": -22.71611785888672, "global_step": 119482, "epoch": 1439} {"train_loss": -22.5261287689209, "global_step": 119483, "epoch": 1439} {"train_loss": -22.752307891845703, "global_step": 119484, "epoch": 1439} {"train_loss": -22.515188217163086, "global_step": 119485, "epoch": 1439} {"train_loss": -23.114294052124023, "global_step": 119486, "epoch": 1439} {"train_loss": -22.856342315673828, "global_step": 119487, "epoch": 1439} {"train_loss": -22.5784969329834, "global_step": 119488, "epoch": 1439} {"train_loss": -22.51087760925293, "global_step": 119489, "epoch": 1439} {"train_loss": -22.731046676635742, "global_step": 119490, "epoch": 1439} {"train_loss": -22.837871551513672, "global_step": 119491, "epoch": 1439} {"train_loss": -22.40616226196289, "global_step": 119492, "epoch": 1439} {"train_loss": -22.370237350463867, "global_step": 119493, "epoch": 1439} {"train_loss": -22.172517776489258, "global_step": 119494, "epoch": 1439} {"train_loss": -22.199935913085938, "global_step": 119495, "epoch": 1439} {"train_loss": -22.42024040222168, "global_step": 119496, "epoch": 1439} {"train_loss": -22.374052047729492, "global_step": 119497, "epoch": 1439} {"train_loss": -22.163185119628906, "global_step": 119498, "epoch": 1439} {"train_loss": -22.2285213470459, "global_step": 119499, "epoch": 1439} {"train_loss": -22.079191207885742, "global_step": 119500, "epoch": 1439} {"train_loss": -22.1854248046875, "global_step": 119501, "epoch": 1439} {"train_loss": -22.046524047851562, "global_step": 119502, "epoch": 1439} {"train_loss": -22.511198043823242, "global_step": 119503, "epoch": 1439} {"train_loss": -22.564130783081055, "global_step": 119504, "epoch": 1439} {"train_loss": -22.27216148376465, "global_step": 119505, "epoch": 1439} {"train_loss": -22.683435440063477, "global_step": 119506, "epoch": 1439} {"train_loss": -22.29072380065918, "global_step": 119507, "epoch": 1439} {"train_loss": -22.348905563354492, "global_step": 119508, "epoch": 1439} {"train_loss": -23.13984489440918, "global_step": 119509, "epoch": 1439} {"train_loss": -22.31883430480957, "global_step": 119510, "epoch": 1439} {"train_loss": -22.19569206237793, "global_step": 119511, "epoch": 1439} {"train_loss": -22.371400833129883, "global_step": 119512, "epoch": 1439} {"train_loss": -22.492399215698242, "global_step": 119513, "epoch": 1439} {"train_loss": -22.37299156188965, "global_step": 119514, "epoch": 1439} {"train_loss": -22.348398208618164, "global_step": 119515, "epoch": 1439} {"train_loss": -22.86404800415039, "global_step": 119516, "epoch": 1439} {"train_loss": -22.27693748474121, "global_step": 119517, "epoch": 1439} {"train_loss": -22.83246421813965, "global_step": 119518, "epoch": 1439} {"train_loss": -22.472343835485987, "global_step": 119519, "epoch": 1439, "val_loss": 6113000.5} {"train_loss": -21.67036247253418, "global_step": 119520, "epoch": 1440} {"train_loss": -21.32961082458496, "global_step": 119521, "epoch": 1440} {"train_loss": -22.2691707611084, "global_step": 119522, "epoch": 1440} {"train_loss": -21.81905746459961, "global_step": 119523, "epoch": 1440} {"train_loss": -21.465295791625977, "global_step": 119524, "epoch": 1440} {"train_loss": -21.89747428894043, "global_step": 119525, "epoch": 1440} {"train_loss": -21.817899703979492, "global_step": 119526, "epoch": 1440} {"train_loss": -21.53031349182129, "global_step": 119527, "epoch": 1440} {"train_loss": -21.945316314697266, "global_step": 119528, "epoch": 1440} {"train_loss": -21.66598129272461, "global_step": 119529, "epoch": 1440} {"train_loss": -21.739517211914062, "global_step": 119530, "epoch": 1440} {"train_loss": -22.085636138916016, "global_step": 119531, "epoch": 1440} {"train_loss": -22.435226440429688, "global_step": 119532, "epoch": 1440} {"train_loss": -21.80879783630371, "global_step": 119533, "epoch": 1440} {"train_loss": -21.881391525268555, "global_step": 119534, "epoch": 1440} {"train_loss": -21.851150512695312, "global_step": 119535, "epoch": 1440} {"train_loss": -21.963205337524414, "global_step": 119536, "epoch": 1440} {"train_loss": -22.35675048828125, "global_step": 119537, "epoch": 1440} {"train_loss": -22.06700325012207, "global_step": 119538, "epoch": 1440} {"train_loss": -22.13477897644043, "global_step": 119539, "epoch": 1440} {"train_loss": -22.116308212280273, "global_step": 119540, "epoch": 1440} {"train_loss": -21.998828887939453, "global_step": 119541, "epoch": 1440} {"train_loss": -22.337060928344727, "global_step": 119542, "epoch": 1440} {"train_loss": -22.264150619506836, "global_step": 119543, "epoch": 1440} {"train_loss": -22.012088775634766, "global_step": 119544, "epoch": 1440} {"train_loss": -22.379858016967773, "global_step": 119545, "epoch": 1440} {"train_loss": -22.36089515686035, "global_step": 119546, "epoch": 1440} {"train_loss": -22.083288192749023, "global_step": 119547, "epoch": 1440} {"train_loss": -22.57134437561035, "global_step": 119548, "epoch": 1440} {"train_loss": -22.502962112426758, "global_step": 119549, "epoch": 1440} {"train_loss": -22.53108024597168, "global_step": 119550, "epoch": 1440} {"train_loss": -22.4211483001709, "global_step": 119551, "epoch": 1440} {"train_loss": -22.49287986755371, "global_step": 119552, "epoch": 1440} {"train_loss": -22.19659996032715, "global_step": 119553, "epoch": 1440} {"train_loss": -22.691003799438477, "global_step": 119554, "epoch": 1440} {"train_loss": -22.23130226135254, "global_step": 119555, "epoch": 1440} {"train_loss": -22.60439109802246, "global_step": 119556, "epoch": 1440} {"train_loss": -22.3699893951416, "global_step": 119557, "epoch": 1440} {"train_loss": -22.016050338745117, "global_step": 119558, "epoch": 1440} {"train_loss": -22.497251510620117, "global_step": 119559, "epoch": 1440} {"train_loss": -22.9739990234375, "global_step": 119560, "epoch": 1440} {"train_loss": -22.345048904418945, "global_step": 119561, "epoch": 1440} {"train_loss": -22.93623924255371, "global_step": 119562, "epoch": 1440} {"train_loss": -22.66664695739746, "global_step": 119563, "epoch": 1440} {"train_loss": -22.7515926361084, "global_step": 119564, "epoch": 1440} {"train_loss": -22.765390396118164, "global_step": 119565, "epoch": 1440} {"train_loss": -22.45045280456543, "global_step": 119566, "epoch": 1440} {"train_loss": -22.370115280151367, "global_step": 119567, "epoch": 1440} {"train_loss": -22.776519775390625, "global_step": 119568, "epoch": 1440} {"train_loss": -22.704137802124023, "global_step": 119569, "epoch": 1440} {"train_loss": -22.99452018737793, "global_step": 119570, "epoch": 1440} {"train_loss": -22.09058952331543, "global_step": 119571, "epoch": 1440} {"train_loss": -22.842735290527344, "global_step": 119572, "epoch": 1440} {"train_loss": -22.76384735107422, "global_step": 119573, "epoch": 1440} {"train_loss": -22.331878662109375, "global_step": 119574, "epoch": 1440} {"train_loss": -22.205106735229492, "global_step": 119575, "epoch": 1440} {"train_loss": -22.788854598999023, "global_step": 119576, "epoch": 1440} {"train_loss": -22.460453033447266, "global_step": 119577, "epoch": 1440} {"train_loss": -22.17921257019043, "global_step": 119578, "epoch": 1440} {"train_loss": -22.343297958374023, "global_step": 119579, "epoch": 1440} {"train_loss": -22.558225631713867, "global_step": 119580, "epoch": 1440} {"train_loss": -22.473867416381836, "global_step": 119581, "epoch": 1440} {"train_loss": -22.428068161010742, "global_step": 119582, "epoch": 1440} {"train_loss": -22.354326248168945, "global_step": 119583, "epoch": 1440} {"train_loss": -22.904495239257812, "global_step": 119584, "epoch": 1440} {"train_loss": -22.330175399780273, "global_step": 119585, "epoch": 1440} {"train_loss": -22.280920028686523, "global_step": 119586, "epoch": 1440} {"train_loss": -22.74770164489746, "global_step": 119587, "epoch": 1440} {"train_loss": -22.44370460510254, "global_step": 119588, "epoch": 1440} {"train_loss": -22.398544311523438, "global_step": 119589, "epoch": 1440} {"train_loss": -22.647123336791992, "global_step": 119590, "epoch": 1440} {"train_loss": -22.361112594604492, "global_step": 119591, "epoch": 1440} {"train_loss": -22.681373596191406, "global_step": 119592, "epoch": 1440} {"train_loss": -22.794105529785156, "global_step": 119593, "epoch": 1440} {"train_loss": -22.39042091369629, "global_step": 119594, "epoch": 1440} {"train_loss": -22.43937873840332, "global_step": 119595, "epoch": 1440} {"train_loss": -22.655420303344727, "global_step": 119596, "epoch": 1440} {"train_loss": -22.47954750061035, "global_step": 119597, "epoch": 1440} {"train_loss": -22.374675750732422, "global_step": 119598, "epoch": 1440} {"train_loss": -22.694381713867188, "global_step": 119599, "epoch": 1440} {"train_loss": -22.392072677612305, "global_step": 119600, "epoch": 1440} {"train_loss": -22.043188095092773, "global_step": 119601, "epoch": 1440} {"train_loss": -22.324632322931866, "global_step": 119602, "epoch": 1440, "val_loss": 6293152.5} {"train_loss": -22.53961753845215, "global_step": 119603, "epoch": 1441} {"train_loss": -21.624923706054688, "global_step": 119604, "epoch": 1441} {"train_loss": -21.728788375854492, "global_step": 119605, "epoch": 1441} {"train_loss": -22.170244216918945, "global_step": 119606, "epoch": 1441} {"train_loss": -22.347488403320312, "global_step": 119607, "epoch": 1441} {"train_loss": -22.25972557067871, "global_step": 119608, "epoch": 1441} {"train_loss": -22.026525497436523, "global_step": 119609, "epoch": 1441} {"train_loss": -22.654905319213867, "global_step": 119610, "epoch": 1441} {"train_loss": -22.054813385009766, "global_step": 119611, "epoch": 1441} {"train_loss": -22.471494674682617, "global_step": 119612, "epoch": 1441} {"train_loss": -22.355783462524414, "global_step": 119613, "epoch": 1441} {"train_loss": -22.22162437438965, "global_step": 119614, "epoch": 1441} {"train_loss": -22.1810359954834, "global_step": 119615, "epoch": 1441} {"train_loss": -22.382394790649414, "global_step": 119616, "epoch": 1441} {"train_loss": -22.406198501586914, "global_step": 119617, "epoch": 1441} {"train_loss": -22.5758056640625, "global_step": 119618, "epoch": 1441} {"train_loss": -22.48246192932129, "global_step": 119619, "epoch": 1441} {"train_loss": -22.534393310546875, "global_step": 119620, "epoch": 1441} {"train_loss": -22.131118774414062, "global_step": 119621, "epoch": 1441} {"train_loss": -22.567703247070312, "global_step": 119622, "epoch": 1441} {"train_loss": -22.498350143432617, "global_step": 119623, "epoch": 1441} {"train_loss": -22.576034545898438, "global_step": 119624, "epoch": 1441} {"train_loss": -22.328876495361328, "global_step": 119625, "epoch": 1441} {"train_loss": -22.20435905456543, "global_step": 119626, "epoch": 1441} {"train_loss": -22.479101181030273, "global_step": 119627, "epoch": 1441} {"train_loss": -22.47014808654785, "global_step": 119628, "epoch": 1441} {"train_loss": -22.78426170349121, "global_step": 119629, "epoch": 1441} {"train_loss": -23.012235641479492, "global_step": 119630, "epoch": 1441} {"train_loss": -22.262861251831055, "global_step": 119631, "epoch": 1441} {"train_loss": -22.49224281311035, "global_step": 119632, "epoch": 1441} {"train_loss": -22.652420043945312, "global_step": 119633, "epoch": 1441} {"train_loss": -22.555038452148438, "global_step": 119634, "epoch": 1441} {"train_loss": -22.70058250427246, "global_step": 119635, "epoch": 1441} {"train_loss": -22.641620635986328, "global_step": 119636, "epoch": 1441} {"train_loss": -22.50520133972168, "global_step": 119637, "epoch": 1441} {"train_loss": -22.659040451049805, "global_step": 119638, "epoch": 1441} {"train_loss": -22.25533103942871, "global_step": 119639, "epoch": 1441} {"train_loss": -22.566673278808594, "global_step": 119640, "epoch": 1441} {"train_loss": -22.114274978637695, "global_step": 119641, "epoch": 1441} {"train_loss": -22.48414421081543, "global_step": 119642, "epoch": 1441} {"train_loss": -22.869638442993164, "global_step": 119643, "epoch": 1441} {"train_loss": -22.505435943603516, "global_step": 119644, "epoch": 1441} {"train_loss": -22.629581451416016, "global_step": 119645, "epoch": 1441} {"train_loss": -22.607013702392578, "global_step": 119646, "epoch": 1441} {"train_loss": -22.536550521850586, "global_step": 119647, "epoch": 1441} {"train_loss": -22.48236846923828, "global_step": 119648, "epoch": 1441} {"train_loss": -22.179405212402344, "global_step": 119649, "epoch": 1441} {"train_loss": -22.633689880371094, "global_step": 119650, "epoch": 1441} {"train_loss": -22.467557907104492, "global_step": 119651, "epoch": 1441} {"train_loss": -22.702640533447266, "global_step": 119652, "epoch": 1441} {"train_loss": -22.675912857055664, "global_step": 119653, "epoch": 1441} {"train_loss": -22.4482364654541, "global_step": 119654, "epoch": 1441} {"train_loss": -22.85320472717285, "global_step": 119655, "epoch": 1441} {"train_loss": -22.638479232788086, "global_step": 119656, "epoch": 1441} {"train_loss": -22.775182723999023, "global_step": 119657, "epoch": 1441} {"train_loss": -22.577327728271484, "global_step": 119658, "epoch": 1441} {"train_loss": -22.826358795166016, "global_step": 119659, "epoch": 1441} {"train_loss": -22.36888313293457, "global_step": 119660, "epoch": 1441} {"train_loss": -22.791019439697266, "global_step": 119661, "epoch": 1441} {"train_loss": -22.48967170715332, "global_step": 119662, "epoch": 1441} {"train_loss": -22.483917236328125, "global_step": 119663, "epoch": 1441} {"train_loss": -22.831697463989258, "global_step": 119664, "epoch": 1441} {"train_loss": -22.472190856933594, "global_step": 119665, "epoch": 1441} {"train_loss": -22.64029884338379, "global_step": 119666, "epoch": 1441} {"train_loss": -22.7345027923584, "global_step": 119667, "epoch": 1441} {"train_loss": -22.584346771240234, "global_step": 119668, "epoch": 1441} {"train_loss": -22.611915588378906, "global_step": 119669, "epoch": 1441} {"train_loss": -22.431005477905273, "global_step": 119670, "epoch": 1441} {"train_loss": -22.39447021484375, "global_step": 119671, "epoch": 1441} {"train_loss": -22.53523063659668, "global_step": 119672, "epoch": 1441} {"train_loss": -22.427465438842773, "global_step": 119673, "epoch": 1441} {"train_loss": -22.03567886352539, "global_step": 119674, "epoch": 1441} {"train_loss": -22.244510650634766, "global_step": 119675, "epoch": 1441} {"train_loss": -22.763635635375977, "global_step": 119676, "epoch": 1441} {"train_loss": -22.709760665893555, "global_step": 119677, "epoch": 1441} {"train_loss": -22.671974182128906, "global_step": 119678, "epoch": 1441} {"train_loss": -22.49466896057129, "global_step": 119679, "epoch": 1441} {"train_loss": -22.898757934570312, "global_step": 119680, "epoch": 1441} {"train_loss": -22.651334762573242, "global_step": 119681, "epoch": 1441} {"train_loss": -22.42153549194336, "global_step": 119682, "epoch": 1441} {"train_loss": -22.48371696472168, "global_step": 119683, "epoch": 1441} {"train_loss": -22.445362091064453, "global_step": 119684, "epoch": 1441} {"train_loss": -22.509509810482164, "global_step": 119685, "epoch": 1441, "val_loss": 6182818.0} {"train_loss": -22.533924102783203, "global_step": 119686, "epoch": 1442} {"train_loss": -22.434892654418945, "global_step": 119687, "epoch": 1442} {"train_loss": -22.632844924926758, "global_step": 119688, "epoch": 1442} {"train_loss": -22.45845603942871, "global_step": 119689, "epoch": 1442} {"train_loss": -22.244382858276367, "global_step": 119690, "epoch": 1442} {"train_loss": -22.64802360534668, "global_step": 119691, "epoch": 1442} {"train_loss": -22.75279426574707, "global_step": 119692, "epoch": 1442} {"train_loss": -22.328506469726562, "global_step": 119693, "epoch": 1442} {"train_loss": -22.33771324157715, "global_step": 119694, "epoch": 1442} {"train_loss": -22.23460578918457, "global_step": 119695, "epoch": 1442} {"train_loss": -22.5252685546875, "global_step": 119696, "epoch": 1442} {"train_loss": -22.316974639892578, "global_step": 119697, "epoch": 1442} {"train_loss": -22.793109893798828, "global_step": 119698, "epoch": 1442} {"train_loss": -22.686445236206055, "global_step": 119699, "epoch": 1442} {"train_loss": -22.806127548217773, "global_step": 119700, "epoch": 1442} {"train_loss": -22.698049545288086, "global_step": 119701, "epoch": 1442} {"train_loss": -22.335250854492188, "global_step": 119702, "epoch": 1442} {"train_loss": -22.44169807434082, "global_step": 119703, "epoch": 1442} {"train_loss": -22.52606773376465, "global_step": 119704, "epoch": 1442} {"train_loss": -22.981002807617188, "global_step": 119705, "epoch": 1442} {"train_loss": -22.795530319213867, "global_step": 119706, "epoch": 1442} {"train_loss": -22.292316436767578, "global_step": 119707, "epoch": 1442} {"train_loss": -22.683786392211914, "global_step": 119708, "epoch": 1442} {"train_loss": -22.204132080078125, "global_step": 119709, "epoch": 1442} {"train_loss": -22.544477462768555, "global_step": 119710, "epoch": 1442} {"train_loss": -22.681324005126953, "global_step": 119711, "epoch": 1442} {"train_loss": -22.692956924438477, "global_step": 119712, "epoch": 1442} {"train_loss": -21.889921188354492, "global_step": 119713, "epoch": 1442} {"train_loss": -22.617904663085938, "global_step": 119714, "epoch": 1442} {"train_loss": -22.228086471557617, "global_step": 119715, "epoch": 1442} {"train_loss": -22.548189163208008, "global_step": 119716, "epoch": 1442} {"train_loss": -22.590139389038086, "global_step": 119717, "epoch": 1442} {"train_loss": -22.52383804321289, "global_step": 119718, "epoch": 1442} {"train_loss": -22.79361915588379, "global_step": 119719, "epoch": 1442} {"train_loss": -22.323453903198242, "global_step": 119720, "epoch": 1442} {"train_loss": -22.126035690307617, "global_step": 119721, "epoch": 1442} {"train_loss": -22.854721069335938, "global_step": 119722, "epoch": 1442} {"train_loss": -22.8789119720459, "global_step": 119723, "epoch": 1442} {"train_loss": -22.154129028320312, "global_step": 119724, "epoch": 1442} {"train_loss": -22.820608139038086, "global_step": 119725, "epoch": 1442} {"train_loss": -22.749435424804688, "global_step": 119726, "epoch": 1442} {"train_loss": -22.905492782592773, "global_step": 119727, "epoch": 1442} {"train_loss": -22.4482421875, "global_step": 119728, "epoch": 1442} {"train_loss": -22.573871612548828, "global_step": 119729, "epoch": 1442} {"train_loss": -22.181371688842773, "global_step": 119730, "epoch": 1442} {"train_loss": -22.425323486328125, "global_step": 119731, "epoch": 1442} {"train_loss": -22.68387794494629, "global_step": 119732, "epoch": 1442} {"train_loss": -22.670063018798828, "global_step": 119733, "epoch": 1442} {"train_loss": -23.133390426635742, "global_step": 119734, "epoch": 1442} {"train_loss": -22.43956184387207, "global_step": 119735, "epoch": 1442} {"train_loss": -22.8494930267334, "global_step": 119736, "epoch": 1442} {"train_loss": -22.76072120666504, "global_step": 119737, "epoch": 1442} {"train_loss": -22.138671875, "global_step": 119738, "epoch": 1442} {"train_loss": -22.292707443237305, "global_step": 119739, "epoch": 1442} {"train_loss": -22.769256591796875, "global_step": 119740, "epoch": 1442} {"train_loss": -22.605077743530273, "global_step": 119741, "epoch": 1442} {"train_loss": -22.2825870513916, "global_step": 119742, "epoch": 1442} {"train_loss": -22.4591007232666, "global_step": 119743, "epoch": 1442} {"train_loss": -22.577634811401367, "global_step": 119744, "epoch": 1442} {"train_loss": -22.634918212890625, "global_step": 119745, "epoch": 1442} {"train_loss": -22.761079788208008, "global_step": 119746, "epoch": 1442} {"train_loss": -22.581693649291992, "global_step": 119747, "epoch": 1442} {"train_loss": -22.502363204956055, "global_step": 119748, "epoch": 1442} {"train_loss": -22.68017578125, "global_step": 119749, "epoch": 1442} {"train_loss": -22.445016860961914, "global_step": 119750, "epoch": 1442} {"train_loss": -22.515676498413086, "global_step": 119751, "epoch": 1442} {"train_loss": -22.40448760986328, "global_step": 119752, "epoch": 1442} {"train_loss": -22.300434112548828, "global_step": 119753, "epoch": 1442} {"train_loss": -22.554264068603516, "global_step": 119754, "epoch": 1442} {"train_loss": -22.588191986083984, "global_step": 119755, "epoch": 1442} {"train_loss": -22.55584144592285, "global_step": 119756, "epoch": 1442} {"train_loss": -22.588882446289062, "global_step": 119757, "epoch": 1442} {"train_loss": -22.585708618164062, "global_step": 119758, "epoch": 1442} {"train_loss": -22.535531997680664, "global_step": 119759, "epoch": 1442} {"train_loss": -22.778121948242188, "global_step": 119760, "epoch": 1442} {"train_loss": -22.558128356933594, "global_step": 119761, "epoch": 1442} {"train_loss": -22.794382095336914, "global_step": 119762, "epoch": 1442} {"train_loss": -22.47065544128418, "global_step": 119763, "epoch": 1442} {"train_loss": -22.4842529296875, "global_step": 119764, "epoch": 1442} {"train_loss": -22.415328979492188, "global_step": 119765, "epoch": 1442} {"train_loss": -22.240442276000977, "global_step": 119766, "epoch": 1442} {"train_loss": -22.597232818603516, "global_step": 119767, "epoch": 1442} {"train_loss": -22.54207385878965, "global_step": 119768, "epoch": 1442, "val_loss": 6232897.0} {"train_loss": -22.202312469482422, "global_step": 119769, "epoch": 1443} {"train_loss": -22.2456111907959, "global_step": 119770, "epoch": 1443} {"train_loss": -21.822675704956055, "global_step": 119771, "epoch": 1443} {"train_loss": -22.386564254760742, "global_step": 119772, "epoch": 1443} {"train_loss": -22.027023315429688, "global_step": 119773, "epoch": 1443} {"train_loss": -22.14300537109375, "global_step": 119774, "epoch": 1443} {"train_loss": -22.139530181884766, "global_step": 119775, "epoch": 1443} {"train_loss": -21.810453414916992, "global_step": 119776, "epoch": 1443} {"train_loss": -22.450353622436523, "global_step": 119777, "epoch": 1443} {"train_loss": -22.175048828125, "global_step": 119778, "epoch": 1443} {"train_loss": -22.174339294433594, "global_step": 119779, "epoch": 1443} {"train_loss": -22.27274513244629, "global_step": 119780, "epoch": 1443} {"train_loss": -22.279067993164062, "global_step": 119781, "epoch": 1443} {"train_loss": -22.21197509765625, "global_step": 119782, "epoch": 1443} {"train_loss": -22.698970794677734, "global_step": 119783, "epoch": 1443} {"train_loss": -22.607473373413086, "global_step": 119784, "epoch": 1443} {"train_loss": -22.489023208618164, "global_step": 119785, "epoch": 1443} {"train_loss": -22.166614532470703, "global_step": 119786, "epoch": 1443} {"train_loss": -22.40695571899414, "global_step": 119787, "epoch": 1443} {"train_loss": -22.061006546020508, "global_step": 119788, "epoch": 1443} {"train_loss": -22.628318786621094, "global_step": 119789, "epoch": 1443} {"train_loss": -22.309476852416992, "global_step": 119790, "epoch": 1443} {"train_loss": -22.539608001708984, "global_step": 119791, "epoch": 1443} {"train_loss": -22.401872634887695, "global_step": 119792, "epoch": 1443} {"train_loss": -22.321674346923828, "global_step": 119793, "epoch": 1443} {"train_loss": -22.4448299407959, "global_step": 119794, "epoch": 1443} {"train_loss": -22.69338035583496, "global_step": 119795, "epoch": 1443} {"train_loss": -22.65260124206543, "global_step": 119796, "epoch": 1443} {"train_loss": -22.437068939208984, "global_step": 119797, "epoch": 1443} {"train_loss": -22.105207443237305, "global_step": 119798, "epoch": 1443} {"train_loss": -22.70814323425293, "global_step": 119799, "epoch": 1443} {"train_loss": -22.154752731323242, "global_step": 119800, "epoch": 1443} {"train_loss": -22.224292755126953, "global_step": 119801, "epoch": 1443} {"train_loss": -21.99956512451172, "global_step": 119802, "epoch": 1443} {"train_loss": -22.2525577545166, "global_step": 119803, "epoch": 1443} {"train_loss": -22.131954193115234, "global_step": 119804, "epoch": 1443} {"train_loss": -23.064661026000977, "global_step": 119805, "epoch": 1443} {"train_loss": -22.389598846435547, "global_step": 119806, "epoch": 1443} {"train_loss": -22.832061767578125, "global_step": 119807, "epoch": 1443} {"train_loss": -22.64291000366211, "global_step": 119808, "epoch": 1443} {"train_loss": -22.68155288696289, "global_step": 119809, "epoch": 1443} {"train_loss": -22.425708770751953, "global_step": 119810, "epoch": 1443} {"train_loss": -22.32175636291504, "global_step": 119811, "epoch": 1443} {"train_loss": -22.490455627441406, "global_step": 119812, "epoch": 1443} {"train_loss": -22.458093643188477, "global_step": 119813, "epoch": 1443} {"train_loss": -22.86202621459961, "global_step": 119814, "epoch": 1443} {"train_loss": -22.63711929321289, "global_step": 119815, "epoch": 1443} {"train_loss": -22.146839141845703, "global_step": 119816, "epoch": 1443} {"train_loss": -22.846933364868164, "global_step": 119817, "epoch": 1443} {"train_loss": -22.610031127929688, "global_step": 119818, "epoch": 1443} {"train_loss": -22.17228126525879, "global_step": 119819, "epoch": 1443} {"train_loss": -22.524473190307617, "global_step": 119820, "epoch": 1443} {"train_loss": -22.677949905395508, "global_step": 119821, "epoch": 1443} {"train_loss": -22.503183364868164, "global_step": 119822, "epoch": 1443} {"train_loss": -22.482149124145508, "global_step": 119823, "epoch": 1443} {"train_loss": -22.139808654785156, "global_step": 119824, "epoch": 1443} {"train_loss": -22.42181968688965, "global_step": 119825, "epoch": 1443} {"train_loss": -22.614709854125977, "global_step": 119826, "epoch": 1443} {"train_loss": -22.634328842163086, "global_step": 119827, "epoch": 1443} {"train_loss": -22.114892959594727, "global_step": 119828, "epoch": 1443} {"train_loss": -22.322021484375, "global_step": 119829, "epoch": 1443} {"train_loss": -22.680530548095703, "global_step": 119830, "epoch": 1443} {"train_loss": -22.395475387573242, "global_step": 119831, "epoch": 1443} {"train_loss": -22.507970809936523, "global_step": 119832, "epoch": 1443} {"train_loss": -22.834775924682617, "global_step": 119833, "epoch": 1443} {"train_loss": -22.38557243347168, "global_step": 119834, "epoch": 1443} {"train_loss": -22.439453125, "global_step": 119835, "epoch": 1443} {"train_loss": -22.59869956970215, "global_step": 119836, "epoch": 1443} {"train_loss": -22.369802474975586, "global_step": 119837, "epoch": 1443} {"train_loss": -22.16016387939453, "global_step": 119838, "epoch": 1443} {"train_loss": -22.21172523498535, "global_step": 119839, "epoch": 1443} {"train_loss": -22.682161331176758, "global_step": 119840, "epoch": 1443} {"train_loss": -22.471725463867188, "global_step": 119841, "epoch": 1443} {"train_loss": -22.524045944213867, "global_step": 119842, "epoch": 1443} {"train_loss": -22.16817283630371, "global_step": 119843, "epoch": 1443} {"train_loss": -22.663780212402344, "global_step": 119844, "epoch": 1443} {"train_loss": -22.58913230895996, "global_step": 119845, "epoch": 1443} {"train_loss": -22.444807052612305, "global_step": 119846, "epoch": 1443} {"train_loss": -22.66423988342285, "global_step": 119847, "epoch": 1443} {"train_loss": -22.354711532592773, "global_step": 119848, "epoch": 1443} {"train_loss": -22.857458114624023, "global_step": 119849, "epoch": 1443} {"train_loss": -22.485797882080078, "global_step": 119850, "epoch": 1443} {"train_loss": -22.423501416861292, "global_step": 119851, "epoch": 1443, "val_loss": 6179102.0} {"train_loss": -22.1972599029541, "global_step": 119852, "epoch": 1444} {"train_loss": -22.194826126098633, "global_step": 119853, "epoch": 1444} {"train_loss": -22.708271026611328, "global_step": 119854, "epoch": 1444} {"train_loss": -21.996305465698242, "global_step": 119855, "epoch": 1444} {"train_loss": -22.446548461914062, "global_step": 119856, "epoch": 1444} {"train_loss": -21.942977905273438, "global_step": 119857, "epoch": 1444} {"train_loss": -22.33270263671875, "global_step": 119858, "epoch": 1444} {"train_loss": -22.664716720581055, "global_step": 119859, "epoch": 1444} {"train_loss": -22.365049362182617, "global_step": 119860, "epoch": 1444} {"train_loss": -22.123809814453125, "global_step": 119861, "epoch": 1444} {"train_loss": -22.325176239013672, "global_step": 119862, "epoch": 1444} {"train_loss": -22.39944839477539, "global_step": 119863, "epoch": 1444} {"train_loss": -22.525197982788086, "global_step": 119864, "epoch": 1444} {"train_loss": -22.620620727539062, "global_step": 119865, "epoch": 1444} {"train_loss": -22.31397819519043, "global_step": 119866, "epoch": 1444} {"train_loss": -22.48036766052246, "global_step": 119867, "epoch": 1444} {"train_loss": -22.24666976928711, "global_step": 119868, "epoch": 1444} {"train_loss": -22.467269897460938, "global_step": 119869, "epoch": 1444} {"train_loss": -22.405405044555664, "global_step": 119870, "epoch": 1444} {"train_loss": -22.78260612487793, "global_step": 119871, "epoch": 1444} {"train_loss": -22.26930809020996, "global_step": 119872, "epoch": 1444} {"train_loss": -22.374954223632812, "global_step": 119873, "epoch": 1444} {"train_loss": -22.68427085876465, "global_step": 119874, "epoch": 1444} {"train_loss": -22.404565811157227, "global_step": 119875, "epoch": 1444} {"train_loss": -22.758581161499023, "global_step": 119876, "epoch": 1444} {"train_loss": -22.541851043701172, "global_step": 119877, "epoch": 1444} {"train_loss": -22.303525924682617, "global_step": 119878, "epoch": 1444} {"train_loss": -22.699996948242188, "global_step": 119879, "epoch": 1444} {"train_loss": -22.253278732299805, "global_step": 119880, "epoch": 1444} {"train_loss": -22.53647232055664, "global_step": 119881, "epoch": 1444} {"train_loss": -22.619205474853516, "global_step": 119882, "epoch": 1444} {"train_loss": -22.28807830810547, "global_step": 119883, "epoch": 1444} {"train_loss": -22.72787094116211, "global_step": 119884, "epoch": 1444} {"train_loss": -22.928176879882812, "global_step": 119885, "epoch": 1444} {"train_loss": -22.578195571899414, "global_step": 119886, "epoch": 1444} {"train_loss": -22.755666732788086, "global_step": 119887, "epoch": 1444} {"train_loss": -22.76517105102539, "global_step": 119888, "epoch": 1444} {"train_loss": -22.404563903808594, "global_step": 119889, "epoch": 1444} {"train_loss": -22.430971145629883, "global_step": 119890, "epoch": 1444} {"train_loss": -22.406997680664062, "global_step": 119891, "epoch": 1444} {"train_loss": -22.451244354248047, "global_step": 119892, "epoch": 1444} {"train_loss": -22.59283447265625, "global_step": 119893, "epoch": 1444} {"train_loss": -22.331520080566406, "global_step": 119894, "epoch": 1444} {"train_loss": -22.232318878173828, "global_step": 119895, "epoch": 1444} {"train_loss": -22.84217643737793, "global_step": 119896, "epoch": 1444} {"train_loss": -22.348905563354492, "global_step": 119897, "epoch": 1444} {"train_loss": -22.779369354248047, "global_step": 119898, "epoch": 1444} {"train_loss": -23.006175994873047, "global_step": 119899, "epoch": 1444} {"train_loss": -22.46535301208496, "global_step": 119900, "epoch": 1444} {"train_loss": -22.690452575683594, "global_step": 119901, "epoch": 1444} {"train_loss": -22.659788131713867, "global_step": 119902, "epoch": 1444} {"train_loss": -22.592918395996094, "global_step": 119903, "epoch": 1444} {"train_loss": -22.439794540405273, "global_step": 119904, "epoch": 1444} {"train_loss": -22.574344635009766, "global_step": 119905, "epoch": 1444} {"train_loss": -22.473468780517578, "global_step": 119906, "epoch": 1444} {"train_loss": -22.66697120666504, "global_step": 119907, "epoch": 1444} {"train_loss": -23.132705688476562, "global_step": 119908, "epoch": 1444} {"train_loss": -22.665821075439453, "global_step": 119909, "epoch": 1444} {"train_loss": -22.64328384399414, "global_step": 119910, "epoch": 1444} {"train_loss": -22.256328582763672, "global_step": 119911, "epoch": 1444} {"train_loss": -22.28580093383789, "global_step": 119912, "epoch": 1444} {"train_loss": -22.64139175415039, "global_step": 119913, "epoch": 1444} {"train_loss": -22.560190200805664, "global_step": 119914, "epoch": 1444} {"train_loss": -22.52410125732422, "global_step": 119915, "epoch": 1444} {"train_loss": -22.66572380065918, "global_step": 119916, "epoch": 1444} {"train_loss": -22.48331069946289, "global_step": 119917, "epoch": 1444} {"train_loss": -22.365079879760742, "global_step": 119918, "epoch": 1444} {"train_loss": -22.65921974182129, "global_step": 119919, "epoch": 1444} {"train_loss": -22.479326248168945, "global_step": 119920, "epoch": 1444} {"train_loss": -21.94154930114746, "global_step": 119921, "epoch": 1444} {"train_loss": -22.25740623474121, "global_step": 119922, "epoch": 1444} {"train_loss": -22.660400390625, "global_step": 119923, "epoch": 1444} {"train_loss": -22.487485885620117, "global_step": 119924, "epoch": 1444} {"train_loss": -22.87278175354004, "global_step": 119925, "epoch": 1444} {"train_loss": -22.472328186035156, "global_step": 119926, "epoch": 1444} {"train_loss": -22.515342712402344, "global_step": 119927, "epoch": 1444} {"train_loss": -22.555517196655273, "global_step": 119928, "epoch": 1444} {"train_loss": -22.544076919555664, "global_step": 119929, "epoch": 1444} {"train_loss": -22.62933349609375, "global_step": 119930, "epoch": 1444} {"train_loss": -22.838802337646484, "global_step": 119931, "epoch": 1444} {"train_loss": -22.363187789916992, "global_step": 119932, "epoch": 1444} {"train_loss": -22.66495704650879, "global_step": 119933, "epoch": 1444} {"train_loss": -22.514100247118847, "global_step": 119934, "epoch": 1444, "val_loss": 6165680.0} {"train_loss": -22.267873764038086, "global_step": 119935, "epoch": 1445} {"train_loss": -22.18773078918457, "global_step": 119936, "epoch": 1445} {"train_loss": -22.415433883666992, "global_step": 119937, "epoch": 1445} {"train_loss": -22.196382522583008, "global_step": 119938, "epoch": 1445} {"train_loss": -22.337371826171875, "global_step": 119939, "epoch": 1445} {"train_loss": -22.067520141601562, "global_step": 119940, "epoch": 1445} {"train_loss": -22.482254028320312, "global_step": 119941, "epoch": 1445} {"train_loss": -22.237071990966797, "global_step": 119942, "epoch": 1445} {"train_loss": -22.52546501159668, "global_step": 119943, "epoch": 1445} {"train_loss": -22.42666244506836, "global_step": 119944, "epoch": 1445} {"train_loss": -22.550125122070312, "global_step": 119945, "epoch": 1445} {"train_loss": -22.34598159790039, "global_step": 119946, "epoch": 1445} {"train_loss": -22.362390518188477, "global_step": 119947, "epoch": 1445} {"train_loss": -22.694849014282227, "global_step": 119948, "epoch": 1445} {"train_loss": -22.211231231689453, "global_step": 119949, "epoch": 1445} {"train_loss": -22.2032413482666, "global_step": 119950, "epoch": 1445} {"train_loss": -22.59712791442871, "global_step": 119951, "epoch": 1445} {"train_loss": -22.67494010925293, "global_step": 119952, "epoch": 1445} {"train_loss": -22.469457626342773, "global_step": 119953, "epoch": 1445} {"train_loss": -22.361448287963867, "global_step": 119954, "epoch": 1445} {"train_loss": -22.1673641204834, "global_step": 119955, "epoch": 1445} {"train_loss": -22.62314796447754, "global_step": 119956, "epoch": 1445} {"train_loss": -22.103219985961914, "global_step": 119957, "epoch": 1445} {"train_loss": -22.111900329589844, "global_step": 119958, "epoch": 1445} {"train_loss": -22.281225204467773, "global_step": 119959, "epoch": 1445} {"train_loss": -22.486942291259766, "global_step": 119960, "epoch": 1445} {"train_loss": -22.442123413085938, "global_step": 119961, "epoch": 1445} {"train_loss": -22.410701751708984, "global_step": 119962, "epoch": 1445} {"train_loss": -22.326934814453125, "global_step": 119963, "epoch": 1445} {"train_loss": -22.725866317749023, "global_step": 119964, "epoch": 1445} {"train_loss": -22.24420738220215, "global_step": 119965, "epoch": 1445} {"train_loss": -22.676864624023438, "global_step": 119966, "epoch": 1445} {"train_loss": -22.445432662963867, "global_step": 119967, "epoch": 1445} {"train_loss": -22.475753784179688, "global_step": 119968, "epoch": 1445} {"train_loss": -22.492511749267578, "global_step": 119969, "epoch": 1445} {"train_loss": -22.240385055541992, "global_step": 119970, "epoch": 1445} {"train_loss": -22.13307762145996, "global_step": 119971, "epoch": 1445} {"train_loss": -22.25992202758789, "global_step": 119972, "epoch": 1445} {"train_loss": -22.744722366333008, "global_step": 119973, "epoch": 1445} {"train_loss": -22.7806453704834, "global_step": 119974, "epoch": 1445} {"train_loss": -22.571699142456055, "global_step": 119975, "epoch": 1445} {"train_loss": -22.61655044555664, "global_step": 119976, "epoch": 1445} {"train_loss": -22.368846893310547, "global_step": 119977, "epoch": 1445} {"train_loss": -22.500431060791016, "global_step": 119978, "epoch": 1445} {"train_loss": -22.728620529174805, "global_step": 119979, "epoch": 1445} {"train_loss": -22.497220993041992, "global_step": 119980, "epoch": 1445} {"train_loss": -22.833459854125977, "global_step": 119981, "epoch": 1445} {"train_loss": -22.8236083984375, "global_step": 119982, "epoch": 1445} {"train_loss": -22.69561195373535, "global_step": 119983, "epoch": 1445} {"train_loss": -22.352298736572266, "global_step": 119984, "epoch": 1445} {"train_loss": -22.579458236694336, "global_step": 119985, "epoch": 1445} {"train_loss": -22.505475997924805, "global_step": 119986, "epoch": 1445} {"train_loss": -22.712553024291992, "global_step": 119987, "epoch": 1445} {"train_loss": -22.60638999938965, "global_step": 119988, "epoch": 1445} {"train_loss": -22.824949264526367, "global_step": 119989, "epoch": 1445} {"train_loss": -22.649280548095703, "global_step": 119990, "epoch": 1445} {"train_loss": -22.478513717651367, "global_step": 119991, "epoch": 1445} {"train_loss": -22.540807723999023, "global_step": 119992, "epoch": 1445} {"train_loss": -22.747976303100586, "global_step": 119993, "epoch": 1445} {"train_loss": -22.373926162719727, "global_step": 119994, "epoch": 1445} {"train_loss": -22.42386245727539, "global_step": 119995, "epoch": 1445} {"train_loss": -22.750547409057617, "global_step": 119996, "epoch": 1445} {"train_loss": -22.53005027770996, "global_step": 119997, "epoch": 1445} {"train_loss": -22.546056747436523, "global_step": 119998, "epoch": 1445} {"train_loss": -22.45351219177246, "global_step": 119999, "epoch": 1445} {"train_loss": -22.721540451049805, "global_step": 120000, "epoch": 1445} {"train_loss": -22.709760665893555, "global_step": 120001, "epoch": 1445} {"train_loss": -22.823898315429688, "global_step": 120002, "epoch": 1445} {"train_loss": -22.457828521728516, "global_step": 120003, "epoch": 1445} {"train_loss": -22.823942184448242, "global_step": 120004, "epoch": 1445} {"train_loss": -22.502368927001953, "global_step": 120005, "epoch": 1445} {"train_loss": -22.505643844604492, "global_step": 120006, "epoch": 1445} {"train_loss": -22.47835350036621, "global_step": 120007, "epoch": 1445} {"train_loss": -22.69097900390625, "global_step": 120008, "epoch": 1445} {"train_loss": -22.702177047729492, "global_step": 120009, "epoch": 1445} {"train_loss": -22.661527633666992, "global_step": 120010, "epoch": 1445} {"train_loss": -22.500364303588867, "global_step": 120011, "epoch": 1445} {"train_loss": -22.62847900390625, "global_step": 120012, "epoch": 1445} {"train_loss": -22.487112045288086, "global_step": 120013, "epoch": 1445} {"train_loss": -22.45306396484375, "global_step": 120014, "epoch": 1445} {"train_loss": -22.624414443969727, "global_step": 120015, "epoch": 1445} {"train_loss": -22.823009490966797, "global_step": 120016, "epoch": 1445} {"train_loss": -22.493700969650085, "global_step": 120017, "epoch": 1445, "val_loss": 6165229.5} {"train_loss": -22.1854305267334, "global_step": 120018, "epoch": 1446} {"train_loss": -22.17494010925293, "global_step": 120019, "epoch": 1446} {"train_loss": -22.713653564453125, "global_step": 120020, "epoch": 1446} {"train_loss": -21.909154891967773, "global_step": 120021, "epoch": 1446} {"train_loss": -22.381067276000977, "global_step": 120022, "epoch": 1446} {"train_loss": -22.261287689208984, "global_step": 120023, "epoch": 1446} {"train_loss": -22.206968307495117, "global_step": 120024, "epoch": 1446} {"train_loss": -22.62104606628418, "global_step": 120025, "epoch": 1446} {"train_loss": -22.775461196899414, "global_step": 120026, "epoch": 1446} {"train_loss": -22.296621322631836, "global_step": 120027, "epoch": 1446} {"train_loss": -22.326597213745117, "global_step": 120028, "epoch": 1446} {"train_loss": -22.14045524597168, "global_step": 120029, "epoch": 1446} {"train_loss": -22.539764404296875, "global_step": 120030, "epoch": 1446} {"train_loss": -22.252538681030273, "global_step": 120031, "epoch": 1446} {"train_loss": -22.421131134033203, "global_step": 120032, "epoch": 1446} {"train_loss": -22.432554244995117, "global_step": 120033, "epoch": 1446} {"train_loss": -22.342432022094727, "global_step": 120034, "epoch": 1446} {"train_loss": -22.461708068847656, "global_step": 120035, "epoch": 1446} {"train_loss": -22.457168579101562, "global_step": 120036, "epoch": 1446} {"train_loss": -22.348203659057617, "global_step": 120037, "epoch": 1446} {"train_loss": -22.176115036010742, "global_step": 120038, "epoch": 1446} {"train_loss": -22.78860092163086, "global_step": 120039, "epoch": 1446} {"train_loss": -22.44339370727539, "global_step": 120040, "epoch": 1446} {"train_loss": -22.30890655517578, "global_step": 120041, "epoch": 1446} {"train_loss": -22.275426864624023, "global_step": 120042, "epoch": 1446} {"train_loss": -22.5635986328125, "global_step": 120043, "epoch": 1446} {"train_loss": -22.65565299987793, "global_step": 120044, "epoch": 1446} {"train_loss": -21.991960525512695, "global_step": 120045, "epoch": 1446} {"train_loss": -22.530649185180664, "global_step": 120046, "epoch": 1446} {"train_loss": -22.371891021728516, "global_step": 120047, "epoch": 1446} {"train_loss": -22.1680850982666, "global_step": 120048, "epoch": 1446} {"train_loss": -22.14691734313965, "global_step": 120049, "epoch": 1446} {"train_loss": -22.569456100463867, "global_step": 120050, "epoch": 1446} {"train_loss": -22.515607833862305, "global_step": 120051, "epoch": 1446} {"train_loss": -22.497411727905273, "global_step": 120052, "epoch": 1446} {"train_loss": -22.41505241394043, "global_step": 120053, "epoch": 1446} {"train_loss": -22.794965744018555, "global_step": 120054, "epoch": 1446} {"train_loss": -22.649991989135742, "global_step": 120055, "epoch": 1446} {"train_loss": -22.681304931640625, "global_step": 120056, "epoch": 1446} {"train_loss": -22.561609268188477, "global_step": 120057, "epoch": 1446} {"train_loss": -22.285202026367188, "global_step": 120058, "epoch": 1446} {"train_loss": -22.59379005432129, "global_step": 120059, "epoch": 1446} {"train_loss": -22.367338180541992, "global_step": 120060, "epoch": 1446} {"train_loss": -22.3651123046875, "global_step": 120061, "epoch": 1446} {"train_loss": -22.658021926879883, "global_step": 120062, "epoch": 1446} {"train_loss": -22.364959716796875, "global_step": 120063, "epoch": 1446} {"train_loss": -22.70745086669922, "global_step": 120064, "epoch": 1446} {"train_loss": -22.7896728515625, "global_step": 120065, "epoch": 1446} {"train_loss": -22.4445858001709, "global_step": 120066, "epoch": 1446} {"train_loss": -22.503231048583984, "global_step": 120067, "epoch": 1446} {"train_loss": -22.33222770690918, "global_step": 120068, "epoch": 1446} {"train_loss": -22.632986068725586, "global_step": 120069, "epoch": 1446} {"train_loss": -22.676572799682617, "global_step": 120070, "epoch": 1446} {"train_loss": -22.767271041870117, "global_step": 120071, "epoch": 1446} {"train_loss": -22.779830932617188, "global_step": 120072, "epoch": 1446} {"train_loss": -22.300769805908203, "global_step": 120073, "epoch": 1446} {"train_loss": -22.478456497192383, "global_step": 120074, "epoch": 1446} {"train_loss": -22.560726165771484, "global_step": 120075, "epoch": 1446} {"train_loss": -22.51361656188965, "global_step": 120076, "epoch": 1446} {"train_loss": -22.380651473999023, "global_step": 120077, "epoch": 1446} {"train_loss": -22.720441818237305, "global_step": 120078, "epoch": 1446} {"train_loss": -22.66413688659668, "global_step": 120079, "epoch": 1446} {"train_loss": -22.683164596557617, "global_step": 120080, "epoch": 1446} {"train_loss": -22.78082847595215, "global_step": 120081, "epoch": 1446} {"train_loss": -22.34322166442871, "global_step": 120082, "epoch": 1446} {"train_loss": -22.325546264648438, "global_step": 120083, "epoch": 1446} {"train_loss": -22.568578720092773, "global_step": 120084, "epoch": 1446} {"train_loss": -22.657880783081055, "global_step": 120085, "epoch": 1446} {"train_loss": -22.2147159576416, "global_step": 120086, "epoch": 1446} {"train_loss": -22.563617706298828, "global_step": 120087, "epoch": 1446} {"train_loss": -22.45186424255371, "global_step": 120088, "epoch": 1446} {"train_loss": -22.2593994140625, "global_step": 120089, "epoch": 1446} {"train_loss": -22.44191551208496, "global_step": 120090, "epoch": 1446} {"train_loss": -22.389005661010742, "global_step": 120091, "epoch": 1446} {"train_loss": -22.56545066833496, "global_step": 120092, "epoch": 1446} {"train_loss": -22.550464630126953, "global_step": 120093, "epoch": 1446} {"train_loss": -22.57992172241211, "global_step": 120094, "epoch": 1446} {"train_loss": -22.403409957885742, "global_step": 120095, "epoch": 1446} {"train_loss": -22.423437118530273, "global_step": 120096, "epoch": 1446} {"train_loss": -22.54732322692871, "global_step": 120097, "epoch": 1446} {"train_loss": -22.64743423461914, "global_step": 120098, "epoch": 1446} {"train_loss": -22.87692642211914, "global_step": 120099, "epoch": 1446} {"train_loss": -22.4813020315515, "global_step": 120100, "epoch": 1446, "val_loss": 6200401.0} {"train_loss": -22.459157943725586, "global_step": 120101, "epoch": 1447} {"train_loss": -22.270414352416992, "global_step": 120102, "epoch": 1447} {"train_loss": -22.338062286376953, "global_step": 120103, "epoch": 1447} {"train_loss": -22.347368240356445, "global_step": 120104, "epoch": 1447} {"train_loss": -21.92440414428711, "global_step": 120105, "epoch": 1447} {"train_loss": -22.51263427734375, "global_step": 120106, "epoch": 1447} {"train_loss": -22.691476821899414, "global_step": 120107, "epoch": 1447} {"train_loss": -22.089448928833008, "global_step": 120108, "epoch": 1447} {"train_loss": -22.559585571289062, "global_step": 120109, "epoch": 1447} {"train_loss": -22.541301727294922, "global_step": 120110, "epoch": 1447} {"train_loss": -22.514209747314453, "global_step": 120111, "epoch": 1447} {"train_loss": -22.473602294921875, "global_step": 120112, "epoch": 1447} {"train_loss": -22.388671875, "global_step": 120113, "epoch": 1447} {"train_loss": -22.338544845581055, "global_step": 120114, "epoch": 1447} {"train_loss": -22.212682723999023, "global_step": 120115, "epoch": 1447} {"train_loss": -22.340499877929688, "global_step": 120116, "epoch": 1447} {"train_loss": -22.020902633666992, "global_step": 120117, "epoch": 1447} {"train_loss": -22.92466163635254, "global_step": 120118, "epoch": 1447} {"train_loss": -22.5860538482666, "global_step": 120119, "epoch": 1447} {"train_loss": -22.63934326171875, "global_step": 120120, "epoch": 1447} {"train_loss": -22.54159164428711, "global_step": 120121, "epoch": 1447} {"train_loss": -22.511117935180664, "global_step": 120122, "epoch": 1447} {"train_loss": -22.29477310180664, "global_step": 120123, "epoch": 1447} {"train_loss": -22.73701286315918, "global_step": 120124, "epoch": 1447} {"train_loss": -22.37082290649414, "global_step": 120125, "epoch": 1447} {"train_loss": -22.461496353149414, "global_step": 120126, "epoch": 1447} {"train_loss": -22.484420776367188, "global_step": 120127, "epoch": 1447} {"train_loss": -22.956098556518555, "global_step": 120128, "epoch": 1447} {"train_loss": -22.65585708618164, "global_step": 120129, "epoch": 1447} {"train_loss": -22.60127067565918, "global_step": 120130, "epoch": 1447} {"train_loss": -22.48995018005371, "global_step": 120131, "epoch": 1447} {"train_loss": -22.87235450744629, "global_step": 120132, "epoch": 1447} {"train_loss": -22.741954803466797, "global_step": 120133, "epoch": 1447} {"train_loss": -22.788915634155273, "global_step": 120134, "epoch": 1447} {"train_loss": -22.658084869384766, "global_step": 120135, "epoch": 1447} {"train_loss": -22.440710067749023, "global_step": 120136, "epoch": 1447} {"train_loss": -22.5417423248291, "global_step": 120137, "epoch": 1447} {"train_loss": -22.571260452270508, "global_step": 120138, "epoch": 1447} {"train_loss": -22.560609817504883, "global_step": 120139, "epoch": 1447} {"train_loss": -22.557254791259766, "global_step": 120140, "epoch": 1447} {"train_loss": -22.405664443969727, "global_step": 120141, "epoch": 1447} {"train_loss": -22.3482723236084, "global_step": 120142, "epoch": 1447} {"train_loss": -22.45376968383789, "global_step": 120143, "epoch": 1447} {"train_loss": -22.73748207092285, "global_step": 120144, "epoch": 1447} {"train_loss": -22.454885482788086, "global_step": 120145, "epoch": 1447} {"train_loss": -22.679101943969727, "global_step": 120146, "epoch": 1447} {"train_loss": -22.738265991210938, "global_step": 120147, "epoch": 1447} {"train_loss": -22.31638526916504, "global_step": 120148, "epoch": 1447} {"train_loss": -22.687406539916992, "global_step": 120149, "epoch": 1447} {"train_loss": -22.504993438720703, "global_step": 120150, "epoch": 1447} {"train_loss": -22.303579330444336, "global_step": 120151, "epoch": 1447} {"train_loss": -22.72835922241211, "global_step": 120152, "epoch": 1447} {"train_loss": -22.520572662353516, "global_step": 120153, "epoch": 1447} {"train_loss": -22.262800216674805, "global_step": 120154, "epoch": 1447} {"train_loss": -22.454608917236328, "global_step": 120155, "epoch": 1447} {"train_loss": -22.241195678710938, "global_step": 120156, "epoch": 1447} {"train_loss": -22.206073760986328, "global_step": 120157, "epoch": 1447} {"train_loss": -22.567142486572266, "global_step": 120158, "epoch": 1447} {"train_loss": -22.221303939819336, "global_step": 120159, "epoch": 1447} {"train_loss": -22.32900047302246, "global_step": 120160, "epoch": 1447} {"train_loss": -22.64991569519043, "global_step": 120161, "epoch": 1447} {"train_loss": -22.761762619018555, "global_step": 120162, "epoch": 1447} {"train_loss": -22.97835922241211, "global_step": 120163, "epoch": 1447} {"train_loss": -22.52520179748535, "global_step": 120164, "epoch": 1447} {"train_loss": -22.793214797973633, "global_step": 120165, "epoch": 1447} {"train_loss": -22.580219268798828, "global_step": 120166, "epoch": 1447} {"train_loss": -22.851511001586914, "global_step": 120167, "epoch": 1447} {"train_loss": -22.411563873291016, "global_step": 120168, "epoch": 1447} {"train_loss": -22.799060821533203, "global_step": 120169, "epoch": 1447} {"train_loss": -22.13863182067871, "global_step": 120170, "epoch": 1447} {"train_loss": -22.681232452392578, "global_step": 120171, "epoch": 1447} {"train_loss": -22.47642707824707, "global_step": 120172, "epoch": 1447} {"train_loss": -22.508258819580078, "global_step": 120173, "epoch": 1447} {"train_loss": -22.547603607177734, "global_step": 120174, "epoch": 1447} {"train_loss": -22.673847198486328, "global_step": 120175, "epoch": 1447} {"train_loss": -22.77521324157715, "global_step": 120176, "epoch": 1447} {"train_loss": -22.489147186279297, "global_step": 120177, "epoch": 1447} {"train_loss": -22.722328186035156, "global_step": 120178, "epoch": 1447} {"train_loss": -22.66120719909668, "global_step": 120179, "epoch": 1447} {"train_loss": -22.88726806640625, "global_step": 120180, "epoch": 1447} {"train_loss": -22.85677719116211, "global_step": 120181, "epoch": 1447} {"train_loss": -22.310205459594727, "global_step": 120182, "epoch": 1447} {"train_loss": -22.525668707238623, "global_step": 120183, "epoch": 1447, "val_loss": 6328053.0} {"train_loss": -20.687328338623047, "global_step": 120184, "epoch": 1448} {"train_loss": -21.706329345703125, "global_step": 120185, "epoch": 1448} {"train_loss": -21.634872436523438, "global_step": 120186, "epoch": 1448} {"train_loss": -21.3833065032959, "global_step": 120187, "epoch": 1448} {"train_loss": -22.095691680908203, "global_step": 120188, "epoch": 1448} {"train_loss": -21.411376953125, "global_step": 120189, "epoch": 1448} {"train_loss": -21.91778564453125, "global_step": 120190, "epoch": 1448} {"train_loss": -21.557701110839844, "global_step": 120191, "epoch": 1448} {"train_loss": -21.95073699951172, "global_step": 120192, "epoch": 1448} {"train_loss": -21.98744773864746, "global_step": 120193, "epoch": 1448} {"train_loss": -22.239059448242188, "global_step": 120194, "epoch": 1448} {"train_loss": -21.712718963623047, "global_step": 120195, "epoch": 1448} {"train_loss": -22.471250534057617, "global_step": 120196, "epoch": 1448} {"train_loss": -21.919862747192383, "global_step": 120197, "epoch": 1448} {"train_loss": -22.260461807250977, "global_step": 120198, "epoch": 1448} {"train_loss": -21.985828399658203, "global_step": 120199, "epoch": 1448} {"train_loss": -22.147083282470703, "global_step": 120200, "epoch": 1448} {"train_loss": -21.79701805114746, "global_step": 120201, "epoch": 1448} {"train_loss": -22.438858032226562, "global_step": 120202, "epoch": 1448} {"train_loss": -22.111557006835938, "global_step": 120203, "epoch": 1448} {"train_loss": -22.265804290771484, "global_step": 120204, "epoch": 1448} {"train_loss": -22.365209579467773, "global_step": 120205, "epoch": 1448} {"train_loss": -22.836807250976562, "global_step": 120206, "epoch": 1448} {"train_loss": -21.687559127807617, "global_step": 120207, "epoch": 1448} {"train_loss": -22.64210319519043, "global_step": 120208, "epoch": 1448} {"train_loss": -22.411813735961914, "global_step": 120209, "epoch": 1448} {"train_loss": -22.300325393676758, "global_step": 120210, "epoch": 1448} {"train_loss": -22.227664947509766, "global_step": 120211, "epoch": 1448} {"train_loss": -22.040327072143555, "global_step": 120212, "epoch": 1448} {"train_loss": -22.382915496826172, "global_step": 120213, "epoch": 1448} {"train_loss": -22.38852882385254, "global_step": 120214, "epoch": 1448} {"train_loss": -22.21524429321289, "global_step": 120215, "epoch": 1448} {"train_loss": -22.635358810424805, "global_step": 120216, "epoch": 1448} {"train_loss": -22.32630729675293, "global_step": 120217, "epoch": 1448} {"train_loss": -22.360258102416992, "global_step": 120218, "epoch": 1448} {"train_loss": -22.445783615112305, "global_step": 120219, "epoch": 1448} {"train_loss": -22.745773315429688, "global_step": 120220, "epoch": 1448} {"train_loss": -22.74691390991211, "global_step": 120221, "epoch": 1448} {"train_loss": -22.42781639099121, "global_step": 120222, "epoch": 1448} {"train_loss": -22.5523681640625, "global_step": 120223, "epoch": 1448} {"train_loss": -22.64471435546875, "global_step": 120224, "epoch": 1448} {"train_loss": -22.928930282592773, "global_step": 120225, "epoch": 1448} {"train_loss": -22.421995162963867, "global_step": 120226, "epoch": 1448} {"train_loss": -22.67682456970215, "global_step": 120227, "epoch": 1448} {"train_loss": -22.508359909057617, "global_step": 120228, "epoch": 1448} {"train_loss": -22.720853805541992, "global_step": 120229, "epoch": 1448} {"train_loss": -22.42555809020996, "global_step": 120230, "epoch": 1448} {"train_loss": -23.00385856628418, "global_step": 120231, "epoch": 1448} {"train_loss": -22.731616973876953, "global_step": 120232, "epoch": 1448} {"train_loss": -22.855966567993164, "global_step": 120233, "epoch": 1448} {"train_loss": -22.73641014099121, "global_step": 120234, "epoch": 1448} {"train_loss": -22.663171768188477, "global_step": 120235, "epoch": 1448} {"train_loss": -22.459402084350586, "global_step": 120236, "epoch": 1448} {"train_loss": -22.37906837463379, "global_step": 120237, "epoch": 1448} {"train_loss": -22.606107711791992, "global_step": 120238, "epoch": 1448} {"train_loss": -22.6584529876709, "global_step": 120239, "epoch": 1448} {"train_loss": -22.903749465942383, "global_step": 120240, "epoch": 1448} {"train_loss": -22.217422485351562, "global_step": 120241, "epoch": 1448} {"train_loss": -22.48038101196289, "global_step": 120242, "epoch": 1448} {"train_loss": -22.776487350463867, "global_step": 120243, "epoch": 1448} {"train_loss": -22.72595977783203, "global_step": 120244, "epoch": 1448} {"train_loss": -22.636463165283203, "global_step": 120245, "epoch": 1448} {"train_loss": -22.517230987548828, "global_step": 120246, "epoch": 1448} {"train_loss": -22.9921932220459, "global_step": 120247, "epoch": 1448} {"train_loss": -22.508943557739258, "global_step": 120248, "epoch": 1448} {"train_loss": -22.4007511138916, "global_step": 120249, "epoch": 1448} {"train_loss": -22.494287490844727, "global_step": 120250, "epoch": 1448} {"train_loss": -22.612577438354492, "global_step": 120251, "epoch": 1448} {"train_loss": -22.628646850585938, "global_step": 120252, "epoch": 1448} {"train_loss": -22.555776596069336, "global_step": 120253, "epoch": 1448} {"train_loss": -22.856840133666992, "global_step": 120254, "epoch": 1448} {"train_loss": -22.818519592285156, "global_step": 120255, "epoch": 1448} {"train_loss": -22.855558395385742, "global_step": 120256, "epoch": 1448} {"train_loss": -22.71262550354004, "global_step": 120257, "epoch": 1448} {"train_loss": -22.648710250854492, "global_step": 120258, "epoch": 1448} {"train_loss": -22.580108642578125, "global_step": 120259, "epoch": 1448} {"train_loss": -22.978322982788086, "global_step": 120260, "epoch": 1448} {"train_loss": -22.438852310180664, "global_step": 120261, "epoch": 1448} {"train_loss": -22.614953994750977, "global_step": 120262, "epoch": 1448} {"train_loss": -22.74394416809082, "global_step": 120263, "epoch": 1448} {"train_loss": -22.71755027770996, "global_step": 120264, "epoch": 1448} {"train_loss": -22.562009811401367, "global_step": 120265, "epoch": 1448} {"train_loss": -22.392554478472974, "global_step": 120266, "epoch": 1448, "val_loss": 6345239.5} {"train_loss": -22.6032772064209, "global_step": 120267, "epoch": 1449} {"train_loss": -22.0626220703125, "global_step": 120268, "epoch": 1449} {"train_loss": -22.463863372802734, "global_step": 120269, "epoch": 1449} {"train_loss": -22.520950317382812, "global_step": 120270, "epoch": 1449} {"train_loss": -22.55311393737793, "global_step": 120271, "epoch": 1449} {"train_loss": -22.6921329498291, "global_step": 120272, "epoch": 1449} {"train_loss": -22.40852928161621, "global_step": 120273, "epoch": 1449} {"train_loss": -22.211950302124023, "global_step": 120274, "epoch": 1449} {"train_loss": -22.054370880126953, "global_step": 120275, "epoch": 1449} {"train_loss": -22.60346221923828, "global_step": 120276, "epoch": 1449} {"train_loss": -22.8446102142334, "global_step": 120277, "epoch": 1449} {"train_loss": -22.43048667907715, "global_step": 120278, "epoch": 1449} {"train_loss": -22.43244171142578, "global_step": 120279, "epoch": 1449} {"train_loss": -22.51055908203125, "global_step": 120280, "epoch": 1449} {"train_loss": -22.66748046875, "global_step": 120281, "epoch": 1449} {"train_loss": -22.497182846069336, "global_step": 120282, "epoch": 1449} {"train_loss": -22.685779571533203, "global_step": 120283, "epoch": 1449} {"train_loss": -22.733007431030273, "global_step": 120284, "epoch": 1449} {"train_loss": -22.368000030517578, "global_step": 120285, "epoch": 1449} {"train_loss": -22.50105857849121, "global_step": 120286, "epoch": 1449} {"train_loss": -22.399492263793945, "global_step": 120287, "epoch": 1449} {"train_loss": -22.301843643188477, "global_step": 120288, "epoch": 1449} {"train_loss": -22.41048240661621, "global_step": 120289, "epoch": 1449} {"train_loss": -22.29781150817871, "global_step": 120290, "epoch": 1449} {"train_loss": -22.42570686340332, "global_step": 120291, "epoch": 1449} {"train_loss": -22.077604293823242, "global_step": 120292, "epoch": 1449} {"train_loss": -22.00528335571289, "global_step": 120293, "epoch": 1449} {"train_loss": -22.951478958129883, "global_step": 120294, "epoch": 1449} {"train_loss": -22.515188217163086, "global_step": 120295, "epoch": 1449} {"train_loss": -22.49616241455078, "global_step": 120296, "epoch": 1449} {"train_loss": -22.41886329650879, "global_step": 120297, "epoch": 1449} {"train_loss": -22.416486740112305, "global_step": 120298, "epoch": 1449} {"train_loss": -22.378469467163086, "global_step": 120299, "epoch": 1449} {"train_loss": -22.357114791870117, "global_step": 120300, "epoch": 1449} {"train_loss": -22.84657859802246, "global_step": 120301, "epoch": 1449} {"train_loss": -22.531864166259766, "global_step": 120302, "epoch": 1449} {"train_loss": -22.671934127807617, "global_step": 120303, "epoch": 1449} {"train_loss": -22.2996768951416, "global_step": 120304, "epoch": 1449} {"train_loss": -22.638290405273438, "global_step": 120305, "epoch": 1449} {"train_loss": -22.590784072875977, "global_step": 120306, "epoch": 1449} {"train_loss": -22.672462463378906, "global_step": 120307, "epoch": 1449} {"train_loss": -22.480871200561523, "global_step": 120308, "epoch": 1449} {"train_loss": -22.572315216064453, "global_step": 120309, "epoch": 1449} {"train_loss": -22.616392135620117, "global_step": 120310, "epoch": 1449} {"train_loss": -22.67275047302246, "global_step": 120311, "epoch": 1449} {"train_loss": -22.420541763305664, "global_step": 120312, "epoch": 1449} {"train_loss": -22.415271759033203, "global_step": 120313, "epoch": 1449} {"train_loss": -22.32142448425293, "global_step": 120314, "epoch": 1449} {"train_loss": -22.270648956298828, "global_step": 120315, "epoch": 1449} {"train_loss": -22.76497459411621, "global_step": 120316, "epoch": 1449} {"train_loss": -22.717884063720703, "global_step": 120317, "epoch": 1449} {"train_loss": -22.331972122192383, "global_step": 120318, "epoch": 1449} {"train_loss": -22.54706573486328, "global_step": 120319, "epoch": 1449} {"train_loss": -22.33576774597168, "global_step": 120320, "epoch": 1449} {"train_loss": -21.954519271850586, "global_step": 120321, "epoch": 1449} {"train_loss": -22.73094367980957, "global_step": 120322, "epoch": 1449} {"train_loss": -22.572860717773438, "global_step": 120323, "epoch": 1449} {"train_loss": -21.998767852783203, "global_step": 120324, "epoch": 1449} {"train_loss": -22.289899826049805, "global_step": 120325, "epoch": 1449} {"train_loss": -22.969745635986328, "global_step": 120326, "epoch": 1449} {"train_loss": -22.05497169494629, "global_step": 120327, "epoch": 1449} {"train_loss": -22.53657341003418, "global_step": 120328, "epoch": 1449} {"train_loss": -22.139381408691406, "global_step": 120329, "epoch": 1449} {"train_loss": -22.401498794555664, "global_step": 120330, "epoch": 1449} {"train_loss": -22.751258850097656, "global_step": 120331, "epoch": 1449} {"train_loss": -22.123804092407227, "global_step": 120332, "epoch": 1449} {"train_loss": -22.24627685546875, "global_step": 120333, "epoch": 1449} {"train_loss": -22.394535064697266, "global_step": 120334, "epoch": 1449} {"train_loss": -22.570072174072266, "global_step": 120335, "epoch": 1449} {"train_loss": -22.361804962158203, "global_step": 120336, "epoch": 1449} {"train_loss": -22.234060287475586, "global_step": 120337, "epoch": 1449} {"train_loss": -22.619638442993164, "global_step": 120338, "epoch": 1449} {"train_loss": -22.145689010620117, "global_step": 120339, "epoch": 1449} {"train_loss": -22.421688079833984, "global_step": 120340, "epoch": 1449} {"train_loss": -22.235919952392578, "global_step": 120341, "epoch": 1449} {"train_loss": -22.444046020507812, "global_step": 120342, "epoch": 1449} {"train_loss": -22.612157821655273, "global_step": 120343, "epoch": 1449} {"train_loss": -22.212778091430664, "global_step": 120344, "epoch": 1449} {"train_loss": -22.376140594482422, "global_step": 120345, "epoch": 1449} {"train_loss": -22.645490646362305, "global_step": 120346, "epoch": 1449} {"train_loss": -22.471288681030273, "global_step": 120347, "epoch": 1449} {"train_loss": -22.322757720947266, "global_step": 120348, "epoch": 1449} {"train_loss": -22.433757690062006, "global_step": 120349, "epoch": 1449, "val_loss": 6193075.0} {"train_loss": -21.400449752807617, "global_step": 120350, "epoch": 1450} {"train_loss": -20.752599716186523, "global_step": 120351, "epoch": 1450} {"train_loss": -22.1837215423584, "global_step": 120352, "epoch": 1450} {"train_loss": -21.640317916870117, "global_step": 120353, "epoch": 1450} {"train_loss": -21.850046157836914, "global_step": 120354, "epoch": 1450} {"train_loss": -21.11322593688965, "global_step": 120355, "epoch": 1450} {"train_loss": -22.24201011657715, "global_step": 120356, "epoch": 1450} {"train_loss": -21.667020797729492, "global_step": 120357, "epoch": 1450} {"train_loss": -21.726125717163086, "global_step": 120358, "epoch": 1450} {"train_loss": -21.751577377319336, "global_step": 120359, "epoch": 1450} {"train_loss": -21.5765323638916, "global_step": 120360, "epoch": 1450} {"train_loss": -22.173675537109375, "global_step": 120361, "epoch": 1450} {"train_loss": -22.026376724243164, "global_step": 120362, "epoch": 1450} {"train_loss": -22.140705108642578, "global_step": 120363, "epoch": 1450} {"train_loss": -22.2056941986084, "global_step": 120364, "epoch": 1450} {"train_loss": -22.37540054321289, "global_step": 120365, "epoch": 1450} {"train_loss": -21.750871658325195, "global_step": 120366, "epoch": 1450} {"train_loss": -21.988080978393555, "global_step": 120367, "epoch": 1450} {"train_loss": -22.1494197845459, "global_step": 120368, "epoch": 1450} {"train_loss": -22.293914794921875, "global_step": 120369, "epoch": 1450} {"train_loss": -22.528295516967773, "global_step": 120370, "epoch": 1450} {"train_loss": -21.969024658203125, "global_step": 120371, "epoch": 1450} {"train_loss": -22.250043869018555, "global_step": 120372, "epoch": 1450} {"train_loss": -22.514530181884766, "global_step": 120373, "epoch": 1450} {"train_loss": -22.858858108520508, "global_step": 120374, "epoch": 1450} {"train_loss": -22.1671199798584, "global_step": 120375, "epoch": 1450} {"train_loss": -22.569482803344727, "global_step": 120376, "epoch": 1450} {"train_loss": -22.39166831970215, "global_step": 120377, "epoch": 1450} {"train_loss": -22.4293212890625, "global_step": 120378, "epoch": 1450} {"train_loss": -22.704160690307617, "global_step": 120379, "epoch": 1450} {"train_loss": -22.32448387145996, "global_step": 120380, "epoch": 1450} {"train_loss": -22.526077270507812, "global_step": 120381, "epoch": 1450} {"train_loss": -22.295068740844727, "global_step": 120382, "epoch": 1450} {"train_loss": -22.813077926635742, "global_step": 120383, "epoch": 1450} {"train_loss": -22.5693302154541, "global_step": 120384, "epoch": 1450} {"train_loss": -22.608301162719727, "global_step": 120385, "epoch": 1450} {"train_loss": -22.51423454284668, "global_step": 120386, "epoch": 1450} {"train_loss": -22.328540802001953, "global_step": 120387, "epoch": 1450} {"train_loss": -22.185659408569336, "global_step": 120388, "epoch": 1450} {"train_loss": -22.5851993560791, "global_step": 120389, "epoch": 1450} {"train_loss": -22.326541900634766, "global_step": 120390, "epoch": 1450} {"train_loss": -22.3309383392334, "global_step": 120391, "epoch": 1450} {"train_loss": -22.598922729492188, "global_step": 120392, "epoch": 1450} {"train_loss": -22.49639320373535, "global_step": 120393, "epoch": 1450} {"train_loss": -22.84151840209961, "global_step": 120394, "epoch": 1450} {"train_loss": -22.8963623046875, "global_step": 120395, "epoch": 1450} {"train_loss": -22.915693283081055, "global_step": 120396, "epoch": 1450} {"train_loss": -22.596094131469727, "global_step": 120397, "epoch": 1450} {"train_loss": -22.372610092163086, "global_step": 120398, "epoch": 1450} {"train_loss": -22.111835479736328, "global_step": 120399, "epoch": 1450} {"train_loss": -22.376062393188477, "global_step": 120400, "epoch": 1450} {"train_loss": -22.293441772460938, "global_step": 120401, "epoch": 1450} {"train_loss": -22.22908592224121, "global_step": 120402, "epoch": 1450} {"train_loss": -22.57026481628418, "global_step": 120403, "epoch": 1450} {"train_loss": -22.389102935791016, "global_step": 120404, "epoch": 1450} {"train_loss": -22.607757568359375, "global_step": 120405, "epoch": 1450} {"train_loss": -22.294057846069336, "global_step": 120406, "epoch": 1450} {"train_loss": -22.38270378112793, "global_step": 120407, "epoch": 1450} {"train_loss": -22.653793334960938, "global_step": 120408, "epoch": 1450} {"train_loss": -22.17760467529297, "global_step": 120409, "epoch": 1450} {"train_loss": -22.368988037109375, "global_step": 120410, "epoch": 1450} {"train_loss": -22.363914489746094, "global_step": 120411, "epoch": 1450} {"train_loss": -22.4420108795166, "global_step": 120412, "epoch": 1450} {"train_loss": -22.829435348510742, "global_step": 120413, "epoch": 1450} {"train_loss": -22.619638442993164, "global_step": 120414, "epoch": 1450} {"train_loss": -22.689083099365234, "global_step": 120415, "epoch": 1450} {"train_loss": -22.758277893066406, "global_step": 120416, "epoch": 1450} {"train_loss": -22.619312286376953, "global_step": 120417, "epoch": 1450} {"train_loss": -22.488548278808594, "global_step": 120418, "epoch": 1450} {"train_loss": -22.654104232788086, "global_step": 120419, "epoch": 1450} {"train_loss": -22.633169174194336, "global_step": 120420, "epoch": 1450} {"train_loss": -22.570880889892578, "global_step": 120421, "epoch": 1450} {"train_loss": -22.617950439453125, "global_step": 120422, "epoch": 1450} {"train_loss": -22.656545639038086, "global_step": 120423, "epoch": 1450} {"train_loss": -22.423627853393555, "global_step": 120424, "epoch": 1450} {"train_loss": -22.5272274017334, "global_step": 120425, "epoch": 1450} {"train_loss": -22.783065795898438, "global_step": 120426, "epoch": 1450} {"train_loss": -22.615619659423828, "global_step": 120427, "epoch": 1450} {"train_loss": -22.447877883911133, "global_step": 120428, "epoch": 1450} {"train_loss": -22.828369140625, "global_step": 120429, "epoch": 1450} {"train_loss": -22.51915168762207, "global_step": 120430, "epoch": 1450} {"train_loss": -22.556411743164062, "global_step": 120431, "epoch": 1450} {"train_loss": -22.36495774050793, "global_step": 120432, "epoch": 1450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6291356.0} {"train_loss": -22.19375991821289, "global_step": 120433, "epoch": 1451} {"train_loss": -21.613025665283203, "global_step": 120434, "epoch": 1451} {"train_loss": -21.9577693939209, "global_step": 120435, "epoch": 1451} {"train_loss": -22.280080795288086, "global_step": 120436, "epoch": 1451} {"train_loss": -21.669631958007812, "global_step": 120437, "epoch": 1451} {"train_loss": -22.463481903076172, "global_step": 120438, "epoch": 1451} {"train_loss": -22.426908493041992, "global_step": 120439, "epoch": 1451} {"train_loss": -22.48464012145996, "global_step": 120440, "epoch": 1451} {"train_loss": -21.963760375976562, "global_step": 120441, "epoch": 1451} {"train_loss": -22.369464874267578, "global_step": 120442, "epoch": 1451} {"train_loss": -22.17645835876465, "global_step": 120443, "epoch": 1451} {"train_loss": -22.435123443603516, "global_step": 120444, "epoch": 1451} {"train_loss": -22.600032806396484, "global_step": 120445, "epoch": 1451} {"train_loss": -22.707494735717773, "global_step": 120446, "epoch": 1451} {"train_loss": -22.247394561767578, "global_step": 120447, "epoch": 1451} {"train_loss": -22.153461456298828, "global_step": 120448, "epoch": 1451} {"train_loss": -22.17165184020996, "global_step": 120449, "epoch": 1451} {"train_loss": -22.54715919494629, "global_step": 120450, "epoch": 1451} {"train_loss": -22.867700576782227, "global_step": 120451, "epoch": 1451} {"train_loss": -22.672555923461914, "global_step": 120452, "epoch": 1451} {"train_loss": -22.291257858276367, "global_step": 120453, "epoch": 1451} {"train_loss": -22.02852439880371, "global_step": 120454, "epoch": 1451} {"train_loss": -22.131067276000977, "global_step": 120455, "epoch": 1451} {"train_loss": -21.909912109375, "global_step": 120456, "epoch": 1451} {"train_loss": -22.675722122192383, "global_step": 120457, "epoch": 1451} {"train_loss": -22.559133529663086, "global_step": 120458, "epoch": 1451} {"train_loss": -22.66399383544922, "global_step": 120459, "epoch": 1451} {"train_loss": -22.389814376831055, "global_step": 120460, "epoch": 1451} {"train_loss": -22.63673210144043, "global_step": 120461, "epoch": 1451} {"train_loss": -22.345966339111328, "global_step": 120462, "epoch": 1451} {"train_loss": -22.338769912719727, "global_step": 120463, "epoch": 1451} {"train_loss": -22.559782028198242, "global_step": 120464, "epoch": 1451} {"train_loss": -22.649038314819336, "global_step": 120465, "epoch": 1451} {"train_loss": -22.556039810180664, "global_step": 120466, "epoch": 1451} {"train_loss": -22.708356857299805, "global_step": 120467, "epoch": 1451} {"train_loss": -22.685644149780273, "global_step": 120468, "epoch": 1451} {"train_loss": -22.818458557128906, "global_step": 120469, "epoch": 1451} {"train_loss": -22.774755477905273, "global_step": 120470, "epoch": 1451} {"train_loss": -22.654672622680664, "global_step": 120471, "epoch": 1451} {"train_loss": -23.1040096282959, "global_step": 120472, "epoch": 1451} {"train_loss": -22.47954559326172, "global_step": 120473, "epoch": 1451} {"train_loss": -22.508203506469727, "global_step": 120474, "epoch": 1451} {"train_loss": -22.673568725585938, "global_step": 120475, "epoch": 1451} {"train_loss": -22.13161277770996, "global_step": 120476, "epoch": 1451} {"train_loss": -22.628753662109375, "global_step": 120477, "epoch": 1451} {"train_loss": -22.565088272094727, "global_step": 120478, "epoch": 1451} {"train_loss": -22.429508209228516, "global_step": 120479, "epoch": 1451} {"train_loss": -22.394329071044922, "global_step": 120480, "epoch": 1451} {"train_loss": -22.588274002075195, "global_step": 120481, "epoch": 1451} {"train_loss": -22.487213134765625, "global_step": 120482, "epoch": 1451} {"train_loss": -22.3723087310791, "global_step": 120483, "epoch": 1451} {"train_loss": -22.40772819519043, "global_step": 120484, "epoch": 1451} {"train_loss": -22.377079010009766, "global_step": 120485, "epoch": 1451} {"train_loss": -22.131046295166016, "global_step": 120486, "epoch": 1451} {"train_loss": -22.41596031188965, "global_step": 120487, "epoch": 1451} {"train_loss": -22.79804801940918, "global_step": 120488, "epoch": 1451} {"train_loss": -22.52430534362793, "global_step": 120489, "epoch": 1451} {"train_loss": -22.647323608398438, "global_step": 120490, "epoch": 1451} {"train_loss": -22.418550491333008, "global_step": 120491, "epoch": 1451} {"train_loss": -22.410070419311523, "global_step": 120492, "epoch": 1451} {"train_loss": -22.394495010375977, "global_step": 120493, "epoch": 1451} {"train_loss": -22.492427825927734, "global_step": 120494, "epoch": 1451} {"train_loss": -22.459983825683594, "global_step": 120495, "epoch": 1451} {"train_loss": -22.849990844726562, "global_step": 120496, "epoch": 1451} {"train_loss": -22.609375, "global_step": 120497, "epoch": 1451} {"train_loss": -22.795129776000977, "global_step": 120498, "epoch": 1451} {"train_loss": -22.37494468688965, "global_step": 120499, "epoch": 1451} {"train_loss": -23.02827262878418, "global_step": 120500, "epoch": 1451} {"train_loss": -22.349353790283203, "global_step": 120501, "epoch": 1451} {"train_loss": -22.29813575744629, "global_step": 120502, "epoch": 1451} {"train_loss": -22.729690551757812, "global_step": 120503, "epoch": 1451} {"train_loss": -22.468994140625, "global_step": 120504, "epoch": 1451} {"train_loss": -22.55905532836914, "global_step": 120505, "epoch": 1451} {"train_loss": -22.62830924987793, "global_step": 120506, "epoch": 1451} {"train_loss": -22.76759910583496, "global_step": 120507, "epoch": 1451} {"train_loss": -22.545578002929688, "global_step": 120508, "epoch": 1451} {"train_loss": -22.462875366210938, "global_step": 120509, "epoch": 1451} {"train_loss": -22.542720794677734, "global_step": 120510, "epoch": 1451} {"train_loss": -22.741483688354492, "global_step": 120511, "epoch": 1451} {"train_loss": -22.78579330444336, "global_step": 120512, "epoch": 1451} {"train_loss": -22.6260986328125, "global_step": 120513, "epoch": 1451} {"train_loss": -22.612707138061523, "global_step": 120514, "epoch": 1451} {"train_loss": -22.47447668787945, "global_step": 120515, "epoch": 1451, "val_loss": 6299160.5} {"train_loss": -22.72358512878418, "global_step": 120516, "epoch": 1452} {"train_loss": -22.236188888549805, "global_step": 120517, "epoch": 1452} {"train_loss": -22.118249893188477, "global_step": 120518, "epoch": 1452} {"train_loss": -22.114469528198242, "global_step": 120519, "epoch": 1452} {"train_loss": -22.33844566345215, "global_step": 120520, "epoch": 1452} {"train_loss": -22.336618423461914, "global_step": 120521, "epoch": 1452} {"train_loss": -22.1158447265625, "global_step": 120522, "epoch": 1452} {"train_loss": -22.141582489013672, "global_step": 120523, "epoch": 1452} {"train_loss": -22.10376739501953, "global_step": 120524, "epoch": 1452} {"train_loss": -22.17332649230957, "global_step": 120525, "epoch": 1452} {"train_loss": -22.116168975830078, "global_step": 120526, "epoch": 1452} {"train_loss": -22.788299560546875, "global_step": 120527, "epoch": 1452} {"train_loss": -22.145153045654297, "global_step": 120528, "epoch": 1452} {"train_loss": -22.29218864440918, "global_step": 120529, "epoch": 1452} {"train_loss": -22.383411407470703, "global_step": 120530, "epoch": 1452} {"train_loss": -22.342365264892578, "global_step": 120531, "epoch": 1452} {"train_loss": -22.518936157226562, "global_step": 120532, "epoch": 1452} {"train_loss": -22.562236785888672, "global_step": 120533, "epoch": 1452} {"train_loss": -22.884296417236328, "global_step": 120534, "epoch": 1452} {"train_loss": -21.86220359802246, "global_step": 120535, "epoch": 1452} {"train_loss": -22.18755340576172, "global_step": 120536, "epoch": 1452} {"train_loss": -22.496870040893555, "global_step": 120537, "epoch": 1452} {"train_loss": -22.349058151245117, "global_step": 120538, "epoch": 1452} {"train_loss": -22.345369338989258, "global_step": 120539, "epoch": 1452} {"train_loss": -22.066638946533203, "global_step": 120540, "epoch": 1452} {"train_loss": -22.24452018737793, "global_step": 120541, "epoch": 1452} {"train_loss": -22.397485733032227, "global_step": 120542, "epoch": 1452} {"train_loss": -22.268264770507812, "global_step": 120543, "epoch": 1452} {"train_loss": -22.508926391601562, "global_step": 120544, "epoch": 1452} {"train_loss": -22.87605857849121, "global_step": 120545, "epoch": 1452} {"train_loss": -22.36100959777832, "global_step": 120546, "epoch": 1452} {"train_loss": -22.30264663696289, "global_step": 120547, "epoch": 1452} {"train_loss": -22.52057456970215, "global_step": 120548, "epoch": 1452} {"train_loss": -22.453765869140625, "global_step": 120549, "epoch": 1452} {"train_loss": -22.318172454833984, "global_step": 120550, "epoch": 1452} {"train_loss": -22.395709991455078, "global_step": 120551, "epoch": 1452} {"train_loss": -22.59050941467285, "global_step": 120552, "epoch": 1452} {"train_loss": -22.531803131103516, "global_step": 120553, "epoch": 1452} {"train_loss": -22.53098487854004, "global_step": 120554, "epoch": 1452} {"train_loss": -22.46955108642578, "global_step": 120555, "epoch": 1452} {"train_loss": -22.3436336517334, "global_step": 120556, "epoch": 1452} {"train_loss": -22.414466857910156, "global_step": 120557, "epoch": 1452} {"train_loss": -22.245075225830078, "global_step": 120558, "epoch": 1452} {"train_loss": -22.5637149810791, "global_step": 120559, "epoch": 1452} {"train_loss": -21.960689544677734, "global_step": 120560, "epoch": 1452} {"train_loss": -22.15828514099121, "global_step": 120561, "epoch": 1452} {"train_loss": -22.24751853942871, "global_step": 120562, "epoch": 1452} {"train_loss": -22.223722457885742, "global_step": 120563, "epoch": 1452} {"train_loss": -22.632909774780273, "global_step": 120564, "epoch": 1452} {"train_loss": -22.70026206970215, "global_step": 120565, "epoch": 1452} {"train_loss": -22.588167190551758, "global_step": 120566, "epoch": 1452} {"train_loss": -21.916669845581055, "global_step": 120567, "epoch": 1452} {"train_loss": -22.229705810546875, "global_step": 120568, "epoch": 1452} {"train_loss": -22.3275203704834, "global_step": 120569, "epoch": 1452} {"train_loss": -22.740333557128906, "global_step": 120570, "epoch": 1452} {"train_loss": -22.611528396606445, "global_step": 120571, "epoch": 1452} {"train_loss": -22.546918869018555, "global_step": 120572, "epoch": 1452} {"train_loss": -22.583253860473633, "global_step": 120573, "epoch": 1452} {"train_loss": -22.342939376831055, "global_step": 120574, "epoch": 1452} {"train_loss": -22.725027084350586, "global_step": 120575, "epoch": 1452} {"train_loss": -22.571226119995117, "global_step": 120576, "epoch": 1452} {"train_loss": -23.040496826171875, "global_step": 120577, "epoch": 1452} {"train_loss": -22.77687644958496, "global_step": 120578, "epoch": 1452} {"train_loss": -22.390417098999023, "global_step": 120579, "epoch": 1452} {"train_loss": -22.638486862182617, "global_step": 120580, "epoch": 1452} {"train_loss": -22.3780460357666, "global_step": 120581, "epoch": 1452} {"train_loss": -23.033416748046875, "global_step": 120582, "epoch": 1452} {"train_loss": -22.754343032836914, "global_step": 120583, "epoch": 1452} {"train_loss": -22.268247604370117, "global_step": 120584, "epoch": 1452} {"train_loss": -22.690589904785156, "global_step": 120585, "epoch": 1452} {"train_loss": -22.52289581298828, "global_step": 120586, "epoch": 1452} {"train_loss": -22.75931167602539, "global_step": 120587, "epoch": 1452} {"train_loss": -22.68630027770996, "global_step": 120588, "epoch": 1452} {"train_loss": -22.49514389038086, "global_step": 120589, "epoch": 1452} {"train_loss": -22.568830490112305, "global_step": 120590, "epoch": 1452} {"train_loss": -22.583463668823242, "global_step": 120591, "epoch": 1452} {"train_loss": -22.662687301635742, "global_step": 120592, "epoch": 1452} {"train_loss": -22.354141235351562, "global_step": 120593, "epoch": 1452} {"train_loss": -22.562007904052734, "global_step": 120594, "epoch": 1452} {"train_loss": -22.644859313964844, "global_step": 120595, "epoch": 1452} {"train_loss": -22.73598861694336, "global_step": 120596, "epoch": 1452} {"train_loss": -22.560312271118164, "global_step": 120597, "epoch": 1452} {"train_loss": -22.44273034061294, "global_step": 120598, "epoch": 1452, "val_loss": 6209750.0} {"train_loss": -22.20348358154297, "global_step": 120599, "epoch": 1453} {"train_loss": -22.47675132751465, "global_step": 120600, "epoch": 1453} {"train_loss": -22.635042190551758, "global_step": 120601, "epoch": 1453} {"train_loss": -22.191442489624023, "global_step": 120602, "epoch": 1453} {"train_loss": -22.848323822021484, "global_step": 120603, "epoch": 1453} {"train_loss": -22.558927536010742, "global_step": 120604, "epoch": 1453} {"train_loss": -22.47832679748535, "global_step": 120605, "epoch": 1453} {"train_loss": -22.417699813842773, "global_step": 120606, "epoch": 1453} {"train_loss": -22.355527877807617, "global_step": 120607, "epoch": 1453} {"train_loss": -22.739704132080078, "global_step": 120608, "epoch": 1453} {"train_loss": -22.369714736938477, "global_step": 120609, "epoch": 1453} {"train_loss": -22.35682487487793, "global_step": 120610, "epoch": 1453} {"train_loss": -22.594806671142578, "global_step": 120611, "epoch": 1453} {"train_loss": -22.55311393737793, "global_step": 120612, "epoch": 1453} {"train_loss": -22.757123947143555, "global_step": 120613, "epoch": 1453} {"train_loss": -22.393342971801758, "global_step": 120614, "epoch": 1453} {"train_loss": -22.520776748657227, "global_step": 120615, "epoch": 1453} {"train_loss": -22.696304321289062, "global_step": 120616, "epoch": 1453} {"train_loss": -22.266084671020508, "global_step": 120617, "epoch": 1453} {"train_loss": -22.489185333251953, "global_step": 120618, "epoch": 1453} {"train_loss": -22.58839988708496, "global_step": 120619, "epoch": 1453} {"train_loss": -22.778120040893555, "global_step": 120620, "epoch": 1453} {"train_loss": -22.263214111328125, "global_step": 120621, "epoch": 1453} {"train_loss": -22.66071891784668, "global_step": 120622, "epoch": 1453} {"train_loss": -22.750391006469727, "global_step": 120623, "epoch": 1453} {"train_loss": -22.651336669921875, "global_step": 120624, "epoch": 1453} {"train_loss": -22.443790435791016, "global_step": 120625, "epoch": 1453} {"train_loss": -22.42028045654297, "global_step": 120626, "epoch": 1453} {"train_loss": -22.688549041748047, "global_step": 120627, "epoch": 1453} {"train_loss": -22.181913375854492, "global_step": 120628, "epoch": 1453} {"train_loss": -22.470556259155273, "global_step": 120629, "epoch": 1453} {"train_loss": -22.48575210571289, "global_step": 120630, "epoch": 1453} {"train_loss": -22.798437118530273, "global_step": 120631, "epoch": 1453} {"train_loss": -22.621395111083984, "global_step": 120632, "epoch": 1453} {"train_loss": -22.565567016601562, "global_step": 120633, "epoch": 1453} {"train_loss": -22.479923248291016, "global_step": 120634, "epoch": 1453} {"train_loss": -22.012161254882812, "global_step": 120635, "epoch": 1453} {"train_loss": -22.149993896484375, "global_step": 120636, "epoch": 1453} {"train_loss": -22.397680282592773, "global_step": 120637, "epoch": 1453} {"train_loss": -22.638017654418945, "global_step": 120638, "epoch": 1453} {"train_loss": -22.445436477661133, "global_step": 120639, "epoch": 1453} {"train_loss": -22.785215377807617, "global_step": 120640, "epoch": 1453} {"train_loss": -22.412586212158203, "global_step": 120641, "epoch": 1453} {"train_loss": -22.51118278503418, "global_step": 120642, "epoch": 1453} {"train_loss": -22.51654052734375, "global_step": 120643, "epoch": 1453} {"train_loss": -22.6009578704834, "global_step": 120644, "epoch": 1453} {"train_loss": -22.32234001159668, "global_step": 120645, "epoch": 1453} {"train_loss": -22.629396438598633, "global_step": 120646, "epoch": 1453} {"train_loss": -22.576953887939453, "global_step": 120647, "epoch": 1453} {"train_loss": -22.20162010192871, "global_step": 120648, "epoch": 1453} {"train_loss": -22.883777618408203, "global_step": 120649, "epoch": 1453} {"train_loss": -22.315019607543945, "global_step": 120650, "epoch": 1453} {"train_loss": -22.718395233154297, "global_step": 120651, "epoch": 1453} {"train_loss": -22.53013038635254, "global_step": 120652, "epoch": 1453} {"train_loss": -22.55775260925293, "global_step": 120653, "epoch": 1453} {"train_loss": -22.431129455566406, "global_step": 120654, "epoch": 1453} {"train_loss": -22.64449691772461, "global_step": 120655, "epoch": 1453} {"train_loss": -22.50428581237793, "global_step": 120656, "epoch": 1453} {"train_loss": -22.376222610473633, "global_step": 120657, "epoch": 1453} {"train_loss": -22.282087326049805, "global_step": 120658, "epoch": 1453} {"train_loss": -22.47750473022461, "global_step": 120659, "epoch": 1453} {"train_loss": -22.47664451599121, "global_step": 120660, "epoch": 1453} {"train_loss": -22.60963249206543, "global_step": 120661, "epoch": 1453} {"train_loss": -22.282081604003906, "global_step": 120662, "epoch": 1453} {"train_loss": -22.729936599731445, "global_step": 120663, "epoch": 1453} {"train_loss": -22.723424911499023, "global_step": 120664, "epoch": 1453} {"train_loss": -22.658443450927734, "global_step": 120665, "epoch": 1453} {"train_loss": -22.40694236755371, "global_step": 120666, "epoch": 1453} {"train_loss": -22.718061447143555, "global_step": 120667, "epoch": 1453} {"train_loss": -22.497737884521484, "global_step": 120668, "epoch": 1453} {"train_loss": -22.255983352661133, "global_step": 120669, "epoch": 1453} {"train_loss": -22.880115509033203, "global_step": 120670, "epoch": 1453} {"train_loss": -22.459836959838867, "global_step": 120671, "epoch": 1453} {"train_loss": -22.484561920166016, "global_step": 120672, "epoch": 1453} {"train_loss": -22.63115882873535, "global_step": 120673, "epoch": 1453} {"train_loss": -22.862226486206055, "global_step": 120674, "epoch": 1453} {"train_loss": -22.531362533569336, "global_step": 120675, "epoch": 1453} {"train_loss": -22.366012573242188, "global_step": 120676, "epoch": 1453} {"train_loss": -22.701160430908203, "global_step": 120677, "epoch": 1453} {"train_loss": -22.456947326660156, "global_step": 120678, "epoch": 1453} {"train_loss": -22.63532066345215, "global_step": 120679, "epoch": 1453} {"train_loss": -22.613143920898438, "global_step": 120680, "epoch": 1453} {"train_loss": -22.516755345356035, "global_step": 120681, "epoch": 1453, "val_loss": 6286969.0} {"train_loss": -22.3723201751709, "global_step": 120682, "epoch": 1454} {"train_loss": -22.468978881835938, "global_step": 120683, "epoch": 1454} {"train_loss": -21.7213191986084, "global_step": 120684, "epoch": 1454} {"train_loss": -22.4252872467041, "global_step": 120685, "epoch": 1454} {"train_loss": -22.351316452026367, "global_step": 120686, "epoch": 1454} {"train_loss": -22.318862915039062, "global_step": 120687, "epoch": 1454} {"train_loss": -22.456769943237305, "global_step": 120688, "epoch": 1454} {"train_loss": -22.111326217651367, "global_step": 120689, "epoch": 1454} {"train_loss": -22.3986873626709, "global_step": 120690, "epoch": 1454} {"train_loss": -22.11420440673828, "global_step": 120691, "epoch": 1454} {"train_loss": -22.298927307128906, "global_step": 120692, "epoch": 1454} {"train_loss": -22.117345809936523, "global_step": 120693, "epoch": 1454} {"train_loss": -22.155597686767578, "global_step": 120694, "epoch": 1454} {"train_loss": -22.24191665649414, "global_step": 120695, "epoch": 1454} {"train_loss": -22.457454681396484, "global_step": 120696, "epoch": 1454} {"train_loss": -22.010526657104492, "global_step": 120697, "epoch": 1454} {"train_loss": -22.295141220092773, "global_step": 120698, "epoch": 1454} {"train_loss": -22.173215866088867, "global_step": 120699, "epoch": 1454} {"train_loss": -22.095853805541992, "global_step": 120700, "epoch": 1454} {"train_loss": -22.588586807250977, "global_step": 120701, "epoch": 1454} {"train_loss": -22.3317928314209, "global_step": 120702, "epoch": 1454} {"train_loss": -22.347177505493164, "global_step": 120703, "epoch": 1454} {"train_loss": -22.564062118530273, "global_step": 120704, "epoch": 1454} {"train_loss": -22.174470901489258, "global_step": 120705, "epoch": 1454} {"train_loss": -22.62605857849121, "global_step": 120706, "epoch": 1454} {"train_loss": -22.242868423461914, "global_step": 120707, "epoch": 1454} {"train_loss": -22.131988525390625, "global_step": 120708, "epoch": 1454} {"train_loss": -22.59297752380371, "global_step": 120709, "epoch": 1454} {"train_loss": -22.212209701538086, "global_step": 120710, "epoch": 1454} {"train_loss": -22.50837516784668, "global_step": 120711, "epoch": 1454} {"train_loss": -22.419666290283203, "global_step": 120712, "epoch": 1454} {"train_loss": -22.288122177124023, "global_step": 120713, "epoch": 1454} {"train_loss": -22.710973739624023, "global_step": 120714, "epoch": 1454} {"train_loss": -22.93427085876465, "global_step": 120715, "epoch": 1454} {"train_loss": -22.821096420288086, "global_step": 120716, "epoch": 1454} {"train_loss": -22.55856704711914, "global_step": 120717, "epoch": 1454} {"train_loss": -22.534534454345703, "global_step": 120718, "epoch": 1454} {"train_loss": -22.508272171020508, "global_step": 120719, "epoch": 1454} {"train_loss": -22.772747039794922, "global_step": 120720, "epoch": 1454} {"train_loss": -22.683149337768555, "global_step": 120721, "epoch": 1454} {"train_loss": -22.633298873901367, "global_step": 120722, "epoch": 1454} {"train_loss": -22.410964965820312, "global_step": 120723, "epoch": 1454} {"train_loss": -22.086061477661133, "global_step": 120724, "epoch": 1454} {"train_loss": -22.509693145751953, "global_step": 120725, "epoch": 1454} {"train_loss": -22.764236450195312, "global_step": 120726, "epoch": 1454} {"train_loss": -22.628000259399414, "global_step": 120727, "epoch": 1454} {"train_loss": -23.105411529541016, "global_step": 120728, "epoch": 1454} {"train_loss": -22.614933013916016, "global_step": 120729, "epoch": 1454} {"train_loss": -22.836660385131836, "global_step": 120730, "epoch": 1454} {"train_loss": -22.716678619384766, "global_step": 120731, "epoch": 1454} {"train_loss": -22.779306411743164, "global_step": 120732, "epoch": 1454} {"train_loss": -22.984174728393555, "global_step": 120733, "epoch": 1454} {"train_loss": -22.84175682067871, "global_step": 120734, "epoch": 1454} {"train_loss": -22.807554244995117, "global_step": 120735, "epoch": 1454} {"train_loss": -22.555227279663086, "global_step": 120736, "epoch": 1454} {"train_loss": -22.365224838256836, "global_step": 120737, "epoch": 1454} {"train_loss": -22.050146102905273, "global_step": 120738, "epoch": 1454} {"train_loss": -22.07288932800293, "global_step": 120739, "epoch": 1454} {"train_loss": -22.35407829284668, "global_step": 120740, "epoch": 1454} {"train_loss": -22.73127555847168, "global_step": 120741, "epoch": 1454} {"train_loss": -22.486194610595703, "global_step": 120742, "epoch": 1454} {"train_loss": -22.431568145751953, "global_step": 120743, "epoch": 1454} {"train_loss": -22.460542678833008, "global_step": 120744, "epoch": 1454} {"train_loss": -22.65564727783203, "global_step": 120745, "epoch": 1454} {"train_loss": -22.270450592041016, "global_step": 120746, "epoch": 1454} {"train_loss": -22.539142608642578, "global_step": 120747, "epoch": 1454} {"train_loss": -22.355127334594727, "global_step": 120748, "epoch": 1454} {"train_loss": -22.585182189941406, "global_step": 120749, "epoch": 1454} {"train_loss": -22.80754852294922, "global_step": 120750, "epoch": 1454} {"train_loss": -22.380868911743164, "global_step": 120751, "epoch": 1454} {"train_loss": -22.702640533447266, "global_step": 120752, "epoch": 1454} {"train_loss": -22.243986129760742, "global_step": 120753, "epoch": 1454} {"train_loss": -22.266952514648438, "global_step": 120754, "epoch": 1454} {"train_loss": -22.564817428588867, "global_step": 120755, "epoch": 1454} {"train_loss": -22.69687843322754, "global_step": 120756, "epoch": 1454} {"train_loss": -22.702730178833008, "global_step": 120757, "epoch": 1454} {"train_loss": -22.26763916015625, "global_step": 120758, "epoch": 1454} {"train_loss": -22.112045288085938, "global_step": 120759, "epoch": 1454} {"train_loss": -22.767553329467773, "global_step": 120760, "epoch": 1454} {"train_loss": -22.231428146362305, "global_step": 120761, "epoch": 1454} {"train_loss": -22.411197662353516, "global_step": 120762, "epoch": 1454} {"train_loss": -22.355487823486328, "global_step": 120763, "epoch": 1454} {"train_loss": -22.456393689994353, "global_step": 120764, "epoch": 1454, "val_loss": 6172474.0} {"train_loss": -22.52415657043457, "global_step": 120765, "epoch": 1455} {"train_loss": -22.510560989379883, "global_step": 120766, "epoch": 1455} {"train_loss": -21.89037322998047, "global_step": 120767, "epoch": 1455} {"train_loss": -22.795578002929688, "global_step": 120768, "epoch": 1455} {"train_loss": -22.341123580932617, "global_step": 120769, "epoch": 1455} {"train_loss": -22.566579818725586, "global_step": 120770, "epoch": 1455} {"train_loss": -22.492734909057617, "global_step": 120771, "epoch": 1455} {"train_loss": -22.08510971069336, "global_step": 120772, "epoch": 1455} {"train_loss": -22.545307159423828, "global_step": 120773, "epoch": 1455} {"train_loss": -22.172849655151367, "global_step": 120774, "epoch": 1455} {"train_loss": -22.57526206970215, "global_step": 120775, "epoch": 1455} {"train_loss": -22.652570724487305, "global_step": 120776, "epoch": 1455} {"train_loss": -22.491313934326172, "global_step": 120777, "epoch": 1455} {"train_loss": -22.454875946044922, "global_step": 120778, "epoch": 1455} {"train_loss": -22.278860092163086, "global_step": 120779, "epoch": 1455} {"train_loss": -22.32395362854004, "global_step": 120780, "epoch": 1455} {"train_loss": -22.40854263305664, "global_step": 120781, "epoch": 1455} {"train_loss": -22.195478439331055, "global_step": 120782, "epoch": 1455} {"train_loss": -22.424667358398438, "global_step": 120783, "epoch": 1455} {"train_loss": -22.610179901123047, "global_step": 120784, "epoch": 1455} {"train_loss": -22.53092384338379, "global_step": 120785, "epoch": 1455} {"train_loss": -22.51187515258789, "global_step": 120786, "epoch": 1455} {"train_loss": -22.557661056518555, "global_step": 120787, "epoch": 1455} {"train_loss": -22.601791381835938, "global_step": 120788, "epoch": 1455} {"train_loss": -22.58185386657715, "global_step": 120789, "epoch": 1455} {"train_loss": -22.292234420776367, "global_step": 120790, "epoch": 1455} {"train_loss": -22.373870849609375, "global_step": 120791, "epoch": 1455} {"train_loss": -22.489896774291992, "global_step": 120792, "epoch": 1455} {"train_loss": -22.288389205932617, "global_step": 120793, "epoch": 1455} {"train_loss": -22.701709747314453, "global_step": 120794, "epoch": 1455} {"train_loss": -22.49653434753418, "global_step": 120795, "epoch": 1455} {"train_loss": -22.62607765197754, "global_step": 120796, "epoch": 1455} {"train_loss": -22.40963363647461, "global_step": 120797, "epoch": 1455} {"train_loss": -22.452878952026367, "global_step": 120798, "epoch": 1455} {"train_loss": -22.293100357055664, "global_step": 120799, "epoch": 1455} {"train_loss": -22.11445426940918, "global_step": 120800, "epoch": 1455} {"train_loss": -22.205900192260742, "global_step": 120801, "epoch": 1455} {"train_loss": -22.64678192138672, "global_step": 120802, "epoch": 1455} {"train_loss": -22.367218017578125, "global_step": 120803, "epoch": 1455} {"train_loss": -22.14596939086914, "global_step": 120804, "epoch": 1455} {"train_loss": -22.586261749267578, "global_step": 120805, "epoch": 1455} {"train_loss": -22.63983726501465, "global_step": 120806, "epoch": 1455} {"train_loss": -22.881864547729492, "global_step": 120807, "epoch": 1455} {"train_loss": -22.745874404907227, "global_step": 120808, "epoch": 1455} {"train_loss": -22.84779930114746, "global_step": 120809, "epoch": 1455} {"train_loss": -22.248416900634766, "global_step": 120810, "epoch": 1455} {"train_loss": -22.262378692626953, "global_step": 120811, "epoch": 1455} {"train_loss": -22.90497398376465, "global_step": 120812, "epoch": 1455} {"train_loss": -22.572797775268555, "global_step": 120813, "epoch": 1455} {"train_loss": -22.794431686401367, "global_step": 120814, "epoch": 1455} {"train_loss": -22.889726638793945, "global_step": 120815, "epoch": 1455} {"train_loss": -22.71769905090332, "global_step": 120816, "epoch": 1455} {"train_loss": -22.56251335144043, "global_step": 120817, "epoch": 1455} {"train_loss": -22.573205947875977, "global_step": 120818, "epoch": 1455} {"train_loss": -23.018634796142578, "global_step": 120819, "epoch": 1455} {"train_loss": -22.4595947265625, "global_step": 120820, "epoch": 1455} {"train_loss": -22.417375564575195, "global_step": 120821, "epoch": 1455} {"train_loss": -22.301624298095703, "global_step": 120822, "epoch": 1455} {"train_loss": -22.386999130249023, "global_step": 120823, "epoch": 1455} {"train_loss": -22.20029640197754, "global_step": 120824, "epoch": 1455} {"train_loss": -22.325632095336914, "global_step": 120825, "epoch": 1455} {"train_loss": -22.564910888671875, "global_step": 120826, "epoch": 1455} {"train_loss": -22.45728874206543, "global_step": 120827, "epoch": 1455} {"train_loss": -22.616376876831055, "global_step": 120828, "epoch": 1455} {"train_loss": -22.5684814453125, "global_step": 120829, "epoch": 1455} {"train_loss": -22.41328239440918, "global_step": 120830, "epoch": 1455} {"train_loss": -22.471464157104492, "global_step": 120831, "epoch": 1455} {"train_loss": -22.75094985961914, "global_step": 120832, "epoch": 1455} {"train_loss": -22.456392288208008, "global_step": 120833, "epoch": 1455} {"train_loss": -22.216999053955078, "global_step": 120834, "epoch": 1455} {"train_loss": -21.9352970123291, "global_step": 120835, "epoch": 1455} {"train_loss": -22.538192749023438, "global_step": 120836, "epoch": 1455} {"train_loss": -22.673952102661133, "global_step": 120837, "epoch": 1455} {"train_loss": -22.3936767578125, "global_step": 120838, "epoch": 1455} {"train_loss": -22.702749252319336, "global_step": 120839, "epoch": 1455} {"train_loss": -22.727529525756836, "global_step": 120840, "epoch": 1455} {"train_loss": -22.66798210144043, "global_step": 120841, "epoch": 1455} {"train_loss": -22.427587509155273, "global_step": 120842, "epoch": 1455} {"train_loss": -22.62308120727539, "global_step": 120843, "epoch": 1455} {"train_loss": -22.950347900390625, "global_step": 120844, "epoch": 1455} {"train_loss": -22.897933959960938, "global_step": 120845, "epoch": 1455} {"train_loss": -22.609655380249023, "global_step": 120846, "epoch": 1455} {"train_loss": -22.49890332049634, "global_step": 120847, "epoch": 1455, "val_loss": 6130454.5} {"train_loss": -22.060226440429688, "global_step": 120848, "epoch": 1456} {"train_loss": -22.222858428955078, "global_step": 120849, "epoch": 1456} {"train_loss": -22.316129684448242, "global_step": 120850, "epoch": 1456} {"train_loss": -22.602190017700195, "global_step": 120851, "epoch": 1456} {"train_loss": -22.149580001831055, "global_step": 120852, "epoch": 1456} {"train_loss": -21.998437881469727, "global_step": 120853, "epoch": 1456} {"train_loss": -22.484647750854492, "global_step": 120854, "epoch": 1456} {"train_loss": -22.814119338989258, "global_step": 120855, "epoch": 1456} {"train_loss": -22.29908561706543, "global_step": 120856, "epoch": 1456} {"train_loss": -22.399635314941406, "global_step": 120857, "epoch": 1456} {"train_loss": -22.054054260253906, "global_step": 120858, "epoch": 1456} {"train_loss": -22.26082420349121, "global_step": 120859, "epoch": 1456} {"train_loss": -22.179372787475586, "global_step": 120860, "epoch": 1456} {"train_loss": -22.55457878112793, "global_step": 120861, "epoch": 1456} {"train_loss": -22.536794662475586, "global_step": 120862, "epoch": 1456} {"train_loss": -22.73624038696289, "global_step": 120863, "epoch": 1456} {"train_loss": -22.503828048706055, "global_step": 120864, "epoch": 1456} {"train_loss": -22.550857543945312, "global_step": 120865, "epoch": 1456} {"train_loss": -22.911849975585938, "global_step": 120866, "epoch": 1456} {"train_loss": -22.326932907104492, "global_step": 120867, "epoch": 1456} {"train_loss": -22.391565322875977, "global_step": 120868, "epoch": 1456} {"train_loss": -22.644258499145508, "global_step": 120869, "epoch": 1456} {"train_loss": -22.71626091003418, "global_step": 120870, "epoch": 1456} {"train_loss": -22.103904724121094, "global_step": 120871, "epoch": 1456} {"train_loss": -22.63361930847168, "global_step": 120872, "epoch": 1456} {"train_loss": -22.472753524780273, "global_step": 120873, "epoch": 1456} {"train_loss": -22.769546508789062, "global_step": 120874, "epoch": 1456} {"train_loss": -22.328598022460938, "global_step": 120875, "epoch": 1456} {"train_loss": -22.3518009185791, "global_step": 120876, "epoch": 1456} {"train_loss": -22.70112419128418, "global_step": 120877, "epoch": 1456} {"train_loss": -22.8624210357666, "global_step": 120878, "epoch": 1456} {"train_loss": -22.55988311767578, "global_step": 120879, "epoch": 1456} {"train_loss": -22.940113067626953, "global_step": 120880, "epoch": 1456} {"train_loss": -22.715991973876953, "global_step": 120881, "epoch": 1456} {"train_loss": -22.14515495300293, "global_step": 120882, "epoch": 1456} {"train_loss": -22.619647979736328, "global_step": 120883, "epoch": 1456} {"train_loss": -22.65114402770996, "global_step": 120884, "epoch": 1456} {"train_loss": -22.42017936706543, "global_step": 120885, "epoch": 1456} {"train_loss": -22.821918487548828, "global_step": 120886, "epoch": 1456} {"train_loss": -22.332189559936523, "global_step": 120887, "epoch": 1456} {"train_loss": -22.062271118164062, "global_step": 120888, "epoch": 1456} {"train_loss": -22.429853439331055, "global_step": 120889, "epoch": 1456} {"train_loss": -22.39231300354004, "global_step": 120890, "epoch": 1456} {"train_loss": -22.309707641601562, "global_step": 120891, "epoch": 1456} {"train_loss": -22.263076782226562, "global_step": 120892, "epoch": 1456} {"train_loss": -22.667051315307617, "global_step": 120893, "epoch": 1456} {"train_loss": -22.413564682006836, "global_step": 120894, "epoch": 1456} {"train_loss": -22.40969467163086, "global_step": 120895, "epoch": 1456} {"train_loss": -22.14691734313965, "global_step": 120896, "epoch": 1456} {"train_loss": -22.388858795166016, "global_step": 120897, "epoch": 1456} {"train_loss": -22.76093864440918, "global_step": 120898, "epoch": 1456} {"train_loss": -22.658742904663086, "global_step": 120899, "epoch": 1456} {"train_loss": -22.546663284301758, "global_step": 120900, "epoch": 1456} {"train_loss": -22.741302490234375, "global_step": 120901, "epoch": 1456} {"train_loss": -22.299209594726562, "global_step": 120902, "epoch": 1456} {"train_loss": -22.735836029052734, "global_step": 120903, "epoch": 1456} {"train_loss": -22.615272521972656, "global_step": 120904, "epoch": 1456} {"train_loss": -22.694175720214844, "global_step": 120905, "epoch": 1456} {"train_loss": -22.682931900024414, "global_step": 120906, "epoch": 1456} {"train_loss": -22.368392944335938, "global_step": 120907, "epoch": 1456} {"train_loss": -22.518354415893555, "global_step": 120908, "epoch": 1456} {"train_loss": -22.706085205078125, "global_step": 120909, "epoch": 1456} {"train_loss": -22.586027145385742, "global_step": 120910, "epoch": 1456} {"train_loss": -23.0817928314209, "global_step": 120911, "epoch": 1456} {"train_loss": -22.508920669555664, "global_step": 120912, "epoch": 1456} {"train_loss": -22.313461303710938, "global_step": 120913, "epoch": 1456} {"train_loss": -22.61432647705078, "global_step": 120914, "epoch": 1456} {"train_loss": -22.483369827270508, "global_step": 120915, "epoch": 1456} {"train_loss": -22.87791633605957, "global_step": 120916, "epoch": 1456} {"train_loss": -22.505817413330078, "global_step": 120917, "epoch": 1456} {"train_loss": -22.766170501708984, "global_step": 120918, "epoch": 1456} {"train_loss": -22.895843505859375, "global_step": 120919, "epoch": 1456} {"train_loss": -22.686330795288086, "global_step": 120920, "epoch": 1456} {"train_loss": -22.48829460144043, "global_step": 120921, "epoch": 1456} {"train_loss": -22.564725875854492, "global_step": 120922, "epoch": 1456} {"train_loss": -22.586624145507812, "global_step": 120923, "epoch": 1456} {"train_loss": -22.889307022094727, "global_step": 120924, "epoch": 1456} {"train_loss": -22.58234214782715, "global_step": 120925, "epoch": 1456} {"train_loss": -22.51323127746582, "global_step": 120926, "epoch": 1456} {"train_loss": -22.898441314697266, "global_step": 120927, "epoch": 1456} {"train_loss": -22.368438720703125, "global_step": 120928, "epoch": 1456} {"train_loss": -22.567655563354492, "global_step": 120929, "epoch": 1456} {"train_loss": -22.537089244428888, "global_step": 120930, "epoch": 1456, "val_loss": 6288868.0} {"train_loss": -21.778919219970703, "global_step": 120931, "epoch": 1457} {"train_loss": -22.15116310119629, "global_step": 120932, "epoch": 1457} {"train_loss": -21.686111450195312, "global_step": 120933, "epoch": 1457} {"train_loss": -22.157939910888672, "global_step": 120934, "epoch": 1457} {"train_loss": -21.662147521972656, "global_step": 120935, "epoch": 1457} {"train_loss": -21.927928924560547, "global_step": 120936, "epoch": 1457} {"train_loss": -22.057004928588867, "global_step": 120937, "epoch": 1457} {"train_loss": -22.246885299682617, "global_step": 120938, "epoch": 1457} {"train_loss": -22.271696090698242, "global_step": 120939, "epoch": 1457} {"train_loss": -21.967214584350586, "global_step": 120940, "epoch": 1457} {"train_loss": -22.42991828918457, "global_step": 120941, "epoch": 1457} {"train_loss": -22.5513916015625, "global_step": 120942, "epoch": 1457} {"train_loss": -22.624189376831055, "global_step": 120943, "epoch": 1457} {"train_loss": -22.425914764404297, "global_step": 120944, "epoch": 1457} {"train_loss": -22.616792678833008, "global_step": 120945, "epoch": 1457} {"train_loss": -22.657371520996094, "global_step": 120946, "epoch": 1457} {"train_loss": -22.360727310180664, "global_step": 120947, "epoch": 1457} {"train_loss": -22.32390785217285, "global_step": 120948, "epoch": 1457} {"train_loss": -22.38576316833496, "global_step": 120949, "epoch": 1457} {"train_loss": -22.250282287597656, "global_step": 120950, "epoch": 1457} {"train_loss": -22.73946762084961, "global_step": 120951, "epoch": 1457} {"train_loss": -22.547666549682617, "global_step": 120952, "epoch": 1457} {"train_loss": -22.594221115112305, "global_step": 120953, "epoch": 1457} {"train_loss": -22.278989791870117, "global_step": 120954, "epoch": 1457} {"train_loss": -22.715356826782227, "global_step": 120955, "epoch": 1457} {"train_loss": -22.488855361938477, "global_step": 120956, "epoch": 1457} {"train_loss": -22.400876998901367, "global_step": 120957, "epoch": 1457} {"train_loss": -22.610889434814453, "global_step": 120958, "epoch": 1457} {"train_loss": -22.353788375854492, "global_step": 120959, "epoch": 1457} {"train_loss": -22.80421257019043, "global_step": 120960, "epoch": 1457} {"train_loss": -22.200754165649414, "global_step": 120961, "epoch": 1457} {"train_loss": -22.669170379638672, "global_step": 120962, "epoch": 1457} {"train_loss": -22.186220169067383, "global_step": 120963, "epoch": 1457} {"train_loss": -22.19148063659668, "global_step": 120964, "epoch": 1457} {"train_loss": -22.0572452545166, "global_step": 120965, "epoch": 1457} {"train_loss": -22.02203941345215, "global_step": 120966, "epoch": 1457} {"train_loss": -22.5966739654541, "global_step": 120967, "epoch": 1457} {"train_loss": -22.28916358947754, "global_step": 120968, "epoch": 1457} {"train_loss": -22.725879669189453, "global_step": 120969, "epoch": 1457} {"train_loss": -22.40044403076172, "global_step": 120970, "epoch": 1457} {"train_loss": -22.395206451416016, "global_step": 120971, "epoch": 1457} {"train_loss": -22.880537033081055, "global_step": 120972, "epoch": 1457} {"train_loss": -22.22625160217285, "global_step": 120973, "epoch": 1457} {"train_loss": -22.32225227355957, "global_step": 120974, "epoch": 1457} {"train_loss": -22.387388229370117, "global_step": 120975, "epoch": 1457} {"train_loss": -22.452232360839844, "global_step": 120976, "epoch": 1457} {"train_loss": -22.603361129760742, "global_step": 120977, "epoch": 1457} {"train_loss": -22.453630447387695, "global_step": 120978, "epoch": 1457} {"train_loss": -22.710330963134766, "global_step": 120979, "epoch": 1457} {"train_loss": -22.4222354888916, "global_step": 120980, "epoch": 1457} {"train_loss": -22.028539657592773, "global_step": 120981, "epoch": 1457} {"train_loss": -22.439838409423828, "global_step": 120982, "epoch": 1457} {"train_loss": -22.680801391601562, "global_step": 120983, "epoch": 1457} {"train_loss": -22.7297306060791, "global_step": 120984, "epoch": 1457} {"train_loss": -22.689870834350586, "global_step": 120985, "epoch": 1457} {"train_loss": -22.73029136657715, "global_step": 120986, "epoch": 1457} {"train_loss": -22.519201278686523, "global_step": 120987, "epoch": 1457} {"train_loss": -22.61409568786621, "global_step": 120988, "epoch": 1457} {"train_loss": -22.602825164794922, "global_step": 120989, "epoch": 1457} {"train_loss": -22.684009552001953, "global_step": 120990, "epoch": 1457} {"train_loss": -22.526559829711914, "global_step": 120991, "epoch": 1457} {"train_loss": -22.603513717651367, "global_step": 120992, "epoch": 1457} {"train_loss": -22.93096351623535, "global_step": 120993, "epoch": 1457} {"train_loss": -22.79115104675293, "global_step": 120994, "epoch": 1457} {"train_loss": -23.09271240234375, "global_step": 120995, "epoch": 1457} {"train_loss": -22.202451705932617, "global_step": 120996, "epoch": 1457} {"train_loss": -22.696868896484375, "global_step": 120997, "epoch": 1457} {"train_loss": -22.299314498901367, "global_step": 120998, "epoch": 1457} {"train_loss": -23.049997329711914, "global_step": 120999, "epoch": 1457} {"train_loss": -22.689682006835938, "global_step": 121000, "epoch": 1457} {"train_loss": -22.638874053955078, "global_step": 121001, "epoch": 1457} {"train_loss": -22.57692527770996, "global_step": 121002, "epoch": 1457} {"train_loss": -22.403120040893555, "global_step": 121003, "epoch": 1457} {"train_loss": -23.016559600830078, "global_step": 121004, "epoch": 1457} {"train_loss": -22.608217239379883, "global_step": 121005, "epoch": 1457} {"train_loss": -22.726043701171875, "global_step": 121006, "epoch": 1457} {"train_loss": -22.403884887695312, "global_step": 121007, "epoch": 1457} {"train_loss": -22.338491439819336, "global_step": 121008, "epoch": 1457} {"train_loss": -22.679737091064453, "global_step": 121009, "epoch": 1457} {"train_loss": -22.317914962768555, "global_step": 121010, "epoch": 1457} {"train_loss": -22.485942840576172, "global_step": 121011, "epoch": 1457} {"train_loss": -22.66841697692871, "global_step": 121012, "epoch": 1457} {"train_loss": -22.47382124935288, "global_step": 121013, "epoch": 1457, "val_loss": 6176614.0} {"train_loss": -22.16927146911621, "global_step": 121014, "epoch": 1458} {"train_loss": -22.157079696655273, "global_step": 121015, "epoch": 1458} {"train_loss": -22.04467010498047, "global_step": 121016, "epoch": 1458} {"train_loss": -22.2650146484375, "global_step": 121017, "epoch": 1458} {"train_loss": -22.565147399902344, "global_step": 121018, "epoch": 1458} {"train_loss": -21.92671012878418, "global_step": 121019, "epoch": 1458} {"train_loss": -22.40658187866211, "global_step": 121020, "epoch": 1458} {"train_loss": -22.3109073638916, "global_step": 121021, "epoch": 1458} {"train_loss": -22.013751983642578, "global_step": 121022, "epoch": 1458} {"train_loss": -22.571378707885742, "global_step": 121023, "epoch": 1458} {"train_loss": -21.822431564331055, "global_step": 121024, "epoch": 1458} {"train_loss": -22.582311630249023, "global_step": 121025, "epoch": 1458} {"train_loss": -22.361082077026367, "global_step": 121026, "epoch": 1458} {"train_loss": -22.39759635925293, "global_step": 121027, "epoch": 1458} {"train_loss": -22.129554748535156, "global_step": 121028, "epoch": 1458} {"train_loss": -22.36968421936035, "global_step": 121029, "epoch": 1458} {"train_loss": -22.867563247680664, "global_step": 121030, "epoch": 1458} {"train_loss": -22.559804916381836, "global_step": 121031, "epoch": 1458} {"train_loss": -22.44153594970703, "global_step": 121032, "epoch": 1458} {"train_loss": -22.352691650390625, "global_step": 121033, "epoch": 1458} {"train_loss": -22.546913146972656, "global_step": 121034, "epoch": 1458} {"train_loss": -22.638736724853516, "global_step": 121035, "epoch": 1458} {"train_loss": -22.5340576171875, "global_step": 121036, "epoch": 1458} {"train_loss": -22.649845123291016, "global_step": 121037, "epoch": 1458} {"train_loss": -22.37541961669922, "global_step": 121038, "epoch": 1458} {"train_loss": -22.16718101501465, "global_step": 121039, "epoch": 1458} {"train_loss": -22.672109603881836, "global_step": 121040, "epoch": 1458} {"train_loss": -22.47208595275879, "global_step": 121041, "epoch": 1458} {"train_loss": -22.6356201171875, "global_step": 121042, "epoch": 1458} {"train_loss": -22.734651565551758, "global_step": 121043, "epoch": 1458} {"train_loss": -22.707090377807617, "global_step": 121044, "epoch": 1458} {"train_loss": -22.965871810913086, "global_step": 121045, "epoch": 1458} {"train_loss": -22.87078094482422, "global_step": 121046, "epoch": 1458} {"train_loss": -22.34360694885254, "global_step": 121047, "epoch": 1458} {"train_loss": -22.58106803894043, "global_step": 121048, "epoch": 1458} {"train_loss": -22.778457641601562, "global_step": 121049, "epoch": 1458} {"train_loss": -22.466318130493164, "global_step": 121050, "epoch": 1458} {"train_loss": -22.887575149536133, "global_step": 121051, "epoch": 1458} {"train_loss": -22.510234832763672, "global_step": 121052, "epoch": 1458} {"train_loss": -22.691326141357422, "global_step": 121053, "epoch": 1458} {"train_loss": -22.61513328552246, "global_step": 121054, "epoch": 1458} {"train_loss": -22.61959457397461, "global_step": 121055, "epoch": 1458} {"train_loss": -22.67266845703125, "global_step": 121056, "epoch": 1458} {"train_loss": -22.915796279907227, "global_step": 121057, "epoch": 1458} {"train_loss": -22.62031364440918, "global_step": 121058, "epoch": 1458} {"train_loss": -22.493457794189453, "global_step": 121059, "epoch": 1458} {"train_loss": -22.827741622924805, "global_step": 121060, "epoch": 1458} {"train_loss": -22.74248504638672, "global_step": 121061, "epoch": 1458} {"train_loss": -22.626483917236328, "global_step": 121062, "epoch": 1458} {"train_loss": -22.947734832763672, "global_step": 121063, "epoch": 1458} {"train_loss": -22.668689727783203, "global_step": 121064, "epoch": 1458} {"train_loss": -22.590742111206055, "global_step": 121065, "epoch": 1458} {"train_loss": -22.476408004760742, "global_step": 121066, "epoch": 1458} {"train_loss": -22.718067169189453, "global_step": 121067, "epoch": 1458} {"train_loss": -22.661075592041016, "global_step": 121068, "epoch": 1458} {"train_loss": -22.629541397094727, "global_step": 121069, "epoch": 1458} {"train_loss": -22.503768920898438, "global_step": 121070, "epoch": 1458} {"train_loss": -22.735095977783203, "global_step": 121071, "epoch": 1458} {"train_loss": -22.295042037963867, "global_step": 121072, "epoch": 1458} {"train_loss": -22.383020401000977, "global_step": 121073, "epoch": 1458} {"train_loss": -22.816015243530273, "global_step": 121074, "epoch": 1458} {"train_loss": -22.439558029174805, "global_step": 121075, "epoch": 1458} {"train_loss": -22.38856315612793, "global_step": 121076, "epoch": 1458} {"train_loss": -22.849746704101562, "global_step": 121077, "epoch": 1458} {"train_loss": -22.896209716796875, "global_step": 121078, "epoch": 1458} {"train_loss": -22.2476863861084, "global_step": 121079, "epoch": 1458} {"train_loss": -22.655818939208984, "global_step": 121080, "epoch": 1458} {"train_loss": -22.269140243530273, "global_step": 121081, "epoch": 1458} {"train_loss": -22.712854385375977, "global_step": 121082, "epoch": 1458} {"train_loss": -22.854049682617188, "global_step": 121083, "epoch": 1458} {"train_loss": -22.606565475463867, "global_step": 121084, "epoch": 1458} {"train_loss": -22.75855255126953, "global_step": 121085, "epoch": 1458} {"train_loss": -22.794469833374023, "global_step": 121086, "epoch": 1458} {"train_loss": -22.60831642150879, "global_step": 121087, "epoch": 1458} {"train_loss": -22.913040161132812, "global_step": 121088, "epoch": 1458} {"train_loss": -22.942052841186523, "global_step": 121089, "epoch": 1458} {"train_loss": -22.623382568359375, "global_step": 121090, "epoch": 1458} {"train_loss": -22.58304214477539, "global_step": 121091, "epoch": 1458} {"train_loss": -22.951519012451172, "global_step": 121092, "epoch": 1458} {"train_loss": -22.413997650146484, "global_step": 121093, "epoch": 1458} {"train_loss": -22.504732131958008, "global_step": 121094, "epoch": 1458} {"train_loss": -22.815982818603516, "global_step": 121095, "epoch": 1458} {"train_loss": -22.555537901728986, "global_step": 121096, "epoch": 1458, "val_loss": 6314887.0} {"train_loss": -22.638147354125977, "global_step": 121097, "epoch": 1459} {"train_loss": -22.703365325927734, "global_step": 121098, "epoch": 1459} {"train_loss": -22.392108917236328, "global_step": 121099, "epoch": 1459} {"train_loss": -22.338598251342773, "global_step": 121100, "epoch": 1459} {"train_loss": -22.032489776611328, "global_step": 121101, "epoch": 1459} {"train_loss": -22.498132705688477, "global_step": 121102, "epoch": 1459} {"train_loss": -22.28026580810547, "global_step": 121103, "epoch": 1459} {"train_loss": -22.623586654663086, "global_step": 121104, "epoch": 1459} {"train_loss": -22.371244430541992, "global_step": 121105, "epoch": 1459} {"train_loss": -22.641357421875, "global_step": 121106, "epoch": 1459} {"train_loss": -22.19463539123535, "global_step": 121107, "epoch": 1459} {"train_loss": -22.227514266967773, "global_step": 121108, "epoch": 1459} {"train_loss": -22.755521774291992, "global_step": 121109, "epoch": 1459} {"train_loss": -22.77435874938965, "global_step": 121110, "epoch": 1459} {"train_loss": -22.441762924194336, "global_step": 121111, "epoch": 1459} {"train_loss": -22.128206253051758, "global_step": 121112, "epoch": 1459} {"train_loss": -22.843666076660156, "global_step": 121113, "epoch": 1459} {"train_loss": -22.348989486694336, "global_step": 121114, "epoch": 1459} {"train_loss": -22.361421585083008, "global_step": 121115, "epoch": 1459} {"train_loss": -22.65913200378418, "global_step": 121116, "epoch": 1459} {"train_loss": -22.468463897705078, "global_step": 121117, "epoch": 1459} {"train_loss": -22.639759063720703, "global_step": 121118, "epoch": 1459} {"train_loss": -22.601131439208984, "global_step": 121119, "epoch": 1459} {"train_loss": -22.881452560424805, "global_step": 121120, "epoch": 1459} {"train_loss": -22.558216094970703, "global_step": 121121, "epoch": 1459} {"train_loss": -22.51761817932129, "global_step": 121122, "epoch": 1459} {"train_loss": -22.711973190307617, "global_step": 121123, "epoch": 1459} {"train_loss": -22.398908615112305, "global_step": 121124, "epoch": 1459} {"train_loss": -22.451892852783203, "global_step": 121125, "epoch": 1459} {"train_loss": -22.670164108276367, "global_step": 121126, "epoch": 1459} {"train_loss": -22.937820434570312, "global_step": 121127, "epoch": 1459} {"train_loss": -22.713233947753906, "global_step": 121128, "epoch": 1459} {"train_loss": -22.885990142822266, "global_step": 121129, "epoch": 1459} {"train_loss": -22.783809661865234, "global_step": 121130, "epoch": 1459} {"train_loss": -22.38985252380371, "global_step": 121131, "epoch": 1459} {"train_loss": -22.821067810058594, "global_step": 121132, "epoch": 1459} {"train_loss": -22.74368667602539, "global_step": 121133, "epoch": 1459} {"train_loss": -22.82098388671875, "global_step": 121134, "epoch": 1459} {"train_loss": -22.429899215698242, "global_step": 121135, "epoch": 1459} {"train_loss": -22.453699111938477, "global_step": 121136, "epoch": 1459} {"train_loss": -22.89967155456543, "global_step": 121137, "epoch": 1459} {"train_loss": -22.90292739868164, "global_step": 121138, "epoch": 1459} {"train_loss": -22.21761703491211, "global_step": 121139, "epoch": 1459} {"train_loss": -22.707412719726562, "global_step": 121140, "epoch": 1459} {"train_loss": -22.316993713378906, "global_step": 121141, "epoch": 1459} {"train_loss": -22.505802154541016, "global_step": 121142, "epoch": 1459} {"train_loss": -22.39948272705078, "global_step": 121143, "epoch": 1459} {"train_loss": -22.470916748046875, "global_step": 121144, "epoch": 1459} {"train_loss": -22.237028121948242, "global_step": 121145, "epoch": 1459} {"train_loss": -22.693822860717773, "global_step": 121146, "epoch": 1459} {"train_loss": -22.73464584350586, "global_step": 121147, "epoch": 1459} {"train_loss": -22.3712100982666, "global_step": 121148, "epoch": 1459} {"train_loss": -22.412181854248047, "global_step": 121149, "epoch": 1459} {"train_loss": -22.630788803100586, "global_step": 121150, "epoch": 1459} {"train_loss": -22.42793846130371, "global_step": 121151, "epoch": 1459} {"train_loss": -22.619827270507812, "global_step": 121152, "epoch": 1459} {"train_loss": -22.706348419189453, "global_step": 121153, "epoch": 1459} {"train_loss": -22.5284481048584, "global_step": 121154, "epoch": 1459} {"train_loss": -22.45111846923828, "global_step": 121155, "epoch": 1459} {"train_loss": -22.566675186157227, "global_step": 121156, "epoch": 1459} {"train_loss": -22.50731658935547, "global_step": 121157, "epoch": 1459} {"train_loss": -22.552968978881836, "global_step": 121158, "epoch": 1459} {"train_loss": -22.577289581298828, "global_step": 121159, "epoch": 1459} {"train_loss": -22.65003776550293, "global_step": 121160, "epoch": 1459} {"train_loss": -22.772918701171875, "global_step": 121161, "epoch": 1459} {"train_loss": -22.790895462036133, "global_step": 121162, "epoch": 1459} {"train_loss": -22.801315307617188, "global_step": 121163, "epoch": 1459} {"train_loss": -22.694334030151367, "global_step": 121164, "epoch": 1459} {"train_loss": -22.234615325927734, "global_step": 121165, "epoch": 1459} {"train_loss": -22.5079402923584, "global_step": 121166, "epoch": 1459} {"train_loss": -22.601465225219727, "global_step": 121167, "epoch": 1459} {"train_loss": -22.55535888671875, "global_step": 121168, "epoch": 1459} {"train_loss": -22.373319625854492, "global_step": 121169, "epoch": 1459} {"train_loss": -22.64476776123047, "global_step": 121170, "epoch": 1459} {"train_loss": -22.632192611694336, "global_step": 121171, "epoch": 1459} {"train_loss": -22.256410598754883, "global_step": 121172, "epoch": 1459} {"train_loss": -22.659223556518555, "global_step": 121173, "epoch": 1459} {"train_loss": -22.594907760620117, "global_step": 121174, "epoch": 1459} {"train_loss": -22.173368453979492, "global_step": 121175, "epoch": 1459} {"train_loss": -22.464496612548828, "global_step": 121176, "epoch": 1459} {"train_loss": -22.55500602722168, "global_step": 121177, "epoch": 1459} {"train_loss": -22.5573787689209, "global_step": 121178, "epoch": 1459} {"train_loss": -22.53854792951101, "global_step": 121179, "epoch": 1459, "val_loss": 6298843.0} {"train_loss": -22.671478271484375, "global_step": 121180, "epoch": 1460} {"train_loss": -22.207786560058594, "global_step": 121181, "epoch": 1460} {"train_loss": -21.969623565673828, "global_step": 121182, "epoch": 1460} {"train_loss": -22.354259490966797, "global_step": 121183, "epoch": 1460} {"train_loss": -22.275794982910156, "global_step": 121184, "epoch": 1460} {"train_loss": -22.04047966003418, "global_step": 121185, "epoch": 1460} {"train_loss": -22.211441040039062, "global_step": 121186, "epoch": 1460} {"train_loss": -22.339181900024414, "global_step": 121187, "epoch": 1460} {"train_loss": -22.715824127197266, "global_step": 121188, "epoch": 1460} {"train_loss": -22.056137084960938, "global_step": 121189, "epoch": 1460} {"train_loss": -21.960851669311523, "global_step": 121190, "epoch": 1460} {"train_loss": -22.542280197143555, "global_step": 121191, "epoch": 1460} {"train_loss": -22.211212158203125, "global_step": 121192, "epoch": 1460} {"train_loss": -21.984434127807617, "global_step": 121193, "epoch": 1460} {"train_loss": -21.913745880126953, "global_step": 121194, "epoch": 1460} {"train_loss": -21.941274642944336, "global_step": 121195, "epoch": 1460} {"train_loss": -22.473356246948242, "global_step": 121196, "epoch": 1460} {"train_loss": -22.017778396606445, "global_step": 121197, "epoch": 1460} {"train_loss": -22.75328254699707, "global_step": 121198, "epoch": 1460} {"train_loss": -22.720029830932617, "global_step": 121199, "epoch": 1460} {"train_loss": -22.27178955078125, "global_step": 121200, "epoch": 1460} {"train_loss": -22.351293563842773, "global_step": 121201, "epoch": 1460} {"train_loss": -22.770721435546875, "global_step": 121202, "epoch": 1460} {"train_loss": -22.145231246948242, "global_step": 121203, "epoch": 1460} {"train_loss": -22.59880256652832, "global_step": 121204, "epoch": 1460} {"train_loss": -22.294620513916016, "global_step": 121205, "epoch": 1460} {"train_loss": -22.123598098754883, "global_step": 121206, "epoch": 1460} {"train_loss": -22.31129264831543, "global_step": 121207, "epoch": 1460} {"train_loss": -22.727371215820312, "global_step": 121208, "epoch": 1460} {"train_loss": -22.013914108276367, "global_step": 121209, "epoch": 1460} {"train_loss": -22.086944580078125, "global_step": 121210, "epoch": 1460} {"train_loss": -22.12373161315918, "global_step": 121211, "epoch": 1460} {"train_loss": -22.436391830444336, "global_step": 121212, "epoch": 1460} {"train_loss": -22.434072494506836, "global_step": 121213, "epoch": 1460} {"train_loss": -22.389209747314453, "global_step": 121214, "epoch": 1460} {"train_loss": -22.584365844726562, "global_step": 121215, "epoch": 1460} {"train_loss": -22.236480712890625, "global_step": 121216, "epoch": 1460} {"train_loss": -22.954917907714844, "global_step": 121217, "epoch": 1460} {"train_loss": -22.33009147644043, "global_step": 121218, "epoch": 1460} {"train_loss": -22.50077247619629, "global_step": 121219, "epoch": 1460} {"train_loss": -22.669296264648438, "global_step": 121220, "epoch": 1460} {"train_loss": -22.479095458984375, "global_step": 121221, "epoch": 1460} {"train_loss": -22.86720085144043, "global_step": 121222, "epoch": 1460} {"train_loss": -22.804426193237305, "global_step": 121223, "epoch": 1460} {"train_loss": -22.461549758911133, "global_step": 121224, "epoch": 1460} {"train_loss": -22.525419235229492, "global_step": 121225, "epoch": 1460} {"train_loss": -22.272457122802734, "global_step": 121226, "epoch": 1460} {"train_loss": -22.5143985748291, "global_step": 121227, "epoch": 1460} {"train_loss": -22.33868408203125, "global_step": 121228, "epoch": 1460} {"train_loss": -22.708316802978516, "global_step": 121229, "epoch": 1460} {"train_loss": -22.898090362548828, "global_step": 121230, "epoch": 1460} {"train_loss": -22.728328704833984, "global_step": 121231, "epoch": 1460} {"train_loss": -22.780719757080078, "global_step": 121232, "epoch": 1460} {"train_loss": -22.953100204467773, "global_step": 121233, "epoch": 1460} {"train_loss": -22.08116912841797, "global_step": 121234, "epoch": 1460} {"train_loss": -22.520429611206055, "global_step": 121235, "epoch": 1460} {"train_loss": -22.797203063964844, "global_step": 121236, "epoch": 1460} {"train_loss": -22.515121459960938, "global_step": 121237, "epoch": 1460} {"train_loss": -22.487878799438477, "global_step": 121238, "epoch": 1460} {"train_loss": -22.503376007080078, "global_step": 121239, "epoch": 1460} {"train_loss": -22.77227020263672, "global_step": 121240, "epoch": 1460} {"train_loss": -22.517168045043945, "global_step": 121241, "epoch": 1460} {"train_loss": -22.548046112060547, "global_step": 121242, "epoch": 1460} {"train_loss": -22.43691062927246, "global_step": 121243, "epoch": 1460} {"train_loss": -22.136157989501953, "global_step": 121244, "epoch": 1460} {"train_loss": -22.470458984375, "global_step": 121245, "epoch": 1460} {"train_loss": -22.53243064880371, "global_step": 121246, "epoch": 1460} {"train_loss": -22.86768913269043, "global_step": 121247, "epoch": 1460} {"train_loss": -22.7545223236084, "global_step": 121248, "epoch": 1460} {"train_loss": -22.511341094970703, "global_step": 121249, "epoch": 1460} {"train_loss": -22.460615158081055, "global_step": 121250, "epoch": 1460} {"train_loss": -22.681058883666992, "global_step": 121251, "epoch": 1460} {"train_loss": -22.873172760009766, "global_step": 121252, "epoch": 1460} {"train_loss": -22.522300720214844, "global_step": 121253, "epoch": 1460} {"train_loss": -22.840314865112305, "global_step": 121254, "epoch": 1460} {"train_loss": -22.667377471923828, "global_step": 121255, "epoch": 1460} {"train_loss": -22.697416305541992, "global_step": 121256, "epoch": 1460} {"train_loss": -22.522350311279297, "global_step": 121257, "epoch": 1460} {"train_loss": -22.518878936767578, "global_step": 121258, "epoch": 1460} {"train_loss": -22.534652709960938, "global_step": 121259, "epoch": 1460} {"train_loss": -22.74941062927246, "global_step": 121260, "epoch": 1460} {"train_loss": -22.795175552368164, "global_step": 121261, "epoch": 1460} {"train_loss": -22.468954867627247, "global_step": 121262, "epoch": 1460, "val_loss": 6223063.0} {"train_loss": -21.903827667236328, "global_step": 121263, "epoch": 1461} {"train_loss": -21.74970817565918, "global_step": 121264, "epoch": 1461} {"train_loss": -22.294767379760742, "global_step": 121265, "epoch": 1461} {"train_loss": -22.101486206054688, "global_step": 121266, "epoch": 1461} {"train_loss": -22.64436912536621, "global_step": 121267, "epoch": 1461} {"train_loss": -22.29495620727539, "global_step": 121268, "epoch": 1461} {"train_loss": -22.221668243408203, "global_step": 121269, "epoch": 1461} {"train_loss": -22.593420028686523, "global_step": 121270, "epoch": 1461} {"train_loss": -22.352481842041016, "global_step": 121271, "epoch": 1461} {"train_loss": -22.395954132080078, "global_step": 121272, "epoch": 1461} {"train_loss": -22.528606414794922, "global_step": 121273, "epoch": 1461} {"train_loss": -22.3341007232666, "global_step": 121274, "epoch": 1461} {"train_loss": -22.559011459350586, "global_step": 121275, "epoch": 1461} {"train_loss": -22.607877731323242, "global_step": 121276, "epoch": 1461} {"train_loss": -22.350900650024414, "global_step": 121277, "epoch": 1461} {"train_loss": -22.6824893951416, "global_step": 121278, "epoch": 1461} {"train_loss": -22.390384674072266, "global_step": 121279, "epoch": 1461} {"train_loss": -22.657394409179688, "global_step": 121280, "epoch": 1461} {"train_loss": -22.276975631713867, "global_step": 121281, "epoch": 1461} {"train_loss": -22.453805923461914, "global_step": 121282, "epoch": 1461} {"train_loss": -22.612234115600586, "global_step": 121283, "epoch": 1461} {"train_loss": -22.847986221313477, "global_step": 121284, "epoch": 1461} {"train_loss": -22.604421615600586, "global_step": 121285, "epoch": 1461} {"train_loss": -22.625640869140625, "global_step": 121286, "epoch": 1461} {"train_loss": -22.65461540222168, "global_step": 121287, "epoch": 1461} {"train_loss": -22.341739654541016, "global_step": 121288, "epoch": 1461} {"train_loss": -22.792621612548828, "global_step": 121289, "epoch": 1461} {"train_loss": -22.617116928100586, "global_step": 121290, "epoch": 1461} {"train_loss": -22.80902099609375, "global_step": 121291, "epoch": 1461} {"train_loss": -22.818910598754883, "global_step": 121292, "epoch": 1461} {"train_loss": -22.667484283447266, "global_step": 121293, "epoch": 1461} {"train_loss": -23.011463165283203, "global_step": 121294, "epoch": 1461} {"train_loss": -22.52919578552246, "global_step": 121295, "epoch": 1461} {"train_loss": -22.252897262573242, "global_step": 121296, "epoch": 1461} {"train_loss": -22.562698364257812, "global_step": 121297, "epoch": 1461} {"train_loss": -22.588499069213867, "global_step": 121298, "epoch": 1461} {"train_loss": -22.77557945251465, "global_step": 121299, "epoch": 1461} {"train_loss": -22.23555564880371, "global_step": 121300, "epoch": 1461} {"train_loss": -22.163320541381836, "global_step": 121301, "epoch": 1461} {"train_loss": -21.575456619262695, "global_step": 121302, "epoch": 1461} {"train_loss": -22.159841537475586, "global_step": 121303, "epoch": 1461} {"train_loss": -21.99334716796875, "global_step": 121304, "epoch": 1461} {"train_loss": -21.847816467285156, "global_step": 121305, "epoch": 1461} {"train_loss": -22.303518295288086, "global_step": 121306, "epoch": 1461} {"train_loss": -22.41056251525879, "global_step": 121307, "epoch": 1461} {"train_loss": -22.27924919128418, "global_step": 121308, "epoch": 1461} {"train_loss": -22.589569091796875, "global_step": 121309, "epoch": 1461} {"train_loss": -22.33395767211914, "global_step": 121310, "epoch": 1461} {"train_loss": -21.885025024414062, "global_step": 121311, "epoch": 1461} {"train_loss": -22.334598541259766, "global_step": 121312, "epoch": 1461} {"train_loss": -22.278518676757812, "global_step": 121313, "epoch": 1461} {"train_loss": -22.88899803161621, "global_step": 121314, "epoch": 1461} {"train_loss": -22.292890548706055, "global_step": 121315, "epoch": 1461} {"train_loss": -22.183652877807617, "global_step": 121316, "epoch": 1461} {"train_loss": -22.22086524963379, "global_step": 121317, "epoch": 1461} {"train_loss": -22.684961318969727, "global_step": 121318, "epoch": 1461} {"train_loss": -22.60231590270996, "global_step": 121319, "epoch": 1461} {"train_loss": -22.678516387939453, "global_step": 121320, "epoch": 1461} {"train_loss": -22.71965217590332, "global_step": 121321, "epoch": 1461} {"train_loss": -22.655372619628906, "global_step": 121322, "epoch": 1461} {"train_loss": -22.139493942260742, "global_step": 121323, "epoch": 1461} {"train_loss": -22.419652938842773, "global_step": 121324, "epoch": 1461} {"train_loss": -22.902307510375977, "global_step": 121325, "epoch": 1461} {"train_loss": -22.626333236694336, "global_step": 121326, "epoch": 1461} {"train_loss": -22.704660415649414, "global_step": 121327, "epoch": 1461} {"train_loss": -22.687732696533203, "global_step": 121328, "epoch": 1461} {"train_loss": -22.40865135192871, "global_step": 121329, "epoch": 1461} {"train_loss": -22.56092643737793, "global_step": 121330, "epoch": 1461} {"train_loss": -22.82503318786621, "global_step": 121331, "epoch": 1461} {"train_loss": -22.625009536743164, "global_step": 121332, "epoch": 1461} {"train_loss": -22.515731811523438, "global_step": 121333, "epoch": 1461} {"train_loss": -22.542984008789062, "global_step": 121334, "epoch": 1461} {"train_loss": -22.589162826538086, "global_step": 121335, "epoch": 1461} {"train_loss": -22.89484214782715, "global_step": 121336, "epoch": 1461} {"train_loss": -22.211416244506836, "global_step": 121337, "epoch": 1461} {"train_loss": -22.174158096313477, "global_step": 121338, "epoch": 1461} {"train_loss": -22.063329696655273, "global_step": 121339, "epoch": 1461} {"train_loss": -22.25017738342285, "global_step": 121340, "epoch": 1461} {"train_loss": -22.780771255493164, "global_step": 121341, "epoch": 1461} {"train_loss": -22.73059844970703, "global_step": 121342, "epoch": 1461} {"train_loss": -22.37948989868164, "global_step": 121343, "epoch": 1461} {"train_loss": -22.418228149414062, "global_step": 121344, "epoch": 1461} {"train_loss": -22.448403071208173, "global_step": 121345, "epoch": 1461, "val_loss": 6261405.5} {"train_loss": -22.236190795898438, "global_step": 121346, "epoch": 1462} {"train_loss": -22.50575065612793, "global_step": 121347, "epoch": 1462} {"train_loss": -22.363672256469727, "global_step": 121348, "epoch": 1462} {"train_loss": -22.11474609375, "global_step": 121349, "epoch": 1462} {"train_loss": -22.56470489501953, "global_step": 121350, "epoch": 1462} {"train_loss": -22.15241050720215, "global_step": 121351, "epoch": 1462} {"train_loss": -22.376306533813477, "global_step": 121352, "epoch": 1462} {"train_loss": -22.103158950805664, "global_step": 121353, "epoch": 1462} {"train_loss": -22.1236629486084, "global_step": 121354, "epoch": 1462} {"train_loss": -22.608562469482422, "global_step": 121355, "epoch": 1462} {"train_loss": -22.383909225463867, "global_step": 121356, "epoch": 1462} {"train_loss": -22.4432373046875, "global_step": 121357, "epoch": 1462} {"train_loss": -22.674850463867188, "global_step": 121358, "epoch": 1462} {"train_loss": -22.707626342773438, "global_step": 121359, "epoch": 1462} {"train_loss": -22.518789291381836, "global_step": 121360, "epoch": 1462} {"train_loss": -22.241806030273438, "global_step": 121361, "epoch": 1462} {"train_loss": -22.5837345123291, "global_step": 121362, "epoch": 1462} {"train_loss": -22.502702713012695, "global_step": 121363, "epoch": 1462} {"train_loss": -22.8360538482666, "global_step": 121364, "epoch": 1462} {"train_loss": -22.6062068939209, "global_step": 121365, "epoch": 1462} {"train_loss": -22.720651626586914, "global_step": 121366, "epoch": 1462} {"train_loss": -22.6637020111084, "global_step": 121367, "epoch": 1462} {"train_loss": -22.973844528198242, "global_step": 121368, "epoch": 1462} {"train_loss": -22.412353515625, "global_step": 121369, "epoch": 1462} {"train_loss": -22.77064323425293, "global_step": 121370, "epoch": 1462} {"train_loss": -22.57952117919922, "global_step": 121371, "epoch": 1462} {"train_loss": -22.685504913330078, "global_step": 121372, "epoch": 1462} {"train_loss": -22.613210678100586, "global_step": 121373, "epoch": 1462} {"train_loss": -22.688528060913086, "global_step": 121374, "epoch": 1462} {"train_loss": -22.69831657409668, "global_step": 121375, "epoch": 1462} {"train_loss": -22.5632381439209, "global_step": 121376, "epoch": 1462} {"train_loss": -23.0507869720459, "global_step": 121377, "epoch": 1462} {"train_loss": -22.596750259399414, "global_step": 121378, "epoch": 1462} {"train_loss": -22.465879440307617, "global_step": 121379, "epoch": 1462} {"train_loss": -22.540252685546875, "global_step": 121380, "epoch": 1462} {"train_loss": -22.0841007232666, "global_step": 121381, "epoch": 1462} {"train_loss": -22.69179344177246, "global_step": 121382, "epoch": 1462} {"train_loss": -22.71943473815918, "global_step": 121383, "epoch": 1462} {"train_loss": -22.615812301635742, "global_step": 121384, "epoch": 1462} {"train_loss": -22.627973556518555, "global_step": 121385, "epoch": 1462} {"train_loss": -22.827482223510742, "global_step": 121386, "epoch": 1462} {"train_loss": -22.688920974731445, "global_step": 121387, "epoch": 1462} {"train_loss": -22.88150405883789, "global_step": 121388, "epoch": 1462} {"train_loss": -22.3011474609375, "global_step": 121389, "epoch": 1462} {"train_loss": -22.19659996032715, "global_step": 121390, "epoch": 1462} {"train_loss": -22.540958404541016, "global_step": 121391, "epoch": 1462} {"train_loss": -22.587329864501953, "global_step": 121392, "epoch": 1462} {"train_loss": -22.340763092041016, "global_step": 121393, "epoch": 1462} {"train_loss": -22.60907554626465, "global_step": 121394, "epoch": 1462} {"train_loss": -22.119583129882812, "global_step": 121395, "epoch": 1462} {"train_loss": -22.53619956970215, "global_step": 121396, "epoch": 1462} {"train_loss": -22.302099227905273, "global_step": 121397, "epoch": 1462} {"train_loss": -22.456464767456055, "global_step": 121398, "epoch": 1462} {"train_loss": -22.41737937927246, "global_step": 121399, "epoch": 1462} {"train_loss": -22.163066864013672, "global_step": 121400, "epoch": 1462} {"train_loss": -22.597375869750977, "global_step": 121401, "epoch": 1462} {"train_loss": -22.529468536376953, "global_step": 121402, "epoch": 1462} {"train_loss": -22.736616134643555, "global_step": 121403, "epoch": 1462} {"train_loss": -22.426738739013672, "global_step": 121404, "epoch": 1462} {"train_loss": -22.289798736572266, "global_step": 121405, "epoch": 1462} {"train_loss": -22.830121994018555, "global_step": 121406, "epoch": 1462} {"train_loss": -22.666534423828125, "global_step": 121407, "epoch": 1462} {"train_loss": -22.357099533081055, "global_step": 121408, "epoch": 1462} {"train_loss": -22.765262603759766, "global_step": 121409, "epoch": 1462} {"train_loss": -22.470844268798828, "global_step": 121410, "epoch": 1462} {"train_loss": -22.52321434020996, "global_step": 121411, "epoch": 1462} {"train_loss": -22.613027572631836, "global_step": 121412, "epoch": 1462} {"train_loss": -22.56593894958496, "global_step": 121413, "epoch": 1462} {"train_loss": -22.272171020507812, "global_step": 121414, "epoch": 1462} {"train_loss": -22.869565963745117, "global_step": 121415, "epoch": 1462} {"train_loss": -22.677663803100586, "global_step": 121416, "epoch": 1462} {"train_loss": -22.60377311706543, "global_step": 121417, "epoch": 1462} {"train_loss": -22.717716217041016, "global_step": 121418, "epoch": 1462} {"train_loss": -22.63054656982422, "global_step": 121419, "epoch": 1462} {"train_loss": -22.575132369995117, "global_step": 121420, "epoch": 1462} {"train_loss": -22.786514282226562, "global_step": 121421, "epoch": 1462} {"train_loss": -22.3247127532959, "global_step": 121422, "epoch": 1462} {"train_loss": -22.599599838256836, "global_step": 121423, "epoch": 1462} {"train_loss": -22.223421096801758, "global_step": 121424, "epoch": 1462} {"train_loss": -22.70452117919922, "global_step": 121425, "epoch": 1462} {"train_loss": -22.496274948120117, "global_step": 121426, "epoch": 1462} {"train_loss": -22.786588668823242, "global_step": 121427, "epoch": 1462} {"train_loss": -22.53310132313924, "global_step": 121428, "epoch": 1462, "val_loss": 6271493.0} {"train_loss": -22.035903930664062, "global_step": 121429, "epoch": 1463} {"train_loss": -22.136722564697266, "global_step": 121430, "epoch": 1463} {"train_loss": -21.968509674072266, "global_step": 121431, "epoch": 1463} {"train_loss": -22.5539493560791, "global_step": 121432, "epoch": 1463} {"train_loss": -22.304040908813477, "global_step": 121433, "epoch": 1463} {"train_loss": -21.766353607177734, "global_step": 121434, "epoch": 1463} {"train_loss": -22.17234230041504, "global_step": 121435, "epoch": 1463} {"train_loss": -22.095006942749023, "global_step": 121436, "epoch": 1463} {"train_loss": -21.88081932067871, "global_step": 121437, "epoch": 1463} {"train_loss": -22.39572525024414, "global_step": 121438, "epoch": 1463} {"train_loss": -22.06915855407715, "global_step": 121439, "epoch": 1463} {"train_loss": -22.656633377075195, "global_step": 121440, "epoch": 1463} {"train_loss": -22.528223037719727, "global_step": 121441, "epoch": 1463} {"train_loss": -22.446353912353516, "global_step": 121442, "epoch": 1463} {"train_loss": -22.24945640563965, "global_step": 121443, "epoch": 1463} {"train_loss": -22.539968490600586, "global_step": 121444, "epoch": 1463} {"train_loss": -22.215131759643555, "global_step": 121445, "epoch": 1463} {"train_loss": -22.517202377319336, "global_step": 121446, "epoch": 1463} {"train_loss": -22.5262451171875, "global_step": 121447, "epoch": 1463} {"train_loss": -22.503175735473633, "global_step": 121448, "epoch": 1463} {"train_loss": -22.64451026916504, "global_step": 121449, "epoch": 1463} {"train_loss": -22.186796188354492, "global_step": 121450, "epoch": 1463} {"train_loss": -22.450551986694336, "global_step": 121451, "epoch": 1463} {"train_loss": -22.31918716430664, "global_step": 121452, "epoch": 1463} {"train_loss": -22.422725677490234, "global_step": 121453, "epoch": 1463} {"train_loss": -22.809457778930664, "global_step": 121454, "epoch": 1463} {"train_loss": -22.54816246032715, "global_step": 121455, "epoch": 1463} {"train_loss": -22.478761672973633, "global_step": 121456, "epoch": 1463} {"train_loss": -22.314443588256836, "global_step": 121457, "epoch": 1463} {"train_loss": -22.686229705810547, "global_step": 121458, "epoch": 1463} {"train_loss": -22.51218605041504, "global_step": 121459, "epoch": 1463} {"train_loss": -22.64411735534668, "global_step": 121460, "epoch": 1463} {"train_loss": -22.775339126586914, "global_step": 121461, "epoch": 1463} {"train_loss": -22.52071189880371, "global_step": 121462, "epoch": 1463} {"train_loss": -22.566686630249023, "global_step": 121463, "epoch": 1463} {"train_loss": -22.507028579711914, "global_step": 121464, "epoch": 1463} {"train_loss": -22.829322814941406, "global_step": 121465, "epoch": 1463} {"train_loss": -22.742551803588867, "global_step": 121466, "epoch": 1463} {"train_loss": -22.563739776611328, "global_step": 121467, "epoch": 1463} {"train_loss": -22.540115356445312, "global_step": 121468, "epoch": 1463} {"train_loss": -22.44093894958496, "global_step": 121469, "epoch": 1463} {"train_loss": -22.90363883972168, "global_step": 121470, "epoch": 1463} {"train_loss": -22.705780029296875, "global_step": 121471, "epoch": 1463} {"train_loss": -22.815404891967773, "global_step": 121472, "epoch": 1463} {"train_loss": -22.548677444458008, "global_step": 121473, "epoch": 1463} {"train_loss": -22.902591705322266, "global_step": 121474, "epoch": 1463} {"train_loss": -22.508167266845703, "global_step": 121475, "epoch": 1463} {"train_loss": -22.793180465698242, "global_step": 121476, "epoch": 1463} {"train_loss": -22.47586441040039, "global_step": 121477, "epoch": 1463} {"train_loss": -23.087831497192383, "global_step": 121478, "epoch": 1463} {"train_loss": -22.633955001831055, "global_step": 121479, "epoch": 1463} {"train_loss": -22.902494430541992, "global_step": 121480, "epoch": 1463} {"train_loss": -22.662357330322266, "global_step": 121481, "epoch": 1463} {"train_loss": -22.90851593017578, "global_step": 121482, "epoch": 1463} {"train_loss": -22.672033309936523, "global_step": 121483, "epoch": 1463} {"train_loss": -22.24397087097168, "global_step": 121484, "epoch": 1463} {"train_loss": -22.300098419189453, "global_step": 121485, "epoch": 1463} {"train_loss": -22.65060806274414, "global_step": 121486, "epoch": 1463} {"train_loss": -22.627599716186523, "global_step": 121487, "epoch": 1463} {"train_loss": -22.96793556213379, "global_step": 121488, "epoch": 1463} {"train_loss": -22.39328384399414, "global_step": 121489, "epoch": 1463} {"train_loss": -23.171350479125977, "global_step": 121490, "epoch": 1463} {"train_loss": -22.472333908081055, "global_step": 121491, "epoch": 1463} {"train_loss": -22.54959487915039, "global_step": 121492, "epoch": 1463} {"train_loss": -22.484195709228516, "global_step": 121493, "epoch": 1463} {"train_loss": -22.533100128173828, "global_step": 121494, "epoch": 1463} {"train_loss": -22.665145874023438, "global_step": 121495, "epoch": 1463} {"train_loss": -22.660873413085938, "global_step": 121496, "epoch": 1463} {"train_loss": -22.470022201538086, "global_step": 121497, "epoch": 1463} {"train_loss": -22.55173683166504, "global_step": 121498, "epoch": 1463} {"train_loss": -22.82330894470215, "global_step": 121499, "epoch": 1463} {"train_loss": -22.93001937866211, "global_step": 121500, "epoch": 1463} {"train_loss": -22.341468811035156, "global_step": 121501, "epoch": 1463} {"train_loss": -22.207014083862305, "global_step": 121502, "epoch": 1463} {"train_loss": -22.284744262695312, "global_step": 121503, "epoch": 1463} {"train_loss": -22.895645141601562, "global_step": 121504, "epoch": 1463} {"train_loss": -22.747400283813477, "global_step": 121505, "epoch": 1463} {"train_loss": -22.060346603393555, "global_step": 121506, "epoch": 1463} {"train_loss": -22.542808532714844, "global_step": 121507, "epoch": 1463} {"train_loss": -22.454404830932617, "global_step": 121508, "epoch": 1463} {"train_loss": -22.065053939819336, "global_step": 121509, "epoch": 1463} {"train_loss": -22.466154098510742, "global_step": 121510, "epoch": 1463} {"train_loss": -22.502479438322137, "global_step": 121511, "epoch": 1463, "val_loss": 6120452.0} {"train_loss": -21.839187622070312, "global_step": 121512, "epoch": 1464} {"train_loss": -22.022794723510742, "global_step": 121513, "epoch": 1464} {"train_loss": -22.303630828857422, "global_step": 121514, "epoch": 1464} {"train_loss": -21.8940486907959, "global_step": 121515, "epoch": 1464} {"train_loss": -22.04129409790039, "global_step": 121516, "epoch": 1464} {"train_loss": -22.46927833557129, "global_step": 121517, "epoch": 1464} {"train_loss": -22.26603126525879, "global_step": 121518, "epoch": 1464} {"train_loss": -22.330459594726562, "global_step": 121519, "epoch": 1464} {"train_loss": -22.141386032104492, "global_step": 121520, "epoch": 1464} {"train_loss": -22.43183708190918, "global_step": 121521, "epoch": 1464} {"train_loss": -22.675085067749023, "global_step": 121522, "epoch": 1464} {"train_loss": -22.584638595581055, "global_step": 121523, "epoch": 1464} {"train_loss": -22.844783782958984, "global_step": 121524, "epoch": 1464} {"train_loss": -22.529359817504883, "global_step": 121525, "epoch": 1464} {"train_loss": -22.0, "global_step": 121526, "epoch": 1464} {"train_loss": -22.448659896850586, "global_step": 121527, "epoch": 1464} {"train_loss": -22.335582733154297, "global_step": 121528, "epoch": 1464} {"train_loss": -22.119434356689453, "global_step": 121529, "epoch": 1464} {"train_loss": -22.434307098388672, "global_step": 121530, "epoch": 1464} {"train_loss": -22.850830078125, "global_step": 121531, "epoch": 1464} {"train_loss": -22.567609786987305, "global_step": 121532, "epoch": 1464} {"train_loss": -22.145954132080078, "global_step": 121533, "epoch": 1464} {"train_loss": -22.923450469970703, "global_step": 121534, "epoch": 1464} {"train_loss": -22.606901168823242, "global_step": 121535, "epoch": 1464} {"train_loss": -22.6866512298584, "global_step": 121536, "epoch": 1464} {"train_loss": -22.671560287475586, "global_step": 121537, "epoch": 1464} {"train_loss": -22.57520866394043, "global_step": 121538, "epoch": 1464} {"train_loss": -22.849199295043945, "global_step": 121539, "epoch": 1464} {"train_loss": -22.708402633666992, "global_step": 121540, "epoch": 1464} {"train_loss": -22.386112213134766, "global_step": 121541, "epoch": 1464} {"train_loss": -22.380752563476562, "global_step": 121542, "epoch": 1464} {"train_loss": -22.791345596313477, "global_step": 121543, "epoch": 1464} {"train_loss": -22.606046676635742, "global_step": 121544, "epoch": 1464} {"train_loss": -22.470903396606445, "global_step": 121545, "epoch": 1464} {"train_loss": -22.6782283782959, "global_step": 121546, "epoch": 1464} {"train_loss": -22.746036529541016, "global_step": 121547, "epoch": 1464} {"train_loss": -22.776723861694336, "global_step": 121548, "epoch": 1464} {"train_loss": -22.168994903564453, "global_step": 121549, "epoch": 1464} {"train_loss": -22.30593490600586, "global_step": 121550, "epoch": 1464} {"train_loss": -22.632566452026367, "global_step": 121551, "epoch": 1464} {"train_loss": -22.78952407836914, "global_step": 121552, "epoch": 1464} {"train_loss": -22.441102981567383, "global_step": 121553, "epoch": 1464} {"train_loss": -22.46571159362793, "global_step": 121554, "epoch": 1464} {"train_loss": -22.42386817932129, "global_step": 121555, "epoch": 1464} {"train_loss": -22.537574768066406, "global_step": 121556, "epoch": 1464} {"train_loss": -22.479915618896484, "global_step": 121557, "epoch": 1464} {"train_loss": -22.21485710144043, "global_step": 121558, "epoch": 1464} {"train_loss": -22.395885467529297, "global_step": 121559, "epoch": 1464} {"train_loss": -21.901817321777344, "global_step": 121560, "epoch": 1464} {"train_loss": -22.49938201904297, "global_step": 121561, "epoch": 1464} {"train_loss": -22.354496002197266, "global_step": 121562, "epoch": 1464} {"train_loss": -22.226987838745117, "global_step": 121563, "epoch": 1464} {"train_loss": -22.770170211791992, "global_step": 121564, "epoch": 1464} {"train_loss": -22.305158615112305, "global_step": 121565, "epoch": 1464} {"train_loss": -22.476573944091797, "global_step": 121566, "epoch": 1464} {"train_loss": -22.372791290283203, "global_step": 121567, "epoch": 1464} {"train_loss": -22.0959529876709, "global_step": 121568, "epoch": 1464} {"train_loss": -22.314523696899414, "global_step": 121569, "epoch": 1464} {"train_loss": -22.238590240478516, "global_step": 121570, "epoch": 1464} {"train_loss": -22.485885620117188, "global_step": 121571, "epoch": 1464} {"train_loss": -22.45648765563965, "global_step": 121572, "epoch": 1464} {"train_loss": -22.850996017456055, "global_step": 121573, "epoch": 1464} {"train_loss": -22.566055297851562, "global_step": 121574, "epoch": 1464} {"train_loss": -22.63356590270996, "global_step": 121575, "epoch": 1464} {"train_loss": -22.674360275268555, "global_step": 121576, "epoch": 1464} {"train_loss": -22.246967315673828, "global_step": 121577, "epoch": 1464} {"train_loss": -22.757905960083008, "global_step": 121578, "epoch": 1464} {"train_loss": -22.813236236572266, "global_step": 121579, "epoch": 1464} {"train_loss": -22.51704216003418, "global_step": 121580, "epoch": 1464} {"train_loss": -22.657194137573242, "global_step": 121581, "epoch": 1464} {"train_loss": -22.60569190979004, "global_step": 121582, "epoch": 1464} {"train_loss": -22.332178115844727, "global_step": 121583, "epoch": 1464} {"train_loss": -22.124418258666992, "global_step": 121584, "epoch": 1464} {"train_loss": -22.959232330322266, "global_step": 121585, "epoch": 1464} {"train_loss": -22.824270248413086, "global_step": 121586, "epoch": 1464} {"train_loss": -22.888643264770508, "global_step": 121587, "epoch": 1464} {"train_loss": -22.882532119750977, "global_step": 121588, "epoch": 1464} {"train_loss": -22.695646286010742, "global_step": 121589, "epoch": 1464} {"train_loss": -22.983911514282227, "global_step": 121590, "epoch": 1464} {"train_loss": -22.51063346862793, "global_step": 121591, "epoch": 1464} {"train_loss": -22.193098068237305, "global_step": 121592, "epoch": 1464} {"train_loss": -22.5266056060791, "global_step": 121593, "epoch": 1464} {"train_loss": -22.489014682999578, "global_step": 121594, "epoch": 1464, "val_loss": 6285292.5} {"train_loss": -22.333234786987305, "global_step": 121595, "epoch": 1465} {"train_loss": -22.61829376220703, "global_step": 121596, "epoch": 1465} {"train_loss": -22.255250930786133, "global_step": 121597, "epoch": 1465} {"train_loss": -22.18179702758789, "global_step": 121598, "epoch": 1465} {"train_loss": -22.713258743286133, "global_step": 121599, "epoch": 1465} {"train_loss": -22.917068481445312, "global_step": 121600, "epoch": 1465} {"train_loss": -22.779773712158203, "global_step": 121601, "epoch": 1465} {"train_loss": -22.3470458984375, "global_step": 121602, "epoch": 1465} {"train_loss": -22.369352340698242, "global_step": 121603, "epoch": 1465} {"train_loss": -22.827884674072266, "global_step": 121604, "epoch": 1465} {"train_loss": -22.458799362182617, "global_step": 121605, "epoch": 1465} {"train_loss": -22.389802932739258, "global_step": 121606, "epoch": 1465} {"train_loss": -22.477218627929688, "global_step": 121607, "epoch": 1465} {"train_loss": -22.456579208374023, "global_step": 121608, "epoch": 1465} {"train_loss": -22.497848510742188, "global_step": 121609, "epoch": 1465} {"train_loss": -22.760717391967773, "global_step": 121610, "epoch": 1465} {"train_loss": -22.48879051208496, "global_step": 121611, "epoch": 1465} {"train_loss": -22.60738182067871, "global_step": 121612, "epoch": 1465} {"train_loss": -22.940393447875977, "global_step": 121613, "epoch": 1465} {"train_loss": -22.629575729370117, "global_step": 121614, "epoch": 1465} {"train_loss": -22.175628662109375, "global_step": 121615, "epoch": 1465} {"train_loss": -22.512754440307617, "global_step": 121616, "epoch": 1465} {"train_loss": -22.682876586914062, "global_step": 121617, "epoch": 1465} {"train_loss": -22.54534149169922, "global_step": 121618, "epoch": 1465} {"train_loss": -22.57382583618164, "global_step": 121619, "epoch": 1465} {"train_loss": -22.340890884399414, "global_step": 121620, "epoch": 1465} {"train_loss": -22.61079978942871, "global_step": 121621, "epoch": 1465} {"train_loss": -22.68641471862793, "global_step": 121622, "epoch": 1465} {"train_loss": -22.54389762878418, "global_step": 121623, "epoch": 1465} {"train_loss": -22.665664672851562, "global_step": 121624, "epoch": 1465} {"train_loss": -23.027490615844727, "global_step": 121625, "epoch": 1465} {"train_loss": -22.320985794067383, "global_step": 121626, "epoch": 1465} {"train_loss": -22.62376594543457, "global_step": 121627, "epoch": 1465} {"train_loss": -22.736265182495117, "global_step": 121628, "epoch": 1465} {"train_loss": -22.47887420654297, "global_step": 121629, "epoch": 1465} {"train_loss": -22.56589698791504, "global_step": 121630, "epoch": 1465} {"train_loss": -22.370153427124023, "global_step": 121631, "epoch": 1465} {"train_loss": -22.234357833862305, "global_step": 121632, "epoch": 1465} {"train_loss": -22.388273239135742, "global_step": 121633, "epoch": 1465} {"train_loss": -22.584762573242188, "global_step": 121634, "epoch": 1465} {"train_loss": -22.497283935546875, "global_step": 121635, "epoch": 1465} {"train_loss": -22.610929489135742, "global_step": 121636, "epoch": 1465} {"train_loss": -22.413679122924805, "global_step": 121637, "epoch": 1465} {"train_loss": -22.535415649414062, "global_step": 121638, "epoch": 1465} {"train_loss": -22.775510787963867, "global_step": 121639, "epoch": 1465} {"train_loss": -22.486618041992188, "global_step": 121640, "epoch": 1465} {"train_loss": -22.83066749572754, "global_step": 121641, "epoch": 1465} {"train_loss": -22.42305564880371, "global_step": 121642, "epoch": 1465} {"train_loss": -22.24188804626465, "global_step": 121643, "epoch": 1465} {"train_loss": -22.51445960998535, "global_step": 121644, "epoch": 1465} {"train_loss": -22.739225387573242, "global_step": 121645, "epoch": 1465} {"train_loss": -22.542186737060547, "global_step": 121646, "epoch": 1465} {"train_loss": -22.722187042236328, "global_step": 121647, "epoch": 1465} {"train_loss": -22.82188606262207, "global_step": 121648, "epoch": 1465} {"train_loss": -22.445999145507812, "global_step": 121649, "epoch": 1465} {"train_loss": -22.765302658081055, "global_step": 121650, "epoch": 1465} {"train_loss": -22.580963134765625, "global_step": 121651, "epoch": 1465} {"train_loss": -22.293180465698242, "global_step": 121652, "epoch": 1465} {"train_loss": -22.728750228881836, "global_step": 121653, "epoch": 1465} {"train_loss": -22.368032455444336, "global_step": 121654, "epoch": 1465} {"train_loss": -22.654191970825195, "global_step": 121655, "epoch": 1465} {"train_loss": -22.443235397338867, "global_step": 121656, "epoch": 1465} {"train_loss": -22.646883010864258, "global_step": 121657, "epoch": 1465} {"train_loss": -22.57705307006836, "global_step": 121658, "epoch": 1465} {"train_loss": -22.75580406188965, "global_step": 121659, "epoch": 1465} {"train_loss": -22.22795295715332, "global_step": 121660, "epoch": 1465} {"train_loss": -22.693668365478516, "global_step": 121661, "epoch": 1465} {"train_loss": -21.939102172851562, "global_step": 121662, "epoch": 1465} {"train_loss": -22.609493255615234, "global_step": 121663, "epoch": 1465} {"train_loss": -22.543275833129883, "global_step": 121664, "epoch": 1465} {"train_loss": -22.80750846862793, "global_step": 121665, "epoch": 1465} {"train_loss": -22.498088836669922, "global_step": 121666, "epoch": 1465} {"train_loss": -22.69076919555664, "global_step": 121667, "epoch": 1465} {"train_loss": -22.991910934448242, "global_step": 121668, "epoch": 1465} {"train_loss": -22.33742332458496, "global_step": 121669, "epoch": 1465} {"train_loss": -22.641691207885742, "global_step": 121670, "epoch": 1465} {"train_loss": -22.48099136352539, "global_step": 121671, "epoch": 1465} {"train_loss": -22.58833885192871, "global_step": 121672, "epoch": 1465} {"train_loss": -22.243295669555664, "global_step": 121673, "epoch": 1465} {"train_loss": -22.64307975769043, "global_step": 121674, "epoch": 1465} {"train_loss": -22.58765983581543, "global_step": 121675, "epoch": 1465} {"train_loss": -22.15907859802246, "global_step": 121676, "epoch": 1465} {"train_loss": -22.5516191275723, "global_step": 121677, "epoch": 1465, "val_loss": 6373300.0} {"train_loss": -22.415687561035156, "global_step": 121678, "epoch": 1466} {"train_loss": -21.83869171142578, "global_step": 121679, "epoch": 1466} {"train_loss": -22.19025993347168, "global_step": 121680, "epoch": 1466} {"train_loss": -22.68035316467285, "global_step": 121681, "epoch": 1466} {"train_loss": -22.20790672302246, "global_step": 121682, "epoch": 1466} {"train_loss": -22.560739517211914, "global_step": 121683, "epoch": 1466} {"train_loss": -22.379133224487305, "global_step": 121684, "epoch": 1466} {"train_loss": -22.276771545410156, "global_step": 121685, "epoch": 1466} {"train_loss": -22.502906799316406, "global_step": 121686, "epoch": 1466} {"train_loss": -22.148427963256836, "global_step": 121687, "epoch": 1466} {"train_loss": -22.480894088745117, "global_step": 121688, "epoch": 1466} {"train_loss": -22.335947036743164, "global_step": 121689, "epoch": 1466} {"train_loss": -22.363750457763672, "global_step": 121690, "epoch": 1466} {"train_loss": -22.265783309936523, "global_step": 121691, "epoch": 1466} {"train_loss": -22.731977462768555, "global_step": 121692, "epoch": 1466} {"train_loss": -22.6524600982666, "global_step": 121693, "epoch": 1466} {"train_loss": -22.52042579650879, "global_step": 121694, "epoch": 1466} {"train_loss": -22.124547958374023, "global_step": 121695, "epoch": 1466} {"train_loss": -22.209287643432617, "global_step": 121696, "epoch": 1466} {"train_loss": -22.565420150756836, "global_step": 121697, "epoch": 1466} {"train_loss": -22.163908004760742, "global_step": 121698, "epoch": 1466} {"train_loss": -22.4843807220459, "global_step": 121699, "epoch": 1466} {"train_loss": -22.712759017944336, "global_step": 121700, "epoch": 1466} {"train_loss": -22.784534454345703, "global_step": 121701, "epoch": 1466} {"train_loss": -22.386159896850586, "global_step": 121702, "epoch": 1466} {"train_loss": -22.709671020507812, "global_step": 121703, "epoch": 1466} {"train_loss": -22.17312240600586, "global_step": 121704, "epoch": 1466} {"train_loss": -22.926050186157227, "global_step": 121705, "epoch": 1466} {"train_loss": -22.40150260925293, "global_step": 121706, "epoch": 1466} {"train_loss": -22.4772891998291, "global_step": 121707, "epoch": 1466} {"train_loss": -22.580673217773438, "global_step": 121708, "epoch": 1466} {"train_loss": -22.479581832885742, "global_step": 121709, "epoch": 1466} {"train_loss": -22.764341354370117, "global_step": 121710, "epoch": 1466} {"train_loss": -22.67982292175293, "global_step": 121711, "epoch": 1466} {"train_loss": -22.338743209838867, "global_step": 121712, "epoch": 1466} {"train_loss": -22.25796890258789, "global_step": 121713, "epoch": 1466} {"train_loss": -22.68410301208496, "global_step": 121714, "epoch": 1466} {"train_loss": -22.211181640625, "global_step": 121715, "epoch": 1466} {"train_loss": -22.39102554321289, "global_step": 121716, "epoch": 1466} {"train_loss": -22.35576057434082, "global_step": 121717, "epoch": 1466} {"train_loss": -22.632734298706055, "global_step": 121718, "epoch": 1466} {"train_loss": -22.768970489501953, "global_step": 121719, "epoch": 1466} {"train_loss": -22.326671600341797, "global_step": 121720, "epoch": 1466} {"train_loss": -22.726308822631836, "global_step": 121721, "epoch": 1466} {"train_loss": -22.658681869506836, "global_step": 121722, "epoch": 1466} {"train_loss": -22.894235610961914, "global_step": 121723, "epoch": 1466} {"train_loss": -22.953948974609375, "global_step": 121724, "epoch": 1466} {"train_loss": -22.713043212890625, "global_step": 121725, "epoch": 1466} {"train_loss": -22.715078353881836, "global_step": 121726, "epoch": 1466} {"train_loss": -22.978303909301758, "global_step": 121727, "epoch": 1466} {"train_loss": -22.24714469909668, "global_step": 121728, "epoch": 1466} {"train_loss": -21.88214683532715, "global_step": 121729, "epoch": 1466} {"train_loss": -22.00539207458496, "global_step": 121730, "epoch": 1466} {"train_loss": -22.554956436157227, "global_step": 121731, "epoch": 1466} {"train_loss": -22.548233032226562, "global_step": 121732, "epoch": 1466} {"train_loss": -22.237268447875977, "global_step": 121733, "epoch": 1466} {"train_loss": -22.50806999206543, "global_step": 121734, "epoch": 1466} {"train_loss": -22.50469970703125, "global_step": 121735, "epoch": 1466} {"train_loss": -22.057113647460938, "global_step": 121736, "epoch": 1466} {"train_loss": -22.31584930419922, "global_step": 121737, "epoch": 1466} {"train_loss": -22.5081729888916, "global_step": 121738, "epoch": 1466} {"train_loss": -22.480777740478516, "global_step": 121739, "epoch": 1466} {"train_loss": -22.47772789001465, "global_step": 121740, "epoch": 1466} {"train_loss": -22.713088989257812, "global_step": 121741, "epoch": 1466} {"train_loss": -22.352224349975586, "global_step": 121742, "epoch": 1466} {"train_loss": -22.479219436645508, "global_step": 121743, "epoch": 1466} {"train_loss": -22.484378814697266, "global_step": 121744, "epoch": 1466} {"train_loss": -22.390859603881836, "global_step": 121745, "epoch": 1466} {"train_loss": -22.46893882751465, "global_step": 121746, "epoch": 1466} {"train_loss": -22.1617374420166, "global_step": 121747, "epoch": 1466} {"train_loss": -22.561176300048828, "global_step": 121748, "epoch": 1466} {"train_loss": -22.79096794128418, "global_step": 121749, "epoch": 1466} {"train_loss": -22.525402069091797, "global_step": 121750, "epoch": 1466} {"train_loss": -22.490497589111328, "global_step": 121751, "epoch": 1466} {"train_loss": -22.686298370361328, "global_step": 121752, "epoch": 1466} {"train_loss": -22.725187301635742, "global_step": 121753, "epoch": 1466} {"train_loss": -22.80732536315918, "global_step": 121754, "epoch": 1466} {"train_loss": -22.52414321899414, "global_step": 121755, "epoch": 1466} {"train_loss": -22.587324142456055, "global_step": 121756, "epoch": 1466} {"train_loss": -22.44799041748047, "global_step": 121757, "epoch": 1466} {"train_loss": -22.40265464782715, "global_step": 121758, "epoch": 1466} {"train_loss": -22.80656623840332, "global_step": 121759, "epoch": 1466} {"train_loss": -22.51160957152585, "global_step": 121760, "epoch": 1466, "val_loss": 6346230.0} {"train_loss": -22.27938461303711, "global_step": 121761, "epoch": 1467} {"train_loss": -22.109283447265625, "global_step": 121762, "epoch": 1467} {"train_loss": -22.305187225341797, "global_step": 121763, "epoch": 1467} {"train_loss": -22.303720474243164, "global_step": 121764, "epoch": 1467} {"train_loss": -22.247650146484375, "global_step": 121765, "epoch": 1467} {"train_loss": -22.253334045410156, "global_step": 121766, "epoch": 1467} {"train_loss": -22.182863235473633, "global_step": 121767, "epoch": 1467} {"train_loss": -22.458816528320312, "global_step": 121768, "epoch": 1467} {"train_loss": -22.06412124633789, "global_step": 121769, "epoch": 1467} {"train_loss": -22.53643798828125, "global_step": 121770, "epoch": 1467} {"train_loss": -22.176605224609375, "global_step": 121771, "epoch": 1467} {"train_loss": -22.532373428344727, "global_step": 121772, "epoch": 1467} {"train_loss": -22.532365798950195, "global_step": 121773, "epoch": 1467} {"train_loss": -22.474878311157227, "global_step": 121774, "epoch": 1467} {"train_loss": -22.03973388671875, "global_step": 121775, "epoch": 1467} {"train_loss": -22.52298927307129, "global_step": 121776, "epoch": 1467} {"train_loss": -22.187850952148438, "global_step": 121777, "epoch": 1467} {"train_loss": -22.383195877075195, "global_step": 121778, "epoch": 1467} {"train_loss": -22.67915153503418, "global_step": 121779, "epoch": 1467} {"train_loss": -22.306262969970703, "global_step": 121780, "epoch": 1467} {"train_loss": -22.921878814697266, "global_step": 121781, "epoch": 1467} {"train_loss": -22.671463012695312, "global_step": 121782, "epoch": 1467} {"train_loss": -22.55704689025879, "global_step": 121783, "epoch": 1467} {"train_loss": -22.293399810791016, "global_step": 121784, "epoch": 1467} {"train_loss": -22.799924850463867, "global_step": 121785, "epoch": 1467} {"train_loss": -22.80377769470215, "global_step": 121786, "epoch": 1467} {"train_loss": -22.594772338867188, "global_step": 121787, "epoch": 1467} {"train_loss": -22.538129806518555, "global_step": 121788, "epoch": 1467} {"train_loss": -22.645370483398438, "global_step": 121789, "epoch": 1467} {"train_loss": -22.584171295166016, "global_step": 121790, "epoch": 1467} {"train_loss": -22.786088943481445, "global_step": 121791, "epoch": 1467} {"train_loss": -22.939205169677734, "global_step": 121792, "epoch": 1467} {"train_loss": -22.35115623474121, "global_step": 121793, "epoch": 1467} {"train_loss": -23.021411895751953, "global_step": 121794, "epoch": 1467} {"train_loss": -22.5917911529541, "global_step": 121795, "epoch": 1467} {"train_loss": -22.585622787475586, "global_step": 121796, "epoch": 1467} {"train_loss": -22.59748649597168, "global_step": 121797, "epoch": 1467} {"train_loss": -22.533010482788086, "global_step": 121798, "epoch": 1467} {"train_loss": -22.40273094177246, "global_step": 121799, "epoch": 1467} {"train_loss": -22.779020309448242, "global_step": 121800, "epoch": 1467} {"train_loss": -23.052331924438477, "global_step": 121801, "epoch": 1467} {"train_loss": -22.416208267211914, "global_step": 121802, "epoch": 1467} {"train_loss": -22.459522247314453, "global_step": 121803, "epoch": 1467} {"train_loss": -22.829158782958984, "global_step": 121804, "epoch": 1467} {"train_loss": -22.639150619506836, "global_step": 121805, "epoch": 1467} {"train_loss": -22.172805786132812, "global_step": 121806, "epoch": 1467} {"train_loss": -22.43345069885254, "global_step": 121807, "epoch": 1467} {"train_loss": -22.20740509033203, "global_step": 121808, "epoch": 1467} {"train_loss": -21.995548248291016, "global_step": 121809, "epoch": 1467} {"train_loss": -22.448881149291992, "global_step": 121810, "epoch": 1467} {"train_loss": -22.664093017578125, "global_step": 121811, "epoch": 1467} {"train_loss": -22.369749069213867, "global_step": 121812, "epoch": 1467} {"train_loss": -22.649206161499023, "global_step": 121813, "epoch": 1467} {"train_loss": -22.86200714111328, "global_step": 121814, "epoch": 1467} {"train_loss": -22.25309181213379, "global_step": 121815, "epoch": 1467} {"train_loss": -22.945499420166016, "global_step": 121816, "epoch": 1467} {"train_loss": -22.7206974029541, "global_step": 121817, "epoch": 1467} {"train_loss": -22.75922203063965, "global_step": 121818, "epoch": 1467} {"train_loss": -22.287582397460938, "global_step": 121819, "epoch": 1467} {"train_loss": -22.650676727294922, "global_step": 121820, "epoch": 1467} {"train_loss": -22.68459129333496, "global_step": 121821, "epoch": 1467} {"train_loss": -23.13528060913086, "global_step": 121822, "epoch": 1467} {"train_loss": -22.627370834350586, "global_step": 121823, "epoch": 1467} {"train_loss": -22.86913299560547, "global_step": 121824, "epoch": 1467} {"train_loss": -22.728403091430664, "global_step": 121825, "epoch": 1467} {"train_loss": -22.230117797851562, "global_step": 121826, "epoch": 1467} {"train_loss": -22.869796752929688, "global_step": 121827, "epoch": 1467} {"train_loss": -22.56925392150879, "global_step": 121828, "epoch": 1467} {"train_loss": -22.40968132019043, "global_step": 121829, "epoch": 1467} {"train_loss": -22.70746612548828, "global_step": 121830, "epoch": 1467} {"train_loss": -22.9051456451416, "global_step": 121831, "epoch": 1467} {"train_loss": -22.656919479370117, "global_step": 121832, "epoch": 1467} {"train_loss": -22.6640625, "global_step": 121833, "epoch": 1467} {"train_loss": -22.944486618041992, "global_step": 121834, "epoch": 1467} {"train_loss": -22.537017822265625, "global_step": 121835, "epoch": 1467} {"train_loss": -22.457218170166016, "global_step": 121836, "epoch": 1467} {"train_loss": -22.569372177124023, "global_step": 121837, "epoch": 1467} {"train_loss": -22.681259155273438, "global_step": 121838, "epoch": 1467} {"train_loss": -22.615079879760742, "global_step": 121839, "epoch": 1467} {"train_loss": -22.877521514892578, "global_step": 121840, "epoch": 1467} {"train_loss": -23.027875900268555, "global_step": 121841, "epoch": 1467} {"train_loss": -22.40818214416504, "global_step": 121842, "epoch": 1467} {"train_loss": -22.55636422030897, "global_step": 121843, "epoch": 1467, "val_loss": 6300274.0} {"train_loss": -22.318330764770508, "global_step": 121844, "epoch": 1468} {"train_loss": -22.653661727905273, "global_step": 121845, "epoch": 1468} {"train_loss": -22.441375732421875, "global_step": 121846, "epoch": 1468} {"train_loss": -22.292694091796875, "global_step": 121847, "epoch": 1468} {"train_loss": -22.462064743041992, "global_step": 121848, "epoch": 1468} {"train_loss": -22.3609676361084, "global_step": 121849, "epoch": 1468} {"train_loss": -22.166458129882812, "global_step": 121850, "epoch": 1468} {"train_loss": -22.612319946289062, "global_step": 121851, "epoch": 1468} {"train_loss": -22.283082962036133, "global_step": 121852, "epoch": 1468} {"train_loss": -22.44466209411621, "global_step": 121853, "epoch": 1468} {"train_loss": -22.807355880737305, "global_step": 121854, "epoch": 1468} {"train_loss": -22.56566047668457, "global_step": 121855, "epoch": 1468} {"train_loss": -22.385263442993164, "global_step": 121856, "epoch": 1468} {"train_loss": -22.568483352661133, "global_step": 121857, "epoch": 1468} {"train_loss": -22.75664520263672, "global_step": 121858, "epoch": 1468} {"train_loss": -22.3382511138916, "global_step": 121859, "epoch": 1468} {"train_loss": -22.37409019470215, "global_step": 121860, "epoch": 1468} {"train_loss": -22.873737335205078, "global_step": 121861, "epoch": 1468} {"train_loss": -22.750211715698242, "global_step": 121862, "epoch": 1468} {"train_loss": -22.52716636657715, "global_step": 121863, "epoch": 1468} {"train_loss": -22.703857421875, "global_step": 121864, "epoch": 1468} {"train_loss": -22.42483901977539, "global_step": 121865, "epoch": 1468} {"train_loss": -22.534093856811523, "global_step": 121866, "epoch": 1468} {"train_loss": -22.66892433166504, "global_step": 121867, "epoch": 1468} {"train_loss": -22.23883056640625, "global_step": 121868, "epoch": 1468} {"train_loss": -22.528650283813477, "global_step": 121869, "epoch": 1468} {"train_loss": -22.64455223083496, "global_step": 121870, "epoch": 1468} {"train_loss": -22.38520622253418, "global_step": 121871, "epoch": 1468} {"train_loss": -22.466064453125, "global_step": 121872, "epoch": 1468} {"train_loss": -22.699594497680664, "global_step": 121873, "epoch": 1468} {"train_loss": -23.098405838012695, "global_step": 121874, "epoch": 1468} {"train_loss": -22.35040855407715, "global_step": 121875, "epoch": 1468} {"train_loss": -22.194608688354492, "global_step": 121876, "epoch": 1468} {"train_loss": -22.06892967224121, "global_step": 121877, "epoch": 1468} {"train_loss": -22.656219482421875, "global_step": 121878, "epoch": 1468} {"train_loss": -22.683090209960938, "global_step": 121879, "epoch": 1468} {"train_loss": -22.693546295166016, "global_step": 121880, "epoch": 1468} {"train_loss": -22.656585693359375, "global_step": 121881, "epoch": 1468} {"train_loss": -22.706289291381836, "global_step": 121882, "epoch": 1468} {"train_loss": -22.6322021484375, "global_step": 121883, "epoch": 1468} {"train_loss": -22.16152000427246, "global_step": 121884, "epoch": 1468} {"train_loss": -22.41346549987793, "global_step": 121885, "epoch": 1468} {"train_loss": -22.36368751525879, "global_step": 121886, "epoch": 1468} {"train_loss": -22.487689971923828, "global_step": 121887, "epoch": 1468} {"train_loss": -22.48150634765625, "global_step": 121888, "epoch": 1468} {"train_loss": -22.644193649291992, "global_step": 121889, "epoch": 1468} {"train_loss": -22.62295150756836, "global_step": 121890, "epoch": 1468} {"train_loss": -22.539812088012695, "global_step": 121891, "epoch": 1468} {"train_loss": -22.508623123168945, "global_step": 121892, "epoch": 1468} {"train_loss": -22.976863861083984, "global_step": 121893, "epoch": 1468} {"train_loss": -22.56667137145996, "global_step": 121894, "epoch": 1468} {"train_loss": -22.602102279663086, "global_step": 121895, "epoch": 1468} {"train_loss": -22.918432235717773, "global_step": 121896, "epoch": 1468} {"train_loss": -22.280080795288086, "global_step": 121897, "epoch": 1468} {"train_loss": -22.684741973876953, "global_step": 121898, "epoch": 1468} {"train_loss": -22.582571029663086, "global_step": 121899, "epoch": 1468} {"train_loss": -22.89879608154297, "global_step": 121900, "epoch": 1468} {"train_loss": -22.23661231994629, "global_step": 121901, "epoch": 1468} {"train_loss": -22.45107078552246, "global_step": 121902, "epoch": 1468} {"train_loss": -22.301498413085938, "global_step": 121903, "epoch": 1468} {"train_loss": -22.103591918945312, "global_step": 121904, "epoch": 1468} {"train_loss": -22.806425094604492, "global_step": 121905, "epoch": 1468} {"train_loss": -22.710702896118164, "global_step": 121906, "epoch": 1468} {"train_loss": -22.54660987854004, "global_step": 121907, "epoch": 1468} {"train_loss": -22.70636558532715, "global_step": 121908, "epoch": 1468} {"train_loss": -22.638687133789062, "global_step": 121909, "epoch": 1468} {"train_loss": -22.583677291870117, "global_step": 121910, "epoch": 1468} {"train_loss": -22.81348991394043, "global_step": 121911, "epoch": 1468} {"train_loss": -22.799013137817383, "global_step": 121912, "epoch": 1468} {"train_loss": -23.036163330078125, "global_step": 121913, "epoch": 1468} {"train_loss": -22.529834747314453, "global_step": 121914, "epoch": 1468} {"train_loss": -23.02281951904297, "global_step": 121915, "epoch": 1468} {"train_loss": -22.452648162841797, "global_step": 121916, "epoch": 1468} {"train_loss": -22.649063110351562, "global_step": 121917, "epoch": 1468} {"train_loss": -22.40794563293457, "global_step": 121918, "epoch": 1468} {"train_loss": -22.726104736328125, "global_step": 121919, "epoch": 1468} {"train_loss": -22.303979873657227, "global_step": 121920, "epoch": 1468} {"train_loss": -22.962656021118164, "global_step": 121921, "epoch": 1468} {"train_loss": -22.825098037719727, "global_step": 121922, "epoch": 1468} {"train_loss": -22.429309844970703, "global_step": 121923, "epoch": 1468} {"train_loss": -22.47308921813965, "global_step": 121924, "epoch": 1468} {"train_loss": -22.678646087646484, "global_step": 121925, "epoch": 1468} {"train_loss": -22.55372945946383, "global_step": 121926, "epoch": 1468, "val_loss": 6190634.5} {"train_loss": -21.454675674438477, "global_step": 121927, "epoch": 1469} {"train_loss": -20.657129287719727, "global_step": 121928, "epoch": 1469} {"train_loss": -21.323453903198242, "global_step": 121929, "epoch": 1469} {"train_loss": -20.965938568115234, "global_step": 121930, "epoch": 1469} {"train_loss": -21.953575134277344, "global_step": 121931, "epoch": 1469} {"train_loss": -22.33048439025879, "global_step": 121932, "epoch": 1469} {"train_loss": -21.772146224975586, "global_step": 121933, "epoch": 1469} {"train_loss": -21.90546226501465, "global_step": 121934, "epoch": 1469} {"train_loss": -22.029977798461914, "global_step": 121935, "epoch": 1469} {"train_loss": -22.135684967041016, "global_step": 121936, "epoch": 1469} {"train_loss": -22.158063888549805, "global_step": 121937, "epoch": 1469} {"train_loss": -21.95754051208496, "global_step": 121938, "epoch": 1469} {"train_loss": -21.92585563659668, "global_step": 121939, "epoch": 1469} {"train_loss": -21.992380142211914, "global_step": 121940, "epoch": 1469} {"train_loss": -22.149761199951172, "global_step": 121941, "epoch": 1469} {"train_loss": -22.06262969970703, "global_step": 121942, "epoch": 1469} {"train_loss": -21.949228286743164, "global_step": 121943, "epoch": 1469} {"train_loss": -22.371950149536133, "global_step": 121944, "epoch": 1469} {"train_loss": -22.46502685546875, "global_step": 121945, "epoch": 1469} {"train_loss": -22.008604049682617, "global_step": 121946, "epoch": 1469} {"train_loss": -22.418813705444336, "global_step": 121947, "epoch": 1469} {"train_loss": -22.312376022338867, "global_step": 121948, "epoch": 1469} {"train_loss": -22.535890579223633, "global_step": 121949, "epoch": 1469} {"train_loss": -22.307430267333984, "global_step": 121950, "epoch": 1469} {"train_loss": -22.58624839782715, "global_step": 121951, "epoch": 1469} {"train_loss": -22.5645694732666, "global_step": 121952, "epoch": 1469} {"train_loss": -22.432950973510742, "global_step": 121953, "epoch": 1469} {"train_loss": -22.5164737701416, "global_step": 121954, "epoch": 1469} {"train_loss": -22.760223388671875, "global_step": 121955, "epoch": 1469} {"train_loss": -22.140161514282227, "global_step": 121956, "epoch": 1469} {"train_loss": -22.691078186035156, "global_step": 121957, "epoch": 1469} {"train_loss": -22.44259262084961, "global_step": 121958, "epoch": 1469} {"train_loss": -22.69599723815918, "global_step": 121959, "epoch": 1469} {"train_loss": -22.755390167236328, "global_step": 121960, "epoch": 1469} {"train_loss": -22.65424919128418, "global_step": 121961, "epoch": 1469} {"train_loss": -22.99049949645996, "global_step": 121962, "epoch": 1469} {"train_loss": -22.727460861206055, "global_step": 121963, "epoch": 1469} {"train_loss": -21.7486629486084, "global_step": 121964, "epoch": 1469} {"train_loss": -22.13699722290039, "global_step": 121965, "epoch": 1469} {"train_loss": -22.530841827392578, "global_step": 121966, "epoch": 1469} {"train_loss": -22.24131202697754, "global_step": 121967, "epoch": 1469} {"train_loss": -22.144153594970703, "global_step": 121968, "epoch": 1469} {"train_loss": -22.311321258544922, "global_step": 121969, "epoch": 1469} {"train_loss": -22.45590591430664, "global_step": 121970, "epoch": 1469} {"train_loss": -22.300703048706055, "global_step": 121971, "epoch": 1469} {"train_loss": -22.749370574951172, "global_step": 121972, "epoch": 1469} {"train_loss": -22.095121383666992, "global_step": 121973, "epoch": 1469} {"train_loss": -22.31568717956543, "global_step": 121974, "epoch": 1469} {"train_loss": -22.17072105407715, "global_step": 121975, "epoch": 1469} {"train_loss": -22.352773666381836, "global_step": 121976, "epoch": 1469} {"train_loss": -22.68918800354004, "global_step": 121977, "epoch": 1469} {"train_loss": -22.432233810424805, "global_step": 121978, "epoch": 1469} {"train_loss": -22.522449493408203, "global_step": 121979, "epoch": 1469} {"train_loss": -22.274349212646484, "global_step": 121980, "epoch": 1469} {"train_loss": -22.188373565673828, "global_step": 121981, "epoch": 1469} {"train_loss": -22.904855728149414, "global_step": 121982, "epoch": 1469} {"train_loss": -22.15081214904785, "global_step": 121983, "epoch": 1469} {"train_loss": -22.5583438873291, "global_step": 121984, "epoch": 1469} {"train_loss": -22.346271514892578, "global_step": 121985, "epoch": 1469} {"train_loss": -22.5244197845459, "global_step": 121986, "epoch": 1469} {"train_loss": -22.76311683654785, "global_step": 121987, "epoch": 1469} {"train_loss": -22.832128524780273, "global_step": 121988, "epoch": 1469} {"train_loss": -22.56477165222168, "global_step": 121989, "epoch": 1469} {"train_loss": -22.56441307067871, "global_step": 121990, "epoch": 1469} {"train_loss": -22.651845932006836, "global_step": 121991, "epoch": 1469} {"train_loss": -22.81511878967285, "global_step": 121992, "epoch": 1469} {"train_loss": -22.770936965942383, "global_step": 121993, "epoch": 1469} {"train_loss": -22.698196411132812, "global_step": 121994, "epoch": 1469} {"train_loss": -22.679040908813477, "global_step": 121995, "epoch": 1469} {"train_loss": -22.466541290283203, "global_step": 121996, "epoch": 1469} {"train_loss": -22.412097930908203, "global_step": 121997, "epoch": 1469} {"train_loss": -22.84819984436035, "global_step": 121998, "epoch": 1469} {"train_loss": -22.289947509765625, "global_step": 121999, "epoch": 1469} {"train_loss": -22.666189193725586, "global_step": 122000, "epoch": 1469} {"train_loss": -22.19782066345215, "global_step": 122001, "epoch": 1469} {"train_loss": -22.430265426635742, "global_step": 122002, "epoch": 1469} {"train_loss": -22.16359519958496, "global_step": 122003, "epoch": 1469} {"train_loss": -22.516450881958008, "global_step": 122004, "epoch": 1469} {"train_loss": -22.604188919067383, "global_step": 122005, "epoch": 1469} {"train_loss": -22.654123306274414, "global_step": 122006, "epoch": 1469} {"train_loss": -22.65821647644043, "global_step": 122007, "epoch": 1469} {"train_loss": -22.75664710998535, "global_step": 122008, "epoch": 1469} {"train_loss": -22.354559749005787, "global_step": 122009, "epoch": 1469, "val_loss": 6245126.0} {"train_loss": -22.107955932617188, "global_step": 122010, "epoch": 1470} {"train_loss": -22.26125144958496, "global_step": 122011, "epoch": 1470} {"train_loss": -22.041677474975586, "global_step": 122012, "epoch": 1470} {"train_loss": -21.8010311126709, "global_step": 122013, "epoch": 1470} {"train_loss": -22.3070068359375, "global_step": 122014, "epoch": 1470} {"train_loss": -21.74439239501953, "global_step": 122015, "epoch": 1470} {"train_loss": -22.758249282836914, "global_step": 122016, "epoch": 1470} {"train_loss": -21.720504760742188, "global_step": 122017, "epoch": 1470} {"train_loss": -22.088510513305664, "global_step": 122018, "epoch": 1470} {"train_loss": -22.362388610839844, "global_step": 122019, "epoch": 1470} {"train_loss": -22.076614379882812, "global_step": 122020, "epoch": 1470} {"train_loss": -22.810331344604492, "global_step": 122021, "epoch": 1470} {"train_loss": -22.53317642211914, "global_step": 122022, "epoch": 1470} {"train_loss": -22.292917251586914, "global_step": 122023, "epoch": 1470} {"train_loss": -22.69415283203125, "global_step": 122024, "epoch": 1470} {"train_loss": -22.330947875976562, "global_step": 122025, "epoch": 1470} {"train_loss": -22.443477630615234, "global_step": 122026, "epoch": 1470} {"train_loss": -22.386829376220703, "global_step": 122027, "epoch": 1470} {"train_loss": -22.35848045349121, "global_step": 122028, "epoch": 1470} {"train_loss": -22.709096908569336, "global_step": 122029, "epoch": 1470} {"train_loss": -22.512680053710938, "global_step": 122030, "epoch": 1470} {"train_loss": -22.743154525756836, "global_step": 122031, "epoch": 1470} {"train_loss": -22.262006759643555, "global_step": 122032, "epoch": 1470} {"train_loss": -22.561080932617188, "global_step": 122033, "epoch": 1470} {"train_loss": -22.703428268432617, "global_step": 122034, "epoch": 1470} {"train_loss": -22.510026931762695, "global_step": 122035, "epoch": 1470} {"train_loss": -22.821331024169922, "global_step": 122036, "epoch": 1470} {"train_loss": -22.347211837768555, "global_step": 122037, "epoch": 1470} {"train_loss": -22.263944625854492, "global_step": 122038, "epoch": 1470} {"train_loss": -22.629390716552734, "global_step": 122039, "epoch": 1470} {"train_loss": -22.575607299804688, "global_step": 122040, "epoch": 1470} {"train_loss": -22.663297653198242, "global_step": 122041, "epoch": 1470} {"train_loss": -22.74002456665039, "global_step": 122042, "epoch": 1470} {"train_loss": -22.849172592163086, "global_step": 122043, "epoch": 1470} {"train_loss": -22.415117263793945, "global_step": 122044, "epoch": 1470} {"train_loss": -22.576147079467773, "global_step": 122045, "epoch": 1470} {"train_loss": -22.690176010131836, "global_step": 122046, "epoch": 1470} {"train_loss": -22.864744186401367, "global_step": 122047, "epoch": 1470} {"train_loss": -22.489582061767578, "global_step": 122048, "epoch": 1470} {"train_loss": -22.775999069213867, "global_step": 122049, "epoch": 1470} {"train_loss": -22.51886558532715, "global_step": 122050, "epoch": 1470} {"train_loss": -22.646570205688477, "global_step": 122051, "epoch": 1470} {"train_loss": -22.67457389831543, "global_step": 122052, "epoch": 1470} {"train_loss": -22.666955947875977, "global_step": 122053, "epoch": 1470} {"train_loss": -22.454397201538086, "global_step": 122054, "epoch": 1470} {"train_loss": -22.623682022094727, "global_step": 122055, "epoch": 1470} {"train_loss": -22.643766403198242, "global_step": 122056, "epoch": 1470} {"train_loss": -22.595653533935547, "global_step": 122057, "epoch": 1470} {"train_loss": -22.455463409423828, "global_step": 122058, "epoch": 1470} {"train_loss": -22.416818618774414, "global_step": 122059, "epoch": 1470} {"train_loss": -22.77646255493164, "global_step": 122060, "epoch": 1470} {"train_loss": -22.583703994750977, "global_step": 122061, "epoch": 1470} {"train_loss": -22.750198364257812, "global_step": 122062, "epoch": 1470} {"train_loss": -22.71078872680664, "global_step": 122063, "epoch": 1470} {"train_loss": -22.333084106445312, "global_step": 122064, "epoch": 1470} {"train_loss": -22.34124183654785, "global_step": 122065, "epoch": 1470} {"train_loss": -22.607656478881836, "global_step": 122066, "epoch": 1470} {"train_loss": -22.57395362854004, "global_step": 122067, "epoch": 1470} {"train_loss": -22.606449127197266, "global_step": 122068, "epoch": 1470} {"train_loss": -22.696456909179688, "global_step": 122069, "epoch": 1470} {"train_loss": -22.761383056640625, "global_step": 122070, "epoch": 1470} {"train_loss": -22.15656852722168, "global_step": 122071, "epoch": 1470} {"train_loss": -22.522920608520508, "global_step": 122072, "epoch": 1470} {"train_loss": -22.413293838500977, "global_step": 122073, "epoch": 1470} {"train_loss": -22.814315795898438, "global_step": 122074, "epoch": 1470} {"train_loss": -22.88648796081543, "global_step": 122075, "epoch": 1470} {"train_loss": -22.646703720092773, "global_step": 122076, "epoch": 1470} {"train_loss": -22.51100730895996, "global_step": 122077, "epoch": 1470} {"train_loss": -22.486713409423828, "global_step": 122078, "epoch": 1470} {"train_loss": -22.335163116455078, "global_step": 122079, "epoch": 1470} {"train_loss": -22.384428024291992, "global_step": 122080, "epoch": 1470} {"train_loss": -22.866544723510742, "global_step": 122081, "epoch": 1470} {"train_loss": -22.723600387573242, "global_step": 122082, "epoch": 1470} {"train_loss": -22.770986557006836, "global_step": 122083, "epoch": 1470} {"train_loss": -22.78042221069336, "global_step": 122084, "epoch": 1470} {"train_loss": -22.74167823791504, "global_step": 122085, "epoch": 1470} {"train_loss": -22.70233154296875, "global_step": 122086, "epoch": 1470} {"train_loss": -22.557907104492188, "global_step": 122087, "epoch": 1470} {"train_loss": -22.42246437072754, "global_step": 122088, "epoch": 1470} {"train_loss": -22.625314712524414, "global_step": 122089, "epoch": 1470} {"train_loss": -22.873432159423828, "global_step": 122090, "epoch": 1470} {"train_loss": -22.747421264648438, "global_step": 122091, "epoch": 1470} {"train_loss": -22.523551619196514, "global_step": 122092, "epoch": 1470, "val_loss": 6196592.0} {"train_loss": -22.36640739440918, "global_step": 122093, "epoch": 1471} {"train_loss": -22.299070358276367, "global_step": 122094, "epoch": 1471} {"train_loss": -22.159423828125, "global_step": 122095, "epoch": 1471} {"train_loss": -22.652938842773438, "global_step": 122096, "epoch": 1471} {"train_loss": -22.688339233398438, "global_step": 122097, "epoch": 1471} {"train_loss": -22.335195541381836, "global_step": 122098, "epoch": 1471} {"train_loss": -22.409894943237305, "global_step": 122099, "epoch": 1471} {"train_loss": -22.587514877319336, "global_step": 122100, "epoch": 1471} {"train_loss": -22.486347198486328, "global_step": 122101, "epoch": 1471} {"train_loss": -22.0402774810791, "global_step": 122102, "epoch": 1471} {"train_loss": -22.437475204467773, "global_step": 122103, "epoch": 1471} {"train_loss": -22.264616012573242, "global_step": 122104, "epoch": 1471} {"train_loss": -22.50164031982422, "global_step": 122105, "epoch": 1471} {"train_loss": -22.523761749267578, "global_step": 122106, "epoch": 1471} {"train_loss": -22.613622665405273, "global_step": 122107, "epoch": 1471} {"train_loss": -22.96399688720703, "global_step": 122108, "epoch": 1471} {"train_loss": -22.180999755859375, "global_step": 122109, "epoch": 1471} {"train_loss": -22.283689498901367, "global_step": 122110, "epoch": 1471} {"train_loss": -22.590269088745117, "global_step": 122111, "epoch": 1471} {"train_loss": -22.200305938720703, "global_step": 122112, "epoch": 1471} {"train_loss": -22.213716506958008, "global_step": 122113, "epoch": 1471} {"train_loss": -22.363433837890625, "global_step": 122114, "epoch": 1471} {"train_loss": -22.45404624938965, "global_step": 122115, "epoch": 1471} {"train_loss": -23.005828857421875, "global_step": 122116, "epoch": 1471} {"train_loss": -22.940298080444336, "global_step": 122117, "epoch": 1471} {"train_loss": -22.735382080078125, "global_step": 122118, "epoch": 1471} {"train_loss": -22.70600700378418, "global_step": 122119, "epoch": 1471} {"train_loss": -22.405614852905273, "global_step": 122120, "epoch": 1471} {"train_loss": -22.487516403198242, "global_step": 122121, "epoch": 1471} {"train_loss": -22.746469497680664, "global_step": 122122, "epoch": 1471} {"train_loss": -22.54281997680664, "global_step": 122123, "epoch": 1471} {"train_loss": -22.40752601623535, "global_step": 122124, "epoch": 1471} {"train_loss": -23.087236404418945, "global_step": 122125, "epoch": 1471} {"train_loss": -22.668094635009766, "global_step": 122126, "epoch": 1471} {"train_loss": -22.763376235961914, "global_step": 122127, "epoch": 1471} {"train_loss": -22.759611129760742, "global_step": 122128, "epoch": 1471} {"train_loss": -22.721837997436523, "global_step": 122129, "epoch": 1471} {"train_loss": -22.760467529296875, "global_step": 122130, "epoch": 1471} {"train_loss": -22.37265396118164, "global_step": 122131, "epoch": 1471} {"train_loss": -23.184728622436523, "global_step": 122132, "epoch": 1471} {"train_loss": -22.897750854492188, "global_step": 122133, "epoch": 1471} {"train_loss": -22.704723358154297, "global_step": 122134, "epoch": 1471} {"train_loss": -22.4971923828125, "global_step": 122135, "epoch": 1471} {"train_loss": -22.897790908813477, "global_step": 122136, "epoch": 1471} {"train_loss": -22.678312301635742, "global_step": 122137, "epoch": 1471} {"train_loss": -22.614948272705078, "global_step": 122138, "epoch": 1471} {"train_loss": -21.99383544921875, "global_step": 122139, "epoch": 1471} {"train_loss": -22.367624282836914, "global_step": 122140, "epoch": 1471} {"train_loss": -22.62334632873535, "global_step": 122141, "epoch": 1471} {"train_loss": -22.89707374572754, "global_step": 122142, "epoch": 1471} {"train_loss": -22.480558395385742, "global_step": 122143, "epoch": 1471} {"train_loss": -23.027053833007812, "global_step": 122144, "epoch": 1471} {"train_loss": -22.75532341003418, "global_step": 122145, "epoch": 1471} {"train_loss": -22.857315063476562, "global_step": 122146, "epoch": 1471} {"train_loss": -22.965436935424805, "global_step": 122147, "epoch": 1471} {"train_loss": -22.93071174621582, "global_step": 122148, "epoch": 1471} {"train_loss": -22.832788467407227, "global_step": 122149, "epoch": 1471} {"train_loss": -22.352258682250977, "global_step": 122150, "epoch": 1471} {"train_loss": -22.53342056274414, "global_step": 122151, "epoch": 1471} {"train_loss": -22.909412384033203, "global_step": 122152, "epoch": 1471} {"train_loss": -22.275285720825195, "global_step": 122153, "epoch": 1471} {"train_loss": -22.42919158935547, "global_step": 122154, "epoch": 1471} {"train_loss": -22.455793380737305, "global_step": 122155, "epoch": 1471} {"train_loss": -22.283939361572266, "global_step": 122156, "epoch": 1471} {"train_loss": -22.518293380737305, "global_step": 122157, "epoch": 1471} {"train_loss": -22.95449447631836, "global_step": 122158, "epoch": 1471} {"train_loss": -22.707965850830078, "global_step": 122159, "epoch": 1471} {"train_loss": -22.627544403076172, "global_step": 122160, "epoch": 1471} {"train_loss": -22.634586334228516, "global_step": 122161, "epoch": 1471} {"train_loss": -22.479036331176758, "global_step": 122162, "epoch": 1471} {"train_loss": -22.6287899017334, "global_step": 122163, "epoch": 1471} {"train_loss": -22.66361427307129, "global_step": 122164, "epoch": 1471} {"train_loss": -22.22743797302246, "global_step": 122165, "epoch": 1471} {"train_loss": -22.276872634887695, "global_step": 122166, "epoch": 1471} {"train_loss": -22.22066307067871, "global_step": 122167, "epoch": 1471} {"train_loss": -22.334613800048828, "global_step": 122168, "epoch": 1471} {"train_loss": -23.015220642089844, "global_step": 122169, "epoch": 1471} {"train_loss": -22.616153717041016, "global_step": 122170, "epoch": 1471} {"train_loss": -22.770906448364258, "global_step": 122171, "epoch": 1471} {"train_loss": -22.63285255432129, "global_step": 122172, "epoch": 1471} {"train_loss": -22.70893669128418, "global_step": 122173, "epoch": 1471} {"train_loss": -22.19147491455078, "global_step": 122174, "epoch": 1471} {"train_loss": -22.574201193200537, "global_step": 122175, "epoch": 1471, "val_loss": 6271849.5} {"train_loss": -21.303709030151367, "global_step": 122176, "epoch": 1472} {"train_loss": -21.152616500854492, "global_step": 122177, "epoch": 1472} {"train_loss": -21.3138370513916, "global_step": 122178, "epoch": 1472} {"train_loss": -22.226964950561523, "global_step": 122179, "epoch": 1472} {"train_loss": -21.25625991821289, "global_step": 122180, "epoch": 1472} {"train_loss": -21.98670768737793, "global_step": 122181, "epoch": 1472} {"train_loss": -22.08612060546875, "global_step": 122182, "epoch": 1472} {"train_loss": -22.105443954467773, "global_step": 122183, "epoch": 1472} {"train_loss": -21.54024314880371, "global_step": 122184, "epoch": 1472} {"train_loss": -21.746456146240234, "global_step": 122185, "epoch": 1472} {"train_loss": -22.17078971862793, "global_step": 122186, "epoch": 1472} {"train_loss": -22.07180404663086, "global_step": 122187, "epoch": 1472} {"train_loss": -22.09549903869629, "global_step": 122188, "epoch": 1472} {"train_loss": -21.838350296020508, "global_step": 122189, "epoch": 1472} {"train_loss": -22.131305694580078, "global_step": 122190, "epoch": 1472} {"train_loss": -22.158266067504883, "global_step": 122191, "epoch": 1472} {"train_loss": -22.17079734802246, "global_step": 122192, "epoch": 1472} {"train_loss": -21.963180541992188, "global_step": 122193, "epoch": 1472} {"train_loss": -22.35913848876953, "global_step": 122194, "epoch": 1472} {"train_loss": -22.550168991088867, "global_step": 122195, "epoch": 1472} {"train_loss": -21.72498893737793, "global_step": 122196, "epoch": 1472} {"train_loss": -22.624637603759766, "global_step": 122197, "epoch": 1472} {"train_loss": -22.253826141357422, "global_step": 122198, "epoch": 1472} {"train_loss": -22.284635543823242, "global_step": 122199, "epoch": 1472} {"train_loss": -22.42003631591797, "global_step": 122200, "epoch": 1472} {"train_loss": -22.315170288085938, "global_step": 122201, "epoch": 1472} {"train_loss": -22.288211822509766, "global_step": 122202, "epoch": 1472} {"train_loss": -22.258920669555664, "global_step": 122203, "epoch": 1472} {"train_loss": -22.813770294189453, "global_step": 122204, "epoch": 1472} {"train_loss": -22.562528610229492, "global_step": 122205, "epoch": 1472} {"train_loss": -22.782211303710938, "global_step": 122206, "epoch": 1472} {"train_loss": -22.464365005493164, "global_step": 122207, "epoch": 1472} {"train_loss": -22.76112174987793, "global_step": 122208, "epoch": 1472} {"train_loss": -22.71027183532715, "global_step": 122209, "epoch": 1472} {"train_loss": -22.684518814086914, "global_step": 122210, "epoch": 1472} {"train_loss": -22.857479095458984, "global_step": 122211, "epoch": 1472} {"train_loss": -22.73436164855957, "global_step": 122212, "epoch": 1472} {"train_loss": -22.471874237060547, "global_step": 122213, "epoch": 1472} {"train_loss": -22.39151382446289, "global_step": 122214, "epoch": 1472} {"train_loss": -22.453901290893555, "global_step": 122215, "epoch": 1472} {"train_loss": -22.470932006835938, "global_step": 122216, "epoch": 1472} {"train_loss": -22.68941307067871, "global_step": 122217, "epoch": 1472} {"train_loss": -23.19472312927246, "global_step": 122218, "epoch": 1472} {"train_loss": -22.878210067749023, "global_step": 122219, "epoch": 1472} {"train_loss": -22.784780502319336, "global_step": 122220, "epoch": 1472} {"train_loss": -22.512794494628906, "global_step": 122221, "epoch": 1472} {"train_loss": -22.29483413696289, "global_step": 122222, "epoch": 1472} {"train_loss": -23.14497947692871, "global_step": 122223, "epoch": 1472} {"train_loss": -22.293161392211914, "global_step": 122224, "epoch": 1472} {"train_loss": -22.789888381958008, "global_step": 122225, "epoch": 1472} {"train_loss": -22.548797607421875, "global_step": 122226, "epoch": 1472} {"train_loss": -22.87153434753418, "global_step": 122227, "epoch": 1472} {"train_loss": -22.1679744720459, "global_step": 122228, "epoch": 1472} {"train_loss": -22.69985008239746, "global_step": 122229, "epoch": 1472} {"train_loss": -22.175518035888672, "global_step": 122230, "epoch": 1472} {"train_loss": -22.40021324157715, "global_step": 122231, "epoch": 1472} {"train_loss": -22.633258819580078, "global_step": 122232, "epoch": 1472} {"train_loss": -22.881628036499023, "global_step": 122233, "epoch": 1472} {"train_loss": -22.711658477783203, "global_step": 122234, "epoch": 1472} {"train_loss": -23.049407958984375, "global_step": 122235, "epoch": 1472} {"train_loss": -22.643115997314453, "global_step": 122236, "epoch": 1472} {"train_loss": -22.28955841064453, "global_step": 122237, "epoch": 1472} {"train_loss": -22.584562301635742, "global_step": 122238, "epoch": 1472} {"train_loss": -22.716861724853516, "global_step": 122239, "epoch": 1472} {"train_loss": -22.625425338745117, "global_step": 122240, "epoch": 1472} {"train_loss": -22.74539566040039, "global_step": 122241, "epoch": 1472} {"train_loss": -22.695131301879883, "global_step": 122242, "epoch": 1472} {"train_loss": -22.54199981689453, "global_step": 122243, "epoch": 1472} {"train_loss": -22.324838638305664, "global_step": 122244, "epoch": 1472} {"train_loss": -22.881561279296875, "global_step": 122245, "epoch": 1472} {"train_loss": -22.66324234008789, "global_step": 122246, "epoch": 1472} {"train_loss": -22.77927589416504, "global_step": 122247, "epoch": 1472} {"train_loss": -22.70526695251465, "global_step": 122248, "epoch": 1472} {"train_loss": -22.304105758666992, "global_step": 122249, "epoch": 1472} {"train_loss": -22.909170150756836, "global_step": 122250, "epoch": 1472} {"train_loss": -22.5179500579834, "global_step": 122251, "epoch": 1472} {"train_loss": -22.906492233276367, "global_step": 122252, "epoch": 1472} {"train_loss": -22.42179298400879, "global_step": 122253, "epoch": 1472} {"train_loss": -22.941654205322266, "global_step": 122254, "epoch": 1472} {"train_loss": -22.597076416015625, "global_step": 122255, "epoch": 1472} {"train_loss": -22.598569869995117, "global_step": 122256, "epoch": 1472} {"train_loss": -22.457199096679688, "global_step": 122257, "epoch": 1472} {"train_loss": -22.427739223801947, "global_step": 122258, "epoch": 1472, "val_loss": 6256220.5} {"train_loss": -22.484220504760742, "global_step": 122259, "epoch": 1473} {"train_loss": -21.867101669311523, "global_step": 122260, "epoch": 1473} {"train_loss": -22.54184913635254, "global_step": 122261, "epoch": 1473} {"train_loss": -22.397558212280273, "global_step": 122262, "epoch": 1473} {"train_loss": -22.56851577758789, "global_step": 122263, "epoch": 1473} {"train_loss": -22.18662452697754, "global_step": 122264, "epoch": 1473} {"train_loss": -22.222925186157227, "global_step": 122265, "epoch": 1473} {"train_loss": -22.048721313476562, "global_step": 122266, "epoch": 1473} {"train_loss": -22.351945877075195, "global_step": 122267, "epoch": 1473} {"train_loss": -22.365375518798828, "global_step": 122268, "epoch": 1473} {"train_loss": -22.339401245117188, "global_step": 122269, "epoch": 1473} {"train_loss": -22.1954345703125, "global_step": 122270, "epoch": 1473} {"train_loss": -22.5283145904541, "global_step": 122271, "epoch": 1473} {"train_loss": -22.378591537475586, "global_step": 122272, "epoch": 1473} {"train_loss": -22.487539291381836, "global_step": 122273, "epoch": 1473} {"train_loss": -22.729215621948242, "global_step": 122274, "epoch": 1473} {"train_loss": -22.260496139526367, "global_step": 122275, "epoch": 1473} {"train_loss": -22.709815979003906, "global_step": 122276, "epoch": 1473} {"train_loss": -22.54847526550293, "global_step": 122277, "epoch": 1473} {"train_loss": -22.933517456054688, "global_step": 122278, "epoch": 1473} {"train_loss": -22.635303497314453, "global_step": 122279, "epoch": 1473} {"train_loss": -22.187191009521484, "global_step": 122280, "epoch": 1473} {"train_loss": -22.932950973510742, "global_step": 122281, "epoch": 1473} {"train_loss": -22.54151153564453, "global_step": 122282, "epoch": 1473} {"train_loss": -22.558135986328125, "global_step": 122283, "epoch": 1473} {"train_loss": -22.56447410583496, "global_step": 122284, "epoch": 1473} {"train_loss": -22.5718936920166, "global_step": 122285, "epoch": 1473} {"train_loss": -22.36980438232422, "global_step": 122286, "epoch": 1473} {"train_loss": -22.84935760498047, "global_step": 122287, "epoch": 1473} {"train_loss": -22.329927444458008, "global_step": 122288, "epoch": 1473} {"train_loss": -22.728382110595703, "global_step": 122289, "epoch": 1473} {"train_loss": -22.351896286010742, "global_step": 122290, "epoch": 1473} {"train_loss": -22.466718673706055, "global_step": 122291, "epoch": 1473} {"train_loss": -22.650373458862305, "global_step": 122292, "epoch": 1473} {"train_loss": -22.3762149810791, "global_step": 122293, "epoch": 1473} {"train_loss": -22.73688316345215, "global_step": 122294, "epoch": 1473} {"train_loss": -22.662805557250977, "global_step": 122295, "epoch": 1473} {"train_loss": -22.249374389648438, "global_step": 122296, "epoch": 1473} {"train_loss": -22.46331787109375, "global_step": 122297, "epoch": 1473} {"train_loss": -22.258543014526367, "global_step": 122298, "epoch": 1473} {"train_loss": -22.356388092041016, "global_step": 122299, "epoch": 1473} {"train_loss": -22.608768463134766, "global_step": 122300, "epoch": 1473} {"train_loss": -22.752988815307617, "global_step": 122301, "epoch": 1473} {"train_loss": -22.908231735229492, "global_step": 122302, "epoch": 1473} {"train_loss": -22.64823341369629, "global_step": 122303, "epoch": 1473} {"train_loss": -22.768924713134766, "global_step": 122304, "epoch": 1473} {"train_loss": -22.601259231567383, "global_step": 122305, "epoch": 1473} {"train_loss": -22.26825523376465, "global_step": 122306, "epoch": 1473} {"train_loss": -23.3487548828125, "global_step": 122307, "epoch": 1473} {"train_loss": -22.980195999145508, "global_step": 122308, "epoch": 1473} {"train_loss": -22.489057540893555, "global_step": 122309, "epoch": 1473} {"train_loss": -22.507144927978516, "global_step": 122310, "epoch": 1473} {"train_loss": -23.14310073852539, "global_step": 122311, "epoch": 1473} {"train_loss": -22.4440975189209, "global_step": 122312, "epoch": 1473} {"train_loss": -22.791776657104492, "global_step": 122313, "epoch": 1473} {"train_loss": -22.608760833740234, "global_step": 122314, "epoch": 1473} {"train_loss": -22.555625915527344, "global_step": 122315, "epoch": 1473} {"train_loss": -22.493642807006836, "global_step": 122316, "epoch": 1473} {"train_loss": -22.536109924316406, "global_step": 122317, "epoch": 1473} {"train_loss": -22.61909294128418, "global_step": 122318, "epoch": 1473} {"train_loss": -22.68434715270996, "global_step": 122319, "epoch": 1473} {"train_loss": -22.20167350769043, "global_step": 122320, "epoch": 1473} {"train_loss": -22.235942840576172, "global_step": 122321, "epoch": 1473} {"train_loss": -22.59733009338379, "global_step": 122322, "epoch": 1473} {"train_loss": -22.552993774414062, "global_step": 122323, "epoch": 1473} {"train_loss": -22.788820266723633, "global_step": 122324, "epoch": 1473} {"train_loss": -22.336759567260742, "global_step": 122325, "epoch": 1473} {"train_loss": -22.40178871154785, "global_step": 122326, "epoch": 1473} {"train_loss": -22.623437881469727, "global_step": 122327, "epoch": 1473} {"train_loss": -23.042299270629883, "global_step": 122328, "epoch": 1473} {"train_loss": -22.364133834838867, "global_step": 122329, "epoch": 1473} {"train_loss": -22.538715362548828, "global_step": 122330, "epoch": 1473} {"train_loss": -22.504472732543945, "global_step": 122331, "epoch": 1473} {"train_loss": -22.151281356811523, "global_step": 122332, "epoch": 1473} {"train_loss": -22.50471305847168, "global_step": 122333, "epoch": 1473} {"train_loss": -22.50905418395996, "global_step": 122334, "epoch": 1473} {"train_loss": -23.034332275390625, "global_step": 122335, "epoch": 1473} {"train_loss": -22.590009689331055, "global_step": 122336, "epoch": 1473} {"train_loss": -22.457107543945312, "global_step": 122337, "epoch": 1473} {"train_loss": -22.665979385375977, "global_step": 122338, "epoch": 1473} {"train_loss": -22.679651260375977, "global_step": 122339, "epoch": 1473} {"train_loss": -22.2642879486084, "global_step": 122340, "epoch": 1473} {"train_loss": -22.52842783640666, "global_step": 122341, "epoch": 1473, "val_loss": 6237870.0} {"train_loss": -22.209129333496094, "global_step": 122342, "epoch": 1474} {"train_loss": -22.07657241821289, "global_step": 122343, "epoch": 1474} {"train_loss": -22.713037490844727, "global_step": 122344, "epoch": 1474} {"train_loss": -22.35549545288086, "global_step": 122345, "epoch": 1474} {"train_loss": -22.58158302307129, "global_step": 122346, "epoch": 1474} {"train_loss": -22.599756240844727, "global_step": 122347, "epoch": 1474} {"train_loss": -22.282567977905273, "global_step": 122348, "epoch": 1474} {"train_loss": -22.097856521606445, "global_step": 122349, "epoch": 1474} {"train_loss": -22.52115249633789, "global_step": 122350, "epoch": 1474} {"train_loss": -22.51104164123535, "global_step": 122351, "epoch": 1474} {"train_loss": -22.711265563964844, "global_step": 122352, "epoch": 1474} {"train_loss": -22.837907791137695, "global_step": 122353, "epoch": 1474} {"train_loss": -22.095947265625, "global_step": 122354, "epoch": 1474} {"train_loss": -22.742521286010742, "global_step": 122355, "epoch": 1474} {"train_loss": -22.301443099975586, "global_step": 122356, "epoch": 1474} {"train_loss": -22.442630767822266, "global_step": 122357, "epoch": 1474} {"train_loss": -22.183670043945312, "global_step": 122358, "epoch": 1474} {"train_loss": -22.159748077392578, "global_step": 122359, "epoch": 1474} {"train_loss": -22.525772094726562, "global_step": 122360, "epoch": 1474} {"train_loss": -22.417417526245117, "global_step": 122361, "epoch": 1474} {"train_loss": -22.626251220703125, "global_step": 122362, "epoch": 1474} {"train_loss": -22.604421615600586, "global_step": 122363, "epoch": 1474} {"train_loss": -22.86577606201172, "global_step": 122364, "epoch": 1474} {"train_loss": -22.496126174926758, "global_step": 122365, "epoch": 1474} {"train_loss": -22.625057220458984, "global_step": 122366, "epoch": 1474} {"train_loss": -22.43415641784668, "global_step": 122367, "epoch": 1474} {"train_loss": -22.749914169311523, "global_step": 122368, "epoch": 1474} {"train_loss": -22.829729080200195, "global_step": 122369, "epoch": 1474} {"train_loss": -22.82513999938965, "global_step": 122370, "epoch": 1474} {"train_loss": -22.628820419311523, "global_step": 122371, "epoch": 1474} {"train_loss": -22.79742431640625, "global_step": 122372, "epoch": 1474} {"train_loss": -22.541427612304688, "global_step": 122373, "epoch": 1474} {"train_loss": -22.6738338470459, "global_step": 122374, "epoch": 1474} {"train_loss": -22.628559112548828, "global_step": 122375, "epoch": 1474} {"train_loss": -22.796707153320312, "global_step": 122376, "epoch": 1474} {"train_loss": -22.57464599609375, "global_step": 122377, "epoch": 1474} {"train_loss": -22.572341918945312, "global_step": 122378, "epoch": 1474} {"train_loss": -22.622095108032227, "global_step": 122379, "epoch": 1474} {"train_loss": -22.936185836791992, "global_step": 122380, "epoch": 1474} {"train_loss": -22.620595932006836, "global_step": 122381, "epoch": 1474} {"train_loss": -22.940214157104492, "global_step": 122382, "epoch": 1474} {"train_loss": -22.60447883605957, "global_step": 122383, "epoch": 1474} {"train_loss": -22.790563583374023, "global_step": 122384, "epoch": 1474} {"train_loss": -22.614639282226562, "global_step": 122385, "epoch": 1474} {"train_loss": -22.79341697692871, "global_step": 122386, "epoch": 1474} {"train_loss": -22.8956298828125, "global_step": 122387, "epoch": 1474} {"train_loss": -22.545927047729492, "global_step": 122388, "epoch": 1474} {"train_loss": -22.51658821105957, "global_step": 122389, "epoch": 1474} {"train_loss": -23.00111198425293, "global_step": 122390, "epoch": 1474} {"train_loss": -22.77098846435547, "global_step": 122391, "epoch": 1474} {"train_loss": -22.81553840637207, "global_step": 122392, "epoch": 1474} {"train_loss": -22.384611129760742, "global_step": 122393, "epoch": 1474} {"train_loss": -22.47682762145996, "global_step": 122394, "epoch": 1474} {"train_loss": -22.765655517578125, "global_step": 122395, "epoch": 1474} {"train_loss": -22.757917404174805, "global_step": 122396, "epoch": 1474} {"train_loss": -22.669082641601562, "global_step": 122397, "epoch": 1474} {"train_loss": -22.906360626220703, "global_step": 122398, "epoch": 1474} {"train_loss": -22.719860076904297, "global_step": 122399, "epoch": 1474} {"train_loss": -22.557483673095703, "global_step": 122400, "epoch": 1474} {"train_loss": -22.691843032836914, "global_step": 122401, "epoch": 1474} {"train_loss": -22.744794845581055, "global_step": 122402, "epoch": 1474} {"train_loss": -22.64336585998535, "global_step": 122403, "epoch": 1474} {"train_loss": -22.508899688720703, "global_step": 122404, "epoch": 1474} {"train_loss": -22.252958297729492, "global_step": 122405, "epoch": 1474} {"train_loss": -22.968738555908203, "global_step": 122406, "epoch": 1474} {"train_loss": -22.82377052307129, "global_step": 122407, "epoch": 1474} {"train_loss": -22.441625595092773, "global_step": 122408, "epoch": 1474} {"train_loss": -22.47960090637207, "global_step": 122409, "epoch": 1474} {"train_loss": -22.67055892944336, "global_step": 122410, "epoch": 1474} {"train_loss": -22.512449264526367, "global_step": 122411, "epoch": 1474} {"train_loss": -22.465152740478516, "global_step": 122412, "epoch": 1474} {"train_loss": -22.1881046295166, "global_step": 122413, "epoch": 1474} {"train_loss": -22.021806716918945, "global_step": 122414, "epoch": 1474} {"train_loss": -22.48666763305664, "global_step": 122415, "epoch": 1474} {"train_loss": -22.35483741760254, "global_step": 122416, "epoch": 1474} {"train_loss": -22.463367462158203, "global_step": 122417, "epoch": 1474} {"train_loss": -22.42361831665039, "global_step": 122418, "epoch": 1474} {"train_loss": -22.605844497680664, "global_step": 122419, "epoch": 1474} {"train_loss": -22.525453567504883, "global_step": 122420, "epoch": 1474} {"train_loss": -22.892568588256836, "global_step": 122421, "epoch": 1474} {"train_loss": -22.377689361572266, "global_step": 122422, "epoch": 1474} {"train_loss": -22.396778106689453, "global_step": 122423, "epoch": 1474} {"train_loss": -22.558945069830102, "global_step": 122424, "epoch": 1474, "val_loss": 6183700.0} {"train_loss": -22.0816650390625, "global_step": 122425, "epoch": 1475} {"train_loss": -22.40558624267578, "global_step": 122426, "epoch": 1475} {"train_loss": -22.342086791992188, "global_step": 122427, "epoch": 1475} {"train_loss": -22.465526580810547, "global_step": 122428, "epoch": 1475} {"train_loss": -22.509183883666992, "global_step": 122429, "epoch": 1475} {"train_loss": -22.096593856811523, "global_step": 122430, "epoch": 1475} {"train_loss": -22.761917114257812, "global_step": 122431, "epoch": 1475} {"train_loss": -22.544498443603516, "global_step": 122432, "epoch": 1475} {"train_loss": -22.416645050048828, "global_step": 122433, "epoch": 1475} {"train_loss": -22.079254150390625, "global_step": 122434, "epoch": 1475} {"train_loss": -22.674875259399414, "global_step": 122435, "epoch": 1475} {"train_loss": -22.207279205322266, "global_step": 122436, "epoch": 1475} {"train_loss": -22.53656578063965, "global_step": 122437, "epoch": 1475} {"train_loss": -22.35690689086914, "global_step": 122438, "epoch": 1475} {"train_loss": -22.553518295288086, "global_step": 122439, "epoch": 1475} {"train_loss": -22.571794509887695, "global_step": 122440, "epoch": 1475} {"train_loss": -22.42997932434082, "global_step": 122441, "epoch": 1475} {"train_loss": -22.766164779663086, "global_step": 122442, "epoch": 1475} {"train_loss": -22.287527084350586, "global_step": 122443, "epoch": 1475} {"train_loss": -22.50641441345215, "global_step": 122444, "epoch": 1475} {"train_loss": -22.51078224182129, "global_step": 122445, "epoch": 1475} {"train_loss": -22.67936134338379, "global_step": 122446, "epoch": 1475} {"train_loss": -22.519765853881836, "global_step": 122447, "epoch": 1475} {"train_loss": -22.469738006591797, "global_step": 122448, "epoch": 1475} {"train_loss": -22.235260009765625, "global_step": 122449, "epoch": 1475} {"train_loss": -22.61766242980957, "global_step": 122450, "epoch": 1475} {"train_loss": -22.396032333374023, "global_step": 122451, "epoch": 1475} {"train_loss": -22.75244140625, "global_step": 122452, "epoch": 1475} {"train_loss": -22.31597137451172, "global_step": 122453, "epoch": 1475} {"train_loss": -22.412282943725586, "global_step": 122454, "epoch": 1475} {"train_loss": -22.602731704711914, "global_step": 122455, "epoch": 1475} {"train_loss": -22.53171730041504, "global_step": 122456, "epoch": 1475} {"train_loss": -22.782819747924805, "global_step": 122457, "epoch": 1475} {"train_loss": -22.380863189697266, "global_step": 122458, "epoch": 1475} {"train_loss": -22.562368392944336, "global_step": 122459, "epoch": 1475} {"train_loss": -22.757854461669922, "global_step": 122460, "epoch": 1475} {"train_loss": -22.824155807495117, "global_step": 122461, "epoch": 1475} {"train_loss": -22.7164306640625, "global_step": 122462, "epoch": 1475} {"train_loss": -22.76104736328125, "global_step": 122463, "epoch": 1475} {"train_loss": -22.76010513305664, "global_step": 122464, "epoch": 1475} {"train_loss": -23.028593063354492, "global_step": 122465, "epoch": 1475} {"train_loss": -22.72539710998535, "global_step": 122466, "epoch": 1475} {"train_loss": -22.59389877319336, "global_step": 122467, "epoch": 1475} {"train_loss": -22.202009201049805, "global_step": 122468, "epoch": 1475} {"train_loss": -22.597843170166016, "global_step": 122469, "epoch": 1475} {"train_loss": -22.68951988220215, "global_step": 122470, "epoch": 1475} {"train_loss": -22.63799476623535, "global_step": 122471, "epoch": 1475} {"train_loss": -22.33551025390625, "global_step": 122472, "epoch": 1475} {"train_loss": -22.25, "global_step": 122473, "epoch": 1475} {"train_loss": -22.711912155151367, "global_step": 122474, "epoch": 1475} {"train_loss": -22.380510330200195, "global_step": 122475, "epoch": 1475} {"train_loss": -22.378376007080078, "global_step": 122476, "epoch": 1475} {"train_loss": -22.61830711364746, "global_step": 122477, "epoch": 1475} {"train_loss": -22.659317016601562, "global_step": 122478, "epoch": 1475} {"train_loss": -21.99117660522461, "global_step": 122479, "epoch": 1475} {"train_loss": -22.890052795410156, "global_step": 122480, "epoch": 1475} {"train_loss": -22.589933395385742, "global_step": 122481, "epoch": 1475} {"train_loss": -22.601348876953125, "global_step": 122482, "epoch": 1475} {"train_loss": -22.98455238342285, "global_step": 122483, "epoch": 1475} {"train_loss": -22.909399032592773, "global_step": 122484, "epoch": 1475} {"train_loss": -22.534337997436523, "global_step": 122485, "epoch": 1475} {"train_loss": -22.25844383239746, "global_step": 122486, "epoch": 1475} {"train_loss": -22.455013275146484, "global_step": 122487, "epoch": 1475} {"train_loss": -22.68185806274414, "global_step": 122488, "epoch": 1475} {"train_loss": -22.619359970092773, "global_step": 122489, "epoch": 1475} {"train_loss": -22.459970474243164, "global_step": 122490, "epoch": 1475} {"train_loss": -23.10370445251465, "global_step": 122491, "epoch": 1475} {"train_loss": -22.478147506713867, "global_step": 122492, "epoch": 1475} {"train_loss": -22.635414123535156, "global_step": 122493, "epoch": 1475} {"train_loss": -22.704694747924805, "global_step": 122494, "epoch": 1475} {"train_loss": -22.72685432434082, "global_step": 122495, "epoch": 1475} {"train_loss": -22.734464645385742, "global_step": 122496, "epoch": 1475} {"train_loss": -22.43367576599121, "global_step": 122497, "epoch": 1475} {"train_loss": -22.569547653198242, "global_step": 122498, "epoch": 1475} {"train_loss": -23.089136123657227, "global_step": 122499, "epoch": 1475} {"train_loss": -22.845300674438477, "global_step": 122500, "epoch": 1475} {"train_loss": -22.45253562927246, "global_step": 122501, "epoch": 1475} {"train_loss": -22.62281608581543, "global_step": 122502, "epoch": 1475} {"train_loss": -22.62588882446289, "global_step": 122503, "epoch": 1475} {"train_loss": -22.58350944519043, "global_step": 122504, "epoch": 1475} {"train_loss": -22.73103141784668, "global_step": 122505, "epoch": 1475} {"train_loss": -22.764719009399414, "global_step": 122506, "epoch": 1475} {"train_loss": -22.56458843185241, "global_step": 122507, "epoch": 1475, "val_loss": 6084458.5} {"train_loss": -21.374526977539062, "global_step": 122508, "epoch": 1476} {"train_loss": -21.807601928710938, "global_step": 122509, "epoch": 1476} {"train_loss": -22.597322463989258, "global_step": 122510, "epoch": 1476} {"train_loss": -21.995311737060547, "global_step": 122511, "epoch": 1476} {"train_loss": -21.678293228149414, "global_step": 122512, "epoch": 1476} {"train_loss": -22.402183532714844, "global_step": 122513, "epoch": 1476} {"train_loss": -21.92403221130371, "global_step": 122514, "epoch": 1476} {"train_loss": -22.25611686706543, "global_step": 122515, "epoch": 1476} {"train_loss": -21.95079231262207, "global_step": 122516, "epoch": 1476} {"train_loss": -22.160175323486328, "global_step": 122517, "epoch": 1476} {"train_loss": -22.327816009521484, "global_step": 122518, "epoch": 1476} {"train_loss": -21.9130859375, "global_step": 122519, "epoch": 1476} {"train_loss": -22.388029098510742, "global_step": 122520, "epoch": 1476} {"train_loss": -22.055194854736328, "global_step": 122521, "epoch": 1476} {"train_loss": -22.095075607299805, "global_step": 122522, "epoch": 1476} {"train_loss": -22.233957290649414, "global_step": 122523, "epoch": 1476} {"train_loss": -22.450265884399414, "global_step": 122524, "epoch": 1476} {"train_loss": -22.206205368041992, "global_step": 122525, "epoch": 1476} {"train_loss": -22.363296508789062, "global_step": 122526, "epoch": 1476} {"train_loss": -22.46013832092285, "global_step": 122527, "epoch": 1476} {"train_loss": -22.621925354003906, "global_step": 122528, "epoch": 1476} {"train_loss": -22.5323486328125, "global_step": 122529, "epoch": 1476} {"train_loss": -22.599058151245117, "global_step": 122530, "epoch": 1476} {"train_loss": -22.52571678161621, "global_step": 122531, "epoch": 1476} {"train_loss": -22.693471908569336, "global_step": 122532, "epoch": 1476} {"train_loss": -22.809507369995117, "global_step": 122533, "epoch": 1476} {"train_loss": -22.63901710510254, "global_step": 122534, "epoch": 1476} {"train_loss": -22.94254493713379, "global_step": 122535, "epoch": 1476} {"train_loss": -22.700735092163086, "global_step": 122536, "epoch": 1476} {"train_loss": -22.821609497070312, "global_step": 122537, "epoch": 1476} {"train_loss": -22.41428565979004, "global_step": 122538, "epoch": 1476} {"train_loss": -23.164405822753906, "global_step": 122539, "epoch": 1476} {"train_loss": -22.573461532592773, "global_step": 122540, "epoch": 1476} {"train_loss": -22.704931259155273, "global_step": 122541, "epoch": 1476} {"train_loss": -22.805078506469727, "global_step": 122542, "epoch": 1476} {"train_loss": -22.863924026489258, "global_step": 122543, "epoch": 1476} {"train_loss": -22.558242797851562, "global_step": 122544, "epoch": 1476} {"train_loss": -22.76333999633789, "global_step": 122545, "epoch": 1476} {"train_loss": -22.76326560974121, "global_step": 122546, "epoch": 1476} {"train_loss": -22.89992332458496, "global_step": 122547, "epoch": 1476} {"train_loss": -22.824203491210938, "global_step": 122548, "epoch": 1476} {"train_loss": -22.932098388671875, "global_step": 122549, "epoch": 1476} {"train_loss": -22.530088424682617, "global_step": 122550, "epoch": 1476} {"train_loss": -22.758665084838867, "global_step": 122551, "epoch": 1476} {"train_loss": -22.597412109375, "global_step": 122552, "epoch": 1476} {"train_loss": -22.74983787536621, "global_step": 122553, "epoch": 1476} {"train_loss": -22.766767501831055, "global_step": 122554, "epoch": 1476} {"train_loss": -22.421293258666992, "global_step": 122555, "epoch": 1476} {"train_loss": -22.516653060913086, "global_step": 122556, "epoch": 1476} {"train_loss": -22.37302017211914, "global_step": 122557, "epoch": 1476} {"train_loss": -22.673254013061523, "global_step": 122558, "epoch": 1476} {"train_loss": -22.3408145904541, "global_step": 122559, "epoch": 1476} {"train_loss": -22.56634521484375, "global_step": 122560, "epoch": 1476} {"train_loss": -22.697616577148438, "global_step": 122561, "epoch": 1476} {"train_loss": -22.753814697265625, "global_step": 122562, "epoch": 1476} {"train_loss": -22.664840698242188, "global_step": 122563, "epoch": 1476} {"train_loss": -22.605802536010742, "global_step": 122564, "epoch": 1476} {"train_loss": -22.61484146118164, "global_step": 122565, "epoch": 1476} {"train_loss": -22.612733840942383, "global_step": 122566, "epoch": 1476} {"train_loss": -22.386985778808594, "global_step": 122567, "epoch": 1476} {"train_loss": -22.35511589050293, "global_step": 122568, "epoch": 1476} {"train_loss": -22.687076568603516, "global_step": 122569, "epoch": 1476} {"train_loss": -22.68269920349121, "global_step": 122570, "epoch": 1476} {"train_loss": -22.731369018554688, "global_step": 122571, "epoch": 1476} {"train_loss": -22.29514503479004, "global_step": 122572, "epoch": 1476} {"train_loss": -22.581308364868164, "global_step": 122573, "epoch": 1476} {"train_loss": -22.66336441040039, "global_step": 122574, "epoch": 1476} {"train_loss": -23.12796974182129, "global_step": 122575, "epoch": 1476} {"train_loss": -22.466907501220703, "global_step": 122576, "epoch": 1476} {"train_loss": -22.481399536132812, "global_step": 122577, "epoch": 1476} {"train_loss": -22.99583625793457, "global_step": 122578, "epoch": 1476} {"train_loss": -22.868816375732422, "global_step": 122579, "epoch": 1476} {"train_loss": -22.742595672607422, "global_step": 122580, "epoch": 1476} {"train_loss": -22.702991485595703, "global_step": 122581, "epoch": 1476} {"train_loss": -22.543617248535156, "global_step": 122582, "epoch": 1476} {"train_loss": -22.599184036254883, "global_step": 122583, "epoch": 1476} {"train_loss": -22.404939651489258, "global_step": 122584, "epoch": 1476} {"train_loss": -22.364511489868164, "global_step": 122585, "epoch": 1476} {"train_loss": -22.7722225189209, "global_step": 122586, "epoch": 1476} {"train_loss": -22.685640335083008, "global_step": 122587, "epoch": 1476} {"train_loss": -22.70557975769043, "global_step": 122588, "epoch": 1476} {"train_loss": -23.124897003173828, "global_step": 122589, "epoch": 1476} {"train_loss": -22.530928416424487, "global_step": 122590, "epoch": 1476, "val_loss": 6185895.0} {"train_loss": -21.339384078979492, "global_step": 122591, "epoch": 1477} {"train_loss": -21.64764976501465, "global_step": 122592, "epoch": 1477} {"train_loss": -21.64811134338379, "global_step": 122593, "epoch": 1477} {"train_loss": -21.556812286376953, "global_step": 122594, "epoch": 1477} {"train_loss": -21.567852020263672, "global_step": 122595, "epoch": 1477} {"train_loss": -21.620594024658203, "global_step": 122596, "epoch": 1477} {"train_loss": -21.483440399169922, "global_step": 122597, "epoch": 1477} {"train_loss": -22.133825302124023, "global_step": 122598, "epoch": 1477} {"train_loss": -21.729778289794922, "global_step": 122599, "epoch": 1477} {"train_loss": -21.882644653320312, "global_step": 122600, "epoch": 1477} {"train_loss": -22.061492919921875, "global_step": 122601, "epoch": 1477} {"train_loss": -21.843799591064453, "global_step": 122602, "epoch": 1477} {"train_loss": -22.276826858520508, "global_step": 122603, "epoch": 1477} {"train_loss": -22.192214965820312, "global_step": 122604, "epoch": 1477} {"train_loss": -22.231386184692383, "global_step": 122605, "epoch": 1477} {"train_loss": -22.088029861450195, "global_step": 122606, "epoch": 1477} {"train_loss": -22.047758102416992, "global_step": 122607, "epoch": 1477} {"train_loss": -22.00499725341797, "global_step": 122608, "epoch": 1477} {"train_loss": -22.63558006286621, "global_step": 122609, "epoch": 1477} {"train_loss": -22.44573402404785, "global_step": 122610, "epoch": 1477} {"train_loss": -22.382301330566406, "global_step": 122611, "epoch": 1477} {"train_loss": -22.483367919921875, "global_step": 122612, "epoch": 1477} {"train_loss": -22.53934669494629, "global_step": 122613, "epoch": 1477} {"train_loss": -22.31031608581543, "global_step": 122614, "epoch": 1477} {"train_loss": -22.330236434936523, "global_step": 122615, "epoch": 1477} {"train_loss": -22.41790771484375, "global_step": 122616, "epoch": 1477} {"train_loss": -22.330406188964844, "global_step": 122617, "epoch": 1477} {"train_loss": -22.278839111328125, "global_step": 122618, "epoch": 1477} {"train_loss": -22.544208526611328, "global_step": 122619, "epoch": 1477} {"train_loss": -22.898500442504883, "global_step": 122620, "epoch": 1477} {"train_loss": -22.609039306640625, "global_step": 122621, "epoch": 1477} {"train_loss": -22.90752601623535, "global_step": 122622, "epoch": 1477} {"train_loss": -22.930051803588867, "global_step": 122623, "epoch": 1477} {"train_loss": -22.896074295043945, "global_step": 122624, "epoch": 1477} {"train_loss": -22.668359756469727, "global_step": 122625, "epoch": 1477} {"train_loss": -22.428287506103516, "global_step": 122626, "epoch": 1477} {"train_loss": -22.399648666381836, "global_step": 122627, "epoch": 1477} {"train_loss": -22.588476181030273, "global_step": 122628, "epoch": 1477} {"train_loss": -22.59316635131836, "global_step": 122629, "epoch": 1477} {"train_loss": -22.738414764404297, "global_step": 122630, "epoch": 1477} {"train_loss": -22.501096725463867, "global_step": 122631, "epoch": 1477} {"train_loss": -22.56778907775879, "global_step": 122632, "epoch": 1477} {"train_loss": -22.229536056518555, "global_step": 122633, "epoch": 1477} {"train_loss": -22.677942276000977, "global_step": 122634, "epoch": 1477} {"train_loss": -22.727802276611328, "global_step": 122635, "epoch": 1477} {"train_loss": -22.80803108215332, "global_step": 122636, "epoch": 1477} {"train_loss": -22.40439796447754, "global_step": 122637, "epoch": 1477} {"train_loss": -22.579904556274414, "global_step": 122638, "epoch": 1477} {"train_loss": -22.506275177001953, "global_step": 122639, "epoch": 1477} {"train_loss": -22.056461334228516, "global_step": 122640, "epoch": 1477} {"train_loss": -22.019683837890625, "global_step": 122641, "epoch": 1477} {"train_loss": -22.57337760925293, "global_step": 122642, "epoch": 1477} {"train_loss": -22.657873153686523, "global_step": 122643, "epoch": 1477} {"train_loss": -22.993473052978516, "global_step": 122644, "epoch": 1477} {"train_loss": -22.718463897705078, "global_step": 122645, "epoch": 1477} {"train_loss": -22.145917892456055, "global_step": 122646, "epoch": 1477} {"train_loss": -22.563926696777344, "global_step": 122647, "epoch": 1477} {"train_loss": -21.92169189453125, "global_step": 122648, "epoch": 1477} {"train_loss": -22.698598861694336, "global_step": 122649, "epoch": 1477} {"train_loss": -22.720237731933594, "global_step": 122650, "epoch": 1477} {"train_loss": -22.146879196166992, "global_step": 122651, "epoch": 1477} {"train_loss": -22.608572006225586, "global_step": 122652, "epoch": 1477} {"train_loss": -22.586856842041016, "global_step": 122653, "epoch": 1477} {"train_loss": -22.659378051757812, "global_step": 122654, "epoch": 1477} {"train_loss": -22.148578643798828, "global_step": 122655, "epoch": 1477} {"train_loss": -22.475921630859375, "global_step": 122656, "epoch": 1477} {"train_loss": -22.515161514282227, "global_step": 122657, "epoch": 1477} {"train_loss": -22.668323516845703, "global_step": 122658, "epoch": 1477} {"train_loss": -22.508974075317383, "global_step": 122659, "epoch": 1477} {"train_loss": -22.552377700805664, "global_step": 122660, "epoch": 1477} {"train_loss": -22.806987762451172, "global_step": 122661, "epoch": 1477} {"train_loss": -22.320974349975586, "global_step": 122662, "epoch": 1477} {"train_loss": -22.68526268005371, "global_step": 122663, "epoch": 1477} {"train_loss": -22.851110458374023, "global_step": 122664, "epoch": 1477} {"train_loss": -22.351314544677734, "global_step": 122665, "epoch": 1477} {"train_loss": -22.360008239746094, "global_step": 122666, "epoch": 1477} {"train_loss": -22.47562026977539, "global_step": 122667, "epoch": 1477} {"train_loss": -22.52113914489746, "global_step": 122668, "epoch": 1477} {"train_loss": -22.550827026367188, "global_step": 122669, "epoch": 1477} {"train_loss": -22.664306640625, "global_step": 122670, "epoch": 1477} {"train_loss": -22.624502182006836, "global_step": 122671, "epoch": 1477} {"train_loss": -22.935535430908203, "global_step": 122672, "epoch": 1477} {"train_loss": -22.39210353989199, "global_step": 122673, "epoch": 1477, "val_loss": 6312871.0} {"train_loss": -21.918371200561523, "global_step": 122674, "epoch": 1478} {"train_loss": -22.130992889404297, "global_step": 122675, "epoch": 1478} {"train_loss": -22.018457412719727, "global_step": 122676, "epoch": 1478} {"train_loss": -22.402603149414062, "global_step": 122677, "epoch": 1478} {"train_loss": -22.149351119995117, "global_step": 122678, "epoch": 1478} {"train_loss": -21.87851905822754, "global_step": 122679, "epoch": 1478} {"train_loss": -22.150869369506836, "global_step": 122680, "epoch": 1478} {"train_loss": -22.253040313720703, "global_step": 122681, "epoch": 1478} {"train_loss": -22.083087921142578, "global_step": 122682, "epoch": 1478} {"train_loss": -22.23288917541504, "global_step": 122683, "epoch": 1478} {"train_loss": -22.370346069335938, "global_step": 122684, "epoch": 1478} {"train_loss": -22.279491424560547, "global_step": 122685, "epoch": 1478} {"train_loss": -22.386470794677734, "global_step": 122686, "epoch": 1478} {"train_loss": -22.499406814575195, "global_step": 122687, "epoch": 1478} {"train_loss": -22.432514190673828, "global_step": 122688, "epoch": 1478} {"train_loss": -22.13970947265625, "global_step": 122689, "epoch": 1478} {"train_loss": -22.56461524963379, "global_step": 122690, "epoch": 1478} {"train_loss": -22.581960678100586, "global_step": 122691, "epoch": 1478} {"train_loss": -22.39047622680664, "global_step": 122692, "epoch": 1478} {"train_loss": -22.49492645263672, "global_step": 122693, "epoch": 1478} {"train_loss": -22.303678512573242, "global_step": 122694, "epoch": 1478} {"train_loss": -22.47927474975586, "global_step": 122695, "epoch": 1478} {"train_loss": -22.251340866088867, "global_step": 122696, "epoch": 1478} {"train_loss": -22.73301124572754, "global_step": 122697, "epoch": 1478} {"train_loss": -22.680252075195312, "global_step": 122698, "epoch": 1478} {"train_loss": -22.058025360107422, "global_step": 122699, "epoch": 1478} {"train_loss": -22.224061965942383, "global_step": 122700, "epoch": 1478} {"train_loss": -22.479185104370117, "global_step": 122701, "epoch": 1478} {"train_loss": -22.50665283203125, "global_step": 122702, "epoch": 1478} {"train_loss": -22.670501708984375, "global_step": 122703, "epoch": 1478} {"train_loss": -22.703977584838867, "global_step": 122704, "epoch": 1478} {"train_loss": -22.42531967163086, "global_step": 122705, "epoch": 1478} {"train_loss": -22.64875602722168, "global_step": 122706, "epoch": 1478} {"train_loss": -22.348445892333984, "global_step": 122707, "epoch": 1478} {"train_loss": -22.578441619873047, "global_step": 122708, "epoch": 1478} {"train_loss": -22.58220100402832, "global_step": 122709, "epoch": 1478} {"train_loss": -22.637659072875977, "global_step": 122710, "epoch": 1478} {"train_loss": -22.745641708374023, "global_step": 122711, "epoch": 1478} {"train_loss": -22.582204818725586, "global_step": 122712, "epoch": 1478} {"train_loss": -22.549734115600586, "global_step": 122713, "epoch": 1478} {"train_loss": -22.40900993347168, "global_step": 122714, "epoch": 1478} {"train_loss": -22.769500732421875, "global_step": 122715, "epoch": 1478} {"train_loss": -22.055133819580078, "global_step": 122716, "epoch": 1478} {"train_loss": -23.00340461730957, "global_step": 122717, "epoch": 1478} {"train_loss": -22.568185806274414, "global_step": 122718, "epoch": 1478} {"train_loss": -22.220685958862305, "global_step": 122719, "epoch": 1478} {"train_loss": -22.48309326171875, "global_step": 122720, "epoch": 1478} {"train_loss": -22.23675537109375, "global_step": 122721, "epoch": 1478} {"train_loss": -22.818195343017578, "global_step": 122722, "epoch": 1478} {"train_loss": -22.95370864868164, "global_step": 122723, "epoch": 1478} {"train_loss": -22.6303653717041, "global_step": 122724, "epoch": 1478} {"train_loss": -22.563634872436523, "global_step": 122725, "epoch": 1478} {"train_loss": -22.266965866088867, "global_step": 122726, "epoch": 1478} {"train_loss": -22.92879295349121, "global_step": 122727, "epoch": 1478} {"train_loss": -22.710180282592773, "global_step": 122728, "epoch": 1478} {"train_loss": -22.71286964416504, "global_step": 122729, "epoch": 1478} {"train_loss": -22.6790771484375, "global_step": 122730, "epoch": 1478} {"train_loss": -22.328580856323242, "global_step": 122731, "epoch": 1478} {"train_loss": -22.56513023376465, "global_step": 122732, "epoch": 1478} {"train_loss": -22.75968360900879, "global_step": 122733, "epoch": 1478} {"train_loss": -22.609411239624023, "global_step": 122734, "epoch": 1478} {"train_loss": -22.60468101501465, "global_step": 122735, "epoch": 1478} {"train_loss": -22.64044952392578, "global_step": 122736, "epoch": 1478} {"train_loss": -22.776533126831055, "global_step": 122737, "epoch": 1478} {"train_loss": -22.818037033081055, "global_step": 122738, "epoch": 1478} {"train_loss": -22.55512046813965, "global_step": 122739, "epoch": 1478} {"train_loss": -22.24268341064453, "global_step": 122740, "epoch": 1478} {"train_loss": -22.792987823486328, "global_step": 122741, "epoch": 1478} {"train_loss": -22.498960494995117, "global_step": 122742, "epoch": 1478} {"train_loss": -22.726898193359375, "global_step": 122743, "epoch": 1478} {"train_loss": -22.634004592895508, "global_step": 122744, "epoch": 1478} {"train_loss": -22.431095123291016, "global_step": 122745, "epoch": 1478} {"train_loss": -22.47342872619629, "global_step": 122746, "epoch": 1478} {"train_loss": -22.80647850036621, "global_step": 122747, "epoch": 1478} {"train_loss": -22.637540817260742, "global_step": 122748, "epoch": 1478} {"train_loss": -23.0566349029541, "global_step": 122749, "epoch": 1478} {"train_loss": -22.646839141845703, "global_step": 122750, "epoch": 1478} {"train_loss": -22.5296573638916, "global_step": 122751, "epoch": 1478} {"train_loss": -22.842069625854492, "global_step": 122752, "epoch": 1478} {"train_loss": -22.833633422851562, "global_step": 122753, "epoch": 1478} {"train_loss": -22.925195693969727, "global_step": 122754, "epoch": 1478} {"train_loss": -22.56546401977539, "global_step": 122755, "epoch": 1478} {"train_loss": -22.510169362447346, "global_step": 122756, "epoch": 1478, "val_loss": 6214327.0} {"train_loss": -22.63136100769043, "global_step": 122757, "epoch": 1479} {"train_loss": -21.67059898376465, "global_step": 122758, "epoch": 1479} {"train_loss": -21.755075454711914, "global_step": 122759, "epoch": 1479} {"train_loss": -22.130109786987305, "global_step": 122760, "epoch": 1479} {"train_loss": -22.326602935791016, "global_step": 122761, "epoch": 1479} {"train_loss": -22.008085250854492, "global_step": 122762, "epoch": 1479} {"train_loss": -22.091596603393555, "global_step": 122763, "epoch": 1479} {"train_loss": -22.60055923461914, "global_step": 122764, "epoch": 1479} {"train_loss": -21.873037338256836, "global_step": 122765, "epoch": 1479} {"train_loss": -22.300508499145508, "global_step": 122766, "epoch": 1479} {"train_loss": -22.123666763305664, "global_step": 122767, "epoch": 1479} {"train_loss": -22.15618324279785, "global_step": 122768, "epoch": 1479} {"train_loss": -22.115598678588867, "global_step": 122769, "epoch": 1479} {"train_loss": -22.074888229370117, "global_step": 122770, "epoch": 1479} {"train_loss": -22.322019577026367, "global_step": 122771, "epoch": 1479} {"train_loss": -22.420103073120117, "global_step": 122772, "epoch": 1479} {"train_loss": -22.339574813842773, "global_step": 122773, "epoch": 1479} {"train_loss": -22.461925506591797, "global_step": 122774, "epoch": 1479} {"train_loss": -22.312665939331055, "global_step": 122775, "epoch": 1479} {"train_loss": -22.32407569885254, "global_step": 122776, "epoch": 1479} {"train_loss": -22.202932357788086, "global_step": 122777, "epoch": 1479} {"train_loss": -22.307228088378906, "global_step": 122778, "epoch": 1479} {"train_loss": -22.532379150390625, "global_step": 122779, "epoch": 1479} {"train_loss": -22.474699020385742, "global_step": 122780, "epoch": 1479} {"train_loss": -23.031558990478516, "global_step": 122781, "epoch": 1479} {"train_loss": -22.33680534362793, "global_step": 122782, "epoch": 1479} {"train_loss": -22.41916847229004, "global_step": 122783, "epoch": 1479} {"train_loss": -22.52705955505371, "global_step": 122784, "epoch": 1479} {"train_loss": -22.638975143432617, "global_step": 122785, "epoch": 1479} {"train_loss": -22.57249641418457, "global_step": 122786, "epoch": 1479} {"train_loss": -22.19721794128418, "global_step": 122787, "epoch": 1479} {"train_loss": -22.309986114501953, "global_step": 122788, "epoch": 1479} {"train_loss": -22.659839630126953, "global_step": 122789, "epoch": 1479} {"train_loss": -22.616147994995117, "global_step": 122790, "epoch": 1479} {"train_loss": -22.617109298706055, "global_step": 122791, "epoch": 1479} {"train_loss": -22.97222900390625, "global_step": 122792, "epoch": 1479} {"train_loss": -22.666248321533203, "global_step": 122793, "epoch": 1479} {"train_loss": -22.882217407226562, "global_step": 122794, "epoch": 1479} {"train_loss": -22.576248168945312, "global_step": 122795, "epoch": 1479} {"train_loss": -22.82582664489746, "global_step": 122796, "epoch": 1479} {"train_loss": -22.54636001586914, "global_step": 122797, "epoch": 1479} {"train_loss": -22.734296798706055, "global_step": 122798, "epoch": 1479} {"train_loss": -22.496923446655273, "global_step": 122799, "epoch": 1479} {"train_loss": -22.57663917541504, "global_step": 122800, "epoch": 1479} {"train_loss": -22.611658096313477, "global_step": 122801, "epoch": 1479} {"train_loss": -22.54493522644043, "global_step": 122802, "epoch": 1479} {"train_loss": -22.529447555541992, "global_step": 122803, "epoch": 1479} {"train_loss": -22.77791404724121, "global_step": 122804, "epoch": 1479} {"train_loss": -22.920507431030273, "global_step": 122805, "epoch": 1479} {"train_loss": -22.322980880737305, "global_step": 122806, "epoch": 1479} {"train_loss": -22.863061904907227, "global_step": 122807, "epoch": 1479} {"train_loss": -22.681259155273438, "global_step": 122808, "epoch": 1479} {"train_loss": -22.660409927368164, "global_step": 122809, "epoch": 1479} {"train_loss": -22.61960220336914, "global_step": 122810, "epoch": 1479} {"train_loss": -22.865234375, "global_step": 122811, "epoch": 1479} {"train_loss": -22.5849666595459, "global_step": 122812, "epoch": 1479} {"train_loss": -22.802579879760742, "global_step": 122813, "epoch": 1479} {"train_loss": -23.00554656982422, "global_step": 122814, "epoch": 1479} {"train_loss": -22.65102195739746, "global_step": 122815, "epoch": 1479} {"train_loss": -22.645658493041992, "global_step": 122816, "epoch": 1479} {"train_loss": -22.53565216064453, "global_step": 122817, "epoch": 1479} {"train_loss": -22.743255615234375, "global_step": 122818, "epoch": 1479} {"train_loss": -22.32538414001465, "global_step": 122819, "epoch": 1479} {"train_loss": -21.8969783782959, "global_step": 122820, "epoch": 1479} {"train_loss": -22.54798698425293, "global_step": 122821, "epoch": 1479} {"train_loss": -22.134990692138672, "global_step": 122822, "epoch": 1479} {"train_loss": -22.555419921875, "global_step": 122823, "epoch": 1479} {"train_loss": -22.469640731811523, "global_step": 122824, "epoch": 1479} {"train_loss": -22.718374252319336, "global_step": 122825, "epoch": 1479} {"train_loss": -22.824167251586914, "global_step": 122826, "epoch": 1479} {"train_loss": -22.67618179321289, "global_step": 122827, "epoch": 1479} {"train_loss": -22.895055770874023, "global_step": 122828, "epoch": 1479} {"train_loss": -22.605527877807617, "global_step": 122829, "epoch": 1479} {"train_loss": -22.720712661743164, "global_step": 122830, "epoch": 1479} {"train_loss": -22.64800262451172, "global_step": 122831, "epoch": 1479} {"train_loss": -22.977293014526367, "global_step": 122832, "epoch": 1479} {"train_loss": -22.564565658569336, "global_step": 122833, "epoch": 1479} {"train_loss": -22.661603927612305, "global_step": 122834, "epoch": 1479} {"train_loss": -23.11737060546875, "global_step": 122835, "epoch": 1479} {"train_loss": -22.804121017456055, "global_step": 122836, "epoch": 1479} {"train_loss": -22.520505905151367, "global_step": 122837, "epoch": 1479} {"train_loss": -22.876028060913086, "global_step": 122838, "epoch": 1479} {"train_loss": -22.51658947496529, "global_step": 122839, "epoch": 1479, "val_loss": 6302383.0} {"train_loss": -21.67841148376465, "global_step": 122840, "epoch": 1480} {"train_loss": -22.279193878173828, "global_step": 122841, "epoch": 1480} {"train_loss": -22.501863479614258, "global_step": 122842, "epoch": 1480} {"train_loss": -22.3836612701416, "global_step": 122843, "epoch": 1480} {"train_loss": -22.573177337646484, "global_step": 122844, "epoch": 1480} {"train_loss": -22.270872116088867, "global_step": 122845, "epoch": 1480} {"train_loss": -22.443525314331055, "global_step": 122846, "epoch": 1480} {"train_loss": -22.201480865478516, "global_step": 122847, "epoch": 1480} {"train_loss": -22.739646911621094, "global_step": 122848, "epoch": 1480} {"train_loss": -22.59920310974121, "global_step": 122849, "epoch": 1480} {"train_loss": -22.276535034179688, "global_step": 122850, "epoch": 1480} {"train_loss": -22.86720848083496, "global_step": 122851, "epoch": 1480} {"train_loss": -22.172266006469727, "global_step": 122852, "epoch": 1480} {"train_loss": -22.293514251708984, "global_step": 122853, "epoch": 1480} {"train_loss": -22.361501693725586, "global_step": 122854, "epoch": 1480} {"train_loss": -22.40956687927246, "global_step": 122855, "epoch": 1480} {"train_loss": -22.463998794555664, "global_step": 122856, "epoch": 1480} {"train_loss": -22.79578971862793, "global_step": 122857, "epoch": 1480} {"train_loss": -22.213760375976562, "global_step": 122858, "epoch": 1480} {"train_loss": -22.593515396118164, "global_step": 122859, "epoch": 1480} {"train_loss": -22.481887817382812, "global_step": 122860, "epoch": 1480} {"train_loss": -22.616857528686523, "global_step": 122861, "epoch": 1480} {"train_loss": -22.581878662109375, "global_step": 122862, "epoch": 1480} {"train_loss": -22.271900177001953, "global_step": 122863, "epoch": 1480} {"train_loss": -22.591033935546875, "global_step": 122864, "epoch": 1480} {"train_loss": -22.524831771850586, "global_step": 122865, "epoch": 1480} {"train_loss": -22.877504348754883, "global_step": 122866, "epoch": 1480} {"train_loss": -22.202295303344727, "global_step": 122867, "epoch": 1480} {"train_loss": -22.49860954284668, "global_step": 122868, "epoch": 1480} {"train_loss": -22.696086883544922, "global_step": 122869, "epoch": 1480} {"train_loss": -22.861482620239258, "global_step": 122870, "epoch": 1480} {"train_loss": -22.418319702148438, "global_step": 122871, "epoch": 1480} {"train_loss": -22.72723960876465, "global_step": 122872, "epoch": 1480} {"train_loss": -22.551023483276367, "global_step": 122873, "epoch": 1480} {"train_loss": -22.738433837890625, "global_step": 122874, "epoch": 1480} {"train_loss": -22.767866134643555, "global_step": 122875, "epoch": 1480} {"train_loss": -22.791698455810547, "global_step": 122876, "epoch": 1480} {"train_loss": -22.399503707885742, "global_step": 122877, "epoch": 1480} {"train_loss": -22.59039306640625, "global_step": 122878, "epoch": 1480} {"train_loss": -23.042673110961914, "global_step": 122879, "epoch": 1480} {"train_loss": -22.67949867248535, "global_step": 122880, "epoch": 1480} {"train_loss": -22.64322280883789, "global_step": 122881, "epoch": 1480} {"train_loss": -22.645645141601562, "global_step": 122882, "epoch": 1480} {"train_loss": -22.431612014770508, "global_step": 122883, "epoch": 1480} {"train_loss": -22.818498611450195, "global_step": 122884, "epoch": 1480} {"train_loss": -22.418676376342773, "global_step": 122885, "epoch": 1480} {"train_loss": -22.605260848999023, "global_step": 122886, "epoch": 1480} {"train_loss": -22.652040481567383, "global_step": 122887, "epoch": 1480} {"train_loss": -22.508481979370117, "global_step": 122888, "epoch": 1480} {"train_loss": -22.490835189819336, "global_step": 122889, "epoch": 1480} {"train_loss": -22.830265045166016, "global_step": 122890, "epoch": 1480} {"train_loss": -22.28896141052246, "global_step": 122891, "epoch": 1480} {"train_loss": -22.634319305419922, "global_step": 122892, "epoch": 1480} {"train_loss": -22.764163970947266, "global_step": 122893, "epoch": 1480} {"train_loss": -22.57410430908203, "global_step": 122894, "epoch": 1480} {"train_loss": -22.83439826965332, "global_step": 122895, "epoch": 1480} {"train_loss": -22.582075119018555, "global_step": 122896, "epoch": 1480} {"train_loss": -22.2740535736084, "global_step": 122897, "epoch": 1480} {"train_loss": -22.82753562927246, "global_step": 122898, "epoch": 1480} {"train_loss": -22.67612075805664, "global_step": 122899, "epoch": 1480} {"train_loss": -22.676979064941406, "global_step": 122900, "epoch": 1480} {"train_loss": -22.574684143066406, "global_step": 122901, "epoch": 1480} {"train_loss": -22.60235023498535, "global_step": 122902, "epoch": 1480} {"train_loss": -22.867961883544922, "global_step": 122903, "epoch": 1480} {"train_loss": -22.625852584838867, "global_step": 122904, "epoch": 1480} {"train_loss": -22.79408073425293, "global_step": 122905, "epoch": 1480} {"train_loss": -22.61045265197754, "global_step": 122906, "epoch": 1480} {"train_loss": -22.66705894470215, "global_step": 122907, "epoch": 1480} {"train_loss": -22.414670944213867, "global_step": 122908, "epoch": 1480} {"train_loss": -22.902252197265625, "global_step": 122909, "epoch": 1480} {"train_loss": -22.268781661987305, "global_step": 122910, "epoch": 1480} {"train_loss": -22.082761764526367, "global_step": 122911, "epoch": 1480} {"train_loss": -22.700992584228516, "global_step": 122912, "epoch": 1480} {"train_loss": -22.984615325927734, "global_step": 122913, "epoch": 1480} {"train_loss": -22.620712280273438, "global_step": 122914, "epoch": 1480} {"train_loss": -22.575881958007812, "global_step": 122915, "epoch": 1480} {"train_loss": -22.58907127380371, "global_step": 122916, "epoch": 1480} {"train_loss": -22.40187644958496, "global_step": 122917, "epoch": 1480} {"train_loss": -22.71773338317871, "global_step": 122918, "epoch": 1480} {"train_loss": -22.83540153503418, "global_step": 122919, "epoch": 1480} {"train_loss": -22.954975128173828, "global_step": 122920, "epoch": 1480} {"train_loss": -22.830564498901367, "global_step": 122921, "epoch": 1480} {"train_loss": -22.566546612475292, "global_step": 122922, "epoch": 1480, "val_loss": 6159849.5} {"train_loss": -22.41969871520996, "global_step": 122923, "epoch": 1481} {"train_loss": -22.69221305847168, "global_step": 122924, "epoch": 1481} {"train_loss": -22.42595863342285, "global_step": 122925, "epoch": 1481} {"train_loss": -22.3560791015625, "global_step": 122926, "epoch": 1481} {"train_loss": -22.258426666259766, "global_step": 122927, "epoch": 1481} {"train_loss": -22.118175506591797, "global_step": 122928, "epoch": 1481} {"train_loss": -22.42237663269043, "global_step": 122929, "epoch": 1481} {"train_loss": -22.592161178588867, "global_step": 122930, "epoch": 1481} {"train_loss": -22.91593360900879, "global_step": 122931, "epoch": 1481} {"train_loss": -22.600013732910156, "global_step": 122932, "epoch": 1481} {"train_loss": -22.598791122436523, "global_step": 122933, "epoch": 1481} {"train_loss": -22.34685707092285, "global_step": 122934, "epoch": 1481} {"train_loss": -22.28133773803711, "global_step": 122935, "epoch": 1481} {"train_loss": -22.507532119750977, "global_step": 122936, "epoch": 1481} {"train_loss": -22.602094650268555, "global_step": 122937, "epoch": 1481} {"train_loss": -22.53517723083496, "global_step": 122938, "epoch": 1481} {"train_loss": -22.457111358642578, "global_step": 122939, "epoch": 1481} {"train_loss": -22.149269104003906, "global_step": 122940, "epoch": 1481} {"train_loss": -22.66022491455078, "global_step": 122941, "epoch": 1481} {"train_loss": -22.283615112304688, "global_step": 122942, "epoch": 1481} {"train_loss": -22.35285758972168, "global_step": 122943, "epoch": 1481} {"train_loss": -22.75160026550293, "global_step": 122944, "epoch": 1481} {"train_loss": -22.365392684936523, "global_step": 122945, "epoch": 1481} {"train_loss": -22.26247215270996, "global_step": 122946, "epoch": 1481} {"train_loss": -22.39283561706543, "global_step": 122947, "epoch": 1481} {"train_loss": -22.674182891845703, "global_step": 122948, "epoch": 1481} {"train_loss": -23.264183044433594, "global_step": 122949, "epoch": 1481} {"train_loss": -22.551374435424805, "global_step": 122950, "epoch": 1481} {"train_loss": -22.426376342773438, "global_step": 122951, "epoch": 1481} {"train_loss": -22.518096923828125, "global_step": 122952, "epoch": 1481} {"train_loss": -22.383848190307617, "global_step": 122953, "epoch": 1481} {"train_loss": -22.72517967224121, "global_step": 122954, "epoch": 1481} {"train_loss": -22.789762496948242, "global_step": 122955, "epoch": 1481} {"train_loss": -22.593505859375, "global_step": 122956, "epoch": 1481} {"train_loss": -22.753570556640625, "global_step": 122957, "epoch": 1481} {"train_loss": -22.76142692565918, "global_step": 122958, "epoch": 1481} {"train_loss": -22.70442008972168, "global_step": 122959, "epoch": 1481} {"train_loss": -22.816926956176758, "global_step": 122960, "epoch": 1481} {"train_loss": -22.688844680786133, "global_step": 122961, "epoch": 1481} {"train_loss": -22.624990463256836, "global_step": 122962, "epoch": 1481} {"train_loss": -22.806474685668945, "global_step": 122963, "epoch": 1481} {"train_loss": -22.615102767944336, "global_step": 122964, "epoch": 1481} {"train_loss": -22.90435218811035, "global_step": 122965, "epoch": 1481} {"train_loss": -22.54315757751465, "global_step": 122966, "epoch": 1481} {"train_loss": -22.556730270385742, "global_step": 122967, "epoch": 1481} {"train_loss": -22.69866943359375, "global_step": 122968, "epoch": 1481} {"train_loss": -22.3842716217041, "global_step": 122969, "epoch": 1481} {"train_loss": -22.64717674255371, "global_step": 122970, "epoch": 1481} {"train_loss": -22.554555892944336, "global_step": 122971, "epoch": 1481} {"train_loss": -22.699934005737305, "global_step": 122972, "epoch": 1481} {"train_loss": -22.43061637878418, "global_step": 122973, "epoch": 1481} {"train_loss": -22.151723861694336, "global_step": 122974, "epoch": 1481} {"train_loss": -22.806467056274414, "global_step": 122975, "epoch": 1481} {"train_loss": -22.90945816040039, "global_step": 122976, "epoch": 1481} {"train_loss": -22.282684326171875, "global_step": 122977, "epoch": 1481} {"train_loss": -22.42707633972168, "global_step": 122978, "epoch": 1481} {"train_loss": -22.41399574279785, "global_step": 122979, "epoch": 1481} {"train_loss": -22.48809242248535, "global_step": 122980, "epoch": 1481} {"train_loss": -22.61878776550293, "global_step": 122981, "epoch": 1481} {"train_loss": -22.51032257080078, "global_step": 122982, "epoch": 1481} {"train_loss": -22.480497360229492, "global_step": 122983, "epoch": 1481} {"train_loss": -22.301374435424805, "global_step": 122984, "epoch": 1481} {"train_loss": -22.567834854125977, "global_step": 122985, "epoch": 1481} {"train_loss": -22.586698532104492, "global_step": 122986, "epoch": 1481} {"train_loss": -22.568321228027344, "global_step": 122987, "epoch": 1481} {"train_loss": -22.417871475219727, "global_step": 122988, "epoch": 1481} {"train_loss": -22.441097259521484, "global_step": 122989, "epoch": 1481} {"train_loss": -22.642362594604492, "global_step": 122990, "epoch": 1481} {"train_loss": -22.77387046813965, "global_step": 122991, "epoch": 1481} {"train_loss": -22.533432006835938, "global_step": 122992, "epoch": 1481} {"train_loss": -22.639047622680664, "global_step": 122993, "epoch": 1481} {"train_loss": -23.046911239624023, "global_step": 122994, "epoch": 1481} {"train_loss": -22.639379501342773, "global_step": 122995, "epoch": 1481} {"train_loss": -22.645715713500977, "global_step": 122996, "epoch": 1481} {"train_loss": -22.56043815612793, "global_step": 122997, "epoch": 1481} {"train_loss": -22.441823959350586, "global_step": 122998, "epoch": 1481} {"train_loss": -22.64973258972168, "global_step": 122999, "epoch": 1481} {"train_loss": -22.654905319213867, "global_step": 123000, "epoch": 1481} {"train_loss": -22.65761375427246, "global_step": 123001, "epoch": 1481} {"train_loss": -22.805288314819336, "global_step": 123002, "epoch": 1481} {"train_loss": -22.586191177368164, "global_step": 123003, "epoch": 1481} {"train_loss": -22.621675491333008, "global_step": 123004, "epoch": 1481} {"train_loss": -22.5638536660068, "global_step": 123005, "epoch": 1481, "val_loss": 6202717.0} {"train_loss": -21.947080612182617, "global_step": 123006, "epoch": 1482} {"train_loss": -22.4796142578125, "global_step": 123007, "epoch": 1482} {"train_loss": -22.687925338745117, "global_step": 123008, "epoch": 1482} {"train_loss": -22.53664207458496, "global_step": 123009, "epoch": 1482} {"train_loss": -22.852441787719727, "global_step": 123010, "epoch": 1482} {"train_loss": -22.27522850036621, "global_step": 123011, "epoch": 1482} {"train_loss": -22.550718307495117, "global_step": 123012, "epoch": 1482} {"train_loss": -22.692747116088867, "global_step": 123013, "epoch": 1482} {"train_loss": -22.54276466369629, "global_step": 123014, "epoch": 1482} {"train_loss": -22.290571212768555, "global_step": 123015, "epoch": 1482} {"train_loss": -22.52769660949707, "global_step": 123016, "epoch": 1482} {"train_loss": -22.540191650390625, "global_step": 123017, "epoch": 1482} {"train_loss": -22.538955688476562, "global_step": 123018, "epoch": 1482} {"train_loss": -22.28630828857422, "global_step": 123019, "epoch": 1482} {"train_loss": -22.865102767944336, "global_step": 123020, "epoch": 1482} {"train_loss": -22.2156925201416, "global_step": 123021, "epoch": 1482} {"train_loss": -22.4215030670166, "global_step": 123022, "epoch": 1482} {"train_loss": -22.430112838745117, "global_step": 123023, "epoch": 1482} {"train_loss": -22.36431884765625, "global_step": 123024, "epoch": 1482} {"train_loss": -22.469945907592773, "global_step": 123025, "epoch": 1482} {"train_loss": -22.58406639099121, "global_step": 123026, "epoch": 1482} {"train_loss": -22.536441802978516, "global_step": 123027, "epoch": 1482} {"train_loss": -22.62613868713379, "global_step": 123028, "epoch": 1482} {"train_loss": -22.564542770385742, "global_step": 123029, "epoch": 1482} {"train_loss": -22.697641372680664, "global_step": 123030, "epoch": 1482} {"train_loss": -22.52329444885254, "global_step": 123031, "epoch": 1482} {"train_loss": -22.570178985595703, "global_step": 123032, "epoch": 1482} {"train_loss": -22.363248825073242, "global_step": 123033, "epoch": 1482} {"train_loss": -22.534395217895508, "global_step": 123034, "epoch": 1482} {"train_loss": -22.417654037475586, "global_step": 123035, "epoch": 1482} {"train_loss": -22.9229736328125, "global_step": 123036, "epoch": 1482} {"train_loss": -22.93704605102539, "global_step": 123037, "epoch": 1482} {"train_loss": -22.824209213256836, "global_step": 123038, "epoch": 1482} {"train_loss": -22.665145874023438, "global_step": 123039, "epoch": 1482} {"train_loss": -22.907167434692383, "global_step": 123040, "epoch": 1482} {"train_loss": -22.6522216796875, "global_step": 123041, "epoch": 1482} {"train_loss": -22.68625259399414, "global_step": 123042, "epoch": 1482} {"train_loss": -22.684295654296875, "global_step": 123043, "epoch": 1482} {"train_loss": -22.617368698120117, "global_step": 123044, "epoch": 1482} {"train_loss": -22.54483413696289, "global_step": 123045, "epoch": 1482} {"train_loss": -22.851613998413086, "global_step": 123046, "epoch": 1482} {"train_loss": -22.928516387939453, "global_step": 123047, "epoch": 1482} {"train_loss": -22.62567710876465, "global_step": 123048, "epoch": 1482} {"train_loss": -22.234601974487305, "global_step": 123049, "epoch": 1482} {"train_loss": -22.42337417602539, "global_step": 123050, "epoch": 1482} {"train_loss": -22.72504997253418, "global_step": 123051, "epoch": 1482} {"train_loss": -22.18754005432129, "global_step": 123052, "epoch": 1482} {"train_loss": -22.701932907104492, "global_step": 123053, "epoch": 1482} {"train_loss": -22.476606369018555, "global_step": 123054, "epoch": 1482} {"train_loss": -22.577072143554688, "global_step": 123055, "epoch": 1482} {"train_loss": -22.562803268432617, "global_step": 123056, "epoch": 1482} {"train_loss": -22.56678009033203, "global_step": 123057, "epoch": 1482} {"train_loss": -22.305044174194336, "global_step": 123058, "epoch": 1482} {"train_loss": -22.51730728149414, "global_step": 123059, "epoch": 1482} {"train_loss": -22.019315719604492, "global_step": 123060, "epoch": 1482} {"train_loss": -22.3625545501709, "global_step": 123061, "epoch": 1482} {"train_loss": -22.181396484375, "global_step": 123062, "epoch": 1482} {"train_loss": -22.566234588623047, "global_step": 123063, "epoch": 1482} {"train_loss": -22.408832550048828, "global_step": 123064, "epoch": 1482} {"train_loss": -22.489288330078125, "global_step": 123065, "epoch": 1482} {"train_loss": -22.221216201782227, "global_step": 123066, "epoch": 1482} {"train_loss": -22.470535278320312, "global_step": 123067, "epoch": 1482} {"train_loss": -22.716571807861328, "global_step": 123068, "epoch": 1482} {"train_loss": -22.518239974975586, "global_step": 123069, "epoch": 1482} {"train_loss": -22.709413528442383, "global_step": 123070, "epoch": 1482} {"train_loss": -22.536487579345703, "global_step": 123071, "epoch": 1482} {"train_loss": -22.54693031311035, "global_step": 123072, "epoch": 1482} {"train_loss": -22.247434616088867, "global_step": 123073, "epoch": 1482} {"train_loss": -22.863422393798828, "global_step": 123074, "epoch": 1482} {"train_loss": -22.730018615722656, "global_step": 123075, "epoch": 1482} {"train_loss": -22.64124870300293, "global_step": 123076, "epoch": 1482} {"train_loss": -22.838022232055664, "global_step": 123077, "epoch": 1482} {"train_loss": -22.82973289489746, "global_step": 123078, "epoch": 1482} {"train_loss": -22.422504425048828, "global_step": 123079, "epoch": 1482} {"train_loss": -22.478055953979492, "global_step": 123080, "epoch": 1482} {"train_loss": -22.466489791870117, "global_step": 123081, "epoch": 1482} {"train_loss": -22.60696029663086, "global_step": 123082, "epoch": 1482} {"train_loss": -23.0759220123291, "global_step": 123083, "epoch": 1482} {"train_loss": -22.272680282592773, "global_step": 123084, "epoch": 1482} {"train_loss": -22.553592681884766, "global_step": 123085, "epoch": 1482} {"train_loss": -22.843793869018555, "global_step": 123086, "epoch": 1482} {"train_loss": -22.654645919799805, "global_step": 123087, "epoch": 1482} {"train_loss": -22.553957950638, "global_step": 123088, "epoch": 1482, "val_loss": 6298408.0} {"train_loss": -21.925682067871094, "global_step": 123089, "epoch": 1483} {"train_loss": -22.017414093017578, "global_step": 123090, "epoch": 1483} {"train_loss": -22.23370361328125, "global_step": 123091, "epoch": 1483} {"train_loss": -22.600093841552734, "global_step": 123092, "epoch": 1483} {"train_loss": -22.25446891784668, "global_step": 123093, "epoch": 1483} {"train_loss": -22.092641830444336, "global_step": 123094, "epoch": 1483} {"train_loss": -22.517057418823242, "global_step": 123095, "epoch": 1483} {"train_loss": -22.267629623413086, "global_step": 123096, "epoch": 1483} {"train_loss": -21.979949951171875, "global_step": 123097, "epoch": 1483} {"train_loss": -22.70399284362793, "global_step": 123098, "epoch": 1483} {"train_loss": -22.454477310180664, "global_step": 123099, "epoch": 1483} {"train_loss": -22.23642921447754, "global_step": 123100, "epoch": 1483} {"train_loss": -22.7816219329834, "global_step": 123101, "epoch": 1483} {"train_loss": -22.250370025634766, "global_step": 123102, "epoch": 1483} {"train_loss": -22.729196548461914, "global_step": 123103, "epoch": 1483} {"train_loss": -22.593198776245117, "global_step": 123104, "epoch": 1483} {"train_loss": -22.976423263549805, "global_step": 123105, "epoch": 1483} {"train_loss": -22.64763641357422, "global_step": 123106, "epoch": 1483} {"train_loss": -22.669574737548828, "global_step": 123107, "epoch": 1483} {"train_loss": -22.307905197143555, "global_step": 123108, "epoch": 1483} {"train_loss": -22.344453811645508, "global_step": 123109, "epoch": 1483} {"train_loss": -22.553579330444336, "global_step": 123110, "epoch": 1483} {"train_loss": -22.5107421875, "global_step": 123111, "epoch": 1483} {"train_loss": -22.664236068725586, "global_step": 123112, "epoch": 1483} {"train_loss": -22.674985885620117, "global_step": 123113, "epoch": 1483} {"train_loss": -22.90110206604004, "global_step": 123114, "epoch": 1483} {"train_loss": -22.549238204956055, "global_step": 123115, "epoch": 1483} {"train_loss": -22.763925552368164, "global_step": 123116, "epoch": 1483} {"train_loss": -22.561786651611328, "global_step": 123117, "epoch": 1483} {"train_loss": -22.745136260986328, "global_step": 123118, "epoch": 1483} {"train_loss": -22.49195671081543, "global_step": 123119, "epoch": 1483} {"train_loss": -22.762556076049805, "global_step": 123120, "epoch": 1483} {"train_loss": -22.786941528320312, "global_step": 123121, "epoch": 1483} {"train_loss": -22.494436264038086, "global_step": 123122, "epoch": 1483} {"train_loss": -22.99606704711914, "global_step": 123123, "epoch": 1483} {"train_loss": -22.631162643432617, "global_step": 123124, "epoch": 1483} {"train_loss": -22.71038246154785, "global_step": 123125, "epoch": 1483} {"train_loss": -22.49241065979004, "global_step": 123126, "epoch": 1483} {"train_loss": -22.776174545288086, "global_step": 123127, "epoch": 1483} {"train_loss": -22.785202026367188, "global_step": 123128, "epoch": 1483} {"train_loss": -22.751876831054688, "global_step": 123129, "epoch": 1483} {"train_loss": -22.679309844970703, "global_step": 123130, "epoch": 1483} {"train_loss": -23.05813980102539, "global_step": 123131, "epoch": 1483} {"train_loss": -22.545557022094727, "global_step": 123132, "epoch": 1483} {"train_loss": -22.46308708190918, "global_step": 123133, "epoch": 1483} {"train_loss": -22.729921340942383, "global_step": 123134, "epoch": 1483} {"train_loss": -22.467830657958984, "global_step": 123135, "epoch": 1483} {"train_loss": -22.628896713256836, "global_step": 123136, "epoch": 1483} {"train_loss": -23.1452579498291, "global_step": 123137, "epoch": 1483} {"train_loss": -22.445261001586914, "global_step": 123138, "epoch": 1483} {"train_loss": -22.616647720336914, "global_step": 123139, "epoch": 1483} {"train_loss": -22.915008544921875, "global_step": 123140, "epoch": 1483} {"train_loss": -22.65213394165039, "global_step": 123141, "epoch": 1483} {"train_loss": -22.688068389892578, "global_step": 123142, "epoch": 1483} {"train_loss": -22.8076114654541, "global_step": 123143, "epoch": 1483} {"train_loss": -22.730361938476562, "global_step": 123144, "epoch": 1483} {"train_loss": -22.844934463500977, "global_step": 123145, "epoch": 1483} {"train_loss": -22.628225326538086, "global_step": 123146, "epoch": 1483} {"train_loss": -22.903919219970703, "global_step": 123147, "epoch": 1483} {"train_loss": -22.87546157836914, "global_step": 123148, "epoch": 1483} {"train_loss": -22.833112716674805, "global_step": 123149, "epoch": 1483} {"train_loss": -22.968616485595703, "global_step": 123150, "epoch": 1483} {"train_loss": -22.6376953125, "global_step": 123151, "epoch": 1483} {"train_loss": -22.795604705810547, "global_step": 123152, "epoch": 1483} {"train_loss": -22.658626556396484, "global_step": 123153, "epoch": 1483} {"train_loss": -22.36191749572754, "global_step": 123154, "epoch": 1483} {"train_loss": -22.880550384521484, "global_step": 123155, "epoch": 1483} {"train_loss": -22.338186264038086, "global_step": 123156, "epoch": 1483} {"train_loss": -22.375532150268555, "global_step": 123157, "epoch": 1483} {"train_loss": -22.696273803710938, "global_step": 123158, "epoch": 1483} {"train_loss": -22.834959030151367, "global_step": 123159, "epoch": 1483} {"train_loss": -22.423965454101562, "global_step": 123160, "epoch": 1483} {"train_loss": -22.438858032226562, "global_step": 123161, "epoch": 1483} {"train_loss": -22.333324432373047, "global_step": 123162, "epoch": 1483} {"train_loss": -22.511802673339844, "global_step": 123163, "epoch": 1483} {"train_loss": -22.72243309020996, "global_step": 123164, "epoch": 1483} {"train_loss": -22.189380645751953, "global_step": 123165, "epoch": 1483} {"train_loss": -22.66204833984375, "global_step": 123166, "epoch": 1483} {"train_loss": -22.751401901245117, "global_step": 123167, "epoch": 1483} {"train_loss": -22.277446746826172, "global_step": 123168, "epoch": 1483} {"train_loss": -22.542707443237305, "global_step": 123169, "epoch": 1483} {"train_loss": -22.791919708251953, "global_step": 123170, "epoch": 1483} {"train_loss": -22.606275581451783, "global_step": 123171, "epoch": 1483, "val_loss": 6227118.0} {"train_loss": -22.390125274658203, "global_step": 123172, "epoch": 1484} {"train_loss": -22.54831314086914, "global_step": 123173, "epoch": 1484} {"train_loss": -22.4349422454834, "global_step": 123174, "epoch": 1484} {"train_loss": -22.398706436157227, "global_step": 123175, "epoch": 1484} {"train_loss": -22.4038143157959, "global_step": 123176, "epoch": 1484} {"train_loss": -22.45004653930664, "global_step": 123177, "epoch": 1484} {"train_loss": -22.61870765686035, "global_step": 123178, "epoch": 1484} {"train_loss": -22.73890495300293, "global_step": 123179, "epoch": 1484} {"train_loss": -22.096406936645508, "global_step": 123180, "epoch": 1484} {"train_loss": -22.577163696289062, "global_step": 123181, "epoch": 1484} {"train_loss": -22.649049758911133, "global_step": 123182, "epoch": 1484} {"train_loss": -22.765979766845703, "global_step": 123183, "epoch": 1484} {"train_loss": -22.605941772460938, "global_step": 123184, "epoch": 1484} {"train_loss": -22.480031967163086, "global_step": 123185, "epoch": 1484} {"train_loss": -22.617700576782227, "global_step": 123186, "epoch": 1484} {"train_loss": -22.81556510925293, "global_step": 123187, "epoch": 1484} {"train_loss": -23.00693130493164, "global_step": 123188, "epoch": 1484} {"train_loss": -22.738840103149414, "global_step": 123189, "epoch": 1484} {"train_loss": -22.493619918823242, "global_step": 123190, "epoch": 1484} {"train_loss": -22.50375747680664, "global_step": 123191, "epoch": 1484} {"train_loss": -22.690269470214844, "global_step": 123192, "epoch": 1484} {"train_loss": -22.744186401367188, "global_step": 123193, "epoch": 1484} {"train_loss": -22.606307983398438, "global_step": 123194, "epoch": 1484} {"train_loss": -22.65643882751465, "global_step": 123195, "epoch": 1484} {"train_loss": -22.755578994750977, "global_step": 123196, "epoch": 1484} {"train_loss": -22.777042388916016, "global_step": 123197, "epoch": 1484} {"train_loss": -22.545455932617188, "global_step": 123198, "epoch": 1484} {"train_loss": -22.539663314819336, "global_step": 123199, "epoch": 1484} {"train_loss": -22.332111358642578, "global_step": 123200, "epoch": 1484} {"train_loss": -22.907941818237305, "global_step": 123201, "epoch": 1484} {"train_loss": -22.285003662109375, "global_step": 123202, "epoch": 1484} {"train_loss": -22.455307006835938, "global_step": 123203, "epoch": 1484} {"train_loss": -22.807600021362305, "global_step": 123204, "epoch": 1484} {"train_loss": -22.290237426757812, "global_step": 123205, "epoch": 1484} {"train_loss": -22.662015914916992, "global_step": 123206, "epoch": 1484} {"train_loss": -22.37955665588379, "global_step": 123207, "epoch": 1484} {"train_loss": -22.74420166015625, "global_step": 123208, "epoch": 1484} {"train_loss": -22.633695602416992, "global_step": 123209, "epoch": 1484} {"train_loss": -22.76314926147461, "global_step": 123210, "epoch": 1484} {"train_loss": -22.69635581970215, "global_step": 123211, "epoch": 1484} {"train_loss": -22.48404884338379, "global_step": 123212, "epoch": 1484} {"train_loss": -22.608043670654297, "global_step": 123213, "epoch": 1484} {"train_loss": -22.81667137145996, "global_step": 123214, "epoch": 1484} {"train_loss": -22.41031265258789, "global_step": 123215, "epoch": 1484} {"train_loss": -22.319433212280273, "global_step": 123216, "epoch": 1484} {"train_loss": -23.04804039001465, "global_step": 123217, "epoch": 1484} {"train_loss": -22.547086715698242, "global_step": 123218, "epoch": 1484} {"train_loss": -22.6298770904541, "global_step": 123219, "epoch": 1484} {"train_loss": -22.78460693359375, "global_step": 123220, "epoch": 1484} {"train_loss": -22.503984451293945, "global_step": 123221, "epoch": 1484} {"train_loss": -22.617603302001953, "global_step": 123222, "epoch": 1484} {"train_loss": -23.0600643157959, "global_step": 123223, "epoch": 1484} {"train_loss": -22.437620162963867, "global_step": 123224, "epoch": 1484} {"train_loss": -22.488523483276367, "global_step": 123225, "epoch": 1484} {"train_loss": -22.676475524902344, "global_step": 123226, "epoch": 1484} {"train_loss": -22.72269630432129, "global_step": 123227, "epoch": 1484} {"train_loss": -22.725040435791016, "global_step": 123228, "epoch": 1484} {"train_loss": -22.677579879760742, "global_step": 123229, "epoch": 1484} {"train_loss": -22.824487686157227, "global_step": 123230, "epoch": 1484} {"train_loss": -22.49854850769043, "global_step": 123231, "epoch": 1484} {"train_loss": -22.522266387939453, "global_step": 123232, "epoch": 1484} {"train_loss": -22.738046646118164, "global_step": 123233, "epoch": 1484} {"train_loss": -22.82679557800293, "global_step": 123234, "epoch": 1484} {"train_loss": -22.82517433166504, "global_step": 123235, "epoch": 1484} {"train_loss": -22.689313888549805, "global_step": 123236, "epoch": 1484} {"train_loss": -22.68648338317871, "global_step": 123237, "epoch": 1484} {"train_loss": -22.688570022583008, "global_step": 123238, "epoch": 1484} {"train_loss": -22.93052864074707, "global_step": 123239, "epoch": 1484} {"train_loss": -22.518362045288086, "global_step": 123240, "epoch": 1484} {"train_loss": -22.57503318786621, "global_step": 123241, "epoch": 1484} {"train_loss": -22.80975341796875, "global_step": 123242, "epoch": 1484} {"train_loss": -22.592395782470703, "global_step": 123243, "epoch": 1484} {"train_loss": -22.656940460205078, "global_step": 123244, "epoch": 1484} {"train_loss": -22.871885299682617, "global_step": 123245, "epoch": 1484} {"train_loss": -22.86655044555664, "global_step": 123246, "epoch": 1484} {"train_loss": -22.115915298461914, "global_step": 123247, "epoch": 1484} {"train_loss": -22.718027114868164, "global_step": 123248, "epoch": 1484} {"train_loss": -22.60393524169922, "global_step": 123249, "epoch": 1484} {"train_loss": -22.11317253112793, "global_step": 123250, "epoch": 1484} {"train_loss": -22.690420150756836, "global_step": 123251, "epoch": 1484} {"train_loss": -22.753507614135742, "global_step": 123252, "epoch": 1484} {"train_loss": -22.29703712463379, "global_step": 123253, "epoch": 1484} {"train_loss": -22.605275694146215, "global_step": 123254, "epoch": 1484, "val_loss": 6189745.0} {"train_loss": -22.15517234802246, "global_step": 123255, "epoch": 1485} {"train_loss": -21.622501373291016, "global_step": 123256, "epoch": 1485} {"train_loss": -21.859766006469727, "global_step": 123257, "epoch": 1485} {"train_loss": -22.261186599731445, "global_step": 123258, "epoch": 1485} {"train_loss": -21.730566024780273, "global_step": 123259, "epoch": 1485} {"train_loss": -22.000829696655273, "global_step": 123260, "epoch": 1485} {"train_loss": -22.231794357299805, "global_step": 123261, "epoch": 1485} {"train_loss": -22.390525817871094, "global_step": 123262, "epoch": 1485} {"train_loss": -22.731266021728516, "global_step": 123263, "epoch": 1485} {"train_loss": -22.4134464263916, "global_step": 123264, "epoch": 1485} {"train_loss": -22.42886734008789, "global_step": 123265, "epoch": 1485} {"train_loss": -22.226234436035156, "global_step": 123266, "epoch": 1485} {"train_loss": -22.574291229248047, "global_step": 123267, "epoch": 1485} {"train_loss": -22.357593536376953, "global_step": 123268, "epoch": 1485} {"train_loss": -22.2991886138916, "global_step": 123269, "epoch": 1485} {"train_loss": -22.100975036621094, "global_step": 123270, "epoch": 1485} {"train_loss": -22.619070053100586, "global_step": 123271, "epoch": 1485} {"train_loss": -22.631423950195312, "global_step": 123272, "epoch": 1485} {"train_loss": -22.519174575805664, "global_step": 123273, "epoch": 1485} {"train_loss": -22.683530807495117, "global_step": 123274, "epoch": 1485} {"train_loss": -22.517593383789062, "global_step": 123275, "epoch": 1485} {"train_loss": -22.78947639465332, "global_step": 123276, "epoch": 1485} {"train_loss": -22.286367416381836, "global_step": 123277, "epoch": 1485} {"train_loss": -22.446577072143555, "global_step": 123278, "epoch": 1485} {"train_loss": -22.546125411987305, "global_step": 123279, "epoch": 1485} {"train_loss": -22.795303344726562, "global_step": 123280, "epoch": 1485} {"train_loss": -22.48257827758789, "global_step": 123281, "epoch": 1485} {"train_loss": -22.811918258666992, "global_step": 123282, "epoch": 1485} {"train_loss": -22.549911499023438, "global_step": 123283, "epoch": 1485} {"train_loss": -22.738550186157227, "global_step": 123284, "epoch": 1485} {"train_loss": -22.90741539001465, "global_step": 123285, "epoch": 1485} {"train_loss": -22.66056251525879, "global_step": 123286, "epoch": 1485} {"train_loss": -22.601322174072266, "global_step": 123287, "epoch": 1485} {"train_loss": -22.731719970703125, "global_step": 123288, "epoch": 1485} {"train_loss": -22.905349731445312, "global_step": 123289, "epoch": 1485} {"train_loss": -22.682653427124023, "global_step": 123290, "epoch": 1485} {"train_loss": -22.92555809020996, "global_step": 123291, "epoch": 1485} {"train_loss": -22.36726951599121, "global_step": 123292, "epoch": 1485} {"train_loss": -23.06011199951172, "global_step": 123293, "epoch": 1485} {"train_loss": -22.97849464416504, "global_step": 123294, "epoch": 1485} {"train_loss": -22.692291259765625, "global_step": 123295, "epoch": 1485} {"train_loss": -22.80592918395996, "global_step": 123296, "epoch": 1485} {"train_loss": -22.48906898498535, "global_step": 123297, "epoch": 1485} {"train_loss": -22.585371017456055, "global_step": 123298, "epoch": 1485} {"train_loss": -22.686643600463867, "global_step": 123299, "epoch": 1485} {"train_loss": -22.87922477722168, "global_step": 123300, "epoch": 1485} {"train_loss": -22.726016998291016, "global_step": 123301, "epoch": 1485} {"train_loss": -22.674869537353516, "global_step": 123302, "epoch": 1485} {"train_loss": -22.246328353881836, "global_step": 123303, "epoch": 1485} {"train_loss": -22.603673934936523, "global_step": 123304, "epoch": 1485} {"train_loss": -22.91576385498047, "global_step": 123305, "epoch": 1485} {"train_loss": -22.38433265686035, "global_step": 123306, "epoch": 1485} {"train_loss": -22.610183715820312, "global_step": 123307, "epoch": 1485} {"train_loss": -22.495519638061523, "global_step": 123308, "epoch": 1485} {"train_loss": -22.64697265625, "global_step": 123309, "epoch": 1485} {"train_loss": -22.70084571838379, "global_step": 123310, "epoch": 1485} {"train_loss": -23.133493423461914, "global_step": 123311, "epoch": 1485} {"train_loss": -22.441625595092773, "global_step": 123312, "epoch": 1485} {"train_loss": -22.790884017944336, "global_step": 123313, "epoch": 1485} {"train_loss": -22.34823989868164, "global_step": 123314, "epoch": 1485} {"train_loss": -22.186613082885742, "global_step": 123315, "epoch": 1485} {"train_loss": -22.482641220092773, "global_step": 123316, "epoch": 1485} {"train_loss": -22.532794952392578, "global_step": 123317, "epoch": 1485} {"train_loss": -22.503646850585938, "global_step": 123318, "epoch": 1485} {"train_loss": -22.330110549926758, "global_step": 123319, "epoch": 1485} {"train_loss": -22.39607810974121, "global_step": 123320, "epoch": 1485} {"train_loss": -22.58791160583496, "global_step": 123321, "epoch": 1485} {"train_loss": -22.25389289855957, "global_step": 123322, "epoch": 1485} {"train_loss": -22.594228744506836, "global_step": 123323, "epoch": 1485} {"train_loss": -22.57400894165039, "global_step": 123324, "epoch": 1485} {"train_loss": -22.57633399963379, "global_step": 123325, "epoch": 1485} {"train_loss": -22.30097770690918, "global_step": 123326, "epoch": 1485} {"train_loss": -22.582834243774414, "global_step": 123327, "epoch": 1485} {"train_loss": -22.33331871032715, "global_step": 123328, "epoch": 1485} {"train_loss": -22.83959197998047, "global_step": 123329, "epoch": 1485} {"train_loss": -23.094999313354492, "global_step": 123330, "epoch": 1485} {"train_loss": -22.649141311645508, "global_step": 123331, "epoch": 1485} {"train_loss": -22.669151306152344, "global_step": 123332, "epoch": 1485} {"train_loss": -22.609846115112305, "global_step": 123333, "epoch": 1485} {"train_loss": -22.28675651550293, "global_step": 123334, "epoch": 1485} {"train_loss": -22.500015258789062, "global_step": 123335, "epoch": 1485} {"train_loss": -22.92763328552246, "global_step": 123336, "epoch": 1485} {"train_loss": -22.535055712044958, "global_step": 123337, "epoch": 1485, "val_loss": 6172722.0} {"train_loss": -22.518964767456055, "global_step": 123338, "epoch": 1486} {"train_loss": -22.400320053100586, "global_step": 123339, "epoch": 1486} {"train_loss": -22.337963104248047, "global_step": 123340, "epoch": 1486} {"train_loss": -22.4188232421875, "global_step": 123341, "epoch": 1486} {"train_loss": -22.34520721435547, "global_step": 123342, "epoch": 1486} {"train_loss": -22.307554244995117, "global_step": 123343, "epoch": 1486} {"train_loss": -22.598169326782227, "global_step": 123344, "epoch": 1486} {"train_loss": -22.3829345703125, "global_step": 123345, "epoch": 1486} {"train_loss": -22.428821563720703, "global_step": 123346, "epoch": 1486} {"train_loss": -22.091341018676758, "global_step": 123347, "epoch": 1486} {"train_loss": -22.388286590576172, "global_step": 123348, "epoch": 1486} {"train_loss": -22.376338958740234, "global_step": 123349, "epoch": 1486} {"train_loss": -22.529233932495117, "global_step": 123350, "epoch": 1486} {"train_loss": -23.04976463317871, "global_step": 123351, "epoch": 1486} {"train_loss": -22.312240600585938, "global_step": 123352, "epoch": 1486} {"train_loss": -22.50506591796875, "global_step": 123353, "epoch": 1486} {"train_loss": -22.474645614624023, "global_step": 123354, "epoch": 1486} {"train_loss": -22.801782608032227, "global_step": 123355, "epoch": 1486} {"train_loss": -22.67426872253418, "global_step": 123356, "epoch": 1486} {"train_loss": -22.807191848754883, "global_step": 123357, "epoch": 1486} {"train_loss": -22.69270896911621, "global_step": 123358, "epoch": 1486} {"train_loss": -22.667814254760742, "global_step": 123359, "epoch": 1486} {"train_loss": -22.480154037475586, "global_step": 123360, "epoch": 1486} {"train_loss": -22.373498916625977, "global_step": 123361, "epoch": 1486} {"train_loss": -22.589262008666992, "global_step": 123362, "epoch": 1486} {"train_loss": -22.33920669555664, "global_step": 123363, "epoch": 1486} {"train_loss": -22.584096908569336, "global_step": 123364, "epoch": 1486} {"train_loss": -22.45073127746582, "global_step": 123365, "epoch": 1486} {"train_loss": -22.771223068237305, "global_step": 123366, "epoch": 1486} {"train_loss": -22.46213150024414, "global_step": 123367, "epoch": 1486} {"train_loss": -22.259963989257812, "global_step": 123368, "epoch": 1486} {"train_loss": -22.576025009155273, "global_step": 123369, "epoch": 1486} {"train_loss": -22.580781936645508, "global_step": 123370, "epoch": 1486} {"train_loss": -22.789539337158203, "global_step": 123371, "epoch": 1486} {"train_loss": -22.86604881286621, "global_step": 123372, "epoch": 1486} {"train_loss": -22.892059326171875, "global_step": 123373, "epoch": 1486} {"train_loss": -22.328479766845703, "global_step": 123374, "epoch": 1486} {"train_loss": -22.458898544311523, "global_step": 123375, "epoch": 1486} {"train_loss": -22.440805435180664, "global_step": 123376, "epoch": 1486} {"train_loss": -22.89042091369629, "global_step": 123377, "epoch": 1486} {"train_loss": -22.60580825805664, "global_step": 123378, "epoch": 1486} {"train_loss": -21.951690673828125, "global_step": 123379, "epoch": 1486} {"train_loss": -22.613784790039062, "global_step": 123380, "epoch": 1486} {"train_loss": -22.48322105407715, "global_step": 123381, "epoch": 1486} {"train_loss": -22.568389892578125, "global_step": 123382, "epoch": 1486} {"train_loss": -23.188068389892578, "global_step": 123383, "epoch": 1486} {"train_loss": -22.497272491455078, "global_step": 123384, "epoch": 1486} {"train_loss": -22.589948654174805, "global_step": 123385, "epoch": 1486} {"train_loss": -22.527616500854492, "global_step": 123386, "epoch": 1486} {"train_loss": -22.7003231048584, "global_step": 123387, "epoch": 1486} {"train_loss": -22.76283073425293, "global_step": 123388, "epoch": 1486} {"train_loss": -22.680557250976562, "global_step": 123389, "epoch": 1486} {"train_loss": -22.45305633544922, "global_step": 123390, "epoch": 1486} {"train_loss": -22.944747924804688, "global_step": 123391, "epoch": 1486} {"train_loss": -22.967872619628906, "global_step": 123392, "epoch": 1486} {"train_loss": -22.561613082885742, "global_step": 123393, "epoch": 1486} {"train_loss": -22.820104598999023, "global_step": 123394, "epoch": 1486} {"train_loss": -22.407461166381836, "global_step": 123395, "epoch": 1486} {"train_loss": -22.81558609008789, "global_step": 123396, "epoch": 1486} {"train_loss": -22.907941818237305, "global_step": 123397, "epoch": 1486} {"train_loss": -22.376752853393555, "global_step": 123398, "epoch": 1486} {"train_loss": -22.97559928894043, "global_step": 123399, "epoch": 1486} {"train_loss": -22.62656021118164, "global_step": 123400, "epoch": 1486} {"train_loss": -22.610387802124023, "global_step": 123401, "epoch": 1486} {"train_loss": -22.84869384765625, "global_step": 123402, "epoch": 1486} {"train_loss": -23.07704734802246, "global_step": 123403, "epoch": 1486} {"train_loss": -23.022796630859375, "global_step": 123404, "epoch": 1486} {"train_loss": -22.557161331176758, "global_step": 123405, "epoch": 1486} {"train_loss": -22.539270401000977, "global_step": 123406, "epoch": 1486} {"train_loss": -23.154996871948242, "global_step": 123407, "epoch": 1486} {"train_loss": -22.567523956298828, "global_step": 123408, "epoch": 1486} {"train_loss": -22.58676528930664, "global_step": 123409, "epoch": 1486} {"train_loss": -22.696678161621094, "global_step": 123410, "epoch": 1486} {"train_loss": -22.583688735961914, "global_step": 123411, "epoch": 1486} {"train_loss": -22.911788940429688, "global_step": 123412, "epoch": 1486} {"train_loss": -22.181787490844727, "global_step": 123413, "epoch": 1486} {"train_loss": -22.52880859375, "global_step": 123414, "epoch": 1486} {"train_loss": -22.535648345947266, "global_step": 123415, "epoch": 1486} {"train_loss": -22.656665802001953, "global_step": 123416, "epoch": 1486} {"train_loss": -22.695011138916016, "global_step": 123417, "epoch": 1486} {"train_loss": -22.410842895507812, "global_step": 123418, "epoch": 1486} {"train_loss": -22.63787841796875, "global_step": 123419, "epoch": 1486} {"train_loss": -22.590270168810004, "global_step": 123420, "epoch": 1486, "val_loss": 6242940.5} {"train_loss": -22.784591674804688, "global_step": 123421, "epoch": 1487} {"train_loss": -22.94062614440918, "global_step": 123422, "epoch": 1487} {"train_loss": -22.408578872680664, "global_step": 123423, "epoch": 1487} {"train_loss": -22.470413208007812, "global_step": 123424, "epoch": 1487} {"train_loss": -22.772472381591797, "global_step": 123425, "epoch": 1487} {"train_loss": -22.36134910583496, "global_step": 123426, "epoch": 1487} {"train_loss": -22.70664405822754, "global_step": 123427, "epoch": 1487} {"train_loss": -22.38572120666504, "global_step": 123428, "epoch": 1487} {"train_loss": -22.417184829711914, "global_step": 123429, "epoch": 1487} {"train_loss": -22.653820037841797, "global_step": 123430, "epoch": 1487} {"train_loss": -22.578054428100586, "global_step": 123431, "epoch": 1487} {"train_loss": -22.26011085510254, "global_step": 123432, "epoch": 1487} {"train_loss": -22.43819808959961, "global_step": 123433, "epoch": 1487} {"train_loss": -22.638641357421875, "global_step": 123434, "epoch": 1487} {"train_loss": -22.641080856323242, "global_step": 123435, "epoch": 1487} {"train_loss": -22.17874526977539, "global_step": 123436, "epoch": 1487} {"train_loss": -22.476781845092773, "global_step": 123437, "epoch": 1487} {"train_loss": -22.663646697998047, "global_step": 123438, "epoch": 1487} {"train_loss": -22.594511032104492, "global_step": 123439, "epoch": 1487} {"train_loss": -22.4448184967041, "global_step": 123440, "epoch": 1487} {"train_loss": -22.247373580932617, "global_step": 123441, "epoch": 1487} {"train_loss": -22.5268611907959, "global_step": 123442, "epoch": 1487} {"train_loss": -22.370162963867188, "global_step": 123443, "epoch": 1487} {"train_loss": -22.608301162719727, "global_step": 123444, "epoch": 1487} {"train_loss": -22.70646858215332, "global_step": 123445, "epoch": 1487} {"train_loss": -22.36517333984375, "global_step": 123446, "epoch": 1487} {"train_loss": -22.74512481689453, "global_step": 123447, "epoch": 1487} {"train_loss": -22.628637313842773, "global_step": 123448, "epoch": 1487} {"train_loss": -22.745038986206055, "global_step": 123449, "epoch": 1487} {"train_loss": -22.48025894165039, "global_step": 123450, "epoch": 1487} {"train_loss": -23.06972312927246, "global_step": 123451, "epoch": 1487} {"train_loss": -22.722402572631836, "global_step": 123452, "epoch": 1487} {"train_loss": -23.1407470703125, "global_step": 123453, "epoch": 1487} {"train_loss": -22.90342140197754, "global_step": 123454, "epoch": 1487} {"train_loss": -22.784351348876953, "global_step": 123455, "epoch": 1487} {"train_loss": -22.806913375854492, "global_step": 123456, "epoch": 1487} {"train_loss": -22.362850189208984, "global_step": 123457, "epoch": 1487} {"train_loss": -22.497602462768555, "global_step": 123458, "epoch": 1487} {"train_loss": -22.73630714416504, "global_step": 123459, "epoch": 1487} {"train_loss": -22.605609893798828, "global_step": 123460, "epoch": 1487} {"train_loss": -22.920272827148438, "global_step": 123461, "epoch": 1487} {"train_loss": -22.650426864624023, "global_step": 123462, "epoch": 1487} {"train_loss": -22.808862686157227, "global_step": 123463, "epoch": 1487} {"train_loss": -22.447614669799805, "global_step": 123464, "epoch": 1487} {"train_loss": -22.60209846496582, "global_step": 123465, "epoch": 1487} {"train_loss": -22.821916580200195, "global_step": 123466, "epoch": 1487} {"train_loss": -22.645139694213867, "global_step": 123467, "epoch": 1487} {"train_loss": -22.69525146484375, "global_step": 123468, "epoch": 1487} {"train_loss": -22.202865600585938, "global_step": 123469, "epoch": 1487} {"train_loss": -22.812883377075195, "global_step": 123470, "epoch": 1487} {"train_loss": -22.75269889831543, "global_step": 123471, "epoch": 1487} {"train_loss": -22.6917667388916, "global_step": 123472, "epoch": 1487} {"train_loss": -22.518056869506836, "global_step": 123473, "epoch": 1487} {"train_loss": -22.688312530517578, "global_step": 123474, "epoch": 1487} {"train_loss": -22.271137237548828, "global_step": 123475, "epoch": 1487} {"train_loss": -22.437381744384766, "global_step": 123476, "epoch": 1487} {"train_loss": -22.441450119018555, "global_step": 123477, "epoch": 1487} {"train_loss": -22.46369171142578, "global_step": 123478, "epoch": 1487} {"train_loss": -22.548810958862305, "global_step": 123479, "epoch": 1487} {"train_loss": -22.509992599487305, "global_step": 123480, "epoch": 1487} {"train_loss": -22.577823638916016, "global_step": 123481, "epoch": 1487} {"train_loss": -22.452613830566406, "global_step": 123482, "epoch": 1487} {"train_loss": -22.825963973999023, "global_step": 123483, "epoch": 1487} {"train_loss": -22.586896896362305, "global_step": 123484, "epoch": 1487} {"train_loss": -22.65047264099121, "global_step": 123485, "epoch": 1487} {"train_loss": -22.99591636657715, "global_step": 123486, "epoch": 1487} {"train_loss": -22.761550903320312, "global_step": 123487, "epoch": 1487} {"train_loss": -22.654951095581055, "global_step": 123488, "epoch": 1487} {"train_loss": -22.754056930541992, "global_step": 123489, "epoch": 1487} {"train_loss": -22.627012252807617, "global_step": 123490, "epoch": 1487} {"train_loss": -22.79292106628418, "global_step": 123491, "epoch": 1487} {"train_loss": -22.72161865234375, "global_step": 123492, "epoch": 1487} {"train_loss": -22.16033363342285, "global_step": 123493, "epoch": 1487} {"train_loss": -22.58514976501465, "global_step": 123494, "epoch": 1487} {"train_loss": -22.857131958007812, "global_step": 123495, "epoch": 1487} {"train_loss": -22.700241088867188, "global_step": 123496, "epoch": 1487} {"train_loss": -22.07464027404785, "global_step": 123497, "epoch": 1487} {"train_loss": -22.18471336364746, "global_step": 123498, "epoch": 1487} {"train_loss": -22.78971290588379, "global_step": 123499, "epoch": 1487} {"train_loss": -22.431201934814453, "global_step": 123500, "epoch": 1487} {"train_loss": -21.855859756469727, "global_step": 123501, "epoch": 1487} {"train_loss": -22.449045181274414, "global_step": 123502, "epoch": 1487} {"train_loss": -22.596546908459032, "global_step": 123503, "epoch": 1487, "val_loss": 6219572.0} {"train_loss": -22.455427169799805, "global_step": 123504, "epoch": 1488} {"train_loss": -22.176698684692383, "global_step": 123505, "epoch": 1488} {"train_loss": -22.26766586303711, "global_step": 123506, "epoch": 1488} {"train_loss": -22.191747665405273, "global_step": 123507, "epoch": 1488} {"train_loss": -22.34849739074707, "global_step": 123508, "epoch": 1488} {"train_loss": -22.080896377563477, "global_step": 123509, "epoch": 1488} {"train_loss": -22.54404640197754, "global_step": 123510, "epoch": 1488} {"train_loss": -22.208450317382812, "global_step": 123511, "epoch": 1488} {"train_loss": -22.42026138305664, "global_step": 123512, "epoch": 1488} {"train_loss": -22.272024154663086, "global_step": 123513, "epoch": 1488} {"train_loss": -22.252769470214844, "global_step": 123514, "epoch": 1488} {"train_loss": -22.35212516784668, "global_step": 123515, "epoch": 1488} {"train_loss": -22.13888931274414, "global_step": 123516, "epoch": 1488} {"train_loss": -22.444107055664062, "global_step": 123517, "epoch": 1488} {"train_loss": -22.102807998657227, "global_step": 123518, "epoch": 1488} {"train_loss": -22.698638916015625, "global_step": 123519, "epoch": 1488} {"train_loss": -22.445098876953125, "global_step": 123520, "epoch": 1488} {"train_loss": -22.63252067565918, "global_step": 123521, "epoch": 1488} {"train_loss": -22.44202995300293, "global_step": 123522, "epoch": 1488} {"train_loss": -22.84817886352539, "global_step": 123523, "epoch": 1488} {"train_loss": -22.480072021484375, "global_step": 123524, "epoch": 1488} {"train_loss": -22.520648956298828, "global_step": 123525, "epoch": 1488} {"train_loss": -22.52493667602539, "global_step": 123526, "epoch": 1488} {"train_loss": -22.23131561279297, "global_step": 123527, "epoch": 1488} {"train_loss": -22.91871452331543, "global_step": 123528, "epoch": 1488} {"train_loss": -22.757904052734375, "global_step": 123529, "epoch": 1488} {"train_loss": -22.828100204467773, "global_step": 123530, "epoch": 1488} {"train_loss": -22.64181900024414, "global_step": 123531, "epoch": 1488} {"train_loss": -22.53299903869629, "global_step": 123532, "epoch": 1488} {"train_loss": -22.45528793334961, "global_step": 123533, "epoch": 1488} {"train_loss": -22.487363815307617, "global_step": 123534, "epoch": 1488} {"train_loss": -22.62325096130371, "global_step": 123535, "epoch": 1488} {"train_loss": -22.687606811523438, "global_step": 123536, "epoch": 1488} {"train_loss": -22.681825637817383, "global_step": 123537, "epoch": 1488} {"train_loss": -22.604145050048828, "global_step": 123538, "epoch": 1488} {"train_loss": -22.947158813476562, "global_step": 123539, "epoch": 1488} {"train_loss": -22.788681030273438, "global_step": 123540, "epoch": 1488} {"train_loss": -22.690778732299805, "global_step": 123541, "epoch": 1488} {"train_loss": -22.708511352539062, "global_step": 123542, "epoch": 1488} {"train_loss": -22.78205680847168, "global_step": 123543, "epoch": 1488} {"train_loss": -22.66823387145996, "global_step": 123544, "epoch": 1488} {"train_loss": -22.31835174560547, "global_step": 123545, "epoch": 1488} {"train_loss": -22.63245964050293, "global_step": 123546, "epoch": 1488} {"train_loss": -22.50558853149414, "global_step": 123547, "epoch": 1488} {"train_loss": -22.303081512451172, "global_step": 123548, "epoch": 1488} {"train_loss": -22.189435958862305, "global_step": 123549, "epoch": 1488} {"train_loss": -21.7947940826416, "global_step": 123550, "epoch": 1488} {"train_loss": -22.631742477416992, "global_step": 123551, "epoch": 1488} {"train_loss": -22.35715675354004, "global_step": 123552, "epoch": 1488} {"train_loss": -22.39676856994629, "global_step": 123553, "epoch": 1488} {"train_loss": -22.475772857666016, "global_step": 123554, "epoch": 1488} {"train_loss": -22.711761474609375, "global_step": 123555, "epoch": 1488} {"train_loss": -22.766958236694336, "global_step": 123556, "epoch": 1488} {"train_loss": -22.243722915649414, "global_step": 123557, "epoch": 1488} {"train_loss": -22.695493698120117, "global_step": 123558, "epoch": 1488} {"train_loss": -22.55943489074707, "global_step": 123559, "epoch": 1488} {"train_loss": -22.551130294799805, "global_step": 123560, "epoch": 1488} {"train_loss": -22.790769577026367, "global_step": 123561, "epoch": 1488} {"train_loss": -22.434772491455078, "global_step": 123562, "epoch": 1488} {"train_loss": -22.708234786987305, "global_step": 123563, "epoch": 1488} {"train_loss": -22.164215087890625, "global_step": 123564, "epoch": 1488} {"train_loss": -22.613248825073242, "global_step": 123565, "epoch": 1488} {"train_loss": -22.550827026367188, "global_step": 123566, "epoch": 1488} {"train_loss": -22.628875732421875, "global_step": 123567, "epoch": 1488} {"train_loss": -22.818222045898438, "global_step": 123568, "epoch": 1488} {"train_loss": -22.685365676879883, "global_step": 123569, "epoch": 1488} {"train_loss": -22.53986930847168, "global_step": 123570, "epoch": 1488} {"train_loss": -22.81341552734375, "global_step": 123571, "epoch": 1488} {"train_loss": -23.10409927368164, "global_step": 123572, "epoch": 1488} {"train_loss": -22.570066452026367, "global_step": 123573, "epoch": 1488} {"train_loss": -22.709497451782227, "global_step": 123574, "epoch": 1488} {"train_loss": -22.89679527282715, "global_step": 123575, "epoch": 1488} {"train_loss": -22.5213565826416, "global_step": 123576, "epoch": 1488} {"train_loss": -22.610198974609375, "global_step": 123577, "epoch": 1488} {"train_loss": -22.884929656982422, "global_step": 123578, "epoch": 1488} {"train_loss": -22.638010025024414, "global_step": 123579, "epoch": 1488} {"train_loss": -22.695844650268555, "global_step": 123580, "epoch": 1488} {"train_loss": -22.909833908081055, "global_step": 123581, "epoch": 1488} {"train_loss": -22.40899658203125, "global_step": 123582, "epoch": 1488} {"train_loss": -22.77643394470215, "global_step": 123583, "epoch": 1488} {"train_loss": -23.04026222229004, "global_step": 123584, "epoch": 1488} {"train_loss": -22.9027099609375, "global_step": 123585, "epoch": 1488} {"train_loss": -22.57547279725592, "global_step": 123586, "epoch": 1488, "val_loss": 6197476.5} {"train_loss": -22.23335075378418, "global_step": 123587, "epoch": 1489} {"train_loss": -21.922069549560547, "global_step": 123588, "epoch": 1489} {"train_loss": -21.7506046295166, "global_step": 123589, "epoch": 1489} {"train_loss": -22.759374618530273, "global_step": 123590, "epoch": 1489} {"train_loss": -22.458576202392578, "global_step": 123591, "epoch": 1489} {"train_loss": -22.214614868164062, "global_step": 123592, "epoch": 1489} {"train_loss": -22.411211013793945, "global_step": 123593, "epoch": 1489} {"train_loss": -22.80401611328125, "global_step": 123594, "epoch": 1489} {"train_loss": -21.846942901611328, "global_step": 123595, "epoch": 1489} {"train_loss": -22.38619041442871, "global_step": 123596, "epoch": 1489} {"train_loss": -22.477319717407227, "global_step": 123597, "epoch": 1489} {"train_loss": -21.976905822753906, "global_step": 123598, "epoch": 1489} {"train_loss": -22.352819442749023, "global_step": 123599, "epoch": 1489} {"train_loss": -22.34881591796875, "global_step": 123600, "epoch": 1489} {"train_loss": -22.127809524536133, "global_step": 123601, "epoch": 1489} {"train_loss": -22.911184310913086, "global_step": 123602, "epoch": 1489} {"train_loss": -22.58980369567871, "global_step": 123603, "epoch": 1489} {"train_loss": -22.303510665893555, "global_step": 123604, "epoch": 1489} {"train_loss": -22.4841251373291, "global_step": 123605, "epoch": 1489} {"train_loss": -22.33173179626465, "global_step": 123606, "epoch": 1489} {"train_loss": -22.12588882446289, "global_step": 123607, "epoch": 1489} {"train_loss": -22.483287811279297, "global_step": 123608, "epoch": 1489} {"train_loss": -22.444150924682617, "global_step": 123609, "epoch": 1489} {"train_loss": -22.496042251586914, "global_step": 123610, "epoch": 1489} {"train_loss": -22.675861358642578, "global_step": 123611, "epoch": 1489} {"train_loss": -22.53565788269043, "global_step": 123612, "epoch": 1489} {"train_loss": -22.453447341918945, "global_step": 123613, "epoch": 1489} {"train_loss": -22.381956100463867, "global_step": 123614, "epoch": 1489} {"train_loss": -22.210927963256836, "global_step": 123615, "epoch": 1489} {"train_loss": -22.678176879882812, "global_step": 123616, "epoch": 1489} {"train_loss": -22.695209503173828, "global_step": 123617, "epoch": 1489} {"train_loss": -22.528493881225586, "global_step": 123618, "epoch": 1489} {"train_loss": -22.6434383392334, "global_step": 123619, "epoch": 1489} {"train_loss": -22.644445419311523, "global_step": 123620, "epoch": 1489} {"train_loss": -22.420753479003906, "global_step": 123621, "epoch": 1489} {"train_loss": -22.847383499145508, "global_step": 123622, "epoch": 1489} {"train_loss": -22.618717193603516, "global_step": 123623, "epoch": 1489} {"train_loss": -22.732986450195312, "global_step": 123624, "epoch": 1489} {"train_loss": -22.48459815979004, "global_step": 123625, "epoch": 1489} {"train_loss": -22.380475997924805, "global_step": 123626, "epoch": 1489} {"train_loss": -22.731836318969727, "global_step": 123627, "epoch": 1489} {"train_loss": -22.768598556518555, "global_step": 123628, "epoch": 1489} {"train_loss": -22.62523651123047, "global_step": 123629, "epoch": 1489} {"train_loss": -22.830188751220703, "global_step": 123630, "epoch": 1489} {"train_loss": -22.996397018432617, "global_step": 123631, "epoch": 1489} {"train_loss": -22.53850555419922, "global_step": 123632, "epoch": 1489} {"train_loss": -22.567127227783203, "global_step": 123633, "epoch": 1489} {"train_loss": -22.743274688720703, "global_step": 123634, "epoch": 1489} {"train_loss": -22.699649810791016, "global_step": 123635, "epoch": 1489} {"train_loss": -22.014692306518555, "global_step": 123636, "epoch": 1489} {"train_loss": -22.591516494750977, "global_step": 123637, "epoch": 1489} {"train_loss": -22.394742965698242, "global_step": 123638, "epoch": 1489} {"train_loss": -22.656143188476562, "global_step": 123639, "epoch": 1489} {"train_loss": -22.765073776245117, "global_step": 123640, "epoch": 1489} {"train_loss": -22.315471649169922, "global_step": 123641, "epoch": 1489} {"train_loss": -22.44887351989746, "global_step": 123642, "epoch": 1489} {"train_loss": -22.536605834960938, "global_step": 123643, "epoch": 1489} {"train_loss": -22.654504776000977, "global_step": 123644, "epoch": 1489} {"train_loss": -22.61345100402832, "global_step": 123645, "epoch": 1489} {"train_loss": -22.59528160095215, "global_step": 123646, "epoch": 1489} {"train_loss": -22.616458892822266, "global_step": 123647, "epoch": 1489} {"train_loss": -22.71068572998047, "global_step": 123648, "epoch": 1489} {"train_loss": -22.314441680908203, "global_step": 123649, "epoch": 1489} {"train_loss": -22.831172943115234, "global_step": 123650, "epoch": 1489} {"train_loss": -22.65511131286621, "global_step": 123651, "epoch": 1489} {"train_loss": -22.81178092956543, "global_step": 123652, "epoch": 1489} {"train_loss": -22.618057250976562, "global_step": 123653, "epoch": 1489} {"train_loss": -22.690933227539062, "global_step": 123654, "epoch": 1489} {"train_loss": -23.02329444885254, "global_step": 123655, "epoch": 1489} {"train_loss": -22.816116333007812, "global_step": 123656, "epoch": 1489} {"train_loss": -22.447729110717773, "global_step": 123657, "epoch": 1489} {"train_loss": -23.016754150390625, "global_step": 123658, "epoch": 1489} {"train_loss": -22.778528213500977, "global_step": 123659, "epoch": 1489} {"train_loss": -22.581220626831055, "global_step": 123660, "epoch": 1489} {"train_loss": -22.70334243774414, "global_step": 123661, "epoch": 1489} {"train_loss": -22.759092330932617, "global_step": 123662, "epoch": 1489} {"train_loss": -22.419570922851562, "global_step": 123663, "epoch": 1489} {"train_loss": -22.549551010131836, "global_step": 123664, "epoch": 1489} {"train_loss": -22.823522567749023, "global_step": 123665, "epoch": 1489} {"train_loss": -22.61433219909668, "global_step": 123666, "epoch": 1489} {"train_loss": -22.530071258544922, "global_step": 123667, "epoch": 1489} {"train_loss": -22.78891372680664, "global_step": 123668, "epoch": 1489} {"train_loss": -22.543672653565924, "global_step": 123669, "epoch": 1489, "val_loss": 6187919.5} {"train_loss": -22.702848434448242, "global_step": 123670, "epoch": 1490} {"train_loss": -22.37852668762207, "global_step": 123671, "epoch": 1490} {"train_loss": -22.01237678527832, "global_step": 123672, "epoch": 1490} {"train_loss": -22.546117782592773, "global_step": 123673, "epoch": 1490} {"train_loss": -22.50972557067871, "global_step": 123674, "epoch": 1490} {"train_loss": -22.60009765625, "global_step": 123675, "epoch": 1490} {"train_loss": -22.40113639831543, "global_step": 123676, "epoch": 1490} {"train_loss": -22.692626953125, "global_step": 123677, "epoch": 1490} {"train_loss": -22.508623123168945, "global_step": 123678, "epoch": 1490} {"train_loss": -22.429855346679688, "global_step": 123679, "epoch": 1490} {"train_loss": -22.6812801361084, "global_step": 123680, "epoch": 1490} {"train_loss": -22.228540420532227, "global_step": 123681, "epoch": 1490} {"train_loss": -22.53494644165039, "global_step": 123682, "epoch": 1490} {"train_loss": -23.07444190979004, "global_step": 123683, "epoch": 1490} {"train_loss": -22.548818588256836, "global_step": 123684, "epoch": 1490} {"train_loss": -23.000165939331055, "global_step": 123685, "epoch": 1490} {"train_loss": -22.42130470275879, "global_step": 123686, "epoch": 1490} {"train_loss": -22.034528732299805, "global_step": 123687, "epoch": 1490} {"train_loss": -22.63113021850586, "global_step": 123688, "epoch": 1490} {"train_loss": -22.825958251953125, "global_step": 123689, "epoch": 1490} {"train_loss": -22.856922149658203, "global_step": 123690, "epoch": 1490} {"train_loss": -22.64756965637207, "global_step": 123691, "epoch": 1490} {"train_loss": -22.651811599731445, "global_step": 123692, "epoch": 1490} {"train_loss": -22.409469604492188, "global_step": 123693, "epoch": 1490} {"train_loss": -22.493595123291016, "global_step": 123694, "epoch": 1490} {"train_loss": -22.97706413269043, "global_step": 123695, "epoch": 1490} {"train_loss": -22.729406356811523, "global_step": 123696, "epoch": 1490} {"train_loss": -22.478931427001953, "global_step": 123697, "epoch": 1490} {"train_loss": -22.657936096191406, "global_step": 123698, "epoch": 1490} {"train_loss": -22.565887451171875, "global_step": 123699, "epoch": 1490} {"train_loss": -22.95367431640625, "global_step": 123700, "epoch": 1490} {"train_loss": -22.473600387573242, "global_step": 123701, "epoch": 1490} {"train_loss": -22.4422664642334, "global_step": 123702, "epoch": 1490} {"train_loss": -22.3614501953125, "global_step": 123703, "epoch": 1490} {"train_loss": -22.667348861694336, "global_step": 123704, "epoch": 1490} {"train_loss": -22.56111717224121, "global_step": 123705, "epoch": 1490} {"train_loss": -22.426666259765625, "global_step": 123706, "epoch": 1490} {"train_loss": -22.4014949798584, "global_step": 123707, "epoch": 1490} {"train_loss": -22.708242416381836, "global_step": 123708, "epoch": 1490} {"train_loss": -22.429729461669922, "global_step": 123709, "epoch": 1490} {"train_loss": -22.458444595336914, "global_step": 123710, "epoch": 1490} {"train_loss": -22.4486083984375, "global_step": 123711, "epoch": 1490} {"train_loss": -22.549711227416992, "global_step": 123712, "epoch": 1490} {"train_loss": -22.68548011779785, "global_step": 123713, "epoch": 1490} {"train_loss": -22.631845474243164, "global_step": 123714, "epoch": 1490} {"train_loss": -22.26384925842285, "global_step": 123715, "epoch": 1490} {"train_loss": -22.737722396850586, "global_step": 123716, "epoch": 1490} {"train_loss": -22.478322982788086, "global_step": 123717, "epoch": 1490} {"train_loss": -22.404218673706055, "global_step": 123718, "epoch": 1490} {"train_loss": -22.763490676879883, "global_step": 123719, "epoch": 1490} {"train_loss": -22.592397689819336, "global_step": 123720, "epoch": 1490} {"train_loss": -22.803272247314453, "global_step": 123721, "epoch": 1490} {"train_loss": -22.796892166137695, "global_step": 123722, "epoch": 1490} {"train_loss": -22.443649291992188, "global_step": 123723, "epoch": 1490} {"train_loss": -22.68771743774414, "global_step": 123724, "epoch": 1490} {"train_loss": -22.973674774169922, "global_step": 123725, "epoch": 1490} {"train_loss": -22.749338150024414, "global_step": 123726, "epoch": 1490} {"train_loss": -22.795015335083008, "global_step": 123727, "epoch": 1490} {"train_loss": -22.90010643005371, "global_step": 123728, "epoch": 1490} {"train_loss": -22.79111671447754, "global_step": 123729, "epoch": 1490} {"train_loss": -22.835193634033203, "global_step": 123730, "epoch": 1490} {"train_loss": -22.646862030029297, "global_step": 123731, "epoch": 1490} {"train_loss": -22.354700088500977, "global_step": 123732, "epoch": 1490} {"train_loss": -22.915254592895508, "global_step": 123733, "epoch": 1490} {"train_loss": -22.92658805847168, "global_step": 123734, "epoch": 1490} {"train_loss": -22.608121871948242, "global_step": 123735, "epoch": 1490} {"train_loss": -22.530853271484375, "global_step": 123736, "epoch": 1490} {"train_loss": -22.592355728149414, "global_step": 123737, "epoch": 1490} {"train_loss": -22.86227035522461, "global_step": 123738, "epoch": 1490} {"train_loss": -22.56694793701172, "global_step": 123739, "epoch": 1490} {"train_loss": -22.66351318359375, "global_step": 123740, "epoch": 1490} {"train_loss": -22.29465675354004, "global_step": 123741, "epoch": 1490} {"train_loss": -22.785425186157227, "global_step": 123742, "epoch": 1490} {"train_loss": -22.910451889038086, "global_step": 123743, "epoch": 1490} {"train_loss": -22.844003677368164, "global_step": 123744, "epoch": 1490} {"train_loss": -22.84212875366211, "global_step": 123745, "epoch": 1490} {"train_loss": -22.53553009033203, "global_step": 123746, "epoch": 1490} {"train_loss": -22.670406341552734, "global_step": 123747, "epoch": 1490} {"train_loss": -22.35123634338379, "global_step": 123748, "epoch": 1490} {"train_loss": -22.419042587280273, "global_step": 123749, "epoch": 1490} {"train_loss": -22.291650772094727, "global_step": 123750, "epoch": 1490} {"train_loss": -22.328765869140625, "global_step": 123751, "epoch": 1490} {"train_loss": -22.63910049989999, "global_step": 123752, "epoch": 1490, "val_loss": 6213757.0} {"train_loss": -20.364652633666992, "global_step": 123753, "epoch": 1491} {"train_loss": -20.147863388061523, "global_step": 123754, "epoch": 1491} {"train_loss": -20.454833984375, "global_step": 123755, "epoch": 1491} {"train_loss": -20.880979537963867, "global_step": 123756, "epoch": 1491} {"train_loss": -20.664188385009766, "global_step": 123757, "epoch": 1491} {"train_loss": -21.533781051635742, "global_step": 123758, "epoch": 1491} {"train_loss": -21.087385177612305, "global_step": 123759, "epoch": 1491} {"train_loss": -21.709096908569336, "global_step": 123760, "epoch": 1491} {"train_loss": -21.669401168823242, "global_step": 123761, "epoch": 1491} {"train_loss": -21.8604793548584, "global_step": 123762, "epoch": 1491} {"train_loss": -21.40894889831543, "global_step": 123763, "epoch": 1491} {"train_loss": -21.87381935119629, "global_step": 123764, "epoch": 1491} {"train_loss": -21.5891056060791, "global_step": 123765, "epoch": 1491} {"train_loss": -21.962894439697266, "global_step": 123766, "epoch": 1491} {"train_loss": -21.759653091430664, "global_step": 123767, "epoch": 1491} {"train_loss": -21.91412925720215, "global_step": 123768, "epoch": 1491} {"train_loss": -21.912193298339844, "global_step": 123769, "epoch": 1491} {"train_loss": -21.767866134643555, "global_step": 123770, "epoch": 1491} {"train_loss": -22.135116577148438, "global_step": 123771, "epoch": 1491} {"train_loss": -22.041736602783203, "global_step": 123772, "epoch": 1491} {"train_loss": -22.18535041809082, "global_step": 123773, "epoch": 1491} {"train_loss": -22.054075241088867, "global_step": 123774, "epoch": 1491} {"train_loss": -22.043676376342773, "global_step": 123775, "epoch": 1491} {"train_loss": -22.131072998046875, "global_step": 123776, "epoch": 1491} {"train_loss": -22.33146095275879, "global_step": 123777, "epoch": 1491} {"train_loss": -22.43562889099121, "global_step": 123778, "epoch": 1491} {"train_loss": -22.373748779296875, "global_step": 123779, "epoch": 1491} {"train_loss": -22.39985466003418, "global_step": 123780, "epoch": 1491} {"train_loss": -22.607421875, "global_step": 123781, "epoch": 1491} {"train_loss": -22.22772216796875, "global_step": 123782, "epoch": 1491} {"train_loss": -22.069433212280273, "global_step": 123783, "epoch": 1491} {"train_loss": -22.51649284362793, "global_step": 123784, "epoch": 1491} {"train_loss": -22.377450942993164, "global_step": 123785, "epoch": 1491} {"train_loss": -22.774383544921875, "global_step": 123786, "epoch": 1491} {"train_loss": -22.775609970092773, "global_step": 123787, "epoch": 1491} {"train_loss": -22.59015655517578, "global_step": 123788, "epoch": 1491} {"train_loss": -22.802289962768555, "global_step": 123789, "epoch": 1491} {"train_loss": -22.85993766784668, "global_step": 123790, "epoch": 1491} {"train_loss": -22.434955596923828, "global_step": 123791, "epoch": 1491} {"train_loss": -22.53524398803711, "global_step": 123792, "epoch": 1491} {"train_loss": -22.575881958007812, "global_step": 123793, "epoch": 1491} {"train_loss": -22.37148094177246, "global_step": 123794, "epoch": 1491} {"train_loss": -22.82622528076172, "global_step": 123795, "epoch": 1491} {"train_loss": -22.49311637878418, "global_step": 123796, "epoch": 1491} {"train_loss": -22.613744735717773, "global_step": 123797, "epoch": 1491} {"train_loss": -22.713098526000977, "global_step": 123798, "epoch": 1491} {"train_loss": -22.744800567626953, "global_step": 123799, "epoch": 1491} {"train_loss": -22.56056785583496, "global_step": 123800, "epoch": 1491} {"train_loss": -22.704410552978516, "global_step": 123801, "epoch": 1491} {"train_loss": -22.58006477355957, "global_step": 123802, "epoch": 1491} {"train_loss": -22.463245391845703, "global_step": 123803, "epoch": 1491} {"train_loss": -22.97383689880371, "global_step": 123804, "epoch": 1491} {"train_loss": -22.72905921936035, "global_step": 123805, "epoch": 1491} {"train_loss": -22.5915584564209, "global_step": 123806, "epoch": 1491} {"train_loss": -22.846464157104492, "global_step": 123807, "epoch": 1491} {"train_loss": -22.606599807739258, "global_step": 123808, "epoch": 1491} {"train_loss": -22.774877548217773, "global_step": 123809, "epoch": 1491} {"train_loss": -22.525190353393555, "global_step": 123810, "epoch": 1491} {"train_loss": -22.551288604736328, "global_step": 123811, "epoch": 1491} {"train_loss": -22.674535751342773, "global_step": 123812, "epoch": 1491} {"train_loss": -22.34157371520996, "global_step": 123813, "epoch": 1491} {"train_loss": -22.449554443359375, "global_step": 123814, "epoch": 1491} {"train_loss": -22.688840866088867, "global_step": 123815, "epoch": 1491} {"train_loss": -22.60700798034668, "global_step": 123816, "epoch": 1491} {"train_loss": -22.172941207885742, "global_step": 123817, "epoch": 1491} {"train_loss": -22.495967864990234, "global_step": 123818, "epoch": 1491} {"train_loss": -22.562955856323242, "global_step": 123819, "epoch": 1491} {"train_loss": -22.62381935119629, "global_step": 123820, "epoch": 1491} {"train_loss": -22.4440860748291, "global_step": 123821, "epoch": 1491} {"train_loss": -22.263181686401367, "global_step": 123822, "epoch": 1491} {"train_loss": -22.481225967407227, "global_step": 123823, "epoch": 1491} {"train_loss": -22.518081665039062, "global_step": 123824, "epoch": 1491} {"train_loss": -22.31941795349121, "global_step": 123825, "epoch": 1491} {"train_loss": -22.408016204833984, "global_step": 123826, "epoch": 1491} {"train_loss": -22.893810272216797, "global_step": 123827, "epoch": 1491} {"train_loss": -22.4183292388916, "global_step": 123828, "epoch": 1491} {"train_loss": -22.294631958007812, "global_step": 123829, "epoch": 1491} {"train_loss": -22.349546432495117, "global_step": 123830, "epoch": 1491} {"train_loss": -22.788955688476562, "global_step": 123831, "epoch": 1491} {"train_loss": -22.492441177368164, "global_step": 123832, "epoch": 1491} {"train_loss": -22.50201988220215, "global_step": 123833, "epoch": 1491} {"train_loss": -22.829879760742188, "global_step": 123834, "epoch": 1491} {"train_loss": -22.27004520002618, "global_step": 123835, "epoch": 1491, "val_loss": 6247083.5} {"train_loss": -22.371898651123047, "global_step": 123836, "epoch": 1492} {"train_loss": -22.135961532592773, "global_step": 123837, "epoch": 1492} {"train_loss": -22.497085571289062, "global_step": 123838, "epoch": 1492} {"train_loss": -22.636173248291016, "global_step": 123839, "epoch": 1492} {"train_loss": -22.259435653686523, "global_step": 123840, "epoch": 1492} {"train_loss": -22.527896881103516, "global_step": 123841, "epoch": 1492} {"train_loss": -22.381324768066406, "global_step": 123842, "epoch": 1492} {"train_loss": -21.948223114013672, "global_step": 123843, "epoch": 1492} {"train_loss": -22.52518081665039, "global_step": 123844, "epoch": 1492} {"train_loss": -22.37470054626465, "global_step": 123845, "epoch": 1492} {"train_loss": -22.40878677368164, "global_step": 123846, "epoch": 1492} {"train_loss": -22.59975242614746, "global_step": 123847, "epoch": 1492} {"train_loss": -22.551321029663086, "global_step": 123848, "epoch": 1492} {"train_loss": -23.016372680664062, "global_step": 123849, "epoch": 1492} {"train_loss": -22.396102905273438, "global_step": 123850, "epoch": 1492} {"train_loss": -22.72675895690918, "global_step": 123851, "epoch": 1492} {"train_loss": -22.5966854095459, "global_step": 123852, "epoch": 1492} {"train_loss": -22.76612091064453, "global_step": 123853, "epoch": 1492} {"train_loss": -22.796323776245117, "global_step": 123854, "epoch": 1492} {"train_loss": -22.360511779785156, "global_step": 123855, "epoch": 1492} {"train_loss": -22.665674209594727, "global_step": 123856, "epoch": 1492} {"train_loss": -23.00872230529785, "global_step": 123857, "epoch": 1492} {"train_loss": -22.603885650634766, "global_step": 123858, "epoch": 1492} {"train_loss": -22.995447158813477, "global_step": 123859, "epoch": 1492} {"train_loss": -23.09651756286621, "global_step": 123860, "epoch": 1492} {"train_loss": -22.59854507446289, "global_step": 123861, "epoch": 1492} {"train_loss": -22.753110885620117, "global_step": 123862, "epoch": 1492} {"train_loss": -22.628896713256836, "global_step": 123863, "epoch": 1492} {"train_loss": -22.49544906616211, "global_step": 123864, "epoch": 1492} {"train_loss": -22.686765670776367, "global_step": 123865, "epoch": 1492} {"train_loss": -22.925222396850586, "global_step": 123866, "epoch": 1492} {"train_loss": -22.794267654418945, "global_step": 123867, "epoch": 1492} {"train_loss": -22.822168350219727, "global_step": 123868, "epoch": 1492} {"train_loss": -22.541126251220703, "global_step": 123869, "epoch": 1492} {"train_loss": -22.456016540527344, "global_step": 123870, "epoch": 1492} {"train_loss": -23.003053665161133, "global_step": 123871, "epoch": 1492} {"train_loss": -22.591060638427734, "global_step": 123872, "epoch": 1492} {"train_loss": -22.914716720581055, "global_step": 123873, "epoch": 1492} {"train_loss": -22.693220138549805, "global_step": 123874, "epoch": 1492} {"train_loss": -23.060346603393555, "global_step": 123875, "epoch": 1492} {"train_loss": -22.351852416992188, "global_step": 123876, "epoch": 1492} {"train_loss": -22.63572120666504, "global_step": 123877, "epoch": 1492} {"train_loss": -22.37637710571289, "global_step": 123878, "epoch": 1492} {"train_loss": -22.565034866333008, "global_step": 123879, "epoch": 1492} {"train_loss": -22.790281295776367, "global_step": 123880, "epoch": 1492} {"train_loss": -22.427785873413086, "global_step": 123881, "epoch": 1492} {"train_loss": -22.4462947845459, "global_step": 123882, "epoch": 1492} {"train_loss": -22.62830924987793, "global_step": 123883, "epoch": 1492} {"train_loss": -22.67511558532715, "global_step": 123884, "epoch": 1492} {"train_loss": -22.555849075317383, "global_step": 123885, "epoch": 1492} {"train_loss": -22.98725700378418, "global_step": 123886, "epoch": 1492} {"train_loss": -22.7313175201416, "global_step": 123887, "epoch": 1492} {"train_loss": -22.49615478515625, "global_step": 123888, "epoch": 1492} {"train_loss": -22.7485408782959, "global_step": 123889, "epoch": 1492} {"train_loss": -22.638446807861328, "global_step": 123890, "epoch": 1492} {"train_loss": -22.743064880371094, "global_step": 123891, "epoch": 1492} {"train_loss": -22.724489212036133, "global_step": 123892, "epoch": 1492} {"train_loss": -22.401391983032227, "global_step": 123893, "epoch": 1492} {"train_loss": -22.06545066833496, "global_step": 123894, "epoch": 1492} {"train_loss": -22.644750595092773, "global_step": 123895, "epoch": 1492} {"train_loss": -22.31035804748535, "global_step": 123896, "epoch": 1492} {"train_loss": -22.418210983276367, "global_step": 123897, "epoch": 1492} {"train_loss": -22.562875747680664, "global_step": 123898, "epoch": 1492} {"train_loss": -22.728769302368164, "global_step": 123899, "epoch": 1492} {"train_loss": -22.74017906188965, "global_step": 123900, "epoch": 1492} {"train_loss": -22.623014450073242, "global_step": 123901, "epoch": 1492} {"train_loss": -22.57794189453125, "global_step": 123902, "epoch": 1492} {"train_loss": -22.922935485839844, "global_step": 123903, "epoch": 1492} {"train_loss": -22.7736873626709, "global_step": 123904, "epoch": 1492} {"train_loss": -22.500125885009766, "global_step": 123905, "epoch": 1492} {"train_loss": -22.10181427001953, "global_step": 123906, "epoch": 1492} {"train_loss": -22.034635543823242, "global_step": 123907, "epoch": 1492} {"train_loss": -22.389240264892578, "global_step": 123908, "epoch": 1492} {"train_loss": -22.739681243896484, "global_step": 123909, "epoch": 1492} {"train_loss": -22.650592803955078, "global_step": 123910, "epoch": 1492} {"train_loss": -22.460479736328125, "global_step": 123911, "epoch": 1492} {"train_loss": -22.39398956298828, "global_step": 123912, "epoch": 1492} {"train_loss": -22.598417282104492, "global_step": 123913, "epoch": 1492} {"train_loss": -22.585397720336914, "global_step": 123914, "epoch": 1492} {"train_loss": -22.326602935791016, "global_step": 123915, "epoch": 1492} {"train_loss": -23.085996627807617, "global_step": 123916, "epoch": 1492} {"train_loss": -22.615182876586914, "global_step": 123917, "epoch": 1492} {"train_loss": -22.591441257890448, "global_step": 123918, "epoch": 1492, "val_loss": 6247337.5} {"train_loss": -22.626155853271484, "global_step": 123919, "epoch": 1493} {"train_loss": -22.8974552154541, "global_step": 123920, "epoch": 1493} {"train_loss": -22.40995216369629, "global_step": 123921, "epoch": 1493} {"train_loss": -22.60420799255371, "global_step": 123922, "epoch": 1493} {"train_loss": -22.610984802246094, "global_step": 123923, "epoch": 1493} {"train_loss": -22.73596954345703, "global_step": 123924, "epoch": 1493} {"train_loss": -22.2066707611084, "global_step": 123925, "epoch": 1493} {"train_loss": -22.378732681274414, "global_step": 123926, "epoch": 1493} {"train_loss": -22.554935455322266, "global_step": 123927, "epoch": 1493} {"train_loss": -22.790573120117188, "global_step": 123928, "epoch": 1493} {"train_loss": -22.575658798217773, "global_step": 123929, "epoch": 1493} {"train_loss": -22.50942039489746, "global_step": 123930, "epoch": 1493} {"train_loss": -22.39931869506836, "global_step": 123931, "epoch": 1493} {"train_loss": -22.557287216186523, "global_step": 123932, "epoch": 1493} {"train_loss": -22.937376022338867, "global_step": 123933, "epoch": 1493} {"train_loss": -22.41553497314453, "global_step": 123934, "epoch": 1493} {"train_loss": -22.350553512573242, "global_step": 123935, "epoch": 1493} {"train_loss": -22.843372344970703, "global_step": 123936, "epoch": 1493} {"train_loss": -22.373886108398438, "global_step": 123937, "epoch": 1493} {"train_loss": -22.862756729125977, "global_step": 123938, "epoch": 1493} {"train_loss": -22.339262008666992, "global_step": 123939, "epoch": 1493} {"train_loss": -22.675674438476562, "global_step": 123940, "epoch": 1493} {"train_loss": -22.96816062927246, "global_step": 123941, "epoch": 1493} {"train_loss": -22.982267379760742, "global_step": 123942, "epoch": 1493} {"train_loss": -22.683273315429688, "global_step": 123943, "epoch": 1493} {"train_loss": -22.38238525390625, "global_step": 123944, "epoch": 1493} {"train_loss": -22.581836700439453, "global_step": 123945, "epoch": 1493} {"train_loss": -22.65401268005371, "global_step": 123946, "epoch": 1493} {"train_loss": -21.810800552368164, "global_step": 123947, "epoch": 1493} {"train_loss": -22.656917572021484, "global_step": 123948, "epoch": 1493} {"train_loss": -22.353076934814453, "global_step": 123949, "epoch": 1493} {"train_loss": -22.626235961914062, "global_step": 123950, "epoch": 1493} {"train_loss": -22.612478256225586, "global_step": 123951, "epoch": 1493} {"train_loss": -22.46921730041504, "global_step": 123952, "epoch": 1493} {"train_loss": -22.215547561645508, "global_step": 123953, "epoch": 1493} {"train_loss": -22.943010330200195, "global_step": 123954, "epoch": 1493} {"train_loss": -22.16043472290039, "global_step": 123955, "epoch": 1493} {"train_loss": -22.69771385192871, "global_step": 123956, "epoch": 1493} {"train_loss": -22.82267189025879, "global_step": 123957, "epoch": 1493} {"train_loss": -22.783498764038086, "global_step": 123958, "epoch": 1493} {"train_loss": -22.760028839111328, "global_step": 123959, "epoch": 1493} {"train_loss": -22.301130294799805, "global_step": 123960, "epoch": 1493} {"train_loss": -22.82337188720703, "global_step": 123961, "epoch": 1493} {"train_loss": -22.578540802001953, "global_step": 123962, "epoch": 1493} {"train_loss": -22.573877334594727, "global_step": 123963, "epoch": 1493} {"train_loss": -22.192638397216797, "global_step": 123964, "epoch": 1493} {"train_loss": -22.395370483398438, "global_step": 123965, "epoch": 1493} {"train_loss": -22.74219512939453, "global_step": 123966, "epoch": 1493} {"train_loss": -22.44365882873535, "global_step": 123967, "epoch": 1493} {"train_loss": -22.52364158630371, "global_step": 123968, "epoch": 1493} {"train_loss": -22.539609909057617, "global_step": 123969, "epoch": 1493} {"train_loss": -22.761947631835938, "global_step": 123970, "epoch": 1493} {"train_loss": -22.227664947509766, "global_step": 123971, "epoch": 1493} {"train_loss": -22.709335327148438, "global_step": 123972, "epoch": 1493} {"train_loss": -22.62541389465332, "global_step": 123973, "epoch": 1493} {"train_loss": -22.77192497253418, "global_step": 123974, "epoch": 1493} {"train_loss": -22.701156616210938, "global_step": 123975, "epoch": 1493} {"train_loss": -22.47810935974121, "global_step": 123976, "epoch": 1493} {"train_loss": -22.77151870727539, "global_step": 123977, "epoch": 1493} {"train_loss": -22.447908401489258, "global_step": 123978, "epoch": 1493} {"train_loss": -22.766056060791016, "global_step": 123979, "epoch": 1493} {"train_loss": -22.825725555419922, "global_step": 123980, "epoch": 1493} {"train_loss": -22.8299503326416, "global_step": 123981, "epoch": 1493} {"train_loss": -22.891942977905273, "global_step": 123982, "epoch": 1493} {"train_loss": -22.968647003173828, "global_step": 123983, "epoch": 1493} {"train_loss": -22.576953887939453, "global_step": 123984, "epoch": 1493} {"train_loss": -22.284820556640625, "global_step": 123985, "epoch": 1493} {"train_loss": -22.561094284057617, "global_step": 123986, "epoch": 1493} {"train_loss": -22.806760787963867, "global_step": 123987, "epoch": 1493} {"train_loss": -22.46845817565918, "global_step": 123988, "epoch": 1493} {"train_loss": -22.185087203979492, "global_step": 123989, "epoch": 1493} {"train_loss": -22.306053161621094, "global_step": 123990, "epoch": 1493} {"train_loss": -22.498302459716797, "global_step": 123991, "epoch": 1493} {"train_loss": -21.78464698791504, "global_step": 123992, "epoch": 1493} {"train_loss": -22.598133087158203, "global_step": 123993, "epoch": 1493} {"train_loss": -22.352893829345703, "global_step": 123994, "epoch": 1493} {"train_loss": -22.508525848388672, "global_step": 123995, "epoch": 1493} {"train_loss": -22.49940299987793, "global_step": 123996, "epoch": 1493} {"train_loss": -21.948789596557617, "global_step": 123997, "epoch": 1493} {"train_loss": -22.27133560180664, "global_step": 123998, "epoch": 1493} {"train_loss": -22.08893394470215, "global_step": 123999, "epoch": 1493} {"train_loss": -22.566768646240234, "global_step": 124000, "epoch": 1493} {"train_loss": -22.543128852384637, "global_step": 124001, "epoch": 1493, "val_loss": 6204524.0} {"train_loss": -21.373661041259766, "global_step": 124002, "epoch": 1494} {"train_loss": -22.392593383789062, "global_step": 124003, "epoch": 1494} {"train_loss": -21.213422775268555, "global_step": 124004, "epoch": 1494} {"train_loss": -22.337589263916016, "global_step": 124005, "epoch": 1494} {"train_loss": -21.748106002807617, "global_step": 124006, "epoch": 1494} {"train_loss": -22.228403091430664, "global_step": 124007, "epoch": 1494} {"train_loss": -22.158658981323242, "global_step": 124008, "epoch": 1494} {"train_loss": -22.272171020507812, "global_step": 124009, "epoch": 1494} {"train_loss": -21.902204513549805, "global_step": 124010, "epoch": 1494} {"train_loss": -22.00038719177246, "global_step": 124011, "epoch": 1494} {"train_loss": -22.521610260009766, "global_step": 124012, "epoch": 1494} {"train_loss": -22.277952194213867, "global_step": 124013, "epoch": 1494} {"train_loss": -22.69411277770996, "global_step": 124014, "epoch": 1494} {"train_loss": -22.319599151611328, "global_step": 124015, "epoch": 1494} {"train_loss": -22.47199058532715, "global_step": 124016, "epoch": 1494} {"train_loss": -22.559934616088867, "global_step": 124017, "epoch": 1494} {"train_loss": -22.54558753967285, "global_step": 124018, "epoch": 1494} {"train_loss": -22.503658294677734, "global_step": 124019, "epoch": 1494} {"train_loss": -22.39139175415039, "global_step": 124020, "epoch": 1494} {"train_loss": -22.67721939086914, "global_step": 124021, "epoch": 1494} {"train_loss": -22.445451736450195, "global_step": 124022, "epoch": 1494} {"train_loss": -22.585025787353516, "global_step": 124023, "epoch": 1494} {"train_loss": -22.55953598022461, "global_step": 124024, "epoch": 1494} {"train_loss": -22.46504020690918, "global_step": 124025, "epoch": 1494} {"train_loss": -22.77029800415039, "global_step": 124026, "epoch": 1494} {"train_loss": -22.388578414916992, "global_step": 124027, "epoch": 1494} {"train_loss": -22.562976837158203, "global_step": 124028, "epoch": 1494} {"train_loss": -22.703697204589844, "global_step": 124029, "epoch": 1494} {"train_loss": -22.73263931274414, "global_step": 124030, "epoch": 1494} {"train_loss": -22.91498374938965, "global_step": 124031, "epoch": 1494} {"train_loss": -23.046384811401367, "global_step": 124032, "epoch": 1494} {"train_loss": -22.569862365722656, "global_step": 124033, "epoch": 1494} {"train_loss": -22.710067749023438, "global_step": 124034, "epoch": 1494} {"train_loss": -22.756301879882812, "global_step": 124035, "epoch": 1494} {"train_loss": -22.649213790893555, "global_step": 124036, "epoch": 1494} {"train_loss": -22.679920196533203, "global_step": 124037, "epoch": 1494} {"train_loss": -22.598615646362305, "global_step": 124038, "epoch": 1494} {"train_loss": -22.716493606567383, "global_step": 124039, "epoch": 1494} {"train_loss": -22.671064376831055, "global_step": 124040, "epoch": 1494} {"train_loss": -22.77579116821289, "global_step": 124041, "epoch": 1494} {"train_loss": -22.37470054626465, "global_step": 124042, "epoch": 1494} {"train_loss": -22.654081344604492, "global_step": 124043, "epoch": 1494} {"train_loss": -22.76829719543457, "global_step": 124044, "epoch": 1494} {"train_loss": -22.275075912475586, "global_step": 124045, "epoch": 1494} {"train_loss": -22.76598358154297, "global_step": 124046, "epoch": 1494} {"train_loss": -22.85107421875, "global_step": 124047, "epoch": 1494} {"train_loss": -23.0666446685791, "global_step": 124048, "epoch": 1494} {"train_loss": -22.980005264282227, "global_step": 124049, "epoch": 1494} {"train_loss": -22.978961944580078, "global_step": 124050, "epoch": 1494} {"train_loss": -22.917497634887695, "global_step": 124051, "epoch": 1494} {"train_loss": -22.867937088012695, "global_step": 124052, "epoch": 1494} {"train_loss": -22.59822654724121, "global_step": 124053, "epoch": 1494} {"train_loss": -22.849910736083984, "global_step": 124054, "epoch": 1494} {"train_loss": -22.974546432495117, "global_step": 124055, "epoch": 1494} {"train_loss": -23.041488647460938, "global_step": 124056, "epoch": 1494} {"train_loss": -22.707468032836914, "global_step": 124057, "epoch": 1494} {"train_loss": -22.568506240844727, "global_step": 124058, "epoch": 1494} {"train_loss": -22.6768741607666, "global_step": 124059, "epoch": 1494} {"train_loss": -22.8714599609375, "global_step": 124060, "epoch": 1494} {"train_loss": -22.470762252807617, "global_step": 124061, "epoch": 1494} {"train_loss": -22.736038208007812, "global_step": 124062, "epoch": 1494} {"train_loss": -22.75733757019043, "global_step": 124063, "epoch": 1494} {"train_loss": -22.389957427978516, "global_step": 124064, "epoch": 1494} {"train_loss": -22.74867057800293, "global_step": 124065, "epoch": 1494} {"train_loss": -22.512372970581055, "global_step": 124066, "epoch": 1494} {"train_loss": -22.937347412109375, "global_step": 124067, "epoch": 1494} {"train_loss": -22.4397029876709, "global_step": 124068, "epoch": 1494} {"train_loss": -23.037107467651367, "global_step": 124069, "epoch": 1494} {"train_loss": -22.926294326782227, "global_step": 124070, "epoch": 1494} {"train_loss": -22.949636459350586, "global_step": 124071, "epoch": 1494} {"train_loss": -22.772958755493164, "global_step": 124072, "epoch": 1494} {"train_loss": -22.598098754882812, "global_step": 124073, "epoch": 1494} {"train_loss": -22.622299194335938, "global_step": 124074, "epoch": 1494} {"train_loss": -22.476282119750977, "global_step": 124075, "epoch": 1494} {"train_loss": -22.52328109741211, "global_step": 124076, "epoch": 1494} {"train_loss": -22.93113136291504, "global_step": 124077, "epoch": 1494} {"train_loss": -22.99579429626465, "global_step": 124078, "epoch": 1494} {"train_loss": -22.696847915649414, "global_step": 124079, "epoch": 1494} {"train_loss": -22.539295196533203, "global_step": 124080, "epoch": 1494} {"train_loss": -22.548620223999023, "global_step": 124081, "epoch": 1494} {"train_loss": -22.470680236816406, "global_step": 124082, "epoch": 1494} {"train_loss": -22.733428955078125, "global_step": 124083, "epoch": 1494} {"train_loss": -22.60187650014119, "global_step": 124084, "epoch": 1494, "val_loss": 6259091.5} {"train_loss": -22.275527954101562, "global_step": 124085, "epoch": 1495} {"train_loss": -22.34473991394043, "global_step": 124086, "epoch": 1495} {"train_loss": -21.957815170288086, "global_step": 124087, "epoch": 1495} {"train_loss": -22.249176025390625, "global_step": 124088, "epoch": 1495} {"train_loss": -22.71054458618164, "global_step": 124089, "epoch": 1495} {"train_loss": -21.727415084838867, "global_step": 124090, "epoch": 1495} {"train_loss": -21.73955726623535, "global_step": 124091, "epoch": 1495} {"train_loss": -22.032690048217773, "global_step": 124092, "epoch": 1495} {"train_loss": -22.2721004486084, "global_step": 124093, "epoch": 1495} {"train_loss": -22.261640548706055, "global_step": 124094, "epoch": 1495} {"train_loss": -21.727109909057617, "global_step": 124095, "epoch": 1495} {"train_loss": -22.41550636291504, "global_step": 124096, "epoch": 1495} {"train_loss": -22.591581344604492, "global_step": 124097, "epoch": 1495} {"train_loss": -22.267101287841797, "global_step": 124098, "epoch": 1495} {"train_loss": -22.475452423095703, "global_step": 124099, "epoch": 1495} {"train_loss": -21.9266357421875, "global_step": 124100, "epoch": 1495} {"train_loss": -22.282283782958984, "global_step": 124101, "epoch": 1495} {"train_loss": -22.25177574157715, "global_step": 124102, "epoch": 1495} {"train_loss": -22.571271896362305, "global_step": 124103, "epoch": 1495} {"train_loss": -22.299564361572266, "global_step": 124104, "epoch": 1495} {"train_loss": -22.194461822509766, "global_step": 124105, "epoch": 1495} {"train_loss": -22.550067901611328, "global_step": 124106, "epoch": 1495} {"train_loss": -22.730382919311523, "global_step": 124107, "epoch": 1495} {"train_loss": -22.798982620239258, "global_step": 124108, "epoch": 1495} {"train_loss": -22.55116844177246, "global_step": 124109, "epoch": 1495} {"train_loss": -22.629844665527344, "global_step": 124110, "epoch": 1495} {"train_loss": -22.58403968811035, "global_step": 124111, "epoch": 1495} {"train_loss": -22.640573501586914, "global_step": 124112, "epoch": 1495} {"train_loss": -22.703367233276367, "global_step": 124113, "epoch": 1495} {"train_loss": -22.855411529541016, "global_step": 124114, "epoch": 1495} {"train_loss": -22.69904899597168, "global_step": 124115, "epoch": 1495} {"train_loss": -22.594804763793945, "global_step": 124116, "epoch": 1495} {"train_loss": -22.64223289489746, "global_step": 124117, "epoch": 1495} {"train_loss": -22.89415740966797, "global_step": 124118, "epoch": 1495} {"train_loss": -22.664138793945312, "global_step": 124119, "epoch": 1495} {"train_loss": -22.124282836914062, "global_step": 124120, "epoch": 1495} {"train_loss": -22.636606216430664, "global_step": 124121, "epoch": 1495} {"train_loss": -22.35389518737793, "global_step": 124122, "epoch": 1495} {"train_loss": -22.32209587097168, "global_step": 124123, "epoch": 1495} {"train_loss": -22.6020565032959, "global_step": 124124, "epoch": 1495} {"train_loss": -22.547353744506836, "global_step": 124125, "epoch": 1495} {"train_loss": -22.561973571777344, "global_step": 124126, "epoch": 1495} {"train_loss": -22.617856979370117, "global_step": 124127, "epoch": 1495} {"train_loss": -22.66511344909668, "global_step": 124128, "epoch": 1495} {"train_loss": -22.680448532104492, "global_step": 124129, "epoch": 1495} {"train_loss": -22.452308654785156, "global_step": 124130, "epoch": 1495} {"train_loss": -22.67970848083496, "global_step": 124131, "epoch": 1495} {"train_loss": -22.71573257446289, "global_step": 124132, "epoch": 1495} {"train_loss": -22.707353591918945, "global_step": 124133, "epoch": 1495} {"train_loss": -22.464317321777344, "global_step": 124134, "epoch": 1495} {"train_loss": -22.621383666992188, "global_step": 124135, "epoch": 1495} {"train_loss": -22.44898796081543, "global_step": 124136, "epoch": 1495} {"train_loss": -22.828372955322266, "global_step": 124137, "epoch": 1495} {"train_loss": -22.792877197265625, "global_step": 124138, "epoch": 1495} {"train_loss": -22.763883590698242, "global_step": 124139, "epoch": 1495} {"train_loss": -22.2985897064209, "global_step": 124140, "epoch": 1495} {"train_loss": -22.952953338623047, "global_step": 124141, "epoch": 1495} {"train_loss": -22.741254806518555, "global_step": 124142, "epoch": 1495} {"train_loss": -22.710813522338867, "global_step": 124143, "epoch": 1495} {"train_loss": -22.517986297607422, "global_step": 124144, "epoch": 1495} {"train_loss": -22.438039779663086, "global_step": 124145, "epoch": 1495} {"train_loss": -22.43520736694336, "global_step": 124146, "epoch": 1495} {"train_loss": -22.370670318603516, "global_step": 124147, "epoch": 1495} {"train_loss": -22.257909774780273, "global_step": 124148, "epoch": 1495} {"train_loss": -22.64789581298828, "global_step": 124149, "epoch": 1495} {"train_loss": -22.225473403930664, "global_step": 124150, "epoch": 1495} {"train_loss": -22.624509811401367, "global_step": 124151, "epoch": 1495} {"train_loss": -22.269981384277344, "global_step": 124152, "epoch": 1495} {"train_loss": -23.03055191040039, "global_step": 124153, "epoch": 1495} {"train_loss": -22.604761123657227, "global_step": 124154, "epoch": 1495} {"train_loss": -21.954504013061523, "global_step": 124155, "epoch": 1495} {"train_loss": -22.366792678833008, "global_step": 124156, "epoch": 1495} {"train_loss": -22.420982360839844, "global_step": 124157, "epoch": 1495} {"train_loss": -22.5902156829834, "global_step": 124158, "epoch": 1495} {"train_loss": -22.898456573486328, "global_step": 124159, "epoch": 1495} {"train_loss": -22.472623825073242, "global_step": 124160, "epoch": 1495} {"train_loss": -22.673480987548828, "global_step": 124161, "epoch": 1495} {"train_loss": -22.14595603942871, "global_step": 124162, "epoch": 1495} {"train_loss": -22.860448837280273, "global_step": 124163, "epoch": 1495} {"train_loss": -22.80401039123535, "global_step": 124164, "epoch": 1495} {"train_loss": -22.550430297851562, "global_step": 124165, "epoch": 1495} {"train_loss": -22.556304931640625, "global_step": 124166, "epoch": 1495} {"train_loss": -22.497902353125884, "global_step": 124167, "epoch": 1495, "val_loss": 6211237.0} {"train_loss": -22.017370223999023, "global_step": 124168, "epoch": 1496} {"train_loss": -23.21380615234375, "global_step": 124169, "epoch": 1496} {"train_loss": -22.507049560546875, "global_step": 124170, "epoch": 1496} {"train_loss": -22.312856674194336, "global_step": 124171, "epoch": 1496} {"train_loss": -22.821897506713867, "global_step": 124172, "epoch": 1496} {"train_loss": -22.701208114624023, "global_step": 124173, "epoch": 1496} {"train_loss": -22.033817291259766, "global_step": 124174, "epoch": 1496} {"train_loss": -22.647634506225586, "global_step": 124175, "epoch": 1496} {"train_loss": -22.48410415649414, "global_step": 124176, "epoch": 1496} {"train_loss": -22.365428924560547, "global_step": 124177, "epoch": 1496} {"train_loss": -22.49712562561035, "global_step": 124178, "epoch": 1496} {"train_loss": -22.391386032104492, "global_step": 124179, "epoch": 1496} {"train_loss": -22.750577926635742, "global_step": 124180, "epoch": 1496} {"train_loss": -22.301809310913086, "global_step": 124181, "epoch": 1496} {"train_loss": -22.764490127563477, "global_step": 124182, "epoch": 1496} {"train_loss": -22.803159713745117, "global_step": 124183, "epoch": 1496} {"train_loss": -22.64344596862793, "global_step": 124184, "epoch": 1496} {"train_loss": -22.710735321044922, "global_step": 124185, "epoch": 1496} {"train_loss": -22.71223258972168, "global_step": 124186, "epoch": 1496} {"train_loss": -22.667442321777344, "global_step": 124187, "epoch": 1496} {"train_loss": -22.488988876342773, "global_step": 124188, "epoch": 1496} {"train_loss": -22.488037109375, "global_step": 124189, "epoch": 1496} {"train_loss": -22.678647994995117, "global_step": 124190, "epoch": 1496} {"train_loss": -22.643287658691406, "global_step": 124191, "epoch": 1496} {"train_loss": -22.58379364013672, "global_step": 124192, "epoch": 1496} {"train_loss": -22.501922607421875, "global_step": 124193, "epoch": 1496} {"train_loss": -22.859220504760742, "global_step": 124194, "epoch": 1496} {"train_loss": -22.6431884765625, "global_step": 124195, "epoch": 1496} {"train_loss": -23.125539779663086, "global_step": 124196, "epoch": 1496} {"train_loss": -22.54201316833496, "global_step": 124197, "epoch": 1496} {"train_loss": -22.522886276245117, "global_step": 124198, "epoch": 1496} {"train_loss": -22.70681381225586, "global_step": 124199, "epoch": 1496} {"train_loss": -22.39761734008789, "global_step": 124200, "epoch": 1496} {"train_loss": -22.931459426879883, "global_step": 124201, "epoch": 1496} {"train_loss": -22.65620994567871, "global_step": 124202, "epoch": 1496} {"train_loss": -22.490652084350586, "global_step": 124203, "epoch": 1496} {"train_loss": -22.781667709350586, "global_step": 124204, "epoch": 1496} {"train_loss": -22.306440353393555, "global_step": 124205, "epoch": 1496} {"train_loss": -22.57035255432129, "global_step": 124206, "epoch": 1496} {"train_loss": -23.01734161376953, "global_step": 124207, "epoch": 1496} {"train_loss": -22.705869674682617, "global_step": 124208, "epoch": 1496} {"train_loss": -22.956266403198242, "global_step": 124209, "epoch": 1496} {"train_loss": -22.890348434448242, "global_step": 124210, "epoch": 1496} {"train_loss": -22.559890747070312, "global_step": 124211, "epoch": 1496} {"train_loss": -22.53306770324707, "global_step": 124212, "epoch": 1496} {"train_loss": -22.547561645507812, "global_step": 124213, "epoch": 1496} {"train_loss": -22.695898056030273, "global_step": 124214, "epoch": 1496} {"train_loss": -22.799955368041992, "global_step": 124215, "epoch": 1496} {"train_loss": -22.316577911376953, "global_step": 124216, "epoch": 1496} {"train_loss": -22.982358932495117, "global_step": 124217, "epoch": 1496} {"train_loss": -22.797922134399414, "global_step": 124218, "epoch": 1496} {"train_loss": -22.166629791259766, "global_step": 124219, "epoch": 1496} {"train_loss": -22.803543090820312, "global_step": 124220, "epoch": 1496} {"train_loss": -22.87803077697754, "global_step": 124221, "epoch": 1496} {"train_loss": -22.866750717163086, "global_step": 124222, "epoch": 1496} {"train_loss": -22.611143112182617, "global_step": 124223, "epoch": 1496} {"train_loss": -22.38684844970703, "global_step": 124224, "epoch": 1496} {"train_loss": -22.788625717163086, "global_step": 124225, "epoch": 1496} {"train_loss": -22.520414352416992, "global_step": 124226, "epoch": 1496} {"train_loss": -22.6051025390625, "global_step": 124227, "epoch": 1496} {"train_loss": -22.378698348999023, "global_step": 124228, "epoch": 1496} {"train_loss": -22.543731689453125, "global_step": 124229, "epoch": 1496} {"train_loss": -22.237884521484375, "global_step": 124230, "epoch": 1496} {"train_loss": -22.862241744995117, "global_step": 124231, "epoch": 1496} {"train_loss": -22.439517974853516, "global_step": 124232, "epoch": 1496} {"train_loss": -22.3857421875, "global_step": 124233, "epoch": 1496} {"train_loss": -22.706207275390625, "global_step": 124234, "epoch": 1496} {"train_loss": -22.599157333374023, "global_step": 124235, "epoch": 1496} {"train_loss": -22.310110092163086, "global_step": 124236, "epoch": 1496} {"train_loss": -22.783294677734375, "global_step": 124237, "epoch": 1496} {"train_loss": -22.38655662536621, "global_step": 124238, "epoch": 1496} {"train_loss": -22.70522117614746, "global_step": 124239, "epoch": 1496} {"train_loss": -22.605911254882812, "global_step": 124240, "epoch": 1496} {"train_loss": -22.5815486907959, "global_step": 124241, "epoch": 1496} {"train_loss": -22.786375045776367, "global_step": 124242, "epoch": 1496} {"train_loss": -22.480789184570312, "global_step": 124243, "epoch": 1496} {"train_loss": -22.76618766784668, "global_step": 124244, "epoch": 1496} {"train_loss": -22.74073600769043, "global_step": 124245, "epoch": 1496} {"train_loss": -22.74561882019043, "global_step": 124246, "epoch": 1496} {"train_loss": -23.03434181213379, "global_step": 124247, "epoch": 1496} {"train_loss": -22.76180076599121, "global_step": 124248, "epoch": 1496} {"train_loss": -22.835355758666992, "global_step": 124249, "epoch": 1496} {"train_loss": -22.632100852139025, "global_step": 124250, "epoch": 1496, "val_loss": 6225529.0} {"train_loss": -22.7502498626709, "global_step": 124251, "epoch": 1497} {"train_loss": -22.555782318115234, "global_step": 124252, "epoch": 1497} {"train_loss": -22.242279052734375, "global_step": 124253, "epoch": 1497} {"train_loss": -22.524518966674805, "global_step": 124254, "epoch": 1497} {"train_loss": -22.335134506225586, "global_step": 124255, "epoch": 1497} {"train_loss": -22.96848487854004, "global_step": 124256, "epoch": 1497} {"train_loss": -22.452112197875977, "global_step": 124257, "epoch": 1497} {"train_loss": -22.417709350585938, "global_step": 124258, "epoch": 1497} {"train_loss": -22.504989624023438, "global_step": 124259, "epoch": 1497} {"train_loss": -22.415782928466797, "global_step": 124260, "epoch": 1497} {"train_loss": -22.527420043945312, "global_step": 124261, "epoch": 1497} {"train_loss": -22.08526611328125, "global_step": 124262, "epoch": 1497} {"train_loss": -22.366947174072266, "global_step": 124263, "epoch": 1497} {"train_loss": -22.875232696533203, "global_step": 124264, "epoch": 1497} {"train_loss": -22.288297653198242, "global_step": 124265, "epoch": 1497} {"train_loss": -22.673572540283203, "global_step": 124266, "epoch": 1497} {"train_loss": -22.42580223083496, "global_step": 124267, "epoch": 1497} {"train_loss": -22.10863494873047, "global_step": 124268, "epoch": 1497} {"train_loss": -22.952842712402344, "global_step": 124269, "epoch": 1497} {"train_loss": -22.570222854614258, "global_step": 124270, "epoch": 1497} {"train_loss": -22.853769302368164, "global_step": 124271, "epoch": 1497} {"train_loss": -22.614654541015625, "global_step": 124272, "epoch": 1497} {"train_loss": -22.469985961914062, "global_step": 124273, "epoch": 1497} {"train_loss": -22.542919158935547, "global_step": 124274, "epoch": 1497} {"train_loss": -22.65476417541504, "global_step": 124275, "epoch": 1497} {"train_loss": -22.116819381713867, "global_step": 124276, "epoch": 1497} {"train_loss": -22.646957397460938, "global_step": 124277, "epoch": 1497} {"train_loss": -22.662683486938477, "global_step": 124278, "epoch": 1497} {"train_loss": -22.581445693969727, "global_step": 124279, "epoch": 1497} {"train_loss": -22.74095344543457, "global_step": 124280, "epoch": 1497} {"train_loss": -22.33882713317871, "global_step": 124281, "epoch": 1497} {"train_loss": -22.59578514099121, "global_step": 124282, "epoch": 1497} {"train_loss": -22.76071548461914, "global_step": 124283, "epoch": 1497} {"train_loss": -22.606201171875, "global_step": 124284, "epoch": 1497} {"train_loss": -22.624296188354492, "global_step": 124285, "epoch": 1497} {"train_loss": -22.624074935913086, "global_step": 124286, "epoch": 1497} {"train_loss": -22.789175033569336, "global_step": 124287, "epoch": 1497} {"train_loss": -22.5753116607666, "global_step": 124288, "epoch": 1497} {"train_loss": -22.725311279296875, "global_step": 124289, "epoch": 1497} {"train_loss": -22.68337631225586, "global_step": 124290, "epoch": 1497} {"train_loss": -22.312122344970703, "global_step": 124291, "epoch": 1497} {"train_loss": -22.641284942626953, "global_step": 124292, "epoch": 1497} {"train_loss": -22.507349014282227, "global_step": 124293, "epoch": 1497} {"train_loss": -22.471721649169922, "global_step": 124294, "epoch": 1497} {"train_loss": -22.780790328979492, "global_step": 124295, "epoch": 1497} {"train_loss": -22.560497283935547, "global_step": 124296, "epoch": 1497} {"train_loss": -22.641010284423828, "global_step": 124297, "epoch": 1497} {"train_loss": -22.78713035583496, "global_step": 124298, "epoch": 1497} {"train_loss": -22.740741729736328, "global_step": 124299, "epoch": 1497} {"train_loss": -22.500896453857422, "global_step": 124300, "epoch": 1497} {"train_loss": -23.08928871154785, "global_step": 124301, "epoch": 1497} {"train_loss": -22.667417526245117, "global_step": 124302, "epoch": 1497} {"train_loss": -22.61994743347168, "global_step": 124303, "epoch": 1497} {"train_loss": -22.422080993652344, "global_step": 124304, "epoch": 1497} {"train_loss": -22.707841873168945, "global_step": 124305, "epoch": 1497} {"train_loss": -22.487173080444336, "global_step": 124306, "epoch": 1497} {"train_loss": -22.391098022460938, "global_step": 124307, "epoch": 1497} {"train_loss": -22.851381301879883, "global_step": 124308, "epoch": 1497} {"train_loss": -22.662174224853516, "global_step": 124309, "epoch": 1497} {"train_loss": -22.685644149780273, "global_step": 124310, "epoch": 1497} {"train_loss": -22.535308837890625, "global_step": 124311, "epoch": 1497} {"train_loss": -22.920978546142578, "global_step": 124312, "epoch": 1497} {"train_loss": -22.517377853393555, "global_step": 124313, "epoch": 1497} {"train_loss": -22.774621963500977, "global_step": 124314, "epoch": 1497} {"train_loss": -22.43421173095703, "global_step": 124315, "epoch": 1497} {"train_loss": -22.723087310791016, "global_step": 124316, "epoch": 1497} {"train_loss": -22.77314567565918, "global_step": 124317, "epoch": 1497} {"train_loss": -22.775503158569336, "global_step": 124318, "epoch": 1497} {"train_loss": -22.85808563232422, "global_step": 124319, "epoch": 1497} {"train_loss": -22.63935661315918, "global_step": 124320, "epoch": 1497} {"train_loss": -22.479345321655273, "global_step": 124321, "epoch": 1497} {"train_loss": -22.82729148864746, "global_step": 124322, "epoch": 1497} {"train_loss": -22.812952041625977, "global_step": 124323, "epoch": 1497} {"train_loss": -22.825847625732422, "global_step": 124324, "epoch": 1497} {"train_loss": -22.97040367126465, "global_step": 124325, "epoch": 1497} {"train_loss": -22.931114196777344, "global_step": 124326, "epoch": 1497} {"train_loss": -22.67348289489746, "global_step": 124327, "epoch": 1497} {"train_loss": -22.19561767578125, "global_step": 124328, "epoch": 1497} {"train_loss": -22.5018367767334, "global_step": 124329, "epoch": 1497} {"train_loss": -22.611038208007812, "global_step": 124330, "epoch": 1497} {"train_loss": -22.771881103515625, "global_step": 124331, "epoch": 1497} {"train_loss": -22.758716583251953, "global_step": 124332, "epoch": 1497} {"train_loss": -22.600270236831115, "global_step": 124333, "epoch": 1497, "val_loss": 6241432.5} {"train_loss": -22.4227294921875, "global_step": 124334, "epoch": 1498} {"train_loss": -22.29196548461914, "global_step": 124335, "epoch": 1498} {"train_loss": -22.477792739868164, "global_step": 124336, "epoch": 1498} {"train_loss": -22.31973648071289, "global_step": 124337, "epoch": 1498} {"train_loss": -22.06073570251465, "global_step": 124338, "epoch": 1498} {"train_loss": -22.139026641845703, "global_step": 124339, "epoch": 1498} {"train_loss": -22.23261070251465, "global_step": 124340, "epoch": 1498} {"train_loss": -21.966758728027344, "global_step": 124341, "epoch": 1498} {"train_loss": -22.60560417175293, "global_step": 124342, "epoch": 1498} {"train_loss": -22.462390899658203, "global_step": 124343, "epoch": 1498} {"train_loss": -22.608726501464844, "global_step": 124344, "epoch": 1498} {"train_loss": -22.61317253112793, "global_step": 124345, "epoch": 1498} {"train_loss": -22.42401123046875, "global_step": 124346, "epoch": 1498} {"train_loss": -22.247838973999023, "global_step": 124347, "epoch": 1498} {"train_loss": -22.696077346801758, "global_step": 124348, "epoch": 1498} {"train_loss": -22.796382904052734, "global_step": 124349, "epoch": 1498} {"train_loss": -22.808921813964844, "global_step": 124350, "epoch": 1498} {"train_loss": -22.46763801574707, "global_step": 124351, "epoch": 1498} {"train_loss": -22.897886276245117, "global_step": 124352, "epoch": 1498} {"train_loss": -22.65468406677246, "global_step": 124353, "epoch": 1498} {"train_loss": -22.850168228149414, "global_step": 124354, "epoch": 1498} {"train_loss": -22.866649627685547, "global_step": 124355, "epoch": 1498} {"train_loss": -23.10320472717285, "global_step": 124356, "epoch": 1498} {"train_loss": -22.98427391052246, "global_step": 124357, "epoch": 1498} {"train_loss": -22.53573989868164, "global_step": 124358, "epoch": 1498} {"train_loss": -22.749195098876953, "global_step": 124359, "epoch": 1498} {"train_loss": -22.79361915588379, "global_step": 124360, "epoch": 1498} {"train_loss": -22.58100700378418, "global_step": 124361, "epoch": 1498} {"train_loss": -22.9822940826416, "global_step": 124362, "epoch": 1498} {"train_loss": -22.573169708251953, "global_step": 124363, "epoch": 1498} {"train_loss": -22.572528839111328, "global_step": 124364, "epoch": 1498} {"train_loss": -22.77927017211914, "global_step": 124365, "epoch": 1498} {"train_loss": -22.405353546142578, "global_step": 124366, "epoch": 1498} {"train_loss": -22.845657348632812, "global_step": 124367, "epoch": 1498} {"train_loss": -22.479652404785156, "global_step": 124368, "epoch": 1498} {"train_loss": -22.73945426940918, "global_step": 124369, "epoch": 1498} {"train_loss": -22.9583797454834, "global_step": 124370, "epoch": 1498} {"train_loss": -22.544675827026367, "global_step": 124371, "epoch": 1498} {"train_loss": -22.596994400024414, "global_step": 124372, "epoch": 1498} {"train_loss": -23.17613983154297, "global_step": 124373, "epoch": 1498} {"train_loss": -22.523008346557617, "global_step": 124374, "epoch": 1498} {"train_loss": -22.541460037231445, "global_step": 124375, "epoch": 1498} {"train_loss": -22.527143478393555, "global_step": 124376, "epoch": 1498} {"train_loss": -22.82870101928711, "global_step": 124377, "epoch": 1498} {"train_loss": -22.90304946899414, "global_step": 124378, "epoch": 1498} {"train_loss": -22.946571350097656, "global_step": 124379, "epoch": 1498} {"train_loss": -22.83420181274414, "global_step": 124380, "epoch": 1498} {"train_loss": -22.897586822509766, "global_step": 124381, "epoch": 1498} {"train_loss": -22.17035484313965, "global_step": 124382, "epoch": 1498} {"train_loss": -22.683425903320312, "global_step": 124383, "epoch": 1498} {"train_loss": -22.742923736572266, "global_step": 124384, "epoch": 1498} {"train_loss": -22.59583854675293, "global_step": 124385, "epoch": 1498} {"train_loss": -22.542800903320312, "global_step": 124386, "epoch": 1498} {"train_loss": -22.61046028137207, "global_step": 124387, "epoch": 1498} {"train_loss": -22.48444175720215, "global_step": 124388, "epoch": 1498} {"train_loss": -22.728784561157227, "global_step": 124389, "epoch": 1498} {"train_loss": -22.61004066467285, "global_step": 124390, "epoch": 1498} {"train_loss": -22.72836685180664, "global_step": 124391, "epoch": 1498} {"train_loss": -22.44925308227539, "global_step": 124392, "epoch": 1498} {"train_loss": -22.571304321289062, "global_step": 124393, "epoch": 1498} {"train_loss": -22.517276763916016, "global_step": 124394, "epoch": 1498} {"train_loss": -22.513656616210938, "global_step": 124395, "epoch": 1498} {"train_loss": -22.5455379486084, "global_step": 124396, "epoch": 1498} {"train_loss": -22.46553611755371, "global_step": 124397, "epoch": 1498} {"train_loss": -22.7695255279541, "global_step": 124398, "epoch": 1498} {"train_loss": -23.201139450073242, "global_step": 124399, "epoch": 1498} {"train_loss": -22.85106658935547, "global_step": 124400, "epoch": 1498} {"train_loss": -22.68561363220215, "global_step": 124401, "epoch": 1498} {"train_loss": -22.47043800354004, "global_step": 124402, "epoch": 1498} {"train_loss": -22.938533782958984, "global_step": 124403, "epoch": 1498} {"train_loss": -22.746044158935547, "global_step": 124404, "epoch": 1498} {"train_loss": -23.2879695892334, "global_step": 124405, "epoch": 1498} {"train_loss": -22.568326950073242, "global_step": 124406, "epoch": 1498} {"train_loss": -22.482824325561523, "global_step": 124407, "epoch": 1498} {"train_loss": -23.022226333618164, "global_step": 124408, "epoch": 1498} {"train_loss": -22.822002410888672, "global_step": 124409, "epoch": 1498} {"train_loss": -22.556861877441406, "global_step": 124410, "epoch": 1498} {"train_loss": -22.66302490234375, "global_step": 124411, "epoch": 1498} {"train_loss": -22.385709762573242, "global_step": 124412, "epoch": 1498} {"train_loss": -22.567533493041992, "global_step": 124413, "epoch": 1498} {"train_loss": -22.990934371948242, "global_step": 124414, "epoch": 1498} {"train_loss": -22.536056518554688, "global_step": 124415, "epoch": 1498} {"train_loss": -22.63054468545569, "global_step": 124416, "epoch": 1498, "val_loss": 6197010.0} {"train_loss": -22.00551414489746, "global_step": 124417, "epoch": 1499} {"train_loss": -21.631454467773438, "global_step": 124418, "epoch": 1499} {"train_loss": -22.214506149291992, "global_step": 124419, "epoch": 1499} {"train_loss": -22.00138282775879, "global_step": 124420, "epoch": 1499} {"train_loss": -22.101165771484375, "global_step": 124421, "epoch": 1499} {"train_loss": -22.363195419311523, "global_step": 124422, "epoch": 1499} {"train_loss": -21.466703414916992, "global_step": 124423, "epoch": 1499} {"train_loss": -22.51276206970215, "global_step": 124424, "epoch": 1499} {"train_loss": -21.835641860961914, "global_step": 124425, "epoch": 1499} {"train_loss": -22.253448486328125, "global_step": 124426, "epoch": 1499} {"train_loss": -22.039424896240234, "global_step": 124427, "epoch": 1499} {"train_loss": -22.242612838745117, "global_step": 124428, "epoch": 1499} {"train_loss": -22.261123657226562, "global_step": 124429, "epoch": 1499} {"train_loss": -22.543317794799805, "global_step": 124430, "epoch": 1499} {"train_loss": -21.984384536743164, "global_step": 124431, "epoch": 1499} {"train_loss": -22.641647338867188, "global_step": 124432, "epoch": 1499} {"train_loss": -22.53005027770996, "global_step": 124433, "epoch": 1499} {"train_loss": -22.28261375427246, "global_step": 124434, "epoch": 1499} {"train_loss": -22.40195655822754, "global_step": 124435, "epoch": 1499} {"train_loss": -23.00489044189453, "global_step": 124436, "epoch": 1499} {"train_loss": -22.31378746032715, "global_step": 124437, "epoch": 1499} {"train_loss": -22.483736038208008, "global_step": 124438, "epoch": 1499} {"train_loss": -22.718061447143555, "global_step": 124439, "epoch": 1499} {"train_loss": -22.41599464416504, "global_step": 124440, "epoch": 1499} {"train_loss": -22.807138442993164, "global_step": 124441, "epoch": 1499} {"train_loss": -22.787254333496094, "global_step": 124442, "epoch": 1499} {"train_loss": -22.569421768188477, "global_step": 124443, "epoch": 1499} {"train_loss": -22.60736083984375, "global_step": 124444, "epoch": 1499} {"train_loss": -23.10264015197754, "global_step": 124445, "epoch": 1499} {"train_loss": -22.721206665039062, "global_step": 124446, "epoch": 1499} {"train_loss": -22.873699188232422, "global_step": 124447, "epoch": 1499} {"train_loss": -22.707223892211914, "global_step": 124448, "epoch": 1499} {"train_loss": -22.783742904663086, "global_step": 124449, "epoch": 1499} {"train_loss": -22.315160751342773, "global_step": 124450, "epoch": 1499} {"train_loss": -22.798114776611328, "global_step": 124451, "epoch": 1499} {"train_loss": -22.517301559448242, "global_step": 124452, "epoch": 1499} {"train_loss": -22.40732765197754, "global_step": 124453, "epoch": 1499} {"train_loss": -22.493576049804688, "global_step": 124454, "epoch": 1499} {"train_loss": -22.820377349853516, "global_step": 124455, "epoch": 1499} {"train_loss": -22.379491806030273, "global_step": 124456, "epoch": 1499} {"train_loss": -22.302997589111328, "global_step": 124457, "epoch": 1499} {"train_loss": -22.493438720703125, "global_step": 124458, "epoch": 1499} {"train_loss": -22.50945472717285, "global_step": 124459, "epoch": 1499} {"train_loss": -22.5550537109375, "global_step": 124460, "epoch": 1499} {"train_loss": -22.726547241210938, "global_step": 124461, "epoch": 1499} {"train_loss": -22.87762451171875, "global_step": 124462, "epoch": 1499} {"train_loss": -22.65406608581543, "global_step": 124463, "epoch": 1499} {"train_loss": -22.212230682373047, "global_step": 124464, "epoch": 1499} {"train_loss": -22.652006149291992, "global_step": 124465, "epoch": 1499} {"train_loss": -22.755802154541016, "global_step": 124466, "epoch": 1499} {"train_loss": -23.14906883239746, "global_step": 124467, "epoch": 1499} {"train_loss": -22.717227935791016, "global_step": 124468, "epoch": 1499} {"train_loss": -22.582853317260742, "global_step": 124469, "epoch": 1499} {"train_loss": -22.80958366394043, "global_step": 124470, "epoch": 1499} {"train_loss": -22.886404037475586, "global_step": 124471, "epoch": 1499} {"train_loss": -22.53854751586914, "global_step": 124472, "epoch": 1499} {"train_loss": -22.981143951416016, "global_step": 124473, "epoch": 1499} {"train_loss": -22.69124412536621, "global_step": 124474, "epoch": 1499} {"train_loss": -22.807926177978516, "global_step": 124475, "epoch": 1499} {"train_loss": -22.426971435546875, "global_step": 124476, "epoch": 1499} {"train_loss": -22.40412712097168, "global_step": 124477, "epoch": 1499} {"train_loss": -22.556638717651367, "global_step": 124478, "epoch": 1499} {"train_loss": -22.662168502807617, "global_step": 124479, "epoch": 1499} {"train_loss": -22.617116928100586, "global_step": 124480, "epoch": 1499} {"train_loss": -22.817846298217773, "global_step": 124481, "epoch": 1499} {"train_loss": -22.568256378173828, "global_step": 124482, "epoch": 1499} {"train_loss": -22.646900177001953, "global_step": 124483, "epoch": 1499} {"train_loss": -23.032217025756836, "global_step": 124484, "epoch": 1499} {"train_loss": -22.669574737548828, "global_step": 124485, "epoch": 1499} {"train_loss": -22.43962287902832, "global_step": 124486, "epoch": 1499} {"train_loss": -22.70956802368164, "global_step": 124487, "epoch": 1499} {"train_loss": -22.75339126586914, "global_step": 124488, "epoch": 1499} {"train_loss": -22.890289306640625, "global_step": 124489, "epoch": 1499} {"train_loss": -22.823972702026367, "global_step": 124490, "epoch": 1499} {"train_loss": -22.364782333374023, "global_step": 124491, "epoch": 1499} {"train_loss": -22.57253646850586, "global_step": 124492, "epoch": 1499} {"train_loss": -22.67799186706543, "global_step": 124493, "epoch": 1499} {"train_loss": -22.426145553588867, "global_step": 124494, "epoch": 1499} {"train_loss": -22.78455924987793, "global_step": 124495, "epoch": 1499} {"train_loss": -22.68844985961914, "global_step": 124496, "epoch": 1499} {"train_loss": -22.419057846069336, "global_step": 124497, "epoch": 1499} {"train_loss": -22.805845260620117, "global_step": 124498, "epoch": 1499} {"train_loss": -22.54600876497935, "global_step": 124499, "epoch": 1499, "val_loss": 6245621.0} {"train_loss": -21.800512313842773, "global_step": 124500, "epoch": 1500} {"train_loss": -22.20596694946289, "global_step": 124501, "epoch": 1500} {"train_loss": -22.71748161315918, "global_step": 124502, "epoch": 1500} {"train_loss": -22.141395568847656, "global_step": 124503, "epoch": 1500} {"train_loss": -22.78216552734375, "global_step": 124504, "epoch": 1500} {"train_loss": -22.04863739013672, "global_step": 124505, "epoch": 1500} {"train_loss": -22.186492919921875, "global_step": 124506, "epoch": 1500} {"train_loss": -22.53936195373535, "global_step": 124507, "epoch": 1500} {"train_loss": -21.836122512817383, "global_step": 124508, "epoch": 1500} {"train_loss": -22.263456344604492, "global_step": 124509, "epoch": 1500} {"train_loss": -22.523115158081055, "global_step": 124510, "epoch": 1500} {"train_loss": -22.72722053527832, "global_step": 124511, "epoch": 1500} {"train_loss": -22.411834716796875, "global_step": 124512, "epoch": 1500} {"train_loss": -22.370779037475586, "global_step": 124513, "epoch": 1500} {"train_loss": -22.353986740112305, "global_step": 124514, "epoch": 1500} {"train_loss": -22.453460693359375, "global_step": 124515, "epoch": 1500} {"train_loss": -22.336410522460938, "global_step": 124516, "epoch": 1500} {"train_loss": -22.737939834594727, "global_step": 124517, "epoch": 1500} {"train_loss": -22.541624069213867, "global_step": 124518, "epoch": 1500} {"train_loss": -22.538206100463867, "global_step": 124519, "epoch": 1500} {"train_loss": -22.63922119140625, "global_step": 124520, "epoch": 1500} {"train_loss": -22.7185115814209, "global_step": 124521, "epoch": 1500} {"train_loss": -22.873661041259766, "global_step": 124522, "epoch": 1500} {"train_loss": -22.341209411621094, "global_step": 124523, "epoch": 1500} {"train_loss": -22.786235809326172, "global_step": 124524, "epoch": 1500} {"train_loss": -22.436033248901367, "global_step": 124525, "epoch": 1500} {"train_loss": -22.637073516845703, "global_step": 124526, "epoch": 1500} {"train_loss": -22.713457107543945, "global_step": 124527, "epoch": 1500} {"train_loss": -22.543954849243164, "global_step": 124528, "epoch": 1500} {"train_loss": -22.750654220581055, "global_step": 124529, "epoch": 1500} {"train_loss": -22.165283203125, "global_step": 124530, "epoch": 1500} {"train_loss": -22.206947326660156, "global_step": 124531, "epoch": 1500} {"train_loss": -22.852354049682617, "global_step": 124532, "epoch": 1500} {"train_loss": -22.483564376831055, "global_step": 124533, "epoch": 1500} {"train_loss": -22.83111000061035, "global_step": 124534, "epoch": 1500} {"train_loss": -22.86316680908203, "global_step": 124535, "epoch": 1500} {"train_loss": -22.78944206237793, "global_step": 124536, "epoch": 1500} {"train_loss": -23.064476013183594, "global_step": 124537, "epoch": 1500} {"train_loss": -22.79335594177246, "global_step": 124538, "epoch": 1500} {"train_loss": -22.63132095336914, "global_step": 124539, "epoch": 1500} {"train_loss": -22.404069900512695, "global_step": 124540, "epoch": 1500} {"train_loss": -22.501819610595703, "global_step": 124541, "epoch": 1500} {"train_loss": -22.632694244384766, "global_step": 124542, "epoch": 1500} {"train_loss": -23.199201583862305, "global_step": 124543, "epoch": 1500} {"train_loss": -22.521329879760742, "global_step": 124544, "epoch": 1500} {"train_loss": -22.660917282104492, "global_step": 124545, "epoch": 1500} {"train_loss": -22.61995506286621, "global_step": 124546, "epoch": 1500} {"train_loss": -22.662649154663086, "global_step": 124547, "epoch": 1500} {"train_loss": -22.8178768157959, "global_step": 124548, "epoch": 1500} {"train_loss": -22.586217880249023, "global_step": 124549, "epoch": 1500} {"train_loss": -22.482624053955078, "global_step": 124550, "epoch": 1500} {"train_loss": -23.1318359375, "global_step": 124551, "epoch": 1500} {"train_loss": -22.780094146728516, "global_step": 124552, "epoch": 1500} {"train_loss": -22.743045806884766, "global_step": 124553, "epoch": 1500} {"train_loss": -22.811399459838867, "global_step": 124554, "epoch": 1500} {"train_loss": -22.782331466674805, "global_step": 124555, "epoch": 1500} {"train_loss": -22.643054962158203, "global_step": 124556, "epoch": 1500} {"train_loss": -22.749784469604492, "global_step": 124557, "epoch": 1500} {"train_loss": -22.634323120117188, "global_step": 124558, "epoch": 1500} {"train_loss": -22.72410011291504, "global_step": 124559, "epoch": 1500} {"train_loss": -22.681697845458984, "global_step": 124560, "epoch": 1500} {"train_loss": -22.7141170501709, "global_step": 124561, "epoch": 1500} {"train_loss": -22.339479446411133, "global_step": 124562, "epoch": 1500} {"train_loss": -22.741682052612305, "global_step": 124563, "epoch": 1500} {"train_loss": -22.497982025146484, "global_step": 124564, "epoch": 1500} {"train_loss": -22.48604965209961, "global_step": 124565, "epoch": 1500} {"train_loss": -22.718555450439453, "global_step": 124566, "epoch": 1500} {"train_loss": -22.65653419494629, "global_step": 124567, "epoch": 1500} {"train_loss": -22.623371124267578, "global_step": 124568, "epoch": 1500} {"train_loss": -22.7189884185791, "global_step": 124569, "epoch": 1500} {"train_loss": -22.525190353393555, "global_step": 124570, "epoch": 1500} {"train_loss": -22.731704711914062, "global_step": 124571, "epoch": 1500} {"train_loss": -22.593320846557617, "global_step": 124572, "epoch": 1500} {"train_loss": -22.361494064331055, "global_step": 124573, "epoch": 1500} {"train_loss": -22.60763931274414, "global_step": 124574, "epoch": 1500} {"train_loss": -22.710575103759766, "global_step": 124575, "epoch": 1500} {"train_loss": -22.28031349182129, "global_step": 124576, "epoch": 1500} {"train_loss": -22.656797409057617, "global_step": 124577, "epoch": 1500} {"train_loss": -22.245481491088867, "global_step": 124578, "epoch": 1500} {"train_loss": -22.924070358276367, "global_step": 124579, "epoch": 1500} {"train_loss": -22.62917709350586, "global_step": 124580, "epoch": 1500} {"train_loss": -22.419279098510742, "global_step": 124581, "epoch": 1500} {"train_loss": -22.5722157811544, "global_step": 124582, "epoch": 1500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6297012.0} {"train_loss": -22.074880599975586, "global_step": 124583, "epoch": 1501} {"train_loss": -22.443620681762695, "global_step": 124584, "epoch": 1501} {"train_loss": -22.08991813659668, "global_step": 124585, "epoch": 1501} {"train_loss": -22.027353286743164, "global_step": 124586, "epoch": 1501} {"train_loss": -22.29620361328125, "global_step": 124587, "epoch": 1501} {"train_loss": -22.00156593322754, "global_step": 124588, "epoch": 1501} {"train_loss": -22.517024993896484, "global_step": 124589, "epoch": 1501} {"train_loss": -22.36236000061035, "global_step": 124590, "epoch": 1501} {"train_loss": -22.01650619506836, "global_step": 124591, "epoch": 1501} {"train_loss": -22.243438720703125, "global_step": 124592, "epoch": 1501} {"train_loss": -22.520849227905273, "global_step": 124593, "epoch": 1501} {"train_loss": -22.455076217651367, "global_step": 124594, "epoch": 1501} {"train_loss": -22.520709991455078, "global_step": 124595, "epoch": 1501} {"train_loss": -22.03325843811035, "global_step": 124596, "epoch": 1501} {"train_loss": -22.368757247924805, "global_step": 124597, "epoch": 1501} {"train_loss": -22.596311569213867, "global_step": 124598, "epoch": 1501} {"train_loss": -22.179365158081055, "global_step": 124599, "epoch": 1501} {"train_loss": -22.445594787597656, "global_step": 124600, "epoch": 1501} {"train_loss": -22.56208610534668, "global_step": 124601, "epoch": 1501} {"train_loss": -22.492721557617188, "global_step": 124602, "epoch": 1501} {"train_loss": -22.467065811157227, "global_step": 124603, "epoch": 1501} {"train_loss": -22.721729278564453, "global_step": 124604, "epoch": 1501} {"train_loss": -22.374608993530273, "global_step": 124605, "epoch": 1501} {"train_loss": -22.402732849121094, "global_step": 124606, "epoch": 1501} {"train_loss": -22.68210220336914, "global_step": 124607, "epoch": 1501} {"train_loss": -22.53360366821289, "global_step": 124608, "epoch": 1501} {"train_loss": -22.507238388061523, "global_step": 124609, "epoch": 1501} {"train_loss": -22.261394500732422, "global_step": 124610, "epoch": 1501} {"train_loss": -22.666757583618164, "global_step": 124611, "epoch": 1501} {"train_loss": -22.31974220275879, "global_step": 124612, "epoch": 1501} {"train_loss": -22.615110397338867, "global_step": 124613, "epoch": 1501} {"train_loss": -22.179996490478516, "global_step": 124614, "epoch": 1501} {"train_loss": -22.819965362548828, "global_step": 124615, "epoch": 1501} {"train_loss": -22.902076721191406, "global_step": 124616, "epoch": 1501} {"train_loss": -22.340707778930664, "global_step": 124617, "epoch": 1501} {"train_loss": -22.727558135986328, "global_step": 124618, "epoch": 1501} {"train_loss": -22.650671005249023, "global_step": 124619, "epoch": 1501} {"train_loss": -22.75174903869629, "global_step": 124620, "epoch": 1501} {"train_loss": -22.437210083007812, "global_step": 124621, "epoch": 1501} {"train_loss": -22.60048484802246, "global_step": 124622, "epoch": 1501} {"train_loss": -22.704322814941406, "global_step": 124623, "epoch": 1501} {"train_loss": -22.5871524810791, "global_step": 124624, "epoch": 1501} {"train_loss": -23.104434967041016, "global_step": 124625, "epoch": 1501} {"train_loss": -22.736848831176758, "global_step": 124626, "epoch": 1501} {"train_loss": -22.752090454101562, "global_step": 124627, "epoch": 1501} {"train_loss": -22.716093063354492, "global_step": 124628, "epoch": 1501} {"train_loss": -22.832521438598633, "global_step": 124629, "epoch": 1501} {"train_loss": -22.557682037353516, "global_step": 124630, "epoch": 1501} {"train_loss": -22.733020782470703, "global_step": 124631, "epoch": 1501} {"train_loss": -22.633085250854492, "global_step": 124632, "epoch": 1501} {"train_loss": -22.460285186767578, "global_step": 124633, "epoch": 1501} {"train_loss": -22.758893966674805, "global_step": 124634, "epoch": 1501} {"train_loss": -22.550901412963867, "global_step": 124635, "epoch": 1501} {"train_loss": -22.559690475463867, "global_step": 124636, "epoch": 1501} {"train_loss": -22.693159103393555, "global_step": 124637, "epoch": 1501} {"train_loss": -23.02223014831543, "global_step": 124638, "epoch": 1501} {"train_loss": -23.100189208984375, "global_step": 124639, "epoch": 1501} {"train_loss": -22.322904586791992, "global_step": 124640, "epoch": 1501} {"train_loss": -22.899656295776367, "global_step": 124641, "epoch": 1501} {"train_loss": -22.613189697265625, "global_step": 124642, "epoch": 1501} {"train_loss": -22.466001510620117, "global_step": 124643, "epoch": 1501} {"train_loss": -22.748991012573242, "global_step": 124644, "epoch": 1501} {"train_loss": -22.610111236572266, "global_step": 124645, "epoch": 1501} {"train_loss": -22.626733779907227, "global_step": 124646, "epoch": 1501} {"train_loss": -22.813344955444336, "global_step": 124647, "epoch": 1501} {"train_loss": -22.675384521484375, "global_step": 124648, "epoch": 1501} {"train_loss": -22.83199119567871, "global_step": 124649, "epoch": 1501} {"train_loss": -22.524824142456055, "global_step": 124650, "epoch": 1501} {"train_loss": -22.43281364440918, "global_step": 124651, "epoch": 1501} {"train_loss": -22.714996337890625, "global_step": 124652, "epoch": 1501} {"train_loss": -22.871042251586914, "global_step": 124653, "epoch": 1501} {"train_loss": -22.728382110595703, "global_step": 124654, "epoch": 1501} {"train_loss": -22.689172744750977, "global_step": 124655, "epoch": 1501} {"train_loss": -22.338558197021484, "global_step": 124656, "epoch": 1501} {"train_loss": -22.530136108398438, "global_step": 124657, "epoch": 1501} {"train_loss": -22.677249908447266, "global_step": 124658, "epoch": 1501} {"train_loss": -22.25517463684082, "global_step": 124659, "epoch": 1501} {"train_loss": -23.01146125793457, "global_step": 124660, "epoch": 1501} {"train_loss": -22.582149505615234, "global_step": 124661, "epoch": 1501} {"train_loss": -22.632089614868164, "global_step": 124662, "epoch": 1501} {"train_loss": -22.872709274291992, "global_step": 124663, "epoch": 1501} {"train_loss": -22.947546005249023, "global_step": 124664, "epoch": 1501} {"train_loss": -22.567046153976257, "global_step": 124665, "epoch": 1501, "val_loss": 6240917.5} {"train_loss": -22.527191162109375, "global_step": 124666, "epoch": 1502} {"train_loss": -21.45618438720703, "global_step": 124667, "epoch": 1502} {"train_loss": -21.996435165405273, "global_step": 124668, "epoch": 1502} {"train_loss": -22.05828857421875, "global_step": 124669, "epoch": 1502} {"train_loss": -22.03406524658203, "global_step": 124670, "epoch": 1502} {"train_loss": -22.585372924804688, "global_step": 124671, "epoch": 1502} {"train_loss": -22.183116912841797, "global_step": 124672, "epoch": 1502} {"train_loss": -22.159093856811523, "global_step": 124673, "epoch": 1502} {"train_loss": -22.31780433654785, "global_step": 124674, "epoch": 1502} {"train_loss": -22.38301658630371, "global_step": 124675, "epoch": 1502} {"train_loss": -22.47430419921875, "global_step": 124676, "epoch": 1502} {"train_loss": -22.244409561157227, "global_step": 124677, "epoch": 1502} {"train_loss": -22.57267189025879, "global_step": 124678, "epoch": 1502} {"train_loss": -22.35341453552246, "global_step": 124679, "epoch": 1502} {"train_loss": -22.309677124023438, "global_step": 124680, "epoch": 1502} {"train_loss": -22.497098922729492, "global_step": 124681, "epoch": 1502} {"train_loss": -22.6140193939209, "global_step": 124682, "epoch": 1502} {"train_loss": -22.76888084411621, "global_step": 124683, "epoch": 1502} {"train_loss": -22.446958541870117, "global_step": 124684, "epoch": 1502} {"train_loss": -22.5150203704834, "global_step": 124685, "epoch": 1502} {"train_loss": -23.007993698120117, "global_step": 124686, "epoch": 1502} {"train_loss": -22.649032592773438, "global_step": 124687, "epoch": 1502} {"train_loss": -22.421554565429688, "global_step": 124688, "epoch": 1502} {"train_loss": -22.775419235229492, "global_step": 124689, "epoch": 1502} {"train_loss": -22.914813995361328, "global_step": 124690, "epoch": 1502} {"train_loss": -22.581533432006836, "global_step": 124691, "epoch": 1502} {"train_loss": -22.608461380004883, "global_step": 124692, "epoch": 1502} {"train_loss": -22.477371215820312, "global_step": 124693, "epoch": 1502} {"train_loss": -22.309188842773438, "global_step": 124694, "epoch": 1502} {"train_loss": -22.518583297729492, "global_step": 124695, "epoch": 1502} {"train_loss": -22.67023277282715, "global_step": 124696, "epoch": 1502} {"train_loss": -22.37879753112793, "global_step": 124697, "epoch": 1502} {"train_loss": -22.681514739990234, "global_step": 124698, "epoch": 1502} {"train_loss": -22.90547752380371, "global_step": 124699, "epoch": 1502} {"train_loss": -22.706541061401367, "global_step": 124700, "epoch": 1502} {"train_loss": -22.928556442260742, "global_step": 124701, "epoch": 1502} {"train_loss": -22.63348960876465, "global_step": 124702, "epoch": 1502} {"train_loss": -22.787899017333984, "global_step": 124703, "epoch": 1502} {"train_loss": -22.7847957611084, "global_step": 124704, "epoch": 1502} {"train_loss": -22.87649154663086, "global_step": 124705, "epoch": 1502} {"train_loss": -22.556913375854492, "global_step": 124706, "epoch": 1502} {"train_loss": -22.66986083984375, "global_step": 124707, "epoch": 1502} {"train_loss": -22.76350975036621, "global_step": 124708, "epoch": 1502} {"train_loss": -23.136688232421875, "global_step": 124709, "epoch": 1502} {"train_loss": -23.15777015686035, "global_step": 124710, "epoch": 1502} {"train_loss": -22.991994857788086, "global_step": 124711, "epoch": 1502} {"train_loss": -22.6048641204834, "global_step": 124712, "epoch": 1502} {"train_loss": -22.702213287353516, "global_step": 124713, "epoch": 1502} {"train_loss": -22.68250846862793, "global_step": 124714, "epoch": 1502} {"train_loss": -22.559646606445312, "global_step": 124715, "epoch": 1502} {"train_loss": -22.56770133972168, "global_step": 124716, "epoch": 1502} {"train_loss": -22.531293869018555, "global_step": 124717, "epoch": 1502} {"train_loss": -22.763172149658203, "global_step": 124718, "epoch": 1502} {"train_loss": -22.822967529296875, "global_step": 124719, "epoch": 1502} {"train_loss": -22.891307830810547, "global_step": 124720, "epoch": 1502} {"train_loss": -22.97928810119629, "global_step": 124721, "epoch": 1502} {"train_loss": -22.67519187927246, "global_step": 124722, "epoch": 1502} {"train_loss": -22.22138023376465, "global_step": 124723, "epoch": 1502} {"train_loss": -22.832046508789062, "global_step": 124724, "epoch": 1502} {"train_loss": -22.55677604675293, "global_step": 124725, "epoch": 1502} {"train_loss": -22.878387451171875, "global_step": 124726, "epoch": 1502} {"train_loss": -22.80548095703125, "global_step": 124727, "epoch": 1502} {"train_loss": -22.957792282104492, "global_step": 124728, "epoch": 1502} {"train_loss": -22.539154052734375, "global_step": 124729, "epoch": 1502} {"train_loss": -22.760000228881836, "global_step": 124730, "epoch": 1502} {"train_loss": -22.39064598083496, "global_step": 124731, "epoch": 1502} {"train_loss": -22.475576400756836, "global_step": 124732, "epoch": 1502} {"train_loss": -22.524518966674805, "global_step": 124733, "epoch": 1502} {"train_loss": -22.65940284729004, "global_step": 124734, "epoch": 1502} {"train_loss": -22.911651611328125, "global_step": 124735, "epoch": 1502} {"train_loss": -22.50221824645996, "global_step": 124736, "epoch": 1502} {"train_loss": -22.637502670288086, "global_step": 124737, "epoch": 1502} {"train_loss": -22.918115615844727, "global_step": 124738, "epoch": 1502} {"train_loss": -22.667858123779297, "global_step": 124739, "epoch": 1502} {"train_loss": -22.4351863861084, "global_step": 124740, "epoch": 1502} {"train_loss": -22.782793045043945, "global_step": 124741, "epoch": 1502} {"train_loss": -22.985843658447266, "global_step": 124742, "epoch": 1502} {"train_loss": -22.356910705566406, "global_step": 124743, "epoch": 1502} {"train_loss": -22.422420501708984, "global_step": 124744, "epoch": 1502} {"train_loss": -22.64240837097168, "global_step": 124745, "epoch": 1502} {"train_loss": -22.598777770996094, "global_step": 124746, "epoch": 1502} {"train_loss": -22.31662368774414, "global_step": 124747, "epoch": 1502} {"train_loss": -22.596579080604645, "global_step": 124748, "epoch": 1502, "val_loss": 6349377.0} {"train_loss": -22.05861473083496, "global_step": 124749, "epoch": 1503} {"train_loss": -21.538618087768555, "global_step": 124750, "epoch": 1503} {"train_loss": -22.284652709960938, "global_step": 124751, "epoch": 1503} {"train_loss": -21.943437576293945, "global_step": 124752, "epoch": 1503} {"train_loss": -21.98609161376953, "global_step": 124753, "epoch": 1503} {"train_loss": -22.059417724609375, "global_step": 124754, "epoch": 1503} {"train_loss": -21.900632858276367, "global_step": 124755, "epoch": 1503} {"train_loss": -22.48114013671875, "global_step": 124756, "epoch": 1503} {"train_loss": -22.204504013061523, "global_step": 124757, "epoch": 1503} {"train_loss": -21.665159225463867, "global_step": 124758, "epoch": 1503} {"train_loss": -22.394405364990234, "global_step": 124759, "epoch": 1503} {"train_loss": -21.8911075592041, "global_step": 124760, "epoch": 1503} {"train_loss": -21.827299118041992, "global_step": 124761, "epoch": 1503} {"train_loss": -22.30315589904785, "global_step": 124762, "epoch": 1503} {"train_loss": -22.308544158935547, "global_step": 124763, "epoch": 1503} {"train_loss": -21.955278396606445, "global_step": 124764, "epoch": 1503} {"train_loss": -22.20692253112793, "global_step": 124765, "epoch": 1503} {"train_loss": -22.363927841186523, "global_step": 124766, "epoch": 1503} {"train_loss": -22.248733520507812, "global_step": 124767, "epoch": 1503} {"train_loss": -22.508623123168945, "global_step": 124768, "epoch": 1503} {"train_loss": -22.303791046142578, "global_step": 124769, "epoch": 1503} {"train_loss": -22.450441360473633, "global_step": 124770, "epoch": 1503} {"train_loss": -22.086292266845703, "global_step": 124771, "epoch": 1503} {"train_loss": -22.340065002441406, "global_step": 124772, "epoch": 1503} {"train_loss": -22.6344051361084, "global_step": 124773, "epoch": 1503} {"train_loss": -22.271299362182617, "global_step": 124774, "epoch": 1503} {"train_loss": -22.353185653686523, "global_step": 124775, "epoch": 1503} {"train_loss": -22.809152603149414, "global_step": 124776, "epoch": 1503} {"train_loss": -22.794055938720703, "global_step": 124777, "epoch": 1503} {"train_loss": -22.67543601989746, "global_step": 124778, "epoch": 1503} {"train_loss": -22.70420265197754, "global_step": 124779, "epoch": 1503} {"train_loss": -22.64116859436035, "global_step": 124780, "epoch": 1503} {"train_loss": -22.74144172668457, "global_step": 124781, "epoch": 1503} {"train_loss": -22.534971237182617, "global_step": 124782, "epoch": 1503} {"train_loss": -22.490367889404297, "global_step": 124783, "epoch": 1503} {"train_loss": -22.609819412231445, "global_step": 124784, "epoch": 1503} {"train_loss": -22.64976692199707, "global_step": 124785, "epoch": 1503} {"train_loss": -22.60317039489746, "global_step": 124786, "epoch": 1503} {"train_loss": -22.874528884887695, "global_step": 124787, "epoch": 1503} {"train_loss": -22.440345764160156, "global_step": 124788, "epoch": 1503} {"train_loss": -22.59452247619629, "global_step": 124789, "epoch": 1503} {"train_loss": -23.129886627197266, "global_step": 124790, "epoch": 1503} {"train_loss": -22.641950607299805, "global_step": 124791, "epoch": 1503} {"train_loss": -22.34381675720215, "global_step": 124792, "epoch": 1503} {"train_loss": -22.525484085083008, "global_step": 124793, "epoch": 1503} {"train_loss": -23.01834487915039, "global_step": 124794, "epoch": 1503} {"train_loss": -22.424930572509766, "global_step": 124795, "epoch": 1503} {"train_loss": -22.809362411499023, "global_step": 124796, "epoch": 1503} {"train_loss": -22.70444107055664, "global_step": 124797, "epoch": 1503} {"train_loss": -22.85040283203125, "global_step": 124798, "epoch": 1503} {"train_loss": -22.75739860534668, "global_step": 124799, "epoch": 1503} {"train_loss": -22.801603317260742, "global_step": 124800, "epoch": 1503} {"train_loss": -22.824016571044922, "global_step": 124801, "epoch": 1503} {"train_loss": -22.656896591186523, "global_step": 124802, "epoch": 1503} {"train_loss": -22.582555770874023, "global_step": 124803, "epoch": 1503} {"train_loss": -22.608963012695312, "global_step": 124804, "epoch": 1503} {"train_loss": -22.836532592773438, "global_step": 124805, "epoch": 1503} {"train_loss": -22.894123077392578, "global_step": 124806, "epoch": 1503} {"train_loss": -23.02132797241211, "global_step": 124807, "epoch": 1503} {"train_loss": -22.896697998046875, "global_step": 124808, "epoch": 1503} {"train_loss": -22.638978958129883, "global_step": 124809, "epoch": 1503} {"train_loss": -22.7921142578125, "global_step": 124810, "epoch": 1503} {"train_loss": -23.0421142578125, "global_step": 124811, "epoch": 1503} {"train_loss": -22.9636173248291, "global_step": 124812, "epoch": 1503} {"train_loss": -22.845088958740234, "global_step": 124813, "epoch": 1503} {"train_loss": -22.738309860229492, "global_step": 124814, "epoch": 1503} {"train_loss": -22.83620262145996, "global_step": 124815, "epoch": 1503} {"train_loss": -22.64228630065918, "global_step": 124816, "epoch": 1503} {"train_loss": -22.635854721069336, "global_step": 124817, "epoch": 1503} {"train_loss": -22.529827117919922, "global_step": 124818, "epoch": 1503} {"train_loss": -22.691890716552734, "global_step": 124819, "epoch": 1503} {"train_loss": -22.720523834228516, "global_step": 124820, "epoch": 1503} {"train_loss": -22.757251739501953, "global_step": 124821, "epoch": 1503} {"train_loss": -22.659215927124023, "global_step": 124822, "epoch": 1503} {"train_loss": -22.84925651550293, "global_step": 124823, "epoch": 1503} {"train_loss": -22.625526428222656, "global_step": 124824, "epoch": 1503} {"train_loss": -22.666614532470703, "global_step": 124825, "epoch": 1503} {"train_loss": -22.820980072021484, "global_step": 124826, "epoch": 1503} {"train_loss": -23.01434326171875, "global_step": 124827, "epoch": 1503} {"train_loss": -22.557004928588867, "global_step": 124828, "epoch": 1503} {"train_loss": -22.49794578552246, "global_step": 124829, "epoch": 1503} {"train_loss": -22.643827438354492, "global_step": 124830, "epoch": 1503} {"train_loss": -22.543815474912346, "global_step": 124831, "epoch": 1503, "val_loss": 6157286.0} {"train_loss": -22.119586944580078, "global_step": 124832, "epoch": 1504} {"train_loss": -22.0483455657959, "global_step": 124833, "epoch": 1504} {"train_loss": -22.30372428894043, "global_step": 124834, "epoch": 1504} {"train_loss": -21.952106475830078, "global_step": 124835, "epoch": 1504} {"train_loss": -22.492218017578125, "global_step": 124836, "epoch": 1504} {"train_loss": -22.261579513549805, "global_step": 124837, "epoch": 1504} {"train_loss": -22.110715866088867, "global_step": 124838, "epoch": 1504} {"train_loss": -22.39121437072754, "global_step": 124839, "epoch": 1504} {"train_loss": -22.06949234008789, "global_step": 124840, "epoch": 1504} {"train_loss": -22.527746200561523, "global_step": 124841, "epoch": 1504} {"train_loss": -22.381305694580078, "global_step": 124842, "epoch": 1504} {"train_loss": -22.438703536987305, "global_step": 124843, "epoch": 1504} {"train_loss": -22.450542449951172, "global_step": 124844, "epoch": 1504} {"train_loss": -22.189939498901367, "global_step": 124845, "epoch": 1504} {"train_loss": -22.403766632080078, "global_step": 124846, "epoch": 1504} {"train_loss": -22.477087020874023, "global_step": 124847, "epoch": 1504} {"train_loss": -22.540822982788086, "global_step": 124848, "epoch": 1504} {"train_loss": -22.36669921875, "global_step": 124849, "epoch": 1504} {"train_loss": -22.305063247680664, "global_step": 124850, "epoch": 1504} {"train_loss": -22.89576530456543, "global_step": 124851, "epoch": 1504} {"train_loss": -22.543750762939453, "global_step": 124852, "epoch": 1504} {"train_loss": -22.779678344726562, "global_step": 124853, "epoch": 1504} {"train_loss": -22.610105514526367, "global_step": 124854, "epoch": 1504} {"train_loss": -22.608869552612305, "global_step": 124855, "epoch": 1504} {"train_loss": -22.830524444580078, "global_step": 124856, "epoch": 1504} {"train_loss": -22.549543380737305, "global_step": 124857, "epoch": 1504} {"train_loss": -22.712560653686523, "global_step": 124858, "epoch": 1504} {"train_loss": -23.110660552978516, "global_step": 124859, "epoch": 1504} {"train_loss": -22.62388038635254, "global_step": 124860, "epoch": 1504} {"train_loss": -22.4649715423584, "global_step": 124861, "epoch": 1504} {"train_loss": -22.587461471557617, "global_step": 124862, "epoch": 1504} {"train_loss": -22.667966842651367, "global_step": 124863, "epoch": 1504} {"train_loss": -22.413328170776367, "global_step": 124864, "epoch": 1504} {"train_loss": -22.30940818786621, "global_step": 124865, "epoch": 1504} {"train_loss": -22.796154022216797, "global_step": 124866, "epoch": 1504} {"train_loss": -22.552236557006836, "global_step": 124867, "epoch": 1504} {"train_loss": -22.4409122467041, "global_step": 124868, "epoch": 1504} {"train_loss": -22.87698745727539, "global_step": 124869, "epoch": 1504} {"train_loss": -22.869394302368164, "global_step": 124870, "epoch": 1504} {"train_loss": -22.716014862060547, "global_step": 124871, "epoch": 1504} {"train_loss": -22.66397476196289, "global_step": 124872, "epoch": 1504} {"train_loss": -22.829145431518555, "global_step": 124873, "epoch": 1504} {"train_loss": -22.629348754882812, "global_step": 124874, "epoch": 1504} {"train_loss": -22.597620010375977, "global_step": 124875, "epoch": 1504} {"train_loss": -22.406524658203125, "global_step": 124876, "epoch": 1504} {"train_loss": -22.449235916137695, "global_step": 124877, "epoch": 1504} {"train_loss": -22.477575302124023, "global_step": 124878, "epoch": 1504} {"train_loss": -22.98558807373047, "global_step": 124879, "epoch": 1504} {"train_loss": -22.48760414123535, "global_step": 124880, "epoch": 1504} {"train_loss": -22.795658111572266, "global_step": 124881, "epoch": 1504} {"train_loss": -22.793420791625977, "global_step": 124882, "epoch": 1504} {"train_loss": -22.615488052368164, "global_step": 124883, "epoch": 1504} {"train_loss": -22.516643524169922, "global_step": 124884, "epoch": 1504} {"train_loss": -22.246395111083984, "global_step": 124885, "epoch": 1504} {"train_loss": -22.363142013549805, "global_step": 124886, "epoch": 1504} {"train_loss": -22.800474166870117, "global_step": 124887, "epoch": 1504} {"train_loss": -22.776927947998047, "global_step": 124888, "epoch": 1504} {"train_loss": -23.00544548034668, "global_step": 124889, "epoch": 1504} {"train_loss": -22.742855072021484, "global_step": 124890, "epoch": 1504} {"train_loss": -22.661640167236328, "global_step": 124891, "epoch": 1504} {"train_loss": -22.685487747192383, "global_step": 124892, "epoch": 1504} {"train_loss": -22.557355880737305, "global_step": 124893, "epoch": 1504} {"train_loss": -22.575361251831055, "global_step": 124894, "epoch": 1504} {"train_loss": -22.575529098510742, "global_step": 124895, "epoch": 1504} {"train_loss": -22.713123321533203, "global_step": 124896, "epoch": 1504} {"train_loss": -22.69294548034668, "global_step": 124897, "epoch": 1504} {"train_loss": -22.571176528930664, "global_step": 124898, "epoch": 1504} {"train_loss": -22.725139617919922, "global_step": 124899, "epoch": 1504} {"train_loss": -22.568016052246094, "global_step": 124900, "epoch": 1504} {"train_loss": -22.672361373901367, "global_step": 124901, "epoch": 1504} {"train_loss": -22.1804141998291, "global_step": 124902, "epoch": 1504} {"train_loss": -22.561965942382812, "global_step": 124903, "epoch": 1504} {"train_loss": -22.354297637939453, "global_step": 124904, "epoch": 1504} {"train_loss": -22.547494888305664, "global_step": 124905, "epoch": 1504} {"train_loss": -22.76760482788086, "global_step": 124906, "epoch": 1504} {"train_loss": -22.77088737487793, "global_step": 124907, "epoch": 1504} {"train_loss": -22.923542022705078, "global_step": 124908, "epoch": 1504} {"train_loss": -22.372756958007812, "global_step": 124909, "epoch": 1504} {"train_loss": -22.50183868408203, "global_step": 124910, "epoch": 1504} {"train_loss": -23.074508666992188, "global_step": 124911, "epoch": 1504} {"train_loss": -22.842512130737305, "global_step": 124912, "epoch": 1504} {"train_loss": -22.745141983032227, "global_step": 124913, "epoch": 1504} {"train_loss": -22.580458238900427, "global_step": 124914, "epoch": 1504, "val_loss": 6341311.0} {"train_loss": -22.364606857299805, "global_step": 124915, "epoch": 1505} {"train_loss": -22.661048889160156, "global_step": 124916, "epoch": 1505} {"train_loss": -22.438405990600586, "global_step": 124917, "epoch": 1505} {"train_loss": -22.499040603637695, "global_step": 124918, "epoch": 1505} {"train_loss": -22.064804077148438, "global_step": 124919, "epoch": 1505} {"train_loss": -22.025827407836914, "global_step": 124920, "epoch": 1505} {"train_loss": -22.327455520629883, "global_step": 124921, "epoch": 1505} {"train_loss": -22.56245994567871, "global_step": 124922, "epoch": 1505} {"train_loss": -22.312366485595703, "global_step": 124923, "epoch": 1505} {"train_loss": -22.48404884338379, "global_step": 124924, "epoch": 1505} {"train_loss": -22.366308212280273, "global_step": 124925, "epoch": 1505} {"train_loss": -22.47735023498535, "global_step": 124926, "epoch": 1505} {"train_loss": -22.757431030273438, "global_step": 124927, "epoch": 1505} {"train_loss": -22.559167861938477, "global_step": 124928, "epoch": 1505} {"train_loss": -22.70018196105957, "global_step": 124929, "epoch": 1505} {"train_loss": -22.3497371673584, "global_step": 124930, "epoch": 1505} {"train_loss": -22.411884307861328, "global_step": 124931, "epoch": 1505} {"train_loss": -22.67026138305664, "global_step": 124932, "epoch": 1505} {"train_loss": -22.878459930419922, "global_step": 124933, "epoch": 1505} {"train_loss": -22.899051666259766, "global_step": 124934, "epoch": 1505} {"train_loss": -22.56203269958496, "global_step": 124935, "epoch": 1505} {"train_loss": -22.368209838867188, "global_step": 124936, "epoch": 1505} {"train_loss": -22.468381881713867, "global_step": 124937, "epoch": 1505} {"train_loss": -22.281816482543945, "global_step": 124938, "epoch": 1505} {"train_loss": -22.73328971862793, "global_step": 124939, "epoch": 1505} {"train_loss": -22.592504501342773, "global_step": 124940, "epoch": 1505} {"train_loss": -22.80318260192871, "global_step": 124941, "epoch": 1505} {"train_loss": -22.277929306030273, "global_step": 124942, "epoch": 1505} {"train_loss": -22.273832321166992, "global_step": 124943, "epoch": 1505} {"train_loss": -22.394119262695312, "global_step": 124944, "epoch": 1505} {"train_loss": -22.422706604003906, "global_step": 124945, "epoch": 1505} {"train_loss": -22.42827033996582, "global_step": 124946, "epoch": 1505} {"train_loss": -22.90057945251465, "global_step": 124947, "epoch": 1505} {"train_loss": -22.83592414855957, "global_step": 124948, "epoch": 1505} {"train_loss": -23.01107406616211, "global_step": 124949, "epoch": 1505} {"train_loss": -22.96527862548828, "global_step": 124950, "epoch": 1505} {"train_loss": -22.854257583618164, "global_step": 124951, "epoch": 1505} {"train_loss": -22.79183578491211, "global_step": 124952, "epoch": 1505} {"train_loss": -22.924043655395508, "global_step": 124953, "epoch": 1505} {"train_loss": -22.52814292907715, "global_step": 124954, "epoch": 1505} {"train_loss": -22.67545509338379, "global_step": 124955, "epoch": 1505} {"train_loss": -22.641616821289062, "global_step": 124956, "epoch": 1505} {"train_loss": -22.510446548461914, "global_step": 124957, "epoch": 1505} {"train_loss": -22.765304565429688, "global_step": 124958, "epoch": 1505} {"train_loss": -22.365928649902344, "global_step": 124959, "epoch": 1505} {"train_loss": -22.921127319335938, "global_step": 124960, "epoch": 1505} {"train_loss": -22.5993595123291, "global_step": 124961, "epoch": 1505} {"train_loss": -22.687030792236328, "global_step": 124962, "epoch": 1505} {"train_loss": -22.717878341674805, "global_step": 124963, "epoch": 1505} {"train_loss": -23.389930725097656, "global_step": 124964, "epoch": 1505} {"train_loss": -22.520889282226562, "global_step": 124965, "epoch": 1505} {"train_loss": -22.62129783630371, "global_step": 124966, "epoch": 1505} {"train_loss": -22.89341926574707, "global_step": 124967, "epoch": 1505} {"train_loss": -22.564184188842773, "global_step": 124968, "epoch": 1505} {"train_loss": -22.540067672729492, "global_step": 124969, "epoch": 1505} {"train_loss": -22.650136947631836, "global_step": 124970, "epoch": 1505} {"train_loss": -22.686378479003906, "global_step": 124971, "epoch": 1505} {"train_loss": -22.7926082611084, "global_step": 124972, "epoch": 1505} {"train_loss": -22.878807067871094, "global_step": 124973, "epoch": 1505} {"train_loss": -22.57918357849121, "global_step": 124974, "epoch": 1505} {"train_loss": -22.60793113708496, "global_step": 124975, "epoch": 1505} {"train_loss": -22.418386459350586, "global_step": 124976, "epoch": 1505} {"train_loss": -22.335752487182617, "global_step": 124977, "epoch": 1505} {"train_loss": -22.785823822021484, "global_step": 124978, "epoch": 1505} {"train_loss": -22.4363956451416, "global_step": 124979, "epoch": 1505} {"train_loss": -22.588685989379883, "global_step": 124980, "epoch": 1505} {"train_loss": -22.647855758666992, "global_step": 124981, "epoch": 1505} {"train_loss": -22.655214309692383, "global_step": 124982, "epoch": 1505} {"train_loss": -22.906330108642578, "global_step": 124983, "epoch": 1505} {"train_loss": -23.022642135620117, "global_step": 124984, "epoch": 1505} {"train_loss": -22.864513397216797, "global_step": 124985, "epoch": 1505} {"train_loss": -22.44700050354004, "global_step": 124986, "epoch": 1505} {"train_loss": -22.73666763305664, "global_step": 124987, "epoch": 1505} {"train_loss": -22.75030517578125, "global_step": 124988, "epoch": 1505} {"train_loss": -22.75210189819336, "global_step": 124989, "epoch": 1505} {"train_loss": -22.822891235351562, "global_step": 124990, "epoch": 1505} {"train_loss": -22.874296188354492, "global_step": 124991, "epoch": 1505} {"train_loss": -22.747562408447266, "global_step": 124992, "epoch": 1505} {"train_loss": -22.78566551208496, "global_step": 124993, "epoch": 1505} {"train_loss": -23.025060653686523, "global_step": 124994, "epoch": 1505} {"train_loss": -22.907564163208008, "global_step": 124995, "epoch": 1505} {"train_loss": -22.914051055908203, "global_step": 124996, "epoch": 1505} {"train_loss": -22.642050203070582, "global_step": 124997, "epoch": 1505, "val_loss": 6183796.0} {"train_loss": -22.28973960876465, "global_step": 124998, "epoch": 1506} {"train_loss": -22.446138381958008, "global_step": 124999, "epoch": 1506} {"train_loss": -22.805561065673828, "global_step": 125000, "epoch": 1506} {"train_loss": -22.316530227661133, "global_step": 125001, "epoch": 1506} {"train_loss": -22.240915298461914, "global_step": 125002, "epoch": 1506} {"train_loss": -22.598356246948242, "global_step": 125003, "epoch": 1506} {"train_loss": -22.685476303100586, "global_step": 125004, "epoch": 1506} {"train_loss": -22.498838424682617, "global_step": 125005, "epoch": 1506} {"train_loss": -22.219350814819336, "global_step": 125006, "epoch": 1506} {"train_loss": -22.643991470336914, "global_step": 125007, "epoch": 1506} {"train_loss": -22.03680992126465, "global_step": 125008, "epoch": 1506} {"train_loss": -22.673236846923828, "global_step": 125009, "epoch": 1506} {"train_loss": -22.699460983276367, "global_step": 125010, "epoch": 1506} {"train_loss": -22.53862953186035, "global_step": 125011, "epoch": 1506} {"train_loss": -22.389326095581055, "global_step": 125012, "epoch": 1506} {"train_loss": -22.5052547454834, "global_step": 125013, "epoch": 1506} {"train_loss": -22.361595153808594, "global_step": 125014, "epoch": 1506} {"train_loss": -22.56583023071289, "global_step": 125015, "epoch": 1506} {"train_loss": -22.043476104736328, "global_step": 125016, "epoch": 1506} {"train_loss": -22.212621688842773, "global_step": 125017, "epoch": 1506} {"train_loss": -22.60515785217285, "global_step": 125018, "epoch": 1506} {"train_loss": -22.3798885345459, "global_step": 125019, "epoch": 1506} {"train_loss": -22.29694938659668, "global_step": 125020, "epoch": 1506} {"train_loss": -22.55300521850586, "global_step": 125021, "epoch": 1506} {"train_loss": -22.56619644165039, "global_step": 125022, "epoch": 1506} {"train_loss": -22.635053634643555, "global_step": 125023, "epoch": 1506} {"train_loss": -22.586923599243164, "global_step": 125024, "epoch": 1506} {"train_loss": -22.813037872314453, "global_step": 125025, "epoch": 1506} {"train_loss": -22.71007537841797, "global_step": 125026, "epoch": 1506} {"train_loss": -23.185510635375977, "global_step": 125027, "epoch": 1506} {"train_loss": -22.59543800354004, "global_step": 125028, "epoch": 1506} {"train_loss": -23.065021514892578, "global_step": 125029, "epoch": 1506} {"train_loss": -23.026330947875977, "global_step": 125030, "epoch": 1506} {"train_loss": -22.972463607788086, "global_step": 125031, "epoch": 1506} {"train_loss": -22.466224670410156, "global_step": 125032, "epoch": 1506} {"train_loss": -23.03767204284668, "global_step": 125033, "epoch": 1506} {"train_loss": -23.18463897705078, "global_step": 125034, "epoch": 1506} {"train_loss": -22.906841278076172, "global_step": 125035, "epoch": 1506} {"train_loss": -22.69754981994629, "global_step": 125036, "epoch": 1506} {"train_loss": -22.703035354614258, "global_step": 125037, "epoch": 1506} {"train_loss": -22.7597713470459, "global_step": 125038, "epoch": 1506} {"train_loss": -22.628204345703125, "global_step": 125039, "epoch": 1506} {"train_loss": -22.414064407348633, "global_step": 125040, "epoch": 1506} {"train_loss": -22.681020736694336, "global_step": 125041, "epoch": 1506} {"train_loss": -22.702133178710938, "global_step": 125042, "epoch": 1506} {"train_loss": -22.836376190185547, "global_step": 125043, "epoch": 1506} {"train_loss": -22.520153045654297, "global_step": 125044, "epoch": 1506} {"train_loss": -22.921730041503906, "global_step": 125045, "epoch": 1506} {"train_loss": -22.848621368408203, "global_step": 125046, "epoch": 1506} {"train_loss": -22.93091583251953, "global_step": 125047, "epoch": 1506} {"train_loss": -22.8009033203125, "global_step": 125048, "epoch": 1506} {"train_loss": -22.551776885986328, "global_step": 125049, "epoch": 1506} {"train_loss": -22.7399845123291, "global_step": 125050, "epoch": 1506} {"train_loss": -23.01691246032715, "global_step": 125051, "epoch": 1506} {"train_loss": -22.86541748046875, "global_step": 125052, "epoch": 1506} {"train_loss": -22.954824447631836, "global_step": 125053, "epoch": 1506} {"train_loss": -22.784343719482422, "global_step": 125054, "epoch": 1506} {"train_loss": -22.412555694580078, "global_step": 125055, "epoch": 1506} {"train_loss": -22.30088233947754, "global_step": 125056, "epoch": 1506} {"train_loss": -22.67746925354004, "global_step": 125057, "epoch": 1506} {"train_loss": -22.574146270751953, "global_step": 125058, "epoch": 1506} {"train_loss": -22.656373977661133, "global_step": 125059, "epoch": 1506} {"train_loss": -22.50701332092285, "global_step": 125060, "epoch": 1506} {"train_loss": -22.503637313842773, "global_step": 125061, "epoch": 1506} {"train_loss": -22.395431518554688, "global_step": 125062, "epoch": 1506} {"train_loss": -22.53232192993164, "global_step": 125063, "epoch": 1506} {"train_loss": -22.717679977416992, "global_step": 125064, "epoch": 1506} {"train_loss": -22.676311492919922, "global_step": 125065, "epoch": 1506} {"train_loss": -22.56251335144043, "global_step": 125066, "epoch": 1506} {"train_loss": -22.407339096069336, "global_step": 125067, "epoch": 1506} {"train_loss": -22.945816040039062, "global_step": 125068, "epoch": 1506} {"train_loss": -22.704999923706055, "global_step": 125069, "epoch": 1506} {"train_loss": -22.717252731323242, "global_step": 125070, "epoch": 1506} {"train_loss": -22.6124267578125, "global_step": 125071, "epoch": 1506} {"train_loss": -22.59833526611328, "global_step": 125072, "epoch": 1506} {"train_loss": -22.671871185302734, "global_step": 125073, "epoch": 1506} {"train_loss": -22.8759708404541, "global_step": 125074, "epoch": 1506} {"train_loss": -22.727252960205078, "global_step": 125075, "epoch": 1506} {"train_loss": -22.5460262298584, "global_step": 125076, "epoch": 1506} {"train_loss": -22.255916595458984, "global_step": 125077, "epoch": 1506} {"train_loss": -22.391925811767578, "global_step": 125078, "epoch": 1506} {"train_loss": -23.049264907836914, "global_step": 125079, "epoch": 1506} {"train_loss": -22.640929348497504, "global_step": 125080, "epoch": 1506, "val_loss": 6242309.5} {"train_loss": -21.45807456970215, "global_step": 125081, "epoch": 1507} {"train_loss": -21.249576568603516, "global_step": 125082, "epoch": 1507} {"train_loss": -22.449329376220703, "global_step": 125083, "epoch": 1507} {"train_loss": -22.33909797668457, "global_step": 125084, "epoch": 1507} {"train_loss": -21.959646224975586, "global_step": 125085, "epoch": 1507} {"train_loss": -22.259260177612305, "global_step": 125086, "epoch": 1507} {"train_loss": -22.436954498291016, "global_step": 125087, "epoch": 1507} {"train_loss": -21.96516227722168, "global_step": 125088, "epoch": 1507} {"train_loss": -22.576717376708984, "global_step": 125089, "epoch": 1507} {"train_loss": -22.745725631713867, "global_step": 125090, "epoch": 1507} {"train_loss": -22.19229507446289, "global_step": 125091, "epoch": 1507} {"train_loss": -22.21748161315918, "global_step": 125092, "epoch": 1507} {"train_loss": -22.589895248413086, "global_step": 125093, "epoch": 1507} {"train_loss": -21.956233978271484, "global_step": 125094, "epoch": 1507} {"train_loss": -22.360090255737305, "global_step": 125095, "epoch": 1507} {"train_loss": -22.757675170898438, "global_step": 125096, "epoch": 1507} {"train_loss": -22.545013427734375, "global_step": 125097, "epoch": 1507} {"train_loss": -22.541372299194336, "global_step": 125098, "epoch": 1507} {"train_loss": -22.78232192993164, "global_step": 125099, "epoch": 1507} {"train_loss": -22.400205612182617, "global_step": 125100, "epoch": 1507} {"train_loss": -22.868549346923828, "global_step": 125101, "epoch": 1507} {"train_loss": -22.5977783203125, "global_step": 125102, "epoch": 1507} {"train_loss": -22.34877586364746, "global_step": 125103, "epoch": 1507} {"train_loss": -22.597293853759766, "global_step": 125104, "epoch": 1507} {"train_loss": -22.748380661010742, "global_step": 125105, "epoch": 1507} {"train_loss": -22.721187591552734, "global_step": 125106, "epoch": 1507} {"train_loss": -22.430667877197266, "global_step": 125107, "epoch": 1507} {"train_loss": -22.27606201171875, "global_step": 125108, "epoch": 1507} {"train_loss": -22.869264602661133, "global_step": 125109, "epoch": 1507} {"train_loss": -22.46234703063965, "global_step": 125110, "epoch": 1507} {"train_loss": -22.61225700378418, "global_step": 125111, "epoch": 1507} {"train_loss": -22.83186912536621, "global_step": 125112, "epoch": 1507} {"train_loss": -22.854780197143555, "global_step": 125113, "epoch": 1507} {"train_loss": -22.750349044799805, "global_step": 125114, "epoch": 1507} {"train_loss": -22.403289794921875, "global_step": 125115, "epoch": 1507} {"train_loss": -22.576826095581055, "global_step": 125116, "epoch": 1507} {"train_loss": -22.103315353393555, "global_step": 125117, "epoch": 1507} {"train_loss": -22.538545608520508, "global_step": 125118, "epoch": 1507} {"train_loss": -22.494253158569336, "global_step": 125119, "epoch": 1507} {"train_loss": -22.94075584411621, "global_step": 125120, "epoch": 1507} {"train_loss": -22.49528694152832, "global_step": 125121, "epoch": 1507} {"train_loss": -22.852062225341797, "global_step": 125122, "epoch": 1507} {"train_loss": -22.729337692260742, "global_step": 125123, "epoch": 1507} {"train_loss": -22.818700790405273, "global_step": 125124, "epoch": 1507} {"train_loss": -22.642868041992188, "global_step": 125125, "epoch": 1507} {"train_loss": -22.237781524658203, "global_step": 125126, "epoch": 1507} {"train_loss": -22.714000701904297, "global_step": 125127, "epoch": 1507} {"train_loss": -22.670780181884766, "global_step": 125128, "epoch": 1507} {"train_loss": -22.507883071899414, "global_step": 125129, "epoch": 1507} {"train_loss": -22.536128997802734, "global_step": 125130, "epoch": 1507} {"train_loss": -22.66751480102539, "global_step": 125131, "epoch": 1507} {"train_loss": -22.743194580078125, "global_step": 125132, "epoch": 1507} {"train_loss": -22.66974639892578, "global_step": 125133, "epoch": 1507} {"train_loss": -23.07701301574707, "global_step": 125134, "epoch": 1507} {"train_loss": -22.6541748046875, "global_step": 125135, "epoch": 1507} {"train_loss": -22.699125289916992, "global_step": 125136, "epoch": 1507} {"train_loss": -23.140106201171875, "global_step": 125137, "epoch": 1507} {"train_loss": -22.996435165405273, "global_step": 125138, "epoch": 1507} {"train_loss": -22.771360397338867, "global_step": 125139, "epoch": 1507} {"train_loss": -23.260953903198242, "global_step": 125140, "epoch": 1507} {"train_loss": -22.667470932006836, "global_step": 125141, "epoch": 1507} {"train_loss": -22.810956954956055, "global_step": 125142, "epoch": 1507} {"train_loss": -22.454734802246094, "global_step": 125143, "epoch": 1507} {"train_loss": -22.79216957092285, "global_step": 125144, "epoch": 1507} {"train_loss": -22.291933059692383, "global_step": 125145, "epoch": 1507} {"train_loss": -22.705034255981445, "global_step": 125146, "epoch": 1507} {"train_loss": -22.65964126586914, "global_step": 125147, "epoch": 1507} {"train_loss": -22.492095947265625, "global_step": 125148, "epoch": 1507} {"train_loss": -22.7309513092041, "global_step": 125149, "epoch": 1507} {"train_loss": -22.8389949798584, "global_step": 125150, "epoch": 1507} {"train_loss": -23.246654510498047, "global_step": 125151, "epoch": 1507} {"train_loss": -22.80354881286621, "global_step": 125152, "epoch": 1507} {"train_loss": -22.649282455444336, "global_step": 125153, "epoch": 1507} {"train_loss": -22.673803329467773, "global_step": 125154, "epoch": 1507} {"train_loss": -22.888124465942383, "global_step": 125155, "epoch": 1507} {"train_loss": -22.82515525817871, "global_step": 125156, "epoch": 1507} {"train_loss": -22.618093490600586, "global_step": 125157, "epoch": 1507} {"train_loss": -22.744794845581055, "global_step": 125158, "epoch": 1507} {"train_loss": -22.625600814819336, "global_step": 125159, "epoch": 1507} {"train_loss": -22.546518325805664, "global_step": 125160, "epoch": 1507} {"train_loss": -22.508466720581055, "global_step": 125161, "epoch": 1507} {"train_loss": -22.615081787109375, "global_step": 125162, "epoch": 1507} {"train_loss": -22.593806760856904, "global_step": 125163, "epoch": 1507, "val_loss": 6138668.0} {"train_loss": -22.25457763671875, "global_step": 125164, "epoch": 1508} {"train_loss": -22.250608444213867, "global_step": 125165, "epoch": 1508} {"train_loss": -22.229812622070312, "global_step": 125166, "epoch": 1508} {"train_loss": -22.34696388244629, "global_step": 125167, "epoch": 1508} {"train_loss": -22.260305404663086, "global_step": 125168, "epoch": 1508} {"train_loss": -22.315351486206055, "global_step": 125169, "epoch": 1508} {"train_loss": -22.139934539794922, "global_step": 125170, "epoch": 1508} {"train_loss": -21.713069915771484, "global_step": 125171, "epoch": 1508} {"train_loss": -21.79051399230957, "global_step": 125172, "epoch": 1508} {"train_loss": -22.53720474243164, "global_step": 125173, "epoch": 1508} {"train_loss": -22.513837814331055, "global_step": 125174, "epoch": 1508} {"train_loss": -22.38245964050293, "global_step": 125175, "epoch": 1508} {"train_loss": -22.408227920532227, "global_step": 125176, "epoch": 1508} {"train_loss": -22.660131454467773, "global_step": 125177, "epoch": 1508} {"train_loss": -22.413373947143555, "global_step": 125178, "epoch": 1508} {"train_loss": -22.284284591674805, "global_step": 125179, "epoch": 1508} {"train_loss": -22.329923629760742, "global_step": 125180, "epoch": 1508} {"train_loss": -22.37432289123535, "global_step": 125181, "epoch": 1508} {"train_loss": -22.694128036499023, "global_step": 125182, "epoch": 1508} {"train_loss": -22.528717041015625, "global_step": 125183, "epoch": 1508} {"train_loss": -22.515438079833984, "global_step": 125184, "epoch": 1508} {"train_loss": -22.625564575195312, "global_step": 125185, "epoch": 1508} {"train_loss": -22.220508575439453, "global_step": 125186, "epoch": 1508} {"train_loss": -22.991575241088867, "global_step": 125187, "epoch": 1508} {"train_loss": -22.846158981323242, "global_step": 125188, "epoch": 1508} {"train_loss": -22.56569480895996, "global_step": 125189, "epoch": 1508} {"train_loss": -22.244457244873047, "global_step": 125190, "epoch": 1508} {"train_loss": -22.510929107666016, "global_step": 125191, "epoch": 1508} {"train_loss": -22.927244186401367, "global_step": 125192, "epoch": 1508} {"train_loss": -22.445539474487305, "global_step": 125193, "epoch": 1508} {"train_loss": -22.8404598236084, "global_step": 125194, "epoch": 1508} {"train_loss": -22.646808624267578, "global_step": 125195, "epoch": 1508} {"train_loss": -23.12666893005371, "global_step": 125196, "epoch": 1508} {"train_loss": -22.512571334838867, "global_step": 125197, "epoch": 1508} {"train_loss": -22.54706573486328, "global_step": 125198, "epoch": 1508} {"train_loss": -22.71945571899414, "global_step": 125199, "epoch": 1508} {"train_loss": -22.920303344726562, "global_step": 125200, "epoch": 1508} {"train_loss": -22.67222023010254, "global_step": 125201, "epoch": 1508} {"train_loss": -23.018896102905273, "global_step": 125202, "epoch": 1508} {"train_loss": -22.55340003967285, "global_step": 125203, "epoch": 1508} {"train_loss": -22.607629776000977, "global_step": 125204, "epoch": 1508} {"train_loss": -22.497421264648438, "global_step": 125205, "epoch": 1508} {"train_loss": -22.47317886352539, "global_step": 125206, "epoch": 1508} {"train_loss": -22.990148544311523, "global_step": 125207, "epoch": 1508} {"train_loss": -22.2989444732666, "global_step": 125208, "epoch": 1508} {"train_loss": -22.670408248901367, "global_step": 125209, "epoch": 1508} {"train_loss": -22.635953903198242, "global_step": 125210, "epoch": 1508} {"train_loss": -22.77046775817871, "global_step": 125211, "epoch": 1508} {"train_loss": -22.6375789642334, "global_step": 125212, "epoch": 1508} {"train_loss": -22.61734390258789, "global_step": 125213, "epoch": 1508} {"train_loss": -22.563861846923828, "global_step": 125214, "epoch": 1508} {"train_loss": -23.101381301879883, "global_step": 125215, "epoch": 1508} {"train_loss": -22.496442794799805, "global_step": 125216, "epoch": 1508} {"train_loss": -22.689931869506836, "global_step": 125217, "epoch": 1508} {"train_loss": -22.638381958007812, "global_step": 125218, "epoch": 1508} {"train_loss": -22.642253875732422, "global_step": 125219, "epoch": 1508} {"train_loss": -22.14578628540039, "global_step": 125220, "epoch": 1508} {"train_loss": -23.05918312072754, "global_step": 125221, "epoch": 1508} {"train_loss": -22.7559757232666, "global_step": 125222, "epoch": 1508} {"train_loss": -22.803653717041016, "global_step": 125223, "epoch": 1508} {"train_loss": -22.704391479492188, "global_step": 125224, "epoch": 1508} {"train_loss": -22.6907901763916, "global_step": 125225, "epoch": 1508} {"train_loss": -23.002819061279297, "global_step": 125226, "epoch": 1508} {"train_loss": -23.31326675415039, "global_step": 125227, "epoch": 1508} {"train_loss": -22.912702560424805, "global_step": 125228, "epoch": 1508} {"train_loss": -22.4619197845459, "global_step": 125229, "epoch": 1508} {"train_loss": -23.265735626220703, "global_step": 125230, "epoch": 1508} {"train_loss": -22.78409194946289, "global_step": 125231, "epoch": 1508} {"train_loss": -22.825000762939453, "global_step": 125232, "epoch": 1508} {"train_loss": -22.99344825744629, "global_step": 125233, "epoch": 1508} {"train_loss": -22.843107223510742, "global_step": 125234, "epoch": 1508} {"train_loss": -23.013111114501953, "global_step": 125235, "epoch": 1508} {"train_loss": -23.183059692382812, "global_step": 125236, "epoch": 1508} {"train_loss": -22.624120712280273, "global_step": 125237, "epoch": 1508} {"train_loss": -22.529239654541016, "global_step": 125238, "epoch": 1508} {"train_loss": -22.597375869750977, "global_step": 125239, "epoch": 1508} {"train_loss": -23.191396713256836, "global_step": 125240, "epoch": 1508} {"train_loss": -22.745832443237305, "global_step": 125241, "epoch": 1508} {"train_loss": -22.55356788635254, "global_step": 125242, "epoch": 1508} {"train_loss": -22.613529205322266, "global_step": 125243, "epoch": 1508} {"train_loss": -22.793882369995117, "global_step": 125244, "epoch": 1508} {"train_loss": -22.667041778564453, "global_step": 125245, "epoch": 1508} {"train_loss": -22.633555998285132, "global_step": 125246, "epoch": 1508, "val_loss": 6150765.5} {"train_loss": -21.58102035522461, "global_step": 125247, "epoch": 1509} {"train_loss": -20.975372314453125, "global_step": 125248, "epoch": 1509} {"train_loss": -21.9775390625, "global_step": 125249, "epoch": 1509} {"train_loss": -21.734668731689453, "global_step": 125250, "epoch": 1509} {"train_loss": -21.88371467590332, "global_step": 125251, "epoch": 1509} {"train_loss": -21.81448745727539, "global_step": 125252, "epoch": 1509} {"train_loss": -22.363996505737305, "global_step": 125253, "epoch": 1509} {"train_loss": -21.604707717895508, "global_step": 125254, "epoch": 1509} {"train_loss": -22.3259334564209, "global_step": 125255, "epoch": 1509} {"train_loss": -22.221603393554688, "global_step": 125256, "epoch": 1509} {"train_loss": -21.87274742126465, "global_step": 125257, "epoch": 1509} {"train_loss": -22.001018524169922, "global_step": 125258, "epoch": 1509} {"train_loss": -22.020872116088867, "global_step": 125259, "epoch": 1509} {"train_loss": -22.38443946838379, "global_step": 125260, "epoch": 1509} {"train_loss": -22.08833122253418, "global_step": 125261, "epoch": 1509} {"train_loss": -22.195241928100586, "global_step": 125262, "epoch": 1509} {"train_loss": -21.887170791625977, "global_step": 125263, "epoch": 1509} {"train_loss": -22.380706787109375, "global_step": 125264, "epoch": 1509} {"train_loss": -22.519277572631836, "global_step": 125265, "epoch": 1509} {"train_loss": -21.814695358276367, "global_step": 125266, "epoch": 1509} {"train_loss": -22.458688735961914, "global_step": 125267, "epoch": 1509} {"train_loss": -22.4747314453125, "global_step": 125268, "epoch": 1509} {"train_loss": -22.42827796936035, "global_step": 125269, "epoch": 1509} {"train_loss": -22.496984481811523, "global_step": 125270, "epoch": 1509} {"train_loss": -22.393205642700195, "global_step": 125271, "epoch": 1509} {"train_loss": -22.532278060913086, "global_step": 125272, "epoch": 1509} {"train_loss": -22.2180233001709, "global_step": 125273, "epoch": 1509} {"train_loss": -22.393415451049805, "global_step": 125274, "epoch": 1509} {"train_loss": -22.572280883789062, "global_step": 125275, "epoch": 1509} {"train_loss": -22.52828025817871, "global_step": 125276, "epoch": 1509} {"train_loss": -22.618331909179688, "global_step": 125277, "epoch": 1509} {"train_loss": -22.654203414916992, "global_step": 125278, "epoch": 1509} {"train_loss": -22.497085571289062, "global_step": 125279, "epoch": 1509} {"train_loss": -22.64487075805664, "global_step": 125280, "epoch": 1509} {"train_loss": -22.79336929321289, "global_step": 125281, "epoch": 1509} {"train_loss": -22.619707107543945, "global_step": 125282, "epoch": 1509} {"train_loss": -22.689775466918945, "global_step": 125283, "epoch": 1509} {"train_loss": -22.672462463378906, "global_step": 125284, "epoch": 1509} {"train_loss": -22.496068954467773, "global_step": 125285, "epoch": 1509} {"train_loss": -22.679861068725586, "global_step": 125286, "epoch": 1509} {"train_loss": -22.73116111755371, "global_step": 125287, "epoch": 1509} {"train_loss": -22.751745223999023, "global_step": 125288, "epoch": 1509} {"train_loss": -22.59885025024414, "global_step": 125289, "epoch": 1509} {"train_loss": -22.59766960144043, "global_step": 125290, "epoch": 1509} {"train_loss": -22.699588775634766, "global_step": 125291, "epoch": 1509} {"train_loss": -22.507658004760742, "global_step": 125292, "epoch": 1509} {"train_loss": -22.611989974975586, "global_step": 125293, "epoch": 1509} {"train_loss": -22.802330017089844, "global_step": 125294, "epoch": 1509} {"train_loss": -22.526933670043945, "global_step": 125295, "epoch": 1509} {"train_loss": -22.7020263671875, "global_step": 125296, "epoch": 1509} {"train_loss": -22.50600242614746, "global_step": 125297, "epoch": 1509} {"train_loss": -22.394163131713867, "global_step": 125298, "epoch": 1509} {"train_loss": -22.766000747680664, "global_step": 125299, "epoch": 1509} {"train_loss": -22.48264503479004, "global_step": 125300, "epoch": 1509} {"train_loss": -22.47957420349121, "global_step": 125301, "epoch": 1509} {"train_loss": -22.39774513244629, "global_step": 125302, "epoch": 1509} {"train_loss": -22.71942138671875, "global_step": 125303, "epoch": 1509} {"train_loss": -22.776660919189453, "global_step": 125304, "epoch": 1509} {"train_loss": -22.593175888061523, "global_step": 125305, "epoch": 1509} {"train_loss": -22.602136611938477, "global_step": 125306, "epoch": 1509} {"train_loss": -22.679288864135742, "global_step": 125307, "epoch": 1509} {"train_loss": -22.724180221557617, "global_step": 125308, "epoch": 1509} {"train_loss": -22.53748893737793, "global_step": 125309, "epoch": 1509} {"train_loss": -22.822158813476562, "global_step": 125310, "epoch": 1509} {"train_loss": -22.69683265686035, "global_step": 125311, "epoch": 1509} {"train_loss": -22.793174743652344, "global_step": 125312, "epoch": 1509} {"train_loss": -22.538427352905273, "global_step": 125313, "epoch": 1509} {"train_loss": -22.801008224487305, "global_step": 125314, "epoch": 1509} {"train_loss": -22.719745635986328, "global_step": 125315, "epoch": 1509} {"train_loss": -22.655820846557617, "global_step": 125316, "epoch": 1509} {"train_loss": -22.481550216674805, "global_step": 125317, "epoch": 1509} {"train_loss": -22.77667236328125, "global_step": 125318, "epoch": 1509} {"train_loss": -23.03106689453125, "global_step": 125319, "epoch": 1509} {"train_loss": -22.35353660583496, "global_step": 125320, "epoch": 1509} {"train_loss": -22.528215408325195, "global_step": 125321, "epoch": 1509} {"train_loss": -22.98838233947754, "global_step": 125322, "epoch": 1509} {"train_loss": -22.826047897338867, "global_step": 125323, "epoch": 1509} {"train_loss": -22.13069725036621, "global_step": 125324, "epoch": 1509} {"train_loss": -22.557140350341797, "global_step": 125325, "epoch": 1509} {"train_loss": -22.832441329956055, "global_step": 125326, "epoch": 1509} {"train_loss": -22.65779685974121, "global_step": 125327, "epoch": 1509} {"train_loss": -22.373279571533203, "global_step": 125328, "epoch": 1509} {"train_loss": -22.449042952204326, "global_step": 125329, "epoch": 1509, "val_loss": 6296338.0} {"train_loss": -22.265689849853516, "global_step": 125330, "epoch": 1510} {"train_loss": -22.035818099975586, "global_step": 125331, "epoch": 1510} {"train_loss": -22.356246948242188, "global_step": 125332, "epoch": 1510} {"train_loss": -22.038259506225586, "global_step": 125333, "epoch": 1510} {"train_loss": -21.660554885864258, "global_step": 125334, "epoch": 1510} {"train_loss": -22.456787109375, "global_step": 125335, "epoch": 1510} {"train_loss": -22.122684478759766, "global_step": 125336, "epoch": 1510} {"train_loss": -22.138408660888672, "global_step": 125337, "epoch": 1510} {"train_loss": -22.201440811157227, "global_step": 125338, "epoch": 1510} {"train_loss": -22.015817642211914, "global_step": 125339, "epoch": 1510} {"train_loss": -22.404891967773438, "global_step": 125340, "epoch": 1510} {"train_loss": -22.4146671295166, "global_step": 125341, "epoch": 1510} {"train_loss": -22.350658416748047, "global_step": 125342, "epoch": 1510} {"train_loss": -22.557621002197266, "global_step": 125343, "epoch": 1510} {"train_loss": -22.438337326049805, "global_step": 125344, "epoch": 1510} {"train_loss": -22.405298233032227, "global_step": 125345, "epoch": 1510} {"train_loss": -22.630037307739258, "global_step": 125346, "epoch": 1510} {"train_loss": -22.30161476135254, "global_step": 125347, "epoch": 1510} {"train_loss": -22.473270416259766, "global_step": 125348, "epoch": 1510} {"train_loss": -22.726226806640625, "global_step": 125349, "epoch": 1510} {"train_loss": -22.734962463378906, "global_step": 125350, "epoch": 1510} {"train_loss": -22.79669189453125, "global_step": 125351, "epoch": 1510} {"train_loss": -22.520456314086914, "global_step": 125352, "epoch": 1510} {"train_loss": -23.019548416137695, "global_step": 125353, "epoch": 1510} {"train_loss": -22.503257751464844, "global_step": 125354, "epoch": 1510} {"train_loss": -22.34587287902832, "global_step": 125355, "epoch": 1510} {"train_loss": -22.509950637817383, "global_step": 125356, "epoch": 1510} {"train_loss": -22.629972457885742, "global_step": 125357, "epoch": 1510} {"train_loss": -22.506620407104492, "global_step": 125358, "epoch": 1510} {"train_loss": -22.566190719604492, "global_step": 125359, "epoch": 1510} {"train_loss": -22.868467330932617, "global_step": 125360, "epoch": 1510} {"train_loss": -22.97614097595215, "global_step": 125361, "epoch": 1510} {"train_loss": -22.38709259033203, "global_step": 125362, "epoch": 1510} {"train_loss": -22.7163143157959, "global_step": 125363, "epoch": 1510} {"train_loss": -22.591672897338867, "global_step": 125364, "epoch": 1510} {"train_loss": -22.460922241210938, "global_step": 125365, "epoch": 1510} {"train_loss": -22.613882064819336, "global_step": 125366, "epoch": 1510} {"train_loss": -22.265581130981445, "global_step": 125367, "epoch": 1510} {"train_loss": -22.797931671142578, "global_step": 125368, "epoch": 1510} {"train_loss": -22.879072189331055, "global_step": 125369, "epoch": 1510} {"train_loss": -22.54168128967285, "global_step": 125370, "epoch": 1510} {"train_loss": -23.018362045288086, "global_step": 125371, "epoch": 1510} {"train_loss": -23.110490798950195, "global_step": 125372, "epoch": 1510} {"train_loss": -22.940622329711914, "global_step": 125373, "epoch": 1510} {"train_loss": -23.043546676635742, "global_step": 125374, "epoch": 1510} {"train_loss": -22.87166404724121, "global_step": 125375, "epoch": 1510} {"train_loss": -22.780746459960938, "global_step": 125376, "epoch": 1510} {"train_loss": -22.80339241027832, "global_step": 125377, "epoch": 1510} {"train_loss": -22.86250877380371, "global_step": 125378, "epoch": 1510} {"train_loss": -22.942628860473633, "global_step": 125379, "epoch": 1510} {"train_loss": -23.138652801513672, "global_step": 125380, "epoch": 1510} {"train_loss": -22.85906982421875, "global_step": 125381, "epoch": 1510} {"train_loss": -22.784372329711914, "global_step": 125382, "epoch": 1510} {"train_loss": -22.845211029052734, "global_step": 125383, "epoch": 1510} {"train_loss": -22.773399353027344, "global_step": 125384, "epoch": 1510} {"train_loss": -22.59099769592285, "global_step": 125385, "epoch": 1510} {"train_loss": -22.425901412963867, "global_step": 125386, "epoch": 1510} {"train_loss": -22.527341842651367, "global_step": 125387, "epoch": 1510} {"train_loss": -22.593313217163086, "global_step": 125388, "epoch": 1510} {"train_loss": -22.546232223510742, "global_step": 125389, "epoch": 1510} {"train_loss": -22.60331153869629, "global_step": 125390, "epoch": 1510} {"train_loss": -22.369543075561523, "global_step": 125391, "epoch": 1510} {"train_loss": -22.633743286132812, "global_step": 125392, "epoch": 1510} {"train_loss": -22.47694206237793, "global_step": 125393, "epoch": 1510} {"train_loss": -22.260883331298828, "global_step": 125394, "epoch": 1510} {"train_loss": -22.568716049194336, "global_step": 125395, "epoch": 1510} {"train_loss": -22.608041763305664, "global_step": 125396, "epoch": 1510} {"train_loss": -22.545042037963867, "global_step": 125397, "epoch": 1510} {"train_loss": -22.375213623046875, "global_step": 125398, "epoch": 1510} {"train_loss": -22.42085838317871, "global_step": 125399, "epoch": 1510} {"train_loss": -22.490530014038086, "global_step": 125400, "epoch": 1510} {"train_loss": -22.342376708984375, "global_step": 125401, "epoch": 1510} {"train_loss": -22.516517639160156, "global_step": 125402, "epoch": 1510} {"train_loss": -22.448740005493164, "global_step": 125403, "epoch": 1510} {"train_loss": -22.490697860717773, "global_step": 125404, "epoch": 1510} {"train_loss": -22.897014617919922, "global_step": 125405, "epoch": 1510} {"train_loss": -22.438461303710938, "global_step": 125406, "epoch": 1510} {"train_loss": -22.673967361450195, "global_step": 125407, "epoch": 1510} {"train_loss": -22.827844619750977, "global_step": 125408, "epoch": 1510} {"train_loss": -22.537372589111328, "global_step": 125409, "epoch": 1510} {"train_loss": -22.877737045288086, "global_step": 125410, "epoch": 1510} {"train_loss": -22.662748336791992, "global_step": 125411, "epoch": 1510} {"train_loss": -22.58721705517137, "global_step": 125412, "epoch": 1510, "val_loss": 6278431.0} {"train_loss": -22.795713424682617, "global_step": 125413, "epoch": 1511} {"train_loss": -22.651775360107422, "global_step": 125414, "epoch": 1511} {"train_loss": -22.301862716674805, "global_step": 125415, "epoch": 1511} {"train_loss": -22.65382957458496, "global_step": 125416, "epoch": 1511} {"train_loss": -22.67380142211914, "global_step": 125417, "epoch": 1511} {"train_loss": -22.401216506958008, "global_step": 125418, "epoch": 1511} {"train_loss": -22.532669067382812, "global_step": 125419, "epoch": 1511} {"train_loss": -22.211469650268555, "global_step": 125420, "epoch": 1511} {"train_loss": -22.691099166870117, "global_step": 125421, "epoch": 1511} {"train_loss": -22.68990135192871, "global_step": 125422, "epoch": 1511} {"train_loss": -22.66211700439453, "global_step": 125423, "epoch": 1511} {"train_loss": -22.383773803710938, "global_step": 125424, "epoch": 1511} {"train_loss": -22.515470504760742, "global_step": 125425, "epoch": 1511} {"train_loss": -22.513235092163086, "global_step": 125426, "epoch": 1511} {"train_loss": -22.367643356323242, "global_step": 125427, "epoch": 1511} {"train_loss": -22.678577423095703, "global_step": 125428, "epoch": 1511} {"train_loss": -22.405414581298828, "global_step": 125429, "epoch": 1511} {"train_loss": -22.620925903320312, "global_step": 125430, "epoch": 1511} {"train_loss": -22.530319213867188, "global_step": 125431, "epoch": 1511} {"train_loss": -22.881370544433594, "global_step": 125432, "epoch": 1511} {"train_loss": -22.434555053710938, "global_step": 125433, "epoch": 1511} {"train_loss": -22.832767486572266, "global_step": 125434, "epoch": 1511} {"train_loss": -22.273244857788086, "global_step": 125435, "epoch": 1511} {"train_loss": -23.009220123291016, "global_step": 125436, "epoch": 1511} {"train_loss": -22.223276138305664, "global_step": 125437, "epoch": 1511} {"train_loss": -22.305017471313477, "global_step": 125438, "epoch": 1511} {"train_loss": -22.632858276367188, "global_step": 125439, "epoch": 1511} {"train_loss": -22.576316833496094, "global_step": 125440, "epoch": 1511} {"train_loss": -22.568796157836914, "global_step": 125441, "epoch": 1511} {"train_loss": -22.62647819519043, "global_step": 125442, "epoch": 1511} {"train_loss": -22.442764282226562, "global_step": 125443, "epoch": 1511} {"train_loss": -22.113449096679688, "global_step": 125444, "epoch": 1511} {"train_loss": -22.653039932250977, "global_step": 125445, "epoch": 1511} {"train_loss": -22.343517303466797, "global_step": 125446, "epoch": 1511} {"train_loss": -22.62172508239746, "global_step": 125447, "epoch": 1511} {"train_loss": -22.404966354370117, "global_step": 125448, "epoch": 1511} {"train_loss": -22.564453125, "global_step": 125449, "epoch": 1511} {"train_loss": -22.614276885986328, "global_step": 125450, "epoch": 1511} {"train_loss": -22.751890182495117, "global_step": 125451, "epoch": 1511} {"train_loss": -22.733386993408203, "global_step": 125452, "epoch": 1511} {"train_loss": -22.595823287963867, "global_step": 125453, "epoch": 1511} {"train_loss": -22.811283111572266, "global_step": 125454, "epoch": 1511} {"train_loss": -22.821447372436523, "global_step": 125455, "epoch": 1511} {"train_loss": -22.551679611206055, "global_step": 125456, "epoch": 1511} {"train_loss": -23.097314834594727, "global_step": 125457, "epoch": 1511} {"train_loss": -22.457212448120117, "global_step": 125458, "epoch": 1511} {"train_loss": -22.548322677612305, "global_step": 125459, "epoch": 1511} {"train_loss": -22.93303871154785, "global_step": 125460, "epoch": 1511} {"train_loss": -22.786113739013672, "global_step": 125461, "epoch": 1511} {"train_loss": -23.21097183227539, "global_step": 125462, "epoch": 1511} {"train_loss": -22.77147674560547, "global_step": 125463, "epoch": 1511} {"train_loss": -22.524444580078125, "global_step": 125464, "epoch": 1511} {"train_loss": -22.567733764648438, "global_step": 125465, "epoch": 1511} {"train_loss": -22.708669662475586, "global_step": 125466, "epoch": 1511} {"train_loss": -22.849512100219727, "global_step": 125467, "epoch": 1511} {"train_loss": -22.34673309326172, "global_step": 125468, "epoch": 1511} {"train_loss": -22.390466690063477, "global_step": 125469, "epoch": 1511} {"train_loss": -22.715124130249023, "global_step": 125470, "epoch": 1511} {"train_loss": -22.697193145751953, "global_step": 125471, "epoch": 1511} {"train_loss": -22.642797470092773, "global_step": 125472, "epoch": 1511} {"train_loss": -22.56264305114746, "global_step": 125473, "epoch": 1511} {"train_loss": -22.323230743408203, "global_step": 125474, "epoch": 1511} {"train_loss": -22.9268856048584, "global_step": 125475, "epoch": 1511} {"train_loss": -22.90028190612793, "global_step": 125476, "epoch": 1511} {"train_loss": -22.949167251586914, "global_step": 125477, "epoch": 1511} {"train_loss": -22.626386642456055, "global_step": 125478, "epoch": 1511} {"train_loss": -22.85492706298828, "global_step": 125479, "epoch": 1511} {"train_loss": -22.941051483154297, "global_step": 125480, "epoch": 1511} {"train_loss": -23.25537109375, "global_step": 125481, "epoch": 1511} {"train_loss": -22.603376388549805, "global_step": 125482, "epoch": 1511} {"train_loss": -22.87810707092285, "global_step": 125483, "epoch": 1511} {"train_loss": -22.759916305541992, "global_step": 125484, "epoch": 1511} {"train_loss": -22.64674949645996, "global_step": 125485, "epoch": 1511} {"train_loss": -22.594663619995117, "global_step": 125486, "epoch": 1511} {"train_loss": -22.87530517578125, "global_step": 125487, "epoch": 1511} {"train_loss": -22.936935424804688, "global_step": 125488, "epoch": 1511} {"train_loss": -22.759437561035156, "global_step": 125489, "epoch": 1511} {"train_loss": -22.663427352905273, "global_step": 125490, "epoch": 1511} {"train_loss": -22.676259994506836, "global_step": 125491, "epoch": 1511} {"train_loss": -22.764028549194336, "global_step": 125492, "epoch": 1511} {"train_loss": -22.289352416992188, "global_step": 125493, "epoch": 1511} {"train_loss": -22.697805404663086, "global_step": 125494, "epoch": 1511} {"train_loss": -22.630631757069782, "global_step": 125495, "epoch": 1511, "val_loss": 6244971.5} {"train_loss": -21.89165687561035, "global_step": 125496, "epoch": 1512} {"train_loss": -22.274063110351562, "global_step": 125497, "epoch": 1512} {"train_loss": -22.676889419555664, "global_step": 125498, "epoch": 1512} {"train_loss": -21.617795944213867, "global_step": 125499, "epoch": 1512} {"train_loss": -22.781118392944336, "global_step": 125500, "epoch": 1512} {"train_loss": -21.55484390258789, "global_step": 125501, "epoch": 1512} {"train_loss": -22.90492057800293, "global_step": 125502, "epoch": 1512} {"train_loss": -22.1125545501709, "global_step": 125503, "epoch": 1512} {"train_loss": -22.560256958007812, "global_step": 125504, "epoch": 1512} {"train_loss": -21.97399139404297, "global_step": 125505, "epoch": 1512} {"train_loss": -22.620058059692383, "global_step": 125506, "epoch": 1512} {"train_loss": -22.767053604125977, "global_step": 125507, "epoch": 1512} {"train_loss": -22.343259811401367, "global_step": 125508, "epoch": 1512} {"train_loss": -22.472604751586914, "global_step": 125509, "epoch": 1512} {"train_loss": -22.007177352905273, "global_step": 125510, "epoch": 1512} {"train_loss": -22.52780532836914, "global_step": 125511, "epoch": 1512} {"train_loss": -22.439414978027344, "global_step": 125512, "epoch": 1512} {"train_loss": -22.500080108642578, "global_step": 125513, "epoch": 1512} {"train_loss": -22.655195236206055, "global_step": 125514, "epoch": 1512} {"train_loss": -22.4507999420166, "global_step": 125515, "epoch": 1512} {"train_loss": -22.03052520751953, "global_step": 125516, "epoch": 1512} {"train_loss": -22.801502227783203, "global_step": 125517, "epoch": 1512} {"train_loss": -22.567907333374023, "global_step": 125518, "epoch": 1512} {"train_loss": -22.37033462524414, "global_step": 125519, "epoch": 1512} {"train_loss": -22.320451736450195, "global_step": 125520, "epoch": 1512} {"train_loss": -23.037940979003906, "global_step": 125521, "epoch": 1512} {"train_loss": -22.346349716186523, "global_step": 125522, "epoch": 1512} {"train_loss": -22.71771812438965, "global_step": 125523, "epoch": 1512} {"train_loss": -22.36104393005371, "global_step": 125524, "epoch": 1512} {"train_loss": -22.861764907836914, "global_step": 125525, "epoch": 1512} {"train_loss": -22.434574127197266, "global_step": 125526, "epoch": 1512} {"train_loss": -22.733779907226562, "global_step": 125527, "epoch": 1512} {"train_loss": -22.43008804321289, "global_step": 125528, "epoch": 1512} {"train_loss": -22.62685203552246, "global_step": 125529, "epoch": 1512} {"train_loss": -23.104310989379883, "global_step": 125530, "epoch": 1512} {"train_loss": -22.51911735534668, "global_step": 125531, "epoch": 1512} {"train_loss": -22.304443359375, "global_step": 125532, "epoch": 1512} {"train_loss": -22.987228393554688, "global_step": 125533, "epoch": 1512} {"train_loss": -22.621244430541992, "global_step": 125534, "epoch": 1512} {"train_loss": -22.656341552734375, "global_step": 125535, "epoch": 1512} {"train_loss": -22.341588973999023, "global_step": 125536, "epoch": 1512} {"train_loss": -22.551349639892578, "global_step": 125537, "epoch": 1512} {"train_loss": -22.503068923950195, "global_step": 125538, "epoch": 1512} {"train_loss": -22.32924461364746, "global_step": 125539, "epoch": 1512} {"train_loss": -22.330970764160156, "global_step": 125540, "epoch": 1512} {"train_loss": -22.52589225769043, "global_step": 125541, "epoch": 1512} {"train_loss": -22.74323272705078, "global_step": 125542, "epoch": 1512} {"train_loss": -22.48984146118164, "global_step": 125543, "epoch": 1512} {"train_loss": -22.668607711791992, "global_step": 125544, "epoch": 1512} {"train_loss": -22.29909324645996, "global_step": 125545, "epoch": 1512} {"train_loss": -22.956647872924805, "global_step": 125546, "epoch": 1512} {"train_loss": -22.797264099121094, "global_step": 125547, "epoch": 1512} {"train_loss": -22.62535285949707, "global_step": 125548, "epoch": 1512} {"train_loss": -22.5892333984375, "global_step": 125549, "epoch": 1512} {"train_loss": -22.799097061157227, "global_step": 125550, "epoch": 1512} {"train_loss": -22.659610748291016, "global_step": 125551, "epoch": 1512} {"train_loss": -22.719703674316406, "global_step": 125552, "epoch": 1512} {"train_loss": -22.83270835876465, "global_step": 125553, "epoch": 1512} {"train_loss": -22.67323875427246, "global_step": 125554, "epoch": 1512} {"train_loss": -22.733333587646484, "global_step": 125555, "epoch": 1512} {"train_loss": -22.718978881835938, "global_step": 125556, "epoch": 1512} {"train_loss": -22.917583465576172, "global_step": 125557, "epoch": 1512} {"train_loss": -22.651508331298828, "global_step": 125558, "epoch": 1512} {"train_loss": -22.80095863342285, "global_step": 125559, "epoch": 1512} {"train_loss": -22.802589416503906, "global_step": 125560, "epoch": 1512} {"train_loss": -22.81077003479004, "global_step": 125561, "epoch": 1512} {"train_loss": -22.34800148010254, "global_step": 125562, "epoch": 1512} {"train_loss": -22.65754508972168, "global_step": 125563, "epoch": 1512} {"train_loss": -22.495731353759766, "global_step": 125564, "epoch": 1512} {"train_loss": -22.66362762451172, "global_step": 125565, "epoch": 1512} {"train_loss": -22.725427627563477, "global_step": 125566, "epoch": 1512} {"train_loss": -22.757339477539062, "global_step": 125567, "epoch": 1512} {"train_loss": -22.7674617767334, "global_step": 125568, "epoch": 1512} {"train_loss": -22.673978805541992, "global_step": 125569, "epoch": 1512} {"train_loss": -22.7713680267334, "global_step": 125570, "epoch": 1512} {"train_loss": -22.461572647094727, "global_step": 125571, "epoch": 1512} {"train_loss": -22.6483097076416, "global_step": 125572, "epoch": 1512} {"train_loss": -22.70118522644043, "global_step": 125573, "epoch": 1512} {"train_loss": -22.86147117614746, "global_step": 125574, "epoch": 1512} {"train_loss": -23.253652572631836, "global_step": 125575, "epoch": 1512} {"train_loss": -22.633939743041992, "global_step": 125576, "epoch": 1512} {"train_loss": -22.504966735839844, "global_step": 125577, "epoch": 1512} {"train_loss": -22.583699077008717, "global_step": 125578, "epoch": 1512, "val_loss": 6239304.5} {"train_loss": -22.799175262451172, "global_step": 125579, "epoch": 1513} {"train_loss": -22.489456176757812, "global_step": 125580, "epoch": 1513} {"train_loss": -22.683380126953125, "global_step": 125581, "epoch": 1513} {"train_loss": -22.14719009399414, "global_step": 125582, "epoch": 1513} {"train_loss": -22.464262008666992, "global_step": 125583, "epoch": 1513} {"train_loss": -22.46644401550293, "global_step": 125584, "epoch": 1513} {"train_loss": -22.267526626586914, "global_step": 125585, "epoch": 1513} {"train_loss": -22.412321090698242, "global_step": 125586, "epoch": 1513} {"train_loss": -22.548601150512695, "global_step": 125587, "epoch": 1513} {"train_loss": -22.6973876953125, "global_step": 125588, "epoch": 1513} {"train_loss": -22.83806037902832, "global_step": 125589, "epoch": 1513} {"train_loss": -22.686874389648438, "global_step": 125590, "epoch": 1513} {"train_loss": -22.24886131286621, "global_step": 125591, "epoch": 1513} {"train_loss": -22.323562622070312, "global_step": 125592, "epoch": 1513} {"train_loss": -22.73786735534668, "global_step": 125593, "epoch": 1513} {"train_loss": -22.620607376098633, "global_step": 125594, "epoch": 1513} {"train_loss": -22.733112335205078, "global_step": 125595, "epoch": 1513} {"train_loss": -22.15187644958496, "global_step": 125596, "epoch": 1513} {"train_loss": -22.5665283203125, "global_step": 125597, "epoch": 1513} {"train_loss": -22.729799270629883, "global_step": 125598, "epoch": 1513} {"train_loss": -22.645952224731445, "global_step": 125599, "epoch": 1513} {"train_loss": -22.304031372070312, "global_step": 125600, "epoch": 1513} {"train_loss": -22.420610427856445, "global_step": 125601, "epoch": 1513} {"train_loss": -22.609922409057617, "global_step": 125602, "epoch": 1513} {"train_loss": -22.672056198120117, "global_step": 125603, "epoch": 1513} {"train_loss": -22.241735458374023, "global_step": 125604, "epoch": 1513} {"train_loss": -22.55083465576172, "global_step": 125605, "epoch": 1513} {"train_loss": -22.68829917907715, "global_step": 125606, "epoch": 1513} {"train_loss": -22.655614852905273, "global_step": 125607, "epoch": 1513} {"train_loss": -22.417682647705078, "global_step": 125608, "epoch": 1513} {"train_loss": -22.78232192993164, "global_step": 125609, "epoch": 1513} {"train_loss": -22.48732566833496, "global_step": 125610, "epoch": 1513} {"train_loss": -22.59804344177246, "global_step": 125611, "epoch": 1513} {"train_loss": -22.636037826538086, "global_step": 125612, "epoch": 1513} {"train_loss": -22.264060974121094, "global_step": 125613, "epoch": 1513} {"train_loss": -22.896055221557617, "global_step": 125614, "epoch": 1513} {"train_loss": -22.38423728942871, "global_step": 125615, "epoch": 1513} {"train_loss": -22.62286376953125, "global_step": 125616, "epoch": 1513} {"train_loss": -22.887226104736328, "global_step": 125617, "epoch": 1513} {"train_loss": -22.7663631439209, "global_step": 125618, "epoch": 1513} {"train_loss": -22.713010787963867, "global_step": 125619, "epoch": 1513} {"train_loss": -22.65195655822754, "global_step": 125620, "epoch": 1513} {"train_loss": -22.13016700744629, "global_step": 125621, "epoch": 1513} {"train_loss": -22.87244987487793, "global_step": 125622, "epoch": 1513} {"train_loss": -22.670682907104492, "global_step": 125623, "epoch": 1513} {"train_loss": -23.245317459106445, "global_step": 125624, "epoch": 1513} {"train_loss": -22.641504287719727, "global_step": 125625, "epoch": 1513} {"train_loss": -22.921585083007812, "global_step": 125626, "epoch": 1513} {"train_loss": -22.6823787689209, "global_step": 125627, "epoch": 1513} {"train_loss": -22.894224166870117, "global_step": 125628, "epoch": 1513} {"train_loss": -22.88307762145996, "global_step": 125629, "epoch": 1513} {"train_loss": -22.486709594726562, "global_step": 125630, "epoch": 1513} {"train_loss": -22.79119110107422, "global_step": 125631, "epoch": 1513} {"train_loss": -22.47705078125, "global_step": 125632, "epoch": 1513} {"train_loss": -22.87334442138672, "global_step": 125633, "epoch": 1513} {"train_loss": -22.680631637573242, "global_step": 125634, "epoch": 1513} {"train_loss": -22.719343185424805, "global_step": 125635, "epoch": 1513} {"train_loss": -22.666580200195312, "global_step": 125636, "epoch": 1513} {"train_loss": -22.90204429626465, "global_step": 125637, "epoch": 1513} {"train_loss": -22.967121124267578, "global_step": 125638, "epoch": 1513} {"train_loss": -22.66343116760254, "global_step": 125639, "epoch": 1513} {"train_loss": -22.782461166381836, "global_step": 125640, "epoch": 1513} {"train_loss": -22.84077262878418, "global_step": 125641, "epoch": 1513} {"train_loss": -22.58298683166504, "global_step": 125642, "epoch": 1513} {"train_loss": -22.859920501708984, "global_step": 125643, "epoch": 1513} {"train_loss": -22.508651733398438, "global_step": 125644, "epoch": 1513} {"train_loss": -22.677518844604492, "global_step": 125645, "epoch": 1513} {"train_loss": -22.701679229736328, "global_step": 125646, "epoch": 1513} {"train_loss": -22.683292388916016, "global_step": 125647, "epoch": 1513} {"train_loss": -22.626331329345703, "global_step": 125648, "epoch": 1513} {"train_loss": -22.595422744750977, "global_step": 125649, "epoch": 1513} {"train_loss": -22.79619789123535, "global_step": 125650, "epoch": 1513} {"train_loss": -22.626083374023438, "global_step": 125651, "epoch": 1513} {"train_loss": -22.76999282836914, "global_step": 125652, "epoch": 1513} {"train_loss": -22.529096603393555, "global_step": 125653, "epoch": 1513} {"train_loss": -22.659027099609375, "global_step": 125654, "epoch": 1513} {"train_loss": -22.981721878051758, "global_step": 125655, "epoch": 1513} {"train_loss": -22.69414710998535, "global_step": 125656, "epoch": 1513} {"train_loss": -22.47159194946289, "global_step": 125657, "epoch": 1513} {"train_loss": -22.546157836914062, "global_step": 125658, "epoch": 1513} {"train_loss": -22.57847785949707, "global_step": 125659, "epoch": 1513} {"train_loss": -22.605220794677734, "global_step": 125660, "epoch": 1513} {"train_loss": -22.624192134443536, "global_step": 125661, "epoch": 1513, "val_loss": 6305668.5} {"train_loss": -22.69854736328125, "global_step": 125662, "epoch": 1514} {"train_loss": -21.85381507873535, "global_step": 125663, "epoch": 1514} {"train_loss": -22.05031967163086, "global_step": 125664, "epoch": 1514} {"train_loss": -22.157394409179688, "global_step": 125665, "epoch": 1514} {"train_loss": -22.455305099487305, "global_step": 125666, "epoch": 1514} {"train_loss": -22.097900390625, "global_step": 125667, "epoch": 1514} {"train_loss": -22.487041473388672, "global_step": 125668, "epoch": 1514} {"train_loss": -22.739582061767578, "global_step": 125669, "epoch": 1514} {"train_loss": -22.555448532104492, "global_step": 125670, "epoch": 1514} {"train_loss": -22.644100189208984, "global_step": 125671, "epoch": 1514} {"train_loss": -22.362546920776367, "global_step": 125672, "epoch": 1514} {"train_loss": -22.390363693237305, "global_step": 125673, "epoch": 1514} {"train_loss": -22.287525177001953, "global_step": 125674, "epoch": 1514} {"train_loss": -22.35727310180664, "global_step": 125675, "epoch": 1514} {"train_loss": -22.368701934814453, "global_step": 125676, "epoch": 1514} {"train_loss": -22.840972900390625, "global_step": 125677, "epoch": 1514} {"train_loss": -22.753522872924805, "global_step": 125678, "epoch": 1514} {"train_loss": -22.76848030090332, "global_step": 125679, "epoch": 1514} {"train_loss": -22.505319595336914, "global_step": 125680, "epoch": 1514} {"train_loss": -22.5527400970459, "global_step": 125681, "epoch": 1514} {"train_loss": -22.835851669311523, "global_step": 125682, "epoch": 1514} {"train_loss": -22.426713943481445, "global_step": 125683, "epoch": 1514} {"train_loss": -22.917211532592773, "global_step": 125684, "epoch": 1514} {"train_loss": -22.933908462524414, "global_step": 125685, "epoch": 1514} {"train_loss": -22.389856338500977, "global_step": 125686, "epoch": 1514} {"train_loss": -22.462255477905273, "global_step": 125687, "epoch": 1514} {"train_loss": -22.869356155395508, "global_step": 125688, "epoch": 1514} {"train_loss": -22.632171630859375, "global_step": 125689, "epoch": 1514} {"train_loss": -22.86214256286621, "global_step": 125690, "epoch": 1514} {"train_loss": -22.74818229675293, "global_step": 125691, "epoch": 1514} {"train_loss": -22.931821823120117, "global_step": 125692, "epoch": 1514} {"train_loss": -22.564138412475586, "global_step": 125693, "epoch": 1514} {"train_loss": -22.174470901489258, "global_step": 125694, "epoch": 1514} {"train_loss": -22.821290969848633, "global_step": 125695, "epoch": 1514} {"train_loss": -22.55649185180664, "global_step": 125696, "epoch": 1514} {"train_loss": -22.503219604492188, "global_step": 125697, "epoch": 1514} {"train_loss": -22.943716049194336, "global_step": 125698, "epoch": 1514} {"train_loss": -23.11860466003418, "global_step": 125699, "epoch": 1514} {"train_loss": -22.609333038330078, "global_step": 125700, "epoch": 1514} {"train_loss": -22.173782348632812, "global_step": 125701, "epoch": 1514} {"train_loss": -22.728900909423828, "global_step": 125702, "epoch": 1514} {"train_loss": -22.745328903198242, "global_step": 125703, "epoch": 1514} {"train_loss": -22.503576278686523, "global_step": 125704, "epoch": 1514} {"train_loss": -22.64986228942871, "global_step": 125705, "epoch": 1514} {"train_loss": -22.844039916992188, "global_step": 125706, "epoch": 1514} {"train_loss": -22.93741798400879, "global_step": 125707, "epoch": 1514} {"train_loss": -22.38272476196289, "global_step": 125708, "epoch": 1514} {"train_loss": -22.429943084716797, "global_step": 125709, "epoch": 1514} {"train_loss": -22.749412536621094, "global_step": 125710, "epoch": 1514} {"train_loss": -22.40911865234375, "global_step": 125711, "epoch": 1514} {"train_loss": -22.9556941986084, "global_step": 125712, "epoch": 1514} {"train_loss": -22.792072296142578, "global_step": 125713, "epoch": 1514} {"train_loss": -22.892499923706055, "global_step": 125714, "epoch": 1514} {"train_loss": -22.85658073425293, "global_step": 125715, "epoch": 1514} {"train_loss": -22.59956932067871, "global_step": 125716, "epoch": 1514} {"train_loss": -22.789173126220703, "global_step": 125717, "epoch": 1514} {"train_loss": -22.8890438079834, "global_step": 125718, "epoch": 1514} {"train_loss": -22.79139518737793, "global_step": 125719, "epoch": 1514} {"train_loss": -23.05055809020996, "global_step": 125720, "epoch": 1514} {"train_loss": -22.71433448791504, "global_step": 125721, "epoch": 1514} {"train_loss": -22.820043563842773, "global_step": 125722, "epoch": 1514} {"train_loss": -22.999780654907227, "global_step": 125723, "epoch": 1514} {"train_loss": -22.64838409423828, "global_step": 125724, "epoch": 1514} {"train_loss": -22.662364959716797, "global_step": 125725, "epoch": 1514} {"train_loss": -22.94594383239746, "global_step": 125726, "epoch": 1514} {"train_loss": -22.420963287353516, "global_step": 125727, "epoch": 1514} {"train_loss": -22.5268611907959, "global_step": 125728, "epoch": 1514} {"train_loss": -22.33922576904297, "global_step": 125729, "epoch": 1514} {"train_loss": -22.7955379486084, "global_step": 125730, "epoch": 1514} {"train_loss": -23.073530197143555, "global_step": 125731, "epoch": 1514} {"train_loss": -22.75688362121582, "global_step": 125732, "epoch": 1514} {"train_loss": -22.5361328125, "global_step": 125733, "epoch": 1514} {"train_loss": -22.42690086364746, "global_step": 125734, "epoch": 1514} {"train_loss": -22.242273330688477, "global_step": 125735, "epoch": 1514} {"train_loss": -22.274805068969727, "global_step": 125736, "epoch": 1514} {"train_loss": -22.279300689697266, "global_step": 125737, "epoch": 1514} {"train_loss": -22.616382598876953, "global_step": 125738, "epoch": 1514} {"train_loss": -22.828683853149414, "global_step": 125739, "epoch": 1514} {"train_loss": -22.851064682006836, "global_step": 125740, "epoch": 1514} {"train_loss": -22.720977783203125, "global_step": 125741, "epoch": 1514} {"train_loss": -22.240644454956055, "global_step": 125742, "epoch": 1514} {"train_loss": -22.465614318847656, "global_step": 125743, "epoch": 1514} {"train_loss": -22.619624126388366, "global_step": 125744, "epoch": 1514, "val_loss": 6252636.0} {"train_loss": -22.560537338256836, "global_step": 125745, "epoch": 1515} {"train_loss": -22.577274322509766, "global_step": 125746, "epoch": 1515} {"train_loss": -22.51063346862793, "global_step": 125747, "epoch": 1515} {"train_loss": -22.14089012145996, "global_step": 125748, "epoch": 1515} {"train_loss": -22.526958465576172, "global_step": 125749, "epoch": 1515} {"train_loss": -22.6381778717041, "global_step": 125750, "epoch": 1515} {"train_loss": -22.864355087280273, "global_step": 125751, "epoch": 1515} {"train_loss": -22.78074836730957, "global_step": 125752, "epoch": 1515} {"train_loss": -22.31795310974121, "global_step": 125753, "epoch": 1515} {"train_loss": -22.27958869934082, "global_step": 125754, "epoch": 1515} {"train_loss": -22.54787826538086, "global_step": 125755, "epoch": 1515} {"train_loss": -22.4263973236084, "global_step": 125756, "epoch": 1515} {"train_loss": -22.48294448852539, "global_step": 125757, "epoch": 1515} {"train_loss": -22.766111373901367, "global_step": 125758, "epoch": 1515} {"train_loss": -22.949731826782227, "global_step": 125759, "epoch": 1515} {"train_loss": -22.456693649291992, "global_step": 125760, "epoch": 1515} {"train_loss": -22.4041690826416, "global_step": 125761, "epoch": 1515} {"train_loss": -22.464521408081055, "global_step": 125762, "epoch": 1515} {"train_loss": -22.725671768188477, "global_step": 125763, "epoch": 1515} {"train_loss": -22.689685821533203, "global_step": 125764, "epoch": 1515} {"train_loss": -22.458362579345703, "global_step": 125765, "epoch": 1515} {"train_loss": -22.605493545532227, "global_step": 125766, "epoch": 1515} {"train_loss": -22.80410385131836, "global_step": 125767, "epoch": 1515} {"train_loss": -22.849634170532227, "global_step": 125768, "epoch": 1515} {"train_loss": -22.60731315612793, "global_step": 125769, "epoch": 1515} {"train_loss": -22.935291290283203, "global_step": 125770, "epoch": 1515} {"train_loss": -22.733972549438477, "global_step": 125771, "epoch": 1515} {"train_loss": -23.239042282104492, "global_step": 125772, "epoch": 1515} {"train_loss": -22.669580459594727, "global_step": 125773, "epoch": 1515} {"train_loss": -22.8720760345459, "global_step": 125774, "epoch": 1515} {"train_loss": -22.883100509643555, "global_step": 125775, "epoch": 1515} {"train_loss": -23.12921714782715, "global_step": 125776, "epoch": 1515} {"train_loss": -22.653335571289062, "global_step": 125777, "epoch": 1515} {"train_loss": -22.877899169921875, "global_step": 125778, "epoch": 1515} {"train_loss": -22.58503532409668, "global_step": 125779, "epoch": 1515} {"train_loss": -22.5167236328125, "global_step": 125780, "epoch": 1515} {"train_loss": -23.00937843322754, "global_step": 125781, "epoch": 1515} {"train_loss": -22.935163497924805, "global_step": 125782, "epoch": 1515} {"train_loss": -22.490934371948242, "global_step": 125783, "epoch": 1515} {"train_loss": -22.848371505737305, "global_step": 125784, "epoch": 1515} {"train_loss": -23.058454513549805, "global_step": 125785, "epoch": 1515} {"train_loss": -22.586936950683594, "global_step": 125786, "epoch": 1515} {"train_loss": -22.311120986938477, "global_step": 125787, "epoch": 1515} {"train_loss": -22.577390670776367, "global_step": 125788, "epoch": 1515} {"train_loss": -22.36879539489746, "global_step": 125789, "epoch": 1515} {"train_loss": -23.101896286010742, "global_step": 125790, "epoch": 1515} {"train_loss": -22.40400505065918, "global_step": 125791, "epoch": 1515} {"train_loss": -22.782169342041016, "global_step": 125792, "epoch": 1515} {"train_loss": -22.126554489135742, "global_step": 125793, "epoch": 1515} {"train_loss": -22.787199020385742, "global_step": 125794, "epoch": 1515} {"train_loss": -22.38545799255371, "global_step": 125795, "epoch": 1515} {"train_loss": -22.4490909576416, "global_step": 125796, "epoch": 1515} {"train_loss": -22.70747184753418, "global_step": 125797, "epoch": 1515} {"train_loss": -22.459501266479492, "global_step": 125798, "epoch": 1515} {"train_loss": -22.596771240234375, "global_step": 125799, "epoch": 1515} {"train_loss": -22.763944625854492, "global_step": 125800, "epoch": 1515} {"train_loss": -22.973901748657227, "global_step": 125801, "epoch": 1515} {"train_loss": -22.43929672241211, "global_step": 125802, "epoch": 1515} {"train_loss": -22.608869552612305, "global_step": 125803, "epoch": 1515} {"train_loss": -22.950698852539062, "global_step": 125804, "epoch": 1515} {"train_loss": -22.88176918029785, "global_step": 125805, "epoch": 1515} {"train_loss": -22.66005516052246, "global_step": 125806, "epoch": 1515} {"train_loss": -22.499914169311523, "global_step": 125807, "epoch": 1515} {"train_loss": -23.173145294189453, "global_step": 125808, "epoch": 1515} {"train_loss": -22.84654998779297, "global_step": 125809, "epoch": 1515} {"train_loss": -23.01506805419922, "global_step": 125810, "epoch": 1515} {"train_loss": -22.651607513427734, "global_step": 125811, "epoch": 1515} {"train_loss": -22.638187408447266, "global_step": 125812, "epoch": 1515} {"train_loss": -22.427061080932617, "global_step": 125813, "epoch": 1515} {"train_loss": -22.698820114135742, "global_step": 125814, "epoch": 1515} {"train_loss": -22.924406051635742, "global_step": 125815, "epoch": 1515} {"train_loss": -22.98390007019043, "global_step": 125816, "epoch": 1515} {"train_loss": -23.05891227722168, "global_step": 125817, "epoch": 1515} {"train_loss": -22.966480255126953, "global_step": 125818, "epoch": 1515} {"train_loss": -22.582666397094727, "global_step": 125819, "epoch": 1515} {"train_loss": -22.322433471679688, "global_step": 125820, "epoch": 1515} {"train_loss": -22.63239860534668, "global_step": 125821, "epoch": 1515} {"train_loss": -22.69308853149414, "global_step": 125822, "epoch": 1515} {"train_loss": -22.86196517944336, "global_step": 125823, "epoch": 1515} {"train_loss": -22.816316604614258, "global_step": 125824, "epoch": 1515} {"train_loss": -22.42440414428711, "global_step": 125825, "epoch": 1515} {"train_loss": -22.754179000854492, "global_step": 125826, "epoch": 1515} {"train_loss": -22.675071992069842, "global_step": 125827, "epoch": 1515, "val_loss": 6283367.5} {"train_loss": -22.557260513305664, "global_step": 125828, "epoch": 1516} {"train_loss": -22.45328140258789, "global_step": 125829, "epoch": 1516} {"train_loss": -22.412702560424805, "global_step": 125830, "epoch": 1516} {"train_loss": -22.424985885620117, "global_step": 125831, "epoch": 1516} {"train_loss": -21.963760375976562, "global_step": 125832, "epoch": 1516} {"train_loss": -23.045089721679688, "global_step": 125833, "epoch": 1516} {"train_loss": -22.457046508789062, "global_step": 125834, "epoch": 1516} {"train_loss": -22.489957809448242, "global_step": 125835, "epoch": 1516} {"train_loss": -22.38380241394043, "global_step": 125836, "epoch": 1516} {"train_loss": -22.43519401550293, "global_step": 125837, "epoch": 1516} {"train_loss": -22.53077507019043, "global_step": 125838, "epoch": 1516} {"train_loss": -22.817291259765625, "global_step": 125839, "epoch": 1516} {"train_loss": -22.408533096313477, "global_step": 125840, "epoch": 1516} {"train_loss": -22.3371639251709, "global_step": 125841, "epoch": 1516} {"train_loss": -22.47406578063965, "global_step": 125842, "epoch": 1516} {"train_loss": -22.58718490600586, "global_step": 125843, "epoch": 1516} {"train_loss": -22.446617126464844, "global_step": 125844, "epoch": 1516} {"train_loss": -23.28346824645996, "global_step": 125845, "epoch": 1516} {"train_loss": -22.82630729675293, "global_step": 125846, "epoch": 1516} {"train_loss": -22.44563102722168, "global_step": 125847, "epoch": 1516} {"train_loss": -22.878692626953125, "global_step": 125848, "epoch": 1516} {"train_loss": -22.451263427734375, "global_step": 125849, "epoch": 1516} {"train_loss": -22.262441635131836, "global_step": 125850, "epoch": 1516} {"train_loss": -22.616474151611328, "global_step": 125851, "epoch": 1516} {"train_loss": -22.687789916992188, "global_step": 125852, "epoch": 1516} {"train_loss": -22.73448944091797, "global_step": 125853, "epoch": 1516} {"train_loss": -22.801599502563477, "global_step": 125854, "epoch": 1516} {"train_loss": -22.782073974609375, "global_step": 125855, "epoch": 1516} {"train_loss": -22.941850662231445, "global_step": 125856, "epoch": 1516} {"train_loss": -22.684720993041992, "global_step": 125857, "epoch": 1516} {"train_loss": -22.98253631591797, "global_step": 125858, "epoch": 1516} {"train_loss": -23.06191062927246, "global_step": 125859, "epoch": 1516} {"train_loss": -22.751806259155273, "global_step": 125860, "epoch": 1516} {"train_loss": -22.733381271362305, "global_step": 125861, "epoch": 1516} {"train_loss": -22.770404815673828, "global_step": 125862, "epoch": 1516} {"train_loss": -22.75682258605957, "global_step": 125863, "epoch": 1516} {"train_loss": -22.75758171081543, "global_step": 125864, "epoch": 1516} {"train_loss": -22.768062591552734, "global_step": 125865, "epoch": 1516} {"train_loss": -22.574338912963867, "global_step": 125866, "epoch": 1516} {"train_loss": -23.109783172607422, "global_step": 125867, "epoch": 1516} {"train_loss": -23.040180206298828, "global_step": 125868, "epoch": 1516} {"train_loss": -22.895368576049805, "global_step": 125869, "epoch": 1516} {"train_loss": -22.282840728759766, "global_step": 125870, "epoch": 1516} {"train_loss": -22.44188690185547, "global_step": 125871, "epoch": 1516} {"train_loss": -22.370777130126953, "global_step": 125872, "epoch": 1516} {"train_loss": -22.5377254486084, "global_step": 125873, "epoch": 1516} {"train_loss": -22.68195152282715, "global_step": 125874, "epoch": 1516} {"train_loss": -22.778913497924805, "global_step": 125875, "epoch": 1516} {"train_loss": -22.60004997253418, "global_step": 125876, "epoch": 1516} {"train_loss": -22.719009399414062, "global_step": 125877, "epoch": 1516} {"train_loss": -22.86699104309082, "global_step": 125878, "epoch": 1516} {"train_loss": -22.526206970214844, "global_step": 125879, "epoch": 1516} {"train_loss": -22.820039749145508, "global_step": 125880, "epoch": 1516} {"train_loss": -22.425790786743164, "global_step": 125881, "epoch": 1516} {"train_loss": -22.92562484741211, "global_step": 125882, "epoch": 1516} {"train_loss": -22.316282272338867, "global_step": 125883, "epoch": 1516} {"train_loss": -22.516324996948242, "global_step": 125884, "epoch": 1516} {"train_loss": -22.71415138244629, "global_step": 125885, "epoch": 1516} {"train_loss": -23.098670959472656, "global_step": 125886, "epoch": 1516} {"train_loss": -22.630521774291992, "global_step": 125887, "epoch": 1516} {"train_loss": -22.55327033996582, "global_step": 125888, "epoch": 1516} {"train_loss": -22.89588165283203, "global_step": 125889, "epoch": 1516} {"train_loss": -22.790700912475586, "global_step": 125890, "epoch": 1516} {"train_loss": -22.585857391357422, "global_step": 125891, "epoch": 1516} {"train_loss": -22.246152877807617, "global_step": 125892, "epoch": 1516} {"train_loss": -22.441619873046875, "global_step": 125893, "epoch": 1516} {"train_loss": -22.64811897277832, "global_step": 125894, "epoch": 1516} {"train_loss": -22.61281394958496, "global_step": 125895, "epoch": 1516} {"train_loss": -22.001768112182617, "global_step": 125896, "epoch": 1516} {"train_loss": -22.525938034057617, "global_step": 125897, "epoch": 1516} {"train_loss": -22.664365768432617, "global_step": 125898, "epoch": 1516} {"train_loss": -22.646650314331055, "global_step": 125899, "epoch": 1516} {"train_loss": -22.886341094970703, "global_step": 125900, "epoch": 1516} {"train_loss": -22.356107711791992, "global_step": 125901, "epoch": 1516} {"train_loss": -22.594961166381836, "global_step": 125902, "epoch": 1516} {"train_loss": -22.584806442260742, "global_step": 125903, "epoch": 1516} {"train_loss": -22.95454978942871, "global_step": 125904, "epoch": 1516} {"train_loss": -22.5395565032959, "global_step": 125905, "epoch": 1516} {"train_loss": -22.841707229614258, "global_step": 125906, "epoch": 1516} {"train_loss": -23.012540817260742, "global_step": 125907, "epoch": 1516} {"train_loss": -22.96885871887207, "global_step": 125908, "epoch": 1516} {"train_loss": -22.75200843811035, "global_step": 125909, "epoch": 1516} {"train_loss": -22.637619684977704, "global_step": 125910, "epoch": 1516, "val_loss": 6389351.0} {"train_loss": -21.694360733032227, "global_step": 125911, "epoch": 1517} {"train_loss": -22.18745994567871, "global_step": 125912, "epoch": 1517} {"train_loss": -21.895965576171875, "global_step": 125913, "epoch": 1517} {"train_loss": -22.259382247924805, "global_step": 125914, "epoch": 1517} {"train_loss": -22.02177619934082, "global_step": 125915, "epoch": 1517} {"train_loss": -22.3936767578125, "global_step": 125916, "epoch": 1517} {"train_loss": -22.498388290405273, "global_step": 125917, "epoch": 1517} {"train_loss": -22.010114669799805, "global_step": 125918, "epoch": 1517} {"train_loss": -22.003768920898438, "global_step": 125919, "epoch": 1517} {"train_loss": -22.274621963500977, "global_step": 125920, "epoch": 1517} {"train_loss": -22.40604019165039, "global_step": 125921, "epoch": 1517} {"train_loss": -22.572601318359375, "global_step": 125922, "epoch": 1517} {"train_loss": -22.571212768554688, "global_step": 125923, "epoch": 1517} {"train_loss": -22.006540298461914, "global_step": 125924, "epoch": 1517} {"train_loss": -22.93004035949707, "global_step": 125925, "epoch": 1517} {"train_loss": -22.511295318603516, "global_step": 125926, "epoch": 1517} {"train_loss": -22.989215850830078, "global_step": 125927, "epoch": 1517} {"train_loss": -22.498929977416992, "global_step": 125928, "epoch": 1517} {"train_loss": -22.23102378845215, "global_step": 125929, "epoch": 1517} {"train_loss": -22.515161514282227, "global_step": 125930, "epoch": 1517} {"train_loss": -22.588415145874023, "global_step": 125931, "epoch": 1517} {"train_loss": -22.24287223815918, "global_step": 125932, "epoch": 1517} {"train_loss": -22.642955780029297, "global_step": 125933, "epoch": 1517} {"train_loss": -22.720001220703125, "global_step": 125934, "epoch": 1517} {"train_loss": -22.553144454956055, "global_step": 125935, "epoch": 1517} {"train_loss": -22.78062629699707, "global_step": 125936, "epoch": 1517} {"train_loss": -22.89491081237793, "global_step": 125937, "epoch": 1517} {"train_loss": -22.376134872436523, "global_step": 125938, "epoch": 1517} {"train_loss": -22.79916000366211, "global_step": 125939, "epoch": 1517} {"train_loss": -22.522485733032227, "global_step": 125940, "epoch": 1517} {"train_loss": -22.731098175048828, "global_step": 125941, "epoch": 1517} {"train_loss": -22.4228458404541, "global_step": 125942, "epoch": 1517} {"train_loss": -23.000415802001953, "global_step": 125943, "epoch": 1517} {"train_loss": -22.762754440307617, "global_step": 125944, "epoch": 1517} {"train_loss": -22.579395294189453, "global_step": 125945, "epoch": 1517} {"train_loss": -22.830707550048828, "global_step": 125946, "epoch": 1517} {"train_loss": -22.85037612915039, "global_step": 125947, "epoch": 1517} {"train_loss": -22.679296493530273, "global_step": 125948, "epoch": 1517} {"train_loss": -22.587238311767578, "global_step": 125949, "epoch": 1517} {"train_loss": -22.89892578125, "global_step": 125950, "epoch": 1517} {"train_loss": -22.639158248901367, "global_step": 125951, "epoch": 1517} {"train_loss": -22.253324508666992, "global_step": 125952, "epoch": 1517} {"train_loss": -22.449060440063477, "global_step": 125953, "epoch": 1517} {"train_loss": -22.440317153930664, "global_step": 125954, "epoch": 1517} {"train_loss": -22.82366371154785, "global_step": 125955, "epoch": 1517} {"train_loss": -22.675783157348633, "global_step": 125956, "epoch": 1517} {"train_loss": -22.86648941040039, "global_step": 125957, "epoch": 1517} {"train_loss": -23.04918670654297, "global_step": 125958, "epoch": 1517} {"train_loss": -22.506183624267578, "global_step": 125959, "epoch": 1517} {"train_loss": -22.73321533203125, "global_step": 125960, "epoch": 1517} {"train_loss": -22.741424560546875, "global_step": 125961, "epoch": 1517} {"train_loss": -22.774179458618164, "global_step": 125962, "epoch": 1517} {"train_loss": -22.83346939086914, "global_step": 125963, "epoch": 1517} {"train_loss": -22.634727478027344, "global_step": 125964, "epoch": 1517} {"train_loss": -22.844985961914062, "global_step": 125965, "epoch": 1517} {"train_loss": -22.7686767578125, "global_step": 125966, "epoch": 1517} {"train_loss": -22.475561141967773, "global_step": 125967, "epoch": 1517} {"train_loss": -22.7102108001709, "global_step": 125968, "epoch": 1517} {"train_loss": -22.971694946289062, "global_step": 125969, "epoch": 1517} {"train_loss": -22.89546012878418, "global_step": 125970, "epoch": 1517} {"train_loss": -22.69739532470703, "global_step": 125971, "epoch": 1517} {"train_loss": -22.568387985229492, "global_step": 125972, "epoch": 1517} {"train_loss": -23.0114688873291, "global_step": 125973, "epoch": 1517} {"train_loss": -22.8043212890625, "global_step": 125974, "epoch": 1517} {"train_loss": -22.668058395385742, "global_step": 125975, "epoch": 1517} {"train_loss": -22.609619140625, "global_step": 125976, "epoch": 1517} {"train_loss": -22.805282592773438, "global_step": 125977, "epoch": 1517} {"train_loss": -23.093482971191406, "global_step": 125978, "epoch": 1517} {"train_loss": -22.64143180847168, "global_step": 125979, "epoch": 1517} {"train_loss": -22.69671058654785, "global_step": 125980, "epoch": 1517} {"train_loss": -22.603925704956055, "global_step": 125981, "epoch": 1517} {"train_loss": -22.723451614379883, "global_step": 125982, "epoch": 1517} {"train_loss": -22.6806640625, "global_step": 125983, "epoch": 1517} {"train_loss": -22.925283432006836, "global_step": 125984, "epoch": 1517} {"train_loss": -22.855310440063477, "global_step": 125985, "epoch": 1517} {"train_loss": -22.723257064819336, "global_step": 125986, "epoch": 1517} {"train_loss": -22.872831344604492, "global_step": 125987, "epoch": 1517} {"train_loss": -22.671966552734375, "global_step": 125988, "epoch": 1517} {"train_loss": -22.328235626220703, "global_step": 125989, "epoch": 1517} {"train_loss": -22.508657455444336, "global_step": 125990, "epoch": 1517} {"train_loss": -22.75242042541504, "global_step": 125991, "epoch": 1517} {"train_loss": -22.453153610229492, "global_step": 125992, "epoch": 1517} {"train_loss": -22.606280453233833, "global_step": 125993, "epoch": 1517, "val_loss": 6278451.0} {"train_loss": -21.608057022094727, "global_step": 125994, "epoch": 1518} {"train_loss": -22.304168701171875, "global_step": 125995, "epoch": 1518} {"train_loss": -21.879318237304688, "global_step": 125996, "epoch": 1518} {"train_loss": -21.848434448242188, "global_step": 125997, "epoch": 1518} {"train_loss": -22.280759811401367, "global_step": 125998, "epoch": 1518} {"train_loss": -22.376493453979492, "global_step": 125999, "epoch": 1518} {"train_loss": -21.787376403808594, "global_step": 126000, "epoch": 1518} {"train_loss": -22.338727951049805, "global_step": 126001, "epoch": 1518} {"train_loss": -22.559412002563477, "global_step": 126002, "epoch": 1518} {"train_loss": -22.996761322021484, "global_step": 126003, "epoch": 1518} {"train_loss": -22.407516479492188, "global_step": 126004, "epoch": 1518} {"train_loss": -22.411096572875977, "global_step": 126005, "epoch": 1518} {"train_loss": -22.215566635131836, "global_step": 126006, "epoch": 1518} {"train_loss": -22.312414169311523, "global_step": 126007, "epoch": 1518} {"train_loss": -22.24968910217285, "global_step": 126008, "epoch": 1518} {"train_loss": -22.37017250061035, "global_step": 126009, "epoch": 1518} {"train_loss": -22.16927146911621, "global_step": 126010, "epoch": 1518} {"train_loss": -22.466957092285156, "global_step": 126011, "epoch": 1518} {"train_loss": -22.558757781982422, "global_step": 126012, "epoch": 1518} {"train_loss": -22.637845993041992, "global_step": 126013, "epoch": 1518} {"train_loss": -22.511564254760742, "global_step": 126014, "epoch": 1518} {"train_loss": -22.437028884887695, "global_step": 126015, "epoch": 1518} {"train_loss": -22.508220672607422, "global_step": 126016, "epoch": 1518} {"train_loss": -22.722333908081055, "global_step": 126017, "epoch": 1518} {"train_loss": -22.807235717773438, "global_step": 126018, "epoch": 1518} {"train_loss": -22.626508712768555, "global_step": 126019, "epoch": 1518} {"train_loss": -22.873199462890625, "global_step": 126020, "epoch": 1518} {"train_loss": -22.614120483398438, "global_step": 126021, "epoch": 1518} {"train_loss": -22.36301040649414, "global_step": 126022, "epoch": 1518} {"train_loss": -22.647668838500977, "global_step": 126023, "epoch": 1518} {"train_loss": -22.512060165405273, "global_step": 126024, "epoch": 1518} {"train_loss": -22.491437911987305, "global_step": 126025, "epoch": 1518} {"train_loss": -22.61173439025879, "global_step": 126026, "epoch": 1518} {"train_loss": -22.568431854248047, "global_step": 126027, "epoch": 1518} {"train_loss": -22.94986343383789, "global_step": 126028, "epoch": 1518} {"train_loss": -22.773468017578125, "global_step": 126029, "epoch": 1518} {"train_loss": -22.66239356994629, "global_step": 126030, "epoch": 1518} {"train_loss": -22.915462493896484, "global_step": 126031, "epoch": 1518} {"train_loss": -22.782899856567383, "global_step": 126032, "epoch": 1518} {"train_loss": -22.303348541259766, "global_step": 126033, "epoch": 1518} {"train_loss": -22.52727699279785, "global_step": 126034, "epoch": 1518} {"train_loss": -22.62107276916504, "global_step": 126035, "epoch": 1518} {"train_loss": -22.88319969177246, "global_step": 126036, "epoch": 1518} {"train_loss": -22.5712833404541, "global_step": 126037, "epoch": 1518} {"train_loss": -22.968568801879883, "global_step": 126038, "epoch": 1518} {"train_loss": -22.76657485961914, "global_step": 126039, "epoch": 1518} {"train_loss": -22.80251121520996, "global_step": 126040, "epoch": 1518} {"train_loss": -22.844158172607422, "global_step": 126041, "epoch": 1518} {"train_loss": -22.772104263305664, "global_step": 126042, "epoch": 1518} {"train_loss": -22.712682723999023, "global_step": 126043, "epoch": 1518} {"train_loss": -22.58326530456543, "global_step": 126044, "epoch": 1518} {"train_loss": -23.238672256469727, "global_step": 126045, "epoch": 1518} {"train_loss": -22.550519943237305, "global_step": 126046, "epoch": 1518} {"train_loss": -23.096206665039062, "global_step": 126047, "epoch": 1518} {"train_loss": -22.770526885986328, "global_step": 126048, "epoch": 1518} {"train_loss": -22.59686279296875, "global_step": 126049, "epoch": 1518} {"train_loss": -22.6254940032959, "global_step": 126050, "epoch": 1518} {"train_loss": -22.625024795532227, "global_step": 126051, "epoch": 1518} {"train_loss": -22.59493064880371, "global_step": 126052, "epoch": 1518} {"train_loss": -23.197004318237305, "global_step": 126053, "epoch": 1518} {"train_loss": -23.082277297973633, "global_step": 126054, "epoch": 1518} {"train_loss": -22.664600372314453, "global_step": 126055, "epoch": 1518} {"train_loss": -22.404874801635742, "global_step": 126056, "epoch": 1518} {"train_loss": -22.964887619018555, "global_step": 126057, "epoch": 1518} {"train_loss": -23.16057777404785, "global_step": 126058, "epoch": 1518} {"train_loss": -23.1153564453125, "global_step": 126059, "epoch": 1518} {"train_loss": -22.923004150390625, "global_step": 126060, "epoch": 1518} {"train_loss": -22.900846481323242, "global_step": 126061, "epoch": 1518} {"train_loss": -23.183761596679688, "global_step": 126062, "epoch": 1518} {"train_loss": -22.673437118530273, "global_step": 126063, "epoch": 1518} {"train_loss": -22.963266372680664, "global_step": 126064, "epoch": 1518} {"train_loss": -22.58570671081543, "global_step": 126065, "epoch": 1518} {"train_loss": -22.971532821655273, "global_step": 126066, "epoch": 1518} {"train_loss": -22.89213752746582, "global_step": 126067, "epoch": 1518} {"train_loss": -22.761302947998047, "global_step": 126068, "epoch": 1518} {"train_loss": -22.65912628173828, "global_step": 126069, "epoch": 1518} {"train_loss": -22.947914123535156, "global_step": 126070, "epoch": 1518} {"train_loss": -22.871644973754883, "global_step": 126071, "epoch": 1518} {"train_loss": -22.74088478088379, "global_step": 126072, "epoch": 1518} {"train_loss": -22.756820678710938, "global_step": 126073, "epoch": 1518} {"train_loss": -22.453149795532227, "global_step": 126074, "epoch": 1518} {"train_loss": -23.03065299987793, "global_step": 126075, "epoch": 1518} {"train_loss": -22.654928529118916, "global_step": 126076, "epoch": 1518, "val_loss": 6200311.0} {"train_loss": -22.820810317993164, "global_step": 126077, "epoch": 1519} {"train_loss": -22.511972427368164, "global_step": 126078, "epoch": 1519} {"train_loss": -22.50094223022461, "global_step": 126079, "epoch": 1519} {"train_loss": -22.73674201965332, "global_step": 126080, "epoch": 1519} {"train_loss": -22.323423385620117, "global_step": 126081, "epoch": 1519} {"train_loss": -22.69720458984375, "global_step": 126082, "epoch": 1519} {"train_loss": -22.817989349365234, "global_step": 126083, "epoch": 1519} {"train_loss": -22.718917846679688, "global_step": 126084, "epoch": 1519} {"train_loss": -22.35261344909668, "global_step": 126085, "epoch": 1519} {"train_loss": -22.28079605102539, "global_step": 126086, "epoch": 1519} {"train_loss": -22.4936580657959, "global_step": 126087, "epoch": 1519} {"train_loss": -22.5607852935791, "global_step": 126088, "epoch": 1519} {"train_loss": -22.51185417175293, "global_step": 126089, "epoch": 1519} {"train_loss": -22.676481246948242, "global_step": 126090, "epoch": 1519} {"train_loss": -22.497028350830078, "global_step": 126091, "epoch": 1519} {"train_loss": -22.780820846557617, "global_step": 126092, "epoch": 1519} {"train_loss": -22.636198043823242, "global_step": 126093, "epoch": 1519} {"train_loss": -22.721731185913086, "global_step": 126094, "epoch": 1519} {"train_loss": -22.635669708251953, "global_step": 126095, "epoch": 1519} {"train_loss": -22.72560691833496, "global_step": 126096, "epoch": 1519} {"train_loss": -22.351667404174805, "global_step": 126097, "epoch": 1519} {"train_loss": -22.773313522338867, "global_step": 126098, "epoch": 1519} {"train_loss": -22.76384925842285, "global_step": 126099, "epoch": 1519} {"train_loss": -22.705413818359375, "global_step": 126100, "epoch": 1519} {"train_loss": -22.639205932617188, "global_step": 126101, "epoch": 1519} {"train_loss": -22.39362335205078, "global_step": 126102, "epoch": 1519} {"train_loss": -22.29576873779297, "global_step": 126103, "epoch": 1519} {"train_loss": -22.852048873901367, "global_step": 126104, "epoch": 1519} {"train_loss": -22.85874366760254, "global_step": 126105, "epoch": 1519} {"train_loss": -23.071168899536133, "global_step": 126106, "epoch": 1519} {"train_loss": -23.082843780517578, "global_step": 126107, "epoch": 1519} {"train_loss": -22.928590774536133, "global_step": 126108, "epoch": 1519} {"train_loss": -22.88205909729004, "global_step": 126109, "epoch": 1519} {"train_loss": -22.96319580078125, "global_step": 126110, "epoch": 1519} {"train_loss": -22.743919372558594, "global_step": 126111, "epoch": 1519} {"train_loss": -22.83768081665039, "global_step": 126112, "epoch": 1519} {"train_loss": -22.861684799194336, "global_step": 126113, "epoch": 1519} {"train_loss": -22.578596115112305, "global_step": 126114, "epoch": 1519} {"train_loss": -22.819393157958984, "global_step": 126115, "epoch": 1519} {"train_loss": -22.675464630126953, "global_step": 126116, "epoch": 1519} {"train_loss": -22.50252342224121, "global_step": 126117, "epoch": 1519} {"train_loss": -22.483366012573242, "global_step": 126118, "epoch": 1519} {"train_loss": -22.68647575378418, "global_step": 126119, "epoch": 1519} {"train_loss": -22.69578742980957, "global_step": 126120, "epoch": 1519} {"train_loss": -22.648832321166992, "global_step": 126121, "epoch": 1519} {"train_loss": -22.93317985534668, "global_step": 126122, "epoch": 1519} {"train_loss": -22.447830200195312, "global_step": 126123, "epoch": 1519} {"train_loss": -22.443939208984375, "global_step": 126124, "epoch": 1519} {"train_loss": -22.75343894958496, "global_step": 126125, "epoch": 1519} {"train_loss": -22.799182891845703, "global_step": 126126, "epoch": 1519} {"train_loss": -22.651168823242188, "global_step": 126127, "epoch": 1519} {"train_loss": -22.4052677154541, "global_step": 126128, "epoch": 1519} {"train_loss": -22.835304260253906, "global_step": 126129, "epoch": 1519} {"train_loss": -22.992856979370117, "global_step": 126130, "epoch": 1519} {"train_loss": -22.66977310180664, "global_step": 126131, "epoch": 1519} {"train_loss": -22.855224609375, "global_step": 126132, "epoch": 1519} {"train_loss": -22.760404586791992, "global_step": 126133, "epoch": 1519} {"train_loss": -22.424962997436523, "global_step": 126134, "epoch": 1519} {"train_loss": -22.786800384521484, "global_step": 126135, "epoch": 1519} {"train_loss": -22.86934471130371, "global_step": 126136, "epoch": 1519} {"train_loss": -22.6595458984375, "global_step": 126137, "epoch": 1519} {"train_loss": -22.641443252563477, "global_step": 126138, "epoch": 1519} {"train_loss": -22.60959815979004, "global_step": 126139, "epoch": 1519} {"train_loss": -22.877771377563477, "global_step": 126140, "epoch": 1519} {"train_loss": -23.117847442626953, "global_step": 126141, "epoch": 1519} {"train_loss": -22.81561851501465, "global_step": 126142, "epoch": 1519} {"train_loss": -22.605728149414062, "global_step": 126143, "epoch": 1519} {"train_loss": -22.521728515625, "global_step": 126144, "epoch": 1519} {"train_loss": -22.868240356445312, "global_step": 126145, "epoch": 1519} {"train_loss": -22.395187377929688, "global_step": 126146, "epoch": 1519} {"train_loss": -22.313230514526367, "global_step": 126147, "epoch": 1519} {"train_loss": -22.527576446533203, "global_step": 126148, "epoch": 1519} {"train_loss": -22.677946090698242, "global_step": 126149, "epoch": 1519} {"train_loss": -22.948867797851562, "global_step": 126150, "epoch": 1519} {"train_loss": -22.577661514282227, "global_step": 126151, "epoch": 1519} {"train_loss": -22.616626739501953, "global_step": 126152, "epoch": 1519} {"train_loss": -22.73902130126953, "global_step": 126153, "epoch": 1519} {"train_loss": -22.840253829956055, "global_step": 126154, "epoch": 1519} {"train_loss": -22.811670303344727, "global_step": 126155, "epoch": 1519} {"train_loss": -22.557531356811523, "global_step": 126156, "epoch": 1519} {"train_loss": -22.792722702026367, "global_step": 126157, "epoch": 1519} {"train_loss": -22.368425369262695, "global_step": 126158, "epoch": 1519} {"train_loss": -22.664829598851952, "global_step": 126159, "epoch": 1519, "val_loss": 6336665.0} {"train_loss": -22.457813262939453, "global_step": 126160, "epoch": 1520} {"train_loss": -22.274738311767578, "global_step": 126161, "epoch": 1520} {"train_loss": -21.76017189025879, "global_step": 126162, "epoch": 1520} {"train_loss": -21.796363830566406, "global_step": 126163, "epoch": 1520} {"train_loss": -22.379207611083984, "global_step": 126164, "epoch": 1520} {"train_loss": -22.091232299804688, "global_step": 126165, "epoch": 1520} {"train_loss": -22.403165817260742, "global_step": 126166, "epoch": 1520} {"train_loss": -22.343475341796875, "global_step": 126167, "epoch": 1520} {"train_loss": -22.619138717651367, "global_step": 126168, "epoch": 1520} {"train_loss": -22.08249855041504, "global_step": 126169, "epoch": 1520} {"train_loss": -22.227014541625977, "global_step": 126170, "epoch": 1520} {"train_loss": -22.70107650756836, "global_step": 126171, "epoch": 1520} {"train_loss": -22.612728118896484, "global_step": 126172, "epoch": 1520} {"train_loss": -22.53672218322754, "global_step": 126173, "epoch": 1520} {"train_loss": -22.5393123626709, "global_step": 126174, "epoch": 1520} {"train_loss": -22.33283805847168, "global_step": 126175, "epoch": 1520} {"train_loss": -22.428470611572266, "global_step": 126176, "epoch": 1520} {"train_loss": -22.534076690673828, "global_step": 126177, "epoch": 1520} {"train_loss": -22.479007720947266, "global_step": 126178, "epoch": 1520} {"train_loss": -22.434640884399414, "global_step": 126179, "epoch": 1520} {"train_loss": -22.564250946044922, "global_step": 126180, "epoch": 1520} {"train_loss": -22.576833724975586, "global_step": 126181, "epoch": 1520} {"train_loss": -22.381271362304688, "global_step": 126182, "epoch": 1520} {"train_loss": -22.544504165649414, "global_step": 126183, "epoch": 1520} {"train_loss": -22.43071937561035, "global_step": 126184, "epoch": 1520} {"train_loss": -22.499897003173828, "global_step": 126185, "epoch": 1520} {"train_loss": -22.80978775024414, "global_step": 126186, "epoch": 1520} {"train_loss": -22.279258728027344, "global_step": 126187, "epoch": 1520} {"train_loss": -22.669586181640625, "global_step": 126188, "epoch": 1520} {"train_loss": -22.67933464050293, "global_step": 126189, "epoch": 1520} {"train_loss": -22.520627975463867, "global_step": 126190, "epoch": 1520} {"train_loss": -22.928342819213867, "global_step": 126191, "epoch": 1520} {"train_loss": -22.98201560974121, "global_step": 126192, "epoch": 1520} {"train_loss": -22.86122703552246, "global_step": 126193, "epoch": 1520} {"train_loss": -23.07872200012207, "global_step": 126194, "epoch": 1520} {"train_loss": -22.252023696899414, "global_step": 126195, "epoch": 1520} {"train_loss": -22.805601119995117, "global_step": 126196, "epoch": 1520} {"train_loss": -22.448225021362305, "global_step": 126197, "epoch": 1520} {"train_loss": -22.463855743408203, "global_step": 126198, "epoch": 1520} {"train_loss": -22.463897705078125, "global_step": 126199, "epoch": 1520} {"train_loss": -22.731647491455078, "global_step": 126200, "epoch": 1520} {"train_loss": -22.759672164916992, "global_step": 126201, "epoch": 1520} {"train_loss": -22.68999671936035, "global_step": 126202, "epoch": 1520} {"train_loss": -22.792869567871094, "global_step": 126203, "epoch": 1520} {"train_loss": -22.39884376525879, "global_step": 126204, "epoch": 1520} {"train_loss": -22.531875610351562, "global_step": 126205, "epoch": 1520} {"train_loss": -22.7008056640625, "global_step": 126206, "epoch": 1520} {"train_loss": -22.737911224365234, "global_step": 126207, "epoch": 1520} {"train_loss": -22.8093204498291, "global_step": 126208, "epoch": 1520} {"train_loss": -23.034467697143555, "global_step": 126209, "epoch": 1520} {"train_loss": -22.426584243774414, "global_step": 126210, "epoch": 1520} {"train_loss": -22.619054794311523, "global_step": 126211, "epoch": 1520} {"train_loss": -22.898286819458008, "global_step": 126212, "epoch": 1520} {"train_loss": -22.64539909362793, "global_step": 126213, "epoch": 1520} {"train_loss": -22.355220794677734, "global_step": 126214, "epoch": 1520} {"train_loss": -22.799480438232422, "global_step": 126215, "epoch": 1520} {"train_loss": -22.699846267700195, "global_step": 126216, "epoch": 1520} {"train_loss": -22.459190368652344, "global_step": 126217, "epoch": 1520} {"train_loss": -22.8660831451416, "global_step": 126218, "epoch": 1520} {"train_loss": -22.645212173461914, "global_step": 126219, "epoch": 1520} {"train_loss": -22.84706687927246, "global_step": 126220, "epoch": 1520} {"train_loss": -22.804731369018555, "global_step": 126221, "epoch": 1520} {"train_loss": -22.97063636779785, "global_step": 126222, "epoch": 1520} {"train_loss": -22.814992904663086, "global_step": 126223, "epoch": 1520} {"train_loss": -22.34287452697754, "global_step": 126224, "epoch": 1520} {"train_loss": -23.102386474609375, "global_step": 126225, "epoch": 1520} {"train_loss": -22.578481674194336, "global_step": 126226, "epoch": 1520} {"train_loss": -22.97077751159668, "global_step": 126227, "epoch": 1520} {"train_loss": -22.59698486328125, "global_step": 126228, "epoch": 1520} {"train_loss": -23.02046012878418, "global_step": 126229, "epoch": 1520} {"train_loss": -22.488998413085938, "global_step": 126230, "epoch": 1520} {"train_loss": -23.18688201904297, "global_step": 126231, "epoch": 1520} {"train_loss": -22.705472946166992, "global_step": 126232, "epoch": 1520} {"train_loss": -22.775484085083008, "global_step": 126233, "epoch": 1520} {"train_loss": -22.373106002807617, "global_step": 126234, "epoch": 1520} {"train_loss": -22.847230911254883, "global_step": 126235, "epoch": 1520} {"train_loss": -22.689300537109375, "global_step": 126236, "epoch": 1520} {"train_loss": -22.84591293334961, "global_step": 126237, "epoch": 1520} {"train_loss": -22.590543746948242, "global_step": 126238, "epoch": 1520} {"train_loss": -22.868680953979492, "global_step": 126239, "epoch": 1520} {"train_loss": -22.439977645874023, "global_step": 126240, "epoch": 1520} {"train_loss": -22.768035888671875, "global_step": 126241, "epoch": 1520} {"train_loss": -22.60903193002724, "global_step": 126242, "epoch": 1520, "val_loss": 6291260.0} {"train_loss": -22.059179306030273, "global_step": 126243, "epoch": 1521} {"train_loss": -21.842885971069336, "global_step": 126244, "epoch": 1521} {"train_loss": -21.132394790649414, "global_step": 126245, "epoch": 1521} {"train_loss": -22.130630493164062, "global_step": 126246, "epoch": 1521} {"train_loss": -22.291812896728516, "global_step": 126247, "epoch": 1521} {"train_loss": -21.924060821533203, "global_step": 126248, "epoch": 1521} {"train_loss": -22.16394805908203, "global_step": 126249, "epoch": 1521} {"train_loss": -22.132688522338867, "global_step": 126250, "epoch": 1521} {"train_loss": -21.935470581054688, "global_step": 126251, "epoch": 1521} {"train_loss": -21.889822006225586, "global_step": 126252, "epoch": 1521} {"train_loss": -22.25301170349121, "global_step": 126253, "epoch": 1521} {"train_loss": -21.997861862182617, "global_step": 126254, "epoch": 1521} {"train_loss": -22.456872940063477, "global_step": 126255, "epoch": 1521} {"train_loss": -22.102561950683594, "global_step": 126256, "epoch": 1521} {"train_loss": -22.309568405151367, "global_step": 126257, "epoch": 1521} {"train_loss": -22.47791290283203, "global_step": 126258, "epoch": 1521} {"train_loss": -22.10748863220215, "global_step": 126259, "epoch": 1521} {"train_loss": -22.275775909423828, "global_step": 126260, "epoch": 1521} {"train_loss": -22.710493087768555, "global_step": 126261, "epoch": 1521} {"train_loss": -22.605710983276367, "global_step": 126262, "epoch": 1521} {"train_loss": -22.228551864624023, "global_step": 126263, "epoch": 1521} {"train_loss": -22.67310905456543, "global_step": 126264, "epoch": 1521} {"train_loss": -22.26888084411621, "global_step": 126265, "epoch": 1521} {"train_loss": -22.058271408081055, "global_step": 126266, "epoch": 1521} {"train_loss": -22.35718536376953, "global_step": 126267, "epoch": 1521} {"train_loss": -22.2342586517334, "global_step": 126268, "epoch": 1521} {"train_loss": -22.825088500976562, "global_step": 126269, "epoch": 1521} {"train_loss": -22.222841262817383, "global_step": 126270, "epoch": 1521} {"train_loss": -22.449670791625977, "global_step": 126271, "epoch": 1521} {"train_loss": -22.624603271484375, "global_step": 126272, "epoch": 1521} {"train_loss": -22.505756378173828, "global_step": 126273, "epoch": 1521} {"train_loss": -22.582218170166016, "global_step": 126274, "epoch": 1521} {"train_loss": -22.368337631225586, "global_step": 126275, "epoch": 1521} {"train_loss": -22.491201400756836, "global_step": 126276, "epoch": 1521} {"train_loss": -22.72284698486328, "global_step": 126277, "epoch": 1521} {"train_loss": -22.413599014282227, "global_step": 126278, "epoch": 1521} {"train_loss": -22.724851608276367, "global_step": 126279, "epoch": 1521} {"train_loss": -22.937164306640625, "global_step": 126280, "epoch": 1521} {"train_loss": -22.540639877319336, "global_step": 126281, "epoch": 1521} {"train_loss": -22.768056869506836, "global_step": 126282, "epoch": 1521} {"train_loss": -23.009252548217773, "global_step": 126283, "epoch": 1521} {"train_loss": -22.826379776000977, "global_step": 126284, "epoch": 1521} {"train_loss": -22.508466720581055, "global_step": 126285, "epoch": 1521} {"train_loss": -22.900177001953125, "global_step": 126286, "epoch": 1521} {"train_loss": -22.710947036743164, "global_step": 126287, "epoch": 1521} {"train_loss": -22.988473892211914, "global_step": 126288, "epoch": 1521} {"train_loss": -22.488370895385742, "global_step": 126289, "epoch": 1521} {"train_loss": -22.255556106567383, "global_step": 126290, "epoch": 1521} {"train_loss": -22.577072143554688, "global_step": 126291, "epoch": 1521} {"train_loss": -23.027313232421875, "global_step": 126292, "epoch": 1521} {"train_loss": -22.69900894165039, "global_step": 126293, "epoch": 1521} {"train_loss": -23.107492446899414, "global_step": 126294, "epoch": 1521} {"train_loss": -22.169437408447266, "global_step": 126295, "epoch": 1521} {"train_loss": -22.715469360351562, "global_step": 126296, "epoch": 1521} {"train_loss": -22.657115936279297, "global_step": 126297, "epoch": 1521} {"train_loss": -22.84663963317871, "global_step": 126298, "epoch": 1521} {"train_loss": -22.331266403198242, "global_step": 126299, "epoch": 1521} {"train_loss": -22.80573844909668, "global_step": 126300, "epoch": 1521} {"train_loss": -22.633222579956055, "global_step": 126301, "epoch": 1521} {"train_loss": -22.609210968017578, "global_step": 126302, "epoch": 1521} {"train_loss": -22.51715087890625, "global_step": 126303, "epoch": 1521} {"train_loss": -22.84104347229004, "global_step": 126304, "epoch": 1521} {"train_loss": -22.917394638061523, "global_step": 126305, "epoch": 1521} {"train_loss": -22.8276424407959, "global_step": 126306, "epoch": 1521} {"train_loss": -22.874032974243164, "global_step": 126307, "epoch": 1521} {"train_loss": -22.69968032836914, "global_step": 126308, "epoch": 1521} {"train_loss": -22.950345993041992, "global_step": 126309, "epoch": 1521} {"train_loss": -22.66691017150879, "global_step": 126310, "epoch": 1521} {"train_loss": -22.888259887695312, "global_step": 126311, "epoch": 1521} {"train_loss": -22.602127075195312, "global_step": 126312, "epoch": 1521} {"train_loss": -23.2694091796875, "global_step": 126313, "epoch": 1521} {"train_loss": -22.6242618560791, "global_step": 126314, "epoch": 1521} {"train_loss": -22.612571716308594, "global_step": 126315, "epoch": 1521} {"train_loss": -22.659086227416992, "global_step": 126316, "epoch": 1521} {"train_loss": -22.35405731201172, "global_step": 126317, "epoch": 1521} {"train_loss": -22.3978214263916, "global_step": 126318, "epoch": 1521} {"train_loss": -22.30255126953125, "global_step": 126319, "epoch": 1521} {"train_loss": -22.478824615478516, "global_step": 126320, "epoch": 1521} {"train_loss": -22.397390365600586, "global_step": 126321, "epoch": 1521} {"train_loss": -22.44814682006836, "global_step": 126322, "epoch": 1521} {"train_loss": -22.377811431884766, "global_step": 126323, "epoch": 1521} {"train_loss": -22.683298110961914, "global_step": 126324, "epoch": 1521} {"train_loss": -22.509110324354058, "global_step": 126325, "epoch": 1521, "val_loss": 6226289.0} {"train_loss": -21.718307495117188, "global_step": 126326, "epoch": 1522} {"train_loss": -21.9549503326416, "global_step": 126327, "epoch": 1522} {"train_loss": -21.823698043823242, "global_step": 126328, "epoch": 1522} {"train_loss": -22.279245376586914, "global_step": 126329, "epoch": 1522} {"train_loss": -22.1114501953125, "global_step": 126330, "epoch": 1522} {"train_loss": -21.876188278198242, "global_step": 126331, "epoch": 1522} {"train_loss": -21.858928680419922, "global_step": 126332, "epoch": 1522} {"train_loss": -21.866445541381836, "global_step": 126333, "epoch": 1522} {"train_loss": -22.086835861206055, "global_step": 126334, "epoch": 1522} {"train_loss": -22.078460693359375, "global_step": 126335, "epoch": 1522} {"train_loss": -22.141315460205078, "global_step": 126336, "epoch": 1522} {"train_loss": -22.160846710205078, "global_step": 126337, "epoch": 1522} {"train_loss": -22.45073890686035, "global_step": 126338, "epoch": 1522} {"train_loss": -22.34571647644043, "global_step": 126339, "epoch": 1522} {"train_loss": -22.18287467956543, "global_step": 126340, "epoch": 1522} {"train_loss": -22.570249557495117, "global_step": 126341, "epoch": 1522} {"train_loss": -22.33894157409668, "global_step": 126342, "epoch": 1522} {"train_loss": -22.42700958251953, "global_step": 126343, "epoch": 1522} {"train_loss": -22.12537956237793, "global_step": 126344, "epoch": 1522} {"train_loss": -22.27178382873535, "global_step": 126345, "epoch": 1522} {"train_loss": -22.494735717773438, "global_step": 126346, "epoch": 1522} {"train_loss": -21.86876678466797, "global_step": 126347, "epoch": 1522} {"train_loss": -22.321584701538086, "global_step": 126348, "epoch": 1522} {"train_loss": -23.043275833129883, "global_step": 126349, "epoch": 1522} {"train_loss": -22.76521110534668, "global_step": 126350, "epoch": 1522} {"train_loss": -22.119504928588867, "global_step": 126351, "epoch": 1522} {"train_loss": -23.04021644592285, "global_step": 126352, "epoch": 1522} {"train_loss": -22.88114356994629, "global_step": 126353, "epoch": 1522} {"train_loss": -22.563268661499023, "global_step": 126354, "epoch": 1522} {"train_loss": -22.758209228515625, "global_step": 126355, "epoch": 1522} {"train_loss": -22.97169303894043, "global_step": 126356, "epoch": 1522} {"train_loss": -22.846853256225586, "global_step": 126357, "epoch": 1522} {"train_loss": -22.429996490478516, "global_step": 126358, "epoch": 1522} {"train_loss": -22.592140197753906, "global_step": 126359, "epoch": 1522} {"train_loss": -22.593460083007812, "global_step": 126360, "epoch": 1522} {"train_loss": -22.857152938842773, "global_step": 126361, "epoch": 1522} {"train_loss": -22.56769371032715, "global_step": 126362, "epoch": 1522} {"train_loss": -23.031049728393555, "global_step": 126363, "epoch": 1522} {"train_loss": -22.902612686157227, "global_step": 126364, "epoch": 1522} {"train_loss": -22.153417587280273, "global_step": 126365, "epoch": 1522} {"train_loss": -22.874948501586914, "global_step": 126366, "epoch": 1522} {"train_loss": -22.723438262939453, "global_step": 126367, "epoch": 1522} {"train_loss": -22.81165313720703, "global_step": 126368, "epoch": 1522} {"train_loss": -22.694955825805664, "global_step": 126369, "epoch": 1522} {"train_loss": -22.683475494384766, "global_step": 126370, "epoch": 1522} {"train_loss": -22.644062042236328, "global_step": 126371, "epoch": 1522} {"train_loss": -22.85743522644043, "global_step": 126372, "epoch": 1522} {"train_loss": -22.547853469848633, "global_step": 126373, "epoch": 1522} {"train_loss": -22.798139572143555, "global_step": 126374, "epoch": 1522} {"train_loss": -22.402490615844727, "global_step": 126375, "epoch": 1522} {"train_loss": -22.7601375579834, "global_step": 126376, "epoch": 1522} {"train_loss": -22.622404098510742, "global_step": 126377, "epoch": 1522} {"train_loss": -22.282384872436523, "global_step": 126378, "epoch": 1522} {"train_loss": -22.69208526611328, "global_step": 126379, "epoch": 1522} {"train_loss": -22.382999420166016, "global_step": 126380, "epoch": 1522} {"train_loss": -22.559873580932617, "global_step": 126381, "epoch": 1522} {"train_loss": -22.43686866760254, "global_step": 126382, "epoch": 1522} {"train_loss": -22.76003074645996, "global_step": 126383, "epoch": 1522} {"train_loss": -22.654266357421875, "global_step": 126384, "epoch": 1522} {"train_loss": -22.511310577392578, "global_step": 126385, "epoch": 1522} {"train_loss": -22.884143829345703, "global_step": 126386, "epoch": 1522} {"train_loss": -22.33416175842285, "global_step": 126387, "epoch": 1522} {"train_loss": -22.91268539428711, "global_step": 126388, "epoch": 1522} {"train_loss": -22.437057495117188, "global_step": 126389, "epoch": 1522} {"train_loss": -22.70185089111328, "global_step": 126390, "epoch": 1522} {"train_loss": -22.71729850769043, "global_step": 126391, "epoch": 1522} {"train_loss": -22.43594741821289, "global_step": 126392, "epoch": 1522} {"train_loss": -22.76973533630371, "global_step": 126393, "epoch": 1522} {"train_loss": -22.598567962646484, "global_step": 126394, "epoch": 1522} {"train_loss": -22.567489624023438, "global_step": 126395, "epoch": 1522} {"train_loss": -22.8866024017334, "global_step": 126396, "epoch": 1522} {"train_loss": -22.819107055664062, "global_step": 126397, "epoch": 1522} {"train_loss": -22.993803024291992, "global_step": 126398, "epoch": 1522} {"train_loss": -22.518146514892578, "global_step": 126399, "epoch": 1522} {"train_loss": -23.046175003051758, "global_step": 126400, "epoch": 1522} {"train_loss": -23.171432495117188, "global_step": 126401, "epoch": 1522} {"train_loss": -22.684995651245117, "global_step": 126402, "epoch": 1522} {"train_loss": -23.212980270385742, "global_step": 126403, "epoch": 1522} {"train_loss": -22.781103134155273, "global_step": 126404, "epoch": 1522} {"train_loss": -22.98097801208496, "global_step": 126405, "epoch": 1522} {"train_loss": -22.793703079223633, "global_step": 126406, "epoch": 1522} {"train_loss": -22.715499877929688, "global_step": 126407, "epoch": 1522} {"train_loss": -22.554042310599822, "global_step": 126408, "epoch": 1522, "val_loss": 6233654.0} {"train_loss": -21.898143768310547, "global_step": 126409, "epoch": 1523} {"train_loss": -21.770061492919922, "global_step": 126410, "epoch": 1523} {"train_loss": -22.105424880981445, "global_step": 126411, "epoch": 1523} {"train_loss": -21.761062622070312, "global_step": 126412, "epoch": 1523} {"train_loss": -22.340087890625, "global_step": 126413, "epoch": 1523} {"train_loss": -22.289974212646484, "global_step": 126414, "epoch": 1523} {"train_loss": -22.56153106689453, "global_step": 126415, "epoch": 1523} {"train_loss": -22.322406768798828, "global_step": 126416, "epoch": 1523} {"train_loss": -22.564970016479492, "global_step": 126417, "epoch": 1523} {"train_loss": -22.355363845825195, "global_step": 126418, "epoch": 1523} {"train_loss": -22.541288375854492, "global_step": 126419, "epoch": 1523} {"train_loss": -22.021438598632812, "global_step": 126420, "epoch": 1523} {"train_loss": -22.213871002197266, "global_step": 126421, "epoch": 1523} {"train_loss": -22.76307487487793, "global_step": 126422, "epoch": 1523} {"train_loss": -22.555639266967773, "global_step": 126423, "epoch": 1523} {"train_loss": -22.39942741394043, "global_step": 126424, "epoch": 1523} {"train_loss": -22.8426513671875, "global_step": 126425, "epoch": 1523} {"train_loss": -22.559358596801758, "global_step": 126426, "epoch": 1523} {"train_loss": -22.667325973510742, "global_step": 126427, "epoch": 1523} {"train_loss": -22.534093856811523, "global_step": 126428, "epoch": 1523} {"train_loss": -22.692541122436523, "global_step": 126429, "epoch": 1523} {"train_loss": -22.58713150024414, "global_step": 126430, "epoch": 1523} {"train_loss": -22.645849227905273, "global_step": 126431, "epoch": 1523} {"train_loss": -22.698450088500977, "global_step": 126432, "epoch": 1523} {"train_loss": -22.556015014648438, "global_step": 126433, "epoch": 1523} {"train_loss": -22.986738204956055, "global_step": 126434, "epoch": 1523} {"train_loss": -22.754404067993164, "global_step": 126435, "epoch": 1523} {"train_loss": -22.80915641784668, "global_step": 126436, "epoch": 1523} {"train_loss": -22.369617462158203, "global_step": 126437, "epoch": 1523} {"train_loss": -22.838871002197266, "global_step": 126438, "epoch": 1523} {"train_loss": -22.831462860107422, "global_step": 126439, "epoch": 1523} {"train_loss": -22.864336013793945, "global_step": 126440, "epoch": 1523} {"train_loss": -22.590917587280273, "global_step": 126441, "epoch": 1523} {"train_loss": -22.46880531311035, "global_step": 126442, "epoch": 1523} {"train_loss": -22.584383010864258, "global_step": 126443, "epoch": 1523} {"train_loss": -22.879493713378906, "global_step": 126444, "epoch": 1523} {"train_loss": -22.952455520629883, "global_step": 126445, "epoch": 1523} {"train_loss": -22.767789840698242, "global_step": 126446, "epoch": 1523} {"train_loss": -22.455167770385742, "global_step": 126447, "epoch": 1523} {"train_loss": -22.784564971923828, "global_step": 126448, "epoch": 1523} {"train_loss": -22.276702880859375, "global_step": 126449, "epoch": 1523} {"train_loss": -22.772184371948242, "global_step": 126450, "epoch": 1523} {"train_loss": -22.92582130432129, "global_step": 126451, "epoch": 1523} {"train_loss": -22.354724884033203, "global_step": 126452, "epoch": 1523} {"train_loss": -22.79425621032715, "global_step": 126453, "epoch": 1523} {"train_loss": -22.755064010620117, "global_step": 126454, "epoch": 1523} {"train_loss": -22.61603355407715, "global_step": 126455, "epoch": 1523} {"train_loss": -22.67461585998535, "global_step": 126456, "epoch": 1523} {"train_loss": -22.440336227416992, "global_step": 126457, "epoch": 1523} {"train_loss": -22.90740966796875, "global_step": 126458, "epoch": 1523} {"train_loss": -22.738628387451172, "global_step": 126459, "epoch": 1523} {"train_loss": -22.751508712768555, "global_step": 126460, "epoch": 1523} {"train_loss": -22.611478805541992, "global_step": 126461, "epoch": 1523} {"train_loss": -22.49284553527832, "global_step": 126462, "epoch": 1523} {"train_loss": -22.45759391784668, "global_step": 126463, "epoch": 1523} {"train_loss": -22.66156578063965, "global_step": 126464, "epoch": 1523} {"train_loss": -22.695188522338867, "global_step": 126465, "epoch": 1523} {"train_loss": -23.03989028930664, "global_step": 126466, "epoch": 1523} {"train_loss": -22.655790328979492, "global_step": 126467, "epoch": 1523} {"train_loss": -22.991134643554688, "global_step": 126468, "epoch": 1523} {"train_loss": -22.725845336914062, "global_step": 126469, "epoch": 1523} {"train_loss": -22.794408798217773, "global_step": 126470, "epoch": 1523} {"train_loss": -22.722875595092773, "global_step": 126471, "epoch": 1523} {"train_loss": -22.9234561920166, "global_step": 126472, "epoch": 1523} {"train_loss": -23.17241859436035, "global_step": 126473, "epoch": 1523} {"train_loss": -22.3703556060791, "global_step": 126474, "epoch": 1523} {"train_loss": -22.67023277282715, "global_step": 126475, "epoch": 1523} {"train_loss": -22.827953338623047, "global_step": 126476, "epoch": 1523} {"train_loss": -22.989551544189453, "global_step": 126477, "epoch": 1523} {"train_loss": -22.973377227783203, "global_step": 126478, "epoch": 1523} {"train_loss": -22.803558349609375, "global_step": 126479, "epoch": 1523} {"train_loss": -22.282934188842773, "global_step": 126480, "epoch": 1523} {"train_loss": -22.66012191772461, "global_step": 126481, "epoch": 1523} {"train_loss": -22.7280216217041, "global_step": 126482, "epoch": 1523} {"train_loss": -22.83653450012207, "global_step": 126483, "epoch": 1523} {"train_loss": -22.690845489501953, "global_step": 126484, "epoch": 1523} {"train_loss": -22.487409591674805, "global_step": 126485, "epoch": 1523} {"train_loss": -22.881855010986328, "global_step": 126486, "epoch": 1523} {"train_loss": -22.728078842163086, "global_step": 126487, "epoch": 1523} {"train_loss": -22.901426315307617, "global_step": 126488, "epoch": 1523} {"train_loss": -23.05960464477539, "global_step": 126489, "epoch": 1523} {"train_loss": -22.766408920288086, "global_step": 126490, "epoch": 1523} {"train_loss": -22.63980729895902, "global_step": 126491, "epoch": 1523, "val_loss": 6342135.0} {"train_loss": -21.930349349975586, "global_step": 126492, "epoch": 1524} {"train_loss": -21.875791549682617, "global_step": 126493, "epoch": 1524} {"train_loss": -22.364648818969727, "global_step": 126494, "epoch": 1524} {"train_loss": -21.8250675201416, "global_step": 126495, "epoch": 1524} {"train_loss": -22.28066062927246, "global_step": 126496, "epoch": 1524} {"train_loss": -22.028451919555664, "global_step": 126497, "epoch": 1524} {"train_loss": -22.191564559936523, "global_step": 126498, "epoch": 1524} {"train_loss": -22.314729690551758, "global_step": 126499, "epoch": 1524} {"train_loss": -22.384033203125, "global_step": 126500, "epoch": 1524} {"train_loss": -22.1696834564209, "global_step": 126501, "epoch": 1524} {"train_loss": -22.239238739013672, "global_step": 126502, "epoch": 1524} {"train_loss": -22.530851364135742, "global_step": 126503, "epoch": 1524} {"train_loss": -22.16859245300293, "global_step": 126504, "epoch": 1524} {"train_loss": -22.286863327026367, "global_step": 126505, "epoch": 1524} {"train_loss": -22.33327293395996, "global_step": 126506, "epoch": 1524} {"train_loss": -22.606779098510742, "global_step": 126507, "epoch": 1524} {"train_loss": -22.40711784362793, "global_step": 126508, "epoch": 1524} {"train_loss": -22.405384063720703, "global_step": 126509, "epoch": 1524} {"train_loss": -22.578500747680664, "global_step": 126510, "epoch": 1524} {"train_loss": -22.449594497680664, "global_step": 126511, "epoch": 1524} {"train_loss": -22.414724349975586, "global_step": 126512, "epoch": 1524} {"train_loss": -22.748754501342773, "global_step": 126513, "epoch": 1524} {"train_loss": -22.627700805664062, "global_step": 126514, "epoch": 1524} {"train_loss": -22.813711166381836, "global_step": 126515, "epoch": 1524} {"train_loss": -22.44141960144043, "global_step": 126516, "epoch": 1524} {"train_loss": -22.65850067138672, "global_step": 126517, "epoch": 1524} {"train_loss": -22.58645248413086, "global_step": 126518, "epoch": 1524} {"train_loss": -22.19260025024414, "global_step": 126519, "epoch": 1524} {"train_loss": -22.73895835876465, "global_step": 126520, "epoch": 1524} {"train_loss": -23.11891746520996, "global_step": 126521, "epoch": 1524} {"train_loss": -22.283435821533203, "global_step": 126522, "epoch": 1524} {"train_loss": -22.584426879882812, "global_step": 126523, "epoch": 1524} {"train_loss": -22.786550521850586, "global_step": 126524, "epoch": 1524} {"train_loss": -23.015562057495117, "global_step": 126525, "epoch": 1524} {"train_loss": -23.035829544067383, "global_step": 126526, "epoch": 1524} {"train_loss": -22.76962661743164, "global_step": 126527, "epoch": 1524} {"train_loss": -22.896570205688477, "global_step": 126528, "epoch": 1524} {"train_loss": -23.05071258544922, "global_step": 126529, "epoch": 1524} {"train_loss": -22.602691650390625, "global_step": 126530, "epoch": 1524} {"train_loss": -22.6234130859375, "global_step": 126531, "epoch": 1524} {"train_loss": -22.954345703125, "global_step": 126532, "epoch": 1524} {"train_loss": -22.643980026245117, "global_step": 126533, "epoch": 1524} {"train_loss": -22.46493148803711, "global_step": 126534, "epoch": 1524} {"train_loss": -22.681903839111328, "global_step": 126535, "epoch": 1524} {"train_loss": -23.028562545776367, "global_step": 126536, "epoch": 1524} {"train_loss": -22.30759048461914, "global_step": 126537, "epoch": 1524} {"train_loss": -22.608280181884766, "global_step": 126538, "epoch": 1524} {"train_loss": -22.959766387939453, "global_step": 126539, "epoch": 1524} {"train_loss": -22.765960693359375, "global_step": 126540, "epoch": 1524} {"train_loss": -22.712514877319336, "global_step": 126541, "epoch": 1524} {"train_loss": -22.732269287109375, "global_step": 126542, "epoch": 1524} {"train_loss": -22.742902755737305, "global_step": 126543, "epoch": 1524} {"train_loss": -22.54134178161621, "global_step": 126544, "epoch": 1524} {"train_loss": -22.827495574951172, "global_step": 126545, "epoch": 1524} {"train_loss": -22.782644271850586, "global_step": 126546, "epoch": 1524} {"train_loss": -22.316877365112305, "global_step": 126547, "epoch": 1524} {"train_loss": -23.06646156311035, "global_step": 126548, "epoch": 1524} {"train_loss": -22.670019149780273, "global_step": 126549, "epoch": 1524} {"train_loss": -22.825307846069336, "global_step": 126550, "epoch": 1524} {"train_loss": -23.095029830932617, "global_step": 126551, "epoch": 1524} {"train_loss": -23.081647872924805, "global_step": 126552, "epoch": 1524} {"train_loss": -22.42911148071289, "global_step": 126553, "epoch": 1524} {"train_loss": -22.661462783813477, "global_step": 126554, "epoch": 1524} {"train_loss": -22.56136131286621, "global_step": 126555, "epoch": 1524} {"train_loss": -22.794179916381836, "global_step": 126556, "epoch": 1524} {"train_loss": -22.675846099853516, "global_step": 126557, "epoch": 1524} {"train_loss": -22.388471603393555, "global_step": 126558, "epoch": 1524} {"train_loss": -22.825098037719727, "global_step": 126559, "epoch": 1524} {"train_loss": -23.07170295715332, "global_step": 126560, "epoch": 1524} {"train_loss": -22.137447357177734, "global_step": 126561, "epoch": 1524} {"train_loss": -22.521337509155273, "global_step": 126562, "epoch": 1524} {"train_loss": -22.370906829833984, "global_step": 126563, "epoch": 1524} {"train_loss": -22.586652755737305, "global_step": 126564, "epoch": 1524} {"train_loss": -22.847787857055664, "global_step": 126565, "epoch": 1524} {"train_loss": -22.631664276123047, "global_step": 126566, "epoch": 1524} {"train_loss": -22.169227600097656, "global_step": 126567, "epoch": 1524} {"train_loss": -22.82579803466797, "global_step": 126568, "epoch": 1524} {"train_loss": -22.59958839416504, "global_step": 126569, "epoch": 1524} {"train_loss": -22.797882080078125, "global_step": 126570, "epoch": 1524} {"train_loss": -22.790319442749023, "global_step": 126571, "epoch": 1524} {"train_loss": -22.425628662109375, "global_step": 126572, "epoch": 1524} {"train_loss": -22.976839065551758, "global_step": 126573, "epoch": 1524} {"train_loss": -22.598629227603773, "global_step": 126574, "epoch": 1524, "val_loss": 6384153.0} {"train_loss": -22.482830047607422, "global_step": 126575, "epoch": 1525} {"train_loss": -22.522497177124023, "global_step": 126576, "epoch": 1525} {"train_loss": -22.547565460205078, "global_step": 126577, "epoch": 1525} {"train_loss": -22.67110824584961, "global_step": 126578, "epoch": 1525} {"train_loss": -22.769412994384766, "global_step": 126579, "epoch": 1525} {"train_loss": -22.61052894592285, "global_step": 126580, "epoch": 1525} {"train_loss": -22.488752365112305, "global_step": 126581, "epoch": 1525} {"train_loss": -22.645978927612305, "global_step": 126582, "epoch": 1525} {"train_loss": -22.7902774810791, "global_step": 126583, "epoch": 1525} {"train_loss": -22.295230865478516, "global_step": 126584, "epoch": 1525} {"train_loss": -22.488012313842773, "global_step": 126585, "epoch": 1525} {"train_loss": -22.455663681030273, "global_step": 126586, "epoch": 1525} {"train_loss": -22.937068939208984, "global_step": 126587, "epoch": 1525} {"train_loss": -22.299108505249023, "global_step": 126588, "epoch": 1525} {"train_loss": -22.58645248413086, "global_step": 126589, "epoch": 1525} {"train_loss": -22.778409957885742, "global_step": 126590, "epoch": 1525} {"train_loss": -22.36664390563965, "global_step": 126591, "epoch": 1525} {"train_loss": -22.843114852905273, "global_step": 126592, "epoch": 1525} {"train_loss": -22.34600830078125, "global_step": 126593, "epoch": 1525} {"train_loss": -22.43828582763672, "global_step": 126594, "epoch": 1525} {"train_loss": -22.729597091674805, "global_step": 126595, "epoch": 1525} {"train_loss": -22.318784713745117, "global_step": 126596, "epoch": 1525} {"train_loss": -22.740026473999023, "global_step": 126597, "epoch": 1525} {"train_loss": -22.747343063354492, "global_step": 126598, "epoch": 1525} {"train_loss": -23.022550582885742, "global_step": 126599, "epoch": 1525} {"train_loss": -22.89407730102539, "global_step": 126600, "epoch": 1525} {"train_loss": -22.740222930908203, "global_step": 126601, "epoch": 1525} {"train_loss": -22.736406326293945, "global_step": 126602, "epoch": 1525} {"train_loss": -22.780250549316406, "global_step": 126603, "epoch": 1525} {"train_loss": -23.012144088745117, "global_step": 126604, "epoch": 1525} {"train_loss": -22.665922164916992, "global_step": 126605, "epoch": 1525} {"train_loss": -22.99970054626465, "global_step": 126606, "epoch": 1525} {"train_loss": -22.604211807250977, "global_step": 126607, "epoch": 1525} {"train_loss": -23.299274444580078, "global_step": 126608, "epoch": 1525} {"train_loss": -22.969459533691406, "global_step": 126609, "epoch": 1525} {"train_loss": -22.619876861572266, "global_step": 126610, "epoch": 1525} {"train_loss": -22.768421173095703, "global_step": 126611, "epoch": 1525} {"train_loss": -22.665136337280273, "global_step": 126612, "epoch": 1525} {"train_loss": -22.339574813842773, "global_step": 126613, "epoch": 1525} {"train_loss": -22.72600746154785, "global_step": 126614, "epoch": 1525} {"train_loss": -22.385055541992188, "global_step": 126615, "epoch": 1525} {"train_loss": -22.685380935668945, "global_step": 126616, "epoch": 1525} {"train_loss": -22.791866302490234, "global_step": 126617, "epoch": 1525} {"train_loss": -23.063444137573242, "global_step": 126618, "epoch": 1525} {"train_loss": -22.868101119995117, "global_step": 126619, "epoch": 1525} {"train_loss": -22.666507720947266, "global_step": 126620, "epoch": 1525} {"train_loss": -22.950407028198242, "global_step": 126621, "epoch": 1525} {"train_loss": -22.257535934448242, "global_step": 126622, "epoch": 1525} {"train_loss": -22.84479331970215, "global_step": 126623, "epoch": 1525} {"train_loss": -22.765295028686523, "global_step": 126624, "epoch": 1525} {"train_loss": -22.671539306640625, "global_step": 126625, "epoch": 1525} {"train_loss": -22.882429122924805, "global_step": 126626, "epoch": 1525} {"train_loss": -22.62302017211914, "global_step": 126627, "epoch": 1525} {"train_loss": -22.69980812072754, "global_step": 126628, "epoch": 1525} {"train_loss": -22.904170989990234, "global_step": 126629, "epoch": 1525} {"train_loss": -22.52522087097168, "global_step": 126630, "epoch": 1525} {"train_loss": -22.67828941345215, "global_step": 126631, "epoch": 1525} {"train_loss": -22.65679931640625, "global_step": 126632, "epoch": 1525} {"train_loss": -22.919034957885742, "global_step": 126633, "epoch": 1525} {"train_loss": -22.697628021240234, "global_step": 126634, "epoch": 1525} {"train_loss": -22.885095596313477, "global_step": 126635, "epoch": 1525} {"train_loss": -22.459165573120117, "global_step": 126636, "epoch": 1525} {"train_loss": -22.800643920898438, "global_step": 126637, "epoch": 1525} {"train_loss": -22.648460388183594, "global_step": 126638, "epoch": 1525} {"train_loss": -22.81208610534668, "global_step": 126639, "epoch": 1525} {"train_loss": -22.668140411376953, "global_step": 126640, "epoch": 1525} {"train_loss": -22.890491485595703, "global_step": 126641, "epoch": 1525} {"train_loss": -22.615726470947266, "global_step": 126642, "epoch": 1525} {"train_loss": -22.44443702697754, "global_step": 126643, "epoch": 1525} {"train_loss": -22.574188232421875, "global_step": 126644, "epoch": 1525} {"train_loss": -22.703916549682617, "global_step": 126645, "epoch": 1525} {"train_loss": -22.829105377197266, "global_step": 126646, "epoch": 1525} {"train_loss": -22.763513565063477, "global_step": 126647, "epoch": 1525} {"train_loss": -22.791351318359375, "global_step": 126648, "epoch": 1525} {"train_loss": -22.782974243164062, "global_step": 126649, "epoch": 1525} {"train_loss": -22.817853927612305, "global_step": 126650, "epoch": 1525} {"train_loss": -22.511165618896484, "global_step": 126651, "epoch": 1525} {"train_loss": -22.928234100341797, "global_step": 126652, "epoch": 1525} {"train_loss": -22.824241638183594, "global_step": 126653, "epoch": 1525} {"train_loss": -23.047069549560547, "global_step": 126654, "epoch": 1525} {"train_loss": -22.463510513305664, "global_step": 126655, "epoch": 1525} {"train_loss": -22.502531051635742, "global_step": 126656, "epoch": 1525} {"train_loss": -22.67963827661721, "global_step": 126657, "epoch": 1525, "val_loss": 6221925.5} {"train_loss": -22.027381896972656, "global_step": 126658, "epoch": 1526} {"train_loss": -21.870548248291016, "global_step": 126659, "epoch": 1526} {"train_loss": -22.217445373535156, "global_step": 126660, "epoch": 1526} {"train_loss": -22.084638595581055, "global_step": 126661, "epoch": 1526} {"train_loss": -21.940265655517578, "global_step": 126662, "epoch": 1526} {"train_loss": -21.963748931884766, "global_step": 126663, "epoch": 1526} {"train_loss": -22.331161499023438, "global_step": 126664, "epoch": 1526} {"train_loss": -21.88527488708496, "global_step": 126665, "epoch": 1526} {"train_loss": -22.0264949798584, "global_step": 126666, "epoch": 1526} {"train_loss": -22.4934024810791, "global_step": 126667, "epoch": 1526} {"train_loss": -22.02528190612793, "global_step": 126668, "epoch": 1526} {"train_loss": -22.507776260375977, "global_step": 126669, "epoch": 1526} {"train_loss": -22.10772132873535, "global_step": 126670, "epoch": 1526} {"train_loss": -22.51568603515625, "global_step": 126671, "epoch": 1526} {"train_loss": -22.42750358581543, "global_step": 126672, "epoch": 1526} {"train_loss": -22.09039878845215, "global_step": 126673, "epoch": 1526} {"train_loss": -22.264734268188477, "global_step": 126674, "epoch": 1526} {"train_loss": -22.12767219543457, "global_step": 126675, "epoch": 1526} {"train_loss": -22.45758628845215, "global_step": 126676, "epoch": 1526} {"train_loss": -22.381866455078125, "global_step": 126677, "epoch": 1526} {"train_loss": -22.739805221557617, "global_step": 126678, "epoch": 1526} {"train_loss": -22.399600982666016, "global_step": 126679, "epoch": 1526} {"train_loss": -22.078271865844727, "global_step": 126680, "epoch": 1526} {"train_loss": -22.583768844604492, "global_step": 126681, "epoch": 1526} {"train_loss": -22.535442352294922, "global_step": 126682, "epoch": 1526} {"train_loss": -22.71124839782715, "global_step": 126683, "epoch": 1526} {"train_loss": -22.652517318725586, "global_step": 126684, "epoch": 1526} {"train_loss": -22.632612228393555, "global_step": 126685, "epoch": 1526} {"train_loss": -22.536609649658203, "global_step": 126686, "epoch": 1526} {"train_loss": -22.17466163635254, "global_step": 126687, "epoch": 1526} {"train_loss": -22.315216064453125, "global_step": 126688, "epoch": 1526} {"train_loss": -22.552045822143555, "global_step": 126689, "epoch": 1526} {"train_loss": -22.848628997802734, "global_step": 126690, "epoch": 1526} {"train_loss": -22.53382682800293, "global_step": 126691, "epoch": 1526} {"train_loss": -22.88777732849121, "global_step": 126692, "epoch": 1526} {"train_loss": -22.524097442626953, "global_step": 126693, "epoch": 1526} {"train_loss": -22.775211334228516, "global_step": 126694, "epoch": 1526} {"train_loss": -22.839874267578125, "global_step": 126695, "epoch": 1526} {"train_loss": -22.809423446655273, "global_step": 126696, "epoch": 1526} {"train_loss": -22.585920333862305, "global_step": 126697, "epoch": 1526} {"train_loss": -23.030832290649414, "global_step": 126698, "epoch": 1526} {"train_loss": -22.65521812438965, "global_step": 126699, "epoch": 1526} {"train_loss": -22.9833927154541, "global_step": 126700, "epoch": 1526} {"train_loss": -22.45083236694336, "global_step": 126701, "epoch": 1526} {"train_loss": -22.71270179748535, "global_step": 126702, "epoch": 1526} {"train_loss": -22.62202262878418, "global_step": 126703, "epoch": 1526} {"train_loss": -22.887638092041016, "global_step": 126704, "epoch": 1526} {"train_loss": -22.75247573852539, "global_step": 126705, "epoch": 1526} {"train_loss": -22.489221572875977, "global_step": 126706, "epoch": 1526} {"train_loss": -22.9456844329834, "global_step": 126707, "epoch": 1526} {"train_loss": -22.312223434448242, "global_step": 126708, "epoch": 1526} {"train_loss": -22.850515365600586, "global_step": 126709, "epoch": 1526} {"train_loss": -22.73200798034668, "global_step": 126710, "epoch": 1526} {"train_loss": -22.34451675415039, "global_step": 126711, "epoch": 1526} {"train_loss": -22.454877853393555, "global_step": 126712, "epoch": 1526} {"train_loss": -22.368940353393555, "global_step": 126713, "epoch": 1526} {"train_loss": -23.140966415405273, "global_step": 126714, "epoch": 1526} {"train_loss": -23.033933639526367, "global_step": 126715, "epoch": 1526} {"train_loss": -23.080562591552734, "global_step": 126716, "epoch": 1526} {"train_loss": -22.53954315185547, "global_step": 126717, "epoch": 1526} {"train_loss": -22.6055908203125, "global_step": 126718, "epoch": 1526} {"train_loss": -23.035490036010742, "global_step": 126719, "epoch": 1526} {"train_loss": -22.841283798217773, "global_step": 126720, "epoch": 1526} {"train_loss": -22.477415084838867, "global_step": 126721, "epoch": 1526} {"train_loss": -22.825910568237305, "global_step": 126722, "epoch": 1526} {"train_loss": -22.9898738861084, "global_step": 126723, "epoch": 1526} {"train_loss": -22.772371292114258, "global_step": 126724, "epoch": 1526} {"train_loss": -22.768421173095703, "global_step": 126725, "epoch": 1526} {"train_loss": -22.736454010009766, "global_step": 126726, "epoch": 1526} {"train_loss": -23.177764892578125, "global_step": 126727, "epoch": 1526} {"train_loss": -22.821950912475586, "global_step": 126728, "epoch": 1526} {"train_loss": -22.66127586364746, "global_step": 126729, "epoch": 1526} {"train_loss": -22.54335594177246, "global_step": 126730, "epoch": 1526} {"train_loss": -23.08302879333496, "global_step": 126731, "epoch": 1526} {"train_loss": -22.720836639404297, "global_step": 126732, "epoch": 1526} {"train_loss": -22.848907470703125, "global_step": 126733, "epoch": 1526} {"train_loss": -22.8299617767334, "global_step": 126734, "epoch": 1526} {"train_loss": -22.72332763671875, "global_step": 126735, "epoch": 1526} {"train_loss": -22.491907119750977, "global_step": 126736, "epoch": 1526} {"train_loss": -22.786165237426758, "global_step": 126737, "epoch": 1526} {"train_loss": -22.57716178894043, "global_step": 126738, "epoch": 1526} {"train_loss": -22.30453872680664, "global_step": 126739, "epoch": 1526} {"train_loss": -22.566759086516967, "global_step": 126740, "epoch": 1526, "val_loss": 6274371.0} {"train_loss": -22.675405502319336, "global_step": 126741, "epoch": 1527} {"train_loss": -21.971067428588867, "global_step": 126742, "epoch": 1527} {"train_loss": -22.26423454284668, "global_step": 126743, "epoch": 1527} {"train_loss": -22.30193519592285, "global_step": 126744, "epoch": 1527} {"train_loss": -22.41265296936035, "global_step": 126745, "epoch": 1527} {"train_loss": -22.092039108276367, "global_step": 126746, "epoch": 1527} {"train_loss": -22.405797958374023, "global_step": 126747, "epoch": 1527} {"train_loss": -22.732376098632812, "global_step": 126748, "epoch": 1527} {"train_loss": -22.312253952026367, "global_step": 126749, "epoch": 1527} {"train_loss": -23.01593017578125, "global_step": 126750, "epoch": 1527} {"train_loss": -22.674325942993164, "global_step": 126751, "epoch": 1527} {"train_loss": -23.169204711914062, "global_step": 126752, "epoch": 1527} {"train_loss": -22.079565048217773, "global_step": 126753, "epoch": 1527} {"train_loss": -22.61726188659668, "global_step": 126754, "epoch": 1527} {"train_loss": -22.490264892578125, "global_step": 126755, "epoch": 1527} {"train_loss": -22.503904342651367, "global_step": 126756, "epoch": 1527} {"train_loss": -22.767240524291992, "global_step": 126757, "epoch": 1527} {"train_loss": -22.001901626586914, "global_step": 126758, "epoch": 1527} {"train_loss": -22.754043579101562, "global_step": 126759, "epoch": 1527} {"train_loss": -22.46497344970703, "global_step": 126760, "epoch": 1527} {"train_loss": -22.65130043029785, "global_step": 126761, "epoch": 1527} {"train_loss": -22.749393463134766, "global_step": 126762, "epoch": 1527} {"train_loss": -22.355133056640625, "global_step": 126763, "epoch": 1527} {"train_loss": -22.697986602783203, "global_step": 126764, "epoch": 1527} {"train_loss": -22.55426597595215, "global_step": 126765, "epoch": 1527} {"train_loss": -22.48639488220215, "global_step": 126766, "epoch": 1527} {"train_loss": -22.62675666809082, "global_step": 126767, "epoch": 1527} {"train_loss": -22.610971450805664, "global_step": 126768, "epoch": 1527} {"train_loss": -22.880355834960938, "global_step": 126769, "epoch": 1527} {"train_loss": -22.659521102905273, "global_step": 126770, "epoch": 1527} {"train_loss": -22.507007598876953, "global_step": 126771, "epoch": 1527} {"train_loss": -22.718093872070312, "global_step": 126772, "epoch": 1527} {"train_loss": -22.9617919921875, "global_step": 126773, "epoch": 1527} {"train_loss": -22.76072120666504, "global_step": 126774, "epoch": 1527} {"train_loss": -22.57564353942871, "global_step": 126775, "epoch": 1527} {"train_loss": -23.05146598815918, "global_step": 126776, "epoch": 1527} {"train_loss": -22.991382598876953, "global_step": 126777, "epoch": 1527} {"train_loss": -22.72696304321289, "global_step": 126778, "epoch": 1527} {"train_loss": -22.507970809936523, "global_step": 126779, "epoch": 1527} {"train_loss": -22.80409049987793, "global_step": 126780, "epoch": 1527} {"train_loss": -22.766782760620117, "global_step": 126781, "epoch": 1527} {"train_loss": -22.73342514038086, "global_step": 126782, "epoch": 1527} {"train_loss": -22.307249069213867, "global_step": 126783, "epoch": 1527} {"train_loss": -22.63775062561035, "global_step": 126784, "epoch": 1527} {"train_loss": -22.221548080444336, "global_step": 126785, "epoch": 1527} {"train_loss": -22.817699432373047, "global_step": 126786, "epoch": 1527} {"train_loss": -22.682228088378906, "global_step": 126787, "epoch": 1527} {"train_loss": -23.144861221313477, "global_step": 126788, "epoch": 1527} {"train_loss": -22.778820037841797, "global_step": 126789, "epoch": 1527} {"train_loss": -22.876569747924805, "global_step": 126790, "epoch": 1527} {"train_loss": -22.787790298461914, "global_step": 126791, "epoch": 1527} {"train_loss": -22.932706832885742, "global_step": 126792, "epoch": 1527} {"train_loss": -22.887004852294922, "global_step": 126793, "epoch": 1527} {"train_loss": -22.679861068725586, "global_step": 126794, "epoch": 1527} {"train_loss": -23.095415115356445, "global_step": 126795, "epoch": 1527} {"train_loss": -22.46185302734375, "global_step": 126796, "epoch": 1527} {"train_loss": -22.718719482421875, "global_step": 126797, "epoch": 1527} {"train_loss": -22.864816665649414, "global_step": 126798, "epoch": 1527} {"train_loss": -22.23481559753418, "global_step": 126799, "epoch": 1527} {"train_loss": -22.766183853149414, "global_step": 126800, "epoch": 1527} {"train_loss": -22.993383407592773, "global_step": 126801, "epoch": 1527} {"train_loss": -22.722139358520508, "global_step": 126802, "epoch": 1527} {"train_loss": -22.760251998901367, "global_step": 126803, "epoch": 1527} {"train_loss": -22.836273193359375, "global_step": 126804, "epoch": 1527} {"train_loss": -23.102975845336914, "global_step": 126805, "epoch": 1527} {"train_loss": -22.654617309570312, "global_step": 126806, "epoch": 1527} {"train_loss": -23.263540267944336, "global_step": 126807, "epoch": 1527} {"train_loss": -22.622516632080078, "global_step": 126808, "epoch": 1527} {"train_loss": -22.905118942260742, "global_step": 126809, "epoch": 1527} {"train_loss": -22.795488357543945, "global_step": 126810, "epoch": 1527} {"train_loss": -23.097911834716797, "global_step": 126811, "epoch": 1527} {"train_loss": -22.92490005493164, "global_step": 126812, "epoch": 1527} {"train_loss": -22.482160568237305, "global_step": 126813, "epoch": 1527} {"train_loss": -22.504648208618164, "global_step": 126814, "epoch": 1527} {"train_loss": -22.58535385131836, "global_step": 126815, "epoch": 1527} {"train_loss": -22.56735610961914, "global_step": 126816, "epoch": 1527} {"train_loss": -22.745450973510742, "global_step": 126817, "epoch": 1527} {"train_loss": -22.737478256225586, "global_step": 126818, "epoch": 1527} {"train_loss": -22.541048049926758, "global_step": 126819, "epoch": 1527} {"train_loss": -22.537368774414062, "global_step": 126820, "epoch": 1527} {"train_loss": -22.896989822387695, "global_step": 126821, "epoch": 1527} {"train_loss": -22.7557373046875, "global_step": 126822, "epoch": 1527} {"train_loss": -22.669084525970092, "global_step": 126823, "epoch": 1527, "val_loss": 6377539.5} {"train_loss": -22.422266006469727, "global_step": 126824, "epoch": 1528} {"train_loss": -22.419397354125977, "global_step": 126825, "epoch": 1528} {"train_loss": -22.675762176513672, "global_step": 126826, "epoch": 1528} {"train_loss": -22.63701820373535, "global_step": 126827, "epoch": 1528} {"train_loss": -22.346891403198242, "global_step": 126828, "epoch": 1528} {"train_loss": -22.649669647216797, "global_step": 126829, "epoch": 1528} {"train_loss": -22.6357421875, "global_step": 126830, "epoch": 1528} {"train_loss": -22.623302459716797, "global_step": 126831, "epoch": 1528} {"train_loss": -22.3489933013916, "global_step": 126832, "epoch": 1528} {"train_loss": -22.731464385986328, "global_step": 126833, "epoch": 1528} {"train_loss": -22.638341903686523, "global_step": 126834, "epoch": 1528} {"train_loss": -22.176166534423828, "global_step": 126835, "epoch": 1528} {"train_loss": -22.63665771484375, "global_step": 126836, "epoch": 1528} {"train_loss": -22.63246726989746, "global_step": 126837, "epoch": 1528} {"train_loss": -22.79035758972168, "global_step": 126838, "epoch": 1528} {"train_loss": -22.548114776611328, "global_step": 126839, "epoch": 1528} {"train_loss": -22.41474151611328, "global_step": 126840, "epoch": 1528} {"train_loss": -22.629657745361328, "global_step": 126841, "epoch": 1528} {"train_loss": -22.70807456970215, "global_step": 126842, "epoch": 1528} {"train_loss": -22.67122459411621, "global_step": 126843, "epoch": 1528} {"train_loss": -22.76771354675293, "global_step": 126844, "epoch": 1528} {"train_loss": -22.577838897705078, "global_step": 126845, "epoch": 1528} {"train_loss": -22.78986167907715, "global_step": 126846, "epoch": 1528} {"train_loss": -22.625463485717773, "global_step": 126847, "epoch": 1528} {"train_loss": -22.720312118530273, "global_step": 126848, "epoch": 1528} {"train_loss": -22.3389892578125, "global_step": 126849, "epoch": 1528} {"train_loss": -22.929737091064453, "global_step": 126850, "epoch": 1528} {"train_loss": -22.907155990600586, "global_step": 126851, "epoch": 1528} {"train_loss": -22.977243423461914, "global_step": 126852, "epoch": 1528} {"train_loss": -22.837614059448242, "global_step": 126853, "epoch": 1528} {"train_loss": -22.762643814086914, "global_step": 126854, "epoch": 1528} {"train_loss": -23.103757858276367, "global_step": 126855, "epoch": 1528} {"train_loss": -22.238296508789062, "global_step": 126856, "epoch": 1528} {"train_loss": -22.807645797729492, "global_step": 126857, "epoch": 1528} {"train_loss": -22.636947631835938, "global_step": 126858, "epoch": 1528} {"train_loss": -22.534269332885742, "global_step": 126859, "epoch": 1528} {"train_loss": -22.965715408325195, "global_step": 126860, "epoch": 1528} {"train_loss": -22.766366958618164, "global_step": 126861, "epoch": 1528} {"train_loss": -23.055564880371094, "global_step": 126862, "epoch": 1528} {"train_loss": -22.40275764465332, "global_step": 126863, "epoch": 1528} {"train_loss": -22.648944854736328, "global_step": 126864, "epoch": 1528} {"train_loss": -22.35687255859375, "global_step": 126865, "epoch": 1528} {"train_loss": -23.078824996948242, "global_step": 126866, "epoch": 1528} {"train_loss": -23.415361404418945, "global_step": 126867, "epoch": 1528} {"train_loss": -22.828502655029297, "global_step": 126868, "epoch": 1528} {"train_loss": -22.669950485229492, "global_step": 126869, "epoch": 1528} {"train_loss": -22.814748764038086, "global_step": 126870, "epoch": 1528} {"train_loss": -22.666120529174805, "global_step": 126871, "epoch": 1528} {"train_loss": -23.11819839477539, "global_step": 126872, "epoch": 1528} {"train_loss": -22.50061798095703, "global_step": 126873, "epoch": 1528} {"train_loss": -22.91240882873535, "global_step": 126874, "epoch": 1528} {"train_loss": -22.634679794311523, "global_step": 126875, "epoch": 1528} {"train_loss": -22.821964263916016, "global_step": 126876, "epoch": 1528} {"train_loss": -22.265377044677734, "global_step": 126877, "epoch": 1528} {"train_loss": -22.699718475341797, "global_step": 126878, "epoch": 1528} {"train_loss": -22.548261642456055, "global_step": 126879, "epoch": 1528} {"train_loss": -22.660764694213867, "global_step": 126880, "epoch": 1528} {"train_loss": -22.86103630065918, "global_step": 126881, "epoch": 1528} {"train_loss": -22.393857955932617, "global_step": 126882, "epoch": 1528} {"train_loss": -22.44939613342285, "global_step": 126883, "epoch": 1528} {"train_loss": -22.554855346679688, "global_step": 126884, "epoch": 1528} {"train_loss": -22.638166427612305, "global_step": 126885, "epoch": 1528} {"train_loss": -22.36800193786621, "global_step": 126886, "epoch": 1528} {"train_loss": -22.849515914916992, "global_step": 126887, "epoch": 1528} {"train_loss": -22.322864532470703, "global_step": 126888, "epoch": 1528} {"train_loss": -23.050317764282227, "global_step": 126889, "epoch": 1528} {"train_loss": -22.577190399169922, "global_step": 126890, "epoch": 1528} {"train_loss": -22.500085830688477, "global_step": 126891, "epoch": 1528} {"train_loss": -22.873741149902344, "global_step": 126892, "epoch": 1528} {"train_loss": -22.96415138244629, "global_step": 126893, "epoch": 1528} {"train_loss": -22.544076919555664, "global_step": 126894, "epoch": 1528} {"train_loss": -22.90168571472168, "global_step": 126895, "epoch": 1528} {"train_loss": -22.514720916748047, "global_step": 126896, "epoch": 1528} {"train_loss": -22.720352172851562, "global_step": 126897, "epoch": 1528} {"train_loss": -22.48499870300293, "global_step": 126898, "epoch": 1528} {"train_loss": -22.933183670043945, "global_step": 126899, "epoch": 1528} {"train_loss": -23.21363639831543, "global_step": 126900, "epoch": 1528} {"train_loss": -23.157367706298828, "global_step": 126901, "epoch": 1528} {"train_loss": -22.673812866210938, "global_step": 126902, "epoch": 1528} {"train_loss": -22.85847282409668, "global_step": 126903, "epoch": 1528} {"train_loss": -22.6622314453125, "global_step": 126904, "epoch": 1528} {"train_loss": -22.63140106201172, "global_step": 126905, "epoch": 1528} {"train_loss": -22.67289042185588, "global_step": 126906, "epoch": 1528, "val_loss": 6228996.0} {"train_loss": -21.80499267578125, "global_step": 126907, "epoch": 1529} {"train_loss": -21.729764938354492, "global_step": 126908, "epoch": 1529} {"train_loss": -22.491531372070312, "global_step": 126909, "epoch": 1529} {"train_loss": -22.535629272460938, "global_step": 126910, "epoch": 1529} {"train_loss": -22.179784774780273, "global_step": 126911, "epoch": 1529} {"train_loss": -22.662015914916992, "global_step": 126912, "epoch": 1529} {"train_loss": -21.908329010009766, "global_step": 126913, "epoch": 1529} {"train_loss": -22.36182975769043, "global_step": 126914, "epoch": 1529} {"train_loss": -22.586200714111328, "global_step": 126915, "epoch": 1529} {"train_loss": -22.20389175415039, "global_step": 126916, "epoch": 1529} {"train_loss": -22.505952835083008, "global_step": 126917, "epoch": 1529} {"train_loss": -22.739240646362305, "global_step": 126918, "epoch": 1529} {"train_loss": -22.227867126464844, "global_step": 126919, "epoch": 1529} {"train_loss": -22.328004837036133, "global_step": 126920, "epoch": 1529} {"train_loss": -22.72850799560547, "global_step": 126921, "epoch": 1529} {"train_loss": -22.57456398010254, "global_step": 126922, "epoch": 1529} {"train_loss": -22.734365463256836, "global_step": 126923, "epoch": 1529} {"train_loss": -22.473806381225586, "global_step": 126924, "epoch": 1529} {"train_loss": -22.7558650970459, "global_step": 126925, "epoch": 1529} {"train_loss": -22.57492446899414, "global_step": 126926, "epoch": 1529} {"train_loss": -22.38241958618164, "global_step": 126927, "epoch": 1529} {"train_loss": -22.439577102661133, "global_step": 126928, "epoch": 1529} {"train_loss": -22.541845321655273, "global_step": 126929, "epoch": 1529} {"train_loss": -22.89855194091797, "global_step": 126930, "epoch": 1529} {"train_loss": -22.83868408203125, "global_step": 126931, "epoch": 1529} {"train_loss": -22.59000015258789, "global_step": 126932, "epoch": 1529} {"train_loss": -22.417646408081055, "global_step": 126933, "epoch": 1529} {"train_loss": -23.11774253845215, "global_step": 126934, "epoch": 1529} {"train_loss": -22.217641830444336, "global_step": 126935, "epoch": 1529} {"train_loss": -22.21192741394043, "global_step": 126936, "epoch": 1529} {"train_loss": -22.572385787963867, "global_step": 126937, "epoch": 1529} {"train_loss": -22.576894760131836, "global_step": 126938, "epoch": 1529} {"train_loss": -22.578582763671875, "global_step": 126939, "epoch": 1529} {"train_loss": -22.703676223754883, "global_step": 126940, "epoch": 1529} {"train_loss": -23.075176239013672, "global_step": 126941, "epoch": 1529} {"train_loss": -22.82753562927246, "global_step": 126942, "epoch": 1529} {"train_loss": -22.787145614624023, "global_step": 126943, "epoch": 1529} {"train_loss": -22.87970542907715, "global_step": 126944, "epoch": 1529} {"train_loss": -22.861204147338867, "global_step": 126945, "epoch": 1529} {"train_loss": -23.059926986694336, "global_step": 126946, "epoch": 1529} {"train_loss": -22.843799591064453, "global_step": 126947, "epoch": 1529} {"train_loss": -22.79059600830078, "global_step": 126948, "epoch": 1529} {"train_loss": -22.868881225585938, "global_step": 126949, "epoch": 1529} {"train_loss": -22.90216636657715, "global_step": 126950, "epoch": 1529} {"train_loss": -22.414033889770508, "global_step": 126951, "epoch": 1529} {"train_loss": -22.975412368774414, "global_step": 126952, "epoch": 1529} {"train_loss": -23.091541290283203, "global_step": 126953, "epoch": 1529} {"train_loss": -22.606962203979492, "global_step": 126954, "epoch": 1529} {"train_loss": -22.87888526916504, "global_step": 126955, "epoch": 1529} {"train_loss": -22.550188064575195, "global_step": 126956, "epoch": 1529} {"train_loss": -22.764083862304688, "global_step": 126957, "epoch": 1529} {"train_loss": -22.744386672973633, "global_step": 126958, "epoch": 1529} {"train_loss": -22.94081687927246, "global_step": 126959, "epoch": 1529} {"train_loss": -22.692182540893555, "global_step": 126960, "epoch": 1529} {"train_loss": -22.446348190307617, "global_step": 126961, "epoch": 1529} {"train_loss": -22.760385513305664, "global_step": 126962, "epoch": 1529} {"train_loss": -22.5555477142334, "global_step": 126963, "epoch": 1529} {"train_loss": -23.03670883178711, "global_step": 126964, "epoch": 1529} {"train_loss": -22.6485652923584, "global_step": 126965, "epoch": 1529} {"train_loss": -22.711864471435547, "global_step": 126966, "epoch": 1529} {"train_loss": -23.046770095825195, "global_step": 126967, "epoch": 1529} {"train_loss": -22.74647331237793, "global_step": 126968, "epoch": 1529} {"train_loss": -22.395360946655273, "global_step": 126969, "epoch": 1529} {"train_loss": -22.55048942565918, "global_step": 126970, "epoch": 1529} {"train_loss": -22.998641967773438, "global_step": 126971, "epoch": 1529} {"train_loss": -22.862668991088867, "global_step": 126972, "epoch": 1529} {"train_loss": -22.6462345123291, "global_step": 126973, "epoch": 1529} {"train_loss": -22.774572372436523, "global_step": 126974, "epoch": 1529} {"train_loss": -22.793577194213867, "global_step": 126975, "epoch": 1529} {"train_loss": -22.894630432128906, "global_step": 126976, "epoch": 1529} {"train_loss": -22.720340728759766, "global_step": 126977, "epoch": 1529} {"train_loss": -22.72759437561035, "global_step": 126978, "epoch": 1529} {"train_loss": -23.081567764282227, "global_step": 126979, "epoch": 1529} {"train_loss": -22.721487045288086, "global_step": 126980, "epoch": 1529} {"train_loss": -22.76679801940918, "global_step": 126981, "epoch": 1529} {"train_loss": -22.939559936523438, "global_step": 126982, "epoch": 1529} {"train_loss": -22.70709228515625, "global_step": 126983, "epoch": 1529} {"train_loss": -22.877769470214844, "global_step": 126984, "epoch": 1529} {"train_loss": -22.625732421875, "global_step": 126985, "epoch": 1529} {"train_loss": -23.037731170654297, "global_step": 126986, "epoch": 1529} {"train_loss": -22.953454971313477, "global_step": 126987, "epoch": 1529} {"train_loss": -22.836288452148438, "global_step": 126988, "epoch": 1529} {"train_loss": -22.670454990432923, "global_step": 126989, "epoch": 1529, "val_loss": 6283115.5} {"train_loss": -21.720417022705078, "global_step": 126990, "epoch": 1530} {"train_loss": -21.70878028869629, "global_step": 126991, "epoch": 1530} {"train_loss": -21.931116104125977, "global_step": 126992, "epoch": 1530} {"train_loss": -21.499845504760742, "global_step": 126993, "epoch": 1530} {"train_loss": -22.172901153564453, "global_step": 126994, "epoch": 1530} {"train_loss": -21.949459075927734, "global_step": 126995, "epoch": 1530} {"train_loss": -22.11334800720215, "global_step": 126996, "epoch": 1530} {"train_loss": -22.158716201782227, "global_step": 126997, "epoch": 1530} {"train_loss": -22.113370895385742, "global_step": 126998, "epoch": 1530} {"train_loss": -22.632877349853516, "global_step": 126999, "epoch": 1530} {"train_loss": -22.728296279907227, "global_step": 127000, "epoch": 1530} {"train_loss": -22.37397575378418, "global_step": 127001, "epoch": 1530} {"train_loss": -22.395008087158203, "global_step": 127002, "epoch": 1530} {"train_loss": -22.026830673217773, "global_step": 127003, "epoch": 1530} {"train_loss": -22.39594841003418, "global_step": 127004, "epoch": 1530} {"train_loss": -22.375293731689453, "global_step": 127005, "epoch": 1530} {"train_loss": -22.320602416992188, "global_step": 127006, "epoch": 1530} {"train_loss": -22.979442596435547, "global_step": 127007, "epoch": 1530} {"train_loss": -22.286169052124023, "global_step": 127008, "epoch": 1530} {"train_loss": -22.367712020874023, "global_step": 127009, "epoch": 1530} {"train_loss": -22.351221084594727, "global_step": 127010, "epoch": 1530} {"train_loss": -22.306188583374023, "global_step": 127011, "epoch": 1530} {"train_loss": -22.631378173828125, "global_step": 127012, "epoch": 1530} {"train_loss": -22.858642578125, "global_step": 127013, "epoch": 1530} {"train_loss": -22.781173706054688, "global_step": 127014, "epoch": 1530} {"train_loss": -22.387537002563477, "global_step": 127015, "epoch": 1530} {"train_loss": -22.633689880371094, "global_step": 127016, "epoch": 1530} {"train_loss": -22.895183563232422, "global_step": 127017, "epoch": 1530} {"train_loss": -22.544042587280273, "global_step": 127018, "epoch": 1530} {"train_loss": -23.009885787963867, "global_step": 127019, "epoch": 1530} {"train_loss": -23.051116943359375, "global_step": 127020, "epoch": 1530} {"train_loss": -22.712610244750977, "global_step": 127021, "epoch": 1530} {"train_loss": -23.076583862304688, "global_step": 127022, "epoch": 1530} {"train_loss": -22.750783920288086, "global_step": 127023, "epoch": 1530} {"train_loss": -22.708444595336914, "global_step": 127024, "epoch": 1530} {"train_loss": -22.468807220458984, "global_step": 127025, "epoch": 1530} {"train_loss": -22.779333114624023, "global_step": 127026, "epoch": 1530} {"train_loss": -22.806495666503906, "global_step": 127027, "epoch": 1530} {"train_loss": -22.695722579956055, "global_step": 127028, "epoch": 1530} {"train_loss": -22.95549964904785, "global_step": 127029, "epoch": 1530} {"train_loss": -23.023279190063477, "global_step": 127030, "epoch": 1530} {"train_loss": -22.78828239440918, "global_step": 127031, "epoch": 1530} {"train_loss": -22.239439010620117, "global_step": 127032, "epoch": 1530} {"train_loss": -22.510459899902344, "global_step": 127033, "epoch": 1530} {"train_loss": -23.11005210876465, "global_step": 127034, "epoch": 1530} {"train_loss": -22.659738540649414, "global_step": 127035, "epoch": 1530} {"train_loss": -22.676023483276367, "global_step": 127036, "epoch": 1530} {"train_loss": -22.657785415649414, "global_step": 127037, "epoch": 1530} {"train_loss": -22.8622989654541, "global_step": 127038, "epoch": 1530} {"train_loss": -22.473831176757812, "global_step": 127039, "epoch": 1530} {"train_loss": -22.61037254333496, "global_step": 127040, "epoch": 1530} {"train_loss": -22.548858642578125, "global_step": 127041, "epoch": 1530} {"train_loss": -22.43586540222168, "global_step": 127042, "epoch": 1530} {"train_loss": -22.58296775817871, "global_step": 127043, "epoch": 1530} {"train_loss": -22.7127742767334, "global_step": 127044, "epoch": 1530} {"train_loss": -22.29049301147461, "global_step": 127045, "epoch": 1530} {"train_loss": -22.100788116455078, "global_step": 127046, "epoch": 1530} {"train_loss": -22.410053253173828, "global_step": 127047, "epoch": 1530} {"train_loss": -22.453113555908203, "global_step": 127048, "epoch": 1530} {"train_loss": -22.633960723876953, "global_step": 127049, "epoch": 1530} {"train_loss": -23.0926456451416, "global_step": 127050, "epoch": 1530} {"train_loss": -22.29169273376465, "global_step": 127051, "epoch": 1530} {"train_loss": -22.205869674682617, "global_step": 127052, "epoch": 1530} {"train_loss": -23.033761978149414, "global_step": 127053, "epoch": 1530} {"train_loss": -22.352582931518555, "global_step": 127054, "epoch": 1530} {"train_loss": -22.377090454101562, "global_step": 127055, "epoch": 1530} {"train_loss": -22.89314079284668, "global_step": 127056, "epoch": 1530} {"train_loss": -22.604183197021484, "global_step": 127057, "epoch": 1530} {"train_loss": -22.47443199157715, "global_step": 127058, "epoch": 1530} {"train_loss": -22.61517906188965, "global_step": 127059, "epoch": 1530} {"train_loss": -22.47321128845215, "global_step": 127060, "epoch": 1530} {"train_loss": -22.902822494506836, "global_step": 127061, "epoch": 1530} {"train_loss": -22.938486099243164, "global_step": 127062, "epoch": 1530} {"train_loss": -22.71410369873047, "global_step": 127063, "epoch": 1530} {"train_loss": -22.612836837768555, "global_step": 127064, "epoch": 1530} {"train_loss": -22.925539016723633, "global_step": 127065, "epoch": 1530} {"train_loss": -22.742069244384766, "global_step": 127066, "epoch": 1530} {"train_loss": -22.655073165893555, "global_step": 127067, "epoch": 1530} {"train_loss": -22.43824577331543, "global_step": 127068, "epoch": 1530} {"train_loss": -22.861326217651367, "global_step": 127069, "epoch": 1530} {"train_loss": -22.75641441345215, "global_step": 127070, "epoch": 1530} {"train_loss": -22.614582061767578, "global_step": 127071, "epoch": 1530} {"train_loss": -22.556851950036474, "global_step": 127072, "epoch": 1530, "val_loss": 6265774.0} {"train_loss": -22.505029678344727, "global_step": 127073, "epoch": 1531} {"train_loss": -22.47848892211914, "global_step": 127074, "epoch": 1531} {"train_loss": -22.636268615722656, "global_step": 127075, "epoch": 1531} {"train_loss": -22.142215728759766, "global_step": 127076, "epoch": 1531} {"train_loss": -22.17057228088379, "global_step": 127077, "epoch": 1531} {"train_loss": -22.616247177124023, "global_step": 127078, "epoch": 1531} {"train_loss": -22.531888961791992, "global_step": 127079, "epoch": 1531} {"train_loss": -22.78670310974121, "global_step": 127080, "epoch": 1531} {"train_loss": -22.543954849243164, "global_step": 127081, "epoch": 1531} {"train_loss": -22.472097396850586, "global_step": 127082, "epoch": 1531} {"train_loss": -22.196203231811523, "global_step": 127083, "epoch": 1531} {"train_loss": -22.475013732910156, "global_step": 127084, "epoch": 1531} {"train_loss": -22.536422729492188, "global_step": 127085, "epoch": 1531} {"train_loss": -22.55739402770996, "global_step": 127086, "epoch": 1531} {"train_loss": -22.322429656982422, "global_step": 127087, "epoch": 1531} {"train_loss": -22.601972579956055, "global_step": 127088, "epoch": 1531} {"train_loss": -22.4890079498291, "global_step": 127089, "epoch": 1531} {"train_loss": -22.80350685119629, "global_step": 127090, "epoch": 1531} {"train_loss": -22.85651206970215, "global_step": 127091, "epoch": 1531} {"train_loss": -22.354185104370117, "global_step": 127092, "epoch": 1531} {"train_loss": -22.660663604736328, "global_step": 127093, "epoch": 1531} {"train_loss": -23.104063034057617, "global_step": 127094, "epoch": 1531} {"train_loss": -22.523855209350586, "global_step": 127095, "epoch": 1531} {"train_loss": -22.5674991607666, "global_step": 127096, "epoch": 1531} {"train_loss": -22.86138916015625, "global_step": 127097, "epoch": 1531} {"train_loss": -22.784955978393555, "global_step": 127098, "epoch": 1531} {"train_loss": -22.615036010742188, "global_step": 127099, "epoch": 1531} {"train_loss": -22.713714599609375, "global_step": 127100, "epoch": 1531} {"train_loss": -22.5394344329834, "global_step": 127101, "epoch": 1531} {"train_loss": -22.809141159057617, "global_step": 127102, "epoch": 1531} {"train_loss": -22.792455673217773, "global_step": 127103, "epoch": 1531} {"train_loss": -22.71882438659668, "global_step": 127104, "epoch": 1531} {"train_loss": -22.63370704650879, "global_step": 127105, "epoch": 1531} {"train_loss": -22.588735580444336, "global_step": 127106, "epoch": 1531} {"train_loss": -22.85945701599121, "global_step": 127107, "epoch": 1531} {"train_loss": -22.696027755737305, "global_step": 127108, "epoch": 1531} {"train_loss": -22.766210556030273, "global_step": 127109, "epoch": 1531} {"train_loss": -22.765363693237305, "global_step": 127110, "epoch": 1531} {"train_loss": -22.735641479492188, "global_step": 127111, "epoch": 1531} {"train_loss": -23.051822662353516, "global_step": 127112, "epoch": 1531} {"train_loss": -22.396194458007812, "global_step": 127113, "epoch": 1531} {"train_loss": -22.831588745117188, "global_step": 127114, "epoch": 1531} {"train_loss": -23.09197425842285, "global_step": 127115, "epoch": 1531} {"train_loss": -23.014602661132812, "global_step": 127116, "epoch": 1531} {"train_loss": -22.82984733581543, "global_step": 127117, "epoch": 1531} {"train_loss": -22.832077026367188, "global_step": 127118, "epoch": 1531} {"train_loss": -22.564437866210938, "global_step": 127119, "epoch": 1531} {"train_loss": -22.941890716552734, "global_step": 127120, "epoch": 1531} {"train_loss": -23.056507110595703, "global_step": 127121, "epoch": 1531} {"train_loss": -22.505199432373047, "global_step": 127122, "epoch": 1531} {"train_loss": -22.598325729370117, "global_step": 127123, "epoch": 1531} {"train_loss": -22.675161361694336, "global_step": 127124, "epoch": 1531} {"train_loss": -22.815147399902344, "global_step": 127125, "epoch": 1531} {"train_loss": -22.89857292175293, "global_step": 127126, "epoch": 1531} {"train_loss": -22.878183364868164, "global_step": 127127, "epoch": 1531} {"train_loss": -22.937650680541992, "global_step": 127128, "epoch": 1531} {"train_loss": -22.70953941345215, "global_step": 127129, "epoch": 1531} {"train_loss": -22.45198631286621, "global_step": 127130, "epoch": 1531} {"train_loss": -22.215238571166992, "global_step": 127131, "epoch": 1531} {"train_loss": -22.182775497436523, "global_step": 127132, "epoch": 1531} {"train_loss": -22.903518676757812, "global_step": 127133, "epoch": 1531} {"train_loss": -22.621912002563477, "global_step": 127134, "epoch": 1531} {"train_loss": -22.834518432617188, "global_step": 127135, "epoch": 1531} {"train_loss": -22.526872634887695, "global_step": 127136, "epoch": 1531} {"train_loss": -22.24861717224121, "global_step": 127137, "epoch": 1531} {"train_loss": -22.720169067382812, "global_step": 127138, "epoch": 1531} {"train_loss": -22.733816146850586, "global_step": 127139, "epoch": 1531} {"train_loss": -23.152204513549805, "global_step": 127140, "epoch": 1531} {"train_loss": -22.659910202026367, "global_step": 127141, "epoch": 1531} {"train_loss": -23.159889221191406, "global_step": 127142, "epoch": 1531} {"train_loss": -22.707040786743164, "global_step": 127143, "epoch": 1531} {"train_loss": -22.73259925842285, "global_step": 127144, "epoch": 1531} {"train_loss": -22.88205337524414, "global_step": 127145, "epoch": 1531} {"train_loss": -22.66779899597168, "global_step": 127146, "epoch": 1531} {"train_loss": -23.117830276489258, "global_step": 127147, "epoch": 1531} {"train_loss": -22.87360954284668, "global_step": 127148, "epoch": 1531} {"train_loss": -22.96896743774414, "global_step": 127149, "epoch": 1531} {"train_loss": -22.944686889648438, "global_step": 127150, "epoch": 1531} {"train_loss": -22.730459213256836, "global_step": 127151, "epoch": 1531} {"train_loss": -22.416091918945312, "global_step": 127152, "epoch": 1531} {"train_loss": -22.592594146728516, "global_step": 127153, "epoch": 1531} {"train_loss": -23.047449111938477, "global_step": 127154, "epoch": 1531} {"train_loss": -22.67710081353245, "global_step": 127155, "epoch": 1531, "val_loss": 6212804.0} {"train_loss": -21.82120132446289, "global_step": 127156, "epoch": 1532} {"train_loss": -22.45768165588379, "global_step": 127157, "epoch": 1532} {"train_loss": -22.680072784423828, "global_step": 127158, "epoch": 1532} {"train_loss": -22.08504295349121, "global_step": 127159, "epoch": 1532} {"train_loss": -21.74142074584961, "global_step": 127160, "epoch": 1532} {"train_loss": -22.168058395385742, "global_step": 127161, "epoch": 1532} {"train_loss": -22.675655364990234, "global_step": 127162, "epoch": 1532} {"train_loss": -22.23885726928711, "global_step": 127163, "epoch": 1532} {"train_loss": -22.43760108947754, "global_step": 127164, "epoch": 1532} {"train_loss": -22.61940574645996, "global_step": 127165, "epoch": 1532} {"train_loss": -22.159656524658203, "global_step": 127166, "epoch": 1532} {"train_loss": -22.716527938842773, "global_step": 127167, "epoch": 1532} {"train_loss": -22.516040802001953, "global_step": 127168, "epoch": 1532} {"train_loss": -22.2113094329834, "global_step": 127169, "epoch": 1532} {"train_loss": -22.932828903198242, "global_step": 127170, "epoch": 1532} {"train_loss": -22.48142433166504, "global_step": 127171, "epoch": 1532} {"train_loss": -22.429325103759766, "global_step": 127172, "epoch": 1532} {"train_loss": -22.775136947631836, "global_step": 127173, "epoch": 1532} {"train_loss": -22.371612548828125, "global_step": 127174, "epoch": 1532} {"train_loss": -22.668737411499023, "global_step": 127175, "epoch": 1532} {"train_loss": -22.526723861694336, "global_step": 127176, "epoch": 1532} {"train_loss": -22.903762817382812, "global_step": 127177, "epoch": 1532} {"train_loss": -22.22554588317871, "global_step": 127178, "epoch": 1532} {"train_loss": -22.46681785583496, "global_step": 127179, "epoch": 1532} {"train_loss": -22.259363174438477, "global_step": 127180, "epoch": 1532} {"train_loss": -22.104352951049805, "global_step": 127181, "epoch": 1532} {"train_loss": -22.663238525390625, "global_step": 127182, "epoch": 1532} {"train_loss": -22.48396873474121, "global_step": 127183, "epoch": 1532} {"train_loss": -22.182559967041016, "global_step": 127184, "epoch": 1532} {"train_loss": -22.426477432250977, "global_step": 127185, "epoch": 1532} {"train_loss": -22.63411521911621, "global_step": 127186, "epoch": 1532} {"train_loss": -22.94642448425293, "global_step": 127187, "epoch": 1532} {"train_loss": -23.04483985900879, "global_step": 127188, "epoch": 1532} {"train_loss": -22.64772605895996, "global_step": 127189, "epoch": 1532} {"train_loss": -22.44766616821289, "global_step": 127190, "epoch": 1532} {"train_loss": -22.982173919677734, "global_step": 127191, "epoch": 1532} {"train_loss": -22.882001876831055, "global_step": 127192, "epoch": 1532} {"train_loss": -22.64579200744629, "global_step": 127193, "epoch": 1532} {"train_loss": -22.421579360961914, "global_step": 127194, "epoch": 1532} {"train_loss": -22.436569213867188, "global_step": 127195, "epoch": 1532} {"train_loss": -22.81430435180664, "global_step": 127196, "epoch": 1532} {"train_loss": -22.678848266601562, "global_step": 127197, "epoch": 1532} {"train_loss": -22.74921989440918, "global_step": 127198, "epoch": 1532} {"train_loss": -22.763269424438477, "global_step": 127199, "epoch": 1532} {"train_loss": -23.02927589416504, "global_step": 127200, "epoch": 1532} {"train_loss": -22.741731643676758, "global_step": 127201, "epoch": 1532} {"train_loss": -22.555021286010742, "global_step": 127202, "epoch": 1532} {"train_loss": -22.449018478393555, "global_step": 127203, "epoch": 1532} {"train_loss": -22.980382919311523, "global_step": 127204, "epoch": 1532} {"train_loss": -22.408910751342773, "global_step": 127205, "epoch": 1532} {"train_loss": -22.793737411499023, "global_step": 127206, "epoch": 1532} {"train_loss": -22.622135162353516, "global_step": 127207, "epoch": 1532} {"train_loss": -22.6690731048584, "global_step": 127208, "epoch": 1532} {"train_loss": -23.17154884338379, "global_step": 127209, "epoch": 1532} {"train_loss": -22.79229164123535, "global_step": 127210, "epoch": 1532} {"train_loss": -22.97334861755371, "global_step": 127211, "epoch": 1532} {"train_loss": -22.56392478942871, "global_step": 127212, "epoch": 1532} {"train_loss": -22.69106101989746, "global_step": 127213, "epoch": 1532} {"train_loss": -22.741701126098633, "global_step": 127214, "epoch": 1532} {"train_loss": -23.007028579711914, "global_step": 127215, "epoch": 1532} {"train_loss": -22.887746810913086, "global_step": 127216, "epoch": 1532} {"train_loss": -22.527265548706055, "global_step": 127217, "epoch": 1532} {"train_loss": -22.469501495361328, "global_step": 127218, "epoch": 1532} {"train_loss": -22.4882869720459, "global_step": 127219, "epoch": 1532} {"train_loss": -22.749027252197266, "global_step": 127220, "epoch": 1532} {"train_loss": -23.11196517944336, "global_step": 127221, "epoch": 1532} {"train_loss": -22.386734008789062, "global_step": 127222, "epoch": 1532} {"train_loss": -22.689212799072266, "global_step": 127223, "epoch": 1532} {"train_loss": -22.91884422302246, "global_step": 127224, "epoch": 1532} {"train_loss": -22.263906478881836, "global_step": 127225, "epoch": 1532} {"train_loss": -22.752056121826172, "global_step": 127226, "epoch": 1532} {"train_loss": -22.7362003326416, "global_step": 127227, "epoch": 1532} {"train_loss": -22.864431381225586, "global_step": 127228, "epoch": 1532} {"train_loss": -22.36673927307129, "global_step": 127229, "epoch": 1532} {"train_loss": -22.759563446044922, "global_step": 127230, "epoch": 1532} {"train_loss": -22.8646297454834, "global_step": 127231, "epoch": 1532} {"train_loss": -22.55536651611328, "global_step": 127232, "epoch": 1532} {"train_loss": -22.527103424072266, "global_step": 127233, "epoch": 1532} {"train_loss": -22.67930030822754, "global_step": 127234, "epoch": 1532} {"train_loss": -22.922016143798828, "global_step": 127235, "epoch": 1532} {"train_loss": -22.756113052368164, "global_step": 127236, "epoch": 1532} {"train_loss": -22.364294052124023, "global_step": 127237, "epoch": 1532} {"train_loss": -22.617476819509484, "global_step": 127238, "epoch": 1532, "val_loss": 6160503.0} {"train_loss": -21.72113037109375, "global_step": 127239, "epoch": 1533} {"train_loss": -21.580671310424805, "global_step": 127240, "epoch": 1533} {"train_loss": -21.797157287597656, "global_step": 127241, "epoch": 1533} {"train_loss": -22.292211532592773, "global_step": 127242, "epoch": 1533} {"train_loss": -21.830305099487305, "global_step": 127243, "epoch": 1533} {"train_loss": -22.190170288085938, "global_step": 127244, "epoch": 1533} {"train_loss": -21.861743927001953, "global_step": 127245, "epoch": 1533} {"train_loss": -21.68985939025879, "global_step": 127246, "epoch": 1533} {"train_loss": -22.463825225830078, "global_step": 127247, "epoch": 1533} {"train_loss": -22.057151794433594, "global_step": 127248, "epoch": 1533} {"train_loss": -21.727941513061523, "global_step": 127249, "epoch": 1533} {"train_loss": -22.01515769958496, "global_step": 127250, "epoch": 1533} {"train_loss": -22.61979866027832, "global_step": 127251, "epoch": 1533} {"train_loss": -22.095752716064453, "global_step": 127252, "epoch": 1533} {"train_loss": -22.385746002197266, "global_step": 127253, "epoch": 1533} {"train_loss": -22.37763023376465, "global_step": 127254, "epoch": 1533} {"train_loss": -22.109363555908203, "global_step": 127255, "epoch": 1533} {"train_loss": -22.682334899902344, "global_step": 127256, "epoch": 1533} {"train_loss": -22.655736923217773, "global_step": 127257, "epoch": 1533} {"train_loss": -22.551490783691406, "global_step": 127258, "epoch": 1533} {"train_loss": -22.089256286621094, "global_step": 127259, "epoch": 1533} {"train_loss": -22.185195922851562, "global_step": 127260, "epoch": 1533} {"train_loss": -22.710695266723633, "global_step": 127261, "epoch": 1533} {"train_loss": -22.3245849609375, "global_step": 127262, "epoch": 1533} {"train_loss": -22.631986618041992, "global_step": 127263, "epoch": 1533} {"train_loss": -22.83084487915039, "global_step": 127264, "epoch": 1533} {"train_loss": -22.54288673400879, "global_step": 127265, "epoch": 1533} {"train_loss": -22.716110229492188, "global_step": 127266, "epoch": 1533} {"train_loss": -22.65519142150879, "global_step": 127267, "epoch": 1533} {"train_loss": -22.744062423706055, "global_step": 127268, "epoch": 1533} {"train_loss": -22.616436004638672, "global_step": 127269, "epoch": 1533} {"train_loss": -22.437923431396484, "global_step": 127270, "epoch": 1533} {"train_loss": -22.523210525512695, "global_step": 127271, "epoch": 1533} {"train_loss": -22.63869285583496, "global_step": 127272, "epoch": 1533} {"train_loss": -22.820358276367188, "global_step": 127273, "epoch": 1533} {"train_loss": -23.06509780883789, "global_step": 127274, "epoch": 1533} {"train_loss": -22.572805404663086, "global_step": 127275, "epoch": 1533} {"train_loss": -22.941614151000977, "global_step": 127276, "epoch": 1533} {"train_loss": -22.466989517211914, "global_step": 127277, "epoch": 1533} {"train_loss": -22.6903018951416, "global_step": 127278, "epoch": 1533} {"train_loss": -22.76205062866211, "global_step": 127279, "epoch": 1533} {"train_loss": -22.887338638305664, "global_step": 127280, "epoch": 1533} {"train_loss": -22.401113510131836, "global_step": 127281, "epoch": 1533} {"train_loss": -22.931421279907227, "global_step": 127282, "epoch": 1533} {"train_loss": -22.7496395111084, "global_step": 127283, "epoch": 1533} {"train_loss": -22.7589168548584, "global_step": 127284, "epoch": 1533} {"train_loss": -22.683958053588867, "global_step": 127285, "epoch": 1533} {"train_loss": -23.13382339477539, "global_step": 127286, "epoch": 1533} {"train_loss": -23.170927047729492, "global_step": 127287, "epoch": 1533} {"train_loss": -22.401260375976562, "global_step": 127288, "epoch": 1533} {"train_loss": -23.046762466430664, "global_step": 127289, "epoch": 1533} {"train_loss": -22.743730545043945, "global_step": 127290, "epoch": 1533} {"train_loss": -23.13970375061035, "global_step": 127291, "epoch": 1533} {"train_loss": -22.765487670898438, "global_step": 127292, "epoch": 1533} {"train_loss": -22.970840454101562, "global_step": 127293, "epoch": 1533} {"train_loss": -22.705345153808594, "global_step": 127294, "epoch": 1533} {"train_loss": -22.673847198486328, "global_step": 127295, "epoch": 1533} {"train_loss": -22.937625885009766, "global_step": 127296, "epoch": 1533} {"train_loss": -22.83663558959961, "global_step": 127297, "epoch": 1533} {"train_loss": -22.40480613708496, "global_step": 127298, "epoch": 1533} {"train_loss": -22.73805809020996, "global_step": 127299, "epoch": 1533} {"train_loss": -22.806737899780273, "global_step": 127300, "epoch": 1533} {"train_loss": -22.98516845703125, "global_step": 127301, "epoch": 1533} {"train_loss": -22.957324981689453, "global_step": 127302, "epoch": 1533} {"train_loss": -22.824670791625977, "global_step": 127303, "epoch": 1533} {"train_loss": -22.767017364501953, "global_step": 127304, "epoch": 1533} {"train_loss": -22.64512062072754, "global_step": 127305, "epoch": 1533} {"train_loss": -22.830669403076172, "global_step": 127306, "epoch": 1533} {"train_loss": -22.709918975830078, "global_step": 127307, "epoch": 1533} {"train_loss": -22.893171310424805, "global_step": 127308, "epoch": 1533} {"train_loss": -22.481491088867188, "global_step": 127309, "epoch": 1533} {"train_loss": -22.86759376525879, "global_step": 127310, "epoch": 1533} {"train_loss": -22.809614181518555, "global_step": 127311, "epoch": 1533} {"train_loss": -22.65455436706543, "global_step": 127312, "epoch": 1533} {"train_loss": -22.867141723632812, "global_step": 127313, "epoch": 1533} {"train_loss": -22.884958267211914, "global_step": 127314, "epoch": 1533} {"train_loss": -22.49947166442871, "global_step": 127315, "epoch": 1533} {"train_loss": -22.458999633789062, "global_step": 127316, "epoch": 1533} {"train_loss": -22.70377540588379, "global_step": 127317, "epoch": 1533} {"train_loss": -22.497594833374023, "global_step": 127318, "epoch": 1533} {"train_loss": -22.761798858642578, "global_step": 127319, "epoch": 1533} {"train_loss": -22.65378189086914, "global_step": 127320, "epoch": 1533} {"train_loss": -22.585880624242577, "global_step": 127321, "epoch": 1533, "val_loss": 6184495.0} {"train_loss": -22.378211975097656, "global_step": 127322, "epoch": 1534} {"train_loss": -21.227325439453125, "global_step": 127323, "epoch": 1534} {"train_loss": -22.233999252319336, "global_step": 127324, "epoch": 1534} {"train_loss": -22.35590171813965, "global_step": 127325, "epoch": 1534} {"train_loss": -21.60928726196289, "global_step": 127326, "epoch": 1534} {"train_loss": -21.88913345336914, "global_step": 127327, "epoch": 1534} {"train_loss": -21.920166015625, "global_step": 127328, "epoch": 1534} {"train_loss": -22.193918228149414, "global_step": 127329, "epoch": 1534} {"train_loss": -22.13323974609375, "global_step": 127330, "epoch": 1534} {"train_loss": -22.25959587097168, "global_step": 127331, "epoch": 1534} {"train_loss": -22.00995445251465, "global_step": 127332, "epoch": 1534} {"train_loss": -22.25967025756836, "global_step": 127333, "epoch": 1534} {"train_loss": -22.146175384521484, "global_step": 127334, "epoch": 1534} {"train_loss": -22.520410537719727, "global_step": 127335, "epoch": 1534} {"train_loss": -22.216995239257812, "global_step": 127336, "epoch": 1534} {"train_loss": -22.231000900268555, "global_step": 127337, "epoch": 1534} {"train_loss": -22.336151123046875, "global_step": 127338, "epoch": 1534} {"train_loss": -22.77596664428711, "global_step": 127339, "epoch": 1534} {"train_loss": -22.292158126831055, "global_step": 127340, "epoch": 1534} {"train_loss": -22.265338897705078, "global_step": 127341, "epoch": 1534} {"train_loss": -22.27167320251465, "global_step": 127342, "epoch": 1534} {"train_loss": -22.53716468811035, "global_step": 127343, "epoch": 1534} {"train_loss": -22.332706451416016, "global_step": 127344, "epoch": 1534} {"train_loss": -22.323713302612305, "global_step": 127345, "epoch": 1534} {"train_loss": -22.924436569213867, "global_step": 127346, "epoch": 1534} {"train_loss": -22.65118980407715, "global_step": 127347, "epoch": 1534} {"train_loss": -22.370038986206055, "global_step": 127348, "epoch": 1534} {"train_loss": -22.685550689697266, "global_step": 127349, "epoch": 1534} {"train_loss": -22.463058471679688, "global_step": 127350, "epoch": 1534} {"train_loss": -22.44888687133789, "global_step": 127351, "epoch": 1534} {"train_loss": -23.34248161315918, "global_step": 127352, "epoch": 1534} {"train_loss": -22.47591209411621, "global_step": 127353, "epoch": 1534} {"train_loss": -22.673789978027344, "global_step": 127354, "epoch": 1534} {"train_loss": -22.86989974975586, "global_step": 127355, "epoch": 1534} {"train_loss": -22.650659561157227, "global_step": 127356, "epoch": 1534} {"train_loss": -23.24761199951172, "global_step": 127357, "epoch": 1534} {"train_loss": -23.01179313659668, "global_step": 127358, "epoch": 1534} {"train_loss": -22.593992233276367, "global_step": 127359, "epoch": 1534} {"train_loss": -22.644445419311523, "global_step": 127360, "epoch": 1534} {"train_loss": -23.21022605895996, "global_step": 127361, "epoch": 1534} {"train_loss": -22.96565818786621, "global_step": 127362, "epoch": 1534} {"train_loss": -22.824527740478516, "global_step": 127363, "epoch": 1534} {"train_loss": -22.477828979492188, "global_step": 127364, "epoch": 1534} {"train_loss": -22.599807739257812, "global_step": 127365, "epoch": 1534} {"train_loss": -23.23746681213379, "global_step": 127366, "epoch": 1534} {"train_loss": -22.48879051208496, "global_step": 127367, "epoch": 1534} {"train_loss": -22.59476661682129, "global_step": 127368, "epoch": 1534} {"train_loss": -22.792125701904297, "global_step": 127369, "epoch": 1534} {"train_loss": -22.769784927368164, "global_step": 127370, "epoch": 1534} {"train_loss": -22.245153427124023, "global_step": 127371, "epoch": 1534} {"train_loss": -22.95345115661621, "global_step": 127372, "epoch": 1534} {"train_loss": -22.92128562927246, "global_step": 127373, "epoch": 1534} {"train_loss": -22.956871032714844, "global_step": 127374, "epoch": 1534} {"train_loss": -22.355382919311523, "global_step": 127375, "epoch": 1534} {"train_loss": -22.656417846679688, "global_step": 127376, "epoch": 1534} {"train_loss": -22.872045516967773, "global_step": 127377, "epoch": 1534} {"train_loss": -22.9067440032959, "global_step": 127378, "epoch": 1534} {"train_loss": -22.782392501831055, "global_step": 127379, "epoch": 1534} {"train_loss": -23.033483505249023, "global_step": 127380, "epoch": 1534} {"train_loss": -22.792129516601562, "global_step": 127381, "epoch": 1534} {"train_loss": -23.14551544189453, "global_step": 127382, "epoch": 1534} {"train_loss": -22.673776626586914, "global_step": 127383, "epoch": 1534} {"train_loss": -22.544824600219727, "global_step": 127384, "epoch": 1534} {"train_loss": -23.005901336669922, "global_step": 127385, "epoch": 1534} {"train_loss": -22.995697021484375, "global_step": 127386, "epoch": 1534} {"train_loss": -22.99625015258789, "global_step": 127387, "epoch": 1534} {"train_loss": -23.22458267211914, "global_step": 127388, "epoch": 1534} {"train_loss": -22.387845993041992, "global_step": 127389, "epoch": 1534} {"train_loss": -22.850046157836914, "global_step": 127390, "epoch": 1534} {"train_loss": -23.162357330322266, "global_step": 127391, "epoch": 1534} {"train_loss": -22.950578689575195, "global_step": 127392, "epoch": 1534} {"train_loss": -22.886638641357422, "global_step": 127393, "epoch": 1534} {"train_loss": -22.79844093322754, "global_step": 127394, "epoch": 1534} {"train_loss": -22.462141036987305, "global_step": 127395, "epoch": 1534} {"train_loss": -22.734603881835938, "global_step": 127396, "epoch": 1534} {"train_loss": -22.717426300048828, "global_step": 127397, "epoch": 1534} {"train_loss": -22.567869186401367, "global_step": 127398, "epoch": 1534} {"train_loss": -22.821319580078125, "global_step": 127399, "epoch": 1534} {"train_loss": -22.893842697143555, "global_step": 127400, "epoch": 1534} {"train_loss": -22.675142288208008, "global_step": 127401, "epoch": 1534} {"train_loss": -22.640443801879883, "global_step": 127402, "epoch": 1534} {"train_loss": -22.629314422607422, "global_step": 127403, "epoch": 1534} {"train_loss": -22.589026922202972, "global_step": 127404, "epoch": 1534, "val_loss": 6387488.5} {"train_loss": -22.765127182006836, "global_step": 127405, "epoch": 1535} {"train_loss": -22.577096939086914, "global_step": 127406, "epoch": 1535} {"train_loss": -22.61594009399414, "global_step": 127407, "epoch": 1535} {"train_loss": -22.680862426757812, "global_step": 127408, "epoch": 1535} {"train_loss": -22.6390380859375, "global_step": 127409, "epoch": 1535} {"train_loss": -22.434173583984375, "global_step": 127410, "epoch": 1535} {"train_loss": -22.369129180908203, "global_step": 127411, "epoch": 1535} {"train_loss": -22.436735153198242, "global_step": 127412, "epoch": 1535} {"train_loss": -22.422510147094727, "global_step": 127413, "epoch": 1535} {"train_loss": -22.321603775024414, "global_step": 127414, "epoch": 1535} {"train_loss": -22.681798934936523, "global_step": 127415, "epoch": 1535} {"train_loss": -22.770681381225586, "global_step": 127416, "epoch": 1535} {"train_loss": -22.71058464050293, "global_step": 127417, "epoch": 1535} {"train_loss": -22.494409561157227, "global_step": 127418, "epoch": 1535} {"train_loss": -22.301176071166992, "global_step": 127419, "epoch": 1535} {"train_loss": -22.467039108276367, "global_step": 127420, "epoch": 1535} {"train_loss": -22.5308837890625, "global_step": 127421, "epoch": 1535} {"train_loss": -22.49660301208496, "global_step": 127422, "epoch": 1535} {"train_loss": -22.5540828704834, "global_step": 127423, "epoch": 1535} {"train_loss": -22.518672943115234, "global_step": 127424, "epoch": 1535} {"train_loss": -22.492673873901367, "global_step": 127425, "epoch": 1535} {"train_loss": -22.532821655273438, "global_step": 127426, "epoch": 1535} {"train_loss": -22.916372299194336, "global_step": 127427, "epoch": 1535} {"train_loss": -22.569913864135742, "global_step": 127428, "epoch": 1535} {"train_loss": -22.947385787963867, "global_step": 127429, "epoch": 1535} {"train_loss": -22.539405822753906, "global_step": 127430, "epoch": 1535} {"train_loss": -22.723440170288086, "global_step": 127431, "epoch": 1535} {"train_loss": -22.858407974243164, "global_step": 127432, "epoch": 1535} {"train_loss": -22.58662223815918, "global_step": 127433, "epoch": 1535} {"train_loss": -22.714033126831055, "global_step": 127434, "epoch": 1535} {"train_loss": -22.9372501373291, "global_step": 127435, "epoch": 1535} {"train_loss": -22.784250259399414, "global_step": 127436, "epoch": 1535} {"train_loss": -23.164159774780273, "global_step": 127437, "epoch": 1535} {"train_loss": -22.6174373626709, "global_step": 127438, "epoch": 1535} {"train_loss": -22.784656524658203, "global_step": 127439, "epoch": 1535} {"train_loss": -23.108238220214844, "global_step": 127440, "epoch": 1535} {"train_loss": -22.683340072631836, "global_step": 127441, "epoch": 1535} {"train_loss": -22.602710723876953, "global_step": 127442, "epoch": 1535} {"train_loss": -22.996091842651367, "global_step": 127443, "epoch": 1535} {"train_loss": -23.02747917175293, "global_step": 127444, "epoch": 1535} {"train_loss": -22.5999813079834, "global_step": 127445, "epoch": 1535} {"train_loss": -22.817312240600586, "global_step": 127446, "epoch": 1535} {"train_loss": -22.567291259765625, "global_step": 127447, "epoch": 1535} {"train_loss": -22.72452163696289, "global_step": 127448, "epoch": 1535} {"train_loss": -22.707904815673828, "global_step": 127449, "epoch": 1535} {"train_loss": -22.8908748626709, "global_step": 127450, "epoch": 1535} {"train_loss": -22.9105224609375, "global_step": 127451, "epoch": 1535} {"train_loss": -22.708097457885742, "global_step": 127452, "epoch": 1535} {"train_loss": -22.665185928344727, "global_step": 127453, "epoch": 1535} {"train_loss": -22.85586166381836, "global_step": 127454, "epoch": 1535} {"train_loss": -22.883544921875, "global_step": 127455, "epoch": 1535} {"train_loss": -22.585519790649414, "global_step": 127456, "epoch": 1535} {"train_loss": -23.110342025756836, "global_step": 127457, "epoch": 1535} {"train_loss": -22.8780574798584, "global_step": 127458, "epoch": 1535} {"train_loss": -23.02545738220215, "global_step": 127459, "epoch": 1535} {"train_loss": -22.669937133789062, "global_step": 127460, "epoch": 1535} {"train_loss": -22.70465087890625, "global_step": 127461, "epoch": 1535} {"train_loss": -22.651865005493164, "global_step": 127462, "epoch": 1535} {"train_loss": -22.510746002197266, "global_step": 127463, "epoch": 1535} {"train_loss": -22.738088607788086, "global_step": 127464, "epoch": 1535} {"train_loss": -22.57245635986328, "global_step": 127465, "epoch": 1535} {"train_loss": -22.996116638183594, "global_step": 127466, "epoch": 1535} {"train_loss": -22.95685386657715, "global_step": 127467, "epoch": 1535} {"train_loss": -22.59681510925293, "global_step": 127468, "epoch": 1535} {"train_loss": -22.971237182617188, "global_step": 127469, "epoch": 1535} {"train_loss": -23.123950958251953, "global_step": 127470, "epoch": 1535} {"train_loss": -23.130407333374023, "global_step": 127471, "epoch": 1535} {"train_loss": -22.9610595703125, "global_step": 127472, "epoch": 1535} {"train_loss": -22.553781509399414, "global_step": 127473, "epoch": 1535} {"train_loss": -22.897241592407227, "global_step": 127474, "epoch": 1535} {"train_loss": -22.68075180053711, "global_step": 127475, "epoch": 1535} {"train_loss": -22.767282485961914, "global_step": 127476, "epoch": 1535} {"train_loss": -22.80373191833496, "global_step": 127477, "epoch": 1535} {"train_loss": -22.80284309387207, "global_step": 127478, "epoch": 1535} {"train_loss": -22.912397384643555, "global_step": 127479, "epoch": 1535} {"train_loss": -22.607431411743164, "global_step": 127480, "epoch": 1535} {"train_loss": -22.897924423217773, "global_step": 127481, "epoch": 1535} {"train_loss": -22.495914459228516, "global_step": 127482, "epoch": 1535} {"train_loss": -22.619375228881836, "global_step": 127483, "epoch": 1535} {"train_loss": -23.08620262145996, "global_step": 127484, "epoch": 1535} {"train_loss": -22.780094146728516, "global_step": 127485, "epoch": 1535} {"train_loss": -23.114242553710938, "global_step": 127486, "epoch": 1535} {"train_loss": -22.749934805444923, "global_step": 127487, "epoch": 1535, "val_loss": 6288254.0} {"train_loss": -22.232364654541016, "global_step": 127488, "epoch": 1536} {"train_loss": -22.469167709350586, "global_step": 127489, "epoch": 1536} {"train_loss": -22.553953170776367, "global_step": 127490, "epoch": 1536} {"train_loss": -22.286211013793945, "global_step": 127491, "epoch": 1536} {"train_loss": -22.549787521362305, "global_step": 127492, "epoch": 1536} {"train_loss": -22.303110122680664, "global_step": 127493, "epoch": 1536} {"train_loss": -22.34734535217285, "global_step": 127494, "epoch": 1536} {"train_loss": -22.944181442260742, "global_step": 127495, "epoch": 1536} {"train_loss": -22.593414306640625, "global_step": 127496, "epoch": 1536} {"train_loss": -22.539752960205078, "global_step": 127497, "epoch": 1536} {"train_loss": -22.724912643432617, "global_step": 127498, "epoch": 1536} {"train_loss": -22.305601119995117, "global_step": 127499, "epoch": 1536} {"train_loss": -22.215614318847656, "global_step": 127500, "epoch": 1536} {"train_loss": -22.729814529418945, "global_step": 127501, "epoch": 1536} {"train_loss": -22.87441062927246, "global_step": 127502, "epoch": 1536} {"train_loss": -22.620019912719727, "global_step": 127503, "epoch": 1536} {"train_loss": -22.886613845825195, "global_step": 127504, "epoch": 1536} {"train_loss": -22.739633560180664, "global_step": 127505, "epoch": 1536} {"train_loss": -22.299484252929688, "global_step": 127506, "epoch": 1536} {"train_loss": -22.827787399291992, "global_step": 127507, "epoch": 1536} {"train_loss": -22.780933380126953, "global_step": 127508, "epoch": 1536} {"train_loss": -22.471393585205078, "global_step": 127509, "epoch": 1536} {"train_loss": -22.835630416870117, "global_step": 127510, "epoch": 1536} {"train_loss": -22.33391761779785, "global_step": 127511, "epoch": 1536} {"train_loss": -22.74650764465332, "global_step": 127512, "epoch": 1536} {"train_loss": -22.577634811401367, "global_step": 127513, "epoch": 1536} {"train_loss": -22.5507869720459, "global_step": 127514, "epoch": 1536} {"train_loss": -22.886377334594727, "global_step": 127515, "epoch": 1536} {"train_loss": -22.847803115844727, "global_step": 127516, "epoch": 1536} {"train_loss": -22.73502540588379, "global_step": 127517, "epoch": 1536} {"train_loss": -22.7393798828125, "global_step": 127518, "epoch": 1536} {"train_loss": -22.4112548828125, "global_step": 127519, "epoch": 1536} {"train_loss": -22.538408279418945, "global_step": 127520, "epoch": 1536} {"train_loss": -22.851978302001953, "global_step": 127521, "epoch": 1536} {"train_loss": -22.527820587158203, "global_step": 127522, "epoch": 1536} {"train_loss": -22.32119369506836, "global_step": 127523, "epoch": 1536} {"train_loss": -22.684524536132812, "global_step": 127524, "epoch": 1536} {"train_loss": -22.607419967651367, "global_step": 127525, "epoch": 1536} {"train_loss": -22.484167098999023, "global_step": 127526, "epoch": 1536} {"train_loss": -22.81403160095215, "global_step": 127527, "epoch": 1536} {"train_loss": -22.642019271850586, "global_step": 127528, "epoch": 1536} {"train_loss": -22.730772018432617, "global_step": 127529, "epoch": 1536} {"train_loss": -22.296913146972656, "global_step": 127530, "epoch": 1536} {"train_loss": -22.483734130859375, "global_step": 127531, "epoch": 1536} {"train_loss": -22.73479652404785, "global_step": 127532, "epoch": 1536} {"train_loss": -22.8331241607666, "global_step": 127533, "epoch": 1536} {"train_loss": -22.974512100219727, "global_step": 127534, "epoch": 1536} {"train_loss": -22.473167419433594, "global_step": 127535, "epoch": 1536} {"train_loss": -23.108963012695312, "global_step": 127536, "epoch": 1536} {"train_loss": -22.58277702331543, "global_step": 127537, "epoch": 1536} {"train_loss": -22.704641342163086, "global_step": 127538, "epoch": 1536} {"train_loss": -22.849592208862305, "global_step": 127539, "epoch": 1536} {"train_loss": -23.091615676879883, "global_step": 127540, "epoch": 1536} {"train_loss": -22.457904815673828, "global_step": 127541, "epoch": 1536} {"train_loss": -22.862077713012695, "global_step": 127542, "epoch": 1536} {"train_loss": -22.902986526489258, "global_step": 127543, "epoch": 1536} {"train_loss": -22.49824333190918, "global_step": 127544, "epoch": 1536} {"train_loss": -22.96140480041504, "global_step": 127545, "epoch": 1536} {"train_loss": -22.85292625427246, "global_step": 127546, "epoch": 1536} {"train_loss": -22.88680076599121, "global_step": 127547, "epoch": 1536} {"train_loss": -22.836118698120117, "global_step": 127548, "epoch": 1536} {"train_loss": -22.7189998626709, "global_step": 127549, "epoch": 1536} {"train_loss": -22.946308135986328, "global_step": 127550, "epoch": 1536} {"train_loss": -22.502506256103516, "global_step": 127551, "epoch": 1536} {"train_loss": -22.963001251220703, "global_step": 127552, "epoch": 1536} {"train_loss": -22.867321014404297, "global_step": 127553, "epoch": 1536} {"train_loss": -22.785438537597656, "global_step": 127554, "epoch": 1536} {"train_loss": -22.936866760253906, "global_step": 127555, "epoch": 1536} {"train_loss": -22.779523849487305, "global_step": 127556, "epoch": 1536} {"train_loss": -22.479047775268555, "global_step": 127557, "epoch": 1536} {"train_loss": -22.646936416625977, "global_step": 127558, "epoch": 1536} {"train_loss": -22.574182510375977, "global_step": 127559, "epoch": 1536} {"train_loss": -22.944555282592773, "global_step": 127560, "epoch": 1536} {"train_loss": -23.093826293945312, "global_step": 127561, "epoch": 1536} {"train_loss": -22.920028686523438, "global_step": 127562, "epoch": 1536} {"train_loss": -22.82573127746582, "global_step": 127563, "epoch": 1536} {"train_loss": -22.7111759185791, "global_step": 127564, "epoch": 1536} {"train_loss": -22.553478240966797, "global_step": 127565, "epoch": 1536} {"train_loss": -22.910968780517578, "global_step": 127566, "epoch": 1536} {"train_loss": -22.500587463378906, "global_step": 127567, "epoch": 1536} {"train_loss": -22.436662673950195, "global_step": 127568, "epoch": 1536} {"train_loss": -22.724836349487305, "global_step": 127569, "epoch": 1536} {"train_loss": -22.68116695909615, "global_step": 127570, "epoch": 1536, "val_loss": 6239969.0} {"train_loss": -22.133220672607422, "global_step": 127571, "epoch": 1537} {"train_loss": -21.89982032775879, "global_step": 127572, "epoch": 1537} {"train_loss": -22.324617385864258, "global_step": 127573, "epoch": 1537} {"train_loss": -22.01266860961914, "global_step": 127574, "epoch": 1537} {"train_loss": -22.163793563842773, "global_step": 127575, "epoch": 1537} {"train_loss": -22.387723922729492, "global_step": 127576, "epoch": 1537} {"train_loss": -22.069168090820312, "global_step": 127577, "epoch": 1537} {"train_loss": -22.307886123657227, "global_step": 127578, "epoch": 1537} {"train_loss": -22.491161346435547, "global_step": 127579, "epoch": 1537} {"train_loss": -22.083648681640625, "global_step": 127580, "epoch": 1537} {"train_loss": -22.486148834228516, "global_step": 127581, "epoch": 1537} {"train_loss": -22.2804012298584, "global_step": 127582, "epoch": 1537} {"train_loss": -22.344472885131836, "global_step": 127583, "epoch": 1537} {"train_loss": -22.49668312072754, "global_step": 127584, "epoch": 1537} {"train_loss": -22.272809982299805, "global_step": 127585, "epoch": 1537} {"train_loss": -22.7187442779541, "global_step": 127586, "epoch": 1537} {"train_loss": -22.686201095581055, "global_step": 127587, "epoch": 1537} {"train_loss": -22.406116485595703, "global_step": 127588, "epoch": 1537} {"train_loss": -22.3988094329834, "global_step": 127589, "epoch": 1537} {"train_loss": -22.623798370361328, "global_step": 127590, "epoch": 1537} {"train_loss": -22.399438858032227, "global_step": 127591, "epoch": 1537} {"train_loss": -22.463159561157227, "global_step": 127592, "epoch": 1537} {"train_loss": -22.60784339904785, "global_step": 127593, "epoch": 1537} {"train_loss": -22.40802001953125, "global_step": 127594, "epoch": 1537} {"train_loss": -22.606014251708984, "global_step": 127595, "epoch": 1537} {"train_loss": -22.91108512878418, "global_step": 127596, "epoch": 1537} {"train_loss": -22.505111694335938, "global_step": 127597, "epoch": 1537} {"train_loss": -22.851268768310547, "global_step": 127598, "epoch": 1537} {"train_loss": -22.954999923706055, "global_step": 127599, "epoch": 1537} {"train_loss": -22.825803756713867, "global_step": 127600, "epoch": 1537} {"train_loss": -22.79933738708496, "global_step": 127601, "epoch": 1537} {"train_loss": -22.854969024658203, "global_step": 127602, "epoch": 1537} {"train_loss": -22.43248748779297, "global_step": 127603, "epoch": 1537} {"train_loss": -22.841934204101562, "global_step": 127604, "epoch": 1537} {"train_loss": -22.385910034179688, "global_step": 127605, "epoch": 1537} {"train_loss": -22.5245361328125, "global_step": 127606, "epoch": 1537} {"train_loss": -22.97181510925293, "global_step": 127607, "epoch": 1537} {"train_loss": -22.303075790405273, "global_step": 127608, "epoch": 1537} {"train_loss": -22.787029266357422, "global_step": 127609, "epoch": 1537} {"train_loss": -22.95188331604004, "global_step": 127610, "epoch": 1537} {"train_loss": -22.337656021118164, "global_step": 127611, "epoch": 1537} {"train_loss": -23.030202865600586, "global_step": 127612, "epoch": 1537} {"train_loss": -22.8548583984375, "global_step": 127613, "epoch": 1537} {"train_loss": -22.719514846801758, "global_step": 127614, "epoch": 1537} {"train_loss": -22.449872970581055, "global_step": 127615, "epoch": 1537} {"train_loss": -22.838119506835938, "global_step": 127616, "epoch": 1537} {"train_loss": -22.774089813232422, "global_step": 127617, "epoch": 1537} {"train_loss": -22.65787124633789, "global_step": 127618, "epoch": 1537} {"train_loss": -22.4643497467041, "global_step": 127619, "epoch": 1537} {"train_loss": -22.47113037109375, "global_step": 127620, "epoch": 1537} {"train_loss": -22.34877586364746, "global_step": 127621, "epoch": 1537} {"train_loss": -22.6476993560791, "global_step": 127622, "epoch": 1537} {"train_loss": -22.921621322631836, "global_step": 127623, "epoch": 1537} {"train_loss": -22.701162338256836, "global_step": 127624, "epoch": 1537} {"train_loss": -22.394140243530273, "global_step": 127625, "epoch": 1537} {"train_loss": -22.435510635375977, "global_step": 127626, "epoch": 1537} {"train_loss": -22.12941551208496, "global_step": 127627, "epoch": 1537} {"train_loss": -22.285526275634766, "global_step": 127628, "epoch": 1537} {"train_loss": -22.704191207885742, "global_step": 127629, "epoch": 1537} {"train_loss": -22.084497451782227, "global_step": 127630, "epoch": 1537} {"train_loss": -22.43939781188965, "global_step": 127631, "epoch": 1537} {"train_loss": -22.62065315246582, "global_step": 127632, "epoch": 1537} {"train_loss": -22.604541778564453, "global_step": 127633, "epoch": 1537} {"train_loss": -22.391271591186523, "global_step": 127634, "epoch": 1537} {"train_loss": -22.525028228759766, "global_step": 127635, "epoch": 1537} {"train_loss": -22.8914852142334, "global_step": 127636, "epoch": 1537} {"train_loss": -22.845640182495117, "global_step": 127637, "epoch": 1537} {"train_loss": -22.741870880126953, "global_step": 127638, "epoch": 1537} {"train_loss": -22.913726806640625, "global_step": 127639, "epoch": 1537} {"train_loss": -23.125638961791992, "global_step": 127640, "epoch": 1537} {"train_loss": -22.83831787109375, "global_step": 127641, "epoch": 1537} {"train_loss": -22.441747665405273, "global_step": 127642, "epoch": 1537} {"train_loss": -22.441165924072266, "global_step": 127643, "epoch": 1537} {"train_loss": -22.929214477539062, "global_step": 127644, "epoch": 1537} {"train_loss": -22.84029769897461, "global_step": 127645, "epoch": 1537} {"train_loss": -22.4757022857666, "global_step": 127646, "epoch": 1537} {"train_loss": -23.14004898071289, "global_step": 127647, "epoch": 1537} {"train_loss": -22.626569747924805, "global_step": 127648, "epoch": 1537} {"train_loss": -22.9541072845459, "global_step": 127649, "epoch": 1537} {"train_loss": -22.964248657226562, "global_step": 127650, "epoch": 1537} {"train_loss": -22.742895126342773, "global_step": 127651, "epoch": 1537} {"train_loss": -22.8731632232666, "global_step": 127652, "epoch": 1537} {"train_loss": -22.59016891847174, "global_step": 127653, "epoch": 1537, "val_loss": 6488892.0} {"train_loss": -21.43024444580078, "global_step": 127654, "epoch": 1538} {"train_loss": -21.99639320373535, "global_step": 127655, "epoch": 1538} {"train_loss": -21.62324333190918, "global_step": 127656, "epoch": 1538} {"train_loss": -22.129682540893555, "global_step": 127657, "epoch": 1538} {"train_loss": -21.690719604492188, "global_step": 127658, "epoch": 1538} {"train_loss": -21.781269073486328, "global_step": 127659, "epoch": 1538} {"train_loss": -22.041406631469727, "global_step": 127660, "epoch": 1538} {"train_loss": -21.938400268554688, "global_step": 127661, "epoch": 1538} {"train_loss": -22.256811141967773, "global_step": 127662, "epoch": 1538} {"train_loss": -22.085424423217773, "global_step": 127663, "epoch": 1538} {"train_loss": -21.92498779296875, "global_step": 127664, "epoch": 1538} {"train_loss": -21.80049705505371, "global_step": 127665, "epoch": 1538} {"train_loss": -22.09117317199707, "global_step": 127666, "epoch": 1538} {"train_loss": -22.1203670501709, "global_step": 127667, "epoch": 1538} {"train_loss": -21.9464054107666, "global_step": 127668, "epoch": 1538} {"train_loss": -22.346662521362305, "global_step": 127669, "epoch": 1538} {"train_loss": -22.242582321166992, "global_step": 127670, "epoch": 1538} {"train_loss": -22.092201232910156, "global_step": 127671, "epoch": 1538} {"train_loss": -22.275558471679688, "global_step": 127672, "epoch": 1538} {"train_loss": -22.230472564697266, "global_step": 127673, "epoch": 1538} {"train_loss": -22.202512741088867, "global_step": 127674, "epoch": 1538} {"train_loss": -22.46058464050293, "global_step": 127675, "epoch": 1538} {"train_loss": -22.714109420776367, "global_step": 127676, "epoch": 1538} {"train_loss": -22.792003631591797, "global_step": 127677, "epoch": 1538} {"train_loss": -22.680723190307617, "global_step": 127678, "epoch": 1538} {"train_loss": -22.540002822875977, "global_step": 127679, "epoch": 1538} {"train_loss": -22.42235565185547, "global_step": 127680, "epoch": 1538} {"train_loss": -22.816028594970703, "global_step": 127681, "epoch": 1538} {"train_loss": -22.808279037475586, "global_step": 127682, "epoch": 1538} {"train_loss": -22.62103271484375, "global_step": 127683, "epoch": 1538} {"train_loss": -22.70992088317871, "global_step": 127684, "epoch": 1538} {"train_loss": -22.819459915161133, "global_step": 127685, "epoch": 1538} {"train_loss": -23.199193954467773, "global_step": 127686, "epoch": 1538} {"train_loss": -22.600793838500977, "global_step": 127687, "epoch": 1538} {"train_loss": -22.406644821166992, "global_step": 127688, "epoch": 1538} {"train_loss": -22.794166564941406, "global_step": 127689, "epoch": 1538} {"train_loss": -22.56532859802246, "global_step": 127690, "epoch": 1538} {"train_loss": -22.42943000793457, "global_step": 127691, "epoch": 1538} {"train_loss": -22.480884552001953, "global_step": 127692, "epoch": 1538} {"train_loss": -22.530790328979492, "global_step": 127693, "epoch": 1538} {"train_loss": -22.79229736328125, "global_step": 127694, "epoch": 1538} {"train_loss": -22.969762802124023, "global_step": 127695, "epoch": 1538} {"train_loss": -22.910648345947266, "global_step": 127696, "epoch": 1538} {"train_loss": -22.721040725708008, "global_step": 127697, "epoch": 1538} {"train_loss": -22.66009521484375, "global_step": 127698, "epoch": 1538} {"train_loss": -22.26688003540039, "global_step": 127699, "epoch": 1538} {"train_loss": -22.95944595336914, "global_step": 127700, "epoch": 1538} {"train_loss": -22.445110321044922, "global_step": 127701, "epoch": 1538} {"train_loss": -22.63963508605957, "global_step": 127702, "epoch": 1538} {"train_loss": -22.708581924438477, "global_step": 127703, "epoch": 1538} {"train_loss": -22.579326629638672, "global_step": 127704, "epoch": 1538} {"train_loss": -22.5872745513916, "global_step": 127705, "epoch": 1538} {"train_loss": -22.591434478759766, "global_step": 127706, "epoch": 1538} {"train_loss": -23.00958824157715, "global_step": 127707, "epoch": 1538} {"train_loss": -22.427148818969727, "global_step": 127708, "epoch": 1538} {"train_loss": -22.787233352661133, "global_step": 127709, "epoch": 1538} {"train_loss": -22.63411521911621, "global_step": 127710, "epoch": 1538} {"train_loss": -22.52193832397461, "global_step": 127711, "epoch": 1538} {"train_loss": -22.680511474609375, "global_step": 127712, "epoch": 1538} {"train_loss": -22.611900329589844, "global_step": 127713, "epoch": 1538} {"train_loss": -22.41421890258789, "global_step": 127714, "epoch": 1538} {"train_loss": -22.284912109375, "global_step": 127715, "epoch": 1538} {"train_loss": -22.738500595092773, "global_step": 127716, "epoch": 1538} {"train_loss": -22.891387939453125, "global_step": 127717, "epoch": 1538} {"train_loss": -22.296092987060547, "global_step": 127718, "epoch": 1538} {"train_loss": -21.987775802612305, "global_step": 127719, "epoch": 1538} {"train_loss": -22.44630241394043, "global_step": 127720, "epoch": 1538} {"train_loss": -22.381622314453125, "global_step": 127721, "epoch": 1538} {"train_loss": -22.673219680786133, "global_step": 127722, "epoch": 1538} {"train_loss": -22.285324096679688, "global_step": 127723, "epoch": 1538} {"train_loss": -22.781692504882812, "global_step": 127724, "epoch": 1538} {"train_loss": -22.641010284423828, "global_step": 127725, "epoch": 1538} {"train_loss": -22.06825828552246, "global_step": 127726, "epoch": 1538} {"train_loss": -22.41319465637207, "global_step": 127727, "epoch": 1538} {"train_loss": -23.084369659423828, "global_step": 127728, "epoch": 1538} {"train_loss": -22.417098999023438, "global_step": 127729, "epoch": 1538} {"train_loss": -22.55341911315918, "global_step": 127730, "epoch": 1538} {"train_loss": -22.889432907104492, "global_step": 127731, "epoch": 1538} {"train_loss": -22.421655654907227, "global_step": 127732, "epoch": 1538} {"train_loss": -22.648242950439453, "global_step": 127733, "epoch": 1538} {"train_loss": -22.31134796142578, "global_step": 127734, "epoch": 1538} {"train_loss": -22.840633392333984, "global_step": 127735, "epoch": 1538} {"train_loss": -22.4691614817424, "global_step": 127736, "epoch": 1538, "val_loss": 6186837.0} {"train_loss": -21.833858489990234, "global_step": 127737, "epoch": 1539} {"train_loss": -22.38268280029297, "global_step": 127738, "epoch": 1539} {"train_loss": -22.159456253051758, "global_step": 127739, "epoch": 1539} {"train_loss": -21.76498031616211, "global_step": 127740, "epoch": 1539} {"train_loss": -22.657697677612305, "global_step": 127741, "epoch": 1539} {"train_loss": -22.4466609954834, "global_step": 127742, "epoch": 1539} {"train_loss": -22.078712463378906, "global_step": 127743, "epoch": 1539} {"train_loss": -22.403350830078125, "global_step": 127744, "epoch": 1539} {"train_loss": -21.739553451538086, "global_step": 127745, "epoch": 1539} {"train_loss": -22.875795364379883, "global_step": 127746, "epoch": 1539} {"train_loss": -22.197969436645508, "global_step": 127747, "epoch": 1539} {"train_loss": -22.24748992919922, "global_step": 127748, "epoch": 1539} {"train_loss": -22.41529655456543, "global_step": 127749, "epoch": 1539} {"train_loss": -22.473875045776367, "global_step": 127750, "epoch": 1539} {"train_loss": -22.43122673034668, "global_step": 127751, "epoch": 1539} {"train_loss": -22.431583404541016, "global_step": 127752, "epoch": 1539} {"train_loss": -22.433195114135742, "global_step": 127753, "epoch": 1539} {"train_loss": -22.521900177001953, "global_step": 127754, "epoch": 1539} {"train_loss": -23.03111457824707, "global_step": 127755, "epoch": 1539} {"train_loss": -22.69256019592285, "global_step": 127756, "epoch": 1539} {"train_loss": -22.492595672607422, "global_step": 127757, "epoch": 1539} {"train_loss": -22.4014835357666, "global_step": 127758, "epoch": 1539} {"train_loss": -22.997373580932617, "global_step": 127759, "epoch": 1539} {"train_loss": -22.63228416442871, "global_step": 127760, "epoch": 1539} {"train_loss": -22.55307388305664, "global_step": 127761, "epoch": 1539} {"train_loss": -22.36522102355957, "global_step": 127762, "epoch": 1539} {"train_loss": -22.68975830078125, "global_step": 127763, "epoch": 1539} {"train_loss": -22.65912437438965, "global_step": 127764, "epoch": 1539} {"train_loss": -22.772300720214844, "global_step": 127765, "epoch": 1539} {"train_loss": -22.950986862182617, "global_step": 127766, "epoch": 1539} {"train_loss": -22.755332946777344, "global_step": 127767, "epoch": 1539} {"train_loss": -22.895671844482422, "global_step": 127768, "epoch": 1539} {"train_loss": -22.91223907470703, "global_step": 127769, "epoch": 1539} {"train_loss": -22.5635986328125, "global_step": 127770, "epoch": 1539} {"train_loss": -23.047164916992188, "global_step": 127771, "epoch": 1539} {"train_loss": -22.202661514282227, "global_step": 127772, "epoch": 1539} {"train_loss": -22.666397094726562, "global_step": 127773, "epoch": 1539} {"train_loss": -23.044178009033203, "global_step": 127774, "epoch": 1539} {"train_loss": -22.937143325805664, "global_step": 127775, "epoch": 1539} {"train_loss": -22.586544036865234, "global_step": 127776, "epoch": 1539} {"train_loss": -22.631940841674805, "global_step": 127777, "epoch": 1539} {"train_loss": -22.85749626159668, "global_step": 127778, "epoch": 1539} {"train_loss": -22.620515823364258, "global_step": 127779, "epoch": 1539} {"train_loss": -22.43657875061035, "global_step": 127780, "epoch": 1539} {"train_loss": -22.877208709716797, "global_step": 127781, "epoch": 1539} {"train_loss": -22.832929611206055, "global_step": 127782, "epoch": 1539} {"train_loss": -22.9150333404541, "global_step": 127783, "epoch": 1539} {"train_loss": -22.7381649017334, "global_step": 127784, "epoch": 1539} {"train_loss": -23.1904296875, "global_step": 127785, "epoch": 1539} {"train_loss": -22.92828941345215, "global_step": 127786, "epoch": 1539} {"train_loss": -23.00896453857422, "global_step": 127787, "epoch": 1539} {"train_loss": -22.726247787475586, "global_step": 127788, "epoch": 1539} {"train_loss": -22.756078720092773, "global_step": 127789, "epoch": 1539} {"train_loss": -22.593955993652344, "global_step": 127790, "epoch": 1539} {"train_loss": -23.092864990234375, "global_step": 127791, "epoch": 1539} {"train_loss": -22.8792724609375, "global_step": 127792, "epoch": 1539} {"train_loss": -22.711177825927734, "global_step": 127793, "epoch": 1539} {"train_loss": -22.730812072753906, "global_step": 127794, "epoch": 1539} {"train_loss": -22.913047790527344, "global_step": 127795, "epoch": 1539} {"train_loss": -22.540254592895508, "global_step": 127796, "epoch": 1539} {"train_loss": -22.549224853515625, "global_step": 127797, "epoch": 1539} {"train_loss": -23.324094772338867, "global_step": 127798, "epoch": 1539} {"train_loss": -22.49216651916504, "global_step": 127799, "epoch": 1539} {"train_loss": -22.556472778320312, "global_step": 127800, "epoch": 1539} {"train_loss": -22.6927490234375, "global_step": 127801, "epoch": 1539} {"train_loss": -22.688663482666016, "global_step": 127802, "epoch": 1539} {"train_loss": -22.999547958374023, "global_step": 127803, "epoch": 1539} {"train_loss": -22.977432250976562, "global_step": 127804, "epoch": 1539} {"train_loss": -22.740488052368164, "global_step": 127805, "epoch": 1539} {"train_loss": -22.579214096069336, "global_step": 127806, "epoch": 1539} {"train_loss": -22.86745262145996, "global_step": 127807, "epoch": 1539} {"train_loss": -22.696151733398438, "global_step": 127808, "epoch": 1539} {"train_loss": -22.492124557495117, "global_step": 127809, "epoch": 1539} {"train_loss": -22.743423461914062, "global_step": 127810, "epoch": 1539} {"train_loss": -22.59228515625, "global_step": 127811, "epoch": 1539} {"train_loss": -22.50680923461914, "global_step": 127812, "epoch": 1539} {"train_loss": -22.73233985900879, "global_step": 127813, "epoch": 1539} {"train_loss": -22.922632217407227, "global_step": 127814, "epoch": 1539} {"train_loss": -23.203052520751953, "global_step": 127815, "epoch": 1539} {"train_loss": -22.646806716918945, "global_step": 127816, "epoch": 1539} {"train_loss": -22.876691818237305, "global_step": 127817, "epoch": 1539} {"train_loss": -22.76287269592285, "global_step": 127818, "epoch": 1539} {"train_loss": -22.65554611941418, "global_step": 127819, "epoch": 1539, "val_loss": 6249740.0} {"train_loss": -21.562639236450195, "global_step": 127820, "epoch": 1540} {"train_loss": -22.43568992614746, "global_step": 127821, "epoch": 1540} {"train_loss": -22.214624404907227, "global_step": 127822, "epoch": 1540} {"train_loss": -22.280818939208984, "global_step": 127823, "epoch": 1540} {"train_loss": -22.479581832885742, "global_step": 127824, "epoch": 1540} {"train_loss": -22.80516242980957, "global_step": 127825, "epoch": 1540} {"train_loss": -22.269895553588867, "global_step": 127826, "epoch": 1540} {"train_loss": -22.493078231811523, "global_step": 127827, "epoch": 1540} {"train_loss": -22.358686447143555, "global_step": 127828, "epoch": 1540} {"train_loss": -22.400190353393555, "global_step": 127829, "epoch": 1540} {"train_loss": -22.66598892211914, "global_step": 127830, "epoch": 1540} {"train_loss": -22.933629989624023, "global_step": 127831, "epoch": 1540} {"train_loss": -22.250036239624023, "global_step": 127832, "epoch": 1540} {"train_loss": -22.5435733795166, "global_step": 127833, "epoch": 1540} {"train_loss": -22.13877296447754, "global_step": 127834, "epoch": 1540} {"train_loss": -22.62289810180664, "global_step": 127835, "epoch": 1540} {"train_loss": -22.75164794921875, "global_step": 127836, "epoch": 1540} {"train_loss": -22.965818405151367, "global_step": 127837, "epoch": 1540} {"train_loss": -22.516748428344727, "global_step": 127838, "epoch": 1540} {"train_loss": -22.379316329956055, "global_step": 127839, "epoch": 1540} {"train_loss": -22.725278854370117, "global_step": 127840, "epoch": 1540} {"train_loss": -22.59323501586914, "global_step": 127841, "epoch": 1540} {"train_loss": -23.134199142456055, "global_step": 127842, "epoch": 1540} {"train_loss": -22.71518898010254, "global_step": 127843, "epoch": 1540} {"train_loss": -22.972129821777344, "global_step": 127844, "epoch": 1540} {"train_loss": -22.88692283630371, "global_step": 127845, "epoch": 1540} {"train_loss": -22.7796688079834, "global_step": 127846, "epoch": 1540} {"train_loss": -22.286176681518555, "global_step": 127847, "epoch": 1540} {"train_loss": -22.590408325195312, "global_step": 127848, "epoch": 1540} {"train_loss": -22.695451736450195, "global_step": 127849, "epoch": 1540} {"train_loss": -22.995899200439453, "global_step": 127850, "epoch": 1540} {"train_loss": -22.879703521728516, "global_step": 127851, "epoch": 1540} {"train_loss": -23.210458755493164, "global_step": 127852, "epoch": 1540} {"train_loss": -22.56209373474121, "global_step": 127853, "epoch": 1540} {"train_loss": -22.983774185180664, "global_step": 127854, "epoch": 1540} {"train_loss": -22.330358505249023, "global_step": 127855, "epoch": 1540} {"train_loss": -22.698713302612305, "global_step": 127856, "epoch": 1540} {"train_loss": -22.651962280273438, "global_step": 127857, "epoch": 1540} {"train_loss": -22.684804916381836, "global_step": 127858, "epoch": 1540} {"train_loss": -22.3789005279541, "global_step": 127859, "epoch": 1540} {"train_loss": -22.576669692993164, "global_step": 127860, "epoch": 1540} {"train_loss": -22.697629928588867, "global_step": 127861, "epoch": 1540} {"train_loss": -22.66800308227539, "global_step": 127862, "epoch": 1540} {"train_loss": -22.71229362487793, "global_step": 127863, "epoch": 1540} {"train_loss": -22.92926597595215, "global_step": 127864, "epoch": 1540} {"train_loss": -22.789236068725586, "global_step": 127865, "epoch": 1540} {"train_loss": -22.794055938720703, "global_step": 127866, "epoch": 1540} {"train_loss": -22.499608993530273, "global_step": 127867, "epoch": 1540} {"train_loss": -22.5897274017334, "global_step": 127868, "epoch": 1540} {"train_loss": -22.28217124938965, "global_step": 127869, "epoch": 1540} {"train_loss": -22.933218002319336, "global_step": 127870, "epoch": 1540} {"train_loss": -22.587604522705078, "global_step": 127871, "epoch": 1540} {"train_loss": -22.998126983642578, "global_step": 127872, "epoch": 1540} {"train_loss": -22.525041580200195, "global_step": 127873, "epoch": 1540} {"train_loss": -22.610881805419922, "global_step": 127874, "epoch": 1540} {"train_loss": -22.783903121948242, "global_step": 127875, "epoch": 1540} {"train_loss": -22.703031539916992, "global_step": 127876, "epoch": 1540} {"train_loss": -22.217641830444336, "global_step": 127877, "epoch": 1540} {"train_loss": -22.70362663269043, "global_step": 127878, "epoch": 1540} {"train_loss": -22.8851375579834, "global_step": 127879, "epoch": 1540} {"train_loss": -22.49677085876465, "global_step": 127880, "epoch": 1540} {"train_loss": -22.526029586791992, "global_step": 127881, "epoch": 1540} {"train_loss": -22.874107360839844, "global_step": 127882, "epoch": 1540} {"train_loss": -23.035795211791992, "global_step": 127883, "epoch": 1540} {"train_loss": -22.64335823059082, "global_step": 127884, "epoch": 1540} {"train_loss": -22.76272964477539, "global_step": 127885, "epoch": 1540} {"train_loss": -22.851545333862305, "global_step": 127886, "epoch": 1540} {"train_loss": -22.968507766723633, "global_step": 127887, "epoch": 1540} {"train_loss": -22.71988296508789, "global_step": 127888, "epoch": 1540} {"train_loss": -22.501996994018555, "global_step": 127889, "epoch": 1540} {"train_loss": -22.854955673217773, "global_step": 127890, "epoch": 1540} {"train_loss": -22.576265335083008, "global_step": 127891, "epoch": 1540} {"train_loss": -22.401823043823242, "global_step": 127892, "epoch": 1540} {"train_loss": -22.936622619628906, "global_step": 127893, "epoch": 1540} {"train_loss": -22.813390731811523, "global_step": 127894, "epoch": 1540} {"train_loss": -22.69386100769043, "global_step": 127895, "epoch": 1540} {"train_loss": -22.80852699279785, "global_step": 127896, "epoch": 1540} {"train_loss": -22.663589477539062, "global_step": 127897, "epoch": 1540} {"train_loss": -23.146480560302734, "global_step": 127898, "epoch": 1540} {"train_loss": -22.73500633239746, "global_step": 127899, "epoch": 1540} {"train_loss": -23.099119186401367, "global_step": 127900, "epoch": 1540} {"train_loss": -22.638288497924805, "global_step": 127901, "epoch": 1540} {"train_loss": -22.660966482507177, "global_step": 127902, "epoch": 1540, "val_loss": 6253899.0} {"train_loss": -21.61768913269043, "global_step": 127903, "epoch": 1541} {"train_loss": -22.583667755126953, "global_step": 127904, "epoch": 1541} {"train_loss": -22.73291015625, "global_step": 127905, "epoch": 1541} {"train_loss": -22.022624969482422, "global_step": 127906, "epoch": 1541} {"train_loss": -22.514850616455078, "global_step": 127907, "epoch": 1541} {"train_loss": -22.26183319091797, "global_step": 127908, "epoch": 1541} {"train_loss": -22.561840057373047, "global_step": 127909, "epoch": 1541} {"train_loss": -22.563505172729492, "global_step": 127910, "epoch": 1541} {"train_loss": -22.217182159423828, "global_step": 127911, "epoch": 1541} {"train_loss": -22.611631393432617, "global_step": 127912, "epoch": 1541} {"train_loss": -22.63938331604004, "global_step": 127913, "epoch": 1541} {"train_loss": -22.39948081970215, "global_step": 127914, "epoch": 1541} {"train_loss": -22.49754524230957, "global_step": 127915, "epoch": 1541} {"train_loss": -22.85553550720215, "global_step": 127916, "epoch": 1541} {"train_loss": -22.684858322143555, "global_step": 127917, "epoch": 1541} {"train_loss": -22.614837646484375, "global_step": 127918, "epoch": 1541} {"train_loss": -22.794689178466797, "global_step": 127919, "epoch": 1541} {"train_loss": -22.828855514526367, "global_step": 127920, "epoch": 1541} {"train_loss": -22.59259605407715, "global_step": 127921, "epoch": 1541} {"train_loss": -22.451387405395508, "global_step": 127922, "epoch": 1541} {"train_loss": -22.80897331237793, "global_step": 127923, "epoch": 1541} {"train_loss": -22.422399520874023, "global_step": 127924, "epoch": 1541} {"train_loss": -22.36102294921875, "global_step": 127925, "epoch": 1541} {"train_loss": -22.738515853881836, "global_step": 127926, "epoch": 1541} {"train_loss": -22.445804595947266, "global_step": 127927, "epoch": 1541} {"train_loss": -22.71905517578125, "global_step": 127928, "epoch": 1541} {"train_loss": -22.852825164794922, "global_step": 127929, "epoch": 1541} {"train_loss": -22.847492218017578, "global_step": 127930, "epoch": 1541} {"train_loss": -22.628013610839844, "global_step": 127931, "epoch": 1541} {"train_loss": -22.594970703125, "global_step": 127932, "epoch": 1541} {"train_loss": -22.31915283203125, "global_step": 127933, "epoch": 1541} {"train_loss": -22.57797622680664, "global_step": 127934, "epoch": 1541} {"train_loss": -22.875396728515625, "global_step": 127935, "epoch": 1541} {"train_loss": -22.42731285095215, "global_step": 127936, "epoch": 1541} {"train_loss": -22.68077850341797, "global_step": 127937, "epoch": 1541} {"train_loss": -22.47377586364746, "global_step": 127938, "epoch": 1541} {"train_loss": -22.975221633911133, "global_step": 127939, "epoch": 1541} {"train_loss": -22.590639114379883, "global_step": 127940, "epoch": 1541} {"train_loss": -22.66231346130371, "global_step": 127941, "epoch": 1541} {"train_loss": -22.792240142822266, "global_step": 127942, "epoch": 1541} {"train_loss": -23.20011329650879, "global_step": 127943, "epoch": 1541} {"train_loss": -22.955583572387695, "global_step": 127944, "epoch": 1541} {"train_loss": -22.782119750976562, "global_step": 127945, "epoch": 1541} {"train_loss": -22.954769134521484, "global_step": 127946, "epoch": 1541} {"train_loss": -23.180740356445312, "global_step": 127947, "epoch": 1541} {"train_loss": -23.282474517822266, "global_step": 127948, "epoch": 1541} {"train_loss": -22.632740020751953, "global_step": 127949, "epoch": 1541} {"train_loss": -23.029199600219727, "global_step": 127950, "epoch": 1541} {"train_loss": -22.642059326171875, "global_step": 127951, "epoch": 1541} {"train_loss": -22.658878326416016, "global_step": 127952, "epoch": 1541} {"train_loss": -22.7623348236084, "global_step": 127953, "epoch": 1541} {"train_loss": -23.18499183654785, "global_step": 127954, "epoch": 1541} {"train_loss": -22.62845230102539, "global_step": 127955, "epoch": 1541} {"train_loss": -22.90741539001465, "global_step": 127956, "epoch": 1541} {"train_loss": -22.844890594482422, "global_step": 127957, "epoch": 1541} {"train_loss": -22.742910385131836, "global_step": 127958, "epoch": 1541} {"train_loss": -22.973251342773438, "global_step": 127959, "epoch": 1541} {"train_loss": -22.98530387878418, "global_step": 127960, "epoch": 1541} {"train_loss": -22.7329158782959, "global_step": 127961, "epoch": 1541} {"train_loss": -23.08755874633789, "global_step": 127962, "epoch": 1541} {"train_loss": -22.828508377075195, "global_step": 127963, "epoch": 1541} {"train_loss": -22.785280227661133, "global_step": 127964, "epoch": 1541} {"train_loss": -22.793331146240234, "global_step": 127965, "epoch": 1541} {"train_loss": -22.857460021972656, "global_step": 127966, "epoch": 1541} {"train_loss": -22.74716567993164, "global_step": 127967, "epoch": 1541} {"train_loss": -22.889421463012695, "global_step": 127968, "epoch": 1541} {"train_loss": -22.631832122802734, "global_step": 127969, "epoch": 1541} {"train_loss": -22.737764358520508, "global_step": 127970, "epoch": 1541} {"train_loss": -22.887439727783203, "global_step": 127971, "epoch": 1541} {"train_loss": -22.425535202026367, "global_step": 127972, "epoch": 1541} {"train_loss": -22.696622848510742, "global_step": 127973, "epoch": 1541} {"train_loss": -23.03853416442871, "global_step": 127974, "epoch": 1541} {"train_loss": -22.5339412689209, "global_step": 127975, "epoch": 1541} {"train_loss": -22.30074119567871, "global_step": 127976, "epoch": 1541} {"train_loss": -22.74341583251953, "global_step": 127977, "epoch": 1541} {"train_loss": -22.53920555114746, "global_step": 127978, "epoch": 1541} {"train_loss": -22.596176147460938, "global_step": 127979, "epoch": 1541} {"train_loss": -22.80118179321289, "global_step": 127980, "epoch": 1541} {"train_loss": -22.68548011779785, "global_step": 127981, "epoch": 1541} {"train_loss": -22.662466049194336, "global_step": 127982, "epoch": 1541} {"train_loss": -22.29390525817871, "global_step": 127983, "epoch": 1541} {"train_loss": -22.24916648864746, "global_step": 127984, "epoch": 1541} {"train_loss": -22.681417212428816, "global_step": 127985, "epoch": 1541, "val_loss": 6245263.5} {"train_loss": -22.456457138061523, "global_step": 127986, "epoch": 1542} {"train_loss": -22.303939819335938, "global_step": 127987, "epoch": 1542} {"train_loss": -22.296049118041992, "global_step": 127988, "epoch": 1542} {"train_loss": -22.515045166015625, "global_step": 127989, "epoch": 1542} {"train_loss": -22.793975830078125, "global_step": 127990, "epoch": 1542} {"train_loss": -22.262495040893555, "global_step": 127991, "epoch": 1542} {"train_loss": -22.354167938232422, "global_step": 127992, "epoch": 1542} {"train_loss": -22.24210548400879, "global_step": 127993, "epoch": 1542} {"train_loss": -22.6922550201416, "global_step": 127994, "epoch": 1542} {"train_loss": -22.690139770507812, "global_step": 127995, "epoch": 1542} {"train_loss": -22.6824893951416, "global_step": 127996, "epoch": 1542} {"train_loss": -22.543853759765625, "global_step": 127997, "epoch": 1542} {"train_loss": -23.113195419311523, "global_step": 127998, "epoch": 1542} {"train_loss": -22.387901306152344, "global_step": 127999, "epoch": 1542} {"train_loss": -22.323644638061523, "global_step": 128000, "epoch": 1542} {"train_loss": -22.250823974609375, "global_step": 128001, "epoch": 1542} {"train_loss": -22.72446632385254, "global_step": 128002, "epoch": 1542} {"train_loss": -22.847482681274414, "global_step": 128003, "epoch": 1542} {"train_loss": -23.048782348632812, "global_step": 128004, "epoch": 1542} {"train_loss": -22.683908462524414, "global_step": 128005, "epoch": 1542} {"train_loss": -22.956451416015625, "global_step": 128006, "epoch": 1542} {"train_loss": -22.639936447143555, "global_step": 128007, "epoch": 1542} {"train_loss": -22.668542861938477, "global_step": 128008, "epoch": 1542} {"train_loss": -22.791812896728516, "global_step": 128009, "epoch": 1542} {"train_loss": -22.805356979370117, "global_step": 128010, "epoch": 1542} {"train_loss": -22.4910831451416, "global_step": 128011, "epoch": 1542} {"train_loss": -22.528730392456055, "global_step": 128012, "epoch": 1542} {"train_loss": -22.54544448852539, "global_step": 128013, "epoch": 1542} {"train_loss": -22.764801025390625, "global_step": 128014, "epoch": 1542} {"train_loss": -22.90876007080078, "global_step": 128015, "epoch": 1542} {"train_loss": -23.24452781677246, "global_step": 128016, "epoch": 1542} {"train_loss": -22.899946212768555, "global_step": 128017, "epoch": 1542} {"train_loss": -22.799057006835938, "global_step": 128018, "epoch": 1542} {"train_loss": -22.47515869140625, "global_step": 128019, "epoch": 1542} {"train_loss": -22.621780395507812, "global_step": 128020, "epoch": 1542} {"train_loss": -22.860036849975586, "global_step": 128021, "epoch": 1542} {"train_loss": -22.489646911621094, "global_step": 128022, "epoch": 1542} {"train_loss": -22.820697784423828, "global_step": 128023, "epoch": 1542} {"train_loss": -22.83448028564453, "global_step": 128024, "epoch": 1542} {"train_loss": -22.614927291870117, "global_step": 128025, "epoch": 1542} {"train_loss": -22.53374671936035, "global_step": 128026, "epoch": 1542} {"train_loss": -22.62725830078125, "global_step": 128027, "epoch": 1542} {"train_loss": -22.733854293823242, "global_step": 128028, "epoch": 1542} {"train_loss": -22.84494972229004, "global_step": 128029, "epoch": 1542} {"train_loss": -22.50312614440918, "global_step": 128030, "epoch": 1542} {"train_loss": -22.938323974609375, "global_step": 128031, "epoch": 1542} {"train_loss": -22.900012969970703, "global_step": 128032, "epoch": 1542} {"train_loss": -22.69185447692871, "global_step": 128033, "epoch": 1542} {"train_loss": -22.819318771362305, "global_step": 128034, "epoch": 1542} {"train_loss": -22.509506225585938, "global_step": 128035, "epoch": 1542} {"train_loss": -23.073318481445312, "global_step": 128036, "epoch": 1542} {"train_loss": -22.537494659423828, "global_step": 128037, "epoch": 1542} {"train_loss": -22.65264129638672, "global_step": 128038, "epoch": 1542} {"train_loss": -22.524738311767578, "global_step": 128039, "epoch": 1542} {"train_loss": -22.676549911499023, "global_step": 128040, "epoch": 1542} {"train_loss": -23.01854705810547, "global_step": 128041, "epoch": 1542} {"train_loss": -22.381032943725586, "global_step": 128042, "epoch": 1542} {"train_loss": -22.972883224487305, "global_step": 128043, "epoch": 1542} {"train_loss": -23.007625579833984, "global_step": 128044, "epoch": 1542} {"train_loss": -22.678476333618164, "global_step": 128045, "epoch": 1542} {"train_loss": -22.53309440612793, "global_step": 128046, "epoch": 1542} {"train_loss": -22.892993927001953, "global_step": 128047, "epoch": 1542} {"train_loss": -22.927785873413086, "global_step": 128048, "epoch": 1542} {"train_loss": -22.933189392089844, "global_step": 128049, "epoch": 1542} {"train_loss": -23.013376235961914, "global_step": 128050, "epoch": 1542} {"train_loss": -22.708295822143555, "global_step": 128051, "epoch": 1542} {"train_loss": -22.79573631286621, "global_step": 128052, "epoch": 1542} {"train_loss": -22.615556716918945, "global_step": 128053, "epoch": 1542} {"train_loss": -22.847370147705078, "global_step": 128054, "epoch": 1542} {"train_loss": -22.892621994018555, "global_step": 128055, "epoch": 1542} {"train_loss": -22.457685470581055, "global_step": 128056, "epoch": 1542} {"train_loss": -23.105154037475586, "global_step": 128057, "epoch": 1542} {"train_loss": -22.773515701293945, "global_step": 128058, "epoch": 1542} {"train_loss": -23.059720993041992, "global_step": 128059, "epoch": 1542} {"train_loss": -22.372264862060547, "global_step": 128060, "epoch": 1542} {"train_loss": -22.697235107421875, "global_step": 128061, "epoch": 1542} {"train_loss": -22.403945922851562, "global_step": 128062, "epoch": 1542} {"train_loss": -22.527891159057617, "global_step": 128063, "epoch": 1542} {"train_loss": -23.01383399963379, "global_step": 128064, "epoch": 1542} {"train_loss": -22.56984519958496, "global_step": 128065, "epoch": 1542} {"train_loss": -22.596694946289062, "global_step": 128066, "epoch": 1542} {"train_loss": -22.763593673706055, "global_step": 128067, "epoch": 1542} {"train_loss": -22.68293171618358, "global_step": 128068, "epoch": 1542, "val_loss": 6172111.5} {"train_loss": -22.114622116088867, "global_step": 128069, "epoch": 1543} {"train_loss": -21.9117374420166, "global_step": 128070, "epoch": 1543} {"train_loss": -22.827966690063477, "global_step": 128071, "epoch": 1543} {"train_loss": -21.840444564819336, "global_step": 128072, "epoch": 1543} {"train_loss": -22.01801872253418, "global_step": 128073, "epoch": 1543} {"train_loss": -22.355566024780273, "global_step": 128074, "epoch": 1543} {"train_loss": -21.785964965820312, "global_step": 128075, "epoch": 1543} {"train_loss": -22.572446823120117, "global_step": 128076, "epoch": 1543} {"train_loss": -22.101348876953125, "global_step": 128077, "epoch": 1543} {"train_loss": -22.48695182800293, "global_step": 128078, "epoch": 1543} {"train_loss": -22.65920639038086, "global_step": 128079, "epoch": 1543} {"train_loss": -22.421245574951172, "global_step": 128080, "epoch": 1543} {"train_loss": -22.24136734008789, "global_step": 128081, "epoch": 1543} {"train_loss": -22.408187866210938, "global_step": 128082, "epoch": 1543} {"train_loss": -22.323287963867188, "global_step": 128083, "epoch": 1543} {"train_loss": -22.67319679260254, "global_step": 128084, "epoch": 1543} {"train_loss": -22.365585327148438, "global_step": 128085, "epoch": 1543} {"train_loss": -22.96017837524414, "global_step": 128086, "epoch": 1543} {"train_loss": -22.243755340576172, "global_step": 128087, "epoch": 1543} {"train_loss": -22.280548095703125, "global_step": 128088, "epoch": 1543} {"train_loss": -22.620737075805664, "global_step": 128089, "epoch": 1543} {"train_loss": -22.368921279907227, "global_step": 128090, "epoch": 1543} {"train_loss": -22.645536422729492, "global_step": 128091, "epoch": 1543} {"train_loss": -22.698081970214844, "global_step": 128092, "epoch": 1543} {"train_loss": -22.746286392211914, "global_step": 128093, "epoch": 1543} {"train_loss": -22.538909912109375, "global_step": 128094, "epoch": 1543} {"train_loss": -23.03110694885254, "global_step": 128095, "epoch": 1543} {"train_loss": -22.642568588256836, "global_step": 128096, "epoch": 1543} {"train_loss": -22.812824249267578, "global_step": 128097, "epoch": 1543} {"train_loss": -22.850454330444336, "global_step": 128098, "epoch": 1543} {"train_loss": -22.757831573486328, "global_step": 128099, "epoch": 1543} {"train_loss": -22.668004989624023, "global_step": 128100, "epoch": 1543} {"train_loss": -22.87698745727539, "global_step": 128101, "epoch": 1543} {"train_loss": -22.8094482421875, "global_step": 128102, "epoch": 1543} {"train_loss": -22.4344482421875, "global_step": 128103, "epoch": 1543} {"train_loss": -22.630767822265625, "global_step": 128104, "epoch": 1543} {"train_loss": -22.6507568359375, "global_step": 128105, "epoch": 1543} {"train_loss": -22.584463119506836, "global_step": 128106, "epoch": 1543} {"train_loss": -22.914085388183594, "global_step": 128107, "epoch": 1543} {"train_loss": -22.7630672454834, "global_step": 128108, "epoch": 1543} {"train_loss": -23.119579315185547, "global_step": 128109, "epoch": 1543} {"train_loss": -22.638408660888672, "global_step": 128110, "epoch": 1543} {"train_loss": -22.70792007446289, "global_step": 128111, "epoch": 1543} {"train_loss": -22.630889892578125, "global_step": 128112, "epoch": 1543} {"train_loss": -22.82460594177246, "global_step": 128113, "epoch": 1543} {"train_loss": -23.043893814086914, "global_step": 128114, "epoch": 1543} {"train_loss": -22.628177642822266, "global_step": 128115, "epoch": 1543} {"train_loss": -22.70071792602539, "global_step": 128116, "epoch": 1543} {"train_loss": -22.48052215576172, "global_step": 128117, "epoch": 1543} {"train_loss": -22.181379318237305, "global_step": 128118, "epoch": 1543} {"train_loss": -22.90760612487793, "global_step": 128119, "epoch": 1543} {"train_loss": -22.4384822845459, "global_step": 128120, "epoch": 1543} {"train_loss": -22.787168502807617, "global_step": 128121, "epoch": 1543} {"train_loss": -22.680404663085938, "global_step": 128122, "epoch": 1543} {"train_loss": -22.74648094177246, "global_step": 128123, "epoch": 1543} {"train_loss": -22.62232780456543, "global_step": 128124, "epoch": 1543} {"train_loss": -23.29604148864746, "global_step": 128125, "epoch": 1543} {"train_loss": -22.608617782592773, "global_step": 128126, "epoch": 1543} {"train_loss": -22.265869140625, "global_step": 128127, "epoch": 1543} {"train_loss": -22.62070083618164, "global_step": 128128, "epoch": 1543} {"train_loss": -22.45088005065918, "global_step": 128129, "epoch": 1543} {"train_loss": -22.65715980529785, "global_step": 128130, "epoch": 1543} {"train_loss": -22.761215209960938, "global_step": 128131, "epoch": 1543} {"train_loss": -22.952350616455078, "global_step": 128132, "epoch": 1543} {"train_loss": -22.767831802368164, "global_step": 128133, "epoch": 1543} {"train_loss": -22.592426300048828, "global_step": 128134, "epoch": 1543} {"train_loss": -22.549652099609375, "global_step": 128135, "epoch": 1543} {"train_loss": -22.831518173217773, "global_step": 128136, "epoch": 1543} {"train_loss": -22.483640670776367, "global_step": 128137, "epoch": 1543} {"train_loss": -22.931936264038086, "global_step": 128138, "epoch": 1543} {"train_loss": -23.037137985229492, "global_step": 128139, "epoch": 1543} {"train_loss": -22.716876983642578, "global_step": 128140, "epoch": 1543} {"train_loss": -23.016332626342773, "global_step": 128141, "epoch": 1543} {"train_loss": -23.1453857421875, "global_step": 128142, "epoch": 1543} {"train_loss": -22.827625274658203, "global_step": 128143, "epoch": 1543} {"train_loss": -22.815261840820312, "global_step": 128144, "epoch": 1543} {"train_loss": -22.813413619995117, "global_step": 128145, "epoch": 1543} {"train_loss": -22.739463806152344, "global_step": 128146, "epoch": 1543} {"train_loss": -23.090667724609375, "global_step": 128147, "epoch": 1543} {"train_loss": -22.29131507873535, "global_step": 128148, "epoch": 1543} {"train_loss": -22.89173698425293, "global_step": 128149, "epoch": 1543} {"train_loss": -23.050168991088867, "global_step": 128150, "epoch": 1543} {"train_loss": -22.63519225063094, "global_step": 128151, "epoch": 1543, "val_loss": 6196263.0} {"train_loss": -22.381895065307617, "global_step": 128152, "epoch": 1544} {"train_loss": -21.428823471069336, "global_step": 128153, "epoch": 1544} {"train_loss": -21.963510513305664, "global_step": 128154, "epoch": 1544} {"train_loss": -22.563190460205078, "global_step": 128155, "epoch": 1544} {"train_loss": -22.198400497436523, "global_step": 128156, "epoch": 1544} {"train_loss": -21.90878677368164, "global_step": 128157, "epoch": 1544} {"train_loss": -22.331205368041992, "global_step": 128158, "epoch": 1544} {"train_loss": -22.527803421020508, "global_step": 128159, "epoch": 1544} {"train_loss": -22.217252731323242, "global_step": 128160, "epoch": 1544} {"train_loss": -22.343585968017578, "global_step": 128161, "epoch": 1544} {"train_loss": -22.079587936401367, "global_step": 128162, "epoch": 1544} {"train_loss": -22.837833404541016, "global_step": 128163, "epoch": 1544} {"train_loss": -22.47202491760254, "global_step": 128164, "epoch": 1544} {"train_loss": -22.526533126831055, "global_step": 128165, "epoch": 1544} {"train_loss": -22.7137451171875, "global_step": 128166, "epoch": 1544} {"train_loss": -22.732542037963867, "global_step": 128167, "epoch": 1544} {"train_loss": -22.44487953186035, "global_step": 128168, "epoch": 1544} {"train_loss": -22.68606948852539, "global_step": 128169, "epoch": 1544} {"train_loss": -22.45393943786621, "global_step": 128170, "epoch": 1544} {"train_loss": -22.636585235595703, "global_step": 128171, "epoch": 1544} {"train_loss": -22.580236434936523, "global_step": 128172, "epoch": 1544} {"train_loss": -22.810949325561523, "global_step": 128173, "epoch": 1544} {"train_loss": -22.96236228942871, "global_step": 128174, "epoch": 1544} {"train_loss": -22.328710556030273, "global_step": 128175, "epoch": 1544} {"train_loss": -22.511754989624023, "global_step": 128176, "epoch": 1544} {"train_loss": -22.720394134521484, "global_step": 128177, "epoch": 1544} {"train_loss": -22.58026695251465, "global_step": 128178, "epoch": 1544} {"train_loss": -22.672704696655273, "global_step": 128179, "epoch": 1544} {"train_loss": -22.68533706665039, "global_step": 128180, "epoch": 1544} {"train_loss": -22.802515029907227, "global_step": 128181, "epoch": 1544} {"train_loss": -23.03493309020996, "global_step": 128182, "epoch": 1544} {"train_loss": -22.469282150268555, "global_step": 128183, "epoch": 1544} {"train_loss": -22.714725494384766, "global_step": 128184, "epoch": 1544} {"train_loss": -22.606708526611328, "global_step": 128185, "epoch": 1544} {"train_loss": -22.979211807250977, "global_step": 128186, "epoch": 1544} {"train_loss": -22.797937393188477, "global_step": 128187, "epoch": 1544} {"train_loss": -23.210691452026367, "global_step": 128188, "epoch": 1544} {"train_loss": -22.48529052734375, "global_step": 128189, "epoch": 1544} {"train_loss": -22.7303466796875, "global_step": 128190, "epoch": 1544} {"train_loss": -22.615764617919922, "global_step": 128191, "epoch": 1544} {"train_loss": -22.63690948486328, "global_step": 128192, "epoch": 1544} {"train_loss": -22.3644962310791, "global_step": 128193, "epoch": 1544} {"train_loss": -22.623809814453125, "global_step": 128194, "epoch": 1544} {"train_loss": -22.548431396484375, "global_step": 128195, "epoch": 1544} {"train_loss": -22.51291847229004, "global_step": 128196, "epoch": 1544} {"train_loss": -22.810226440429688, "global_step": 128197, "epoch": 1544} {"train_loss": -22.793222427368164, "global_step": 128198, "epoch": 1544} {"train_loss": -22.869617462158203, "global_step": 128199, "epoch": 1544} {"train_loss": -22.66463279724121, "global_step": 128200, "epoch": 1544} {"train_loss": -22.513086318969727, "global_step": 128201, "epoch": 1544} {"train_loss": -22.340055465698242, "global_step": 128202, "epoch": 1544} {"train_loss": -22.775869369506836, "global_step": 128203, "epoch": 1544} {"train_loss": -22.490707397460938, "global_step": 128204, "epoch": 1544} {"train_loss": -22.617080688476562, "global_step": 128205, "epoch": 1544} {"train_loss": -22.912412643432617, "global_step": 128206, "epoch": 1544} {"train_loss": -22.766897201538086, "global_step": 128207, "epoch": 1544} {"train_loss": -22.307373046875, "global_step": 128208, "epoch": 1544} {"train_loss": -23.20667839050293, "global_step": 128209, "epoch": 1544} {"train_loss": -22.310361862182617, "global_step": 128210, "epoch": 1544} {"train_loss": -22.386465072631836, "global_step": 128211, "epoch": 1544} {"train_loss": -22.593618392944336, "global_step": 128212, "epoch": 1544} {"train_loss": -22.648330688476562, "global_step": 128213, "epoch": 1544} {"train_loss": -22.682588577270508, "global_step": 128214, "epoch": 1544} {"train_loss": -22.94272804260254, "global_step": 128215, "epoch": 1544} {"train_loss": -22.950944900512695, "global_step": 128216, "epoch": 1544} {"train_loss": -22.839752197265625, "global_step": 128217, "epoch": 1544} {"train_loss": -22.80164909362793, "global_step": 128218, "epoch": 1544} {"train_loss": -22.814382553100586, "global_step": 128219, "epoch": 1544} {"train_loss": -22.84466552734375, "global_step": 128220, "epoch": 1544} {"train_loss": -22.531858444213867, "global_step": 128221, "epoch": 1544} {"train_loss": -22.8343448638916, "global_step": 128222, "epoch": 1544} {"train_loss": -23.066869735717773, "global_step": 128223, "epoch": 1544} {"train_loss": -22.663461685180664, "global_step": 128224, "epoch": 1544} {"train_loss": -22.548093795776367, "global_step": 128225, "epoch": 1544} {"train_loss": -22.769372940063477, "global_step": 128226, "epoch": 1544} {"train_loss": -22.921018600463867, "global_step": 128227, "epoch": 1544} {"train_loss": -22.63738250732422, "global_step": 128228, "epoch": 1544} {"train_loss": -22.946619033813477, "global_step": 128229, "epoch": 1544} {"train_loss": -23.00457191467285, "global_step": 128230, "epoch": 1544} {"train_loss": -22.933897018432617, "global_step": 128231, "epoch": 1544} {"train_loss": -22.683979034423828, "global_step": 128232, "epoch": 1544} {"train_loss": -22.90740394592285, "global_step": 128233, "epoch": 1544} {"train_loss": -22.645346744950995, "global_step": 128234, "epoch": 1544, "val_loss": 6344178.0} {"train_loss": -21.77020263671875, "global_step": 128235, "epoch": 1545} {"train_loss": -22.2453670501709, "global_step": 128236, "epoch": 1545} {"train_loss": -21.870712280273438, "global_step": 128237, "epoch": 1545} {"train_loss": -22.213682174682617, "global_step": 128238, "epoch": 1545} {"train_loss": -22.359359741210938, "global_step": 128239, "epoch": 1545} {"train_loss": -22.587427139282227, "global_step": 128240, "epoch": 1545} {"train_loss": -21.84871482849121, "global_step": 128241, "epoch": 1545} {"train_loss": -22.439273834228516, "global_step": 128242, "epoch": 1545} {"train_loss": -22.141233444213867, "global_step": 128243, "epoch": 1545} {"train_loss": -22.55695152282715, "global_step": 128244, "epoch": 1545} {"train_loss": -22.147022247314453, "global_step": 128245, "epoch": 1545} {"train_loss": -22.15557861328125, "global_step": 128246, "epoch": 1545} {"train_loss": -22.228614807128906, "global_step": 128247, "epoch": 1545} {"train_loss": -22.160436630249023, "global_step": 128248, "epoch": 1545} {"train_loss": -22.635360717773438, "global_step": 128249, "epoch": 1545} {"train_loss": -22.20252799987793, "global_step": 128250, "epoch": 1545} {"train_loss": -22.391435623168945, "global_step": 128251, "epoch": 1545} {"train_loss": -22.224613189697266, "global_step": 128252, "epoch": 1545} {"train_loss": -22.90731430053711, "global_step": 128253, "epoch": 1545} {"train_loss": -22.760114669799805, "global_step": 128254, "epoch": 1545} {"train_loss": -22.461544036865234, "global_step": 128255, "epoch": 1545} {"train_loss": -22.734115600585938, "global_step": 128256, "epoch": 1545} {"train_loss": -22.916515350341797, "global_step": 128257, "epoch": 1545} {"train_loss": -22.86390495300293, "global_step": 128258, "epoch": 1545} {"train_loss": -22.942718505859375, "global_step": 128259, "epoch": 1545} {"train_loss": -22.943485260009766, "global_step": 128260, "epoch": 1545} {"train_loss": -22.711904525756836, "global_step": 128261, "epoch": 1545} {"train_loss": -22.697128295898438, "global_step": 128262, "epoch": 1545} {"train_loss": -22.59381675720215, "global_step": 128263, "epoch": 1545} {"train_loss": -23.08243751525879, "global_step": 128264, "epoch": 1545} {"train_loss": -22.823436737060547, "global_step": 128265, "epoch": 1545} {"train_loss": -22.670698165893555, "global_step": 128266, "epoch": 1545} {"train_loss": -22.335357666015625, "global_step": 128267, "epoch": 1545} {"train_loss": -22.840290069580078, "global_step": 128268, "epoch": 1545} {"train_loss": -22.689340591430664, "global_step": 128269, "epoch": 1545} {"train_loss": -22.695724487304688, "global_step": 128270, "epoch": 1545} {"train_loss": -22.550329208374023, "global_step": 128271, "epoch": 1545} {"train_loss": -22.82634162902832, "global_step": 128272, "epoch": 1545} {"train_loss": -22.702407836914062, "global_step": 128273, "epoch": 1545} {"train_loss": -22.70351219177246, "global_step": 128274, "epoch": 1545} {"train_loss": -22.70873260498047, "global_step": 128275, "epoch": 1545} {"train_loss": -22.59331512451172, "global_step": 128276, "epoch": 1545} {"train_loss": -22.88059425354004, "global_step": 128277, "epoch": 1545} {"train_loss": -22.695514678955078, "global_step": 128278, "epoch": 1545} {"train_loss": -22.68427848815918, "global_step": 128279, "epoch": 1545} {"train_loss": -22.90311050415039, "global_step": 128280, "epoch": 1545} {"train_loss": -22.905981063842773, "global_step": 128281, "epoch": 1545} {"train_loss": -22.83489990234375, "global_step": 128282, "epoch": 1545} {"train_loss": -22.991947174072266, "global_step": 128283, "epoch": 1545} {"train_loss": -22.52057456970215, "global_step": 128284, "epoch": 1545} {"train_loss": -22.673276901245117, "global_step": 128285, "epoch": 1545} {"train_loss": -22.430213928222656, "global_step": 128286, "epoch": 1545} {"train_loss": -22.877180099487305, "global_step": 128287, "epoch": 1545} {"train_loss": -22.64594268798828, "global_step": 128288, "epoch": 1545} {"train_loss": -23.0647029876709, "global_step": 128289, "epoch": 1545} {"train_loss": -22.511686325073242, "global_step": 128290, "epoch": 1545} {"train_loss": -22.869556427001953, "global_step": 128291, "epoch": 1545} {"train_loss": -22.584056854248047, "global_step": 128292, "epoch": 1545} {"train_loss": -22.990745544433594, "global_step": 128293, "epoch": 1545} {"train_loss": -22.293651580810547, "global_step": 128294, "epoch": 1545} {"train_loss": -22.524423599243164, "global_step": 128295, "epoch": 1545} {"train_loss": -22.521799087524414, "global_step": 128296, "epoch": 1545} {"train_loss": -22.71779441833496, "global_step": 128297, "epoch": 1545} {"train_loss": -22.47240447998047, "global_step": 128298, "epoch": 1545} {"train_loss": -22.710126876831055, "global_step": 128299, "epoch": 1545} {"train_loss": -22.572473526000977, "global_step": 128300, "epoch": 1545} {"train_loss": -23.064117431640625, "global_step": 128301, "epoch": 1545} {"train_loss": -22.333105087280273, "global_step": 128302, "epoch": 1545} {"train_loss": -22.4199275970459, "global_step": 128303, "epoch": 1545} {"train_loss": -22.302532196044922, "global_step": 128304, "epoch": 1545} {"train_loss": -22.84554100036621, "global_step": 128305, "epoch": 1545} {"train_loss": -22.708410263061523, "global_step": 128306, "epoch": 1545} {"train_loss": -22.933446884155273, "global_step": 128307, "epoch": 1545} {"train_loss": -22.923978805541992, "global_step": 128308, "epoch": 1545} {"train_loss": -22.371952056884766, "global_step": 128309, "epoch": 1545} {"train_loss": -22.726224899291992, "global_step": 128310, "epoch": 1545} {"train_loss": -22.740222930908203, "global_step": 128311, "epoch": 1545} {"train_loss": -23.06307029724121, "global_step": 128312, "epoch": 1545} {"train_loss": -22.54537010192871, "global_step": 128313, "epoch": 1545} {"train_loss": -22.793119430541992, "global_step": 128314, "epoch": 1545} {"train_loss": -22.411418914794922, "global_step": 128315, "epoch": 1545} {"train_loss": -22.455228805541992, "global_step": 128316, "epoch": 1545} {"train_loss": -22.61356310097568, "global_step": 128317, "epoch": 1545, "val_loss": 6175297.0} {"train_loss": -22.509735107421875, "global_step": 128318, "epoch": 1546} {"train_loss": -22.289661407470703, "global_step": 128319, "epoch": 1546} {"train_loss": -22.662710189819336, "global_step": 128320, "epoch": 1546} {"train_loss": -22.525318145751953, "global_step": 128321, "epoch": 1546} {"train_loss": -22.53046226501465, "global_step": 128322, "epoch": 1546} {"train_loss": -22.55781364440918, "global_step": 128323, "epoch": 1546} {"train_loss": -22.39427947998047, "global_step": 128324, "epoch": 1546} {"train_loss": -22.651111602783203, "global_step": 128325, "epoch": 1546} {"train_loss": -22.679275512695312, "global_step": 128326, "epoch": 1546} {"train_loss": -22.921655654907227, "global_step": 128327, "epoch": 1546} {"train_loss": -22.711973190307617, "global_step": 128328, "epoch": 1546} {"train_loss": -22.326053619384766, "global_step": 128329, "epoch": 1546} {"train_loss": -22.586957931518555, "global_step": 128330, "epoch": 1546} {"train_loss": -22.623220443725586, "global_step": 128331, "epoch": 1546} {"train_loss": -22.425683975219727, "global_step": 128332, "epoch": 1546} {"train_loss": -22.726160049438477, "global_step": 128333, "epoch": 1546} {"train_loss": -22.647123336791992, "global_step": 128334, "epoch": 1546} {"train_loss": -22.514511108398438, "global_step": 128335, "epoch": 1546} {"train_loss": -22.593358993530273, "global_step": 128336, "epoch": 1546} {"train_loss": -22.47872543334961, "global_step": 128337, "epoch": 1546} {"train_loss": -22.745359420776367, "global_step": 128338, "epoch": 1546} {"train_loss": -23.146257400512695, "global_step": 128339, "epoch": 1546} {"train_loss": -22.798784255981445, "global_step": 128340, "epoch": 1546} {"train_loss": -22.957111358642578, "global_step": 128341, "epoch": 1546} {"train_loss": -22.469846725463867, "global_step": 128342, "epoch": 1546} {"train_loss": -22.52887535095215, "global_step": 128343, "epoch": 1546} {"train_loss": -22.946081161499023, "global_step": 128344, "epoch": 1546} {"train_loss": -22.433441162109375, "global_step": 128345, "epoch": 1546} {"train_loss": -22.6195068359375, "global_step": 128346, "epoch": 1546} {"train_loss": -22.53568458557129, "global_step": 128347, "epoch": 1546} {"train_loss": -22.982925415039062, "global_step": 128348, "epoch": 1546} {"train_loss": -22.948740005493164, "global_step": 128349, "epoch": 1546} {"train_loss": -22.983503341674805, "global_step": 128350, "epoch": 1546} {"train_loss": -22.4274959564209, "global_step": 128351, "epoch": 1546} {"train_loss": -22.21476936340332, "global_step": 128352, "epoch": 1546} {"train_loss": -22.93271827697754, "global_step": 128353, "epoch": 1546} {"train_loss": -22.389427185058594, "global_step": 128354, "epoch": 1546} {"train_loss": -22.533838272094727, "global_step": 128355, "epoch": 1546} {"train_loss": -22.795318603515625, "global_step": 128356, "epoch": 1546} {"train_loss": -22.574331283569336, "global_step": 128357, "epoch": 1546} {"train_loss": -22.35944938659668, "global_step": 128358, "epoch": 1546} {"train_loss": -22.61580467224121, "global_step": 128359, "epoch": 1546} {"train_loss": -22.559553146362305, "global_step": 128360, "epoch": 1546} {"train_loss": -22.343338012695312, "global_step": 128361, "epoch": 1546} {"train_loss": -22.622549057006836, "global_step": 128362, "epoch": 1546} {"train_loss": -22.583547592163086, "global_step": 128363, "epoch": 1546} {"train_loss": -22.87053871154785, "global_step": 128364, "epoch": 1546} {"train_loss": -22.741811752319336, "global_step": 128365, "epoch": 1546} {"train_loss": -22.63275718688965, "global_step": 128366, "epoch": 1546} {"train_loss": -23.044912338256836, "global_step": 128367, "epoch": 1546} {"train_loss": -22.822980880737305, "global_step": 128368, "epoch": 1546} {"train_loss": -22.74595069885254, "global_step": 128369, "epoch": 1546} {"train_loss": -22.83516502380371, "global_step": 128370, "epoch": 1546} {"train_loss": -22.384441375732422, "global_step": 128371, "epoch": 1546} {"train_loss": -22.905197143554688, "global_step": 128372, "epoch": 1546} {"train_loss": -22.916929244995117, "global_step": 128373, "epoch": 1546} {"train_loss": -22.567716598510742, "global_step": 128374, "epoch": 1546} {"train_loss": -22.82266616821289, "global_step": 128375, "epoch": 1546} {"train_loss": -23.095218658447266, "global_step": 128376, "epoch": 1546} {"train_loss": -22.511154174804688, "global_step": 128377, "epoch": 1546} {"train_loss": -22.997459411621094, "global_step": 128378, "epoch": 1546} {"train_loss": -22.665876388549805, "global_step": 128379, "epoch": 1546} {"train_loss": -22.621339797973633, "global_step": 128380, "epoch": 1546} {"train_loss": -23.05061149597168, "global_step": 128381, "epoch": 1546} {"train_loss": -22.811376571655273, "global_step": 128382, "epoch": 1546} {"train_loss": -22.313703536987305, "global_step": 128383, "epoch": 1546} {"train_loss": -22.882814407348633, "global_step": 128384, "epoch": 1546} {"train_loss": -22.87480926513672, "global_step": 128385, "epoch": 1546} {"train_loss": -22.886077880859375, "global_step": 128386, "epoch": 1546} {"train_loss": -22.447187423706055, "global_step": 128387, "epoch": 1546} {"train_loss": -23.10182762145996, "global_step": 128388, "epoch": 1546} {"train_loss": -22.781972885131836, "global_step": 128389, "epoch": 1546} {"train_loss": -23.058231353759766, "global_step": 128390, "epoch": 1546} {"train_loss": -23.11954689025879, "global_step": 128391, "epoch": 1546} {"train_loss": -22.509580612182617, "global_step": 128392, "epoch": 1546} {"train_loss": -22.947494506835938, "global_step": 128393, "epoch": 1546} {"train_loss": -23.073339462280273, "global_step": 128394, "epoch": 1546} {"train_loss": -23.063936233520508, "global_step": 128395, "epoch": 1546} {"train_loss": -22.72028160095215, "global_step": 128396, "epoch": 1546} {"train_loss": -22.846384048461914, "global_step": 128397, "epoch": 1546} {"train_loss": -22.53377914428711, "global_step": 128398, "epoch": 1546} {"train_loss": -22.723974227905273, "global_step": 128399, "epoch": 1546} {"train_loss": -22.71187899486128, "global_step": 128400, "epoch": 1546, "val_loss": 6264182.0} {"train_loss": -22.1572322845459, "global_step": 128401, "epoch": 1547} {"train_loss": -22.141202926635742, "global_step": 128402, "epoch": 1547} {"train_loss": -22.094358444213867, "global_step": 128403, "epoch": 1547} {"train_loss": -22.494930267333984, "global_step": 128404, "epoch": 1547} {"train_loss": -22.30795669555664, "global_step": 128405, "epoch": 1547} {"train_loss": -22.511165618896484, "global_step": 128406, "epoch": 1547} {"train_loss": -22.416873931884766, "global_step": 128407, "epoch": 1547} {"train_loss": -22.5880184173584, "global_step": 128408, "epoch": 1547} {"train_loss": -22.5227108001709, "global_step": 128409, "epoch": 1547} {"train_loss": -22.813329696655273, "global_step": 128410, "epoch": 1547} {"train_loss": -22.846738815307617, "global_step": 128411, "epoch": 1547} {"train_loss": -22.856279373168945, "global_step": 128412, "epoch": 1547} {"train_loss": -22.735071182250977, "global_step": 128413, "epoch": 1547} {"train_loss": -22.667007446289062, "global_step": 128414, "epoch": 1547} {"train_loss": -22.677953720092773, "global_step": 128415, "epoch": 1547} {"train_loss": -22.567731857299805, "global_step": 128416, "epoch": 1547} {"train_loss": -22.311315536499023, "global_step": 128417, "epoch": 1547} {"train_loss": -22.744998931884766, "global_step": 128418, "epoch": 1547} {"train_loss": -22.8289737701416, "global_step": 128419, "epoch": 1547} {"train_loss": -22.3586368560791, "global_step": 128420, "epoch": 1547} {"train_loss": -22.82342529296875, "global_step": 128421, "epoch": 1547} {"train_loss": -22.875965118408203, "global_step": 128422, "epoch": 1547} {"train_loss": -22.838409423828125, "global_step": 128423, "epoch": 1547} {"train_loss": -22.551639556884766, "global_step": 128424, "epoch": 1547} {"train_loss": -23.097925186157227, "global_step": 128425, "epoch": 1547} {"train_loss": -22.64858627319336, "global_step": 128426, "epoch": 1547} {"train_loss": -22.791934967041016, "global_step": 128427, "epoch": 1547} {"train_loss": -22.40736198425293, "global_step": 128428, "epoch": 1547} {"train_loss": -22.93765640258789, "global_step": 128429, "epoch": 1547} {"train_loss": -22.49527359008789, "global_step": 128430, "epoch": 1547} {"train_loss": -22.884510040283203, "global_step": 128431, "epoch": 1547} {"train_loss": -22.880239486694336, "global_step": 128432, "epoch": 1547} {"train_loss": -22.59547233581543, "global_step": 128433, "epoch": 1547} {"train_loss": -22.70741844177246, "global_step": 128434, "epoch": 1547} {"train_loss": -22.82570457458496, "global_step": 128435, "epoch": 1547} {"train_loss": -22.932931900024414, "global_step": 128436, "epoch": 1547} {"train_loss": -23.10595703125, "global_step": 128437, "epoch": 1547} {"train_loss": -22.69663429260254, "global_step": 128438, "epoch": 1547} {"train_loss": -22.764741897583008, "global_step": 128439, "epoch": 1547} {"train_loss": -22.62530517578125, "global_step": 128440, "epoch": 1547} {"train_loss": -22.860645294189453, "global_step": 128441, "epoch": 1547} {"train_loss": -22.80621910095215, "global_step": 128442, "epoch": 1547} {"train_loss": -22.756948471069336, "global_step": 128443, "epoch": 1547} {"train_loss": -22.9029541015625, "global_step": 128444, "epoch": 1547} {"train_loss": -22.849191665649414, "global_step": 128445, "epoch": 1547} {"train_loss": -22.696130752563477, "global_step": 128446, "epoch": 1547} {"train_loss": -22.824996948242188, "global_step": 128447, "epoch": 1547} {"train_loss": -22.742380142211914, "global_step": 128448, "epoch": 1547} {"train_loss": -22.78403663635254, "global_step": 128449, "epoch": 1547} {"train_loss": -22.643033981323242, "global_step": 128450, "epoch": 1547} {"train_loss": -22.71766471862793, "global_step": 128451, "epoch": 1547} {"train_loss": -22.75615882873535, "global_step": 128452, "epoch": 1547} {"train_loss": -22.82423210144043, "global_step": 128453, "epoch": 1547} {"train_loss": -22.788471221923828, "global_step": 128454, "epoch": 1547} {"train_loss": -22.642642974853516, "global_step": 128455, "epoch": 1547} {"train_loss": -22.803674697875977, "global_step": 128456, "epoch": 1547} {"train_loss": -22.77377700805664, "global_step": 128457, "epoch": 1547} {"train_loss": -22.957029342651367, "global_step": 128458, "epoch": 1547} {"train_loss": -22.70285415649414, "global_step": 128459, "epoch": 1547} {"train_loss": -22.67275047302246, "global_step": 128460, "epoch": 1547} {"train_loss": -22.668745040893555, "global_step": 128461, "epoch": 1547} {"train_loss": -23.022043228149414, "global_step": 128462, "epoch": 1547} {"train_loss": -22.881967544555664, "global_step": 128463, "epoch": 1547} {"train_loss": -22.877113342285156, "global_step": 128464, "epoch": 1547} {"train_loss": -22.61256217956543, "global_step": 128465, "epoch": 1547} {"train_loss": -22.675514221191406, "global_step": 128466, "epoch": 1547} {"train_loss": -23.051040649414062, "global_step": 128467, "epoch": 1547} {"train_loss": -23.266586303710938, "global_step": 128468, "epoch": 1547} {"train_loss": -22.49192237854004, "global_step": 128469, "epoch": 1547} {"train_loss": -22.710134506225586, "global_step": 128470, "epoch": 1547} {"train_loss": -22.948383331298828, "global_step": 128471, "epoch": 1547} {"train_loss": -22.916309356689453, "global_step": 128472, "epoch": 1547} {"train_loss": -22.3702449798584, "global_step": 128473, "epoch": 1547} {"train_loss": -22.565298080444336, "global_step": 128474, "epoch": 1547} {"train_loss": -22.97039222717285, "global_step": 128475, "epoch": 1547} {"train_loss": -22.50550079345703, "global_step": 128476, "epoch": 1547} {"train_loss": -22.632902145385742, "global_step": 128477, "epoch": 1547} {"train_loss": -22.824417114257812, "global_step": 128478, "epoch": 1547} {"train_loss": -22.79530143737793, "global_step": 128479, "epoch": 1547} {"train_loss": -22.43749237060547, "global_step": 128480, "epoch": 1547} {"train_loss": -22.587329864501953, "global_step": 128481, "epoch": 1547} {"train_loss": -22.913536071777344, "global_step": 128482, "epoch": 1547} {"train_loss": -22.727189581078218, "global_step": 128483, "epoch": 1547, "val_loss": 6207058.0} {"train_loss": -22.239028930664062, "global_step": 128484, "epoch": 1548} {"train_loss": -22.392276763916016, "global_step": 128485, "epoch": 1548} {"train_loss": -21.945913314819336, "global_step": 128486, "epoch": 1548} {"train_loss": -22.36323356628418, "global_step": 128487, "epoch": 1548} {"train_loss": -22.561323165893555, "global_step": 128488, "epoch": 1548} {"train_loss": -22.50779151916504, "global_step": 128489, "epoch": 1548} {"train_loss": -22.3778076171875, "global_step": 128490, "epoch": 1548} {"train_loss": -22.865854263305664, "global_step": 128491, "epoch": 1548} {"train_loss": -22.594444274902344, "global_step": 128492, "epoch": 1548} {"train_loss": -22.510366439819336, "global_step": 128493, "epoch": 1548} {"train_loss": -22.213214874267578, "global_step": 128494, "epoch": 1548} {"train_loss": -22.564634323120117, "global_step": 128495, "epoch": 1548} {"train_loss": -22.56287956237793, "global_step": 128496, "epoch": 1548} {"train_loss": -22.90655517578125, "global_step": 128497, "epoch": 1548} {"train_loss": -22.529836654663086, "global_step": 128498, "epoch": 1548} {"train_loss": -22.834386825561523, "global_step": 128499, "epoch": 1548} {"train_loss": -22.40045166015625, "global_step": 128500, "epoch": 1548} {"train_loss": -22.802692413330078, "global_step": 128501, "epoch": 1548} {"train_loss": -22.660018920898438, "global_step": 128502, "epoch": 1548} {"train_loss": -22.51266098022461, "global_step": 128503, "epoch": 1548} {"train_loss": -22.818710327148438, "global_step": 128504, "epoch": 1548} {"train_loss": -22.45029067993164, "global_step": 128505, "epoch": 1548} {"train_loss": -23.086132049560547, "global_step": 128506, "epoch": 1548} {"train_loss": -22.98860740661621, "global_step": 128507, "epoch": 1548} {"train_loss": -22.775938034057617, "global_step": 128508, "epoch": 1548} {"train_loss": -22.916919708251953, "global_step": 128509, "epoch": 1548} {"train_loss": -22.800434112548828, "global_step": 128510, "epoch": 1548} {"train_loss": -22.747419357299805, "global_step": 128511, "epoch": 1548} {"train_loss": -22.71270179748535, "global_step": 128512, "epoch": 1548} {"train_loss": -22.856534957885742, "global_step": 128513, "epoch": 1548} {"train_loss": -22.919919967651367, "global_step": 128514, "epoch": 1548} {"train_loss": -22.562685012817383, "global_step": 128515, "epoch": 1548} {"train_loss": -22.888023376464844, "global_step": 128516, "epoch": 1548} {"train_loss": -22.626035690307617, "global_step": 128517, "epoch": 1548} {"train_loss": -22.82098960876465, "global_step": 128518, "epoch": 1548} {"train_loss": -22.771108627319336, "global_step": 128519, "epoch": 1548} {"train_loss": -22.717769622802734, "global_step": 128520, "epoch": 1548} {"train_loss": -22.82069206237793, "global_step": 128521, "epoch": 1548} {"train_loss": -22.81414222717285, "global_step": 128522, "epoch": 1548} {"train_loss": -22.732685089111328, "global_step": 128523, "epoch": 1548} {"train_loss": -22.952911376953125, "global_step": 128524, "epoch": 1548} {"train_loss": -22.74371910095215, "global_step": 128525, "epoch": 1548} {"train_loss": -22.87782859802246, "global_step": 128526, "epoch": 1548} {"train_loss": -22.986482620239258, "global_step": 128527, "epoch": 1548} {"train_loss": -22.91458511352539, "global_step": 128528, "epoch": 1548} {"train_loss": -22.902414321899414, "global_step": 128529, "epoch": 1548} {"train_loss": -22.850051879882812, "global_step": 128530, "epoch": 1548} {"train_loss": -22.76309585571289, "global_step": 128531, "epoch": 1548} {"train_loss": -22.34517478942871, "global_step": 128532, "epoch": 1548} {"train_loss": -22.99483299255371, "global_step": 128533, "epoch": 1548} {"train_loss": -22.456212997436523, "global_step": 128534, "epoch": 1548} {"train_loss": -22.970993041992188, "global_step": 128535, "epoch": 1548} {"train_loss": -22.84189224243164, "global_step": 128536, "epoch": 1548} {"train_loss": -22.894184112548828, "global_step": 128537, "epoch": 1548} {"train_loss": -23.023773193359375, "global_step": 128538, "epoch": 1548} {"train_loss": -23.110937118530273, "global_step": 128539, "epoch": 1548} {"train_loss": -22.87009048461914, "global_step": 128540, "epoch": 1548} {"train_loss": -23.079193115234375, "global_step": 128541, "epoch": 1548} {"train_loss": -22.571231842041016, "global_step": 128542, "epoch": 1548} {"train_loss": -23.116456985473633, "global_step": 128543, "epoch": 1548} {"train_loss": -22.17046546936035, "global_step": 128544, "epoch": 1548} {"train_loss": -22.641740798950195, "global_step": 128545, "epoch": 1548} {"train_loss": -23.039058685302734, "global_step": 128546, "epoch": 1548} {"train_loss": -22.751142501831055, "global_step": 128547, "epoch": 1548} {"train_loss": -22.803787231445312, "global_step": 128548, "epoch": 1548} {"train_loss": -22.49689483642578, "global_step": 128549, "epoch": 1548} {"train_loss": -22.83668327331543, "global_step": 128550, "epoch": 1548} {"train_loss": -22.890989303588867, "global_step": 128551, "epoch": 1548} {"train_loss": -22.49576759338379, "global_step": 128552, "epoch": 1548} {"train_loss": -23.008161544799805, "global_step": 128553, "epoch": 1548} {"train_loss": -22.914371490478516, "global_step": 128554, "epoch": 1548} {"train_loss": -22.581192016601562, "global_step": 128555, "epoch": 1548} {"train_loss": -22.71937370300293, "global_step": 128556, "epoch": 1548} {"train_loss": -22.900659561157227, "global_step": 128557, "epoch": 1548} {"train_loss": -22.93922233581543, "global_step": 128558, "epoch": 1548} {"train_loss": -22.449316024780273, "global_step": 128559, "epoch": 1548} {"train_loss": -22.793445587158203, "global_step": 128560, "epoch": 1548} {"train_loss": -22.763751983642578, "global_step": 128561, "epoch": 1548} {"train_loss": -23.064105987548828, "global_step": 128562, "epoch": 1548} {"train_loss": -22.50025749206543, "global_step": 128563, "epoch": 1548} {"train_loss": -22.906143188476562, "global_step": 128564, "epoch": 1548} {"train_loss": -22.99796485900879, "global_step": 128565, "epoch": 1548} {"train_loss": -22.740759952958808, "global_step": 128566, "epoch": 1548, "val_loss": 6256965.0} {"train_loss": -22.647607803344727, "global_step": 128567, "epoch": 1549} {"train_loss": -21.934175491333008, "global_step": 128568, "epoch": 1549} {"train_loss": -21.749435424804688, "global_step": 128569, "epoch": 1549} {"train_loss": -22.272762298583984, "global_step": 128570, "epoch": 1549} {"train_loss": -22.642019271850586, "global_step": 128571, "epoch": 1549} {"train_loss": -22.578739166259766, "global_step": 128572, "epoch": 1549} {"train_loss": -22.6065673828125, "global_step": 128573, "epoch": 1549} {"train_loss": -22.875333786010742, "global_step": 128574, "epoch": 1549} {"train_loss": -22.651142120361328, "global_step": 128575, "epoch": 1549} {"train_loss": -22.46242332458496, "global_step": 128576, "epoch": 1549} {"train_loss": -22.522499084472656, "global_step": 128577, "epoch": 1549} {"train_loss": -22.602840423583984, "global_step": 128578, "epoch": 1549} {"train_loss": -22.90696144104004, "global_step": 128579, "epoch": 1549} {"train_loss": -22.80303382873535, "global_step": 128580, "epoch": 1549} {"train_loss": -22.618209838867188, "global_step": 128581, "epoch": 1549} {"train_loss": -22.28167152404785, "global_step": 128582, "epoch": 1549} {"train_loss": -22.708356857299805, "global_step": 128583, "epoch": 1549} {"train_loss": -22.701885223388672, "global_step": 128584, "epoch": 1549} {"train_loss": -22.504560470581055, "global_step": 128585, "epoch": 1549} {"train_loss": -22.630727767944336, "global_step": 128586, "epoch": 1549} {"train_loss": -23.202091217041016, "global_step": 128587, "epoch": 1549} {"train_loss": -22.835983276367188, "global_step": 128588, "epoch": 1549} {"train_loss": -22.560749053955078, "global_step": 128589, "epoch": 1549} {"train_loss": -22.706079483032227, "global_step": 128590, "epoch": 1549} {"train_loss": -22.757553100585938, "global_step": 128591, "epoch": 1549} {"train_loss": -22.773448944091797, "global_step": 128592, "epoch": 1549} {"train_loss": -22.95450782775879, "global_step": 128593, "epoch": 1549} {"train_loss": -22.619932174682617, "global_step": 128594, "epoch": 1549} {"train_loss": -22.74591064453125, "global_step": 128595, "epoch": 1549} {"train_loss": -22.55109977722168, "global_step": 128596, "epoch": 1549} {"train_loss": -22.67891502380371, "global_step": 128597, "epoch": 1549} {"train_loss": -22.579626083374023, "global_step": 128598, "epoch": 1549} {"train_loss": -22.619539260864258, "global_step": 128599, "epoch": 1549} {"train_loss": -23.063467025756836, "global_step": 128600, "epoch": 1549} {"train_loss": -22.438840866088867, "global_step": 128601, "epoch": 1549} {"train_loss": -23.012802124023438, "global_step": 128602, "epoch": 1549} {"train_loss": -22.89286231994629, "global_step": 128603, "epoch": 1549} {"train_loss": -22.555206298828125, "global_step": 128604, "epoch": 1549} {"train_loss": -22.93368911743164, "global_step": 128605, "epoch": 1549} {"train_loss": -22.706506729125977, "global_step": 128606, "epoch": 1549} {"train_loss": -22.972991943359375, "global_step": 128607, "epoch": 1549} {"train_loss": -22.854297637939453, "global_step": 128608, "epoch": 1549} {"train_loss": -22.575258255004883, "global_step": 128609, "epoch": 1549} {"train_loss": -22.860855102539062, "global_step": 128610, "epoch": 1549} {"train_loss": -22.638132095336914, "global_step": 128611, "epoch": 1549} {"train_loss": -23.033031463623047, "global_step": 128612, "epoch": 1549} {"train_loss": -22.935855865478516, "global_step": 128613, "epoch": 1549} {"train_loss": -23.11933708190918, "global_step": 128614, "epoch": 1549} {"train_loss": -23.059988021850586, "global_step": 128615, "epoch": 1549} {"train_loss": -22.981454849243164, "global_step": 128616, "epoch": 1549} {"train_loss": -22.825620651245117, "global_step": 128617, "epoch": 1549} {"train_loss": -22.7563533782959, "global_step": 128618, "epoch": 1549} {"train_loss": -22.368162155151367, "global_step": 128619, "epoch": 1549} {"train_loss": -22.3094482421875, "global_step": 128620, "epoch": 1549} {"train_loss": -22.45592498779297, "global_step": 128621, "epoch": 1549} {"train_loss": -22.871749877929688, "global_step": 128622, "epoch": 1549} {"train_loss": -22.607088088989258, "global_step": 128623, "epoch": 1549} {"train_loss": -22.170047760009766, "global_step": 128624, "epoch": 1549} {"train_loss": -22.764911651611328, "global_step": 128625, "epoch": 1549} {"train_loss": -22.059234619140625, "global_step": 128626, "epoch": 1549} {"train_loss": -22.628385543823242, "global_step": 128627, "epoch": 1549} {"train_loss": -22.60650634765625, "global_step": 128628, "epoch": 1549} {"train_loss": -22.403608322143555, "global_step": 128629, "epoch": 1549} {"train_loss": -22.636310577392578, "global_step": 128630, "epoch": 1549} {"train_loss": -22.87495231628418, "global_step": 128631, "epoch": 1549} {"train_loss": -22.684478759765625, "global_step": 128632, "epoch": 1549} {"train_loss": -22.674474716186523, "global_step": 128633, "epoch": 1549} {"train_loss": -22.708740234375, "global_step": 128634, "epoch": 1549} {"train_loss": -22.60447120666504, "global_step": 128635, "epoch": 1549} {"train_loss": -22.39985466003418, "global_step": 128636, "epoch": 1549} {"train_loss": -22.61809730529785, "global_step": 128637, "epoch": 1549} {"train_loss": -22.34978675842285, "global_step": 128638, "epoch": 1549} {"train_loss": -22.917818069458008, "global_step": 128639, "epoch": 1549} {"train_loss": -22.4434757232666, "global_step": 128640, "epoch": 1549} {"train_loss": -22.733125686645508, "global_step": 128641, "epoch": 1549} {"train_loss": -22.801546096801758, "global_step": 128642, "epoch": 1549} {"train_loss": -23.151670455932617, "global_step": 128643, "epoch": 1549} {"train_loss": -22.57600975036621, "global_step": 128644, "epoch": 1549} {"train_loss": -22.9133358001709, "global_step": 128645, "epoch": 1549} {"train_loss": -22.723087310791016, "global_step": 128646, "epoch": 1549} {"train_loss": -22.87375259399414, "global_step": 128647, "epoch": 1549} {"train_loss": -22.751209259033203, "global_step": 128648, "epoch": 1549} {"train_loss": -22.671943549650262, "global_step": 128649, "epoch": 1549, "val_loss": 6299530.0} {"train_loss": -21.80218505859375, "global_step": 128650, "epoch": 1550} {"train_loss": -22.235132217407227, "global_step": 128651, "epoch": 1550} {"train_loss": -22.3492374420166, "global_step": 128652, "epoch": 1550} {"train_loss": -22.09235191345215, "global_step": 128653, "epoch": 1550} {"train_loss": -22.62091064453125, "global_step": 128654, "epoch": 1550} {"train_loss": -22.491897583007812, "global_step": 128655, "epoch": 1550} {"train_loss": -22.62471580505371, "global_step": 128656, "epoch": 1550} {"train_loss": -22.74053955078125, "global_step": 128657, "epoch": 1550} {"train_loss": -22.309661865234375, "global_step": 128658, "epoch": 1550} {"train_loss": -22.489810943603516, "global_step": 128659, "epoch": 1550} {"train_loss": -22.682077407836914, "global_step": 128660, "epoch": 1550} {"train_loss": -22.238800048828125, "global_step": 128661, "epoch": 1550} {"train_loss": -22.792760848999023, "global_step": 128662, "epoch": 1550} {"train_loss": -22.448867797851562, "global_step": 128663, "epoch": 1550} {"train_loss": -22.549474716186523, "global_step": 128664, "epoch": 1550} {"train_loss": -22.332937240600586, "global_step": 128665, "epoch": 1550} {"train_loss": -22.618804931640625, "global_step": 128666, "epoch": 1550} {"train_loss": -22.570133209228516, "global_step": 128667, "epoch": 1550} {"train_loss": -22.54072380065918, "global_step": 128668, "epoch": 1550} {"train_loss": -22.591672897338867, "global_step": 128669, "epoch": 1550} {"train_loss": -22.20049285888672, "global_step": 128670, "epoch": 1550} {"train_loss": -22.437726974487305, "global_step": 128671, "epoch": 1550} {"train_loss": -22.579635620117188, "global_step": 128672, "epoch": 1550} {"train_loss": -22.5863037109375, "global_step": 128673, "epoch": 1550} {"train_loss": -22.971647262573242, "global_step": 128674, "epoch": 1550} {"train_loss": -22.588518142700195, "global_step": 128675, "epoch": 1550} {"train_loss": -22.666711807250977, "global_step": 128676, "epoch": 1550} {"train_loss": -22.56220817565918, "global_step": 128677, "epoch": 1550} {"train_loss": -22.57940101623535, "global_step": 128678, "epoch": 1550} {"train_loss": -22.79536247253418, "global_step": 128679, "epoch": 1550} {"train_loss": -22.739179611206055, "global_step": 128680, "epoch": 1550} {"train_loss": -22.664548873901367, "global_step": 128681, "epoch": 1550} {"train_loss": -22.463499069213867, "global_step": 128682, "epoch": 1550} {"train_loss": -22.95148468017578, "global_step": 128683, "epoch": 1550} {"train_loss": -22.831159591674805, "global_step": 128684, "epoch": 1550} {"train_loss": -22.52813148498535, "global_step": 128685, "epoch": 1550} {"train_loss": -22.79828643798828, "global_step": 128686, "epoch": 1550} {"train_loss": -22.51527214050293, "global_step": 128687, "epoch": 1550} {"train_loss": -22.65093994140625, "global_step": 128688, "epoch": 1550} {"train_loss": -22.79908561706543, "global_step": 128689, "epoch": 1550} {"train_loss": -23.026647567749023, "global_step": 128690, "epoch": 1550} {"train_loss": -22.85912322998047, "global_step": 128691, "epoch": 1550} {"train_loss": -22.666513442993164, "global_step": 128692, "epoch": 1550} {"train_loss": -22.820941925048828, "global_step": 128693, "epoch": 1550} {"train_loss": -22.903844833374023, "global_step": 128694, "epoch": 1550} {"train_loss": -22.801177978515625, "global_step": 128695, "epoch": 1550} {"train_loss": -22.528724670410156, "global_step": 128696, "epoch": 1550} {"train_loss": -22.26032829284668, "global_step": 128697, "epoch": 1550} {"train_loss": -22.491779327392578, "global_step": 128698, "epoch": 1550} {"train_loss": -22.308088302612305, "global_step": 128699, "epoch": 1550} {"train_loss": -22.779020309448242, "global_step": 128700, "epoch": 1550} {"train_loss": -22.82484245300293, "global_step": 128701, "epoch": 1550} {"train_loss": -22.497112274169922, "global_step": 128702, "epoch": 1550} {"train_loss": -22.470966339111328, "global_step": 128703, "epoch": 1550} {"train_loss": -22.750686645507812, "global_step": 128704, "epoch": 1550} {"train_loss": -22.86209487915039, "global_step": 128705, "epoch": 1550} {"train_loss": -22.585308074951172, "global_step": 128706, "epoch": 1550} {"train_loss": -22.731199264526367, "global_step": 128707, "epoch": 1550} {"train_loss": -23.030048370361328, "global_step": 128708, "epoch": 1550} {"train_loss": -22.9363956451416, "global_step": 128709, "epoch": 1550} {"train_loss": -23.013925552368164, "global_step": 128710, "epoch": 1550} {"train_loss": -22.890995025634766, "global_step": 128711, "epoch": 1550} {"train_loss": -22.7199764251709, "global_step": 128712, "epoch": 1550} {"train_loss": -22.653141021728516, "global_step": 128713, "epoch": 1550} {"train_loss": -22.816394805908203, "global_step": 128714, "epoch": 1550} {"train_loss": -22.68501091003418, "global_step": 128715, "epoch": 1550} {"train_loss": -22.695634841918945, "global_step": 128716, "epoch": 1550} {"train_loss": -22.371850967407227, "global_step": 128717, "epoch": 1550} {"train_loss": -22.842859268188477, "global_step": 128718, "epoch": 1550} {"train_loss": -22.92511558532715, "global_step": 128719, "epoch": 1550} {"train_loss": -22.970081329345703, "global_step": 128720, "epoch": 1550} {"train_loss": -22.90032958984375, "global_step": 128721, "epoch": 1550} {"train_loss": -22.923999786376953, "global_step": 128722, "epoch": 1550} {"train_loss": -22.67865753173828, "global_step": 128723, "epoch": 1550} {"train_loss": -23.160005569458008, "global_step": 128724, "epoch": 1550} {"train_loss": -22.845720291137695, "global_step": 128725, "epoch": 1550} {"train_loss": -23.107831954956055, "global_step": 128726, "epoch": 1550} {"train_loss": -22.90939712524414, "global_step": 128727, "epoch": 1550} {"train_loss": -22.805137634277344, "global_step": 128728, "epoch": 1550} {"train_loss": -22.567617416381836, "global_step": 128729, "epoch": 1550} {"train_loss": -22.874387741088867, "global_step": 128730, "epoch": 1550} {"train_loss": -22.895042419433594, "global_step": 128731, "epoch": 1550} {"train_loss": -22.67591471844409, "global_step": 128732, "epoch": 1550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6225715.5} {"train_loss": -22.415090560913086, "global_step": 128733, "epoch": 1551} {"train_loss": -22.470638275146484, "global_step": 128734, "epoch": 1551} {"train_loss": -22.785343170166016, "global_step": 128735, "epoch": 1551} {"train_loss": -22.81632423400879, "global_step": 128736, "epoch": 1551} {"train_loss": -22.547590255737305, "global_step": 128737, "epoch": 1551} {"train_loss": -22.383098602294922, "global_step": 128738, "epoch": 1551} {"train_loss": -22.547216415405273, "global_step": 128739, "epoch": 1551} {"train_loss": -22.744340896606445, "global_step": 128740, "epoch": 1551} {"train_loss": -22.802337646484375, "global_step": 128741, "epoch": 1551} {"train_loss": -22.925315856933594, "global_step": 128742, "epoch": 1551} {"train_loss": -22.684995651245117, "global_step": 128743, "epoch": 1551} {"train_loss": -22.957334518432617, "global_step": 128744, "epoch": 1551} {"train_loss": -22.42360496520996, "global_step": 128745, "epoch": 1551} {"train_loss": -22.912912368774414, "global_step": 128746, "epoch": 1551} {"train_loss": -22.94813346862793, "global_step": 128747, "epoch": 1551} {"train_loss": -23.071435928344727, "global_step": 128748, "epoch": 1551} {"train_loss": -22.809249877929688, "global_step": 128749, "epoch": 1551} {"train_loss": -22.272581100463867, "global_step": 128750, "epoch": 1551} {"train_loss": -22.60460090637207, "global_step": 128751, "epoch": 1551} {"train_loss": -22.457387924194336, "global_step": 128752, "epoch": 1551} {"train_loss": -22.420286178588867, "global_step": 128753, "epoch": 1551} {"train_loss": -22.57112693786621, "global_step": 128754, "epoch": 1551} {"train_loss": -22.305694580078125, "global_step": 128755, "epoch": 1551} {"train_loss": -22.316659927368164, "global_step": 128756, "epoch": 1551} {"train_loss": -22.486474990844727, "global_step": 128757, "epoch": 1551} {"train_loss": -22.96773910522461, "global_step": 128758, "epoch": 1551} {"train_loss": -22.64841651916504, "global_step": 128759, "epoch": 1551} {"train_loss": -22.676546096801758, "global_step": 128760, "epoch": 1551} {"train_loss": -22.56476593017578, "global_step": 128761, "epoch": 1551} {"train_loss": -22.560577392578125, "global_step": 128762, "epoch": 1551} {"train_loss": -22.75090980529785, "global_step": 128763, "epoch": 1551} {"train_loss": -22.98753547668457, "global_step": 128764, "epoch": 1551} {"train_loss": -22.54266929626465, "global_step": 128765, "epoch": 1551} {"train_loss": -22.717254638671875, "global_step": 128766, "epoch": 1551} {"train_loss": -22.99368667602539, "global_step": 128767, "epoch": 1551} {"train_loss": -22.826568603515625, "global_step": 128768, "epoch": 1551} {"train_loss": -22.657974243164062, "global_step": 128769, "epoch": 1551} {"train_loss": -23.023832321166992, "global_step": 128770, "epoch": 1551} {"train_loss": -22.99003028869629, "global_step": 128771, "epoch": 1551} {"train_loss": -22.982986450195312, "global_step": 128772, "epoch": 1551} {"train_loss": -22.87001609802246, "global_step": 128773, "epoch": 1551} {"train_loss": -22.801361083984375, "global_step": 128774, "epoch": 1551} {"train_loss": -22.932327270507812, "global_step": 128775, "epoch": 1551} {"train_loss": -23.022716522216797, "global_step": 128776, "epoch": 1551} {"train_loss": -22.8665771484375, "global_step": 128777, "epoch": 1551} {"train_loss": -22.77850914001465, "global_step": 128778, "epoch": 1551} {"train_loss": -22.796716690063477, "global_step": 128779, "epoch": 1551} {"train_loss": -22.745101928710938, "global_step": 128780, "epoch": 1551} {"train_loss": -22.90044403076172, "global_step": 128781, "epoch": 1551} {"train_loss": -22.880739212036133, "global_step": 128782, "epoch": 1551} {"train_loss": -22.856433868408203, "global_step": 128783, "epoch": 1551} {"train_loss": -22.708555221557617, "global_step": 128784, "epoch": 1551} {"train_loss": -22.770261764526367, "global_step": 128785, "epoch": 1551} {"train_loss": -22.711454391479492, "global_step": 128786, "epoch": 1551} {"train_loss": -22.84247398376465, "global_step": 128787, "epoch": 1551} {"train_loss": -22.741804122924805, "global_step": 128788, "epoch": 1551} {"train_loss": -22.725845336914062, "global_step": 128789, "epoch": 1551} {"train_loss": -22.711095809936523, "global_step": 128790, "epoch": 1551} {"train_loss": -22.682371139526367, "global_step": 128791, "epoch": 1551} {"train_loss": -22.66168212890625, "global_step": 128792, "epoch": 1551} {"train_loss": -22.8137264251709, "global_step": 128793, "epoch": 1551} {"train_loss": -22.766889572143555, "global_step": 128794, "epoch": 1551} {"train_loss": -22.958316802978516, "global_step": 128795, "epoch": 1551} {"train_loss": -22.904699325561523, "global_step": 128796, "epoch": 1551} {"train_loss": -23.175678253173828, "global_step": 128797, "epoch": 1551} {"train_loss": -23.035831451416016, "global_step": 128798, "epoch": 1551} {"train_loss": -22.836746215820312, "global_step": 128799, "epoch": 1551} {"train_loss": -22.763988494873047, "global_step": 128800, "epoch": 1551} {"train_loss": -22.849393844604492, "global_step": 128801, "epoch": 1551} {"train_loss": -22.7388858795166, "global_step": 128802, "epoch": 1551} {"train_loss": -22.753019332885742, "global_step": 128803, "epoch": 1551} {"train_loss": -22.956836700439453, "global_step": 128804, "epoch": 1551} {"train_loss": -22.866498947143555, "global_step": 128805, "epoch": 1551} {"train_loss": -22.97257423400879, "global_step": 128806, "epoch": 1551} {"train_loss": -23.152633666992188, "global_step": 128807, "epoch": 1551} {"train_loss": -22.579391479492188, "global_step": 128808, "epoch": 1551} {"train_loss": -23.206451416015625, "global_step": 128809, "epoch": 1551} {"train_loss": -22.639989852905273, "global_step": 128810, "epoch": 1551} {"train_loss": -22.66042137145996, "global_step": 128811, "epoch": 1551} {"train_loss": -22.69719886779785, "global_step": 128812, "epoch": 1551} {"train_loss": -22.972387313842773, "global_step": 128813, "epoch": 1551} {"train_loss": -22.713865280151367, "global_step": 128814, "epoch": 1551} {"train_loss": -22.760961877294335, "global_step": 128815, "epoch": 1551, "val_loss": 6363646.0} {"train_loss": -22.40447998046875, "global_step": 128816, "epoch": 1552} {"train_loss": -21.784711837768555, "global_step": 128817, "epoch": 1552} {"train_loss": -22.321022033691406, "global_step": 128818, "epoch": 1552} {"train_loss": -22.249799728393555, "global_step": 128819, "epoch": 1552} {"train_loss": -22.349016189575195, "global_step": 128820, "epoch": 1552} {"train_loss": -22.197446823120117, "global_step": 128821, "epoch": 1552} {"train_loss": -22.487409591674805, "global_step": 128822, "epoch": 1552} {"train_loss": -22.498327255249023, "global_step": 128823, "epoch": 1552} {"train_loss": -22.89710235595703, "global_step": 128824, "epoch": 1552} {"train_loss": -22.56875991821289, "global_step": 128825, "epoch": 1552} {"train_loss": -22.17279052734375, "global_step": 128826, "epoch": 1552} {"train_loss": -22.487821578979492, "global_step": 128827, "epoch": 1552} {"train_loss": -22.497787475585938, "global_step": 128828, "epoch": 1552} {"train_loss": -22.596120834350586, "global_step": 128829, "epoch": 1552} {"train_loss": -22.414899826049805, "global_step": 128830, "epoch": 1552} {"train_loss": -22.49159812927246, "global_step": 128831, "epoch": 1552} {"train_loss": -22.778959274291992, "global_step": 128832, "epoch": 1552} {"train_loss": -22.380517959594727, "global_step": 128833, "epoch": 1552} {"train_loss": -22.4565486907959, "global_step": 128834, "epoch": 1552} {"train_loss": -22.630582809448242, "global_step": 128835, "epoch": 1552} {"train_loss": -23.252405166625977, "global_step": 128836, "epoch": 1552} {"train_loss": -22.867069244384766, "global_step": 128837, "epoch": 1552} {"train_loss": -23.098514556884766, "global_step": 128838, "epoch": 1552} {"train_loss": -22.632564544677734, "global_step": 128839, "epoch": 1552} {"train_loss": -22.50791358947754, "global_step": 128840, "epoch": 1552} {"train_loss": -23.20096206665039, "global_step": 128841, "epoch": 1552} {"train_loss": -22.67815399169922, "global_step": 128842, "epoch": 1552} {"train_loss": -22.65195083618164, "global_step": 128843, "epoch": 1552} {"train_loss": -22.78181266784668, "global_step": 128844, "epoch": 1552} {"train_loss": -22.496244430541992, "global_step": 128845, "epoch": 1552} {"train_loss": -22.77756690979004, "global_step": 128846, "epoch": 1552} {"train_loss": -22.907318115234375, "global_step": 128847, "epoch": 1552} {"train_loss": -22.626331329345703, "global_step": 128848, "epoch": 1552} {"train_loss": -23.149765014648438, "global_step": 128849, "epoch": 1552} {"train_loss": -22.895349502563477, "global_step": 128850, "epoch": 1552} {"train_loss": -22.923887252807617, "global_step": 128851, "epoch": 1552} {"train_loss": -22.999725341796875, "global_step": 128852, "epoch": 1552} {"train_loss": -22.545146942138672, "global_step": 128853, "epoch": 1552} {"train_loss": -22.794553756713867, "global_step": 128854, "epoch": 1552} {"train_loss": -22.75684928894043, "global_step": 128855, "epoch": 1552} {"train_loss": -22.914745330810547, "global_step": 128856, "epoch": 1552} {"train_loss": -22.848037719726562, "global_step": 128857, "epoch": 1552} {"train_loss": -22.674001693725586, "global_step": 128858, "epoch": 1552} {"train_loss": -22.677047729492188, "global_step": 128859, "epoch": 1552} {"train_loss": -22.871925354003906, "global_step": 128860, "epoch": 1552} {"train_loss": -22.722427368164062, "global_step": 128861, "epoch": 1552} {"train_loss": -22.693973541259766, "global_step": 128862, "epoch": 1552} {"train_loss": -23.090635299682617, "global_step": 128863, "epoch": 1552} {"train_loss": -22.734586715698242, "global_step": 128864, "epoch": 1552} {"train_loss": -22.721590042114258, "global_step": 128865, "epoch": 1552} {"train_loss": -22.461702346801758, "global_step": 128866, "epoch": 1552} {"train_loss": -23.07818603515625, "global_step": 128867, "epoch": 1552} {"train_loss": -22.703977584838867, "global_step": 128868, "epoch": 1552} {"train_loss": -22.78335952758789, "global_step": 128869, "epoch": 1552} {"train_loss": -22.658302307128906, "global_step": 128870, "epoch": 1552} {"train_loss": -22.909099578857422, "global_step": 128871, "epoch": 1552} {"train_loss": -23.368024826049805, "global_step": 128872, "epoch": 1552} {"train_loss": -22.646392822265625, "global_step": 128873, "epoch": 1552} {"train_loss": -22.632862091064453, "global_step": 128874, "epoch": 1552} {"train_loss": -22.961782455444336, "global_step": 128875, "epoch": 1552} {"train_loss": -22.499771118164062, "global_step": 128876, "epoch": 1552} {"train_loss": -22.879207611083984, "global_step": 128877, "epoch": 1552} {"train_loss": -22.623096466064453, "global_step": 128878, "epoch": 1552} {"train_loss": -22.800186157226562, "global_step": 128879, "epoch": 1552} {"train_loss": -22.84977149963379, "global_step": 128880, "epoch": 1552} {"train_loss": -23.151891708374023, "global_step": 128881, "epoch": 1552} {"train_loss": -22.58009147644043, "global_step": 128882, "epoch": 1552} {"train_loss": -23.044260025024414, "global_step": 128883, "epoch": 1552} {"train_loss": -22.939329147338867, "global_step": 128884, "epoch": 1552} {"train_loss": -22.817663192749023, "global_step": 128885, "epoch": 1552} {"train_loss": -22.462926864624023, "global_step": 128886, "epoch": 1552} {"train_loss": -22.326709747314453, "global_step": 128887, "epoch": 1552} {"train_loss": -22.348896026611328, "global_step": 128888, "epoch": 1552} {"train_loss": -22.90251922607422, "global_step": 128889, "epoch": 1552} {"train_loss": -22.318029403686523, "global_step": 128890, "epoch": 1552} {"train_loss": -22.52605438232422, "global_step": 128891, "epoch": 1552} {"train_loss": -22.668621063232422, "global_step": 128892, "epoch": 1552} {"train_loss": -22.44744110107422, "global_step": 128893, "epoch": 1552} {"train_loss": -22.567792892456055, "global_step": 128894, "epoch": 1552} {"train_loss": -22.595829010009766, "global_step": 128895, "epoch": 1552} {"train_loss": -22.61427879333496, "global_step": 128896, "epoch": 1552} {"train_loss": -22.958206176757812, "global_step": 128897, "epoch": 1552} {"train_loss": -22.678382184132037, "global_step": 128898, "epoch": 1552, "val_loss": 6272756.0} {"train_loss": -22.747507095336914, "global_step": 128899, "epoch": 1553} {"train_loss": -22.708206176757812, "global_step": 128900, "epoch": 1553} {"train_loss": -22.632707595825195, "global_step": 128901, "epoch": 1553} {"train_loss": -22.270307540893555, "global_step": 128902, "epoch": 1553} {"train_loss": -22.72378921508789, "global_step": 128903, "epoch": 1553} {"train_loss": -22.42736053466797, "global_step": 128904, "epoch": 1553} {"train_loss": -22.634634017944336, "global_step": 128905, "epoch": 1553} {"train_loss": -22.06007194519043, "global_step": 128906, "epoch": 1553} {"train_loss": -22.57611083984375, "global_step": 128907, "epoch": 1553} {"train_loss": -22.385343551635742, "global_step": 128908, "epoch": 1553} {"train_loss": -22.56038475036621, "global_step": 128909, "epoch": 1553} {"train_loss": -22.6007137298584, "global_step": 128910, "epoch": 1553} {"train_loss": -22.113370895385742, "global_step": 128911, "epoch": 1553} {"train_loss": -23.077856063842773, "global_step": 128912, "epoch": 1553} {"train_loss": -22.70267677307129, "global_step": 128913, "epoch": 1553} {"train_loss": -23.0861759185791, "global_step": 128914, "epoch": 1553} {"train_loss": -23.130706787109375, "global_step": 128915, "epoch": 1553} {"train_loss": -23.06205177307129, "global_step": 128916, "epoch": 1553} {"train_loss": -22.33001708984375, "global_step": 128917, "epoch": 1553} {"train_loss": -22.629072189331055, "global_step": 128918, "epoch": 1553} {"train_loss": -22.82930564880371, "global_step": 128919, "epoch": 1553} {"train_loss": -22.841367721557617, "global_step": 128920, "epoch": 1553} {"train_loss": -22.68630027770996, "global_step": 128921, "epoch": 1553} {"train_loss": -22.816781997680664, "global_step": 128922, "epoch": 1553} {"train_loss": -22.85401725769043, "global_step": 128923, "epoch": 1553} {"train_loss": -22.591304779052734, "global_step": 128924, "epoch": 1553} {"train_loss": -22.728254318237305, "global_step": 128925, "epoch": 1553} {"train_loss": -22.37543487548828, "global_step": 128926, "epoch": 1553} {"train_loss": -23.075395584106445, "global_step": 128927, "epoch": 1553} {"train_loss": -22.999774932861328, "global_step": 128928, "epoch": 1553} {"train_loss": -22.83838653564453, "global_step": 128929, "epoch": 1553} {"train_loss": -23.0771484375, "global_step": 128930, "epoch": 1553} {"train_loss": -22.552156448364258, "global_step": 128931, "epoch": 1553} {"train_loss": -22.98414421081543, "global_step": 128932, "epoch": 1553} {"train_loss": -22.39534568786621, "global_step": 128933, "epoch": 1553} {"train_loss": -22.746000289916992, "global_step": 128934, "epoch": 1553} {"train_loss": -22.75557518005371, "global_step": 128935, "epoch": 1553} {"train_loss": -22.550907135009766, "global_step": 128936, "epoch": 1553} {"train_loss": -22.9027042388916, "global_step": 128937, "epoch": 1553} {"train_loss": -22.955867767333984, "global_step": 128938, "epoch": 1553} {"train_loss": -22.65079689025879, "global_step": 128939, "epoch": 1553} {"train_loss": -22.68941307067871, "global_step": 128940, "epoch": 1553} {"train_loss": -22.859445571899414, "global_step": 128941, "epoch": 1553} {"train_loss": -23.049875259399414, "global_step": 128942, "epoch": 1553} {"train_loss": -22.549671173095703, "global_step": 128943, "epoch": 1553} {"train_loss": -22.530988693237305, "global_step": 128944, "epoch": 1553} {"train_loss": -22.714176177978516, "global_step": 128945, "epoch": 1553} {"train_loss": -22.722579956054688, "global_step": 128946, "epoch": 1553} {"train_loss": -22.76587677001953, "global_step": 128947, "epoch": 1553} {"train_loss": -22.356229782104492, "global_step": 128948, "epoch": 1553} {"train_loss": -22.472726821899414, "global_step": 128949, "epoch": 1553} {"train_loss": -22.6713809967041, "global_step": 128950, "epoch": 1553} {"train_loss": -22.64678382873535, "global_step": 128951, "epoch": 1553} {"train_loss": -22.56226921081543, "global_step": 128952, "epoch": 1553} {"train_loss": -22.69782829284668, "global_step": 128953, "epoch": 1553} {"train_loss": -22.728057861328125, "global_step": 128954, "epoch": 1553} {"train_loss": -22.45401954650879, "global_step": 128955, "epoch": 1553} {"train_loss": -22.622913360595703, "global_step": 128956, "epoch": 1553} {"train_loss": -22.67652702331543, "global_step": 128957, "epoch": 1553} {"train_loss": -22.726133346557617, "global_step": 128958, "epoch": 1553} {"train_loss": -22.782779693603516, "global_step": 128959, "epoch": 1553} {"train_loss": -22.815223693847656, "global_step": 128960, "epoch": 1553} {"train_loss": -22.509265899658203, "global_step": 128961, "epoch": 1553} {"train_loss": -22.817642211914062, "global_step": 128962, "epoch": 1553} {"train_loss": -22.70379066467285, "global_step": 128963, "epoch": 1553} {"train_loss": -22.869958877563477, "global_step": 128964, "epoch": 1553} {"train_loss": -22.554513931274414, "global_step": 128965, "epoch": 1553} {"train_loss": -22.999340057373047, "global_step": 128966, "epoch": 1553} {"train_loss": -23.00328826904297, "global_step": 128967, "epoch": 1553} {"train_loss": -22.905044555664062, "global_step": 128968, "epoch": 1553} {"train_loss": -23.032459259033203, "global_step": 128969, "epoch": 1553} {"train_loss": -22.563039779663086, "global_step": 128970, "epoch": 1553} {"train_loss": -23.05582046508789, "global_step": 128971, "epoch": 1553} {"train_loss": -22.596349716186523, "global_step": 128972, "epoch": 1553} {"train_loss": -22.53562355041504, "global_step": 128973, "epoch": 1553} {"train_loss": -22.76571273803711, "global_step": 128974, "epoch": 1553} {"train_loss": -22.760818481445312, "global_step": 128975, "epoch": 1553} {"train_loss": -22.59305763244629, "global_step": 128976, "epoch": 1553} {"train_loss": -22.99818992614746, "global_step": 128977, "epoch": 1553} {"train_loss": -22.810705184936523, "global_step": 128978, "epoch": 1553} {"train_loss": -22.59859275817871, "global_step": 128979, "epoch": 1553} {"train_loss": -23.306129455566406, "global_step": 128980, "epoch": 1553} {"train_loss": -22.70952378698142, "global_step": 128981, "epoch": 1553, "val_loss": 6265573.0} {"train_loss": -22.707212448120117, "global_step": 128982, "epoch": 1554} {"train_loss": -22.444448471069336, "global_step": 128983, "epoch": 1554} {"train_loss": -22.81551170349121, "global_step": 128984, "epoch": 1554} {"train_loss": -22.802160263061523, "global_step": 128985, "epoch": 1554} {"train_loss": -22.646499633789062, "global_step": 128986, "epoch": 1554} {"train_loss": -22.803817749023438, "global_step": 128987, "epoch": 1554} {"train_loss": -22.942344665527344, "global_step": 128988, "epoch": 1554} {"train_loss": -22.886564254760742, "global_step": 128989, "epoch": 1554} {"train_loss": -22.448606491088867, "global_step": 128990, "epoch": 1554} {"train_loss": -22.46770668029785, "global_step": 128991, "epoch": 1554} {"train_loss": -22.848773956298828, "global_step": 128992, "epoch": 1554} {"train_loss": -22.4725341796875, "global_step": 128993, "epoch": 1554} {"train_loss": -22.904088973999023, "global_step": 128994, "epoch": 1554} {"train_loss": -22.6377010345459, "global_step": 128995, "epoch": 1554} {"train_loss": -22.449302673339844, "global_step": 128996, "epoch": 1554} {"train_loss": -22.27829933166504, "global_step": 128997, "epoch": 1554} {"train_loss": -22.673654556274414, "global_step": 128998, "epoch": 1554} {"train_loss": -22.604415893554688, "global_step": 128999, "epoch": 1554} {"train_loss": -22.519948959350586, "global_step": 129000, "epoch": 1554} {"train_loss": -22.66697120666504, "global_step": 129001, "epoch": 1554} {"train_loss": -22.800617218017578, "global_step": 129002, "epoch": 1554} {"train_loss": -23.08417320251465, "global_step": 129003, "epoch": 1554} {"train_loss": -22.870817184448242, "global_step": 129004, "epoch": 1554} {"train_loss": -22.663944244384766, "global_step": 129005, "epoch": 1554} {"train_loss": -23.127300262451172, "global_step": 129006, "epoch": 1554} {"train_loss": -22.34781265258789, "global_step": 129007, "epoch": 1554} {"train_loss": -22.76584815979004, "global_step": 129008, "epoch": 1554} {"train_loss": -22.641637802124023, "global_step": 129009, "epoch": 1554} {"train_loss": -22.907546997070312, "global_step": 129010, "epoch": 1554} {"train_loss": -22.71836280822754, "global_step": 129011, "epoch": 1554} {"train_loss": -22.91316795349121, "global_step": 129012, "epoch": 1554} {"train_loss": -22.71575164794922, "global_step": 129013, "epoch": 1554} {"train_loss": -22.952001571655273, "global_step": 129014, "epoch": 1554} {"train_loss": -22.999740600585938, "global_step": 129015, "epoch": 1554} {"train_loss": -22.906089782714844, "global_step": 129016, "epoch": 1554} {"train_loss": -23.187841415405273, "global_step": 129017, "epoch": 1554} {"train_loss": -22.994983673095703, "global_step": 129018, "epoch": 1554} {"train_loss": -23.072036743164062, "global_step": 129019, "epoch": 1554} {"train_loss": -22.9403076171875, "global_step": 129020, "epoch": 1554} {"train_loss": -22.578519821166992, "global_step": 129021, "epoch": 1554} {"train_loss": -22.8682861328125, "global_step": 129022, "epoch": 1554} {"train_loss": -22.904388427734375, "global_step": 129023, "epoch": 1554} {"train_loss": -22.77406883239746, "global_step": 129024, "epoch": 1554} {"train_loss": -23.008337020874023, "global_step": 129025, "epoch": 1554} {"train_loss": -22.825422286987305, "global_step": 129026, "epoch": 1554} {"train_loss": -22.608718872070312, "global_step": 129027, "epoch": 1554} {"train_loss": -22.58343505859375, "global_step": 129028, "epoch": 1554} {"train_loss": -22.459875106811523, "global_step": 129029, "epoch": 1554} {"train_loss": -23.04304313659668, "global_step": 129030, "epoch": 1554} {"train_loss": -22.53151512145996, "global_step": 129031, "epoch": 1554} {"train_loss": -22.93197250366211, "global_step": 129032, "epoch": 1554} {"train_loss": -22.591474533081055, "global_step": 129033, "epoch": 1554} {"train_loss": -22.49827766418457, "global_step": 129034, "epoch": 1554} {"train_loss": -22.372541427612305, "global_step": 129035, "epoch": 1554} {"train_loss": -22.533512115478516, "global_step": 129036, "epoch": 1554} {"train_loss": -22.85679054260254, "global_step": 129037, "epoch": 1554} {"train_loss": -22.985292434692383, "global_step": 129038, "epoch": 1554} {"train_loss": -22.949674606323242, "global_step": 129039, "epoch": 1554} {"train_loss": -22.550294876098633, "global_step": 129040, "epoch": 1554} {"train_loss": -23.09246063232422, "global_step": 129041, "epoch": 1554} {"train_loss": -22.993330001831055, "global_step": 129042, "epoch": 1554} {"train_loss": -22.892009735107422, "global_step": 129043, "epoch": 1554} {"train_loss": -22.952577590942383, "global_step": 129044, "epoch": 1554} {"train_loss": -22.713308334350586, "global_step": 129045, "epoch": 1554} {"train_loss": -22.891332626342773, "global_step": 129046, "epoch": 1554} {"train_loss": -23.01706314086914, "global_step": 129047, "epoch": 1554} {"train_loss": -22.603260040283203, "global_step": 129048, "epoch": 1554} {"train_loss": -22.549924850463867, "global_step": 129049, "epoch": 1554} {"train_loss": -22.93873405456543, "global_step": 129050, "epoch": 1554} {"train_loss": -22.802677154541016, "global_step": 129051, "epoch": 1554} {"train_loss": -22.47860336303711, "global_step": 129052, "epoch": 1554} {"train_loss": -22.975934982299805, "global_step": 129053, "epoch": 1554} {"train_loss": -22.869821548461914, "global_step": 129054, "epoch": 1554} {"train_loss": -23.07990074157715, "global_step": 129055, "epoch": 1554} {"train_loss": -22.669347763061523, "global_step": 129056, "epoch": 1554} {"train_loss": -22.396207809448242, "global_step": 129057, "epoch": 1554} {"train_loss": -22.752721786499023, "global_step": 129058, "epoch": 1554} {"train_loss": -22.4645938873291, "global_step": 129059, "epoch": 1554} {"train_loss": -22.80307388305664, "global_step": 129060, "epoch": 1554} {"train_loss": -22.777231216430664, "global_step": 129061, "epoch": 1554} {"train_loss": -22.751935958862305, "global_step": 129062, "epoch": 1554} {"train_loss": -22.607120513916016, "global_step": 129063, "epoch": 1554} {"train_loss": -22.74316286753459, "global_step": 129064, "epoch": 1554, "val_loss": 6249569.5} {"train_loss": -22.3485107421875, "global_step": 129065, "epoch": 1555} {"train_loss": -22.418649673461914, "global_step": 129066, "epoch": 1555} {"train_loss": -22.558584213256836, "global_step": 129067, "epoch": 1555} {"train_loss": -22.791051864624023, "global_step": 129068, "epoch": 1555} {"train_loss": -22.469684600830078, "global_step": 129069, "epoch": 1555} {"train_loss": -22.371475219726562, "global_step": 129070, "epoch": 1555} {"train_loss": -22.52715301513672, "global_step": 129071, "epoch": 1555} {"train_loss": -22.79144287109375, "global_step": 129072, "epoch": 1555} {"train_loss": -22.632070541381836, "global_step": 129073, "epoch": 1555} {"train_loss": -22.17768669128418, "global_step": 129074, "epoch": 1555} {"train_loss": -22.702856063842773, "global_step": 129075, "epoch": 1555} {"train_loss": -22.81294822692871, "global_step": 129076, "epoch": 1555} {"train_loss": -22.571861267089844, "global_step": 129077, "epoch": 1555} {"train_loss": -22.65602684020996, "global_step": 129078, "epoch": 1555} {"train_loss": -22.524625778198242, "global_step": 129079, "epoch": 1555} {"train_loss": -22.620929718017578, "global_step": 129080, "epoch": 1555} {"train_loss": -22.514680862426758, "global_step": 129081, "epoch": 1555} {"train_loss": -22.614364624023438, "global_step": 129082, "epoch": 1555} {"train_loss": -23.05629539489746, "global_step": 129083, "epoch": 1555} {"train_loss": -22.719038009643555, "global_step": 129084, "epoch": 1555} {"train_loss": -22.594314575195312, "global_step": 129085, "epoch": 1555} {"train_loss": -22.56100845336914, "global_step": 129086, "epoch": 1555} {"train_loss": -22.68411636352539, "global_step": 129087, "epoch": 1555} {"train_loss": -22.75147819519043, "global_step": 129088, "epoch": 1555} {"train_loss": -23.00223731994629, "global_step": 129089, "epoch": 1555} {"train_loss": -23.038801193237305, "global_step": 129090, "epoch": 1555} {"train_loss": -22.8731632232666, "global_step": 129091, "epoch": 1555} {"train_loss": -22.783735275268555, "global_step": 129092, "epoch": 1555} {"train_loss": -22.594816207885742, "global_step": 129093, "epoch": 1555} {"train_loss": -22.915170669555664, "global_step": 129094, "epoch": 1555} {"train_loss": -22.715513229370117, "global_step": 129095, "epoch": 1555} {"train_loss": -23.060495376586914, "global_step": 129096, "epoch": 1555} {"train_loss": -22.701528549194336, "global_step": 129097, "epoch": 1555} {"train_loss": -22.847583770751953, "global_step": 129098, "epoch": 1555} {"train_loss": -22.88698387145996, "global_step": 129099, "epoch": 1555} {"train_loss": -22.656280517578125, "global_step": 129100, "epoch": 1555} {"train_loss": -22.23890495300293, "global_step": 129101, "epoch": 1555} {"train_loss": -22.797590255737305, "global_step": 129102, "epoch": 1555} {"train_loss": -22.897937774658203, "global_step": 129103, "epoch": 1555} {"train_loss": -22.707088470458984, "global_step": 129104, "epoch": 1555} {"train_loss": -22.908994674682617, "global_step": 129105, "epoch": 1555} {"train_loss": -22.65675163269043, "global_step": 129106, "epoch": 1555} {"train_loss": -22.680997848510742, "global_step": 129107, "epoch": 1555} {"train_loss": -22.803131103515625, "global_step": 129108, "epoch": 1555} {"train_loss": -22.983091354370117, "global_step": 129109, "epoch": 1555} {"train_loss": -22.997709274291992, "global_step": 129110, "epoch": 1555} {"train_loss": -22.422067642211914, "global_step": 129111, "epoch": 1555} {"train_loss": -22.568933486938477, "global_step": 129112, "epoch": 1555} {"train_loss": -23.14680290222168, "global_step": 129113, "epoch": 1555} {"train_loss": -22.698522567749023, "global_step": 129114, "epoch": 1555} {"train_loss": -22.844987869262695, "global_step": 129115, "epoch": 1555} {"train_loss": -22.997392654418945, "global_step": 129116, "epoch": 1555} {"train_loss": -22.684614181518555, "global_step": 129117, "epoch": 1555} {"train_loss": -22.941574096679688, "global_step": 129118, "epoch": 1555} {"train_loss": -22.81984519958496, "global_step": 129119, "epoch": 1555} {"train_loss": -22.981281280517578, "global_step": 129120, "epoch": 1555} {"train_loss": -23.24285125732422, "global_step": 129121, "epoch": 1555} {"train_loss": -22.91242218017578, "global_step": 129122, "epoch": 1555} {"train_loss": -22.537982940673828, "global_step": 129123, "epoch": 1555} {"train_loss": -22.43762969970703, "global_step": 129124, "epoch": 1555} {"train_loss": -22.768939971923828, "global_step": 129125, "epoch": 1555} {"train_loss": -22.85548210144043, "global_step": 129126, "epoch": 1555} {"train_loss": -22.664392471313477, "global_step": 129127, "epoch": 1555} {"train_loss": -22.94236946105957, "global_step": 129128, "epoch": 1555} {"train_loss": -22.964099884033203, "global_step": 129129, "epoch": 1555} {"train_loss": -22.770652770996094, "global_step": 129130, "epoch": 1555} {"train_loss": -22.89494514465332, "global_step": 129131, "epoch": 1555} {"train_loss": -22.85914421081543, "global_step": 129132, "epoch": 1555} {"train_loss": -22.592266082763672, "global_step": 129133, "epoch": 1555} {"train_loss": -23.010526657104492, "global_step": 129134, "epoch": 1555} {"train_loss": -22.6219539642334, "global_step": 129135, "epoch": 1555} {"train_loss": -23.122421264648438, "global_step": 129136, "epoch": 1555} {"train_loss": -22.706010818481445, "global_step": 129137, "epoch": 1555} {"train_loss": -22.886686325073242, "global_step": 129138, "epoch": 1555} {"train_loss": -22.57834243774414, "global_step": 129139, "epoch": 1555} {"train_loss": -22.79884910583496, "global_step": 129140, "epoch": 1555} {"train_loss": -22.609582901000977, "global_step": 129141, "epoch": 1555} {"train_loss": -22.62180519104004, "global_step": 129142, "epoch": 1555} {"train_loss": -23.20245361328125, "global_step": 129143, "epoch": 1555} {"train_loss": -22.81929588317871, "global_step": 129144, "epoch": 1555} {"train_loss": -22.609155654907227, "global_step": 129145, "epoch": 1555} {"train_loss": -22.993711471557617, "global_step": 129146, "epoch": 1555} {"train_loss": -22.746748476143342, "global_step": 129147, "epoch": 1555, "val_loss": 6228240.0} {"train_loss": -22.704822540283203, "global_step": 129148, "epoch": 1556} {"train_loss": -21.864147186279297, "global_step": 129149, "epoch": 1556} {"train_loss": -22.677549362182617, "global_step": 129150, "epoch": 1556} {"train_loss": -22.637678146362305, "global_step": 129151, "epoch": 1556} {"train_loss": -22.65350914001465, "global_step": 129152, "epoch": 1556} {"train_loss": -22.78768539428711, "global_step": 129153, "epoch": 1556} {"train_loss": -22.234189987182617, "global_step": 129154, "epoch": 1556} {"train_loss": -22.7484130859375, "global_step": 129155, "epoch": 1556} {"train_loss": -22.507471084594727, "global_step": 129156, "epoch": 1556} {"train_loss": -22.532896041870117, "global_step": 129157, "epoch": 1556} {"train_loss": -22.774110794067383, "global_step": 129158, "epoch": 1556} {"train_loss": -22.33330726623535, "global_step": 129159, "epoch": 1556} {"train_loss": -22.555240631103516, "global_step": 129160, "epoch": 1556} {"train_loss": -22.21369171142578, "global_step": 129161, "epoch": 1556} {"train_loss": -22.850881576538086, "global_step": 129162, "epoch": 1556} {"train_loss": -22.801679611206055, "global_step": 129163, "epoch": 1556} {"train_loss": -22.479415893554688, "global_step": 129164, "epoch": 1556} {"train_loss": -22.698957443237305, "global_step": 129165, "epoch": 1556} {"train_loss": -22.45785903930664, "global_step": 129166, "epoch": 1556} {"train_loss": -22.614591598510742, "global_step": 129167, "epoch": 1556} {"train_loss": -22.916996002197266, "global_step": 129168, "epoch": 1556} {"train_loss": -22.92731285095215, "global_step": 129169, "epoch": 1556} {"train_loss": -22.54023551940918, "global_step": 129170, "epoch": 1556} {"train_loss": -23.01519775390625, "global_step": 129171, "epoch": 1556} {"train_loss": -22.801467895507812, "global_step": 129172, "epoch": 1556} {"train_loss": -22.854408264160156, "global_step": 129173, "epoch": 1556} {"train_loss": -22.780973434448242, "global_step": 129174, "epoch": 1556} {"train_loss": -22.710859298706055, "global_step": 129175, "epoch": 1556} {"train_loss": -22.608861923217773, "global_step": 129176, "epoch": 1556} {"train_loss": -22.90155601501465, "global_step": 129177, "epoch": 1556} {"train_loss": -22.68443489074707, "global_step": 129178, "epoch": 1556} {"train_loss": -22.680583953857422, "global_step": 129179, "epoch": 1556} {"train_loss": -22.928314208984375, "global_step": 129180, "epoch": 1556} {"train_loss": -22.923397064208984, "global_step": 129181, "epoch": 1556} {"train_loss": -22.83434295654297, "global_step": 129182, "epoch": 1556} {"train_loss": -22.841575622558594, "global_step": 129183, "epoch": 1556} {"train_loss": -23.19683837890625, "global_step": 129184, "epoch": 1556} {"train_loss": -22.84328269958496, "global_step": 129185, "epoch": 1556} {"train_loss": -23.068771362304688, "global_step": 129186, "epoch": 1556} {"train_loss": -22.967947006225586, "global_step": 129187, "epoch": 1556} {"train_loss": -22.722900390625, "global_step": 129188, "epoch": 1556} {"train_loss": -23.10671043395996, "global_step": 129189, "epoch": 1556} {"train_loss": -22.694551467895508, "global_step": 129190, "epoch": 1556} {"train_loss": -22.5282039642334, "global_step": 129191, "epoch": 1556} {"train_loss": -22.710355758666992, "global_step": 129192, "epoch": 1556} {"train_loss": -22.865488052368164, "global_step": 129193, "epoch": 1556} {"train_loss": -22.69369888305664, "global_step": 129194, "epoch": 1556} {"train_loss": -22.704896926879883, "global_step": 129195, "epoch": 1556} {"train_loss": -22.840866088867188, "global_step": 129196, "epoch": 1556} {"train_loss": -23.013179779052734, "global_step": 129197, "epoch": 1556} {"train_loss": -23.09804344177246, "global_step": 129198, "epoch": 1556} {"train_loss": -22.85687828063965, "global_step": 129199, "epoch": 1556} {"train_loss": -22.601837158203125, "global_step": 129200, "epoch": 1556} {"train_loss": -22.836673736572266, "global_step": 129201, "epoch": 1556} {"train_loss": -22.7056941986084, "global_step": 129202, "epoch": 1556} {"train_loss": -22.717687606811523, "global_step": 129203, "epoch": 1556} {"train_loss": -22.510549545288086, "global_step": 129204, "epoch": 1556} {"train_loss": -22.80282974243164, "global_step": 129205, "epoch": 1556} {"train_loss": -22.56258201599121, "global_step": 129206, "epoch": 1556} {"train_loss": -22.40337562561035, "global_step": 129207, "epoch": 1556} {"train_loss": -22.693660736083984, "global_step": 129208, "epoch": 1556} {"train_loss": -22.53704833984375, "global_step": 129209, "epoch": 1556} {"train_loss": -22.27901840209961, "global_step": 129210, "epoch": 1556} {"train_loss": -22.609663009643555, "global_step": 129211, "epoch": 1556} {"train_loss": -23.228958129882812, "global_step": 129212, "epoch": 1556} {"train_loss": -22.577030181884766, "global_step": 129213, "epoch": 1556} {"train_loss": -22.458837509155273, "global_step": 129214, "epoch": 1556} {"train_loss": -22.776622772216797, "global_step": 129215, "epoch": 1556} {"train_loss": -22.973691940307617, "global_step": 129216, "epoch": 1556} {"train_loss": -23.053125381469727, "global_step": 129217, "epoch": 1556} {"train_loss": -22.703954696655273, "global_step": 129218, "epoch": 1556} {"train_loss": -23.282623291015625, "global_step": 129219, "epoch": 1556} {"train_loss": -22.424814224243164, "global_step": 129220, "epoch": 1556} {"train_loss": -22.780155181884766, "global_step": 129221, "epoch": 1556} {"train_loss": -22.48422622680664, "global_step": 129222, "epoch": 1556} {"train_loss": -22.531797409057617, "global_step": 129223, "epoch": 1556} {"train_loss": -22.36122703552246, "global_step": 129224, "epoch": 1556} {"train_loss": -22.71489143371582, "global_step": 129225, "epoch": 1556} {"train_loss": -22.513864517211914, "global_step": 129226, "epoch": 1556} {"train_loss": -22.36107063293457, "global_step": 129227, "epoch": 1556} {"train_loss": -22.56365966796875, "global_step": 129228, "epoch": 1556} {"train_loss": -22.934762954711914, "global_step": 129229, "epoch": 1556} {"train_loss": -22.710963651358362, "global_step": 129230, "epoch": 1556, "val_loss": 6298257.0} {"train_loss": -22.38663673400879, "global_step": 129231, "epoch": 1557} {"train_loss": -22.577428817749023, "global_step": 129232, "epoch": 1557} {"train_loss": -22.29831886291504, "global_step": 129233, "epoch": 1557} {"train_loss": -22.458433151245117, "global_step": 129234, "epoch": 1557} {"train_loss": -22.55126953125, "global_step": 129235, "epoch": 1557} {"train_loss": -22.1396427154541, "global_step": 129236, "epoch": 1557} {"train_loss": -22.409753799438477, "global_step": 129237, "epoch": 1557} {"train_loss": -22.513254165649414, "global_step": 129238, "epoch": 1557} {"train_loss": -22.804641723632812, "global_step": 129239, "epoch": 1557} {"train_loss": -22.423702239990234, "global_step": 129240, "epoch": 1557} {"train_loss": -22.706649780273438, "global_step": 129241, "epoch": 1557} {"train_loss": -22.296001434326172, "global_step": 129242, "epoch": 1557} {"train_loss": -22.51595115661621, "global_step": 129243, "epoch": 1557} {"train_loss": -22.39605712890625, "global_step": 129244, "epoch": 1557} {"train_loss": -22.567935943603516, "global_step": 129245, "epoch": 1557} {"train_loss": -22.71863555908203, "global_step": 129246, "epoch": 1557} {"train_loss": -22.722753524780273, "global_step": 129247, "epoch": 1557} {"train_loss": -23.019948959350586, "global_step": 129248, "epoch": 1557} {"train_loss": -22.591169357299805, "global_step": 129249, "epoch": 1557} {"train_loss": -22.897233963012695, "global_step": 129250, "epoch": 1557} {"train_loss": -22.662710189819336, "global_step": 129251, "epoch": 1557} {"train_loss": -22.838682174682617, "global_step": 129252, "epoch": 1557} {"train_loss": -23.048105239868164, "global_step": 129253, "epoch": 1557} {"train_loss": -22.676645278930664, "global_step": 129254, "epoch": 1557} {"train_loss": -22.654542922973633, "global_step": 129255, "epoch": 1557} {"train_loss": -22.901735305786133, "global_step": 129256, "epoch": 1557} {"train_loss": -22.335023880004883, "global_step": 129257, "epoch": 1557} {"train_loss": -22.208635330200195, "global_step": 129258, "epoch": 1557} {"train_loss": -22.679996490478516, "global_step": 129259, "epoch": 1557} {"train_loss": -22.990568161010742, "global_step": 129260, "epoch": 1557} {"train_loss": -22.86225700378418, "global_step": 129261, "epoch": 1557} {"train_loss": -22.9830379486084, "global_step": 129262, "epoch": 1557} {"train_loss": -22.99519157409668, "global_step": 129263, "epoch": 1557} {"train_loss": -22.73508644104004, "global_step": 129264, "epoch": 1557} {"train_loss": -22.78545570373535, "global_step": 129265, "epoch": 1557} {"train_loss": -23.14090919494629, "global_step": 129266, "epoch": 1557} {"train_loss": -22.946752548217773, "global_step": 129267, "epoch": 1557} {"train_loss": -23.116296768188477, "global_step": 129268, "epoch": 1557} {"train_loss": -23.16590690612793, "global_step": 129269, "epoch": 1557} {"train_loss": -22.852203369140625, "global_step": 129270, "epoch": 1557} {"train_loss": -23.054174423217773, "global_step": 129271, "epoch": 1557} {"train_loss": -22.688024520874023, "global_step": 129272, "epoch": 1557} {"train_loss": -22.87605857849121, "global_step": 129273, "epoch": 1557} {"train_loss": -22.93827247619629, "global_step": 129274, "epoch": 1557} {"train_loss": -22.8708438873291, "global_step": 129275, "epoch": 1557} {"train_loss": -22.779104232788086, "global_step": 129276, "epoch": 1557} {"train_loss": -22.683019638061523, "global_step": 129277, "epoch": 1557} {"train_loss": -22.93561553955078, "global_step": 129278, "epoch": 1557} {"train_loss": -22.773456573486328, "global_step": 129279, "epoch": 1557} {"train_loss": -23.023935317993164, "global_step": 129280, "epoch": 1557} {"train_loss": -22.65610122680664, "global_step": 129281, "epoch": 1557} {"train_loss": -22.87297821044922, "global_step": 129282, "epoch": 1557} {"train_loss": -22.74629020690918, "global_step": 129283, "epoch": 1557} {"train_loss": -22.97159194946289, "global_step": 129284, "epoch": 1557} {"train_loss": -22.89478874206543, "global_step": 129285, "epoch": 1557} {"train_loss": -22.650876998901367, "global_step": 129286, "epoch": 1557} {"train_loss": -22.510269165039062, "global_step": 129287, "epoch": 1557} {"train_loss": -22.58422088623047, "global_step": 129288, "epoch": 1557} {"train_loss": -22.641706466674805, "global_step": 129289, "epoch": 1557} {"train_loss": -22.905277252197266, "global_step": 129290, "epoch": 1557} {"train_loss": -22.7744197845459, "global_step": 129291, "epoch": 1557} {"train_loss": -22.516496658325195, "global_step": 129292, "epoch": 1557} {"train_loss": -23.093408584594727, "global_step": 129293, "epoch": 1557} {"train_loss": -22.82733726501465, "global_step": 129294, "epoch": 1557} {"train_loss": -22.856355667114258, "global_step": 129295, "epoch": 1557} {"train_loss": -23.03079605102539, "global_step": 129296, "epoch": 1557} {"train_loss": -22.695541381835938, "global_step": 129297, "epoch": 1557} {"train_loss": -22.685850143432617, "global_step": 129298, "epoch": 1557} {"train_loss": -22.569725036621094, "global_step": 129299, "epoch": 1557} {"train_loss": -22.047876358032227, "global_step": 129300, "epoch": 1557} {"train_loss": -23.064464569091797, "global_step": 129301, "epoch": 1557} {"train_loss": -22.437450408935547, "global_step": 129302, "epoch": 1557} {"train_loss": -22.363807678222656, "global_step": 129303, "epoch": 1557} {"train_loss": -22.908466339111328, "global_step": 129304, "epoch": 1557} {"train_loss": -22.826736450195312, "global_step": 129305, "epoch": 1557} {"train_loss": -23.0131893157959, "global_step": 129306, "epoch": 1557} {"train_loss": -22.80451011657715, "global_step": 129307, "epoch": 1557} {"train_loss": -23.07701301574707, "global_step": 129308, "epoch": 1557} {"train_loss": -22.90292739868164, "global_step": 129309, "epoch": 1557} {"train_loss": -22.7187557220459, "global_step": 129310, "epoch": 1557} {"train_loss": -22.766408920288086, "global_step": 129311, "epoch": 1557} {"train_loss": -22.855497360229492, "global_step": 129312, "epoch": 1557} {"train_loss": -22.730455950082067, "global_step": 129313, "epoch": 1557, "val_loss": 6201455.0} {"train_loss": -22.66938591003418, "global_step": 129314, "epoch": 1558} {"train_loss": -21.908628463745117, "global_step": 129315, "epoch": 1558} {"train_loss": -22.941123962402344, "global_step": 129316, "epoch": 1558} {"train_loss": -22.20516014099121, "global_step": 129317, "epoch": 1558} {"train_loss": -22.447568893432617, "global_step": 129318, "epoch": 1558} {"train_loss": -22.834089279174805, "global_step": 129319, "epoch": 1558} {"train_loss": -22.384254455566406, "global_step": 129320, "epoch": 1558} {"train_loss": -22.248388290405273, "global_step": 129321, "epoch": 1558} {"train_loss": -22.587331771850586, "global_step": 129322, "epoch": 1558} {"train_loss": -22.716367721557617, "global_step": 129323, "epoch": 1558} {"train_loss": -22.835803985595703, "global_step": 129324, "epoch": 1558} {"train_loss": -22.221296310424805, "global_step": 129325, "epoch": 1558} {"train_loss": -22.079666137695312, "global_step": 129326, "epoch": 1558} {"train_loss": -22.633390426635742, "global_step": 129327, "epoch": 1558} {"train_loss": -21.994873046875, "global_step": 129328, "epoch": 1558} {"train_loss": -22.85687828063965, "global_step": 129329, "epoch": 1558} {"train_loss": -22.320154190063477, "global_step": 129330, "epoch": 1558} {"train_loss": -22.323726654052734, "global_step": 129331, "epoch": 1558} {"train_loss": -22.928449630737305, "global_step": 129332, "epoch": 1558} {"train_loss": -22.789785385131836, "global_step": 129333, "epoch": 1558} {"train_loss": -22.741352081298828, "global_step": 129334, "epoch": 1558} {"train_loss": -22.502933502197266, "global_step": 129335, "epoch": 1558} {"train_loss": -23.025039672851562, "global_step": 129336, "epoch": 1558} {"train_loss": -22.724781036376953, "global_step": 129337, "epoch": 1558} {"train_loss": -22.719640731811523, "global_step": 129338, "epoch": 1558} {"train_loss": -22.251720428466797, "global_step": 129339, "epoch": 1558} {"train_loss": -22.61297607421875, "global_step": 129340, "epoch": 1558} {"train_loss": -22.706823348999023, "global_step": 129341, "epoch": 1558} {"train_loss": -22.967893600463867, "global_step": 129342, "epoch": 1558} {"train_loss": -22.54486846923828, "global_step": 129343, "epoch": 1558} {"train_loss": -22.269865036010742, "global_step": 129344, "epoch": 1558} {"train_loss": -23.081693649291992, "global_step": 129345, "epoch": 1558} {"train_loss": -22.432891845703125, "global_step": 129346, "epoch": 1558} {"train_loss": -22.579587936401367, "global_step": 129347, "epoch": 1558} {"train_loss": -22.833707809448242, "global_step": 129348, "epoch": 1558} {"train_loss": -22.85248374938965, "global_step": 129349, "epoch": 1558} {"train_loss": -22.627391815185547, "global_step": 129350, "epoch": 1558} {"train_loss": -22.996301651000977, "global_step": 129351, "epoch": 1558} {"train_loss": -23.003211975097656, "global_step": 129352, "epoch": 1558} {"train_loss": -22.79538917541504, "global_step": 129353, "epoch": 1558} {"train_loss": -22.505756378173828, "global_step": 129354, "epoch": 1558} {"train_loss": -22.90327262878418, "global_step": 129355, "epoch": 1558} {"train_loss": -23.02933120727539, "global_step": 129356, "epoch": 1558} {"train_loss": -22.710102081298828, "global_step": 129357, "epoch": 1558} {"train_loss": -22.70515251159668, "global_step": 129358, "epoch": 1558} {"train_loss": -23.0574951171875, "global_step": 129359, "epoch": 1558} {"train_loss": -22.92058753967285, "global_step": 129360, "epoch": 1558} {"train_loss": -22.80806541442871, "global_step": 129361, "epoch": 1558} {"train_loss": -22.95845603942871, "global_step": 129362, "epoch": 1558} {"train_loss": -22.9945011138916, "global_step": 129363, "epoch": 1558} {"train_loss": -22.806432723999023, "global_step": 129364, "epoch": 1558} {"train_loss": -23.120878219604492, "global_step": 129365, "epoch": 1558} {"train_loss": -22.863584518432617, "global_step": 129366, "epoch": 1558} {"train_loss": -22.51092529296875, "global_step": 129367, "epoch": 1558} {"train_loss": -22.835464477539062, "global_step": 129368, "epoch": 1558} {"train_loss": -22.862689971923828, "global_step": 129369, "epoch": 1558} {"train_loss": -22.903106689453125, "global_step": 129370, "epoch": 1558} {"train_loss": -22.655996322631836, "global_step": 129371, "epoch": 1558} {"train_loss": -23.081668853759766, "global_step": 129372, "epoch": 1558} {"train_loss": -22.906530380249023, "global_step": 129373, "epoch": 1558} {"train_loss": -22.814170837402344, "global_step": 129374, "epoch": 1558} {"train_loss": -23.065582275390625, "global_step": 129375, "epoch": 1558} {"train_loss": -22.56129264831543, "global_step": 129376, "epoch": 1558} {"train_loss": -22.72777557373047, "global_step": 129377, "epoch": 1558} {"train_loss": -22.871042251586914, "global_step": 129378, "epoch": 1558} {"train_loss": -22.562843322753906, "global_step": 129379, "epoch": 1558} {"train_loss": -22.744430541992188, "global_step": 129380, "epoch": 1558} {"train_loss": -22.856313705444336, "global_step": 129381, "epoch": 1558} {"train_loss": -23.005359649658203, "global_step": 129382, "epoch": 1558} {"train_loss": -22.735492706298828, "global_step": 129383, "epoch": 1558} {"train_loss": -22.85926628112793, "global_step": 129384, "epoch": 1558} {"train_loss": -23.074462890625, "global_step": 129385, "epoch": 1558} {"train_loss": -22.730443954467773, "global_step": 129386, "epoch": 1558} {"train_loss": -22.67762565612793, "global_step": 129387, "epoch": 1558} {"train_loss": -22.36903953552246, "global_step": 129388, "epoch": 1558} {"train_loss": -22.62874412536621, "global_step": 129389, "epoch": 1558} {"train_loss": -22.763263702392578, "global_step": 129390, "epoch": 1558} {"train_loss": -22.330394744873047, "global_step": 129391, "epoch": 1558} {"train_loss": -22.806936264038086, "global_step": 129392, "epoch": 1558} {"train_loss": -22.85053062438965, "global_step": 129393, "epoch": 1558} {"train_loss": -22.343658447265625, "global_step": 129394, "epoch": 1558} {"train_loss": -22.370704650878906, "global_step": 129395, "epoch": 1558} {"train_loss": -22.705022283347255, "global_step": 129396, "epoch": 1558, "val_loss": 6264956.0} {"train_loss": -22.38511085510254, "global_step": 129397, "epoch": 1559} {"train_loss": -22.60994529724121, "global_step": 129398, "epoch": 1559} {"train_loss": -22.729263305664062, "global_step": 129399, "epoch": 1559} {"train_loss": -22.218507766723633, "global_step": 129400, "epoch": 1559} {"train_loss": -22.374849319458008, "global_step": 129401, "epoch": 1559} {"train_loss": -22.302453994750977, "global_step": 129402, "epoch": 1559} {"train_loss": -22.63987922668457, "global_step": 129403, "epoch": 1559} {"train_loss": -22.37152099609375, "global_step": 129404, "epoch": 1559} {"train_loss": -22.608488082885742, "global_step": 129405, "epoch": 1559} {"train_loss": -22.415184020996094, "global_step": 129406, "epoch": 1559} {"train_loss": -22.179224014282227, "global_step": 129407, "epoch": 1559} {"train_loss": -22.37698745727539, "global_step": 129408, "epoch": 1559} {"train_loss": -22.763994216918945, "global_step": 129409, "epoch": 1559} {"train_loss": -22.31989288330078, "global_step": 129410, "epoch": 1559} {"train_loss": -22.948883056640625, "global_step": 129411, "epoch": 1559} {"train_loss": -22.313676834106445, "global_step": 129412, "epoch": 1559} {"train_loss": -22.410873413085938, "global_step": 129413, "epoch": 1559} {"train_loss": -22.888086318969727, "global_step": 129414, "epoch": 1559} {"train_loss": -22.966812133789062, "global_step": 129415, "epoch": 1559} {"train_loss": -22.442956924438477, "global_step": 129416, "epoch": 1559} {"train_loss": -22.7027645111084, "global_step": 129417, "epoch": 1559} {"train_loss": -22.535139083862305, "global_step": 129418, "epoch": 1559} {"train_loss": -22.828317642211914, "global_step": 129419, "epoch": 1559} {"train_loss": -22.723508834838867, "global_step": 129420, "epoch": 1559} {"train_loss": -22.747312545776367, "global_step": 129421, "epoch": 1559} {"train_loss": -22.619184494018555, "global_step": 129422, "epoch": 1559} {"train_loss": -23.33919906616211, "global_step": 129423, "epoch": 1559} {"train_loss": -22.579608917236328, "global_step": 129424, "epoch": 1559} {"train_loss": -22.659549713134766, "global_step": 129425, "epoch": 1559} {"train_loss": -22.80856704711914, "global_step": 129426, "epoch": 1559} {"train_loss": -23.008264541625977, "global_step": 129427, "epoch": 1559} {"train_loss": -22.438318252563477, "global_step": 129428, "epoch": 1559} {"train_loss": -22.604806900024414, "global_step": 129429, "epoch": 1559} {"train_loss": -22.586246490478516, "global_step": 129430, "epoch": 1559} {"train_loss": -22.638935089111328, "global_step": 129431, "epoch": 1559} {"train_loss": -22.42259979248047, "global_step": 129432, "epoch": 1559} {"train_loss": -22.396533966064453, "global_step": 129433, "epoch": 1559} {"train_loss": -22.551223754882812, "global_step": 129434, "epoch": 1559} {"train_loss": -22.64699363708496, "global_step": 129435, "epoch": 1559} {"train_loss": -22.566457748413086, "global_step": 129436, "epoch": 1559} {"train_loss": -22.564163208007812, "global_step": 129437, "epoch": 1559} {"train_loss": -22.958784103393555, "global_step": 129438, "epoch": 1559} {"train_loss": -22.688047409057617, "global_step": 129439, "epoch": 1559} {"train_loss": -22.429723739624023, "global_step": 129440, "epoch": 1559} {"train_loss": -22.573041915893555, "global_step": 129441, "epoch": 1559} {"train_loss": -22.62568473815918, "global_step": 129442, "epoch": 1559} {"train_loss": -22.756357192993164, "global_step": 129443, "epoch": 1559} {"train_loss": -22.73084831237793, "global_step": 129444, "epoch": 1559} {"train_loss": -22.720903396606445, "global_step": 129445, "epoch": 1559} {"train_loss": -22.46790885925293, "global_step": 129446, "epoch": 1559} {"train_loss": -22.8237361907959, "global_step": 129447, "epoch": 1559} {"train_loss": -22.40260124206543, "global_step": 129448, "epoch": 1559} {"train_loss": -22.918676376342773, "global_step": 129449, "epoch": 1559} {"train_loss": -22.633056640625, "global_step": 129450, "epoch": 1559} {"train_loss": -22.66373634338379, "global_step": 129451, "epoch": 1559} {"train_loss": -22.783586502075195, "global_step": 129452, "epoch": 1559} {"train_loss": -22.493072509765625, "global_step": 129453, "epoch": 1559} {"train_loss": -22.5725040435791, "global_step": 129454, "epoch": 1559} {"train_loss": -22.497182846069336, "global_step": 129455, "epoch": 1559} {"train_loss": -22.62103271484375, "global_step": 129456, "epoch": 1559} {"train_loss": -23.14466667175293, "global_step": 129457, "epoch": 1559} {"train_loss": -22.766427993774414, "global_step": 129458, "epoch": 1559} {"train_loss": -22.903799057006836, "global_step": 129459, "epoch": 1559} {"train_loss": -22.82969093322754, "global_step": 129460, "epoch": 1559} {"train_loss": -22.901355743408203, "global_step": 129461, "epoch": 1559} {"train_loss": -22.732879638671875, "global_step": 129462, "epoch": 1559} {"train_loss": -22.607898712158203, "global_step": 129463, "epoch": 1559} {"train_loss": -23.039840698242188, "global_step": 129464, "epoch": 1559} {"train_loss": -22.40280532836914, "global_step": 129465, "epoch": 1559} {"train_loss": -23.04231834411621, "global_step": 129466, "epoch": 1559} {"train_loss": -23.07643699645996, "global_step": 129467, "epoch": 1559} {"train_loss": -22.951078414916992, "global_step": 129468, "epoch": 1559} {"train_loss": -22.59988784790039, "global_step": 129469, "epoch": 1559} {"train_loss": -23.11606788635254, "global_step": 129470, "epoch": 1559} {"train_loss": -22.889753341674805, "global_step": 129471, "epoch": 1559} {"train_loss": -22.686195373535156, "global_step": 129472, "epoch": 1559} {"train_loss": -22.775604248046875, "global_step": 129473, "epoch": 1559} {"train_loss": -22.548131942749023, "global_step": 129474, "epoch": 1559} {"train_loss": -22.83750343322754, "global_step": 129475, "epoch": 1559} {"train_loss": -22.422937393188477, "global_step": 129476, "epoch": 1559} {"train_loss": -22.865476608276367, "global_step": 129477, "epoch": 1559} {"train_loss": -22.955081939697266, "global_step": 129478, "epoch": 1559} {"train_loss": -22.658011356032038, "global_step": 129479, "epoch": 1559, "val_loss": 6233369.0} {"train_loss": -22.586894989013672, "global_step": 129480, "epoch": 1560} {"train_loss": -22.290019989013672, "global_step": 129481, "epoch": 1560} {"train_loss": -21.882389068603516, "global_step": 129482, "epoch": 1560} {"train_loss": -22.80074691772461, "global_step": 129483, "epoch": 1560} {"train_loss": -22.248062133789062, "global_step": 129484, "epoch": 1560} {"train_loss": -22.2237548828125, "global_step": 129485, "epoch": 1560} {"train_loss": -22.506872177124023, "global_step": 129486, "epoch": 1560} {"train_loss": -21.965307235717773, "global_step": 129487, "epoch": 1560} {"train_loss": -22.49212074279785, "global_step": 129488, "epoch": 1560} {"train_loss": -22.24844741821289, "global_step": 129489, "epoch": 1560} {"train_loss": -22.265111923217773, "global_step": 129490, "epoch": 1560} {"train_loss": -22.429580688476562, "global_step": 129491, "epoch": 1560} {"train_loss": -22.03073501586914, "global_step": 129492, "epoch": 1560} {"train_loss": -22.972013473510742, "global_step": 129493, "epoch": 1560} {"train_loss": -22.17092514038086, "global_step": 129494, "epoch": 1560} {"train_loss": -22.686141967773438, "global_step": 129495, "epoch": 1560} {"train_loss": -22.318511962890625, "global_step": 129496, "epoch": 1560} {"train_loss": -22.2376651763916, "global_step": 129497, "epoch": 1560} {"train_loss": -22.641468048095703, "global_step": 129498, "epoch": 1560} {"train_loss": -22.603927612304688, "global_step": 129499, "epoch": 1560} {"train_loss": -22.6393985748291, "global_step": 129500, "epoch": 1560} {"train_loss": -22.318653106689453, "global_step": 129501, "epoch": 1560} {"train_loss": -22.416696548461914, "global_step": 129502, "epoch": 1560} {"train_loss": -22.40828514099121, "global_step": 129503, "epoch": 1560} {"train_loss": -22.810733795166016, "global_step": 129504, "epoch": 1560} {"train_loss": -22.100637435913086, "global_step": 129505, "epoch": 1560} {"train_loss": -22.65205192565918, "global_step": 129506, "epoch": 1560} {"train_loss": -22.788928985595703, "global_step": 129507, "epoch": 1560} {"train_loss": -22.942169189453125, "global_step": 129508, "epoch": 1560} {"train_loss": -22.9083309173584, "global_step": 129509, "epoch": 1560} {"train_loss": -22.690214157104492, "global_step": 129510, "epoch": 1560} {"train_loss": -22.863969802856445, "global_step": 129511, "epoch": 1560} {"train_loss": -22.7205810546875, "global_step": 129512, "epoch": 1560} {"train_loss": -22.983583450317383, "global_step": 129513, "epoch": 1560} {"train_loss": -23.031513214111328, "global_step": 129514, "epoch": 1560} {"train_loss": -22.485137939453125, "global_step": 129515, "epoch": 1560} {"train_loss": -22.87608528137207, "global_step": 129516, "epoch": 1560} {"train_loss": -22.87088966369629, "global_step": 129517, "epoch": 1560} {"train_loss": -22.3012638092041, "global_step": 129518, "epoch": 1560} {"train_loss": -22.95542335510254, "global_step": 129519, "epoch": 1560} {"train_loss": -22.62392234802246, "global_step": 129520, "epoch": 1560} {"train_loss": -23.017135620117188, "global_step": 129521, "epoch": 1560} {"train_loss": -23.125844955444336, "global_step": 129522, "epoch": 1560} {"train_loss": -22.5996150970459, "global_step": 129523, "epoch": 1560} {"train_loss": -22.847854614257812, "global_step": 129524, "epoch": 1560} {"train_loss": -23.18379020690918, "global_step": 129525, "epoch": 1560} {"train_loss": -22.90329360961914, "global_step": 129526, "epoch": 1560} {"train_loss": -22.842374801635742, "global_step": 129527, "epoch": 1560} {"train_loss": -22.891672134399414, "global_step": 129528, "epoch": 1560} {"train_loss": -22.69453239440918, "global_step": 129529, "epoch": 1560} {"train_loss": -22.765182495117188, "global_step": 129530, "epoch": 1560} {"train_loss": -23.031049728393555, "global_step": 129531, "epoch": 1560} {"train_loss": -22.679162979125977, "global_step": 129532, "epoch": 1560} {"train_loss": -22.955577850341797, "global_step": 129533, "epoch": 1560} {"train_loss": -22.637983322143555, "global_step": 129534, "epoch": 1560} {"train_loss": -22.72570037841797, "global_step": 129535, "epoch": 1560} {"train_loss": -22.65971565246582, "global_step": 129536, "epoch": 1560} {"train_loss": -22.851287841796875, "global_step": 129537, "epoch": 1560} {"train_loss": -23.0587100982666, "global_step": 129538, "epoch": 1560} {"train_loss": -22.787076950073242, "global_step": 129539, "epoch": 1560} {"train_loss": -22.835861206054688, "global_step": 129540, "epoch": 1560} {"train_loss": -22.8632755279541, "global_step": 129541, "epoch": 1560} {"train_loss": -22.777915954589844, "global_step": 129542, "epoch": 1560} {"train_loss": -22.923452377319336, "global_step": 129543, "epoch": 1560} {"train_loss": -22.57940673828125, "global_step": 129544, "epoch": 1560} {"train_loss": -22.56355857849121, "global_step": 129545, "epoch": 1560} {"train_loss": -23.054668426513672, "global_step": 129546, "epoch": 1560} {"train_loss": -23.091075897216797, "global_step": 129547, "epoch": 1560} {"train_loss": -22.817564010620117, "global_step": 129548, "epoch": 1560} {"train_loss": -22.832250595092773, "global_step": 129549, "epoch": 1560} {"train_loss": -22.839599609375, "global_step": 129550, "epoch": 1560} {"train_loss": -22.92229652404785, "global_step": 129551, "epoch": 1560} {"train_loss": -22.914697647094727, "global_step": 129552, "epoch": 1560} {"train_loss": -23.082061767578125, "global_step": 129553, "epoch": 1560} {"train_loss": -22.53521156311035, "global_step": 129554, "epoch": 1560} {"train_loss": -22.75472068786621, "global_step": 129555, "epoch": 1560} {"train_loss": -22.598953247070312, "global_step": 129556, "epoch": 1560} {"train_loss": -23.01604461669922, "global_step": 129557, "epoch": 1560} {"train_loss": -22.98695182800293, "global_step": 129558, "epoch": 1560} {"train_loss": -23.175434112548828, "global_step": 129559, "epoch": 1560} {"train_loss": -22.93339729309082, "global_step": 129560, "epoch": 1560} {"train_loss": -22.804208755493164, "global_step": 129561, "epoch": 1560} {"train_loss": -22.70563821907503, "global_step": 129562, "epoch": 1560, "val_loss": 6252252.0} {"train_loss": -20.588483810424805, "global_step": 129563, "epoch": 1561} {"train_loss": -20.284687042236328, "global_step": 129564, "epoch": 1561} {"train_loss": -21.100675582885742, "global_step": 129565, "epoch": 1561} {"train_loss": -21.518360137939453, "global_step": 129566, "epoch": 1561} {"train_loss": -21.127796173095703, "global_step": 129567, "epoch": 1561} {"train_loss": -21.216190338134766, "global_step": 129568, "epoch": 1561} {"train_loss": -21.402446746826172, "global_step": 129569, "epoch": 1561} {"train_loss": -21.826385498046875, "global_step": 129570, "epoch": 1561} {"train_loss": -21.453367233276367, "global_step": 129571, "epoch": 1561} {"train_loss": -21.680551528930664, "global_step": 129572, "epoch": 1561} {"train_loss": -21.724477767944336, "global_step": 129573, "epoch": 1561} {"train_loss": -21.711353302001953, "global_step": 129574, "epoch": 1561} {"train_loss": -22.036344528198242, "global_step": 129575, "epoch": 1561} {"train_loss": -21.944774627685547, "global_step": 129576, "epoch": 1561} {"train_loss": -21.754281997680664, "global_step": 129577, "epoch": 1561} {"train_loss": -21.733646392822266, "global_step": 129578, "epoch": 1561} {"train_loss": -22.23203468322754, "global_step": 129579, "epoch": 1561} {"train_loss": -21.908987045288086, "global_step": 129580, "epoch": 1561} {"train_loss": -21.87748146057129, "global_step": 129581, "epoch": 1561} {"train_loss": -22.157012939453125, "global_step": 129582, "epoch": 1561} {"train_loss": -22.302995681762695, "global_step": 129583, "epoch": 1561} {"train_loss": -22.2955265045166, "global_step": 129584, "epoch": 1561} {"train_loss": -22.5081729888916, "global_step": 129585, "epoch": 1561} {"train_loss": -22.35361099243164, "global_step": 129586, "epoch": 1561} {"train_loss": -22.312721252441406, "global_step": 129587, "epoch": 1561} {"train_loss": -22.095354080200195, "global_step": 129588, "epoch": 1561} {"train_loss": -22.960241317749023, "global_step": 129589, "epoch": 1561} {"train_loss": -22.303287506103516, "global_step": 129590, "epoch": 1561} {"train_loss": -22.588254928588867, "global_step": 129591, "epoch": 1561} {"train_loss": -22.24120330810547, "global_step": 129592, "epoch": 1561} {"train_loss": -22.38828468322754, "global_step": 129593, "epoch": 1561} {"train_loss": -22.165063858032227, "global_step": 129594, "epoch": 1561} {"train_loss": -22.361413955688477, "global_step": 129595, "epoch": 1561} {"train_loss": -22.694141387939453, "global_step": 129596, "epoch": 1561} {"train_loss": -22.65315055847168, "global_step": 129597, "epoch": 1561} {"train_loss": -22.32769775390625, "global_step": 129598, "epoch": 1561} {"train_loss": -22.617935180664062, "global_step": 129599, "epoch": 1561} {"train_loss": -22.571941375732422, "global_step": 129600, "epoch": 1561} {"train_loss": -22.391950607299805, "global_step": 129601, "epoch": 1561} {"train_loss": -22.436445236206055, "global_step": 129602, "epoch": 1561} {"train_loss": -22.63526725769043, "global_step": 129603, "epoch": 1561} {"train_loss": -22.6562557220459, "global_step": 129604, "epoch": 1561} {"train_loss": -22.7427978515625, "global_step": 129605, "epoch": 1561} {"train_loss": -22.316404342651367, "global_step": 129606, "epoch": 1561} {"train_loss": -22.55344581604004, "global_step": 129607, "epoch": 1561} {"train_loss": -23.315921783447266, "global_step": 129608, "epoch": 1561} {"train_loss": -22.341890335083008, "global_step": 129609, "epoch": 1561} {"train_loss": -22.820646286010742, "global_step": 129610, "epoch": 1561} {"train_loss": -22.72629165649414, "global_step": 129611, "epoch": 1561} {"train_loss": -23.030187606811523, "global_step": 129612, "epoch": 1561} {"train_loss": -22.523193359375, "global_step": 129613, "epoch": 1561} {"train_loss": -22.814647674560547, "global_step": 129614, "epoch": 1561} {"train_loss": -22.905393600463867, "global_step": 129615, "epoch": 1561} {"train_loss": -22.77820587158203, "global_step": 129616, "epoch": 1561} {"train_loss": -22.601804733276367, "global_step": 129617, "epoch": 1561} {"train_loss": -22.507593154907227, "global_step": 129618, "epoch": 1561} {"train_loss": -22.766799926757812, "global_step": 129619, "epoch": 1561} {"train_loss": -23.04764747619629, "global_step": 129620, "epoch": 1561} {"train_loss": -22.911935806274414, "global_step": 129621, "epoch": 1561} {"train_loss": -22.612903594970703, "global_step": 129622, "epoch": 1561} {"train_loss": -22.76861000061035, "global_step": 129623, "epoch": 1561} {"train_loss": -22.881397247314453, "global_step": 129624, "epoch": 1561} {"train_loss": -22.535551071166992, "global_step": 129625, "epoch": 1561} {"train_loss": -22.97495460510254, "global_step": 129626, "epoch": 1561} {"train_loss": -22.748783111572266, "global_step": 129627, "epoch": 1561} {"train_loss": -23.14580726623535, "global_step": 129628, "epoch": 1561} {"train_loss": -22.939010620117188, "global_step": 129629, "epoch": 1561} {"train_loss": -23.002843856811523, "global_step": 129630, "epoch": 1561} {"train_loss": -23.15750503540039, "global_step": 129631, "epoch": 1561} {"train_loss": -23.164535522460938, "global_step": 129632, "epoch": 1561} {"train_loss": -23.341506958007812, "global_step": 129633, "epoch": 1561} {"train_loss": -23.042078018188477, "global_step": 129634, "epoch": 1561} {"train_loss": -22.715442657470703, "global_step": 129635, "epoch": 1561} {"train_loss": -22.864171981811523, "global_step": 129636, "epoch": 1561} {"train_loss": -22.837203979492188, "global_step": 129637, "epoch": 1561} {"train_loss": -22.82915687561035, "global_step": 129638, "epoch": 1561} {"train_loss": -22.534189224243164, "global_step": 129639, "epoch": 1561} {"train_loss": -22.8538875579834, "global_step": 129640, "epoch": 1561} {"train_loss": -22.74222183227539, "global_step": 129641, "epoch": 1561} {"train_loss": -22.813888549804688, "global_step": 129642, "epoch": 1561} {"train_loss": -22.957674026489258, "global_step": 129643, "epoch": 1561} {"train_loss": -22.963348388671875, "global_step": 129644, "epoch": 1561} {"train_loss": -22.416655161294592, "global_step": 129645, "epoch": 1561, "val_loss": 6176974.0} {"train_loss": -22.793947219848633, "global_step": 129646, "epoch": 1562} {"train_loss": -22.5804443359375, "global_step": 129647, "epoch": 1562} {"train_loss": -22.48736572265625, "global_step": 129648, "epoch": 1562} {"train_loss": -22.79828643798828, "global_step": 129649, "epoch": 1562} {"train_loss": -22.591474533081055, "global_step": 129650, "epoch": 1562} {"train_loss": -22.88897132873535, "global_step": 129651, "epoch": 1562} {"train_loss": -22.725933074951172, "global_step": 129652, "epoch": 1562} {"train_loss": -22.589513778686523, "global_step": 129653, "epoch": 1562} {"train_loss": -22.392921447753906, "global_step": 129654, "epoch": 1562} {"train_loss": -22.823341369628906, "global_step": 129655, "epoch": 1562} {"train_loss": -22.957996368408203, "global_step": 129656, "epoch": 1562} {"train_loss": -22.251325607299805, "global_step": 129657, "epoch": 1562} {"train_loss": -22.50966453552246, "global_step": 129658, "epoch": 1562} {"train_loss": -22.711959838867188, "global_step": 129659, "epoch": 1562} {"train_loss": -22.32329750061035, "global_step": 129660, "epoch": 1562} {"train_loss": -22.84652328491211, "global_step": 129661, "epoch": 1562} {"train_loss": -22.457626342773438, "global_step": 129662, "epoch": 1562} {"train_loss": -22.57434844970703, "global_step": 129663, "epoch": 1562} {"train_loss": -22.5884952545166, "global_step": 129664, "epoch": 1562} {"train_loss": -22.89723014831543, "global_step": 129665, "epoch": 1562} {"train_loss": -22.58574867248535, "global_step": 129666, "epoch": 1562} {"train_loss": -22.440811157226562, "global_step": 129667, "epoch": 1562} {"train_loss": -22.88985824584961, "global_step": 129668, "epoch": 1562} {"train_loss": -22.640220642089844, "global_step": 129669, "epoch": 1562} {"train_loss": -22.857351303100586, "global_step": 129670, "epoch": 1562} {"train_loss": -22.72494888305664, "global_step": 129671, "epoch": 1562} {"train_loss": -23.002521514892578, "global_step": 129672, "epoch": 1562} {"train_loss": -22.696552276611328, "global_step": 129673, "epoch": 1562} {"train_loss": -22.457120895385742, "global_step": 129674, "epoch": 1562} {"train_loss": -22.675771713256836, "global_step": 129675, "epoch": 1562} {"train_loss": -22.80149269104004, "global_step": 129676, "epoch": 1562} {"train_loss": -22.692581176757812, "global_step": 129677, "epoch": 1562} {"train_loss": -22.535400390625, "global_step": 129678, "epoch": 1562} {"train_loss": -22.853469848632812, "global_step": 129679, "epoch": 1562} {"train_loss": -22.428817749023438, "global_step": 129680, "epoch": 1562} {"train_loss": -22.658658981323242, "global_step": 129681, "epoch": 1562} {"train_loss": -22.7154598236084, "global_step": 129682, "epoch": 1562} {"train_loss": -22.75103759765625, "global_step": 129683, "epoch": 1562} {"train_loss": -22.810232162475586, "global_step": 129684, "epoch": 1562} {"train_loss": -22.65996742248535, "global_step": 129685, "epoch": 1562} {"train_loss": -22.619176864624023, "global_step": 129686, "epoch": 1562} {"train_loss": -22.97587013244629, "global_step": 129687, "epoch": 1562} {"train_loss": -23.226850509643555, "global_step": 129688, "epoch": 1562} {"train_loss": -22.671064376831055, "global_step": 129689, "epoch": 1562} {"train_loss": -22.81608009338379, "global_step": 129690, "epoch": 1562} {"train_loss": -23.10675621032715, "global_step": 129691, "epoch": 1562} {"train_loss": -23.02937126159668, "global_step": 129692, "epoch": 1562} {"train_loss": -23.171722412109375, "global_step": 129693, "epoch": 1562} {"train_loss": -22.919179916381836, "global_step": 129694, "epoch": 1562} {"train_loss": -23.032827377319336, "global_step": 129695, "epoch": 1562} {"train_loss": -22.926069259643555, "global_step": 129696, "epoch": 1562} {"train_loss": -22.901432037353516, "global_step": 129697, "epoch": 1562} {"train_loss": -22.658506393432617, "global_step": 129698, "epoch": 1562} {"train_loss": -22.648828506469727, "global_step": 129699, "epoch": 1562} {"train_loss": -22.588125228881836, "global_step": 129700, "epoch": 1562} {"train_loss": -22.58051109313965, "global_step": 129701, "epoch": 1562} {"train_loss": -22.830936431884766, "global_step": 129702, "epoch": 1562} {"train_loss": -22.855609893798828, "global_step": 129703, "epoch": 1562} {"train_loss": -22.641698837280273, "global_step": 129704, "epoch": 1562} {"train_loss": -22.850805282592773, "global_step": 129705, "epoch": 1562} {"train_loss": -22.46356201171875, "global_step": 129706, "epoch": 1562} {"train_loss": -22.856111526489258, "global_step": 129707, "epoch": 1562} {"train_loss": -22.726472854614258, "global_step": 129708, "epoch": 1562} {"train_loss": -22.628524780273438, "global_step": 129709, "epoch": 1562} {"train_loss": -22.926145553588867, "global_step": 129710, "epoch": 1562} {"train_loss": -23.03055191040039, "global_step": 129711, "epoch": 1562} {"train_loss": -22.801837921142578, "global_step": 129712, "epoch": 1562} {"train_loss": -22.582332611083984, "global_step": 129713, "epoch": 1562} {"train_loss": -22.90825843811035, "global_step": 129714, "epoch": 1562} {"train_loss": -22.69660758972168, "global_step": 129715, "epoch": 1562} {"train_loss": -22.879409790039062, "global_step": 129716, "epoch": 1562} {"train_loss": -23.162277221679688, "global_step": 129717, "epoch": 1562} {"train_loss": -22.892208099365234, "global_step": 129718, "epoch": 1562} {"train_loss": -22.788471221923828, "global_step": 129719, "epoch": 1562} {"train_loss": -23.041473388671875, "global_step": 129720, "epoch": 1562} {"train_loss": -22.677671432495117, "global_step": 129721, "epoch": 1562} {"train_loss": -23.194503784179688, "global_step": 129722, "epoch": 1562} {"train_loss": -22.263051986694336, "global_step": 129723, "epoch": 1562} {"train_loss": -22.724266052246094, "global_step": 129724, "epoch": 1562} {"train_loss": -22.644643783569336, "global_step": 129725, "epoch": 1562} {"train_loss": -22.753387451171875, "global_step": 129726, "epoch": 1562} {"train_loss": -22.64326286315918, "global_step": 129727, "epoch": 1562} {"train_loss": -22.744255180818488, "global_step": 129728, "epoch": 1562, "val_loss": 6343012.0} {"train_loss": -21.246280670166016, "global_step": 129729, "epoch": 1563} {"train_loss": -20.951040267944336, "global_step": 129730, "epoch": 1563} {"train_loss": -22.361230850219727, "global_step": 129731, "epoch": 1563} {"train_loss": -21.521865844726562, "global_step": 129732, "epoch": 1563} {"train_loss": -22.761716842651367, "global_step": 129733, "epoch": 1563} {"train_loss": -21.64668083190918, "global_step": 129734, "epoch": 1563} {"train_loss": -22.082651138305664, "global_step": 129735, "epoch": 1563} {"train_loss": -21.871809005737305, "global_step": 129736, "epoch": 1563} {"train_loss": -22.199268341064453, "global_step": 129737, "epoch": 1563} {"train_loss": -22.360624313354492, "global_step": 129738, "epoch": 1563} {"train_loss": -22.63263702392578, "global_step": 129739, "epoch": 1563} {"train_loss": -22.477510452270508, "global_step": 129740, "epoch": 1563} {"train_loss": -22.698959350585938, "global_step": 129741, "epoch": 1563} {"train_loss": -22.4376163482666, "global_step": 129742, "epoch": 1563} {"train_loss": -22.568178176879883, "global_step": 129743, "epoch": 1563} {"train_loss": -22.25461196899414, "global_step": 129744, "epoch": 1563} {"train_loss": -22.198780059814453, "global_step": 129745, "epoch": 1563} {"train_loss": -22.518651962280273, "global_step": 129746, "epoch": 1563} {"train_loss": -22.35312271118164, "global_step": 129747, "epoch": 1563} {"train_loss": -22.67774772644043, "global_step": 129748, "epoch": 1563} {"train_loss": -22.423791885375977, "global_step": 129749, "epoch": 1563} {"train_loss": -22.83382225036621, "global_step": 129750, "epoch": 1563} {"train_loss": -22.5799560546875, "global_step": 129751, "epoch": 1563} {"train_loss": -23.115524291992188, "global_step": 129752, "epoch": 1563} {"train_loss": -22.788345336914062, "global_step": 129753, "epoch": 1563} {"train_loss": -22.581260681152344, "global_step": 129754, "epoch": 1563} {"train_loss": -22.640100479125977, "global_step": 129755, "epoch": 1563} {"train_loss": -22.847997665405273, "global_step": 129756, "epoch": 1563} {"train_loss": -22.52775764465332, "global_step": 129757, "epoch": 1563} {"train_loss": -22.643735885620117, "global_step": 129758, "epoch": 1563} {"train_loss": -22.837047576904297, "global_step": 129759, "epoch": 1563} {"train_loss": -22.978044509887695, "global_step": 129760, "epoch": 1563} {"train_loss": -22.862751007080078, "global_step": 129761, "epoch": 1563} {"train_loss": -22.6821231842041, "global_step": 129762, "epoch": 1563} {"train_loss": -23.11774444580078, "global_step": 129763, "epoch": 1563} {"train_loss": -22.540817260742188, "global_step": 129764, "epoch": 1563} {"train_loss": -23.207035064697266, "global_step": 129765, "epoch": 1563} {"train_loss": -22.9013729095459, "global_step": 129766, "epoch": 1563} {"train_loss": -23.186315536499023, "global_step": 129767, "epoch": 1563} {"train_loss": -22.868303298950195, "global_step": 129768, "epoch": 1563} {"train_loss": -22.841806411743164, "global_step": 129769, "epoch": 1563} {"train_loss": -22.946836471557617, "global_step": 129770, "epoch": 1563} {"train_loss": -22.734617233276367, "global_step": 129771, "epoch": 1563} {"train_loss": -22.950101852416992, "global_step": 129772, "epoch": 1563} {"train_loss": -23.14701271057129, "global_step": 129773, "epoch": 1563} {"train_loss": -22.468772888183594, "global_step": 129774, "epoch": 1563} {"train_loss": -23.103086471557617, "global_step": 129775, "epoch": 1563} {"train_loss": -22.961196899414062, "global_step": 129776, "epoch": 1563} {"train_loss": -22.961538314819336, "global_step": 129777, "epoch": 1563} {"train_loss": -22.768239974975586, "global_step": 129778, "epoch": 1563} {"train_loss": -22.31479835510254, "global_step": 129779, "epoch": 1563} {"train_loss": -22.820219039916992, "global_step": 129780, "epoch": 1563} {"train_loss": -22.62997817993164, "global_step": 129781, "epoch": 1563} {"train_loss": -22.822933197021484, "global_step": 129782, "epoch": 1563} {"train_loss": -23.01757049560547, "global_step": 129783, "epoch": 1563} {"train_loss": -22.70765495300293, "global_step": 129784, "epoch": 1563} {"train_loss": -23.01779556274414, "global_step": 129785, "epoch": 1563} {"train_loss": -22.807270050048828, "global_step": 129786, "epoch": 1563} {"train_loss": -22.65692710876465, "global_step": 129787, "epoch": 1563} {"train_loss": -22.78446388244629, "global_step": 129788, "epoch": 1563} {"train_loss": -22.96239471435547, "global_step": 129789, "epoch": 1563} {"train_loss": -23.136205673217773, "global_step": 129790, "epoch": 1563} {"train_loss": -22.583229064941406, "global_step": 129791, "epoch": 1563} {"train_loss": -22.91166114807129, "global_step": 129792, "epoch": 1563} {"train_loss": -23.14408302307129, "global_step": 129793, "epoch": 1563} {"train_loss": -22.879213333129883, "global_step": 129794, "epoch": 1563} {"train_loss": -22.657743453979492, "global_step": 129795, "epoch": 1563} {"train_loss": -23.09716796875, "global_step": 129796, "epoch": 1563} {"train_loss": -22.73691749572754, "global_step": 129797, "epoch": 1563} {"train_loss": -22.69167137145996, "global_step": 129798, "epoch": 1563} {"train_loss": -23.01498794555664, "global_step": 129799, "epoch": 1563} {"train_loss": -23.16768455505371, "global_step": 129800, "epoch": 1563} {"train_loss": -23.13469123840332, "global_step": 129801, "epoch": 1563} {"train_loss": -22.843177795410156, "global_step": 129802, "epoch": 1563} {"train_loss": -22.672348022460938, "global_step": 129803, "epoch": 1563} {"train_loss": -22.975934982299805, "global_step": 129804, "epoch": 1563} {"train_loss": -22.752405166625977, "global_step": 129805, "epoch": 1563} {"train_loss": -22.668598175048828, "global_step": 129806, "epoch": 1563} {"train_loss": -23.120817184448242, "global_step": 129807, "epoch": 1563} {"train_loss": -22.90087890625, "global_step": 129808, "epoch": 1563} {"train_loss": -22.988218307495117, "global_step": 129809, "epoch": 1563} {"train_loss": -23.04623794555664, "global_step": 129810, "epoch": 1563} {"train_loss": -22.679409739482832, "global_step": 129811, "epoch": 1563, "val_loss": 6240429.0} {"train_loss": -22.287389755249023, "global_step": 129812, "epoch": 1564} {"train_loss": -22.957345962524414, "global_step": 129813, "epoch": 1564} {"train_loss": -22.078330993652344, "global_step": 129814, "epoch": 1564} {"train_loss": -22.398929595947266, "global_step": 129815, "epoch": 1564} {"train_loss": -22.658863067626953, "global_step": 129816, "epoch": 1564} {"train_loss": -22.2197208404541, "global_step": 129817, "epoch": 1564} {"train_loss": -22.9107666015625, "global_step": 129818, "epoch": 1564} {"train_loss": -22.610671997070312, "global_step": 129819, "epoch": 1564} {"train_loss": -21.974658966064453, "global_step": 129820, "epoch": 1564} {"train_loss": -22.37952423095703, "global_step": 129821, "epoch": 1564} {"train_loss": -22.96356201171875, "global_step": 129822, "epoch": 1564} {"train_loss": -22.60675621032715, "global_step": 129823, "epoch": 1564} {"train_loss": -22.807180404663086, "global_step": 129824, "epoch": 1564} {"train_loss": -23.031139373779297, "global_step": 129825, "epoch": 1564} {"train_loss": -22.73541831970215, "global_step": 129826, "epoch": 1564} {"train_loss": -22.810482025146484, "global_step": 129827, "epoch": 1564} {"train_loss": -22.839519500732422, "global_step": 129828, "epoch": 1564} {"train_loss": -22.521753311157227, "global_step": 129829, "epoch": 1564} {"train_loss": -22.39281463623047, "global_step": 129830, "epoch": 1564} {"train_loss": -22.725629806518555, "global_step": 129831, "epoch": 1564} {"train_loss": -22.79603385925293, "global_step": 129832, "epoch": 1564} {"train_loss": -22.415361404418945, "global_step": 129833, "epoch": 1564} {"train_loss": -23.129776000976562, "global_step": 129834, "epoch": 1564} {"train_loss": -22.8842830657959, "global_step": 129835, "epoch": 1564} {"train_loss": -22.896520614624023, "global_step": 129836, "epoch": 1564} {"train_loss": -22.79874038696289, "global_step": 129837, "epoch": 1564} {"train_loss": -22.84457015991211, "global_step": 129838, "epoch": 1564} {"train_loss": -22.570053100585938, "global_step": 129839, "epoch": 1564} {"train_loss": -23.14681053161621, "global_step": 129840, "epoch": 1564} {"train_loss": -23.03325843811035, "global_step": 129841, "epoch": 1564} {"train_loss": -22.832239151000977, "global_step": 129842, "epoch": 1564} {"train_loss": -22.762121200561523, "global_step": 129843, "epoch": 1564} {"train_loss": -22.690481185913086, "global_step": 129844, "epoch": 1564} {"train_loss": -22.77908706665039, "global_step": 129845, "epoch": 1564} {"train_loss": -22.39013671875, "global_step": 129846, "epoch": 1564} {"train_loss": -22.702594757080078, "global_step": 129847, "epoch": 1564} {"train_loss": -22.73809242248535, "global_step": 129848, "epoch": 1564} {"train_loss": -22.916479110717773, "global_step": 129849, "epoch": 1564} {"train_loss": -23.1660213470459, "global_step": 129850, "epoch": 1564} {"train_loss": -22.613176345825195, "global_step": 129851, "epoch": 1564} {"train_loss": -22.26650047302246, "global_step": 129852, "epoch": 1564} {"train_loss": -22.566207885742188, "global_step": 129853, "epoch": 1564} {"train_loss": -23.025915145874023, "global_step": 129854, "epoch": 1564} {"train_loss": -22.97150993347168, "global_step": 129855, "epoch": 1564} {"train_loss": -22.76470375061035, "global_step": 129856, "epoch": 1564} {"train_loss": -22.658891677856445, "global_step": 129857, "epoch": 1564} {"train_loss": -22.758779525756836, "global_step": 129858, "epoch": 1564} {"train_loss": -23.12146759033203, "global_step": 129859, "epoch": 1564} {"train_loss": -22.977392196655273, "global_step": 129860, "epoch": 1564} {"train_loss": -22.937955856323242, "global_step": 129861, "epoch": 1564} {"train_loss": -22.562604904174805, "global_step": 129862, "epoch": 1564} {"train_loss": -22.899709701538086, "global_step": 129863, "epoch": 1564} {"train_loss": -22.605010986328125, "global_step": 129864, "epoch": 1564} {"train_loss": -22.5546932220459, "global_step": 129865, "epoch": 1564} {"train_loss": -22.735427856445312, "global_step": 129866, "epoch": 1564} {"train_loss": -22.929319381713867, "global_step": 129867, "epoch": 1564} {"train_loss": -22.95250701904297, "global_step": 129868, "epoch": 1564} {"train_loss": -22.607831954956055, "global_step": 129869, "epoch": 1564} {"train_loss": -22.838266372680664, "global_step": 129870, "epoch": 1564} {"train_loss": -22.602537155151367, "global_step": 129871, "epoch": 1564} {"train_loss": -22.840229034423828, "global_step": 129872, "epoch": 1564} {"train_loss": -22.92010498046875, "global_step": 129873, "epoch": 1564} {"train_loss": -22.794382095336914, "global_step": 129874, "epoch": 1564} {"train_loss": -22.6224308013916, "global_step": 129875, "epoch": 1564} {"train_loss": -22.72307777404785, "global_step": 129876, "epoch": 1564} {"train_loss": -23.17691421508789, "global_step": 129877, "epoch": 1564} {"train_loss": -22.797163009643555, "global_step": 129878, "epoch": 1564} {"train_loss": -22.771875381469727, "global_step": 129879, "epoch": 1564} {"train_loss": -22.6473388671875, "global_step": 129880, "epoch": 1564} {"train_loss": -22.445341110229492, "global_step": 129881, "epoch": 1564} {"train_loss": -22.98573112487793, "global_step": 129882, "epoch": 1564} {"train_loss": -22.525304794311523, "global_step": 129883, "epoch": 1564} {"train_loss": -22.902570724487305, "global_step": 129884, "epoch": 1564} {"train_loss": -22.78026008605957, "global_step": 129885, "epoch": 1564} {"train_loss": -23.000293731689453, "global_step": 129886, "epoch": 1564} {"train_loss": -22.417280197143555, "global_step": 129887, "epoch": 1564} {"train_loss": -22.906116485595703, "global_step": 129888, "epoch": 1564} {"train_loss": -22.883386611938477, "global_step": 129889, "epoch": 1564} {"train_loss": -23.21367073059082, "global_step": 129890, "epoch": 1564} {"train_loss": -22.925540924072266, "global_step": 129891, "epoch": 1564} {"train_loss": -22.885183334350586, "global_step": 129892, "epoch": 1564} {"train_loss": -23.05255126953125, "global_step": 129893, "epoch": 1564} {"train_loss": -22.751023533832598, "global_step": 129894, "epoch": 1564, "val_loss": 6206968.5} {"train_loss": -21.8707218170166, "global_step": 129895, "epoch": 1565} {"train_loss": -21.577505111694336, "global_step": 129896, "epoch": 1565} {"train_loss": -21.70233726501465, "global_step": 129897, "epoch": 1565} {"train_loss": -22.401363372802734, "global_step": 129898, "epoch": 1565} {"train_loss": -21.636993408203125, "global_step": 129899, "epoch": 1565} {"train_loss": -22.215850830078125, "global_step": 129900, "epoch": 1565} {"train_loss": -22.58603858947754, "global_step": 129901, "epoch": 1565} {"train_loss": -22.285415649414062, "global_step": 129902, "epoch": 1565} {"train_loss": -22.175256729125977, "global_step": 129903, "epoch": 1565} {"train_loss": -22.37978172302246, "global_step": 129904, "epoch": 1565} {"train_loss": -22.61545753479004, "global_step": 129905, "epoch": 1565} {"train_loss": -22.635610580444336, "global_step": 129906, "epoch": 1565} {"train_loss": -22.333370208740234, "global_step": 129907, "epoch": 1565} {"train_loss": -22.59157371520996, "global_step": 129908, "epoch": 1565} {"train_loss": -22.348419189453125, "global_step": 129909, "epoch": 1565} {"train_loss": -22.73453140258789, "global_step": 129910, "epoch": 1565} {"train_loss": -22.688735961914062, "global_step": 129911, "epoch": 1565} {"train_loss": -22.753158569335938, "global_step": 129912, "epoch": 1565} {"train_loss": -22.361276626586914, "global_step": 129913, "epoch": 1565} {"train_loss": -22.79768943786621, "global_step": 129914, "epoch": 1565} {"train_loss": -22.503808975219727, "global_step": 129915, "epoch": 1565} {"train_loss": -22.718280792236328, "global_step": 129916, "epoch": 1565} {"train_loss": -22.9926700592041, "global_step": 129917, "epoch": 1565} {"train_loss": -23.21336555480957, "global_step": 129918, "epoch": 1565} {"train_loss": -22.608966827392578, "global_step": 129919, "epoch": 1565} {"train_loss": -22.67793846130371, "global_step": 129920, "epoch": 1565} {"train_loss": -22.652145385742188, "global_step": 129921, "epoch": 1565} {"train_loss": -22.622665405273438, "global_step": 129922, "epoch": 1565} {"train_loss": -22.978025436401367, "global_step": 129923, "epoch": 1565} {"train_loss": -22.717763900756836, "global_step": 129924, "epoch": 1565} {"train_loss": -22.731943130493164, "global_step": 129925, "epoch": 1565} {"train_loss": -22.73625373840332, "global_step": 129926, "epoch": 1565} {"train_loss": -23.164926528930664, "global_step": 129927, "epoch": 1565} {"train_loss": -22.75459861755371, "global_step": 129928, "epoch": 1565} {"train_loss": -22.775197982788086, "global_step": 129929, "epoch": 1565} {"train_loss": -22.51786231994629, "global_step": 129930, "epoch": 1565} {"train_loss": -23.076183319091797, "global_step": 129931, "epoch": 1565} {"train_loss": -22.48799705505371, "global_step": 129932, "epoch": 1565} {"train_loss": -22.916549682617188, "global_step": 129933, "epoch": 1565} {"train_loss": -22.958261489868164, "global_step": 129934, "epoch": 1565} {"train_loss": -22.858627319335938, "global_step": 129935, "epoch": 1565} {"train_loss": -23.240161895751953, "global_step": 129936, "epoch": 1565} {"train_loss": -22.495542526245117, "global_step": 129937, "epoch": 1565} {"train_loss": -22.794902801513672, "global_step": 129938, "epoch": 1565} {"train_loss": -22.97523307800293, "global_step": 129939, "epoch": 1565} {"train_loss": -22.537885665893555, "global_step": 129940, "epoch": 1565} {"train_loss": -22.93951416015625, "global_step": 129941, "epoch": 1565} {"train_loss": -22.539533615112305, "global_step": 129942, "epoch": 1565} {"train_loss": -22.839397430419922, "global_step": 129943, "epoch": 1565} {"train_loss": -22.51371955871582, "global_step": 129944, "epoch": 1565} {"train_loss": -22.996686935424805, "global_step": 129945, "epoch": 1565} {"train_loss": -22.562408447265625, "global_step": 129946, "epoch": 1565} {"train_loss": -22.807653427124023, "global_step": 129947, "epoch": 1565} {"train_loss": -22.637609481811523, "global_step": 129948, "epoch": 1565} {"train_loss": -22.857419967651367, "global_step": 129949, "epoch": 1565} {"train_loss": -22.330808639526367, "global_step": 129950, "epoch": 1565} {"train_loss": -22.639537811279297, "global_step": 129951, "epoch": 1565} {"train_loss": -22.220483779907227, "global_step": 129952, "epoch": 1565} {"train_loss": -22.702701568603516, "global_step": 129953, "epoch": 1565} {"train_loss": -22.227806091308594, "global_step": 129954, "epoch": 1565} {"train_loss": -22.27290153503418, "global_step": 129955, "epoch": 1565} {"train_loss": -23.014690399169922, "global_step": 129956, "epoch": 1565} {"train_loss": -22.572490692138672, "global_step": 129957, "epoch": 1565} {"train_loss": -22.217878341674805, "global_step": 129958, "epoch": 1565} {"train_loss": -22.878116607666016, "global_step": 129959, "epoch": 1565} {"train_loss": -22.476057052612305, "global_step": 129960, "epoch": 1565} {"train_loss": -22.52992057800293, "global_step": 129961, "epoch": 1565} {"train_loss": -22.626983642578125, "global_step": 129962, "epoch": 1565} {"train_loss": -22.565765380859375, "global_step": 129963, "epoch": 1565} {"train_loss": -22.871658325195312, "global_step": 129964, "epoch": 1565} {"train_loss": -22.39443588256836, "global_step": 129965, "epoch": 1565} {"train_loss": -22.740068435668945, "global_step": 129966, "epoch": 1565} {"train_loss": -22.78147315979004, "global_step": 129967, "epoch": 1565} {"train_loss": -22.82708740234375, "global_step": 129968, "epoch": 1565} {"train_loss": -22.73665428161621, "global_step": 129969, "epoch": 1565} {"train_loss": -22.965604782104492, "global_step": 129970, "epoch": 1565} {"train_loss": -22.82767677307129, "global_step": 129971, "epoch": 1565} {"train_loss": -22.8465518951416, "global_step": 129972, "epoch": 1565} {"train_loss": -22.4243221282959, "global_step": 129973, "epoch": 1565} {"train_loss": -22.970924377441406, "global_step": 129974, "epoch": 1565} {"train_loss": -22.87265968322754, "global_step": 129975, "epoch": 1565} {"train_loss": -22.336734771728516, "global_step": 129976, "epoch": 1565} {"train_loss": -22.64300020057035, "global_step": 129977, "epoch": 1565, "val_loss": 6276680.0} {"train_loss": -21.847654342651367, "global_step": 129978, "epoch": 1566} {"train_loss": -22.36235809326172, "global_step": 129979, "epoch": 1566} {"train_loss": -22.52045249938965, "global_step": 129980, "epoch": 1566} {"train_loss": -22.30394744873047, "global_step": 129981, "epoch": 1566} {"train_loss": -22.854122161865234, "global_step": 129982, "epoch": 1566} {"train_loss": -22.37173843383789, "global_step": 129983, "epoch": 1566} {"train_loss": -22.63910484313965, "global_step": 129984, "epoch": 1566} {"train_loss": -22.779808044433594, "global_step": 129985, "epoch": 1566} {"train_loss": -22.511377334594727, "global_step": 129986, "epoch": 1566} {"train_loss": -22.708484649658203, "global_step": 129987, "epoch": 1566} {"train_loss": -22.86389923095703, "global_step": 129988, "epoch": 1566} {"train_loss": -22.532583236694336, "global_step": 129989, "epoch": 1566} {"train_loss": -22.468671798706055, "global_step": 129990, "epoch": 1566} {"train_loss": -22.39620018005371, "global_step": 129991, "epoch": 1566} {"train_loss": -22.754669189453125, "global_step": 129992, "epoch": 1566} {"train_loss": -22.715375900268555, "global_step": 129993, "epoch": 1566} {"train_loss": -22.915008544921875, "global_step": 129994, "epoch": 1566} {"train_loss": -22.544118881225586, "global_step": 129995, "epoch": 1566} {"train_loss": -22.679250717163086, "global_step": 129996, "epoch": 1566} {"train_loss": -22.855119705200195, "global_step": 129997, "epoch": 1566} {"train_loss": -22.62404441833496, "global_step": 129998, "epoch": 1566} {"train_loss": -22.6279296875, "global_step": 129999, "epoch": 1566} {"train_loss": -22.98442268371582, "global_step": 130000, "epoch": 1566} {"train_loss": -22.62872886657715, "global_step": 130001, "epoch": 1566} {"train_loss": -22.615468978881836, "global_step": 130002, "epoch": 1566} {"train_loss": -23.065237045288086, "global_step": 130003, "epoch": 1566} {"train_loss": -22.884565353393555, "global_step": 130004, "epoch": 1566} {"train_loss": -22.804203033447266, "global_step": 130005, "epoch": 1566} {"train_loss": -22.488496780395508, "global_step": 130006, "epoch": 1566} {"train_loss": -23.24358558654785, "global_step": 130007, "epoch": 1566} {"train_loss": -22.8587646484375, "global_step": 130008, "epoch": 1566} {"train_loss": -22.452077865600586, "global_step": 130009, "epoch": 1566} {"train_loss": -23.135053634643555, "global_step": 130010, "epoch": 1566} {"train_loss": -22.561796188354492, "global_step": 130011, "epoch": 1566} {"train_loss": -22.98345184326172, "global_step": 130012, "epoch": 1566} {"train_loss": -23.037704467773438, "global_step": 130013, "epoch": 1566} {"train_loss": -22.42752456665039, "global_step": 130014, "epoch": 1566} {"train_loss": -22.94547462463379, "global_step": 130015, "epoch": 1566} {"train_loss": -22.91631317138672, "global_step": 130016, "epoch": 1566} {"train_loss": -22.622970581054688, "global_step": 130017, "epoch": 1566} {"train_loss": -22.654556274414062, "global_step": 130018, "epoch": 1566} {"train_loss": -23.065824508666992, "global_step": 130019, "epoch": 1566} {"train_loss": -23.321393966674805, "global_step": 130020, "epoch": 1566} {"train_loss": -22.856592178344727, "global_step": 130021, "epoch": 1566} {"train_loss": -22.481077194213867, "global_step": 130022, "epoch": 1566} {"train_loss": -22.923175811767578, "global_step": 130023, "epoch": 1566} {"train_loss": -23.190099716186523, "global_step": 130024, "epoch": 1566} {"train_loss": -23.08827781677246, "global_step": 130025, "epoch": 1566} {"train_loss": -23.003684997558594, "global_step": 130026, "epoch": 1566} {"train_loss": -22.95730972290039, "global_step": 130027, "epoch": 1566} {"train_loss": -22.85153579711914, "global_step": 130028, "epoch": 1566} {"train_loss": -22.838104248046875, "global_step": 130029, "epoch": 1566} {"train_loss": -23.138525009155273, "global_step": 130030, "epoch": 1566} {"train_loss": -22.04984474182129, "global_step": 130031, "epoch": 1566} {"train_loss": -23.090986251831055, "global_step": 130032, "epoch": 1566} {"train_loss": -22.830703735351562, "global_step": 130033, "epoch": 1566} {"train_loss": -22.674665451049805, "global_step": 130034, "epoch": 1566} {"train_loss": -22.611560821533203, "global_step": 130035, "epoch": 1566} {"train_loss": -22.899097442626953, "global_step": 130036, "epoch": 1566} {"train_loss": -22.90875816345215, "global_step": 130037, "epoch": 1566} {"train_loss": -23.15945053100586, "global_step": 130038, "epoch": 1566} {"train_loss": -22.800073623657227, "global_step": 130039, "epoch": 1566} {"train_loss": -22.621328353881836, "global_step": 130040, "epoch": 1566} {"train_loss": -22.82943344116211, "global_step": 130041, "epoch": 1566} {"train_loss": -22.47675132751465, "global_step": 130042, "epoch": 1566} {"train_loss": -23.20868492126465, "global_step": 130043, "epoch": 1566} {"train_loss": -22.74806785583496, "global_step": 130044, "epoch": 1566} {"train_loss": -22.92683982849121, "global_step": 130045, "epoch": 1566} {"train_loss": -22.714435577392578, "global_step": 130046, "epoch": 1566} {"train_loss": -22.68438720703125, "global_step": 130047, "epoch": 1566} {"train_loss": -22.971654891967773, "global_step": 130048, "epoch": 1566} {"train_loss": -22.6279354095459, "global_step": 130049, "epoch": 1566} {"train_loss": -23.13503646850586, "global_step": 130050, "epoch": 1566} {"train_loss": -22.638160705566406, "global_step": 130051, "epoch": 1566} {"train_loss": -22.996580123901367, "global_step": 130052, "epoch": 1566} {"train_loss": -22.895973205566406, "global_step": 130053, "epoch": 1566} {"train_loss": -22.58060073852539, "global_step": 130054, "epoch": 1566} {"train_loss": -22.839780807495117, "global_step": 130055, "epoch": 1566} {"train_loss": -22.628122329711914, "global_step": 130056, "epoch": 1566} {"train_loss": -22.6375675201416, "global_step": 130057, "epoch": 1566} {"train_loss": -22.89227294921875, "global_step": 130058, "epoch": 1566} {"train_loss": -22.90268898010254, "global_step": 130059, "epoch": 1566} {"train_loss": -22.76130788872041, "global_step": 130060, "epoch": 1566, "val_loss": 6250787.0} {"train_loss": -21.938650131225586, "global_step": 130061, "epoch": 1567} {"train_loss": -22.70383644104004, "global_step": 130062, "epoch": 1567} {"train_loss": -22.299789428710938, "global_step": 130063, "epoch": 1567} {"train_loss": -22.3636417388916, "global_step": 130064, "epoch": 1567} {"train_loss": -22.506704330444336, "global_step": 130065, "epoch": 1567} {"train_loss": -22.324460983276367, "global_step": 130066, "epoch": 1567} {"train_loss": -22.911874771118164, "global_step": 130067, "epoch": 1567} {"train_loss": -22.739606857299805, "global_step": 130068, "epoch": 1567} {"train_loss": -22.627099990844727, "global_step": 130069, "epoch": 1567} {"train_loss": -22.314838409423828, "global_step": 130070, "epoch": 1567} {"train_loss": -22.513601303100586, "global_step": 130071, "epoch": 1567} {"train_loss": -22.585235595703125, "global_step": 130072, "epoch": 1567} {"train_loss": -22.663480758666992, "global_step": 130073, "epoch": 1567} {"train_loss": -22.759342193603516, "global_step": 130074, "epoch": 1567} {"train_loss": -22.528356552124023, "global_step": 130075, "epoch": 1567} {"train_loss": -22.36334228515625, "global_step": 130076, "epoch": 1567} {"train_loss": -22.78076171875, "global_step": 130077, "epoch": 1567} {"train_loss": -22.63599967956543, "global_step": 130078, "epoch": 1567} {"train_loss": -23.037729263305664, "global_step": 130079, "epoch": 1567} {"train_loss": -22.589590072631836, "global_step": 130080, "epoch": 1567} {"train_loss": -22.64413833618164, "global_step": 130081, "epoch": 1567} {"train_loss": -22.734037399291992, "global_step": 130082, "epoch": 1567} {"train_loss": -22.687326431274414, "global_step": 130083, "epoch": 1567} {"train_loss": -22.95334815979004, "global_step": 130084, "epoch": 1567} {"train_loss": -22.959020614624023, "global_step": 130085, "epoch": 1567} {"train_loss": -22.682348251342773, "global_step": 130086, "epoch": 1567} {"train_loss": -22.66022491455078, "global_step": 130087, "epoch": 1567} {"train_loss": -22.594608306884766, "global_step": 130088, "epoch": 1567} {"train_loss": -22.90675163269043, "global_step": 130089, "epoch": 1567} {"train_loss": -22.390424728393555, "global_step": 130090, "epoch": 1567} {"train_loss": -22.731468200683594, "global_step": 130091, "epoch": 1567} {"train_loss": -22.874469757080078, "global_step": 130092, "epoch": 1567} {"train_loss": -22.580219268798828, "global_step": 130093, "epoch": 1567} {"train_loss": -22.85025978088379, "global_step": 130094, "epoch": 1567} {"train_loss": -22.860729217529297, "global_step": 130095, "epoch": 1567} {"train_loss": -22.331571578979492, "global_step": 130096, "epoch": 1567} {"train_loss": -22.72382164001465, "global_step": 130097, "epoch": 1567} {"train_loss": -22.97262954711914, "global_step": 130098, "epoch": 1567} {"train_loss": -22.799236297607422, "global_step": 130099, "epoch": 1567} {"train_loss": -22.512096405029297, "global_step": 130100, "epoch": 1567} {"train_loss": -22.705442428588867, "global_step": 130101, "epoch": 1567} {"train_loss": -22.857912063598633, "global_step": 130102, "epoch": 1567} {"train_loss": -22.713712692260742, "global_step": 130103, "epoch": 1567} {"train_loss": -22.704345703125, "global_step": 130104, "epoch": 1567} {"train_loss": -22.898468017578125, "global_step": 130105, "epoch": 1567} {"train_loss": -22.43094825744629, "global_step": 130106, "epoch": 1567} {"train_loss": -22.595752716064453, "global_step": 130107, "epoch": 1567} {"train_loss": -22.379179000854492, "global_step": 130108, "epoch": 1567} {"train_loss": -22.624902725219727, "global_step": 130109, "epoch": 1567} {"train_loss": -22.584672927856445, "global_step": 130110, "epoch": 1567} {"train_loss": -22.90918731689453, "global_step": 130111, "epoch": 1567} {"train_loss": -23.000394821166992, "global_step": 130112, "epoch": 1567} {"train_loss": -22.77496910095215, "global_step": 130113, "epoch": 1567} {"train_loss": -22.88589859008789, "global_step": 130114, "epoch": 1567} {"train_loss": -22.98380470275879, "global_step": 130115, "epoch": 1567} {"train_loss": -22.7185001373291, "global_step": 130116, "epoch": 1567} {"train_loss": -22.892255783081055, "global_step": 130117, "epoch": 1567} {"train_loss": -22.626920700073242, "global_step": 130118, "epoch": 1567} {"train_loss": -22.87522315979004, "global_step": 130119, "epoch": 1567} {"train_loss": -22.88106346130371, "global_step": 130120, "epoch": 1567} {"train_loss": -22.956714630126953, "global_step": 130121, "epoch": 1567} {"train_loss": -22.92812156677246, "global_step": 130122, "epoch": 1567} {"train_loss": -22.650297164916992, "global_step": 130123, "epoch": 1567} {"train_loss": -22.90142822265625, "global_step": 130124, "epoch": 1567} {"train_loss": -22.853700637817383, "global_step": 130125, "epoch": 1567} {"train_loss": -22.81578254699707, "global_step": 130126, "epoch": 1567} {"train_loss": -22.963275909423828, "global_step": 130127, "epoch": 1567} {"train_loss": -22.82411766052246, "global_step": 130128, "epoch": 1567} {"train_loss": -22.829008102416992, "global_step": 130129, "epoch": 1567} {"train_loss": -22.855093002319336, "global_step": 130130, "epoch": 1567} {"train_loss": -22.781742095947266, "global_step": 130131, "epoch": 1567} {"train_loss": -22.755069732666016, "global_step": 130132, "epoch": 1567} {"train_loss": -23.161497116088867, "global_step": 130133, "epoch": 1567} {"train_loss": -22.931699752807617, "global_step": 130134, "epoch": 1567} {"train_loss": -22.826833724975586, "global_step": 130135, "epoch": 1567} {"train_loss": -22.645143508911133, "global_step": 130136, "epoch": 1567} {"train_loss": -23.084447860717773, "global_step": 130137, "epoch": 1567} {"train_loss": -22.787235260009766, "global_step": 130138, "epoch": 1567} {"train_loss": -22.403608322143555, "global_step": 130139, "epoch": 1567} {"train_loss": -22.628849029541016, "global_step": 130140, "epoch": 1567} {"train_loss": -22.592134475708008, "global_step": 130141, "epoch": 1567} {"train_loss": -22.975921630859375, "global_step": 130142, "epoch": 1567} {"train_loss": -22.721790198820184, "global_step": 130143, "epoch": 1567, "val_loss": 6151810.0} {"train_loss": -21.815420150756836, "global_step": 130144, "epoch": 1568} {"train_loss": -21.71938133239746, "global_step": 130145, "epoch": 1568} {"train_loss": -21.701757431030273, "global_step": 130146, "epoch": 1568} {"train_loss": -21.458829879760742, "global_step": 130147, "epoch": 1568} {"train_loss": -21.41091537475586, "global_step": 130148, "epoch": 1568} {"train_loss": -21.180599212646484, "global_step": 130149, "epoch": 1568} {"train_loss": -22.018455505371094, "global_step": 130150, "epoch": 1568} {"train_loss": -21.495019912719727, "global_step": 130151, "epoch": 1568} {"train_loss": -21.73305892944336, "global_step": 130152, "epoch": 1568} {"train_loss": -21.93597984313965, "global_step": 130153, "epoch": 1568} {"train_loss": -22.133163452148438, "global_step": 130154, "epoch": 1568} {"train_loss": -21.781713485717773, "global_step": 130155, "epoch": 1568} {"train_loss": -22.00774574279785, "global_step": 130156, "epoch": 1568} {"train_loss": -22.042362213134766, "global_step": 130157, "epoch": 1568} {"train_loss": -22.144901275634766, "global_step": 130158, "epoch": 1568} {"train_loss": -22.05697250366211, "global_step": 130159, "epoch": 1568} {"train_loss": -22.058115005493164, "global_step": 130160, "epoch": 1568} {"train_loss": -21.979719161987305, "global_step": 130161, "epoch": 1568} {"train_loss": -22.26534080505371, "global_step": 130162, "epoch": 1568} {"train_loss": -22.342161178588867, "global_step": 130163, "epoch": 1568} {"train_loss": -22.50235366821289, "global_step": 130164, "epoch": 1568} {"train_loss": -22.173276901245117, "global_step": 130165, "epoch": 1568} {"train_loss": -22.497228622436523, "global_step": 130166, "epoch": 1568} {"train_loss": -22.81398582458496, "global_step": 130167, "epoch": 1568} {"train_loss": -22.17331314086914, "global_step": 130168, "epoch": 1568} {"train_loss": -22.562726974487305, "global_step": 130169, "epoch": 1568} {"train_loss": -22.424484252929688, "global_step": 130170, "epoch": 1568} {"train_loss": -22.409805297851562, "global_step": 130171, "epoch": 1568} {"train_loss": -22.748197555541992, "global_step": 130172, "epoch": 1568} {"train_loss": -22.835416793823242, "global_step": 130173, "epoch": 1568} {"train_loss": -22.500085830688477, "global_step": 130174, "epoch": 1568} {"train_loss": -22.510988235473633, "global_step": 130175, "epoch": 1568} {"train_loss": -22.499067306518555, "global_step": 130176, "epoch": 1568} {"train_loss": -22.930898666381836, "global_step": 130177, "epoch": 1568} {"train_loss": -23.091161727905273, "global_step": 130178, "epoch": 1568} {"train_loss": -22.980350494384766, "global_step": 130179, "epoch": 1568} {"train_loss": -22.80653953552246, "global_step": 130180, "epoch": 1568} {"train_loss": -22.64015007019043, "global_step": 130181, "epoch": 1568} {"train_loss": -22.698427200317383, "global_step": 130182, "epoch": 1568} {"train_loss": -22.245731353759766, "global_step": 130183, "epoch": 1568} {"train_loss": -22.59341049194336, "global_step": 130184, "epoch": 1568} {"train_loss": -23.054672241210938, "global_step": 130185, "epoch": 1568} {"train_loss": -23.235279083251953, "global_step": 130186, "epoch": 1568} {"train_loss": -23.19635581970215, "global_step": 130187, "epoch": 1568} {"train_loss": -23.0087890625, "global_step": 130188, "epoch": 1568} {"train_loss": -22.49043846130371, "global_step": 130189, "epoch": 1568} {"train_loss": -23.017606735229492, "global_step": 130190, "epoch": 1568} {"train_loss": -22.86163902282715, "global_step": 130191, "epoch": 1568} {"train_loss": -22.923696517944336, "global_step": 130192, "epoch": 1568} {"train_loss": -22.8375186920166, "global_step": 130193, "epoch": 1568} {"train_loss": -23.0194091796875, "global_step": 130194, "epoch": 1568} {"train_loss": -23.35279083251953, "global_step": 130195, "epoch": 1568} {"train_loss": -23.0700626373291, "global_step": 130196, "epoch": 1568} {"train_loss": -22.958385467529297, "global_step": 130197, "epoch": 1568} {"train_loss": -22.646127700805664, "global_step": 130198, "epoch": 1568} {"train_loss": -23.040340423583984, "global_step": 130199, "epoch": 1568} {"train_loss": -22.957929611206055, "global_step": 130200, "epoch": 1568} {"train_loss": -23.069326400756836, "global_step": 130201, "epoch": 1568} {"train_loss": -23.045333862304688, "global_step": 130202, "epoch": 1568} {"train_loss": -22.92624282836914, "global_step": 130203, "epoch": 1568} {"train_loss": -22.930662155151367, "global_step": 130204, "epoch": 1568} {"train_loss": -22.596357345581055, "global_step": 130205, "epoch": 1568} {"train_loss": -23.165773391723633, "global_step": 130206, "epoch": 1568} {"train_loss": -22.792495727539062, "global_step": 130207, "epoch": 1568} {"train_loss": -23.003311157226562, "global_step": 130208, "epoch": 1568} {"train_loss": -22.537593841552734, "global_step": 130209, "epoch": 1568} {"train_loss": -22.652021408081055, "global_step": 130210, "epoch": 1568} {"train_loss": -22.812936782836914, "global_step": 130211, "epoch": 1568} {"train_loss": -22.6745548248291, "global_step": 130212, "epoch": 1568} {"train_loss": -22.87504005432129, "global_step": 130213, "epoch": 1568} {"train_loss": -22.346220016479492, "global_step": 130214, "epoch": 1568} {"train_loss": -22.636194229125977, "global_step": 130215, "epoch": 1568} {"train_loss": -22.68993377685547, "global_step": 130216, "epoch": 1568} {"train_loss": -22.62636375427246, "global_step": 130217, "epoch": 1568} {"train_loss": -22.83653450012207, "global_step": 130218, "epoch": 1568} {"train_loss": -22.43596839904785, "global_step": 130219, "epoch": 1568} {"train_loss": -22.854658126831055, "global_step": 130220, "epoch": 1568} {"train_loss": -22.642271041870117, "global_step": 130221, "epoch": 1568} {"train_loss": -22.726974487304688, "global_step": 130222, "epoch": 1568} {"train_loss": -22.843446731567383, "global_step": 130223, "epoch": 1568} {"train_loss": -22.5579776763916, "global_step": 130224, "epoch": 1568} {"train_loss": -22.992795944213867, "global_step": 130225, "epoch": 1568} {"train_loss": -22.550352785960737, "global_step": 130226, "epoch": 1568, "val_loss": 6269721.0} {"train_loss": -22.433551788330078, "global_step": 130227, "epoch": 1569} {"train_loss": -22.573184967041016, "global_step": 130228, "epoch": 1569} {"train_loss": -22.553503036499023, "global_step": 130229, "epoch": 1569} {"train_loss": -22.5518741607666, "global_step": 130230, "epoch": 1569} {"train_loss": -22.80678367614746, "global_step": 130231, "epoch": 1569} {"train_loss": -22.544878005981445, "global_step": 130232, "epoch": 1569} {"train_loss": -22.727888107299805, "global_step": 130233, "epoch": 1569} {"train_loss": -21.865785598754883, "global_step": 130234, "epoch": 1569} {"train_loss": -22.732635498046875, "global_step": 130235, "epoch": 1569} {"train_loss": -22.175830841064453, "global_step": 130236, "epoch": 1569} {"train_loss": -22.871248245239258, "global_step": 130237, "epoch": 1569} {"train_loss": -22.8252010345459, "global_step": 130238, "epoch": 1569} {"train_loss": -22.451587677001953, "global_step": 130239, "epoch": 1569} {"train_loss": -22.188631057739258, "global_step": 130240, "epoch": 1569} {"train_loss": -22.795896530151367, "global_step": 130241, "epoch": 1569} {"train_loss": -22.43604850769043, "global_step": 130242, "epoch": 1569} {"train_loss": -22.403507232666016, "global_step": 130243, "epoch": 1569} {"train_loss": -22.07318878173828, "global_step": 130244, "epoch": 1569} {"train_loss": -22.642301559448242, "global_step": 130245, "epoch": 1569} {"train_loss": -22.556474685668945, "global_step": 130246, "epoch": 1569} {"train_loss": -22.809423446655273, "global_step": 130247, "epoch": 1569} {"train_loss": -22.822111129760742, "global_step": 130248, "epoch": 1569} {"train_loss": -22.490234375, "global_step": 130249, "epoch": 1569} {"train_loss": -22.41710662841797, "global_step": 130250, "epoch": 1569} {"train_loss": -22.32997703552246, "global_step": 130251, "epoch": 1569} {"train_loss": -22.723447799682617, "global_step": 130252, "epoch": 1569} {"train_loss": -22.460119247436523, "global_step": 130253, "epoch": 1569} {"train_loss": -22.961044311523438, "global_step": 130254, "epoch": 1569} {"train_loss": -22.5439510345459, "global_step": 130255, "epoch": 1569} {"train_loss": -22.73555564880371, "global_step": 130256, "epoch": 1569} {"train_loss": -22.403310775756836, "global_step": 130257, "epoch": 1569} {"train_loss": -22.629173278808594, "global_step": 130258, "epoch": 1569} {"train_loss": -22.59499168395996, "global_step": 130259, "epoch": 1569} {"train_loss": -22.674036026000977, "global_step": 130260, "epoch": 1569} {"train_loss": -22.977005004882812, "global_step": 130261, "epoch": 1569} {"train_loss": -22.80985450744629, "global_step": 130262, "epoch": 1569} {"train_loss": -22.648000717163086, "global_step": 130263, "epoch": 1569} {"train_loss": -22.683134078979492, "global_step": 130264, "epoch": 1569} {"train_loss": -22.381078720092773, "global_step": 130265, "epoch": 1569} {"train_loss": -23.24456214904785, "global_step": 130266, "epoch": 1569} {"train_loss": -22.98915672302246, "global_step": 130267, "epoch": 1569} {"train_loss": -22.32847023010254, "global_step": 130268, "epoch": 1569} {"train_loss": -22.60622215270996, "global_step": 130269, "epoch": 1569} {"train_loss": -22.7368221282959, "global_step": 130270, "epoch": 1569} {"train_loss": -22.809850692749023, "global_step": 130271, "epoch": 1569} {"train_loss": -22.661237716674805, "global_step": 130272, "epoch": 1569} {"train_loss": -22.965530395507812, "global_step": 130273, "epoch": 1569} {"train_loss": -22.787900924682617, "global_step": 130274, "epoch": 1569} {"train_loss": -22.498971939086914, "global_step": 130275, "epoch": 1569} {"train_loss": -22.849201202392578, "global_step": 130276, "epoch": 1569} {"train_loss": -23.144481658935547, "global_step": 130277, "epoch": 1569} {"train_loss": -22.67725944519043, "global_step": 130278, "epoch": 1569} {"train_loss": -22.843463897705078, "global_step": 130279, "epoch": 1569} {"train_loss": -22.766311645507812, "global_step": 130280, "epoch": 1569} {"train_loss": -22.780752182006836, "global_step": 130281, "epoch": 1569} {"train_loss": -22.742290496826172, "global_step": 130282, "epoch": 1569} {"train_loss": -23.034862518310547, "global_step": 130283, "epoch": 1569} {"train_loss": -23.37969970703125, "global_step": 130284, "epoch": 1569} {"train_loss": -22.690412521362305, "global_step": 130285, "epoch": 1569} {"train_loss": -22.634525299072266, "global_step": 130286, "epoch": 1569} {"train_loss": -22.779943466186523, "global_step": 130287, "epoch": 1569} {"train_loss": -22.56427574157715, "global_step": 130288, "epoch": 1569} {"train_loss": -22.874544143676758, "global_step": 130289, "epoch": 1569} {"train_loss": -22.766809463500977, "global_step": 130290, "epoch": 1569} {"train_loss": -22.593969345092773, "global_step": 130291, "epoch": 1569} {"train_loss": -23.223630905151367, "global_step": 130292, "epoch": 1569} {"train_loss": -23.009714126586914, "global_step": 130293, "epoch": 1569} {"train_loss": -22.82276725769043, "global_step": 130294, "epoch": 1569} {"train_loss": -22.694013595581055, "global_step": 130295, "epoch": 1569} {"train_loss": -22.507699966430664, "global_step": 130296, "epoch": 1569} {"train_loss": -22.728193283081055, "global_step": 130297, "epoch": 1569} {"train_loss": -22.567319869995117, "global_step": 130298, "epoch": 1569} {"train_loss": -22.796920776367188, "global_step": 130299, "epoch": 1569} {"train_loss": -22.7623233795166, "global_step": 130300, "epoch": 1569} {"train_loss": -23.02832794189453, "global_step": 130301, "epoch": 1569} {"train_loss": -22.858505249023438, "global_step": 130302, "epoch": 1569} {"train_loss": -22.684019088745117, "global_step": 130303, "epoch": 1569} {"train_loss": -22.4477596282959, "global_step": 130304, "epoch": 1569} {"train_loss": -22.85675621032715, "global_step": 130305, "epoch": 1569} {"train_loss": -22.893247604370117, "global_step": 130306, "epoch": 1569} {"train_loss": -23.00232696533203, "global_step": 130307, "epoch": 1569} {"train_loss": -22.33506965637207, "global_step": 130308, "epoch": 1569} {"train_loss": -22.703666388270367, "global_step": 130309, "epoch": 1569, "val_loss": 6395342.0} {"train_loss": -21.82307243347168, "global_step": 130310, "epoch": 1570} {"train_loss": -22.648426055908203, "global_step": 130311, "epoch": 1570} {"train_loss": -21.62651252746582, "global_step": 130312, "epoch": 1570} {"train_loss": -22.264041900634766, "global_step": 130313, "epoch": 1570} {"train_loss": -22.20083999633789, "global_step": 130314, "epoch": 1570} {"train_loss": -22.393922805786133, "global_step": 130315, "epoch": 1570} {"train_loss": -21.978652954101562, "global_step": 130316, "epoch": 1570} {"train_loss": -22.178388595581055, "global_step": 130317, "epoch": 1570} {"train_loss": -22.77998161315918, "global_step": 130318, "epoch": 1570} {"train_loss": -22.221033096313477, "global_step": 130319, "epoch": 1570} {"train_loss": -22.38413429260254, "global_step": 130320, "epoch": 1570} {"train_loss": -22.401456832885742, "global_step": 130321, "epoch": 1570} {"train_loss": -22.424854278564453, "global_step": 130322, "epoch": 1570} {"train_loss": -22.22063446044922, "global_step": 130323, "epoch": 1570} {"train_loss": -22.788549423217773, "global_step": 130324, "epoch": 1570} {"train_loss": -22.981830596923828, "global_step": 130325, "epoch": 1570} {"train_loss": -22.71024513244629, "global_step": 130326, "epoch": 1570} {"train_loss": -22.5200138092041, "global_step": 130327, "epoch": 1570} {"train_loss": -22.597440719604492, "global_step": 130328, "epoch": 1570} {"train_loss": -22.438119888305664, "global_step": 130329, "epoch": 1570} {"train_loss": -22.828271865844727, "global_step": 130330, "epoch": 1570} {"train_loss": -22.648876190185547, "global_step": 130331, "epoch": 1570} {"train_loss": -22.537418365478516, "global_step": 130332, "epoch": 1570} {"train_loss": -22.669403076171875, "global_step": 130333, "epoch": 1570} {"train_loss": -22.890445709228516, "global_step": 130334, "epoch": 1570} {"train_loss": -22.852493286132812, "global_step": 130335, "epoch": 1570} {"train_loss": -22.67713165283203, "global_step": 130336, "epoch": 1570} {"train_loss": -22.732332229614258, "global_step": 130337, "epoch": 1570} {"train_loss": -23.017942428588867, "global_step": 130338, "epoch": 1570} {"train_loss": -22.51081657409668, "global_step": 130339, "epoch": 1570} {"train_loss": -22.4312686920166, "global_step": 130340, "epoch": 1570} {"train_loss": -22.980375289916992, "global_step": 130341, "epoch": 1570} {"train_loss": -23.44307518005371, "global_step": 130342, "epoch": 1570} {"train_loss": -22.89063835144043, "global_step": 130343, "epoch": 1570} {"train_loss": -22.822158813476562, "global_step": 130344, "epoch": 1570} {"train_loss": -22.6113224029541, "global_step": 130345, "epoch": 1570} {"train_loss": -23.081296920776367, "global_step": 130346, "epoch": 1570} {"train_loss": -22.941513061523438, "global_step": 130347, "epoch": 1570} {"train_loss": -23.10799217224121, "global_step": 130348, "epoch": 1570} {"train_loss": -22.813581466674805, "global_step": 130349, "epoch": 1570} {"train_loss": -22.918014526367188, "global_step": 130350, "epoch": 1570} {"train_loss": -23.13278579711914, "global_step": 130351, "epoch": 1570} {"train_loss": -22.51396369934082, "global_step": 130352, "epoch": 1570} {"train_loss": -23.23915672302246, "global_step": 130353, "epoch": 1570} {"train_loss": -23.052209854125977, "global_step": 130354, "epoch": 1570} {"train_loss": -22.596607208251953, "global_step": 130355, "epoch": 1570} {"train_loss": -22.507802963256836, "global_step": 130356, "epoch": 1570} {"train_loss": -22.97090721130371, "global_step": 130357, "epoch": 1570} {"train_loss": -22.823352813720703, "global_step": 130358, "epoch": 1570} {"train_loss": -22.372058868408203, "global_step": 130359, "epoch": 1570} {"train_loss": -23.097917556762695, "global_step": 130360, "epoch": 1570} {"train_loss": -22.847145080566406, "global_step": 130361, "epoch": 1570} {"train_loss": -22.58987808227539, "global_step": 130362, "epoch": 1570} {"train_loss": -22.893117904663086, "global_step": 130363, "epoch": 1570} {"train_loss": -22.82459259033203, "global_step": 130364, "epoch": 1570} {"train_loss": -22.67449188232422, "global_step": 130365, "epoch": 1570} {"train_loss": -22.297868728637695, "global_step": 130366, "epoch": 1570} {"train_loss": -22.897775650024414, "global_step": 130367, "epoch": 1570} {"train_loss": -22.473432540893555, "global_step": 130368, "epoch": 1570} {"train_loss": -22.504667282104492, "global_step": 130369, "epoch": 1570} {"train_loss": -22.52960968017578, "global_step": 130370, "epoch": 1570} {"train_loss": -23.066984176635742, "global_step": 130371, "epoch": 1570} {"train_loss": -22.563098907470703, "global_step": 130372, "epoch": 1570} {"train_loss": -22.9434814453125, "global_step": 130373, "epoch": 1570} {"train_loss": -22.540250778198242, "global_step": 130374, "epoch": 1570} {"train_loss": -22.921865463256836, "global_step": 130375, "epoch": 1570} {"train_loss": -22.62066078186035, "global_step": 130376, "epoch": 1570} {"train_loss": -22.62540054321289, "global_step": 130377, "epoch": 1570} {"train_loss": -22.761825561523438, "global_step": 130378, "epoch": 1570} {"train_loss": -22.775846481323242, "global_step": 130379, "epoch": 1570} {"train_loss": -22.739933013916016, "global_step": 130380, "epoch": 1570} {"train_loss": -22.898595809936523, "global_step": 130381, "epoch": 1570} {"train_loss": -23.01065444946289, "global_step": 130382, "epoch": 1570} {"train_loss": -22.768526077270508, "global_step": 130383, "epoch": 1570} {"train_loss": -22.785236358642578, "global_step": 130384, "epoch": 1570} {"train_loss": -23.039045333862305, "global_step": 130385, "epoch": 1570} {"train_loss": -23.107934951782227, "global_step": 130386, "epoch": 1570} {"train_loss": -22.506834030151367, "global_step": 130387, "epoch": 1570} {"train_loss": -22.622215270996094, "global_step": 130388, "epoch": 1570} {"train_loss": -22.87318992614746, "global_step": 130389, "epoch": 1570} {"train_loss": -22.751174926757812, "global_step": 130390, "epoch": 1570} {"train_loss": -22.723773956298828, "global_step": 130391, "epoch": 1570} {"train_loss": -22.674595660473926, "global_step": 130392, "epoch": 1570, "val_loss": 6153496.0} {"train_loss": -21.36473274230957, "global_step": 130393, "epoch": 1571} {"train_loss": -22.2398738861084, "global_step": 130394, "epoch": 1571} {"train_loss": -21.43000602722168, "global_step": 130395, "epoch": 1571} {"train_loss": -22.63093376159668, "global_step": 130396, "epoch": 1571} {"train_loss": -21.85792350769043, "global_step": 130397, "epoch": 1571} {"train_loss": -22.2818546295166, "global_step": 130398, "epoch": 1571} {"train_loss": -21.751306533813477, "global_step": 130399, "epoch": 1571} {"train_loss": -22.435087203979492, "global_step": 130400, "epoch": 1571} {"train_loss": -22.508237838745117, "global_step": 130401, "epoch": 1571} {"train_loss": -22.055450439453125, "global_step": 130402, "epoch": 1571} {"train_loss": -22.667631149291992, "global_step": 130403, "epoch": 1571} {"train_loss": -22.038434982299805, "global_step": 130404, "epoch": 1571} {"train_loss": -22.38178062438965, "global_step": 130405, "epoch": 1571} {"train_loss": -22.75579071044922, "global_step": 130406, "epoch": 1571} {"train_loss": -22.287012100219727, "global_step": 130407, "epoch": 1571} {"train_loss": -22.50081443786621, "global_step": 130408, "epoch": 1571} {"train_loss": -22.488388061523438, "global_step": 130409, "epoch": 1571} {"train_loss": -22.623828887939453, "global_step": 130410, "epoch": 1571} {"train_loss": -22.841064453125, "global_step": 130411, "epoch": 1571} {"train_loss": -22.350542068481445, "global_step": 130412, "epoch": 1571} {"train_loss": -22.578235626220703, "global_step": 130413, "epoch": 1571} {"train_loss": -22.38466453552246, "global_step": 130414, "epoch": 1571} {"train_loss": -22.68550682067871, "global_step": 130415, "epoch": 1571} {"train_loss": -22.507892608642578, "global_step": 130416, "epoch": 1571} {"train_loss": -22.657663345336914, "global_step": 130417, "epoch": 1571} {"train_loss": -22.636831283569336, "global_step": 130418, "epoch": 1571} {"train_loss": -22.84628677368164, "global_step": 130419, "epoch": 1571} {"train_loss": -22.805072784423828, "global_step": 130420, "epoch": 1571} {"train_loss": -22.411609649658203, "global_step": 130421, "epoch": 1571} {"train_loss": -23.02231216430664, "global_step": 130422, "epoch": 1571} {"train_loss": -22.945892333984375, "global_step": 130423, "epoch": 1571} {"train_loss": -22.636245727539062, "global_step": 130424, "epoch": 1571} {"train_loss": -22.858455657958984, "global_step": 130425, "epoch": 1571} {"train_loss": -22.680007934570312, "global_step": 130426, "epoch": 1571} {"train_loss": -22.657705307006836, "global_step": 130427, "epoch": 1571} {"train_loss": -23.001840591430664, "global_step": 130428, "epoch": 1571} {"train_loss": -23.040258407592773, "global_step": 130429, "epoch": 1571} {"train_loss": -22.659215927124023, "global_step": 130430, "epoch": 1571} {"train_loss": -22.596506118774414, "global_step": 130431, "epoch": 1571} {"train_loss": -22.732938766479492, "global_step": 130432, "epoch": 1571} {"train_loss": -22.583110809326172, "global_step": 130433, "epoch": 1571} {"train_loss": -23.049837112426758, "global_step": 130434, "epoch": 1571} {"train_loss": -22.85230827331543, "global_step": 130435, "epoch": 1571} {"train_loss": -22.77617835998535, "global_step": 130436, "epoch": 1571} {"train_loss": -22.81441307067871, "global_step": 130437, "epoch": 1571} {"train_loss": -22.65707015991211, "global_step": 130438, "epoch": 1571} {"train_loss": -22.92250633239746, "global_step": 130439, "epoch": 1571} {"train_loss": -22.795873641967773, "global_step": 130440, "epoch": 1571} {"train_loss": -22.97849464416504, "global_step": 130441, "epoch": 1571} {"train_loss": -22.928598403930664, "global_step": 130442, "epoch": 1571} {"train_loss": -22.6646728515625, "global_step": 130443, "epoch": 1571} {"train_loss": -22.845809936523438, "global_step": 130444, "epoch": 1571} {"train_loss": -22.892988204956055, "global_step": 130445, "epoch": 1571} {"train_loss": -22.773237228393555, "global_step": 130446, "epoch": 1571} {"train_loss": -22.70734214782715, "global_step": 130447, "epoch": 1571} {"train_loss": -23.189401626586914, "global_step": 130448, "epoch": 1571} {"train_loss": -22.792661666870117, "global_step": 130449, "epoch": 1571} {"train_loss": -22.837081909179688, "global_step": 130450, "epoch": 1571} {"train_loss": -23.202390670776367, "global_step": 130451, "epoch": 1571} {"train_loss": -22.951812744140625, "global_step": 130452, "epoch": 1571} {"train_loss": -23.120044708251953, "global_step": 130453, "epoch": 1571} {"train_loss": -22.727127075195312, "global_step": 130454, "epoch": 1571} {"train_loss": -22.733797073364258, "global_step": 130455, "epoch": 1571} {"train_loss": -22.56276512145996, "global_step": 130456, "epoch": 1571} {"train_loss": -22.72003746032715, "global_step": 130457, "epoch": 1571} {"train_loss": -23.06089210510254, "global_step": 130458, "epoch": 1571} {"train_loss": -22.734189987182617, "global_step": 130459, "epoch": 1571} {"train_loss": -22.66640281677246, "global_step": 130460, "epoch": 1571} {"train_loss": -22.929182052612305, "global_step": 130461, "epoch": 1571} {"train_loss": -22.736724853515625, "global_step": 130462, "epoch": 1571} {"train_loss": -22.867952346801758, "global_step": 130463, "epoch": 1571} {"train_loss": -22.84974479675293, "global_step": 130464, "epoch": 1571} {"train_loss": -23.078392028808594, "global_step": 130465, "epoch": 1571} {"train_loss": -22.91570472717285, "global_step": 130466, "epoch": 1571} {"train_loss": -22.536043167114258, "global_step": 130467, "epoch": 1571} {"train_loss": -22.798925399780273, "global_step": 130468, "epoch": 1571} {"train_loss": -22.824338912963867, "global_step": 130469, "epoch": 1571} {"train_loss": -23.057086944580078, "global_step": 130470, "epoch": 1571} {"train_loss": -22.57444190979004, "global_step": 130471, "epoch": 1571} {"train_loss": -22.752683639526367, "global_step": 130472, "epoch": 1571} {"train_loss": -22.932409286499023, "global_step": 130473, "epoch": 1571} {"train_loss": -22.503881454467773, "global_step": 130474, "epoch": 1571} {"train_loss": -22.670311893325255, "global_step": 130475, "epoch": 1571, "val_loss": 6423751.0} {"train_loss": -22.610082626342773, "global_step": 130476, "epoch": 1572} {"train_loss": -22.569889068603516, "global_step": 130477, "epoch": 1572} {"train_loss": -22.581279754638672, "global_step": 130478, "epoch": 1572} {"train_loss": -22.646568298339844, "global_step": 130479, "epoch": 1572} {"train_loss": -22.396631240844727, "global_step": 130480, "epoch": 1572} {"train_loss": -22.547101974487305, "global_step": 130481, "epoch": 1572} {"train_loss": -22.597919464111328, "global_step": 130482, "epoch": 1572} {"train_loss": -22.736249923706055, "global_step": 130483, "epoch": 1572} {"train_loss": -22.573965072631836, "global_step": 130484, "epoch": 1572} {"train_loss": -22.653167724609375, "global_step": 130485, "epoch": 1572} {"train_loss": -22.475696563720703, "global_step": 130486, "epoch": 1572} {"train_loss": -23.048595428466797, "global_step": 130487, "epoch": 1572} {"train_loss": -22.71577262878418, "global_step": 130488, "epoch": 1572} {"train_loss": -22.440839767456055, "global_step": 130489, "epoch": 1572} {"train_loss": -22.814733505249023, "global_step": 130490, "epoch": 1572} {"train_loss": -23.052701950073242, "global_step": 130491, "epoch": 1572} {"train_loss": -22.886459350585938, "global_step": 130492, "epoch": 1572} {"train_loss": -22.873472213745117, "global_step": 130493, "epoch": 1572} {"train_loss": -22.988248825073242, "global_step": 130494, "epoch": 1572} {"train_loss": -22.693435668945312, "global_step": 130495, "epoch": 1572} {"train_loss": -22.848834991455078, "global_step": 130496, "epoch": 1572} {"train_loss": -22.870519638061523, "global_step": 130497, "epoch": 1572} {"train_loss": -22.620519638061523, "global_step": 130498, "epoch": 1572} {"train_loss": -22.68324851989746, "global_step": 130499, "epoch": 1572} {"train_loss": -22.962430953979492, "global_step": 130500, "epoch": 1572} {"train_loss": -22.706783294677734, "global_step": 130501, "epoch": 1572} {"train_loss": -22.691001892089844, "global_step": 130502, "epoch": 1572} {"train_loss": -22.995065689086914, "global_step": 130503, "epoch": 1572} {"train_loss": -22.686643600463867, "global_step": 130504, "epoch": 1572} {"train_loss": -23.050437927246094, "global_step": 130505, "epoch": 1572} {"train_loss": -22.915143966674805, "global_step": 130506, "epoch": 1572} {"train_loss": -23.066776275634766, "global_step": 130507, "epoch": 1572} {"train_loss": -22.777647018432617, "global_step": 130508, "epoch": 1572} {"train_loss": -22.86859130859375, "global_step": 130509, "epoch": 1572} {"train_loss": -22.92171287536621, "global_step": 130510, "epoch": 1572} {"train_loss": -23.384510040283203, "global_step": 130511, "epoch": 1572} {"train_loss": -22.949310302734375, "global_step": 130512, "epoch": 1572} {"train_loss": -22.789941787719727, "global_step": 130513, "epoch": 1572} {"train_loss": -22.752286911010742, "global_step": 130514, "epoch": 1572} {"train_loss": -22.9088134765625, "global_step": 130515, "epoch": 1572} {"train_loss": -22.874923706054688, "global_step": 130516, "epoch": 1572} {"train_loss": -23.18522834777832, "global_step": 130517, "epoch": 1572} {"train_loss": -22.965167999267578, "global_step": 130518, "epoch": 1572} {"train_loss": -22.779212951660156, "global_step": 130519, "epoch": 1572} {"train_loss": -22.845117568969727, "global_step": 130520, "epoch": 1572} {"train_loss": -22.910015106201172, "global_step": 130521, "epoch": 1572} {"train_loss": -23.021482467651367, "global_step": 130522, "epoch": 1572} {"train_loss": -22.82050323486328, "global_step": 130523, "epoch": 1572} {"train_loss": -22.8700008392334, "global_step": 130524, "epoch": 1572} {"train_loss": -22.910749435424805, "global_step": 130525, "epoch": 1572} {"train_loss": -23.116851806640625, "global_step": 130526, "epoch": 1572} {"train_loss": -23.007688522338867, "global_step": 130527, "epoch": 1572} {"train_loss": -22.735523223876953, "global_step": 130528, "epoch": 1572} {"train_loss": -22.684127807617188, "global_step": 130529, "epoch": 1572} {"train_loss": -22.6466064453125, "global_step": 130530, "epoch": 1572} {"train_loss": -22.745620727539062, "global_step": 130531, "epoch": 1572} {"train_loss": -22.649763107299805, "global_step": 130532, "epoch": 1572} {"train_loss": -22.870426177978516, "global_step": 130533, "epoch": 1572} {"train_loss": -23.10025405883789, "global_step": 130534, "epoch": 1572} {"train_loss": -22.57354164123535, "global_step": 130535, "epoch": 1572} {"train_loss": -22.737424850463867, "global_step": 130536, "epoch": 1572} {"train_loss": -22.723581314086914, "global_step": 130537, "epoch": 1572} {"train_loss": -22.909761428833008, "global_step": 130538, "epoch": 1572} {"train_loss": -23.03902244567871, "global_step": 130539, "epoch": 1572} {"train_loss": -22.81477928161621, "global_step": 130540, "epoch": 1572} {"train_loss": -22.840431213378906, "global_step": 130541, "epoch": 1572} {"train_loss": -23.237810134887695, "global_step": 130542, "epoch": 1572} {"train_loss": -22.567855834960938, "global_step": 130543, "epoch": 1572} {"train_loss": -23.00217628479004, "global_step": 130544, "epoch": 1572} {"train_loss": -22.99855613708496, "global_step": 130545, "epoch": 1572} {"train_loss": -22.858932495117188, "global_step": 130546, "epoch": 1572} {"train_loss": -22.70903205871582, "global_step": 130547, "epoch": 1572} {"train_loss": -22.87594985961914, "global_step": 130548, "epoch": 1572} {"train_loss": -23.36897850036621, "global_step": 130549, "epoch": 1572} {"train_loss": -22.729572296142578, "global_step": 130550, "epoch": 1572} {"train_loss": -22.78656005859375, "global_step": 130551, "epoch": 1572} {"train_loss": -22.84191131591797, "global_step": 130552, "epoch": 1572} {"train_loss": -22.45615577697754, "global_step": 130553, "epoch": 1572} {"train_loss": -22.875478744506836, "global_step": 130554, "epoch": 1572} {"train_loss": -22.656543731689453, "global_step": 130555, "epoch": 1572} {"train_loss": -22.443532943725586, "global_step": 130556, "epoch": 1572} {"train_loss": -22.796112060546875, "global_step": 130557, "epoch": 1572} {"train_loss": -22.840642584375587, "global_step": 130558, "epoch": 1572, "val_loss": 6229226.0} {"train_loss": -21.43513298034668, "global_step": 130559, "epoch": 1573} {"train_loss": -21.85833740234375, "global_step": 130560, "epoch": 1573} {"train_loss": -22.446975708007812, "global_step": 130561, "epoch": 1573} {"train_loss": -22.187850952148438, "global_step": 130562, "epoch": 1573} {"train_loss": -21.89533233642578, "global_step": 130563, "epoch": 1573} {"train_loss": -22.698184967041016, "global_step": 130564, "epoch": 1573} {"train_loss": -22.105005264282227, "global_step": 130565, "epoch": 1573} {"train_loss": -22.80238914489746, "global_step": 130566, "epoch": 1573} {"train_loss": -21.93086814880371, "global_step": 130567, "epoch": 1573} {"train_loss": -22.405698776245117, "global_step": 130568, "epoch": 1573} {"train_loss": -22.319873809814453, "global_step": 130569, "epoch": 1573} {"train_loss": -22.389684677124023, "global_step": 130570, "epoch": 1573} {"train_loss": -22.40436553955078, "global_step": 130571, "epoch": 1573} {"train_loss": -22.404117584228516, "global_step": 130572, "epoch": 1573} {"train_loss": -22.51413917541504, "global_step": 130573, "epoch": 1573} {"train_loss": -22.857833862304688, "global_step": 130574, "epoch": 1573} {"train_loss": -22.595090866088867, "global_step": 130575, "epoch": 1573} {"train_loss": -22.518508911132812, "global_step": 130576, "epoch": 1573} {"train_loss": -22.664478302001953, "global_step": 130577, "epoch": 1573} {"train_loss": -22.548133850097656, "global_step": 130578, "epoch": 1573} {"train_loss": -22.773273468017578, "global_step": 130579, "epoch": 1573} {"train_loss": -22.840219497680664, "global_step": 130580, "epoch": 1573} {"train_loss": -22.44454574584961, "global_step": 130581, "epoch": 1573} {"train_loss": -22.984159469604492, "global_step": 130582, "epoch": 1573} {"train_loss": -22.611371994018555, "global_step": 130583, "epoch": 1573} {"train_loss": -22.502111434936523, "global_step": 130584, "epoch": 1573} {"train_loss": -22.25065040588379, "global_step": 130585, "epoch": 1573} {"train_loss": -22.377029418945312, "global_step": 130586, "epoch": 1573} {"train_loss": -22.873016357421875, "global_step": 130587, "epoch": 1573} {"train_loss": -22.532455444335938, "global_step": 130588, "epoch": 1573} {"train_loss": -22.931081771850586, "global_step": 130589, "epoch": 1573} {"train_loss": -22.835229873657227, "global_step": 130590, "epoch": 1573} {"train_loss": -22.751564025878906, "global_step": 130591, "epoch": 1573} {"train_loss": -22.71001434326172, "global_step": 130592, "epoch": 1573} {"train_loss": -22.758264541625977, "global_step": 130593, "epoch": 1573} {"train_loss": -23.112247467041016, "global_step": 130594, "epoch": 1573} {"train_loss": -23.2012996673584, "global_step": 130595, "epoch": 1573} {"train_loss": -23.03658676147461, "global_step": 130596, "epoch": 1573} {"train_loss": -23.27608299255371, "global_step": 130597, "epoch": 1573} {"train_loss": -22.73954200744629, "global_step": 130598, "epoch": 1573} {"train_loss": -22.574142456054688, "global_step": 130599, "epoch": 1573} {"train_loss": -22.81319236755371, "global_step": 130600, "epoch": 1573} {"train_loss": -22.91437339782715, "global_step": 130601, "epoch": 1573} {"train_loss": -22.827377319335938, "global_step": 130602, "epoch": 1573} {"train_loss": -23.002775192260742, "global_step": 130603, "epoch": 1573} {"train_loss": -22.581924438476562, "global_step": 130604, "epoch": 1573} {"train_loss": -23.117055892944336, "global_step": 130605, "epoch": 1573} {"train_loss": -23.19721794128418, "global_step": 130606, "epoch": 1573} {"train_loss": -23.03761100769043, "global_step": 130607, "epoch": 1573} {"train_loss": -22.598188400268555, "global_step": 130608, "epoch": 1573} {"train_loss": -23.063966751098633, "global_step": 130609, "epoch": 1573} {"train_loss": -22.63512420654297, "global_step": 130610, "epoch": 1573} {"train_loss": -22.83085060119629, "global_step": 130611, "epoch": 1573} {"train_loss": -23.023910522460938, "global_step": 130612, "epoch": 1573} {"train_loss": -22.814533233642578, "global_step": 130613, "epoch": 1573} {"train_loss": -22.9288272857666, "global_step": 130614, "epoch": 1573} {"train_loss": -22.765201568603516, "global_step": 130615, "epoch": 1573} {"train_loss": -23.004566192626953, "global_step": 130616, "epoch": 1573} {"train_loss": -22.889923095703125, "global_step": 130617, "epoch": 1573} {"train_loss": -22.943052291870117, "global_step": 130618, "epoch": 1573} {"train_loss": -22.86916160583496, "global_step": 130619, "epoch": 1573} {"train_loss": -22.64725685119629, "global_step": 130620, "epoch": 1573} {"train_loss": -23.095699310302734, "global_step": 130621, "epoch": 1573} {"train_loss": -22.892179489135742, "global_step": 130622, "epoch": 1573} {"train_loss": -22.756086349487305, "global_step": 130623, "epoch": 1573} {"train_loss": -22.658130645751953, "global_step": 130624, "epoch": 1573} {"train_loss": -22.915021896362305, "global_step": 130625, "epoch": 1573} {"train_loss": -23.123258590698242, "global_step": 130626, "epoch": 1573} {"train_loss": -22.548004150390625, "global_step": 130627, "epoch": 1573} {"train_loss": -22.79012107849121, "global_step": 130628, "epoch": 1573} {"train_loss": -22.83550453186035, "global_step": 130629, "epoch": 1573} {"train_loss": -22.88392448425293, "global_step": 130630, "epoch": 1573} {"train_loss": -22.762638092041016, "global_step": 130631, "epoch": 1573} {"train_loss": -22.501785278320312, "global_step": 130632, "epoch": 1573} {"train_loss": -22.816150665283203, "global_step": 130633, "epoch": 1573} {"train_loss": -23.03824806213379, "global_step": 130634, "epoch": 1573} {"train_loss": -22.879703521728516, "global_step": 130635, "epoch": 1573} {"train_loss": -23.006940841674805, "global_step": 130636, "epoch": 1573} {"train_loss": -22.811267852783203, "global_step": 130637, "epoch": 1573} {"train_loss": -22.487764358520508, "global_step": 130638, "epoch": 1573} {"train_loss": -22.768421173095703, "global_step": 130639, "epoch": 1573} {"train_loss": -22.618051528930664, "global_step": 130640, "epoch": 1573} {"train_loss": -22.69544236056776, "global_step": 130641, "epoch": 1573, "val_loss": 6236085.0} {"train_loss": -21.787235260009766, "global_step": 130642, "epoch": 1574} {"train_loss": -22.45006561279297, "global_step": 130643, "epoch": 1574} {"train_loss": -22.128286361694336, "global_step": 130644, "epoch": 1574} {"train_loss": -22.051950454711914, "global_step": 130645, "epoch": 1574} {"train_loss": -22.61968421936035, "global_step": 130646, "epoch": 1574} {"train_loss": -22.440078735351562, "global_step": 130647, "epoch": 1574} {"train_loss": -22.540700912475586, "global_step": 130648, "epoch": 1574} {"train_loss": -22.75453758239746, "global_step": 130649, "epoch": 1574} {"train_loss": -22.275449752807617, "global_step": 130650, "epoch": 1574} {"train_loss": -22.444074630737305, "global_step": 130651, "epoch": 1574} {"train_loss": -22.78199577331543, "global_step": 130652, "epoch": 1574} {"train_loss": -22.615291595458984, "global_step": 130653, "epoch": 1574} {"train_loss": -22.906951904296875, "global_step": 130654, "epoch": 1574} {"train_loss": -22.473541259765625, "global_step": 130655, "epoch": 1574} {"train_loss": -22.523988723754883, "global_step": 130656, "epoch": 1574} {"train_loss": -22.536596298217773, "global_step": 130657, "epoch": 1574} {"train_loss": -22.49342918395996, "global_step": 130658, "epoch": 1574} {"train_loss": -23.026123046875, "global_step": 130659, "epoch": 1574} {"train_loss": -22.747180938720703, "global_step": 130660, "epoch": 1574} {"train_loss": -22.475614547729492, "global_step": 130661, "epoch": 1574} {"train_loss": -22.995038986206055, "global_step": 130662, "epoch": 1574} {"train_loss": -22.936464309692383, "global_step": 130663, "epoch": 1574} {"train_loss": -23.134401321411133, "global_step": 130664, "epoch": 1574} {"train_loss": -22.658889770507812, "global_step": 130665, "epoch": 1574} {"train_loss": -23.200437545776367, "global_step": 130666, "epoch": 1574} {"train_loss": -22.572050094604492, "global_step": 130667, "epoch": 1574} {"train_loss": -22.46558952331543, "global_step": 130668, "epoch": 1574} {"train_loss": -22.80841636657715, "global_step": 130669, "epoch": 1574} {"train_loss": -22.92188835144043, "global_step": 130670, "epoch": 1574} {"train_loss": -22.99750328063965, "global_step": 130671, "epoch": 1574} {"train_loss": -22.622318267822266, "global_step": 130672, "epoch": 1574} {"train_loss": -22.693906784057617, "global_step": 130673, "epoch": 1574} {"train_loss": -22.647239685058594, "global_step": 130674, "epoch": 1574} {"train_loss": -22.85015869140625, "global_step": 130675, "epoch": 1574} {"train_loss": -22.82561683654785, "global_step": 130676, "epoch": 1574} {"train_loss": -22.964372634887695, "global_step": 130677, "epoch": 1574} {"train_loss": -23.010330200195312, "global_step": 130678, "epoch": 1574} {"train_loss": -23.126684188842773, "global_step": 130679, "epoch": 1574} {"train_loss": -23.053625106811523, "global_step": 130680, "epoch": 1574} {"train_loss": -22.386159896850586, "global_step": 130681, "epoch": 1574} {"train_loss": -23.124502182006836, "global_step": 130682, "epoch": 1574} {"train_loss": -22.79009437561035, "global_step": 130683, "epoch": 1574} {"train_loss": -22.5430965423584, "global_step": 130684, "epoch": 1574} {"train_loss": -22.890167236328125, "global_step": 130685, "epoch": 1574} {"train_loss": -22.837461471557617, "global_step": 130686, "epoch": 1574} {"train_loss": -22.704299926757812, "global_step": 130687, "epoch": 1574} {"train_loss": -22.99462127685547, "global_step": 130688, "epoch": 1574} {"train_loss": -22.848316192626953, "global_step": 130689, "epoch": 1574} {"train_loss": -22.9050350189209, "global_step": 130690, "epoch": 1574} {"train_loss": -22.880268096923828, "global_step": 130691, "epoch": 1574} {"train_loss": -23.027631759643555, "global_step": 130692, "epoch": 1574} {"train_loss": -22.40244483947754, "global_step": 130693, "epoch": 1574} {"train_loss": -22.69789695739746, "global_step": 130694, "epoch": 1574} {"train_loss": -23.073081970214844, "global_step": 130695, "epoch": 1574} {"train_loss": -22.708938598632812, "global_step": 130696, "epoch": 1574} {"train_loss": -22.764944076538086, "global_step": 130697, "epoch": 1574} {"train_loss": -22.624298095703125, "global_step": 130698, "epoch": 1574} {"train_loss": -22.5800724029541, "global_step": 130699, "epoch": 1574} {"train_loss": -23.258405685424805, "global_step": 130700, "epoch": 1574} {"train_loss": -22.795270919799805, "global_step": 130701, "epoch": 1574} {"train_loss": -22.91128921508789, "global_step": 130702, "epoch": 1574} {"train_loss": -23.093429565429688, "global_step": 130703, "epoch": 1574} {"train_loss": -23.064451217651367, "global_step": 130704, "epoch": 1574} {"train_loss": -22.886032104492188, "global_step": 130705, "epoch": 1574} {"train_loss": -22.826812744140625, "global_step": 130706, "epoch": 1574} {"train_loss": -22.903778076171875, "global_step": 130707, "epoch": 1574} {"train_loss": -22.924808502197266, "global_step": 130708, "epoch": 1574} {"train_loss": -22.731353759765625, "global_step": 130709, "epoch": 1574} {"train_loss": -22.925716400146484, "global_step": 130710, "epoch": 1574} {"train_loss": -23.006750106811523, "global_step": 130711, "epoch": 1574} {"train_loss": -22.742923736572266, "global_step": 130712, "epoch": 1574} {"train_loss": -22.897729873657227, "global_step": 130713, "epoch": 1574} {"train_loss": -22.61697769165039, "global_step": 130714, "epoch": 1574} {"train_loss": -22.903562545776367, "global_step": 130715, "epoch": 1574} {"train_loss": -22.959110260009766, "global_step": 130716, "epoch": 1574} {"train_loss": -23.312274932861328, "global_step": 130717, "epoch": 1574} {"train_loss": -22.762815475463867, "global_step": 130718, "epoch": 1574} {"train_loss": -22.96645736694336, "global_step": 130719, "epoch": 1574} {"train_loss": -22.894399642944336, "global_step": 130720, "epoch": 1574} {"train_loss": -22.61115837097168, "global_step": 130721, "epoch": 1574} {"train_loss": -23.222434997558594, "global_step": 130722, "epoch": 1574} {"train_loss": -22.69139289855957, "global_step": 130723, "epoch": 1574} {"train_loss": -22.787062794329174, "global_step": 130724, "epoch": 1574, "val_loss": 6277951.5} {"train_loss": -22.317190170288086, "global_step": 130725, "epoch": 1575} {"train_loss": -22.09954071044922, "global_step": 130726, "epoch": 1575} {"train_loss": -21.908796310424805, "global_step": 130727, "epoch": 1575} {"train_loss": -22.680410385131836, "global_step": 130728, "epoch": 1575} {"train_loss": -22.172046661376953, "global_step": 130729, "epoch": 1575} {"train_loss": -21.65021514892578, "global_step": 130730, "epoch": 1575} {"train_loss": -22.32383155822754, "global_step": 130731, "epoch": 1575} {"train_loss": -22.320524215698242, "global_step": 130732, "epoch": 1575} {"train_loss": -22.384021759033203, "global_step": 130733, "epoch": 1575} {"train_loss": -22.328250885009766, "global_step": 130734, "epoch": 1575} {"train_loss": -22.628026962280273, "global_step": 130735, "epoch": 1575} {"train_loss": -22.52200698852539, "global_step": 130736, "epoch": 1575} {"train_loss": -22.63179588317871, "global_step": 130737, "epoch": 1575} {"train_loss": -22.252674102783203, "global_step": 130738, "epoch": 1575} {"train_loss": -22.4161434173584, "global_step": 130739, "epoch": 1575} {"train_loss": -22.52217674255371, "global_step": 130740, "epoch": 1575} {"train_loss": -22.531801223754883, "global_step": 130741, "epoch": 1575} {"train_loss": -22.532958984375, "global_step": 130742, "epoch": 1575} {"train_loss": -22.446121215820312, "global_step": 130743, "epoch": 1575} {"train_loss": -22.7319393157959, "global_step": 130744, "epoch": 1575} {"train_loss": -22.584562301635742, "global_step": 130745, "epoch": 1575} {"train_loss": -22.57038688659668, "global_step": 130746, "epoch": 1575} {"train_loss": -22.545074462890625, "global_step": 130747, "epoch": 1575} {"train_loss": -22.94439697265625, "global_step": 130748, "epoch": 1575} {"train_loss": -22.785531997680664, "global_step": 130749, "epoch": 1575} {"train_loss": -22.47142219543457, "global_step": 130750, "epoch": 1575} {"train_loss": -22.269739151000977, "global_step": 130751, "epoch": 1575} {"train_loss": -22.973459243774414, "global_step": 130752, "epoch": 1575} {"train_loss": -22.2629451751709, "global_step": 130753, "epoch": 1575} {"train_loss": -22.69754409790039, "global_step": 130754, "epoch": 1575} {"train_loss": -22.746740341186523, "global_step": 130755, "epoch": 1575} {"train_loss": -22.630538940429688, "global_step": 130756, "epoch": 1575} {"train_loss": -22.923830032348633, "global_step": 130757, "epoch": 1575} {"train_loss": -22.793302536010742, "global_step": 130758, "epoch": 1575} {"train_loss": -22.797040939331055, "global_step": 130759, "epoch": 1575} {"train_loss": -22.554458618164062, "global_step": 130760, "epoch": 1575} {"train_loss": -22.767101287841797, "global_step": 130761, "epoch": 1575} {"train_loss": -22.62897300720215, "global_step": 130762, "epoch": 1575} {"train_loss": -22.715513229370117, "global_step": 130763, "epoch": 1575} {"train_loss": -22.727821350097656, "global_step": 130764, "epoch": 1575} {"train_loss": -22.62224769592285, "global_step": 130765, "epoch": 1575} {"train_loss": -22.90610122680664, "global_step": 130766, "epoch": 1575} {"train_loss": -22.82416343688965, "global_step": 130767, "epoch": 1575} {"train_loss": -22.67098045349121, "global_step": 130768, "epoch": 1575} {"train_loss": -22.944673538208008, "global_step": 130769, "epoch": 1575} {"train_loss": -22.468046188354492, "global_step": 130770, "epoch": 1575} {"train_loss": -22.67131805419922, "global_step": 130771, "epoch": 1575} {"train_loss": -22.568639755249023, "global_step": 130772, "epoch": 1575} {"train_loss": -22.393423080444336, "global_step": 130773, "epoch": 1575} {"train_loss": -22.82223892211914, "global_step": 130774, "epoch": 1575} {"train_loss": -22.882526397705078, "global_step": 130775, "epoch": 1575} {"train_loss": -22.83863639831543, "global_step": 130776, "epoch": 1575} {"train_loss": -22.796377182006836, "global_step": 130777, "epoch": 1575} {"train_loss": -22.978687286376953, "global_step": 130778, "epoch": 1575} {"train_loss": -22.67643165588379, "global_step": 130779, "epoch": 1575} {"train_loss": -22.865053176879883, "global_step": 130780, "epoch": 1575} {"train_loss": -22.794103622436523, "global_step": 130781, "epoch": 1575} {"train_loss": -23.049530029296875, "global_step": 130782, "epoch": 1575} {"train_loss": -22.82771873474121, "global_step": 130783, "epoch": 1575} {"train_loss": -23.032398223876953, "global_step": 130784, "epoch": 1575} {"train_loss": -23.00130271911621, "global_step": 130785, "epoch": 1575} {"train_loss": -22.564361572265625, "global_step": 130786, "epoch": 1575} {"train_loss": -23.054317474365234, "global_step": 130787, "epoch": 1575} {"train_loss": -22.556705474853516, "global_step": 130788, "epoch": 1575} {"train_loss": -22.19930076599121, "global_step": 130789, "epoch": 1575} {"train_loss": -22.732328414916992, "global_step": 130790, "epoch": 1575} {"train_loss": -23.06594467163086, "global_step": 130791, "epoch": 1575} {"train_loss": -22.5439395904541, "global_step": 130792, "epoch": 1575} {"train_loss": -23.352598190307617, "global_step": 130793, "epoch": 1575} {"train_loss": -22.810138702392578, "global_step": 130794, "epoch": 1575} {"train_loss": -22.982389450073242, "global_step": 130795, "epoch": 1575} {"train_loss": -23.0045223236084, "global_step": 130796, "epoch": 1575} {"train_loss": -22.91059684753418, "global_step": 130797, "epoch": 1575} {"train_loss": -22.954833984375, "global_step": 130798, "epoch": 1575} {"train_loss": -22.787878036499023, "global_step": 130799, "epoch": 1575} {"train_loss": -22.8096923828125, "global_step": 130800, "epoch": 1575} {"train_loss": -22.844541549682617, "global_step": 130801, "epoch": 1575} {"train_loss": -22.84077262878418, "global_step": 130802, "epoch": 1575} {"train_loss": -23.033161163330078, "global_step": 130803, "epoch": 1575} {"train_loss": -23.16078758239746, "global_step": 130804, "epoch": 1575} {"train_loss": -22.789234161376953, "global_step": 130805, "epoch": 1575} {"train_loss": -23.109922409057617, "global_step": 130806, "epoch": 1575} {"train_loss": -22.687453212508235, "global_step": 130807, "epoch": 1575, "val_loss": 6345932.5} {"train_loss": -22.391559600830078, "global_step": 130808, "epoch": 1576} {"train_loss": -22.81467628479004, "global_step": 130809, "epoch": 1576} {"train_loss": -22.449451446533203, "global_step": 130810, "epoch": 1576} {"train_loss": -22.63705825805664, "global_step": 130811, "epoch": 1576} {"train_loss": -22.52617835998535, "global_step": 130812, "epoch": 1576} {"train_loss": -22.48295021057129, "global_step": 130813, "epoch": 1576} {"train_loss": -22.51856803894043, "global_step": 130814, "epoch": 1576} {"train_loss": -22.830801010131836, "global_step": 130815, "epoch": 1576} {"train_loss": -22.793569564819336, "global_step": 130816, "epoch": 1576} {"train_loss": -22.48615837097168, "global_step": 130817, "epoch": 1576} {"train_loss": -22.371442794799805, "global_step": 130818, "epoch": 1576} {"train_loss": -22.941492080688477, "global_step": 130819, "epoch": 1576} {"train_loss": -22.538434982299805, "global_step": 130820, "epoch": 1576} {"train_loss": -22.512001037597656, "global_step": 130821, "epoch": 1576} {"train_loss": -22.8699893951416, "global_step": 130822, "epoch": 1576} {"train_loss": -23.062957763671875, "global_step": 130823, "epoch": 1576} {"train_loss": -23.2810115814209, "global_step": 130824, "epoch": 1576} {"train_loss": -22.331031799316406, "global_step": 130825, "epoch": 1576} {"train_loss": -22.844961166381836, "global_step": 130826, "epoch": 1576} {"train_loss": -23.152423858642578, "global_step": 130827, "epoch": 1576} {"train_loss": -22.906763076782227, "global_step": 130828, "epoch": 1576} {"train_loss": -23.218496322631836, "global_step": 130829, "epoch": 1576} {"train_loss": -22.627521514892578, "global_step": 130830, "epoch": 1576} {"train_loss": -22.400583267211914, "global_step": 130831, "epoch": 1576} {"train_loss": -22.56153678894043, "global_step": 130832, "epoch": 1576} {"train_loss": -22.575122833251953, "global_step": 130833, "epoch": 1576} {"train_loss": -22.852554321289062, "global_step": 130834, "epoch": 1576} {"train_loss": -22.543304443359375, "global_step": 130835, "epoch": 1576} {"train_loss": -22.790863037109375, "global_step": 130836, "epoch": 1576} {"train_loss": -22.534164428710938, "global_step": 130837, "epoch": 1576} {"train_loss": -22.676767349243164, "global_step": 130838, "epoch": 1576} {"train_loss": -22.80436134338379, "global_step": 130839, "epoch": 1576} {"train_loss": -22.620580673217773, "global_step": 130840, "epoch": 1576} {"train_loss": -23.124080657958984, "global_step": 130841, "epoch": 1576} {"train_loss": -22.374099731445312, "global_step": 130842, "epoch": 1576} {"train_loss": -22.6351375579834, "global_step": 130843, "epoch": 1576} {"train_loss": -22.361066818237305, "global_step": 130844, "epoch": 1576} {"train_loss": -22.96491813659668, "global_step": 130845, "epoch": 1576} {"train_loss": -22.730316162109375, "global_step": 130846, "epoch": 1576} {"train_loss": -23.063756942749023, "global_step": 130847, "epoch": 1576} {"train_loss": -23.18201446533203, "global_step": 130848, "epoch": 1576} {"train_loss": -22.82404899597168, "global_step": 130849, "epoch": 1576} {"train_loss": -22.86982536315918, "global_step": 130850, "epoch": 1576} {"train_loss": -23.112539291381836, "global_step": 130851, "epoch": 1576} {"train_loss": -22.448911666870117, "global_step": 130852, "epoch": 1576} {"train_loss": -22.699838638305664, "global_step": 130853, "epoch": 1576} {"train_loss": -22.718063354492188, "global_step": 130854, "epoch": 1576} {"train_loss": -22.745254516601562, "global_step": 130855, "epoch": 1576} {"train_loss": -22.53443717956543, "global_step": 130856, "epoch": 1576} {"train_loss": -22.330135345458984, "global_step": 130857, "epoch": 1576} {"train_loss": -22.922922134399414, "global_step": 130858, "epoch": 1576} {"train_loss": -22.995075225830078, "global_step": 130859, "epoch": 1576} {"train_loss": -23.036298751831055, "global_step": 130860, "epoch": 1576} {"train_loss": -23.018220901489258, "global_step": 130861, "epoch": 1576} {"train_loss": -23.086515426635742, "global_step": 130862, "epoch": 1576} {"train_loss": -22.52924919128418, "global_step": 130863, "epoch": 1576} {"train_loss": -22.90691375732422, "global_step": 130864, "epoch": 1576} {"train_loss": -23.07817840576172, "global_step": 130865, "epoch": 1576} {"train_loss": -22.87006950378418, "global_step": 130866, "epoch": 1576} {"train_loss": -23.064977645874023, "global_step": 130867, "epoch": 1576} {"train_loss": -22.615406036376953, "global_step": 130868, "epoch": 1576} {"train_loss": -23.233549118041992, "global_step": 130869, "epoch": 1576} {"train_loss": -22.852880477905273, "global_step": 130870, "epoch": 1576} {"train_loss": -23.035541534423828, "global_step": 130871, "epoch": 1576} {"train_loss": -22.90836524963379, "global_step": 130872, "epoch": 1576} {"train_loss": -22.778955459594727, "global_step": 130873, "epoch": 1576} {"train_loss": -22.72537612915039, "global_step": 130874, "epoch": 1576} {"train_loss": -22.783109664916992, "global_step": 130875, "epoch": 1576} {"train_loss": -22.75132942199707, "global_step": 130876, "epoch": 1576} {"train_loss": -22.503318786621094, "global_step": 130877, "epoch": 1576} {"train_loss": -23.011838912963867, "global_step": 130878, "epoch": 1576} {"train_loss": -23.01904296875, "global_step": 130879, "epoch": 1576} {"train_loss": -22.766239166259766, "global_step": 130880, "epoch": 1576} {"train_loss": -22.7363338470459, "global_step": 130881, "epoch": 1576} {"train_loss": -22.690752029418945, "global_step": 130882, "epoch": 1576} {"train_loss": -22.679637908935547, "global_step": 130883, "epoch": 1576} {"train_loss": -22.66377830505371, "global_step": 130884, "epoch": 1576} {"train_loss": -22.619089126586914, "global_step": 130885, "epoch": 1576} {"train_loss": -22.558963775634766, "global_step": 130886, "epoch": 1576} {"train_loss": -22.482290267944336, "global_step": 130887, "epoch": 1576} {"train_loss": -22.656476974487305, "global_step": 130888, "epoch": 1576} {"train_loss": -23.00287437438965, "global_step": 130889, "epoch": 1576} {"train_loss": -22.7658668426146, "global_step": 130890, "epoch": 1576, "val_loss": 6194539.0} {"train_loss": -22.129173278808594, "global_step": 130891, "epoch": 1577} {"train_loss": -22.04388427734375, "global_step": 130892, "epoch": 1577} {"train_loss": -22.340375900268555, "global_step": 130893, "epoch": 1577} {"train_loss": -22.557723999023438, "global_step": 130894, "epoch": 1577} {"train_loss": -22.42544937133789, "global_step": 130895, "epoch": 1577} {"train_loss": -22.367748260498047, "global_step": 130896, "epoch": 1577} {"train_loss": -22.651233673095703, "global_step": 130897, "epoch": 1577} {"train_loss": -22.40767478942871, "global_step": 130898, "epoch": 1577} {"train_loss": -22.79022789001465, "global_step": 130899, "epoch": 1577} {"train_loss": -22.395130157470703, "global_step": 130900, "epoch": 1577} {"train_loss": -22.64466667175293, "global_step": 130901, "epoch": 1577} {"train_loss": -22.487258911132812, "global_step": 130902, "epoch": 1577} {"train_loss": -22.495315551757812, "global_step": 130903, "epoch": 1577} {"train_loss": -22.717561721801758, "global_step": 130904, "epoch": 1577} {"train_loss": -22.735353469848633, "global_step": 130905, "epoch": 1577} {"train_loss": -22.922229766845703, "global_step": 130906, "epoch": 1577} {"train_loss": -22.73270034790039, "global_step": 130907, "epoch": 1577} {"train_loss": -22.50752067565918, "global_step": 130908, "epoch": 1577} {"train_loss": -22.722532272338867, "global_step": 130909, "epoch": 1577} {"train_loss": -22.509519577026367, "global_step": 130910, "epoch": 1577} {"train_loss": -22.80901336669922, "global_step": 130911, "epoch": 1577} {"train_loss": -22.666685104370117, "global_step": 130912, "epoch": 1577} {"train_loss": -22.699209213256836, "global_step": 130913, "epoch": 1577} {"train_loss": -22.373397827148438, "global_step": 130914, "epoch": 1577} {"train_loss": -22.6584529876709, "global_step": 130915, "epoch": 1577} {"train_loss": -22.4169979095459, "global_step": 130916, "epoch": 1577} {"train_loss": -22.372365951538086, "global_step": 130917, "epoch": 1577} {"train_loss": -22.66517448425293, "global_step": 130918, "epoch": 1577} {"train_loss": -22.731552124023438, "global_step": 130919, "epoch": 1577} {"train_loss": -23.016372680664062, "global_step": 130920, "epoch": 1577} {"train_loss": -22.76247215270996, "global_step": 130921, "epoch": 1577} {"train_loss": -22.73957633972168, "global_step": 130922, "epoch": 1577} {"train_loss": -23.136884689331055, "global_step": 130923, "epoch": 1577} {"train_loss": -22.675399780273438, "global_step": 130924, "epoch": 1577} {"train_loss": -22.69627571105957, "global_step": 130925, "epoch": 1577} {"train_loss": -23.009532928466797, "global_step": 130926, "epoch": 1577} {"train_loss": -22.649213790893555, "global_step": 130927, "epoch": 1577} {"train_loss": -23.023752212524414, "global_step": 130928, "epoch": 1577} {"train_loss": -22.918867111206055, "global_step": 130929, "epoch": 1577} {"train_loss": -23.034351348876953, "global_step": 130930, "epoch": 1577} {"train_loss": -23.001569747924805, "global_step": 130931, "epoch": 1577} {"train_loss": -23.100370407104492, "global_step": 130932, "epoch": 1577} {"train_loss": -22.964277267456055, "global_step": 130933, "epoch": 1577} {"train_loss": -22.826160430908203, "global_step": 130934, "epoch": 1577} {"train_loss": -22.681716918945312, "global_step": 130935, "epoch": 1577} {"train_loss": -23.227615356445312, "global_step": 130936, "epoch": 1577} {"train_loss": -22.939889907836914, "global_step": 130937, "epoch": 1577} {"train_loss": -22.73311424255371, "global_step": 130938, "epoch": 1577} {"train_loss": -22.951135635375977, "global_step": 130939, "epoch": 1577} {"train_loss": -22.699167251586914, "global_step": 130940, "epoch": 1577} {"train_loss": -22.64405632019043, "global_step": 130941, "epoch": 1577} {"train_loss": -23.088024139404297, "global_step": 130942, "epoch": 1577} {"train_loss": -23.228710174560547, "global_step": 130943, "epoch": 1577} {"train_loss": -22.703258514404297, "global_step": 130944, "epoch": 1577} {"train_loss": -22.65462303161621, "global_step": 130945, "epoch": 1577} {"train_loss": -23.074846267700195, "global_step": 130946, "epoch": 1577} {"train_loss": -22.73426628112793, "global_step": 130947, "epoch": 1577} {"train_loss": -23.043720245361328, "global_step": 130948, "epoch": 1577} {"train_loss": -22.27182960510254, "global_step": 130949, "epoch": 1577} {"train_loss": -22.942380905151367, "global_step": 130950, "epoch": 1577} {"train_loss": -23.178918838500977, "global_step": 130951, "epoch": 1577} {"train_loss": -22.868131637573242, "global_step": 130952, "epoch": 1577} {"train_loss": -22.4340763092041, "global_step": 130953, "epoch": 1577} {"train_loss": -23.150846481323242, "global_step": 130954, "epoch": 1577} {"train_loss": -22.417280197143555, "global_step": 130955, "epoch": 1577} {"train_loss": -22.927019119262695, "global_step": 130956, "epoch": 1577} {"train_loss": -22.962066650390625, "global_step": 130957, "epoch": 1577} {"train_loss": -22.956552505493164, "global_step": 130958, "epoch": 1577} {"train_loss": -22.803152084350586, "global_step": 130959, "epoch": 1577} {"train_loss": -22.80507469177246, "global_step": 130960, "epoch": 1577} {"train_loss": -22.8885498046875, "global_step": 130961, "epoch": 1577} {"train_loss": -22.460546493530273, "global_step": 130962, "epoch": 1577} {"train_loss": -22.942546844482422, "global_step": 130963, "epoch": 1577} {"train_loss": -22.642454147338867, "global_step": 130964, "epoch": 1577} {"train_loss": -22.960622787475586, "global_step": 130965, "epoch": 1577} {"train_loss": -22.78761100769043, "global_step": 130966, "epoch": 1577} {"train_loss": -22.910964965820312, "global_step": 130967, "epoch": 1577} {"train_loss": -23.111513137817383, "global_step": 130968, "epoch": 1577} {"train_loss": -23.022192001342773, "global_step": 130969, "epoch": 1577} {"train_loss": -22.8349609375, "global_step": 130970, "epoch": 1577} {"train_loss": -22.732646942138672, "global_step": 130971, "epoch": 1577} {"train_loss": -22.74672508239746, "global_step": 130972, "epoch": 1577} {"train_loss": -22.742037646741753, "global_step": 130973, "epoch": 1577, "val_loss": 6430505.0} {"train_loss": -22.769765853881836, "global_step": 130974, "epoch": 1578} {"train_loss": -22.27241325378418, "global_step": 130975, "epoch": 1578} {"train_loss": -22.20444679260254, "global_step": 130976, "epoch": 1578} {"train_loss": -22.948183059692383, "global_step": 130977, "epoch": 1578} {"train_loss": -22.427509307861328, "global_step": 130978, "epoch": 1578} {"train_loss": -22.55645179748535, "global_step": 130979, "epoch": 1578} {"train_loss": -22.5396671295166, "global_step": 130980, "epoch": 1578} {"train_loss": -22.58162498474121, "global_step": 130981, "epoch": 1578} {"train_loss": -23.057031631469727, "global_step": 130982, "epoch": 1578} {"train_loss": -22.245285034179688, "global_step": 130983, "epoch": 1578} {"train_loss": -22.758956909179688, "global_step": 130984, "epoch": 1578} {"train_loss": -22.870786666870117, "global_step": 130985, "epoch": 1578} {"train_loss": -22.500274658203125, "global_step": 130986, "epoch": 1578} {"train_loss": -22.816308975219727, "global_step": 130987, "epoch": 1578} {"train_loss": -22.75214958190918, "global_step": 130988, "epoch": 1578} {"train_loss": -22.710803985595703, "global_step": 130989, "epoch": 1578} {"train_loss": -22.8870849609375, "global_step": 130990, "epoch": 1578} {"train_loss": -22.876230239868164, "global_step": 130991, "epoch": 1578} {"train_loss": -22.94877815246582, "global_step": 130992, "epoch": 1578} {"train_loss": -22.779550552368164, "global_step": 130993, "epoch": 1578} {"train_loss": -22.614328384399414, "global_step": 130994, "epoch": 1578} {"train_loss": -22.99514389038086, "global_step": 130995, "epoch": 1578} {"train_loss": -22.895963668823242, "global_step": 130996, "epoch": 1578} {"train_loss": -23.027969360351562, "global_step": 130997, "epoch": 1578} {"train_loss": -22.76228141784668, "global_step": 130998, "epoch": 1578} {"train_loss": -22.920846939086914, "global_step": 130999, "epoch": 1578} {"train_loss": -23.27558708190918, "global_step": 131000, "epoch": 1578} {"train_loss": -23.114383697509766, "global_step": 131001, "epoch": 1578} {"train_loss": -23.042476654052734, "global_step": 131002, "epoch": 1578} {"train_loss": -23.098119735717773, "global_step": 131003, "epoch": 1578} {"train_loss": -22.74827003479004, "global_step": 131004, "epoch": 1578} {"train_loss": -23.3880615234375, "global_step": 131005, "epoch": 1578} {"train_loss": -23.02248764038086, "global_step": 131006, "epoch": 1578} {"train_loss": -22.77796745300293, "global_step": 131007, "epoch": 1578} {"train_loss": -22.761608123779297, "global_step": 131008, "epoch": 1578} {"train_loss": -22.753681182861328, "global_step": 131009, "epoch": 1578} {"train_loss": -22.611188888549805, "global_step": 131010, "epoch": 1578} {"train_loss": -22.874441146850586, "global_step": 131011, "epoch": 1578} {"train_loss": -22.9077205657959, "global_step": 131012, "epoch": 1578} {"train_loss": -23.2742977142334, "global_step": 131013, "epoch": 1578} {"train_loss": -22.93008041381836, "global_step": 131014, "epoch": 1578} {"train_loss": -22.70850944519043, "global_step": 131015, "epoch": 1578} {"train_loss": -23.027109146118164, "global_step": 131016, "epoch": 1578} {"train_loss": -22.620588302612305, "global_step": 131017, "epoch": 1578} {"train_loss": -22.93964958190918, "global_step": 131018, "epoch": 1578} {"train_loss": -22.90652847290039, "global_step": 131019, "epoch": 1578} {"train_loss": -22.769840240478516, "global_step": 131020, "epoch": 1578} {"train_loss": -22.81012535095215, "global_step": 131021, "epoch": 1578} {"train_loss": -23.04269790649414, "global_step": 131022, "epoch": 1578} {"train_loss": -22.867019653320312, "global_step": 131023, "epoch": 1578} {"train_loss": -22.6599178314209, "global_step": 131024, "epoch": 1578} {"train_loss": -22.526033401489258, "global_step": 131025, "epoch": 1578} {"train_loss": -22.639890670776367, "global_step": 131026, "epoch": 1578} {"train_loss": -22.659351348876953, "global_step": 131027, "epoch": 1578} {"train_loss": -22.969327926635742, "global_step": 131028, "epoch": 1578} {"train_loss": -22.433683395385742, "global_step": 131029, "epoch": 1578} {"train_loss": -22.690725326538086, "global_step": 131030, "epoch": 1578} {"train_loss": -22.5183048248291, "global_step": 131031, "epoch": 1578} {"train_loss": -22.40668296813965, "global_step": 131032, "epoch": 1578} {"train_loss": -22.62503433227539, "global_step": 131033, "epoch": 1578} {"train_loss": -22.73029899597168, "global_step": 131034, "epoch": 1578} {"train_loss": -22.8184814453125, "global_step": 131035, "epoch": 1578} {"train_loss": -22.982492446899414, "global_step": 131036, "epoch": 1578} {"train_loss": -22.67805290222168, "global_step": 131037, "epoch": 1578} {"train_loss": -22.90616226196289, "global_step": 131038, "epoch": 1578} {"train_loss": -23.022541046142578, "global_step": 131039, "epoch": 1578} {"train_loss": -22.57514762878418, "global_step": 131040, "epoch": 1578} {"train_loss": -22.859882354736328, "global_step": 131041, "epoch": 1578} {"train_loss": -22.34832000732422, "global_step": 131042, "epoch": 1578} {"train_loss": -22.647890090942383, "global_step": 131043, "epoch": 1578} {"train_loss": -22.594322204589844, "global_step": 131044, "epoch": 1578} {"train_loss": -22.864456176757812, "global_step": 131045, "epoch": 1578} {"train_loss": -22.460309982299805, "global_step": 131046, "epoch": 1578} {"train_loss": -22.645389556884766, "global_step": 131047, "epoch": 1578} {"train_loss": -22.812240600585938, "global_step": 131048, "epoch": 1578} {"train_loss": -22.6051082611084, "global_step": 131049, "epoch": 1578} {"train_loss": -22.740406036376953, "global_step": 131050, "epoch": 1578} {"train_loss": -23.030038833618164, "global_step": 131051, "epoch": 1578} {"train_loss": -22.642148971557617, "global_step": 131052, "epoch": 1578} {"train_loss": -22.602869033813477, "global_step": 131053, "epoch": 1578} {"train_loss": -22.707252502441406, "global_step": 131054, "epoch": 1578} {"train_loss": -22.92659568786621, "global_step": 131055, "epoch": 1578} {"train_loss": -22.761953009180274, "global_step": 131056, "epoch": 1578, "val_loss": 6295512.0} {"train_loss": -22.350934982299805, "global_step": 131057, "epoch": 1579} {"train_loss": -22.25568962097168, "global_step": 131058, "epoch": 1579} {"train_loss": -22.57863998413086, "global_step": 131059, "epoch": 1579} {"train_loss": -22.09465980529785, "global_step": 131060, "epoch": 1579} {"train_loss": -22.18018913269043, "global_step": 131061, "epoch": 1579} {"train_loss": -22.389585494995117, "global_step": 131062, "epoch": 1579} {"train_loss": -22.593536376953125, "global_step": 131063, "epoch": 1579} {"train_loss": -22.291189193725586, "global_step": 131064, "epoch": 1579} {"train_loss": -22.739473342895508, "global_step": 131065, "epoch": 1579} {"train_loss": -22.559574127197266, "global_step": 131066, "epoch": 1579} {"train_loss": -22.47315788269043, "global_step": 131067, "epoch": 1579} {"train_loss": -22.66657066345215, "global_step": 131068, "epoch": 1579} {"train_loss": -22.341590881347656, "global_step": 131069, "epoch": 1579} {"train_loss": -22.46157455444336, "global_step": 131070, "epoch": 1579} {"train_loss": -22.87979507446289, "global_step": 131071, "epoch": 1579} {"train_loss": -22.948396682739258, "global_step": 131072, "epoch": 1579} {"train_loss": -22.57403564453125, "global_step": 131073, "epoch": 1579} {"train_loss": -23.010229110717773, "global_step": 131074, "epoch": 1579} {"train_loss": -22.524648666381836, "global_step": 131075, "epoch": 1579} {"train_loss": -22.918827056884766, "global_step": 131076, "epoch": 1579} {"train_loss": -23.046812057495117, "global_step": 131077, "epoch": 1579} {"train_loss": -22.6457576751709, "global_step": 131078, "epoch": 1579} {"train_loss": -22.82265853881836, "global_step": 131079, "epoch": 1579} {"train_loss": -22.806081771850586, "global_step": 131080, "epoch": 1579} {"train_loss": -22.76517105102539, "global_step": 131081, "epoch": 1579} {"train_loss": -23.1229305267334, "global_step": 131082, "epoch": 1579} {"train_loss": -22.850112915039062, "global_step": 131083, "epoch": 1579} {"train_loss": -22.898277282714844, "global_step": 131084, "epoch": 1579} {"train_loss": -22.433917999267578, "global_step": 131085, "epoch": 1579} {"train_loss": -22.589868545532227, "global_step": 131086, "epoch": 1579} {"train_loss": -22.802698135375977, "global_step": 131087, "epoch": 1579} {"train_loss": -22.84577751159668, "global_step": 131088, "epoch": 1579} {"train_loss": -23.137470245361328, "global_step": 131089, "epoch": 1579} {"train_loss": -22.93056869506836, "global_step": 131090, "epoch": 1579} {"train_loss": -22.967693328857422, "global_step": 131091, "epoch": 1579} {"train_loss": -22.991857528686523, "global_step": 131092, "epoch": 1579} {"train_loss": -23.203052520751953, "global_step": 131093, "epoch": 1579} {"train_loss": -22.877262115478516, "global_step": 131094, "epoch": 1579} {"train_loss": -23.299375534057617, "global_step": 131095, "epoch": 1579} {"train_loss": -22.889455795288086, "global_step": 131096, "epoch": 1579} {"train_loss": -22.6178035736084, "global_step": 131097, "epoch": 1579} {"train_loss": -22.95863151550293, "global_step": 131098, "epoch": 1579} {"train_loss": -22.929630279541016, "global_step": 131099, "epoch": 1579} {"train_loss": -23.18684196472168, "global_step": 131100, "epoch": 1579} {"train_loss": -23.005895614624023, "global_step": 131101, "epoch": 1579} {"train_loss": -22.716211318969727, "global_step": 131102, "epoch": 1579} {"train_loss": -22.895313262939453, "global_step": 131103, "epoch": 1579} {"train_loss": -22.958423614501953, "global_step": 131104, "epoch": 1579} {"train_loss": -22.949262619018555, "global_step": 131105, "epoch": 1579} {"train_loss": -22.609878540039062, "global_step": 131106, "epoch": 1579} {"train_loss": -22.950536727905273, "global_step": 131107, "epoch": 1579} {"train_loss": -22.798540115356445, "global_step": 131108, "epoch": 1579} {"train_loss": -23.066308975219727, "global_step": 131109, "epoch": 1579} {"train_loss": -22.9211368560791, "global_step": 131110, "epoch": 1579} {"train_loss": -22.606555938720703, "global_step": 131111, "epoch": 1579} {"train_loss": -22.4934139251709, "global_step": 131112, "epoch": 1579} {"train_loss": -22.560636520385742, "global_step": 131113, "epoch": 1579} {"train_loss": -22.79388999938965, "global_step": 131114, "epoch": 1579} {"train_loss": -22.708389282226562, "global_step": 131115, "epoch": 1579} {"train_loss": -22.58234977722168, "global_step": 131116, "epoch": 1579} {"train_loss": -22.766448974609375, "global_step": 131117, "epoch": 1579} {"train_loss": -22.687740325927734, "global_step": 131118, "epoch": 1579} {"train_loss": -22.409467697143555, "global_step": 131119, "epoch": 1579} {"train_loss": -22.830224990844727, "global_step": 131120, "epoch": 1579} {"train_loss": -22.731609344482422, "global_step": 131121, "epoch": 1579} {"train_loss": -22.538393020629883, "global_step": 131122, "epoch": 1579} {"train_loss": -22.982025146484375, "global_step": 131123, "epoch": 1579} {"train_loss": -22.810657501220703, "global_step": 131124, "epoch": 1579} {"train_loss": -22.963552474975586, "global_step": 131125, "epoch": 1579} {"train_loss": -22.616687774658203, "global_step": 131126, "epoch": 1579} {"train_loss": -22.70349884033203, "global_step": 131127, "epoch": 1579} {"train_loss": -22.963232040405273, "global_step": 131128, "epoch": 1579} {"train_loss": -22.7990665435791, "global_step": 131129, "epoch": 1579} {"train_loss": -22.86733055114746, "global_step": 131130, "epoch": 1579} {"train_loss": -22.934234619140625, "global_step": 131131, "epoch": 1579} {"train_loss": -22.442251205444336, "global_step": 131132, "epoch": 1579} {"train_loss": -22.834768295288086, "global_step": 131133, "epoch": 1579} {"train_loss": -22.34836196899414, "global_step": 131134, "epoch": 1579} {"train_loss": -22.6308536529541, "global_step": 131135, "epoch": 1579} {"train_loss": -22.7668514251709, "global_step": 131136, "epoch": 1579} {"train_loss": -22.562042236328125, "global_step": 131137, "epoch": 1579} {"train_loss": -22.78499984741211, "global_step": 131138, "epoch": 1579} {"train_loss": -22.74331812111728, "global_step": 131139, "epoch": 1579, "val_loss": 6256592.0} {"train_loss": -22.862224578857422, "global_step": 131140, "epoch": 1580} {"train_loss": -22.700284957885742, "global_step": 131141, "epoch": 1580} {"train_loss": -22.398462295532227, "global_step": 131142, "epoch": 1580} {"train_loss": -22.70927619934082, "global_step": 131143, "epoch": 1580} {"train_loss": -22.6920166015625, "global_step": 131144, "epoch": 1580} {"train_loss": -22.286296844482422, "global_step": 131145, "epoch": 1580} {"train_loss": -22.495634078979492, "global_step": 131146, "epoch": 1580} {"train_loss": -22.77863883972168, "global_step": 131147, "epoch": 1580} {"train_loss": -22.485654830932617, "global_step": 131148, "epoch": 1580} {"train_loss": -22.380380630493164, "global_step": 131149, "epoch": 1580} {"train_loss": -22.45648765563965, "global_step": 131150, "epoch": 1580} {"train_loss": -22.913015365600586, "global_step": 131151, "epoch": 1580} {"train_loss": -22.567005157470703, "global_step": 131152, "epoch": 1580} {"train_loss": -23.45790672302246, "global_step": 131153, "epoch": 1580} {"train_loss": -23.110706329345703, "global_step": 131154, "epoch": 1580} {"train_loss": -22.933176040649414, "global_step": 131155, "epoch": 1580} {"train_loss": -22.71392822265625, "global_step": 131156, "epoch": 1580} {"train_loss": -22.744491577148438, "global_step": 131157, "epoch": 1580} {"train_loss": -22.636981964111328, "global_step": 131158, "epoch": 1580} {"train_loss": -22.451770782470703, "global_step": 131159, "epoch": 1580} {"train_loss": -22.595739364624023, "global_step": 131160, "epoch": 1580} {"train_loss": -23.040231704711914, "global_step": 131161, "epoch": 1580} {"train_loss": -22.94611167907715, "global_step": 131162, "epoch": 1580} {"train_loss": -22.947568893432617, "global_step": 131163, "epoch": 1580} {"train_loss": -22.79446792602539, "global_step": 131164, "epoch": 1580} {"train_loss": -22.947477340698242, "global_step": 131165, "epoch": 1580} {"train_loss": -23.05210304260254, "global_step": 131166, "epoch": 1580} {"train_loss": -22.92949676513672, "global_step": 131167, "epoch": 1580} {"train_loss": -22.74043083190918, "global_step": 131168, "epoch": 1580} {"train_loss": -22.87689781188965, "global_step": 131169, "epoch": 1580} {"train_loss": -22.772199630737305, "global_step": 131170, "epoch": 1580} {"train_loss": -22.429059982299805, "global_step": 131171, "epoch": 1580} {"train_loss": -23.12073516845703, "global_step": 131172, "epoch": 1580} {"train_loss": -22.52193260192871, "global_step": 131173, "epoch": 1580} {"train_loss": -22.65740394592285, "global_step": 131174, "epoch": 1580} {"train_loss": -22.4962215423584, "global_step": 131175, "epoch": 1580} {"train_loss": -23.35040855407715, "global_step": 131176, "epoch": 1580} {"train_loss": -22.927047729492188, "global_step": 131177, "epoch": 1580} {"train_loss": -22.523120880126953, "global_step": 131178, "epoch": 1580} {"train_loss": -22.6898136138916, "global_step": 131179, "epoch": 1580} {"train_loss": -22.955202102661133, "global_step": 131180, "epoch": 1580} {"train_loss": -22.662158966064453, "global_step": 131181, "epoch": 1580} {"train_loss": -22.809179306030273, "global_step": 131182, "epoch": 1580} {"train_loss": -22.574390411376953, "global_step": 131183, "epoch": 1580} {"train_loss": -22.6636905670166, "global_step": 131184, "epoch": 1580} {"train_loss": -22.95539665222168, "global_step": 131185, "epoch": 1580} {"train_loss": -22.830625534057617, "global_step": 131186, "epoch": 1580} {"train_loss": -22.917020797729492, "global_step": 131187, "epoch": 1580} {"train_loss": -23.082012176513672, "global_step": 131188, "epoch": 1580} {"train_loss": -22.962108612060547, "global_step": 131189, "epoch": 1580} {"train_loss": -22.673511505126953, "global_step": 131190, "epoch": 1580} {"train_loss": -22.809694290161133, "global_step": 131191, "epoch": 1580} {"train_loss": -22.839078903198242, "global_step": 131192, "epoch": 1580} {"train_loss": -22.79257583618164, "global_step": 131193, "epoch": 1580} {"train_loss": -23.031564712524414, "global_step": 131194, "epoch": 1580} {"train_loss": -22.896259307861328, "global_step": 131195, "epoch": 1580} {"train_loss": -22.69049644470215, "global_step": 131196, "epoch": 1580} {"train_loss": -22.836870193481445, "global_step": 131197, "epoch": 1580} {"train_loss": -22.732654571533203, "global_step": 131198, "epoch": 1580} {"train_loss": -22.719717025756836, "global_step": 131199, "epoch": 1580} {"train_loss": -23.094778060913086, "global_step": 131200, "epoch": 1580} {"train_loss": -22.9876708984375, "global_step": 131201, "epoch": 1580} {"train_loss": -22.762619018554688, "global_step": 131202, "epoch": 1580} {"train_loss": -22.750492095947266, "global_step": 131203, "epoch": 1580} {"train_loss": -23.040475845336914, "global_step": 131204, "epoch": 1580} {"train_loss": -22.855987548828125, "global_step": 131205, "epoch": 1580} {"train_loss": -22.87175941467285, "global_step": 131206, "epoch": 1580} {"train_loss": -22.729156494140625, "global_step": 131207, "epoch": 1580} {"train_loss": -22.85184097290039, "global_step": 131208, "epoch": 1580} {"train_loss": -22.902362823486328, "global_step": 131209, "epoch": 1580} {"train_loss": -22.772626876831055, "global_step": 131210, "epoch": 1580} {"train_loss": -22.732675552368164, "global_step": 131211, "epoch": 1580} {"train_loss": -22.95336151123047, "global_step": 131212, "epoch": 1580} {"train_loss": -23.06612205505371, "global_step": 131213, "epoch": 1580} {"train_loss": -23.02338218688965, "global_step": 131214, "epoch": 1580} {"train_loss": -23.069442749023438, "global_step": 131215, "epoch": 1580} {"train_loss": -22.678787231445312, "global_step": 131216, "epoch": 1580} {"train_loss": -22.59038734436035, "global_step": 131217, "epoch": 1580} {"train_loss": -22.74747085571289, "global_step": 131218, "epoch": 1580} {"train_loss": -22.750198364257812, "global_step": 131219, "epoch": 1580} {"train_loss": -23.062152862548828, "global_step": 131220, "epoch": 1580} {"train_loss": -22.64870262145996, "global_step": 131221, "epoch": 1580} {"train_loss": -22.76864771096103, "global_step": 131222, "epoch": 1580, "val_loss": 6370672.0} {"train_loss": -21.954559326171875, "global_step": 131223, "epoch": 1581} {"train_loss": -22.270755767822266, "global_step": 131224, "epoch": 1581} {"train_loss": -22.406204223632812, "global_step": 131225, "epoch": 1581} {"train_loss": -22.8176212310791, "global_step": 131226, "epoch": 1581} {"train_loss": -22.253686904907227, "global_step": 131227, "epoch": 1581} {"train_loss": -22.272058486938477, "global_step": 131228, "epoch": 1581} {"train_loss": -22.360410690307617, "global_step": 131229, "epoch": 1581} {"train_loss": -22.383642196655273, "global_step": 131230, "epoch": 1581} {"train_loss": -22.599349975585938, "global_step": 131231, "epoch": 1581} {"train_loss": -22.50102996826172, "global_step": 131232, "epoch": 1581} {"train_loss": -22.477140426635742, "global_step": 131233, "epoch": 1581} {"train_loss": -22.531259536743164, "global_step": 131234, "epoch": 1581} {"train_loss": -22.783132553100586, "global_step": 131235, "epoch": 1581} {"train_loss": -22.80377769470215, "global_step": 131236, "epoch": 1581} {"train_loss": -22.55162239074707, "global_step": 131237, "epoch": 1581} {"train_loss": -22.789852142333984, "global_step": 131238, "epoch": 1581} {"train_loss": -22.69523811340332, "global_step": 131239, "epoch": 1581} {"train_loss": -22.248369216918945, "global_step": 131240, "epoch": 1581} {"train_loss": -22.82731056213379, "global_step": 131241, "epoch": 1581} {"train_loss": -22.57925796508789, "global_step": 131242, "epoch": 1581} {"train_loss": -22.792665481567383, "global_step": 131243, "epoch": 1581} {"train_loss": -22.8919620513916, "global_step": 131244, "epoch": 1581} {"train_loss": -22.802597045898438, "global_step": 131245, "epoch": 1581} {"train_loss": -22.620492935180664, "global_step": 131246, "epoch": 1581} {"train_loss": -22.770984649658203, "global_step": 131247, "epoch": 1581} {"train_loss": -22.87440299987793, "global_step": 131248, "epoch": 1581} {"train_loss": -22.958744049072266, "global_step": 131249, "epoch": 1581} {"train_loss": -22.99893569946289, "global_step": 131250, "epoch": 1581} {"train_loss": -22.911062240600586, "global_step": 131251, "epoch": 1581} {"train_loss": -22.512638092041016, "global_step": 131252, "epoch": 1581} {"train_loss": -23.320383071899414, "global_step": 131253, "epoch": 1581} {"train_loss": -22.67957305908203, "global_step": 131254, "epoch": 1581} {"train_loss": -22.631376266479492, "global_step": 131255, "epoch": 1581} {"train_loss": -22.6241455078125, "global_step": 131256, "epoch": 1581} {"train_loss": -22.602903366088867, "global_step": 131257, "epoch": 1581} {"train_loss": -22.81839942932129, "global_step": 131258, "epoch": 1581} {"train_loss": -23.1209659576416, "global_step": 131259, "epoch": 1581} {"train_loss": -22.902921676635742, "global_step": 131260, "epoch": 1581} {"train_loss": -22.92819595336914, "global_step": 131261, "epoch": 1581} {"train_loss": -22.872407913208008, "global_step": 131262, "epoch": 1581} {"train_loss": -22.835376739501953, "global_step": 131263, "epoch": 1581} {"train_loss": -22.81759262084961, "global_step": 131264, "epoch": 1581} {"train_loss": -22.86713218688965, "global_step": 131265, "epoch": 1581} {"train_loss": -22.839324951171875, "global_step": 131266, "epoch": 1581} {"train_loss": -22.774641036987305, "global_step": 131267, "epoch": 1581} {"train_loss": -22.707483291625977, "global_step": 131268, "epoch": 1581} {"train_loss": -22.630699157714844, "global_step": 131269, "epoch": 1581} {"train_loss": -22.641294479370117, "global_step": 131270, "epoch": 1581} {"train_loss": -22.663686752319336, "global_step": 131271, "epoch": 1581} {"train_loss": -23.060733795166016, "global_step": 131272, "epoch": 1581} {"train_loss": -23.031354904174805, "global_step": 131273, "epoch": 1581} {"train_loss": -22.847131729125977, "global_step": 131274, "epoch": 1581} {"train_loss": -22.944854736328125, "global_step": 131275, "epoch": 1581} {"train_loss": -23.109086990356445, "global_step": 131276, "epoch": 1581} {"train_loss": -23.137531280517578, "global_step": 131277, "epoch": 1581} {"train_loss": -22.904659271240234, "global_step": 131278, "epoch": 1581} {"train_loss": -22.85396385192871, "global_step": 131279, "epoch": 1581} {"train_loss": -22.80315589904785, "global_step": 131280, "epoch": 1581} {"train_loss": -22.872756958007812, "global_step": 131281, "epoch": 1581} {"train_loss": -22.915552139282227, "global_step": 131282, "epoch": 1581} {"train_loss": -22.751922607421875, "global_step": 131283, "epoch": 1581} {"train_loss": -22.68312644958496, "global_step": 131284, "epoch": 1581} {"train_loss": -23.286781311035156, "global_step": 131285, "epoch": 1581} {"train_loss": -22.948963165283203, "global_step": 131286, "epoch": 1581} {"train_loss": -22.83527183532715, "global_step": 131287, "epoch": 1581} {"train_loss": -22.518251419067383, "global_step": 131288, "epoch": 1581} {"train_loss": -22.850278854370117, "global_step": 131289, "epoch": 1581} {"train_loss": -22.923276901245117, "global_step": 131290, "epoch": 1581} {"train_loss": -22.728208541870117, "global_step": 131291, "epoch": 1581} {"train_loss": -22.928510665893555, "global_step": 131292, "epoch": 1581} {"train_loss": -22.8588809967041, "global_step": 131293, "epoch": 1581} {"train_loss": -23.018863677978516, "global_step": 131294, "epoch": 1581} {"train_loss": -22.977645874023438, "global_step": 131295, "epoch": 1581} {"train_loss": -22.508474349975586, "global_step": 131296, "epoch": 1581} {"train_loss": -22.590545654296875, "global_step": 131297, "epoch": 1581} {"train_loss": -22.573753356933594, "global_step": 131298, "epoch": 1581} {"train_loss": -22.524173736572266, "global_step": 131299, "epoch": 1581} {"train_loss": -22.633310317993164, "global_step": 131300, "epoch": 1581} {"train_loss": -22.52669334411621, "global_step": 131301, "epoch": 1581} {"train_loss": -22.345264434814453, "global_step": 131302, "epoch": 1581} {"train_loss": -22.769636154174805, "global_step": 131303, "epoch": 1581} {"train_loss": -22.680696487426758, "global_step": 131304, "epoch": 1581} {"train_loss": -22.745105122945393, "global_step": 131305, "epoch": 1581, "val_loss": 6173148.0} {"train_loss": -22.49090576171875, "global_step": 131306, "epoch": 1582} {"train_loss": -22.532756805419922, "global_step": 131307, "epoch": 1582} {"train_loss": -22.332752227783203, "global_step": 131308, "epoch": 1582} {"train_loss": -22.45709800720215, "global_step": 131309, "epoch": 1582} {"train_loss": -22.313793182373047, "global_step": 131310, "epoch": 1582} {"train_loss": -22.871301651000977, "global_step": 131311, "epoch": 1582} {"train_loss": -22.456449508666992, "global_step": 131312, "epoch": 1582} {"train_loss": -22.5452938079834, "global_step": 131313, "epoch": 1582} {"train_loss": -22.67816925048828, "global_step": 131314, "epoch": 1582} {"train_loss": -22.595539093017578, "global_step": 131315, "epoch": 1582} {"train_loss": -22.496381759643555, "global_step": 131316, "epoch": 1582} {"train_loss": -22.801382064819336, "global_step": 131317, "epoch": 1582} {"train_loss": -22.594205856323242, "global_step": 131318, "epoch": 1582} {"train_loss": -22.766681671142578, "global_step": 131319, "epoch": 1582} {"train_loss": -22.588926315307617, "global_step": 131320, "epoch": 1582} {"train_loss": -22.877761840820312, "global_step": 131321, "epoch": 1582} {"train_loss": -22.66184425354004, "global_step": 131322, "epoch": 1582} {"train_loss": -22.90989112854004, "global_step": 131323, "epoch": 1582} {"train_loss": -22.920551300048828, "global_step": 131324, "epoch": 1582} {"train_loss": -22.824203491210938, "global_step": 131325, "epoch": 1582} {"train_loss": -22.824020385742188, "global_step": 131326, "epoch": 1582} {"train_loss": -23.028934478759766, "global_step": 131327, "epoch": 1582} {"train_loss": -22.647659301757812, "global_step": 131328, "epoch": 1582} {"train_loss": -22.796463012695312, "global_step": 131329, "epoch": 1582} {"train_loss": -22.27058982849121, "global_step": 131330, "epoch": 1582} {"train_loss": -22.57926368713379, "global_step": 131331, "epoch": 1582} {"train_loss": -22.732105255126953, "global_step": 131332, "epoch": 1582} {"train_loss": -22.65233612060547, "global_step": 131333, "epoch": 1582} {"train_loss": -23.15445899963379, "global_step": 131334, "epoch": 1582} {"train_loss": -22.93906021118164, "global_step": 131335, "epoch": 1582} {"train_loss": -22.785430908203125, "global_step": 131336, "epoch": 1582} {"train_loss": -22.829620361328125, "global_step": 131337, "epoch": 1582} {"train_loss": -22.761920928955078, "global_step": 131338, "epoch": 1582} {"train_loss": -22.963037490844727, "global_step": 131339, "epoch": 1582} {"train_loss": -23.018726348876953, "global_step": 131340, "epoch": 1582} {"train_loss": -22.99590301513672, "global_step": 131341, "epoch": 1582} {"train_loss": -23.17327308654785, "global_step": 131342, "epoch": 1582} {"train_loss": -22.693626403808594, "global_step": 131343, "epoch": 1582} {"train_loss": -22.99660873413086, "global_step": 131344, "epoch": 1582} {"train_loss": -22.985111236572266, "global_step": 131345, "epoch": 1582} {"train_loss": -22.82065773010254, "global_step": 131346, "epoch": 1582} {"train_loss": -23.145923614501953, "global_step": 131347, "epoch": 1582} {"train_loss": -22.692461013793945, "global_step": 131348, "epoch": 1582} {"train_loss": -23.04292106628418, "global_step": 131349, "epoch": 1582} {"train_loss": -23.145708084106445, "global_step": 131350, "epoch": 1582} {"train_loss": -23.004825592041016, "global_step": 131351, "epoch": 1582} {"train_loss": -22.642637252807617, "global_step": 131352, "epoch": 1582} {"train_loss": -22.577985763549805, "global_step": 131353, "epoch": 1582} {"train_loss": -22.924774169921875, "global_step": 131354, "epoch": 1582} {"train_loss": -22.98175621032715, "global_step": 131355, "epoch": 1582} {"train_loss": -22.766786575317383, "global_step": 131356, "epoch": 1582} {"train_loss": -23.199350357055664, "global_step": 131357, "epoch": 1582} {"train_loss": -23.20973014831543, "global_step": 131358, "epoch": 1582} {"train_loss": -22.915815353393555, "global_step": 131359, "epoch": 1582} {"train_loss": -22.834012985229492, "global_step": 131360, "epoch": 1582} {"train_loss": -22.904666900634766, "global_step": 131361, "epoch": 1582} {"train_loss": -22.98431396484375, "global_step": 131362, "epoch": 1582} {"train_loss": -23.085966110229492, "global_step": 131363, "epoch": 1582} {"train_loss": -22.62740135192871, "global_step": 131364, "epoch": 1582} {"train_loss": -22.955154418945312, "global_step": 131365, "epoch": 1582} {"train_loss": -22.71231460571289, "global_step": 131366, "epoch": 1582} {"train_loss": -22.88613510131836, "global_step": 131367, "epoch": 1582} {"train_loss": -22.5914249420166, "global_step": 131368, "epoch": 1582} {"train_loss": -23.047019958496094, "global_step": 131369, "epoch": 1582} {"train_loss": -22.871259689331055, "global_step": 131370, "epoch": 1582} {"train_loss": -23.028841018676758, "global_step": 131371, "epoch": 1582} {"train_loss": -23.013261795043945, "global_step": 131372, "epoch": 1582} {"train_loss": -22.781822204589844, "global_step": 131373, "epoch": 1582} {"train_loss": -23.066635131835938, "global_step": 131374, "epoch": 1582} {"train_loss": -22.89177703857422, "global_step": 131375, "epoch": 1582} {"train_loss": -22.787405014038086, "global_step": 131376, "epoch": 1582} {"train_loss": -22.796504974365234, "global_step": 131377, "epoch": 1582} {"train_loss": -23.212121963500977, "global_step": 131378, "epoch": 1582} {"train_loss": -22.62609100341797, "global_step": 131379, "epoch": 1582} {"train_loss": -22.88678550720215, "global_step": 131380, "epoch": 1582} {"train_loss": -22.90461540222168, "global_step": 131381, "epoch": 1582} {"train_loss": -22.990602493286133, "global_step": 131382, "epoch": 1582} {"train_loss": -22.583181381225586, "global_step": 131383, "epoch": 1582} {"train_loss": -22.71299171447754, "global_step": 131384, "epoch": 1582} {"train_loss": -22.96976089477539, "global_step": 131385, "epoch": 1582} {"train_loss": -22.406591415405273, "global_step": 131386, "epoch": 1582} {"train_loss": -22.752788543701172, "global_step": 131387, "epoch": 1582} {"train_loss": -22.814221416611268, "global_step": 131388, "epoch": 1582, "val_loss": 6351506.0} {"train_loss": -21.5986385345459, "global_step": 131389, "epoch": 1583} {"train_loss": -22.16485023498535, "global_step": 131390, "epoch": 1583} {"train_loss": -21.947900772094727, "global_step": 131391, "epoch": 1583} {"train_loss": -22.400352478027344, "global_step": 131392, "epoch": 1583} {"train_loss": -21.82282066345215, "global_step": 131393, "epoch": 1583} {"train_loss": -22.419904708862305, "global_step": 131394, "epoch": 1583} {"train_loss": -22.139936447143555, "global_step": 131395, "epoch": 1583} {"train_loss": -22.56288719177246, "global_step": 131396, "epoch": 1583} {"train_loss": -22.421720504760742, "global_step": 131397, "epoch": 1583} {"train_loss": -21.8055419921875, "global_step": 131398, "epoch": 1583} {"train_loss": -22.277158737182617, "global_step": 131399, "epoch": 1583} {"train_loss": -22.1373233795166, "global_step": 131400, "epoch": 1583} {"train_loss": -22.637908935546875, "global_step": 131401, "epoch": 1583} {"train_loss": -22.468307495117188, "global_step": 131402, "epoch": 1583} {"train_loss": -22.605993270874023, "global_step": 131403, "epoch": 1583} {"train_loss": -22.574186325073242, "global_step": 131404, "epoch": 1583} {"train_loss": -21.874357223510742, "global_step": 131405, "epoch": 1583} {"train_loss": -22.46718406677246, "global_step": 131406, "epoch": 1583} {"train_loss": -22.43378257751465, "global_step": 131407, "epoch": 1583} {"train_loss": -22.661081314086914, "global_step": 131408, "epoch": 1583} {"train_loss": -22.397201538085938, "global_step": 131409, "epoch": 1583} {"train_loss": -22.711593627929688, "global_step": 131410, "epoch": 1583} {"train_loss": -22.171415328979492, "global_step": 131411, "epoch": 1583} {"train_loss": -22.485422134399414, "global_step": 131412, "epoch": 1583} {"train_loss": -23.01502227783203, "global_step": 131413, "epoch": 1583} {"train_loss": -22.66632080078125, "global_step": 131414, "epoch": 1583} {"train_loss": -22.643049240112305, "global_step": 131415, "epoch": 1583} {"train_loss": -22.61001968383789, "global_step": 131416, "epoch": 1583} {"train_loss": -22.778173446655273, "global_step": 131417, "epoch": 1583} {"train_loss": -22.896465301513672, "global_step": 131418, "epoch": 1583} {"train_loss": -22.824743270874023, "global_step": 131419, "epoch": 1583} {"train_loss": -22.596282958984375, "global_step": 131420, "epoch": 1583} {"train_loss": -22.74066734313965, "global_step": 131421, "epoch": 1583} {"train_loss": -22.621992111206055, "global_step": 131422, "epoch": 1583} {"train_loss": -22.970632553100586, "global_step": 131423, "epoch": 1583} {"train_loss": -22.950088500976562, "global_step": 131424, "epoch": 1583} {"train_loss": -22.719938278198242, "global_step": 131425, "epoch": 1583} {"train_loss": -22.845067977905273, "global_step": 131426, "epoch": 1583} {"train_loss": -22.96164894104004, "global_step": 131427, "epoch": 1583} {"train_loss": -22.782123565673828, "global_step": 131428, "epoch": 1583} {"train_loss": -22.82137107849121, "global_step": 131429, "epoch": 1583} {"train_loss": -22.98448371887207, "global_step": 131430, "epoch": 1583} {"train_loss": -22.598569869995117, "global_step": 131431, "epoch": 1583} {"train_loss": -22.847341537475586, "global_step": 131432, "epoch": 1583} {"train_loss": -22.6650333404541, "global_step": 131433, "epoch": 1583} {"train_loss": -22.759784698486328, "global_step": 131434, "epoch": 1583} {"train_loss": -22.954565048217773, "global_step": 131435, "epoch": 1583} {"train_loss": -23.129186630249023, "global_step": 131436, "epoch": 1583} {"train_loss": -23.108291625976562, "global_step": 131437, "epoch": 1583} {"train_loss": -23.221689224243164, "global_step": 131438, "epoch": 1583} {"train_loss": -22.97255516052246, "global_step": 131439, "epoch": 1583} {"train_loss": -22.69190788269043, "global_step": 131440, "epoch": 1583} {"train_loss": -23.048538208007812, "global_step": 131441, "epoch": 1583} {"train_loss": -22.769208908081055, "global_step": 131442, "epoch": 1583} {"train_loss": -22.778512954711914, "global_step": 131443, "epoch": 1583} {"train_loss": -22.891918182373047, "global_step": 131444, "epoch": 1583} {"train_loss": -22.88508415222168, "global_step": 131445, "epoch": 1583} {"train_loss": -22.810190200805664, "global_step": 131446, "epoch": 1583} {"train_loss": -22.33567237854004, "global_step": 131447, "epoch": 1583} {"train_loss": -22.20803451538086, "global_step": 131448, "epoch": 1583} {"train_loss": -22.4482364654541, "global_step": 131449, "epoch": 1583} {"train_loss": -22.769804000854492, "global_step": 131450, "epoch": 1583} {"train_loss": -22.724180221557617, "global_step": 131451, "epoch": 1583} {"train_loss": -22.839750289916992, "global_step": 131452, "epoch": 1583} {"train_loss": -22.76495933532715, "global_step": 131453, "epoch": 1583} {"train_loss": -23.37931251525879, "global_step": 131454, "epoch": 1583} {"train_loss": -22.96137809753418, "global_step": 131455, "epoch": 1583} {"train_loss": -22.73784065246582, "global_step": 131456, "epoch": 1583} {"train_loss": -22.97652244567871, "global_step": 131457, "epoch": 1583} {"train_loss": -22.974109649658203, "global_step": 131458, "epoch": 1583} {"train_loss": -23.144512176513672, "global_step": 131459, "epoch": 1583} {"train_loss": -22.712549209594727, "global_step": 131460, "epoch": 1583} {"train_loss": -23.025665283203125, "global_step": 131461, "epoch": 1583} {"train_loss": -22.635046005249023, "global_step": 131462, "epoch": 1583} {"train_loss": -22.97834587097168, "global_step": 131463, "epoch": 1583} {"train_loss": -22.704431533813477, "global_step": 131464, "epoch": 1583} {"train_loss": -23.08033561706543, "global_step": 131465, "epoch": 1583} {"train_loss": -22.58131980895996, "global_step": 131466, "epoch": 1583} {"train_loss": -23.263835906982422, "global_step": 131467, "epoch": 1583} {"train_loss": -22.94111442565918, "global_step": 131468, "epoch": 1583} {"train_loss": -22.86969757080078, "global_step": 131469, "epoch": 1583} {"train_loss": -22.91908073425293, "global_step": 131470, "epoch": 1583} {"train_loss": -22.6995333935841, "global_step": 131471, "epoch": 1583, "val_loss": 6253754.0} {"train_loss": -22.292387008666992, "global_step": 131472, "epoch": 1584} {"train_loss": -22.014041900634766, "global_step": 131473, "epoch": 1584} {"train_loss": -22.8013973236084, "global_step": 131474, "epoch": 1584} {"train_loss": -22.483203887939453, "global_step": 131475, "epoch": 1584} {"train_loss": -22.55126953125, "global_step": 131476, "epoch": 1584} {"train_loss": -22.47530174255371, "global_step": 131477, "epoch": 1584} {"train_loss": -22.5609130859375, "global_step": 131478, "epoch": 1584} {"train_loss": -22.550363540649414, "global_step": 131479, "epoch": 1584} {"train_loss": -22.759981155395508, "global_step": 131480, "epoch": 1584} {"train_loss": -22.563932418823242, "global_step": 131481, "epoch": 1584} {"train_loss": -22.647348403930664, "global_step": 131482, "epoch": 1584} {"train_loss": -23.066213607788086, "global_step": 131483, "epoch": 1584} {"train_loss": -22.73528480529785, "global_step": 131484, "epoch": 1584} {"train_loss": -23.132553100585938, "global_step": 131485, "epoch": 1584} {"train_loss": -22.606046676635742, "global_step": 131486, "epoch": 1584} {"train_loss": -22.840484619140625, "global_step": 131487, "epoch": 1584} {"train_loss": -22.823701858520508, "global_step": 131488, "epoch": 1584} {"train_loss": -22.891141891479492, "global_step": 131489, "epoch": 1584} {"train_loss": -22.93497657775879, "global_step": 131490, "epoch": 1584} {"train_loss": -22.935455322265625, "global_step": 131491, "epoch": 1584} {"train_loss": -22.987686157226562, "global_step": 131492, "epoch": 1584} {"train_loss": -22.855783462524414, "global_step": 131493, "epoch": 1584} {"train_loss": -22.823959350585938, "global_step": 131494, "epoch": 1584} {"train_loss": -23.161922454833984, "global_step": 131495, "epoch": 1584} {"train_loss": -22.743783950805664, "global_step": 131496, "epoch": 1584} {"train_loss": -22.77265739440918, "global_step": 131497, "epoch": 1584} {"train_loss": -22.58409309387207, "global_step": 131498, "epoch": 1584} {"train_loss": -22.673444747924805, "global_step": 131499, "epoch": 1584} {"train_loss": -22.82157325744629, "global_step": 131500, "epoch": 1584} {"train_loss": -22.74283218383789, "global_step": 131501, "epoch": 1584} {"train_loss": -22.95783233642578, "global_step": 131502, "epoch": 1584} {"train_loss": -22.62967872619629, "global_step": 131503, "epoch": 1584} {"train_loss": -22.84806251525879, "global_step": 131504, "epoch": 1584} {"train_loss": -22.802762985229492, "global_step": 131505, "epoch": 1584} {"train_loss": -23.123632431030273, "global_step": 131506, "epoch": 1584} {"train_loss": -22.917800903320312, "global_step": 131507, "epoch": 1584} {"train_loss": -22.9780330657959, "global_step": 131508, "epoch": 1584} {"train_loss": -22.97426986694336, "global_step": 131509, "epoch": 1584} {"train_loss": -22.91645622253418, "global_step": 131510, "epoch": 1584} {"train_loss": -22.673669815063477, "global_step": 131511, "epoch": 1584} {"train_loss": -22.807750701904297, "global_step": 131512, "epoch": 1584} {"train_loss": -22.632295608520508, "global_step": 131513, "epoch": 1584} {"train_loss": -22.853757858276367, "global_step": 131514, "epoch": 1584} {"train_loss": -22.922143936157227, "global_step": 131515, "epoch": 1584} {"train_loss": -22.672780990600586, "global_step": 131516, "epoch": 1584} {"train_loss": -22.613569259643555, "global_step": 131517, "epoch": 1584} {"train_loss": -22.980146408081055, "global_step": 131518, "epoch": 1584} {"train_loss": -23.167871475219727, "global_step": 131519, "epoch": 1584} {"train_loss": -23.350923538208008, "global_step": 131520, "epoch": 1584} {"train_loss": -22.865633010864258, "global_step": 131521, "epoch": 1584} {"train_loss": -22.86969566345215, "global_step": 131522, "epoch": 1584} {"train_loss": -22.804229736328125, "global_step": 131523, "epoch": 1584} {"train_loss": -23.02804946899414, "global_step": 131524, "epoch": 1584} {"train_loss": -22.48375701904297, "global_step": 131525, "epoch": 1584} {"train_loss": -22.663801193237305, "global_step": 131526, "epoch": 1584} {"train_loss": -22.464384078979492, "global_step": 131527, "epoch": 1584} {"train_loss": -22.99141502380371, "global_step": 131528, "epoch": 1584} {"train_loss": -22.6074161529541, "global_step": 131529, "epoch": 1584} {"train_loss": -23.1870174407959, "global_step": 131530, "epoch": 1584} {"train_loss": -23.112600326538086, "global_step": 131531, "epoch": 1584} {"train_loss": -22.78152847290039, "global_step": 131532, "epoch": 1584} {"train_loss": -22.910215377807617, "global_step": 131533, "epoch": 1584} {"train_loss": -22.549701690673828, "global_step": 131534, "epoch": 1584} {"train_loss": -22.83612632751465, "global_step": 131535, "epoch": 1584} {"train_loss": -22.649511337280273, "global_step": 131536, "epoch": 1584} {"train_loss": -22.43484878540039, "global_step": 131537, "epoch": 1584} {"train_loss": -22.591272354125977, "global_step": 131538, "epoch": 1584} {"train_loss": -22.409942626953125, "global_step": 131539, "epoch": 1584} {"train_loss": -22.73773765563965, "global_step": 131540, "epoch": 1584} {"train_loss": -22.879878997802734, "global_step": 131541, "epoch": 1584} {"train_loss": -23.12881851196289, "global_step": 131542, "epoch": 1584} {"train_loss": -22.788471221923828, "global_step": 131543, "epoch": 1584} {"train_loss": -22.8421688079834, "global_step": 131544, "epoch": 1584} {"train_loss": -22.817964553833008, "global_step": 131545, "epoch": 1584} {"train_loss": -23.405004501342773, "global_step": 131546, "epoch": 1584} {"train_loss": -22.712438583374023, "global_step": 131547, "epoch": 1584} {"train_loss": -22.700897216796875, "global_step": 131548, "epoch": 1584} {"train_loss": -22.605260848999023, "global_step": 131549, "epoch": 1584} {"train_loss": -22.65159034729004, "global_step": 131550, "epoch": 1584} {"train_loss": -22.808332443237305, "global_step": 131551, "epoch": 1584} {"train_loss": -22.932897567749023, "global_step": 131552, "epoch": 1584} {"train_loss": -23.20882225036621, "global_step": 131553, "epoch": 1584} {"train_loss": -22.799196656928004, "global_step": 131554, "epoch": 1584, "val_loss": 6365224.0} {"train_loss": -22.110383987426758, "global_step": 131555, "epoch": 1585} {"train_loss": -22.956937789916992, "global_step": 131556, "epoch": 1585} {"train_loss": -22.6236572265625, "global_step": 131557, "epoch": 1585} {"train_loss": -22.927003860473633, "global_step": 131558, "epoch": 1585} {"train_loss": -22.742345809936523, "global_step": 131559, "epoch": 1585} {"train_loss": -23.1378116607666, "global_step": 131560, "epoch": 1585} {"train_loss": -22.850446701049805, "global_step": 131561, "epoch": 1585} {"train_loss": -22.517484664916992, "global_step": 131562, "epoch": 1585} {"train_loss": -22.814903259277344, "global_step": 131563, "epoch": 1585} {"train_loss": -22.581453323364258, "global_step": 131564, "epoch": 1585} {"train_loss": -22.45067596435547, "global_step": 131565, "epoch": 1585} {"train_loss": -22.63590431213379, "global_step": 131566, "epoch": 1585} {"train_loss": -22.73274040222168, "global_step": 131567, "epoch": 1585} {"train_loss": -22.909162521362305, "global_step": 131568, "epoch": 1585} {"train_loss": -22.871198654174805, "global_step": 131569, "epoch": 1585} {"train_loss": -22.76556396484375, "global_step": 131570, "epoch": 1585} {"train_loss": -22.9731502532959, "global_step": 131571, "epoch": 1585} {"train_loss": -22.687713623046875, "global_step": 131572, "epoch": 1585} {"train_loss": -22.71854019165039, "global_step": 131573, "epoch": 1585} {"train_loss": -22.741382598876953, "global_step": 131574, "epoch": 1585} {"train_loss": -22.88397216796875, "global_step": 131575, "epoch": 1585} {"train_loss": -23.09601402282715, "global_step": 131576, "epoch": 1585} {"train_loss": -22.483388900756836, "global_step": 131577, "epoch": 1585} {"train_loss": -23.352636337280273, "global_step": 131578, "epoch": 1585} {"train_loss": -22.69032096862793, "global_step": 131579, "epoch": 1585} {"train_loss": -22.719812393188477, "global_step": 131580, "epoch": 1585} {"train_loss": -22.870019912719727, "global_step": 131581, "epoch": 1585} {"train_loss": -22.52309226989746, "global_step": 131582, "epoch": 1585} {"train_loss": -22.913528442382812, "global_step": 131583, "epoch": 1585} {"train_loss": -22.791244506835938, "global_step": 131584, "epoch": 1585} {"train_loss": -22.85658836364746, "global_step": 131585, "epoch": 1585} {"train_loss": -23.03131866455078, "global_step": 131586, "epoch": 1585} {"train_loss": -23.04583168029785, "global_step": 131587, "epoch": 1585} {"train_loss": -22.53049659729004, "global_step": 131588, "epoch": 1585} {"train_loss": -22.886077880859375, "global_step": 131589, "epoch": 1585} {"train_loss": -22.80266571044922, "global_step": 131590, "epoch": 1585} {"train_loss": -22.992130279541016, "global_step": 131591, "epoch": 1585} {"train_loss": -22.579978942871094, "global_step": 131592, "epoch": 1585} {"train_loss": -22.867719650268555, "global_step": 131593, "epoch": 1585} {"train_loss": -22.96491050720215, "global_step": 131594, "epoch": 1585} {"train_loss": -22.34656524658203, "global_step": 131595, "epoch": 1585} {"train_loss": -22.87298011779785, "global_step": 131596, "epoch": 1585} {"train_loss": -22.871875762939453, "global_step": 131597, "epoch": 1585} {"train_loss": -22.592763900756836, "global_step": 131598, "epoch": 1585} {"train_loss": -22.813552856445312, "global_step": 131599, "epoch": 1585} {"train_loss": -22.83045768737793, "global_step": 131600, "epoch": 1585} {"train_loss": -23.09578514099121, "global_step": 131601, "epoch": 1585} {"train_loss": -22.904321670532227, "global_step": 131602, "epoch": 1585} {"train_loss": -23.395627975463867, "global_step": 131603, "epoch": 1585} {"train_loss": -22.992050170898438, "global_step": 131604, "epoch": 1585} {"train_loss": -22.949310302734375, "global_step": 131605, "epoch": 1585} {"train_loss": -23.342336654663086, "global_step": 131606, "epoch": 1585} {"train_loss": -22.837766647338867, "global_step": 131607, "epoch": 1585} {"train_loss": -22.493209838867188, "global_step": 131608, "epoch": 1585} {"train_loss": -22.553760528564453, "global_step": 131609, "epoch": 1585} {"train_loss": -23.37213706970215, "global_step": 131610, "epoch": 1585} {"train_loss": -22.67462730407715, "global_step": 131611, "epoch": 1585} {"train_loss": -23.240692138671875, "global_step": 131612, "epoch": 1585} {"train_loss": -23.113737106323242, "global_step": 131613, "epoch": 1585} {"train_loss": -23.047666549682617, "global_step": 131614, "epoch": 1585} {"train_loss": -22.777034759521484, "global_step": 131615, "epoch": 1585} {"train_loss": -22.725645065307617, "global_step": 131616, "epoch": 1585} {"train_loss": -22.361967086791992, "global_step": 131617, "epoch": 1585} {"train_loss": -22.417882919311523, "global_step": 131618, "epoch": 1585} {"train_loss": -22.861804962158203, "global_step": 131619, "epoch": 1585} {"train_loss": -22.409109115600586, "global_step": 131620, "epoch": 1585} {"train_loss": -22.61734390258789, "global_step": 131621, "epoch": 1585} {"train_loss": -22.544050216674805, "global_step": 131622, "epoch": 1585} {"train_loss": -22.80278968811035, "global_step": 131623, "epoch": 1585} {"train_loss": -22.737409591674805, "global_step": 131624, "epoch": 1585} {"train_loss": -22.92787742614746, "global_step": 131625, "epoch": 1585} {"train_loss": -23.07088279724121, "global_step": 131626, "epoch": 1585} {"train_loss": -23.035425186157227, "global_step": 131627, "epoch": 1585} {"train_loss": -22.809839248657227, "global_step": 131628, "epoch": 1585} {"train_loss": -22.9613094329834, "global_step": 131629, "epoch": 1585} {"train_loss": -22.95175552368164, "global_step": 131630, "epoch": 1585} {"train_loss": -22.83361053466797, "global_step": 131631, "epoch": 1585} {"train_loss": -23.07712745666504, "global_step": 131632, "epoch": 1585} {"train_loss": -22.817935943603516, "global_step": 131633, "epoch": 1585} {"train_loss": -23.079904556274414, "global_step": 131634, "epoch": 1585} {"train_loss": -22.97446060180664, "global_step": 131635, "epoch": 1585} {"train_loss": -22.905574798583984, "global_step": 131636, "epoch": 1585} {"train_loss": -22.821008107748376, "global_step": 131637, "epoch": 1585, "val_loss": 6534768.5} {"train_loss": -22.027511596679688, "global_step": 131638, "epoch": 1586} {"train_loss": -21.630491256713867, "global_step": 131639, "epoch": 1586} {"train_loss": -20.78021240234375, "global_step": 131640, "epoch": 1586} {"train_loss": -21.866886138916016, "global_step": 131641, "epoch": 1586} {"train_loss": -21.865039825439453, "global_step": 131642, "epoch": 1586} {"train_loss": -21.944988250732422, "global_step": 131643, "epoch": 1586} {"train_loss": -21.970945358276367, "global_step": 131644, "epoch": 1586} {"train_loss": -21.76898193359375, "global_step": 131645, "epoch": 1586} {"train_loss": -21.883495330810547, "global_step": 131646, "epoch": 1586} {"train_loss": -22.346832275390625, "global_step": 131647, "epoch": 1586} {"train_loss": -21.980037689208984, "global_step": 131648, "epoch": 1586} {"train_loss": -22.30335807800293, "global_step": 131649, "epoch": 1586} {"train_loss": -21.917020797729492, "global_step": 131650, "epoch": 1586} {"train_loss": -22.336681365966797, "global_step": 131651, "epoch": 1586} {"train_loss": -22.766157150268555, "global_step": 131652, "epoch": 1586} {"train_loss": -22.50567626953125, "global_step": 131653, "epoch": 1586} {"train_loss": -22.603010177612305, "global_step": 131654, "epoch": 1586} {"train_loss": -22.266260147094727, "global_step": 131655, "epoch": 1586} {"train_loss": -22.40414047241211, "global_step": 131656, "epoch": 1586} {"train_loss": -22.478641510009766, "global_step": 131657, "epoch": 1586} {"train_loss": -22.1318416595459, "global_step": 131658, "epoch": 1586} {"train_loss": -22.162845611572266, "global_step": 131659, "epoch": 1586} {"train_loss": -22.526456832885742, "global_step": 131660, "epoch": 1586} {"train_loss": -22.488401412963867, "global_step": 131661, "epoch": 1586} {"train_loss": -22.554214477539062, "global_step": 131662, "epoch": 1586} {"train_loss": -22.299901962280273, "global_step": 131663, "epoch": 1586} {"train_loss": -22.583478927612305, "global_step": 131664, "epoch": 1586} {"train_loss": -22.879993438720703, "global_step": 131665, "epoch": 1586} {"train_loss": -22.586889266967773, "global_step": 131666, "epoch": 1586} {"train_loss": -22.72530174255371, "global_step": 131667, "epoch": 1586} {"train_loss": -22.677879333496094, "global_step": 131668, "epoch": 1586} {"train_loss": -22.868122100830078, "global_step": 131669, "epoch": 1586} {"train_loss": -22.862051010131836, "global_step": 131670, "epoch": 1586} {"train_loss": -22.61455726623535, "global_step": 131671, "epoch": 1586} {"train_loss": -22.732967376708984, "global_step": 131672, "epoch": 1586} {"train_loss": -22.808090209960938, "global_step": 131673, "epoch": 1586} {"train_loss": -22.714948654174805, "global_step": 131674, "epoch": 1586} {"train_loss": -22.68398666381836, "global_step": 131675, "epoch": 1586} {"train_loss": -22.535463333129883, "global_step": 131676, "epoch": 1586} {"train_loss": -23.177534103393555, "global_step": 131677, "epoch": 1586} {"train_loss": -22.780820846557617, "global_step": 131678, "epoch": 1586} {"train_loss": -23.04365348815918, "global_step": 131679, "epoch": 1586} {"train_loss": -23.144407272338867, "global_step": 131680, "epoch": 1586} {"train_loss": -22.830520629882812, "global_step": 131681, "epoch": 1586} {"train_loss": -23.1705322265625, "global_step": 131682, "epoch": 1586} {"train_loss": -22.73053550720215, "global_step": 131683, "epoch": 1586} {"train_loss": -23.097213745117188, "global_step": 131684, "epoch": 1586} {"train_loss": -22.979158401489258, "global_step": 131685, "epoch": 1586} {"train_loss": -22.904592514038086, "global_step": 131686, "epoch": 1586} {"train_loss": -23.06892204284668, "global_step": 131687, "epoch": 1586} {"train_loss": -22.55336570739746, "global_step": 131688, "epoch": 1586} {"train_loss": -22.429529190063477, "global_step": 131689, "epoch": 1586} {"train_loss": -22.761083602905273, "global_step": 131690, "epoch": 1586} {"train_loss": -23.052173614501953, "global_step": 131691, "epoch": 1586} {"train_loss": -22.775306701660156, "global_step": 131692, "epoch": 1586} {"train_loss": -22.715116500854492, "global_step": 131693, "epoch": 1586} {"train_loss": -23.029605865478516, "global_step": 131694, "epoch": 1586} {"train_loss": -22.90176773071289, "global_step": 131695, "epoch": 1586} {"train_loss": -22.788427352905273, "global_step": 131696, "epoch": 1586} {"train_loss": -23.022029876708984, "global_step": 131697, "epoch": 1586} {"train_loss": -23.240339279174805, "global_step": 131698, "epoch": 1586} {"train_loss": -23.023527145385742, "global_step": 131699, "epoch": 1586} {"train_loss": -22.71661949157715, "global_step": 131700, "epoch": 1586} {"train_loss": -22.95665168762207, "global_step": 131701, "epoch": 1586} {"train_loss": -22.907007217407227, "global_step": 131702, "epoch": 1586} {"train_loss": -22.808286666870117, "global_step": 131703, "epoch": 1586} {"train_loss": -22.852680206298828, "global_step": 131704, "epoch": 1586} {"train_loss": -22.615467071533203, "global_step": 131705, "epoch": 1586} {"train_loss": -23.019515991210938, "global_step": 131706, "epoch": 1586} {"train_loss": -22.891183853149414, "global_step": 131707, "epoch": 1586} {"train_loss": -22.87213706970215, "global_step": 131708, "epoch": 1586} {"train_loss": -23.484630584716797, "global_step": 131709, "epoch": 1586} {"train_loss": -23.12264633178711, "global_step": 131710, "epoch": 1586} {"train_loss": -23.2055721282959, "global_step": 131711, "epoch": 1586} {"train_loss": -22.754867553710938, "global_step": 131712, "epoch": 1586} {"train_loss": -22.619535446166992, "global_step": 131713, "epoch": 1586} {"train_loss": -23.168283462524414, "global_step": 131714, "epoch": 1586} {"train_loss": -22.83477783203125, "global_step": 131715, "epoch": 1586} {"train_loss": -22.953092575073242, "global_step": 131716, "epoch": 1586} {"train_loss": -22.478225708007812, "global_step": 131717, "epoch": 1586} {"train_loss": -23.07803726196289, "global_step": 131718, "epoch": 1586} {"train_loss": -22.5721378326416, "global_step": 131719, "epoch": 1586} {"train_loss": -22.630617095763427, "global_step": 131720, "epoch": 1586, "val_loss": 6210656.0} {"train_loss": -22.572038650512695, "global_step": 131721, "epoch": 1587} {"train_loss": -23.043529510498047, "global_step": 131722, "epoch": 1587} {"train_loss": -22.57050132751465, "global_step": 131723, "epoch": 1587} {"train_loss": -22.604736328125, "global_step": 131724, "epoch": 1587} {"train_loss": -22.66355323791504, "global_step": 131725, "epoch": 1587} {"train_loss": -22.6091365814209, "global_step": 131726, "epoch": 1587} {"train_loss": -22.874954223632812, "global_step": 131727, "epoch": 1587} {"train_loss": -22.79847526550293, "global_step": 131728, "epoch": 1587} {"train_loss": -23.111040115356445, "global_step": 131729, "epoch": 1587} {"train_loss": -22.50449562072754, "global_step": 131730, "epoch": 1587} {"train_loss": -22.87734603881836, "global_step": 131731, "epoch": 1587} {"train_loss": -22.974689483642578, "global_step": 131732, "epoch": 1587} {"train_loss": -23.21739387512207, "global_step": 131733, "epoch": 1587} {"train_loss": -23.289024353027344, "global_step": 131734, "epoch": 1587} {"train_loss": -23.19610023498535, "global_step": 131735, "epoch": 1587} {"train_loss": -23.21523094177246, "global_step": 131736, "epoch": 1587} {"train_loss": -22.797056198120117, "global_step": 131737, "epoch": 1587} {"train_loss": -22.968334197998047, "global_step": 131738, "epoch": 1587} {"train_loss": -22.933679580688477, "global_step": 131739, "epoch": 1587} {"train_loss": -23.067642211914062, "global_step": 131740, "epoch": 1587} {"train_loss": -23.02498435974121, "global_step": 131741, "epoch": 1587} {"train_loss": -23.052047729492188, "global_step": 131742, "epoch": 1587} {"train_loss": -22.6721248626709, "global_step": 131743, "epoch": 1587} {"train_loss": -22.826398849487305, "global_step": 131744, "epoch": 1587} {"train_loss": -22.88161277770996, "global_step": 131745, "epoch": 1587} {"train_loss": -22.77861976623535, "global_step": 131746, "epoch": 1587} {"train_loss": -22.541584014892578, "global_step": 131747, "epoch": 1587} {"train_loss": -22.897748947143555, "global_step": 131748, "epoch": 1587} {"train_loss": -22.993688583374023, "global_step": 131749, "epoch": 1587} {"train_loss": -22.60367774963379, "global_step": 131750, "epoch": 1587} {"train_loss": -22.786497116088867, "global_step": 131751, "epoch": 1587} {"train_loss": -22.831897735595703, "global_step": 131752, "epoch": 1587} {"train_loss": -22.61397361755371, "global_step": 131753, "epoch": 1587} {"train_loss": -22.813674926757812, "global_step": 131754, "epoch": 1587} {"train_loss": -22.181655883789062, "global_step": 131755, "epoch": 1587} {"train_loss": -22.736892700195312, "global_step": 131756, "epoch": 1587} {"train_loss": -22.494556427001953, "global_step": 131757, "epoch": 1587} {"train_loss": -22.76384162902832, "global_step": 131758, "epoch": 1587} {"train_loss": -23.2110538482666, "global_step": 131759, "epoch": 1587} {"train_loss": -22.98346519470215, "global_step": 131760, "epoch": 1587} {"train_loss": -23.26759147644043, "global_step": 131761, "epoch": 1587} {"train_loss": -23.138504028320312, "global_step": 131762, "epoch": 1587} {"train_loss": -23.10502052307129, "global_step": 131763, "epoch": 1587} {"train_loss": -22.758499145507812, "global_step": 131764, "epoch": 1587} {"train_loss": -22.990856170654297, "global_step": 131765, "epoch": 1587} {"train_loss": -22.768720626831055, "global_step": 131766, "epoch": 1587} {"train_loss": -22.586591720581055, "global_step": 131767, "epoch": 1587} {"train_loss": -22.414173126220703, "global_step": 131768, "epoch": 1587} {"train_loss": -22.80173683166504, "global_step": 131769, "epoch": 1587} {"train_loss": -23.00116539001465, "global_step": 131770, "epoch": 1587} {"train_loss": -23.023447036743164, "global_step": 131771, "epoch": 1587} {"train_loss": -22.80307388305664, "global_step": 131772, "epoch": 1587} {"train_loss": -22.65795135498047, "global_step": 131773, "epoch": 1587} {"train_loss": -23.24653434753418, "global_step": 131774, "epoch": 1587} {"train_loss": -22.483901977539062, "global_step": 131775, "epoch": 1587} {"train_loss": -22.843042373657227, "global_step": 131776, "epoch": 1587} {"train_loss": -22.980728149414062, "global_step": 131777, "epoch": 1587} {"train_loss": -22.819747924804688, "global_step": 131778, "epoch": 1587} {"train_loss": -22.774703979492188, "global_step": 131779, "epoch": 1587} {"train_loss": -22.590028762817383, "global_step": 131780, "epoch": 1587} {"train_loss": -22.769453048706055, "global_step": 131781, "epoch": 1587} {"train_loss": -23.34065055847168, "global_step": 131782, "epoch": 1587} {"train_loss": -22.857778549194336, "global_step": 131783, "epoch": 1587} {"train_loss": -22.803020477294922, "global_step": 131784, "epoch": 1587} {"train_loss": -22.63490104675293, "global_step": 131785, "epoch": 1587} {"train_loss": -22.885061264038086, "global_step": 131786, "epoch": 1587} {"train_loss": -22.72601890563965, "global_step": 131787, "epoch": 1587} {"train_loss": -22.827600479125977, "global_step": 131788, "epoch": 1587} {"train_loss": -23.017391204833984, "global_step": 131789, "epoch": 1587} {"train_loss": -22.893579483032227, "global_step": 131790, "epoch": 1587} {"train_loss": -23.172718048095703, "global_step": 131791, "epoch": 1587} {"train_loss": -22.91615104675293, "global_step": 131792, "epoch": 1587} {"train_loss": -22.760202407836914, "global_step": 131793, "epoch": 1587} {"train_loss": -23.260358810424805, "global_step": 131794, "epoch": 1587} {"train_loss": -22.73566246032715, "global_step": 131795, "epoch": 1587} {"train_loss": -22.754108428955078, "global_step": 131796, "epoch": 1587} {"train_loss": -22.80019760131836, "global_step": 131797, "epoch": 1587} {"train_loss": -22.62300682067871, "global_step": 131798, "epoch": 1587} {"train_loss": -23.213703155517578, "global_step": 131799, "epoch": 1587} {"train_loss": -22.587566375732422, "global_step": 131800, "epoch": 1587} {"train_loss": -22.979934692382812, "global_step": 131801, "epoch": 1587} {"train_loss": -22.855819702148438, "global_step": 131802, "epoch": 1587} {"train_loss": -22.860871372452703, "global_step": 131803, "epoch": 1587, "val_loss": 6206413.5} {"train_loss": -22.84452247619629, "global_step": 131804, "epoch": 1588} {"train_loss": -22.765640258789062, "global_step": 131805, "epoch": 1588} {"train_loss": -22.580718994140625, "global_step": 131806, "epoch": 1588} {"train_loss": -22.893461227416992, "global_step": 131807, "epoch": 1588} {"train_loss": -22.937602996826172, "global_step": 131808, "epoch": 1588} {"train_loss": -22.870243072509766, "global_step": 131809, "epoch": 1588} {"train_loss": -22.687158584594727, "global_step": 131810, "epoch": 1588} {"train_loss": -22.895349502563477, "global_step": 131811, "epoch": 1588} {"train_loss": -23.081571578979492, "global_step": 131812, "epoch": 1588} {"train_loss": -22.80518913269043, "global_step": 131813, "epoch": 1588} {"train_loss": -22.302392959594727, "global_step": 131814, "epoch": 1588} {"train_loss": -22.646108627319336, "global_step": 131815, "epoch": 1588} {"train_loss": -22.55079460144043, "global_step": 131816, "epoch": 1588} {"train_loss": -22.633136749267578, "global_step": 131817, "epoch": 1588} {"train_loss": -22.4696044921875, "global_step": 131818, "epoch": 1588} {"train_loss": -22.740957260131836, "global_step": 131819, "epoch": 1588} {"train_loss": -22.71161460876465, "global_step": 131820, "epoch": 1588} {"train_loss": -22.614919662475586, "global_step": 131821, "epoch": 1588} {"train_loss": -22.855588912963867, "global_step": 131822, "epoch": 1588} {"train_loss": -22.57760238647461, "global_step": 131823, "epoch": 1588} {"train_loss": -22.863636016845703, "global_step": 131824, "epoch": 1588} {"train_loss": -22.642282485961914, "global_step": 131825, "epoch": 1588} {"train_loss": -23.026580810546875, "global_step": 131826, "epoch": 1588} {"train_loss": -22.741689682006836, "global_step": 131827, "epoch": 1588} {"train_loss": -22.775365829467773, "global_step": 131828, "epoch": 1588} {"train_loss": -22.65677261352539, "global_step": 131829, "epoch": 1588} {"train_loss": -22.857593536376953, "global_step": 131830, "epoch": 1588} {"train_loss": -22.56757354736328, "global_step": 131831, "epoch": 1588} {"train_loss": -22.62041664123535, "global_step": 131832, "epoch": 1588} {"train_loss": -23.20767593383789, "global_step": 131833, "epoch": 1588} {"train_loss": -22.512161254882812, "global_step": 131834, "epoch": 1588} {"train_loss": -22.92036247253418, "global_step": 131835, "epoch": 1588} {"train_loss": -22.712003707885742, "global_step": 131836, "epoch": 1588} {"train_loss": -23.15462303161621, "global_step": 131837, "epoch": 1588} {"train_loss": -22.71446990966797, "global_step": 131838, "epoch": 1588} {"train_loss": -22.944761276245117, "global_step": 131839, "epoch": 1588} {"train_loss": -22.939929962158203, "global_step": 131840, "epoch": 1588} {"train_loss": -22.76235008239746, "global_step": 131841, "epoch": 1588} {"train_loss": -23.1534366607666, "global_step": 131842, "epoch": 1588} {"train_loss": -22.8754825592041, "global_step": 131843, "epoch": 1588} {"train_loss": -23.076148986816406, "global_step": 131844, "epoch": 1588} {"train_loss": -22.642179489135742, "global_step": 131845, "epoch": 1588} {"train_loss": -22.554492950439453, "global_step": 131846, "epoch": 1588} {"train_loss": -22.937665939331055, "global_step": 131847, "epoch": 1588} {"train_loss": -22.6547794342041, "global_step": 131848, "epoch": 1588} {"train_loss": -22.90068244934082, "global_step": 131849, "epoch": 1588} {"train_loss": -22.71952247619629, "global_step": 131850, "epoch": 1588} {"train_loss": -22.65611457824707, "global_step": 131851, "epoch": 1588} {"train_loss": -22.660810470581055, "global_step": 131852, "epoch": 1588} {"train_loss": -23.135610580444336, "global_step": 131853, "epoch": 1588} {"train_loss": -22.96373748779297, "global_step": 131854, "epoch": 1588} {"train_loss": -23.144880294799805, "global_step": 131855, "epoch": 1588} {"train_loss": -23.16202735900879, "global_step": 131856, "epoch": 1588} {"train_loss": -22.806787490844727, "global_step": 131857, "epoch": 1588} {"train_loss": -23.261850357055664, "global_step": 131858, "epoch": 1588} {"train_loss": -22.88797378540039, "global_step": 131859, "epoch": 1588} {"train_loss": -22.715578079223633, "global_step": 131860, "epoch": 1588} {"train_loss": -22.556974411010742, "global_step": 131861, "epoch": 1588} {"train_loss": -22.78501319885254, "global_step": 131862, "epoch": 1588} {"train_loss": -22.84588623046875, "global_step": 131863, "epoch": 1588} {"train_loss": -23.10431671142578, "global_step": 131864, "epoch": 1588} {"train_loss": -23.200162887573242, "global_step": 131865, "epoch": 1588} {"train_loss": -22.7174072265625, "global_step": 131866, "epoch": 1588} {"train_loss": -22.984628677368164, "global_step": 131867, "epoch": 1588} {"train_loss": -23.153305053710938, "global_step": 131868, "epoch": 1588} {"train_loss": -23.17780876159668, "global_step": 131869, "epoch": 1588} {"train_loss": -22.466575622558594, "global_step": 131870, "epoch": 1588} {"train_loss": -23.150634765625, "global_step": 131871, "epoch": 1588} {"train_loss": -22.99306297302246, "global_step": 131872, "epoch": 1588} {"train_loss": -22.993539810180664, "global_step": 131873, "epoch": 1588} {"train_loss": -22.907899856567383, "global_step": 131874, "epoch": 1588} {"train_loss": -23.056928634643555, "global_step": 131875, "epoch": 1588} {"train_loss": -22.682498931884766, "global_step": 131876, "epoch": 1588} {"train_loss": -22.910200119018555, "global_step": 131877, "epoch": 1588} {"train_loss": -23.255090713500977, "global_step": 131878, "epoch": 1588} {"train_loss": -23.04908561706543, "global_step": 131879, "epoch": 1588} {"train_loss": -22.627573013305664, "global_step": 131880, "epoch": 1588} {"train_loss": -22.91570281982422, "global_step": 131881, "epoch": 1588} {"train_loss": -22.900644302368164, "global_step": 131882, "epoch": 1588} {"train_loss": -22.809072494506836, "global_step": 131883, "epoch": 1588} {"train_loss": -23.15215492248535, "global_step": 131884, "epoch": 1588} {"train_loss": -22.79524803161621, "global_step": 131885, "epoch": 1588} {"train_loss": -22.862974373691053, "global_step": 131886, "epoch": 1588, "val_loss": 6267278.0} {"train_loss": -22.852508544921875, "global_step": 131887, "epoch": 1589} {"train_loss": -22.062610626220703, "global_step": 131888, "epoch": 1589} {"train_loss": -22.584463119506836, "global_step": 131889, "epoch": 1589} {"train_loss": -22.559906005859375, "global_step": 131890, "epoch": 1589} {"train_loss": -22.26577377319336, "global_step": 131891, "epoch": 1589} {"train_loss": -22.939123153686523, "global_step": 131892, "epoch": 1589} {"train_loss": -22.8133487701416, "global_step": 131893, "epoch": 1589} {"train_loss": -22.87105941772461, "global_step": 131894, "epoch": 1589} {"train_loss": -22.703733444213867, "global_step": 131895, "epoch": 1589} {"train_loss": -22.925567626953125, "global_step": 131896, "epoch": 1589} {"train_loss": -22.824941635131836, "global_step": 131897, "epoch": 1589} {"train_loss": -22.58926773071289, "global_step": 131898, "epoch": 1589} {"train_loss": -22.613401412963867, "global_step": 131899, "epoch": 1589} {"train_loss": -22.47234535217285, "global_step": 131900, "epoch": 1589} {"train_loss": -22.475650787353516, "global_step": 131901, "epoch": 1589} {"train_loss": -22.38972282409668, "global_step": 131902, "epoch": 1589} {"train_loss": -22.42568016052246, "global_step": 131903, "epoch": 1589} {"train_loss": -22.596418380737305, "global_step": 131904, "epoch": 1589} {"train_loss": -22.92275047302246, "global_step": 131905, "epoch": 1589} {"train_loss": -22.823768615722656, "global_step": 131906, "epoch": 1589} {"train_loss": -22.7215576171875, "global_step": 131907, "epoch": 1589} {"train_loss": -22.750686645507812, "global_step": 131908, "epoch": 1589} {"train_loss": -23.1788387298584, "global_step": 131909, "epoch": 1589} {"train_loss": -22.820491790771484, "global_step": 131910, "epoch": 1589} {"train_loss": -22.656705856323242, "global_step": 131911, "epoch": 1589} {"train_loss": -23.255632400512695, "global_step": 131912, "epoch": 1589} {"train_loss": -23.004140853881836, "global_step": 131913, "epoch": 1589} {"train_loss": -22.6310977935791, "global_step": 131914, "epoch": 1589} {"train_loss": -23.270462036132812, "global_step": 131915, "epoch": 1589} {"train_loss": -23.13114356994629, "global_step": 131916, "epoch": 1589} {"train_loss": -22.81499671936035, "global_step": 131917, "epoch": 1589} {"train_loss": -23.169946670532227, "global_step": 131918, "epoch": 1589} {"train_loss": -22.85677146911621, "global_step": 131919, "epoch": 1589} {"train_loss": -22.937192916870117, "global_step": 131920, "epoch": 1589} {"train_loss": -23.04903793334961, "global_step": 131921, "epoch": 1589} {"train_loss": -22.803979873657227, "global_step": 131922, "epoch": 1589} {"train_loss": -22.848464965820312, "global_step": 131923, "epoch": 1589} {"train_loss": -22.574445724487305, "global_step": 131924, "epoch": 1589} {"train_loss": -22.58476448059082, "global_step": 131925, "epoch": 1589} {"train_loss": -22.4656925201416, "global_step": 131926, "epoch": 1589} {"train_loss": -23.04996109008789, "global_step": 131927, "epoch": 1589} {"train_loss": -22.59481430053711, "global_step": 131928, "epoch": 1589} {"train_loss": -22.839969635009766, "global_step": 131929, "epoch": 1589} {"train_loss": -23.14522361755371, "global_step": 131930, "epoch": 1589} {"train_loss": -22.832773208618164, "global_step": 131931, "epoch": 1589} {"train_loss": -22.88556480407715, "global_step": 131932, "epoch": 1589} {"train_loss": -22.684471130371094, "global_step": 131933, "epoch": 1589} {"train_loss": -22.753324508666992, "global_step": 131934, "epoch": 1589} {"train_loss": -22.910837173461914, "global_step": 131935, "epoch": 1589} {"train_loss": -22.89972496032715, "global_step": 131936, "epoch": 1589} {"train_loss": -22.97203254699707, "global_step": 131937, "epoch": 1589} {"train_loss": -22.903188705444336, "global_step": 131938, "epoch": 1589} {"train_loss": -22.608200073242188, "global_step": 131939, "epoch": 1589} {"train_loss": -22.92966651916504, "global_step": 131940, "epoch": 1589} {"train_loss": -23.122312545776367, "global_step": 131941, "epoch": 1589} {"train_loss": -22.67763328552246, "global_step": 131942, "epoch": 1589} {"train_loss": -22.78544807434082, "global_step": 131943, "epoch": 1589} {"train_loss": -23.300140380859375, "global_step": 131944, "epoch": 1589} {"train_loss": -22.8749942779541, "global_step": 131945, "epoch": 1589} {"train_loss": -23.21857452392578, "global_step": 131946, "epoch": 1589} {"train_loss": -22.51774024963379, "global_step": 131947, "epoch": 1589} {"train_loss": -22.75824737548828, "global_step": 131948, "epoch": 1589} {"train_loss": -23.043447494506836, "global_step": 131949, "epoch": 1589} {"train_loss": -22.619800567626953, "global_step": 131950, "epoch": 1589} {"train_loss": -23.064245223999023, "global_step": 131951, "epoch": 1589} {"train_loss": -23.029855728149414, "global_step": 131952, "epoch": 1589} {"train_loss": -22.66965675354004, "global_step": 131953, "epoch": 1589} {"train_loss": -23.064130783081055, "global_step": 131954, "epoch": 1589} {"train_loss": -22.941614151000977, "global_step": 131955, "epoch": 1589} {"train_loss": -22.748594284057617, "global_step": 131956, "epoch": 1589} {"train_loss": -22.928945541381836, "global_step": 131957, "epoch": 1589} {"train_loss": -22.864126205444336, "global_step": 131958, "epoch": 1589} {"train_loss": -22.836156845092773, "global_step": 131959, "epoch": 1589} {"train_loss": -22.685544967651367, "global_step": 131960, "epoch": 1589} {"train_loss": -23.0116024017334, "global_step": 131961, "epoch": 1589} {"train_loss": -22.73189353942871, "global_step": 131962, "epoch": 1589} {"train_loss": -22.46040916442871, "global_step": 131963, "epoch": 1589} {"train_loss": -22.628528594970703, "global_step": 131964, "epoch": 1589} {"train_loss": -22.800899505615234, "global_step": 131965, "epoch": 1589} {"train_loss": -22.654829025268555, "global_step": 131966, "epoch": 1589} {"train_loss": -22.738759994506836, "global_step": 131967, "epoch": 1589} {"train_loss": -22.558252334594727, "global_step": 131968, "epoch": 1589} {"train_loss": -22.79336065269378, "global_step": 131969, "epoch": 1589, "val_loss": 6362423.5} {"train_loss": -21.617156982421875, "global_step": 131970, "epoch": 1590} {"train_loss": -21.98079490661621, "global_step": 131971, "epoch": 1590} {"train_loss": -22.31474494934082, "global_step": 131972, "epoch": 1590} {"train_loss": -22.05776023864746, "global_step": 131973, "epoch": 1590} {"train_loss": -22.626020431518555, "global_step": 131974, "epoch": 1590} {"train_loss": -22.071001052856445, "global_step": 131975, "epoch": 1590} {"train_loss": -22.578115463256836, "global_step": 131976, "epoch": 1590} {"train_loss": -22.62504005432129, "global_step": 131977, "epoch": 1590} {"train_loss": -22.115116119384766, "global_step": 131978, "epoch": 1590} {"train_loss": -22.475107192993164, "global_step": 131979, "epoch": 1590} {"train_loss": -22.378271102905273, "global_step": 131980, "epoch": 1590} {"train_loss": -22.39807891845703, "global_step": 131981, "epoch": 1590} {"train_loss": -22.70526123046875, "global_step": 131982, "epoch": 1590} {"train_loss": -22.2351016998291, "global_step": 131983, "epoch": 1590} {"train_loss": -22.25083351135254, "global_step": 131984, "epoch": 1590} {"train_loss": -22.224369049072266, "global_step": 131985, "epoch": 1590} {"train_loss": -22.359540939331055, "global_step": 131986, "epoch": 1590} {"train_loss": -22.437265396118164, "global_step": 131987, "epoch": 1590} {"train_loss": -22.12334442138672, "global_step": 131988, "epoch": 1590} {"train_loss": -22.09147071838379, "global_step": 131989, "epoch": 1590} {"train_loss": -22.58390235900879, "global_step": 131990, "epoch": 1590} {"train_loss": -22.743906021118164, "global_step": 131991, "epoch": 1590} {"train_loss": -22.89126968383789, "global_step": 131992, "epoch": 1590} {"train_loss": -22.67913818359375, "global_step": 131993, "epoch": 1590} {"train_loss": -22.783775329589844, "global_step": 131994, "epoch": 1590} {"train_loss": -22.8155460357666, "global_step": 131995, "epoch": 1590} {"train_loss": -22.56122398376465, "global_step": 131996, "epoch": 1590} {"train_loss": -22.744525909423828, "global_step": 131997, "epoch": 1590} {"train_loss": -22.882678985595703, "global_step": 131998, "epoch": 1590} {"train_loss": -22.471784591674805, "global_step": 131999, "epoch": 1590} {"train_loss": -22.86943817138672, "global_step": 132000, "epoch": 1590} {"train_loss": -22.83261489868164, "global_step": 132001, "epoch": 1590} {"train_loss": -22.564247131347656, "global_step": 132002, "epoch": 1590} {"train_loss": -22.64204978942871, "global_step": 132003, "epoch": 1590} {"train_loss": -22.533918380737305, "global_step": 132004, "epoch": 1590} {"train_loss": -22.61488151550293, "global_step": 132005, "epoch": 1590} {"train_loss": -22.81949234008789, "global_step": 132006, "epoch": 1590} {"train_loss": -22.924224853515625, "global_step": 132007, "epoch": 1590} {"train_loss": -22.74116325378418, "global_step": 132008, "epoch": 1590} {"train_loss": -23.10024642944336, "global_step": 132009, "epoch": 1590} {"train_loss": -23.0366153717041, "global_step": 132010, "epoch": 1590} {"train_loss": -22.749286651611328, "global_step": 132011, "epoch": 1590} {"train_loss": -22.797487258911133, "global_step": 132012, "epoch": 1590} {"train_loss": -22.74309539794922, "global_step": 132013, "epoch": 1590} {"train_loss": -22.92789077758789, "global_step": 132014, "epoch": 1590} {"train_loss": -22.71489906311035, "global_step": 132015, "epoch": 1590} {"train_loss": -22.908952713012695, "global_step": 132016, "epoch": 1590} {"train_loss": -22.654014587402344, "global_step": 132017, "epoch": 1590} {"train_loss": -23.09257698059082, "global_step": 132018, "epoch": 1590} {"train_loss": -22.80449867248535, "global_step": 132019, "epoch": 1590} {"train_loss": -23.018030166625977, "global_step": 132020, "epoch": 1590} {"train_loss": -22.890911102294922, "global_step": 132021, "epoch": 1590} {"train_loss": -22.917766571044922, "global_step": 132022, "epoch": 1590} {"train_loss": -23.030582427978516, "global_step": 132023, "epoch": 1590} {"train_loss": -23.366052627563477, "global_step": 132024, "epoch": 1590} {"train_loss": -22.930601119995117, "global_step": 132025, "epoch": 1590} {"train_loss": -23.01161003112793, "global_step": 132026, "epoch": 1590} {"train_loss": -22.774492263793945, "global_step": 132027, "epoch": 1590} {"train_loss": -22.593231201171875, "global_step": 132028, "epoch": 1590} {"train_loss": -22.753768920898438, "global_step": 132029, "epoch": 1590} {"train_loss": -23.118141174316406, "global_step": 132030, "epoch": 1590} {"train_loss": -22.787500381469727, "global_step": 132031, "epoch": 1590} {"train_loss": -22.676544189453125, "global_step": 132032, "epoch": 1590} {"train_loss": -22.734560012817383, "global_step": 132033, "epoch": 1590} {"train_loss": -22.697635650634766, "global_step": 132034, "epoch": 1590} {"train_loss": -23.077632904052734, "global_step": 132035, "epoch": 1590} {"train_loss": -23.336824417114258, "global_step": 132036, "epoch": 1590} {"train_loss": -23.015806198120117, "global_step": 132037, "epoch": 1590} {"train_loss": -22.913288116455078, "global_step": 132038, "epoch": 1590} {"train_loss": -22.91265869140625, "global_step": 132039, "epoch": 1590} {"train_loss": -22.706811904907227, "global_step": 132040, "epoch": 1590} {"train_loss": -22.886552810668945, "global_step": 132041, "epoch": 1590} {"train_loss": -22.656925201416016, "global_step": 132042, "epoch": 1590} {"train_loss": -23.14786148071289, "global_step": 132043, "epoch": 1590} {"train_loss": -22.793310165405273, "global_step": 132044, "epoch": 1590} {"train_loss": -22.737934112548828, "global_step": 132045, "epoch": 1590} {"train_loss": -22.926055908203125, "global_step": 132046, "epoch": 1590} {"train_loss": -22.766998291015625, "global_step": 132047, "epoch": 1590} {"train_loss": -22.7471923828125, "global_step": 132048, "epoch": 1590} {"train_loss": -22.51541519165039, "global_step": 132049, "epoch": 1590} {"train_loss": -23.103668212890625, "global_step": 132050, "epoch": 1590} {"train_loss": -22.966617584228516, "global_step": 132051, "epoch": 1590} {"train_loss": -22.68453873783709, "global_step": 132052, "epoch": 1590, "val_loss": 6260755.0} {"train_loss": -22.09766387939453, "global_step": 132053, "epoch": 1591} {"train_loss": -22.52556037902832, "global_step": 132054, "epoch": 1591} {"train_loss": -22.453969955444336, "global_step": 132055, "epoch": 1591} {"train_loss": -22.459020614624023, "global_step": 132056, "epoch": 1591} {"train_loss": -22.351667404174805, "global_step": 132057, "epoch": 1591} {"train_loss": -22.531646728515625, "global_step": 132058, "epoch": 1591} {"train_loss": -22.473770141601562, "global_step": 132059, "epoch": 1591} {"train_loss": -22.33099365234375, "global_step": 132060, "epoch": 1591} {"train_loss": -22.758649826049805, "global_step": 132061, "epoch": 1591} {"train_loss": -22.476137161254883, "global_step": 132062, "epoch": 1591} {"train_loss": -22.83735466003418, "global_step": 132063, "epoch": 1591} {"train_loss": -22.846240997314453, "global_step": 132064, "epoch": 1591} {"train_loss": -22.56915855407715, "global_step": 132065, "epoch": 1591} {"train_loss": -22.535558700561523, "global_step": 132066, "epoch": 1591} {"train_loss": -22.49148178100586, "global_step": 132067, "epoch": 1591} {"train_loss": -22.556333541870117, "global_step": 132068, "epoch": 1591} {"train_loss": -22.422454833984375, "global_step": 132069, "epoch": 1591} {"train_loss": -22.607440948486328, "global_step": 132070, "epoch": 1591} {"train_loss": -22.76199722290039, "global_step": 132071, "epoch": 1591} {"train_loss": -22.61212730407715, "global_step": 132072, "epoch": 1591} {"train_loss": -22.95008659362793, "global_step": 132073, "epoch": 1591} {"train_loss": -22.51503562927246, "global_step": 132074, "epoch": 1591} {"train_loss": -22.779508590698242, "global_step": 132075, "epoch": 1591} {"train_loss": -22.674779891967773, "global_step": 132076, "epoch": 1591} {"train_loss": -22.98175048828125, "global_step": 132077, "epoch": 1591} {"train_loss": -22.530073165893555, "global_step": 132078, "epoch": 1591} {"train_loss": -23.016515731811523, "global_step": 132079, "epoch": 1591} {"train_loss": -22.847681045532227, "global_step": 132080, "epoch": 1591} {"train_loss": -22.72119903564453, "global_step": 132081, "epoch": 1591} {"train_loss": -23.07395362854004, "global_step": 132082, "epoch": 1591} {"train_loss": -22.785083770751953, "global_step": 132083, "epoch": 1591} {"train_loss": -22.881607055664062, "global_step": 132084, "epoch": 1591} {"train_loss": -22.848527908325195, "global_step": 132085, "epoch": 1591} {"train_loss": -22.531024932861328, "global_step": 132086, "epoch": 1591} {"train_loss": -22.55129623413086, "global_step": 132087, "epoch": 1591} {"train_loss": -23.1722412109375, "global_step": 132088, "epoch": 1591} {"train_loss": -23.365097045898438, "global_step": 132089, "epoch": 1591} {"train_loss": -23.00476837158203, "global_step": 132090, "epoch": 1591} {"train_loss": -23.167911529541016, "global_step": 132091, "epoch": 1591} {"train_loss": -22.884307861328125, "global_step": 132092, "epoch": 1591} {"train_loss": -22.964643478393555, "global_step": 132093, "epoch": 1591} {"train_loss": -23.022058486938477, "global_step": 132094, "epoch": 1591} {"train_loss": -22.760101318359375, "global_step": 132095, "epoch": 1591} {"train_loss": -22.36083984375, "global_step": 132096, "epoch": 1591} {"train_loss": -22.85888671875, "global_step": 132097, "epoch": 1591} {"train_loss": -22.801406860351562, "global_step": 132098, "epoch": 1591} {"train_loss": -23.067472457885742, "global_step": 132099, "epoch": 1591} {"train_loss": -23.351682662963867, "global_step": 132100, "epoch": 1591} {"train_loss": -23.019800186157227, "global_step": 132101, "epoch": 1591} {"train_loss": -22.853849411010742, "global_step": 132102, "epoch": 1591} {"train_loss": -22.822507858276367, "global_step": 132103, "epoch": 1591} {"train_loss": -22.52943992614746, "global_step": 132104, "epoch": 1591} {"train_loss": -22.57343101501465, "global_step": 132105, "epoch": 1591} {"train_loss": -22.909971237182617, "global_step": 132106, "epoch": 1591} {"train_loss": -22.65860939025879, "global_step": 132107, "epoch": 1591} {"train_loss": -23.054325103759766, "global_step": 132108, "epoch": 1591} {"train_loss": -23.150144577026367, "global_step": 132109, "epoch": 1591} {"train_loss": -22.71116065979004, "global_step": 132110, "epoch": 1591} {"train_loss": -23.1523494720459, "global_step": 132111, "epoch": 1591} {"train_loss": -23.137861251831055, "global_step": 132112, "epoch": 1591} {"train_loss": -23.198713302612305, "global_step": 132113, "epoch": 1591} {"train_loss": -22.578794479370117, "global_step": 132114, "epoch": 1591} {"train_loss": -22.831785202026367, "global_step": 132115, "epoch": 1591} {"train_loss": -23.047189712524414, "global_step": 132116, "epoch": 1591} {"train_loss": -22.644453048706055, "global_step": 132117, "epoch": 1591} {"train_loss": -22.82647705078125, "global_step": 132118, "epoch": 1591} {"train_loss": -23.085805892944336, "global_step": 132119, "epoch": 1591} {"train_loss": -22.92262077331543, "global_step": 132120, "epoch": 1591} {"train_loss": -22.86533546447754, "global_step": 132121, "epoch": 1591} {"train_loss": -22.510406494140625, "global_step": 132122, "epoch": 1591} {"train_loss": -23.26825714111328, "global_step": 132123, "epoch": 1591} {"train_loss": -22.819528579711914, "global_step": 132124, "epoch": 1591} {"train_loss": -22.63066864013672, "global_step": 132125, "epoch": 1591} {"train_loss": -22.91952896118164, "global_step": 132126, "epoch": 1591} {"train_loss": -22.886947631835938, "global_step": 132127, "epoch": 1591} {"train_loss": -22.920501708984375, "global_step": 132128, "epoch": 1591} {"train_loss": -22.654226303100586, "global_step": 132129, "epoch": 1591} {"train_loss": -22.134033203125, "global_step": 132130, "epoch": 1591} {"train_loss": -22.48062515258789, "global_step": 132131, "epoch": 1591} {"train_loss": -22.85371208190918, "global_step": 132132, "epoch": 1591} {"train_loss": -22.677993774414062, "global_step": 132133, "epoch": 1591} {"train_loss": -23.045669555664062, "global_step": 132134, "epoch": 1591} {"train_loss": -22.755879229809864, "global_step": 132135, "epoch": 1591, "val_loss": 6316991.0} {"train_loss": -21.745182037353516, "global_step": 132136, "epoch": 1592} {"train_loss": -22.70639991760254, "global_step": 132137, "epoch": 1592} {"train_loss": -23.1225528717041, "global_step": 132138, "epoch": 1592} {"train_loss": -22.549896240234375, "global_step": 132139, "epoch": 1592} {"train_loss": -22.4901065826416, "global_step": 132140, "epoch": 1592} {"train_loss": -22.456756591796875, "global_step": 132141, "epoch": 1592} {"train_loss": -22.662729263305664, "global_step": 132142, "epoch": 1592} {"train_loss": -22.596555709838867, "global_step": 132143, "epoch": 1592} {"train_loss": -22.369304656982422, "global_step": 132144, "epoch": 1592} {"train_loss": -22.319082260131836, "global_step": 132145, "epoch": 1592} {"train_loss": -22.4558048248291, "global_step": 132146, "epoch": 1592} {"train_loss": -22.71124267578125, "global_step": 132147, "epoch": 1592} {"train_loss": -22.78598403930664, "global_step": 132148, "epoch": 1592} {"train_loss": -22.846187591552734, "global_step": 132149, "epoch": 1592} {"train_loss": -22.664030075073242, "global_step": 132150, "epoch": 1592} {"train_loss": -22.801029205322266, "global_step": 132151, "epoch": 1592} {"train_loss": -22.38007164001465, "global_step": 132152, "epoch": 1592} {"train_loss": -22.60091781616211, "global_step": 132153, "epoch": 1592} {"train_loss": -22.674001693725586, "global_step": 132154, "epoch": 1592} {"train_loss": -22.513866424560547, "global_step": 132155, "epoch": 1592} {"train_loss": -22.738113403320312, "global_step": 132156, "epoch": 1592} {"train_loss": -22.857057571411133, "global_step": 132157, "epoch": 1592} {"train_loss": -22.514169692993164, "global_step": 132158, "epoch": 1592} {"train_loss": -22.99867820739746, "global_step": 132159, "epoch": 1592} {"train_loss": -22.740690231323242, "global_step": 132160, "epoch": 1592} {"train_loss": -22.547834396362305, "global_step": 132161, "epoch": 1592} {"train_loss": -23.059507369995117, "global_step": 132162, "epoch": 1592} {"train_loss": -22.572860717773438, "global_step": 132163, "epoch": 1592} {"train_loss": -23.190412521362305, "global_step": 132164, "epoch": 1592} {"train_loss": -22.35590934753418, "global_step": 132165, "epoch": 1592} {"train_loss": -23.2088565826416, "global_step": 132166, "epoch": 1592} {"train_loss": -22.744123458862305, "global_step": 132167, "epoch": 1592} {"train_loss": -22.53931427001953, "global_step": 132168, "epoch": 1592} {"train_loss": -22.999530792236328, "global_step": 132169, "epoch": 1592} {"train_loss": -22.914026260375977, "global_step": 132170, "epoch": 1592} {"train_loss": -22.93402862548828, "global_step": 132171, "epoch": 1592} {"train_loss": -22.783702850341797, "global_step": 132172, "epoch": 1592} {"train_loss": -23.311582565307617, "global_step": 132173, "epoch": 1592} {"train_loss": -22.516462326049805, "global_step": 132174, "epoch": 1592} {"train_loss": -23.299110412597656, "global_step": 132175, "epoch": 1592} {"train_loss": -22.770078659057617, "global_step": 132176, "epoch": 1592} {"train_loss": -22.74784278869629, "global_step": 132177, "epoch": 1592} {"train_loss": -22.403717041015625, "global_step": 132178, "epoch": 1592} {"train_loss": -22.68868064880371, "global_step": 132179, "epoch": 1592} {"train_loss": -22.868085861206055, "global_step": 132180, "epoch": 1592} {"train_loss": -22.581357955932617, "global_step": 132181, "epoch": 1592} {"train_loss": -22.789567947387695, "global_step": 132182, "epoch": 1592} {"train_loss": -22.894372940063477, "global_step": 132183, "epoch": 1592} {"train_loss": -22.94296646118164, "global_step": 132184, "epoch": 1592} {"train_loss": -22.631038665771484, "global_step": 132185, "epoch": 1592} {"train_loss": -22.833768844604492, "global_step": 132186, "epoch": 1592} {"train_loss": -22.983108520507812, "global_step": 132187, "epoch": 1592} {"train_loss": -22.972177505493164, "global_step": 132188, "epoch": 1592} {"train_loss": -22.983474731445312, "global_step": 132189, "epoch": 1592} {"train_loss": -22.79501724243164, "global_step": 132190, "epoch": 1592} {"train_loss": -23.101470947265625, "global_step": 132191, "epoch": 1592} {"train_loss": -22.845653533935547, "global_step": 132192, "epoch": 1592} {"train_loss": -22.915712356567383, "global_step": 132193, "epoch": 1592} {"train_loss": -22.995716094970703, "global_step": 132194, "epoch": 1592} {"train_loss": -22.640417098999023, "global_step": 132195, "epoch": 1592} {"train_loss": -23.237136840820312, "global_step": 132196, "epoch": 1592} {"train_loss": -22.642974853515625, "global_step": 132197, "epoch": 1592} {"train_loss": -23.121877670288086, "global_step": 132198, "epoch": 1592} {"train_loss": -23.024402618408203, "global_step": 132199, "epoch": 1592} {"train_loss": -22.7947940826416, "global_step": 132200, "epoch": 1592} {"train_loss": -22.67217445373535, "global_step": 132201, "epoch": 1592} {"train_loss": -23.143451690673828, "global_step": 132202, "epoch": 1592} {"train_loss": -22.651290893554688, "global_step": 132203, "epoch": 1592} {"train_loss": -23.095951080322266, "global_step": 132204, "epoch": 1592} {"train_loss": -23.056859970092773, "global_step": 132205, "epoch": 1592} {"train_loss": -23.013479232788086, "global_step": 132206, "epoch": 1592} {"train_loss": -22.42603874206543, "global_step": 132207, "epoch": 1592} {"train_loss": -23.128402709960938, "global_step": 132208, "epoch": 1592} {"train_loss": -22.8686580657959, "global_step": 132209, "epoch": 1592} {"train_loss": -23.1076602935791, "global_step": 132210, "epoch": 1592} {"train_loss": -22.974531173706055, "global_step": 132211, "epoch": 1592} {"train_loss": -22.908761978149414, "global_step": 132212, "epoch": 1592} {"train_loss": -22.64158058166504, "global_step": 132213, "epoch": 1592} {"train_loss": -22.76758575439453, "global_step": 132214, "epoch": 1592} {"train_loss": -22.67571449279785, "global_step": 132215, "epoch": 1592} {"train_loss": -22.956954956054688, "global_step": 132216, "epoch": 1592} {"train_loss": -22.728397369384766, "global_step": 132217, "epoch": 1592} {"train_loss": -22.772572850606526, "global_step": 132218, "epoch": 1592, "val_loss": 6274593.5} {"train_loss": -22.492300033569336, "global_step": 132219, "epoch": 1593} {"train_loss": -22.51999855041504, "global_step": 132220, "epoch": 1593} {"train_loss": -22.68562889099121, "global_step": 132221, "epoch": 1593} {"train_loss": -23.07686996459961, "global_step": 132222, "epoch": 1593} {"train_loss": -22.467823028564453, "global_step": 132223, "epoch": 1593} {"train_loss": -22.326984405517578, "global_step": 132224, "epoch": 1593} {"train_loss": -22.86980628967285, "global_step": 132225, "epoch": 1593} {"train_loss": -22.7863826751709, "global_step": 132226, "epoch": 1593} {"train_loss": -22.8031063079834, "global_step": 132227, "epoch": 1593} {"train_loss": -22.642227172851562, "global_step": 132228, "epoch": 1593} {"train_loss": -22.43112564086914, "global_step": 132229, "epoch": 1593} {"train_loss": -22.71798324584961, "global_step": 132230, "epoch": 1593} {"train_loss": -22.428884506225586, "global_step": 132231, "epoch": 1593} {"train_loss": -22.958417892456055, "global_step": 132232, "epoch": 1593} {"train_loss": -22.7808780670166, "global_step": 132233, "epoch": 1593} {"train_loss": -22.527830123901367, "global_step": 132234, "epoch": 1593} {"train_loss": -22.624326705932617, "global_step": 132235, "epoch": 1593} {"train_loss": -22.76248550415039, "global_step": 132236, "epoch": 1593} {"train_loss": -22.664426803588867, "global_step": 132237, "epoch": 1593} {"train_loss": -22.620132446289062, "global_step": 132238, "epoch": 1593} {"train_loss": -22.9029598236084, "global_step": 132239, "epoch": 1593} {"train_loss": -22.936710357666016, "global_step": 132240, "epoch": 1593} {"train_loss": -22.998947143554688, "global_step": 132241, "epoch": 1593} {"train_loss": -22.71792221069336, "global_step": 132242, "epoch": 1593} {"train_loss": -22.815032958984375, "global_step": 132243, "epoch": 1593} {"train_loss": -23.141103744506836, "global_step": 132244, "epoch": 1593} {"train_loss": -22.70136070251465, "global_step": 132245, "epoch": 1593} {"train_loss": -22.733346939086914, "global_step": 132246, "epoch": 1593} {"train_loss": -22.39021110534668, "global_step": 132247, "epoch": 1593} {"train_loss": -23.099626541137695, "global_step": 132248, "epoch": 1593} {"train_loss": -22.717453002929688, "global_step": 132249, "epoch": 1593} {"train_loss": -22.64358901977539, "global_step": 132250, "epoch": 1593} {"train_loss": -23.24883460998535, "global_step": 132251, "epoch": 1593} {"train_loss": -23.01563835144043, "global_step": 132252, "epoch": 1593} {"train_loss": -22.71396255493164, "global_step": 132253, "epoch": 1593} {"train_loss": -22.86762809753418, "global_step": 132254, "epoch": 1593} {"train_loss": -22.995479583740234, "global_step": 132255, "epoch": 1593} {"train_loss": -22.602128982543945, "global_step": 132256, "epoch": 1593} {"train_loss": -22.996259689331055, "global_step": 132257, "epoch": 1593} {"train_loss": -22.766233444213867, "global_step": 132258, "epoch": 1593} {"train_loss": -23.170507431030273, "global_step": 132259, "epoch": 1593} {"train_loss": -23.026220321655273, "global_step": 132260, "epoch": 1593} {"train_loss": -22.853113174438477, "global_step": 132261, "epoch": 1593} {"train_loss": -22.43709373474121, "global_step": 132262, "epoch": 1593} {"train_loss": -23.156362533569336, "global_step": 132263, "epoch": 1593} {"train_loss": -22.828657150268555, "global_step": 132264, "epoch": 1593} {"train_loss": -23.167255401611328, "global_step": 132265, "epoch": 1593} {"train_loss": -22.7729549407959, "global_step": 132266, "epoch": 1593} {"train_loss": -23.021024703979492, "global_step": 132267, "epoch": 1593} {"train_loss": -22.53472137451172, "global_step": 132268, "epoch": 1593} {"train_loss": -22.7371883392334, "global_step": 132269, "epoch": 1593} {"train_loss": -22.82197380065918, "global_step": 132270, "epoch": 1593} {"train_loss": -22.995403289794922, "global_step": 132271, "epoch": 1593} {"train_loss": -22.71038055419922, "global_step": 132272, "epoch": 1593} {"train_loss": -22.788381576538086, "global_step": 132273, "epoch": 1593} {"train_loss": -22.453310012817383, "global_step": 132274, "epoch": 1593} {"train_loss": -22.963184356689453, "global_step": 132275, "epoch": 1593} {"train_loss": -22.784564971923828, "global_step": 132276, "epoch": 1593} {"train_loss": -22.74509620666504, "global_step": 132277, "epoch": 1593} {"train_loss": -23.035001754760742, "global_step": 132278, "epoch": 1593} {"train_loss": -22.750873565673828, "global_step": 132279, "epoch": 1593} {"train_loss": -22.713035583496094, "global_step": 132280, "epoch": 1593} {"train_loss": -22.94057273864746, "global_step": 132281, "epoch": 1593} {"train_loss": -22.78107261657715, "global_step": 132282, "epoch": 1593} {"train_loss": -22.596832275390625, "global_step": 132283, "epoch": 1593} {"train_loss": -22.670211791992188, "global_step": 132284, "epoch": 1593} {"train_loss": -23.021757125854492, "global_step": 132285, "epoch": 1593} {"train_loss": -22.85518455505371, "global_step": 132286, "epoch": 1593} {"train_loss": -22.94671058654785, "global_step": 132287, "epoch": 1593} {"train_loss": -22.440902709960938, "global_step": 132288, "epoch": 1593} {"train_loss": -22.898212432861328, "global_step": 132289, "epoch": 1593} {"train_loss": -22.701919555664062, "global_step": 132290, "epoch": 1593} {"train_loss": -22.571367263793945, "global_step": 132291, "epoch": 1593} {"train_loss": -23.308399200439453, "global_step": 132292, "epoch": 1593} {"train_loss": -23.04144859313965, "global_step": 132293, "epoch": 1593} {"train_loss": -22.965652465820312, "global_step": 132294, "epoch": 1593} {"train_loss": -22.73746109008789, "global_step": 132295, "epoch": 1593} {"train_loss": -22.43337059020996, "global_step": 132296, "epoch": 1593} {"train_loss": -22.97567367553711, "global_step": 132297, "epoch": 1593} {"train_loss": -22.739322662353516, "global_step": 132298, "epoch": 1593} {"train_loss": -22.883893966674805, "global_step": 132299, "epoch": 1593} {"train_loss": -22.988996505737305, "global_step": 132300, "epoch": 1593} {"train_loss": -22.798129552818207, "global_step": 132301, "epoch": 1593, "val_loss": 6357743.0} {"train_loss": -22.334325790405273, "global_step": 132302, "epoch": 1594} {"train_loss": -22.934913635253906, "global_step": 132303, "epoch": 1594} {"train_loss": -22.718847274780273, "global_step": 132304, "epoch": 1594} {"train_loss": -22.488130569458008, "global_step": 132305, "epoch": 1594} {"train_loss": -22.617691040039062, "global_step": 132306, "epoch": 1594} {"train_loss": -22.85895538330078, "global_step": 132307, "epoch": 1594} {"train_loss": -22.651521682739258, "global_step": 132308, "epoch": 1594} {"train_loss": -22.59731674194336, "global_step": 132309, "epoch": 1594} {"train_loss": -22.884796142578125, "global_step": 132310, "epoch": 1594} {"train_loss": -22.670673370361328, "global_step": 132311, "epoch": 1594} {"train_loss": -22.431522369384766, "global_step": 132312, "epoch": 1594} {"train_loss": -22.261396408081055, "global_step": 132313, "epoch": 1594} {"train_loss": -22.810190200805664, "global_step": 132314, "epoch": 1594} {"train_loss": -22.74329376220703, "global_step": 132315, "epoch": 1594} {"train_loss": -22.66834831237793, "global_step": 132316, "epoch": 1594} {"train_loss": -23.014617919921875, "global_step": 132317, "epoch": 1594} {"train_loss": -22.76559829711914, "global_step": 132318, "epoch": 1594} {"train_loss": -22.690664291381836, "global_step": 132319, "epoch": 1594} {"train_loss": -22.57923698425293, "global_step": 132320, "epoch": 1594} {"train_loss": -22.960758209228516, "global_step": 132321, "epoch": 1594} {"train_loss": -22.829593658447266, "global_step": 132322, "epoch": 1594} {"train_loss": -22.827037811279297, "global_step": 132323, "epoch": 1594} {"train_loss": -23.034950256347656, "global_step": 132324, "epoch": 1594} {"train_loss": -22.96736717224121, "global_step": 132325, "epoch": 1594} {"train_loss": -23.02479362487793, "global_step": 132326, "epoch": 1594} {"train_loss": -22.564998626708984, "global_step": 132327, "epoch": 1594} {"train_loss": -22.931406021118164, "global_step": 132328, "epoch": 1594} {"train_loss": -22.75411033630371, "global_step": 132329, "epoch": 1594} {"train_loss": -23.07676887512207, "global_step": 132330, "epoch": 1594} {"train_loss": -22.95602035522461, "global_step": 132331, "epoch": 1594} {"train_loss": -22.83831787109375, "global_step": 132332, "epoch": 1594} {"train_loss": -22.856767654418945, "global_step": 132333, "epoch": 1594} {"train_loss": -22.985506057739258, "global_step": 132334, "epoch": 1594} {"train_loss": -22.69260597229004, "global_step": 132335, "epoch": 1594} {"train_loss": -22.984769821166992, "global_step": 132336, "epoch": 1594} {"train_loss": -23.057079315185547, "global_step": 132337, "epoch": 1594} {"train_loss": -22.628963470458984, "global_step": 132338, "epoch": 1594} {"train_loss": -22.85443115234375, "global_step": 132339, "epoch": 1594} {"train_loss": -23.173812866210938, "global_step": 132340, "epoch": 1594} {"train_loss": -23.02762794494629, "global_step": 132341, "epoch": 1594} {"train_loss": -22.589094161987305, "global_step": 132342, "epoch": 1594} {"train_loss": -22.620655059814453, "global_step": 132343, "epoch": 1594} {"train_loss": -23.071386337280273, "global_step": 132344, "epoch": 1594} {"train_loss": -23.06109046936035, "global_step": 132345, "epoch": 1594} {"train_loss": -22.833402633666992, "global_step": 132346, "epoch": 1594} {"train_loss": -23.02435302734375, "global_step": 132347, "epoch": 1594} {"train_loss": -23.199174880981445, "global_step": 132348, "epoch": 1594} {"train_loss": -22.775545120239258, "global_step": 132349, "epoch": 1594} {"train_loss": -23.075681686401367, "global_step": 132350, "epoch": 1594} {"train_loss": -23.13252067565918, "global_step": 132351, "epoch": 1594} {"train_loss": -23.021392822265625, "global_step": 132352, "epoch": 1594} {"train_loss": -22.969154357910156, "global_step": 132353, "epoch": 1594} {"train_loss": -23.01869010925293, "global_step": 132354, "epoch": 1594} {"train_loss": -22.497129440307617, "global_step": 132355, "epoch": 1594} {"train_loss": -22.275821685791016, "global_step": 132356, "epoch": 1594} {"train_loss": -22.853525161743164, "global_step": 132357, "epoch": 1594} {"train_loss": -22.61263656616211, "global_step": 132358, "epoch": 1594} {"train_loss": -22.904287338256836, "global_step": 132359, "epoch": 1594} {"train_loss": -23.143171310424805, "global_step": 132360, "epoch": 1594} {"train_loss": -22.363880157470703, "global_step": 132361, "epoch": 1594} {"train_loss": -23.02779197692871, "global_step": 132362, "epoch": 1594} {"train_loss": -22.82052993774414, "global_step": 132363, "epoch": 1594} {"train_loss": -22.60382080078125, "global_step": 132364, "epoch": 1594} {"train_loss": -22.933155059814453, "global_step": 132365, "epoch": 1594} {"train_loss": -22.64883804321289, "global_step": 132366, "epoch": 1594} {"train_loss": -22.897289276123047, "global_step": 132367, "epoch": 1594} {"train_loss": -22.818557739257812, "global_step": 132368, "epoch": 1594} {"train_loss": -22.86056900024414, "global_step": 132369, "epoch": 1594} {"train_loss": -22.715551376342773, "global_step": 132370, "epoch": 1594} {"train_loss": -22.972631454467773, "global_step": 132371, "epoch": 1594} {"train_loss": -22.954343795776367, "global_step": 132372, "epoch": 1594} {"train_loss": -22.72464370727539, "global_step": 132373, "epoch": 1594} {"train_loss": -22.25461196899414, "global_step": 132374, "epoch": 1594} {"train_loss": -23.003990173339844, "global_step": 132375, "epoch": 1594} {"train_loss": -23.126447677612305, "global_step": 132376, "epoch": 1594} {"train_loss": -22.83896255493164, "global_step": 132377, "epoch": 1594} {"train_loss": -22.88455581665039, "global_step": 132378, "epoch": 1594} {"train_loss": -23.00760269165039, "global_step": 132379, "epoch": 1594} {"train_loss": -22.81490135192871, "global_step": 132380, "epoch": 1594} {"train_loss": -22.801177978515625, "global_step": 132381, "epoch": 1594} {"train_loss": -22.649513244628906, "global_step": 132382, "epoch": 1594} {"train_loss": -22.93688201904297, "global_step": 132383, "epoch": 1594} {"train_loss": -22.817921558058405, "global_step": 132384, "epoch": 1594, "val_loss": 6319104.5} {"train_loss": -21.67473793029785, "global_step": 132385, "epoch": 1595} {"train_loss": -20.73578453063965, "global_step": 132386, "epoch": 1595} {"train_loss": -22.423200607299805, "global_step": 132387, "epoch": 1595} {"train_loss": -21.534086227416992, "global_step": 132388, "epoch": 1595} {"train_loss": -21.486312866210938, "global_step": 132389, "epoch": 1595} {"train_loss": -21.609010696411133, "global_step": 132390, "epoch": 1595} {"train_loss": -21.933256149291992, "global_step": 132391, "epoch": 1595} {"train_loss": -21.72810935974121, "global_step": 132392, "epoch": 1595} {"train_loss": -22.72102928161621, "global_step": 132393, "epoch": 1595} {"train_loss": -22.360876083374023, "global_step": 132394, "epoch": 1595} {"train_loss": -22.2320613861084, "global_step": 132395, "epoch": 1595} {"train_loss": -22.166242599487305, "global_step": 132396, "epoch": 1595} {"train_loss": -22.12306022644043, "global_step": 132397, "epoch": 1595} {"train_loss": -21.980436325073242, "global_step": 132398, "epoch": 1595} {"train_loss": -22.676525115966797, "global_step": 132399, "epoch": 1595} {"train_loss": -22.329605102539062, "global_step": 132400, "epoch": 1595} {"train_loss": -22.25162696838379, "global_step": 132401, "epoch": 1595} {"train_loss": -22.527324676513672, "global_step": 132402, "epoch": 1595} {"train_loss": -22.245981216430664, "global_step": 132403, "epoch": 1595} {"train_loss": -22.646814346313477, "global_step": 132404, "epoch": 1595} {"train_loss": -22.813398361206055, "global_step": 132405, "epoch": 1595} {"train_loss": -22.26497459411621, "global_step": 132406, "epoch": 1595} {"train_loss": -22.55191421508789, "global_step": 132407, "epoch": 1595} {"train_loss": -22.693531036376953, "global_step": 132408, "epoch": 1595} {"train_loss": -22.650636672973633, "global_step": 132409, "epoch": 1595} {"train_loss": -22.950712203979492, "global_step": 132410, "epoch": 1595} {"train_loss": -22.73390007019043, "global_step": 132411, "epoch": 1595} {"train_loss": -22.777433395385742, "global_step": 132412, "epoch": 1595} {"train_loss": -22.80042839050293, "global_step": 132413, "epoch": 1595} {"train_loss": -22.744653701782227, "global_step": 132414, "epoch": 1595} {"train_loss": -22.84202003479004, "global_step": 132415, "epoch": 1595} {"train_loss": -22.623537063598633, "global_step": 132416, "epoch": 1595} {"train_loss": -22.918109893798828, "global_step": 132417, "epoch": 1595} {"train_loss": -22.58527946472168, "global_step": 132418, "epoch": 1595} {"train_loss": -22.664270401000977, "global_step": 132419, "epoch": 1595} {"train_loss": -22.859304428100586, "global_step": 132420, "epoch": 1595} {"train_loss": -22.971973419189453, "global_step": 132421, "epoch": 1595} {"train_loss": -22.9969539642334, "global_step": 132422, "epoch": 1595} {"train_loss": -22.570276260375977, "global_step": 132423, "epoch": 1595} {"train_loss": -22.842397689819336, "global_step": 132424, "epoch": 1595} {"train_loss": -22.637903213500977, "global_step": 132425, "epoch": 1595} {"train_loss": -22.880229949951172, "global_step": 132426, "epoch": 1595} {"train_loss": -22.60877799987793, "global_step": 132427, "epoch": 1595} {"train_loss": -22.900480270385742, "global_step": 132428, "epoch": 1595} {"train_loss": -22.801090240478516, "global_step": 132429, "epoch": 1595} {"train_loss": -22.88614273071289, "global_step": 132430, "epoch": 1595} {"train_loss": -22.848588943481445, "global_step": 132431, "epoch": 1595} {"train_loss": -23.01617431640625, "global_step": 132432, "epoch": 1595} {"train_loss": -23.017545700073242, "global_step": 132433, "epoch": 1595} {"train_loss": -22.61899185180664, "global_step": 132434, "epoch": 1595} {"train_loss": -23.17847442626953, "global_step": 132435, "epoch": 1595} {"train_loss": -23.128238677978516, "global_step": 132436, "epoch": 1595} {"train_loss": -22.82523536682129, "global_step": 132437, "epoch": 1595} {"train_loss": -22.82908058166504, "global_step": 132438, "epoch": 1595} {"train_loss": -23.094711303710938, "global_step": 132439, "epoch": 1595} {"train_loss": -22.898788452148438, "global_step": 132440, "epoch": 1595} {"train_loss": -23.130735397338867, "global_step": 132441, "epoch": 1595} {"train_loss": -23.357559204101562, "global_step": 132442, "epoch": 1595} {"train_loss": -22.59455108642578, "global_step": 132443, "epoch": 1595} {"train_loss": -22.980377197265625, "global_step": 132444, "epoch": 1595} {"train_loss": -22.513525009155273, "global_step": 132445, "epoch": 1595} {"train_loss": -23.058393478393555, "global_step": 132446, "epoch": 1595} {"train_loss": -22.597139358520508, "global_step": 132447, "epoch": 1595} {"train_loss": -22.740676879882812, "global_step": 132448, "epoch": 1595} {"train_loss": -22.37454605102539, "global_step": 132449, "epoch": 1595} {"train_loss": -23.062000274658203, "global_step": 132450, "epoch": 1595} {"train_loss": -22.294397354125977, "global_step": 132451, "epoch": 1595} {"train_loss": -22.615070343017578, "global_step": 132452, "epoch": 1595} {"train_loss": -22.608966827392578, "global_step": 132453, "epoch": 1595} {"train_loss": -22.7525691986084, "global_step": 132454, "epoch": 1595} {"train_loss": -22.69440269470215, "global_step": 132455, "epoch": 1595} {"train_loss": -22.798566818237305, "global_step": 132456, "epoch": 1595} {"train_loss": -23.101205825805664, "global_step": 132457, "epoch": 1595} {"train_loss": -23.209938049316406, "global_step": 132458, "epoch": 1595} {"train_loss": -22.795297622680664, "global_step": 132459, "epoch": 1595} {"train_loss": -22.97357749938965, "global_step": 132460, "epoch": 1595} {"train_loss": -23.108976364135742, "global_step": 132461, "epoch": 1595} {"train_loss": -22.772132873535156, "global_step": 132462, "epoch": 1595} {"train_loss": -23.05903434753418, "global_step": 132463, "epoch": 1595} {"train_loss": -23.01613426208496, "global_step": 132464, "epoch": 1595} {"train_loss": -23.078947067260742, "global_step": 132465, "epoch": 1595} {"train_loss": -22.475051879882812, "global_step": 132466, "epoch": 1595} {"train_loss": -22.63655678622694, "global_step": 132467, "epoch": 1595, "val_loss": 6474028.0} {"train_loss": -22.37456512451172, "global_step": 132468, "epoch": 1596} {"train_loss": -22.27139663696289, "global_step": 132469, "epoch": 1596} {"train_loss": -22.121450424194336, "global_step": 132470, "epoch": 1596} {"train_loss": -22.28011131286621, "global_step": 132471, "epoch": 1596} {"train_loss": -22.68891716003418, "global_step": 132472, "epoch": 1596} {"train_loss": -22.60066032409668, "global_step": 132473, "epoch": 1596} {"train_loss": -21.959096908569336, "global_step": 132474, "epoch": 1596} {"train_loss": -22.288171768188477, "global_step": 132475, "epoch": 1596} {"train_loss": -22.181360244750977, "global_step": 132476, "epoch": 1596} {"train_loss": -22.566368103027344, "global_step": 132477, "epoch": 1596} {"train_loss": -22.87787437438965, "global_step": 132478, "epoch": 1596} {"train_loss": -22.502260208129883, "global_step": 132479, "epoch": 1596} {"train_loss": -22.552270889282227, "global_step": 132480, "epoch": 1596} {"train_loss": -22.458480834960938, "global_step": 132481, "epoch": 1596} {"train_loss": -22.5358943939209, "global_step": 132482, "epoch": 1596} {"train_loss": -22.476016998291016, "global_step": 132483, "epoch": 1596} {"train_loss": -22.061037063598633, "global_step": 132484, "epoch": 1596} {"train_loss": -22.882123947143555, "global_step": 132485, "epoch": 1596} {"train_loss": -22.54899024963379, "global_step": 132486, "epoch": 1596} {"train_loss": -22.770740509033203, "global_step": 132487, "epoch": 1596} {"train_loss": -22.49380874633789, "global_step": 132488, "epoch": 1596} {"train_loss": -22.931476593017578, "global_step": 132489, "epoch": 1596} {"train_loss": -22.3952579498291, "global_step": 132490, "epoch": 1596} {"train_loss": -22.552627563476562, "global_step": 132491, "epoch": 1596} {"train_loss": -22.802051544189453, "global_step": 132492, "epoch": 1596} {"train_loss": -22.895715713500977, "global_step": 132493, "epoch": 1596} {"train_loss": -22.624845504760742, "global_step": 132494, "epoch": 1596} {"train_loss": -22.911701202392578, "global_step": 132495, "epoch": 1596} {"train_loss": -22.969825744628906, "global_step": 132496, "epoch": 1596} {"train_loss": -22.819669723510742, "global_step": 132497, "epoch": 1596} {"train_loss": -23.260208129882812, "global_step": 132498, "epoch": 1596} {"train_loss": -22.805837631225586, "global_step": 132499, "epoch": 1596} {"train_loss": -23.0181941986084, "global_step": 132500, "epoch": 1596} {"train_loss": -22.942197799682617, "global_step": 132501, "epoch": 1596} {"train_loss": -22.306228637695312, "global_step": 132502, "epoch": 1596} {"train_loss": -22.966707229614258, "global_step": 132503, "epoch": 1596} {"train_loss": -23.057968139648438, "global_step": 132504, "epoch": 1596} {"train_loss": -23.265522003173828, "global_step": 132505, "epoch": 1596} {"train_loss": -22.661718368530273, "global_step": 132506, "epoch": 1596} {"train_loss": -22.84549903869629, "global_step": 132507, "epoch": 1596} {"train_loss": -22.790647506713867, "global_step": 132508, "epoch": 1596} {"train_loss": -22.924558639526367, "global_step": 132509, "epoch": 1596} {"train_loss": -22.818347930908203, "global_step": 132510, "epoch": 1596} {"train_loss": -22.99734878540039, "global_step": 132511, "epoch": 1596} {"train_loss": -22.972522735595703, "global_step": 132512, "epoch": 1596} {"train_loss": -23.107046127319336, "global_step": 132513, "epoch": 1596} {"train_loss": -22.689905166625977, "global_step": 132514, "epoch": 1596} {"train_loss": -23.01286506652832, "global_step": 132515, "epoch": 1596} {"train_loss": -23.017831802368164, "global_step": 132516, "epoch": 1596} {"train_loss": -23.347389221191406, "global_step": 132517, "epoch": 1596} {"train_loss": -23.04488182067871, "global_step": 132518, "epoch": 1596} {"train_loss": -23.15781593322754, "global_step": 132519, "epoch": 1596} {"train_loss": -23.166128158569336, "global_step": 132520, "epoch": 1596} {"train_loss": -23.00263023376465, "global_step": 132521, "epoch": 1596} {"train_loss": -23.050352096557617, "global_step": 132522, "epoch": 1596} {"train_loss": -23.141063690185547, "global_step": 132523, "epoch": 1596} {"train_loss": -22.98148536682129, "global_step": 132524, "epoch": 1596} {"train_loss": -22.84111976623535, "global_step": 132525, "epoch": 1596} {"train_loss": -22.59345245361328, "global_step": 132526, "epoch": 1596} {"train_loss": -22.729751586914062, "global_step": 132527, "epoch": 1596} {"train_loss": -23.127479553222656, "global_step": 132528, "epoch": 1596} {"train_loss": -22.813461303710938, "global_step": 132529, "epoch": 1596} {"train_loss": -22.90262222290039, "global_step": 132530, "epoch": 1596} {"train_loss": -23.208791732788086, "global_step": 132531, "epoch": 1596} {"train_loss": -23.086383819580078, "global_step": 132532, "epoch": 1596} {"train_loss": -22.746625900268555, "global_step": 132533, "epoch": 1596} {"train_loss": -22.88389015197754, "global_step": 132534, "epoch": 1596} {"train_loss": -22.586931228637695, "global_step": 132535, "epoch": 1596} {"train_loss": -23.201379776000977, "global_step": 132536, "epoch": 1596} {"train_loss": -22.89253807067871, "global_step": 132537, "epoch": 1596} {"train_loss": -22.642822265625, "global_step": 132538, "epoch": 1596} {"train_loss": -22.774747848510742, "global_step": 132539, "epoch": 1596} {"train_loss": -22.9320125579834, "global_step": 132540, "epoch": 1596} {"train_loss": -22.703033447265625, "global_step": 132541, "epoch": 1596} {"train_loss": -22.753076553344727, "global_step": 132542, "epoch": 1596} {"train_loss": -23.02141571044922, "global_step": 132543, "epoch": 1596} {"train_loss": -22.54849624633789, "global_step": 132544, "epoch": 1596} {"train_loss": -22.84732437133789, "global_step": 132545, "epoch": 1596} {"train_loss": -22.877479553222656, "global_step": 132546, "epoch": 1596} {"train_loss": -22.52511215209961, "global_step": 132547, "epoch": 1596} {"train_loss": -22.86537742614746, "global_step": 132548, "epoch": 1596} {"train_loss": -22.77674102783203, "global_step": 132549, "epoch": 1596} {"train_loss": -22.767010217689606, "global_step": 132550, "epoch": 1596, "val_loss": 6139254.0} {"train_loss": -21.986440658569336, "global_step": 132551, "epoch": 1597} {"train_loss": -21.79072380065918, "global_step": 132552, "epoch": 1597} {"train_loss": -21.961654663085938, "global_step": 132553, "epoch": 1597} {"train_loss": -21.940122604370117, "global_step": 132554, "epoch": 1597} {"train_loss": -21.624990463256836, "global_step": 132555, "epoch": 1597} {"train_loss": -22.130279541015625, "global_step": 132556, "epoch": 1597} {"train_loss": -22.490751266479492, "global_step": 132557, "epoch": 1597} {"train_loss": -22.541101455688477, "global_step": 132558, "epoch": 1597} {"train_loss": -22.23390007019043, "global_step": 132559, "epoch": 1597} {"train_loss": -22.24782943725586, "global_step": 132560, "epoch": 1597} {"train_loss": -22.460214614868164, "global_step": 132561, "epoch": 1597} {"train_loss": -21.93082618713379, "global_step": 132562, "epoch": 1597} {"train_loss": -22.362899780273438, "global_step": 132563, "epoch": 1597} {"train_loss": -22.38232421875, "global_step": 132564, "epoch": 1597} {"train_loss": -22.48737335205078, "global_step": 132565, "epoch": 1597} {"train_loss": -22.54669189453125, "global_step": 132566, "epoch": 1597} {"train_loss": -22.031652450561523, "global_step": 132567, "epoch": 1597} {"train_loss": -22.437646865844727, "global_step": 132568, "epoch": 1597} {"train_loss": -22.531394958496094, "global_step": 132569, "epoch": 1597} {"train_loss": -22.406553268432617, "global_step": 132570, "epoch": 1597} {"train_loss": -22.59677505493164, "global_step": 132571, "epoch": 1597} {"train_loss": -22.63835334777832, "global_step": 132572, "epoch": 1597} {"train_loss": -22.8890323638916, "global_step": 132573, "epoch": 1597} {"train_loss": -22.745473861694336, "global_step": 132574, "epoch": 1597} {"train_loss": -22.927871704101562, "global_step": 132575, "epoch": 1597} {"train_loss": -22.45143699645996, "global_step": 132576, "epoch": 1597} {"train_loss": -22.78565216064453, "global_step": 132577, "epoch": 1597} {"train_loss": -23.10430335998535, "global_step": 132578, "epoch": 1597} {"train_loss": -22.626895904541016, "global_step": 132579, "epoch": 1597} {"train_loss": -22.58704948425293, "global_step": 132580, "epoch": 1597} {"train_loss": -22.868783950805664, "global_step": 132581, "epoch": 1597} {"train_loss": -22.61274528503418, "global_step": 132582, "epoch": 1597} {"train_loss": -22.5498046875, "global_step": 132583, "epoch": 1597} {"train_loss": -23.1634578704834, "global_step": 132584, "epoch": 1597} {"train_loss": -22.79275894165039, "global_step": 132585, "epoch": 1597} {"train_loss": -22.61867332458496, "global_step": 132586, "epoch": 1597} {"train_loss": -23.02081871032715, "global_step": 132587, "epoch": 1597} {"train_loss": -22.763547897338867, "global_step": 132588, "epoch": 1597} {"train_loss": -23.323305130004883, "global_step": 132589, "epoch": 1597} {"train_loss": -22.81770896911621, "global_step": 132590, "epoch": 1597} {"train_loss": -22.618986129760742, "global_step": 132591, "epoch": 1597} {"train_loss": -22.30243682861328, "global_step": 132592, "epoch": 1597} {"train_loss": -22.979238510131836, "global_step": 132593, "epoch": 1597} {"train_loss": -23.020849227905273, "global_step": 132594, "epoch": 1597} {"train_loss": -22.64091682434082, "global_step": 132595, "epoch": 1597} {"train_loss": -23.1286678314209, "global_step": 132596, "epoch": 1597} {"train_loss": -23.070159912109375, "global_step": 132597, "epoch": 1597} {"train_loss": -22.894269943237305, "global_step": 132598, "epoch": 1597} {"train_loss": -22.561182022094727, "global_step": 132599, "epoch": 1597} {"train_loss": -22.905420303344727, "global_step": 132600, "epoch": 1597} {"train_loss": -22.831085205078125, "global_step": 132601, "epoch": 1597} {"train_loss": -22.835973739624023, "global_step": 132602, "epoch": 1597} {"train_loss": -22.838293075561523, "global_step": 132603, "epoch": 1597} {"train_loss": -22.84422492980957, "global_step": 132604, "epoch": 1597} {"train_loss": -23.059968948364258, "global_step": 132605, "epoch": 1597} {"train_loss": -22.82670021057129, "global_step": 132606, "epoch": 1597} {"train_loss": -22.436275482177734, "global_step": 132607, "epoch": 1597} {"train_loss": -23.194866180419922, "global_step": 132608, "epoch": 1597} {"train_loss": -22.877912521362305, "global_step": 132609, "epoch": 1597} {"train_loss": -23.024991989135742, "global_step": 132610, "epoch": 1597} {"train_loss": -22.950925827026367, "global_step": 132611, "epoch": 1597} {"train_loss": -22.789194107055664, "global_step": 132612, "epoch": 1597} {"train_loss": -22.579578399658203, "global_step": 132613, "epoch": 1597} {"train_loss": -23.128524780273438, "global_step": 132614, "epoch": 1597} {"train_loss": -22.76740264892578, "global_step": 132615, "epoch": 1597} {"train_loss": -23.085241317749023, "global_step": 132616, "epoch": 1597} {"train_loss": -23.030691146850586, "global_step": 132617, "epoch": 1597} {"train_loss": -22.71636199951172, "global_step": 132618, "epoch": 1597} {"train_loss": -22.784772872924805, "global_step": 132619, "epoch": 1597} {"train_loss": -23.171493530273438, "global_step": 132620, "epoch": 1597} {"train_loss": -22.68560218811035, "global_step": 132621, "epoch": 1597} {"train_loss": -23.159488677978516, "global_step": 132622, "epoch": 1597} {"train_loss": -22.70277976989746, "global_step": 132623, "epoch": 1597} {"train_loss": -22.581924438476562, "global_step": 132624, "epoch": 1597} {"train_loss": -22.59733009338379, "global_step": 132625, "epoch": 1597} {"train_loss": -22.858564376831055, "global_step": 132626, "epoch": 1597} {"train_loss": -22.7072811126709, "global_step": 132627, "epoch": 1597} {"train_loss": -23.03302574157715, "global_step": 132628, "epoch": 1597} {"train_loss": -22.889089584350586, "global_step": 132629, "epoch": 1597} {"train_loss": -22.737274169921875, "global_step": 132630, "epoch": 1597} {"train_loss": -22.94354820251465, "global_step": 132631, "epoch": 1597} {"train_loss": -22.869892120361328, "global_step": 132632, "epoch": 1597} {"train_loss": -22.69113322338426, "global_step": 132633, "epoch": 1597, "val_loss": 6291378.0} {"train_loss": -22.6359920501709, "global_step": 132634, "epoch": 1598} {"train_loss": -22.17991065979004, "global_step": 132635, "epoch": 1598} {"train_loss": -22.763675689697266, "global_step": 132636, "epoch": 1598} {"train_loss": -22.05559730529785, "global_step": 132637, "epoch": 1598} {"train_loss": -22.681583404541016, "global_step": 132638, "epoch": 1598} {"train_loss": -22.758861541748047, "global_step": 132639, "epoch": 1598} {"train_loss": -22.740676879882812, "global_step": 132640, "epoch": 1598} {"train_loss": -22.82869529724121, "global_step": 132641, "epoch": 1598} {"train_loss": -22.63349723815918, "global_step": 132642, "epoch": 1598} {"train_loss": -22.87125587463379, "global_step": 132643, "epoch": 1598} {"train_loss": -22.669769287109375, "global_step": 132644, "epoch": 1598} {"train_loss": -22.50119972229004, "global_step": 132645, "epoch": 1598} {"train_loss": -22.940689086914062, "global_step": 132646, "epoch": 1598} {"train_loss": -22.79849624633789, "global_step": 132647, "epoch": 1598} {"train_loss": -22.579137802124023, "global_step": 132648, "epoch": 1598} {"train_loss": -22.699607849121094, "global_step": 132649, "epoch": 1598} {"train_loss": -22.53481101989746, "global_step": 132650, "epoch": 1598} {"train_loss": -22.92131996154785, "global_step": 132651, "epoch": 1598} {"train_loss": -22.87744140625, "global_step": 132652, "epoch": 1598} {"train_loss": -23.163808822631836, "global_step": 132653, "epoch": 1598} {"train_loss": -23.003427505493164, "global_step": 132654, "epoch": 1598} {"train_loss": -22.845544815063477, "global_step": 132655, "epoch": 1598} {"train_loss": -22.519922256469727, "global_step": 132656, "epoch": 1598} {"train_loss": -22.344722747802734, "global_step": 132657, "epoch": 1598} {"train_loss": -22.850479125976562, "global_step": 132658, "epoch": 1598} {"train_loss": -22.37222671508789, "global_step": 132659, "epoch": 1598} {"train_loss": -22.521268844604492, "global_step": 132660, "epoch": 1598} {"train_loss": -22.896509170532227, "global_step": 132661, "epoch": 1598} {"train_loss": -22.799360275268555, "global_step": 132662, "epoch": 1598} {"train_loss": -22.45449447631836, "global_step": 132663, "epoch": 1598} {"train_loss": -22.768692016601562, "global_step": 132664, "epoch": 1598} {"train_loss": -22.714778900146484, "global_step": 132665, "epoch": 1598} {"train_loss": -22.792234420776367, "global_step": 132666, "epoch": 1598} {"train_loss": -23.147563934326172, "global_step": 132667, "epoch": 1598} {"train_loss": -23.078115463256836, "global_step": 132668, "epoch": 1598} {"train_loss": -23.12750244140625, "global_step": 132669, "epoch": 1598} {"train_loss": -22.656293869018555, "global_step": 132670, "epoch": 1598} {"train_loss": -22.86025047302246, "global_step": 132671, "epoch": 1598} {"train_loss": -22.993284225463867, "global_step": 132672, "epoch": 1598} {"train_loss": -22.8598690032959, "global_step": 132673, "epoch": 1598} {"train_loss": -22.98036766052246, "global_step": 132674, "epoch": 1598} {"train_loss": -23.089811325073242, "global_step": 132675, "epoch": 1598} {"train_loss": -22.807884216308594, "global_step": 132676, "epoch": 1598} {"train_loss": -23.047033309936523, "global_step": 132677, "epoch": 1598} {"train_loss": -22.877920150756836, "global_step": 132678, "epoch": 1598} {"train_loss": -23.185354232788086, "global_step": 132679, "epoch": 1598} {"train_loss": -22.857053756713867, "global_step": 132680, "epoch": 1598} {"train_loss": -22.754358291625977, "global_step": 132681, "epoch": 1598} {"train_loss": -22.765893936157227, "global_step": 132682, "epoch": 1598} {"train_loss": -23.2353458404541, "global_step": 132683, "epoch": 1598} {"train_loss": -22.743383407592773, "global_step": 132684, "epoch": 1598} {"train_loss": -23.129491806030273, "global_step": 132685, "epoch": 1598} {"train_loss": -23.227787017822266, "global_step": 132686, "epoch": 1598} {"train_loss": -23.011123657226562, "global_step": 132687, "epoch": 1598} {"train_loss": -22.888378143310547, "global_step": 132688, "epoch": 1598} {"train_loss": -22.885608673095703, "global_step": 132689, "epoch": 1598} {"train_loss": -22.89656639099121, "global_step": 132690, "epoch": 1598} {"train_loss": -22.760786056518555, "global_step": 132691, "epoch": 1598} {"train_loss": -22.878454208374023, "global_step": 132692, "epoch": 1598} {"train_loss": -23.065824508666992, "global_step": 132693, "epoch": 1598} {"train_loss": -23.115720748901367, "global_step": 132694, "epoch": 1598} {"train_loss": -22.92255210876465, "global_step": 132695, "epoch": 1598} {"train_loss": -22.935317993164062, "global_step": 132696, "epoch": 1598} {"train_loss": -22.705289840698242, "global_step": 132697, "epoch": 1598} {"train_loss": -22.802818298339844, "global_step": 132698, "epoch": 1598} {"train_loss": -23.038007736206055, "global_step": 132699, "epoch": 1598} {"train_loss": -22.825454711914062, "global_step": 132700, "epoch": 1598} {"train_loss": -22.830703735351562, "global_step": 132701, "epoch": 1598} {"train_loss": -22.85468864440918, "global_step": 132702, "epoch": 1598} {"train_loss": -22.798654556274414, "global_step": 132703, "epoch": 1598} {"train_loss": -23.12541961669922, "global_step": 132704, "epoch": 1598} {"train_loss": -22.730178833007812, "global_step": 132705, "epoch": 1598} {"train_loss": -22.855958938598633, "global_step": 132706, "epoch": 1598} {"train_loss": -22.797876358032227, "global_step": 132707, "epoch": 1598} {"train_loss": -23.061737060546875, "global_step": 132708, "epoch": 1598} {"train_loss": -22.870710372924805, "global_step": 132709, "epoch": 1598} {"train_loss": -22.95285415649414, "global_step": 132710, "epoch": 1598} {"train_loss": -22.550161361694336, "global_step": 132711, "epoch": 1598} {"train_loss": -22.622074127197266, "global_step": 132712, "epoch": 1598} {"train_loss": -22.879531860351562, "global_step": 132713, "epoch": 1598} {"train_loss": -23.141653060913086, "global_step": 132714, "epoch": 1598} {"train_loss": -22.753604888916016, "global_step": 132715, "epoch": 1598} {"train_loss": -22.819226827966162, "global_step": 132716, "epoch": 1598, "val_loss": 6461019.0} {"train_loss": -20.75668716430664, "global_step": 132717, "epoch": 1599} {"train_loss": -21.742483139038086, "global_step": 132718, "epoch": 1599} {"train_loss": -22.0273380279541, "global_step": 132719, "epoch": 1599} {"train_loss": -22.598241806030273, "global_step": 132720, "epoch": 1599} {"train_loss": -22.65480613708496, "global_step": 132721, "epoch": 1599} {"train_loss": -22.182098388671875, "global_step": 132722, "epoch": 1599} {"train_loss": -22.35550880432129, "global_step": 132723, "epoch": 1599} {"train_loss": -22.711774826049805, "global_step": 132724, "epoch": 1599} {"train_loss": -22.024751663208008, "global_step": 132725, "epoch": 1599} {"train_loss": -22.405031204223633, "global_step": 132726, "epoch": 1599} {"train_loss": -22.384353637695312, "global_step": 132727, "epoch": 1599} {"train_loss": -22.333890914916992, "global_step": 132728, "epoch": 1599} {"train_loss": -22.5591983795166, "global_step": 132729, "epoch": 1599} {"train_loss": -22.321338653564453, "global_step": 132730, "epoch": 1599} {"train_loss": -22.232131958007812, "global_step": 132731, "epoch": 1599} {"train_loss": -22.858463287353516, "global_step": 132732, "epoch": 1599} {"train_loss": -22.265213012695312, "global_step": 132733, "epoch": 1599} {"train_loss": -22.470596313476562, "global_step": 132734, "epoch": 1599} {"train_loss": -22.71581268310547, "global_step": 132735, "epoch": 1599} {"train_loss": -22.748987197875977, "global_step": 132736, "epoch": 1599} {"train_loss": -22.653505325317383, "global_step": 132737, "epoch": 1599} {"train_loss": -22.36871337890625, "global_step": 132738, "epoch": 1599} {"train_loss": -22.54335594177246, "global_step": 132739, "epoch": 1599} {"train_loss": -22.54981803894043, "global_step": 132740, "epoch": 1599} {"train_loss": -22.637014389038086, "global_step": 132741, "epoch": 1599} {"train_loss": -22.8441104888916, "global_step": 132742, "epoch": 1599} {"train_loss": -22.774364471435547, "global_step": 132743, "epoch": 1599} {"train_loss": -23.1726131439209, "global_step": 132744, "epoch": 1599} {"train_loss": -22.677371978759766, "global_step": 132745, "epoch": 1599} {"train_loss": -23.071043014526367, "global_step": 132746, "epoch": 1599} {"train_loss": -22.2371826171875, "global_step": 132747, "epoch": 1599} {"train_loss": -22.515689849853516, "global_step": 132748, "epoch": 1599} {"train_loss": -22.851947784423828, "global_step": 132749, "epoch": 1599} {"train_loss": -22.778106689453125, "global_step": 132750, "epoch": 1599} {"train_loss": -22.691022872924805, "global_step": 132751, "epoch": 1599} {"train_loss": -22.834081649780273, "global_step": 132752, "epoch": 1599} {"train_loss": -22.7359676361084, "global_step": 132753, "epoch": 1599} {"train_loss": -22.862607955932617, "global_step": 132754, "epoch": 1599} {"train_loss": -22.560060501098633, "global_step": 132755, "epoch": 1599} {"train_loss": -23.005615234375, "global_step": 132756, "epoch": 1599} {"train_loss": -22.916885375976562, "global_step": 132757, "epoch": 1599} {"train_loss": -22.835739135742188, "global_step": 132758, "epoch": 1599} {"train_loss": -22.89810562133789, "global_step": 132759, "epoch": 1599} {"train_loss": -22.843252182006836, "global_step": 132760, "epoch": 1599} {"train_loss": -23.016845703125, "global_step": 132761, "epoch": 1599} {"train_loss": -22.553335189819336, "global_step": 132762, "epoch": 1599} {"train_loss": -23.07056427001953, "global_step": 132763, "epoch": 1599} {"train_loss": -22.994050979614258, "global_step": 132764, "epoch": 1599} {"train_loss": -23.08159637451172, "global_step": 132765, "epoch": 1599} {"train_loss": -23.32916831970215, "global_step": 132766, "epoch": 1599} {"train_loss": -22.50102424621582, "global_step": 132767, "epoch": 1599} {"train_loss": -22.79725456237793, "global_step": 132768, "epoch": 1599} {"train_loss": -23.11280632019043, "global_step": 132769, "epoch": 1599} {"train_loss": -23.010496139526367, "global_step": 132770, "epoch": 1599} {"train_loss": -22.70778465270996, "global_step": 132771, "epoch": 1599} {"train_loss": -23.11736488342285, "global_step": 132772, "epoch": 1599} {"train_loss": -23.21703338623047, "global_step": 132773, "epoch": 1599} {"train_loss": -22.81023406982422, "global_step": 132774, "epoch": 1599} {"train_loss": -22.766498565673828, "global_step": 132775, "epoch": 1599} {"train_loss": -22.58489990234375, "global_step": 132776, "epoch": 1599} {"train_loss": -22.655094146728516, "global_step": 132777, "epoch": 1599} {"train_loss": -22.82996368408203, "global_step": 132778, "epoch": 1599} {"train_loss": -22.855100631713867, "global_step": 132779, "epoch": 1599} {"train_loss": -23.051218032836914, "global_step": 132780, "epoch": 1599} {"train_loss": -22.795433044433594, "global_step": 132781, "epoch": 1599} {"train_loss": -22.79914665222168, "global_step": 132782, "epoch": 1599} {"train_loss": -23.1239013671875, "global_step": 132783, "epoch": 1599} {"train_loss": -22.73915672302246, "global_step": 132784, "epoch": 1599} {"train_loss": -22.426422119140625, "global_step": 132785, "epoch": 1599} {"train_loss": -22.783432006835938, "global_step": 132786, "epoch": 1599} {"train_loss": -23.029285430908203, "global_step": 132787, "epoch": 1599} {"train_loss": -23.14445686340332, "global_step": 132788, "epoch": 1599} {"train_loss": -22.76226806640625, "global_step": 132789, "epoch": 1599} {"train_loss": -22.833072662353516, "global_step": 132790, "epoch": 1599} {"train_loss": -23.187152862548828, "global_step": 132791, "epoch": 1599} {"train_loss": -22.795698165893555, "global_step": 132792, "epoch": 1599} {"train_loss": -22.99068832397461, "global_step": 132793, "epoch": 1599} {"train_loss": -22.88328742980957, "global_step": 132794, "epoch": 1599} {"train_loss": -22.862524032592773, "global_step": 132795, "epoch": 1599} {"train_loss": -22.30965232849121, "global_step": 132796, "epoch": 1599} {"train_loss": -22.969125747680664, "global_step": 132797, "epoch": 1599} {"train_loss": -22.61920738220215, "global_step": 132798, "epoch": 1599} {"train_loss": -22.70798076491758, "global_step": 132799, "epoch": 1599, "val_loss": 6309560.0} {"train_loss": -22.594812393188477, "global_step": 132800, "epoch": 1600} {"train_loss": -22.846479415893555, "global_step": 132801, "epoch": 1600} {"train_loss": -22.56331443786621, "global_step": 132802, "epoch": 1600} {"train_loss": -22.765745162963867, "global_step": 132803, "epoch": 1600} {"train_loss": -22.810134887695312, "global_step": 132804, "epoch": 1600} {"train_loss": -22.72464942932129, "global_step": 132805, "epoch": 1600} {"train_loss": -22.576522827148438, "global_step": 132806, "epoch": 1600} {"train_loss": -22.743568420410156, "global_step": 132807, "epoch": 1600} {"train_loss": -22.72383689880371, "global_step": 132808, "epoch": 1600} {"train_loss": -22.76268196105957, "global_step": 132809, "epoch": 1600} {"train_loss": -22.870689392089844, "global_step": 132810, "epoch": 1600} {"train_loss": -22.654346466064453, "global_step": 132811, "epoch": 1600} {"train_loss": -22.493671417236328, "global_step": 132812, "epoch": 1600} {"train_loss": -22.48145866394043, "global_step": 132813, "epoch": 1600} {"train_loss": -22.18029022216797, "global_step": 132814, "epoch": 1600} {"train_loss": -22.459524154663086, "global_step": 132815, "epoch": 1600} {"train_loss": -22.517385482788086, "global_step": 132816, "epoch": 1600} {"train_loss": -22.630908966064453, "global_step": 132817, "epoch": 1600} {"train_loss": -22.685726165771484, "global_step": 132818, "epoch": 1600} {"train_loss": -22.608762741088867, "global_step": 132819, "epoch": 1600} {"train_loss": -22.5848331451416, "global_step": 132820, "epoch": 1600} {"train_loss": -22.746984481811523, "global_step": 132821, "epoch": 1600} {"train_loss": -22.742156982421875, "global_step": 132822, "epoch": 1600} {"train_loss": -22.769773483276367, "global_step": 132823, "epoch": 1600} {"train_loss": -22.546871185302734, "global_step": 132824, "epoch": 1600} {"train_loss": -22.70974349975586, "global_step": 132825, "epoch": 1600} {"train_loss": -22.65604591369629, "global_step": 132826, "epoch": 1600} {"train_loss": -22.634143829345703, "global_step": 132827, "epoch": 1600} {"train_loss": -22.720399856567383, "global_step": 132828, "epoch": 1600} {"train_loss": -22.73457908630371, "global_step": 132829, "epoch": 1600} {"train_loss": -22.959354400634766, "global_step": 132830, "epoch": 1600} {"train_loss": -23.00143051147461, "global_step": 132831, "epoch": 1600} {"train_loss": -22.806364059448242, "global_step": 132832, "epoch": 1600} {"train_loss": -22.837106704711914, "global_step": 132833, "epoch": 1600} {"train_loss": -23.104482650756836, "global_step": 132834, "epoch": 1600} {"train_loss": -23.046178817749023, "global_step": 132835, "epoch": 1600} {"train_loss": -23.164533615112305, "global_step": 132836, "epoch": 1600} {"train_loss": -22.93759536743164, "global_step": 132837, "epoch": 1600} {"train_loss": -22.939809799194336, "global_step": 132838, "epoch": 1600} {"train_loss": -23.133792877197266, "global_step": 132839, "epoch": 1600} {"train_loss": -22.71550941467285, "global_step": 132840, "epoch": 1600} {"train_loss": -22.79888916015625, "global_step": 132841, "epoch": 1600} {"train_loss": -23.015701293945312, "global_step": 132842, "epoch": 1600} {"train_loss": -22.861013412475586, "global_step": 132843, "epoch": 1600} {"train_loss": -22.658063888549805, "global_step": 132844, "epoch": 1600} {"train_loss": -22.808401107788086, "global_step": 132845, "epoch": 1600} {"train_loss": -22.755245208740234, "global_step": 132846, "epoch": 1600} {"train_loss": -23.000951766967773, "global_step": 132847, "epoch": 1600} {"train_loss": -22.983020782470703, "global_step": 132848, "epoch": 1600} {"train_loss": -22.64803123474121, "global_step": 132849, "epoch": 1600} {"train_loss": -22.955305099487305, "global_step": 132850, "epoch": 1600} {"train_loss": -23.201648712158203, "global_step": 132851, "epoch": 1600} {"train_loss": -22.960302352905273, "global_step": 132852, "epoch": 1600} {"train_loss": -23.140579223632812, "global_step": 132853, "epoch": 1600} {"train_loss": -23.08846664428711, "global_step": 132854, "epoch": 1600} {"train_loss": -23.142698287963867, "global_step": 132855, "epoch": 1600} {"train_loss": -22.895145416259766, "global_step": 132856, "epoch": 1600} {"train_loss": -22.965837478637695, "global_step": 132857, "epoch": 1600} {"train_loss": -22.744474411010742, "global_step": 132858, "epoch": 1600} {"train_loss": -23.08436393737793, "global_step": 132859, "epoch": 1600} {"train_loss": -22.998504638671875, "global_step": 132860, "epoch": 1600} {"train_loss": -22.6192626953125, "global_step": 132861, "epoch": 1600} {"train_loss": -22.994983673095703, "global_step": 132862, "epoch": 1600} {"train_loss": -23.10563850402832, "global_step": 132863, "epoch": 1600} {"train_loss": -22.76375389099121, "global_step": 132864, "epoch": 1600} {"train_loss": -22.478296279907227, "global_step": 132865, "epoch": 1600} {"train_loss": -22.64307975769043, "global_step": 132866, "epoch": 1600} {"train_loss": -23.197587966918945, "global_step": 132867, "epoch": 1600} {"train_loss": -22.912513732910156, "global_step": 132868, "epoch": 1600} {"train_loss": -22.95244026184082, "global_step": 132869, "epoch": 1600} {"train_loss": -23.095869064331055, "global_step": 132870, "epoch": 1600} {"train_loss": -22.860158920288086, "global_step": 132871, "epoch": 1600} {"train_loss": -23.09552764892578, "global_step": 132872, "epoch": 1600} {"train_loss": -22.716751098632812, "global_step": 132873, "epoch": 1600} {"train_loss": -22.759506225585938, "global_step": 132874, "epoch": 1600} {"train_loss": -23.08786964416504, "global_step": 132875, "epoch": 1600} {"train_loss": -22.81058120727539, "global_step": 132876, "epoch": 1600} {"train_loss": -23.0638427734375, "global_step": 132877, "epoch": 1600} {"train_loss": -22.875003814697266, "global_step": 132878, "epoch": 1600} {"train_loss": -22.93821144104004, "global_step": 132879, "epoch": 1600} {"train_loss": -23.019872665405273, "global_step": 132880, "epoch": 1600} {"train_loss": -22.67160415649414, "global_step": 132881, "epoch": 1600} {"train_loss": -22.82534930217697, "global_step": 132882, "epoch": 1600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6238128.0} {"train_loss": -22.60076141357422, "global_step": 132883, "epoch": 1601} {"train_loss": -22.464567184448242, "global_step": 132884, "epoch": 1601} {"train_loss": -22.324556350708008, "global_step": 132885, "epoch": 1601} {"train_loss": -21.96860122680664, "global_step": 132886, "epoch": 1601} {"train_loss": -22.61077880859375, "global_step": 132887, "epoch": 1601} {"train_loss": -22.133304595947266, "global_step": 132888, "epoch": 1601} {"train_loss": -22.279203414916992, "global_step": 132889, "epoch": 1601} {"train_loss": -22.3619384765625, "global_step": 132890, "epoch": 1601} {"train_loss": -22.6571102142334, "global_step": 132891, "epoch": 1601} {"train_loss": -22.480777740478516, "global_step": 132892, "epoch": 1601} {"train_loss": -22.35186767578125, "global_step": 132893, "epoch": 1601} {"train_loss": -22.605985641479492, "global_step": 132894, "epoch": 1601} {"train_loss": -22.396642684936523, "global_step": 132895, "epoch": 1601} {"train_loss": -23.009265899658203, "global_step": 132896, "epoch": 1601} {"train_loss": -22.603723526000977, "global_step": 132897, "epoch": 1601} {"train_loss": -22.213754653930664, "global_step": 132898, "epoch": 1601} {"train_loss": -23.00725746154785, "global_step": 132899, "epoch": 1601} {"train_loss": -22.733503341674805, "global_step": 132900, "epoch": 1601} {"train_loss": -22.60173225402832, "global_step": 132901, "epoch": 1601} {"train_loss": -22.779502868652344, "global_step": 132902, "epoch": 1601} {"train_loss": -22.50636863708496, "global_step": 132903, "epoch": 1601} {"train_loss": -22.55782127380371, "global_step": 132904, "epoch": 1601} {"train_loss": -22.616453170776367, "global_step": 132905, "epoch": 1601} {"train_loss": -22.919506072998047, "global_step": 132906, "epoch": 1601} {"train_loss": -22.786165237426758, "global_step": 132907, "epoch": 1601} {"train_loss": -22.595117568969727, "global_step": 132908, "epoch": 1601} {"train_loss": -23.126821517944336, "global_step": 132909, "epoch": 1601} {"train_loss": -22.694713592529297, "global_step": 132910, "epoch": 1601} {"train_loss": -22.913330078125, "global_step": 132911, "epoch": 1601} {"train_loss": -22.88143539428711, "global_step": 132912, "epoch": 1601} {"train_loss": -22.76515007019043, "global_step": 132913, "epoch": 1601} {"train_loss": -23.185075759887695, "global_step": 132914, "epoch": 1601} {"train_loss": -22.88637351989746, "global_step": 132915, "epoch": 1601} {"train_loss": -22.863576889038086, "global_step": 132916, "epoch": 1601} {"train_loss": -23.062475204467773, "global_step": 132917, "epoch": 1601} {"train_loss": -22.630573272705078, "global_step": 132918, "epoch": 1601} {"train_loss": -22.972745895385742, "global_step": 132919, "epoch": 1601} {"train_loss": -22.55649757385254, "global_step": 132920, "epoch": 1601} {"train_loss": -22.95880889892578, "global_step": 132921, "epoch": 1601} {"train_loss": -22.440649032592773, "global_step": 132922, "epoch": 1601} {"train_loss": -22.607641220092773, "global_step": 132923, "epoch": 1601} {"train_loss": -22.734790802001953, "global_step": 132924, "epoch": 1601} {"train_loss": -22.9138126373291, "global_step": 132925, "epoch": 1601} {"train_loss": -22.599374771118164, "global_step": 132926, "epoch": 1601} {"train_loss": -22.88527488708496, "global_step": 132927, "epoch": 1601} {"train_loss": -22.91371726989746, "global_step": 132928, "epoch": 1601} {"train_loss": -23.145811080932617, "global_step": 132929, "epoch": 1601} {"train_loss": -22.72993278503418, "global_step": 132930, "epoch": 1601} {"train_loss": -22.901809692382812, "global_step": 132931, "epoch": 1601} {"train_loss": -22.716562271118164, "global_step": 132932, "epoch": 1601} {"train_loss": -23.024595260620117, "global_step": 132933, "epoch": 1601} {"train_loss": -22.64687156677246, "global_step": 132934, "epoch": 1601} {"train_loss": -23.28584861755371, "global_step": 132935, "epoch": 1601} {"train_loss": -22.835987091064453, "global_step": 132936, "epoch": 1601} {"train_loss": -23.035932540893555, "global_step": 132937, "epoch": 1601} {"train_loss": -22.970903396606445, "global_step": 132938, "epoch": 1601} {"train_loss": -22.64974021911621, "global_step": 132939, "epoch": 1601} {"train_loss": -22.78413200378418, "global_step": 132940, "epoch": 1601} {"train_loss": -23.27872657775879, "global_step": 132941, "epoch": 1601} {"train_loss": -22.87153434753418, "global_step": 132942, "epoch": 1601} {"train_loss": -22.77382469177246, "global_step": 132943, "epoch": 1601} {"train_loss": -22.787473678588867, "global_step": 132944, "epoch": 1601} {"train_loss": -22.735759735107422, "global_step": 132945, "epoch": 1601} {"train_loss": -23.015918731689453, "global_step": 132946, "epoch": 1601} {"train_loss": -23.181974411010742, "global_step": 132947, "epoch": 1601} {"train_loss": -22.550079345703125, "global_step": 132948, "epoch": 1601} {"train_loss": -22.702917098999023, "global_step": 132949, "epoch": 1601} {"train_loss": -22.913084030151367, "global_step": 132950, "epoch": 1601} {"train_loss": -22.828927993774414, "global_step": 132951, "epoch": 1601} {"train_loss": -22.819509506225586, "global_step": 132952, "epoch": 1601} {"train_loss": -22.901901245117188, "global_step": 132953, "epoch": 1601} {"train_loss": -22.892663955688477, "global_step": 132954, "epoch": 1601} {"train_loss": -22.843326568603516, "global_step": 132955, "epoch": 1601} {"train_loss": -22.87845230102539, "global_step": 132956, "epoch": 1601} {"train_loss": -22.992454528808594, "global_step": 132957, "epoch": 1601} {"train_loss": -22.94858169555664, "global_step": 132958, "epoch": 1601} {"train_loss": -23.1760311126709, "global_step": 132959, "epoch": 1601} {"train_loss": -23.085052490234375, "global_step": 132960, "epoch": 1601} {"train_loss": -22.87752914428711, "global_step": 132961, "epoch": 1601} {"train_loss": -23.31642723083496, "global_step": 132962, "epoch": 1601} {"train_loss": -23.028039932250977, "global_step": 132963, "epoch": 1601} {"train_loss": -23.313629150390625, "global_step": 132964, "epoch": 1601} {"train_loss": -22.80863150631089, "global_step": 132965, "epoch": 1601, "val_loss": 6275210.0} {"train_loss": -22.031234741210938, "global_step": 132966, "epoch": 1602} {"train_loss": -22.6541748046875, "global_step": 132967, "epoch": 1602} {"train_loss": -22.138452529907227, "global_step": 132968, "epoch": 1602} {"train_loss": -22.34541893005371, "global_step": 132969, "epoch": 1602} {"train_loss": -22.50298500061035, "global_step": 132970, "epoch": 1602} {"train_loss": -22.63077163696289, "global_step": 132971, "epoch": 1602} {"train_loss": -22.480514526367188, "global_step": 132972, "epoch": 1602} {"train_loss": -22.450536727905273, "global_step": 132973, "epoch": 1602} {"train_loss": -22.429086685180664, "global_step": 132974, "epoch": 1602} {"train_loss": -22.670106887817383, "global_step": 132975, "epoch": 1602} {"train_loss": -22.660802841186523, "global_step": 132976, "epoch": 1602} {"train_loss": -22.59235954284668, "global_step": 132977, "epoch": 1602} {"train_loss": -22.707517623901367, "global_step": 132978, "epoch": 1602} {"train_loss": -22.670806884765625, "global_step": 132979, "epoch": 1602} {"train_loss": -22.630266189575195, "global_step": 132980, "epoch": 1602} {"train_loss": -22.346845626831055, "global_step": 132981, "epoch": 1602} {"train_loss": -22.692350387573242, "global_step": 132982, "epoch": 1602} {"train_loss": -22.783273696899414, "global_step": 132983, "epoch": 1602} {"train_loss": -23.214675903320312, "global_step": 132984, "epoch": 1602} {"train_loss": -22.948795318603516, "global_step": 132985, "epoch": 1602} {"train_loss": -22.54493522644043, "global_step": 132986, "epoch": 1602} {"train_loss": -22.81208610534668, "global_step": 132987, "epoch": 1602} {"train_loss": -23.112056732177734, "global_step": 132988, "epoch": 1602} {"train_loss": -22.83017921447754, "global_step": 132989, "epoch": 1602} {"train_loss": -22.88423728942871, "global_step": 132990, "epoch": 1602} {"train_loss": -22.872861862182617, "global_step": 132991, "epoch": 1602} {"train_loss": -22.775583267211914, "global_step": 132992, "epoch": 1602} {"train_loss": -22.897581100463867, "global_step": 132993, "epoch": 1602} {"train_loss": -22.78558921813965, "global_step": 132994, "epoch": 1602} {"train_loss": -22.339553833007812, "global_step": 132995, "epoch": 1602} {"train_loss": -22.710031509399414, "global_step": 132996, "epoch": 1602} {"train_loss": -23.148269653320312, "global_step": 132997, "epoch": 1602} {"train_loss": -22.954378128051758, "global_step": 132998, "epoch": 1602} {"train_loss": -22.09514045715332, "global_step": 132999, "epoch": 1602} {"train_loss": -22.538190841674805, "global_step": 133000, "epoch": 1602} {"train_loss": -22.966169357299805, "global_step": 133001, "epoch": 1602} {"train_loss": -22.4045352935791, "global_step": 133002, "epoch": 1602} {"train_loss": -22.380155563354492, "global_step": 133003, "epoch": 1602} {"train_loss": -22.909353256225586, "global_step": 133004, "epoch": 1602} {"train_loss": -22.629138946533203, "global_step": 133005, "epoch": 1602} {"train_loss": -22.454198837280273, "global_step": 133006, "epoch": 1602} {"train_loss": -22.878829956054688, "global_step": 133007, "epoch": 1602} {"train_loss": -22.674707412719727, "global_step": 133008, "epoch": 1602} {"train_loss": -23.39249038696289, "global_step": 133009, "epoch": 1602} {"train_loss": -22.917142868041992, "global_step": 133010, "epoch": 1602} {"train_loss": -23.1319522857666, "global_step": 133011, "epoch": 1602} {"train_loss": -22.51746940612793, "global_step": 133012, "epoch": 1602} {"train_loss": -22.849563598632812, "global_step": 133013, "epoch": 1602} {"train_loss": -23.066478729248047, "global_step": 133014, "epoch": 1602} {"train_loss": -22.877689361572266, "global_step": 133015, "epoch": 1602} {"train_loss": -22.841650009155273, "global_step": 133016, "epoch": 1602} {"train_loss": -22.461898803710938, "global_step": 133017, "epoch": 1602} {"train_loss": -22.46477699279785, "global_step": 133018, "epoch": 1602} {"train_loss": -22.865602493286133, "global_step": 133019, "epoch": 1602} {"train_loss": -23.059101104736328, "global_step": 133020, "epoch": 1602} {"train_loss": -23.138078689575195, "global_step": 133021, "epoch": 1602} {"train_loss": -23.216022491455078, "global_step": 133022, "epoch": 1602} {"train_loss": -23.074535369873047, "global_step": 133023, "epoch": 1602} {"train_loss": -23.118480682373047, "global_step": 133024, "epoch": 1602} {"train_loss": -22.895709991455078, "global_step": 133025, "epoch": 1602} {"train_loss": -22.910398483276367, "global_step": 133026, "epoch": 1602} {"train_loss": -22.736572265625, "global_step": 133027, "epoch": 1602} {"train_loss": -22.947973251342773, "global_step": 133028, "epoch": 1602} {"train_loss": -22.82535743713379, "global_step": 133029, "epoch": 1602} {"train_loss": -23.090110778808594, "global_step": 133030, "epoch": 1602} {"train_loss": -22.61713981628418, "global_step": 133031, "epoch": 1602} {"train_loss": -23.016555786132812, "global_step": 133032, "epoch": 1602} {"train_loss": -22.787860870361328, "global_step": 133033, "epoch": 1602} {"train_loss": -22.99574089050293, "global_step": 133034, "epoch": 1602} {"train_loss": -22.62141227722168, "global_step": 133035, "epoch": 1602} {"train_loss": -22.955936431884766, "global_step": 133036, "epoch": 1602} {"train_loss": -23.193586349487305, "global_step": 133037, "epoch": 1602} {"train_loss": -22.808134078979492, "global_step": 133038, "epoch": 1602} {"train_loss": -23.078405380249023, "global_step": 133039, "epoch": 1602} {"train_loss": -22.9488525390625, "global_step": 133040, "epoch": 1602} {"train_loss": -22.883861541748047, "global_step": 133041, "epoch": 1602} {"train_loss": -23.193267822265625, "global_step": 133042, "epoch": 1602} {"train_loss": -23.118366241455078, "global_step": 133043, "epoch": 1602} {"train_loss": -22.934799194335938, "global_step": 133044, "epoch": 1602} {"train_loss": -23.17817497253418, "global_step": 133045, "epoch": 1602} {"train_loss": -22.885740280151367, "global_step": 133046, "epoch": 1602} {"train_loss": -22.87735366821289, "global_step": 133047, "epoch": 1602} {"train_loss": -22.795201956507672, "global_step": 133048, "epoch": 1602, "val_loss": 6330142.0} {"train_loss": -22.069395065307617, "global_step": 133049, "epoch": 1603} {"train_loss": -22.95829200744629, "global_step": 133050, "epoch": 1603} {"train_loss": -22.308141708374023, "global_step": 133051, "epoch": 1603} {"train_loss": -22.9261417388916, "global_step": 133052, "epoch": 1603} {"train_loss": -22.815919876098633, "global_step": 133053, "epoch": 1603} {"train_loss": -22.442922592163086, "global_step": 133054, "epoch": 1603} {"train_loss": -22.74031639099121, "global_step": 133055, "epoch": 1603} {"train_loss": -22.349668502807617, "global_step": 133056, "epoch": 1603} {"train_loss": -22.687652587890625, "global_step": 133057, "epoch": 1603} {"train_loss": -22.741357803344727, "global_step": 133058, "epoch": 1603} {"train_loss": -22.765127182006836, "global_step": 133059, "epoch": 1603} {"train_loss": -22.58082389831543, "global_step": 133060, "epoch": 1603} {"train_loss": -22.707529067993164, "global_step": 133061, "epoch": 1603} {"train_loss": -23.123884201049805, "global_step": 133062, "epoch": 1603} {"train_loss": -23.000219345092773, "global_step": 133063, "epoch": 1603} {"train_loss": -22.69342041015625, "global_step": 133064, "epoch": 1603} {"train_loss": -22.699909210205078, "global_step": 133065, "epoch": 1603} {"train_loss": -22.476659774780273, "global_step": 133066, "epoch": 1603} {"train_loss": -22.606189727783203, "global_step": 133067, "epoch": 1603} {"train_loss": -22.671682357788086, "global_step": 133068, "epoch": 1603} {"train_loss": -22.753732681274414, "global_step": 133069, "epoch": 1603} {"train_loss": -22.648557662963867, "global_step": 133070, "epoch": 1603} {"train_loss": -22.8337345123291, "global_step": 133071, "epoch": 1603} {"train_loss": -23.022085189819336, "global_step": 133072, "epoch": 1603} {"train_loss": -22.827728271484375, "global_step": 133073, "epoch": 1603} {"train_loss": -22.6781063079834, "global_step": 133074, "epoch": 1603} {"train_loss": -22.720138549804688, "global_step": 133075, "epoch": 1603} {"train_loss": -23.003681182861328, "global_step": 133076, "epoch": 1603} {"train_loss": -23.350589752197266, "global_step": 133077, "epoch": 1603} {"train_loss": -23.0839786529541, "global_step": 133078, "epoch": 1603} {"train_loss": -22.60577964782715, "global_step": 133079, "epoch": 1603} {"train_loss": -22.51277732849121, "global_step": 133080, "epoch": 1603} {"train_loss": -22.849546432495117, "global_step": 133081, "epoch": 1603} {"train_loss": -22.665067672729492, "global_step": 133082, "epoch": 1603} {"train_loss": -22.948883056640625, "global_step": 133083, "epoch": 1603} {"train_loss": -22.548974990844727, "global_step": 133084, "epoch": 1603} {"train_loss": -22.878700256347656, "global_step": 133085, "epoch": 1603} {"train_loss": -22.2109317779541, "global_step": 133086, "epoch": 1603} {"train_loss": -23.115087509155273, "global_step": 133087, "epoch": 1603} {"train_loss": -22.947162628173828, "global_step": 133088, "epoch": 1603} {"train_loss": -22.818525314331055, "global_step": 133089, "epoch": 1603} {"train_loss": -22.67511558532715, "global_step": 133090, "epoch": 1603} {"train_loss": -23.29264259338379, "global_step": 133091, "epoch": 1603} {"train_loss": -23.196603775024414, "global_step": 133092, "epoch": 1603} {"train_loss": -23.196271896362305, "global_step": 133093, "epoch": 1603} {"train_loss": -23.23927879333496, "global_step": 133094, "epoch": 1603} {"train_loss": -23.119897842407227, "global_step": 133095, "epoch": 1603} {"train_loss": -22.714563369750977, "global_step": 133096, "epoch": 1603} {"train_loss": -23.145700454711914, "global_step": 133097, "epoch": 1603} {"train_loss": -23.0369930267334, "global_step": 133098, "epoch": 1603} {"train_loss": -23.12647819519043, "global_step": 133099, "epoch": 1603} {"train_loss": -22.710683822631836, "global_step": 133100, "epoch": 1603} {"train_loss": -22.68121337890625, "global_step": 133101, "epoch": 1603} {"train_loss": -22.95435905456543, "global_step": 133102, "epoch": 1603} {"train_loss": -22.75068473815918, "global_step": 133103, "epoch": 1603} {"train_loss": -22.718172073364258, "global_step": 133104, "epoch": 1603} {"train_loss": -22.76435661315918, "global_step": 133105, "epoch": 1603} {"train_loss": -23.069000244140625, "global_step": 133106, "epoch": 1603} {"train_loss": -23.039369583129883, "global_step": 133107, "epoch": 1603} {"train_loss": -23.04535675048828, "global_step": 133108, "epoch": 1603} {"train_loss": -22.932737350463867, "global_step": 133109, "epoch": 1603} {"train_loss": -23.15109634399414, "global_step": 133110, "epoch": 1603} {"train_loss": -22.67658042907715, "global_step": 133111, "epoch": 1603} {"train_loss": -22.931333541870117, "global_step": 133112, "epoch": 1603} {"train_loss": -22.731542587280273, "global_step": 133113, "epoch": 1603} {"train_loss": -22.624526977539062, "global_step": 133114, "epoch": 1603} {"train_loss": -23.055173873901367, "global_step": 133115, "epoch": 1603} {"train_loss": -22.791189193725586, "global_step": 133116, "epoch": 1603} {"train_loss": -23.475088119506836, "global_step": 133117, "epoch": 1603} {"train_loss": -22.65574073791504, "global_step": 133118, "epoch": 1603} {"train_loss": -22.91451644897461, "global_step": 133119, "epoch": 1603} {"train_loss": -22.875200271606445, "global_step": 133120, "epoch": 1603} {"train_loss": -23.240554809570312, "global_step": 133121, "epoch": 1603} {"train_loss": -23.061071395874023, "global_step": 133122, "epoch": 1603} {"train_loss": -23.226831436157227, "global_step": 133123, "epoch": 1603} {"train_loss": -23.15433692932129, "global_step": 133124, "epoch": 1603} {"train_loss": -23.01540184020996, "global_step": 133125, "epoch": 1603} {"train_loss": -22.520193099975586, "global_step": 133126, "epoch": 1603} {"train_loss": -22.907672882080078, "global_step": 133127, "epoch": 1603} {"train_loss": -22.770172119140625, "global_step": 133128, "epoch": 1603} {"train_loss": -22.929630279541016, "global_step": 133129, "epoch": 1603} {"train_loss": -22.47725486755371, "global_step": 133130, "epoch": 1603} {"train_loss": -22.84817959888872, "global_step": 133131, "epoch": 1603, "val_loss": 6293631.0} {"train_loss": -22.92496681213379, "global_step": 133132, "epoch": 1604} {"train_loss": -22.742238998413086, "global_step": 133133, "epoch": 1604} {"train_loss": -22.607481002807617, "global_step": 133134, "epoch": 1604} {"train_loss": -22.605249404907227, "global_step": 133135, "epoch": 1604} {"train_loss": -22.50786781311035, "global_step": 133136, "epoch": 1604} {"train_loss": -22.989425659179688, "global_step": 133137, "epoch": 1604} {"train_loss": -22.557437896728516, "global_step": 133138, "epoch": 1604} {"train_loss": -22.801055908203125, "global_step": 133139, "epoch": 1604} {"train_loss": -22.54216957092285, "global_step": 133140, "epoch": 1604} {"train_loss": -22.781869888305664, "global_step": 133141, "epoch": 1604} {"train_loss": -22.23235511779785, "global_step": 133142, "epoch": 1604} {"train_loss": -22.770681381225586, "global_step": 133143, "epoch": 1604} {"train_loss": -22.756269454956055, "global_step": 133144, "epoch": 1604} {"train_loss": -22.113969802856445, "global_step": 133145, "epoch": 1604} {"train_loss": -22.7790584564209, "global_step": 133146, "epoch": 1604} {"train_loss": -22.594972610473633, "global_step": 133147, "epoch": 1604} {"train_loss": -22.454782485961914, "global_step": 133148, "epoch": 1604} {"train_loss": -22.85019302368164, "global_step": 133149, "epoch": 1604} {"train_loss": -22.51221466064453, "global_step": 133150, "epoch": 1604} {"train_loss": -22.663999557495117, "global_step": 133151, "epoch": 1604} {"train_loss": -22.67031478881836, "global_step": 133152, "epoch": 1604} {"train_loss": -22.612958908081055, "global_step": 133153, "epoch": 1604} {"train_loss": -22.893251419067383, "global_step": 133154, "epoch": 1604} {"train_loss": -22.492616653442383, "global_step": 133155, "epoch": 1604} {"train_loss": -22.970218658447266, "global_step": 133156, "epoch": 1604} {"train_loss": -23.032470703125, "global_step": 133157, "epoch": 1604} {"train_loss": -22.88899803161621, "global_step": 133158, "epoch": 1604} {"train_loss": -22.96824073791504, "global_step": 133159, "epoch": 1604} {"train_loss": -22.58247184753418, "global_step": 133160, "epoch": 1604} {"train_loss": -22.74909782409668, "global_step": 133161, "epoch": 1604} {"train_loss": -23.08262062072754, "global_step": 133162, "epoch": 1604} {"train_loss": -23.146726608276367, "global_step": 133163, "epoch": 1604} {"train_loss": -22.99955177307129, "global_step": 133164, "epoch": 1604} {"train_loss": -23.07513999938965, "global_step": 133165, "epoch": 1604} {"train_loss": -22.95962905883789, "global_step": 133166, "epoch": 1604} {"train_loss": -23.113862991333008, "global_step": 133167, "epoch": 1604} {"train_loss": -22.731159210205078, "global_step": 133168, "epoch": 1604} {"train_loss": -22.81258773803711, "global_step": 133169, "epoch": 1604} {"train_loss": -23.31549072265625, "global_step": 133170, "epoch": 1604} {"train_loss": -22.99031639099121, "global_step": 133171, "epoch": 1604} {"train_loss": -22.926010131835938, "global_step": 133172, "epoch": 1604} {"train_loss": -22.62251853942871, "global_step": 133173, "epoch": 1604} {"train_loss": -22.779516220092773, "global_step": 133174, "epoch": 1604} {"train_loss": -22.84975242614746, "global_step": 133175, "epoch": 1604} {"train_loss": -22.829822540283203, "global_step": 133176, "epoch": 1604} {"train_loss": -22.740076065063477, "global_step": 133177, "epoch": 1604} {"train_loss": -22.988996505737305, "global_step": 133178, "epoch": 1604} {"train_loss": -22.931608200073242, "global_step": 133179, "epoch": 1604} {"train_loss": -23.0737247467041, "global_step": 133180, "epoch": 1604} {"train_loss": -22.63397216796875, "global_step": 133181, "epoch": 1604} {"train_loss": -22.900121688842773, "global_step": 133182, "epoch": 1604} {"train_loss": -23.222021102905273, "global_step": 133183, "epoch": 1604} {"train_loss": -22.64515495300293, "global_step": 133184, "epoch": 1604} {"train_loss": -23.025373458862305, "global_step": 133185, "epoch": 1604} {"train_loss": -22.706472396850586, "global_step": 133186, "epoch": 1604} {"train_loss": -22.930191040039062, "global_step": 133187, "epoch": 1604} {"train_loss": -22.68863868713379, "global_step": 133188, "epoch": 1604} {"train_loss": -23.097614288330078, "global_step": 133189, "epoch": 1604} {"train_loss": -22.68391227722168, "global_step": 133190, "epoch": 1604} {"train_loss": -22.998119354248047, "global_step": 133191, "epoch": 1604} {"train_loss": -22.7563533782959, "global_step": 133192, "epoch": 1604} {"train_loss": -22.459306716918945, "global_step": 133193, "epoch": 1604} {"train_loss": -23.108308792114258, "global_step": 133194, "epoch": 1604} {"train_loss": -22.51876449584961, "global_step": 133195, "epoch": 1604} {"train_loss": -22.352651596069336, "global_step": 133196, "epoch": 1604} {"train_loss": -22.66526985168457, "global_step": 133197, "epoch": 1604} {"train_loss": -22.55966567993164, "global_step": 133198, "epoch": 1604} {"train_loss": -23.082639694213867, "global_step": 133199, "epoch": 1604} {"train_loss": -22.572484970092773, "global_step": 133200, "epoch": 1604} {"train_loss": -22.290998458862305, "global_step": 133201, "epoch": 1604} {"train_loss": -22.865198135375977, "global_step": 133202, "epoch": 1604} {"train_loss": -22.524930953979492, "global_step": 133203, "epoch": 1604} {"train_loss": -22.7244815826416, "global_step": 133204, "epoch": 1604} {"train_loss": -22.66565704345703, "global_step": 133205, "epoch": 1604} {"train_loss": -22.546802520751953, "global_step": 133206, "epoch": 1604} {"train_loss": -22.68559455871582, "global_step": 133207, "epoch": 1604} {"train_loss": -22.87758445739746, "global_step": 133208, "epoch": 1604} {"train_loss": -22.80651092529297, "global_step": 133209, "epoch": 1604} {"train_loss": -23.022842407226562, "global_step": 133210, "epoch": 1604} {"train_loss": -22.36830711364746, "global_step": 133211, "epoch": 1604} {"train_loss": -22.743276596069336, "global_step": 133212, "epoch": 1604} {"train_loss": -22.60396385192871, "global_step": 133213, "epoch": 1604} {"train_loss": -22.782268822911274, "global_step": 133214, "epoch": 1604, "val_loss": 6285876.0} {"train_loss": -23.123859405517578, "global_step": 133215, "epoch": 1605} {"train_loss": -22.478778839111328, "global_step": 133216, "epoch": 1605} {"train_loss": -22.861417770385742, "global_step": 133217, "epoch": 1605} {"train_loss": -22.599899291992188, "global_step": 133218, "epoch": 1605} {"train_loss": -22.620656967163086, "global_step": 133219, "epoch": 1605} {"train_loss": -22.462295532226562, "global_step": 133220, "epoch": 1605} {"train_loss": -22.718626022338867, "global_step": 133221, "epoch": 1605} {"train_loss": -22.475234985351562, "global_step": 133222, "epoch": 1605} {"train_loss": -22.377180099487305, "global_step": 133223, "epoch": 1605} {"train_loss": -22.898164749145508, "global_step": 133224, "epoch": 1605} {"train_loss": -22.66425323486328, "global_step": 133225, "epoch": 1605} {"train_loss": -22.548486709594727, "global_step": 133226, "epoch": 1605} {"train_loss": -23.2329044342041, "global_step": 133227, "epoch": 1605} {"train_loss": -23.03804588317871, "global_step": 133228, "epoch": 1605} {"train_loss": -22.565937042236328, "global_step": 133229, "epoch": 1605} {"train_loss": -22.93024253845215, "global_step": 133230, "epoch": 1605} {"train_loss": -22.913843154907227, "global_step": 133231, "epoch": 1605} {"train_loss": -23.054990768432617, "global_step": 133232, "epoch": 1605} {"train_loss": -22.971542358398438, "global_step": 133233, "epoch": 1605} {"train_loss": -22.74623680114746, "global_step": 133234, "epoch": 1605} {"train_loss": -23.0743465423584, "global_step": 133235, "epoch": 1605} {"train_loss": -22.711517333984375, "global_step": 133236, "epoch": 1605} {"train_loss": -22.691160202026367, "global_step": 133237, "epoch": 1605} {"train_loss": -22.77254295349121, "global_step": 133238, "epoch": 1605} {"train_loss": -22.916595458984375, "global_step": 133239, "epoch": 1605} {"train_loss": -22.919408798217773, "global_step": 133240, "epoch": 1605} {"train_loss": -23.0213565826416, "global_step": 133241, "epoch": 1605} {"train_loss": -23.053298950195312, "global_step": 133242, "epoch": 1605} {"train_loss": -22.850502014160156, "global_step": 133243, "epoch": 1605} {"train_loss": -22.591026306152344, "global_step": 133244, "epoch": 1605} {"train_loss": -23.00467872619629, "global_step": 133245, "epoch": 1605} {"train_loss": -23.11933135986328, "global_step": 133246, "epoch": 1605} {"train_loss": -22.664714813232422, "global_step": 133247, "epoch": 1605} {"train_loss": -22.919469833374023, "global_step": 133248, "epoch": 1605} {"train_loss": -23.050596237182617, "global_step": 133249, "epoch": 1605} {"train_loss": -22.474538803100586, "global_step": 133250, "epoch": 1605} {"train_loss": -23.10933494567871, "global_step": 133251, "epoch": 1605} {"train_loss": -22.84627342224121, "global_step": 133252, "epoch": 1605} {"train_loss": -22.90101432800293, "global_step": 133253, "epoch": 1605} {"train_loss": -22.97365379333496, "global_step": 133254, "epoch": 1605} {"train_loss": -22.523244857788086, "global_step": 133255, "epoch": 1605} {"train_loss": -22.348114013671875, "global_step": 133256, "epoch": 1605} {"train_loss": -23.30177116394043, "global_step": 133257, "epoch": 1605} {"train_loss": -22.8680419921875, "global_step": 133258, "epoch": 1605} {"train_loss": -22.657907485961914, "global_step": 133259, "epoch": 1605} {"train_loss": -22.868011474609375, "global_step": 133260, "epoch": 1605} {"train_loss": -22.70816993713379, "global_step": 133261, "epoch": 1605} {"train_loss": -22.724123001098633, "global_step": 133262, "epoch": 1605} {"train_loss": -22.57107925415039, "global_step": 133263, "epoch": 1605} {"train_loss": -22.936338424682617, "global_step": 133264, "epoch": 1605} {"train_loss": -22.93890953063965, "global_step": 133265, "epoch": 1605} {"train_loss": -22.667749404907227, "global_step": 133266, "epoch": 1605} {"train_loss": -22.602970123291016, "global_step": 133267, "epoch": 1605} {"train_loss": -22.71967887878418, "global_step": 133268, "epoch": 1605} {"train_loss": -22.89350700378418, "global_step": 133269, "epoch": 1605} {"train_loss": -22.349308013916016, "global_step": 133270, "epoch": 1605} {"train_loss": -22.651987075805664, "global_step": 133271, "epoch": 1605} {"train_loss": -22.811979293823242, "global_step": 133272, "epoch": 1605} {"train_loss": -22.81576919555664, "global_step": 133273, "epoch": 1605} {"train_loss": -23.072351455688477, "global_step": 133274, "epoch": 1605} {"train_loss": -22.647117614746094, "global_step": 133275, "epoch": 1605} {"train_loss": -22.84193992614746, "global_step": 133276, "epoch": 1605} {"train_loss": -22.99419403076172, "global_step": 133277, "epoch": 1605} {"train_loss": -23.07497215270996, "global_step": 133278, "epoch": 1605} {"train_loss": -22.590641021728516, "global_step": 133279, "epoch": 1605} {"train_loss": -22.83028221130371, "global_step": 133280, "epoch": 1605} {"train_loss": -23.295211791992188, "global_step": 133281, "epoch": 1605} {"train_loss": -23.289413452148438, "global_step": 133282, "epoch": 1605} {"train_loss": -22.92087173461914, "global_step": 133283, "epoch": 1605} {"train_loss": -22.568004608154297, "global_step": 133284, "epoch": 1605} {"train_loss": -23.143131256103516, "global_step": 133285, "epoch": 1605} {"train_loss": -22.96164894104004, "global_step": 133286, "epoch": 1605} {"train_loss": -23.08538818359375, "global_step": 133287, "epoch": 1605} {"train_loss": -22.683494567871094, "global_step": 133288, "epoch": 1605} {"train_loss": -22.888166427612305, "global_step": 133289, "epoch": 1605} {"train_loss": -23.45522117614746, "global_step": 133290, "epoch": 1605} {"train_loss": -23.241010665893555, "global_step": 133291, "epoch": 1605} {"train_loss": -23.02435302734375, "global_step": 133292, "epoch": 1605} {"train_loss": -23.066747665405273, "global_step": 133293, "epoch": 1605} {"train_loss": -22.951181411743164, "global_step": 133294, "epoch": 1605} {"train_loss": -23.137807846069336, "global_step": 133295, "epoch": 1605} {"train_loss": -23.334705352783203, "global_step": 133296, "epoch": 1605} {"train_loss": -22.84725067414433, "global_step": 133297, "epoch": 1605, "val_loss": 6339931.0} {"train_loss": -22.061120986938477, "global_step": 133298, "epoch": 1606} {"train_loss": -22.148710250854492, "global_step": 133299, "epoch": 1606} {"train_loss": -23.07110023498535, "global_step": 133300, "epoch": 1606} {"train_loss": -22.01693344116211, "global_step": 133301, "epoch": 1606} {"train_loss": -22.000680923461914, "global_step": 133302, "epoch": 1606} {"train_loss": -22.581378936767578, "global_step": 133303, "epoch": 1606} {"train_loss": -22.577411651611328, "global_step": 133304, "epoch": 1606} {"train_loss": -22.394062042236328, "global_step": 133305, "epoch": 1606} {"train_loss": -22.752111434936523, "global_step": 133306, "epoch": 1606} {"train_loss": -22.605932235717773, "global_step": 133307, "epoch": 1606} {"train_loss": -22.2578182220459, "global_step": 133308, "epoch": 1606} {"train_loss": -22.281360626220703, "global_step": 133309, "epoch": 1606} {"train_loss": -22.62781524658203, "global_step": 133310, "epoch": 1606} {"train_loss": -22.631622314453125, "global_step": 133311, "epoch": 1606} {"train_loss": -22.567846298217773, "global_step": 133312, "epoch": 1606} {"train_loss": -22.47968864440918, "global_step": 133313, "epoch": 1606} {"train_loss": -22.720966339111328, "global_step": 133314, "epoch": 1606} {"train_loss": -22.44111442565918, "global_step": 133315, "epoch": 1606} {"train_loss": -22.130313873291016, "global_step": 133316, "epoch": 1606} {"train_loss": -22.90481948852539, "global_step": 133317, "epoch": 1606} {"train_loss": -22.955732345581055, "global_step": 133318, "epoch": 1606} {"train_loss": -22.689762115478516, "global_step": 133319, "epoch": 1606} {"train_loss": -22.437414169311523, "global_step": 133320, "epoch": 1606} {"train_loss": -22.519948959350586, "global_step": 133321, "epoch": 1606} {"train_loss": -22.860931396484375, "global_step": 133322, "epoch": 1606} {"train_loss": -22.989973068237305, "global_step": 133323, "epoch": 1606} {"train_loss": -22.821182250976562, "global_step": 133324, "epoch": 1606} {"train_loss": -22.748865127563477, "global_step": 133325, "epoch": 1606} {"train_loss": -22.869827270507812, "global_step": 133326, "epoch": 1606} {"train_loss": -23.33858299255371, "global_step": 133327, "epoch": 1606} {"train_loss": -22.42887306213379, "global_step": 133328, "epoch": 1606} {"train_loss": -23.257410049438477, "global_step": 133329, "epoch": 1606} {"train_loss": -22.71218490600586, "global_step": 133330, "epoch": 1606} {"train_loss": -23.154850006103516, "global_step": 133331, "epoch": 1606} {"train_loss": -22.558862686157227, "global_step": 133332, "epoch": 1606} {"train_loss": -23.049367904663086, "global_step": 133333, "epoch": 1606} {"train_loss": -22.95951271057129, "global_step": 133334, "epoch": 1606} {"train_loss": -22.888105392456055, "global_step": 133335, "epoch": 1606} {"train_loss": -22.884689331054688, "global_step": 133336, "epoch": 1606} {"train_loss": -23.218496322631836, "global_step": 133337, "epoch": 1606} {"train_loss": -22.648019790649414, "global_step": 133338, "epoch": 1606} {"train_loss": -23.03757667541504, "global_step": 133339, "epoch": 1606} {"train_loss": -22.75602149963379, "global_step": 133340, "epoch": 1606} {"train_loss": -22.80511474609375, "global_step": 133341, "epoch": 1606} {"train_loss": -22.93143081665039, "global_step": 133342, "epoch": 1606} {"train_loss": -22.928024291992188, "global_step": 133343, "epoch": 1606} {"train_loss": -22.963953018188477, "global_step": 133344, "epoch": 1606} {"train_loss": -22.62498664855957, "global_step": 133345, "epoch": 1606} {"train_loss": -22.960966110229492, "global_step": 133346, "epoch": 1606} {"train_loss": -22.785324096679688, "global_step": 133347, "epoch": 1606} {"train_loss": -23.12745475769043, "global_step": 133348, "epoch": 1606} {"train_loss": -23.19789695739746, "global_step": 133349, "epoch": 1606} {"train_loss": -22.668970108032227, "global_step": 133350, "epoch": 1606} {"train_loss": -22.68867301940918, "global_step": 133351, "epoch": 1606} {"train_loss": -23.14424705505371, "global_step": 133352, "epoch": 1606} {"train_loss": -23.243017196655273, "global_step": 133353, "epoch": 1606} {"train_loss": -22.61416244506836, "global_step": 133354, "epoch": 1606} {"train_loss": -22.911367416381836, "global_step": 133355, "epoch": 1606} {"train_loss": -22.729658126831055, "global_step": 133356, "epoch": 1606} {"train_loss": -23.028961181640625, "global_step": 133357, "epoch": 1606} {"train_loss": -22.944931030273438, "global_step": 133358, "epoch": 1606} {"train_loss": -22.933595657348633, "global_step": 133359, "epoch": 1606} {"train_loss": -23.10503578186035, "global_step": 133360, "epoch": 1606} {"train_loss": -22.994125366210938, "global_step": 133361, "epoch": 1606} {"train_loss": -22.847131729125977, "global_step": 133362, "epoch": 1606} {"train_loss": -23.028898239135742, "global_step": 133363, "epoch": 1606} {"train_loss": -23.107498168945312, "global_step": 133364, "epoch": 1606} {"train_loss": -22.731760025024414, "global_step": 133365, "epoch": 1606} {"train_loss": -22.9173526763916, "global_step": 133366, "epoch": 1606} {"train_loss": -22.916990280151367, "global_step": 133367, "epoch": 1606} {"train_loss": -22.73404312133789, "global_step": 133368, "epoch": 1606} {"train_loss": -22.84739112854004, "global_step": 133369, "epoch": 1606} {"train_loss": -22.51276969909668, "global_step": 133370, "epoch": 1606} {"train_loss": -22.826396942138672, "global_step": 133371, "epoch": 1606} {"train_loss": -22.77976417541504, "global_step": 133372, "epoch": 1606} {"train_loss": -22.736186981201172, "global_step": 133373, "epoch": 1606} {"train_loss": -22.877090454101562, "global_step": 133374, "epoch": 1606} {"train_loss": -22.614286422729492, "global_step": 133375, "epoch": 1606} {"train_loss": -22.427677154541016, "global_step": 133376, "epoch": 1606} {"train_loss": -23.253084182739258, "global_step": 133377, "epoch": 1606} {"train_loss": -22.971776962280273, "global_step": 133378, "epoch": 1606} {"train_loss": -22.844284057617188, "global_step": 133379, "epoch": 1606} {"train_loss": -22.7784452553255, "global_step": 133380, "epoch": 1606, "val_loss": 6278656.5} {"train_loss": -22.72041130065918, "global_step": 133381, "epoch": 1607} {"train_loss": -22.606657028198242, "global_step": 133382, "epoch": 1607} {"train_loss": -22.709945678710938, "global_step": 133383, "epoch": 1607} {"train_loss": -22.199460983276367, "global_step": 133384, "epoch": 1607} {"train_loss": -22.704343795776367, "global_step": 133385, "epoch": 1607} {"train_loss": -22.72933006286621, "global_step": 133386, "epoch": 1607} {"train_loss": -22.651578903198242, "global_step": 133387, "epoch": 1607} {"train_loss": -22.72737693786621, "global_step": 133388, "epoch": 1607} {"train_loss": -22.577959060668945, "global_step": 133389, "epoch": 1607} {"train_loss": -22.918766021728516, "global_step": 133390, "epoch": 1607} {"train_loss": -23.176664352416992, "global_step": 133391, "epoch": 1607} {"train_loss": -22.975629806518555, "global_step": 133392, "epoch": 1607} {"train_loss": -22.97505760192871, "global_step": 133393, "epoch": 1607} {"train_loss": -22.5301456451416, "global_step": 133394, "epoch": 1607} {"train_loss": -23.100820541381836, "global_step": 133395, "epoch": 1607} {"train_loss": -22.593358993530273, "global_step": 133396, "epoch": 1607} {"train_loss": -22.685867309570312, "global_step": 133397, "epoch": 1607} {"train_loss": -22.520353317260742, "global_step": 133398, "epoch": 1607} {"train_loss": -22.7115535736084, "global_step": 133399, "epoch": 1607} {"train_loss": -23.130159378051758, "global_step": 133400, "epoch": 1607} {"train_loss": -22.786361694335938, "global_step": 133401, "epoch": 1607} {"train_loss": -22.741104125976562, "global_step": 133402, "epoch": 1607} {"train_loss": -23.089019775390625, "global_step": 133403, "epoch": 1607} {"train_loss": -22.65923500061035, "global_step": 133404, "epoch": 1607} {"train_loss": -22.686594009399414, "global_step": 133405, "epoch": 1607} {"train_loss": -22.91143035888672, "global_step": 133406, "epoch": 1607} {"train_loss": -22.780216217041016, "global_step": 133407, "epoch": 1607} {"train_loss": -22.72423553466797, "global_step": 133408, "epoch": 1607} {"train_loss": -22.96651268005371, "global_step": 133409, "epoch": 1607} {"train_loss": -22.864049911499023, "global_step": 133410, "epoch": 1607} {"train_loss": -22.92390251159668, "global_step": 133411, "epoch": 1607} {"train_loss": -22.287031173706055, "global_step": 133412, "epoch": 1607} {"train_loss": -22.715940475463867, "global_step": 133413, "epoch": 1607} {"train_loss": -22.908641815185547, "global_step": 133414, "epoch": 1607} {"train_loss": -22.596025466918945, "global_step": 133415, "epoch": 1607} {"train_loss": -22.828041076660156, "global_step": 133416, "epoch": 1607} {"train_loss": -23.213071823120117, "global_step": 133417, "epoch": 1607} {"train_loss": -22.92593765258789, "global_step": 133418, "epoch": 1607} {"train_loss": -22.848676681518555, "global_step": 133419, "epoch": 1607} {"train_loss": -22.79670524597168, "global_step": 133420, "epoch": 1607} {"train_loss": -22.716833114624023, "global_step": 133421, "epoch": 1607} {"train_loss": -22.79633903503418, "global_step": 133422, "epoch": 1607} {"train_loss": -22.636890411376953, "global_step": 133423, "epoch": 1607} {"train_loss": -22.094877243041992, "global_step": 133424, "epoch": 1607} {"train_loss": -22.699981689453125, "global_step": 133425, "epoch": 1607} {"train_loss": -22.57780647277832, "global_step": 133426, "epoch": 1607} {"train_loss": -22.892210006713867, "global_step": 133427, "epoch": 1607} {"train_loss": -23.05101203918457, "global_step": 133428, "epoch": 1607} {"train_loss": -22.755176544189453, "global_step": 133429, "epoch": 1607} {"train_loss": -23.28559684753418, "global_step": 133430, "epoch": 1607} {"train_loss": -22.693994522094727, "global_step": 133431, "epoch": 1607} {"train_loss": -23.0218448638916, "global_step": 133432, "epoch": 1607} {"train_loss": -22.752225875854492, "global_step": 133433, "epoch": 1607} {"train_loss": -23.120393753051758, "global_step": 133434, "epoch": 1607} {"train_loss": -23.07119369506836, "global_step": 133435, "epoch": 1607} {"train_loss": -22.783742904663086, "global_step": 133436, "epoch": 1607} {"train_loss": -22.7542724609375, "global_step": 133437, "epoch": 1607} {"train_loss": -22.703001022338867, "global_step": 133438, "epoch": 1607} {"train_loss": -22.840557098388672, "global_step": 133439, "epoch": 1607} {"train_loss": -23.610822677612305, "global_step": 133440, "epoch": 1607} {"train_loss": -22.684789657592773, "global_step": 133441, "epoch": 1607} {"train_loss": -22.97273063659668, "global_step": 133442, "epoch": 1607} {"train_loss": -22.435047149658203, "global_step": 133443, "epoch": 1607} {"train_loss": -22.753576278686523, "global_step": 133444, "epoch": 1607} {"train_loss": -22.724506378173828, "global_step": 133445, "epoch": 1607} {"train_loss": -22.814146041870117, "global_step": 133446, "epoch": 1607} {"train_loss": -22.872432708740234, "global_step": 133447, "epoch": 1607} {"train_loss": -22.73700523376465, "global_step": 133448, "epoch": 1607} {"train_loss": -22.94685173034668, "global_step": 133449, "epoch": 1607} {"train_loss": -23.17135238647461, "global_step": 133450, "epoch": 1607} {"train_loss": -22.987186431884766, "global_step": 133451, "epoch": 1607} {"train_loss": -22.830760955810547, "global_step": 133452, "epoch": 1607} {"train_loss": -22.92770767211914, "global_step": 133453, "epoch": 1607} {"train_loss": -22.577226638793945, "global_step": 133454, "epoch": 1607} {"train_loss": -22.852811813354492, "global_step": 133455, "epoch": 1607} {"train_loss": -22.72389030456543, "global_step": 133456, "epoch": 1607} {"train_loss": -23.116086959838867, "global_step": 133457, "epoch": 1607} {"train_loss": -23.164487838745117, "global_step": 133458, "epoch": 1607} {"train_loss": -23.41543960571289, "global_step": 133459, "epoch": 1607} {"train_loss": -23.220129013061523, "global_step": 133460, "epoch": 1607} {"train_loss": -23.299314498901367, "global_step": 133461, "epoch": 1607} {"train_loss": -22.995080947875977, "global_step": 133462, "epoch": 1607} {"train_loss": -22.809671195156604, "global_step": 133463, "epoch": 1607, "val_loss": 6216155.0} {"train_loss": -21.84512710571289, "global_step": 133464, "epoch": 1608} {"train_loss": -21.75872230529785, "global_step": 133465, "epoch": 1608} {"train_loss": -22.401805877685547, "global_step": 133466, "epoch": 1608} {"train_loss": -22.19072914123535, "global_step": 133467, "epoch": 1608} {"train_loss": -21.518627166748047, "global_step": 133468, "epoch": 1608} {"train_loss": -22.09854507446289, "global_step": 133469, "epoch": 1608} {"train_loss": -21.699277877807617, "global_step": 133470, "epoch": 1608} {"train_loss": -22.57164192199707, "global_step": 133471, "epoch": 1608} {"train_loss": -22.143264770507812, "global_step": 133472, "epoch": 1608} {"train_loss": -22.428457260131836, "global_step": 133473, "epoch": 1608} {"train_loss": -22.32415199279785, "global_step": 133474, "epoch": 1608} {"train_loss": -22.501596450805664, "global_step": 133475, "epoch": 1608} {"train_loss": -22.495223999023438, "global_step": 133476, "epoch": 1608} {"train_loss": -22.574039459228516, "global_step": 133477, "epoch": 1608} {"train_loss": -22.30992889404297, "global_step": 133478, "epoch": 1608} {"train_loss": -22.42683982849121, "global_step": 133479, "epoch": 1608} {"train_loss": -22.849620819091797, "global_step": 133480, "epoch": 1608} {"train_loss": -22.918785095214844, "global_step": 133481, "epoch": 1608} {"train_loss": -22.2203426361084, "global_step": 133482, "epoch": 1608} {"train_loss": -22.492353439331055, "global_step": 133483, "epoch": 1608} {"train_loss": -22.666671752929688, "global_step": 133484, "epoch": 1608} {"train_loss": -22.37681007385254, "global_step": 133485, "epoch": 1608} {"train_loss": -22.714950561523438, "global_step": 133486, "epoch": 1608} {"train_loss": -22.79665184020996, "global_step": 133487, "epoch": 1608} {"train_loss": -22.517078399658203, "global_step": 133488, "epoch": 1608} {"train_loss": -22.61693572998047, "global_step": 133489, "epoch": 1608} {"train_loss": -22.77349281311035, "global_step": 133490, "epoch": 1608} {"train_loss": -22.570524215698242, "global_step": 133491, "epoch": 1608} {"train_loss": -22.60837745666504, "global_step": 133492, "epoch": 1608} {"train_loss": -22.604007720947266, "global_step": 133493, "epoch": 1608} {"train_loss": -22.897546768188477, "global_step": 133494, "epoch": 1608} {"train_loss": -22.7996826171875, "global_step": 133495, "epoch": 1608} {"train_loss": -22.812976837158203, "global_step": 133496, "epoch": 1608} {"train_loss": -22.76809310913086, "global_step": 133497, "epoch": 1608} {"train_loss": -22.848901748657227, "global_step": 133498, "epoch": 1608} {"train_loss": -22.994417190551758, "global_step": 133499, "epoch": 1608} {"train_loss": -22.9593505859375, "global_step": 133500, "epoch": 1608} {"train_loss": -22.78294563293457, "global_step": 133501, "epoch": 1608} {"train_loss": -23.389822006225586, "global_step": 133502, "epoch": 1608} {"train_loss": -23.02635955810547, "global_step": 133503, "epoch": 1608} {"train_loss": -22.905672073364258, "global_step": 133504, "epoch": 1608} {"train_loss": -22.968706130981445, "global_step": 133505, "epoch": 1608} {"train_loss": -23.079065322875977, "global_step": 133506, "epoch": 1608} {"train_loss": -23.209369659423828, "global_step": 133507, "epoch": 1608} {"train_loss": -22.818103790283203, "global_step": 133508, "epoch": 1608} {"train_loss": -23.31744956970215, "global_step": 133509, "epoch": 1608} {"train_loss": -22.879148483276367, "global_step": 133510, "epoch": 1608} {"train_loss": -22.798330307006836, "global_step": 133511, "epoch": 1608} {"train_loss": -23.00885009765625, "global_step": 133512, "epoch": 1608} {"train_loss": -23.3604793548584, "global_step": 133513, "epoch": 1608} {"train_loss": -23.10688591003418, "global_step": 133514, "epoch": 1608} {"train_loss": -23.351987838745117, "global_step": 133515, "epoch": 1608} {"train_loss": -22.978805541992188, "global_step": 133516, "epoch": 1608} {"train_loss": -23.203624725341797, "global_step": 133517, "epoch": 1608} {"train_loss": -23.15974235534668, "global_step": 133518, "epoch": 1608} {"train_loss": -22.949674606323242, "global_step": 133519, "epoch": 1608} {"train_loss": -23.124263763427734, "global_step": 133520, "epoch": 1608} {"train_loss": -23.078960418701172, "global_step": 133521, "epoch": 1608} {"train_loss": -22.95241355895996, "global_step": 133522, "epoch": 1608} {"train_loss": -22.875045776367188, "global_step": 133523, "epoch": 1608} {"train_loss": -22.86701011657715, "global_step": 133524, "epoch": 1608} {"train_loss": -22.972143173217773, "global_step": 133525, "epoch": 1608} {"train_loss": -22.75119400024414, "global_step": 133526, "epoch": 1608} {"train_loss": -22.70058250427246, "global_step": 133527, "epoch": 1608} {"train_loss": -23.264781951904297, "global_step": 133528, "epoch": 1608} {"train_loss": -22.786365509033203, "global_step": 133529, "epoch": 1608} {"train_loss": -22.7546443939209, "global_step": 133530, "epoch": 1608} {"train_loss": -22.792287826538086, "global_step": 133531, "epoch": 1608} {"train_loss": -22.79910659790039, "global_step": 133532, "epoch": 1608} {"train_loss": -22.49416160583496, "global_step": 133533, "epoch": 1608} {"train_loss": -22.93022346496582, "global_step": 133534, "epoch": 1608} {"train_loss": -22.84130859375, "global_step": 133535, "epoch": 1608} {"train_loss": -22.768674850463867, "global_step": 133536, "epoch": 1608} {"train_loss": -22.75715446472168, "global_step": 133537, "epoch": 1608} {"train_loss": -22.720678329467773, "global_step": 133538, "epoch": 1608} {"train_loss": -23.306943893432617, "global_step": 133539, "epoch": 1608} {"train_loss": -22.6564998626709, "global_step": 133540, "epoch": 1608} {"train_loss": -22.984119415283203, "global_step": 133541, "epoch": 1608} {"train_loss": -23.3668270111084, "global_step": 133542, "epoch": 1608} {"train_loss": -22.981781005859375, "global_step": 133543, "epoch": 1608} {"train_loss": -22.790525436401367, "global_step": 133544, "epoch": 1608} {"train_loss": -22.89087677001953, "global_step": 133545, "epoch": 1608} {"train_loss": -22.74978355040033, "global_step": 133546, "epoch": 1608, "val_loss": 6272064.0} {"train_loss": -22.44013786315918, "global_step": 133547, "epoch": 1609} {"train_loss": -22.43988609313965, "global_step": 133548, "epoch": 1609} {"train_loss": -22.55731773376465, "global_step": 133549, "epoch": 1609} {"train_loss": -22.192676544189453, "global_step": 133550, "epoch": 1609} {"train_loss": -22.893722534179688, "global_step": 133551, "epoch": 1609} {"train_loss": -22.754013061523438, "global_step": 133552, "epoch": 1609} {"train_loss": -22.36054801940918, "global_step": 133553, "epoch": 1609} {"train_loss": -22.830339431762695, "global_step": 133554, "epoch": 1609} {"train_loss": -22.783830642700195, "global_step": 133555, "epoch": 1609} {"train_loss": -22.46249008178711, "global_step": 133556, "epoch": 1609} {"train_loss": -22.80291175842285, "global_step": 133557, "epoch": 1609} {"train_loss": -22.54170799255371, "global_step": 133558, "epoch": 1609} {"train_loss": -22.965612411499023, "global_step": 133559, "epoch": 1609} {"train_loss": -22.74454116821289, "global_step": 133560, "epoch": 1609} {"train_loss": -22.10158348083496, "global_step": 133561, "epoch": 1609} {"train_loss": -22.89498519897461, "global_step": 133562, "epoch": 1609} {"train_loss": -22.574613571166992, "global_step": 133563, "epoch": 1609} {"train_loss": -22.688146591186523, "global_step": 133564, "epoch": 1609} {"train_loss": -22.7305850982666, "global_step": 133565, "epoch": 1609} {"train_loss": -22.634748458862305, "global_step": 133566, "epoch": 1609} {"train_loss": -22.580778121948242, "global_step": 133567, "epoch": 1609} {"train_loss": -22.742589950561523, "global_step": 133568, "epoch": 1609} {"train_loss": -22.76705551147461, "global_step": 133569, "epoch": 1609} {"train_loss": -22.690536499023438, "global_step": 133570, "epoch": 1609} {"train_loss": -22.97113609313965, "global_step": 133571, "epoch": 1609} {"train_loss": -22.627038955688477, "global_step": 133572, "epoch": 1609} {"train_loss": -22.695951461791992, "global_step": 133573, "epoch": 1609} {"train_loss": -22.93418312072754, "global_step": 133574, "epoch": 1609} {"train_loss": -22.708805084228516, "global_step": 133575, "epoch": 1609} {"train_loss": -22.690656661987305, "global_step": 133576, "epoch": 1609} {"train_loss": -22.87669563293457, "global_step": 133577, "epoch": 1609} {"train_loss": -22.680654525756836, "global_step": 133578, "epoch": 1609} {"train_loss": -23.258590698242188, "global_step": 133579, "epoch": 1609} {"train_loss": -23.000995635986328, "global_step": 133580, "epoch": 1609} {"train_loss": -22.62847900390625, "global_step": 133581, "epoch": 1609} {"train_loss": -22.83917808532715, "global_step": 133582, "epoch": 1609} {"train_loss": -23.081045150756836, "global_step": 133583, "epoch": 1609} {"train_loss": -23.075986862182617, "global_step": 133584, "epoch": 1609} {"train_loss": -22.988910675048828, "global_step": 133585, "epoch": 1609} {"train_loss": -22.395950317382812, "global_step": 133586, "epoch": 1609} {"train_loss": -22.954683303833008, "global_step": 133587, "epoch": 1609} {"train_loss": -22.967426300048828, "global_step": 133588, "epoch": 1609} {"train_loss": -22.767122268676758, "global_step": 133589, "epoch": 1609} {"train_loss": -23.112585067749023, "global_step": 133590, "epoch": 1609} {"train_loss": -22.88387107849121, "global_step": 133591, "epoch": 1609} {"train_loss": -22.700469970703125, "global_step": 133592, "epoch": 1609} {"train_loss": -22.834247589111328, "global_step": 133593, "epoch": 1609} {"train_loss": -22.935476303100586, "global_step": 133594, "epoch": 1609} {"train_loss": -22.893564224243164, "global_step": 133595, "epoch": 1609} {"train_loss": -22.354721069335938, "global_step": 133596, "epoch": 1609} {"train_loss": -23.080257415771484, "global_step": 133597, "epoch": 1609} {"train_loss": -23.02420997619629, "global_step": 133598, "epoch": 1609} {"train_loss": -22.53110694885254, "global_step": 133599, "epoch": 1609} {"train_loss": -22.617918014526367, "global_step": 133600, "epoch": 1609} {"train_loss": -22.46919822692871, "global_step": 133601, "epoch": 1609} {"train_loss": -23.09488296508789, "global_step": 133602, "epoch": 1609} {"train_loss": -22.80030632019043, "global_step": 133603, "epoch": 1609} {"train_loss": -22.69081687927246, "global_step": 133604, "epoch": 1609} {"train_loss": -23.164670944213867, "global_step": 133605, "epoch": 1609} {"train_loss": -22.9409236907959, "global_step": 133606, "epoch": 1609} {"train_loss": -22.79591941833496, "global_step": 133607, "epoch": 1609} {"train_loss": -23.067760467529297, "global_step": 133608, "epoch": 1609} {"train_loss": -22.894739151000977, "global_step": 133609, "epoch": 1609} {"train_loss": -23.18158531188965, "global_step": 133610, "epoch": 1609} {"train_loss": -22.676942825317383, "global_step": 133611, "epoch": 1609} {"train_loss": -22.982913970947266, "global_step": 133612, "epoch": 1609} {"train_loss": -22.728458404541016, "global_step": 133613, "epoch": 1609} {"train_loss": -23.400617599487305, "global_step": 133614, "epoch": 1609} {"train_loss": -23.285737991333008, "global_step": 133615, "epoch": 1609} {"train_loss": -23.167926788330078, "global_step": 133616, "epoch": 1609} {"train_loss": -22.881099700927734, "global_step": 133617, "epoch": 1609} {"train_loss": -22.727127075195312, "global_step": 133618, "epoch": 1609} {"train_loss": -22.926143646240234, "global_step": 133619, "epoch": 1609} {"train_loss": -22.846662521362305, "global_step": 133620, "epoch": 1609} {"train_loss": -23.21491813659668, "global_step": 133621, "epoch": 1609} {"train_loss": -23.061307907104492, "global_step": 133622, "epoch": 1609} {"train_loss": -23.12747573852539, "global_step": 133623, "epoch": 1609} {"train_loss": -22.558889389038086, "global_step": 133624, "epoch": 1609} {"train_loss": -22.974632263183594, "global_step": 133625, "epoch": 1609} {"train_loss": -22.623258590698242, "global_step": 133626, "epoch": 1609} {"train_loss": -22.93779754638672, "global_step": 133627, "epoch": 1609} {"train_loss": -22.71961784362793, "global_step": 133628, "epoch": 1609} {"train_loss": -22.811948753265014, "global_step": 133629, "epoch": 1609, "val_loss": 6170157.0} {"train_loss": -22.466373443603516, "global_step": 133630, "epoch": 1610} {"train_loss": -22.556753158569336, "global_step": 133631, "epoch": 1610} {"train_loss": -22.585439682006836, "global_step": 133632, "epoch": 1610} {"train_loss": -22.977041244506836, "global_step": 133633, "epoch": 1610} {"train_loss": -22.710010528564453, "global_step": 133634, "epoch": 1610} {"train_loss": -22.63411521911621, "global_step": 133635, "epoch": 1610} {"train_loss": -22.51462745666504, "global_step": 133636, "epoch": 1610} {"train_loss": -22.96122932434082, "global_step": 133637, "epoch": 1610} {"train_loss": -23.084697723388672, "global_step": 133638, "epoch": 1610} {"train_loss": -22.583776473999023, "global_step": 133639, "epoch": 1610} {"train_loss": -22.3994197845459, "global_step": 133640, "epoch": 1610} {"train_loss": -22.803617477416992, "global_step": 133641, "epoch": 1610} {"train_loss": -22.883474349975586, "global_step": 133642, "epoch": 1610} {"train_loss": -22.844051361083984, "global_step": 133643, "epoch": 1610} {"train_loss": -22.58207130432129, "global_step": 133644, "epoch": 1610} {"train_loss": -23.053730010986328, "global_step": 133645, "epoch": 1610} {"train_loss": -22.625808715820312, "global_step": 133646, "epoch": 1610} {"train_loss": -22.437036514282227, "global_step": 133647, "epoch": 1610} {"train_loss": -22.660625457763672, "global_step": 133648, "epoch": 1610} {"train_loss": -23.04349136352539, "global_step": 133649, "epoch": 1610} {"train_loss": -23.136627197265625, "global_step": 133650, "epoch": 1610} {"train_loss": -22.64219856262207, "global_step": 133651, "epoch": 1610} {"train_loss": -23.32350730895996, "global_step": 133652, "epoch": 1610} {"train_loss": -23.011924743652344, "global_step": 133653, "epoch": 1610} {"train_loss": -22.98811149597168, "global_step": 133654, "epoch": 1610} {"train_loss": -22.80769157409668, "global_step": 133655, "epoch": 1610} {"train_loss": -23.091510772705078, "global_step": 133656, "epoch": 1610} {"train_loss": -22.70849609375, "global_step": 133657, "epoch": 1610} {"train_loss": -22.949792861938477, "global_step": 133658, "epoch": 1610} {"train_loss": -23.11380958557129, "global_step": 133659, "epoch": 1610} {"train_loss": -23.070003509521484, "global_step": 133660, "epoch": 1610} {"train_loss": -22.76189613342285, "global_step": 133661, "epoch": 1610} {"train_loss": -22.972339630126953, "global_step": 133662, "epoch": 1610} {"train_loss": -22.778987884521484, "global_step": 133663, "epoch": 1610} {"train_loss": -22.745309829711914, "global_step": 133664, "epoch": 1610} {"train_loss": -23.293354034423828, "global_step": 133665, "epoch": 1610} {"train_loss": -22.69908332824707, "global_step": 133666, "epoch": 1610} {"train_loss": -22.630552291870117, "global_step": 133667, "epoch": 1610} {"train_loss": -22.733097076416016, "global_step": 133668, "epoch": 1610} {"train_loss": -22.825714111328125, "global_step": 133669, "epoch": 1610} {"train_loss": -22.59085464477539, "global_step": 133670, "epoch": 1610} {"train_loss": -22.66357421875, "global_step": 133671, "epoch": 1610} {"train_loss": -23.17079734802246, "global_step": 133672, "epoch": 1610} {"train_loss": -22.633710861206055, "global_step": 133673, "epoch": 1610} {"train_loss": -22.44023323059082, "global_step": 133674, "epoch": 1610} {"train_loss": -22.899995803833008, "global_step": 133675, "epoch": 1610} {"train_loss": -22.914113998413086, "global_step": 133676, "epoch": 1610} {"train_loss": -22.57089614868164, "global_step": 133677, "epoch": 1610} {"train_loss": -22.716312408447266, "global_step": 133678, "epoch": 1610} {"train_loss": -22.55605125427246, "global_step": 133679, "epoch": 1610} {"train_loss": -22.67547607421875, "global_step": 133680, "epoch": 1610} {"train_loss": -22.751806259155273, "global_step": 133681, "epoch": 1610} {"train_loss": -22.38629913330078, "global_step": 133682, "epoch": 1610} {"train_loss": -22.220294952392578, "global_step": 133683, "epoch": 1610} {"train_loss": -22.823644638061523, "global_step": 133684, "epoch": 1610} {"train_loss": -22.791385650634766, "global_step": 133685, "epoch": 1610} {"train_loss": -22.81291961669922, "global_step": 133686, "epoch": 1610} {"train_loss": -22.67097282409668, "global_step": 133687, "epoch": 1610} {"train_loss": -22.99409294128418, "global_step": 133688, "epoch": 1610} {"train_loss": -22.95639991760254, "global_step": 133689, "epoch": 1610} {"train_loss": -22.69944190979004, "global_step": 133690, "epoch": 1610} {"train_loss": -22.88662338256836, "global_step": 133691, "epoch": 1610} {"train_loss": -23.007495880126953, "global_step": 133692, "epoch": 1610} {"train_loss": -22.90070343017578, "global_step": 133693, "epoch": 1610} {"train_loss": -22.787067413330078, "global_step": 133694, "epoch": 1610} {"train_loss": -22.926076889038086, "global_step": 133695, "epoch": 1610} {"train_loss": -22.79203987121582, "global_step": 133696, "epoch": 1610} {"train_loss": -22.808568954467773, "global_step": 133697, "epoch": 1610} {"train_loss": -22.617250442504883, "global_step": 133698, "epoch": 1610} {"train_loss": -22.70425796508789, "global_step": 133699, "epoch": 1610} {"train_loss": -22.660913467407227, "global_step": 133700, "epoch": 1610} {"train_loss": -22.379383087158203, "global_step": 133701, "epoch": 1610} {"train_loss": -23.042444229125977, "global_step": 133702, "epoch": 1610} {"train_loss": -22.49643898010254, "global_step": 133703, "epoch": 1610} {"train_loss": -22.869504928588867, "global_step": 133704, "epoch": 1610} {"train_loss": -22.94430160522461, "global_step": 133705, "epoch": 1610} {"train_loss": -22.875686645507812, "global_step": 133706, "epoch": 1610} {"train_loss": -22.622737884521484, "global_step": 133707, "epoch": 1610} {"train_loss": -23.17119598388672, "global_step": 133708, "epoch": 1610} {"train_loss": -22.725324630737305, "global_step": 133709, "epoch": 1610} {"train_loss": -22.700286865234375, "global_step": 133710, "epoch": 1610} {"train_loss": -22.71027946472168, "global_step": 133711, "epoch": 1610} {"train_loss": -22.78310231128371, "global_step": 133712, "epoch": 1610, "val_loss": 6421665.0} {"train_loss": -22.4409236907959, "global_step": 133713, "epoch": 1611} {"train_loss": -22.394193649291992, "global_step": 133714, "epoch": 1611} {"train_loss": -22.301841735839844, "global_step": 133715, "epoch": 1611} {"train_loss": -22.580387115478516, "global_step": 133716, "epoch": 1611} {"train_loss": -22.2945613861084, "global_step": 133717, "epoch": 1611} {"train_loss": -22.75882339477539, "global_step": 133718, "epoch": 1611} {"train_loss": -22.42778968811035, "global_step": 133719, "epoch": 1611} {"train_loss": -22.882057189941406, "global_step": 133720, "epoch": 1611} {"train_loss": -22.63111686706543, "global_step": 133721, "epoch": 1611} {"train_loss": -22.499731063842773, "global_step": 133722, "epoch": 1611} {"train_loss": -22.796480178833008, "global_step": 133723, "epoch": 1611} {"train_loss": -22.195554733276367, "global_step": 133724, "epoch": 1611} {"train_loss": -22.201908111572266, "global_step": 133725, "epoch": 1611} {"train_loss": -22.849018096923828, "global_step": 133726, "epoch": 1611} {"train_loss": -22.553142547607422, "global_step": 133727, "epoch": 1611} {"train_loss": -22.87355613708496, "global_step": 133728, "epoch": 1611} {"train_loss": -22.56873321533203, "global_step": 133729, "epoch": 1611} {"train_loss": -22.248401641845703, "global_step": 133730, "epoch": 1611} {"train_loss": -22.500614166259766, "global_step": 133731, "epoch": 1611} {"train_loss": -22.587873458862305, "global_step": 133732, "epoch": 1611} {"train_loss": -22.73566246032715, "global_step": 133733, "epoch": 1611} {"train_loss": -22.739612579345703, "global_step": 133734, "epoch": 1611} {"train_loss": -23.1832218170166, "global_step": 133735, "epoch": 1611} {"train_loss": -23.090808868408203, "global_step": 133736, "epoch": 1611} {"train_loss": -22.946683883666992, "global_step": 133737, "epoch": 1611} {"train_loss": -22.736713409423828, "global_step": 133738, "epoch": 1611} {"train_loss": -23.11902618408203, "global_step": 133739, "epoch": 1611} {"train_loss": -22.72395133972168, "global_step": 133740, "epoch": 1611} {"train_loss": -23.093551635742188, "global_step": 133741, "epoch": 1611} {"train_loss": -22.75310516357422, "global_step": 133742, "epoch": 1611} {"train_loss": -22.76276206970215, "global_step": 133743, "epoch": 1611} {"train_loss": -22.875410079956055, "global_step": 133744, "epoch": 1611} {"train_loss": -23.13409996032715, "global_step": 133745, "epoch": 1611} {"train_loss": -23.267122268676758, "global_step": 133746, "epoch": 1611} {"train_loss": -23.07436180114746, "global_step": 133747, "epoch": 1611} {"train_loss": -23.103717803955078, "global_step": 133748, "epoch": 1611} {"train_loss": -23.01740074157715, "global_step": 133749, "epoch": 1611} {"train_loss": -22.894664764404297, "global_step": 133750, "epoch": 1611} {"train_loss": -23.138919830322266, "global_step": 133751, "epoch": 1611} {"train_loss": -22.597021102905273, "global_step": 133752, "epoch": 1611} {"train_loss": -22.907636642456055, "global_step": 133753, "epoch": 1611} {"train_loss": -23.195755004882812, "global_step": 133754, "epoch": 1611} {"train_loss": -22.8642520904541, "global_step": 133755, "epoch": 1611} {"train_loss": -23.01930046081543, "global_step": 133756, "epoch": 1611} {"train_loss": -22.862838745117188, "global_step": 133757, "epoch": 1611} {"train_loss": -22.999670028686523, "global_step": 133758, "epoch": 1611} {"train_loss": -23.168798446655273, "global_step": 133759, "epoch": 1611} {"train_loss": -23.009401321411133, "global_step": 133760, "epoch": 1611} {"train_loss": -22.90848159790039, "global_step": 133761, "epoch": 1611} {"train_loss": -22.81648826599121, "global_step": 133762, "epoch": 1611} {"train_loss": -23.125411987304688, "global_step": 133763, "epoch": 1611} {"train_loss": -23.1005802154541, "global_step": 133764, "epoch": 1611} {"train_loss": -22.909032821655273, "global_step": 133765, "epoch": 1611} {"train_loss": -23.090993881225586, "global_step": 133766, "epoch": 1611} {"train_loss": -23.06307029724121, "global_step": 133767, "epoch": 1611} {"train_loss": -22.918521881103516, "global_step": 133768, "epoch": 1611} {"train_loss": -22.955215454101562, "global_step": 133769, "epoch": 1611} {"train_loss": -22.809673309326172, "global_step": 133770, "epoch": 1611} {"train_loss": -22.8265438079834, "global_step": 133771, "epoch": 1611} {"train_loss": -23.10120964050293, "global_step": 133772, "epoch": 1611} {"train_loss": -22.84857749938965, "global_step": 133773, "epoch": 1611} {"train_loss": -22.78938865661621, "global_step": 133774, "epoch": 1611} {"train_loss": -22.82526206970215, "global_step": 133775, "epoch": 1611} {"train_loss": -22.376829147338867, "global_step": 133776, "epoch": 1611} {"train_loss": -22.967254638671875, "global_step": 133777, "epoch": 1611} {"train_loss": -23.16554832458496, "global_step": 133778, "epoch": 1611} {"train_loss": -23.062551498413086, "global_step": 133779, "epoch": 1611} {"train_loss": -22.5399112701416, "global_step": 133780, "epoch": 1611} {"train_loss": -22.59357261657715, "global_step": 133781, "epoch": 1611} {"train_loss": -22.86153221130371, "global_step": 133782, "epoch": 1611} {"train_loss": -22.959745407104492, "global_step": 133783, "epoch": 1611} {"train_loss": -23.283828735351562, "global_step": 133784, "epoch": 1611} {"train_loss": -22.900728225708008, "global_step": 133785, "epoch": 1611} {"train_loss": -22.75852394104004, "global_step": 133786, "epoch": 1611} {"train_loss": -22.8060359954834, "global_step": 133787, "epoch": 1611} {"train_loss": -23.189743041992188, "global_step": 133788, "epoch": 1611} {"train_loss": -23.172222137451172, "global_step": 133789, "epoch": 1611} {"train_loss": -23.003244400024414, "global_step": 133790, "epoch": 1611} {"train_loss": -22.930009841918945, "global_step": 133791, "epoch": 1611} {"train_loss": -23.02351188659668, "global_step": 133792, "epoch": 1611} {"train_loss": -22.88558006286621, "global_step": 133793, "epoch": 1611} {"train_loss": -22.903705596923828, "global_step": 133794, "epoch": 1611} {"train_loss": -22.87425360622176, "global_step": 133795, "epoch": 1611, "val_loss": 6182644.0} {"train_loss": -22.565269470214844, "global_step": 133796, "epoch": 1612} {"train_loss": -22.7919864654541, "global_step": 133797, "epoch": 1612} {"train_loss": -22.589323043823242, "global_step": 133798, "epoch": 1612} {"train_loss": -22.682666778564453, "global_step": 133799, "epoch": 1612} {"train_loss": -22.377376556396484, "global_step": 133800, "epoch": 1612} {"train_loss": -22.56924819946289, "global_step": 133801, "epoch": 1612} {"train_loss": -22.226055145263672, "global_step": 133802, "epoch": 1612} {"train_loss": -22.653799057006836, "global_step": 133803, "epoch": 1612} {"train_loss": -23.02647590637207, "global_step": 133804, "epoch": 1612} {"train_loss": -22.60724449157715, "global_step": 133805, "epoch": 1612} {"train_loss": -22.970741271972656, "global_step": 133806, "epoch": 1612} {"train_loss": -22.578662872314453, "global_step": 133807, "epoch": 1612} {"train_loss": -22.71559715270996, "global_step": 133808, "epoch": 1612} {"train_loss": -22.978057861328125, "global_step": 133809, "epoch": 1612} {"train_loss": -22.931577682495117, "global_step": 133810, "epoch": 1612} {"train_loss": -22.778202056884766, "global_step": 133811, "epoch": 1612} {"train_loss": -22.786527633666992, "global_step": 133812, "epoch": 1612} {"train_loss": -22.932588577270508, "global_step": 133813, "epoch": 1612} {"train_loss": -22.587491989135742, "global_step": 133814, "epoch": 1612} {"train_loss": -23.063159942626953, "global_step": 133815, "epoch": 1612} {"train_loss": -22.905384063720703, "global_step": 133816, "epoch": 1612} {"train_loss": -23.156152725219727, "global_step": 133817, "epoch": 1612} {"train_loss": -22.948591232299805, "global_step": 133818, "epoch": 1612} {"train_loss": -23.020410537719727, "global_step": 133819, "epoch": 1612} {"train_loss": -22.981367111206055, "global_step": 133820, "epoch": 1612} {"train_loss": -22.965269088745117, "global_step": 133821, "epoch": 1612} {"train_loss": -23.147022247314453, "global_step": 133822, "epoch": 1612} {"train_loss": -23.325159072875977, "global_step": 133823, "epoch": 1612} {"train_loss": -22.80467987060547, "global_step": 133824, "epoch": 1612} {"train_loss": -23.041467666625977, "global_step": 133825, "epoch": 1612} {"train_loss": -23.00153923034668, "global_step": 133826, "epoch": 1612} {"train_loss": -23.16651725769043, "global_step": 133827, "epoch": 1612} {"train_loss": -22.563573837280273, "global_step": 133828, "epoch": 1612} {"train_loss": -22.81540870666504, "global_step": 133829, "epoch": 1612} {"train_loss": -23.206464767456055, "global_step": 133830, "epoch": 1612} {"train_loss": -22.7562313079834, "global_step": 133831, "epoch": 1612} {"train_loss": -23.010000228881836, "global_step": 133832, "epoch": 1612} {"train_loss": -22.81070899963379, "global_step": 133833, "epoch": 1612} {"train_loss": -22.828550338745117, "global_step": 133834, "epoch": 1612} {"train_loss": -23.038551330566406, "global_step": 133835, "epoch": 1612} {"train_loss": -23.004758834838867, "global_step": 133836, "epoch": 1612} {"train_loss": -23.25564193725586, "global_step": 133837, "epoch": 1612} {"train_loss": -22.7310848236084, "global_step": 133838, "epoch": 1612} {"train_loss": -23.122547149658203, "global_step": 133839, "epoch": 1612} {"train_loss": -22.63968276977539, "global_step": 133840, "epoch": 1612} {"train_loss": -22.794462203979492, "global_step": 133841, "epoch": 1612} {"train_loss": -22.851606369018555, "global_step": 133842, "epoch": 1612} {"train_loss": -22.733457565307617, "global_step": 133843, "epoch": 1612} {"train_loss": -22.954788208007812, "global_step": 133844, "epoch": 1612} {"train_loss": -22.828723907470703, "global_step": 133845, "epoch": 1612} {"train_loss": -22.598052978515625, "global_step": 133846, "epoch": 1612} {"train_loss": -22.762928009033203, "global_step": 133847, "epoch": 1612} {"train_loss": -23.0511531829834, "global_step": 133848, "epoch": 1612} {"train_loss": -23.36728858947754, "global_step": 133849, "epoch": 1612} {"train_loss": -22.734495162963867, "global_step": 133850, "epoch": 1612} {"train_loss": -22.944976806640625, "global_step": 133851, "epoch": 1612} {"train_loss": -23.287343978881836, "global_step": 133852, "epoch": 1612} {"train_loss": -23.096586227416992, "global_step": 133853, "epoch": 1612} {"train_loss": -23.008413314819336, "global_step": 133854, "epoch": 1612} {"train_loss": -22.985774993896484, "global_step": 133855, "epoch": 1612} {"train_loss": -23.128143310546875, "global_step": 133856, "epoch": 1612} {"train_loss": -22.686161041259766, "global_step": 133857, "epoch": 1612} {"train_loss": -22.99320411682129, "global_step": 133858, "epoch": 1612} {"train_loss": -23.414453506469727, "global_step": 133859, "epoch": 1612} {"train_loss": -22.929582595825195, "global_step": 133860, "epoch": 1612} {"train_loss": -23.0206241607666, "global_step": 133861, "epoch": 1612} {"train_loss": -22.73720359802246, "global_step": 133862, "epoch": 1612} {"train_loss": -22.709802627563477, "global_step": 133863, "epoch": 1612} {"train_loss": -23.216596603393555, "global_step": 133864, "epoch": 1612} {"train_loss": -22.79677391052246, "global_step": 133865, "epoch": 1612} {"train_loss": -22.958938598632812, "global_step": 133866, "epoch": 1612} {"train_loss": -22.815277099609375, "global_step": 133867, "epoch": 1612} {"train_loss": -22.683429718017578, "global_step": 133868, "epoch": 1612} {"train_loss": -22.62685203552246, "global_step": 133869, "epoch": 1612} {"train_loss": -22.73526954650879, "global_step": 133870, "epoch": 1612} {"train_loss": -22.65165901184082, "global_step": 133871, "epoch": 1612} {"train_loss": -23.327465057373047, "global_step": 133872, "epoch": 1612} {"train_loss": -22.69207000732422, "global_step": 133873, "epoch": 1612} {"train_loss": -22.827388763427734, "global_step": 133874, "epoch": 1612} {"train_loss": -22.698095321655273, "global_step": 133875, "epoch": 1612} {"train_loss": -23.06996726989746, "global_step": 133876, "epoch": 1612} {"train_loss": -22.47135353088379, "global_step": 133877, "epoch": 1612} {"train_loss": -22.868287488638636, "global_step": 133878, "epoch": 1612, "val_loss": 6242370.0} {"train_loss": -22.64947509765625, "global_step": 133879, "epoch": 1613} {"train_loss": -22.3435001373291, "global_step": 133880, "epoch": 1613} {"train_loss": -22.503768920898438, "global_step": 133881, "epoch": 1613} {"train_loss": -22.68158531188965, "global_step": 133882, "epoch": 1613} {"train_loss": -22.76276969909668, "global_step": 133883, "epoch": 1613} {"train_loss": -22.473920822143555, "global_step": 133884, "epoch": 1613} {"train_loss": -22.923810958862305, "global_step": 133885, "epoch": 1613} {"train_loss": -22.67854881286621, "global_step": 133886, "epoch": 1613} {"train_loss": -23.115489959716797, "global_step": 133887, "epoch": 1613} {"train_loss": -22.637479782104492, "global_step": 133888, "epoch": 1613} {"train_loss": -22.559646606445312, "global_step": 133889, "epoch": 1613} {"train_loss": -22.853160858154297, "global_step": 133890, "epoch": 1613} {"train_loss": -22.70836639404297, "global_step": 133891, "epoch": 1613} {"train_loss": -22.801288604736328, "global_step": 133892, "epoch": 1613} {"train_loss": -23.03382682800293, "global_step": 133893, "epoch": 1613} {"train_loss": -22.681079864501953, "global_step": 133894, "epoch": 1613} {"train_loss": -22.8922119140625, "global_step": 133895, "epoch": 1613} {"train_loss": -22.97552490234375, "global_step": 133896, "epoch": 1613} {"train_loss": -22.832181930541992, "global_step": 133897, "epoch": 1613} {"train_loss": -22.618154525756836, "global_step": 133898, "epoch": 1613} {"train_loss": -23.087785720825195, "global_step": 133899, "epoch": 1613} {"train_loss": -23.083158493041992, "global_step": 133900, "epoch": 1613} {"train_loss": -22.866046905517578, "global_step": 133901, "epoch": 1613} {"train_loss": -22.294893264770508, "global_step": 133902, "epoch": 1613} {"train_loss": -22.937183380126953, "global_step": 133903, "epoch": 1613} {"train_loss": -22.929182052612305, "global_step": 133904, "epoch": 1613} {"train_loss": -23.07718276977539, "global_step": 133905, "epoch": 1613} {"train_loss": -22.79927635192871, "global_step": 133906, "epoch": 1613} {"train_loss": -22.938947677612305, "global_step": 133907, "epoch": 1613} {"train_loss": -23.103307723999023, "global_step": 133908, "epoch": 1613} {"train_loss": -23.400964736938477, "global_step": 133909, "epoch": 1613} {"train_loss": -23.715551376342773, "global_step": 133910, "epoch": 1613} {"train_loss": -22.787805557250977, "global_step": 133911, "epoch": 1613} {"train_loss": -23.269559860229492, "global_step": 133912, "epoch": 1613} {"train_loss": -23.12495231628418, "global_step": 133913, "epoch": 1613} {"train_loss": -22.873794555664062, "global_step": 133914, "epoch": 1613} {"train_loss": -22.846410751342773, "global_step": 133915, "epoch": 1613} {"train_loss": -23.257596969604492, "global_step": 133916, "epoch": 1613} {"train_loss": -22.720600128173828, "global_step": 133917, "epoch": 1613} {"train_loss": -23.10017967224121, "global_step": 133918, "epoch": 1613} {"train_loss": -22.880970001220703, "global_step": 133919, "epoch": 1613} {"train_loss": -22.763490676879883, "global_step": 133920, "epoch": 1613} {"train_loss": -22.691783905029297, "global_step": 133921, "epoch": 1613} {"train_loss": -23.065500259399414, "global_step": 133922, "epoch": 1613} {"train_loss": -22.518795013427734, "global_step": 133923, "epoch": 1613} {"train_loss": -22.808048248291016, "global_step": 133924, "epoch": 1613} {"train_loss": -22.79875373840332, "global_step": 133925, "epoch": 1613} {"train_loss": -23.23333168029785, "global_step": 133926, "epoch": 1613} {"train_loss": -22.71195411682129, "global_step": 133927, "epoch": 1613} {"train_loss": -23.07275390625, "global_step": 133928, "epoch": 1613} {"train_loss": -22.915456771850586, "global_step": 133929, "epoch": 1613} {"train_loss": -22.830646514892578, "global_step": 133930, "epoch": 1613} {"train_loss": -22.8037166595459, "global_step": 133931, "epoch": 1613} {"train_loss": -22.763233184814453, "global_step": 133932, "epoch": 1613} {"train_loss": -22.981365203857422, "global_step": 133933, "epoch": 1613} {"train_loss": -23.11617088317871, "global_step": 133934, "epoch": 1613} {"train_loss": -22.941518783569336, "global_step": 133935, "epoch": 1613} {"train_loss": -23.161849975585938, "global_step": 133936, "epoch": 1613} {"train_loss": -22.472980499267578, "global_step": 133937, "epoch": 1613} {"train_loss": -23.02608299255371, "global_step": 133938, "epoch": 1613} {"train_loss": -22.760465621948242, "global_step": 133939, "epoch": 1613} {"train_loss": -22.942251205444336, "global_step": 133940, "epoch": 1613} {"train_loss": -22.684158325195312, "global_step": 133941, "epoch": 1613} {"train_loss": -22.946537017822266, "global_step": 133942, "epoch": 1613} {"train_loss": -22.576047897338867, "global_step": 133943, "epoch": 1613} {"train_loss": -23.039377212524414, "global_step": 133944, "epoch": 1613} {"train_loss": -22.733823776245117, "global_step": 133945, "epoch": 1613} {"train_loss": -22.77640724182129, "global_step": 133946, "epoch": 1613} {"train_loss": -22.950300216674805, "global_step": 133947, "epoch": 1613} {"train_loss": -22.737218856811523, "global_step": 133948, "epoch": 1613} {"train_loss": -22.555814743041992, "global_step": 133949, "epoch": 1613} {"train_loss": -22.518075942993164, "global_step": 133950, "epoch": 1613} {"train_loss": -22.959646224975586, "global_step": 133951, "epoch": 1613} {"train_loss": -23.258989334106445, "global_step": 133952, "epoch": 1613} {"train_loss": -22.775815963745117, "global_step": 133953, "epoch": 1613} {"train_loss": -22.862058639526367, "global_step": 133954, "epoch": 1613} {"train_loss": -22.871417999267578, "global_step": 133955, "epoch": 1613} {"train_loss": -22.83509635925293, "global_step": 133956, "epoch": 1613} {"train_loss": -23.1361141204834, "global_step": 133957, "epoch": 1613} {"train_loss": -23.27686882019043, "global_step": 133958, "epoch": 1613} {"train_loss": -22.26161003112793, "global_step": 133959, "epoch": 1613} {"train_loss": -23.04184341430664, "global_step": 133960, "epoch": 1613} {"train_loss": -22.867654156972126, "global_step": 133961, "epoch": 1613, "val_loss": 6274789.5} {"train_loss": -22.551877975463867, "global_step": 133962, "epoch": 1614} {"train_loss": -22.423160552978516, "global_step": 133963, "epoch": 1614} {"train_loss": -22.53437614440918, "global_step": 133964, "epoch": 1614} {"train_loss": -22.532529830932617, "global_step": 133965, "epoch": 1614} {"train_loss": -22.606266021728516, "global_step": 133966, "epoch": 1614} {"train_loss": -22.727697372436523, "global_step": 133967, "epoch": 1614} {"train_loss": -22.81845474243164, "global_step": 133968, "epoch": 1614} {"train_loss": -22.803998947143555, "global_step": 133969, "epoch": 1614} {"train_loss": -22.520187377929688, "global_step": 133970, "epoch": 1614} {"train_loss": -23.028173446655273, "global_step": 133971, "epoch": 1614} {"train_loss": -22.75150489807129, "global_step": 133972, "epoch": 1614} {"train_loss": -22.863754272460938, "global_step": 133973, "epoch": 1614} {"train_loss": -22.5306453704834, "global_step": 133974, "epoch": 1614} {"train_loss": -22.98244285583496, "global_step": 133975, "epoch": 1614} {"train_loss": -22.736148834228516, "global_step": 133976, "epoch": 1614} {"train_loss": -23.014474868774414, "global_step": 133977, "epoch": 1614} {"train_loss": -23.078474044799805, "global_step": 133978, "epoch": 1614} {"train_loss": -22.714488983154297, "global_step": 133979, "epoch": 1614} {"train_loss": -22.707782745361328, "global_step": 133980, "epoch": 1614} {"train_loss": -22.884511947631836, "global_step": 133981, "epoch": 1614} {"train_loss": -22.50840187072754, "global_step": 133982, "epoch": 1614} {"train_loss": -22.62801170349121, "global_step": 133983, "epoch": 1614} {"train_loss": -22.666881561279297, "global_step": 133984, "epoch": 1614} {"train_loss": -22.494306564331055, "global_step": 133985, "epoch": 1614} {"train_loss": -23.15118408203125, "global_step": 133986, "epoch": 1614} {"train_loss": -22.93069839477539, "global_step": 133987, "epoch": 1614} {"train_loss": -22.63123321533203, "global_step": 133988, "epoch": 1614} {"train_loss": -22.705896377563477, "global_step": 133989, "epoch": 1614} {"train_loss": -22.65613555908203, "global_step": 133990, "epoch": 1614} {"train_loss": -22.93426513671875, "global_step": 133991, "epoch": 1614} {"train_loss": -22.785709381103516, "global_step": 133992, "epoch": 1614} {"train_loss": -22.92595100402832, "global_step": 133993, "epoch": 1614} {"train_loss": -22.576047897338867, "global_step": 133994, "epoch": 1614} {"train_loss": -22.86360740661621, "global_step": 133995, "epoch": 1614} {"train_loss": -23.103322982788086, "global_step": 133996, "epoch": 1614} {"train_loss": -23.180875778198242, "global_step": 133997, "epoch": 1614} {"train_loss": -22.99117088317871, "global_step": 133998, "epoch": 1614} {"train_loss": -22.690692901611328, "global_step": 133999, "epoch": 1614} {"train_loss": -23.2308349609375, "global_step": 134000, "epoch": 1614} {"train_loss": -23.044811248779297, "global_step": 134001, "epoch": 1614} {"train_loss": -22.597135543823242, "global_step": 134002, "epoch": 1614} {"train_loss": -22.771596908569336, "global_step": 134003, "epoch": 1614} {"train_loss": -22.242679595947266, "global_step": 134004, "epoch": 1614} {"train_loss": -22.647253036499023, "global_step": 134005, "epoch": 1614} {"train_loss": -22.801576614379883, "global_step": 134006, "epoch": 1614} {"train_loss": -22.704877853393555, "global_step": 134007, "epoch": 1614} {"train_loss": -23.012222290039062, "global_step": 134008, "epoch": 1614} {"train_loss": -23.139007568359375, "global_step": 134009, "epoch": 1614} {"train_loss": -23.1055965423584, "global_step": 134010, "epoch": 1614} {"train_loss": -22.688383102416992, "global_step": 134011, "epoch": 1614} {"train_loss": -23.138351440429688, "global_step": 134012, "epoch": 1614} {"train_loss": -22.793933868408203, "global_step": 134013, "epoch": 1614} {"train_loss": -22.634418487548828, "global_step": 134014, "epoch": 1614} {"train_loss": -23.223609924316406, "global_step": 134015, "epoch": 1614} {"train_loss": -22.8184814453125, "global_step": 134016, "epoch": 1614} {"train_loss": -23.036666870117188, "global_step": 134017, "epoch": 1614} {"train_loss": -22.887907028198242, "global_step": 134018, "epoch": 1614} {"train_loss": -23.03080940246582, "global_step": 134019, "epoch": 1614} {"train_loss": -23.136659622192383, "global_step": 134020, "epoch": 1614} {"train_loss": -22.85138511657715, "global_step": 134021, "epoch": 1614} {"train_loss": -23.161802291870117, "global_step": 134022, "epoch": 1614} {"train_loss": -22.899606704711914, "global_step": 134023, "epoch": 1614} {"train_loss": -22.990036010742188, "global_step": 134024, "epoch": 1614} {"train_loss": -22.868589401245117, "global_step": 134025, "epoch": 1614} {"train_loss": -22.854530334472656, "global_step": 134026, "epoch": 1614} {"train_loss": -22.8245849609375, "global_step": 134027, "epoch": 1614} {"train_loss": -22.66290283203125, "global_step": 134028, "epoch": 1614} {"train_loss": -23.078472137451172, "global_step": 134029, "epoch": 1614} {"train_loss": -23.075332641601562, "global_step": 134030, "epoch": 1614} {"train_loss": -23.057859420776367, "global_step": 134031, "epoch": 1614} {"train_loss": -22.880722045898438, "global_step": 134032, "epoch": 1614} {"train_loss": -23.030269622802734, "global_step": 134033, "epoch": 1614} {"train_loss": -23.046838760375977, "global_step": 134034, "epoch": 1614} {"train_loss": -23.155563354492188, "global_step": 134035, "epoch": 1614} {"train_loss": -22.777616500854492, "global_step": 134036, "epoch": 1614} {"train_loss": -23.10548973083496, "global_step": 134037, "epoch": 1614} {"train_loss": -23.08904457092285, "global_step": 134038, "epoch": 1614} {"train_loss": -22.882532119750977, "global_step": 134039, "epoch": 1614} {"train_loss": -22.731342315673828, "global_step": 134040, "epoch": 1614} {"train_loss": -22.947696685791016, "global_step": 134041, "epoch": 1614} {"train_loss": -23.104915618896484, "global_step": 134042, "epoch": 1614} {"train_loss": -23.119747161865234, "global_step": 134043, "epoch": 1614} {"train_loss": -22.850732274802333, "global_step": 134044, "epoch": 1614, "val_loss": 6191767.0} {"train_loss": -22.122146606445312, "global_step": 134045, "epoch": 1615} {"train_loss": -22.146209716796875, "global_step": 134046, "epoch": 1615} {"train_loss": -21.780715942382812, "global_step": 134047, "epoch": 1615} {"train_loss": -22.313657760620117, "global_step": 134048, "epoch": 1615} {"train_loss": -22.508922576904297, "global_step": 134049, "epoch": 1615} {"train_loss": -22.44697380065918, "global_step": 134050, "epoch": 1615} {"train_loss": -22.237213134765625, "global_step": 134051, "epoch": 1615} {"train_loss": -22.570268630981445, "global_step": 134052, "epoch": 1615} {"train_loss": -22.438520431518555, "global_step": 134053, "epoch": 1615} {"train_loss": -22.04036521911621, "global_step": 134054, "epoch": 1615} {"train_loss": -22.563262939453125, "global_step": 134055, "epoch": 1615} {"train_loss": -22.67342185974121, "global_step": 134056, "epoch": 1615} {"train_loss": -22.635787963867188, "global_step": 134057, "epoch": 1615} {"train_loss": -22.154190063476562, "global_step": 134058, "epoch": 1615} {"train_loss": -22.416412353515625, "global_step": 134059, "epoch": 1615} {"train_loss": -22.646591186523438, "global_step": 134060, "epoch": 1615} {"train_loss": -22.2857723236084, "global_step": 134061, "epoch": 1615} {"train_loss": -22.557390213012695, "global_step": 134062, "epoch": 1615} {"train_loss": -22.989110946655273, "global_step": 134063, "epoch": 1615} {"train_loss": -22.366357803344727, "global_step": 134064, "epoch": 1615} {"train_loss": -23.2226619720459, "global_step": 134065, "epoch": 1615} {"train_loss": -22.59230613708496, "global_step": 134066, "epoch": 1615} {"train_loss": -22.894901275634766, "global_step": 134067, "epoch": 1615} {"train_loss": -22.628698348999023, "global_step": 134068, "epoch": 1615} {"train_loss": -23.099212646484375, "global_step": 134069, "epoch": 1615} {"train_loss": -22.984302520751953, "global_step": 134070, "epoch": 1615} {"train_loss": -22.691604614257812, "global_step": 134071, "epoch": 1615} {"train_loss": -22.863101959228516, "global_step": 134072, "epoch": 1615} {"train_loss": -22.67112922668457, "global_step": 134073, "epoch": 1615} {"train_loss": -23.087411880493164, "global_step": 134074, "epoch": 1615} {"train_loss": -23.11279296875, "global_step": 134075, "epoch": 1615} {"train_loss": -22.483016967773438, "global_step": 134076, "epoch": 1615} {"train_loss": -22.76704978942871, "global_step": 134077, "epoch": 1615} {"train_loss": -23.03480339050293, "global_step": 134078, "epoch": 1615} {"train_loss": -22.602293014526367, "global_step": 134079, "epoch": 1615} {"train_loss": -23.198415756225586, "global_step": 134080, "epoch": 1615} {"train_loss": -23.1002254486084, "global_step": 134081, "epoch": 1615} {"train_loss": -23.13911247253418, "global_step": 134082, "epoch": 1615} {"train_loss": -23.089916229248047, "global_step": 134083, "epoch": 1615} {"train_loss": -23.21573257446289, "global_step": 134084, "epoch": 1615} {"train_loss": -23.280170440673828, "global_step": 134085, "epoch": 1615} {"train_loss": -23.144514083862305, "global_step": 134086, "epoch": 1615} {"train_loss": -23.010595321655273, "global_step": 134087, "epoch": 1615} {"train_loss": -23.225656509399414, "global_step": 134088, "epoch": 1615} {"train_loss": -22.762096405029297, "global_step": 134089, "epoch": 1615} {"train_loss": -23.09964942932129, "global_step": 134090, "epoch": 1615} {"train_loss": -22.84602928161621, "global_step": 134091, "epoch": 1615} {"train_loss": -22.904617309570312, "global_step": 134092, "epoch": 1615} {"train_loss": -23.101194381713867, "global_step": 134093, "epoch": 1615} {"train_loss": -23.29030418395996, "global_step": 134094, "epoch": 1615} {"train_loss": -23.02823257446289, "global_step": 134095, "epoch": 1615} {"train_loss": -22.65087127685547, "global_step": 134096, "epoch": 1615} {"train_loss": -22.707138061523438, "global_step": 134097, "epoch": 1615} {"train_loss": -22.787872314453125, "global_step": 134098, "epoch": 1615} {"train_loss": -23.079486846923828, "global_step": 134099, "epoch": 1615} {"train_loss": -22.827268600463867, "global_step": 134100, "epoch": 1615} {"train_loss": -22.648366928100586, "global_step": 134101, "epoch": 1615} {"train_loss": -22.761032104492188, "global_step": 134102, "epoch": 1615} {"train_loss": -22.853225708007812, "global_step": 134103, "epoch": 1615} {"train_loss": -22.61745262145996, "global_step": 134104, "epoch": 1615} {"train_loss": -22.580930709838867, "global_step": 134105, "epoch": 1615} {"train_loss": -22.934574127197266, "global_step": 134106, "epoch": 1615} {"train_loss": -23.165599822998047, "global_step": 134107, "epoch": 1615} {"train_loss": -22.96131706237793, "global_step": 134108, "epoch": 1615} {"train_loss": -22.766321182250977, "global_step": 134109, "epoch": 1615} {"train_loss": -22.7873477935791, "global_step": 134110, "epoch": 1615} {"train_loss": -23.233123779296875, "global_step": 134111, "epoch": 1615} {"train_loss": -22.769330978393555, "global_step": 134112, "epoch": 1615} {"train_loss": -22.849637985229492, "global_step": 134113, "epoch": 1615} {"train_loss": -22.9210262298584, "global_step": 134114, "epoch": 1615} {"train_loss": -22.68055534362793, "global_step": 134115, "epoch": 1615} {"train_loss": -22.92784881591797, "global_step": 134116, "epoch": 1615} {"train_loss": -23.290019989013672, "global_step": 134117, "epoch": 1615} {"train_loss": -23.020193099975586, "global_step": 134118, "epoch": 1615} {"train_loss": -22.737079620361328, "global_step": 134119, "epoch": 1615} {"train_loss": -22.856460571289062, "global_step": 134120, "epoch": 1615} {"train_loss": -22.916166305541992, "global_step": 134121, "epoch": 1615} {"train_loss": -22.801483154296875, "global_step": 134122, "epoch": 1615} {"train_loss": -22.906986236572266, "global_step": 134123, "epoch": 1615} {"train_loss": -22.95262908935547, "global_step": 134124, "epoch": 1615} {"train_loss": -23.025793075561523, "global_step": 134125, "epoch": 1615} {"train_loss": -23.148479461669922, "global_step": 134126, "epoch": 1615} {"train_loss": -22.794743135751013, "global_step": 134127, "epoch": 1615, "val_loss": 6365340.0} {"train_loss": -22.196475982666016, "global_step": 134128, "epoch": 1616} {"train_loss": -22.29019546508789, "global_step": 134129, "epoch": 1616} {"train_loss": -22.506591796875, "global_step": 134130, "epoch": 1616} {"train_loss": -22.8348388671875, "global_step": 134131, "epoch": 1616} {"train_loss": -22.3863525390625, "global_step": 134132, "epoch": 1616} {"train_loss": -22.777355194091797, "global_step": 134133, "epoch": 1616} {"train_loss": -22.84657859802246, "global_step": 134134, "epoch": 1616} {"train_loss": -22.774246215820312, "global_step": 134135, "epoch": 1616} {"train_loss": -22.65157127380371, "global_step": 134136, "epoch": 1616} {"train_loss": -22.694616317749023, "global_step": 134137, "epoch": 1616} {"train_loss": -22.863134384155273, "global_step": 134138, "epoch": 1616} {"train_loss": -22.84584617614746, "global_step": 134139, "epoch": 1616} {"train_loss": -22.773895263671875, "global_step": 134140, "epoch": 1616} {"train_loss": -22.480091094970703, "global_step": 134141, "epoch": 1616} {"train_loss": -22.889602661132812, "global_step": 134142, "epoch": 1616} {"train_loss": -22.77998161315918, "global_step": 134143, "epoch": 1616} {"train_loss": -23.027257919311523, "global_step": 134144, "epoch": 1616} {"train_loss": -23.040512084960938, "global_step": 134145, "epoch": 1616} {"train_loss": -23.013757705688477, "global_step": 134146, "epoch": 1616} {"train_loss": -23.067638397216797, "global_step": 134147, "epoch": 1616} {"train_loss": -22.78913688659668, "global_step": 134148, "epoch": 1616} {"train_loss": -22.885133743286133, "global_step": 134149, "epoch": 1616} {"train_loss": -22.936233520507812, "global_step": 134150, "epoch": 1616} {"train_loss": -22.66240119934082, "global_step": 134151, "epoch": 1616} {"train_loss": -22.734830856323242, "global_step": 134152, "epoch": 1616} {"train_loss": -23.224292755126953, "global_step": 134153, "epoch": 1616} {"train_loss": -22.65217399597168, "global_step": 134154, "epoch": 1616} {"train_loss": -22.92588233947754, "global_step": 134155, "epoch": 1616} {"train_loss": -23.08783531188965, "global_step": 134156, "epoch": 1616} {"train_loss": -22.7008113861084, "global_step": 134157, "epoch": 1616} {"train_loss": -23.385211944580078, "global_step": 134158, "epoch": 1616} {"train_loss": -22.930875778198242, "global_step": 134159, "epoch": 1616} {"train_loss": -22.924495697021484, "global_step": 134160, "epoch": 1616} {"train_loss": -22.61207389831543, "global_step": 134161, "epoch": 1616} {"train_loss": -22.668838500976562, "global_step": 134162, "epoch": 1616} {"train_loss": -23.164350509643555, "global_step": 134163, "epoch": 1616} {"train_loss": -22.885272979736328, "global_step": 134164, "epoch": 1616} {"train_loss": -22.81648826599121, "global_step": 134165, "epoch": 1616} {"train_loss": -22.766881942749023, "global_step": 134166, "epoch": 1616} {"train_loss": -23.01997184753418, "global_step": 134167, "epoch": 1616} {"train_loss": -22.940078735351562, "global_step": 134168, "epoch": 1616} {"train_loss": -23.26482391357422, "global_step": 134169, "epoch": 1616} {"train_loss": -22.951614379882812, "global_step": 134170, "epoch": 1616} {"train_loss": -23.073068618774414, "global_step": 134171, "epoch": 1616} {"train_loss": -22.801916122436523, "global_step": 134172, "epoch": 1616} {"train_loss": -22.453107833862305, "global_step": 134173, "epoch": 1616} {"train_loss": -22.706144332885742, "global_step": 134174, "epoch": 1616} {"train_loss": -22.95453453063965, "global_step": 134175, "epoch": 1616} {"train_loss": -22.9542293548584, "global_step": 134176, "epoch": 1616} {"train_loss": -22.792991638183594, "global_step": 134177, "epoch": 1616} {"train_loss": -22.928686141967773, "global_step": 134178, "epoch": 1616} {"train_loss": -22.54353141784668, "global_step": 134179, "epoch": 1616} {"train_loss": -22.714033126831055, "global_step": 134180, "epoch": 1616} {"train_loss": -22.726730346679688, "global_step": 134181, "epoch": 1616} {"train_loss": -22.665685653686523, "global_step": 134182, "epoch": 1616} {"train_loss": -22.832935333251953, "global_step": 134183, "epoch": 1616} {"train_loss": -22.756729125976562, "global_step": 134184, "epoch": 1616} {"train_loss": -22.57880973815918, "global_step": 134185, "epoch": 1616} {"train_loss": -22.891891479492188, "global_step": 134186, "epoch": 1616} {"train_loss": -23.090320587158203, "global_step": 134187, "epoch": 1616} {"train_loss": -23.087331771850586, "global_step": 134188, "epoch": 1616} {"train_loss": -23.025218963623047, "global_step": 134189, "epoch": 1616} {"train_loss": -23.0488338470459, "global_step": 134190, "epoch": 1616} {"train_loss": -23.21026039123535, "global_step": 134191, "epoch": 1616} {"train_loss": -22.759368896484375, "global_step": 134192, "epoch": 1616} {"train_loss": -23.05156898498535, "global_step": 134193, "epoch": 1616} {"train_loss": -23.470563888549805, "global_step": 134194, "epoch": 1616} {"train_loss": -23.000022888183594, "global_step": 134195, "epoch": 1616} {"train_loss": -22.898853302001953, "global_step": 134196, "epoch": 1616} {"train_loss": -22.63612937927246, "global_step": 134197, "epoch": 1616} {"train_loss": -22.972286224365234, "global_step": 134198, "epoch": 1616} {"train_loss": -22.79818344116211, "global_step": 134199, "epoch": 1616} {"train_loss": -22.95688819885254, "global_step": 134200, "epoch": 1616} {"train_loss": -22.98434829711914, "global_step": 134201, "epoch": 1616} {"train_loss": -22.950864791870117, "global_step": 134202, "epoch": 1616} {"train_loss": -23.187795639038086, "global_step": 134203, "epoch": 1616} {"train_loss": -23.164215087890625, "global_step": 134204, "epoch": 1616} {"train_loss": -22.83973503112793, "global_step": 134205, "epoch": 1616} {"train_loss": -23.073461532592773, "global_step": 134206, "epoch": 1616} {"train_loss": -22.91275978088379, "global_step": 134207, "epoch": 1616} {"train_loss": -23.089969635009766, "global_step": 134208, "epoch": 1616} {"train_loss": -23.2128849029541, "global_step": 134209, "epoch": 1616} {"train_loss": -22.866680329104504, "global_step": 134210, "epoch": 1616, "val_loss": 6412203.0} {"train_loss": -22.946338653564453, "global_step": 134211, "epoch": 1617} {"train_loss": -22.387008666992188, "global_step": 134212, "epoch": 1617} {"train_loss": -22.565717697143555, "global_step": 134213, "epoch": 1617} {"train_loss": -22.772687911987305, "global_step": 134214, "epoch": 1617} {"train_loss": -22.722925186157227, "global_step": 134215, "epoch": 1617} {"train_loss": -22.572406768798828, "global_step": 134216, "epoch": 1617} {"train_loss": -22.69217300415039, "global_step": 134217, "epoch": 1617} {"train_loss": -22.601709365844727, "global_step": 134218, "epoch": 1617} {"train_loss": -23.032018661499023, "global_step": 134219, "epoch": 1617} {"train_loss": -22.533740997314453, "global_step": 134220, "epoch": 1617} {"train_loss": -22.459627151489258, "global_step": 134221, "epoch": 1617} {"train_loss": -22.709972381591797, "global_step": 134222, "epoch": 1617} {"train_loss": -22.681873321533203, "global_step": 134223, "epoch": 1617} {"train_loss": -22.744104385375977, "global_step": 134224, "epoch": 1617} {"train_loss": -22.692811965942383, "global_step": 134225, "epoch": 1617} {"train_loss": -22.747182846069336, "global_step": 134226, "epoch": 1617} {"train_loss": -22.682641983032227, "global_step": 134227, "epoch": 1617} {"train_loss": -23.0185604095459, "global_step": 134228, "epoch": 1617} {"train_loss": -22.85062026977539, "global_step": 134229, "epoch": 1617} {"train_loss": -22.800987243652344, "global_step": 134230, "epoch": 1617} {"train_loss": -22.994943618774414, "global_step": 134231, "epoch": 1617} {"train_loss": -22.5146484375, "global_step": 134232, "epoch": 1617} {"train_loss": -22.847105026245117, "global_step": 134233, "epoch": 1617} {"train_loss": -22.84058380126953, "global_step": 134234, "epoch": 1617} {"train_loss": -22.97092628479004, "global_step": 134235, "epoch": 1617} {"train_loss": -23.04222869873047, "global_step": 134236, "epoch": 1617} {"train_loss": -23.29331398010254, "global_step": 134237, "epoch": 1617} {"train_loss": -22.763399124145508, "global_step": 134238, "epoch": 1617} {"train_loss": -22.855253219604492, "global_step": 134239, "epoch": 1617} {"train_loss": -22.718399047851562, "global_step": 134240, "epoch": 1617} {"train_loss": -23.070905685424805, "global_step": 134241, "epoch": 1617} {"train_loss": -22.88314437866211, "global_step": 134242, "epoch": 1617} {"train_loss": -22.827133178710938, "global_step": 134243, "epoch": 1617} {"train_loss": -22.864364624023438, "global_step": 134244, "epoch": 1617} {"train_loss": -22.795202255249023, "global_step": 134245, "epoch": 1617} {"train_loss": -22.89234733581543, "global_step": 134246, "epoch": 1617} {"train_loss": -22.977956771850586, "global_step": 134247, "epoch": 1617} {"train_loss": -22.86666488647461, "global_step": 134248, "epoch": 1617} {"train_loss": -22.948959350585938, "global_step": 134249, "epoch": 1617} {"train_loss": -22.990598678588867, "global_step": 134250, "epoch": 1617} {"train_loss": -23.00518798828125, "global_step": 134251, "epoch": 1617} {"train_loss": -23.161399841308594, "global_step": 134252, "epoch": 1617} {"train_loss": -22.896949768066406, "global_step": 134253, "epoch": 1617} {"train_loss": -22.902353286743164, "global_step": 134254, "epoch": 1617} {"train_loss": -23.011688232421875, "global_step": 134255, "epoch": 1617} {"train_loss": -22.7775821685791, "global_step": 134256, "epoch": 1617} {"train_loss": -23.12355613708496, "global_step": 134257, "epoch": 1617} {"train_loss": -22.267620086669922, "global_step": 134258, "epoch": 1617} {"train_loss": -23.21125602722168, "global_step": 134259, "epoch": 1617} {"train_loss": -22.708322525024414, "global_step": 134260, "epoch": 1617} {"train_loss": -23.010936737060547, "global_step": 134261, "epoch": 1617} {"train_loss": -22.83888816833496, "global_step": 134262, "epoch": 1617} {"train_loss": -23.01416015625, "global_step": 134263, "epoch": 1617} {"train_loss": -22.760974884033203, "global_step": 134264, "epoch": 1617} {"train_loss": -22.73642349243164, "global_step": 134265, "epoch": 1617} {"train_loss": -22.831361770629883, "global_step": 134266, "epoch": 1617} {"train_loss": -22.987390518188477, "global_step": 134267, "epoch": 1617} {"train_loss": -22.5223445892334, "global_step": 134268, "epoch": 1617} {"train_loss": -22.896636962890625, "global_step": 134269, "epoch": 1617} {"train_loss": -22.60047721862793, "global_step": 134270, "epoch": 1617} {"train_loss": -22.995166778564453, "global_step": 134271, "epoch": 1617} {"train_loss": -22.928001403808594, "global_step": 134272, "epoch": 1617} {"train_loss": -23.086647033691406, "global_step": 134273, "epoch": 1617} {"train_loss": -22.838584899902344, "global_step": 134274, "epoch": 1617} {"train_loss": -22.981534957885742, "global_step": 134275, "epoch": 1617} {"train_loss": -22.590534210205078, "global_step": 134276, "epoch": 1617} {"train_loss": -22.523757934570312, "global_step": 134277, "epoch": 1617} {"train_loss": -23.042207717895508, "global_step": 134278, "epoch": 1617} {"train_loss": -22.684371948242188, "global_step": 134279, "epoch": 1617} {"train_loss": -22.817832946777344, "global_step": 134280, "epoch": 1617} {"train_loss": -23.040319442749023, "global_step": 134281, "epoch": 1617} {"train_loss": -22.798620223999023, "global_step": 134282, "epoch": 1617} {"train_loss": -22.848569869995117, "global_step": 134283, "epoch": 1617} {"train_loss": -22.95084571838379, "global_step": 134284, "epoch": 1617} {"train_loss": -23.039594650268555, "global_step": 134285, "epoch": 1617} {"train_loss": -23.301715850830078, "global_step": 134286, "epoch": 1617} {"train_loss": -22.96699333190918, "global_step": 134287, "epoch": 1617} {"train_loss": -23.09939956665039, "global_step": 134288, "epoch": 1617} {"train_loss": -22.65428352355957, "global_step": 134289, "epoch": 1617} {"train_loss": -22.599206924438477, "global_step": 134290, "epoch": 1617} {"train_loss": -22.731515884399414, "global_step": 134291, "epoch": 1617} {"train_loss": -22.754484176635742, "global_step": 134292, "epoch": 1617} {"train_loss": -22.856178835213903, "global_step": 134293, "epoch": 1617, "val_loss": 6322105.0} {"train_loss": -22.170469284057617, "global_step": 134294, "epoch": 1618} {"train_loss": -22.393163681030273, "global_step": 134295, "epoch": 1618} {"train_loss": -22.47502326965332, "global_step": 134296, "epoch": 1618} {"train_loss": -22.30493927001953, "global_step": 134297, "epoch": 1618} {"train_loss": -22.0164852142334, "global_step": 134298, "epoch": 1618} {"train_loss": -22.532855987548828, "global_step": 134299, "epoch": 1618} {"train_loss": -22.513442993164062, "global_step": 134300, "epoch": 1618} {"train_loss": -22.46939468383789, "global_step": 134301, "epoch": 1618} {"train_loss": -22.323314666748047, "global_step": 134302, "epoch": 1618} {"train_loss": -22.651453018188477, "global_step": 134303, "epoch": 1618} {"train_loss": -22.437358856201172, "global_step": 134304, "epoch": 1618} {"train_loss": -22.602567672729492, "global_step": 134305, "epoch": 1618} {"train_loss": -22.85078239440918, "global_step": 134306, "epoch": 1618} {"train_loss": -22.943700790405273, "global_step": 134307, "epoch": 1618} {"train_loss": -23.118072509765625, "global_step": 134308, "epoch": 1618} {"train_loss": -22.559192657470703, "global_step": 134309, "epoch": 1618} {"train_loss": -22.475126266479492, "global_step": 134310, "epoch": 1618} {"train_loss": -22.58209228515625, "global_step": 134311, "epoch": 1618} {"train_loss": -22.875030517578125, "global_step": 134312, "epoch": 1618} {"train_loss": -22.88431739807129, "global_step": 134313, "epoch": 1618} {"train_loss": -22.699384689331055, "global_step": 134314, "epoch": 1618} {"train_loss": -22.602981567382812, "global_step": 134315, "epoch": 1618} {"train_loss": -22.889001846313477, "global_step": 134316, "epoch": 1618} {"train_loss": -22.9491024017334, "global_step": 134317, "epoch": 1618} {"train_loss": -22.799440383911133, "global_step": 134318, "epoch": 1618} {"train_loss": -23.154598236083984, "global_step": 134319, "epoch": 1618} {"train_loss": -22.749774932861328, "global_step": 134320, "epoch": 1618} {"train_loss": -22.412235260009766, "global_step": 134321, "epoch": 1618} {"train_loss": -22.620094299316406, "global_step": 134322, "epoch": 1618} {"train_loss": -22.90545654296875, "global_step": 134323, "epoch": 1618} {"train_loss": -23.075681686401367, "global_step": 134324, "epoch": 1618} {"train_loss": -23.097864151000977, "global_step": 134325, "epoch": 1618} {"train_loss": -22.930002212524414, "global_step": 134326, "epoch": 1618} {"train_loss": -23.12310028076172, "global_step": 134327, "epoch": 1618} {"train_loss": -22.855518341064453, "global_step": 134328, "epoch": 1618} {"train_loss": -23.308696746826172, "global_step": 134329, "epoch": 1618} {"train_loss": -22.678024291992188, "global_step": 134330, "epoch": 1618} {"train_loss": -22.570085525512695, "global_step": 134331, "epoch": 1618} {"train_loss": -22.526487350463867, "global_step": 134332, "epoch": 1618} {"train_loss": -23.151071548461914, "global_step": 134333, "epoch": 1618} {"train_loss": -22.81627082824707, "global_step": 134334, "epoch": 1618} {"train_loss": -22.62131690979004, "global_step": 134335, "epoch": 1618} {"train_loss": -23.057188034057617, "global_step": 134336, "epoch": 1618} {"train_loss": -22.76065444946289, "global_step": 134337, "epoch": 1618} {"train_loss": -22.91633415222168, "global_step": 134338, "epoch": 1618} {"train_loss": -22.825490951538086, "global_step": 134339, "epoch": 1618} {"train_loss": -22.99247932434082, "global_step": 134340, "epoch": 1618} {"train_loss": -22.892135620117188, "global_step": 134341, "epoch": 1618} {"train_loss": -22.7569580078125, "global_step": 134342, "epoch": 1618} {"train_loss": -22.963634490966797, "global_step": 134343, "epoch": 1618} {"train_loss": -22.564847946166992, "global_step": 134344, "epoch": 1618} {"train_loss": -22.557037353515625, "global_step": 134345, "epoch": 1618} {"train_loss": -23.15409278869629, "global_step": 134346, "epoch": 1618} {"train_loss": -23.215713500976562, "global_step": 134347, "epoch": 1618} {"train_loss": -22.919967651367188, "global_step": 134348, "epoch": 1618} {"train_loss": -22.819990158081055, "global_step": 134349, "epoch": 1618} {"train_loss": -22.73748016357422, "global_step": 134350, "epoch": 1618} {"train_loss": -22.933399200439453, "global_step": 134351, "epoch": 1618} {"train_loss": -23.089445114135742, "global_step": 134352, "epoch": 1618} {"train_loss": -23.013647079467773, "global_step": 134353, "epoch": 1618} {"train_loss": -23.008119583129883, "global_step": 134354, "epoch": 1618} {"train_loss": -22.9334774017334, "global_step": 134355, "epoch": 1618} {"train_loss": -22.90777015686035, "global_step": 134356, "epoch": 1618} {"train_loss": -23.00311851501465, "global_step": 134357, "epoch": 1618} {"train_loss": -22.952350616455078, "global_step": 134358, "epoch": 1618} {"train_loss": -22.83880615234375, "global_step": 134359, "epoch": 1618} {"train_loss": -22.74724578857422, "global_step": 134360, "epoch": 1618} {"train_loss": -22.916545867919922, "global_step": 134361, "epoch": 1618} {"train_loss": -23.09756851196289, "global_step": 134362, "epoch": 1618} {"train_loss": -22.81764030456543, "global_step": 134363, "epoch": 1618} {"train_loss": -23.072364807128906, "global_step": 134364, "epoch": 1618} {"train_loss": -22.8227596282959, "global_step": 134365, "epoch": 1618} {"train_loss": -22.591245651245117, "global_step": 134366, "epoch": 1618} {"train_loss": -22.740463256835938, "global_step": 134367, "epoch": 1618} {"train_loss": -22.728761672973633, "global_step": 134368, "epoch": 1618} {"train_loss": -22.899572372436523, "global_step": 134369, "epoch": 1618} {"train_loss": -23.493196487426758, "global_step": 134370, "epoch": 1618} {"train_loss": -23.153661727905273, "global_step": 134371, "epoch": 1618} {"train_loss": -23.046804428100586, "global_step": 134372, "epoch": 1618} {"train_loss": -22.977550506591797, "global_step": 134373, "epoch": 1618} {"train_loss": -23.18938636779785, "global_step": 134374, "epoch": 1618} {"train_loss": -22.73382568359375, "global_step": 134375, "epoch": 1618} {"train_loss": -22.825099002884095, "global_step": 134376, "epoch": 1618, "val_loss": 6274561.0} {"train_loss": -22.03789710998535, "global_step": 134377, "epoch": 1619} {"train_loss": -22.2686710357666, "global_step": 134378, "epoch": 1619} {"train_loss": -22.397489547729492, "global_step": 134379, "epoch": 1619} {"train_loss": -22.54644203186035, "global_step": 134380, "epoch": 1619} {"train_loss": -22.294822692871094, "global_step": 134381, "epoch": 1619} {"train_loss": -22.59215545654297, "global_step": 134382, "epoch": 1619} {"train_loss": -22.128055572509766, "global_step": 134383, "epoch": 1619} {"train_loss": -22.278549194335938, "global_step": 134384, "epoch": 1619} {"train_loss": -22.209131240844727, "global_step": 134385, "epoch": 1619} {"train_loss": -22.551437377929688, "global_step": 134386, "epoch": 1619} {"train_loss": -22.43304443359375, "global_step": 134387, "epoch": 1619} {"train_loss": -22.46552085876465, "global_step": 134388, "epoch": 1619} {"train_loss": -22.6680850982666, "global_step": 134389, "epoch": 1619} {"train_loss": -22.511287689208984, "global_step": 134390, "epoch": 1619} {"train_loss": -22.71549415588379, "global_step": 134391, "epoch": 1619} {"train_loss": -22.596242904663086, "global_step": 134392, "epoch": 1619} {"train_loss": -22.95476722717285, "global_step": 134393, "epoch": 1619} {"train_loss": -23.07793617248535, "global_step": 134394, "epoch": 1619} {"train_loss": -22.912328720092773, "global_step": 134395, "epoch": 1619} {"train_loss": -22.905614852905273, "global_step": 134396, "epoch": 1619} {"train_loss": -22.581518173217773, "global_step": 134397, "epoch": 1619} {"train_loss": -22.81894302368164, "global_step": 134398, "epoch": 1619} {"train_loss": -22.453176498413086, "global_step": 134399, "epoch": 1619} {"train_loss": -23.030323028564453, "global_step": 134400, "epoch": 1619} {"train_loss": -22.896047592163086, "global_step": 134401, "epoch": 1619} {"train_loss": -22.93020248413086, "global_step": 134402, "epoch": 1619} {"train_loss": -22.61406898498535, "global_step": 134403, "epoch": 1619} {"train_loss": -22.435302734375, "global_step": 134404, "epoch": 1619} {"train_loss": -22.840412139892578, "global_step": 134405, "epoch": 1619} {"train_loss": -22.898456573486328, "global_step": 134406, "epoch": 1619} {"train_loss": -23.059720993041992, "global_step": 134407, "epoch": 1619} {"train_loss": -23.037429809570312, "global_step": 134408, "epoch": 1619} {"train_loss": -22.91421127319336, "global_step": 134409, "epoch": 1619} {"train_loss": -22.707029342651367, "global_step": 134410, "epoch": 1619} {"train_loss": -23.023740768432617, "global_step": 134411, "epoch": 1619} {"train_loss": -22.942960739135742, "global_step": 134412, "epoch": 1619} {"train_loss": -23.202613830566406, "global_step": 134413, "epoch": 1619} {"train_loss": -22.88652992248535, "global_step": 134414, "epoch": 1619} {"train_loss": -22.98857879638672, "global_step": 134415, "epoch": 1619} {"train_loss": -22.974912643432617, "global_step": 134416, "epoch": 1619} {"train_loss": -22.81682014465332, "global_step": 134417, "epoch": 1619} {"train_loss": -23.129898071289062, "global_step": 134418, "epoch": 1619} {"train_loss": -22.998441696166992, "global_step": 134419, "epoch": 1619} {"train_loss": -22.81311798095703, "global_step": 134420, "epoch": 1619} {"train_loss": -23.208402633666992, "global_step": 134421, "epoch": 1619} {"train_loss": -23.151439666748047, "global_step": 134422, "epoch": 1619} {"train_loss": -23.03541374206543, "global_step": 134423, "epoch": 1619} {"train_loss": -23.011022567749023, "global_step": 134424, "epoch": 1619} {"train_loss": -23.13221549987793, "global_step": 134425, "epoch": 1619} {"train_loss": -23.004072189331055, "global_step": 134426, "epoch": 1619} {"train_loss": -23.40595817565918, "global_step": 134427, "epoch": 1619} {"train_loss": -23.201932907104492, "global_step": 134428, "epoch": 1619} {"train_loss": -22.8016414642334, "global_step": 134429, "epoch": 1619} {"train_loss": -23.11797332763672, "global_step": 134430, "epoch": 1619} {"train_loss": -22.726041793823242, "global_step": 134431, "epoch": 1619} {"train_loss": -23.072555541992188, "global_step": 134432, "epoch": 1619} {"train_loss": -22.627859115600586, "global_step": 134433, "epoch": 1619} {"train_loss": -22.899200439453125, "global_step": 134434, "epoch": 1619} {"train_loss": -22.873004913330078, "global_step": 134435, "epoch": 1619} {"train_loss": -22.913084030151367, "global_step": 134436, "epoch": 1619} {"train_loss": -22.8745174407959, "global_step": 134437, "epoch": 1619} {"train_loss": -22.9851131439209, "global_step": 134438, "epoch": 1619} {"train_loss": -22.427814483642578, "global_step": 134439, "epoch": 1619} {"train_loss": -22.542348861694336, "global_step": 134440, "epoch": 1619} {"train_loss": -23.189058303833008, "global_step": 134441, "epoch": 1619} {"train_loss": -23.168872833251953, "global_step": 134442, "epoch": 1619} {"train_loss": -22.525379180908203, "global_step": 134443, "epoch": 1619} {"train_loss": -22.886524200439453, "global_step": 134444, "epoch": 1619} {"train_loss": -23.151596069335938, "global_step": 134445, "epoch": 1619} {"train_loss": -22.764604568481445, "global_step": 134446, "epoch": 1619} {"train_loss": -23.142776489257812, "global_step": 134447, "epoch": 1619} {"train_loss": -22.8066463470459, "global_step": 134448, "epoch": 1619} {"train_loss": -22.943777084350586, "global_step": 134449, "epoch": 1619} {"train_loss": -23.01538848876953, "global_step": 134450, "epoch": 1619} {"train_loss": -22.731735229492188, "global_step": 134451, "epoch": 1619} {"train_loss": -22.804651260375977, "global_step": 134452, "epoch": 1619} {"train_loss": -22.675037384033203, "global_step": 134453, "epoch": 1619} {"train_loss": -22.991817474365234, "global_step": 134454, "epoch": 1619} {"train_loss": -22.84511947631836, "global_step": 134455, "epoch": 1619} {"train_loss": -22.58084487915039, "global_step": 134456, "epoch": 1619} {"train_loss": -22.835205078125, "global_step": 134457, "epoch": 1619} {"train_loss": -22.822551727294922, "global_step": 134458, "epoch": 1619} {"train_loss": -22.795352315328206, "global_step": 134459, "epoch": 1619, "val_loss": 6263736.0} {"train_loss": -22.26059913635254, "global_step": 134460, "epoch": 1620} {"train_loss": -22.256149291992188, "global_step": 134461, "epoch": 1620} {"train_loss": -22.656373977661133, "global_step": 134462, "epoch": 1620} {"train_loss": -22.49435043334961, "global_step": 134463, "epoch": 1620} {"train_loss": -22.866498947143555, "global_step": 134464, "epoch": 1620} {"train_loss": -23.060232162475586, "global_step": 134465, "epoch": 1620} {"train_loss": -22.56294059753418, "global_step": 134466, "epoch": 1620} {"train_loss": -22.779014587402344, "global_step": 134467, "epoch": 1620} {"train_loss": -22.960973739624023, "global_step": 134468, "epoch": 1620} {"train_loss": -22.867677688598633, "global_step": 134469, "epoch": 1620} {"train_loss": -22.817764282226562, "global_step": 134470, "epoch": 1620} {"train_loss": -22.7827091217041, "global_step": 134471, "epoch": 1620} {"train_loss": -22.883466720581055, "global_step": 134472, "epoch": 1620} {"train_loss": -23.05072021484375, "global_step": 134473, "epoch": 1620} {"train_loss": -22.847227096557617, "global_step": 134474, "epoch": 1620} {"train_loss": -23.01372718811035, "global_step": 134475, "epoch": 1620} {"train_loss": -22.396554946899414, "global_step": 134476, "epoch": 1620} {"train_loss": -22.943119049072266, "global_step": 134477, "epoch": 1620} {"train_loss": -23.04177474975586, "global_step": 134478, "epoch": 1620} {"train_loss": -22.7325439453125, "global_step": 134479, "epoch": 1620} {"train_loss": -22.856719970703125, "global_step": 134480, "epoch": 1620} {"train_loss": -22.685611724853516, "global_step": 134481, "epoch": 1620} {"train_loss": -22.88119888305664, "global_step": 134482, "epoch": 1620} {"train_loss": -23.008411407470703, "global_step": 134483, "epoch": 1620} {"train_loss": -22.880884170532227, "global_step": 134484, "epoch": 1620} {"train_loss": -22.824569702148438, "global_step": 134485, "epoch": 1620} {"train_loss": -22.71198081970215, "global_step": 134486, "epoch": 1620} {"train_loss": -22.5351505279541, "global_step": 134487, "epoch": 1620} {"train_loss": -22.472867965698242, "global_step": 134488, "epoch": 1620} {"train_loss": -22.988086700439453, "global_step": 134489, "epoch": 1620} {"train_loss": -22.860858917236328, "global_step": 134490, "epoch": 1620} {"train_loss": -22.73932456970215, "global_step": 134491, "epoch": 1620} {"train_loss": -22.81163215637207, "global_step": 134492, "epoch": 1620} {"train_loss": -22.64581871032715, "global_step": 134493, "epoch": 1620} {"train_loss": -22.686542510986328, "global_step": 134494, "epoch": 1620} {"train_loss": -22.80030632019043, "global_step": 134495, "epoch": 1620} {"train_loss": -22.860429763793945, "global_step": 134496, "epoch": 1620} {"train_loss": -22.672433853149414, "global_step": 134497, "epoch": 1620} {"train_loss": -23.355501174926758, "global_step": 134498, "epoch": 1620} {"train_loss": -23.04364013671875, "global_step": 134499, "epoch": 1620} {"train_loss": -23.191925048828125, "global_step": 134500, "epoch": 1620} {"train_loss": -23.14105224609375, "global_step": 134501, "epoch": 1620} {"train_loss": -22.966100692749023, "global_step": 134502, "epoch": 1620} {"train_loss": -23.10834312438965, "global_step": 134503, "epoch": 1620} {"train_loss": -23.01148796081543, "global_step": 134504, "epoch": 1620} {"train_loss": -22.874481201171875, "global_step": 134505, "epoch": 1620} {"train_loss": -22.482778549194336, "global_step": 134506, "epoch": 1620} {"train_loss": -23.118078231811523, "global_step": 134507, "epoch": 1620} {"train_loss": -22.735631942749023, "global_step": 134508, "epoch": 1620} {"train_loss": -22.864578247070312, "global_step": 134509, "epoch": 1620} {"train_loss": -22.598981857299805, "global_step": 134510, "epoch": 1620} {"train_loss": -22.962217330932617, "global_step": 134511, "epoch": 1620} {"train_loss": -23.002456665039062, "global_step": 134512, "epoch": 1620} {"train_loss": -22.954904556274414, "global_step": 134513, "epoch": 1620} {"train_loss": -22.616846084594727, "global_step": 134514, "epoch": 1620} {"train_loss": -23.058185577392578, "global_step": 134515, "epoch": 1620} {"train_loss": -22.883071899414062, "global_step": 134516, "epoch": 1620} {"train_loss": -22.975996017456055, "global_step": 134517, "epoch": 1620} {"train_loss": -22.9498233795166, "global_step": 134518, "epoch": 1620} {"train_loss": -22.770246505737305, "global_step": 134519, "epoch": 1620} {"train_loss": -22.605314254760742, "global_step": 134520, "epoch": 1620} {"train_loss": -23.123414993286133, "global_step": 134521, "epoch": 1620} {"train_loss": -22.978702545166016, "global_step": 134522, "epoch": 1620} {"train_loss": -23.09173011779785, "global_step": 134523, "epoch": 1620} {"train_loss": -22.8103084564209, "global_step": 134524, "epoch": 1620} {"train_loss": -22.9921932220459, "global_step": 134525, "epoch": 1620} {"train_loss": -22.869033813476562, "global_step": 134526, "epoch": 1620} {"train_loss": -23.091981887817383, "global_step": 134527, "epoch": 1620} {"train_loss": -22.955732345581055, "global_step": 134528, "epoch": 1620} {"train_loss": -22.985780715942383, "global_step": 134529, "epoch": 1620} {"train_loss": -23.074615478515625, "global_step": 134530, "epoch": 1620} {"train_loss": -23.151601791381836, "global_step": 134531, "epoch": 1620} {"train_loss": -23.1919002532959, "global_step": 134532, "epoch": 1620} {"train_loss": -23.051353454589844, "global_step": 134533, "epoch": 1620} {"train_loss": -22.8396053314209, "global_step": 134534, "epoch": 1620} {"train_loss": -22.832990646362305, "global_step": 134535, "epoch": 1620} {"train_loss": -22.656774520874023, "global_step": 134536, "epoch": 1620} {"train_loss": -22.9588623046875, "global_step": 134537, "epoch": 1620} {"train_loss": -22.69501495361328, "global_step": 134538, "epoch": 1620} {"train_loss": -22.907594680786133, "global_step": 134539, "epoch": 1620} {"train_loss": -22.80548667907715, "global_step": 134540, "epoch": 1620} {"train_loss": -23.233154296875, "global_step": 134541, "epoch": 1620} {"train_loss": -22.878844962062605, "global_step": 134542, "epoch": 1620, "val_loss": 6431689.0} {"train_loss": -22.84026527404785, "global_step": 134543, "epoch": 1621} {"train_loss": -22.392215728759766, "global_step": 134544, "epoch": 1621} {"train_loss": -22.788259506225586, "global_step": 134545, "epoch": 1621} {"train_loss": -22.735355377197266, "global_step": 134546, "epoch": 1621} {"train_loss": -22.699478149414062, "global_step": 134547, "epoch": 1621} {"train_loss": -23.151912689208984, "global_step": 134548, "epoch": 1621} {"train_loss": -23.004911422729492, "global_step": 134549, "epoch": 1621} {"train_loss": -22.681270599365234, "global_step": 134550, "epoch": 1621} {"train_loss": -22.936567306518555, "global_step": 134551, "epoch": 1621} {"train_loss": -22.964303970336914, "global_step": 134552, "epoch": 1621} {"train_loss": -22.48973274230957, "global_step": 134553, "epoch": 1621} {"train_loss": -22.800495147705078, "global_step": 134554, "epoch": 1621} {"train_loss": -22.87005615234375, "global_step": 134555, "epoch": 1621} {"train_loss": -22.653778076171875, "global_step": 134556, "epoch": 1621} {"train_loss": -22.63917350769043, "global_step": 134557, "epoch": 1621} {"train_loss": -22.7221736907959, "global_step": 134558, "epoch": 1621} {"train_loss": -22.651365280151367, "global_step": 134559, "epoch": 1621} {"train_loss": -23.15382194519043, "global_step": 134560, "epoch": 1621} {"train_loss": -22.657752990722656, "global_step": 134561, "epoch": 1621} {"train_loss": -22.94721031188965, "global_step": 134562, "epoch": 1621} {"train_loss": -23.100780487060547, "global_step": 134563, "epoch": 1621} {"train_loss": -23.209075927734375, "global_step": 134564, "epoch": 1621} {"train_loss": -22.889860153198242, "global_step": 134565, "epoch": 1621} {"train_loss": -23.06900978088379, "global_step": 134566, "epoch": 1621} {"train_loss": -23.1232967376709, "global_step": 134567, "epoch": 1621} {"train_loss": -23.111705780029297, "global_step": 134568, "epoch": 1621} {"train_loss": -22.869497299194336, "global_step": 134569, "epoch": 1621} {"train_loss": -23.050371170043945, "global_step": 134570, "epoch": 1621} {"train_loss": -22.970346450805664, "global_step": 134571, "epoch": 1621} {"train_loss": -22.766511917114258, "global_step": 134572, "epoch": 1621} {"train_loss": -23.06574821472168, "global_step": 134573, "epoch": 1621} {"train_loss": -23.128263473510742, "global_step": 134574, "epoch": 1621} {"train_loss": -22.856674194335938, "global_step": 134575, "epoch": 1621} {"train_loss": -22.82439613342285, "global_step": 134576, "epoch": 1621} {"train_loss": -22.71926498413086, "global_step": 134577, "epoch": 1621} {"train_loss": -23.237241744995117, "global_step": 134578, "epoch": 1621} {"train_loss": -22.982885360717773, "global_step": 134579, "epoch": 1621} {"train_loss": -22.677677154541016, "global_step": 134580, "epoch": 1621} {"train_loss": -22.403600692749023, "global_step": 134581, "epoch": 1621} {"train_loss": -23.21028709411621, "global_step": 134582, "epoch": 1621} {"train_loss": -23.01106834411621, "global_step": 134583, "epoch": 1621} {"train_loss": -22.76399803161621, "global_step": 134584, "epoch": 1621} {"train_loss": -23.554779052734375, "global_step": 134585, "epoch": 1621} {"train_loss": -22.801345825195312, "global_step": 134586, "epoch": 1621} {"train_loss": -22.757030487060547, "global_step": 134587, "epoch": 1621} {"train_loss": -22.832324981689453, "global_step": 134588, "epoch": 1621} {"train_loss": -23.055707931518555, "global_step": 134589, "epoch": 1621} {"train_loss": -23.282033920288086, "global_step": 134590, "epoch": 1621} {"train_loss": -22.918630599975586, "global_step": 134591, "epoch": 1621} {"train_loss": -22.935998916625977, "global_step": 134592, "epoch": 1621} {"train_loss": -22.869300842285156, "global_step": 134593, "epoch": 1621} {"train_loss": -23.263355255126953, "global_step": 134594, "epoch": 1621} {"train_loss": -23.12784767150879, "global_step": 134595, "epoch": 1621} {"train_loss": -23.0086727142334, "global_step": 134596, "epoch": 1621} {"train_loss": -22.821748733520508, "global_step": 134597, "epoch": 1621} {"train_loss": -22.885778427124023, "global_step": 134598, "epoch": 1621} {"train_loss": -22.774585723876953, "global_step": 134599, "epoch": 1621} {"train_loss": -22.717737197875977, "global_step": 134600, "epoch": 1621} {"train_loss": -23.111392974853516, "global_step": 134601, "epoch": 1621} {"train_loss": -23.44659996032715, "global_step": 134602, "epoch": 1621} {"train_loss": -22.99611473083496, "global_step": 134603, "epoch": 1621} {"train_loss": -22.856700897216797, "global_step": 134604, "epoch": 1621} {"train_loss": -22.913238525390625, "global_step": 134605, "epoch": 1621} {"train_loss": -22.981260299682617, "global_step": 134606, "epoch": 1621} {"train_loss": -23.0555419921875, "global_step": 134607, "epoch": 1621} {"train_loss": -22.843887329101562, "global_step": 134608, "epoch": 1621} {"train_loss": -23.015579223632812, "global_step": 134609, "epoch": 1621} {"train_loss": -22.906719207763672, "global_step": 134610, "epoch": 1621} {"train_loss": -22.93081283569336, "global_step": 134611, "epoch": 1621} {"train_loss": -23.293560028076172, "global_step": 134612, "epoch": 1621} {"train_loss": -23.07501792907715, "global_step": 134613, "epoch": 1621} {"train_loss": -22.81109046936035, "global_step": 134614, "epoch": 1621} {"train_loss": -23.2344970703125, "global_step": 134615, "epoch": 1621} {"train_loss": -23.072341918945312, "global_step": 134616, "epoch": 1621} {"train_loss": -22.814128875732422, "global_step": 134617, "epoch": 1621} {"train_loss": -22.658227920532227, "global_step": 134618, "epoch": 1621} {"train_loss": -22.700687408447266, "global_step": 134619, "epoch": 1621} {"train_loss": -22.95041275024414, "global_step": 134620, "epoch": 1621} {"train_loss": -22.88612937927246, "global_step": 134621, "epoch": 1621} {"train_loss": -22.93375015258789, "global_step": 134622, "epoch": 1621} {"train_loss": -22.780832290649414, "global_step": 134623, "epoch": 1621} {"train_loss": -22.54153060913086, "global_step": 134624, "epoch": 1621} {"train_loss": -22.926843758088996, "global_step": 134625, "epoch": 1621, "val_loss": 6192189.0} {"train_loss": -22.689176559448242, "global_step": 134626, "epoch": 1622} {"train_loss": -22.274768829345703, "global_step": 134627, "epoch": 1622} {"train_loss": -22.02878761291504, "global_step": 134628, "epoch": 1622} {"train_loss": -22.435022354125977, "global_step": 134629, "epoch": 1622} {"train_loss": -22.4750919342041, "global_step": 134630, "epoch": 1622} {"train_loss": -22.983257293701172, "global_step": 134631, "epoch": 1622} {"train_loss": -22.911575317382812, "global_step": 134632, "epoch": 1622} {"train_loss": -23.03450584411621, "global_step": 134633, "epoch": 1622} {"train_loss": -22.620101928710938, "global_step": 134634, "epoch": 1622} {"train_loss": -22.324615478515625, "global_step": 134635, "epoch": 1622} {"train_loss": -22.529497146606445, "global_step": 134636, "epoch": 1622} {"train_loss": -22.59764289855957, "global_step": 134637, "epoch": 1622} {"train_loss": -22.674976348876953, "global_step": 134638, "epoch": 1622} {"train_loss": -23.010526657104492, "global_step": 134639, "epoch": 1622} {"train_loss": -23.01865005493164, "global_step": 134640, "epoch": 1622} {"train_loss": -22.862060546875, "global_step": 134641, "epoch": 1622} {"train_loss": -22.743453979492188, "global_step": 134642, "epoch": 1622} {"train_loss": -22.815420150756836, "global_step": 134643, "epoch": 1622} {"train_loss": -22.901874542236328, "global_step": 134644, "epoch": 1622} {"train_loss": -22.945363998413086, "global_step": 134645, "epoch": 1622} {"train_loss": -22.793508529663086, "global_step": 134646, "epoch": 1622} {"train_loss": -23.030441284179688, "global_step": 134647, "epoch": 1622} {"train_loss": -22.92742347717285, "global_step": 134648, "epoch": 1622} {"train_loss": -23.015207290649414, "global_step": 134649, "epoch": 1622} {"train_loss": -22.997238159179688, "global_step": 134650, "epoch": 1622} {"train_loss": -22.97538948059082, "global_step": 134651, "epoch": 1622} {"train_loss": -23.28388023376465, "global_step": 134652, "epoch": 1622} {"train_loss": -22.78169822692871, "global_step": 134653, "epoch": 1622} {"train_loss": -22.69901466369629, "global_step": 134654, "epoch": 1622} {"train_loss": -22.912647247314453, "global_step": 134655, "epoch": 1622} {"train_loss": -22.885419845581055, "global_step": 134656, "epoch": 1622} {"train_loss": -22.903793334960938, "global_step": 134657, "epoch": 1622} {"train_loss": -22.706897735595703, "global_step": 134658, "epoch": 1622} {"train_loss": -22.636341094970703, "global_step": 134659, "epoch": 1622} {"train_loss": -22.789426803588867, "global_step": 134660, "epoch": 1622} {"train_loss": -22.43167495727539, "global_step": 134661, "epoch": 1622} {"train_loss": -22.967512130737305, "global_step": 134662, "epoch": 1622} {"train_loss": -23.11927604675293, "global_step": 134663, "epoch": 1622} {"train_loss": -22.67561912536621, "global_step": 134664, "epoch": 1622} {"train_loss": -22.736330032348633, "global_step": 134665, "epoch": 1622} {"train_loss": -23.02125358581543, "global_step": 134666, "epoch": 1622} {"train_loss": -22.838165283203125, "global_step": 134667, "epoch": 1622} {"train_loss": -22.69197654724121, "global_step": 134668, "epoch": 1622} {"train_loss": -23.021879196166992, "global_step": 134669, "epoch": 1622} {"train_loss": -23.130659103393555, "global_step": 134670, "epoch": 1622} {"train_loss": -23.283300399780273, "global_step": 134671, "epoch": 1622} {"train_loss": -23.10603141784668, "global_step": 134672, "epoch": 1622} {"train_loss": -23.05437469482422, "global_step": 134673, "epoch": 1622} {"train_loss": -22.828031539916992, "global_step": 134674, "epoch": 1622} {"train_loss": -23.249927520751953, "global_step": 134675, "epoch": 1622} {"train_loss": -23.046537399291992, "global_step": 134676, "epoch": 1622} {"train_loss": -23.195871353149414, "global_step": 134677, "epoch": 1622} {"train_loss": -23.038244247436523, "global_step": 134678, "epoch": 1622} {"train_loss": -23.16522789001465, "global_step": 134679, "epoch": 1622} {"train_loss": -23.32400894165039, "global_step": 134680, "epoch": 1622} {"train_loss": -22.42669105529785, "global_step": 134681, "epoch": 1622} {"train_loss": -22.772489547729492, "global_step": 134682, "epoch": 1622} {"train_loss": -22.97138786315918, "global_step": 134683, "epoch": 1622} {"train_loss": -22.792510986328125, "global_step": 134684, "epoch": 1622} {"train_loss": -22.6333065032959, "global_step": 134685, "epoch": 1622} {"train_loss": -23.1351375579834, "global_step": 134686, "epoch": 1622} {"train_loss": -22.993894577026367, "global_step": 134687, "epoch": 1622} {"train_loss": -22.42915153503418, "global_step": 134688, "epoch": 1622} {"train_loss": -22.857107162475586, "global_step": 134689, "epoch": 1622} {"train_loss": -23.104421615600586, "global_step": 134690, "epoch": 1622} {"train_loss": -22.89759635925293, "global_step": 134691, "epoch": 1622} {"train_loss": -23.055410385131836, "global_step": 134692, "epoch": 1622} {"train_loss": -23.371295928955078, "global_step": 134693, "epoch": 1622} {"train_loss": -22.9639949798584, "global_step": 134694, "epoch": 1622} {"train_loss": -23.022205352783203, "global_step": 134695, "epoch": 1622} {"train_loss": -22.62285804748535, "global_step": 134696, "epoch": 1622} {"train_loss": -23.324146270751953, "global_step": 134697, "epoch": 1622} {"train_loss": -22.80487632751465, "global_step": 134698, "epoch": 1622} {"train_loss": -22.853408813476562, "global_step": 134699, "epoch": 1622} {"train_loss": -22.802682876586914, "global_step": 134700, "epoch": 1622} {"train_loss": -22.425094604492188, "global_step": 134701, "epoch": 1622} {"train_loss": -22.89550018310547, "global_step": 134702, "epoch": 1622} {"train_loss": -22.85892105102539, "global_step": 134703, "epoch": 1622} {"train_loss": -22.713865280151367, "global_step": 134704, "epoch": 1622} {"train_loss": -22.90143394470215, "global_step": 134705, "epoch": 1622} {"train_loss": -23.015853881835938, "global_step": 134706, "epoch": 1622} {"train_loss": -22.888294219970703, "global_step": 134707, "epoch": 1622} {"train_loss": -22.87711828300752, "global_step": 134708, "epoch": 1622, "val_loss": 6303795.0} {"train_loss": -22.40254020690918, "global_step": 134709, "epoch": 1623} {"train_loss": -21.406354904174805, "global_step": 134710, "epoch": 1623} {"train_loss": -22.373579025268555, "global_step": 134711, "epoch": 1623} {"train_loss": -22.311983108520508, "global_step": 134712, "epoch": 1623} {"train_loss": -22.08902931213379, "global_step": 134713, "epoch": 1623} {"train_loss": -22.32869529724121, "global_step": 134714, "epoch": 1623} {"train_loss": -22.68769645690918, "global_step": 134715, "epoch": 1623} {"train_loss": -22.043750762939453, "global_step": 134716, "epoch": 1623} {"train_loss": -22.564674377441406, "global_step": 134717, "epoch": 1623} {"train_loss": -22.43317985534668, "global_step": 134718, "epoch": 1623} {"train_loss": -22.999919891357422, "global_step": 134719, "epoch": 1623} {"train_loss": -22.853803634643555, "global_step": 134720, "epoch": 1623} {"train_loss": -22.625295639038086, "global_step": 134721, "epoch": 1623} {"train_loss": -22.513864517211914, "global_step": 134722, "epoch": 1623} {"train_loss": -22.609800338745117, "global_step": 134723, "epoch": 1623} {"train_loss": -22.443485260009766, "global_step": 134724, "epoch": 1623} {"train_loss": -22.322874069213867, "global_step": 134725, "epoch": 1623} {"train_loss": -22.865100860595703, "global_step": 134726, "epoch": 1623} {"train_loss": -22.794170379638672, "global_step": 134727, "epoch": 1623} {"train_loss": -22.897390365600586, "global_step": 134728, "epoch": 1623} {"train_loss": -22.53030014038086, "global_step": 134729, "epoch": 1623} {"train_loss": -22.898672103881836, "global_step": 134730, "epoch": 1623} {"train_loss": -22.850889205932617, "global_step": 134731, "epoch": 1623} {"train_loss": -23.09607696533203, "global_step": 134732, "epoch": 1623} {"train_loss": -22.89149284362793, "global_step": 134733, "epoch": 1623} {"train_loss": -22.768287658691406, "global_step": 134734, "epoch": 1623} {"train_loss": -22.93149757385254, "global_step": 134735, "epoch": 1623} {"train_loss": -22.86406898498535, "global_step": 134736, "epoch": 1623} {"train_loss": -22.995344161987305, "global_step": 134737, "epoch": 1623} {"train_loss": -23.1854248046875, "global_step": 134738, "epoch": 1623} {"train_loss": -23.075639724731445, "global_step": 134739, "epoch": 1623} {"train_loss": -22.765790939331055, "global_step": 134740, "epoch": 1623} {"train_loss": -22.799985885620117, "global_step": 134741, "epoch": 1623} {"train_loss": -22.93903923034668, "global_step": 134742, "epoch": 1623} {"train_loss": -22.8796443939209, "global_step": 134743, "epoch": 1623} {"train_loss": -22.745010375976562, "global_step": 134744, "epoch": 1623} {"train_loss": -23.01169776916504, "global_step": 134745, "epoch": 1623} {"train_loss": -23.07032585144043, "global_step": 134746, "epoch": 1623} {"train_loss": -22.87044906616211, "global_step": 134747, "epoch": 1623} {"train_loss": -23.111570358276367, "global_step": 134748, "epoch": 1623} {"train_loss": -22.56403923034668, "global_step": 134749, "epoch": 1623} {"train_loss": -23.12057876586914, "global_step": 134750, "epoch": 1623} {"train_loss": -22.87765121459961, "global_step": 134751, "epoch": 1623} {"train_loss": -23.291858673095703, "global_step": 134752, "epoch": 1623} {"train_loss": -22.998594284057617, "global_step": 134753, "epoch": 1623} {"train_loss": -22.746673583984375, "global_step": 134754, "epoch": 1623} {"train_loss": -22.9054012298584, "global_step": 134755, "epoch": 1623} {"train_loss": -23.193601608276367, "global_step": 134756, "epoch": 1623} {"train_loss": -23.02425193786621, "global_step": 134757, "epoch": 1623} {"train_loss": -23.48809242248535, "global_step": 134758, "epoch": 1623} {"train_loss": -22.82080078125, "global_step": 134759, "epoch": 1623} {"train_loss": -23.184656143188477, "global_step": 134760, "epoch": 1623} {"train_loss": -23.100645065307617, "global_step": 134761, "epoch": 1623} {"train_loss": -23.069791793823242, "global_step": 134762, "epoch": 1623} {"train_loss": -23.241575241088867, "global_step": 134763, "epoch": 1623} {"train_loss": -22.73943328857422, "global_step": 134764, "epoch": 1623} {"train_loss": -22.796232223510742, "global_step": 134765, "epoch": 1623} {"train_loss": -23.07840347290039, "global_step": 134766, "epoch": 1623} {"train_loss": -22.9311466217041, "global_step": 134767, "epoch": 1623} {"train_loss": -23.012319564819336, "global_step": 134768, "epoch": 1623} {"train_loss": -22.775856018066406, "global_step": 134769, "epoch": 1623} {"train_loss": -23.070831298828125, "global_step": 134770, "epoch": 1623} {"train_loss": -23.052274703979492, "global_step": 134771, "epoch": 1623} {"train_loss": -22.904104232788086, "global_step": 134772, "epoch": 1623} {"train_loss": -22.755422592163086, "global_step": 134773, "epoch": 1623} {"train_loss": -22.859943389892578, "global_step": 134774, "epoch": 1623} {"train_loss": -22.591150283813477, "global_step": 134775, "epoch": 1623} {"train_loss": -22.878522872924805, "global_step": 134776, "epoch": 1623} {"train_loss": -22.866294860839844, "global_step": 134777, "epoch": 1623} {"train_loss": -22.706253051757812, "global_step": 134778, "epoch": 1623} {"train_loss": -22.974308013916016, "global_step": 134779, "epoch": 1623} {"train_loss": -22.66876220703125, "global_step": 134780, "epoch": 1623} {"train_loss": -22.877517700195312, "global_step": 134781, "epoch": 1623} {"train_loss": -23.021400451660156, "global_step": 134782, "epoch": 1623} {"train_loss": -22.81259536743164, "global_step": 134783, "epoch": 1623} {"train_loss": -23.130346298217773, "global_step": 134784, "epoch": 1623} {"train_loss": -22.79219627380371, "global_step": 134785, "epoch": 1623} {"train_loss": -22.891820907592773, "global_step": 134786, "epoch": 1623} {"train_loss": -23.148839950561523, "global_step": 134787, "epoch": 1623} {"train_loss": -22.90635871887207, "global_step": 134788, "epoch": 1623} {"train_loss": -23.289289474487305, "global_step": 134789, "epoch": 1623} {"train_loss": -23.019062042236328, "global_step": 134790, "epoch": 1623} {"train_loss": -22.827899450279144, "global_step": 134791, "epoch": 1623, "val_loss": 6297854.0} {"train_loss": -22.43666648864746, "global_step": 134792, "epoch": 1624} {"train_loss": -21.945514678955078, "global_step": 134793, "epoch": 1624} {"train_loss": -22.430906295776367, "global_step": 134794, "epoch": 1624} {"train_loss": -22.192790985107422, "global_step": 134795, "epoch": 1624} {"train_loss": -22.4229736328125, "global_step": 134796, "epoch": 1624} {"train_loss": -22.43239402770996, "global_step": 134797, "epoch": 1624} {"train_loss": -22.20766830444336, "global_step": 134798, "epoch": 1624} {"train_loss": -22.467178344726562, "global_step": 134799, "epoch": 1624} {"train_loss": -22.681812286376953, "global_step": 134800, "epoch": 1624} {"train_loss": -22.74359893798828, "global_step": 134801, "epoch": 1624} {"train_loss": -22.6317195892334, "global_step": 134802, "epoch": 1624} {"train_loss": -22.651086807250977, "global_step": 134803, "epoch": 1624} {"train_loss": -22.74810791015625, "global_step": 134804, "epoch": 1624} {"train_loss": -22.54922103881836, "global_step": 134805, "epoch": 1624} {"train_loss": -22.493194580078125, "global_step": 134806, "epoch": 1624} {"train_loss": -22.83272933959961, "global_step": 134807, "epoch": 1624} {"train_loss": -22.734384536743164, "global_step": 134808, "epoch": 1624} {"train_loss": -22.334943771362305, "global_step": 134809, "epoch": 1624} {"train_loss": -23.34779930114746, "global_step": 134810, "epoch": 1624} {"train_loss": -22.6815185546875, "global_step": 134811, "epoch": 1624} {"train_loss": -22.48979949951172, "global_step": 134812, "epoch": 1624} {"train_loss": -22.883621215820312, "global_step": 134813, "epoch": 1624} {"train_loss": -22.90985107421875, "global_step": 134814, "epoch": 1624} {"train_loss": -22.915863037109375, "global_step": 134815, "epoch": 1624} {"train_loss": -22.724905014038086, "global_step": 134816, "epoch": 1624} {"train_loss": -22.942947387695312, "global_step": 134817, "epoch": 1624} {"train_loss": -22.85811424255371, "global_step": 134818, "epoch": 1624} {"train_loss": -23.243803024291992, "global_step": 134819, "epoch": 1624} {"train_loss": -22.697240829467773, "global_step": 134820, "epoch": 1624} {"train_loss": -22.86417007446289, "global_step": 134821, "epoch": 1624} {"train_loss": -22.90921401977539, "global_step": 134822, "epoch": 1624} {"train_loss": -23.07039451599121, "global_step": 134823, "epoch": 1624} {"train_loss": -22.881235122680664, "global_step": 134824, "epoch": 1624} {"train_loss": -22.829771041870117, "global_step": 134825, "epoch": 1624} {"train_loss": -22.54856300354004, "global_step": 134826, "epoch": 1624} {"train_loss": -23.101608276367188, "global_step": 134827, "epoch": 1624} {"train_loss": -22.98383140563965, "global_step": 134828, "epoch": 1624} {"train_loss": -23.24957275390625, "global_step": 134829, "epoch": 1624} {"train_loss": -22.894994735717773, "global_step": 134830, "epoch": 1624} {"train_loss": -22.91035270690918, "global_step": 134831, "epoch": 1624} {"train_loss": -22.88909912109375, "global_step": 134832, "epoch": 1624} {"train_loss": -23.09914207458496, "global_step": 134833, "epoch": 1624} {"train_loss": -23.141416549682617, "global_step": 134834, "epoch": 1624} {"train_loss": -22.870725631713867, "global_step": 134835, "epoch": 1624} {"train_loss": -22.929258346557617, "global_step": 134836, "epoch": 1624} {"train_loss": -23.267627716064453, "global_step": 134837, "epoch": 1624} {"train_loss": -22.931623458862305, "global_step": 134838, "epoch": 1624} {"train_loss": -23.233854293823242, "global_step": 134839, "epoch": 1624} {"train_loss": -22.922269821166992, "global_step": 134840, "epoch": 1624} {"train_loss": -22.862442016601562, "global_step": 134841, "epoch": 1624} {"train_loss": -22.685855865478516, "global_step": 134842, "epoch": 1624} {"train_loss": -21.740934371948242, "global_step": 134843, "epoch": 1624} {"train_loss": -22.605857849121094, "global_step": 134844, "epoch": 1624} {"train_loss": -22.645328521728516, "global_step": 134845, "epoch": 1624} {"train_loss": -23.003665924072266, "global_step": 134846, "epoch": 1624} {"train_loss": -22.7030029296875, "global_step": 134847, "epoch": 1624} {"train_loss": -22.53143882751465, "global_step": 134848, "epoch": 1624} {"train_loss": -23.509275436401367, "global_step": 134849, "epoch": 1624} {"train_loss": -22.672576904296875, "global_step": 134850, "epoch": 1624} {"train_loss": -22.83672523498535, "global_step": 134851, "epoch": 1624} {"train_loss": -22.94776725769043, "global_step": 134852, "epoch": 1624} {"train_loss": -23.189910888671875, "global_step": 134853, "epoch": 1624} {"train_loss": -23.046987533569336, "global_step": 134854, "epoch": 1624} {"train_loss": -22.84527015686035, "global_step": 134855, "epoch": 1624} {"train_loss": -22.872196197509766, "global_step": 134856, "epoch": 1624} {"train_loss": -22.958850860595703, "global_step": 134857, "epoch": 1624} {"train_loss": -22.61130714416504, "global_step": 134858, "epoch": 1624} {"train_loss": -23.199426651000977, "global_step": 134859, "epoch": 1624} {"train_loss": -23.017663955688477, "global_step": 134860, "epoch": 1624} {"train_loss": -23.117307662963867, "global_step": 134861, "epoch": 1624} {"train_loss": -22.960744857788086, "global_step": 134862, "epoch": 1624} {"train_loss": -22.820775985717773, "global_step": 134863, "epoch": 1624} {"train_loss": -22.927494049072266, "global_step": 134864, "epoch": 1624} {"train_loss": -22.925350189208984, "global_step": 134865, "epoch": 1624} {"train_loss": -23.148731231689453, "global_step": 134866, "epoch": 1624} {"train_loss": -23.006271362304688, "global_step": 134867, "epoch": 1624} {"train_loss": -22.657140731811523, "global_step": 134868, "epoch": 1624} {"train_loss": -22.693115234375, "global_step": 134869, "epoch": 1624} {"train_loss": -22.538793563842773, "global_step": 134870, "epoch": 1624} {"train_loss": -22.633466720581055, "global_step": 134871, "epoch": 1624} {"train_loss": -23.095203399658203, "global_step": 134872, "epoch": 1624} {"train_loss": -22.695371627807617, "global_step": 134873, "epoch": 1624} {"train_loss": -22.795873550047357, "global_step": 134874, "epoch": 1624, "val_loss": 6168161.5} {"train_loss": -22.726083755493164, "global_step": 134875, "epoch": 1625} {"train_loss": -22.635791778564453, "global_step": 134876, "epoch": 1625} {"train_loss": -22.712398529052734, "global_step": 134877, "epoch": 1625} {"train_loss": -22.437665939331055, "global_step": 134878, "epoch": 1625} {"train_loss": -22.668249130249023, "global_step": 134879, "epoch": 1625} {"train_loss": -22.74338150024414, "global_step": 134880, "epoch": 1625} {"train_loss": -23.20729637145996, "global_step": 134881, "epoch": 1625} {"train_loss": -22.428237915039062, "global_step": 134882, "epoch": 1625} {"train_loss": -23.113004684448242, "global_step": 134883, "epoch": 1625} {"train_loss": -23.005722045898438, "global_step": 134884, "epoch": 1625} {"train_loss": -22.665483474731445, "global_step": 134885, "epoch": 1625} {"train_loss": -23.081377029418945, "global_step": 134886, "epoch": 1625} {"train_loss": -23.20363426208496, "global_step": 134887, "epoch": 1625} {"train_loss": -22.91691017150879, "global_step": 134888, "epoch": 1625} {"train_loss": -22.812036514282227, "global_step": 134889, "epoch": 1625} {"train_loss": -22.65114402770996, "global_step": 134890, "epoch": 1625} {"train_loss": -22.86838722229004, "global_step": 134891, "epoch": 1625} {"train_loss": -23.188230514526367, "global_step": 134892, "epoch": 1625} {"train_loss": -22.9498348236084, "global_step": 134893, "epoch": 1625} {"train_loss": -23.12647247314453, "global_step": 134894, "epoch": 1625} {"train_loss": -22.738739013671875, "global_step": 134895, "epoch": 1625} {"train_loss": -22.97547721862793, "global_step": 134896, "epoch": 1625} {"train_loss": -22.717283248901367, "global_step": 134897, "epoch": 1625} {"train_loss": -23.07465362548828, "global_step": 134898, "epoch": 1625} {"train_loss": -23.108915328979492, "global_step": 134899, "epoch": 1625} {"train_loss": -22.758583068847656, "global_step": 134900, "epoch": 1625} {"train_loss": -22.918874740600586, "global_step": 134901, "epoch": 1625} {"train_loss": -23.010507583618164, "global_step": 134902, "epoch": 1625} {"train_loss": -22.970746994018555, "global_step": 134903, "epoch": 1625} {"train_loss": -22.74086570739746, "global_step": 134904, "epoch": 1625} {"train_loss": -22.792478561401367, "global_step": 134905, "epoch": 1625} {"train_loss": -23.08218002319336, "global_step": 134906, "epoch": 1625} {"train_loss": -23.318998336791992, "global_step": 134907, "epoch": 1625} {"train_loss": -23.16241455078125, "global_step": 134908, "epoch": 1625} {"train_loss": -22.99075698852539, "global_step": 134909, "epoch": 1625} {"train_loss": -22.738845825195312, "global_step": 134910, "epoch": 1625} {"train_loss": -23.102920532226562, "global_step": 134911, "epoch": 1625} {"train_loss": -22.490461349487305, "global_step": 134912, "epoch": 1625} {"train_loss": -22.570571899414062, "global_step": 134913, "epoch": 1625} {"train_loss": -22.83271598815918, "global_step": 134914, "epoch": 1625} {"train_loss": -22.832767486572266, "global_step": 134915, "epoch": 1625} {"train_loss": -22.610733032226562, "global_step": 134916, "epoch": 1625} {"train_loss": -22.791616439819336, "global_step": 134917, "epoch": 1625} {"train_loss": -23.042734146118164, "global_step": 134918, "epoch": 1625} {"train_loss": -22.718273162841797, "global_step": 134919, "epoch": 1625} {"train_loss": -23.053808212280273, "global_step": 134920, "epoch": 1625} {"train_loss": -22.652267456054688, "global_step": 134921, "epoch": 1625} {"train_loss": -22.78617286682129, "global_step": 134922, "epoch": 1625} {"train_loss": -22.669347763061523, "global_step": 134923, "epoch": 1625} {"train_loss": -22.731000900268555, "global_step": 134924, "epoch": 1625} {"train_loss": -22.629714965820312, "global_step": 134925, "epoch": 1625} {"train_loss": -22.65079689025879, "global_step": 134926, "epoch": 1625} {"train_loss": -22.698558807373047, "global_step": 134927, "epoch": 1625} {"train_loss": -22.83047866821289, "global_step": 134928, "epoch": 1625} {"train_loss": -22.812637329101562, "global_step": 134929, "epoch": 1625} {"train_loss": -23.192190170288086, "global_step": 134930, "epoch": 1625} {"train_loss": -22.67085838317871, "global_step": 134931, "epoch": 1625} {"train_loss": -22.976146697998047, "global_step": 134932, "epoch": 1625} {"train_loss": -22.805469512939453, "global_step": 134933, "epoch": 1625} {"train_loss": -22.920713424682617, "global_step": 134934, "epoch": 1625} {"train_loss": -22.637338638305664, "global_step": 134935, "epoch": 1625} {"train_loss": -22.672758102416992, "global_step": 134936, "epoch": 1625} {"train_loss": -22.991159439086914, "global_step": 134937, "epoch": 1625} {"train_loss": -23.3116397857666, "global_step": 134938, "epoch": 1625} {"train_loss": -23.097732543945312, "global_step": 134939, "epoch": 1625} {"train_loss": -23.026859283447266, "global_step": 134940, "epoch": 1625} {"train_loss": -22.727584838867188, "global_step": 134941, "epoch": 1625} {"train_loss": -23.351886749267578, "global_step": 134942, "epoch": 1625} {"train_loss": -22.76236343383789, "global_step": 134943, "epoch": 1625} {"train_loss": -22.9869441986084, "global_step": 134944, "epoch": 1625} {"train_loss": -23.050474166870117, "global_step": 134945, "epoch": 1625} {"train_loss": -23.11393165588379, "global_step": 134946, "epoch": 1625} {"train_loss": -22.577255249023438, "global_step": 134947, "epoch": 1625} {"train_loss": -22.939538955688477, "global_step": 134948, "epoch": 1625} {"train_loss": -23.239267349243164, "global_step": 134949, "epoch": 1625} {"train_loss": -22.931045532226562, "global_step": 134950, "epoch": 1625} {"train_loss": -22.926429748535156, "global_step": 134951, "epoch": 1625} {"train_loss": -22.548629760742188, "global_step": 134952, "epoch": 1625} {"train_loss": -23.18433952331543, "global_step": 134953, "epoch": 1625} {"train_loss": -22.971202850341797, "global_step": 134954, "epoch": 1625} {"train_loss": -22.795095443725586, "global_step": 134955, "epoch": 1625} {"train_loss": -22.715742111206055, "global_step": 134956, "epoch": 1625} {"train_loss": -22.8758487471615, "global_step": 134957, "epoch": 1625, "val_loss": 6285940.0} {"train_loss": -22.2797794342041, "global_step": 134958, "epoch": 1626} {"train_loss": -22.45334243774414, "global_step": 134959, "epoch": 1626} {"train_loss": -21.978010177612305, "global_step": 134960, "epoch": 1626} {"train_loss": -23.13091468811035, "global_step": 134961, "epoch": 1626} {"train_loss": -22.353879928588867, "global_step": 134962, "epoch": 1626} {"train_loss": -22.346586227416992, "global_step": 134963, "epoch": 1626} {"train_loss": -22.71185302734375, "global_step": 134964, "epoch": 1626} {"train_loss": -22.641071319580078, "global_step": 134965, "epoch": 1626} {"train_loss": -22.664411544799805, "global_step": 134966, "epoch": 1626} {"train_loss": -22.856149673461914, "global_step": 134967, "epoch": 1626} {"train_loss": -22.367795944213867, "global_step": 134968, "epoch": 1626} {"train_loss": -22.683612823486328, "global_step": 134969, "epoch": 1626} {"train_loss": -22.529850006103516, "global_step": 134970, "epoch": 1626} {"train_loss": -22.838748931884766, "global_step": 134971, "epoch": 1626} {"train_loss": -22.59210205078125, "global_step": 134972, "epoch": 1626} {"train_loss": -22.84066390991211, "global_step": 134973, "epoch": 1626} {"train_loss": -22.703271865844727, "global_step": 134974, "epoch": 1626} {"train_loss": -22.93520164489746, "global_step": 134975, "epoch": 1626} {"train_loss": -23.06587028503418, "global_step": 134976, "epoch": 1626} {"train_loss": -22.689302444458008, "global_step": 134977, "epoch": 1626} {"train_loss": -23.091541290283203, "global_step": 134978, "epoch": 1626} {"train_loss": -22.770751953125, "global_step": 134979, "epoch": 1626} {"train_loss": -22.88309669494629, "global_step": 134980, "epoch": 1626} {"train_loss": -22.54859161376953, "global_step": 134981, "epoch": 1626} {"train_loss": -23.093778610229492, "global_step": 134982, "epoch": 1626} {"train_loss": -22.445022583007812, "global_step": 134983, "epoch": 1626} {"train_loss": -22.940814971923828, "global_step": 134984, "epoch": 1626} {"train_loss": -23.041170120239258, "global_step": 134985, "epoch": 1626} {"train_loss": -23.083173751831055, "global_step": 134986, "epoch": 1626} {"train_loss": -22.834447860717773, "global_step": 134987, "epoch": 1626} {"train_loss": -22.91655921936035, "global_step": 134988, "epoch": 1626} {"train_loss": -22.84230613708496, "global_step": 134989, "epoch": 1626} {"train_loss": -22.77193832397461, "global_step": 134990, "epoch": 1626} {"train_loss": -22.984317779541016, "global_step": 134991, "epoch": 1626} {"train_loss": -23.085981369018555, "global_step": 134992, "epoch": 1626} {"train_loss": -23.50050926208496, "global_step": 134993, "epoch": 1626} {"train_loss": -23.06317710876465, "global_step": 134994, "epoch": 1626} {"train_loss": -23.0728759765625, "global_step": 134995, "epoch": 1626} {"train_loss": -23.209747314453125, "global_step": 134996, "epoch": 1626} {"train_loss": -23.085424423217773, "global_step": 134997, "epoch": 1626} {"train_loss": -22.874963760375977, "global_step": 134998, "epoch": 1626} {"train_loss": -22.883712768554688, "global_step": 134999, "epoch": 1626} {"train_loss": -22.605623245239258, "global_step": 135000, "epoch": 1626} {"train_loss": -23.108552932739258, "global_step": 135001, "epoch": 1626} {"train_loss": -23.074569702148438, "global_step": 135002, "epoch": 1626} {"train_loss": -22.958444595336914, "global_step": 135003, "epoch": 1626} {"train_loss": -22.86688232421875, "global_step": 135004, "epoch": 1626} {"train_loss": -22.74834632873535, "global_step": 135005, "epoch": 1626} {"train_loss": -23.02118492126465, "global_step": 135006, "epoch": 1626} {"train_loss": -22.70488929748535, "global_step": 135007, "epoch": 1626} {"train_loss": -22.79355812072754, "global_step": 135008, "epoch": 1626} {"train_loss": -23.118967056274414, "global_step": 135009, "epoch": 1626} {"train_loss": -22.89116096496582, "global_step": 135010, "epoch": 1626} {"train_loss": -23.236865997314453, "global_step": 135011, "epoch": 1626} {"train_loss": -23.142688751220703, "global_step": 135012, "epoch": 1626} {"train_loss": -22.650917053222656, "global_step": 135013, "epoch": 1626} {"train_loss": -22.717761993408203, "global_step": 135014, "epoch": 1626} {"train_loss": -22.89461326599121, "global_step": 135015, "epoch": 1626} {"train_loss": -22.789722442626953, "global_step": 135016, "epoch": 1626} {"train_loss": -22.8359317779541, "global_step": 135017, "epoch": 1626} {"train_loss": -22.702796936035156, "global_step": 135018, "epoch": 1626} {"train_loss": -22.668928146362305, "global_step": 135019, "epoch": 1626} {"train_loss": -23.15481948852539, "global_step": 135020, "epoch": 1626} {"train_loss": -22.870624542236328, "global_step": 135021, "epoch": 1626} {"train_loss": -22.768735885620117, "global_step": 135022, "epoch": 1626} {"train_loss": -23.001022338867188, "global_step": 135023, "epoch": 1626} {"train_loss": -23.32233238220215, "global_step": 135024, "epoch": 1626} {"train_loss": -22.979015350341797, "global_step": 135025, "epoch": 1626} {"train_loss": -23.094097137451172, "global_step": 135026, "epoch": 1626} {"train_loss": -22.983383178710938, "global_step": 135027, "epoch": 1626} {"train_loss": -22.94427490234375, "global_step": 135028, "epoch": 1626} {"train_loss": -22.779727935791016, "global_step": 135029, "epoch": 1626} {"train_loss": -23.178016662597656, "global_step": 135030, "epoch": 1626} {"train_loss": -22.912946701049805, "global_step": 135031, "epoch": 1626} {"train_loss": -22.91229820251465, "global_step": 135032, "epoch": 1626} {"train_loss": -22.99849510192871, "global_step": 135033, "epoch": 1626} {"train_loss": -23.29775047302246, "global_step": 135034, "epoch": 1626} {"train_loss": -22.754758834838867, "global_step": 135035, "epoch": 1626} {"train_loss": -23.62125015258789, "global_step": 135036, "epoch": 1626} {"train_loss": -23.075193405151367, "global_step": 135037, "epoch": 1626} {"train_loss": -22.932415008544922, "global_step": 135038, "epoch": 1626} {"train_loss": -23.168445587158203, "global_step": 135039, "epoch": 1626} {"train_loss": -22.871091543910016, "global_step": 135040, "epoch": 1626, "val_loss": 6524617.0} {"train_loss": -20.90185546875, "global_step": 135041, "epoch": 1627} {"train_loss": -22.21142578125, "global_step": 135042, "epoch": 1627} {"train_loss": -21.596006393432617, "global_step": 135043, "epoch": 1627} {"train_loss": -21.400861740112305, "global_step": 135044, "epoch": 1627} {"train_loss": -21.34928321838379, "global_step": 135045, "epoch": 1627} {"train_loss": -22.166799545288086, "global_step": 135046, "epoch": 1627} {"train_loss": -22.098548889160156, "global_step": 135047, "epoch": 1627} {"train_loss": -22.009485244750977, "global_step": 135048, "epoch": 1627} {"train_loss": -22.164960861206055, "global_step": 135049, "epoch": 1627} {"train_loss": -22.21236228942871, "global_step": 135050, "epoch": 1627} {"train_loss": -21.90916633605957, "global_step": 135051, "epoch": 1627} {"train_loss": -22.15772819519043, "global_step": 135052, "epoch": 1627} {"train_loss": -22.10785484313965, "global_step": 135053, "epoch": 1627} {"train_loss": -21.937694549560547, "global_step": 135054, "epoch": 1627} {"train_loss": -22.385404586791992, "global_step": 135055, "epoch": 1627} {"train_loss": -22.00310707092285, "global_step": 135056, "epoch": 1627} {"train_loss": -22.12366485595703, "global_step": 135057, "epoch": 1627} {"train_loss": -22.63776206970215, "global_step": 135058, "epoch": 1627} {"train_loss": -22.231138229370117, "global_step": 135059, "epoch": 1627} {"train_loss": -22.393665313720703, "global_step": 135060, "epoch": 1627} {"train_loss": -22.461944580078125, "global_step": 135061, "epoch": 1627} {"train_loss": -22.541963577270508, "global_step": 135062, "epoch": 1627} {"train_loss": -22.739925384521484, "global_step": 135063, "epoch": 1627} {"train_loss": -22.42011260986328, "global_step": 135064, "epoch": 1627} {"train_loss": -22.50908088684082, "global_step": 135065, "epoch": 1627} {"train_loss": -23.007375717163086, "global_step": 135066, "epoch": 1627} {"train_loss": -22.556629180908203, "global_step": 135067, "epoch": 1627} {"train_loss": -22.621814727783203, "global_step": 135068, "epoch": 1627} {"train_loss": -22.721439361572266, "global_step": 135069, "epoch": 1627} {"train_loss": -22.982065200805664, "global_step": 135070, "epoch": 1627} {"train_loss": -22.673477172851562, "global_step": 135071, "epoch": 1627} {"train_loss": -22.962112426757812, "global_step": 135072, "epoch": 1627} {"train_loss": -22.51405906677246, "global_step": 135073, "epoch": 1627} {"train_loss": -23.232177734375, "global_step": 135074, "epoch": 1627} {"train_loss": -22.670148849487305, "global_step": 135075, "epoch": 1627} {"train_loss": -22.65640640258789, "global_step": 135076, "epoch": 1627} {"train_loss": -22.85782814025879, "global_step": 135077, "epoch": 1627} {"train_loss": -22.740217208862305, "global_step": 135078, "epoch": 1627} {"train_loss": -22.91524314880371, "global_step": 135079, "epoch": 1627} {"train_loss": -22.89716339111328, "global_step": 135080, "epoch": 1627} {"train_loss": -22.996198654174805, "global_step": 135081, "epoch": 1627} {"train_loss": -23.03260612487793, "global_step": 135082, "epoch": 1627} {"train_loss": -22.71418571472168, "global_step": 135083, "epoch": 1627} {"train_loss": -22.8088321685791, "global_step": 135084, "epoch": 1627} {"train_loss": -23.02954864501953, "global_step": 135085, "epoch": 1627} {"train_loss": -22.7644100189209, "global_step": 135086, "epoch": 1627} {"train_loss": -22.779600143432617, "global_step": 135087, "epoch": 1627} {"train_loss": -22.97348403930664, "global_step": 135088, "epoch": 1627} {"train_loss": -22.968366622924805, "global_step": 135089, "epoch": 1627} {"train_loss": -22.94378662109375, "global_step": 135090, "epoch": 1627} {"train_loss": -22.974363327026367, "global_step": 135091, "epoch": 1627} {"train_loss": -22.719560623168945, "global_step": 135092, "epoch": 1627} {"train_loss": -22.833364486694336, "global_step": 135093, "epoch": 1627} {"train_loss": -23.150806427001953, "global_step": 135094, "epoch": 1627} {"train_loss": -22.595874786376953, "global_step": 135095, "epoch": 1627} {"train_loss": -22.81854820251465, "global_step": 135096, "epoch": 1627} {"train_loss": -23.16096305847168, "global_step": 135097, "epoch": 1627} {"train_loss": -22.73719596862793, "global_step": 135098, "epoch": 1627} {"train_loss": -22.96352195739746, "global_step": 135099, "epoch": 1627} {"train_loss": -22.656057357788086, "global_step": 135100, "epoch": 1627} {"train_loss": -22.867536544799805, "global_step": 135101, "epoch": 1627} {"train_loss": -22.81268882751465, "global_step": 135102, "epoch": 1627} {"train_loss": -22.587230682373047, "global_step": 135103, "epoch": 1627} {"train_loss": -22.76572608947754, "global_step": 135104, "epoch": 1627} {"train_loss": -22.8452205657959, "global_step": 135105, "epoch": 1627} {"train_loss": -22.86993408203125, "global_step": 135106, "epoch": 1627} {"train_loss": -22.845361709594727, "global_step": 135107, "epoch": 1627} {"train_loss": -23.00494956970215, "global_step": 135108, "epoch": 1627} {"train_loss": -22.66868019104004, "global_step": 135109, "epoch": 1627} {"train_loss": -22.68265151977539, "global_step": 135110, "epoch": 1627} {"train_loss": -22.705429077148438, "global_step": 135111, "epoch": 1627} {"train_loss": -22.900985717773438, "global_step": 135112, "epoch": 1627} {"train_loss": -22.639320373535156, "global_step": 135113, "epoch": 1627} {"train_loss": -22.866743087768555, "global_step": 135114, "epoch": 1627} {"train_loss": -22.306119918823242, "global_step": 135115, "epoch": 1627} {"train_loss": -23.06136131286621, "global_step": 135116, "epoch": 1627} {"train_loss": -22.783573150634766, "global_step": 135117, "epoch": 1627} {"train_loss": -22.585102081298828, "global_step": 135118, "epoch": 1627} {"train_loss": -22.848621368408203, "global_step": 135119, "epoch": 1627} {"train_loss": -22.813629150390625, "global_step": 135120, "epoch": 1627} {"train_loss": -22.845474243164062, "global_step": 135121, "epoch": 1627} {"train_loss": -22.959226608276367, "global_step": 135122, "epoch": 1627} {"train_loss": -22.63614084634436, "global_step": 135123, "epoch": 1627, "val_loss": 6301077.0} {"train_loss": -22.883832931518555, "global_step": 135124, "epoch": 1628} {"train_loss": -22.520572662353516, "global_step": 135125, "epoch": 1628} {"train_loss": -22.61244773864746, "global_step": 135126, "epoch": 1628} {"train_loss": -22.423877716064453, "global_step": 135127, "epoch": 1628} {"train_loss": -22.58367919921875, "global_step": 135128, "epoch": 1628} {"train_loss": -22.912418365478516, "global_step": 135129, "epoch": 1628} {"train_loss": -22.714391708374023, "global_step": 135130, "epoch": 1628} {"train_loss": -22.588790893554688, "global_step": 135131, "epoch": 1628} {"train_loss": -22.578184127807617, "global_step": 135132, "epoch": 1628} {"train_loss": -22.81838035583496, "global_step": 135133, "epoch": 1628} {"train_loss": -22.557907104492188, "global_step": 135134, "epoch": 1628} {"train_loss": -22.524269104003906, "global_step": 135135, "epoch": 1628} {"train_loss": -22.728185653686523, "global_step": 135136, "epoch": 1628} {"train_loss": -22.78523063659668, "global_step": 135137, "epoch": 1628} {"train_loss": -22.28749656677246, "global_step": 135138, "epoch": 1628} {"train_loss": -22.681127548217773, "global_step": 135139, "epoch": 1628} {"train_loss": -22.637845993041992, "global_step": 135140, "epoch": 1628} {"train_loss": -22.78838539123535, "global_step": 135141, "epoch": 1628} {"train_loss": -23.25104331970215, "global_step": 135142, "epoch": 1628} {"train_loss": -22.97035789489746, "global_step": 135143, "epoch": 1628} {"train_loss": -22.86545753479004, "global_step": 135144, "epoch": 1628} {"train_loss": -23.045007705688477, "global_step": 135145, "epoch": 1628} {"train_loss": -23.00892448425293, "global_step": 135146, "epoch": 1628} {"train_loss": -22.89727210998535, "global_step": 135147, "epoch": 1628} {"train_loss": -22.875478744506836, "global_step": 135148, "epoch": 1628} {"train_loss": -23.035600662231445, "global_step": 135149, "epoch": 1628} {"train_loss": -22.88625144958496, "global_step": 135150, "epoch": 1628} {"train_loss": -22.9160213470459, "global_step": 135151, "epoch": 1628} {"train_loss": -22.6315975189209, "global_step": 135152, "epoch": 1628} {"train_loss": -23.097360610961914, "global_step": 135153, "epoch": 1628} {"train_loss": -22.785734176635742, "global_step": 135154, "epoch": 1628} {"train_loss": -22.624683380126953, "global_step": 135155, "epoch": 1628} {"train_loss": -22.47258949279785, "global_step": 135156, "epoch": 1628} {"train_loss": -23.131988525390625, "global_step": 135157, "epoch": 1628} {"train_loss": -22.69931411743164, "global_step": 135158, "epoch": 1628} {"train_loss": -23.16119384765625, "global_step": 135159, "epoch": 1628} {"train_loss": -23.009408950805664, "global_step": 135160, "epoch": 1628} {"train_loss": -23.083698272705078, "global_step": 135161, "epoch": 1628} {"train_loss": -22.873807907104492, "global_step": 135162, "epoch": 1628} {"train_loss": -23.343923568725586, "global_step": 135163, "epoch": 1628} {"train_loss": -23.10774803161621, "global_step": 135164, "epoch": 1628} {"train_loss": -23.163890838623047, "global_step": 135165, "epoch": 1628} {"train_loss": -23.052810668945312, "global_step": 135166, "epoch": 1628} {"train_loss": -22.730121612548828, "global_step": 135167, "epoch": 1628} {"train_loss": -23.104093551635742, "global_step": 135168, "epoch": 1628} {"train_loss": -23.078237533569336, "global_step": 135169, "epoch": 1628} {"train_loss": -22.8844051361084, "global_step": 135170, "epoch": 1628} {"train_loss": -22.99385643005371, "global_step": 135171, "epoch": 1628} {"train_loss": -23.325504302978516, "global_step": 135172, "epoch": 1628} {"train_loss": -23.231273651123047, "global_step": 135173, "epoch": 1628} {"train_loss": -23.01007080078125, "global_step": 135174, "epoch": 1628} {"train_loss": -22.8574275970459, "global_step": 135175, "epoch": 1628} {"train_loss": -22.568246841430664, "global_step": 135176, "epoch": 1628} {"train_loss": -22.953683853149414, "global_step": 135177, "epoch": 1628} {"train_loss": -22.99750518798828, "global_step": 135178, "epoch": 1628} {"train_loss": -23.260177612304688, "global_step": 135179, "epoch": 1628} {"train_loss": -22.725921630859375, "global_step": 135180, "epoch": 1628} {"train_loss": -22.74530601501465, "global_step": 135181, "epoch": 1628} {"train_loss": -22.882862091064453, "global_step": 135182, "epoch": 1628} {"train_loss": -23.481874465942383, "global_step": 135183, "epoch": 1628} {"train_loss": -22.824649810791016, "global_step": 135184, "epoch": 1628} {"train_loss": -22.747663497924805, "global_step": 135185, "epoch": 1628} {"train_loss": -22.914888381958008, "global_step": 135186, "epoch": 1628} {"train_loss": -22.989580154418945, "global_step": 135187, "epoch": 1628} {"train_loss": -22.87566566467285, "global_step": 135188, "epoch": 1628} {"train_loss": -23.267194747924805, "global_step": 135189, "epoch": 1628} {"train_loss": -22.723196029663086, "global_step": 135190, "epoch": 1628} {"train_loss": -23.153076171875, "global_step": 135191, "epoch": 1628} {"train_loss": -23.161733627319336, "global_step": 135192, "epoch": 1628} {"train_loss": -23.071523666381836, "global_step": 135193, "epoch": 1628} {"train_loss": -23.18929100036621, "global_step": 135194, "epoch": 1628} {"train_loss": -23.5824031829834, "global_step": 135195, "epoch": 1628} {"train_loss": -22.8365478515625, "global_step": 135196, "epoch": 1628} {"train_loss": -22.850942611694336, "global_step": 135197, "epoch": 1628} {"train_loss": -23.203763961791992, "global_step": 135198, "epoch": 1628} {"train_loss": -23.04267692565918, "global_step": 135199, "epoch": 1628} {"train_loss": -23.002870559692383, "global_step": 135200, "epoch": 1628} {"train_loss": -22.882429122924805, "global_step": 135201, "epoch": 1628} {"train_loss": -22.502538681030273, "global_step": 135202, "epoch": 1628} {"train_loss": -22.857717514038086, "global_step": 135203, "epoch": 1628} {"train_loss": -23.366168975830078, "global_step": 135204, "epoch": 1628} {"train_loss": -22.91716957092285, "global_step": 135205, "epoch": 1628} {"train_loss": -22.914985909519427, "global_step": 135206, "epoch": 1628, "val_loss": 6232625.0} {"train_loss": -22.75090980529785, "global_step": 135207, "epoch": 1629} {"train_loss": -22.753286361694336, "global_step": 135208, "epoch": 1629} {"train_loss": -22.586336135864258, "global_step": 135209, "epoch": 1629} {"train_loss": -22.716388702392578, "global_step": 135210, "epoch": 1629} {"train_loss": -22.634977340698242, "global_step": 135211, "epoch": 1629} {"train_loss": -22.56497573852539, "global_step": 135212, "epoch": 1629} {"train_loss": -23.010595321655273, "global_step": 135213, "epoch": 1629} {"train_loss": -22.806903839111328, "global_step": 135214, "epoch": 1629} {"train_loss": -22.51460838317871, "global_step": 135215, "epoch": 1629} {"train_loss": -22.84256362915039, "global_step": 135216, "epoch": 1629} {"train_loss": -22.737770080566406, "global_step": 135217, "epoch": 1629} {"train_loss": -22.991436004638672, "global_step": 135218, "epoch": 1629} {"train_loss": -22.5684871673584, "global_step": 135219, "epoch": 1629} {"train_loss": -22.874616622924805, "global_step": 135220, "epoch": 1629} {"train_loss": -22.889129638671875, "global_step": 135221, "epoch": 1629} {"train_loss": -22.88365936279297, "global_step": 135222, "epoch": 1629} {"train_loss": -22.71705436706543, "global_step": 135223, "epoch": 1629} {"train_loss": -22.525808334350586, "global_step": 135224, "epoch": 1629} {"train_loss": -22.939687728881836, "global_step": 135225, "epoch": 1629} {"train_loss": -23.254886627197266, "global_step": 135226, "epoch": 1629} {"train_loss": -22.745344161987305, "global_step": 135227, "epoch": 1629} {"train_loss": -22.784860610961914, "global_step": 135228, "epoch": 1629} {"train_loss": -23.07411766052246, "global_step": 135229, "epoch": 1629} {"train_loss": -22.66634178161621, "global_step": 135230, "epoch": 1629} {"train_loss": -23.213346481323242, "global_step": 135231, "epoch": 1629} {"train_loss": -23.200334548950195, "global_step": 135232, "epoch": 1629} {"train_loss": -22.853952407836914, "global_step": 135233, "epoch": 1629} {"train_loss": -23.04462432861328, "global_step": 135234, "epoch": 1629} {"train_loss": -23.127681732177734, "global_step": 135235, "epoch": 1629} {"train_loss": -22.718223571777344, "global_step": 135236, "epoch": 1629} {"train_loss": -22.67729377746582, "global_step": 135237, "epoch": 1629} {"train_loss": -22.880430221557617, "global_step": 135238, "epoch": 1629} {"train_loss": -23.268125534057617, "global_step": 135239, "epoch": 1629} {"train_loss": -22.57417869567871, "global_step": 135240, "epoch": 1629} {"train_loss": -22.430570602416992, "global_step": 135241, "epoch": 1629} {"train_loss": -22.941186904907227, "global_step": 135242, "epoch": 1629} {"train_loss": -22.90839958190918, "global_step": 135243, "epoch": 1629} {"train_loss": -22.504322052001953, "global_step": 135244, "epoch": 1629} {"train_loss": -23.136890411376953, "global_step": 135245, "epoch": 1629} {"train_loss": -23.233152389526367, "global_step": 135246, "epoch": 1629} {"train_loss": -22.407154083251953, "global_step": 135247, "epoch": 1629} {"train_loss": -22.72360610961914, "global_step": 135248, "epoch": 1629} {"train_loss": -22.753320693969727, "global_step": 135249, "epoch": 1629} {"train_loss": -22.797876358032227, "global_step": 135250, "epoch": 1629} {"train_loss": -22.75300407409668, "global_step": 135251, "epoch": 1629} {"train_loss": -22.844024658203125, "global_step": 135252, "epoch": 1629} {"train_loss": -22.495046615600586, "global_step": 135253, "epoch": 1629} {"train_loss": -23.009519577026367, "global_step": 135254, "epoch": 1629} {"train_loss": -22.878103256225586, "global_step": 135255, "epoch": 1629} {"train_loss": -22.723234176635742, "global_step": 135256, "epoch": 1629} {"train_loss": -22.80708122253418, "global_step": 135257, "epoch": 1629} {"train_loss": -22.61335563659668, "global_step": 135258, "epoch": 1629} {"train_loss": -22.811931610107422, "global_step": 135259, "epoch": 1629} {"train_loss": -22.8309268951416, "global_step": 135260, "epoch": 1629} {"train_loss": -23.024669647216797, "global_step": 135261, "epoch": 1629} {"train_loss": -23.11269187927246, "global_step": 135262, "epoch": 1629} {"train_loss": -22.798154830932617, "global_step": 135263, "epoch": 1629} {"train_loss": -23.124340057373047, "global_step": 135264, "epoch": 1629} {"train_loss": -22.867673873901367, "global_step": 135265, "epoch": 1629} {"train_loss": -22.856250762939453, "global_step": 135266, "epoch": 1629} {"train_loss": -22.901865005493164, "global_step": 135267, "epoch": 1629} {"train_loss": -23.145809173583984, "global_step": 135268, "epoch": 1629} {"train_loss": -22.90283203125, "global_step": 135269, "epoch": 1629} {"train_loss": -23.21074867248535, "global_step": 135270, "epoch": 1629} {"train_loss": -22.82680320739746, "global_step": 135271, "epoch": 1629} {"train_loss": -23.145750045776367, "global_step": 135272, "epoch": 1629} {"train_loss": -23.260446548461914, "global_step": 135273, "epoch": 1629} {"train_loss": -23.062959671020508, "global_step": 135274, "epoch": 1629} {"train_loss": -22.833913803100586, "global_step": 135275, "epoch": 1629} {"train_loss": -23.066116333007812, "global_step": 135276, "epoch": 1629} {"train_loss": -23.058256149291992, "global_step": 135277, "epoch": 1629} {"train_loss": -22.89750099182129, "global_step": 135278, "epoch": 1629} {"train_loss": -22.878799438476562, "global_step": 135279, "epoch": 1629} {"train_loss": -23.07474708557129, "global_step": 135280, "epoch": 1629} {"train_loss": -23.0159912109375, "global_step": 135281, "epoch": 1629} {"train_loss": -22.6769962310791, "global_step": 135282, "epoch": 1629} {"train_loss": -22.968759536743164, "global_step": 135283, "epoch": 1629} {"train_loss": -22.594165802001953, "global_step": 135284, "epoch": 1629} {"train_loss": -22.704456329345703, "global_step": 135285, "epoch": 1629} {"train_loss": -22.647356033325195, "global_step": 135286, "epoch": 1629} {"train_loss": -23.178680419921875, "global_step": 135287, "epoch": 1629} {"train_loss": -22.54939842224121, "global_step": 135288, "epoch": 1629} {"train_loss": -22.864765167236328, "global_step": 135289, "epoch": 1629, "val_loss": 6262717.5} {"train_loss": -22.43224334716797, "global_step": 135290, "epoch": 1630} {"train_loss": -22.616384506225586, "global_step": 135291, "epoch": 1630} {"train_loss": -22.152328491210938, "global_step": 135292, "epoch": 1630} {"train_loss": -22.851232528686523, "global_step": 135293, "epoch": 1630} {"train_loss": -22.468292236328125, "global_step": 135294, "epoch": 1630} {"train_loss": -22.262651443481445, "global_step": 135295, "epoch": 1630} {"train_loss": -22.979951858520508, "global_step": 135296, "epoch": 1630} {"train_loss": -22.33070945739746, "global_step": 135297, "epoch": 1630} {"train_loss": -22.202341079711914, "global_step": 135298, "epoch": 1630} {"train_loss": -23.10577964782715, "global_step": 135299, "epoch": 1630} {"train_loss": -22.216495513916016, "global_step": 135300, "epoch": 1630} {"train_loss": -22.707727432250977, "global_step": 135301, "epoch": 1630} {"train_loss": -22.89812469482422, "global_step": 135302, "epoch": 1630} {"train_loss": -22.78104591369629, "global_step": 135303, "epoch": 1630} {"train_loss": -22.64777183532715, "global_step": 135304, "epoch": 1630} {"train_loss": -22.836294174194336, "global_step": 135305, "epoch": 1630} {"train_loss": -22.722488403320312, "global_step": 135306, "epoch": 1630} {"train_loss": -23.006168365478516, "global_step": 135307, "epoch": 1630} {"train_loss": -22.661306381225586, "global_step": 135308, "epoch": 1630} {"train_loss": -22.79465675354004, "global_step": 135309, "epoch": 1630} {"train_loss": -22.919260025024414, "global_step": 135310, "epoch": 1630} {"train_loss": -22.657556533813477, "global_step": 135311, "epoch": 1630} {"train_loss": -23.161056518554688, "global_step": 135312, "epoch": 1630} {"train_loss": -23.067808151245117, "global_step": 135313, "epoch": 1630} {"train_loss": -22.85127830505371, "global_step": 135314, "epoch": 1630} {"train_loss": -23.150188446044922, "global_step": 135315, "epoch": 1630} {"train_loss": -22.44521141052246, "global_step": 135316, "epoch": 1630} {"train_loss": -23.282922744750977, "global_step": 135317, "epoch": 1630} {"train_loss": -22.92685317993164, "global_step": 135318, "epoch": 1630} {"train_loss": -23.023096084594727, "global_step": 135319, "epoch": 1630} {"train_loss": -23.132720947265625, "global_step": 135320, "epoch": 1630} {"train_loss": -22.905925750732422, "global_step": 135321, "epoch": 1630} {"train_loss": -23.143888473510742, "global_step": 135322, "epoch": 1630} {"train_loss": -23.014699935913086, "global_step": 135323, "epoch": 1630} {"train_loss": -23.132137298583984, "global_step": 135324, "epoch": 1630} {"train_loss": -23.00214385986328, "global_step": 135325, "epoch": 1630} {"train_loss": -23.270788192749023, "global_step": 135326, "epoch": 1630} {"train_loss": -23.082630157470703, "global_step": 135327, "epoch": 1630} {"train_loss": -23.16135025024414, "global_step": 135328, "epoch": 1630} {"train_loss": -23.39381217956543, "global_step": 135329, "epoch": 1630} {"train_loss": -23.00773048400879, "global_step": 135330, "epoch": 1630} {"train_loss": -22.967042922973633, "global_step": 135331, "epoch": 1630} {"train_loss": -22.94239616394043, "global_step": 135332, "epoch": 1630} {"train_loss": -22.484678268432617, "global_step": 135333, "epoch": 1630} {"train_loss": -22.80435562133789, "global_step": 135334, "epoch": 1630} {"train_loss": -23.014272689819336, "global_step": 135335, "epoch": 1630} {"train_loss": -23.297822952270508, "global_step": 135336, "epoch": 1630} {"train_loss": -22.441043853759766, "global_step": 135337, "epoch": 1630} {"train_loss": -23.249235153198242, "global_step": 135338, "epoch": 1630} {"train_loss": -23.01971435546875, "global_step": 135339, "epoch": 1630} {"train_loss": -22.962148666381836, "global_step": 135340, "epoch": 1630} {"train_loss": -23.01641082763672, "global_step": 135341, "epoch": 1630} {"train_loss": -22.954853057861328, "global_step": 135342, "epoch": 1630} {"train_loss": -22.96429443359375, "global_step": 135343, "epoch": 1630} {"train_loss": -23.099712371826172, "global_step": 135344, "epoch": 1630} {"train_loss": -22.8710880279541, "global_step": 135345, "epoch": 1630} {"train_loss": -23.01670265197754, "global_step": 135346, "epoch": 1630} {"train_loss": -22.890104293823242, "global_step": 135347, "epoch": 1630} {"train_loss": -23.014081954956055, "global_step": 135348, "epoch": 1630} {"train_loss": -22.961389541625977, "global_step": 135349, "epoch": 1630} {"train_loss": -22.68441390991211, "global_step": 135350, "epoch": 1630} {"train_loss": -22.97615623474121, "global_step": 135351, "epoch": 1630} {"train_loss": -22.92861557006836, "global_step": 135352, "epoch": 1630} {"train_loss": -23.136503219604492, "global_step": 135353, "epoch": 1630} {"train_loss": -23.22981834411621, "global_step": 135354, "epoch": 1630} {"train_loss": -22.974218368530273, "global_step": 135355, "epoch": 1630} {"train_loss": -23.064268112182617, "global_step": 135356, "epoch": 1630} {"train_loss": -23.135828018188477, "global_step": 135357, "epoch": 1630} {"train_loss": -23.061534881591797, "global_step": 135358, "epoch": 1630} {"train_loss": -22.58154296875, "global_step": 135359, "epoch": 1630} {"train_loss": -23.196605682373047, "global_step": 135360, "epoch": 1630} {"train_loss": -22.987579345703125, "global_step": 135361, "epoch": 1630} {"train_loss": -22.81100082397461, "global_step": 135362, "epoch": 1630} {"train_loss": -22.696212768554688, "global_step": 135363, "epoch": 1630} {"train_loss": -23.293657302856445, "global_step": 135364, "epoch": 1630} {"train_loss": -23.136398315429688, "global_step": 135365, "epoch": 1630} {"train_loss": -23.0678653717041, "global_step": 135366, "epoch": 1630} {"train_loss": -23.04739761352539, "global_step": 135367, "epoch": 1630} {"train_loss": -22.775602340698242, "global_step": 135368, "epoch": 1630} {"train_loss": -22.87141227722168, "global_step": 135369, "epoch": 1630} {"train_loss": -22.727718353271484, "global_step": 135370, "epoch": 1630} {"train_loss": -22.993188858032227, "global_step": 135371, "epoch": 1630} {"train_loss": -22.92348215953413, "global_step": 135372, "epoch": 1630, "val_loss": 6310392.0} {"train_loss": -22.278615951538086, "global_step": 135373, "epoch": 1631} {"train_loss": -22.083730697631836, "global_step": 135374, "epoch": 1631} {"train_loss": -22.18161392211914, "global_step": 135375, "epoch": 1631} {"train_loss": -22.18077850341797, "global_step": 135376, "epoch": 1631} {"train_loss": -22.822975158691406, "global_step": 135377, "epoch": 1631} {"train_loss": -22.58970069885254, "global_step": 135378, "epoch": 1631} {"train_loss": -22.429929733276367, "global_step": 135379, "epoch": 1631} {"train_loss": -22.91680335998535, "global_step": 135380, "epoch": 1631} {"train_loss": -22.525724411010742, "global_step": 135381, "epoch": 1631} {"train_loss": -22.465295791625977, "global_step": 135382, "epoch": 1631} {"train_loss": -22.712486267089844, "global_step": 135383, "epoch": 1631} {"train_loss": -22.5197811126709, "global_step": 135384, "epoch": 1631} {"train_loss": -22.918363571166992, "global_step": 135385, "epoch": 1631} {"train_loss": -22.480777740478516, "global_step": 135386, "epoch": 1631} {"train_loss": -22.597829818725586, "global_step": 135387, "epoch": 1631} {"train_loss": -22.895246505737305, "global_step": 135388, "epoch": 1631} {"train_loss": -22.80961036682129, "global_step": 135389, "epoch": 1631} {"train_loss": -22.297941207885742, "global_step": 135390, "epoch": 1631} {"train_loss": -22.821517944335938, "global_step": 135391, "epoch": 1631} {"train_loss": -22.662799835205078, "global_step": 135392, "epoch": 1631} {"train_loss": -22.5983829498291, "global_step": 135393, "epoch": 1631} {"train_loss": -22.949922561645508, "global_step": 135394, "epoch": 1631} {"train_loss": -22.783130645751953, "global_step": 135395, "epoch": 1631} {"train_loss": -23.01749038696289, "global_step": 135396, "epoch": 1631} {"train_loss": -22.622976303100586, "global_step": 135397, "epoch": 1631} {"train_loss": -22.88228416442871, "global_step": 135398, "epoch": 1631} {"train_loss": -22.865325927734375, "global_step": 135399, "epoch": 1631} {"train_loss": -22.60941505432129, "global_step": 135400, "epoch": 1631} {"train_loss": -22.783231735229492, "global_step": 135401, "epoch": 1631} {"train_loss": -23.124149322509766, "global_step": 135402, "epoch": 1631} {"train_loss": -22.779067993164062, "global_step": 135403, "epoch": 1631} {"train_loss": -22.432031631469727, "global_step": 135404, "epoch": 1631} {"train_loss": -22.99738121032715, "global_step": 135405, "epoch": 1631} {"train_loss": -22.92826271057129, "global_step": 135406, "epoch": 1631} {"train_loss": -22.547273635864258, "global_step": 135407, "epoch": 1631} {"train_loss": -22.698871612548828, "global_step": 135408, "epoch": 1631} {"train_loss": -22.912931442260742, "global_step": 135409, "epoch": 1631} {"train_loss": -22.893232345581055, "global_step": 135410, "epoch": 1631} {"train_loss": -22.813945770263672, "global_step": 135411, "epoch": 1631} {"train_loss": -22.531421661376953, "global_step": 135412, "epoch": 1631} {"train_loss": -22.73239517211914, "global_step": 135413, "epoch": 1631} {"train_loss": -22.552427291870117, "global_step": 135414, "epoch": 1631} {"train_loss": -22.634979248046875, "global_step": 135415, "epoch": 1631} {"train_loss": -23.031005859375, "global_step": 135416, "epoch": 1631} {"train_loss": -22.74393653869629, "global_step": 135417, "epoch": 1631} {"train_loss": -22.893918991088867, "global_step": 135418, "epoch": 1631} {"train_loss": -22.59701156616211, "global_step": 135419, "epoch": 1631} {"train_loss": -23.001117706298828, "global_step": 135420, "epoch": 1631} {"train_loss": -22.90288543701172, "global_step": 135421, "epoch": 1631} {"train_loss": -22.984830856323242, "global_step": 135422, "epoch": 1631} {"train_loss": -22.632122039794922, "global_step": 135423, "epoch": 1631} {"train_loss": -22.974607467651367, "global_step": 135424, "epoch": 1631} {"train_loss": -23.205923080444336, "global_step": 135425, "epoch": 1631} {"train_loss": -23.118772506713867, "global_step": 135426, "epoch": 1631} {"train_loss": -22.98252296447754, "global_step": 135427, "epoch": 1631} {"train_loss": -23.104856491088867, "global_step": 135428, "epoch": 1631} {"train_loss": -22.816734313964844, "global_step": 135429, "epoch": 1631} {"train_loss": -22.852079391479492, "global_step": 135430, "epoch": 1631} {"train_loss": -23.117643356323242, "global_step": 135431, "epoch": 1631} {"train_loss": -22.897235870361328, "global_step": 135432, "epoch": 1631} {"train_loss": -22.96134376525879, "global_step": 135433, "epoch": 1631} {"train_loss": -22.939573287963867, "global_step": 135434, "epoch": 1631} {"train_loss": -22.960172653198242, "global_step": 135435, "epoch": 1631} {"train_loss": -22.565692901611328, "global_step": 135436, "epoch": 1631} {"train_loss": -23.06947898864746, "global_step": 135437, "epoch": 1631} {"train_loss": -23.206541061401367, "global_step": 135438, "epoch": 1631} {"train_loss": -23.0285701751709, "global_step": 135439, "epoch": 1631} {"train_loss": -22.862337112426758, "global_step": 135440, "epoch": 1631} {"train_loss": -23.079742431640625, "global_step": 135441, "epoch": 1631} {"train_loss": -23.098058700561523, "global_step": 135442, "epoch": 1631} {"train_loss": -22.738309860229492, "global_step": 135443, "epoch": 1631} {"train_loss": -23.24066734313965, "global_step": 135444, "epoch": 1631} {"train_loss": -22.817935943603516, "global_step": 135445, "epoch": 1631} {"train_loss": -23.217451095581055, "global_step": 135446, "epoch": 1631} {"train_loss": -22.885345458984375, "global_step": 135447, "epoch": 1631} {"train_loss": -23.055395126342773, "global_step": 135448, "epoch": 1631} {"train_loss": -23.250471115112305, "global_step": 135449, "epoch": 1631} {"train_loss": -22.923585891723633, "global_step": 135450, "epoch": 1631} {"train_loss": -22.640350341796875, "global_step": 135451, "epoch": 1631} {"train_loss": -22.92427635192871, "global_step": 135452, "epoch": 1631} {"train_loss": -22.9373722076416, "global_step": 135453, "epoch": 1631} {"train_loss": -23.128469467163086, "global_step": 135454, "epoch": 1631} {"train_loss": -22.812129560723363, "global_step": 135455, "epoch": 1631, "val_loss": 6311879.0} {"train_loss": -22.165014266967773, "global_step": 135456, "epoch": 1632} {"train_loss": -22.039840698242188, "global_step": 135457, "epoch": 1632} {"train_loss": -22.361581802368164, "global_step": 135458, "epoch": 1632} {"train_loss": -22.688007354736328, "global_step": 135459, "epoch": 1632} {"train_loss": -22.541330337524414, "global_step": 135460, "epoch": 1632} {"train_loss": -23.137495040893555, "global_step": 135461, "epoch": 1632} {"train_loss": -22.415958404541016, "global_step": 135462, "epoch": 1632} {"train_loss": -22.43971824645996, "global_step": 135463, "epoch": 1632} {"train_loss": -22.450407028198242, "global_step": 135464, "epoch": 1632} {"train_loss": -22.73373031616211, "global_step": 135465, "epoch": 1632} {"train_loss": -22.53421401977539, "global_step": 135466, "epoch": 1632} {"train_loss": -22.560108184814453, "global_step": 135467, "epoch": 1632} {"train_loss": -22.64347267150879, "global_step": 135468, "epoch": 1632} {"train_loss": -22.474184036254883, "global_step": 135469, "epoch": 1632} {"train_loss": -22.460731506347656, "global_step": 135470, "epoch": 1632} {"train_loss": -22.381383895874023, "global_step": 135471, "epoch": 1632} {"train_loss": -22.713565826416016, "global_step": 135472, "epoch": 1632} {"train_loss": -22.413293838500977, "global_step": 135473, "epoch": 1632} {"train_loss": -22.61890411376953, "global_step": 135474, "epoch": 1632} {"train_loss": -22.703397750854492, "global_step": 135475, "epoch": 1632} {"train_loss": -22.390365600585938, "global_step": 135476, "epoch": 1632} {"train_loss": -23.110374450683594, "global_step": 135477, "epoch": 1632} {"train_loss": -22.849990844726562, "global_step": 135478, "epoch": 1632} {"train_loss": -23.09157943725586, "global_step": 135479, "epoch": 1632} {"train_loss": -22.881839752197266, "global_step": 135480, "epoch": 1632} {"train_loss": -22.8990478515625, "global_step": 135481, "epoch": 1632} {"train_loss": -22.8188419342041, "global_step": 135482, "epoch": 1632} {"train_loss": -22.74353790283203, "global_step": 135483, "epoch": 1632} {"train_loss": -22.8607177734375, "global_step": 135484, "epoch": 1632} {"train_loss": -22.63873863220215, "global_step": 135485, "epoch": 1632} {"train_loss": -23.101993560791016, "global_step": 135486, "epoch": 1632} {"train_loss": -23.085678100585938, "global_step": 135487, "epoch": 1632} {"train_loss": -23.115921020507812, "global_step": 135488, "epoch": 1632} {"train_loss": -23.22394371032715, "global_step": 135489, "epoch": 1632} {"train_loss": -22.856416702270508, "global_step": 135490, "epoch": 1632} {"train_loss": -23.1232852935791, "global_step": 135491, "epoch": 1632} {"train_loss": -23.05073356628418, "global_step": 135492, "epoch": 1632} {"train_loss": -23.075918197631836, "global_step": 135493, "epoch": 1632} {"train_loss": -22.87702178955078, "global_step": 135494, "epoch": 1632} {"train_loss": -22.989416122436523, "global_step": 135495, "epoch": 1632} {"train_loss": -22.837209701538086, "global_step": 135496, "epoch": 1632} {"train_loss": -23.375089645385742, "global_step": 135497, "epoch": 1632} {"train_loss": -23.03641700744629, "global_step": 135498, "epoch": 1632} {"train_loss": -23.227571487426758, "global_step": 135499, "epoch": 1632} {"train_loss": -22.66543960571289, "global_step": 135500, "epoch": 1632} {"train_loss": -23.3607177734375, "global_step": 135501, "epoch": 1632} {"train_loss": -23.040807723999023, "global_step": 135502, "epoch": 1632} {"train_loss": -22.65496826171875, "global_step": 135503, "epoch": 1632} {"train_loss": -22.787755966186523, "global_step": 135504, "epoch": 1632} {"train_loss": -22.822708129882812, "global_step": 135505, "epoch": 1632} {"train_loss": -22.747655868530273, "global_step": 135506, "epoch": 1632} {"train_loss": -23.13404655456543, "global_step": 135507, "epoch": 1632} {"train_loss": -23.227359771728516, "global_step": 135508, "epoch": 1632} {"train_loss": -22.784067153930664, "global_step": 135509, "epoch": 1632} {"train_loss": -22.57310676574707, "global_step": 135510, "epoch": 1632} {"train_loss": -22.31277847290039, "global_step": 135511, "epoch": 1632} {"train_loss": -22.931720733642578, "global_step": 135512, "epoch": 1632} {"train_loss": -22.841562271118164, "global_step": 135513, "epoch": 1632} {"train_loss": -22.358661651611328, "global_step": 135514, "epoch": 1632} {"train_loss": -22.478418350219727, "global_step": 135515, "epoch": 1632} {"train_loss": -22.745878219604492, "global_step": 135516, "epoch": 1632} {"train_loss": -23.07708740234375, "global_step": 135517, "epoch": 1632} {"train_loss": -22.67047691345215, "global_step": 135518, "epoch": 1632} {"train_loss": -23.051591873168945, "global_step": 135519, "epoch": 1632} {"train_loss": -22.751890182495117, "global_step": 135520, "epoch": 1632} {"train_loss": -22.80843162536621, "global_step": 135521, "epoch": 1632} {"train_loss": -22.826034545898438, "global_step": 135522, "epoch": 1632} {"train_loss": -22.838762283325195, "global_step": 135523, "epoch": 1632} {"train_loss": -22.988264083862305, "global_step": 135524, "epoch": 1632} {"train_loss": -23.223907470703125, "global_step": 135525, "epoch": 1632} {"train_loss": -23.0493106842041, "global_step": 135526, "epoch": 1632} {"train_loss": -23.263654708862305, "global_step": 135527, "epoch": 1632} {"train_loss": -22.443012237548828, "global_step": 135528, "epoch": 1632} {"train_loss": -23.098526000976562, "global_step": 135529, "epoch": 1632} {"train_loss": -22.970422744750977, "global_step": 135530, "epoch": 1632} {"train_loss": -22.643569946289062, "global_step": 135531, "epoch": 1632} {"train_loss": -22.985750198364258, "global_step": 135532, "epoch": 1632} {"train_loss": -23.24190330505371, "global_step": 135533, "epoch": 1632} {"train_loss": -22.964868545532227, "global_step": 135534, "epoch": 1632} {"train_loss": -22.860946655273438, "global_step": 135535, "epoch": 1632} {"train_loss": -23.07434844970703, "global_step": 135536, "epoch": 1632} {"train_loss": -22.943967819213867, "global_step": 135537, "epoch": 1632} {"train_loss": -22.82381046249206, "global_step": 135538, "epoch": 1632, "val_loss": 6299522.0} {"train_loss": -22.25752067565918, "global_step": 135539, "epoch": 1633} {"train_loss": -22.601877212524414, "global_step": 135540, "epoch": 1633} {"train_loss": -22.19208335876465, "global_step": 135541, "epoch": 1633} {"train_loss": -22.1488037109375, "global_step": 135542, "epoch": 1633} {"train_loss": -22.780038833618164, "global_step": 135543, "epoch": 1633} {"train_loss": -22.448652267456055, "global_step": 135544, "epoch": 1633} {"train_loss": -22.76917839050293, "global_step": 135545, "epoch": 1633} {"train_loss": -22.673118591308594, "global_step": 135546, "epoch": 1633} {"train_loss": -22.87839698791504, "global_step": 135547, "epoch": 1633} {"train_loss": -22.60853385925293, "global_step": 135548, "epoch": 1633} {"train_loss": -22.953088760375977, "global_step": 135549, "epoch": 1633} {"train_loss": -22.811433792114258, "global_step": 135550, "epoch": 1633} {"train_loss": -22.505956649780273, "global_step": 135551, "epoch": 1633} {"train_loss": -22.617517471313477, "global_step": 135552, "epoch": 1633} {"train_loss": -22.9956111907959, "global_step": 135553, "epoch": 1633} {"train_loss": -22.8341007232666, "global_step": 135554, "epoch": 1633} {"train_loss": -23.07185173034668, "global_step": 135555, "epoch": 1633} {"train_loss": -22.90964698791504, "global_step": 135556, "epoch": 1633} {"train_loss": -22.812532424926758, "global_step": 135557, "epoch": 1633} {"train_loss": -23.11060905456543, "global_step": 135558, "epoch": 1633} {"train_loss": -23.042123794555664, "global_step": 135559, "epoch": 1633} {"train_loss": -22.55959129333496, "global_step": 135560, "epoch": 1633} {"train_loss": -22.940513610839844, "global_step": 135561, "epoch": 1633} {"train_loss": -22.746475219726562, "global_step": 135562, "epoch": 1633} {"train_loss": -22.97500228881836, "global_step": 135563, "epoch": 1633} {"train_loss": -22.842130661010742, "global_step": 135564, "epoch": 1633} {"train_loss": -23.142126083374023, "global_step": 135565, "epoch": 1633} {"train_loss": -22.697994232177734, "global_step": 135566, "epoch": 1633} {"train_loss": -22.8928165435791, "global_step": 135567, "epoch": 1633} {"train_loss": -22.984949111938477, "global_step": 135568, "epoch": 1633} {"train_loss": -22.927978515625, "global_step": 135569, "epoch": 1633} {"train_loss": -22.97232437133789, "global_step": 135570, "epoch": 1633} {"train_loss": -23.150434494018555, "global_step": 135571, "epoch": 1633} {"train_loss": -23.178335189819336, "global_step": 135572, "epoch": 1633} {"train_loss": -22.718135833740234, "global_step": 135573, "epoch": 1633} {"train_loss": -22.963241577148438, "global_step": 135574, "epoch": 1633} {"train_loss": -23.228254318237305, "global_step": 135575, "epoch": 1633} {"train_loss": -22.645532608032227, "global_step": 135576, "epoch": 1633} {"train_loss": -23.2921085357666, "global_step": 135577, "epoch": 1633} {"train_loss": -22.950651168823242, "global_step": 135578, "epoch": 1633} {"train_loss": -22.726964950561523, "global_step": 135579, "epoch": 1633} {"train_loss": -23.05422019958496, "global_step": 135580, "epoch": 1633} {"train_loss": -23.01175308227539, "global_step": 135581, "epoch": 1633} {"train_loss": -23.000600814819336, "global_step": 135582, "epoch": 1633} {"train_loss": -22.445898056030273, "global_step": 135583, "epoch": 1633} {"train_loss": -22.981626510620117, "global_step": 135584, "epoch": 1633} {"train_loss": -23.03989601135254, "global_step": 135585, "epoch": 1633} {"train_loss": -22.688852310180664, "global_step": 135586, "epoch": 1633} {"train_loss": -23.04420280456543, "global_step": 135587, "epoch": 1633} {"train_loss": -22.917545318603516, "global_step": 135588, "epoch": 1633} {"train_loss": -23.036819458007812, "global_step": 135589, "epoch": 1633} {"train_loss": -22.69536590576172, "global_step": 135590, "epoch": 1633} {"train_loss": -22.967100143432617, "global_step": 135591, "epoch": 1633} {"train_loss": -22.982892990112305, "global_step": 135592, "epoch": 1633} {"train_loss": -22.820484161376953, "global_step": 135593, "epoch": 1633} {"train_loss": -22.992582321166992, "global_step": 135594, "epoch": 1633} {"train_loss": -23.10835838317871, "global_step": 135595, "epoch": 1633} {"train_loss": -22.941370010375977, "global_step": 135596, "epoch": 1633} {"train_loss": -23.088266372680664, "global_step": 135597, "epoch": 1633} {"train_loss": -23.289949417114258, "global_step": 135598, "epoch": 1633} {"train_loss": -22.964040756225586, "global_step": 135599, "epoch": 1633} {"train_loss": -22.640295028686523, "global_step": 135600, "epoch": 1633} {"train_loss": -22.672887802124023, "global_step": 135601, "epoch": 1633} {"train_loss": -22.7562313079834, "global_step": 135602, "epoch": 1633} {"train_loss": -22.601200103759766, "global_step": 135603, "epoch": 1633} {"train_loss": -22.753568649291992, "global_step": 135604, "epoch": 1633} {"train_loss": -22.674610137939453, "global_step": 135605, "epoch": 1633} {"train_loss": -22.943450927734375, "global_step": 135606, "epoch": 1633} {"train_loss": -23.006576538085938, "global_step": 135607, "epoch": 1633} {"train_loss": -23.013856887817383, "global_step": 135608, "epoch": 1633} {"train_loss": -22.80868911743164, "global_step": 135609, "epoch": 1633} {"train_loss": -23.238950729370117, "global_step": 135610, "epoch": 1633} {"train_loss": -23.258878707885742, "global_step": 135611, "epoch": 1633} {"train_loss": -22.678720474243164, "global_step": 135612, "epoch": 1633} {"train_loss": -23.091650009155273, "global_step": 135613, "epoch": 1633} {"train_loss": -22.884389877319336, "global_step": 135614, "epoch": 1633} {"train_loss": -23.50003433227539, "global_step": 135615, "epoch": 1633} {"train_loss": -22.666555404663086, "global_step": 135616, "epoch": 1633} {"train_loss": -23.064802169799805, "global_step": 135617, "epoch": 1633} {"train_loss": -23.005542755126953, "global_step": 135618, "epoch": 1633} {"train_loss": -23.133798599243164, "global_step": 135619, "epoch": 1633} {"train_loss": -22.697046279907227, "global_step": 135620, "epoch": 1633} {"train_loss": -22.886334086038982, "global_step": 135621, "epoch": 1633, "val_loss": 6310269.5} {"train_loss": -22.226316452026367, "global_step": 135622, "epoch": 1634} {"train_loss": -22.35064697265625, "global_step": 135623, "epoch": 1634} {"train_loss": -22.54192352294922, "global_step": 135624, "epoch": 1634} {"train_loss": -22.56312370300293, "global_step": 135625, "epoch": 1634} {"train_loss": -22.590757369995117, "global_step": 135626, "epoch": 1634} {"train_loss": -22.43869972229004, "global_step": 135627, "epoch": 1634} {"train_loss": -22.77174186706543, "global_step": 135628, "epoch": 1634} {"train_loss": -22.552326202392578, "global_step": 135629, "epoch": 1634} {"train_loss": -22.8673038482666, "global_step": 135630, "epoch": 1634} {"train_loss": -22.77176856994629, "global_step": 135631, "epoch": 1634} {"train_loss": -22.48958969116211, "global_step": 135632, "epoch": 1634} {"train_loss": -22.705547332763672, "global_step": 135633, "epoch": 1634} {"train_loss": -22.682615280151367, "global_step": 135634, "epoch": 1634} {"train_loss": -22.803171157836914, "global_step": 135635, "epoch": 1634} {"train_loss": -22.998022079467773, "global_step": 135636, "epoch": 1634} {"train_loss": -22.960430145263672, "global_step": 135637, "epoch": 1634} {"train_loss": -23.045446395874023, "global_step": 135638, "epoch": 1634} {"train_loss": -22.688196182250977, "global_step": 135639, "epoch": 1634} {"train_loss": -22.711078643798828, "global_step": 135640, "epoch": 1634} {"train_loss": -22.576631546020508, "global_step": 135641, "epoch": 1634} {"train_loss": -22.96272850036621, "global_step": 135642, "epoch": 1634} {"train_loss": -22.71736717224121, "global_step": 135643, "epoch": 1634} {"train_loss": -22.28244972229004, "global_step": 135644, "epoch": 1634} {"train_loss": -22.80000877380371, "global_step": 135645, "epoch": 1634} {"train_loss": -22.707761764526367, "global_step": 135646, "epoch": 1634} {"train_loss": -22.916051864624023, "global_step": 135647, "epoch": 1634} {"train_loss": -22.43177032470703, "global_step": 135648, "epoch": 1634} {"train_loss": -23.18390464782715, "global_step": 135649, "epoch": 1634} {"train_loss": -22.902667999267578, "global_step": 135650, "epoch": 1634} {"train_loss": -22.687768936157227, "global_step": 135651, "epoch": 1634} {"train_loss": -22.830228805541992, "global_step": 135652, "epoch": 1634} {"train_loss": -22.92523193359375, "global_step": 135653, "epoch": 1634} {"train_loss": -22.913846969604492, "global_step": 135654, "epoch": 1634} {"train_loss": -23.17348289489746, "global_step": 135655, "epoch": 1634} {"train_loss": -22.991743087768555, "global_step": 135656, "epoch": 1634} {"train_loss": -22.72528076171875, "global_step": 135657, "epoch": 1634} {"train_loss": -22.548322677612305, "global_step": 135658, "epoch": 1634} {"train_loss": -22.78147315979004, "global_step": 135659, "epoch": 1634} {"train_loss": -22.825138092041016, "global_step": 135660, "epoch": 1634} {"train_loss": -22.896902084350586, "global_step": 135661, "epoch": 1634} {"train_loss": -22.91994285583496, "global_step": 135662, "epoch": 1634} {"train_loss": -22.859128952026367, "global_step": 135663, "epoch": 1634} {"train_loss": -22.625991821289062, "global_step": 135664, "epoch": 1634} {"train_loss": -22.901561737060547, "global_step": 135665, "epoch": 1634} {"train_loss": -22.696094512939453, "global_step": 135666, "epoch": 1634} {"train_loss": -23.031774520874023, "global_step": 135667, "epoch": 1634} {"train_loss": -22.926048278808594, "global_step": 135668, "epoch": 1634} {"train_loss": -22.617359161376953, "global_step": 135669, "epoch": 1634} {"train_loss": -23.30519676208496, "global_step": 135670, "epoch": 1634} {"train_loss": -22.843469619750977, "global_step": 135671, "epoch": 1634} {"train_loss": -22.584760665893555, "global_step": 135672, "epoch": 1634} {"train_loss": -23.125295639038086, "global_step": 135673, "epoch": 1634} {"train_loss": -23.040977478027344, "global_step": 135674, "epoch": 1634} {"train_loss": -22.742238998413086, "global_step": 135675, "epoch": 1634} {"train_loss": -22.6783447265625, "global_step": 135676, "epoch": 1634} {"train_loss": -22.927030563354492, "global_step": 135677, "epoch": 1634} {"train_loss": -23.03394889831543, "global_step": 135678, "epoch": 1634} {"train_loss": -22.92713737487793, "global_step": 135679, "epoch": 1634} {"train_loss": -22.871158599853516, "global_step": 135680, "epoch": 1634} {"train_loss": -22.96407699584961, "global_step": 135681, "epoch": 1634} {"train_loss": -22.832433700561523, "global_step": 135682, "epoch": 1634} {"train_loss": -23.185983657836914, "global_step": 135683, "epoch": 1634} {"train_loss": -22.977426528930664, "global_step": 135684, "epoch": 1634} {"train_loss": -23.166955947875977, "global_step": 135685, "epoch": 1634} {"train_loss": -23.360403060913086, "global_step": 135686, "epoch": 1634} {"train_loss": -23.113082885742188, "global_step": 135687, "epoch": 1634} {"train_loss": -22.92321014404297, "global_step": 135688, "epoch": 1634} {"train_loss": -23.0174617767334, "global_step": 135689, "epoch": 1634} {"train_loss": -23.246999740600586, "global_step": 135690, "epoch": 1634} {"train_loss": -23.361328125, "global_step": 135691, "epoch": 1634} {"train_loss": -23.35973358154297, "global_step": 135692, "epoch": 1634} {"train_loss": -23.241987228393555, "global_step": 135693, "epoch": 1634} {"train_loss": -23.046857833862305, "global_step": 135694, "epoch": 1634} {"train_loss": -23.016359329223633, "global_step": 135695, "epoch": 1634} {"train_loss": -23.00900650024414, "global_step": 135696, "epoch": 1634} {"train_loss": -23.06827163696289, "global_step": 135697, "epoch": 1634} {"train_loss": -22.81989097595215, "global_step": 135698, "epoch": 1634} {"train_loss": -22.79600715637207, "global_step": 135699, "epoch": 1634} {"train_loss": -23.147838592529297, "global_step": 135700, "epoch": 1634} {"train_loss": -23.06434440612793, "global_step": 135701, "epoch": 1634} {"train_loss": -23.04880142211914, "global_step": 135702, "epoch": 1634} {"train_loss": -22.99481773376465, "global_step": 135703, "epoch": 1634} {"train_loss": -22.88016719128712, "global_step": 135704, "epoch": 1634, "val_loss": 6303175.0} {"train_loss": -22.15781593322754, "global_step": 135705, "epoch": 1635} {"train_loss": -22.349645614624023, "global_step": 135706, "epoch": 1635} {"train_loss": -21.705495834350586, "global_step": 135707, "epoch": 1635} {"train_loss": -22.260250091552734, "global_step": 135708, "epoch": 1635} {"train_loss": -22.88775062561035, "global_step": 135709, "epoch": 1635} {"train_loss": -22.679386138916016, "global_step": 135710, "epoch": 1635} {"train_loss": -22.841419219970703, "global_step": 135711, "epoch": 1635} {"train_loss": -22.76532554626465, "global_step": 135712, "epoch": 1635} {"train_loss": -22.552507400512695, "global_step": 135713, "epoch": 1635} {"train_loss": -22.492307662963867, "global_step": 135714, "epoch": 1635} {"train_loss": -22.612394332885742, "global_step": 135715, "epoch": 1635} {"train_loss": -22.62092399597168, "global_step": 135716, "epoch": 1635} {"train_loss": -22.604963302612305, "global_step": 135717, "epoch": 1635} {"train_loss": -22.902835845947266, "global_step": 135718, "epoch": 1635} {"train_loss": -22.417984008789062, "global_step": 135719, "epoch": 1635} {"train_loss": -22.571704864501953, "global_step": 135720, "epoch": 1635} {"train_loss": -22.676626205444336, "global_step": 135721, "epoch": 1635} {"train_loss": -22.681303024291992, "global_step": 135722, "epoch": 1635} {"train_loss": -22.66910743713379, "global_step": 135723, "epoch": 1635} {"train_loss": -22.865697860717773, "global_step": 135724, "epoch": 1635} {"train_loss": -22.763975143432617, "global_step": 135725, "epoch": 1635} {"train_loss": -22.733251571655273, "global_step": 135726, "epoch": 1635} {"train_loss": -22.74295997619629, "global_step": 135727, "epoch": 1635} {"train_loss": -23.02876091003418, "global_step": 135728, "epoch": 1635} {"train_loss": -22.661680221557617, "global_step": 135729, "epoch": 1635} {"train_loss": -22.25324249267578, "global_step": 135730, "epoch": 1635} {"train_loss": -22.44843101501465, "global_step": 135731, "epoch": 1635} {"train_loss": -22.668832778930664, "global_step": 135732, "epoch": 1635} {"train_loss": -22.620847702026367, "global_step": 135733, "epoch": 1635} {"train_loss": -22.674631118774414, "global_step": 135734, "epoch": 1635} {"train_loss": -22.876922607421875, "global_step": 135735, "epoch": 1635} {"train_loss": -22.66865348815918, "global_step": 135736, "epoch": 1635} {"train_loss": -23.198974609375, "global_step": 135737, "epoch": 1635} {"train_loss": -22.812185287475586, "global_step": 135738, "epoch": 1635} {"train_loss": -22.752788543701172, "global_step": 135739, "epoch": 1635} {"train_loss": -22.8350772857666, "global_step": 135740, "epoch": 1635} {"train_loss": -22.735300064086914, "global_step": 135741, "epoch": 1635} {"train_loss": -22.660011291503906, "global_step": 135742, "epoch": 1635} {"train_loss": -22.92991065979004, "global_step": 135743, "epoch": 1635} {"train_loss": -23.081100463867188, "global_step": 135744, "epoch": 1635} {"train_loss": -22.59072494506836, "global_step": 135745, "epoch": 1635} {"train_loss": -23.153940200805664, "global_step": 135746, "epoch": 1635} {"train_loss": -23.020217895507812, "global_step": 135747, "epoch": 1635} {"train_loss": -23.019214630126953, "global_step": 135748, "epoch": 1635} {"train_loss": -22.971755981445312, "global_step": 135749, "epoch": 1635} {"train_loss": -24.035303115844727, "global_step": 135750, "epoch": 1635} {"train_loss": -22.998249053955078, "global_step": 135751, "epoch": 1635} {"train_loss": -22.948326110839844, "global_step": 135752, "epoch": 1635} {"train_loss": -22.435806274414062, "global_step": 135753, "epoch": 1635} {"train_loss": -23.05482292175293, "global_step": 135754, "epoch": 1635} {"train_loss": -23.10398292541504, "global_step": 135755, "epoch": 1635} {"train_loss": -22.69300079345703, "global_step": 135756, "epoch": 1635} {"train_loss": -22.780975341796875, "global_step": 135757, "epoch": 1635} {"train_loss": -23.00664520263672, "global_step": 135758, "epoch": 1635} {"train_loss": -23.219165802001953, "global_step": 135759, "epoch": 1635} {"train_loss": -22.818891525268555, "global_step": 135760, "epoch": 1635} {"train_loss": -23.098590850830078, "global_step": 135761, "epoch": 1635} {"train_loss": -23.287031173706055, "global_step": 135762, "epoch": 1635} {"train_loss": -22.563711166381836, "global_step": 135763, "epoch": 1635} {"train_loss": -22.68470573425293, "global_step": 135764, "epoch": 1635} {"train_loss": -22.91192054748535, "global_step": 135765, "epoch": 1635} {"train_loss": -23.24833106994629, "global_step": 135766, "epoch": 1635} {"train_loss": -22.998687744140625, "global_step": 135767, "epoch": 1635} {"train_loss": -23.007591247558594, "global_step": 135768, "epoch": 1635} {"train_loss": -23.260334014892578, "global_step": 135769, "epoch": 1635} {"train_loss": -22.9949893951416, "global_step": 135770, "epoch": 1635} {"train_loss": -23.064687728881836, "global_step": 135771, "epoch": 1635} {"train_loss": -23.035430908203125, "global_step": 135772, "epoch": 1635} {"train_loss": -23.151870727539062, "global_step": 135773, "epoch": 1635} {"train_loss": -22.8194637298584, "global_step": 135774, "epoch": 1635} {"train_loss": -23.090551376342773, "global_step": 135775, "epoch": 1635} {"train_loss": -22.823627471923828, "global_step": 135776, "epoch": 1635} {"train_loss": -23.256303787231445, "global_step": 135777, "epoch": 1635} {"train_loss": -23.31622886657715, "global_step": 135778, "epoch": 1635} {"train_loss": -23.203458786010742, "global_step": 135779, "epoch": 1635} {"train_loss": -23.19353675842285, "global_step": 135780, "epoch": 1635} {"train_loss": -22.68556022644043, "global_step": 135781, "epoch": 1635} {"train_loss": -23.054670333862305, "global_step": 135782, "epoch": 1635} {"train_loss": -23.094343185424805, "global_step": 135783, "epoch": 1635} {"train_loss": -23.023189544677734, "global_step": 135784, "epoch": 1635} {"train_loss": -22.942829132080078, "global_step": 135785, "epoch": 1635} {"train_loss": -23.423139572143555, "global_step": 135786, "epoch": 1635} {"train_loss": -22.84267607079931, "global_step": 135787, "epoch": 1635, "val_loss": 6377502.0} {"train_loss": -21.9152889251709, "global_step": 135788, "epoch": 1636} {"train_loss": -21.250144958496094, "global_step": 135789, "epoch": 1636} {"train_loss": -21.965803146362305, "global_step": 135790, "epoch": 1636} {"train_loss": -21.90601348876953, "global_step": 135791, "epoch": 1636} {"train_loss": -21.738874435424805, "global_step": 135792, "epoch": 1636} {"train_loss": -22.218812942504883, "global_step": 135793, "epoch": 1636} {"train_loss": -22.168569564819336, "global_step": 135794, "epoch": 1636} {"train_loss": -22.65829849243164, "global_step": 135795, "epoch": 1636} {"train_loss": -22.221969604492188, "global_step": 135796, "epoch": 1636} {"train_loss": -22.668485641479492, "global_step": 135797, "epoch": 1636} {"train_loss": -22.333742141723633, "global_step": 135798, "epoch": 1636} {"train_loss": -22.148883819580078, "global_step": 135799, "epoch": 1636} {"train_loss": -22.818716049194336, "global_step": 135800, "epoch": 1636} {"train_loss": -22.39869499206543, "global_step": 135801, "epoch": 1636} {"train_loss": -22.606964111328125, "global_step": 135802, "epoch": 1636} {"train_loss": -22.75559425354004, "global_step": 135803, "epoch": 1636} {"train_loss": -22.922880172729492, "global_step": 135804, "epoch": 1636} {"train_loss": -22.744062423706055, "global_step": 135805, "epoch": 1636} {"train_loss": -22.46799659729004, "global_step": 135806, "epoch": 1636} {"train_loss": -22.5, "global_step": 135807, "epoch": 1636} {"train_loss": -22.831090927124023, "global_step": 135808, "epoch": 1636} {"train_loss": -22.733469009399414, "global_step": 135809, "epoch": 1636} {"train_loss": -22.82366371154785, "global_step": 135810, "epoch": 1636} {"train_loss": -22.90498161315918, "global_step": 135811, "epoch": 1636} {"train_loss": -23.184967041015625, "global_step": 135812, "epoch": 1636} {"train_loss": -23.021133422851562, "global_step": 135813, "epoch": 1636} {"train_loss": -22.653684616088867, "global_step": 135814, "epoch": 1636} {"train_loss": -22.74637222290039, "global_step": 135815, "epoch": 1636} {"train_loss": -23.153263092041016, "global_step": 135816, "epoch": 1636} {"train_loss": -22.93716049194336, "global_step": 135817, "epoch": 1636} {"train_loss": -23.099660873413086, "global_step": 135818, "epoch": 1636} {"train_loss": -23.088836669921875, "global_step": 135819, "epoch": 1636} {"train_loss": -22.893754959106445, "global_step": 135820, "epoch": 1636} {"train_loss": -23.024662017822266, "global_step": 135821, "epoch": 1636} {"train_loss": -22.562885284423828, "global_step": 135822, "epoch": 1636} {"train_loss": -22.891407012939453, "global_step": 135823, "epoch": 1636} {"train_loss": -22.85236167907715, "global_step": 135824, "epoch": 1636} {"train_loss": -22.94114112854004, "global_step": 135825, "epoch": 1636} {"train_loss": -22.75765037536621, "global_step": 135826, "epoch": 1636} {"train_loss": -22.82761573791504, "global_step": 135827, "epoch": 1636} {"train_loss": -22.824325561523438, "global_step": 135828, "epoch": 1636} {"train_loss": -23.127887725830078, "global_step": 135829, "epoch": 1636} {"train_loss": -22.92243766784668, "global_step": 135830, "epoch": 1636} {"train_loss": -23.059371948242188, "global_step": 135831, "epoch": 1636} {"train_loss": -23.00402069091797, "global_step": 135832, "epoch": 1636} {"train_loss": -22.926618576049805, "global_step": 135833, "epoch": 1636} {"train_loss": -23.105777740478516, "global_step": 135834, "epoch": 1636} {"train_loss": -22.934215545654297, "global_step": 135835, "epoch": 1636} {"train_loss": -23.068735122680664, "global_step": 135836, "epoch": 1636} {"train_loss": -23.048139572143555, "global_step": 135837, "epoch": 1636} {"train_loss": -23.03044319152832, "global_step": 135838, "epoch": 1636} {"train_loss": -23.023313522338867, "global_step": 135839, "epoch": 1636} {"train_loss": -23.031023025512695, "global_step": 135840, "epoch": 1636} {"train_loss": -22.97254753112793, "global_step": 135841, "epoch": 1636} {"train_loss": -22.77384376525879, "global_step": 135842, "epoch": 1636} {"train_loss": -22.631444931030273, "global_step": 135843, "epoch": 1636} {"train_loss": -23.072633743286133, "global_step": 135844, "epoch": 1636} {"train_loss": -23.024036407470703, "global_step": 135845, "epoch": 1636} {"train_loss": -22.66368293762207, "global_step": 135846, "epoch": 1636} {"train_loss": -22.845531463623047, "global_step": 135847, "epoch": 1636} {"train_loss": -23.028600692749023, "global_step": 135848, "epoch": 1636} {"train_loss": -22.86124038696289, "global_step": 135849, "epoch": 1636} {"train_loss": -23.05121421813965, "global_step": 135850, "epoch": 1636} {"train_loss": -22.849294662475586, "global_step": 135851, "epoch": 1636} {"train_loss": -23.119768142700195, "global_step": 135852, "epoch": 1636} {"train_loss": -23.14614486694336, "global_step": 135853, "epoch": 1636} {"train_loss": -22.73747444152832, "global_step": 135854, "epoch": 1636} {"train_loss": -22.766374588012695, "global_step": 135855, "epoch": 1636} {"train_loss": -22.759489059448242, "global_step": 135856, "epoch": 1636} {"train_loss": -23.39095115661621, "global_step": 135857, "epoch": 1636} {"train_loss": -23.414997100830078, "global_step": 135858, "epoch": 1636} {"train_loss": -22.79499053955078, "global_step": 135859, "epoch": 1636} {"train_loss": -23.102384567260742, "global_step": 135860, "epoch": 1636} {"train_loss": -23.22552490234375, "global_step": 135861, "epoch": 1636} {"train_loss": -22.960102081298828, "global_step": 135862, "epoch": 1636} {"train_loss": -23.1378116607666, "global_step": 135863, "epoch": 1636} {"train_loss": -23.346616744995117, "global_step": 135864, "epoch": 1636} {"train_loss": -22.908973693847656, "global_step": 135865, "epoch": 1636} {"train_loss": -22.868440628051758, "global_step": 135866, "epoch": 1636} {"train_loss": -23.077749252319336, "global_step": 135867, "epoch": 1636} {"train_loss": -23.48591423034668, "global_step": 135868, "epoch": 1636} {"train_loss": -22.87249183654785, "global_step": 135869, "epoch": 1636} {"train_loss": -22.831120502517884, "global_step": 135870, "epoch": 1636, "val_loss": 6217667.0} {"train_loss": -22.988895416259766, "global_step": 135871, "epoch": 1637} {"train_loss": -22.972084045410156, "global_step": 135872, "epoch": 1637} {"train_loss": -22.402074813842773, "global_step": 135873, "epoch": 1637} {"train_loss": -22.761686325073242, "global_step": 135874, "epoch": 1637} {"train_loss": -22.758955001831055, "global_step": 135875, "epoch": 1637} {"train_loss": -22.635665893554688, "global_step": 135876, "epoch": 1637} {"train_loss": -22.37552261352539, "global_step": 135877, "epoch": 1637} {"train_loss": -22.626361846923828, "global_step": 135878, "epoch": 1637} {"train_loss": -22.391345977783203, "global_step": 135879, "epoch": 1637} {"train_loss": -22.537456512451172, "global_step": 135880, "epoch": 1637} {"train_loss": -23.01659393310547, "global_step": 135881, "epoch": 1637} {"train_loss": -22.44399070739746, "global_step": 135882, "epoch": 1637} {"train_loss": -22.681278228759766, "global_step": 135883, "epoch": 1637} {"train_loss": -22.68927001953125, "global_step": 135884, "epoch": 1637} {"train_loss": -22.84292221069336, "global_step": 135885, "epoch": 1637} {"train_loss": -22.59493064880371, "global_step": 135886, "epoch": 1637} {"train_loss": -22.691259384155273, "global_step": 135887, "epoch": 1637} {"train_loss": -22.908910751342773, "global_step": 135888, "epoch": 1637} {"train_loss": -22.902658462524414, "global_step": 135889, "epoch": 1637} {"train_loss": -22.734546661376953, "global_step": 135890, "epoch": 1637} {"train_loss": -23.00711441040039, "global_step": 135891, "epoch": 1637} {"train_loss": -22.737512588500977, "global_step": 135892, "epoch": 1637} {"train_loss": -23.21886444091797, "global_step": 135893, "epoch": 1637} {"train_loss": -22.932363510131836, "global_step": 135894, "epoch": 1637} {"train_loss": -22.984533309936523, "global_step": 135895, "epoch": 1637} {"train_loss": -22.939435958862305, "global_step": 135896, "epoch": 1637} {"train_loss": -22.559038162231445, "global_step": 135897, "epoch": 1637} {"train_loss": -22.80830955505371, "global_step": 135898, "epoch": 1637} {"train_loss": -23.0803279876709, "global_step": 135899, "epoch": 1637} {"train_loss": -23.039535522460938, "global_step": 135900, "epoch": 1637} {"train_loss": -22.954694747924805, "global_step": 135901, "epoch": 1637} {"train_loss": -23.238773345947266, "global_step": 135902, "epoch": 1637} {"train_loss": -23.18929100036621, "global_step": 135903, "epoch": 1637} {"train_loss": -23.13172149658203, "global_step": 135904, "epoch": 1637} {"train_loss": -22.933988571166992, "global_step": 135905, "epoch": 1637} {"train_loss": -22.783294677734375, "global_step": 135906, "epoch": 1637} {"train_loss": -22.65761375427246, "global_step": 135907, "epoch": 1637} {"train_loss": -23.133411407470703, "global_step": 135908, "epoch": 1637} {"train_loss": -23.208690643310547, "global_step": 135909, "epoch": 1637} {"train_loss": -23.148210525512695, "global_step": 135910, "epoch": 1637} {"train_loss": -22.848648071289062, "global_step": 135911, "epoch": 1637} {"train_loss": -23.415002822875977, "global_step": 135912, "epoch": 1637} {"train_loss": -23.171247482299805, "global_step": 135913, "epoch": 1637} {"train_loss": -23.076026916503906, "global_step": 135914, "epoch": 1637} {"train_loss": -22.93123435974121, "global_step": 135915, "epoch": 1637} {"train_loss": -22.746763229370117, "global_step": 135916, "epoch": 1637} {"train_loss": -22.92963409423828, "global_step": 135917, "epoch": 1637} {"train_loss": -23.19584083557129, "global_step": 135918, "epoch": 1637} {"train_loss": -22.540525436401367, "global_step": 135919, "epoch": 1637} {"train_loss": -23.109594345092773, "global_step": 135920, "epoch": 1637} {"train_loss": -22.90067481994629, "global_step": 135921, "epoch": 1637} {"train_loss": -23.004003524780273, "global_step": 135922, "epoch": 1637} {"train_loss": -22.853979110717773, "global_step": 135923, "epoch": 1637} {"train_loss": -22.93147850036621, "global_step": 135924, "epoch": 1637} {"train_loss": -22.745573043823242, "global_step": 135925, "epoch": 1637} {"train_loss": -22.715316772460938, "global_step": 135926, "epoch": 1637} {"train_loss": -22.717971801757812, "global_step": 135927, "epoch": 1637} {"train_loss": -23.178691864013672, "global_step": 135928, "epoch": 1637} {"train_loss": -22.92133903503418, "global_step": 135929, "epoch": 1637} {"train_loss": -23.022314071655273, "global_step": 135930, "epoch": 1637} {"train_loss": -23.034542083740234, "global_step": 135931, "epoch": 1637} {"train_loss": -23.034236907958984, "global_step": 135932, "epoch": 1637} {"train_loss": -22.836164474487305, "global_step": 135933, "epoch": 1637} {"train_loss": -22.75016212463379, "global_step": 135934, "epoch": 1637} {"train_loss": -22.84354591369629, "global_step": 135935, "epoch": 1637} {"train_loss": -22.7553768157959, "global_step": 135936, "epoch": 1637} {"train_loss": -22.796995162963867, "global_step": 135937, "epoch": 1637} {"train_loss": -22.62568473815918, "global_step": 135938, "epoch": 1637} {"train_loss": -23.0531063079834, "global_step": 135939, "epoch": 1637} {"train_loss": -22.947885513305664, "global_step": 135940, "epoch": 1637} {"train_loss": -22.756738662719727, "global_step": 135941, "epoch": 1637} {"train_loss": -22.962209701538086, "global_step": 135942, "epoch": 1637} {"train_loss": -23.035396575927734, "global_step": 135943, "epoch": 1637} {"train_loss": -23.41678237915039, "global_step": 135944, "epoch": 1637} {"train_loss": -23.162450790405273, "global_step": 135945, "epoch": 1637} {"train_loss": -23.249649047851562, "global_step": 135946, "epoch": 1637} {"train_loss": -23.045438766479492, "global_step": 135947, "epoch": 1637} {"train_loss": -23.018747329711914, "global_step": 135948, "epoch": 1637} {"train_loss": -23.43280792236328, "global_step": 135949, "epoch": 1637} {"train_loss": -22.61060905456543, "global_step": 135950, "epoch": 1637} {"train_loss": -22.842248916625977, "global_step": 135951, "epoch": 1637} {"train_loss": -22.903249740600586, "global_step": 135952, "epoch": 1637} {"train_loss": -22.91522979736328, "global_step": 135953, "epoch": 1637, "val_loss": 6373950.5} {"train_loss": -22.148365020751953, "global_step": 135954, "epoch": 1638} {"train_loss": -21.391637802124023, "global_step": 135955, "epoch": 1638} {"train_loss": -22.195514678955078, "global_step": 135956, "epoch": 1638} {"train_loss": -22.289758682250977, "global_step": 135957, "epoch": 1638} {"train_loss": -22.31610870361328, "global_step": 135958, "epoch": 1638} {"train_loss": -22.248212814331055, "global_step": 135959, "epoch": 1638} {"train_loss": -22.143310546875, "global_step": 135960, "epoch": 1638} {"train_loss": -22.23272132873535, "global_step": 135961, "epoch": 1638} {"train_loss": -22.91086769104004, "global_step": 135962, "epoch": 1638} {"train_loss": -22.059255599975586, "global_step": 135963, "epoch": 1638} {"train_loss": -22.550756454467773, "global_step": 135964, "epoch": 1638} {"train_loss": -22.653799057006836, "global_step": 135965, "epoch": 1638} {"train_loss": -22.724523544311523, "global_step": 135966, "epoch": 1638} {"train_loss": -22.73621940612793, "global_step": 135967, "epoch": 1638} {"train_loss": -22.589792251586914, "global_step": 135968, "epoch": 1638} {"train_loss": -22.982757568359375, "global_step": 135969, "epoch": 1638} {"train_loss": -22.70667839050293, "global_step": 135970, "epoch": 1638} {"train_loss": -22.72418785095215, "global_step": 135971, "epoch": 1638} {"train_loss": -22.575586318969727, "global_step": 135972, "epoch": 1638} {"train_loss": -22.686553955078125, "global_step": 135973, "epoch": 1638} {"train_loss": -22.66373062133789, "global_step": 135974, "epoch": 1638} {"train_loss": -23.168210983276367, "global_step": 135975, "epoch": 1638} {"train_loss": -22.81156349182129, "global_step": 135976, "epoch": 1638} {"train_loss": -23.06300926208496, "global_step": 135977, "epoch": 1638} {"train_loss": -22.74476432800293, "global_step": 135978, "epoch": 1638} {"train_loss": -22.894134521484375, "global_step": 135979, "epoch": 1638} {"train_loss": -23.075096130371094, "global_step": 135980, "epoch": 1638} {"train_loss": -22.63222312927246, "global_step": 135981, "epoch": 1638} {"train_loss": -22.846799850463867, "global_step": 135982, "epoch": 1638} {"train_loss": -22.718385696411133, "global_step": 135983, "epoch": 1638} {"train_loss": -23.15421485900879, "global_step": 135984, "epoch": 1638} {"train_loss": -23.010122299194336, "global_step": 135985, "epoch": 1638} {"train_loss": -23.235620498657227, "global_step": 135986, "epoch": 1638} {"train_loss": -22.823740005493164, "global_step": 135987, "epoch": 1638} {"train_loss": -22.785558700561523, "global_step": 135988, "epoch": 1638} {"train_loss": -23.26047706604004, "global_step": 135989, "epoch": 1638} {"train_loss": -22.952116012573242, "global_step": 135990, "epoch": 1638} {"train_loss": -23.113840103149414, "global_step": 135991, "epoch": 1638} {"train_loss": -22.697065353393555, "global_step": 135992, "epoch": 1638} {"train_loss": -22.972204208374023, "global_step": 135993, "epoch": 1638} {"train_loss": -23.212799072265625, "global_step": 135994, "epoch": 1638} {"train_loss": -22.689476013183594, "global_step": 135995, "epoch": 1638} {"train_loss": -22.78681182861328, "global_step": 135996, "epoch": 1638} {"train_loss": -22.7083740234375, "global_step": 135997, "epoch": 1638} {"train_loss": -22.779691696166992, "global_step": 135998, "epoch": 1638} {"train_loss": -22.478843688964844, "global_step": 135999, "epoch": 1638} {"train_loss": -23.110883712768555, "global_step": 136000, "epoch": 1638} {"train_loss": -22.743682861328125, "global_step": 136001, "epoch": 1638} {"train_loss": -22.441984176635742, "global_step": 136002, "epoch": 1638} {"train_loss": -22.764631271362305, "global_step": 136003, "epoch": 1638} {"train_loss": -23.14472770690918, "global_step": 136004, "epoch": 1638} {"train_loss": -22.55611228942871, "global_step": 136005, "epoch": 1638} {"train_loss": -22.796388626098633, "global_step": 136006, "epoch": 1638} {"train_loss": -22.904857635498047, "global_step": 136007, "epoch": 1638} {"train_loss": -22.914527893066406, "global_step": 136008, "epoch": 1638} {"train_loss": -22.941186904907227, "global_step": 136009, "epoch": 1638} {"train_loss": -23.096654891967773, "global_step": 136010, "epoch": 1638} {"train_loss": -23.06522560119629, "global_step": 136011, "epoch": 1638} {"train_loss": -22.8106746673584, "global_step": 136012, "epoch": 1638} {"train_loss": -22.576984405517578, "global_step": 136013, "epoch": 1638} {"train_loss": -23.294265747070312, "global_step": 136014, "epoch": 1638} {"train_loss": -22.86144256591797, "global_step": 136015, "epoch": 1638} {"train_loss": -23.06513023376465, "global_step": 136016, "epoch": 1638} {"train_loss": -22.976272583007812, "global_step": 136017, "epoch": 1638} {"train_loss": -23.005064010620117, "global_step": 136018, "epoch": 1638} {"train_loss": -23.285655975341797, "global_step": 136019, "epoch": 1638} {"train_loss": -22.601762771606445, "global_step": 136020, "epoch": 1638} {"train_loss": -22.984189987182617, "global_step": 136021, "epoch": 1638} {"train_loss": -22.83795738220215, "global_step": 136022, "epoch": 1638} {"train_loss": -23.0345458984375, "global_step": 136023, "epoch": 1638} {"train_loss": -22.825820922851562, "global_step": 136024, "epoch": 1638} {"train_loss": -23.17023277282715, "global_step": 136025, "epoch": 1638} {"train_loss": -22.94015884399414, "global_step": 136026, "epoch": 1638} {"train_loss": -22.994091033935547, "global_step": 136027, "epoch": 1638} {"train_loss": -22.771442413330078, "global_step": 136028, "epoch": 1638} {"train_loss": -22.779346466064453, "global_step": 136029, "epoch": 1638} {"train_loss": -22.976682662963867, "global_step": 136030, "epoch": 1638} {"train_loss": -22.778675079345703, "global_step": 136031, "epoch": 1638} {"train_loss": -23.015241622924805, "global_step": 136032, "epoch": 1638} {"train_loss": -23.06690788269043, "global_step": 136033, "epoch": 1638} {"train_loss": -23.0869197845459, "global_step": 136034, "epoch": 1638} {"train_loss": -23.081281661987305, "global_step": 136035, "epoch": 1638} {"train_loss": -22.797389731349714, "global_step": 136036, "epoch": 1638, "val_loss": 6356373.0} {"train_loss": -22.757585525512695, "global_step": 136037, "epoch": 1639} {"train_loss": -22.85071563720703, "global_step": 136038, "epoch": 1639} {"train_loss": -22.441137313842773, "global_step": 136039, "epoch": 1639} {"train_loss": -23.064563751220703, "global_step": 136040, "epoch": 1639} {"train_loss": -22.84583854675293, "global_step": 136041, "epoch": 1639} {"train_loss": -23.043781280517578, "global_step": 136042, "epoch": 1639} {"train_loss": -22.918256759643555, "global_step": 136043, "epoch": 1639} {"train_loss": -22.857120513916016, "global_step": 136044, "epoch": 1639} {"train_loss": -23.03302764892578, "global_step": 136045, "epoch": 1639} {"train_loss": -22.375181198120117, "global_step": 136046, "epoch": 1639} {"train_loss": -22.513410568237305, "global_step": 136047, "epoch": 1639} {"train_loss": -22.92388343811035, "global_step": 136048, "epoch": 1639} {"train_loss": -22.704330444335938, "global_step": 136049, "epoch": 1639} {"train_loss": -22.774320602416992, "global_step": 136050, "epoch": 1639} {"train_loss": -22.802331924438477, "global_step": 136051, "epoch": 1639} {"train_loss": -22.90953254699707, "global_step": 136052, "epoch": 1639} {"train_loss": -23.143266677856445, "global_step": 136053, "epoch": 1639} {"train_loss": -22.712820053100586, "global_step": 136054, "epoch": 1639} {"train_loss": -22.98856544494629, "global_step": 136055, "epoch": 1639} {"train_loss": -22.632604598999023, "global_step": 136056, "epoch": 1639} {"train_loss": -22.9735164642334, "global_step": 136057, "epoch": 1639} {"train_loss": -23.05080795288086, "global_step": 136058, "epoch": 1639} {"train_loss": -22.917875289916992, "global_step": 136059, "epoch": 1639} {"train_loss": -22.887861251831055, "global_step": 136060, "epoch": 1639} {"train_loss": -23.283676147460938, "global_step": 136061, "epoch": 1639} {"train_loss": -23.043563842773438, "global_step": 136062, "epoch": 1639} {"train_loss": -23.156871795654297, "global_step": 136063, "epoch": 1639} {"train_loss": -23.383848190307617, "global_step": 136064, "epoch": 1639} {"train_loss": -23.01141929626465, "global_step": 136065, "epoch": 1639} {"train_loss": -22.754106521606445, "global_step": 136066, "epoch": 1639} {"train_loss": -23.129138946533203, "global_step": 136067, "epoch": 1639} {"train_loss": -22.713699340820312, "global_step": 136068, "epoch": 1639} {"train_loss": -22.856985092163086, "global_step": 136069, "epoch": 1639} {"train_loss": -22.67026138305664, "global_step": 136070, "epoch": 1639} {"train_loss": -22.451562881469727, "global_step": 136071, "epoch": 1639} {"train_loss": -22.873090744018555, "global_step": 136072, "epoch": 1639} {"train_loss": -22.81331443786621, "global_step": 136073, "epoch": 1639} {"train_loss": -23.071557998657227, "global_step": 136074, "epoch": 1639} {"train_loss": -22.537389755249023, "global_step": 136075, "epoch": 1639} {"train_loss": -22.218120574951172, "global_step": 136076, "epoch": 1639} {"train_loss": -22.967721939086914, "global_step": 136077, "epoch": 1639} {"train_loss": -22.92045783996582, "global_step": 136078, "epoch": 1639} {"train_loss": -22.098270416259766, "global_step": 136079, "epoch": 1639} {"train_loss": -22.529218673706055, "global_step": 136080, "epoch": 1639} {"train_loss": -23.11495018005371, "global_step": 136081, "epoch": 1639} {"train_loss": -22.35249137878418, "global_step": 136082, "epoch": 1639} {"train_loss": -22.95410919189453, "global_step": 136083, "epoch": 1639} {"train_loss": -22.99378776550293, "global_step": 136084, "epoch": 1639} {"train_loss": -23.01908302307129, "global_step": 136085, "epoch": 1639} {"train_loss": -22.695302963256836, "global_step": 136086, "epoch": 1639} {"train_loss": -22.932462692260742, "global_step": 136087, "epoch": 1639} {"train_loss": -22.893835067749023, "global_step": 136088, "epoch": 1639} {"train_loss": -23.11237144470215, "global_step": 136089, "epoch": 1639} {"train_loss": -22.949737548828125, "global_step": 136090, "epoch": 1639} {"train_loss": -22.906347274780273, "global_step": 136091, "epoch": 1639} {"train_loss": -22.472335815429688, "global_step": 136092, "epoch": 1639} {"train_loss": -23.060653686523438, "global_step": 136093, "epoch": 1639} {"train_loss": -23.09853172302246, "global_step": 136094, "epoch": 1639} {"train_loss": -23.044025421142578, "global_step": 136095, "epoch": 1639} {"train_loss": -22.723581314086914, "global_step": 136096, "epoch": 1639} {"train_loss": -22.52888298034668, "global_step": 136097, "epoch": 1639} {"train_loss": -22.663358688354492, "global_step": 136098, "epoch": 1639} {"train_loss": -23.30953025817871, "global_step": 136099, "epoch": 1639} {"train_loss": -22.725717544555664, "global_step": 136100, "epoch": 1639} {"train_loss": -23.254743576049805, "global_step": 136101, "epoch": 1639} {"train_loss": -22.729463577270508, "global_step": 136102, "epoch": 1639} {"train_loss": -22.82404136657715, "global_step": 136103, "epoch": 1639} {"train_loss": -22.768720626831055, "global_step": 136104, "epoch": 1639} {"train_loss": -23.04746437072754, "global_step": 136105, "epoch": 1639} {"train_loss": -23.0367431640625, "global_step": 136106, "epoch": 1639} {"train_loss": -22.464521408081055, "global_step": 136107, "epoch": 1639} {"train_loss": -23.441940307617188, "global_step": 136108, "epoch": 1639} {"train_loss": -23.06746482849121, "global_step": 136109, "epoch": 1639} {"train_loss": -23.063329696655273, "global_step": 136110, "epoch": 1639} {"train_loss": -22.692834854125977, "global_step": 136111, "epoch": 1639} {"train_loss": -22.986902236938477, "global_step": 136112, "epoch": 1639} {"train_loss": -22.759082794189453, "global_step": 136113, "epoch": 1639} {"train_loss": -22.781198501586914, "global_step": 136114, "epoch": 1639} {"train_loss": -22.557449340820312, "global_step": 136115, "epoch": 1639} {"train_loss": -22.80572509765625, "global_step": 136116, "epoch": 1639} {"train_loss": -22.512210845947266, "global_step": 136117, "epoch": 1639} {"train_loss": -22.854127883911133, "global_step": 136118, "epoch": 1639} {"train_loss": -22.83036668616605, "global_step": 136119, "epoch": 1639, "val_loss": 6221146.0} {"train_loss": -22.406076431274414, "global_step": 136120, "epoch": 1640} {"train_loss": -21.8250732421875, "global_step": 136121, "epoch": 1640} {"train_loss": -22.49315643310547, "global_step": 136122, "epoch": 1640} {"train_loss": -22.37760353088379, "global_step": 136123, "epoch": 1640} {"train_loss": -22.317480087280273, "global_step": 136124, "epoch": 1640} {"train_loss": -22.810489654541016, "global_step": 136125, "epoch": 1640} {"train_loss": -22.580434799194336, "global_step": 136126, "epoch": 1640} {"train_loss": -22.50266456604004, "global_step": 136127, "epoch": 1640} {"train_loss": -22.36225700378418, "global_step": 136128, "epoch": 1640} {"train_loss": -22.21217155456543, "global_step": 136129, "epoch": 1640} {"train_loss": -22.43406105041504, "global_step": 136130, "epoch": 1640} {"train_loss": -22.732389450073242, "global_step": 136131, "epoch": 1640} {"train_loss": -22.300033569335938, "global_step": 136132, "epoch": 1640} {"train_loss": -22.051542282104492, "global_step": 136133, "epoch": 1640} {"train_loss": -22.529088973999023, "global_step": 136134, "epoch": 1640} {"train_loss": -22.387405395507812, "global_step": 136135, "epoch": 1640} {"train_loss": -22.497446060180664, "global_step": 136136, "epoch": 1640} {"train_loss": -22.888330459594727, "global_step": 136137, "epoch": 1640} {"train_loss": -22.438716888427734, "global_step": 136138, "epoch": 1640} {"train_loss": -22.573471069335938, "global_step": 136139, "epoch": 1640} {"train_loss": -22.53676414489746, "global_step": 136140, "epoch": 1640} {"train_loss": -22.429086685180664, "global_step": 136141, "epoch": 1640} {"train_loss": -22.8696346282959, "global_step": 136142, "epoch": 1640} {"train_loss": -22.55824089050293, "global_step": 136143, "epoch": 1640} {"train_loss": -22.65816307067871, "global_step": 136144, "epoch": 1640} {"train_loss": -22.909164428710938, "global_step": 136145, "epoch": 1640} {"train_loss": -22.554428100585938, "global_step": 136146, "epoch": 1640} {"train_loss": -23.147144317626953, "global_step": 136147, "epoch": 1640} {"train_loss": -23.01431655883789, "global_step": 136148, "epoch": 1640} {"train_loss": -22.81252670288086, "global_step": 136149, "epoch": 1640} {"train_loss": -23.09812355041504, "global_step": 136150, "epoch": 1640} {"train_loss": -23.02193260192871, "global_step": 136151, "epoch": 1640} {"train_loss": -22.831584930419922, "global_step": 136152, "epoch": 1640} {"train_loss": -22.731908798217773, "global_step": 136153, "epoch": 1640} {"train_loss": -22.98719024658203, "global_step": 136154, "epoch": 1640} {"train_loss": -23.08241081237793, "global_step": 136155, "epoch": 1640} {"train_loss": -22.79110336303711, "global_step": 136156, "epoch": 1640} {"train_loss": -23.118009567260742, "global_step": 136157, "epoch": 1640} {"train_loss": -22.91646957397461, "global_step": 136158, "epoch": 1640} {"train_loss": -23.122465133666992, "global_step": 136159, "epoch": 1640} {"train_loss": -22.71563720703125, "global_step": 136160, "epoch": 1640} {"train_loss": -23.053131103515625, "global_step": 136161, "epoch": 1640} {"train_loss": -22.910734176635742, "global_step": 136162, "epoch": 1640} {"train_loss": -22.815216064453125, "global_step": 136163, "epoch": 1640} {"train_loss": -22.9887638092041, "global_step": 136164, "epoch": 1640} {"train_loss": -22.830936431884766, "global_step": 136165, "epoch": 1640} {"train_loss": -23.106624603271484, "global_step": 136166, "epoch": 1640} {"train_loss": -22.76527214050293, "global_step": 136167, "epoch": 1640} {"train_loss": -22.811779022216797, "global_step": 136168, "epoch": 1640} {"train_loss": -22.954486846923828, "global_step": 136169, "epoch": 1640} {"train_loss": -22.652366638183594, "global_step": 136170, "epoch": 1640} {"train_loss": -22.687978744506836, "global_step": 136171, "epoch": 1640} {"train_loss": -23.257328033447266, "global_step": 136172, "epoch": 1640} {"train_loss": -22.794166564941406, "global_step": 136173, "epoch": 1640} {"train_loss": -23.095632553100586, "global_step": 136174, "epoch": 1640} {"train_loss": -23.221277236938477, "global_step": 136175, "epoch": 1640} {"train_loss": -22.88458251953125, "global_step": 136176, "epoch": 1640} {"train_loss": -23.034299850463867, "global_step": 136177, "epoch": 1640} {"train_loss": -23.069868087768555, "global_step": 136178, "epoch": 1640} {"train_loss": -22.97354507446289, "global_step": 136179, "epoch": 1640} {"train_loss": -23.020170211791992, "global_step": 136180, "epoch": 1640} {"train_loss": -23.11814308166504, "global_step": 136181, "epoch": 1640} {"train_loss": -23.014205932617188, "global_step": 136182, "epoch": 1640} {"train_loss": -22.894046783447266, "global_step": 136183, "epoch": 1640} {"train_loss": -23.194839477539062, "global_step": 136184, "epoch": 1640} {"train_loss": -23.07405662536621, "global_step": 136185, "epoch": 1640} {"train_loss": -22.766313552856445, "global_step": 136186, "epoch": 1640} {"train_loss": -22.765180587768555, "global_step": 136187, "epoch": 1640} {"train_loss": -22.797332763671875, "global_step": 136188, "epoch": 1640} {"train_loss": -22.961301803588867, "global_step": 136189, "epoch": 1640} {"train_loss": -22.638547897338867, "global_step": 136190, "epoch": 1640} {"train_loss": -23.144214630126953, "global_step": 136191, "epoch": 1640} {"train_loss": -23.155363082885742, "global_step": 136192, "epoch": 1640} {"train_loss": -23.304685592651367, "global_step": 136193, "epoch": 1640} {"train_loss": -23.108320236206055, "global_step": 136194, "epoch": 1640} {"train_loss": -23.018667221069336, "global_step": 136195, "epoch": 1640} {"train_loss": -23.33491325378418, "global_step": 136196, "epoch": 1640} {"train_loss": -22.96193504333496, "global_step": 136197, "epoch": 1640} {"train_loss": -23.373394012451172, "global_step": 136198, "epoch": 1640} {"train_loss": -22.748653411865234, "global_step": 136199, "epoch": 1640} {"train_loss": -22.841516494750977, "global_step": 136200, "epoch": 1640} {"train_loss": -23.077566146850586, "global_step": 136201, "epoch": 1640} {"train_loss": -22.808613627789967, "global_step": 136202, "epoch": 1640, "val_loss": 6292923.0} {"train_loss": -22.618783950805664, "global_step": 136203, "epoch": 1641} {"train_loss": -22.667490005493164, "global_step": 136204, "epoch": 1641} {"train_loss": -22.534696578979492, "global_step": 136205, "epoch": 1641} {"train_loss": -22.727365493774414, "global_step": 136206, "epoch": 1641} {"train_loss": -22.646474838256836, "global_step": 136207, "epoch": 1641} {"train_loss": -22.898874282836914, "global_step": 136208, "epoch": 1641} {"train_loss": -22.69684410095215, "global_step": 136209, "epoch": 1641} {"train_loss": -22.22357940673828, "global_step": 136210, "epoch": 1641} {"train_loss": -22.48829460144043, "global_step": 136211, "epoch": 1641} {"train_loss": -22.749656677246094, "global_step": 136212, "epoch": 1641} {"train_loss": -23.03189468383789, "global_step": 136213, "epoch": 1641} {"train_loss": -22.469934463500977, "global_step": 136214, "epoch": 1641} {"train_loss": -22.898914337158203, "global_step": 136215, "epoch": 1641} {"train_loss": -22.299894332885742, "global_step": 136216, "epoch": 1641} {"train_loss": -22.654096603393555, "global_step": 136217, "epoch": 1641} {"train_loss": -22.76905059814453, "global_step": 136218, "epoch": 1641} {"train_loss": -22.454797744750977, "global_step": 136219, "epoch": 1641} {"train_loss": -23.067914962768555, "global_step": 136220, "epoch": 1641} {"train_loss": -22.45697593688965, "global_step": 136221, "epoch": 1641} {"train_loss": -22.24513053894043, "global_step": 136222, "epoch": 1641} {"train_loss": -22.950830459594727, "global_step": 136223, "epoch": 1641} {"train_loss": -22.891172409057617, "global_step": 136224, "epoch": 1641} {"train_loss": -22.50846290588379, "global_step": 136225, "epoch": 1641} {"train_loss": -22.74271011352539, "global_step": 136226, "epoch": 1641} {"train_loss": -23.0743408203125, "global_step": 136227, "epoch": 1641} {"train_loss": -23.068403244018555, "global_step": 136228, "epoch": 1641} {"train_loss": -22.97263526916504, "global_step": 136229, "epoch": 1641} {"train_loss": -23.081161499023438, "global_step": 136230, "epoch": 1641} {"train_loss": -22.861902236938477, "global_step": 136231, "epoch": 1641} {"train_loss": -22.71909523010254, "global_step": 136232, "epoch": 1641} {"train_loss": -23.402393341064453, "global_step": 136233, "epoch": 1641} {"train_loss": -23.285873413085938, "global_step": 136234, "epoch": 1641} {"train_loss": -23.000965118408203, "global_step": 136235, "epoch": 1641} {"train_loss": -22.888050079345703, "global_step": 136236, "epoch": 1641} {"train_loss": -22.915010452270508, "global_step": 136237, "epoch": 1641} {"train_loss": -22.79756736755371, "global_step": 136238, "epoch": 1641} {"train_loss": -22.837621688842773, "global_step": 136239, "epoch": 1641} {"train_loss": -23.082904815673828, "global_step": 136240, "epoch": 1641} {"train_loss": -23.200956344604492, "global_step": 136241, "epoch": 1641} {"train_loss": -23.061664581298828, "global_step": 136242, "epoch": 1641} {"train_loss": -22.655181884765625, "global_step": 136243, "epoch": 1641} {"train_loss": -22.570539474487305, "global_step": 136244, "epoch": 1641} {"train_loss": -22.7381591796875, "global_step": 136245, "epoch": 1641} {"train_loss": -22.777692794799805, "global_step": 136246, "epoch": 1641} {"train_loss": -22.933692932128906, "global_step": 136247, "epoch": 1641} {"train_loss": -22.78371238708496, "global_step": 136248, "epoch": 1641} {"train_loss": -22.518901824951172, "global_step": 136249, "epoch": 1641} {"train_loss": -22.91730308532715, "global_step": 136250, "epoch": 1641} {"train_loss": -23.028182983398438, "global_step": 136251, "epoch": 1641} {"train_loss": -22.910978317260742, "global_step": 136252, "epoch": 1641} {"train_loss": -22.69502830505371, "global_step": 136253, "epoch": 1641} {"train_loss": -22.920907974243164, "global_step": 136254, "epoch": 1641} {"train_loss": -22.93671989440918, "global_step": 136255, "epoch": 1641} {"train_loss": -22.901281356811523, "global_step": 136256, "epoch": 1641} {"train_loss": -23.183990478515625, "global_step": 136257, "epoch": 1641} {"train_loss": -23.0599308013916, "global_step": 136258, "epoch": 1641} {"train_loss": -23.17812156677246, "global_step": 136259, "epoch": 1641} {"train_loss": -22.642213821411133, "global_step": 136260, "epoch": 1641} {"train_loss": -22.495468139648438, "global_step": 136261, "epoch": 1641} {"train_loss": -22.925968170166016, "global_step": 136262, "epoch": 1641} {"train_loss": -22.70004653930664, "global_step": 136263, "epoch": 1641} {"train_loss": -22.829877853393555, "global_step": 136264, "epoch": 1641} {"train_loss": -22.889699935913086, "global_step": 136265, "epoch": 1641} {"train_loss": -22.691373825073242, "global_step": 136266, "epoch": 1641} {"train_loss": -23.060855865478516, "global_step": 136267, "epoch": 1641} {"train_loss": -22.982858657836914, "global_step": 136268, "epoch": 1641} {"train_loss": -23.106563568115234, "global_step": 136269, "epoch": 1641} {"train_loss": -23.509008407592773, "global_step": 136270, "epoch": 1641} {"train_loss": -22.814496994018555, "global_step": 136271, "epoch": 1641} {"train_loss": -23.471729278564453, "global_step": 136272, "epoch": 1641} {"train_loss": -23.031400680541992, "global_step": 136273, "epoch": 1641} {"train_loss": -22.959196090698242, "global_step": 136274, "epoch": 1641} {"train_loss": -23.13574981689453, "global_step": 136275, "epoch": 1641} {"train_loss": -23.03340721130371, "global_step": 136276, "epoch": 1641} {"train_loss": -23.090797424316406, "global_step": 136277, "epoch": 1641} {"train_loss": -22.990737915039062, "global_step": 136278, "epoch": 1641} {"train_loss": -22.886953353881836, "global_step": 136279, "epoch": 1641} {"train_loss": -22.82076072692871, "global_step": 136280, "epoch": 1641} {"train_loss": -23.147348403930664, "global_step": 136281, "epoch": 1641} {"train_loss": -23.08677101135254, "global_step": 136282, "epoch": 1641} {"train_loss": -22.578536987304688, "global_step": 136283, "epoch": 1641} {"train_loss": -23.595123291015625, "global_step": 136284, "epoch": 1641} {"train_loss": -22.841239400656825, "global_step": 136285, "epoch": 1641, "val_loss": 6312976.5} {"train_loss": -22.5794677734375, "global_step": 136286, "epoch": 1642} {"train_loss": -22.641868591308594, "global_step": 136287, "epoch": 1642} {"train_loss": -22.297208786010742, "global_step": 136288, "epoch": 1642} {"train_loss": -22.745532989501953, "global_step": 136289, "epoch": 1642} {"train_loss": -22.55770492553711, "global_step": 136290, "epoch": 1642} {"train_loss": -22.6937255859375, "global_step": 136291, "epoch": 1642} {"train_loss": -22.52027702331543, "global_step": 136292, "epoch": 1642} {"train_loss": -22.651935577392578, "global_step": 136293, "epoch": 1642} {"train_loss": -22.633481979370117, "global_step": 136294, "epoch": 1642} {"train_loss": -22.607349395751953, "global_step": 136295, "epoch": 1642} {"train_loss": -22.64596939086914, "global_step": 136296, "epoch": 1642} {"train_loss": -23.356971740722656, "global_step": 136297, "epoch": 1642} {"train_loss": -22.95395278930664, "global_step": 136298, "epoch": 1642} {"train_loss": -22.392841339111328, "global_step": 136299, "epoch": 1642} {"train_loss": -22.622663497924805, "global_step": 136300, "epoch": 1642} {"train_loss": -22.65787124633789, "global_step": 136301, "epoch": 1642} {"train_loss": -22.776281356811523, "global_step": 136302, "epoch": 1642} {"train_loss": -22.478139877319336, "global_step": 136303, "epoch": 1642} {"train_loss": -22.579906463623047, "global_step": 136304, "epoch": 1642} {"train_loss": -22.93312644958496, "global_step": 136305, "epoch": 1642} {"train_loss": -22.896421432495117, "global_step": 136306, "epoch": 1642} {"train_loss": -23.11237907409668, "global_step": 136307, "epoch": 1642} {"train_loss": -22.68174171447754, "global_step": 136308, "epoch": 1642} {"train_loss": -22.660491943359375, "global_step": 136309, "epoch": 1642} {"train_loss": -22.95733642578125, "global_step": 136310, "epoch": 1642} {"train_loss": -22.935272216796875, "global_step": 136311, "epoch": 1642} {"train_loss": -22.680397033691406, "global_step": 136312, "epoch": 1642} {"train_loss": -22.303619384765625, "global_step": 136313, "epoch": 1642} {"train_loss": -22.825220108032227, "global_step": 136314, "epoch": 1642} {"train_loss": -23.1976318359375, "global_step": 136315, "epoch": 1642} {"train_loss": -22.912439346313477, "global_step": 136316, "epoch": 1642} {"train_loss": -22.763944625854492, "global_step": 136317, "epoch": 1642} {"train_loss": -22.956884384155273, "global_step": 136318, "epoch": 1642} {"train_loss": -23.222143173217773, "global_step": 136319, "epoch": 1642} {"train_loss": -23.01727294921875, "global_step": 136320, "epoch": 1642} {"train_loss": -23.153593063354492, "global_step": 136321, "epoch": 1642} {"train_loss": -23.103185653686523, "global_step": 136322, "epoch": 1642} {"train_loss": -22.81504249572754, "global_step": 136323, "epoch": 1642} {"train_loss": -23.014257431030273, "global_step": 136324, "epoch": 1642} {"train_loss": -22.957189559936523, "global_step": 136325, "epoch": 1642} {"train_loss": -22.919845581054688, "global_step": 136326, "epoch": 1642} {"train_loss": -22.644702911376953, "global_step": 136327, "epoch": 1642} {"train_loss": -22.929716110229492, "global_step": 136328, "epoch": 1642} {"train_loss": -22.903850555419922, "global_step": 136329, "epoch": 1642} {"train_loss": -22.728185653686523, "global_step": 136330, "epoch": 1642} {"train_loss": -23.158872604370117, "global_step": 136331, "epoch": 1642} {"train_loss": -23.044723510742188, "global_step": 136332, "epoch": 1642} {"train_loss": -23.107690811157227, "global_step": 136333, "epoch": 1642} {"train_loss": -23.238601684570312, "global_step": 136334, "epoch": 1642} {"train_loss": -22.65479850769043, "global_step": 136335, "epoch": 1642} {"train_loss": -22.995229721069336, "global_step": 136336, "epoch": 1642} {"train_loss": -22.657184600830078, "global_step": 136337, "epoch": 1642} {"train_loss": -22.505887985229492, "global_step": 136338, "epoch": 1642} {"train_loss": -23.104841232299805, "global_step": 136339, "epoch": 1642} {"train_loss": -23.06195831298828, "global_step": 136340, "epoch": 1642} {"train_loss": -22.726612091064453, "global_step": 136341, "epoch": 1642} {"train_loss": -23.112255096435547, "global_step": 136342, "epoch": 1642} {"train_loss": -23.17780876159668, "global_step": 136343, "epoch": 1642} {"train_loss": -22.889368057250977, "global_step": 136344, "epoch": 1642} {"train_loss": -22.998401641845703, "global_step": 136345, "epoch": 1642} {"train_loss": -22.96269989013672, "global_step": 136346, "epoch": 1642} {"train_loss": -23.022279739379883, "global_step": 136347, "epoch": 1642} {"train_loss": -22.73917579650879, "global_step": 136348, "epoch": 1642} {"train_loss": -22.982641220092773, "global_step": 136349, "epoch": 1642} {"train_loss": -22.551136016845703, "global_step": 136350, "epoch": 1642} {"train_loss": -22.65754508972168, "global_step": 136351, "epoch": 1642} {"train_loss": -22.835046768188477, "global_step": 136352, "epoch": 1642} {"train_loss": -23.11012077331543, "global_step": 136353, "epoch": 1642} {"train_loss": -22.802412033081055, "global_step": 136354, "epoch": 1642} {"train_loss": -23.132417678833008, "global_step": 136355, "epoch": 1642} {"train_loss": -22.920166015625, "global_step": 136356, "epoch": 1642} {"train_loss": -22.99306297302246, "global_step": 136357, "epoch": 1642} {"train_loss": -22.9809627532959, "global_step": 136358, "epoch": 1642} {"train_loss": -22.652345657348633, "global_step": 136359, "epoch": 1642} {"train_loss": -22.988805770874023, "global_step": 136360, "epoch": 1642} {"train_loss": -22.99501609802246, "global_step": 136361, "epoch": 1642} {"train_loss": -22.989622116088867, "global_step": 136362, "epoch": 1642} {"train_loss": -23.407386779785156, "global_step": 136363, "epoch": 1642} {"train_loss": -23.06888771057129, "global_step": 136364, "epoch": 1642} {"train_loss": -23.192062377929688, "global_step": 136365, "epoch": 1642} {"train_loss": -22.8763484954834, "global_step": 136366, "epoch": 1642} {"train_loss": -23.168542861938477, "global_step": 136367, "epoch": 1642} {"train_loss": -22.860778946474372, "global_step": 136368, "epoch": 1642, "val_loss": 6327268.0} {"train_loss": -22.95633888244629, "global_step": 136369, "epoch": 1643} {"train_loss": -22.730384826660156, "global_step": 136370, "epoch": 1643} {"train_loss": -22.670690536499023, "global_step": 136371, "epoch": 1643} {"train_loss": -22.445175170898438, "global_step": 136372, "epoch": 1643} {"train_loss": -22.511173248291016, "global_step": 136373, "epoch": 1643} {"train_loss": -22.680683135986328, "global_step": 136374, "epoch": 1643} {"train_loss": -22.970060348510742, "global_step": 136375, "epoch": 1643} {"train_loss": -23.084074020385742, "global_step": 136376, "epoch": 1643} {"train_loss": -22.958845138549805, "global_step": 136377, "epoch": 1643} {"train_loss": -22.67194938659668, "global_step": 136378, "epoch": 1643} {"train_loss": -23.39105224609375, "global_step": 136379, "epoch": 1643} {"train_loss": -22.805343627929688, "global_step": 136380, "epoch": 1643} {"train_loss": -22.92230796813965, "global_step": 136381, "epoch": 1643} {"train_loss": -22.60947608947754, "global_step": 136382, "epoch": 1643} {"train_loss": -22.545434951782227, "global_step": 136383, "epoch": 1643} {"train_loss": -23.012479782104492, "global_step": 136384, "epoch": 1643} {"train_loss": -23.352136611938477, "global_step": 136385, "epoch": 1643} {"train_loss": -23.006534576416016, "global_step": 136386, "epoch": 1643} {"train_loss": -22.53647804260254, "global_step": 136387, "epoch": 1643} {"train_loss": -22.97446632385254, "global_step": 136388, "epoch": 1643} {"train_loss": -23.01771354675293, "global_step": 136389, "epoch": 1643} {"train_loss": -22.98233413696289, "global_step": 136390, "epoch": 1643} {"train_loss": -22.415241241455078, "global_step": 136391, "epoch": 1643} {"train_loss": -22.34221839904785, "global_step": 136392, "epoch": 1643} {"train_loss": -22.638179779052734, "global_step": 136393, "epoch": 1643} {"train_loss": -22.97844886779785, "global_step": 136394, "epoch": 1643} {"train_loss": -22.78306007385254, "global_step": 136395, "epoch": 1643} {"train_loss": -22.93538475036621, "global_step": 136396, "epoch": 1643} {"train_loss": -23.122751235961914, "global_step": 136397, "epoch": 1643} {"train_loss": -22.794370651245117, "global_step": 136398, "epoch": 1643} {"train_loss": -22.914182662963867, "global_step": 136399, "epoch": 1643} {"train_loss": -22.525487899780273, "global_step": 136400, "epoch": 1643} {"train_loss": -23.174453735351562, "global_step": 136401, "epoch": 1643} {"train_loss": -22.903066635131836, "global_step": 136402, "epoch": 1643} {"train_loss": -22.988739013671875, "global_step": 136403, "epoch": 1643} {"train_loss": -22.758739471435547, "global_step": 136404, "epoch": 1643} {"train_loss": -22.7288818359375, "global_step": 136405, "epoch": 1643} {"train_loss": -22.905906677246094, "global_step": 136406, "epoch": 1643} {"train_loss": -22.803253173828125, "global_step": 136407, "epoch": 1643} {"train_loss": -22.90179443359375, "global_step": 136408, "epoch": 1643} {"train_loss": -23.059946060180664, "global_step": 136409, "epoch": 1643} {"train_loss": -23.1068058013916, "global_step": 136410, "epoch": 1643} {"train_loss": -23.08740234375, "global_step": 136411, "epoch": 1643} {"train_loss": -23.038251876831055, "global_step": 136412, "epoch": 1643} {"train_loss": -23.160083770751953, "global_step": 136413, "epoch": 1643} {"train_loss": -22.929967880249023, "global_step": 136414, "epoch": 1643} {"train_loss": -22.783620834350586, "global_step": 136415, "epoch": 1643} {"train_loss": -22.692951202392578, "global_step": 136416, "epoch": 1643} {"train_loss": -23.022695541381836, "global_step": 136417, "epoch": 1643} {"train_loss": -22.781253814697266, "global_step": 136418, "epoch": 1643} {"train_loss": -23.119855880737305, "global_step": 136419, "epoch": 1643} {"train_loss": -23.303539276123047, "global_step": 136420, "epoch": 1643} {"train_loss": -22.950529098510742, "global_step": 136421, "epoch": 1643} {"train_loss": -23.21553611755371, "global_step": 136422, "epoch": 1643} {"train_loss": -22.84954833984375, "global_step": 136423, "epoch": 1643} {"train_loss": -23.174747467041016, "global_step": 136424, "epoch": 1643} {"train_loss": -23.323246002197266, "global_step": 136425, "epoch": 1643} {"train_loss": -22.969722747802734, "global_step": 136426, "epoch": 1643} {"train_loss": -23.043569564819336, "global_step": 136427, "epoch": 1643} {"train_loss": -22.84185791015625, "global_step": 136428, "epoch": 1643} {"train_loss": -22.59062957763672, "global_step": 136429, "epoch": 1643} {"train_loss": -23.132543563842773, "global_step": 136430, "epoch": 1643} {"train_loss": -22.642742156982422, "global_step": 136431, "epoch": 1643} {"train_loss": -22.55994987487793, "global_step": 136432, "epoch": 1643} {"train_loss": -22.55193519592285, "global_step": 136433, "epoch": 1643} {"train_loss": -22.63825798034668, "global_step": 136434, "epoch": 1643} {"train_loss": -22.909513473510742, "global_step": 136435, "epoch": 1643} {"train_loss": -22.860252380371094, "global_step": 136436, "epoch": 1643} {"train_loss": -22.67239761352539, "global_step": 136437, "epoch": 1643} {"train_loss": -22.94601058959961, "global_step": 136438, "epoch": 1643} {"train_loss": -22.84052085876465, "global_step": 136439, "epoch": 1643} {"train_loss": -22.67543601989746, "global_step": 136440, "epoch": 1643} {"train_loss": -22.61606788635254, "global_step": 136441, "epoch": 1643} {"train_loss": -22.773683547973633, "global_step": 136442, "epoch": 1643} {"train_loss": -22.814619064331055, "global_step": 136443, "epoch": 1643} {"train_loss": -23.0363712310791, "global_step": 136444, "epoch": 1643} {"train_loss": -23.17194938659668, "global_step": 136445, "epoch": 1643} {"train_loss": -22.931135177612305, "global_step": 136446, "epoch": 1643} {"train_loss": -22.95192527770996, "global_step": 136447, "epoch": 1643} {"train_loss": -22.556806564331055, "global_step": 136448, "epoch": 1643} {"train_loss": -22.639738082885742, "global_step": 136449, "epoch": 1643} {"train_loss": -22.538944244384766, "global_step": 136450, "epoch": 1643} {"train_loss": -22.84377789784627, "global_step": 136451, "epoch": 1643, "val_loss": 6333276.0} {"train_loss": -22.200712203979492, "global_step": 136452, "epoch": 1644} {"train_loss": -22.334598541259766, "global_step": 136453, "epoch": 1644} {"train_loss": -22.217626571655273, "global_step": 136454, "epoch": 1644} {"train_loss": -22.856761932373047, "global_step": 136455, "epoch": 1644} {"train_loss": -22.174388885498047, "global_step": 136456, "epoch": 1644} {"train_loss": -22.2282657623291, "global_step": 136457, "epoch": 1644} {"train_loss": -22.479618072509766, "global_step": 136458, "epoch": 1644} {"train_loss": -22.3709659576416, "global_step": 136459, "epoch": 1644} {"train_loss": -22.63541030883789, "global_step": 136460, "epoch": 1644} {"train_loss": -22.52182960510254, "global_step": 136461, "epoch": 1644} {"train_loss": -22.309823989868164, "global_step": 136462, "epoch": 1644} {"train_loss": -22.90859031677246, "global_step": 136463, "epoch": 1644} {"train_loss": -22.83403205871582, "global_step": 136464, "epoch": 1644} {"train_loss": -22.49580955505371, "global_step": 136465, "epoch": 1644} {"train_loss": -23.149921417236328, "global_step": 136466, "epoch": 1644} {"train_loss": -22.80251693725586, "global_step": 136467, "epoch": 1644} {"train_loss": -22.717214584350586, "global_step": 136468, "epoch": 1644} {"train_loss": -22.890527725219727, "global_step": 136469, "epoch": 1644} {"train_loss": -22.970855712890625, "global_step": 136470, "epoch": 1644} {"train_loss": -22.64240837097168, "global_step": 136471, "epoch": 1644} {"train_loss": -23.03896141052246, "global_step": 136472, "epoch": 1644} {"train_loss": -22.8933048248291, "global_step": 136473, "epoch": 1644} {"train_loss": -22.843149185180664, "global_step": 136474, "epoch": 1644} {"train_loss": -23.30491065979004, "global_step": 136475, "epoch": 1644} {"train_loss": -22.92072105407715, "global_step": 136476, "epoch": 1644} {"train_loss": -23.008346557617188, "global_step": 136477, "epoch": 1644} {"train_loss": -22.850692749023438, "global_step": 136478, "epoch": 1644} {"train_loss": -22.8638973236084, "global_step": 136479, "epoch": 1644} {"train_loss": -22.717859268188477, "global_step": 136480, "epoch": 1644} {"train_loss": -22.961774826049805, "global_step": 136481, "epoch": 1644} {"train_loss": -22.97928237915039, "global_step": 136482, "epoch": 1644} {"train_loss": -22.792564392089844, "global_step": 136483, "epoch": 1644} {"train_loss": -22.931367874145508, "global_step": 136484, "epoch": 1644} {"train_loss": -22.388126373291016, "global_step": 136485, "epoch": 1644} {"train_loss": -22.45849609375, "global_step": 136486, "epoch": 1644} {"train_loss": -22.941099166870117, "global_step": 136487, "epoch": 1644} {"train_loss": -22.967546463012695, "global_step": 136488, "epoch": 1644} {"train_loss": -22.752534866333008, "global_step": 136489, "epoch": 1644} {"train_loss": -22.85017967224121, "global_step": 136490, "epoch": 1644} {"train_loss": -23.009389877319336, "global_step": 136491, "epoch": 1644} {"train_loss": -22.791231155395508, "global_step": 136492, "epoch": 1644} {"train_loss": -22.503498077392578, "global_step": 136493, "epoch": 1644} {"train_loss": -22.55877113342285, "global_step": 136494, "epoch": 1644} {"train_loss": -22.407245635986328, "global_step": 136495, "epoch": 1644} {"train_loss": -22.79662322998047, "global_step": 136496, "epoch": 1644} {"train_loss": -22.71260643005371, "global_step": 136497, "epoch": 1644} {"train_loss": -22.666269302368164, "global_step": 136498, "epoch": 1644} {"train_loss": -22.91690444946289, "global_step": 136499, "epoch": 1644} {"train_loss": -22.760923385620117, "global_step": 136500, "epoch": 1644} {"train_loss": -22.61197853088379, "global_step": 136501, "epoch": 1644} {"train_loss": -22.880451202392578, "global_step": 136502, "epoch": 1644} {"train_loss": -22.96841812133789, "global_step": 136503, "epoch": 1644} {"train_loss": -22.748559951782227, "global_step": 136504, "epoch": 1644} {"train_loss": -22.809307098388672, "global_step": 136505, "epoch": 1644} {"train_loss": -23.00422477722168, "global_step": 136506, "epoch": 1644} {"train_loss": -23.112476348876953, "global_step": 136507, "epoch": 1644} {"train_loss": -22.988473892211914, "global_step": 136508, "epoch": 1644} {"train_loss": -22.876684188842773, "global_step": 136509, "epoch": 1644} {"train_loss": -23.060483932495117, "global_step": 136510, "epoch": 1644} {"train_loss": -23.462430953979492, "global_step": 136511, "epoch": 1644} {"train_loss": -23.185760498046875, "global_step": 136512, "epoch": 1644} {"train_loss": -23.12324333190918, "global_step": 136513, "epoch": 1644} {"train_loss": -22.925195693969727, "global_step": 136514, "epoch": 1644} {"train_loss": -23.132633209228516, "global_step": 136515, "epoch": 1644} {"train_loss": -23.317731857299805, "global_step": 136516, "epoch": 1644} {"train_loss": -22.849634170532227, "global_step": 136517, "epoch": 1644} {"train_loss": -23.07387351989746, "global_step": 136518, "epoch": 1644} {"train_loss": -23.029773712158203, "global_step": 136519, "epoch": 1644} {"train_loss": -23.03116798400879, "global_step": 136520, "epoch": 1644} {"train_loss": -23.148944854736328, "global_step": 136521, "epoch": 1644} {"train_loss": -22.66083526611328, "global_step": 136522, "epoch": 1644} {"train_loss": -22.8880672454834, "global_step": 136523, "epoch": 1644} {"train_loss": -22.607425689697266, "global_step": 136524, "epoch": 1644} {"train_loss": -23.017337799072266, "global_step": 136525, "epoch": 1644} {"train_loss": -23.090795516967773, "global_step": 136526, "epoch": 1644} {"train_loss": -22.69782829284668, "global_step": 136527, "epoch": 1644} {"train_loss": -22.92523765563965, "global_step": 136528, "epoch": 1644} {"train_loss": -22.866390228271484, "global_step": 136529, "epoch": 1644} {"train_loss": -22.936513900756836, "global_step": 136530, "epoch": 1644} {"train_loss": -23.135969161987305, "global_step": 136531, "epoch": 1644} {"train_loss": -23.34856605529785, "global_step": 136532, "epoch": 1644} {"train_loss": -22.656539916992188, "global_step": 136533, "epoch": 1644} {"train_loss": -22.82905468308782, "global_step": 136534, "epoch": 1644, "val_loss": 6275884.0} {"train_loss": -22.378009796142578, "global_step": 136535, "epoch": 1645} {"train_loss": -22.044647216796875, "global_step": 136536, "epoch": 1645} {"train_loss": -22.12897300720215, "global_step": 136537, "epoch": 1645} {"train_loss": -22.341033935546875, "global_step": 136538, "epoch": 1645} {"train_loss": -22.340700149536133, "global_step": 136539, "epoch": 1645} {"train_loss": -22.507720947265625, "global_step": 136540, "epoch": 1645} {"train_loss": -22.445966720581055, "global_step": 136541, "epoch": 1645} {"train_loss": -22.73869514465332, "global_step": 136542, "epoch": 1645} {"train_loss": -22.455453872680664, "global_step": 136543, "epoch": 1645} {"train_loss": -22.620683670043945, "global_step": 136544, "epoch": 1645} {"train_loss": -22.483007431030273, "global_step": 136545, "epoch": 1645} {"train_loss": -22.551424026489258, "global_step": 136546, "epoch": 1645} {"train_loss": -22.52988624572754, "global_step": 136547, "epoch": 1645} {"train_loss": -22.397552490234375, "global_step": 136548, "epoch": 1645} {"train_loss": -22.867238998413086, "global_step": 136549, "epoch": 1645} {"train_loss": -22.847166061401367, "global_step": 136550, "epoch": 1645} {"train_loss": -22.85611343383789, "global_step": 136551, "epoch": 1645} {"train_loss": -22.45210838317871, "global_step": 136552, "epoch": 1645} {"train_loss": -23.0559024810791, "global_step": 136553, "epoch": 1645} {"train_loss": -23.0224552154541, "global_step": 136554, "epoch": 1645} {"train_loss": -22.85140609741211, "global_step": 136555, "epoch": 1645} {"train_loss": -22.699275970458984, "global_step": 136556, "epoch": 1645} {"train_loss": -22.770889282226562, "global_step": 136557, "epoch": 1645} {"train_loss": -22.81253433227539, "global_step": 136558, "epoch": 1645} {"train_loss": -22.69244956970215, "global_step": 136559, "epoch": 1645} {"train_loss": -22.99867820739746, "global_step": 136560, "epoch": 1645} {"train_loss": -22.9127254486084, "global_step": 136561, "epoch": 1645} {"train_loss": -22.861499786376953, "global_step": 136562, "epoch": 1645} {"train_loss": -22.853843688964844, "global_step": 136563, "epoch": 1645} {"train_loss": -23.061298370361328, "global_step": 136564, "epoch": 1645} {"train_loss": -22.97466468811035, "global_step": 136565, "epoch": 1645} {"train_loss": -22.903526306152344, "global_step": 136566, "epoch": 1645} {"train_loss": -22.709882736206055, "global_step": 136567, "epoch": 1645} {"train_loss": -22.70261573791504, "global_step": 136568, "epoch": 1645} {"train_loss": -23.153406143188477, "global_step": 136569, "epoch": 1645} {"train_loss": -22.746793746948242, "global_step": 136570, "epoch": 1645} {"train_loss": -23.465160369873047, "global_step": 136571, "epoch": 1645} {"train_loss": -23.15970230102539, "global_step": 136572, "epoch": 1645} {"train_loss": -22.530637741088867, "global_step": 136573, "epoch": 1645} {"train_loss": -22.82343101501465, "global_step": 136574, "epoch": 1645} {"train_loss": -23.2488956451416, "global_step": 136575, "epoch": 1645} {"train_loss": -22.813732147216797, "global_step": 136576, "epoch": 1645} {"train_loss": -22.849454879760742, "global_step": 136577, "epoch": 1645} {"train_loss": -22.82627296447754, "global_step": 136578, "epoch": 1645} {"train_loss": -22.968036651611328, "global_step": 136579, "epoch": 1645} {"train_loss": -23.27251625061035, "global_step": 136580, "epoch": 1645} {"train_loss": -22.973012924194336, "global_step": 136581, "epoch": 1645} {"train_loss": -22.568090438842773, "global_step": 136582, "epoch": 1645} {"train_loss": -23.073827743530273, "global_step": 136583, "epoch": 1645} {"train_loss": -22.837766647338867, "global_step": 136584, "epoch": 1645} {"train_loss": -23.040311813354492, "global_step": 136585, "epoch": 1645} {"train_loss": -22.848413467407227, "global_step": 136586, "epoch": 1645} {"train_loss": -22.488279342651367, "global_step": 136587, "epoch": 1645} {"train_loss": -22.952993392944336, "global_step": 136588, "epoch": 1645} {"train_loss": -23.270261764526367, "global_step": 136589, "epoch": 1645} {"train_loss": -22.957242965698242, "global_step": 136590, "epoch": 1645} {"train_loss": -22.701904296875, "global_step": 136591, "epoch": 1645} {"train_loss": -23.368473052978516, "global_step": 136592, "epoch": 1645} {"train_loss": -22.843700408935547, "global_step": 136593, "epoch": 1645} {"train_loss": -23.12346839904785, "global_step": 136594, "epoch": 1645} {"train_loss": -22.978487014770508, "global_step": 136595, "epoch": 1645} {"train_loss": -22.995880126953125, "global_step": 136596, "epoch": 1645} {"train_loss": -22.995203018188477, "global_step": 136597, "epoch": 1645} {"train_loss": -22.96436882019043, "global_step": 136598, "epoch": 1645} {"train_loss": -22.991058349609375, "global_step": 136599, "epoch": 1645} {"train_loss": -22.477079391479492, "global_step": 136600, "epoch": 1645} {"train_loss": -22.651206970214844, "global_step": 136601, "epoch": 1645} {"train_loss": -22.913345336914062, "global_step": 136602, "epoch": 1645} {"train_loss": -22.97114372253418, "global_step": 136603, "epoch": 1645} {"train_loss": -22.793882369995117, "global_step": 136604, "epoch": 1645} {"train_loss": -23.101768493652344, "global_step": 136605, "epoch": 1645} {"train_loss": -22.923095703125, "global_step": 136606, "epoch": 1645} {"train_loss": -23.20953369140625, "global_step": 136607, "epoch": 1645} {"train_loss": -22.806339263916016, "global_step": 136608, "epoch": 1645} {"train_loss": -23.220592498779297, "global_step": 136609, "epoch": 1645} {"train_loss": -22.940410614013672, "global_step": 136610, "epoch": 1645} {"train_loss": -22.823591232299805, "global_step": 136611, "epoch": 1645} {"train_loss": -23.486591339111328, "global_step": 136612, "epoch": 1645} {"train_loss": -23.320133209228516, "global_step": 136613, "epoch": 1645} {"train_loss": -23.022260665893555, "global_step": 136614, "epoch": 1645} {"train_loss": -23.318241119384766, "global_step": 136615, "epoch": 1645} {"train_loss": -23.386449813842773, "global_step": 136616, "epoch": 1645} {"train_loss": -22.87050065649561, "global_step": 136617, "epoch": 1645, "val_loss": 6375602.0} {"train_loss": -22.28830337524414, "global_step": 136618, "epoch": 1646} {"train_loss": -22.060678482055664, "global_step": 136619, "epoch": 1646} {"train_loss": -22.62872886657715, "global_step": 136620, "epoch": 1646} {"train_loss": -22.898048400878906, "global_step": 136621, "epoch": 1646} {"train_loss": -22.390583038330078, "global_step": 136622, "epoch": 1646} {"train_loss": -22.921722412109375, "global_step": 136623, "epoch": 1646} {"train_loss": -22.561609268188477, "global_step": 136624, "epoch": 1646} {"train_loss": -22.590360641479492, "global_step": 136625, "epoch": 1646} {"train_loss": -22.27840232849121, "global_step": 136626, "epoch": 1646} {"train_loss": -22.89339256286621, "global_step": 136627, "epoch": 1646} {"train_loss": -22.531768798828125, "global_step": 136628, "epoch": 1646} {"train_loss": -22.900266647338867, "global_step": 136629, "epoch": 1646} {"train_loss": -22.689374923706055, "global_step": 136630, "epoch": 1646} {"train_loss": -22.738866806030273, "global_step": 136631, "epoch": 1646} {"train_loss": -22.87824821472168, "global_step": 136632, "epoch": 1646} {"train_loss": -22.918500900268555, "global_step": 136633, "epoch": 1646} {"train_loss": -22.992136001586914, "global_step": 136634, "epoch": 1646} {"train_loss": -23.127347946166992, "global_step": 136635, "epoch": 1646} {"train_loss": -22.94599151611328, "global_step": 136636, "epoch": 1646} {"train_loss": -22.996049880981445, "global_step": 136637, "epoch": 1646} {"train_loss": -22.965316772460938, "global_step": 136638, "epoch": 1646} {"train_loss": -23.063535690307617, "global_step": 136639, "epoch": 1646} {"train_loss": -23.000890731811523, "global_step": 136640, "epoch": 1646} {"train_loss": -23.140165328979492, "global_step": 136641, "epoch": 1646} {"train_loss": -22.976749420166016, "global_step": 136642, "epoch": 1646} {"train_loss": -22.826461791992188, "global_step": 136643, "epoch": 1646} {"train_loss": -22.92667579650879, "global_step": 136644, "epoch": 1646} {"train_loss": -23.296175003051758, "global_step": 136645, "epoch": 1646} {"train_loss": -22.765268325805664, "global_step": 136646, "epoch": 1646} {"train_loss": -22.84545135498047, "global_step": 136647, "epoch": 1646} {"train_loss": -22.851713180541992, "global_step": 136648, "epoch": 1646} {"train_loss": -22.64516830444336, "global_step": 136649, "epoch": 1646} {"train_loss": -22.871976852416992, "global_step": 136650, "epoch": 1646} {"train_loss": -22.924232482910156, "global_step": 136651, "epoch": 1646} {"train_loss": -23.21357536315918, "global_step": 136652, "epoch": 1646} {"train_loss": -22.95446014404297, "global_step": 136653, "epoch": 1646} {"train_loss": -22.93363380432129, "global_step": 136654, "epoch": 1646} {"train_loss": -23.167407989501953, "global_step": 136655, "epoch": 1646} {"train_loss": -23.21872329711914, "global_step": 136656, "epoch": 1646} {"train_loss": -23.121749877929688, "global_step": 136657, "epoch": 1646} {"train_loss": -22.688249588012695, "global_step": 136658, "epoch": 1646} {"train_loss": -22.86932945251465, "global_step": 136659, "epoch": 1646} {"train_loss": -23.013198852539062, "global_step": 136660, "epoch": 1646} {"train_loss": -22.910541534423828, "global_step": 136661, "epoch": 1646} {"train_loss": -22.66605567932129, "global_step": 136662, "epoch": 1646} {"train_loss": -23.024673461914062, "global_step": 136663, "epoch": 1646} {"train_loss": -22.84610366821289, "global_step": 136664, "epoch": 1646} {"train_loss": -22.80599021911621, "global_step": 136665, "epoch": 1646} {"train_loss": -23.24790382385254, "global_step": 136666, "epoch": 1646} {"train_loss": -22.85761833190918, "global_step": 136667, "epoch": 1646} {"train_loss": -22.97858238220215, "global_step": 136668, "epoch": 1646} {"train_loss": -23.044187545776367, "global_step": 136669, "epoch": 1646} {"train_loss": -23.262895584106445, "global_step": 136670, "epoch": 1646} {"train_loss": -23.289169311523438, "global_step": 136671, "epoch": 1646} {"train_loss": -22.998762130737305, "global_step": 136672, "epoch": 1646} {"train_loss": -23.27320671081543, "global_step": 136673, "epoch": 1646} {"train_loss": -22.785512924194336, "global_step": 136674, "epoch": 1646} {"train_loss": -23.084518432617188, "global_step": 136675, "epoch": 1646} {"train_loss": -23.280141830444336, "global_step": 136676, "epoch": 1646} {"train_loss": -23.2612247467041, "global_step": 136677, "epoch": 1646} {"train_loss": -23.068769454956055, "global_step": 136678, "epoch": 1646} {"train_loss": -22.878131866455078, "global_step": 136679, "epoch": 1646} {"train_loss": -22.660892486572266, "global_step": 136680, "epoch": 1646} {"train_loss": -23.043806076049805, "global_step": 136681, "epoch": 1646} {"train_loss": -22.937376022338867, "global_step": 136682, "epoch": 1646} {"train_loss": -22.861949920654297, "global_step": 136683, "epoch": 1646} {"train_loss": -22.856918334960938, "global_step": 136684, "epoch": 1646} {"train_loss": -22.77754020690918, "global_step": 136685, "epoch": 1646} {"train_loss": -22.748619079589844, "global_step": 136686, "epoch": 1646} {"train_loss": -22.948898315429688, "global_step": 136687, "epoch": 1646} {"train_loss": -23.349658966064453, "global_step": 136688, "epoch": 1646} {"train_loss": -23.193695068359375, "global_step": 136689, "epoch": 1646} {"train_loss": -22.753026962280273, "global_step": 136690, "epoch": 1646} {"train_loss": -22.912662506103516, "global_step": 136691, "epoch": 1646} {"train_loss": -23.130475997924805, "global_step": 136692, "epoch": 1646} {"train_loss": -22.5284423828125, "global_step": 136693, "epoch": 1646} {"train_loss": -22.825992584228516, "global_step": 136694, "epoch": 1646} {"train_loss": -23.051654815673828, "global_step": 136695, "epoch": 1646} {"train_loss": -22.891748428344727, "global_step": 136696, "epoch": 1646} {"train_loss": -22.615924835205078, "global_step": 136697, "epoch": 1646} {"train_loss": -22.784067153930664, "global_step": 136698, "epoch": 1646} {"train_loss": -23.182254791259766, "global_step": 136699, "epoch": 1646} {"train_loss": -22.91044136415045, "global_step": 136700, "epoch": 1646, "val_loss": 6373851.0} {"train_loss": -22.70296287536621, "global_step": 136701, "epoch": 1647} {"train_loss": -22.94546890258789, "global_step": 136702, "epoch": 1647} {"train_loss": -22.594533920288086, "global_step": 136703, "epoch": 1647} {"train_loss": -22.949329376220703, "global_step": 136704, "epoch": 1647} {"train_loss": -22.618825912475586, "global_step": 136705, "epoch": 1647} {"train_loss": -22.614791870117188, "global_step": 136706, "epoch": 1647} {"train_loss": -23.005781173706055, "global_step": 136707, "epoch": 1647} {"train_loss": -22.735624313354492, "global_step": 136708, "epoch": 1647} {"train_loss": -22.767532348632812, "global_step": 136709, "epoch": 1647} {"train_loss": -22.83576774597168, "global_step": 136710, "epoch": 1647} {"train_loss": -23.153427124023438, "global_step": 136711, "epoch": 1647} {"train_loss": -23.015281677246094, "global_step": 136712, "epoch": 1647} {"train_loss": -22.904541015625, "global_step": 136713, "epoch": 1647} {"train_loss": -22.93898582458496, "global_step": 136714, "epoch": 1647} {"train_loss": -22.827491760253906, "global_step": 136715, "epoch": 1647} {"train_loss": -22.759262084960938, "global_step": 136716, "epoch": 1647} {"train_loss": -23.223121643066406, "global_step": 136717, "epoch": 1647} {"train_loss": -22.930099487304688, "global_step": 136718, "epoch": 1647} {"train_loss": -22.930706024169922, "global_step": 136719, "epoch": 1647} {"train_loss": -22.89481544494629, "global_step": 136720, "epoch": 1647} {"train_loss": -23.013288497924805, "global_step": 136721, "epoch": 1647} {"train_loss": -22.89994239807129, "global_step": 136722, "epoch": 1647} {"train_loss": -23.124967575073242, "global_step": 136723, "epoch": 1647} {"train_loss": -22.707639694213867, "global_step": 136724, "epoch": 1647} {"train_loss": -22.951871871948242, "global_step": 136725, "epoch": 1647} {"train_loss": -22.956235885620117, "global_step": 136726, "epoch": 1647} {"train_loss": -22.897930145263672, "global_step": 136727, "epoch": 1647} {"train_loss": -22.638532638549805, "global_step": 136728, "epoch": 1647} {"train_loss": -22.611995697021484, "global_step": 136729, "epoch": 1647} {"train_loss": -22.744665145874023, "global_step": 136730, "epoch": 1647} {"train_loss": -22.955406188964844, "global_step": 136731, "epoch": 1647} {"train_loss": -23.199390411376953, "global_step": 136732, "epoch": 1647} {"train_loss": -22.985458374023438, "global_step": 136733, "epoch": 1647} {"train_loss": -23.040128707885742, "global_step": 136734, "epoch": 1647} {"train_loss": -23.061201095581055, "global_step": 136735, "epoch": 1647} {"train_loss": -22.695066452026367, "global_step": 136736, "epoch": 1647} {"train_loss": -22.979333877563477, "global_step": 136737, "epoch": 1647} {"train_loss": -22.875268936157227, "global_step": 136738, "epoch": 1647} {"train_loss": -22.953205108642578, "global_step": 136739, "epoch": 1647} {"train_loss": -23.231260299682617, "global_step": 136740, "epoch": 1647} {"train_loss": -22.9735050201416, "global_step": 136741, "epoch": 1647} {"train_loss": -22.868139266967773, "global_step": 136742, "epoch": 1647} {"train_loss": -22.89827537536621, "global_step": 136743, "epoch": 1647} {"train_loss": -23.078275680541992, "global_step": 136744, "epoch": 1647} {"train_loss": -23.128721237182617, "global_step": 136745, "epoch": 1647} {"train_loss": -23.10595703125, "global_step": 136746, "epoch": 1647} {"train_loss": -23.132612228393555, "global_step": 136747, "epoch": 1647} {"train_loss": -22.913494110107422, "global_step": 136748, "epoch": 1647} {"train_loss": -23.278667449951172, "global_step": 136749, "epoch": 1647} {"train_loss": -22.757204055786133, "global_step": 136750, "epoch": 1647} {"train_loss": -23.02939224243164, "global_step": 136751, "epoch": 1647} {"train_loss": -23.157217025756836, "global_step": 136752, "epoch": 1647} {"train_loss": -23.071491241455078, "global_step": 136753, "epoch": 1647} {"train_loss": -22.885662078857422, "global_step": 136754, "epoch": 1647} {"train_loss": -23.454410552978516, "global_step": 136755, "epoch": 1647} {"train_loss": -22.800134658813477, "global_step": 136756, "epoch": 1647} {"train_loss": -23.134504318237305, "global_step": 136757, "epoch": 1647} {"train_loss": -22.935970306396484, "global_step": 136758, "epoch": 1647} {"train_loss": -22.726842880249023, "global_step": 136759, "epoch": 1647} {"train_loss": -23.12164878845215, "global_step": 136760, "epoch": 1647} {"train_loss": -23.17900276184082, "global_step": 136761, "epoch": 1647} {"train_loss": -23.064908981323242, "global_step": 136762, "epoch": 1647} {"train_loss": -22.776456832885742, "global_step": 136763, "epoch": 1647} {"train_loss": -22.90679359436035, "global_step": 136764, "epoch": 1647} {"train_loss": -22.95548439025879, "global_step": 136765, "epoch": 1647} {"train_loss": -22.886449813842773, "global_step": 136766, "epoch": 1647} {"train_loss": -22.79767417907715, "global_step": 136767, "epoch": 1647} {"train_loss": -22.865238189697266, "global_step": 136768, "epoch": 1647} {"train_loss": -23.010892868041992, "global_step": 136769, "epoch": 1647} {"train_loss": -23.019140243530273, "global_step": 136770, "epoch": 1647} {"train_loss": -22.936613082885742, "global_step": 136771, "epoch": 1647} {"train_loss": -23.07130241394043, "global_step": 136772, "epoch": 1647} {"train_loss": -22.82112693786621, "global_step": 136773, "epoch": 1647} {"train_loss": -22.36897850036621, "global_step": 136774, "epoch": 1647} {"train_loss": -22.987150192260742, "global_step": 136775, "epoch": 1647} {"train_loss": -22.815603256225586, "global_step": 136776, "epoch": 1647} {"train_loss": -23.090473175048828, "global_step": 136777, "epoch": 1647} {"train_loss": -22.70563507080078, "global_step": 136778, "epoch": 1647} {"train_loss": -23.449193954467773, "global_step": 136779, "epoch": 1647} {"train_loss": -22.974523544311523, "global_step": 136780, "epoch": 1647} {"train_loss": -23.038314819335938, "global_step": 136781, "epoch": 1647} {"train_loss": -22.873022079467773, "global_step": 136782, "epoch": 1647} {"train_loss": -22.951905744621552, "global_step": 136783, "epoch": 1647, "val_loss": 6193352.0} {"train_loss": -22.88702964782715, "global_step": 136784, "epoch": 1648} {"train_loss": -23.12447738647461, "global_step": 136785, "epoch": 1648} {"train_loss": -22.754776000976562, "global_step": 136786, "epoch": 1648} {"train_loss": -22.77046012878418, "global_step": 136787, "epoch": 1648} {"train_loss": -22.68770408630371, "global_step": 136788, "epoch": 1648} {"train_loss": -22.893882751464844, "global_step": 136789, "epoch": 1648} {"train_loss": -22.847997665405273, "global_step": 136790, "epoch": 1648} {"train_loss": -22.862394332885742, "global_step": 136791, "epoch": 1648} {"train_loss": -22.60335350036621, "global_step": 136792, "epoch": 1648} {"train_loss": -22.946735382080078, "global_step": 136793, "epoch": 1648} {"train_loss": -22.74163246154785, "global_step": 136794, "epoch": 1648} {"train_loss": -22.734420776367188, "global_step": 136795, "epoch": 1648} {"train_loss": -22.55451774597168, "global_step": 136796, "epoch": 1648} {"train_loss": -22.81488609313965, "global_step": 136797, "epoch": 1648} {"train_loss": -22.808582305908203, "global_step": 136798, "epoch": 1648} {"train_loss": -23.013721466064453, "global_step": 136799, "epoch": 1648} {"train_loss": -22.722061157226562, "global_step": 136800, "epoch": 1648} {"train_loss": -22.725555419921875, "global_step": 136801, "epoch": 1648} {"train_loss": -22.74701499938965, "global_step": 136802, "epoch": 1648} {"train_loss": -22.514122009277344, "global_step": 136803, "epoch": 1648} {"train_loss": -22.762008666992188, "global_step": 136804, "epoch": 1648} {"train_loss": -22.714252471923828, "global_step": 136805, "epoch": 1648} {"train_loss": -22.87421989440918, "global_step": 136806, "epoch": 1648} {"train_loss": -23.306100845336914, "global_step": 136807, "epoch": 1648} {"train_loss": -23.288297653198242, "global_step": 136808, "epoch": 1648} {"train_loss": -22.94379425048828, "global_step": 136809, "epoch": 1648} {"train_loss": -22.89801025390625, "global_step": 136810, "epoch": 1648} {"train_loss": -22.977148056030273, "global_step": 136811, "epoch": 1648} {"train_loss": -23.127300262451172, "global_step": 136812, "epoch": 1648} {"train_loss": -23.170347213745117, "global_step": 136813, "epoch": 1648} {"train_loss": -23.0711727142334, "global_step": 136814, "epoch": 1648} {"train_loss": -23.131277084350586, "global_step": 136815, "epoch": 1648} {"train_loss": -22.80189323425293, "global_step": 136816, "epoch": 1648} {"train_loss": -22.821430206298828, "global_step": 136817, "epoch": 1648} {"train_loss": -23.35137367248535, "global_step": 136818, "epoch": 1648} {"train_loss": -22.713687896728516, "global_step": 136819, "epoch": 1648} {"train_loss": -23.033842086791992, "global_step": 136820, "epoch": 1648} {"train_loss": -22.952238082885742, "global_step": 136821, "epoch": 1648} {"train_loss": -22.800918579101562, "global_step": 136822, "epoch": 1648} {"train_loss": -23.013113021850586, "global_step": 136823, "epoch": 1648} {"train_loss": -23.255096435546875, "global_step": 136824, "epoch": 1648} {"train_loss": -22.95378303527832, "global_step": 136825, "epoch": 1648} {"train_loss": -23.133296966552734, "global_step": 136826, "epoch": 1648} {"train_loss": -22.900495529174805, "global_step": 136827, "epoch": 1648} {"train_loss": -23.345935821533203, "global_step": 136828, "epoch": 1648} {"train_loss": -22.924570083618164, "global_step": 136829, "epoch": 1648} {"train_loss": -22.920473098754883, "global_step": 136830, "epoch": 1648} {"train_loss": -23.131595611572266, "global_step": 136831, "epoch": 1648} {"train_loss": -23.35024070739746, "global_step": 136832, "epoch": 1648} {"train_loss": -23.050621032714844, "global_step": 136833, "epoch": 1648} {"train_loss": -22.99380874633789, "global_step": 136834, "epoch": 1648} {"train_loss": -23.1663761138916, "global_step": 136835, "epoch": 1648} {"train_loss": -23.10451316833496, "global_step": 136836, "epoch": 1648} {"train_loss": -23.124862670898438, "global_step": 136837, "epoch": 1648} {"train_loss": -22.93117332458496, "global_step": 136838, "epoch": 1648} {"train_loss": -23.107826232910156, "global_step": 136839, "epoch": 1648} {"train_loss": -22.785661697387695, "global_step": 136840, "epoch": 1648} {"train_loss": -23.18631362915039, "global_step": 136841, "epoch": 1648} {"train_loss": -22.763830184936523, "global_step": 136842, "epoch": 1648} {"train_loss": -23.34905433654785, "global_step": 136843, "epoch": 1648} {"train_loss": -22.896970748901367, "global_step": 136844, "epoch": 1648} {"train_loss": -23.305051803588867, "global_step": 136845, "epoch": 1648} {"train_loss": -22.91485023498535, "global_step": 136846, "epoch": 1648} {"train_loss": -23.187973022460938, "global_step": 136847, "epoch": 1648} {"train_loss": -22.839635848999023, "global_step": 136848, "epoch": 1648} {"train_loss": -23.088361740112305, "global_step": 136849, "epoch": 1648} {"train_loss": -22.817243576049805, "global_step": 136850, "epoch": 1648} {"train_loss": -22.887081146240234, "global_step": 136851, "epoch": 1648} {"train_loss": -23.319883346557617, "global_step": 136852, "epoch": 1648} {"train_loss": -22.773757934570312, "global_step": 136853, "epoch": 1648} {"train_loss": -22.657812118530273, "global_step": 136854, "epoch": 1648} {"train_loss": -22.15144157409668, "global_step": 136855, "epoch": 1648} {"train_loss": -22.3809814453125, "global_step": 136856, "epoch": 1648} {"train_loss": -22.875707626342773, "global_step": 136857, "epoch": 1648} {"train_loss": -22.988704681396484, "global_step": 136858, "epoch": 1648} {"train_loss": -22.994102478027344, "global_step": 136859, "epoch": 1648} {"train_loss": -23.03841781616211, "global_step": 136860, "epoch": 1648} {"train_loss": -23.060453414916992, "global_step": 136861, "epoch": 1648} {"train_loss": -23.22858238220215, "global_step": 136862, "epoch": 1648} {"train_loss": -22.99616050720215, "global_step": 136863, "epoch": 1648} {"train_loss": -22.985183715820312, "global_step": 136864, "epoch": 1648} {"train_loss": -22.703407287597656, "global_step": 136865, "epoch": 1648} {"train_loss": -22.946456886199584, "global_step": 136866, "epoch": 1648, "val_loss": 6287213.0} {"train_loss": -23.069856643676758, "global_step": 136867, "epoch": 1649} {"train_loss": -22.892520904541016, "global_step": 136868, "epoch": 1649} {"train_loss": -22.65731430053711, "global_step": 136869, "epoch": 1649} {"train_loss": -22.492908477783203, "global_step": 136870, "epoch": 1649} {"train_loss": -22.90774917602539, "global_step": 136871, "epoch": 1649} {"train_loss": -22.847532272338867, "global_step": 136872, "epoch": 1649} {"train_loss": -23.026655197143555, "global_step": 136873, "epoch": 1649} {"train_loss": -22.979623794555664, "global_step": 136874, "epoch": 1649} {"train_loss": -22.797225952148438, "global_step": 136875, "epoch": 1649} {"train_loss": -22.980804443359375, "global_step": 136876, "epoch": 1649} {"train_loss": -22.77004051208496, "global_step": 136877, "epoch": 1649} {"train_loss": -22.772855758666992, "global_step": 136878, "epoch": 1649} {"train_loss": -23.27326774597168, "global_step": 136879, "epoch": 1649} {"train_loss": -23.066226959228516, "global_step": 136880, "epoch": 1649} {"train_loss": -22.839946746826172, "global_step": 136881, "epoch": 1649} {"train_loss": -23.316598892211914, "global_step": 136882, "epoch": 1649} {"train_loss": -22.85529327392578, "global_step": 136883, "epoch": 1649} {"train_loss": -22.96303367614746, "global_step": 136884, "epoch": 1649} {"train_loss": -23.03632926940918, "global_step": 136885, "epoch": 1649} {"train_loss": -22.432973861694336, "global_step": 136886, "epoch": 1649} {"train_loss": -22.85077476501465, "global_step": 136887, "epoch": 1649} {"train_loss": -23.230236053466797, "global_step": 136888, "epoch": 1649} {"train_loss": -22.920225143432617, "global_step": 136889, "epoch": 1649} {"train_loss": -22.913694381713867, "global_step": 136890, "epoch": 1649} {"train_loss": -22.715673446655273, "global_step": 136891, "epoch": 1649} {"train_loss": -22.963499069213867, "global_step": 136892, "epoch": 1649} {"train_loss": -23.01907730102539, "global_step": 136893, "epoch": 1649} {"train_loss": -22.96393394470215, "global_step": 136894, "epoch": 1649} {"train_loss": -22.748022079467773, "global_step": 136895, "epoch": 1649} {"train_loss": -22.82301139831543, "global_step": 136896, "epoch": 1649} {"train_loss": -23.223634719848633, "global_step": 136897, "epoch": 1649} {"train_loss": -22.828317642211914, "global_step": 136898, "epoch": 1649} {"train_loss": -23.29561996459961, "global_step": 136899, "epoch": 1649} {"train_loss": -23.226102828979492, "global_step": 136900, "epoch": 1649} {"train_loss": -23.081785202026367, "global_step": 136901, "epoch": 1649} {"train_loss": -23.009658813476562, "global_step": 136902, "epoch": 1649} {"train_loss": -22.890579223632812, "global_step": 136903, "epoch": 1649} {"train_loss": -23.296218872070312, "global_step": 136904, "epoch": 1649} {"train_loss": -23.11476707458496, "global_step": 136905, "epoch": 1649} {"train_loss": -22.8497257232666, "global_step": 136906, "epoch": 1649} {"train_loss": -23.174325942993164, "global_step": 136907, "epoch": 1649} {"train_loss": -23.357149124145508, "global_step": 136908, "epoch": 1649} {"train_loss": -23.168861389160156, "global_step": 136909, "epoch": 1649} {"train_loss": -23.05536460876465, "global_step": 136910, "epoch": 1649} {"train_loss": -23.09230613708496, "global_step": 136911, "epoch": 1649} {"train_loss": -22.88763999938965, "global_step": 136912, "epoch": 1649} {"train_loss": -23.184982299804688, "global_step": 136913, "epoch": 1649} {"train_loss": -23.049959182739258, "global_step": 136914, "epoch": 1649} {"train_loss": -23.147790908813477, "global_step": 136915, "epoch": 1649} {"train_loss": -22.92518424987793, "global_step": 136916, "epoch": 1649} {"train_loss": -22.97041130065918, "global_step": 136917, "epoch": 1649} {"train_loss": -23.233308792114258, "global_step": 136918, "epoch": 1649} {"train_loss": -23.3740291595459, "global_step": 136919, "epoch": 1649} {"train_loss": -23.091188430786133, "global_step": 136920, "epoch": 1649} {"train_loss": -22.84486961364746, "global_step": 136921, "epoch": 1649} {"train_loss": -22.988370895385742, "global_step": 136922, "epoch": 1649} {"train_loss": -23.133563995361328, "global_step": 136923, "epoch": 1649} {"train_loss": -23.085622787475586, "global_step": 136924, "epoch": 1649} {"train_loss": -22.752775192260742, "global_step": 136925, "epoch": 1649} {"train_loss": -23.01690101623535, "global_step": 136926, "epoch": 1649} {"train_loss": -22.81476402282715, "global_step": 136927, "epoch": 1649} {"train_loss": -22.72173500061035, "global_step": 136928, "epoch": 1649} {"train_loss": -22.826749801635742, "global_step": 136929, "epoch": 1649} {"train_loss": -23.19647216796875, "global_step": 136930, "epoch": 1649} {"train_loss": -22.94814109802246, "global_step": 136931, "epoch": 1649} {"train_loss": -23.048954010009766, "global_step": 136932, "epoch": 1649} {"train_loss": -23.205408096313477, "global_step": 136933, "epoch": 1649} {"train_loss": -22.858835220336914, "global_step": 136934, "epoch": 1649} {"train_loss": -23.062673568725586, "global_step": 136935, "epoch": 1649} {"train_loss": -22.854902267456055, "global_step": 136936, "epoch": 1649} {"train_loss": -23.46800994873047, "global_step": 136937, "epoch": 1649} {"train_loss": -22.909345626831055, "global_step": 136938, "epoch": 1649} {"train_loss": -22.899621963500977, "global_step": 136939, "epoch": 1649} {"train_loss": -23.319860458374023, "global_step": 136940, "epoch": 1649} {"train_loss": -23.0589599609375, "global_step": 136941, "epoch": 1649} {"train_loss": -23.22803497314453, "global_step": 136942, "epoch": 1649} {"train_loss": -22.934314727783203, "global_step": 136943, "epoch": 1649} {"train_loss": -23.068754196166992, "global_step": 136944, "epoch": 1649} {"train_loss": -23.265792846679688, "global_step": 136945, "epoch": 1649} {"train_loss": -22.999982833862305, "global_step": 136946, "epoch": 1649} {"train_loss": -22.743330001831055, "global_step": 136947, "epoch": 1649} {"train_loss": -22.906185150146484, "global_step": 136948, "epoch": 1649} {"train_loss": -23.015069846647332, "global_step": 136949, "epoch": 1649, "val_loss": 6438479.0} {"train_loss": -21.714040756225586, "global_step": 136950, "epoch": 1650} {"train_loss": -22.32513999938965, "global_step": 136951, "epoch": 1650} {"train_loss": -22.707551956176758, "global_step": 136952, "epoch": 1650} {"train_loss": -21.751916885375977, "global_step": 136953, "epoch": 1650} {"train_loss": -22.181888580322266, "global_step": 136954, "epoch": 1650} {"train_loss": -22.093488693237305, "global_step": 136955, "epoch": 1650} {"train_loss": -22.8665771484375, "global_step": 136956, "epoch": 1650} {"train_loss": -22.597097396850586, "global_step": 136957, "epoch": 1650} {"train_loss": -22.551809310913086, "global_step": 136958, "epoch": 1650} {"train_loss": -22.32492446899414, "global_step": 136959, "epoch": 1650} {"train_loss": -22.625701904296875, "global_step": 136960, "epoch": 1650} {"train_loss": -22.567289352416992, "global_step": 136961, "epoch": 1650} {"train_loss": -22.222183227539062, "global_step": 136962, "epoch": 1650} {"train_loss": -22.829288482666016, "global_step": 136963, "epoch": 1650} {"train_loss": -22.739805221557617, "global_step": 136964, "epoch": 1650} {"train_loss": -22.56618881225586, "global_step": 136965, "epoch": 1650} {"train_loss": -22.697187423706055, "global_step": 136966, "epoch": 1650} {"train_loss": -22.643936157226562, "global_step": 136967, "epoch": 1650} {"train_loss": -22.521560668945312, "global_step": 136968, "epoch": 1650} {"train_loss": -22.701236724853516, "global_step": 136969, "epoch": 1650} {"train_loss": -22.427494049072266, "global_step": 136970, "epoch": 1650} {"train_loss": -22.83246612548828, "global_step": 136971, "epoch": 1650} {"train_loss": -22.907461166381836, "global_step": 136972, "epoch": 1650} {"train_loss": -22.50812339782715, "global_step": 136973, "epoch": 1650} {"train_loss": -22.829381942749023, "global_step": 136974, "epoch": 1650} {"train_loss": -22.770261764526367, "global_step": 136975, "epoch": 1650} {"train_loss": -22.788043975830078, "global_step": 136976, "epoch": 1650} {"train_loss": -22.967607498168945, "global_step": 136977, "epoch": 1650} {"train_loss": -22.58316421508789, "global_step": 136978, "epoch": 1650} {"train_loss": -22.96778678894043, "global_step": 136979, "epoch": 1650} {"train_loss": -23.21947479248047, "global_step": 136980, "epoch": 1650} {"train_loss": -22.985227584838867, "global_step": 136981, "epoch": 1650} {"train_loss": -23.08330726623535, "global_step": 136982, "epoch": 1650} {"train_loss": -23.173917770385742, "global_step": 136983, "epoch": 1650} {"train_loss": -22.676172256469727, "global_step": 136984, "epoch": 1650} {"train_loss": -22.861135482788086, "global_step": 136985, "epoch": 1650} {"train_loss": -23.2763614654541, "global_step": 136986, "epoch": 1650} {"train_loss": -23.10483741760254, "global_step": 136987, "epoch": 1650} {"train_loss": -23.105817794799805, "global_step": 136988, "epoch": 1650} {"train_loss": -23.285612106323242, "global_step": 136989, "epoch": 1650} {"train_loss": -22.956876754760742, "global_step": 136990, "epoch": 1650} {"train_loss": -22.94983673095703, "global_step": 136991, "epoch": 1650} {"train_loss": -22.837575912475586, "global_step": 136992, "epoch": 1650} {"train_loss": -22.703937530517578, "global_step": 136993, "epoch": 1650} {"train_loss": -22.697126388549805, "global_step": 136994, "epoch": 1650} {"train_loss": -22.679990768432617, "global_step": 136995, "epoch": 1650} {"train_loss": -22.893178939819336, "global_step": 136996, "epoch": 1650} {"train_loss": -22.644880294799805, "global_step": 136997, "epoch": 1650} {"train_loss": -22.774368286132812, "global_step": 136998, "epoch": 1650} {"train_loss": -22.44062614440918, "global_step": 136999, "epoch": 1650} {"train_loss": -23.289886474609375, "global_step": 137000, "epoch": 1650} {"train_loss": -22.772695541381836, "global_step": 137001, "epoch": 1650} {"train_loss": -23.13766860961914, "global_step": 137002, "epoch": 1650} {"train_loss": -22.993803024291992, "global_step": 137003, "epoch": 1650} {"train_loss": -23.12202262878418, "global_step": 137004, "epoch": 1650} {"train_loss": -23.12190055847168, "global_step": 137005, "epoch": 1650} {"train_loss": -23.043668746948242, "global_step": 137006, "epoch": 1650} {"train_loss": -22.91450309753418, "global_step": 137007, "epoch": 1650} {"train_loss": -22.908615112304688, "global_step": 137008, "epoch": 1650} {"train_loss": -22.966272354125977, "global_step": 137009, "epoch": 1650} {"train_loss": -23.104496002197266, "global_step": 137010, "epoch": 1650} {"train_loss": -22.81634521484375, "global_step": 137011, "epoch": 1650} {"train_loss": -23.011404037475586, "global_step": 137012, "epoch": 1650} {"train_loss": -23.217191696166992, "global_step": 137013, "epoch": 1650} {"train_loss": -23.136337280273438, "global_step": 137014, "epoch": 1650} {"train_loss": -22.975711822509766, "global_step": 137015, "epoch": 1650} {"train_loss": -23.056232452392578, "global_step": 137016, "epoch": 1650} {"train_loss": -23.028806686401367, "global_step": 137017, "epoch": 1650} {"train_loss": -22.561126708984375, "global_step": 137018, "epoch": 1650} {"train_loss": -23.308521270751953, "global_step": 137019, "epoch": 1650} {"train_loss": -22.752197265625, "global_step": 137020, "epoch": 1650} {"train_loss": -22.5968074798584, "global_step": 137021, "epoch": 1650} {"train_loss": -23.472089767456055, "global_step": 137022, "epoch": 1650} {"train_loss": -23.098432540893555, "global_step": 137023, "epoch": 1650} {"train_loss": -23.0696964263916, "global_step": 137024, "epoch": 1650} {"train_loss": -22.312707901000977, "global_step": 137025, "epoch": 1650} {"train_loss": -22.346288681030273, "global_step": 137026, "epoch": 1650} {"train_loss": -22.735864639282227, "global_step": 137027, "epoch": 1650} {"train_loss": -22.994699478149414, "global_step": 137028, "epoch": 1650} {"train_loss": -22.986799240112305, "global_step": 137029, "epoch": 1650} {"train_loss": -22.807907104492188, "global_step": 137030, "epoch": 1650} {"train_loss": -22.996944427490234, "global_step": 137031, "epoch": 1650} {"train_loss": -22.812891420111598, "global_step": 137032, "epoch": 1650, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 1.0, "val_loss": 6369778.0} {"train_loss": -22.641469955444336, "global_step": 137033, "epoch": 1651} {"train_loss": -22.17715072631836, "global_step": 137034, "epoch": 1651} {"train_loss": -22.702245712280273, "global_step": 137035, "epoch": 1651} {"train_loss": -22.567508697509766, "global_step": 137036, "epoch": 1651} {"train_loss": -22.393653869628906, "global_step": 137037, "epoch": 1651} {"train_loss": -22.587881088256836, "global_step": 137038, "epoch": 1651} {"train_loss": -22.591140747070312, "global_step": 137039, "epoch": 1651} {"train_loss": -22.807302474975586, "global_step": 137040, "epoch": 1651} {"train_loss": -22.293161392211914, "global_step": 137041, "epoch": 1651} {"train_loss": -22.536733627319336, "global_step": 137042, "epoch": 1651} {"train_loss": -23.004514694213867, "global_step": 137043, "epoch": 1651} {"train_loss": -22.548444747924805, "global_step": 137044, "epoch": 1651} {"train_loss": -22.435718536376953, "global_step": 137045, "epoch": 1651} {"train_loss": -22.692657470703125, "global_step": 137046, "epoch": 1651} {"train_loss": -22.926794052124023, "global_step": 137047, "epoch": 1651} {"train_loss": -22.860740661621094, "global_step": 137048, "epoch": 1651} {"train_loss": -22.742658615112305, "global_step": 137049, "epoch": 1651} {"train_loss": -22.89373207092285, "global_step": 137050, "epoch": 1651} {"train_loss": -22.590984344482422, "global_step": 137051, "epoch": 1651} {"train_loss": -22.744810104370117, "global_step": 137052, "epoch": 1651} {"train_loss": -22.662158966064453, "global_step": 137053, "epoch": 1651} {"train_loss": -22.84752082824707, "global_step": 137054, "epoch": 1651} {"train_loss": -22.82260513305664, "global_step": 137055, "epoch": 1651} {"train_loss": -23.1816463470459, "global_step": 137056, "epoch": 1651} {"train_loss": -22.560302734375, "global_step": 137057, "epoch": 1651} {"train_loss": -22.774017333984375, "global_step": 137058, "epoch": 1651} {"train_loss": -23.051740646362305, "global_step": 137059, "epoch": 1651} {"train_loss": -23.163747787475586, "global_step": 137060, "epoch": 1651} {"train_loss": -22.927227020263672, "global_step": 137061, "epoch": 1651} {"train_loss": -23.392471313476562, "global_step": 137062, "epoch": 1651} {"train_loss": -23.126720428466797, "global_step": 137063, "epoch": 1651} {"train_loss": -22.941762924194336, "global_step": 137064, "epoch": 1651} {"train_loss": -22.770771026611328, "global_step": 137065, "epoch": 1651} {"train_loss": -23.011747360229492, "global_step": 137066, "epoch": 1651} {"train_loss": -23.15869903564453, "global_step": 137067, "epoch": 1651} {"train_loss": -22.971569061279297, "global_step": 137068, "epoch": 1651} {"train_loss": -22.83453941345215, "global_step": 137069, "epoch": 1651} {"train_loss": -22.893056869506836, "global_step": 137070, "epoch": 1651} {"train_loss": -22.973819732666016, "global_step": 137071, "epoch": 1651} {"train_loss": -22.96099281311035, "global_step": 137072, "epoch": 1651} {"train_loss": -23.281784057617188, "global_step": 137073, "epoch": 1651} {"train_loss": -23.127370834350586, "global_step": 137074, "epoch": 1651} {"train_loss": -23.219633102416992, "global_step": 137075, "epoch": 1651} {"train_loss": -22.983896255493164, "global_step": 137076, "epoch": 1651} {"train_loss": -23.529794692993164, "global_step": 137077, "epoch": 1651} {"train_loss": -22.931257247924805, "global_step": 137078, "epoch": 1651} {"train_loss": -23.079788208007812, "global_step": 137079, "epoch": 1651} {"train_loss": -23.141557693481445, "global_step": 137080, "epoch": 1651} {"train_loss": -23.390230178833008, "global_step": 137081, "epoch": 1651} {"train_loss": -22.980335235595703, "global_step": 137082, "epoch": 1651} {"train_loss": -22.85455322265625, "global_step": 137083, "epoch": 1651} {"train_loss": -23.302778244018555, "global_step": 137084, "epoch": 1651} {"train_loss": -23.010807037353516, "global_step": 137085, "epoch": 1651} {"train_loss": -22.97796058654785, "global_step": 137086, "epoch": 1651} {"train_loss": -23.053564071655273, "global_step": 137087, "epoch": 1651} {"train_loss": -23.142078399658203, "global_step": 137088, "epoch": 1651} {"train_loss": -22.730342864990234, "global_step": 137089, "epoch": 1651} {"train_loss": -23.054931640625, "global_step": 137090, "epoch": 1651} {"train_loss": -22.942508697509766, "global_step": 137091, "epoch": 1651} {"train_loss": -22.923616409301758, "global_step": 137092, "epoch": 1651} {"train_loss": -22.587011337280273, "global_step": 137093, "epoch": 1651} {"train_loss": -22.681434631347656, "global_step": 137094, "epoch": 1651} {"train_loss": -23.08681297302246, "global_step": 137095, "epoch": 1651} {"train_loss": -23.020296096801758, "global_step": 137096, "epoch": 1651} {"train_loss": -23.236358642578125, "global_step": 137097, "epoch": 1651} {"train_loss": -23.220014572143555, "global_step": 137098, "epoch": 1651} {"train_loss": -22.719242095947266, "global_step": 137099, "epoch": 1651} {"train_loss": -23.21023178100586, "global_step": 137100, "epoch": 1651} {"train_loss": -23.044599533081055, "global_step": 137101, "epoch": 1651} {"train_loss": -23.09943962097168, "global_step": 137102, "epoch": 1651} {"train_loss": -23.064477920532227, "global_step": 137103, "epoch": 1651} {"train_loss": -23.09620475769043, "global_step": 137104, "epoch": 1651} {"train_loss": -23.33645248413086, "global_step": 137105, "epoch": 1651} {"train_loss": -23.196043014526367, "global_step": 137106, "epoch": 1651} {"train_loss": -23.12970733642578, "global_step": 137107, "epoch": 1651} {"train_loss": -23.04498291015625, "global_step": 137108, "epoch": 1651} {"train_loss": -22.865644454956055, "global_step": 137109, "epoch": 1651} {"train_loss": -22.689870834350586, "global_step": 137110, "epoch": 1651} {"train_loss": -22.623031616210938, "global_step": 137111, "epoch": 1651} {"train_loss": -22.934885025024414, "global_step": 137112, "epoch": 1651} {"train_loss": -22.986835479736328, "global_step": 137113, "epoch": 1651} {"train_loss": -22.94402503967285, "global_step": 137114, "epoch": 1651} {"train_loss": -22.91389430861875, "global_step": 137115, "epoch": 1651, "val_loss": 6385827.0} {"train_loss": -22.91297721862793, "global_step": 137116, "epoch": 1652} {"train_loss": -22.503095626831055, "global_step": 137117, "epoch": 1652} {"train_loss": -22.514461517333984, "global_step": 137118, "epoch": 1652} {"train_loss": -22.883325576782227, "global_step": 137119, "epoch": 1652} {"train_loss": -22.968374252319336, "global_step": 137120, "epoch": 1652} {"train_loss": -22.70177459716797, "global_step": 137121, "epoch": 1652} {"train_loss": -22.911718368530273, "global_step": 137122, "epoch": 1652} {"train_loss": -22.889158248901367, "global_step": 137123, "epoch": 1652} {"train_loss": -22.61783218383789, "global_step": 137124, "epoch": 1652} {"train_loss": -23.034305572509766, "global_step": 137125, "epoch": 1652} {"train_loss": -23.315221786499023, "global_step": 137126, "epoch": 1652} {"train_loss": -22.70992088317871, "global_step": 137127, "epoch": 1652} {"train_loss": -22.609588623046875, "global_step": 137128, "epoch": 1652} {"train_loss": -22.52402687072754, "global_step": 137129, "epoch": 1652} {"train_loss": -22.717599868774414, "global_step": 137130, "epoch": 1652} {"train_loss": -23.12892723083496, "global_step": 137131, "epoch": 1652} {"train_loss": -22.915054321289062, "global_step": 137132, "epoch": 1652} {"train_loss": -22.82900047302246, "global_step": 137133, "epoch": 1652} {"train_loss": -23.234922409057617, "global_step": 137134, "epoch": 1652} {"train_loss": -23.109174728393555, "global_step": 137135, "epoch": 1652} {"train_loss": -23.089797973632812, "global_step": 137136, "epoch": 1652} {"train_loss": -23.07706642150879, "global_step": 137137, "epoch": 1652} {"train_loss": -22.869041442871094, "global_step": 137138, "epoch": 1652} {"train_loss": -23.248512268066406, "global_step": 137139, "epoch": 1652} {"train_loss": -22.86643409729004, "global_step": 137140, "epoch": 1652} {"train_loss": -23.12312126159668, "global_step": 137141, "epoch": 1652} {"train_loss": -22.967750549316406, "global_step": 137142, "epoch": 1652} {"train_loss": -22.98550033569336, "global_step": 137143, "epoch": 1652} {"train_loss": -23.261926651000977, "global_step": 137144, "epoch": 1652} {"train_loss": -22.875988006591797, "global_step": 137145, "epoch": 1652} {"train_loss": -23.393917083740234, "global_step": 137146, "epoch": 1652} {"train_loss": -22.727434158325195, "global_step": 137147, "epoch": 1652} {"train_loss": -22.683958053588867, "global_step": 137148, "epoch": 1652} {"train_loss": -23.088193893432617, "global_step": 137149, "epoch": 1652} {"train_loss": -23.062219619750977, "global_step": 137150, "epoch": 1652} {"train_loss": -23.105337142944336, "global_step": 137151, "epoch": 1652} {"train_loss": -22.845808029174805, "global_step": 137152, "epoch": 1652} {"train_loss": -22.720640182495117, "global_step": 137153, "epoch": 1652} {"train_loss": -22.90997886657715, "global_step": 137154, "epoch": 1652} {"train_loss": -22.96142578125, "global_step": 137155, "epoch": 1652} {"train_loss": -22.79690170288086, "global_step": 137156, "epoch": 1652} {"train_loss": -23.129568099975586, "global_step": 137157, "epoch": 1652} {"train_loss": -23.19783592224121, "global_step": 137158, "epoch": 1652} {"train_loss": -23.016956329345703, "global_step": 137159, "epoch": 1652} {"train_loss": -22.96626091003418, "global_step": 137160, "epoch": 1652} {"train_loss": -23.273468017578125, "global_step": 137161, "epoch": 1652} {"train_loss": -23.011938095092773, "global_step": 137162, "epoch": 1652} {"train_loss": -22.882444381713867, "global_step": 137163, "epoch": 1652} {"train_loss": -23.03676414489746, "global_step": 137164, "epoch": 1652} {"train_loss": -23.06952476501465, "global_step": 137165, "epoch": 1652} {"train_loss": -22.963851928710938, "global_step": 137166, "epoch": 1652} {"train_loss": -23.062305450439453, "global_step": 137167, "epoch": 1652} {"train_loss": -23.031604766845703, "global_step": 137168, "epoch": 1652} {"train_loss": -23.141447067260742, "global_step": 137169, "epoch": 1652} {"train_loss": -23.386327743530273, "global_step": 137170, "epoch": 1652} {"train_loss": -22.778852462768555, "global_step": 137171, "epoch": 1652} {"train_loss": -23.07444190979004, "global_step": 137172, "epoch": 1652} {"train_loss": -23.18080711364746, "global_step": 137173, "epoch": 1652} {"train_loss": -23.09559440612793, "global_step": 137174, "epoch": 1652} {"train_loss": -22.8109188079834, "global_step": 137175, "epoch": 1652} {"train_loss": -23.02072525024414, "global_step": 137176, "epoch": 1652} {"train_loss": -22.766530990600586, "global_step": 137177, "epoch": 1652} {"train_loss": -22.65176773071289, "global_step": 137178, "epoch": 1652} {"train_loss": -22.81634521484375, "global_step": 137179, "epoch": 1652} {"train_loss": -23.259389877319336, "global_step": 137180, "epoch": 1652} {"train_loss": -23.30524253845215, "global_step": 137181, "epoch": 1652} {"train_loss": -22.996545791625977, "global_step": 137182, "epoch": 1652} {"train_loss": -23.12723731994629, "global_step": 137183, "epoch": 1652} {"train_loss": -23.337133407592773, "global_step": 137184, "epoch": 1652} {"train_loss": -23.059986114501953, "global_step": 137185, "epoch": 1652} {"train_loss": -23.241724014282227, "global_step": 137186, "epoch": 1652} {"train_loss": -23.547277450561523, "global_step": 137187, "epoch": 1652} {"train_loss": -22.796092987060547, "global_step": 137188, "epoch": 1652} {"train_loss": -23.000751495361328, "global_step": 137189, "epoch": 1652} {"train_loss": -23.00015640258789, "global_step": 137190, "epoch": 1652} {"train_loss": -23.004135131835938, "global_step": 137191, "epoch": 1652} {"train_loss": -23.051782608032227, "global_step": 137192, "epoch": 1652} {"train_loss": -23.382715225219727, "global_step": 137193, "epoch": 1652} {"train_loss": -22.95927619934082, "global_step": 137194, "epoch": 1652} {"train_loss": -22.543371200561523, "global_step": 137195, "epoch": 1652} {"train_loss": -23.044403076171875, "global_step": 137196, "epoch": 1652} {"train_loss": -22.9849853515625, "global_step": 137197, "epoch": 1652} {"train_loss": -22.99071164878018, "global_step": 137198, "epoch": 1652, "val_loss": 6324615.5} {"train_loss": -22.26142120361328, "global_step": 137199, "epoch": 1653} {"train_loss": -21.864086151123047, "global_step": 137200, "epoch": 1653} {"train_loss": -22.667856216430664, "global_step": 137201, "epoch": 1653} {"train_loss": -22.50984764099121, "global_step": 137202, "epoch": 1653} {"train_loss": -22.010221481323242, "global_step": 137203, "epoch": 1653} {"train_loss": -22.79587173461914, "global_step": 137204, "epoch": 1653} {"train_loss": -22.264638900756836, "global_step": 137205, "epoch": 1653} {"train_loss": -22.43649673461914, "global_step": 137206, "epoch": 1653} {"train_loss": -22.509929656982422, "global_step": 137207, "epoch": 1653} {"train_loss": -22.485870361328125, "global_step": 137208, "epoch": 1653} {"train_loss": -22.611745834350586, "global_step": 137209, "epoch": 1653} {"train_loss": -22.72513771057129, "global_step": 137210, "epoch": 1653} {"train_loss": -22.49591064453125, "global_step": 137211, "epoch": 1653} {"train_loss": -22.41474723815918, "global_step": 137212, "epoch": 1653} {"train_loss": -22.127920150756836, "global_step": 137213, "epoch": 1653} {"train_loss": -22.477712631225586, "global_step": 137214, "epoch": 1653} {"train_loss": -22.719867706298828, "global_step": 137215, "epoch": 1653} {"train_loss": -22.744836807250977, "global_step": 137216, "epoch": 1653} {"train_loss": -22.59429931640625, "global_step": 137217, "epoch": 1653} {"train_loss": -22.92039680480957, "global_step": 137218, "epoch": 1653} {"train_loss": -23.004810333251953, "global_step": 137219, "epoch": 1653} {"train_loss": -23.2004337310791, "global_step": 137220, "epoch": 1653} {"train_loss": -22.87409019470215, "global_step": 137221, "epoch": 1653} {"train_loss": -22.914886474609375, "global_step": 137222, "epoch": 1653} {"train_loss": -22.967519760131836, "global_step": 137223, "epoch": 1653} {"train_loss": -22.594263076782227, "global_step": 137224, "epoch": 1653} {"train_loss": -23.010986328125, "global_step": 137225, "epoch": 1653} {"train_loss": -23.001501083374023, "global_step": 137226, "epoch": 1653} {"train_loss": -22.97556495666504, "global_step": 137227, "epoch": 1653} {"train_loss": -22.917394638061523, "global_step": 137228, "epoch": 1653} {"train_loss": -22.570547103881836, "global_step": 137229, "epoch": 1653} {"train_loss": -22.605302810668945, "global_step": 137230, "epoch": 1653} {"train_loss": -22.922286987304688, "global_step": 137231, "epoch": 1653} {"train_loss": -22.766393661499023, "global_step": 137232, "epoch": 1653} {"train_loss": -22.82747459411621, "global_step": 137233, "epoch": 1653} {"train_loss": -23.0828800201416, "global_step": 137234, "epoch": 1653} {"train_loss": -22.99173927307129, "global_step": 137235, "epoch": 1653} {"train_loss": -22.596271514892578, "global_step": 137236, "epoch": 1653} {"train_loss": -22.24784278869629, "global_step": 137237, "epoch": 1653} {"train_loss": -22.874847412109375, "global_step": 137238, "epoch": 1653} {"train_loss": -22.774442672729492, "global_step": 137239, "epoch": 1653} {"train_loss": -22.532320022583008, "global_step": 137240, "epoch": 1653} {"train_loss": -22.862964630126953, "global_step": 137241, "epoch": 1653} {"train_loss": -22.554073333740234, "global_step": 137242, "epoch": 1653} {"train_loss": -22.661977767944336, "global_step": 137243, "epoch": 1653} {"train_loss": -22.819122314453125, "global_step": 137244, "epoch": 1653} {"train_loss": -22.65215492248535, "global_step": 137245, "epoch": 1653} {"train_loss": -22.810625076293945, "global_step": 137246, "epoch": 1653} {"train_loss": -22.736204147338867, "global_step": 137247, "epoch": 1653} {"train_loss": -22.597936630249023, "global_step": 137248, "epoch": 1653} {"train_loss": -22.874378204345703, "global_step": 137249, "epoch": 1653} {"train_loss": -23.05815887451172, "global_step": 137250, "epoch": 1653} {"train_loss": -22.96075439453125, "global_step": 137251, "epoch": 1653} {"train_loss": -23.06315803527832, "global_step": 137252, "epoch": 1653} {"train_loss": -23.034406661987305, "global_step": 137253, "epoch": 1653} {"train_loss": -22.948015213012695, "global_step": 137254, "epoch": 1653} {"train_loss": -23.090879440307617, "global_step": 137255, "epoch": 1653} {"train_loss": -23.154199600219727, "global_step": 137256, "epoch": 1653} {"train_loss": -22.90717887878418, "global_step": 137257, "epoch": 1653} {"train_loss": -22.984004974365234, "global_step": 137258, "epoch": 1653} {"train_loss": -22.749170303344727, "global_step": 137259, "epoch": 1653} {"train_loss": -23.164560317993164, "global_step": 137260, "epoch": 1653} {"train_loss": -22.886280059814453, "global_step": 137261, "epoch": 1653} {"train_loss": -23.018571853637695, "global_step": 137262, "epoch": 1653} {"train_loss": -23.208078384399414, "global_step": 137263, "epoch": 1653} {"train_loss": -23.02702522277832, "global_step": 137264, "epoch": 1653} {"train_loss": -22.90775489807129, "global_step": 137265, "epoch": 1653} {"train_loss": -23.115121841430664, "global_step": 137266, "epoch": 1653} {"train_loss": -22.954050064086914, "global_step": 137267, "epoch": 1653} {"train_loss": -22.885591506958008, "global_step": 137268, "epoch": 1653} {"train_loss": -23.141128540039062, "global_step": 137269, "epoch": 1653} {"train_loss": -23.17313575744629, "global_step": 137270, "epoch": 1653} {"train_loss": -23.419578552246094, "global_step": 137271, "epoch": 1653} {"train_loss": -23.116867065429688, "global_step": 137272, "epoch": 1653} {"train_loss": -22.97205924987793, "global_step": 137273, "epoch": 1653} {"train_loss": -22.90637969970703, "global_step": 137274, "epoch": 1653} {"train_loss": -22.92929458618164, "global_step": 137275, "epoch": 1653} {"train_loss": -22.70614242553711, "global_step": 137276, "epoch": 1653} {"train_loss": -22.819761276245117, "global_step": 137277, "epoch": 1653} {"train_loss": -23.15129852294922, "global_step": 137278, "epoch": 1653} {"train_loss": -23.134241104125977, "global_step": 137279, "epoch": 1653} {"train_loss": -23.232080459594727, "global_step": 137280, "epoch": 1653} {"train_loss": -22.802630022347692, "global_step": 137281, "epoch": 1653, "val_loss": 6262946.5} {"train_loss": -22.505970001220703, "global_step": 137282, "epoch": 1654} {"train_loss": -22.27045249938965, "global_step": 137283, "epoch": 1654} {"train_loss": -22.81924057006836, "global_step": 137284, "epoch": 1654} {"train_loss": -22.707971572875977, "global_step": 137285, "epoch": 1654} {"train_loss": -22.411035537719727, "global_step": 137286, "epoch": 1654} {"train_loss": -22.633089065551758, "global_step": 137287, "epoch": 1654} {"train_loss": -22.946630477905273, "global_step": 137288, "epoch": 1654} {"train_loss": -22.5336971282959, "global_step": 137289, "epoch": 1654} {"train_loss": -22.835254669189453, "global_step": 137290, "epoch": 1654} {"train_loss": -22.69239044189453, "global_step": 137291, "epoch": 1654} {"train_loss": -22.233261108398438, "global_step": 137292, "epoch": 1654} {"train_loss": -22.73078727722168, "global_step": 137293, "epoch": 1654} {"train_loss": -22.71522331237793, "global_step": 137294, "epoch": 1654} {"train_loss": -22.76346778869629, "global_step": 137295, "epoch": 1654} {"train_loss": -22.545024871826172, "global_step": 137296, "epoch": 1654} {"train_loss": -22.99128532409668, "global_step": 137297, "epoch": 1654} {"train_loss": -22.758649826049805, "global_step": 137298, "epoch": 1654} {"train_loss": -23.088165283203125, "global_step": 137299, "epoch": 1654} {"train_loss": -22.92499351501465, "global_step": 137300, "epoch": 1654} {"train_loss": -22.88194465637207, "global_step": 137301, "epoch": 1654} {"train_loss": -22.78920555114746, "global_step": 137302, "epoch": 1654} {"train_loss": -22.983884811401367, "global_step": 137303, "epoch": 1654} {"train_loss": -22.659086227416992, "global_step": 137304, "epoch": 1654} {"train_loss": -22.752187728881836, "global_step": 137305, "epoch": 1654} {"train_loss": -22.831144332885742, "global_step": 137306, "epoch": 1654} {"train_loss": -22.786197662353516, "global_step": 137307, "epoch": 1654} {"train_loss": -22.78394889831543, "global_step": 137308, "epoch": 1654} {"train_loss": -22.88240623474121, "global_step": 137309, "epoch": 1654} {"train_loss": -22.618364334106445, "global_step": 137310, "epoch": 1654} {"train_loss": -22.801877975463867, "global_step": 137311, "epoch": 1654} {"train_loss": -22.91065788269043, "global_step": 137312, "epoch": 1654} {"train_loss": -23.304880142211914, "global_step": 137313, "epoch": 1654} {"train_loss": -23.18100929260254, "global_step": 137314, "epoch": 1654} {"train_loss": -22.974353790283203, "global_step": 137315, "epoch": 1654} {"train_loss": -23.18429946899414, "global_step": 137316, "epoch": 1654} {"train_loss": -23.122928619384766, "global_step": 137317, "epoch": 1654} {"train_loss": -22.876373291015625, "global_step": 137318, "epoch": 1654} {"train_loss": -22.91060447692871, "global_step": 137319, "epoch": 1654} {"train_loss": -23.174209594726562, "global_step": 137320, "epoch": 1654} {"train_loss": -22.445119857788086, "global_step": 137321, "epoch": 1654} {"train_loss": -23.391983032226562, "global_step": 137322, "epoch": 1654} {"train_loss": -22.98348617553711, "global_step": 137323, "epoch": 1654} {"train_loss": -23.468097686767578, "global_step": 137324, "epoch": 1654} {"train_loss": -23.145925521850586, "global_step": 137325, "epoch": 1654} {"train_loss": -23.240346908569336, "global_step": 137326, "epoch": 1654} {"train_loss": -23.059274673461914, "global_step": 137327, "epoch": 1654} {"train_loss": -23.19485855102539, "global_step": 137328, "epoch": 1654} {"train_loss": -22.56871795654297, "global_step": 137329, "epoch": 1654} {"train_loss": -23.27511978149414, "global_step": 137330, "epoch": 1654} {"train_loss": -23.244922637939453, "global_step": 137331, "epoch": 1654} {"train_loss": -23.117895126342773, "global_step": 137332, "epoch": 1654} {"train_loss": -23.116666793823242, "global_step": 137333, "epoch": 1654} {"train_loss": -23.19179344177246, "global_step": 137334, "epoch": 1654} {"train_loss": -22.996097564697266, "global_step": 137335, "epoch": 1654} {"train_loss": -22.956754684448242, "global_step": 137336, "epoch": 1654} {"train_loss": -23.582944869995117, "global_step": 137337, "epoch": 1654} {"train_loss": -22.929855346679688, "global_step": 137338, "epoch": 1654} {"train_loss": -23.004928588867188, "global_step": 137339, "epoch": 1654} {"train_loss": -22.857847213745117, "global_step": 137340, "epoch": 1654} {"train_loss": -22.873403549194336, "global_step": 137341, "epoch": 1654} {"train_loss": -22.90888786315918, "global_step": 137342, "epoch": 1654} {"train_loss": -22.744291305541992, "global_step": 137343, "epoch": 1654} {"train_loss": -23.063899993896484, "global_step": 137344, "epoch": 1654} {"train_loss": -23.207805633544922, "global_step": 137345, "epoch": 1654} {"train_loss": -22.840499877929688, "global_step": 137346, "epoch": 1654} {"train_loss": -22.976465225219727, "global_step": 137347, "epoch": 1654} {"train_loss": -22.916593551635742, "global_step": 137348, "epoch": 1654} {"train_loss": -22.9556827545166, "global_step": 137349, "epoch": 1654} {"train_loss": -23.071142196655273, "global_step": 137350, "epoch": 1654} {"train_loss": -23.135324478149414, "global_step": 137351, "epoch": 1654} {"train_loss": -22.739625930786133, "global_step": 137352, "epoch": 1654} {"train_loss": -23.470523834228516, "global_step": 137353, "epoch": 1654} {"train_loss": -23.125452041625977, "global_step": 137354, "epoch": 1654} {"train_loss": -22.95967674255371, "global_step": 137355, "epoch": 1654} {"train_loss": -23.1190185546875, "global_step": 137356, "epoch": 1654} {"train_loss": -23.295488357543945, "global_step": 137357, "epoch": 1654} {"train_loss": -22.96742820739746, "global_step": 137358, "epoch": 1654} {"train_loss": -23.574914932250977, "global_step": 137359, "epoch": 1654} {"train_loss": -22.624103546142578, "global_step": 137360, "epoch": 1654} {"train_loss": -22.991424560546875, "global_step": 137361, "epoch": 1654} {"train_loss": -22.764404296875, "global_step": 137362, "epoch": 1654} {"train_loss": -23.11322593688965, "global_step": 137363, "epoch": 1654} {"train_loss": -22.934023845626648, "global_step": 137364, "epoch": 1654, "val_loss": 6258276.0} {"train_loss": -22.619688034057617, "global_step": 137365, "epoch": 1655} {"train_loss": -23.07714080810547, "global_step": 137366, "epoch": 1655} {"train_loss": -22.602386474609375, "global_step": 137367, "epoch": 1655} {"train_loss": -22.397445678710938, "global_step": 137368, "epoch": 1655} {"train_loss": -22.524059295654297, "global_step": 137369, "epoch": 1655} {"train_loss": -22.22796630859375, "global_step": 137370, "epoch": 1655} {"train_loss": -22.713293075561523, "global_step": 137371, "epoch": 1655} {"train_loss": -22.704099655151367, "global_step": 137372, "epoch": 1655} {"train_loss": -22.64960289001465, "global_step": 137373, "epoch": 1655} {"train_loss": -22.62640953063965, "global_step": 137374, "epoch": 1655} {"train_loss": -22.7733211517334, "global_step": 137375, "epoch": 1655} {"train_loss": -22.725379943847656, "global_step": 137376, "epoch": 1655} {"train_loss": -23.17371940612793, "global_step": 137377, "epoch": 1655} {"train_loss": -22.796422958374023, "global_step": 137378, "epoch": 1655} {"train_loss": -22.7139892578125, "global_step": 137379, "epoch": 1655} {"train_loss": -22.974246978759766, "global_step": 137380, "epoch": 1655} {"train_loss": -23.069293975830078, "global_step": 137381, "epoch": 1655} {"train_loss": -23.10407257080078, "global_step": 137382, "epoch": 1655} {"train_loss": -22.779521942138672, "global_step": 137383, "epoch": 1655} {"train_loss": -22.551315307617188, "global_step": 137384, "epoch": 1655} {"train_loss": -22.81837272644043, "global_step": 137385, "epoch": 1655} {"train_loss": -23.13309669494629, "global_step": 137386, "epoch": 1655} {"train_loss": -22.658430099487305, "global_step": 137387, "epoch": 1655} {"train_loss": -22.989110946655273, "global_step": 137388, "epoch": 1655} {"train_loss": -23.224960327148438, "global_step": 137389, "epoch": 1655} {"train_loss": -23.13758659362793, "global_step": 137390, "epoch": 1655} {"train_loss": -22.808828353881836, "global_step": 137391, "epoch": 1655} {"train_loss": -22.912343978881836, "global_step": 137392, "epoch": 1655} {"train_loss": -23.130701065063477, "global_step": 137393, "epoch": 1655} {"train_loss": -23.06635284423828, "global_step": 137394, "epoch": 1655} {"train_loss": -22.779417037963867, "global_step": 137395, "epoch": 1655} {"train_loss": -23.224218368530273, "global_step": 137396, "epoch": 1655} {"train_loss": -22.77655601501465, "global_step": 137397, "epoch": 1655} {"train_loss": -23.29023551940918, "global_step": 137398, "epoch": 1655} {"train_loss": -22.605533599853516, "global_step": 137399, "epoch": 1655} {"train_loss": -22.91827964782715, "global_step": 137400, "epoch": 1655} {"train_loss": -23.00894546508789, "global_step": 137401, "epoch": 1655} {"train_loss": -23.235061645507812, "global_step": 137402, "epoch": 1655} {"train_loss": -23.15506935119629, "global_step": 137403, "epoch": 1655} {"train_loss": -22.576520919799805, "global_step": 137404, "epoch": 1655} {"train_loss": -22.99855613708496, "global_step": 137405, "epoch": 1655} {"train_loss": -22.8604736328125, "global_step": 137406, "epoch": 1655} {"train_loss": -23.201065063476562, "global_step": 137407, "epoch": 1655} {"train_loss": -23.08658218383789, "global_step": 137408, "epoch": 1655} {"train_loss": -22.912250518798828, "global_step": 137409, "epoch": 1655} {"train_loss": -22.717737197875977, "global_step": 137410, "epoch": 1655} {"train_loss": -23.39874267578125, "global_step": 137411, "epoch": 1655} {"train_loss": -23.243289947509766, "global_step": 137412, "epoch": 1655} {"train_loss": -22.900156021118164, "global_step": 137413, "epoch": 1655} {"train_loss": -22.706125259399414, "global_step": 137414, "epoch": 1655} {"train_loss": -22.743148803710938, "global_step": 137415, "epoch": 1655} {"train_loss": -22.64912223815918, "global_step": 137416, "epoch": 1655} {"train_loss": -22.810880661010742, "global_step": 137417, "epoch": 1655} {"train_loss": -22.365781784057617, "global_step": 137418, "epoch": 1655} {"train_loss": -23.15437126159668, "global_step": 137419, "epoch": 1655} {"train_loss": -22.650793075561523, "global_step": 137420, "epoch": 1655} {"train_loss": -22.811695098876953, "global_step": 137421, "epoch": 1655} {"train_loss": -22.547378540039062, "global_step": 137422, "epoch": 1655} {"train_loss": -22.99317741394043, "global_step": 137423, "epoch": 1655} {"train_loss": -22.861204147338867, "global_step": 137424, "epoch": 1655} {"train_loss": -22.715417861938477, "global_step": 137425, "epoch": 1655} {"train_loss": -23.23287010192871, "global_step": 137426, "epoch": 1655} {"train_loss": -22.874292373657227, "global_step": 137427, "epoch": 1655} {"train_loss": -22.7441349029541, "global_step": 137428, "epoch": 1655} {"train_loss": -22.784433364868164, "global_step": 137429, "epoch": 1655} {"train_loss": -22.718969345092773, "global_step": 137430, "epoch": 1655} {"train_loss": -23.212574005126953, "global_step": 137431, "epoch": 1655} {"train_loss": -22.87261390686035, "global_step": 137432, "epoch": 1655} {"train_loss": -22.914175033569336, "global_step": 137433, "epoch": 1655} {"train_loss": -22.720989227294922, "global_step": 137434, "epoch": 1655} {"train_loss": -22.79891586303711, "global_step": 137435, "epoch": 1655} {"train_loss": -22.80390167236328, "global_step": 137436, "epoch": 1655} {"train_loss": -22.8063907623291, "global_step": 137437, "epoch": 1655} {"train_loss": -22.88034439086914, "global_step": 137438, "epoch": 1655} {"train_loss": -22.82684898376465, "global_step": 137439, "epoch": 1655} {"train_loss": -22.746917724609375, "global_step": 137440, "epoch": 1655} {"train_loss": -23.248830795288086, "global_step": 137441, "epoch": 1655} {"train_loss": -23.07190704345703, "global_step": 137442, "epoch": 1655} {"train_loss": -22.88559341430664, "global_step": 137443, "epoch": 1655} {"train_loss": -23.133255004882812, "global_step": 137444, "epoch": 1655} {"train_loss": -22.93160629272461, "global_step": 137445, "epoch": 1655} {"train_loss": -22.72609519958496, "global_step": 137446, "epoch": 1655} {"train_loss": -22.872392309717384, "global_step": 137447, "epoch": 1655, "val_loss": 6204264.5} {"train_loss": -23.241113662719727, "global_step": 137448, "epoch": 1656} {"train_loss": -22.643478393554688, "global_step": 137449, "epoch": 1656} {"train_loss": -22.789987564086914, "global_step": 137450, "epoch": 1656} {"train_loss": -22.613183975219727, "global_step": 137451, "epoch": 1656} {"train_loss": -22.86075210571289, "global_step": 137452, "epoch": 1656} {"train_loss": -22.608510971069336, "global_step": 137453, "epoch": 1656} {"train_loss": -23.016857147216797, "global_step": 137454, "epoch": 1656} {"train_loss": -22.97612953186035, "global_step": 137455, "epoch": 1656} {"train_loss": -22.81939697265625, "global_step": 137456, "epoch": 1656} {"train_loss": -22.85053062438965, "global_step": 137457, "epoch": 1656} {"train_loss": -22.15993309020996, "global_step": 137458, "epoch": 1656} {"train_loss": -22.758865356445312, "global_step": 137459, "epoch": 1656} {"train_loss": -22.60972023010254, "global_step": 137460, "epoch": 1656} {"train_loss": -22.637998580932617, "global_step": 137461, "epoch": 1656} {"train_loss": -22.894208908081055, "global_step": 137462, "epoch": 1656} {"train_loss": -22.978271484375, "global_step": 137463, "epoch": 1656} {"train_loss": -23.309720993041992, "global_step": 137464, "epoch": 1656} {"train_loss": -22.423622131347656, "global_step": 137465, "epoch": 1656} {"train_loss": -22.664676666259766, "global_step": 137466, "epoch": 1656} {"train_loss": -23.243576049804688, "global_step": 137467, "epoch": 1656} {"train_loss": -22.87003517150879, "global_step": 137468, "epoch": 1656} {"train_loss": -22.948623657226562, "global_step": 137469, "epoch": 1656} {"train_loss": -22.782155990600586, "global_step": 137470, "epoch": 1656} {"train_loss": -22.985313415527344, "global_step": 137471, "epoch": 1656} {"train_loss": -22.856237411499023, "global_step": 137472, "epoch": 1656} {"train_loss": -23.07661247253418, "global_step": 137473, "epoch": 1656} {"train_loss": -22.635663986206055, "global_step": 137474, "epoch": 1656} {"train_loss": -23.202512741088867, "global_step": 137475, "epoch": 1656} {"train_loss": -23.07924461364746, "global_step": 137476, "epoch": 1656} {"train_loss": -22.950254440307617, "global_step": 137477, "epoch": 1656} {"train_loss": -22.919158935546875, "global_step": 137478, "epoch": 1656} {"train_loss": -23.136938095092773, "global_step": 137479, "epoch": 1656} {"train_loss": -23.26063346862793, "global_step": 137480, "epoch": 1656} {"train_loss": -23.067731857299805, "global_step": 137481, "epoch": 1656} {"train_loss": -22.924406051635742, "global_step": 137482, "epoch": 1656} {"train_loss": -22.74248695373535, "global_step": 137483, "epoch": 1656} {"train_loss": -22.878393173217773, "global_step": 137484, "epoch": 1656} {"train_loss": -23.196393966674805, "global_step": 137485, "epoch": 1656} {"train_loss": -23.252023696899414, "global_step": 137486, "epoch": 1656} {"train_loss": -22.92914581298828, "global_step": 137487, "epoch": 1656} {"train_loss": -22.994115829467773, "global_step": 137488, "epoch": 1656} {"train_loss": -23.120121002197266, "global_step": 137489, "epoch": 1656} {"train_loss": -23.148235321044922, "global_step": 137490, "epoch": 1656} {"train_loss": -22.803224563598633, "global_step": 137491, "epoch": 1656} {"train_loss": -22.862890243530273, "global_step": 137492, "epoch": 1656} {"train_loss": -22.701400756835938, "global_step": 137493, "epoch": 1656} {"train_loss": -23.006711959838867, "global_step": 137494, "epoch": 1656} {"train_loss": -22.760862350463867, "global_step": 137495, "epoch": 1656} {"train_loss": -23.223363876342773, "global_step": 137496, "epoch": 1656} {"train_loss": -22.4879093170166, "global_step": 137497, "epoch": 1656} {"train_loss": -22.6894588470459, "global_step": 137498, "epoch": 1656} {"train_loss": -22.76784324645996, "global_step": 137499, "epoch": 1656} {"train_loss": -22.978506088256836, "global_step": 137500, "epoch": 1656} {"train_loss": -22.642919540405273, "global_step": 137501, "epoch": 1656} {"train_loss": -22.76576042175293, "global_step": 137502, "epoch": 1656} {"train_loss": -22.983524322509766, "global_step": 137503, "epoch": 1656} {"train_loss": -23.003812789916992, "global_step": 137504, "epoch": 1656} {"train_loss": -22.984882354736328, "global_step": 137505, "epoch": 1656} {"train_loss": -22.906091690063477, "global_step": 137506, "epoch": 1656} {"train_loss": -22.847658157348633, "global_step": 137507, "epoch": 1656} {"train_loss": -23.018939971923828, "global_step": 137508, "epoch": 1656} {"train_loss": -23.13515281677246, "global_step": 137509, "epoch": 1656} {"train_loss": -22.959936141967773, "global_step": 137510, "epoch": 1656} {"train_loss": -22.732629776000977, "global_step": 137511, "epoch": 1656} {"train_loss": -22.631717681884766, "global_step": 137512, "epoch": 1656} {"train_loss": -23.187284469604492, "global_step": 137513, "epoch": 1656} {"train_loss": -23.06825065612793, "global_step": 137514, "epoch": 1656} {"train_loss": -23.0721492767334, "global_step": 137515, "epoch": 1656} {"train_loss": -22.573083877563477, "global_step": 137516, "epoch": 1656} {"train_loss": -22.869123458862305, "global_step": 137517, "epoch": 1656} {"train_loss": -22.94719123840332, "global_step": 137518, "epoch": 1656} {"train_loss": -23.35927391052246, "global_step": 137519, "epoch": 1656} {"train_loss": -23.363908767700195, "global_step": 137520, "epoch": 1656} {"train_loss": -23.229209899902344, "global_step": 137521, "epoch": 1656} {"train_loss": -23.17009162902832, "global_step": 137522, "epoch": 1656} {"train_loss": -23.02800941467285, "global_step": 137523, "epoch": 1656} {"train_loss": -23.264984130859375, "global_step": 137524, "epoch": 1656} {"train_loss": -23.097341537475586, "global_step": 137525, "epoch": 1656} {"train_loss": -22.889699935913086, "global_step": 137526, "epoch": 1656} {"train_loss": -22.85858726501465, "global_step": 137527, "epoch": 1656} {"train_loss": -22.754343032836914, "global_step": 137528, "epoch": 1656} {"train_loss": -23.460447311401367, "global_step": 137529, "epoch": 1656} {"train_loss": -22.91295956990805, "global_step": 137530, "epoch": 1656, "val_loss": 6255003.5} {"train_loss": -22.57854461669922, "global_step": 137531, "epoch": 1657} {"train_loss": -22.74169158935547, "global_step": 137532, "epoch": 1657} {"train_loss": -23.106977462768555, "global_step": 137533, "epoch": 1657} {"train_loss": -22.610376358032227, "global_step": 137534, "epoch": 1657} {"train_loss": -22.7357234954834, "global_step": 137535, "epoch": 1657} {"train_loss": -22.730819702148438, "global_step": 137536, "epoch": 1657} {"train_loss": -22.722381591796875, "global_step": 137537, "epoch": 1657} {"train_loss": -22.831623077392578, "global_step": 137538, "epoch": 1657} {"train_loss": -22.729263305664062, "global_step": 137539, "epoch": 1657} {"train_loss": -22.9680233001709, "global_step": 137540, "epoch": 1657} {"train_loss": -22.409883499145508, "global_step": 137541, "epoch": 1657} {"train_loss": -23.082136154174805, "global_step": 137542, "epoch": 1657} {"train_loss": -22.921674728393555, "global_step": 137543, "epoch": 1657} {"train_loss": -23.1715087890625, "global_step": 137544, "epoch": 1657} {"train_loss": -22.79823875427246, "global_step": 137545, "epoch": 1657} {"train_loss": -22.772367477416992, "global_step": 137546, "epoch": 1657} {"train_loss": -23.05882453918457, "global_step": 137547, "epoch": 1657} {"train_loss": -23.387609481811523, "global_step": 137548, "epoch": 1657} {"train_loss": -22.8459529876709, "global_step": 137549, "epoch": 1657} {"train_loss": -22.992685317993164, "global_step": 137550, "epoch": 1657} {"train_loss": -23.06576919555664, "global_step": 137551, "epoch": 1657} {"train_loss": -22.598867416381836, "global_step": 137552, "epoch": 1657} {"train_loss": -22.942232131958008, "global_step": 137553, "epoch": 1657} {"train_loss": -22.87417984008789, "global_step": 137554, "epoch": 1657} {"train_loss": -22.59000587463379, "global_step": 137555, "epoch": 1657} {"train_loss": -23.141498565673828, "global_step": 137556, "epoch": 1657} {"train_loss": -22.9705753326416, "global_step": 137557, "epoch": 1657} {"train_loss": -22.8184757232666, "global_step": 137558, "epoch": 1657} {"train_loss": -23.12417221069336, "global_step": 137559, "epoch": 1657} {"train_loss": -22.785335540771484, "global_step": 137560, "epoch": 1657} {"train_loss": -22.683120727539062, "global_step": 137561, "epoch": 1657} {"train_loss": -22.818939208984375, "global_step": 137562, "epoch": 1657} {"train_loss": -23.10232925415039, "global_step": 137563, "epoch": 1657} {"train_loss": -22.992246627807617, "global_step": 137564, "epoch": 1657} {"train_loss": -23.156295776367188, "global_step": 137565, "epoch": 1657} {"train_loss": -22.84998893737793, "global_step": 137566, "epoch": 1657} {"train_loss": -22.62189292907715, "global_step": 137567, "epoch": 1657} {"train_loss": -23.20012664794922, "global_step": 137568, "epoch": 1657} {"train_loss": -23.014371871948242, "global_step": 137569, "epoch": 1657} {"train_loss": -22.586477279663086, "global_step": 137570, "epoch": 1657} {"train_loss": -22.89039421081543, "global_step": 137571, "epoch": 1657} {"train_loss": -23.10517692565918, "global_step": 137572, "epoch": 1657} {"train_loss": -22.556909561157227, "global_step": 137573, "epoch": 1657} {"train_loss": -23.04802894592285, "global_step": 137574, "epoch": 1657} {"train_loss": -22.774444580078125, "global_step": 137575, "epoch": 1657} {"train_loss": -22.993515014648438, "global_step": 137576, "epoch": 1657} {"train_loss": -22.862462997436523, "global_step": 137577, "epoch": 1657} {"train_loss": -22.886436462402344, "global_step": 137578, "epoch": 1657} {"train_loss": -23.00670051574707, "global_step": 137579, "epoch": 1657} {"train_loss": -23.02764129638672, "global_step": 137580, "epoch": 1657} {"train_loss": -22.9525146484375, "global_step": 137581, "epoch": 1657} {"train_loss": -22.890995025634766, "global_step": 137582, "epoch": 1657} {"train_loss": -22.911880493164062, "global_step": 137583, "epoch": 1657} {"train_loss": -23.179689407348633, "global_step": 137584, "epoch": 1657} {"train_loss": -23.08932113647461, "global_step": 137585, "epoch": 1657} {"train_loss": -23.024381637573242, "global_step": 137586, "epoch": 1657} {"train_loss": -23.117656707763672, "global_step": 137587, "epoch": 1657} {"train_loss": -23.080106735229492, "global_step": 137588, "epoch": 1657} {"train_loss": -23.178348541259766, "global_step": 137589, "epoch": 1657} {"train_loss": -22.697513580322266, "global_step": 137590, "epoch": 1657} {"train_loss": -23.018217086791992, "global_step": 137591, "epoch": 1657} {"train_loss": -23.263242721557617, "global_step": 137592, "epoch": 1657} {"train_loss": -23.38302993774414, "global_step": 137593, "epoch": 1657} {"train_loss": -23.09333610534668, "global_step": 137594, "epoch": 1657} {"train_loss": -23.021915435791016, "global_step": 137595, "epoch": 1657} {"train_loss": -23.421613693237305, "global_step": 137596, "epoch": 1657} {"train_loss": -23.030654907226562, "global_step": 137597, "epoch": 1657} {"train_loss": -22.967145919799805, "global_step": 137598, "epoch": 1657} {"train_loss": -23.027557373046875, "global_step": 137599, "epoch": 1657} {"train_loss": -22.662866592407227, "global_step": 137600, "epoch": 1657} {"train_loss": -22.47306251525879, "global_step": 137601, "epoch": 1657} {"train_loss": -23.102872848510742, "global_step": 137602, "epoch": 1657} {"train_loss": -23.061323165893555, "global_step": 137603, "epoch": 1657} {"train_loss": -23.011157989501953, "global_step": 137604, "epoch": 1657} {"train_loss": -23.133831024169922, "global_step": 137605, "epoch": 1657} {"train_loss": -22.575908660888672, "global_step": 137606, "epoch": 1657} {"train_loss": -23.141225814819336, "global_step": 137607, "epoch": 1657} {"train_loss": -23.075672149658203, "global_step": 137608, "epoch": 1657} {"train_loss": -22.682937622070312, "global_step": 137609, "epoch": 1657} {"train_loss": -22.487783432006836, "global_step": 137610, "epoch": 1657} {"train_loss": -23.225431442260742, "global_step": 137611, "epoch": 1657} {"train_loss": -22.889934539794922, "global_step": 137612, "epoch": 1657} {"train_loss": -22.93068187208061, "global_step": 137613, "epoch": 1657, "val_loss": 6249777.0} {"train_loss": -22.725147247314453, "global_step": 137614, "epoch": 1658} {"train_loss": -22.961809158325195, "global_step": 137615, "epoch": 1658} {"train_loss": -22.40945816040039, "global_step": 137616, "epoch": 1658} {"train_loss": -22.79852294921875, "global_step": 137617, "epoch": 1658} {"train_loss": -22.37457275390625, "global_step": 137618, "epoch": 1658} {"train_loss": -22.904815673828125, "global_step": 137619, "epoch": 1658} {"train_loss": -22.570987701416016, "global_step": 137620, "epoch": 1658} {"train_loss": -22.71199607849121, "global_step": 137621, "epoch": 1658} {"train_loss": -22.443679809570312, "global_step": 137622, "epoch": 1658} {"train_loss": -23.102365493774414, "global_step": 137623, "epoch": 1658} {"train_loss": -22.50774574279785, "global_step": 137624, "epoch": 1658} {"train_loss": -22.695581436157227, "global_step": 137625, "epoch": 1658} {"train_loss": -22.765140533447266, "global_step": 137626, "epoch": 1658} {"train_loss": -22.702905654907227, "global_step": 137627, "epoch": 1658} {"train_loss": -22.69467544555664, "global_step": 137628, "epoch": 1658} {"train_loss": -22.749242782592773, "global_step": 137629, "epoch": 1658} {"train_loss": -22.930316925048828, "global_step": 137630, "epoch": 1658} {"train_loss": -22.84048080444336, "global_step": 137631, "epoch": 1658} {"train_loss": -22.953956604003906, "global_step": 137632, "epoch": 1658} {"train_loss": -23.06077003479004, "global_step": 137633, "epoch": 1658} {"train_loss": -23.429662704467773, "global_step": 137634, "epoch": 1658} {"train_loss": -22.595420837402344, "global_step": 137635, "epoch": 1658} {"train_loss": -22.863840103149414, "global_step": 137636, "epoch": 1658} {"train_loss": -22.786945343017578, "global_step": 137637, "epoch": 1658} {"train_loss": -22.718799591064453, "global_step": 137638, "epoch": 1658} {"train_loss": -22.656980514526367, "global_step": 137639, "epoch": 1658} {"train_loss": -22.877578735351562, "global_step": 137640, "epoch": 1658} {"train_loss": -22.47064208984375, "global_step": 137641, "epoch": 1658} {"train_loss": -23.25099754333496, "global_step": 137642, "epoch": 1658} {"train_loss": -22.96455955505371, "global_step": 137643, "epoch": 1658} {"train_loss": -23.050626754760742, "global_step": 137644, "epoch": 1658} {"train_loss": -23.16081428527832, "global_step": 137645, "epoch": 1658} {"train_loss": -23.06635093688965, "global_step": 137646, "epoch": 1658} {"train_loss": -23.052927017211914, "global_step": 137647, "epoch": 1658} {"train_loss": -22.88254165649414, "global_step": 137648, "epoch": 1658} {"train_loss": -22.863346099853516, "global_step": 137649, "epoch": 1658} {"train_loss": -23.083959579467773, "global_step": 137650, "epoch": 1658} {"train_loss": -23.034122467041016, "global_step": 137651, "epoch": 1658} {"train_loss": -22.832244873046875, "global_step": 137652, "epoch": 1658} {"train_loss": -23.281085968017578, "global_step": 137653, "epoch": 1658} {"train_loss": -22.877338409423828, "global_step": 137654, "epoch": 1658} {"train_loss": -23.293851852416992, "global_step": 137655, "epoch": 1658} {"train_loss": -23.023374557495117, "global_step": 137656, "epoch": 1658} {"train_loss": -23.239688873291016, "global_step": 137657, "epoch": 1658} {"train_loss": -22.92905044555664, "global_step": 137658, "epoch": 1658} {"train_loss": -23.144630432128906, "global_step": 137659, "epoch": 1658} {"train_loss": -22.916086196899414, "global_step": 137660, "epoch": 1658} {"train_loss": -22.807723999023438, "global_step": 137661, "epoch": 1658} {"train_loss": -22.937528610229492, "global_step": 137662, "epoch": 1658} {"train_loss": -22.697389602661133, "global_step": 137663, "epoch": 1658} {"train_loss": -23.3856201171875, "global_step": 137664, "epoch": 1658} {"train_loss": -22.92711067199707, "global_step": 137665, "epoch": 1658} {"train_loss": -23.166854858398438, "global_step": 137666, "epoch": 1658} {"train_loss": -23.0919246673584, "global_step": 137667, "epoch": 1658} {"train_loss": -22.9853572845459, "global_step": 137668, "epoch": 1658} {"train_loss": -23.44285774230957, "global_step": 137669, "epoch": 1658} {"train_loss": -22.818021774291992, "global_step": 137670, "epoch": 1658} {"train_loss": -23.21298599243164, "global_step": 137671, "epoch": 1658} {"train_loss": -22.56715965270996, "global_step": 137672, "epoch": 1658} {"train_loss": -22.82433319091797, "global_step": 137673, "epoch": 1658} {"train_loss": -23.112689971923828, "global_step": 137674, "epoch": 1658} {"train_loss": -22.703468322753906, "global_step": 137675, "epoch": 1658} {"train_loss": -23.342239379882812, "global_step": 137676, "epoch": 1658} {"train_loss": -22.654382705688477, "global_step": 137677, "epoch": 1658} {"train_loss": -22.653715133666992, "global_step": 137678, "epoch": 1658} {"train_loss": -22.871768951416016, "global_step": 137679, "epoch": 1658} {"train_loss": -22.624807357788086, "global_step": 137680, "epoch": 1658} {"train_loss": -23.16196632385254, "global_step": 137681, "epoch": 1658} {"train_loss": -23.248016357421875, "global_step": 137682, "epoch": 1658} {"train_loss": -22.85990333557129, "global_step": 137683, "epoch": 1658} {"train_loss": -22.74238395690918, "global_step": 137684, "epoch": 1658} {"train_loss": -22.869850158691406, "global_step": 137685, "epoch": 1658} {"train_loss": -23.254993438720703, "global_step": 137686, "epoch": 1658} {"train_loss": -23.15985679626465, "global_step": 137687, "epoch": 1658} {"train_loss": -22.881071090698242, "global_step": 137688, "epoch": 1658} {"train_loss": -23.036962509155273, "global_step": 137689, "epoch": 1658} {"train_loss": -22.974653244018555, "global_step": 137690, "epoch": 1658} {"train_loss": -22.966588973999023, "global_step": 137691, "epoch": 1658} {"train_loss": -22.680923461914062, "global_step": 137692, "epoch": 1658} {"train_loss": -23.027982711791992, "global_step": 137693, "epoch": 1658} {"train_loss": -23.086380004882812, "global_step": 137694, "epoch": 1658} {"train_loss": -22.967994689941406, "global_step": 137695, "epoch": 1658} {"train_loss": -22.89765613050346, "global_step": 137696, "epoch": 1658, "val_loss": 6252555.0} {"train_loss": -22.801151275634766, "global_step": 137697, "epoch": 1659} {"train_loss": -22.862133026123047, "global_step": 137698, "epoch": 1659} {"train_loss": -23.113195419311523, "global_step": 137699, "epoch": 1659} {"train_loss": -22.54305076599121, "global_step": 137700, "epoch": 1659} {"train_loss": -22.314611434936523, "global_step": 137701, "epoch": 1659} {"train_loss": -22.668874740600586, "global_step": 137702, "epoch": 1659} {"train_loss": -23.204578399658203, "global_step": 137703, "epoch": 1659} {"train_loss": -22.374298095703125, "global_step": 137704, "epoch": 1659} {"train_loss": -23.328161239624023, "global_step": 137705, "epoch": 1659} {"train_loss": -22.698118209838867, "global_step": 137706, "epoch": 1659} {"train_loss": -23.056669235229492, "global_step": 137707, "epoch": 1659} {"train_loss": -22.94532585144043, "global_step": 137708, "epoch": 1659} {"train_loss": -23.096315383911133, "global_step": 137709, "epoch": 1659} {"train_loss": -22.830184936523438, "global_step": 137710, "epoch": 1659} {"train_loss": -22.860403060913086, "global_step": 137711, "epoch": 1659} {"train_loss": -22.85882568359375, "global_step": 137712, "epoch": 1659} {"train_loss": -22.9238224029541, "global_step": 137713, "epoch": 1659} {"train_loss": -23.04815101623535, "global_step": 137714, "epoch": 1659} {"train_loss": -22.624235153198242, "global_step": 137715, "epoch": 1659} {"train_loss": -22.83111572265625, "global_step": 137716, "epoch": 1659} {"train_loss": -23.372661590576172, "global_step": 137717, "epoch": 1659} {"train_loss": -22.859384536743164, "global_step": 137718, "epoch": 1659} {"train_loss": -23.08782386779785, "global_step": 137719, "epoch": 1659} {"train_loss": -22.794775009155273, "global_step": 137720, "epoch": 1659} {"train_loss": -22.80562400817871, "global_step": 137721, "epoch": 1659} {"train_loss": -23.0330810546875, "global_step": 137722, "epoch": 1659} {"train_loss": -23.12074851989746, "global_step": 137723, "epoch": 1659} {"train_loss": -23.26936912536621, "global_step": 137724, "epoch": 1659} {"train_loss": -22.701749801635742, "global_step": 137725, "epoch": 1659} {"train_loss": -23.19428253173828, "global_step": 137726, "epoch": 1659} {"train_loss": -23.3876953125, "global_step": 137727, "epoch": 1659} {"train_loss": -22.799232482910156, "global_step": 137728, "epoch": 1659} {"train_loss": -23.223285675048828, "global_step": 137729, "epoch": 1659} {"train_loss": -23.02730369567871, "global_step": 137730, "epoch": 1659} {"train_loss": -23.190927505493164, "global_step": 137731, "epoch": 1659} {"train_loss": -23.113069534301758, "global_step": 137732, "epoch": 1659} {"train_loss": -23.331331253051758, "global_step": 137733, "epoch": 1659} {"train_loss": -22.924840927124023, "global_step": 137734, "epoch": 1659} {"train_loss": -23.233068466186523, "global_step": 137735, "epoch": 1659} {"train_loss": -22.98957633972168, "global_step": 137736, "epoch": 1659} {"train_loss": -22.860897064208984, "global_step": 137737, "epoch": 1659} {"train_loss": -23.253082275390625, "global_step": 137738, "epoch": 1659} {"train_loss": -22.93338966369629, "global_step": 137739, "epoch": 1659} {"train_loss": -23.25702667236328, "global_step": 137740, "epoch": 1659} {"train_loss": -22.80214500427246, "global_step": 137741, "epoch": 1659} {"train_loss": -23.2763614654541, "global_step": 137742, "epoch": 1659} {"train_loss": -22.83144187927246, "global_step": 137743, "epoch": 1659} {"train_loss": -23.25680923461914, "global_step": 137744, "epoch": 1659} {"train_loss": -22.8363037109375, "global_step": 137745, "epoch": 1659} {"train_loss": -22.823585510253906, "global_step": 137746, "epoch": 1659} {"train_loss": -22.918703079223633, "global_step": 137747, "epoch": 1659} {"train_loss": -23.026092529296875, "global_step": 137748, "epoch": 1659} {"train_loss": -22.850425720214844, "global_step": 137749, "epoch": 1659} {"train_loss": -22.744457244873047, "global_step": 137750, "epoch": 1659} {"train_loss": -23.42837905883789, "global_step": 137751, "epoch": 1659} {"train_loss": -23.020689010620117, "global_step": 137752, "epoch": 1659} {"train_loss": -22.7337703704834, "global_step": 137753, "epoch": 1659} {"train_loss": -23.10357093811035, "global_step": 137754, "epoch": 1659} {"train_loss": -22.97249412536621, "global_step": 137755, "epoch": 1659} {"train_loss": -23.178077697753906, "global_step": 137756, "epoch": 1659} {"train_loss": -22.642765045166016, "global_step": 137757, "epoch": 1659} {"train_loss": -23.122343063354492, "global_step": 137758, "epoch": 1659} {"train_loss": -22.819480895996094, "global_step": 137759, "epoch": 1659} {"train_loss": -22.547149658203125, "global_step": 137760, "epoch": 1659} {"train_loss": -23.300146102905273, "global_step": 137761, "epoch": 1659} {"train_loss": -23.09956169128418, "global_step": 137762, "epoch": 1659} {"train_loss": -22.691532135009766, "global_step": 137763, "epoch": 1659} {"train_loss": -22.65142250061035, "global_step": 137764, "epoch": 1659} {"train_loss": -22.753372192382812, "global_step": 137765, "epoch": 1659} {"train_loss": -22.887645721435547, "global_step": 137766, "epoch": 1659} {"train_loss": -22.902862548828125, "global_step": 137767, "epoch": 1659} {"train_loss": -22.666149139404297, "global_step": 137768, "epoch": 1659} {"train_loss": -22.65864372253418, "global_step": 137769, "epoch": 1659} {"train_loss": -22.86945152282715, "global_step": 137770, "epoch": 1659} {"train_loss": -22.751752853393555, "global_step": 137771, "epoch": 1659} {"train_loss": -23.16755485534668, "global_step": 137772, "epoch": 1659} {"train_loss": -22.648273468017578, "global_step": 137773, "epoch": 1659} {"train_loss": -22.972412109375, "global_step": 137774, "epoch": 1659} {"train_loss": -22.879453659057617, "global_step": 137775, "epoch": 1659} {"train_loss": -22.640615463256836, "global_step": 137776, "epoch": 1659} {"train_loss": -22.860279083251953, "global_step": 137777, "epoch": 1659} {"train_loss": -22.968381881713867, "global_step": 137778, "epoch": 1659} {"train_loss": -22.95037051281297, "global_step": 137779, "epoch": 1659, "val_loss": 6255284.0} {"train_loss": -23.091856002807617, "global_step": 137780, "epoch": 1660} {"train_loss": -22.369657516479492, "global_step": 137781, "epoch": 1660} {"train_loss": -22.7274169921875, "global_step": 137782, "epoch": 1660} {"train_loss": -22.870620727539062, "global_step": 137783, "epoch": 1660} {"train_loss": -22.84085464477539, "global_step": 137784, "epoch": 1660} {"train_loss": -22.971134185791016, "global_step": 137785, "epoch": 1660} {"train_loss": -22.45358657836914, "global_step": 137786, "epoch": 1660} {"train_loss": -22.7401180267334, "global_step": 137787, "epoch": 1660} {"train_loss": -23.12518310546875, "global_step": 137788, "epoch": 1660} {"train_loss": -23.124452590942383, "global_step": 137789, "epoch": 1660} {"train_loss": -22.640750885009766, "global_step": 137790, "epoch": 1660} {"train_loss": -22.88176155090332, "global_step": 137791, "epoch": 1660} {"train_loss": -22.790172576904297, "global_step": 137792, "epoch": 1660} {"train_loss": -22.77330780029297, "global_step": 137793, "epoch": 1660} {"train_loss": -22.709802627563477, "global_step": 137794, "epoch": 1660} {"train_loss": -22.728076934814453, "global_step": 137795, "epoch": 1660} {"train_loss": -22.495519638061523, "global_step": 137796, "epoch": 1660} {"train_loss": -22.957128524780273, "global_step": 137797, "epoch": 1660} {"train_loss": -22.983789443969727, "global_step": 137798, "epoch": 1660} {"train_loss": -22.749494552612305, "global_step": 137799, "epoch": 1660} {"train_loss": -22.577116012573242, "global_step": 137800, "epoch": 1660} {"train_loss": -22.940128326416016, "global_step": 137801, "epoch": 1660} {"train_loss": -23.366357803344727, "global_step": 137802, "epoch": 1660} {"train_loss": -22.870168685913086, "global_step": 137803, "epoch": 1660} {"train_loss": -22.81418800354004, "global_step": 137804, "epoch": 1660} {"train_loss": -23.129663467407227, "global_step": 137805, "epoch": 1660} {"train_loss": -22.822744369506836, "global_step": 137806, "epoch": 1660} {"train_loss": -23.010971069335938, "global_step": 137807, "epoch": 1660} {"train_loss": -23.204391479492188, "global_step": 137808, "epoch": 1660} {"train_loss": -23.363428115844727, "global_step": 137809, "epoch": 1660} {"train_loss": -22.940963745117188, "global_step": 137810, "epoch": 1660} {"train_loss": -23.117765426635742, "global_step": 137811, "epoch": 1660} {"train_loss": -22.739389419555664, "global_step": 137812, "epoch": 1660} {"train_loss": -22.97397232055664, "global_step": 137813, "epoch": 1660} {"train_loss": -23.012659072875977, "global_step": 137814, "epoch": 1660} {"train_loss": -22.934804916381836, "global_step": 137815, "epoch": 1660} {"train_loss": -23.143917083740234, "global_step": 137816, "epoch": 1660} {"train_loss": -22.85474395751953, "global_step": 137817, "epoch": 1660} {"train_loss": -23.302051544189453, "global_step": 137818, "epoch": 1660} {"train_loss": -23.291202545166016, "global_step": 137819, "epoch": 1660} {"train_loss": -23.121986389160156, "global_step": 137820, "epoch": 1660} {"train_loss": -22.950124740600586, "global_step": 137821, "epoch": 1660} {"train_loss": -23.535184860229492, "global_step": 137822, "epoch": 1660} {"train_loss": -23.184629440307617, "global_step": 137823, "epoch": 1660} {"train_loss": -22.869625091552734, "global_step": 137824, "epoch": 1660} {"train_loss": -22.753171920776367, "global_step": 137825, "epoch": 1660} {"train_loss": -23.103410720825195, "global_step": 137826, "epoch": 1660} {"train_loss": -23.244245529174805, "global_step": 137827, "epoch": 1660} {"train_loss": -23.18111228942871, "global_step": 137828, "epoch": 1660} {"train_loss": -23.193771362304688, "global_step": 137829, "epoch": 1660} {"train_loss": -23.17601776123047, "global_step": 137830, "epoch": 1660} {"train_loss": -22.85731315612793, "global_step": 137831, "epoch": 1660} {"train_loss": -23.01277732849121, "global_step": 137832, "epoch": 1660} {"train_loss": -22.675342559814453, "global_step": 137833, "epoch": 1660} {"train_loss": -22.5479679107666, "global_step": 137834, "epoch": 1660} {"train_loss": -22.110671997070312, "global_step": 137835, "epoch": 1660} {"train_loss": -22.23065948486328, "global_step": 137836, "epoch": 1660} {"train_loss": -22.68947410583496, "global_step": 137837, "epoch": 1660} {"train_loss": -22.426727294921875, "global_step": 137838, "epoch": 1660} {"train_loss": -22.589040756225586, "global_step": 137839, "epoch": 1660} {"train_loss": -22.281082153320312, "global_step": 137840, "epoch": 1660} {"train_loss": -22.609960556030273, "global_step": 137841, "epoch": 1660} {"train_loss": -22.608047485351562, "global_step": 137842, "epoch": 1660} {"train_loss": -22.525634765625, "global_step": 137843, "epoch": 1660} {"train_loss": -22.252134323120117, "global_step": 137844, "epoch": 1660} {"train_loss": -22.78846549987793, "global_step": 137845, "epoch": 1660} {"train_loss": -22.838855743408203, "global_step": 137846, "epoch": 1660} {"train_loss": -22.49411964416504, "global_step": 137847, "epoch": 1660} {"train_loss": -22.763601303100586, "global_step": 137848, "epoch": 1660} {"train_loss": -22.88416862487793, "global_step": 137849, "epoch": 1660} {"train_loss": -22.703157424926758, "global_step": 137850, "epoch": 1660} {"train_loss": -22.779516220092773, "global_step": 137851, "epoch": 1660} {"train_loss": -22.95223045349121, "global_step": 137852, "epoch": 1660} {"train_loss": -22.87632179260254, "global_step": 137853, "epoch": 1660} {"train_loss": -22.804269790649414, "global_step": 137854, "epoch": 1660} {"train_loss": -22.98839569091797, "global_step": 137855, "epoch": 1660} {"train_loss": -22.672576904296875, "global_step": 137856, "epoch": 1660} {"train_loss": -23.260343551635742, "global_step": 137857, "epoch": 1660} {"train_loss": -23.141006469726562, "global_step": 137858, "epoch": 1660} {"train_loss": -22.460519790649414, "global_step": 137859, "epoch": 1660} {"train_loss": -22.918832778930664, "global_step": 137860, "epoch": 1660} {"train_loss": -22.904281616210938, "global_step": 137861, "epoch": 1660} {"train_loss": -22.851958240371154, "global_step": 137862, "epoch": 1660, "val_loss": 6199419.0} {"train_loss": -22.88157081604004, "global_step": 137863, "epoch": 1661} {"train_loss": -22.399789810180664, "global_step": 137864, "epoch": 1661} {"train_loss": -22.925724029541016, "global_step": 137865, "epoch": 1661} {"train_loss": -22.55596923828125, "global_step": 137866, "epoch": 1661} {"train_loss": -22.863601684570312, "global_step": 137867, "epoch": 1661} {"train_loss": -22.8735294342041, "global_step": 137868, "epoch": 1661} {"train_loss": -22.569772720336914, "global_step": 137869, "epoch": 1661} {"train_loss": -22.537723541259766, "global_step": 137870, "epoch": 1661} {"train_loss": -22.817670822143555, "global_step": 137871, "epoch": 1661} {"train_loss": -22.473535537719727, "global_step": 137872, "epoch": 1661} {"train_loss": -22.86031150817871, "global_step": 137873, "epoch": 1661} {"train_loss": -22.52400016784668, "global_step": 137874, "epoch": 1661} {"train_loss": -22.562990188598633, "global_step": 137875, "epoch": 1661} {"train_loss": -22.850223541259766, "global_step": 137876, "epoch": 1661} {"train_loss": -22.392475128173828, "global_step": 137877, "epoch": 1661} {"train_loss": -23.08448600769043, "global_step": 137878, "epoch": 1661} {"train_loss": -22.464567184448242, "global_step": 137879, "epoch": 1661} {"train_loss": -22.95710563659668, "global_step": 137880, "epoch": 1661} {"train_loss": -22.658056259155273, "global_step": 137881, "epoch": 1661} {"train_loss": -22.709196090698242, "global_step": 137882, "epoch": 1661} {"train_loss": -22.50205421447754, "global_step": 137883, "epoch": 1661} {"train_loss": -22.548696517944336, "global_step": 137884, "epoch": 1661} {"train_loss": -22.61474609375, "global_step": 137885, "epoch": 1661} {"train_loss": -22.925146102905273, "global_step": 137886, "epoch": 1661} {"train_loss": -22.924453735351562, "global_step": 137887, "epoch": 1661} {"train_loss": -22.6972713470459, "global_step": 137888, "epoch": 1661} {"train_loss": -22.74214744567871, "global_step": 137889, "epoch": 1661} {"train_loss": -22.76214027404785, "global_step": 137890, "epoch": 1661} {"train_loss": -22.51215934753418, "global_step": 137891, "epoch": 1661} {"train_loss": -23.16261863708496, "global_step": 137892, "epoch": 1661} {"train_loss": -23.165006637573242, "global_step": 137893, "epoch": 1661} {"train_loss": -22.894540786743164, "global_step": 137894, "epoch": 1661} {"train_loss": -22.97035026550293, "global_step": 137895, "epoch": 1661} {"train_loss": -22.79196548461914, "global_step": 137896, "epoch": 1661} {"train_loss": -23.103914260864258, "global_step": 137897, "epoch": 1661} {"train_loss": -22.59539794921875, "global_step": 137898, "epoch": 1661} {"train_loss": -22.971200942993164, "global_step": 137899, "epoch": 1661} {"train_loss": -22.837390899658203, "global_step": 137900, "epoch": 1661} {"train_loss": -22.497432708740234, "global_step": 137901, "epoch": 1661} {"train_loss": -22.919198989868164, "global_step": 137902, "epoch": 1661} {"train_loss": -22.77010154724121, "global_step": 137903, "epoch": 1661} {"train_loss": -23.092302322387695, "global_step": 137904, "epoch": 1661} {"train_loss": -22.936323165893555, "global_step": 137905, "epoch": 1661} {"train_loss": -22.757568359375, "global_step": 137906, "epoch": 1661} {"train_loss": -23.09229850769043, "global_step": 137907, "epoch": 1661} {"train_loss": -22.897281646728516, "global_step": 137908, "epoch": 1661} {"train_loss": -22.912738800048828, "global_step": 137909, "epoch": 1661} {"train_loss": -23.16891860961914, "global_step": 137910, "epoch": 1661} {"train_loss": -22.96927261352539, "global_step": 137911, "epoch": 1661} {"train_loss": -23.044612884521484, "global_step": 137912, "epoch": 1661} {"train_loss": -23.121360778808594, "global_step": 137913, "epoch": 1661} {"train_loss": -23.020618438720703, "global_step": 137914, "epoch": 1661} {"train_loss": -22.844480514526367, "global_step": 137915, "epoch": 1661} {"train_loss": -23.050024032592773, "global_step": 137916, "epoch": 1661} {"train_loss": -23.11384391784668, "global_step": 137917, "epoch": 1661} {"train_loss": -22.68739891052246, "global_step": 137918, "epoch": 1661} {"train_loss": -23.11295509338379, "global_step": 137919, "epoch": 1661} {"train_loss": -23.2179012298584, "global_step": 137920, "epoch": 1661} {"train_loss": -22.882192611694336, "global_step": 137921, "epoch": 1661} {"train_loss": -23.01070213317871, "global_step": 137922, "epoch": 1661} {"train_loss": -23.18718910217285, "global_step": 137923, "epoch": 1661} {"train_loss": -23.061155319213867, "global_step": 137924, "epoch": 1661} {"train_loss": -23.320209503173828, "global_step": 137925, "epoch": 1661} {"train_loss": -23.02653694152832, "global_step": 137926, "epoch": 1661} {"train_loss": -22.869312286376953, "global_step": 137927, "epoch": 1661} {"train_loss": -23.087894439697266, "global_step": 137928, "epoch": 1661} {"train_loss": -23.162158966064453, "global_step": 137929, "epoch": 1661} {"train_loss": -23.18817901611328, "global_step": 137930, "epoch": 1661} {"train_loss": -22.849843978881836, "global_step": 137931, "epoch": 1661} {"train_loss": -23.25428581237793, "global_step": 137932, "epoch": 1661} {"train_loss": -23.188337326049805, "global_step": 137933, "epoch": 1661} {"train_loss": -22.890256881713867, "global_step": 137934, "epoch": 1661} {"train_loss": -23.392675399780273, "global_step": 137935, "epoch": 1661} {"train_loss": -22.91435432434082, "global_step": 137936, "epoch": 1661} {"train_loss": -22.98158836364746, "global_step": 137937, "epoch": 1661} {"train_loss": -23.266843795776367, "global_step": 137938, "epoch": 1661} {"train_loss": -22.92603874206543, "global_step": 137939, "epoch": 1661} {"train_loss": -23.108190536499023, "global_step": 137940, "epoch": 1661} {"train_loss": -22.87113380432129, "global_step": 137941, "epoch": 1661} {"train_loss": -23.14204978942871, "global_step": 137942, "epoch": 1661} {"train_loss": -23.023740768432617, "global_step": 137943, "epoch": 1661} {"train_loss": -23.080259323120117, "global_step": 137944, "epoch": 1661} {"train_loss": -22.89732563064759, "global_step": 137945, "epoch": 1661, "val_loss": 6303510.5} {"train_loss": -22.980192184448242, "global_step": 137946, "epoch": 1662} {"train_loss": -22.865121841430664, "global_step": 137947, "epoch": 1662} {"train_loss": -22.59620475769043, "global_step": 137948, "epoch": 1662} {"train_loss": -22.7929630279541, "global_step": 137949, "epoch": 1662} {"train_loss": -22.879701614379883, "global_step": 137950, "epoch": 1662} {"train_loss": -22.975141525268555, "global_step": 137951, "epoch": 1662} {"train_loss": -23.08180809020996, "global_step": 137952, "epoch": 1662} {"train_loss": -22.866527557373047, "global_step": 137953, "epoch": 1662} {"train_loss": -22.958276748657227, "global_step": 137954, "epoch": 1662} {"train_loss": -23.04255485534668, "global_step": 137955, "epoch": 1662} {"train_loss": -22.893585205078125, "global_step": 137956, "epoch": 1662} {"train_loss": -22.945743560791016, "global_step": 137957, "epoch": 1662} {"train_loss": -23.076276779174805, "global_step": 137958, "epoch": 1662} {"train_loss": -22.82379722595215, "global_step": 137959, "epoch": 1662} {"train_loss": -22.953237533569336, "global_step": 137960, "epoch": 1662} {"train_loss": -23.18448829650879, "global_step": 137961, "epoch": 1662} {"train_loss": -22.644567489624023, "global_step": 137962, "epoch": 1662} {"train_loss": -22.723176956176758, "global_step": 137963, "epoch": 1662} {"train_loss": -23.074106216430664, "global_step": 137964, "epoch": 1662} {"train_loss": -22.570783615112305, "global_step": 137965, "epoch": 1662} {"train_loss": -22.90288734436035, "global_step": 137966, "epoch": 1662} {"train_loss": -22.74858283996582, "global_step": 137967, "epoch": 1662} {"train_loss": -22.76542091369629, "global_step": 137968, "epoch": 1662} {"train_loss": -22.85976791381836, "global_step": 137969, "epoch": 1662} {"train_loss": -22.76886558532715, "global_step": 137970, "epoch": 1662} {"train_loss": -22.930185317993164, "global_step": 137971, "epoch": 1662} {"train_loss": -23.092578887939453, "global_step": 137972, "epoch": 1662} {"train_loss": -22.91908836364746, "global_step": 137973, "epoch": 1662} {"train_loss": -22.956151962280273, "global_step": 137974, "epoch": 1662} {"train_loss": -22.649267196655273, "global_step": 137975, "epoch": 1662} {"train_loss": -23.04097557067871, "global_step": 137976, "epoch": 1662} {"train_loss": -22.819103240966797, "global_step": 137977, "epoch": 1662} {"train_loss": -22.87734603881836, "global_step": 137978, "epoch": 1662} {"train_loss": -22.754318237304688, "global_step": 137979, "epoch": 1662} {"train_loss": -23.18153953552246, "global_step": 137980, "epoch": 1662} {"train_loss": -23.096683502197266, "global_step": 137981, "epoch": 1662} {"train_loss": -22.838041305541992, "global_step": 137982, "epoch": 1662} {"train_loss": -22.911123275756836, "global_step": 137983, "epoch": 1662} {"train_loss": -23.25192642211914, "global_step": 137984, "epoch": 1662} {"train_loss": -23.216703414916992, "global_step": 137985, "epoch": 1662} {"train_loss": -23.08091163635254, "global_step": 137986, "epoch": 1662} {"train_loss": -23.3267879486084, "global_step": 137987, "epoch": 1662} {"train_loss": -23.256141662597656, "global_step": 137988, "epoch": 1662} {"train_loss": -23.32053565979004, "global_step": 137989, "epoch": 1662} {"train_loss": -23.353118896484375, "global_step": 137990, "epoch": 1662} {"train_loss": -23.165746688842773, "global_step": 137991, "epoch": 1662} {"train_loss": -23.393640518188477, "global_step": 137992, "epoch": 1662} {"train_loss": -22.596097946166992, "global_step": 137993, "epoch": 1662} {"train_loss": -23.02119255065918, "global_step": 137994, "epoch": 1662} {"train_loss": -22.792875289916992, "global_step": 137995, "epoch": 1662} {"train_loss": -23.016855239868164, "global_step": 137996, "epoch": 1662} {"train_loss": -23.100488662719727, "global_step": 137997, "epoch": 1662} {"train_loss": -23.214311599731445, "global_step": 137998, "epoch": 1662} {"train_loss": -22.909645080566406, "global_step": 137999, "epoch": 1662} {"train_loss": -22.98855972290039, "global_step": 138000, "epoch": 1662} {"train_loss": -23.23676109313965, "global_step": 138001, "epoch": 1662} {"train_loss": -22.921478271484375, "global_step": 138002, "epoch": 1662} {"train_loss": -22.645816802978516, "global_step": 138003, "epoch": 1662} {"train_loss": -22.997474670410156, "global_step": 138004, "epoch": 1662} {"train_loss": -23.168354034423828, "global_step": 138005, "epoch": 1662} {"train_loss": -22.84235191345215, "global_step": 138006, "epoch": 1662} {"train_loss": -22.813556671142578, "global_step": 138007, "epoch": 1662} {"train_loss": -22.76297378540039, "global_step": 138008, "epoch": 1662} {"train_loss": -22.972787857055664, "global_step": 138009, "epoch": 1662} {"train_loss": -23.104726791381836, "global_step": 138010, "epoch": 1662} {"train_loss": -22.467737197875977, "global_step": 138011, "epoch": 1662} {"train_loss": -22.941343307495117, "global_step": 138012, "epoch": 1662} {"train_loss": -23.077930450439453, "global_step": 138013, "epoch": 1662} {"train_loss": -23.135488510131836, "global_step": 138014, "epoch": 1662} {"train_loss": -22.64985466003418, "global_step": 138015, "epoch": 1662} {"train_loss": -23.119176864624023, "global_step": 138016, "epoch": 1662} {"train_loss": -23.385528564453125, "global_step": 138017, "epoch": 1662} {"train_loss": -23.00905418395996, "global_step": 138018, "epoch": 1662} {"train_loss": -22.598447799682617, "global_step": 138019, "epoch": 1662} {"train_loss": -22.87925910949707, "global_step": 138020, "epoch": 1662} {"train_loss": -23.455320358276367, "global_step": 138021, "epoch": 1662} {"train_loss": -23.217548370361328, "global_step": 138022, "epoch": 1662} {"train_loss": -23.132625579833984, "global_step": 138023, "epoch": 1662} {"train_loss": -23.030847549438477, "global_step": 138024, "epoch": 1662} {"train_loss": -23.10546875, "global_step": 138025, "epoch": 1662} {"train_loss": -22.98506736755371, "global_step": 138026, "epoch": 1662} {"train_loss": -22.973148345947266, "global_step": 138027, "epoch": 1662} {"train_loss": -22.976853221295826, "global_step": 138028, "epoch": 1662, "val_loss": 6259332.5} {"train_loss": -22.535985946655273, "global_step": 138029, "epoch": 1663} {"train_loss": -22.10966682434082, "global_step": 138030, "epoch": 1663} {"train_loss": -22.69148063659668, "global_step": 138031, "epoch": 1663} {"train_loss": -22.842588424682617, "global_step": 138032, "epoch": 1663} {"train_loss": -22.253677368164062, "global_step": 138033, "epoch": 1663} {"train_loss": -23.07605743408203, "global_step": 138034, "epoch": 1663} {"train_loss": -22.6363582611084, "global_step": 138035, "epoch": 1663} {"train_loss": -23.200544357299805, "global_step": 138036, "epoch": 1663} {"train_loss": -22.810348510742188, "global_step": 138037, "epoch": 1663} {"train_loss": -22.89654541015625, "global_step": 138038, "epoch": 1663} {"train_loss": -22.703516006469727, "global_step": 138039, "epoch": 1663} {"train_loss": -22.62335205078125, "global_step": 138040, "epoch": 1663} {"train_loss": -22.864517211914062, "global_step": 138041, "epoch": 1663} {"train_loss": -22.81296157836914, "global_step": 138042, "epoch": 1663} {"train_loss": -22.627573013305664, "global_step": 138043, "epoch": 1663} {"train_loss": -23.152088165283203, "global_step": 138044, "epoch": 1663} {"train_loss": -22.61590576171875, "global_step": 138045, "epoch": 1663} {"train_loss": -22.758590698242188, "global_step": 138046, "epoch": 1663} {"train_loss": -22.533676147460938, "global_step": 138047, "epoch": 1663} {"train_loss": -22.74962043762207, "global_step": 138048, "epoch": 1663} {"train_loss": -23.0203857421875, "global_step": 138049, "epoch": 1663} {"train_loss": -23.110687255859375, "global_step": 138050, "epoch": 1663} {"train_loss": -22.747894287109375, "global_step": 138051, "epoch": 1663} {"train_loss": -22.582990646362305, "global_step": 138052, "epoch": 1663} {"train_loss": -23.188817977905273, "global_step": 138053, "epoch": 1663} {"train_loss": -23.08050537109375, "global_step": 138054, "epoch": 1663} {"train_loss": -22.9664306640625, "global_step": 138055, "epoch": 1663} {"train_loss": -23.00153923034668, "global_step": 138056, "epoch": 1663} {"train_loss": -22.960111618041992, "global_step": 138057, "epoch": 1663} {"train_loss": -23.35391616821289, "global_step": 138058, "epoch": 1663} {"train_loss": -23.00198745727539, "global_step": 138059, "epoch": 1663} {"train_loss": -23.080198287963867, "global_step": 138060, "epoch": 1663} {"train_loss": -22.837553024291992, "global_step": 138061, "epoch": 1663} {"train_loss": -23.007909774780273, "global_step": 138062, "epoch": 1663} {"train_loss": -22.86751365661621, "global_step": 138063, "epoch": 1663} {"train_loss": -23.02455711364746, "global_step": 138064, "epoch": 1663} {"train_loss": -22.985132217407227, "global_step": 138065, "epoch": 1663} {"train_loss": -22.92659568786621, "global_step": 138066, "epoch": 1663} {"train_loss": -22.825044631958008, "global_step": 138067, "epoch": 1663} {"train_loss": -22.942270278930664, "global_step": 138068, "epoch": 1663} {"train_loss": -23.068384170532227, "global_step": 138069, "epoch": 1663} {"train_loss": -23.18158531188965, "global_step": 138070, "epoch": 1663} {"train_loss": -22.796857833862305, "global_step": 138071, "epoch": 1663} {"train_loss": -22.969186782836914, "global_step": 138072, "epoch": 1663} {"train_loss": -22.75311279296875, "global_step": 138073, "epoch": 1663} {"train_loss": -22.97420310974121, "global_step": 138074, "epoch": 1663} {"train_loss": -23.278234481811523, "global_step": 138075, "epoch": 1663} {"train_loss": -23.293725967407227, "global_step": 138076, "epoch": 1663} {"train_loss": -23.35529899597168, "global_step": 138077, "epoch": 1663} {"train_loss": -23.14681053161621, "global_step": 138078, "epoch": 1663} {"train_loss": -23.1175479888916, "global_step": 138079, "epoch": 1663} {"train_loss": -23.08992576599121, "global_step": 138080, "epoch": 1663} {"train_loss": -23.257658004760742, "global_step": 138081, "epoch": 1663} {"train_loss": -22.763629913330078, "global_step": 138082, "epoch": 1663} {"train_loss": -22.814634323120117, "global_step": 138083, "epoch": 1663} {"train_loss": -23.163537979125977, "global_step": 138084, "epoch": 1663} {"train_loss": -23.230941772460938, "global_step": 138085, "epoch": 1663} {"train_loss": -22.70237159729004, "global_step": 138086, "epoch": 1663} {"train_loss": -22.94116973876953, "global_step": 138087, "epoch": 1663} {"train_loss": -23.210168838500977, "global_step": 138088, "epoch": 1663} {"train_loss": -22.973800659179688, "global_step": 138089, "epoch": 1663} {"train_loss": -22.800296783447266, "global_step": 138090, "epoch": 1663} {"train_loss": -22.93253517150879, "global_step": 138091, "epoch": 1663} {"train_loss": -22.953157424926758, "global_step": 138092, "epoch": 1663} {"train_loss": -22.758935928344727, "global_step": 138093, "epoch": 1663} {"train_loss": -23.058889389038086, "global_step": 138094, "epoch": 1663} {"train_loss": -22.623655319213867, "global_step": 138095, "epoch": 1663} {"train_loss": -22.77294921875, "global_step": 138096, "epoch": 1663} {"train_loss": -23.282548904418945, "global_step": 138097, "epoch": 1663} {"train_loss": -22.831958770751953, "global_step": 138098, "epoch": 1663} {"train_loss": -22.93330192565918, "global_step": 138099, "epoch": 1663} {"train_loss": -22.833328247070312, "global_step": 138100, "epoch": 1663} {"train_loss": -23.18589973449707, "global_step": 138101, "epoch": 1663} {"train_loss": -22.87278175354004, "global_step": 138102, "epoch": 1663} {"train_loss": -23.239370346069336, "global_step": 138103, "epoch": 1663} {"train_loss": -22.971742630004883, "global_step": 138104, "epoch": 1663} {"train_loss": -22.888076782226562, "global_step": 138105, "epoch": 1663} {"train_loss": -22.836591720581055, "global_step": 138106, "epoch": 1663} {"train_loss": -23.120105743408203, "global_step": 138107, "epoch": 1663} {"train_loss": -23.060163497924805, "global_step": 138108, "epoch": 1663} {"train_loss": -23.064340591430664, "global_step": 138109, "epoch": 1663} {"train_loss": -23.015233993530273, "global_step": 138110, "epoch": 1663} {"train_loss": -22.94251607412315, "global_step": 138111, "epoch": 1663, "val_loss": 6191098.0} {"train_loss": -22.216915130615234, "global_step": 138112, "epoch": 1664} {"train_loss": -22.61056137084961, "global_step": 138113, "epoch": 1664} {"train_loss": -22.2872257232666, "global_step": 138114, "epoch": 1664} {"train_loss": -22.889286041259766, "global_step": 138115, "epoch": 1664} {"train_loss": -22.395427703857422, "global_step": 138116, "epoch": 1664} {"train_loss": -22.588788986206055, "global_step": 138117, "epoch": 1664} {"train_loss": -22.0147762298584, "global_step": 138118, "epoch": 1664} {"train_loss": -22.675790786743164, "global_step": 138119, "epoch": 1664} {"train_loss": -22.51106071472168, "global_step": 138120, "epoch": 1664} {"train_loss": -23.004791259765625, "global_step": 138121, "epoch": 1664} {"train_loss": -22.398611068725586, "global_step": 138122, "epoch": 1664} {"train_loss": -22.50625991821289, "global_step": 138123, "epoch": 1664} {"train_loss": -22.80238914489746, "global_step": 138124, "epoch": 1664} {"train_loss": -22.995466232299805, "global_step": 138125, "epoch": 1664} {"train_loss": -22.821741104125977, "global_step": 138126, "epoch": 1664} {"train_loss": -22.91800308227539, "global_step": 138127, "epoch": 1664} {"train_loss": -22.99281883239746, "global_step": 138128, "epoch": 1664} {"train_loss": -22.445947647094727, "global_step": 138129, "epoch": 1664} {"train_loss": -22.681795120239258, "global_step": 138130, "epoch": 1664} {"train_loss": -22.542612075805664, "global_step": 138131, "epoch": 1664} {"train_loss": -22.74332618713379, "global_step": 138132, "epoch": 1664} {"train_loss": -23.009939193725586, "global_step": 138133, "epoch": 1664} {"train_loss": -23.062997817993164, "global_step": 138134, "epoch": 1664} {"train_loss": -22.758663177490234, "global_step": 138135, "epoch": 1664} {"train_loss": -23.080854415893555, "global_step": 138136, "epoch": 1664} {"train_loss": -22.851240158081055, "global_step": 138137, "epoch": 1664} {"train_loss": -22.752914428710938, "global_step": 138138, "epoch": 1664} {"train_loss": -22.899839401245117, "global_step": 138139, "epoch": 1664} {"train_loss": -22.87666893005371, "global_step": 138140, "epoch": 1664} {"train_loss": -23.13608741760254, "global_step": 138141, "epoch": 1664} {"train_loss": -22.66921043395996, "global_step": 138142, "epoch": 1664} {"train_loss": -23.20804786682129, "global_step": 138143, "epoch": 1664} {"train_loss": -23.11783790588379, "global_step": 138144, "epoch": 1664} {"train_loss": -22.853185653686523, "global_step": 138145, "epoch": 1664} {"train_loss": -22.715906143188477, "global_step": 138146, "epoch": 1664} {"train_loss": -22.657745361328125, "global_step": 138147, "epoch": 1664} {"train_loss": -23.063827514648438, "global_step": 138148, "epoch": 1664} {"train_loss": -22.57260513305664, "global_step": 138149, "epoch": 1664} {"train_loss": -23.13276481628418, "global_step": 138150, "epoch": 1664} {"train_loss": -22.973588943481445, "global_step": 138151, "epoch": 1664} {"train_loss": -22.951580047607422, "global_step": 138152, "epoch": 1664} {"train_loss": -22.63663101196289, "global_step": 138153, "epoch": 1664} {"train_loss": -22.791120529174805, "global_step": 138154, "epoch": 1664} {"train_loss": -23.292034149169922, "global_step": 138155, "epoch": 1664} {"train_loss": -22.89278221130371, "global_step": 138156, "epoch": 1664} {"train_loss": -22.927457809448242, "global_step": 138157, "epoch": 1664} {"train_loss": -22.887237548828125, "global_step": 138158, "epoch": 1664} {"train_loss": -22.9459228515625, "global_step": 138159, "epoch": 1664} {"train_loss": -22.862384796142578, "global_step": 138160, "epoch": 1664} {"train_loss": -23.47279930114746, "global_step": 138161, "epoch": 1664} {"train_loss": -22.79825782775879, "global_step": 138162, "epoch": 1664} {"train_loss": -23.252151489257812, "global_step": 138163, "epoch": 1664} {"train_loss": -23.268482208251953, "global_step": 138164, "epoch": 1664} {"train_loss": -22.823760986328125, "global_step": 138165, "epoch": 1664} {"train_loss": -23.209753036499023, "global_step": 138166, "epoch": 1664} {"train_loss": -23.53731346130371, "global_step": 138167, "epoch": 1664} {"train_loss": -22.874717712402344, "global_step": 138168, "epoch": 1664} {"train_loss": -23.341718673706055, "global_step": 138169, "epoch": 1664} {"train_loss": -23.042667388916016, "global_step": 138170, "epoch": 1664} {"train_loss": -23.173234939575195, "global_step": 138171, "epoch": 1664} {"train_loss": -22.995901107788086, "global_step": 138172, "epoch": 1664} {"train_loss": -23.407102584838867, "global_step": 138173, "epoch": 1664} {"train_loss": -22.9725284576416, "global_step": 138174, "epoch": 1664} {"train_loss": -22.80650520324707, "global_step": 138175, "epoch": 1664} {"train_loss": -23.13050651550293, "global_step": 138176, "epoch": 1664} {"train_loss": -23.05547523498535, "global_step": 138177, "epoch": 1664} {"train_loss": -22.769535064697266, "global_step": 138178, "epoch": 1664} {"train_loss": -23.333101272583008, "global_step": 138179, "epoch": 1664} {"train_loss": -23.400527954101562, "global_step": 138180, "epoch": 1664} {"train_loss": -22.76088523864746, "global_step": 138181, "epoch": 1664} {"train_loss": -23.295902252197266, "global_step": 138182, "epoch": 1664} {"train_loss": -22.8253231048584, "global_step": 138183, "epoch": 1664} {"train_loss": -23.028989791870117, "global_step": 138184, "epoch": 1664} {"train_loss": -23.30168342590332, "global_step": 138185, "epoch": 1664} {"train_loss": -22.85601043701172, "global_step": 138186, "epoch": 1664} {"train_loss": -22.936574935913086, "global_step": 138187, "epoch": 1664} {"train_loss": -23.19232749938965, "global_step": 138188, "epoch": 1664} {"train_loss": -23.017370223999023, "global_step": 138189, "epoch": 1664} {"train_loss": -22.628360748291016, "global_step": 138190, "epoch": 1664} {"train_loss": -23.359027862548828, "global_step": 138191, "epoch": 1664} {"train_loss": -23.32044792175293, "global_step": 138192, "epoch": 1664} {"train_loss": -23.480276107788086, "global_step": 138193, "epoch": 1664} {"train_loss": -22.89391143063465, "global_step": 138194, "epoch": 1664, "val_loss": 6293890.5} {"train_loss": -22.57543182373047, "global_step": 138195, "epoch": 1665} {"train_loss": -22.78509521484375, "global_step": 138196, "epoch": 1665} {"train_loss": -22.842023849487305, "global_step": 138197, "epoch": 1665} {"train_loss": -22.446836471557617, "global_step": 138198, "epoch": 1665} {"train_loss": -22.538381576538086, "global_step": 138199, "epoch": 1665} {"train_loss": -22.41452407836914, "global_step": 138200, "epoch": 1665} {"train_loss": -22.885452270507812, "global_step": 138201, "epoch": 1665} {"train_loss": -22.302968978881836, "global_step": 138202, "epoch": 1665} {"train_loss": -22.443317413330078, "global_step": 138203, "epoch": 1665} {"train_loss": -22.42616844177246, "global_step": 138204, "epoch": 1665} {"train_loss": -22.566951751708984, "global_step": 138205, "epoch": 1665} {"train_loss": -22.332223892211914, "global_step": 138206, "epoch": 1665} {"train_loss": -22.813047409057617, "global_step": 138207, "epoch": 1665} {"train_loss": -22.527015686035156, "global_step": 138208, "epoch": 1665} {"train_loss": -22.642200469970703, "global_step": 138209, "epoch": 1665} {"train_loss": -22.656421661376953, "global_step": 138210, "epoch": 1665} {"train_loss": -22.546072006225586, "global_step": 138211, "epoch": 1665} {"train_loss": -22.711994171142578, "global_step": 138212, "epoch": 1665} {"train_loss": -23.09184455871582, "global_step": 138213, "epoch": 1665} {"train_loss": -22.371397018432617, "global_step": 138214, "epoch": 1665} {"train_loss": -22.592741012573242, "global_step": 138215, "epoch": 1665} {"train_loss": -22.585405349731445, "global_step": 138216, "epoch": 1665} {"train_loss": -22.75691795349121, "global_step": 138217, "epoch": 1665} {"train_loss": -22.951513290405273, "global_step": 138218, "epoch": 1665} {"train_loss": -22.598968505859375, "global_step": 138219, "epoch": 1665} {"train_loss": -22.892044067382812, "global_step": 138220, "epoch": 1665} {"train_loss": -22.431406021118164, "global_step": 138221, "epoch": 1665} {"train_loss": -22.66236686706543, "global_step": 138222, "epoch": 1665} {"train_loss": -22.891944885253906, "global_step": 138223, "epoch": 1665} {"train_loss": -23.013402938842773, "global_step": 138224, "epoch": 1665} {"train_loss": -22.699230194091797, "global_step": 138225, "epoch": 1665} {"train_loss": -22.99979591369629, "global_step": 138226, "epoch": 1665} {"train_loss": -23.27370262145996, "global_step": 138227, "epoch": 1665} {"train_loss": -22.812793731689453, "global_step": 138228, "epoch": 1665} {"train_loss": -23.15667152404785, "global_step": 138229, "epoch": 1665} {"train_loss": -22.76022720336914, "global_step": 138230, "epoch": 1665} {"train_loss": -22.82123374938965, "global_step": 138231, "epoch": 1665} {"train_loss": -23.295164108276367, "global_step": 138232, "epoch": 1665} {"train_loss": -23.0345458984375, "global_step": 138233, "epoch": 1665} {"train_loss": -22.743881225585938, "global_step": 138234, "epoch": 1665} {"train_loss": -22.99197769165039, "global_step": 138235, "epoch": 1665} {"train_loss": -23.362180709838867, "global_step": 138236, "epoch": 1665} {"train_loss": -23.203914642333984, "global_step": 138237, "epoch": 1665} {"train_loss": -22.966520309448242, "global_step": 138238, "epoch": 1665} {"train_loss": -22.86481285095215, "global_step": 138239, "epoch": 1665} {"train_loss": -22.75457763671875, "global_step": 138240, "epoch": 1665} {"train_loss": -23.284072875976562, "global_step": 138241, "epoch": 1665} {"train_loss": -22.81825828552246, "global_step": 138242, "epoch": 1665} {"train_loss": -22.97731590270996, "global_step": 138243, "epoch": 1665} {"train_loss": -23.17848777770996, "global_step": 138244, "epoch": 1665} {"train_loss": -22.88505744934082, "global_step": 138245, "epoch": 1665} {"train_loss": -23.18239974975586, "global_step": 138246, "epoch": 1665} {"train_loss": -22.75897216796875, "global_step": 138247, "epoch": 1665} {"train_loss": -22.798307418823242, "global_step": 138248, "epoch": 1665} {"train_loss": -22.949031829833984, "global_step": 138249, "epoch": 1665} {"train_loss": -23.00140953063965, "global_step": 138250, "epoch": 1665} {"train_loss": -23.202756881713867, "global_step": 138251, "epoch": 1665} {"train_loss": -23.251388549804688, "global_step": 138252, "epoch": 1665} {"train_loss": -23.166414260864258, "global_step": 138253, "epoch": 1665} {"train_loss": -22.94403076171875, "global_step": 138254, "epoch": 1665} {"train_loss": -23.2719669342041, "global_step": 138255, "epoch": 1665} {"train_loss": -23.255468368530273, "global_step": 138256, "epoch": 1665} {"train_loss": -23.445241928100586, "global_step": 138257, "epoch": 1665} {"train_loss": -22.990013122558594, "global_step": 138258, "epoch": 1665} {"train_loss": -23.20015525817871, "global_step": 138259, "epoch": 1665} {"train_loss": -22.661863327026367, "global_step": 138260, "epoch": 1665} {"train_loss": -22.856847763061523, "global_step": 138261, "epoch": 1665} {"train_loss": -23.244855880737305, "global_step": 138262, "epoch": 1665} {"train_loss": -23.17396354675293, "global_step": 138263, "epoch": 1665} {"train_loss": -23.139917373657227, "global_step": 138264, "epoch": 1665} {"train_loss": -23.201305389404297, "global_step": 138265, "epoch": 1665} {"train_loss": -22.929412841796875, "global_step": 138266, "epoch": 1665} {"train_loss": -22.44676971435547, "global_step": 138267, "epoch": 1665} {"train_loss": -22.844791412353516, "global_step": 138268, "epoch": 1665} {"train_loss": -22.77804946899414, "global_step": 138269, "epoch": 1665} {"train_loss": -23.226987838745117, "global_step": 138270, "epoch": 1665} {"train_loss": -23.0288143157959, "global_step": 138271, "epoch": 1665} {"train_loss": -22.7723388671875, "global_step": 138272, "epoch": 1665} {"train_loss": -23.484060287475586, "global_step": 138273, "epoch": 1665} {"train_loss": -23.031482696533203, "global_step": 138274, "epoch": 1665} {"train_loss": -23.123844146728516, "global_step": 138275, "epoch": 1665} {"train_loss": -23.19550132751465, "global_step": 138276, "epoch": 1665} {"train_loss": -22.91058584006436, "global_step": 138277, "epoch": 1665, "val_loss": 6326948.0} {"train_loss": -22.54520606994629, "global_step": 138278, "epoch": 1666} {"train_loss": -22.40159034729004, "global_step": 138279, "epoch": 1666} {"train_loss": -22.44226837158203, "global_step": 138280, "epoch": 1666} {"train_loss": -22.948789596557617, "global_step": 138281, "epoch": 1666} {"train_loss": -22.370777130126953, "global_step": 138282, "epoch": 1666} {"train_loss": -22.96120262145996, "global_step": 138283, "epoch": 1666} {"train_loss": -22.39406394958496, "global_step": 138284, "epoch": 1666} {"train_loss": -22.7885799407959, "global_step": 138285, "epoch": 1666} {"train_loss": -22.86341094970703, "global_step": 138286, "epoch": 1666} {"train_loss": -22.59218406677246, "global_step": 138287, "epoch": 1666} {"train_loss": -22.603689193725586, "global_step": 138288, "epoch": 1666} {"train_loss": -22.946401596069336, "global_step": 138289, "epoch": 1666} {"train_loss": -22.81122589111328, "global_step": 138290, "epoch": 1666} {"train_loss": -22.892898559570312, "global_step": 138291, "epoch": 1666} {"train_loss": -23.2017879486084, "global_step": 138292, "epoch": 1666} {"train_loss": -22.703962326049805, "global_step": 138293, "epoch": 1666} {"train_loss": -22.84773063659668, "global_step": 138294, "epoch": 1666} {"train_loss": -23.13176155090332, "global_step": 138295, "epoch": 1666} {"train_loss": -22.94647789001465, "global_step": 138296, "epoch": 1666} {"train_loss": -23.232067108154297, "global_step": 138297, "epoch": 1666} {"train_loss": -22.793603897094727, "global_step": 138298, "epoch": 1666} {"train_loss": -22.645034790039062, "global_step": 138299, "epoch": 1666} {"train_loss": -22.938764572143555, "global_step": 138300, "epoch": 1666} {"train_loss": -22.977750778198242, "global_step": 138301, "epoch": 1666} {"train_loss": -23.02077865600586, "global_step": 138302, "epoch": 1666} {"train_loss": -23.43381118774414, "global_step": 138303, "epoch": 1666} {"train_loss": -22.777992248535156, "global_step": 138304, "epoch": 1666} {"train_loss": -23.19085693359375, "global_step": 138305, "epoch": 1666} {"train_loss": -23.1835994720459, "global_step": 138306, "epoch": 1666} {"train_loss": -22.96630859375, "global_step": 138307, "epoch": 1666} {"train_loss": -22.831212997436523, "global_step": 138308, "epoch": 1666} {"train_loss": -23.107786178588867, "global_step": 138309, "epoch": 1666} {"train_loss": -22.978239059448242, "global_step": 138310, "epoch": 1666} {"train_loss": -22.897415161132812, "global_step": 138311, "epoch": 1666} {"train_loss": -22.93539810180664, "global_step": 138312, "epoch": 1666} {"train_loss": -22.77925682067871, "global_step": 138313, "epoch": 1666} {"train_loss": -22.917497634887695, "global_step": 138314, "epoch": 1666} {"train_loss": -23.341917037963867, "global_step": 138315, "epoch": 1666} {"train_loss": -22.944984436035156, "global_step": 138316, "epoch": 1666} {"train_loss": -23.06061363220215, "global_step": 138317, "epoch": 1666} {"train_loss": -22.799560546875, "global_step": 138318, "epoch": 1666} {"train_loss": -23.055814743041992, "global_step": 138319, "epoch": 1666} {"train_loss": -22.941640853881836, "global_step": 138320, "epoch": 1666} {"train_loss": -22.52252197265625, "global_step": 138321, "epoch": 1666} {"train_loss": -22.745452880859375, "global_step": 138322, "epoch": 1666} {"train_loss": -23.132421493530273, "global_step": 138323, "epoch": 1666} {"train_loss": -22.986921310424805, "global_step": 138324, "epoch": 1666} {"train_loss": -23.300704956054688, "global_step": 138325, "epoch": 1666} {"train_loss": -22.465595245361328, "global_step": 138326, "epoch": 1666} {"train_loss": -23.32561683654785, "global_step": 138327, "epoch": 1666} {"train_loss": -22.997936248779297, "global_step": 138328, "epoch": 1666} {"train_loss": -23.040876388549805, "global_step": 138329, "epoch": 1666} {"train_loss": -23.240774154663086, "global_step": 138330, "epoch": 1666} {"train_loss": -23.017805099487305, "global_step": 138331, "epoch": 1666} {"train_loss": -23.06757164001465, "global_step": 138332, "epoch": 1666} {"train_loss": -23.428152084350586, "global_step": 138333, "epoch": 1666} {"train_loss": -23.021228790283203, "global_step": 138334, "epoch": 1666} {"train_loss": -22.863096237182617, "global_step": 138335, "epoch": 1666} {"train_loss": -22.924087524414062, "global_step": 138336, "epoch": 1666} {"train_loss": -23.44841957092285, "global_step": 138337, "epoch": 1666} {"train_loss": -22.96723747253418, "global_step": 138338, "epoch": 1666} {"train_loss": -22.74074363708496, "global_step": 138339, "epoch": 1666} {"train_loss": -22.99049186706543, "global_step": 138340, "epoch": 1666} {"train_loss": -23.07630157470703, "global_step": 138341, "epoch": 1666} {"train_loss": -23.176321029663086, "global_step": 138342, "epoch": 1666} {"train_loss": -23.0480899810791, "global_step": 138343, "epoch": 1666} {"train_loss": -23.290815353393555, "global_step": 138344, "epoch": 1666} {"train_loss": -22.879318237304688, "global_step": 138345, "epoch": 1666} {"train_loss": -22.901615142822266, "global_step": 138346, "epoch": 1666} {"train_loss": -23.141645431518555, "global_step": 138347, "epoch": 1666} {"train_loss": -22.964481353759766, "global_step": 138348, "epoch": 1666} {"train_loss": -23.09174156188965, "global_step": 138349, "epoch": 1666} {"train_loss": -23.12453269958496, "global_step": 138350, "epoch": 1666} {"train_loss": -22.850696563720703, "global_step": 138351, "epoch": 1666} {"train_loss": -22.9460391998291, "global_step": 138352, "epoch": 1666} {"train_loss": -23.098617553710938, "global_step": 138353, "epoch": 1666} {"train_loss": -23.22405433654785, "global_step": 138354, "epoch": 1666} {"train_loss": -22.94598960876465, "global_step": 138355, "epoch": 1666} {"train_loss": -22.643707275390625, "global_step": 138356, "epoch": 1666} {"train_loss": -22.694448471069336, "global_step": 138357, "epoch": 1666} {"train_loss": -22.791584014892578, "global_step": 138358, "epoch": 1666} {"train_loss": -22.758808135986328, "global_step": 138359, "epoch": 1666} {"train_loss": -22.939601921173463, "global_step": 138360, "epoch": 1666, "val_loss": 6358164.0} {"train_loss": -22.000547409057617, "global_step": 138361, "epoch": 1667} {"train_loss": -22.613235473632812, "global_step": 138362, "epoch": 1667} {"train_loss": -22.684293746948242, "global_step": 138363, "epoch": 1667} {"train_loss": -22.83737564086914, "global_step": 138364, "epoch": 1667} {"train_loss": -22.143030166625977, "global_step": 138365, "epoch": 1667} {"train_loss": -22.63336753845215, "global_step": 138366, "epoch": 1667} {"train_loss": -22.460004806518555, "global_step": 138367, "epoch": 1667} {"train_loss": -22.330129623413086, "global_step": 138368, "epoch": 1667} {"train_loss": -22.793455123901367, "global_step": 138369, "epoch": 1667} {"train_loss": -22.6202449798584, "global_step": 138370, "epoch": 1667} {"train_loss": -22.82293701171875, "global_step": 138371, "epoch": 1667} {"train_loss": -22.529569625854492, "global_step": 138372, "epoch": 1667} {"train_loss": -22.95339012145996, "global_step": 138373, "epoch": 1667} {"train_loss": -23.050901412963867, "global_step": 138374, "epoch": 1667} {"train_loss": -22.781049728393555, "global_step": 138375, "epoch": 1667} {"train_loss": -22.85210609436035, "global_step": 138376, "epoch": 1667} {"train_loss": -22.912185668945312, "global_step": 138377, "epoch": 1667} {"train_loss": -22.97370719909668, "global_step": 138378, "epoch": 1667} {"train_loss": -23.281156539916992, "global_step": 138379, "epoch": 1667} {"train_loss": -23.059059143066406, "global_step": 138380, "epoch": 1667} {"train_loss": -23.425657272338867, "global_step": 138381, "epoch": 1667} {"train_loss": -23.033306121826172, "global_step": 138382, "epoch": 1667} {"train_loss": -23.214574813842773, "global_step": 138383, "epoch": 1667} {"train_loss": -23.30183219909668, "global_step": 138384, "epoch": 1667} {"train_loss": -23.0640869140625, "global_step": 138385, "epoch": 1667} {"train_loss": -22.758203506469727, "global_step": 138386, "epoch": 1667} {"train_loss": -23.55641746520996, "global_step": 138387, "epoch": 1667} {"train_loss": -23.193675994873047, "global_step": 138388, "epoch": 1667} {"train_loss": -23.103986740112305, "global_step": 138389, "epoch": 1667} {"train_loss": -23.198787689208984, "global_step": 138390, "epoch": 1667} {"train_loss": -22.989660263061523, "global_step": 138391, "epoch": 1667} {"train_loss": -22.8720760345459, "global_step": 138392, "epoch": 1667} {"train_loss": -23.469045639038086, "global_step": 138393, "epoch": 1667} {"train_loss": -23.283353805541992, "global_step": 138394, "epoch": 1667} {"train_loss": -23.0288143157959, "global_step": 138395, "epoch": 1667} {"train_loss": -23.219120025634766, "global_step": 138396, "epoch": 1667} {"train_loss": -22.838970184326172, "global_step": 138397, "epoch": 1667} {"train_loss": -23.172239303588867, "global_step": 138398, "epoch": 1667} {"train_loss": -23.059240341186523, "global_step": 138399, "epoch": 1667} {"train_loss": -23.137592315673828, "global_step": 138400, "epoch": 1667} {"train_loss": -23.249740600585938, "global_step": 138401, "epoch": 1667} {"train_loss": -22.972471237182617, "global_step": 138402, "epoch": 1667} {"train_loss": -22.996829986572266, "global_step": 138403, "epoch": 1667} {"train_loss": -23.199487686157227, "global_step": 138404, "epoch": 1667} {"train_loss": -22.962390899658203, "global_step": 138405, "epoch": 1667} {"train_loss": -23.055368423461914, "global_step": 138406, "epoch": 1667} {"train_loss": -23.080881118774414, "global_step": 138407, "epoch": 1667} {"train_loss": -23.129474639892578, "global_step": 138408, "epoch": 1667} {"train_loss": -22.8564510345459, "global_step": 138409, "epoch": 1667} {"train_loss": -22.993671417236328, "global_step": 138410, "epoch": 1667} {"train_loss": -23.056055068969727, "global_step": 138411, "epoch": 1667} {"train_loss": -23.15131950378418, "global_step": 138412, "epoch": 1667} {"train_loss": -22.6580867767334, "global_step": 138413, "epoch": 1667} {"train_loss": -22.801990509033203, "global_step": 138414, "epoch": 1667} {"train_loss": -22.949487686157227, "global_step": 138415, "epoch": 1667} {"train_loss": -22.781713485717773, "global_step": 138416, "epoch": 1667} {"train_loss": -22.660947799682617, "global_step": 138417, "epoch": 1667} {"train_loss": -23.198442459106445, "global_step": 138418, "epoch": 1667} {"train_loss": -23.140148162841797, "global_step": 138419, "epoch": 1667} {"train_loss": -22.609678268432617, "global_step": 138420, "epoch": 1667} {"train_loss": -22.67072868347168, "global_step": 138421, "epoch": 1667} {"train_loss": -23.34758949279785, "global_step": 138422, "epoch": 1667} {"train_loss": -23.06435203552246, "global_step": 138423, "epoch": 1667} {"train_loss": -22.87679100036621, "global_step": 138424, "epoch": 1667} {"train_loss": -22.693042755126953, "global_step": 138425, "epoch": 1667} {"train_loss": -23.52374267578125, "global_step": 138426, "epoch": 1667} {"train_loss": -23.18251609802246, "global_step": 138427, "epoch": 1667} {"train_loss": -22.950698852539062, "global_step": 138428, "epoch": 1667} {"train_loss": -23.277923583984375, "global_step": 138429, "epoch": 1667} {"train_loss": -22.98663902282715, "global_step": 138430, "epoch": 1667} {"train_loss": -23.375934600830078, "global_step": 138431, "epoch": 1667} {"train_loss": -23.17544937133789, "global_step": 138432, "epoch": 1667} {"train_loss": -22.71319007873535, "global_step": 138433, "epoch": 1667} {"train_loss": -22.927913665771484, "global_step": 138434, "epoch": 1667} {"train_loss": -23.421375274658203, "global_step": 138435, "epoch": 1667} {"train_loss": -23.26300621032715, "global_step": 138436, "epoch": 1667} {"train_loss": -23.28213882446289, "global_step": 138437, "epoch": 1667} {"train_loss": -23.19820213317871, "global_step": 138438, "epoch": 1667} {"train_loss": -23.028501510620117, "global_step": 138439, "epoch": 1667} {"train_loss": -22.92745018005371, "global_step": 138440, "epoch": 1667} {"train_loss": -22.927200317382812, "global_step": 138441, "epoch": 1667} {"train_loss": -23.299373626708984, "global_step": 138442, "epoch": 1667} {"train_loss": -22.99274639910962, "global_step": 138443, "epoch": 1667, "val_loss": 6313798.0} {"train_loss": -22.667922973632812, "global_step": 138444, "epoch": 1668} {"train_loss": -21.742643356323242, "global_step": 138445, "epoch": 1668} {"train_loss": -21.754667282104492, "global_step": 138446, "epoch": 1668} {"train_loss": -22.432065963745117, "global_step": 138447, "epoch": 1668} {"train_loss": -22.6377010345459, "global_step": 138448, "epoch": 1668} {"train_loss": -21.792957305908203, "global_step": 138449, "epoch": 1668} {"train_loss": -22.558500289916992, "global_step": 138450, "epoch": 1668} {"train_loss": -22.350706100463867, "global_step": 138451, "epoch": 1668} {"train_loss": -22.5306453704834, "global_step": 138452, "epoch": 1668} {"train_loss": -22.881271362304688, "global_step": 138453, "epoch": 1668} {"train_loss": -22.347015380859375, "global_step": 138454, "epoch": 1668} {"train_loss": -22.473417282104492, "global_step": 138455, "epoch": 1668} {"train_loss": -22.58439064025879, "global_step": 138456, "epoch": 1668} {"train_loss": -22.576345443725586, "global_step": 138457, "epoch": 1668} {"train_loss": -22.7072696685791, "global_step": 138458, "epoch": 1668} {"train_loss": -22.489545822143555, "global_step": 138459, "epoch": 1668} {"train_loss": -22.337627410888672, "global_step": 138460, "epoch": 1668} {"train_loss": -22.5091552734375, "global_step": 138461, "epoch": 1668} {"train_loss": -23.06129264831543, "global_step": 138462, "epoch": 1668} {"train_loss": -22.90935707092285, "global_step": 138463, "epoch": 1668} {"train_loss": -22.666223526000977, "global_step": 138464, "epoch": 1668} {"train_loss": -22.84383201599121, "global_step": 138465, "epoch": 1668} {"train_loss": -22.640195846557617, "global_step": 138466, "epoch": 1668} {"train_loss": -22.563472747802734, "global_step": 138467, "epoch": 1668} {"train_loss": -22.884687423706055, "global_step": 138468, "epoch": 1668} {"train_loss": -23.183170318603516, "global_step": 138469, "epoch": 1668} {"train_loss": -23.056013107299805, "global_step": 138470, "epoch": 1668} {"train_loss": -23.206884384155273, "global_step": 138471, "epoch": 1668} {"train_loss": -23.03162956237793, "global_step": 138472, "epoch": 1668} {"train_loss": -22.97162628173828, "global_step": 138473, "epoch": 1668} {"train_loss": -22.79143524169922, "global_step": 138474, "epoch": 1668} {"train_loss": -23.07037925720215, "global_step": 138475, "epoch": 1668} {"train_loss": -23.285131454467773, "global_step": 138476, "epoch": 1668} {"train_loss": -23.0305233001709, "global_step": 138477, "epoch": 1668} {"train_loss": -22.983600616455078, "global_step": 138478, "epoch": 1668} {"train_loss": -23.081026077270508, "global_step": 138479, "epoch": 1668} {"train_loss": -23.20192527770996, "global_step": 138480, "epoch": 1668} {"train_loss": -23.04359245300293, "global_step": 138481, "epoch": 1668} {"train_loss": -22.974323272705078, "global_step": 138482, "epoch": 1668} {"train_loss": -22.884918212890625, "global_step": 138483, "epoch": 1668} {"train_loss": -23.11147117614746, "global_step": 138484, "epoch": 1668} {"train_loss": -23.404748916625977, "global_step": 138485, "epoch": 1668} {"train_loss": -23.112607955932617, "global_step": 138486, "epoch": 1668} {"train_loss": -23.259010314941406, "global_step": 138487, "epoch": 1668} {"train_loss": -22.909423828125, "global_step": 138488, "epoch": 1668} {"train_loss": -23.273283004760742, "global_step": 138489, "epoch": 1668} {"train_loss": -22.703420639038086, "global_step": 138490, "epoch": 1668} {"train_loss": -22.912982940673828, "global_step": 138491, "epoch": 1668} {"train_loss": -22.743070602416992, "global_step": 138492, "epoch": 1668} {"train_loss": -22.492929458618164, "global_step": 138493, "epoch": 1668} {"train_loss": -23.0481014251709, "global_step": 138494, "epoch": 1668} {"train_loss": -23.017169952392578, "global_step": 138495, "epoch": 1668} {"train_loss": -22.545358657836914, "global_step": 138496, "epoch": 1668} {"train_loss": -22.599843978881836, "global_step": 138497, "epoch": 1668} {"train_loss": -23.17818260192871, "global_step": 138498, "epoch": 1668} {"train_loss": -22.733280181884766, "global_step": 138499, "epoch": 1668} {"train_loss": -22.68338966369629, "global_step": 138500, "epoch": 1668} {"train_loss": -22.597965240478516, "global_step": 138501, "epoch": 1668} {"train_loss": -22.986738204956055, "global_step": 138502, "epoch": 1668} {"train_loss": -22.89179039001465, "global_step": 138503, "epoch": 1668} {"train_loss": -22.8742618560791, "global_step": 138504, "epoch": 1668} {"train_loss": -22.783296585083008, "global_step": 138505, "epoch": 1668} {"train_loss": -23.0909366607666, "global_step": 138506, "epoch": 1668} {"train_loss": -22.782611846923828, "global_step": 138507, "epoch": 1668} {"train_loss": -23.077045440673828, "global_step": 138508, "epoch": 1668} {"train_loss": -23.114940643310547, "global_step": 138509, "epoch": 1668} {"train_loss": -22.909948348999023, "global_step": 138510, "epoch": 1668} {"train_loss": -22.966236114501953, "global_step": 138511, "epoch": 1668} {"train_loss": -22.71747398376465, "global_step": 138512, "epoch": 1668} {"train_loss": -23.37083625793457, "global_step": 138513, "epoch": 1668} {"train_loss": -23.192508697509766, "global_step": 138514, "epoch": 1668} {"train_loss": -23.092594146728516, "global_step": 138515, "epoch": 1668} {"train_loss": -23.059829711914062, "global_step": 138516, "epoch": 1668} {"train_loss": -23.2522029876709, "global_step": 138517, "epoch": 1668} {"train_loss": -22.789600372314453, "global_step": 138518, "epoch": 1668} {"train_loss": -22.968294143676758, "global_step": 138519, "epoch": 1668} {"train_loss": -23.08991050720215, "global_step": 138520, "epoch": 1668} {"train_loss": -23.185800552368164, "global_step": 138521, "epoch": 1668} {"train_loss": -22.977476119995117, "global_step": 138522, "epoch": 1668} {"train_loss": -23.126081466674805, "global_step": 138523, "epoch": 1668} {"train_loss": -23.146703720092773, "global_step": 138524, "epoch": 1668} {"train_loss": -23.11414909362793, "global_step": 138525, "epoch": 1668} {"train_loss": -22.865384549979705, "global_step": 138526, "epoch": 1668, "val_loss": 6386272.0} {"train_loss": -22.263925552368164, "global_step": 138527, "epoch": 1669} {"train_loss": -21.393375396728516, "global_step": 138528, "epoch": 1669} {"train_loss": -21.288511276245117, "global_step": 138529, "epoch": 1669} {"train_loss": -22.463022232055664, "global_step": 138530, "epoch": 1669} {"train_loss": -22.26521110534668, "global_step": 138531, "epoch": 1669} {"train_loss": -22.257932662963867, "global_step": 138532, "epoch": 1669} {"train_loss": -22.485624313354492, "global_step": 138533, "epoch": 1669} {"train_loss": -22.266202926635742, "global_step": 138534, "epoch": 1669} {"train_loss": -22.279525756835938, "global_step": 138535, "epoch": 1669} {"train_loss": -22.371183395385742, "global_step": 138536, "epoch": 1669} {"train_loss": -22.72426414489746, "global_step": 138537, "epoch": 1669} {"train_loss": -22.61000633239746, "global_step": 138538, "epoch": 1669} {"train_loss": -22.69818115234375, "global_step": 138539, "epoch": 1669} {"train_loss": -22.306867599487305, "global_step": 138540, "epoch": 1669} {"train_loss": -22.81622886657715, "global_step": 138541, "epoch": 1669} {"train_loss": -22.8704833984375, "global_step": 138542, "epoch": 1669} {"train_loss": -22.485227584838867, "global_step": 138543, "epoch": 1669} {"train_loss": -22.775577545166016, "global_step": 138544, "epoch": 1669} {"train_loss": -22.77627944946289, "global_step": 138545, "epoch": 1669} {"train_loss": -23.038223266601562, "global_step": 138546, "epoch": 1669} {"train_loss": -22.58782196044922, "global_step": 138547, "epoch": 1669} {"train_loss": -23.294034957885742, "global_step": 138548, "epoch": 1669} {"train_loss": -23.009061813354492, "global_step": 138549, "epoch": 1669} {"train_loss": -22.877248764038086, "global_step": 138550, "epoch": 1669} {"train_loss": -23.285308837890625, "global_step": 138551, "epoch": 1669} {"train_loss": -23.091867446899414, "global_step": 138552, "epoch": 1669} {"train_loss": -22.807035446166992, "global_step": 138553, "epoch": 1669} {"train_loss": -22.694860458374023, "global_step": 138554, "epoch": 1669} {"train_loss": -23.310354232788086, "global_step": 138555, "epoch": 1669} {"train_loss": -22.92009735107422, "global_step": 138556, "epoch": 1669} {"train_loss": -22.591720581054688, "global_step": 138557, "epoch": 1669} {"train_loss": -22.842849731445312, "global_step": 138558, "epoch": 1669} {"train_loss": -23.025800704956055, "global_step": 138559, "epoch": 1669} {"train_loss": -23.363605499267578, "global_step": 138560, "epoch": 1669} {"train_loss": -23.489166259765625, "global_step": 138561, "epoch": 1669} {"train_loss": -22.934240341186523, "global_step": 138562, "epoch": 1669} {"train_loss": -22.84786605834961, "global_step": 138563, "epoch": 1669} {"train_loss": -23.197134017944336, "global_step": 138564, "epoch": 1669} {"train_loss": -23.16086769104004, "global_step": 138565, "epoch": 1669} {"train_loss": -22.458017349243164, "global_step": 138566, "epoch": 1669} {"train_loss": -22.801639556884766, "global_step": 138567, "epoch": 1669} {"train_loss": -22.818296432495117, "global_step": 138568, "epoch": 1669} {"train_loss": -23.126752853393555, "global_step": 138569, "epoch": 1669} {"train_loss": -22.55396842956543, "global_step": 138570, "epoch": 1669} {"train_loss": -22.847553253173828, "global_step": 138571, "epoch": 1669} {"train_loss": -23.420799255371094, "global_step": 138572, "epoch": 1669} {"train_loss": -22.848684310913086, "global_step": 138573, "epoch": 1669} {"train_loss": -22.924911499023438, "global_step": 138574, "epoch": 1669} {"train_loss": -22.93874740600586, "global_step": 138575, "epoch": 1669} {"train_loss": -22.652891159057617, "global_step": 138576, "epoch": 1669} {"train_loss": -22.9505672454834, "global_step": 138577, "epoch": 1669} {"train_loss": -22.582792282104492, "global_step": 138578, "epoch": 1669} {"train_loss": -22.66072654724121, "global_step": 138579, "epoch": 1669} {"train_loss": -22.774757385253906, "global_step": 138580, "epoch": 1669} {"train_loss": -22.942127227783203, "global_step": 138581, "epoch": 1669} {"train_loss": -22.828855514526367, "global_step": 138582, "epoch": 1669} {"train_loss": -22.91485023498535, "global_step": 138583, "epoch": 1669} {"train_loss": -23.64008903503418, "global_step": 138584, "epoch": 1669} {"train_loss": -22.924875259399414, "global_step": 138585, "epoch": 1669} {"train_loss": -23.192472457885742, "global_step": 138586, "epoch": 1669} {"train_loss": -22.88541030883789, "global_step": 138587, "epoch": 1669} {"train_loss": -22.896177291870117, "global_step": 138588, "epoch": 1669} {"train_loss": -23.099166870117188, "global_step": 138589, "epoch": 1669} {"train_loss": -22.661100387573242, "global_step": 138590, "epoch": 1669} {"train_loss": -22.843717575073242, "global_step": 138591, "epoch": 1669} {"train_loss": -23.332822799682617, "global_step": 138592, "epoch": 1669} {"train_loss": -22.899250030517578, "global_step": 138593, "epoch": 1669} {"train_loss": -22.90921401977539, "global_step": 138594, "epoch": 1669} {"train_loss": -23.02703285217285, "global_step": 138595, "epoch": 1669} {"train_loss": -23.372730255126953, "global_step": 138596, "epoch": 1669} {"train_loss": -22.965862274169922, "global_step": 138597, "epoch": 1669} {"train_loss": -22.987136840820312, "global_step": 138598, "epoch": 1669} {"train_loss": -23.061006546020508, "global_step": 138599, "epoch": 1669} {"train_loss": -23.175411224365234, "global_step": 138600, "epoch": 1669} {"train_loss": -23.044105529785156, "global_step": 138601, "epoch": 1669} {"train_loss": -23.25119972229004, "global_step": 138602, "epoch": 1669} {"train_loss": -23.186918258666992, "global_step": 138603, "epoch": 1669} {"train_loss": -23.277572631835938, "global_step": 138604, "epoch": 1669} {"train_loss": -23.16875648498535, "global_step": 138605, "epoch": 1669} {"train_loss": -23.214847564697266, "global_step": 138606, "epoch": 1669} {"train_loss": -23.283395767211914, "global_step": 138607, "epoch": 1669} {"train_loss": -23.1467342376709, "global_step": 138608, "epoch": 1669} {"train_loss": -22.86967160328325, "global_step": 138609, "epoch": 1669, "val_loss": 6245765.0} {"train_loss": -22.94708251953125, "global_step": 138610, "epoch": 1670} {"train_loss": -22.820188522338867, "global_step": 138611, "epoch": 1670} {"train_loss": -22.827701568603516, "global_step": 138612, "epoch": 1670} {"train_loss": -23.07427978515625, "global_step": 138613, "epoch": 1670} {"train_loss": -23.023433685302734, "global_step": 138614, "epoch": 1670} {"train_loss": -23.087858200073242, "global_step": 138615, "epoch": 1670} {"train_loss": -22.65964698791504, "global_step": 138616, "epoch": 1670} {"train_loss": -23.035444259643555, "global_step": 138617, "epoch": 1670} {"train_loss": -22.77911376953125, "global_step": 138618, "epoch": 1670} {"train_loss": -22.504085540771484, "global_step": 138619, "epoch": 1670} {"train_loss": -23.26124382019043, "global_step": 138620, "epoch": 1670} {"train_loss": -22.845657348632812, "global_step": 138621, "epoch": 1670} {"train_loss": -22.777507781982422, "global_step": 138622, "epoch": 1670} {"train_loss": -22.916723251342773, "global_step": 138623, "epoch": 1670} {"train_loss": -23.309123992919922, "global_step": 138624, "epoch": 1670} {"train_loss": -22.885168075561523, "global_step": 138625, "epoch": 1670} {"train_loss": -22.912378311157227, "global_step": 138626, "epoch": 1670} {"train_loss": -22.81960105895996, "global_step": 138627, "epoch": 1670} {"train_loss": -23.264081954956055, "global_step": 138628, "epoch": 1670} {"train_loss": -23.387853622436523, "global_step": 138629, "epoch": 1670} {"train_loss": -22.693984985351562, "global_step": 138630, "epoch": 1670} {"train_loss": -23.045310974121094, "global_step": 138631, "epoch": 1670} {"train_loss": -23.194435119628906, "global_step": 138632, "epoch": 1670} {"train_loss": -23.459156036376953, "global_step": 138633, "epoch": 1670} {"train_loss": -23.226835250854492, "global_step": 138634, "epoch": 1670} {"train_loss": -22.81178855895996, "global_step": 138635, "epoch": 1670} {"train_loss": -23.123004913330078, "global_step": 138636, "epoch": 1670} {"train_loss": -23.094257354736328, "global_step": 138637, "epoch": 1670} {"train_loss": -23.178388595581055, "global_step": 138638, "epoch": 1670} {"train_loss": -22.520793914794922, "global_step": 138639, "epoch": 1670} {"train_loss": -23.015926361083984, "global_step": 138640, "epoch": 1670} {"train_loss": -23.17051124572754, "global_step": 138641, "epoch": 1670} {"train_loss": -23.053131103515625, "global_step": 138642, "epoch": 1670} {"train_loss": -23.139236450195312, "global_step": 138643, "epoch": 1670} {"train_loss": -22.850372314453125, "global_step": 138644, "epoch": 1670} {"train_loss": -23.12458610534668, "global_step": 138645, "epoch": 1670} {"train_loss": -22.956344604492188, "global_step": 138646, "epoch": 1670} {"train_loss": -23.086027145385742, "global_step": 138647, "epoch": 1670} {"train_loss": -23.204233169555664, "global_step": 138648, "epoch": 1670} {"train_loss": -23.3831787109375, "global_step": 138649, "epoch": 1670} {"train_loss": -22.877811431884766, "global_step": 138650, "epoch": 1670} {"train_loss": -23.292692184448242, "global_step": 138651, "epoch": 1670} {"train_loss": -22.984006881713867, "global_step": 138652, "epoch": 1670} {"train_loss": -22.921367645263672, "global_step": 138653, "epoch": 1670} {"train_loss": -22.912694931030273, "global_step": 138654, "epoch": 1670} {"train_loss": -23.500089645385742, "global_step": 138655, "epoch": 1670} {"train_loss": -23.269105911254883, "global_step": 138656, "epoch": 1670} {"train_loss": -23.28567123413086, "global_step": 138657, "epoch": 1670} {"train_loss": -23.318069458007812, "global_step": 138658, "epoch": 1670} {"train_loss": -23.056110382080078, "global_step": 138659, "epoch": 1670} {"train_loss": -22.785099029541016, "global_step": 138660, "epoch": 1670} {"train_loss": -23.014738082885742, "global_step": 138661, "epoch": 1670} {"train_loss": -23.191497802734375, "global_step": 138662, "epoch": 1670} {"train_loss": -22.644681930541992, "global_step": 138663, "epoch": 1670} {"train_loss": -22.956281661987305, "global_step": 138664, "epoch": 1670} {"train_loss": -23.12890625, "global_step": 138665, "epoch": 1670} {"train_loss": -22.83345603942871, "global_step": 138666, "epoch": 1670} {"train_loss": -22.913894653320312, "global_step": 138667, "epoch": 1670} {"train_loss": -22.678190231323242, "global_step": 138668, "epoch": 1670} {"train_loss": -23.1114559173584, "global_step": 138669, "epoch": 1670} {"train_loss": -22.630599975585938, "global_step": 138670, "epoch": 1670} {"train_loss": -23.49824333190918, "global_step": 138671, "epoch": 1670} {"train_loss": -23.095706939697266, "global_step": 138672, "epoch": 1670} {"train_loss": -23.017845153808594, "global_step": 138673, "epoch": 1670} {"train_loss": -22.94841766357422, "global_step": 138674, "epoch": 1670} {"train_loss": -23.039304733276367, "global_step": 138675, "epoch": 1670} {"train_loss": -23.230817794799805, "global_step": 138676, "epoch": 1670} {"train_loss": -23.068452835083008, "global_step": 138677, "epoch": 1670} {"train_loss": -23.124670028686523, "global_step": 138678, "epoch": 1670} {"train_loss": -23.039411544799805, "global_step": 138679, "epoch": 1670} {"train_loss": -22.815946578979492, "global_step": 138680, "epoch": 1670} {"train_loss": -22.679731369018555, "global_step": 138681, "epoch": 1670} {"train_loss": -22.604333877563477, "global_step": 138682, "epoch": 1670} {"train_loss": -22.88360595703125, "global_step": 138683, "epoch": 1670} {"train_loss": -23.142784118652344, "global_step": 138684, "epoch": 1670} {"train_loss": -22.916959762573242, "global_step": 138685, "epoch": 1670} {"train_loss": -23.009944915771484, "global_step": 138686, "epoch": 1670} {"train_loss": -22.565258026123047, "global_step": 138687, "epoch": 1670} {"train_loss": -23.229467391967773, "global_step": 138688, "epoch": 1670} {"train_loss": -22.936140060424805, "global_step": 138689, "epoch": 1670} {"train_loss": -23.044065475463867, "global_step": 138690, "epoch": 1670} {"train_loss": -23.28374671936035, "global_step": 138691, "epoch": 1670} {"train_loss": -23.02675833185035, "global_step": 138692, "epoch": 1670, "val_loss": 6300461.0} {"train_loss": -22.561222076416016, "global_step": 138693, "epoch": 1671} {"train_loss": -22.91347312927246, "global_step": 138694, "epoch": 1671} {"train_loss": -22.72846794128418, "global_step": 138695, "epoch": 1671} {"train_loss": -22.897680282592773, "global_step": 138696, "epoch": 1671} {"train_loss": -22.942861557006836, "global_step": 138697, "epoch": 1671} {"train_loss": -23.12700080871582, "global_step": 138698, "epoch": 1671} {"train_loss": -23.13607406616211, "global_step": 138699, "epoch": 1671} {"train_loss": -22.995271682739258, "global_step": 138700, "epoch": 1671} {"train_loss": -23.241252899169922, "global_step": 138701, "epoch": 1671} {"train_loss": -22.63112449645996, "global_step": 138702, "epoch": 1671} {"train_loss": -23.194875717163086, "global_step": 138703, "epoch": 1671} {"train_loss": -23.021106719970703, "global_step": 138704, "epoch": 1671} {"train_loss": -23.10288429260254, "global_step": 138705, "epoch": 1671} {"train_loss": -22.932065963745117, "global_step": 138706, "epoch": 1671} {"train_loss": -23.026891708374023, "global_step": 138707, "epoch": 1671} {"train_loss": -23.01618003845215, "global_step": 138708, "epoch": 1671} {"train_loss": -23.002439498901367, "global_step": 138709, "epoch": 1671} {"train_loss": -22.97397232055664, "global_step": 138710, "epoch": 1671} {"train_loss": -23.033262252807617, "global_step": 138711, "epoch": 1671} {"train_loss": -23.11077308654785, "global_step": 138712, "epoch": 1671} {"train_loss": -22.604114532470703, "global_step": 138713, "epoch": 1671} {"train_loss": -23.04343605041504, "global_step": 138714, "epoch": 1671} {"train_loss": -22.529006958007812, "global_step": 138715, "epoch": 1671} {"train_loss": -23.37986183166504, "global_step": 138716, "epoch": 1671} {"train_loss": -22.795202255249023, "global_step": 138717, "epoch": 1671} {"train_loss": -23.215377807617188, "global_step": 138718, "epoch": 1671} {"train_loss": -23.106201171875, "global_step": 138719, "epoch": 1671} {"train_loss": -23.034347534179688, "global_step": 138720, "epoch": 1671} {"train_loss": -22.63652801513672, "global_step": 138721, "epoch": 1671} {"train_loss": -22.50229263305664, "global_step": 138722, "epoch": 1671} {"train_loss": -22.85759925842285, "global_step": 138723, "epoch": 1671} {"train_loss": -23.137537002563477, "global_step": 138724, "epoch": 1671} {"train_loss": -22.709583282470703, "global_step": 138725, "epoch": 1671} {"train_loss": -22.989591598510742, "global_step": 138726, "epoch": 1671} {"train_loss": -23.150217056274414, "global_step": 138727, "epoch": 1671} {"train_loss": -23.340866088867188, "global_step": 138728, "epoch": 1671} {"train_loss": -23.166030883789062, "global_step": 138729, "epoch": 1671} {"train_loss": -22.954038619995117, "global_step": 138730, "epoch": 1671} {"train_loss": -23.089780807495117, "global_step": 138731, "epoch": 1671} {"train_loss": -23.478260040283203, "global_step": 138732, "epoch": 1671} {"train_loss": -23.128070831298828, "global_step": 138733, "epoch": 1671} {"train_loss": -23.122594833374023, "global_step": 138734, "epoch": 1671} {"train_loss": -23.01700782775879, "global_step": 138735, "epoch": 1671} {"train_loss": -23.182022094726562, "global_step": 138736, "epoch": 1671} {"train_loss": -22.779142379760742, "global_step": 138737, "epoch": 1671} {"train_loss": -23.16818618774414, "global_step": 138738, "epoch": 1671} {"train_loss": -23.298507690429688, "global_step": 138739, "epoch": 1671} {"train_loss": -22.891584396362305, "global_step": 138740, "epoch": 1671} {"train_loss": -22.97064781188965, "global_step": 138741, "epoch": 1671} {"train_loss": -22.846715927124023, "global_step": 138742, "epoch": 1671} {"train_loss": -23.288829803466797, "global_step": 138743, "epoch": 1671} {"train_loss": -22.847923278808594, "global_step": 138744, "epoch": 1671} {"train_loss": -23.03701400756836, "global_step": 138745, "epoch": 1671} {"train_loss": -22.924421310424805, "global_step": 138746, "epoch": 1671} {"train_loss": -23.043542861938477, "global_step": 138747, "epoch": 1671} {"train_loss": -23.109189987182617, "global_step": 138748, "epoch": 1671} {"train_loss": -22.84556007385254, "global_step": 138749, "epoch": 1671} {"train_loss": -22.634033203125, "global_step": 138750, "epoch": 1671} {"train_loss": -23.360483169555664, "global_step": 138751, "epoch": 1671} {"train_loss": -22.934999465942383, "global_step": 138752, "epoch": 1671} {"train_loss": -23.11179542541504, "global_step": 138753, "epoch": 1671} {"train_loss": -23.175586700439453, "global_step": 138754, "epoch": 1671} {"train_loss": -22.948104858398438, "global_step": 138755, "epoch": 1671} {"train_loss": -22.70625877380371, "global_step": 138756, "epoch": 1671} {"train_loss": -23.171279907226562, "global_step": 138757, "epoch": 1671} {"train_loss": -23.04654884338379, "global_step": 138758, "epoch": 1671} {"train_loss": -22.898067474365234, "global_step": 138759, "epoch": 1671} {"train_loss": -22.710784912109375, "global_step": 138760, "epoch": 1671} {"train_loss": -23.020647048950195, "global_step": 138761, "epoch": 1671} {"train_loss": -22.562808990478516, "global_step": 138762, "epoch": 1671} {"train_loss": -23.054834365844727, "global_step": 138763, "epoch": 1671} {"train_loss": -23.1308536529541, "global_step": 138764, "epoch": 1671} {"train_loss": -22.838321685791016, "global_step": 138765, "epoch": 1671} {"train_loss": -23.121559143066406, "global_step": 138766, "epoch": 1671} {"train_loss": -23.185516357421875, "global_step": 138767, "epoch": 1671} {"train_loss": -22.904157638549805, "global_step": 138768, "epoch": 1671} {"train_loss": -22.71407127380371, "global_step": 138769, "epoch": 1671} {"train_loss": -22.829587936401367, "global_step": 138770, "epoch": 1671} {"train_loss": -22.674585342407227, "global_step": 138771, "epoch": 1671} {"train_loss": -23.006553649902344, "global_step": 138772, "epoch": 1671} {"train_loss": -23.01202964782715, "global_step": 138773, "epoch": 1671} {"train_loss": -22.852209091186523, "global_step": 138774, "epoch": 1671} {"train_loss": -22.9556724134698, "global_step": 138775, "epoch": 1671, "val_loss": 6308651.0} {"train_loss": -22.6822566986084, "global_step": 138776, "epoch": 1672} {"train_loss": -21.782453536987305, "global_step": 138777, "epoch": 1672} {"train_loss": -22.336572647094727, "global_step": 138778, "epoch": 1672} {"train_loss": -22.38382339477539, "global_step": 138779, "epoch": 1672} {"train_loss": -22.036596298217773, "global_step": 138780, "epoch": 1672} {"train_loss": -22.445518493652344, "global_step": 138781, "epoch": 1672} {"train_loss": -22.246007919311523, "global_step": 138782, "epoch": 1672} {"train_loss": -22.215635299682617, "global_step": 138783, "epoch": 1672} {"train_loss": -22.496065139770508, "global_step": 138784, "epoch": 1672} {"train_loss": -22.579511642456055, "global_step": 138785, "epoch": 1672} {"train_loss": -22.819747924804688, "global_step": 138786, "epoch": 1672} {"train_loss": -22.210525512695312, "global_step": 138787, "epoch": 1672} {"train_loss": -22.699411392211914, "global_step": 138788, "epoch": 1672} {"train_loss": -22.157751083374023, "global_step": 138789, "epoch": 1672} {"train_loss": -22.372800827026367, "global_step": 138790, "epoch": 1672} {"train_loss": -22.95824432373047, "global_step": 138791, "epoch": 1672} {"train_loss": -22.59969139099121, "global_step": 138792, "epoch": 1672} {"train_loss": -22.772146224975586, "global_step": 138793, "epoch": 1672} {"train_loss": -22.575895309448242, "global_step": 138794, "epoch": 1672} {"train_loss": -22.849517822265625, "global_step": 138795, "epoch": 1672} {"train_loss": -22.74043846130371, "global_step": 138796, "epoch": 1672} {"train_loss": -22.531150817871094, "global_step": 138797, "epoch": 1672} {"train_loss": -22.625732421875, "global_step": 138798, "epoch": 1672} {"train_loss": -22.87868309020996, "global_step": 138799, "epoch": 1672} {"train_loss": -22.85936164855957, "global_step": 138800, "epoch": 1672} {"train_loss": -23.031021118164062, "global_step": 138801, "epoch": 1672} {"train_loss": -22.872699737548828, "global_step": 138802, "epoch": 1672} {"train_loss": -23.028345108032227, "global_step": 138803, "epoch": 1672} {"train_loss": -23.284704208374023, "global_step": 138804, "epoch": 1672} {"train_loss": -23.108123779296875, "global_step": 138805, "epoch": 1672} {"train_loss": -22.638427734375, "global_step": 138806, "epoch": 1672} {"train_loss": -22.851648330688477, "global_step": 138807, "epoch": 1672} {"train_loss": -23.096832275390625, "global_step": 138808, "epoch": 1672} {"train_loss": -23.00484275817871, "global_step": 138809, "epoch": 1672} {"train_loss": -22.92424201965332, "global_step": 138810, "epoch": 1672} {"train_loss": -23.28705406188965, "global_step": 138811, "epoch": 1672} {"train_loss": -23.290119171142578, "global_step": 138812, "epoch": 1672} {"train_loss": -22.651294708251953, "global_step": 138813, "epoch": 1672} {"train_loss": -23.241758346557617, "global_step": 138814, "epoch": 1672} {"train_loss": -22.840986251831055, "global_step": 138815, "epoch": 1672} {"train_loss": -23.22746467590332, "global_step": 138816, "epoch": 1672} {"train_loss": -22.4166316986084, "global_step": 138817, "epoch": 1672} {"train_loss": -22.95236587524414, "global_step": 138818, "epoch": 1672} {"train_loss": -22.91482162475586, "global_step": 138819, "epoch": 1672} {"train_loss": -23.1590518951416, "global_step": 138820, "epoch": 1672} {"train_loss": -23.04682731628418, "global_step": 138821, "epoch": 1672} {"train_loss": -22.90040397644043, "global_step": 138822, "epoch": 1672} {"train_loss": -23.1649112701416, "global_step": 138823, "epoch": 1672} {"train_loss": -23.007970809936523, "global_step": 138824, "epoch": 1672} {"train_loss": -22.865543365478516, "global_step": 138825, "epoch": 1672} {"train_loss": -23.239587783813477, "global_step": 138826, "epoch": 1672} {"train_loss": -22.235994338989258, "global_step": 138827, "epoch": 1672} {"train_loss": -22.754507064819336, "global_step": 138828, "epoch": 1672} {"train_loss": -22.693649291992188, "global_step": 138829, "epoch": 1672} {"train_loss": -22.58754539489746, "global_step": 138830, "epoch": 1672} {"train_loss": -22.981184005737305, "global_step": 138831, "epoch": 1672} {"train_loss": -22.80544090270996, "global_step": 138832, "epoch": 1672} {"train_loss": -23.322437286376953, "global_step": 138833, "epoch": 1672} {"train_loss": -22.51581382751465, "global_step": 138834, "epoch": 1672} {"train_loss": -23.294530868530273, "global_step": 138835, "epoch": 1672} {"train_loss": -23.02495002746582, "global_step": 138836, "epoch": 1672} {"train_loss": -22.94898796081543, "global_step": 138837, "epoch": 1672} {"train_loss": -23.004545211791992, "global_step": 138838, "epoch": 1672} {"train_loss": -22.99075698852539, "global_step": 138839, "epoch": 1672} {"train_loss": -23.249479293823242, "global_step": 138840, "epoch": 1672} {"train_loss": -22.841035842895508, "global_step": 138841, "epoch": 1672} {"train_loss": -23.119935989379883, "global_step": 138842, "epoch": 1672} {"train_loss": -23.023618698120117, "global_step": 138843, "epoch": 1672} {"train_loss": -22.70901107788086, "global_step": 138844, "epoch": 1672} {"train_loss": -22.87457847595215, "global_step": 138845, "epoch": 1672} {"train_loss": -22.805265426635742, "global_step": 138846, "epoch": 1672} {"train_loss": -23.466238021850586, "global_step": 138847, "epoch": 1672} {"train_loss": -22.867263793945312, "global_step": 138848, "epoch": 1672} {"train_loss": -23.03326416015625, "global_step": 138849, "epoch": 1672} {"train_loss": -22.97406578063965, "global_step": 138850, "epoch": 1672} {"train_loss": -23.271947860717773, "global_step": 138851, "epoch": 1672} {"train_loss": -22.749765396118164, "global_step": 138852, "epoch": 1672} {"train_loss": -23.064672470092773, "global_step": 138853, "epoch": 1672} {"train_loss": -22.74071502685547, "global_step": 138854, "epoch": 1672} {"train_loss": -23.011972427368164, "global_step": 138855, "epoch": 1672} {"train_loss": -23.124662399291992, "global_step": 138856, "epoch": 1672} {"train_loss": -22.805011749267578, "global_step": 138857, "epoch": 1672} {"train_loss": -22.832540144403296, "global_step": 138858, "epoch": 1672, "val_loss": 6377868.0} {"train_loss": -22.8515682220459, "global_step": 138859, "epoch": 1673} {"train_loss": -22.889440536499023, "global_step": 138860, "epoch": 1673} {"train_loss": -22.848468780517578, "global_step": 138861, "epoch": 1673} {"train_loss": -23.011215209960938, "global_step": 138862, "epoch": 1673} {"train_loss": -23.16473960876465, "global_step": 138863, "epoch": 1673} {"train_loss": -23.05649757385254, "global_step": 138864, "epoch": 1673} {"train_loss": -23.00986671447754, "global_step": 138865, "epoch": 1673} {"train_loss": -22.815977096557617, "global_step": 138866, "epoch": 1673} {"train_loss": -22.864416122436523, "global_step": 138867, "epoch": 1673} {"train_loss": -23.048328399658203, "global_step": 138868, "epoch": 1673} {"train_loss": -23.051002502441406, "global_step": 138869, "epoch": 1673} {"train_loss": -22.786880493164062, "global_step": 138870, "epoch": 1673} {"train_loss": -22.9755859375, "global_step": 138871, "epoch": 1673} {"train_loss": -23.10245132446289, "global_step": 138872, "epoch": 1673} {"train_loss": -22.835617065429688, "global_step": 138873, "epoch": 1673} {"train_loss": -23.051738739013672, "global_step": 138874, "epoch": 1673} {"train_loss": -22.93894386291504, "global_step": 138875, "epoch": 1673} {"train_loss": -23.083683013916016, "global_step": 138876, "epoch": 1673} {"train_loss": -22.954214096069336, "global_step": 138877, "epoch": 1673} {"train_loss": -22.874631881713867, "global_step": 138878, "epoch": 1673} {"train_loss": -23.065366744995117, "global_step": 138879, "epoch": 1673} {"train_loss": -23.286762237548828, "global_step": 138880, "epoch": 1673} {"train_loss": -22.884984970092773, "global_step": 138881, "epoch": 1673} {"train_loss": -22.831741333007812, "global_step": 138882, "epoch": 1673} {"train_loss": -22.807994842529297, "global_step": 138883, "epoch": 1673} {"train_loss": -22.934770584106445, "global_step": 138884, "epoch": 1673} {"train_loss": -23.443599700927734, "global_step": 138885, "epoch": 1673} {"train_loss": -23.05048942565918, "global_step": 138886, "epoch": 1673} {"train_loss": -22.995777130126953, "global_step": 138887, "epoch": 1673} {"train_loss": -23.284048080444336, "global_step": 138888, "epoch": 1673} {"train_loss": -23.288759231567383, "global_step": 138889, "epoch": 1673} {"train_loss": -23.133512496948242, "global_step": 138890, "epoch": 1673} {"train_loss": -23.03579330444336, "global_step": 138891, "epoch": 1673} {"train_loss": -22.971689224243164, "global_step": 138892, "epoch": 1673} {"train_loss": -22.77535057067871, "global_step": 138893, "epoch": 1673} {"train_loss": -23.397863388061523, "global_step": 138894, "epoch": 1673} {"train_loss": -22.692007064819336, "global_step": 138895, "epoch": 1673} {"train_loss": -22.96824073791504, "global_step": 138896, "epoch": 1673} {"train_loss": -22.87885856628418, "global_step": 138897, "epoch": 1673} {"train_loss": -23.007122039794922, "global_step": 138898, "epoch": 1673} {"train_loss": -22.729385375976562, "global_step": 138899, "epoch": 1673} {"train_loss": -22.779930114746094, "global_step": 138900, "epoch": 1673} {"train_loss": -23.057788848876953, "global_step": 138901, "epoch": 1673} {"train_loss": -23.60771369934082, "global_step": 138902, "epoch": 1673} {"train_loss": -22.6485538482666, "global_step": 138903, "epoch": 1673} {"train_loss": -23.242401123046875, "global_step": 138904, "epoch": 1673} {"train_loss": -22.873886108398438, "global_step": 138905, "epoch": 1673} {"train_loss": -22.836515426635742, "global_step": 138906, "epoch": 1673} {"train_loss": -23.171186447143555, "global_step": 138907, "epoch": 1673} {"train_loss": -22.942243576049805, "global_step": 138908, "epoch": 1673} {"train_loss": -22.767826080322266, "global_step": 138909, "epoch": 1673} {"train_loss": -23.35971450805664, "global_step": 138910, "epoch": 1673} {"train_loss": -23.127302169799805, "global_step": 138911, "epoch": 1673} {"train_loss": -23.666784286499023, "global_step": 138912, "epoch": 1673} {"train_loss": -23.133182525634766, "global_step": 138913, "epoch": 1673} {"train_loss": -22.954452514648438, "global_step": 138914, "epoch": 1673} {"train_loss": -23.3543643951416, "global_step": 138915, "epoch": 1673} {"train_loss": -23.01546287536621, "global_step": 138916, "epoch": 1673} {"train_loss": -23.331682205200195, "global_step": 138917, "epoch": 1673} {"train_loss": -22.67661476135254, "global_step": 138918, "epoch": 1673} {"train_loss": -22.904184341430664, "global_step": 138919, "epoch": 1673} {"train_loss": -23.248815536499023, "global_step": 138920, "epoch": 1673} {"train_loss": -22.659231185913086, "global_step": 138921, "epoch": 1673} {"train_loss": -23.163373947143555, "global_step": 138922, "epoch": 1673} {"train_loss": -22.989925384521484, "global_step": 138923, "epoch": 1673} {"train_loss": -23.14659881591797, "global_step": 138924, "epoch": 1673} {"train_loss": -22.959592819213867, "global_step": 138925, "epoch": 1673} {"train_loss": -22.969736099243164, "global_step": 138926, "epoch": 1673} {"train_loss": -22.792516708374023, "global_step": 138927, "epoch": 1673} {"train_loss": -22.832754135131836, "global_step": 138928, "epoch": 1673} {"train_loss": -23.102705001831055, "global_step": 138929, "epoch": 1673} {"train_loss": -22.749191284179688, "global_step": 138930, "epoch": 1673} {"train_loss": -23.143163681030273, "global_step": 138931, "epoch": 1673} {"train_loss": -22.909542083740234, "global_step": 138932, "epoch": 1673} {"train_loss": -23.42781639099121, "global_step": 138933, "epoch": 1673} {"train_loss": -23.217954635620117, "global_step": 138934, "epoch": 1673} {"train_loss": -23.021467208862305, "global_step": 138935, "epoch": 1673} {"train_loss": -23.12527847290039, "global_step": 138936, "epoch": 1673} {"train_loss": -22.924375534057617, "global_step": 138937, "epoch": 1673} {"train_loss": -22.990629196166992, "global_step": 138938, "epoch": 1673} {"train_loss": -22.852903366088867, "global_step": 138939, "epoch": 1673} {"train_loss": -23.50457191467285, "global_step": 138940, "epoch": 1673} {"train_loss": -23.026225423238362, "global_step": 138941, "epoch": 1673, "val_loss": 6271798.0} {"train_loss": -22.591102600097656, "global_step": 138942, "epoch": 1674} {"train_loss": -22.64531135559082, "global_step": 138943, "epoch": 1674} {"train_loss": -22.579666137695312, "global_step": 138944, "epoch": 1674} {"train_loss": -22.601215362548828, "global_step": 138945, "epoch": 1674} {"train_loss": -22.03658103942871, "global_step": 138946, "epoch": 1674} {"train_loss": -22.543420791625977, "global_step": 138947, "epoch": 1674} {"train_loss": -22.629301071166992, "global_step": 138948, "epoch": 1674} {"train_loss": -22.349172592163086, "global_step": 138949, "epoch": 1674} {"train_loss": -22.30132293701172, "global_step": 138950, "epoch": 1674} {"train_loss": -22.385805130004883, "global_step": 138951, "epoch": 1674} {"train_loss": -22.87435531616211, "global_step": 138952, "epoch": 1674} {"train_loss": -22.604372024536133, "global_step": 138953, "epoch": 1674} {"train_loss": -22.822858810424805, "global_step": 138954, "epoch": 1674} {"train_loss": -22.86338233947754, "global_step": 138955, "epoch": 1674} {"train_loss": -22.6592960357666, "global_step": 138956, "epoch": 1674} {"train_loss": -22.759052276611328, "global_step": 138957, "epoch": 1674} {"train_loss": -22.604774475097656, "global_step": 138958, "epoch": 1674} {"train_loss": -22.711868286132812, "global_step": 138959, "epoch": 1674} {"train_loss": -22.88411521911621, "global_step": 138960, "epoch": 1674} {"train_loss": -22.558958053588867, "global_step": 138961, "epoch": 1674} {"train_loss": -22.65656280517578, "global_step": 138962, "epoch": 1674} {"train_loss": -22.78676414489746, "global_step": 138963, "epoch": 1674} {"train_loss": -23.395130157470703, "global_step": 138964, "epoch": 1674} {"train_loss": -22.78083610534668, "global_step": 138965, "epoch": 1674} {"train_loss": -22.709197998046875, "global_step": 138966, "epoch": 1674} {"train_loss": -22.767667770385742, "global_step": 138967, "epoch": 1674} {"train_loss": -22.80181884765625, "global_step": 138968, "epoch": 1674} {"train_loss": -23.028053283691406, "global_step": 138969, "epoch": 1674} {"train_loss": -22.95214080810547, "global_step": 138970, "epoch": 1674} {"train_loss": -22.814916610717773, "global_step": 138971, "epoch": 1674} {"train_loss": -23.167821884155273, "global_step": 138972, "epoch": 1674} {"train_loss": -22.90500259399414, "global_step": 138973, "epoch": 1674} {"train_loss": -23.031641006469727, "global_step": 138974, "epoch": 1674} {"train_loss": -23.3072452545166, "global_step": 138975, "epoch": 1674} {"train_loss": -23.047393798828125, "global_step": 138976, "epoch": 1674} {"train_loss": -22.810388565063477, "global_step": 138977, "epoch": 1674} {"train_loss": -23.11170768737793, "global_step": 138978, "epoch": 1674} {"train_loss": -23.28867530822754, "global_step": 138979, "epoch": 1674} {"train_loss": -22.675792694091797, "global_step": 138980, "epoch": 1674} {"train_loss": -23.090551376342773, "global_step": 138981, "epoch": 1674} {"train_loss": -23.10819435119629, "global_step": 138982, "epoch": 1674} {"train_loss": -22.399688720703125, "global_step": 138983, "epoch": 1674} {"train_loss": -22.706106185913086, "global_step": 138984, "epoch": 1674} {"train_loss": -22.892913818359375, "global_step": 138985, "epoch": 1674} {"train_loss": -22.864044189453125, "global_step": 138986, "epoch": 1674} {"train_loss": -23.105409622192383, "global_step": 138987, "epoch": 1674} {"train_loss": -22.808979034423828, "global_step": 138988, "epoch": 1674} {"train_loss": -22.772214889526367, "global_step": 138989, "epoch": 1674} {"train_loss": -23.42596435546875, "global_step": 138990, "epoch": 1674} {"train_loss": -22.911788940429688, "global_step": 138991, "epoch": 1674} {"train_loss": -22.711830139160156, "global_step": 138992, "epoch": 1674} {"train_loss": -22.938980102539062, "global_step": 138993, "epoch": 1674} {"train_loss": -23.211999893188477, "global_step": 138994, "epoch": 1674} {"train_loss": -22.914396286010742, "global_step": 138995, "epoch": 1674} {"train_loss": -23.075849533081055, "global_step": 138996, "epoch": 1674} {"train_loss": -22.661855697631836, "global_step": 138997, "epoch": 1674} {"train_loss": -22.883766174316406, "global_step": 138998, "epoch": 1674} {"train_loss": -22.738121032714844, "global_step": 138999, "epoch": 1674} {"train_loss": -22.803220748901367, "global_step": 139000, "epoch": 1674} {"train_loss": -23.0723819732666, "global_step": 139001, "epoch": 1674} {"train_loss": -22.96076774597168, "global_step": 139002, "epoch": 1674} {"train_loss": -23.114194869995117, "global_step": 139003, "epoch": 1674} {"train_loss": -22.991622924804688, "global_step": 139004, "epoch": 1674} {"train_loss": -22.70724868774414, "global_step": 139005, "epoch": 1674} {"train_loss": -23.09693145751953, "global_step": 139006, "epoch": 1674} {"train_loss": -23.115476608276367, "global_step": 139007, "epoch": 1674} {"train_loss": -23.14785385131836, "global_step": 139008, "epoch": 1674} {"train_loss": -23.251575469970703, "global_step": 139009, "epoch": 1674} {"train_loss": -23.0990047454834, "global_step": 139010, "epoch": 1674} {"train_loss": -23.093069076538086, "global_step": 139011, "epoch": 1674} {"train_loss": -22.7862491607666, "global_step": 139012, "epoch": 1674} {"train_loss": -23.160430908203125, "global_step": 139013, "epoch": 1674} {"train_loss": -22.696691513061523, "global_step": 139014, "epoch": 1674} {"train_loss": -22.782888412475586, "global_step": 139015, "epoch": 1674} {"train_loss": -23.252899169921875, "global_step": 139016, "epoch": 1674} {"train_loss": -23.402957916259766, "global_step": 139017, "epoch": 1674} {"train_loss": -23.5819149017334, "global_step": 139018, "epoch": 1674} {"train_loss": -23.262083053588867, "global_step": 139019, "epoch": 1674} {"train_loss": -23.233510971069336, "global_step": 139020, "epoch": 1674} {"train_loss": -22.888357162475586, "global_step": 139021, "epoch": 1674} {"train_loss": -23.094894409179688, "global_step": 139022, "epoch": 1674} {"train_loss": -23.343175888061523, "global_step": 139023, "epoch": 1674} {"train_loss": -22.88771142155291, "global_step": 139024, "epoch": 1674, "val_loss": 6317701.5} {"train_loss": -22.573123931884766, "global_step": 139025, "epoch": 1675} {"train_loss": -22.874244689941406, "global_step": 139026, "epoch": 1675} {"train_loss": -22.48969078063965, "global_step": 139027, "epoch": 1675} {"train_loss": -22.385984420776367, "global_step": 139028, "epoch": 1675} {"train_loss": -22.432815551757812, "global_step": 139029, "epoch": 1675} {"train_loss": -22.70447540283203, "global_step": 139030, "epoch": 1675} {"train_loss": -22.917306900024414, "global_step": 139031, "epoch": 1675} {"train_loss": -22.577356338500977, "global_step": 139032, "epoch": 1675} {"train_loss": -23.022232055664062, "global_step": 139033, "epoch": 1675} {"train_loss": -22.741506576538086, "global_step": 139034, "epoch": 1675} {"train_loss": -22.650836944580078, "global_step": 139035, "epoch": 1675} {"train_loss": -23.179855346679688, "global_step": 139036, "epoch": 1675} {"train_loss": -23.021255493164062, "global_step": 139037, "epoch": 1675} {"train_loss": -22.842866897583008, "global_step": 139038, "epoch": 1675} {"train_loss": -23.015714645385742, "global_step": 139039, "epoch": 1675} {"train_loss": -22.614349365234375, "global_step": 139040, "epoch": 1675} {"train_loss": -23.080856323242188, "global_step": 139041, "epoch": 1675} {"train_loss": -23.26314353942871, "global_step": 139042, "epoch": 1675} {"train_loss": -23.185007095336914, "global_step": 139043, "epoch": 1675} {"train_loss": -22.683626174926758, "global_step": 139044, "epoch": 1675} {"train_loss": -22.900714874267578, "global_step": 139045, "epoch": 1675} {"train_loss": -22.69110870361328, "global_step": 139046, "epoch": 1675} {"train_loss": -23.17190933227539, "global_step": 139047, "epoch": 1675} {"train_loss": -23.16205406188965, "global_step": 139048, "epoch": 1675} {"train_loss": -23.02851676940918, "global_step": 139049, "epoch": 1675} {"train_loss": -23.325397491455078, "global_step": 139050, "epoch": 1675} {"train_loss": -23.116336822509766, "global_step": 139051, "epoch": 1675} {"train_loss": -23.111637115478516, "global_step": 139052, "epoch": 1675} {"train_loss": -22.9715576171875, "global_step": 139053, "epoch": 1675} {"train_loss": -22.913724899291992, "global_step": 139054, "epoch": 1675} {"train_loss": -23.356313705444336, "global_step": 139055, "epoch": 1675} {"train_loss": -22.85261344909668, "global_step": 139056, "epoch": 1675} {"train_loss": -23.052087783813477, "global_step": 139057, "epoch": 1675} {"train_loss": -22.90397834777832, "global_step": 139058, "epoch": 1675} {"train_loss": -22.9556827545166, "global_step": 139059, "epoch": 1675} {"train_loss": -23.36468505859375, "global_step": 139060, "epoch": 1675} {"train_loss": -22.998289108276367, "global_step": 139061, "epoch": 1675} {"train_loss": -22.870014190673828, "global_step": 139062, "epoch": 1675} {"train_loss": -23.21883201599121, "global_step": 139063, "epoch": 1675} {"train_loss": -23.109601974487305, "global_step": 139064, "epoch": 1675} {"train_loss": -23.264785766601562, "global_step": 139065, "epoch": 1675} {"train_loss": -23.094512939453125, "global_step": 139066, "epoch": 1675} {"train_loss": -23.236957550048828, "global_step": 139067, "epoch": 1675} {"train_loss": -23.058286666870117, "global_step": 139068, "epoch": 1675} {"train_loss": -23.238956451416016, "global_step": 139069, "epoch": 1675} {"train_loss": -22.776098251342773, "global_step": 139070, "epoch": 1675} {"train_loss": -23.43085289001465, "global_step": 139071, "epoch": 1675} {"train_loss": -23.207181930541992, "global_step": 139072, "epoch": 1675} {"train_loss": -23.133499145507812, "global_step": 139073, "epoch": 1675} {"train_loss": -22.928129196166992, "global_step": 139074, "epoch": 1675} {"train_loss": -23.072057723999023, "global_step": 139075, "epoch": 1675} {"train_loss": -22.98076820373535, "global_step": 139076, "epoch": 1675} {"train_loss": -22.86076545715332, "global_step": 139077, "epoch": 1675} {"train_loss": -23.16071891784668, "global_step": 139078, "epoch": 1675} {"train_loss": -23.545686721801758, "global_step": 139079, "epoch": 1675} {"train_loss": -23.205059051513672, "global_step": 139080, "epoch": 1675} {"train_loss": -23.289255142211914, "global_step": 139081, "epoch": 1675} {"train_loss": -23.0400390625, "global_step": 139082, "epoch": 1675} {"train_loss": -23.114816665649414, "global_step": 139083, "epoch": 1675} {"train_loss": -23.10975456237793, "global_step": 139084, "epoch": 1675} {"train_loss": -23.06209373474121, "global_step": 139085, "epoch": 1675} {"train_loss": -22.934677124023438, "global_step": 139086, "epoch": 1675} {"train_loss": -23.336713790893555, "global_step": 139087, "epoch": 1675} {"train_loss": -23.266706466674805, "global_step": 139088, "epoch": 1675} {"train_loss": -23.14088249206543, "global_step": 139089, "epoch": 1675} {"train_loss": -22.790271759033203, "global_step": 139090, "epoch": 1675} {"train_loss": -23.116230010986328, "global_step": 139091, "epoch": 1675} {"train_loss": -22.95881462097168, "global_step": 139092, "epoch": 1675} {"train_loss": -22.89205551147461, "global_step": 139093, "epoch": 1675} {"train_loss": -22.7440128326416, "global_step": 139094, "epoch": 1675} {"train_loss": -23.052526473999023, "global_step": 139095, "epoch": 1675} {"train_loss": -22.181615829467773, "global_step": 139096, "epoch": 1675} {"train_loss": -22.204919815063477, "global_step": 139097, "epoch": 1675} {"train_loss": -22.626203536987305, "global_step": 139098, "epoch": 1675} {"train_loss": -22.62217140197754, "global_step": 139099, "epoch": 1675} {"train_loss": -23.109521865844727, "global_step": 139100, "epoch": 1675} {"train_loss": -22.78916358947754, "global_step": 139101, "epoch": 1675} {"train_loss": -22.963176727294922, "global_step": 139102, "epoch": 1675} {"train_loss": -22.995519638061523, "global_step": 139103, "epoch": 1675} {"train_loss": -23.040231704711914, "global_step": 139104, "epoch": 1675} {"train_loss": -22.8078670501709, "global_step": 139105, "epoch": 1675} {"train_loss": -22.216676712036133, "global_step": 139106, "epoch": 1675} {"train_loss": -22.9503173828125, "global_step": 139107, "epoch": 1675, "val_loss": 6305145.0} {"train_loss": -22.676620483398438, "global_step": 139108, "epoch": 1676} {"train_loss": -22.432859420776367, "global_step": 139109, "epoch": 1676} {"train_loss": -22.660778045654297, "global_step": 139110, "epoch": 1676} {"train_loss": -22.52289581298828, "global_step": 139111, "epoch": 1676} {"train_loss": -22.347721099853516, "global_step": 139112, "epoch": 1676} {"train_loss": -22.901994705200195, "global_step": 139113, "epoch": 1676} {"train_loss": -22.977853775024414, "global_step": 139114, "epoch": 1676} {"train_loss": -22.69664764404297, "global_step": 139115, "epoch": 1676} {"train_loss": -23.035314559936523, "global_step": 139116, "epoch": 1676} {"train_loss": -22.75663948059082, "global_step": 139117, "epoch": 1676} {"train_loss": -23.254655838012695, "global_step": 139118, "epoch": 1676} {"train_loss": -22.832489013671875, "global_step": 139119, "epoch": 1676} {"train_loss": -22.94607925415039, "global_step": 139120, "epoch": 1676} {"train_loss": -22.695331573486328, "global_step": 139121, "epoch": 1676} {"train_loss": -22.91557502746582, "global_step": 139122, "epoch": 1676} {"train_loss": -23.144046783447266, "global_step": 139123, "epoch": 1676} {"train_loss": -22.858386993408203, "global_step": 139124, "epoch": 1676} {"train_loss": -22.7131290435791, "global_step": 139125, "epoch": 1676} {"train_loss": -23.319244384765625, "global_step": 139126, "epoch": 1676} {"train_loss": -23.029569625854492, "global_step": 139127, "epoch": 1676} {"train_loss": -22.956876754760742, "global_step": 139128, "epoch": 1676} {"train_loss": -22.945575714111328, "global_step": 139129, "epoch": 1676} {"train_loss": -22.833728790283203, "global_step": 139130, "epoch": 1676} {"train_loss": -23.293405532836914, "global_step": 139131, "epoch": 1676} {"train_loss": -23.330121994018555, "global_step": 139132, "epoch": 1676} {"train_loss": -23.416025161743164, "global_step": 139133, "epoch": 1676} {"train_loss": -23.2980899810791, "global_step": 139134, "epoch": 1676} {"train_loss": -22.716943740844727, "global_step": 139135, "epoch": 1676} {"train_loss": -22.72294807434082, "global_step": 139136, "epoch": 1676} {"train_loss": -22.737598419189453, "global_step": 139137, "epoch": 1676} {"train_loss": -22.567537307739258, "global_step": 139138, "epoch": 1676} {"train_loss": -23.06047821044922, "global_step": 139139, "epoch": 1676} {"train_loss": -22.6759090423584, "global_step": 139140, "epoch": 1676} {"train_loss": -22.768857955932617, "global_step": 139141, "epoch": 1676} {"train_loss": -22.952978134155273, "global_step": 139142, "epoch": 1676} {"train_loss": -22.819440841674805, "global_step": 139143, "epoch": 1676} {"train_loss": -22.86834716796875, "global_step": 139144, "epoch": 1676} {"train_loss": -23.267005920410156, "global_step": 139145, "epoch": 1676} {"train_loss": -22.919906616210938, "global_step": 139146, "epoch": 1676} {"train_loss": -23.448469161987305, "global_step": 139147, "epoch": 1676} {"train_loss": -23.06224822998047, "global_step": 139148, "epoch": 1676} {"train_loss": -23.03598403930664, "global_step": 139149, "epoch": 1676} {"train_loss": -22.98940658569336, "global_step": 139150, "epoch": 1676} {"train_loss": -23.002784729003906, "global_step": 139151, "epoch": 1676} {"train_loss": -23.20918846130371, "global_step": 139152, "epoch": 1676} {"train_loss": -22.746179580688477, "global_step": 139153, "epoch": 1676} {"train_loss": -22.703542709350586, "global_step": 139154, "epoch": 1676} {"train_loss": -23.430845260620117, "global_step": 139155, "epoch": 1676} {"train_loss": -23.142736434936523, "global_step": 139156, "epoch": 1676} {"train_loss": -22.928117752075195, "global_step": 139157, "epoch": 1676} {"train_loss": -22.60528564453125, "global_step": 139158, "epoch": 1676} {"train_loss": -22.807714462280273, "global_step": 139159, "epoch": 1676} {"train_loss": -22.75031280517578, "global_step": 139160, "epoch": 1676} {"train_loss": -23.334802627563477, "global_step": 139161, "epoch": 1676} {"train_loss": -23.23250389099121, "global_step": 139162, "epoch": 1676} {"train_loss": -23.320905685424805, "global_step": 139163, "epoch": 1676} {"train_loss": -22.987504959106445, "global_step": 139164, "epoch": 1676} {"train_loss": -22.89032554626465, "global_step": 139165, "epoch": 1676} {"train_loss": -22.886138916015625, "global_step": 139166, "epoch": 1676} {"train_loss": -23.130924224853516, "global_step": 139167, "epoch": 1676} {"train_loss": -23.282840728759766, "global_step": 139168, "epoch": 1676} {"train_loss": -22.976743698120117, "global_step": 139169, "epoch": 1676} {"train_loss": -23.023523330688477, "global_step": 139170, "epoch": 1676} {"train_loss": -23.1413631439209, "global_step": 139171, "epoch": 1676} {"train_loss": -22.89346694946289, "global_step": 139172, "epoch": 1676} {"train_loss": -22.82691764831543, "global_step": 139173, "epoch": 1676} {"train_loss": -23.0983943939209, "global_step": 139174, "epoch": 1676} {"train_loss": -23.14375877380371, "global_step": 139175, "epoch": 1676} {"train_loss": -22.6942081451416, "global_step": 139176, "epoch": 1676} {"train_loss": -22.987491607666016, "global_step": 139177, "epoch": 1676} {"train_loss": -23.051288604736328, "global_step": 139178, "epoch": 1676} {"train_loss": -23.037870407104492, "global_step": 139179, "epoch": 1676} {"train_loss": -23.053688049316406, "global_step": 139180, "epoch": 1676} {"train_loss": -22.987085342407227, "global_step": 139181, "epoch": 1676} {"train_loss": -22.821043014526367, "global_step": 139182, "epoch": 1676} {"train_loss": -22.83234214782715, "global_step": 139183, "epoch": 1676} {"train_loss": -22.440526962280273, "global_step": 139184, "epoch": 1676} {"train_loss": -22.86060333251953, "global_step": 139185, "epoch": 1676} {"train_loss": -22.53904151916504, "global_step": 139186, "epoch": 1676} {"train_loss": -22.730762481689453, "global_step": 139187, "epoch": 1676} {"train_loss": -22.8632869720459, "global_step": 139188, "epoch": 1676} {"train_loss": -23.094257354736328, "global_step": 139189, "epoch": 1676} {"train_loss": -22.95346179640437, "global_step": 139190, "epoch": 1676, "val_loss": 6361746.5} {"train_loss": -21.318708419799805, "global_step": 139191, "epoch": 1677} {"train_loss": -22.14806365966797, "global_step": 139192, "epoch": 1677} {"train_loss": -21.64922332763672, "global_step": 139193, "epoch": 1677} {"train_loss": -21.53554344177246, "global_step": 139194, "epoch": 1677} {"train_loss": -22.378690719604492, "global_step": 139195, "epoch": 1677} {"train_loss": -21.997968673706055, "global_step": 139196, "epoch": 1677} {"train_loss": -21.933626174926758, "global_step": 139197, "epoch": 1677} {"train_loss": -22.090152740478516, "global_step": 139198, "epoch": 1677} {"train_loss": -22.105710983276367, "global_step": 139199, "epoch": 1677} {"train_loss": -22.466747283935547, "global_step": 139200, "epoch": 1677} {"train_loss": -22.47307777404785, "global_step": 139201, "epoch": 1677} {"train_loss": -22.257726669311523, "global_step": 139202, "epoch": 1677} {"train_loss": -22.154571533203125, "global_step": 139203, "epoch": 1677} {"train_loss": -22.438495635986328, "global_step": 139204, "epoch": 1677} {"train_loss": -22.281524658203125, "global_step": 139205, "epoch": 1677} {"train_loss": -22.5496826171875, "global_step": 139206, "epoch": 1677} {"train_loss": -22.477746963500977, "global_step": 139207, "epoch": 1677} {"train_loss": -22.532272338867188, "global_step": 139208, "epoch": 1677} {"train_loss": -22.5473690032959, "global_step": 139209, "epoch": 1677} {"train_loss": -22.49799156188965, "global_step": 139210, "epoch": 1677} {"train_loss": -22.67161750793457, "global_step": 139211, "epoch": 1677} {"train_loss": -23.029966354370117, "global_step": 139212, "epoch": 1677} {"train_loss": -22.661571502685547, "global_step": 139213, "epoch": 1677} {"train_loss": -22.771528244018555, "global_step": 139214, "epoch": 1677} {"train_loss": -22.51894760131836, "global_step": 139215, "epoch": 1677} {"train_loss": -22.781949996948242, "global_step": 139216, "epoch": 1677} {"train_loss": -22.82042121887207, "global_step": 139217, "epoch": 1677} {"train_loss": -22.700824737548828, "global_step": 139218, "epoch": 1677} {"train_loss": -22.61492156982422, "global_step": 139219, "epoch": 1677} {"train_loss": -22.59473991394043, "global_step": 139220, "epoch": 1677} {"train_loss": -22.974729537963867, "global_step": 139221, "epoch": 1677} {"train_loss": -22.794422149658203, "global_step": 139222, "epoch": 1677} {"train_loss": -23.05323600769043, "global_step": 139223, "epoch": 1677} {"train_loss": -23.17110824584961, "global_step": 139224, "epoch": 1677} {"train_loss": -23.00455093383789, "global_step": 139225, "epoch": 1677} {"train_loss": -22.89495849609375, "global_step": 139226, "epoch": 1677} {"train_loss": -22.913270950317383, "global_step": 139227, "epoch": 1677} {"train_loss": -22.84439468383789, "global_step": 139228, "epoch": 1677} {"train_loss": -23.14093589782715, "global_step": 139229, "epoch": 1677} {"train_loss": -22.971818923950195, "global_step": 139230, "epoch": 1677} {"train_loss": -23.143428802490234, "global_step": 139231, "epoch": 1677} {"train_loss": -22.875497817993164, "global_step": 139232, "epoch": 1677} {"train_loss": -23.30084800720215, "global_step": 139233, "epoch": 1677} {"train_loss": -23.174894332885742, "global_step": 139234, "epoch": 1677} {"train_loss": -23.19645118713379, "global_step": 139235, "epoch": 1677} {"train_loss": -22.743270874023438, "global_step": 139236, "epoch": 1677} {"train_loss": -23.35385513305664, "global_step": 139237, "epoch": 1677} {"train_loss": -22.790128707885742, "global_step": 139238, "epoch": 1677} {"train_loss": -22.68694496154785, "global_step": 139239, "epoch": 1677} {"train_loss": -23.29277992248535, "global_step": 139240, "epoch": 1677} {"train_loss": -23.019939422607422, "global_step": 139241, "epoch": 1677} {"train_loss": -23.234792709350586, "global_step": 139242, "epoch": 1677} {"train_loss": -23.0094051361084, "global_step": 139243, "epoch": 1677} {"train_loss": -23.164337158203125, "global_step": 139244, "epoch": 1677} {"train_loss": -23.160003662109375, "global_step": 139245, "epoch": 1677} {"train_loss": -23.163848876953125, "global_step": 139246, "epoch": 1677} {"train_loss": -23.15065574645996, "global_step": 139247, "epoch": 1677} {"train_loss": -23.08066177368164, "global_step": 139248, "epoch": 1677} {"train_loss": -22.92652702331543, "global_step": 139249, "epoch": 1677} {"train_loss": -22.880094528198242, "global_step": 139250, "epoch": 1677} {"train_loss": -22.877735137939453, "global_step": 139251, "epoch": 1677} {"train_loss": -22.866186141967773, "global_step": 139252, "epoch": 1677} {"train_loss": -23.034767150878906, "global_step": 139253, "epoch": 1677} {"train_loss": -22.785032272338867, "global_step": 139254, "epoch": 1677} {"train_loss": -22.685495376586914, "global_step": 139255, "epoch": 1677} {"train_loss": -23.115562438964844, "global_step": 139256, "epoch": 1677} {"train_loss": -23.207914352416992, "global_step": 139257, "epoch": 1677} {"train_loss": -23.031003952026367, "global_step": 139258, "epoch": 1677} {"train_loss": -23.000564575195312, "global_step": 139259, "epoch": 1677} {"train_loss": -23.13592529296875, "global_step": 139260, "epoch": 1677} {"train_loss": -22.913713455200195, "global_step": 139261, "epoch": 1677} {"train_loss": -22.938512802124023, "global_step": 139262, "epoch": 1677} {"train_loss": -22.979856491088867, "global_step": 139263, "epoch": 1677} {"train_loss": -22.971837997436523, "global_step": 139264, "epoch": 1677} {"train_loss": -23.059650421142578, "global_step": 139265, "epoch": 1677} {"train_loss": -22.998891830444336, "global_step": 139266, "epoch": 1677} {"train_loss": -22.697660446166992, "global_step": 139267, "epoch": 1677} {"train_loss": -23.053503036499023, "global_step": 139268, "epoch": 1677} {"train_loss": -22.62409019470215, "global_step": 139269, "epoch": 1677} {"train_loss": -23.335203170776367, "global_step": 139270, "epoch": 1677} {"train_loss": -23.008333206176758, "global_step": 139271, "epoch": 1677} {"train_loss": -23.113168716430664, "global_step": 139272, "epoch": 1677} {"train_loss": -22.79158304972821, "global_step": 139273, "epoch": 1677, "val_loss": 6290196.0} {"train_loss": -22.460546493530273, "global_step": 139274, "epoch": 1678} {"train_loss": -22.821887969970703, "global_step": 139275, "epoch": 1678} {"train_loss": -22.681516647338867, "global_step": 139276, "epoch": 1678} {"train_loss": -22.4268798828125, "global_step": 139277, "epoch": 1678} {"train_loss": -22.77646827697754, "global_step": 139278, "epoch": 1678} {"train_loss": -22.41172981262207, "global_step": 139279, "epoch": 1678} {"train_loss": -22.64446258544922, "global_step": 139280, "epoch": 1678} {"train_loss": -23.03870964050293, "global_step": 139281, "epoch": 1678} {"train_loss": -23.000930786132812, "global_step": 139282, "epoch": 1678} {"train_loss": -22.743385314941406, "global_step": 139283, "epoch": 1678} {"train_loss": -22.807315826416016, "global_step": 139284, "epoch": 1678} {"train_loss": -23.256986618041992, "global_step": 139285, "epoch": 1678} {"train_loss": -22.888334274291992, "global_step": 139286, "epoch": 1678} {"train_loss": -22.45835304260254, "global_step": 139287, "epoch": 1678} {"train_loss": -23.123289108276367, "global_step": 139288, "epoch": 1678} {"train_loss": -22.7581729888916, "global_step": 139289, "epoch": 1678} {"train_loss": -22.820575714111328, "global_step": 139290, "epoch": 1678} {"train_loss": -23.2843074798584, "global_step": 139291, "epoch": 1678} {"train_loss": -22.906322479248047, "global_step": 139292, "epoch": 1678} {"train_loss": -22.88332176208496, "global_step": 139293, "epoch": 1678} {"train_loss": -23.291027069091797, "global_step": 139294, "epoch": 1678} {"train_loss": -23.442951202392578, "global_step": 139295, "epoch": 1678} {"train_loss": -22.3703556060791, "global_step": 139296, "epoch": 1678} {"train_loss": -23.070653915405273, "global_step": 139297, "epoch": 1678} {"train_loss": -23.0876522064209, "global_step": 139298, "epoch": 1678} {"train_loss": -22.923887252807617, "global_step": 139299, "epoch": 1678} {"train_loss": -22.964385986328125, "global_step": 139300, "epoch": 1678} {"train_loss": -23.04218864440918, "global_step": 139301, "epoch": 1678} {"train_loss": -23.098020553588867, "global_step": 139302, "epoch": 1678} {"train_loss": -22.879194259643555, "global_step": 139303, "epoch": 1678} {"train_loss": -23.074344635009766, "global_step": 139304, "epoch": 1678} {"train_loss": -23.248014450073242, "global_step": 139305, "epoch": 1678} {"train_loss": -23.22468376159668, "global_step": 139306, "epoch": 1678} {"train_loss": -22.97776985168457, "global_step": 139307, "epoch": 1678} {"train_loss": -23.156965255737305, "global_step": 139308, "epoch": 1678} {"train_loss": -22.64952850341797, "global_step": 139309, "epoch": 1678} {"train_loss": -23.109378814697266, "global_step": 139310, "epoch": 1678} {"train_loss": -23.088438034057617, "global_step": 139311, "epoch": 1678} {"train_loss": -22.630538940429688, "global_step": 139312, "epoch": 1678} {"train_loss": -23.10603141784668, "global_step": 139313, "epoch": 1678} {"train_loss": -22.91327476501465, "global_step": 139314, "epoch": 1678} {"train_loss": -22.88772964477539, "global_step": 139315, "epoch": 1678} {"train_loss": -22.91140365600586, "global_step": 139316, "epoch": 1678} {"train_loss": -22.760549545288086, "global_step": 139317, "epoch": 1678} {"train_loss": -22.75060272216797, "global_step": 139318, "epoch": 1678} {"train_loss": -22.85383415222168, "global_step": 139319, "epoch": 1678} {"train_loss": -22.819143295288086, "global_step": 139320, "epoch": 1678} {"train_loss": -22.927677154541016, "global_step": 139321, "epoch": 1678} {"train_loss": -22.848859786987305, "global_step": 139322, "epoch": 1678} {"train_loss": -22.707645416259766, "global_step": 139323, "epoch": 1678} {"train_loss": -23.021337509155273, "global_step": 139324, "epoch": 1678} {"train_loss": -22.661413192749023, "global_step": 139325, "epoch": 1678} {"train_loss": -23.316513061523438, "global_step": 139326, "epoch": 1678} {"train_loss": -22.40467643737793, "global_step": 139327, "epoch": 1678} {"train_loss": -22.48041343688965, "global_step": 139328, "epoch": 1678} {"train_loss": -22.784805297851562, "global_step": 139329, "epoch": 1678} {"train_loss": -23.05752944946289, "global_step": 139330, "epoch": 1678} {"train_loss": -22.87700843811035, "global_step": 139331, "epoch": 1678} {"train_loss": -23.126317977905273, "global_step": 139332, "epoch": 1678} {"train_loss": -22.864809036254883, "global_step": 139333, "epoch": 1678} {"train_loss": -22.734373092651367, "global_step": 139334, "epoch": 1678} {"train_loss": -23.02608299255371, "global_step": 139335, "epoch": 1678} {"train_loss": -23.07281494140625, "global_step": 139336, "epoch": 1678} {"train_loss": -22.595279693603516, "global_step": 139337, "epoch": 1678} {"train_loss": -23.153905868530273, "global_step": 139338, "epoch": 1678} {"train_loss": -23.100727081298828, "global_step": 139339, "epoch": 1678} {"train_loss": -22.996458053588867, "global_step": 139340, "epoch": 1678} {"train_loss": -22.993650436401367, "global_step": 139341, "epoch": 1678} {"train_loss": -22.7135009765625, "global_step": 139342, "epoch": 1678} {"train_loss": -23.30971336364746, "global_step": 139343, "epoch": 1678} {"train_loss": -23.23099136352539, "global_step": 139344, "epoch": 1678} {"train_loss": -23.393457412719727, "global_step": 139345, "epoch": 1678} {"train_loss": -22.902746200561523, "global_step": 139346, "epoch": 1678} {"train_loss": -23.247438430786133, "global_step": 139347, "epoch": 1678} {"train_loss": -22.907581329345703, "global_step": 139348, "epoch": 1678} {"train_loss": -22.857406616210938, "global_step": 139349, "epoch": 1678} {"train_loss": -23.23735809326172, "global_step": 139350, "epoch": 1678} {"train_loss": -23.029264450073242, "global_step": 139351, "epoch": 1678} {"train_loss": -23.0887393951416, "global_step": 139352, "epoch": 1678} {"train_loss": -23.188852310180664, "global_step": 139353, "epoch": 1678} {"train_loss": -23.141286849975586, "global_step": 139354, "epoch": 1678} {"train_loss": -22.662799835205078, "global_step": 139355, "epoch": 1678} {"train_loss": -22.941158524478773, "global_step": 139356, "epoch": 1678, "val_loss": 6248681.0} {"train_loss": -22.825468063354492, "global_step": 139357, "epoch": 1679} {"train_loss": -22.27880859375, "global_step": 139358, "epoch": 1679} {"train_loss": -22.268762588500977, "global_step": 139359, "epoch": 1679} {"train_loss": -22.99637794494629, "global_step": 139360, "epoch": 1679} {"train_loss": -22.668489456176758, "global_step": 139361, "epoch": 1679} {"train_loss": -22.480518341064453, "global_step": 139362, "epoch": 1679} {"train_loss": -23.069894790649414, "global_step": 139363, "epoch": 1679} {"train_loss": -22.46112060546875, "global_step": 139364, "epoch": 1679} {"train_loss": -22.43465805053711, "global_step": 139365, "epoch": 1679} {"train_loss": -23.06758689880371, "global_step": 139366, "epoch": 1679} {"train_loss": -22.6602725982666, "global_step": 139367, "epoch": 1679} {"train_loss": -22.856739044189453, "global_step": 139368, "epoch": 1679} {"train_loss": -22.723508834838867, "global_step": 139369, "epoch": 1679} {"train_loss": -22.63900375366211, "global_step": 139370, "epoch": 1679} {"train_loss": -23.18033790588379, "global_step": 139371, "epoch": 1679} {"train_loss": -22.62607765197754, "global_step": 139372, "epoch": 1679} {"train_loss": -22.932405471801758, "global_step": 139373, "epoch": 1679} {"train_loss": -23.105661392211914, "global_step": 139374, "epoch": 1679} {"train_loss": -22.7557430267334, "global_step": 139375, "epoch": 1679} {"train_loss": -23.465063095092773, "global_step": 139376, "epoch": 1679} {"train_loss": -23.198633193969727, "global_step": 139377, "epoch": 1679} {"train_loss": -23.153606414794922, "global_step": 139378, "epoch": 1679} {"train_loss": -23.186616897583008, "global_step": 139379, "epoch": 1679} {"train_loss": -22.836536407470703, "global_step": 139380, "epoch": 1679} {"train_loss": -22.903629302978516, "global_step": 139381, "epoch": 1679} {"train_loss": -23.179479598999023, "global_step": 139382, "epoch": 1679} {"train_loss": -22.859617233276367, "global_step": 139383, "epoch": 1679} {"train_loss": -22.926578521728516, "global_step": 139384, "epoch": 1679} {"train_loss": -23.0417537689209, "global_step": 139385, "epoch": 1679} {"train_loss": -22.989072799682617, "global_step": 139386, "epoch": 1679} {"train_loss": -23.153465270996094, "global_step": 139387, "epoch": 1679} {"train_loss": -22.89190673828125, "global_step": 139388, "epoch": 1679} {"train_loss": -23.071304321289062, "global_step": 139389, "epoch": 1679} {"train_loss": -23.212039947509766, "global_step": 139390, "epoch": 1679} {"train_loss": -22.98825454711914, "global_step": 139391, "epoch": 1679} {"train_loss": -23.0539608001709, "global_step": 139392, "epoch": 1679} {"train_loss": -22.98383140563965, "global_step": 139393, "epoch": 1679} {"train_loss": -22.860946655273438, "global_step": 139394, "epoch": 1679} {"train_loss": -22.612140655517578, "global_step": 139395, "epoch": 1679} {"train_loss": -22.936237335205078, "global_step": 139396, "epoch": 1679} {"train_loss": -23.48855209350586, "global_step": 139397, "epoch": 1679} {"train_loss": -22.858617782592773, "global_step": 139398, "epoch": 1679} {"train_loss": -23.361391067504883, "global_step": 139399, "epoch": 1679} {"train_loss": -23.462997436523438, "global_step": 139400, "epoch": 1679} {"train_loss": -23.072980880737305, "global_step": 139401, "epoch": 1679} {"train_loss": -22.928110122680664, "global_step": 139402, "epoch": 1679} {"train_loss": -23.010408401489258, "global_step": 139403, "epoch": 1679} {"train_loss": -22.835447311401367, "global_step": 139404, "epoch": 1679} {"train_loss": -23.121379852294922, "global_step": 139405, "epoch": 1679} {"train_loss": -22.828367233276367, "global_step": 139406, "epoch": 1679} {"train_loss": -23.207834243774414, "global_step": 139407, "epoch": 1679} {"train_loss": -23.05208396911621, "global_step": 139408, "epoch": 1679} {"train_loss": -23.0249080657959, "global_step": 139409, "epoch": 1679} {"train_loss": -23.18338394165039, "global_step": 139410, "epoch": 1679} {"train_loss": -23.32114601135254, "global_step": 139411, "epoch": 1679} {"train_loss": -22.91526222229004, "global_step": 139412, "epoch": 1679} {"train_loss": -22.971052169799805, "global_step": 139413, "epoch": 1679} {"train_loss": -23.10717010498047, "global_step": 139414, "epoch": 1679} {"train_loss": -23.21024513244629, "global_step": 139415, "epoch": 1679} {"train_loss": -23.022911071777344, "global_step": 139416, "epoch": 1679} {"train_loss": -22.876602172851562, "global_step": 139417, "epoch": 1679} {"train_loss": -22.72335433959961, "global_step": 139418, "epoch": 1679} {"train_loss": -22.840085983276367, "global_step": 139419, "epoch": 1679} {"train_loss": -22.81514549255371, "global_step": 139420, "epoch": 1679} {"train_loss": -22.556798934936523, "global_step": 139421, "epoch": 1679} {"train_loss": -22.92494773864746, "global_step": 139422, "epoch": 1679} {"train_loss": -22.948591232299805, "global_step": 139423, "epoch": 1679} {"train_loss": -22.88715934753418, "global_step": 139424, "epoch": 1679} {"train_loss": -22.916915893554688, "global_step": 139425, "epoch": 1679} {"train_loss": -23.216018676757812, "global_step": 139426, "epoch": 1679} {"train_loss": -22.72234344482422, "global_step": 139427, "epoch": 1679} {"train_loss": -23.09379768371582, "global_step": 139428, "epoch": 1679} {"train_loss": -23.096933364868164, "global_step": 139429, "epoch": 1679} {"train_loss": -23.126813888549805, "global_step": 139430, "epoch": 1679} {"train_loss": -22.95789909362793, "global_step": 139431, "epoch": 1679} {"train_loss": -23.058324813842773, "global_step": 139432, "epoch": 1679} {"train_loss": -23.173248291015625, "global_step": 139433, "epoch": 1679} {"train_loss": -23.16827964782715, "global_step": 139434, "epoch": 1679} {"train_loss": -23.33973503112793, "global_step": 139435, "epoch": 1679} {"train_loss": -23.148239135742188, "global_step": 139436, "epoch": 1679} {"train_loss": -23.262596130371094, "global_step": 139437, "epoch": 1679} {"train_loss": -23.063600540161133, "global_step": 139438, "epoch": 1679} {"train_loss": -22.96799558616546, "global_step": 139439, "epoch": 1679, "val_loss": 6318933.0} {"train_loss": -22.475000381469727, "global_step": 139440, "epoch": 1680} {"train_loss": -22.95460319519043, "global_step": 139441, "epoch": 1680} {"train_loss": -22.902658462524414, "global_step": 139442, "epoch": 1680} {"train_loss": -23.073532104492188, "global_step": 139443, "epoch": 1680} {"train_loss": -23.045330047607422, "global_step": 139444, "epoch": 1680} {"train_loss": -22.996368408203125, "global_step": 139445, "epoch": 1680} {"train_loss": -23.16639518737793, "global_step": 139446, "epoch": 1680} {"train_loss": -22.79654884338379, "global_step": 139447, "epoch": 1680} {"train_loss": -22.886096954345703, "global_step": 139448, "epoch": 1680} {"train_loss": -22.929161071777344, "global_step": 139449, "epoch": 1680} {"train_loss": -23.009521484375, "global_step": 139450, "epoch": 1680} {"train_loss": -23.139083862304688, "global_step": 139451, "epoch": 1680} {"train_loss": -22.626115798950195, "global_step": 139452, "epoch": 1680} {"train_loss": -22.858339309692383, "global_step": 139453, "epoch": 1680} {"train_loss": -22.730060577392578, "global_step": 139454, "epoch": 1680} {"train_loss": -23.34149742126465, "global_step": 139455, "epoch": 1680} {"train_loss": -23.076623916625977, "global_step": 139456, "epoch": 1680} {"train_loss": -23.006332397460938, "global_step": 139457, "epoch": 1680} {"train_loss": -23.397886276245117, "global_step": 139458, "epoch": 1680} {"train_loss": -23.00270652770996, "global_step": 139459, "epoch": 1680} {"train_loss": -22.710405349731445, "global_step": 139460, "epoch": 1680} {"train_loss": -23.112674713134766, "global_step": 139461, "epoch": 1680} {"train_loss": -23.053573608398438, "global_step": 139462, "epoch": 1680} {"train_loss": -23.195838928222656, "global_step": 139463, "epoch": 1680} {"train_loss": -23.130130767822266, "global_step": 139464, "epoch": 1680} {"train_loss": -22.964519500732422, "global_step": 139465, "epoch": 1680} {"train_loss": -22.74991798400879, "global_step": 139466, "epoch": 1680} {"train_loss": -23.184385299682617, "global_step": 139467, "epoch": 1680} {"train_loss": -23.316303253173828, "global_step": 139468, "epoch": 1680} {"train_loss": -23.008359909057617, "global_step": 139469, "epoch": 1680} {"train_loss": -22.91736602783203, "global_step": 139470, "epoch": 1680} {"train_loss": -23.24725341796875, "global_step": 139471, "epoch": 1680} {"train_loss": -23.224376678466797, "global_step": 139472, "epoch": 1680} {"train_loss": -22.952735900878906, "global_step": 139473, "epoch": 1680} {"train_loss": -22.818721771240234, "global_step": 139474, "epoch": 1680} {"train_loss": -23.305124282836914, "global_step": 139475, "epoch": 1680} {"train_loss": -23.180944442749023, "global_step": 139476, "epoch": 1680} {"train_loss": -23.225553512573242, "global_step": 139477, "epoch": 1680} {"train_loss": -23.1409854888916, "global_step": 139478, "epoch": 1680} {"train_loss": -22.70705223083496, "global_step": 139479, "epoch": 1680} {"train_loss": -22.69411849975586, "global_step": 139480, "epoch": 1680} {"train_loss": -23.02701187133789, "global_step": 139481, "epoch": 1680} {"train_loss": -22.42336082458496, "global_step": 139482, "epoch": 1680} {"train_loss": -23.173778533935547, "global_step": 139483, "epoch": 1680} {"train_loss": -22.51676368713379, "global_step": 139484, "epoch": 1680} {"train_loss": -22.724584579467773, "global_step": 139485, "epoch": 1680} {"train_loss": -23.3436222076416, "global_step": 139486, "epoch": 1680} {"train_loss": -23.244321823120117, "global_step": 139487, "epoch": 1680} {"train_loss": -22.962995529174805, "global_step": 139488, "epoch": 1680} {"train_loss": -22.87662696838379, "global_step": 139489, "epoch": 1680} {"train_loss": -23.197044372558594, "global_step": 139490, "epoch": 1680} {"train_loss": -23.243427276611328, "global_step": 139491, "epoch": 1680} {"train_loss": -22.58165168762207, "global_step": 139492, "epoch": 1680} {"train_loss": -23.15297508239746, "global_step": 139493, "epoch": 1680} {"train_loss": -22.953468322753906, "global_step": 139494, "epoch": 1680} {"train_loss": -23.13083839416504, "global_step": 139495, "epoch": 1680} {"train_loss": -23.02778434753418, "global_step": 139496, "epoch": 1680} {"train_loss": -23.213729858398438, "global_step": 139497, "epoch": 1680} {"train_loss": -22.987937927246094, "global_step": 139498, "epoch": 1680} {"train_loss": -22.950876235961914, "global_step": 139499, "epoch": 1680} {"train_loss": -22.869821548461914, "global_step": 139500, "epoch": 1680} {"train_loss": -23.021095275878906, "global_step": 139501, "epoch": 1680} {"train_loss": -22.96575927734375, "global_step": 139502, "epoch": 1680} {"train_loss": -23.241308212280273, "global_step": 139503, "epoch": 1680} {"train_loss": -23.314104080200195, "global_step": 139504, "epoch": 1680} {"train_loss": -23.17061424255371, "global_step": 139505, "epoch": 1680} {"train_loss": -23.053329467773438, "global_step": 139506, "epoch": 1680} {"train_loss": -23.29404640197754, "global_step": 139507, "epoch": 1680} {"train_loss": -22.874536514282227, "global_step": 139508, "epoch": 1680} {"train_loss": -23.16155433654785, "global_step": 139509, "epoch": 1680} {"train_loss": -23.27354621887207, "global_step": 139510, "epoch": 1680} {"train_loss": -22.837491989135742, "global_step": 139511, "epoch": 1680} {"train_loss": -23.025964736938477, "global_step": 139512, "epoch": 1680} {"train_loss": -22.989151000976562, "global_step": 139513, "epoch": 1680} {"train_loss": -22.994165420532227, "global_step": 139514, "epoch": 1680} {"train_loss": -22.805850982666016, "global_step": 139515, "epoch": 1680} {"train_loss": -23.056262969970703, "global_step": 139516, "epoch": 1680} {"train_loss": -23.3350887298584, "global_step": 139517, "epoch": 1680} {"train_loss": -22.976285934448242, "global_step": 139518, "epoch": 1680} {"train_loss": -22.787919998168945, "global_step": 139519, "epoch": 1680} {"train_loss": -23.042356491088867, "global_step": 139520, "epoch": 1680} {"train_loss": -22.83898162841797, "global_step": 139521, "epoch": 1680} {"train_loss": -22.997422988156238, "global_step": 139522, "epoch": 1680, "val_loss": 6264493.5} {"train_loss": -21.9367618560791, "global_step": 139523, "epoch": 1681} {"train_loss": -22.50377082824707, "global_step": 139524, "epoch": 1681} {"train_loss": -22.3409423828125, "global_step": 139525, "epoch": 1681} {"train_loss": -22.581899642944336, "global_step": 139526, "epoch": 1681} {"train_loss": -22.370426177978516, "global_step": 139527, "epoch": 1681} {"train_loss": -22.959470748901367, "global_step": 139528, "epoch": 1681} {"train_loss": -22.564584732055664, "global_step": 139529, "epoch": 1681} {"train_loss": -22.879304885864258, "global_step": 139530, "epoch": 1681} {"train_loss": -22.78936767578125, "global_step": 139531, "epoch": 1681} {"train_loss": -22.895605087280273, "global_step": 139532, "epoch": 1681} {"train_loss": -22.60847282409668, "global_step": 139533, "epoch": 1681} {"train_loss": -23.383098602294922, "global_step": 139534, "epoch": 1681} {"train_loss": -23.297441482543945, "global_step": 139535, "epoch": 1681} {"train_loss": -22.805206298828125, "global_step": 139536, "epoch": 1681} {"train_loss": -22.856107711791992, "global_step": 139537, "epoch": 1681} {"train_loss": -22.856887817382812, "global_step": 139538, "epoch": 1681} {"train_loss": -23.29157829284668, "global_step": 139539, "epoch": 1681} {"train_loss": -23.109434127807617, "global_step": 139540, "epoch": 1681} {"train_loss": -22.780853271484375, "global_step": 139541, "epoch": 1681} {"train_loss": -22.942941665649414, "global_step": 139542, "epoch": 1681} {"train_loss": -23.303014755249023, "global_step": 139543, "epoch": 1681} {"train_loss": -23.130279541015625, "global_step": 139544, "epoch": 1681} {"train_loss": -23.112953186035156, "global_step": 139545, "epoch": 1681} {"train_loss": -22.90766716003418, "global_step": 139546, "epoch": 1681} {"train_loss": -23.277408599853516, "global_step": 139547, "epoch": 1681} {"train_loss": -22.92107391357422, "global_step": 139548, "epoch": 1681} {"train_loss": -23.049787521362305, "global_step": 139549, "epoch": 1681} {"train_loss": -23.15256690979004, "global_step": 139550, "epoch": 1681} {"train_loss": -23.30626678466797, "global_step": 139551, "epoch": 1681} {"train_loss": -23.136672973632812, "global_step": 139552, "epoch": 1681} {"train_loss": -22.886381149291992, "global_step": 139553, "epoch": 1681} {"train_loss": -23.23526382446289, "global_step": 139554, "epoch": 1681} {"train_loss": -22.90924644470215, "global_step": 139555, "epoch": 1681} {"train_loss": -22.918399810791016, "global_step": 139556, "epoch": 1681} {"train_loss": -22.446136474609375, "global_step": 139557, "epoch": 1681} {"train_loss": -23.003103256225586, "global_step": 139558, "epoch": 1681} {"train_loss": -22.736042022705078, "global_step": 139559, "epoch": 1681} {"train_loss": -22.66608238220215, "global_step": 139560, "epoch": 1681} {"train_loss": -23.158599853515625, "global_step": 139561, "epoch": 1681} {"train_loss": -22.602384567260742, "global_step": 139562, "epoch": 1681} {"train_loss": -22.7302188873291, "global_step": 139563, "epoch": 1681} {"train_loss": -22.62977409362793, "global_step": 139564, "epoch": 1681} {"train_loss": -22.843774795532227, "global_step": 139565, "epoch": 1681} {"train_loss": -22.98154640197754, "global_step": 139566, "epoch": 1681} {"train_loss": -23.047536849975586, "global_step": 139567, "epoch": 1681} {"train_loss": -22.9652156829834, "global_step": 139568, "epoch": 1681} {"train_loss": -22.962696075439453, "global_step": 139569, "epoch": 1681} {"train_loss": -23.093244552612305, "global_step": 139570, "epoch": 1681} {"train_loss": -23.169734954833984, "global_step": 139571, "epoch": 1681} {"train_loss": -23.103965759277344, "global_step": 139572, "epoch": 1681} {"train_loss": -23.438396453857422, "global_step": 139573, "epoch": 1681} {"train_loss": -23.02201271057129, "global_step": 139574, "epoch": 1681} {"train_loss": -23.138715744018555, "global_step": 139575, "epoch": 1681} {"train_loss": -22.897939682006836, "global_step": 139576, "epoch": 1681} {"train_loss": -23.102773666381836, "global_step": 139577, "epoch": 1681} {"train_loss": -23.167295455932617, "global_step": 139578, "epoch": 1681} {"train_loss": -22.973970413208008, "global_step": 139579, "epoch": 1681} {"train_loss": -23.255949020385742, "global_step": 139580, "epoch": 1681} {"train_loss": -22.904399871826172, "global_step": 139581, "epoch": 1681} {"train_loss": -23.250877380371094, "global_step": 139582, "epoch": 1681} {"train_loss": -23.063060760498047, "global_step": 139583, "epoch": 1681} {"train_loss": -22.87760353088379, "global_step": 139584, "epoch": 1681} {"train_loss": -23.272294998168945, "global_step": 139585, "epoch": 1681} {"train_loss": -22.88577651977539, "global_step": 139586, "epoch": 1681} {"train_loss": -23.142810821533203, "global_step": 139587, "epoch": 1681} {"train_loss": -23.180316925048828, "global_step": 139588, "epoch": 1681} {"train_loss": -22.835580825805664, "global_step": 139589, "epoch": 1681} {"train_loss": -23.014204025268555, "global_step": 139590, "epoch": 1681} {"train_loss": -23.373281478881836, "global_step": 139591, "epoch": 1681} {"train_loss": -23.12678337097168, "global_step": 139592, "epoch": 1681} {"train_loss": -23.009679794311523, "global_step": 139593, "epoch": 1681} {"train_loss": -23.122848510742188, "global_step": 139594, "epoch": 1681} {"train_loss": -23.17127799987793, "global_step": 139595, "epoch": 1681} {"train_loss": -23.076215744018555, "global_step": 139596, "epoch": 1681} {"train_loss": -23.088851928710938, "global_step": 139597, "epoch": 1681} {"train_loss": -23.182729721069336, "global_step": 139598, "epoch": 1681} {"train_loss": -23.331369400024414, "global_step": 139599, "epoch": 1681} {"train_loss": -23.208547592163086, "global_step": 139600, "epoch": 1681} {"train_loss": -23.030271530151367, "global_step": 139601, "epoch": 1681} {"train_loss": -23.166606903076172, "global_step": 139602, "epoch": 1681} {"train_loss": -23.01202964782715, "global_step": 139603, "epoch": 1681} {"train_loss": -22.916112899780273, "global_step": 139604, "epoch": 1681} {"train_loss": -22.976312959050556, "global_step": 139605, "epoch": 1681, "val_loss": 6289483.0} {"train_loss": -22.64936637878418, "global_step": 139606, "epoch": 1682} {"train_loss": -22.414655685424805, "global_step": 139607, "epoch": 1682} {"train_loss": -22.349708557128906, "global_step": 139608, "epoch": 1682} {"train_loss": -22.579132080078125, "global_step": 139609, "epoch": 1682} {"train_loss": -22.15477180480957, "global_step": 139610, "epoch": 1682} {"train_loss": -22.188093185424805, "global_step": 139611, "epoch": 1682} {"train_loss": -22.286569595336914, "global_step": 139612, "epoch": 1682} {"train_loss": -22.678892135620117, "global_step": 139613, "epoch": 1682} {"train_loss": -22.378381729125977, "global_step": 139614, "epoch": 1682} {"train_loss": -22.676204681396484, "global_step": 139615, "epoch": 1682} {"train_loss": -22.344223022460938, "global_step": 139616, "epoch": 1682} {"train_loss": -22.552061080932617, "global_step": 139617, "epoch": 1682} {"train_loss": -22.61065673828125, "global_step": 139618, "epoch": 1682} {"train_loss": -22.187349319458008, "global_step": 139619, "epoch": 1682} {"train_loss": -23.043853759765625, "global_step": 139620, "epoch": 1682} {"train_loss": -22.36307144165039, "global_step": 139621, "epoch": 1682} {"train_loss": -22.57054901123047, "global_step": 139622, "epoch": 1682} {"train_loss": -22.86496925354004, "global_step": 139623, "epoch": 1682} {"train_loss": -22.721147537231445, "global_step": 139624, "epoch": 1682} {"train_loss": -22.87213706970215, "global_step": 139625, "epoch": 1682} {"train_loss": -23.06715202331543, "global_step": 139626, "epoch": 1682} {"train_loss": -22.692941665649414, "global_step": 139627, "epoch": 1682} {"train_loss": -23.075672149658203, "global_step": 139628, "epoch": 1682} {"train_loss": -23.038007736206055, "global_step": 139629, "epoch": 1682} {"train_loss": -22.77960777282715, "global_step": 139630, "epoch": 1682} {"train_loss": -22.937707901000977, "global_step": 139631, "epoch": 1682} {"train_loss": -22.810272216796875, "global_step": 139632, "epoch": 1682} {"train_loss": -22.841693878173828, "global_step": 139633, "epoch": 1682} {"train_loss": -23.193265914916992, "global_step": 139634, "epoch": 1682} {"train_loss": -23.185178756713867, "global_step": 139635, "epoch": 1682} {"train_loss": -22.680984497070312, "global_step": 139636, "epoch": 1682} {"train_loss": -22.96994972229004, "global_step": 139637, "epoch": 1682} {"train_loss": -22.901369094848633, "global_step": 139638, "epoch": 1682} {"train_loss": -22.98910903930664, "global_step": 139639, "epoch": 1682} {"train_loss": -23.167091369628906, "global_step": 139640, "epoch": 1682} {"train_loss": -23.11089515686035, "global_step": 139641, "epoch": 1682} {"train_loss": -23.38995933532715, "global_step": 139642, "epoch": 1682} {"train_loss": -22.84256935119629, "global_step": 139643, "epoch": 1682} {"train_loss": -23.208860397338867, "global_step": 139644, "epoch": 1682} {"train_loss": -23.160314559936523, "global_step": 139645, "epoch": 1682} {"train_loss": -22.839101791381836, "global_step": 139646, "epoch": 1682} {"train_loss": -23.116931915283203, "global_step": 139647, "epoch": 1682} {"train_loss": -23.142480850219727, "global_step": 139648, "epoch": 1682} {"train_loss": -22.772268295288086, "global_step": 139649, "epoch": 1682} {"train_loss": -23.10475730895996, "global_step": 139650, "epoch": 1682} {"train_loss": -22.867156982421875, "global_step": 139651, "epoch": 1682} {"train_loss": -23.026029586791992, "global_step": 139652, "epoch": 1682} {"train_loss": -22.781991958618164, "global_step": 139653, "epoch": 1682} {"train_loss": -22.959487915039062, "global_step": 139654, "epoch": 1682} {"train_loss": -23.360483169555664, "global_step": 139655, "epoch": 1682} {"train_loss": -23.14647102355957, "global_step": 139656, "epoch": 1682} {"train_loss": -23.04788589477539, "global_step": 139657, "epoch": 1682} {"train_loss": -23.05173110961914, "global_step": 139658, "epoch": 1682} {"train_loss": -22.78597640991211, "global_step": 139659, "epoch": 1682} {"train_loss": -22.883989334106445, "global_step": 139660, "epoch": 1682} {"train_loss": -23.360227584838867, "global_step": 139661, "epoch": 1682} {"train_loss": -23.04325294494629, "global_step": 139662, "epoch": 1682} {"train_loss": -23.428728103637695, "global_step": 139663, "epoch": 1682} {"train_loss": -23.154584884643555, "global_step": 139664, "epoch": 1682} {"train_loss": -22.865713119506836, "global_step": 139665, "epoch": 1682} {"train_loss": -22.907896041870117, "global_step": 139666, "epoch": 1682} {"train_loss": -22.775562286376953, "global_step": 139667, "epoch": 1682} {"train_loss": -22.82529067993164, "global_step": 139668, "epoch": 1682} {"train_loss": -22.906484603881836, "global_step": 139669, "epoch": 1682} {"train_loss": -22.7393856048584, "global_step": 139670, "epoch": 1682} {"train_loss": -23.227642059326172, "global_step": 139671, "epoch": 1682} {"train_loss": -22.96681785583496, "global_step": 139672, "epoch": 1682} {"train_loss": -22.8565731048584, "global_step": 139673, "epoch": 1682} {"train_loss": -23.124664306640625, "global_step": 139674, "epoch": 1682} {"train_loss": -23.20601463317871, "global_step": 139675, "epoch": 1682} {"train_loss": -23.157499313354492, "global_step": 139676, "epoch": 1682} {"train_loss": -23.207046508789062, "global_step": 139677, "epoch": 1682} {"train_loss": -22.54706382751465, "global_step": 139678, "epoch": 1682} {"train_loss": -22.824909210205078, "global_step": 139679, "epoch": 1682} {"train_loss": -22.687253952026367, "global_step": 139680, "epoch": 1682} {"train_loss": -23.22003173828125, "global_step": 139681, "epoch": 1682} {"train_loss": -23.147470474243164, "global_step": 139682, "epoch": 1682} {"train_loss": -23.081058502197266, "global_step": 139683, "epoch": 1682} {"train_loss": -23.17612648010254, "global_step": 139684, "epoch": 1682} {"train_loss": -23.014944076538086, "global_step": 139685, "epoch": 1682} {"train_loss": -23.288511276245117, "global_step": 139686, "epoch": 1682} {"train_loss": -22.986867904663086, "global_step": 139687, "epoch": 1682} {"train_loss": -22.87154788281544, "global_step": 139688, "epoch": 1682, "val_loss": 6388055.0} {"train_loss": -22.59918212890625, "global_step": 139689, "epoch": 1683} {"train_loss": -22.6343994140625, "global_step": 139690, "epoch": 1683} {"train_loss": -22.8952693939209, "global_step": 139691, "epoch": 1683} {"train_loss": -22.590993881225586, "global_step": 139692, "epoch": 1683} {"train_loss": -22.740951538085938, "global_step": 139693, "epoch": 1683} {"train_loss": -22.6831111907959, "global_step": 139694, "epoch": 1683} {"train_loss": -22.676673889160156, "global_step": 139695, "epoch": 1683} {"train_loss": -22.756027221679688, "global_step": 139696, "epoch": 1683} {"train_loss": -23.074865341186523, "global_step": 139697, "epoch": 1683} {"train_loss": -23.018003463745117, "global_step": 139698, "epoch": 1683} {"train_loss": -22.863805770874023, "global_step": 139699, "epoch": 1683} {"train_loss": -22.982343673706055, "global_step": 139700, "epoch": 1683} {"train_loss": -23.39883804321289, "global_step": 139701, "epoch": 1683} {"train_loss": -23.0109806060791, "global_step": 139702, "epoch": 1683} {"train_loss": -22.98232078552246, "global_step": 139703, "epoch": 1683} {"train_loss": -23.039539337158203, "global_step": 139704, "epoch": 1683} {"train_loss": -22.877246856689453, "global_step": 139705, "epoch": 1683} {"train_loss": -22.79859161376953, "global_step": 139706, "epoch": 1683} {"train_loss": -22.939199447631836, "global_step": 139707, "epoch": 1683} {"train_loss": -22.714628219604492, "global_step": 139708, "epoch": 1683} {"train_loss": -23.422672271728516, "global_step": 139709, "epoch": 1683} {"train_loss": -22.831378936767578, "global_step": 139710, "epoch": 1683} {"train_loss": -23.33740234375, "global_step": 139711, "epoch": 1683} {"train_loss": -23.178998947143555, "global_step": 139712, "epoch": 1683} {"train_loss": -22.643198013305664, "global_step": 139713, "epoch": 1683} {"train_loss": -22.935022354125977, "global_step": 139714, "epoch": 1683} {"train_loss": -23.145050048828125, "global_step": 139715, "epoch": 1683} {"train_loss": -22.85812759399414, "global_step": 139716, "epoch": 1683} {"train_loss": -23.40781021118164, "global_step": 139717, "epoch": 1683} {"train_loss": -22.7703857421875, "global_step": 139718, "epoch": 1683} {"train_loss": -23.053449630737305, "global_step": 139719, "epoch": 1683} {"train_loss": -23.101049423217773, "global_step": 139720, "epoch": 1683} {"train_loss": -22.829509735107422, "global_step": 139721, "epoch": 1683} {"train_loss": -23.06865882873535, "global_step": 139722, "epoch": 1683} {"train_loss": -23.653799057006836, "global_step": 139723, "epoch": 1683} {"train_loss": -22.889638900756836, "global_step": 139724, "epoch": 1683} {"train_loss": -23.113693237304688, "global_step": 139725, "epoch": 1683} {"train_loss": -22.898014068603516, "global_step": 139726, "epoch": 1683} {"train_loss": -22.76923370361328, "global_step": 139727, "epoch": 1683} {"train_loss": -22.882015228271484, "global_step": 139728, "epoch": 1683} {"train_loss": -23.063220977783203, "global_step": 139729, "epoch": 1683} {"train_loss": -23.027225494384766, "global_step": 139730, "epoch": 1683} {"train_loss": -22.875354766845703, "global_step": 139731, "epoch": 1683} {"train_loss": -23.089353561401367, "global_step": 139732, "epoch": 1683} {"train_loss": -22.899381637573242, "global_step": 139733, "epoch": 1683} {"train_loss": -22.757596969604492, "global_step": 139734, "epoch": 1683} {"train_loss": -23.393163681030273, "global_step": 139735, "epoch": 1683} {"train_loss": -22.840539932250977, "global_step": 139736, "epoch": 1683} {"train_loss": -23.008838653564453, "global_step": 139737, "epoch": 1683} {"train_loss": -23.176855087280273, "global_step": 139738, "epoch": 1683} {"train_loss": -23.04290008544922, "global_step": 139739, "epoch": 1683} {"train_loss": -22.860605239868164, "global_step": 139740, "epoch": 1683} {"train_loss": -23.2615966796875, "global_step": 139741, "epoch": 1683} {"train_loss": -23.12495231628418, "global_step": 139742, "epoch": 1683} {"train_loss": -23.079015731811523, "global_step": 139743, "epoch": 1683} {"train_loss": -23.476734161376953, "global_step": 139744, "epoch": 1683} {"train_loss": -22.96881866455078, "global_step": 139745, "epoch": 1683} {"train_loss": -22.607608795166016, "global_step": 139746, "epoch": 1683} {"train_loss": -22.920162200927734, "global_step": 139747, "epoch": 1683} {"train_loss": -22.880064010620117, "global_step": 139748, "epoch": 1683} {"train_loss": -23.052509307861328, "global_step": 139749, "epoch": 1683} {"train_loss": -22.604223251342773, "global_step": 139750, "epoch": 1683} {"train_loss": -22.909757614135742, "global_step": 139751, "epoch": 1683} {"train_loss": -22.84293556213379, "global_step": 139752, "epoch": 1683} {"train_loss": -23.160940170288086, "global_step": 139753, "epoch": 1683} {"train_loss": -23.125286102294922, "global_step": 139754, "epoch": 1683} {"train_loss": -22.83098030090332, "global_step": 139755, "epoch": 1683} {"train_loss": -22.98587989807129, "global_step": 139756, "epoch": 1683} {"train_loss": -23.03656768798828, "global_step": 139757, "epoch": 1683} {"train_loss": -23.29817008972168, "global_step": 139758, "epoch": 1683} {"train_loss": -23.143856048583984, "global_step": 139759, "epoch": 1683} {"train_loss": -22.90741539001465, "global_step": 139760, "epoch": 1683} {"train_loss": -22.880094528198242, "global_step": 139761, "epoch": 1683} {"train_loss": -23.03492546081543, "global_step": 139762, "epoch": 1683} {"train_loss": -23.05731201171875, "global_step": 139763, "epoch": 1683} {"train_loss": -23.175094604492188, "global_step": 139764, "epoch": 1683} {"train_loss": -23.074491500854492, "global_step": 139765, "epoch": 1683} {"train_loss": -22.692359924316406, "global_step": 139766, "epoch": 1683} {"train_loss": -23.036279678344727, "global_step": 139767, "epoch": 1683} {"train_loss": -22.883869171142578, "global_step": 139768, "epoch": 1683} {"train_loss": -23.35523796081543, "global_step": 139769, "epoch": 1683} {"train_loss": -22.803695678710938, "global_step": 139770, "epoch": 1683} {"train_loss": -22.97972378098821, "global_step": 139771, "epoch": 1683, "val_loss": 6353756.0} {"train_loss": -22.430395126342773, "global_step": 139772, "epoch": 1684} {"train_loss": -22.079904556274414, "global_step": 139773, "epoch": 1684} {"train_loss": -22.360258102416992, "global_step": 139774, "epoch": 1684} {"train_loss": -23.324926376342773, "global_step": 139775, "epoch": 1684} {"train_loss": -22.525442123413086, "global_step": 139776, "epoch": 1684} {"train_loss": -22.988174438476562, "global_step": 139777, "epoch": 1684} {"train_loss": -22.84700584411621, "global_step": 139778, "epoch": 1684} {"train_loss": -22.463926315307617, "global_step": 139779, "epoch": 1684} {"train_loss": -22.84596824645996, "global_step": 139780, "epoch": 1684} {"train_loss": -22.932083129882812, "global_step": 139781, "epoch": 1684} {"train_loss": -22.860673904418945, "global_step": 139782, "epoch": 1684} {"train_loss": -22.891653060913086, "global_step": 139783, "epoch": 1684} {"train_loss": -22.921716690063477, "global_step": 139784, "epoch": 1684} {"train_loss": -22.70185661315918, "global_step": 139785, "epoch": 1684} {"train_loss": -23.132858276367188, "global_step": 139786, "epoch": 1684} {"train_loss": -23.102550506591797, "global_step": 139787, "epoch": 1684} {"train_loss": -23.101852416992188, "global_step": 139788, "epoch": 1684} {"train_loss": -22.599740982055664, "global_step": 139789, "epoch": 1684} {"train_loss": -22.984853744506836, "global_step": 139790, "epoch": 1684} {"train_loss": -23.302555084228516, "global_step": 139791, "epoch": 1684} {"train_loss": -23.004915237426758, "global_step": 139792, "epoch": 1684} {"train_loss": -23.359403610229492, "global_step": 139793, "epoch": 1684} {"train_loss": -23.23105812072754, "global_step": 139794, "epoch": 1684} {"train_loss": -23.026500701904297, "global_step": 139795, "epoch": 1684} {"train_loss": -22.918380737304688, "global_step": 139796, "epoch": 1684} {"train_loss": -23.01209831237793, "global_step": 139797, "epoch": 1684} {"train_loss": -23.243432998657227, "global_step": 139798, "epoch": 1684} {"train_loss": -23.319080352783203, "global_step": 139799, "epoch": 1684} {"train_loss": -22.749799728393555, "global_step": 139800, "epoch": 1684} {"train_loss": -23.152292251586914, "global_step": 139801, "epoch": 1684} {"train_loss": -23.6182861328125, "global_step": 139802, "epoch": 1684} {"train_loss": -22.668025970458984, "global_step": 139803, "epoch": 1684} {"train_loss": -22.797754287719727, "global_step": 139804, "epoch": 1684} {"train_loss": -23.0253849029541, "global_step": 139805, "epoch": 1684} {"train_loss": -22.848215103149414, "global_step": 139806, "epoch": 1684} {"train_loss": -22.78336524963379, "global_step": 139807, "epoch": 1684} {"train_loss": -23.01417350769043, "global_step": 139808, "epoch": 1684} {"train_loss": -23.343490600585938, "global_step": 139809, "epoch": 1684} {"train_loss": -22.693586349487305, "global_step": 139810, "epoch": 1684} {"train_loss": -22.986778259277344, "global_step": 139811, "epoch": 1684} {"train_loss": -23.172534942626953, "global_step": 139812, "epoch": 1684} {"train_loss": -23.26251792907715, "global_step": 139813, "epoch": 1684} {"train_loss": -23.452289581298828, "global_step": 139814, "epoch": 1684} {"train_loss": -22.697416305541992, "global_step": 139815, "epoch": 1684} {"train_loss": -23.130277633666992, "global_step": 139816, "epoch": 1684} {"train_loss": -22.969749450683594, "global_step": 139817, "epoch": 1684} {"train_loss": -22.979509353637695, "global_step": 139818, "epoch": 1684} {"train_loss": -23.179704666137695, "global_step": 139819, "epoch": 1684} {"train_loss": -23.27302360534668, "global_step": 139820, "epoch": 1684} {"train_loss": -22.82480239868164, "global_step": 139821, "epoch": 1684} {"train_loss": -23.156648635864258, "global_step": 139822, "epoch": 1684} {"train_loss": -23.061735153198242, "global_step": 139823, "epoch": 1684} {"train_loss": -22.752948760986328, "global_step": 139824, "epoch": 1684} {"train_loss": -22.843463897705078, "global_step": 139825, "epoch": 1684} {"train_loss": -23.336166381835938, "global_step": 139826, "epoch": 1684} {"train_loss": -23.16951560974121, "global_step": 139827, "epoch": 1684} {"train_loss": -22.976926803588867, "global_step": 139828, "epoch": 1684} {"train_loss": -22.88484764099121, "global_step": 139829, "epoch": 1684} {"train_loss": -22.949312210083008, "global_step": 139830, "epoch": 1684} {"train_loss": -22.719154357910156, "global_step": 139831, "epoch": 1684} {"train_loss": -23.0020809173584, "global_step": 139832, "epoch": 1684} {"train_loss": -22.919448852539062, "global_step": 139833, "epoch": 1684} {"train_loss": -23.122350692749023, "global_step": 139834, "epoch": 1684} {"train_loss": -22.897920608520508, "global_step": 139835, "epoch": 1684} {"train_loss": -22.943946838378906, "global_step": 139836, "epoch": 1684} {"train_loss": -22.24452781677246, "global_step": 139837, "epoch": 1684} {"train_loss": -23.198612213134766, "global_step": 139838, "epoch": 1684} {"train_loss": -23.195219039916992, "global_step": 139839, "epoch": 1684} {"train_loss": -22.72589111328125, "global_step": 139840, "epoch": 1684} {"train_loss": -22.803129196166992, "global_step": 139841, "epoch": 1684} {"train_loss": -23.071063995361328, "global_step": 139842, "epoch": 1684} {"train_loss": -23.23464012145996, "global_step": 139843, "epoch": 1684} {"train_loss": -23.451677322387695, "global_step": 139844, "epoch": 1684} {"train_loss": -23.14194679260254, "global_step": 139845, "epoch": 1684} {"train_loss": -23.6531982421875, "global_step": 139846, "epoch": 1684} {"train_loss": -23.3162899017334, "global_step": 139847, "epoch": 1684} {"train_loss": -23.194965362548828, "global_step": 139848, "epoch": 1684} {"train_loss": -23.250123977661133, "global_step": 139849, "epoch": 1684} {"train_loss": -23.198904037475586, "global_step": 139850, "epoch": 1684} {"train_loss": -23.161203384399414, "global_step": 139851, "epoch": 1684} {"train_loss": -23.224822998046875, "global_step": 139852, "epoch": 1684} {"train_loss": -23.214513778686523, "global_step": 139853, "epoch": 1684} {"train_loss": -23.00598845424422, "global_step": 139854, "epoch": 1684, "val_loss": 6285768.5} {"train_loss": -23.281709671020508, "global_step": 139855, "epoch": 1685} {"train_loss": -22.516332626342773, "global_step": 139856, "epoch": 1685} {"train_loss": -22.642730712890625, "global_step": 139857, "epoch": 1685} {"train_loss": -23.182973861694336, "global_step": 139858, "epoch": 1685} {"train_loss": -23.08643913269043, "global_step": 139859, "epoch": 1685} {"train_loss": -22.770732879638672, "global_step": 139860, "epoch": 1685} {"train_loss": -22.917036056518555, "global_step": 139861, "epoch": 1685} {"train_loss": -23.116065979003906, "global_step": 139862, "epoch": 1685} {"train_loss": -22.711246490478516, "global_step": 139863, "epoch": 1685} {"train_loss": -22.64865493774414, "global_step": 139864, "epoch": 1685} {"train_loss": -23.350065231323242, "global_step": 139865, "epoch": 1685} {"train_loss": -22.75899314880371, "global_step": 139866, "epoch": 1685} {"train_loss": -23.041656494140625, "global_step": 139867, "epoch": 1685} {"train_loss": -23.279977798461914, "global_step": 139868, "epoch": 1685} {"train_loss": -22.982559204101562, "global_step": 139869, "epoch": 1685} {"train_loss": -23.413827896118164, "global_step": 139870, "epoch": 1685} {"train_loss": -22.926517486572266, "global_step": 139871, "epoch": 1685} {"train_loss": -22.910470962524414, "global_step": 139872, "epoch": 1685} {"train_loss": -22.96236228942871, "global_step": 139873, "epoch": 1685} {"train_loss": -23.194602966308594, "global_step": 139874, "epoch": 1685} {"train_loss": -22.863828659057617, "global_step": 139875, "epoch": 1685} {"train_loss": -23.016529083251953, "global_step": 139876, "epoch": 1685} {"train_loss": -23.023746490478516, "global_step": 139877, "epoch": 1685} {"train_loss": -23.14186668395996, "global_step": 139878, "epoch": 1685} {"train_loss": -22.862451553344727, "global_step": 139879, "epoch": 1685} {"train_loss": -22.948007583618164, "global_step": 139880, "epoch": 1685} {"train_loss": -23.026077270507812, "global_step": 139881, "epoch": 1685} {"train_loss": -22.805864334106445, "global_step": 139882, "epoch": 1685} {"train_loss": -23.082948684692383, "global_step": 139883, "epoch": 1685} {"train_loss": -23.197803497314453, "global_step": 139884, "epoch": 1685} {"train_loss": -23.320636749267578, "global_step": 139885, "epoch": 1685} {"train_loss": -22.843597412109375, "global_step": 139886, "epoch": 1685} {"train_loss": -22.604795455932617, "global_step": 139887, "epoch": 1685} {"train_loss": -23.024810791015625, "global_step": 139888, "epoch": 1685} {"train_loss": -23.051755905151367, "global_step": 139889, "epoch": 1685} {"train_loss": -22.98684310913086, "global_step": 139890, "epoch": 1685} {"train_loss": -23.275697708129883, "global_step": 139891, "epoch": 1685} {"train_loss": -22.84623146057129, "global_step": 139892, "epoch": 1685} {"train_loss": -23.152555465698242, "global_step": 139893, "epoch": 1685} {"train_loss": -22.93060874938965, "global_step": 139894, "epoch": 1685} {"train_loss": -23.054168701171875, "global_step": 139895, "epoch": 1685} {"train_loss": -23.21370506286621, "global_step": 139896, "epoch": 1685} {"train_loss": -23.125219345092773, "global_step": 139897, "epoch": 1685} {"train_loss": -23.047082901000977, "global_step": 139898, "epoch": 1685} {"train_loss": -22.940587997436523, "global_step": 139899, "epoch": 1685} {"train_loss": -23.295934677124023, "global_step": 139900, "epoch": 1685} {"train_loss": -23.024717330932617, "global_step": 139901, "epoch": 1685} {"train_loss": -23.516300201416016, "global_step": 139902, "epoch": 1685} {"train_loss": -23.129240036010742, "global_step": 139903, "epoch": 1685} {"train_loss": -22.958614349365234, "global_step": 139904, "epoch": 1685} {"train_loss": -23.17771339416504, "global_step": 139905, "epoch": 1685} {"train_loss": -22.911373138427734, "global_step": 139906, "epoch": 1685} {"train_loss": -22.98410987854004, "global_step": 139907, "epoch": 1685} {"train_loss": -22.721830368041992, "global_step": 139908, "epoch": 1685} {"train_loss": -22.933107376098633, "global_step": 139909, "epoch": 1685} {"train_loss": -22.914724349975586, "global_step": 139910, "epoch": 1685} {"train_loss": -23.119333267211914, "global_step": 139911, "epoch": 1685} {"train_loss": -23.037811279296875, "global_step": 139912, "epoch": 1685} {"train_loss": -23.197420120239258, "global_step": 139913, "epoch": 1685} {"train_loss": -22.954294204711914, "global_step": 139914, "epoch": 1685} {"train_loss": -23.478967666625977, "global_step": 139915, "epoch": 1685} {"train_loss": -22.78375816345215, "global_step": 139916, "epoch": 1685} {"train_loss": -23.225278854370117, "global_step": 139917, "epoch": 1685} {"train_loss": -23.34799575805664, "global_step": 139918, "epoch": 1685} {"train_loss": -23.3565731048584, "global_step": 139919, "epoch": 1685} {"train_loss": -23.230859756469727, "global_step": 139920, "epoch": 1685} {"train_loss": -22.823278427124023, "global_step": 139921, "epoch": 1685} {"train_loss": -22.882980346679688, "global_step": 139922, "epoch": 1685} {"train_loss": -23.24970817565918, "global_step": 139923, "epoch": 1685} {"train_loss": -23.169464111328125, "global_step": 139924, "epoch": 1685} {"train_loss": -23.199514389038086, "global_step": 139925, "epoch": 1685} {"train_loss": -23.07453727722168, "global_step": 139926, "epoch": 1685} {"train_loss": -22.96230125427246, "global_step": 139927, "epoch": 1685} {"train_loss": -23.135040283203125, "global_step": 139928, "epoch": 1685} {"train_loss": -23.243825912475586, "global_step": 139929, "epoch": 1685} {"train_loss": -22.836294174194336, "global_step": 139930, "epoch": 1685} {"train_loss": -23.106775283813477, "global_step": 139931, "epoch": 1685} {"train_loss": -22.83897590637207, "global_step": 139932, "epoch": 1685} {"train_loss": -23.060571670532227, "global_step": 139933, "epoch": 1685} {"train_loss": -23.301509857177734, "global_step": 139934, "epoch": 1685} {"train_loss": -22.975540161132812, "global_step": 139935, "epoch": 1685} {"train_loss": -22.715200424194336, "global_step": 139936, "epoch": 1685} {"train_loss": -23.03170525884054, "global_step": 139937, "epoch": 1685, "val_loss": 6344410.5} {"train_loss": -22.1595401763916, "global_step": 139938, "epoch": 1686} {"train_loss": -23.12459373474121, "global_step": 139939, "epoch": 1686} {"train_loss": -22.257471084594727, "global_step": 139940, "epoch": 1686} {"train_loss": -22.479022979736328, "global_step": 139941, "epoch": 1686} {"train_loss": -22.227039337158203, "global_step": 139942, "epoch": 1686} {"train_loss": -22.610233306884766, "global_step": 139943, "epoch": 1686} {"train_loss": -22.759939193725586, "global_step": 139944, "epoch": 1686} {"train_loss": -22.740461349487305, "global_step": 139945, "epoch": 1686} {"train_loss": -22.625436782836914, "global_step": 139946, "epoch": 1686} {"train_loss": -22.53338623046875, "global_step": 139947, "epoch": 1686} {"train_loss": -22.569883346557617, "global_step": 139948, "epoch": 1686} {"train_loss": -22.531536102294922, "global_step": 139949, "epoch": 1686} {"train_loss": -22.3216495513916, "global_step": 139950, "epoch": 1686} {"train_loss": -22.97978973388672, "global_step": 139951, "epoch": 1686} {"train_loss": -22.343778610229492, "global_step": 139952, "epoch": 1686} {"train_loss": -22.793981552124023, "global_step": 139953, "epoch": 1686} {"train_loss": -22.92278480529785, "global_step": 139954, "epoch": 1686} {"train_loss": -22.90081024169922, "global_step": 139955, "epoch": 1686} {"train_loss": -22.69134521484375, "global_step": 139956, "epoch": 1686} {"train_loss": -22.827543258666992, "global_step": 139957, "epoch": 1686} {"train_loss": -23.34489631652832, "global_step": 139958, "epoch": 1686} {"train_loss": -22.959409713745117, "global_step": 139959, "epoch": 1686} {"train_loss": -23.46669578552246, "global_step": 139960, "epoch": 1686} {"train_loss": -22.88531494140625, "global_step": 139961, "epoch": 1686} {"train_loss": -23.164936065673828, "global_step": 139962, "epoch": 1686} {"train_loss": -22.934694290161133, "global_step": 139963, "epoch": 1686} {"train_loss": -23.20185089111328, "global_step": 139964, "epoch": 1686} {"train_loss": -23.163040161132812, "global_step": 139965, "epoch": 1686} {"train_loss": -22.91423225402832, "global_step": 139966, "epoch": 1686} {"train_loss": -22.798242568969727, "global_step": 139967, "epoch": 1686} {"train_loss": -23.487247467041016, "global_step": 139968, "epoch": 1686} {"train_loss": -23.249126434326172, "global_step": 139969, "epoch": 1686} {"train_loss": -23.081491470336914, "global_step": 139970, "epoch": 1686} {"train_loss": -22.85487174987793, "global_step": 139971, "epoch": 1686} {"train_loss": -22.803239822387695, "global_step": 139972, "epoch": 1686} {"train_loss": -23.396432876586914, "global_step": 139973, "epoch": 1686} {"train_loss": -22.93898582458496, "global_step": 139974, "epoch": 1686} {"train_loss": -23.282028198242188, "global_step": 139975, "epoch": 1686} {"train_loss": -23.03323745727539, "global_step": 139976, "epoch": 1686} {"train_loss": -23.260717391967773, "global_step": 139977, "epoch": 1686} {"train_loss": -23.41025733947754, "global_step": 139978, "epoch": 1686} {"train_loss": -22.942459106445312, "global_step": 139979, "epoch": 1686} {"train_loss": -23.171730041503906, "global_step": 139980, "epoch": 1686} {"train_loss": -22.851343154907227, "global_step": 139981, "epoch": 1686} {"train_loss": -23.316116333007812, "global_step": 139982, "epoch": 1686} {"train_loss": -23.18425941467285, "global_step": 139983, "epoch": 1686} {"train_loss": -23.166685104370117, "global_step": 139984, "epoch": 1686} {"train_loss": -23.18702507019043, "global_step": 139985, "epoch": 1686} {"train_loss": -23.182950973510742, "global_step": 139986, "epoch": 1686} {"train_loss": -22.917682647705078, "global_step": 139987, "epoch": 1686} {"train_loss": -22.962940216064453, "global_step": 139988, "epoch": 1686} {"train_loss": -23.22406578063965, "global_step": 139989, "epoch": 1686} {"train_loss": -22.977954864501953, "global_step": 139990, "epoch": 1686} {"train_loss": -23.161951065063477, "global_step": 139991, "epoch": 1686} {"train_loss": -22.95153045654297, "global_step": 139992, "epoch": 1686} {"train_loss": -23.02313232421875, "global_step": 139993, "epoch": 1686} {"train_loss": -23.1877384185791, "global_step": 139994, "epoch": 1686} {"train_loss": -22.931753158569336, "global_step": 139995, "epoch": 1686} {"train_loss": -22.675514221191406, "global_step": 139996, "epoch": 1686} {"train_loss": -22.637638092041016, "global_step": 139997, "epoch": 1686} {"train_loss": -23.092878341674805, "global_step": 139998, "epoch": 1686} {"train_loss": -23.458721160888672, "global_step": 139999, "epoch": 1686} {"train_loss": -23.131582260131836, "global_step": 140000, "epoch": 1686} {"train_loss": -23.052610397338867, "global_step": 140001, "epoch": 1686} {"train_loss": -23.195449829101562, "global_step": 140002, "epoch": 1686} {"train_loss": -23.21980094909668, "global_step": 140003, "epoch": 1686} {"train_loss": -22.792287826538086, "global_step": 140004, "epoch": 1686} {"train_loss": -22.921241760253906, "global_step": 140005, "epoch": 1686} {"train_loss": -23.173147201538086, "global_step": 140006, "epoch": 1686} {"train_loss": -23.378643035888672, "global_step": 140007, "epoch": 1686} {"train_loss": -23.58411979675293, "global_step": 140008, "epoch": 1686} {"train_loss": -23.150930404663086, "global_step": 140009, "epoch": 1686} {"train_loss": -22.880830764770508, "global_step": 140010, "epoch": 1686} {"train_loss": -23.076614379882812, "global_step": 140011, "epoch": 1686} {"train_loss": -23.15752410888672, "global_step": 140012, "epoch": 1686} {"train_loss": -23.29617691040039, "global_step": 140013, "epoch": 1686} {"train_loss": -22.832061767578125, "global_step": 140014, "epoch": 1686} {"train_loss": -23.021268844604492, "global_step": 140015, "epoch": 1686} {"train_loss": -23.25003433227539, "global_step": 140016, "epoch": 1686} {"train_loss": -23.1486759185791, "global_step": 140017, "epoch": 1686} {"train_loss": -22.935495376586914, "global_step": 140018, "epoch": 1686} {"train_loss": -23.06391716003418, "global_step": 140019, "epoch": 1686} {"train_loss": -22.98070080309029, "global_step": 140020, "epoch": 1686, "val_loss": 6300427.5} {"train_loss": -21.864532470703125, "global_step": 140021, "epoch": 1687} {"train_loss": -22.170852661132812, "global_step": 140022, "epoch": 1687} {"train_loss": -22.467010498046875, "global_step": 140023, "epoch": 1687} {"train_loss": -22.62195587158203, "global_step": 140024, "epoch": 1687} {"train_loss": -22.145339965820312, "global_step": 140025, "epoch": 1687} {"train_loss": -22.211101531982422, "global_step": 140026, "epoch": 1687} {"train_loss": -22.838964462280273, "global_step": 140027, "epoch": 1687} {"train_loss": -22.681177139282227, "global_step": 140028, "epoch": 1687} {"train_loss": -22.96971321105957, "global_step": 140029, "epoch": 1687} {"train_loss": -22.40561866760254, "global_step": 140030, "epoch": 1687} {"train_loss": -22.542325973510742, "global_step": 140031, "epoch": 1687} {"train_loss": -22.900146484375, "global_step": 140032, "epoch": 1687} {"train_loss": -22.595876693725586, "global_step": 140033, "epoch": 1687} {"train_loss": -22.804494857788086, "global_step": 140034, "epoch": 1687} {"train_loss": -22.857513427734375, "global_step": 140035, "epoch": 1687} {"train_loss": -22.72196388244629, "global_step": 140036, "epoch": 1687} {"train_loss": -22.760164260864258, "global_step": 140037, "epoch": 1687} {"train_loss": -22.522401809692383, "global_step": 140038, "epoch": 1687} {"train_loss": -22.758955001831055, "global_step": 140039, "epoch": 1687} {"train_loss": -23.039409637451172, "global_step": 140040, "epoch": 1687} {"train_loss": -22.8689022064209, "global_step": 140041, "epoch": 1687} {"train_loss": -22.561304092407227, "global_step": 140042, "epoch": 1687} {"train_loss": -22.844411849975586, "global_step": 140043, "epoch": 1687} {"train_loss": -22.754657745361328, "global_step": 140044, "epoch": 1687} {"train_loss": -23.0471248626709, "global_step": 140045, "epoch": 1687} {"train_loss": -22.838451385498047, "global_step": 140046, "epoch": 1687} {"train_loss": -23.33603858947754, "global_step": 140047, "epoch": 1687} {"train_loss": -23.276103973388672, "global_step": 140048, "epoch": 1687} {"train_loss": -22.779333114624023, "global_step": 140049, "epoch": 1687} {"train_loss": -22.750883102416992, "global_step": 140050, "epoch": 1687} {"train_loss": -22.587690353393555, "global_step": 140051, "epoch": 1687} {"train_loss": -23.126358032226562, "global_step": 140052, "epoch": 1687} {"train_loss": -23.2014102935791, "global_step": 140053, "epoch": 1687} {"train_loss": -23.212934494018555, "global_step": 140054, "epoch": 1687} {"train_loss": -23.049978256225586, "global_step": 140055, "epoch": 1687} {"train_loss": -23.128259658813477, "global_step": 140056, "epoch": 1687} {"train_loss": -23.102357864379883, "global_step": 140057, "epoch": 1687} {"train_loss": -23.29935646057129, "global_step": 140058, "epoch": 1687} {"train_loss": -22.88416862487793, "global_step": 140059, "epoch": 1687} {"train_loss": -23.330280303955078, "global_step": 140060, "epoch": 1687} {"train_loss": -23.01235008239746, "global_step": 140061, "epoch": 1687} {"train_loss": -23.11856460571289, "global_step": 140062, "epoch": 1687} {"train_loss": -23.253421783447266, "global_step": 140063, "epoch": 1687} {"train_loss": -23.20528221130371, "global_step": 140064, "epoch": 1687} {"train_loss": -23.213651657104492, "global_step": 140065, "epoch": 1687} {"train_loss": -22.78754997253418, "global_step": 140066, "epoch": 1687} {"train_loss": -22.517139434814453, "global_step": 140067, "epoch": 1687} {"train_loss": -22.757431030273438, "global_step": 140068, "epoch": 1687} {"train_loss": -23.034515380859375, "global_step": 140069, "epoch": 1687} {"train_loss": -23.239931106567383, "global_step": 140070, "epoch": 1687} {"train_loss": -23.26025390625, "global_step": 140071, "epoch": 1687} {"train_loss": -22.909849166870117, "global_step": 140072, "epoch": 1687} {"train_loss": -22.905887603759766, "global_step": 140073, "epoch": 1687} {"train_loss": -23.102046966552734, "global_step": 140074, "epoch": 1687} {"train_loss": -22.91914176940918, "global_step": 140075, "epoch": 1687} {"train_loss": -22.997098922729492, "global_step": 140076, "epoch": 1687} {"train_loss": -23.17951011657715, "global_step": 140077, "epoch": 1687} {"train_loss": -22.98505973815918, "global_step": 140078, "epoch": 1687} {"train_loss": -23.35382080078125, "global_step": 140079, "epoch": 1687} {"train_loss": -23.245248794555664, "global_step": 140080, "epoch": 1687} {"train_loss": -23.034122467041016, "global_step": 140081, "epoch": 1687} {"train_loss": -23.311826705932617, "global_step": 140082, "epoch": 1687} {"train_loss": -23.264394760131836, "global_step": 140083, "epoch": 1687} {"train_loss": -22.787534713745117, "global_step": 140084, "epoch": 1687} {"train_loss": -23.639245986938477, "global_step": 140085, "epoch": 1687} {"train_loss": -22.835857391357422, "global_step": 140086, "epoch": 1687} {"train_loss": -23.088043212890625, "global_step": 140087, "epoch": 1687} {"train_loss": -23.076358795166016, "global_step": 140088, "epoch": 1687} {"train_loss": -23.10062599182129, "global_step": 140089, "epoch": 1687} {"train_loss": -23.207386016845703, "global_step": 140090, "epoch": 1687} {"train_loss": -23.101215362548828, "global_step": 140091, "epoch": 1687} {"train_loss": -23.137008666992188, "global_step": 140092, "epoch": 1687} {"train_loss": -22.725326538085938, "global_step": 140093, "epoch": 1687} {"train_loss": -23.05515480041504, "global_step": 140094, "epoch": 1687} {"train_loss": -22.95151710510254, "global_step": 140095, "epoch": 1687} {"train_loss": -22.801345825195312, "global_step": 140096, "epoch": 1687} {"train_loss": -23.228811264038086, "global_step": 140097, "epoch": 1687} {"train_loss": -23.1386775970459, "global_step": 140098, "epoch": 1687} {"train_loss": -23.04524040222168, "global_step": 140099, "epoch": 1687} {"train_loss": -23.116785049438477, "global_step": 140100, "epoch": 1687} {"train_loss": -23.376325607299805, "global_step": 140101, "epoch": 1687} {"train_loss": -23.27876853942871, "global_step": 140102, "epoch": 1687} {"train_loss": -22.935052664883166, "global_step": 140103, "epoch": 1687, "val_loss": 6240904.5} {"train_loss": -22.197114944458008, "global_step": 140104, "epoch": 1688} {"train_loss": -22.55245018005371, "global_step": 140105, "epoch": 1688} {"train_loss": -22.413738250732422, "global_step": 140106, "epoch": 1688} {"train_loss": -22.544492721557617, "global_step": 140107, "epoch": 1688} {"train_loss": -22.531076431274414, "global_step": 140108, "epoch": 1688} {"train_loss": -22.987585067749023, "global_step": 140109, "epoch": 1688} {"train_loss": -22.330360412597656, "global_step": 140110, "epoch": 1688} {"train_loss": -22.563213348388672, "global_step": 140111, "epoch": 1688} {"train_loss": -22.382522583007812, "global_step": 140112, "epoch": 1688} {"train_loss": -22.380735397338867, "global_step": 140113, "epoch": 1688} {"train_loss": -22.816730499267578, "global_step": 140114, "epoch": 1688} {"train_loss": -22.93122673034668, "global_step": 140115, "epoch": 1688} {"train_loss": -23.115848541259766, "global_step": 140116, "epoch": 1688} {"train_loss": -22.943439483642578, "global_step": 140117, "epoch": 1688} {"train_loss": -22.714853286743164, "global_step": 140118, "epoch": 1688} {"train_loss": -22.619850158691406, "global_step": 140119, "epoch": 1688} {"train_loss": -22.69371223449707, "global_step": 140120, "epoch": 1688} {"train_loss": -22.942319869995117, "global_step": 140121, "epoch": 1688} {"train_loss": -22.939498901367188, "global_step": 140122, "epoch": 1688} {"train_loss": -22.916046142578125, "global_step": 140123, "epoch": 1688} {"train_loss": -23.05623435974121, "global_step": 140124, "epoch": 1688} {"train_loss": -22.626829147338867, "global_step": 140125, "epoch": 1688} {"train_loss": -22.842641830444336, "global_step": 140126, "epoch": 1688} {"train_loss": -22.99321937561035, "global_step": 140127, "epoch": 1688} {"train_loss": -22.629779815673828, "global_step": 140128, "epoch": 1688} {"train_loss": -23.012693405151367, "global_step": 140129, "epoch": 1688} {"train_loss": -23.027029037475586, "global_step": 140130, "epoch": 1688} {"train_loss": -23.458555221557617, "global_step": 140131, "epoch": 1688} {"train_loss": -22.912870407104492, "global_step": 140132, "epoch": 1688} {"train_loss": -22.82491111755371, "global_step": 140133, "epoch": 1688} {"train_loss": -23.337278366088867, "global_step": 140134, "epoch": 1688} {"train_loss": -23.096906661987305, "global_step": 140135, "epoch": 1688} {"train_loss": -23.25593376159668, "global_step": 140136, "epoch": 1688} {"train_loss": -23.049890518188477, "global_step": 140137, "epoch": 1688} {"train_loss": -22.885360717773438, "global_step": 140138, "epoch": 1688} {"train_loss": -23.104293823242188, "global_step": 140139, "epoch": 1688} {"train_loss": -23.02215576171875, "global_step": 140140, "epoch": 1688} {"train_loss": -22.91017723083496, "global_step": 140141, "epoch": 1688} {"train_loss": -22.80579948425293, "global_step": 140142, "epoch": 1688} {"train_loss": -23.548343658447266, "global_step": 140143, "epoch": 1688} {"train_loss": -22.879037857055664, "global_step": 140144, "epoch": 1688} {"train_loss": -23.198026657104492, "global_step": 140145, "epoch": 1688} {"train_loss": -22.828872680664062, "global_step": 140146, "epoch": 1688} {"train_loss": -22.821683883666992, "global_step": 140147, "epoch": 1688} {"train_loss": -23.32015609741211, "global_step": 140148, "epoch": 1688} {"train_loss": -22.833768844604492, "global_step": 140149, "epoch": 1688} {"train_loss": -23.385229110717773, "global_step": 140150, "epoch": 1688} {"train_loss": -22.765338897705078, "global_step": 140151, "epoch": 1688} {"train_loss": -22.829532623291016, "global_step": 140152, "epoch": 1688} {"train_loss": -23.333703994750977, "global_step": 140153, "epoch": 1688} {"train_loss": -23.074432373046875, "global_step": 140154, "epoch": 1688} {"train_loss": -22.79043197631836, "global_step": 140155, "epoch": 1688} {"train_loss": -23.238080978393555, "global_step": 140156, "epoch": 1688} {"train_loss": -22.8054141998291, "global_step": 140157, "epoch": 1688} {"train_loss": -23.037540435791016, "global_step": 140158, "epoch": 1688} {"train_loss": -22.870529174804688, "global_step": 140159, "epoch": 1688} {"train_loss": -22.825790405273438, "global_step": 140160, "epoch": 1688} {"train_loss": -23.152679443359375, "global_step": 140161, "epoch": 1688} {"train_loss": -23.079294204711914, "global_step": 140162, "epoch": 1688} {"train_loss": -23.231740951538086, "global_step": 140163, "epoch": 1688} {"train_loss": -22.973241806030273, "global_step": 140164, "epoch": 1688} {"train_loss": -22.980506896972656, "global_step": 140165, "epoch": 1688} {"train_loss": -23.42059326171875, "global_step": 140166, "epoch": 1688} {"train_loss": -23.178945541381836, "global_step": 140167, "epoch": 1688} {"train_loss": -23.276655197143555, "global_step": 140168, "epoch": 1688} {"train_loss": -22.735397338867188, "global_step": 140169, "epoch": 1688} {"train_loss": -23.227991104125977, "global_step": 140170, "epoch": 1688} {"train_loss": -23.099416732788086, "global_step": 140171, "epoch": 1688} {"train_loss": -23.532367706298828, "global_step": 140172, "epoch": 1688} {"train_loss": -22.90500259399414, "global_step": 140173, "epoch": 1688} {"train_loss": -23.05672836303711, "global_step": 140174, "epoch": 1688} {"train_loss": -23.08586883544922, "global_step": 140175, "epoch": 1688} {"train_loss": -22.370376586914062, "global_step": 140176, "epoch": 1688} {"train_loss": -23.30049705505371, "global_step": 140177, "epoch": 1688} {"train_loss": -23.022686004638672, "global_step": 140178, "epoch": 1688} {"train_loss": -22.976110458374023, "global_step": 140179, "epoch": 1688} {"train_loss": -23.28898048400879, "global_step": 140180, "epoch": 1688} {"train_loss": -22.980966567993164, "global_step": 140181, "epoch": 1688} {"train_loss": -23.254636764526367, "global_step": 140182, "epoch": 1688} {"train_loss": -23.483154296875, "global_step": 140183, "epoch": 1688} {"train_loss": -23.02419662475586, "global_step": 140184, "epoch": 1688} {"train_loss": -23.323680877685547, "global_step": 140185, "epoch": 1688} {"train_loss": -22.970003909375293, "global_step": 140186, "epoch": 1688, "val_loss": 6315352.0} {"train_loss": -23.150678634643555, "global_step": 140187, "epoch": 1689} {"train_loss": -23.004060745239258, "global_step": 140188, "epoch": 1689} {"train_loss": -23.009552001953125, "global_step": 140189, "epoch": 1689} {"train_loss": -22.943822860717773, "global_step": 140190, "epoch": 1689} {"train_loss": -23.122135162353516, "global_step": 140191, "epoch": 1689} {"train_loss": -23.23531150817871, "global_step": 140192, "epoch": 1689} {"train_loss": -22.772741317749023, "global_step": 140193, "epoch": 1689} {"train_loss": -22.876699447631836, "global_step": 140194, "epoch": 1689} {"train_loss": -23.036495208740234, "global_step": 140195, "epoch": 1689} {"train_loss": -22.988248825073242, "global_step": 140196, "epoch": 1689} {"train_loss": -23.0037841796875, "global_step": 140197, "epoch": 1689} {"train_loss": -22.60481071472168, "global_step": 140198, "epoch": 1689} {"train_loss": -23.354751586914062, "global_step": 140199, "epoch": 1689} {"train_loss": -22.83485221862793, "global_step": 140200, "epoch": 1689} {"train_loss": -22.828121185302734, "global_step": 140201, "epoch": 1689} {"train_loss": -22.599414825439453, "global_step": 140202, "epoch": 1689} {"train_loss": -22.707752227783203, "global_step": 140203, "epoch": 1689} {"train_loss": -22.755491256713867, "global_step": 140204, "epoch": 1689} {"train_loss": -22.76366424560547, "global_step": 140205, "epoch": 1689} {"train_loss": -22.715641021728516, "global_step": 140206, "epoch": 1689} {"train_loss": -22.687345504760742, "global_step": 140207, "epoch": 1689} {"train_loss": -23.021154403686523, "global_step": 140208, "epoch": 1689} {"train_loss": -22.939985275268555, "global_step": 140209, "epoch": 1689} {"train_loss": -22.726051330566406, "global_step": 140210, "epoch": 1689} {"train_loss": -22.950931549072266, "global_step": 140211, "epoch": 1689} {"train_loss": -23.04451560974121, "global_step": 140212, "epoch": 1689} {"train_loss": -23.213178634643555, "global_step": 140213, "epoch": 1689} {"train_loss": -22.890226364135742, "global_step": 140214, "epoch": 1689} {"train_loss": -23.151926040649414, "global_step": 140215, "epoch": 1689} {"train_loss": -23.08461570739746, "global_step": 140216, "epoch": 1689} {"train_loss": -23.034772872924805, "global_step": 140217, "epoch": 1689} {"train_loss": -23.04435157775879, "global_step": 140218, "epoch": 1689} {"train_loss": -23.252878189086914, "global_step": 140219, "epoch": 1689} {"train_loss": -23.2978515625, "global_step": 140220, "epoch": 1689} {"train_loss": -23.17921257019043, "global_step": 140221, "epoch": 1689} {"train_loss": -23.52360725402832, "global_step": 140222, "epoch": 1689} {"train_loss": -23.122465133666992, "global_step": 140223, "epoch": 1689} {"train_loss": -23.089923858642578, "global_step": 140224, "epoch": 1689} {"train_loss": -23.32712173461914, "global_step": 140225, "epoch": 1689} {"train_loss": -22.881757736206055, "global_step": 140226, "epoch": 1689} {"train_loss": -22.56049919128418, "global_step": 140227, "epoch": 1689} {"train_loss": -22.94495391845703, "global_step": 140228, "epoch": 1689} {"train_loss": -23.13742446899414, "global_step": 140229, "epoch": 1689} {"train_loss": -22.9670467376709, "global_step": 140230, "epoch": 1689} {"train_loss": -23.239980697631836, "global_step": 140231, "epoch": 1689} {"train_loss": -23.185462951660156, "global_step": 140232, "epoch": 1689} {"train_loss": -23.144981384277344, "global_step": 140233, "epoch": 1689} {"train_loss": -22.97855567932129, "global_step": 140234, "epoch": 1689} {"train_loss": -23.10879898071289, "global_step": 140235, "epoch": 1689} {"train_loss": -23.3348331451416, "global_step": 140236, "epoch": 1689} {"train_loss": -22.73267936706543, "global_step": 140237, "epoch": 1689} {"train_loss": -23.04373550415039, "global_step": 140238, "epoch": 1689} {"train_loss": -22.615808486938477, "global_step": 140239, "epoch": 1689} {"train_loss": -22.821823120117188, "global_step": 140240, "epoch": 1689} {"train_loss": -22.690412521362305, "global_step": 140241, "epoch": 1689} {"train_loss": -23.224388122558594, "global_step": 140242, "epoch": 1689} {"train_loss": -23.10654640197754, "global_step": 140243, "epoch": 1689} {"train_loss": -23.366924285888672, "global_step": 140244, "epoch": 1689} {"train_loss": -23.080276489257812, "global_step": 140245, "epoch": 1689} {"train_loss": -23.128185272216797, "global_step": 140246, "epoch": 1689} {"train_loss": -23.235036849975586, "global_step": 140247, "epoch": 1689} {"train_loss": -22.892932891845703, "global_step": 140248, "epoch": 1689} {"train_loss": -23.227556228637695, "global_step": 140249, "epoch": 1689} {"train_loss": -23.24049949645996, "global_step": 140250, "epoch": 1689} {"train_loss": -23.02947998046875, "global_step": 140251, "epoch": 1689} {"train_loss": -22.871234893798828, "global_step": 140252, "epoch": 1689} {"train_loss": -23.0402774810791, "global_step": 140253, "epoch": 1689} {"train_loss": -22.82865333557129, "global_step": 140254, "epoch": 1689} {"train_loss": -23.004566192626953, "global_step": 140255, "epoch": 1689} {"train_loss": -23.202085494995117, "global_step": 140256, "epoch": 1689} {"train_loss": -23.04271697998047, "global_step": 140257, "epoch": 1689} {"train_loss": -23.06870460510254, "global_step": 140258, "epoch": 1689} {"train_loss": -22.483556747436523, "global_step": 140259, "epoch": 1689} {"train_loss": -22.949460983276367, "global_step": 140260, "epoch": 1689} {"train_loss": -22.578359603881836, "global_step": 140261, "epoch": 1689} {"train_loss": -23.05597686767578, "global_step": 140262, "epoch": 1689} {"train_loss": -23.22383689880371, "global_step": 140263, "epoch": 1689} {"train_loss": -23.041160583496094, "global_step": 140264, "epoch": 1689} {"train_loss": -23.137054443359375, "global_step": 140265, "epoch": 1689} {"train_loss": -23.302183151245117, "global_step": 140266, "epoch": 1689} {"train_loss": -22.629344940185547, "global_step": 140267, "epoch": 1689} {"train_loss": -22.79109001159668, "global_step": 140268, "epoch": 1689} {"train_loss": -22.99594996348921, "global_step": 140269, "epoch": 1689, "val_loss": 6281631.5} {"train_loss": -21.231456756591797, "global_step": 140270, "epoch": 1690} {"train_loss": -22.480981826782227, "global_step": 140271, "epoch": 1690} {"train_loss": -21.153278350830078, "global_step": 140272, "epoch": 1690} {"train_loss": -22.015457153320312, "global_step": 140273, "epoch": 1690} {"train_loss": -22.010313034057617, "global_step": 140274, "epoch": 1690} {"train_loss": -22.15900993347168, "global_step": 140275, "epoch": 1690} {"train_loss": -22.566059112548828, "global_step": 140276, "epoch": 1690} {"train_loss": -22.191471099853516, "global_step": 140277, "epoch": 1690} {"train_loss": -22.324445724487305, "global_step": 140278, "epoch": 1690} {"train_loss": -22.551563262939453, "global_step": 140279, "epoch": 1690} {"train_loss": -22.322677612304688, "global_step": 140280, "epoch": 1690} {"train_loss": -22.289138793945312, "global_step": 140281, "epoch": 1690} {"train_loss": -21.88233757019043, "global_step": 140282, "epoch": 1690} {"train_loss": -22.737150192260742, "global_step": 140283, "epoch": 1690} {"train_loss": -21.997037887573242, "global_step": 140284, "epoch": 1690} {"train_loss": -22.7121639251709, "global_step": 140285, "epoch": 1690} {"train_loss": -22.701629638671875, "global_step": 140286, "epoch": 1690} {"train_loss": -22.236387252807617, "global_step": 140287, "epoch": 1690} {"train_loss": -22.71381950378418, "global_step": 140288, "epoch": 1690} {"train_loss": -22.56199073791504, "global_step": 140289, "epoch": 1690} {"train_loss": -22.57223892211914, "global_step": 140290, "epoch": 1690} {"train_loss": -22.963245391845703, "global_step": 140291, "epoch": 1690} {"train_loss": -22.768468856811523, "global_step": 140292, "epoch": 1690} {"train_loss": -22.529706954956055, "global_step": 140293, "epoch": 1690} {"train_loss": -22.835304260253906, "global_step": 140294, "epoch": 1690} {"train_loss": -22.38500213623047, "global_step": 140295, "epoch": 1690} {"train_loss": -23.016172409057617, "global_step": 140296, "epoch": 1690} {"train_loss": -22.613147735595703, "global_step": 140297, "epoch": 1690} {"train_loss": -22.929258346557617, "global_step": 140298, "epoch": 1690} {"train_loss": -23.07643699645996, "global_step": 140299, "epoch": 1690} {"train_loss": -22.95844841003418, "global_step": 140300, "epoch": 1690} {"train_loss": -22.538827896118164, "global_step": 140301, "epoch": 1690} {"train_loss": -23.048450469970703, "global_step": 140302, "epoch": 1690} {"train_loss": -22.50084114074707, "global_step": 140303, "epoch": 1690} {"train_loss": -22.711252212524414, "global_step": 140304, "epoch": 1690} {"train_loss": -22.589651107788086, "global_step": 140305, "epoch": 1690} {"train_loss": -23.0031795501709, "global_step": 140306, "epoch": 1690} {"train_loss": -23.24256706237793, "global_step": 140307, "epoch": 1690} {"train_loss": -22.54851531982422, "global_step": 140308, "epoch": 1690} {"train_loss": -22.959962844848633, "global_step": 140309, "epoch": 1690} {"train_loss": -22.973196029663086, "global_step": 140310, "epoch": 1690} {"train_loss": -22.628860473632812, "global_step": 140311, "epoch": 1690} {"train_loss": -23.06460952758789, "global_step": 140312, "epoch": 1690} {"train_loss": -22.547895431518555, "global_step": 140313, "epoch": 1690} {"train_loss": -22.688871383666992, "global_step": 140314, "epoch": 1690} {"train_loss": -22.87165641784668, "global_step": 140315, "epoch": 1690} {"train_loss": -23.100149154663086, "global_step": 140316, "epoch": 1690} {"train_loss": -22.868179321289062, "global_step": 140317, "epoch": 1690} {"train_loss": -23.033552169799805, "global_step": 140318, "epoch": 1690} {"train_loss": -22.955228805541992, "global_step": 140319, "epoch": 1690} {"train_loss": -22.72553062438965, "global_step": 140320, "epoch": 1690} {"train_loss": -22.815074920654297, "global_step": 140321, "epoch": 1690} {"train_loss": -23.042890548706055, "global_step": 140322, "epoch": 1690} {"train_loss": -22.775344848632812, "global_step": 140323, "epoch": 1690} {"train_loss": -23.20526123046875, "global_step": 140324, "epoch": 1690} {"train_loss": -23.09671401977539, "global_step": 140325, "epoch": 1690} {"train_loss": -23.15594482421875, "global_step": 140326, "epoch": 1690} {"train_loss": -22.760549545288086, "global_step": 140327, "epoch": 1690} {"train_loss": -23.140668869018555, "global_step": 140328, "epoch": 1690} {"train_loss": -23.154706954956055, "global_step": 140329, "epoch": 1690} {"train_loss": -22.917652130126953, "global_step": 140330, "epoch": 1690} {"train_loss": -22.765193939208984, "global_step": 140331, "epoch": 1690} {"train_loss": -23.039356231689453, "global_step": 140332, "epoch": 1690} {"train_loss": -22.95500373840332, "global_step": 140333, "epoch": 1690} {"train_loss": -22.940019607543945, "global_step": 140334, "epoch": 1690} {"train_loss": -23.31523895263672, "global_step": 140335, "epoch": 1690} {"train_loss": -23.157276153564453, "global_step": 140336, "epoch": 1690} {"train_loss": -22.883005142211914, "global_step": 140337, "epoch": 1690} {"train_loss": -23.08533477783203, "global_step": 140338, "epoch": 1690} {"train_loss": -22.82240104675293, "global_step": 140339, "epoch": 1690} {"train_loss": -23.072738647460938, "global_step": 140340, "epoch": 1690} {"train_loss": -22.97486686706543, "global_step": 140341, "epoch": 1690} {"train_loss": -23.356901168823242, "global_step": 140342, "epoch": 1690} {"train_loss": -22.984426498413086, "global_step": 140343, "epoch": 1690} {"train_loss": -23.021230697631836, "global_step": 140344, "epoch": 1690} {"train_loss": -23.136274337768555, "global_step": 140345, "epoch": 1690} {"train_loss": -22.94609832763672, "global_step": 140346, "epoch": 1690} {"train_loss": -23.018342971801758, "global_step": 140347, "epoch": 1690} {"train_loss": -22.706457138061523, "global_step": 140348, "epoch": 1690} {"train_loss": -21.95183753967285, "global_step": 140349, "epoch": 1690} {"train_loss": -22.870447158813477, "global_step": 140350, "epoch": 1690} {"train_loss": -22.6005916595459, "global_step": 140351, "epoch": 1690} {"train_loss": -22.720329951090985, "global_step": 140352, "epoch": 1690, "val_loss": 6339477.5} {"train_loss": -22.80861473083496, "global_step": 140353, "epoch": 1691} {"train_loss": -22.71480369567871, "global_step": 140354, "epoch": 1691} {"train_loss": -22.762670516967773, "global_step": 140355, "epoch": 1691} {"train_loss": -22.573930740356445, "global_step": 140356, "epoch": 1691} {"train_loss": -22.4737606048584, "global_step": 140357, "epoch": 1691} {"train_loss": -22.55155372619629, "global_step": 140358, "epoch": 1691} {"train_loss": -22.629610061645508, "global_step": 140359, "epoch": 1691} {"train_loss": -22.617076873779297, "global_step": 140360, "epoch": 1691} {"train_loss": -22.50815200805664, "global_step": 140361, "epoch": 1691} {"train_loss": -22.759199142456055, "global_step": 140362, "epoch": 1691} {"train_loss": -22.519086837768555, "global_step": 140363, "epoch": 1691} {"train_loss": -23.01783561706543, "global_step": 140364, "epoch": 1691} {"train_loss": -22.766523361206055, "global_step": 140365, "epoch": 1691} {"train_loss": -22.63966941833496, "global_step": 140366, "epoch": 1691} {"train_loss": -22.900606155395508, "global_step": 140367, "epoch": 1691} {"train_loss": -22.84148597717285, "global_step": 140368, "epoch": 1691} {"train_loss": -22.773975372314453, "global_step": 140369, "epoch": 1691} {"train_loss": -22.57950782775879, "global_step": 140370, "epoch": 1691} {"train_loss": -23.211698532104492, "global_step": 140371, "epoch": 1691} {"train_loss": -22.965930938720703, "global_step": 140372, "epoch": 1691} {"train_loss": -22.728147506713867, "global_step": 140373, "epoch": 1691} {"train_loss": -22.941585540771484, "global_step": 140374, "epoch": 1691} {"train_loss": -23.040891647338867, "global_step": 140375, "epoch": 1691} {"train_loss": -22.823476791381836, "global_step": 140376, "epoch": 1691} {"train_loss": -22.710086822509766, "global_step": 140377, "epoch": 1691} {"train_loss": -23.197751998901367, "global_step": 140378, "epoch": 1691} {"train_loss": -22.888010025024414, "global_step": 140379, "epoch": 1691} {"train_loss": -22.9608211517334, "global_step": 140380, "epoch": 1691} {"train_loss": -23.15234375, "global_step": 140381, "epoch": 1691} {"train_loss": -23.035320281982422, "global_step": 140382, "epoch": 1691} {"train_loss": -23.129657745361328, "global_step": 140383, "epoch": 1691} {"train_loss": -23.003381729125977, "global_step": 140384, "epoch": 1691} {"train_loss": -23.010255813598633, "global_step": 140385, "epoch": 1691} {"train_loss": -23.047027587890625, "global_step": 140386, "epoch": 1691} {"train_loss": -23.008134841918945, "global_step": 140387, "epoch": 1691} {"train_loss": -23.04129409790039, "global_step": 140388, "epoch": 1691} {"train_loss": -22.994836807250977, "global_step": 140389, "epoch": 1691} {"train_loss": -22.604036331176758, "global_step": 140390, "epoch": 1691} {"train_loss": -22.80875015258789, "global_step": 140391, "epoch": 1691} {"train_loss": -23.134159088134766, "global_step": 140392, "epoch": 1691} {"train_loss": -22.888046264648438, "global_step": 140393, "epoch": 1691} {"train_loss": -23.131637573242188, "global_step": 140394, "epoch": 1691} {"train_loss": -23.27994155883789, "global_step": 140395, "epoch": 1691} {"train_loss": -22.882835388183594, "global_step": 140396, "epoch": 1691} {"train_loss": -22.55885124206543, "global_step": 140397, "epoch": 1691} {"train_loss": -23.0523624420166, "global_step": 140398, "epoch": 1691} {"train_loss": -23.2558536529541, "global_step": 140399, "epoch": 1691} {"train_loss": -22.894433975219727, "global_step": 140400, "epoch": 1691} {"train_loss": -22.853729248046875, "global_step": 140401, "epoch": 1691} {"train_loss": -23.00513458251953, "global_step": 140402, "epoch": 1691} {"train_loss": -23.222414016723633, "global_step": 140403, "epoch": 1691} {"train_loss": -23.0302734375, "global_step": 140404, "epoch": 1691} {"train_loss": -22.878416061401367, "global_step": 140405, "epoch": 1691} {"train_loss": -23.030776977539062, "global_step": 140406, "epoch": 1691} {"train_loss": -23.216123580932617, "global_step": 140407, "epoch": 1691} {"train_loss": -22.671506881713867, "global_step": 140408, "epoch": 1691} {"train_loss": -22.865558624267578, "global_step": 140409, "epoch": 1691} {"train_loss": -23.14650535583496, "global_step": 140410, "epoch": 1691} {"train_loss": -22.90174674987793, "global_step": 140411, "epoch": 1691} {"train_loss": -22.73125648498535, "global_step": 140412, "epoch": 1691} {"train_loss": -22.929059982299805, "global_step": 140413, "epoch": 1691} {"train_loss": -22.832550048828125, "global_step": 140414, "epoch": 1691} {"train_loss": -23.135971069335938, "global_step": 140415, "epoch": 1691} {"train_loss": -22.973234176635742, "global_step": 140416, "epoch": 1691} {"train_loss": -22.71817398071289, "global_step": 140417, "epoch": 1691} {"train_loss": -23.35926628112793, "global_step": 140418, "epoch": 1691} {"train_loss": -23.130844116210938, "global_step": 140419, "epoch": 1691} {"train_loss": -23.115676879882812, "global_step": 140420, "epoch": 1691} {"train_loss": -23.382232666015625, "global_step": 140421, "epoch": 1691} {"train_loss": -23.448312759399414, "global_step": 140422, "epoch": 1691} {"train_loss": -23.60956382751465, "global_step": 140423, "epoch": 1691} {"train_loss": -23.124372482299805, "global_step": 140424, "epoch": 1691} {"train_loss": -23.196714401245117, "global_step": 140425, "epoch": 1691} {"train_loss": -23.187753677368164, "global_step": 140426, "epoch": 1691} {"train_loss": -23.197938919067383, "global_step": 140427, "epoch": 1691} {"train_loss": -23.43037223815918, "global_step": 140428, "epoch": 1691} {"train_loss": -23.47663688659668, "global_step": 140429, "epoch": 1691} {"train_loss": -22.86893081665039, "global_step": 140430, "epoch": 1691} {"train_loss": -23.29084587097168, "global_step": 140431, "epoch": 1691} {"train_loss": -22.935266494750977, "global_step": 140432, "epoch": 1691} {"train_loss": -23.297346115112305, "global_step": 140433, "epoch": 1691} {"train_loss": -23.061017990112305, "global_step": 140434, "epoch": 1691} {"train_loss": -22.966310983680817, "global_step": 140435, "epoch": 1691, "val_loss": 6294228.0} {"train_loss": -21.915407180786133, "global_step": 140436, "epoch": 1692} {"train_loss": -22.41047477722168, "global_step": 140437, "epoch": 1692} {"train_loss": -22.660247802734375, "global_step": 140438, "epoch": 1692} {"train_loss": -22.191930770874023, "global_step": 140439, "epoch": 1692} {"train_loss": -22.145851135253906, "global_step": 140440, "epoch": 1692} {"train_loss": -22.28660774230957, "global_step": 140441, "epoch": 1692} {"train_loss": -22.226823806762695, "global_step": 140442, "epoch": 1692} {"train_loss": -22.243793487548828, "global_step": 140443, "epoch": 1692} {"train_loss": -22.09821128845215, "global_step": 140444, "epoch": 1692} {"train_loss": -22.605329513549805, "global_step": 140445, "epoch": 1692} {"train_loss": -22.658802032470703, "global_step": 140446, "epoch": 1692} {"train_loss": -22.35000991821289, "global_step": 140447, "epoch": 1692} {"train_loss": -22.44441032409668, "global_step": 140448, "epoch": 1692} {"train_loss": -22.53240966796875, "global_step": 140449, "epoch": 1692} {"train_loss": -22.20102882385254, "global_step": 140450, "epoch": 1692} {"train_loss": -22.73320960998535, "global_step": 140451, "epoch": 1692} {"train_loss": -22.648550033569336, "global_step": 140452, "epoch": 1692} {"train_loss": -22.93647575378418, "global_step": 140453, "epoch": 1692} {"train_loss": -22.43109130859375, "global_step": 140454, "epoch": 1692} {"train_loss": -22.59220314025879, "global_step": 140455, "epoch": 1692} {"train_loss": -22.246747970581055, "global_step": 140456, "epoch": 1692} {"train_loss": -23.338287353515625, "global_step": 140457, "epoch": 1692} {"train_loss": -22.835174560546875, "global_step": 140458, "epoch": 1692} {"train_loss": -22.872102737426758, "global_step": 140459, "epoch": 1692} {"train_loss": -22.454111099243164, "global_step": 140460, "epoch": 1692} {"train_loss": -22.925731658935547, "global_step": 140461, "epoch": 1692} {"train_loss": -23.063230514526367, "global_step": 140462, "epoch": 1692} {"train_loss": -23.091114044189453, "global_step": 140463, "epoch": 1692} {"train_loss": -22.804380416870117, "global_step": 140464, "epoch": 1692} {"train_loss": -22.785411834716797, "global_step": 140465, "epoch": 1692} {"train_loss": -23.236295700073242, "global_step": 140466, "epoch": 1692} {"train_loss": -23.146047592163086, "global_step": 140467, "epoch": 1692} {"train_loss": -23.036008834838867, "global_step": 140468, "epoch": 1692} {"train_loss": -22.725522994995117, "global_step": 140469, "epoch": 1692} {"train_loss": -22.76582145690918, "global_step": 140470, "epoch": 1692} {"train_loss": -23.510074615478516, "global_step": 140471, "epoch": 1692} {"train_loss": -22.80717658996582, "global_step": 140472, "epoch": 1692} {"train_loss": -23.20284080505371, "global_step": 140473, "epoch": 1692} {"train_loss": -22.99220085144043, "global_step": 140474, "epoch": 1692} {"train_loss": -22.991992950439453, "global_step": 140475, "epoch": 1692} {"train_loss": -22.83465003967285, "global_step": 140476, "epoch": 1692} {"train_loss": -23.657289505004883, "global_step": 140477, "epoch": 1692} {"train_loss": -23.152660369873047, "global_step": 140478, "epoch": 1692} {"train_loss": -22.94775390625, "global_step": 140479, "epoch": 1692} {"train_loss": -23.24175453186035, "global_step": 140480, "epoch": 1692} {"train_loss": -23.49833106994629, "global_step": 140481, "epoch": 1692} {"train_loss": -23.099668502807617, "global_step": 140482, "epoch": 1692} {"train_loss": -22.517303466796875, "global_step": 140483, "epoch": 1692} {"train_loss": -23.03778076171875, "global_step": 140484, "epoch": 1692} {"train_loss": -22.9163761138916, "global_step": 140485, "epoch": 1692} {"train_loss": -22.52498435974121, "global_step": 140486, "epoch": 1692} {"train_loss": -23.17784309387207, "global_step": 140487, "epoch": 1692} {"train_loss": -22.936254501342773, "global_step": 140488, "epoch": 1692} {"train_loss": -22.94808006286621, "global_step": 140489, "epoch": 1692} {"train_loss": -23.158639907836914, "global_step": 140490, "epoch": 1692} {"train_loss": -23.356714248657227, "global_step": 140491, "epoch": 1692} {"train_loss": -22.757400512695312, "global_step": 140492, "epoch": 1692} {"train_loss": -23.541515350341797, "global_step": 140493, "epoch": 1692} {"train_loss": -23.207416534423828, "global_step": 140494, "epoch": 1692} {"train_loss": -23.177560806274414, "global_step": 140495, "epoch": 1692} {"train_loss": -22.801664352416992, "global_step": 140496, "epoch": 1692} {"train_loss": -23.081945419311523, "global_step": 140497, "epoch": 1692} {"train_loss": -23.28267478942871, "global_step": 140498, "epoch": 1692} {"train_loss": -22.955078125, "global_step": 140499, "epoch": 1692} {"train_loss": -23.105350494384766, "global_step": 140500, "epoch": 1692} {"train_loss": -23.29473304748535, "global_step": 140501, "epoch": 1692} {"train_loss": -23.023101806640625, "global_step": 140502, "epoch": 1692} {"train_loss": -23.097076416015625, "global_step": 140503, "epoch": 1692} {"train_loss": -23.09499168395996, "global_step": 140504, "epoch": 1692} {"train_loss": -22.824771881103516, "global_step": 140505, "epoch": 1692} {"train_loss": -22.757972717285156, "global_step": 140506, "epoch": 1692} {"train_loss": -23.282245635986328, "global_step": 140507, "epoch": 1692} {"train_loss": -22.981822967529297, "global_step": 140508, "epoch": 1692} {"train_loss": -22.68897247314453, "global_step": 140509, "epoch": 1692} {"train_loss": -22.79694938659668, "global_step": 140510, "epoch": 1692} {"train_loss": -23.39961051940918, "global_step": 140511, "epoch": 1692} {"train_loss": -22.66872215270996, "global_step": 140512, "epoch": 1692} {"train_loss": -22.74855613708496, "global_step": 140513, "epoch": 1692} {"train_loss": -22.915815353393555, "global_step": 140514, "epoch": 1692} {"train_loss": -23.010456085205078, "global_step": 140515, "epoch": 1692} {"train_loss": -22.84560203552246, "global_step": 140516, "epoch": 1692} {"train_loss": -22.988313674926758, "global_step": 140517, "epoch": 1692} {"train_loss": -22.867863046117577, "global_step": 140518, "epoch": 1692, "val_loss": 6329813.0} {"train_loss": -21.74445152282715, "global_step": 140519, "epoch": 1693} {"train_loss": -22.92501449584961, "global_step": 140520, "epoch": 1693} {"train_loss": -22.557493209838867, "global_step": 140521, "epoch": 1693} {"train_loss": -22.414443969726562, "global_step": 140522, "epoch": 1693} {"train_loss": -22.707435607910156, "global_step": 140523, "epoch": 1693} {"train_loss": -22.77591896057129, "global_step": 140524, "epoch": 1693} {"train_loss": -22.978551864624023, "global_step": 140525, "epoch": 1693} {"train_loss": -22.98973274230957, "global_step": 140526, "epoch": 1693} {"train_loss": -22.850202560424805, "global_step": 140527, "epoch": 1693} {"train_loss": -22.950490951538086, "global_step": 140528, "epoch": 1693} {"train_loss": -22.966588973999023, "global_step": 140529, "epoch": 1693} {"train_loss": -22.811376571655273, "global_step": 140530, "epoch": 1693} {"train_loss": -23.063344955444336, "global_step": 140531, "epoch": 1693} {"train_loss": -22.78743553161621, "global_step": 140532, "epoch": 1693} {"train_loss": -22.869050979614258, "global_step": 140533, "epoch": 1693} {"train_loss": -22.829313278198242, "global_step": 140534, "epoch": 1693} {"train_loss": -23.227346420288086, "global_step": 140535, "epoch": 1693} {"train_loss": -22.954030990600586, "global_step": 140536, "epoch": 1693} {"train_loss": -22.942625045776367, "global_step": 140537, "epoch": 1693} {"train_loss": -22.9014949798584, "global_step": 140538, "epoch": 1693} {"train_loss": -22.904199600219727, "global_step": 140539, "epoch": 1693} {"train_loss": -22.98744773864746, "global_step": 140540, "epoch": 1693} {"train_loss": -23.02570152282715, "global_step": 140541, "epoch": 1693} {"train_loss": -22.9517879486084, "global_step": 140542, "epoch": 1693} {"train_loss": -23.046035766601562, "global_step": 140543, "epoch": 1693} {"train_loss": -22.6390438079834, "global_step": 140544, "epoch": 1693} {"train_loss": -23.192819595336914, "global_step": 140545, "epoch": 1693} {"train_loss": -22.81497573852539, "global_step": 140546, "epoch": 1693} {"train_loss": -23.434412002563477, "global_step": 140547, "epoch": 1693} {"train_loss": -22.56890869140625, "global_step": 140548, "epoch": 1693} {"train_loss": -23.150564193725586, "global_step": 140549, "epoch": 1693} {"train_loss": -23.26300621032715, "global_step": 140550, "epoch": 1693} {"train_loss": -23.300546646118164, "global_step": 140551, "epoch": 1693} {"train_loss": -22.821208953857422, "global_step": 140552, "epoch": 1693} {"train_loss": -23.05022430419922, "global_step": 140553, "epoch": 1693} {"train_loss": -22.88648796081543, "global_step": 140554, "epoch": 1693} {"train_loss": -23.137521743774414, "global_step": 140555, "epoch": 1693} {"train_loss": -23.43098258972168, "global_step": 140556, "epoch": 1693} {"train_loss": -23.178014755249023, "global_step": 140557, "epoch": 1693} {"train_loss": -23.228797912597656, "global_step": 140558, "epoch": 1693} {"train_loss": -23.008983612060547, "global_step": 140559, "epoch": 1693} {"train_loss": -22.771574020385742, "global_step": 140560, "epoch": 1693} {"train_loss": -23.115278244018555, "global_step": 140561, "epoch": 1693} {"train_loss": -22.90657615661621, "global_step": 140562, "epoch": 1693} {"train_loss": -23.179983139038086, "global_step": 140563, "epoch": 1693} {"train_loss": -22.749664306640625, "global_step": 140564, "epoch": 1693} {"train_loss": -23.055692672729492, "global_step": 140565, "epoch": 1693} {"train_loss": -23.2020263671875, "global_step": 140566, "epoch": 1693} {"train_loss": -22.945083618164062, "global_step": 140567, "epoch": 1693} {"train_loss": -23.03790283203125, "global_step": 140568, "epoch": 1693} {"train_loss": -23.241056442260742, "global_step": 140569, "epoch": 1693} {"train_loss": -23.112045288085938, "global_step": 140570, "epoch": 1693} {"train_loss": -23.291807174682617, "global_step": 140571, "epoch": 1693} {"train_loss": -23.29294776916504, "global_step": 140572, "epoch": 1693} {"train_loss": -22.79940414428711, "global_step": 140573, "epoch": 1693} {"train_loss": -23.501998901367188, "global_step": 140574, "epoch": 1693} {"train_loss": -23.127912521362305, "global_step": 140575, "epoch": 1693} {"train_loss": -23.112058639526367, "global_step": 140576, "epoch": 1693} {"train_loss": -23.301496505737305, "global_step": 140577, "epoch": 1693} {"train_loss": -23.205121994018555, "global_step": 140578, "epoch": 1693} {"train_loss": -22.985416412353516, "global_step": 140579, "epoch": 1693} {"train_loss": -22.799623489379883, "global_step": 140580, "epoch": 1693} {"train_loss": -23.172719955444336, "global_step": 140581, "epoch": 1693} {"train_loss": -22.893924713134766, "global_step": 140582, "epoch": 1693} {"train_loss": -22.96978187561035, "global_step": 140583, "epoch": 1693} {"train_loss": -22.97116470336914, "global_step": 140584, "epoch": 1693} {"train_loss": -22.959272384643555, "global_step": 140585, "epoch": 1693} {"train_loss": -22.870708465576172, "global_step": 140586, "epoch": 1693} {"train_loss": -23.182674407958984, "global_step": 140587, "epoch": 1693} {"train_loss": -23.431196212768555, "global_step": 140588, "epoch": 1693} {"train_loss": -23.362760543823242, "global_step": 140589, "epoch": 1693} {"train_loss": -22.814817428588867, "global_step": 140590, "epoch": 1693} {"train_loss": -23.348735809326172, "global_step": 140591, "epoch": 1693} {"train_loss": -22.566617965698242, "global_step": 140592, "epoch": 1693} {"train_loss": -23.360219955444336, "global_step": 140593, "epoch": 1693} {"train_loss": -23.056110382080078, "global_step": 140594, "epoch": 1693} {"train_loss": -22.835948944091797, "global_step": 140595, "epoch": 1693} {"train_loss": -22.78055191040039, "global_step": 140596, "epoch": 1693} {"train_loss": -23.01399040222168, "global_step": 140597, "epoch": 1693} {"train_loss": -22.842161178588867, "global_step": 140598, "epoch": 1693} {"train_loss": -23.087772369384766, "global_step": 140599, "epoch": 1693} {"train_loss": -23.02803611755371, "global_step": 140600, "epoch": 1693} {"train_loss": -22.991218406033802, "global_step": 140601, "epoch": 1693, "val_loss": 6337400.5} {"train_loss": -22.774755477905273, "global_step": 140602, "epoch": 1694} {"train_loss": -22.260498046875, "global_step": 140603, "epoch": 1694} {"train_loss": -23.10109519958496, "global_step": 140604, "epoch": 1694} {"train_loss": -22.83515167236328, "global_step": 140605, "epoch": 1694} {"train_loss": -22.65961456298828, "global_step": 140606, "epoch": 1694} {"train_loss": -22.96907615661621, "global_step": 140607, "epoch": 1694} {"train_loss": -22.782150268554688, "global_step": 140608, "epoch": 1694} {"train_loss": -22.78338623046875, "global_step": 140609, "epoch": 1694} {"train_loss": -23.169660568237305, "global_step": 140610, "epoch": 1694} {"train_loss": -23.13661766052246, "global_step": 140611, "epoch": 1694} {"train_loss": -23.157459259033203, "global_step": 140612, "epoch": 1694} {"train_loss": -23.191015243530273, "global_step": 140613, "epoch": 1694} {"train_loss": -23.120227813720703, "global_step": 140614, "epoch": 1694} {"train_loss": -22.9880428314209, "global_step": 140615, "epoch": 1694} {"train_loss": -22.988174438476562, "global_step": 140616, "epoch": 1694} {"train_loss": -22.909395217895508, "global_step": 140617, "epoch": 1694} {"train_loss": -23.251638412475586, "global_step": 140618, "epoch": 1694} {"train_loss": -22.696577072143555, "global_step": 140619, "epoch": 1694} {"train_loss": -22.994937896728516, "global_step": 140620, "epoch": 1694} {"train_loss": -23.140310287475586, "global_step": 140621, "epoch": 1694} {"train_loss": -23.056066513061523, "global_step": 140622, "epoch": 1694} {"train_loss": -23.621335983276367, "global_step": 140623, "epoch": 1694} {"train_loss": -23.223554611206055, "global_step": 140624, "epoch": 1694} {"train_loss": -23.057010650634766, "global_step": 140625, "epoch": 1694} {"train_loss": -23.48153305053711, "global_step": 140626, "epoch": 1694} {"train_loss": -23.17281150817871, "global_step": 140627, "epoch": 1694} {"train_loss": -22.754980087280273, "global_step": 140628, "epoch": 1694} {"train_loss": -22.926666259765625, "global_step": 140629, "epoch": 1694} {"train_loss": -23.302770614624023, "global_step": 140630, "epoch": 1694} {"train_loss": -23.05537986755371, "global_step": 140631, "epoch": 1694} {"train_loss": -23.31241798400879, "global_step": 140632, "epoch": 1694} {"train_loss": -22.941553115844727, "global_step": 140633, "epoch": 1694} {"train_loss": -22.89837646484375, "global_step": 140634, "epoch": 1694} {"train_loss": -22.966646194458008, "global_step": 140635, "epoch": 1694} {"train_loss": -23.294334411621094, "global_step": 140636, "epoch": 1694} {"train_loss": -23.264951705932617, "global_step": 140637, "epoch": 1694} {"train_loss": -23.393129348754883, "global_step": 140638, "epoch": 1694} {"train_loss": -23.188268661499023, "global_step": 140639, "epoch": 1694} {"train_loss": -23.19942283630371, "global_step": 140640, "epoch": 1694} {"train_loss": -23.33315658569336, "global_step": 140641, "epoch": 1694} {"train_loss": -23.175540924072266, "global_step": 140642, "epoch": 1694} {"train_loss": -23.31468391418457, "global_step": 140643, "epoch": 1694} {"train_loss": -22.61488914489746, "global_step": 140644, "epoch": 1694} {"train_loss": -22.635604858398438, "global_step": 140645, "epoch": 1694} {"train_loss": -23.15354347229004, "global_step": 140646, "epoch": 1694} {"train_loss": -23.255395889282227, "global_step": 140647, "epoch": 1694} {"train_loss": -22.820493698120117, "global_step": 140648, "epoch": 1694} {"train_loss": -23.26502799987793, "global_step": 140649, "epoch": 1694} {"train_loss": -22.88315773010254, "global_step": 140650, "epoch": 1694} {"train_loss": -23.33479881286621, "global_step": 140651, "epoch": 1694} {"train_loss": -23.216358184814453, "global_step": 140652, "epoch": 1694} {"train_loss": -22.7861385345459, "global_step": 140653, "epoch": 1694} {"train_loss": -23.101505279541016, "global_step": 140654, "epoch": 1694} {"train_loss": -22.801870346069336, "global_step": 140655, "epoch": 1694} {"train_loss": -23.02497673034668, "global_step": 140656, "epoch": 1694} {"train_loss": -22.966672897338867, "global_step": 140657, "epoch": 1694} {"train_loss": -23.24863624572754, "global_step": 140658, "epoch": 1694} {"train_loss": -23.150745391845703, "global_step": 140659, "epoch": 1694} {"train_loss": -23.33355712890625, "global_step": 140660, "epoch": 1694} {"train_loss": -22.769079208374023, "global_step": 140661, "epoch": 1694} {"train_loss": -22.567419052124023, "global_step": 140662, "epoch": 1694} {"train_loss": -23.109210968017578, "global_step": 140663, "epoch": 1694} {"train_loss": -22.905197143554688, "global_step": 140664, "epoch": 1694} {"train_loss": -22.789642333984375, "global_step": 140665, "epoch": 1694} {"train_loss": -22.787683486938477, "global_step": 140666, "epoch": 1694} {"train_loss": -23.19336700439453, "global_step": 140667, "epoch": 1694} {"train_loss": -22.725862503051758, "global_step": 140668, "epoch": 1694} {"train_loss": -23.584442138671875, "global_step": 140669, "epoch": 1694} {"train_loss": -23.01628303527832, "global_step": 140670, "epoch": 1694} {"train_loss": -23.05156707763672, "global_step": 140671, "epoch": 1694} {"train_loss": -22.966751098632812, "global_step": 140672, "epoch": 1694} {"train_loss": -23.10947608947754, "global_step": 140673, "epoch": 1694} {"train_loss": -22.874204635620117, "global_step": 140674, "epoch": 1694} {"train_loss": -22.901445388793945, "global_step": 140675, "epoch": 1694} {"train_loss": -23.195274353027344, "global_step": 140676, "epoch": 1694} {"train_loss": -23.11203384399414, "global_step": 140677, "epoch": 1694} {"train_loss": -22.979162216186523, "global_step": 140678, "epoch": 1694} {"train_loss": -23.214841842651367, "global_step": 140679, "epoch": 1694} {"train_loss": -23.200056076049805, "global_step": 140680, "epoch": 1694} {"train_loss": -23.0488224029541, "global_step": 140681, "epoch": 1694} {"train_loss": -23.304731369018555, "global_step": 140682, "epoch": 1694} {"train_loss": -23.73619270324707, "global_step": 140683, "epoch": 1694} {"train_loss": -23.063390754791627, "global_step": 140684, "epoch": 1694, "val_loss": 6321933.5} {"train_loss": -22.928133010864258, "global_step": 140685, "epoch": 1695} {"train_loss": -22.69264030456543, "global_step": 140686, "epoch": 1695} {"train_loss": -22.57549285888672, "global_step": 140687, "epoch": 1695} {"train_loss": -23.103742599487305, "global_step": 140688, "epoch": 1695} {"train_loss": -23.132415771484375, "global_step": 140689, "epoch": 1695} {"train_loss": -22.813861846923828, "global_step": 140690, "epoch": 1695} {"train_loss": -22.931001663208008, "global_step": 140691, "epoch": 1695} {"train_loss": -23.122756958007812, "global_step": 140692, "epoch": 1695} {"train_loss": -22.788259506225586, "global_step": 140693, "epoch": 1695} {"train_loss": -23.08002281188965, "global_step": 140694, "epoch": 1695} {"train_loss": -23.367263793945312, "global_step": 140695, "epoch": 1695} {"train_loss": -22.862932205200195, "global_step": 140696, "epoch": 1695} {"train_loss": -23.12691307067871, "global_step": 140697, "epoch": 1695} {"train_loss": -23.13212776184082, "global_step": 140698, "epoch": 1695} {"train_loss": -23.05678367614746, "global_step": 140699, "epoch": 1695} {"train_loss": -23.4052791595459, "global_step": 140700, "epoch": 1695} {"train_loss": -22.573394775390625, "global_step": 140701, "epoch": 1695} {"train_loss": -23.177766799926758, "global_step": 140702, "epoch": 1695} {"train_loss": -23.117849349975586, "global_step": 140703, "epoch": 1695} {"train_loss": -23.067934036254883, "global_step": 140704, "epoch": 1695} {"train_loss": -22.808486938476562, "global_step": 140705, "epoch": 1695} {"train_loss": -23.261478424072266, "global_step": 140706, "epoch": 1695} {"train_loss": -22.939809799194336, "global_step": 140707, "epoch": 1695} {"train_loss": -22.968347549438477, "global_step": 140708, "epoch": 1695} {"train_loss": -23.024728775024414, "global_step": 140709, "epoch": 1695} {"train_loss": -23.255023956298828, "global_step": 140710, "epoch": 1695} {"train_loss": -22.92547035217285, "global_step": 140711, "epoch": 1695} {"train_loss": -23.07428741455078, "global_step": 140712, "epoch": 1695} {"train_loss": -23.006072998046875, "global_step": 140713, "epoch": 1695} {"train_loss": -22.8539981842041, "global_step": 140714, "epoch": 1695} {"train_loss": -23.00482749938965, "global_step": 140715, "epoch": 1695} {"train_loss": -22.966089248657227, "global_step": 140716, "epoch": 1695} {"train_loss": -23.16046714782715, "global_step": 140717, "epoch": 1695} {"train_loss": -23.15770721435547, "global_step": 140718, "epoch": 1695} {"train_loss": -22.932302474975586, "global_step": 140719, "epoch": 1695} {"train_loss": -23.248777389526367, "global_step": 140720, "epoch": 1695} {"train_loss": -23.53571128845215, "global_step": 140721, "epoch": 1695} {"train_loss": -23.274213790893555, "global_step": 140722, "epoch": 1695} {"train_loss": -23.07305335998535, "global_step": 140723, "epoch": 1695} {"train_loss": -22.84386444091797, "global_step": 140724, "epoch": 1695} {"train_loss": -23.067289352416992, "global_step": 140725, "epoch": 1695} {"train_loss": -23.0905704498291, "global_step": 140726, "epoch": 1695} {"train_loss": -22.88089370727539, "global_step": 140727, "epoch": 1695} {"train_loss": -22.689653396606445, "global_step": 140728, "epoch": 1695} {"train_loss": -22.80999183654785, "global_step": 140729, "epoch": 1695} {"train_loss": -23.042699813842773, "global_step": 140730, "epoch": 1695} {"train_loss": -22.928380966186523, "global_step": 140731, "epoch": 1695} {"train_loss": -22.667497634887695, "global_step": 140732, "epoch": 1695} {"train_loss": -22.857276916503906, "global_step": 140733, "epoch": 1695} {"train_loss": -23.030475616455078, "global_step": 140734, "epoch": 1695} {"train_loss": -23.44968605041504, "global_step": 140735, "epoch": 1695} {"train_loss": -22.9713191986084, "global_step": 140736, "epoch": 1695} {"train_loss": -23.160978317260742, "global_step": 140737, "epoch": 1695} {"train_loss": -23.062101364135742, "global_step": 140738, "epoch": 1695} {"train_loss": -22.91756248474121, "global_step": 140739, "epoch": 1695} {"train_loss": -23.06551170349121, "global_step": 140740, "epoch": 1695} {"train_loss": -23.20296287536621, "global_step": 140741, "epoch": 1695} {"train_loss": -22.91286277770996, "global_step": 140742, "epoch": 1695} {"train_loss": -22.749526977539062, "global_step": 140743, "epoch": 1695} {"train_loss": -23.126638412475586, "global_step": 140744, "epoch": 1695} {"train_loss": -22.72584342956543, "global_step": 140745, "epoch": 1695} {"train_loss": -22.9323673248291, "global_step": 140746, "epoch": 1695} {"train_loss": -23.1594295501709, "global_step": 140747, "epoch": 1695} {"train_loss": -23.16497039794922, "global_step": 140748, "epoch": 1695} {"train_loss": -22.812957763671875, "global_step": 140749, "epoch": 1695} {"train_loss": -22.91098403930664, "global_step": 140750, "epoch": 1695} {"train_loss": -22.93180274963379, "global_step": 140751, "epoch": 1695} {"train_loss": -23.200109481811523, "global_step": 140752, "epoch": 1695} {"train_loss": -23.54494857788086, "global_step": 140753, "epoch": 1695} {"train_loss": -23.03754234313965, "global_step": 140754, "epoch": 1695} {"train_loss": -23.218420028686523, "global_step": 140755, "epoch": 1695} {"train_loss": -23.060163497924805, "global_step": 140756, "epoch": 1695} {"train_loss": -23.539459228515625, "global_step": 140757, "epoch": 1695} {"train_loss": -23.045969009399414, "global_step": 140758, "epoch": 1695} {"train_loss": -22.876678466796875, "global_step": 140759, "epoch": 1695} {"train_loss": -23.234739303588867, "global_step": 140760, "epoch": 1695} {"train_loss": -23.053327560424805, "global_step": 140761, "epoch": 1695} {"train_loss": -22.962133407592773, "global_step": 140762, "epoch": 1695} {"train_loss": -22.687631607055664, "global_step": 140763, "epoch": 1695} {"train_loss": -22.778797149658203, "global_step": 140764, "epoch": 1695} {"train_loss": -23.29551887512207, "global_step": 140765, "epoch": 1695} {"train_loss": -22.756261825561523, "global_step": 140766, "epoch": 1695} {"train_loss": -23.007543517882567, "global_step": 140767, "epoch": 1695, "val_loss": 6245936.0} {"train_loss": -20.340850830078125, "global_step": 140768, "epoch": 1696} {"train_loss": -22.112842559814453, "global_step": 140769, "epoch": 1696} {"train_loss": -22.294578552246094, "global_step": 140770, "epoch": 1696} {"train_loss": -21.631589889526367, "global_step": 140771, "epoch": 1696} {"train_loss": -21.670764923095703, "global_step": 140772, "epoch": 1696} {"train_loss": -21.52431297302246, "global_step": 140773, "epoch": 1696} {"train_loss": -22.131484985351562, "global_step": 140774, "epoch": 1696} {"train_loss": -22.436328887939453, "global_step": 140775, "epoch": 1696} {"train_loss": -22.2403564453125, "global_step": 140776, "epoch": 1696} {"train_loss": -22.38084602355957, "global_step": 140777, "epoch": 1696} {"train_loss": -22.300321578979492, "global_step": 140778, "epoch": 1696} {"train_loss": -22.452749252319336, "global_step": 140779, "epoch": 1696} {"train_loss": -22.001331329345703, "global_step": 140780, "epoch": 1696} {"train_loss": -22.48872184753418, "global_step": 140781, "epoch": 1696} {"train_loss": -22.792070388793945, "global_step": 140782, "epoch": 1696} {"train_loss": -22.361845016479492, "global_step": 140783, "epoch": 1696} {"train_loss": -22.507545471191406, "global_step": 140784, "epoch": 1696} {"train_loss": -22.32924461364746, "global_step": 140785, "epoch": 1696} {"train_loss": -22.77242660522461, "global_step": 140786, "epoch": 1696} {"train_loss": -22.57439613342285, "global_step": 140787, "epoch": 1696} {"train_loss": -22.532230377197266, "global_step": 140788, "epoch": 1696} {"train_loss": -22.441389083862305, "global_step": 140789, "epoch": 1696} {"train_loss": -22.281665802001953, "global_step": 140790, "epoch": 1696} {"train_loss": -22.558252334594727, "global_step": 140791, "epoch": 1696} {"train_loss": -22.870887756347656, "global_step": 140792, "epoch": 1696} {"train_loss": -22.858388900756836, "global_step": 140793, "epoch": 1696} {"train_loss": -22.675901412963867, "global_step": 140794, "epoch": 1696} {"train_loss": -22.703571319580078, "global_step": 140795, "epoch": 1696} {"train_loss": -22.440006256103516, "global_step": 140796, "epoch": 1696} {"train_loss": -22.789827346801758, "global_step": 140797, "epoch": 1696} {"train_loss": -23.116544723510742, "global_step": 140798, "epoch": 1696} {"train_loss": -23.024179458618164, "global_step": 140799, "epoch": 1696} {"train_loss": -23.135501861572266, "global_step": 140800, "epoch": 1696} {"train_loss": -23.230295181274414, "global_step": 140801, "epoch": 1696} {"train_loss": -22.660400390625, "global_step": 140802, "epoch": 1696} {"train_loss": -22.867807388305664, "global_step": 140803, "epoch": 1696} {"train_loss": -23.121091842651367, "global_step": 140804, "epoch": 1696} {"train_loss": -23.21251678466797, "global_step": 140805, "epoch": 1696} {"train_loss": -23.177778244018555, "global_step": 140806, "epoch": 1696} {"train_loss": -23.139368057250977, "global_step": 140807, "epoch": 1696} {"train_loss": -23.198331832885742, "global_step": 140808, "epoch": 1696} {"train_loss": -23.326797485351562, "global_step": 140809, "epoch": 1696} {"train_loss": -23.0753173828125, "global_step": 140810, "epoch": 1696} {"train_loss": -23.243423461914062, "global_step": 140811, "epoch": 1696} {"train_loss": -22.902536392211914, "global_step": 140812, "epoch": 1696} {"train_loss": -23.245433807373047, "global_step": 140813, "epoch": 1696} {"train_loss": -22.878461837768555, "global_step": 140814, "epoch": 1696} {"train_loss": -22.96270179748535, "global_step": 140815, "epoch": 1696} {"train_loss": -22.778711318969727, "global_step": 140816, "epoch": 1696} {"train_loss": -23.49627113342285, "global_step": 140817, "epoch": 1696} {"train_loss": -22.7803955078125, "global_step": 140818, "epoch": 1696} {"train_loss": -22.87354850769043, "global_step": 140819, "epoch": 1696} {"train_loss": -23.322647094726562, "global_step": 140820, "epoch": 1696} {"train_loss": -22.660573959350586, "global_step": 140821, "epoch": 1696} {"train_loss": -23.233789443969727, "global_step": 140822, "epoch": 1696} {"train_loss": -23.192094802856445, "global_step": 140823, "epoch": 1696} {"train_loss": -22.82600975036621, "global_step": 140824, "epoch": 1696} {"train_loss": -22.469812393188477, "global_step": 140825, "epoch": 1696} {"train_loss": -22.482145309448242, "global_step": 140826, "epoch": 1696} {"train_loss": -22.90673065185547, "global_step": 140827, "epoch": 1696} {"train_loss": -22.523624420166016, "global_step": 140828, "epoch": 1696} {"train_loss": -23.107681274414062, "global_step": 140829, "epoch": 1696} {"train_loss": -22.734777450561523, "global_step": 140830, "epoch": 1696} {"train_loss": -22.6530818939209, "global_step": 140831, "epoch": 1696} {"train_loss": -23.180173873901367, "global_step": 140832, "epoch": 1696} {"train_loss": -23.406850814819336, "global_step": 140833, "epoch": 1696} {"train_loss": -22.55977439880371, "global_step": 140834, "epoch": 1696} {"train_loss": -22.831758499145508, "global_step": 140835, "epoch": 1696} {"train_loss": -23.139942169189453, "global_step": 140836, "epoch": 1696} {"train_loss": -22.8253231048584, "global_step": 140837, "epoch": 1696} {"train_loss": -23.228567123413086, "global_step": 140838, "epoch": 1696} {"train_loss": -23.368003845214844, "global_step": 140839, "epoch": 1696} {"train_loss": -23.106111526489258, "global_step": 140840, "epoch": 1696} {"train_loss": -22.92775535583496, "global_step": 140841, "epoch": 1696} {"train_loss": -23.048925399780273, "global_step": 140842, "epoch": 1696} {"train_loss": -23.269020080566406, "global_step": 140843, "epoch": 1696} {"train_loss": -23.714658737182617, "global_step": 140844, "epoch": 1696} {"train_loss": -22.76017951965332, "global_step": 140845, "epoch": 1696} {"train_loss": -22.997541427612305, "global_step": 140846, "epoch": 1696} {"train_loss": -23.181339263916016, "global_step": 140847, "epoch": 1696} {"train_loss": -22.86548614501953, "global_step": 140848, "epoch": 1696} {"train_loss": -23.106725692749023, "global_step": 140849, "epoch": 1696} {"train_loss": -22.774534547185322, "global_step": 140850, "epoch": 1696, "val_loss": 6245526.5} {"train_loss": -22.750654220581055, "global_step": 140851, "epoch": 1697} {"train_loss": -22.594776153564453, "global_step": 140852, "epoch": 1697} {"train_loss": -22.881200790405273, "global_step": 140853, "epoch": 1697} {"train_loss": -23.023223876953125, "global_step": 140854, "epoch": 1697} {"train_loss": -22.964921951293945, "global_step": 140855, "epoch": 1697} {"train_loss": -22.996198654174805, "global_step": 140856, "epoch": 1697} {"train_loss": -22.676776885986328, "global_step": 140857, "epoch": 1697} {"train_loss": -23.123004913330078, "global_step": 140858, "epoch": 1697} {"train_loss": -23.084775924682617, "global_step": 140859, "epoch": 1697} {"train_loss": -22.954099655151367, "global_step": 140860, "epoch": 1697} {"train_loss": -23.335124969482422, "global_step": 140861, "epoch": 1697} {"train_loss": -22.99932098388672, "global_step": 140862, "epoch": 1697} {"train_loss": -23.078977584838867, "global_step": 140863, "epoch": 1697} {"train_loss": -22.292116165161133, "global_step": 140864, "epoch": 1697} {"train_loss": -23.065017700195312, "global_step": 140865, "epoch": 1697} {"train_loss": -23.004262924194336, "global_step": 140866, "epoch": 1697} {"train_loss": -23.154455184936523, "global_step": 140867, "epoch": 1697} {"train_loss": -22.987714767456055, "global_step": 140868, "epoch": 1697} {"train_loss": -22.912038803100586, "global_step": 140869, "epoch": 1697} {"train_loss": -23.181089401245117, "global_step": 140870, "epoch": 1697} {"train_loss": -23.17560386657715, "global_step": 140871, "epoch": 1697} {"train_loss": -23.214187622070312, "global_step": 140872, "epoch": 1697} {"train_loss": -23.170621871948242, "global_step": 140873, "epoch": 1697} {"train_loss": -22.941429138183594, "global_step": 140874, "epoch": 1697} {"train_loss": -23.341703414916992, "global_step": 140875, "epoch": 1697} {"train_loss": -23.178144454956055, "global_step": 140876, "epoch": 1697} {"train_loss": -23.023300170898438, "global_step": 140877, "epoch": 1697} {"train_loss": -23.08957290649414, "global_step": 140878, "epoch": 1697} {"train_loss": -23.08018684387207, "global_step": 140879, "epoch": 1697} {"train_loss": -23.046232223510742, "global_step": 140880, "epoch": 1697} {"train_loss": -22.85489845275879, "global_step": 140881, "epoch": 1697} {"train_loss": -22.854244232177734, "global_step": 140882, "epoch": 1697} {"train_loss": -23.515125274658203, "global_step": 140883, "epoch": 1697} {"train_loss": -23.356687545776367, "global_step": 140884, "epoch": 1697} {"train_loss": -23.078359603881836, "global_step": 140885, "epoch": 1697} {"train_loss": -23.49806022644043, "global_step": 140886, "epoch": 1697} {"train_loss": -22.79233741760254, "global_step": 140887, "epoch": 1697} {"train_loss": -22.867816925048828, "global_step": 140888, "epoch": 1697} {"train_loss": -23.267253875732422, "global_step": 140889, "epoch": 1697} {"train_loss": -23.31983757019043, "global_step": 140890, "epoch": 1697} {"train_loss": -23.503122329711914, "global_step": 140891, "epoch": 1697} {"train_loss": -23.203758239746094, "global_step": 140892, "epoch": 1697} {"train_loss": -23.130704879760742, "global_step": 140893, "epoch": 1697} {"train_loss": -23.15736198425293, "global_step": 140894, "epoch": 1697} {"train_loss": -22.947641372680664, "global_step": 140895, "epoch": 1697} {"train_loss": -23.177133560180664, "global_step": 140896, "epoch": 1697} {"train_loss": -23.242162704467773, "global_step": 140897, "epoch": 1697} {"train_loss": -22.96208381652832, "global_step": 140898, "epoch": 1697} {"train_loss": -23.20057487487793, "global_step": 140899, "epoch": 1697} {"train_loss": -23.07277488708496, "global_step": 140900, "epoch": 1697} {"train_loss": -22.895109176635742, "global_step": 140901, "epoch": 1697} {"train_loss": -23.072851181030273, "global_step": 140902, "epoch": 1697} {"train_loss": -22.850345611572266, "global_step": 140903, "epoch": 1697} {"train_loss": -23.404621124267578, "global_step": 140904, "epoch": 1697} {"train_loss": -23.18924331665039, "global_step": 140905, "epoch": 1697} {"train_loss": -23.336050033569336, "global_step": 140906, "epoch": 1697} {"train_loss": -23.270395278930664, "global_step": 140907, "epoch": 1697} {"train_loss": -23.01032829284668, "global_step": 140908, "epoch": 1697} {"train_loss": -23.328227996826172, "global_step": 140909, "epoch": 1697} {"train_loss": -23.074609756469727, "global_step": 140910, "epoch": 1697} {"train_loss": -23.33925437927246, "global_step": 140911, "epoch": 1697} {"train_loss": -23.03777313232422, "global_step": 140912, "epoch": 1697} {"train_loss": -22.706186294555664, "global_step": 140913, "epoch": 1697} {"train_loss": -23.302663803100586, "global_step": 140914, "epoch": 1697} {"train_loss": -23.291446685791016, "global_step": 140915, "epoch": 1697} {"train_loss": -22.963623046875, "global_step": 140916, "epoch": 1697} {"train_loss": -22.917930603027344, "global_step": 140917, "epoch": 1697} {"train_loss": -23.14011001586914, "global_step": 140918, "epoch": 1697} {"train_loss": -23.183277130126953, "global_step": 140919, "epoch": 1697} {"train_loss": -22.91933250427246, "global_step": 140920, "epoch": 1697} {"train_loss": -23.159780502319336, "global_step": 140921, "epoch": 1697} {"train_loss": -23.0128173828125, "global_step": 140922, "epoch": 1697} {"train_loss": -23.08674430847168, "global_step": 140923, "epoch": 1697} {"train_loss": -22.949953079223633, "global_step": 140924, "epoch": 1697} {"train_loss": -23.548412322998047, "global_step": 140925, "epoch": 1697} {"train_loss": -23.23649787902832, "global_step": 140926, "epoch": 1697} {"train_loss": -23.33493995666504, "global_step": 140927, "epoch": 1697} {"train_loss": -22.985275268554688, "global_step": 140928, "epoch": 1697} {"train_loss": -22.79400634765625, "global_step": 140929, "epoch": 1697} {"train_loss": -23.09857177734375, "global_step": 140930, "epoch": 1697} {"train_loss": -23.72675895690918, "global_step": 140931, "epoch": 1697} {"train_loss": -22.606557846069336, "global_step": 140932, "epoch": 1697} {"train_loss": -23.072208795202783, "global_step": 140933, "epoch": 1697, "val_loss": 6264118.0} {"train_loss": -22.50815200805664, "global_step": 140934, "epoch": 1698} {"train_loss": -21.99838638305664, "global_step": 140935, "epoch": 1698} {"train_loss": -22.514617919921875, "global_step": 140936, "epoch": 1698} {"train_loss": -22.83002281188965, "global_step": 140937, "epoch": 1698} {"train_loss": -21.7152042388916, "global_step": 140938, "epoch": 1698} {"train_loss": -22.6117000579834, "global_step": 140939, "epoch": 1698} {"train_loss": -21.89712905883789, "global_step": 140940, "epoch": 1698} {"train_loss": -22.666324615478516, "global_step": 140941, "epoch": 1698} {"train_loss": -22.21946144104004, "global_step": 140942, "epoch": 1698} {"train_loss": -22.643674850463867, "global_step": 140943, "epoch": 1698} {"train_loss": -22.640146255493164, "global_step": 140944, "epoch": 1698} {"train_loss": -22.3372859954834, "global_step": 140945, "epoch": 1698} {"train_loss": -22.841760635375977, "global_step": 140946, "epoch": 1698} {"train_loss": -22.63759422302246, "global_step": 140947, "epoch": 1698} {"train_loss": -22.917800903320312, "global_step": 140948, "epoch": 1698} {"train_loss": -22.900089263916016, "global_step": 140949, "epoch": 1698} {"train_loss": -22.490407943725586, "global_step": 140950, "epoch": 1698} {"train_loss": -22.372220993041992, "global_step": 140951, "epoch": 1698} {"train_loss": -22.54572105407715, "global_step": 140952, "epoch": 1698} {"train_loss": -22.60767936706543, "global_step": 140953, "epoch": 1698} {"train_loss": -22.59311294555664, "global_step": 140954, "epoch": 1698} {"train_loss": -22.856088638305664, "global_step": 140955, "epoch": 1698} {"train_loss": -23.228239059448242, "global_step": 140956, "epoch": 1698} {"train_loss": -22.815690994262695, "global_step": 140957, "epoch": 1698} {"train_loss": -22.855356216430664, "global_step": 140958, "epoch": 1698} {"train_loss": -22.823904037475586, "global_step": 140959, "epoch": 1698} {"train_loss": -22.862287521362305, "global_step": 140960, "epoch": 1698} {"train_loss": -22.913633346557617, "global_step": 140961, "epoch": 1698} {"train_loss": -22.963518142700195, "global_step": 140962, "epoch": 1698} {"train_loss": -22.962919235229492, "global_step": 140963, "epoch": 1698} {"train_loss": -22.605579376220703, "global_step": 140964, "epoch": 1698} {"train_loss": -22.972206115722656, "global_step": 140965, "epoch": 1698} {"train_loss": -22.824186325073242, "global_step": 140966, "epoch": 1698} {"train_loss": -23.137834548950195, "global_step": 140967, "epoch": 1698} {"train_loss": -22.64379119873047, "global_step": 140968, "epoch": 1698} {"train_loss": -23.047277450561523, "global_step": 140969, "epoch": 1698} {"train_loss": -23.29703140258789, "global_step": 140970, "epoch": 1698} {"train_loss": -22.82965660095215, "global_step": 140971, "epoch": 1698} {"train_loss": -23.43340492248535, "global_step": 140972, "epoch": 1698} {"train_loss": -23.105833053588867, "global_step": 140973, "epoch": 1698} {"train_loss": -23.17876625061035, "global_step": 140974, "epoch": 1698} {"train_loss": -23.000051498413086, "global_step": 140975, "epoch": 1698} {"train_loss": -23.034770965576172, "global_step": 140976, "epoch": 1698} {"train_loss": -22.805118560791016, "global_step": 140977, "epoch": 1698} {"train_loss": -23.206937789916992, "global_step": 140978, "epoch": 1698} {"train_loss": -22.885669708251953, "global_step": 140979, "epoch": 1698} {"train_loss": -22.805784225463867, "global_step": 140980, "epoch": 1698} {"train_loss": -23.212194442749023, "global_step": 140981, "epoch": 1698} {"train_loss": -22.758649826049805, "global_step": 140982, "epoch": 1698} {"train_loss": -22.80695915222168, "global_step": 140983, "epoch": 1698} {"train_loss": -23.138078689575195, "global_step": 140984, "epoch": 1698} {"train_loss": -22.821760177612305, "global_step": 140985, "epoch": 1698} {"train_loss": -23.31012535095215, "global_step": 140986, "epoch": 1698} {"train_loss": -23.06564712524414, "global_step": 140987, "epoch": 1698} {"train_loss": -23.18946075439453, "global_step": 140988, "epoch": 1698} {"train_loss": -22.83027458190918, "global_step": 140989, "epoch": 1698} {"train_loss": -23.012353897094727, "global_step": 140990, "epoch": 1698} {"train_loss": -23.502994537353516, "global_step": 140991, "epoch": 1698} {"train_loss": -23.076902389526367, "global_step": 140992, "epoch": 1698} {"train_loss": -23.058134078979492, "global_step": 140993, "epoch": 1698} {"train_loss": -22.973459243774414, "global_step": 140994, "epoch": 1698} {"train_loss": -22.664413452148438, "global_step": 140995, "epoch": 1698} {"train_loss": -23.240598678588867, "global_step": 140996, "epoch": 1698} {"train_loss": -23.107694625854492, "global_step": 140997, "epoch": 1698} {"train_loss": -23.237607955932617, "global_step": 140998, "epoch": 1698} {"train_loss": -22.931026458740234, "global_step": 140999, "epoch": 1698} {"train_loss": -23.039947509765625, "global_step": 141000, "epoch": 1698} {"train_loss": -23.366744995117188, "global_step": 141001, "epoch": 1698} {"train_loss": -22.957738876342773, "global_step": 141002, "epoch": 1698} {"train_loss": -23.216529846191406, "global_step": 141003, "epoch": 1698} {"train_loss": -23.211483001708984, "global_step": 141004, "epoch": 1698} {"train_loss": -23.266172409057617, "global_step": 141005, "epoch": 1698} {"train_loss": -22.978805541992188, "global_step": 141006, "epoch": 1698} {"train_loss": -23.060932159423828, "global_step": 141007, "epoch": 1698} {"train_loss": -23.00641441345215, "global_step": 141008, "epoch": 1698} {"train_loss": -23.220701217651367, "global_step": 141009, "epoch": 1698} {"train_loss": -23.018827438354492, "global_step": 141010, "epoch": 1698} {"train_loss": -22.685138702392578, "global_step": 141011, "epoch": 1698} {"train_loss": -22.954269409179688, "global_step": 141012, "epoch": 1698} {"train_loss": -22.884435653686523, "global_step": 141013, "epoch": 1698} {"train_loss": -23.088411331176758, "global_step": 141014, "epoch": 1698} {"train_loss": -22.86605453491211, "global_step": 141015, "epoch": 1698} {"train_loss": -22.892619144485657, "global_step": 141016, "epoch": 1698, "val_loss": 6261711.5} {"train_loss": -22.344444274902344, "global_step": 141017, "epoch": 1699} {"train_loss": -22.514013290405273, "global_step": 141018, "epoch": 1699} {"train_loss": -22.434812545776367, "global_step": 141019, "epoch": 1699} {"train_loss": -22.446491241455078, "global_step": 141020, "epoch": 1699} {"train_loss": -22.805519104003906, "global_step": 141021, "epoch": 1699} {"train_loss": -22.615488052368164, "global_step": 141022, "epoch": 1699} {"train_loss": -22.863285064697266, "global_step": 141023, "epoch": 1699} {"train_loss": -22.787891387939453, "global_step": 141024, "epoch": 1699} {"train_loss": -22.829837799072266, "global_step": 141025, "epoch": 1699} {"train_loss": -22.719409942626953, "global_step": 141026, "epoch": 1699} {"train_loss": -22.612308502197266, "global_step": 141027, "epoch": 1699} {"train_loss": -22.574472427368164, "global_step": 141028, "epoch": 1699} {"train_loss": -22.674396514892578, "global_step": 141029, "epoch": 1699} {"train_loss": -22.475570678710938, "global_step": 141030, "epoch": 1699} {"train_loss": -22.888778686523438, "global_step": 141031, "epoch": 1699} {"train_loss": -22.73091697692871, "global_step": 141032, "epoch": 1699} {"train_loss": -22.73927116394043, "global_step": 141033, "epoch": 1699} {"train_loss": -22.799108505249023, "global_step": 141034, "epoch": 1699} {"train_loss": -22.931819915771484, "global_step": 141035, "epoch": 1699} {"train_loss": -22.819137573242188, "global_step": 141036, "epoch": 1699} {"train_loss": -23.18539810180664, "global_step": 141037, "epoch": 1699} {"train_loss": -22.73744773864746, "global_step": 141038, "epoch": 1699} {"train_loss": -23.24178123474121, "global_step": 141039, "epoch": 1699} {"train_loss": -23.426908493041992, "global_step": 141040, "epoch": 1699} {"train_loss": -23.12215232849121, "global_step": 141041, "epoch": 1699} {"train_loss": -22.905838012695312, "global_step": 141042, "epoch": 1699} {"train_loss": -22.868955612182617, "global_step": 141043, "epoch": 1699} {"train_loss": -23.095325469970703, "global_step": 141044, "epoch": 1699} {"train_loss": -23.365066528320312, "global_step": 141045, "epoch": 1699} {"train_loss": -23.27191162109375, "global_step": 141046, "epoch": 1699} {"train_loss": -23.2286319732666, "global_step": 141047, "epoch": 1699} {"train_loss": -22.779783248901367, "global_step": 141048, "epoch": 1699} {"train_loss": -22.901565551757812, "global_step": 141049, "epoch": 1699} {"train_loss": -23.161787033081055, "global_step": 141050, "epoch": 1699} {"train_loss": -23.1195125579834, "global_step": 141051, "epoch": 1699} {"train_loss": -23.305593490600586, "global_step": 141052, "epoch": 1699} {"train_loss": -23.4153995513916, "global_step": 141053, "epoch": 1699} {"train_loss": -23.55537986755371, "global_step": 141054, "epoch": 1699} {"train_loss": -23.277490615844727, "global_step": 141055, "epoch": 1699} {"train_loss": -23.59623146057129, "global_step": 141056, "epoch": 1699} {"train_loss": -23.33751678466797, "global_step": 141057, "epoch": 1699} {"train_loss": -23.020376205444336, "global_step": 141058, "epoch": 1699} {"train_loss": -22.978422164916992, "global_step": 141059, "epoch": 1699} {"train_loss": -23.40445899963379, "global_step": 141060, "epoch": 1699} {"train_loss": -22.858810424804688, "global_step": 141061, "epoch": 1699} {"train_loss": -22.80707550048828, "global_step": 141062, "epoch": 1699} {"train_loss": -23.116506576538086, "global_step": 141063, "epoch": 1699} {"train_loss": -22.97163200378418, "global_step": 141064, "epoch": 1699} {"train_loss": -22.984010696411133, "global_step": 141065, "epoch": 1699} {"train_loss": -22.693998336791992, "global_step": 141066, "epoch": 1699} {"train_loss": -23.15899658203125, "global_step": 141067, "epoch": 1699} {"train_loss": -23.27225685119629, "global_step": 141068, "epoch": 1699} {"train_loss": -22.998517990112305, "global_step": 141069, "epoch": 1699} {"train_loss": -23.137802124023438, "global_step": 141070, "epoch": 1699} {"train_loss": -22.8179874420166, "global_step": 141071, "epoch": 1699} {"train_loss": -22.915555953979492, "global_step": 141072, "epoch": 1699} {"train_loss": -22.85520362854004, "global_step": 141073, "epoch": 1699} {"train_loss": -23.03400230407715, "global_step": 141074, "epoch": 1699} {"train_loss": -22.88872718811035, "global_step": 141075, "epoch": 1699} {"train_loss": -23.045291900634766, "global_step": 141076, "epoch": 1699} {"train_loss": -23.058216094970703, "global_step": 141077, "epoch": 1699} {"train_loss": -23.10408592224121, "global_step": 141078, "epoch": 1699} {"train_loss": -23.143659591674805, "global_step": 141079, "epoch": 1699} {"train_loss": -23.299015045166016, "global_step": 141080, "epoch": 1699} {"train_loss": -22.833759307861328, "global_step": 141081, "epoch": 1699} {"train_loss": -23.268844604492188, "global_step": 141082, "epoch": 1699} {"train_loss": -23.067169189453125, "global_step": 141083, "epoch": 1699} {"train_loss": -23.026142120361328, "global_step": 141084, "epoch": 1699} {"train_loss": -22.775503158569336, "global_step": 141085, "epoch": 1699} {"train_loss": -22.884687423706055, "global_step": 141086, "epoch": 1699} {"train_loss": -23.113361358642578, "global_step": 141087, "epoch": 1699} {"train_loss": -23.074665069580078, "global_step": 141088, "epoch": 1699} {"train_loss": -22.959131240844727, "global_step": 141089, "epoch": 1699} {"train_loss": -23.051666259765625, "global_step": 141090, "epoch": 1699} {"train_loss": -23.221426010131836, "global_step": 141091, "epoch": 1699} {"train_loss": -23.356056213378906, "global_step": 141092, "epoch": 1699} {"train_loss": -23.466428756713867, "global_step": 141093, "epoch": 1699} {"train_loss": -23.188955307006836, "global_step": 141094, "epoch": 1699} {"train_loss": -23.256351470947266, "global_step": 141095, "epoch": 1699} {"train_loss": -23.149917602539062, "global_step": 141096, "epoch": 1699} {"train_loss": -23.368749618530273, "global_step": 141097, "epoch": 1699} {"train_loss": -23.13571548461914, "global_step": 141098, "epoch": 1699} {"train_loss": -22.96588644923934, "global_step": 141099, "epoch": 1699, "val_loss": 6268781.0} {"train_loss": -22.42429542541504, "global_step": 141100, "epoch": 1700} {"train_loss": -22.061880111694336, "global_step": 141101, "epoch": 1700} {"train_loss": -22.870243072509766, "global_step": 141102, "epoch": 1700} {"train_loss": -22.627485275268555, "global_step": 141103, "epoch": 1700} {"train_loss": -22.644155502319336, "global_step": 141104, "epoch": 1700} {"train_loss": -22.950286865234375, "global_step": 141105, "epoch": 1700} {"train_loss": -22.897424697875977, "global_step": 141106, "epoch": 1700} {"train_loss": -22.798961639404297, "global_step": 141107, "epoch": 1700} {"train_loss": -22.392507553100586, "global_step": 141108, "epoch": 1700} {"train_loss": -23.040878295898438, "global_step": 141109, "epoch": 1700} {"train_loss": -22.756235122680664, "global_step": 141110, "epoch": 1700} {"train_loss": -22.840234756469727, "global_step": 141111, "epoch": 1700} {"train_loss": -22.90423011779785, "global_step": 141112, "epoch": 1700} {"train_loss": -23.236427307128906, "global_step": 141113, "epoch": 1700} {"train_loss": -22.805694580078125, "global_step": 141114, "epoch": 1700} {"train_loss": -23.207443237304688, "global_step": 141115, "epoch": 1700} {"train_loss": -23.230680465698242, "global_step": 141116, "epoch": 1700} {"train_loss": -23.031265258789062, "global_step": 141117, "epoch": 1700} {"train_loss": -23.257099151611328, "global_step": 141118, "epoch": 1700} {"train_loss": -23.145896911621094, "global_step": 141119, "epoch": 1700} {"train_loss": -23.19137954711914, "global_step": 141120, "epoch": 1700} {"train_loss": -22.963563919067383, "global_step": 141121, "epoch": 1700} {"train_loss": -23.075910568237305, "global_step": 141122, "epoch": 1700} {"train_loss": -23.034360885620117, "global_step": 141123, "epoch": 1700} {"train_loss": -23.0128173828125, "global_step": 141124, "epoch": 1700} {"train_loss": -22.896116256713867, "global_step": 141125, "epoch": 1700} {"train_loss": -23.14617347717285, "global_step": 141126, "epoch": 1700} {"train_loss": -23.231708526611328, "global_step": 141127, "epoch": 1700} {"train_loss": -23.031238555908203, "global_step": 141128, "epoch": 1700} {"train_loss": -23.378774642944336, "global_step": 141129, "epoch": 1700} {"train_loss": -23.02570915222168, "global_step": 141130, "epoch": 1700} {"train_loss": -22.64725112915039, "global_step": 141131, "epoch": 1700} {"train_loss": -23.086044311523438, "global_step": 141132, "epoch": 1700} {"train_loss": -23.344633102416992, "global_step": 141133, "epoch": 1700} {"train_loss": -22.79314613342285, "global_step": 141134, "epoch": 1700} {"train_loss": -23.04682731628418, "global_step": 141135, "epoch": 1700} {"train_loss": -22.755277633666992, "global_step": 141136, "epoch": 1700} {"train_loss": -22.98334503173828, "global_step": 141137, "epoch": 1700} {"train_loss": -23.167892456054688, "global_step": 141138, "epoch": 1700} {"train_loss": -23.037689208984375, "global_step": 141139, "epoch": 1700} {"train_loss": -23.0986385345459, "global_step": 141140, "epoch": 1700} {"train_loss": -22.950597763061523, "global_step": 141141, "epoch": 1700} {"train_loss": -22.875396728515625, "global_step": 141142, "epoch": 1700} {"train_loss": -23.205554962158203, "global_step": 141143, "epoch": 1700} {"train_loss": -23.110980987548828, "global_step": 141144, "epoch": 1700} {"train_loss": -22.942733764648438, "global_step": 141145, "epoch": 1700} {"train_loss": -22.935823440551758, "global_step": 141146, "epoch": 1700} {"train_loss": -23.24123191833496, "global_step": 141147, "epoch": 1700} {"train_loss": -22.909116744995117, "global_step": 141148, "epoch": 1700} {"train_loss": -22.489774703979492, "global_step": 141149, "epoch": 1700} {"train_loss": -23.055925369262695, "global_step": 141150, "epoch": 1700} {"train_loss": -22.52276039123535, "global_step": 141151, "epoch": 1700} {"train_loss": -22.938512802124023, "global_step": 141152, "epoch": 1700} {"train_loss": -23.07867431640625, "global_step": 141153, "epoch": 1700} {"train_loss": -22.47557258605957, "global_step": 141154, "epoch": 1700} {"train_loss": -23.14664077758789, "global_step": 141155, "epoch": 1700} {"train_loss": -22.59823989868164, "global_step": 141156, "epoch": 1700} {"train_loss": -22.896154403686523, "global_step": 141157, "epoch": 1700} {"train_loss": -22.93692970275879, "global_step": 141158, "epoch": 1700} {"train_loss": -23.24775505065918, "global_step": 141159, "epoch": 1700} {"train_loss": -22.714046478271484, "global_step": 141160, "epoch": 1700} {"train_loss": -23.085102081298828, "global_step": 141161, "epoch": 1700} {"train_loss": -23.000701904296875, "global_step": 141162, "epoch": 1700} {"train_loss": -23.446252822875977, "global_step": 141163, "epoch": 1700} {"train_loss": -22.567989349365234, "global_step": 141164, "epoch": 1700} {"train_loss": -23.319189071655273, "global_step": 141165, "epoch": 1700} {"train_loss": -22.992700576782227, "global_step": 141166, "epoch": 1700} {"train_loss": -23.207782745361328, "global_step": 141167, "epoch": 1700} {"train_loss": -22.914838790893555, "global_step": 141168, "epoch": 1700} {"train_loss": -23.189626693725586, "global_step": 141169, "epoch": 1700} {"train_loss": -23.516870498657227, "global_step": 141170, "epoch": 1700} {"train_loss": -23.243011474609375, "global_step": 141171, "epoch": 1700} {"train_loss": -23.28443717956543, "global_step": 141172, "epoch": 1700} {"train_loss": -22.891742706298828, "global_step": 141173, "epoch": 1700} {"train_loss": -22.888303756713867, "global_step": 141174, "epoch": 1700} {"train_loss": -23.4274959564209, "global_step": 141175, "epoch": 1700} {"train_loss": -23.211536407470703, "global_step": 141176, "epoch": 1700} {"train_loss": -23.126279830932617, "global_step": 141177, "epoch": 1700} {"train_loss": -23.607820510864258, "global_step": 141178, "epoch": 1700} {"train_loss": -23.0916805267334, "global_step": 141179, "epoch": 1700} {"train_loss": -22.608945846557617, "global_step": 141180, "epoch": 1700} {"train_loss": -22.82269859313965, "global_step": 141181, "epoch": 1700} {"train_loss": -23.002404132521296, "global_step": 141182, "epoch": 1700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6253252.5} {"train_loss": -22.881072998046875, "global_step": 141183, "epoch": 1701} {"train_loss": -22.61883544921875, "global_step": 141184, "epoch": 1701} {"train_loss": -22.502267837524414, "global_step": 141185, "epoch": 1701} {"train_loss": -22.952489852905273, "global_step": 141186, "epoch": 1701} {"train_loss": -22.7391414642334, "global_step": 141187, "epoch": 1701} {"train_loss": -22.270559310913086, "global_step": 141188, "epoch": 1701} {"train_loss": -22.434795379638672, "global_step": 141189, "epoch": 1701} {"train_loss": -23.040494918823242, "global_step": 141190, "epoch": 1701} {"train_loss": -22.482240676879883, "global_step": 141191, "epoch": 1701} {"train_loss": -22.91225242614746, "global_step": 141192, "epoch": 1701} {"train_loss": -22.974727630615234, "global_step": 141193, "epoch": 1701} {"train_loss": -22.881391525268555, "global_step": 141194, "epoch": 1701} {"train_loss": -22.982519149780273, "global_step": 141195, "epoch": 1701} {"train_loss": -22.83328628540039, "global_step": 141196, "epoch": 1701} {"train_loss": -22.766420364379883, "global_step": 141197, "epoch": 1701} {"train_loss": -22.67848014831543, "global_step": 141198, "epoch": 1701} {"train_loss": -23.115880966186523, "global_step": 141199, "epoch": 1701} {"train_loss": -23.08321762084961, "global_step": 141200, "epoch": 1701} {"train_loss": -22.935348510742188, "global_step": 141201, "epoch": 1701} {"train_loss": -22.948850631713867, "global_step": 141202, "epoch": 1701} {"train_loss": -23.064302444458008, "global_step": 141203, "epoch": 1701} {"train_loss": -23.024459838867188, "global_step": 141204, "epoch": 1701} {"train_loss": -23.030733108520508, "global_step": 141205, "epoch": 1701} {"train_loss": -23.40675926208496, "global_step": 141206, "epoch": 1701} {"train_loss": -23.020536422729492, "global_step": 141207, "epoch": 1701} {"train_loss": -22.727745056152344, "global_step": 141208, "epoch": 1701} {"train_loss": -23.320558547973633, "global_step": 141209, "epoch": 1701} {"train_loss": -22.77583122253418, "global_step": 141210, "epoch": 1701} {"train_loss": -23.16055679321289, "global_step": 141211, "epoch": 1701} {"train_loss": -23.006895065307617, "global_step": 141212, "epoch": 1701} {"train_loss": -23.17062759399414, "global_step": 141213, "epoch": 1701} {"train_loss": -23.163692474365234, "global_step": 141214, "epoch": 1701} {"train_loss": -23.123258590698242, "global_step": 141215, "epoch": 1701} {"train_loss": -22.778409957885742, "global_step": 141216, "epoch": 1701} {"train_loss": -23.053802490234375, "global_step": 141217, "epoch": 1701} {"train_loss": -22.92762565612793, "global_step": 141218, "epoch": 1701} {"train_loss": -22.988636016845703, "global_step": 141219, "epoch": 1701} {"train_loss": -22.80912971496582, "global_step": 141220, "epoch": 1701} {"train_loss": -23.048673629760742, "global_step": 141221, "epoch": 1701} {"train_loss": -22.907268524169922, "global_step": 141222, "epoch": 1701} {"train_loss": -23.229406356811523, "global_step": 141223, "epoch": 1701} {"train_loss": -23.028949737548828, "global_step": 141224, "epoch": 1701} {"train_loss": -23.62434959411621, "global_step": 141225, "epoch": 1701} {"train_loss": -23.263626098632812, "global_step": 141226, "epoch": 1701} {"train_loss": -23.425457000732422, "global_step": 141227, "epoch": 1701} {"train_loss": -23.271392822265625, "global_step": 141228, "epoch": 1701} {"train_loss": -23.183176040649414, "global_step": 141229, "epoch": 1701} {"train_loss": -22.906770706176758, "global_step": 141230, "epoch": 1701} {"train_loss": -22.872262954711914, "global_step": 141231, "epoch": 1701} {"train_loss": -22.91637420654297, "global_step": 141232, "epoch": 1701} {"train_loss": -23.02867317199707, "global_step": 141233, "epoch": 1701} {"train_loss": -23.464269638061523, "global_step": 141234, "epoch": 1701} {"train_loss": -22.450536727905273, "global_step": 141235, "epoch": 1701} {"train_loss": -23.178693771362305, "global_step": 141236, "epoch": 1701} {"train_loss": -23.023120880126953, "global_step": 141237, "epoch": 1701} {"train_loss": -23.438886642456055, "global_step": 141238, "epoch": 1701} {"train_loss": -22.7150936126709, "global_step": 141239, "epoch": 1701} {"train_loss": -23.334257125854492, "global_step": 141240, "epoch": 1701} {"train_loss": -22.709497451782227, "global_step": 141241, "epoch": 1701} {"train_loss": -23.14975357055664, "global_step": 141242, "epoch": 1701} {"train_loss": -23.24460792541504, "global_step": 141243, "epoch": 1701} {"train_loss": -23.322050094604492, "global_step": 141244, "epoch": 1701} {"train_loss": -22.966068267822266, "global_step": 141245, "epoch": 1701} {"train_loss": -23.279020309448242, "global_step": 141246, "epoch": 1701} {"train_loss": -22.894989013671875, "global_step": 141247, "epoch": 1701} {"train_loss": -22.71709442138672, "global_step": 141248, "epoch": 1701} {"train_loss": -23.065692901611328, "global_step": 141249, "epoch": 1701} {"train_loss": -23.058223724365234, "global_step": 141250, "epoch": 1701} {"train_loss": -23.13580894470215, "global_step": 141251, "epoch": 1701} {"train_loss": -23.011571884155273, "global_step": 141252, "epoch": 1701} {"train_loss": -22.76058006286621, "global_step": 141253, "epoch": 1701} {"train_loss": -23.193801879882812, "global_step": 141254, "epoch": 1701} {"train_loss": -22.958736419677734, "global_step": 141255, "epoch": 1701} {"train_loss": -23.080867767333984, "global_step": 141256, "epoch": 1701} {"train_loss": -23.444311141967773, "global_step": 141257, "epoch": 1701} {"train_loss": -23.149951934814453, "global_step": 141258, "epoch": 1701} {"train_loss": -23.03558921813965, "global_step": 141259, "epoch": 1701} {"train_loss": -23.3110408782959, "global_step": 141260, "epoch": 1701} {"train_loss": -23.071044921875, "global_step": 141261, "epoch": 1701} {"train_loss": -23.191486358642578, "global_step": 141262, "epoch": 1701} {"train_loss": -23.361217498779297, "global_step": 141263, "epoch": 1701} {"train_loss": -22.97748374938965, "global_step": 141264, "epoch": 1701} {"train_loss": -23.002729025231787, "global_step": 141265, "epoch": 1701, "val_loss": 6294697.0} {"train_loss": -22.44202995300293, "global_step": 141266, "epoch": 1702} {"train_loss": -22.205713272094727, "global_step": 141267, "epoch": 1702} {"train_loss": -22.90021324157715, "global_step": 141268, "epoch": 1702} {"train_loss": -22.583383560180664, "global_step": 141269, "epoch": 1702} {"train_loss": -22.63612937927246, "global_step": 141270, "epoch": 1702} {"train_loss": -22.47519302368164, "global_step": 141271, "epoch": 1702} {"train_loss": -23.19136619567871, "global_step": 141272, "epoch": 1702} {"train_loss": -22.491682052612305, "global_step": 141273, "epoch": 1702} {"train_loss": -23.170007705688477, "global_step": 141274, "epoch": 1702} {"train_loss": -22.774240493774414, "global_step": 141275, "epoch": 1702} {"train_loss": -22.956850051879883, "global_step": 141276, "epoch": 1702} {"train_loss": -22.458642959594727, "global_step": 141277, "epoch": 1702} {"train_loss": -22.76178550720215, "global_step": 141278, "epoch": 1702} {"train_loss": -23.1720027923584, "global_step": 141279, "epoch": 1702} {"train_loss": -22.94792938232422, "global_step": 141280, "epoch": 1702} {"train_loss": -23.228107452392578, "global_step": 141281, "epoch": 1702} {"train_loss": -22.819509506225586, "global_step": 141282, "epoch": 1702} {"train_loss": -22.783334732055664, "global_step": 141283, "epoch": 1702} {"train_loss": -22.71717643737793, "global_step": 141284, "epoch": 1702} {"train_loss": -23.214902877807617, "global_step": 141285, "epoch": 1702} {"train_loss": -23.15576171875, "global_step": 141286, "epoch": 1702} {"train_loss": -22.891233444213867, "global_step": 141287, "epoch": 1702} {"train_loss": -23.064807891845703, "global_step": 141288, "epoch": 1702} {"train_loss": -22.984905242919922, "global_step": 141289, "epoch": 1702} {"train_loss": -23.028732299804688, "global_step": 141290, "epoch": 1702} {"train_loss": -22.959665298461914, "global_step": 141291, "epoch": 1702} {"train_loss": -22.868785858154297, "global_step": 141292, "epoch": 1702} {"train_loss": -23.038116455078125, "global_step": 141293, "epoch": 1702} {"train_loss": -22.706100463867188, "global_step": 141294, "epoch": 1702} {"train_loss": -22.822912216186523, "global_step": 141295, "epoch": 1702} {"train_loss": -23.30868911743164, "global_step": 141296, "epoch": 1702} {"train_loss": -22.804157257080078, "global_step": 141297, "epoch": 1702} {"train_loss": -23.118398666381836, "global_step": 141298, "epoch": 1702} {"train_loss": -23.110076904296875, "global_step": 141299, "epoch": 1702} {"train_loss": -23.038358688354492, "global_step": 141300, "epoch": 1702} {"train_loss": -22.954511642456055, "global_step": 141301, "epoch": 1702} {"train_loss": -22.6060848236084, "global_step": 141302, "epoch": 1702} {"train_loss": -23.0706844329834, "global_step": 141303, "epoch": 1702} {"train_loss": -23.31817626953125, "global_step": 141304, "epoch": 1702} {"train_loss": -23.1025333404541, "global_step": 141305, "epoch": 1702} {"train_loss": -22.826797485351562, "global_step": 141306, "epoch": 1702} {"train_loss": -23.2255916595459, "global_step": 141307, "epoch": 1702} {"train_loss": -23.3363094329834, "global_step": 141308, "epoch": 1702} {"train_loss": -23.247312545776367, "global_step": 141309, "epoch": 1702} {"train_loss": -23.262065887451172, "global_step": 141310, "epoch": 1702} {"train_loss": -23.11827278137207, "global_step": 141311, "epoch": 1702} {"train_loss": -23.252422332763672, "global_step": 141312, "epoch": 1702} {"train_loss": -23.13094139099121, "global_step": 141313, "epoch": 1702} {"train_loss": -23.116226196289062, "global_step": 141314, "epoch": 1702} {"train_loss": -23.425079345703125, "global_step": 141315, "epoch": 1702} {"train_loss": -22.738439559936523, "global_step": 141316, "epoch": 1702} {"train_loss": -22.906768798828125, "global_step": 141317, "epoch": 1702} {"train_loss": -23.316375732421875, "global_step": 141318, "epoch": 1702} {"train_loss": -23.143949508666992, "global_step": 141319, "epoch": 1702} {"train_loss": -23.06859588623047, "global_step": 141320, "epoch": 1702} {"train_loss": -23.05744743347168, "global_step": 141321, "epoch": 1702} {"train_loss": -23.068708419799805, "global_step": 141322, "epoch": 1702} {"train_loss": -22.79593276977539, "global_step": 141323, "epoch": 1702} {"train_loss": -23.26975440979004, "global_step": 141324, "epoch": 1702} {"train_loss": -23.148624420166016, "global_step": 141325, "epoch": 1702} {"train_loss": -22.952497482299805, "global_step": 141326, "epoch": 1702} {"train_loss": -23.12333106994629, "global_step": 141327, "epoch": 1702} {"train_loss": -23.1580810546875, "global_step": 141328, "epoch": 1702} {"train_loss": -22.939767837524414, "global_step": 141329, "epoch": 1702} {"train_loss": -23.49067497253418, "global_step": 141330, "epoch": 1702} {"train_loss": -23.103090286254883, "global_step": 141331, "epoch": 1702} {"train_loss": -23.323062896728516, "global_step": 141332, "epoch": 1702} {"train_loss": -23.257841110229492, "global_step": 141333, "epoch": 1702} {"train_loss": -23.54591941833496, "global_step": 141334, "epoch": 1702} {"train_loss": -23.400009155273438, "global_step": 141335, "epoch": 1702} {"train_loss": -22.900991439819336, "global_step": 141336, "epoch": 1702} {"train_loss": -23.13889503479004, "global_step": 141337, "epoch": 1702} {"train_loss": -23.182117462158203, "global_step": 141338, "epoch": 1702} {"train_loss": -23.4962215423584, "global_step": 141339, "epoch": 1702} {"train_loss": -23.51580810546875, "global_step": 141340, "epoch": 1702} {"train_loss": -23.12482261657715, "global_step": 141341, "epoch": 1702} {"train_loss": -23.128381729125977, "global_step": 141342, "epoch": 1702} {"train_loss": -23.105260848999023, "global_step": 141343, "epoch": 1702} {"train_loss": -22.873571395874023, "global_step": 141344, "epoch": 1702} {"train_loss": -22.96430206298828, "global_step": 141345, "epoch": 1702} {"train_loss": -23.02303695678711, "global_step": 141346, "epoch": 1702} {"train_loss": -23.20956039428711, "global_step": 141347, "epoch": 1702} {"train_loss": -23.01747427790998, "global_step": 141348, "epoch": 1702, "val_loss": 6304225.5} {"train_loss": -19.325246810913086, "global_step": 141349, "epoch": 1703} {"train_loss": -20.89412498474121, "global_step": 141350, "epoch": 1703} {"train_loss": -20.633991241455078, "global_step": 141351, "epoch": 1703} {"train_loss": -20.8793888092041, "global_step": 141352, "epoch": 1703} {"train_loss": -21.048688888549805, "global_step": 141353, "epoch": 1703} {"train_loss": -20.91837501525879, "global_step": 141354, "epoch": 1703} {"train_loss": -21.298505783081055, "global_step": 141355, "epoch": 1703} {"train_loss": -21.560148239135742, "global_step": 141356, "epoch": 1703} {"train_loss": -21.582401275634766, "global_step": 141357, "epoch": 1703} {"train_loss": -21.781545639038086, "global_step": 141358, "epoch": 1703} {"train_loss": -21.686750411987305, "global_step": 141359, "epoch": 1703} {"train_loss": -21.22824478149414, "global_step": 141360, "epoch": 1703} {"train_loss": -21.74686050415039, "global_step": 141361, "epoch": 1703} {"train_loss": -21.71822166442871, "global_step": 141362, "epoch": 1703} {"train_loss": -21.93123435974121, "global_step": 141363, "epoch": 1703} {"train_loss": -21.84718132019043, "global_step": 141364, "epoch": 1703} {"train_loss": -22.11594009399414, "global_step": 141365, "epoch": 1703} {"train_loss": -21.64699935913086, "global_step": 141366, "epoch": 1703} {"train_loss": -21.761280059814453, "global_step": 141367, "epoch": 1703} {"train_loss": -21.912811279296875, "global_step": 141368, "epoch": 1703} {"train_loss": -22.088911056518555, "global_step": 141369, "epoch": 1703} {"train_loss": -22.090648651123047, "global_step": 141370, "epoch": 1703} {"train_loss": -22.253103256225586, "global_step": 141371, "epoch": 1703} {"train_loss": -22.502145767211914, "global_step": 141372, "epoch": 1703} {"train_loss": -22.456327438354492, "global_step": 141373, "epoch": 1703} {"train_loss": -22.140104293823242, "global_step": 141374, "epoch": 1703} {"train_loss": -22.083698272705078, "global_step": 141375, "epoch": 1703} {"train_loss": -22.465116500854492, "global_step": 141376, "epoch": 1703} {"train_loss": -22.52766227722168, "global_step": 141377, "epoch": 1703} {"train_loss": -22.367815017700195, "global_step": 141378, "epoch": 1703} {"train_loss": -22.35940933227539, "global_step": 141379, "epoch": 1703} {"train_loss": -22.613035202026367, "global_step": 141380, "epoch": 1703} {"train_loss": -22.565608978271484, "global_step": 141381, "epoch": 1703} {"train_loss": -22.310779571533203, "global_step": 141382, "epoch": 1703} {"train_loss": -23.3400936126709, "global_step": 141383, "epoch": 1703} {"train_loss": -22.30446434020996, "global_step": 141384, "epoch": 1703} {"train_loss": -22.847219467163086, "global_step": 141385, "epoch": 1703} {"train_loss": -22.495702743530273, "global_step": 141386, "epoch": 1703} {"train_loss": -22.646039962768555, "global_step": 141387, "epoch": 1703} {"train_loss": -22.933332443237305, "global_step": 141388, "epoch": 1703} {"train_loss": -22.646942138671875, "global_step": 141389, "epoch": 1703} {"train_loss": -22.850378036499023, "global_step": 141390, "epoch": 1703} {"train_loss": -22.721689224243164, "global_step": 141391, "epoch": 1703} {"train_loss": -23.073698043823242, "global_step": 141392, "epoch": 1703} {"train_loss": -22.756187438964844, "global_step": 141393, "epoch": 1703} {"train_loss": -23.165075302124023, "global_step": 141394, "epoch": 1703} {"train_loss": -23.10063362121582, "global_step": 141395, "epoch": 1703} {"train_loss": -23.052461624145508, "global_step": 141396, "epoch": 1703} {"train_loss": -23.081968307495117, "global_step": 141397, "epoch": 1703} {"train_loss": -22.67719078063965, "global_step": 141398, "epoch": 1703} {"train_loss": -22.829938888549805, "global_step": 141399, "epoch": 1703} {"train_loss": -22.93634605407715, "global_step": 141400, "epoch": 1703} {"train_loss": -23.35977554321289, "global_step": 141401, "epoch": 1703} {"train_loss": -23.108062744140625, "global_step": 141402, "epoch": 1703} {"train_loss": -23.027923583984375, "global_step": 141403, "epoch": 1703} {"train_loss": -23.06103515625, "global_step": 141404, "epoch": 1703} {"train_loss": -23.1501522064209, "global_step": 141405, "epoch": 1703} {"train_loss": -23.16788101196289, "global_step": 141406, "epoch": 1703} {"train_loss": -23.235820770263672, "global_step": 141407, "epoch": 1703} {"train_loss": -22.97283172607422, "global_step": 141408, "epoch": 1703} {"train_loss": -23.09803009033203, "global_step": 141409, "epoch": 1703} {"train_loss": -23.12618064880371, "global_step": 141410, "epoch": 1703} {"train_loss": -23.0343074798584, "global_step": 141411, "epoch": 1703} {"train_loss": -22.88745880126953, "global_step": 141412, "epoch": 1703} {"train_loss": -22.877017974853516, "global_step": 141413, "epoch": 1703} {"train_loss": -23.259347915649414, "global_step": 141414, "epoch": 1703} {"train_loss": -22.83707618713379, "global_step": 141415, "epoch": 1703} {"train_loss": -23.106042861938477, "global_step": 141416, "epoch": 1703} {"train_loss": -23.46013832092285, "global_step": 141417, "epoch": 1703} {"train_loss": -23.022829055786133, "global_step": 141418, "epoch": 1703} {"train_loss": -23.43292808532715, "global_step": 141419, "epoch": 1703} {"train_loss": -22.85037612915039, "global_step": 141420, "epoch": 1703} {"train_loss": -23.3367977142334, "global_step": 141421, "epoch": 1703} {"train_loss": -23.1727237701416, "global_step": 141422, "epoch": 1703} {"train_loss": -23.3490047454834, "global_step": 141423, "epoch": 1703} {"train_loss": -23.155471801757812, "global_step": 141424, "epoch": 1703} {"train_loss": -23.09934425354004, "global_step": 141425, "epoch": 1703} {"train_loss": -23.4218807220459, "global_step": 141426, "epoch": 1703} {"train_loss": -23.25719451904297, "global_step": 141427, "epoch": 1703} {"train_loss": -23.088415145874023, "global_step": 141428, "epoch": 1703} {"train_loss": -23.121856689453125, "global_step": 141429, "epoch": 1703} {"train_loss": -23.040058135986328, "global_step": 141430, "epoch": 1703} {"train_loss": -22.5040695695992, "global_step": 141431, "epoch": 1703, "val_loss": 6345791.0} {"train_loss": -22.847463607788086, "global_step": 141432, "epoch": 1704} {"train_loss": -22.52680015563965, "global_step": 141433, "epoch": 1704} {"train_loss": -22.803668975830078, "global_step": 141434, "epoch": 1704} {"train_loss": -22.95916175842285, "global_step": 141435, "epoch": 1704} {"train_loss": -23.01395034790039, "global_step": 141436, "epoch": 1704} {"train_loss": -23.190061569213867, "global_step": 141437, "epoch": 1704} {"train_loss": -22.744115829467773, "global_step": 141438, "epoch": 1704} {"train_loss": -22.907028198242188, "global_step": 141439, "epoch": 1704} {"train_loss": -23.069272994995117, "global_step": 141440, "epoch": 1704} {"train_loss": -22.789480209350586, "global_step": 141441, "epoch": 1704} {"train_loss": -23.169692993164062, "global_step": 141442, "epoch": 1704} {"train_loss": -23.103271484375, "global_step": 141443, "epoch": 1704} {"train_loss": -23.37079429626465, "global_step": 141444, "epoch": 1704} {"train_loss": -22.98992156982422, "global_step": 141445, "epoch": 1704} {"train_loss": -23.372806549072266, "global_step": 141446, "epoch": 1704} {"train_loss": -22.93393898010254, "global_step": 141447, "epoch": 1704} {"train_loss": -23.37973976135254, "global_step": 141448, "epoch": 1704} {"train_loss": -22.9965877532959, "global_step": 141449, "epoch": 1704} {"train_loss": -22.439640045166016, "global_step": 141450, "epoch": 1704} {"train_loss": -23.013248443603516, "global_step": 141451, "epoch": 1704} {"train_loss": -23.07902717590332, "global_step": 141452, "epoch": 1704} {"train_loss": -23.569997787475586, "global_step": 141453, "epoch": 1704} {"train_loss": -22.702768325805664, "global_step": 141454, "epoch": 1704} {"train_loss": -22.972131729125977, "global_step": 141455, "epoch": 1704} {"train_loss": -22.71323013305664, "global_step": 141456, "epoch": 1704} {"train_loss": -23.06866455078125, "global_step": 141457, "epoch": 1704} {"train_loss": -22.43629264831543, "global_step": 141458, "epoch": 1704} {"train_loss": -22.567626953125, "global_step": 141459, "epoch": 1704} {"train_loss": -23.06349754333496, "global_step": 141460, "epoch": 1704} {"train_loss": -23.408735275268555, "global_step": 141461, "epoch": 1704} {"train_loss": -22.918058395385742, "global_step": 141462, "epoch": 1704} {"train_loss": -23.066434860229492, "global_step": 141463, "epoch": 1704} {"train_loss": -22.921571731567383, "global_step": 141464, "epoch": 1704} {"train_loss": -23.44538688659668, "global_step": 141465, "epoch": 1704} {"train_loss": -22.896331787109375, "global_step": 141466, "epoch": 1704} {"train_loss": -22.86809730529785, "global_step": 141467, "epoch": 1704} {"train_loss": -22.8897762298584, "global_step": 141468, "epoch": 1704} {"train_loss": -23.261823654174805, "global_step": 141469, "epoch": 1704} {"train_loss": -23.13739013671875, "global_step": 141470, "epoch": 1704} {"train_loss": -23.12611198425293, "global_step": 141471, "epoch": 1704} {"train_loss": -23.189838409423828, "global_step": 141472, "epoch": 1704} {"train_loss": -23.086027145385742, "global_step": 141473, "epoch": 1704} {"train_loss": -23.012460708618164, "global_step": 141474, "epoch": 1704} {"train_loss": -23.24032974243164, "global_step": 141475, "epoch": 1704} {"train_loss": -23.0701961517334, "global_step": 141476, "epoch": 1704} {"train_loss": -23.18808364868164, "global_step": 141477, "epoch": 1704} {"train_loss": -22.92866325378418, "global_step": 141478, "epoch": 1704} {"train_loss": -23.26858901977539, "global_step": 141479, "epoch": 1704} {"train_loss": -23.224857330322266, "global_step": 141480, "epoch": 1704} {"train_loss": -23.030689239501953, "global_step": 141481, "epoch": 1704} {"train_loss": -23.267271041870117, "global_step": 141482, "epoch": 1704} {"train_loss": -23.13513946533203, "global_step": 141483, "epoch": 1704} {"train_loss": -23.0185604095459, "global_step": 141484, "epoch": 1704} {"train_loss": -23.374969482421875, "global_step": 141485, "epoch": 1704} {"train_loss": -22.978540420532227, "global_step": 141486, "epoch": 1704} {"train_loss": -23.173810958862305, "global_step": 141487, "epoch": 1704} {"train_loss": -23.224348068237305, "global_step": 141488, "epoch": 1704} {"train_loss": -23.09699821472168, "global_step": 141489, "epoch": 1704} {"train_loss": -23.0609130859375, "global_step": 141490, "epoch": 1704} {"train_loss": -22.910232543945312, "global_step": 141491, "epoch": 1704} {"train_loss": -23.118925094604492, "global_step": 141492, "epoch": 1704} {"train_loss": -23.296463012695312, "global_step": 141493, "epoch": 1704} {"train_loss": -22.939931869506836, "global_step": 141494, "epoch": 1704} {"train_loss": -22.86659812927246, "global_step": 141495, "epoch": 1704} {"train_loss": -22.927751541137695, "global_step": 141496, "epoch": 1704} {"train_loss": -22.897926330566406, "global_step": 141497, "epoch": 1704} {"train_loss": -22.90180778503418, "global_step": 141498, "epoch": 1704} {"train_loss": -22.79595947265625, "global_step": 141499, "epoch": 1704} {"train_loss": -23.103790283203125, "global_step": 141500, "epoch": 1704} {"train_loss": -22.91885757446289, "global_step": 141501, "epoch": 1704} {"train_loss": -22.93849754333496, "global_step": 141502, "epoch": 1704} {"train_loss": -23.106382369995117, "global_step": 141503, "epoch": 1704} {"train_loss": -23.466283798217773, "global_step": 141504, "epoch": 1704} {"train_loss": -22.946853637695312, "global_step": 141505, "epoch": 1704} {"train_loss": -23.173826217651367, "global_step": 141506, "epoch": 1704} {"train_loss": -23.291860580444336, "global_step": 141507, "epoch": 1704} {"train_loss": -22.877531051635742, "global_step": 141508, "epoch": 1704} {"train_loss": -23.116281509399414, "global_step": 141509, "epoch": 1704} {"train_loss": -23.071500778198242, "global_step": 141510, "epoch": 1704} {"train_loss": -22.88705825805664, "global_step": 141511, "epoch": 1704} {"train_loss": -22.836393356323242, "global_step": 141512, "epoch": 1704} {"train_loss": -23.02694320678711, "global_step": 141513, "epoch": 1704} {"train_loss": -23.03350887528385, "global_step": 141514, "epoch": 1704, "val_loss": 6305482.0} {"train_loss": -22.5481014251709, "global_step": 141515, "epoch": 1705} {"train_loss": -22.862276077270508, "global_step": 141516, "epoch": 1705} {"train_loss": -22.570449829101562, "global_step": 141517, "epoch": 1705} {"train_loss": -22.4099063873291, "global_step": 141518, "epoch": 1705} {"train_loss": -22.369314193725586, "global_step": 141519, "epoch": 1705} {"train_loss": -22.843017578125, "global_step": 141520, "epoch": 1705} {"train_loss": -23.001768112182617, "global_step": 141521, "epoch": 1705} {"train_loss": -22.79817008972168, "global_step": 141522, "epoch": 1705} {"train_loss": -22.8867244720459, "global_step": 141523, "epoch": 1705} {"train_loss": -22.928380966186523, "global_step": 141524, "epoch": 1705} {"train_loss": -22.946714401245117, "global_step": 141525, "epoch": 1705} {"train_loss": -22.8594913482666, "global_step": 141526, "epoch": 1705} {"train_loss": -22.938024520874023, "global_step": 141527, "epoch": 1705} {"train_loss": -23.29707908630371, "global_step": 141528, "epoch": 1705} {"train_loss": -23.0744686126709, "global_step": 141529, "epoch": 1705} {"train_loss": -22.95297622680664, "global_step": 141530, "epoch": 1705} {"train_loss": -23.02264976501465, "global_step": 141531, "epoch": 1705} {"train_loss": -22.83903694152832, "global_step": 141532, "epoch": 1705} {"train_loss": -22.905057907104492, "global_step": 141533, "epoch": 1705} {"train_loss": -23.109373092651367, "global_step": 141534, "epoch": 1705} {"train_loss": -23.34027099609375, "global_step": 141535, "epoch": 1705} {"train_loss": -23.102018356323242, "global_step": 141536, "epoch": 1705} {"train_loss": -22.90363883972168, "global_step": 141537, "epoch": 1705} {"train_loss": -23.262588500976562, "global_step": 141538, "epoch": 1705} {"train_loss": -22.8399658203125, "global_step": 141539, "epoch": 1705} {"train_loss": -23.028539657592773, "global_step": 141540, "epoch": 1705} {"train_loss": -22.85260772705078, "global_step": 141541, "epoch": 1705} {"train_loss": -23.083847045898438, "global_step": 141542, "epoch": 1705} {"train_loss": -23.21524429321289, "global_step": 141543, "epoch": 1705} {"train_loss": -22.808353424072266, "global_step": 141544, "epoch": 1705} {"train_loss": -23.136938095092773, "global_step": 141545, "epoch": 1705} {"train_loss": -23.151264190673828, "global_step": 141546, "epoch": 1705} {"train_loss": -23.403833389282227, "global_step": 141547, "epoch": 1705} {"train_loss": -23.415552139282227, "global_step": 141548, "epoch": 1705} {"train_loss": -23.040945053100586, "global_step": 141549, "epoch": 1705} {"train_loss": -23.197179794311523, "global_step": 141550, "epoch": 1705} {"train_loss": -23.303516387939453, "global_step": 141551, "epoch": 1705} {"train_loss": -23.275869369506836, "global_step": 141552, "epoch": 1705} {"train_loss": -23.430465698242188, "global_step": 141553, "epoch": 1705} {"train_loss": -23.077585220336914, "global_step": 141554, "epoch": 1705} {"train_loss": -22.838041305541992, "global_step": 141555, "epoch": 1705} {"train_loss": -22.86709976196289, "global_step": 141556, "epoch": 1705} {"train_loss": -23.258193969726562, "global_step": 141557, "epoch": 1705} {"train_loss": -22.87419319152832, "global_step": 141558, "epoch": 1705} {"train_loss": -23.245594024658203, "global_step": 141559, "epoch": 1705} {"train_loss": -22.648386001586914, "global_step": 141560, "epoch": 1705} {"train_loss": -23.213241577148438, "global_step": 141561, "epoch": 1705} {"train_loss": -23.355688095092773, "global_step": 141562, "epoch": 1705} {"train_loss": -23.11849021911621, "global_step": 141563, "epoch": 1705} {"train_loss": -23.08582878112793, "global_step": 141564, "epoch": 1705} {"train_loss": -23.23529052734375, "global_step": 141565, "epoch": 1705} {"train_loss": -23.147451400756836, "global_step": 141566, "epoch": 1705} {"train_loss": -22.768712997436523, "global_step": 141567, "epoch": 1705} {"train_loss": -22.964256286621094, "global_step": 141568, "epoch": 1705} {"train_loss": -23.218626022338867, "global_step": 141569, "epoch": 1705} {"train_loss": -23.07680320739746, "global_step": 141570, "epoch": 1705} {"train_loss": -22.842071533203125, "global_step": 141571, "epoch": 1705} {"train_loss": -23.5541934967041, "global_step": 141572, "epoch": 1705} {"train_loss": -23.086719512939453, "global_step": 141573, "epoch": 1705} {"train_loss": -23.15443229675293, "global_step": 141574, "epoch": 1705} {"train_loss": -23.16358757019043, "global_step": 141575, "epoch": 1705} {"train_loss": -23.134113311767578, "global_step": 141576, "epoch": 1705} {"train_loss": -23.02728843688965, "global_step": 141577, "epoch": 1705} {"train_loss": -23.022480010986328, "global_step": 141578, "epoch": 1705} {"train_loss": -23.578386306762695, "global_step": 141579, "epoch": 1705} {"train_loss": -23.496057510375977, "global_step": 141580, "epoch": 1705} {"train_loss": -23.500303268432617, "global_step": 141581, "epoch": 1705} {"train_loss": -23.201114654541016, "global_step": 141582, "epoch": 1705} {"train_loss": -22.9409236907959, "global_step": 141583, "epoch": 1705} {"train_loss": -23.150419235229492, "global_step": 141584, "epoch": 1705} {"train_loss": -23.262659072875977, "global_step": 141585, "epoch": 1705} {"train_loss": -23.073383331298828, "global_step": 141586, "epoch": 1705} {"train_loss": -22.92761993408203, "global_step": 141587, "epoch": 1705} {"train_loss": -22.778722763061523, "global_step": 141588, "epoch": 1705} {"train_loss": -23.40398597717285, "global_step": 141589, "epoch": 1705} {"train_loss": -23.015893936157227, "global_step": 141590, "epoch": 1705} {"train_loss": -23.073938369750977, "global_step": 141591, "epoch": 1705} {"train_loss": -22.90363121032715, "global_step": 141592, "epoch": 1705} {"train_loss": -23.18975830078125, "global_step": 141593, "epoch": 1705} {"train_loss": -23.100900650024414, "global_step": 141594, "epoch": 1705} {"train_loss": -23.208784103393555, "global_step": 141595, "epoch": 1705} {"train_loss": -23.230743408203125, "global_step": 141596, "epoch": 1705} {"train_loss": -23.07518104185541, "global_step": 141597, "epoch": 1705, "val_loss": 6361780.0} {"train_loss": -22.429080963134766, "global_step": 141598, "epoch": 1706} {"train_loss": -22.72524070739746, "global_step": 141599, "epoch": 1706} {"train_loss": -22.760961532592773, "global_step": 141600, "epoch": 1706} {"train_loss": -22.31853675842285, "global_step": 141601, "epoch": 1706} {"train_loss": -22.491727828979492, "global_step": 141602, "epoch": 1706} {"train_loss": -22.673978805541992, "global_step": 141603, "epoch": 1706} {"train_loss": -23.066526412963867, "global_step": 141604, "epoch": 1706} {"train_loss": -22.85603141784668, "global_step": 141605, "epoch": 1706} {"train_loss": -23.103164672851562, "global_step": 141606, "epoch": 1706} {"train_loss": -23.18052101135254, "global_step": 141607, "epoch": 1706} {"train_loss": -22.98895835876465, "global_step": 141608, "epoch": 1706} {"train_loss": -22.87052345275879, "global_step": 141609, "epoch": 1706} {"train_loss": -22.418989181518555, "global_step": 141610, "epoch": 1706} {"train_loss": -22.91691780090332, "global_step": 141611, "epoch": 1706} {"train_loss": -22.742206573486328, "global_step": 141612, "epoch": 1706} {"train_loss": -22.608036041259766, "global_step": 141613, "epoch": 1706} {"train_loss": -22.867727279663086, "global_step": 141614, "epoch": 1706} {"train_loss": -23.065311431884766, "global_step": 141615, "epoch": 1706} {"train_loss": -22.834102630615234, "global_step": 141616, "epoch": 1706} {"train_loss": -22.650758743286133, "global_step": 141617, "epoch": 1706} {"train_loss": -23.07308006286621, "global_step": 141618, "epoch": 1706} {"train_loss": -22.843717575073242, "global_step": 141619, "epoch": 1706} {"train_loss": -22.924528121948242, "global_step": 141620, "epoch": 1706} {"train_loss": -23.013782501220703, "global_step": 141621, "epoch": 1706} {"train_loss": -23.11555290222168, "global_step": 141622, "epoch": 1706} {"train_loss": -22.757278442382812, "global_step": 141623, "epoch": 1706} {"train_loss": -23.285364151000977, "global_step": 141624, "epoch": 1706} {"train_loss": -22.60053825378418, "global_step": 141625, "epoch": 1706} {"train_loss": -22.7987003326416, "global_step": 141626, "epoch": 1706} {"train_loss": -23.2189884185791, "global_step": 141627, "epoch": 1706} {"train_loss": -22.785369873046875, "global_step": 141628, "epoch": 1706} {"train_loss": -23.208782196044922, "global_step": 141629, "epoch": 1706} {"train_loss": -23.167789459228516, "global_step": 141630, "epoch": 1706} {"train_loss": -22.876829147338867, "global_step": 141631, "epoch": 1706} {"train_loss": -23.169269561767578, "global_step": 141632, "epoch": 1706} {"train_loss": -23.246997833251953, "global_step": 141633, "epoch": 1706} {"train_loss": -23.02459144592285, "global_step": 141634, "epoch": 1706} {"train_loss": -23.425931930541992, "global_step": 141635, "epoch": 1706} {"train_loss": -22.989830017089844, "global_step": 141636, "epoch": 1706} {"train_loss": -23.2435359954834, "global_step": 141637, "epoch": 1706} {"train_loss": -23.1851749420166, "global_step": 141638, "epoch": 1706} {"train_loss": -22.711505889892578, "global_step": 141639, "epoch": 1706} {"train_loss": -23.1214542388916, "global_step": 141640, "epoch": 1706} {"train_loss": -23.500730514526367, "global_step": 141641, "epoch": 1706} {"train_loss": -22.938735961914062, "global_step": 141642, "epoch": 1706} {"train_loss": -22.763643264770508, "global_step": 141643, "epoch": 1706} {"train_loss": -23.050291061401367, "global_step": 141644, "epoch": 1706} {"train_loss": -23.19347381591797, "global_step": 141645, "epoch": 1706} {"train_loss": -23.2720947265625, "global_step": 141646, "epoch": 1706} {"train_loss": -23.140737533569336, "global_step": 141647, "epoch": 1706} {"train_loss": -23.181737899780273, "global_step": 141648, "epoch": 1706} {"train_loss": -23.055051803588867, "global_step": 141649, "epoch": 1706} {"train_loss": -22.74951171875, "global_step": 141650, "epoch": 1706} {"train_loss": -23.067611694335938, "global_step": 141651, "epoch": 1706} {"train_loss": -23.069143295288086, "global_step": 141652, "epoch": 1706} {"train_loss": -22.892940521240234, "global_step": 141653, "epoch": 1706} {"train_loss": -22.952409744262695, "global_step": 141654, "epoch": 1706} {"train_loss": -23.270553588867188, "global_step": 141655, "epoch": 1706} {"train_loss": -22.75061798095703, "global_step": 141656, "epoch": 1706} {"train_loss": -23.2865047454834, "global_step": 141657, "epoch": 1706} {"train_loss": -22.705114364624023, "global_step": 141658, "epoch": 1706} {"train_loss": -22.92522621154785, "global_step": 141659, "epoch": 1706} {"train_loss": -23.037052154541016, "global_step": 141660, "epoch": 1706} {"train_loss": -23.181264877319336, "global_step": 141661, "epoch": 1706} {"train_loss": -22.680606842041016, "global_step": 141662, "epoch": 1706} {"train_loss": -22.734594345092773, "global_step": 141663, "epoch": 1706} {"train_loss": -22.914091110229492, "global_step": 141664, "epoch": 1706} {"train_loss": -23.000160217285156, "global_step": 141665, "epoch": 1706} {"train_loss": -23.148107528686523, "global_step": 141666, "epoch": 1706} {"train_loss": -23.028898239135742, "global_step": 141667, "epoch": 1706} {"train_loss": -23.177566528320312, "global_step": 141668, "epoch": 1706} {"train_loss": -23.3835391998291, "global_step": 141669, "epoch": 1706} {"train_loss": -23.144775390625, "global_step": 141670, "epoch": 1706} {"train_loss": -23.450014114379883, "global_step": 141671, "epoch": 1706} {"train_loss": -23.17816162109375, "global_step": 141672, "epoch": 1706} {"train_loss": -22.79998779296875, "global_step": 141673, "epoch": 1706} {"train_loss": -22.949968338012695, "global_step": 141674, "epoch": 1706} {"train_loss": -23.18181037902832, "global_step": 141675, "epoch": 1706} {"train_loss": -23.204099655151367, "global_step": 141676, "epoch": 1706} {"train_loss": -22.978988647460938, "global_step": 141677, "epoch": 1706} {"train_loss": -23.007789611816406, "global_step": 141678, "epoch": 1706} {"train_loss": -23.287633895874023, "global_step": 141679, "epoch": 1706} {"train_loss": -22.980536771107868, "global_step": 141680, "epoch": 1706, "val_loss": 6351850.5} {"train_loss": -22.40323257446289, "global_step": 141681, "epoch": 1707} {"train_loss": -22.84291648864746, "global_step": 141682, "epoch": 1707} {"train_loss": -22.685338973999023, "global_step": 141683, "epoch": 1707} {"train_loss": -22.86928367614746, "global_step": 141684, "epoch": 1707} {"train_loss": -22.979026794433594, "global_step": 141685, "epoch": 1707} {"train_loss": -22.940954208374023, "global_step": 141686, "epoch": 1707} {"train_loss": -23.159940719604492, "global_step": 141687, "epoch": 1707} {"train_loss": -22.650402069091797, "global_step": 141688, "epoch": 1707} {"train_loss": -23.01448631286621, "global_step": 141689, "epoch": 1707} {"train_loss": -22.650793075561523, "global_step": 141690, "epoch": 1707} {"train_loss": -22.803836822509766, "global_step": 141691, "epoch": 1707} {"train_loss": -22.97846031188965, "global_step": 141692, "epoch": 1707} {"train_loss": -22.426542282104492, "global_step": 141693, "epoch": 1707} {"train_loss": -22.923349380493164, "global_step": 141694, "epoch": 1707} {"train_loss": -22.700681686401367, "global_step": 141695, "epoch": 1707} {"train_loss": -22.66895866394043, "global_step": 141696, "epoch": 1707} {"train_loss": -23.131479263305664, "global_step": 141697, "epoch": 1707} {"train_loss": -22.804052352905273, "global_step": 141698, "epoch": 1707} {"train_loss": -22.999149322509766, "global_step": 141699, "epoch": 1707} {"train_loss": -23.047086715698242, "global_step": 141700, "epoch": 1707} {"train_loss": -22.601499557495117, "global_step": 141701, "epoch": 1707} {"train_loss": -23.220504760742188, "global_step": 141702, "epoch": 1707} {"train_loss": -22.8559627532959, "global_step": 141703, "epoch": 1707} {"train_loss": -23.28500747680664, "global_step": 141704, "epoch": 1707} {"train_loss": -22.79793357849121, "global_step": 141705, "epoch": 1707} {"train_loss": -22.82471466064453, "global_step": 141706, "epoch": 1707} {"train_loss": -22.932445526123047, "global_step": 141707, "epoch": 1707} {"train_loss": -23.23787498474121, "global_step": 141708, "epoch": 1707} {"train_loss": -22.91671371459961, "global_step": 141709, "epoch": 1707} {"train_loss": -22.92698097229004, "global_step": 141710, "epoch": 1707} {"train_loss": -23.106494903564453, "global_step": 141711, "epoch": 1707} {"train_loss": -22.978605270385742, "global_step": 141712, "epoch": 1707} {"train_loss": -23.532865524291992, "global_step": 141713, "epoch": 1707} {"train_loss": -22.532779693603516, "global_step": 141714, "epoch": 1707} {"train_loss": -23.012672424316406, "global_step": 141715, "epoch": 1707} {"train_loss": -23.124357223510742, "global_step": 141716, "epoch": 1707} {"train_loss": -22.69637680053711, "global_step": 141717, "epoch": 1707} {"train_loss": -23.06941795349121, "global_step": 141718, "epoch": 1707} {"train_loss": -23.35816192626953, "global_step": 141719, "epoch": 1707} {"train_loss": -23.029247283935547, "global_step": 141720, "epoch": 1707} {"train_loss": -23.22774314880371, "global_step": 141721, "epoch": 1707} {"train_loss": -23.14558982849121, "global_step": 141722, "epoch": 1707} {"train_loss": -23.530073165893555, "global_step": 141723, "epoch": 1707} {"train_loss": -23.03030776977539, "global_step": 141724, "epoch": 1707} {"train_loss": -23.36200714111328, "global_step": 141725, "epoch": 1707} {"train_loss": -22.861602783203125, "global_step": 141726, "epoch": 1707} {"train_loss": -22.847061157226562, "global_step": 141727, "epoch": 1707} {"train_loss": -22.92580795288086, "global_step": 141728, "epoch": 1707} {"train_loss": -22.881322860717773, "global_step": 141729, "epoch": 1707} {"train_loss": -23.232501983642578, "global_step": 141730, "epoch": 1707} {"train_loss": -23.123580932617188, "global_step": 141731, "epoch": 1707} {"train_loss": -22.987468719482422, "global_step": 141732, "epoch": 1707} {"train_loss": -23.290822982788086, "global_step": 141733, "epoch": 1707} {"train_loss": -23.20387077331543, "global_step": 141734, "epoch": 1707} {"train_loss": -23.32305335998535, "global_step": 141735, "epoch": 1707} {"train_loss": -23.3524112701416, "global_step": 141736, "epoch": 1707} {"train_loss": -23.172489166259766, "global_step": 141737, "epoch": 1707} {"train_loss": -23.223182678222656, "global_step": 141738, "epoch": 1707} {"train_loss": -23.273771286010742, "global_step": 141739, "epoch": 1707} {"train_loss": -23.215688705444336, "global_step": 141740, "epoch": 1707} {"train_loss": -23.055038452148438, "global_step": 141741, "epoch": 1707} {"train_loss": -23.241071701049805, "global_step": 141742, "epoch": 1707} {"train_loss": -22.94008445739746, "global_step": 141743, "epoch": 1707} {"train_loss": -23.188840866088867, "global_step": 141744, "epoch": 1707} {"train_loss": -23.378828048706055, "global_step": 141745, "epoch": 1707} {"train_loss": -23.004074096679688, "global_step": 141746, "epoch": 1707} {"train_loss": -23.490182876586914, "global_step": 141747, "epoch": 1707} {"train_loss": -23.048152923583984, "global_step": 141748, "epoch": 1707} {"train_loss": -23.359867095947266, "global_step": 141749, "epoch": 1707} {"train_loss": -23.21839714050293, "global_step": 141750, "epoch": 1707} {"train_loss": -23.443235397338867, "global_step": 141751, "epoch": 1707} {"train_loss": -23.39760398864746, "global_step": 141752, "epoch": 1707} {"train_loss": -23.546518325805664, "global_step": 141753, "epoch": 1707} {"train_loss": -23.019208908081055, "global_step": 141754, "epoch": 1707} {"train_loss": -23.18928337097168, "global_step": 141755, "epoch": 1707} {"train_loss": -23.401784896850586, "global_step": 141756, "epoch": 1707} {"train_loss": -23.329435348510742, "global_step": 141757, "epoch": 1707} {"train_loss": -23.237722396850586, "global_step": 141758, "epoch": 1707} {"train_loss": -23.17634391784668, "global_step": 141759, "epoch": 1707} {"train_loss": -23.251394271850586, "global_step": 141760, "epoch": 1707} {"train_loss": -23.33905029296875, "global_step": 141761, "epoch": 1707} {"train_loss": -23.170331954956055, "global_step": 141762, "epoch": 1707} {"train_loss": -23.049551239932875, "global_step": 141763, "epoch": 1707, "val_loss": 6255299.0} {"train_loss": -22.006057739257812, "global_step": 141764, "epoch": 1708} {"train_loss": -22.140090942382812, "global_step": 141765, "epoch": 1708} {"train_loss": -21.95984649658203, "global_step": 141766, "epoch": 1708} {"train_loss": -22.10980224609375, "global_step": 141767, "epoch": 1708} {"train_loss": -22.36485481262207, "global_step": 141768, "epoch": 1708} {"train_loss": -22.41983413696289, "global_step": 141769, "epoch": 1708} {"train_loss": -22.716466903686523, "global_step": 141770, "epoch": 1708} {"train_loss": -22.619548797607422, "global_step": 141771, "epoch": 1708} {"train_loss": -22.381912231445312, "global_step": 141772, "epoch": 1708} {"train_loss": -22.34212303161621, "global_step": 141773, "epoch": 1708} {"train_loss": -22.81080436706543, "global_step": 141774, "epoch": 1708} {"train_loss": -22.494632720947266, "global_step": 141775, "epoch": 1708} {"train_loss": -22.217205047607422, "global_step": 141776, "epoch": 1708} {"train_loss": -22.42557144165039, "global_step": 141777, "epoch": 1708} {"train_loss": -22.801040649414062, "global_step": 141778, "epoch": 1708} {"train_loss": -22.703861236572266, "global_step": 141779, "epoch": 1708} {"train_loss": -22.5227108001709, "global_step": 141780, "epoch": 1708} {"train_loss": -22.810232162475586, "global_step": 141781, "epoch": 1708} {"train_loss": -22.909452438354492, "global_step": 141782, "epoch": 1708} {"train_loss": -22.611196517944336, "global_step": 141783, "epoch": 1708} {"train_loss": -23.168607711791992, "global_step": 141784, "epoch": 1708} {"train_loss": -23.07569694519043, "global_step": 141785, "epoch": 1708} {"train_loss": -22.606735229492188, "global_step": 141786, "epoch": 1708} {"train_loss": -23.029170989990234, "global_step": 141787, "epoch": 1708} {"train_loss": -22.670780181884766, "global_step": 141788, "epoch": 1708} {"train_loss": -22.849655151367188, "global_step": 141789, "epoch": 1708} {"train_loss": -22.833627700805664, "global_step": 141790, "epoch": 1708} {"train_loss": -22.8056583404541, "global_step": 141791, "epoch": 1708} {"train_loss": -22.825387954711914, "global_step": 141792, "epoch": 1708} {"train_loss": -23.040576934814453, "global_step": 141793, "epoch": 1708} {"train_loss": -23.0443172454834, "global_step": 141794, "epoch": 1708} {"train_loss": -22.713668823242188, "global_step": 141795, "epoch": 1708} {"train_loss": -22.781131744384766, "global_step": 141796, "epoch": 1708} {"train_loss": -23.2437801361084, "global_step": 141797, "epoch": 1708} {"train_loss": -22.982135772705078, "global_step": 141798, "epoch": 1708} {"train_loss": -23.117660522460938, "global_step": 141799, "epoch": 1708} {"train_loss": -23.293487548828125, "global_step": 141800, "epoch": 1708} {"train_loss": -23.49875831604004, "global_step": 141801, "epoch": 1708} {"train_loss": -22.936853408813477, "global_step": 141802, "epoch": 1708} {"train_loss": -23.062353134155273, "global_step": 141803, "epoch": 1708} {"train_loss": -23.020774841308594, "global_step": 141804, "epoch": 1708} {"train_loss": -22.875686645507812, "global_step": 141805, "epoch": 1708} {"train_loss": -23.017227172851562, "global_step": 141806, "epoch": 1708} {"train_loss": -23.463836669921875, "global_step": 141807, "epoch": 1708} {"train_loss": -23.234891891479492, "global_step": 141808, "epoch": 1708} {"train_loss": -23.030765533447266, "global_step": 141809, "epoch": 1708} {"train_loss": -23.284006118774414, "global_step": 141810, "epoch": 1708} {"train_loss": -22.915006637573242, "global_step": 141811, "epoch": 1708} {"train_loss": -23.15663719177246, "global_step": 141812, "epoch": 1708} {"train_loss": -23.32781410217285, "global_step": 141813, "epoch": 1708} {"train_loss": -23.172592163085938, "global_step": 141814, "epoch": 1708} {"train_loss": -23.07083511352539, "global_step": 141815, "epoch": 1708} {"train_loss": -23.467594146728516, "global_step": 141816, "epoch": 1708} {"train_loss": -23.14853286743164, "global_step": 141817, "epoch": 1708} {"train_loss": -23.15618324279785, "global_step": 141818, "epoch": 1708} {"train_loss": -23.037057876586914, "global_step": 141819, "epoch": 1708} {"train_loss": -23.091428756713867, "global_step": 141820, "epoch": 1708} {"train_loss": -23.35364532470703, "global_step": 141821, "epoch": 1708} {"train_loss": -23.2082576751709, "global_step": 141822, "epoch": 1708} {"train_loss": -23.57159423828125, "global_step": 141823, "epoch": 1708} {"train_loss": -22.75011444091797, "global_step": 141824, "epoch": 1708} {"train_loss": -23.524738311767578, "global_step": 141825, "epoch": 1708} {"train_loss": -22.931385040283203, "global_step": 141826, "epoch": 1708} {"train_loss": -23.3021240234375, "global_step": 141827, "epoch": 1708} {"train_loss": -23.306676864624023, "global_step": 141828, "epoch": 1708} {"train_loss": -23.118539810180664, "global_step": 141829, "epoch": 1708} {"train_loss": -22.950878143310547, "global_step": 141830, "epoch": 1708} {"train_loss": -23.403106689453125, "global_step": 141831, "epoch": 1708} {"train_loss": -22.9769229888916, "global_step": 141832, "epoch": 1708} {"train_loss": -23.023412704467773, "global_step": 141833, "epoch": 1708} {"train_loss": -23.28628921508789, "global_step": 141834, "epoch": 1708} {"train_loss": -23.497034072875977, "global_step": 141835, "epoch": 1708} {"train_loss": -22.971080780029297, "global_step": 141836, "epoch": 1708} {"train_loss": -23.1436710357666, "global_step": 141837, "epoch": 1708} {"train_loss": -23.0130615234375, "global_step": 141838, "epoch": 1708} {"train_loss": -23.207609176635742, "global_step": 141839, "epoch": 1708} {"train_loss": -23.426359176635742, "global_step": 141840, "epoch": 1708} {"train_loss": -23.2535400390625, "global_step": 141841, "epoch": 1708} {"train_loss": -23.242307662963867, "global_step": 141842, "epoch": 1708} {"train_loss": -22.918054580688477, "global_step": 141843, "epoch": 1708} {"train_loss": -23.01885986328125, "global_step": 141844, "epoch": 1708} {"train_loss": -23.370792388916016, "global_step": 141845, "epoch": 1708} {"train_loss": -22.956335412450585, "global_step": 141846, "epoch": 1708, "val_loss": 6309013.0} {"train_loss": -22.703344345092773, "global_step": 141847, "epoch": 1709} {"train_loss": -22.628812789916992, "global_step": 141848, "epoch": 1709} {"train_loss": -22.243816375732422, "global_step": 141849, "epoch": 1709} {"train_loss": -23.067264556884766, "global_step": 141850, "epoch": 1709} {"train_loss": -22.907506942749023, "global_step": 141851, "epoch": 1709} {"train_loss": -22.482086181640625, "global_step": 141852, "epoch": 1709} {"train_loss": -22.967870712280273, "global_step": 141853, "epoch": 1709} {"train_loss": -22.867521286010742, "global_step": 141854, "epoch": 1709} {"train_loss": -23.10719108581543, "global_step": 141855, "epoch": 1709} {"train_loss": -23.091262817382812, "global_step": 141856, "epoch": 1709} {"train_loss": -22.937185287475586, "global_step": 141857, "epoch": 1709} {"train_loss": -23.2980899810791, "global_step": 141858, "epoch": 1709} {"train_loss": -22.743715286254883, "global_step": 141859, "epoch": 1709} {"train_loss": -22.746322631835938, "global_step": 141860, "epoch": 1709} {"train_loss": -23.0184326171875, "global_step": 141861, "epoch": 1709} {"train_loss": -23.264835357666016, "global_step": 141862, "epoch": 1709} {"train_loss": -22.950000762939453, "global_step": 141863, "epoch": 1709} {"train_loss": -23.028539657592773, "global_step": 141864, "epoch": 1709} {"train_loss": -23.33180809020996, "global_step": 141865, "epoch": 1709} {"train_loss": -23.331588745117188, "global_step": 141866, "epoch": 1709} {"train_loss": -23.32699966430664, "global_step": 141867, "epoch": 1709} {"train_loss": -22.952274322509766, "global_step": 141868, "epoch": 1709} {"train_loss": -23.465173721313477, "global_step": 141869, "epoch": 1709} {"train_loss": -23.149145126342773, "global_step": 141870, "epoch": 1709} {"train_loss": -22.820358276367188, "global_step": 141871, "epoch": 1709} {"train_loss": -23.264537811279297, "global_step": 141872, "epoch": 1709} {"train_loss": -23.177343368530273, "global_step": 141873, "epoch": 1709} {"train_loss": -23.182735443115234, "global_step": 141874, "epoch": 1709} {"train_loss": -23.321130752563477, "global_step": 141875, "epoch": 1709} {"train_loss": -23.115327835083008, "global_step": 141876, "epoch": 1709} {"train_loss": -23.442537307739258, "global_step": 141877, "epoch": 1709} {"train_loss": -23.355453491210938, "global_step": 141878, "epoch": 1709} {"train_loss": -23.405691146850586, "global_step": 141879, "epoch": 1709} {"train_loss": -23.332515716552734, "global_step": 141880, "epoch": 1709} {"train_loss": -22.7347469329834, "global_step": 141881, "epoch": 1709} {"train_loss": -22.982351303100586, "global_step": 141882, "epoch": 1709} {"train_loss": -23.31574249267578, "global_step": 141883, "epoch": 1709} {"train_loss": -23.33643913269043, "global_step": 141884, "epoch": 1709} {"train_loss": -23.142539978027344, "global_step": 141885, "epoch": 1709} {"train_loss": -22.907873153686523, "global_step": 141886, "epoch": 1709} {"train_loss": -23.163578033447266, "global_step": 141887, "epoch": 1709} {"train_loss": -23.071365356445312, "global_step": 141888, "epoch": 1709} {"train_loss": -23.374271392822266, "global_step": 141889, "epoch": 1709} {"train_loss": -23.070940017700195, "global_step": 141890, "epoch": 1709} {"train_loss": -23.182214736938477, "global_step": 141891, "epoch": 1709} {"train_loss": -23.05023765563965, "global_step": 141892, "epoch": 1709} {"train_loss": -23.639484405517578, "global_step": 141893, "epoch": 1709} {"train_loss": -23.060321807861328, "global_step": 141894, "epoch": 1709} {"train_loss": -23.117734909057617, "global_step": 141895, "epoch": 1709} {"train_loss": -23.17667007446289, "global_step": 141896, "epoch": 1709} {"train_loss": -23.30101203918457, "global_step": 141897, "epoch": 1709} {"train_loss": -22.899368286132812, "global_step": 141898, "epoch": 1709} {"train_loss": -23.011844635009766, "global_step": 141899, "epoch": 1709} {"train_loss": -23.123872756958008, "global_step": 141900, "epoch": 1709} {"train_loss": -22.747732162475586, "global_step": 141901, "epoch": 1709} {"train_loss": -23.072500228881836, "global_step": 141902, "epoch": 1709} {"train_loss": -23.138195037841797, "global_step": 141903, "epoch": 1709} {"train_loss": -22.824094772338867, "global_step": 141904, "epoch": 1709} {"train_loss": -23.2640380859375, "global_step": 141905, "epoch": 1709} {"train_loss": -22.870277404785156, "global_step": 141906, "epoch": 1709} {"train_loss": -22.76780128479004, "global_step": 141907, "epoch": 1709} {"train_loss": -23.11585235595703, "global_step": 141908, "epoch": 1709} {"train_loss": -23.149229049682617, "global_step": 141909, "epoch": 1709} {"train_loss": -22.5623836517334, "global_step": 141910, "epoch": 1709} {"train_loss": -22.80238151550293, "global_step": 141911, "epoch": 1709} {"train_loss": -22.610929489135742, "global_step": 141912, "epoch": 1709} {"train_loss": -23.156644821166992, "global_step": 141913, "epoch": 1709} {"train_loss": -22.680282592773438, "global_step": 141914, "epoch": 1709} {"train_loss": -23.119049072265625, "global_step": 141915, "epoch": 1709} {"train_loss": -22.80567741394043, "global_step": 141916, "epoch": 1709} {"train_loss": -22.881343841552734, "global_step": 141917, "epoch": 1709} {"train_loss": -23.15485954284668, "global_step": 141918, "epoch": 1709} {"train_loss": -23.018476486206055, "global_step": 141919, "epoch": 1709} {"train_loss": -22.855497360229492, "global_step": 141920, "epoch": 1709} {"train_loss": -23.38396453857422, "global_step": 141921, "epoch": 1709} {"train_loss": -23.18373680114746, "global_step": 141922, "epoch": 1709} {"train_loss": -23.07115364074707, "global_step": 141923, "epoch": 1709} {"train_loss": -23.03384780883789, "global_step": 141924, "epoch": 1709} {"train_loss": -23.2802791595459, "global_step": 141925, "epoch": 1709} {"train_loss": -22.881250381469727, "global_step": 141926, "epoch": 1709} {"train_loss": -22.849319458007812, "global_step": 141927, "epoch": 1709} {"train_loss": -23.19282341003418, "global_step": 141928, "epoch": 1709} {"train_loss": -23.047486822289155, "global_step": 141929, "epoch": 1709, "val_loss": 6268920.5} {"train_loss": -23.07895278930664, "global_step": 141930, "epoch": 1710} {"train_loss": -22.806055068969727, "global_step": 141931, "epoch": 1710} {"train_loss": -22.94496726989746, "global_step": 141932, "epoch": 1710} {"train_loss": -22.779470443725586, "global_step": 141933, "epoch": 1710} {"train_loss": -23.149734497070312, "global_step": 141934, "epoch": 1710} {"train_loss": -23.030454635620117, "global_step": 141935, "epoch": 1710} {"train_loss": -23.088176727294922, "global_step": 141936, "epoch": 1710} {"train_loss": -22.96742820739746, "global_step": 141937, "epoch": 1710} {"train_loss": -22.9586124420166, "global_step": 141938, "epoch": 1710} {"train_loss": -22.55946922302246, "global_step": 141939, "epoch": 1710} {"train_loss": -23.070377349853516, "global_step": 141940, "epoch": 1710} {"train_loss": -22.96791648864746, "global_step": 141941, "epoch": 1710} {"train_loss": -23.14985466003418, "global_step": 141942, "epoch": 1710} {"train_loss": -22.993408203125, "global_step": 141943, "epoch": 1710} {"train_loss": -23.174497604370117, "global_step": 141944, "epoch": 1710} {"train_loss": -23.11188316345215, "global_step": 141945, "epoch": 1710} {"train_loss": -22.943395614624023, "global_step": 141946, "epoch": 1710} {"train_loss": -22.86542320251465, "global_step": 141947, "epoch": 1710} {"train_loss": -22.965606689453125, "global_step": 141948, "epoch": 1710} {"train_loss": -23.104122161865234, "global_step": 141949, "epoch": 1710} {"train_loss": -22.99274253845215, "global_step": 141950, "epoch": 1710} {"train_loss": -22.899755477905273, "global_step": 141951, "epoch": 1710} {"train_loss": -22.78183364868164, "global_step": 141952, "epoch": 1710} {"train_loss": -22.844558715820312, "global_step": 141953, "epoch": 1710} {"train_loss": -22.845294952392578, "global_step": 141954, "epoch": 1710} {"train_loss": -22.987369537353516, "global_step": 141955, "epoch": 1710} {"train_loss": -22.96462059020996, "global_step": 141956, "epoch": 1710} {"train_loss": -23.2268009185791, "global_step": 141957, "epoch": 1710} {"train_loss": -22.90958023071289, "global_step": 141958, "epoch": 1710} {"train_loss": -22.85472869873047, "global_step": 141959, "epoch": 1710} {"train_loss": -22.848112106323242, "global_step": 141960, "epoch": 1710} {"train_loss": -22.852502822875977, "global_step": 141961, "epoch": 1710} {"train_loss": -22.934568405151367, "global_step": 141962, "epoch": 1710} {"train_loss": -23.19215202331543, "global_step": 141963, "epoch": 1710} {"train_loss": -22.88603401184082, "global_step": 141964, "epoch": 1710} {"train_loss": -23.32695198059082, "global_step": 141965, "epoch": 1710} {"train_loss": -23.282718658447266, "global_step": 141966, "epoch": 1710} {"train_loss": -23.104328155517578, "global_step": 141967, "epoch": 1710} {"train_loss": -23.225614547729492, "global_step": 141968, "epoch": 1710} {"train_loss": -23.075454711914062, "global_step": 141969, "epoch": 1710} {"train_loss": -23.68804931640625, "global_step": 141970, "epoch": 1710} {"train_loss": -23.20697021484375, "global_step": 141971, "epoch": 1710} {"train_loss": -23.03120994567871, "global_step": 141972, "epoch": 1710} {"train_loss": -23.43688201904297, "global_step": 141973, "epoch": 1710} {"train_loss": -23.26304817199707, "global_step": 141974, "epoch": 1710} {"train_loss": -23.052000045776367, "global_step": 141975, "epoch": 1710} {"train_loss": -23.714834213256836, "global_step": 141976, "epoch": 1710} {"train_loss": -23.272184371948242, "global_step": 141977, "epoch": 1710} {"train_loss": -23.394702911376953, "global_step": 141978, "epoch": 1710} {"train_loss": -22.68182945251465, "global_step": 141979, "epoch": 1710} {"train_loss": -22.76346778869629, "global_step": 141980, "epoch": 1710} {"train_loss": -23.199628829956055, "global_step": 141981, "epoch": 1710} {"train_loss": -23.6580810546875, "global_step": 141982, "epoch": 1710} {"train_loss": -22.69280433654785, "global_step": 141983, "epoch": 1710} {"train_loss": -23.110326766967773, "global_step": 141984, "epoch": 1710} {"train_loss": -23.335485458374023, "global_step": 141985, "epoch": 1710} {"train_loss": -23.200464248657227, "global_step": 141986, "epoch": 1710} {"train_loss": -23.18165397644043, "global_step": 141987, "epoch": 1710} {"train_loss": -22.96666717529297, "global_step": 141988, "epoch": 1710} {"train_loss": -23.336097717285156, "global_step": 141989, "epoch": 1710} {"train_loss": -22.916322708129883, "global_step": 141990, "epoch": 1710} {"train_loss": -23.12556266784668, "global_step": 141991, "epoch": 1710} {"train_loss": -23.371763229370117, "global_step": 141992, "epoch": 1710} {"train_loss": -23.216812133789062, "global_step": 141993, "epoch": 1710} {"train_loss": -23.086668014526367, "global_step": 141994, "epoch": 1710} {"train_loss": -23.03150177001953, "global_step": 141995, "epoch": 1710} {"train_loss": -23.155338287353516, "global_step": 141996, "epoch": 1710} {"train_loss": -23.116369247436523, "global_step": 141997, "epoch": 1710} {"train_loss": -23.25523567199707, "global_step": 141998, "epoch": 1710} {"train_loss": -23.005672454833984, "global_step": 141999, "epoch": 1710} {"train_loss": -22.89522361755371, "global_step": 142000, "epoch": 1710} {"train_loss": -23.423194885253906, "global_step": 142001, "epoch": 1710} {"train_loss": -23.470678329467773, "global_step": 142002, "epoch": 1710} {"train_loss": -22.741422653198242, "global_step": 142003, "epoch": 1710} {"train_loss": -23.233186721801758, "global_step": 142004, "epoch": 1710} {"train_loss": -23.13206672668457, "global_step": 142005, "epoch": 1710} {"train_loss": -23.096853256225586, "global_step": 142006, "epoch": 1710} {"train_loss": -22.85294532775879, "global_step": 142007, "epoch": 1710} {"train_loss": -23.203495025634766, "global_step": 142008, "epoch": 1710} {"train_loss": -22.734731674194336, "global_step": 142009, "epoch": 1710} {"train_loss": -23.18271255493164, "global_step": 142010, "epoch": 1710} {"train_loss": -22.941965103149414, "global_step": 142011, "epoch": 1710} {"train_loss": -23.059636081557677, "global_step": 142012, "epoch": 1710, "val_loss": 6310459.0} {"train_loss": -22.78810691833496, "global_step": 142013, "epoch": 1711} {"train_loss": -22.53330421447754, "global_step": 142014, "epoch": 1711} {"train_loss": -22.844696044921875, "global_step": 142015, "epoch": 1711} {"train_loss": -22.691625595092773, "global_step": 142016, "epoch": 1711} {"train_loss": -22.725345611572266, "global_step": 142017, "epoch": 1711} {"train_loss": -22.93674659729004, "global_step": 142018, "epoch": 1711} {"train_loss": -22.891752243041992, "global_step": 142019, "epoch": 1711} {"train_loss": -22.797639846801758, "global_step": 142020, "epoch": 1711} {"train_loss": -23.406301498413086, "global_step": 142021, "epoch": 1711} {"train_loss": -23.132678985595703, "global_step": 142022, "epoch": 1711} {"train_loss": -22.85114860534668, "global_step": 142023, "epoch": 1711} {"train_loss": -22.852018356323242, "global_step": 142024, "epoch": 1711} {"train_loss": -22.990325927734375, "global_step": 142025, "epoch": 1711} {"train_loss": -23.327573776245117, "global_step": 142026, "epoch": 1711} {"train_loss": -22.97709083557129, "global_step": 142027, "epoch": 1711} {"train_loss": -22.79736328125, "global_step": 142028, "epoch": 1711} {"train_loss": -22.829345703125, "global_step": 142029, "epoch": 1711} {"train_loss": -22.92644691467285, "global_step": 142030, "epoch": 1711} {"train_loss": -22.844146728515625, "global_step": 142031, "epoch": 1711} {"train_loss": -22.815601348876953, "global_step": 142032, "epoch": 1711} {"train_loss": -22.80588722229004, "global_step": 142033, "epoch": 1711} {"train_loss": -23.012964248657227, "global_step": 142034, "epoch": 1711} {"train_loss": -23.0582218170166, "global_step": 142035, "epoch": 1711} {"train_loss": -22.9627742767334, "global_step": 142036, "epoch": 1711} {"train_loss": -22.779958724975586, "global_step": 142037, "epoch": 1711} {"train_loss": -22.931859970092773, "global_step": 142038, "epoch": 1711} {"train_loss": -23.35433578491211, "global_step": 142039, "epoch": 1711} {"train_loss": -23.03162956237793, "global_step": 142040, "epoch": 1711} {"train_loss": -22.94682502746582, "global_step": 142041, "epoch": 1711} {"train_loss": -22.67593765258789, "global_step": 142042, "epoch": 1711} {"train_loss": -23.067447662353516, "global_step": 142043, "epoch": 1711} {"train_loss": -22.874799728393555, "global_step": 142044, "epoch": 1711} {"train_loss": -22.95167350769043, "global_step": 142045, "epoch": 1711} {"train_loss": -23.2276554107666, "global_step": 142046, "epoch": 1711} {"train_loss": -22.921520233154297, "global_step": 142047, "epoch": 1711} {"train_loss": -22.786624908447266, "global_step": 142048, "epoch": 1711} {"train_loss": -22.78208351135254, "global_step": 142049, "epoch": 1711} {"train_loss": -23.048603057861328, "global_step": 142050, "epoch": 1711} {"train_loss": -22.951705932617188, "global_step": 142051, "epoch": 1711} {"train_loss": -23.064847946166992, "global_step": 142052, "epoch": 1711} {"train_loss": -22.93014907836914, "global_step": 142053, "epoch": 1711} {"train_loss": -22.8469181060791, "global_step": 142054, "epoch": 1711} {"train_loss": -22.66680145263672, "global_step": 142055, "epoch": 1711} {"train_loss": -22.92770004272461, "global_step": 142056, "epoch": 1711} {"train_loss": -22.917409896850586, "global_step": 142057, "epoch": 1711} {"train_loss": -22.979122161865234, "global_step": 142058, "epoch": 1711} {"train_loss": -22.832178115844727, "global_step": 142059, "epoch": 1711} {"train_loss": -23.20534324645996, "global_step": 142060, "epoch": 1711} {"train_loss": -23.192493438720703, "global_step": 142061, "epoch": 1711} {"train_loss": -22.95709800720215, "global_step": 142062, "epoch": 1711} {"train_loss": -22.96761703491211, "global_step": 142063, "epoch": 1711} {"train_loss": -23.19778823852539, "global_step": 142064, "epoch": 1711} {"train_loss": -23.227354049682617, "global_step": 142065, "epoch": 1711} {"train_loss": -23.259944915771484, "global_step": 142066, "epoch": 1711} {"train_loss": -23.094575881958008, "global_step": 142067, "epoch": 1711} {"train_loss": -23.62140464782715, "global_step": 142068, "epoch": 1711} {"train_loss": -23.079010009765625, "global_step": 142069, "epoch": 1711} {"train_loss": -23.23550796508789, "global_step": 142070, "epoch": 1711} {"train_loss": -23.39918327331543, "global_step": 142071, "epoch": 1711} {"train_loss": -23.17972755432129, "global_step": 142072, "epoch": 1711} {"train_loss": -23.171445846557617, "global_step": 142073, "epoch": 1711} {"train_loss": -23.42372703552246, "global_step": 142074, "epoch": 1711} {"train_loss": -23.272716522216797, "global_step": 142075, "epoch": 1711} {"train_loss": -23.387462615966797, "global_step": 142076, "epoch": 1711} {"train_loss": -23.227331161499023, "global_step": 142077, "epoch": 1711} {"train_loss": -23.257726669311523, "global_step": 142078, "epoch": 1711} {"train_loss": -23.266965866088867, "global_step": 142079, "epoch": 1711} {"train_loss": -23.239505767822266, "global_step": 142080, "epoch": 1711} {"train_loss": -22.933706283569336, "global_step": 142081, "epoch": 1711} {"train_loss": -22.958444595336914, "global_step": 142082, "epoch": 1711} {"train_loss": -22.69814109802246, "global_step": 142083, "epoch": 1711} {"train_loss": -23.062734603881836, "global_step": 142084, "epoch": 1711} {"train_loss": -23.27577018737793, "global_step": 142085, "epoch": 1711} {"train_loss": -23.070396423339844, "global_step": 142086, "epoch": 1711} {"train_loss": -23.3227481842041, "global_step": 142087, "epoch": 1711} {"train_loss": -23.129858016967773, "global_step": 142088, "epoch": 1711} {"train_loss": -23.24087142944336, "global_step": 142089, "epoch": 1711} {"train_loss": -23.325769424438477, "global_step": 142090, "epoch": 1711} {"train_loss": -23.524084091186523, "global_step": 142091, "epoch": 1711} {"train_loss": -23.045345306396484, "global_step": 142092, "epoch": 1711} {"train_loss": -23.109067916870117, "global_step": 142093, "epoch": 1711} {"train_loss": -23.11150550842285, "global_step": 142094, "epoch": 1711} {"train_loss": -23.028640816010626, "global_step": 142095, "epoch": 1711, "val_loss": 6311296.5} {"train_loss": -23.087657928466797, "global_step": 142096, "epoch": 1712} {"train_loss": -23.086185455322266, "global_step": 142097, "epoch": 1712} {"train_loss": -22.899412155151367, "global_step": 142098, "epoch": 1712} {"train_loss": -23.0546932220459, "global_step": 142099, "epoch": 1712} {"train_loss": -23.082534790039062, "global_step": 142100, "epoch": 1712} {"train_loss": -23.22652244567871, "global_step": 142101, "epoch": 1712} {"train_loss": -23.680612564086914, "global_step": 142102, "epoch": 1712} {"train_loss": -23.078020095825195, "global_step": 142103, "epoch": 1712} {"train_loss": -22.873363494873047, "global_step": 142104, "epoch": 1712} {"train_loss": -22.959075927734375, "global_step": 142105, "epoch": 1712} {"train_loss": -22.951513290405273, "global_step": 142106, "epoch": 1712} {"train_loss": -23.02298927307129, "global_step": 142107, "epoch": 1712} {"train_loss": -22.974506378173828, "global_step": 142108, "epoch": 1712} {"train_loss": -22.935047149658203, "global_step": 142109, "epoch": 1712} {"train_loss": -22.836244583129883, "global_step": 142110, "epoch": 1712} {"train_loss": -23.23822593688965, "global_step": 142111, "epoch": 1712} {"train_loss": -23.19790267944336, "global_step": 142112, "epoch": 1712} {"train_loss": -23.157957077026367, "global_step": 142113, "epoch": 1712} {"train_loss": -23.188735961914062, "global_step": 142114, "epoch": 1712} {"train_loss": -22.955625534057617, "global_step": 142115, "epoch": 1712} {"train_loss": -23.460590362548828, "global_step": 142116, "epoch": 1712} {"train_loss": -23.026750564575195, "global_step": 142117, "epoch": 1712} {"train_loss": -23.215116500854492, "global_step": 142118, "epoch": 1712} {"train_loss": -23.10645866394043, "global_step": 142119, "epoch": 1712} {"train_loss": -23.197851181030273, "global_step": 142120, "epoch": 1712} {"train_loss": -23.38532829284668, "global_step": 142121, "epoch": 1712} {"train_loss": -23.523000717163086, "global_step": 142122, "epoch": 1712} {"train_loss": -23.40343475341797, "global_step": 142123, "epoch": 1712} {"train_loss": -23.176963806152344, "global_step": 142124, "epoch": 1712} {"train_loss": -22.97024917602539, "global_step": 142125, "epoch": 1712} {"train_loss": -22.946914672851562, "global_step": 142126, "epoch": 1712} {"train_loss": -22.983789443969727, "global_step": 142127, "epoch": 1712} {"train_loss": -23.05543327331543, "global_step": 142128, "epoch": 1712} {"train_loss": -22.882535934448242, "global_step": 142129, "epoch": 1712} {"train_loss": -23.41139793395996, "global_step": 142130, "epoch": 1712} {"train_loss": -23.3938045501709, "global_step": 142131, "epoch": 1712} {"train_loss": -23.03401756286621, "global_step": 142132, "epoch": 1712} {"train_loss": -23.092992782592773, "global_step": 142133, "epoch": 1712} {"train_loss": -23.333845138549805, "global_step": 142134, "epoch": 1712} {"train_loss": -23.30613899230957, "global_step": 142135, "epoch": 1712} {"train_loss": -23.190595626831055, "global_step": 142136, "epoch": 1712} {"train_loss": -23.203022003173828, "global_step": 142137, "epoch": 1712} {"train_loss": -22.9152889251709, "global_step": 142138, "epoch": 1712} {"train_loss": -22.812170028686523, "global_step": 142139, "epoch": 1712} {"train_loss": -22.643287658691406, "global_step": 142140, "epoch": 1712} {"train_loss": -22.673288345336914, "global_step": 142141, "epoch": 1712} {"train_loss": -22.899118423461914, "global_step": 142142, "epoch": 1712} {"train_loss": -22.919172286987305, "global_step": 142143, "epoch": 1712} {"train_loss": -23.168556213378906, "global_step": 142144, "epoch": 1712} {"train_loss": -22.925119400024414, "global_step": 142145, "epoch": 1712} {"train_loss": -23.17050552368164, "global_step": 142146, "epoch": 1712} {"train_loss": -22.889211654663086, "global_step": 142147, "epoch": 1712} {"train_loss": -23.11775016784668, "global_step": 142148, "epoch": 1712} {"train_loss": -22.946102142333984, "global_step": 142149, "epoch": 1712} {"train_loss": -23.2617244720459, "global_step": 142150, "epoch": 1712} {"train_loss": -23.097583770751953, "global_step": 142151, "epoch": 1712} {"train_loss": -22.870534896850586, "global_step": 142152, "epoch": 1712} {"train_loss": -22.868467330932617, "global_step": 142153, "epoch": 1712} {"train_loss": -22.921581268310547, "global_step": 142154, "epoch": 1712} {"train_loss": -23.2890625, "global_step": 142155, "epoch": 1712} {"train_loss": -23.18621253967285, "global_step": 142156, "epoch": 1712} {"train_loss": -23.117387771606445, "global_step": 142157, "epoch": 1712} {"train_loss": -23.027080535888672, "global_step": 142158, "epoch": 1712} {"train_loss": -23.047985076904297, "global_step": 142159, "epoch": 1712} {"train_loss": -22.998798370361328, "global_step": 142160, "epoch": 1712} {"train_loss": -23.15292739868164, "global_step": 142161, "epoch": 1712} {"train_loss": -23.49667739868164, "global_step": 142162, "epoch": 1712} {"train_loss": -22.90184211730957, "global_step": 142163, "epoch": 1712} {"train_loss": -23.186552047729492, "global_step": 142164, "epoch": 1712} {"train_loss": -23.033233642578125, "global_step": 142165, "epoch": 1712} {"train_loss": -23.047788619995117, "global_step": 142166, "epoch": 1712} {"train_loss": -23.381189346313477, "global_step": 142167, "epoch": 1712} {"train_loss": -23.068527221679688, "global_step": 142168, "epoch": 1712} {"train_loss": -23.243350982666016, "global_step": 142169, "epoch": 1712} {"train_loss": -22.981605529785156, "global_step": 142170, "epoch": 1712} {"train_loss": -22.971145629882812, "global_step": 142171, "epoch": 1712} {"train_loss": -22.955612182617188, "global_step": 142172, "epoch": 1712} {"train_loss": -23.298154830932617, "global_step": 142173, "epoch": 1712} {"train_loss": -22.879501342773438, "global_step": 142174, "epoch": 1712} {"train_loss": -23.023273468017578, "global_step": 142175, "epoch": 1712} {"train_loss": -22.724416732788086, "global_step": 142176, "epoch": 1712} {"train_loss": -23.11005973815918, "global_step": 142177, "epoch": 1712} {"train_loss": -23.09010255193136, "global_step": 142178, "epoch": 1712, "val_loss": 6292598.0} {"train_loss": -23.159156799316406, "global_step": 142179, "epoch": 1713} {"train_loss": -22.27960777282715, "global_step": 142180, "epoch": 1713} {"train_loss": -22.99982261657715, "global_step": 142181, "epoch": 1713} {"train_loss": -22.069799423217773, "global_step": 142182, "epoch": 1713} {"train_loss": -22.7919921875, "global_step": 142183, "epoch": 1713} {"train_loss": -22.90726661682129, "global_step": 142184, "epoch": 1713} {"train_loss": -22.980443954467773, "global_step": 142185, "epoch": 1713} {"train_loss": -23.036117553710938, "global_step": 142186, "epoch": 1713} {"train_loss": -23.10420036315918, "global_step": 142187, "epoch": 1713} {"train_loss": -22.812204360961914, "global_step": 142188, "epoch": 1713} {"train_loss": -22.652694702148438, "global_step": 142189, "epoch": 1713} {"train_loss": -22.584638595581055, "global_step": 142190, "epoch": 1713} {"train_loss": -23.351057052612305, "global_step": 142191, "epoch": 1713} {"train_loss": -22.88202476501465, "global_step": 142192, "epoch": 1713} {"train_loss": -22.94770622253418, "global_step": 142193, "epoch": 1713} {"train_loss": -22.96265983581543, "global_step": 142194, "epoch": 1713} {"train_loss": -23.158069610595703, "global_step": 142195, "epoch": 1713} {"train_loss": -22.943037033081055, "global_step": 142196, "epoch": 1713} {"train_loss": -22.741823196411133, "global_step": 142197, "epoch": 1713} {"train_loss": -23.406566619873047, "global_step": 142198, "epoch": 1713} {"train_loss": -23.051483154296875, "global_step": 142199, "epoch": 1713} {"train_loss": -23.04938316345215, "global_step": 142200, "epoch": 1713} {"train_loss": -23.155256271362305, "global_step": 142201, "epoch": 1713} {"train_loss": -23.234329223632812, "global_step": 142202, "epoch": 1713} {"train_loss": -23.05196189880371, "global_step": 142203, "epoch": 1713} {"train_loss": -23.556354522705078, "global_step": 142204, "epoch": 1713} {"train_loss": -23.137990951538086, "global_step": 142205, "epoch": 1713} {"train_loss": -23.145654678344727, "global_step": 142206, "epoch": 1713} {"train_loss": -23.608346939086914, "global_step": 142207, "epoch": 1713} {"train_loss": -23.426937103271484, "global_step": 142208, "epoch": 1713} {"train_loss": -23.14589500427246, "global_step": 142209, "epoch": 1713} {"train_loss": -23.146604537963867, "global_step": 142210, "epoch": 1713} {"train_loss": -23.386762619018555, "global_step": 142211, "epoch": 1713} {"train_loss": -23.314701080322266, "global_step": 142212, "epoch": 1713} {"train_loss": -22.69508171081543, "global_step": 142213, "epoch": 1713} {"train_loss": -22.73598289489746, "global_step": 142214, "epoch": 1713} {"train_loss": -22.94692611694336, "global_step": 142215, "epoch": 1713} {"train_loss": -23.368261337280273, "global_step": 142216, "epoch": 1713} {"train_loss": -23.094409942626953, "global_step": 142217, "epoch": 1713} {"train_loss": -22.99156379699707, "global_step": 142218, "epoch": 1713} {"train_loss": -23.1019229888916, "global_step": 142219, "epoch": 1713} {"train_loss": -22.581274032592773, "global_step": 142220, "epoch": 1713} {"train_loss": -22.89362907409668, "global_step": 142221, "epoch": 1713} {"train_loss": -22.960330963134766, "global_step": 142222, "epoch": 1713} {"train_loss": -23.112218856811523, "global_step": 142223, "epoch": 1713} {"train_loss": -22.942102432250977, "global_step": 142224, "epoch": 1713} {"train_loss": -23.214242935180664, "global_step": 142225, "epoch": 1713} {"train_loss": -22.843351364135742, "global_step": 142226, "epoch": 1713} {"train_loss": -23.107681274414062, "global_step": 142227, "epoch": 1713} {"train_loss": -23.494544982910156, "global_step": 142228, "epoch": 1713} {"train_loss": -23.019210815429688, "global_step": 142229, "epoch": 1713} {"train_loss": -23.349720001220703, "global_step": 142230, "epoch": 1713} {"train_loss": -23.04585838317871, "global_step": 142231, "epoch": 1713} {"train_loss": -23.101041793823242, "global_step": 142232, "epoch": 1713} {"train_loss": -23.28946876525879, "global_step": 142233, "epoch": 1713} {"train_loss": -22.99458122253418, "global_step": 142234, "epoch": 1713} {"train_loss": -23.281034469604492, "global_step": 142235, "epoch": 1713} {"train_loss": -23.256162643432617, "global_step": 142236, "epoch": 1713} {"train_loss": -23.081621170043945, "global_step": 142237, "epoch": 1713} {"train_loss": -23.642669677734375, "global_step": 142238, "epoch": 1713} {"train_loss": -22.897159576416016, "global_step": 142239, "epoch": 1713} {"train_loss": -22.97181510925293, "global_step": 142240, "epoch": 1713} {"train_loss": -22.866191864013672, "global_step": 142241, "epoch": 1713} {"train_loss": -23.234031677246094, "global_step": 142242, "epoch": 1713} {"train_loss": -23.11347770690918, "global_step": 142243, "epoch": 1713} {"train_loss": -22.902545928955078, "global_step": 142244, "epoch": 1713} {"train_loss": -23.201881408691406, "global_step": 142245, "epoch": 1713} {"train_loss": -23.178266525268555, "global_step": 142246, "epoch": 1713} {"train_loss": -23.014846801757812, "global_step": 142247, "epoch": 1713} {"train_loss": -23.170246124267578, "global_step": 142248, "epoch": 1713} {"train_loss": -23.05521583557129, "global_step": 142249, "epoch": 1713} {"train_loss": -23.137584686279297, "global_step": 142250, "epoch": 1713} {"train_loss": -23.440832138061523, "global_step": 142251, "epoch": 1713} {"train_loss": -23.518707275390625, "global_step": 142252, "epoch": 1713} {"train_loss": -22.985010147094727, "global_step": 142253, "epoch": 1713} {"train_loss": -23.074542999267578, "global_step": 142254, "epoch": 1713} {"train_loss": -23.455530166625977, "global_step": 142255, "epoch": 1713} {"train_loss": -23.472810745239258, "global_step": 142256, "epoch": 1713} {"train_loss": -22.733362197875977, "global_step": 142257, "epoch": 1713} {"train_loss": -23.241622924804688, "global_step": 142258, "epoch": 1713} {"train_loss": -22.641202926635742, "global_step": 142259, "epoch": 1713} {"train_loss": -22.765363693237305, "global_step": 142260, "epoch": 1713} {"train_loss": -23.0695594419916, "global_step": 142261, "epoch": 1713, "val_loss": 6317262.0} {"train_loss": -22.23795509338379, "global_step": 142262, "epoch": 1714} {"train_loss": -22.172468185424805, "global_step": 142263, "epoch": 1714} {"train_loss": -22.37495994567871, "global_step": 142264, "epoch": 1714} {"train_loss": -22.170795440673828, "global_step": 142265, "epoch": 1714} {"train_loss": -22.180021286010742, "global_step": 142266, "epoch": 1714} {"train_loss": -22.666227340698242, "global_step": 142267, "epoch": 1714} {"train_loss": -22.17388343811035, "global_step": 142268, "epoch": 1714} {"train_loss": -22.430973052978516, "global_step": 142269, "epoch": 1714} {"train_loss": -22.7825984954834, "global_step": 142270, "epoch": 1714} {"train_loss": -22.643003463745117, "global_step": 142271, "epoch": 1714} {"train_loss": -22.95647621154785, "global_step": 142272, "epoch": 1714} {"train_loss": -22.332841873168945, "global_step": 142273, "epoch": 1714} {"train_loss": -22.73516845703125, "global_step": 142274, "epoch": 1714} {"train_loss": -22.63031005859375, "global_step": 142275, "epoch": 1714} {"train_loss": -22.716413497924805, "global_step": 142276, "epoch": 1714} {"train_loss": -23.211212158203125, "global_step": 142277, "epoch": 1714} {"train_loss": -22.738794326782227, "global_step": 142278, "epoch": 1714} {"train_loss": -22.701093673706055, "global_step": 142279, "epoch": 1714} {"train_loss": -23.10919761657715, "global_step": 142280, "epoch": 1714} {"train_loss": -22.952749252319336, "global_step": 142281, "epoch": 1714} {"train_loss": -22.568199157714844, "global_step": 142282, "epoch": 1714} {"train_loss": -22.472797393798828, "global_step": 142283, "epoch": 1714} {"train_loss": -22.767120361328125, "global_step": 142284, "epoch": 1714} {"train_loss": -22.534252166748047, "global_step": 142285, "epoch": 1714} {"train_loss": -23.117889404296875, "global_step": 142286, "epoch": 1714} {"train_loss": -23.09052085876465, "global_step": 142287, "epoch": 1714} {"train_loss": -23.069347381591797, "global_step": 142288, "epoch": 1714} {"train_loss": -22.897565841674805, "global_step": 142289, "epoch": 1714} {"train_loss": -23.150678634643555, "global_step": 142290, "epoch": 1714} {"train_loss": -23.085826873779297, "global_step": 142291, "epoch": 1714} {"train_loss": -22.79969596862793, "global_step": 142292, "epoch": 1714} {"train_loss": -22.981033325195312, "global_step": 142293, "epoch": 1714} {"train_loss": -23.180997848510742, "global_step": 142294, "epoch": 1714} {"train_loss": -23.006214141845703, "global_step": 142295, "epoch": 1714} {"train_loss": -23.114501953125, "global_step": 142296, "epoch": 1714} {"train_loss": -23.09686279296875, "global_step": 142297, "epoch": 1714} {"train_loss": -23.07588005065918, "global_step": 142298, "epoch": 1714} {"train_loss": -22.892141342163086, "global_step": 142299, "epoch": 1714} {"train_loss": -23.015111923217773, "global_step": 142300, "epoch": 1714} {"train_loss": -22.865299224853516, "global_step": 142301, "epoch": 1714} {"train_loss": -23.23611068725586, "global_step": 142302, "epoch": 1714} {"train_loss": -23.21803092956543, "global_step": 142303, "epoch": 1714} {"train_loss": -22.9853515625, "global_step": 142304, "epoch": 1714} {"train_loss": -23.689960479736328, "global_step": 142305, "epoch": 1714} {"train_loss": -22.878198623657227, "global_step": 142306, "epoch": 1714} {"train_loss": -23.06569480895996, "global_step": 142307, "epoch": 1714} {"train_loss": -23.1910400390625, "global_step": 142308, "epoch": 1714} {"train_loss": -22.86194610595703, "global_step": 142309, "epoch": 1714} {"train_loss": -22.8336124420166, "global_step": 142310, "epoch": 1714} {"train_loss": -23.348758697509766, "global_step": 142311, "epoch": 1714} {"train_loss": -23.02404022216797, "global_step": 142312, "epoch": 1714} {"train_loss": -23.11918830871582, "global_step": 142313, "epoch": 1714} {"train_loss": -23.044757843017578, "global_step": 142314, "epoch": 1714} {"train_loss": -23.028594970703125, "global_step": 142315, "epoch": 1714} {"train_loss": -22.776538848876953, "global_step": 142316, "epoch": 1714} {"train_loss": -23.126867294311523, "global_step": 142317, "epoch": 1714} {"train_loss": -23.201059341430664, "global_step": 142318, "epoch": 1714} {"train_loss": -23.325193405151367, "global_step": 142319, "epoch": 1714} {"train_loss": -22.847043991088867, "global_step": 142320, "epoch": 1714} {"train_loss": -22.810855865478516, "global_step": 142321, "epoch": 1714} {"train_loss": -23.408018112182617, "global_step": 142322, "epoch": 1714} {"train_loss": -23.22349739074707, "global_step": 142323, "epoch": 1714} {"train_loss": -22.853260040283203, "global_step": 142324, "epoch": 1714} {"train_loss": -23.039793014526367, "global_step": 142325, "epoch": 1714} {"train_loss": -23.076467514038086, "global_step": 142326, "epoch": 1714} {"train_loss": -23.03104591369629, "global_step": 142327, "epoch": 1714} {"train_loss": -23.134668350219727, "global_step": 142328, "epoch": 1714} {"train_loss": -23.522716522216797, "global_step": 142329, "epoch": 1714} {"train_loss": -22.93784523010254, "global_step": 142330, "epoch": 1714} {"train_loss": -22.832801818847656, "global_step": 142331, "epoch": 1714} {"train_loss": -23.063617706298828, "global_step": 142332, "epoch": 1714} {"train_loss": -23.351266860961914, "global_step": 142333, "epoch": 1714} {"train_loss": -23.154264450073242, "global_step": 142334, "epoch": 1714} {"train_loss": -23.153486251831055, "global_step": 142335, "epoch": 1714} {"train_loss": -23.222579956054688, "global_step": 142336, "epoch": 1714} {"train_loss": -23.28224754333496, "global_step": 142337, "epoch": 1714} {"train_loss": -22.99100685119629, "global_step": 142338, "epoch": 1714} {"train_loss": -22.790145874023438, "global_step": 142339, "epoch": 1714} {"train_loss": -23.29304313659668, "global_step": 142340, "epoch": 1714} {"train_loss": -23.343368530273438, "global_step": 142341, "epoch": 1714} {"train_loss": -23.26152992248535, "global_step": 142342, "epoch": 1714} {"train_loss": -23.05940055847168, "global_step": 142343, "epoch": 1714} {"train_loss": -22.928858998310137, "global_step": 142344, "epoch": 1714, "val_loss": 6241320.0} {"train_loss": -22.55195426940918, "global_step": 142345, "epoch": 1715} {"train_loss": -22.702564239501953, "global_step": 142346, "epoch": 1715} {"train_loss": -22.519418716430664, "global_step": 142347, "epoch": 1715} {"train_loss": -22.623987197875977, "global_step": 142348, "epoch": 1715} {"train_loss": -22.188770294189453, "global_step": 142349, "epoch": 1715} {"train_loss": -22.360445022583008, "global_step": 142350, "epoch": 1715} {"train_loss": -22.7010555267334, "global_step": 142351, "epoch": 1715} {"train_loss": -22.986291885375977, "global_step": 142352, "epoch": 1715} {"train_loss": -22.367069244384766, "global_step": 142353, "epoch": 1715} {"train_loss": -22.63709259033203, "global_step": 142354, "epoch": 1715} {"train_loss": -22.49367904663086, "global_step": 142355, "epoch": 1715} {"train_loss": -22.72464370727539, "global_step": 142356, "epoch": 1715} {"train_loss": -23.003957748413086, "global_step": 142357, "epoch": 1715} {"train_loss": -22.841463088989258, "global_step": 142358, "epoch": 1715} {"train_loss": -23.262338638305664, "global_step": 142359, "epoch": 1715} {"train_loss": -22.825897216796875, "global_step": 142360, "epoch": 1715} {"train_loss": -22.681442260742188, "global_step": 142361, "epoch": 1715} {"train_loss": -22.933120727539062, "global_step": 142362, "epoch": 1715} {"train_loss": -22.729764938354492, "global_step": 142363, "epoch": 1715} {"train_loss": -22.615079879760742, "global_step": 142364, "epoch": 1715} {"train_loss": -22.854394912719727, "global_step": 142365, "epoch": 1715} {"train_loss": -23.02186393737793, "global_step": 142366, "epoch": 1715} {"train_loss": -22.985837936401367, "global_step": 142367, "epoch": 1715} {"train_loss": -23.24582862854004, "global_step": 142368, "epoch": 1715} {"train_loss": -23.04039192199707, "global_step": 142369, "epoch": 1715} {"train_loss": -22.84967041015625, "global_step": 142370, "epoch": 1715} {"train_loss": -22.687885284423828, "global_step": 142371, "epoch": 1715} {"train_loss": -23.35129737854004, "global_step": 142372, "epoch": 1715} {"train_loss": -22.99916648864746, "global_step": 142373, "epoch": 1715} {"train_loss": -23.23904800415039, "global_step": 142374, "epoch": 1715} {"train_loss": -22.751707077026367, "global_step": 142375, "epoch": 1715} {"train_loss": -22.94487190246582, "global_step": 142376, "epoch": 1715} {"train_loss": -23.203533172607422, "global_step": 142377, "epoch": 1715} {"train_loss": -23.305034637451172, "global_step": 142378, "epoch": 1715} {"train_loss": -23.136695861816406, "global_step": 142379, "epoch": 1715} {"train_loss": -23.350671768188477, "global_step": 142380, "epoch": 1715} {"train_loss": -23.090131759643555, "global_step": 142381, "epoch": 1715} {"train_loss": -23.340978622436523, "global_step": 142382, "epoch": 1715} {"train_loss": -22.922895431518555, "global_step": 142383, "epoch": 1715} {"train_loss": -23.049657821655273, "global_step": 142384, "epoch": 1715} {"train_loss": -23.135923385620117, "global_step": 142385, "epoch": 1715} {"train_loss": -23.356443405151367, "global_step": 142386, "epoch": 1715} {"train_loss": -23.436695098876953, "global_step": 142387, "epoch": 1715} {"train_loss": -23.122879028320312, "global_step": 142388, "epoch": 1715} {"train_loss": -23.27912712097168, "global_step": 142389, "epoch": 1715} {"train_loss": -23.057981491088867, "global_step": 142390, "epoch": 1715} {"train_loss": -23.26337242126465, "global_step": 142391, "epoch": 1715} {"train_loss": -23.41353416442871, "global_step": 142392, "epoch": 1715} {"train_loss": -23.213804244995117, "global_step": 142393, "epoch": 1715} {"train_loss": -23.1016845703125, "global_step": 142394, "epoch": 1715} {"train_loss": -23.490697860717773, "global_step": 142395, "epoch": 1715} {"train_loss": -23.296064376831055, "global_step": 142396, "epoch": 1715} {"train_loss": -23.066543579101562, "global_step": 142397, "epoch": 1715} {"train_loss": -23.547277450561523, "global_step": 142398, "epoch": 1715} {"train_loss": -23.050073623657227, "global_step": 142399, "epoch": 1715} {"train_loss": -23.076467514038086, "global_step": 142400, "epoch": 1715} {"train_loss": -22.93680763244629, "global_step": 142401, "epoch": 1715} {"train_loss": -22.922693252563477, "global_step": 142402, "epoch": 1715} {"train_loss": -23.339445114135742, "global_step": 142403, "epoch": 1715} {"train_loss": -22.709705352783203, "global_step": 142404, "epoch": 1715} {"train_loss": -23.260093688964844, "global_step": 142405, "epoch": 1715} {"train_loss": -23.20981788635254, "global_step": 142406, "epoch": 1715} {"train_loss": -23.102567672729492, "global_step": 142407, "epoch": 1715} {"train_loss": -23.098655700683594, "global_step": 142408, "epoch": 1715} {"train_loss": -23.271203994750977, "global_step": 142409, "epoch": 1715} {"train_loss": -23.056678771972656, "global_step": 142410, "epoch": 1715} {"train_loss": -22.608787536621094, "global_step": 142411, "epoch": 1715} {"train_loss": -22.603271484375, "global_step": 142412, "epoch": 1715} {"train_loss": -23.050519943237305, "global_step": 142413, "epoch": 1715} {"train_loss": -23.353281021118164, "global_step": 142414, "epoch": 1715} {"train_loss": -23.375741958618164, "global_step": 142415, "epoch": 1715} {"train_loss": -22.89400291442871, "global_step": 142416, "epoch": 1715} {"train_loss": -23.215173721313477, "global_step": 142417, "epoch": 1715} {"train_loss": -23.100921630859375, "global_step": 142418, "epoch": 1715} {"train_loss": -22.930692672729492, "global_step": 142419, "epoch": 1715} {"train_loss": -23.265745162963867, "global_step": 142420, "epoch": 1715} {"train_loss": -23.181522369384766, "global_step": 142421, "epoch": 1715} {"train_loss": -22.801137924194336, "global_step": 142422, "epoch": 1715} {"train_loss": -22.994815826416016, "global_step": 142423, "epoch": 1715} {"train_loss": -23.03987693786621, "global_step": 142424, "epoch": 1715} {"train_loss": -23.06593894958496, "global_step": 142425, "epoch": 1715} {"train_loss": -22.777339935302734, "global_step": 142426, "epoch": 1715} {"train_loss": -22.993874607315984, "global_step": 142427, "epoch": 1715, "val_loss": 6277343.0} {"train_loss": -22.167179107666016, "global_step": 142428, "epoch": 1716} {"train_loss": -22.752460479736328, "global_step": 142429, "epoch": 1716} {"train_loss": -22.735809326171875, "global_step": 142430, "epoch": 1716} {"train_loss": -22.697607040405273, "global_step": 142431, "epoch": 1716} {"train_loss": -22.83417510986328, "global_step": 142432, "epoch": 1716} {"train_loss": -22.676511764526367, "global_step": 142433, "epoch": 1716} {"train_loss": -22.931636810302734, "global_step": 142434, "epoch": 1716} {"train_loss": -22.592437744140625, "global_step": 142435, "epoch": 1716} {"train_loss": -23.469196319580078, "global_step": 142436, "epoch": 1716} {"train_loss": -22.797876358032227, "global_step": 142437, "epoch": 1716} {"train_loss": -22.986387252807617, "global_step": 142438, "epoch": 1716} {"train_loss": -22.803447723388672, "global_step": 142439, "epoch": 1716} {"train_loss": -23.354232788085938, "global_step": 142440, "epoch": 1716} {"train_loss": -22.83746337890625, "global_step": 142441, "epoch": 1716} {"train_loss": -23.118560791015625, "global_step": 142442, "epoch": 1716} {"train_loss": -23.19586753845215, "global_step": 142443, "epoch": 1716} {"train_loss": -23.123428344726562, "global_step": 142444, "epoch": 1716} {"train_loss": -22.57720184326172, "global_step": 142445, "epoch": 1716} {"train_loss": -22.929244995117188, "global_step": 142446, "epoch": 1716} {"train_loss": -22.908414840698242, "global_step": 142447, "epoch": 1716} {"train_loss": -23.48072624206543, "global_step": 142448, "epoch": 1716} {"train_loss": -23.296945571899414, "global_step": 142449, "epoch": 1716} {"train_loss": -22.78550910949707, "global_step": 142450, "epoch": 1716} {"train_loss": -23.44472312927246, "global_step": 142451, "epoch": 1716} {"train_loss": -22.930356979370117, "global_step": 142452, "epoch": 1716} {"train_loss": -22.800146102905273, "global_step": 142453, "epoch": 1716} {"train_loss": -23.079614639282227, "global_step": 142454, "epoch": 1716} {"train_loss": -22.827367782592773, "global_step": 142455, "epoch": 1716} {"train_loss": -23.269895553588867, "global_step": 142456, "epoch": 1716} {"train_loss": -22.809192657470703, "global_step": 142457, "epoch": 1716} {"train_loss": -22.996191024780273, "global_step": 142458, "epoch": 1716} {"train_loss": -23.12879753112793, "global_step": 142459, "epoch": 1716} {"train_loss": -22.866939544677734, "global_step": 142460, "epoch": 1716} {"train_loss": -23.067697525024414, "global_step": 142461, "epoch": 1716} {"train_loss": -23.293481826782227, "global_step": 142462, "epoch": 1716} {"train_loss": -22.865787506103516, "global_step": 142463, "epoch": 1716} {"train_loss": -22.72726821899414, "global_step": 142464, "epoch": 1716} {"train_loss": -22.755882263183594, "global_step": 142465, "epoch": 1716} {"train_loss": -22.895862579345703, "global_step": 142466, "epoch": 1716} {"train_loss": -23.090185165405273, "global_step": 142467, "epoch": 1716} {"train_loss": -22.923568725585938, "global_step": 142468, "epoch": 1716} {"train_loss": -23.13629722595215, "global_step": 142469, "epoch": 1716} {"train_loss": -23.095096588134766, "global_step": 142470, "epoch": 1716} {"train_loss": -23.346750259399414, "global_step": 142471, "epoch": 1716} {"train_loss": -23.544780731201172, "global_step": 142472, "epoch": 1716} {"train_loss": -23.10603904724121, "global_step": 142473, "epoch": 1716} {"train_loss": -22.872507095336914, "global_step": 142474, "epoch": 1716} {"train_loss": -23.542325973510742, "global_step": 142475, "epoch": 1716} {"train_loss": -23.078392028808594, "global_step": 142476, "epoch": 1716} {"train_loss": -23.078907012939453, "global_step": 142477, "epoch": 1716} {"train_loss": -23.1872615814209, "global_step": 142478, "epoch": 1716} {"train_loss": -23.202245712280273, "global_step": 142479, "epoch": 1716} {"train_loss": -23.104841232299805, "global_step": 142480, "epoch": 1716} {"train_loss": -22.860971450805664, "global_step": 142481, "epoch": 1716} {"train_loss": -22.988500595092773, "global_step": 142482, "epoch": 1716} {"train_loss": -23.270069122314453, "global_step": 142483, "epoch": 1716} {"train_loss": -22.902097702026367, "global_step": 142484, "epoch": 1716} {"train_loss": -23.463186264038086, "global_step": 142485, "epoch": 1716} {"train_loss": -22.865814208984375, "global_step": 142486, "epoch": 1716} {"train_loss": -22.746381759643555, "global_step": 142487, "epoch": 1716} {"train_loss": -23.165393829345703, "global_step": 142488, "epoch": 1716} {"train_loss": -23.2984676361084, "global_step": 142489, "epoch": 1716} {"train_loss": -23.001632690429688, "global_step": 142490, "epoch": 1716} {"train_loss": -22.928678512573242, "global_step": 142491, "epoch": 1716} {"train_loss": -22.949647903442383, "global_step": 142492, "epoch": 1716} {"train_loss": -22.989065170288086, "global_step": 142493, "epoch": 1716} {"train_loss": -23.23297691345215, "global_step": 142494, "epoch": 1716} {"train_loss": -22.693506240844727, "global_step": 142495, "epoch": 1716} {"train_loss": -23.019119262695312, "global_step": 142496, "epoch": 1716} {"train_loss": -23.386425018310547, "global_step": 142497, "epoch": 1716} {"train_loss": -22.760629653930664, "global_step": 142498, "epoch": 1716} {"train_loss": -23.306058883666992, "global_step": 142499, "epoch": 1716} {"train_loss": -23.091108322143555, "global_step": 142500, "epoch": 1716} {"train_loss": -23.2258358001709, "global_step": 142501, "epoch": 1716} {"train_loss": -23.158117294311523, "global_step": 142502, "epoch": 1716} {"train_loss": -23.19642448425293, "global_step": 142503, "epoch": 1716} {"train_loss": -23.14035987854004, "global_step": 142504, "epoch": 1716} {"train_loss": -23.2148380279541, "global_step": 142505, "epoch": 1716} {"train_loss": -22.904176712036133, "global_step": 142506, "epoch": 1716} {"train_loss": -23.235593795776367, "global_step": 142507, "epoch": 1716} {"train_loss": -23.035293579101562, "global_step": 142508, "epoch": 1716} {"train_loss": -23.500802993774414, "global_step": 142509, "epoch": 1716} {"train_loss": -23.04895237842238, "global_step": 142510, "epoch": 1716, "val_loss": 6281379.0} {"train_loss": -22.633222579956055, "global_step": 142511, "epoch": 1717} {"train_loss": -23.04353141784668, "global_step": 142512, "epoch": 1717} {"train_loss": -22.82276725769043, "global_step": 142513, "epoch": 1717} {"train_loss": -23.178333282470703, "global_step": 142514, "epoch": 1717} {"train_loss": -23.188430786132812, "global_step": 142515, "epoch": 1717} {"train_loss": -22.90558433532715, "global_step": 142516, "epoch": 1717} {"train_loss": -23.115848541259766, "global_step": 142517, "epoch": 1717} {"train_loss": -22.914936065673828, "global_step": 142518, "epoch": 1717} {"train_loss": -22.928234100341797, "global_step": 142519, "epoch": 1717} {"train_loss": -22.640108108520508, "global_step": 142520, "epoch": 1717} {"train_loss": -23.349905014038086, "global_step": 142521, "epoch": 1717} {"train_loss": -22.835010528564453, "global_step": 142522, "epoch": 1717} {"train_loss": -23.292295455932617, "global_step": 142523, "epoch": 1717} {"train_loss": -23.07008934020996, "global_step": 142524, "epoch": 1717} {"train_loss": -22.723514556884766, "global_step": 142525, "epoch": 1717} {"train_loss": -23.0801944732666, "global_step": 142526, "epoch": 1717} {"train_loss": -23.196369171142578, "global_step": 142527, "epoch": 1717} {"train_loss": -22.9390869140625, "global_step": 142528, "epoch": 1717} {"train_loss": -22.598697662353516, "global_step": 142529, "epoch": 1717} {"train_loss": -22.234086990356445, "global_step": 142530, "epoch": 1717} {"train_loss": -23.103775024414062, "global_step": 142531, "epoch": 1717} {"train_loss": -23.012798309326172, "global_step": 142532, "epoch": 1717} {"train_loss": -22.65639877319336, "global_step": 142533, "epoch": 1717} {"train_loss": -22.898630142211914, "global_step": 142534, "epoch": 1717} {"train_loss": -23.366636276245117, "global_step": 142535, "epoch": 1717} {"train_loss": -22.754180908203125, "global_step": 142536, "epoch": 1717} {"train_loss": -23.295358657836914, "global_step": 142537, "epoch": 1717} {"train_loss": -23.22991371154785, "global_step": 142538, "epoch": 1717} {"train_loss": -22.86505889892578, "global_step": 142539, "epoch": 1717} {"train_loss": -23.212961196899414, "global_step": 142540, "epoch": 1717} {"train_loss": -23.225784301757812, "global_step": 142541, "epoch": 1717} {"train_loss": -23.007299423217773, "global_step": 142542, "epoch": 1717} {"train_loss": -23.301860809326172, "global_step": 142543, "epoch": 1717} {"train_loss": -23.268341064453125, "global_step": 142544, "epoch": 1717} {"train_loss": -23.06156349182129, "global_step": 142545, "epoch": 1717} {"train_loss": -23.028934478759766, "global_step": 142546, "epoch": 1717} {"train_loss": -23.195158004760742, "global_step": 142547, "epoch": 1717} {"train_loss": -23.278261184692383, "global_step": 142548, "epoch": 1717} {"train_loss": -22.747751235961914, "global_step": 142549, "epoch": 1717} {"train_loss": -23.69577407836914, "global_step": 142550, "epoch": 1717} {"train_loss": -23.253936767578125, "global_step": 142551, "epoch": 1717} {"train_loss": -23.184362411499023, "global_step": 142552, "epoch": 1717} {"train_loss": -22.870298385620117, "global_step": 142553, "epoch": 1717} {"train_loss": -23.211347579956055, "global_step": 142554, "epoch": 1717} {"train_loss": -22.97275733947754, "global_step": 142555, "epoch": 1717} {"train_loss": -23.180326461791992, "global_step": 142556, "epoch": 1717} {"train_loss": -23.18779945373535, "global_step": 142557, "epoch": 1717} {"train_loss": -22.923154830932617, "global_step": 142558, "epoch": 1717} {"train_loss": -23.210416793823242, "global_step": 142559, "epoch": 1717} {"train_loss": -23.043771743774414, "global_step": 142560, "epoch": 1717} {"train_loss": -23.52850341796875, "global_step": 142561, "epoch": 1717} {"train_loss": -23.16997718811035, "global_step": 142562, "epoch": 1717} {"train_loss": -23.05810546875, "global_step": 142563, "epoch": 1717} {"train_loss": -23.10731315612793, "global_step": 142564, "epoch": 1717} {"train_loss": -23.220739364624023, "global_step": 142565, "epoch": 1717} {"train_loss": -23.44312858581543, "global_step": 142566, "epoch": 1717} {"train_loss": -22.996044158935547, "global_step": 142567, "epoch": 1717} {"train_loss": -23.14494514465332, "global_step": 142568, "epoch": 1717} {"train_loss": -23.369775772094727, "global_step": 142569, "epoch": 1717} {"train_loss": -23.105138778686523, "global_step": 142570, "epoch": 1717} {"train_loss": -23.41498374938965, "global_step": 142571, "epoch": 1717} {"train_loss": -23.262176513671875, "global_step": 142572, "epoch": 1717} {"train_loss": -23.03911781311035, "global_step": 142573, "epoch": 1717} {"train_loss": -23.424362182617188, "global_step": 142574, "epoch": 1717} {"train_loss": -23.45377540588379, "global_step": 142575, "epoch": 1717} {"train_loss": -23.160144805908203, "global_step": 142576, "epoch": 1717} {"train_loss": -23.20051383972168, "global_step": 142577, "epoch": 1717} {"train_loss": -23.287763595581055, "global_step": 142578, "epoch": 1717} {"train_loss": -22.975929260253906, "global_step": 142579, "epoch": 1717} {"train_loss": -23.284631729125977, "global_step": 142580, "epoch": 1717} {"train_loss": -23.395009994506836, "global_step": 142581, "epoch": 1717} {"train_loss": -22.960912704467773, "global_step": 142582, "epoch": 1717} {"train_loss": -23.34919548034668, "global_step": 142583, "epoch": 1717} {"train_loss": -23.39849853515625, "global_step": 142584, "epoch": 1717} {"train_loss": -23.19136619567871, "global_step": 142585, "epoch": 1717} {"train_loss": -22.994230270385742, "global_step": 142586, "epoch": 1717} {"train_loss": -23.489652633666992, "global_step": 142587, "epoch": 1717} {"train_loss": -23.094388961791992, "global_step": 142588, "epoch": 1717} {"train_loss": -23.082128524780273, "global_step": 142589, "epoch": 1717} {"train_loss": -23.055036544799805, "global_step": 142590, "epoch": 1717} {"train_loss": -23.238357543945312, "global_step": 142591, "epoch": 1717} {"train_loss": -23.270109176635742, "global_step": 142592, "epoch": 1717} {"train_loss": -23.124732787350574, "global_step": 142593, "epoch": 1717, "val_loss": 6321609.5} {"train_loss": -23.130098342895508, "global_step": 142594, "epoch": 1718} {"train_loss": -22.633522033691406, "global_step": 142595, "epoch": 1718} {"train_loss": -22.939512252807617, "global_step": 142596, "epoch": 1718} {"train_loss": -22.877498626708984, "global_step": 142597, "epoch": 1718} {"train_loss": -23.233381271362305, "global_step": 142598, "epoch": 1718} {"train_loss": -22.885103225708008, "global_step": 142599, "epoch": 1718} {"train_loss": -23.176881790161133, "global_step": 142600, "epoch": 1718} {"train_loss": -23.058618545532227, "global_step": 142601, "epoch": 1718} {"train_loss": -22.9045467376709, "global_step": 142602, "epoch": 1718} {"train_loss": -23.23005485534668, "global_step": 142603, "epoch": 1718} {"train_loss": -23.08299446105957, "global_step": 142604, "epoch": 1718} {"train_loss": -23.232572555541992, "global_step": 142605, "epoch": 1718} {"train_loss": -23.03285026550293, "global_step": 142606, "epoch": 1718} {"train_loss": -23.106212615966797, "global_step": 142607, "epoch": 1718} {"train_loss": -22.90680694580078, "global_step": 142608, "epoch": 1718} {"train_loss": -23.050146102905273, "global_step": 142609, "epoch": 1718} {"train_loss": -23.254175186157227, "global_step": 142610, "epoch": 1718} {"train_loss": -23.16029930114746, "global_step": 142611, "epoch": 1718} {"train_loss": -22.907821655273438, "global_step": 142612, "epoch": 1718} {"train_loss": -23.09344482421875, "global_step": 142613, "epoch": 1718} {"train_loss": -22.99024772644043, "global_step": 142614, "epoch": 1718} {"train_loss": -23.09006118774414, "global_step": 142615, "epoch": 1718} {"train_loss": -22.659210205078125, "global_step": 142616, "epoch": 1718} {"train_loss": -23.10902214050293, "global_step": 142617, "epoch": 1718} {"train_loss": -22.9637393951416, "global_step": 142618, "epoch": 1718} {"train_loss": -22.557266235351562, "global_step": 142619, "epoch": 1718} {"train_loss": -22.964115142822266, "global_step": 142620, "epoch": 1718} {"train_loss": -23.267044067382812, "global_step": 142621, "epoch": 1718} {"train_loss": -23.265527725219727, "global_step": 142622, "epoch": 1718} {"train_loss": -22.917827606201172, "global_step": 142623, "epoch": 1718} {"train_loss": -22.705732345581055, "global_step": 142624, "epoch": 1718} {"train_loss": -23.15470314025879, "global_step": 142625, "epoch": 1718} {"train_loss": -22.866010665893555, "global_step": 142626, "epoch": 1718} {"train_loss": -22.98432159423828, "global_step": 142627, "epoch": 1718} {"train_loss": -23.206798553466797, "global_step": 142628, "epoch": 1718} {"train_loss": -23.46268081665039, "global_step": 142629, "epoch": 1718} {"train_loss": -22.980850219726562, "global_step": 142630, "epoch": 1718} {"train_loss": -23.066791534423828, "global_step": 142631, "epoch": 1718} {"train_loss": -22.981067657470703, "global_step": 142632, "epoch": 1718} {"train_loss": -22.929725646972656, "global_step": 142633, "epoch": 1718} {"train_loss": -22.928607940673828, "global_step": 142634, "epoch": 1718} {"train_loss": -23.102754592895508, "global_step": 142635, "epoch": 1718} {"train_loss": -22.978713989257812, "global_step": 142636, "epoch": 1718} {"train_loss": -23.148771286010742, "global_step": 142637, "epoch": 1718} {"train_loss": -23.176815032958984, "global_step": 142638, "epoch": 1718} {"train_loss": -23.17633056640625, "global_step": 142639, "epoch": 1718} {"train_loss": -23.146657943725586, "global_step": 142640, "epoch": 1718} {"train_loss": -23.028690338134766, "global_step": 142641, "epoch": 1718} {"train_loss": -22.923398971557617, "global_step": 142642, "epoch": 1718} {"train_loss": -23.1505069732666, "global_step": 142643, "epoch": 1718} {"train_loss": -23.14825439453125, "global_step": 142644, "epoch": 1718} {"train_loss": -23.00574493408203, "global_step": 142645, "epoch": 1718} {"train_loss": -23.128469467163086, "global_step": 142646, "epoch": 1718} {"train_loss": -22.82923698425293, "global_step": 142647, "epoch": 1718} {"train_loss": -22.860088348388672, "global_step": 142648, "epoch": 1718} {"train_loss": -23.261987686157227, "global_step": 142649, "epoch": 1718} {"train_loss": -23.583984375, "global_step": 142650, "epoch": 1718} {"train_loss": -22.77179527282715, "global_step": 142651, "epoch": 1718} {"train_loss": -23.217344284057617, "global_step": 142652, "epoch": 1718} {"train_loss": -23.02808952331543, "global_step": 142653, "epoch": 1718} {"train_loss": -23.033296585083008, "global_step": 142654, "epoch": 1718} {"train_loss": -23.094688415527344, "global_step": 142655, "epoch": 1718} {"train_loss": -23.163129806518555, "global_step": 142656, "epoch": 1718} {"train_loss": -23.2054443359375, "global_step": 142657, "epoch": 1718} {"train_loss": -22.989564895629883, "global_step": 142658, "epoch": 1718} {"train_loss": -22.934528350830078, "global_step": 142659, "epoch": 1718} {"train_loss": -22.919498443603516, "global_step": 142660, "epoch": 1718} {"train_loss": -22.89908790588379, "global_step": 142661, "epoch": 1718} {"train_loss": -23.19846534729004, "global_step": 142662, "epoch": 1718} {"train_loss": -23.16724967956543, "global_step": 142663, "epoch": 1718} {"train_loss": -23.305072784423828, "global_step": 142664, "epoch": 1718} {"train_loss": -23.173044204711914, "global_step": 142665, "epoch": 1718} {"train_loss": -22.945566177368164, "global_step": 142666, "epoch": 1718} {"train_loss": -22.857372283935547, "global_step": 142667, "epoch": 1718} {"train_loss": -23.379194259643555, "global_step": 142668, "epoch": 1718} {"train_loss": -23.30596351623535, "global_step": 142669, "epoch": 1718} {"train_loss": -22.824981689453125, "global_step": 142670, "epoch": 1718} {"train_loss": -22.807466506958008, "global_step": 142671, "epoch": 1718} {"train_loss": -23.471723556518555, "global_step": 142672, "epoch": 1718} {"train_loss": -22.973785400390625, "global_step": 142673, "epoch": 1718} {"train_loss": -23.250411987304688, "global_step": 142674, "epoch": 1718} {"train_loss": -23.294553756713867, "global_step": 142675, "epoch": 1718} {"train_loss": -23.03516840647502, "global_step": 142676, "epoch": 1718, "val_loss": 6376238.0} {"train_loss": -22.922321319580078, "global_step": 142677, "epoch": 1719} {"train_loss": -22.974740982055664, "global_step": 142678, "epoch": 1719} {"train_loss": -22.7299861907959, "global_step": 142679, "epoch": 1719} {"train_loss": -22.361238479614258, "global_step": 142680, "epoch": 1719} {"train_loss": -22.906766891479492, "global_step": 142681, "epoch": 1719} {"train_loss": -22.883216857910156, "global_step": 142682, "epoch": 1719} {"train_loss": -22.77484893798828, "global_step": 142683, "epoch": 1719} {"train_loss": -23.073476791381836, "global_step": 142684, "epoch": 1719} {"train_loss": -22.48345184326172, "global_step": 142685, "epoch": 1719} {"train_loss": -22.879467010498047, "global_step": 142686, "epoch": 1719} {"train_loss": -23.037965774536133, "global_step": 142687, "epoch": 1719} {"train_loss": -22.801992416381836, "global_step": 142688, "epoch": 1719} {"train_loss": -22.996591567993164, "global_step": 142689, "epoch": 1719} {"train_loss": -22.916425704956055, "global_step": 142690, "epoch": 1719} {"train_loss": -22.781211853027344, "global_step": 142691, "epoch": 1719} {"train_loss": -23.071826934814453, "global_step": 142692, "epoch": 1719} {"train_loss": -22.94673728942871, "global_step": 142693, "epoch": 1719} {"train_loss": -23.095895767211914, "global_step": 142694, "epoch": 1719} {"train_loss": -22.7735538482666, "global_step": 142695, "epoch": 1719} {"train_loss": -22.86189842224121, "global_step": 142696, "epoch": 1719} {"train_loss": -23.019563674926758, "global_step": 142697, "epoch": 1719} {"train_loss": -23.00723648071289, "global_step": 142698, "epoch": 1719} {"train_loss": -22.732711791992188, "global_step": 142699, "epoch": 1719} {"train_loss": -23.201541900634766, "global_step": 142700, "epoch": 1719} {"train_loss": -22.986949920654297, "global_step": 142701, "epoch": 1719} {"train_loss": -23.288488388061523, "global_step": 142702, "epoch": 1719} {"train_loss": -22.79120445251465, "global_step": 142703, "epoch": 1719} {"train_loss": -22.899105072021484, "global_step": 142704, "epoch": 1719} {"train_loss": -23.006549835205078, "global_step": 142705, "epoch": 1719} {"train_loss": -23.107717514038086, "global_step": 142706, "epoch": 1719} {"train_loss": -23.088499069213867, "global_step": 142707, "epoch": 1719} {"train_loss": -22.92254066467285, "global_step": 142708, "epoch": 1719} {"train_loss": -23.13417625427246, "global_step": 142709, "epoch": 1719} {"train_loss": -23.29156494140625, "global_step": 142710, "epoch": 1719} {"train_loss": -23.23410987854004, "global_step": 142711, "epoch": 1719} {"train_loss": -23.1351318359375, "global_step": 142712, "epoch": 1719} {"train_loss": -23.5126895904541, "global_step": 142713, "epoch": 1719} {"train_loss": -23.188636779785156, "global_step": 142714, "epoch": 1719} {"train_loss": -23.326637268066406, "global_step": 142715, "epoch": 1719} {"train_loss": -23.22291374206543, "global_step": 142716, "epoch": 1719} {"train_loss": -22.928739547729492, "global_step": 142717, "epoch": 1719} {"train_loss": -22.89813232421875, "global_step": 142718, "epoch": 1719} {"train_loss": -23.080646514892578, "global_step": 142719, "epoch": 1719} {"train_loss": -23.198095321655273, "global_step": 142720, "epoch": 1719} {"train_loss": -23.176084518432617, "global_step": 142721, "epoch": 1719} {"train_loss": -23.11164665222168, "global_step": 142722, "epoch": 1719} {"train_loss": -23.41844367980957, "global_step": 142723, "epoch": 1719} {"train_loss": -23.32611846923828, "global_step": 142724, "epoch": 1719} {"train_loss": -23.192306518554688, "global_step": 142725, "epoch": 1719} {"train_loss": -23.40110969543457, "global_step": 142726, "epoch": 1719} {"train_loss": -23.385343551635742, "global_step": 142727, "epoch": 1719} {"train_loss": -23.03937339782715, "global_step": 142728, "epoch": 1719} {"train_loss": -23.176057815551758, "global_step": 142729, "epoch": 1719} {"train_loss": -23.306028366088867, "global_step": 142730, "epoch": 1719} {"train_loss": -22.864721298217773, "global_step": 142731, "epoch": 1719} {"train_loss": -23.136892318725586, "global_step": 142732, "epoch": 1719} {"train_loss": -22.864521026611328, "global_step": 142733, "epoch": 1719} {"train_loss": -22.75065040588379, "global_step": 142734, "epoch": 1719} {"train_loss": -22.6563720703125, "global_step": 142735, "epoch": 1719} {"train_loss": -23.308591842651367, "global_step": 142736, "epoch": 1719} {"train_loss": -22.99640464782715, "global_step": 142737, "epoch": 1719} {"train_loss": -23.62006378173828, "global_step": 142738, "epoch": 1719} {"train_loss": -23.159561157226562, "global_step": 142739, "epoch": 1719} {"train_loss": -23.064476013183594, "global_step": 142740, "epoch": 1719} {"train_loss": -23.443532943725586, "global_step": 142741, "epoch": 1719} {"train_loss": -23.13947296142578, "global_step": 142742, "epoch": 1719} {"train_loss": -23.129846572875977, "global_step": 142743, "epoch": 1719} {"train_loss": -22.9674072265625, "global_step": 142744, "epoch": 1719} {"train_loss": -22.843246459960938, "global_step": 142745, "epoch": 1719} {"train_loss": -22.629865646362305, "global_step": 142746, "epoch": 1719} {"train_loss": -23.114425659179688, "global_step": 142747, "epoch": 1719} {"train_loss": -22.926977157592773, "global_step": 142748, "epoch": 1719} {"train_loss": -22.87224578857422, "global_step": 142749, "epoch": 1719} {"train_loss": -23.19729995727539, "global_step": 142750, "epoch": 1719} {"train_loss": -23.1865291595459, "global_step": 142751, "epoch": 1719} {"train_loss": -23.29534149169922, "global_step": 142752, "epoch": 1719} {"train_loss": -22.880765914916992, "global_step": 142753, "epoch": 1719} {"train_loss": -23.29501724243164, "global_step": 142754, "epoch": 1719} {"train_loss": -23.304004669189453, "global_step": 142755, "epoch": 1719} {"train_loss": -22.846946716308594, "global_step": 142756, "epoch": 1719} {"train_loss": -23.4127140045166, "global_step": 142757, "epoch": 1719} {"train_loss": -23.442535400390625, "global_step": 142758, "epoch": 1719} {"train_loss": -23.055082642888447, "global_step": 142759, "epoch": 1719, "val_loss": 6263717.0} {"train_loss": -22.794973373413086, "global_step": 142760, "epoch": 1720} {"train_loss": -22.885202407836914, "global_step": 142761, "epoch": 1720} {"train_loss": -22.573261260986328, "global_step": 142762, "epoch": 1720} {"train_loss": -22.727100372314453, "global_step": 142763, "epoch": 1720} {"train_loss": -22.85809326171875, "global_step": 142764, "epoch": 1720} {"train_loss": -23.204486846923828, "global_step": 142765, "epoch": 1720} {"train_loss": -23.031949996948242, "global_step": 142766, "epoch": 1720} {"train_loss": -22.760709762573242, "global_step": 142767, "epoch": 1720} {"train_loss": -23.222278594970703, "global_step": 142768, "epoch": 1720} {"train_loss": -23.10981559753418, "global_step": 142769, "epoch": 1720} {"train_loss": -23.199020385742188, "global_step": 142770, "epoch": 1720} {"train_loss": -22.957895278930664, "global_step": 142771, "epoch": 1720} {"train_loss": -23.288074493408203, "global_step": 142772, "epoch": 1720} {"train_loss": -22.903974533081055, "global_step": 142773, "epoch": 1720} {"train_loss": -22.85079002380371, "global_step": 142774, "epoch": 1720} {"train_loss": -22.9077091217041, "global_step": 142775, "epoch": 1720} {"train_loss": -23.10923194885254, "global_step": 142776, "epoch": 1720} {"train_loss": -23.140716552734375, "global_step": 142777, "epoch": 1720} {"train_loss": -23.35365104675293, "global_step": 142778, "epoch": 1720} {"train_loss": -22.737966537475586, "global_step": 142779, "epoch": 1720} {"train_loss": -23.187955856323242, "global_step": 142780, "epoch": 1720} {"train_loss": -23.31103515625, "global_step": 142781, "epoch": 1720} {"train_loss": -23.149816513061523, "global_step": 142782, "epoch": 1720} {"train_loss": -23.32146644592285, "global_step": 142783, "epoch": 1720} {"train_loss": -23.47165298461914, "global_step": 142784, "epoch": 1720} {"train_loss": -22.873695373535156, "global_step": 142785, "epoch": 1720} {"train_loss": -22.950735092163086, "global_step": 142786, "epoch": 1720} {"train_loss": -22.742416381835938, "global_step": 142787, "epoch": 1720} {"train_loss": -23.336591720581055, "global_step": 142788, "epoch": 1720} {"train_loss": -23.286298751831055, "global_step": 142789, "epoch": 1720} {"train_loss": -23.231321334838867, "global_step": 142790, "epoch": 1720} {"train_loss": -22.876989364624023, "global_step": 142791, "epoch": 1720} {"train_loss": -23.39203453063965, "global_step": 142792, "epoch": 1720} {"train_loss": -23.61384391784668, "global_step": 142793, "epoch": 1720} {"train_loss": -23.124740600585938, "global_step": 142794, "epoch": 1720} {"train_loss": -23.275800704956055, "global_step": 142795, "epoch": 1720} {"train_loss": -22.92097282409668, "global_step": 142796, "epoch": 1720} {"train_loss": -23.31107521057129, "global_step": 142797, "epoch": 1720} {"train_loss": -23.322309494018555, "global_step": 142798, "epoch": 1720} {"train_loss": -23.415401458740234, "global_step": 142799, "epoch": 1720} {"train_loss": -23.294300079345703, "global_step": 142800, "epoch": 1720} {"train_loss": -23.24961280822754, "global_step": 142801, "epoch": 1720} {"train_loss": -23.041818618774414, "global_step": 142802, "epoch": 1720} {"train_loss": -22.82274627685547, "global_step": 142803, "epoch": 1720} {"train_loss": -22.987417221069336, "global_step": 142804, "epoch": 1720} {"train_loss": -23.499217987060547, "global_step": 142805, "epoch": 1720} {"train_loss": -22.983795166015625, "global_step": 142806, "epoch": 1720} {"train_loss": -22.950021743774414, "global_step": 142807, "epoch": 1720} {"train_loss": -22.94869041442871, "global_step": 142808, "epoch": 1720} {"train_loss": -23.240663528442383, "global_step": 142809, "epoch": 1720} {"train_loss": -23.200876235961914, "global_step": 142810, "epoch": 1720} {"train_loss": -22.805007934570312, "global_step": 142811, "epoch": 1720} {"train_loss": -23.088993072509766, "global_step": 142812, "epoch": 1720} {"train_loss": -23.03443717956543, "global_step": 142813, "epoch": 1720} {"train_loss": -23.336759567260742, "global_step": 142814, "epoch": 1720} {"train_loss": -22.894590377807617, "global_step": 142815, "epoch": 1720} {"train_loss": -22.88309669494629, "global_step": 142816, "epoch": 1720} {"train_loss": -22.81752586364746, "global_step": 142817, "epoch": 1720} {"train_loss": -22.897451400756836, "global_step": 142818, "epoch": 1720} {"train_loss": -22.917219161987305, "global_step": 142819, "epoch": 1720} {"train_loss": -23.198932647705078, "global_step": 142820, "epoch": 1720} {"train_loss": -23.249393463134766, "global_step": 142821, "epoch": 1720} {"train_loss": -23.14438247680664, "global_step": 142822, "epoch": 1720} {"train_loss": -23.289796829223633, "global_step": 142823, "epoch": 1720} {"train_loss": -23.316303253173828, "global_step": 142824, "epoch": 1720} {"train_loss": -22.949047088623047, "global_step": 142825, "epoch": 1720} {"train_loss": -22.961645126342773, "global_step": 142826, "epoch": 1720} {"train_loss": -23.4532470703125, "global_step": 142827, "epoch": 1720} {"train_loss": -23.212127685546875, "global_step": 142828, "epoch": 1720} {"train_loss": -22.8273983001709, "global_step": 142829, "epoch": 1720} {"train_loss": -23.131887435913086, "global_step": 142830, "epoch": 1720} {"train_loss": -23.293048858642578, "global_step": 142831, "epoch": 1720} {"train_loss": -23.521467208862305, "global_step": 142832, "epoch": 1720} {"train_loss": -23.04294776916504, "global_step": 142833, "epoch": 1720} {"train_loss": -23.081085205078125, "global_step": 142834, "epoch": 1720} {"train_loss": -22.849653244018555, "global_step": 142835, "epoch": 1720} {"train_loss": -23.314191818237305, "global_step": 142836, "epoch": 1720} {"train_loss": -23.273252487182617, "global_step": 142837, "epoch": 1720} {"train_loss": -23.064355850219727, "global_step": 142838, "epoch": 1720} {"train_loss": -22.657825469970703, "global_step": 142839, "epoch": 1720} {"train_loss": -23.152637481689453, "global_step": 142840, "epoch": 1720} {"train_loss": -23.424856185913086, "global_step": 142841, "epoch": 1720} {"train_loss": -23.106797229812805, "global_step": 142842, "epoch": 1720, "val_loss": 6194982.0} {"train_loss": -22.267932891845703, "global_step": 142843, "epoch": 1721} {"train_loss": -22.155668258666992, "global_step": 142844, "epoch": 1721} {"train_loss": -22.895694732666016, "global_step": 142845, "epoch": 1721} {"train_loss": -22.5567684173584, "global_step": 142846, "epoch": 1721} {"train_loss": -22.290355682373047, "global_step": 142847, "epoch": 1721} {"train_loss": -22.76346206665039, "global_step": 142848, "epoch": 1721} {"train_loss": -23.07733154296875, "global_step": 142849, "epoch": 1721} {"train_loss": -22.508169174194336, "global_step": 142850, "epoch": 1721} {"train_loss": -22.965911865234375, "global_step": 142851, "epoch": 1721} {"train_loss": -22.789804458618164, "global_step": 142852, "epoch": 1721} {"train_loss": -23.059171676635742, "global_step": 142853, "epoch": 1721} {"train_loss": -22.49310874938965, "global_step": 142854, "epoch": 1721} {"train_loss": -22.9654541015625, "global_step": 142855, "epoch": 1721} {"train_loss": -22.914098739624023, "global_step": 142856, "epoch": 1721} {"train_loss": -22.552860260009766, "global_step": 142857, "epoch": 1721} {"train_loss": -22.717544555664062, "global_step": 142858, "epoch": 1721} {"train_loss": -23.066869735717773, "global_step": 142859, "epoch": 1721} {"train_loss": -23.333532333374023, "global_step": 142860, "epoch": 1721} {"train_loss": -23.243921279907227, "global_step": 142861, "epoch": 1721} {"train_loss": -23.02920913696289, "global_step": 142862, "epoch": 1721} {"train_loss": -23.00575828552246, "global_step": 142863, "epoch": 1721} {"train_loss": -23.08932876586914, "global_step": 142864, "epoch": 1721} {"train_loss": -22.94123649597168, "global_step": 142865, "epoch": 1721} {"train_loss": -22.895666122436523, "global_step": 142866, "epoch": 1721} {"train_loss": -23.04256248474121, "global_step": 142867, "epoch": 1721} {"train_loss": -22.939807891845703, "global_step": 142868, "epoch": 1721} {"train_loss": -23.03684425354004, "global_step": 142869, "epoch": 1721} {"train_loss": -23.05354118347168, "global_step": 142870, "epoch": 1721} {"train_loss": -23.182498931884766, "global_step": 142871, "epoch": 1721} {"train_loss": -23.171558380126953, "global_step": 142872, "epoch": 1721} {"train_loss": -22.8558349609375, "global_step": 142873, "epoch": 1721} {"train_loss": -22.804676055908203, "global_step": 142874, "epoch": 1721} {"train_loss": -23.13026237487793, "global_step": 142875, "epoch": 1721} {"train_loss": -23.0341739654541, "global_step": 142876, "epoch": 1721} {"train_loss": -23.204730987548828, "global_step": 142877, "epoch": 1721} {"train_loss": -23.08355140686035, "global_step": 142878, "epoch": 1721} {"train_loss": -23.033145904541016, "global_step": 142879, "epoch": 1721} {"train_loss": -23.413434982299805, "global_step": 142880, "epoch": 1721} {"train_loss": -23.04498291015625, "global_step": 142881, "epoch": 1721} {"train_loss": -22.43583106994629, "global_step": 142882, "epoch": 1721} {"train_loss": -23.291933059692383, "global_step": 142883, "epoch": 1721} {"train_loss": -22.891324996948242, "global_step": 142884, "epoch": 1721} {"train_loss": -23.17220115661621, "global_step": 142885, "epoch": 1721} {"train_loss": -23.183923721313477, "global_step": 142886, "epoch": 1721} {"train_loss": -23.1884822845459, "global_step": 142887, "epoch": 1721} {"train_loss": -23.217885971069336, "global_step": 142888, "epoch": 1721} {"train_loss": -23.285308837890625, "global_step": 142889, "epoch": 1721} {"train_loss": -22.945844650268555, "global_step": 142890, "epoch": 1721} {"train_loss": -23.35648536682129, "global_step": 142891, "epoch": 1721} {"train_loss": -23.21332359313965, "global_step": 142892, "epoch": 1721} {"train_loss": -23.151840209960938, "global_step": 142893, "epoch": 1721} {"train_loss": -23.008502960205078, "global_step": 142894, "epoch": 1721} {"train_loss": -23.22028160095215, "global_step": 142895, "epoch": 1721} {"train_loss": -22.75361442565918, "global_step": 142896, "epoch": 1721} {"train_loss": -22.669729232788086, "global_step": 142897, "epoch": 1721} {"train_loss": -23.199867248535156, "global_step": 142898, "epoch": 1721} {"train_loss": -22.703332901000977, "global_step": 142899, "epoch": 1721} {"train_loss": -22.835996627807617, "global_step": 142900, "epoch": 1721} {"train_loss": -23.066755294799805, "global_step": 142901, "epoch": 1721} {"train_loss": -22.909019470214844, "global_step": 142902, "epoch": 1721} {"train_loss": -23.07549476623535, "global_step": 142903, "epoch": 1721} {"train_loss": -23.11726188659668, "global_step": 142904, "epoch": 1721} {"train_loss": -23.106679916381836, "global_step": 142905, "epoch": 1721} {"train_loss": -23.275157928466797, "global_step": 142906, "epoch": 1721} {"train_loss": -22.72945213317871, "global_step": 142907, "epoch": 1721} {"train_loss": -23.100088119506836, "global_step": 142908, "epoch": 1721} {"train_loss": -23.150053024291992, "global_step": 142909, "epoch": 1721} {"train_loss": -23.10155487060547, "global_step": 142910, "epoch": 1721} {"train_loss": -23.075876235961914, "global_step": 142911, "epoch": 1721} {"train_loss": -23.010059356689453, "global_step": 142912, "epoch": 1721} {"train_loss": -23.193483352661133, "global_step": 142913, "epoch": 1721} {"train_loss": -22.975088119506836, "global_step": 142914, "epoch": 1721} {"train_loss": -23.286758422851562, "global_step": 142915, "epoch": 1721} {"train_loss": -23.022994995117188, "global_step": 142916, "epoch": 1721} {"train_loss": -23.289060592651367, "global_step": 142917, "epoch": 1721} {"train_loss": -23.02745819091797, "global_step": 142918, "epoch": 1721} {"train_loss": -23.273984909057617, "global_step": 142919, "epoch": 1721} {"train_loss": -23.188709259033203, "global_step": 142920, "epoch": 1721} {"train_loss": -23.063852310180664, "global_step": 142921, "epoch": 1721} {"train_loss": -23.075342178344727, "global_step": 142922, "epoch": 1721} {"train_loss": -23.304616928100586, "global_step": 142923, "epoch": 1721} {"train_loss": -22.77591323852539, "global_step": 142924, "epoch": 1721} {"train_loss": -22.981884117586066, "global_step": 142925, "epoch": 1721, "val_loss": 6275811.0} {"train_loss": -22.48476791381836, "global_step": 142926, "epoch": 1722} {"train_loss": -22.716510772705078, "global_step": 142927, "epoch": 1722} {"train_loss": -23.00691795349121, "global_step": 142928, "epoch": 1722} {"train_loss": -22.73651123046875, "global_step": 142929, "epoch": 1722} {"train_loss": -22.93044662475586, "global_step": 142930, "epoch": 1722} {"train_loss": -22.99922752380371, "global_step": 142931, "epoch": 1722} {"train_loss": -22.813560485839844, "global_step": 142932, "epoch": 1722} {"train_loss": -22.646276473999023, "global_step": 142933, "epoch": 1722} {"train_loss": -22.69980239868164, "global_step": 142934, "epoch": 1722} {"train_loss": -22.755821228027344, "global_step": 142935, "epoch": 1722} {"train_loss": -22.95343589782715, "global_step": 142936, "epoch": 1722} {"train_loss": -22.91214370727539, "global_step": 142937, "epoch": 1722} {"train_loss": -22.822729110717773, "global_step": 142938, "epoch": 1722} {"train_loss": -22.42493438720703, "global_step": 142939, "epoch": 1722} {"train_loss": -23.074892044067383, "global_step": 142940, "epoch": 1722} {"train_loss": -22.59425926208496, "global_step": 142941, "epoch": 1722} {"train_loss": -22.67586326599121, "global_step": 142942, "epoch": 1722} {"train_loss": -22.877843856811523, "global_step": 142943, "epoch": 1722} {"train_loss": -23.197933197021484, "global_step": 142944, "epoch": 1722} {"train_loss": -23.034460067749023, "global_step": 142945, "epoch": 1722} {"train_loss": -22.987979888916016, "global_step": 142946, "epoch": 1722} {"train_loss": -23.071741104125977, "global_step": 142947, "epoch": 1722} {"train_loss": -22.807483673095703, "global_step": 142948, "epoch": 1722} {"train_loss": -23.053218841552734, "global_step": 142949, "epoch": 1722} {"train_loss": -23.23714256286621, "global_step": 142950, "epoch": 1722} {"train_loss": -22.84566307067871, "global_step": 142951, "epoch": 1722} {"train_loss": -23.063751220703125, "global_step": 142952, "epoch": 1722} {"train_loss": -22.84125328063965, "global_step": 142953, "epoch": 1722} {"train_loss": -23.298114776611328, "global_step": 142954, "epoch": 1722} {"train_loss": -22.950225830078125, "global_step": 142955, "epoch": 1722} {"train_loss": -23.03385353088379, "global_step": 142956, "epoch": 1722} {"train_loss": -23.051664352416992, "global_step": 142957, "epoch": 1722} {"train_loss": -22.804677963256836, "global_step": 142958, "epoch": 1722} {"train_loss": -22.972715377807617, "global_step": 142959, "epoch": 1722} {"train_loss": -23.114675521850586, "global_step": 142960, "epoch": 1722} {"train_loss": -22.794443130493164, "global_step": 142961, "epoch": 1722} {"train_loss": -23.05938720703125, "global_step": 142962, "epoch": 1722} {"train_loss": -23.17279624938965, "global_step": 142963, "epoch": 1722} {"train_loss": -23.7281436920166, "global_step": 142964, "epoch": 1722} {"train_loss": -23.403553009033203, "global_step": 142965, "epoch": 1722} {"train_loss": -23.31321144104004, "global_step": 142966, "epoch": 1722} {"train_loss": -23.250198364257812, "global_step": 142967, "epoch": 1722} {"train_loss": -23.146533966064453, "global_step": 142968, "epoch": 1722} {"train_loss": -23.392805099487305, "global_step": 142969, "epoch": 1722} {"train_loss": -23.247207641601562, "global_step": 142970, "epoch": 1722} {"train_loss": -22.825864791870117, "global_step": 142971, "epoch": 1722} {"train_loss": -23.0615177154541, "global_step": 142972, "epoch": 1722} {"train_loss": -23.167707443237305, "global_step": 142973, "epoch": 1722} {"train_loss": -23.156042098999023, "global_step": 142974, "epoch": 1722} {"train_loss": -23.211423873901367, "global_step": 142975, "epoch": 1722} {"train_loss": -23.475751876831055, "global_step": 142976, "epoch": 1722} {"train_loss": -23.23621940612793, "global_step": 142977, "epoch": 1722} {"train_loss": -23.176313400268555, "global_step": 142978, "epoch": 1722} {"train_loss": -23.066030502319336, "global_step": 142979, "epoch": 1722} {"train_loss": -22.722829818725586, "global_step": 142980, "epoch": 1722} {"train_loss": -23.21903419494629, "global_step": 142981, "epoch": 1722} {"train_loss": -23.288864135742188, "global_step": 142982, "epoch": 1722} {"train_loss": -23.1016902923584, "global_step": 142983, "epoch": 1722} {"train_loss": -23.011695861816406, "global_step": 142984, "epoch": 1722} {"train_loss": -23.315895080566406, "global_step": 142985, "epoch": 1722} {"train_loss": -23.018022537231445, "global_step": 142986, "epoch": 1722} {"train_loss": -22.76141929626465, "global_step": 142987, "epoch": 1722} {"train_loss": -23.328569412231445, "global_step": 142988, "epoch": 1722} {"train_loss": -22.81467056274414, "global_step": 142989, "epoch": 1722} {"train_loss": -23.014997482299805, "global_step": 142990, "epoch": 1722} {"train_loss": -23.3052978515625, "global_step": 142991, "epoch": 1722} {"train_loss": -23.244827270507812, "global_step": 142992, "epoch": 1722} {"train_loss": -22.953107833862305, "global_step": 142993, "epoch": 1722} {"train_loss": -22.793201446533203, "global_step": 142994, "epoch": 1722} {"train_loss": -23.379789352416992, "global_step": 142995, "epoch": 1722} {"train_loss": -23.099607467651367, "global_step": 142996, "epoch": 1722} {"train_loss": -22.821252822875977, "global_step": 142997, "epoch": 1722} {"train_loss": -23.357236862182617, "global_step": 142998, "epoch": 1722} {"train_loss": -22.943885803222656, "global_step": 142999, "epoch": 1722} {"train_loss": -23.26059341430664, "global_step": 143000, "epoch": 1722} {"train_loss": -23.16365623474121, "global_step": 143001, "epoch": 1722} {"train_loss": -22.90077018737793, "global_step": 143002, "epoch": 1722} {"train_loss": -23.3273983001709, "global_step": 143003, "epoch": 1722} {"train_loss": -23.60043716430664, "global_step": 143004, "epoch": 1722} {"train_loss": -23.160932540893555, "global_step": 143005, "epoch": 1722} {"train_loss": -23.313154220581055, "global_step": 143006, "epoch": 1722} {"train_loss": -23.04865074157715, "global_step": 143007, "epoch": 1722} {"train_loss": -23.041749517601655, "global_step": 143008, "epoch": 1722, "val_loss": 6327438.5} {"train_loss": -22.360492706298828, "global_step": 143009, "epoch": 1723} {"train_loss": -22.222198486328125, "global_step": 143010, "epoch": 1723} {"train_loss": -21.71949005126953, "global_step": 143011, "epoch": 1723} {"train_loss": -22.84769058227539, "global_step": 143012, "epoch": 1723} {"train_loss": -22.447586059570312, "global_step": 143013, "epoch": 1723} {"train_loss": -22.710357666015625, "global_step": 143014, "epoch": 1723} {"train_loss": -22.507583618164062, "global_step": 143015, "epoch": 1723} {"train_loss": -22.805683135986328, "global_step": 143016, "epoch": 1723} {"train_loss": -22.592506408691406, "global_step": 143017, "epoch": 1723} {"train_loss": -22.763944625854492, "global_step": 143018, "epoch": 1723} {"train_loss": -22.9116268157959, "global_step": 143019, "epoch": 1723} {"train_loss": -22.292341232299805, "global_step": 143020, "epoch": 1723} {"train_loss": -22.669208526611328, "global_step": 143021, "epoch": 1723} {"train_loss": -22.441740036010742, "global_step": 143022, "epoch": 1723} {"train_loss": -22.581085205078125, "global_step": 143023, "epoch": 1723} {"train_loss": -22.841520309448242, "global_step": 143024, "epoch": 1723} {"train_loss": -22.518054962158203, "global_step": 143025, "epoch": 1723} {"train_loss": -23.152606964111328, "global_step": 143026, "epoch": 1723} {"train_loss": -22.946109771728516, "global_step": 143027, "epoch": 1723} {"train_loss": -23.03859519958496, "global_step": 143028, "epoch": 1723} {"train_loss": -23.0155086517334, "global_step": 143029, "epoch": 1723} {"train_loss": -22.94460105895996, "global_step": 143030, "epoch": 1723} {"train_loss": -22.735034942626953, "global_step": 143031, "epoch": 1723} {"train_loss": -22.709745407104492, "global_step": 143032, "epoch": 1723} {"train_loss": -22.972021102905273, "global_step": 143033, "epoch": 1723} {"train_loss": -23.21860122680664, "global_step": 143034, "epoch": 1723} {"train_loss": -22.647024154663086, "global_step": 143035, "epoch": 1723} {"train_loss": -23.096939086914062, "global_step": 143036, "epoch": 1723} {"train_loss": -23.463327407836914, "global_step": 143037, "epoch": 1723} {"train_loss": -23.031986236572266, "global_step": 143038, "epoch": 1723} {"train_loss": -23.053293228149414, "global_step": 143039, "epoch": 1723} {"train_loss": -23.12102508544922, "global_step": 143040, "epoch": 1723} {"train_loss": -23.217363357543945, "global_step": 143041, "epoch": 1723} {"train_loss": -22.981672286987305, "global_step": 143042, "epoch": 1723} {"train_loss": -23.058258056640625, "global_step": 143043, "epoch": 1723} {"train_loss": -23.272977828979492, "global_step": 143044, "epoch": 1723} {"train_loss": -23.16427993774414, "global_step": 143045, "epoch": 1723} {"train_loss": -23.267305374145508, "global_step": 143046, "epoch": 1723} {"train_loss": -23.23952865600586, "global_step": 143047, "epoch": 1723} {"train_loss": -22.94039535522461, "global_step": 143048, "epoch": 1723} {"train_loss": -23.326614379882812, "global_step": 143049, "epoch": 1723} {"train_loss": -23.0990047454834, "global_step": 143050, "epoch": 1723} {"train_loss": -23.09979820251465, "global_step": 143051, "epoch": 1723} {"train_loss": -23.35337257385254, "global_step": 143052, "epoch": 1723} {"train_loss": -22.969175338745117, "global_step": 143053, "epoch": 1723} {"train_loss": -23.051687240600586, "global_step": 143054, "epoch": 1723} {"train_loss": -23.2502498626709, "global_step": 143055, "epoch": 1723} {"train_loss": -23.182947158813477, "global_step": 143056, "epoch": 1723} {"train_loss": -23.306774139404297, "global_step": 143057, "epoch": 1723} {"train_loss": -22.9962158203125, "global_step": 143058, "epoch": 1723} {"train_loss": -23.08991813659668, "global_step": 143059, "epoch": 1723} {"train_loss": -23.191082000732422, "global_step": 143060, "epoch": 1723} {"train_loss": -23.700111389160156, "global_step": 143061, "epoch": 1723} {"train_loss": -23.220996856689453, "global_step": 143062, "epoch": 1723} {"train_loss": -23.285398483276367, "global_step": 143063, "epoch": 1723} {"train_loss": -22.89116668701172, "global_step": 143064, "epoch": 1723} {"train_loss": -23.592117309570312, "global_step": 143065, "epoch": 1723} {"train_loss": -22.526315689086914, "global_step": 143066, "epoch": 1723} {"train_loss": -22.695058822631836, "global_step": 143067, "epoch": 1723} {"train_loss": -23.378324508666992, "global_step": 143068, "epoch": 1723} {"train_loss": -23.40278434753418, "global_step": 143069, "epoch": 1723} {"train_loss": -23.407367706298828, "global_step": 143070, "epoch": 1723} {"train_loss": -23.100509643554688, "global_step": 143071, "epoch": 1723} {"train_loss": -23.193098068237305, "global_step": 143072, "epoch": 1723} {"train_loss": -23.277729034423828, "global_step": 143073, "epoch": 1723} {"train_loss": -23.215906143188477, "global_step": 143074, "epoch": 1723} {"train_loss": -23.34760284423828, "global_step": 143075, "epoch": 1723} {"train_loss": -22.86793327331543, "global_step": 143076, "epoch": 1723} {"train_loss": -23.3491268157959, "global_step": 143077, "epoch": 1723} {"train_loss": -23.346145629882812, "global_step": 143078, "epoch": 1723} {"train_loss": -23.503318786621094, "global_step": 143079, "epoch": 1723} {"train_loss": -23.48357582092285, "global_step": 143080, "epoch": 1723} {"train_loss": -22.91195297241211, "global_step": 143081, "epoch": 1723} {"train_loss": -23.084182739257812, "global_step": 143082, "epoch": 1723} {"train_loss": -22.922407150268555, "global_step": 143083, "epoch": 1723} {"train_loss": -23.280241012573242, "global_step": 143084, "epoch": 1723} {"train_loss": -23.316442489624023, "global_step": 143085, "epoch": 1723} {"train_loss": -23.114566802978516, "global_step": 143086, "epoch": 1723} {"train_loss": -23.47462272644043, "global_step": 143087, "epoch": 1723} {"train_loss": -23.06256103515625, "global_step": 143088, "epoch": 1723} {"train_loss": -22.984737396240234, "global_step": 143089, "epoch": 1723} {"train_loss": -23.146503448486328, "global_step": 143090, "epoch": 1723} {"train_loss": -23.01243844089738, "global_step": 143091, "epoch": 1723, "val_loss": 6325183.0} {"train_loss": -23.21526527404785, "global_step": 143092, "epoch": 1724} {"train_loss": -23.144935607910156, "global_step": 143093, "epoch": 1724} {"train_loss": -22.972700119018555, "global_step": 143094, "epoch": 1724} {"train_loss": -23.077207565307617, "global_step": 143095, "epoch": 1724} {"train_loss": -23.29758071899414, "global_step": 143096, "epoch": 1724} {"train_loss": -22.789756774902344, "global_step": 143097, "epoch": 1724} {"train_loss": -22.80112075805664, "global_step": 143098, "epoch": 1724} {"train_loss": -22.63689613342285, "global_step": 143099, "epoch": 1724} {"train_loss": -23.269113540649414, "global_step": 143100, "epoch": 1724} {"train_loss": -22.9451904296875, "global_step": 143101, "epoch": 1724} {"train_loss": -22.985143661499023, "global_step": 143102, "epoch": 1724} {"train_loss": -22.79587173461914, "global_step": 143103, "epoch": 1724} {"train_loss": -22.673330307006836, "global_step": 143104, "epoch": 1724} {"train_loss": -23.213836669921875, "global_step": 143105, "epoch": 1724} {"train_loss": -23.27962303161621, "global_step": 143106, "epoch": 1724} {"train_loss": -22.867618560791016, "global_step": 143107, "epoch": 1724} {"train_loss": -22.883237838745117, "global_step": 143108, "epoch": 1724} {"train_loss": -22.5988826751709, "global_step": 143109, "epoch": 1724} {"train_loss": -23.305639266967773, "global_step": 143110, "epoch": 1724} {"train_loss": -23.125715255737305, "global_step": 143111, "epoch": 1724} {"train_loss": -23.271032333374023, "global_step": 143112, "epoch": 1724} {"train_loss": -22.99045753479004, "global_step": 143113, "epoch": 1724} {"train_loss": -23.07320213317871, "global_step": 143114, "epoch": 1724} {"train_loss": -22.758291244506836, "global_step": 143115, "epoch": 1724} {"train_loss": -23.323787689208984, "global_step": 143116, "epoch": 1724} {"train_loss": -23.083690643310547, "global_step": 143117, "epoch": 1724} {"train_loss": -23.03256607055664, "global_step": 143118, "epoch": 1724} {"train_loss": -23.153860092163086, "global_step": 143119, "epoch": 1724} {"train_loss": -22.86712646484375, "global_step": 143120, "epoch": 1724} {"train_loss": -22.649982452392578, "global_step": 143121, "epoch": 1724} {"train_loss": -23.246732711791992, "global_step": 143122, "epoch": 1724} {"train_loss": -22.901655197143555, "global_step": 143123, "epoch": 1724} {"train_loss": -23.039640426635742, "global_step": 143124, "epoch": 1724} {"train_loss": -23.108394622802734, "global_step": 143125, "epoch": 1724} {"train_loss": -23.481300354003906, "global_step": 143126, "epoch": 1724} {"train_loss": -23.088193893432617, "global_step": 143127, "epoch": 1724} {"train_loss": -23.407197952270508, "global_step": 143128, "epoch": 1724} {"train_loss": -23.187904357910156, "global_step": 143129, "epoch": 1724} {"train_loss": -23.157669067382812, "global_step": 143130, "epoch": 1724} {"train_loss": -23.119359970092773, "global_step": 143131, "epoch": 1724} {"train_loss": -23.122495651245117, "global_step": 143132, "epoch": 1724} {"train_loss": -23.295780181884766, "global_step": 143133, "epoch": 1724} {"train_loss": -23.362417221069336, "global_step": 143134, "epoch": 1724} {"train_loss": -22.77757453918457, "global_step": 143135, "epoch": 1724} {"train_loss": -23.200790405273438, "global_step": 143136, "epoch": 1724} {"train_loss": -23.113441467285156, "global_step": 143137, "epoch": 1724} {"train_loss": -23.114721298217773, "global_step": 143138, "epoch": 1724} {"train_loss": -23.296401977539062, "global_step": 143139, "epoch": 1724} {"train_loss": -23.3621826171875, "global_step": 143140, "epoch": 1724} {"train_loss": -22.702945709228516, "global_step": 143141, "epoch": 1724} {"train_loss": -22.93671417236328, "global_step": 143142, "epoch": 1724} {"train_loss": -23.115188598632812, "global_step": 143143, "epoch": 1724} {"train_loss": -23.177827835083008, "global_step": 143144, "epoch": 1724} {"train_loss": -23.185880661010742, "global_step": 143145, "epoch": 1724} {"train_loss": -23.44318199157715, "global_step": 143146, "epoch": 1724} {"train_loss": -22.816532135009766, "global_step": 143147, "epoch": 1724} {"train_loss": -23.04608154296875, "global_step": 143148, "epoch": 1724} {"train_loss": -23.11935806274414, "global_step": 143149, "epoch": 1724} {"train_loss": -23.191930770874023, "global_step": 143150, "epoch": 1724} {"train_loss": -22.85271644592285, "global_step": 143151, "epoch": 1724} {"train_loss": -23.061603546142578, "global_step": 143152, "epoch": 1724} {"train_loss": -23.040119171142578, "global_step": 143153, "epoch": 1724} {"train_loss": -23.246017456054688, "global_step": 143154, "epoch": 1724} {"train_loss": -23.056318283081055, "global_step": 143155, "epoch": 1724} {"train_loss": -22.69886016845703, "global_step": 143156, "epoch": 1724} {"train_loss": -22.347694396972656, "global_step": 143157, "epoch": 1724} {"train_loss": -22.954078674316406, "global_step": 143158, "epoch": 1724} {"train_loss": -22.91064453125, "global_step": 143159, "epoch": 1724} {"train_loss": -22.806686401367188, "global_step": 143160, "epoch": 1724} {"train_loss": -22.91169548034668, "global_step": 143161, "epoch": 1724} {"train_loss": -23.04986572265625, "global_step": 143162, "epoch": 1724} {"train_loss": -22.91737937927246, "global_step": 143163, "epoch": 1724} {"train_loss": -23.047956466674805, "global_step": 143164, "epoch": 1724} {"train_loss": -22.83736228942871, "global_step": 143165, "epoch": 1724} {"train_loss": -23.03675651550293, "global_step": 143166, "epoch": 1724} {"train_loss": -23.052391052246094, "global_step": 143167, "epoch": 1724} {"train_loss": -23.3980770111084, "global_step": 143168, "epoch": 1724} {"train_loss": -23.125883102416992, "global_step": 143169, "epoch": 1724} {"train_loss": -22.918798446655273, "global_step": 143170, "epoch": 1724} {"train_loss": -23.142107009887695, "global_step": 143171, "epoch": 1724} {"train_loss": -22.80634307861328, "global_step": 143172, "epoch": 1724} {"train_loss": -22.98501968383789, "global_step": 143173, "epoch": 1724} {"train_loss": -23.048587063708936, "global_step": 143174, "epoch": 1724, "val_loss": 6290348.0} {"train_loss": -22.55877113342285, "global_step": 143175, "epoch": 1725} {"train_loss": -22.722875595092773, "global_step": 143176, "epoch": 1725} {"train_loss": -22.09820556640625, "global_step": 143177, "epoch": 1725} {"train_loss": -22.218381881713867, "global_step": 143178, "epoch": 1725} {"train_loss": -22.39707374572754, "global_step": 143179, "epoch": 1725} {"train_loss": -22.113758087158203, "global_step": 143180, "epoch": 1725} {"train_loss": -22.814428329467773, "global_step": 143181, "epoch": 1725} {"train_loss": -22.30685806274414, "global_step": 143182, "epoch": 1725} {"train_loss": -22.375547409057617, "global_step": 143183, "epoch": 1725} {"train_loss": -22.88787841796875, "global_step": 143184, "epoch": 1725} {"train_loss": -23.00409507751465, "global_step": 143185, "epoch": 1725} {"train_loss": -22.843244552612305, "global_step": 143186, "epoch": 1725} {"train_loss": -22.85934829711914, "global_step": 143187, "epoch": 1725} {"train_loss": -22.636920928955078, "global_step": 143188, "epoch": 1725} {"train_loss": -22.6948184967041, "global_step": 143189, "epoch": 1725} {"train_loss": -22.63894271850586, "global_step": 143190, "epoch": 1725} {"train_loss": -22.939725875854492, "global_step": 143191, "epoch": 1725} {"train_loss": -22.58367347717285, "global_step": 143192, "epoch": 1725} {"train_loss": -22.75900650024414, "global_step": 143193, "epoch": 1725} {"train_loss": -22.704788208007812, "global_step": 143194, "epoch": 1725} {"train_loss": -23.08333396911621, "global_step": 143195, "epoch": 1725} {"train_loss": -22.974308013916016, "global_step": 143196, "epoch": 1725} {"train_loss": -23.288238525390625, "global_step": 143197, "epoch": 1725} {"train_loss": -22.702009201049805, "global_step": 143198, "epoch": 1725} {"train_loss": -22.844009399414062, "global_step": 143199, "epoch": 1725} {"train_loss": -23.31411361694336, "global_step": 143200, "epoch": 1725} {"train_loss": -23.24246597290039, "global_step": 143201, "epoch": 1725} {"train_loss": -22.6718807220459, "global_step": 143202, "epoch": 1725} {"train_loss": -22.989519119262695, "global_step": 143203, "epoch": 1725} {"train_loss": -23.075693130493164, "global_step": 143204, "epoch": 1725} {"train_loss": -22.904499053955078, "global_step": 143205, "epoch": 1725} {"train_loss": -23.22452735900879, "global_step": 143206, "epoch": 1725} {"train_loss": -23.032047271728516, "global_step": 143207, "epoch": 1725} {"train_loss": -23.001867294311523, "global_step": 143208, "epoch": 1725} {"train_loss": -22.797119140625, "global_step": 143209, "epoch": 1725} {"train_loss": -22.9586181640625, "global_step": 143210, "epoch": 1725} {"train_loss": -23.100967407226562, "global_step": 143211, "epoch": 1725} {"train_loss": -23.187353134155273, "global_step": 143212, "epoch": 1725} {"train_loss": -23.2966365814209, "global_step": 143213, "epoch": 1725} {"train_loss": -23.304977416992188, "global_step": 143214, "epoch": 1725} {"train_loss": -22.86884307861328, "global_step": 143215, "epoch": 1725} {"train_loss": -23.254323959350586, "global_step": 143216, "epoch": 1725} {"train_loss": -23.3277587890625, "global_step": 143217, "epoch": 1725} {"train_loss": -22.931676864624023, "global_step": 143218, "epoch": 1725} {"train_loss": -23.10443687438965, "global_step": 143219, "epoch": 1725} {"train_loss": -23.080215454101562, "global_step": 143220, "epoch": 1725} {"train_loss": -22.35480308532715, "global_step": 143221, "epoch": 1725} {"train_loss": -22.814451217651367, "global_step": 143222, "epoch": 1725} {"train_loss": -23.16168975830078, "global_step": 143223, "epoch": 1725} {"train_loss": -23.174877166748047, "global_step": 143224, "epoch": 1725} {"train_loss": -22.779233932495117, "global_step": 143225, "epoch": 1725} {"train_loss": -22.971256256103516, "global_step": 143226, "epoch": 1725} {"train_loss": -22.976377487182617, "global_step": 143227, "epoch": 1725} {"train_loss": -22.71990966796875, "global_step": 143228, "epoch": 1725} {"train_loss": -23.156972885131836, "global_step": 143229, "epoch": 1725} {"train_loss": -23.078998565673828, "global_step": 143230, "epoch": 1725} {"train_loss": -22.80419921875, "global_step": 143231, "epoch": 1725} {"train_loss": -23.390945434570312, "global_step": 143232, "epoch": 1725} {"train_loss": -23.220003128051758, "global_step": 143233, "epoch": 1725} {"train_loss": -23.116147994995117, "global_step": 143234, "epoch": 1725} {"train_loss": -23.375812530517578, "global_step": 143235, "epoch": 1725} {"train_loss": -23.219186782836914, "global_step": 143236, "epoch": 1725} {"train_loss": -23.216384887695312, "global_step": 143237, "epoch": 1725} {"train_loss": -22.58831787109375, "global_step": 143238, "epoch": 1725} {"train_loss": -22.94826316833496, "global_step": 143239, "epoch": 1725} {"train_loss": -23.023544311523438, "global_step": 143240, "epoch": 1725} {"train_loss": -23.045740127563477, "global_step": 143241, "epoch": 1725} {"train_loss": -23.30879020690918, "global_step": 143242, "epoch": 1725} {"train_loss": -23.495758056640625, "global_step": 143243, "epoch": 1725} {"train_loss": -22.7725772857666, "global_step": 143244, "epoch": 1725} {"train_loss": -23.327829360961914, "global_step": 143245, "epoch": 1725} {"train_loss": -23.05826759338379, "global_step": 143246, "epoch": 1725} {"train_loss": -23.130802154541016, "global_step": 143247, "epoch": 1725} {"train_loss": -22.90298080444336, "global_step": 143248, "epoch": 1725} {"train_loss": -22.889822006225586, "global_step": 143249, "epoch": 1725} {"train_loss": -22.900959014892578, "global_step": 143250, "epoch": 1725} {"train_loss": -23.00674819946289, "global_step": 143251, "epoch": 1725} {"train_loss": -23.19413948059082, "global_step": 143252, "epoch": 1725} {"train_loss": -22.970046997070312, "global_step": 143253, "epoch": 1725} {"train_loss": -23.305625915527344, "global_step": 143254, "epoch": 1725} {"train_loss": -23.08118438720703, "global_step": 143255, "epoch": 1725} {"train_loss": -23.354331970214844, "global_step": 143256, "epoch": 1725} {"train_loss": -22.94359717311629, "global_step": 143257, "epoch": 1725, "val_loss": 6314262.0} {"train_loss": -22.49493980407715, "global_step": 143258, "epoch": 1726} {"train_loss": -22.01797866821289, "global_step": 143259, "epoch": 1726} {"train_loss": -22.43549346923828, "global_step": 143260, "epoch": 1726} {"train_loss": -22.684795379638672, "global_step": 143261, "epoch": 1726} {"train_loss": -22.352758407592773, "global_step": 143262, "epoch": 1726} {"train_loss": -22.573909759521484, "global_step": 143263, "epoch": 1726} {"train_loss": -22.79090118408203, "global_step": 143264, "epoch": 1726} {"train_loss": -22.65886688232422, "global_step": 143265, "epoch": 1726} {"train_loss": -22.803436279296875, "global_step": 143266, "epoch": 1726} {"train_loss": -22.69029998779297, "global_step": 143267, "epoch": 1726} {"train_loss": -23.07571792602539, "global_step": 143268, "epoch": 1726} {"train_loss": -22.554014205932617, "global_step": 143269, "epoch": 1726} {"train_loss": -23.098554611206055, "global_step": 143270, "epoch": 1726} {"train_loss": -22.770050048828125, "global_step": 143271, "epoch": 1726} {"train_loss": -23.2398681640625, "global_step": 143272, "epoch": 1726} {"train_loss": -22.61968994140625, "global_step": 143273, "epoch": 1726} {"train_loss": -22.71055030822754, "global_step": 143274, "epoch": 1726} {"train_loss": -22.8480281829834, "global_step": 143275, "epoch": 1726} {"train_loss": -22.742334365844727, "global_step": 143276, "epoch": 1726} {"train_loss": -22.987960815429688, "global_step": 143277, "epoch": 1726} {"train_loss": -23.050764083862305, "global_step": 143278, "epoch": 1726} {"train_loss": -22.761032104492188, "global_step": 143279, "epoch": 1726} {"train_loss": -23.096660614013672, "global_step": 143280, "epoch": 1726} {"train_loss": -22.852340698242188, "global_step": 143281, "epoch": 1726} {"train_loss": -23.018661499023438, "global_step": 143282, "epoch": 1726} {"train_loss": -22.93914794921875, "global_step": 143283, "epoch": 1726} {"train_loss": -23.189044952392578, "global_step": 143284, "epoch": 1726} {"train_loss": -22.908721923828125, "global_step": 143285, "epoch": 1726} {"train_loss": -22.981769561767578, "global_step": 143286, "epoch": 1726} {"train_loss": -23.09822654724121, "global_step": 143287, "epoch": 1726} {"train_loss": -23.129764556884766, "global_step": 143288, "epoch": 1726} {"train_loss": -22.99554443359375, "global_step": 143289, "epoch": 1726} {"train_loss": -23.340002059936523, "global_step": 143290, "epoch": 1726} {"train_loss": -22.774030685424805, "global_step": 143291, "epoch": 1726} {"train_loss": -23.40531349182129, "global_step": 143292, "epoch": 1726} {"train_loss": -23.105100631713867, "global_step": 143293, "epoch": 1726} {"train_loss": -23.144378662109375, "global_step": 143294, "epoch": 1726} {"train_loss": -22.776649475097656, "global_step": 143295, "epoch": 1726} {"train_loss": -23.04976463317871, "global_step": 143296, "epoch": 1726} {"train_loss": -23.1534481048584, "global_step": 143297, "epoch": 1726} {"train_loss": -23.36971092224121, "global_step": 143298, "epoch": 1726} {"train_loss": -22.975339889526367, "global_step": 143299, "epoch": 1726} {"train_loss": -23.181798934936523, "global_step": 143300, "epoch": 1726} {"train_loss": -23.381582260131836, "global_step": 143301, "epoch": 1726} {"train_loss": -23.009042739868164, "global_step": 143302, "epoch": 1726} {"train_loss": -22.706886291503906, "global_step": 143303, "epoch": 1726} {"train_loss": -23.074758529663086, "global_step": 143304, "epoch": 1726} {"train_loss": -22.97018814086914, "global_step": 143305, "epoch": 1726} {"train_loss": -22.841352462768555, "global_step": 143306, "epoch": 1726} {"train_loss": -22.90117835998535, "global_step": 143307, "epoch": 1726} {"train_loss": -22.709348678588867, "global_step": 143308, "epoch": 1726} {"train_loss": -22.84000015258789, "global_step": 143309, "epoch": 1726} {"train_loss": -22.697546005249023, "global_step": 143310, "epoch": 1726} {"train_loss": -23.110506057739258, "global_step": 143311, "epoch": 1726} {"train_loss": -23.016456604003906, "global_step": 143312, "epoch": 1726} {"train_loss": -22.652158737182617, "global_step": 143313, "epoch": 1726} {"train_loss": -23.076435089111328, "global_step": 143314, "epoch": 1726} {"train_loss": -23.08493423461914, "global_step": 143315, "epoch": 1726} {"train_loss": -22.849639892578125, "global_step": 143316, "epoch": 1726} {"train_loss": -23.601303100585938, "global_step": 143317, "epoch": 1726} {"train_loss": -22.8796443939209, "global_step": 143318, "epoch": 1726} {"train_loss": -22.729385375976562, "global_step": 143319, "epoch": 1726} {"train_loss": -23.253244400024414, "global_step": 143320, "epoch": 1726} {"train_loss": -22.96610450744629, "global_step": 143321, "epoch": 1726} {"train_loss": -23.039344787597656, "global_step": 143322, "epoch": 1726} {"train_loss": -23.185461044311523, "global_step": 143323, "epoch": 1726} {"train_loss": -22.85806655883789, "global_step": 143324, "epoch": 1726} {"train_loss": -23.1220760345459, "global_step": 143325, "epoch": 1726} {"train_loss": -23.143720626831055, "global_step": 143326, "epoch": 1726} {"train_loss": -22.741222381591797, "global_step": 143327, "epoch": 1726} {"train_loss": -22.933303833007812, "global_step": 143328, "epoch": 1726} {"train_loss": -22.806396484375, "global_step": 143329, "epoch": 1726} {"train_loss": -23.46778678894043, "global_step": 143330, "epoch": 1726} {"train_loss": -23.237619400024414, "global_step": 143331, "epoch": 1726} {"train_loss": -23.270343780517578, "global_step": 143332, "epoch": 1726} {"train_loss": -23.275869369506836, "global_step": 143333, "epoch": 1726} {"train_loss": -23.136777877807617, "global_step": 143334, "epoch": 1726} {"train_loss": -23.1833438873291, "global_step": 143335, "epoch": 1726} {"train_loss": -23.12729263305664, "global_step": 143336, "epoch": 1726} {"train_loss": -23.28066062927246, "global_step": 143337, "epoch": 1726} {"train_loss": -23.091228485107422, "global_step": 143338, "epoch": 1726} {"train_loss": -23.18256950378418, "global_step": 143339, "epoch": 1726} {"train_loss": -22.962790776448077, "global_step": 143340, "epoch": 1726, "val_loss": 6364895.5} {"train_loss": -22.566604614257812, "global_step": 143341, "epoch": 1727} {"train_loss": -22.85967254638672, "global_step": 143342, "epoch": 1727} {"train_loss": -22.94822120666504, "global_step": 143343, "epoch": 1727} {"train_loss": -22.959609985351562, "global_step": 143344, "epoch": 1727} {"train_loss": -22.476839065551758, "global_step": 143345, "epoch": 1727} {"train_loss": -22.733034133911133, "global_step": 143346, "epoch": 1727} {"train_loss": -23.039487838745117, "global_step": 143347, "epoch": 1727} {"train_loss": -22.875446319580078, "global_step": 143348, "epoch": 1727} {"train_loss": -22.7179012298584, "global_step": 143349, "epoch": 1727} {"train_loss": -22.881689071655273, "global_step": 143350, "epoch": 1727} {"train_loss": -22.978286743164062, "global_step": 143351, "epoch": 1727} {"train_loss": -22.561864852905273, "global_step": 143352, "epoch": 1727} {"train_loss": -23.073009490966797, "global_step": 143353, "epoch": 1727} {"train_loss": -22.881977081298828, "global_step": 143354, "epoch": 1727} {"train_loss": -22.8287296295166, "global_step": 143355, "epoch": 1727} {"train_loss": -23.04957389831543, "global_step": 143356, "epoch": 1727} {"train_loss": -22.793365478515625, "global_step": 143357, "epoch": 1727} {"train_loss": -22.288698196411133, "global_step": 143358, "epoch": 1727} {"train_loss": -22.707263946533203, "global_step": 143359, "epoch": 1727} {"train_loss": -22.774465560913086, "global_step": 143360, "epoch": 1727} {"train_loss": -23.139291763305664, "global_step": 143361, "epoch": 1727} {"train_loss": -23.068944931030273, "global_step": 143362, "epoch": 1727} {"train_loss": -22.902790069580078, "global_step": 143363, "epoch": 1727} {"train_loss": -22.95262336730957, "global_step": 143364, "epoch": 1727} {"train_loss": -23.136362075805664, "global_step": 143365, "epoch": 1727} {"train_loss": -22.930356979370117, "global_step": 143366, "epoch": 1727} {"train_loss": -23.01947021484375, "global_step": 143367, "epoch": 1727} {"train_loss": -22.789012908935547, "global_step": 143368, "epoch": 1727} {"train_loss": -22.978776931762695, "global_step": 143369, "epoch": 1727} {"train_loss": -23.230701446533203, "global_step": 143370, "epoch": 1727} {"train_loss": -23.02983283996582, "global_step": 143371, "epoch": 1727} {"train_loss": -23.254026412963867, "global_step": 143372, "epoch": 1727} {"train_loss": -22.97796058654785, "global_step": 143373, "epoch": 1727} {"train_loss": -23.02996826171875, "global_step": 143374, "epoch": 1727} {"train_loss": -22.65433120727539, "global_step": 143375, "epoch": 1727} {"train_loss": -23.072975158691406, "global_step": 143376, "epoch": 1727} {"train_loss": -23.079553604125977, "global_step": 143377, "epoch": 1727} {"train_loss": -22.924591064453125, "global_step": 143378, "epoch": 1727} {"train_loss": -23.374191284179688, "global_step": 143379, "epoch": 1727} {"train_loss": -22.984344482421875, "global_step": 143380, "epoch": 1727} {"train_loss": -23.328189849853516, "global_step": 143381, "epoch": 1727} {"train_loss": -22.937129974365234, "global_step": 143382, "epoch": 1727} {"train_loss": -23.164398193359375, "global_step": 143383, "epoch": 1727} {"train_loss": -22.938302993774414, "global_step": 143384, "epoch": 1727} {"train_loss": -23.00142478942871, "global_step": 143385, "epoch": 1727} {"train_loss": -23.23648452758789, "global_step": 143386, "epoch": 1727} {"train_loss": -23.47943878173828, "global_step": 143387, "epoch": 1727} {"train_loss": -23.122495651245117, "global_step": 143388, "epoch": 1727} {"train_loss": -23.53267478942871, "global_step": 143389, "epoch": 1727} {"train_loss": -22.985811233520508, "global_step": 143390, "epoch": 1727} {"train_loss": -22.96932029724121, "global_step": 143391, "epoch": 1727} {"train_loss": -22.925626754760742, "global_step": 143392, "epoch": 1727} {"train_loss": -23.503084182739258, "global_step": 143393, "epoch": 1727} {"train_loss": -22.997488021850586, "global_step": 143394, "epoch": 1727} {"train_loss": -23.039823532104492, "global_step": 143395, "epoch": 1727} {"train_loss": -22.891571044921875, "global_step": 143396, "epoch": 1727} {"train_loss": -23.28912353515625, "global_step": 143397, "epoch": 1727} {"train_loss": -23.078702926635742, "global_step": 143398, "epoch": 1727} {"train_loss": -23.261030197143555, "global_step": 143399, "epoch": 1727} {"train_loss": -23.124853134155273, "global_step": 143400, "epoch": 1727} {"train_loss": -23.312705993652344, "global_step": 143401, "epoch": 1727} {"train_loss": -23.125442504882812, "global_step": 143402, "epoch": 1727} {"train_loss": -22.770580291748047, "global_step": 143403, "epoch": 1727} {"train_loss": -23.035310745239258, "global_step": 143404, "epoch": 1727} {"train_loss": -23.41762351989746, "global_step": 143405, "epoch": 1727} {"train_loss": -23.16509246826172, "global_step": 143406, "epoch": 1727} {"train_loss": -23.15846824645996, "global_step": 143407, "epoch": 1727} {"train_loss": -23.127784729003906, "global_step": 143408, "epoch": 1727} {"train_loss": -23.29057502746582, "global_step": 143409, "epoch": 1727} {"train_loss": -23.46864128112793, "global_step": 143410, "epoch": 1727} {"train_loss": -23.349760055541992, "global_step": 143411, "epoch": 1727} {"train_loss": -23.203018188476562, "global_step": 143412, "epoch": 1727} {"train_loss": -23.165624618530273, "global_step": 143413, "epoch": 1727} {"train_loss": -23.550100326538086, "global_step": 143414, "epoch": 1727} {"train_loss": -22.841508865356445, "global_step": 143415, "epoch": 1727} {"train_loss": -23.088796615600586, "global_step": 143416, "epoch": 1727} {"train_loss": -23.438825607299805, "global_step": 143417, "epoch": 1727} {"train_loss": -23.319231033325195, "global_step": 143418, "epoch": 1727} {"train_loss": -23.14069938659668, "global_step": 143419, "epoch": 1727} {"train_loss": -23.44913101196289, "global_step": 143420, "epoch": 1727} {"train_loss": -23.143569946289062, "global_step": 143421, "epoch": 1727} {"train_loss": -23.375471115112305, "global_step": 143422, "epoch": 1727} {"train_loss": -23.053454502519354, "global_step": 143423, "epoch": 1727, "val_loss": 6315914.0} {"train_loss": -23.09881591796875, "global_step": 143424, "epoch": 1728} {"train_loss": -22.514131546020508, "global_step": 143425, "epoch": 1728} {"train_loss": -23.0355281829834, "global_step": 143426, "epoch": 1728} {"train_loss": -22.842960357666016, "global_step": 143427, "epoch": 1728} {"train_loss": -22.803552627563477, "global_step": 143428, "epoch": 1728} {"train_loss": -22.973678588867188, "global_step": 143429, "epoch": 1728} {"train_loss": -22.7900333404541, "global_step": 143430, "epoch": 1728} {"train_loss": -23.189260482788086, "global_step": 143431, "epoch": 1728} {"train_loss": -23.110549926757812, "global_step": 143432, "epoch": 1728} {"train_loss": -22.715307235717773, "global_step": 143433, "epoch": 1728} {"train_loss": -22.814268112182617, "global_step": 143434, "epoch": 1728} {"train_loss": -22.643524169921875, "global_step": 143435, "epoch": 1728} {"train_loss": -22.785154342651367, "global_step": 143436, "epoch": 1728} {"train_loss": -22.861814498901367, "global_step": 143437, "epoch": 1728} {"train_loss": -22.588003158569336, "global_step": 143438, "epoch": 1728} {"train_loss": -22.67169761657715, "global_step": 143439, "epoch": 1728} {"train_loss": -23.259885787963867, "global_step": 143440, "epoch": 1728} {"train_loss": -23.06886100769043, "global_step": 143441, "epoch": 1728} {"train_loss": -23.05864715576172, "global_step": 143442, "epoch": 1728} {"train_loss": -23.22083854675293, "global_step": 143443, "epoch": 1728} {"train_loss": -22.684545516967773, "global_step": 143444, "epoch": 1728} {"train_loss": -22.75819206237793, "global_step": 143445, "epoch": 1728} {"train_loss": -23.131284713745117, "global_step": 143446, "epoch": 1728} {"train_loss": -22.920318603515625, "global_step": 143447, "epoch": 1728} {"train_loss": -23.31574058532715, "global_step": 143448, "epoch": 1728} {"train_loss": -22.821577072143555, "global_step": 143449, "epoch": 1728} {"train_loss": -22.961034774780273, "global_step": 143450, "epoch": 1728} {"train_loss": -22.882566452026367, "global_step": 143451, "epoch": 1728} {"train_loss": -22.946142196655273, "global_step": 143452, "epoch": 1728} {"train_loss": -23.02890968322754, "global_step": 143453, "epoch": 1728} {"train_loss": -23.138349533081055, "global_step": 143454, "epoch": 1728} {"train_loss": -23.249887466430664, "global_step": 143455, "epoch": 1728} {"train_loss": -23.220478057861328, "global_step": 143456, "epoch": 1728} {"train_loss": -22.968463897705078, "global_step": 143457, "epoch": 1728} {"train_loss": -22.73105239868164, "global_step": 143458, "epoch": 1728} {"train_loss": -23.25349235534668, "global_step": 143459, "epoch": 1728} {"train_loss": -23.22947883605957, "global_step": 143460, "epoch": 1728} {"train_loss": -23.17970085144043, "global_step": 143461, "epoch": 1728} {"train_loss": -23.325410842895508, "global_step": 143462, "epoch": 1728} {"train_loss": -23.398128509521484, "global_step": 143463, "epoch": 1728} {"train_loss": -22.98186683654785, "global_step": 143464, "epoch": 1728} {"train_loss": -23.14365005493164, "global_step": 143465, "epoch": 1728} {"train_loss": -23.122343063354492, "global_step": 143466, "epoch": 1728} {"train_loss": -23.425003051757812, "global_step": 143467, "epoch": 1728} {"train_loss": -22.916584014892578, "global_step": 143468, "epoch": 1728} {"train_loss": -23.18610954284668, "global_step": 143469, "epoch": 1728} {"train_loss": -22.744657516479492, "global_step": 143470, "epoch": 1728} {"train_loss": -23.123258590698242, "global_step": 143471, "epoch": 1728} {"train_loss": -22.90572166442871, "global_step": 143472, "epoch": 1728} {"train_loss": -23.33953285217285, "global_step": 143473, "epoch": 1728} {"train_loss": -22.9482479095459, "global_step": 143474, "epoch": 1728} {"train_loss": -23.287372589111328, "global_step": 143475, "epoch": 1728} {"train_loss": -22.783252716064453, "global_step": 143476, "epoch": 1728} {"train_loss": -23.007658004760742, "global_step": 143477, "epoch": 1728} {"train_loss": -23.086637496948242, "global_step": 143478, "epoch": 1728} {"train_loss": -23.213226318359375, "global_step": 143479, "epoch": 1728} {"train_loss": -23.063589096069336, "global_step": 143480, "epoch": 1728} {"train_loss": -23.431333541870117, "global_step": 143481, "epoch": 1728} {"train_loss": -22.932987213134766, "global_step": 143482, "epoch": 1728} {"train_loss": -23.19074058532715, "global_step": 143483, "epoch": 1728} {"train_loss": -23.24110221862793, "global_step": 143484, "epoch": 1728} {"train_loss": -23.063892364501953, "global_step": 143485, "epoch": 1728} {"train_loss": -22.9620418548584, "global_step": 143486, "epoch": 1728} {"train_loss": -22.650943756103516, "global_step": 143487, "epoch": 1728} {"train_loss": -22.832643508911133, "global_step": 143488, "epoch": 1728} {"train_loss": -23.16225242614746, "global_step": 143489, "epoch": 1728} {"train_loss": -23.032785415649414, "global_step": 143490, "epoch": 1728} {"train_loss": -23.109338760375977, "global_step": 143491, "epoch": 1728} {"train_loss": -23.368864059448242, "global_step": 143492, "epoch": 1728} {"train_loss": -22.827085494995117, "global_step": 143493, "epoch": 1728} {"train_loss": -23.344547271728516, "global_step": 143494, "epoch": 1728} {"train_loss": -23.27596092224121, "global_step": 143495, "epoch": 1728} {"train_loss": -23.127567291259766, "global_step": 143496, "epoch": 1728} {"train_loss": -23.205341339111328, "global_step": 143497, "epoch": 1728} {"train_loss": -23.301076889038086, "global_step": 143498, "epoch": 1728} {"train_loss": -23.253286361694336, "global_step": 143499, "epoch": 1728} {"train_loss": -22.86810874938965, "global_step": 143500, "epoch": 1728} {"train_loss": -23.53803062438965, "global_step": 143501, "epoch": 1728} {"train_loss": -23.397611618041992, "global_step": 143502, "epoch": 1728} {"train_loss": -23.30974006652832, "global_step": 143503, "epoch": 1728} {"train_loss": -23.10334587097168, "global_step": 143504, "epoch": 1728} {"train_loss": -23.36249351501465, "global_step": 143505, "epoch": 1728} {"train_loss": -23.05531681014831, "global_step": 143506, "epoch": 1728, "val_loss": 6320241.0} {"train_loss": -22.814800262451172, "global_step": 143507, "epoch": 1729} {"train_loss": -22.455785751342773, "global_step": 143508, "epoch": 1729} {"train_loss": -23.0765438079834, "global_step": 143509, "epoch": 1729} {"train_loss": -22.45359230041504, "global_step": 143510, "epoch": 1729} {"train_loss": -22.562152862548828, "global_step": 143511, "epoch": 1729} {"train_loss": -22.636690139770508, "global_step": 143512, "epoch": 1729} {"train_loss": -22.409162521362305, "global_step": 143513, "epoch": 1729} {"train_loss": -23.021442413330078, "global_step": 143514, "epoch": 1729} {"train_loss": -22.656234741210938, "global_step": 143515, "epoch": 1729} {"train_loss": -22.852420806884766, "global_step": 143516, "epoch": 1729} {"train_loss": -22.74593162536621, "global_step": 143517, "epoch": 1729} {"train_loss": -22.527997970581055, "global_step": 143518, "epoch": 1729} {"train_loss": -22.929792404174805, "global_step": 143519, "epoch": 1729} {"train_loss": -22.916852951049805, "global_step": 143520, "epoch": 1729} {"train_loss": -22.893606185913086, "global_step": 143521, "epoch": 1729} {"train_loss": -22.87022590637207, "global_step": 143522, "epoch": 1729} {"train_loss": -23.196096420288086, "global_step": 143523, "epoch": 1729} {"train_loss": -23.157672882080078, "global_step": 143524, "epoch": 1729} {"train_loss": -23.071619033813477, "global_step": 143525, "epoch": 1729} {"train_loss": -23.29827308654785, "global_step": 143526, "epoch": 1729} {"train_loss": -23.109743118286133, "global_step": 143527, "epoch": 1729} {"train_loss": -23.05364990234375, "global_step": 143528, "epoch": 1729} {"train_loss": -23.4289608001709, "global_step": 143529, "epoch": 1729} {"train_loss": -23.142637252807617, "global_step": 143530, "epoch": 1729} {"train_loss": -23.13217544555664, "global_step": 143531, "epoch": 1729} {"train_loss": -23.130796432495117, "global_step": 143532, "epoch": 1729} {"train_loss": -23.151416778564453, "global_step": 143533, "epoch": 1729} {"train_loss": -22.871126174926758, "global_step": 143534, "epoch": 1729} {"train_loss": -23.4599609375, "global_step": 143535, "epoch": 1729} {"train_loss": -23.23552703857422, "global_step": 143536, "epoch": 1729} {"train_loss": -23.135910034179688, "global_step": 143537, "epoch": 1729} {"train_loss": -23.313739776611328, "global_step": 143538, "epoch": 1729} {"train_loss": -23.045068740844727, "global_step": 143539, "epoch": 1729} {"train_loss": -23.17234230041504, "global_step": 143540, "epoch": 1729} {"train_loss": -23.190725326538086, "global_step": 143541, "epoch": 1729} {"train_loss": -23.423444747924805, "global_step": 143542, "epoch": 1729} {"train_loss": -23.069721221923828, "global_step": 143543, "epoch": 1729} {"train_loss": -23.200895309448242, "global_step": 143544, "epoch": 1729} {"train_loss": -22.988021850585938, "global_step": 143545, "epoch": 1729} {"train_loss": -23.32316017150879, "global_step": 143546, "epoch": 1729} {"train_loss": -23.12220573425293, "global_step": 143547, "epoch": 1729} {"train_loss": -23.274450302124023, "global_step": 143548, "epoch": 1729} {"train_loss": -23.32880973815918, "global_step": 143549, "epoch": 1729} {"train_loss": -23.701826095581055, "global_step": 143550, "epoch": 1729} {"train_loss": -22.898344039916992, "global_step": 143551, "epoch": 1729} {"train_loss": -22.86335563659668, "global_step": 143552, "epoch": 1729} {"train_loss": -22.651071548461914, "global_step": 143553, "epoch": 1729} {"train_loss": -23.296329498291016, "global_step": 143554, "epoch": 1729} {"train_loss": -23.00010108947754, "global_step": 143555, "epoch": 1729} {"train_loss": -22.857934951782227, "global_step": 143556, "epoch": 1729} {"train_loss": -22.929916381835938, "global_step": 143557, "epoch": 1729} {"train_loss": -22.885828018188477, "global_step": 143558, "epoch": 1729} {"train_loss": -23.062545776367188, "global_step": 143559, "epoch": 1729} {"train_loss": -22.795366287231445, "global_step": 143560, "epoch": 1729} {"train_loss": -23.30084800720215, "global_step": 143561, "epoch": 1729} {"train_loss": -23.369260787963867, "global_step": 143562, "epoch": 1729} {"train_loss": -22.771848678588867, "global_step": 143563, "epoch": 1729} {"train_loss": -22.89423179626465, "global_step": 143564, "epoch": 1729} {"train_loss": -23.036483764648438, "global_step": 143565, "epoch": 1729} {"train_loss": -23.416656494140625, "global_step": 143566, "epoch": 1729} {"train_loss": -22.81107521057129, "global_step": 143567, "epoch": 1729} {"train_loss": -23.354909896850586, "global_step": 143568, "epoch": 1729} {"train_loss": -23.10100555419922, "global_step": 143569, "epoch": 1729} {"train_loss": -23.03829002380371, "global_step": 143570, "epoch": 1729} {"train_loss": -23.0516357421875, "global_step": 143571, "epoch": 1729} {"train_loss": -23.41775894165039, "global_step": 143572, "epoch": 1729} {"train_loss": -23.413928985595703, "global_step": 143573, "epoch": 1729} {"train_loss": -22.823984146118164, "global_step": 143574, "epoch": 1729} {"train_loss": -23.049421310424805, "global_step": 143575, "epoch": 1729} {"train_loss": -23.22723388671875, "global_step": 143576, "epoch": 1729} {"train_loss": -23.32563591003418, "global_step": 143577, "epoch": 1729} {"train_loss": -22.942657470703125, "global_step": 143578, "epoch": 1729} {"train_loss": -23.2929630279541, "global_step": 143579, "epoch": 1729} {"train_loss": -22.982763290405273, "global_step": 143580, "epoch": 1729} {"train_loss": -23.351974487304688, "global_step": 143581, "epoch": 1729} {"train_loss": -23.015289306640625, "global_step": 143582, "epoch": 1729} {"train_loss": -23.1785888671875, "global_step": 143583, "epoch": 1729} {"train_loss": -23.21392822265625, "global_step": 143584, "epoch": 1729} {"train_loss": -23.221952438354492, "global_step": 143585, "epoch": 1729} {"train_loss": -23.552875518798828, "global_step": 143586, "epoch": 1729} {"train_loss": -22.9616756439209, "global_step": 143587, "epoch": 1729} {"train_loss": -23.497507095336914, "global_step": 143588, "epoch": 1729} {"train_loss": -23.066774827888214, "global_step": 143589, "epoch": 1729, "val_loss": 6258038.0} {"train_loss": -22.79587745666504, "global_step": 143590, "epoch": 1730} {"train_loss": -22.299116134643555, "global_step": 143591, "epoch": 1730} {"train_loss": -22.29660987854004, "global_step": 143592, "epoch": 1730} {"train_loss": -22.90032958984375, "global_step": 143593, "epoch": 1730} {"train_loss": -22.660411834716797, "global_step": 143594, "epoch": 1730} {"train_loss": -21.995376586914062, "global_step": 143595, "epoch": 1730} {"train_loss": -22.60634994506836, "global_step": 143596, "epoch": 1730} {"train_loss": -23.071088790893555, "global_step": 143597, "epoch": 1730} {"train_loss": -22.59697914123535, "global_step": 143598, "epoch": 1730} {"train_loss": -23.17782211303711, "global_step": 143599, "epoch": 1730} {"train_loss": -22.551382064819336, "global_step": 143600, "epoch": 1730} {"train_loss": -22.935382843017578, "global_step": 143601, "epoch": 1730} {"train_loss": -22.928197860717773, "global_step": 143602, "epoch": 1730} {"train_loss": -23.07329750061035, "global_step": 143603, "epoch": 1730} {"train_loss": -23.206350326538086, "global_step": 143604, "epoch": 1730} {"train_loss": -22.758255004882812, "global_step": 143605, "epoch": 1730} {"train_loss": -22.79945945739746, "global_step": 143606, "epoch": 1730} {"train_loss": -23.046506881713867, "global_step": 143607, "epoch": 1730} {"train_loss": -22.922887802124023, "global_step": 143608, "epoch": 1730} {"train_loss": -23.097871780395508, "global_step": 143609, "epoch": 1730} {"train_loss": -23.034799575805664, "global_step": 143610, "epoch": 1730} {"train_loss": -23.190433502197266, "global_step": 143611, "epoch": 1730} {"train_loss": -23.174150466918945, "global_step": 143612, "epoch": 1730} {"train_loss": -22.871505737304688, "global_step": 143613, "epoch": 1730} {"train_loss": -22.627483367919922, "global_step": 143614, "epoch": 1730} {"train_loss": -23.214275360107422, "global_step": 143615, "epoch": 1730} {"train_loss": -22.77009391784668, "global_step": 143616, "epoch": 1730} {"train_loss": -22.827054977416992, "global_step": 143617, "epoch": 1730} {"train_loss": -22.89454460144043, "global_step": 143618, "epoch": 1730} {"train_loss": -23.154102325439453, "global_step": 143619, "epoch": 1730} {"train_loss": -23.154890060424805, "global_step": 143620, "epoch": 1730} {"train_loss": -22.864864349365234, "global_step": 143621, "epoch": 1730} {"train_loss": -23.18950653076172, "global_step": 143622, "epoch": 1730} {"train_loss": -23.14655876159668, "global_step": 143623, "epoch": 1730} {"train_loss": -23.110591888427734, "global_step": 143624, "epoch": 1730} {"train_loss": -23.242542266845703, "global_step": 143625, "epoch": 1730} {"train_loss": -23.514896392822266, "global_step": 143626, "epoch": 1730} {"train_loss": -23.009450912475586, "global_step": 143627, "epoch": 1730} {"train_loss": -23.202285766601562, "global_step": 143628, "epoch": 1730} {"train_loss": -22.996793746948242, "global_step": 143629, "epoch": 1730} {"train_loss": -23.038698196411133, "global_step": 143630, "epoch": 1730} {"train_loss": -23.610280990600586, "global_step": 143631, "epoch": 1730} {"train_loss": -23.238096237182617, "global_step": 143632, "epoch": 1730} {"train_loss": -23.1182861328125, "global_step": 143633, "epoch": 1730} {"train_loss": -23.180131912231445, "global_step": 143634, "epoch": 1730} {"train_loss": -23.508039474487305, "global_step": 143635, "epoch": 1730} {"train_loss": -23.4486083984375, "global_step": 143636, "epoch": 1730} {"train_loss": -23.494577407836914, "global_step": 143637, "epoch": 1730} {"train_loss": -23.326913833618164, "global_step": 143638, "epoch": 1730} {"train_loss": -22.729095458984375, "global_step": 143639, "epoch": 1730} {"train_loss": -23.19403839111328, "global_step": 143640, "epoch": 1730} {"train_loss": -23.23082733154297, "global_step": 143641, "epoch": 1730} {"train_loss": -22.4915771484375, "global_step": 143642, "epoch": 1730} {"train_loss": -23.11751365661621, "global_step": 143643, "epoch": 1730} {"train_loss": -23.03427505493164, "global_step": 143644, "epoch": 1730} {"train_loss": -23.461698532104492, "global_step": 143645, "epoch": 1730} {"train_loss": -22.93360710144043, "global_step": 143646, "epoch": 1730} {"train_loss": -23.002878189086914, "global_step": 143647, "epoch": 1730} {"train_loss": -23.033899307250977, "global_step": 143648, "epoch": 1730} {"train_loss": -23.611560821533203, "global_step": 143649, "epoch": 1730} {"train_loss": -22.983186721801758, "global_step": 143650, "epoch": 1730} {"train_loss": -22.741987228393555, "global_step": 143651, "epoch": 1730} {"train_loss": -22.72942352294922, "global_step": 143652, "epoch": 1730} {"train_loss": -22.996923446655273, "global_step": 143653, "epoch": 1730} {"train_loss": -22.847091674804688, "global_step": 143654, "epoch": 1730} {"train_loss": -22.797874450683594, "global_step": 143655, "epoch": 1730} {"train_loss": -22.7086238861084, "global_step": 143656, "epoch": 1730} {"train_loss": -23.09986686706543, "global_step": 143657, "epoch": 1730} {"train_loss": -22.8945255279541, "global_step": 143658, "epoch": 1730} {"train_loss": -22.846107482910156, "global_step": 143659, "epoch": 1730} {"train_loss": -22.875593185424805, "global_step": 143660, "epoch": 1730} {"train_loss": -23.190685272216797, "global_step": 143661, "epoch": 1730} {"train_loss": -23.163644790649414, "global_step": 143662, "epoch": 1730} {"train_loss": -23.11988639831543, "global_step": 143663, "epoch": 1730} {"train_loss": -22.974088668823242, "global_step": 143664, "epoch": 1730} {"train_loss": -23.1622314453125, "global_step": 143665, "epoch": 1730} {"train_loss": -22.668779373168945, "global_step": 143666, "epoch": 1730} {"train_loss": -23.517797470092773, "global_step": 143667, "epoch": 1730} {"train_loss": -23.14347267150879, "global_step": 143668, "epoch": 1730} {"train_loss": -22.95514488220215, "global_step": 143669, "epoch": 1730} {"train_loss": -23.028287887573242, "global_step": 143670, "epoch": 1730} {"train_loss": -23.029865264892578, "global_step": 143671, "epoch": 1730} {"train_loss": -23.01734515270555, "global_step": 143672, "epoch": 1730, "val_loss": 6302044.0} {"train_loss": -22.585153579711914, "global_step": 143673, "epoch": 1731} {"train_loss": -22.8746395111084, "global_step": 143674, "epoch": 1731} {"train_loss": -22.971845626831055, "global_step": 143675, "epoch": 1731} {"train_loss": -22.452987670898438, "global_step": 143676, "epoch": 1731} {"train_loss": -22.906442642211914, "global_step": 143677, "epoch": 1731} {"train_loss": -22.680465698242188, "global_step": 143678, "epoch": 1731} {"train_loss": -22.735347747802734, "global_step": 143679, "epoch": 1731} {"train_loss": -22.70499610900879, "global_step": 143680, "epoch": 1731} {"train_loss": -22.991552352905273, "global_step": 143681, "epoch": 1731} {"train_loss": -23.122976303100586, "global_step": 143682, "epoch": 1731} {"train_loss": -23.132946014404297, "global_step": 143683, "epoch": 1731} {"train_loss": -22.773582458496094, "global_step": 143684, "epoch": 1731} {"train_loss": -23.121030807495117, "global_step": 143685, "epoch": 1731} {"train_loss": -23.059816360473633, "global_step": 143686, "epoch": 1731} {"train_loss": -23.441349029541016, "global_step": 143687, "epoch": 1731} {"train_loss": -22.93088150024414, "global_step": 143688, "epoch": 1731} {"train_loss": -23.057937622070312, "global_step": 143689, "epoch": 1731} {"train_loss": -23.101505279541016, "global_step": 143690, "epoch": 1731} {"train_loss": -23.217817306518555, "global_step": 143691, "epoch": 1731} {"train_loss": -23.0031795501709, "global_step": 143692, "epoch": 1731} {"train_loss": -23.254934310913086, "global_step": 143693, "epoch": 1731} {"train_loss": -23.00771141052246, "global_step": 143694, "epoch": 1731} {"train_loss": -23.252487182617188, "global_step": 143695, "epoch": 1731} {"train_loss": -23.14569854736328, "global_step": 143696, "epoch": 1731} {"train_loss": -23.279664993286133, "global_step": 143697, "epoch": 1731} {"train_loss": -23.05063247680664, "global_step": 143698, "epoch": 1731} {"train_loss": -23.299108505249023, "global_step": 143699, "epoch": 1731} {"train_loss": -23.293302536010742, "global_step": 143700, "epoch": 1731} {"train_loss": -23.01909828186035, "global_step": 143701, "epoch": 1731} {"train_loss": -22.98068618774414, "global_step": 143702, "epoch": 1731} {"train_loss": -23.179216384887695, "global_step": 143703, "epoch": 1731} {"train_loss": -22.78718376159668, "global_step": 143704, "epoch": 1731} {"train_loss": -23.1437931060791, "global_step": 143705, "epoch": 1731} {"train_loss": -23.193683624267578, "global_step": 143706, "epoch": 1731} {"train_loss": -22.82964324951172, "global_step": 143707, "epoch": 1731} {"train_loss": -23.002580642700195, "global_step": 143708, "epoch": 1731} {"train_loss": -23.24761390686035, "global_step": 143709, "epoch": 1731} {"train_loss": -23.36415672302246, "global_step": 143710, "epoch": 1731} {"train_loss": -23.404327392578125, "global_step": 143711, "epoch": 1731} {"train_loss": -23.081710815429688, "global_step": 143712, "epoch": 1731} {"train_loss": -23.196622848510742, "global_step": 143713, "epoch": 1731} {"train_loss": -23.204633712768555, "global_step": 143714, "epoch": 1731} {"train_loss": -22.99092674255371, "global_step": 143715, "epoch": 1731} {"train_loss": -23.22491455078125, "global_step": 143716, "epoch": 1731} {"train_loss": -23.011322021484375, "global_step": 143717, "epoch": 1731} {"train_loss": -23.24262046813965, "global_step": 143718, "epoch": 1731} {"train_loss": -23.009403228759766, "global_step": 143719, "epoch": 1731} {"train_loss": -23.07848358154297, "global_step": 143720, "epoch": 1731} {"train_loss": -22.843847274780273, "global_step": 143721, "epoch": 1731} {"train_loss": -22.868738174438477, "global_step": 143722, "epoch": 1731} {"train_loss": -23.079618453979492, "global_step": 143723, "epoch": 1731} {"train_loss": -23.065990447998047, "global_step": 143724, "epoch": 1731} {"train_loss": -23.3691463470459, "global_step": 143725, "epoch": 1731} {"train_loss": -23.1480770111084, "global_step": 143726, "epoch": 1731} {"train_loss": -23.268245697021484, "global_step": 143727, "epoch": 1731} {"train_loss": -23.05952262878418, "global_step": 143728, "epoch": 1731} {"train_loss": -23.395965576171875, "global_step": 143729, "epoch": 1731} {"train_loss": -23.463397979736328, "global_step": 143730, "epoch": 1731} {"train_loss": -23.324743270874023, "global_step": 143731, "epoch": 1731} {"train_loss": -23.067401885986328, "global_step": 143732, "epoch": 1731} {"train_loss": -23.50452995300293, "global_step": 143733, "epoch": 1731} {"train_loss": -23.205020904541016, "global_step": 143734, "epoch": 1731} {"train_loss": -23.337995529174805, "global_step": 143735, "epoch": 1731} {"train_loss": -23.508813858032227, "global_step": 143736, "epoch": 1731} {"train_loss": -22.96071434020996, "global_step": 143737, "epoch": 1731} {"train_loss": -22.80541229248047, "global_step": 143738, "epoch": 1731} {"train_loss": -23.233280181884766, "global_step": 143739, "epoch": 1731} {"train_loss": -22.901052474975586, "global_step": 143740, "epoch": 1731} {"train_loss": -22.947372436523438, "global_step": 143741, "epoch": 1731} {"train_loss": -22.894235610961914, "global_step": 143742, "epoch": 1731} {"train_loss": -23.183351516723633, "global_step": 143743, "epoch": 1731} {"train_loss": -22.885404586791992, "global_step": 143744, "epoch": 1731} {"train_loss": -23.490835189819336, "global_step": 143745, "epoch": 1731} {"train_loss": -23.085134506225586, "global_step": 143746, "epoch": 1731} {"train_loss": -23.216400146484375, "global_step": 143747, "epoch": 1731} {"train_loss": -23.119617462158203, "global_step": 143748, "epoch": 1731} {"train_loss": -23.082822799682617, "global_step": 143749, "epoch": 1731} {"train_loss": -23.030200958251953, "global_step": 143750, "epoch": 1731} {"train_loss": -23.26875877380371, "global_step": 143751, "epoch": 1731} {"train_loss": -23.097612380981445, "global_step": 143752, "epoch": 1731} {"train_loss": -22.72987174987793, "global_step": 143753, "epoch": 1731} {"train_loss": -22.655344009399414, "global_step": 143754, "epoch": 1731} {"train_loss": -23.09313787896949, "global_step": 143755, "epoch": 1731, "val_loss": 6332610.0} {"train_loss": -21.548416137695312, "global_step": 143756, "epoch": 1732} {"train_loss": -22.804996490478516, "global_step": 143757, "epoch": 1732} {"train_loss": -21.93602752685547, "global_step": 143758, "epoch": 1732} {"train_loss": -22.590681076049805, "global_step": 143759, "epoch": 1732} {"train_loss": -22.18898582458496, "global_step": 143760, "epoch": 1732} {"train_loss": -22.1486873626709, "global_step": 143761, "epoch": 1732} {"train_loss": -22.958032608032227, "global_step": 143762, "epoch": 1732} {"train_loss": -22.221532821655273, "global_step": 143763, "epoch": 1732} {"train_loss": -22.45746421813965, "global_step": 143764, "epoch": 1732} {"train_loss": -22.459012985229492, "global_step": 143765, "epoch": 1732} {"train_loss": -22.263349533081055, "global_step": 143766, "epoch": 1732} {"train_loss": -22.748355865478516, "global_step": 143767, "epoch": 1732} {"train_loss": -22.381244659423828, "global_step": 143768, "epoch": 1732} {"train_loss": -22.64338493347168, "global_step": 143769, "epoch": 1732} {"train_loss": -22.678945541381836, "global_step": 143770, "epoch": 1732} {"train_loss": -22.58547019958496, "global_step": 143771, "epoch": 1732} {"train_loss": -23.10939598083496, "global_step": 143772, "epoch": 1732} {"train_loss": -22.58347511291504, "global_step": 143773, "epoch": 1732} {"train_loss": -22.968046188354492, "global_step": 143774, "epoch": 1732} {"train_loss": -22.767444610595703, "global_step": 143775, "epoch": 1732} {"train_loss": -23.059762954711914, "global_step": 143776, "epoch": 1732} {"train_loss": -22.885114669799805, "global_step": 143777, "epoch": 1732} {"train_loss": -22.706329345703125, "global_step": 143778, "epoch": 1732} {"train_loss": -22.928701400756836, "global_step": 143779, "epoch": 1732} {"train_loss": -23.00821304321289, "global_step": 143780, "epoch": 1732} {"train_loss": -22.64023780822754, "global_step": 143781, "epoch": 1732} {"train_loss": -23.189300537109375, "global_step": 143782, "epoch": 1732} {"train_loss": -22.71376609802246, "global_step": 143783, "epoch": 1732} {"train_loss": -22.641754150390625, "global_step": 143784, "epoch": 1732} {"train_loss": -22.77827262878418, "global_step": 143785, "epoch": 1732} {"train_loss": -22.879135131835938, "global_step": 143786, "epoch": 1732} {"train_loss": -23.186811447143555, "global_step": 143787, "epoch": 1732} {"train_loss": -22.85462760925293, "global_step": 143788, "epoch": 1732} {"train_loss": -22.74005126953125, "global_step": 143789, "epoch": 1732} {"train_loss": -22.793832778930664, "global_step": 143790, "epoch": 1732} {"train_loss": -23.091943740844727, "global_step": 143791, "epoch": 1732} {"train_loss": -23.50472068786621, "global_step": 143792, "epoch": 1732} {"train_loss": -23.00296401977539, "global_step": 143793, "epoch": 1732} {"train_loss": -22.773672103881836, "global_step": 143794, "epoch": 1732} {"train_loss": -23.212190628051758, "global_step": 143795, "epoch": 1732} {"train_loss": -23.398590087890625, "global_step": 143796, "epoch": 1732} {"train_loss": -22.755943298339844, "global_step": 143797, "epoch": 1732} {"train_loss": -22.952625274658203, "global_step": 143798, "epoch": 1732} {"train_loss": -22.931337356567383, "global_step": 143799, "epoch": 1732} {"train_loss": -23.160634994506836, "global_step": 143800, "epoch": 1732} {"train_loss": -23.06476593017578, "global_step": 143801, "epoch": 1732} {"train_loss": -22.881559371948242, "global_step": 143802, "epoch": 1732} {"train_loss": -23.365312576293945, "global_step": 143803, "epoch": 1732} {"train_loss": -22.892292022705078, "global_step": 143804, "epoch": 1732} {"train_loss": -23.407255172729492, "global_step": 143805, "epoch": 1732} {"train_loss": -23.13795280456543, "global_step": 143806, "epoch": 1732} {"train_loss": -23.294281005859375, "global_step": 143807, "epoch": 1732} {"train_loss": -23.155616760253906, "global_step": 143808, "epoch": 1732} {"train_loss": -23.205968856811523, "global_step": 143809, "epoch": 1732} {"train_loss": -23.23398780822754, "global_step": 143810, "epoch": 1732} {"train_loss": -23.156644821166992, "global_step": 143811, "epoch": 1732} {"train_loss": -23.2103328704834, "global_step": 143812, "epoch": 1732} {"train_loss": -23.380048751831055, "global_step": 143813, "epoch": 1732} {"train_loss": -23.12040138244629, "global_step": 143814, "epoch": 1732} {"train_loss": -23.158227920532227, "global_step": 143815, "epoch": 1732} {"train_loss": -23.340551376342773, "global_step": 143816, "epoch": 1732} {"train_loss": -23.06804847717285, "global_step": 143817, "epoch": 1732} {"train_loss": -23.38426399230957, "global_step": 143818, "epoch": 1732} {"train_loss": -23.352758407592773, "global_step": 143819, "epoch": 1732} {"train_loss": -22.82139778137207, "global_step": 143820, "epoch": 1732} {"train_loss": -22.811492919921875, "global_step": 143821, "epoch": 1732} {"train_loss": -23.217599868774414, "global_step": 143822, "epoch": 1732} {"train_loss": -23.10831642150879, "global_step": 143823, "epoch": 1732} {"train_loss": -23.20745849609375, "global_step": 143824, "epoch": 1732} {"train_loss": -22.749282836914062, "global_step": 143825, "epoch": 1732} {"train_loss": -23.507436752319336, "global_step": 143826, "epoch": 1732} {"train_loss": -23.126367568969727, "global_step": 143827, "epoch": 1732} {"train_loss": -22.803129196166992, "global_step": 143828, "epoch": 1732} {"train_loss": -23.124834060668945, "global_step": 143829, "epoch": 1732} {"train_loss": -23.00510025024414, "global_step": 143830, "epoch": 1732} {"train_loss": -23.061630249023438, "global_step": 143831, "epoch": 1732} {"train_loss": -23.307214736938477, "global_step": 143832, "epoch": 1732} {"train_loss": -23.41065788269043, "global_step": 143833, "epoch": 1732} {"train_loss": -22.56084632873535, "global_step": 143834, "epoch": 1732} {"train_loss": -22.858362197875977, "global_step": 143835, "epoch": 1732} {"train_loss": -23.235559463500977, "global_step": 143836, "epoch": 1732} {"train_loss": -22.66766357421875, "global_step": 143837, "epoch": 1732} {"train_loss": -22.923158898411028, "global_step": 143838, "epoch": 1732, "val_loss": 6233284.0} {"train_loss": -22.898845672607422, "global_step": 143839, "epoch": 1733} {"train_loss": -23.128477096557617, "global_step": 143840, "epoch": 1733} {"train_loss": -22.82302474975586, "global_step": 143841, "epoch": 1733} {"train_loss": -23.04254150390625, "global_step": 143842, "epoch": 1733} {"train_loss": -23.49209976196289, "global_step": 143843, "epoch": 1733} {"train_loss": -22.658605575561523, "global_step": 143844, "epoch": 1733} {"train_loss": -23.132816314697266, "global_step": 143845, "epoch": 1733} {"train_loss": -22.77143669128418, "global_step": 143846, "epoch": 1733} {"train_loss": -22.76353645324707, "global_step": 143847, "epoch": 1733} {"train_loss": -23.12171173095703, "global_step": 143848, "epoch": 1733} {"train_loss": -23.157712936401367, "global_step": 143849, "epoch": 1733} {"train_loss": -22.91080093383789, "global_step": 143850, "epoch": 1733} {"train_loss": -23.035930633544922, "global_step": 143851, "epoch": 1733} {"train_loss": -23.086761474609375, "global_step": 143852, "epoch": 1733} {"train_loss": -23.127079010009766, "global_step": 143853, "epoch": 1733} {"train_loss": -23.146596908569336, "global_step": 143854, "epoch": 1733} {"train_loss": -23.01894187927246, "global_step": 143855, "epoch": 1733} {"train_loss": -23.051013946533203, "global_step": 143856, "epoch": 1733} {"train_loss": -22.7793025970459, "global_step": 143857, "epoch": 1733} {"train_loss": -23.031015396118164, "global_step": 143858, "epoch": 1733} {"train_loss": -22.75507164001465, "global_step": 143859, "epoch": 1733} {"train_loss": -23.027557373046875, "global_step": 143860, "epoch": 1733} {"train_loss": -23.460132598876953, "global_step": 143861, "epoch": 1733} {"train_loss": -23.08680534362793, "global_step": 143862, "epoch": 1733} {"train_loss": -23.220659255981445, "global_step": 143863, "epoch": 1733} {"train_loss": -23.15363883972168, "global_step": 143864, "epoch": 1733} {"train_loss": -22.9251766204834, "global_step": 143865, "epoch": 1733} {"train_loss": -23.13243865966797, "global_step": 143866, "epoch": 1733} {"train_loss": -23.3179931640625, "global_step": 143867, "epoch": 1733} {"train_loss": -23.166025161743164, "global_step": 143868, "epoch": 1733} {"train_loss": -23.191146850585938, "global_step": 143869, "epoch": 1733} {"train_loss": -22.9907169342041, "global_step": 143870, "epoch": 1733} {"train_loss": -23.099700927734375, "global_step": 143871, "epoch": 1733} {"train_loss": -23.02033042907715, "global_step": 143872, "epoch": 1733} {"train_loss": -23.01118278503418, "global_step": 143873, "epoch": 1733} {"train_loss": -23.01064109802246, "global_step": 143874, "epoch": 1733} {"train_loss": -23.035634994506836, "global_step": 143875, "epoch": 1733} {"train_loss": -23.159992218017578, "global_step": 143876, "epoch": 1733} {"train_loss": -22.897748947143555, "global_step": 143877, "epoch": 1733} {"train_loss": -22.861486434936523, "global_step": 143878, "epoch": 1733} {"train_loss": -23.152423858642578, "global_step": 143879, "epoch": 1733} {"train_loss": -23.6290225982666, "global_step": 143880, "epoch": 1733} {"train_loss": -23.514142990112305, "global_step": 143881, "epoch": 1733} {"train_loss": -23.16263771057129, "global_step": 143882, "epoch": 1733} {"train_loss": -23.318471908569336, "global_step": 143883, "epoch": 1733} {"train_loss": -23.64582633972168, "global_step": 143884, "epoch": 1733} {"train_loss": -22.980472564697266, "global_step": 143885, "epoch": 1733} {"train_loss": -22.95562744140625, "global_step": 143886, "epoch": 1733} {"train_loss": -23.05868148803711, "global_step": 143887, "epoch": 1733} {"train_loss": -23.431631088256836, "global_step": 143888, "epoch": 1733} {"train_loss": -23.252901077270508, "global_step": 143889, "epoch": 1733} {"train_loss": -22.89552116394043, "global_step": 143890, "epoch": 1733} {"train_loss": -22.99784278869629, "global_step": 143891, "epoch": 1733} {"train_loss": -23.34077262878418, "global_step": 143892, "epoch": 1733} {"train_loss": -23.68729019165039, "global_step": 143893, "epoch": 1733} {"train_loss": -23.371931076049805, "global_step": 143894, "epoch": 1733} {"train_loss": -23.44221305847168, "global_step": 143895, "epoch": 1733} {"train_loss": -22.95989418029785, "global_step": 143896, "epoch": 1733} {"train_loss": -23.38351821899414, "global_step": 143897, "epoch": 1733} {"train_loss": -23.282672882080078, "global_step": 143898, "epoch": 1733} {"train_loss": -22.846494674682617, "global_step": 143899, "epoch": 1733} {"train_loss": -22.84969139099121, "global_step": 143900, "epoch": 1733} {"train_loss": -22.33558464050293, "global_step": 143901, "epoch": 1733} {"train_loss": -22.359651565551758, "global_step": 143902, "epoch": 1733} {"train_loss": -23.238828659057617, "global_step": 143903, "epoch": 1733} {"train_loss": -23.19425392150879, "global_step": 143904, "epoch": 1733} {"train_loss": -22.7906494140625, "global_step": 143905, "epoch": 1733} {"train_loss": -23.104406356811523, "global_step": 143906, "epoch": 1733} {"train_loss": -23.01830291748047, "global_step": 143907, "epoch": 1733} {"train_loss": -22.732074737548828, "global_step": 143908, "epoch": 1733} {"train_loss": -22.712234497070312, "global_step": 143909, "epoch": 1733} {"train_loss": -23.24030876159668, "global_step": 143910, "epoch": 1733} {"train_loss": -22.989887237548828, "global_step": 143911, "epoch": 1733} {"train_loss": -23.141836166381836, "global_step": 143912, "epoch": 1733} {"train_loss": -23.118408203125, "global_step": 143913, "epoch": 1733} {"train_loss": -23.323816299438477, "global_step": 143914, "epoch": 1733} {"train_loss": -23.050764083862305, "global_step": 143915, "epoch": 1733} {"train_loss": -23.298099517822266, "global_step": 143916, "epoch": 1733} {"train_loss": -23.399551391601562, "global_step": 143917, "epoch": 1733} {"train_loss": -23.17315673828125, "global_step": 143918, "epoch": 1733} {"train_loss": -23.13121795654297, "global_step": 143919, "epoch": 1733} {"train_loss": -23.19309425354004, "global_step": 143920, "epoch": 1733} {"train_loss": -23.083250137696783, "global_step": 143921, "epoch": 1733, "val_loss": 6244931.0} {"train_loss": -22.545164108276367, "global_step": 143922, "epoch": 1734} {"train_loss": -22.726545333862305, "global_step": 143923, "epoch": 1734} {"train_loss": -22.912141799926758, "global_step": 143924, "epoch": 1734} {"train_loss": -23.31561279296875, "global_step": 143925, "epoch": 1734} {"train_loss": -23.08284568786621, "global_step": 143926, "epoch": 1734} {"train_loss": -22.794570922851562, "global_step": 143927, "epoch": 1734} {"train_loss": -22.90984535217285, "global_step": 143928, "epoch": 1734} {"train_loss": -23.078025817871094, "global_step": 143929, "epoch": 1734} {"train_loss": -23.29810333251953, "global_step": 143930, "epoch": 1734} {"train_loss": -23.01906967163086, "global_step": 143931, "epoch": 1734} {"train_loss": -22.96010398864746, "global_step": 143932, "epoch": 1734} {"train_loss": -23.09320068359375, "global_step": 143933, "epoch": 1734} {"train_loss": -22.852005004882812, "global_step": 143934, "epoch": 1734} {"train_loss": -23.470989227294922, "global_step": 143935, "epoch": 1734} {"train_loss": -23.162841796875, "global_step": 143936, "epoch": 1734} {"train_loss": -22.797277450561523, "global_step": 143937, "epoch": 1734} {"train_loss": -22.973003387451172, "global_step": 143938, "epoch": 1734} {"train_loss": -22.983083724975586, "global_step": 143939, "epoch": 1734} {"train_loss": -23.446979522705078, "global_step": 143940, "epoch": 1734} {"train_loss": -23.283353805541992, "global_step": 143941, "epoch": 1734} {"train_loss": -23.189924240112305, "global_step": 143942, "epoch": 1734} {"train_loss": -23.131805419921875, "global_step": 143943, "epoch": 1734} {"train_loss": -22.968326568603516, "global_step": 143944, "epoch": 1734} {"train_loss": -23.1567325592041, "global_step": 143945, "epoch": 1734} {"train_loss": -22.979040145874023, "global_step": 143946, "epoch": 1734} {"train_loss": -23.094064712524414, "global_step": 143947, "epoch": 1734} {"train_loss": -22.7364501953125, "global_step": 143948, "epoch": 1734} {"train_loss": -23.285736083984375, "global_step": 143949, "epoch": 1734} {"train_loss": -22.9268856048584, "global_step": 143950, "epoch": 1734} {"train_loss": -23.282466888427734, "global_step": 143951, "epoch": 1734} {"train_loss": -23.1742000579834, "global_step": 143952, "epoch": 1734} {"train_loss": -23.22554588317871, "global_step": 143953, "epoch": 1734} {"train_loss": -23.352859497070312, "global_step": 143954, "epoch": 1734} {"train_loss": -23.541616439819336, "global_step": 143955, "epoch": 1734} {"train_loss": -23.131452560424805, "global_step": 143956, "epoch": 1734} {"train_loss": -23.17083740234375, "global_step": 143957, "epoch": 1734} {"train_loss": -23.184843063354492, "global_step": 143958, "epoch": 1734} {"train_loss": -23.363550186157227, "global_step": 143959, "epoch": 1734} {"train_loss": -23.423593521118164, "global_step": 143960, "epoch": 1734} {"train_loss": -23.236984252929688, "global_step": 143961, "epoch": 1734} {"train_loss": -23.091684341430664, "global_step": 143962, "epoch": 1734} {"train_loss": -23.050872802734375, "global_step": 143963, "epoch": 1734} {"train_loss": -22.445144653320312, "global_step": 143964, "epoch": 1734} {"train_loss": -23.05618667602539, "global_step": 143965, "epoch": 1734} {"train_loss": -23.11383628845215, "global_step": 143966, "epoch": 1734} {"train_loss": -22.759628295898438, "global_step": 143967, "epoch": 1734} {"train_loss": -22.49245262145996, "global_step": 143968, "epoch": 1734} {"train_loss": -22.70947265625, "global_step": 143969, "epoch": 1734} {"train_loss": -22.7004451751709, "global_step": 143970, "epoch": 1734} {"train_loss": -22.50909996032715, "global_step": 143971, "epoch": 1734} {"train_loss": -22.56686782836914, "global_step": 143972, "epoch": 1734} {"train_loss": -22.929420471191406, "global_step": 143973, "epoch": 1734} {"train_loss": -23.090383529663086, "global_step": 143974, "epoch": 1734} {"train_loss": -22.796483993530273, "global_step": 143975, "epoch": 1734} {"train_loss": -23.01520347595215, "global_step": 143976, "epoch": 1734} {"train_loss": -22.880084991455078, "global_step": 143977, "epoch": 1734} {"train_loss": -22.984704971313477, "global_step": 143978, "epoch": 1734} {"train_loss": -23.24472427368164, "global_step": 143979, "epoch": 1734} {"train_loss": -22.86530876159668, "global_step": 143980, "epoch": 1734} {"train_loss": -23.22284507751465, "global_step": 143981, "epoch": 1734} {"train_loss": -23.32930564880371, "global_step": 143982, "epoch": 1734} {"train_loss": -23.194387435913086, "global_step": 143983, "epoch": 1734} {"train_loss": -23.022113800048828, "global_step": 143984, "epoch": 1734} {"train_loss": -23.3453426361084, "global_step": 143985, "epoch": 1734} {"train_loss": -23.133420944213867, "global_step": 143986, "epoch": 1734} {"train_loss": -23.199176788330078, "global_step": 143987, "epoch": 1734} {"train_loss": -22.94926643371582, "global_step": 143988, "epoch": 1734} {"train_loss": -23.416181564331055, "global_step": 143989, "epoch": 1734} {"train_loss": -23.137414932250977, "global_step": 143990, "epoch": 1734} {"train_loss": -22.978097915649414, "global_step": 143991, "epoch": 1734} {"train_loss": -23.38935661315918, "global_step": 143992, "epoch": 1734} {"train_loss": -23.200183868408203, "global_step": 143993, "epoch": 1734} {"train_loss": -23.306005477905273, "global_step": 143994, "epoch": 1734} {"train_loss": -22.92234230041504, "global_step": 143995, "epoch": 1734} {"train_loss": -23.57314109802246, "global_step": 143996, "epoch": 1734} {"train_loss": -23.150428771972656, "global_step": 143997, "epoch": 1734} {"train_loss": -22.808271408081055, "global_step": 143998, "epoch": 1734} {"train_loss": -23.40386962890625, "global_step": 143999, "epoch": 1734} {"train_loss": -23.462390899658203, "global_step": 144000, "epoch": 1734} {"train_loss": -23.224729537963867, "global_step": 144001, "epoch": 1734} {"train_loss": -23.295358657836914, "global_step": 144002, "epoch": 1734} {"train_loss": -23.068689346313477, "global_step": 144003, "epoch": 1734} {"train_loss": -23.0806902000703, "global_step": 144004, "epoch": 1734, "val_loss": 6439093.0} {"train_loss": -23.136545181274414, "global_step": 144005, "epoch": 1735} {"train_loss": -22.661916732788086, "global_step": 144006, "epoch": 1735} {"train_loss": -22.61185073852539, "global_step": 144007, "epoch": 1735} {"train_loss": -22.839277267456055, "global_step": 144008, "epoch": 1735} {"train_loss": -22.73050308227539, "global_step": 144009, "epoch": 1735} {"train_loss": -22.646230697631836, "global_step": 144010, "epoch": 1735} {"train_loss": -23.006942749023438, "global_step": 144011, "epoch": 1735} {"train_loss": -22.71744728088379, "global_step": 144012, "epoch": 1735} {"train_loss": -22.998971939086914, "global_step": 144013, "epoch": 1735} {"train_loss": -22.869497299194336, "global_step": 144014, "epoch": 1735} {"train_loss": -23.043066024780273, "global_step": 144015, "epoch": 1735} {"train_loss": -22.83292007446289, "global_step": 144016, "epoch": 1735} {"train_loss": -23.203758239746094, "global_step": 144017, "epoch": 1735} {"train_loss": -23.030607223510742, "global_step": 144018, "epoch": 1735} {"train_loss": -22.922494888305664, "global_step": 144019, "epoch": 1735} {"train_loss": -22.968915939331055, "global_step": 144020, "epoch": 1735} {"train_loss": -22.741735458374023, "global_step": 144021, "epoch": 1735} {"train_loss": -23.09323501586914, "global_step": 144022, "epoch": 1735} {"train_loss": -22.987905502319336, "global_step": 144023, "epoch": 1735} {"train_loss": -22.93476104736328, "global_step": 144024, "epoch": 1735} {"train_loss": -22.819782257080078, "global_step": 144025, "epoch": 1735} {"train_loss": -22.865402221679688, "global_step": 144026, "epoch": 1735} {"train_loss": -22.917959213256836, "global_step": 144027, "epoch": 1735} {"train_loss": -23.06344223022461, "global_step": 144028, "epoch": 1735} {"train_loss": -22.901752471923828, "global_step": 144029, "epoch": 1735} {"train_loss": -23.238037109375, "global_step": 144030, "epoch": 1735} {"train_loss": -22.83518409729004, "global_step": 144031, "epoch": 1735} {"train_loss": -23.035261154174805, "global_step": 144032, "epoch": 1735} {"train_loss": -23.259002685546875, "global_step": 144033, "epoch": 1735} {"train_loss": -22.943424224853516, "global_step": 144034, "epoch": 1735} {"train_loss": -23.371244430541992, "global_step": 144035, "epoch": 1735} {"train_loss": -23.048412322998047, "global_step": 144036, "epoch": 1735} {"train_loss": -23.170663833618164, "global_step": 144037, "epoch": 1735} {"train_loss": -23.651796340942383, "global_step": 144038, "epoch": 1735} {"train_loss": -23.300586700439453, "global_step": 144039, "epoch": 1735} {"train_loss": -23.382038116455078, "global_step": 144040, "epoch": 1735} {"train_loss": -23.282466888427734, "global_step": 144041, "epoch": 1735} {"train_loss": -23.075971603393555, "global_step": 144042, "epoch": 1735} {"train_loss": -23.121938705444336, "global_step": 144043, "epoch": 1735} {"train_loss": -22.969831466674805, "global_step": 144044, "epoch": 1735} {"train_loss": -23.038259506225586, "global_step": 144045, "epoch": 1735} {"train_loss": -23.435216903686523, "global_step": 144046, "epoch": 1735} {"train_loss": -23.43852424621582, "global_step": 144047, "epoch": 1735} {"train_loss": -23.1363525390625, "global_step": 144048, "epoch": 1735} {"train_loss": -23.319095611572266, "global_step": 144049, "epoch": 1735} {"train_loss": -23.254270553588867, "global_step": 144050, "epoch": 1735} {"train_loss": -22.699989318847656, "global_step": 144051, "epoch": 1735} {"train_loss": -23.18788719177246, "global_step": 144052, "epoch": 1735} {"train_loss": -23.59610366821289, "global_step": 144053, "epoch": 1735} {"train_loss": -23.164478302001953, "global_step": 144054, "epoch": 1735} {"train_loss": -23.154727935791016, "global_step": 144055, "epoch": 1735} {"train_loss": -23.170490264892578, "global_step": 144056, "epoch": 1735} {"train_loss": -23.247520446777344, "global_step": 144057, "epoch": 1735} {"train_loss": -23.475156784057617, "global_step": 144058, "epoch": 1735} {"train_loss": -23.273656845092773, "global_step": 144059, "epoch": 1735} {"train_loss": -22.940080642700195, "global_step": 144060, "epoch": 1735} {"train_loss": -23.52004051208496, "global_step": 144061, "epoch": 1735} {"train_loss": -23.2536563873291, "global_step": 144062, "epoch": 1735} {"train_loss": -23.15315055847168, "global_step": 144063, "epoch": 1735} {"train_loss": -22.9239444732666, "global_step": 144064, "epoch": 1735} {"train_loss": -23.2722225189209, "global_step": 144065, "epoch": 1735} {"train_loss": -23.2376708984375, "global_step": 144066, "epoch": 1735} {"train_loss": -22.9751033782959, "global_step": 144067, "epoch": 1735} {"train_loss": -23.34801483154297, "global_step": 144068, "epoch": 1735} {"train_loss": -22.81610107421875, "global_step": 144069, "epoch": 1735} {"train_loss": -23.04909324645996, "global_step": 144070, "epoch": 1735} {"train_loss": -23.476425170898438, "global_step": 144071, "epoch": 1735} {"train_loss": -23.487186431884766, "global_step": 144072, "epoch": 1735} {"train_loss": -23.28885269165039, "global_step": 144073, "epoch": 1735} {"train_loss": -22.980154037475586, "global_step": 144074, "epoch": 1735} {"train_loss": -23.668075561523438, "global_step": 144075, "epoch": 1735} {"train_loss": -23.209306716918945, "global_step": 144076, "epoch": 1735} {"train_loss": -23.07366943359375, "global_step": 144077, "epoch": 1735} {"train_loss": -23.418201446533203, "global_step": 144078, "epoch": 1735} {"train_loss": -23.072656631469727, "global_step": 144079, "epoch": 1735} {"train_loss": -23.371768951416016, "global_step": 144080, "epoch": 1735} {"train_loss": -23.330358505249023, "global_step": 144081, "epoch": 1735} {"train_loss": -23.187702178955078, "global_step": 144082, "epoch": 1735} {"train_loss": -23.202848434448242, "global_step": 144083, "epoch": 1735} {"train_loss": -22.646970748901367, "global_step": 144084, "epoch": 1735} {"train_loss": -23.188512802124023, "global_step": 144085, "epoch": 1735} {"train_loss": -22.97797966003418, "global_step": 144086, "epoch": 1735} {"train_loss": -23.103253697774495, "global_step": 144087, "epoch": 1735, "val_loss": 6301943.0} {"train_loss": -22.51043128967285, "global_step": 144088, "epoch": 1736} {"train_loss": -22.466968536376953, "global_step": 144089, "epoch": 1736} {"train_loss": -22.678882598876953, "global_step": 144090, "epoch": 1736} {"train_loss": -22.630542755126953, "global_step": 144091, "epoch": 1736} {"train_loss": -22.97128677368164, "global_step": 144092, "epoch": 1736} {"train_loss": -22.686805725097656, "global_step": 144093, "epoch": 1736} {"train_loss": -22.88405418395996, "global_step": 144094, "epoch": 1736} {"train_loss": -22.900510787963867, "global_step": 144095, "epoch": 1736} {"train_loss": -22.661954879760742, "global_step": 144096, "epoch": 1736} {"train_loss": -22.357118606567383, "global_step": 144097, "epoch": 1736} {"train_loss": -23.07355308532715, "global_step": 144098, "epoch": 1736} {"train_loss": -23.05661964416504, "global_step": 144099, "epoch": 1736} {"train_loss": -22.887725830078125, "global_step": 144100, "epoch": 1736} {"train_loss": -22.768827438354492, "global_step": 144101, "epoch": 1736} {"train_loss": -23.113201141357422, "global_step": 144102, "epoch": 1736} {"train_loss": -22.975784301757812, "global_step": 144103, "epoch": 1736} {"train_loss": -22.982437133789062, "global_step": 144104, "epoch": 1736} {"train_loss": -23.0163631439209, "global_step": 144105, "epoch": 1736} {"train_loss": -23.07318878173828, "global_step": 144106, "epoch": 1736} {"train_loss": -22.665246963500977, "global_step": 144107, "epoch": 1736} {"train_loss": -22.944005966186523, "global_step": 144108, "epoch": 1736} {"train_loss": -23.119916915893555, "global_step": 144109, "epoch": 1736} {"train_loss": -22.999216079711914, "global_step": 144110, "epoch": 1736} {"train_loss": -23.30470085144043, "global_step": 144111, "epoch": 1736} {"train_loss": -23.221759796142578, "global_step": 144112, "epoch": 1736} {"train_loss": -23.380603790283203, "global_step": 144113, "epoch": 1736} {"train_loss": -22.952808380126953, "global_step": 144114, "epoch": 1736} {"train_loss": -22.736141204833984, "global_step": 144115, "epoch": 1736} {"train_loss": -23.09345054626465, "global_step": 144116, "epoch": 1736} {"train_loss": -23.39322280883789, "global_step": 144117, "epoch": 1736} {"train_loss": -23.162933349609375, "global_step": 144118, "epoch": 1736} {"train_loss": -23.163101196289062, "global_step": 144119, "epoch": 1736} {"train_loss": -23.559965133666992, "global_step": 144120, "epoch": 1736} {"train_loss": -23.262067794799805, "global_step": 144121, "epoch": 1736} {"train_loss": -23.08277702331543, "global_step": 144122, "epoch": 1736} {"train_loss": -23.1492919921875, "global_step": 144123, "epoch": 1736} {"train_loss": -23.016223907470703, "global_step": 144124, "epoch": 1736} {"train_loss": -22.961536407470703, "global_step": 144125, "epoch": 1736} {"train_loss": -23.172780990600586, "global_step": 144126, "epoch": 1736} {"train_loss": -22.904699325561523, "global_step": 144127, "epoch": 1736} {"train_loss": -23.3154354095459, "global_step": 144128, "epoch": 1736} {"train_loss": -23.093233108520508, "global_step": 144129, "epoch": 1736} {"train_loss": -22.802310943603516, "global_step": 144130, "epoch": 1736} {"train_loss": -23.26639175415039, "global_step": 144131, "epoch": 1736} {"train_loss": -22.921131134033203, "global_step": 144132, "epoch": 1736} {"train_loss": -22.96497917175293, "global_step": 144133, "epoch": 1736} {"train_loss": -23.265100479125977, "global_step": 144134, "epoch": 1736} {"train_loss": -23.141815185546875, "global_step": 144135, "epoch": 1736} {"train_loss": -23.3715763092041, "global_step": 144136, "epoch": 1736} {"train_loss": -23.138044357299805, "global_step": 144137, "epoch": 1736} {"train_loss": -23.462392807006836, "global_step": 144138, "epoch": 1736} {"train_loss": -23.26423454284668, "global_step": 144139, "epoch": 1736} {"train_loss": -22.910438537597656, "global_step": 144140, "epoch": 1736} {"train_loss": -23.213836669921875, "global_step": 144141, "epoch": 1736} {"train_loss": -22.992477416992188, "global_step": 144142, "epoch": 1736} {"train_loss": -23.133283615112305, "global_step": 144143, "epoch": 1736} {"train_loss": -23.247682571411133, "global_step": 144144, "epoch": 1736} {"train_loss": -23.361356735229492, "global_step": 144145, "epoch": 1736} {"train_loss": -22.85662841796875, "global_step": 144146, "epoch": 1736} {"train_loss": -23.153554916381836, "global_step": 144147, "epoch": 1736} {"train_loss": -23.194303512573242, "global_step": 144148, "epoch": 1736} {"train_loss": -23.41232681274414, "global_step": 144149, "epoch": 1736} {"train_loss": -23.25798988342285, "global_step": 144150, "epoch": 1736} {"train_loss": -23.18441390991211, "global_step": 144151, "epoch": 1736} {"train_loss": -23.154504776000977, "global_step": 144152, "epoch": 1736} {"train_loss": -22.81471061706543, "global_step": 144153, "epoch": 1736} {"train_loss": -23.23550796508789, "global_step": 144154, "epoch": 1736} {"train_loss": -23.27894401550293, "global_step": 144155, "epoch": 1736} {"train_loss": -23.163488388061523, "global_step": 144156, "epoch": 1736} {"train_loss": -23.25288963317871, "global_step": 144157, "epoch": 1736} {"train_loss": -23.178327560424805, "global_step": 144158, "epoch": 1736} {"train_loss": -23.144378662109375, "global_step": 144159, "epoch": 1736} {"train_loss": -23.350635528564453, "global_step": 144160, "epoch": 1736} {"train_loss": -22.95717430114746, "global_step": 144161, "epoch": 1736} {"train_loss": -23.270980834960938, "global_step": 144162, "epoch": 1736} {"train_loss": -23.199920654296875, "global_step": 144163, "epoch": 1736} {"train_loss": -23.28462791442871, "global_step": 144164, "epoch": 1736} {"train_loss": -23.40485954284668, "global_step": 144165, "epoch": 1736} {"train_loss": -23.5071964263916, "global_step": 144166, "epoch": 1736} {"train_loss": -23.28388214111328, "global_step": 144167, "epoch": 1736} {"train_loss": -23.447851181030273, "global_step": 144168, "epoch": 1736} {"train_loss": -23.073848724365234, "global_step": 144169, "epoch": 1736} {"train_loss": -23.08178522500647, "global_step": 144170, "epoch": 1736, "val_loss": 6383226.5} {"train_loss": -22.29484748840332, "global_step": 144171, "epoch": 1737} {"train_loss": -22.673471450805664, "global_step": 144172, "epoch": 1737} {"train_loss": -22.607763290405273, "global_step": 144173, "epoch": 1737} {"train_loss": -22.911977767944336, "global_step": 144174, "epoch": 1737} {"train_loss": -22.516605377197266, "global_step": 144175, "epoch": 1737} {"train_loss": -22.9444522857666, "global_step": 144176, "epoch": 1737} {"train_loss": -22.73040199279785, "global_step": 144177, "epoch": 1737} {"train_loss": -22.617273330688477, "global_step": 144178, "epoch": 1737} {"train_loss": -22.949220657348633, "global_step": 144179, "epoch": 1737} {"train_loss": -23.09038543701172, "global_step": 144180, "epoch": 1737} {"train_loss": -22.88062286376953, "global_step": 144181, "epoch": 1737} {"train_loss": -23.088903427124023, "global_step": 144182, "epoch": 1737} {"train_loss": -22.762826919555664, "global_step": 144183, "epoch": 1737} {"train_loss": -22.8751277923584, "global_step": 144184, "epoch": 1737} {"train_loss": -22.882740020751953, "global_step": 144185, "epoch": 1737} {"train_loss": -23.17728614807129, "global_step": 144186, "epoch": 1737} {"train_loss": -22.959318161010742, "global_step": 144187, "epoch": 1737} {"train_loss": -22.969053268432617, "global_step": 144188, "epoch": 1737} {"train_loss": -22.759870529174805, "global_step": 144189, "epoch": 1737} {"train_loss": -23.142162322998047, "global_step": 144190, "epoch": 1737} {"train_loss": -23.13007164001465, "global_step": 144191, "epoch": 1737} {"train_loss": -23.047128677368164, "global_step": 144192, "epoch": 1737} {"train_loss": -23.322221755981445, "global_step": 144193, "epoch": 1737} {"train_loss": -23.125476837158203, "global_step": 144194, "epoch": 1737} {"train_loss": -23.052688598632812, "global_step": 144195, "epoch": 1737} {"train_loss": -23.168622970581055, "global_step": 144196, "epoch": 1737} {"train_loss": -23.357742309570312, "global_step": 144197, "epoch": 1737} {"train_loss": -23.256921768188477, "global_step": 144198, "epoch": 1737} {"train_loss": -23.268421173095703, "global_step": 144199, "epoch": 1737} {"train_loss": -23.260406494140625, "global_step": 144200, "epoch": 1737} {"train_loss": -23.29435157775879, "global_step": 144201, "epoch": 1737} {"train_loss": -22.969377517700195, "global_step": 144202, "epoch": 1737} {"train_loss": -22.741662979125977, "global_step": 144203, "epoch": 1737} {"train_loss": -23.262977600097656, "global_step": 144204, "epoch": 1737} {"train_loss": -23.009735107421875, "global_step": 144205, "epoch": 1737} {"train_loss": -22.906152725219727, "global_step": 144206, "epoch": 1737} {"train_loss": -23.033437728881836, "global_step": 144207, "epoch": 1737} {"train_loss": -23.350122451782227, "global_step": 144208, "epoch": 1737} {"train_loss": -23.189332962036133, "global_step": 144209, "epoch": 1737} {"train_loss": -23.005704879760742, "global_step": 144210, "epoch": 1737} {"train_loss": -23.5372371673584, "global_step": 144211, "epoch": 1737} {"train_loss": -23.161178588867188, "global_step": 144212, "epoch": 1737} {"train_loss": -23.13057518005371, "global_step": 144213, "epoch": 1737} {"train_loss": -23.283246994018555, "global_step": 144214, "epoch": 1737} {"train_loss": -23.03218650817871, "global_step": 144215, "epoch": 1737} {"train_loss": -22.935165405273438, "global_step": 144216, "epoch": 1737} {"train_loss": -23.184993743896484, "global_step": 144217, "epoch": 1737} {"train_loss": -23.18511390686035, "global_step": 144218, "epoch": 1737} {"train_loss": -23.208816528320312, "global_step": 144219, "epoch": 1737} {"train_loss": -22.993213653564453, "global_step": 144220, "epoch": 1737} {"train_loss": -23.296829223632812, "global_step": 144221, "epoch": 1737} {"train_loss": -23.044797897338867, "global_step": 144222, "epoch": 1737} {"train_loss": -23.110349655151367, "global_step": 144223, "epoch": 1737} {"train_loss": -23.135583877563477, "global_step": 144224, "epoch": 1737} {"train_loss": -23.450021743774414, "global_step": 144225, "epoch": 1737} {"train_loss": -22.928464889526367, "global_step": 144226, "epoch": 1737} {"train_loss": -22.997581481933594, "global_step": 144227, "epoch": 1737} {"train_loss": -23.160633087158203, "global_step": 144228, "epoch": 1737} {"train_loss": -23.12915802001953, "global_step": 144229, "epoch": 1737} {"train_loss": -22.88336944580078, "global_step": 144230, "epoch": 1737} {"train_loss": -23.565261840820312, "global_step": 144231, "epoch": 1737} {"train_loss": -23.151395797729492, "global_step": 144232, "epoch": 1737} {"train_loss": -23.59537696838379, "global_step": 144233, "epoch": 1737} {"train_loss": -23.435285568237305, "global_step": 144234, "epoch": 1737} {"train_loss": -23.090890884399414, "global_step": 144235, "epoch": 1737} {"train_loss": -23.025602340698242, "global_step": 144236, "epoch": 1737} {"train_loss": -23.360450744628906, "global_step": 144237, "epoch": 1737} {"train_loss": -23.198881149291992, "global_step": 144238, "epoch": 1737} {"train_loss": -23.01299476623535, "global_step": 144239, "epoch": 1737} {"train_loss": -23.323226928710938, "global_step": 144240, "epoch": 1737} {"train_loss": -22.93174171447754, "global_step": 144241, "epoch": 1737} {"train_loss": -23.049121856689453, "global_step": 144242, "epoch": 1737} {"train_loss": -22.932416915893555, "global_step": 144243, "epoch": 1737} {"train_loss": -23.12213706970215, "global_step": 144244, "epoch": 1737} {"train_loss": -22.97801971435547, "global_step": 144245, "epoch": 1737} {"train_loss": -23.23155403137207, "global_step": 144246, "epoch": 1737} {"train_loss": -22.5557804107666, "global_step": 144247, "epoch": 1737} {"train_loss": -22.91291618347168, "global_step": 144248, "epoch": 1737} {"train_loss": -23.119338989257812, "global_step": 144249, "epoch": 1737} {"train_loss": -23.375581741333008, "global_step": 144250, "epoch": 1737} {"train_loss": -23.162336349487305, "global_step": 144251, "epoch": 1737} {"train_loss": -23.435522079467773, "global_step": 144252, "epoch": 1737} {"train_loss": -23.077547326145403, "global_step": 144253, "epoch": 1737, "val_loss": 6374055.0} {"train_loss": -23.04673957824707, "global_step": 144254, "epoch": 1738} {"train_loss": -22.9364070892334, "global_step": 144255, "epoch": 1738} {"train_loss": -23.03090476989746, "global_step": 144256, "epoch": 1738} {"train_loss": -22.8839054107666, "global_step": 144257, "epoch": 1738} {"train_loss": -23.01438331604004, "global_step": 144258, "epoch": 1738} {"train_loss": -23.084747314453125, "global_step": 144259, "epoch": 1738} {"train_loss": -22.869709014892578, "global_step": 144260, "epoch": 1738} {"train_loss": -22.93116569519043, "global_step": 144261, "epoch": 1738} {"train_loss": -23.168302536010742, "global_step": 144262, "epoch": 1738} {"train_loss": -23.00535774230957, "global_step": 144263, "epoch": 1738} {"train_loss": -23.3553466796875, "global_step": 144264, "epoch": 1738} {"train_loss": -23.306255340576172, "global_step": 144265, "epoch": 1738} {"train_loss": -23.10263442993164, "global_step": 144266, "epoch": 1738} {"train_loss": -23.388517379760742, "global_step": 144267, "epoch": 1738} {"train_loss": -22.98893165588379, "global_step": 144268, "epoch": 1738} {"train_loss": -23.162073135375977, "global_step": 144269, "epoch": 1738} {"train_loss": -23.123334884643555, "global_step": 144270, "epoch": 1738} {"train_loss": -22.991710662841797, "global_step": 144271, "epoch": 1738} {"train_loss": -23.284894943237305, "global_step": 144272, "epoch": 1738} {"train_loss": -23.16301918029785, "global_step": 144273, "epoch": 1738} {"train_loss": -23.45301628112793, "global_step": 144274, "epoch": 1738} {"train_loss": -23.457672119140625, "global_step": 144275, "epoch": 1738} {"train_loss": -23.0875186920166, "global_step": 144276, "epoch": 1738} {"train_loss": -22.95828628540039, "global_step": 144277, "epoch": 1738} {"train_loss": -22.945894241333008, "global_step": 144278, "epoch": 1738} {"train_loss": -23.242324829101562, "global_step": 144279, "epoch": 1738} {"train_loss": -22.9527530670166, "global_step": 144280, "epoch": 1738} {"train_loss": -23.24322509765625, "global_step": 144281, "epoch": 1738} {"train_loss": -23.285175323486328, "global_step": 144282, "epoch": 1738} {"train_loss": -23.367431640625, "global_step": 144283, "epoch": 1738} {"train_loss": -22.988821029663086, "global_step": 144284, "epoch": 1738} {"train_loss": -23.71147918701172, "global_step": 144285, "epoch": 1738} {"train_loss": -23.26407814025879, "global_step": 144286, "epoch": 1738} {"train_loss": -23.084604263305664, "global_step": 144287, "epoch": 1738} {"train_loss": -23.251577377319336, "global_step": 144288, "epoch": 1738} {"train_loss": -22.77534294128418, "global_step": 144289, "epoch": 1738} {"train_loss": -23.186857223510742, "global_step": 144290, "epoch": 1738} {"train_loss": -23.244592666625977, "global_step": 144291, "epoch": 1738} {"train_loss": -23.205305099487305, "global_step": 144292, "epoch": 1738} {"train_loss": -22.951831817626953, "global_step": 144293, "epoch": 1738} {"train_loss": -23.256986618041992, "global_step": 144294, "epoch": 1738} {"train_loss": -23.566919326782227, "global_step": 144295, "epoch": 1738} {"train_loss": -23.13718032836914, "global_step": 144296, "epoch": 1738} {"train_loss": -23.011804580688477, "global_step": 144297, "epoch": 1738} {"train_loss": -22.842487335205078, "global_step": 144298, "epoch": 1738} {"train_loss": -23.411592483520508, "global_step": 144299, "epoch": 1738} {"train_loss": -23.07248878479004, "global_step": 144300, "epoch": 1738} {"train_loss": -23.10860252380371, "global_step": 144301, "epoch": 1738} {"train_loss": -23.01279640197754, "global_step": 144302, "epoch": 1738} {"train_loss": -23.203027725219727, "global_step": 144303, "epoch": 1738} {"train_loss": -23.050790786743164, "global_step": 144304, "epoch": 1738} {"train_loss": -22.840436935424805, "global_step": 144305, "epoch": 1738} {"train_loss": -22.65707015991211, "global_step": 144306, "epoch": 1738} {"train_loss": -23.15453338623047, "global_step": 144307, "epoch": 1738} {"train_loss": -23.3099422454834, "global_step": 144308, "epoch": 1738} {"train_loss": -23.319272994995117, "global_step": 144309, "epoch": 1738} {"train_loss": -23.012266159057617, "global_step": 144310, "epoch": 1738} {"train_loss": -23.33784294128418, "global_step": 144311, "epoch": 1738} {"train_loss": -22.732099533081055, "global_step": 144312, "epoch": 1738} {"train_loss": -22.884504318237305, "global_step": 144313, "epoch": 1738} {"train_loss": -23.453969955444336, "global_step": 144314, "epoch": 1738} {"train_loss": -23.321584701538086, "global_step": 144315, "epoch": 1738} {"train_loss": -23.028837203979492, "global_step": 144316, "epoch": 1738} {"train_loss": -23.2083740234375, "global_step": 144317, "epoch": 1738} {"train_loss": -23.261526107788086, "global_step": 144318, "epoch": 1738} {"train_loss": -22.790624618530273, "global_step": 144319, "epoch": 1738} {"train_loss": -23.290197372436523, "global_step": 144320, "epoch": 1738} {"train_loss": -23.30103874206543, "global_step": 144321, "epoch": 1738} {"train_loss": -23.041379928588867, "global_step": 144322, "epoch": 1738} {"train_loss": -22.974193572998047, "global_step": 144323, "epoch": 1738} {"train_loss": -23.02093505859375, "global_step": 144324, "epoch": 1738} {"train_loss": -23.105262756347656, "global_step": 144325, "epoch": 1738} {"train_loss": -23.072484970092773, "global_step": 144326, "epoch": 1738} {"train_loss": -23.13324737548828, "global_step": 144327, "epoch": 1738} {"train_loss": -23.52840232849121, "global_step": 144328, "epoch": 1738} {"train_loss": -23.152587890625, "global_step": 144329, "epoch": 1738} {"train_loss": -22.694116592407227, "global_step": 144330, "epoch": 1738} {"train_loss": -23.24239158630371, "global_step": 144331, "epoch": 1738} {"train_loss": -23.467313766479492, "global_step": 144332, "epoch": 1738} {"train_loss": -23.361989974975586, "global_step": 144333, "epoch": 1738} {"train_loss": -22.815673828125, "global_step": 144334, "epoch": 1738} {"train_loss": -23.477092742919922, "global_step": 144335, "epoch": 1738} {"train_loss": -23.12919285785721, "global_step": 144336, "epoch": 1738, "val_loss": 6364220.0} {"train_loss": -22.842065811157227, "global_step": 144337, "epoch": 1739} {"train_loss": -23.162500381469727, "global_step": 144338, "epoch": 1739} {"train_loss": -22.862699508666992, "global_step": 144339, "epoch": 1739} {"train_loss": -22.966571807861328, "global_step": 144340, "epoch": 1739} {"train_loss": -22.86459732055664, "global_step": 144341, "epoch": 1739} {"train_loss": -22.750961303710938, "global_step": 144342, "epoch": 1739} {"train_loss": -22.716066360473633, "global_step": 144343, "epoch": 1739} {"train_loss": -22.8350887298584, "global_step": 144344, "epoch": 1739} {"train_loss": -23.045352935791016, "global_step": 144345, "epoch": 1739} {"train_loss": -23.35133171081543, "global_step": 144346, "epoch": 1739} {"train_loss": -23.250858306884766, "global_step": 144347, "epoch": 1739} {"train_loss": -23.125511169433594, "global_step": 144348, "epoch": 1739} {"train_loss": -23.059934616088867, "global_step": 144349, "epoch": 1739} {"train_loss": -22.98427963256836, "global_step": 144350, "epoch": 1739} {"train_loss": -23.02661895751953, "global_step": 144351, "epoch": 1739} {"train_loss": -23.130504608154297, "global_step": 144352, "epoch": 1739} {"train_loss": -23.258331298828125, "global_step": 144353, "epoch": 1739} {"train_loss": -22.892017364501953, "global_step": 144354, "epoch": 1739} {"train_loss": -22.755142211914062, "global_step": 144355, "epoch": 1739} {"train_loss": -23.342588424682617, "global_step": 144356, "epoch": 1739} {"train_loss": -23.05710792541504, "global_step": 144357, "epoch": 1739} {"train_loss": -23.192655563354492, "global_step": 144358, "epoch": 1739} {"train_loss": -23.30770492553711, "global_step": 144359, "epoch": 1739} {"train_loss": -23.16179084777832, "global_step": 144360, "epoch": 1739} {"train_loss": -23.0611572265625, "global_step": 144361, "epoch": 1739} {"train_loss": -23.59799575805664, "global_step": 144362, "epoch": 1739} {"train_loss": -23.370676040649414, "global_step": 144363, "epoch": 1739} {"train_loss": -23.58820915222168, "global_step": 144364, "epoch": 1739} {"train_loss": -23.290857315063477, "global_step": 144365, "epoch": 1739} {"train_loss": -23.190383911132812, "global_step": 144366, "epoch": 1739} {"train_loss": -23.189634323120117, "global_step": 144367, "epoch": 1739} {"train_loss": -23.22027587890625, "global_step": 144368, "epoch": 1739} {"train_loss": -23.17461585998535, "global_step": 144369, "epoch": 1739} {"train_loss": -23.162899017333984, "global_step": 144370, "epoch": 1739} {"train_loss": -23.5638484954834, "global_step": 144371, "epoch": 1739} {"train_loss": -23.20981788635254, "global_step": 144372, "epoch": 1739} {"train_loss": -23.214109420776367, "global_step": 144373, "epoch": 1739} {"train_loss": -23.3016357421875, "global_step": 144374, "epoch": 1739} {"train_loss": -23.29363441467285, "global_step": 144375, "epoch": 1739} {"train_loss": -23.280439376831055, "global_step": 144376, "epoch": 1739} {"train_loss": -22.97364616394043, "global_step": 144377, "epoch": 1739} {"train_loss": -22.95319938659668, "global_step": 144378, "epoch": 1739} {"train_loss": -22.964082717895508, "global_step": 144379, "epoch": 1739} {"train_loss": -23.311513900756836, "global_step": 144380, "epoch": 1739} {"train_loss": -22.978769302368164, "global_step": 144381, "epoch": 1739} {"train_loss": -23.303974151611328, "global_step": 144382, "epoch": 1739} {"train_loss": -23.366535186767578, "global_step": 144383, "epoch": 1739} {"train_loss": -23.30221176147461, "global_step": 144384, "epoch": 1739} {"train_loss": -23.67386817932129, "global_step": 144385, "epoch": 1739} {"train_loss": -23.34243392944336, "global_step": 144386, "epoch": 1739} {"train_loss": -22.885290145874023, "global_step": 144387, "epoch": 1739} {"train_loss": -22.81389808654785, "global_step": 144388, "epoch": 1739} {"train_loss": -23.216461181640625, "global_step": 144389, "epoch": 1739} {"train_loss": -23.208580017089844, "global_step": 144390, "epoch": 1739} {"train_loss": -22.935646057128906, "global_step": 144391, "epoch": 1739} {"train_loss": -23.179763793945312, "global_step": 144392, "epoch": 1739} {"train_loss": -22.993690490722656, "global_step": 144393, "epoch": 1739} {"train_loss": -23.12769889831543, "global_step": 144394, "epoch": 1739} {"train_loss": -23.177974700927734, "global_step": 144395, "epoch": 1739} {"train_loss": -23.48875617980957, "global_step": 144396, "epoch": 1739} {"train_loss": -22.914350509643555, "global_step": 144397, "epoch": 1739} {"train_loss": -23.14044189453125, "global_step": 144398, "epoch": 1739} {"train_loss": -22.97344970703125, "global_step": 144399, "epoch": 1739} {"train_loss": -23.389455795288086, "global_step": 144400, "epoch": 1739} {"train_loss": -23.028837203979492, "global_step": 144401, "epoch": 1739} {"train_loss": -22.936288833618164, "global_step": 144402, "epoch": 1739} {"train_loss": -23.149166107177734, "global_step": 144403, "epoch": 1739} {"train_loss": -23.22230339050293, "global_step": 144404, "epoch": 1739} {"train_loss": -23.15523338317871, "global_step": 144405, "epoch": 1739} {"train_loss": -23.403242111206055, "global_step": 144406, "epoch": 1739} {"train_loss": -23.0036563873291, "global_step": 144407, "epoch": 1739} {"train_loss": -23.04231071472168, "global_step": 144408, "epoch": 1739} {"train_loss": -23.360815048217773, "global_step": 144409, "epoch": 1739} {"train_loss": -23.19922637939453, "global_step": 144410, "epoch": 1739} {"train_loss": -22.961246490478516, "global_step": 144411, "epoch": 1739} {"train_loss": -23.094282150268555, "global_step": 144412, "epoch": 1739} {"train_loss": -23.12794303894043, "global_step": 144413, "epoch": 1739} {"train_loss": -23.14443588256836, "global_step": 144414, "epoch": 1739} {"train_loss": -23.041746139526367, "global_step": 144415, "epoch": 1739} {"train_loss": -23.322662353515625, "global_step": 144416, "epoch": 1739} {"train_loss": -23.475629806518555, "global_step": 144417, "epoch": 1739} {"train_loss": -23.361618041992188, "global_step": 144418, "epoch": 1739} {"train_loss": -23.15164193762354, "global_step": 144419, "epoch": 1739, "val_loss": 6379242.0} {"train_loss": -22.483057022094727, "global_step": 144420, "epoch": 1740} {"train_loss": -20.711088180541992, "global_step": 144421, "epoch": 1740} {"train_loss": -21.66257095336914, "global_step": 144422, "epoch": 1740} {"train_loss": -22.797163009643555, "global_step": 144423, "epoch": 1740} {"train_loss": -22.381465911865234, "global_step": 144424, "epoch": 1740} {"train_loss": -21.817245483398438, "global_step": 144425, "epoch": 1740} {"train_loss": -22.783466339111328, "global_step": 144426, "epoch": 1740} {"train_loss": -22.197011947631836, "global_step": 144427, "epoch": 1740} {"train_loss": -22.762216567993164, "global_step": 144428, "epoch": 1740} {"train_loss": -21.819446563720703, "global_step": 144429, "epoch": 1740} {"train_loss": -22.540952682495117, "global_step": 144430, "epoch": 1740} {"train_loss": -22.219865798950195, "global_step": 144431, "epoch": 1740} {"train_loss": -22.46076774597168, "global_step": 144432, "epoch": 1740} {"train_loss": -22.685626983642578, "global_step": 144433, "epoch": 1740} {"train_loss": -22.793928146362305, "global_step": 144434, "epoch": 1740} {"train_loss": -22.585012435913086, "global_step": 144435, "epoch": 1740} {"train_loss": -22.19002914428711, "global_step": 144436, "epoch": 1740} {"train_loss": -22.52808952331543, "global_step": 144437, "epoch": 1740} {"train_loss": -22.967939376831055, "global_step": 144438, "epoch": 1740} {"train_loss": -22.475107192993164, "global_step": 144439, "epoch": 1740} {"train_loss": -22.569656372070312, "global_step": 144440, "epoch": 1740} {"train_loss": -22.835407257080078, "global_step": 144441, "epoch": 1740} {"train_loss": -22.834125518798828, "global_step": 144442, "epoch": 1740} {"train_loss": -22.77720069885254, "global_step": 144443, "epoch": 1740} {"train_loss": -22.785953521728516, "global_step": 144444, "epoch": 1740} {"train_loss": -22.988677978515625, "global_step": 144445, "epoch": 1740} {"train_loss": -22.85027503967285, "global_step": 144446, "epoch": 1740} {"train_loss": -22.82172203063965, "global_step": 144447, "epoch": 1740} {"train_loss": -23.04926872253418, "global_step": 144448, "epoch": 1740} {"train_loss": -22.992765426635742, "global_step": 144449, "epoch": 1740} {"train_loss": -23.168413162231445, "global_step": 144450, "epoch": 1740} {"train_loss": -22.620471954345703, "global_step": 144451, "epoch": 1740} {"train_loss": -23.082489013671875, "global_step": 144452, "epoch": 1740} {"train_loss": -23.08903694152832, "global_step": 144453, "epoch": 1740} {"train_loss": -22.891000747680664, "global_step": 144454, "epoch": 1740} {"train_loss": -22.943410873413086, "global_step": 144455, "epoch": 1740} {"train_loss": -23.020597457885742, "global_step": 144456, "epoch": 1740} {"train_loss": -23.130680084228516, "global_step": 144457, "epoch": 1740} {"train_loss": -22.94221305847168, "global_step": 144458, "epoch": 1740} {"train_loss": -23.140806198120117, "global_step": 144459, "epoch": 1740} {"train_loss": -22.918378829956055, "global_step": 144460, "epoch": 1740} {"train_loss": -23.38983917236328, "global_step": 144461, "epoch": 1740} {"train_loss": -23.355731964111328, "global_step": 144462, "epoch": 1740} {"train_loss": -23.029760360717773, "global_step": 144463, "epoch": 1740} {"train_loss": -23.4200382232666, "global_step": 144464, "epoch": 1740} {"train_loss": -22.989883422851562, "global_step": 144465, "epoch": 1740} {"train_loss": -23.445215225219727, "global_step": 144466, "epoch": 1740} {"train_loss": -23.1329402923584, "global_step": 144467, "epoch": 1740} {"train_loss": -23.144968032836914, "global_step": 144468, "epoch": 1740} {"train_loss": -23.471635818481445, "global_step": 144469, "epoch": 1740} {"train_loss": -23.122100830078125, "global_step": 144470, "epoch": 1740} {"train_loss": -22.934492111206055, "global_step": 144471, "epoch": 1740} {"train_loss": -22.896697998046875, "global_step": 144472, "epoch": 1740} {"train_loss": -23.295690536499023, "global_step": 144473, "epoch": 1740} {"train_loss": -23.514225006103516, "global_step": 144474, "epoch": 1740} {"train_loss": -23.221731185913086, "global_step": 144475, "epoch": 1740} {"train_loss": -23.108463287353516, "global_step": 144476, "epoch": 1740} {"train_loss": -23.346189498901367, "global_step": 144477, "epoch": 1740} {"train_loss": -23.17609977722168, "global_step": 144478, "epoch": 1740} {"train_loss": -22.96868324279785, "global_step": 144479, "epoch": 1740} {"train_loss": -23.613407135009766, "global_step": 144480, "epoch": 1740} {"train_loss": -23.255977630615234, "global_step": 144481, "epoch": 1740} {"train_loss": -23.089529037475586, "global_step": 144482, "epoch": 1740} {"train_loss": -23.142723083496094, "global_step": 144483, "epoch": 1740} {"train_loss": -23.199674606323242, "global_step": 144484, "epoch": 1740} {"train_loss": -23.18119239807129, "global_step": 144485, "epoch": 1740} {"train_loss": -23.094680786132812, "global_step": 144486, "epoch": 1740} {"train_loss": -23.219263076782227, "global_step": 144487, "epoch": 1740} {"train_loss": -22.94302749633789, "global_step": 144488, "epoch": 1740} {"train_loss": -23.237951278686523, "global_step": 144489, "epoch": 1740} {"train_loss": -22.9702205657959, "global_step": 144490, "epoch": 1740} {"train_loss": -23.145933151245117, "global_step": 144491, "epoch": 1740} {"train_loss": -22.746816635131836, "global_step": 144492, "epoch": 1740} {"train_loss": -22.714365005493164, "global_step": 144493, "epoch": 1740} {"train_loss": -23.11910057067871, "global_step": 144494, "epoch": 1740} {"train_loss": -23.29507827758789, "global_step": 144495, "epoch": 1740} {"train_loss": -23.189727783203125, "global_step": 144496, "epoch": 1740} {"train_loss": -23.203237533569336, "global_step": 144497, "epoch": 1740} {"train_loss": -22.948131561279297, "global_step": 144498, "epoch": 1740} {"train_loss": -23.313865661621094, "global_step": 144499, "epoch": 1740} {"train_loss": -23.297653198242188, "global_step": 144500, "epoch": 1740} {"train_loss": -23.294858932495117, "global_step": 144501, "epoch": 1740} {"train_loss": -22.910737370870198, "global_step": 144502, "epoch": 1740, "val_loss": 6225100.0} {"train_loss": -21.947856903076172, "global_step": 144503, "epoch": 1741} {"train_loss": -22.476736068725586, "global_step": 144504, "epoch": 1741} {"train_loss": -22.478769302368164, "global_step": 144505, "epoch": 1741} {"train_loss": -22.324514389038086, "global_step": 144506, "epoch": 1741} {"train_loss": -22.49888038635254, "global_step": 144507, "epoch": 1741} {"train_loss": -22.358600616455078, "global_step": 144508, "epoch": 1741} {"train_loss": -23.09144401550293, "global_step": 144509, "epoch": 1741} {"train_loss": -22.812000274658203, "global_step": 144510, "epoch": 1741} {"train_loss": -22.720947265625, "global_step": 144511, "epoch": 1741} {"train_loss": -22.45478630065918, "global_step": 144512, "epoch": 1741} {"train_loss": -23.038084030151367, "global_step": 144513, "epoch": 1741} {"train_loss": -22.671911239624023, "global_step": 144514, "epoch": 1741} {"train_loss": -22.836116790771484, "global_step": 144515, "epoch": 1741} {"train_loss": -22.788190841674805, "global_step": 144516, "epoch": 1741} {"train_loss": -22.711172103881836, "global_step": 144517, "epoch": 1741} {"train_loss": -23.0537109375, "global_step": 144518, "epoch": 1741} {"train_loss": -22.73833656311035, "global_step": 144519, "epoch": 1741} {"train_loss": -22.67241096496582, "global_step": 144520, "epoch": 1741} {"train_loss": -23.00264549255371, "global_step": 144521, "epoch": 1741} {"train_loss": -22.98246192932129, "global_step": 144522, "epoch": 1741} {"train_loss": -23.164749145507812, "global_step": 144523, "epoch": 1741} {"train_loss": -23.122215270996094, "global_step": 144524, "epoch": 1741} {"train_loss": -22.90964698791504, "global_step": 144525, "epoch": 1741} {"train_loss": -23.15278434753418, "global_step": 144526, "epoch": 1741} {"train_loss": -23.22120475769043, "global_step": 144527, "epoch": 1741} {"train_loss": -23.221214294433594, "global_step": 144528, "epoch": 1741} {"train_loss": -23.25356101989746, "global_step": 144529, "epoch": 1741} {"train_loss": -23.422712326049805, "global_step": 144530, "epoch": 1741} {"train_loss": -22.9837646484375, "global_step": 144531, "epoch": 1741} {"train_loss": -23.14503288269043, "global_step": 144532, "epoch": 1741} {"train_loss": -23.194231033325195, "global_step": 144533, "epoch": 1741} {"train_loss": -23.054738998413086, "global_step": 144534, "epoch": 1741} {"train_loss": -23.09804344177246, "global_step": 144535, "epoch": 1741} {"train_loss": -23.3647518157959, "global_step": 144536, "epoch": 1741} {"train_loss": -23.14613151550293, "global_step": 144537, "epoch": 1741} {"train_loss": -23.150585174560547, "global_step": 144538, "epoch": 1741} {"train_loss": -23.27057456970215, "global_step": 144539, "epoch": 1741} {"train_loss": -23.1674747467041, "global_step": 144540, "epoch": 1741} {"train_loss": -23.34689712524414, "global_step": 144541, "epoch": 1741} {"train_loss": -23.219457626342773, "global_step": 144542, "epoch": 1741} {"train_loss": -23.292089462280273, "global_step": 144543, "epoch": 1741} {"train_loss": -23.31781578063965, "global_step": 144544, "epoch": 1741} {"train_loss": -22.84917640686035, "global_step": 144545, "epoch": 1741} {"train_loss": -22.90717315673828, "global_step": 144546, "epoch": 1741} {"train_loss": -23.33835792541504, "global_step": 144547, "epoch": 1741} {"train_loss": -22.89251708984375, "global_step": 144548, "epoch": 1741} {"train_loss": -23.10797882080078, "global_step": 144549, "epoch": 1741} {"train_loss": -23.159391403198242, "global_step": 144550, "epoch": 1741} {"train_loss": -22.95138168334961, "global_step": 144551, "epoch": 1741} {"train_loss": -23.2197322845459, "global_step": 144552, "epoch": 1741} {"train_loss": -23.24932289123535, "global_step": 144553, "epoch": 1741} {"train_loss": -23.491228103637695, "global_step": 144554, "epoch": 1741} {"train_loss": -23.156492233276367, "global_step": 144555, "epoch": 1741} {"train_loss": -23.241533279418945, "global_step": 144556, "epoch": 1741} {"train_loss": -22.886409759521484, "global_step": 144557, "epoch": 1741} {"train_loss": -23.392641067504883, "global_step": 144558, "epoch": 1741} {"train_loss": -22.97859001159668, "global_step": 144559, "epoch": 1741} {"train_loss": -23.331451416015625, "global_step": 144560, "epoch": 1741} {"train_loss": -23.284442901611328, "global_step": 144561, "epoch": 1741} {"train_loss": -23.353418350219727, "global_step": 144562, "epoch": 1741} {"train_loss": -23.3904972076416, "global_step": 144563, "epoch": 1741} {"train_loss": -23.2547550201416, "global_step": 144564, "epoch": 1741} {"train_loss": -23.21200180053711, "global_step": 144565, "epoch": 1741} {"train_loss": -22.915674209594727, "global_step": 144566, "epoch": 1741} {"train_loss": -22.718469619750977, "global_step": 144567, "epoch": 1741} {"train_loss": -22.8105525970459, "global_step": 144568, "epoch": 1741} {"train_loss": -22.932281494140625, "global_step": 144569, "epoch": 1741} {"train_loss": -23.012685775756836, "global_step": 144570, "epoch": 1741} {"train_loss": -23.03730583190918, "global_step": 144571, "epoch": 1741} {"train_loss": -23.328327178955078, "global_step": 144572, "epoch": 1741} {"train_loss": -23.01686668395996, "global_step": 144573, "epoch": 1741} {"train_loss": -23.145740509033203, "global_step": 144574, "epoch": 1741} {"train_loss": -23.32282066345215, "global_step": 144575, "epoch": 1741} {"train_loss": -23.16851043701172, "global_step": 144576, "epoch": 1741} {"train_loss": -22.912626266479492, "global_step": 144577, "epoch": 1741} {"train_loss": -23.626264572143555, "global_step": 144578, "epoch": 1741} {"train_loss": -23.346302032470703, "global_step": 144579, "epoch": 1741} {"train_loss": -23.28289222717285, "global_step": 144580, "epoch": 1741} {"train_loss": -23.48818016052246, "global_step": 144581, "epoch": 1741} {"train_loss": -23.485197067260742, "global_step": 144582, "epoch": 1741} {"train_loss": -23.354217529296875, "global_step": 144583, "epoch": 1741} {"train_loss": -23.525171279907227, "global_step": 144584, "epoch": 1741} {"train_loss": -23.063422145613703, "global_step": 144585, "epoch": 1741, "val_loss": 6322430.0} {"train_loss": -22.769760131835938, "global_step": 144586, "epoch": 1742} {"train_loss": -22.42280387878418, "global_step": 144587, "epoch": 1742} {"train_loss": -22.29285430908203, "global_step": 144588, "epoch": 1742} {"train_loss": -22.42782974243164, "global_step": 144589, "epoch": 1742} {"train_loss": -22.959684371948242, "global_step": 144590, "epoch": 1742} {"train_loss": -22.895235061645508, "global_step": 144591, "epoch": 1742} {"train_loss": -22.616104125976562, "global_step": 144592, "epoch": 1742} {"train_loss": -22.875585556030273, "global_step": 144593, "epoch": 1742} {"train_loss": -23.006275177001953, "global_step": 144594, "epoch": 1742} {"train_loss": -22.852388381958008, "global_step": 144595, "epoch": 1742} {"train_loss": -22.902822494506836, "global_step": 144596, "epoch": 1742} {"train_loss": -23.08355140686035, "global_step": 144597, "epoch": 1742} {"train_loss": -23.135316848754883, "global_step": 144598, "epoch": 1742} {"train_loss": -22.825511932373047, "global_step": 144599, "epoch": 1742} {"train_loss": -23.05971336364746, "global_step": 144600, "epoch": 1742} {"train_loss": -22.906185150146484, "global_step": 144601, "epoch": 1742} {"train_loss": -22.885278701782227, "global_step": 144602, "epoch": 1742} {"train_loss": -23.073823928833008, "global_step": 144603, "epoch": 1742} {"train_loss": -22.968534469604492, "global_step": 144604, "epoch": 1742} {"train_loss": -22.96930503845215, "global_step": 144605, "epoch": 1742} {"train_loss": -23.54368782043457, "global_step": 144606, "epoch": 1742} {"train_loss": -23.096237182617188, "global_step": 144607, "epoch": 1742} {"train_loss": -23.312501907348633, "global_step": 144608, "epoch": 1742} {"train_loss": -23.18160057067871, "global_step": 144609, "epoch": 1742} {"train_loss": -22.981903076171875, "global_step": 144610, "epoch": 1742} {"train_loss": -22.782625198364258, "global_step": 144611, "epoch": 1742} {"train_loss": -23.422290802001953, "global_step": 144612, "epoch": 1742} {"train_loss": -22.685449600219727, "global_step": 144613, "epoch": 1742} {"train_loss": -23.005216598510742, "global_step": 144614, "epoch": 1742} {"train_loss": -23.19522476196289, "global_step": 144615, "epoch": 1742} {"train_loss": -23.10386085510254, "global_step": 144616, "epoch": 1742} {"train_loss": -23.181106567382812, "global_step": 144617, "epoch": 1742} {"train_loss": -23.142822265625, "global_step": 144618, "epoch": 1742} {"train_loss": -23.02817153930664, "global_step": 144619, "epoch": 1742} {"train_loss": -22.94407081604004, "global_step": 144620, "epoch": 1742} {"train_loss": -23.003154754638672, "global_step": 144621, "epoch": 1742} {"train_loss": -22.955249786376953, "global_step": 144622, "epoch": 1742} {"train_loss": -23.111377716064453, "global_step": 144623, "epoch": 1742} {"train_loss": -23.025053024291992, "global_step": 144624, "epoch": 1742} {"train_loss": -23.0747127532959, "global_step": 144625, "epoch": 1742} {"train_loss": -23.020187377929688, "global_step": 144626, "epoch": 1742} {"train_loss": -22.832645416259766, "global_step": 144627, "epoch": 1742} {"train_loss": -22.746721267700195, "global_step": 144628, "epoch": 1742} {"train_loss": -23.020288467407227, "global_step": 144629, "epoch": 1742} {"train_loss": -23.089153289794922, "global_step": 144630, "epoch": 1742} {"train_loss": -23.61359977722168, "global_step": 144631, "epoch": 1742} {"train_loss": -22.753894805908203, "global_step": 144632, "epoch": 1742} {"train_loss": -23.163358688354492, "global_step": 144633, "epoch": 1742} {"train_loss": -23.292631149291992, "global_step": 144634, "epoch": 1742} {"train_loss": -23.024057388305664, "global_step": 144635, "epoch": 1742} {"train_loss": -23.229442596435547, "global_step": 144636, "epoch": 1742} {"train_loss": -23.229419708251953, "global_step": 144637, "epoch": 1742} {"train_loss": -23.016931533813477, "global_step": 144638, "epoch": 1742} {"train_loss": -22.7925968170166, "global_step": 144639, "epoch": 1742} {"train_loss": -22.957355499267578, "global_step": 144640, "epoch": 1742} {"train_loss": -23.170734405517578, "global_step": 144641, "epoch": 1742} {"train_loss": -23.515588760375977, "global_step": 144642, "epoch": 1742} {"train_loss": -22.940460205078125, "global_step": 144643, "epoch": 1742} {"train_loss": -22.7341365814209, "global_step": 144644, "epoch": 1742} {"train_loss": -23.5572452545166, "global_step": 144645, "epoch": 1742} {"train_loss": -23.19668197631836, "global_step": 144646, "epoch": 1742} {"train_loss": -23.026403427124023, "global_step": 144647, "epoch": 1742} {"train_loss": -23.121484756469727, "global_step": 144648, "epoch": 1742} {"train_loss": -23.130657196044922, "global_step": 144649, "epoch": 1742} {"train_loss": -22.754514694213867, "global_step": 144650, "epoch": 1742} {"train_loss": -22.80670166015625, "global_step": 144651, "epoch": 1742} {"train_loss": -23.16219139099121, "global_step": 144652, "epoch": 1742} {"train_loss": -23.332183837890625, "global_step": 144653, "epoch": 1742} {"train_loss": -23.11701011657715, "global_step": 144654, "epoch": 1742} {"train_loss": -23.188596725463867, "global_step": 144655, "epoch": 1742} {"train_loss": -23.002283096313477, "global_step": 144656, "epoch": 1742} {"train_loss": -23.241914749145508, "global_step": 144657, "epoch": 1742} {"train_loss": -23.13958740234375, "global_step": 144658, "epoch": 1742} {"train_loss": -23.00794792175293, "global_step": 144659, "epoch": 1742} {"train_loss": -23.159889221191406, "global_step": 144660, "epoch": 1742} {"train_loss": -23.134159088134766, "global_step": 144661, "epoch": 1742} {"train_loss": -23.026294708251953, "global_step": 144662, "epoch": 1742} {"train_loss": -23.076929092407227, "global_step": 144663, "epoch": 1742} {"train_loss": -23.247587203979492, "global_step": 144664, "epoch": 1742} {"train_loss": -23.375905990600586, "global_step": 144665, "epoch": 1742} {"train_loss": -23.17247200012207, "global_step": 144666, "epoch": 1742} {"train_loss": -23.30864143371582, "global_step": 144667, "epoch": 1742} {"train_loss": -23.0466784281903, "global_step": 144668, "epoch": 1742, "val_loss": 6224226.5} {"train_loss": -22.6906795501709, "global_step": 144669, "epoch": 1743} {"train_loss": -22.9013729095459, "global_step": 144670, "epoch": 1743} {"train_loss": -22.600101470947266, "global_step": 144671, "epoch": 1743} {"train_loss": -23.041030883789062, "global_step": 144672, "epoch": 1743} {"train_loss": -22.900638580322266, "global_step": 144673, "epoch": 1743} {"train_loss": -23.072561264038086, "global_step": 144674, "epoch": 1743} {"train_loss": -23.1259708404541, "global_step": 144675, "epoch": 1743} {"train_loss": -22.41506004333496, "global_step": 144676, "epoch": 1743} {"train_loss": -22.803485870361328, "global_step": 144677, "epoch": 1743} {"train_loss": -22.476947784423828, "global_step": 144678, "epoch": 1743} {"train_loss": -22.86743927001953, "global_step": 144679, "epoch": 1743} {"train_loss": -22.361310958862305, "global_step": 144680, "epoch": 1743} {"train_loss": -22.795278549194336, "global_step": 144681, "epoch": 1743} {"train_loss": -22.92328453063965, "global_step": 144682, "epoch": 1743} {"train_loss": -22.93529510498047, "global_step": 144683, "epoch": 1743} {"train_loss": -22.721738815307617, "global_step": 144684, "epoch": 1743} {"train_loss": -23.216394424438477, "global_step": 144685, "epoch": 1743} {"train_loss": -23.091947555541992, "global_step": 144686, "epoch": 1743} {"train_loss": -22.984861373901367, "global_step": 144687, "epoch": 1743} {"train_loss": -22.8450927734375, "global_step": 144688, "epoch": 1743} {"train_loss": -22.90224266052246, "global_step": 144689, "epoch": 1743} {"train_loss": -22.662710189819336, "global_step": 144690, "epoch": 1743} {"train_loss": -23.214630126953125, "global_step": 144691, "epoch": 1743} {"train_loss": -23.21623992919922, "global_step": 144692, "epoch": 1743} {"train_loss": -23.080108642578125, "global_step": 144693, "epoch": 1743} {"train_loss": -22.8960018157959, "global_step": 144694, "epoch": 1743} {"train_loss": -22.975034713745117, "global_step": 144695, "epoch": 1743} {"train_loss": -22.950681686401367, "global_step": 144696, "epoch": 1743} {"train_loss": -23.0800838470459, "global_step": 144697, "epoch": 1743} {"train_loss": -23.03582763671875, "global_step": 144698, "epoch": 1743} {"train_loss": -23.361440658569336, "global_step": 144699, "epoch": 1743} {"train_loss": -23.164405822753906, "global_step": 144700, "epoch": 1743} {"train_loss": -23.45989990234375, "global_step": 144701, "epoch": 1743} {"train_loss": -23.335407257080078, "global_step": 144702, "epoch": 1743} {"train_loss": -22.854955673217773, "global_step": 144703, "epoch": 1743} {"train_loss": -23.217971801757812, "global_step": 144704, "epoch": 1743} {"train_loss": -23.20557975769043, "global_step": 144705, "epoch": 1743} {"train_loss": -23.0828800201416, "global_step": 144706, "epoch": 1743} {"train_loss": -23.20389747619629, "global_step": 144707, "epoch": 1743} {"train_loss": -23.35271644592285, "global_step": 144708, "epoch": 1743} {"train_loss": -23.17372703552246, "global_step": 144709, "epoch": 1743} {"train_loss": -23.138425827026367, "global_step": 144710, "epoch": 1743} {"train_loss": -23.30720329284668, "global_step": 144711, "epoch": 1743} {"train_loss": -23.56698989868164, "global_step": 144712, "epoch": 1743} {"train_loss": -23.47455406188965, "global_step": 144713, "epoch": 1743} {"train_loss": -23.173330307006836, "global_step": 144714, "epoch": 1743} {"train_loss": -23.054080963134766, "global_step": 144715, "epoch": 1743} {"train_loss": -23.000717163085938, "global_step": 144716, "epoch": 1743} {"train_loss": -23.4751033782959, "global_step": 144717, "epoch": 1743} {"train_loss": -23.081472396850586, "global_step": 144718, "epoch": 1743} {"train_loss": -23.353759765625, "global_step": 144719, "epoch": 1743} {"train_loss": -23.131784439086914, "global_step": 144720, "epoch": 1743} {"train_loss": -23.342222213745117, "global_step": 144721, "epoch": 1743} {"train_loss": -23.334728240966797, "global_step": 144722, "epoch": 1743} {"train_loss": -23.076698303222656, "global_step": 144723, "epoch": 1743} {"train_loss": -23.245168685913086, "global_step": 144724, "epoch": 1743} {"train_loss": -23.199665069580078, "global_step": 144725, "epoch": 1743} {"train_loss": -23.21788215637207, "global_step": 144726, "epoch": 1743} {"train_loss": -23.14461326599121, "global_step": 144727, "epoch": 1743} {"train_loss": -23.363588333129883, "global_step": 144728, "epoch": 1743} {"train_loss": -23.09814453125, "global_step": 144729, "epoch": 1743} {"train_loss": -23.027694702148438, "global_step": 144730, "epoch": 1743} {"train_loss": -23.221277236938477, "global_step": 144731, "epoch": 1743} {"train_loss": -23.020315170288086, "global_step": 144732, "epoch": 1743} {"train_loss": -23.16535758972168, "global_step": 144733, "epoch": 1743} {"train_loss": -22.993701934814453, "global_step": 144734, "epoch": 1743} {"train_loss": -23.4198055267334, "global_step": 144735, "epoch": 1743} {"train_loss": -23.22792625427246, "global_step": 144736, "epoch": 1743} {"train_loss": -22.86153221130371, "global_step": 144737, "epoch": 1743} {"train_loss": -23.21383285522461, "global_step": 144738, "epoch": 1743} {"train_loss": -23.000690460205078, "global_step": 144739, "epoch": 1743} {"train_loss": -23.203245162963867, "global_step": 144740, "epoch": 1743} {"train_loss": -23.095815658569336, "global_step": 144741, "epoch": 1743} {"train_loss": -23.134685516357422, "global_step": 144742, "epoch": 1743} {"train_loss": -23.10173988342285, "global_step": 144743, "epoch": 1743} {"train_loss": -23.10634994506836, "global_step": 144744, "epoch": 1743} {"train_loss": -23.266542434692383, "global_step": 144745, "epoch": 1743} {"train_loss": -23.212543487548828, "global_step": 144746, "epoch": 1743} {"train_loss": -23.583005905151367, "global_step": 144747, "epoch": 1743} {"train_loss": -23.150968551635742, "global_step": 144748, "epoch": 1743} {"train_loss": -23.006940841674805, "global_step": 144749, "epoch": 1743} {"train_loss": -23.140729904174805, "global_step": 144750, "epoch": 1743} {"train_loss": -23.0860526992614, "global_step": 144751, "epoch": 1743, "val_loss": 6362904.0} {"train_loss": -21.998092651367188, "global_step": 144752, "epoch": 1744} {"train_loss": -22.187713623046875, "global_step": 144753, "epoch": 1744} {"train_loss": -22.56498146057129, "global_step": 144754, "epoch": 1744} {"train_loss": -22.808481216430664, "global_step": 144755, "epoch": 1744} {"train_loss": -22.324359893798828, "global_step": 144756, "epoch": 1744} {"train_loss": -22.431650161743164, "global_step": 144757, "epoch": 1744} {"train_loss": -23.007776260375977, "global_step": 144758, "epoch": 1744} {"train_loss": -22.864721298217773, "global_step": 144759, "epoch": 1744} {"train_loss": -23.023134231567383, "global_step": 144760, "epoch": 1744} {"train_loss": -23.0155086517334, "global_step": 144761, "epoch": 1744} {"train_loss": -22.97421646118164, "global_step": 144762, "epoch": 1744} {"train_loss": -22.602949142456055, "global_step": 144763, "epoch": 1744} {"train_loss": -22.73586082458496, "global_step": 144764, "epoch": 1744} {"train_loss": -22.82522201538086, "global_step": 144765, "epoch": 1744} {"train_loss": -22.90817642211914, "global_step": 144766, "epoch": 1744} {"train_loss": -23.136789321899414, "global_step": 144767, "epoch": 1744} {"train_loss": -22.622234344482422, "global_step": 144768, "epoch": 1744} {"train_loss": -22.952661514282227, "global_step": 144769, "epoch": 1744} {"train_loss": -22.781152725219727, "global_step": 144770, "epoch": 1744} {"train_loss": -23.318862915039062, "global_step": 144771, "epoch": 1744} {"train_loss": -22.816679000854492, "global_step": 144772, "epoch": 1744} {"train_loss": -22.532814025878906, "global_step": 144773, "epoch": 1744} {"train_loss": -23.343137741088867, "global_step": 144774, "epoch": 1744} {"train_loss": -23.032926559448242, "global_step": 144775, "epoch": 1744} {"train_loss": -22.926952362060547, "global_step": 144776, "epoch": 1744} {"train_loss": -23.12769317626953, "global_step": 144777, "epoch": 1744} {"train_loss": -22.968965530395508, "global_step": 144778, "epoch": 1744} {"train_loss": -22.998178482055664, "global_step": 144779, "epoch": 1744} {"train_loss": -23.01627540588379, "global_step": 144780, "epoch": 1744} {"train_loss": -23.283300399780273, "global_step": 144781, "epoch": 1744} {"train_loss": -23.274324417114258, "global_step": 144782, "epoch": 1744} {"train_loss": -22.89299964904785, "global_step": 144783, "epoch": 1744} {"train_loss": -23.075925827026367, "global_step": 144784, "epoch": 1744} {"train_loss": -23.112592697143555, "global_step": 144785, "epoch": 1744} {"train_loss": -22.867002487182617, "global_step": 144786, "epoch": 1744} {"train_loss": -23.245330810546875, "global_step": 144787, "epoch": 1744} {"train_loss": -23.10501480102539, "global_step": 144788, "epoch": 1744} {"train_loss": -23.275585174560547, "global_step": 144789, "epoch": 1744} {"train_loss": -22.758708953857422, "global_step": 144790, "epoch": 1744} {"train_loss": -23.492450714111328, "global_step": 144791, "epoch": 1744} {"train_loss": -22.595096588134766, "global_step": 144792, "epoch": 1744} {"train_loss": -22.952247619628906, "global_step": 144793, "epoch": 1744} {"train_loss": -23.335752487182617, "global_step": 144794, "epoch": 1744} {"train_loss": -23.408985137939453, "global_step": 144795, "epoch": 1744} {"train_loss": -23.285797119140625, "global_step": 144796, "epoch": 1744} {"train_loss": -23.404752731323242, "global_step": 144797, "epoch": 1744} {"train_loss": -23.208221435546875, "global_step": 144798, "epoch": 1744} {"train_loss": -23.013254165649414, "global_step": 144799, "epoch": 1744} {"train_loss": -23.05496597290039, "global_step": 144800, "epoch": 1744} {"train_loss": -23.30391502380371, "global_step": 144801, "epoch": 1744} {"train_loss": -23.123523712158203, "global_step": 144802, "epoch": 1744} {"train_loss": -23.266942977905273, "global_step": 144803, "epoch": 1744} {"train_loss": -23.241073608398438, "global_step": 144804, "epoch": 1744} {"train_loss": -23.606367111206055, "global_step": 144805, "epoch": 1744} {"train_loss": -22.956777572631836, "global_step": 144806, "epoch": 1744} {"train_loss": -22.874351501464844, "global_step": 144807, "epoch": 1744} {"train_loss": -22.91128921508789, "global_step": 144808, "epoch": 1744} {"train_loss": -23.032682418823242, "global_step": 144809, "epoch": 1744} {"train_loss": -22.690414428710938, "global_step": 144810, "epoch": 1744} {"train_loss": -23.181211471557617, "global_step": 144811, "epoch": 1744} {"train_loss": -22.9759464263916, "global_step": 144812, "epoch": 1744} {"train_loss": -23.325170516967773, "global_step": 144813, "epoch": 1744} {"train_loss": -22.76782989501953, "global_step": 144814, "epoch": 1744} {"train_loss": -23.33797264099121, "global_step": 144815, "epoch": 1744} {"train_loss": -23.183822631835938, "global_step": 144816, "epoch": 1744} {"train_loss": -23.10221290588379, "global_step": 144817, "epoch": 1744} {"train_loss": -23.55997085571289, "global_step": 144818, "epoch": 1744} {"train_loss": -23.013275146484375, "global_step": 144819, "epoch": 1744} {"train_loss": -22.810623168945312, "global_step": 144820, "epoch": 1744} {"train_loss": -23.14381217956543, "global_step": 144821, "epoch": 1744} {"train_loss": -23.38826560974121, "global_step": 144822, "epoch": 1744} {"train_loss": -22.934289932250977, "global_step": 144823, "epoch": 1744} {"train_loss": -23.338565826416016, "global_step": 144824, "epoch": 1744} {"train_loss": -22.93562889099121, "global_step": 144825, "epoch": 1744} {"train_loss": -23.25980567932129, "global_step": 144826, "epoch": 1744} {"train_loss": -23.204206466674805, "global_step": 144827, "epoch": 1744} {"train_loss": -23.433368682861328, "global_step": 144828, "epoch": 1744} {"train_loss": -23.01984977722168, "global_step": 144829, "epoch": 1744} {"train_loss": -23.346628189086914, "global_step": 144830, "epoch": 1744} {"train_loss": -23.2130126953125, "global_step": 144831, "epoch": 1744} {"train_loss": -23.107925415039062, "global_step": 144832, "epoch": 1744} {"train_loss": -23.302824020385742, "global_step": 144833, "epoch": 1744} {"train_loss": -23.035168475415333, "global_step": 144834, "epoch": 1744, "val_loss": 6220385.0} {"train_loss": -22.296113967895508, "global_step": 144835, "epoch": 1745} {"train_loss": -23.080596923828125, "global_step": 144836, "epoch": 1745} {"train_loss": -22.741849899291992, "global_step": 144837, "epoch": 1745} {"train_loss": -22.746320724487305, "global_step": 144838, "epoch": 1745} {"train_loss": -23.170570373535156, "global_step": 144839, "epoch": 1745} {"train_loss": -22.859512329101562, "global_step": 144840, "epoch": 1745} {"train_loss": -22.267498016357422, "global_step": 144841, "epoch": 1745} {"train_loss": -22.643680572509766, "global_step": 144842, "epoch": 1745} {"train_loss": -22.435413360595703, "global_step": 144843, "epoch": 1745} {"train_loss": -22.794294357299805, "global_step": 144844, "epoch": 1745} {"train_loss": -22.416215896606445, "global_step": 144845, "epoch": 1745} {"train_loss": -22.797117233276367, "global_step": 144846, "epoch": 1745} {"train_loss": -22.55317497253418, "global_step": 144847, "epoch": 1745} {"train_loss": -22.766422271728516, "global_step": 144848, "epoch": 1745} {"train_loss": -22.454483032226562, "global_step": 144849, "epoch": 1745} {"train_loss": -22.927724838256836, "global_step": 144850, "epoch": 1745} {"train_loss": -22.80348014831543, "global_step": 144851, "epoch": 1745} {"train_loss": -22.927457809448242, "global_step": 144852, "epoch": 1745} {"train_loss": -22.73160743713379, "global_step": 144853, "epoch": 1745} {"train_loss": -23.178117752075195, "global_step": 144854, "epoch": 1745} {"train_loss": -22.638200759887695, "global_step": 144855, "epoch": 1745} {"train_loss": -22.888790130615234, "global_step": 144856, "epoch": 1745} {"train_loss": -23.023469924926758, "global_step": 144857, "epoch": 1745} {"train_loss": -22.945669174194336, "global_step": 144858, "epoch": 1745} {"train_loss": -23.055566787719727, "global_step": 144859, "epoch": 1745} {"train_loss": -22.952463150024414, "global_step": 144860, "epoch": 1745} {"train_loss": -22.892011642456055, "global_step": 144861, "epoch": 1745} {"train_loss": -22.837308883666992, "global_step": 144862, "epoch": 1745} {"train_loss": -23.044218063354492, "global_step": 144863, "epoch": 1745} {"train_loss": -22.99725341796875, "global_step": 144864, "epoch": 1745} {"train_loss": -22.95191764831543, "global_step": 144865, "epoch": 1745} {"train_loss": -22.784055709838867, "global_step": 144866, "epoch": 1745} {"train_loss": -23.224287033081055, "global_step": 144867, "epoch": 1745} {"train_loss": -23.092178344726562, "global_step": 144868, "epoch": 1745} {"train_loss": -22.86240005493164, "global_step": 144869, "epoch": 1745} {"train_loss": -23.036916732788086, "global_step": 144870, "epoch": 1745} {"train_loss": -23.100666046142578, "global_step": 144871, "epoch": 1745} {"train_loss": -22.778453826904297, "global_step": 144872, "epoch": 1745} {"train_loss": -23.53343391418457, "global_step": 144873, "epoch": 1745} {"train_loss": -22.936128616333008, "global_step": 144874, "epoch": 1745} {"train_loss": -23.13245964050293, "global_step": 144875, "epoch": 1745} {"train_loss": -22.86844825744629, "global_step": 144876, "epoch": 1745} {"train_loss": -22.82219886779785, "global_step": 144877, "epoch": 1745} {"train_loss": -23.18970489501953, "global_step": 144878, "epoch": 1745} {"train_loss": -23.099945068359375, "global_step": 144879, "epoch": 1745} {"train_loss": -23.08010482788086, "global_step": 144880, "epoch": 1745} {"train_loss": -23.142669677734375, "global_step": 144881, "epoch": 1745} {"train_loss": -23.31418228149414, "global_step": 144882, "epoch": 1745} {"train_loss": -23.235567092895508, "global_step": 144883, "epoch": 1745} {"train_loss": -22.669687271118164, "global_step": 144884, "epoch": 1745} {"train_loss": -23.430036544799805, "global_step": 144885, "epoch": 1745} {"train_loss": -23.207921981811523, "global_step": 144886, "epoch": 1745} {"train_loss": -23.157840728759766, "global_step": 144887, "epoch": 1745} {"train_loss": -23.401229858398438, "global_step": 144888, "epoch": 1745} {"train_loss": -23.038175582885742, "global_step": 144889, "epoch": 1745} {"train_loss": -23.490537643432617, "global_step": 144890, "epoch": 1745} {"train_loss": -23.21790885925293, "global_step": 144891, "epoch": 1745} {"train_loss": -23.4180908203125, "global_step": 144892, "epoch": 1745} {"train_loss": -23.722543716430664, "global_step": 144893, "epoch": 1745} {"train_loss": -23.13858413696289, "global_step": 144894, "epoch": 1745} {"train_loss": -23.364187240600586, "global_step": 144895, "epoch": 1745} {"train_loss": -22.81453514099121, "global_step": 144896, "epoch": 1745} {"train_loss": -23.497413635253906, "global_step": 144897, "epoch": 1745} {"train_loss": -23.45657730102539, "global_step": 144898, "epoch": 1745} {"train_loss": -23.251001358032227, "global_step": 144899, "epoch": 1745} {"train_loss": -23.179298400878906, "global_step": 144900, "epoch": 1745} {"train_loss": -23.461217880249023, "global_step": 144901, "epoch": 1745} {"train_loss": -23.271114349365234, "global_step": 144902, "epoch": 1745} {"train_loss": -22.91225242614746, "global_step": 144903, "epoch": 1745} {"train_loss": -23.084020614624023, "global_step": 144904, "epoch": 1745} {"train_loss": -23.482162475585938, "global_step": 144905, "epoch": 1745} {"train_loss": -22.879690170288086, "global_step": 144906, "epoch": 1745} {"train_loss": -22.80904197692871, "global_step": 144907, "epoch": 1745} {"train_loss": -23.143564224243164, "global_step": 144908, "epoch": 1745} {"train_loss": -22.699838638305664, "global_step": 144909, "epoch": 1745} {"train_loss": -23.307689666748047, "global_step": 144910, "epoch": 1745} {"train_loss": -23.09952735900879, "global_step": 144911, "epoch": 1745} {"train_loss": -23.260953903198242, "global_step": 144912, "epoch": 1745} {"train_loss": -22.759878158569336, "global_step": 144913, "epoch": 1745} {"train_loss": -23.1727237701416, "global_step": 144914, "epoch": 1745} {"train_loss": -23.186574935913086, "global_step": 144915, "epoch": 1745} {"train_loss": -23.234296798706055, "global_step": 144916, "epoch": 1745} {"train_loss": -23.026173924825276, "global_step": 144917, "epoch": 1745, "val_loss": 6312548.0} {"train_loss": -22.432348251342773, "global_step": 144918, "epoch": 1746} {"train_loss": -22.129566192626953, "global_step": 144919, "epoch": 1746} {"train_loss": -22.39266014099121, "global_step": 144920, "epoch": 1746} {"train_loss": -22.308561325073242, "global_step": 144921, "epoch": 1746} {"train_loss": -22.635574340820312, "global_step": 144922, "epoch": 1746} {"train_loss": -22.486417770385742, "global_step": 144923, "epoch": 1746} {"train_loss": -22.503679275512695, "global_step": 144924, "epoch": 1746} {"train_loss": -22.574604034423828, "global_step": 144925, "epoch": 1746} {"train_loss": -22.48993492126465, "global_step": 144926, "epoch": 1746} {"train_loss": -22.666671752929688, "global_step": 144927, "epoch": 1746} {"train_loss": -22.602447509765625, "global_step": 144928, "epoch": 1746} {"train_loss": -22.740779876708984, "global_step": 144929, "epoch": 1746} {"train_loss": -22.934864044189453, "global_step": 144930, "epoch": 1746} {"train_loss": -23.02901268005371, "global_step": 144931, "epoch": 1746} {"train_loss": -22.746562957763672, "global_step": 144932, "epoch": 1746} {"train_loss": -22.95747947692871, "global_step": 144933, "epoch": 1746} {"train_loss": -22.772430419921875, "global_step": 144934, "epoch": 1746} {"train_loss": -23.10120964050293, "global_step": 144935, "epoch": 1746} {"train_loss": -23.403030395507812, "global_step": 144936, "epoch": 1746} {"train_loss": -22.936674118041992, "global_step": 144937, "epoch": 1746} {"train_loss": -22.906869888305664, "global_step": 144938, "epoch": 1746} {"train_loss": -23.126005172729492, "global_step": 144939, "epoch": 1746} {"train_loss": -23.183103561401367, "global_step": 144940, "epoch": 1746} {"train_loss": -23.139942169189453, "global_step": 144941, "epoch": 1746} {"train_loss": -22.9925594329834, "global_step": 144942, "epoch": 1746} {"train_loss": -23.217147827148438, "global_step": 144943, "epoch": 1746} {"train_loss": -22.90997886657715, "global_step": 144944, "epoch": 1746} {"train_loss": -23.043725967407227, "global_step": 144945, "epoch": 1746} {"train_loss": -22.99740982055664, "global_step": 144946, "epoch": 1746} {"train_loss": -23.428110122680664, "global_step": 144947, "epoch": 1746} {"train_loss": -23.028398513793945, "global_step": 144948, "epoch": 1746} {"train_loss": -23.155948638916016, "global_step": 144949, "epoch": 1746} {"train_loss": -23.00382423400879, "global_step": 144950, "epoch": 1746} {"train_loss": -23.157264709472656, "global_step": 144951, "epoch": 1746} {"train_loss": -23.284360885620117, "global_step": 144952, "epoch": 1746} {"train_loss": -23.479476928710938, "global_step": 144953, "epoch": 1746} {"train_loss": -23.113813400268555, "global_step": 144954, "epoch": 1746} {"train_loss": -23.12386131286621, "global_step": 144955, "epoch": 1746} {"train_loss": -23.13024139404297, "global_step": 144956, "epoch": 1746} {"train_loss": -23.120161056518555, "global_step": 144957, "epoch": 1746} {"train_loss": -23.144851684570312, "global_step": 144958, "epoch": 1746} {"train_loss": -23.29452896118164, "global_step": 144959, "epoch": 1746} {"train_loss": -23.130619049072266, "global_step": 144960, "epoch": 1746} {"train_loss": -23.232589721679688, "global_step": 144961, "epoch": 1746} {"train_loss": -23.26227378845215, "global_step": 144962, "epoch": 1746} {"train_loss": -23.161827087402344, "global_step": 144963, "epoch": 1746} {"train_loss": -23.166547775268555, "global_step": 144964, "epoch": 1746} {"train_loss": -23.093469619750977, "global_step": 144965, "epoch": 1746} {"train_loss": -23.415327072143555, "global_step": 144966, "epoch": 1746} {"train_loss": -23.21248435974121, "global_step": 144967, "epoch": 1746} {"train_loss": -23.4303035736084, "global_step": 144968, "epoch": 1746} {"train_loss": -23.19334602355957, "global_step": 144969, "epoch": 1746} {"train_loss": -23.371337890625, "global_step": 144970, "epoch": 1746} {"train_loss": -23.16515350341797, "global_step": 144971, "epoch": 1746} {"train_loss": -22.928634643554688, "global_step": 144972, "epoch": 1746} {"train_loss": -23.033796310424805, "global_step": 144973, "epoch": 1746} {"train_loss": -23.330974578857422, "global_step": 144974, "epoch": 1746} {"train_loss": -23.170583724975586, "global_step": 144975, "epoch": 1746} {"train_loss": -23.305530548095703, "global_step": 144976, "epoch": 1746} {"train_loss": -23.02198600769043, "global_step": 144977, "epoch": 1746} {"train_loss": -23.129907608032227, "global_step": 144978, "epoch": 1746} {"train_loss": -23.225269317626953, "global_step": 144979, "epoch": 1746} {"train_loss": -22.898244857788086, "global_step": 144980, "epoch": 1746} {"train_loss": -23.16999626159668, "global_step": 144981, "epoch": 1746} {"train_loss": -23.26273536682129, "global_step": 144982, "epoch": 1746} {"train_loss": -23.347227096557617, "global_step": 144983, "epoch": 1746} {"train_loss": -23.48806381225586, "global_step": 144984, "epoch": 1746} {"train_loss": -23.423364639282227, "global_step": 144985, "epoch": 1746} {"train_loss": -22.95060157775879, "global_step": 144986, "epoch": 1746} {"train_loss": -23.181652069091797, "global_step": 144987, "epoch": 1746} {"train_loss": -23.424808502197266, "global_step": 144988, "epoch": 1746} {"train_loss": -22.92088508605957, "global_step": 144989, "epoch": 1746} {"train_loss": -22.930606842041016, "global_step": 144990, "epoch": 1746} {"train_loss": -22.882036209106445, "global_step": 144991, "epoch": 1746} {"train_loss": -23.392471313476562, "global_step": 144992, "epoch": 1746} {"train_loss": -23.41370964050293, "global_step": 144993, "epoch": 1746} {"train_loss": -23.121381759643555, "global_step": 144994, "epoch": 1746} {"train_loss": -23.07839012145996, "global_step": 144995, "epoch": 1746} {"train_loss": -23.030282974243164, "global_step": 144996, "epoch": 1746} {"train_loss": -23.305601119995117, "global_step": 144997, "epoch": 1746} {"train_loss": -22.946857452392578, "global_step": 144998, "epoch": 1746} {"train_loss": -23.15257453918457, "global_step": 144999, "epoch": 1746} {"train_loss": -23.043446322521532, "global_step": 145000, "epoch": 1746, "val_loss": 6375636.0} {"train_loss": -22.77605628967285, "global_step": 145001, "epoch": 1747} {"train_loss": -22.726057052612305, "global_step": 145002, "epoch": 1747} {"train_loss": -23.27640151977539, "global_step": 145003, "epoch": 1747} {"train_loss": -22.6378116607666, "global_step": 145004, "epoch": 1747} {"train_loss": -22.660062789916992, "global_step": 145005, "epoch": 1747} {"train_loss": -22.32539939880371, "global_step": 145006, "epoch": 1747} {"train_loss": -22.83698844909668, "global_step": 145007, "epoch": 1747} {"train_loss": -22.651992797851562, "global_step": 145008, "epoch": 1747} {"train_loss": -23.257150650024414, "global_step": 145009, "epoch": 1747} {"train_loss": -22.65681266784668, "global_step": 145010, "epoch": 1747} {"train_loss": -22.932676315307617, "global_step": 145011, "epoch": 1747} {"train_loss": -23.167747497558594, "global_step": 145012, "epoch": 1747} {"train_loss": -22.676549911499023, "global_step": 145013, "epoch": 1747} {"train_loss": -22.937829971313477, "global_step": 145014, "epoch": 1747} {"train_loss": -22.744924545288086, "global_step": 145015, "epoch": 1747} {"train_loss": -23.35084342956543, "global_step": 145016, "epoch": 1747} {"train_loss": -23.401533126831055, "global_step": 145017, "epoch": 1747} {"train_loss": -23.21712303161621, "global_step": 145018, "epoch": 1747} {"train_loss": -22.983413696289062, "global_step": 145019, "epoch": 1747} {"train_loss": -22.910436630249023, "global_step": 145020, "epoch": 1747} {"train_loss": -23.45745086669922, "global_step": 145021, "epoch": 1747} {"train_loss": -22.90708351135254, "global_step": 145022, "epoch": 1747} {"train_loss": -23.484867095947266, "global_step": 145023, "epoch": 1747} {"train_loss": -23.06072425842285, "global_step": 145024, "epoch": 1747} {"train_loss": -23.3160457611084, "global_step": 145025, "epoch": 1747} {"train_loss": -23.252670288085938, "global_step": 145026, "epoch": 1747} {"train_loss": -23.08258628845215, "global_step": 145027, "epoch": 1747} {"train_loss": -23.257701873779297, "global_step": 145028, "epoch": 1747} {"train_loss": -23.440349578857422, "global_step": 145029, "epoch": 1747} {"train_loss": -22.891586303710938, "global_step": 145030, "epoch": 1747} {"train_loss": -23.52928352355957, "global_step": 145031, "epoch": 1747} {"train_loss": -23.170209884643555, "global_step": 145032, "epoch": 1747} {"train_loss": -23.2197265625, "global_step": 145033, "epoch": 1747} {"train_loss": -22.872079849243164, "global_step": 145034, "epoch": 1747} {"train_loss": -23.260007858276367, "global_step": 145035, "epoch": 1747} {"train_loss": -23.322153091430664, "global_step": 145036, "epoch": 1747} {"train_loss": -23.50077247619629, "global_step": 145037, "epoch": 1747} {"train_loss": -23.071767807006836, "global_step": 145038, "epoch": 1747} {"train_loss": -23.34236717224121, "global_step": 145039, "epoch": 1747} {"train_loss": -23.447402954101562, "global_step": 145040, "epoch": 1747} {"train_loss": -23.63949966430664, "global_step": 145041, "epoch": 1747} {"train_loss": -22.91322898864746, "global_step": 145042, "epoch": 1747} {"train_loss": -22.749013900756836, "global_step": 145043, "epoch": 1747} {"train_loss": -22.49751091003418, "global_step": 145044, "epoch": 1747} {"train_loss": -22.615598678588867, "global_step": 145045, "epoch": 1747} {"train_loss": -22.826690673828125, "global_step": 145046, "epoch": 1747} {"train_loss": -22.77203941345215, "global_step": 145047, "epoch": 1747} {"train_loss": -22.94166374206543, "global_step": 145048, "epoch": 1747} {"train_loss": -22.98823356628418, "global_step": 145049, "epoch": 1747} {"train_loss": -23.157623291015625, "global_step": 145050, "epoch": 1747} {"train_loss": -22.50120735168457, "global_step": 145051, "epoch": 1747} {"train_loss": -22.909740447998047, "global_step": 145052, "epoch": 1747} {"train_loss": -22.754518508911133, "global_step": 145053, "epoch": 1747} {"train_loss": -23.099273681640625, "global_step": 145054, "epoch": 1747} {"train_loss": -23.030601501464844, "global_step": 145055, "epoch": 1747} {"train_loss": -22.857946395874023, "global_step": 145056, "epoch": 1747} {"train_loss": -23.058664321899414, "global_step": 145057, "epoch": 1747} {"train_loss": -22.92852210998535, "global_step": 145058, "epoch": 1747} {"train_loss": -23.25735855102539, "global_step": 145059, "epoch": 1747} {"train_loss": -23.295440673828125, "global_step": 145060, "epoch": 1747} {"train_loss": -23.373830795288086, "global_step": 145061, "epoch": 1747} {"train_loss": -22.86727523803711, "global_step": 145062, "epoch": 1747} {"train_loss": -22.95834732055664, "global_step": 145063, "epoch": 1747} {"train_loss": -23.302148818969727, "global_step": 145064, "epoch": 1747} {"train_loss": -23.351713180541992, "global_step": 145065, "epoch": 1747} {"train_loss": -23.0698184967041, "global_step": 145066, "epoch": 1747} {"train_loss": -23.192880630493164, "global_step": 145067, "epoch": 1747} {"train_loss": -23.02620506286621, "global_step": 145068, "epoch": 1747} {"train_loss": -23.3761043548584, "global_step": 145069, "epoch": 1747} {"train_loss": -23.376440048217773, "global_step": 145070, "epoch": 1747} {"train_loss": -23.228559494018555, "global_step": 145071, "epoch": 1747} {"train_loss": -22.9002742767334, "global_step": 145072, "epoch": 1747} {"train_loss": -23.49317741394043, "global_step": 145073, "epoch": 1747} {"train_loss": -23.49247169494629, "global_step": 145074, "epoch": 1747} {"train_loss": -23.312410354614258, "global_step": 145075, "epoch": 1747} {"train_loss": -23.349462509155273, "global_step": 145076, "epoch": 1747} {"train_loss": -23.40591812133789, "global_step": 145077, "epoch": 1747} {"train_loss": -23.07513999938965, "global_step": 145078, "epoch": 1747} {"train_loss": -23.489999771118164, "global_step": 145079, "epoch": 1747} {"train_loss": -22.998546600341797, "global_step": 145080, "epoch": 1747} {"train_loss": -23.32271385192871, "global_step": 145081, "epoch": 1747} {"train_loss": -23.256484985351562, "global_step": 145082, "epoch": 1747} {"train_loss": -23.08363294026938, "global_step": 145083, "epoch": 1747, "val_loss": 6304584.0} {"train_loss": -22.518810272216797, "global_step": 145084, "epoch": 1748} {"train_loss": -22.60420036315918, "global_step": 145085, "epoch": 1748} {"train_loss": -22.57094383239746, "global_step": 145086, "epoch": 1748} {"train_loss": -22.369483947753906, "global_step": 145087, "epoch": 1748} {"train_loss": -21.873836517333984, "global_step": 145088, "epoch": 1748} {"train_loss": -22.59590721130371, "global_step": 145089, "epoch": 1748} {"train_loss": -22.312219619750977, "global_step": 145090, "epoch": 1748} {"train_loss": -22.57253074645996, "global_step": 145091, "epoch": 1748} {"train_loss": -22.408987045288086, "global_step": 145092, "epoch": 1748} {"train_loss": -22.208505630493164, "global_step": 145093, "epoch": 1748} {"train_loss": -23.124021530151367, "global_step": 145094, "epoch": 1748} {"train_loss": -22.45728874206543, "global_step": 145095, "epoch": 1748} {"train_loss": -22.55385398864746, "global_step": 145096, "epoch": 1748} {"train_loss": -22.6805477142334, "global_step": 145097, "epoch": 1748} {"train_loss": -22.823041915893555, "global_step": 145098, "epoch": 1748} {"train_loss": -22.554250717163086, "global_step": 145099, "epoch": 1748} {"train_loss": -22.728679656982422, "global_step": 145100, "epoch": 1748} {"train_loss": -22.672903060913086, "global_step": 145101, "epoch": 1748} {"train_loss": -22.875442504882812, "global_step": 145102, "epoch": 1748} {"train_loss": -22.542455673217773, "global_step": 145103, "epoch": 1748} {"train_loss": -23.076101303100586, "global_step": 145104, "epoch": 1748} {"train_loss": -22.679950714111328, "global_step": 145105, "epoch": 1748} {"train_loss": -23.157808303833008, "global_step": 145106, "epoch": 1748} {"train_loss": -22.48371696472168, "global_step": 145107, "epoch": 1748} {"train_loss": -22.968984603881836, "global_step": 145108, "epoch": 1748} {"train_loss": -22.990076065063477, "global_step": 145109, "epoch": 1748} {"train_loss": -22.747587203979492, "global_step": 145110, "epoch": 1748} {"train_loss": -22.96162986755371, "global_step": 145111, "epoch": 1748} {"train_loss": -23.3469295501709, "global_step": 145112, "epoch": 1748} {"train_loss": -22.98667335510254, "global_step": 145113, "epoch": 1748} {"train_loss": -23.13730239868164, "global_step": 145114, "epoch": 1748} {"train_loss": -23.0557918548584, "global_step": 145115, "epoch": 1748} {"train_loss": -23.0935115814209, "global_step": 145116, "epoch": 1748} {"train_loss": -23.147077560424805, "global_step": 145117, "epoch": 1748} {"train_loss": -23.30190658569336, "global_step": 145118, "epoch": 1748} {"train_loss": -23.025150299072266, "global_step": 145119, "epoch": 1748} {"train_loss": -23.04872703552246, "global_step": 145120, "epoch": 1748} {"train_loss": -23.212682723999023, "global_step": 145121, "epoch": 1748} {"train_loss": -23.139102935791016, "global_step": 145122, "epoch": 1748} {"train_loss": -23.306564331054688, "global_step": 145123, "epoch": 1748} {"train_loss": -23.235509872436523, "global_step": 145124, "epoch": 1748} {"train_loss": -23.133342742919922, "global_step": 145125, "epoch": 1748} {"train_loss": -23.655017852783203, "global_step": 145126, "epoch": 1748} {"train_loss": -23.01602554321289, "global_step": 145127, "epoch": 1748} {"train_loss": -23.34926414489746, "global_step": 145128, "epoch": 1748} {"train_loss": -23.58338737487793, "global_step": 145129, "epoch": 1748} {"train_loss": -23.107664108276367, "global_step": 145130, "epoch": 1748} {"train_loss": -22.86126136779785, "global_step": 145131, "epoch": 1748} {"train_loss": -22.695449829101562, "global_step": 145132, "epoch": 1748} {"train_loss": -22.948789596557617, "global_step": 145133, "epoch": 1748} {"train_loss": -22.82152557373047, "global_step": 145134, "epoch": 1748} {"train_loss": -23.10700035095215, "global_step": 145135, "epoch": 1748} {"train_loss": -22.971128463745117, "global_step": 145136, "epoch": 1748} {"train_loss": -23.456022262573242, "global_step": 145137, "epoch": 1748} {"train_loss": -22.780893325805664, "global_step": 145138, "epoch": 1748} {"train_loss": -22.6306095123291, "global_step": 145139, "epoch": 1748} {"train_loss": -23.135150909423828, "global_step": 145140, "epoch": 1748} {"train_loss": -22.843181610107422, "global_step": 145141, "epoch": 1748} {"train_loss": -22.908056259155273, "global_step": 145142, "epoch": 1748} {"train_loss": -23.117782592773438, "global_step": 145143, "epoch": 1748} {"train_loss": -22.776044845581055, "global_step": 145144, "epoch": 1748} {"train_loss": -23.263099670410156, "global_step": 145145, "epoch": 1748} {"train_loss": -23.105985641479492, "global_step": 145146, "epoch": 1748} {"train_loss": -23.46912956237793, "global_step": 145147, "epoch": 1748} {"train_loss": -23.188434600830078, "global_step": 145148, "epoch": 1748} {"train_loss": -23.299076080322266, "global_step": 145149, "epoch": 1748} {"train_loss": -23.117197036743164, "global_step": 145150, "epoch": 1748} {"train_loss": -23.68912124633789, "global_step": 145151, "epoch": 1748} {"train_loss": -23.08902931213379, "global_step": 145152, "epoch": 1748} {"train_loss": -22.91242027282715, "global_step": 145153, "epoch": 1748} {"train_loss": -23.259387969970703, "global_step": 145154, "epoch": 1748} {"train_loss": -23.069652557373047, "global_step": 145155, "epoch": 1748} {"train_loss": -22.64644432067871, "global_step": 145156, "epoch": 1748} {"train_loss": -23.431106567382812, "global_step": 145157, "epoch": 1748} {"train_loss": -23.265623092651367, "global_step": 145158, "epoch": 1748} {"train_loss": -23.215734481811523, "global_step": 145159, "epoch": 1748} {"train_loss": -22.890913009643555, "global_step": 145160, "epoch": 1748} {"train_loss": -23.23005485534668, "global_step": 145161, "epoch": 1748} {"train_loss": -23.344085693359375, "global_step": 145162, "epoch": 1748} {"train_loss": -23.223899841308594, "global_step": 145163, "epoch": 1748} {"train_loss": -23.408512115478516, "global_step": 145164, "epoch": 1748} {"train_loss": -22.86024284362793, "global_step": 145165, "epoch": 1748} {"train_loss": -22.97942623460149, "global_step": 145166, "epoch": 1748, "val_loss": 6389433.5} {"train_loss": -22.944028854370117, "global_step": 145167, "epoch": 1749} {"train_loss": -22.887624740600586, "global_step": 145168, "epoch": 1749} {"train_loss": -22.74432945251465, "global_step": 145169, "epoch": 1749} {"train_loss": -22.63321304321289, "global_step": 145170, "epoch": 1749} {"train_loss": -22.66875648498535, "global_step": 145171, "epoch": 1749} {"train_loss": -22.828033447265625, "global_step": 145172, "epoch": 1749} {"train_loss": -23.132766723632812, "global_step": 145173, "epoch": 1749} {"train_loss": -22.95403480529785, "global_step": 145174, "epoch": 1749} {"train_loss": -22.895580291748047, "global_step": 145175, "epoch": 1749} {"train_loss": -23.21857261657715, "global_step": 145176, "epoch": 1749} {"train_loss": -22.834625244140625, "global_step": 145177, "epoch": 1749} {"train_loss": -22.725187301635742, "global_step": 145178, "epoch": 1749} {"train_loss": -22.811145782470703, "global_step": 145179, "epoch": 1749} {"train_loss": -22.966297149658203, "global_step": 145180, "epoch": 1749} {"train_loss": -23.103031158447266, "global_step": 145181, "epoch": 1749} {"train_loss": -23.157169342041016, "global_step": 145182, "epoch": 1749} {"train_loss": -22.57906150817871, "global_step": 145183, "epoch": 1749} {"train_loss": -22.77951431274414, "global_step": 145184, "epoch": 1749} {"train_loss": -22.895090103149414, "global_step": 145185, "epoch": 1749} {"train_loss": -22.792341232299805, "global_step": 145186, "epoch": 1749} {"train_loss": -23.23321533203125, "global_step": 145187, "epoch": 1749} {"train_loss": -23.0382022857666, "global_step": 145188, "epoch": 1749} {"train_loss": -23.022541046142578, "global_step": 145189, "epoch": 1749} {"train_loss": -22.8448543548584, "global_step": 145190, "epoch": 1749} {"train_loss": -23.619333267211914, "global_step": 145191, "epoch": 1749} {"train_loss": -22.77174949645996, "global_step": 145192, "epoch": 1749} {"train_loss": -22.8204288482666, "global_step": 145193, "epoch": 1749} {"train_loss": -23.517833709716797, "global_step": 145194, "epoch": 1749} {"train_loss": -23.368864059448242, "global_step": 145195, "epoch": 1749} {"train_loss": -23.14385986328125, "global_step": 145196, "epoch": 1749} {"train_loss": -23.124881744384766, "global_step": 145197, "epoch": 1749} {"train_loss": -23.270112991333008, "global_step": 145198, "epoch": 1749} {"train_loss": -23.334716796875, "global_step": 145199, "epoch": 1749} {"train_loss": -23.165302276611328, "global_step": 145200, "epoch": 1749} {"train_loss": -22.833595275878906, "global_step": 145201, "epoch": 1749} {"train_loss": -23.2752628326416, "global_step": 145202, "epoch": 1749} {"train_loss": -23.39291763305664, "global_step": 145203, "epoch": 1749} {"train_loss": -23.174762725830078, "global_step": 145204, "epoch": 1749} {"train_loss": -23.174711227416992, "global_step": 145205, "epoch": 1749} {"train_loss": -22.95726203918457, "global_step": 145206, "epoch": 1749} {"train_loss": -22.878332138061523, "global_step": 145207, "epoch": 1749} {"train_loss": -23.140249252319336, "global_step": 145208, "epoch": 1749} {"train_loss": -23.340436935424805, "global_step": 145209, "epoch": 1749} {"train_loss": -23.353227615356445, "global_step": 145210, "epoch": 1749} {"train_loss": -22.95407485961914, "global_step": 145211, "epoch": 1749} {"train_loss": -23.2172908782959, "global_step": 145212, "epoch": 1749} {"train_loss": -23.795185089111328, "global_step": 145213, "epoch": 1749} {"train_loss": -23.09975814819336, "global_step": 145214, "epoch": 1749} {"train_loss": -23.34954261779785, "global_step": 145215, "epoch": 1749} {"train_loss": -23.43577003479004, "global_step": 145216, "epoch": 1749} {"train_loss": -23.278654098510742, "global_step": 145217, "epoch": 1749} {"train_loss": -23.01449203491211, "global_step": 145218, "epoch": 1749} {"train_loss": -23.147520065307617, "global_step": 145219, "epoch": 1749} {"train_loss": -23.65145492553711, "global_step": 145220, "epoch": 1749} {"train_loss": -23.246204376220703, "global_step": 145221, "epoch": 1749} {"train_loss": -23.30034828186035, "global_step": 145222, "epoch": 1749} {"train_loss": -23.393075942993164, "global_step": 145223, "epoch": 1749} {"train_loss": -23.218891143798828, "global_step": 145224, "epoch": 1749} {"train_loss": -23.224206924438477, "global_step": 145225, "epoch": 1749} {"train_loss": -23.318653106689453, "global_step": 145226, "epoch": 1749} {"train_loss": -23.17668914794922, "global_step": 145227, "epoch": 1749} {"train_loss": -23.578994750976562, "global_step": 145228, "epoch": 1749} {"train_loss": -23.36568260192871, "global_step": 145229, "epoch": 1749} {"train_loss": -23.024457931518555, "global_step": 145230, "epoch": 1749} {"train_loss": -23.550643920898438, "global_step": 145231, "epoch": 1749} {"train_loss": -23.329273223876953, "global_step": 145232, "epoch": 1749} {"train_loss": -23.099803924560547, "global_step": 145233, "epoch": 1749} {"train_loss": -23.330629348754883, "global_step": 145234, "epoch": 1749} {"train_loss": -23.1721134185791, "global_step": 145235, "epoch": 1749} {"train_loss": -23.014860153198242, "global_step": 145236, "epoch": 1749} {"train_loss": -23.20406150817871, "global_step": 145237, "epoch": 1749} {"train_loss": -23.21708106994629, "global_step": 145238, "epoch": 1749} {"train_loss": -22.94007682800293, "global_step": 145239, "epoch": 1749} {"train_loss": -23.239822387695312, "global_step": 145240, "epoch": 1749} {"train_loss": -23.218830108642578, "global_step": 145241, "epoch": 1749} {"train_loss": -22.858409881591797, "global_step": 145242, "epoch": 1749} {"train_loss": -23.544546127319336, "global_step": 145243, "epoch": 1749} {"train_loss": -23.52123260498047, "global_step": 145244, "epoch": 1749} {"train_loss": -23.105688095092773, "global_step": 145245, "epoch": 1749} {"train_loss": -23.23570442199707, "global_step": 145246, "epoch": 1749} {"train_loss": -23.239145278930664, "global_step": 145247, "epoch": 1749} {"train_loss": -23.363866806030273, "global_step": 145248, "epoch": 1749} {"train_loss": -23.148967880800544, "global_step": 145249, "epoch": 1749, "val_loss": 6348551.0} {"train_loss": -22.637842178344727, "global_step": 145250, "epoch": 1750} {"train_loss": -22.56398582458496, "global_step": 145251, "epoch": 1750} {"train_loss": -22.895177841186523, "global_step": 145252, "epoch": 1750} {"train_loss": -22.719268798828125, "global_step": 145253, "epoch": 1750} {"train_loss": -22.895641326904297, "global_step": 145254, "epoch": 1750} {"train_loss": -23.240009307861328, "global_step": 145255, "epoch": 1750} {"train_loss": -23.219501495361328, "global_step": 145256, "epoch": 1750} {"train_loss": -22.54086685180664, "global_step": 145257, "epoch": 1750} {"train_loss": -22.85263442993164, "global_step": 145258, "epoch": 1750} {"train_loss": -22.681594848632812, "global_step": 145259, "epoch": 1750} {"train_loss": -22.840909957885742, "global_step": 145260, "epoch": 1750} {"train_loss": -22.831342697143555, "global_step": 145261, "epoch": 1750} {"train_loss": -23.024490356445312, "global_step": 145262, "epoch": 1750} {"train_loss": -23.010107040405273, "global_step": 145263, "epoch": 1750} {"train_loss": -23.003070831298828, "global_step": 145264, "epoch": 1750} {"train_loss": -22.75918960571289, "global_step": 145265, "epoch": 1750} {"train_loss": -23.10150146484375, "global_step": 145266, "epoch": 1750} {"train_loss": -23.168432235717773, "global_step": 145267, "epoch": 1750} {"train_loss": -22.852569580078125, "global_step": 145268, "epoch": 1750} {"train_loss": -23.101518630981445, "global_step": 145269, "epoch": 1750} {"train_loss": -23.244951248168945, "global_step": 145270, "epoch": 1750} {"train_loss": -23.094755172729492, "global_step": 145271, "epoch": 1750} {"train_loss": -23.10641860961914, "global_step": 145272, "epoch": 1750} {"train_loss": -23.280492782592773, "global_step": 145273, "epoch": 1750} {"train_loss": -22.86577796936035, "global_step": 145274, "epoch": 1750} {"train_loss": -23.06949234008789, "global_step": 145275, "epoch": 1750} {"train_loss": -23.316349029541016, "global_step": 145276, "epoch": 1750} {"train_loss": -23.2512149810791, "global_step": 145277, "epoch": 1750} {"train_loss": -23.015289306640625, "global_step": 145278, "epoch": 1750} {"train_loss": -23.1505126953125, "global_step": 145279, "epoch": 1750} {"train_loss": -22.92331886291504, "global_step": 145280, "epoch": 1750} {"train_loss": -23.235538482666016, "global_step": 145281, "epoch": 1750} {"train_loss": -23.24629783630371, "global_step": 145282, "epoch": 1750} {"train_loss": -22.972396850585938, "global_step": 145283, "epoch": 1750} {"train_loss": -22.998838424682617, "global_step": 145284, "epoch": 1750} {"train_loss": -23.11921501159668, "global_step": 145285, "epoch": 1750} {"train_loss": -23.09406089782715, "global_step": 145286, "epoch": 1750} {"train_loss": -23.220653533935547, "global_step": 145287, "epoch": 1750} {"train_loss": -23.239452362060547, "global_step": 145288, "epoch": 1750} {"train_loss": -23.122900009155273, "global_step": 145289, "epoch": 1750} {"train_loss": -23.13741683959961, "global_step": 145290, "epoch": 1750} {"train_loss": -22.55659294128418, "global_step": 145291, "epoch": 1750} {"train_loss": -23.29583740234375, "global_step": 145292, "epoch": 1750} {"train_loss": -23.19489097595215, "global_step": 145293, "epoch": 1750} {"train_loss": -23.240360260009766, "global_step": 145294, "epoch": 1750} {"train_loss": -23.205411911010742, "global_step": 145295, "epoch": 1750} {"train_loss": -23.264480590820312, "global_step": 145296, "epoch": 1750} {"train_loss": -22.966638565063477, "global_step": 145297, "epoch": 1750} {"train_loss": -22.8958797454834, "global_step": 145298, "epoch": 1750} {"train_loss": -22.790266036987305, "global_step": 145299, "epoch": 1750} {"train_loss": -22.677371978759766, "global_step": 145300, "epoch": 1750} {"train_loss": -22.993627548217773, "global_step": 145301, "epoch": 1750} {"train_loss": -23.18716812133789, "global_step": 145302, "epoch": 1750} {"train_loss": -22.937633514404297, "global_step": 145303, "epoch": 1750} {"train_loss": -23.35344696044922, "global_step": 145304, "epoch": 1750} {"train_loss": -23.08839988708496, "global_step": 145305, "epoch": 1750} {"train_loss": -23.312101364135742, "global_step": 145306, "epoch": 1750} {"train_loss": -23.433462142944336, "global_step": 145307, "epoch": 1750} {"train_loss": -22.763025283813477, "global_step": 145308, "epoch": 1750} {"train_loss": -23.60732650756836, "global_step": 145309, "epoch": 1750} {"train_loss": -23.059431076049805, "global_step": 145310, "epoch": 1750} {"train_loss": -23.266660690307617, "global_step": 145311, "epoch": 1750} {"train_loss": -23.2258243560791, "global_step": 145312, "epoch": 1750} {"train_loss": -23.414335250854492, "global_step": 145313, "epoch": 1750} {"train_loss": -22.98672866821289, "global_step": 145314, "epoch": 1750} {"train_loss": -23.122190475463867, "global_step": 145315, "epoch": 1750} {"train_loss": -22.993932723999023, "global_step": 145316, "epoch": 1750} {"train_loss": -23.450876235961914, "global_step": 145317, "epoch": 1750} {"train_loss": -22.9099063873291, "global_step": 145318, "epoch": 1750} {"train_loss": -22.840280532836914, "global_step": 145319, "epoch": 1750} {"train_loss": -23.19821548461914, "global_step": 145320, "epoch": 1750} {"train_loss": -23.24849510192871, "global_step": 145321, "epoch": 1750} {"train_loss": -23.1385440826416, "global_step": 145322, "epoch": 1750} {"train_loss": -22.894733428955078, "global_step": 145323, "epoch": 1750} {"train_loss": -23.14054298400879, "global_step": 145324, "epoch": 1750} {"train_loss": -23.361114501953125, "global_step": 145325, "epoch": 1750} {"train_loss": -23.31521987915039, "global_step": 145326, "epoch": 1750} {"train_loss": -23.423383712768555, "global_step": 145327, "epoch": 1750} {"train_loss": -23.1049861907959, "global_step": 145328, "epoch": 1750} {"train_loss": -22.899465560913086, "global_step": 145329, "epoch": 1750} {"train_loss": -22.45685577392578, "global_step": 145330, "epoch": 1750} {"train_loss": -22.96089744567871, "global_step": 145331, "epoch": 1750} {"train_loss": -23.05502528454884, "global_step": 145332, "epoch": 1750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6461417.0} {"train_loss": -22.676860809326172, "global_step": 145333, "epoch": 1751} {"train_loss": -22.33253288269043, "global_step": 145334, "epoch": 1751} {"train_loss": -22.61955451965332, "global_step": 145335, "epoch": 1751} {"train_loss": -22.83664894104004, "global_step": 145336, "epoch": 1751} {"train_loss": -22.53658103942871, "global_step": 145337, "epoch": 1751} {"train_loss": -22.893884658813477, "global_step": 145338, "epoch": 1751} {"train_loss": -22.974069595336914, "global_step": 145339, "epoch": 1751} {"train_loss": -22.503007888793945, "global_step": 145340, "epoch": 1751} {"train_loss": -22.823179244995117, "global_step": 145341, "epoch": 1751} {"train_loss": -22.74849510192871, "global_step": 145342, "epoch": 1751} {"train_loss": -22.793350219726562, "global_step": 145343, "epoch": 1751} {"train_loss": -23.160879135131836, "global_step": 145344, "epoch": 1751} {"train_loss": -22.756175994873047, "global_step": 145345, "epoch": 1751} {"train_loss": -22.883108139038086, "global_step": 145346, "epoch": 1751} {"train_loss": -23.075788497924805, "global_step": 145347, "epoch": 1751} {"train_loss": -22.812349319458008, "global_step": 145348, "epoch": 1751} {"train_loss": -22.9331111907959, "global_step": 145349, "epoch": 1751} {"train_loss": -23.319433212280273, "global_step": 145350, "epoch": 1751} {"train_loss": -22.999738693237305, "global_step": 145351, "epoch": 1751} {"train_loss": -22.968957901000977, "global_step": 145352, "epoch": 1751} {"train_loss": -22.76978874206543, "global_step": 145353, "epoch": 1751} {"train_loss": -23.000032424926758, "global_step": 145354, "epoch": 1751} {"train_loss": -23.290176391601562, "global_step": 145355, "epoch": 1751} {"train_loss": -23.085453033447266, "global_step": 145356, "epoch": 1751} {"train_loss": -22.806625366210938, "global_step": 145357, "epoch": 1751} {"train_loss": -23.44684600830078, "global_step": 145358, "epoch": 1751} {"train_loss": -23.0428466796875, "global_step": 145359, "epoch": 1751} {"train_loss": -23.300809860229492, "global_step": 145360, "epoch": 1751} {"train_loss": -23.08519744873047, "global_step": 145361, "epoch": 1751} {"train_loss": -23.181304931640625, "global_step": 145362, "epoch": 1751} {"train_loss": -22.902719497680664, "global_step": 145363, "epoch": 1751} {"train_loss": -23.507665634155273, "global_step": 145364, "epoch": 1751} {"train_loss": -23.340593338012695, "global_step": 145365, "epoch": 1751} {"train_loss": -23.358652114868164, "global_step": 145366, "epoch": 1751} {"train_loss": -23.36875343322754, "global_step": 145367, "epoch": 1751} {"train_loss": -23.011829376220703, "global_step": 145368, "epoch": 1751} {"train_loss": -23.249298095703125, "global_step": 145369, "epoch": 1751} {"train_loss": -23.33820915222168, "global_step": 145370, "epoch": 1751} {"train_loss": -23.573301315307617, "global_step": 145371, "epoch": 1751} {"train_loss": -23.4008846282959, "global_step": 145372, "epoch": 1751} {"train_loss": -23.245113372802734, "global_step": 145373, "epoch": 1751} {"train_loss": -22.9898624420166, "global_step": 145374, "epoch": 1751} {"train_loss": -23.12931251525879, "global_step": 145375, "epoch": 1751} {"train_loss": -23.474380493164062, "global_step": 145376, "epoch": 1751} {"train_loss": -23.173492431640625, "global_step": 145377, "epoch": 1751} {"train_loss": -23.385221481323242, "global_step": 145378, "epoch": 1751} {"train_loss": -23.231311798095703, "global_step": 145379, "epoch": 1751} {"train_loss": -23.471532821655273, "global_step": 145380, "epoch": 1751} {"train_loss": -23.383230209350586, "global_step": 145381, "epoch": 1751} {"train_loss": -23.328393936157227, "global_step": 145382, "epoch": 1751} {"train_loss": -22.825849533081055, "global_step": 145383, "epoch": 1751} {"train_loss": -23.327646255493164, "global_step": 145384, "epoch": 1751} {"train_loss": -22.870351791381836, "global_step": 145385, "epoch": 1751} {"train_loss": -23.223495483398438, "global_step": 145386, "epoch": 1751} {"train_loss": -22.801822662353516, "global_step": 145387, "epoch": 1751} {"train_loss": -22.69065284729004, "global_step": 145388, "epoch": 1751} {"train_loss": -23.011884689331055, "global_step": 145389, "epoch": 1751} {"train_loss": -23.38695526123047, "global_step": 145390, "epoch": 1751} {"train_loss": -23.31849479675293, "global_step": 145391, "epoch": 1751} {"train_loss": -23.052663803100586, "global_step": 145392, "epoch": 1751} {"train_loss": -23.003915786743164, "global_step": 145393, "epoch": 1751} {"train_loss": -23.114177703857422, "global_step": 145394, "epoch": 1751} {"train_loss": -22.990205764770508, "global_step": 145395, "epoch": 1751} {"train_loss": -23.54560661315918, "global_step": 145396, "epoch": 1751} {"train_loss": -22.914112091064453, "global_step": 145397, "epoch": 1751} {"train_loss": -23.15906524658203, "global_step": 145398, "epoch": 1751} {"train_loss": -23.230634689331055, "global_step": 145399, "epoch": 1751} {"train_loss": -22.973644256591797, "global_step": 145400, "epoch": 1751} {"train_loss": -23.264860153198242, "global_step": 145401, "epoch": 1751} {"train_loss": -23.4168643951416, "global_step": 145402, "epoch": 1751} {"train_loss": -23.341007232666016, "global_step": 145403, "epoch": 1751} {"train_loss": -23.50705337524414, "global_step": 145404, "epoch": 1751} {"train_loss": -23.30600929260254, "global_step": 145405, "epoch": 1751} {"train_loss": -23.502948760986328, "global_step": 145406, "epoch": 1751} {"train_loss": -23.11537742614746, "global_step": 145407, "epoch": 1751} {"train_loss": -22.733484268188477, "global_step": 145408, "epoch": 1751} {"train_loss": -23.31334686279297, "global_step": 145409, "epoch": 1751} {"train_loss": -23.26691436767578, "global_step": 145410, "epoch": 1751} {"train_loss": -23.12025260925293, "global_step": 145411, "epoch": 1751} {"train_loss": -23.219606399536133, "global_step": 145412, "epoch": 1751} {"train_loss": -23.226198196411133, "global_step": 145413, "epoch": 1751} {"train_loss": -23.362232208251953, "global_step": 145414, "epoch": 1751} {"train_loss": -23.12473258052964, "global_step": 145415, "epoch": 1751, "val_loss": 6447477.0} {"train_loss": -22.940656661987305, "global_step": 145416, "epoch": 1752} {"train_loss": -22.7020206451416, "global_step": 145417, "epoch": 1752} {"train_loss": -22.321449279785156, "global_step": 145418, "epoch": 1752} {"train_loss": -22.02463150024414, "global_step": 145419, "epoch": 1752} {"train_loss": -22.071439743041992, "global_step": 145420, "epoch": 1752} {"train_loss": -22.833059310913086, "global_step": 145421, "epoch": 1752} {"train_loss": -22.086841583251953, "global_step": 145422, "epoch": 1752} {"train_loss": -22.46540641784668, "global_step": 145423, "epoch": 1752} {"train_loss": -22.46128273010254, "global_step": 145424, "epoch": 1752} {"train_loss": -22.164072036743164, "global_step": 145425, "epoch": 1752} {"train_loss": -22.794408798217773, "global_step": 145426, "epoch": 1752} {"train_loss": -22.077550888061523, "global_step": 145427, "epoch": 1752} {"train_loss": -22.5067195892334, "global_step": 145428, "epoch": 1752} {"train_loss": -22.13337516784668, "global_step": 145429, "epoch": 1752} {"train_loss": -22.73557472229004, "global_step": 145430, "epoch": 1752} {"train_loss": -22.53322410583496, "global_step": 145431, "epoch": 1752} {"train_loss": -22.92066192626953, "global_step": 145432, "epoch": 1752} {"train_loss": -22.867624282836914, "global_step": 145433, "epoch": 1752} {"train_loss": -22.673025131225586, "global_step": 145434, "epoch": 1752} {"train_loss": -22.8829402923584, "global_step": 145435, "epoch": 1752} {"train_loss": -22.71909523010254, "global_step": 145436, "epoch": 1752} {"train_loss": -22.96808433532715, "global_step": 145437, "epoch": 1752} {"train_loss": -22.921483993530273, "global_step": 145438, "epoch": 1752} {"train_loss": -22.78130340576172, "global_step": 145439, "epoch": 1752} {"train_loss": -22.955480575561523, "global_step": 145440, "epoch": 1752} {"train_loss": -22.726856231689453, "global_step": 145441, "epoch": 1752} {"train_loss": -23.090221405029297, "global_step": 145442, "epoch": 1752} {"train_loss": -22.892227172851562, "global_step": 145443, "epoch": 1752} {"train_loss": -22.976720809936523, "global_step": 145444, "epoch": 1752} {"train_loss": -23.043033599853516, "global_step": 145445, "epoch": 1752} {"train_loss": -23.141340255737305, "global_step": 145446, "epoch": 1752} {"train_loss": -23.48611831665039, "global_step": 145447, "epoch": 1752} {"train_loss": -23.115707397460938, "global_step": 145448, "epoch": 1752} {"train_loss": -22.884750366210938, "global_step": 145449, "epoch": 1752} {"train_loss": -23.05794334411621, "global_step": 145450, "epoch": 1752} {"train_loss": -22.7719783782959, "global_step": 145451, "epoch": 1752} {"train_loss": -23.06716537475586, "global_step": 145452, "epoch": 1752} {"train_loss": -23.437524795532227, "global_step": 145453, "epoch": 1752} {"train_loss": -22.99918556213379, "global_step": 145454, "epoch": 1752} {"train_loss": -23.30405044555664, "global_step": 145455, "epoch": 1752} {"train_loss": -23.122419357299805, "global_step": 145456, "epoch": 1752} {"train_loss": -23.0395565032959, "global_step": 145457, "epoch": 1752} {"train_loss": -22.96495246887207, "global_step": 145458, "epoch": 1752} {"train_loss": -23.069108963012695, "global_step": 145459, "epoch": 1752} {"train_loss": -23.002334594726562, "global_step": 145460, "epoch": 1752} {"train_loss": -23.144804000854492, "global_step": 145461, "epoch": 1752} {"train_loss": -23.41259765625, "global_step": 145462, "epoch": 1752} {"train_loss": -23.046096801757812, "global_step": 145463, "epoch": 1752} {"train_loss": -23.368854522705078, "global_step": 145464, "epoch": 1752} {"train_loss": -23.42017936706543, "global_step": 145465, "epoch": 1752} {"train_loss": -23.378995895385742, "global_step": 145466, "epoch": 1752} {"train_loss": -22.84499740600586, "global_step": 145467, "epoch": 1752} {"train_loss": -23.216161727905273, "global_step": 145468, "epoch": 1752} {"train_loss": -23.506031036376953, "global_step": 145469, "epoch": 1752} {"train_loss": -23.381765365600586, "global_step": 145470, "epoch": 1752} {"train_loss": -23.28858757019043, "global_step": 145471, "epoch": 1752} {"train_loss": -22.98284912109375, "global_step": 145472, "epoch": 1752} {"train_loss": -23.49962615966797, "global_step": 145473, "epoch": 1752} {"train_loss": -23.26255226135254, "global_step": 145474, "epoch": 1752} {"train_loss": -22.896045684814453, "global_step": 145475, "epoch": 1752} {"train_loss": -23.03036117553711, "global_step": 145476, "epoch": 1752} {"train_loss": -23.202327728271484, "global_step": 145477, "epoch": 1752} {"train_loss": -23.099218368530273, "global_step": 145478, "epoch": 1752} {"train_loss": -23.255619049072266, "global_step": 145479, "epoch": 1752} {"train_loss": -22.983877182006836, "global_step": 145480, "epoch": 1752} {"train_loss": -23.313215255737305, "global_step": 145481, "epoch": 1752} {"train_loss": -23.31873893737793, "global_step": 145482, "epoch": 1752} {"train_loss": -22.61604118347168, "global_step": 145483, "epoch": 1752} {"train_loss": -23.094711303710938, "global_step": 145484, "epoch": 1752} {"train_loss": -23.428466796875, "global_step": 145485, "epoch": 1752} {"train_loss": -22.94789695739746, "global_step": 145486, "epoch": 1752} {"train_loss": -22.753904342651367, "global_step": 145487, "epoch": 1752} {"train_loss": -22.962839126586914, "global_step": 145488, "epoch": 1752} {"train_loss": -22.97334861755371, "global_step": 145489, "epoch": 1752} {"train_loss": -22.938093185424805, "global_step": 145490, "epoch": 1752} {"train_loss": -22.815519332885742, "global_step": 145491, "epoch": 1752} {"train_loss": -23.157955169677734, "global_step": 145492, "epoch": 1752} {"train_loss": -23.385587692260742, "global_step": 145493, "epoch": 1752} {"train_loss": -23.16451644897461, "global_step": 145494, "epoch": 1752} {"train_loss": -22.801021575927734, "global_step": 145495, "epoch": 1752} {"train_loss": -23.24910545349121, "global_step": 145496, "epoch": 1752} {"train_loss": -23.38210105895996, "global_step": 145497, "epoch": 1752} {"train_loss": -22.96304583262248, "global_step": 145498, "epoch": 1752, "val_loss": 6519854.0} {"train_loss": -22.715259552001953, "global_step": 145499, "epoch": 1753} {"train_loss": -22.796201705932617, "global_step": 145500, "epoch": 1753} {"train_loss": -22.753711700439453, "global_step": 145501, "epoch": 1753} {"train_loss": -22.93320083618164, "global_step": 145502, "epoch": 1753} {"train_loss": -22.983549118041992, "global_step": 145503, "epoch": 1753} {"train_loss": -22.82659912109375, "global_step": 145504, "epoch": 1753} {"train_loss": -22.998340606689453, "global_step": 145505, "epoch": 1753} {"train_loss": -23.38603401184082, "global_step": 145506, "epoch": 1753} {"train_loss": -22.802030563354492, "global_step": 145507, "epoch": 1753} {"train_loss": -23.262731552124023, "global_step": 145508, "epoch": 1753} {"train_loss": -23.049192428588867, "global_step": 145509, "epoch": 1753} {"train_loss": -23.064613342285156, "global_step": 145510, "epoch": 1753} {"train_loss": -23.192317962646484, "global_step": 145511, "epoch": 1753} {"train_loss": -22.736352920532227, "global_step": 145512, "epoch": 1753} {"train_loss": -23.36953353881836, "global_step": 145513, "epoch": 1753} {"train_loss": -23.15705108642578, "global_step": 145514, "epoch": 1753} {"train_loss": -23.06878662109375, "global_step": 145515, "epoch": 1753} {"train_loss": -23.219724655151367, "global_step": 145516, "epoch": 1753} {"train_loss": -22.963790893554688, "global_step": 145517, "epoch": 1753} {"train_loss": -23.27640151977539, "global_step": 145518, "epoch": 1753} {"train_loss": -23.172183990478516, "global_step": 145519, "epoch": 1753} {"train_loss": -23.2205867767334, "global_step": 145520, "epoch": 1753} {"train_loss": -23.095600128173828, "global_step": 145521, "epoch": 1753} {"train_loss": -23.33314323425293, "global_step": 145522, "epoch": 1753} {"train_loss": -23.072696685791016, "global_step": 145523, "epoch": 1753} {"train_loss": -23.300167083740234, "global_step": 145524, "epoch": 1753} {"train_loss": -23.2242488861084, "global_step": 145525, "epoch": 1753} {"train_loss": -23.235952377319336, "global_step": 145526, "epoch": 1753} {"train_loss": -23.28559684753418, "global_step": 145527, "epoch": 1753} {"train_loss": -23.235811233520508, "global_step": 145528, "epoch": 1753} {"train_loss": -23.394691467285156, "global_step": 145529, "epoch": 1753} {"train_loss": -23.27155876159668, "global_step": 145530, "epoch": 1753} {"train_loss": -22.933780670166016, "global_step": 145531, "epoch": 1753} {"train_loss": -23.119754791259766, "global_step": 145532, "epoch": 1753} {"train_loss": -23.121423721313477, "global_step": 145533, "epoch": 1753} {"train_loss": -23.2545223236084, "global_step": 145534, "epoch": 1753} {"train_loss": -23.454923629760742, "global_step": 145535, "epoch": 1753} {"train_loss": -23.16806983947754, "global_step": 145536, "epoch": 1753} {"train_loss": -23.142831802368164, "global_step": 145537, "epoch": 1753} {"train_loss": -23.263090133666992, "global_step": 145538, "epoch": 1753} {"train_loss": -23.206418991088867, "global_step": 145539, "epoch": 1753} {"train_loss": -23.242881774902344, "global_step": 145540, "epoch": 1753} {"train_loss": -23.326688766479492, "global_step": 145541, "epoch": 1753} {"train_loss": -23.210847854614258, "global_step": 145542, "epoch": 1753} {"train_loss": -23.320100784301758, "global_step": 145543, "epoch": 1753} {"train_loss": -23.32037925720215, "global_step": 145544, "epoch": 1753} {"train_loss": -23.167510986328125, "global_step": 145545, "epoch": 1753} {"train_loss": -23.43035888671875, "global_step": 145546, "epoch": 1753} {"train_loss": -23.090301513671875, "global_step": 145547, "epoch": 1753} {"train_loss": -23.160844802856445, "global_step": 145548, "epoch": 1753} {"train_loss": -23.14480209350586, "global_step": 145549, "epoch": 1753} {"train_loss": -23.216144561767578, "global_step": 145550, "epoch": 1753} {"train_loss": -23.05556297302246, "global_step": 145551, "epoch": 1753} {"train_loss": -23.480823516845703, "global_step": 145552, "epoch": 1753} {"train_loss": -22.97401237487793, "global_step": 145553, "epoch": 1753} {"train_loss": -23.17280387878418, "global_step": 145554, "epoch": 1753} {"train_loss": -23.009841918945312, "global_step": 145555, "epoch": 1753} {"train_loss": -23.02876091003418, "global_step": 145556, "epoch": 1753} {"train_loss": -23.286813735961914, "global_step": 145557, "epoch": 1753} {"train_loss": -23.346261978149414, "global_step": 145558, "epoch": 1753} {"train_loss": -23.02374267578125, "global_step": 145559, "epoch": 1753} {"train_loss": -23.339458465576172, "global_step": 145560, "epoch": 1753} {"train_loss": -23.178054809570312, "global_step": 145561, "epoch": 1753} {"train_loss": -23.356372833251953, "global_step": 145562, "epoch": 1753} {"train_loss": -22.88727378845215, "global_step": 145563, "epoch": 1753} {"train_loss": -23.827497482299805, "global_step": 145564, "epoch": 1753} {"train_loss": -23.106733322143555, "global_step": 145565, "epoch": 1753} {"train_loss": -23.511655807495117, "global_step": 145566, "epoch": 1753} {"train_loss": -23.433250427246094, "global_step": 145567, "epoch": 1753} {"train_loss": -23.32254409790039, "global_step": 145568, "epoch": 1753} {"train_loss": -23.57871437072754, "global_step": 145569, "epoch": 1753} {"train_loss": -23.297943115234375, "global_step": 145570, "epoch": 1753} {"train_loss": -23.522371292114258, "global_step": 145571, "epoch": 1753} {"train_loss": -22.988637924194336, "global_step": 145572, "epoch": 1753} {"train_loss": -23.35187530517578, "global_step": 145573, "epoch": 1753} {"train_loss": -23.436460494995117, "global_step": 145574, "epoch": 1753} {"train_loss": -23.107585906982422, "global_step": 145575, "epoch": 1753} {"train_loss": -23.084104537963867, "global_step": 145576, "epoch": 1753} {"train_loss": -23.304460525512695, "global_step": 145577, "epoch": 1753} {"train_loss": -22.948144912719727, "global_step": 145578, "epoch": 1753} {"train_loss": -23.368297576904297, "global_step": 145579, "epoch": 1753} {"train_loss": -23.377534866333008, "global_step": 145580, "epoch": 1753} {"train_loss": -23.189144846904707, "global_step": 145581, "epoch": 1753, "val_loss": 6280999.0} {"train_loss": -22.879871368408203, "global_step": 145582, "epoch": 1754} {"train_loss": -22.803285598754883, "global_step": 145583, "epoch": 1754} {"train_loss": -22.37921905517578, "global_step": 145584, "epoch": 1754} {"train_loss": -23.181615829467773, "global_step": 145585, "epoch": 1754} {"train_loss": -22.9903621673584, "global_step": 145586, "epoch": 1754} {"train_loss": -22.959278106689453, "global_step": 145587, "epoch": 1754} {"train_loss": -22.871845245361328, "global_step": 145588, "epoch": 1754} {"train_loss": -23.238346099853516, "global_step": 145589, "epoch": 1754} {"train_loss": -22.787229537963867, "global_step": 145590, "epoch": 1754} {"train_loss": -22.72811508178711, "global_step": 145591, "epoch": 1754} {"train_loss": -23.2730655670166, "global_step": 145592, "epoch": 1754} {"train_loss": -23.00179672241211, "global_step": 145593, "epoch": 1754} {"train_loss": -23.41354751586914, "global_step": 145594, "epoch": 1754} {"train_loss": -23.032278060913086, "global_step": 145595, "epoch": 1754} {"train_loss": -23.074281692504883, "global_step": 145596, "epoch": 1754} {"train_loss": -23.262508392333984, "global_step": 145597, "epoch": 1754} {"train_loss": -22.848125457763672, "global_step": 145598, "epoch": 1754} {"train_loss": -23.08146858215332, "global_step": 145599, "epoch": 1754} {"train_loss": -23.34612274169922, "global_step": 145600, "epoch": 1754} {"train_loss": -23.03206443786621, "global_step": 145601, "epoch": 1754} {"train_loss": -23.101354598999023, "global_step": 145602, "epoch": 1754} {"train_loss": -23.049962997436523, "global_step": 145603, "epoch": 1754} {"train_loss": -23.40276527404785, "global_step": 145604, "epoch": 1754} {"train_loss": -22.977806091308594, "global_step": 145605, "epoch": 1754} {"train_loss": -22.837574005126953, "global_step": 145606, "epoch": 1754} {"train_loss": -23.184452056884766, "global_step": 145607, "epoch": 1754} {"train_loss": -22.76602554321289, "global_step": 145608, "epoch": 1754} {"train_loss": -22.684782028198242, "global_step": 145609, "epoch": 1754} {"train_loss": -23.071212768554688, "global_step": 145610, "epoch": 1754} {"train_loss": -22.824373245239258, "global_step": 145611, "epoch": 1754} {"train_loss": -23.37705421447754, "global_step": 145612, "epoch": 1754} {"train_loss": -23.282312393188477, "global_step": 145613, "epoch": 1754} {"train_loss": -23.21357536315918, "global_step": 145614, "epoch": 1754} {"train_loss": -23.12801170349121, "global_step": 145615, "epoch": 1754} {"train_loss": -23.252573013305664, "global_step": 145616, "epoch": 1754} {"train_loss": -23.098529815673828, "global_step": 145617, "epoch": 1754} {"train_loss": -23.3836727142334, "global_step": 145618, "epoch": 1754} {"train_loss": -22.816204071044922, "global_step": 145619, "epoch": 1754} {"train_loss": -22.87057876586914, "global_step": 145620, "epoch": 1754} {"train_loss": -23.092422485351562, "global_step": 145621, "epoch": 1754} {"train_loss": -23.766996383666992, "global_step": 145622, "epoch": 1754} {"train_loss": -22.487201690673828, "global_step": 145623, "epoch": 1754} {"train_loss": -23.171308517456055, "global_step": 145624, "epoch": 1754} {"train_loss": -23.25168228149414, "global_step": 145625, "epoch": 1754} {"train_loss": -23.18902587890625, "global_step": 145626, "epoch": 1754} {"train_loss": -23.11771583557129, "global_step": 145627, "epoch": 1754} {"train_loss": -22.9631404876709, "global_step": 145628, "epoch": 1754} {"train_loss": -23.11139488220215, "global_step": 145629, "epoch": 1754} {"train_loss": -23.04074478149414, "global_step": 145630, "epoch": 1754} {"train_loss": -23.061508178710938, "global_step": 145631, "epoch": 1754} {"train_loss": -22.97307014465332, "global_step": 145632, "epoch": 1754} {"train_loss": -22.654516220092773, "global_step": 145633, "epoch": 1754} {"train_loss": -23.059307098388672, "global_step": 145634, "epoch": 1754} {"train_loss": -23.203657150268555, "global_step": 145635, "epoch": 1754} {"train_loss": -23.008934020996094, "global_step": 145636, "epoch": 1754} {"train_loss": -23.01311683654785, "global_step": 145637, "epoch": 1754} {"train_loss": -23.503828048706055, "global_step": 145638, "epoch": 1754} {"train_loss": -22.398731231689453, "global_step": 145639, "epoch": 1754} {"train_loss": -23.34140968322754, "global_step": 145640, "epoch": 1754} {"train_loss": -22.713455200195312, "global_step": 145641, "epoch": 1754} {"train_loss": -23.57267189025879, "global_step": 145642, "epoch": 1754} {"train_loss": -23.036102294921875, "global_step": 145643, "epoch": 1754} {"train_loss": -22.900802612304688, "global_step": 145644, "epoch": 1754} {"train_loss": -23.179868698120117, "global_step": 145645, "epoch": 1754} {"train_loss": -23.728883743286133, "global_step": 145646, "epoch": 1754} {"train_loss": -22.630563735961914, "global_step": 145647, "epoch": 1754} {"train_loss": -23.07646942138672, "global_step": 145648, "epoch": 1754} {"train_loss": -23.10011100769043, "global_step": 145649, "epoch": 1754} {"train_loss": -23.169265747070312, "global_step": 145650, "epoch": 1754} {"train_loss": -22.97491455078125, "global_step": 145651, "epoch": 1754} {"train_loss": -23.236892700195312, "global_step": 145652, "epoch": 1754} {"train_loss": -22.83921241760254, "global_step": 145653, "epoch": 1754} {"train_loss": -23.24285888671875, "global_step": 145654, "epoch": 1754} {"train_loss": -23.015308380126953, "global_step": 145655, "epoch": 1754} {"train_loss": -23.08754539489746, "global_step": 145656, "epoch": 1754} {"train_loss": -22.93877601623535, "global_step": 145657, "epoch": 1754} {"train_loss": -22.98073959350586, "global_step": 145658, "epoch": 1754} {"train_loss": -22.759191513061523, "global_step": 145659, "epoch": 1754} {"train_loss": -23.150110244750977, "global_step": 145660, "epoch": 1754} {"train_loss": -23.15959358215332, "global_step": 145661, "epoch": 1754} {"train_loss": -23.17482566833496, "global_step": 145662, "epoch": 1754} {"train_loss": -23.128772735595703, "global_step": 145663, "epoch": 1754} {"train_loss": -23.056056034134095, "global_step": 145664, "epoch": 1754, "val_loss": 6328814.0} {"train_loss": -22.980770111083984, "global_step": 145665, "epoch": 1755} {"train_loss": -23.013151168823242, "global_step": 145666, "epoch": 1755} {"train_loss": -22.689579010009766, "global_step": 145667, "epoch": 1755} {"train_loss": -23.266828536987305, "global_step": 145668, "epoch": 1755} {"train_loss": -22.930810928344727, "global_step": 145669, "epoch": 1755} {"train_loss": -23.191877365112305, "global_step": 145670, "epoch": 1755} {"train_loss": -23.20338249206543, "global_step": 145671, "epoch": 1755} {"train_loss": -23.03434181213379, "global_step": 145672, "epoch": 1755} {"train_loss": -23.136077880859375, "global_step": 145673, "epoch": 1755} {"train_loss": -23.201387405395508, "global_step": 145674, "epoch": 1755} {"train_loss": -23.26972007751465, "global_step": 145675, "epoch": 1755} {"train_loss": -23.126758575439453, "global_step": 145676, "epoch": 1755} {"train_loss": -23.33827018737793, "global_step": 145677, "epoch": 1755} {"train_loss": -23.518278121948242, "global_step": 145678, "epoch": 1755} {"train_loss": -23.172468185424805, "global_step": 145679, "epoch": 1755} {"train_loss": -23.282270431518555, "global_step": 145680, "epoch": 1755} {"train_loss": -23.06477165222168, "global_step": 145681, "epoch": 1755} {"train_loss": -23.242658615112305, "global_step": 145682, "epoch": 1755} {"train_loss": -23.3138427734375, "global_step": 145683, "epoch": 1755} {"train_loss": -23.019134521484375, "global_step": 145684, "epoch": 1755} {"train_loss": -23.16908073425293, "global_step": 145685, "epoch": 1755} {"train_loss": -23.372121810913086, "global_step": 145686, "epoch": 1755} {"train_loss": -23.39695167541504, "global_step": 145687, "epoch": 1755} {"train_loss": -23.028974533081055, "global_step": 145688, "epoch": 1755} {"train_loss": -23.044357299804688, "global_step": 145689, "epoch": 1755} {"train_loss": -23.1306095123291, "global_step": 145690, "epoch": 1755} {"train_loss": -23.536869049072266, "global_step": 145691, "epoch": 1755} {"train_loss": -22.832670211791992, "global_step": 145692, "epoch": 1755} {"train_loss": -23.131132125854492, "global_step": 145693, "epoch": 1755} {"train_loss": -23.344953536987305, "global_step": 145694, "epoch": 1755} {"train_loss": -23.43402099609375, "global_step": 145695, "epoch": 1755} {"train_loss": -23.349674224853516, "global_step": 145696, "epoch": 1755} {"train_loss": -23.125465393066406, "global_step": 145697, "epoch": 1755} {"train_loss": -23.3946533203125, "global_step": 145698, "epoch": 1755} {"train_loss": -22.89249038696289, "global_step": 145699, "epoch": 1755} {"train_loss": -23.390716552734375, "global_step": 145700, "epoch": 1755} {"train_loss": -23.22629165649414, "global_step": 145701, "epoch": 1755} {"train_loss": -23.018280029296875, "global_step": 145702, "epoch": 1755} {"train_loss": -22.82177734375, "global_step": 145703, "epoch": 1755} {"train_loss": -23.608198165893555, "global_step": 145704, "epoch": 1755} {"train_loss": -23.162033081054688, "global_step": 145705, "epoch": 1755} {"train_loss": -23.144760131835938, "global_step": 145706, "epoch": 1755} {"train_loss": -22.651348114013672, "global_step": 145707, "epoch": 1755} {"train_loss": -23.27452850341797, "global_step": 145708, "epoch": 1755} {"train_loss": -23.335729598999023, "global_step": 145709, "epoch": 1755} {"train_loss": -22.945697784423828, "global_step": 145710, "epoch": 1755} {"train_loss": -23.04073143005371, "global_step": 145711, "epoch": 1755} {"train_loss": -23.09193229675293, "global_step": 145712, "epoch": 1755} {"train_loss": -23.0496826171875, "global_step": 145713, "epoch": 1755} {"train_loss": -22.703903198242188, "global_step": 145714, "epoch": 1755} {"train_loss": -23.53714942932129, "global_step": 145715, "epoch": 1755} {"train_loss": -22.98015594482422, "global_step": 145716, "epoch": 1755} {"train_loss": -23.12497901916504, "global_step": 145717, "epoch": 1755} {"train_loss": -23.13693618774414, "global_step": 145718, "epoch": 1755} {"train_loss": -23.015722274780273, "global_step": 145719, "epoch": 1755} {"train_loss": -23.190444946289062, "global_step": 145720, "epoch": 1755} {"train_loss": -22.84992027282715, "global_step": 145721, "epoch": 1755} {"train_loss": -23.25294303894043, "global_step": 145722, "epoch": 1755} {"train_loss": -22.6540584564209, "global_step": 145723, "epoch": 1755} {"train_loss": -23.420181274414062, "global_step": 145724, "epoch": 1755} {"train_loss": -22.959299087524414, "global_step": 145725, "epoch": 1755} {"train_loss": -23.022180557250977, "global_step": 145726, "epoch": 1755} {"train_loss": -22.874649047851562, "global_step": 145727, "epoch": 1755} {"train_loss": -23.3925838470459, "global_step": 145728, "epoch": 1755} {"train_loss": -23.085987091064453, "global_step": 145729, "epoch": 1755} {"train_loss": -22.89200782775879, "global_step": 145730, "epoch": 1755} {"train_loss": -23.351808547973633, "global_step": 145731, "epoch": 1755} {"train_loss": -23.0311336517334, "global_step": 145732, "epoch": 1755} {"train_loss": -23.72955894470215, "global_step": 145733, "epoch": 1755} {"train_loss": -23.19811248779297, "global_step": 145734, "epoch": 1755} {"train_loss": -23.352705001831055, "global_step": 145735, "epoch": 1755} {"train_loss": -23.25103759765625, "global_step": 145736, "epoch": 1755} {"train_loss": -23.086523056030273, "global_step": 145737, "epoch": 1755} {"train_loss": -23.53071403503418, "global_step": 145738, "epoch": 1755} {"train_loss": -23.280675888061523, "global_step": 145739, "epoch": 1755} {"train_loss": -22.97909164428711, "global_step": 145740, "epoch": 1755} {"train_loss": -23.346960067749023, "global_step": 145741, "epoch": 1755} {"train_loss": -23.391881942749023, "global_step": 145742, "epoch": 1755} {"train_loss": -23.399066925048828, "global_step": 145743, "epoch": 1755} {"train_loss": -23.026979446411133, "global_step": 145744, "epoch": 1755} {"train_loss": -23.23103904724121, "global_step": 145745, "epoch": 1755} {"train_loss": -23.140317916870117, "global_step": 145746, "epoch": 1755} {"train_loss": -23.176807127803205, "global_step": 145747, "epoch": 1755, "val_loss": 6342607.5} {"train_loss": -22.742938995361328, "global_step": 145748, "epoch": 1756} {"train_loss": -22.657852172851562, "global_step": 145749, "epoch": 1756} {"train_loss": -23.066373825073242, "global_step": 145750, "epoch": 1756} {"train_loss": -22.80545997619629, "global_step": 145751, "epoch": 1756} {"train_loss": -23.275543212890625, "global_step": 145752, "epoch": 1756} {"train_loss": -22.927488327026367, "global_step": 145753, "epoch": 1756} {"train_loss": -23.035768508911133, "global_step": 145754, "epoch": 1756} {"train_loss": -23.309890747070312, "global_step": 145755, "epoch": 1756} {"train_loss": -22.987083435058594, "global_step": 145756, "epoch": 1756} {"train_loss": -22.986629486083984, "global_step": 145757, "epoch": 1756} {"train_loss": -23.075618743896484, "global_step": 145758, "epoch": 1756} {"train_loss": -22.70759391784668, "global_step": 145759, "epoch": 1756} {"train_loss": -22.970979690551758, "global_step": 145760, "epoch": 1756} {"train_loss": -22.911489486694336, "global_step": 145761, "epoch": 1756} {"train_loss": -22.91962242126465, "global_step": 145762, "epoch": 1756} {"train_loss": -22.97330093383789, "global_step": 145763, "epoch": 1756} {"train_loss": -23.279804229736328, "global_step": 145764, "epoch": 1756} {"train_loss": -22.99333953857422, "global_step": 145765, "epoch": 1756} {"train_loss": -23.08233070373535, "global_step": 145766, "epoch": 1756} {"train_loss": -23.28213119506836, "global_step": 145767, "epoch": 1756} {"train_loss": -23.106658935546875, "global_step": 145768, "epoch": 1756} {"train_loss": -23.123437881469727, "global_step": 145769, "epoch": 1756} {"train_loss": -22.759084701538086, "global_step": 145770, "epoch": 1756} {"train_loss": -23.032297134399414, "global_step": 145771, "epoch": 1756} {"train_loss": -23.244504928588867, "global_step": 145772, "epoch": 1756} {"train_loss": -22.974262237548828, "global_step": 145773, "epoch": 1756} {"train_loss": -23.3166446685791, "global_step": 145774, "epoch": 1756} {"train_loss": -22.898679733276367, "global_step": 145775, "epoch": 1756} {"train_loss": -23.188873291015625, "global_step": 145776, "epoch": 1756} {"train_loss": -23.094409942626953, "global_step": 145777, "epoch": 1756} {"train_loss": -23.459598541259766, "global_step": 145778, "epoch": 1756} {"train_loss": -23.48829460144043, "global_step": 145779, "epoch": 1756} {"train_loss": -23.2257022857666, "global_step": 145780, "epoch": 1756} {"train_loss": -23.093210220336914, "global_step": 145781, "epoch": 1756} {"train_loss": -23.301498413085938, "global_step": 145782, "epoch": 1756} {"train_loss": -22.941205978393555, "global_step": 145783, "epoch": 1756} {"train_loss": -23.45357322692871, "global_step": 145784, "epoch": 1756} {"train_loss": -23.1822566986084, "global_step": 145785, "epoch": 1756} {"train_loss": -22.623929977416992, "global_step": 145786, "epoch": 1756} {"train_loss": -22.918930053710938, "global_step": 145787, "epoch": 1756} {"train_loss": -22.9340763092041, "global_step": 145788, "epoch": 1756} {"train_loss": -23.221256256103516, "global_step": 145789, "epoch": 1756} {"train_loss": -23.210357666015625, "global_step": 145790, "epoch": 1756} {"train_loss": -23.086410522460938, "global_step": 145791, "epoch": 1756} {"train_loss": -23.324485778808594, "global_step": 145792, "epoch": 1756} {"train_loss": -23.02470588684082, "global_step": 145793, "epoch": 1756} {"train_loss": -22.88646125793457, "global_step": 145794, "epoch": 1756} {"train_loss": -23.492490768432617, "global_step": 145795, "epoch": 1756} {"train_loss": -23.255725860595703, "global_step": 145796, "epoch": 1756} {"train_loss": -23.445720672607422, "global_step": 145797, "epoch": 1756} {"train_loss": -22.901241302490234, "global_step": 145798, "epoch": 1756} {"train_loss": -23.14044761657715, "global_step": 145799, "epoch": 1756} {"train_loss": -23.538206100463867, "global_step": 145800, "epoch": 1756} {"train_loss": -22.793949127197266, "global_step": 145801, "epoch": 1756} {"train_loss": -23.38287353515625, "global_step": 145802, "epoch": 1756} {"train_loss": -23.077274322509766, "global_step": 145803, "epoch": 1756} {"train_loss": -23.288883209228516, "global_step": 145804, "epoch": 1756} {"train_loss": -23.52908706665039, "global_step": 145805, "epoch": 1756} {"train_loss": -23.070791244506836, "global_step": 145806, "epoch": 1756} {"train_loss": -23.10379981994629, "global_step": 145807, "epoch": 1756} {"train_loss": -23.188621520996094, "global_step": 145808, "epoch": 1756} {"train_loss": -23.128620147705078, "global_step": 145809, "epoch": 1756} {"train_loss": -23.443429946899414, "global_step": 145810, "epoch": 1756} {"train_loss": -23.180505752563477, "global_step": 145811, "epoch": 1756} {"train_loss": -23.094587326049805, "global_step": 145812, "epoch": 1756} {"train_loss": -23.160900115966797, "global_step": 145813, "epoch": 1756} {"train_loss": -23.179880142211914, "global_step": 145814, "epoch": 1756} {"train_loss": -23.20125389099121, "global_step": 145815, "epoch": 1756} {"train_loss": -23.391845703125, "global_step": 145816, "epoch": 1756} {"train_loss": -23.275407791137695, "global_step": 145817, "epoch": 1756} {"train_loss": -23.427167892456055, "global_step": 145818, "epoch": 1756} {"train_loss": -23.185461044311523, "global_step": 145819, "epoch": 1756} {"train_loss": -23.084993362426758, "global_step": 145820, "epoch": 1756} {"train_loss": -22.883169174194336, "global_step": 145821, "epoch": 1756} {"train_loss": -22.948286056518555, "global_step": 145822, "epoch": 1756} {"train_loss": -23.28318214416504, "global_step": 145823, "epoch": 1756} {"train_loss": -23.17516326904297, "global_step": 145824, "epoch": 1756} {"train_loss": -23.286828994750977, "global_step": 145825, "epoch": 1756} {"train_loss": -23.153846740722656, "global_step": 145826, "epoch": 1756} {"train_loss": -23.34280776977539, "global_step": 145827, "epoch": 1756} {"train_loss": -23.468761444091797, "global_step": 145828, "epoch": 1756} {"train_loss": -23.19957160949707, "global_step": 145829, "epoch": 1756} {"train_loss": -23.133830219866283, "global_step": 145830, "epoch": 1756, "val_loss": 6214233.5} {"train_loss": -23.184829711914062, "global_step": 145831, "epoch": 1757} {"train_loss": -23.14496421813965, "global_step": 145832, "epoch": 1757} {"train_loss": -22.687942504882812, "global_step": 145833, "epoch": 1757} {"train_loss": -22.887449264526367, "global_step": 145834, "epoch": 1757} {"train_loss": -22.795339584350586, "global_step": 145835, "epoch": 1757} {"train_loss": -23.154315948486328, "global_step": 145836, "epoch": 1757} {"train_loss": -23.351806640625, "global_step": 145837, "epoch": 1757} {"train_loss": -22.98554039001465, "global_step": 145838, "epoch": 1757} {"train_loss": -23.208457946777344, "global_step": 145839, "epoch": 1757} {"train_loss": -23.034088134765625, "global_step": 145840, "epoch": 1757} {"train_loss": -23.072782516479492, "global_step": 145841, "epoch": 1757} {"train_loss": -22.9644718170166, "global_step": 145842, "epoch": 1757} {"train_loss": -23.47115707397461, "global_step": 145843, "epoch": 1757} {"train_loss": -23.077129364013672, "global_step": 145844, "epoch": 1757} {"train_loss": -23.127817153930664, "global_step": 145845, "epoch": 1757} {"train_loss": -22.915830612182617, "global_step": 145846, "epoch": 1757} {"train_loss": -23.076629638671875, "global_step": 145847, "epoch": 1757} {"train_loss": -23.297983169555664, "global_step": 145848, "epoch": 1757} {"train_loss": -23.511465072631836, "global_step": 145849, "epoch": 1757} {"train_loss": -23.158971786499023, "global_step": 145850, "epoch": 1757} {"train_loss": -23.217802047729492, "global_step": 145851, "epoch": 1757} {"train_loss": -22.993505477905273, "global_step": 145852, "epoch": 1757} {"train_loss": -23.52954864501953, "global_step": 145853, "epoch": 1757} {"train_loss": -23.46407127380371, "global_step": 145854, "epoch": 1757} {"train_loss": -23.32769203186035, "global_step": 145855, "epoch": 1757} {"train_loss": -23.104665756225586, "global_step": 145856, "epoch": 1757} {"train_loss": -22.794803619384766, "global_step": 145857, "epoch": 1757} {"train_loss": -23.082887649536133, "global_step": 145858, "epoch": 1757} {"train_loss": -23.101736068725586, "global_step": 145859, "epoch": 1757} {"train_loss": -23.447256088256836, "global_step": 145860, "epoch": 1757} {"train_loss": -22.992359161376953, "global_step": 145861, "epoch": 1757} {"train_loss": -23.089075088500977, "global_step": 145862, "epoch": 1757} {"train_loss": -23.31821632385254, "global_step": 145863, "epoch": 1757} {"train_loss": -23.215438842773438, "global_step": 145864, "epoch": 1757} {"train_loss": -22.919795989990234, "global_step": 145865, "epoch": 1757} {"train_loss": -23.295339584350586, "global_step": 145866, "epoch": 1757} {"train_loss": -23.3175048828125, "global_step": 145867, "epoch": 1757} {"train_loss": -23.23544692993164, "global_step": 145868, "epoch": 1757} {"train_loss": -23.043821334838867, "global_step": 145869, "epoch": 1757} {"train_loss": -22.980316162109375, "global_step": 145870, "epoch": 1757} {"train_loss": -23.47819709777832, "global_step": 145871, "epoch": 1757} {"train_loss": -23.313308715820312, "global_step": 145872, "epoch": 1757} {"train_loss": -23.355764389038086, "global_step": 145873, "epoch": 1757} {"train_loss": -22.86347770690918, "global_step": 145874, "epoch": 1757} {"train_loss": -23.367904663085938, "global_step": 145875, "epoch": 1757} {"train_loss": -23.36121940612793, "global_step": 145876, "epoch": 1757} {"train_loss": -23.31276512145996, "global_step": 145877, "epoch": 1757} {"train_loss": -23.07535171508789, "global_step": 145878, "epoch": 1757} {"train_loss": -23.297611236572266, "global_step": 145879, "epoch": 1757} {"train_loss": -23.355484008789062, "global_step": 145880, "epoch": 1757} {"train_loss": -23.055143356323242, "global_step": 145881, "epoch": 1757} {"train_loss": -23.301321029663086, "global_step": 145882, "epoch": 1757} {"train_loss": -23.38633918762207, "global_step": 145883, "epoch": 1757} {"train_loss": -23.260583877563477, "global_step": 145884, "epoch": 1757} {"train_loss": -23.25995445251465, "global_step": 145885, "epoch": 1757} {"train_loss": -23.381032943725586, "global_step": 145886, "epoch": 1757} {"train_loss": -22.68107795715332, "global_step": 145887, "epoch": 1757} {"train_loss": -23.132980346679688, "global_step": 145888, "epoch": 1757} {"train_loss": -23.113418579101562, "global_step": 145889, "epoch": 1757} {"train_loss": -23.12882423400879, "global_step": 145890, "epoch": 1757} {"train_loss": -23.498071670532227, "global_step": 145891, "epoch": 1757} {"train_loss": -23.294565200805664, "global_step": 145892, "epoch": 1757} {"train_loss": -23.49403190612793, "global_step": 145893, "epoch": 1757} {"train_loss": -23.521421432495117, "global_step": 145894, "epoch": 1757} {"train_loss": -23.330717086791992, "global_step": 145895, "epoch": 1757} {"train_loss": -23.5374698638916, "global_step": 145896, "epoch": 1757} {"train_loss": -23.178068161010742, "global_step": 145897, "epoch": 1757} {"train_loss": -23.505691528320312, "global_step": 145898, "epoch": 1757} {"train_loss": -23.309595108032227, "global_step": 145899, "epoch": 1757} {"train_loss": -22.739179611206055, "global_step": 145900, "epoch": 1757} {"train_loss": -23.067262649536133, "global_step": 145901, "epoch": 1757} {"train_loss": -23.316253662109375, "global_step": 145902, "epoch": 1757} {"train_loss": -22.8487606048584, "global_step": 145903, "epoch": 1757} {"train_loss": -23.09494400024414, "global_step": 145904, "epoch": 1757} {"train_loss": -23.36911392211914, "global_step": 145905, "epoch": 1757} {"train_loss": -23.106454849243164, "global_step": 145906, "epoch": 1757} {"train_loss": -23.514047622680664, "global_step": 145907, "epoch": 1757} {"train_loss": -23.349700927734375, "global_step": 145908, "epoch": 1757} {"train_loss": -23.13225746154785, "global_step": 145909, "epoch": 1757} {"train_loss": -22.965932846069336, "global_step": 145910, "epoch": 1757} {"train_loss": -23.290727615356445, "global_step": 145911, "epoch": 1757} {"train_loss": -23.22212791442871, "global_step": 145912, "epoch": 1757} {"train_loss": -23.214166939976703, "global_step": 145913, "epoch": 1757, "val_loss": 6386734.0} {"train_loss": -22.671674728393555, "global_step": 145914, "epoch": 1758} {"train_loss": -22.506147384643555, "global_step": 145915, "epoch": 1758} {"train_loss": -22.602041244506836, "global_step": 145916, "epoch": 1758} {"train_loss": -22.544963836669922, "global_step": 145917, "epoch": 1758} {"train_loss": -22.276058197021484, "global_step": 145918, "epoch": 1758} {"train_loss": -23.034603118896484, "global_step": 145919, "epoch": 1758} {"train_loss": -23.10030174255371, "global_step": 145920, "epoch": 1758} {"train_loss": -23.02178192138672, "global_step": 145921, "epoch": 1758} {"train_loss": -22.98219871520996, "global_step": 145922, "epoch": 1758} {"train_loss": -23.106464385986328, "global_step": 145923, "epoch": 1758} {"train_loss": -23.0108699798584, "global_step": 145924, "epoch": 1758} {"train_loss": -23.04496192932129, "global_step": 145925, "epoch": 1758} {"train_loss": -22.980093002319336, "global_step": 145926, "epoch": 1758} {"train_loss": -23.139232635498047, "global_step": 145927, "epoch": 1758} {"train_loss": -22.635244369506836, "global_step": 145928, "epoch": 1758} {"train_loss": -23.040016174316406, "global_step": 145929, "epoch": 1758} {"train_loss": -22.994491577148438, "global_step": 145930, "epoch": 1758} {"train_loss": -23.086624145507812, "global_step": 145931, "epoch": 1758} {"train_loss": -23.018909454345703, "global_step": 145932, "epoch": 1758} {"train_loss": -23.19777488708496, "global_step": 145933, "epoch": 1758} {"train_loss": -22.879247665405273, "global_step": 145934, "epoch": 1758} {"train_loss": -22.96756362915039, "global_step": 145935, "epoch": 1758} {"train_loss": -23.18247413635254, "global_step": 145936, "epoch": 1758} {"train_loss": -23.179929733276367, "global_step": 145937, "epoch": 1758} {"train_loss": -22.97818374633789, "global_step": 145938, "epoch": 1758} {"train_loss": -23.44803237915039, "global_step": 145939, "epoch": 1758} {"train_loss": -22.9564266204834, "global_step": 145940, "epoch": 1758} {"train_loss": -23.039323806762695, "global_step": 145941, "epoch": 1758} {"train_loss": -23.04890251159668, "global_step": 145942, "epoch": 1758} {"train_loss": -23.25648307800293, "global_step": 145943, "epoch": 1758} {"train_loss": -22.970449447631836, "global_step": 145944, "epoch": 1758} {"train_loss": -23.104360580444336, "global_step": 145945, "epoch": 1758} {"train_loss": -22.91454315185547, "global_step": 145946, "epoch": 1758} {"train_loss": -23.146697998046875, "global_step": 145947, "epoch": 1758} {"train_loss": -23.533239364624023, "global_step": 145948, "epoch": 1758} {"train_loss": -23.102886199951172, "global_step": 145949, "epoch": 1758} {"train_loss": -23.210124969482422, "global_step": 145950, "epoch": 1758} {"train_loss": -23.283689498901367, "global_step": 145951, "epoch": 1758} {"train_loss": -23.295217514038086, "global_step": 145952, "epoch": 1758} {"train_loss": -22.887144088745117, "global_step": 145953, "epoch": 1758} {"train_loss": -23.18489646911621, "global_step": 145954, "epoch": 1758} {"train_loss": -23.311864852905273, "global_step": 145955, "epoch": 1758} {"train_loss": -23.558820724487305, "global_step": 145956, "epoch": 1758} {"train_loss": -23.0320987701416, "global_step": 145957, "epoch": 1758} {"train_loss": -23.60964012145996, "global_step": 145958, "epoch": 1758} {"train_loss": -23.3310546875, "global_step": 145959, "epoch": 1758} {"train_loss": -22.959604263305664, "global_step": 145960, "epoch": 1758} {"train_loss": -22.888296127319336, "global_step": 145961, "epoch": 1758} {"train_loss": -23.101423263549805, "global_step": 145962, "epoch": 1758} {"train_loss": -23.183944702148438, "global_step": 145963, "epoch": 1758} {"train_loss": -23.004613876342773, "global_step": 145964, "epoch": 1758} {"train_loss": -22.988210678100586, "global_step": 145965, "epoch": 1758} {"train_loss": -23.137575149536133, "global_step": 145966, "epoch": 1758} {"train_loss": -23.509977340698242, "global_step": 145967, "epoch": 1758} {"train_loss": -23.32720375061035, "global_step": 145968, "epoch": 1758} {"train_loss": -23.006031036376953, "global_step": 145969, "epoch": 1758} {"train_loss": -22.68482780456543, "global_step": 145970, "epoch": 1758} {"train_loss": -22.895828247070312, "global_step": 145971, "epoch": 1758} {"train_loss": -23.193700790405273, "global_step": 145972, "epoch": 1758} {"train_loss": -23.171377182006836, "global_step": 145973, "epoch": 1758} {"train_loss": -22.99079132080078, "global_step": 145974, "epoch": 1758} {"train_loss": -23.472614288330078, "global_step": 145975, "epoch": 1758} {"train_loss": -23.26761245727539, "global_step": 145976, "epoch": 1758} {"train_loss": -22.662050247192383, "global_step": 145977, "epoch": 1758} {"train_loss": -23.02341079711914, "global_step": 145978, "epoch": 1758} {"train_loss": -23.14556884765625, "global_step": 145979, "epoch": 1758} {"train_loss": -23.164649963378906, "global_step": 145980, "epoch": 1758} {"train_loss": -23.28094482421875, "global_step": 145981, "epoch": 1758} {"train_loss": -23.23923110961914, "global_step": 145982, "epoch": 1758} {"train_loss": -22.97722816467285, "global_step": 145983, "epoch": 1758} {"train_loss": -23.259794235229492, "global_step": 145984, "epoch": 1758} {"train_loss": -23.467073440551758, "global_step": 145985, "epoch": 1758} {"train_loss": -23.17364501953125, "global_step": 145986, "epoch": 1758} {"train_loss": -23.48848533630371, "global_step": 145987, "epoch": 1758} {"train_loss": -23.168453216552734, "global_step": 145988, "epoch": 1758} {"train_loss": -23.065805435180664, "global_step": 145989, "epoch": 1758} {"train_loss": -23.219858169555664, "global_step": 145990, "epoch": 1758} {"train_loss": -22.7604923248291, "global_step": 145991, "epoch": 1758} {"train_loss": -23.053964614868164, "global_step": 145992, "epoch": 1758} {"train_loss": -23.105987548828125, "global_step": 145993, "epoch": 1758} {"train_loss": -22.99639129638672, "global_step": 145994, "epoch": 1758} {"train_loss": -23.483057022094727, "global_step": 145995, "epoch": 1758} {"train_loss": -23.093122321439076, "global_step": 145996, "epoch": 1758, "val_loss": 6362671.0} {"train_loss": -23.104324340820312, "global_step": 145997, "epoch": 1759} {"train_loss": -23.219697952270508, "global_step": 145998, "epoch": 1759} {"train_loss": -23.197540283203125, "global_step": 145999, "epoch": 1759} {"train_loss": -23.02779769897461, "global_step": 146000, "epoch": 1759} {"train_loss": -23.577796936035156, "global_step": 146001, "epoch": 1759} {"train_loss": -23.251218795776367, "global_step": 146002, "epoch": 1759} {"train_loss": -23.071428298950195, "global_step": 146003, "epoch": 1759} {"train_loss": -23.1471004486084, "global_step": 146004, "epoch": 1759} {"train_loss": -23.384014129638672, "global_step": 146005, "epoch": 1759} {"train_loss": -23.022855758666992, "global_step": 146006, "epoch": 1759} {"train_loss": -23.28940200805664, "global_step": 146007, "epoch": 1759} {"train_loss": -23.61524200439453, "global_step": 146008, "epoch": 1759} {"train_loss": -23.439359664916992, "global_step": 146009, "epoch": 1759} {"train_loss": -22.83316421508789, "global_step": 146010, "epoch": 1759} {"train_loss": -23.29465675354004, "global_step": 146011, "epoch": 1759} {"train_loss": -23.421966552734375, "global_step": 146012, "epoch": 1759} {"train_loss": -23.18701171875, "global_step": 146013, "epoch": 1759} {"train_loss": -23.1265926361084, "global_step": 146014, "epoch": 1759} {"train_loss": -23.020116806030273, "global_step": 146015, "epoch": 1759} {"train_loss": -23.077129364013672, "global_step": 146016, "epoch": 1759} {"train_loss": -23.037050247192383, "global_step": 146017, "epoch": 1759} {"train_loss": -23.295339584350586, "global_step": 146018, "epoch": 1759} {"train_loss": -23.046241760253906, "global_step": 146019, "epoch": 1759} {"train_loss": -22.985994338989258, "global_step": 146020, "epoch": 1759} {"train_loss": -23.22962760925293, "global_step": 146021, "epoch": 1759} {"train_loss": -23.21870994567871, "global_step": 146022, "epoch": 1759} {"train_loss": -22.710834503173828, "global_step": 146023, "epoch": 1759} {"train_loss": -23.100927352905273, "global_step": 146024, "epoch": 1759} {"train_loss": -23.36440086364746, "global_step": 146025, "epoch": 1759} {"train_loss": -23.2088680267334, "global_step": 146026, "epoch": 1759} {"train_loss": -23.307050704956055, "global_step": 146027, "epoch": 1759} {"train_loss": -23.46902847290039, "global_step": 146028, "epoch": 1759} {"train_loss": -23.137744903564453, "global_step": 146029, "epoch": 1759} {"train_loss": -23.186643600463867, "global_step": 146030, "epoch": 1759} {"train_loss": -23.011005401611328, "global_step": 146031, "epoch": 1759} {"train_loss": -23.50313377380371, "global_step": 146032, "epoch": 1759} {"train_loss": -23.145877838134766, "global_step": 146033, "epoch": 1759} {"train_loss": -23.029865264892578, "global_step": 146034, "epoch": 1759} {"train_loss": -23.24965476989746, "global_step": 146035, "epoch": 1759} {"train_loss": -22.867938995361328, "global_step": 146036, "epoch": 1759} {"train_loss": -23.170536041259766, "global_step": 146037, "epoch": 1759} {"train_loss": -22.88948631286621, "global_step": 146038, "epoch": 1759} {"train_loss": -23.418012619018555, "global_step": 146039, "epoch": 1759} {"train_loss": -22.817794799804688, "global_step": 146040, "epoch": 1759} {"train_loss": -23.120040893554688, "global_step": 146041, "epoch": 1759} {"train_loss": -23.302719116210938, "global_step": 146042, "epoch": 1759} {"train_loss": -22.830699920654297, "global_step": 146043, "epoch": 1759} {"train_loss": -23.068744659423828, "global_step": 146044, "epoch": 1759} {"train_loss": -22.94816780090332, "global_step": 146045, "epoch": 1759} {"train_loss": -23.236059188842773, "global_step": 146046, "epoch": 1759} {"train_loss": -22.9497127532959, "global_step": 146047, "epoch": 1759} {"train_loss": -23.14653205871582, "global_step": 146048, "epoch": 1759} {"train_loss": -23.042768478393555, "global_step": 146049, "epoch": 1759} {"train_loss": -23.626012802124023, "global_step": 146050, "epoch": 1759} {"train_loss": -23.0279598236084, "global_step": 146051, "epoch": 1759} {"train_loss": -23.051610946655273, "global_step": 146052, "epoch": 1759} {"train_loss": -22.799571990966797, "global_step": 146053, "epoch": 1759} {"train_loss": -23.386926651000977, "global_step": 146054, "epoch": 1759} {"train_loss": -23.16170310974121, "global_step": 146055, "epoch": 1759} {"train_loss": -23.135927200317383, "global_step": 146056, "epoch": 1759} {"train_loss": -23.275238037109375, "global_step": 146057, "epoch": 1759} {"train_loss": -22.889375686645508, "global_step": 146058, "epoch": 1759} {"train_loss": -22.95792007446289, "global_step": 146059, "epoch": 1759} {"train_loss": -23.24464225769043, "global_step": 146060, "epoch": 1759} {"train_loss": -23.623676300048828, "global_step": 146061, "epoch": 1759} {"train_loss": -23.126508712768555, "global_step": 146062, "epoch": 1759} {"train_loss": -23.093782424926758, "global_step": 146063, "epoch": 1759} {"train_loss": -23.089752197265625, "global_step": 146064, "epoch": 1759} {"train_loss": -23.52203369140625, "global_step": 146065, "epoch": 1759} {"train_loss": -23.0921688079834, "global_step": 146066, "epoch": 1759} {"train_loss": -23.032590866088867, "global_step": 146067, "epoch": 1759} {"train_loss": -23.282501220703125, "global_step": 146068, "epoch": 1759} {"train_loss": -23.084991455078125, "global_step": 146069, "epoch": 1759} {"train_loss": -23.11629295349121, "global_step": 146070, "epoch": 1759} {"train_loss": -23.259061813354492, "global_step": 146071, "epoch": 1759} {"train_loss": -23.1705265045166, "global_step": 146072, "epoch": 1759} {"train_loss": -23.30377769470215, "global_step": 146073, "epoch": 1759} {"train_loss": -23.325857162475586, "global_step": 146074, "epoch": 1759} {"train_loss": -22.817298889160156, "global_step": 146075, "epoch": 1759} {"train_loss": -23.427003860473633, "global_step": 146076, "epoch": 1759} {"train_loss": -23.090085983276367, "global_step": 146077, "epoch": 1759} {"train_loss": -23.339366912841797, "global_step": 146078, "epoch": 1759} {"train_loss": -23.177770522703607, "global_step": 146079, "epoch": 1759, "val_loss": 6228870.0} {"train_loss": -22.276235580444336, "global_step": 146080, "epoch": 1760} {"train_loss": -23.13454246520996, "global_step": 146081, "epoch": 1760} {"train_loss": -22.400157928466797, "global_step": 146082, "epoch": 1760} {"train_loss": -22.696666717529297, "global_step": 146083, "epoch": 1760} {"train_loss": -22.60220718383789, "global_step": 146084, "epoch": 1760} {"train_loss": -22.899009704589844, "global_step": 146085, "epoch": 1760} {"train_loss": -23.182050704956055, "global_step": 146086, "epoch": 1760} {"train_loss": -22.739635467529297, "global_step": 146087, "epoch": 1760} {"train_loss": -22.69593620300293, "global_step": 146088, "epoch": 1760} {"train_loss": -22.880643844604492, "global_step": 146089, "epoch": 1760} {"train_loss": -23.095388412475586, "global_step": 146090, "epoch": 1760} {"train_loss": -22.99962043762207, "global_step": 146091, "epoch": 1760} {"train_loss": -23.05044937133789, "global_step": 146092, "epoch": 1760} {"train_loss": -22.988605499267578, "global_step": 146093, "epoch": 1760} {"train_loss": -22.96685028076172, "global_step": 146094, "epoch": 1760} {"train_loss": -22.93171501159668, "global_step": 146095, "epoch": 1760} {"train_loss": -22.956144332885742, "global_step": 146096, "epoch": 1760} {"train_loss": -23.036413192749023, "global_step": 146097, "epoch": 1760} {"train_loss": -23.024993896484375, "global_step": 146098, "epoch": 1760} {"train_loss": -23.40544891357422, "global_step": 146099, "epoch": 1760} {"train_loss": -23.084732055664062, "global_step": 146100, "epoch": 1760} {"train_loss": -22.9198055267334, "global_step": 146101, "epoch": 1760} {"train_loss": -22.93268394470215, "global_step": 146102, "epoch": 1760} {"train_loss": -23.34273338317871, "global_step": 146103, "epoch": 1760} {"train_loss": -23.154495239257812, "global_step": 146104, "epoch": 1760} {"train_loss": -23.027494430541992, "global_step": 146105, "epoch": 1760} {"train_loss": -23.209196090698242, "global_step": 146106, "epoch": 1760} {"train_loss": -23.232812881469727, "global_step": 146107, "epoch": 1760} {"train_loss": -23.29123878479004, "global_step": 146108, "epoch": 1760} {"train_loss": -23.527694702148438, "global_step": 146109, "epoch": 1760} {"train_loss": -23.36452865600586, "global_step": 146110, "epoch": 1760} {"train_loss": -23.307964324951172, "global_step": 146111, "epoch": 1760} {"train_loss": -23.41529655456543, "global_step": 146112, "epoch": 1760} {"train_loss": -23.323820114135742, "global_step": 146113, "epoch": 1760} {"train_loss": -23.437698364257812, "global_step": 146114, "epoch": 1760} {"train_loss": -23.393117904663086, "global_step": 146115, "epoch": 1760} {"train_loss": -23.351139068603516, "global_step": 146116, "epoch": 1760} {"train_loss": -23.588245391845703, "global_step": 146117, "epoch": 1760} {"train_loss": -23.413726806640625, "global_step": 146118, "epoch": 1760} {"train_loss": -23.007047653198242, "global_step": 146119, "epoch": 1760} {"train_loss": -22.663528442382812, "global_step": 146120, "epoch": 1760} {"train_loss": -23.2817440032959, "global_step": 146121, "epoch": 1760} {"train_loss": -23.268735885620117, "global_step": 146122, "epoch": 1760} {"train_loss": -23.421295166015625, "global_step": 146123, "epoch": 1760} {"train_loss": -22.64539909362793, "global_step": 146124, "epoch": 1760} {"train_loss": -23.172975540161133, "global_step": 146125, "epoch": 1760} {"train_loss": -23.059507369995117, "global_step": 146126, "epoch": 1760} {"train_loss": -23.156286239624023, "global_step": 146127, "epoch": 1760} {"train_loss": -23.05126953125, "global_step": 146128, "epoch": 1760} {"train_loss": -23.061264038085938, "global_step": 146129, "epoch": 1760} {"train_loss": -23.508577346801758, "global_step": 146130, "epoch": 1760} {"train_loss": -23.203643798828125, "global_step": 146131, "epoch": 1760} {"train_loss": -23.07339096069336, "global_step": 146132, "epoch": 1760} {"train_loss": -23.464649200439453, "global_step": 146133, "epoch": 1760} {"train_loss": -23.430036544799805, "global_step": 146134, "epoch": 1760} {"train_loss": -23.23246192932129, "global_step": 146135, "epoch": 1760} {"train_loss": -23.319759368896484, "global_step": 146136, "epoch": 1760} {"train_loss": -23.141637802124023, "global_step": 146137, "epoch": 1760} {"train_loss": -22.75101089477539, "global_step": 146138, "epoch": 1760} {"train_loss": -23.25261116027832, "global_step": 146139, "epoch": 1760} {"train_loss": -22.894332885742188, "global_step": 146140, "epoch": 1760} {"train_loss": -23.10346794128418, "global_step": 146141, "epoch": 1760} {"train_loss": -23.050561904907227, "global_step": 146142, "epoch": 1760} {"train_loss": -23.152481079101562, "global_step": 146143, "epoch": 1760} {"train_loss": -23.033353805541992, "global_step": 146144, "epoch": 1760} {"train_loss": -22.825855255126953, "global_step": 146145, "epoch": 1760} {"train_loss": -23.234760284423828, "global_step": 146146, "epoch": 1760} {"train_loss": -23.221420288085938, "global_step": 146147, "epoch": 1760} {"train_loss": -23.355932235717773, "global_step": 146148, "epoch": 1760} {"train_loss": -22.955291748046875, "global_step": 146149, "epoch": 1760} {"train_loss": -23.415273666381836, "global_step": 146150, "epoch": 1760} {"train_loss": -23.009061813354492, "global_step": 146151, "epoch": 1760} {"train_loss": -23.243274688720703, "global_step": 146152, "epoch": 1760} {"train_loss": -23.28597640991211, "global_step": 146153, "epoch": 1760} {"train_loss": -22.952865600585938, "global_step": 146154, "epoch": 1760} {"train_loss": -23.46112632751465, "global_step": 146155, "epoch": 1760} {"train_loss": -23.000228881835938, "global_step": 146156, "epoch": 1760} {"train_loss": -23.010421752929688, "global_step": 146157, "epoch": 1760} {"train_loss": -23.188413619995117, "global_step": 146158, "epoch": 1760} {"train_loss": -23.48848533630371, "global_step": 146159, "epoch": 1760} {"train_loss": -23.114395141601562, "global_step": 146160, "epoch": 1760} {"train_loss": -23.144683837890625, "global_step": 146161, "epoch": 1760} {"train_loss": -23.113288373832244, "global_step": 146162, "epoch": 1760, "val_loss": 6356314.0} {"train_loss": -22.79776954650879, "global_step": 146163, "epoch": 1761} {"train_loss": -22.918167114257812, "global_step": 146164, "epoch": 1761} {"train_loss": -23.164884567260742, "global_step": 146165, "epoch": 1761} {"train_loss": -22.736509323120117, "global_step": 146166, "epoch": 1761} {"train_loss": -22.799203872680664, "global_step": 146167, "epoch": 1761} {"train_loss": -22.951995849609375, "global_step": 146168, "epoch": 1761} {"train_loss": -22.995473861694336, "global_step": 146169, "epoch": 1761} {"train_loss": -23.165569305419922, "global_step": 146170, "epoch": 1761} {"train_loss": -22.653045654296875, "global_step": 146171, "epoch": 1761} {"train_loss": -23.17186164855957, "global_step": 146172, "epoch": 1761} {"train_loss": -23.12825584411621, "global_step": 146173, "epoch": 1761} {"train_loss": -22.87311363220215, "global_step": 146174, "epoch": 1761} {"train_loss": -23.189611434936523, "global_step": 146175, "epoch": 1761} {"train_loss": -23.380117416381836, "global_step": 146176, "epoch": 1761} {"train_loss": -23.076034545898438, "global_step": 146177, "epoch": 1761} {"train_loss": -22.89261245727539, "global_step": 146178, "epoch": 1761} {"train_loss": -23.162342071533203, "global_step": 146179, "epoch": 1761} {"train_loss": -23.291793823242188, "global_step": 146180, "epoch": 1761} {"train_loss": -23.08657455444336, "global_step": 146181, "epoch": 1761} {"train_loss": -22.965002059936523, "global_step": 146182, "epoch": 1761} {"train_loss": -23.38289451599121, "global_step": 146183, "epoch": 1761} {"train_loss": -22.768964767456055, "global_step": 146184, "epoch": 1761} {"train_loss": -23.87538719177246, "global_step": 146185, "epoch": 1761} {"train_loss": -23.524198532104492, "global_step": 146186, "epoch": 1761} {"train_loss": -23.201391220092773, "global_step": 146187, "epoch": 1761} {"train_loss": -23.494945526123047, "global_step": 146188, "epoch": 1761} {"train_loss": -23.02145767211914, "global_step": 146189, "epoch": 1761} {"train_loss": -22.95954132080078, "global_step": 146190, "epoch": 1761} {"train_loss": -23.375099182128906, "global_step": 146191, "epoch": 1761} {"train_loss": -22.80791664123535, "global_step": 146192, "epoch": 1761} {"train_loss": -22.612668991088867, "global_step": 146193, "epoch": 1761} {"train_loss": -23.539426803588867, "global_step": 146194, "epoch": 1761} {"train_loss": -23.107608795166016, "global_step": 146195, "epoch": 1761} {"train_loss": -23.049314498901367, "global_step": 146196, "epoch": 1761} {"train_loss": -23.515689849853516, "global_step": 146197, "epoch": 1761} {"train_loss": -23.152006149291992, "global_step": 146198, "epoch": 1761} {"train_loss": -23.1859188079834, "global_step": 146199, "epoch": 1761} {"train_loss": -23.317960739135742, "global_step": 146200, "epoch": 1761} {"train_loss": -22.972951889038086, "global_step": 146201, "epoch": 1761} {"train_loss": -23.0358943939209, "global_step": 146202, "epoch": 1761} {"train_loss": -23.17203712463379, "global_step": 146203, "epoch": 1761} {"train_loss": -23.22309684753418, "global_step": 146204, "epoch": 1761} {"train_loss": -23.164037704467773, "global_step": 146205, "epoch": 1761} {"train_loss": -23.138580322265625, "global_step": 146206, "epoch": 1761} {"train_loss": -23.226545333862305, "global_step": 146207, "epoch": 1761} {"train_loss": -23.193952560424805, "global_step": 146208, "epoch": 1761} {"train_loss": -23.40408706665039, "global_step": 146209, "epoch": 1761} {"train_loss": -23.27826499938965, "global_step": 146210, "epoch": 1761} {"train_loss": -23.469072341918945, "global_step": 146211, "epoch": 1761} {"train_loss": -23.250699996948242, "global_step": 146212, "epoch": 1761} {"train_loss": -22.993207931518555, "global_step": 146213, "epoch": 1761} {"train_loss": -22.941686630249023, "global_step": 146214, "epoch": 1761} {"train_loss": -23.390317916870117, "global_step": 146215, "epoch": 1761} {"train_loss": -23.617422103881836, "global_step": 146216, "epoch": 1761} {"train_loss": -23.44755744934082, "global_step": 146217, "epoch": 1761} {"train_loss": -23.13796043395996, "global_step": 146218, "epoch": 1761} {"train_loss": -22.86885643005371, "global_step": 146219, "epoch": 1761} {"train_loss": -23.61321449279785, "global_step": 146220, "epoch": 1761} {"train_loss": -23.4075870513916, "global_step": 146221, "epoch": 1761} {"train_loss": -23.429555892944336, "global_step": 146222, "epoch": 1761} {"train_loss": -22.99921989440918, "global_step": 146223, "epoch": 1761} {"train_loss": -23.430482864379883, "global_step": 146224, "epoch": 1761} {"train_loss": -22.962644577026367, "global_step": 146225, "epoch": 1761} {"train_loss": -23.45612144470215, "global_step": 146226, "epoch": 1761} {"train_loss": -22.943994522094727, "global_step": 146227, "epoch": 1761} {"train_loss": -23.1910400390625, "global_step": 146228, "epoch": 1761} {"train_loss": -23.1079158782959, "global_step": 146229, "epoch": 1761} {"train_loss": -23.10619354248047, "global_step": 146230, "epoch": 1761} {"train_loss": -23.668624877929688, "global_step": 146231, "epoch": 1761} {"train_loss": -23.15883445739746, "global_step": 146232, "epoch": 1761} {"train_loss": -23.190128326416016, "global_step": 146233, "epoch": 1761} {"train_loss": -23.284469604492188, "global_step": 146234, "epoch": 1761} {"train_loss": -23.420080184936523, "global_step": 146235, "epoch": 1761} {"train_loss": -23.003868103027344, "global_step": 146236, "epoch": 1761} {"train_loss": -23.18184471130371, "global_step": 146237, "epoch": 1761} {"train_loss": -23.243337631225586, "global_step": 146238, "epoch": 1761} {"train_loss": -23.245487213134766, "global_step": 146239, "epoch": 1761} {"train_loss": -23.1385498046875, "global_step": 146240, "epoch": 1761} {"train_loss": -23.304203033447266, "global_step": 146241, "epoch": 1761} {"train_loss": -22.917736053466797, "global_step": 146242, "epoch": 1761} {"train_loss": -23.363874435424805, "global_step": 146243, "epoch": 1761} {"train_loss": -23.4531192779541, "global_step": 146244, "epoch": 1761} {"train_loss": -23.19312026701778, "global_step": 146245, "epoch": 1761, "val_loss": 6306521.0} {"train_loss": -22.8487548828125, "global_step": 146246, "epoch": 1762} {"train_loss": -22.794164657592773, "global_step": 146247, "epoch": 1762} {"train_loss": -22.99579429626465, "global_step": 146248, "epoch": 1762} {"train_loss": -22.5250301361084, "global_step": 146249, "epoch": 1762} {"train_loss": -22.846921920776367, "global_step": 146250, "epoch": 1762} {"train_loss": -22.472509384155273, "global_step": 146251, "epoch": 1762} {"train_loss": -23.060176849365234, "global_step": 146252, "epoch": 1762} {"train_loss": -23.057371139526367, "global_step": 146253, "epoch": 1762} {"train_loss": -23.14171600341797, "global_step": 146254, "epoch": 1762} {"train_loss": -23.196796417236328, "global_step": 146255, "epoch": 1762} {"train_loss": -23.12694549560547, "global_step": 146256, "epoch": 1762} {"train_loss": -22.588037490844727, "global_step": 146257, "epoch": 1762} {"train_loss": -22.990373611450195, "global_step": 146258, "epoch": 1762} {"train_loss": -23.345617294311523, "global_step": 146259, "epoch": 1762} {"train_loss": -23.41837501525879, "global_step": 146260, "epoch": 1762} {"train_loss": -22.916004180908203, "global_step": 146261, "epoch": 1762} {"train_loss": -22.96756935119629, "global_step": 146262, "epoch": 1762} {"train_loss": -22.749114990234375, "global_step": 146263, "epoch": 1762} {"train_loss": -22.956682205200195, "global_step": 146264, "epoch": 1762} {"train_loss": -22.86439323425293, "global_step": 146265, "epoch": 1762} {"train_loss": -23.161725997924805, "global_step": 146266, "epoch": 1762} {"train_loss": -23.08949089050293, "global_step": 146267, "epoch": 1762} {"train_loss": -22.852319717407227, "global_step": 146268, "epoch": 1762} {"train_loss": -23.153146743774414, "global_step": 146269, "epoch": 1762} {"train_loss": -23.503089904785156, "global_step": 146270, "epoch": 1762} {"train_loss": -23.12660026550293, "global_step": 146271, "epoch": 1762} {"train_loss": -23.23939323425293, "global_step": 146272, "epoch": 1762} {"train_loss": -23.396459579467773, "global_step": 146273, "epoch": 1762} {"train_loss": -23.472135543823242, "global_step": 146274, "epoch": 1762} {"train_loss": -23.32640266418457, "global_step": 146275, "epoch": 1762} {"train_loss": -23.25077247619629, "global_step": 146276, "epoch": 1762} {"train_loss": -23.435951232910156, "global_step": 146277, "epoch": 1762} {"train_loss": -23.084314346313477, "global_step": 146278, "epoch": 1762} {"train_loss": -23.051206588745117, "global_step": 146279, "epoch": 1762} {"train_loss": -23.09882164001465, "global_step": 146280, "epoch": 1762} {"train_loss": -23.32151985168457, "global_step": 146281, "epoch": 1762} {"train_loss": -23.29620933532715, "global_step": 146282, "epoch": 1762} {"train_loss": -23.120342254638672, "global_step": 146283, "epoch": 1762} {"train_loss": -23.3989315032959, "global_step": 146284, "epoch": 1762} {"train_loss": -23.695341110229492, "global_step": 146285, "epoch": 1762} {"train_loss": -23.2692928314209, "global_step": 146286, "epoch": 1762} {"train_loss": -23.443593978881836, "global_step": 146287, "epoch": 1762} {"train_loss": -23.05322265625, "global_step": 146288, "epoch": 1762} {"train_loss": -22.734243392944336, "global_step": 146289, "epoch": 1762} {"train_loss": -23.061269760131836, "global_step": 146290, "epoch": 1762} {"train_loss": -22.888090133666992, "global_step": 146291, "epoch": 1762} {"train_loss": -23.171239852905273, "global_step": 146292, "epoch": 1762} {"train_loss": -23.030431747436523, "global_step": 146293, "epoch": 1762} {"train_loss": -22.941316604614258, "global_step": 146294, "epoch": 1762} {"train_loss": -23.164766311645508, "global_step": 146295, "epoch": 1762} {"train_loss": -22.842620849609375, "global_step": 146296, "epoch": 1762} {"train_loss": -23.112552642822266, "global_step": 146297, "epoch": 1762} {"train_loss": -23.194427490234375, "global_step": 146298, "epoch": 1762} {"train_loss": -23.29755973815918, "global_step": 146299, "epoch": 1762} {"train_loss": -23.09522819519043, "global_step": 146300, "epoch": 1762} {"train_loss": -22.890880584716797, "global_step": 146301, "epoch": 1762} {"train_loss": -23.28163719177246, "global_step": 146302, "epoch": 1762} {"train_loss": -23.149744033813477, "global_step": 146303, "epoch": 1762} {"train_loss": -22.999135971069336, "global_step": 146304, "epoch": 1762} {"train_loss": -23.34868812561035, "global_step": 146305, "epoch": 1762} {"train_loss": -23.09364891052246, "global_step": 146306, "epoch": 1762} {"train_loss": -22.93278694152832, "global_step": 146307, "epoch": 1762} {"train_loss": -23.44843101501465, "global_step": 146308, "epoch": 1762} {"train_loss": -23.536123275756836, "global_step": 146309, "epoch": 1762} {"train_loss": -22.675352096557617, "global_step": 146310, "epoch": 1762} {"train_loss": -23.061450958251953, "global_step": 146311, "epoch": 1762} {"train_loss": -23.20021629333496, "global_step": 146312, "epoch": 1762} {"train_loss": -22.8543758392334, "global_step": 146313, "epoch": 1762} {"train_loss": -22.77992057800293, "global_step": 146314, "epoch": 1762} {"train_loss": -23.139013290405273, "global_step": 146315, "epoch": 1762} {"train_loss": -23.09649658203125, "global_step": 146316, "epoch": 1762} {"train_loss": -23.052568435668945, "global_step": 146317, "epoch": 1762} {"train_loss": -23.122480392456055, "global_step": 146318, "epoch": 1762} {"train_loss": -23.220550537109375, "global_step": 146319, "epoch": 1762} {"train_loss": -23.14918327331543, "global_step": 146320, "epoch": 1762} {"train_loss": -23.27846908569336, "global_step": 146321, "epoch": 1762} {"train_loss": -23.09157371520996, "global_step": 146322, "epoch": 1762} {"train_loss": -23.293806076049805, "global_step": 146323, "epoch": 1762} {"train_loss": -23.00025749206543, "global_step": 146324, "epoch": 1762} {"train_loss": -22.81925392150879, "global_step": 146325, "epoch": 1762} {"train_loss": -22.738388061523438, "global_step": 146326, "epoch": 1762} {"train_loss": -23.05278968811035, "global_step": 146327, "epoch": 1762} {"train_loss": -23.085317312952984, "global_step": 146328, "epoch": 1762, "val_loss": 6296915.5} {"train_loss": -22.82680320739746, "global_step": 146329, "epoch": 1763} {"train_loss": -23.068349838256836, "global_step": 146330, "epoch": 1763} {"train_loss": -22.914548873901367, "global_step": 146331, "epoch": 1763} {"train_loss": -22.680068969726562, "global_step": 146332, "epoch": 1763} {"train_loss": -23.50064468383789, "global_step": 146333, "epoch": 1763} {"train_loss": -22.780851364135742, "global_step": 146334, "epoch": 1763} {"train_loss": -23.076583862304688, "global_step": 146335, "epoch": 1763} {"train_loss": -22.929147720336914, "global_step": 146336, "epoch": 1763} {"train_loss": -23.27978515625, "global_step": 146337, "epoch": 1763} {"train_loss": -22.720508575439453, "global_step": 146338, "epoch": 1763} {"train_loss": -22.82301139831543, "global_step": 146339, "epoch": 1763} {"train_loss": -23.232187271118164, "global_step": 146340, "epoch": 1763} {"train_loss": -22.85883140563965, "global_step": 146341, "epoch": 1763} {"train_loss": -23.236068725585938, "global_step": 146342, "epoch": 1763} {"train_loss": -23.314716339111328, "global_step": 146343, "epoch": 1763} {"train_loss": -22.795042037963867, "global_step": 146344, "epoch": 1763} {"train_loss": -23.10102081298828, "global_step": 146345, "epoch": 1763} {"train_loss": -23.26402473449707, "global_step": 146346, "epoch": 1763} {"train_loss": -23.444379806518555, "global_step": 146347, "epoch": 1763} {"train_loss": -22.855030059814453, "global_step": 146348, "epoch": 1763} {"train_loss": -22.96347999572754, "global_step": 146349, "epoch": 1763} {"train_loss": -23.30336570739746, "global_step": 146350, "epoch": 1763} {"train_loss": -22.83544921875, "global_step": 146351, "epoch": 1763} {"train_loss": -23.39249038696289, "global_step": 146352, "epoch": 1763} {"train_loss": -22.646432876586914, "global_step": 146353, "epoch": 1763} {"train_loss": -22.95962905883789, "global_step": 146354, "epoch": 1763} {"train_loss": -23.198083877563477, "global_step": 146355, "epoch": 1763} {"train_loss": -23.181982040405273, "global_step": 146356, "epoch": 1763} {"train_loss": -23.190343856811523, "global_step": 146357, "epoch": 1763} {"train_loss": -23.191272735595703, "global_step": 146358, "epoch": 1763} {"train_loss": -22.89937400817871, "global_step": 146359, "epoch": 1763} {"train_loss": -23.06923484802246, "global_step": 146360, "epoch": 1763} {"train_loss": -23.068220138549805, "global_step": 146361, "epoch": 1763} {"train_loss": -23.170534133911133, "global_step": 146362, "epoch": 1763} {"train_loss": -22.98273277282715, "global_step": 146363, "epoch": 1763} {"train_loss": -23.1644287109375, "global_step": 146364, "epoch": 1763} {"train_loss": -22.739898681640625, "global_step": 146365, "epoch": 1763} {"train_loss": -22.96543312072754, "global_step": 146366, "epoch": 1763} {"train_loss": -22.880599975585938, "global_step": 146367, "epoch": 1763} {"train_loss": -22.861469268798828, "global_step": 146368, "epoch": 1763} {"train_loss": -23.129470825195312, "global_step": 146369, "epoch": 1763} {"train_loss": -23.142276763916016, "global_step": 146370, "epoch": 1763} {"train_loss": -23.312807083129883, "global_step": 146371, "epoch": 1763} {"train_loss": -23.084489822387695, "global_step": 146372, "epoch": 1763} {"train_loss": -23.353757858276367, "global_step": 146373, "epoch": 1763} {"train_loss": -23.43047523498535, "global_step": 146374, "epoch": 1763} {"train_loss": -23.48263931274414, "global_step": 146375, "epoch": 1763} {"train_loss": -23.0809326171875, "global_step": 146376, "epoch": 1763} {"train_loss": -23.33158302307129, "global_step": 146377, "epoch": 1763} {"train_loss": -23.380544662475586, "global_step": 146378, "epoch": 1763} {"train_loss": -23.146860122680664, "global_step": 146379, "epoch": 1763} {"train_loss": -23.142789840698242, "global_step": 146380, "epoch": 1763} {"train_loss": -22.95541000366211, "global_step": 146381, "epoch": 1763} {"train_loss": -23.15769386291504, "global_step": 146382, "epoch": 1763} {"train_loss": -23.244678497314453, "global_step": 146383, "epoch": 1763} {"train_loss": -23.18143081665039, "global_step": 146384, "epoch": 1763} {"train_loss": -23.355619430541992, "global_step": 146385, "epoch": 1763} {"train_loss": -23.392940521240234, "global_step": 146386, "epoch": 1763} {"train_loss": -22.922513961791992, "global_step": 146387, "epoch": 1763} {"train_loss": -22.85993003845215, "global_step": 146388, "epoch": 1763} {"train_loss": -23.00417709350586, "global_step": 146389, "epoch": 1763} {"train_loss": -22.88631248474121, "global_step": 146390, "epoch": 1763} {"train_loss": -22.8857421875, "global_step": 146391, "epoch": 1763} {"train_loss": -23.462026596069336, "global_step": 146392, "epoch": 1763} {"train_loss": -23.14339256286621, "global_step": 146393, "epoch": 1763} {"train_loss": -23.27495765686035, "global_step": 146394, "epoch": 1763} {"train_loss": -23.19148826599121, "global_step": 146395, "epoch": 1763} {"train_loss": -23.278329849243164, "global_step": 146396, "epoch": 1763} {"train_loss": -23.126951217651367, "global_step": 146397, "epoch": 1763} {"train_loss": -23.549072265625, "global_step": 146398, "epoch": 1763} {"train_loss": -23.23929786682129, "global_step": 146399, "epoch": 1763} {"train_loss": -23.193483352661133, "global_step": 146400, "epoch": 1763} {"train_loss": -22.9880313873291, "global_step": 146401, "epoch": 1763} {"train_loss": -23.211166381835938, "global_step": 146402, "epoch": 1763} {"train_loss": -23.08448600769043, "global_step": 146403, "epoch": 1763} {"train_loss": -23.660802841186523, "global_step": 146404, "epoch": 1763} {"train_loss": -23.23824119567871, "global_step": 146405, "epoch": 1763} {"train_loss": -22.915742874145508, "global_step": 146406, "epoch": 1763} {"train_loss": -23.236404418945312, "global_step": 146407, "epoch": 1763} {"train_loss": -23.643407821655273, "global_step": 146408, "epoch": 1763} {"train_loss": -23.493316650390625, "global_step": 146409, "epoch": 1763} {"train_loss": -23.205028533935547, "global_step": 146410, "epoch": 1763} {"train_loss": -23.142603472054724, "global_step": 146411, "epoch": 1763, "val_loss": 6276041.0} {"train_loss": -22.016571044921875, "global_step": 146412, "epoch": 1764} {"train_loss": -21.56032371520996, "global_step": 146413, "epoch": 1764} {"train_loss": -22.40508460998535, "global_step": 146414, "epoch": 1764} {"train_loss": -22.864423751831055, "global_step": 146415, "epoch": 1764} {"train_loss": -22.621458053588867, "global_step": 146416, "epoch": 1764} {"train_loss": -22.34682846069336, "global_step": 146417, "epoch": 1764} {"train_loss": -22.403141021728516, "global_step": 146418, "epoch": 1764} {"train_loss": -22.818883895874023, "global_step": 146419, "epoch": 1764} {"train_loss": -22.7703914642334, "global_step": 146420, "epoch": 1764} {"train_loss": -22.706317901611328, "global_step": 146421, "epoch": 1764} {"train_loss": -22.939176559448242, "global_step": 146422, "epoch": 1764} {"train_loss": -22.7327938079834, "global_step": 146423, "epoch": 1764} {"train_loss": -22.700075149536133, "global_step": 146424, "epoch": 1764} {"train_loss": -22.976516723632812, "global_step": 146425, "epoch": 1764} {"train_loss": -23.01851463317871, "global_step": 146426, "epoch": 1764} {"train_loss": -22.975370407104492, "global_step": 146427, "epoch": 1764} {"train_loss": -23.14229965209961, "global_step": 146428, "epoch": 1764} {"train_loss": -23.458662033081055, "global_step": 146429, "epoch": 1764} {"train_loss": -23.069255828857422, "global_step": 146430, "epoch": 1764} {"train_loss": -22.822925567626953, "global_step": 146431, "epoch": 1764} {"train_loss": -22.830575942993164, "global_step": 146432, "epoch": 1764} {"train_loss": -23.041847229003906, "global_step": 146433, "epoch": 1764} {"train_loss": -23.16057777404785, "global_step": 146434, "epoch": 1764} {"train_loss": -22.71662139892578, "global_step": 146435, "epoch": 1764} {"train_loss": -23.033105850219727, "global_step": 146436, "epoch": 1764} {"train_loss": -22.781723022460938, "global_step": 146437, "epoch": 1764} {"train_loss": -22.877643585205078, "global_step": 146438, "epoch": 1764} {"train_loss": -23.3238582611084, "global_step": 146439, "epoch": 1764} {"train_loss": -22.966571807861328, "global_step": 146440, "epoch": 1764} {"train_loss": -23.24909782409668, "global_step": 146441, "epoch": 1764} {"train_loss": -23.119022369384766, "global_step": 146442, "epoch": 1764} {"train_loss": -23.33127212524414, "global_step": 146443, "epoch": 1764} {"train_loss": -23.164344787597656, "global_step": 146444, "epoch": 1764} {"train_loss": -23.11170768737793, "global_step": 146445, "epoch": 1764} {"train_loss": -23.108871459960938, "global_step": 146446, "epoch": 1764} {"train_loss": -23.496707916259766, "global_step": 146447, "epoch": 1764} {"train_loss": -23.44171142578125, "global_step": 146448, "epoch": 1764} {"train_loss": -23.451614379882812, "global_step": 146449, "epoch": 1764} {"train_loss": -23.47149085998535, "global_step": 146450, "epoch": 1764} {"train_loss": -23.101646423339844, "global_step": 146451, "epoch": 1764} {"train_loss": -23.210372924804688, "global_step": 146452, "epoch": 1764} {"train_loss": -23.35939598083496, "global_step": 146453, "epoch": 1764} {"train_loss": -22.932003021240234, "global_step": 146454, "epoch": 1764} {"train_loss": -23.257030487060547, "global_step": 146455, "epoch": 1764} {"train_loss": -23.265520095825195, "global_step": 146456, "epoch": 1764} {"train_loss": -23.265625, "global_step": 146457, "epoch": 1764} {"train_loss": -23.299890518188477, "global_step": 146458, "epoch": 1764} {"train_loss": -23.068252563476562, "global_step": 146459, "epoch": 1764} {"train_loss": -23.390247344970703, "global_step": 146460, "epoch": 1764} {"train_loss": -23.00044822692871, "global_step": 146461, "epoch": 1764} {"train_loss": -23.16864585876465, "global_step": 146462, "epoch": 1764} {"train_loss": -23.15579605102539, "global_step": 146463, "epoch": 1764} {"train_loss": -22.6561222076416, "global_step": 146464, "epoch": 1764} {"train_loss": -22.90284538269043, "global_step": 146465, "epoch": 1764} {"train_loss": -23.06512451171875, "global_step": 146466, "epoch": 1764} {"train_loss": -23.050107955932617, "global_step": 146467, "epoch": 1764} {"train_loss": -23.077178955078125, "global_step": 146468, "epoch": 1764} {"train_loss": -23.065074920654297, "global_step": 146469, "epoch": 1764} {"train_loss": -22.90272331237793, "global_step": 146470, "epoch": 1764} {"train_loss": -23.4232120513916, "global_step": 146471, "epoch": 1764} {"train_loss": -22.906265258789062, "global_step": 146472, "epoch": 1764} {"train_loss": -22.71548843383789, "global_step": 146473, "epoch": 1764} {"train_loss": -23.336198806762695, "global_step": 146474, "epoch": 1764} {"train_loss": -23.0573673248291, "global_step": 146475, "epoch": 1764} {"train_loss": -22.974109649658203, "global_step": 146476, "epoch": 1764} {"train_loss": -23.417987823486328, "global_step": 146477, "epoch": 1764} {"train_loss": -23.311132431030273, "global_step": 146478, "epoch": 1764} {"train_loss": -22.764795303344727, "global_step": 146479, "epoch": 1764} {"train_loss": -23.439477920532227, "global_step": 146480, "epoch": 1764} {"train_loss": -22.992063522338867, "global_step": 146481, "epoch": 1764} {"train_loss": -23.115280151367188, "global_step": 146482, "epoch": 1764} {"train_loss": -22.95358657836914, "global_step": 146483, "epoch": 1764} {"train_loss": -23.386089324951172, "global_step": 146484, "epoch": 1764} {"train_loss": -23.309600830078125, "global_step": 146485, "epoch": 1764} {"train_loss": -23.445575714111328, "global_step": 146486, "epoch": 1764} {"train_loss": -23.24360466003418, "global_step": 146487, "epoch": 1764} {"train_loss": -23.343433380126953, "global_step": 146488, "epoch": 1764} {"train_loss": -23.418350219726562, "global_step": 146489, "epoch": 1764} {"train_loss": -22.8957462310791, "global_step": 146490, "epoch": 1764} {"train_loss": -23.297704696655273, "global_step": 146491, "epoch": 1764} {"train_loss": -23.16200065612793, "global_step": 146492, "epoch": 1764} {"train_loss": -23.05607795715332, "global_step": 146493, "epoch": 1764} {"train_loss": -23.04594067493117, "global_step": 146494, "epoch": 1764, "val_loss": 6425434.5} {"train_loss": -23.134883880615234, "global_step": 146495, "epoch": 1765} {"train_loss": -22.827533721923828, "global_step": 146496, "epoch": 1765} {"train_loss": -23.033523559570312, "global_step": 146497, "epoch": 1765} {"train_loss": -22.799806594848633, "global_step": 146498, "epoch": 1765} {"train_loss": -23.04078483581543, "global_step": 146499, "epoch": 1765} {"train_loss": -22.866260528564453, "global_step": 146500, "epoch": 1765} {"train_loss": -22.6401424407959, "global_step": 146501, "epoch": 1765} {"train_loss": -23.053747177124023, "global_step": 146502, "epoch": 1765} {"train_loss": -23.44998550415039, "global_step": 146503, "epoch": 1765} {"train_loss": -22.778263092041016, "global_step": 146504, "epoch": 1765} {"train_loss": -22.544668197631836, "global_step": 146505, "epoch": 1765} {"train_loss": -23.178489685058594, "global_step": 146506, "epoch": 1765} {"train_loss": -23.157827377319336, "global_step": 146507, "epoch": 1765} {"train_loss": -23.241744995117188, "global_step": 146508, "epoch": 1765} {"train_loss": -23.274917602539062, "global_step": 146509, "epoch": 1765} {"train_loss": -23.004596710205078, "global_step": 146510, "epoch": 1765} {"train_loss": -23.135282516479492, "global_step": 146511, "epoch": 1765} {"train_loss": -23.070886611938477, "global_step": 146512, "epoch": 1765} {"train_loss": -22.64328956604004, "global_step": 146513, "epoch": 1765} {"train_loss": -22.978328704833984, "global_step": 146514, "epoch": 1765} {"train_loss": -23.161909103393555, "global_step": 146515, "epoch": 1765} {"train_loss": -23.271442413330078, "global_step": 146516, "epoch": 1765} {"train_loss": -23.272048950195312, "global_step": 146517, "epoch": 1765} {"train_loss": -22.9265193939209, "global_step": 146518, "epoch": 1765} {"train_loss": -22.94405174255371, "global_step": 146519, "epoch": 1765} {"train_loss": -23.08931541442871, "global_step": 146520, "epoch": 1765} {"train_loss": -23.030366897583008, "global_step": 146521, "epoch": 1765} {"train_loss": -23.273944854736328, "global_step": 146522, "epoch": 1765} {"train_loss": -23.100831985473633, "global_step": 146523, "epoch": 1765} {"train_loss": -23.160551071166992, "global_step": 146524, "epoch": 1765} {"train_loss": -23.12992286682129, "global_step": 146525, "epoch": 1765} {"train_loss": -23.28348159790039, "global_step": 146526, "epoch": 1765} {"train_loss": -22.926273345947266, "global_step": 146527, "epoch": 1765} {"train_loss": -23.12544822692871, "global_step": 146528, "epoch": 1765} {"train_loss": -23.328474044799805, "global_step": 146529, "epoch": 1765} {"train_loss": -23.096881866455078, "global_step": 146530, "epoch": 1765} {"train_loss": -23.047143936157227, "global_step": 146531, "epoch": 1765} {"train_loss": -23.167776107788086, "global_step": 146532, "epoch": 1765} {"train_loss": -23.544137954711914, "global_step": 146533, "epoch": 1765} {"train_loss": -23.306440353393555, "global_step": 146534, "epoch": 1765} {"train_loss": -22.901874542236328, "global_step": 146535, "epoch": 1765} {"train_loss": -23.3914852142334, "global_step": 146536, "epoch": 1765} {"train_loss": -23.391250610351562, "global_step": 146537, "epoch": 1765} {"train_loss": -23.2025146484375, "global_step": 146538, "epoch": 1765} {"train_loss": -23.426755905151367, "global_step": 146539, "epoch": 1765} {"train_loss": -23.623525619506836, "global_step": 146540, "epoch": 1765} {"train_loss": -23.039865493774414, "global_step": 146541, "epoch": 1765} {"train_loss": -23.40118408203125, "global_step": 146542, "epoch": 1765} {"train_loss": -23.047454833984375, "global_step": 146543, "epoch": 1765} {"train_loss": -23.31712532043457, "global_step": 146544, "epoch": 1765} {"train_loss": -23.346479415893555, "global_step": 146545, "epoch": 1765} {"train_loss": -23.090070724487305, "global_step": 146546, "epoch": 1765} {"train_loss": -23.24912452697754, "global_step": 146547, "epoch": 1765} {"train_loss": -23.37531089782715, "global_step": 146548, "epoch": 1765} {"train_loss": -23.389968872070312, "global_step": 146549, "epoch": 1765} {"train_loss": -23.510059356689453, "global_step": 146550, "epoch": 1765} {"train_loss": -23.103551864624023, "global_step": 146551, "epoch": 1765} {"train_loss": -23.346534729003906, "global_step": 146552, "epoch": 1765} {"train_loss": -23.172727584838867, "global_step": 146553, "epoch": 1765} {"train_loss": -23.384031295776367, "global_step": 146554, "epoch": 1765} {"train_loss": -23.221817016601562, "global_step": 146555, "epoch": 1765} {"train_loss": -23.151887893676758, "global_step": 146556, "epoch": 1765} {"train_loss": -22.862913131713867, "global_step": 146557, "epoch": 1765} {"train_loss": -22.53725242614746, "global_step": 146558, "epoch": 1765} {"train_loss": -23.284719467163086, "global_step": 146559, "epoch": 1765} {"train_loss": -23.174667358398438, "global_step": 146560, "epoch": 1765} {"train_loss": -22.7683048248291, "global_step": 146561, "epoch": 1765} {"train_loss": -23.231420516967773, "global_step": 146562, "epoch": 1765} {"train_loss": -23.081695556640625, "global_step": 146563, "epoch": 1765} {"train_loss": -23.110103607177734, "global_step": 146564, "epoch": 1765} {"train_loss": -23.623668670654297, "global_step": 146565, "epoch": 1765} {"train_loss": -23.141416549682617, "global_step": 146566, "epoch": 1765} {"train_loss": -23.345592498779297, "global_step": 146567, "epoch": 1765} {"train_loss": -23.172086715698242, "global_step": 146568, "epoch": 1765} {"train_loss": -23.061492919921875, "global_step": 146569, "epoch": 1765} {"train_loss": -23.35346794128418, "global_step": 146570, "epoch": 1765} {"train_loss": -23.241718292236328, "global_step": 146571, "epoch": 1765} {"train_loss": -23.343717575073242, "global_step": 146572, "epoch": 1765} {"train_loss": -23.316532135009766, "global_step": 146573, "epoch": 1765} {"train_loss": -23.04862403869629, "global_step": 146574, "epoch": 1765} {"train_loss": -23.356977462768555, "global_step": 146575, "epoch": 1765} {"train_loss": -23.258708953857422, "global_step": 146576, "epoch": 1765} {"train_loss": -23.16576718709555, "global_step": 146577, "epoch": 1765, "val_loss": 6336141.0} {"train_loss": -22.73654556274414, "global_step": 146578, "epoch": 1766} {"train_loss": -22.991674423217773, "global_step": 146579, "epoch": 1766} {"train_loss": -22.935277938842773, "global_step": 146580, "epoch": 1766} {"train_loss": -22.80091094970703, "global_step": 146581, "epoch": 1766} {"train_loss": -22.959747314453125, "global_step": 146582, "epoch": 1766} {"train_loss": -22.453054428100586, "global_step": 146583, "epoch": 1766} {"train_loss": -23.29474639892578, "global_step": 146584, "epoch": 1766} {"train_loss": -23.033761978149414, "global_step": 146585, "epoch": 1766} {"train_loss": -23.191513061523438, "global_step": 146586, "epoch": 1766} {"train_loss": -23.24362564086914, "global_step": 146587, "epoch": 1766} {"train_loss": -23.162567138671875, "global_step": 146588, "epoch": 1766} {"train_loss": -23.20186996459961, "global_step": 146589, "epoch": 1766} {"train_loss": -22.88264274597168, "global_step": 146590, "epoch": 1766} {"train_loss": -22.752185821533203, "global_step": 146591, "epoch": 1766} {"train_loss": -22.894123077392578, "global_step": 146592, "epoch": 1766} {"train_loss": -23.16599464416504, "global_step": 146593, "epoch": 1766} {"train_loss": -22.909889221191406, "global_step": 146594, "epoch": 1766} {"train_loss": -23.03127098083496, "global_step": 146595, "epoch": 1766} {"train_loss": -23.687782287597656, "global_step": 146596, "epoch": 1766} {"train_loss": -23.087547302246094, "global_step": 146597, "epoch": 1766} {"train_loss": -23.3227596282959, "global_step": 146598, "epoch": 1766} {"train_loss": -22.915876388549805, "global_step": 146599, "epoch": 1766} {"train_loss": -23.114452362060547, "global_step": 146600, "epoch": 1766} {"train_loss": -23.23678970336914, "global_step": 146601, "epoch": 1766} {"train_loss": -22.597238540649414, "global_step": 146602, "epoch": 1766} {"train_loss": -23.130842208862305, "global_step": 146603, "epoch": 1766} {"train_loss": -23.019926071166992, "global_step": 146604, "epoch": 1766} {"train_loss": -23.118810653686523, "global_step": 146605, "epoch": 1766} {"train_loss": -23.2487850189209, "global_step": 146606, "epoch": 1766} {"train_loss": -23.08238983154297, "global_step": 146607, "epoch": 1766} {"train_loss": -23.166427612304688, "global_step": 146608, "epoch": 1766} {"train_loss": -23.08041763305664, "global_step": 146609, "epoch": 1766} {"train_loss": -23.318506240844727, "global_step": 146610, "epoch": 1766} {"train_loss": -23.220048904418945, "global_step": 146611, "epoch": 1766} {"train_loss": -22.928546905517578, "global_step": 146612, "epoch": 1766} {"train_loss": -22.84354019165039, "global_step": 146613, "epoch": 1766} {"train_loss": -23.028656005859375, "global_step": 146614, "epoch": 1766} {"train_loss": -23.370954513549805, "global_step": 146615, "epoch": 1766} {"train_loss": -23.470624923706055, "global_step": 146616, "epoch": 1766} {"train_loss": -23.36505889892578, "global_step": 146617, "epoch": 1766} {"train_loss": -23.28058433532715, "global_step": 146618, "epoch": 1766} {"train_loss": -22.95984649658203, "global_step": 146619, "epoch": 1766} {"train_loss": -23.105091094970703, "global_step": 146620, "epoch": 1766} {"train_loss": -23.104822158813477, "global_step": 146621, "epoch": 1766} {"train_loss": -23.065942764282227, "global_step": 146622, "epoch": 1766} {"train_loss": -23.259214401245117, "global_step": 146623, "epoch": 1766} {"train_loss": -23.000795364379883, "global_step": 146624, "epoch": 1766} {"train_loss": -23.044010162353516, "global_step": 146625, "epoch": 1766} {"train_loss": -23.073949813842773, "global_step": 146626, "epoch": 1766} {"train_loss": -23.318614959716797, "global_step": 146627, "epoch": 1766} {"train_loss": -23.295852661132812, "global_step": 146628, "epoch": 1766} {"train_loss": -23.278024673461914, "global_step": 146629, "epoch": 1766} {"train_loss": -23.16730308532715, "global_step": 146630, "epoch": 1766} {"train_loss": -23.137086868286133, "global_step": 146631, "epoch": 1766} {"train_loss": -22.733917236328125, "global_step": 146632, "epoch": 1766} {"train_loss": -23.127004623413086, "global_step": 146633, "epoch": 1766} {"train_loss": -23.022802352905273, "global_step": 146634, "epoch": 1766} {"train_loss": -23.075559616088867, "global_step": 146635, "epoch": 1766} {"train_loss": -23.1968994140625, "global_step": 146636, "epoch": 1766} {"train_loss": -23.293256759643555, "global_step": 146637, "epoch": 1766} {"train_loss": -23.200834274291992, "global_step": 146638, "epoch": 1766} {"train_loss": -23.298316955566406, "global_step": 146639, "epoch": 1766} {"train_loss": -23.423192977905273, "global_step": 146640, "epoch": 1766} {"train_loss": -23.416919708251953, "global_step": 146641, "epoch": 1766} {"train_loss": -23.25446891784668, "global_step": 146642, "epoch": 1766} {"train_loss": -23.527448654174805, "global_step": 146643, "epoch": 1766} {"train_loss": -23.603979110717773, "global_step": 146644, "epoch": 1766} {"train_loss": -23.33671760559082, "global_step": 146645, "epoch": 1766} {"train_loss": -23.3597354888916, "global_step": 146646, "epoch": 1766} {"train_loss": -22.972084045410156, "global_step": 146647, "epoch": 1766} {"train_loss": -23.362672805786133, "global_step": 146648, "epoch": 1766} {"train_loss": -23.39072608947754, "global_step": 146649, "epoch": 1766} {"train_loss": -23.44720458984375, "global_step": 146650, "epoch": 1766} {"train_loss": -23.407766342163086, "global_step": 146651, "epoch": 1766} {"train_loss": -23.076154708862305, "global_step": 146652, "epoch": 1766} {"train_loss": -23.166284561157227, "global_step": 146653, "epoch": 1766} {"train_loss": -23.1278076171875, "global_step": 146654, "epoch": 1766} {"train_loss": -23.062715530395508, "global_step": 146655, "epoch": 1766} {"train_loss": -23.138290405273438, "global_step": 146656, "epoch": 1766} {"train_loss": -23.099424362182617, "global_step": 146657, "epoch": 1766} {"train_loss": -22.947965621948242, "global_step": 146658, "epoch": 1766} {"train_loss": -23.29488182067871, "global_step": 146659, "epoch": 1766} {"train_loss": -23.15795886947448, "global_step": 146660, "epoch": 1766, "val_loss": 6313956.0} {"train_loss": -22.521957397460938, "global_step": 146661, "epoch": 1767} {"train_loss": -22.965116500854492, "global_step": 146662, "epoch": 1767} {"train_loss": -22.584972381591797, "global_step": 146663, "epoch": 1767} {"train_loss": -23.298309326171875, "global_step": 146664, "epoch": 1767} {"train_loss": -23.14689064025879, "global_step": 146665, "epoch": 1767} {"train_loss": -22.9290771484375, "global_step": 146666, "epoch": 1767} {"train_loss": -22.675373077392578, "global_step": 146667, "epoch": 1767} {"train_loss": -23.044736862182617, "global_step": 146668, "epoch": 1767} {"train_loss": -22.977426528930664, "global_step": 146669, "epoch": 1767} {"train_loss": -23.144216537475586, "global_step": 146670, "epoch": 1767} {"train_loss": -22.640897750854492, "global_step": 146671, "epoch": 1767} {"train_loss": -22.913724899291992, "global_step": 146672, "epoch": 1767} {"train_loss": -22.968896865844727, "global_step": 146673, "epoch": 1767} {"train_loss": -22.798419952392578, "global_step": 146674, "epoch": 1767} {"train_loss": -23.250473022460938, "global_step": 146675, "epoch": 1767} {"train_loss": -22.890417098999023, "global_step": 146676, "epoch": 1767} {"train_loss": -23.04085350036621, "global_step": 146677, "epoch": 1767} {"train_loss": -23.258495330810547, "global_step": 146678, "epoch": 1767} {"train_loss": -23.034818649291992, "global_step": 146679, "epoch": 1767} {"train_loss": -23.234373092651367, "global_step": 146680, "epoch": 1767} {"train_loss": -23.130722045898438, "global_step": 146681, "epoch": 1767} {"train_loss": -22.89910316467285, "global_step": 146682, "epoch": 1767} {"train_loss": -22.943374633789062, "global_step": 146683, "epoch": 1767} {"train_loss": -22.966638565063477, "global_step": 146684, "epoch": 1767} {"train_loss": -23.343582153320312, "global_step": 146685, "epoch": 1767} {"train_loss": -23.154205322265625, "global_step": 146686, "epoch": 1767} {"train_loss": -22.875280380249023, "global_step": 146687, "epoch": 1767} {"train_loss": -23.2890625, "global_step": 146688, "epoch": 1767} {"train_loss": -22.97568702697754, "global_step": 146689, "epoch": 1767} {"train_loss": -23.214134216308594, "global_step": 146690, "epoch": 1767} {"train_loss": -23.22068977355957, "global_step": 146691, "epoch": 1767} {"train_loss": -23.32687759399414, "global_step": 146692, "epoch": 1767} {"train_loss": -22.97385025024414, "global_step": 146693, "epoch": 1767} {"train_loss": -22.714740753173828, "global_step": 146694, "epoch": 1767} {"train_loss": -23.24285316467285, "global_step": 146695, "epoch": 1767} {"train_loss": -23.341188430786133, "global_step": 146696, "epoch": 1767} {"train_loss": -23.50162696838379, "global_step": 146697, "epoch": 1767} {"train_loss": -23.302892684936523, "global_step": 146698, "epoch": 1767} {"train_loss": -23.318117141723633, "global_step": 146699, "epoch": 1767} {"train_loss": -23.04193687438965, "global_step": 146700, "epoch": 1767} {"train_loss": -23.1484432220459, "global_step": 146701, "epoch": 1767} {"train_loss": -23.17866325378418, "global_step": 146702, "epoch": 1767} {"train_loss": -23.642967224121094, "global_step": 146703, "epoch": 1767} {"train_loss": -22.992801666259766, "global_step": 146704, "epoch": 1767} {"train_loss": -23.554264068603516, "global_step": 146705, "epoch": 1767} {"train_loss": -23.301973342895508, "global_step": 146706, "epoch": 1767} {"train_loss": -23.61267852783203, "global_step": 146707, "epoch": 1767} {"train_loss": -23.378393173217773, "global_step": 146708, "epoch": 1767} {"train_loss": -23.523244857788086, "global_step": 146709, "epoch": 1767} {"train_loss": -23.769636154174805, "global_step": 146710, "epoch": 1767} {"train_loss": -22.861099243164062, "global_step": 146711, "epoch": 1767} {"train_loss": -23.300107955932617, "global_step": 146712, "epoch": 1767} {"train_loss": -22.918792724609375, "global_step": 146713, "epoch": 1767} {"train_loss": -23.437849044799805, "global_step": 146714, "epoch": 1767} {"train_loss": -23.225481033325195, "global_step": 146715, "epoch": 1767} {"train_loss": -23.300724029541016, "global_step": 146716, "epoch": 1767} {"train_loss": -23.11102294921875, "global_step": 146717, "epoch": 1767} {"train_loss": -23.27132225036621, "global_step": 146718, "epoch": 1767} {"train_loss": -22.998050689697266, "global_step": 146719, "epoch": 1767} {"train_loss": -23.26629066467285, "global_step": 146720, "epoch": 1767} {"train_loss": -23.290987014770508, "global_step": 146721, "epoch": 1767} {"train_loss": -22.995540618896484, "global_step": 146722, "epoch": 1767} {"train_loss": -22.96125030517578, "global_step": 146723, "epoch": 1767} {"train_loss": -23.442752838134766, "global_step": 146724, "epoch": 1767} {"train_loss": -23.283554077148438, "global_step": 146725, "epoch": 1767} {"train_loss": -23.226072311401367, "global_step": 146726, "epoch": 1767} {"train_loss": -23.109264373779297, "global_step": 146727, "epoch": 1767} {"train_loss": -23.460174560546875, "global_step": 146728, "epoch": 1767} {"train_loss": -23.390005111694336, "global_step": 146729, "epoch": 1767} {"train_loss": -23.492116928100586, "global_step": 146730, "epoch": 1767} {"train_loss": -23.50994300842285, "global_step": 146731, "epoch": 1767} {"train_loss": -23.272693634033203, "global_step": 146732, "epoch": 1767} {"train_loss": -23.070600509643555, "global_step": 146733, "epoch": 1767} {"train_loss": -23.241806030273438, "global_step": 146734, "epoch": 1767} {"train_loss": -23.308347702026367, "global_step": 146735, "epoch": 1767} {"train_loss": -23.266263961791992, "global_step": 146736, "epoch": 1767} {"train_loss": -23.369882583618164, "global_step": 146737, "epoch": 1767} {"train_loss": -23.40794563293457, "global_step": 146738, "epoch": 1767} {"train_loss": -22.96430778503418, "global_step": 146739, "epoch": 1767} {"train_loss": -22.818571090698242, "global_step": 146740, "epoch": 1767} {"train_loss": -22.653108596801758, "global_step": 146741, "epoch": 1767} {"train_loss": -22.574003219604492, "global_step": 146742, "epoch": 1767} {"train_loss": -23.152401728802417, "global_step": 146743, "epoch": 1767, "val_loss": 6395975.0} {"train_loss": -21.822805404663086, "global_step": 146744, "epoch": 1768} {"train_loss": -22.687894821166992, "global_step": 146745, "epoch": 1768} {"train_loss": -21.922897338867188, "global_step": 146746, "epoch": 1768} {"train_loss": -22.339197158813477, "global_step": 146747, "epoch": 1768} {"train_loss": -21.82672691345215, "global_step": 146748, "epoch": 1768} {"train_loss": -22.318082809448242, "global_step": 146749, "epoch": 1768} {"train_loss": -21.90883445739746, "global_step": 146750, "epoch": 1768} {"train_loss": -22.499027252197266, "global_step": 146751, "epoch": 1768} {"train_loss": -22.108631134033203, "global_step": 146752, "epoch": 1768} {"train_loss": -22.21026039123535, "global_step": 146753, "epoch": 1768} {"train_loss": -22.730533599853516, "global_step": 146754, "epoch": 1768} {"train_loss": -22.71261978149414, "global_step": 146755, "epoch": 1768} {"train_loss": -22.348398208618164, "global_step": 146756, "epoch": 1768} {"train_loss": -22.302061080932617, "global_step": 146757, "epoch": 1768} {"train_loss": -22.47719383239746, "global_step": 146758, "epoch": 1768} {"train_loss": -22.100326538085938, "global_step": 146759, "epoch": 1768} {"train_loss": -22.73828125, "global_step": 146760, "epoch": 1768} {"train_loss": -22.357229232788086, "global_step": 146761, "epoch": 1768} {"train_loss": -23.049198150634766, "global_step": 146762, "epoch": 1768} {"train_loss": -22.800403594970703, "global_step": 146763, "epoch": 1768} {"train_loss": -23.154556274414062, "global_step": 146764, "epoch": 1768} {"train_loss": -22.713497161865234, "global_step": 146765, "epoch": 1768} {"train_loss": -22.777402877807617, "global_step": 146766, "epoch": 1768} {"train_loss": -22.747812271118164, "global_step": 146767, "epoch": 1768} {"train_loss": -23.055156707763672, "global_step": 146768, "epoch": 1768} {"train_loss": -23.08916664123535, "global_step": 146769, "epoch": 1768} {"train_loss": -22.727529525756836, "global_step": 146770, "epoch": 1768} {"train_loss": -23.015073776245117, "global_step": 146771, "epoch": 1768} {"train_loss": -23.06989860534668, "global_step": 146772, "epoch": 1768} {"train_loss": -22.593496322631836, "global_step": 146773, "epoch": 1768} {"train_loss": -22.4866943359375, "global_step": 146774, "epoch": 1768} {"train_loss": -23.023723602294922, "global_step": 146775, "epoch": 1768} {"train_loss": -22.89910888671875, "global_step": 146776, "epoch": 1768} {"train_loss": -22.842613220214844, "global_step": 146777, "epoch": 1768} {"train_loss": -22.90354347229004, "global_step": 146778, "epoch": 1768} {"train_loss": -22.954463958740234, "global_step": 146779, "epoch": 1768} {"train_loss": -23.290876388549805, "global_step": 146780, "epoch": 1768} {"train_loss": -23.37656593322754, "global_step": 146781, "epoch": 1768} {"train_loss": -23.30689811706543, "global_step": 146782, "epoch": 1768} {"train_loss": -23.290876388549805, "global_step": 146783, "epoch": 1768} {"train_loss": -23.1883602142334, "global_step": 146784, "epoch": 1768} {"train_loss": -23.377439498901367, "global_step": 146785, "epoch": 1768} {"train_loss": -22.880495071411133, "global_step": 146786, "epoch": 1768} {"train_loss": -23.118940353393555, "global_step": 146787, "epoch": 1768} {"train_loss": -23.054136276245117, "global_step": 146788, "epoch": 1768} {"train_loss": -22.841211318969727, "global_step": 146789, "epoch": 1768} {"train_loss": -23.509628295898438, "global_step": 146790, "epoch": 1768} {"train_loss": -23.09878921508789, "global_step": 146791, "epoch": 1768} {"train_loss": -23.205060958862305, "global_step": 146792, "epoch": 1768} {"train_loss": -23.479705810546875, "global_step": 146793, "epoch": 1768} {"train_loss": -23.411386489868164, "global_step": 146794, "epoch": 1768} {"train_loss": -22.90806007385254, "global_step": 146795, "epoch": 1768} {"train_loss": -23.42951011657715, "global_step": 146796, "epoch": 1768} {"train_loss": -23.16347312927246, "global_step": 146797, "epoch": 1768} {"train_loss": -23.16881561279297, "global_step": 146798, "epoch": 1768} {"train_loss": -23.3553466796875, "global_step": 146799, "epoch": 1768} {"train_loss": -23.21986198425293, "global_step": 146800, "epoch": 1768} {"train_loss": -23.251861572265625, "global_step": 146801, "epoch": 1768} {"train_loss": -23.18205451965332, "global_step": 146802, "epoch": 1768} {"train_loss": -23.33988380432129, "global_step": 146803, "epoch": 1768} {"train_loss": -22.959165573120117, "global_step": 146804, "epoch": 1768} {"train_loss": -23.2304630279541, "global_step": 146805, "epoch": 1768} {"train_loss": -23.13517189025879, "global_step": 146806, "epoch": 1768} {"train_loss": -23.059171676635742, "global_step": 146807, "epoch": 1768} {"train_loss": -23.120128631591797, "global_step": 146808, "epoch": 1768} {"train_loss": -23.291217803955078, "global_step": 146809, "epoch": 1768} {"train_loss": -23.293668746948242, "global_step": 146810, "epoch": 1768} {"train_loss": -23.043994903564453, "global_step": 146811, "epoch": 1768} {"train_loss": -23.030380249023438, "global_step": 146812, "epoch": 1768} {"train_loss": -23.16745376586914, "global_step": 146813, "epoch": 1768} {"train_loss": -22.99477767944336, "global_step": 146814, "epoch": 1768} {"train_loss": -23.276874542236328, "global_step": 146815, "epoch": 1768} {"train_loss": -23.131946563720703, "global_step": 146816, "epoch": 1768} {"train_loss": -23.313236236572266, "global_step": 146817, "epoch": 1768} {"train_loss": -22.91071319580078, "global_step": 146818, "epoch": 1768} {"train_loss": -23.434782028198242, "global_step": 146819, "epoch": 1768} {"train_loss": -23.61139678955078, "global_step": 146820, "epoch": 1768} {"train_loss": -23.12881088256836, "global_step": 146821, "epoch": 1768} {"train_loss": -23.62102508544922, "global_step": 146822, "epoch": 1768} {"train_loss": -23.301393508911133, "global_step": 146823, "epoch": 1768} {"train_loss": -22.890920639038086, "global_step": 146824, "epoch": 1768} {"train_loss": -23.396650314331055, "global_step": 146825, "epoch": 1768} {"train_loss": -22.934208192021014, "global_step": 146826, "epoch": 1768, "val_loss": 6291067.0} {"train_loss": -23.05006980895996, "global_step": 146827, "epoch": 1769} {"train_loss": -23.364526748657227, "global_step": 146828, "epoch": 1769} {"train_loss": -23.167266845703125, "global_step": 146829, "epoch": 1769} {"train_loss": -23.08576774597168, "global_step": 146830, "epoch": 1769} {"train_loss": -23.168912887573242, "global_step": 146831, "epoch": 1769} {"train_loss": -22.853147506713867, "global_step": 146832, "epoch": 1769} {"train_loss": -22.52943229675293, "global_step": 146833, "epoch": 1769} {"train_loss": -22.2824764251709, "global_step": 146834, "epoch": 1769} {"train_loss": -22.975784301757812, "global_step": 146835, "epoch": 1769} {"train_loss": -22.618024826049805, "global_step": 146836, "epoch": 1769} {"train_loss": -22.489086151123047, "global_step": 146837, "epoch": 1769} {"train_loss": -23.18617057800293, "global_step": 146838, "epoch": 1769} {"train_loss": -22.755613327026367, "global_step": 146839, "epoch": 1769} {"train_loss": -23.16757583618164, "global_step": 146840, "epoch": 1769} {"train_loss": -22.80640411376953, "global_step": 146841, "epoch": 1769} {"train_loss": -22.982053756713867, "global_step": 146842, "epoch": 1769} {"train_loss": -22.799625396728516, "global_step": 146843, "epoch": 1769} {"train_loss": -22.764692306518555, "global_step": 146844, "epoch": 1769} {"train_loss": -22.935842514038086, "global_step": 146845, "epoch": 1769} {"train_loss": -23.022790908813477, "global_step": 146846, "epoch": 1769} {"train_loss": -23.14972686767578, "global_step": 146847, "epoch": 1769} {"train_loss": -22.86640167236328, "global_step": 146848, "epoch": 1769} {"train_loss": -23.20782470703125, "global_step": 146849, "epoch": 1769} {"train_loss": -22.9705810546875, "global_step": 146850, "epoch": 1769} {"train_loss": -23.331884384155273, "global_step": 146851, "epoch": 1769} {"train_loss": -23.244909286499023, "global_step": 146852, "epoch": 1769} {"train_loss": -23.385854721069336, "global_step": 146853, "epoch": 1769} {"train_loss": -23.049360275268555, "global_step": 146854, "epoch": 1769} {"train_loss": -23.002647399902344, "global_step": 146855, "epoch": 1769} {"train_loss": -23.024749755859375, "global_step": 146856, "epoch": 1769} {"train_loss": -23.183218002319336, "global_step": 146857, "epoch": 1769} {"train_loss": -23.433658599853516, "global_step": 146858, "epoch": 1769} {"train_loss": -23.3494930267334, "global_step": 146859, "epoch": 1769} {"train_loss": -23.1323299407959, "global_step": 146860, "epoch": 1769} {"train_loss": -23.063432693481445, "global_step": 146861, "epoch": 1769} {"train_loss": -23.088054656982422, "global_step": 146862, "epoch": 1769} {"train_loss": -23.154836654663086, "global_step": 146863, "epoch": 1769} {"train_loss": -23.34186363220215, "global_step": 146864, "epoch": 1769} {"train_loss": -23.25946617126465, "global_step": 146865, "epoch": 1769} {"train_loss": -23.046966552734375, "global_step": 146866, "epoch": 1769} {"train_loss": -23.104406356811523, "global_step": 146867, "epoch": 1769} {"train_loss": -22.98982810974121, "global_step": 146868, "epoch": 1769} {"train_loss": -23.342737197875977, "global_step": 146869, "epoch": 1769} {"train_loss": -23.391212463378906, "global_step": 146870, "epoch": 1769} {"train_loss": -23.058292388916016, "global_step": 146871, "epoch": 1769} {"train_loss": -23.284156799316406, "global_step": 146872, "epoch": 1769} {"train_loss": -23.35789680480957, "global_step": 146873, "epoch": 1769} {"train_loss": -23.105558395385742, "global_step": 146874, "epoch": 1769} {"train_loss": -23.139944076538086, "global_step": 146875, "epoch": 1769} {"train_loss": -23.068988800048828, "global_step": 146876, "epoch": 1769} {"train_loss": -23.15454864501953, "global_step": 146877, "epoch": 1769} {"train_loss": -23.058740615844727, "global_step": 146878, "epoch": 1769} {"train_loss": -23.088764190673828, "global_step": 146879, "epoch": 1769} {"train_loss": -23.499107360839844, "global_step": 146880, "epoch": 1769} {"train_loss": -23.5102596282959, "global_step": 146881, "epoch": 1769} {"train_loss": -23.647367477416992, "global_step": 146882, "epoch": 1769} {"train_loss": -23.405820846557617, "global_step": 146883, "epoch": 1769} {"train_loss": -23.372325897216797, "global_step": 146884, "epoch": 1769} {"train_loss": -23.32691764831543, "global_step": 146885, "epoch": 1769} {"train_loss": -23.12035369873047, "global_step": 146886, "epoch": 1769} {"train_loss": -23.342939376831055, "global_step": 146887, "epoch": 1769} {"train_loss": -23.268381118774414, "global_step": 146888, "epoch": 1769} {"train_loss": -23.11714744567871, "global_step": 146889, "epoch": 1769} {"train_loss": -23.421234130859375, "global_step": 146890, "epoch": 1769} {"train_loss": -23.32801055908203, "global_step": 146891, "epoch": 1769} {"train_loss": -23.30006980895996, "global_step": 146892, "epoch": 1769} {"train_loss": -23.365070343017578, "global_step": 146893, "epoch": 1769} {"train_loss": -23.214384078979492, "global_step": 146894, "epoch": 1769} {"train_loss": -23.446094512939453, "global_step": 146895, "epoch": 1769} {"train_loss": -23.48874855041504, "global_step": 146896, "epoch": 1769} {"train_loss": -23.190526962280273, "global_step": 146897, "epoch": 1769} {"train_loss": -23.241193771362305, "global_step": 146898, "epoch": 1769} {"train_loss": -23.26173973083496, "global_step": 146899, "epoch": 1769} {"train_loss": -23.122629165649414, "global_step": 146900, "epoch": 1769} {"train_loss": -23.485340118408203, "global_step": 146901, "epoch": 1769} {"train_loss": -23.51726531982422, "global_step": 146902, "epoch": 1769} {"train_loss": -23.32309341430664, "global_step": 146903, "epoch": 1769} {"train_loss": -23.082962036132812, "global_step": 146904, "epoch": 1769} {"train_loss": -23.618953704833984, "global_step": 146905, "epoch": 1769} {"train_loss": -23.53323745727539, "global_step": 146906, "epoch": 1769} {"train_loss": -23.374526977539062, "global_step": 146907, "epoch": 1769} {"train_loss": -23.381107330322266, "global_step": 146908, "epoch": 1769} {"train_loss": -23.155174140470574, "global_step": 146909, "epoch": 1769, "val_loss": 6326494.0} {"train_loss": -23.0638427734375, "global_step": 146910, "epoch": 1770} {"train_loss": -22.611082077026367, "global_step": 146911, "epoch": 1770} {"train_loss": -22.89571189880371, "global_step": 146912, "epoch": 1770} {"train_loss": -23.17657470703125, "global_step": 146913, "epoch": 1770} {"train_loss": -22.747716903686523, "global_step": 146914, "epoch": 1770} {"train_loss": -22.85919761657715, "global_step": 146915, "epoch": 1770} {"train_loss": -22.891904830932617, "global_step": 146916, "epoch": 1770} {"train_loss": -23.462554931640625, "global_step": 146917, "epoch": 1770} {"train_loss": -22.799015045166016, "global_step": 146918, "epoch": 1770} {"train_loss": -22.718307495117188, "global_step": 146919, "epoch": 1770} {"train_loss": -22.754199981689453, "global_step": 146920, "epoch": 1770} {"train_loss": -23.459945678710938, "global_step": 146921, "epoch": 1770} {"train_loss": -23.079139709472656, "global_step": 146922, "epoch": 1770} {"train_loss": -23.158109664916992, "global_step": 146923, "epoch": 1770} {"train_loss": -22.97344207763672, "global_step": 146924, "epoch": 1770} {"train_loss": -23.435232162475586, "global_step": 146925, "epoch": 1770} {"train_loss": -23.14898109436035, "global_step": 146926, "epoch": 1770} {"train_loss": -23.0081729888916, "global_step": 146927, "epoch": 1770} {"train_loss": -23.150800704956055, "global_step": 146928, "epoch": 1770} {"train_loss": -23.577573776245117, "global_step": 146929, "epoch": 1770} {"train_loss": -23.197263717651367, "global_step": 146930, "epoch": 1770} {"train_loss": -22.998037338256836, "global_step": 146931, "epoch": 1770} {"train_loss": -23.288320541381836, "global_step": 146932, "epoch": 1770} {"train_loss": -23.21999168395996, "global_step": 146933, "epoch": 1770} {"train_loss": -23.30923843383789, "global_step": 146934, "epoch": 1770} {"train_loss": -23.232494354248047, "global_step": 146935, "epoch": 1770} {"train_loss": -23.092958450317383, "global_step": 146936, "epoch": 1770} {"train_loss": -23.08930778503418, "global_step": 146937, "epoch": 1770} {"train_loss": -23.01108741760254, "global_step": 146938, "epoch": 1770} {"train_loss": -23.342920303344727, "global_step": 146939, "epoch": 1770} {"train_loss": -23.192224502563477, "global_step": 146940, "epoch": 1770} {"train_loss": -23.52988624572754, "global_step": 146941, "epoch": 1770} {"train_loss": -22.954545974731445, "global_step": 146942, "epoch": 1770} {"train_loss": -23.325607299804688, "global_step": 146943, "epoch": 1770} {"train_loss": -23.274574279785156, "global_step": 146944, "epoch": 1770} {"train_loss": -23.22246742248535, "global_step": 146945, "epoch": 1770} {"train_loss": -23.38929557800293, "global_step": 146946, "epoch": 1770} {"train_loss": -23.252822875976562, "global_step": 146947, "epoch": 1770} {"train_loss": -22.916101455688477, "global_step": 146948, "epoch": 1770} {"train_loss": -23.406681060791016, "global_step": 146949, "epoch": 1770} {"train_loss": -23.465984344482422, "global_step": 146950, "epoch": 1770} {"train_loss": -23.34418487548828, "global_step": 146951, "epoch": 1770} {"train_loss": -23.064697265625, "global_step": 146952, "epoch": 1770} {"train_loss": -23.033655166625977, "global_step": 146953, "epoch": 1770} {"train_loss": -23.039573669433594, "global_step": 146954, "epoch": 1770} {"train_loss": -22.90150260925293, "global_step": 146955, "epoch": 1770} {"train_loss": -23.109683990478516, "global_step": 146956, "epoch": 1770} {"train_loss": -23.161996841430664, "global_step": 146957, "epoch": 1770} {"train_loss": -23.2598934173584, "global_step": 146958, "epoch": 1770} {"train_loss": -23.01838493347168, "global_step": 146959, "epoch": 1770} {"train_loss": -23.31111717224121, "global_step": 146960, "epoch": 1770} {"train_loss": -23.183326721191406, "global_step": 146961, "epoch": 1770} {"train_loss": -23.611774444580078, "global_step": 146962, "epoch": 1770} {"train_loss": -23.1720027923584, "global_step": 146963, "epoch": 1770} {"train_loss": -23.102231979370117, "global_step": 146964, "epoch": 1770} {"train_loss": -23.293630599975586, "global_step": 146965, "epoch": 1770} {"train_loss": -23.43869400024414, "global_step": 146966, "epoch": 1770} {"train_loss": -23.215829849243164, "global_step": 146967, "epoch": 1770} {"train_loss": -23.354835510253906, "global_step": 146968, "epoch": 1770} {"train_loss": -23.682029724121094, "global_step": 146969, "epoch": 1770} {"train_loss": -23.15692710876465, "global_step": 146970, "epoch": 1770} {"train_loss": -23.144704818725586, "global_step": 146971, "epoch": 1770} {"train_loss": -23.27175521850586, "global_step": 146972, "epoch": 1770} {"train_loss": -23.29701042175293, "global_step": 146973, "epoch": 1770} {"train_loss": -23.096216201782227, "global_step": 146974, "epoch": 1770} {"train_loss": -22.923620223999023, "global_step": 146975, "epoch": 1770} {"train_loss": -23.199684143066406, "global_step": 146976, "epoch": 1770} {"train_loss": -22.803678512573242, "global_step": 146977, "epoch": 1770} {"train_loss": -22.668792724609375, "global_step": 146978, "epoch": 1770} {"train_loss": -22.974336624145508, "global_step": 146979, "epoch": 1770} {"train_loss": -23.346179962158203, "global_step": 146980, "epoch": 1770} {"train_loss": -23.215299606323242, "global_step": 146981, "epoch": 1770} {"train_loss": -23.4552001953125, "global_step": 146982, "epoch": 1770} {"train_loss": -22.87483787536621, "global_step": 146983, "epoch": 1770} {"train_loss": -22.998432159423828, "global_step": 146984, "epoch": 1770} {"train_loss": -23.184629440307617, "global_step": 146985, "epoch": 1770} {"train_loss": -23.2901668548584, "global_step": 146986, "epoch": 1770} {"train_loss": -23.420520782470703, "global_step": 146987, "epoch": 1770} {"train_loss": -22.964750289916992, "global_step": 146988, "epoch": 1770} {"train_loss": -23.4101505279541, "global_step": 146989, "epoch": 1770} {"train_loss": -22.987186431884766, "global_step": 146990, "epoch": 1770} {"train_loss": -23.165237426757812, "global_step": 146991, "epoch": 1770} {"train_loss": -23.15481043436441, "global_step": 146992, "epoch": 1770, "val_loss": 6349477.0} {"train_loss": -23.018308639526367, "global_step": 146993, "epoch": 1771} {"train_loss": -22.88015365600586, "global_step": 146994, "epoch": 1771} {"train_loss": -23.049095153808594, "global_step": 146995, "epoch": 1771} {"train_loss": -23.10659408569336, "global_step": 146996, "epoch": 1771} {"train_loss": -23.18316650390625, "global_step": 146997, "epoch": 1771} {"train_loss": -22.99921989440918, "global_step": 146998, "epoch": 1771} {"train_loss": -23.007280349731445, "global_step": 146999, "epoch": 1771} {"train_loss": -23.23459815979004, "global_step": 147000, "epoch": 1771} {"train_loss": -23.245384216308594, "global_step": 147001, "epoch": 1771} {"train_loss": -23.070363998413086, "global_step": 147002, "epoch": 1771} {"train_loss": -22.889556884765625, "global_step": 147003, "epoch": 1771} {"train_loss": -23.272254943847656, "global_step": 147004, "epoch": 1771} {"train_loss": -23.32804298400879, "global_step": 147005, "epoch": 1771} {"train_loss": -23.29498291015625, "global_step": 147006, "epoch": 1771} {"train_loss": -23.39510154724121, "global_step": 147007, "epoch": 1771} {"train_loss": -23.130939483642578, "global_step": 147008, "epoch": 1771} {"train_loss": -23.080888748168945, "global_step": 147009, "epoch": 1771} {"train_loss": -22.948579788208008, "global_step": 147010, "epoch": 1771} {"train_loss": -23.1561336517334, "global_step": 147011, "epoch": 1771} {"train_loss": -23.380273818969727, "global_step": 147012, "epoch": 1771} {"train_loss": -22.91412925720215, "global_step": 147013, "epoch": 1771} {"train_loss": -23.184364318847656, "global_step": 147014, "epoch": 1771} {"train_loss": -23.0563907623291, "global_step": 147015, "epoch": 1771} {"train_loss": -22.97028160095215, "global_step": 147016, "epoch": 1771} {"train_loss": -23.049222946166992, "global_step": 147017, "epoch": 1771} {"train_loss": -23.05369758605957, "global_step": 147018, "epoch": 1771} {"train_loss": -22.989282608032227, "global_step": 147019, "epoch": 1771} {"train_loss": -23.121606826782227, "global_step": 147020, "epoch": 1771} {"train_loss": -23.086172103881836, "global_step": 147021, "epoch": 1771} {"train_loss": -23.320144653320312, "global_step": 147022, "epoch": 1771} {"train_loss": -23.11155128479004, "global_step": 147023, "epoch": 1771} {"train_loss": -22.919170379638672, "global_step": 147024, "epoch": 1771} {"train_loss": -23.674524307250977, "global_step": 147025, "epoch": 1771} {"train_loss": -22.915945053100586, "global_step": 147026, "epoch": 1771} {"train_loss": -23.201093673706055, "global_step": 147027, "epoch": 1771} {"train_loss": -23.552669525146484, "global_step": 147028, "epoch": 1771} {"train_loss": -23.069406509399414, "global_step": 147029, "epoch": 1771} {"train_loss": -23.483596801757812, "global_step": 147030, "epoch": 1771} {"train_loss": -23.377105712890625, "global_step": 147031, "epoch": 1771} {"train_loss": -23.304670333862305, "global_step": 147032, "epoch": 1771} {"train_loss": -23.539400100708008, "global_step": 147033, "epoch": 1771} {"train_loss": -23.435678482055664, "global_step": 147034, "epoch": 1771} {"train_loss": -23.45802879333496, "global_step": 147035, "epoch": 1771} {"train_loss": -23.401464462280273, "global_step": 147036, "epoch": 1771} {"train_loss": -22.843307495117188, "global_step": 147037, "epoch": 1771} {"train_loss": -23.18404197692871, "global_step": 147038, "epoch": 1771} {"train_loss": -22.91863441467285, "global_step": 147039, "epoch": 1771} {"train_loss": -23.395273208618164, "global_step": 147040, "epoch": 1771} {"train_loss": -23.464012145996094, "global_step": 147041, "epoch": 1771} {"train_loss": -23.033767700195312, "global_step": 147042, "epoch": 1771} {"train_loss": -23.2392578125, "global_step": 147043, "epoch": 1771} {"train_loss": -23.09119987487793, "global_step": 147044, "epoch": 1771} {"train_loss": -22.79347801208496, "global_step": 147045, "epoch": 1771} {"train_loss": -23.2270565032959, "global_step": 147046, "epoch": 1771} {"train_loss": -22.856014251708984, "global_step": 147047, "epoch": 1771} {"train_loss": -23.30286979675293, "global_step": 147048, "epoch": 1771} {"train_loss": -23.072368621826172, "global_step": 147049, "epoch": 1771} {"train_loss": -23.116262435913086, "global_step": 147050, "epoch": 1771} {"train_loss": -23.166637420654297, "global_step": 147051, "epoch": 1771} {"train_loss": -23.21076202392578, "global_step": 147052, "epoch": 1771} {"train_loss": -23.112531661987305, "global_step": 147053, "epoch": 1771} {"train_loss": -23.3268985748291, "global_step": 147054, "epoch": 1771} {"train_loss": -23.517715454101562, "global_step": 147055, "epoch": 1771} {"train_loss": -22.931602478027344, "global_step": 147056, "epoch": 1771} {"train_loss": -23.608112335205078, "global_step": 147057, "epoch": 1771} {"train_loss": -23.45075798034668, "global_step": 147058, "epoch": 1771} {"train_loss": -23.125974655151367, "global_step": 147059, "epoch": 1771} {"train_loss": -22.789060592651367, "global_step": 147060, "epoch": 1771} {"train_loss": -23.28358268737793, "global_step": 147061, "epoch": 1771} {"train_loss": -23.318668365478516, "global_step": 147062, "epoch": 1771} {"train_loss": -23.35084342956543, "global_step": 147063, "epoch": 1771} {"train_loss": -22.803712844848633, "global_step": 147064, "epoch": 1771} {"train_loss": -23.132352828979492, "global_step": 147065, "epoch": 1771} {"train_loss": -23.28519630432129, "global_step": 147066, "epoch": 1771} {"train_loss": -23.510648727416992, "global_step": 147067, "epoch": 1771} {"train_loss": -23.253337860107422, "global_step": 147068, "epoch": 1771} {"train_loss": -23.543153762817383, "global_step": 147069, "epoch": 1771} {"train_loss": -23.241195678710938, "global_step": 147070, "epoch": 1771} {"train_loss": -23.06328582763672, "global_step": 147071, "epoch": 1771} {"train_loss": -23.361347198486328, "global_step": 147072, "epoch": 1771} {"train_loss": -23.047393798828125, "global_step": 147073, "epoch": 1771} {"train_loss": -23.621631622314453, "global_step": 147074, "epoch": 1771} {"train_loss": -23.191899471972363, "global_step": 147075, "epoch": 1771, "val_loss": 6337512.0} {"train_loss": -22.917139053344727, "global_step": 147076, "epoch": 1772} {"train_loss": -22.828744888305664, "global_step": 147077, "epoch": 1772} {"train_loss": -23.335418701171875, "global_step": 147078, "epoch": 1772} {"train_loss": -22.692604064941406, "global_step": 147079, "epoch": 1772} {"train_loss": -22.936315536499023, "global_step": 147080, "epoch": 1772} {"train_loss": -22.856124877929688, "global_step": 147081, "epoch": 1772} {"train_loss": -22.7164363861084, "global_step": 147082, "epoch": 1772} {"train_loss": -22.959287643432617, "global_step": 147083, "epoch": 1772} {"train_loss": -23.001001358032227, "global_step": 147084, "epoch": 1772} {"train_loss": -22.780553817749023, "global_step": 147085, "epoch": 1772} {"train_loss": -22.888010025024414, "global_step": 147086, "epoch": 1772} {"train_loss": -22.55397605895996, "global_step": 147087, "epoch": 1772} {"train_loss": -22.90960121154785, "global_step": 147088, "epoch": 1772} {"train_loss": -22.847684860229492, "global_step": 147089, "epoch": 1772} {"train_loss": -23.0685977935791, "global_step": 147090, "epoch": 1772} {"train_loss": -22.66411018371582, "global_step": 147091, "epoch": 1772} {"train_loss": -23.08957862854004, "global_step": 147092, "epoch": 1772} {"train_loss": -22.868885040283203, "global_step": 147093, "epoch": 1772} {"train_loss": -22.853784561157227, "global_step": 147094, "epoch": 1772} {"train_loss": -23.48563003540039, "global_step": 147095, "epoch": 1772} {"train_loss": -22.811552047729492, "global_step": 147096, "epoch": 1772} {"train_loss": -23.06166648864746, "global_step": 147097, "epoch": 1772} {"train_loss": -22.954082489013672, "global_step": 147098, "epoch": 1772} {"train_loss": -22.808706283569336, "global_step": 147099, "epoch": 1772} {"train_loss": -23.096044540405273, "global_step": 147100, "epoch": 1772} {"train_loss": -23.395944595336914, "global_step": 147101, "epoch": 1772} {"train_loss": -23.036733627319336, "global_step": 147102, "epoch": 1772} {"train_loss": -23.094369888305664, "global_step": 147103, "epoch": 1772} {"train_loss": -22.98566246032715, "global_step": 147104, "epoch": 1772} {"train_loss": -23.043058395385742, "global_step": 147105, "epoch": 1772} {"train_loss": -23.391830444335938, "global_step": 147106, "epoch": 1772} {"train_loss": -23.08260154724121, "global_step": 147107, "epoch": 1772} {"train_loss": -23.342016220092773, "global_step": 147108, "epoch": 1772} {"train_loss": -23.10799217224121, "global_step": 147109, "epoch": 1772} {"train_loss": -23.425037384033203, "global_step": 147110, "epoch": 1772} {"train_loss": -23.140371322631836, "global_step": 147111, "epoch": 1772} {"train_loss": -23.085494995117188, "global_step": 147112, "epoch": 1772} {"train_loss": -23.13578224182129, "global_step": 147113, "epoch": 1772} {"train_loss": -23.409162521362305, "global_step": 147114, "epoch": 1772} {"train_loss": -23.707178115844727, "global_step": 147115, "epoch": 1772} {"train_loss": -23.1639347076416, "global_step": 147116, "epoch": 1772} {"train_loss": -23.426313400268555, "global_step": 147117, "epoch": 1772} {"train_loss": -23.38075065612793, "global_step": 147118, "epoch": 1772} {"train_loss": -22.565263748168945, "global_step": 147119, "epoch": 1772} {"train_loss": -23.263446807861328, "global_step": 147120, "epoch": 1772} {"train_loss": -23.172922134399414, "global_step": 147121, "epoch": 1772} {"train_loss": -23.09807014465332, "global_step": 147122, "epoch": 1772} {"train_loss": -23.59134864807129, "global_step": 147123, "epoch": 1772} {"train_loss": -23.170761108398438, "global_step": 147124, "epoch": 1772} {"train_loss": -23.546220779418945, "global_step": 147125, "epoch": 1772} {"train_loss": -23.19087791442871, "global_step": 147126, "epoch": 1772} {"train_loss": -23.241500854492188, "global_step": 147127, "epoch": 1772} {"train_loss": -23.5666561126709, "global_step": 147128, "epoch": 1772} {"train_loss": -23.073640823364258, "global_step": 147129, "epoch": 1772} {"train_loss": -23.224878311157227, "global_step": 147130, "epoch": 1772} {"train_loss": -23.37978744506836, "global_step": 147131, "epoch": 1772} {"train_loss": -22.93829917907715, "global_step": 147132, "epoch": 1772} {"train_loss": -23.455768585205078, "global_step": 147133, "epoch": 1772} {"train_loss": -23.22225570678711, "global_step": 147134, "epoch": 1772} {"train_loss": -22.997711181640625, "global_step": 147135, "epoch": 1772} {"train_loss": -23.41171646118164, "global_step": 147136, "epoch": 1772} {"train_loss": -22.903230667114258, "global_step": 147137, "epoch": 1772} {"train_loss": -22.96595573425293, "global_step": 147138, "epoch": 1772} {"train_loss": -23.12666130065918, "global_step": 147139, "epoch": 1772} {"train_loss": -23.204328536987305, "global_step": 147140, "epoch": 1772} {"train_loss": -23.05226707458496, "global_step": 147141, "epoch": 1772} {"train_loss": -23.137754440307617, "global_step": 147142, "epoch": 1772} {"train_loss": -23.4005184173584, "global_step": 147143, "epoch": 1772} {"train_loss": -23.248937606811523, "global_step": 147144, "epoch": 1772} {"train_loss": -23.33298110961914, "global_step": 147145, "epoch": 1772} {"train_loss": -22.85235023498535, "global_step": 147146, "epoch": 1772} {"train_loss": -23.141759872436523, "global_step": 147147, "epoch": 1772} {"train_loss": -23.611042022705078, "global_step": 147148, "epoch": 1772} {"train_loss": -23.21881675720215, "global_step": 147149, "epoch": 1772} {"train_loss": -22.793903350830078, "global_step": 147150, "epoch": 1772} {"train_loss": -23.495588302612305, "global_step": 147151, "epoch": 1772} {"train_loss": -23.184741973876953, "global_step": 147152, "epoch": 1772} {"train_loss": -23.56800651550293, "global_step": 147153, "epoch": 1772} {"train_loss": -23.327260971069336, "global_step": 147154, "epoch": 1772} {"train_loss": -23.163654327392578, "global_step": 147155, "epoch": 1772} {"train_loss": -23.52029800415039, "global_step": 147156, "epoch": 1772} {"train_loss": -23.10455894470215, "global_step": 147157, "epoch": 1772} {"train_loss": -23.11821815766484, "global_step": 147158, "epoch": 1772, "val_loss": 6413693.5} {"train_loss": -23.143686294555664, "global_step": 147159, "epoch": 1773} {"train_loss": -22.49625587463379, "global_step": 147160, "epoch": 1773} {"train_loss": -22.281431198120117, "global_step": 147161, "epoch": 1773} {"train_loss": -23.12079429626465, "global_step": 147162, "epoch": 1773} {"train_loss": -23.035444259643555, "global_step": 147163, "epoch": 1773} {"train_loss": -22.884510040283203, "global_step": 147164, "epoch": 1773} {"train_loss": -22.916732788085938, "global_step": 147165, "epoch": 1773} {"train_loss": -22.821653366088867, "global_step": 147166, "epoch": 1773} {"train_loss": -23.14373207092285, "global_step": 147167, "epoch": 1773} {"train_loss": -22.914878845214844, "global_step": 147168, "epoch": 1773} {"train_loss": -22.99409294128418, "global_step": 147169, "epoch": 1773} {"train_loss": -23.13282012939453, "global_step": 147170, "epoch": 1773} {"train_loss": -23.2720947265625, "global_step": 147171, "epoch": 1773} {"train_loss": -23.142446517944336, "global_step": 147172, "epoch": 1773} {"train_loss": -23.355886459350586, "global_step": 147173, "epoch": 1773} {"train_loss": -23.213815689086914, "global_step": 147174, "epoch": 1773} {"train_loss": -22.915786743164062, "global_step": 147175, "epoch": 1773} {"train_loss": -23.202863693237305, "global_step": 147176, "epoch": 1773} {"train_loss": -22.744037628173828, "global_step": 147177, "epoch": 1773} {"train_loss": -23.053089141845703, "global_step": 147178, "epoch": 1773} {"train_loss": -22.97757339477539, "global_step": 147179, "epoch": 1773} {"train_loss": -23.28973960876465, "global_step": 147180, "epoch": 1773} {"train_loss": -23.127033233642578, "global_step": 147181, "epoch": 1773} {"train_loss": -23.0172119140625, "global_step": 147182, "epoch": 1773} {"train_loss": -22.95094108581543, "global_step": 147183, "epoch": 1773} {"train_loss": -23.138935089111328, "global_step": 147184, "epoch": 1773} {"train_loss": -23.370298385620117, "global_step": 147185, "epoch": 1773} {"train_loss": -23.10257911682129, "global_step": 147186, "epoch": 1773} {"train_loss": -23.006317138671875, "global_step": 147187, "epoch": 1773} {"train_loss": -23.13629722595215, "global_step": 147188, "epoch": 1773} {"train_loss": -23.365739822387695, "global_step": 147189, "epoch": 1773} {"train_loss": -23.11933135986328, "global_step": 147190, "epoch": 1773} {"train_loss": -23.41718101501465, "global_step": 147191, "epoch": 1773} {"train_loss": -22.824689865112305, "global_step": 147192, "epoch": 1773} {"train_loss": -22.9125919342041, "global_step": 147193, "epoch": 1773} {"train_loss": -23.414365768432617, "global_step": 147194, "epoch": 1773} {"train_loss": -23.1778621673584, "global_step": 147195, "epoch": 1773} {"train_loss": -23.08138084411621, "global_step": 147196, "epoch": 1773} {"train_loss": -23.04804039001465, "global_step": 147197, "epoch": 1773} {"train_loss": -23.23476791381836, "global_step": 147198, "epoch": 1773} {"train_loss": -23.15573501586914, "global_step": 147199, "epoch": 1773} {"train_loss": -23.31594467163086, "global_step": 147200, "epoch": 1773} {"train_loss": -23.091032028198242, "global_step": 147201, "epoch": 1773} {"train_loss": -23.06574821472168, "global_step": 147202, "epoch": 1773} {"train_loss": -23.350299835205078, "global_step": 147203, "epoch": 1773} {"train_loss": -23.176748275756836, "global_step": 147204, "epoch": 1773} {"train_loss": -23.417348861694336, "global_step": 147205, "epoch": 1773} {"train_loss": -23.36639976501465, "global_step": 147206, "epoch": 1773} {"train_loss": -23.02457618713379, "global_step": 147207, "epoch": 1773} {"train_loss": -23.20768928527832, "global_step": 147208, "epoch": 1773} {"train_loss": -23.13714027404785, "global_step": 147209, "epoch": 1773} {"train_loss": -23.50930404663086, "global_step": 147210, "epoch": 1773} {"train_loss": -23.526813507080078, "global_step": 147211, "epoch": 1773} {"train_loss": -23.19336700439453, "global_step": 147212, "epoch": 1773} {"train_loss": -23.39761734008789, "global_step": 147213, "epoch": 1773} {"train_loss": -23.1463680267334, "global_step": 147214, "epoch": 1773} {"train_loss": -23.575454711914062, "global_step": 147215, "epoch": 1773} {"train_loss": -23.425931930541992, "global_step": 147216, "epoch": 1773} {"train_loss": -23.083736419677734, "global_step": 147217, "epoch": 1773} {"train_loss": -23.57098960876465, "global_step": 147218, "epoch": 1773} {"train_loss": -23.306467056274414, "global_step": 147219, "epoch": 1773} {"train_loss": -23.621891021728516, "global_step": 147220, "epoch": 1773} {"train_loss": -23.21746063232422, "global_step": 147221, "epoch": 1773} {"train_loss": -23.519309997558594, "global_step": 147222, "epoch": 1773} {"train_loss": -23.689218521118164, "global_step": 147223, "epoch": 1773} {"train_loss": -23.10699462890625, "global_step": 147224, "epoch": 1773} {"train_loss": -23.333913803100586, "global_step": 147225, "epoch": 1773} {"train_loss": -23.156383514404297, "global_step": 147226, "epoch": 1773} {"train_loss": -22.881324768066406, "global_step": 147227, "epoch": 1773} {"train_loss": -23.1331787109375, "global_step": 147228, "epoch": 1773} {"train_loss": -23.571535110473633, "global_step": 147229, "epoch": 1773} {"train_loss": -23.597702026367188, "global_step": 147230, "epoch": 1773} {"train_loss": -23.509288787841797, "global_step": 147231, "epoch": 1773} {"train_loss": -23.12782859802246, "global_step": 147232, "epoch": 1773} {"train_loss": -22.917987823486328, "global_step": 147233, "epoch": 1773} {"train_loss": -23.025484085083008, "global_step": 147234, "epoch": 1773} {"train_loss": -23.25900650024414, "global_step": 147235, "epoch": 1773} {"train_loss": -23.556339263916016, "global_step": 147236, "epoch": 1773} {"train_loss": -23.463232040405273, "global_step": 147237, "epoch": 1773} {"train_loss": -23.414615631103516, "global_step": 147238, "epoch": 1773} {"train_loss": -23.794857025146484, "global_step": 147239, "epoch": 1773} {"train_loss": -23.095596313476562, "global_step": 147240, "epoch": 1773} {"train_loss": -23.210518250982446, "global_step": 147241, "epoch": 1773, "val_loss": 6317413.0} {"train_loss": -21.496278762817383, "global_step": 147242, "epoch": 1774} {"train_loss": -21.481365203857422, "global_step": 147243, "epoch": 1774} {"train_loss": -22.720434188842773, "global_step": 147244, "epoch": 1774} {"train_loss": -21.989850997924805, "global_step": 147245, "epoch": 1774} {"train_loss": -22.365009307861328, "global_step": 147246, "epoch": 1774} {"train_loss": -22.639205932617188, "global_step": 147247, "epoch": 1774} {"train_loss": -22.27298355102539, "global_step": 147248, "epoch": 1774} {"train_loss": -22.76824378967285, "global_step": 147249, "epoch": 1774} {"train_loss": -22.267484664916992, "global_step": 147250, "epoch": 1774} {"train_loss": -22.782087326049805, "global_step": 147251, "epoch": 1774} {"train_loss": -22.517560958862305, "global_step": 147252, "epoch": 1774} {"train_loss": -22.45004653930664, "global_step": 147253, "epoch": 1774} {"train_loss": -22.501285552978516, "global_step": 147254, "epoch": 1774} {"train_loss": -22.68055534362793, "global_step": 147255, "epoch": 1774} {"train_loss": -22.786603927612305, "global_step": 147256, "epoch": 1774} {"train_loss": -22.419523239135742, "global_step": 147257, "epoch": 1774} {"train_loss": -22.568368911743164, "global_step": 147258, "epoch": 1774} {"train_loss": -22.589691162109375, "global_step": 147259, "epoch": 1774} {"train_loss": -22.89521598815918, "global_step": 147260, "epoch": 1774} {"train_loss": -22.992494583129883, "global_step": 147261, "epoch": 1774} {"train_loss": -23.04743766784668, "global_step": 147262, "epoch": 1774} {"train_loss": -22.885223388671875, "global_step": 147263, "epoch": 1774} {"train_loss": -22.963275909423828, "global_step": 147264, "epoch": 1774} {"train_loss": -22.796070098876953, "global_step": 147265, "epoch": 1774} {"train_loss": -22.86531639099121, "global_step": 147266, "epoch": 1774} {"train_loss": -22.672813415527344, "global_step": 147267, "epoch": 1774} {"train_loss": -22.819814682006836, "global_step": 147268, "epoch": 1774} {"train_loss": -23.175718307495117, "global_step": 147269, "epoch": 1774} {"train_loss": -22.774534225463867, "global_step": 147270, "epoch": 1774} {"train_loss": -23.06390953063965, "global_step": 147271, "epoch": 1774} {"train_loss": -23.0526180267334, "global_step": 147272, "epoch": 1774} {"train_loss": -23.118263244628906, "global_step": 147273, "epoch": 1774} {"train_loss": -23.393779754638672, "global_step": 147274, "epoch": 1774} {"train_loss": -23.16936683654785, "global_step": 147275, "epoch": 1774} {"train_loss": -23.125585556030273, "global_step": 147276, "epoch": 1774} {"train_loss": -23.47324562072754, "global_step": 147277, "epoch": 1774} {"train_loss": -22.9614200592041, "global_step": 147278, "epoch": 1774} {"train_loss": -23.066986083984375, "global_step": 147279, "epoch": 1774} {"train_loss": -23.33174705505371, "global_step": 147280, "epoch": 1774} {"train_loss": -22.843276977539062, "global_step": 147281, "epoch": 1774} {"train_loss": -22.836149215698242, "global_step": 147282, "epoch": 1774} {"train_loss": -23.01246452331543, "global_step": 147283, "epoch": 1774} {"train_loss": -22.990434646606445, "global_step": 147284, "epoch": 1774} {"train_loss": -23.411054611206055, "global_step": 147285, "epoch": 1774} {"train_loss": -23.02692985534668, "global_step": 147286, "epoch": 1774} {"train_loss": -23.224763870239258, "global_step": 147287, "epoch": 1774} {"train_loss": -23.059064865112305, "global_step": 147288, "epoch": 1774} {"train_loss": -23.168537139892578, "global_step": 147289, "epoch": 1774} {"train_loss": -22.74793243408203, "global_step": 147290, "epoch": 1774} {"train_loss": -22.8486385345459, "global_step": 147291, "epoch": 1774} {"train_loss": -23.082874298095703, "global_step": 147292, "epoch": 1774} {"train_loss": -23.108598709106445, "global_step": 147293, "epoch": 1774} {"train_loss": -22.950725555419922, "global_step": 147294, "epoch": 1774} {"train_loss": -23.175302505493164, "global_step": 147295, "epoch": 1774} {"train_loss": -23.21299171447754, "global_step": 147296, "epoch": 1774} {"train_loss": -22.732467651367188, "global_step": 147297, "epoch": 1774} {"train_loss": -23.07744598388672, "global_step": 147298, "epoch": 1774} {"train_loss": -22.784284591674805, "global_step": 147299, "epoch": 1774} {"train_loss": -23.030166625976562, "global_step": 147300, "epoch": 1774} {"train_loss": -23.264585494995117, "global_step": 147301, "epoch": 1774} {"train_loss": -23.434316635131836, "global_step": 147302, "epoch": 1774} {"train_loss": -23.231491088867188, "global_step": 147303, "epoch": 1774} {"train_loss": -23.18630599975586, "global_step": 147304, "epoch": 1774} {"train_loss": -23.369537353515625, "global_step": 147305, "epoch": 1774} {"train_loss": -22.778844833374023, "global_step": 147306, "epoch": 1774} {"train_loss": -23.353778839111328, "global_step": 147307, "epoch": 1774} {"train_loss": -22.983091354370117, "global_step": 147308, "epoch": 1774} {"train_loss": -23.04690170288086, "global_step": 147309, "epoch": 1774} {"train_loss": -22.930360794067383, "global_step": 147310, "epoch": 1774} {"train_loss": -22.92304039001465, "global_step": 147311, "epoch": 1774} {"train_loss": -23.05635643005371, "global_step": 147312, "epoch": 1774} {"train_loss": -22.998493194580078, "global_step": 147313, "epoch": 1774} {"train_loss": -23.526731491088867, "global_step": 147314, "epoch": 1774} {"train_loss": -23.269912719726562, "global_step": 147315, "epoch": 1774} {"train_loss": -23.398122787475586, "global_step": 147316, "epoch": 1774} {"train_loss": -22.730213165283203, "global_step": 147317, "epoch": 1774} {"train_loss": -23.030797958374023, "global_step": 147318, "epoch": 1774} {"train_loss": -23.41925621032715, "global_step": 147319, "epoch": 1774} {"train_loss": -22.974292755126953, "global_step": 147320, "epoch": 1774} {"train_loss": -23.22675895690918, "global_step": 147321, "epoch": 1774} {"train_loss": -23.25796890258789, "global_step": 147322, "epoch": 1774} {"train_loss": -23.24240493774414, "global_step": 147323, "epoch": 1774} {"train_loss": -22.92809978163386, "global_step": 147324, "epoch": 1774, "val_loss": 6340035.0} {"train_loss": -21.29618263244629, "global_step": 147325, "epoch": 1775} {"train_loss": -22.029783248901367, "global_step": 147326, "epoch": 1775} {"train_loss": -23.003381729125977, "global_step": 147327, "epoch": 1775} {"train_loss": -22.018497467041016, "global_step": 147328, "epoch": 1775} {"train_loss": -22.635324478149414, "global_step": 147329, "epoch": 1775} {"train_loss": -22.501760482788086, "global_step": 147330, "epoch": 1775} {"train_loss": -22.34706687927246, "global_step": 147331, "epoch": 1775} {"train_loss": -22.803138732910156, "global_step": 147332, "epoch": 1775} {"train_loss": -22.810728073120117, "global_step": 147333, "epoch": 1775} {"train_loss": -22.86673927307129, "global_step": 147334, "epoch": 1775} {"train_loss": -22.47125816345215, "global_step": 147335, "epoch": 1775} {"train_loss": -22.639726638793945, "global_step": 147336, "epoch": 1775} {"train_loss": -22.598058700561523, "global_step": 147337, "epoch": 1775} {"train_loss": -22.34014320373535, "global_step": 147338, "epoch": 1775} {"train_loss": -22.482093811035156, "global_step": 147339, "epoch": 1775} {"train_loss": -22.35383415222168, "global_step": 147340, "epoch": 1775} {"train_loss": -22.316329956054688, "global_step": 147341, "epoch": 1775} {"train_loss": -22.943763732910156, "global_step": 147342, "epoch": 1775} {"train_loss": -22.666608810424805, "global_step": 147343, "epoch": 1775} {"train_loss": -22.39948081970215, "global_step": 147344, "epoch": 1775} {"train_loss": -22.892074584960938, "global_step": 147345, "epoch": 1775} {"train_loss": -23.002737045288086, "global_step": 147346, "epoch": 1775} {"train_loss": -22.95928382873535, "global_step": 147347, "epoch": 1775} {"train_loss": -22.80997657775879, "global_step": 147348, "epoch": 1775} {"train_loss": -23.01763916015625, "global_step": 147349, "epoch": 1775} {"train_loss": -22.8792667388916, "global_step": 147350, "epoch": 1775} {"train_loss": -22.634143829345703, "global_step": 147351, "epoch": 1775} {"train_loss": -22.687007904052734, "global_step": 147352, "epoch": 1775} {"train_loss": -23.116987228393555, "global_step": 147353, "epoch": 1775} {"train_loss": -22.95038414001465, "global_step": 147354, "epoch": 1775} {"train_loss": -23.259408950805664, "global_step": 147355, "epoch": 1775} {"train_loss": -23.022151947021484, "global_step": 147356, "epoch": 1775} {"train_loss": -23.193944931030273, "global_step": 147357, "epoch": 1775} {"train_loss": -23.39821434020996, "global_step": 147358, "epoch": 1775} {"train_loss": -22.770797729492188, "global_step": 147359, "epoch": 1775} {"train_loss": -23.35822868347168, "global_step": 147360, "epoch": 1775} {"train_loss": -23.505977630615234, "global_step": 147361, "epoch": 1775} {"train_loss": -23.192935943603516, "global_step": 147362, "epoch": 1775} {"train_loss": -23.302892684936523, "global_step": 147363, "epoch": 1775} {"train_loss": -22.901626586914062, "global_step": 147364, "epoch": 1775} {"train_loss": -23.286020278930664, "global_step": 147365, "epoch": 1775} {"train_loss": -23.074499130249023, "global_step": 147366, "epoch": 1775} {"train_loss": -23.364883422851562, "global_step": 147367, "epoch": 1775} {"train_loss": -23.166046142578125, "global_step": 147368, "epoch": 1775} {"train_loss": -23.271005630493164, "global_step": 147369, "epoch": 1775} {"train_loss": -23.180747985839844, "global_step": 147370, "epoch": 1775} {"train_loss": -23.43525505065918, "global_step": 147371, "epoch": 1775} {"train_loss": -22.868349075317383, "global_step": 147372, "epoch": 1775} {"train_loss": -23.293611526489258, "global_step": 147373, "epoch": 1775} {"train_loss": -23.349504470825195, "global_step": 147374, "epoch": 1775} {"train_loss": -23.5117130279541, "global_step": 147375, "epoch": 1775} {"train_loss": -23.827001571655273, "global_step": 147376, "epoch": 1775} {"train_loss": -23.576215744018555, "global_step": 147377, "epoch": 1775} {"train_loss": -23.164649963378906, "global_step": 147378, "epoch": 1775} {"train_loss": -23.207721710205078, "global_step": 147379, "epoch": 1775} {"train_loss": -23.579124450683594, "global_step": 147380, "epoch": 1775} {"train_loss": -23.10725975036621, "global_step": 147381, "epoch": 1775} {"train_loss": -23.623695373535156, "global_step": 147382, "epoch": 1775} {"train_loss": -23.0907039642334, "global_step": 147383, "epoch": 1775} {"train_loss": -23.492326736450195, "global_step": 147384, "epoch": 1775} {"train_loss": -23.38698959350586, "global_step": 147385, "epoch": 1775} {"train_loss": -23.68195152282715, "global_step": 147386, "epoch": 1775} {"train_loss": -23.4311580657959, "global_step": 147387, "epoch": 1775} {"train_loss": -23.40995216369629, "global_step": 147388, "epoch": 1775} {"train_loss": -23.073434829711914, "global_step": 147389, "epoch": 1775} {"train_loss": -23.16264533996582, "global_step": 147390, "epoch": 1775} {"train_loss": -23.196796417236328, "global_step": 147391, "epoch": 1775} {"train_loss": -23.43390464782715, "global_step": 147392, "epoch": 1775} {"train_loss": -23.222787857055664, "global_step": 147393, "epoch": 1775} {"train_loss": -23.247161865234375, "global_step": 147394, "epoch": 1775} {"train_loss": -23.489072799682617, "global_step": 147395, "epoch": 1775} {"train_loss": -23.313297271728516, "global_step": 147396, "epoch": 1775} {"train_loss": -23.41619873046875, "global_step": 147397, "epoch": 1775} {"train_loss": -22.916963577270508, "global_step": 147398, "epoch": 1775} {"train_loss": -23.677865982055664, "global_step": 147399, "epoch": 1775} {"train_loss": -23.61896514892578, "global_step": 147400, "epoch": 1775} {"train_loss": -22.857135772705078, "global_step": 147401, "epoch": 1775} {"train_loss": -23.265865325927734, "global_step": 147402, "epoch": 1775} {"train_loss": -23.43013572692871, "global_step": 147403, "epoch": 1775} {"train_loss": -23.119035720825195, "global_step": 147404, "epoch": 1775} {"train_loss": -23.151447296142578, "global_step": 147405, "epoch": 1775} {"train_loss": -23.103866577148438, "global_step": 147406, "epoch": 1775} {"train_loss": -23.043147765010236, "global_step": 147407, "epoch": 1775, "val_loss": 6218416.5} {"train_loss": -22.978382110595703, "global_step": 147408, "epoch": 1776} {"train_loss": -22.209688186645508, "global_step": 147409, "epoch": 1776} {"train_loss": -22.063810348510742, "global_step": 147410, "epoch": 1776} {"train_loss": -22.95474624633789, "global_step": 147411, "epoch": 1776} {"train_loss": -23.050565719604492, "global_step": 147412, "epoch": 1776} {"train_loss": -23.127222061157227, "global_step": 147413, "epoch": 1776} {"train_loss": -23.23374366760254, "global_step": 147414, "epoch": 1776} {"train_loss": -23.186445236206055, "global_step": 147415, "epoch": 1776} {"train_loss": -22.772878646850586, "global_step": 147416, "epoch": 1776} {"train_loss": -22.85762596130371, "global_step": 147417, "epoch": 1776} {"train_loss": -23.177478790283203, "global_step": 147418, "epoch": 1776} {"train_loss": -22.99335289001465, "global_step": 147419, "epoch": 1776} {"train_loss": -23.412433624267578, "global_step": 147420, "epoch": 1776} {"train_loss": -23.06052017211914, "global_step": 147421, "epoch": 1776} {"train_loss": -23.238183975219727, "global_step": 147422, "epoch": 1776} {"train_loss": -23.095998764038086, "global_step": 147423, "epoch": 1776} {"train_loss": -23.02115821838379, "global_step": 147424, "epoch": 1776} {"train_loss": -23.084447860717773, "global_step": 147425, "epoch": 1776} {"train_loss": -22.895645141601562, "global_step": 147426, "epoch": 1776} {"train_loss": -22.967016220092773, "global_step": 147427, "epoch": 1776} {"train_loss": -23.114179611206055, "global_step": 147428, "epoch": 1776} {"train_loss": -23.294097900390625, "global_step": 147429, "epoch": 1776} {"train_loss": -23.318784713745117, "global_step": 147430, "epoch": 1776} {"train_loss": -22.907682418823242, "global_step": 147431, "epoch": 1776} {"train_loss": -23.30622673034668, "global_step": 147432, "epoch": 1776} {"train_loss": -22.84040641784668, "global_step": 147433, "epoch": 1776} {"train_loss": -23.361454010009766, "global_step": 147434, "epoch": 1776} {"train_loss": -23.052595138549805, "global_step": 147435, "epoch": 1776} {"train_loss": -23.14198112487793, "global_step": 147436, "epoch": 1776} {"train_loss": -23.496612548828125, "global_step": 147437, "epoch": 1776} {"train_loss": -23.296289443969727, "global_step": 147438, "epoch": 1776} {"train_loss": -23.697141647338867, "global_step": 147439, "epoch": 1776} {"train_loss": -23.109527587890625, "global_step": 147440, "epoch": 1776} {"train_loss": -23.370548248291016, "global_step": 147441, "epoch": 1776} {"train_loss": -23.34795379638672, "global_step": 147442, "epoch": 1776} {"train_loss": -23.429309844970703, "global_step": 147443, "epoch": 1776} {"train_loss": -23.37166404724121, "global_step": 147444, "epoch": 1776} {"train_loss": -23.014774322509766, "global_step": 147445, "epoch": 1776} {"train_loss": -23.2121639251709, "global_step": 147446, "epoch": 1776} {"train_loss": -23.29659080505371, "global_step": 147447, "epoch": 1776} {"train_loss": -22.94785499572754, "global_step": 147448, "epoch": 1776} {"train_loss": -23.49336814880371, "global_step": 147449, "epoch": 1776} {"train_loss": -23.488882064819336, "global_step": 147450, "epoch": 1776} {"train_loss": -23.11856460571289, "global_step": 147451, "epoch": 1776} {"train_loss": -23.340709686279297, "global_step": 147452, "epoch": 1776} {"train_loss": -23.50192642211914, "global_step": 147453, "epoch": 1776} {"train_loss": -23.013891220092773, "global_step": 147454, "epoch": 1776} {"train_loss": -23.696334838867188, "global_step": 147455, "epoch": 1776} {"train_loss": -23.17257308959961, "global_step": 147456, "epoch": 1776} {"train_loss": -23.22515296936035, "global_step": 147457, "epoch": 1776} {"train_loss": -23.148601531982422, "global_step": 147458, "epoch": 1776} {"train_loss": -23.463502883911133, "global_step": 147459, "epoch": 1776} {"train_loss": -23.458829879760742, "global_step": 147460, "epoch": 1776} {"train_loss": -23.420373916625977, "global_step": 147461, "epoch": 1776} {"train_loss": -23.414335250854492, "global_step": 147462, "epoch": 1776} {"train_loss": -23.142309188842773, "global_step": 147463, "epoch": 1776} {"train_loss": -23.24166488647461, "global_step": 147464, "epoch": 1776} {"train_loss": -23.37113380432129, "global_step": 147465, "epoch": 1776} {"train_loss": -23.44119644165039, "global_step": 147466, "epoch": 1776} {"train_loss": -23.008634567260742, "global_step": 147467, "epoch": 1776} {"train_loss": -23.021142959594727, "global_step": 147468, "epoch": 1776} {"train_loss": -22.871591567993164, "global_step": 147469, "epoch": 1776} {"train_loss": -23.28907585144043, "global_step": 147470, "epoch": 1776} {"train_loss": -22.829696655273438, "global_step": 147471, "epoch": 1776} {"train_loss": -23.128259658813477, "global_step": 147472, "epoch": 1776} {"train_loss": -23.244251251220703, "global_step": 147473, "epoch": 1776} {"train_loss": -22.936424255371094, "global_step": 147474, "epoch": 1776} {"train_loss": -23.172033309936523, "global_step": 147475, "epoch": 1776} {"train_loss": -23.49137306213379, "global_step": 147476, "epoch": 1776} {"train_loss": -23.007986068725586, "global_step": 147477, "epoch": 1776} {"train_loss": -23.423715591430664, "global_step": 147478, "epoch": 1776} {"train_loss": -22.970590591430664, "global_step": 147479, "epoch": 1776} {"train_loss": -23.34604835510254, "global_step": 147480, "epoch": 1776} {"train_loss": -23.13453483581543, "global_step": 147481, "epoch": 1776} {"train_loss": -23.383625030517578, "global_step": 147482, "epoch": 1776} {"train_loss": -23.184734344482422, "global_step": 147483, "epoch": 1776} {"train_loss": -23.39938735961914, "global_step": 147484, "epoch": 1776} {"train_loss": -23.0210018157959, "global_step": 147485, "epoch": 1776} {"train_loss": -22.968544006347656, "global_step": 147486, "epoch": 1776} {"train_loss": -23.150365829467773, "global_step": 147487, "epoch": 1776} {"train_loss": -23.450468063354492, "global_step": 147488, "epoch": 1776} {"train_loss": -23.102487564086914, "global_step": 147489, "epoch": 1776} {"train_loss": -23.169444968901484, "global_step": 147490, "epoch": 1776, "val_loss": 6315602.0} {"train_loss": -22.893693923950195, "global_step": 147491, "epoch": 1777} {"train_loss": -23.227603912353516, "global_step": 147492, "epoch": 1777} {"train_loss": -22.899642944335938, "global_step": 147493, "epoch": 1777} {"train_loss": -22.591339111328125, "global_step": 147494, "epoch": 1777} {"train_loss": -22.733112335205078, "global_step": 147495, "epoch": 1777} {"train_loss": -23.234037399291992, "global_step": 147496, "epoch": 1777} {"train_loss": -23.070484161376953, "global_step": 147497, "epoch": 1777} {"train_loss": -22.833938598632812, "global_step": 147498, "epoch": 1777} {"train_loss": -23.020605087280273, "global_step": 147499, "epoch": 1777} {"train_loss": -23.12279510498047, "global_step": 147500, "epoch": 1777} {"train_loss": -23.287118911743164, "global_step": 147501, "epoch": 1777} {"train_loss": -23.465213775634766, "global_step": 147502, "epoch": 1777} {"train_loss": -23.11806869506836, "global_step": 147503, "epoch": 1777} {"train_loss": -23.191038131713867, "global_step": 147504, "epoch": 1777} {"train_loss": -23.396265029907227, "global_step": 147505, "epoch": 1777} {"train_loss": -23.212018966674805, "global_step": 147506, "epoch": 1777} {"train_loss": -23.2921085357666, "global_step": 147507, "epoch": 1777} {"train_loss": -23.354589462280273, "global_step": 147508, "epoch": 1777} {"train_loss": -23.26519203186035, "global_step": 147509, "epoch": 1777} {"train_loss": -22.906103134155273, "global_step": 147510, "epoch": 1777} {"train_loss": -23.2956600189209, "global_step": 147511, "epoch": 1777} {"train_loss": -23.203676223754883, "global_step": 147512, "epoch": 1777} {"train_loss": -23.078767776489258, "global_step": 147513, "epoch": 1777} {"train_loss": -23.20258331298828, "global_step": 147514, "epoch": 1777} {"train_loss": -23.133193969726562, "global_step": 147515, "epoch": 1777} {"train_loss": -23.2067928314209, "global_step": 147516, "epoch": 1777} {"train_loss": -23.37272071838379, "global_step": 147517, "epoch": 1777} {"train_loss": -23.50771141052246, "global_step": 147518, "epoch": 1777} {"train_loss": -23.163984298706055, "global_step": 147519, "epoch": 1777} {"train_loss": -22.9283447265625, "global_step": 147520, "epoch": 1777} {"train_loss": -23.114572525024414, "global_step": 147521, "epoch": 1777} {"train_loss": -23.09071159362793, "global_step": 147522, "epoch": 1777} {"train_loss": -22.876920700073242, "global_step": 147523, "epoch": 1777} {"train_loss": -22.88455581665039, "global_step": 147524, "epoch": 1777} {"train_loss": -23.30533218383789, "global_step": 147525, "epoch": 1777} {"train_loss": -22.57297706604004, "global_step": 147526, "epoch": 1777} {"train_loss": -22.799386978149414, "global_step": 147527, "epoch": 1777} {"train_loss": -23.100574493408203, "global_step": 147528, "epoch": 1777} {"train_loss": -22.85396957397461, "global_step": 147529, "epoch": 1777} {"train_loss": -23.093475341796875, "global_step": 147530, "epoch": 1777} {"train_loss": -22.73003387451172, "global_step": 147531, "epoch": 1777} {"train_loss": -22.904390335083008, "global_step": 147532, "epoch": 1777} {"train_loss": -23.029510498046875, "global_step": 147533, "epoch": 1777} {"train_loss": -23.305347442626953, "global_step": 147534, "epoch": 1777} {"train_loss": -23.102933883666992, "global_step": 147535, "epoch": 1777} {"train_loss": -23.00772476196289, "global_step": 147536, "epoch": 1777} {"train_loss": -22.579282760620117, "global_step": 147537, "epoch": 1777} {"train_loss": -22.986562728881836, "global_step": 147538, "epoch": 1777} {"train_loss": -23.16390037536621, "global_step": 147539, "epoch": 1777} {"train_loss": -22.872411727905273, "global_step": 147540, "epoch": 1777} {"train_loss": -22.661527633666992, "global_step": 147541, "epoch": 1777} {"train_loss": -22.927200317382812, "global_step": 147542, "epoch": 1777} {"train_loss": -23.105932235717773, "global_step": 147543, "epoch": 1777} {"train_loss": -23.017547607421875, "global_step": 147544, "epoch": 1777} {"train_loss": -23.088285446166992, "global_step": 147545, "epoch": 1777} {"train_loss": -23.41938591003418, "global_step": 147546, "epoch": 1777} {"train_loss": -23.290950775146484, "global_step": 147547, "epoch": 1777} {"train_loss": -23.166479110717773, "global_step": 147548, "epoch": 1777} {"train_loss": -23.375858306884766, "global_step": 147549, "epoch": 1777} {"train_loss": -23.03745460510254, "global_step": 147550, "epoch": 1777} {"train_loss": -22.906164169311523, "global_step": 147551, "epoch": 1777} {"train_loss": -23.022619247436523, "global_step": 147552, "epoch": 1777} {"train_loss": -23.053516387939453, "global_step": 147553, "epoch": 1777} {"train_loss": -23.0288143157959, "global_step": 147554, "epoch": 1777} {"train_loss": -23.41806411743164, "global_step": 147555, "epoch": 1777} {"train_loss": -23.308460235595703, "global_step": 147556, "epoch": 1777} {"train_loss": -23.15557861328125, "global_step": 147557, "epoch": 1777} {"train_loss": -22.990787506103516, "global_step": 147558, "epoch": 1777} {"train_loss": -23.26068687438965, "global_step": 147559, "epoch": 1777} {"train_loss": -22.877607345581055, "global_step": 147560, "epoch": 1777} {"train_loss": -23.106245040893555, "global_step": 147561, "epoch": 1777} {"train_loss": -23.114166259765625, "global_step": 147562, "epoch": 1777} {"train_loss": -22.986921310424805, "global_step": 147563, "epoch": 1777} {"train_loss": -23.137588500976562, "global_step": 147564, "epoch": 1777} {"train_loss": -23.137502670288086, "global_step": 147565, "epoch": 1777} {"train_loss": -23.24867057800293, "global_step": 147566, "epoch": 1777} {"train_loss": -23.187034606933594, "global_step": 147567, "epoch": 1777} {"train_loss": -23.43416976928711, "global_step": 147568, "epoch": 1777} {"train_loss": -23.374454498291016, "global_step": 147569, "epoch": 1777} {"train_loss": -23.455942153930664, "global_step": 147570, "epoch": 1777} {"train_loss": -23.495935440063477, "global_step": 147571, "epoch": 1777} {"train_loss": -23.17409324645996, "global_step": 147572, "epoch": 1777} {"train_loss": -23.103727064936994, "global_step": 147573, "epoch": 1777, "val_loss": 6345847.0} {"train_loss": -22.709016799926758, "global_step": 147574, "epoch": 1778} {"train_loss": -22.851713180541992, "global_step": 147575, "epoch": 1778} {"train_loss": -22.76276397705078, "global_step": 147576, "epoch": 1778} {"train_loss": -22.59797477722168, "global_step": 147577, "epoch": 1778} {"train_loss": -22.970441818237305, "global_step": 147578, "epoch": 1778} {"train_loss": -22.571462631225586, "global_step": 147579, "epoch": 1778} {"train_loss": -22.94756507873535, "global_step": 147580, "epoch": 1778} {"train_loss": -22.871051788330078, "global_step": 147581, "epoch": 1778} {"train_loss": -22.96820068359375, "global_step": 147582, "epoch": 1778} {"train_loss": -23.02604103088379, "global_step": 147583, "epoch": 1778} {"train_loss": -23.05898094177246, "global_step": 147584, "epoch": 1778} {"train_loss": -22.96204948425293, "global_step": 147585, "epoch": 1778} {"train_loss": -22.93255043029785, "global_step": 147586, "epoch": 1778} {"train_loss": -23.04180908203125, "global_step": 147587, "epoch": 1778} {"train_loss": -23.15913200378418, "global_step": 147588, "epoch": 1778} {"train_loss": -22.80183982849121, "global_step": 147589, "epoch": 1778} {"train_loss": -22.873334884643555, "global_step": 147590, "epoch": 1778} {"train_loss": -23.333261489868164, "global_step": 147591, "epoch": 1778} {"train_loss": -22.768247604370117, "global_step": 147592, "epoch": 1778} {"train_loss": -23.149127960205078, "global_step": 147593, "epoch": 1778} {"train_loss": -23.56195831298828, "global_step": 147594, "epoch": 1778} {"train_loss": -23.486007690429688, "global_step": 147595, "epoch": 1778} {"train_loss": -23.2857666015625, "global_step": 147596, "epoch": 1778} {"train_loss": -23.123863220214844, "global_step": 147597, "epoch": 1778} {"train_loss": -23.42021942138672, "global_step": 147598, "epoch": 1778} {"train_loss": -22.890432357788086, "global_step": 147599, "epoch": 1778} {"train_loss": -23.22982406616211, "global_step": 147600, "epoch": 1778} {"train_loss": -22.900665283203125, "global_step": 147601, "epoch": 1778} {"train_loss": -23.026208877563477, "global_step": 147602, "epoch": 1778} {"train_loss": -22.843292236328125, "global_step": 147603, "epoch": 1778} {"train_loss": -23.14967918395996, "global_step": 147604, "epoch": 1778} {"train_loss": -23.369775772094727, "global_step": 147605, "epoch": 1778} {"train_loss": -23.048131942749023, "global_step": 147606, "epoch": 1778} {"train_loss": -22.845008850097656, "global_step": 147607, "epoch": 1778} {"train_loss": -23.267847061157227, "global_step": 147608, "epoch": 1778} {"train_loss": -23.393659591674805, "global_step": 147609, "epoch": 1778} {"train_loss": -23.29225730895996, "global_step": 147610, "epoch": 1778} {"train_loss": -22.981637954711914, "global_step": 147611, "epoch": 1778} {"train_loss": -22.78529930114746, "global_step": 147612, "epoch": 1778} {"train_loss": -23.451133728027344, "global_step": 147613, "epoch": 1778} {"train_loss": -23.141077041625977, "global_step": 147614, "epoch": 1778} {"train_loss": -23.708770751953125, "global_step": 147615, "epoch": 1778} {"train_loss": -23.338180541992188, "global_step": 147616, "epoch": 1778} {"train_loss": -23.40087890625, "global_step": 147617, "epoch": 1778} {"train_loss": -23.338415145874023, "global_step": 147618, "epoch": 1778} {"train_loss": -23.354938507080078, "global_step": 147619, "epoch": 1778} {"train_loss": -23.475879669189453, "global_step": 147620, "epoch": 1778} {"train_loss": -23.28978729248047, "global_step": 147621, "epoch": 1778} {"train_loss": -23.3372859954834, "global_step": 147622, "epoch": 1778} {"train_loss": -23.188661575317383, "global_step": 147623, "epoch": 1778} {"train_loss": -23.383373260498047, "global_step": 147624, "epoch": 1778} {"train_loss": -23.08896255493164, "global_step": 147625, "epoch": 1778} {"train_loss": -23.586484909057617, "global_step": 147626, "epoch": 1778} {"train_loss": -22.900394439697266, "global_step": 147627, "epoch": 1778} {"train_loss": -23.669879913330078, "global_step": 147628, "epoch": 1778} {"train_loss": -23.318220138549805, "global_step": 147629, "epoch": 1778} {"train_loss": -23.22016143798828, "global_step": 147630, "epoch": 1778} {"train_loss": -23.227087020874023, "global_step": 147631, "epoch": 1778} {"train_loss": -23.05021095275879, "global_step": 147632, "epoch": 1778} {"train_loss": -23.50152587890625, "global_step": 147633, "epoch": 1778} {"train_loss": -23.464757919311523, "global_step": 147634, "epoch": 1778} {"train_loss": -23.340702056884766, "global_step": 147635, "epoch": 1778} {"train_loss": -23.314178466796875, "global_step": 147636, "epoch": 1778} {"train_loss": -23.37322998046875, "global_step": 147637, "epoch": 1778} {"train_loss": -23.741046905517578, "global_step": 147638, "epoch": 1778} {"train_loss": -23.293306350708008, "global_step": 147639, "epoch": 1778} {"train_loss": -23.61996841430664, "global_step": 147640, "epoch": 1778} {"train_loss": -23.307903289794922, "global_step": 147641, "epoch": 1778} {"train_loss": -23.29574203491211, "global_step": 147642, "epoch": 1778} {"train_loss": -23.14961814880371, "global_step": 147643, "epoch": 1778} {"train_loss": -23.19733238220215, "global_step": 147644, "epoch": 1778} {"train_loss": -23.29414939880371, "global_step": 147645, "epoch": 1778} {"train_loss": -23.268537521362305, "global_step": 147646, "epoch": 1778} {"train_loss": -23.156558990478516, "global_step": 147647, "epoch": 1778} {"train_loss": -23.075735092163086, "global_step": 147648, "epoch": 1778} {"train_loss": -23.14437484741211, "global_step": 147649, "epoch": 1778} {"train_loss": -23.41414451599121, "global_step": 147650, "epoch": 1778} {"train_loss": -23.410001754760742, "global_step": 147651, "epoch": 1778} {"train_loss": -23.062204360961914, "global_step": 147652, "epoch": 1778} {"train_loss": -22.90427017211914, "global_step": 147653, "epoch": 1778} {"train_loss": -23.216510772705078, "global_step": 147654, "epoch": 1778} {"train_loss": -22.982086181640625, "global_step": 147655, "epoch": 1778} {"train_loss": -23.167226883302252, "global_step": 147656, "epoch": 1778, "val_loss": 6531864.5} {"train_loss": -22.93104362487793, "global_step": 147657, "epoch": 1779} {"train_loss": -23.29034423828125, "global_step": 147658, "epoch": 1779} {"train_loss": -23.053831100463867, "global_step": 147659, "epoch": 1779} {"train_loss": -22.888273239135742, "global_step": 147660, "epoch": 1779} {"train_loss": -23.09169578552246, "global_step": 147661, "epoch": 1779} {"train_loss": -23.104982376098633, "global_step": 147662, "epoch": 1779} {"train_loss": -23.019908905029297, "global_step": 147663, "epoch": 1779} {"train_loss": -23.24947166442871, "global_step": 147664, "epoch": 1779} {"train_loss": -23.467971801757812, "global_step": 147665, "epoch": 1779} {"train_loss": -23.070646286010742, "global_step": 147666, "epoch": 1779} {"train_loss": -23.05597496032715, "global_step": 147667, "epoch": 1779} {"train_loss": -23.405248641967773, "global_step": 147668, "epoch": 1779} {"train_loss": -22.996992111206055, "global_step": 147669, "epoch": 1779} {"train_loss": -23.117170333862305, "global_step": 147670, "epoch": 1779} {"train_loss": -23.083505630493164, "global_step": 147671, "epoch": 1779} {"train_loss": -23.181936264038086, "global_step": 147672, "epoch": 1779} {"train_loss": -23.414602279663086, "global_step": 147673, "epoch": 1779} {"train_loss": -23.720474243164062, "global_step": 147674, "epoch": 1779} {"train_loss": -23.17441177368164, "global_step": 147675, "epoch": 1779} {"train_loss": -23.24250602722168, "global_step": 147676, "epoch": 1779} {"train_loss": -23.324726104736328, "global_step": 147677, "epoch": 1779} {"train_loss": -23.530776977539062, "global_step": 147678, "epoch": 1779} {"train_loss": -23.493274688720703, "global_step": 147679, "epoch": 1779} {"train_loss": -23.466951370239258, "global_step": 147680, "epoch": 1779} {"train_loss": -23.437057495117188, "global_step": 147681, "epoch": 1779} {"train_loss": -23.520404815673828, "global_step": 147682, "epoch": 1779} {"train_loss": -23.36988639831543, "global_step": 147683, "epoch": 1779} {"train_loss": -23.59397315979004, "global_step": 147684, "epoch": 1779} {"train_loss": -23.22921371459961, "global_step": 147685, "epoch": 1779} {"train_loss": -23.227224349975586, "global_step": 147686, "epoch": 1779} {"train_loss": -23.23688316345215, "global_step": 147687, "epoch": 1779} {"train_loss": -23.3695068359375, "global_step": 147688, "epoch": 1779} {"train_loss": -23.336572647094727, "global_step": 147689, "epoch": 1779} {"train_loss": -23.058456420898438, "global_step": 147690, "epoch": 1779} {"train_loss": -23.195486068725586, "global_step": 147691, "epoch": 1779} {"train_loss": -23.25318717956543, "global_step": 147692, "epoch": 1779} {"train_loss": -23.14122772216797, "global_step": 147693, "epoch": 1779} {"train_loss": -23.277700424194336, "global_step": 147694, "epoch": 1779} {"train_loss": -22.87307357788086, "global_step": 147695, "epoch": 1779} {"train_loss": -23.22195053100586, "global_step": 147696, "epoch": 1779} {"train_loss": -23.3392391204834, "global_step": 147697, "epoch": 1779} {"train_loss": -22.96441078186035, "global_step": 147698, "epoch": 1779} {"train_loss": -23.08677101135254, "global_step": 147699, "epoch": 1779} {"train_loss": -23.413022994995117, "global_step": 147700, "epoch": 1779} {"train_loss": -23.035757064819336, "global_step": 147701, "epoch": 1779} {"train_loss": -23.19771385192871, "global_step": 147702, "epoch": 1779} {"train_loss": -23.36301040649414, "global_step": 147703, "epoch": 1779} {"train_loss": -22.958776473999023, "global_step": 147704, "epoch": 1779} {"train_loss": -23.250898361206055, "global_step": 147705, "epoch": 1779} {"train_loss": -23.122119903564453, "global_step": 147706, "epoch": 1779} {"train_loss": -23.159814834594727, "global_step": 147707, "epoch": 1779} {"train_loss": -23.346837997436523, "global_step": 147708, "epoch": 1779} {"train_loss": -23.6890869140625, "global_step": 147709, "epoch": 1779} {"train_loss": -23.163433074951172, "global_step": 147710, "epoch": 1779} {"train_loss": -22.946699142456055, "global_step": 147711, "epoch": 1779} {"train_loss": -22.97449493408203, "global_step": 147712, "epoch": 1779} {"train_loss": -23.14348030090332, "global_step": 147713, "epoch": 1779} {"train_loss": -23.092506408691406, "global_step": 147714, "epoch": 1779} {"train_loss": -23.132986068725586, "global_step": 147715, "epoch": 1779} {"train_loss": -22.95501136779785, "global_step": 147716, "epoch": 1779} {"train_loss": -23.292905807495117, "global_step": 147717, "epoch": 1779} {"train_loss": -22.822797775268555, "global_step": 147718, "epoch": 1779} {"train_loss": -23.40593719482422, "global_step": 147719, "epoch": 1779} {"train_loss": -23.24410057067871, "global_step": 147720, "epoch": 1779} {"train_loss": -22.98422622680664, "global_step": 147721, "epoch": 1779} {"train_loss": -23.13106346130371, "global_step": 147722, "epoch": 1779} {"train_loss": -23.395265579223633, "global_step": 147723, "epoch": 1779} {"train_loss": -23.014694213867188, "global_step": 147724, "epoch": 1779} {"train_loss": -23.238004684448242, "global_step": 147725, "epoch": 1779} {"train_loss": -23.292606353759766, "global_step": 147726, "epoch": 1779} {"train_loss": -23.02484703063965, "global_step": 147727, "epoch": 1779} {"train_loss": -23.35341453552246, "global_step": 147728, "epoch": 1779} {"train_loss": -23.41295051574707, "global_step": 147729, "epoch": 1779} {"train_loss": -22.96259117126465, "global_step": 147730, "epoch": 1779} {"train_loss": -23.445302963256836, "global_step": 147731, "epoch": 1779} {"train_loss": -23.330175399780273, "global_step": 147732, "epoch": 1779} {"train_loss": -23.240591049194336, "global_step": 147733, "epoch": 1779} {"train_loss": -23.334980010986328, "global_step": 147734, "epoch": 1779} {"train_loss": -23.263574600219727, "global_step": 147735, "epoch": 1779} {"train_loss": -23.393667221069336, "global_step": 147736, "epoch": 1779} {"train_loss": -23.25844383239746, "global_step": 147737, "epoch": 1779} {"train_loss": -22.993066787719727, "global_step": 147738, "epoch": 1779} {"train_loss": -23.2077562263213, "global_step": 147739, "epoch": 1779, "val_loss": 6365070.5} {"train_loss": -23.196945190429688, "global_step": 147740, "epoch": 1780} {"train_loss": -22.895179748535156, "global_step": 147741, "epoch": 1780} {"train_loss": -22.92015838623047, "global_step": 147742, "epoch": 1780} {"train_loss": -22.955886840820312, "global_step": 147743, "epoch": 1780} {"train_loss": -22.62586212158203, "global_step": 147744, "epoch": 1780} {"train_loss": -22.882652282714844, "global_step": 147745, "epoch": 1780} {"train_loss": -23.02882957458496, "global_step": 147746, "epoch": 1780} {"train_loss": -23.213489532470703, "global_step": 147747, "epoch": 1780} {"train_loss": -23.17058753967285, "global_step": 147748, "epoch": 1780} {"train_loss": -22.89579963684082, "global_step": 147749, "epoch": 1780} {"train_loss": -23.043258666992188, "global_step": 147750, "epoch": 1780} {"train_loss": -22.926925659179688, "global_step": 147751, "epoch": 1780} {"train_loss": -23.198013305664062, "global_step": 147752, "epoch": 1780} {"train_loss": -23.125757217407227, "global_step": 147753, "epoch": 1780} {"train_loss": -22.844608306884766, "global_step": 147754, "epoch": 1780} {"train_loss": -23.22637367248535, "global_step": 147755, "epoch": 1780} {"train_loss": -23.12396812438965, "global_step": 147756, "epoch": 1780} {"train_loss": -23.147565841674805, "global_step": 147757, "epoch": 1780} {"train_loss": -23.150468826293945, "global_step": 147758, "epoch": 1780} {"train_loss": -23.143882751464844, "global_step": 147759, "epoch": 1780} {"train_loss": -23.518239974975586, "global_step": 147760, "epoch": 1780} {"train_loss": -23.134132385253906, "global_step": 147761, "epoch": 1780} {"train_loss": -22.770511627197266, "global_step": 147762, "epoch": 1780} {"train_loss": -23.38585090637207, "global_step": 147763, "epoch": 1780} {"train_loss": -22.598434448242188, "global_step": 147764, "epoch": 1780} {"train_loss": -23.180265426635742, "global_step": 147765, "epoch": 1780} {"train_loss": -23.0531063079834, "global_step": 147766, "epoch": 1780} {"train_loss": -23.371244430541992, "global_step": 147767, "epoch": 1780} {"train_loss": -23.559967041015625, "global_step": 147768, "epoch": 1780} {"train_loss": -23.65827178955078, "global_step": 147769, "epoch": 1780} {"train_loss": -23.552642822265625, "global_step": 147770, "epoch": 1780} {"train_loss": -23.339710235595703, "global_step": 147771, "epoch": 1780} {"train_loss": -23.4033260345459, "global_step": 147772, "epoch": 1780} {"train_loss": -23.211050033569336, "global_step": 147773, "epoch": 1780} {"train_loss": -23.383520126342773, "global_step": 147774, "epoch": 1780} {"train_loss": -23.23952293395996, "global_step": 147775, "epoch": 1780} {"train_loss": -23.119861602783203, "global_step": 147776, "epoch": 1780} {"train_loss": -23.24836540222168, "global_step": 147777, "epoch": 1780} {"train_loss": -22.956329345703125, "global_step": 147778, "epoch": 1780} {"train_loss": -23.675390243530273, "global_step": 147779, "epoch": 1780} {"train_loss": -23.252765655517578, "global_step": 147780, "epoch": 1780} {"train_loss": -23.204130172729492, "global_step": 147781, "epoch": 1780} {"train_loss": -23.154552459716797, "global_step": 147782, "epoch": 1780} {"train_loss": -23.291555404663086, "global_step": 147783, "epoch": 1780} {"train_loss": -23.454984664916992, "global_step": 147784, "epoch": 1780} {"train_loss": -22.81076431274414, "global_step": 147785, "epoch": 1780} {"train_loss": -23.11879539489746, "global_step": 147786, "epoch": 1780} {"train_loss": -23.01386070251465, "global_step": 147787, "epoch": 1780} {"train_loss": -23.145246505737305, "global_step": 147788, "epoch": 1780} {"train_loss": -23.25060272216797, "global_step": 147789, "epoch": 1780} {"train_loss": -23.42072105407715, "global_step": 147790, "epoch": 1780} {"train_loss": -23.359006881713867, "global_step": 147791, "epoch": 1780} {"train_loss": -23.364355087280273, "global_step": 147792, "epoch": 1780} {"train_loss": -23.18405532836914, "global_step": 147793, "epoch": 1780} {"train_loss": -23.461286544799805, "global_step": 147794, "epoch": 1780} {"train_loss": -23.319578170776367, "global_step": 147795, "epoch": 1780} {"train_loss": -23.453243255615234, "global_step": 147796, "epoch": 1780} {"train_loss": -23.21155548095703, "global_step": 147797, "epoch": 1780} {"train_loss": -23.282957077026367, "global_step": 147798, "epoch": 1780} {"train_loss": -23.819643020629883, "global_step": 147799, "epoch": 1780} {"train_loss": -23.54725456237793, "global_step": 147800, "epoch": 1780} {"train_loss": -23.121292114257812, "global_step": 147801, "epoch": 1780} {"train_loss": -23.093534469604492, "global_step": 147802, "epoch": 1780} {"train_loss": -23.539939880371094, "global_step": 147803, "epoch": 1780} {"train_loss": -23.227506637573242, "global_step": 147804, "epoch": 1780} {"train_loss": -23.090818405151367, "global_step": 147805, "epoch": 1780} {"train_loss": -23.16364288330078, "global_step": 147806, "epoch": 1780} {"train_loss": -23.447195053100586, "global_step": 147807, "epoch": 1780} {"train_loss": -23.115583419799805, "global_step": 147808, "epoch": 1780} {"train_loss": -22.97577476501465, "global_step": 147809, "epoch": 1780} {"train_loss": -23.265243530273438, "global_step": 147810, "epoch": 1780} {"train_loss": -22.974586486816406, "global_step": 147811, "epoch": 1780} {"train_loss": -23.307607650756836, "global_step": 147812, "epoch": 1780} {"train_loss": -23.630247116088867, "global_step": 147813, "epoch": 1780} {"train_loss": -23.234907150268555, "global_step": 147814, "epoch": 1780} {"train_loss": -23.042285919189453, "global_step": 147815, "epoch": 1780} {"train_loss": -23.15228271484375, "global_step": 147816, "epoch": 1780} {"train_loss": -22.939706802368164, "global_step": 147817, "epoch": 1780} {"train_loss": -23.09613037109375, "global_step": 147818, "epoch": 1780} {"train_loss": -23.361371994018555, "global_step": 147819, "epoch": 1780} {"train_loss": -22.97739601135254, "global_step": 147820, "epoch": 1780} {"train_loss": -23.29047203063965, "global_step": 147821, "epoch": 1780} {"train_loss": -23.197340195437512, "global_step": 147822, "epoch": 1780, "val_loss": 6375215.0} {"train_loss": -21.961782455444336, "global_step": 147823, "epoch": 1781} {"train_loss": -22.605981826782227, "global_step": 147824, "epoch": 1781} {"train_loss": -23.1412353515625, "global_step": 147825, "epoch": 1781} {"train_loss": -22.632221221923828, "global_step": 147826, "epoch": 1781} {"train_loss": -22.980571746826172, "global_step": 147827, "epoch": 1781} {"train_loss": -22.54274559020996, "global_step": 147828, "epoch": 1781} {"train_loss": -22.691137313842773, "global_step": 147829, "epoch": 1781} {"train_loss": -22.9417781829834, "global_step": 147830, "epoch": 1781} {"train_loss": -22.879779815673828, "global_step": 147831, "epoch": 1781} {"train_loss": -22.6988525390625, "global_step": 147832, "epoch": 1781} {"train_loss": -23.034496307373047, "global_step": 147833, "epoch": 1781} {"train_loss": -22.57219123840332, "global_step": 147834, "epoch": 1781} {"train_loss": -23.1866512298584, "global_step": 147835, "epoch": 1781} {"train_loss": -22.446767807006836, "global_step": 147836, "epoch": 1781} {"train_loss": -22.861738204956055, "global_step": 147837, "epoch": 1781} {"train_loss": -23.03717803955078, "global_step": 147838, "epoch": 1781} {"train_loss": -22.919042587280273, "global_step": 147839, "epoch": 1781} {"train_loss": -22.72983741760254, "global_step": 147840, "epoch": 1781} {"train_loss": -23.47958755493164, "global_step": 147841, "epoch": 1781} {"train_loss": -23.18811798095703, "global_step": 147842, "epoch": 1781} {"train_loss": -23.014331817626953, "global_step": 147843, "epoch": 1781} {"train_loss": -23.105466842651367, "global_step": 147844, "epoch": 1781} {"train_loss": -23.17690086364746, "global_step": 147845, "epoch": 1781} {"train_loss": -23.132755279541016, "global_step": 147846, "epoch": 1781} {"train_loss": -23.265344619750977, "global_step": 147847, "epoch": 1781} {"train_loss": -23.421476364135742, "global_step": 147848, "epoch": 1781} {"train_loss": -23.328840255737305, "global_step": 147849, "epoch": 1781} {"train_loss": -22.938583374023438, "global_step": 147850, "epoch": 1781} {"train_loss": -23.30006217956543, "global_step": 147851, "epoch": 1781} {"train_loss": -22.94080352783203, "global_step": 147852, "epoch": 1781} {"train_loss": -23.36370277404785, "global_step": 147853, "epoch": 1781} {"train_loss": -23.4792423248291, "global_step": 147854, "epoch": 1781} {"train_loss": -23.00443458557129, "global_step": 147855, "epoch": 1781} {"train_loss": -22.910154342651367, "global_step": 147856, "epoch": 1781} {"train_loss": -23.25394058227539, "global_step": 147857, "epoch": 1781} {"train_loss": -23.12636375427246, "global_step": 147858, "epoch": 1781} {"train_loss": -23.459104537963867, "global_step": 147859, "epoch": 1781} {"train_loss": -23.12093162536621, "global_step": 147860, "epoch": 1781} {"train_loss": -23.68733787536621, "global_step": 147861, "epoch": 1781} {"train_loss": -23.224008560180664, "global_step": 147862, "epoch": 1781} {"train_loss": -23.779644012451172, "global_step": 147863, "epoch": 1781} {"train_loss": -23.08980369567871, "global_step": 147864, "epoch": 1781} {"train_loss": -22.814170837402344, "global_step": 147865, "epoch": 1781} {"train_loss": -23.290830612182617, "global_step": 147866, "epoch": 1781} {"train_loss": -23.06313705444336, "global_step": 147867, "epoch": 1781} {"train_loss": -23.418485641479492, "global_step": 147868, "epoch": 1781} {"train_loss": -23.144594192504883, "global_step": 147869, "epoch": 1781} {"train_loss": -23.446775436401367, "global_step": 147870, "epoch": 1781} {"train_loss": -23.4282283782959, "global_step": 147871, "epoch": 1781} {"train_loss": -23.289655685424805, "global_step": 147872, "epoch": 1781} {"train_loss": -23.186813354492188, "global_step": 147873, "epoch": 1781} {"train_loss": -23.224828720092773, "global_step": 147874, "epoch": 1781} {"train_loss": -23.353429794311523, "global_step": 147875, "epoch": 1781} {"train_loss": -23.196990966796875, "global_step": 147876, "epoch": 1781} {"train_loss": -23.14204978942871, "global_step": 147877, "epoch": 1781} {"train_loss": -23.260862350463867, "global_step": 147878, "epoch": 1781} {"train_loss": -23.499282836914062, "global_step": 147879, "epoch": 1781} {"train_loss": -23.186359405517578, "global_step": 147880, "epoch": 1781} {"train_loss": -23.322235107421875, "global_step": 147881, "epoch": 1781} {"train_loss": -23.032018661499023, "global_step": 147882, "epoch": 1781} {"train_loss": -23.566564559936523, "global_step": 147883, "epoch": 1781} {"train_loss": -23.001680374145508, "global_step": 147884, "epoch": 1781} {"train_loss": -22.76611328125, "global_step": 147885, "epoch": 1781} {"train_loss": -23.2419490814209, "global_step": 147886, "epoch": 1781} {"train_loss": -23.041608810424805, "global_step": 147887, "epoch": 1781} {"train_loss": -22.945159912109375, "global_step": 147888, "epoch": 1781} {"train_loss": -23.490741729736328, "global_step": 147889, "epoch": 1781} {"train_loss": -22.66777992248535, "global_step": 147890, "epoch": 1781} {"train_loss": -23.186315536499023, "global_step": 147891, "epoch": 1781} {"train_loss": -23.239898681640625, "global_step": 147892, "epoch": 1781} {"train_loss": -22.96583366394043, "global_step": 147893, "epoch": 1781} {"train_loss": -23.44715690612793, "global_step": 147894, "epoch": 1781} {"train_loss": -23.229265213012695, "global_step": 147895, "epoch": 1781} {"train_loss": -23.325834274291992, "global_step": 147896, "epoch": 1781} {"train_loss": -23.38003158569336, "global_step": 147897, "epoch": 1781} {"train_loss": -23.482789993286133, "global_step": 147898, "epoch": 1781} {"train_loss": -23.5306396484375, "global_step": 147899, "epoch": 1781} {"train_loss": -23.58984375, "global_step": 147900, "epoch": 1781} {"train_loss": -23.419540405273438, "global_step": 147901, "epoch": 1781} {"train_loss": -23.383399963378906, "global_step": 147902, "epoch": 1781} {"train_loss": -23.158035278320312, "global_step": 147903, "epoch": 1781} {"train_loss": -23.1478271484375, "global_step": 147904, "epoch": 1781} {"train_loss": -23.133916716977776, "global_step": 147905, "epoch": 1781, "val_loss": 6309456.0} {"train_loss": -22.33176040649414, "global_step": 147906, "epoch": 1782} {"train_loss": -22.297948837280273, "global_step": 147907, "epoch": 1782} {"train_loss": -23.110151290893555, "global_step": 147908, "epoch": 1782} {"train_loss": -22.2353572845459, "global_step": 147909, "epoch": 1782} {"train_loss": -23.047426223754883, "global_step": 147910, "epoch": 1782} {"train_loss": -22.814176559448242, "global_step": 147911, "epoch": 1782} {"train_loss": -22.879480361938477, "global_step": 147912, "epoch": 1782} {"train_loss": -22.88758659362793, "global_step": 147913, "epoch": 1782} {"train_loss": -22.683359146118164, "global_step": 147914, "epoch": 1782} {"train_loss": -23.238447189331055, "global_step": 147915, "epoch": 1782} {"train_loss": -23.29743003845215, "global_step": 147916, "epoch": 1782} {"train_loss": -22.915098190307617, "global_step": 147917, "epoch": 1782} {"train_loss": -22.82181739807129, "global_step": 147918, "epoch": 1782} {"train_loss": -22.71803855895996, "global_step": 147919, "epoch": 1782} {"train_loss": -23.194746017456055, "global_step": 147920, "epoch": 1782} {"train_loss": -22.864736557006836, "global_step": 147921, "epoch": 1782} {"train_loss": -23.111738204956055, "global_step": 147922, "epoch": 1782} {"train_loss": -23.632280349731445, "global_step": 147923, "epoch": 1782} {"train_loss": -23.339914321899414, "global_step": 147924, "epoch": 1782} {"train_loss": -23.192777633666992, "global_step": 147925, "epoch": 1782} {"train_loss": -23.179304122924805, "global_step": 147926, "epoch": 1782} {"train_loss": -22.869606018066406, "global_step": 147927, "epoch": 1782} {"train_loss": -22.886442184448242, "global_step": 147928, "epoch": 1782} {"train_loss": -23.258893966674805, "global_step": 147929, "epoch": 1782} {"train_loss": -23.18282699584961, "global_step": 147930, "epoch": 1782} {"train_loss": -23.09137535095215, "global_step": 147931, "epoch": 1782} {"train_loss": -22.63422203063965, "global_step": 147932, "epoch": 1782} {"train_loss": -23.19866180419922, "global_step": 147933, "epoch": 1782} {"train_loss": -22.964994430541992, "global_step": 147934, "epoch": 1782} {"train_loss": -22.63494300842285, "global_step": 147935, "epoch": 1782} {"train_loss": -23.47139549255371, "global_step": 147936, "epoch": 1782} {"train_loss": -23.044889450073242, "global_step": 147937, "epoch": 1782} {"train_loss": -23.096837997436523, "global_step": 147938, "epoch": 1782} {"train_loss": -22.93482780456543, "global_step": 147939, "epoch": 1782} {"train_loss": -23.33616065979004, "global_step": 147940, "epoch": 1782} {"train_loss": -23.15566062927246, "global_step": 147941, "epoch": 1782} {"train_loss": -23.172760009765625, "global_step": 147942, "epoch": 1782} {"train_loss": -23.55646324157715, "global_step": 147943, "epoch": 1782} {"train_loss": -23.15205192565918, "global_step": 147944, "epoch": 1782} {"train_loss": -23.469017028808594, "global_step": 147945, "epoch": 1782} {"train_loss": -23.310956954956055, "global_step": 147946, "epoch": 1782} {"train_loss": -23.274810791015625, "global_step": 147947, "epoch": 1782} {"train_loss": -23.663734436035156, "global_step": 147948, "epoch": 1782} {"train_loss": -23.523008346557617, "global_step": 147949, "epoch": 1782} {"train_loss": -23.730091094970703, "global_step": 147950, "epoch": 1782} {"train_loss": -23.327238082885742, "global_step": 147951, "epoch": 1782} {"train_loss": -23.029024124145508, "global_step": 147952, "epoch": 1782} {"train_loss": -23.263578414916992, "global_step": 147953, "epoch": 1782} {"train_loss": -23.232879638671875, "global_step": 147954, "epoch": 1782} {"train_loss": -23.446149826049805, "global_step": 147955, "epoch": 1782} {"train_loss": -23.620136260986328, "global_step": 147956, "epoch": 1782} {"train_loss": -23.247665405273438, "global_step": 147957, "epoch": 1782} {"train_loss": -23.02499771118164, "global_step": 147958, "epoch": 1782} {"train_loss": -23.417274475097656, "global_step": 147959, "epoch": 1782} {"train_loss": -22.73017120361328, "global_step": 147960, "epoch": 1782} {"train_loss": -23.189685821533203, "global_step": 147961, "epoch": 1782} {"train_loss": -22.665876388549805, "global_step": 147962, "epoch": 1782} {"train_loss": -23.331254959106445, "global_step": 147963, "epoch": 1782} {"train_loss": -23.005043029785156, "global_step": 147964, "epoch": 1782} {"train_loss": -22.992027282714844, "global_step": 147965, "epoch": 1782} {"train_loss": -23.001821517944336, "global_step": 147966, "epoch": 1782} {"train_loss": -23.507551193237305, "global_step": 147967, "epoch": 1782} {"train_loss": -23.053438186645508, "global_step": 147968, "epoch": 1782} {"train_loss": -23.182647705078125, "global_step": 147969, "epoch": 1782} {"train_loss": -23.20699119567871, "global_step": 147970, "epoch": 1782} {"train_loss": -23.25147247314453, "global_step": 147971, "epoch": 1782} {"train_loss": -23.110137939453125, "global_step": 147972, "epoch": 1782} {"train_loss": -22.974016189575195, "global_step": 147973, "epoch": 1782} {"train_loss": -22.963790893554688, "global_step": 147974, "epoch": 1782} {"train_loss": -22.906187057495117, "global_step": 147975, "epoch": 1782} {"train_loss": -23.470783233642578, "global_step": 147976, "epoch": 1782} {"train_loss": -23.05167007446289, "global_step": 147977, "epoch": 1782} {"train_loss": -23.302026748657227, "global_step": 147978, "epoch": 1782} {"train_loss": -22.665658950805664, "global_step": 147979, "epoch": 1782} {"train_loss": -23.244932174682617, "global_step": 147980, "epoch": 1782} {"train_loss": -23.075546264648438, "global_step": 147981, "epoch": 1782} {"train_loss": -23.098133087158203, "global_step": 147982, "epoch": 1782} {"train_loss": -23.225107192993164, "global_step": 147983, "epoch": 1782} {"train_loss": -23.122068405151367, "global_step": 147984, "epoch": 1782} {"train_loss": -23.59745979309082, "global_step": 147985, "epoch": 1782} {"train_loss": -23.103580474853516, "global_step": 147986, "epoch": 1782} {"train_loss": -23.476123809814453, "global_step": 147987, "epoch": 1782} {"train_loss": -23.12030017806823, "global_step": 147988, "epoch": 1782, "val_loss": 6210762.0} {"train_loss": -22.110504150390625, "global_step": 147989, "epoch": 1783} {"train_loss": -22.682523727416992, "global_step": 147990, "epoch": 1783} {"train_loss": -22.86178207397461, "global_step": 147991, "epoch": 1783} {"train_loss": -23.248485565185547, "global_step": 147992, "epoch": 1783} {"train_loss": -22.460317611694336, "global_step": 147993, "epoch": 1783} {"train_loss": -23.187253952026367, "global_step": 147994, "epoch": 1783} {"train_loss": -22.774593353271484, "global_step": 147995, "epoch": 1783} {"train_loss": -22.915382385253906, "global_step": 147996, "epoch": 1783} {"train_loss": -23.4448299407959, "global_step": 147997, "epoch": 1783} {"train_loss": -23.230772018432617, "global_step": 147998, "epoch": 1783} {"train_loss": -22.91724967956543, "global_step": 147999, "epoch": 1783} {"train_loss": -22.81281280517578, "global_step": 148000, "epoch": 1783} {"train_loss": -22.860471725463867, "global_step": 148001, "epoch": 1783} {"train_loss": -23.030302047729492, "global_step": 148002, "epoch": 1783} {"train_loss": -23.133708953857422, "global_step": 148003, "epoch": 1783} {"train_loss": -22.798616409301758, "global_step": 148004, "epoch": 1783} {"train_loss": -23.06455421447754, "global_step": 148005, "epoch": 1783} {"train_loss": -23.259206771850586, "global_step": 148006, "epoch": 1783} {"train_loss": -23.11140251159668, "global_step": 148007, "epoch": 1783} {"train_loss": -23.017194747924805, "global_step": 148008, "epoch": 1783} {"train_loss": -23.08165168762207, "global_step": 148009, "epoch": 1783} {"train_loss": -23.08741569519043, "global_step": 148010, "epoch": 1783} {"train_loss": -23.20656967163086, "global_step": 148011, "epoch": 1783} {"train_loss": -23.26247787475586, "global_step": 148012, "epoch": 1783} {"train_loss": -22.538328170776367, "global_step": 148013, "epoch": 1783} {"train_loss": -23.141563415527344, "global_step": 148014, "epoch": 1783} {"train_loss": -23.16691017150879, "global_step": 148015, "epoch": 1783} {"train_loss": -23.252445220947266, "global_step": 148016, "epoch": 1783} {"train_loss": -23.215246200561523, "global_step": 148017, "epoch": 1783} {"train_loss": -23.549718856811523, "global_step": 148018, "epoch": 1783} {"train_loss": -22.854557037353516, "global_step": 148019, "epoch": 1783} {"train_loss": -23.150400161743164, "global_step": 148020, "epoch": 1783} {"train_loss": -23.208974838256836, "global_step": 148021, "epoch": 1783} {"train_loss": -23.0490665435791, "global_step": 148022, "epoch": 1783} {"train_loss": -23.449588775634766, "global_step": 148023, "epoch": 1783} {"train_loss": -22.944995880126953, "global_step": 148024, "epoch": 1783} {"train_loss": -22.889022827148438, "global_step": 148025, "epoch": 1783} {"train_loss": -23.37967872619629, "global_step": 148026, "epoch": 1783} {"train_loss": -23.126800537109375, "global_step": 148027, "epoch": 1783} {"train_loss": -23.37897300720215, "global_step": 148028, "epoch": 1783} {"train_loss": -23.23663902282715, "global_step": 148029, "epoch": 1783} {"train_loss": -23.24715805053711, "global_step": 148030, "epoch": 1783} {"train_loss": -23.286035537719727, "global_step": 148031, "epoch": 1783} {"train_loss": -23.268314361572266, "global_step": 148032, "epoch": 1783} {"train_loss": -23.343475341796875, "global_step": 148033, "epoch": 1783} {"train_loss": -23.24205780029297, "global_step": 148034, "epoch": 1783} {"train_loss": -23.269140243530273, "global_step": 148035, "epoch": 1783} {"train_loss": -23.07680892944336, "global_step": 148036, "epoch": 1783} {"train_loss": -23.416982650756836, "global_step": 148037, "epoch": 1783} {"train_loss": -23.11783790588379, "global_step": 148038, "epoch": 1783} {"train_loss": -23.459821701049805, "global_step": 148039, "epoch": 1783} {"train_loss": -23.330215454101562, "global_step": 148040, "epoch": 1783} {"train_loss": -23.18169403076172, "global_step": 148041, "epoch": 1783} {"train_loss": -22.727527618408203, "global_step": 148042, "epoch": 1783} {"train_loss": -23.548330307006836, "global_step": 148043, "epoch": 1783} {"train_loss": -23.45931053161621, "global_step": 148044, "epoch": 1783} {"train_loss": -23.041969299316406, "global_step": 148045, "epoch": 1783} {"train_loss": -23.50428581237793, "global_step": 148046, "epoch": 1783} {"train_loss": -23.020055770874023, "global_step": 148047, "epoch": 1783} {"train_loss": -23.120405197143555, "global_step": 148048, "epoch": 1783} {"train_loss": -23.065114974975586, "global_step": 148049, "epoch": 1783} {"train_loss": -23.129749298095703, "global_step": 148050, "epoch": 1783} {"train_loss": -23.145536422729492, "global_step": 148051, "epoch": 1783} {"train_loss": -23.385812759399414, "global_step": 148052, "epoch": 1783} {"train_loss": -23.339324951171875, "global_step": 148053, "epoch": 1783} {"train_loss": -22.971912384033203, "global_step": 148054, "epoch": 1783} {"train_loss": -23.586227416992188, "global_step": 148055, "epoch": 1783} {"train_loss": -23.27564811706543, "global_step": 148056, "epoch": 1783} {"train_loss": -23.455930709838867, "global_step": 148057, "epoch": 1783} {"train_loss": -22.808698654174805, "global_step": 148058, "epoch": 1783} {"train_loss": -22.993616104125977, "global_step": 148059, "epoch": 1783} {"train_loss": -23.108280181884766, "global_step": 148060, "epoch": 1783} {"train_loss": -23.636985778808594, "global_step": 148061, "epoch": 1783} {"train_loss": -22.97088050842285, "global_step": 148062, "epoch": 1783} {"train_loss": -23.239187240600586, "global_step": 148063, "epoch": 1783} {"train_loss": -23.1887149810791, "global_step": 148064, "epoch": 1783} {"train_loss": -23.204771041870117, "global_step": 148065, "epoch": 1783} {"train_loss": -22.774381637573242, "global_step": 148066, "epoch": 1783} {"train_loss": -23.02484130859375, "global_step": 148067, "epoch": 1783} {"train_loss": -23.19908332824707, "global_step": 148068, "epoch": 1783} {"train_loss": -23.70013999938965, "global_step": 148069, "epoch": 1783} {"train_loss": -23.113271713256836, "global_step": 148070, "epoch": 1783} {"train_loss": -23.142595130276966, "global_step": 148071, "epoch": 1783, "val_loss": 6309702.0} {"train_loss": -22.746414184570312, "global_step": 148072, "epoch": 1784} {"train_loss": -22.78207778930664, "global_step": 148073, "epoch": 1784} {"train_loss": -22.863779067993164, "global_step": 148074, "epoch": 1784} {"train_loss": -22.949216842651367, "global_step": 148075, "epoch": 1784} {"train_loss": -23.04480743408203, "global_step": 148076, "epoch": 1784} {"train_loss": -22.899198532104492, "global_step": 148077, "epoch": 1784} {"train_loss": -22.697790145874023, "global_step": 148078, "epoch": 1784} {"train_loss": -23.173389434814453, "global_step": 148079, "epoch": 1784} {"train_loss": -23.076282501220703, "global_step": 148080, "epoch": 1784} {"train_loss": -22.799108505249023, "global_step": 148081, "epoch": 1784} {"train_loss": -22.902217864990234, "global_step": 148082, "epoch": 1784} {"train_loss": -23.426761627197266, "global_step": 148083, "epoch": 1784} {"train_loss": -22.756671905517578, "global_step": 148084, "epoch": 1784} {"train_loss": -22.761852264404297, "global_step": 148085, "epoch": 1784} {"train_loss": -22.969436645507812, "global_step": 148086, "epoch": 1784} {"train_loss": -23.012651443481445, "global_step": 148087, "epoch": 1784} {"train_loss": -23.248327255249023, "global_step": 148088, "epoch": 1784} {"train_loss": -22.983144760131836, "global_step": 148089, "epoch": 1784} {"train_loss": -23.31037139892578, "global_step": 148090, "epoch": 1784} {"train_loss": -23.28314781188965, "global_step": 148091, "epoch": 1784} {"train_loss": -23.105514526367188, "global_step": 148092, "epoch": 1784} {"train_loss": -23.165142059326172, "global_step": 148093, "epoch": 1784} {"train_loss": -23.404346466064453, "global_step": 148094, "epoch": 1784} {"train_loss": -23.519699096679688, "global_step": 148095, "epoch": 1784} {"train_loss": -23.309715270996094, "global_step": 148096, "epoch": 1784} {"train_loss": -22.7391357421875, "global_step": 148097, "epoch": 1784} {"train_loss": -23.02921485900879, "global_step": 148098, "epoch": 1784} {"train_loss": -23.39794921875, "global_step": 148099, "epoch": 1784} {"train_loss": -23.243061065673828, "global_step": 148100, "epoch": 1784} {"train_loss": -23.235593795776367, "global_step": 148101, "epoch": 1784} {"train_loss": -23.591344833374023, "global_step": 148102, "epoch": 1784} {"train_loss": -23.26058006286621, "global_step": 148103, "epoch": 1784} {"train_loss": -23.35775375366211, "global_step": 148104, "epoch": 1784} {"train_loss": -23.183191299438477, "global_step": 148105, "epoch": 1784} {"train_loss": -23.36775016784668, "global_step": 148106, "epoch": 1784} {"train_loss": -23.334964752197266, "global_step": 148107, "epoch": 1784} {"train_loss": -23.149187088012695, "global_step": 148108, "epoch": 1784} {"train_loss": -23.354581832885742, "global_step": 148109, "epoch": 1784} {"train_loss": -23.2769775390625, "global_step": 148110, "epoch": 1784} {"train_loss": -23.19965171813965, "global_step": 148111, "epoch": 1784} {"train_loss": -23.17286491394043, "global_step": 148112, "epoch": 1784} {"train_loss": -23.094011306762695, "global_step": 148113, "epoch": 1784} {"train_loss": -23.330751419067383, "global_step": 148114, "epoch": 1784} {"train_loss": -23.142385482788086, "global_step": 148115, "epoch": 1784} {"train_loss": -23.169723510742188, "global_step": 148116, "epoch": 1784} {"train_loss": -23.285783767700195, "global_step": 148117, "epoch": 1784} {"train_loss": -23.239063262939453, "global_step": 148118, "epoch": 1784} {"train_loss": -23.417692184448242, "global_step": 148119, "epoch": 1784} {"train_loss": -22.937820434570312, "global_step": 148120, "epoch": 1784} {"train_loss": -22.940820693969727, "global_step": 148121, "epoch": 1784} {"train_loss": -23.539587020874023, "global_step": 148122, "epoch": 1784} {"train_loss": -22.817066192626953, "global_step": 148123, "epoch": 1784} {"train_loss": -23.191450119018555, "global_step": 148124, "epoch": 1784} {"train_loss": -23.0006046295166, "global_step": 148125, "epoch": 1784} {"train_loss": -23.483789443969727, "global_step": 148126, "epoch": 1784} {"train_loss": -23.13148307800293, "global_step": 148127, "epoch": 1784} {"train_loss": -22.883596420288086, "global_step": 148128, "epoch": 1784} {"train_loss": -22.86350440979004, "global_step": 148129, "epoch": 1784} {"train_loss": -23.051000595092773, "global_step": 148130, "epoch": 1784} {"train_loss": -23.53564453125, "global_step": 148131, "epoch": 1784} {"train_loss": -23.158668518066406, "global_step": 148132, "epoch": 1784} {"train_loss": -23.493671417236328, "global_step": 148133, "epoch": 1784} {"train_loss": -23.085660934448242, "global_step": 148134, "epoch": 1784} {"train_loss": -23.135540008544922, "global_step": 148135, "epoch": 1784} {"train_loss": -23.4374942779541, "global_step": 148136, "epoch": 1784} {"train_loss": -23.549591064453125, "global_step": 148137, "epoch": 1784} {"train_loss": -23.36777687072754, "global_step": 148138, "epoch": 1784} {"train_loss": -23.272964477539062, "global_step": 148139, "epoch": 1784} {"train_loss": -23.15718650817871, "global_step": 148140, "epoch": 1784} {"train_loss": -23.31808853149414, "global_step": 148141, "epoch": 1784} {"train_loss": -23.159440994262695, "global_step": 148142, "epoch": 1784} {"train_loss": -23.335895538330078, "global_step": 148143, "epoch": 1784} {"train_loss": -23.34320068359375, "global_step": 148144, "epoch": 1784} {"train_loss": -23.29741859436035, "global_step": 148145, "epoch": 1784} {"train_loss": -23.21536636352539, "global_step": 148146, "epoch": 1784} {"train_loss": -23.135766983032227, "global_step": 148147, "epoch": 1784} {"train_loss": -23.244861602783203, "global_step": 148148, "epoch": 1784} {"train_loss": -23.081451416015625, "global_step": 148149, "epoch": 1784} {"train_loss": -23.200748443603516, "global_step": 148150, "epoch": 1784} {"train_loss": -23.199583053588867, "global_step": 148151, "epoch": 1784} {"train_loss": -23.415884017944336, "global_step": 148152, "epoch": 1784} {"train_loss": -23.02779769897461, "global_step": 148153, "epoch": 1784} {"train_loss": -23.174392907016248, "global_step": 148154, "epoch": 1784, "val_loss": 6381311.0} {"train_loss": -22.465574264526367, "global_step": 148155, "epoch": 1785} {"train_loss": -22.121713638305664, "global_step": 148156, "epoch": 1785} {"train_loss": -22.759008407592773, "global_step": 148157, "epoch": 1785} {"train_loss": -22.994857788085938, "global_step": 148158, "epoch": 1785} {"train_loss": -22.942211151123047, "global_step": 148159, "epoch": 1785} {"train_loss": -22.838233947753906, "global_step": 148160, "epoch": 1785} {"train_loss": -22.788488388061523, "global_step": 148161, "epoch": 1785} {"train_loss": -22.859725952148438, "global_step": 148162, "epoch": 1785} {"train_loss": -23.27764320373535, "global_step": 148163, "epoch": 1785} {"train_loss": -22.824918746948242, "global_step": 148164, "epoch": 1785} {"train_loss": -22.815000534057617, "global_step": 148165, "epoch": 1785} {"train_loss": -23.290559768676758, "global_step": 148166, "epoch": 1785} {"train_loss": -23.107255935668945, "global_step": 148167, "epoch": 1785} {"train_loss": -23.333219528198242, "global_step": 148168, "epoch": 1785} {"train_loss": -23.186124801635742, "global_step": 148169, "epoch": 1785} {"train_loss": -23.25490379333496, "global_step": 148170, "epoch": 1785} {"train_loss": -23.077802658081055, "global_step": 148171, "epoch": 1785} {"train_loss": -23.001157760620117, "global_step": 148172, "epoch": 1785} {"train_loss": -23.186635971069336, "global_step": 148173, "epoch": 1785} {"train_loss": -22.855785369873047, "global_step": 148174, "epoch": 1785} {"train_loss": -23.524858474731445, "global_step": 148175, "epoch": 1785} {"train_loss": -23.182994842529297, "global_step": 148176, "epoch": 1785} {"train_loss": -23.260412216186523, "global_step": 148177, "epoch": 1785} {"train_loss": -23.162553787231445, "global_step": 148178, "epoch": 1785} {"train_loss": -22.98256492614746, "global_step": 148179, "epoch": 1785} {"train_loss": -22.826984405517578, "global_step": 148180, "epoch": 1785} {"train_loss": -23.068626403808594, "global_step": 148181, "epoch": 1785} {"train_loss": -23.452239990234375, "global_step": 148182, "epoch": 1785} {"train_loss": -23.312992095947266, "global_step": 148183, "epoch": 1785} {"train_loss": -23.207168579101562, "global_step": 148184, "epoch": 1785} {"train_loss": -23.47509765625, "global_step": 148185, "epoch": 1785} {"train_loss": -23.299856185913086, "global_step": 148186, "epoch": 1785} {"train_loss": -23.15177345275879, "global_step": 148187, "epoch": 1785} {"train_loss": -23.520294189453125, "global_step": 148188, "epoch": 1785} {"train_loss": -23.210865020751953, "global_step": 148189, "epoch": 1785} {"train_loss": -23.053953170776367, "global_step": 148190, "epoch": 1785} {"train_loss": -22.970090866088867, "global_step": 148191, "epoch": 1785} {"train_loss": -23.354690551757812, "global_step": 148192, "epoch": 1785} {"train_loss": -23.517215728759766, "global_step": 148193, "epoch": 1785} {"train_loss": -23.64603042602539, "global_step": 148194, "epoch": 1785} {"train_loss": -23.060226440429688, "global_step": 148195, "epoch": 1785} {"train_loss": -23.37898826599121, "global_step": 148196, "epoch": 1785} {"train_loss": -23.274011611938477, "global_step": 148197, "epoch": 1785} {"train_loss": -23.232954025268555, "global_step": 148198, "epoch": 1785} {"train_loss": -23.233755111694336, "global_step": 148199, "epoch": 1785} {"train_loss": -23.377941131591797, "global_step": 148200, "epoch": 1785} {"train_loss": -23.551977157592773, "global_step": 148201, "epoch": 1785} {"train_loss": -23.011783599853516, "global_step": 148202, "epoch": 1785} {"train_loss": -23.506729125976562, "global_step": 148203, "epoch": 1785} {"train_loss": -23.11050796508789, "global_step": 148204, "epoch": 1785} {"train_loss": -23.002187728881836, "global_step": 148205, "epoch": 1785} {"train_loss": -22.922468185424805, "global_step": 148206, "epoch": 1785} {"train_loss": -23.37787628173828, "global_step": 148207, "epoch": 1785} {"train_loss": -23.266376495361328, "global_step": 148208, "epoch": 1785} {"train_loss": -23.10445213317871, "global_step": 148209, "epoch": 1785} {"train_loss": -22.971961975097656, "global_step": 148210, "epoch": 1785} {"train_loss": -23.27928924560547, "global_step": 148211, "epoch": 1785} {"train_loss": -23.357778549194336, "global_step": 148212, "epoch": 1785} {"train_loss": -23.408727645874023, "global_step": 148213, "epoch": 1785} {"train_loss": -23.203725814819336, "global_step": 148214, "epoch": 1785} {"train_loss": -23.069141387939453, "global_step": 148215, "epoch": 1785} {"train_loss": -23.187543869018555, "global_step": 148216, "epoch": 1785} {"train_loss": -23.208118438720703, "global_step": 148217, "epoch": 1785} {"train_loss": -23.4073486328125, "global_step": 148218, "epoch": 1785} {"train_loss": -23.208431243896484, "global_step": 148219, "epoch": 1785} {"train_loss": -23.426822662353516, "global_step": 148220, "epoch": 1785} {"train_loss": -23.19846534729004, "global_step": 148221, "epoch": 1785} {"train_loss": -23.470796585083008, "global_step": 148222, "epoch": 1785} {"train_loss": -23.209407806396484, "global_step": 148223, "epoch": 1785} {"train_loss": -23.13847541809082, "global_step": 148224, "epoch": 1785} {"train_loss": -23.099828720092773, "global_step": 148225, "epoch": 1785} {"train_loss": -23.5457820892334, "global_step": 148226, "epoch": 1785} {"train_loss": -23.37865447998047, "global_step": 148227, "epoch": 1785} {"train_loss": -23.098791122436523, "global_step": 148228, "epoch": 1785} {"train_loss": -23.06232261657715, "global_step": 148229, "epoch": 1785} {"train_loss": -23.206707000732422, "global_step": 148230, "epoch": 1785} {"train_loss": -23.228025436401367, "global_step": 148231, "epoch": 1785} {"train_loss": -23.133405685424805, "global_step": 148232, "epoch": 1785} {"train_loss": -23.453969955444336, "global_step": 148233, "epoch": 1785} {"train_loss": -23.143600463867188, "global_step": 148234, "epoch": 1785} {"train_loss": -22.95673179626465, "global_step": 148235, "epoch": 1785} {"train_loss": -23.221799850463867, "global_step": 148236, "epoch": 1785} {"train_loss": -23.168441473719586, "global_step": 148237, "epoch": 1785, "val_loss": 6336120.0} {"train_loss": -22.84409523010254, "global_step": 148238, "epoch": 1786} {"train_loss": -22.7358455657959, "global_step": 148239, "epoch": 1786} {"train_loss": -23.02488136291504, "global_step": 148240, "epoch": 1786} {"train_loss": -22.60154151916504, "global_step": 148241, "epoch": 1786} {"train_loss": -22.935606002807617, "global_step": 148242, "epoch": 1786} {"train_loss": -22.90717124938965, "global_step": 148243, "epoch": 1786} {"train_loss": -22.76419448852539, "global_step": 148244, "epoch": 1786} {"train_loss": -22.815839767456055, "global_step": 148245, "epoch": 1786} {"train_loss": -22.798940658569336, "global_step": 148246, "epoch": 1786} {"train_loss": -22.91494369506836, "global_step": 148247, "epoch": 1786} {"train_loss": -23.099042892456055, "global_step": 148248, "epoch": 1786} {"train_loss": -22.515336990356445, "global_step": 148249, "epoch": 1786} {"train_loss": -22.867189407348633, "global_step": 148250, "epoch": 1786} {"train_loss": -23.015350341796875, "global_step": 148251, "epoch": 1786} {"train_loss": -22.945844650268555, "global_step": 148252, "epoch": 1786} {"train_loss": -23.480329513549805, "global_step": 148253, "epoch": 1786} {"train_loss": -23.198617935180664, "global_step": 148254, "epoch": 1786} {"train_loss": -23.140335083007812, "global_step": 148255, "epoch": 1786} {"train_loss": -23.061782836914062, "global_step": 148256, "epoch": 1786} {"train_loss": -23.231542587280273, "global_step": 148257, "epoch": 1786} {"train_loss": -23.07551383972168, "global_step": 148258, "epoch": 1786} {"train_loss": -23.13046646118164, "global_step": 148259, "epoch": 1786} {"train_loss": -22.849559783935547, "global_step": 148260, "epoch": 1786} {"train_loss": -23.132654190063477, "global_step": 148261, "epoch": 1786} {"train_loss": -23.212614059448242, "global_step": 148262, "epoch": 1786} {"train_loss": -23.08699607849121, "global_step": 148263, "epoch": 1786} {"train_loss": -23.030210494995117, "global_step": 148264, "epoch": 1786} {"train_loss": -23.390684127807617, "global_step": 148265, "epoch": 1786} {"train_loss": -23.23554039001465, "global_step": 148266, "epoch": 1786} {"train_loss": -23.14291000366211, "global_step": 148267, "epoch": 1786} {"train_loss": -23.2536678314209, "global_step": 148268, "epoch": 1786} {"train_loss": -23.2838191986084, "global_step": 148269, "epoch": 1786} {"train_loss": -23.58631706237793, "global_step": 148270, "epoch": 1786} {"train_loss": -23.325782775878906, "global_step": 148271, "epoch": 1786} {"train_loss": -23.60515022277832, "global_step": 148272, "epoch": 1786} {"train_loss": -23.42521095275879, "global_step": 148273, "epoch": 1786} {"train_loss": -23.073678970336914, "global_step": 148274, "epoch": 1786} {"train_loss": -23.38390350341797, "global_step": 148275, "epoch": 1786} {"train_loss": -23.270282745361328, "global_step": 148276, "epoch": 1786} {"train_loss": -23.30787467956543, "global_step": 148277, "epoch": 1786} {"train_loss": -23.485502243041992, "global_step": 148278, "epoch": 1786} {"train_loss": -23.100494384765625, "global_step": 148279, "epoch": 1786} {"train_loss": -23.175199508666992, "global_step": 148280, "epoch": 1786} {"train_loss": -23.03116226196289, "global_step": 148281, "epoch": 1786} {"train_loss": -22.892444610595703, "global_step": 148282, "epoch": 1786} {"train_loss": -22.607776641845703, "global_step": 148283, "epoch": 1786} {"train_loss": -23.019376754760742, "global_step": 148284, "epoch": 1786} {"train_loss": -23.04261589050293, "global_step": 148285, "epoch": 1786} {"train_loss": -23.3243408203125, "global_step": 148286, "epoch": 1786} {"train_loss": -23.31476402282715, "global_step": 148287, "epoch": 1786} {"train_loss": -23.034101486206055, "global_step": 148288, "epoch": 1786} {"train_loss": -23.290136337280273, "global_step": 148289, "epoch": 1786} {"train_loss": -23.138593673706055, "global_step": 148290, "epoch": 1786} {"train_loss": -23.201404571533203, "global_step": 148291, "epoch": 1786} {"train_loss": -23.07964515686035, "global_step": 148292, "epoch": 1786} {"train_loss": -22.943288803100586, "global_step": 148293, "epoch": 1786} {"train_loss": -23.160139083862305, "global_step": 148294, "epoch": 1786} {"train_loss": -23.270788192749023, "global_step": 148295, "epoch": 1786} {"train_loss": -23.259429931640625, "global_step": 148296, "epoch": 1786} {"train_loss": -23.110937118530273, "global_step": 148297, "epoch": 1786} {"train_loss": -23.265195846557617, "global_step": 148298, "epoch": 1786} {"train_loss": -23.23431968688965, "global_step": 148299, "epoch": 1786} {"train_loss": -23.12472915649414, "global_step": 148300, "epoch": 1786} {"train_loss": -23.153827667236328, "global_step": 148301, "epoch": 1786} {"train_loss": -23.447113037109375, "global_step": 148302, "epoch": 1786} {"train_loss": -22.90806007385254, "global_step": 148303, "epoch": 1786} {"train_loss": -23.231338500976562, "global_step": 148304, "epoch": 1786} {"train_loss": -23.01949119567871, "global_step": 148305, "epoch": 1786} {"train_loss": -23.210851669311523, "global_step": 148306, "epoch": 1786} {"train_loss": -23.305356979370117, "global_step": 148307, "epoch": 1786} {"train_loss": -23.050853729248047, "global_step": 148308, "epoch": 1786} {"train_loss": -23.015552520751953, "global_step": 148309, "epoch": 1786} {"train_loss": -22.777971267700195, "global_step": 148310, "epoch": 1786} {"train_loss": -23.349872589111328, "global_step": 148311, "epoch": 1786} {"train_loss": -23.161041259765625, "global_step": 148312, "epoch": 1786} {"train_loss": -23.234222412109375, "global_step": 148313, "epoch": 1786} {"train_loss": -23.274961471557617, "global_step": 148314, "epoch": 1786} {"train_loss": -23.38043785095215, "global_step": 148315, "epoch": 1786} {"train_loss": -23.3983097076416, "global_step": 148316, "epoch": 1786} {"train_loss": -23.095075607299805, "global_step": 148317, "epoch": 1786} {"train_loss": -23.1773738861084, "global_step": 148318, "epoch": 1786} {"train_loss": -23.39596939086914, "global_step": 148319, "epoch": 1786} {"train_loss": -23.13389863163592, "global_step": 148320, "epoch": 1786, "val_loss": 6330410.5} {"train_loss": -22.611698150634766, "global_step": 148321, "epoch": 1787} {"train_loss": -22.534378051757812, "global_step": 148322, "epoch": 1787} {"train_loss": -23.27108383178711, "global_step": 148323, "epoch": 1787} {"train_loss": -23.342267990112305, "global_step": 148324, "epoch": 1787} {"train_loss": -23.05924415588379, "global_step": 148325, "epoch": 1787} {"train_loss": -22.845645904541016, "global_step": 148326, "epoch": 1787} {"train_loss": -23.141422271728516, "global_step": 148327, "epoch": 1787} {"train_loss": -23.188268661499023, "global_step": 148328, "epoch": 1787} {"train_loss": -23.440921783447266, "global_step": 148329, "epoch": 1787} {"train_loss": -23.053390502929688, "global_step": 148330, "epoch": 1787} {"train_loss": -23.229822158813477, "global_step": 148331, "epoch": 1787} {"train_loss": -23.240650177001953, "global_step": 148332, "epoch": 1787} {"train_loss": -23.268695831298828, "global_step": 148333, "epoch": 1787} {"train_loss": -23.378599166870117, "global_step": 148334, "epoch": 1787} {"train_loss": -23.429931640625, "global_step": 148335, "epoch": 1787} {"train_loss": -22.85335350036621, "global_step": 148336, "epoch": 1787} {"train_loss": -23.528579711914062, "global_step": 148337, "epoch": 1787} {"train_loss": -23.189863204956055, "global_step": 148338, "epoch": 1787} {"train_loss": -23.42548179626465, "global_step": 148339, "epoch": 1787} {"train_loss": -23.139623641967773, "global_step": 148340, "epoch": 1787} {"train_loss": -23.179088592529297, "global_step": 148341, "epoch": 1787} {"train_loss": -23.192838668823242, "global_step": 148342, "epoch": 1787} {"train_loss": -22.968984603881836, "global_step": 148343, "epoch": 1787} {"train_loss": -23.120908737182617, "global_step": 148344, "epoch": 1787} {"train_loss": -22.97332191467285, "global_step": 148345, "epoch": 1787} {"train_loss": -23.212705612182617, "global_step": 148346, "epoch": 1787} {"train_loss": -23.219934463500977, "global_step": 148347, "epoch": 1787} {"train_loss": -23.016141891479492, "global_step": 148348, "epoch": 1787} {"train_loss": -22.94721221923828, "global_step": 148349, "epoch": 1787} {"train_loss": -23.393203735351562, "global_step": 148350, "epoch": 1787} {"train_loss": -23.36429786682129, "global_step": 148351, "epoch": 1787} {"train_loss": -23.783720016479492, "global_step": 148352, "epoch": 1787} {"train_loss": -23.16888427734375, "global_step": 148353, "epoch": 1787} {"train_loss": -23.587324142456055, "global_step": 148354, "epoch": 1787} {"train_loss": -23.48001480102539, "global_step": 148355, "epoch": 1787} {"train_loss": -23.332033157348633, "global_step": 148356, "epoch": 1787} {"train_loss": -23.147525787353516, "global_step": 148357, "epoch": 1787} {"train_loss": -23.551416397094727, "global_step": 148358, "epoch": 1787} {"train_loss": -23.499719619750977, "global_step": 148359, "epoch": 1787} {"train_loss": -23.39162254333496, "global_step": 148360, "epoch": 1787} {"train_loss": -23.338056564331055, "global_step": 148361, "epoch": 1787} {"train_loss": -23.44208335876465, "global_step": 148362, "epoch": 1787} {"train_loss": -23.001434326171875, "global_step": 148363, "epoch": 1787} {"train_loss": -23.37281608581543, "global_step": 148364, "epoch": 1787} {"train_loss": -23.0788516998291, "global_step": 148365, "epoch": 1787} {"train_loss": -22.68850326538086, "global_step": 148366, "epoch": 1787} {"train_loss": -23.551450729370117, "global_step": 148367, "epoch": 1787} {"train_loss": -22.38727569580078, "global_step": 148368, "epoch": 1787} {"train_loss": -22.639514923095703, "global_step": 148369, "epoch": 1787} {"train_loss": -22.562658309936523, "global_step": 148370, "epoch": 1787} {"train_loss": -22.69940185546875, "global_step": 148371, "epoch": 1787} {"train_loss": -23.235666275024414, "global_step": 148372, "epoch": 1787} {"train_loss": -22.734487533569336, "global_step": 148373, "epoch": 1787} {"train_loss": -23.24453353881836, "global_step": 148374, "epoch": 1787} {"train_loss": -23.3617000579834, "global_step": 148375, "epoch": 1787} {"train_loss": -23.313657760620117, "global_step": 148376, "epoch": 1787} {"train_loss": -23.15742301940918, "global_step": 148377, "epoch": 1787} {"train_loss": -23.231555938720703, "global_step": 148378, "epoch": 1787} {"train_loss": -23.240947723388672, "global_step": 148379, "epoch": 1787} {"train_loss": -23.07840347290039, "global_step": 148380, "epoch": 1787} {"train_loss": -22.968530654907227, "global_step": 148381, "epoch": 1787} {"train_loss": -23.298307418823242, "global_step": 148382, "epoch": 1787} {"train_loss": -22.930856704711914, "global_step": 148383, "epoch": 1787} {"train_loss": -23.308025360107422, "global_step": 148384, "epoch": 1787} {"train_loss": -23.010976791381836, "global_step": 148385, "epoch": 1787} {"train_loss": -22.965957641601562, "global_step": 148386, "epoch": 1787} {"train_loss": -23.49519157409668, "global_step": 148387, "epoch": 1787} {"train_loss": -23.022371292114258, "global_step": 148388, "epoch": 1787} {"train_loss": -23.32819175720215, "global_step": 148389, "epoch": 1787} {"train_loss": -23.210769653320312, "global_step": 148390, "epoch": 1787} {"train_loss": -23.732229232788086, "global_step": 148391, "epoch": 1787} {"train_loss": -23.369449615478516, "global_step": 148392, "epoch": 1787} {"train_loss": -22.944568634033203, "global_step": 148393, "epoch": 1787} {"train_loss": -23.3510684967041, "global_step": 148394, "epoch": 1787} {"train_loss": -23.010526657104492, "global_step": 148395, "epoch": 1787} {"train_loss": -23.377460479736328, "global_step": 148396, "epoch": 1787} {"train_loss": -22.753870010375977, "global_step": 148397, "epoch": 1787} {"train_loss": -23.23419761657715, "global_step": 148398, "epoch": 1787} {"train_loss": -23.435049057006836, "global_step": 148399, "epoch": 1787} {"train_loss": -23.41213035583496, "global_step": 148400, "epoch": 1787} {"train_loss": -23.23990249633789, "global_step": 148401, "epoch": 1787} {"train_loss": -23.433034896850586, "global_step": 148402, "epoch": 1787} {"train_loss": -23.187914974718208, "global_step": 148403, "epoch": 1787, "val_loss": 6260990.0} {"train_loss": -22.523794174194336, "global_step": 148404, "epoch": 1788} {"train_loss": -22.308446884155273, "global_step": 148405, "epoch": 1788} {"train_loss": -23.09720802307129, "global_step": 148406, "epoch": 1788} {"train_loss": -22.57636070251465, "global_step": 148407, "epoch": 1788} {"train_loss": -22.688190460205078, "global_step": 148408, "epoch": 1788} {"train_loss": -22.88763999938965, "global_step": 148409, "epoch": 1788} {"train_loss": -22.964130401611328, "global_step": 148410, "epoch": 1788} {"train_loss": -22.616750717163086, "global_step": 148411, "epoch": 1788} {"train_loss": -23.009191513061523, "global_step": 148412, "epoch": 1788} {"train_loss": -22.741243362426758, "global_step": 148413, "epoch": 1788} {"train_loss": -22.955644607543945, "global_step": 148414, "epoch": 1788} {"train_loss": -22.898422241210938, "global_step": 148415, "epoch": 1788} {"train_loss": -23.13002586364746, "global_step": 148416, "epoch": 1788} {"train_loss": -22.794506072998047, "global_step": 148417, "epoch": 1788} {"train_loss": -22.792797088623047, "global_step": 148418, "epoch": 1788} {"train_loss": -22.78874969482422, "global_step": 148419, "epoch": 1788} {"train_loss": -22.744314193725586, "global_step": 148420, "epoch": 1788} {"train_loss": -22.830780029296875, "global_step": 148421, "epoch": 1788} {"train_loss": -23.06920051574707, "global_step": 148422, "epoch": 1788} {"train_loss": -23.2354793548584, "global_step": 148423, "epoch": 1788} {"train_loss": -23.226598739624023, "global_step": 148424, "epoch": 1788} {"train_loss": -23.01946449279785, "global_step": 148425, "epoch": 1788} {"train_loss": -22.902315139770508, "global_step": 148426, "epoch": 1788} {"train_loss": -22.973941802978516, "global_step": 148427, "epoch": 1788} {"train_loss": -22.962326049804688, "global_step": 148428, "epoch": 1788} {"train_loss": -23.178970336914062, "global_step": 148429, "epoch": 1788} {"train_loss": -22.931922912597656, "global_step": 148430, "epoch": 1788} {"train_loss": -22.618892669677734, "global_step": 148431, "epoch": 1788} {"train_loss": -23.35199546813965, "global_step": 148432, "epoch": 1788} {"train_loss": -23.144712448120117, "global_step": 148433, "epoch": 1788} {"train_loss": -23.34917449951172, "global_step": 148434, "epoch": 1788} {"train_loss": -23.438467025756836, "global_step": 148435, "epoch": 1788} {"train_loss": -23.324609756469727, "global_step": 148436, "epoch": 1788} {"train_loss": -22.96152687072754, "global_step": 148437, "epoch": 1788} {"train_loss": -23.227041244506836, "global_step": 148438, "epoch": 1788} {"train_loss": -23.087726593017578, "global_step": 148439, "epoch": 1788} {"train_loss": -23.415403366088867, "global_step": 148440, "epoch": 1788} {"train_loss": -23.369184494018555, "global_step": 148441, "epoch": 1788} {"train_loss": -22.682485580444336, "global_step": 148442, "epoch": 1788} {"train_loss": -23.410280227661133, "global_step": 148443, "epoch": 1788} {"train_loss": -23.360794067382812, "global_step": 148444, "epoch": 1788} {"train_loss": -23.235244750976562, "global_step": 148445, "epoch": 1788} {"train_loss": -23.32131576538086, "global_step": 148446, "epoch": 1788} {"train_loss": -23.256418228149414, "global_step": 148447, "epoch": 1788} {"train_loss": -23.17461585998535, "global_step": 148448, "epoch": 1788} {"train_loss": -22.988143920898438, "global_step": 148449, "epoch": 1788} {"train_loss": -23.677892684936523, "global_step": 148450, "epoch": 1788} {"train_loss": -23.2163028717041, "global_step": 148451, "epoch": 1788} {"train_loss": -23.336868286132812, "global_step": 148452, "epoch": 1788} {"train_loss": -23.5180721282959, "global_step": 148453, "epoch": 1788} {"train_loss": -23.588777542114258, "global_step": 148454, "epoch": 1788} {"train_loss": -23.213153839111328, "global_step": 148455, "epoch": 1788} {"train_loss": -23.232601165771484, "global_step": 148456, "epoch": 1788} {"train_loss": -23.38265037536621, "global_step": 148457, "epoch": 1788} {"train_loss": -23.247936248779297, "global_step": 148458, "epoch": 1788} {"train_loss": -23.42909812927246, "global_step": 148459, "epoch": 1788} {"train_loss": -22.97627830505371, "global_step": 148460, "epoch": 1788} {"train_loss": -23.052366256713867, "global_step": 148461, "epoch": 1788} {"train_loss": -23.19114875793457, "global_step": 148462, "epoch": 1788} {"train_loss": -23.20097541809082, "global_step": 148463, "epoch": 1788} {"train_loss": -22.90045166015625, "global_step": 148464, "epoch": 1788} {"train_loss": -23.291074752807617, "global_step": 148465, "epoch": 1788} {"train_loss": -23.06210708618164, "global_step": 148466, "epoch": 1788} {"train_loss": -23.167152404785156, "global_step": 148467, "epoch": 1788} {"train_loss": -23.30352210998535, "global_step": 148468, "epoch": 1788} {"train_loss": -23.2640323638916, "global_step": 148469, "epoch": 1788} {"train_loss": -22.869171142578125, "global_step": 148470, "epoch": 1788} {"train_loss": -23.241743087768555, "global_step": 148471, "epoch": 1788} {"train_loss": -22.7479190826416, "global_step": 148472, "epoch": 1788} {"train_loss": -22.995656967163086, "global_step": 148473, "epoch": 1788} {"train_loss": -23.5471134185791, "global_step": 148474, "epoch": 1788} {"train_loss": -22.775665283203125, "global_step": 148475, "epoch": 1788} {"train_loss": -23.05391502380371, "global_step": 148476, "epoch": 1788} {"train_loss": -23.055862426757812, "global_step": 148477, "epoch": 1788} {"train_loss": -23.075353622436523, "global_step": 148478, "epoch": 1788} {"train_loss": -23.154281616210938, "global_step": 148479, "epoch": 1788} {"train_loss": -22.894441604614258, "global_step": 148480, "epoch": 1788} {"train_loss": -23.522001266479492, "global_step": 148481, "epoch": 1788} {"train_loss": -23.4752140045166, "global_step": 148482, "epoch": 1788} {"train_loss": -23.391714096069336, "global_step": 148483, "epoch": 1788} {"train_loss": -23.37824058532715, "global_step": 148484, "epoch": 1788} {"train_loss": -23.171045303344727, "global_step": 148485, "epoch": 1788} {"train_loss": -23.098874471273767, "global_step": 148486, "epoch": 1788, "val_loss": 6394912.5} {"train_loss": -22.838415145874023, "global_step": 148487, "epoch": 1789} {"train_loss": -22.569013595581055, "global_step": 148488, "epoch": 1789} {"train_loss": -23.02826499938965, "global_step": 148489, "epoch": 1789} {"train_loss": -23.306623458862305, "global_step": 148490, "epoch": 1789} {"train_loss": -23.11281394958496, "global_step": 148491, "epoch": 1789} {"train_loss": -23.078948974609375, "global_step": 148492, "epoch": 1789} {"train_loss": -23.053503036499023, "global_step": 148493, "epoch": 1789} {"train_loss": -23.015274047851562, "global_step": 148494, "epoch": 1789} {"train_loss": -22.90114974975586, "global_step": 148495, "epoch": 1789} {"train_loss": -23.071165084838867, "global_step": 148496, "epoch": 1789} {"train_loss": -23.098281860351562, "global_step": 148497, "epoch": 1789} {"train_loss": -23.093374252319336, "global_step": 148498, "epoch": 1789} {"train_loss": -23.013151168823242, "global_step": 148499, "epoch": 1789} {"train_loss": -23.065628051757812, "global_step": 148500, "epoch": 1789} {"train_loss": -22.87264060974121, "global_step": 148501, "epoch": 1789} {"train_loss": -22.759052276611328, "global_step": 148502, "epoch": 1789} {"train_loss": -23.433841705322266, "global_step": 148503, "epoch": 1789} {"train_loss": -23.6105899810791, "global_step": 148504, "epoch": 1789} {"train_loss": -23.054128646850586, "global_step": 148505, "epoch": 1789} {"train_loss": -23.03544807434082, "global_step": 148506, "epoch": 1789} {"train_loss": -23.25287437438965, "global_step": 148507, "epoch": 1789} {"train_loss": -23.312686920166016, "global_step": 148508, "epoch": 1789} {"train_loss": -23.22104263305664, "global_step": 148509, "epoch": 1789} {"train_loss": -23.351835250854492, "global_step": 148510, "epoch": 1789} {"train_loss": -23.422744750976562, "global_step": 148511, "epoch": 1789} {"train_loss": -23.63030433654785, "global_step": 148512, "epoch": 1789} {"train_loss": -23.132898330688477, "global_step": 148513, "epoch": 1789} {"train_loss": -22.980100631713867, "global_step": 148514, "epoch": 1789} {"train_loss": -22.82901954650879, "global_step": 148515, "epoch": 1789} {"train_loss": -23.163997650146484, "global_step": 148516, "epoch": 1789} {"train_loss": -23.19500732421875, "global_step": 148517, "epoch": 1789} {"train_loss": -23.2946720123291, "global_step": 148518, "epoch": 1789} {"train_loss": -23.095523834228516, "global_step": 148519, "epoch": 1789} {"train_loss": -23.4372615814209, "global_step": 148520, "epoch": 1789} {"train_loss": -23.659719467163086, "global_step": 148521, "epoch": 1789} {"train_loss": -23.073514938354492, "global_step": 148522, "epoch": 1789} {"train_loss": -23.327247619628906, "global_step": 148523, "epoch": 1789} {"train_loss": -23.129364013671875, "global_step": 148524, "epoch": 1789} {"train_loss": -23.4890193939209, "global_step": 148525, "epoch": 1789} {"train_loss": -23.41193962097168, "global_step": 148526, "epoch": 1789} {"train_loss": -23.44425392150879, "global_step": 148527, "epoch": 1789} {"train_loss": -23.562015533447266, "global_step": 148528, "epoch": 1789} {"train_loss": -23.129934310913086, "global_step": 148529, "epoch": 1789} {"train_loss": -23.364137649536133, "global_step": 148530, "epoch": 1789} {"train_loss": -23.267370223999023, "global_step": 148531, "epoch": 1789} {"train_loss": -23.112064361572266, "global_step": 148532, "epoch": 1789} {"train_loss": -22.785062789916992, "global_step": 148533, "epoch": 1789} {"train_loss": -22.44556999206543, "global_step": 148534, "epoch": 1789} {"train_loss": -23.133686065673828, "global_step": 148535, "epoch": 1789} {"train_loss": -23.34052848815918, "global_step": 148536, "epoch": 1789} {"train_loss": -23.36671257019043, "global_step": 148537, "epoch": 1789} {"train_loss": -23.0050048828125, "global_step": 148538, "epoch": 1789} {"train_loss": -23.481016159057617, "global_step": 148539, "epoch": 1789} {"train_loss": -23.402103424072266, "global_step": 148540, "epoch": 1789} {"train_loss": -23.203771591186523, "global_step": 148541, "epoch": 1789} {"train_loss": -23.164226531982422, "global_step": 148542, "epoch": 1789} {"train_loss": -23.329221725463867, "global_step": 148543, "epoch": 1789} {"train_loss": -23.032567977905273, "global_step": 148544, "epoch": 1789} {"train_loss": -23.3129825592041, "global_step": 148545, "epoch": 1789} {"train_loss": -23.202741622924805, "global_step": 148546, "epoch": 1789} {"train_loss": -22.674741744995117, "global_step": 148547, "epoch": 1789} {"train_loss": -22.870750427246094, "global_step": 148548, "epoch": 1789} {"train_loss": -23.252347946166992, "global_step": 148549, "epoch": 1789} {"train_loss": -23.28960609436035, "global_step": 148550, "epoch": 1789} {"train_loss": -23.171072006225586, "global_step": 148551, "epoch": 1789} {"train_loss": -23.080753326416016, "global_step": 148552, "epoch": 1789} {"train_loss": -23.241535186767578, "global_step": 148553, "epoch": 1789} {"train_loss": -23.10489273071289, "global_step": 148554, "epoch": 1789} {"train_loss": -23.1468505859375, "global_step": 148555, "epoch": 1789} {"train_loss": -23.073495864868164, "global_step": 148556, "epoch": 1789} {"train_loss": -23.341341018676758, "global_step": 148557, "epoch": 1789} {"train_loss": -23.473634719848633, "global_step": 148558, "epoch": 1789} {"train_loss": -23.21821403503418, "global_step": 148559, "epoch": 1789} {"train_loss": -23.120725631713867, "global_step": 148560, "epoch": 1789} {"train_loss": -23.266321182250977, "global_step": 148561, "epoch": 1789} {"train_loss": -23.342100143432617, "global_step": 148562, "epoch": 1789} {"train_loss": -23.38503074645996, "global_step": 148563, "epoch": 1789} {"train_loss": -23.121034622192383, "global_step": 148564, "epoch": 1789} {"train_loss": -23.302762985229492, "global_step": 148565, "epoch": 1789} {"train_loss": -23.32769203186035, "global_step": 148566, "epoch": 1789} {"train_loss": -23.07171630859375, "global_step": 148567, "epoch": 1789} {"train_loss": -23.4234676361084, "global_step": 148568, "epoch": 1789} {"train_loss": -23.19348436378571, "global_step": 148569, "epoch": 1789, "val_loss": 6285118.0} {"train_loss": -22.706195831298828, "global_step": 148570, "epoch": 1790} {"train_loss": -23.280649185180664, "global_step": 148571, "epoch": 1790} {"train_loss": -22.839567184448242, "global_step": 148572, "epoch": 1790} {"train_loss": -22.78619384765625, "global_step": 148573, "epoch": 1790} {"train_loss": -23.09793472290039, "global_step": 148574, "epoch": 1790} {"train_loss": -22.341577529907227, "global_step": 148575, "epoch": 1790} {"train_loss": -22.76820182800293, "global_step": 148576, "epoch": 1790} {"train_loss": -22.883310317993164, "global_step": 148577, "epoch": 1790} {"train_loss": -22.637136459350586, "global_step": 148578, "epoch": 1790} {"train_loss": -22.47974395751953, "global_step": 148579, "epoch": 1790} {"train_loss": -22.519977569580078, "global_step": 148580, "epoch": 1790} {"train_loss": -22.532773971557617, "global_step": 148581, "epoch": 1790} {"train_loss": -22.966964721679688, "global_step": 148582, "epoch": 1790} {"train_loss": -22.695920944213867, "global_step": 148583, "epoch": 1790} {"train_loss": -23.140073776245117, "global_step": 148584, "epoch": 1790} {"train_loss": -23.092893600463867, "global_step": 148585, "epoch": 1790} {"train_loss": -22.90789222717285, "global_step": 148586, "epoch": 1790} {"train_loss": -22.981632232666016, "global_step": 148587, "epoch": 1790} {"train_loss": -23.205097198486328, "global_step": 148588, "epoch": 1790} {"train_loss": -23.33877944946289, "global_step": 148589, "epoch": 1790} {"train_loss": -22.787822723388672, "global_step": 148590, "epoch": 1790} {"train_loss": -22.84482192993164, "global_step": 148591, "epoch": 1790} {"train_loss": -23.106887817382812, "global_step": 148592, "epoch": 1790} {"train_loss": -23.520395278930664, "global_step": 148593, "epoch": 1790} {"train_loss": -23.35032844543457, "global_step": 148594, "epoch": 1790} {"train_loss": -23.21198081970215, "global_step": 148595, "epoch": 1790} {"train_loss": -23.024757385253906, "global_step": 148596, "epoch": 1790} {"train_loss": -23.519718170166016, "global_step": 148597, "epoch": 1790} {"train_loss": -23.356046676635742, "global_step": 148598, "epoch": 1790} {"train_loss": -23.568649291992188, "global_step": 148599, "epoch": 1790} {"train_loss": -23.230669021606445, "global_step": 148600, "epoch": 1790} {"train_loss": -23.382553100585938, "global_step": 148601, "epoch": 1790} {"train_loss": -23.10757827758789, "global_step": 148602, "epoch": 1790} {"train_loss": -23.4359188079834, "global_step": 148603, "epoch": 1790} {"train_loss": -23.49444580078125, "global_step": 148604, "epoch": 1790} {"train_loss": -23.196073532104492, "global_step": 148605, "epoch": 1790} {"train_loss": -23.183496475219727, "global_step": 148606, "epoch": 1790} {"train_loss": -23.401762008666992, "global_step": 148607, "epoch": 1790} {"train_loss": -23.412763595581055, "global_step": 148608, "epoch": 1790} {"train_loss": -23.230175018310547, "global_step": 148609, "epoch": 1790} {"train_loss": -23.291458129882812, "global_step": 148610, "epoch": 1790} {"train_loss": -22.8411922454834, "global_step": 148611, "epoch": 1790} {"train_loss": -23.1704158782959, "global_step": 148612, "epoch": 1790} {"train_loss": -23.399662017822266, "global_step": 148613, "epoch": 1790} {"train_loss": -23.321277618408203, "global_step": 148614, "epoch": 1790} {"train_loss": -23.849607467651367, "global_step": 148615, "epoch": 1790} {"train_loss": -22.96531105041504, "global_step": 148616, "epoch": 1790} {"train_loss": -23.50192642211914, "global_step": 148617, "epoch": 1790} {"train_loss": -23.345378875732422, "global_step": 148618, "epoch": 1790} {"train_loss": -23.066715240478516, "global_step": 148619, "epoch": 1790} {"train_loss": -23.334003448486328, "global_step": 148620, "epoch": 1790} {"train_loss": -23.081090927124023, "global_step": 148621, "epoch": 1790} {"train_loss": -23.199951171875, "global_step": 148622, "epoch": 1790} {"train_loss": -23.49759864807129, "global_step": 148623, "epoch": 1790} {"train_loss": -23.341848373413086, "global_step": 148624, "epoch": 1790} {"train_loss": -23.25947380065918, "global_step": 148625, "epoch": 1790} {"train_loss": -23.41661262512207, "global_step": 148626, "epoch": 1790} {"train_loss": -23.05796241760254, "global_step": 148627, "epoch": 1790} {"train_loss": -23.29416275024414, "global_step": 148628, "epoch": 1790} {"train_loss": -23.46966552734375, "global_step": 148629, "epoch": 1790} {"train_loss": -23.228063583374023, "global_step": 148630, "epoch": 1790} {"train_loss": -23.4709529876709, "global_step": 148631, "epoch": 1790} {"train_loss": -23.08449363708496, "global_step": 148632, "epoch": 1790} {"train_loss": -23.113121032714844, "global_step": 148633, "epoch": 1790} {"train_loss": -23.18104362487793, "global_step": 148634, "epoch": 1790} {"train_loss": -23.263338088989258, "global_step": 148635, "epoch": 1790} {"train_loss": -23.2492618560791, "global_step": 148636, "epoch": 1790} {"train_loss": -23.420673370361328, "global_step": 148637, "epoch": 1790} {"train_loss": -23.13604736328125, "global_step": 148638, "epoch": 1790} {"train_loss": -23.073408126831055, "global_step": 148639, "epoch": 1790} {"train_loss": -23.10025978088379, "global_step": 148640, "epoch": 1790} {"train_loss": -23.50013542175293, "global_step": 148641, "epoch": 1790} {"train_loss": -23.425140380859375, "global_step": 148642, "epoch": 1790} {"train_loss": -23.171573638916016, "global_step": 148643, "epoch": 1790} {"train_loss": -23.519193649291992, "global_step": 148644, "epoch": 1790} {"train_loss": -22.773208618164062, "global_step": 148645, "epoch": 1790} {"train_loss": -23.418010711669922, "global_step": 148646, "epoch": 1790} {"train_loss": -23.057146072387695, "global_step": 148647, "epoch": 1790} {"train_loss": -23.55398941040039, "global_step": 148648, "epoch": 1790} {"train_loss": -23.227195739746094, "global_step": 148649, "epoch": 1790} {"train_loss": -23.42484474182129, "global_step": 148650, "epoch": 1790} {"train_loss": -22.970500946044922, "global_step": 148651, "epoch": 1790} {"train_loss": -23.1648573817977, "global_step": 148652, "epoch": 1790, "val_loss": 6570508.0} {"train_loss": -21.52750015258789, "global_step": 148653, "epoch": 1791} {"train_loss": -19.715181350708008, "global_step": 148654, "epoch": 1791} {"train_loss": -22.0726318359375, "global_step": 148655, "epoch": 1791} {"train_loss": -21.545413970947266, "global_step": 148656, "epoch": 1791} {"train_loss": -21.297164916992188, "global_step": 148657, "epoch": 1791} {"train_loss": -21.927806854248047, "global_step": 148658, "epoch": 1791} {"train_loss": -21.441160202026367, "global_step": 148659, "epoch": 1791} {"train_loss": -21.91999053955078, "global_step": 148660, "epoch": 1791} {"train_loss": -22.15179443359375, "global_step": 148661, "epoch": 1791} {"train_loss": -22.1042537689209, "global_step": 148662, "epoch": 1791} {"train_loss": -22.087209701538086, "global_step": 148663, "epoch": 1791} {"train_loss": -21.980504989624023, "global_step": 148664, "epoch": 1791} {"train_loss": -22.422609329223633, "global_step": 148665, "epoch": 1791} {"train_loss": -22.34468650817871, "global_step": 148666, "epoch": 1791} {"train_loss": -22.509939193725586, "global_step": 148667, "epoch": 1791} {"train_loss": -22.45466423034668, "global_step": 148668, "epoch": 1791} {"train_loss": -22.584888458251953, "global_step": 148669, "epoch": 1791} {"train_loss": -22.624282836914062, "global_step": 148670, "epoch": 1791} {"train_loss": -22.650800704956055, "global_step": 148671, "epoch": 1791} {"train_loss": -22.59076499938965, "global_step": 148672, "epoch": 1791} {"train_loss": -22.735992431640625, "global_step": 148673, "epoch": 1791} {"train_loss": -22.654516220092773, "global_step": 148674, "epoch": 1791} {"train_loss": -22.75819969177246, "global_step": 148675, "epoch": 1791} {"train_loss": -22.98908042907715, "global_step": 148676, "epoch": 1791} {"train_loss": -22.71693992614746, "global_step": 148677, "epoch": 1791} {"train_loss": -22.842512130737305, "global_step": 148678, "epoch": 1791} {"train_loss": -22.76997184753418, "global_step": 148679, "epoch": 1791} {"train_loss": -22.711069107055664, "global_step": 148680, "epoch": 1791} {"train_loss": -22.988313674926758, "global_step": 148681, "epoch": 1791} {"train_loss": -23.290924072265625, "global_step": 148682, "epoch": 1791} {"train_loss": -23.04892349243164, "global_step": 148683, "epoch": 1791} {"train_loss": -22.881452560424805, "global_step": 148684, "epoch": 1791} {"train_loss": -22.920557022094727, "global_step": 148685, "epoch": 1791} {"train_loss": -23.055505752563477, "global_step": 148686, "epoch": 1791} {"train_loss": -22.70404624938965, "global_step": 148687, "epoch": 1791} {"train_loss": -23.28644371032715, "global_step": 148688, "epoch": 1791} {"train_loss": -22.86020851135254, "global_step": 148689, "epoch": 1791} {"train_loss": -23.350120544433594, "global_step": 148690, "epoch": 1791} {"train_loss": -23.42201042175293, "global_step": 148691, "epoch": 1791} {"train_loss": -23.41578483581543, "global_step": 148692, "epoch": 1791} {"train_loss": -23.16701316833496, "global_step": 148693, "epoch": 1791} {"train_loss": -23.071887969970703, "global_step": 148694, "epoch": 1791} {"train_loss": -23.3719539642334, "global_step": 148695, "epoch": 1791} {"train_loss": -23.14688491821289, "global_step": 148696, "epoch": 1791} {"train_loss": -23.108259201049805, "global_step": 148697, "epoch": 1791} {"train_loss": -23.44936752319336, "global_step": 148698, "epoch": 1791} {"train_loss": -23.176671981811523, "global_step": 148699, "epoch": 1791} {"train_loss": -23.039386749267578, "global_step": 148700, "epoch": 1791} {"train_loss": -23.19236183166504, "global_step": 148701, "epoch": 1791} {"train_loss": -23.080242156982422, "global_step": 148702, "epoch": 1791} {"train_loss": -22.84522819519043, "global_step": 148703, "epoch": 1791} {"train_loss": -23.5548152923584, "global_step": 148704, "epoch": 1791} {"train_loss": -23.558364868164062, "global_step": 148705, "epoch": 1791} {"train_loss": -23.164159774780273, "global_step": 148706, "epoch": 1791} {"train_loss": -23.245697021484375, "global_step": 148707, "epoch": 1791} {"train_loss": -23.14205551147461, "global_step": 148708, "epoch": 1791} {"train_loss": -23.638517379760742, "global_step": 148709, "epoch": 1791} {"train_loss": -23.543933868408203, "global_step": 148710, "epoch": 1791} {"train_loss": -23.214141845703125, "global_step": 148711, "epoch": 1791} {"train_loss": -23.061782836914062, "global_step": 148712, "epoch": 1791} {"train_loss": -23.043787002563477, "global_step": 148713, "epoch": 1791} {"train_loss": -23.20330238342285, "global_step": 148714, "epoch": 1791} {"train_loss": -23.03120231628418, "global_step": 148715, "epoch": 1791} {"train_loss": -23.50189971923828, "global_step": 148716, "epoch": 1791} {"train_loss": -23.20015525817871, "global_step": 148717, "epoch": 1791} {"train_loss": -23.485044479370117, "global_step": 148718, "epoch": 1791} {"train_loss": -23.41986656188965, "global_step": 148719, "epoch": 1791} {"train_loss": -22.938297271728516, "global_step": 148720, "epoch": 1791} {"train_loss": -23.144460678100586, "global_step": 148721, "epoch": 1791} {"train_loss": -23.32649040222168, "global_step": 148722, "epoch": 1791} {"train_loss": -23.10169792175293, "global_step": 148723, "epoch": 1791} {"train_loss": -23.121503829956055, "global_step": 148724, "epoch": 1791} {"train_loss": -23.128625869750977, "global_step": 148725, "epoch": 1791} {"train_loss": -23.142927169799805, "global_step": 148726, "epoch": 1791} {"train_loss": -23.092260360717773, "global_step": 148727, "epoch": 1791} {"train_loss": -23.620166778564453, "global_step": 148728, "epoch": 1791} {"train_loss": -23.5380802154541, "global_step": 148729, "epoch": 1791} {"train_loss": -23.25545883178711, "global_step": 148730, "epoch": 1791} {"train_loss": -23.25699806213379, "global_step": 148731, "epoch": 1791} {"train_loss": -23.152414321899414, "global_step": 148732, "epoch": 1791} {"train_loss": -23.190488815307617, "global_step": 148733, "epoch": 1791} {"train_loss": -23.1362361907959, "global_step": 148734, "epoch": 1791} {"train_loss": -22.876108284456183, "global_step": 148735, "epoch": 1791, "val_loss": 6291460.5} {"train_loss": -23.40378189086914, "global_step": 148736, "epoch": 1792} {"train_loss": -23.413043975830078, "global_step": 148737, "epoch": 1792} {"train_loss": -22.89291763305664, "global_step": 148738, "epoch": 1792} {"train_loss": -23.123889923095703, "global_step": 148739, "epoch": 1792} {"train_loss": -23.020065307617188, "global_step": 148740, "epoch": 1792} {"train_loss": -23.202993392944336, "global_step": 148741, "epoch": 1792} {"train_loss": -22.95073890686035, "global_step": 148742, "epoch": 1792} {"train_loss": -23.208084106445312, "global_step": 148743, "epoch": 1792} {"train_loss": -23.185819625854492, "global_step": 148744, "epoch": 1792} {"train_loss": -23.00446128845215, "global_step": 148745, "epoch": 1792} {"train_loss": -23.048185348510742, "global_step": 148746, "epoch": 1792} {"train_loss": -22.960128784179688, "global_step": 148747, "epoch": 1792} {"train_loss": -23.098268508911133, "global_step": 148748, "epoch": 1792} {"train_loss": -22.654870986938477, "global_step": 148749, "epoch": 1792} {"train_loss": -22.693927764892578, "global_step": 148750, "epoch": 1792} {"train_loss": -23.517507553100586, "global_step": 148751, "epoch": 1792} {"train_loss": -22.727079391479492, "global_step": 148752, "epoch": 1792} {"train_loss": -23.504404067993164, "global_step": 148753, "epoch": 1792} {"train_loss": -23.376279830932617, "global_step": 148754, "epoch": 1792} {"train_loss": -22.968618392944336, "global_step": 148755, "epoch": 1792} {"train_loss": -23.131845474243164, "global_step": 148756, "epoch": 1792} {"train_loss": -22.95355987548828, "global_step": 148757, "epoch": 1792} {"train_loss": -23.372434616088867, "global_step": 148758, "epoch": 1792} {"train_loss": -23.313072204589844, "global_step": 148759, "epoch": 1792} {"train_loss": -22.743820190429688, "global_step": 148760, "epoch": 1792} {"train_loss": -22.977956771850586, "global_step": 148761, "epoch": 1792} {"train_loss": -22.98518943786621, "global_step": 148762, "epoch": 1792} {"train_loss": -23.567100524902344, "global_step": 148763, "epoch": 1792} {"train_loss": -23.278663635253906, "global_step": 148764, "epoch": 1792} {"train_loss": -23.187597274780273, "global_step": 148765, "epoch": 1792} {"train_loss": -23.38795280456543, "global_step": 148766, "epoch": 1792} {"train_loss": -23.05681610107422, "global_step": 148767, "epoch": 1792} {"train_loss": -23.4655704498291, "global_step": 148768, "epoch": 1792} {"train_loss": -23.309947967529297, "global_step": 148769, "epoch": 1792} {"train_loss": -23.415739059448242, "global_step": 148770, "epoch": 1792} {"train_loss": -22.978368759155273, "global_step": 148771, "epoch": 1792} {"train_loss": -23.1758975982666, "global_step": 148772, "epoch": 1792} {"train_loss": -23.173664093017578, "global_step": 148773, "epoch": 1792} {"train_loss": -23.610107421875, "global_step": 148774, "epoch": 1792} {"train_loss": -22.99286651611328, "global_step": 148775, "epoch": 1792} {"train_loss": -23.048215866088867, "global_step": 148776, "epoch": 1792} {"train_loss": -23.410070419311523, "global_step": 148777, "epoch": 1792} {"train_loss": -23.418621063232422, "global_step": 148778, "epoch": 1792} {"train_loss": -23.284992218017578, "global_step": 148779, "epoch": 1792} {"train_loss": -23.145099639892578, "global_step": 148780, "epoch": 1792} {"train_loss": -23.110843658447266, "global_step": 148781, "epoch": 1792} {"train_loss": -23.181901931762695, "global_step": 148782, "epoch": 1792} {"train_loss": -23.581167221069336, "global_step": 148783, "epoch": 1792} {"train_loss": -23.32844352722168, "global_step": 148784, "epoch": 1792} {"train_loss": -23.118268966674805, "global_step": 148785, "epoch": 1792} {"train_loss": -23.344114303588867, "global_step": 148786, "epoch": 1792} {"train_loss": -23.4492244720459, "global_step": 148787, "epoch": 1792} {"train_loss": -22.956501007080078, "global_step": 148788, "epoch": 1792} {"train_loss": -23.481098175048828, "global_step": 148789, "epoch": 1792} {"train_loss": -23.20998191833496, "global_step": 148790, "epoch": 1792} {"train_loss": -23.271013259887695, "global_step": 148791, "epoch": 1792} {"train_loss": -23.48187255859375, "global_step": 148792, "epoch": 1792} {"train_loss": -23.148427963256836, "global_step": 148793, "epoch": 1792} {"train_loss": -22.717504501342773, "global_step": 148794, "epoch": 1792} {"train_loss": -23.672683715820312, "global_step": 148795, "epoch": 1792} {"train_loss": -23.133880615234375, "global_step": 148796, "epoch": 1792} {"train_loss": -23.079994201660156, "global_step": 148797, "epoch": 1792} {"train_loss": -23.037240982055664, "global_step": 148798, "epoch": 1792} {"train_loss": -24.061542510986328, "global_step": 148799, "epoch": 1792} {"train_loss": -23.227556228637695, "global_step": 148800, "epoch": 1792} {"train_loss": -23.362943649291992, "global_step": 148801, "epoch": 1792} {"train_loss": -23.45722770690918, "global_step": 148802, "epoch": 1792} {"train_loss": -23.071821212768555, "global_step": 148803, "epoch": 1792} {"train_loss": -23.347213745117188, "global_step": 148804, "epoch": 1792} {"train_loss": -23.21221351623535, "global_step": 148805, "epoch": 1792} {"train_loss": -22.992950439453125, "global_step": 148806, "epoch": 1792} {"train_loss": -23.321062088012695, "global_step": 148807, "epoch": 1792} {"train_loss": -23.419734954833984, "global_step": 148808, "epoch": 1792} {"train_loss": -23.0025634765625, "global_step": 148809, "epoch": 1792} {"train_loss": -23.03116226196289, "global_step": 148810, "epoch": 1792} {"train_loss": -23.45905876159668, "global_step": 148811, "epoch": 1792} {"train_loss": -23.321786880493164, "global_step": 148812, "epoch": 1792} {"train_loss": -23.1700382232666, "global_step": 148813, "epoch": 1792} {"train_loss": -23.185104370117188, "global_step": 148814, "epoch": 1792} {"train_loss": -23.117332458496094, "global_step": 148815, "epoch": 1792} {"train_loss": -23.308731079101562, "global_step": 148816, "epoch": 1792} {"train_loss": -23.47768211364746, "global_step": 148817, "epoch": 1792} {"train_loss": -23.211532707673957, "global_step": 148818, "epoch": 1792, "val_loss": 6428194.0} {"train_loss": -23.24741554260254, "global_step": 148819, "epoch": 1793} {"train_loss": -23.13561248779297, "global_step": 148820, "epoch": 1793} {"train_loss": -23.264455795288086, "global_step": 148821, "epoch": 1793} {"train_loss": -23.193830490112305, "global_step": 148822, "epoch": 1793} {"train_loss": -23.15803337097168, "global_step": 148823, "epoch": 1793} {"train_loss": -22.703901290893555, "global_step": 148824, "epoch": 1793} {"train_loss": -22.99945068359375, "global_step": 148825, "epoch": 1793} {"train_loss": -22.868732452392578, "global_step": 148826, "epoch": 1793} {"train_loss": -23.054243087768555, "global_step": 148827, "epoch": 1793} {"train_loss": -23.283191680908203, "global_step": 148828, "epoch": 1793} {"train_loss": -22.567317962646484, "global_step": 148829, "epoch": 1793} {"train_loss": -23.116666793823242, "global_step": 148830, "epoch": 1793} {"train_loss": -23.01412010192871, "global_step": 148831, "epoch": 1793} {"train_loss": -23.393747329711914, "global_step": 148832, "epoch": 1793} {"train_loss": -23.218732833862305, "global_step": 148833, "epoch": 1793} {"train_loss": -23.629743576049805, "global_step": 148834, "epoch": 1793} {"train_loss": -23.357938766479492, "global_step": 148835, "epoch": 1793} {"train_loss": -23.41672134399414, "global_step": 148836, "epoch": 1793} {"train_loss": -23.20253562927246, "global_step": 148837, "epoch": 1793} {"train_loss": -23.118345260620117, "global_step": 148838, "epoch": 1793} {"train_loss": -23.260948181152344, "global_step": 148839, "epoch": 1793} {"train_loss": -23.092756271362305, "global_step": 148840, "epoch": 1793} {"train_loss": -23.531936645507812, "global_step": 148841, "epoch": 1793} {"train_loss": -23.420425415039062, "global_step": 148842, "epoch": 1793} {"train_loss": -23.704763412475586, "global_step": 148843, "epoch": 1793} {"train_loss": -23.21553611755371, "global_step": 148844, "epoch": 1793} {"train_loss": -23.417787551879883, "global_step": 148845, "epoch": 1793} {"train_loss": -23.36526107788086, "global_step": 148846, "epoch": 1793} {"train_loss": -22.9476261138916, "global_step": 148847, "epoch": 1793} {"train_loss": -23.702680587768555, "global_step": 148848, "epoch": 1793} {"train_loss": -23.532367706298828, "global_step": 148849, "epoch": 1793} {"train_loss": -23.677688598632812, "global_step": 148850, "epoch": 1793} {"train_loss": -23.646512985229492, "global_step": 148851, "epoch": 1793} {"train_loss": -23.469106674194336, "global_step": 148852, "epoch": 1793} {"train_loss": -23.152286529541016, "global_step": 148853, "epoch": 1793} {"train_loss": -22.806556701660156, "global_step": 148854, "epoch": 1793} {"train_loss": -23.17719078063965, "global_step": 148855, "epoch": 1793} {"train_loss": -23.232707977294922, "global_step": 148856, "epoch": 1793} {"train_loss": -23.06281089782715, "global_step": 148857, "epoch": 1793} {"train_loss": -23.176122665405273, "global_step": 148858, "epoch": 1793} {"train_loss": -22.90504264831543, "global_step": 148859, "epoch": 1793} {"train_loss": -22.908620834350586, "global_step": 148860, "epoch": 1793} {"train_loss": -22.824249267578125, "global_step": 148861, "epoch": 1793} {"train_loss": -23.1603946685791, "global_step": 148862, "epoch": 1793} {"train_loss": -23.228870391845703, "global_step": 148863, "epoch": 1793} {"train_loss": -23.356931686401367, "global_step": 148864, "epoch": 1793} {"train_loss": -23.37613296508789, "global_step": 148865, "epoch": 1793} {"train_loss": -23.452239990234375, "global_step": 148866, "epoch": 1793} {"train_loss": -23.349273681640625, "global_step": 148867, "epoch": 1793} {"train_loss": -23.524728775024414, "global_step": 148868, "epoch": 1793} {"train_loss": -23.08075523376465, "global_step": 148869, "epoch": 1793} {"train_loss": -23.606489181518555, "global_step": 148870, "epoch": 1793} {"train_loss": -23.386566162109375, "global_step": 148871, "epoch": 1793} {"train_loss": -23.124008178710938, "global_step": 148872, "epoch": 1793} {"train_loss": -23.186922073364258, "global_step": 148873, "epoch": 1793} {"train_loss": -23.549488067626953, "global_step": 148874, "epoch": 1793} {"train_loss": -23.205089569091797, "global_step": 148875, "epoch": 1793} {"train_loss": -23.077438354492188, "global_step": 148876, "epoch": 1793} {"train_loss": -23.379730224609375, "global_step": 148877, "epoch": 1793} {"train_loss": -23.021238327026367, "global_step": 148878, "epoch": 1793} {"train_loss": -23.32912826538086, "global_step": 148879, "epoch": 1793} {"train_loss": -22.99628257751465, "global_step": 148880, "epoch": 1793} {"train_loss": -23.399755477905273, "global_step": 148881, "epoch": 1793} {"train_loss": -23.32490348815918, "global_step": 148882, "epoch": 1793} {"train_loss": -23.3605899810791, "global_step": 148883, "epoch": 1793} {"train_loss": -23.323179244995117, "global_step": 148884, "epoch": 1793} {"train_loss": -23.359634399414062, "global_step": 148885, "epoch": 1793} {"train_loss": -23.14412498474121, "global_step": 148886, "epoch": 1793} {"train_loss": -23.025192260742188, "global_step": 148887, "epoch": 1793} {"train_loss": -23.363521575927734, "global_step": 148888, "epoch": 1793} {"train_loss": -23.254283905029297, "global_step": 148889, "epoch": 1793} {"train_loss": -23.473318099975586, "global_step": 148890, "epoch": 1793} {"train_loss": -23.35013771057129, "global_step": 148891, "epoch": 1793} {"train_loss": -23.523944854736328, "global_step": 148892, "epoch": 1793} {"train_loss": -23.06119728088379, "global_step": 148893, "epoch": 1793} {"train_loss": -23.228116989135742, "global_step": 148894, "epoch": 1793} {"train_loss": -23.48569679260254, "global_step": 148895, "epoch": 1793} {"train_loss": -23.09126091003418, "global_step": 148896, "epoch": 1793} {"train_loss": -23.198158264160156, "global_step": 148897, "epoch": 1793} {"train_loss": -23.112590789794922, "global_step": 148898, "epoch": 1793} {"train_loss": -23.286771774291992, "global_step": 148899, "epoch": 1793} {"train_loss": -23.405807495117188, "global_step": 148900, "epoch": 1793} {"train_loss": -23.23905928738146, "global_step": 148901, "epoch": 1793, "val_loss": 6298693.0} {"train_loss": -22.790884017944336, "global_step": 148902, "epoch": 1794} {"train_loss": -22.99384880065918, "global_step": 148903, "epoch": 1794} {"train_loss": -22.668622970581055, "global_step": 148904, "epoch": 1794} {"train_loss": -23.08380699157715, "global_step": 148905, "epoch": 1794} {"train_loss": -23.05519676208496, "global_step": 148906, "epoch": 1794} {"train_loss": -22.78072738647461, "global_step": 148907, "epoch": 1794} {"train_loss": -23.279850006103516, "global_step": 148908, "epoch": 1794} {"train_loss": -22.723865509033203, "global_step": 148909, "epoch": 1794} {"train_loss": -23.240985870361328, "global_step": 148910, "epoch": 1794} {"train_loss": -22.938377380371094, "global_step": 148911, "epoch": 1794} {"train_loss": -23.505023956298828, "global_step": 148912, "epoch": 1794} {"train_loss": -23.189453125, "global_step": 148913, "epoch": 1794} {"train_loss": -22.632726669311523, "global_step": 148914, "epoch": 1794} {"train_loss": -23.156286239624023, "global_step": 148915, "epoch": 1794} {"train_loss": -23.205947875976562, "global_step": 148916, "epoch": 1794} {"train_loss": -23.257617950439453, "global_step": 148917, "epoch": 1794} {"train_loss": -23.078981399536133, "global_step": 148918, "epoch": 1794} {"train_loss": -23.151226043701172, "global_step": 148919, "epoch": 1794} {"train_loss": -23.40949058532715, "global_step": 148920, "epoch": 1794} {"train_loss": -23.32596778869629, "global_step": 148921, "epoch": 1794} {"train_loss": -23.0455379486084, "global_step": 148922, "epoch": 1794} {"train_loss": -23.225065231323242, "global_step": 148923, "epoch": 1794} {"train_loss": -23.168216705322266, "global_step": 148924, "epoch": 1794} {"train_loss": -23.14827537536621, "global_step": 148925, "epoch": 1794} {"train_loss": -23.217477798461914, "global_step": 148926, "epoch": 1794} {"train_loss": -23.37285804748535, "global_step": 148927, "epoch": 1794} {"train_loss": -23.247339248657227, "global_step": 148928, "epoch": 1794} {"train_loss": -23.22183609008789, "global_step": 148929, "epoch": 1794} {"train_loss": -23.3028507232666, "global_step": 148930, "epoch": 1794} {"train_loss": -23.272663116455078, "global_step": 148931, "epoch": 1794} {"train_loss": -23.10731315612793, "global_step": 148932, "epoch": 1794} {"train_loss": -23.455204010009766, "global_step": 148933, "epoch": 1794} {"train_loss": -23.318653106689453, "global_step": 148934, "epoch": 1794} {"train_loss": -23.223936080932617, "global_step": 148935, "epoch": 1794} {"train_loss": -23.351058959960938, "global_step": 148936, "epoch": 1794} {"train_loss": -23.008909225463867, "global_step": 148937, "epoch": 1794} {"train_loss": -23.086761474609375, "global_step": 148938, "epoch": 1794} {"train_loss": -23.5155086517334, "global_step": 148939, "epoch": 1794} {"train_loss": -23.097034454345703, "global_step": 148940, "epoch": 1794} {"train_loss": -23.5242919921875, "global_step": 148941, "epoch": 1794} {"train_loss": -23.355701446533203, "global_step": 148942, "epoch": 1794} {"train_loss": -23.12980842590332, "global_step": 148943, "epoch": 1794} {"train_loss": -23.218717575073242, "global_step": 148944, "epoch": 1794} {"train_loss": -23.373167037963867, "global_step": 148945, "epoch": 1794} {"train_loss": -23.13333511352539, "global_step": 148946, "epoch": 1794} {"train_loss": -22.893033981323242, "global_step": 148947, "epoch": 1794} {"train_loss": -23.35352897644043, "global_step": 148948, "epoch": 1794} {"train_loss": -23.2269229888916, "global_step": 148949, "epoch": 1794} {"train_loss": -23.549652099609375, "global_step": 148950, "epoch": 1794} {"train_loss": -23.443660736083984, "global_step": 148951, "epoch": 1794} {"train_loss": -23.586122512817383, "global_step": 148952, "epoch": 1794} {"train_loss": -22.977161407470703, "global_step": 148953, "epoch": 1794} {"train_loss": -23.13373374938965, "global_step": 148954, "epoch": 1794} {"train_loss": -23.052907943725586, "global_step": 148955, "epoch": 1794} {"train_loss": -23.262907028198242, "global_step": 148956, "epoch": 1794} {"train_loss": -23.194377899169922, "global_step": 148957, "epoch": 1794} {"train_loss": -23.39363670349121, "global_step": 148958, "epoch": 1794} {"train_loss": -23.35509490966797, "global_step": 148959, "epoch": 1794} {"train_loss": -23.50373077392578, "global_step": 148960, "epoch": 1794} {"train_loss": -23.306684494018555, "global_step": 148961, "epoch": 1794} {"train_loss": -23.308441162109375, "global_step": 148962, "epoch": 1794} {"train_loss": -23.499645233154297, "global_step": 148963, "epoch": 1794} {"train_loss": -23.61006736755371, "global_step": 148964, "epoch": 1794} {"train_loss": -23.015092849731445, "global_step": 148965, "epoch": 1794} {"train_loss": -23.058801651000977, "global_step": 148966, "epoch": 1794} {"train_loss": -23.22479820251465, "global_step": 148967, "epoch": 1794} {"train_loss": -23.60986328125, "global_step": 148968, "epoch": 1794} {"train_loss": -23.67258644104004, "global_step": 148969, "epoch": 1794} {"train_loss": -23.333677291870117, "global_step": 148970, "epoch": 1794} {"train_loss": -23.48172378540039, "global_step": 148971, "epoch": 1794} {"train_loss": -23.641422271728516, "global_step": 148972, "epoch": 1794} {"train_loss": -22.984725952148438, "global_step": 148973, "epoch": 1794} {"train_loss": -22.85666847229004, "global_step": 148974, "epoch": 1794} {"train_loss": -23.074012756347656, "global_step": 148975, "epoch": 1794} {"train_loss": -23.369108200073242, "global_step": 148976, "epoch": 1794} {"train_loss": -23.091495513916016, "global_step": 148977, "epoch": 1794} {"train_loss": -23.110605239868164, "global_step": 148978, "epoch": 1794} {"train_loss": -23.09980583190918, "global_step": 148979, "epoch": 1794} {"train_loss": -23.126220703125, "global_step": 148980, "epoch": 1794} {"train_loss": -23.617334365844727, "global_step": 148981, "epoch": 1794} {"train_loss": -23.126977920532227, "global_step": 148982, "epoch": 1794} {"train_loss": -23.513111114501953, "global_step": 148983, "epoch": 1794} {"train_loss": -23.24865584775626, "global_step": 148984, "epoch": 1794, "val_loss": 6335903.0} {"train_loss": -23.06851577758789, "global_step": 148985, "epoch": 1795} {"train_loss": -22.79620361328125, "global_step": 148986, "epoch": 1795} {"train_loss": -22.975332260131836, "global_step": 148987, "epoch": 1795} {"train_loss": -22.83757209777832, "global_step": 148988, "epoch": 1795} {"train_loss": -22.745534896850586, "global_step": 148989, "epoch": 1795} {"train_loss": -23.39021110534668, "global_step": 148990, "epoch": 1795} {"train_loss": -22.987873077392578, "global_step": 148991, "epoch": 1795} {"train_loss": -23.25050163269043, "global_step": 148992, "epoch": 1795} {"train_loss": -23.148706436157227, "global_step": 148993, "epoch": 1795} {"train_loss": -22.957277297973633, "global_step": 148994, "epoch": 1795} {"train_loss": -22.977752685546875, "global_step": 148995, "epoch": 1795} {"train_loss": -23.0980167388916, "global_step": 148996, "epoch": 1795} {"train_loss": -23.286020278930664, "global_step": 148997, "epoch": 1795} {"train_loss": -23.298311233520508, "global_step": 148998, "epoch": 1795} {"train_loss": -22.510343551635742, "global_step": 148999, "epoch": 1795} {"train_loss": -22.769636154174805, "global_step": 149000, "epoch": 1795} {"train_loss": -23.01226806640625, "global_step": 149001, "epoch": 1795} {"train_loss": -22.96538734436035, "global_step": 149002, "epoch": 1795} {"train_loss": -23.04413604736328, "global_step": 149003, "epoch": 1795} {"train_loss": -23.357975006103516, "global_step": 149004, "epoch": 1795} {"train_loss": -23.446985244750977, "global_step": 149005, "epoch": 1795} {"train_loss": -22.789934158325195, "global_step": 149006, "epoch": 1795} {"train_loss": -23.049942016601562, "global_step": 149007, "epoch": 1795} {"train_loss": -22.920921325683594, "global_step": 149008, "epoch": 1795} {"train_loss": -23.104522705078125, "global_step": 149009, "epoch": 1795} {"train_loss": -23.1418399810791, "global_step": 149010, "epoch": 1795} {"train_loss": -23.196313858032227, "global_step": 149011, "epoch": 1795} {"train_loss": -23.09211540222168, "global_step": 149012, "epoch": 1795} {"train_loss": -23.271780014038086, "global_step": 149013, "epoch": 1795} {"train_loss": -23.37510108947754, "global_step": 149014, "epoch": 1795} {"train_loss": -23.176816940307617, "global_step": 149015, "epoch": 1795} {"train_loss": -23.047409057617188, "global_step": 149016, "epoch": 1795} {"train_loss": -23.248964309692383, "global_step": 149017, "epoch": 1795} {"train_loss": -23.2711181640625, "global_step": 149018, "epoch": 1795} {"train_loss": -23.080427169799805, "global_step": 149019, "epoch": 1795} {"train_loss": -23.39723014831543, "global_step": 149020, "epoch": 1795} {"train_loss": -23.33447265625, "global_step": 149021, "epoch": 1795} {"train_loss": -23.24036979675293, "global_step": 149022, "epoch": 1795} {"train_loss": -23.304672241210938, "global_step": 149023, "epoch": 1795} {"train_loss": -23.308815002441406, "global_step": 149024, "epoch": 1795} {"train_loss": -23.200973510742188, "global_step": 149025, "epoch": 1795} {"train_loss": -23.449674606323242, "global_step": 149026, "epoch": 1795} {"train_loss": -23.424646377563477, "global_step": 149027, "epoch": 1795} {"train_loss": -23.609058380126953, "global_step": 149028, "epoch": 1795} {"train_loss": -23.40115737915039, "global_step": 149029, "epoch": 1795} {"train_loss": -23.546743392944336, "global_step": 149030, "epoch": 1795} {"train_loss": -23.19314956665039, "global_step": 149031, "epoch": 1795} {"train_loss": -23.17580223083496, "global_step": 149032, "epoch": 1795} {"train_loss": -23.310237884521484, "global_step": 149033, "epoch": 1795} {"train_loss": -23.529815673828125, "global_step": 149034, "epoch": 1795} {"train_loss": -23.468564987182617, "global_step": 149035, "epoch": 1795} {"train_loss": -23.239749908447266, "global_step": 149036, "epoch": 1795} {"train_loss": -23.348453521728516, "global_step": 149037, "epoch": 1795} {"train_loss": -23.34181022644043, "global_step": 149038, "epoch": 1795} {"train_loss": -23.435216903686523, "global_step": 149039, "epoch": 1795} {"train_loss": -22.88300132751465, "global_step": 149040, "epoch": 1795} {"train_loss": -23.334747314453125, "global_step": 149041, "epoch": 1795} {"train_loss": -22.94342613220215, "global_step": 149042, "epoch": 1795} {"train_loss": -23.23822021484375, "global_step": 149043, "epoch": 1795} {"train_loss": -23.490741729736328, "global_step": 149044, "epoch": 1795} {"train_loss": -23.5189208984375, "global_step": 149045, "epoch": 1795} {"train_loss": -23.24782371520996, "global_step": 149046, "epoch": 1795} {"train_loss": -23.20777702331543, "global_step": 149047, "epoch": 1795} {"train_loss": -23.255529403686523, "global_step": 149048, "epoch": 1795} {"train_loss": -22.95651626586914, "global_step": 149049, "epoch": 1795} {"train_loss": -22.972557067871094, "global_step": 149050, "epoch": 1795} {"train_loss": -23.617673873901367, "global_step": 149051, "epoch": 1795} {"train_loss": -23.38343620300293, "global_step": 149052, "epoch": 1795} {"train_loss": -22.829015731811523, "global_step": 149053, "epoch": 1795} {"train_loss": -23.477628707885742, "global_step": 149054, "epoch": 1795} {"train_loss": -22.896753311157227, "global_step": 149055, "epoch": 1795} {"train_loss": -23.213228225708008, "global_step": 149056, "epoch": 1795} {"train_loss": -23.155500411987305, "global_step": 149057, "epoch": 1795} {"train_loss": -23.161256790161133, "global_step": 149058, "epoch": 1795} {"train_loss": -23.069795608520508, "global_step": 149059, "epoch": 1795} {"train_loss": -23.251981735229492, "global_step": 149060, "epoch": 1795} {"train_loss": -23.296476364135742, "global_step": 149061, "epoch": 1795} {"train_loss": -23.264755249023438, "global_step": 149062, "epoch": 1795} {"train_loss": -23.2373046875, "global_step": 149063, "epoch": 1795} {"train_loss": -23.352109909057617, "global_step": 149064, "epoch": 1795} {"train_loss": -23.53255844116211, "global_step": 149065, "epoch": 1795} {"train_loss": -22.983495712280273, "global_step": 149066, "epoch": 1795} {"train_loss": -23.176264797348573, "global_step": 149067, "epoch": 1795, "val_loss": 6376715.0} {"train_loss": -23.21839141845703, "global_step": 149068, "epoch": 1796} {"train_loss": -22.643991470336914, "global_step": 149069, "epoch": 1796} {"train_loss": -22.113239288330078, "global_step": 149070, "epoch": 1796} {"train_loss": -22.784229278564453, "global_step": 149071, "epoch": 1796} {"train_loss": -22.377092361450195, "global_step": 149072, "epoch": 1796} {"train_loss": -22.942873001098633, "global_step": 149073, "epoch": 1796} {"train_loss": -22.736209869384766, "global_step": 149074, "epoch": 1796} {"train_loss": -22.84868812561035, "global_step": 149075, "epoch": 1796} {"train_loss": -23.083057403564453, "global_step": 149076, "epoch": 1796} {"train_loss": -22.70288848876953, "global_step": 149077, "epoch": 1796} {"train_loss": -22.875715255737305, "global_step": 149078, "epoch": 1796} {"train_loss": -23.03473472595215, "global_step": 149079, "epoch": 1796} {"train_loss": -23.01766014099121, "global_step": 149080, "epoch": 1796} {"train_loss": -22.946826934814453, "global_step": 149081, "epoch": 1796} {"train_loss": -22.83385467529297, "global_step": 149082, "epoch": 1796} {"train_loss": -22.996965408325195, "global_step": 149083, "epoch": 1796} {"train_loss": -23.26405906677246, "global_step": 149084, "epoch": 1796} {"train_loss": -22.806739807128906, "global_step": 149085, "epoch": 1796} {"train_loss": -22.839208602905273, "global_step": 149086, "epoch": 1796} {"train_loss": -23.207263946533203, "global_step": 149087, "epoch": 1796} {"train_loss": -23.08106803894043, "global_step": 149088, "epoch": 1796} {"train_loss": -23.314130783081055, "global_step": 149089, "epoch": 1796} {"train_loss": -23.192625045776367, "global_step": 149090, "epoch": 1796} {"train_loss": -22.872467041015625, "global_step": 149091, "epoch": 1796} {"train_loss": -23.016172409057617, "global_step": 149092, "epoch": 1796} {"train_loss": -23.137807846069336, "global_step": 149093, "epoch": 1796} {"train_loss": -22.988231658935547, "global_step": 149094, "epoch": 1796} {"train_loss": -23.365346908569336, "global_step": 149095, "epoch": 1796} {"train_loss": -23.265470504760742, "global_step": 149096, "epoch": 1796} {"train_loss": -23.553253173828125, "global_step": 149097, "epoch": 1796} {"train_loss": -23.626834869384766, "global_step": 149098, "epoch": 1796} {"train_loss": -23.283203125, "global_step": 149099, "epoch": 1796} {"train_loss": -23.32814598083496, "global_step": 149100, "epoch": 1796} {"train_loss": -23.20496940612793, "global_step": 149101, "epoch": 1796} {"train_loss": -22.832355499267578, "global_step": 149102, "epoch": 1796} {"train_loss": -23.173484802246094, "global_step": 149103, "epoch": 1796} {"train_loss": -23.233367919921875, "global_step": 149104, "epoch": 1796} {"train_loss": -23.136796951293945, "global_step": 149105, "epoch": 1796} {"train_loss": -23.440229415893555, "global_step": 149106, "epoch": 1796} {"train_loss": -23.117231369018555, "global_step": 149107, "epoch": 1796} {"train_loss": -23.22722816467285, "global_step": 149108, "epoch": 1796} {"train_loss": -23.33084487915039, "global_step": 149109, "epoch": 1796} {"train_loss": -23.350038528442383, "global_step": 149110, "epoch": 1796} {"train_loss": -23.125240325927734, "global_step": 149111, "epoch": 1796} {"train_loss": -23.660276412963867, "global_step": 149112, "epoch": 1796} {"train_loss": -23.418821334838867, "global_step": 149113, "epoch": 1796} {"train_loss": -22.79892349243164, "global_step": 149114, "epoch": 1796} {"train_loss": -22.837051391601562, "global_step": 149115, "epoch": 1796} {"train_loss": -22.766624450683594, "global_step": 149116, "epoch": 1796} {"train_loss": -23.433563232421875, "global_step": 149117, "epoch": 1796} {"train_loss": -22.65608024597168, "global_step": 149118, "epoch": 1796} {"train_loss": -23.08642578125, "global_step": 149119, "epoch": 1796} {"train_loss": -23.148311614990234, "global_step": 149120, "epoch": 1796} {"train_loss": -23.205820083618164, "global_step": 149121, "epoch": 1796} {"train_loss": -23.23345947265625, "global_step": 149122, "epoch": 1796} {"train_loss": -23.367429733276367, "global_step": 149123, "epoch": 1796} {"train_loss": -23.114545822143555, "global_step": 149124, "epoch": 1796} {"train_loss": -22.89513397216797, "global_step": 149125, "epoch": 1796} {"train_loss": -23.218257904052734, "global_step": 149126, "epoch": 1796} {"train_loss": -23.468673706054688, "global_step": 149127, "epoch": 1796} {"train_loss": -23.253679275512695, "global_step": 149128, "epoch": 1796} {"train_loss": -23.162744522094727, "global_step": 149129, "epoch": 1796} {"train_loss": -23.34358024597168, "global_step": 149130, "epoch": 1796} {"train_loss": -23.663122177124023, "global_step": 149131, "epoch": 1796} {"train_loss": -23.4671630859375, "global_step": 149132, "epoch": 1796} {"train_loss": -22.9770565032959, "global_step": 149133, "epoch": 1796} {"train_loss": -23.202259063720703, "global_step": 149134, "epoch": 1796} {"train_loss": -23.295141220092773, "global_step": 149135, "epoch": 1796} {"train_loss": -23.337060928344727, "global_step": 149136, "epoch": 1796} {"train_loss": -23.215415954589844, "global_step": 149137, "epoch": 1796} {"train_loss": -23.479442596435547, "global_step": 149138, "epoch": 1796} {"train_loss": -23.50066375732422, "global_step": 149139, "epoch": 1796} {"train_loss": -23.569204330444336, "global_step": 149140, "epoch": 1796} {"train_loss": -23.40144920349121, "global_step": 149141, "epoch": 1796} {"train_loss": -23.343219757080078, "global_step": 149142, "epoch": 1796} {"train_loss": -23.539676666259766, "global_step": 149143, "epoch": 1796} {"train_loss": -23.699710845947266, "global_step": 149144, "epoch": 1796} {"train_loss": -23.620792388916016, "global_step": 149145, "epoch": 1796} {"train_loss": -23.5858211517334, "global_step": 149146, "epoch": 1796} {"train_loss": -23.2263126373291, "global_step": 149147, "epoch": 1796} {"train_loss": -23.479604721069336, "global_step": 149148, "epoch": 1796} {"train_loss": -23.3283748626709, "global_step": 149149, "epoch": 1796} {"train_loss": -23.157391812427935, "global_step": 149150, "epoch": 1796, "val_loss": 6277627.0} {"train_loss": -23.217790603637695, "global_step": 149151, "epoch": 1797} {"train_loss": -23.40751075744629, "global_step": 149152, "epoch": 1797} {"train_loss": -23.232954025268555, "global_step": 149153, "epoch": 1797} {"train_loss": -23.3006591796875, "global_step": 149154, "epoch": 1797} {"train_loss": -22.57328224182129, "global_step": 149155, "epoch": 1797} {"train_loss": -23.240026473999023, "global_step": 149156, "epoch": 1797} {"train_loss": -23.127939224243164, "global_step": 149157, "epoch": 1797} {"train_loss": -22.721174240112305, "global_step": 149158, "epoch": 1797} {"train_loss": -22.781118392944336, "global_step": 149159, "epoch": 1797} {"train_loss": -23.231985092163086, "global_step": 149160, "epoch": 1797} {"train_loss": -23.344707489013672, "global_step": 149161, "epoch": 1797} {"train_loss": -22.974180221557617, "global_step": 149162, "epoch": 1797} {"train_loss": -23.161928176879883, "global_step": 149163, "epoch": 1797} {"train_loss": -22.942150115966797, "global_step": 149164, "epoch": 1797} {"train_loss": -23.037429809570312, "global_step": 149165, "epoch": 1797} {"train_loss": -23.01782989501953, "global_step": 149166, "epoch": 1797} {"train_loss": -23.30817985534668, "global_step": 149167, "epoch": 1797} {"train_loss": -23.07416343688965, "global_step": 149168, "epoch": 1797} {"train_loss": -23.389789581298828, "global_step": 149169, "epoch": 1797} {"train_loss": -23.215269088745117, "global_step": 149170, "epoch": 1797} {"train_loss": -23.11496353149414, "global_step": 149171, "epoch": 1797} {"train_loss": -22.929195404052734, "global_step": 149172, "epoch": 1797} {"train_loss": -23.127500534057617, "global_step": 149173, "epoch": 1797} {"train_loss": -23.34686851501465, "global_step": 149174, "epoch": 1797} {"train_loss": -23.100984573364258, "global_step": 149175, "epoch": 1797} {"train_loss": -23.59919548034668, "global_step": 149176, "epoch": 1797} {"train_loss": -22.981752395629883, "global_step": 149177, "epoch": 1797} {"train_loss": -23.103879928588867, "global_step": 149178, "epoch": 1797} {"train_loss": -23.304807662963867, "global_step": 149179, "epoch": 1797} {"train_loss": -23.34358787536621, "global_step": 149180, "epoch": 1797} {"train_loss": -23.56493377685547, "global_step": 149181, "epoch": 1797} {"train_loss": -22.657033920288086, "global_step": 149182, "epoch": 1797} {"train_loss": -23.246112823486328, "global_step": 149183, "epoch": 1797} {"train_loss": -23.158082962036133, "global_step": 149184, "epoch": 1797} {"train_loss": -22.921302795410156, "global_step": 149185, "epoch": 1797} {"train_loss": -23.090513229370117, "global_step": 149186, "epoch": 1797} {"train_loss": -23.265531539916992, "global_step": 149187, "epoch": 1797} {"train_loss": -23.442977905273438, "global_step": 149188, "epoch": 1797} {"train_loss": -23.244470596313477, "global_step": 149189, "epoch": 1797} {"train_loss": -23.321529388427734, "global_step": 149190, "epoch": 1797} {"train_loss": -23.135190963745117, "global_step": 149191, "epoch": 1797} {"train_loss": -23.4266357421875, "global_step": 149192, "epoch": 1797} {"train_loss": -23.223630905151367, "global_step": 149193, "epoch": 1797} {"train_loss": -23.747283935546875, "global_step": 149194, "epoch": 1797} {"train_loss": -23.578397750854492, "global_step": 149195, "epoch": 1797} {"train_loss": -23.519153594970703, "global_step": 149196, "epoch": 1797} {"train_loss": -23.335363388061523, "global_step": 149197, "epoch": 1797} {"train_loss": -23.115619659423828, "global_step": 149198, "epoch": 1797} {"train_loss": -23.02277183532715, "global_step": 149199, "epoch": 1797} {"train_loss": -23.261157989501953, "global_step": 149200, "epoch": 1797} {"train_loss": -23.356054306030273, "global_step": 149201, "epoch": 1797} {"train_loss": -23.774484634399414, "global_step": 149202, "epoch": 1797} {"train_loss": -23.346498489379883, "global_step": 149203, "epoch": 1797} {"train_loss": -23.495737075805664, "global_step": 149204, "epoch": 1797} {"train_loss": -23.171463012695312, "global_step": 149205, "epoch": 1797} {"train_loss": -23.4639835357666, "global_step": 149206, "epoch": 1797} {"train_loss": -23.381166458129883, "global_step": 149207, "epoch": 1797} {"train_loss": -23.204259872436523, "global_step": 149208, "epoch": 1797} {"train_loss": -23.177562713623047, "global_step": 149209, "epoch": 1797} {"train_loss": -23.04971694946289, "global_step": 149210, "epoch": 1797} {"train_loss": -23.079269409179688, "global_step": 149211, "epoch": 1797} {"train_loss": -23.25410270690918, "global_step": 149212, "epoch": 1797} {"train_loss": -23.63323402404785, "global_step": 149213, "epoch": 1797} {"train_loss": -23.03261375427246, "global_step": 149214, "epoch": 1797} {"train_loss": -23.53998565673828, "global_step": 149215, "epoch": 1797} {"train_loss": -23.341487884521484, "global_step": 149216, "epoch": 1797} {"train_loss": -23.478891372680664, "global_step": 149217, "epoch": 1797} {"train_loss": -23.44264030456543, "global_step": 149218, "epoch": 1797} {"train_loss": -23.66414451599121, "global_step": 149219, "epoch": 1797} {"train_loss": -22.818464279174805, "global_step": 149220, "epoch": 1797} {"train_loss": -23.0136775970459, "global_step": 149221, "epoch": 1797} {"train_loss": -23.151968002319336, "global_step": 149222, "epoch": 1797} {"train_loss": -23.43341827392578, "global_step": 149223, "epoch": 1797} {"train_loss": -22.80184555053711, "global_step": 149224, "epoch": 1797} {"train_loss": -23.0089168548584, "global_step": 149225, "epoch": 1797} {"train_loss": -22.894588470458984, "global_step": 149226, "epoch": 1797} {"train_loss": -23.30311393737793, "global_step": 149227, "epoch": 1797} {"train_loss": -22.99995231628418, "global_step": 149228, "epoch": 1797} {"train_loss": -23.271177291870117, "global_step": 149229, "epoch": 1797} {"train_loss": -23.285158157348633, "global_step": 149230, "epoch": 1797} {"train_loss": -23.2060604095459, "global_step": 149231, "epoch": 1797} {"train_loss": -23.028276443481445, "global_step": 149232, "epoch": 1797} {"train_loss": -23.216646998761647, "global_step": 149233, "epoch": 1797, "val_loss": 6331590.5} {"train_loss": -22.699691772460938, "global_step": 149234, "epoch": 1798} {"train_loss": -23.14999008178711, "global_step": 149235, "epoch": 1798} {"train_loss": -22.541500091552734, "global_step": 149236, "epoch": 1798} {"train_loss": -22.43697166442871, "global_step": 149237, "epoch": 1798} {"train_loss": -22.404552459716797, "global_step": 149238, "epoch": 1798} {"train_loss": -22.40939712524414, "global_step": 149239, "epoch": 1798} {"train_loss": -22.940603256225586, "global_step": 149240, "epoch": 1798} {"train_loss": -22.438034057617188, "global_step": 149241, "epoch": 1798} {"train_loss": -22.865041732788086, "global_step": 149242, "epoch": 1798} {"train_loss": -22.45938491821289, "global_step": 149243, "epoch": 1798} {"train_loss": -22.938833236694336, "global_step": 149244, "epoch": 1798} {"train_loss": -22.932537078857422, "global_step": 149245, "epoch": 1798} {"train_loss": -22.58670997619629, "global_step": 149246, "epoch": 1798} {"train_loss": -22.917055130004883, "global_step": 149247, "epoch": 1798} {"train_loss": -22.79469108581543, "global_step": 149248, "epoch": 1798} {"train_loss": -23.257572174072266, "global_step": 149249, "epoch": 1798} {"train_loss": -22.481531143188477, "global_step": 149250, "epoch": 1798} {"train_loss": -23.445295333862305, "global_step": 149251, "epoch": 1798} {"train_loss": -23.126623153686523, "global_step": 149252, "epoch": 1798} {"train_loss": -23.020755767822266, "global_step": 149253, "epoch": 1798} {"train_loss": -22.89824867248535, "global_step": 149254, "epoch": 1798} {"train_loss": -23.274383544921875, "global_step": 149255, "epoch": 1798} {"train_loss": -23.05660629272461, "global_step": 149256, "epoch": 1798} {"train_loss": -23.209205627441406, "global_step": 149257, "epoch": 1798} {"train_loss": -23.109289169311523, "global_step": 149258, "epoch": 1798} {"train_loss": -23.196699142456055, "global_step": 149259, "epoch": 1798} {"train_loss": -22.94549560546875, "global_step": 149260, "epoch": 1798} {"train_loss": -23.0972900390625, "global_step": 149261, "epoch": 1798} {"train_loss": -23.355955123901367, "global_step": 149262, "epoch": 1798} {"train_loss": -23.018423080444336, "global_step": 149263, "epoch": 1798} {"train_loss": -23.45389175415039, "global_step": 149264, "epoch": 1798} {"train_loss": -23.418508529663086, "global_step": 149265, "epoch": 1798} {"train_loss": -23.092145919799805, "global_step": 149266, "epoch": 1798} {"train_loss": -22.932523727416992, "global_step": 149267, "epoch": 1798} {"train_loss": -23.015146255493164, "global_step": 149268, "epoch": 1798} {"train_loss": -23.10379981994629, "global_step": 149269, "epoch": 1798} {"train_loss": -23.06976318359375, "global_step": 149270, "epoch": 1798} {"train_loss": -23.269079208374023, "global_step": 149271, "epoch": 1798} {"train_loss": -23.281620025634766, "global_step": 149272, "epoch": 1798} {"train_loss": -23.541234970092773, "global_step": 149273, "epoch": 1798} {"train_loss": -23.146595001220703, "global_step": 149274, "epoch": 1798} {"train_loss": -23.55010414123535, "global_step": 149275, "epoch": 1798} {"train_loss": -23.494388580322266, "global_step": 149276, "epoch": 1798} {"train_loss": -23.135190963745117, "global_step": 149277, "epoch": 1798} {"train_loss": -23.594141006469727, "global_step": 149278, "epoch": 1798} {"train_loss": -23.57036781311035, "global_step": 149279, "epoch": 1798} {"train_loss": -23.219486236572266, "global_step": 149280, "epoch": 1798} {"train_loss": -22.953886032104492, "global_step": 149281, "epoch": 1798} {"train_loss": -23.151325225830078, "global_step": 149282, "epoch": 1798} {"train_loss": -23.223495483398438, "global_step": 149283, "epoch": 1798} {"train_loss": -23.083982467651367, "global_step": 149284, "epoch": 1798} {"train_loss": -23.477746963500977, "global_step": 149285, "epoch": 1798} {"train_loss": -23.184558868408203, "global_step": 149286, "epoch": 1798} {"train_loss": -23.3015193939209, "global_step": 149287, "epoch": 1798} {"train_loss": -23.813417434692383, "global_step": 149288, "epoch": 1798} {"train_loss": -23.368274688720703, "global_step": 149289, "epoch": 1798} {"train_loss": -23.172395706176758, "global_step": 149290, "epoch": 1798} {"train_loss": -23.287948608398438, "global_step": 149291, "epoch": 1798} {"train_loss": -23.39288902282715, "global_step": 149292, "epoch": 1798} {"train_loss": -23.405981063842773, "global_step": 149293, "epoch": 1798} {"train_loss": -23.286500930786133, "global_step": 149294, "epoch": 1798} {"train_loss": -23.5036678314209, "global_step": 149295, "epoch": 1798} {"train_loss": -22.92439079284668, "global_step": 149296, "epoch": 1798} {"train_loss": -23.290225982666016, "global_step": 149297, "epoch": 1798} {"train_loss": -23.25769805908203, "global_step": 149298, "epoch": 1798} {"train_loss": -23.2003173828125, "global_step": 149299, "epoch": 1798} {"train_loss": -23.185930252075195, "global_step": 149300, "epoch": 1798} {"train_loss": -23.31396484375, "global_step": 149301, "epoch": 1798} {"train_loss": -23.136016845703125, "global_step": 149302, "epoch": 1798} {"train_loss": -23.538602828979492, "global_step": 149303, "epoch": 1798} {"train_loss": -23.273414611816406, "global_step": 149304, "epoch": 1798} {"train_loss": -23.594083786010742, "global_step": 149305, "epoch": 1798} {"train_loss": -23.22880744934082, "global_step": 149306, "epoch": 1798} {"train_loss": -23.1351318359375, "global_step": 149307, "epoch": 1798} {"train_loss": -23.370481491088867, "global_step": 149308, "epoch": 1798} {"train_loss": -23.337692260742188, "global_step": 149309, "epoch": 1798} {"train_loss": -23.31942367553711, "global_step": 149310, "epoch": 1798} {"train_loss": -23.64640998840332, "global_step": 149311, "epoch": 1798} {"train_loss": -23.217405319213867, "global_step": 149312, "epoch": 1798} {"train_loss": -23.23836326599121, "global_step": 149313, "epoch": 1798} {"train_loss": -23.180959701538086, "global_step": 149314, "epoch": 1798} {"train_loss": -23.541351318359375, "global_step": 149315, "epoch": 1798} {"train_loss": -23.149748377053136, "global_step": 149316, "epoch": 1798, "val_loss": 6317731.0} {"train_loss": -22.98423194885254, "global_step": 149317, "epoch": 1799} {"train_loss": -22.849594116210938, "global_step": 149318, "epoch": 1799} {"train_loss": -23.465194702148438, "global_step": 149319, "epoch": 1799} {"train_loss": -22.894840240478516, "global_step": 149320, "epoch": 1799} {"train_loss": -22.97250747680664, "global_step": 149321, "epoch": 1799} {"train_loss": -22.950647354125977, "global_step": 149322, "epoch": 1799} {"train_loss": -22.851484298706055, "global_step": 149323, "epoch": 1799} {"train_loss": -22.89076042175293, "global_step": 149324, "epoch": 1799} {"train_loss": -23.280542373657227, "global_step": 149325, "epoch": 1799} {"train_loss": -23.03066635131836, "global_step": 149326, "epoch": 1799} {"train_loss": -23.05829620361328, "global_step": 149327, "epoch": 1799} {"train_loss": -23.1049747467041, "global_step": 149328, "epoch": 1799} {"train_loss": -22.945404052734375, "global_step": 149329, "epoch": 1799} {"train_loss": -23.233112335205078, "global_step": 149330, "epoch": 1799} {"train_loss": -23.024093627929688, "global_step": 149331, "epoch": 1799} {"train_loss": -23.080251693725586, "global_step": 149332, "epoch": 1799} {"train_loss": -23.283233642578125, "global_step": 149333, "epoch": 1799} {"train_loss": -23.290950775146484, "global_step": 149334, "epoch": 1799} {"train_loss": -23.453989028930664, "global_step": 149335, "epoch": 1799} {"train_loss": -23.137649536132812, "global_step": 149336, "epoch": 1799} {"train_loss": -23.19889259338379, "global_step": 149337, "epoch": 1799} {"train_loss": -23.31703758239746, "global_step": 149338, "epoch": 1799} {"train_loss": -23.006784439086914, "global_step": 149339, "epoch": 1799} {"train_loss": -23.065670013427734, "global_step": 149340, "epoch": 1799} {"train_loss": -23.327041625976562, "global_step": 149341, "epoch": 1799} {"train_loss": -23.204727172851562, "global_step": 149342, "epoch": 1799} {"train_loss": -23.474098205566406, "global_step": 149343, "epoch": 1799} {"train_loss": -23.332469940185547, "global_step": 149344, "epoch": 1799} {"train_loss": -23.269935607910156, "global_step": 149345, "epoch": 1799} {"train_loss": -23.317834854125977, "global_step": 149346, "epoch": 1799} {"train_loss": -23.2285213470459, "global_step": 149347, "epoch": 1799} {"train_loss": -23.432859420776367, "global_step": 149348, "epoch": 1799} {"train_loss": -23.10399055480957, "global_step": 149349, "epoch": 1799} {"train_loss": -23.086530685424805, "global_step": 149350, "epoch": 1799} {"train_loss": -23.1944637298584, "global_step": 149351, "epoch": 1799} {"train_loss": -23.204862594604492, "global_step": 149352, "epoch": 1799} {"train_loss": -23.208341598510742, "global_step": 149353, "epoch": 1799} {"train_loss": -22.94434356689453, "global_step": 149354, "epoch": 1799} {"train_loss": -23.357379913330078, "global_step": 149355, "epoch": 1799} {"train_loss": -23.66217613220215, "global_step": 149356, "epoch": 1799} {"train_loss": -23.302268981933594, "global_step": 149357, "epoch": 1799} {"train_loss": -23.0113582611084, "global_step": 149358, "epoch": 1799} {"train_loss": -23.585180282592773, "global_step": 149359, "epoch": 1799} {"train_loss": -23.548355102539062, "global_step": 149360, "epoch": 1799} {"train_loss": -23.435115814208984, "global_step": 149361, "epoch": 1799} {"train_loss": -23.331995010375977, "global_step": 149362, "epoch": 1799} {"train_loss": -23.327695846557617, "global_step": 149363, "epoch": 1799} {"train_loss": -23.366167068481445, "global_step": 149364, "epoch": 1799} {"train_loss": -23.36977195739746, "global_step": 149365, "epoch": 1799} {"train_loss": -23.332965850830078, "global_step": 149366, "epoch": 1799} {"train_loss": -23.198623657226562, "global_step": 149367, "epoch": 1799} {"train_loss": -23.18616485595703, "global_step": 149368, "epoch": 1799} {"train_loss": -23.177204132080078, "global_step": 149369, "epoch": 1799} {"train_loss": -23.551761627197266, "global_step": 149370, "epoch": 1799} {"train_loss": -23.237110137939453, "global_step": 149371, "epoch": 1799} {"train_loss": -23.26963996887207, "global_step": 149372, "epoch": 1799} {"train_loss": -23.47661781311035, "global_step": 149373, "epoch": 1799} {"train_loss": -23.189929962158203, "global_step": 149374, "epoch": 1799} {"train_loss": -23.11225128173828, "global_step": 149375, "epoch": 1799} {"train_loss": -23.39902687072754, "global_step": 149376, "epoch": 1799} {"train_loss": -23.43571662902832, "global_step": 149377, "epoch": 1799} {"train_loss": -23.296106338500977, "global_step": 149378, "epoch": 1799} {"train_loss": -22.98423194885254, "global_step": 149379, "epoch": 1799} {"train_loss": -23.13043785095215, "global_step": 149380, "epoch": 1799} {"train_loss": -23.13204002380371, "global_step": 149381, "epoch": 1799} {"train_loss": -22.993356704711914, "global_step": 149382, "epoch": 1799} {"train_loss": -23.28456687927246, "global_step": 149383, "epoch": 1799} {"train_loss": -23.460229873657227, "global_step": 149384, "epoch": 1799} {"train_loss": -23.3804988861084, "global_step": 149385, "epoch": 1799} {"train_loss": -23.347488403320312, "global_step": 149386, "epoch": 1799} {"train_loss": -23.481027603149414, "global_step": 149387, "epoch": 1799} {"train_loss": -23.55766487121582, "global_step": 149388, "epoch": 1799} {"train_loss": -23.45180320739746, "global_step": 149389, "epoch": 1799} {"train_loss": -22.785497665405273, "global_step": 149390, "epoch": 1799} {"train_loss": -23.25214958190918, "global_step": 149391, "epoch": 1799} {"train_loss": -23.69966697692871, "global_step": 149392, "epoch": 1799} {"train_loss": -23.374181747436523, "global_step": 149393, "epoch": 1799} {"train_loss": -23.304121017456055, "global_step": 149394, "epoch": 1799} {"train_loss": -23.50424575805664, "global_step": 149395, "epoch": 1799} {"train_loss": -23.274417877197266, "global_step": 149396, "epoch": 1799} {"train_loss": -23.443603515625, "global_step": 149397, "epoch": 1799} {"train_loss": -23.3359375, "global_step": 149398, "epoch": 1799} {"train_loss": -23.225506472300335, "global_step": 149399, "epoch": 1799, "val_loss": 6299746.0} {"train_loss": -23.10184097290039, "global_step": 149400, "epoch": 1800} {"train_loss": -23.00412368774414, "global_step": 149401, "epoch": 1800} {"train_loss": -23.474624633789062, "global_step": 149402, "epoch": 1800} {"train_loss": -22.970855712890625, "global_step": 149403, "epoch": 1800} {"train_loss": -23.251516342163086, "global_step": 149404, "epoch": 1800} {"train_loss": -23.009672164916992, "global_step": 149405, "epoch": 1800} {"train_loss": -23.22894859313965, "global_step": 149406, "epoch": 1800} {"train_loss": -22.918424606323242, "global_step": 149407, "epoch": 1800} {"train_loss": -23.214426040649414, "global_step": 149408, "epoch": 1800} {"train_loss": -22.988798141479492, "global_step": 149409, "epoch": 1800} {"train_loss": -22.92529296875, "global_step": 149410, "epoch": 1800} {"train_loss": -22.646900177001953, "global_step": 149411, "epoch": 1800} {"train_loss": -22.995763778686523, "global_step": 149412, "epoch": 1800} {"train_loss": -22.875097274780273, "global_step": 149413, "epoch": 1800} {"train_loss": -23.250139236450195, "global_step": 149414, "epoch": 1800} {"train_loss": -23.18146324157715, "global_step": 149415, "epoch": 1800} {"train_loss": -23.114622116088867, "global_step": 149416, "epoch": 1800} {"train_loss": -22.88018226623535, "global_step": 149417, "epoch": 1800} {"train_loss": -23.041122436523438, "global_step": 149418, "epoch": 1800} {"train_loss": -22.918127059936523, "global_step": 149419, "epoch": 1800} {"train_loss": -23.37165069580078, "global_step": 149420, "epoch": 1800} {"train_loss": -23.125343322753906, "global_step": 149421, "epoch": 1800} {"train_loss": -23.342315673828125, "global_step": 149422, "epoch": 1800} {"train_loss": -23.050567626953125, "global_step": 149423, "epoch": 1800} {"train_loss": -22.7736759185791, "global_step": 149424, "epoch": 1800} {"train_loss": -23.45794677734375, "global_step": 149425, "epoch": 1800} {"train_loss": -22.70725440979004, "global_step": 149426, "epoch": 1800} {"train_loss": -23.5264835357666, "global_step": 149427, "epoch": 1800} {"train_loss": -23.141080856323242, "global_step": 149428, "epoch": 1800} {"train_loss": -23.03554344177246, "global_step": 149429, "epoch": 1800} {"train_loss": -23.240230560302734, "global_step": 149430, "epoch": 1800} {"train_loss": -23.02447509765625, "global_step": 149431, "epoch": 1800} {"train_loss": -22.56732749938965, "global_step": 149432, "epoch": 1800} {"train_loss": -23.25109100341797, "global_step": 149433, "epoch": 1800} {"train_loss": -23.546152114868164, "global_step": 149434, "epoch": 1800} {"train_loss": -23.61432647705078, "global_step": 149435, "epoch": 1800} {"train_loss": -23.220792770385742, "global_step": 149436, "epoch": 1800} {"train_loss": -23.323537826538086, "global_step": 149437, "epoch": 1800} {"train_loss": -23.176504135131836, "global_step": 149438, "epoch": 1800} {"train_loss": -23.5559139251709, "global_step": 149439, "epoch": 1800} {"train_loss": -23.19403648376465, "global_step": 149440, "epoch": 1800} {"train_loss": -23.332937240600586, "global_step": 149441, "epoch": 1800} {"train_loss": -22.876192092895508, "global_step": 149442, "epoch": 1800} {"train_loss": -23.42738914489746, "global_step": 149443, "epoch": 1800} {"train_loss": -23.358579635620117, "global_step": 149444, "epoch": 1800} {"train_loss": -23.3043270111084, "global_step": 149445, "epoch": 1800} {"train_loss": -23.458669662475586, "global_step": 149446, "epoch": 1800} {"train_loss": -23.43866729736328, "global_step": 149447, "epoch": 1800} {"train_loss": -23.460037231445312, "global_step": 149448, "epoch": 1800} {"train_loss": -23.348602294921875, "global_step": 149449, "epoch": 1800} {"train_loss": -23.34259033203125, "global_step": 149450, "epoch": 1800} {"train_loss": -23.239547729492188, "global_step": 149451, "epoch": 1800} {"train_loss": -22.99847984313965, "global_step": 149452, "epoch": 1800} {"train_loss": -23.117136001586914, "global_step": 149453, "epoch": 1800} {"train_loss": -23.31583595275879, "global_step": 149454, "epoch": 1800} {"train_loss": -23.621294021606445, "global_step": 149455, "epoch": 1800} {"train_loss": -22.65785789489746, "global_step": 149456, "epoch": 1800} {"train_loss": -23.141916275024414, "global_step": 149457, "epoch": 1800} {"train_loss": -23.084415435791016, "global_step": 149458, "epoch": 1800} {"train_loss": -23.262083053588867, "global_step": 149459, "epoch": 1800} {"train_loss": -22.974132537841797, "global_step": 149460, "epoch": 1800} {"train_loss": -23.12672233581543, "global_step": 149461, "epoch": 1800} {"train_loss": -23.41057777404785, "global_step": 149462, "epoch": 1800} {"train_loss": -23.37470054626465, "global_step": 149463, "epoch": 1800} {"train_loss": -23.268949508666992, "global_step": 149464, "epoch": 1800} {"train_loss": -23.50816535949707, "global_step": 149465, "epoch": 1800} {"train_loss": -23.028615951538086, "global_step": 149466, "epoch": 1800} {"train_loss": -23.440753936767578, "global_step": 149467, "epoch": 1800} {"train_loss": -22.993619918823242, "global_step": 149468, "epoch": 1800} {"train_loss": -23.374935150146484, "global_step": 149469, "epoch": 1800} {"train_loss": -23.085330963134766, "global_step": 149470, "epoch": 1800} {"train_loss": -23.127878189086914, "global_step": 149471, "epoch": 1800} {"train_loss": -23.312707901000977, "global_step": 149472, "epoch": 1800} {"train_loss": -23.163606643676758, "global_step": 149473, "epoch": 1800} {"train_loss": -23.125730514526367, "global_step": 149474, "epoch": 1800} {"train_loss": -23.356876373291016, "global_step": 149475, "epoch": 1800} {"train_loss": -23.501754760742188, "global_step": 149476, "epoch": 1800} {"train_loss": -23.339153289794922, "global_step": 149477, "epoch": 1800} {"train_loss": -23.496822357177734, "global_step": 149478, "epoch": 1800} {"train_loss": -23.244596481323242, "global_step": 149479, "epoch": 1800} {"train_loss": -23.43755531311035, "global_step": 149480, "epoch": 1800} {"train_loss": -23.29493522644043, "global_step": 149481, "epoch": 1800} {"train_loss": -23.20894781365452, "global_step": 149482, "epoch": 1800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 1.0, "val_loss": 6331519.0} {"train_loss": -23.06374168395996, "global_step": 149483, "epoch": 1801} {"train_loss": -22.58078956604004, "global_step": 149484, "epoch": 1801} {"train_loss": -22.988317489624023, "global_step": 149485, "epoch": 1801} {"train_loss": -22.424453735351562, "global_step": 149486, "epoch": 1801} {"train_loss": -22.657169342041016, "global_step": 149487, "epoch": 1801} {"train_loss": -23.041868209838867, "global_step": 149488, "epoch": 1801} {"train_loss": -22.812578201293945, "global_step": 149489, "epoch": 1801} {"train_loss": -23.355987548828125, "global_step": 149490, "epoch": 1801} {"train_loss": -22.579893112182617, "global_step": 149491, "epoch": 1801} {"train_loss": -22.90896987915039, "global_step": 149492, "epoch": 1801} {"train_loss": -23.01773452758789, "global_step": 149493, "epoch": 1801} {"train_loss": -22.853256225585938, "global_step": 149494, "epoch": 1801} {"train_loss": -22.771865844726562, "global_step": 149495, "epoch": 1801} {"train_loss": -22.993717193603516, "global_step": 149496, "epoch": 1801} {"train_loss": -22.696414947509766, "global_step": 149497, "epoch": 1801} {"train_loss": -22.88140869140625, "global_step": 149498, "epoch": 1801} {"train_loss": -23.148834228515625, "global_step": 149499, "epoch": 1801} {"train_loss": -23.198999404907227, "global_step": 149500, "epoch": 1801} {"train_loss": -23.055259704589844, "global_step": 149501, "epoch": 1801} {"train_loss": -22.7995662689209, "global_step": 149502, "epoch": 1801} {"train_loss": -22.870405197143555, "global_step": 149503, "epoch": 1801} {"train_loss": -23.041933059692383, "global_step": 149504, "epoch": 1801} {"train_loss": -23.024621963500977, "global_step": 149505, "epoch": 1801} {"train_loss": -23.23213768005371, "global_step": 149506, "epoch": 1801} {"train_loss": -23.099058151245117, "global_step": 149507, "epoch": 1801} {"train_loss": -23.042125701904297, "global_step": 149508, "epoch": 1801} {"train_loss": -22.858173370361328, "global_step": 149509, "epoch": 1801} {"train_loss": -23.444849014282227, "global_step": 149510, "epoch": 1801} {"train_loss": -22.89303970336914, "global_step": 149511, "epoch": 1801} {"train_loss": -23.191736221313477, "global_step": 149512, "epoch": 1801} {"train_loss": -23.351316452026367, "global_step": 149513, "epoch": 1801} {"train_loss": -23.392257690429688, "global_step": 149514, "epoch": 1801} {"train_loss": -23.18349266052246, "global_step": 149515, "epoch": 1801} {"train_loss": -22.84050750732422, "global_step": 149516, "epoch": 1801} {"train_loss": -23.21906852722168, "global_step": 149517, "epoch": 1801} {"train_loss": -22.890846252441406, "global_step": 149518, "epoch": 1801} {"train_loss": -23.507572174072266, "global_step": 149519, "epoch": 1801} {"train_loss": -23.007741928100586, "global_step": 149520, "epoch": 1801} {"train_loss": -23.48882484436035, "global_step": 149521, "epoch": 1801} {"train_loss": -23.300390243530273, "global_step": 149522, "epoch": 1801} {"train_loss": -22.84369468688965, "global_step": 149523, "epoch": 1801} {"train_loss": -23.2950439453125, "global_step": 149524, "epoch": 1801} {"train_loss": -23.302780151367188, "global_step": 149525, "epoch": 1801} {"train_loss": -22.908660888671875, "global_step": 149526, "epoch": 1801} {"train_loss": -23.284072875976562, "global_step": 149527, "epoch": 1801} {"train_loss": -23.43820571899414, "global_step": 149528, "epoch": 1801} {"train_loss": -23.214982986450195, "global_step": 149529, "epoch": 1801} {"train_loss": -22.99444007873535, "global_step": 149530, "epoch": 1801} {"train_loss": -23.138425827026367, "global_step": 149531, "epoch": 1801} {"train_loss": -23.446287155151367, "global_step": 149532, "epoch": 1801} {"train_loss": -22.893497467041016, "global_step": 149533, "epoch": 1801} {"train_loss": -23.33542251586914, "global_step": 149534, "epoch": 1801} {"train_loss": -23.165597915649414, "global_step": 149535, "epoch": 1801} {"train_loss": -22.92852020263672, "global_step": 149536, "epoch": 1801} {"train_loss": -23.6207332611084, "global_step": 149537, "epoch": 1801} {"train_loss": -22.711240768432617, "global_step": 149538, "epoch": 1801} {"train_loss": -23.06815528869629, "global_step": 149539, "epoch": 1801} {"train_loss": -23.340526580810547, "global_step": 149540, "epoch": 1801} {"train_loss": -22.77130699157715, "global_step": 149541, "epoch": 1801} {"train_loss": -23.511449813842773, "global_step": 149542, "epoch": 1801} {"train_loss": -22.982532501220703, "global_step": 149543, "epoch": 1801} {"train_loss": -22.987314224243164, "global_step": 149544, "epoch": 1801} {"train_loss": -23.31020164489746, "global_step": 149545, "epoch": 1801} {"train_loss": -23.004968643188477, "global_step": 149546, "epoch": 1801} {"train_loss": -23.025094985961914, "global_step": 149547, "epoch": 1801} {"train_loss": -22.859567642211914, "global_step": 149548, "epoch": 1801} {"train_loss": -23.297042846679688, "global_step": 149549, "epoch": 1801} {"train_loss": -23.147804260253906, "global_step": 149550, "epoch": 1801} {"train_loss": -23.36598777770996, "global_step": 149551, "epoch": 1801} {"train_loss": -23.496150970458984, "global_step": 149552, "epoch": 1801} {"train_loss": -22.99153709411621, "global_step": 149553, "epoch": 1801} {"train_loss": -23.443893432617188, "global_step": 149554, "epoch": 1801} {"train_loss": -23.283607482910156, "global_step": 149555, "epoch": 1801} {"train_loss": -22.812231063842773, "global_step": 149556, "epoch": 1801} {"train_loss": -23.275327682495117, "global_step": 149557, "epoch": 1801} {"train_loss": -23.166669845581055, "global_step": 149558, "epoch": 1801} {"train_loss": -23.13454246520996, "global_step": 149559, "epoch": 1801} {"train_loss": -23.32527732849121, "global_step": 149560, "epoch": 1801} {"train_loss": -23.03458023071289, "global_step": 149561, "epoch": 1801} {"train_loss": -23.365554809570312, "global_step": 149562, "epoch": 1801} {"train_loss": -23.159021377563477, "global_step": 149563, "epoch": 1801} {"train_loss": -23.13361167907715, "global_step": 149564, "epoch": 1801} {"train_loss": -23.085672286619623, "global_step": 149565, "epoch": 1801, "val_loss": 6365517.5} {"train_loss": -22.706283569335938, "global_step": 149566, "epoch": 1802} {"train_loss": -21.846982955932617, "global_step": 149567, "epoch": 1802} {"train_loss": -22.553319931030273, "global_step": 149568, "epoch": 1802} {"train_loss": -22.363391876220703, "global_step": 149569, "epoch": 1802} {"train_loss": -22.303186416625977, "global_step": 149570, "epoch": 1802} {"train_loss": -22.680362701416016, "global_step": 149571, "epoch": 1802} {"train_loss": -22.863006591796875, "global_step": 149572, "epoch": 1802} {"train_loss": -22.497119903564453, "global_step": 149573, "epoch": 1802} {"train_loss": -22.601369857788086, "global_step": 149574, "epoch": 1802} {"train_loss": -22.989912033081055, "global_step": 149575, "epoch": 1802} {"train_loss": -22.73590087890625, "global_step": 149576, "epoch": 1802} {"train_loss": -22.41206169128418, "global_step": 149577, "epoch": 1802} {"train_loss": -22.454147338867188, "global_step": 149578, "epoch": 1802} {"train_loss": -22.679067611694336, "global_step": 149579, "epoch": 1802} {"train_loss": -22.7097110748291, "global_step": 149580, "epoch": 1802} {"train_loss": -22.809677124023438, "global_step": 149581, "epoch": 1802} {"train_loss": -22.854536056518555, "global_step": 149582, "epoch": 1802} {"train_loss": -22.693267822265625, "global_step": 149583, "epoch": 1802} {"train_loss": -22.697467803955078, "global_step": 149584, "epoch": 1802} {"train_loss": -22.770872116088867, "global_step": 149585, "epoch": 1802} {"train_loss": -22.62656021118164, "global_step": 149586, "epoch": 1802} {"train_loss": -23.1750431060791, "global_step": 149587, "epoch": 1802} {"train_loss": -23.02900505065918, "global_step": 149588, "epoch": 1802} {"train_loss": -23.112415313720703, "global_step": 149589, "epoch": 1802} {"train_loss": -22.284631729125977, "global_step": 149590, "epoch": 1802} {"train_loss": -22.856489181518555, "global_step": 149591, "epoch": 1802} {"train_loss": -23.112241744995117, "global_step": 149592, "epoch": 1802} {"train_loss": -23.605575561523438, "global_step": 149593, "epoch": 1802} {"train_loss": -23.12031364440918, "global_step": 149594, "epoch": 1802} {"train_loss": -22.7432918548584, "global_step": 149595, "epoch": 1802} {"train_loss": -23.16425132751465, "global_step": 149596, "epoch": 1802} {"train_loss": -22.99616813659668, "global_step": 149597, "epoch": 1802} {"train_loss": -23.22272300720215, "global_step": 149598, "epoch": 1802} {"train_loss": -23.354856491088867, "global_step": 149599, "epoch": 1802} {"train_loss": -23.381031036376953, "global_step": 149600, "epoch": 1802} {"train_loss": -23.188032150268555, "global_step": 149601, "epoch": 1802} {"train_loss": -23.106494903564453, "global_step": 149602, "epoch": 1802} {"train_loss": -23.150548934936523, "global_step": 149603, "epoch": 1802} {"train_loss": -22.97654914855957, "global_step": 149604, "epoch": 1802} {"train_loss": -23.138442993164062, "global_step": 149605, "epoch": 1802} {"train_loss": -23.105234146118164, "global_step": 149606, "epoch": 1802} {"train_loss": -23.197158813476562, "global_step": 149607, "epoch": 1802} {"train_loss": -23.536579132080078, "global_step": 149608, "epoch": 1802} {"train_loss": -22.96132469177246, "global_step": 149609, "epoch": 1802} {"train_loss": -23.114444732666016, "global_step": 149610, "epoch": 1802} {"train_loss": -23.393274307250977, "global_step": 149611, "epoch": 1802} {"train_loss": -23.338611602783203, "global_step": 149612, "epoch": 1802} {"train_loss": -23.442529678344727, "global_step": 149613, "epoch": 1802} {"train_loss": -23.39192771911621, "global_step": 149614, "epoch": 1802} {"train_loss": -23.108732223510742, "global_step": 149615, "epoch": 1802} {"train_loss": -23.47101402282715, "global_step": 149616, "epoch": 1802} {"train_loss": -23.36757469177246, "global_step": 149617, "epoch": 1802} {"train_loss": -23.030563354492188, "global_step": 149618, "epoch": 1802} {"train_loss": -23.44139862060547, "global_step": 149619, "epoch": 1802} {"train_loss": -23.25821304321289, "global_step": 149620, "epoch": 1802} {"train_loss": -23.49307632446289, "global_step": 149621, "epoch": 1802} {"train_loss": -23.294036865234375, "global_step": 149622, "epoch": 1802} {"train_loss": -23.479522705078125, "global_step": 149623, "epoch": 1802} {"train_loss": -23.459959030151367, "global_step": 149624, "epoch": 1802} {"train_loss": -23.48520278930664, "global_step": 149625, "epoch": 1802} {"train_loss": -23.168964385986328, "global_step": 149626, "epoch": 1802} {"train_loss": -23.649816513061523, "global_step": 149627, "epoch": 1802} {"train_loss": -23.216949462890625, "global_step": 149628, "epoch": 1802} {"train_loss": -23.360198974609375, "global_step": 149629, "epoch": 1802} {"train_loss": -23.20025634765625, "global_step": 149630, "epoch": 1802} {"train_loss": -23.614004135131836, "global_step": 149631, "epoch": 1802} {"train_loss": -23.231094360351562, "global_step": 149632, "epoch": 1802} {"train_loss": -23.510679244995117, "global_step": 149633, "epoch": 1802} {"train_loss": -23.591136932373047, "global_step": 149634, "epoch": 1802} {"train_loss": -23.344135284423828, "global_step": 149635, "epoch": 1802} {"train_loss": -22.869810104370117, "global_step": 149636, "epoch": 1802} {"train_loss": -23.321401596069336, "global_step": 149637, "epoch": 1802} {"train_loss": -23.227338790893555, "global_step": 149638, "epoch": 1802} {"train_loss": -23.67928123474121, "global_step": 149639, "epoch": 1802} {"train_loss": -23.410160064697266, "global_step": 149640, "epoch": 1802} {"train_loss": -23.79025650024414, "global_step": 149641, "epoch": 1802} {"train_loss": -23.412208557128906, "global_step": 149642, "epoch": 1802} {"train_loss": -23.469482421875, "global_step": 149643, "epoch": 1802} {"train_loss": -23.385251998901367, "global_step": 149644, "epoch": 1802} {"train_loss": -23.223966598510742, "global_step": 149645, "epoch": 1802} {"train_loss": -23.24942398071289, "global_step": 149646, "epoch": 1802} {"train_loss": -23.654312133789062, "global_step": 149647, "epoch": 1802} {"train_loss": -23.10453603353845, "global_step": 149648, "epoch": 1802, "val_loss": 6355484.0} {"train_loss": -22.63596534729004, "global_step": 149649, "epoch": 1803} {"train_loss": -22.72721290588379, "global_step": 149650, "epoch": 1803} {"train_loss": -21.58497428894043, "global_step": 149651, "epoch": 1803} {"train_loss": -22.203018188476562, "global_step": 149652, "epoch": 1803} {"train_loss": -22.793188095092773, "global_step": 149653, "epoch": 1803} {"train_loss": -22.813114166259766, "global_step": 149654, "epoch": 1803} {"train_loss": -22.526899337768555, "global_step": 149655, "epoch": 1803} {"train_loss": -22.751066207885742, "global_step": 149656, "epoch": 1803} {"train_loss": -22.87019157409668, "global_step": 149657, "epoch": 1803} {"train_loss": -22.559741973876953, "global_step": 149658, "epoch": 1803} {"train_loss": -23.007959365844727, "global_step": 149659, "epoch": 1803} {"train_loss": -22.443435668945312, "global_step": 149660, "epoch": 1803} {"train_loss": -23.36203384399414, "global_step": 149661, "epoch": 1803} {"train_loss": -22.982877731323242, "global_step": 149662, "epoch": 1803} {"train_loss": -22.962383270263672, "global_step": 149663, "epoch": 1803} {"train_loss": -22.98210334777832, "global_step": 149664, "epoch": 1803} {"train_loss": -22.735088348388672, "global_step": 149665, "epoch": 1803} {"train_loss": -23.252777099609375, "global_step": 149666, "epoch": 1803} {"train_loss": -23.070524215698242, "global_step": 149667, "epoch": 1803} {"train_loss": -23.131488800048828, "global_step": 149668, "epoch": 1803} {"train_loss": -23.105148315429688, "global_step": 149669, "epoch": 1803} {"train_loss": -22.864316940307617, "global_step": 149670, "epoch": 1803} {"train_loss": -23.339710235595703, "global_step": 149671, "epoch": 1803} {"train_loss": -23.09592628479004, "global_step": 149672, "epoch": 1803} {"train_loss": -23.270231246948242, "global_step": 149673, "epoch": 1803} {"train_loss": -23.234310150146484, "global_step": 149674, "epoch": 1803} {"train_loss": -22.848297119140625, "global_step": 149675, "epoch": 1803} {"train_loss": -22.989564895629883, "global_step": 149676, "epoch": 1803} {"train_loss": -23.3407039642334, "global_step": 149677, "epoch": 1803} {"train_loss": -23.15455436706543, "global_step": 149678, "epoch": 1803} {"train_loss": -23.350725173950195, "global_step": 149679, "epoch": 1803} {"train_loss": -22.937406539916992, "global_step": 149680, "epoch": 1803} {"train_loss": -22.93756675720215, "global_step": 149681, "epoch": 1803} {"train_loss": -23.552001953125, "global_step": 149682, "epoch": 1803} {"train_loss": -23.053321838378906, "global_step": 149683, "epoch": 1803} {"train_loss": -22.90924644470215, "global_step": 149684, "epoch": 1803} {"train_loss": -23.132314682006836, "global_step": 149685, "epoch": 1803} {"train_loss": -23.394750595092773, "global_step": 149686, "epoch": 1803} {"train_loss": -22.95131492614746, "global_step": 149687, "epoch": 1803} {"train_loss": -23.07013511657715, "global_step": 149688, "epoch": 1803} {"train_loss": -23.553476333618164, "global_step": 149689, "epoch": 1803} {"train_loss": -23.235212326049805, "global_step": 149690, "epoch": 1803} {"train_loss": -23.26141357421875, "global_step": 149691, "epoch": 1803} {"train_loss": -23.605318069458008, "global_step": 149692, "epoch": 1803} {"train_loss": -22.923198699951172, "global_step": 149693, "epoch": 1803} {"train_loss": -23.3867244720459, "global_step": 149694, "epoch": 1803} {"train_loss": -23.330059051513672, "global_step": 149695, "epoch": 1803} {"train_loss": -23.65004539489746, "global_step": 149696, "epoch": 1803} {"train_loss": -23.30205726623535, "global_step": 149697, "epoch": 1803} {"train_loss": -23.296031951904297, "global_step": 149698, "epoch": 1803} {"train_loss": -23.43275260925293, "global_step": 149699, "epoch": 1803} {"train_loss": -23.205663681030273, "global_step": 149700, "epoch": 1803} {"train_loss": -23.413110733032227, "global_step": 149701, "epoch": 1803} {"train_loss": -23.333829879760742, "global_step": 149702, "epoch": 1803} {"train_loss": -23.589555740356445, "global_step": 149703, "epoch": 1803} {"train_loss": -23.269145965576172, "global_step": 149704, "epoch": 1803} {"train_loss": -23.489105224609375, "global_step": 149705, "epoch": 1803} {"train_loss": -23.288850784301758, "global_step": 149706, "epoch": 1803} {"train_loss": -23.45149040222168, "global_step": 149707, "epoch": 1803} {"train_loss": -23.12466049194336, "global_step": 149708, "epoch": 1803} {"train_loss": -23.24382972717285, "global_step": 149709, "epoch": 1803} {"train_loss": -23.123212814331055, "global_step": 149710, "epoch": 1803} {"train_loss": -23.114295959472656, "global_step": 149711, "epoch": 1803} {"train_loss": -23.118606567382812, "global_step": 149712, "epoch": 1803} {"train_loss": -23.675649642944336, "global_step": 149713, "epoch": 1803} {"train_loss": -23.343481063842773, "global_step": 149714, "epoch": 1803} {"train_loss": -23.501453399658203, "global_step": 149715, "epoch": 1803} {"train_loss": -22.96357536315918, "global_step": 149716, "epoch": 1803} {"train_loss": -23.2181339263916, "global_step": 149717, "epoch": 1803} {"train_loss": -23.273468017578125, "global_step": 149718, "epoch": 1803} {"train_loss": -23.280746459960938, "global_step": 149719, "epoch": 1803} {"train_loss": -23.33216667175293, "global_step": 149720, "epoch": 1803} {"train_loss": -23.335844039916992, "global_step": 149721, "epoch": 1803} {"train_loss": -23.25104331970215, "global_step": 149722, "epoch": 1803} {"train_loss": -23.36232566833496, "global_step": 149723, "epoch": 1803} {"train_loss": -23.224760055541992, "global_step": 149724, "epoch": 1803} {"train_loss": -22.999629974365234, "global_step": 149725, "epoch": 1803} {"train_loss": -23.204357147216797, "global_step": 149726, "epoch": 1803} {"train_loss": -23.45267677307129, "global_step": 149727, "epoch": 1803} {"train_loss": -23.512788772583008, "global_step": 149728, "epoch": 1803} {"train_loss": -23.35970115661621, "global_step": 149729, "epoch": 1803} {"train_loss": -23.341064453125, "global_step": 149730, "epoch": 1803} {"train_loss": -23.137330227587597, "global_step": 149731, "epoch": 1803, "val_loss": 6272444.0} {"train_loss": -22.789470672607422, "global_step": 149732, "epoch": 1804} {"train_loss": -22.826480865478516, "global_step": 149733, "epoch": 1804} {"train_loss": -23.10990333557129, "global_step": 149734, "epoch": 1804} {"train_loss": -23.339033126831055, "global_step": 149735, "epoch": 1804} {"train_loss": -23.00514030456543, "global_step": 149736, "epoch": 1804} {"train_loss": -23.155588150024414, "global_step": 149737, "epoch": 1804} {"train_loss": -23.242267608642578, "global_step": 149738, "epoch": 1804} {"train_loss": -23.05829429626465, "global_step": 149739, "epoch": 1804} {"train_loss": -23.3331241607666, "global_step": 149740, "epoch": 1804} {"train_loss": -23.15765953063965, "global_step": 149741, "epoch": 1804} {"train_loss": -23.71643829345703, "global_step": 149742, "epoch": 1804} {"train_loss": -23.111520767211914, "global_step": 149743, "epoch": 1804} {"train_loss": -23.12210464477539, "global_step": 149744, "epoch": 1804} {"train_loss": -23.019041061401367, "global_step": 149745, "epoch": 1804} {"train_loss": -23.062192916870117, "global_step": 149746, "epoch": 1804} {"train_loss": -23.228343963623047, "global_step": 149747, "epoch": 1804} {"train_loss": -23.498977661132812, "global_step": 149748, "epoch": 1804} {"train_loss": -23.065561294555664, "global_step": 149749, "epoch": 1804} {"train_loss": -23.329748153686523, "global_step": 149750, "epoch": 1804} {"train_loss": -23.29090118408203, "global_step": 149751, "epoch": 1804} {"train_loss": -23.143766403198242, "global_step": 149752, "epoch": 1804} {"train_loss": -23.137907028198242, "global_step": 149753, "epoch": 1804} {"train_loss": -23.190534591674805, "global_step": 149754, "epoch": 1804} {"train_loss": -23.333688735961914, "global_step": 149755, "epoch": 1804} {"train_loss": -23.075105667114258, "global_step": 149756, "epoch": 1804} {"train_loss": -23.060226440429688, "global_step": 149757, "epoch": 1804} {"train_loss": -23.33969497680664, "global_step": 149758, "epoch": 1804} {"train_loss": -23.409841537475586, "global_step": 149759, "epoch": 1804} {"train_loss": -23.166278839111328, "global_step": 149760, "epoch": 1804} {"train_loss": -23.111509323120117, "global_step": 149761, "epoch": 1804} {"train_loss": -22.8853816986084, "global_step": 149762, "epoch": 1804} {"train_loss": -23.323610305786133, "global_step": 149763, "epoch": 1804} {"train_loss": -22.950214385986328, "global_step": 149764, "epoch": 1804} {"train_loss": -23.17520523071289, "global_step": 149765, "epoch": 1804} {"train_loss": -23.435653686523438, "global_step": 149766, "epoch": 1804} {"train_loss": -23.291013717651367, "global_step": 149767, "epoch": 1804} {"train_loss": -23.37714195251465, "global_step": 149768, "epoch": 1804} {"train_loss": -23.07461166381836, "global_step": 149769, "epoch": 1804} {"train_loss": -23.581411361694336, "global_step": 149770, "epoch": 1804} {"train_loss": -23.37501335144043, "global_step": 149771, "epoch": 1804} {"train_loss": -23.26735496520996, "global_step": 149772, "epoch": 1804} {"train_loss": -23.341360092163086, "global_step": 149773, "epoch": 1804} {"train_loss": -23.598241806030273, "global_step": 149774, "epoch": 1804} {"train_loss": -23.48737335205078, "global_step": 149775, "epoch": 1804} {"train_loss": -23.59895133972168, "global_step": 149776, "epoch": 1804} {"train_loss": -23.01263999938965, "global_step": 149777, "epoch": 1804} {"train_loss": -23.44205665588379, "global_step": 149778, "epoch": 1804} {"train_loss": -22.74493408203125, "global_step": 149779, "epoch": 1804} {"train_loss": -23.24075698852539, "global_step": 149780, "epoch": 1804} {"train_loss": -23.071121215820312, "global_step": 149781, "epoch": 1804} {"train_loss": -23.294849395751953, "global_step": 149782, "epoch": 1804} {"train_loss": -23.486963272094727, "global_step": 149783, "epoch": 1804} {"train_loss": -23.413808822631836, "global_step": 149784, "epoch": 1804} {"train_loss": -22.978275299072266, "global_step": 149785, "epoch": 1804} {"train_loss": -23.71735382080078, "global_step": 149786, "epoch": 1804} {"train_loss": -23.531904220581055, "global_step": 149787, "epoch": 1804} {"train_loss": -23.227262496948242, "global_step": 149788, "epoch": 1804} {"train_loss": -22.951147079467773, "global_step": 149789, "epoch": 1804} {"train_loss": -23.229421615600586, "global_step": 149790, "epoch": 1804} {"train_loss": -23.105985641479492, "global_step": 149791, "epoch": 1804} {"train_loss": -23.283424377441406, "global_step": 149792, "epoch": 1804} {"train_loss": -23.11785316467285, "global_step": 149793, "epoch": 1804} {"train_loss": -22.80191993713379, "global_step": 149794, "epoch": 1804} {"train_loss": -23.15215301513672, "global_step": 149795, "epoch": 1804} {"train_loss": -22.97034454345703, "global_step": 149796, "epoch": 1804} {"train_loss": -23.17740821838379, "global_step": 149797, "epoch": 1804} {"train_loss": -23.5455379486084, "global_step": 149798, "epoch": 1804} {"train_loss": -23.02821922302246, "global_step": 149799, "epoch": 1804} {"train_loss": -23.36629295349121, "global_step": 149800, "epoch": 1804} {"train_loss": -23.32380485534668, "global_step": 149801, "epoch": 1804} {"train_loss": -23.123159408569336, "global_step": 149802, "epoch": 1804} {"train_loss": -23.212915420532227, "global_step": 149803, "epoch": 1804} {"train_loss": -23.05120849609375, "global_step": 149804, "epoch": 1804} {"train_loss": -23.10774040222168, "global_step": 149805, "epoch": 1804} {"train_loss": -22.93202781677246, "global_step": 149806, "epoch": 1804} {"train_loss": -23.166112899780273, "global_step": 149807, "epoch": 1804} {"train_loss": -23.371992111206055, "global_step": 149808, "epoch": 1804} {"train_loss": -23.425216674804688, "global_step": 149809, "epoch": 1804} {"train_loss": -23.291046142578125, "global_step": 149810, "epoch": 1804} {"train_loss": -23.068632125854492, "global_step": 149811, "epoch": 1804} {"train_loss": -23.249813079833984, "global_step": 149812, "epoch": 1804} {"train_loss": -23.532527923583984, "global_step": 149813, "epoch": 1804} {"train_loss": -23.213908988309193, "global_step": 149814, "epoch": 1804, "val_loss": 6419391.0} {"train_loss": -22.970020294189453, "global_step": 149815, "epoch": 1805} {"train_loss": -22.917957305908203, "global_step": 149816, "epoch": 1805} {"train_loss": -22.977920532226562, "global_step": 149817, "epoch": 1805} {"train_loss": -22.703786849975586, "global_step": 149818, "epoch": 1805} {"train_loss": -22.896963119506836, "global_step": 149819, "epoch": 1805} {"train_loss": -22.74598503112793, "global_step": 149820, "epoch": 1805} {"train_loss": -22.976285934448242, "global_step": 149821, "epoch": 1805} {"train_loss": -22.80946922302246, "global_step": 149822, "epoch": 1805} {"train_loss": -22.669870376586914, "global_step": 149823, "epoch": 1805} {"train_loss": -23.098215103149414, "global_step": 149824, "epoch": 1805} {"train_loss": -22.849628448486328, "global_step": 149825, "epoch": 1805} {"train_loss": -22.88336181640625, "global_step": 149826, "epoch": 1805} {"train_loss": -23.081329345703125, "global_step": 149827, "epoch": 1805} {"train_loss": -22.942045211791992, "global_step": 149828, "epoch": 1805} {"train_loss": -23.085050582885742, "global_step": 149829, "epoch": 1805} {"train_loss": -23.174428939819336, "global_step": 149830, "epoch": 1805} {"train_loss": -22.626850128173828, "global_step": 149831, "epoch": 1805} {"train_loss": -22.803770065307617, "global_step": 149832, "epoch": 1805} {"train_loss": -23.0885009765625, "global_step": 149833, "epoch": 1805} {"train_loss": -23.19696044921875, "global_step": 149834, "epoch": 1805} {"train_loss": -23.223501205444336, "global_step": 149835, "epoch": 1805} {"train_loss": -23.43439292907715, "global_step": 149836, "epoch": 1805} {"train_loss": -23.246049880981445, "global_step": 149837, "epoch": 1805} {"train_loss": -23.06610870361328, "global_step": 149838, "epoch": 1805} {"train_loss": -23.155109405517578, "global_step": 149839, "epoch": 1805} {"train_loss": -23.40765953063965, "global_step": 149840, "epoch": 1805} {"train_loss": -23.343355178833008, "global_step": 149841, "epoch": 1805} {"train_loss": -23.218036651611328, "global_step": 149842, "epoch": 1805} {"train_loss": -23.48978614807129, "global_step": 149843, "epoch": 1805} {"train_loss": -23.399946212768555, "global_step": 149844, "epoch": 1805} {"train_loss": -22.862295150756836, "global_step": 149845, "epoch": 1805} {"train_loss": -23.423236846923828, "global_step": 149846, "epoch": 1805} {"train_loss": -23.738534927368164, "global_step": 149847, "epoch": 1805} {"train_loss": -23.5415096282959, "global_step": 149848, "epoch": 1805} {"train_loss": -23.557769775390625, "global_step": 149849, "epoch": 1805} {"train_loss": -23.172576904296875, "global_step": 149850, "epoch": 1805} {"train_loss": -23.21773338317871, "global_step": 149851, "epoch": 1805} {"train_loss": -23.1973819732666, "global_step": 149852, "epoch": 1805} {"train_loss": -22.89381217956543, "global_step": 149853, "epoch": 1805} {"train_loss": -23.077396392822266, "global_step": 149854, "epoch": 1805} {"train_loss": -23.301725387573242, "global_step": 149855, "epoch": 1805} {"train_loss": -23.35593032836914, "global_step": 149856, "epoch": 1805} {"train_loss": -23.42469024658203, "global_step": 149857, "epoch": 1805} {"train_loss": -23.26483726501465, "global_step": 149858, "epoch": 1805} {"train_loss": -23.277286529541016, "global_step": 149859, "epoch": 1805} {"train_loss": -23.141809463500977, "global_step": 149860, "epoch": 1805} {"train_loss": -22.82925796508789, "global_step": 149861, "epoch": 1805} {"train_loss": -23.281789779663086, "global_step": 149862, "epoch": 1805} {"train_loss": -23.014982223510742, "global_step": 149863, "epoch": 1805} {"train_loss": -22.98894500732422, "global_step": 149864, "epoch": 1805} {"train_loss": -23.092721939086914, "global_step": 149865, "epoch": 1805} {"train_loss": -22.66781997680664, "global_step": 149866, "epoch": 1805} {"train_loss": -23.185163497924805, "global_step": 149867, "epoch": 1805} {"train_loss": -22.800268173217773, "global_step": 149868, "epoch": 1805} {"train_loss": -23.357240676879883, "global_step": 149869, "epoch": 1805} {"train_loss": -23.325504302978516, "global_step": 149870, "epoch": 1805} {"train_loss": -23.568710327148438, "global_step": 149871, "epoch": 1805} {"train_loss": -23.336835861206055, "global_step": 149872, "epoch": 1805} {"train_loss": -23.144710540771484, "global_step": 149873, "epoch": 1805} {"train_loss": -22.922840118408203, "global_step": 149874, "epoch": 1805} {"train_loss": -23.423002243041992, "global_step": 149875, "epoch": 1805} {"train_loss": -23.29534912109375, "global_step": 149876, "epoch": 1805} {"train_loss": -23.122278213500977, "global_step": 149877, "epoch": 1805} {"train_loss": -23.368467330932617, "global_step": 149878, "epoch": 1805} {"train_loss": -23.033613204956055, "global_step": 149879, "epoch": 1805} {"train_loss": -23.244169235229492, "global_step": 149880, "epoch": 1805} {"train_loss": -23.47133445739746, "global_step": 149881, "epoch": 1805} {"train_loss": -23.439910888671875, "global_step": 149882, "epoch": 1805} {"train_loss": -23.332019805908203, "global_step": 149883, "epoch": 1805} {"train_loss": -23.409631729125977, "global_step": 149884, "epoch": 1805} {"train_loss": -23.164152145385742, "global_step": 149885, "epoch": 1805} {"train_loss": -23.660165786743164, "global_step": 149886, "epoch": 1805} {"train_loss": -23.48105239868164, "global_step": 149887, "epoch": 1805} {"train_loss": -23.3581485748291, "global_step": 149888, "epoch": 1805} {"train_loss": -23.18596076965332, "global_step": 149889, "epoch": 1805} {"train_loss": -23.670873641967773, "global_step": 149890, "epoch": 1805} {"train_loss": -23.443666458129883, "global_step": 149891, "epoch": 1805} {"train_loss": -23.230871200561523, "global_step": 149892, "epoch": 1805} {"train_loss": -23.906993865966797, "global_step": 149893, "epoch": 1805} {"train_loss": -23.31788444519043, "global_step": 149894, "epoch": 1805} {"train_loss": -23.196487426757812, "global_step": 149895, "epoch": 1805} {"train_loss": -23.448993682861328, "global_step": 149896, "epoch": 1805} {"train_loss": -23.190923323114234, "global_step": 149897, "epoch": 1805, "val_loss": 6352877.0} {"train_loss": -22.910335540771484, "global_step": 149898, "epoch": 1806} {"train_loss": -22.7236270904541, "global_step": 149899, "epoch": 1806} {"train_loss": -22.854944229125977, "global_step": 149900, "epoch": 1806} {"train_loss": -23.089275360107422, "global_step": 149901, "epoch": 1806} {"train_loss": -23.005325317382812, "global_step": 149902, "epoch": 1806} {"train_loss": -22.439655303955078, "global_step": 149903, "epoch": 1806} {"train_loss": -22.700780868530273, "global_step": 149904, "epoch": 1806} {"train_loss": -23.06025505065918, "global_step": 149905, "epoch": 1806} {"train_loss": -22.983089447021484, "global_step": 149906, "epoch": 1806} {"train_loss": -22.611661911010742, "global_step": 149907, "epoch": 1806} {"train_loss": -22.846817016601562, "global_step": 149908, "epoch": 1806} {"train_loss": -23.189178466796875, "global_step": 149909, "epoch": 1806} {"train_loss": -22.59220314025879, "global_step": 149910, "epoch": 1806} {"train_loss": -22.89484214782715, "global_step": 149911, "epoch": 1806} {"train_loss": -23.00314712524414, "global_step": 149912, "epoch": 1806} {"train_loss": -23.26500701904297, "global_step": 149913, "epoch": 1806} {"train_loss": -22.674179077148438, "global_step": 149914, "epoch": 1806} {"train_loss": -23.240707397460938, "global_step": 149915, "epoch": 1806} {"train_loss": -23.273820877075195, "global_step": 149916, "epoch": 1806} {"train_loss": -22.98809814453125, "global_step": 149917, "epoch": 1806} {"train_loss": -22.94814109802246, "global_step": 149918, "epoch": 1806} {"train_loss": -23.49698257446289, "global_step": 149919, "epoch": 1806} {"train_loss": -23.039960861206055, "global_step": 149920, "epoch": 1806} {"train_loss": -22.7646484375, "global_step": 149921, "epoch": 1806} {"train_loss": -23.113584518432617, "global_step": 149922, "epoch": 1806} {"train_loss": -23.281675338745117, "global_step": 149923, "epoch": 1806} {"train_loss": -23.07747459411621, "global_step": 149924, "epoch": 1806} {"train_loss": -23.541091918945312, "global_step": 149925, "epoch": 1806} {"train_loss": -23.1422119140625, "global_step": 149926, "epoch": 1806} {"train_loss": -23.231168746948242, "global_step": 149927, "epoch": 1806} {"train_loss": -22.95557975769043, "global_step": 149928, "epoch": 1806} {"train_loss": -23.530702590942383, "global_step": 149929, "epoch": 1806} {"train_loss": -23.310531616210938, "global_step": 149930, "epoch": 1806} {"train_loss": -23.28156852722168, "global_step": 149931, "epoch": 1806} {"train_loss": -22.972917556762695, "global_step": 149932, "epoch": 1806} {"train_loss": -22.827234268188477, "global_step": 149933, "epoch": 1806} {"train_loss": -22.868179321289062, "global_step": 149934, "epoch": 1806} {"train_loss": -23.015472412109375, "global_step": 149935, "epoch": 1806} {"train_loss": -23.243886947631836, "global_step": 149936, "epoch": 1806} {"train_loss": -23.06884765625, "global_step": 149937, "epoch": 1806} {"train_loss": -23.559934616088867, "global_step": 149938, "epoch": 1806} {"train_loss": -23.153858184814453, "global_step": 149939, "epoch": 1806} {"train_loss": -23.232131958007812, "global_step": 149940, "epoch": 1806} {"train_loss": -23.149198532104492, "global_step": 149941, "epoch": 1806} {"train_loss": -23.372831344604492, "global_step": 149942, "epoch": 1806} {"train_loss": -23.179950714111328, "global_step": 149943, "epoch": 1806} {"train_loss": -23.48529815673828, "global_step": 149944, "epoch": 1806} {"train_loss": -22.80734634399414, "global_step": 149945, "epoch": 1806} {"train_loss": -23.45395278930664, "global_step": 149946, "epoch": 1806} {"train_loss": -23.194091796875, "global_step": 149947, "epoch": 1806} {"train_loss": -23.194232940673828, "global_step": 149948, "epoch": 1806} {"train_loss": -23.279653549194336, "global_step": 149949, "epoch": 1806} {"train_loss": -23.325387954711914, "global_step": 149950, "epoch": 1806} {"train_loss": -23.281034469604492, "global_step": 149951, "epoch": 1806} {"train_loss": -23.166645050048828, "global_step": 149952, "epoch": 1806} {"train_loss": -22.911344528198242, "global_step": 149953, "epoch": 1806} {"train_loss": -23.26458740234375, "global_step": 149954, "epoch": 1806} {"train_loss": -23.257787704467773, "global_step": 149955, "epoch": 1806} {"train_loss": -23.277587890625, "global_step": 149956, "epoch": 1806} {"train_loss": -23.10065269470215, "global_step": 149957, "epoch": 1806} {"train_loss": -23.38812828063965, "global_step": 149958, "epoch": 1806} {"train_loss": -22.860620498657227, "global_step": 149959, "epoch": 1806} {"train_loss": -23.298681259155273, "global_step": 149960, "epoch": 1806} {"train_loss": -23.352378845214844, "global_step": 149961, "epoch": 1806} {"train_loss": -23.630992889404297, "global_step": 149962, "epoch": 1806} {"train_loss": -23.1680908203125, "global_step": 149963, "epoch": 1806} {"train_loss": -23.288042068481445, "global_step": 149964, "epoch": 1806} {"train_loss": -23.36252212524414, "global_step": 149965, "epoch": 1806} {"train_loss": -23.475181579589844, "global_step": 149966, "epoch": 1806} {"train_loss": -23.75665283203125, "global_step": 149967, "epoch": 1806} {"train_loss": -23.245107650756836, "global_step": 149968, "epoch": 1806} {"train_loss": -23.188589096069336, "global_step": 149969, "epoch": 1806} {"train_loss": -23.210485458374023, "global_step": 149970, "epoch": 1806} {"train_loss": -23.206777572631836, "global_step": 149971, "epoch": 1806} {"train_loss": -23.15412712097168, "global_step": 149972, "epoch": 1806} {"train_loss": -23.018985748291016, "global_step": 149973, "epoch": 1806} {"train_loss": -23.140539169311523, "global_step": 149974, "epoch": 1806} {"train_loss": -23.23211097717285, "global_step": 149975, "epoch": 1806} {"train_loss": -23.358854293823242, "global_step": 149976, "epoch": 1806} {"train_loss": -23.338747024536133, "global_step": 149977, "epoch": 1806} {"train_loss": -23.228641510009766, "global_step": 149978, "epoch": 1806} {"train_loss": -23.66484260559082, "global_step": 149979, "epoch": 1806} {"train_loss": -23.168146455144306, "global_step": 149980, "epoch": 1806, "val_loss": 6447094.5} {"train_loss": -21.87335777282715, "global_step": 149981, "epoch": 1807} {"train_loss": -23.038883209228516, "global_step": 149982, "epoch": 1807} {"train_loss": -22.52236557006836, "global_step": 149983, "epoch": 1807} {"train_loss": -23.057382583618164, "global_step": 149984, "epoch": 1807} {"train_loss": -22.2756290435791, "global_step": 149985, "epoch": 1807} {"train_loss": -22.781930923461914, "global_step": 149986, "epoch": 1807} {"train_loss": -22.895227432250977, "global_step": 149987, "epoch": 1807} {"train_loss": -22.458091735839844, "global_step": 149988, "epoch": 1807} {"train_loss": -22.636022567749023, "global_step": 149989, "epoch": 1807} {"train_loss": -22.712766647338867, "global_step": 149990, "epoch": 1807} {"train_loss": -23.101438522338867, "global_step": 149991, "epoch": 1807} {"train_loss": -22.7288875579834, "global_step": 149992, "epoch": 1807} {"train_loss": -23.05942726135254, "global_step": 149993, "epoch": 1807} {"train_loss": -22.649423599243164, "global_step": 149994, "epoch": 1807} {"train_loss": -22.69106674194336, "global_step": 149995, "epoch": 1807} {"train_loss": -22.921207427978516, "global_step": 149996, "epoch": 1807} {"train_loss": -22.78328514099121, "global_step": 149997, "epoch": 1807} {"train_loss": -23.056509017944336, "global_step": 149998, "epoch": 1807} {"train_loss": -22.66549301147461, "global_step": 149999, "epoch": 1807} {"train_loss": -22.93274688720703, "global_step": 150000, "epoch": 1807} {"train_loss": -22.903913497924805, "global_step": 150001, "epoch": 1807} {"train_loss": -22.960294723510742, "global_step": 150002, "epoch": 1807} {"train_loss": -23.08513832092285, "global_step": 150003, "epoch": 1807} {"train_loss": -22.930160522460938, "global_step": 150004, "epoch": 1807} {"train_loss": -22.82728385925293, "global_step": 150005, "epoch": 1807} {"train_loss": -22.95362091064453, "global_step": 150006, "epoch": 1807} {"train_loss": -22.711536407470703, "global_step": 150007, "epoch": 1807} {"train_loss": -22.9841251373291, "global_step": 150008, "epoch": 1807} {"train_loss": -22.70635986328125, "global_step": 150009, "epoch": 1807} {"train_loss": -23.3630313873291, "global_step": 150010, "epoch": 1807} {"train_loss": -22.938779830932617, "global_step": 150011, "epoch": 1807} {"train_loss": -22.982563018798828, "global_step": 150012, "epoch": 1807} {"train_loss": -23.23975944519043, "global_step": 150013, "epoch": 1807} {"train_loss": -23.082727432250977, "global_step": 150014, "epoch": 1807} {"train_loss": -22.8736572265625, "global_step": 150015, "epoch": 1807} {"train_loss": -23.362144470214844, "global_step": 150016, "epoch": 1807} {"train_loss": -23.39113426208496, "global_step": 150017, "epoch": 1807} {"train_loss": -23.462995529174805, "global_step": 150018, "epoch": 1807} {"train_loss": -23.053068161010742, "global_step": 150019, "epoch": 1807} {"train_loss": -23.07964324951172, "global_step": 150020, "epoch": 1807} {"train_loss": -23.781919479370117, "global_step": 150021, "epoch": 1807} {"train_loss": -23.066625595092773, "global_step": 150022, "epoch": 1807} {"train_loss": -23.15395164489746, "global_step": 150023, "epoch": 1807} {"train_loss": -23.70790672302246, "global_step": 150024, "epoch": 1807} {"train_loss": -23.2855167388916, "global_step": 150025, "epoch": 1807} {"train_loss": -23.263322830200195, "global_step": 150026, "epoch": 1807} {"train_loss": -23.226917266845703, "global_step": 150027, "epoch": 1807} {"train_loss": -23.595428466796875, "global_step": 150028, "epoch": 1807} {"train_loss": -23.307336807250977, "global_step": 150029, "epoch": 1807} {"train_loss": -23.221481323242188, "global_step": 150030, "epoch": 1807} {"train_loss": -23.317323684692383, "global_step": 150031, "epoch": 1807} {"train_loss": -23.551755905151367, "global_step": 150032, "epoch": 1807} {"train_loss": -23.41255760192871, "global_step": 150033, "epoch": 1807} {"train_loss": -23.165374755859375, "global_step": 150034, "epoch": 1807} {"train_loss": -23.411664962768555, "global_step": 150035, "epoch": 1807} {"train_loss": -23.547103881835938, "global_step": 150036, "epoch": 1807} {"train_loss": -23.285680770874023, "global_step": 150037, "epoch": 1807} {"train_loss": -23.44161033630371, "global_step": 150038, "epoch": 1807} {"train_loss": -22.983694076538086, "global_step": 150039, "epoch": 1807} {"train_loss": -23.426254272460938, "global_step": 150040, "epoch": 1807} {"train_loss": -23.552143096923828, "global_step": 150041, "epoch": 1807} {"train_loss": -23.484060287475586, "global_step": 150042, "epoch": 1807} {"train_loss": -23.762723922729492, "global_step": 150043, "epoch": 1807} {"train_loss": -23.712085723876953, "global_step": 150044, "epoch": 1807} {"train_loss": -23.611675262451172, "global_step": 150045, "epoch": 1807} {"train_loss": -23.55009651184082, "global_step": 150046, "epoch": 1807} {"train_loss": -23.562339782714844, "global_step": 150047, "epoch": 1807} {"train_loss": -23.351581573486328, "global_step": 150048, "epoch": 1807} {"train_loss": -22.88449478149414, "global_step": 150049, "epoch": 1807} {"train_loss": -23.491811752319336, "global_step": 150050, "epoch": 1807} {"train_loss": -23.51995849609375, "global_step": 150051, "epoch": 1807} {"train_loss": -23.28585433959961, "global_step": 150052, "epoch": 1807} {"train_loss": -22.98468017578125, "global_step": 150053, "epoch": 1807} {"train_loss": -23.074010848999023, "global_step": 150054, "epoch": 1807} {"train_loss": -23.323917388916016, "global_step": 150055, "epoch": 1807} {"train_loss": -23.257619857788086, "global_step": 150056, "epoch": 1807} {"train_loss": -23.39336585998535, "global_step": 150057, "epoch": 1807} {"train_loss": -23.537450790405273, "global_step": 150058, "epoch": 1807} {"train_loss": -23.178985595703125, "global_step": 150059, "epoch": 1807} {"train_loss": -23.046785354614258, "global_step": 150060, "epoch": 1807} {"train_loss": -23.533483505249023, "global_step": 150061, "epoch": 1807} {"train_loss": -23.379358291625977, "global_step": 150062, "epoch": 1807} {"train_loss": -23.140893292714313, "global_step": 150063, "epoch": 1807, "val_loss": 6362806.0} {"train_loss": -22.906469345092773, "global_step": 150064, "epoch": 1808} {"train_loss": -23.134122848510742, "global_step": 150065, "epoch": 1808} {"train_loss": -23.296722412109375, "global_step": 150066, "epoch": 1808} {"train_loss": -22.98238182067871, "global_step": 150067, "epoch": 1808} {"train_loss": -22.821557998657227, "global_step": 150068, "epoch": 1808} {"train_loss": -22.892364501953125, "global_step": 150069, "epoch": 1808} {"train_loss": -22.859357833862305, "global_step": 150070, "epoch": 1808} {"train_loss": -23.00554847717285, "global_step": 150071, "epoch": 1808} {"train_loss": -23.322494506835938, "global_step": 150072, "epoch": 1808} {"train_loss": -23.101694107055664, "global_step": 150073, "epoch": 1808} {"train_loss": -23.100736618041992, "global_step": 150074, "epoch": 1808} {"train_loss": -23.34079933166504, "global_step": 150075, "epoch": 1808} {"train_loss": -23.080110549926758, "global_step": 150076, "epoch": 1808} {"train_loss": -23.07562828063965, "global_step": 150077, "epoch": 1808} {"train_loss": -23.35775375366211, "global_step": 150078, "epoch": 1808} {"train_loss": -23.392356872558594, "global_step": 150079, "epoch": 1808} {"train_loss": -23.252016067504883, "global_step": 150080, "epoch": 1808} {"train_loss": -23.29998016357422, "global_step": 150081, "epoch": 1808} {"train_loss": -23.30726432800293, "global_step": 150082, "epoch": 1808} {"train_loss": -23.301218032836914, "global_step": 150083, "epoch": 1808} {"train_loss": -23.161840438842773, "global_step": 150084, "epoch": 1808} {"train_loss": -23.346643447875977, "global_step": 150085, "epoch": 1808} {"train_loss": -23.184728622436523, "global_step": 150086, "epoch": 1808} {"train_loss": -23.405736923217773, "global_step": 150087, "epoch": 1808} {"train_loss": -23.412643432617188, "global_step": 150088, "epoch": 1808} {"train_loss": -23.293869018554688, "global_step": 150089, "epoch": 1808} {"train_loss": -23.639978408813477, "global_step": 150090, "epoch": 1808} {"train_loss": -23.025659561157227, "global_step": 150091, "epoch": 1808} {"train_loss": -23.205739974975586, "global_step": 150092, "epoch": 1808} {"train_loss": -23.719022750854492, "global_step": 150093, "epoch": 1808} {"train_loss": -23.542259216308594, "global_step": 150094, "epoch": 1808} {"train_loss": -23.302722930908203, "global_step": 150095, "epoch": 1808} {"train_loss": -23.140241622924805, "global_step": 150096, "epoch": 1808} {"train_loss": -23.37221336364746, "global_step": 150097, "epoch": 1808} {"train_loss": -23.578794479370117, "global_step": 150098, "epoch": 1808} {"train_loss": -23.18679428100586, "global_step": 150099, "epoch": 1808} {"train_loss": -23.109296798706055, "global_step": 150100, "epoch": 1808} {"train_loss": -23.106626510620117, "global_step": 150101, "epoch": 1808} {"train_loss": -23.17317008972168, "global_step": 150102, "epoch": 1808} {"train_loss": -23.307937622070312, "global_step": 150103, "epoch": 1808} {"train_loss": -23.408966064453125, "global_step": 150104, "epoch": 1808} {"train_loss": -22.55144691467285, "global_step": 150105, "epoch": 1808} {"train_loss": -23.195459365844727, "global_step": 150106, "epoch": 1808} {"train_loss": -23.325469970703125, "global_step": 150107, "epoch": 1808} {"train_loss": -22.955656051635742, "global_step": 150108, "epoch": 1808} {"train_loss": -23.44944190979004, "global_step": 150109, "epoch": 1808} {"train_loss": -23.45706558227539, "global_step": 150110, "epoch": 1808} {"train_loss": -23.30423355102539, "global_step": 150111, "epoch": 1808} {"train_loss": -23.16685676574707, "global_step": 150112, "epoch": 1808} {"train_loss": -23.455862045288086, "global_step": 150113, "epoch": 1808} {"train_loss": -23.261198043823242, "global_step": 150114, "epoch": 1808} {"train_loss": -23.328893661499023, "global_step": 150115, "epoch": 1808} {"train_loss": -23.05562400817871, "global_step": 150116, "epoch": 1808} {"train_loss": -23.348129272460938, "global_step": 150117, "epoch": 1808} {"train_loss": -23.35188102722168, "global_step": 150118, "epoch": 1808} {"train_loss": -23.393789291381836, "global_step": 150119, "epoch": 1808} {"train_loss": -23.414833068847656, "global_step": 150120, "epoch": 1808} {"train_loss": -23.566837310791016, "global_step": 150121, "epoch": 1808} {"train_loss": -23.179834365844727, "global_step": 150122, "epoch": 1808} {"train_loss": -22.87705421447754, "global_step": 150123, "epoch": 1808} {"train_loss": -23.379364013671875, "global_step": 150124, "epoch": 1808} {"train_loss": -23.339567184448242, "global_step": 150125, "epoch": 1808} {"train_loss": -22.96733856201172, "global_step": 150126, "epoch": 1808} {"train_loss": -23.615026473999023, "global_step": 150127, "epoch": 1808} {"train_loss": -23.258020401000977, "global_step": 150128, "epoch": 1808} {"train_loss": -23.095378875732422, "global_step": 150129, "epoch": 1808} {"train_loss": -23.409133911132812, "global_step": 150130, "epoch": 1808} {"train_loss": -24.05803871154785, "global_step": 150131, "epoch": 1808} {"train_loss": -23.270553588867188, "global_step": 150132, "epoch": 1808} {"train_loss": -23.741474151611328, "global_step": 150133, "epoch": 1808} {"train_loss": -23.37289810180664, "global_step": 150134, "epoch": 1808} {"train_loss": -23.22162437438965, "global_step": 150135, "epoch": 1808} {"train_loss": -23.141592025756836, "global_step": 150136, "epoch": 1808} {"train_loss": -23.068622589111328, "global_step": 150137, "epoch": 1808} {"train_loss": -23.26463508605957, "global_step": 150138, "epoch": 1808} {"train_loss": -23.687963485717773, "global_step": 150139, "epoch": 1808} {"train_loss": -23.281522750854492, "global_step": 150140, "epoch": 1808} {"train_loss": -23.322357177734375, "global_step": 150141, "epoch": 1808} {"train_loss": -23.283681869506836, "global_step": 150142, "epoch": 1808} {"train_loss": -23.490650177001953, "global_step": 150143, "epoch": 1808} {"train_loss": -23.325695037841797, "global_step": 150144, "epoch": 1808} {"train_loss": -23.10799217224121, "global_step": 150145, "epoch": 1808} {"train_loss": -23.256065782294215, "global_step": 150146, "epoch": 1808, "val_loss": 6318863.0} {"train_loss": -22.9842472076416, "global_step": 150147, "epoch": 1809} {"train_loss": -23.1002254486084, "global_step": 150148, "epoch": 1809} {"train_loss": -23.516305923461914, "global_step": 150149, "epoch": 1809} {"train_loss": -23.141971588134766, "global_step": 150150, "epoch": 1809} {"train_loss": -23.4799861907959, "global_step": 150151, "epoch": 1809} {"train_loss": -22.690753936767578, "global_step": 150152, "epoch": 1809} {"train_loss": -23.002592086791992, "global_step": 150153, "epoch": 1809} {"train_loss": -23.165491104125977, "global_step": 150154, "epoch": 1809} {"train_loss": -23.163345336914062, "global_step": 150155, "epoch": 1809} {"train_loss": -22.592863082885742, "global_step": 150156, "epoch": 1809} {"train_loss": -23.38238525390625, "global_step": 150157, "epoch": 1809} {"train_loss": -23.206911087036133, "global_step": 150158, "epoch": 1809} {"train_loss": -23.52182960510254, "global_step": 150159, "epoch": 1809} {"train_loss": -23.360456466674805, "global_step": 150160, "epoch": 1809} {"train_loss": -23.53377342224121, "global_step": 150161, "epoch": 1809} {"train_loss": -23.354461669921875, "global_step": 150162, "epoch": 1809} {"train_loss": -23.216703414916992, "global_step": 150163, "epoch": 1809} {"train_loss": -23.24873161315918, "global_step": 150164, "epoch": 1809} {"train_loss": -23.363704681396484, "global_step": 150165, "epoch": 1809} {"train_loss": -23.18451499938965, "global_step": 150166, "epoch": 1809} {"train_loss": -23.2008056640625, "global_step": 150167, "epoch": 1809} {"train_loss": -23.259632110595703, "global_step": 150168, "epoch": 1809} {"train_loss": -23.368255615234375, "global_step": 150169, "epoch": 1809} {"train_loss": -23.410846710205078, "global_step": 150170, "epoch": 1809} {"train_loss": -23.2613468170166, "global_step": 150171, "epoch": 1809} {"train_loss": -22.94490623474121, "global_step": 150172, "epoch": 1809} {"train_loss": -23.108844757080078, "global_step": 150173, "epoch": 1809} {"train_loss": -23.21316909790039, "global_step": 150174, "epoch": 1809} {"train_loss": -23.60452651977539, "global_step": 150175, "epoch": 1809} {"train_loss": -23.46181869506836, "global_step": 150176, "epoch": 1809} {"train_loss": -23.33722496032715, "global_step": 150177, "epoch": 1809} {"train_loss": -23.42418098449707, "global_step": 150178, "epoch": 1809} {"train_loss": -23.258316040039062, "global_step": 150179, "epoch": 1809} {"train_loss": -22.9759578704834, "global_step": 150180, "epoch": 1809} {"train_loss": -23.19363784790039, "global_step": 150181, "epoch": 1809} {"train_loss": -23.445499420166016, "global_step": 150182, "epoch": 1809} {"train_loss": -23.42561912536621, "global_step": 150183, "epoch": 1809} {"train_loss": -23.439992904663086, "global_step": 150184, "epoch": 1809} {"train_loss": -23.370817184448242, "global_step": 150185, "epoch": 1809} {"train_loss": -23.362817764282227, "global_step": 150186, "epoch": 1809} {"train_loss": -22.922876358032227, "global_step": 150187, "epoch": 1809} {"train_loss": -23.24543571472168, "global_step": 150188, "epoch": 1809} {"train_loss": -23.528797149658203, "global_step": 150189, "epoch": 1809} {"train_loss": -23.3457088470459, "global_step": 150190, "epoch": 1809} {"train_loss": -23.04012107849121, "global_step": 150191, "epoch": 1809} {"train_loss": -23.236188888549805, "global_step": 150192, "epoch": 1809} {"train_loss": -23.224363327026367, "global_step": 150193, "epoch": 1809} {"train_loss": -23.4859619140625, "global_step": 150194, "epoch": 1809} {"train_loss": -23.66575050354004, "global_step": 150195, "epoch": 1809} {"train_loss": -23.220487594604492, "global_step": 150196, "epoch": 1809} {"train_loss": -23.316362380981445, "global_step": 150197, "epoch": 1809} {"train_loss": -23.296634674072266, "global_step": 150198, "epoch": 1809} {"train_loss": -23.086044311523438, "global_step": 150199, "epoch": 1809} {"train_loss": -23.366952896118164, "global_step": 150200, "epoch": 1809} {"train_loss": -23.433008193969727, "global_step": 150201, "epoch": 1809} {"train_loss": -23.198415756225586, "global_step": 150202, "epoch": 1809} {"train_loss": -23.627840042114258, "global_step": 150203, "epoch": 1809} {"train_loss": -23.293811798095703, "global_step": 150204, "epoch": 1809} {"train_loss": -23.40028190612793, "global_step": 150205, "epoch": 1809} {"train_loss": -23.412614822387695, "global_step": 150206, "epoch": 1809} {"train_loss": -23.214048385620117, "global_step": 150207, "epoch": 1809} {"train_loss": -23.51961326599121, "global_step": 150208, "epoch": 1809} {"train_loss": -23.094491958618164, "global_step": 150209, "epoch": 1809} {"train_loss": -22.633588790893555, "global_step": 150210, "epoch": 1809} {"train_loss": -23.595544815063477, "global_step": 150211, "epoch": 1809} {"train_loss": -23.078786849975586, "global_step": 150212, "epoch": 1809} {"train_loss": -23.17719078063965, "global_step": 150213, "epoch": 1809} {"train_loss": -22.97479820251465, "global_step": 150214, "epoch": 1809} {"train_loss": -22.83002281188965, "global_step": 150215, "epoch": 1809} {"train_loss": -23.103748321533203, "global_step": 150216, "epoch": 1809} {"train_loss": -23.013999938964844, "global_step": 150217, "epoch": 1809} {"train_loss": -23.118484497070312, "global_step": 150218, "epoch": 1809} {"train_loss": -23.170881271362305, "global_step": 150219, "epoch": 1809} {"train_loss": -22.992643356323242, "global_step": 150220, "epoch": 1809} {"train_loss": -23.499414443969727, "global_step": 150221, "epoch": 1809} {"train_loss": -23.141433715820312, "global_step": 150222, "epoch": 1809} {"train_loss": -23.032575607299805, "global_step": 150223, "epoch": 1809} {"train_loss": -23.453672409057617, "global_step": 150224, "epoch": 1809} {"train_loss": -23.267425537109375, "global_step": 150225, "epoch": 1809} {"train_loss": -22.788074493408203, "global_step": 150226, "epoch": 1809} {"train_loss": -23.247493743896484, "global_step": 150227, "epoch": 1809} {"train_loss": -23.43558692932129, "global_step": 150228, "epoch": 1809} {"train_loss": -23.23931822719344, "global_step": 150229, "epoch": 1809, "val_loss": 6313586.5} {"train_loss": -21.945632934570312, "global_step": 150230, "epoch": 1810} {"train_loss": -22.324993133544922, "global_step": 150231, "epoch": 1810} {"train_loss": -22.50840950012207, "global_step": 150232, "epoch": 1810} {"train_loss": -22.401212692260742, "global_step": 150233, "epoch": 1810} {"train_loss": -22.351499557495117, "global_step": 150234, "epoch": 1810} {"train_loss": -22.9001407623291, "global_step": 150235, "epoch": 1810} {"train_loss": -22.70279312133789, "global_step": 150236, "epoch": 1810} {"train_loss": -22.589141845703125, "global_step": 150237, "epoch": 1810} {"train_loss": -23.02225685119629, "global_step": 150238, "epoch": 1810} {"train_loss": -22.794971466064453, "global_step": 150239, "epoch": 1810} {"train_loss": -22.72297477722168, "global_step": 150240, "epoch": 1810} {"train_loss": -22.653671264648438, "global_step": 150241, "epoch": 1810} {"train_loss": -22.895938873291016, "global_step": 150242, "epoch": 1810} {"train_loss": -22.68499183654785, "global_step": 150243, "epoch": 1810} {"train_loss": -22.67403793334961, "global_step": 150244, "epoch": 1810} {"train_loss": -22.779748916625977, "global_step": 150245, "epoch": 1810} {"train_loss": -23.227821350097656, "global_step": 150246, "epoch": 1810} {"train_loss": -23.318073272705078, "global_step": 150247, "epoch": 1810} {"train_loss": -22.846792221069336, "global_step": 150248, "epoch": 1810} {"train_loss": -22.92799186706543, "global_step": 150249, "epoch": 1810} {"train_loss": -22.52692222595215, "global_step": 150250, "epoch": 1810} {"train_loss": -23.189146041870117, "global_step": 150251, "epoch": 1810} {"train_loss": -23.3422794342041, "global_step": 150252, "epoch": 1810} {"train_loss": -23.440776824951172, "global_step": 150253, "epoch": 1810} {"train_loss": -22.991857528686523, "global_step": 150254, "epoch": 1810} {"train_loss": -22.96958351135254, "global_step": 150255, "epoch": 1810} {"train_loss": -23.3951416015625, "global_step": 150256, "epoch": 1810} {"train_loss": -23.0722713470459, "global_step": 150257, "epoch": 1810} {"train_loss": -23.32950210571289, "global_step": 150258, "epoch": 1810} {"train_loss": -23.0074462890625, "global_step": 150259, "epoch": 1810} {"train_loss": -23.3848819732666, "global_step": 150260, "epoch": 1810} {"train_loss": -23.00271224975586, "global_step": 150261, "epoch": 1810} {"train_loss": -23.29677391052246, "global_step": 150262, "epoch": 1810} {"train_loss": -22.835325241088867, "global_step": 150263, "epoch": 1810} {"train_loss": -23.6981201171875, "global_step": 150264, "epoch": 1810} {"train_loss": -23.287031173706055, "global_step": 150265, "epoch": 1810} {"train_loss": -23.5903263092041, "global_step": 150266, "epoch": 1810} {"train_loss": -23.52261734008789, "global_step": 150267, "epoch": 1810} {"train_loss": -23.572751998901367, "global_step": 150268, "epoch": 1810} {"train_loss": -23.637428283691406, "global_step": 150269, "epoch": 1810} {"train_loss": -23.229251861572266, "global_step": 150270, "epoch": 1810} {"train_loss": -23.642070770263672, "global_step": 150271, "epoch": 1810} {"train_loss": -23.27981185913086, "global_step": 150272, "epoch": 1810} {"train_loss": -23.67732810974121, "global_step": 150273, "epoch": 1810} {"train_loss": -23.228437423706055, "global_step": 150274, "epoch": 1810} {"train_loss": -22.951810836791992, "global_step": 150275, "epoch": 1810} {"train_loss": -23.534780502319336, "global_step": 150276, "epoch": 1810} {"train_loss": -23.271888732910156, "global_step": 150277, "epoch": 1810} {"train_loss": -23.269821166992188, "global_step": 150278, "epoch": 1810} {"train_loss": -23.50583839416504, "global_step": 150279, "epoch": 1810} {"train_loss": -23.170896530151367, "global_step": 150280, "epoch": 1810} {"train_loss": -23.344449996948242, "global_step": 150281, "epoch": 1810} {"train_loss": -23.450389862060547, "global_step": 150282, "epoch": 1810} {"train_loss": -23.570756912231445, "global_step": 150283, "epoch": 1810} {"train_loss": -23.18760108947754, "global_step": 150284, "epoch": 1810} {"train_loss": -23.068578720092773, "global_step": 150285, "epoch": 1810} {"train_loss": -23.784460067749023, "global_step": 150286, "epoch": 1810} {"train_loss": -23.045658111572266, "global_step": 150287, "epoch": 1810} {"train_loss": -22.91739845275879, "global_step": 150288, "epoch": 1810} {"train_loss": -23.448280334472656, "global_step": 150289, "epoch": 1810} {"train_loss": -23.5627384185791, "global_step": 150290, "epoch": 1810} {"train_loss": -23.980667114257812, "global_step": 150291, "epoch": 1810} {"train_loss": -23.406463623046875, "global_step": 150292, "epoch": 1810} {"train_loss": -23.034311294555664, "global_step": 150293, "epoch": 1810} {"train_loss": -23.05255126953125, "global_step": 150294, "epoch": 1810} {"train_loss": -23.445737838745117, "global_step": 150295, "epoch": 1810} {"train_loss": -23.3448543548584, "global_step": 150296, "epoch": 1810} {"train_loss": -23.166650772094727, "global_step": 150297, "epoch": 1810} {"train_loss": -23.274063110351562, "global_step": 150298, "epoch": 1810} {"train_loss": -23.395212173461914, "global_step": 150299, "epoch": 1810} {"train_loss": -23.374801635742188, "global_step": 150300, "epoch": 1810} {"train_loss": -23.297931671142578, "global_step": 150301, "epoch": 1810} {"train_loss": -23.581968307495117, "global_step": 150302, "epoch": 1810} {"train_loss": -23.30609130859375, "global_step": 150303, "epoch": 1810} {"train_loss": -23.428024291992188, "global_step": 150304, "epoch": 1810} {"train_loss": -23.388935089111328, "global_step": 150305, "epoch": 1810} {"train_loss": -22.833431243896484, "global_step": 150306, "epoch": 1810} {"train_loss": -23.38650131225586, "global_step": 150307, "epoch": 1810} {"train_loss": -23.321332931518555, "global_step": 150308, "epoch": 1810} {"train_loss": -23.002965927124023, "global_step": 150309, "epoch": 1810} {"train_loss": -23.116809844970703, "global_step": 150310, "epoch": 1810} {"train_loss": -23.620176315307617, "global_step": 150311, "epoch": 1810} {"train_loss": -23.16093435632177, "global_step": 150312, "epoch": 1810, "val_loss": 6445781.5} {"train_loss": -22.583913803100586, "global_step": 150313, "epoch": 1811} {"train_loss": -22.6226806640625, "global_step": 150314, "epoch": 1811} {"train_loss": -22.37154197692871, "global_step": 150315, "epoch": 1811} {"train_loss": -22.94211769104004, "global_step": 150316, "epoch": 1811} {"train_loss": -22.58408546447754, "global_step": 150317, "epoch": 1811} {"train_loss": -23.1639404296875, "global_step": 150318, "epoch": 1811} {"train_loss": -22.40009117126465, "global_step": 150319, "epoch": 1811} {"train_loss": -22.68942642211914, "global_step": 150320, "epoch": 1811} {"train_loss": -22.579383850097656, "global_step": 150321, "epoch": 1811} {"train_loss": -22.868865966796875, "global_step": 150322, "epoch": 1811} {"train_loss": -22.950103759765625, "global_step": 150323, "epoch": 1811} {"train_loss": -22.62997055053711, "global_step": 150324, "epoch": 1811} {"train_loss": -22.482709884643555, "global_step": 150325, "epoch": 1811} {"train_loss": -22.523242950439453, "global_step": 150326, "epoch": 1811} {"train_loss": -22.744293212890625, "global_step": 150327, "epoch": 1811} {"train_loss": -23.0957088470459, "global_step": 150328, "epoch": 1811} {"train_loss": -23.095489501953125, "global_step": 150329, "epoch": 1811} {"train_loss": -22.73028564453125, "global_step": 150330, "epoch": 1811} {"train_loss": -23.006956100463867, "global_step": 150331, "epoch": 1811} {"train_loss": -22.704544067382812, "global_step": 150332, "epoch": 1811} {"train_loss": -23.00909996032715, "global_step": 150333, "epoch": 1811} {"train_loss": -23.384292602539062, "global_step": 150334, "epoch": 1811} {"train_loss": -23.2916259765625, "global_step": 150335, "epoch": 1811} {"train_loss": -23.40589714050293, "global_step": 150336, "epoch": 1811} {"train_loss": -22.76594352722168, "global_step": 150337, "epoch": 1811} {"train_loss": -22.958404541015625, "global_step": 150338, "epoch": 1811} {"train_loss": -23.36619758605957, "global_step": 150339, "epoch": 1811} {"train_loss": -23.370534896850586, "global_step": 150340, "epoch": 1811} {"train_loss": -23.126405715942383, "global_step": 150341, "epoch": 1811} {"train_loss": -23.0435848236084, "global_step": 150342, "epoch": 1811} {"train_loss": -23.323938369750977, "global_step": 150343, "epoch": 1811} {"train_loss": -23.224836349487305, "global_step": 150344, "epoch": 1811} {"train_loss": -23.515356063842773, "global_step": 150345, "epoch": 1811} {"train_loss": -23.416461944580078, "global_step": 150346, "epoch": 1811} {"train_loss": -23.197467803955078, "global_step": 150347, "epoch": 1811} {"train_loss": -23.199283599853516, "global_step": 150348, "epoch": 1811} {"train_loss": -23.508634567260742, "global_step": 150349, "epoch": 1811} {"train_loss": -23.092737197875977, "global_step": 150350, "epoch": 1811} {"train_loss": -23.30582046508789, "global_step": 150351, "epoch": 1811} {"train_loss": -23.073232650756836, "global_step": 150352, "epoch": 1811} {"train_loss": -23.625547409057617, "global_step": 150353, "epoch": 1811} {"train_loss": -23.50315284729004, "global_step": 150354, "epoch": 1811} {"train_loss": -23.489240646362305, "global_step": 150355, "epoch": 1811} {"train_loss": -23.153949737548828, "global_step": 150356, "epoch": 1811} {"train_loss": -23.23469352722168, "global_step": 150357, "epoch": 1811} {"train_loss": -23.40143585205078, "global_step": 150358, "epoch": 1811} {"train_loss": -23.264389038085938, "global_step": 150359, "epoch": 1811} {"train_loss": -23.30573081970215, "global_step": 150360, "epoch": 1811} {"train_loss": -23.492246627807617, "global_step": 150361, "epoch": 1811} {"train_loss": -23.418378829956055, "global_step": 150362, "epoch": 1811} {"train_loss": -23.219533920288086, "global_step": 150363, "epoch": 1811} {"train_loss": -23.279220581054688, "global_step": 150364, "epoch": 1811} {"train_loss": -23.54956817626953, "global_step": 150365, "epoch": 1811} {"train_loss": -23.24567222595215, "global_step": 150366, "epoch": 1811} {"train_loss": -23.173261642456055, "global_step": 150367, "epoch": 1811} {"train_loss": -22.964487075805664, "global_step": 150368, "epoch": 1811} {"train_loss": -23.73689079284668, "global_step": 150369, "epoch": 1811} {"train_loss": -22.842470169067383, "global_step": 150370, "epoch": 1811} {"train_loss": -23.437166213989258, "global_step": 150371, "epoch": 1811} {"train_loss": -23.190969467163086, "global_step": 150372, "epoch": 1811} {"train_loss": -23.54621124267578, "global_step": 150373, "epoch": 1811} {"train_loss": -23.383302688598633, "global_step": 150374, "epoch": 1811} {"train_loss": -22.879697799682617, "global_step": 150375, "epoch": 1811} {"train_loss": -23.401016235351562, "global_step": 150376, "epoch": 1811} {"train_loss": -23.116348266601562, "global_step": 150377, "epoch": 1811} {"train_loss": -23.513500213623047, "global_step": 150378, "epoch": 1811} {"train_loss": -23.336713790893555, "global_step": 150379, "epoch": 1811} {"train_loss": -23.1569766998291, "global_step": 150380, "epoch": 1811} {"train_loss": -23.108234405517578, "global_step": 150381, "epoch": 1811} {"train_loss": -23.020578384399414, "global_step": 150382, "epoch": 1811} {"train_loss": -23.102209091186523, "global_step": 150383, "epoch": 1811} {"train_loss": -22.795774459838867, "global_step": 150384, "epoch": 1811} {"train_loss": -23.27535057067871, "global_step": 150385, "epoch": 1811} {"train_loss": -23.324748992919922, "global_step": 150386, "epoch": 1811} {"train_loss": -23.397241592407227, "global_step": 150387, "epoch": 1811} {"train_loss": -23.07908821105957, "global_step": 150388, "epoch": 1811} {"train_loss": -23.088499069213867, "global_step": 150389, "epoch": 1811} {"train_loss": -23.218175888061523, "global_step": 150390, "epoch": 1811} {"train_loss": -23.116924285888672, "global_step": 150391, "epoch": 1811} {"train_loss": -23.38755226135254, "global_step": 150392, "epoch": 1811} {"train_loss": -23.672321319580078, "global_step": 150393, "epoch": 1811} {"train_loss": -23.2159481048584, "global_step": 150394, "epoch": 1811} {"train_loss": -23.12095083673316, "global_step": 150395, "epoch": 1811, "val_loss": 6265851.0} {"train_loss": -22.976049423217773, "global_step": 150396, "epoch": 1812} {"train_loss": -22.961877822875977, "global_step": 150397, "epoch": 1812} {"train_loss": -23.26125144958496, "global_step": 150398, "epoch": 1812} {"train_loss": -22.7227840423584, "global_step": 150399, "epoch": 1812} {"train_loss": -22.827392578125, "global_step": 150400, "epoch": 1812} {"train_loss": -22.75200843811035, "global_step": 150401, "epoch": 1812} {"train_loss": -22.943710327148438, "global_step": 150402, "epoch": 1812} {"train_loss": -22.964101791381836, "global_step": 150403, "epoch": 1812} {"train_loss": -23.095617294311523, "global_step": 150404, "epoch": 1812} {"train_loss": -22.810781478881836, "global_step": 150405, "epoch": 1812} {"train_loss": -22.983142852783203, "global_step": 150406, "epoch": 1812} {"train_loss": -22.90106964111328, "global_step": 150407, "epoch": 1812} {"train_loss": -23.152454376220703, "global_step": 150408, "epoch": 1812} {"train_loss": -22.896787643432617, "global_step": 150409, "epoch": 1812} {"train_loss": -23.197580337524414, "global_step": 150410, "epoch": 1812} {"train_loss": -23.092226028442383, "global_step": 150411, "epoch": 1812} {"train_loss": -23.162281036376953, "global_step": 150412, "epoch": 1812} {"train_loss": -23.08641815185547, "global_step": 150413, "epoch": 1812} {"train_loss": -23.180288314819336, "global_step": 150414, "epoch": 1812} {"train_loss": -23.083118438720703, "global_step": 150415, "epoch": 1812} {"train_loss": -23.25920867919922, "global_step": 150416, "epoch": 1812} {"train_loss": -23.119760513305664, "global_step": 150417, "epoch": 1812} {"train_loss": -23.407333374023438, "global_step": 150418, "epoch": 1812} {"train_loss": -23.637447357177734, "global_step": 150419, "epoch": 1812} {"train_loss": -23.564313888549805, "global_step": 150420, "epoch": 1812} {"train_loss": -22.992076873779297, "global_step": 150421, "epoch": 1812} {"train_loss": -23.109743118286133, "global_step": 150422, "epoch": 1812} {"train_loss": -23.242338180541992, "global_step": 150423, "epoch": 1812} {"train_loss": -23.21636962890625, "global_step": 150424, "epoch": 1812} {"train_loss": -23.663541793823242, "global_step": 150425, "epoch": 1812} {"train_loss": -23.34686851501465, "global_step": 150426, "epoch": 1812} {"train_loss": -23.35213279724121, "global_step": 150427, "epoch": 1812} {"train_loss": -23.80133628845215, "global_step": 150428, "epoch": 1812} {"train_loss": -23.519933700561523, "global_step": 150429, "epoch": 1812} {"train_loss": -23.40176010131836, "global_step": 150430, "epoch": 1812} {"train_loss": -23.149702072143555, "global_step": 150431, "epoch": 1812} {"train_loss": -23.280439376831055, "global_step": 150432, "epoch": 1812} {"train_loss": -23.297077178955078, "global_step": 150433, "epoch": 1812} {"train_loss": -23.049978256225586, "global_step": 150434, "epoch": 1812} {"train_loss": -23.457487106323242, "global_step": 150435, "epoch": 1812} {"train_loss": -23.07635498046875, "global_step": 150436, "epoch": 1812} {"train_loss": -23.455684661865234, "global_step": 150437, "epoch": 1812} {"train_loss": -23.29791259765625, "global_step": 150438, "epoch": 1812} {"train_loss": -22.916425704956055, "global_step": 150439, "epoch": 1812} {"train_loss": -23.681198120117188, "global_step": 150440, "epoch": 1812} {"train_loss": -23.55904197692871, "global_step": 150441, "epoch": 1812} {"train_loss": -23.178449630737305, "global_step": 150442, "epoch": 1812} {"train_loss": -23.508543014526367, "global_step": 150443, "epoch": 1812} {"train_loss": -23.592670440673828, "global_step": 150444, "epoch": 1812} {"train_loss": -23.369674682617188, "global_step": 150445, "epoch": 1812} {"train_loss": -23.341476440429688, "global_step": 150446, "epoch": 1812} {"train_loss": -23.40500831604004, "global_step": 150447, "epoch": 1812} {"train_loss": -23.293643951416016, "global_step": 150448, "epoch": 1812} {"train_loss": -23.50397300720215, "global_step": 150449, "epoch": 1812} {"train_loss": -23.439924240112305, "global_step": 150450, "epoch": 1812} {"train_loss": -23.705610275268555, "global_step": 150451, "epoch": 1812} {"train_loss": -23.19297981262207, "global_step": 150452, "epoch": 1812} {"train_loss": -23.268123626708984, "global_step": 150453, "epoch": 1812} {"train_loss": -23.261140823364258, "global_step": 150454, "epoch": 1812} {"train_loss": -23.477312088012695, "global_step": 150455, "epoch": 1812} {"train_loss": -23.025394439697266, "global_step": 150456, "epoch": 1812} {"train_loss": -23.248220443725586, "global_step": 150457, "epoch": 1812} {"train_loss": -23.40831756591797, "global_step": 150458, "epoch": 1812} {"train_loss": -23.403919219970703, "global_step": 150459, "epoch": 1812} {"train_loss": -23.122472763061523, "global_step": 150460, "epoch": 1812} {"train_loss": -23.5009708404541, "global_step": 150461, "epoch": 1812} {"train_loss": -23.164350509643555, "global_step": 150462, "epoch": 1812} {"train_loss": -23.55438995361328, "global_step": 150463, "epoch": 1812} {"train_loss": -23.381061553955078, "global_step": 150464, "epoch": 1812} {"train_loss": -23.38205337524414, "global_step": 150465, "epoch": 1812} {"train_loss": -23.301647186279297, "global_step": 150466, "epoch": 1812} {"train_loss": -23.1264705657959, "global_step": 150467, "epoch": 1812} {"train_loss": -23.615114212036133, "global_step": 150468, "epoch": 1812} {"train_loss": -23.18190574645996, "global_step": 150469, "epoch": 1812} {"train_loss": -23.534521102905273, "global_step": 150470, "epoch": 1812} {"train_loss": -23.489952087402344, "global_step": 150471, "epoch": 1812} {"train_loss": -22.974119186401367, "global_step": 150472, "epoch": 1812} {"train_loss": -23.004138946533203, "global_step": 150473, "epoch": 1812} {"train_loss": -23.32777214050293, "global_step": 150474, "epoch": 1812} {"train_loss": -22.871610641479492, "global_step": 150475, "epoch": 1812} {"train_loss": -22.73549461364746, "global_step": 150476, "epoch": 1812} {"train_loss": -23.05691909790039, "global_step": 150477, "epoch": 1812} {"train_loss": -23.241036794271814, "global_step": 150478, "epoch": 1812, "val_loss": 6322942.0} {"train_loss": -23.113418579101562, "global_step": 150479, "epoch": 1813} {"train_loss": -22.69199562072754, "global_step": 150480, "epoch": 1813} {"train_loss": -23.056659698486328, "global_step": 150481, "epoch": 1813} {"train_loss": -23.14848518371582, "global_step": 150482, "epoch": 1813} {"train_loss": -22.99900245666504, "global_step": 150483, "epoch": 1813} {"train_loss": -23.353578567504883, "global_step": 150484, "epoch": 1813} {"train_loss": -23.05568504333496, "global_step": 150485, "epoch": 1813} {"train_loss": -22.61528778076172, "global_step": 150486, "epoch": 1813} {"train_loss": -23.081613540649414, "global_step": 150487, "epoch": 1813} {"train_loss": -23.328140258789062, "global_step": 150488, "epoch": 1813} {"train_loss": -23.449243545532227, "global_step": 150489, "epoch": 1813} {"train_loss": -23.190750122070312, "global_step": 150490, "epoch": 1813} {"train_loss": -23.16859245300293, "global_step": 150491, "epoch": 1813} {"train_loss": -22.978153228759766, "global_step": 150492, "epoch": 1813} {"train_loss": -23.04984474182129, "global_step": 150493, "epoch": 1813} {"train_loss": -23.030689239501953, "global_step": 150494, "epoch": 1813} {"train_loss": -23.279497146606445, "global_step": 150495, "epoch": 1813} {"train_loss": -23.10599136352539, "global_step": 150496, "epoch": 1813} {"train_loss": -23.196638107299805, "global_step": 150497, "epoch": 1813} {"train_loss": -23.18577766418457, "global_step": 150498, "epoch": 1813} {"train_loss": -23.245458602905273, "global_step": 150499, "epoch": 1813} {"train_loss": -23.28854751586914, "global_step": 150500, "epoch": 1813} {"train_loss": -23.16329574584961, "global_step": 150501, "epoch": 1813} {"train_loss": -23.20041847229004, "global_step": 150502, "epoch": 1813} {"train_loss": -23.164026260375977, "global_step": 150503, "epoch": 1813} {"train_loss": -23.18045425415039, "global_step": 150504, "epoch": 1813} {"train_loss": -22.997989654541016, "global_step": 150505, "epoch": 1813} {"train_loss": -23.26175880432129, "global_step": 150506, "epoch": 1813} {"train_loss": -23.218109130859375, "global_step": 150507, "epoch": 1813} {"train_loss": -23.37225341796875, "global_step": 150508, "epoch": 1813} {"train_loss": -23.464731216430664, "global_step": 150509, "epoch": 1813} {"train_loss": -23.04970932006836, "global_step": 150510, "epoch": 1813} {"train_loss": -23.35980796813965, "global_step": 150511, "epoch": 1813} {"train_loss": -23.515689849853516, "global_step": 150512, "epoch": 1813} {"train_loss": -23.672250747680664, "global_step": 150513, "epoch": 1813} {"train_loss": -23.579389572143555, "global_step": 150514, "epoch": 1813} {"train_loss": -23.275318145751953, "global_step": 150515, "epoch": 1813} {"train_loss": -23.232589721679688, "global_step": 150516, "epoch": 1813} {"train_loss": -23.255435943603516, "global_step": 150517, "epoch": 1813} {"train_loss": -23.243894577026367, "global_step": 150518, "epoch": 1813} {"train_loss": -23.002668380737305, "global_step": 150519, "epoch": 1813} {"train_loss": -23.408063888549805, "global_step": 150520, "epoch": 1813} {"train_loss": -23.6416072845459, "global_step": 150521, "epoch": 1813} {"train_loss": -23.42484474182129, "global_step": 150522, "epoch": 1813} {"train_loss": -23.2011775970459, "global_step": 150523, "epoch": 1813} {"train_loss": -23.401334762573242, "global_step": 150524, "epoch": 1813} {"train_loss": -23.630401611328125, "global_step": 150525, "epoch": 1813} {"train_loss": -23.319421768188477, "global_step": 150526, "epoch": 1813} {"train_loss": -23.54753875732422, "global_step": 150527, "epoch": 1813} {"train_loss": -23.23311996459961, "global_step": 150528, "epoch": 1813} {"train_loss": -23.215118408203125, "global_step": 150529, "epoch": 1813} {"train_loss": -23.308385848999023, "global_step": 150530, "epoch": 1813} {"train_loss": -23.196640014648438, "global_step": 150531, "epoch": 1813} {"train_loss": -23.504873275756836, "global_step": 150532, "epoch": 1813} {"train_loss": -23.48807144165039, "global_step": 150533, "epoch": 1813} {"train_loss": -23.33741569519043, "global_step": 150534, "epoch": 1813} {"train_loss": -23.4246883392334, "global_step": 150535, "epoch": 1813} {"train_loss": -23.305978775024414, "global_step": 150536, "epoch": 1813} {"train_loss": -23.337614059448242, "global_step": 150537, "epoch": 1813} {"train_loss": -23.360013961791992, "global_step": 150538, "epoch": 1813} {"train_loss": -23.25538444519043, "global_step": 150539, "epoch": 1813} {"train_loss": -22.937461853027344, "global_step": 150540, "epoch": 1813} {"train_loss": -23.389564514160156, "global_step": 150541, "epoch": 1813} {"train_loss": -23.380279541015625, "global_step": 150542, "epoch": 1813} {"train_loss": -23.417997360229492, "global_step": 150543, "epoch": 1813} {"train_loss": -23.508298873901367, "global_step": 150544, "epoch": 1813} {"train_loss": -23.52115249633789, "global_step": 150545, "epoch": 1813} {"train_loss": -23.57543182373047, "global_step": 150546, "epoch": 1813} {"train_loss": -23.206018447875977, "global_step": 150547, "epoch": 1813} {"train_loss": -23.312253952026367, "global_step": 150548, "epoch": 1813} {"train_loss": -23.219619750976562, "global_step": 150549, "epoch": 1813} {"train_loss": -23.335233688354492, "global_step": 150550, "epoch": 1813} {"train_loss": -23.28374671936035, "global_step": 150551, "epoch": 1813} {"train_loss": -23.419113159179688, "global_step": 150552, "epoch": 1813} {"train_loss": -22.988357543945312, "global_step": 150553, "epoch": 1813} {"train_loss": -23.663068771362305, "global_step": 150554, "epoch": 1813} {"train_loss": -23.512983322143555, "global_step": 150555, "epoch": 1813} {"train_loss": -23.63846778869629, "global_step": 150556, "epoch": 1813} {"train_loss": -23.635257720947266, "global_step": 150557, "epoch": 1813} {"train_loss": -22.86195945739746, "global_step": 150558, "epoch": 1813} {"train_loss": -23.09246826171875, "global_step": 150559, "epoch": 1813} {"train_loss": -22.776914596557617, "global_step": 150560, "epoch": 1813} {"train_loss": -23.258471592363104, "global_step": 150561, "epoch": 1813, "val_loss": 6321336.0} {"train_loss": -23.007638931274414, "global_step": 150562, "epoch": 1814} {"train_loss": -22.508567810058594, "global_step": 150563, "epoch": 1814} {"train_loss": -22.575313568115234, "global_step": 150564, "epoch": 1814} {"train_loss": -22.743484497070312, "global_step": 150565, "epoch": 1814} {"train_loss": -22.632247924804688, "global_step": 150566, "epoch": 1814} {"train_loss": -22.683048248291016, "global_step": 150567, "epoch": 1814} {"train_loss": -22.70798110961914, "global_step": 150568, "epoch": 1814} {"train_loss": -22.943161010742188, "global_step": 150569, "epoch": 1814} {"train_loss": -22.7912540435791, "global_step": 150570, "epoch": 1814} {"train_loss": -23.241424560546875, "global_step": 150571, "epoch": 1814} {"train_loss": -23.201618194580078, "global_step": 150572, "epoch": 1814} {"train_loss": -22.69693946838379, "global_step": 150573, "epoch": 1814} {"train_loss": -23.255552291870117, "global_step": 150574, "epoch": 1814} {"train_loss": -22.718595504760742, "global_step": 150575, "epoch": 1814} {"train_loss": -23.12561798095703, "global_step": 150576, "epoch": 1814} {"train_loss": -22.7015438079834, "global_step": 150577, "epoch": 1814} {"train_loss": -23.19645118713379, "global_step": 150578, "epoch": 1814} {"train_loss": -22.912778854370117, "global_step": 150579, "epoch": 1814} {"train_loss": -23.212669372558594, "global_step": 150580, "epoch": 1814} {"train_loss": -22.966022491455078, "global_step": 150581, "epoch": 1814} {"train_loss": -23.146240234375, "global_step": 150582, "epoch": 1814} {"train_loss": -23.117795944213867, "global_step": 150583, "epoch": 1814} {"train_loss": -23.28590202331543, "global_step": 150584, "epoch": 1814} {"train_loss": -23.23176383972168, "global_step": 150585, "epoch": 1814} {"train_loss": -23.13498878479004, "global_step": 150586, "epoch": 1814} {"train_loss": -22.928442001342773, "global_step": 150587, "epoch": 1814} {"train_loss": -23.034942626953125, "global_step": 150588, "epoch": 1814} {"train_loss": -22.823347091674805, "global_step": 150589, "epoch": 1814} {"train_loss": -23.305206298828125, "global_step": 150590, "epoch": 1814} {"train_loss": -23.116994857788086, "global_step": 150591, "epoch": 1814} {"train_loss": -23.388275146484375, "global_step": 150592, "epoch": 1814} {"train_loss": -23.236648559570312, "global_step": 150593, "epoch": 1814} {"train_loss": -23.075592041015625, "global_step": 150594, "epoch": 1814} {"train_loss": -23.335844039916992, "global_step": 150595, "epoch": 1814} {"train_loss": -23.45792579650879, "global_step": 150596, "epoch": 1814} {"train_loss": -23.181072235107422, "global_step": 150597, "epoch": 1814} {"train_loss": -23.1138973236084, "global_step": 150598, "epoch": 1814} {"train_loss": -23.710371017456055, "global_step": 150599, "epoch": 1814} {"train_loss": -23.563785552978516, "global_step": 150600, "epoch": 1814} {"train_loss": -23.473852157592773, "global_step": 150601, "epoch": 1814} {"train_loss": -23.076072692871094, "global_step": 150602, "epoch": 1814} {"train_loss": -23.341962814331055, "global_step": 150603, "epoch": 1814} {"train_loss": -23.546396255493164, "global_step": 150604, "epoch": 1814} {"train_loss": -23.733736038208008, "global_step": 150605, "epoch": 1814} {"train_loss": -23.74628257751465, "global_step": 150606, "epoch": 1814} {"train_loss": -23.380496978759766, "global_step": 150607, "epoch": 1814} {"train_loss": -23.308740615844727, "global_step": 150608, "epoch": 1814} {"train_loss": -23.92540740966797, "global_step": 150609, "epoch": 1814} {"train_loss": -23.28583335876465, "global_step": 150610, "epoch": 1814} {"train_loss": -23.077899932861328, "global_step": 150611, "epoch": 1814} {"train_loss": -23.293048858642578, "global_step": 150612, "epoch": 1814} {"train_loss": -23.01877212524414, "global_step": 150613, "epoch": 1814} {"train_loss": -23.225706100463867, "global_step": 150614, "epoch": 1814} {"train_loss": -23.302759170532227, "global_step": 150615, "epoch": 1814} {"train_loss": -23.15863609313965, "global_step": 150616, "epoch": 1814} {"train_loss": -23.314041137695312, "global_step": 150617, "epoch": 1814} {"train_loss": -22.97645378112793, "global_step": 150618, "epoch": 1814} {"train_loss": -22.96613311767578, "global_step": 150619, "epoch": 1814} {"train_loss": -22.99051856994629, "global_step": 150620, "epoch": 1814} {"train_loss": -23.06514549255371, "global_step": 150621, "epoch": 1814} {"train_loss": -23.506498336791992, "global_step": 150622, "epoch": 1814} {"train_loss": -22.570688247680664, "global_step": 150623, "epoch": 1814} {"train_loss": -23.25440216064453, "global_step": 150624, "epoch": 1814} {"train_loss": -23.027191162109375, "global_step": 150625, "epoch": 1814} {"train_loss": -23.082609176635742, "global_step": 150626, "epoch": 1814} {"train_loss": -23.05183982849121, "global_step": 150627, "epoch": 1814} {"train_loss": -23.011199951171875, "global_step": 150628, "epoch": 1814} {"train_loss": -23.06646728515625, "global_step": 150629, "epoch": 1814} {"train_loss": -23.102157592773438, "global_step": 150630, "epoch": 1814} {"train_loss": -23.648935317993164, "global_step": 150631, "epoch": 1814} {"train_loss": -23.471303939819336, "global_step": 150632, "epoch": 1814} {"train_loss": -23.121898651123047, "global_step": 150633, "epoch": 1814} {"train_loss": -23.13388442993164, "global_step": 150634, "epoch": 1814} {"train_loss": -23.31625747680664, "global_step": 150635, "epoch": 1814} {"train_loss": -23.02243423461914, "global_step": 150636, "epoch": 1814} {"train_loss": -23.5445613861084, "global_step": 150637, "epoch": 1814} {"train_loss": -22.953187942504883, "global_step": 150638, "epoch": 1814} {"train_loss": -23.189298629760742, "global_step": 150639, "epoch": 1814} {"train_loss": -23.28261375427246, "global_step": 150640, "epoch": 1814} {"train_loss": -23.5252628326416, "global_step": 150641, "epoch": 1814} {"train_loss": -23.48164176940918, "global_step": 150642, "epoch": 1814} {"train_loss": -23.097061157226562, "global_step": 150643, "epoch": 1814} {"train_loss": -23.141259434711504, "global_step": 150644, "epoch": 1814, "val_loss": 6320942.0} {"train_loss": -22.7937068939209, "global_step": 150645, "epoch": 1815} {"train_loss": -22.816923141479492, "global_step": 150646, "epoch": 1815} {"train_loss": -23.106067657470703, "global_step": 150647, "epoch": 1815} {"train_loss": -22.726200103759766, "global_step": 150648, "epoch": 1815} {"train_loss": -22.87281036376953, "global_step": 150649, "epoch": 1815} {"train_loss": -23.0161190032959, "global_step": 150650, "epoch": 1815} {"train_loss": -23.13787078857422, "global_step": 150651, "epoch": 1815} {"train_loss": -23.184415817260742, "global_step": 150652, "epoch": 1815} {"train_loss": -23.179264068603516, "global_step": 150653, "epoch": 1815} {"train_loss": -22.946807861328125, "global_step": 150654, "epoch": 1815} {"train_loss": -23.07706642150879, "global_step": 150655, "epoch": 1815} {"train_loss": -23.304685592651367, "global_step": 150656, "epoch": 1815} {"train_loss": -22.994232177734375, "global_step": 150657, "epoch": 1815} {"train_loss": -22.43349838256836, "global_step": 150658, "epoch": 1815} {"train_loss": -23.58345603942871, "global_step": 150659, "epoch": 1815} {"train_loss": -22.858930587768555, "global_step": 150660, "epoch": 1815} {"train_loss": -23.214624404907227, "global_step": 150661, "epoch": 1815} {"train_loss": -23.39114761352539, "global_step": 150662, "epoch": 1815} {"train_loss": -23.005950927734375, "global_step": 150663, "epoch": 1815} {"train_loss": -23.31464958190918, "global_step": 150664, "epoch": 1815} {"train_loss": -23.18367576599121, "global_step": 150665, "epoch": 1815} {"train_loss": -23.250755310058594, "global_step": 150666, "epoch": 1815} {"train_loss": -23.0919132232666, "global_step": 150667, "epoch": 1815} {"train_loss": -23.232450485229492, "global_step": 150668, "epoch": 1815} {"train_loss": -23.185348510742188, "global_step": 150669, "epoch": 1815} {"train_loss": -23.7183895111084, "global_step": 150670, "epoch": 1815} {"train_loss": -23.405851364135742, "global_step": 150671, "epoch": 1815} {"train_loss": -23.67365074157715, "global_step": 150672, "epoch": 1815} {"train_loss": -23.44281578063965, "global_step": 150673, "epoch": 1815} {"train_loss": -23.224069595336914, "global_step": 150674, "epoch": 1815} {"train_loss": -23.21255111694336, "global_step": 150675, "epoch": 1815} {"train_loss": -23.308927536010742, "global_step": 150676, "epoch": 1815} {"train_loss": -23.358861923217773, "global_step": 150677, "epoch": 1815} {"train_loss": -23.375991821289062, "global_step": 150678, "epoch": 1815} {"train_loss": -23.46017837524414, "global_step": 150679, "epoch": 1815} {"train_loss": -23.385738372802734, "global_step": 150680, "epoch": 1815} {"train_loss": -23.465930938720703, "global_step": 150681, "epoch": 1815} {"train_loss": -23.63330841064453, "global_step": 150682, "epoch": 1815} {"train_loss": -23.419301986694336, "global_step": 150683, "epoch": 1815} {"train_loss": -23.54036521911621, "global_step": 150684, "epoch": 1815} {"train_loss": -23.47612953186035, "global_step": 150685, "epoch": 1815} {"train_loss": -23.168516159057617, "global_step": 150686, "epoch": 1815} {"train_loss": -23.350854873657227, "global_step": 150687, "epoch": 1815} {"train_loss": -23.50956153869629, "global_step": 150688, "epoch": 1815} {"train_loss": -23.34854507446289, "global_step": 150689, "epoch": 1815} {"train_loss": -23.056446075439453, "global_step": 150690, "epoch": 1815} {"train_loss": -23.534488677978516, "global_step": 150691, "epoch": 1815} {"train_loss": -23.496566772460938, "global_step": 150692, "epoch": 1815} {"train_loss": -23.280912399291992, "global_step": 150693, "epoch": 1815} {"train_loss": -23.54181480407715, "global_step": 150694, "epoch": 1815} {"train_loss": -23.530439376831055, "global_step": 150695, "epoch": 1815} {"train_loss": -23.513002395629883, "global_step": 150696, "epoch": 1815} {"train_loss": -23.323827743530273, "global_step": 150697, "epoch": 1815} {"train_loss": -23.116622924804688, "global_step": 150698, "epoch": 1815} {"train_loss": -23.55314064025879, "global_step": 150699, "epoch": 1815} {"train_loss": -23.301084518432617, "global_step": 150700, "epoch": 1815} {"train_loss": -23.422412872314453, "global_step": 150701, "epoch": 1815} {"train_loss": -23.463714599609375, "global_step": 150702, "epoch": 1815} {"train_loss": -23.495702743530273, "global_step": 150703, "epoch": 1815} {"train_loss": -23.158727645874023, "global_step": 150704, "epoch": 1815} {"train_loss": -23.311681747436523, "global_step": 150705, "epoch": 1815} {"train_loss": -22.942001342773438, "global_step": 150706, "epoch": 1815} {"train_loss": -23.004140853881836, "global_step": 150707, "epoch": 1815} {"train_loss": -23.279756546020508, "global_step": 150708, "epoch": 1815} {"train_loss": -23.170034408569336, "global_step": 150709, "epoch": 1815} {"train_loss": -23.06559944152832, "global_step": 150710, "epoch": 1815} {"train_loss": -23.27826499938965, "global_step": 150711, "epoch": 1815} {"train_loss": -23.240869522094727, "global_step": 150712, "epoch": 1815} {"train_loss": -23.41377067565918, "global_step": 150713, "epoch": 1815} {"train_loss": -23.044496536254883, "global_step": 150714, "epoch": 1815} {"train_loss": -23.253786087036133, "global_step": 150715, "epoch": 1815} {"train_loss": -23.423370361328125, "global_step": 150716, "epoch": 1815} {"train_loss": -23.289243698120117, "global_step": 150717, "epoch": 1815} {"train_loss": -23.31903648376465, "global_step": 150718, "epoch": 1815} {"train_loss": -23.266042709350586, "global_step": 150719, "epoch": 1815} {"train_loss": -23.45576286315918, "global_step": 150720, "epoch": 1815} {"train_loss": -23.53107261657715, "global_step": 150721, "epoch": 1815} {"train_loss": -23.468891143798828, "global_step": 150722, "epoch": 1815} {"train_loss": -22.697250366210938, "global_step": 150723, "epoch": 1815} {"train_loss": -23.248096466064453, "global_step": 150724, "epoch": 1815} {"train_loss": -23.384397506713867, "global_step": 150725, "epoch": 1815} {"train_loss": -23.299039840698242, "global_step": 150726, "epoch": 1815} {"train_loss": -23.27049841363746, "global_step": 150727, "epoch": 1815, "val_loss": 6267231.5} {"train_loss": -23.247995376586914, "global_step": 150728, "epoch": 1816} {"train_loss": -23.002981185913086, "global_step": 150729, "epoch": 1816} {"train_loss": -22.85367202758789, "global_step": 150730, "epoch": 1816} {"train_loss": -23.04755401611328, "global_step": 150731, "epoch": 1816} {"train_loss": -23.188217163085938, "global_step": 150732, "epoch": 1816} {"train_loss": -23.18916130065918, "global_step": 150733, "epoch": 1816} {"train_loss": -22.748144149780273, "global_step": 150734, "epoch": 1816} {"train_loss": -23.0738468170166, "global_step": 150735, "epoch": 1816} {"train_loss": -22.93418312072754, "global_step": 150736, "epoch": 1816} {"train_loss": -22.915496826171875, "global_step": 150737, "epoch": 1816} {"train_loss": -23.331918716430664, "global_step": 150738, "epoch": 1816} {"train_loss": -23.015684127807617, "global_step": 150739, "epoch": 1816} {"train_loss": -22.70155143737793, "global_step": 150740, "epoch": 1816} {"train_loss": -23.213254928588867, "global_step": 150741, "epoch": 1816} {"train_loss": -23.508928298950195, "global_step": 150742, "epoch": 1816} {"train_loss": -23.030858993530273, "global_step": 150743, "epoch": 1816} {"train_loss": -23.170082092285156, "global_step": 150744, "epoch": 1816} {"train_loss": -23.262805938720703, "global_step": 150745, "epoch": 1816} {"train_loss": -22.716644287109375, "global_step": 150746, "epoch": 1816} {"train_loss": -23.110477447509766, "global_step": 150747, "epoch": 1816} {"train_loss": -23.0451602935791, "global_step": 150748, "epoch": 1816} {"train_loss": -23.395889282226562, "global_step": 150749, "epoch": 1816} {"train_loss": -23.705472946166992, "global_step": 150750, "epoch": 1816} {"train_loss": -22.990673065185547, "global_step": 150751, "epoch": 1816} {"train_loss": -22.995988845825195, "global_step": 150752, "epoch": 1816} {"train_loss": -23.132604598999023, "global_step": 150753, "epoch": 1816} {"train_loss": -23.136865615844727, "global_step": 150754, "epoch": 1816} {"train_loss": -23.394329071044922, "global_step": 150755, "epoch": 1816} {"train_loss": -23.434696197509766, "global_step": 150756, "epoch": 1816} {"train_loss": -23.654346466064453, "global_step": 150757, "epoch": 1816} {"train_loss": -23.13834571838379, "global_step": 150758, "epoch": 1816} {"train_loss": -23.27899742126465, "global_step": 150759, "epoch": 1816} {"train_loss": -23.023984909057617, "global_step": 150760, "epoch": 1816} {"train_loss": -23.364009857177734, "global_step": 150761, "epoch": 1816} {"train_loss": -23.293062210083008, "global_step": 150762, "epoch": 1816} {"train_loss": -23.10848045349121, "global_step": 150763, "epoch": 1816} {"train_loss": -23.490476608276367, "global_step": 150764, "epoch": 1816} {"train_loss": -23.502052307128906, "global_step": 150765, "epoch": 1816} {"train_loss": -23.216293334960938, "global_step": 150766, "epoch": 1816} {"train_loss": -22.98259925842285, "global_step": 150767, "epoch": 1816} {"train_loss": -23.465585708618164, "global_step": 150768, "epoch": 1816} {"train_loss": -23.075895309448242, "global_step": 150769, "epoch": 1816} {"train_loss": -22.99672508239746, "global_step": 150770, "epoch": 1816} {"train_loss": -23.1796817779541, "global_step": 150771, "epoch": 1816} {"train_loss": -23.129302978515625, "global_step": 150772, "epoch": 1816} {"train_loss": -23.01799201965332, "global_step": 150773, "epoch": 1816} {"train_loss": -23.479389190673828, "global_step": 150774, "epoch": 1816} {"train_loss": -22.913105010986328, "global_step": 150775, "epoch": 1816} {"train_loss": -23.529142379760742, "global_step": 150776, "epoch": 1816} {"train_loss": -22.8713436126709, "global_step": 150777, "epoch": 1816} {"train_loss": -23.527759552001953, "global_step": 150778, "epoch": 1816} {"train_loss": -23.078943252563477, "global_step": 150779, "epoch": 1816} {"train_loss": -23.600589752197266, "global_step": 150780, "epoch": 1816} {"train_loss": -23.038461685180664, "global_step": 150781, "epoch": 1816} {"train_loss": -23.54921531677246, "global_step": 150782, "epoch": 1816} {"train_loss": -23.032339096069336, "global_step": 150783, "epoch": 1816} {"train_loss": -23.432098388671875, "global_step": 150784, "epoch": 1816} {"train_loss": -22.99165916442871, "global_step": 150785, "epoch": 1816} {"train_loss": -22.705305099487305, "global_step": 150786, "epoch": 1816} {"train_loss": -23.190685272216797, "global_step": 150787, "epoch": 1816} {"train_loss": -23.17901039123535, "global_step": 150788, "epoch": 1816} {"train_loss": -22.879545211791992, "global_step": 150789, "epoch": 1816} {"train_loss": -23.415512084960938, "global_step": 150790, "epoch": 1816} {"train_loss": -23.18879508972168, "global_step": 150791, "epoch": 1816} {"train_loss": -23.028366088867188, "global_step": 150792, "epoch": 1816} {"train_loss": -23.1614933013916, "global_step": 150793, "epoch": 1816} {"train_loss": -23.084257125854492, "global_step": 150794, "epoch": 1816} {"train_loss": -23.213470458984375, "global_step": 150795, "epoch": 1816} {"train_loss": -23.193912506103516, "global_step": 150796, "epoch": 1816} {"train_loss": -23.383825302124023, "global_step": 150797, "epoch": 1816} {"train_loss": -23.701797485351562, "global_step": 150798, "epoch": 1816} {"train_loss": -23.211944580078125, "global_step": 150799, "epoch": 1816} {"train_loss": -23.245487213134766, "global_step": 150800, "epoch": 1816} {"train_loss": -23.256488800048828, "global_step": 150801, "epoch": 1816} {"train_loss": -22.883535385131836, "global_step": 150802, "epoch": 1816} {"train_loss": -23.213876724243164, "global_step": 150803, "epoch": 1816} {"train_loss": -22.989755630493164, "global_step": 150804, "epoch": 1816} {"train_loss": -23.19063377380371, "global_step": 150805, "epoch": 1816} {"train_loss": -23.375019073486328, "global_step": 150806, "epoch": 1816} {"train_loss": -22.757129669189453, "global_step": 150807, "epoch": 1816} {"train_loss": -22.90782928466797, "global_step": 150808, "epoch": 1816} {"train_loss": -23.4310245513916, "global_step": 150809, "epoch": 1816} {"train_loss": -23.176533572645074, "global_step": 150810, "epoch": 1816, "val_loss": 6280458.0} {"train_loss": -22.376846313476562, "global_step": 150811, "epoch": 1817} {"train_loss": -22.78728485107422, "global_step": 150812, "epoch": 1817} {"train_loss": -22.923803329467773, "global_step": 150813, "epoch": 1817} {"train_loss": -22.640371322631836, "global_step": 150814, "epoch": 1817} {"train_loss": -22.937604904174805, "global_step": 150815, "epoch": 1817} {"train_loss": -22.513751983642578, "global_step": 150816, "epoch": 1817} {"train_loss": -23.30927848815918, "global_step": 150817, "epoch": 1817} {"train_loss": -22.86815643310547, "global_step": 150818, "epoch": 1817} {"train_loss": -23.097972869873047, "global_step": 150819, "epoch": 1817} {"train_loss": -23.26463508605957, "global_step": 150820, "epoch": 1817} {"train_loss": -23.233652114868164, "global_step": 150821, "epoch": 1817} {"train_loss": -23.30498504638672, "global_step": 150822, "epoch": 1817} {"train_loss": -23.15517234802246, "global_step": 150823, "epoch": 1817} {"train_loss": -23.012067794799805, "global_step": 150824, "epoch": 1817} {"train_loss": -23.139387130737305, "global_step": 150825, "epoch": 1817} {"train_loss": -23.09860610961914, "global_step": 150826, "epoch": 1817} {"train_loss": -23.20102882385254, "global_step": 150827, "epoch": 1817} {"train_loss": -23.326461791992188, "global_step": 150828, "epoch": 1817} {"train_loss": -23.322017669677734, "global_step": 150829, "epoch": 1817} {"train_loss": -23.41290855407715, "global_step": 150830, "epoch": 1817} {"train_loss": -23.149667739868164, "global_step": 150831, "epoch": 1817} {"train_loss": -23.231054306030273, "global_step": 150832, "epoch": 1817} {"train_loss": -23.451135635375977, "global_step": 150833, "epoch": 1817} {"train_loss": -23.1326904296875, "global_step": 150834, "epoch": 1817} {"train_loss": -23.65587043762207, "global_step": 150835, "epoch": 1817} {"train_loss": -23.108707427978516, "global_step": 150836, "epoch": 1817} {"train_loss": -23.321203231811523, "global_step": 150837, "epoch": 1817} {"train_loss": -23.310302734375, "global_step": 150838, "epoch": 1817} {"train_loss": -23.56306266784668, "global_step": 150839, "epoch": 1817} {"train_loss": -23.3221378326416, "global_step": 150840, "epoch": 1817} {"train_loss": -23.176715850830078, "global_step": 150841, "epoch": 1817} {"train_loss": -23.098976135253906, "global_step": 150842, "epoch": 1817} {"train_loss": -23.5751953125, "global_step": 150843, "epoch": 1817} {"train_loss": -23.190383911132812, "global_step": 150844, "epoch": 1817} {"train_loss": -23.245498657226562, "global_step": 150845, "epoch": 1817} {"train_loss": -23.30127716064453, "global_step": 150846, "epoch": 1817} {"train_loss": -23.455732345581055, "global_step": 150847, "epoch": 1817} {"train_loss": -23.53119468688965, "global_step": 150848, "epoch": 1817} {"train_loss": -23.193944931030273, "global_step": 150849, "epoch": 1817} {"train_loss": -23.24978256225586, "global_step": 150850, "epoch": 1817} {"train_loss": -23.676603317260742, "global_step": 150851, "epoch": 1817} {"train_loss": -22.959226608276367, "global_step": 150852, "epoch": 1817} {"train_loss": -23.23421287536621, "global_step": 150853, "epoch": 1817} {"train_loss": -23.337100982666016, "global_step": 150854, "epoch": 1817} {"train_loss": -23.214418411254883, "global_step": 150855, "epoch": 1817} {"train_loss": -23.414976119995117, "global_step": 150856, "epoch": 1817} {"train_loss": -23.14080810546875, "global_step": 150857, "epoch": 1817} {"train_loss": -23.29193687438965, "global_step": 150858, "epoch": 1817} {"train_loss": -23.113969802856445, "global_step": 150859, "epoch": 1817} {"train_loss": -23.34188461303711, "global_step": 150860, "epoch": 1817} {"train_loss": -23.123008728027344, "global_step": 150861, "epoch": 1817} {"train_loss": -23.14242935180664, "global_step": 150862, "epoch": 1817} {"train_loss": -23.41676902770996, "global_step": 150863, "epoch": 1817} {"train_loss": -23.3243465423584, "global_step": 150864, "epoch": 1817} {"train_loss": -22.978116989135742, "global_step": 150865, "epoch": 1817} {"train_loss": -23.336410522460938, "global_step": 150866, "epoch": 1817} {"train_loss": -23.318586349487305, "global_step": 150867, "epoch": 1817} {"train_loss": -23.54615592956543, "global_step": 150868, "epoch": 1817} {"train_loss": -23.4451961517334, "global_step": 150869, "epoch": 1817} {"train_loss": -23.337207794189453, "global_step": 150870, "epoch": 1817} {"train_loss": -23.307212829589844, "global_step": 150871, "epoch": 1817} {"train_loss": -23.249292373657227, "global_step": 150872, "epoch": 1817} {"train_loss": -23.472158432006836, "global_step": 150873, "epoch": 1817} {"train_loss": -23.614004135131836, "global_step": 150874, "epoch": 1817} {"train_loss": -23.56410789489746, "global_step": 150875, "epoch": 1817} {"train_loss": -22.84731101989746, "global_step": 150876, "epoch": 1817} {"train_loss": -23.521774291992188, "global_step": 150877, "epoch": 1817} {"train_loss": -23.2053279876709, "global_step": 150878, "epoch": 1817} {"train_loss": -23.653539657592773, "global_step": 150879, "epoch": 1817} {"train_loss": -23.676593780517578, "global_step": 150880, "epoch": 1817} {"train_loss": -23.480356216430664, "global_step": 150881, "epoch": 1817} {"train_loss": -23.48419761657715, "global_step": 150882, "epoch": 1817} {"train_loss": -23.33759117126465, "global_step": 150883, "epoch": 1817} {"train_loss": -23.278684616088867, "global_step": 150884, "epoch": 1817} {"train_loss": -23.188859939575195, "global_step": 150885, "epoch": 1817} {"train_loss": -23.266813278198242, "global_step": 150886, "epoch": 1817} {"train_loss": -23.430940628051758, "global_step": 150887, "epoch": 1817} {"train_loss": -23.086944580078125, "global_step": 150888, "epoch": 1817} {"train_loss": -23.576730728149414, "global_step": 150889, "epoch": 1817} {"train_loss": -23.10737419128418, "global_step": 150890, "epoch": 1817} {"train_loss": -23.385986328125, "global_step": 150891, "epoch": 1817} {"train_loss": -23.493383407592773, "global_step": 150892, "epoch": 1817} {"train_loss": -23.254921005432863, "global_step": 150893, "epoch": 1817, "val_loss": 6449928.0} {"train_loss": -23.05305290222168, "global_step": 150894, "epoch": 1818} {"train_loss": -22.397296905517578, "global_step": 150895, "epoch": 1818} {"train_loss": -22.8900203704834, "global_step": 150896, "epoch": 1818} {"train_loss": -23.15217399597168, "global_step": 150897, "epoch": 1818} {"train_loss": -23.012165069580078, "global_step": 150898, "epoch": 1818} {"train_loss": -22.81987953186035, "global_step": 150899, "epoch": 1818} {"train_loss": -22.935256958007812, "global_step": 150900, "epoch": 1818} {"train_loss": -22.90631103515625, "global_step": 150901, "epoch": 1818} {"train_loss": -22.871524810791016, "global_step": 150902, "epoch": 1818} {"train_loss": -22.944238662719727, "global_step": 150903, "epoch": 1818} {"train_loss": -23.050209045410156, "global_step": 150904, "epoch": 1818} {"train_loss": -23.653419494628906, "global_step": 150905, "epoch": 1818} {"train_loss": -23.078475952148438, "global_step": 150906, "epoch": 1818} {"train_loss": -23.252248764038086, "global_step": 150907, "epoch": 1818} {"train_loss": -23.244474411010742, "global_step": 150908, "epoch": 1818} {"train_loss": -23.100831985473633, "global_step": 150909, "epoch": 1818} {"train_loss": -22.680715560913086, "global_step": 150910, "epoch": 1818} {"train_loss": -23.166589736938477, "global_step": 150911, "epoch": 1818} {"train_loss": -23.051610946655273, "global_step": 150912, "epoch": 1818} {"train_loss": -23.11210823059082, "global_step": 150913, "epoch": 1818} {"train_loss": -23.27151870727539, "global_step": 150914, "epoch": 1818} {"train_loss": -23.251813888549805, "global_step": 150915, "epoch": 1818} {"train_loss": -23.011884689331055, "global_step": 150916, "epoch": 1818} {"train_loss": -23.46902084350586, "global_step": 150917, "epoch": 1818} {"train_loss": -23.295778274536133, "global_step": 150918, "epoch": 1818} {"train_loss": -23.09427833557129, "global_step": 150919, "epoch": 1818} {"train_loss": -23.257734298706055, "global_step": 150920, "epoch": 1818} {"train_loss": -23.208744049072266, "global_step": 150921, "epoch": 1818} {"train_loss": -23.100229263305664, "global_step": 150922, "epoch": 1818} {"train_loss": -22.841257095336914, "global_step": 150923, "epoch": 1818} {"train_loss": -22.99789810180664, "global_step": 150924, "epoch": 1818} {"train_loss": -23.44483757019043, "global_step": 150925, "epoch": 1818} {"train_loss": -23.064599990844727, "global_step": 150926, "epoch": 1818} {"train_loss": -23.243337631225586, "global_step": 150927, "epoch": 1818} {"train_loss": -23.226638793945312, "global_step": 150928, "epoch": 1818} {"train_loss": -23.027700424194336, "global_step": 150929, "epoch": 1818} {"train_loss": -23.298486709594727, "global_step": 150930, "epoch": 1818} {"train_loss": -23.144567489624023, "global_step": 150931, "epoch": 1818} {"train_loss": -23.15941619873047, "global_step": 150932, "epoch": 1818} {"train_loss": -22.82068634033203, "global_step": 150933, "epoch": 1818} {"train_loss": -23.105039596557617, "global_step": 150934, "epoch": 1818} {"train_loss": -23.30405044555664, "global_step": 150935, "epoch": 1818} {"train_loss": -23.64008140563965, "global_step": 150936, "epoch": 1818} {"train_loss": -23.224163055419922, "global_step": 150937, "epoch": 1818} {"train_loss": -23.342863082885742, "global_step": 150938, "epoch": 1818} {"train_loss": -23.154687881469727, "global_step": 150939, "epoch": 1818} {"train_loss": -23.454483032226562, "global_step": 150940, "epoch": 1818} {"train_loss": -23.07550621032715, "global_step": 150941, "epoch": 1818} {"train_loss": -23.39435386657715, "global_step": 150942, "epoch": 1818} {"train_loss": -23.65144920349121, "global_step": 150943, "epoch": 1818} {"train_loss": -23.304243087768555, "global_step": 150944, "epoch": 1818} {"train_loss": -23.588592529296875, "global_step": 150945, "epoch": 1818} {"train_loss": -23.554222106933594, "global_step": 150946, "epoch": 1818} {"train_loss": -23.051725387573242, "global_step": 150947, "epoch": 1818} {"train_loss": -23.435169219970703, "global_step": 150948, "epoch": 1818} {"train_loss": -23.496562957763672, "global_step": 150949, "epoch": 1818} {"train_loss": -23.448518753051758, "global_step": 150950, "epoch": 1818} {"train_loss": -23.29657554626465, "global_step": 150951, "epoch": 1818} {"train_loss": -23.127914428710938, "global_step": 150952, "epoch": 1818} {"train_loss": -23.442602157592773, "global_step": 150953, "epoch": 1818} {"train_loss": -23.170917510986328, "global_step": 150954, "epoch": 1818} {"train_loss": -23.431251525878906, "global_step": 150955, "epoch": 1818} {"train_loss": -23.443004608154297, "global_step": 150956, "epoch": 1818} {"train_loss": -23.565536499023438, "global_step": 150957, "epoch": 1818} {"train_loss": -23.368728637695312, "global_step": 150958, "epoch": 1818} {"train_loss": -23.39190101623535, "global_step": 150959, "epoch": 1818} {"train_loss": -23.629444122314453, "global_step": 150960, "epoch": 1818} {"train_loss": -22.96170997619629, "global_step": 150961, "epoch": 1818} {"train_loss": -23.607141494750977, "global_step": 150962, "epoch": 1818} {"train_loss": -23.615110397338867, "global_step": 150963, "epoch": 1818} {"train_loss": -23.18509864807129, "global_step": 150964, "epoch": 1818} {"train_loss": -23.397815704345703, "global_step": 150965, "epoch": 1818} {"train_loss": -23.17544937133789, "global_step": 150966, "epoch": 1818} {"train_loss": -23.091279983520508, "global_step": 150967, "epoch": 1818} {"train_loss": -23.153249740600586, "global_step": 150968, "epoch": 1818} {"train_loss": -23.46856689453125, "global_step": 150969, "epoch": 1818} {"train_loss": -23.50347328186035, "global_step": 150970, "epoch": 1818} {"train_loss": -23.12010383605957, "global_step": 150971, "epoch": 1818} {"train_loss": -22.99423599243164, "global_step": 150972, "epoch": 1818} {"train_loss": -23.694793701171875, "global_step": 150973, "epoch": 1818} {"train_loss": -22.964441299438477, "global_step": 150974, "epoch": 1818} {"train_loss": -23.33460807800293, "global_step": 150975, "epoch": 1818} {"train_loss": -23.22559591086514, "global_step": 150976, "epoch": 1818, "val_loss": 6299659.0} {"train_loss": -22.65821647644043, "global_step": 150977, "epoch": 1819} {"train_loss": -21.9750919342041, "global_step": 150978, "epoch": 1819} {"train_loss": -22.435678482055664, "global_step": 150979, "epoch": 1819} {"train_loss": -22.966588973999023, "global_step": 150980, "epoch": 1819} {"train_loss": -21.6142578125, "global_step": 150981, "epoch": 1819} {"train_loss": -23.104724884033203, "global_step": 150982, "epoch": 1819} {"train_loss": -22.506772994995117, "global_step": 150983, "epoch": 1819} {"train_loss": -22.979726791381836, "global_step": 150984, "epoch": 1819} {"train_loss": -22.874130249023438, "global_step": 150985, "epoch": 1819} {"train_loss": -22.978147506713867, "global_step": 150986, "epoch": 1819} {"train_loss": -22.751720428466797, "global_step": 150987, "epoch": 1819} {"train_loss": -23.144071578979492, "global_step": 150988, "epoch": 1819} {"train_loss": -23.04740333557129, "global_step": 150989, "epoch": 1819} {"train_loss": -22.905153274536133, "global_step": 150990, "epoch": 1819} {"train_loss": -23.0159969329834, "global_step": 150991, "epoch": 1819} {"train_loss": -23.043188095092773, "global_step": 150992, "epoch": 1819} {"train_loss": -22.752286911010742, "global_step": 150993, "epoch": 1819} {"train_loss": -23.24424171447754, "global_step": 150994, "epoch": 1819} {"train_loss": -22.947662353515625, "global_step": 150995, "epoch": 1819} {"train_loss": -23.205108642578125, "global_step": 150996, "epoch": 1819} {"train_loss": -23.180912017822266, "global_step": 150997, "epoch": 1819} {"train_loss": -23.47161102294922, "global_step": 150998, "epoch": 1819} {"train_loss": -23.231225967407227, "global_step": 150999, "epoch": 1819} {"train_loss": -23.49000358581543, "global_step": 151000, "epoch": 1819} {"train_loss": -23.169010162353516, "global_step": 151001, "epoch": 1819} {"train_loss": -23.32452392578125, "global_step": 151002, "epoch": 1819} {"train_loss": -23.33966064453125, "global_step": 151003, "epoch": 1819} {"train_loss": -23.31952476501465, "global_step": 151004, "epoch": 1819} {"train_loss": -23.223215103149414, "global_step": 151005, "epoch": 1819} {"train_loss": -23.295785903930664, "global_step": 151006, "epoch": 1819} {"train_loss": -23.153173446655273, "global_step": 151007, "epoch": 1819} {"train_loss": -23.485824584960938, "global_step": 151008, "epoch": 1819} {"train_loss": -23.341550827026367, "global_step": 151009, "epoch": 1819} {"train_loss": -23.005456924438477, "global_step": 151010, "epoch": 1819} {"train_loss": -23.340246200561523, "global_step": 151011, "epoch": 1819} {"train_loss": -23.79007339477539, "global_step": 151012, "epoch": 1819} {"train_loss": -23.432262420654297, "global_step": 151013, "epoch": 1819} {"train_loss": -23.13669776916504, "global_step": 151014, "epoch": 1819} {"train_loss": -23.181154251098633, "global_step": 151015, "epoch": 1819} {"train_loss": -23.49654197692871, "global_step": 151016, "epoch": 1819} {"train_loss": -23.252883911132812, "global_step": 151017, "epoch": 1819} {"train_loss": -23.3231258392334, "global_step": 151018, "epoch": 1819} {"train_loss": -23.745559692382812, "global_step": 151019, "epoch": 1819} {"train_loss": -23.538862228393555, "global_step": 151020, "epoch": 1819} {"train_loss": -23.55623435974121, "global_step": 151021, "epoch": 1819} {"train_loss": -23.026803970336914, "global_step": 151022, "epoch": 1819} {"train_loss": -22.838830947875977, "global_step": 151023, "epoch": 1819} {"train_loss": -23.546154022216797, "global_step": 151024, "epoch": 1819} {"train_loss": -23.311325073242188, "global_step": 151025, "epoch": 1819} {"train_loss": -23.38103675842285, "global_step": 151026, "epoch": 1819} {"train_loss": -23.11652183532715, "global_step": 151027, "epoch": 1819} {"train_loss": -23.131868362426758, "global_step": 151028, "epoch": 1819} {"train_loss": -23.329694747924805, "global_step": 151029, "epoch": 1819} {"train_loss": -23.596914291381836, "global_step": 151030, "epoch": 1819} {"train_loss": -23.037240982055664, "global_step": 151031, "epoch": 1819} {"train_loss": -23.363697052001953, "global_step": 151032, "epoch": 1819} {"train_loss": -23.57601547241211, "global_step": 151033, "epoch": 1819} {"train_loss": -23.530790328979492, "global_step": 151034, "epoch": 1819} {"train_loss": -23.58412742614746, "global_step": 151035, "epoch": 1819} {"train_loss": -23.272565841674805, "global_step": 151036, "epoch": 1819} {"train_loss": -23.278846740722656, "global_step": 151037, "epoch": 1819} {"train_loss": -23.358442306518555, "global_step": 151038, "epoch": 1819} {"train_loss": -23.26128578186035, "global_step": 151039, "epoch": 1819} {"train_loss": -23.392642974853516, "global_step": 151040, "epoch": 1819} {"train_loss": -23.356794357299805, "global_step": 151041, "epoch": 1819} {"train_loss": -23.285009384155273, "global_step": 151042, "epoch": 1819} {"train_loss": -23.227079391479492, "global_step": 151043, "epoch": 1819} {"train_loss": -22.934967041015625, "global_step": 151044, "epoch": 1819} {"train_loss": -23.329687118530273, "global_step": 151045, "epoch": 1819} {"train_loss": -22.99005126953125, "global_step": 151046, "epoch": 1819} {"train_loss": -23.28487777709961, "global_step": 151047, "epoch": 1819} {"train_loss": -23.734066009521484, "global_step": 151048, "epoch": 1819} {"train_loss": -23.36904525756836, "global_step": 151049, "epoch": 1819} {"train_loss": -23.2623291015625, "global_step": 151050, "epoch": 1819} {"train_loss": -23.31460952758789, "global_step": 151051, "epoch": 1819} {"train_loss": -23.395648956298828, "global_step": 151052, "epoch": 1819} {"train_loss": -23.203548431396484, "global_step": 151053, "epoch": 1819} {"train_loss": -23.31473731994629, "global_step": 151054, "epoch": 1819} {"train_loss": -23.405590057373047, "global_step": 151055, "epoch": 1819} {"train_loss": -23.355199813842773, "global_step": 151056, "epoch": 1819} {"train_loss": -23.403717041015625, "global_step": 151057, "epoch": 1819} {"train_loss": -23.4930477142334, "global_step": 151058, "epoch": 1819} {"train_loss": -23.21332113426852, "global_step": 151059, "epoch": 1819, "val_loss": 6287048.0} {"train_loss": -22.775638580322266, "global_step": 151060, "epoch": 1820} {"train_loss": -22.98407554626465, "global_step": 151061, "epoch": 1820} {"train_loss": -22.4007568359375, "global_step": 151062, "epoch": 1820} {"train_loss": -23.019672393798828, "global_step": 151063, "epoch": 1820} {"train_loss": -22.79218101501465, "global_step": 151064, "epoch": 1820} {"train_loss": -22.89674949645996, "global_step": 151065, "epoch": 1820} {"train_loss": -23.392629623413086, "global_step": 151066, "epoch": 1820} {"train_loss": -23.08009147644043, "global_step": 151067, "epoch": 1820} {"train_loss": -23.095600128173828, "global_step": 151068, "epoch": 1820} {"train_loss": -22.96741485595703, "global_step": 151069, "epoch": 1820} {"train_loss": -23.0383243560791, "global_step": 151070, "epoch": 1820} {"train_loss": -22.979001998901367, "global_step": 151071, "epoch": 1820} {"train_loss": -23.03925132751465, "global_step": 151072, "epoch": 1820} {"train_loss": -22.706602096557617, "global_step": 151073, "epoch": 1820} {"train_loss": -23.125329971313477, "global_step": 151074, "epoch": 1820} {"train_loss": -23.328720092773438, "global_step": 151075, "epoch": 1820} {"train_loss": -22.79303741455078, "global_step": 151076, "epoch": 1820} {"train_loss": -23.44207191467285, "global_step": 151077, "epoch": 1820} {"train_loss": -22.952287673950195, "global_step": 151078, "epoch": 1820} {"train_loss": -23.328794479370117, "global_step": 151079, "epoch": 1820} {"train_loss": -23.078096389770508, "global_step": 151080, "epoch": 1820} {"train_loss": -22.624134063720703, "global_step": 151081, "epoch": 1820} {"train_loss": -23.064884185791016, "global_step": 151082, "epoch": 1820} {"train_loss": -23.01579475402832, "global_step": 151083, "epoch": 1820} {"train_loss": -23.432016372680664, "global_step": 151084, "epoch": 1820} {"train_loss": -22.83741569519043, "global_step": 151085, "epoch": 1820} {"train_loss": -23.181577682495117, "global_step": 151086, "epoch": 1820} {"train_loss": -23.488731384277344, "global_step": 151087, "epoch": 1820} {"train_loss": -23.241971969604492, "global_step": 151088, "epoch": 1820} {"train_loss": -23.58623504638672, "global_step": 151089, "epoch": 1820} {"train_loss": -23.166629791259766, "global_step": 151090, "epoch": 1820} {"train_loss": -23.466949462890625, "global_step": 151091, "epoch": 1820} {"train_loss": -23.037567138671875, "global_step": 151092, "epoch": 1820} {"train_loss": -22.917593002319336, "global_step": 151093, "epoch": 1820} {"train_loss": -22.95088005065918, "global_step": 151094, "epoch": 1820} {"train_loss": -23.02276611328125, "global_step": 151095, "epoch": 1820} {"train_loss": -22.9625301361084, "global_step": 151096, "epoch": 1820} {"train_loss": -23.263235092163086, "global_step": 151097, "epoch": 1820} {"train_loss": -23.296283721923828, "global_step": 151098, "epoch": 1820} {"train_loss": -23.450611114501953, "global_step": 151099, "epoch": 1820} {"train_loss": -23.01766586303711, "global_step": 151100, "epoch": 1820} {"train_loss": -22.870113372802734, "global_step": 151101, "epoch": 1820} {"train_loss": -23.088972091674805, "global_step": 151102, "epoch": 1820} {"train_loss": -23.196796417236328, "global_step": 151103, "epoch": 1820} {"train_loss": -23.215362548828125, "global_step": 151104, "epoch": 1820} {"train_loss": -23.128530502319336, "global_step": 151105, "epoch": 1820} {"train_loss": -23.2860050201416, "global_step": 151106, "epoch": 1820} {"train_loss": -22.98649024963379, "global_step": 151107, "epoch": 1820} {"train_loss": -23.253446578979492, "global_step": 151108, "epoch": 1820} {"train_loss": -23.097780227661133, "global_step": 151109, "epoch": 1820} {"train_loss": -23.281570434570312, "global_step": 151110, "epoch": 1820} {"train_loss": -23.460725784301758, "global_step": 151111, "epoch": 1820} {"train_loss": -22.92886734008789, "global_step": 151112, "epoch": 1820} {"train_loss": -23.886316299438477, "global_step": 151113, "epoch": 1820} {"train_loss": -23.3505802154541, "global_step": 151114, "epoch": 1820} {"train_loss": -23.271549224853516, "global_step": 151115, "epoch": 1820} {"train_loss": -23.02284812927246, "global_step": 151116, "epoch": 1820} {"train_loss": -23.317276000976562, "global_step": 151117, "epoch": 1820} {"train_loss": -23.165082931518555, "global_step": 151118, "epoch": 1820} {"train_loss": -23.507400512695312, "global_step": 151119, "epoch": 1820} {"train_loss": -23.541696548461914, "global_step": 151120, "epoch": 1820} {"train_loss": -23.617265701293945, "global_step": 151121, "epoch": 1820} {"train_loss": -23.04611587524414, "global_step": 151122, "epoch": 1820} {"train_loss": -23.52107810974121, "global_step": 151123, "epoch": 1820} {"train_loss": -23.184293746948242, "global_step": 151124, "epoch": 1820} {"train_loss": -23.510663986206055, "global_step": 151125, "epoch": 1820} {"train_loss": -23.741239547729492, "global_step": 151126, "epoch": 1820} {"train_loss": -23.710607528686523, "global_step": 151127, "epoch": 1820} {"train_loss": -23.53314781188965, "global_step": 151128, "epoch": 1820} {"train_loss": -23.61844825744629, "global_step": 151129, "epoch": 1820} {"train_loss": -23.365264892578125, "global_step": 151130, "epoch": 1820} {"train_loss": -22.994707107543945, "global_step": 151131, "epoch": 1820} {"train_loss": -23.72991371154785, "global_step": 151132, "epoch": 1820} {"train_loss": -23.29610824584961, "global_step": 151133, "epoch": 1820} {"train_loss": -23.224197387695312, "global_step": 151134, "epoch": 1820} {"train_loss": -23.07699966430664, "global_step": 151135, "epoch": 1820} {"train_loss": -23.572372436523438, "global_step": 151136, "epoch": 1820} {"train_loss": -23.47798728942871, "global_step": 151137, "epoch": 1820} {"train_loss": -23.357458114624023, "global_step": 151138, "epoch": 1820} {"train_loss": -23.19121551513672, "global_step": 151139, "epoch": 1820} {"train_loss": -22.82843780517578, "global_step": 151140, "epoch": 1820} {"train_loss": -23.22199821472168, "global_step": 151141, "epoch": 1820} {"train_loss": -23.178766020809313, "global_step": 151142, "epoch": 1820, "val_loss": 6497550.0} {"train_loss": -20.000654220581055, "global_step": 151143, "epoch": 1821} {"train_loss": -22.270105361938477, "global_step": 151144, "epoch": 1821} {"train_loss": -20.332914352416992, "global_step": 151145, "epoch": 1821} {"train_loss": -21.65274429321289, "global_step": 151146, "epoch": 1821} {"train_loss": -21.28949546813965, "global_step": 151147, "epoch": 1821} {"train_loss": -21.452932357788086, "global_step": 151148, "epoch": 1821} {"train_loss": -22.156652450561523, "global_step": 151149, "epoch": 1821} {"train_loss": -21.75425910949707, "global_step": 151150, "epoch": 1821} {"train_loss": -22.344482421875, "global_step": 151151, "epoch": 1821} {"train_loss": -22.1812801361084, "global_step": 151152, "epoch": 1821} {"train_loss": -22.2130126953125, "global_step": 151153, "epoch": 1821} {"train_loss": -22.291305541992188, "global_step": 151154, "epoch": 1821} {"train_loss": -21.865659713745117, "global_step": 151155, "epoch": 1821} {"train_loss": -22.642362594604492, "global_step": 151156, "epoch": 1821} {"train_loss": -22.278223037719727, "global_step": 151157, "epoch": 1821} {"train_loss": -22.382007598876953, "global_step": 151158, "epoch": 1821} {"train_loss": -22.249494552612305, "global_step": 151159, "epoch": 1821} {"train_loss": -22.406423568725586, "global_step": 151160, "epoch": 1821} {"train_loss": -22.13764762878418, "global_step": 151161, "epoch": 1821} {"train_loss": -22.43894386291504, "global_step": 151162, "epoch": 1821} {"train_loss": -22.32110023498535, "global_step": 151163, "epoch": 1821} {"train_loss": -22.32187843322754, "global_step": 151164, "epoch": 1821} {"train_loss": -22.715694427490234, "global_step": 151165, "epoch": 1821} {"train_loss": -22.20318603515625, "global_step": 151166, "epoch": 1821} {"train_loss": -22.9294490814209, "global_step": 151167, "epoch": 1821} {"train_loss": -22.38595962524414, "global_step": 151168, "epoch": 1821} {"train_loss": -22.817800521850586, "global_step": 151169, "epoch": 1821} {"train_loss": -22.79144859313965, "global_step": 151170, "epoch": 1821} {"train_loss": -22.478628158569336, "global_step": 151171, "epoch": 1821} {"train_loss": -22.993383407592773, "global_step": 151172, "epoch": 1821} {"train_loss": -22.774120330810547, "global_step": 151173, "epoch": 1821} {"train_loss": -22.8579044342041, "global_step": 151174, "epoch": 1821} {"train_loss": -23.035388946533203, "global_step": 151175, "epoch": 1821} {"train_loss": -22.79742431640625, "global_step": 151176, "epoch": 1821} {"train_loss": -23.052955627441406, "global_step": 151177, "epoch": 1821} {"train_loss": -23.30687713623047, "global_step": 151178, "epoch": 1821} {"train_loss": -23.163644790649414, "global_step": 151179, "epoch": 1821} {"train_loss": -23.287363052368164, "global_step": 151180, "epoch": 1821} {"train_loss": -23.22623634338379, "global_step": 151181, "epoch": 1821} {"train_loss": -23.014053344726562, "global_step": 151182, "epoch": 1821} {"train_loss": -23.47517204284668, "global_step": 151183, "epoch": 1821} {"train_loss": -23.03845977783203, "global_step": 151184, "epoch": 1821} {"train_loss": -23.065595626831055, "global_step": 151185, "epoch": 1821} {"train_loss": -23.3292293548584, "global_step": 151186, "epoch": 1821} {"train_loss": -23.331310272216797, "global_step": 151187, "epoch": 1821} {"train_loss": -23.70369529724121, "global_step": 151188, "epoch": 1821} {"train_loss": -23.478055953979492, "global_step": 151189, "epoch": 1821} {"train_loss": -23.31630516052246, "global_step": 151190, "epoch": 1821} {"train_loss": -23.130434036254883, "global_step": 151191, "epoch": 1821} {"train_loss": -23.299657821655273, "global_step": 151192, "epoch": 1821} {"train_loss": -23.170148849487305, "global_step": 151193, "epoch": 1821} {"train_loss": -23.100746154785156, "global_step": 151194, "epoch": 1821} {"train_loss": -23.1129093170166, "global_step": 151195, "epoch": 1821} {"train_loss": -23.314199447631836, "global_step": 151196, "epoch": 1821} {"train_loss": -23.027677536010742, "global_step": 151197, "epoch": 1821} {"train_loss": -23.652700424194336, "global_step": 151198, "epoch": 1821} {"train_loss": -23.097524642944336, "global_step": 151199, "epoch": 1821} {"train_loss": -23.24112319946289, "global_step": 151200, "epoch": 1821} {"train_loss": -23.58839988708496, "global_step": 151201, "epoch": 1821} {"train_loss": -23.16021728515625, "global_step": 151202, "epoch": 1821} {"train_loss": -23.40082359313965, "global_step": 151203, "epoch": 1821} {"train_loss": -23.163715362548828, "global_step": 151204, "epoch": 1821} {"train_loss": -23.211101531982422, "global_step": 151205, "epoch": 1821} {"train_loss": -22.959020614624023, "global_step": 151206, "epoch": 1821} {"train_loss": -23.496963500976562, "global_step": 151207, "epoch": 1821} {"train_loss": -23.22666358947754, "global_step": 151208, "epoch": 1821} {"train_loss": -23.305753707885742, "global_step": 151209, "epoch": 1821} {"train_loss": -23.56618309020996, "global_step": 151210, "epoch": 1821} {"train_loss": -23.220457077026367, "global_step": 151211, "epoch": 1821} {"train_loss": -23.789663314819336, "global_step": 151212, "epoch": 1821} {"train_loss": -22.955307006835938, "global_step": 151213, "epoch": 1821} {"train_loss": -23.582590103149414, "global_step": 151214, "epoch": 1821} {"train_loss": -23.34401512145996, "global_step": 151215, "epoch": 1821} {"train_loss": -23.625171661376953, "global_step": 151216, "epoch": 1821} {"train_loss": -23.449464797973633, "global_step": 151217, "epoch": 1821} {"train_loss": -23.48615264892578, "global_step": 151218, "epoch": 1821} {"train_loss": -23.40303611755371, "global_step": 151219, "epoch": 1821} {"train_loss": -23.47963523864746, "global_step": 151220, "epoch": 1821} {"train_loss": -23.45654296875, "global_step": 151221, "epoch": 1821} {"train_loss": -23.506383895874023, "global_step": 151222, "epoch": 1821} {"train_loss": -23.87184715270996, "global_step": 151223, "epoch": 1821} {"train_loss": -23.199440002441406, "global_step": 151224, "epoch": 1821} {"train_loss": -22.883165796119048, "global_step": 151225, "epoch": 1821, "val_loss": 6278081.0} {"train_loss": -22.68153953552246, "global_step": 151226, "epoch": 1822} {"train_loss": -22.44710350036621, "global_step": 151227, "epoch": 1822} {"train_loss": -23.217039108276367, "global_step": 151228, "epoch": 1822} {"train_loss": -22.90187644958496, "global_step": 151229, "epoch": 1822} {"train_loss": -22.588836669921875, "global_step": 151230, "epoch": 1822} {"train_loss": -22.4566650390625, "global_step": 151231, "epoch": 1822} {"train_loss": -23.224332809448242, "global_step": 151232, "epoch": 1822} {"train_loss": -23.094022750854492, "global_step": 151233, "epoch": 1822} {"train_loss": -23.1146183013916, "global_step": 151234, "epoch": 1822} {"train_loss": -23.137527465820312, "global_step": 151235, "epoch": 1822} {"train_loss": -23.233936309814453, "global_step": 151236, "epoch": 1822} {"train_loss": -23.58024024963379, "global_step": 151237, "epoch": 1822} {"train_loss": -23.117883682250977, "global_step": 151238, "epoch": 1822} {"train_loss": -23.425933837890625, "global_step": 151239, "epoch": 1822} {"train_loss": -23.223386764526367, "global_step": 151240, "epoch": 1822} {"train_loss": -23.316247940063477, "global_step": 151241, "epoch": 1822} {"train_loss": -23.06561851501465, "global_step": 151242, "epoch": 1822} {"train_loss": -23.343460083007812, "global_step": 151243, "epoch": 1822} {"train_loss": -23.561893463134766, "global_step": 151244, "epoch": 1822} {"train_loss": -22.979909896850586, "global_step": 151245, "epoch": 1822} {"train_loss": -23.04952049255371, "global_step": 151246, "epoch": 1822} {"train_loss": -23.52762222290039, "global_step": 151247, "epoch": 1822} {"train_loss": -23.401113510131836, "global_step": 151248, "epoch": 1822} {"train_loss": -23.16236686706543, "global_step": 151249, "epoch": 1822} {"train_loss": -23.13472557067871, "global_step": 151250, "epoch": 1822} {"train_loss": -22.931760787963867, "global_step": 151251, "epoch": 1822} {"train_loss": -22.894962310791016, "global_step": 151252, "epoch": 1822} {"train_loss": -23.385608673095703, "global_step": 151253, "epoch": 1822} {"train_loss": -23.53561782836914, "global_step": 151254, "epoch": 1822} {"train_loss": -23.134748458862305, "global_step": 151255, "epoch": 1822} {"train_loss": -23.19841766357422, "global_step": 151256, "epoch": 1822} {"train_loss": -23.321653366088867, "global_step": 151257, "epoch": 1822} {"train_loss": -23.069379806518555, "global_step": 151258, "epoch": 1822} {"train_loss": -23.53598403930664, "global_step": 151259, "epoch": 1822} {"train_loss": -23.176115036010742, "global_step": 151260, "epoch": 1822} {"train_loss": -23.570728302001953, "global_step": 151261, "epoch": 1822} {"train_loss": -23.412338256835938, "global_step": 151262, "epoch": 1822} {"train_loss": -23.397863388061523, "global_step": 151263, "epoch": 1822} {"train_loss": -23.234272003173828, "global_step": 151264, "epoch": 1822} {"train_loss": -22.916501998901367, "global_step": 151265, "epoch": 1822} {"train_loss": -23.61513328552246, "global_step": 151266, "epoch": 1822} {"train_loss": -23.310428619384766, "global_step": 151267, "epoch": 1822} {"train_loss": -23.4732723236084, "global_step": 151268, "epoch": 1822} {"train_loss": -23.110916137695312, "global_step": 151269, "epoch": 1822} {"train_loss": -23.478845596313477, "global_step": 151270, "epoch": 1822} {"train_loss": -23.400833129882812, "global_step": 151271, "epoch": 1822} {"train_loss": -23.563596725463867, "global_step": 151272, "epoch": 1822} {"train_loss": -23.450210571289062, "global_step": 151273, "epoch": 1822} {"train_loss": -22.819978713989258, "global_step": 151274, "epoch": 1822} {"train_loss": -23.55341148376465, "global_step": 151275, "epoch": 1822} {"train_loss": -23.405838012695312, "global_step": 151276, "epoch": 1822} {"train_loss": -23.269424438476562, "global_step": 151277, "epoch": 1822} {"train_loss": -23.602569580078125, "global_step": 151278, "epoch": 1822} {"train_loss": -23.22273826599121, "global_step": 151279, "epoch": 1822} {"train_loss": -23.28470230102539, "global_step": 151280, "epoch": 1822} {"train_loss": -23.56777000427246, "global_step": 151281, "epoch": 1822} {"train_loss": -23.19400978088379, "global_step": 151282, "epoch": 1822} {"train_loss": -23.4522762298584, "global_step": 151283, "epoch": 1822} {"train_loss": -22.644317626953125, "global_step": 151284, "epoch": 1822} {"train_loss": -23.179807662963867, "global_step": 151285, "epoch": 1822} {"train_loss": -22.767663955688477, "global_step": 151286, "epoch": 1822} {"train_loss": -23.04578971862793, "global_step": 151287, "epoch": 1822} {"train_loss": -22.874399185180664, "global_step": 151288, "epoch": 1822} {"train_loss": -23.366222381591797, "global_step": 151289, "epoch": 1822} {"train_loss": -23.18631362915039, "global_step": 151290, "epoch": 1822} {"train_loss": -23.31123161315918, "global_step": 151291, "epoch": 1822} {"train_loss": -23.28981590270996, "global_step": 151292, "epoch": 1822} {"train_loss": -23.1370792388916, "global_step": 151293, "epoch": 1822} {"train_loss": -23.155691146850586, "global_step": 151294, "epoch": 1822} {"train_loss": -23.484291076660156, "global_step": 151295, "epoch": 1822} {"train_loss": -22.905080795288086, "global_step": 151296, "epoch": 1822} {"train_loss": -23.058279037475586, "global_step": 151297, "epoch": 1822} {"train_loss": -23.604873657226562, "global_step": 151298, "epoch": 1822} {"train_loss": -23.08083152770996, "global_step": 151299, "epoch": 1822} {"train_loss": -23.528135299682617, "global_step": 151300, "epoch": 1822} {"train_loss": -23.131223678588867, "global_step": 151301, "epoch": 1822} {"train_loss": -23.376216888427734, "global_step": 151302, "epoch": 1822} {"train_loss": -23.2568416595459, "global_step": 151303, "epoch": 1822} {"train_loss": -23.360641479492188, "global_step": 151304, "epoch": 1822} {"train_loss": -23.255821228027344, "global_step": 151305, "epoch": 1822} {"train_loss": -23.322261810302734, "global_step": 151306, "epoch": 1822} {"train_loss": -23.489246368408203, "global_step": 151307, "epoch": 1822} {"train_loss": -23.217143966490966, "global_step": 151308, "epoch": 1822, "val_loss": 6239596.0} {"train_loss": -22.885446548461914, "global_step": 151309, "epoch": 1823} {"train_loss": -22.996017456054688, "global_step": 151310, "epoch": 1823} {"train_loss": -23.14018440246582, "global_step": 151311, "epoch": 1823} {"train_loss": -22.387020111083984, "global_step": 151312, "epoch": 1823} {"train_loss": -23.1505184173584, "global_step": 151313, "epoch": 1823} {"train_loss": -23.53106117248535, "global_step": 151314, "epoch": 1823} {"train_loss": -23.164640426635742, "global_step": 151315, "epoch": 1823} {"train_loss": -23.223350524902344, "global_step": 151316, "epoch": 1823} {"train_loss": -23.136859893798828, "global_step": 151317, "epoch": 1823} {"train_loss": -23.244230270385742, "global_step": 151318, "epoch": 1823} {"train_loss": -23.383649826049805, "global_step": 151319, "epoch": 1823} {"train_loss": -22.960901260375977, "global_step": 151320, "epoch": 1823} {"train_loss": -23.25789451599121, "global_step": 151321, "epoch": 1823} {"train_loss": -23.239337921142578, "global_step": 151322, "epoch": 1823} {"train_loss": -22.897157669067383, "global_step": 151323, "epoch": 1823} {"train_loss": -23.332258224487305, "global_step": 151324, "epoch": 1823} {"train_loss": -23.519054412841797, "global_step": 151325, "epoch": 1823} {"train_loss": -23.486730575561523, "global_step": 151326, "epoch": 1823} {"train_loss": -23.18574333190918, "global_step": 151327, "epoch": 1823} {"train_loss": -22.968002319335938, "global_step": 151328, "epoch": 1823} {"train_loss": -23.220426559448242, "global_step": 151329, "epoch": 1823} {"train_loss": -23.305158615112305, "global_step": 151330, "epoch": 1823} {"train_loss": -23.201045989990234, "global_step": 151331, "epoch": 1823} {"train_loss": -23.01416015625, "global_step": 151332, "epoch": 1823} {"train_loss": -23.343786239624023, "global_step": 151333, "epoch": 1823} {"train_loss": -23.425273895263672, "global_step": 151334, "epoch": 1823} {"train_loss": -23.23784828186035, "global_step": 151335, "epoch": 1823} {"train_loss": -23.299808502197266, "global_step": 151336, "epoch": 1823} {"train_loss": -23.07053565979004, "global_step": 151337, "epoch": 1823} {"train_loss": -23.302122116088867, "global_step": 151338, "epoch": 1823} {"train_loss": -23.274871826171875, "global_step": 151339, "epoch": 1823} {"train_loss": -23.24081802368164, "global_step": 151340, "epoch": 1823} {"train_loss": -23.593717575073242, "global_step": 151341, "epoch": 1823} {"train_loss": -23.231494903564453, "global_step": 151342, "epoch": 1823} {"train_loss": -23.638961791992188, "global_step": 151343, "epoch": 1823} {"train_loss": -23.247785568237305, "global_step": 151344, "epoch": 1823} {"train_loss": -22.86920166015625, "global_step": 151345, "epoch": 1823} {"train_loss": -23.42396354675293, "global_step": 151346, "epoch": 1823} {"train_loss": -23.5554256439209, "global_step": 151347, "epoch": 1823} {"train_loss": -23.52876091003418, "global_step": 151348, "epoch": 1823} {"train_loss": -23.29520606994629, "global_step": 151349, "epoch": 1823} {"train_loss": -23.454376220703125, "global_step": 151350, "epoch": 1823} {"train_loss": -23.689374923706055, "global_step": 151351, "epoch": 1823} {"train_loss": -23.077646255493164, "global_step": 151352, "epoch": 1823} {"train_loss": -23.418445587158203, "global_step": 151353, "epoch": 1823} {"train_loss": -23.34712791442871, "global_step": 151354, "epoch": 1823} {"train_loss": -23.470996856689453, "global_step": 151355, "epoch": 1823} {"train_loss": -23.46238136291504, "global_step": 151356, "epoch": 1823} {"train_loss": -23.055335998535156, "global_step": 151357, "epoch": 1823} {"train_loss": -23.318876266479492, "global_step": 151358, "epoch": 1823} {"train_loss": -23.23137855529785, "global_step": 151359, "epoch": 1823} {"train_loss": -23.14286231994629, "global_step": 151360, "epoch": 1823} {"train_loss": -23.553686141967773, "global_step": 151361, "epoch": 1823} {"train_loss": -23.48650550842285, "global_step": 151362, "epoch": 1823} {"train_loss": -23.263347625732422, "global_step": 151363, "epoch": 1823} {"train_loss": -23.380714416503906, "global_step": 151364, "epoch": 1823} {"train_loss": -23.201068878173828, "global_step": 151365, "epoch": 1823} {"train_loss": -23.535537719726562, "global_step": 151366, "epoch": 1823} {"train_loss": -23.70585060119629, "global_step": 151367, "epoch": 1823} {"train_loss": -23.360515594482422, "global_step": 151368, "epoch": 1823} {"train_loss": -23.3773250579834, "global_step": 151369, "epoch": 1823} {"train_loss": -23.335371017456055, "global_step": 151370, "epoch": 1823} {"train_loss": -23.533910751342773, "global_step": 151371, "epoch": 1823} {"train_loss": -23.2686710357666, "global_step": 151372, "epoch": 1823} {"train_loss": -23.521286010742188, "global_step": 151373, "epoch": 1823} {"train_loss": -23.48748779296875, "global_step": 151374, "epoch": 1823} {"train_loss": -23.543733596801758, "global_step": 151375, "epoch": 1823} {"train_loss": -23.457977294921875, "global_step": 151376, "epoch": 1823} {"train_loss": -23.517932891845703, "global_step": 151377, "epoch": 1823} {"train_loss": -23.539339065551758, "global_step": 151378, "epoch": 1823} {"train_loss": -23.515165328979492, "global_step": 151379, "epoch": 1823} {"train_loss": -23.440073013305664, "global_step": 151380, "epoch": 1823} {"train_loss": -23.658279418945312, "global_step": 151381, "epoch": 1823} {"train_loss": -23.5511531829834, "global_step": 151382, "epoch": 1823} {"train_loss": -23.31170082092285, "global_step": 151383, "epoch": 1823} {"train_loss": -23.468368530273438, "global_step": 151384, "epoch": 1823} {"train_loss": -23.29378318786621, "global_step": 151385, "epoch": 1823} {"train_loss": -23.519033432006836, "global_step": 151386, "epoch": 1823} {"train_loss": -23.82037925720215, "global_step": 151387, "epoch": 1823} {"train_loss": -23.159177780151367, "global_step": 151388, "epoch": 1823} {"train_loss": -23.374204635620117, "global_step": 151389, "epoch": 1823} {"train_loss": -23.338293075561523, "global_step": 151390, "epoch": 1823} {"train_loss": -23.33805206023067, "global_step": 151391, "epoch": 1823, "val_loss": 6358673.0} {"train_loss": -22.367328643798828, "global_step": 151392, "epoch": 1824} {"train_loss": -23.04714012145996, "global_step": 151393, "epoch": 1824} {"train_loss": -22.60137367248535, "global_step": 151394, "epoch": 1824} {"train_loss": -22.266969680786133, "global_step": 151395, "epoch": 1824} {"train_loss": -22.226179122924805, "global_step": 151396, "epoch": 1824} {"train_loss": -22.685983657836914, "global_step": 151397, "epoch": 1824} {"train_loss": -22.718769073486328, "global_step": 151398, "epoch": 1824} {"train_loss": -23.102258682250977, "global_step": 151399, "epoch": 1824} {"train_loss": -23.28075408935547, "global_step": 151400, "epoch": 1824} {"train_loss": -22.589588165283203, "global_step": 151401, "epoch": 1824} {"train_loss": -22.81097984313965, "global_step": 151402, "epoch": 1824} {"train_loss": -23.504291534423828, "global_step": 151403, "epoch": 1824} {"train_loss": -23.33641815185547, "global_step": 151404, "epoch": 1824} {"train_loss": -22.909950256347656, "global_step": 151405, "epoch": 1824} {"train_loss": -22.740955352783203, "global_step": 151406, "epoch": 1824} {"train_loss": -22.94173240661621, "global_step": 151407, "epoch": 1824} {"train_loss": -23.388235092163086, "global_step": 151408, "epoch": 1824} {"train_loss": -22.93234634399414, "global_step": 151409, "epoch": 1824} {"train_loss": -23.184558868408203, "global_step": 151410, "epoch": 1824} {"train_loss": -23.04204559326172, "global_step": 151411, "epoch": 1824} {"train_loss": -23.214780807495117, "global_step": 151412, "epoch": 1824} {"train_loss": -23.116506576538086, "global_step": 151413, "epoch": 1824} {"train_loss": -23.22617530822754, "global_step": 151414, "epoch": 1824} {"train_loss": -22.913467407226562, "global_step": 151415, "epoch": 1824} {"train_loss": -23.258378982543945, "global_step": 151416, "epoch": 1824} {"train_loss": -23.41611099243164, "global_step": 151417, "epoch": 1824} {"train_loss": -23.239225387573242, "global_step": 151418, "epoch": 1824} {"train_loss": -23.049402236938477, "global_step": 151419, "epoch": 1824} {"train_loss": -23.107349395751953, "global_step": 151420, "epoch": 1824} {"train_loss": -22.951465606689453, "global_step": 151421, "epoch": 1824} {"train_loss": -23.046127319335938, "global_step": 151422, "epoch": 1824} {"train_loss": -23.483325958251953, "global_step": 151423, "epoch": 1824} {"train_loss": -23.246511459350586, "global_step": 151424, "epoch": 1824} {"train_loss": -23.14031982421875, "global_step": 151425, "epoch": 1824} {"train_loss": -23.566190719604492, "global_step": 151426, "epoch": 1824} {"train_loss": -23.417516708374023, "global_step": 151427, "epoch": 1824} {"train_loss": -23.557035446166992, "global_step": 151428, "epoch": 1824} {"train_loss": -23.369409561157227, "global_step": 151429, "epoch": 1824} {"train_loss": -23.424341201782227, "global_step": 151430, "epoch": 1824} {"train_loss": -22.830930709838867, "global_step": 151431, "epoch": 1824} {"train_loss": -23.181509017944336, "global_step": 151432, "epoch": 1824} {"train_loss": -23.707767486572266, "global_step": 151433, "epoch": 1824} {"train_loss": -23.243549346923828, "global_step": 151434, "epoch": 1824} {"train_loss": -22.940017700195312, "global_step": 151435, "epoch": 1824} {"train_loss": -23.20466423034668, "global_step": 151436, "epoch": 1824} {"train_loss": -23.246488571166992, "global_step": 151437, "epoch": 1824} {"train_loss": -23.37138557434082, "global_step": 151438, "epoch": 1824} {"train_loss": -23.16065788269043, "global_step": 151439, "epoch": 1824} {"train_loss": -22.994638442993164, "global_step": 151440, "epoch": 1824} {"train_loss": -23.086584091186523, "global_step": 151441, "epoch": 1824} {"train_loss": -23.148937225341797, "global_step": 151442, "epoch": 1824} {"train_loss": -23.206396102905273, "global_step": 151443, "epoch": 1824} {"train_loss": -23.071805953979492, "global_step": 151444, "epoch": 1824} {"train_loss": -23.232084274291992, "global_step": 151445, "epoch": 1824} {"train_loss": -23.33662223815918, "global_step": 151446, "epoch": 1824} {"train_loss": -23.273941040039062, "global_step": 151447, "epoch": 1824} {"train_loss": -23.54847526550293, "global_step": 151448, "epoch": 1824} {"train_loss": -23.214574813842773, "global_step": 151449, "epoch": 1824} {"train_loss": -23.257888793945312, "global_step": 151450, "epoch": 1824} {"train_loss": -22.955663681030273, "global_step": 151451, "epoch": 1824} {"train_loss": -23.532747268676758, "global_step": 151452, "epoch": 1824} {"train_loss": -23.1787109375, "global_step": 151453, "epoch": 1824} {"train_loss": -23.517942428588867, "global_step": 151454, "epoch": 1824} {"train_loss": -23.311256408691406, "global_step": 151455, "epoch": 1824} {"train_loss": -23.297632217407227, "global_step": 151456, "epoch": 1824} {"train_loss": -23.630300521850586, "global_step": 151457, "epoch": 1824} {"train_loss": -23.314939498901367, "global_step": 151458, "epoch": 1824} {"train_loss": -23.5123291015625, "global_step": 151459, "epoch": 1824} {"train_loss": -23.76719093322754, "global_step": 151460, "epoch": 1824} {"train_loss": -23.531858444213867, "global_step": 151461, "epoch": 1824} {"train_loss": -22.95587158203125, "global_step": 151462, "epoch": 1824} {"train_loss": -23.235031127929688, "global_step": 151463, "epoch": 1824} {"train_loss": -23.783750534057617, "global_step": 151464, "epoch": 1824} {"train_loss": -23.33418846130371, "global_step": 151465, "epoch": 1824} {"train_loss": -23.40420913696289, "global_step": 151466, "epoch": 1824} {"train_loss": -23.693309783935547, "global_step": 151467, "epoch": 1824} {"train_loss": -23.24831199645996, "global_step": 151468, "epoch": 1824} {"train_loss": -23.239099502563477, "global_step": 151469, "epoch": 1824} {"train_loss": -23.0941219329834, "global_step": 151470, "epoch": 1824} {"train_loss": -23.021963119506836, "global_step": 151471, "epoch": 1824} {"train_loss": -23.081029891967773, "global_step": 151472, "epoch": 1824} {"train_loss": -23.351654052734375, "global_step": 151473, "epoch": 1824} {"train_loss": -23.184720326618976, "global_step": 151474, "epoch": 1824, "val_loss": 6427723.0} {"train_loss": -22.664838790893555, "global_step": 151475, "epoch": 1825} {"train_loss": -22.950056076049805, "global_step": 151476, "epoch": 1825} {"train_loss": -23.114091873168945, "global_step": 151477, "epoch": 1825} {"train_loss": -22.964580535888672, "global_step": 151478, "epoch": 1825} {"train_loss": -22.597990036010742, "global_step": 151479, "epoch": 1825} {"train_loss": -23.226533889770508, "global_step": 151480, "epoch": 1825} {"train_loss": -23.17967987060547, "global_step": 151481, "epoch": 1825} {"train_loss": -23.037155151367188, "global_step": 151482, "epoch": 1825} {"train_loss": -22.782743453979492, "global_step": 151483, "epoch": 1825} {"train_loss": -23.280393600463867, "global_step": 151484, "epoch": 1825} {"train_loss": -23.03314781188965, "global_step": 151485, "epoch": 1825} {"train_loss": -22.925485610961914, "global_step": 151486, "epoch": 1825} {"train_loss": -23.321332931518555, "global_step": 151487, "epoch": 1825} {"train_loss": -23.293500900268555, "global_step": 151488, "epoch": 1825} {"train_loss": -23.392141342163086, "global_step": 151489, "epoch": 1825} {"train_loss": -23.01259994506836, "global_step": 151490, "epoch": 1825} {"train_loss": -23.174551010131836, "global_step": 151491, "epoch": 1825} {"train_loss": -23.1851863861084, "global_step": 151492, "epoch": 1825} {"train_loss": -23.39188575744629, "global_step": 151493, "epoch": 1825} {"train_loss": -23.436750411987305, "global_step": 151494, "epoch": 1825} {"train_loss": -23.39957046508789, "global_step": 151495, "epoch": 1825} {"train_loss": -23.529434204101562, "global_step": 151496, "epoch": 1825} {"train_loss": -23.61708641052246, "global_step": 151497, "epoch": 1825} {"train_loss": -23.44278907775879, "global_step": 151498, "epoch": 1825} {"train_loss": -23.394128799438477, "global_step": 151499, "epoch": 1825} {"train_loss": -23.255939483642578, "global_step": 151500, "epoch": 1825} {"train_loss": -23.403959274291992, "global_step": 151501, "epoch": 1825} {"train_loss": -23.4232120513916, "global_step": 151502, "epoch": 1825} {"train_loss": -23.535924911499023, "global_step": 151503, "epoch": 1825} {"train_loss": -23.23801612854004, "global_step": 151504, "epoch": 1825} {"train_loss": -23.427276611328125, "global_step": 151505, "epoch": 1825} {"train_loss": -23.38254737854004, "global_step": 151506, "epoch": 1825} {"train_loss": -23.38431167602539, "global_step": 151507, "epoch": 1825} {"train_loss": -23.411046981811523, "global_step": 151508, "epoch": 1825} {"train_loss": -23.474206924438477, "global_step": 151509, "epoch": 1825} {"train_loss": -23.283720016479492, "global_step": 151510, "epoch": 1825} {"train_loss": -23.492156982421875, "global_step": 151511, "epoch": 1825} {"train_loss": -23.374723434448242, "global_step": 151512, "epoch": 1825} {"train_loss": -23.599882125854492, "global_step": 151513, "epoch": 1825} {"train_loss": -23.48640251159668, "global_step": 151514, "epoch": 1825} {"train_loss": -23.179981231689453, "global_step": 151515, "epoch": 1825} {"train_loss": -23.420143127441406, "global_step": 151516, "epoch": 1825} {"train_loss": -23.451099395751953, "global_step": 151517, "epoch": 1825} {"train_loss": -23.717269897460938, "global_step": 151518, "epoch": 1825} {"train_loss": -23.384489059448242, "global_step": 151519, "epoch": 1825} {"train_loss": -23.514387130737305, "global_step": 151520, "epoch": 1825} {"train_loss": -23.34471321105957, "global_step": 151521, "epoch": 1825} {"train_loss": -23.112882614135742, "global_step": 151522, "epoch": 1825} {"train_loss": -23.317646026611328, "global_step": 151523, "epoch": 1825} {"train_loss": -23.13248062133789, "global_step": 151524, "epoch": 1825} {"train_loss": -23.565088272094727, "global_step": 151525, "epoch": 1825} {"train_loss": -23.202787399291992, "global_step": 151526, "epoch": 1825} {"train_loss": -23.188852310180664, "global_step": 151527, "epoch": 1825} {"train_loss": -23.345661163330078, "global_step": 151528, "epoch": 1825} {"train_loss": -23.177331924438477, "global_step": 151529, "epoch": 1825} {"train_loss": -23.470951080322266, "global_step": 151530, "epoch": 1825} {"train_loss": -23.294790267944336, "global_step": 151531, "epoch": 1825} {"train_loss": -23.356639862060547, "global_step": 151532, "epoch": 1825} {"train_loss": -23.149049758911133, "global_step": 151533, "epoch": 1825} {"train_loss": -23.27375602722168, "global_step": 151534, "epoch": 1825} {"train_loss": -22.88556480407715, "global_step": 151535, "epoch": 1825} {"train_loss": -23.80883026123047, "global_step": 151536, "epoch": 1825} {"train_loss": -23.14336585998535, "global_step": 151537, "epoch": 1825} {"train_loss": -23.506877899169922, "global_step": 151538, "epoch": 1825} {"train_loss": -23.23235511779785, "global_step": 151539, "epoch": 1825} {"train_loss": -23.450801849365234, "global_step": 151540, "epoch": 1825} {"train_loss": -23.31061553955078, "global_step": 151541, "epoch": 1825} {"train_loss": -23.450037002563477, "global_step": 151542, "epoch": 1825} {"train_loss": -23.287508010864258, "global_step": 151543, "epoch": 1825} {"train_loss": -23.4254093170166, "global_step": 151544, "epoch": 1825} {"train_loss": -23.429899215698242, "global_step": 151545, "epoch": 1825} {"train_loss": -23.0516300201416, "global_step": 151546, "epoch": 1825} {"train_loss": -22.843534469604492, "global_step": 151547, "epoch": 1825} {"train_loss": -23.1698055267334, "global_step": 151548, "epoch": 1825} {"train_loss": -23.52219581604004, "global_step": 151549, "epoch": 1825} {"train_loss": -23.35369300842285, "global_step": 151550, "epoch": 1825} {"train_loss": -23.45246696472168, "global_step": 151551, "epoch": 1825} {"train_loss": -23.237171173095703, "global_step": 151552, "epoch": 1825} {"train_loss": -23.37063980102539, "global_step": 151553, "epoch": 1825} {"train_loss": -23.372976303100586, "global_step": 151554, "epoch": 1825} {"train_loss": -23.393802642822266, "global_step": 151555, "epoch": 1825} {"train_loss": -23.32477378845215, "global_step": 151556, "epoch": 1825} {"train_loss": -23.28215746132724, "global_step": 151557, "epoch": 1825, "val_loss": 6463315.0} {"train_loss": -22.990026473999023, "global_step": 151558, "epoch": 1826} {"train_loss": -22.653579711914062, "global_step": 151559, "epoch": 1826} {"train_loss": -22.441349029541016, "global_step": 151560, "epoch": 1826} {"train_loss": -22.960134506225586, "global_step": 151561, "epoch": 1826} {"train_loss": -23.074588775634766, "global_step": 151562, "epoch": 1826} {"train_loss": -22.743871688842773, "global_step": 151563, "epoch": 1826} {"train_loss": -23.297088623046875, "global_step": 151564, "epoch": 1826} {"train_loss": -22.927915573120117, "global_step": 151565, "epoch": 1826} {"train_loss": -23.305477142333984, "global_step": 151566, "epoch": 1826} {"train_loss": -22.902402877807617, "global_step": 151567, "epoch": 1826} {"train_loss": -23.397825241088867, "global_step": 151568, "epoch": 1826} {"train_loss": -22.98170280456543, "global_step": 151569, "epoch": 1826} {"train_loss": -22.84479331970215, "global_step": 151570, "epoch": 1826} {"train_loss": -22.808866500854492, "global_step": 151571, "epoch": 1826} {"train_loss": -23.090412139892578, "global_step": 151572, "epoch": 1826} {"train_loss": -22.961746215820312, "global_step": 151573, "epoch": 1826} {"train_loss": -23.099533081054688, "global_step": 151574, "epoch": 1826} {"train_loss": -22.94445037841797, "global_step": 151575, "epoch": 1826} {"train_loss": -23.260425567626953, "global_step": 151576, "epoch": 1826} {"train_loss": -23.035757064819336, "global_step": 151577, "epoch": 1826} {"train_loss": -23.170286178588867, "global_step": 151578, "epoch": 1826} {"train_loss": -23.35236167907715, "global_step": 151579, "epoch": 1826} {"train_loss": -23.426794052124023, "global_step": 151580, "epoch": 1826} {"train_loss": -23.042404174804688, "global_step": 151581, "epoch": 1826} {"train_loss": -23.205862045288086, "global_step": 151582, "epoch": 1826} {"train_loss": -23.414295196533203, "global_step": 151583, "epoch": 1826} {"train_loss": -23.26689910888672, "global_step": 151584, "epoch": 1826} {"train_loss": -23.290502548217773, "global_step": 151585, "epoch": 1826} {"train_loss": -23.287097930908203, "global_step": 151586, "epoch": 1826} {"train_loss": -23.059112548828125, "global_step": 151587, "epoch": 1826} {"train_loss": -23.554948806762695, "global_step": 151588, "epoch": 1826} {"train_loss": -22.978857040405273, "global_step": 151589, "epoch": 1826} {"train_loss": -23.059207916259766, "global_step": 151590, "epoch": 1826} {"train_loss": -23.420377731323242, "global_step": 151591, "epoch": 1826} {"train_loss": -23.373859405517578, "global_step": 151592, "epoch": 1826} {"train_loss": -23.334659576416016, "global_step": 151593, "epoch": 1826} {"train_loss": -23.238433837890625, "global_step": 151594, "epoch": 1826} {"train_loss": -23.531930923461914, "global_step": 151595, "epoch": 1826} {"train_loss": -23.24615478515625, "global_step": 151596, "epoch": 1826} {"train_loss": -23.572118759155273, "global_step": 151597, "epoch": 1826} {"train_loss": -22.884119033813477, "global_step": 151598, "epoch": 1826} {"train_loss": -23.24312400817871, "global_step": 151599, "epoch": 1826} {"train_loss": -23.270126342773438, "global_step": 151600, "epoch": 1826} {"train_loss": -23.21342658996582, "global_step": 151601, "epoch": 1826} {"train_loss": -23.06553077697754, "global_step": 151602, "epoch": 1826} {"train_loss": -23.464881896972656, "global_step": 151603, "epoch": 1826} {"train_loss": -23.214746475219727, "global_step": 151604, "epoch": 1826} {"train_loss": -23.37063980102539, "global_step": 151605, "epoch": 1826} {"train_loss": -23.494205474853516, "global_step": 151606, "epoch": 1826} {"train_loss": -23.274749755859375, "global_step": 151607, "epoch": 1826} {"train_loss": -23.23152732849121, "global_step": 151608, "epoch": 1826} {"train_loss": -23.72227668762207, "global_step": 151609, "epoch": 1826} {"train_loss": -23.36939811706543, "global_step": 151610, "epoch": 1826} {"train_loss": -23.159587860107422, "global_step": 151611, "epoch": 1826} {"train_loss": -23.430936813354492, "global_step": 151612, "epoch": 1826} {"train_loss": -23.174375534057617, "global_step": 151613, "epoch": 1826} {"train_loss": -23.4036808013916, "global_step": 151614, "epoch": 1826} {"train_loss": -23.153757095336914, "global_step": 151615, "epoch": 1826} {"train_loss": -23.00040054321289, "global_step": 151616, "epoch": 1826} {"train_loss": -23.054813385009766, "global_step": 151617, "epoch": 1826} {"train_loss": -23.603233337402344, "global_step": 151618, "epoch": 1826} {"train_loss": -23.3024959564209, "global_step": 151619, "epoch": 1826} {"train_loss": -23.297618865966797, "global_step": 151620, "epoch": 1826} {"train_loss": -23.325359344482422, "global_step": 151621, "epoch": 1826} {"train_loss": -23.478639602661133, "global_step": 151622, "epoch": 1826} {"train_loss": -23.228464126586914, "global_step": 151623, "epoch": 1826} {"train_loss": -23.206995010375977, "global_step": 151624, "epoch": 1826} {"train_loss": -23.665292739868164, "global_step": 151625, "epoch": 1826} {"train_loss": -22.849367141723633, "global_step": 151626, "epoch": 1826} {"train_loss": -23.343191146850586, "global_step": 151627, "epoch": 1826} {"train_loss": -23.42976951599121, "global_step": 151628, "epoch": 1826} {"train_loss": -23.560150146484375, "global_step": 151629, "epoch": 1826} {"train_loss": -23.500455856323242, "global_step": 151630, "epoch": 1826} {"train_loss": -23.539072036743164, "global_step": 151631, "epoch": 1826} {"train_loss": -23.63956642150879, "global_step": 151632, "epoch": 1826} {"train_loss": -23.511640548706055, "global_step": 151633, "epoch": 1826} {"train_loss": -23.249942779541016, "global_step": 151634, "epoch": 1826} {"train_loss": -23.46185874938965, "global_step": 151635, "epoch": 1826} {"train_loss": -23.786008834838867, "global_step": 151636, "epoch": 1826} {"train_loss": -23.479291915893555, "global_step": 151637, "epoch": 1826} {"train_loss": -23.541095733642578, "global_step": 151638, "epoch": 1826} {"train_loss": -22.89885902404785, "global_step": 151639, "epoch": 1826} {"train_loss": -23.238431424979705, "global_step": 151640, "epoch": 1826, "val_loss": 6365178.0} {"train_loss": -23.034780502319336, "global_step": 151641, "epoch": 1827} {"train_loss": -23.10743522644043, "global_step": 151642, "epoch": 1827} {"train_loss": -23.399635314941406, "global_step": 151643, "epoch": 1827} {"train_loss": -22.608373641967773, "global_step": 151644, "epoch": 1827} {"train_loss": -22.76665687561035, "global_step": 151645, "epoch": 1827} {"train_loss": -22.991586685180664, "global_step": 151646, "epoch": 1827} {"train_loss": -22.79148292541504, "global_step": 151647, "epoch": 1827} {"train_loss": -22.906925201416016, "global_step": 151648, "epoch": 1827} {"train_loss": -23.17314910888672, "global_step": 151649, "epoch": 1827} {"train_loss": -23.177282333374023, "global_step": 151650, "epoch": 1827} {"train_loss": -23.021442413330078, "global_step": 151651, "epoch": 1827} {"train_loss": -23.27239227294922, "global_step": 151652, "epoch": 1827} {"train_loss": -22.98897361755371, "global_step": 151653, "epoch": 1827} {"train_loss": -23.23971939086914, "global_step": 151654, "epoch": 1827} {"train_loss": -23.02147674560547, "global_step": 151655, "epoch": 1827} {"train_loss": -22.652578353881836, "global_step": 151656, "epoch": 1827} {"train_loss": -22.746437072753906, "global_step": 151657, "epoch": 1827} {"train_loss": -23.24505615234375, "global_step": 151658, "epoch": 1827} {"train_loss": -23.19784927368164, "global_step": 151659, "epoch": 1827} {"train_loss": -23.18374252319336, "global_step": 151660, "epoch": 1827} {"train_loss": -23.2235164642334, "global_step": 151661, "epoch": 1827} {"train_loss": -23.257396697998047, "global_step": 151662, "epoch": 1827} {"train_loss": -23.059858322143555, "global_step": 151663, "epoch": 1827} {"train_loss": -23.069028854370117, "global_step": 151664, "epoch": 1827} {"train_loss": -23.193479537963867, "global_step": 151665, "epoch": 1827} {"train_loss": -23.37066650390625, "global_step": 151666, "epoch": 1827} {"train_loss": -23.146574020385742, "global_step": 151667, "epoch": 1827} {"train_loss": -23.141218185424805, "global_step": 151668, "epoch": 1827} {"train_loss": -23.347166061401367, "global_step": 151669, "epoch": 1827} {"train_loss": -23.317541122436523, "global_step": 151670, "epoch": 1827} {"train_loss": -22.81376075744629, "global_step": 151671, "epoch": 1827} {"train_loss": -23.595951080322266, "global_step": 151672, "epoch": 1827} {"train_loss": -23.158231735229492, "global_step": 151673, "epoch": 1827} {"train_loss": -23.45076560974121, "global_step": 151674, "epoch": 1827} {"train_loss": -23.492929458618164, "global_step": 151675, "epoch": 1827} {"train_loss": -23.30975341796875, "global_step": 151676, "epoch": 1827} {"train_loss": -23.26105308532715, "global_step": 151677, "epoch": 1827} {"train_loss": -23.37930679321289, "global_step": 151678, "epoch": 1827} {"train_loss": -23.47442054748535, "global_step": 151679, "epoch": 1827} {"train_loss": -23.36063575744629, "global_step": 151680, "epoch": 1827} {"train_loss": -23.42510414123535, "global_step": 151681, "epoch": 1827} {"train_loss": -23.85162353515625, "global_step": 151682, "epoch": 1827} {"train_loss": -23.573240280151367, "global_step": 151683, "epoch": 1827} {"train_loss": -23.681259155273438, "global_step": 151684, "epoch": 1827} {"train_loss": -23.2131404876709, "global_step": 151685, "epoch": 1827} {"train_loss": -22.7742862701416, "global_step": 151686, "epoch": 1827} {"train_loss": -23.143091201782227, "global_step": 151687, "epoch": 1827} {"train_loss": -23.417251586914062, "global_step": 151688, "epoch": 1827} {"train_loss": -23.59478759765625, "global_step": 151689, "epoch": 1827} {"train_loss": -23.0502986907959, "global_step": 151690, "epoch": 1827} {"train_loss": -23.02298927307129, "global_step": 151691, "epoch": 1827} {"train_loss": -23.26055908203125, "global_step": 151692, "epoch": 1827} {"train_loss": -23.43996238708496, "global_step": 151693, "epoch": 1827} {"train_loss": -23.032615661621094, "global_step": 151694, "epoch": 1827} {"train_loss": -22.9482479095459, "global_step": 151695, "epoch": 1827} {"train_loss": -22.930103302001953, "global_step": 151696, "epoch": 1827} {"train_loss": -23.226886749267578, "global_step": 151697, "epoch": 1827} {"train_loss": -23.17702293395996, "global_step": 151698, "epoch": 1827} {"train_loss": -23.100976943969727, "global_step": 151699, "epoch": 1827} {"train_loss": -23.37059211730957, "global_step": 151700, "epoch": 1827} {"train_loss": -23.281524658203125, "global_step": 151701, "epoch": 1827} {"train_loss": -22.99892234802246, "global_step": 151702, "epoch": 1827} {"train_loss": -23.109331130981445, "global_step": 151703, "epoch": 1827} {"train_loss": -23.085647583007812, "global_step": 151704, "epoch": 1827} {"train_loss": -23.13458251953125, "global_step": 151705, "epoch": 1827} {"train_loss": -23.420669555664062, "global_step": 151706, "epoch": 1827} {"train_loss": -23.34375, "global_step": 151707, "epoch": 1827} {"train_loss": -23.33662223815918, "global_step": 151708, "epoch": 1827} {"train_loss": -23.43964385986328, "global_step": 151709, "epoch": 1827} {"train_loss": -23.086896896362305, "global_step": 151710, "epoch": 1827} {"train_loss": -23.44732093811035, "global_step": 151711, "epoch": 1827} {"train_loss": -23.27648162841797, "global_step": 151712, "epoch": 1827} {"train_loss": -23.693647384643555, "global_step": 151713, "epoch": 1827} {"train_loss": -23.27406120300293, "global_step": 151714, "epoch": 1827} {"train_loss": -23.467435836791992, "global_step": 151715, "epoch": 1827} {"train_loss": -23.267654418945312, "global_step": 151716, "epoch": 1827} {"train_loss": -23.83978271484375, "global_step": 151717, "epoch": 1827} {"train_loss": -23.525217056274414, "global_step": 151718, "epoch": 1827} {"train_loss": -23.517465591430664, "global_step": 151719, "epoch": 1827} {"train_loss": -23.603879928588867, "global_step": 151720, "epoch": 1827} {"train_loss": -23.28688621520996, "global_step": 151721, "epoch": 1827} {"train_loss": -22.8133544921875, "global_step": 151722, "epoch": 1827} {"train_loss": -23.215228712702373, "global_step": 151723, "epoch": 1827, "val_loss": 6253961.0} {"train_loss": -23.100183486938477, "global_step": 151724, "epoch": 1828} {"train_loss": -22.948843002319336, "global_step": 151725, "epoch": 1828} {"train_loss": -23.33243751525879, "global_step": 151726, "epoch": 1828} {"train_loss": -23.432546615600586, "global_step": 151727, "epoch": 1828} {"train_loss": -23.19948387145996, "global_step": 151728, "epoch": 1828} {"train_loss": -23.247709274291992, "global_step": 151729, "epoch": 1828} {"train_loss": -23.665084838867188, "global_step": 151730, "epoch": 1828} {"train_loss": -23.54104995727539, "global_step": 151731, "epoch": 1828} {"train_loss": -23.396190643310547, "global_step": 151732, "epoch": 1828} {"train_loss": -23.091917037963867, "global_step": 151733, "epoch": 1828} {"train_loss": -23.522537231445312, "global_step": 151734, "epoch": 1828} {"train_loss": -23.351003646850586, "global_step": 151735, "epoch": 1828} {"train_loss": -23.216968536376953, "global_step": 151736, "epoch": 1828} {"train_loss": -23.33423614501953, "global_step": 151737, "epoch": 1828} {"train_loss": -23.507410049438477, "global_step": 151738, "epoch": 1828} {"train_loss": -23.461759567260742, "global_step": 151739, "epoch": 1828} {"train_loss": -23.2030086517334, "global_step": 151740, "epoch": 1828} {"train_loss": -23.245887756347656, "global_step": 151741, "epoch": 1828} {"train_loss": -23.287109375, "global_step": 151742, "epoch": 1828} {"train_loss": -23.426481246948242, "global_step": 151743, "epoch": 1828} {"train_loss": -23.235519409179688, "global_step": 151744, "epoch": 1828} {"train_loss": -22.876117706298828, "global_step": 151745, "epoch": 1828} {"train_loss": -23.248430252075195, "global_step": 151746, "epoch": 1828} {"train_loss": -23.39733123779297, "global_step": 151747, "epoch": 1828} {"train_loss": -23.171777725219727, "global_step": 151748, "epoch": 1828} {"train_loss": -23.05489158630371, "global_step": 151749, "epoch": 1828} {"train_loss": -23.112699508666992, "global_step": 151750, "epoch": 1828} {"train_loss": -23.594812393188477, "global_step": 151751, "epoch": 1828} {"train_loss": -23.506128311157227, "global_step": 151752, "epoch": 1828} {"train_loss": -23.170862197875977, "global_step": 151753, "epoch": 1828} {"train_loss": -23.157865524291992, "global_step": 151754, "epoch": 1828} {"train_loss": -23.17042350769043, "global_step": 151755, "epoch": 1828} {"train_loss": -23.225351333618164, "global_step": 151756, "epoch": 1828} {"train_loss": -23.221248626708984, "global_step": 151757, "epoch": 1828} {"train_loss": -23.13576316833496, "global_step": 151758, "epoch": 1828} {"train_loss": -23.434900283813477, "global_step": 151759, "epoch": 1828} {"train_loss": -23.593114852905273, "global_step": 151760, "epoch": 1828} {"train_loss": -23.174131393432617, "global_step": 151761, "epoch": 1828} {"train_loss": -23.284088134765625, "global_step": 151762, "epoch": 1828} {"train_loss": -23.346162796020508, "global_step": 151763, "epoch": 1828} {"train_loss": -23.573495864868164, "global_step": 151764, "epoch": 1828} {"train_loss": -23.48780059814453, "global_step": 151765, "epoch": 1828} {"train_loss": -23.17597007751465, "global_step": 151766, "epoch": 1828} {"train_loss": -23.467382431030273, "global_step": 151767, "epoch": 1828} {"train_loss": -23.231220245361328, "global_step": 151768, "epoch": 1828} {"train_loss": -23.481122970581055, "global_step": 151769, "epoch": 1828} {"train_loss": -23.3488826751709, "global_step": 151770, "epoch": 1828} {"train_loss": -23.188207626342773, "global_step": 151771, "epoch": 1828} {"train_loss": -23.25227928161621, "global_step": 151772, "epoch": 1828} {"train_loss": -23.250898361206055, "global_step": 151773, "epoch": 1828} {"train_loss": -23.333717346191406, "global_step": 151774, "epoch": 1828} {"train_loss": -23.49207878112793, "global_step": 151775, "epoch": 1828} {"train_loss": -23.385971069335938, "global_step": 151776, "epoch": 1828} {"train_loss": -23.437814712524414, "global_step": 151777, "epoch": 1828} {"train_loss": -23.199621200561523, "global_step": 151778, "epoch": 1828} {"train_loss": -23.14457130432129, "global_step": 151779, "epoch": 1828} {"train_loss": -23.74785614013672, "global_step": 151780, "epoch": 1828} {"train_loss": -23.5338191986084, "global_step": 151781, "epoch": 1828} {"train_loss": -23.700979232788086, "global_step": 151782, "epoch": 1828} {"train_loss": -23.78169059753418, "global_step": 151783, "epoch": 1828} {"train_loss": -23.458648681640625, "global_step": 151784, "epoch": 1828} {"train_loss": -23.2519474029541, "global_step": 151785, "epoch": 1828} {"train_loss": -23.571075439453125, "global_step": 151786, "epoch": 1828} {"train_loss": -23.04746437072754, "global_step": 151787, "epoch": 1828} {"train_loss": -23.41354751586914, "global_step": 151788, "epoch": 1828} {"train_loss": -23.084396362304688, "global_step": 151789, "epoch": 1828} {"train_loss": -23.342050552368164, "global_step": 151790, "epoch": 1828} {"train_loss": -23.61175537109375, "global_step": 151791, "epoch": 1828} {"train_loss": -23.20673942565918, "global_step": 151792, "epoch": 1828} {"train_loss": -23.077489852905273, "global_step": 151793, "epoch": 1828} {"train_loss": -23.399301528930664, "global_step": 151794, "epoch": 1828} {"train_loss": -23.433040618896484, "global_step": 151795, "epoch": 1828} {"train_loss": -23.2391357421875, "global_step": 151796, "epoch": 1828} {"train_loss": -23.286033630371094, "global_step": 151797, "epoch": 1828} {"train_loss": -23.38801383972168, "global_step": 151798, "epoch": 1828} {"train_loss": -23.44400978088379, "global_step": 151799, "epoch": 1828} {"train_loss": -22.927139282226562, "global_step": 151800, "epoch": 1828} {"train_loss": -23.26633644104004, "global_step": 151801, "epoch": 1828} {"train_loss": -23.51582145690918, "global_step": 151802, "epoch": 1828} {"train_loss": -23.51793098449707, "global_step": 151803, "epoch": 1828} {"train_loss": -23.447168350219727, "global_step": 151804, "epoch": 1828} {"train_loss": -23.01234245300293, "global_step": 151805, "epoch": 1828} {"train_loss": -23.335486883140472, "global_step": 151806, "epoch": 1828, "val_loss": 6396313.0} {"train_loss": -22.773157119750977, "global_step": 151807, "epoch": 1829} {"train_loss": -23.020654678344727, "global_step": 151808, "epoch": 1829} {"train_loss": -23.228912353515625, "global_step": 151809, "epoch": 1829} {"train_loss": -22.517696380615234, "global_step": 151810, "epoch": 1829} {"train_loss": -22.872806549072266, "global_step": 151811, "epoch": 1829} {"train_loss": -22.89234733581543, "global_step": 151812, "epoch": 1829} {"train_loss": -22.97896385192871, "global_step": 151813, "epoch": 1829} {"train_loss": -23.321086883544922, "global_step": 151814, "epoch": 1829} {"train_loss": -23.4016056060791, "global_step": 151815, "epoch": 1829} {"train_loss": -22.825162887573242, "global_step": 151816, "epoch": 1829} {"train_loss": -23.116941452026367, "global_step": 151817, "epoch": 1829} {"train_loss": -23.08145523071289, "global_step": 151818, "epoch": 1829} {"train_loss": -23.21405601501465, "global_step": 151819, "epoch": 1829} {"train_loss": -23.429365158081055, "global_step": 151820, "epoch": 1829} {"train_loss": -22.864425659179688, "global_step": 151821, "epoch": 1829} {"train_loss": -23.282455444335938, "global_step": 151822, "epoch": 1829} {"train_loss": -22.73648452758789, "global_step": 151823, "epoch": 1829} {"train_loss": -23.232009887695312, "global_step": 151824, "epoch": 1829} {"train_loss": -23.397933959960938, "global_step": 151825, "epoch": 1829} {"train_loss": -23.414926528930664, "global_step": 151826, "epoch": 1829} {"train_loss": -23.485126495361328, "global_step": 151827, "epoch": 1829} {"train_loss": -23.207046508789062, "global_step": 151828, "epoch": 1829} {"train_loss": -23.361083984375, "global_step": 151829, "epoch": 1829} {"train_loss": -23.461288452148438, "global_step": 151830, "epoch": 1829} {"train_loss": -23.632686614990234, "global_step": 151831, "epoch": 1829} {"train_loss": -23.318344116210938, "global_step": 151832, "epoch": 1829} {"train_loss": -23.109792709350586, "global_step": 151833, "epoch": 1829} {"train_loss": -23.362163543701172, "global_step": 151834, "epoch": 1829} {"train_loss": -23.334964752197266, "global_step": 151835, "epoch": 1829} {"train_loss": -23.19651222229004, "global_step": 151836, "epoch": 1829} {"train_loss": -23.307514190673828, "global_step": 151837, "epoch": 1829} {"train_loss": -23.43869972229004, "global_step": 151838, "epoch": 1829} {"train_loss": -23.11224365234375, "global_step": 151839, "epoch": 1829} {"train_loss": -23.287757873535156, "global_step": 151840, "epoch": 1829} {"train_loss": -23.112646102905273, "global_step": 151841, "epoch": 1829} {"train_loss": -22.885913848876953, "global_step": 151842, "epoch": 1829} {"train_loss": -23.23237419128418, "global_step": 151843, "epoch": 1829} {"train_loss": -23.4700927734375, "global_step": 151844, "epoch": 1829} {"train_loss": -23.49956512451172, "global_step": 151845, "epoch": 1829} {"train_loss": -23.369428634643555, "global_step": 151846, "epoch": 1829} {"train_loss": -23.5610294342041, "global_step": 151847, "epoch": 1829} {"train_loss": -23.027921676635742, "global_step": 151848, "epoch": 1829} {"train_loss": -22.948698043823242, "global_step": 151849, "epoch": 1829} {"train_loss": -23.403303146362305, "global_step": 151850, "epoch": 1829} {"train_loss": -23.00107765197754, "global_step": 151851, "epoch": 1829} {"train_loss": -23.042072296142578, "global_step": 151852, "epoch": 1829} {"train_loss": -23.724523544311523, "global_step": 151853, "epoch": 1829} {"train_loss": -23.248090744018555, "global_step": 151854, "epoch": 1829} {"train_loss": -23.16188621520996, "global_step": 151855, "epoch": 1829} {"train_loss": -23.28944206237793, "global_step": 151856, "epoch": 1829} {"train_loss": -23.03085708618164, "global_step": 151857, "epoch": 1829} {"train_loss": -23.30905532836914, "global_step": 151858, "epoch": 1829} {"train_loss": -22.95794677734375, "global_step": 151859, "epoch": 1829} {"train_loss": -23.204504013061523, "global_step": 151860, "epoch": 1829} {"train_loss": -23.182727813720703, "global_step": 151861, "epoch": 1829} {"train_loss": -23.214126586914062, "global_step": 151862, "epoch": 1829} {"train_loss": -23.065216064453125, "global_step": 151863, "epoch": 1829} {"train_loss": -23.21192741394043, "global_step": 151864, "epoch": 1829} {"train_loss": -23.48594093322754, "global_step": 151865, "epoch": 1829} {"train_loss": -23.071229934692383, "global_step": 151866, "epoch": 1829} {"train_loss": -23.319326400756836, "global_step": 151867, "epoch": 1829} {"train_loss": -23.030799865722656, "global_step": 151868, "epoch": 1829} {"train_loss": -23.577985763549805, "global_step": 151869, "epoch": 1829} {"train_loss": -23.119245529174805, "global_step": 151870, "epoch": 1829} {"train_loss": -23.273303985595703, "global_step": 151871, "epoch": 1829} {"train_loss": -23.71434211730957, "global_step": 151872, "epoch": 1829} {"train_loss": -23.47456932067871, "global_step": 151873, "epoch": 1829} {"train_loss": -23.590734481811523, "global_step": 151874, "epoch": 1829} {"train_loss": -23.261371612548828, "global_step": 151875, "epoch": 1829} {"train_loss": -23.357511520385742, "global_step": 151876, "epoch": 1829} {"train_loss": -23.060144424438477, "global_step": 151877, "epoch": 1829} {"train_loss": -23.24671745300293, "global_step": 151878, "epoch": 1829} {"train_loss": -22.973230361938477, "global_step": 151879, "epoch": 1829} {"train_loss": -23.42584800720215, "global_step": 151880, "epoch": 1829} {"train_loss": -22.839879989624023, "global_step": 151881, "epoch": 1829} {"train_loss": -23.25428581237793, "global_step": 151882, "epoch": 1829} {"train_loss": -23.229339599609375, "global_step": 151883, "epoch": 1829} {"train_loss": -23.353736877441406, "global_step": 151884, "epoch": 1829} {"train_loss": -23.32160758972168, "global_step": 151885, "epoch": 1829} {"train_loss": -22.931961059570312, "global_step": 151886, "epoch": 1829} {"train_loss": -23.36343765258789, "global_step": 151887, "epoch": 1829} {"train_loss": -23.117021560668945, "global_step": 151888, "epoch": 1829} {"train_loss": -23.224505481949773, "global_step": 151889, "epoch": 1829, "val_loss": 6326522.5} {"train_loss": -21.841028213500977, "global_step": 151890, "epoch": 1830} {"train_loss": -22.29972267150879, "global_step": 151891, "epoch": 1830} {"train_loss": -22.334192276000977, "global_step": 151892, "epoch": 1830} {"train_loss": -22.76599884033203, "global_step": 151893, "epoch": 1830} {"train_loss": -22.538131713867188, "global_step": 151894, "epoch": 1830} {"train_loss": -22.837543487548828, "global_step": 151895, "epoch": 1830} {"train_loss": -22.8288631439209, "global_step": 151896, "epoch": 1830} {"train_loss": -22.731782913208008, "global_step": 151897, "epoch": 1830} {"train_loss": -22.781400680541992, "global_step": 151898, "epoch": 1830} {"train_loss": -22.74916648864746, "global_step": 151899, "epoch": 1830} {"train_loss": -22.788251876831055, "global_step": 151900, "epoch": 1830} {"train_loss": -23.220706939697266, "global_step": 151901, "epoch": 1830} {"train_loss": -22.876434326171875, "global_step": 151902, "epoch": 1830} {"train_loss": -23.34823226928711, "global_step": 151903, "epoch": 1830} {"train_loss": -23.03236198425293, "global_step": 151904, "epoch": 1830} {"train_loss": -23.19758415222168, "global_step": 151905, "epoch": 1830} {"train_loss": -22.865522384643555, "global_step": 151906, "epoch": 1830} {"train_loss": -23.095129013061523, "global_step": 151907, "epoch": 1830} {"train_loss": -23.25474739074707, "global_step": 151908, "epoch": 1830} {"train_loss": -22.91208839416504, "global_step": 151909, "epoch": 1830} {"train_loss": -23.020830154418945, "global_step": 151910, "epoch": 1830} {"train_loss": -23.145111083984375, "global_step": 151911, "epoch": 1830} {"train_loss": -23.383331298828125, "global_step": 151912, "epoch": 1830} {"train_loss": -23.283960342407227, "global_step": 151913, "epoch": 1830} {"train_loss": -23.43988037109375, "global_step": 151914, "epoch": 1830} {"train_loss": -23.272891998291016, "global_step": 151915, "epoch": 1830} {"train_loss": -23.337966918945312, "global_step": 151916, "epoch": 1830} {"train_loss": -23.173643112182617, "global_step": 151917, "epoch": 1830} {"train_loss": -23.605573654174805, "global_step": 151918, "epoch": 1830} {"train_loss": -23.29313087463379, "global_step": 151919, "epoch": 1830} {"train_loss": -23.579687118530273, "global_step": 151920, "epoch": 1830} {"train_loss": -23.46548843383789, "global_step": 151921, "epoch": 1830} {"train_loss": -23.43027114868164, "global_step": 151922, "epoch": 1830} {"train_loss": -23.240501403808594, "global_step": 151923, "epoch": 1830} {"train_loss": -23.62198829650879, "global_step": 151924, "epoch": 1830} {"train_loss": -23.251155853271484, "global_step": 151925, "epoch": 1830} {"train_loss": -23.6346492767334, "global_step": 151926, "epoch": 1830} {"train_loss": -23.288232803344727, "global_step": 151927, "epoch": 1830} {"train_loss": -23.194503784179688, "global_step": 151928, "epoch": 1830} {"train_loss": -23.244386672973633, "global_step": 151929, "epoch": 1830} {"train_loss": -23.71758270263672, "global_step": 151930, "epoch": 1830} {"train_loss": -23.521764755249023, "global_step": 151931, "epoch": 1830} {"train_loss": -23.119352340698242, "global_step": 151932, "epoch": 1830} {"train_loss": -23.36117935180664, "global_step": 151933, "epoch": 1830} {"train_loss": -23.413753509521484, "global_step": 151934, "epoch": 1830} {"train_loss": -23.408252716064453, "global_step": 151935, "epoch": 1830} {"train_loss": -23.272512435913086, "global_step": 151936, "epoch": 1830} {"train_loss": -23.398656845092773, "global_step": 151937, "epoch": 1830} {"train_loss": -23.524919509887695, "global_step": 151938, "epoch": 1830} {"train_loss": -23.4949893951416, "global_step": 151939, "epoch": 1830} {"train_loss": -23.481449127197266, "global_step": 151940, "epoch": 1830} {"train_loss": -23.606895446777344, "global_step": 151941, "epoch": 1830} {"train_loss": -23.31315040588379, "global_step": 151942, "epoch": 1830} {"train_loss": -23.324466705322266, "global_step": 151943, "epoch": 1830} {"train_loss": -23.224395751953125, "global_step": 151944, "epoch": 1830} {"train_loss": -23.5173282623291, "global_step": 151945, "epoch": 1830} {"train_loss": -23.46430206298828, "global_step": 151946, "epoch": 1830} {"train_loss": -23.799043655395508, "global_step": 151947, "epoch": 1830} {"train_loss": -23.61093521118164, "global_step": 151948, "epoch": 1830} {"train_loss": -23.41282081604004, "global_step": 151949, "epoch": 1830} {"train_loss": -23.534101486206055, "global_step": 151950, "epoch": 1830} {"train_loss": -23.532901763916016, "global_step": 151951, "epoch": 1830} {"train_loss": -23.06751251220703, "global_step": 151952, "epoch": 1830} {"train_loss": -23.48129653930664, "global_step": 151953, "epoch": 1830} {"train_loss": -22.998559951782227, "global_step": 151954, "epoch": 1830} {"train_loss": -23.505615234375, "global_step": 151955, "epoch": 1830} {"train_loss": -23.348655700683594, "global_step": 151956, "epoch": 1830} {"train_loss": -22.990407943725586, "global_step": 151957, "epoch": 1830} {"train_loss": -23.353515625, "global_step": 151958, "epoch": 1830} {"train_loss": -23.197004318237305, "global_step": 151959, "epoch": 1830} {"train_loss": -23.637863159179688, "global_step": 151960, "epoch": 1830} {"train_loss": -23.5100154876709, "global_step": 151961, "epoch": 1830} {"train_loss": -23.18340492248535, "global_step": 151962, "epoch": 1830} {"train_loss": -23.20725440979004, "global_step": 151963, "epoch": 1830} {"train_loss": -23.197599411010742, "global_step": 151964, "epoch": 1830} {"train_loss": -23.528217315673828, "global_step": 151965, "epoch": 1830} {"train_loss": -23.637258529663086, "global_step": 151966, "epoch": 1830} {"train_loss": -23.609113693237305, "global_step": 151967, "epoch": 1830} {"train_loss": -23.36150360107422, "global_step": 151968, "epoch": 1830} {"train_loss": -23.11747169494629, "global_step": 151969, "epoch": 1830} {"train_loss": -23.525602340698242, "global_step": 151970, "epoch": 1830} {"train_loss": -23.3425350189209, "global_step": 151971, "epoch": 1830} {"train_loss": -23.250733203198536, "global_step": 151972, "epoch": 1830, "val_loss": 6381409.0} {"train_loss": -23.107261657714844, "global_step": 151973, "epoch": 1831} {"train_loss": -23.458173751831055, "global_step": 151974, "epoch": 1831} {"train_loss": -22.69611167907715, "global_step": 151975, "epoch": 1831} {"train_loss": -23.03521728515625, "global_step": 151976, "epoch": 1831} {"train_loss": -23.079343795776367, "global_step": 151977, "epoch": 1831} {"train_loss": -22.960803985595703, "global_step": 151978, "epoch": 1831} {"train_loss": -23.019636154174805, "global_step": 151979, "epoch": 1831} {"train_loss": -23.132184982299805, "global_step": 151980, "epoch": 1831} {"train_loss": -22.819459915161133, "global_step": 151981, "epoch": 1831} {"train_loss": -23.6787166595459, "global_step": 151982, "epoch": 1831} {"train_loss": -22.59632682800293, "global_step": 151983, "epoch": 1831} {"train_loss": -23.127164840698242, "global_step": 151984, "epoch": 1831} {"train_loss": -23.010807037353516, "global_step": 151985, "epoch": 1831} {"train_loss": -22.847116470336914, "global_step": 151986, "epoch": 1831} {"train_loss": -23.22186279296875, "global_step": 151987, "epoch": 1831} {"train_loss": -23.231603622436523, "global_step": 151988, "epoch": 1831} {"train_loss": -23.111875534057617, "global_step": 151989, "epoch": 1831} {"train_loss": -22.84676742553711, "global_step": 151990, "epoch": 1831} {"train_loss": -23.3597412109375, "global_step": 151991, "epoch": 1831} {"train_loss": -23.1802978515625, "global_step": 151992, "epoch": 1831} {"train_loss": -23.2558650970459, "global_step": 151993, "epoch": 1831} {"train_loss": -23.16887855529785, "global_step": 151994, "epoch": 1831} {"train_loss": -23.106401443481445, "global_step": 151995, "epoch": 1831} {"train_loss": -23.294050216674805, "global_step": 151996, "epoch": 1831} {"train_loss": -23.073959350585938, "global_step": 151997, "epoch": 1831} {"train_loss": -23.383665084838867, "global_step": 151998, "epoch": 1831} {"train_loss": -23.13302993774414, "global_step": 151999, "epoch": 1831} {"train_loss": -23.2640323638916, "global_step": 152000, "epoch": 1831} {"train_loss": -23.29920768737793, "global_step": 152001, "epoch": 1831} {"train_loss": -23.522525787353516, "global_step": 152002, "epoch": 1831} {"train_loss": -23.215686798095703, "global_step": 152003, "epoch": 1831} {"train_loss": -23.329092025756836, "global_step": 152004, "epoch": 1831} {"train_loss": -23.078536987304688, "global_step": 152005, "epoch": 1831} {"train_loss": -23.034955978393555, "global_step": 152006, "epoch": 1831} {"train_loss": -23.37713623046875, "global_step": 152007, "epoch": 1831} {"train_loss": -23.237592697143555, "global_step": 152008, "epoch": 1831} {"train_loss": -23.52007484436035, "global_step": 152009, "epoch": 1831} {"train_loss": -23.369958877563477, "global_step": 152010, "epoch": 1831} {"train_loss": -23.689138412475586, "global_step": 152011, "epoch": 1831} {"train_loss": -23.17068099975586, "global_step": 152012, "epoch": 1831} {"train_loss": -23.472013473510742, "global_step": 152013, "epoch": 1831} {"train_loss": -23.35986328125, "global_step": 152014, "epoch": 1831} {"train_loss": -23.66287612915039, "global_step": 152015, "epoch": 1831} {"train_loss": -23.478837966918945, "global_step": 152016, "epoch": 1831} {"train_loss": -23.42266273498535, "global_step": 152017, "epoch": 1831} {"train_loss": -23.231918334960938, "global_step": 152018, "epoch": 1831} {"train_loss": -23.416210174560547, "global_step": 152019, "epoch": 1831} {"train_loss": -23.463546752929688, "global_step": 152020, "epoch": 1831} {"train_loss": -23.541654586791992, "global_step": 152021, "epoch": 1831} {"train_loss": -23.517684936523438, "global_step": 152022, "epoch": 1831} {"train_loss": -23.076234817504883, "global_step": 152023, "epoch": 1831} {"train_loss": -23.314178466796875, "global_step": 152024, "epoch": 1831} {"train_loss": -23.28999137878418, "global_step": 152025, "epoch": 1831} {"train_loss": -23.520578384399414, "global_step": 152026, "epoch": 1831} {"train_loss": -23.18511390686035, "global_step": 152027, "epoch": 1831} {"train_loss": -23.414709091186523, "global_step": 152028, "epoch": 1831} {"train_loss": -23.295427322387695, "global_step": 152029, "epoch": 1831} {"train_loss": -22.81114387512207, "global_step": 152030, "epoch": 1831} {"train_loss": -23.2835750579834, "global_step": 152031, "epoch": 1831} {"train_loss": -23.233840942382812, "global_step": 152032, "epoch": 1831} {"train_loss": -23.500568389892578, "global_step": 152033, "epoch": 1831} {"train_loss": -23.24531364440918, "global_step": 152034, "epoch": 1831} {"train_loss": -23.570173263549805, "global_step": 152035, "epoch": 1831} {"train_loss": -23.509511947631836, "global_step": 152036, "epoch": 1831} {"train_loss": -23.79686164855957, "global_step": 152037, "epoch": 1831} {"train_loss": -23.796493530273438, "global_step": 152038, "epoch": 1831} {"train_loss": -23.335899353027344, "global_step": 152039, "epoch": 1831} {"train_loss": -23.435731887817383, "global_step": 152040, "epoch": 1831} {"train_loss": -23.37452507019043, "global_step": 152041, "epoch": 1831} {"train_loss": -22.795740127563477, "global_step": 152042, "epoch": 1831} {"train_loss": -23.243051528930664, "global_step": 152043, "epoch": 1831} {"train_loss": -23.578229904174805, "global_step": 152044, "epoch": 1831} {"train_loss": -23.367780685424805, "global_step": 152045, "epoch": 1831} {"train_loss": -23.10357093811035, "global_step": 152046, "epoch": 1831} {"train_loss": -23.191547393798828, "global_step": 152047, "epoch": 1831} {"train_loss": -23.098377227783203, "global_step": 152048, "epoch": 1831} {"train_loss": -22.7244815826416, "global_step": 152049, "epoch": 1831} {"train_loss": -22.86693572998047, "global_step": 152050, "epoch": 1831} {"train_loss": -22.815914154052734, "global_step": 152051, "epoch": 1831} {"train_loss": -23.335569381713867, "global_step": 152052, "epoch": 1831} {"train_loss": -23.00558090209961, "global_step": 152053, "epoch": 1831} {"train_loss": -23.365320205688477, "global_step": 152054, "epoch": 1831} {"train_loss": -23.238737451024804, "global_step": 152055, "epoch": 1831, "val_loss": 6306446.0} {"train_loss": -22.192747116088867, "global_step": 152056, "epoch": 1832} {"train_loss": -22.801809310913086, "global_step": 152057, "epoch": 1832} {"train_loss": -23.00682830810547, "global_step": 152058, "epoch": 1832} {"train_loss": -22.59930992126465, "global_step": 152059, "epoch": 1832} {"train_loss": -23.19038963317871, "global_step": 152060, "epoch": 1832} {"train_loss": -22.939424514770508, "global_step": 152061, "epoch": 1832} {"train_loss": -23.068265914916992, "global_step": 152062, "epoch": 1832} {"train_loss": -22.949737548828125, "global_step": 152063, "epoch": 1832} {"train_loss": -23.083236694335938, "global_step": 152064, "epoch": 1832} {"train_loss": -23.499086380004883, "global_step": 152065, "epoch": 1832} {"train_loss": -23.0781307220459, "global_step": 152066, "epoch": 1832} {"train_loss": -23.0230655670166, "global_step": 152067, "epoch": 1832} {"train_loss": -23.22214126586914, "global_step": 152068, "epoch": 1832} {"train_loss": -23.301166534423828, "global_step": 152069, "epoch": 1832} {"train_loss": -22.980363845825195, "global_step": 152070, "epoch": 1832} {"train_loss": -23.626604080200195, "global_step": 152071, "epoch": 1832} {"train_loss": -23.22450828552246, "global_step": 152072, "epoch": 1832} {"train_loss": -23.26091194152832, "global_step": 152073, "epoch": 1832} {"train_loss": -23.526079177856445, "global_step": 152074, "epoch": 1832} {"train_loss": -23.093738555908203, "global_step": 152075, "epoch": 1832} {"train_loss": -23.168075561523438, "global_step": 152076, "epoch": 1832} {"train_loss": -23.447879791259766, "global_step": 152077, "epoch": 1832} {"train_loss": -23.252084732055664, "global_step": 152078, "epoch": 1832} {"train_loss": -23.209421157836914, "global_step": 152079, "epoch": 1832} {"train_loss": -23.224206924438477, "global_step": 152080, "epoch": 1832} {"train_loss": -23.31302833557129, "global_step": 152081, "epoch": 1832} {"train_loss": -23.51272964477539, "global_step": 152082, "epoch": 1832} {"train_loss": -23.386123657226562, "global_step": 152083, "epoch": 1832} {"train_loss": -22.82178497314453, "global_step": 152084, "epoch": 1832} {"train_loss": -23.257497787475586, "global_step": 152085, "epoch": 1832} {"train_loss": -23.4860897064209, "global_step": 152086, "epoch": 1832} {"train_loss": -23.499570846557617, "global_step": 152087, "epoch": 1832} {"train_loss": -23.00666618347168, "global_step": 152088, "epoch": 1832} {"train_loss": -23.34567642211914, "global_step": 152089, "epoch": 1832} {"train_loss": -23.140796661376953, "global_step": 152090, "epoch": 1832} {"train_loss": -22.89533042907715, "global_step": 152091, "epoch": 1832} {"train_loss": -23.259994506835938, "global_step": 152092, "epoch": 1832} {"train_loss": -23.704675674438477, "global_step": 152093, "epoch": 1832} {"train_loss": -23.36904525756836, "global_step": 152094, "epoch": 1832} {"train_loss": -23.055505752563477, "global_step": 152095, "epoch": 1832} {"train_loss": -23.166162490844727, "global_step": 152096, "epoch": 1832} {"train_loss": -23.415334701538086, "global_step": 152097, "epoch": 1832} {"train_loss": -23.002870559692383, "global_step": 152098, "epoch": 1832} {"train_loss": -23.406206130981445, "global_step": 152099, "epoch": 1832} {"train_loss": -23.169523239135742, "global_step": 152100, "epoch": 1832} {"train_loss": -23.211822509765625, "global_step": 152101, "epoch": 1832} {"train_loss": -23.207931518554688, "global_step": 152102, "epoch": 1832} {"train_loss": -23.524425506591797, "global_step": 152103, "epoch": 1832} {"train_loss": -23.215911865234375, "global_step": 152104, "epoch": 1832} {"train_loss": -23.586599349975586, "global_step": 152105, "epoch": 1832} {"train_loss": -23.540760040283203, "global_step": 152106, "epoch": 1832} {"train_loss": -23.1160831451416, "global_step": 152107, "epoch": 1832} {"train_loss": -23.512680053710938, "global_step": 152108, "epoch": 1832} {"train_loss": -23.359251022338867, "global_step": 152109, "epoch": 1832} {"train_loss": -23.311262130737305, "global_step": 152110, "epoch": 1832} {"train_loss": -23.297706604003906, "global_step": 152111, "epoch": 1832} {"train_loss": -23.349613189697266, "global_step": 152112, "epoch": 1832} {"train_loss": -23.238868713378906, "global_step": 152113, "epoch": 1832} {"train_loss": -23.473684310913086, "global_step": 152114, "epoch": 1832} {"train_loss": -23.20115089416504, "global_step": 152115, "epoch": 1832} {"train_loss": -23.136701583862305, "global_step": 152116, "epoch": 1832} {"train_loss": -22.988140106201172, "global_step": 152117, "epoch": 1832} {"train_loss": -23.145999908447266, "global_step": 152118, "epoch": 1832} {"train_loss": -23.19073486328125, "global_step": 152119, "epoch": 1832} {"train_loss": -23.356863021850586, "global_step": 152120, "epoch": 1832} {"train_loss": -22.973691940307617, "global_step": 152121, "epoch": 1832} {"train_loss": -22.9892635345459, "global_step": 152122, "epoch": 1832} {"train_loss": -23.463333129882812, "global_step": 152123, "epoch": 1832} {"train_loss": -23.428478240966797, "global_step": 152124, "epoch": 1832} {"train_loss": -22.986467361450195, "global_step": 152125, "epoch": 1832} {"train_loss": -23.322200775146484, "global_step": 152126, "epoch": 1832} {"train_loss": -23.28706932067871, "global_step": 152127, "epoch": 1832} {"train_loss": -23.346206665039062, "global_step": 152128, "epoch": 1832} {"train_loss": -23.36063003540039, "global_step": 152129, "epoch": 1832} {"train_loss": -23.487384796142578, "global_step": 152130, "epoch": 1832} {"train_loss": -23.3410701751709, "global_step": 152131, "epoch": 1832} {"train_loss": -23.145212173461914, "global_step": 152132, "epoch": 1832} {"train_loss": -23.40125846862793, "global_step": 152133, "epoch": 1832} {"train_loss": -23.600173950195312, "global_step": 152134, "epoch": 1832} {"train_loss": -23.395721435546875, "global_step": 152135, "epoch": 1832} {"train_loss": -23.56326675415039, "global_step": 152136, "epoch": 1832} {"train_loss": -23.26038360595703, "global_step": 152137, "epoch": 1832} {"train_loss": -23.24191723099674, "global_step": 152138, "epoch": 1832, "val_loss": 6304885.0} {"train_loss": -22.142179489135742, "global_step": 152139, "epoch": 1833} {"train_loss": -21.483427047729492, "global_step": 152140, "epoch": 1833} {"train_loss": -22.065738677978516, "global_step": 152141, "epoch": 1833} {"train_loss": -23.03184700012207, "global_step": 152142, "epoch": 1833} {"train_loss": -22.456058502197266, "global_step": 152143, "epoch": 1833} {"train_loss": -22.310510635375977, "global_step": 152144, "epoch": 1833} {"train_loss": -22.16277503967285, "global_step": 152145, "epoch": 1833} {"train_loss": -22.112384796142578, "global_step": 152146, "epoch": 1833} {"train_loss": -22.189815521240234, "global_step": 152147, "epoch": 1833} {"train_loss": -22.2164363861084, "global_step": 152148, "epoch": 1833} {"train_loss": -22.530593872070312, "global_step": 152149, "epoch": 1833} {"train_loss": -22.421831130981445, "global_step": 152150, "epoch": 1833} {"train_loss": -22.463071823120117, "global_step": 152151, "epoch": 1833} {"train_loss": -22.573562622070312, "global_step": 152152, "epoch": 1833} {"train_loss": -22.4567813873291, "global_step": 152153, "epoch": 1833} {"train_loss": -22.35739517211914, "global_step": 152154, "epoch": 1833} {"train_loss": -22.562259674072266, "global_step": 152155, "epoch": 1833} {"train_loss": -22.932296752929688, "global_step": 152156, "epoch": 1833} {"train_loss": -22.30629539489746, "global_step": 152157, "epoch": 1833} {"train_loss": -22.88815689086914, "global_step": 152158, "epoch": 1833} {"train_loss": -22.452579498291016, "global_step": 152159, "epoch": 1833} {"train_loss": -22.8124942779541, "global_step": 152160, "epoch": 1833} {"train_loss": -23.04043960571289, "global_step": 152161, "epoch": 1833} {"train_loss": -22.67275047302246, "global_step": 152162, "epoch": 1833} {"train_loss": -22.9704532623291, "global_step": 152163, "epoch": 1833} {"train_loss": -22.967483520507812, "global_step": 152164, "epoch": 1833} {"train_loss": -22.98274040222168, "global_step": 152165, "epoch": 1833} {"train_loss": -23.07551383972168, "global_step": 152166, "epoch": 1833} {"train_loss": -23.25605010986328, "global_step": 152167, "epoch": 1833} {"train_loss": -22.594846725463867, "global_step": 152168, "epoch": 1833} {"train_loss": -23.377607345581055, "global_step": 152169, "epoch": 1833} {"train_loss": -22.981359481811523, "global_step": 152170, "epoch": 1833} {"train_loss": -23.26753044128418, "global_step": 152171, "epoch": 1833} {"train_loss": -22.943923950195312, "global_step": 152172, "epoch": 1833} {"train_loss": -23.31468391418457, "global_step": 152173, "epoch": 1833} {"train_loss": -23.284616470336914, "global_step": 152174, "epoch": 1833} {"train_loss": -22.923477172851562, "global_step": 152175, "epoch": 1833} {"train_loss": -22.8498592376709, "global_step": 152176, "epoch": 1833} {"train_loss": -23.378921508789062, "global_step": 152177, "epoch": 1833} {"train_loss": -23.160968780517578, "global_step": 152178, "epoch": 1833} {"train_loss": -23.5345516204834, "global_step": 152179, "epoch": 1833} {"train_loss": -23.423751831054688, "global_step": 152180, "epoch": 1833} {"train_loss": -23.09157371520996, "global_step": 152181, "epoch": 1833} {"train_loss": -23.217615127563477, "global_step": 152182, "epoch": 1833} {"train_loss": -23.13922691345215, "global_step": 152183, "epoch": 1833} {"train_loss": -23.67646598815918, "global_step": 152184, "epoch": 1833} {"train_loss": -23.27564239501953, "global_step": 152185, "epoch": 1833} {"train_loss": -23.373464584350586, "global_step": 152186, "epoch": 1833} {"train_loss": -23.11911392211914, "global_step": 152187, "epoch": 1833} {"train_loss": -23.462827682495117, "global_step": 152188, "epoch": 1833} {"train_loss": -23.666105270385742, "global_step": 152189, "epoch": 1833} {"train_loss": -23.563045501708984, "global_step": 152190, "epoch": 1833} {"train_loss": -23.112295150756836, "global_step": 152191, "epoch": 1833} {"train_loss": -23.707565307617188, "global_step": 152192, "epoch": 1833} {"train_loss": -23.794233322143555, "global_step": 152193, "epoch": 1833} {"train_loss": -23.605606079101562, "global_step": 152194, "epoch": 1833} {"train_loss": -23.25833511352539, "global_step": 152195, "epoch": 1833} {"train_loss": -23.308284759521484, "global_step": 152196, "epoch": 1833} {"train_loss": -23.231515884399414, "global_step": 152197, "epoch": 1833} {"train_loss": -23.70172691345215, "global_step": 152198, "epoch": 1833} {"train_loss": -22.812702178955078, "global_step": 152199, "epoch": 1833} {"train_loss": -22.609804153442383, "global_step": 152200, "epoch": 1833} {"train_loss": -22.77153968811035, "global_step": 152201, "epoch": 1833} {"train_loss": -23.37456703186035, "global_step": 152202, "epoch": 1833} {"train_loss": -23.283048629760742, "global_step": 152203, "epoch": 1833} {"train_loss": -22.905954360961914, "global_step": 152204, "epoch": 1833} {"train_loss": -23.264699935913086, "global_step": 152205, "epoch": 1833} {"train_loss": -23.211645126342773, "global_step": 152206, "epoch": 1833} {"train_loss": -23.421140670776367, "global_step": 152207, "epoch": 1833} {"train_loss": -23.61952018737793, "global_step": 152208, "epoch": 1833} {"train_loss": -23.462890625, "global_step": 152209, "epoch": 1833} {"train_loss": -23.047531127929688, "global_step": 152210, "epoch": 1833} {"train_loss": -23.381772994995117, "global_step": 152211, "epoch": 1833} {"train_loss": -23.592920303344727, "global_step": 152212, "epoch": 1833} {"train_loss": -23.013347625732422, "global_step": 152213, "epoch": 1833} {"train_loss": -23.293888092041016, "global_step": 152214, "epoch": 1833} {"train_loss": -23.449363708496094, "global_step": 152215, "epoch": 1833} {"train_loss": -23.363235473632812, "global_step": 152216, "epoch": 1833} {"train_loss": -23.50214958190918, "global_step": 152217, "epoch": 1833} {"train_loss": -23.306547164916992, "global_step": 152218, "epoch": 1833} {"train_loss": -23.347909927368164, "global_step": 152219, "epoch": 1833} {"train_loss": -23.592679977416992, "global_step": 152220, "epoch": 1833} {"train_loss": -23.025597308055463, "global_step": 152221, "epoch": 1833, "val_loss": 6636566.0} {"train_loss": -22.624509811401367, "global_step": 152222, "epoch": 1834} {"train_loss": -22.69777488708496, "global_step": 152223, "epoch": 1834} {"train_loss": -23.065017700195312, "global_step": 152224, "epoch": 1834} {"train_loss": -22.811908721923828, "global_step": 152225, "epoch": 1834} {"train_loss": -23.09025001525879, "global_step": 152226, "epoch": 1834} {"train_loss": -22.989273071289062, "global_step": 152227, "epoch": 1834} {"train_loss": -23.211257934570312, "global_step": 152228, "epoch": 1834} {"train_loss": -23.49175453186035, "global_step": 152229, "epoch": 1834} {"train_loss": -22.86661720275879, "global_step": 152230, "epoch": 1834} {"train_loss": -23.2694091796875, "global_step": 152231, "epoch": 1834} {"train_loss": -23.12801170349121, "global_step": 152232, "epoch": 1834} {"train_loss": -23.24080467224121, "global_step": 152233, "epoch": 1834} {"train_loss": -23.608755111694336, "global_step": 152234, "epoch": 1834} {"train_loss": -23.524736404418945, "global_step": 152235, "epoch": 1834} {"train_loss": -23.081396102905273, "global_step": 152236, "epoch": 1834} {"train_loss": -23.529996871948242, "global_step": 152237, "epoch": 1834} {"train_loss": -23.318565368652344, "global_step": 152238, "epoch": 1834} {"train_loss": -23.141193389892578, "global_step": 152239, "epoch": 1834} {"train_loss": -23.293027877807617, "global_step": 152240, "epoch": 1834} {"train_loss": -23.379411697387695, "global_step": 152241, "epoch": 1834} {"train_loss": -23.060028076171875, "global_step": 152242, "epoch": 1834} {"train_loss": -23.19389533996582, "global_step": 152243, "epoch": 1834} {"train_loss": -23.456151962280273, "global_step": 152244, "epoch": 1834} {"train_loss": -23.399137496948242, "global_step": 152245, "epoch": 1834} {"train_loss": -23.424612045288086, "global_step": 152246, "epoch": 1834} {"train_loss": -23.17317008972168, "global_step": 152247, "epoch": 1834} {"train_loss": -23.633148193359375, "global_step": 152248, "epoch": 1834} {"train_loss": -23.333730697631836, "global_step": 152249, "epoch": 1834} {"train_loss": -23.653684616088867, "global_step": 152250, "epoch": 1834} {"train_loss": -23.464740753173828, "global_step": 152251, "epoch": 1834} {"train_loss": -23.417085647583008, "global_step": 152252, "epoch": 1834} {"train_loss": -23.35492515563965, "global_step": 152253, "epoch": 1834} {"train_loss": -23.545578002929688, "global_step": 152254, "epoch": 1834} {"train_loss": -23.360116958618164, "global_step": 152255, "epoch": 1834} {"train_loss": -23.065799713134766, "global_step": 152256, "epoch": 1834} {"train_loss": -23.322816848754883, "global_step": 152257, "epoch": 1834} {"train_loss": -23.128576278686523, "global_step": 152258, "epoch": 1834} {"train_loss": -23.1704044342041, "global_step": 152259, "epoch": 1834} {"train_loss": -22.83681297302246, "global_step": 152260, "epoch": 1834} {"train_loss": -23.353071212768555, "global_step": 152261, "epoch": 1834} {"train_loss": -23.320720672607422, "global_step": 152262, "epoch": 1834} {"train_loss": -23.19660758972168, "global_step": 152263, "epoch": 1834} {"train_loss": -23.030263900756836, "global_step": 152264, "epoch": 1834} {"train_loss": -23.174123764038086, "global_step": 152265, "epoch": 1834} {"train_loss": -23.4368896484375, "global_step": 152266, "epoch": 1834} {"train_loss": -23.482242584228516, "global_step": 152267, "epoch": 1834} {"train_loss": -23.37836265563965, "global_step": 152268, "epoch": 1834} {"train_loss": -23.133560180664062, "global_step": 152269, "epoch": 1834} {"train_loss": -23.207111358642578, "global_step": 152270, "epoch": 1834} {"train_loss": -22.713287353515625, "global_step": 152271, "epoch": 1834} {"train_loss": -23.67457389831543, "global_step": 152272, "epoch": 1834} {"train_loss": -23.52359962463379, "global_step": 152273, "epoch": 1834} {"train_loss": -22.923660278320312, "global_step": 152274, "epoch": 1834} {"train_loss": -23.197717666625977, "global_step": 152275, "epoch": 1834} {"train_loss": -23.177087783813477, "global_step": 152276, "epoch": 1834} {"train_loss": -23.601470947265625, "global_step": 152277, "epoch": 1834} {"train_loss": -23.617612838745117, "global_step": 152278, "epoch": 1834} {"train_loss": -23.488384246826172, "global_step": 152279, "epoch": 1834} {"train_loss": -23.555431365966797, "global_step": 152280, "epoch": 1834} {"train_loss": -23.088666915893555, "global_step": 152281, "epoch": 1834} {"train_loss": -23.278602600097656, "global_step": 152282, "epoch": 1834} {"train_loss": -22.98768424987793, "global_step": 152283, "epoch": 1834} {"train_loss": -23.667984008789062, "global_step": 152284, "epoch": 1834} {"train_loss": -23.43082046508789, "global_step": 152285, "epoch": 1834} {"train_loss": -23.000810623168945, "global_step": 152286, "epoch": 1834} {"train_loss": -22.728275299072266, "global_step": 152287, "epoch": 1834} {"train_loss": -22.87501335144043, "global_step": 152288, "epoch": 1834} {"train_loss": -23.409914016723633, "global_step": 152289, "epoch": 1834} {"train_loss": -23.484228134155273, "global_step": 152290, "epoch": 1834} {"train_loss": -23.41973304748535, "global_step": 152291, "epoch": 1834} {"train_loss": -23.271039962768555, "global_step": 152292, "epoch": 1834} {"train_loss": -23.135557174682617, "global_step": 152293, "epoch": 1834} {"train_loss": -23.19463539123535, "global_step": 152294, "epoch": 1834} {"train_loss": -23.660297393798828, "global_step": 152295, "epoch": 1834} {"train_loss": -23.712825775146484, "global_step": 152296, "epoch": 1834} {"train_loss": -23.233951568603516, "global_step": 152297, "epoch": 1834} {"train_loss": -23.436269760131836, "global_step": 152298, "epoch": 1834} {"train_loss": -23.281105041503906, "global_step": 152299, "epoch": 1834} {"train_loss": -23.148441314697266, "global_step": 152300, "epoch": 1834} {"train_loss": -23.468996047973633, "global_step": 152301, "epoch": 1834} {"train_loss": -23.599552154541016, "global_step": 152302, "epoch": 1834} {"train_loss": -23.461389541625977, "global_step": 152303, "epoch": 1834} {"train_loss": -23.286229788538922, "global_step": 152304, "epoch": 1834, "val_loss": 6324920.5} {"train_loss": -22.608041763305664, "global_step": 152305, "epoch": 1835} {"train_loss": -21.7326717376709, "global_step": 152306, "epoch": 1835} {"train_loss": -22.59595489501953, "global_step": 152307, "epoch": 1835} {"train_loss": -23.16686248779297, "global_step": 152308, "epoch": 1835} {"train_loss": -22.601966857910156, "global_step": 152309, "epoch": 1835} {"train_loss": -22.63861083984375, "global_step": 152310, "epoch": 1835} {"train_loss": -22.960561752319336, "global_step": 152311, "epoch": 1835} {"train_loss": -22.74197769165039, "global_step": 152312, "epoch": 1835} {"train_loss": -23.271102905273438, "global_step": 152313, "epoch": 1835} {"train_loss": -23.287464141845703, "global_step": 152314, "epoch": 1835} {"train_loss": -23.117633819580078, "global_step": 152315, "epoch": 1835} {"train_loss": -23.19538688659668, "global_step": 152316, "epoch": 1835} {"train_loss": -22.949087142944336, "global_step": 152317, "epoch": 1835} {"train_loss": -23.138957977294922, "global_step": 152318, "epoch": 1835} {"train_loss": -22.96233558654785, "global_step": 152319, "epoch": 1835} {"train_loss": -22.717575073242188, "global_step": 152320, "epoch": 1835} {"train_loss": -22.863298416137695, "global_step": 152321, "epoch": 1835} {"train_loss": -23.390045166015625, "global_step": 152322, "epoch": 1835} {"train_loss": -22.669095993041992, "global_step": 152323, "epoch": 1835} {"train_loss": -23.199344635009766, "global_step": 152324, "epoch": 1835} {"train_loss": -23.522306442260742, "global_step": 152325, "epoch": 1835} {"train_loss": -23.2131404876709, "global_step": 152326, "epoch": 1835} {"train_loss": -23.090133666992188, "global_step": 152327, "epoch": 1835} {"train_loss": -23.49066734313965, "global_step": 152328, "epoch": 1835} {"train_loss": -23.392866134643555, "global_step": 152329, "epoch": 1835} {"train_loss": -23.581106185913086, "global_step": 152330, "epoch": 1835} {"train_loss": -23.164138793945312, "global_step": 152331, "epoch": 1835} {"train_loss": -23.758350372314453, "global_step": 152332, "epoch": 1835} {"train_loss": -23.366352081298828, "global_step": 152333, "epoch": 1835} {"train_loss": -23.284391403198242, "global_step": 152334, "epoch": 1835} {"train_loss": -23.299100875854492, "global_step": 152335, "epoch": 1835} {"train_loss": -23.387845993041992, "global_step": 152336, "epoch": 1835} {"train_loss": -23.497589111328125, "global_step": 152337, "epoch": 1835} {"train_loss": -23.595670700073242, "global_step": 152338, "epoch": 1835} {"train_loss": -23.110021591186523, "global_step": 152339, "epoch": 1835} {"train_loss": -23.292572021484375, "global_step": 152340, "epoch": 1835} {"train_loss": -23.331357955932617, "global_step": 152341, "epoch": 1835} {"train_loss": -23.594968795776367, "global_step": 152342, "epoch": 1835} {"train_loss": -23.420244216918945, "global_step": 152343, "epoch": 1835} {"train_loss": -23.127954483032227, "global_step": 152344, "epoch": 1835} {"train_loss": -23.551427841186523, "global_step": 152345, "epoch": 1835} {"train_loss": -22.968381881713867, "global_step": 152346, "epoch": 1835} {"train_loss": -22.86153221130371, "global_step": 152347, "epoch": 1835} {"train_loss": -23.061918258666992, "global_step": 152348, "epoch": 1835} {"train_loss": -23.1688289642334, "global_step": 152349, "epoch": 1835} {"train_loss": -23.04526138305664, "global_step": 152350, "epoch": 1835} {"train_loss": -23.46815299987793, "global_step": 152351, "epoch": 1835} {"train_loss": -23.48662757873535, "global_step": 152352, "epoch": 1835} {"train_loss": -23.3272647857666, "global_step": 152353, "epoch": 1835} {"train_loss": -23.5755672454834, "global_step": 152354, "epoch": 1835} {"train_loss": -23.261220932006836, "global_step": 152355, "epoch": 1835} {"train_loss": -23.55805778503418, "global_step": 152356, "epoch": 1835} {"train_loss": -23.138235092163086, "global_step": 152357, "epoch": 1835} {"train_loss": -23.454015731811523, "global_step": 152358, "epoch": 1835} {"train_loss": -22.64472770690918, "global_step": 152359, "epoch": 1835} {"train_loss": -23.088932037353516, "global_step": 152360, "epoch": 1835} {"train_loss": -22.99371910095215, "global_step": 152361, "epoch": 1835} {"train_loss": -23.231250762939453, "global_step": 152362, "epoch": 1835} {"train_loss": -23.07497215270996, "global_step": 152363, "epoch": 1835} {"train_loss": -23.113943099975586, "global_step": 152364, "epoch": 1835} {"train_loss": -23.662107467651367, "global_step": 152365, "epoch": 1835} {"train_loss": -23.0841121673584, "global_step": 152366, "epoch": 1835} {"train_loss": -23.110843658447266, "global_step": 152367, "epoch": 1835} {"train_loss": -23.324254989624023, "global_step": 152368, "epoch": 1835} {"train_loss": -23.61147117614746, "global_step": 152369, "epoch": 1835} {"train_loss": -23.40248680114746, "global_step": 152370, "epoch": 1835} {"train_loss": -23.445215225219727, "global_step": 152371, "epoch": 1835} {"train_loss": -23.499624252319336, "global_step": 152372, "epoch": 1835} {"train_loss": -23.435791015625, "global_step": 152373, "epoch": 1835} {"train_loss": -23.559988021850586, "global_step": 152374, "epoch": 1835} {"train_loss": -23.717626571655273, "global_step": 152375, "epoch": 1835} {"train_loss": -23.243684768676758, "global_step": 152376, "epoch": 1835} {"train_loss": -23.34307289123535, "global_step": 152377, "epoch": 1835} {"train_loss": -23.38898277282715, "global_step": 152378, "epoch": 1835} {"train_loss": -23.773351669311523, "global_step": 152379, "epoch": 1835} {"train_loss": -23.30171012878418, "global_step": 152380, "epoch": 1835} {"train_loss": -23.613134384155273, "global_step": 152381, "epoch": 1835} {"train_loss": -23.346088409423828, "global_step": 152382, "epoch": 1835} {"train_loss": -23.36813735961914, "global_step": 152383, "epoch": 1835} {"train_loss": -23.221017837524414, "global_step": 152384, "epoch": 1835} {"train_loss": -23.278709411621094, "global_step": 152385, "epoch": 1835} {"train_loss": -23.695642471313477, "global_step": 152386, "epoch": 1835} {"train_loss": -23.215213545833727, "global_step": 152387, "epoch": 1835, "val_loss": 6216829.0} {"train_loss": -20.67354393005371, "global_step": 152388, "epoch": 1836} {"train_loss": -22.2961483001709, "global_step": 152389, "epoch": 1836} {"train_loss": -21.41413688659668, "global_step": 152390, "epoch": 1836} {"train_loss": -21.78043556213379, "global_step": 152391, "epoch": 1836} {"train_loss": -21.53428077697754, "global_step": 152392, "epoch": 1836} {"train_loss": -22.378236770629883, "global_step": 152393, "epoch": 1836} {"train_loss": -21.937345504760742, "global_step": 152394, "epoch": 1836} {"train_loss": -22.374967575073242, "global_step": 152395, "epoch": 1836} {"train_loss": -22.17567253112793, "global_step": 152396, "epoch": 1836} {"train_loss": -22.25234031677246, "global_step": 152397, "epoch": 1836} {"train_loss": -22.241897583007812, "global_step": 152398, "epoch": 1836} {"train_loss": -22.487083435058594, "global_step": 152399, "epoch": 1836} {"train_loss": -22.45460319519043, "global_step": 152400, "epoch": 1836} {"train_loss": -22.479345321655273, "global_step": 152401, "epoch": 1836} {"train_loss": -22.116334915161133, "global_step": 152402, "epoch": 1836} {"train_loss": -22.31144142150879, "global_step": 152403, "epoch": 1836} {"train_loss": -22.33102798461914, "global_step": 152404, "epoch": 1836} {"train_loss": -22.485727310180664, "global_step": 152405, "epoch": 1836} {"train_loss": -22.763385772705078, "global_step": 152406, "epoch": 1836} {"train_loss": -22.589353561401367, "global_step": 152407, "epoch": 1836} {"train_loss": -22.65333366394043, "global_step": 152408, "epoch": 1836} {"train_loss": -22.60367202758789, "global_step": 152409, "epoch": 1836} {"train_loss": -23.022920608520508, "global_step": 152410, "epoch": 1836} {"train_loss": -22.693496704101562, "global_step": 152411, "epoch": 1836} {"train_loss": -22.759658813476562, "global_step": 152412, "epoch": 1836} {"train_loss": -22.422822952270508, "global_step": 152413, "epoch": 1836} {"train_loss": -22.884199142456055, "global_step": 152414, "epoch": 1836} {"train_loss": -23.094892501831055, "global_step": 152415, "epoch": 1836} {"train_loss": -22.803586959838867, "global_step": 152416, "epoch": 1836} {"train_loss": -22.8856258392334, "global_step": 152417, "epoch": 1836} {"train_loss": -22.770917892456055, "global_step": 152418, "epoch": 1836} {"train_loss": -22.858999252319336, "global_step": 152419, "epoch": 1836} {"train_loss": -22.763492584228516, "global_step": 152420, "epoch": 1836} {"train_loss": -23.0974063873291, "global_step": 152421, "epoch": 1836} {"train_loss": -23.217559814453125, "global_step": 152422, "epoch": 1836} {"train_loss": -23.101598739624023, "global_step": 152423, "epoch": 1836} {"train_loss": -23.17586326599121, "global_step": 152424, "epoch": 1836} {"train_loss": -23.075946807861328, "global_step": 152425, "epoch": 1836} {"train_loss": -22.72808265686035, "global_step": 152426, "epoch": 1836} {"train_loss": -23.429590225219727, "global_step": 152427, "epoch": 1836} {"train_loss": -22.709997177124023, "global_step": 152428, "epoch": 1836} {"train_loss": -23.12676429748535, "global_step": 152429, "epoch": 1836} {"train_loss": -23.62956428527832, "global_step": 152430, "epoch": 1836} {"train_loss": -22.901288986206055, "global_step": 152431, "epoch": 1836} {"train_loss": -23.40274429321289, "global_step": 152432, "epoch": 1836} {"train_loss": -23.284534454345703, "global_step": 152433, "epoch": 1836} {"train_loss": -23.12571144104004, "global_step": 152434, "epoch": 1836} {"train_loss": -23.754215240478516, "global_step": 152435, "epoch": 1836} {"train_loss": -23.784442901611328, "global_step": 152436, "epoch": 1836} {"train_loss": -23.534921646118164, "global_step": 152437, "epoch": 1836} {"train_loss": -23.0244197845459, "global_step": 152438, "epoch": 1836} {"train_loss": -23.641042709350586, "global_step": 152439, "epoch": 1836} {"train_loss": -23.450937271118164, "global_step": 152440, "epoch": 1836} {"train_loss": -23.098812103271484, "global_step": 152441, "epoch": 1836} {"train_loss": -23.758739471435547, "global_step": 152442, "epoch": 1836} {"train_loss": -23.50153160095215, "global_step": 152443, "epoch": 1836} {"train_loss": -23.66410255432129, "global_step": 152444, "epoch": 1836} {"train_loss": -23.135818481445312, "global_step": 152445, "epoch": 1836} {"train_loss": -23.347644805908203, "global_step": 152446, "epoch": 1836} {"train_loss": -23.586862564086914, "global_step": 152447, "epoch": 1836} {"train_loss": -23.256271362304688, "global_step": 152448, "epoch": 1836} {"train_loss": -23.471899032592773, "global_step": 152449, "epoch": 1836} {"train_loss": -23.6767635345459, "global_step": 152450, "epoch": 1836} {"train_loss": -23.303171157836914, "global_step": 152451, "epoch": 1836} {"train_loss": -23.629262924194336, "global_step": 152452, "epoch": 1836} {"train_loss": -23.458524703979492, "global_step": 152453, "epoch": 1836} {"train_loss": -23.362783432006836, "global_step": 152454, "epoch": 1836} {"train_loss": -22.940536499023438, "global_step": 152455, "epoch": 1836} {"train_loss": -23.674942016601562, "global_step": 152456, "epoch": 1836} {"train_loss": -23.079696655273438, "global_step": 152457, "epoch": 1836} {"train_loss": -23.200830459594727, "global_step": 152458, "epoch": 1836} {"train_loss": -23.441965103149414, "global_step": 152459, "epoch": 1836} {"train_loss": -23.11932945251465, "global_step": 152460, "epoch": 1836} {"train_loss": -23.65264892578125, "global_step": 152461, "epoch": 1836} {"train_loss": -23.576623916625977, "global_step": 152462, "epoch": 1836} {"train_loss": -23.060449600219727, "global_step": 152463, "epoch": 1836} {"train_loss": -23.788652420043945, "global_step": 152464, "epoch": 1836} {"train_loss": -23.300668716430664, "global_step": 152465, "epoch": 1836} {"train_loss": -23.547407150268555, "global_step": 152466, "epoch": 1836} {"train_loss": -23.400728225708008, "global_step": 152467, "epoch": 1836} {"train_loss": -23.624467849731445, "global_step": 152468, "epoch": 1836} {"train_loss": -23.437976837158203, "global_step": 152469, "epoch": 1836} {"train_loss": -22.976815487965045, "global_step": 152470, "epoch": 1836, "val_loss": 6358499.5} {"train_loss": -23.353666305541992, "global_step": 152471, "epoch": 1837} {"train_loss": -23.01251220703125, "global_step": 152472, "epoch": 1837} {"train_loss": -23.17220115661621, "global_step": 152473, "epoch": 1837} {"train_loss": -22.967924118041992, "global_step": 152474, "epoch": 1837} {"train_loss": -22.931251525878906, "global_step": 152475, "epoch": 1837} {"train_loss": -22.928466796875, "global_step": 152476, "epoch": 1837} {"train_loss": -23.14164161682129, "global_step": 152477, "epoch": 1837} {"train_loss": -23.0643367767334, "global_step": 152478, "epoch": 1837} {"train_loss": -23.2595157623291, "global_step": 152479, "epoch": 1837} {"train_loss": -22.786182403564453, "global_step": 152480, "epoch": 1837} {"train_loss": -23.53229522705078, "global_step": 152481, "epoch": 1837} {"train_loss": -23.18128204345703, "global_step": 152482, "epoch": 1837} {"train_loss": -23.28444480895996, "global_step": 152483, "epoch": 1837} {"train_loss": -23.191436767578125, "global_step": 152484, "epoch": 1837} {"train_loss": -23.075300216674805, "global_step": 152485, "epoch": 1837} {"train_loss": -23.342880249023438, "global_step": 152486, "epoch": 1837} {"train_loss": -23.399221420288086, "global_step": 152487, "epoch": 1837} {"train_loss": -23.04595184326172, "global_step": 152488, "epoch": 1837} {"train_loss": -23.23479461669922, "global_step": 152489, "epoch": 1837} {"train_loss": -23.31660270690918, "global_step": 152490, "epoch": 1837} {"train_loss": -23.051944732666016, "global_step": 152491, "epoch": 1837} {"train_loss": -23.42380714416504, "global_step": 152492, "epoch": 1837} {"train_loss": -23.45118522644043, "global_step": 152493, "epoch": 1837} {"train_loss": -23.568822860717773, "global_step": 152494, "epoch": 1837} {"train_loss": -23.13689613342285, "global_step": 152495, "epoch": 1837} {"train_loss": -23.4832706451416, "global_step": 152496, "epoch": 1837} {"train_loss": -23.515867233276367, "global_step": 152497, "epoch": 1837} {"train_loss": -23.431745529174805, "global_step": 152498, "epoch": 1837} {"train_loss": -23.38201904296875, "global_step": 152499, "epoch": 1837} {"train_loss": -22.95136070251465, "global_step": 152500, "epoch": 1837} {"train_loss": -23.63746452331543, "global_step": 152501, "epoch": 1837} {"train_loss": -23.50569725036621, "global_step": 152502, "epoch": 1837} {"train_loss": -22.96595573425293, "global_step": 152503, "epoch": 1837} {"train_loss": -23.345947265625, "global_step": 152504, "epoch": 1837} {"train_loss": -23.560667037963867, "global_step": 152505, "epoch": 1837} {"train_loss": -23.327346801757812, "global_step": 152506, "epoch": 1837} {"train_loss": -23.566038131713867, "global_step": 152507, "epoch": 1837} {"train_loss": -23.415678024291992, "global_step": 152508, "epoch": 1837} {"train_loss": -23.170591354370117, "global_step": 152509, "epoch": 1837} {"train_loss": -23.451879501342773, "global_step": 152510, "epoch": 1837} {"train_loss": -23.6666316986084, "global_step": 152511, "epoch": 1837} {"train_loss": -23.53206443786621, "global_step": 152512, "epoch": 1837} {"train_loss": -23.015844345092773, "global_step": 152513, "epoch": 1837} {"train_loss": -23.314184188842773, "global_step": 152514, "epoch": 1837} {"train_loss": -23.508588790893555, "global_step": 152515, "epoch": 1837} {"train_loss": -23.389131546020508, "global_step": 152516, "epoch": 1837} {"train_loss": -23.485584259033203, "global_step": 152517, "epoch": 1837} {"train_loss": -23.434478759765625, "global_step": 152518, "epoch": 1837} {"train_loss": -23.480863571166992, "global_step": 152519, "epoch": 1837} {"train_loss": -23.42340660095215, "global_step": 152520, "epoch": 1837} {"train_loss": -22.99197006225586, "global_step": 152521, "epoch": 1837} {"train_loss": -23.147157669067383, "global_step": 152522, "epoch": 1837} {"train_loss": -23.139673233032227, "global_step": 152523, "epoch": 1837} {"train_loss": -23.590518951416016, "global_step": 152524, "epoch": 1837} {"train_loss": -23.456571578979492, "global_step": 152525, "epoch": 1837} {"train_loss": -23.44004249572754, "global_step": 152526, "epoch": 1837} {"train_loss": -23.5455322265625, "global_step": 152527, "epoch": 1837} {"train_loss": -23.686880111694336, "global_step": 152528, "epoch": 1837} {"train_loss": -23.736684799194336, "global_step": 152529, "epoch": 1837} {"train_loss": -23.891386032104492, "global_step": 152530, "epoch": 1837} {"train_loss": -23.17160987854004, "global_step": 152531, "epoch": 1837} {"train_loss": -23.738447189331055, "global_step": 152532, "epoch": 1837} {"train_loss": -23.020254135131836, "global_step": 152533, "epoch": 1837} {"train_loss": -23.50604820251465, "global_step": 152534, "epoch": 1837} {"train_loss": -23.278705596923828, "global_step": 152535, "epoch": 1837} {"train_loss": -23.357280731201172, "global_step": 152536, "epoch": 1837} {"train_loss": -23.5999755859375, "global_step": 152537, "epoch": 1837} {"train_loss": -23.304468154907227, "global_step": 152538, "epoch": 1837} {"train_loss": -22.922006607055664, "global_step": 152539, "epoch": 1837} {"train_loss": -23.7310791015625, "global_step": 152540, "epoch": 1837} {"train_loss": -23.318662643432617, "global_step": 152541, "epoch": 1837} {"train_loss": -23.572839736938477, "global_step": 152542, "epoch": 1837} {"train_loss": -23.638046264648438, "global_step": 152543, "epoch": 1837} {"train_loss": -23.542217254638672, "global_step": 152544, "epoch": 1837} {"train_loss": -23.248584747314453, "global_step": 152545, "epoch": 1837} {"train_loss": -23.52264404296875, "global_step": 152546, "epoch": 1837} {"train_loss": -23.47818374633789, "global_step": 152547, "epoch": 1837} {"train_loss": -23.622411727905273, "global_step": 152548, "epoch": 1837} {"train_loss": -23.494142532348633, "global_step": 152549, "epoch": 1837} {"train_loss": -23.43597984313965, "global_step": 152550, "epoch": 1837} {"train_loss": -23.140216827392578, "global_step": 152551, "epoch": 1837} {"train_loss": -23.561370849609375, "global_step": 152552, "epoch": 1837} {"train_loss": -23.342836678746234, "global_step": 152553, "epoch": 1837, "val_loss": 6195651.0} {"train_loss": -22.103219985961914, "global_step": 152554, "epoch": 1838} {"train_loss": -22.552465438842773, "global_step": 152555, "epoch": 1838} {"train_loss": -22.688983917236328, "global_step": 152556, "epoch": 1838} {"train_loss": -22.568164825439453, "global_step": 152557, "epoch": 1838} {"train_loss": -23.14994239807129, "global_step": 152558, "epoch": 1838} {"train_loss": -22.687013626098633, "global_step": 152559, "epoch": 1838} {"train_loss": -22.43212127685547, "global_step": 152560, "epoch": 1838} {"train_loss": -23.01558494567871, "global_step": 152561, "epoch": 1838} {"train_loss": -23.084232330322266, "global_step": 152562, "epoch": 1838} {"train_loss": -22.58206558227539, "global_step": 152563, "epoch": 1838} {"train_loss": -22.441450119018555, "global_step": 152564, "epoch": 1838} {"train_loss": -22.811155319213867, "global_step": 152565, "epoch": 1838} {"train_loss": -22.85700798034668, "global_step": 152566, "epoch": 1838} {"train_loss": -22.9013671875, "global_step": 152567, "epoch": 1838} {"train_loss": -22.922746658325195, "global_step": 152568, "epoch": 1838} {"train_loss": -22.868595123291016, "global_step": 152569, "epoch": 1838} {"train_loss": -23.094730377197266, "global_step": 152570, "epoch": 1838} {"train_loss": -23.088939666748047, "global_step": 152571, "epoch": 1838} {"train_loss": -23.1375675201416, "global_step": 152572, "epoch": 1838} {"train_loss": -22.936559677124023, "global_step": 152573, "epoch": 1838} {"train_loss": -23.20627784729004, "global_step": 152574, "epoch": 1838} {"train_loss": -22.91541290283203, "global_step": 152575, "epoch": 1838} {"train_loss": -23.246212005615234, "global_step": 152576, "epoch": 1838} {"train_loss": -23.07099151611328, "global_step": 152577, "epoch": 1838} {"train_loss": -23.093902587890625, "global_step": 152578, "epoch": 1838} {"train_loss": -23.209941864013672, "global_step": 152579, "epoch": 1838} {"train_loss": -23.289691925048828, "global_step": 152580, "epoch": 1838} {"train_loss": -23.0459041595459, "global_step": 152581, "epoch": 1838} {"train_loss": -23.24709129333496, "global_step": 152582, "epoch": 1838} {"train_loss": -23.176353454589844, "global_step": 152583, "epoch": 1838} {"train_loss": -23.250320434570312, "global_step": 152584, "epoch": 1838} {"train_loss": -23.370073318481445, "global_step": 152585, "epoch": 1838} {"train_loss": -23.58815574645996, "global_step": 152586, "epoch": 1838} {"train_loss": -23.182876586914062, "global_step": 152587, "epoch": 1838} {"train_loss": -22.844562530517578, "global_step": 152588, "epoch": 1838} {"train_loss": -23.2305908203125, "global_step": 152589, "epoch": 1838} {"train_loss": -23.020544052124023, "global_step": 152590, "epoch": 1838} {"train_loss": -23.370840072631836, "global_step": 152591, "epoch": 1838} {"train_loss": -23.15276527404785, "global_step": 152592, "epoch": 1838} {"train_loss": -23.604032516479492, "global_step": 152593, "epoch": 1838} {"train_loss": -23.151546478271484, "global_step": 152594, "epoch": 1838} {"train_loss": -23.045034408569336, "global_step": 152595, "epoch": 1838} {"train_loss": -23.443540573120117, "global_step": 152596, "epoch": 1838} {"train_loss": -23.362815856933594, "global_step": 152597, "epoch": 1838} {"train_loss": -23.525135040283203, "global_step": 152598, "epoch": 1838} {"train_loss": -23.245079040527344, "global_step": 152599, "epoch": 1838} {"train_loss": -23.15778923034668, "global_step": 152600, "epoch": 1838} {"train_loss": -23.659204483032227, "global_step": 152601, "epoch": 1838} {"train_loss": -23.60272216796875, "global_step": 152602, "epoch": 1838} {"train_loss": -23.55881118774414, "global_step": 152603, "epoch": 1838} {"train_loss": -23.6392879486084, "global_step": 152604, "epoch": 1838} {"train_loss": -23.373167037963867, "global_step": 152605, "epoch": 1838} {"train_loss": -23.720870971679688, "global_step": 152606, "epoch": 1838} {"train_loss": -23.300230026245117, "global_step": 152607, "epoch": 1838} {"train_loss": -23.49820899963379, "global_step": 152608, "epoch": 1838} {"train_loss": -23.49318504333496, "global_step": 152609, "epoch": 1838} {"train_loss": -23.207624435424805, "global_step": 152610, "epoch": 1838} {"train_loss": -23.308191299438477, "global_step": 152611, "epoch": 1838} {"train_loss": -23.147016525268555, "global_step": 152612, "epoch": 1838} {"train_loss": -23.665699005126953, "global_step": 152613, "epoch": 1838} {"train_loss": -22.983367919921875, "global_step": 152614, "epoch": 1838} {"train_loss": -23.104440689086914, "global_step": 152615, "epoch": 1838} {"train_loss": -23.5076847076416, "global_step": 152616, "epoch": 1838} {"train_loss": -23.444293975830078, "global_step": 152617, "epoch": 1838} {"train_loss": -23.23444938659668, "global_step": 152618, "epoch": 1838} {"train_loss": -23.6178035736084, "global_step": 152619, "epoch": 1838} {"train_loss": -23.652088165283203, "global_step": 152620, "epoch": 1838} {"train_loss": -23.102102279663086, "global_step": 152621, "epoch": 1838} {"train_loss": -22.757404327392578, "global_step": 152622, "epoch": 1838} {"train_loss": -23.412511825561523, "global_step": 152623, "epoch": 1838} {"train_loss": -22.82547950744629, "global_step": 152624, "epoch": 1838} {"train_loss": -23.38522720336914, "global_step": 152625, "epoch": 1838} {"train_loss": -23.344690322875977, "global_step": 152626, "epoch": 1838} {"train_loss": -23.64873695373535, "global_step": 152627, "epoch": 1838} {"train_loss": -23.634788513183594, "global_step": 152628, "epoch": 1838} {"train_loss": -23.356199264526367, "global_step": 152629, "epoch": 1838} {"train_loss": -23.38448143005371, "global_step": 152630, "epoch": 1838} {"train_loss": -23.562288284301758, "global_step": 152631, "epoch": 1838} {"train_loss": -23.134292602539062, "global_step": 152632, "epoch": 1838} {"train_loss": -23.474258422851562, "global_step": 152633, "epoch": 1838} {"train_loss": -23.652408599853516, "global_step": 152634, "epoch": 1838} {"train_loss": -23.319921493530273, "global_step": 152635, "epoch": 1838} {"train_loss": -23.195062683289308, "global_step": 152636, "epoch": 1838, "val_loss": 6364761.0} {"train_loss": -23.219961166381836, "global_step": 152637, "epoch": 1839} {"train_loss": -23.031116485595703, "global_step": 152638, "epoch": 1839} {"train_loss": -23.186811447143555, "global_step": 152639, "epoch": 1839} {"train_loss": -23.156126022338867, "global_step": 152640, "epoch": 1839} {"train_loss": -22.947818756103516, "global_step": 152641, "epoch": 1839} {"train_loss": -23.211753845214844, "global_step": 152642, "epoch": 1839} {"train_loss": -23.21426773071289, "global_step": 152643, "epoch": 1839} {"train_loss": -23.267812728881836, "global_step": 152644, "epoch": 1839} {"train_loss": -23.456331253051758, "global_step": 152645, "epoch": 1839} {"train_loss": -23.317869186401367, "global_step": 152646, "epoch": 1839} {"train_loss": -23.46308708190918, "global_step": 152647, "epoch": 1839} {"train_loss": -23.654489517211914, "global_step": 152648, "epoch": 1839} {"train_loss": -23.211164474487305, "global_step": 152649, "epoch": 1839} {"train_loss": -23.447717666625977, "global_step": 152650, "epoch": 1839} {"train_loss": -23.0471248626709, "global_step": 152651, "epoch": 1839} {"train_loss": -23.37076187133789, "global_step": 152652, "epoch": 1839} {"train_loss": -23.573278427124023, "global_step": 152653, "epoch": 1839} {"train_loss": -23.45844841003418, "global_step": 152654, "epoch": 1839} {"train_loss": -23.35132598876953, "global_step": 152655, "epoch": 1839} {"train_loss": -23.19020652770996, "global_step": 152656, "epoch": 1839} {"train_loss": -23.523208618164062, "global_step": 152657, "epoch": 1839} {"train_loss": -23.121301651000977, "global_step": 152658, "epoch": 1839} {"train_loss": -23.699234008789062, "global_step": 152659, "epoch": 1839} {"train_loss": -23.440738677978516, "global_step": 152660, "epoch": 1839} {"train_loss": -23.539384841918945, "global_step": 152661, "epoch": 1839} {"train_loss": -23.587589263916016, "global_step": 152662, "epoch": 1839} {"train_loss": -23.38861656188965, "global_step": 152663, "epoch": 1839} {"train_loss": -23.421640396118164, "global_step": 152664, "epoch": 1839} {"train_loss": -23.524282455444336, "global_step": 152665, "epoch": 1839} {"train_loss": -23.43939781188965, "global_step": 152666, "epoch": 1839} {"train_loss": -23.51947593688965, "global_step": 152667, "epoch": 1839} {"train_loss": -23.30280303955078, "global_step": 152668, "epoch": 1839} {"train_loss": -23.24757957458496, "global_step": 152669, "epoch": 1839} {"train_loss": -23.309782028198242, "global_step": 152670, "epoch": 1839} {"train_loss": -23.87506675720215, "global_step": 152671, "epoch": 1839} {"train_loss": -23.183349609375, "global_step": 152672, "epoch": 1839} {"train_loss": -23.961515426635742, "global_step": 152673, "epoch": 1839} {"train_loss": -23.49545669555664, "global_step": 152674, "epoch": 1839} {"train_loss": -23.371000289916992, "global_step": 152675, "epoch": 1839} {"train_loss": -23.443769454956055, "global_step": 152676, "epoch": 1839} {"train_loss": -23.183128356933594, "global_step": 152677, "epoch": 1839} {"train_loss": -23.58998680114746, "global_step": 152678, "epoch": 1839} {"train_loss": -22.93412208557129, "global_step": 152679, "epoch": 1839} {"train_loss": -23.071868896484375, "global_step": 152680, "epoch": 1839} {"train_loss": -23.62457847595215, "global_step": 152681, "epoch": 1839} {"train_loss": -23.66913414001465, "global_step": 152682, "epoch": 1839} {"train_loss": -23.62177085876465, "global_step": 152683, "epoch": 1839} {"train_loss": -23.43714714050293, "global_step": 152684, "epoch": 1839} {"train_loss": -23.236906051635742, "global_step": 152685, "epoch": 1839} {"train_loss": -23.584142684936523, "global_step": 152686, "epoch": 1839} {"train_loss": -23.398941040039062, "global_step": 152687, "epoch": 1839} {"train_loss": -23.235136032104492, "global_step": 152688, "epoch": 1839} {"train_loss": -23.170942306518555, "global_step": 152689, "epoch": 1839} {"train_loss": -23.187435150146484, "global_step": 152690, "epoch": 1839} {"train_loss": -23.669666290283203, "global_step": 152691, "epoch": 1839} {"train_loss": -23.591495513916016, "global_step": 152692, "epoch": 1839} {"train_loss": -23.415973663330078, "global_step": 152693, "epoch": 1839} {"train_loss": -23.457035064697266, "global_step": 152694, "epoch": 1839} {"train_loss": -23.266597747802734, "global_step": 152695, "epoch": 1839} {"train_loss": -23.188505172729492, "global_step": 152696, "epoch": 1839} {"train_loss": -23.58935546875, "global_step": 152697, "epoch": 1839} {"train_loss": -23.450529098510742, "global_step": 152698, "epoch": 1839} {"train_loss": -23.16237449645996, "global_step": 152699, "epoch": 1839} {"train_loss": -23.722532272338867, "global_step": 152700, "epoch": 1839} {"train_loss": -23.24185562133789, "global_step": 152701, "epoch": 1839} {"train_loss": -23.45137596130371, "global_step": 152702, "epoch": 1839} {"train_loss": -23.471677780151367, "global_step": 152703, "epoch": 1839} {"train_loss": -23.421560287475586, "global_step": 152704, "epoch": 1839} {"train_loss": -23.508642196655273, "global_step": 152705, "epoch": 1839} {"train_loss": -23.319107055664062, "global_step": 152706, "epoch": 1839} {"train_loss": -23.51313591003418, "global_step": 152707, "epoch": 1839} {"train_loss": -23.478187561035156, "global_step": 152708, "epoch": 1839} {"train_loss": -23.203943252563477, "global_step": 152709, "epoch": 1839} {"train_loss": -23.678762435913086, "global_step": 152710, "epoch": 1839} {"train_loss": -23.559131622314453, "global_step": 152711, "epoch": 1839} {"train_loss": -23.331424713134766, "global_step": 152712, "epoch": 1839} {"train_loss": -23.298696517944336, "global_step": 152713, "epoch": 1839} {"train_loss": -23.32588768005371, "global_step": 152714, "epoch": 1839} {"train_loss": -23.235116958618164, "global_step": 152715, "epoch": 1839} {"train_loss": -23.39072036743164, "global_step": 152716, "epoch": 1839} {"train_loss": -23.3552188873291, "global_step": 152717, "epoch": 1839} {"train_loss": -23.386722564697266, "global_step": 152718, "epoch": 1839} {"train_loss": -23.39714932728963, "global_step": 152719, "epoch": 1839, "val_loss": 6310156.0} {"train_loss": -23.290603637695312, "global_step": 152720, "epoch": 1840} {"train_loss": -22.6799373626709, "global_step": 152721, "epoch": 1840} {"train_loss": -23.329069137573242, "global_step": 152722, "epoch": 1840} {"train_loss": -23.262378692626953, "global_step": 152723, "epoch": 1840} {"train_loss": -23.044424057006836, "global_step": 152724, "epoch": 1840} {"train_loss": -23.009374618530273, "global_step": 152725, "epoch": 1840} {"train_loss": -22.792932510375977, "global_step": 152726, "epoch": 1840} {"train_loss": -22.978351593017578, "global_step": 152727, "epoch": 1840} {"train_loss": -23.303375244140625, "global_step": 152728, "epoch": 1840} {"train_loss": -23.240381240844727, "global_step": 152729, "epoch": 1840} {"train_loss": -23.270551681518555, "global_step": 152730, "epoch": 1840} {"train_loss": -23.152944564819336, "global_step": 152731, "epoch": 1840} {"train_loss": -23.504770278930664, "global_step": 152732, "epoch": 1840} {"train_loss": -23.754812240600586, "global_step": 152733, "epoch": 1840} {"train_loss": -23.196348190307617, "global_step": 152734, "epoch": 1840} {"train_loss": -22.73601722717285, "global_step": 152735, "epoch": 1840} {"train_loss": -23.488733291625977, "global_step": 152736, "epoch": 1840} {"train_loss": -23.016569137573242, "global_step": 152737, "epoch": 1840} {"train_loss": -22.836606979370117, "global_step": 152738, "epoch": 1840} {"train_loss": -23.4981689453125, "global_step": 152739, "epoch": 1840} {"train_loss": -23.191116333007812, "global_step": 152740, "epoch": 1840} {"train_loss": -23.022287368774414, "global_step": 152741, "epoch": 1840} {"train_loss": -23.51102066040039, "global_step": 152742, "epoch": 1840} {"train_loss": -22.893415451049805, "global_step": 152743, "epoch": 1840} {"train_loss": -23.502973556518555, "global_step": 152744, "epoch": 1840} {"train_loss": -23.705307006835938, "global_step": 152745, "epoch": 1840} {"train_loss": -23.0925350189209, "global_step": 152746, "epoch": 1840} {"train_loss": -23.239017486572266, "global_step": 152747, "epoch": 1840} {"train_loss": -23.252452850341797, "global_step": 152748, "epoch": 1840} {"train_loss": -23.287870407104492, "global_step": 152749, "epoch": 1840} {"train_loss": -23.309354782104492, "global_step": 152750, "epoch": 1840} {"train_loss": -23.36189842224121, "global_step": 152751, "epoch": 1840} {"train_loss": -23.171955108642578, "global_step": 152752, "epoch": 1840} {"train_loss": -23.025543212890625, "global_step": 152753, "epoch": 1840} {"train_loss": -23.405155181884766, "global_step": 152754, "epoch": 1840} {"train_loss": -23.563777923583984, "global_step": 152755, "epoch": 1840} {"train_loss": -22.953292846679688, "global_step": 152756, "epoch": 1840} {"train_loss": -23.415695190429688, "global_step": 152757, "epoch": 1840} {"train_loss": -23.20436668395996, "global_step": 152758, "epoch": 1840} {"train_loss": -23.633779525756836, "global_step": 152759, "epoch": 1840} {"train_loss": -23.145580291748047, "global_step": 152760, "epoch": 1840} {"train_loss": -23.352643966674805, "global_step": 152761, "epoch": 1840} {"train_loss": -22.85240364074707, "global_step": 152762, "epoch": 1840} {"train_loss": -23.47300910949707, "global_step": 152763, "epoch": 1840} {"train_loss": -23.236711502075195, "global_step": 152764, "epoch": 1840} {"train_loss": -23.2736759185791, "global_step": 152765, "epoch": 1840} {"train_loss": -23.75326919555664, "global_step": 152766, "epoch": 1840} {"train_loss": -23.448036193847656, "global_step": 152767, "epoch": 1840} {"train_loss": -23.664539337158203, "global_step": 152768, "epoch": 1840} {"train_loss": -23.4466609954834, "global_step": 152769, "epoch": 1840} {"train_loss": -23.49493980407715, "global_step": 152770, "epoch": 1840} {"train_loss": -23.479969024658203, "global_step": 152771, "epoch": 1840} {"train_loss": -23.33116340637207, "global_step": 152772, "epoch": 1840} {"train_loss": -23.293201446533203, "global_step": 152773, "epoch": 1840} {"train_loss": -23.404193878173828, "global_step": 152774, "epoch": 1840} {"train_loss": -23.486852645874023, "global_step": 152775, "epoch": 1840} {"train_loss": -23.00498390197754, "global_step": 152776, "epoch": 1840} {"train_loss": -23.147071838378906, "global_step": 152777, "epoch": 1840} {"train_loss": -23.71476173400879, "global_step": 152778, "epoch": 1840} {"train_loss": -23.001893997192383, "global_step": 152779, "epoch": 1840} {"train_loss": -23.17200469970703, "global_step": 152780, "epoch": 1840} {"train_loss": -23.637678146362305, "global_step": 152781, "epoch": 1840} {"train_loss": -23.28242301940918, "global_step": 152782, "epoch": 1840} {"train_loss": -22.849674224853516, "global_step": 152783, "epoch": 1840} {"train_loss": -23.089452743530273, "global_step": 152784, "epoch": 1840} {"train_loss": -23.14931297302246, "global_step": 152785, "epoch": 1840} {"train_loss": -23.251386642456055, "global_step": 152786, "epoch": 1840} {"train_loss": -22.552526473999023, "global_step": 152787, "epoch": 1840} {"train_loss": -23.236692428588867, "global_step": 152788, "epoch": 1840} {"train_loss": -23.047882080078125, "global_step": 152789, "epoch": 1840} {"train_loss": -22.984159469604492, "global_step": 152790, "epoch": 1840} {"train_loss": -23.032245635986328, "global_step": 152791, "epoch": 1840} {"train_loss": -23.354366302490234, "global_step": 152792, "epoch": 1840} {"train_loss": -23.21486473083496, "global_step": 152793, "epoch": 1840} {"train_loss": -22.98111343383789, "global_step": 152794, "epoch": 1840} {"train_loss": -23.00786781311035, "global_step": 152795, "epoch": 1840} {"train_loss": -23.49329948425293, "global_step": 152796, "epoch": 1840} {"train_loss": -23.40205955505371, "global_step": 152797, "epoch": 1840} {"train_loss": -22.958206176757812, "global_step": 152798, "epoch": 1840} {"train_loss": -23.051992416381836, "global_step": 152799, "epoch": 1840} {"train_loss": -23.39398765563965, "global_step": 152800, "epoch": 1840} {"train_loss": -23.628652572631836, "global_step": 152801, "epoch": 1840} {"train_loss": -23.230547502816442, "global_step": 152802, "epoch": 1840, "val_loss": 6238211.0} {"train_loss": -23.26365852355957, "global_step": 152803, "epoch": 1841} {"train_loss": -22.858495712280273, "global_step": 152804, "epoch": 1841} {"train_loss": -22.804977416992188, "global_step": 152805, "epoch": 1841} {"train_loss": -23.25710105895996, "global_step": 152806, "epoch": 1841} {"train_loss": -22.938642501831055, "global_step": 152807, "epoch": 1841} {"train_loss": -23.44868278503418, "global_step": 152808, "epoch": 1841} {"train_loss": -23.087711334228516, "global_step": 152809, "epoch": 1841} {"train_loss": -22.732501983642578, "global_step": 152810, "epoch": 1841} {"train_loss": -22.955881118774414, "global_step": 152811, "epoch": 1841} {"train_loss": -22.716426849365234, "global_step": 152812, "epoch": 1841} {"train_loss": -23.541929244995117, "global_step": 152813, "epoch": 1841} {"train_loss": -23.370656967163086, "global_step": 152814, "epoch": 1841} {"train_loss": -22.708688735961914, "global_step": 152815, "epoch": 1841} {"train_loss": -23.371076583862305, "global_step": 152816, "epoch": 1841} {"train_loss": -22.936330795288086, "global_step": 152817, "epoch": 1841} {"train_loss": -23.377151489257812, "global_step": 152818, "epoch": 1841} {"train_loss": -23.376449584960938, "global_step": 152819, "epoch": 1841} {"train_loss": -23.131540298461914, "global_step": 152820, "epoch": 1841} {"train_loss": -23.056838989257812, "global_step": 152821, "epoch": 1841} {"train_loss": -23.285724639892578, "global_step": 152822, "epoch": 1841} {"train_loss": -23.254159927368164, "global_step": 152823, "epoch": 1841} {"train_loss": -23.009565353393555, "global_step": 152824, "epoch": 1841} {"train_loss": -23.566543579101562, "global_step": 152825, "epoch": 1841} {"train_loss": -22.822439193725586, "global_step": 152826, "epoch": 1841} {"train_loss": -22.857208251953125, "global_step": 152827, "epoch": 1841} {"train_loss": -23.378509521484375, "global_step": 152828, "epoch": 1841} {"train_loss": -23.582395553588867, "global_step": 152829, "epoch": 1841} {"train_loss": -23.544986724853516, "global_step": 152830, "epoch": 1841} {"train_loss": -23.293676376342773, "global_step": 152831, "epoch": 1841} {"train_loss": -23.281692504882812, "global_step": 152832, "epoch": 1841} {"train_loss": -23.442411422729492, "global_step": 152833, "epoch": 1841} {"train_loss": -23.023151397705078, "global_step": 152834, "epoch": 1841} {"train_loss": -23.30394172668457, "global_step": 152835, "epoch": 1841} {"train_loss": -23.658863067626953, "global_step": 152836, "epoch": 1841} {"train_loss": -23.207569122314453, "global_step": 152837, "epoch": 1841} {"train_loss": -23.25046157836914, "global_step": 152838, "epoch": 1841} {"train_loss": -23.397695541381836, "global_step": 152839, "epoch": 1841} {"train_loss": -23.255035400390625, "global_step": 152840, "epoch": 1841} {"train_loss": -23.336774826049805, "global_step": 152841, "epoch": 1841} {"train_loss": -23.672935485839844, "global_step": 152842, "epoch": 1841} {"train_loss": -23.224205017089844, "global_step": 152843, "epoch": 1841} {"train_loss": -23.191295623779297, "global_step": 152844, "epoch": 1841} {"train_loss": -23.0985107421875, "global_step": 152845, "epoch": 1841} {"train_loss": -23.359556198120117, "global_step": 152846, "epoch": 1841} {"train_loss": -23.194290161132812, "global_step": 152847, "epoch": 1841} {"train_loss": -23.438833236694336, "global_step": 152848, "epoch": 1841} {"train_loss": -23.216142654418945, "global_step": 152849, "epoch": 1841} {"train_loss": -23.159849166870117, "global_step": 152850, "epoch": 1841} {"train_loss": -23.461984634399414, "global_step": 152851, "epoch": 1841} {"train_loss": -23.196109771728516, "global_step": 152852, "epoch": 1841} {"train_loss": -23.41437530517578, "global_step": 152853, "epoch": 1841} {"train_loss": -23.425912857055664, "global_step": 152854, "epoch": 1841} {"train_loss": -23.710920333862305, "global_step": 152855, "epoch": 1841} {"train_loss": -23.227933883666992, "global_step": 152856, "epoch": 1841} {"train_loss": -23.300607681274414, "global_step": 152857, "epoch": 1841} {"train_loss": -23.5389404296875, "global_step": 152858, "epoch": 1841} {"train_loss": -23.81000328063965, "global_step": 152859, "epoch": 1841} {"train_loss": -23.360620498657227, "global_step": 152860, "epoch": 1841} {"train_loss": -23.286596298217773, "global_step": 152861, "epoch": 1841} {"train_loss": -23.579490661621094, "global_step": 152862, "epoch": 1841} {"train_loss": -23.780561447143555, "global_step": 152863, "epoch": 1841} {"train_loss": -23.34152603149414, "global_step": 152864, "epoch": 1841} {"train_loss": -23.539249420166016, "global_step": 152865, "epoch": 1841} {"train_loss": -23.374107360839844, "global_step": 152866, "epoch": 1841} {"train_loss": -23.250436782836914, "global_step": 152867, "epoch": 1841} {"train_loss": -23.427528381347656, "global_step": 152868, "epoch": 1841} {"train_loss": -23.715438842773438, "global_step": 152869, "epoch": 1841} {"train_loss": -23.14015769958496, "global_step": 152870, "epoch": 1841} {"train_loss": -23.1173095703125, "global_step": 152871, "epoch": 1841} {"train_loss": -23.6055965423584, "global_step": 152872, "epoch": 1841} {"train_loss": -23.63857650756836, "global_step": 152873, "epoch": 1841} {"train_loss": -23.621383666992188, "global_step": 152874, "epoch": 1841} {"train_loss": -23.394224166870117, "global_step": 152875, "epoch": 1841} {"train_loss": -23.230297088623047, "global_step": 152876, "epoch": 1841} {"train_loss": -23.612342834472656, "global_step": 152877, "epoch": 1841} {"train_loss": -23.460323333740234, "global_step": 152878, "epoch": 1841} {"train_loss": -23.48732566833496, "global_step": 152879, "epoch": 1841} {"train_loss": -23.29183006286621, "global_step": 152880, "epoch": 1841} {"train_loss": -23.381792068481445, "global_step": 152881, "epoch": 1841} {"train_loss": -23.478443145751953, "global_step": 152882, "epoch": 1841} {"train_loss": -23.63523292541504, "global_step": 152883, "epoch": 1841} {"train_loss": -23.33640480041504, "global_step": 152884, "epoch": 1841} {"train_loss": -23.31894348328372, "global_step": 152885, "epoch": 1841, "val_loss": 6458288.5} {"train_loss": -21.567026138305664, "global_step": 152886, "epoch": 1842} {"train_loss": -19.846790313720703, "global_step": 152887, "epoch": 1842} {"train_loss": -23.180086135864258, "global_step": 152888, "epoch": 1842} {"train_loss": -22.420169830322266, "global_step": 152889, "epoch": 1842} {"train_loss": -22.495880126953125, "global_step": 152890, "epoch": 1842} {"train_loss": -22.917333602905273, "global_step": 152891, "epoch": 1842} {"train_loss": -22.63555335998535, "global_step": 152892, "epoch": 1842} {"train_loss": -22.563262939453125, "global_step": 152893, "epoch": 1842} {"train_loss": -22.798511505126953, "global_step": 152894, "epoch": 1842} {"train_loss": -22.81312370300293, "global_step": 152895, "epoch": 1842} {"train_loss": -22.805757522583008, "global_step": 152896, "epoch": 1842} {"train_loss": -23.006832122802734, "global_step": 152897, "epoch": 1842} {"train_loss": -22.11208152770996, "global_step": 152898, "epoch": 1842} {"train_loss": -22.784940719604492, "global_step": 152899, "epoch": 1842} {"train_loss": -22.829984664916992, "global_step": 152900, "epoch": 1842} {"train_loss": -22.895780563354492, "global_step": 152901, "epoch": 1842} {"train_loss": -22.927616119384766, "global_step": 152902, "epoch": 1842} {"train_loss": -22.894800186157227, "global_step": 152903, "epoch": 1842} {"train_loss": -23.122825622558594, "global_step": 152904, "epoch": 1842} {"train_loss": -23.123302459716797, "global_step": 152905, "epoch": 1842} {"train_loss": -23.05327796936035, "global_step": 152906, "epoch": 1842} {"train_loss": -23.224876403808594, "global_step": 152907, "epoch": 1842} {"train_loss": -22.800506591796875, "global_step": 152908, "epoch": 1842} {"train_loss": -23.15592384338379, "global_step": 152909, "epoch": 1842} {"train_loss": -23.68393325805664, "global_step": 152910, "epoch": 1842} {"train_loss": -23.199132919311523, "global_step": 152911, "epoch": 1842} {"train_loss": -23.223854064941406, "global_step": 152912, "epoch": 1842} {"train_loss": -23.270620346069336, "global_step": 152913, "epoch": 1842} {"train_loss": -23.269210815429688, "global_step": 152914, "epoch": 1842} {"train_loss": -23.391740798950195, "global_step": 152915, "epoch": 1842} {"train_loss": -22.983570098876953, "global_step": 152916, "epoch": 1842} {"train_loss": -23.256423950195312, "global_step": 152917, "epoch": 1842} {"train_loss": -23.466873168945312, "global_step": 152918, "epoch": 1842} {"train_loss": -23.289081573486328, "global_step": 152919, "epoch": 1842} {"train_loss": -23.370376586914062, "global_step": 152920, "epoch": 1842} {"train_loss": -23.759153366088867, "global_step": 152921, "epoch": 1842} {"train_loss": -23.255359649658203, "global_step": 152922, "epoch": 1842} {"train_loss": -23.443470001220703, "global_step": 152923, "epoch": 1842} {"train_loss": -23.259033203125, "global_step": 152924, "epoch": 1842} {"train_loss": -23.725427627563477, "global_step": 152925, "epoch": 1842} {"train_loss": -23.07321548461914, "global_step": 152926, "epoch": 1842} {"train_loss": -23.312240600585938, "global_step": 152927, "epoch": 1842} {"train_loss": -23.10618019104004, "global_step": 152928, "epoch": 1842} {"train_loss": -23.693866729736328, "global_step": 152929, "epoch": 1842} {"train_loss": -23.513364791870117, "global_step": 152930, "epoch": 1842} {"train_loss": -23.3147029876709, "global_step": 152931, "epoch": 1842} {"train_loss": -23.35736656188965, "global_step": 152932, "epoch": 1842} {"train_loss": -23.692235946655273, "global_step": 152933, "epoch": 1842} {"train_loss": -23.638065338134766, "global_step": 152934, "epoch": 1842} {"train_loss": -23.4184627532959, "global_step": 152935, "epoch": 1842} {"train_loss": -23.912626266479492, "global_step": 152936, "epoch": 1842} {"train_loss": -23.60793113708496, "global_step": 152937, "epoch": 1842} {"train_loss": -23.04281997680664, "global_step": 152938, "epoch": 1842} {"train_loss": -23.29402732849121, "global_step": 152939, "epoch": 1842} {"train_loss": -23.216543197631836, "global_step": 152940, "epoch": 1842} {"train_loss": -23.35955238342285, "global_step": 152941, "epoch": 1842} {"train_loss": -23.721603393554688, "global_step": 152942, "epoch": 1842} {"train_loss": -23.621898651123047, "global_step": 152943, "epoch": 1842} {"train_loss": -23.6214542388916, "global_step": 152944, "epoch": 1842} {"train_loss": -23.621660232543945, "global_step": 152945, "epoch": 1842} {"train_loss": -23.30838966369629, "global_step": 152946, "epoch": 1842} {"train_loss": -23.14324378967285, "global_step": 152947, "epoch": 1842} {"train_loss": -23.36173439025879, "global_step": 152948, "epoch": 1842} {"train_loss": -23.22983741760254, "global_step": 152949, "epoch": 1842} {"train_loss": -23.266647338867188, "global_step": 152950, "epoch": 1842} {"train_loss": -22.95131492614746, "global_step": 152951, "epoch": 1842} {"train_loss": -23.069564819335938, "global_step": 152952, "epoch": 1842} {"train_loss": -22.864171981811523, "global_step": 152953, "epoch": 1842} {"train_loss": -23.32647705078125, "global_step": 152954, "epoch": 1842} {"train_loss": -23.067846298217773, "global_step": 152955, "epoch": 1842} {"train_loss": -23.299558639526367, "global_step": 152956, "epoch": 1842} {"train_loss": -23.667325973510742, "global_step": 152957, "epoch": 1842} {"train_loss": -23.208248138427734, "global_step": 152958, "epoch": 1842} {"train_loss": -23.23973274230957, "global_step": 152959, "epoch": 1842} {"train_loss": -23.422870635986328, "global_step": 152960, "epoch": 1842} {"train_loss": -22.565326690673828, "global_step": 152961, "epoch": 1842} {"train_loss": -23.443632125854492, "global_step": 152962, "epoch": 1842} {"train_loss": -23.06690788269043, "global_step": 152963, "epoch": 1842} {"train_loss": -22.881671905517578, "global_step": 152964, "epoch": 1842} {"train_loss": -23.461597442626953, "global_step": 152965, "epoch": 1842} {"train_loss": -23.0083065032959, "global_step": 152966, "epoch": 1842} {"train_loss": -23.2539119720459, "global_step": 152967, "epoch": 1842} {"train_loss": -23.126314530889672, "global_step": 152968, "epoch": 1842, "val_loss": 6475751.0} {"train_loss": -22.97737693786621, "global_step": 152969, "epoch": 1843} {"train_loss": -23.148874282836914, "global_step": 152970, "epoch": 1843} {"train_loss": -22.85635757446289, "global_step": 152971, "epoch": 1843} {"train_loss": -23.07515525817871, "global_step": 152972, "epoch": 1843} {"train_loss": -22.79915428161621, "global_step": 152973, "epoch": 1843} {"train_loss": -22.85369873046875, "global_step": 152974, "epoch": 1843} {"train_loss": -22.97441291809082, "global_step": 152975, "epoch": 1843} {"train_loss": -22.880626678466797, "global_step": 152976, "epoch": 1843} {"train_loss": -23.23080825805664, "global_step": 152977, "epoch": 1843} {"train_loss": -23.31141471862793, "global_step": 152978, "epoch": 1843} {"train_loss": -22.971479415893555, "global_step": 152979, "epoch": 1843} {"train_loss": -23.036558151245117, "global_step": 152980, "epoch": 1843} {"train_loss": -23.056446075439453, "global_step": 152981, "epoch": 1843} {"train_loss": -23.14193344116211, "global_step": 152982, "epoch": 1843} {"train_loss": -23.42013931274414, "global_step": 152983, "epoch": 1843} {"train_loss": -23.43086814880371, "global_step": 152984, "epoch": 1843} {"train_loss": -23.577627182006836, "global_step": 152985, "epoch": 1843} {"train_loss": -23.330093383789062, "global_step": 152986, "epoch": 1843} {"train_loss": -23.37862205505371, "global_step": 152987, "epoch": 1843} {"train_loss": -23.24587059020996, "global_step": 152988, "epoch": 1843} {"train_loss": -23.138547897338867, "global_step": 152989, "epoch": 1843} {"train_loss": -23.137508392333984, "global_step": 152990, "epoch": 1843} {"train_loss": -23.105722427368164, "global_step": 152991, "epoch": 1843} {"train_loss": -22.942373275756836, "global_step": 152992, "epoch": 1843} {"train_loss": -23.39888572692871, "global_step": 152993, "epoch": 1843} {"train_loss": -23.55678939819336, "global_step": 152994, "epoch": 1843} {"train_loss": -23.14385223388672, "global_step": 152995, "epoch": 1843} {"train_loss": -23.539011001586914, "global_step": 152996, "epoch": 1843} {"train_loss": -23.29593276977539, "global_step": 152997, "epoch": 1843} {"train_loss": -23.291746139526367, "global_step": 152998, "epoch": 1843} {"train_loss": -23.175439834594727, "global_step": 152999, "epoch": 1843} {"train_loss": -23.488727569580078, "global_step": 153000, "epoch": 1843} {"train_loss": -23.5699520111084, "global_step": 153001, "epoch": 1843} {"train_loss": -23.543231964111328, "global_step": 153002, "epoch": 1843} {"train_loss": -23.648954391479492, "global_step": 153003, "epoch": 1843} {"train_loss": -23.647016525268555, "global_step": 153004, "epoch": 1843} {"train_loss": -23.5047550201416, "global_step": 153005, "epoch": 1843} {"train_loss": -23.236658096313477, "global_step": 153006, "epoch": 1843} {"train_loss": -23.44318199157715, "global_step": 153007, "epoch": 1843} {"train_loss": -23.194324493408203, "global_step": 153008, "epoch": 1843} {"train_loss": -23.382455825805664, "global_step": 153009, "epoch": 1843} {"train_loss": -23.135324478149414, "global_step": 153010, "epoch": 1843} {"train_loss": -22.992755889892578, "global_step": 153011, "epoch": 1843} {"train_loss": -23.493879318237305, "global_step": 153012, "epoch": 1843} {"train_loss": -23.45728874206543, "global_step": 153013, "epoch": 1843} {"train_loss": -23.389150619506836, "global_step": 153014, "epoch": 1843} {"train_loss": -23.392858505249023, "global_step": 153015, "epoch": 1843} {"train_loss": -23.170629501342773, "global_step": 153016, "epoch": 1843} {"train_loss": -23.407758712768555, "global_step": 153017, "epoch": 1843} {"train_loss": -23.610198974609375, "global_step": 153018, "epoch": 1843} {"train_loss": -23.189041137695312, "global_step": 153019, "epoch": 1843} {"train_loss": -23.8625431060791, "global_step": 153020, "epoch": 1843} {"train_loss": -23.481067657470703, "global_step": 153021, "epoch": 1843} {"train_loss": -23.174936294555664, "global_step": 153022, "epoch": 1843} {"train_loss": -23.256635665893555, "global_step": 153023, "epoch": 1843} {"train_loss": -23.461973190307617, "global_step": 153024, "epoch": 1843} {"train_loss": -23.44432830810547, "global_step": 153025, "epoch": 1843} {"train_loss": -23.00178337097168, "global_step": 153026, "epoch": 1843} {"train_loss": -23.331350326538086, "global_step": 153027, "epoch": 1843} {"train_loss": -23.100385665893555, "global_step": 153028, "epoch": 1843} {"train_loss": -23.39191246032715, "global_step": 153029, "epoch": 1843} {"train_loss": -23.14175033569336, "global_step": 153030, "epoch": 1843} {"train_loss": -23.383882522583008, "global_step": 153031, "epoch": 1843} {"train_loss": -23.08578872680664, "global_step": 153032, "epoch": 1843} {"train_loss": -23.587072372436523, "global_step": 153033, "epoch": 1843} {"train_loss": -23.168109893798828, "global_step": 153034, "epoch": 1843} {"train_loss": -22.93406105041504, "global_step": 153035, "epoch": 1843} {"train_loss": -22.823747634887695, "global_step": 153036, "epoch": 1843} {"train_loss": -23.088315963745117, "global_step": 153037, "epoch": 1843} {"train_loss": -23.127256393432617, "global_step": 153038, "epoch": 1843} {"train_loss": -22.998594284057617, "global_step": 153039, "epoch": 1843} {"train_loss": -23.372331619262695, "global_step": 153040, "epoch": 1843} {"train_loss": -23.426273345947266, "global_step": 153041, "epoch": 1843} {"train_loss": -23.353601455688477, "global_step": 153042, "epoch": 1843} {"train_loss": -23.057804107666016, "global_step": 153043, "epoch": 1843} {"train_loss": -23.384187698364258, "global_step": 153044, "epoch": 1843} {"train_loss": -23.406478881835938, "global_step": 153045, "epoch": 1843} {"train_loss": -23.121145248413086, "global_step": 153046, "epoch": 1843} {"train_loss": -23.257352828979492, "global_step": 153047, "epoch": 1843} {"train_loss": -23.3703556060791, "global_step": 153048, "epoch": 1843} {"train_loss": -23.646127700805664, "global_step": 153049, "epoch": 1843} {"train_loss": -23.210527420043945, "global_step": 153050, "epoch": 1843} {"train_loss": -23.26606543667345, "global_step": 153051, "epoch": 1843, "val_loss": 6425368.0} {"train_loss": -23.010818481445312, "global_step": 153052, "epoch": 1844} {"train_loss": -22.833892822265625, "global_step": 153053, "epoch": 1844} {"train_loss": -23.038211822509766, "global_step": 153054, "epoch": 1844} {"train_loss": -22.83222007751465, "global_step": 153055, "epoch": 1844} {"train_loss": -22.975927352905273, "global_step": 153056, "epoch": 1844} {"train_loss": -22.950590133666992, "global_step": 153057, "epoch": 1844} {"train_loss": -22.6762638092041, "global_step": 153058, "epoch": 1844} {"train_loss": -22.769546508789062, "global_step": 153059, "epoch": 1844} {"train_loss": -23.13117790222168, "global_step": 153060, "epoch": 1844} {"train_loss": -22.968175888061523, "global_step": 153061, "epoch": 1844} {"train_loss": -23.040300369262695, "global_step": 153062, "epoch": 1844} {"train_loss": -22.520483016967773, "global_step": 153063, "epoch": 1844} {"train_loss": -23.2249698638916, "global_step": 153064, "epoch": 1844} {"train_loss": -23.076427459716797, "global_step": 153065, "epoch": 1844} {"train_loss": -23.544986724853516, "global_step": 153066, "epoch": 1844} {"train_loss": -22.884740829467773, "global_step": 153067, "epoch": 1844} {"train_loss": -23.435028076171875, "global_step": 153068, "epoch": 1844} {"train_loss": -22.939495086669922, "global_step": 153069, "epoch": 1844} {"train_loss": -22.873315811157227, "global_step": 153070, "epoch": 1844} {"train_loss": -22.753732681274414, "global_step": 153071, "epoch": 1844} {"train_loss": -23.503751754760742, "global_step": 153072, "epoch": 1844} {"train_loss": -22.55215835571289, "global_step": 153073, "epoch": 1844} {"train_loss": -23.32453727722168, "global_step": 153074, "epoch": 1844} {"train_loss": -23.153284072875977, "global_step": 153075, "epoch": 1844} {"train_loss": -23.260242462158203, "global_step": 153076, "epoch": 1844} {"train_loss": -23.509244918823242, "global_step": 153077, "epoch": 1844} {"train_loss": -23.198686599731445, "global_step": 153078, "epoch": 1844} {"train_loss": -23.080692291259766, "global_step": 153079, "epoch": 1844} {"train_loss": -23.422792434692383, "global_step": 153080, "epoch": 1844} {"train_loss": -23.546260833740234, "global_step": 153081, "epoch": 1844} {"train_loss": -23.597990036010742, "global_step": 153082, "epoch": 1844} {"train_loss": -23.050121307373047, "global_step": 153083, "epoch": 1844} {"train_loss": -22.9348087310791, "global_step": 153084, "epoch": 1844} {"train_loss": -23.2414608001709, "global_step": 153085, "epoch": 1844} {"train_loss": -23.59283447265625, "global_step": 153086, "epoch": 1844} {"train_loss": -23.066259384155273, "global_step": 153087, "epoch": 1844} {"train_loss": -23.325536727905273, "global_step": 153088, "epoch": 1844} {"train_loss": -23.03717613220215, "global_step": 153089, "epoch": 1844} {"train_loss": -23.512434005737305, "global_step": 153090, "epoch": 1844} {"train_loss": -23.186920166015625, "global_step": 153091, "epoch": 1844} {"train_loss": -23.289474487304688, "global_step": 153092, "epoch": 1844} {"train_loss": -23.2002010345459, "global_step": 153093, "epoch": 1844} {"train_loss": -23.260080337524414, "global_step": 153094, "epoch": 1844} {"train_loss": -23.737333297729492, "global_step": 153095, "epoch": 1844} {"train_loss": -23.535200119018555, "global_step": 153096, "epoch": 1844} {"train_loss": -23.20918846130371, "global_step": 153097, "epoch": 1844} {"train_loss": -22.867979049682617, "global_step": 153098, "epoch": 1844} {"train_loss": -23.120532989501953, "global_step": 153099, "epoch": 1844} {"train_loss": -23.390493392944336, "global_step": 153100, "epoch": 1844} {"train_loss": -23.254350662231445, "global_step": 153101, "epoch": 1844} {"train_loss": -22.989988327026367, "global_step": 153102, "epoch": 1844} {"train_loss": -23.41958236694336, "global_step": 153103, "epoch": 1844} {"train_loss": -23.22458267211914, "global_step": 153104, "epoch": 1844} {"train_loss": -23.005918502807617, "global_step": 153105, "epoch": 1844} {"train_loss": -23.258256912231445, "global_step": 153106, "epoch": 1844} {"train_loss": -23.545156478881836, "global_step": 153107, "epoch": 1844} {"train_loss": -23.11669158935547, "global_step": 153108, "epoch": 1844} {"train_loss": -23.41345977783203, "global_step": 153109, "epoch": 1844} {"train_loss": -23.666152954101562, "global_step": 153110, "epoch": 1844} {"train_loss": -23.30785369873047, "global_step": 153111, "epoch": 1844} {"train_loss": -23.193479537963867, "global_step": 153112, "epoch": 1844} {"train_loss": -23.61847686767578, "global_step": 153113, "epoch": 1844} {"train_loss": -23.253786087036133, "global_step": 153114, "epoch": 1844} {"train_loss": -23.692113876342773, "global_step": 153115, "epoch": 1844} {"train_loss": -23.119152069091797, "global_step": 153116, "epoch": 1844} {"train_loss": -23.48163414001465, "global_step": 153117, "epoch": 1844} {"train_loss": -23.46291160583496, "global_step": 153118, "epoch": 1844} {"train_loss": -23.299673080444336, "global_step": 153119, "epoch": 1844} {"train_loss": -23.419464111328125, "global_step": 153120, "epoch": 1844} {"train_loss": -23.582815170288086, "global_step": 153121, "epoch": 1844} {"train_loss": -23.385618209838867, "global_step": 153122, "epoch": 1844} {"train_loss": -23.384098052978516, "global_step": 153123, "epoch": 1844} {"train_loss": -23.23158836364746, "global_step": 153124, "epoch": 1844} {"train_loss": -23.03676414489746, "global_step": 153125, "epoch": 1844} {"train_loss": -22.9329833984375, "global_step": 153126, "epoch": 1844} {"train_loss": -23.434635162353516, "global_step": 153127, "epoch": 1844} {"train_loss": -23.36348533630371, "global_step": 153128, "epoch": 1844} {"train_loss": -22.954830169677734, "global_step": 153129, "epoch": 1844} {"train_loss": -23.409427642822266, "global_step": 153130, "epoch": 1844} {"train_loss": -23.027545928955078, "global_step": 153131, "epoch": 1844} {"train_loss": -23.27296257019043, "global_step": 153132, "epoch": 1844} {"train_loss": -23.371152877807617, "global_step": 153133, "epoch": 1844} {"train_loss": -23.21875303337373, "global_step": 153134, "epoch": 1844, "val_loss": 6311856.0} {"train_loss": -23.523679733276367, "global_step": 153135, "epoch": 1845} {"train_loss": -23.199234008789062, "global_step": 153136, "epoch": 1845} {"train_loss": -22.985563278198242, "global_step": 153137, "epoch": 1845} {"train_loss": -23.272573471069336, "global_step": 153138, "epoch": 1845} {"train_loss": -23.280332565307617, "global_step": 153139, "epoch": 1845} {"train_loss": -23.002105712890625, "global_step": 153140, "epoch": 1845} {"train_loss": -23.1138973236084, "global_step": 153141, "epoch": 1845} {"train_loss": -22.994247436523438, "global_step": 153142, "epoch": 1845} {"train_loss": -22.942550659179688, "global_step": 153143, "epoch": 1845} {"train_loss": -23.163137435913086, "global_step": 153144, "epoch": 1845} {"train_loss": -23.238872528076172, "global_step": 153145, "epoch": 1845} {"train_loss": -23.358739852905273, "global_step": 153146, "epoch": 1845} {"train_loss": -23.351545333862305, "global_step": 153147, "epoch": 1845} {"train_loss": -23.001699447631836, "global_step": 153148, "epoch": 1845} {"train_loss": -23.577829360961914, "global_step": 153149, "epoch": 1845} {"train_loss": -23.431150436401367, "global_step": 153150, "epoch": 1845} {"train_loss": -23.1173095703125, "global_step": 153151, "epoch": 1845} {"train_loss": -23.234405517578125, "global_step": 153152, "epoch": 1845} {"train_loss": -23.34309196472168, "global_step": 153153, "epoch": 1845} {"train_loss": -23.534271240234375, "global_step": 153154, "epoch": 1845} {"train_loss": -23.51850700378418, "global_step": 153155, "epoch": 1845} {"train_loss": -23.34918212890625, "global_step": 153156, "epoch": 1845} {"train_loss": -23.577163696289062, "global_step": 153157, "epoch": 1845} {"train_loss": -23.55628776550293, "global_step": 153158, "epoch": 1845} {"train_loss": -23.241355895996094, "global_step": 153159, "epoch": 1845} {"train_loss": -23.390859603881836, "global_step": 153160, "epoch": 1845} {"train_loss": -22.929290771484375, "global_step": 153161, "epoch": 1845} {"train_loss": -22.88324546813965, "global_step": 153162, "epoch": 1845} {"train_loss": -23.192428588867188, "global_step": 153163, "epoch": 1845} {"train_loss": -23.51934051513672, "global_step": 153164, "epoch": 1845} {"train_loss": -23.41818618774414, "global_step": 153165, "epoch": 1845} {"train_loss": -23.73914337158203, "global_step": 153166, "epoch": 1845} {"train_loss": -23.234542846679688, "global_step": 153167, "epoch": 1845} {"train_loss": -23.747602462768555, "global_step": 153168, "epoch": 1845} {"train_loss": -23.318937301635742, "global_step": 153169, "epoch": 1845} {"train_loss": -23.149328231811523, "global_step": 153170, "epoch": 1845} {"train_loss": -23.5136775970459, "global_step": 153171, "epoch": 1845} {"train_loss": -23.34683609008789, "global_step": 153172, "epoch": 1845} {"train_loss": -23.068418502807617, "global_step": 153173, "epoch": 1845} {"train_loss": -23.66008758544922, "global_step": 153174, "epoch": 1845} {"train_loss": -23.719226837158203, "global_step": 153175, "epoch": 1845} {"train_loss": -23.523906707763672, "global_step": 153176, "epoch": 1845} {"train_loss": -23.35436248779297, "global_step": 153177, "epoch": 1845} {"train_loss": -23.732187271118164, "global_step": 153178, "epoch": 1845} {"train_loss": -23.570592880249023, "global_step": 153179, "epoch": 1845} {"train_loss": -23.216014862060547, "global_step": 153180, "epoch": 1845} {"train_loss": -23.203998565673828, "global_step": 153181, "epoch": 1845} {"train_loss": -23.113492965698242, "global_step": 153182, "epoch": 1845} {"train_loss": -23.603483200073242, "global_step": 153183, "epoch": 1845} {"train_loss": -23.262611389160156, "global_step": 153184, "epoch": 1845} {"train_loss": -23.26338005065918, "global_step": 153185, "epoch": 1845} {"train_loss": -23.283437728881836, "global_step": 153186, "epoch": 1845} {"train_loss": -23.40875244140625, "global_step": 153187, "epoch": 1845} {"train_loss": -23.547161102294922, "global_step": 153188, "epoch": 1845} {"train_loss": -23.391355514526367, "global_step": 153189, "epoch": 1845} {"train_loss": -23.699352264404297, "global_step": 153190, "epoch": 1845} {"train_loss": -23.447092056274414, "global_step": 153191, "epoch": 1845} {"train_loss": -23.01814842224121, "global_step": 153192, "epoch": 1845} {"train_loss": -23.450281143188477, "global_step": 153193, "epoch": 1845} {"train_loss": -23.3243350982666, "global_step": 153194, "epoch": 1845} {"train_loss": -23.512327194213867, "global_step": 153195, "epoch": 1845} {"train_loss": -23.363418579101562, "global_step": 153196, "epoch": 1845} {"train_loss": -23.648122787475586, "global_step": 153197, "epoch": 1845} {"train_loss": -23.298776626586914, "global_step": 153198, "epoch": 1845} {"train_loss": -23.24410057067871, "global_step": 153199, "epoch": 1845} {"train_loss": -23.67875862121582, "global_step": 153200, "epoch": 1845} {"train_loss": -23.47795867919922, "global_step": 153201, "epoch": 1845} {"train_loss": -23.451648712158203, "global_step": 153202, "epoch": 1845} {"train_loss": -23.31302833557129, "global_step": 153203, "epoch": 1845} {"train_loss": -23.6357421875, "global_step": 153204, "epoch": 1845} {"train_loss": -23.422317504882812, "global_step": 153205, "epoch": 1845} {"train_loss": -23.357900619506836, "global_step": 153206, "epoch": 1845} {"train_loss": -23.026077270507812, "global_step": 153207, "epoch": 1845} {"train_loss": -23.538455963134766, "global_step": 153208, "epoch": 1845} {"train_loss": -23.45236587524414, "global_step": 153209, "epoch": 1845} {"train_loss": -23.393339157104492, "global_step": 153210, "epoch": 1845} {"train_loss": -23.481496810913086, "global_step": 153211, "epoch": 1845} {"train_loss": -23.084497451782227, "global_step": 153212, "epoch": 1845} {"train_loss": -23.10504722595215, "global_step": 153213, "epoch": 1845} {"train_loss": -23.3367977142334, "global_step": 153214, "epoch": 1845} {"train_loss": -23.117599487304688, "global_step": 153215, "epoch": 1845} {"train_loss": -23.38238525390625, "global_step": 153216, "epoch": 1845} {"train_loss": -23.344656725963915, "global_step": 153217, "epoch": 1845, "val_loss": 6377689.5} {"train_loss": -22.42824363708496, "global_step": 153218, "epoch": 1846} {"train_loss": -22.844078063964844, "global_step": 153219, "epoch": 1846} {"train_loss": -23.067045211791992, "global_step": 153220, "epoch": 1846} {"train_loss": -22.879186630249023, "global_step": 153221, "epoch": 1846} {"train_loss": -23.18288230895996, "global_step": 153222, "epoch": 1846} {"train_loss": -23.209535598754883, "global_step": 153223, "epoch": 1846} {"train_loss": -23.32631492614746, "global_step": 153224, "epoch": 1846} {"train_loss": -23.040414810180664, "global_step": 153225, "epoch": 1846} {"train_loss": -23.10615348815918, "global_step": 153226, "epoch": 1846} {"train_loss": -22.641464233398438, "global_step": 153227, "epoch": 1846} {"train_loss": -23.00162696838379, "global_step": 153228, "epoch": 1846} {"train_loss": -23.095544815063477, "global_step": 153229, "epoch": 1846} {"train_loss": -23.136688232421875, "global_step": 153230, "epoch": 1846} {"train_loss": -23.253578186035156, "global_step": 153231, "epoch": 1846} {"train_loss": -23.061100006103516, "global_step": 153232, "epoch": 1846} {"train_loss": -23.054790496826172, "global_step": 153233, "epoch": 1846} {"train_loss": -22.877979278564453, "global_step": 153234, "epoch": 1846} {"train_loss": -23.00740623474121, "global_step": 153235, "epoch": 1846} {"train_loss": -23.339828491210938, "global_step": 153236, "epoch": 1846} {"train_loss": -22.96345329284668, "global_step": 153237, "epoch": 1846} {"train_loss": -23.16492462158203, "global_step": 153238, "epoch": 1846} {"train_loss": -23.275949478149414, "global_step": 153239, "epoch": 1846} {"train_loss": -23.542646408081055, "global_step": 153240, "epoch": 1846} {"train_loss": -23.31399917602539, "global_step": 153241, "epoch": 1846} {"train_loss": -23.099727630615234, "global_step": 153242, "epoch": 1846} {"train_loss": -23.333005905151367, "global_step": 153243, "epoch": 1846} {"train_loss": -23.13153648376465, "global_step": 153244, "epoch": 1846} {"train_loss": -23.436063766479492, "global_step": 153245, "epoch": 1846} {"train_loss": -23.163049697875977, "global_step": 153246, "epoch": 1846} {"train_loss": -23.32627296447754, "global_step": 153247, "epoch": 1846} {"train_loss": -23.550647735595703, "global_step": 153248, "epoch": 1846} {"train_loss": -23.066333770751953, "global_step": 153249, "epoch": 1846} {"train_loss": -23.203519821166992, "global_step": 153250, "epoch": 1846} {"train_loss": -23.558095932006836, "global_step": 153251, "epoch": 1846} {"train_loss": -23.568029403686523, "global_step": 153252, "epoch": 1846} {"train_loss": -23.298608779907227, "global_step": 153253, "epoch": 1846} {"train_loss": -23.39032554626465, "global_step": 153254, "epoch": 1846} {"train_loss": -23.702543258666992, "global_step": 153255, "epoch": 1846} {"train_loss": -23.32234001159668, "global_step": 153256, "epoch": 1846} {"train_loss": -23.405189514160156, "global_step": 153257, "epoch": 1846} {"train_loss": -23.545928955078125, "global_step": 153258, "epoch": 1846} {"train_loss": -23.675580978393555, "global_step": 153259, "epoch": 1846} {"train_loss": -23.522022247314453, "global_step": 153260, "epoch": 1846} {"train_loss": -23.61459732055664, "global_step": 153261, "epoch": 1846} {"train_loss": -23.393213272094727, "global_step": 153262, "epoch": 1846} {"train_loss": -23.709186553955078, "global_step": 153263, "epoch": 1846} {"train_loss": -23.723159790039062, "global_step": 153264, "epoch": 1846} {"train_loss": -23.257099151611328, "global_step": 153265, "epoch": 1846} {"train_loss": -23.394947052001953, "global_step": 153266, "epoch": 1846} {"train_loss": -23.257511138916016, "global_step": 153267, "epoch": 1846} {"train_loss": -22.82068634033203, "global_step": 153268, "epoch": 1846} {"train_loss": -23.36611557006836, "global_step": 153269, "epoch": 1846} {"train_loss": -23.177202224731445, "global_step": 153270, "epoch": 1846} {"train_loss": -23.231281280517578, "global_step": 153271, "epoch": 1846} {"train_loss": -23.436674118041992, "global_step": 153272, "epoch": 1846} {"train_loss": -23.332603454589844, "global_step": 153273, "epoch": 1846} {"train_loss": -23.26455307006836, "global_step": 153274, "epoch": 1846} {"train_loss": -23.230653762817383, "global_step": 153275, "epoch": 1846} {"train_loss": -23.327585220336914, "global_step": 153276, "epoch": 1846} {"train_loss": -23.416250228881836, "global_step": 153277, "epoch": 1846} {"train_loss": -23.508031845092773, "global_step": 153278, "epoch": 1846} {"train_loss": -23.314176559448242, "global_step": 153279, "epoch": 1846} {"train_loss": -23.247270584106445, "global_step": 153280, "epoch": 1846} {"train_loss": -23.56174659729004, "global_step": 153281, "epoch": 1846} {"train_loss": -23.27048110961914, "global_step": 153282, "epoch": 1846} {"train_loss": -23.35258674621582, "global_step": 153283, "epoch": 1846} {"train_loss": -23.442989349365234, "global_step": 153284, "epoch": 1846} {"train_loss": -23.431655883789062, "global_step": 153285, "epoch": 1846} {"train_loss": -23.467161178588867, "global_step": 153286, "epoch": 1846} {"train_loss": -23.400928497314453, "global_step": 153287, "epoch": 1846} {"train_loss": -23.351438522338867, "global_step": 153288, "epoch": 1846} {"train_loss": -23.046772003173828, "global_step": 153289, "epoch": 1846} {"train_loss": -23.240947723388672, "global_step": 153290, "epoch": 1846} {"train_loss": -23.131244659423828, "global_step": 153291, "epoch": 1846} {"train_loss": -23.0961856842041, "global_step": 153292, "epoch": 1846} {"train_loss": -23.008102416992188, "global_step": 153293, "epoch": 1846} {"train_loss": -22.89133644104004, "global_step": 153294, "epoch": 1846} {"train_loss": -23.417509078979492, "global_step": 153295, "epoch": 1846} {"train_loss": -23.124876022338867, "global_step": 153296, "epoch": 1846} {"train_loss": -23.39162254333496, "global_step": 153297, "epoch": 1846} {"train_loss": -23.602256774902344, "global_step": 153298, "epoch": 1846} {"train_loss": -23.69610595703125, "global_step": 153299, "epoch": 1846} {"train_loss": -23.26484071203025, "global_step": 153300, "epoch": 1846, "val_loss": 6334244.0} {"train_loss": -23.05496597290039, "global_step": 153301, "epoch": 1847} {"train_loss": -22.717981338500977, "global_step": 153302, "epoch": 1847} {"train_loss": -22.63522720336914, "global_step": 153303, "epoch": 1847} {"train_loss": -23.184226989746094, "global_step": 153304, "epoch": 1847} {"train_loss": -22.967336654663086, "global_step": 153305, "epoch": 1847} {"train_loss": -23.210851669311523, "global_step": 153306, "epoch": 1847} {"train_loss": -23.330442428588867, "global_step": 153307, "epoch": 1847} {"train_loss": -22.851835250854492, "global_step": 153308, "epoch": 1847} {"train_loss": -23.189756393432617, "global_step": 153309, "epoch": 1847} {"train_loss": -23.4129695892334, "global_step": 153310, "epoch": 1847} {"train_loss": -23.015743255615234, "global_step": 153311, "epoch": 1847} {"train_loss": -23.266876220703125, "global_step": 153312, "epoch": 1847} {"train_loss": -23.037443161010742, "global_step": 153313, "epoch": 1847} {"train_loss": -23.50722312927246, "global_step": 153314, "epoch": 1847} {"train_loss": -23.238819122314453, "global_step": 153315, "epoch": 1847} {"train_loss": -22.7922420501709, "global_step": 153316, "epoch": 1847} {"train_loss": -23.615209579467773, "global_step": 153317, "epoch": 1847} {"train_loss": -23.052509307861328, "global_step": 153318, "epoch": 1847} {"train_loss": -23.843109130859375, "global_step": 153319, "epoch": 1847} {"train_loss": -23.149555206298828, "global_step": 153320, "epoch": 1847} {"train_loss": -23.308223724365234, "global_step": 153321, "epoch": 1847} {"train_loss": -22.957691192626953, "global_step": 153322, "epoch": 1847} {"train_loss": -23.193695068359375, "global_step": 153323, "epoch": 1847} {"train_loss": -23.25739860534668, "global_step": 153324, "epoch": 1847} {"train_loss": -23.316753387451172, "global_step": 153325, "epoch": 1847} {"train_loss": -23.34600830078125, "global_step": 153326, "epoch": 1847} {"train_loss": -23.642011642456055, "global_step": 153327, "epoch": 1847} {"train_loss": -23.093595504760742, "global_step": 153328, "epoch": 1847} {"train_loss": -23.3339900970459, "global_step": 153329, "epoch": 1847} {"train_loss": -23.22658920288086, "global_step": 153330, "epoch": 1847} {"train_loss": -23.40496253967285, "global_step": 153331, "epoch": 1847} {"train_loss": -23.52020835876465, "global_step": 153332, "epoch": 1847} {"train_loss": -22.975238800048828, "global_step": 153333, "epoch": 1847} {"train_loss": -23.36476707458496, "global_step": 153334, "epoch": 1847} {"train_loss": -23.073511123657227, "global_step": 153335, "epoch": 1847} {"train_loss": -23.385787963867188, "global_step": 153336, "epoch": 1847} {"train_loss": -23.318849563598633, "global_step": 153337, "epoch": 1847} {"train_loss": -23.094572067260742, "global_step": 153338, "epoch": 1847} {"train_loss": -23.497726440429688, "global_step": 153339, "epoch": 1847} {"train_loss": -23.184247970581055, "global_step": 153340, "epoch": 1847} {"train_loss": -23.173385620117188, "global_step": 153341, "epoch": 1847} {"train_loss": -23.244953155517578, "global_step": 153342, "epoch": 1847} {"train_loss": -23.770687103271484, "global_step": 153343, "epoch": 1847} {"train_loss": -23.383100509643555, "global_step": 153344, "epoch": 1847} {"train_loss": -23.139036178588867, "global_step": 153345, "epoch": 1847} {"train_loss": -23.47653579711914, "global_step": 153346, "epoch": 1847} {"train_loss": -23.52251625061035, "global_step": 153347, "epoch": 1847} {"train_loss": -23.51848793029785, "global_step": 153348, "epoch": 1847} {"train_loss": -23.32879638671875, "global_step": 153349, "epoch": 1847} {"train_loss": -22.949798583984375, "global_step": 153350, "epoch": 1847} {"train_loss": -23.780202865600586, "global_step": 153351, "epoch": 1847} {"train_loss": -23.303470611572266, "global_step": 153352, "epoch": 1847} {"train_loss": -23.217601776123047, "global_step": 153353, "epoch": 1847} {"train_loss": -23.740694046020508, "global_step": 153354, "epoch": 1847} {"train_loss": -23.534360885620117, "global_step": 153355, "epoch": 1847} {"train_loss": -23.786605834960938, "global_step": 153356, "epoch": 1847} {"train_loss": -23.654157638549805, "global_step": 153357, "epoch": 1847} {"train_loss": -23.599369049072266, "global_step": 153358, "epoch": 1847} {"train_loss": -23.355669021606445, "global_step": 153359, "epoch": 1847} {"train_loss": -23.314334869384766, "global_step": 153360, "epoch": 1847} {"train_loss": -23.413211822509766, "global_step": 153361, "epoch": 1847} {"train_loss": -23.452688217163086, "global_step": 153362, "epoch": 1847} {"train_loss": -23.45183563232422, "global_step": 153363, "epoch": 1847} {"train_loss": -23.406169891357422, "global_step": 153364, "epoch": 1847} {"train_loss": -23.329431533813477, "global_step": 153365, "epoch": 1847} {"train_loss": -23.345685958862305, "global_step": 153366, "epoch": 1847} {"train_loss": -23.312835693359375, "global_step": 153367, "epoch": 1847} {"train_loss": -23.191761016845703, "global_step": 153368, "epoch": 1847} {"train_loss": -23.368896484375, "global_step": 153369, "epoch": 1847} {"train_loss": -23.215686798095703, "global_step": 153370, "epoch": 1847} {"train_loss": -23.6766414642334, "global_step": 153371, "epoch": 1847} {"train_loss": -23.42091941833496, "global_step": 153372, "epoch": 1847} {"train_loss": -23.25118064880371, "global_step": 153373, "epoch": 1847} {"train_loss": -23.169952392578125, "global_step": 153374, "epoch": 1847} {"train_loss": -23.434621810913086, "global_step": 153375, "epoch": 1847} {"train_loss": -23.196680068969727, "global_step": 153376, "epoch": 1847} {"train_loss": -23.069992065429688, "global_step": 153377, "epoch": 1847} {"train_loss": -23.18588638305664, "global_step": 153378, "epoch": 1847} {"train_loss": -23.39869499206543, "global_step": 153379, "epoch": 1847} {"train_loss": -23.556249618530273, "global_step": 153380, "epoch": 1847} {"train_loss": -23.795785903930664, "global_step": 153381, "epoch": 1847} {"train_loss": -23.44546127319336, "global_step": 153382, "epoch": 1847} {"train_loss": -23.31998680298587, "global_step": 153383, "epoch": 1847, "val_loss": 6411434.0} {"train_loss": -22.371292114257812, "global_step": 153384, "epoch": 1848} {"train_loss": -22.654001235961914, "global_step": 153385, "epoch": 1848} {"train_loss": -22.389739990234375, "global_step": 153386, "epoch": 1848} {"train_loss": -22.7497615814209, "global_step": 153387, "epoch": 1848} {"train_loss": -22.467193603515625, "global_step": 153388, "epoch": 1848} {"train_loss": -23.00654411315918, "global_step": 153389, "epoch": 1848} {"train_loss": -22.703577041625977, "global_step": 153390, "epoch": 1848} {"train_loss": -22.247926712036133, "global_step": 153391, "epoch": 1848} {"train_loss": -22.87706756591797, "global_step": 153392, "epoch": 1848} {"train_loss": -22.955917358398438, "global_step": 153393, "epoch": 1848} {"train_loss": -22.60122299194336, "global_step": 153394, "epoch": 1848} {"train_loss": -22.636823654174805, "global_step": 153395, "epoch": 1848} {"train_loss": -23.058740615844727, "global_step": 153396, "epoch": 1848} {"train_loss": -22.9884033203125, "global_step": 153397, "epoch": 1848} {"train_loss": -23.007558822631836, "global_step": 153398, "epoch": 1848} {"train_loss": -22.740646362304688, "global_step": 153399, "epoch": 1848} {"train_loss": -23.079538345336914, "global_step": 153400, "epoch": 1848} {"train_loss": -22.98801040649414, "global_step": 153401, "epoch": 1848} {"train_loss": -22.781362533569336, "global_step": 153402, "epoch": 1848} {"train_loss": -23.106679916381836, "global_step": 153403, "epoch": 1848} {"train_loss": -23.041414260864258, "global_step": 153404, "epoch": 1848} {"train_loss": -23.082279205322266, "global_step": 153405, "epoch": 1848} {"train_loss": -23.483884811401367, "global_step": 153406, "epoch": 1848} {"train_loss": -23.01569175720215, "global_step": 153407, "epoch": 1848} {"train_loss": -23.046632766723633, "global_step": 153408, "epoch": 1848} {"train_loss": -23.365615844726562, "global_step": 153409, "epoch": 1848} {"train_loss": -23.30460548400879, "global_step": 153410, "epoch": 1848} {"train_loss": -22.59195899963379, "global_step": 153411, "epoch": 1848} {"train_loss": -23.039775848388672, "global_step": 153412, "epoch": 1848} {"train_loss": -23.002307891845703, "global_step": 153413, "epoch": 1848} {"train_loss": -23.191198348999023, "global_step": 153414, "epoch": 1848} {"train_loss": -23.070566177368164, "global_step": 153415, "epoch": 1848} {"train_loss": -23.2111759185791, "global_step": 153416, "epoch": 1848} {"train_loss": -23.064666748046875, "global_step": 153417, "epoch": 1848} {"train_loss": -23.46866798400879, "global_step": 153418, "epoch": 1848} {"train_loss": -22.837295532226562, "global_step": 153419, "epoch": 1848} {"train_loss": -23.543302536010742, "global_step": 153420, "epoch": 1848} {"train_loss": -23.134227752685547, "global_step": 153421, "epoch": 1848} {"train_loss": -23.148401260375977, "global_step": 153422, "epoch": 1848} {"train_loss": -23.5355281829834, "global_step": 153423, "epoch": 1848} {"train_loss": -23.019746780395508, "global_step": 153424, "epoch": 1848} {"train_loss": -23.315582275390625, "global_step": 153425, "epoch": 1848} {"train_loss": -23.282882690429688, "global_step": 153426, "epoch": 1848} {"train_loss": -23.229450225830078, "global_step": 153427, "epoch": 1848} {"train_loss": -22.989591598510742, "global_step": 153428, "epoch": 1848} {"train_loss": -23.110692977905273, "global_step": 153429, "epoch": 1848} {"train_loss": -23.409942626953125, "global_step": 153430, "epoch": 1848} {"train_loss": -23.157146453857422, "global_step": 153431, "epoch": 1848} {"train_loss": -23.326536178588867, "global_step": 153432, "epoch": 1848} {"train_loss": -23.250211715698242, "global_step": 153433, "epoch": 1848} {"train_loss": -23.584049224853516, "global_step": 153434, "epoch": 1848} {"train_loss": -23.049467086791992, "global_step": 153435, "epoch": 1848} {"train_loss": -23.421499252319336, "global_step": 153436, "epoch": 1848} {"train_loss": -23.50634002685547, "global_step": 153437, "epoch": 1848} {"train_loss": -23.549650192260742, "global_step": 153438, "epoch": 1848} {"train_loss": -23.47829246520996, "global_step": 153439, "epoch": 1848} {"train_loss": -23.53437614440918, "global_step": 153440, "epoch": 1848} {"train_loss": -23.218198776245117, "global_step": 153441, "epoch": 1848} {"train_loss": -23.51632308959961, "global_step": 153442, "epoch": 1848} {"train_loss": -23.371042251586914, "global_step": 153443, "epoch": 1848} {"train_loss": -23.535390853881836, "global_step": 153444, "epoch": 1848} {"train_loss": -23.21536636352539, "global_step": 153445, "epoch": 1848} {"train_loss": -23.54490089416504, "global_step": 153446, "epoch": 1848} {"train_loss": -23.533803939819336, "global_step": 153447, "epoch": 1848} {"train_loss": -22.953887939453125, "global_step": 153448, "epoch": 1848} {"train_loss": -23.478885650634766, "global_step": 153449, "epoch": 1848} {"train_loss": -23.154891967773438, "global_step": 153450, "epoch": 1848} {"train_loss": -23.202478408813477, "global_step": 153451, "epoch": 1848} {"train_loss": -22.912952423095703, "global_step": 153452, "epoch": 1848} {"train_loss": -23.117616653442383, "global_step": 153453, "epoch": 1848} {"train_loss": -23.472558975219727, "global_step": 153454, "epoch": 1848} {"train_loss": -23.62189292907715, "global_step": 153455, "epoch": 1848} {"train_loss": -23.21216583251953, "global_step": 153456, "epoch": 1848} {"train_loss": -23.40699005126953, "global_step": 153457, "epoch": 1848} {"train_loss": -22.793378829956055, "global_step": 153458, "epoch": 1848} {"train_loss": -22.938949584960938, "global_step": 153459, "epoch": 1848} {"train_loss": -23.539960861206055, "global_step": 153460, "epoch": 1848} {"train_loss": -23.318422317504883, "global_step": 153461, "epoch": 1848} {"train_loss": -23.537078857421875, "global_step": 153462, "epoch": 1848} {"train_loss": -23.447879791259766, "global_step": 153463, "epoch": 1848} {"train_loss": -23.154264450073242, "global_step": 153464, "epoch": 1848} {"train_loss": -22.816198348999023, "global_step": 153465, "epoch": 1848} {"train_loss": -23.13326828738293, "global_step": 153466, "epoch": 1848, "val_loss": 6337057.0} {"train_loss": -21.22613525390625, "global_step": 153467, "epoch": 1849} {"train_loss": -22.13589096069336, "global_step": 153468, "epoch": 1849} {"train_loss": -21.564420700073242, "global_step": 153469, "epoch": 1849} {"train_loss": -22.56171989440918, "global_step": 153470, "epoch": 1849} {"train_loss": -22.340255737304688, "global_step": 153471, "epoch": 1849} {"train_loss": -22.427099227905273, "global_step": 153472, "epoch": 1849} {"train_loss": -22.55556869506836, "global_step": 153473, "epoch": 1849} {"train_loss": -22.486722946166992, "global_step": 153474, "epoch": 1849} {"train_loss": -22.59895896911621, "global_step": 153475, "epoch": 1849} {"train_loss": -22.4345703125, "global_step": 153476, "epoch": 1849} {"train_loss": -22.332794189453125, "global_step": 153477, "epoch": 1849} {"train_loss": -22.544172286987305, "global_step": 153478, "epoch": 1849} {"train_loss": -22.568527221679688, "global_step": 153479, "epoch": 1849} {"train_loss": -23.04695701599121, "global_step": 153480, "epoch": 1849} {"train_loss": -22.6261043548584, "global_step": 153481, "epoch": 1849} {"train_loss": -22.58432960510254, "global_step": 153482, "epoch": 1849} {"train_loss": -22.609085083007812, "global_step": 153483, "epoch": 1849} {"train_loss": -23.02223777770996, "global_step": 153484, "epoch": 1849} {"train_loss": -22.909650802612305, "global_step": 153485, "epoch": 1849} {"train_loss": -23.379398345947266, "global_step": 153486, "epoch": 1849} {"train_loss": -23.168066024780273, "global_step": 153487, "epoch": 1849} {"train_loss": -22.898595809936523, "global_step": 153488, "epoch": 1849} {"train_loss": -22.827377319335938, "global_step": 153489, "epoch": 1849} {"train_loss": -22.85104751586914, "global_step": 153490, "epoch": 1849} {"train_loss": -23.089801788330078, "global_step": 153491, "epoch": 1849} {"train_loss": -23.0784969329834, "global_step": 153492, "epoch": 1849} {"train_loss": -23.144155502319336, "global_step": 153493, "epoch": 1849} {"train_loss": -23.142492294311523, "global_step": 153494, "epoch": 1849} {"train_loss": -23.464094161987305, "global_step": 153495, "epoch": 1849} {"train_loss": -23.084518432617188, "global_step": 153496, "epoch": 1849} {"train_loss": -23.062713623046875, "global_step": 153497, "epoch": 1849} {"train_loss": -23.219406127929688, "global_step": 153498, "epoch": 1849} {"train_loss": -23.54509925842285, "global_step": 153499, "epoch": 1849} {"train_loss": -23.229856491088867, "global_step": 153500, "epoch": 1849} {"train_loss": -23.114276885986328, "global_step": 153501, "epoch": 1849} {"train_loss": -22.9914608001709, "global_step": 153502, "epoch": 1849} {"train_loss": -22.77573013305664, "global_step": 153503, "epoch": 1849} {"train_loss": -23.37407875061035, "global_step": 153504, "epoch": 1849} {"train_loss": -22.735401153564453, "global_step": 153505, "epoch": 1849} {"train_loss": -23.273929595947266, "global_step": 153506, "epoch": 1849} {"train_loss": -23.2237491607666, "global_step": 153507, "epoch": 1849} {"train_loss": -23.503881454467773, "global_step": 153508, "epoch": 1849} {"train_loss": -23.293935775756836, "global_step": 153509, "epoch": 1849} {"train_loss": -23.37900733947754, "global_step": 153510, "epoch": 1849} {"train_loss": -23.40675926208496, "global_step": 153511, "epoch": 1849} {"train_loss": -23.284208297729492, "global_step": 153512, "epoch": 1849} {"train_loss": -22.99677085876465, "global_step": 153513, "epoch": 1849} {"train_loss": -23.19045066833496, "global_step": 153514, "epoch": 1849} {"train_loss": -23.225605010986328, "global_step": 153515, "epoch": 1849} {"train_loss": -23.57796287536621, "global_step": 153516, "epoch": 1849} {"train_loss": -23.14251708984375, "global_step": 153517, "epoch": 1849} {"train_loss": -22.973806381225586, "global_step": 153518, "epoch": 1849} {"train_loss": -23.398508071899414, "global_step": 153519, "epoch": 1849} {"train_loss": -23.492355346679688, "global_step": 153520, "epoch": 1849} {"train_loss": -23.008100509643555, "global_step": 153521, "epoch": 1849} {"train_loss": -23.456531524658203, "global_step": 153522, "epoch": 1849} {"train_loss": -23.082229614257812, "global_step": 153523, "epoch": 1849} {"train_loss": -23.224552154541016, "global_step": 153524, "epoch": 1849} {"train_loss": -23.447168350219727, "global_step": 153525, "epoch": 1849} {"train_loss": -23.28204917907715, "global_step": 153526, "epoch": 1849} {"train_loss": -23.76995086669922, "global_step": 153527, "epoch": 1849} {"train_loss": -23.565383911132812, "global_step": 153528, "epoch": 1849} {"train_loss": -23.239097595214844, "global_step": 153529, "epoch": 1849} {"train_loss": -23.784713745117188, "global_step": 153530, "epoch": 1849} {"train_loss": -22.967315673828125, "global_step": 153531, "epoch": 1849} {"train_loss": -23.421920776367188, "global_step": 153532, "epoch": 1849} {"train_loss": -23.746902465820312, "global_step": 153533, "epoch": 1849} {"train_loss": -23.38374900817871, "global_step": 153534, "epoch": 1849} {"train_loss": -23.559650421142578, "global_step": 153535, "epoch": 1849} {"train_loss": -23.248899459838867, "global_step": 153536, "epoch": 1849} {"train_loss": -23.553186416625977, "global_step": 153537, "epoch": 1849} {"train_loss": -23.49443244934082, "global_step": 153538, "epoch": 1849} {"train_loss": -23.270769119262695, "global_step": 153539, "epoch": 1849} {"train_loss": -23.365478515625, "global_step": 153540, "epoch": 1849} {"train_loss": -23.227725982666016, "global_step": 153541, "epoch": 1849} {"train_loss": -23.27490234375, "global_step": 153542, "epoch": 1849} {"train_loss": -23.464420318603516, "global_step": 153543, "epoch": 1849} {"train_loss": -23.54975700378418, "global_step": 153544, "epoch": 1849} {"train_loss": -23.309528350830078, "global_step": 153545, "epoch": 1849} {"train_loss": -23.575414657592773, "global_step": 153546, "epoch": 1849} {"train_loss": -23.557416915893555, "global_step": 153547, "epoch": 1849} {"train_loss": -23.01233673095703, "global_step": 153548, "epoch": 1849} {"train_loss": -23.073609409562078, "global_step": 153549, "epoch": 1849, "val_loss": 6285343.5} {"train_loss": -22.9466552734375, "global_step": 153550, "epoch": 1850} {"train_loss": -23.279882431030273, "global_step": 153551, "epoch": 1850} {"train_loss": -23.20110321044922, "global_step": 153552, "epoch": 1850} {"train_loss": -22.853200912475586, "global_step": 153553, "epoch": 1850} {"train_loss": -22.81890296936035, "global_step": 153554, "epoch": 1850} {"train_loss": -22.8428897857666, "global_step": 153555, "epoch": 1850} {"train_loss": -23.443593978881836, "global_step": 153556, "epoch": 1850} {"train_loss": -23.256633758544922, "global_step": 153557, "epoch": 1850} {"train_loss": -23.16469383239746, "global_step": 153558, "epoch": 1850} {"train_loss": -23.35938835144043, "global_step": 153559, "epoch": 1850} {"train_loss": -23.273616790771484, "global_step": 153560, "epoch": 1850} {"train_loss": -23.034912109375, "global_step": 153561, "epoch": 1850} {"train_loss": -23.3192081451416, "global_step": 153562, "epoch": 1850} {"train_loss": -22.883893966674805, "global_step": 153563, "epoch": 1850} {"train_loss": -23.439878463745117, "global_step": 153564, "epoch": 1850} {"train_loss": -22.87763786315918, "global_step": 153565, "epoch": 1850} {"train_loss": -23.32731819152832, "global_step": 153566, "epoch": 1850} {"train_loss": -23.16816520690918, "global_step": 153567, "epoch": 1850} {"train_loss": -23.319425582885742, "global_step": 153568, "epoch": 1850} {"train_loss": -23.008825302124023, "global_step": 153569, "epoch": 1850} {"train_loss": -23.172657012939453, "global_step": 153570, "epoch": 1850} {"train_loss": -22.941797256469727, "global_step": 153571, "epoch": 1850} {"train_loss": -23.17633056640625, "global_step": 153572, "epoch": 1850} {"train_loss": -22.9635009765625, "global_step": 153573, "epoch": 1850} {"train_loss": -23.561908721923828, "global_step": 153574, "epoch": 1850} {"train_loss": -23.211090087890625, "global_step": 153575, "epoch": 1850} {"train_loss": -23.028711318969727, "global_step": 153576, "epoch": 1850} {"train_loss": -23.049375534057617, "global_step": 153577, "epoch": 1850} {"train_loss": -23.215442657470703, "global_step": 153578, "epoch": 1850} {"train_loss": -22.972137451171875, "global_step": 153579, "epoch": 1850} {"train_loss": -23.353097915649414, "global_step": 153580, "epoch": 1850} {"train_loss": -22.941648483276367, "global_step": 153581, "epoch": 1850} {"train_loss": -23.017515182495117, "global_step": 153582, "epoch": 1850} {"train_loss": -23.249197006225586, "global_step": 153583, "epoch": 1850} {"train_loss": -23.146194458007812, "global_step": 153584, "epoch": 1850} {"train_loss": -23.42635154724121, "global_step": 153585, "epoch": 1850} {"train_loss": -23.39434814453125, "global_step": 153586, "epoch": 1850} {"train_loss": -23.12227439880371, "global_step": 153587, "epoch": 1850} {"train_loss": -23.381223678588867, "global_step": 153588, "epoch": 1850} {"train_loss": -23.03937339782715, "global_step": 153589, "epoch": 1850} {"train_loss": -23.48428726196289, "global_step": 153590, "epoch": 1850} {"train_loss": -23.297590255737305, "global_step": 153591, "epoch": 1850} {"train_loss": -23.039953231811523, "global_step": 153592, "epoch": 1850} {"train_loss": -23.05453872680664, "global_step": 153593, "epoch": 1850} {"train_loss": -23.5882625579834, "global_step": 153594, "epoch": 1850} {"train_loss": -23.690792083740234, "global_step": 153595, "epoch": 1850} {"train_loss": -23.531208038330078, "global_step": 153596, "epoch": 1850} {"train_loss": -23.396831512451172, "global_step": 153597, "epoch": 1850} {"train_loss": -23.340377807617188, "global_step": 153598, "epoch": 1850} {"train_loss": -23.317455291748047, "global_step": 153599, "epoch": 1850} {"train_loss": -23.70123863220215, "global_step": 153600, "epoch": 1850} {"train_loss": -23.6583309173584, "global_step": 153601, "epoch": 1850} {"train_loss": -23.137060165405273, "global_step": 153602, "epoch": 1850} {"train_loss": -23.30225372314453, "global_step": 153603, "epoch": 1850} {"train_loss": -23.63097381591797, "global_step": 153604, "epoch": 1850} {"train_loss": -23.235271453857422, "global_step": 153605, "epoch": 1850} {"train_loss": -23.37203598022461, "global_step": 153606, "epoch": 1850} {"train_loss": -23.59745216369629, "global_step": 153607, "epoch": 1850} {"train_loss": -23.847930908203125, "global_step": 153608, "epoch": 1850} {"train_loss": -23.643402099609375, "global_step": 153609, "epoch": 1850} {"train_loss": -23.37978744506836, "global_step": 153610, "epoch": 1850} {"train_loss": -23.47662353515625, "global_step": 153611, "epoch": 1850} {"train_loss": -23.351261138916016, "global_step": 153612, "epoch": 1850} {"train_loss": -23.71902084350586, "global_step": 153613, "epoch": 1850} {"train_loss": -23.387348175048828, "global_step": 153614, "epoch": 1850} {"train_loss": -23.509811401367188, "global_step": 153615, "epoch": 1850} {"train_loss": -23.620718002319336, "global_step": 153616, "epoch": 1850} {"train_loss": -23.56061363220215, "global_step": 153617, "epoch": 1850} {"train_loss": -23.46479606628418, "global_step": 153618, "epoch": 1850} {"train_loss": -23.744314193725586, "global_step": 153619, "epoch": 1850} {"train_loss": -23.58839225769043, "global_step": 153620, "epoch": 1850} {"train_loss": -23.83449363708496, "global_step": 153621, "epoch": 1850} {"train_loss": -23.31043815612793, "global_step": 153622, "epoch": 1850} {"train_loss": -23.610408782958984, "global_step": 153623, "epoch": 1850} {"train_loss": -23.4794979095459, "global_step": 153624, "epoch": 1850} {"train_loss": -23.590707778930664, "global_step": 153625, "epoch": 1850} {"train_loss": -23.184667587280273, "global_step": 153626, "epoch": 1850} {"train_loss": -23.296112060546875, "global_step": 153627, "epoch": 1850} {"train_loss": -23.15497589111328, "global_step": 153628, "epoch": 1850} {"train_loss": -23.967086791992188, "global_step": 153629, "epoch": 1850} {"train_loss": -23.68940544128418, "global_step": 153630, "epoch": 1850} {"train_loss": -23.847265243530273, "global_step": 153631, "epoch": 1850} {"train_loss": -23.33015611947301, "global_step": 153632, "epoch": 1850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6421002.0} {"train_loss": -23.082700729370117, "global_step": 153633, "epoch": 1851} {"train_loss": -23.016510009765625, "global_step": 153634, "epoch": 1851} {"train_loss": -22.632266998291016, "global_step": 153635, "epoch": 1851} {"train_loss": -23.456422805786133, "global_step": 153636, "epoch": 1851} {"train_loss": -23.20063591003418, "global_step": 153637, "epoch": 1851} {"train_loss": -23.186904907226562, "global_step": 153638, "epoch": 1851} {"train_loss": -22.94143295288086, "global_step": 153639, "epoch": 1851} {"train_loss": -23.33526039123535, "global_step": 153640, "epoch": 1851} {"train_loss": -23.16254234313965, "global_step": 153641, "epoch": 1851} {"train_loss": -23.149295806884766, "global_step": 153642, "epoch": 1851} {"train_loss": -23.247634887695312, "global_step": 153643, "epoch": 1851} {"train_loss": -23.154565811157227, "global_step": 153644, "epoch": 1851} {"train_loss": -23.32820701599121, "global_step": 153645, "epoch": 1851} {"train_loss": -22.929723739624023, "global_step": 153646, "epoch": 1851} {"train_loss": -23.296884536743164, "global_step": 153647, "epoch": 1851} {"train_loss": -22.87306022644043, "global_step": 153648, "epoch": 1851} {"train_loss": -22.756229400634766, "global_step": 153649, "epoch": 1851} {"train_loss": -23.28363037109375, "global_step": 153650, "epoch": 1851} {"train_loss": -23.150171279907227, "global_step": 153651, "epoch": 1851} {"train_loss": -23.16071128845215, "global_step": 153652, "epoch": 1851} {"train_loss": -23.128538131713867, "global_step": 153653, "epoch": 1851} {"train_loss": -23.061941146850586, "global_step": 153654, "epoch": 1851} {"train_loss": -23.256357192993164, "global_step": 153655, "epoch": 1851} {"train_loss": -23.050107955932617, "global_step": 153656, "epoch": 1851} {"train_loss": -23.187788009643555, "global_step": 153657, "epoch": 1851} {"train_loss": -23.29458999633789, "global_step": 153658, "epoch": 1851} {"train_loss": -23.16232681274414, "global_step": 153659, "epoch": 1851} {"train_loss": -23.312545776367188, "global_step": 153660, "epoch": 1851} {"train_loss": -23.442392349243164, "global_step": 153661, "epoch": 1851} {"train_loss": -23.276325225830078, "global_step": 153662, "epoch": 1851} {"train_loss": -23.820127487182617, "global_step": 153663, "epoch": 1851} {"train_loss": -23.37139320373535, "global_step": 153664, "epoch": 1851} {"train_loss": -23.18604850769043, "global_step": 153665, "epoch": 1851} {"train_loss": -23.09760093688965, "global_step": 153666, "epoch": 1851} {"train_loss": -23.457937240600586, "global_step": 153667, "epoch": 1851} {"train_loss": -23.5699520111084, "global_step": 153668, "epoch": 1851} {"train_loss": -23.24985122680664, "global_step": 153669, "epoch": 1851} {"train_loss": -23.3713321685791, "global_step": 153670, "epoch": 1851} {"train_loss": -22.978164672851562, "global_step": 153671, "epoch": 1851} {"train_loss": -23.03028106689453, "global_step": 153672, "epoch": 1851} {"train_loss": -23.1204891204834, "global_step": 153673, "epoch": 1851} {"train_loss": -23.001310348510742, "global_step": 153674, "epoch": 1851} {"train_loss": -23.385583877563477, "global_step": 153675, "epoch": 1851} {"train_loss": -23.02254295349121, "global_step": 153676, "epoch": 1851} {"train_loss": -23.15186882019043, "global_step": 153677, "epoch": 1851} {"train_loss": -23.2575626373291, "global_step": 153678, "epoch": 1851} {"train_loss": -23.66343116760254, "global_step": 153679, "epoch": 1851} {"train_loss": -22.98094367980957, "global_step": 153680, "epoch": 1851} {"train_loss": -23.432662963867188, "global_step": 153681, "epoch": 1851} {"train_loss": -23.327316284179688, "global_step": 153682, "epoch": 1851} {"train_loss": -23.341917037963867, "global_step": 153683, "epoch": 1851} {"train_loss": -23.316984176635742, "global_step": 153684, "epoch": 1851} {"train_loss": -23.336225509643555, "global_step": 153685, "epoch": 1851} {"train_loss": -23.619993209838867, "global_step": 153686, "epoch": 1851} {"train_loss": -23.067119598388672, "global_step": 153687, "epoch": 1851} {"train_loss": -23.186832427978516, "global_step": 153688, "epoch": 1851} {"train_loss": -23.160411834716797, "global_step": 153689, "epoch": 1851} {"train_loss": -23.654882431030273, "global_step": 153690, "epoch": 1851} {"train_loss": -23.409912109375, "global_step": 153691, "epoch": 1851} {"train_loss": -23.333120346069336, "global_step": 153692, "epoch": 1851} {"train_loss": -23.206802368164062, "global_step": 153693, "epoch": 1851} {"train_loss": -23.36224937438965, "global_step": 153694, "epoch": 1851} {"train_loss": -23.47532081604004, "global_step": 153695, "epoch": 1851} {"train_loss": -23.738574981689453, "global_step": 153696, "epoch": 1851} {"train_loss": -23.537939071655273, "global_step": 153697, "epoch": 1851} {"train_loss": -23.410924911499023, "global_step": 153698, "epoch": 1851} {"train_loss": -23.60288429260254, "global_step": 153699, "epoch": 1851} {"train_loss": -23.0947265625, "global_step": 153700, "epoch": 1851} {"train_loss": -23.36955451965332, "global_step": 153701, "epoch": 1851} {"train_loss": -23.43256950378418, "global_step": 153702, "epoch": 1851} {"train_loss": -23.514480590820312, "global_step": 153703, "epoch": 1851} {"train_loss": -23.198286056518555, "global_step": 153704, "epoch": 1851} {"train_loss": -23.33786964416504, "global_step": 153705, "epoch": 1851} {"train_loss": -23.407764434814453, "global_step": 153706, "epoch": 1851} {"train_loss": -23.385202407836914, "global_step": 153707, "epoch": 1851} {"train_loss": -23.304458618164062, "global_step": 153708, "epoch": 1851} {"train_loss": -23.90667152404785, "global_step": 153709, "epoch": 1851} {"train_loss": -23.082651138305664, "global_step": 153710, "epoch": 1851} {"train_loss": -23.566268920898438, "global_step": 153711, "epoch": 1851} {"train_loss": -23.640804290771484, "global_step": 153712, "epoch": 1851} {"train_loss": -23.479650497436523, "global_step": 153713, "epoch": 1851} {"train_loss": -23.079736709594727, "global_step": 153714, "epoch": 1851} {"train_loss": -23.277242683502564, "global_step": 153715, "epoch": 1851, "val_loss": 6258187.0} {"train_loss": -23.048551559448242, "global_step": 153716, "epoch": 1852} {"train_loss": -22.701765060424805, "global_step": 153717, "epoch": 1852} {"train_loss": -23.12101936340332, "global_step": 153718, "epoch": 1852} {"train_loss": -23.22788429260254, "global_step": 153719, "epoch": 1852} {"train_loss": -22.758329391479492, "global_step": 153720, "epoch": 1852} {"train_loss": -22.728107452392578, "global_step": 153721, "epoch": 1852} {"train_loss": -23.01149559020996, "global_step": 153722, "epoch": 1852} {"train_loss": -22.967044830322266, "global_step": 153723, "epoch": 1852} {"train_loss": -23.263219833374023, "global_step": 153724, "epoch": 1852} {"train_loss": -23.167877197265625, "global_step": 153725, "epoch": 1852} {"train_loss": -23.46097183227539, "global_step": 153726, "epoch": 1852} {"train_loss": -23.340505599975586, "global_step": 153727, "epoch": 1852} {"train_loss": -22.67949867248535, "global_step": 153728, "epoch": 1852} {"train_loss": -22.74176597595215, "global_step": 153729, "epoch": 1852} {"train_loss": -23.43282127380371, "global_step": 153730, "epoch": 1852} {"train_loss": -22.545196533203125, "global_step": 153731, "epoch": 1852} {"train_loss": -22.98837661743164, "global_step": 153732, "epoch": 1852} {"train_loss": -22.996782302856445, "global_step": 153733, "epoch": 1852} {"train_loss": -23.183956146240234, "global_step": 153734, "epoch": 1852} {"train_loss": -23.314043045043945, "global_step": 153735, "epoch": 1852} {"train_loss": -23.380878448486328, "global_step": 153736, "epoch": 1852} {"train_loss": -23.116901397705078, "global_step": 153737, "epoch": 1852} {"train_loss": -23.291852951049805, "global_step": 153738, "epoch": 1852} {"train_loss": -23.0756893157959, "global_step": 153739, "epoch": 1852} {"train_loss": -23.156286239624023, "global_step": 153740, "epoch": 1852} {"train_loss": -23.50302505493164, "global_step": 153741, "epoch": 1852} {"train_loss": -23.306795120239258, "global_step": 153742, "epoch": 1852} {"train_loss": -23.69891929626465, "global_step": 153743, "epoch": 1852} {"train_loss": -22.99603843688965, "global_step": 153744, "epoch": 1852} {"train_loss": -23.05776023864746, "global_step": 153745, "epoch": 1852} {"train_loss": -23.72517967224121, "global_step": 153746, "epoch": 1852} {"train_loss": -23.13746452331543, "global_step": 153747, "epoch": 1852} {"train_loss": -23.461334228515625, "global_step": 153748, "epoch": 1852} {"train_loss": -23.473007202148438, "global_step": 153749, "epoch": 1852} {"train_loss": -23.332674026489258, "global_step": 153750, "epoch": 1852} {"train_loss": -23.333040237426758, "global_step": 153751, "epoch": 1852} {"train_loss": -23.087451934814453, "global_step": 153752, "epoch": 1852} {"train_loss": -23.528377532958984, "global_step": 153753, "epoch": 1852} {"train_loss": -23.441909790039062, "global_step": 153754, "epoch": 1852} {"train_loss": -23.55402946472168, "global_step": 153755, "epoch": 1852} {"train_loss": -23.466184616088867, "global_step": 153756, "epoch": 1852} {"train_loss": -23.64947509765625, "global_step": 153757, "epoch": 1852} {"train_loss": -23.5522518157959, "global_step": 153758, "epoch": 1852} {"train_loss": -23.579586029052734, "global_step": 153759, "epoch": 1852} {"train_loss": -23.353778839111328, "global_step": 153760, "epoch": 1852} {"train_loss": -23.341249465942383, "global_step": 153761, "epoch": 1852} {"train_loss": -23.220102310180664, "global_step": 153762, "epoch": 1852} {"train_loss": -23.339263916015625, "global_step": 153763, "epoch": 1852} {"train_loss": -22.9425106048584, "global_step": 153764, "epoch": 1852} {"train_loss": -23.476810455322266, "global_step": 153765, "epoch": 1852} {"train_loss": -23.594114303588867, "global_step": 153766, "epoch": 1852} {"train_loss": -23.59752082824707, "global_step": 153767, "epoch": 1852} {"train_loss": -23.584623336791992, "global_step": 153768, "epoch": 1852} {"train_loss": -23.498489379882812, "global_step": 153769, "epoch": 1852} {"train_loss": -23.192811965942383, "global_step": 153770, "epoch": 1852} {"train_loss": -23.431928634643555, "global_step": 153771, "epoch": 1852} {"train_loss": -23.558469772338867, "global_step": 153772, "epoch": 1852} {"train_loss": -23.696645736694336, "global_step": 153773, "epoch": 1852} {"train_loss": -23.293622970581055, "global_step": 153774, "epoch": 1852} {"train_loss": -23.742528915405273, "global_step": 153775, "epoch": 1852} {"train_loss": -23.327392578125, "global_step": 153776, "epoch": 1852} {"train_loss": -23.40367889404297, "global_step": 153777, "epoch": 1852} {"train_loss": -23.527822494506836, "global_step": 153778, "epoch": 1852} {"train_loss": -23.3035888671875, "global_step": 153779, "epoch": 1852} {"train_loss": -23.46225357055664, "global_step": 153780, "epoch": 1852} {"train_loss": -23.524524688720703, "global_step": 153781, "epoch": 1852} {"train_loss": -23.41285514831543, "global_step": 153782, "epoch": 1852} {"train_loss": -23.4224853515625, "global_step": 153783, "epoch": 1852} {"train_loss": -23.65752410888672, "global_step": 153784, "epoch": 1852} {"train_loss": -23.33906364440918, "global_step": 153785, "epoch": 1852} {"train_loss": -23.331260681152344, "global_step": 153786, "epoch": 1852} {"train_loss": -23.251113891601562, "global_step": 153787, "epoch": 1852} {"train_loss": -23.202234268188477, "global_step": 153788, "epoch": 1852} {"train_loss": -23.462221145629883, "global_step": 153789, "epoch": 1852} {"train_loss": -23.054336547851562, "global_step": 153790, "epoch": 1852} {"train_loss": -23.373924255371094, "global_step": 153791, "epoch": 1852} {"train_loss": -23.883432388305664, "global_step": 153792, "epoch": 1852} {"train_loss": -23.39352035522461, "global_step": 153793, "epoch": 1852} {"train_loss": -23.33793067932129, "global_step": 153794, "epoch": 1852} {"train_loss": -23.40127944946289, "global_step": 153795, "epoch": 1852} {"train_loss": -23.587512969970703, "global_step": 153796, "epoch": 1852} {"train_loss": -23.79176902770996, "global_step": 153797, "epoch": 1852} {"train_loss": -23.30171398944165, "global_step": 153798, "epoch": 1852, "val_loss": 6297498.0} {"train_loss": -23.117008209228516, "global_step": 153799, "epoch": 1853} {"train_loss": -23.047616958618164, "global_step": 153800, "epoch": 1853} {"train_loss": -23.56001853942871, "global_step": 153801, "epoch": 1853} {"train_loss": -23.02659797668457, "global_step": 153802, "epoch": 1853} {"train_loss": -22.985153198242188, "global_step": 153803, "epoch": 1853} {"train_loss": -23.103620529174805, "global_step": 153804, "epoch": 1853} {"train_loss": -22.99338722229004, "global_step": 153805, "epoch": 1853} {"train_loss": -23.286537170410156, "global_step": 153806, "epoch": 1853} {"train_loss": -22.90071678161621, "global_step": 153807, "epoch": 1853} {"train_loss": -23.00589370727539, "global_step": 153808, "epoch": 1853} {"train_loss": -23.495929718017578, "global_step": 153809, "epoch": 1853} {"train_loss": -23.025585174560547, "global_step": 153810, "epoch": 1853} {"train_loss": -23.22479820251465, "global_step": 153811, "epoch": 1853} {"train_loss": -22.939899444580078, "global_step": 153812, "epoch": 1853} {"train_loss": -23.126855850219727, "global_step": 153813, "epoch": 1853} {"train_loss": -23.516958236694336, "global_step": 153814, "epoch": 1853} {"train_loss": -23.475210189819336, "global_step": 153815, "epoch": 1853} {"train_loss": -22.838666915893555, "global_step": 153816, "epoch": 1853} {"train_loss": -23.073434829711914, "global_step": 153817, "epoch": 1853} {"train_loss": -23.194272994995117, "global_step": 153818, "epoch": 1853} {"train_loss": -23.330610275268555, "global_step": 153819, "epoch": 1853} {"train_loss": -22.940168380737305, "global_step": 153820, "epoch": 1853} {"train_loss": -23.421789169311523, "global_step": 153821, "epoch": 1853} {"train_loss": -23.662519454956055, "global_step": 153822, "epoch": 1853} {"train_loss": -23.0703182220459, "global_step": 153823, "epoch": 1853} {"train_loss": -23.45613670349121, "global_step": 153824, "epoch": 1853} {"train_loss": -23.434921264648438, "global_step": 153825, "epoch": 1853} {"train_loss": -23.161300659179688, "global_step": 153826, "epoch": 1853} {"train_loss": -23.53138542175293, "global_step": 153827, "epoch": 1853} {"train_loss": -23.259794235229492, "global_step": 153828, "epoch": 1853} {"train_loss": -23.37090492248535, "global_step": 153829, "epoch": 1853} {"train_loss": -23.1307315826416, "global_step": 153830, "epoch": 1853} {"train_loss": -23.450334548950195, "global_step": 153831, "epoch": 1853} {"train_loss": -23.45386505126953, "global_step": 153832, "epoch": 1853} {"train_loss": -23.258581161499023, "global_step": 153833, "epoch": 1853} {"train_loss": -23.91680145263672, "global_step": 153834, "epoch": 1853} {"train_loss": -23.21640396118164, "global_step": 153835, "epoch": 1853} {"train_loss": -23.605749130249023, "global_step": 153836, "epoch": 1853} {"train_loss": -22.97265625, "global_step": 153837, "epoch": 1853} {"train_loss": -23.146188735961914, "global_step": 153838, "epoch": 1853} {"train_loss": -23.89057159423828, "global_step": 153839, "epoch": 1853} {"train_loss": -23.427204132080078, "global_step": 153840, "epoch": 1853} {"train_loss": -23.2131404876709, "global_step": 153841, "epoch": 1853} {"train_loss": -23.579252243041992, "global_step": 153842, "epoch": 1853} {"train_loss": -23.36275863647461, "global_step": 153843, "epoch": 1853} {"train_loss": -23.27204704284668, "global_step": 153844, "epoch": 1853} {"train_loss": -23.345386505126953, "global_step": 153845, "epoch": 1853} {"train_loss": -23.241514205932617, "global_step": 153846, "epoch": 1853} {"train_loss": -23.53860855102539, "global_step": 153847, "epoch": 1853} {"train_loss": -23.453536987304688, "global_step": 153848, "epoch": 1853} {"train_loss": -23.61426544189453, "global_step": 153849, "epoch": 1853} {"train_loss": -23.666349411010742, "global_step": 153850, "epoch": 1853} {"train_loss": -23.685195922851562, "global_step": 153851, "epoch": 1853} {"train_loss": -23.06235122680664, "global_step": 153852, "epoch": 1853} {"train_loss": -23.328413009643555, "global_step": 153853, "epoch": 1853} {"train_loss": -23.075048446655273, "global_step": 153854, "epoch": 1853} {"train_loss": -23.440053939819336, "global_step": 153855, "epoch": 1853} {"train_loss": -23.31448745727539, "global_step": 153856, "epoch": 1853} {"train_loss": -23.347230911254883, "global_step": 153857, "epoch": 1853} {"train_loss": -23.322818756103516, "global_step": 153858, "epoch": 1853} {"train_loss": -23.383045196533203, "global_step": 153859, "epoch": 1853} {"train_loss": -23.54652976989746, "global_step": 153860, "epoch": 1853} {"train_loss": -23.317638397216797, "global_step": 153861, "epoch": 1853} {"train_loss": -23.38193130493164, "global_step": 153862, "epoch": 1853} {"train_loss": -23.286457061767578, "global_step": 153863, "epoch": 1853} {"train_loss": -23.659061431884766, "global_step": 153864, "epoch": 1853} {"train_loss": -22.952194213867188, "global_step": 153865, "epoch": 1853} {"train_loss": -22.840688705444336, "global_step": 153866, "epoch": 1853} {"train_loss": -23.64715003967285, "global_step": 153867, "epoch": 1853} {"train_loss": -23.313262939453125, "global_step": 153868, "epoch": 1853} {"train_loss": -22.89145851135254, "global_step": 153869, "epoch": 1853} {"train_loss": -22.971559524536133, "global_step": 153870, "epoch": 1853} {"train_loss": -23.365619659423828, "global_step": 153871, "epoch": 1853} {"train_loss": -23.127906799316406, "global_step": 153872, "epoch": 1853} {"train_loss": -23.416473388671875, "global_step": 153873, "epoch": 1853} {"train_loss": -23.585371017456055, "global_step": 153874, "epoch": 1853} {"train_loss": -23.40338706970215, "global_step": 153875, "epoch": 1853} {"train_loss": -23.292011260986328, "global_step": 153876, "epoch": 1853} {"train_loss": -23.140729904174805, "global_step": 153877, "epoch": 1853} {"train_loss": -23.028873443603516, "global_step": 153878, "epoch": 1853} {"train_loss": -23.29170799255371, "global_step": 153879, "epoch": 1853} {"train_loss": -23.0616397857666, "global_step": 153880, "epoch": 1853} {"train_loss": -23.307262282773674, "global_step": 153881, "epoch": 1853, "val_loss": 6367154.0} {"train_loss": -23.6132869720459, "global_step": 153882, "epoch": 1854} {"train_loss": -22.986408233642578, "global_step": 153883, "epoch": 1854} {"train_loss": -23.18979835510254, "global_step": 153884, "epoch": 1854} {"train_loss": -23.09962272644043, "global_step": 153885, "epoch": 1854} {"train_loss": -23.094839096069336, "global_step": 153886, "epoch": 1854} {"train_loss": -23.445571899414062, "global_step": 153887, "epoch": 1854} {"train_loss": -23.31768798828125, "global_step": 153888, "epoch": 1854} {"train_loss": -23.548559188842773, "global_step": 153889, "epoch": 1854} {"train_loss": -23.15402603149414, "global_step": 153890, "epoch": 1854} {"train_loss": -23.251771926879883, "global_step": 153891, "epoch": 1854} {"train_loss": -23.287002563476562, "global_step": 153892, "epoch": 1854} {"train_loss": -23.17870330810547, "global_step": 153893, "epoch": 1854} {"train_loss": -22.94093894958496, "global_step": 153894, "epoch": 1854} {"train_loss": -23.591711044311523, "global_step": 153895, "epoch": 1854} {"train_loss": -23.17081069946289, "global_step": 153896, "epoch": 1854} {"train_loss": -22.889646530151367, "global_step": 153897, "epoch": 1854} {"train_loss": -23.3439884185791, "global_step": 153898, "epoch": 1854} {"train_loss": -23.22464370727539, "global_step": 153899, "epoch": 1854} {"train_loss": -23.482643127441406, "global_step": 153900, "epoch": 1854} {"train_loss": -23.1491756439209, "global_step": 153901, "epoch": 1854} {"train_loss": -23.088056564331055, "global_step": 153902, "epoch": 1854} {"train_loss": -23.35995101928711, "global_step": 153903, "epoch": 1854} {"train_loss": -23.59518051147461, "global_step": 153904, "epoch": 1854} {"train_loss": -23.196577072143555, "global_step": 153905, "epoch": 1854} {"train_loss": -23.574689865112305, "global_step": 153906, "epoch": 1854} {"train_loss": -23.593706130981445, "global_step": 153907, "epoch": 1854} {"train_loss": -23.26789665222168, "global_step": 153908, "epoch": 1854} {"train_loss": -23.395444869995117, "global_step": 153909, "epoch": 1854} {"train_loss": -23.201963424682617, "global_step": 153910, "epoch": 1854} {"train_loss": -23.57830810546875, "global_step": 153911, "epoch": 1854} {"train_loss": -23.202756881713867, "global_step": 153912, "epoch": 1854} {"train_loss": -23.52155113220215, "global_step": 153913, "epoch": 1854} {"train_loss": -23.439733505249023, "global_step": 153914, "epoch": 1854} {"train_loss": -23.4038143157959, "global_step": 153915, "epoch": 1854} {"train_loss": -23.437969207763672, "global_step": 153916, "epoch": 1854} {"train_loss": -23.23690414428711, "global_step": 153917, "epoch": 1854} {"train_loss": -23.22676658630371, "global_step": 153918, "epoch": 1854} {"train_loss": -23.38644027709961, "global_step": 153919, "epoch": 1854} {"train_loss": -23.48345947265625, "global_step": 153920, "epoch": 1854} {"train_loss": -23.612714767456055, "global_step": 153921, "epoch": 1854} {"train_loss": -23.366580963134766, "global_step": 153922, "epoch": 1854} {"train_loss": -23.35443687438965, "global_step": 153923, "epoch": 1854} {"train_loss": -23.867372512817383, "global_step": 153924, "epoch": 1854} {"train_loss": -23.56247329711914, "global_step": 153925, "epoch": 1854} {"train_loss": -23.368741989135742, "global_step": 153926, "epoch": 1854} {"train_loss": -23.613584518432617, "global_step": 153927, "epoch": 1854} {"train_loss": -23.264495849609375, "global_step": 153928, "epoch": 1854} {"train_loss": -23.337387084960938, "global_step": 153929, "epoch": 1854} {"train_loss": -23.555561065673828, "global_step": 153930, "epoch": 1854} {"train_loss": -23.236934661865234, "global_step": 153931, "epoch": 1854} {"train_loss": -23.440526962280273, "global_step": 153932, "epoch": 1854} {"train_loss": -22.930160522460938, "global_step": 153933, "epoch": 1854} {"train_loss": -23.132516860961914, "global_step": 153934, "epoch": 1854} {"train_loss": -22.969562530517578, "global_step": 153935, "epoch": 1854} {"train_loss": -22.74033546447754, "global_step": 153936, "epoch": 1854} {"train_loss": -22.54819679260254, "global_step": 153937, "epoch": 1854} {"train_loss": -22.6358642578125, "global_step": 153938, "epoch": 1854} {"train_loss": -23.34989356994629, "global_step": 153939, "epoch": 1854} {"train_loss": -23.730106353759766, "global_step": 153940, "epoch": 1854} {"train_loss": -22.9296932220459, "global_step": 153941, "epoch": 1854} {"train_loss": -23.190959930419922, "global_step": 153942, "epoch": 1854} {"train_loss": -23.644264221191406, "global_step": 153943, "epoch": 1854} {"train_loss": -23.118398666381836, "global_step": 153944, "epoch": 1854} {"train_loss": -23.2847900390625, "global_step": 153945, "epoch": 1854} {"train_loss": -23.36956787109375, "global_step": 153946, "epoch": 1854} {"train_loss": -23.47203254699707, "global_step": 153947, "epoch": 1854} {"train_loss": -23.40700912475586, "global_step": 153948, "epoch": 1854} {"train_loss": -23.08856964111328, "global_step": 153949, "epoch": 1854} {"train_loss": -23.22736167907715, "global_step": 153950, "epoch": 1854} {"train_loss": -23.320425033569336, "global_step": 153951, "epoch": 1854} {"train_loss": -23.412511825561523, "global_step": 153952, "epoch": 1854} {"train_loss": -23.32074546813965, "global_step": 153953, "epoch": 1854} {"train_loss": -23.30733299255371, "global_step": 153954, "epoch": 1854} {"train_loss": -23.507339477539062, "global_step": 153955, "epoch": 1854} {"train_loss": -23.358060836791992, "global_step": 153956, "epoch": 1854} {"train_loss": -22.992643356323242, "global_step": 153957, "epoch": 1854} {"train_loss": -23.342910766601562, "global_step": 153958, "epoch": 1854} {"train_loss": -23.718708038330078, "global_step": 153959, "epoch": 1854} {"train_loss": -23.56093406677246, "global_step": 153960, "epoch": 1854} {"train_loss": -23.27381706237793, "global_step": 153961, "epoch": 1854} {"train_loss": -23.545978546142578, "global_step": 153962, "epoch": 1854} {"train_loss": -23.3370361328125, "global_step": 153963, "epoch": 1854} {"train_loss": -23.30904524010348, "global_step": 153964, "epoch": 1854, "val_loss": 6326834.0} {"train_loss": -22.52140235900879, "global_step": 153965, "epoch": 1855} {"train_loss": -22.961563110351562, "global_step": 153966, "epoch": 1855} {"train_loss": -22.924081802368164, "global_step": 153967, "epoch": 1855} {"train_loss": -23.004724502563477, "global_step": 153968, "epoch": 1855} {"train_loss": -22.88715171813965, "global_step": 153969, "epoch": 1855} {"train_loss": -22.959089279174805, "global_step": 153970, "epoch": 1855} {"train_loss": -22.723011016845703, "global_step": 153971, "epoch": 1855} {"train_loss": -23.223257064819336, "global_step": 153972, "epoch": 1855} {"train_loss": -23.018247604370117, "global_step": 153973, "epoch": 1855} {"train_loss": -23.15665626525879, "global_step": 153974, "epoch": 1855} {"train_loss": -22.875242233276367, "global_step": 153975, "epoch": 1855} {"train_loss": -22.829147338867188, "global_step": 153976, "epoch": 1855} {"train_loss": -23.390600204467773, "global_step": 153977, "epoch": 1855} {"train_loss": -23.336938858032227, "global_step": 153978, "epoch": 1855} {"train_loss": -23.223474502563477, "global_step": 153979, "epoch": 1855} {"train_loss": -22.86191177368164, "global_step": 153980, "epoch": 1855} {"train_loss": -23.437397003173828, "global_step": 153981, "epoch": 1855} {"train_loss": -22.91440773010254, "global_step": 153982, "epoch": 1855} {"train_loss": -23.06958770751953, "global_step": 153983, "epoch": 1855} {"train_loss": -23.268220901489258, "global_step": 153984, "epoch": 1855} {"train_loss": -23.17575454711914, "global_step": 153985, "epoch": 1855} {"train_loss": -23.497243881225586, "global_step": 153986, "epoch": 1855} {"train_loss": -23.407621383666992, "global_step": 153987, "epoch": 1855} {"train_loss": -23.107297897338867, "global_step": 153988, "epoch": 1855} {"train_loss": -22.83436393737793, "global_step": 153989, "epoch": 1855} {"train_loss": -23.361501693725586, "global_step": 153990, "epoch": 1855} {"train_loss": -23.106861114501953, "global_step": 153991, "epoch": 1855} {"train_loss": -23.445053100585938, "global_step": 153992, "epoch": 1855} {"train_loss": -23.16561508178711, "global_step": 153993, "epoch": 1855} {"train_loss": -23.681264877319336, "global_step": 153994, "epoch": 1855} {"train_loss": -23.05356788635254, "global_step": 153995, "epoch": 1855} {"train_loss": -23.419126510620117, "global_step": 153996, "epoch": 1855} {"train_loss": -23.360565185546875, "global_step": 153997, "epoch": 1855} {"train_loss": -23.284305572509766, "global_step": 153998, "epoch": 1855} {"train_loss": -23.45416259765625, "global_step": 153999, "epoch": 1855} {"train_loss": -23.41249656677246, "global_step": 154000, "epoch": 1855} {"train_loss": -23.4237117767334, "global_step": 154001, "epoch": 1855} {"train_loss": -23.47389030456543, "global_step": 154002, "epoch": 1855} {"train_loss": -23.40519142150879, "global_step": 154003, "epoch": 1855} {"train_loss": -23.49309730529785, "global_step": 154004, "epoch": 1855} {"train_loss": -23.42361831665039, "global_step": 154005, "epoch": 1855} {"train_loss": -23.045442581176758, "global_step": 154006, "epoch": 1855} {"train_loss": -23.471811294555664, "global_step": 154007, "epoch": 1855} {"train_loss": -23.679100036621094, "global_step": 154008, "epoch": 1855} {"train_loss": -23.517898559570312, "global_step": 154009, "epoch": 1855} {"train_loss": -23.591726303100586, "global_step": 154010, "epoch": 1855} {"train_loss": -23.570545196533203, "global_step": 154011, "epoch": 1855} {"train_loss": -23.256000518798828, "global_step": 154012, "epoch": 1855} {"train_loss": -23.228330612182617, "global_step": 154013, "epoch": 1855} {"train_loss": -23.079864501953125, "global_step": 154014, "epoch": 1855} {"train_loss": -23.032373428344727, "global_step": 154015, "epoch": 1855} {"train_loss": -23.608196258544922, "global_step": 154016, "epoch": 1855} {"train_loss": -23.18533706665039, "global_step": 154017, "epoch": 1855} {"train_loss": -23.10445785522461, "global_step": 154018, "epoch": 1855} {"train_loss": -23.127099990844727, "global_step": 154019, "epoch": 1855} {"train_loss": -23.374792098999023, "global_step": 154020, "epoch": 1855} {"train_loss": -23.187986373901367, "global_step": 154021, "epoch": 1855} {"train_loss": -23.138608932495117, "global_step": 154022, "epoch": 1855} {"train_loss": -22.94196128845215, "global_step": 154023, "epoch": 1855} {"train_loss": -23.21531867980957, "global_step": 154024, "epoch": 1855} {"train_loss": -23.20308494567871, "global_step": 154025, "epoch": 1855} {"train_loss": -22.64725685119629, "global_step": 154026, "epoch": 1855} {"train_loss": -23.467416763305664, "global_step": 154027, "epoch": 1855} {"train_loss": -22.707849502563477, "global_step": 154028, "epoch": 1855} {"train_loss": -23.145986557006836, "global_step": 154029, "epoch": 1855} {"train_loss": -23.14002799987793, "global_step": 154030, "epoch": 1855} {"train_loss": -23.486154556274414, "global_step": 154031, "epoch": 1855} {"train_loss": -23.25687026977539, "global_step": 154032, "epoch": 1855} {"train_loss": -23.252744674682617, "global_step": 154033, "epoch": 1855} {"train_loss": -23.460330963134766, "global_step": 154034, "epoch": 1855} {"train_loss": -23.183000564575195, "global_step": 154035, "epoch": 1855} {"train_loss": -23.14226722717285, "global_step": 154036, "epoch": 1855} {"train_loss": -22.7602481842041, "global_step": 154037, "epoch": 1855} {"train_loss": -23.256982803344727, "global_step": 154038, "epoch": 1855} {"train_loss": -23.736827850341797, "global_step": 154039, "epoch": 1855} {"train_loss": -23.349014282226562, "global_step": 154040, "epoch": 1855} {"train_loss": -23.322839736938477, "global_step": 154041, "epoch": 1855} {"train_loss": -23.28911018371582, "global_step": 154042, "epoch": 1855} {"train_loss": -23.729589462280273, "global_step": 154043, "epoch": 1855} {"train_loss": -23.470090866088867, "global_step": 154044, "epoch": 1855} {"train_loss": -22.975906372070312, "global_step": 154045, "epoch": 1855} {"train_loss": -23.13453483581543, "global_step": 154046, "epoch": 1855} {"train_loss": -23.23181244264166, "global_step": 154047, "epoch": 1855, "val_loss": 6373259.0} {"train_loss": -22.641515731811523, "global_step": 154048, "epoch": 1856} {"train_loss": -22.85354995727539, "global_step": 154049, "epoch": 1856} {"train_loss": -23.155868530273438, "global_step": 154050, "epoch": 1856} {"train_loss": -22.837430953979492, "global_step": 154051, "epoch": 1856} {"train_loss": -22.77280616760254, "global_step": 154052, "epoch": 1856} {"train_loss": -23.36410903930664, "global_step": 154053, "epoch": 1856} {"train_loss": -22.870641708374023, "global_step": 154054, "epoch": 1856} {"train_loss": -23.12685203552246, "global_step": 154055, "epoch": 1856} {"train_loss": -22.924360275268555, "global_step": 154056, "epoch": 1856} {"train_loss": -23.031387329101562, "global_step": 154057, "epoch": 1856} {"train_loss": -23.10920524597168, "global_step": 154058, "epoch": 1856} {"train_loss": -22.954551696777344, "global_step": 154059, "epoch": 1856} {"train_loss": -23.29789161682129, "global_step": 154060, "epoch": 1856} {"train_loss": -23.322036743164062, "global_step": 154061, "epoch": 1856} {"train_loss": -22.928739547729492, "global_step": 154062, "epoch": 1856} {"train_loss": -23.62624740600586, "global_step": 154063, "epoch": 1856} {"train_loss": -23.088987350463867, "global_step": 154064, "epoch": 1856} {"train_loss": -23.106916427612305, "global_step": 154065, "epoch": 1856} {"train_loss": -23.215845108032227, "global_step": 154066, "epoch": 1856} {"train_loss": -23.47365379333496, "global_step": 154067, "epoch": 1856} {"train_loss": -23.214282989501953, "global_step": 154068, "epoch": 1856} {"train_loss": -23.327068328857422, "global_step": 154069, "epoch": 1856} {"train_loss": -23.581558227539062, "global_step": 154070, "epoch": 1856} {"train_loss": -23.360929489135742, "global_step": 154071, "epoch": 1856} {"train_loss": -23.432830810546875, "global_step": 154072, "epoch": 1856} {"train_loss": -23.60312271118164, "global_step": 154073, "epoch": 1856} {"train_loss": -22.94648551940918, "global_step": 154074, "epoch": 1856} {"train_loss": -23.531370162963867, "global_step": 154075, "epoch": 1856} {"train_loss": -23.272367477416992, "global_step": 154076, "epoch": 1856} {"train_loss": -23.2177734375, "global_step": 154077, "epoch": 1856} {"train_loss": -23.45952606201172, "global_step": 154078, "epoch": 1856} {"train_loss": -23.597990036010742, "global_step": 154079, "epoch": 1856} {"train_loss": -23.570653915405273, "global_step": 154080, "epoch": 1856} {"train_loss": -23.980466842651367, "global_step": 154081, "epoch": 1856} {"train_loss": -23.34889030456543, "global_step": 154082, "epoch": 1856} {"train_loss": -23.286529541015625, "global_step": 154083, "epoch": 1856} {"train_loss": -23.361774444580078, "global_step": 154084, "epoch": 1856} {"train_loss": -23.503162384033203, "global_step": 154085, "epoch": 1856} {"train_loss": -23.710681915283203, "global_step": 154086, "epoch": 1856} {"train_loss": -23.427080154418945, "global_step": 154087, "epoch": 1856} {"train_loss": -23.31732749938965, "global_step": 154088, "epoch": 1856} {"train_loss": -23.17221450805664, "global_step": 154089, "epoch": 1856} {"train_loss": -23.200963973999023, "global_step": 154090, "epoch": 1856} {"train_loss": -23.60761070251465, "global_step": 154091, "epoch": 1856} {"train_loss": -23.34868621826172, "global_step": 154092, "epoch": 1856} {"train_loss": -23.499467849731445, "global_step": 154093, "epoch": 1856} {"train_loss": -22.87457847595215, "global_step": 154094, "epoch": 1856} {"train_loss": -23.38055992126465, "global_step": 154095, "epoch": 1856} {"train_loss": -23.354984283447266, "global_step": 154096, "epoch": 1856} {"train_loss": -23.808408737182617, "global_step": 154097, "epoch": 1856} {"train_loss": -23.019651412963867, "global_step": 154098, "epoch": 1856} {"train_loss": -23.358169555664062, "global_step": 154099, "epoch": 1856} {"train_loss": -23.313657760620117, "global_step": 154100, "epoch": 1856} {"train_loss": -24.060598373413086, "global_step": 154101, "epoch": 1856} {"train_loss": -23.420936584472656, "global_step": 154102, "epoch": 1856} {"train_loss": -23.711515426635742, "global_step": 154103, "epoch": 1856} {"train_loss": -23.385225296020508, "global_step": 154104, "epoch": 1856} {"train_loss": -23.571420669555664, "global_step": 154105, "epoch": 1856} {"train_loss": -23.03520965576172, "global_step": 154106, "epoch": 1856} {"train_loss": -23.36391258239746, "global_step": 154107, "epoch": 1856} {"train_loss": -23.535676956176758, "global_step": 154108, "epoch": 1856} {"train_loss": -22.99091339111328, "global_step": 154109, "epoch": 1856} {"train_loss": -23.41876220703125, "global_step": 154110, "epoch": 1856} {"train_loss": -23.210954666137695, "global_step": 154111, "epoch": 1856} {"train_loss": -23.489412307739258, "global_step": 154112, "epoch": 1856} {"train_loss": -23.420297622680664, "global_step": 154113, "epoch": 1856} {"train_loss": -23.38144302368164, "global_step": 154114, "epoch": 1856} {"train_loss": -23.334829330444336, "global_step": 154115, "epoch": 1856} {"train_loss": -23.53150749206543, "global_step": 154116, "epoch": 1856} {"train_loss": -23.121198654174805, "global_step": 154117, "epoch": 1856} {"train_loss": -23.117387771606445, "global_step": 154118, "epoch": 1856} {"train_loss": -23.2375545501709, "global_step": 154119, "epoch": 1856} {"train_loss": -23.495386123657227, "global_step": 154120, "epoch": 1856} {"train_loss": -23.548511505126953, "global_step": 154121, "epoch": 1856} {"train_loss": -23.046600341796875, "global_step": 154122, "epoch": 1856} {"train_loss": -23.1851863861084, "global_step": 154123, "epoch": 1856} {"train_loss": -23.62543296813965, "global_step": 154124, "epoch": 1856} {"train_loss": -23.29364013671875, "global_step": 154125, "epoch": 1856} {"train_loss": -23.44791030883789, "global_step": 154126, "epoch": 1856} {"train_loss": -23.233230590820312, "global_step": 154127, "epoch": 1856} {"train_loss": -23.627891540527344, "global_step": 154128, "epoch": 1856} {"train_loss": -23.487272262573242, "global_step": 154129, "epoch": 1856} {"train_loss": -23.322212058377552, "global_step": 154130, "epoch": 1856, "val_loss": 6390450.0} {"train_loss": -22.53415870666504, "global_step": 154131, "epoch": 1857} {"train_loss": -22.875028610229492, "global_step": 154132, "epoch": 1857} {"train_loss": -22.73111343383789, "global_step": 154133, "epoch": 1857} {"train_loss": -23.145782470703125, "global_step": 154134, "epoch": 1857} {"train_loss": -22.810617446899414, "global_step": 154135, "epoch": 1857} {"train_loss": -23.1884822845459, "global_step": 154136, "epoch": 1857} {"train_loss": -23.536537170410156, "global_step": 154137, "epoch": 1857} {"train_loss": -22.820219039916992, "global_step": 154138, "epoch": 1857} {"train_loss": -22.891916275024414, "global_step": 154139, "epoch": 1857} {"train_loss": -22.953750610351562, "global_step": 154140, "epoch": 1857} {"train_loss": -23.12961196899414, "global_step": 154141, "epoch": 1857} {"train_loss": -23.25855827331543, "global_step": 154142, "epoch": 1857} {"train_loss": -23.298288345336914, "global_step": 154143, "epoch": 1857} {"train_loss": -23.327987670898438, "global_step": 154144, "epoch": 1857} {"train_loss": -23.46786880493164, "global_step": 154145, "epoch": 1857} {"train_loss": -23.321340560913086, "global_step": 154146, "epoch": 1857} {"train_loss": -23.406892776489258, "global_step": 154147, "epoch": 1857} {"train_loss": -23.658750534057617, "global_step": 154148, "epoch": 1857} {"train_loss": -23.381162643432617, "global_step": 154149, "epoch": 1857} {"train_loss": -23.380746841430664, "global_step": 154150, "epoch": 1857} {"train_loss": -22.992645263671875, "global_step": 154151, "epoch": 1857} {"train_loss": -23.175790786743164, "global_step": 154152, "epoch": 1857} {"train_loss": -23.26833152770996, "global_step": 154153, "epoch": 1857} {"train_loss": -23.466827392578125, "global_step": 154154, "epoch": 1857} {"train_loss": -23.174694061279297, "global_step": 154155, "epoch": 1857} {"train_loss": -23.181381225585938, "global_step": 154156, "epoch": 1857} {"train_loss": -23.48187828063965, "global_step": 154157, "epoch": 1857} {"train_loss": -23.565237045288086, "global_step": 154158, "epoch": 1857} {"train_loss": -23.415515899658203, "global_step": 154159, "epoch": 1857} {"train_loss": -23.68106460571289, "global_step": 154160, "epoch": 1857} {"train_loss": -23.158781051635742, "global_step": 154161, "epoch": 1857} {"train_loss": -23.11897087097168, "global_step": 154162, "epoch": 1857} {"train_loss": -23.41253662109375, "global_step": 154163, "epoch": 1857} {"train_loss": -23.378671646118164, "global_step": 154164, "epoch": 1857} {"train_loss": -23.390546798706055, "global_step": 154165, "epoch": 1857} {"train_loss": -23.317794799804688, "global_step": 154166, "epoch": 1857} {"train_loss": -23.157245635986328, "global_step": 154167, "epoch": 1857} {"train_loss": -23.406269073486328, "global_step": 154168, "epoch": 1857} {"train_loss": -23.130155563354492, "global_step": 154169, "epoch": 1857} {"train_loss": -23.263141632080078, "global_step": 154170, "epoch": 1857} {"train_loss": -23.42870330810547, "global_step": 154171, "epoch": 1857} {"train_loss": -23.015045166015625, "global_step": 154172, "epoch": 1857} {"train_loss": -23.848196029663086, "global_step": 154173, "epoch": 1857} {"train_loss": -22.833763122558594, "global_step": 154174, "epoch": 1857} {"train_loss": -23.473546981811523, "global_step": 154175, "epoch": 1857} {"train_loss": -23.642074584960938, "global_step": 154176, "epoch": 1857} {"train_loss": -23.69563865661621, "global_step": 154177, "epoch": 1857} {"train_loss": -23.819496154785156, "global_step": 154178, "epoch": 1857} {"train_loss": -23.43793296813965, "global_step": 154179, "epoch": 1857} {"train_loss": -23.549625396728516, "global_step": 154180, "epoch": 1857} {"train_loss": -22.955852508544922, "global_step": 154181, "epoch": 1857} {"train_loss": -23.709314346313477, "global_step": 154182, "epoch": 1857} {"train_loss": -23.418081283569336, "global_step": 154183, "epoch": 1857} {"train_loss": -23.637968063354492, "global_step": 154184, "epoch": 1857} {"train_loss": -23.26703643798828, "global_step": 154185, "epoch": 1857} {"train_loss": -23.7714900970459, "global_step": 154186, "epoch": 1857} {"train_loss": -23.21357536315918, "global_step": 154187, "epoch": 1857} {"train_loss": -23.261566162109375, "global_step": 154188, "epoch": 1857} {"train_loss": -23.603269577026367, "global_step": 154189, "epoch": 1857} {"train_loss": -23.740676879882812, "global_step": 154190, "epoch": 1857} {"train_loss": -23.311115264892578, "global_step": 154191, "epoch": 1857} {"train_loss": -23.293720245361328, "global_step": 154192, "epoch": 1857} {"train_loss": -23.346765518188477, "global_step": 154193, "epoch": 1857} {"train_loss": -23.386306762695312, "global_step": 154194, "epoch": 1857} {"train_loss": -23.619850158691406, "global_step": 154195, "epoch": 1857} {"train_loss": -23.34590721130371, "global_step": 154196, "epoch": 1857} {"train_loss": -23.693490982055664, "global_step": 154197, "epoch": 1857} {"train_loss": -23.3615665435791, "global_step": 154198, "epoch": 1857} {"train_loss": -23.200300216674805, "global_step": 154199, "epoch": 1857} {"train_loss": -23.476842880249023, "global_step": 154200, "epoch": 1857} {"train_loss": -23.283422470092773, "global_step": 154201, "epoch": 1857} {"train_loss": -23.224550247192383, "global_step": 154202, "epoch": 1857} {"train_loss": -23.264333724975586, "global_step": 154203, "epoch": 1857} {"train_loss": -23.39466094970703, "global_step": 154204, "epoch": 1857} {"train_loss": -23.347888946533203, "global_step": 154205, "epoch": 1857} {"train_loss": -23.1914119720459, "global_step": 154206, "epoch": 1857} {"train_loss": -23.327091217041016, "global_step": 154207, "epoch": 1857} {"train_loss": -23.67347526550293, "global_step": 154208, "epoch": 1857} {"train_loss": -23.68391990661621, "global_step": 154209, "epoch": 1857} {"train_loss": -23.788427352905273, "global_step": 154210, "epoch": 1857} {"train_loss": -23.53639030456543, "global_step": 154211, "epoch": 1857} {"train_loss": -23.146854400634766, "global_step": 154212, "epoch": 1857} {"train_loss": -23.34207321075072, "global_step": 154213, "epoch": 1857, "val_loss": 6452260.0} {"train_loss": -22.670093536376953, "global_step": 154214, "epoch": 1858} {"train_loss": -22.357213973999023, "global_step": 154215, "epoch": 1858} {"train_loss": -21.841032028198242, "global_step": 154216, "epoch": 1858} {"train_loss": -22.092626571655273, "global_step": 154217, "epoch": 1858} {"train_loss": -22.558507919311523, "global_step": 154218, "epoch": 1858} {"train_loss": -22.763635635375977, "global_step": 154219, "epoch": 1858} {"train_loss": -22.831327438354492, "global_step": 154220, "epoch": 1858} {"train_loss": -22.759679794311523, "global_step": 154221, "epoch": 1858} {"train_loss": -22.563833236694336, "global_step": 154222, "epoch": 1858} {"train_loss": -22.833343505859375, "global_step": 154223, "epoch": 1858} {"train_loss": -22.818828582763672, "global_step": 154224, "epoch": 1858} {"train_loss": -22.374313354492188, "global_step": 154225, "epoch": 1858} {"train_loss": -23.015274047851562, "global_step": 154226, "epoch": 1858} {"train_loss": -22.87774658203125, "global_step": 154227, "epoch": 1858} {"train_loss": -22.822336196899414, "global_step": 154228, "epoch": 1858} {"train_loss": -23.012502670288086, "global_step": 154229, "epoch": 1858} {"train_loss": -23.052213668823242, "global_step": 154230, "epoch": 1858} {"train_loss": -23.12209701538086, "global_step": 154231, "epoch": 1858} {"train_loss": -22.79032325744629, "global_step": 154232, "epoch": 1858} {"train_loss": -23.178823471069336, "global_step": 154233, "epoch": 1858} {"train_loss": -22.683454513549805, "global_step": 154234, "epoch": 1858} {"train_loss": -23.113204956054688, "global_step": 154235, "epoch": 1858} {"train_loss": -23.26658058166504, "global_step": 154236, "epoch": 1858} {"train_loss": -22.725706100463867, "global_step": 154237, "epoch": 1858} {"train_loss": -23.254018783569336, "global_step": 154238, "epoch": 1858} {"train_loss": -23.202991485595703, "global_step": 154239, "epoch": 1858} {"train_loss": -23.220495223999023, "global_step": 154240, "epoch": 1858} {"train_loss": -23.103681564331055, "global_step": 154241, "epoch": 1858} {"train_loss": -22.773792266845703, "global_step": 154242, "epoch": 1858} {"train_loss": -23.0878849029541, "global_step": 154243, "epoch": 1858} {"train_loss": -23.352109909057617, "global_step": 154244, "epoch": 1858} {"train_loss": -23.452621459960938, "global_step": 154245, "epoch": 1858} {"train_loss": -23.238601684570312, "global_step": 154246, "epoch": 1858} {"train_loss": -23.26033592224121, "global_step": 154247, "epoch": 1858} {"train_loss": -23.580379486083984, "global_step": 154248, "epoch": 1858} {"train_loss": -23.217336654663086, "global_step": 154249, "epoch": 1858} {"train_loss": -23.47846031188965, "global_step": 154250, "epoch": 1858} {"train_loss": -23.149747848510742, "global_step": 154251, "epoch": 1858} {"train_loss": -23.21199607849121, "global_step": 154252, "epoch": 1858} {"train_loss": -23.405920028686523, "global_step": 154253, "epoch": 1858} {"train_loss": -23.515966415405273, "global_step": 154254, "epoch": 1858} {"train_loss": -23.304443359375, "global_step": 154255, "epoch": 1858} {"train_loss": -23.45197868347168, "global_step": 154256, "epoch": 1858} {"train_loss": -23.52694320678711, "global_step": 154257, "epoch": 1858} {"train_loss": -22.879087448120117, "global_step": 154258, "epoch": 1858} {"train_loss": -23.219818115234375, "global_step": 154259, "epoch": 1858} {"train_loss": -23.455102920532227, "global_step": 154260, "epoch": 1858} {"train_loss": -23.218149185180664, "global_step": 154261, "epoch": 1858} {"train_loss": -23.556640625, "global_step": 154262, "epoch": 1858} {"train_loss": -23.596635818481445, "global_step": 154263, "epoch": 1858} {"train_loss": -23.438329696655273, "global_step": 154264, "epoch": 1858} {"train_loss": -23.643692016601562, "global_step": 154265, "epoch": 1858} {"train_loss": -23.392833709716797, "global_step": 154266, "epoch": 1858} {"train_loss": -23.67211151123047, "global_step": 154267, "epoch": 1858} {"train_loss": -23.829389572143555, "global_step": 154268, "epoch": 1858} {"train_loss": -23.396957397460938, "global_step": 154269, "epoch": 1858} {"train_loss": -23.201995849609375, "global_step": 154270, "epoch": 1858} {"train_loss": -23.486764907836914, "global_step": 154271, "epoch": 1858} {"train_loss": -23.354114532470703, "global_step": 154272, "epoch": 1858} {"train_loss": -23.841978073120117, "global_step": 154273, "epoch": 1858} {"train_loss": -23.729658126831055, "global_step": 154274, "epoch": 1858} {"train_loss": -23.52671241760254, "global_step": 154275, "epoch": 1858} {"train_loss": -23.25263786315918, "global_step": 154276, "epoch": 1858} {"train_loss": -23.547727584838867, "global_step": 154277, "epoch": 1858} {"train_loss": -23.58466339111328, "global_step": 154278, "epoch": 1858} {"train_loss": -23.19631004333496, "global_step": 154279, "epoch": 1858} {"train_loss": -23.228900909423828, "global_step": 154280, "epoch": 1858} {"train_loss": -23.283777236938477, "global_step": 154281, "epoch": 1858} {"train_loss": -22.96503257751465, "global_step": 154282, "epoch": 1858} {"train_loss": -23.32869529724121, "global_step": 154283, "epoch": 1858} {"train_loss": -23.20418930053711, "global_step": 154284, "epoch": 1858} {"train_loss": -23.185636520385742, "global_step": 154285, "epoch": 1858} {"train_loss": -23.57651138305664, "global_step": 154286, "epoch": 1858} {"train_loss": -23.383697509765625, "global_step": 154287, "epoch": 1858} {"train_loss": -23.4892635345459, "global_step": 154288, "epoch": 1858} {"train_loss": -23.531583786010742, "global_step": 154289, "epoch": 1858} {"train_loss": -23.46291160583496, "global_step": 154290, "epoch": 1858} {"train_loss": -23.754913330078125, "global_step": 154291, "epoch": 1858} {"train_loss": -23.604642868041992, "global_step": 154292, "epoch": 1858} {"train_loss": -23.798494338989258, "global_step": 154293, "epoch": 1858} {"train_loss": -23.200180053710938, "global_step": 154294, "epoch": 1858} {"train_loss": -23.340656280517578, "global_step": 154295, "epoch": 1858} {"train_loss": -23.19013935686594, "global_step": 154296, "epoch": 1858, "val_loss": 6448619.0} {"train_loss": -23.33186149597168, "global_step": 154297, "epoch": 1859} {"train_loss": -23.515928268432617, "global_step": 154298, "epoch": 1859} {"train_loss": -23.38020133972168, "global_step": 154299, "epoch": 1859} {"train_loss": -23.159269332885742, "global_step": 154300, "epoch": 1859} {"train_loss": -23.446229934692383, "global_step": 154301, "epoch": 1859} {"train_loss": -23.371301651000977, "global_step": 154302, "epoch": 1859} {"train_loss": -23.549957275390625, "global_step": 154303, "epoch": 1859} {"train_loss": -23.1221923828125, "global_step": 154304, "epoch": 1859} {"train_loss": -23.179513931274414, "global_step": 154305, "epoch": 1859} {"train_loss": -23.548263549804688, "global_step": 154306, "epoch": 1859} {"train_loss": -23.271818161010742, "global_step": 154307, "epoch": 1859} {"train_loss": -23.17412757873535, "global_step": 154308, "epoch": 1859} {"train_loss": -22.758398056030273, "global_step": 154309, "epoch": 1859} {"train_loss": -23.875410079956055, "global_step": 154310, "epoch": 1859} {"train_loss": -23.554059982299805, "global_step": 154311, "epoch": 1859} {"train_loss": -23.39242935180664, "global_step": 154312, "epoch": 1859} {"train_loss": -23.140241622924805, "global_step": 154313, "epoch": 1859} {"train_loss": -23.420175552368164, "global_step": 154314, "epoch": 1859} {"train_loss": -23.274017333984375, "global_step": 154315, "epoch": 1859} {"train_loss": -23.11268424987793, "global_step": 154316, "epoch": 1859} {"train_loss": -23.522659301757812, "global_step": 154317, "epoch": 1859} {"train_loss": -23.369369506835938, "global_step": 154318, "epoch": 1859} {"train_loss": -23.603015899658203, "global_step": 154319, "epoch": 1859} {"train_loss": -23.504606246948242, "global_step": 154320, "epoch": 1859} {"train_loss": -23.246061325073242, "global_step": 154321, "epoch": 1859} {"train_loss": -23.912982940673828, "global_step": 154322, "epoch": 1859} {"train_loss": -23.629716873168945, "global_step": 154323, "epoch": 1859} {"train_loss": -23.149105072021484, "global_step": 154324, "epoch": 1859} {"train_loss": -23.587736129760742, "global_step": 154325, "epoch": 1859} {"train_loss": -23.600269317626953, "global_step": 154326, "epoch": 1859} {"train_loss": -23.41647720336914, "global_step": 154327, "epoch": 1859} {"train_loss": -23.29852867126465, "global_step": 154328, "epoch": 1859} {"train_loss": -23.209835052490234, "global_step": 154329, "epoch": 1859} {"train_loss": -23.3934383392334, "global_step": 154330, "epoch": 1859} {"train_loss": -23.340818405151367, "global_step": 154331, "epoch": 1859} {"train_loss": -23.646970748901367, "global_step": 154332, "epoch": 1859} {"train_loss": -23.458749771118164, "global_step": 154333, "epoch": 1859} {"train_loss": -23.647430419921875, "global_step": 154334, "epoch": 1859} {"train_loss": -23.5054874420166, "global_step": 154335, "epoch": 1859} {"train_loss": -23.550397872924805, "global_step": 154336, "epoch": 1859} {"train_loss": -23.44410514831543, "global_step": 154337, "epoch": 1859} {"train_loss": -23.3615779876709, "global_step": 154338, "epoch": 1859} {"train_loss": -23.295705795288086, "global_step": 154339, "epoch": 1859} {"train_loss": -23.671432495117188, "global_step": 154340, "epoch": 1859} {"train_loss": -23.549421310424805, "global_step": 154341, "epoch": 1859} {"train_loss": -23.324567794799805, "global_step": 154342, "epoch": 1859} {"train_loss": -23.64259910583496, "global_step": 154343, "epoch": 1859} {"train_loss": -23.45795249938965, "global_step": 154344, "epoch": 1859} {"train_loss": -23.526315689086914, "global_step": 154345, "epoch": 1859} {"train_loss": -23.699527740478516, "global_step": 154346, "epoch": 1859} {"train_loss": -23.547327041625977, "global_step": 154347, "epoch": 1859} {"train_loss": -23.257434844970703, "global_step": 154348, "epoch": 1859} {"train_loss": -23.077640533447266, "global_step": 154349, "epoch": 1859} {"train_loss": -23.486799240112305, "global_step": 154350, "epoch": 1859} {"train_loss": -23.60793113708496, "global_step": 154351, "epoch": 1859} {"train_loss": -23.690793991088867, "global_step": 154352, "epoch": 1859} {"train_loss": -23.278566360473633, "global_step": 154353, "epoch": 1859} {"train_loss": -23.452720642089844, "global_step": 154354, "epoch": 1859} {"train_loss": -23.631616592407227, "global_step": 154355, "epoch": 1859} {"train_loss": -23.79900550842285, "global_step": 154356, "epoch": 1859} {"train_loss": -23.6806640625, "global_step": 154357, "epoch": 1859} {"train_loss": -23.0264892578125, "global_step": 154358, "epoch": 1859} {"train_loss": -23.245731353759766, "global_step": 154359, "epoch": 1859} {"train_loss": -23.518482208251953, "global_step": 154360, "epoch": 1859} {"train_loss": -23.479785919189453, "global_step": 154361, "epoch": 1859} {"train_loss": -23.24092674255371, "global_step": 154362, "epoch": 1859} {"train_loss": -23.55913734436035, "global_step": 154363, "epoch": 1859} {"train_loss": -23.705209732055664, "global_step": 154364, "epoch": 1859} {"train_loss": -23.1237735748291, "global_step": 154365, "epoch": 1859} {"train_loss": -23.473142623901367, "global_step": 154366, "epoch": 1859} {"train_loss": -23.276411056518555, "global_step": 154367, "epoch": 1859} {"train_loss": -23.328176498413086, "global_step": 154368, "epoch": 1859} {"train_loss": -23.2575740814209, "global_step": 154369, "epoch": 1859} {"train_loss": -23.17415428161621, "global_step": 154370, "epoch": 1859} {"train_loss": -23.248708724975586, "global_step": 154371, "epoch": 1859} {"train_loss": -23.549530029296875, "global_step": 154372, "epoch": 1859} {"train_loss": -23.207014083862305, "global_step": 154373, "epoch": 1859} {"train_loss": -23.200414657592773, "global_step": 154374, "epoch": 1859} {"train_loss": -23.23004722595215, "global_step": 154375, "epoch": 1859} {"train_loss": -23.422775268554688, "global_step": 154376, "epoch": 1859} {"train_loss": -23.107858657836914, "global_step": 154377, "epoch": 1859} {"train_loss": -22.949277877807617, "global_step": 154378, "epoch": 1859} {"train_loss": -23.39605924307582, "global_step": 154379, "epoch": 1859, "val_loss": 6375278.0} {"train_loss": -23.242942810058594, "global_step": 154380, "epoch": 1860} {"train_loss": -22.993152618408203, "global_step": 154381, "epoch": 1860} {"train_loss": -23.0998477935791, "global_step": 154382, "epoch": 1860} {"train_loss": -23.337448120117188, "global_step": 154383, "epoch": 1860} {"train_loss": -23.00002098083496, "global_step": 154384, "epoch": 1860} {"train_loss": -23.45614242553711, "global_step": 154385, "epoch": 1860} {"train_loss": -22.81890869140625, "global_step": 154386, "epoch": 1860} {"train_loss": -23.482704162597656, "global_step": 154387, "epoch": 1860} {"train_loss": -23.09541893005371, "global_step": 154388, "epoch": 1860} {"train_loss": -23.353002548217773, "global_step": 154389, "epoch": 1860} {"train_loss": -23.143573760986328, "global_step": 154390, "epoch": 1860} {"train_loss": -23.151287078857422, "global_step": 154391, "epoch": 1860} {"train_loss": -23.090330123901367, "global_step": 154392, "epoch": 1860} {"train_loss": -23.29336929321289, "global_step": 154393, "epoch": 1860} {"train_loss": -23.27018165588379, "global_step": 154394, "epoch": 1860} {"train_loss": -23.13507843017578, "global_step": 154395, "epoch": 1860} {"train_loss": -23.32028579711914, "global_step": 154396, "epoch": 1860} {"train_loss": -23.475419998168945, "global_step": 154397, "epoch": 1860} {"train_loss": -23.526330947875977, "global_step": 154398, "epoch": 1860} {"train_loss": -23.427303314208984, "global_step": 154399, "epoch": 1860} {"train_loss": -23.520278930664062, "global_step": 154400, "epoch": 1860} {"train_loss": -23.048030853271484, "global_step": 154401, "epoch": 1860} {"train_loss": -23.345518112182617, "global_step": 154402, "epoch": 1860} {"train_loss": -22.900745391845703, "global_step": 154403, "epoch": 1860} {"train_loss": -23.5301456451416, "global_step": 154404, "epoch": 1860} {"train_loss": -23.54929542541504, "global_step": 154405, "epoch": 1860} {"train_loss": -23.045469284057617, "global_step": 154406, "epoch": 1860} {"train_loss": -23.227020263671875, "global_step": 154407, "epoch": 1860} {"train_loss": -23.010879516601562, "global_step": 154408, "epoch": 1860} {"train_loss": -23.41783905029297, "global_step": 154409, "epoch": 1860} {"train_loss": -23.61526107788086, "global_step": 154410, "epoch": 1860} {"train_loss": -23.4611873626709, "global_step": 154411, "epoch": 1860} {"train_loss": -23.531408309936523, "global_step": 154412, "epoch": 1860} {"train_loss": -23.48712730407715, "global_step": 154413, "epoch": 1860} {"train_loss": -23.1936092376709, "global_step": 154414, "epoch": 1860} {"train_loss": -23.457246780395508, "global_step": 154415, "epoch": 1860} {"train_loss": -23.04228973388672, "global_step": 154416, "epoch": 1860} {"train_loss": -23.317276000976562, "global_step": 154417, "epoch": 1860} {"train_loss": -23.37660026550293, "global_step": 154418, "epoch": 1860} {"train_loss": -23.23380470275879, "global_step": 154419, "epoch": 1860} {"train_loss": -23.24957275390625, "global_step": 154420, "epoch": 1860} {"train_loss": -23.203052520751953, "global_step": 154421, "epoch": 1860} {"train_loss": -23.261911392211914, "global_step": 154422, "epoch": 1860} {"train_loss": -23.287214279174805, "global_step": 154423, "epoch": 1860} {"train_loss": -23.189939498901367, "global_step": 154424, "epoch": 1860} {"train_loss": -22.98326873779297, "global_step": 154425, "epoch": 1860} {"train_loss": -23.169591903686523, "global_step": 154426, "epoch": 1860} {"train_loss": -23.480243682861328, "global_step": 154427, "epoch": 1860} {"train_loss": -23.12278938293457, "global_step": 154428, "epoch": 1860} {"train_loss": -23.57169532775879, "global_step": 154429, "epoch": 1860} {"train_loss": -23.213743209838867, "global_step": 154430, "epoch": 1860} {"train_loss": -23.320432662963867, "global_step": 154431, "epoch": 1860} {"train_loss": -23.223339080810547, "global_step": 154432, "epoch": 1860} {"train_loss": -23.44662857055664, "global_step": 154433, "epoch": 1860} {"train_loss": -22.997846603393555, "global_step": 154434, "epoch": 1860} {"train_loss": -23.222776412963867, "global_step": 154435, "epoch": 1860} {"train_loss": -23.31212615966797, "global_step": 154436, "epoch": 1860} {"train_loss": -23.589256286621094, "global_step": 154437, "epoch": 1860} {"train_loss": -23.441425323486328, "global_step": 154438, "epoch": 1860} {"train_loss": -23.306501388549805, "global_step": 154439, "epoch": 1860} {"train_loss": -23.10123062133789, "global_step": 154440, "epoch": 1860} {"train_loss": -23.176456451416016, "global_step": 154441, "epoch": 1860} {"train_loss": -23.25934600830078, "global_step": 154442, "epoch": 1860} {"train_loss": -23.41725730895996, "global_step": 154443, "epoch": 1860} {"train_loss": -23.475351333618164, "global_step": 154444, "epoch": 1860} {"train_loss": -23.309080123901367, "global_step": 154445, "epoch": 1860} {"train_loss": -23.462295532226562, "global_step": 154446, "epoch": 1860} {"train_loss": -23.21477699279785, "global_step": 154447, "epoch": 1860} {"train_loss": -23.37300682067871, "global_step": 154448, "epoch": 1860} {"train_loss": -23.462425231933594, "global_step": 154449, "epoch": 1860} {"train_loss": -23.61375617980957, "global_step": 154450, "epoch": 1860} {"train_loss": -23.321002960205078, "global_step": 154451, "epoch": 1860} {"train_loss": -23.29245376586914, "global_step": 154452, "epoch": 1860} {"train_loss": -23.289396286010742, "global_step": 154453, "epoch": 1860} {"train_loss": -23.26459312438965, "global_step": 154454, "epoch": 1860} {"train_loss": -23.453027725219727, "global_step": 154455, "epoch": 1860} {"train_loss": -23.84959602355957, "global_step": 154456, "epoch": 1860} {"train_loss": -23.549985885620117, "global_step": 154457, "epoch": 1860} {"train_loss": -23.678495407104492, "global_step": 154458, "epoch": 1860} {"train_loss": -23.506412506103516, "global_step": 154459, "epoch": 1860} {"train_loss": -23.675216674804688, "global_step": 154460, "epoch": 1860} {"train_loss": -23.625043869018555, "global_step": 154461, "epoch": 1860} {"train_loss": -23.33124712289098, "global_step": 154462, "epoch": 1860, "val_loss": 6440121.0} {"train_loss": -22.04673194885254, "global_step": 154463, "epoch": 1861} {"train_loss": -22.572004318237305, "global_step": 154464, "epoch": 1861} {"train_loss": -22.2409725189209, "global_step": 154465, "epoch": 1861} {"train_loss": -22.184385299682617, "global_step": 154466, "epoch": 1861} {"train_loss": -22.322294235229492, "global_step": 154467, "epoch": 1861} {"train_loss": -22.753393173217773, "global_step": 154468, "epoch": 1861} {"train_loss": -22.434619903564453, "global_step": 154469, "epoch": 1861} {"train_loss": -22.90240478515625, "global_step": 154470, "epoch": 1861} {"train_loss": -22.54310417175293, "global_step": 154471, "epoch": 1861} {"train_loss": -22.783222198486328, "global_step": 154472, "epoch": 1861} {"train_loss": -22.974002838134766, "global_step": 154473, "epoch": 1861} {"train_loss": -23.035873413085938, "global_step": 154474, "epoch": 1861} {"train_loss": -22.794614791870117, "global_step": 154475, "epoch": 1861} {"train_loss": -22.75629234313965, "global_step": 154476, "epoch": 1861} {"train_loss": -23.064695358276367, "global_step": 154477, "epoch": 1861} {"train_loss": -22.676382064819336, "global_step": 154478, "epoch": 1861} {"train_loss": -22.972002029418945, "global_step": 154479, "epoch": 1861} {"train_loss": -22.996017456054688, "global_step": 154480, "epoch": 1861} {"train_loss": -22.84378433227539, "global_step": 154481, "epoch": 1861} {"train_loss": -22.90663719177246, "global_step": 154482, "epoch": 1861} {"train_loss": -23.013269424438477, "global_step": 154483, "epoch": 1861} {"train_loss": -23.1827449798584, "global_step": 154484, "epoch": 1861} {"train_loss": -23.314992904663086, "global_step": 154485, "epoch": 1861} {"train_loss": -23.009809494018555, "global_step": 154486, "epoch": 1861} {"train_loss": -23.16373062133789, "global_step": 154487, "epoch": 1861} {"train_loss": -23.282230377197266, "global_step": 154488, "epoch": 1861} {"train_loss": -23.30594825744629, "global_step": 154489, "epoch": 1861} {"train_loss": -23.463523864746094, "global_step": 154490, "epoch": 1861} {"train_loss": -23.148651123046875, "global_step": 154491, "epoch": 1861} {"train_loss": -23.529150009155273, "global_step": 154492, "epoch": 1861} {"train_loss": -23.27480125427246, "global_step": 154493, "epoch": 1861} {"train_loss": -23.606740951538086, "global_step": 154494, "epoch": 1861} {"train_loss": -23.175386428833008, "global_step": 154495, "epoch": 1861} {"train_loss": -23.364444732666016, "global_step": 154496, "epoch": 1861} {"train_loss": -22.888086318969727, "global_step": 154497, "epoch": 1861} {"train_loss": -23.480262756347656, "global_step": 154498, "epoch": 1861} {"train_loss": -23.22126579284668, "global_step": 154499, "epoch": 1861} {"train_loss": -23.48854637145996, "global_step": 154500, "epoch": 1861} {"train_loss": -23.688329696655273, "global_step": 154501, "epoch": 1861} {"train_loss": -23.14572525024414, "global_step": 154502, "epoch": 1861} {"train_loss": -23.314651489257812, "global_step": 154503, "epoch": 1861} {"train_loss": -23.42836570739746, "global_step": 154504, "epoch": 1861} {"train_loss": -23.302621841430664, "global_step": 154505, "epoch": 1861} {"train_loss": -23.37581443786621, "global_step": 154506, "epoch": 1861} {"train_loss": -22.986873626708984, "global_step": 154507, "epoch": 1861} {"train_loss": -23.470457077026367, "global_step": 154508, "epoch": 1861} {"train_loss": -23.222888946533203, "global_step": 154509, "epoch": 1861} {"train_loss": -23.775083541870117, "global_step": 154510, "epoch": 1861} {"train_loss": -23.366947174072266, "global_step": 154511, "epoch": 1861} {"train_loss": -23.61151885986328, "global_step": 154512, "epoch": 1861} {"train_loss": -23.460412979125977, "global_step": 154513, "epoch": 1861} {"train_loss": -23.3846492767334, "global_step": 154514, "epoch": 1861} {"train_loss": -23.75058937072754, "global_step": 154515, "epoch": 1861} {"train_loss": -23.22930908203125, "global_step": 154516, "epoch": 1861} {"train_loss": -23.553516387939453, "global_step": 154517, "epoch": 1861} {"train_loss": -23.248140335083008, "global_step": 154518, "epoch": 1861} {"train_loss": -23.396961212158203, "global_step": 154519, "epoch": 1861} {"train_loss": -23.410694122314453, "global_step": 154520, "epoch": 1861} {"train_loss": -23.355131149291992, "global_step": 154521, "epoch": 1861} {"train_loss": -23.22755241394043, "global_step": 154522, "epoch": 1861} {"train_loss": -23.48386573791504, "global_step": 154523, "epoch": 1861} {"train_loss": -23.53034782409668, "global_step": 154524, "epoch": 1861} {"train_loss": -23.313440322875977, "global_step": 154525, "epoch": 1861} {"train_loss": -23.553760528564453, "global_step": 154526, "epoch": 1861} {"train_loss": -23.502246856689453, "global_step": 154527, "epoch": 1861} {"train_loss": -23.719097137451172, "global_step": 154528, "epoch": 1861} {"train_loss": -23.175106048583984, "global_step": 154529, "epoch": 1861} {"train_loss": -23.059040069580078, "global_step": 154530, "epoch": 1861} {"train_loss": -23.444822311401367, "global_step": 154531, "epoch": 1861} {"train_loss": -23.725717544555664, "global_step": 154532, "epoch": 1861} {"train_loss": -23.309003829956055, "global_step": 154533, "epoch": 1861} {"train_loss": -23.456144332885742, "global_step": 154534, "epoch": 1861} {"train_loss": -23.3878173828125, "global_step": 154535, "epoch": 1861} {"train_loss": -23.5448055267334, "global_step": 154536, "epoch": 1861} {"train_loss": -23.211999893188477, "global_step": 154537, "epoch": 1861} {"train_loss": -23.158090591430664, "global_step": 154538, "epoch": 1861} {"train_loss": -23.08380889892578, "global_step": 154539, "epoch": 1861} {"train_loss": -23.087743759155273, "global_step": 154540, "epoch": 1861} {"train_loss": -23.709125518798828, "global_step": 154541, "epoch": 1861} {"train_loss": -23.427610397338867, "global_step": 154542, "epoch": 1861} {"train_loss": -23.35145378112793, "global_step": 154543, "epoch": 1861} {"train_loss": -23.670581817626953, "global_step": 154544, "epoch": 1861} {"train_loss": -23.222159282270685, "global_step": 154545, "epoch": 1861, "val_loss": 6484226.0} {"train_loss": -22.957670211791992, "global_step": 154546, "epoch": 1862} {"train_loss": -23.010576248168945, "global_step": 154547, "epoch": 1862} {"train_loss": -22.953821182250977, "global_step": 154548, "epoch": 1862} {"train_loss": -22.909778594970703, "global_step": 154549, "epoch": 1862} {"train_loss": -23.21177864074707, "global_step": 154550, "epoch": 1862} {"train_loss": -22.99601173400879, "global_step": 154551, "epoch": 1862} {"train_loss": -22.966697692871094, "global_step": 154552, "epoch": 1862} {"train_loss": -23.146703720092773, "global_step": 154553, "epoch": 1862} {"train_loss": -23.211271286010742, "global_step": 154554, "epoch": 1862} {"train_loss": -23.123708724975586, "global_step": 154555, "epoch": 1862} {"train_loss": -23.52152442932129, "global_step": 154556, "epoch": 1862} {"train_loss": -22.981050491333008, "global_step": 154557, "epoch": 1862} {"train_loss": -23.229522705078125, "global_step": 154558, "epoch": 1862} {"train_loss": -23.64871597290039, "global_step": 154559, "epoch": 1862} {"train_loss": -23.349084854125977, "global_step": 154560, "epoch": 1862} {"train_loss": -23.13762855529785, "global_step": 154561, "epoch": 1862} {"train_loss": -23.6160888671875, "global_step": 154562, "epoch": 1862} {"train_loss": -23.612613677978516, "global_step": 154563, "epoch": 1862} {"train_loss": -23.084890365600586, "global_step": 154564, "epoch": 1862} {"train_loss": -23.54111671447754, "global_step": 154565, "epoch": 1862} {"train_loss": -23.201200485229492, "global_step": 154566, "epoch": 1862} {"train_loss": -23.63364601135254, "global_step": 154567, "epoch": 1862} {"train_loss": -23.019113540649414, "global_step": 154568, "epoch": 1862} {"train_loss": -23.459938049316406, "global_step": 154569, "epoch": 1862} {"train_loss": -23.2410945892334, "global_step": 154570, "epoch": 1862} {"train_loss": -23.558029174804688, "global_step": 154571, "epoch": 1862} {"train_loss": -23.216646194458008, "global_step": 154572, "epoch": 1862} {"train_loss": -23.6193904876709, "global_step": 154573, "epoch": 1862} {"train_loss": -23.297216415405273, "global_step": 154574, "epoch": 1862} {"train_loss": -23.17771339416504, "global_step": 154575, "epoch": 1862} {"train_loss": -23.515317916870117, "global_step": 154576, "epoch": 1862} {"train_loss": -22.9269962310791, "global_step": 154577, "epoch": 1862} {"train_loss": -23.152408599853516, "global_step": 154578, "epoch": 1862} {"train_loss": -23.432758331298828, "global_step": 154579, "epoch": 1862} {"train_loss": -23.390127182006836, "global_step": 154580, "epoch": 1862} {"train_loss": -23.264474868774414, "global_step": 154581, "epoch": 1862} {"train_loss": -23.350860595703125, "global_step": 154582, "epoch": 1862} {"train_loss": -23.310016632080078, "global_step": 154583, "epoch": 1862} {"train_loss": -23.554702758789062, "global_step": 154584, "epoch": 1862} {"train_loss": -23.40744400024414, "global_step": 154585, "epoch": 1862} {"train_loss": -23.50617027282715, "global_step": 154586, "epoch": 1862} {"train_loss": -23.41581916809082, "global_step": 154587, "epoch": 1862} {"train_loss": -23.4185848236084, "global_step": 154588, "epoch": 1862} {"train_loss": -23.54323387145996, "global_step": 154589, "epoch": 1862} {"train_loss": -23.65892219543457, "global_step": 154590, "epoch": 1862} {"train_loss": -23.383441925048828, "global_step": 154591, "epoch": 1862} {"train_loss": -23.423612594604492, "global_step": 154592, "epoch": 1862} {"train_loss": -23.188865661621094, "global_step": 154593, "epoch": 1862} {"train_loss": -23.378437042236328, "global_step": 154594, "epoch": 1862} {"train_loss": -23.11939811706543, "global_step": 154595, "epoch": 1862} {"train_loss": -23.800405502319336, "global_step": 154596, "epoch": 1862} {"train_loss": -23.35209083557129, "global_step": 154597, "epoch": 1862} {"train_loss": -23.321386337280273, "global_step": 154598, "epoch": 1862} {"train_loss": -23.347326278686523, "global_step": 154599, "epoch": 1862} {"train_loss": -23.562414169311523, "global_step": 154600, "epoch": 1862} {"train_loss": -23.39896583557129, "global_step": 154601, "epoch": 1862} {"train_loss": -23.351425170898438, "global_step": 154602, "epoch": 1862} {"train_loss": -23.36976432800293, "global_step": 154603, "epoch": 1862} {"train_loss": -23.430347442626953, "global_step": 154604, "epoch": 1862} {"train_loss": -23.174091339111328, "global_step": 154605, "epoch": 1862} {"train_loss": -23.084455490112305, "global_step": 154606, "epoch": 1862} {"train_loss": -23.173538208007812, "global_step": 154607, "epoch": 1862} {"train_loss": -23.44681739807129, "global_step": 154608, "epoch": 1862} {"train_loss": -23.254592895507812, "global_step": 154609, "epoch": 1862} {"train_loss": -23.223617553710938, "global_step": 154610, "epoch": 1862} {"train_loss": -23.034570693969727, "global_step": 154611, "epoch": 1862} {"train_loss": -23.230777740478516, "global_step": 154612, "epoch": 1862} {"train_loss": -23.279476165771484, "global_step": 154613, "epoch": 1862} {"train_loss": -22.837800979614258, "global_step": 154614, "epoch": 1862} {"train_loss": -23.135190963745117, "global_step": 154615, "epoch": 1862} {"train_loss": -23.22706413269043, "global_step": 154616, "epoch": 1862} {"train_loss": -23.030561447143555, "global_step": 154617, "epoch": 1862} {"train_loss": -23.226093292236328, "global_step": 154618, "epoch": 1862} {"train_loss": -22.966419219970703, "global_step": 154619, "epoch": 1862} {"train_loss": -23.403406143188477, "global_step": 154620, "epoch": 1862} {"train_loss": -23.21089744567871, "global_step": 154621, "epoch": 1862} {"train_loss": -23.312009811401367, "global_step": 154622, "epoch": 1862} {"train_loss": -23.335596084594727, "global_step": 154623, "epoch": 1862} {"train_loss": -22.885278701782227, "global_step": 154624, "epoch": 1862} {"train_loss": -23.227264404296875, "global_step": 154625, "epoch": 1862} {"train_loss": -23.23713493347168, "global_step": 154626, "epoch": 1862} {"train_loss": -23.159793853759766, "global_step": 154627, "epoch": 1862} {"train_loss": -23.29032969187541, "global_step": 154628, "epoch": 1862, "val_loss": 6343220.0} {"train_loss": -22.728168487548828, "global_step": 154629, "epoch": 1863} {"train_loss": -23.536373138427734, "global_step": 154630, "epoch": 1863} {"train_loss": -22.936107635498047, "global_step": 154631, "epoch": 1863} {"train_loss": -22.805997848510742, "global_step": 154632, "epoch": 1863} {"train_loss": -23.342639923095703, "global_step": 154633, "epoch": 1863} {"train_loss": -22.495107650756836, "global_step": 154634, "epoch": 1863} {"train_loss": -23.171512603759766, "global_step": 154635, "epoch": 1863} {"train_loss": -22.68160057067871, "global_step": 154636, "epoch": 1863} {"train_loss": -23.136260986328125, "global_step": 154637, "epoch": 1863} {"train_loss": -22.97355842590332, "global_step": 154638, "epoch": 1863} {"train_loss": -23.10319709777832, "global_step": 154639, "epoch": 1863} {"train_loss": -22.92234992980957, "global_step": 154640, "epoch": 1863} {"train_loss": -22.87664031982422, "global_step": 154641, "epoch": 1863} {"train_loss": -23.50252342224121, "global_step": 154642, "epoch": 1863} {"train_loss": -22.96811866760254, "global_step": 154643, "epoch": 1863} {"train_loss": -22.801862716674805, "global_step": 154644, "epoch": 1863} {"train_loss": -23.416763305664062, "global_step": 154645, "epoch": 1863} {"train_loss": -22.94124412536621, "global_step": 154646, "epoch": 1863} {"train_loss": -23.05135154724121, "global_step": 154647, "epoch": 1863} {"train_loss": -22.803022384643555, "global_step": 154648, "epoch": 1863} {"train_loss": -23.102798461914062, "global_step": 154649, "epoch": 1863} {"train_loss": -23.157258987426758, "global_step": 154650, "epoch": 1863} {"train_loss": -22.907852172851562, "global_step": 154651, "epoch": 1863} {"train_loss": -23.110017776489258, "global_step": 154652, "epoch": 1863} {"train_loss": -23.21732521057129, "global_step": 154653, "epoch": 1863} {"train_loss": -23.125965118408203, "global_step": 154654, "epoch": 1863} {"train_loss": -23.273271560668945, "global_step": 154655, "epoch": 1863} {"train_loss": -23.40305519104004, "global_step": 154656, "epoch": 1863} {"train_loss": -23.4051513671875, "global_step": 154657, "epoch": 1863} {"train_loss": -23.223678588867188, "global_step": 154658, "epoch": 1863} {"train_loss": -23.33393669128418, "global_step": 154659, "epoch": 1863} {"train_loss": -23.63534927368164, "global_step": 154660, "epoch": 1863} {"train_loss": -23.26531219482422, "global_step": 154661, "epoch": 1863} {"train_loss": -23.23219871520996, "global_step": 154662, "epoch": 1863} {"train_loss": -23.27374267578125, "global_step": 154663, "epoch": 1863} {"train_loss": -23.191341400146484, "global_step": 154664, "epoch": 1863} {"train_loss": -23.19552993774414, "global_step": 154665, "epoch": 1863} {"train_loss": -23.184261322021484, "global_step": 154666, "epoch": 1863} {"train_loss": -23.730810165405273, "global_step": 154667, "epoch": 1863} {"train_loss": -23.10028648376465, "global_step": 154668, "epoch": 1863} {"train_loss": -23.54605484008789, "global_step": 154669, "epoch": 1863} {"train_loss": -23.264720916748047, "global_step": 154670, "epoch": 1863} {"train_loss": -23.308317184448242, "global_step": 154671, "epoch": 1863} {"train_loss": -22.962953567504883, "global_step": 154672, "epoch": 1863} {"train_loss": -23.637901306152344, "global_step": 154673, "epoch": 1863} {"train_loss": -23.589599609375, "global_step": 154674, "epoch": 1863} {"train_loss": -23.483766555786133, "global_step": 154675, "epoch": 1863} {"train_loss": -23.50146484375, "global_step": 154676, "epoch": 1863} {"train_loss": -24.1807804107666, "global_step": 154677, "epoch": 1863} {"train_loss": -23.303373336791992, "global_step": 154678, "epoch": 1863} {"train_loss": -23.287734985351562, "global_step": 154679, "epoch": 1863} {"train_loss": -23.56878089904785, "global_step": 154680, "epoch": 1863} {"train_loss": -23.611549377441406, "global_step": 154681, "epoch": 1863} {"train_loss": -23.628530502319336, "global_step": 154682, "epoch": 1863} {"train_loss": -23.172391891479492, "global_step": 154683, "epoch": 1863} {"train_loss": -23.460908889770508, "global_step": 154684, "epoch": 1863} {"train_loss": -23.163108825683594, "global_step": 154685, "epoch": 1863} {"train_loss": -23.315454483032227, "global_step": 154686, "epoch": 1863} {"train_loss": -23.160017013549805, "global_step": 154687, "epoch": 1863} {"train_loss": -23.276840209960938, "global_step": 154688, "epoch": 1863} {"train_loss": -23.144493103027344, "global_step": 154689, "epoch": 1863} {"train_loss": -23.49064064025879, "global_step": 154690, "epoch": 1863} {"train_loss": -23.771303176879883, "global_step": 154691, "epoch": 1863} {"train_loss": -23.283132553100586, "global_step": 154692, "epoch": 1863} {"train_loss": -23.333478927612305, "global_step": 154693, "epoch": 1863} {"train_loss": -23.610998153686523, "global_step": 154694, "epoch": 1863} {"train_loss": -23.799091339111328, "global_step": 154695, "epoch": 1863} {"train_loss": -23.432947158813477, "global_step": 154696, "epoch": 1863} {"train_loss": -23.204702377319336, "global_step": 154697, "epoch": 1863} {"train_loss": -23.300771713256836, "global_step": 154698, "epoch": 1863} {"train_loss": -23.391942977905273, "global_step": 154699, "epoch": 1863} {"train_loss": -23.57258415222168, "global_step": 154700, "epoch": 1863} {"train_loss": -23.83493995666504, "global_step": 154701, "epoch": 1863} {"train_loss": -23.493589401245117, "global_step": 154702, "epoch": 1863} {"train_loss": -23.623828887939453, "global_step": 154703, "epoch": 1863} {"train_loss": -23.153940200805664, "global_step": 154704, "epoch": 1863} {"train_loss": -23.221378326416016, "global_step": 154705, "epoch": 1863} {"train_loss": -22.86574363708496, "global_step": 154706, "epoch": 1863} {"train_loss": -23.299711227416992, "global_step": 154707, "epoch": 1863} {"train_loss": -23.11946678161621, "global_step": 154708, "epoch": 1863} {"train_loss": -23.447513580322266, "global_step": 154709, "epoch": 1863} {"train_loss": -23.44169044494629, "global_step": 154710, "epoch": 1863} {"train_loss": -23.262345762137908, "global_step": 154711, "epoch": 1863, "val_loss": 6373856.5} {"train_loss": -22.34248161315918, "global_step": 154712, "epoch": 1864} {"train_loss": -23.08098793029785, "global_step": 154713, "epoch": 1864} {"train_loss": -22.315265655517578, "global_step": 154714, "epoch": 1864} {"train_loss": -22.697099685668945, "global_step": 154715, "epoch": 1864} {"train_loss": -22.812847137451172, "global_step": 154716, "epoch": 1864} {"train_loss": -22.6818790435791, "global_step": 154717, "epoch": 1864} {"train_loss": -23.07295036315918, "global_step": 154718, "epoch": 1864} {"train_loss": -22.824920654296875, "global_step": 154719, "epoch": 1864} {"train_loss": -22.6143741607666, "global_step": 154720, "epoch": 1864} {"train_loss": -22.757720947265625, "global_step": 154721, "epoch": 1864} {"train_loss": -22.75408363342285, "global_step": 154722, "epoch": 1864} {"train_loss": -23.174036026000977, "global_step": 154723, "epoch": 1864} {"train_loss": -22.8138484954834, "global_step": 154724, "epoch": 1864} {"train_loss": -22.9028377532959, "global_step": 154725, "epoch": 1864} {"train_loss": -23.16554832458496, "global_step": 154726, "epoch": 1864} {"train_loss": -23.10013771057129, "global_step": 154727, "epoch": 1864} {"train_loss": -22.89064598083496, "global_step": 154728, "epoch": 1864} {"train_loss": -23.0747127532959, "global_step": 154729, "epoch": 1864} {"train_loss": -22.802127838134766, "global_step": 154730, "epoch": 1864} {"train_loss": -22.99296760559082, "global_step": 154731, "epoch": 1864} {"train_loss": -23.148723602294922, "global_step": 154732, "epoch": 1864} {"train_loss": -22.999603271484375, "global_step": 154733, "epoch": 1864} {"train_loss": -23.222854614257812, "global_step": 154734, "epoch": 1864} {"train_loss": -23.225255966186523, "global_step": 154735, "epoch": 1864} {"train_loss": -23.234329223632812, "global_step": 154736, "epoch": 1864} {"train_loss": -23.285146713256836, "global_step": 154737, "epoch": 1864} {"train_loss": -23.24561882019043, "global_step": 154738, "epoch": 1864} {"train_loss": -23.199710845947266, "global_step": 154739, "epoch": 1864} {"train_loss": -23.338546752929688, "global_step": 154740, "epoch": 1864} {"train_loss": -23.489547729492188, "global_step": 154741, "epoch": 1864} {"train_loss": -23.329206466674805, "global_step": 154742, "epoch": 1864} {"train_loss": -23.19025230407715, "global_step": 154743, "epoch": 1864} {"train_loss": -23.27509880065918, "global_step": 154744, "epoch": 1864} {"train_loss": -23.326448440551758, "global_step": 154745, "epoch": 1864} {"train_loss": -23.356155395507812, "global_step": 154746, "epoch": 1864} {"train_loss": -23.4915771484375, "global_step": 154747, "epoch": 1864} {"train_loss": -23.377777099609375, "global_step": 154748, "epoch": 1864} {"train_loss": -23.398462295532227, "global_step": 154749, "epoch": 1864} {"train_loss": -23.528757095336914, "global_step": 154750, "epoch": 1864} {"train_loss": -22.958337783813477, "global_step": 154751, "epoch": 1864} {"train_loss": -23.234827041625977, "global_step": 154752, "epoch": 1864} {"train_loss": -23.312307357788086, "global_step": 154753, "epoch": 1864} {"train_loss": -23.233007431030273, "global_step": 154754, "epoch": 1864} {"train_loss": -22.88421058654785, "global_step": 154755, "epoch": 1864} {"train_loss": -23.353450775146484, "global_step": 154756, "epoch": 1864} {"train_loss": -23.301090240478516, "global_step": 154757, "epoch": 1864} {"train_loss": -22.922550201416016, "global_step": 154758, "epoch": 1864} {"train_loss": -23.377431869506836, "global_step": 154759, "epoch": 1864} {"train_loss": -23.037260055541992, "global_step": 154760, "epoch": 1864} {"train_loss": -23.279165267944336, "global_step": 154761, "epoch": 1864} {"train_loss": -23.238065719604492, "global_step": 154762, "epoch": 1864} {"train_loss": -23.45851707458496, "global_step": 154763, "epoch": 1864} {"train_loss": -23.213003158569336, "global_step": 154764, "epoch": 1864} {"train_loss": -23.61878204345703, "global_step": 154765, "epoch": 1864} {"train_loss": -23.54941749572754, "global_step": 154766, "epoch": 1864} {"train_loss": -23.31564712524414, "global_step": 154767, "epoch": 1864} {"train_loss": -23.341724395751953, "global_step": 154768, "epoch": 1864} {"train_loss": -23.234699249267578, "global_step": 154769, "epoch": 1864} {"train_loss": -23.408761978149414, "global_step": 154770, "epoch": 1864} {"train_loss": -23.381534576416016, "global_step": 154771, "epoch": 1864} {"train_loss": -23.337520599365234, "global_step": 154772, "epoch": 1864} {"train_loss": -23.30452537536621, "global_step": 154773, "epoch": 1864} {"train_loss": -23.427099227905273, "global_step": 154774, "epoch": 1864} {"train_loss": -23.334768295288086, "global_step": 154775, "epoch": 1864} {"train_loss": -23.249204635620117, "global_step": 154776, "epoch": 1864} {"train_loss": -23.55352783203125, "global_step": 154777, "epoch": 1864} {"train_loss": -23.11551284790039, "global_step": 154778, "epoch": 1864} {"train_loss": -23.359811782836914, "global_step": 154779, "epoch": 1864} {"train_loss": -23.143478393554688, "global_step": 154780, "epoch": 1864} {"train_loss": -23.683198928833008, "global_step": 154781, "epoch": 1864} {"train_loss": -23.27091407775879, "global_step": 154782, "epoch": 1864} {"train_loss": -23.57411003112793, "global_step": 154783, "epoch": 1864} {"train_loss": -23.330371856689453, "global_step": 154784, "epoch": 1864} {"train_loss": -23.135190963745117, "global_step": 154785, "epoch": 1864} {"train_loss": -23.30866241455078, "global_step": 154786, "epoch": 1864} {"train_loss": -23.669883728027344, "global_step": 154787, "epoch": 1864} {"train_loss": -23.1783390045166, "global_step": 154788, "epoch": 1864} {"train_loss": -23.432592391967773, "global_step": 154789, "epoch": 1864} {"train_loss": -23.59079360961914, "global_step": 154790, "epoch": 1864} {"train_loss": -23.335599899291992, "global_step": 154791, "epoch": 1864} {"train_loss": -23.1182861328125, "global_step": 154792, "epoch": 1864} {"train_loss": -23.279020309448242, "global_step": 154793, "epoch": 1864} {"train_loss": -23.21524973949754, "global_step": 154794, "epoch": 1864, "val_loss": 6482160.0} {"train_loss": -21.967493057250977, "global_step": 154795, "epoch": 1865} {"train_loss": -22.67637825012207, "global_step": 154796, "epoch": 1865} {"train_loss": -22.940460205078125, "global_step": 154797, "epoch": 1865} {"train_loss": -21.562734603881836, "global_step": 154798, "epoch": 1865} {"train_loss": -22.867446899414062, "global_step": 154799, "epoch": 1865} {"train_loss": -22.741125106811523, "global_step": 154800, "epoch": 1865} {"train_loss": -22.50779914855957, "global_step": 154801, "epoch": 1865} {"train_loss": -22.988868713378906, "global_step": 154802, "epoch": 1865} {"train_loss": -22.56416893005371, "global_step": 154803, "epoch": 1865} {"train_loss": -22.58123016357422, "global_step": 154804, "epoch": 1865} {"train_loss": -22.58521842956543, "global_step": 154805, "epoch": 1865} {"train_loss": -22.801713943481445, "global_step": 154806, "epoch": 1865} {"train_loss": -22.619413375854492, "global_step": 154807, "epoch": 1865} {"train_loss": -22.80906105041504, "global_step": 154808, "epoch": 1865} {"train_loss": -22.852664947509766, "global_step": 154809, "epoch": 1865} {"train_loss": -23.004758834838867, "global_step": 154810, "epoch": 1865} {"train_loss": -22.885555267333984, "global_step": 154811, "epoch": 1865} {"train_loss": -22.971403121948242, "global_step": 154812, "epoch": 1865} {"train_loss": -22.96821403503418, "global_step": 154813, "epoch": 1865} {"train_loss": -22.8974552154541, "global_step": 154814, "epoch": 1865} {"train_loss": -23.207046508789062, "global_step": 154815, "epoch": 1865} {"train_loss": -22.94093894958496, "global_step": 154816, "epoch": 1865} {"train_loss": -23.264493942260742, "global_step": 154817, "epoch": 1865} {"train_loss": -23.1859188079834, "global_step": 154818, "epoch": 1865} {"train_loss": -23.447538375854492, "global_step": 154819, "epoch": 1865} {"train_loss": -23.171592712402344, "global_step": 154820, "epoch": 1865} {"train_loss": -22.893720626831055, "global_step": 154821, "epoch": 1865} {"train_loss": -23.10175132751465, "global_step": 154822, "epoch": 1865} {"train_loss": -23.392608642578125, "global_step": 154823, "epoch": 1865} {"train_loss": -23.355667114257812, "global_step": 154824, "epoch": 1865} {"train_loss": -23.287084579467773, "global_step": 154825, "epoch": 1865} {"train_loss": -23.547060012817383, "global_step": 154826, "epoch": 1865} {"train_loss": -23.390233993530273, "global_step": 154827, "epoch": 1865} {"train_loss": -23.3369197845459, "global_step": 154828, "epoch": 1865} {"train_loss": -23.494491577148438, "global_step": 154829, "epoch": 1865} {"train_loss": -23.444366455078125, "global_step": 154830, "epoch": 1865} {"train_loss": -23.450796127319336, "global_step": 154831, "epoch": 1865} {"train_loss": -23.82265853881836, "global_step": 154832, "epoch": 1865} {"train_loss": -23.53937339782715, "global_step": 154833, "epoch": 1865} {"train_loss": -23.320688247680664, "global_step": 154834, "epoch": 1865} {"train_loss": -23.585216522216797, "global_step": 154835, "epoch": 1865} {"train_loss": -23.662216186523438, "global_step": 154836, "epoch": 1865} {"train_loss": -23.39162254333496, "global_step": 154837, "epoch": 1865} {"train_loss": -23.47032356262207, "global_step": 154838, "epoch": 1865} {"train_loss": -23.060890197753906, "global_step": 154839, "epoch": 1865} {"train_loss": -23.670747756958008, "global_step": 154840, "epoch": 1865} {"train_loss": -23.409351348876953, "global_step": 154841, "epoch": 1865} {"train_loss": -23.411279678344727, "global_step": 154842, "epoch": 1865} {"train_loss": -23.46800994873047, "global_step": 154843, "epoch": 1865} {"train_loss": -23.42131996154785, "global_step": 154844, "epoch": 1865} {"train_loss": -23.191875457763672, "global_step": 154845, "epoch": 1865} {"train_loss": -23.36638832092285, "global_step": 154846, "epoch": 1865} {"train_loss": -23.630577087402344, "global_step": 154847, "epoch": 1865} {"train_loss": -23.095077514648438, "global_step": 154848, "epoch": 1865} {"train_loss": -23.107412338256836, "global_step": 154849, "epoch": 1865} {"train_loss": -23.596054077148438, "global_step": 154850, "epoch": 1865} {"train_loss": -23.51136589050293, "global_step": 154851, "epoch": 1865} {"train_loss": -23.167781829833984, "global_step": 154852, "epoch": 1865} {"train_loss": -23.38556671142578, "global_step": 154853, "epoch": 1865} {"train_loss": -23.58953857421875, "global_step": 154854, "epoch": 1865} {"train_loss": -23.532934188842773, "global_step": 154855, "epoch": 1865} {"train_loss": -23.330493927001953, "global_step": 154856, "epoch": 1865} {"train_loss": -22.94635009765625, "global_step": 154857, "epoch": 1865} {"train_loss": -23.1124324798584, "global_step": 154858, "epoch": 1865} {"train_loss": -23.075435638427734, "global_step": 154859, "epoch": 1865} {"train_loss": -23.264707565307617, "global_step": 154860, "epoch": 1865} {"train_loss": -23.584684371948242, "global_step": 154861, "epoch": 1865} {"train_loss": -23.384836196899414, "global_step": 154862, "epoch": 1865} {"train_loss": -23.101795196533203, "global_step": 154863, "epoch": 1865} {"train_loss": -23.18208885192871, "global_step": 154864, "epoch": 1865} {"train_loss": -23.39219093322754, "global_step": 154865, "epoch": 1865} {"train_loss": -23.077795028686523, "global_step": 154866, "epoch": 1865} {"train_loss": -22.594757080078125, "global_step": 154867, "epoch": 1865} {"train_loss": -23.49726676940918, "global_step": 154868, "epoch": 1865} {"train_loss": -23.505643844604492, "global_step": 154869, "epoch": 1865} {"train_loss": -23.24163818359375, "global_step": 154870, "epoch": 1865} {"train_loss": -22.9344539642334, "global_step": 154871, "epoch": 1865} {"train_loss": -22.912351608276367, "global_step": 154872, "epoch": 1865} {"train_loss": -23.237451553344727, "global_step": 154873, "epoch": 1865} {"train_loss": -23.426420211791992, "global_step": 154874, "epoch": 1865} {"train_loss": -23.072673797607422, "global_step": 154875, "epoch": 1865} {"train_loss": -23.356403350830078, "global_step": 154876, "epoch": 1865} {"train_loss": -23.165219042674604, "global_step": 154877, "epoch": 1865, "val_loss": 6374360.5} {"train_loss": -23.171533584594727, "global_step": 154878, "epoch": 1866} {"train_loss": -23.16513442993164, "global_step": 154879, "epoch": 1866} {"train_loss": -23.378704071044922, "global_step": 154880, "epoch": 1866} {"train_loss": -23.026941299438477, "global_step": 154881, "epoch": 1866} {"train_loss": -22.502750396728516, "global_step": 154882, "epoch": 1866} {"train_loss": -22.85077476501465, "global_step": 154883, "epoch": 1866} {"train_loss": -23.03386878967285, "global_step": 154884, "epoch": 1866} {"train_loss": -23.24837303161621, "global_step": 154885, "epoch": 1866} {"train_loss": -23.23909568786621, "global_step": 154886, "epoch": 1866} {"train_loss": -23.15496826171875, "global_step": 154887, "epoch": 1866} {"train_loss": -23.464061737060547, "global_step": 154888, "epoch": 1866} {"train_loss": -23.17020606994629, "global_step": 154889, "epoch": 1866} {"train_loss": -22.805021286010742, "global_step": 154890, "epoch": 1866} {"train_loss": -23.229948043823242, "global_step": 154891, "epoch": 1866} {"train_loss": -23.178808212280273, "global_step": 154892, "epoch": 1866} {"train_loss": -23.036401748657227, "global_step": 154893, "epoch": 1866} {"train_loss": -23.176984786987305, "global_step": 154894, "epoch": 1866} {"train_loss": -23.398229598999023, "global_step": 154895, "epoch": 1866} {"train_loss": -23.493701934814453, "global_step": 154896, "epoch": 1866} {"train_loss": -23.25482177734375, "global_step": 154897, "epoch": 1866} {"train_loss": -23.17535972595215, "global_step": 154898, "epoch": 1866} {"train_loss": -23.399463653564453, "global_step": 154899, "epoch": 1866} {"train_loss": -23.319875717163086, "global_step": 154900, "epoch": 1866} {"train_loss": -23.39456558227539, "global_step": 154901, "epoch": 1866} {"train_loss": -23.279348373413086, "global_step": 154902, "epoch": 1866} {"train_loss": -23.72182273864746, "global_step": 154903, "epoch": 1866} {"train_loss": -23.602567672729492, "global_step": 154904, "epoch": 1866} {"train_loss": -23.632762908935547, "global_step": 154905, "epoch": 1866} {"train_loss": -23.217086791992188, "global_step": 154906, "epoch": 1866} {"train_loss": -23.31766700744629, "global_step": 154907, "epoch": 1866} {"train_loss": -23.563724517822266, "global_step": 154908, "epoch": 1866} {"train_loss": -23.393051147460938, "global_step": 154909, "epoch": 1866} {"train_loss": -23.09218406677246, "global_step": 154910, "epoch": 1866} {"train_loss": -23.26434326171875, "global_step": 154911, "epoch": 1866} {"train_loss": -23.591930389404297, "global_step": 154912, "epoch": 1866} {"train_loss": -23.342649459838867, "global_step": 154913, "epoch": 1866} {"train_loss": -23.40640640258789, "global_step": 154914, "epoch": 1866} {"train_loss": -23.468351364135742, "global_step": 154915, "epoch": 1866} {"train_loss": -23.454391479492188, "global_step": 154916, "epoch": 1866} {"train_loss": -23.33174705505371, "global_step": 154917, "epoch": 1866} {"train_loss": -23.41470718383789, "global_step": 154918, "epoch": 1866} {"train_loss": -23.68159294128418, "global_step": 154919, "epoch": 1866} {"train_loss": -23.333600997924805, "global_step": 154920, "epoch": 1866} {"train_loss": -23.781265258789062, "global_step": 154921, "epoch": 1866} {"train_loss": -23.61195182800293, "global_step": 154922, "epoch": 1866} {"train_loss": -23.39436149597168, "global_step": 154923, "epoch": 1866} {"train_loss": -24.010713577270508, "global_step": 154924, "epoch": 1866} {"train_loss": -23.65988540649414, "global_step": 154925, "epoch": 1866} {"train_loss": -23.738332748413086, "global_step": 154926, "epoch": 1866} {"train_loss": -23.66824722290039, "global_step": 154927, "epoch": 1866} {"train_loss": -23.395828247070312, "global_step": 154928, "epoch": 1866} {"train_loss": -23.29966926574707, "global_step": 154929, "epoch": 1866} {"train_loss": -23.27393913269043, "global_step": 154930, "epoch": 1866} {"train_loss": -23.535722732543945, "global_step": 154931, "epoch": 1866} {"train_loss": -23.42060661315918, "global_step": 154932, "epoch": 1866} {"train_loss": -23.566801071166992, "global_step": 154933, "epoch": 1866} {"train_loss": -23.23761749267578, "global_step": 154934, "epoch": 1866} {"train_loss": -23.368072509765625, "global_step": 154935, "epoch": 1866} {"train_loss": -23.356138229370117, "global_step": 154936, "epoch": 1866} {"train_loss": -23.71870231628418, "global_step": 154937, "epoch": 1866} {"train_loss": -23.645389556884766, "global_step": 154938, "epoch": 1866} {"train_loss": -23.323583602905273, "global_step": 154939, "epoch": 1866} {"train_loss": -23.268354415893555, "global_step": 154940, "epoch": 1866} {"train_loss": -23.155508041381836, "global_step": 154941, "epoch": 1866} {"train_loss": -23.4134578704834, "global_step": 154942, "epoch": 1866} {"train_loss": -23.29920768737793, "global_step": 154943, "epoch": 1866} {"train_loss": -23.33863067626953, "global_step": 154944, "epoch": 1866} {"train_loss": -23.73600196838379, "global_step": 154945, "epoch": 1866} {"train_loss": -23.38923454284668, "global_step": 154946, "epoch": 1866} {"train_loss": -23.249069213867188, "global_step": 154947, "epoch": 1866} {"train_loss": -23.374557495117188, "global_step": 154948, "epoch": 1866} {"train_loss": -22.978132247924805, "global_step": 154949, "epoch": 1866} {"train_loss": -23.3541202545166, "global_step": 154950, "epoch": 1866} {"train_loss": -23.34562110900879, "global_step": 154951, "epoch": 1866} {"train_loss": -23.283700942993164, "global_step": 154952, "epoch": 1866} {"train_loss": -23.526105880737305, "global_step": 154953, "epoch": 1866} {"train_loss": -23.409948348999023, "global_step": 154954, "epoch": 1866} {"train_loss": -23.38286781311035, "global_step": 154955, "epoch": 1866} {"train_loss": -23.34193229675293, "global_step": 154956, "epoch": 1866} {"train_loss": -23.547590255737305, "global_step": 154957, "epoch": 1866} {"train_loss": -23.027572631835938, "global_step": 154958, "epoch": 1866} {"train_loss": -23.092002868652344, "global_step": 154959, "epoch": 1866} {"train_loss": -23.366408359573548, "global_step": 154960, "epoch": 1866, "val_loss": 6318646.5} {"train_loss": -22.878814697265625, "global_step": 154961, "epoch": 1867} {"train_loss": -21.754810333251953, "global_step": 154962, "epoch": 1867} {"train_loss": -22.604473114013672, "global_step": 154963, "epoch": 1867} {"train_loss": -22.1156063079834, "global_step": 154964, "epoch": 1867} {"train_loss": -22.714252471923828, "global_step": 154965, "epoch": 1867} {"train_loss": -22.37942886352539, "global_step": 154966, "epoch": 1867} {"train_loss": -22.611534118652344, "global_step": 154967, "epoch": 1867} {"train_loss": -22.688413619995117, "global_step": 154968, "epoch": 1867} {"train_loss": -23.027204513549805, "global_step": 154969, "epoch": 1867} {"train_loss": -22.819156646728516, "global_step": 154970, "epoch": 1867} {"train_loss": -23.247024536132812, "global_step": 154971, "epoch": 1867} {"train_loss": -22.590166091918945, "global_step": 154972, "epoch": 1867} {"train_loss": -22.999479293823242, "global_step": 154973, "epoch": 1867} {"train_loss": -22.852201461791992, "global_step": 154974, "epoch": 1867} {"train_loss": -22.527481079101562, "global_step": 154975, "epoch": 1867} {"train_loss": -22.950769424438477, "global_step": 154976, "epoch": 1867} {"train_loss": -22.63824462890625, "global_step": 154977, "epoch": 1867} {"train_loss": -23.024311065673828, "global_step": 154978, "epoch": 1867} {"train_loss": -23.072599411010742, "global_step": 154979, "epoch": 1867} {"train_loss": -23.36016845703125, "global_step": 154980, "epoch": 1867} {"train_loss": -23.25642204284668, "global_step": 154981, "epoch": 1867} {"train_loss": -22.850183486938477, "global_step": 154982, "epoch": 1867} {"train_loss": -22.819482803344727, "global_step": 154983, "epoch": 1867} {"train_loss": -23.207033157348633, "global_step": 154984, "epoch": 1867} {"train_loss": -23.048810958862305, "global_step": 154985, "epoch": 1867} {"train_loss": -23.10866355895996, "global_step": 154986, "epoch": 1867} {"train_loss": -23.120426177978516, "global_step": 154987, "epoch": 1867} {"train_loss": -22.976552963256836, "global_step": 154988, "epoch": 1867} {"train_loss": -23.01980972290039, "global_step": 154989, "epoch": 1867} {"train_loss": -23.252058029174805, "global_step": 154990, "epoch": 1867} {"train_loss": -23.474685668945312, "global_step": 154991, "epoch": 1867} {"train_loss": -23.269739151000977, "global_step": 154992, "epoch": 1867} {"train_loss": -23.50657844543457, "global_step": 154993, "epoch": 1867} {"train_loss": -22.96016502380371, "global_step": 154994, "epoch": 1867} {"train_loss": -23.037961959838867, "global_step": 154995, "epoch": 1867} {"train_loss": -22.994300842285156, "global_step": 154996, "epoch": 1867} {"train_loss": -22.928176879882812, "global_step": 154997, "epoch": 1867} {"train_loss": -23.103551864624023, "global_step": 154998, "epoch": 1867} {"train_loss": -23.424110412597656, "global_step": 154999, "epoch": 1867} {"train_loss": -23.33282470703125, "global_step": 155000, "epoch": 1867} {"train_loss": -22.869348526000977, "global_step": 155001, "epoch": 1867} {"train_loss": -23.741697311401367, "global_step": 155002, "epoch": 1867} {"train_loss": -23.192119598388672, "global_step": 155003, "epoch": 1867} {"train_loss": -23.574172973632812, "global_step": 155004, "epoch": 1867} {"train_loss": -23.280426025390625, "global_step": 155005, "epoch": 1867} {"train_loss": -23.18368911743164, "global_step": 155006, "epoch": 1867} {"train_loss": -23.616962432861328, "global_step": 155007, "epoch": 1867} {"train_loss": -23.460491180419922, "global_step": 155008, "epoch": 1867} {"train_loss": -23.17359733581543, "global_step": 155009, "epoch": 1867} {"train_loss": -23.546009063720703, "global_step": 155010, "epoch": 1867} {"train_loss": -23.39192008972168, "global_step": 155011, "epoch": 1867} {"train_loss": -23.562911987304688, "global_step": 155012, "epoch": 1867} {"train_loss": -23.676279067993164, "global_step": 155013, "epoch": 1867} {"train_loss": -23.32405662536621, "global_step": 155014, "epoch": 1867} {"train_loss": -23.540014266967773, "global_step": 155015, "epoch": 1867} {"train_loss": -23.43868064880371, "global_step": 155016, "epoch": 1867} {"train_loss": -23.129316329956055, "global_step": 155017, "epoch": 1867} {"train_loss": -23.443552017211914, "global_step": 155018, "epoch": 1867} {"train_loss": -23.40622329711914, "global_step": 155019, "epoch": 1867} {"train_loss": -23.149412155151367, "global_step": 155020, "epoch": 1867} {"train_loss": -23.44026756286621, "global_step": 155021, "epoch": 1867} {"train_loss": -23.611764907836914, "global_step": 155022, "epoch": 1867} {"train_loss": -23.255393981933594, "global_step": 155023, "epoch": 1867} {"train_loss": -23.750608444213867, "global_step": 155024, "epoch": 1867} {"train_loss": -23.421295166015625, "global_step": 155025, "epoch": 1867} {"train_loss": -23.192306518554688, "global_step": 155026, "epoch": 1867} {"train_loss": -23.0647029876709, "global_step": 155027, "epoch": 1867} {"train_loss": -23.62784194946289, "global_step": 155028, "epoch": 1867} {"train_loss": -23.53544044494629, "global_step": 155029, "epoch": 1867} {"train_loss": -23.060089111328125, "global_step": 155030, "epoch": 1867} {"train_loss": -22.946847915649414, "global_step": 155031, "epoch": 1867} {"train_loss": -23.569992065429688, "global_step": 155032, "epoch": 1867} {"train_loss": -23.14410400390625, "global_step": 155033, "epoch": 1867} {"train_loss": -23.3140869140625, "global_step": 155034, "epoch": 1867} {"train_loss": -23.532852172851562, "global_step": 155035, "epoch": 1867} {"train_loss": -23.709197998046875, "global_step": 155036, "epoch": 1867} {"train_loss": -23.65335464477539, "global_step": 155037, "epoch": 1867} {"train_loss": -23.47540283203125, "global_step": 155038, "epoch": 1867} {"train_loss": -23.45589828491211, "global_step": 155039, "epoch": 1867} {"train_loss": -23.182870864868164, "global_step": 155040, "epoch": 1867} {"train_loss": -23.516084671020508, "global_step": 155041, "epoch": 1867} {"train_loss": -23.473661422729492, "global_step": 155042, "epoch": 1867} {"train_loss": -23.200569198792238, "global_step": 155043, "epoch": 1867, "val_loss": 6331644.5} {"train_loss": -23.50909423828125, "global_step": 155044, "epoch": 1868} {"train_loss": -23.299352645874023, "global_step": 155045, "epoch": 1868} {"train_loss": -23.838411331176758, "global_step": 155046, "epoch": 1868} {"train_loss": -23.18902587890625, "global_step": 155047, "epoch": 1868} {"train_loss": -23.15709114074707, "global_step": 155048, "epoch": 1868} {"train_loss": -23.59486198425293, "global_step": 155049, "epoch": 1868} {"train_loss": -23.198200225830078, "global_step": 155050, "epoch": 1868} {"train_loss": -23.28120994567871, "global_step": 155051, "epoch": 1868} {"train_loss": -23.088455200195312, "global_step": 155052, "epoch": 1868} {"train_loss": -23.325227737426758, "global_step": 155053, "epoch": 1868} {"train_loss": -23.63772964477539, "global_step": 155054, "epoch": 1868} {"train_loss": -23.831968307495117, "global_step": 155055, "epoch": 1868} {"train_loss": -23.30085563659668, "global_step": 155056, "epoch": 1868} {"train_loss": -23.52978515625, "global_step": 155057, "epoch": 1868} {"train_loss": -23.592741012573242, "global_step": 155058, "epoch": 1868} {"train_loss": -23.373523712158203, "global_step": 155059, "epoch": 1868} {"train_loss": -23.465505599975586, "global_step": 155060, "epoch": 1868} {"train_loss": -23.274860382080078, "global_step": 155061, "epoch": 1868} {"train_loss": -23.269031524658203, "global_step": 155062, "epoch": 1868} {"train_loss": -23.47275733947754, "global_step": 155063, "epoch": 1868} {"train_loss": -23.42938232421875, "global_step": 155064, "epoch": 1868} {"train_loss": -23.378896713256836, "global_step": 155065, "epoch": 1868} {"train_loss": -23.38248634338379, "global_step": 155066, "epoch": 1868} {"train_loss": -23.307125091552734, "global_step": 155067, "epoch": 1868} {"train_loss": -23.062557220458984, "global_step": 155068, "epoch": 1868} {"train_loss": -23.248098373413086, "global_step": 155069, "epoch": 1868} {"train_loss": -22.947473526000977, "global_step": 155070, "epoch": 1868} {"train_loss": -23.29800796508789, "global_step": 155071, "epoch": 1868} {"train_loss": -23.279817581176758, "global_step": 155072, "epoch": 1868} {"train_loss": -23.341733932495117, "global_step": 155073, "epoch": 1868} {"train_loss": -23.259923934936523, "global_step": 155074, "epoch": 1868} {"train_loss": -23.344812393188477, "global_step": 155075, "epoch": 1868} {"train_loss": -23.2606258392334, "global_step": 155076, "epoch": 1868} {"train_loss": -23.339588165283203, "global_step": 155077, "epoch": 1868} {"train_loss": -23.389423370361328, "global_step": 155078, "epoch": 1868} {"train_loss": -23.9150447845459, "global_step": 155079, "epoch": 1868} {"train_loss": -23.550884246826172, "global_step": 155080, "epoch": 1868} {"train_loss": -23.357074737548828, "global_step": 155081, "epoch": 1868} {"train_loss": -23.727659225463867, "global_step": 155082, "epoch": 1868} {"train_loss": -23.903778076171875, "global_step": 155083, "epoch": 1868} {"train_loss": -23.339284896850586, "global_step": 155084, "epoch": 1868} {"train_loss": -23.133459091186523, "global_step": 155085, "epoch": 1868} {"train_loss": -23.36510467529297, "global_step": 155086, "epoch": 1868} {"train_loss": -23.388656616210938, "global_step": 155087, "epoch": 1868} {"train_loss": -23.89503288269043, "global_step": 155088, "epoch": 1868} {"train_loss": -23.63541603088379, "global_step": 155089, "epoch": 1868} {"train_loss": -23.3822021484375, "global_step": 155090, "epoch": 1868} {"train_loss": -23.120676040649414, "global_step": 155091, "epoch": 1868} {"train_loss": -23.244094848632812, "global_step": 155092, "epoch": 1868} {"train_loss": -23.52993392944336, "global_step": 155093, "epoch": 1868} {"train_loss": -23.615825653076172, "global_step": 155094, "epoch": 1868} {"train_loss": -23.404550552368164, "global_step": 155095, "epoch": 1868} {"train_loss": -23.92103385925293, "global_step": 155096, "epoch": 1868} {"train_loss": -23.4006290435791, "global_step": 155097, "epoch": 1868} {"train_loss": -23.471988677978516, "global_step": 155098, "epoch": 1868} {"train_loss": -23.2440242767334, "global_step": 155099, "epoch": 1868} {"train_loss": -23.14088249206543, "global_step": 155100, "epoch": 1868} {"train_loss": -23.712228775024414, "global_step": 155101, "epoch": 1868} {"train_loss": -23.06029510498047, "global_step": 155102, "epoch": 1868} {"train_loss": -23.730178833007812, "global_step": 155103, "epoch": 1868} {"train_loss": -23.6236629486084, "global_step": 155104, "epoch": 1868} {"train_loss": -23.240148544311523, "global_step": 155105, "epoch": 1868} {"train_loss": -23.34795570373535, "global_step": 155106, "epoch": 1868} {"train_loss": -23.436687469482422, "global_step": 155107, "epoch": 1868} {"train_loss": -23.319900512695312, "global_step": 155108, "epoch": 1868} {"train_loss": -22.996288299560547, "global_step": 155109, "epoch": 1868} {"train_loss": -22.178884506225586, "global_step": 155110, "epoch": 1868} {"train_loss": -22.754749298095703, "global_step": 155111, "epoch": 1868} {"train_loss": -23.5992374420166, "global_step": 155112, "epoch": 1868} {"train_loss": -23.043073654174805, "global_step": 155113, "epoch": 1868} {"train_loss": -23.33222007751465, "global_step": 155114, "epoch": 1868} {"train_loss": -23.0242977142334, "global_step": 155115, "epoch": 1868} {"train_loss": -23.22687339782715, "global_step": 155116, "epoch": 1868} {"train_loss": -23.09153175354004, "global_step": 155117, "epoch": 1868} {"train_loss": -23.146774291992188, "global_step": 155118, "epoch": 1868} {"train_loss": -23.184528350830078, "global_step": 155119, "epoch": 1868} {"train_loss": -23.076217651367188, "global_step": 155120, "epoch": 1868} {"train_loss": -23.360797882080078, "global_step": 155121, "epoch": 1868} {"train_loss": -23.415973663330078, "global_step": 155122, "epoch": 1868} {"train_loss": -23.110639572143555, "global_step": 155123, "epoch": 1868} {"train_loss": -23.23093032836914, "global_step": 155124, "epoch": 1868} {"train_loss": -23.44266128540039, "global_step": 155125, "epoch": 1868} {"train_loss": -23.358406480536402, "global_step": 155126, "epoch": 1868, "val_loss": 6291934.5} {"train_loss": -22.821470260620117, "global_step": 155127, "epoch": 1869} {"train_loss": -22.50154685974121, "global_step": 155128, "epoch": 1869} {"train_loss": -22.727293014526367, "global_step": 155129, "epoch": 1869} {"train_loss": -22.555002212524414, "global_step": 155130, "epoch": 1869} {"train_loss": -22.607816696166992, "global_step": 155131, "epoch": 1869} {"train_loss": -22.726774215698242, "global_step": 155132, "epoch": 1869} {"train_loss": -22.5697078704834, "global_step": 155133, "epoch": 1869} {"train_loss": -23.060195922851562, "global_step": 155134, "epoch": 1869} {"train_loss": -22.704172134399414, "global_step": 155135, "epoch": 1869} {"train_loss": -22.850650787353516, "global_step": 155136, "epoch": 1869} {"train_loss": -23.362506866455078, "global_step": 155137, "epoch": 1869} {"train_loss": -23.531522750854492, "global_step": 155138, "epoch": 1869} {"train_loss": -23.04218101501465, "global_step": 155139, "epoch": 1869} {"train_loss": -23.147296905517578, "global_step": 155140, "epoch": 1869} {"train_loss": -22.88547134399414, "global_step": 155141, "epoch": 1869} {"train_loss": -23.01045799255371, "global_step": 155142, "epoch": 1869} {"train_loss": -22.80730438232422, "global_step": 155143, "epoch": 1869} {"train_loss": -22.845861434936523, "global_step": 155144, "epoch": 1869} {"train_loss": -23.1108341217041, "global_step": 155145, "epoch": 1869} {"train_loss": -23.524858474731445, "global_step": 155146, "epoch": 1869} {"train_loss": -23.181859970092773, "global_step": 155147, "epoch": 1869} {"train_loss": -23.293912887573242, "global_step": 155148, "epoch": 1869} {"train_loss": -23.488229751586914, "global_step": 155149, "epoch": 1869} {"train_loss": -23.165071487426758, "global_step": 155150, "epoch": 1869} {"train_loss": -23.42087173461914, "global_step": 155151, "epoch": 1869} {"train_loss": -23.127960205078125, "global_step": 155152, "epoch": 1869} {"train_loss": -23.21413230895996, "global_step": 155153, "epoch": 1869} {"train_loss": -23.40082550048828, "global_step": 155154, "epoch": 1869} {"train_loss": -23.380603790283203, "global_step": 155155, "epoch": 1869} {"train_loss": -22.93080711364746, "global_step": 155156, "epoch": 1869} {"train_loss": -23.216777801513672, "global_step": 155157, "epoch": 1869} {"train_loss": -23.56403160095215, "global_step": 155158, "epoch": 1869} {"train_loss": -23.619937896728516, "global_step": 155159, "epoch": 1869} {"train_loss": -23.258529663085938, "global_step": 155160, "epoch": 1869} {"train_loss": -23.57520294189453, "global_step": 155161, "epoch": 1869} {"train_loss": -23.389328002929688, "global_step": 155162, "epoch": 1869} {"train_loss": -23.686389923095703, "global_step": 155163, "epoch": 1869} {"train_loss": -23.2224063873291, "global_step": 155164, "epoch": 1869} {"train_loss": -23.417104721069336, "global_step": 155165, "epoch": 1869} {"train_loss": -23.365859985351562, "global_step": 155166, "epoch": 1869} {"train_loss": -23.0233097076416, "global_step": 155167, "epoch": 1869} {"train_loss": -23.25139045715332, "global_step": 155168, "epoch": 1869} {"train_loss": -23.127126693725586, "global_step": 155169, "epoch": 1869} {"train_loss": -23.332956314086914, "global_step": 155170, "epoch": 1869} {"train_loss": -23.40659523010254, "global_step": 155171, "epoch": 1869} {"train_loss": -23.368642807006836, "global_step": 155172, "epoch": 1869} {"train_loss": -22.98464584350586, "global_step": 155173, "epoch": 1869} {"train_loss": -23.412870407104492, "global_step": 155174, "epoch": 1869} {"train_loss": -23.338735580444336, "global_step": 155175, "epoch": 1869} {"train_loss": -23.595956802368164, "global_step": 155176, "epoch": 1869} {"train_loss": -23.16028594970703, "global_step": 155177, "epoch": 1869} {"train_loss": -23.98160743713379, "global_step": 155178, "epoch": 1869} {"train_loss": -23.681886672973633, "global_step": 155179, "epoch": 1869} {"train_loss": -23.643301010131836, "global_step": 155180, "epoch": 1869} {"train_loss": -23.431570053100586, "global_step": 155181, "epoch": 1869} {"train_loss": -23.680736541748047, "global_step": 155182, "epoch": 1869} {"train_loss": -23.564664840698242, "global_step": 155183, "epoch": 1869} {"train_loss": -23.799707412719727, "global_step": 155184, "epoch": 1869} {"train_loss": -23.42365837097168, "global_step": 155185, "epoch": 1869} {"train_loss": -23.48586082458496, "global_step": 155186, "epoch": 1869} {"train_loss": -23.806385040283203, "global_step": 155187, "epoch": 1869} {"train_loss": -23.81192398071289, "global_step": 155188, "epoch": 1869} {"train_loss": -23.652002334594727, "global_step": 155189, "epoch": 1869} {"train_loss": -23.731412887573242, "global_step": 155190, "epoch": 1869} {"train_loss": -23.300031661987305, "global_step": 155191, "epoch": 1869} {"train_loss": -23.594648361206055, "global_step": 155192, "epoch": 1869} {"train_loss": -23.08648109436035, "global_step": 155193, "epoch": 1869} {"train_loss": -23.28749656677246, "global_step": 155194, "epoch": 1869} {"train_loss": -23.250137329101562, "global_step": 155195, "epoch": 1869} {"train_loss": -23.552593231201172, "global_step": 155196, "epoch": 1869} {"train_loss": -23.447832107543945, "global_step": 155197, "epoch": 1869} {"train_loss": -23.58510398864746, "global_step": 155198, "epoch": 1869} {"train_loss": -23.501007080078125, "global_step": 155199, "epoch": 1869} {"train_loss": -23.570756912231445, "global_step": 155200, "epoch": 1869} {"train_loss": -23.59604263305664, "global_step": 155201, "epoch": 1869} {"train_loss": -23.563400268554688, "global_step": 155202, "epoch": 1869} {"train_loss": -23.19099998474121, "global_step": 155203, "epoch": 1869} {"train_loss": -23.522321701049805, "global_step": 155204, "epoch": 1869} {"train_loss": -23.370338439941406, "global_step": 155205, "epoch": 1869} {"train_loss": -23.648855209350586, "global_step": 155206, "epoch": 1869} {"train_loss": -23.51686668395996, "global_step": 155207, "epoch": 1869} {"train_loss": -23.304731369018555, "global_step": 155208, "epoch": 1869} {"train_loss": -23.300116366650684, "global_step": 155209, "epoch": 1869, "val_loss": 6310526.5} {"train_loss": -23.30557632446289, "global_step": 155210, "epoch": 1870} {"train_loss": -23.283830642700195, "global_step": 155211, "epoch": 1870} {"train_loss": -23.553447723388672, "global_step": 155212, "epoch": 1870} {"train_loss": -23.280380249023438, "global_step": 155213, "epoch": 1870} {"train_loss": -23.21943473815918, "global_step": 155214, "epoch": 1870} {"train_loss": -23.292917251586914, "global_step": 155215, "epoch": 1870} {"train_loss": -23.383472442626953, "global_step": 155216, "epoch": 1870} {"train_loss": -23.337350845336914, "global_step": 155217, "epoch": 1870} {"train_loss": -23.433778762817383, "global_step": 155218, "epoch": 1870} {"train_loss": -23.81305503845215, "global_step": 155219, "epoch": 1870} {"train_loss": -23.482574462890625, "global_step": 155220, "epoch": 1870} {"train_loss": -23.516815185546875, "global_step": 155221, "epoch": 1870} {"train_loss": -23.257230758666992, "global_step": 155222, "epoch": 1870} {"train_loss": -23.376556396484375, "global_step": 155223, "epoch": 1870} {"train_loss": -23.277677536010742, "global_step": 155224, "epoch": 1870} {"train_loss": -23.094331741333008, "global_step": 155225, "epoch": 1870} {"train_loss": -23.434612274169922, "global_step": 155226, "epoch": 1870} {"train_loss": -23.382028579711914, "global_step": 155227, "epoch": 1870} {"train_loss": -23.226903915405273, "global_step": 155228, "epoch": 1870} {"train_loss": -23.53396224975586, "global_step": 155229, "epoch": 1870} {"train_loss": -23.75284767150879, "global_step": 155230, "epoch": 1870} {"train_loss": -23.53377342224121, "global_step": 155231, "epoch": 1870} {"train_loss": -23.46963882446289, "global_step": 155232, "epoch": 1870} {"train_loss": -23.416629791259766, "global_step": 155233, "epoch": 1870} {"train_loss": -23.260984420776367, "global_step": 155234, "epoch": 1870} {"train_loss": -23.350339889526367, "global_step": 155235, "epoch": 1870} {"train_loss": -23.32301139831543, "global_step": 155236, "epoch": 1870} {"train_loss": -23.39271354675293, "global_step": 155237, "epoch": 1870} {"train_loss": -23.18864631652832, "global_step": 155238, "epoch": 1870} {"train_loss": -23.356746673583984, "global_step": 155239, "epoch": 1870} {"train_loss": -23.487655639648438, "global_step": 155240, "epoch": 1870} {"train_loss": -23.463598251342773, "global_step": 155241, "epoch": 1870} {"train_loss": -23.584882736206055, "global_step": 155242, "epoch": 1870} {"train_loss": -23.50240135192871, "global_step": 155243, "epoch": 1870} {"train_loss": -23.397111892700195, "global_step": 155244, "epoch": 1870} {"train_loss": -23.34321403503418, "global_step": 155245, "epoch": 1870} {"train_loss": -23.4543514251709, "global_step": 155246, "epoch": 1870} {"train_loss": -23.51526641845703, "global_step": 155247, "epoch": 1870} {"train_loss": -23.408132553100586, "global_step": 155248, "epoch": 1870} {"train_loss": -23.225736618041992, "global_step": 155249, "epoch": 1870} {"train_loss": -23.340307235717773, "global_step": 155250, "epoch": 1870} {"train_loss": -23.282819747924805, "global_step": 155251, "epoch": 1870} {"train_loss": -23.390241622924805, "global_step": 155252, "epoch": 1870} {"train_loss": -23.349287033081055, "global_step": 155253, "epoch": 1870} {"train_loss": -23.703603744506836, "global_step": 155254, "epoch": 1870} {"train_loss": -23.174924850463867, "global_step": 155255, "epoch": 1870} {"train_loss": -23.501821517944336, "global_step": 155256, "epoch": 1870} {"train_loss": -23.151874542236328, "global_step": 155257, "epoch": 1870} {"train_loss": -23.201215744018555, "global_step": 155258, "epoch": 1870} {"train_loss": -22.98696517944336, "global_step": 155259, "epoch": 1870} {"train_loss": -23.061979293823242, "global_step": 155260, "epoch": 1870} {"train_loss": -23.499364852905273, "global_step": 155261, "epoch": 1870} {"train_loss": -23.515029907226562, "global_step": 155262, "epoch": 1870} {"train_loss": -23.46646499633789, "global_step": 155263, "epoch": 1870} {"train_loss": -23.800512313842773, "global_step": 155264, "epoch": 1870} {"train_loss": -23.4456787109375, "global_step": 155265, "epoch": 1870} {"train_loss": -23.482990264892578, "global_step": 155266, "epoch": 1870} {"train_loss": -23.73426628112793, "global_step": 155267, "epoch": 1870} {"train_loss": -23.58138084411621, "global_step": 155268, "epoch": 1870} {"train_loss": -23.32223892211914, "global_step": 155269, "epoch": 1870} {"train_loss": -23.625106811523438, "global_step": 155270, "epoch": 1870} {"train_loss": -23.817758560180664, "global_step": 155271, "epoch": 1870} {"train_loss": -23.25252342224121, "global_step": 155272, "epoch": 1870} {"train_loss": -23.181116104125977, "global_step": 155273, "epoch": 1870} {"train_loss": -23.353351593017578, "global_step": 155274, "epoch": 1870} {"train_loss": -23.346572875976562, "global_step": 155275, "epoch": 1870} {"train_loss": -23.353649139404297, "global_step": 155276, "epoch": 1870} {"train_loss": -23.66815185546875, "global_step": 155277, "epoch": 1870} {"train_loss": -23.594247817993164, "global_step": 155278, "epoch": 1870} {"train_loss": -23.65203285217285, "global_step": 155279, "epoch": 1870} {"train_loss": -23.0963077545166, "global_step": 155280, "epoch": 1870} {"train_loss": -23.718544006347656, "global_step": 155281, "epoch": 1870} {"train_loss": -23.463531494140625, "global_step": 155282, "epoch": 1870} {"train_loss": -23.73712921142578, "global_step": 155283, "epoch": 1870} {"train_loss": -23.61564064025879, "global_step": 155284, "epoch": 1870} {"train_loss": -23.694494247436523, "global_step": 155285, "epoch": 1870} {"train_loss": -23.409259796142578, "global_step": 155286, "epoch": 1870} {"train_loss": -23.34476661682129, "global_step": 155287, "epoch": 1870} {"train_loss": -23.606077194213867, "global_step": 155288, "epoch": 1870} {"train_loss": -23.404939651489258, "global_step": 155289, "epoch": 1870} {"train_loss": -23.69160270690918, "global_step": 155290, "epoch": 1870} {"train_loss": -23.631139755249023, "global_step": 155291, "epoch": 1870} {"train_loss": -23.40871707502618, "global_step": 155292, "epoch": 1870, "val_loss": 6362117.0} {"train_loss": -22.922317504882812, "global_step": 155293, "epoch": 1871} {"train_loss": -22.744094848632812, "global_step": 155294, "epoch": 1871} {"train_loss": -23.357572555541992, "global_step": 155295, "epoch": 1871} {"train_loss": -23.213361740112305, "global_step": 155296, "epoch": 1871} {"train_loss": -23.127792358398438, "global_step": 155297, "epoch": 1871} {"train_loss": -23.375003814697266, "global_step": 155298, "epoch": 1871} {"train_loss": -23.388195037841797, "global_step": 155299, "epoch": 1871} {"train_loss": -23.38186264038086, "global_step": 155300, "epoch": 1871} {"train_loss": -23.25779151916504, "global_step": 155301, "epoch": 1871} {"train_loss": -23.217575073242188, "global_step": 155302, "epoch": 1871} {"train_loss": -23.598928451538086, "global_step": 155303, "epoch": 1871} {"train_loss": -23.378345489501953, "global_step": 155304, "epoch": 1871} {"train_loss": -23.189855575561523, "global_step": 155305, "epoch": 1871} {"train_loss": -23.5207462310791, "global_step": 155306, "epoch": 1871} {"train_loss": -23.44929313659668, "global_step": 155307, "epoch": 1871} {"train_loss": -23.517425537109375, "global_step": 155308, "epoch": 1871} {"train_loss": -23.673526763916016, "global_step": 155309, "epoch": 1871} {"train_loss": -23.719289779663086, "global_step": 155310, "epoch": 1871} {"train_loss": -23.346769332885742, "global_step": 155311, "epoch": 1871} {"train_loss": -23.593994140625, "global_step": 155312, "epoch": 1871} {"train_loss": -23.562969207763672, "global_step": 155313, "epoch": 1871} {"train_loss": -23.576034545898438, "global_step": 155314, "epoch": 1871} {"train_loss": -23.530475616455078, "global_step": 155315, "epoch": 1871} {"train_loss": -23.441795349121094, "global_step": 155316, "epoch": 1871} {"train_loss": -23.47153663635254, "global_step": 155317, "epoch": 1871} {"train_loss": -23.350574493408203, "global_step": 155318, "epoch": 1871} {"train_loss": -23.29578971862793, "global_step": 155319, "epoch": 1871} {"train_loss": -23.57271957397461, "global_step": 155320, "epoch": 1871} {"train_loss": -23.786489486694336, "global_step": 155321, "epoch": 1871} {"train_loss": -23.585697174072266, "global_step": 155322, "epoch": 1871} {"train_loss": -23.394412994384766, "global_step": 155323, "epoch": 1871} {"train_loss": -23.49957847595215, "global_step": 155324, "epoch": 1871} {"train_loss": -23.744749069213867, "global_step": 155325, "epoch": 1871} {"train_loss": -23.4388484954834, "global_step": 155326, "epoch": 1871} {"train_loss": -23.670825958251953, "global_step": 155327, "epoch": 1871} {"train_loss": -23.27029800415039, "global_step": 155328, "epoch": 1871} {"train_loss": -23.442121505737305, "global_step": 155329, "epoch": 1871} {"train_loss": -22.99432373046875, "global_step": 155330, "epoch": 1871} {"train_loss": -23.412195205688477, "global_step": 155331, "epoch": 1871} {"train_loss": -23.665605545043945, "global_step": 155332, "epoch": 1871} {"train_loss": -23.484689712524414, "global_step": 155333, "epoch": 1871} {"train_loss": -23.24799919128418, "global_step": 155334, "epoch": 1871} {"train_loss": -23.630460739135742, "global_step": 155335, "epoch": 1871} {"train_loss": -23.564579010009766, "global_step": 155336, "epoch": 1871} {"train_loss": -23.31264305114746, "global_step": 155337, "epoch": 1871} {"train_loss": -23.642810821533203, "global_step": 155338, "epoch": 1871} {"train_loss": -23.19256019592285, "global_step": 155339, "epoch": 1871} {"train_loss": -22.9089298248291, "global_step": 155340, "epoch": 1871} {"train_loss": -23.22580909729004, "global_step": 155341, "epoch": 1871} {"train_loss": -23.49664306640625, "global_step": 155342, "epoch": 1871} {"train_loss": -23.352792739868164, "global_step": 155343, "epoch": 1871} {"train_loss": -23.200607299804688, "global_step": 155344, "epoch": 1871} {"train_loss": -23.489063262939453, "global_step": 155345, "epoch": 1871} {"train_loss": -23.29608726501465, "global_step": 155346, "epoch": 1871} {"train_loss": -23.443218231201172, "global_step": 155347, "epoch": 1871} {"train_loss": -23.022775650024414, "global_step": 155348, "epoch": 1871} {"train_loss": -23.0460147857666, "global_step": 155349, "epoch": 1871} {"train_loss": -23.539796829223633, "global_step": 155350, "epoch": 1871} {"train_loss": -23.59225845336914, "global_step": 155351, "epoch": 1871} {"train_loss": -23.214696884155273, "global_step": 155352, "epoch": 1871} {"train_loss": -23.451902389526367, "global_step": 155353, "epoch": 1871} {"train_loss": -23.628681182861328, "global_step": 155354, "epoch": 1871} {"train_loss": -23.557281494140625, "global_step": 155355, "epoch": 1871} {"train_loss": -22.87881851196289, "global_step": 155356, "epoch": 1871} {"train_loss": -23.640748977661133, "global_step": 155357, "epoch": 1871} {"train_loss": -23.38447380065918, "global_step": 155358, "epoch": 1871} {"train_loss": -23.523483276367188, "global_step": 155359, "epoch": 1871} {"train_loss": -23.52375602722168, "global_step": 155360, "epoch": 1871} {"train_loss": -23.469602584838867, "global_step": 155361, "epoch": 1871} {"train_loss": -23.46376609802246, "global_step": 155362, "epoch": 1871} {"train_loss": -23.253320693969727, "global_step": 155363, "epoch": 1871} {"train_loss": -23.3608341217041, "global_step": 155364, "epoch": 1871} {"train_loss": -23.509445190429688, "global_step": 155365, "epoch": 1871} {"train_loss": -23.590940475463867, "global_step": 155366, "epoch": 1871} {"train_loss": -23.037296295166016, "global_step": 155367, "epoch": 1871} {"train_loss": -23.2925968170166, "global_step": 155368, "epoch": 1871} {"train_loss": -23.058673858642578, "global_step": 155369, "epoch": 1871} {"train_loss": -23.0515193939209, "global_step": 155370, "epoch": 1871} {"train_loss": -23.179990768432617, "global_step": 155371, "epoch": 1871} {"train_loss": -23.335098266601562, "global_step": 155372, "epoch": 1871} {"train_loss": -23.525474548339844, "global_step": 155373, "epoch": 1871} {"train_loss": -23.268226623535156, "global_step": 155374, "epoch": 1871} {"train_loss": -23.364628688398614, "global_step": 155375, "epoch": 1871, "val_loss": 6279670.0} {"train_loss": -22.694746017456055, "global_step": 155376, "epoch": 1872} {"train_loss": -23.057748794555664, "global_step": 155377, "epoch": 1872} {"train_loss": -22.648141860961914, "global_step": 155378, "epoch": 1872} {"train_loss": -22.98545265197754, "global_step": 155379, "epoch": 1872} {"train_loss": -23.15390968322754, "global_step": 155380, "epoch": 1872} {"train_loss": -22.928991317749023, "global_step": 155381, "epoch": 1872} {"train_loss": -23.40729331970215, "global_step": 155382, "epoch": 1872} {"train_loss": -22.994564056396484, "global_step": 155383, "epoch": 1872} {"train_loss": -23.032323837280273, "global_step": 155384, "epoch": 1872} {"train_loss": -22.89002799987793, "global_step": 155385, "epoch": 1872} {"train_loss": -23.45392417907715, "global_step": 155386, "epoch": 1872} {"train_loss": -22.907800674438477, "global_step": 155387, "epoch": 1872} {"train_loss": -23.321243286132812, "global_step": 155388, "epoch": 1872} {"train_loss": -23.439573287963867, "global_step": 155389, "epoch": 1872} {"train_loss": -23.197555541992188, "global_step": 155390, "epoch": 1872} {"train_loss": -23.010818481445312, "global_step": 155391, "epoch": 1872} {"train_loss": -23.6055965423584, "global_step": 155392, "epoch": 1872} {"train_loss": -23.141183853149414, "global_step": 155393, "epoch": 1872} {"train_loss": -23.212078094482422, "global_step": 155394, "epoch": 1872} {"train_loss": -23.050153732299805, "global_step": 155395, "epoch": 1872} {"train_loss": -23.511009216308594, "global_step": 155396, "epoch": 1872} {"train_loss": -23.22255516052246, "global_step": 155397, "epoch": 1872} {"train_loss": -23.548898696899414, "global_step": 155398, "epoch": 1872} {"train_loss": -23.496580123901367, "global_step": 155399, "epoch": 1872} {"train_loss": -23.25156021118164, "global_step": 155400, "epoch": 1872} {"train_loss": -23.269033432006836, "global_step": 155401, "epoch": 1872} {"train_loss": -23.35263442993164, "global_step": 155402, "epoch": 1872} {"train_loss": -23.547061920166016, "global_step": 155403, "epoch": 1872} {"train_loss": -23.192699432373047, "global_step": 155404, "epoch": 1872} {"train_loss": -23.61976432800293, "global_step": 155405, "epoch": 1872} {"train_loss": -23.574270248413086, "global_step": 155406, "epoch": 1872} {"train_loss": -23.47712516784668, "global_step": 155407, "epoch": 1872} {"train_loss": -22.965641021728516, "global_step": 155408, "epoch": 1872} {"train_loss": -23.091806411743164, "global_step": 155409, "epoch": 1872} {"train_loss": -23.06485939025879, "global_step": 155410, "epoch": 1872} {"train_loss": -23.066091537475586, "global_step": 155411, "epoch": 1872} {"train_loss": -23.25455665588379, "global_step": 155412, "epoch": 1872} {"train_loss": -23.12928581237793, "global_step": 155413, "epoch": 1872} {"train_loss": -23.375577926635742, "global_step": 155414, "epoch": 1872} {"train_loss": -22.91747283935547, "global_step": 155415, "epoch": 1872} {"train_loss": -23.084470748901367, "global_step": 155416, "epoch": 1872} {"train_loss": -23.111448287963867, "global_step": 155417, "epoch": 1872} {"train_loss": -23.645498275756836, "global_step": 155418, "epoch": 1872} {"train_loss": -23.601709365844727, "global_step": 155419, "epoch": 1872} {"train_loss": -23.26075553894043, "global_step": 155420, "epoch": 1872} {"train_loss": -23.821483612060547, "global_step": 155421, "epoch": 1872} {"train_loss": -23.09027671813965, "global_step": 155422, "epoch": 1872} {"train_loss": -23.71189308166504, "global_step": 155423, "epoch": 1872} {"train_loss": -23.172571182250977, "global_step": 155424, "epoch": 1872} {"train_loss": -23.76080894470215, "global_step": 155425, "epoch": 1872} {"train_loss": -23.085147857666016, "global_step": 155426, "epoch": 1872} {"train_loss": -23.367862701416016, "global_step": 155427, "epoch": 1872} {"train_loss": -23.03499412536621, "global_step": 155428, "epoch": 1872} {"train_loss": -23.32294464111328, "global_step": 155429, "epoch": 1872} {"train_loss": -23.382299423217773, "global_step": 155430, "epoch": 1872} {"train_loss": -23.49188995361328, "global_step": 155431, "epoch": 1872} {"train_loss": -22.97133445739746, "global_step": 155432, "epoch": 1872} {"train_loss": -22.925344467163086, "global_step": 155433, "epoch": 1872} {"train_loss": -23.62890625, "global_step": 155434, "epoch": 1872} {"train_loss": -23.396780014038086, "global_step": 155435, "epoch": 1872} {"train_loss": -23.388893127441406, "global_step": 155436, "epoch": 1872} {"train_loss": -23.096755981445312, "global_step": 155437, "epoch": 1872} {"train_loss": -23.264049530029297, "global_step": 155438, "epoch": 1872} {"train_loss": -23.545602798461914, "global_step": 155439, "epoch": 1872} {"train_loss": -23.709854125976562, "global_step": 155440, "epoch": 1872} {"train_loss": -23.14752769470215, "global_step": 155441, "epoch": 1872} {"train_loss": -23.40833854675293, "global_step": 155442, "epoch": 1872} {"train_loss": -23.53955078125, "global_step": 155443, "epoch": 1872} {"train_loss": -22.734365463256836, "global_step": 155444, "epoch": 1872} {"train_loss": -23.568973541259766, "global_step": 155445, "epoch": 1872} {"train_loss": -23.576892852783203, "global_step": 155446, "epoch": 1872} {"train_loss": -23.684432983398438, "global_step": 155447, "epoch": 1872} {"train_loss": -23.267213821411133, "global_step": 155448, "epoch": 1872} {"train_loss": -23.447587966918945, "global_step": 155449, "epoch": 1872} {"train_loss": -23.453603744506836, "global_step": 155450, "epoch": 1872} {"train_loss": -23.51363182067871, "global_step": 155451, "epoch": 1872} {"train_loss": -23.408445358276367, "global_step": 155452, "epoch": 1872} {"train_loss": -23.332324981689453, "global_step": 155453, "epoch": 1872} {"train_loss": -23.209203720092773, "global_step": 155454, "epoch": 1872} {"train_loss": -23.15201187133789, "global_step": 155455, "epoch": 1872} {"train_loss": -23.37375259399414, "global_step": 155456, "epoch": 1872} {"train_loss": -23.243453979492188, "global_step": 155457, "epoch": 1872} {"train_loss": -23.274494148162475, "global_step": 155458, "epoch": 1872, "val_loss": 6391608.5} {"train_loss": -21.622880935668945, "global_step": 155459, "epoch": 1873} {"train_loss": -22.58177375793457, "global_step": 155460, "epoch": 1873} {"train_loss": -21.33287239074707, "global_step": 155461, "epoch": 1873} {"train_loss": -22.693937301635742, "global_step": 155462, "epoch": 1873} {"train_loss": -22.528013229370117, "global_step": 155463, "epoch": 1873} {"train_loss": -22.716886520385742, "global_step": 155464, "epoch": 1873} {"train_loss": -22.654212951660156, "global_step": 155465, "epoch": 1873} {"train_loss": -22.588144302368164, "global_step": 155466, "epoch": 1873} {"train_loss": -22.86598014831543, "global_step": 155467, "epoch": 1873} {"train_loss": -22.500951766967773, "global_step": 155468, "epoch": 1873} {"train_loss": -22.731334686279297, "global_step": 155469, "epoch": 1873} {"train_loss": -22.725282669067383, "global_step": 155470, "epoch": 1873} {"train_loss": -23.051067352294922, "global_step": 155471, "epoch": 1873} {"train_loss": -22.990150451660156, "global_step": 155472, "epoch": 1873} {"train_loss": -22.865934371948242, "global_step": 155473, "epoch": 1873} {"train_loss": -22.742401123046875, "global_step": 155474, "epoch": 1873} {"train_loss": -22.893508911132812, "global_step": 155475, "epoch": 1873} {"train_loss": -23.444473266601562, "global_step": 155476, "epoch": 1873} {"train_loss": -22.60139274597168, "global_step": 155477, "epoch": 1873} {"train_loss": -22.839025497436523, "global_step": 155478, "epoch": 1873} {"train_loss": -22.87959861755371, "global_step": 155479, "epoch": 1873} {"train_loss": -23.01235008239746, "global_step": 155480, "epoch": 1873} {"train_loss": -23.55989646911621, "global_step": 155481, "epoch": 1873} {"train_loss": -23.250329971313477, "global_step": 155482, "epoch": 1873} {"train_loss": -23.521467208862305, "global_step": 155483, "epoch": 1873} {"train_loss": -22.987695693969727, "global_step": 155484, "epoch": 1873} {"train_loss": -22.948720932006836, "global_step": 155485, "epoch": 1873} {"train_loss": -23.16152000427246, "global_step": 155486, "epoch": 1873} {"train_loss": -23.315189361572266, "global_step": 155487, "epoch": 1873} {"train_loss": -23.276479721069336, "global_step": 155488, "epoch": 1873} {"train_loss": -23.32699966430664, "global_step": 155489, "epoch": 1873} {"train_loss": -23.132333755493164, "global_step": 155490, "epoch": 1873} {"train_loss": -23.29595947265625, "global_step": 155491, "epoch": 1873} {"train_loss": -23.26838493347168, "global_step": 155492, "epoch": 1873} {"train_loss": -23.25345802307129, "global_step": 155493, "epoch": 1873} {"train_loss": -23.650827407836914, "global_step": 155494, "epoch": 1873} {"train_loss": -23.40155792236328, "global_step": 155495, "epoch": 1873} {"train_loss": -23.623132705688477, "global_step": 155496, "epoch": 1873} {"train_loss": -23.661298751831055, "global_step": 155497, "epoch": 1873} {"train_loss": -23.431781768798828, "global_step": 155498, "epoch": 1873} {"train_loss": -23.4057559967041, "global_step": 155499, "epoch": 1873} {"train_loss": -23.418888092041016, "global_step": 155500, "epoch": 1873} {"train_loss": -23.359909057617188, "global_step": 155501, "epoch": 1873} {"train_loss": -23.396072387695312, "global_step": 155502, "epoch": 1873} {"train_loss": -23.52706527709961, "global_step": 155503, "epoch": 1873} {"train_loss": -23.294803619384766, "global_step": 155504, "epoch": 1873} {"train_loss": -23.457632064819336, "global_step": 155505, "epoch": 1873} {"train_loss": -23.029483795166016, "global_step": 155506, "epoch": 1873} {"train_loss": -23.569734573364258, "global_step": 155507, "epoch": 1873} {"train_loss": -23.575212478637695, "global_step": 155508, "epoch": 1873} {"train_loss": -23.52483558654785, "global_step": 155509, "epoch": 1873} {"train_loss": -23.623123168945312, "global_step": 155510, "epoch": 1873} {"train_loss": -24.0582218170166, "global_step": 155511, "epoch": 1873} {"train_loss": -23.170419692993164, "global_step": 155512, "epoch": 1873} {"train_loss": -23.2216854095459, "global_step": 155513, "epoch": 1873} {"train_loss": -23.552648544311523, "global_step": 155514, "epoch": 1873} {"train_loss": -23.744659423828125, "global_step": 155515, "epoch": 1873} {"train_loss": -23.243122100830078, "global_step": 155516, "epoch": 1873} {"train_loss": -23.107568740844727, "global_step": 155517, "epoch": 1873} {"train_loss": -23.484764099121094, "global_step": 155518, "epoch": 1873} {"train_loss": -23.31165885925293, "global_step": 155519, "epoch": 1873} {"train_loss": -23.52764892578125, "global_step": 155520, "epoch": 1873} {"train_loss": -23.744340896606445, "global_step": 155521, "epoch": 1873} {"train_loss": -23.313627243041992, "global_step": 155522, "epoch": 1873} {"train_loss": -23.642778396606445, "global_step": 155523, "epoch": 1873} {"train_loss": -23.718490600585938, "global_step": 155524, "epoch": 1873} {"train_loss": -23.622547149658203, "global_step": 155525, "epoch": 1873} {"train_loss": -23.449697494506836, "global_step": 155526, "epoch": 1873} {"train_loss": -23.365949630737305, "global_step": 155527, "epoch": 1873} {"train_loss": -23.62615966796875, "global_step": 155528, "epoch": 1873} {"train_loss": -23.72649574279785, "global_step": 155529, "epoch": 1873} {"train_loss": -23.4859561920166, "global_step": 155530, "epoch": 1873} {"train_loss": -23.570598602294922, "global_step": 155531, "epoch": 1873} {"train_loss": -23.203397750854492, "global_step": 155532, "epoch": 1873} {"train_loss": -23.610179901123047, "global_step": 155533, "epoch": 1873} {"train_loss": -23.388219833374023, "global_step": 155534, "epoch": 1873} {"train_loss": -23.388681411743164, "global_step": 155535, "epoch": 1873} {"train_loss": -23.401086807250977, "global_step": 155536, "epoch": 1873} {"train_loss": -23.470640182495117, "global_step": 155537, "epoch": 1873} {"train_loss": -23.223398208618164, "global_step": 155538, "epoch": 1873} {"train_loss": -22.862695693969727, "global_step": 155539, "epoch": 1873} {"train_loss": -22.923465728759766, "global_step": 155540, "epoch": 1873} {"train_loss": -23.20551208128412, "global_step": 155541, "epoch": 1873, "val_loss": 6332135.0} {"train_loss": -22.976709365844727, "global_step": 155542, "epoch": 1874} {"train_loss": -22.847360610961914, "global_step": 155543, "epoch": 1874} {"train_loss": -22.780004501342773, "global_step": 155544, "epoch": 1874} {"train_loss": -22.128385543823242, "global_step": 155545, "epoch": 1874} {"train_loss": -22.89069175720215, "global_step": 155546, "epoch": 1874} {"train_loss": -22.816028594970703, "global_step": 155547, "epoch": 1874} {"train_loss": -23.194379806518555, "global_step": 155548, "epoch": 1874} {"train_loss": -22.895029067993164, "global_step": 155549, "epoch": 1874} {"train_loss": -23.205432891845703, "global_step": 155550, "epoch": 1874} {"train_loss": -22.9303035736084, "global_step": 155551, "epoch": 1874} {"train_loss": -22.68702507019043, "global_step": 155552, "epoch": 1874} {"train_loss": -22.83580780029297, "global_step": 155553, "epoch": 1874} {"train_loss": -23.18547248840332, "global_step": 155554, "epoch": 1874} {"train_loss": -22.98348617553711, "global_step": 155555, "epoch": 1874} {"train_loss": -23.041894912719727, "global_step": 155556, "epoch": 1874} {"train_loss": -22.926965713500977, "global_step": 155557, "epoch": 1874} {"train_loss": -23.035554885864258, "global_step": 155558, "epoch": 1874} {"train_loss": -22.785625457763672, "global_step": 155559, "epoch": 1874} {"train_loss": -23.608129501342773, "global_step": 155560, "epoch": 1874} {"train_loss": -23.12235450744629, "global_step": 155561, "epoch": 1874} {"train_loss": -23.324554443359375, "global_step": 155562, "epoch": 1874} {"train_loss": -23.264951705932617, "global_step": 155563, "epoch": 1874} {"train_loss": -23.20505714416504, "global_step": 155564, "epoch": 1874} {"train_loss": -22.920873641967773, "global_step": 155565, "epoch": 1874} {"train_loss": -23.1331787109375, "global_step": 155566, "epoch": 1874} {"train_loss": -23.007247924804688, "global_step": 155567, "epoch": 1874} {"train_loss": -23.381128311157227, "global_step": 155568, "epoch": 1874} {"train_loss": -23.1605281829834, "global_step": 155569, "epoch": 1874} {"train_loss": -23.36360740661621, "global_step": 155570, "epoch": 1874} {"train_loss": -23.313562393188477, "global_step": 155571, "epoch": 1874} {"train_loss": -23.136198043823242, "global_step": 155572, "epoch": 1874} {"train_loss": -23.01105308532715, "global_step": 155573, "epoch": 1874} {"train_loss": -23.25870704650879, "global_step": 155574, "epoch": 1874} {"train_loss": -23.12318992614746, "global_step": 155575, "epoch": 1874} {"train_loss": -23.317947387695312, "global_step": 155576, "epoch": 1874} {"train_loss": -23.39468002319336, "global_step": 155577, "epoch": 1874} {"train_loss": -23.55108070373535, "global_step": 155578, "epoch": 1874} {"train_loss": -23.617576599121094, "global_step": 155579, "epoch": 1874} {"train_loss": -23.210721969604492, "global_step": 155580, "epoch": 1874} {"train_loss": -23.397958755493164, "global_step": 155581, "epoch": 1874} {"train_loss": -23.259235382080078, "global_step": 155582, "epoch": 1874} {"train_loss": -23.466785430908203, "global_step": 155583, "epoch": 1874} {"train_loss": -23.628368377685547, "global_step": 155584, "epoch": 1874} {"train_loss": -23.477706909179688, "global_step": 155585, "epoch": 1874} {"train_loss": -23.482328414916992, "global_step": 155586, "epoch": 1874} {"train_loss": -23.5067138671875, "global_step": 155587, "epoch": 1874} {"train_loss": -23.434160232543945, "global_step": 155588, "epoch": 1874} {"train_loss": -23.616918563842773, "global_step": 155589, "epoch": 1874} {"train_loss": -23.277807235717773, "global_step": 155590, "epoch": 1874} {"train_loss": -22.85141372680664, "global_step": 155591, "epoch": 1874} {"train_loss": -23.163604736328125, "global_step": 155592, "epoch": 1874} {"train_loss": -23.456247329711914, "global_step": 155593, "epoch": 1874} {"train_loss": -23.044921875, "global_step": 155594, "epoch": 1874} {"train_loss": -23.12251853942871, "global_step": 155595, "epoch": 1874} {"train_loss": -23.400386810302734, "global_step": 155596, "epoch": 1874} {"train_loss": -23.372522354125977, "global_step": 155597, "epoch": 1874} {"train_loss": -23.335189819335938, "global_step": 155598, "epoch": 1874} {"train_loss": -23.57276725769043, "global_step": 155599, "epoch": 1874} {"train_loss": -23.413766860961914, "global_step": 155600, "epoch": 1874} {"train_loss": -23.534046173095703, "global_step": 155601, "epoch": 1874} {"train_loss": -23.48141860961914, "global_step": 155602, "epoch": 1874} {"train_loss": -23.754058837890625, "global_step": 155603, "epoch": 1874} {"train_loss": -23.28377914428711, "global_step": 155604, "epoch": 1874} {"train_loss": -22.9030818939209, "global_step": 155605, "epoch": 1874} {"train_loss": -23.720151901245117, "global_step": 155606, "epoch": 1874} {"train_loss": -23.26248550415039, "global_step": 155607, "epoch": 1874} {"train_loss": -23.404687881469727, "global_step": 155608, "epoch": 1874} {"train_loss": -23.27962303161621, "global_step": 155609, "epoch": 1874} {"train_loss": -23.567594528198242, "global_step": 155610, "epoch": 1874} {"train_loss": -23.435224533081055, "global_step": 155611, "epoch": 1874} {"train_loss": -23.996068954467773, "global_step": 155612, "epoch": 1874} {"train_loss": -23.538166046142578, "global_step": 155613, "epoch": 1874} {"train_loss": -23.50086784362793, "global_step": 155614, "epoch": 1874} {"train_loss": -23.649511337280273, "global_step": 155615, "epoch": 1874} {"train_loss": -23.135915756225586, "global_step": 155616, "epoch": 1874} {"train_loss": -23.358068466186523, "global_step": 155617, "epoch": 1874} {"train_loss": -22.976242065429688, "global_step": 155618, "epoch": 1874} {"train_loss": -23.63039779663086, "global_step": 155619, "epoch": 1874} {"train_loss": -23.735517501831055, "global_step": 155620, "epoch": 1874} {"train_loss": -23.0809383392334, "global_step": 155621, "epoch": 1874} {"train_loss": -23.3884334564209, "global_step": 155622, "epoch": 1874} {"train_loss": -22.99236488342285, "global_step": 155623, "epoch": 1874} {"train_loss": -23.24244660067271, "global_step": 155624, "epoch": 1874, "val_loss": 6286749.0} {"train_loss": -22.863922119140625, "global_step": 155625, "epoch": 1875} {"train_loss": -23.308658599853516, "global_step": 155626, "epoch": 1875} {"train_loss": -22.93727684020996, "global_step": 155627, "epoch": 1875} {"train_loss": -23.26544952392578, "global_step": 155628, "epoch": 1875} {"train_loss": -22.878835678100586, "global_step": 155629, "epoch": 1875} {"train_loss": -23.322683334350586, "global_step": 155630, "epoch": 1875} {"train_loss": -23.439971923828125, "global_step": 155631, "epoch": 1875} {"train_loss": -23.212438583374023, "global_step": 155632, "epoch": 1875} {"train_loss": -22.62489891052246, "global_step": 155633, "epoch": 1875} {"train_loss": -23.411108016967773, "global_step": 155634, "epoch": 1875} {"train_loss": -23.067785263061523, "global_step": 155635, "epoch": 1875} {"train_loss": -22.789226531982422, "global_step": 155636, "epoch": 1875} {"train_loss": -23.347156524658203, "global_step": 155637, "epoch": 1875} {"train_loss": -23.26613998413086, "global_step": 155638, "epoch": 1875} {"train_loss": -23.24481773376465, "global_step": 155639, "epoch": 1875} {"train_loss": -23.25520896911621, "global_step": 155640, "epoch": 1875} {"train_loss": -23.158262252807617, "global_step": 155641, "epoch": 1875} {"train_loss": -23.394149780273438, "global_step": 155642, "epoch": 1875} {"train_loss": -22.921558380126953, "global_step": 155643, "epoch": 1875} {"train_loss": -23.140302658081055, "global_step": 155644, "epoch": 1875} {"train_loss": -23.307113647460938, "global_step": 155645, "epoch": 1875} {"train_loss": -23.057172775268555, "global_step": 155646, "epoch": 1875} {"train_loss": -23.493244171142578, "global_step": 155647, "epoch": 1875} {"train_loss": -23.299715042114258, "global_step": 155648, "epoch": 1875} {"train_loss": -23.019311904907227, "global_step": 155649, "epoch": 1875} {"train_loss": -23.320449829101562, "global_step": 155650, "epoch": 1875} {"train_loss": -23.3654727935791, "global_step": 155651, "epoch": 1875} {"train_loss": -23.29104232788086, "global_step": 155652, "epoch": 1875} {"train_loss": -23.403488159179688, "global_step": 155653, "epoch": 1875} {"train_loss": -23.347156524658203, "global_step": 155654, "epoch": 1875} {"train_loss": -23.482532501220703, "global_step": 155655, "epoch": 1875} {"train_loss": -23.388246536254883, "global_step": 155656, "epoch": 1875} {"train_loss": -23.2781982421875, "global_step": 155657, "epoch": 1875} {"train_loss": -23.272830963134766, "global_step": 155658, "epoch": 1875} {"train_loss": -23.231718063354492, "global_step": 155659, "epoch": 1875} {"train_loss": -23.529932022094727, "global_step": 155660, "epoch": 1875} {"train_loss": -23.168058395385742, "global_step": 155661, "epoch": 1875} {"train_loss": -22.91460418701172, "global_step": 155662, "epoch": 1875} {"train_loss": -23.06732177734375, "global_step": 155663, "epoch": 1875} {"train_loss": -23.46635627746582, "global_step": 155664, "epoch": 1875} {"train_loss": -23.490631103515625, "global_step": 155665, "epoch": 1875} {"train_loss": -23.37783432006836, "global_step": 155666, "epoch": 1875} {"train_loss": -22.80814552307129, "global_step": 155667, "epoch": 1875} {"train_loss": -23.05412483215332, "global_step": 155668, "epoch": 1875} {"train_loss": -23.05098533630371, "global_step": 155669, "epoch": 1875} {"train_loss": -23.183387756347656, "global_step": 155670, "epoch": 1875} {"train_loss": -23.251005172729492, "global_step": 155671, "epoch": 1875} {"train_loss": -23.54343032836914, "global_step": 155672, "epoch": 1875} {"train_loss": -23.382688522338867, "global_step": 155673, "epoch": 1875} {"train_loss": -23.109058380126953, "global_step": 155674, "epoch": 1875} {"train_loss": -23.2059383392334, "global_step": 155675, "epoch": 1875} {"train_loss": -23.21084976196289, "global_step": 155676, "epoch": 1875} {"train_loss": -23.45979881286621, "global_step": 155677, "epoch": 1875} {"train_loss": -23.701688766479492, "global_step": 155678, "epoch": 1875} {"train_loss": -23.66293716430664, "global_step": 155679, "epoch": 1875} {"train_loss": -23.741628646850586, "global_step": 155680, "epoch": 1875} {"train_loss": -23.232952117919922, "global_step": 155681, "epoch": 1875} {"train_loss": -23.552886962890625, "global_step": 155682, "epoch": 1875} {"train_loss": -23.206745147705078, "global_step": 155683, "epoch": 1875} {"train_loss": -23.621442794799805, "global_step": 155684, "epoch": 1875} {"train_loss": -23.468820571899414, "global_step": 155685, "epoch": 1875} {"train_loss": -23.667198181152344, "global_step": 155686, "epoch": 1875} {"train_loss": -23.39410972595215, "global_step": 155687, "epoch": 1875} {"train_loss": -22.802616119384766, "global_step": 155688, "epoch": 1875} {"train_loss": -23.76597785949707, "global_step": 155689, "epoch": 1875} {"train_loss": -23.549392700195312, "global_step": 155690, "epoch": 1875} {"train_loss": -23.55555534362793, "global_step": 155691, "epoch": 1875} {"train_loss": -23.711668014526367, "global_step": 155692, "epoch": 1875} {"train_loss": -23.303142547607422, "global_step": 155693, "epoch": 1875} {"train_loss": -23.388208389282227, "global_step": 155694, "epoch": 1875} {"train_loss": -23.64986228942871, "global_step": 155695, "epoch": 1875} {"train_loss": -23.26141929626465, "global_step": 155696, "epoch": 1875} {"train_loss": -23.492515563964844, "global_step": 155697, "epoch": 1875} {"train_loss": -23.505081176757812, "global_step": 155698, "epoch": 1875} {"train_loss": -23.883275985717773, "global_step": 155699, "epoch": 1875} {"train_loss": -23.486087799072266, "global_step": 155700, "epoch": 1875} {"train_loss": -23.90030860900879, "global_step": 155701, "epoch": 1875} {"train_loss": -23.179723739624023, "global_step": 155702, "epoch": 1875} {"train_loss": -23.47726821899414, "global_step": 155703, "epoch": 1875} {"train_loss": -23.3427791595459, "global_step": 155704, "epoch": 1875} {"train_loss": -23.535091400146484, "global_step": 155705, "epoch": 1875} {"train_loss": -23.363483428955078, "global_step": 155706, "epoch": 1875} {"train_loss": -23.307351882199207, "global_step": 155707, "epoch": 1875, "val_loss": 6375734.0} {"train_loss": -23.70830726623535, "global_step": 155708, "epoch": 1876} {"train_loss": -23.383520126342773, "global_step": 155709, "epoch": 1876} {"train_loss": -23.257282257080078, "global_step": 155710, "epoch": 1876} {"train_loss": -22.990995407104492, "global_step": 155711, "epoch": 1876} {"train_loss": -23.088640213012695, "global_step": 155712, "epoch": 1876} {"train_loss": -22.911542892456055, "global_step": 155713, "epoch": 1876} {"train_loss": -23.462228775024414, "global_step": 155714, "epoch": 1876} {"train_loss": -23.213666915893555, "global_step": 155715, "epoch": 1876} {"train_loss": -22.99384880065918, "global_step": 155716, "epoch": 1876} {"train_loss": -22.96651268005371, "global_step": 155717, "epoch": 1876} {"train_loss": -23.380552291870117, "global_step": 155718, "epoch": 1876} {"train_loss": -23.07686424255371, "global_step": 155719, "epoch": 1876} {"train_loss": -23.156347274780273, "global_step": 155720, "epoch": 1876} {"train_loss": -23.69843101501465, "global_step": 155721, "epoch": 1876} {"train_loss": -23.28143882751465, "global_step": 155722, "epoch": 1876} {"train_loss": -23.36090660095215, "global_step": 155723, "epoch": 1876} {"train_loss": -23.372068405151367, "global_step": 155724, "epoch": 1876} {"train_loss": -23.331575393676758, "global_step": 155725, "epoch": 1876} {"train_loss": -23.29353141784668, "global_step": 155726, "epoch": 1876} {"train_loss": -23.286537170410156, "global_step": 155727, "epoch": 1876} {"train_loss": -23.473880767822266, "global_step": 155728, "epoch": 1876} {"train_loss": -23.093088150024414, "global_step": 155729, "epoch": 1876} {"train_loss": -23.55134391784668, "global_step": 155730, "epoch": 1876} {"train_loss": -23.639026641845703, "global_step": 155731, "epoch": 1876} {"train_loss": -23.295495986938477, "global_step": 155732, "epoch": 1876} {"train_loss": -23.344064712524414, "global_step": 155733, "epoch": 1876} {"train_loss": -23.48781394958496, "global_step": 155734, "epoch": 1876} {"train_loss": -23.51112937927246, "global_step": 155735, "epoch": 1876} {"train_loss": -23.43934440612793, "global_step": 155736, "epoch": 1876} {"train_loss": -23.670867919921875, "global_step": 155737, "epoch": 1876} {"train_loss": -23.403017044067383, "global_step": 155738, "epoch": 1876} {"train_loss": -23.22081756591797, "global_step": 155739, "epoch": 1876} {"train_loss": -23.697906494140625, "global_step": 155740, "epoch": 1876} {"train_loss": -23.35552406311035, "global_step": 155741, "epoch": 1876} {"train_loss": -22.745763778686523, "global_step": 155742, "epoch": 1876} {"train_loss": -23.12989616394043, "global_step": 155743, "epoch": 1876} {"train_loss": -22.775848388671875, "global_step": 155744, "epoch": 1876} {"train_loss": -23.392091751098633, "global_step": 155745, "epoch": 1876} {"train_loss": -23.47737693786621, "global_step": 155746, "epoch": 1876} {"train_loss": -23.237918853759766, "global_step": 155747, "epoch": 1876} {"train_loss": -23.161670684814453, "global_step": 155748, "epoch": 1876} {"train_loss": -22.97416114807129, "global_step": 155749, "epoch": 1876} {"train_loss": -23.234466552734375, "global_step": 155750, "epoch": 1876} {"train_loss": -23.684680938720703, "global_step": 155751, "epoch": 1876} {"train_loss": -23.12283706665039, "global_step": 155752, "epoch": 1876} {"train_loss": -23.719804763793945, "global_step": 155753, "epoch": 1876} {"train_loss": -23.364492416381836, "global_step": 155754, "epoch": 1876} {"train_loss": -23.27833366394043, "global_step": 155755, "epoch": 1876} {"train_loss": -23.3310489654541, "global_step": 155756, "epoch": 1876} {"train_loss": -23.439077377319336, "global_step": 155757, "epoch": 1876} {"train_loss": -23.678255081176758, "global_step": 155758, "epoch": 1876} {"train_loss": -23.417552947998047, "global_step": 155759, "epoch": 1876} {"train_loss": -23.376829147338867, "global_step": 155760, "epoch": 1876} {"train_loss": -23.48040771484375, "global_step": 155761, "epoch": 1876} {"train_loss": -23.5393123626709, "global_step": 155762, "epoch": 1876} {"train_loss": -23.6755313873291, "global_step": 155763, "epoch": 1876} {"train_loss": -23.698888778686523, "global_step": 155764, "epoch": 1876} {"train_loss": -23.591655731201172, "global_step": 155765, "epoch": 1876} {"train_loss": -23.42280387878418, "global_step": 155766, "epoch": 1876} {"train_loss": -23.362436294555664, "global_step": 155767, "epoch": 1876} {"train_loss": -23.09491539001465, "global_step": 155768, "epoch": 1876} {"train_loss": -23.62644386291504, "global_step": 155769, "epoch": 1876} {"train_loss": -23.072193145751953, "global_step": 155770, "epoch": 1876} {"train_loss": -23.380752563476562, "global_step": 155771, "epoch": 1876} {"train_loss": -23.596132278442383, "global_step": 155772, "epoch": 1876} {"train_loss": -23.371017456054688, "global_step": 155773, "epoch": 1876} {"train_loss": -23.408523559570312, "global_step": 155774, "epoch": 1876} {"train_loss": -23.444543838500977, "global_step": 155775, "epoch": 1876} {"train_loss": -23.513931274414062, "global_step": 155776, "epoch": 1876} {"train_loss": -23.30470848083496, "global_step": 155777, "epoch": 1876} {"train_loss": -23.164630889892578, "global_step": 155778, "epoch": 1876} {"train_loss": -23.4222469329834, "global_step": 155779, "epoch": 1876} {"train_loss": -23.513181686401367, "global_step": 155780, "epoch": 1876} {"train_loss": -23.72584342956543, "global_step": 155781, "epoch": 1876} {"train_loss": -22.996957778930664, "global_step": 155782, "epoch": 1876} {"train_loss": -23.58867835998535, "global_step": 155783, "epoch": 1876} {"train_loss": -23.076963424682617, "global_step": 155784, "epoch": 1876} {"train_loss": -23.344350814819336, "global_step": 155785, "epoch": 1876} {"train_loss": -23.391233444213867, "global_step": 155786, "epoch": 1876} {"train_loss": -23.568655014038086, "global_step": 155787, "epoch": 1876} {"train_loss": -23.577056884765625, "global_step": 155788, "epoch": 1876} {"train_loss": -23.5109806060791, "global_step": 155789, "epoch": 1876} {"train_loss": -23.368789236229585, "global_step": 155790, "epoch": 1876, "val_loss": 6272648.0} {"train_loss": -23.390277862548828, "global_step": 155791, "epoch": 1877} {"train_loss": -23.65358543395996, "global_step": 155792, "epoch": 1877} {"train_loss": -22.986848831176758, "global_step": 155793, "epoch": 1877} {"train_loss": -23.192415237426758, "global_step": 155794, "epoch": 1877} {"train_loss": -23.407955169677734, "global_step": 155795, "epoch": 1877} {"train_loss": -23.00183868408203, "global_step": 155796, "epoch": 1877} {"train_loss": -22.916746139526367, "global_step": 155797, "epoch": 1877} {"train_loss": -23.034805297851562, "global_step": 155798, "epoch": 1877} {"train_loss": -23.09474754333496, "global_step": 155799, "epoch": 1877} {"train_loss": -23.68863296508789, "global_step": 155800, "epoch": 1877} {"train_loss": -23.673391342163086, "global_step": 155801, "epoch": 1877} {"train_loss": -23.247838973999023, "global_step": 155802, "epoch": 1877} {"train_loss": -23.29224395751953, "global_step": 155803, "epoch": 1877} {"train_loss": -23.63456916809082, "global_step": 155804, "epoch": 1877} {"train_loss": -23.49078941345215, "global_step": 155805, "epoch": 1877} {"train_loss": -23.065719604492188, "global_step": 155806, "epoch": 1877} {"train_loss": -23.66155433654785, "global_step": 155807, "epoch": 1877} {"train_loss": -23.17892837524414, "global_step": 155808, "epoch": 1877} {"train_loss": -23.336986541748047, "global_step": 155809, "epoch": 1877} {"train_loss": -23.482559204101562, "global_step": 155810, "epoch": 1877} {"train_loss": -23.39525604248047, "global_step": 155811, "epoch": 1877} {"train_loss": -23.903196334838867, "global_step": 155812, "epoch": 1877} {"train_loss": -23.664505004882812, "global_step": 155813, "epoch": 1877} {"train_loss": -23.18724250793457, "global_step": 155814, "epoch": 1877} {"train_loss": -23.35144805908203, "global_step": 155815, "epoch": 1877} {"train_loss": -23.624948501586914, "global_step": 155816, "epoch": 1877} {"train_loss": -23.867191314697266, "global_step": 155817, "epoch": 1877} {"train_loss": -23.52651023864746, "global_step": 155818, "epoch": 1877} {"train_loss": -23.381994247436523, "global_step": 155819, "epoch": 1877} {"train_loss": -23.355485916137695, "global_step": 155820, "epoch": 1877} {"train_loss": -23.632009506225586, "global_step": 155821, "epoch": 1877} {"train_loss": -23.489477157592773, "global_step": 155822, "epoch": 1877} {"train_loss": -23.68966293334961, "global_step": 155823, "epoch": 1877} {"train_loss": -23.599546432495117, "global_step": 155824, "epoch": 1877} {"train_loss": -23.52046775817871, "global_step": 155825, "epoch": 1877} {"train_loss": -23.43192481994629, "global_step": 155826, "epoch": 1877} {"train_loss": -23.7150821685791, "global_step": 155827, "epoch": 1877} {"train_loss": -23.333759307861328, "global_step": 155828, "epoch": 1877} {"train_loss": -23.586631774902344, "global_step": 155829, "epoch": 1877} {"train_loss": -23.2432861328125, "global_step": 155830, "epoch": 1877} {"train_loss": -23.31938362121582, "global_step": 155831, "epoch": 1877} {"train_loss": -23.515111923217773, "global_step": 155832, "epoch": 1877} {"train_loss": -23.523759841918945, "global_step": 155833, "epoch": 1877} {"train_loss": -23.356136322021484, "global_step": 155834, "epoch": 1877} {"train_loss": -23.631284713745117, "global_step": 155835, "epoch": 1877} {"train_loss": -23.337949752807617, "global_step": 155836, "epoch": 1877} {"train_loss": -23.313901901245117, "global_step": 155837, "epoch": 1877} {"train_loss": -23.366897583007812, "global_step": 155838, "epoch": 1877} {"train_loss": -23.088882446289062, "global_step": 155839, "epoch": 1877} {"train_loss": -23.129980087280273, "global_step": 155840, "epoch": 1877} {"train_loss": -23.067195892333984, "global_step": 155841, "epoch": 1877} {"train_loss": -22.980527877807617, "global_step": 155842, "epoch": 1877} {"train_loss": -23.11818504333496, "global_step": 155843, "epoch": 1877} {"train_loss": -23.41962242126465, "global_step": 155844, "epoch": 1877} {"train_loss": -23.305505752563477, "global_step": 155845, "epoch": 1877} {"train_loss": -23.267383575439453, "global_step": 155846, "epoch": 1877} {"train_loss": -23.18599510192871, "global_step": 155847, "epoch": 1877} {"train_loss": -23.42015266418457, "global_step": 155848, "epoch": 1877} {"train_loss": -23.240676879882812, "global_step": 155849, "epoch": 1877} {"train_loss": -23.43134880065918, "global_step": 155850, "epoch": 1877} {"train_loss": -23.586673736572266, "global_step": 155851, "epoch": 1877} {"train_loss": -23.273473739624023, "global_step": 155852, "epoch": 1877} {"train_loss": -23.803319931030273, "global_step": 155853, "epoch": 1877} {"train_loss": -23.402406692504883, "global_step": 155854, "epoch": 1877} {"train_loss": -23.639944076538086, "global_step": 155855, "epoch": 1877} {"train_loss": -23.038524627685547, "global_step": 155856, "epoch": 1877} {"train_loss": -23.324573516845703, "global_step": 155857, "epoch": 1877} {"train_loss": -23.653600692749023, "global_step": 155858, "epoch": 1877} {"train_loss": -23.40635108947754, "global_step": 155859, "epoch": 1877} {"train_loss": -23.60939598083496, "global_step": 155860, "epoch": 1877} {"train_loss": -23.005142211914062, "global_step": 155861, "epoch": 1877} {"train_loss": -23.637767791748047, "global_step": 155862, "epoch": 1877} {"train_loss": -23.34548568725586, "global_step": 155863, "epoch": 1877} {"train_loss": -23.601093292236328, "global_step": 155864, "epoch": 1877} {"train_loss": -23.14694595336914, "global_step": 155865, "epoch": 1877} {"train_loss": -23.587125778198242, "global_step": 155866, "epoch": 1877} {"train_loss": -23.653165817260742, "global_step": 155867, "epoch": 1877} {"train_loss": -23.491971969604492, "global_step": 155868, "epoch": 1877} {"train_loss": -23.2602481842041, "global_step": 155869, "epoch": 1877} {"train_loss": -23.557479858398438, "global_step": 155870, "epoch": 1877} {"train_loss": -23.55605125427246, "global_step": 155871, "epoch": 1877} {"train_loss": -23.275455474853516, "global_step": 155872, "epoch": 1877} {"train_loss": -23.409629660916615, "global_step": 155873, "epoch": 1877, "val_loss": 6271469.0} {"train_loss": -23.072072982788086, "global_step": 155874, "epoch": 1878} {"train_loss": -22.910720825195312, "global_step": 155875, "epoch": 1878} {"train_loss": -23.30982780456543, "global_step": 155876, "epoch": 1878} {"train_loss": -22.918310165405273, "global_step": 155877, "epoch": 1878} {"train_loss": -22.743684768676758, "global_step": 155878, "epoch": 1878} {"train_loss": -23.15501594543457, "global_step": 155879, "epoch": 1878} {"train_loss": -23.02333641052246, "global_step": 155880, "epoch": 1878} {"train_loss": -22.912689208984375, "global_step": 155881, "epoch": 1878} {"train_loss": -23.060333251953125, "global_step": 155882, "epoch": 1878} {"train_loss": -22.9744930267334, "global_step": 155883, "epoch": 1878} {"train_loss": -23.414600372314453, "global_step": 155884, "epoch": 1878} {"train_loss": -23.39021873474121, "global_step": 155885, "epoch": 1878} {"train_loss": -22.934471130371094, "global_step": 155886, "epoch": 1878} {"train_loss": -22.89826011657715, "global_step": 155887, "epoch": 1878} {"train_loss": -23.626131057739258, "global_step": 155888, "epoch": 1878} {"train_loss": -23.279987335205078, "global_step": 155889, "epoch": 1878} {"train_loss": -23.341169357299805, "global_step": 155890, "epoch": 1878} {"train_loss": -23.27018165588379, "global_step": 155891, "epoch": 1878} {"train_loss": -23.52642822265625, "global_step": 155892, "epoch": 1878} {"train_loss": -23.4212589263916, "global_step": 155893, "epoch": 1878} {"train_loss": -23.5274658203125, "global_step": 155894, "epoch": 1878} {"train_loss": -23.087387084960938, "global_step": 155895, "epoch": 1878} {"train_loss": -23.447690963745117, "global_step": 155896, "epoch": 1878} {"train_loss": -23.268630981445312, "global_step": 155897, "epoch": 1878} {"train_loss": -23.149261474609375, "global_step": 155898, "epoch": 1878} {"train_loss": -23.278316497802734, "global_step": 155899, "epoch": 1878} {"train_loss": -23.119163513183594, "global_step": 155900, "epoch": 1878} {"train_loss": -23.52113914489746, "global_step": 155901, "epoch": 1878} {"train_loss": -23.471769332885742, "global_step": 155902, "epoch": 1878} {"train_loss": -23.456069946289062, "global_step": 155903, "epoch": 1878} {"train_loss": -23.720542907714844, "global_step": 155904, "epoch": 1878} {"train_loss": -23.454816818237305, "global_step": 155905, "epoch": 1878} {"train_loss": -23.225574493408203, "global_step": 155906, "epoch": 1878} {"train_loss": -23.42386245727539, "global_step": 155907, "epoch": 1878} {"train_loss": -23.46440887451172, "global_step": 155908, "epoch": 1878} {"train_loss": -23.29188346862793, "global_step": 155909, "epoch": 1878} {"train_loss": -23.298967361450195, "global_step": 155910, "epoch": 1878} {"train_loss": -23.486616134643555, "global_step": 155911, "epoch": 1878} {"train_loss": -22.955257415771484, "global_step": 155912, "epoch": 1878} {"train_loss": -23.325063705444336, "global_step": 155913, "epoch": 1878} {"train_loss": -23.471111297607422, "global_step": 155914, "epoch": 1878} {"train_loss": -23.597705841064453, "global_step": 155915, "epoch": 1878} {"train_loss": -23.216917037963867, "global_step": 155916, "epoch": 1878} {"train_loss": -23.320646286010742, "global_step": 155917, "epoch": 1878} {"train_loss": -23.387239456176758, "global_step": 155918, "epoch": 1878} {"train_loss": -23.43505096435547, "global_step": 155919, "epoch": 1878} {"train_loss": -23.4827880859375, "global_step": 155920, "epoch": 1878} {"train_loss": -23.258636474609375, "global_step": 155921, "epoch": 1878} {"train_loss": -23.565000534057617, "global_step": 155922, "epoch": 1878} {"train_loss": -23.709827423095703, "global_step": 155923, "epoch": 1878} {"train_loss": -23.302778244018555, "global_step": 155924, "epoch": 1878} {"train_loss": -23.726842880249023, "global_step": 155925, "epoch": 1878} {"train_loss": -23.4309139251709, "global_step": 155926, "epoch": 1878} {"train_loss": -23.427488327026367, "global_step": 155927, "epoch": 1878} {"train_loss": -23.08669662475586, "global_step": 155928, "epoch": 1878} {"train_loss": -23.013620376586914, "global_step": 155929, "epoch": 1878} {"train_loss": -23.563390731811523, "global_step": 155930, "epoch": 1878} {"train_loss": -23.170513153076172, "global_step": 155931, "epoch": 1878} {"train_loss": -23.396923065185547, "global_step": 155932, "epoch": 1878} {"train_loss": -23.294706344604492, "global_step": 155933, "epoch": 1878} {"train_loss": -23.381229400634766, "global_step": 155934, "epoch": 1878} {"train_loss": -23.41358184814453, "global_step": 155935, "epoch": 1878} {"train_loss": -23.40752601623535, "global_step": 155936, "epoch": 1878} {"train_loss": -23.2268123626709, "global_step": 155937, "epoch": 1878} {"train_loss": -23.507455825805664, "global_step": 155938, "epoch": 1878} {"train_loss": -23.706817626953125, "global_step": 155939, "epoch": 1878} {"train_loss": -23.119308471679688, "global_step": 155940, "epoch": 1878} {"train_loss": -23.592334747314453, "global_step": 155941, "epoch": 1878} {"train_loss": -23.697019577026367, "global_step": 155942, "epoch": 1878} {"train_loss": -23.151845932006836, "global_step": 155943, "epoch": 1878} {"train_loss": -23.347076416015625, "global_step": 155944, "epoch": 1878} {"train_loss": -23.5400333404541, "global_step": 155945, "epoch": 1878} {"train_loss": -23.44168472290039, "global_step": 155946, "epoch": 1878} {"train_loss": -23.3942813873291, "global_step": 155947, "epoch": 1878} {"train_loss": -23.32128143310547, "global_step": 155948, "epoch": 1878} {"train_loss": -23.486661911010742, "global_step": 155949, "epoch": 1878} {"train_loss": -23.60574722290039, "global_step": 155950, "epoch": 1878} {"train_loss": -23.559892654418945, "global_step": 155951, "epoch": 1878} {"train_loss": -23.467695236206055, "global_step": 155952, "epoch": 1878} {"train_loss": -23.82582664489746, "global_step": 155953, "epoch": 1878} {"train_loss": -23.414051055908203, "global_step": 155954, "epoch": 1878} {"train_loss": -23.48048973083496, "global_step": 155955, "epoch": 1878} {"train_loss": -23.348002307386285, "global_step": 155956, "epoch": 1878, "val_loss": 6361512.0} {"train_loss": -22.890302658081055, "global_step": 155957, "epoch": 1879} {"train_loss": -22.828012466430664, "global_step": 155958, "epoch": 1879} {"train_loss": -23.21841049194336, "global_step": 155959, "epoch": 1879} {"train_loss": -23.18517303466797, "global_step": 155960, "epoch": 1879} {"train_loss": -23.03171730041504, "global_step": 155961, "epoch": 1879} {"train_loss": -23.02912712097168, "global_step": 155962, "epoch": 1879} {"train_loss": -23.107528686523438, "global_step": 155963, "epoch": 1879} {"train_loss": -22.930871963500977, "global_step": 155964, "epoch": 1879} {"train_loss": -23.45206069946289, "global_step": 155965, "epoch": 1879} {"train_loss": -23.287981033325195, "global_step": 155966, "epoch": 1879} {"train_loss": -23.354421615600586, "global_step": 155967, "epoch": 1879} {"train_loss": -23.031415939331055, "global_step": 155968, "epoch": 1879} {"train_loss": -23.273544311523438, "global_step": 155969, "epoch": 1879} {"train_loss": -23.12013816833496, "global_step": 155970, "epoch": 1879} {"train_loss": -23.33160972595215, "global_step": 155971, "epoch": 1879} {"train_loss": -23.18562889099121, "global_step": 155972, "epoch": 1879} {"train_loss": -23.557971954345703, "global_step": 155973, "epoch": 1879} {"train_loss": -23.324567794799805, "global_step": 155974, "epoch": 1879} {"train_loss": -23.387340545654297, "global_step": 155975, "epoch": 1879} {"train_loss": -23.39009666442871, "global_step": 155976, "epoch": 1879} {"train_loss": -23.337209701538086, "global_step": 155977, "epoch": 1879} {"train_loss": -23.59006118774414, "global_step": 155978, "epoch": 1879} {"train_loss": -23.475332260131836, "global_step": 155979, "epoch": 1879} {"train_loss": -23.339969635009766, "global_step": 155980, "epoch": 1879} {"train_loss": -23.40122413635254, "global_step": 155981, "epoch": 1879} {"train_loss": -23.453628540039062, "global_step": 155982, "epoch": 1879} {"train_loss": -23.41337776184082, "global_step": 155983, "epoch": 1879} {"train_loss": -23.596561431884766, "global_step": 155984, "epoch": 1879} {"train_loss": -23.57600975036621, "global_step": 155985, "epoch": 1879} {"train_loss": -23.059463500976562, "global_step": 155986, "epoch": 1879} {"train_loss": -23.59771156311035, "global_step": 155987, "epoch": 1879} {"train_loss": -23.24512481689453, "global_step": 155988, "epoch": 1879} {"train_loss": -23.3590145111084, "global_step": 155989, "epoch": 1879} {"train_loss": -23.34830665588379, "global_step": 155990, "epoch": 1879} {"train_loss": -23.391653060913086, "global_step": 155991, "epoch": 1879} {"train_loss": -23.47743034362793, "global_step": 155992, "epoch": 1879} {"train_loss": -22.924509048461914, "global_step": 155993, "epoch": 1879} {"train_loss": -23.320865631103516, "global_step": 155994, "epoch": 1879} {"train_loss": -23.42888832092285, "global_step": 155995, "epoch": 1879} {"train_loss": -23.35577964782715, "global_step": 155996, "epoch": 1879} {"train_loss": -23.42886734008789, "global_step": 155997, "epoch": 1879} {"train_loss": -23.48343276977539, "global_step": 155998, "epoch": 1879} {"train_loss": -23.046735763549805, "global_step": 155999, "epoch": 1879} {"train_loss": -23.673513412475586, "global_step": 156000, "epoch": 1879} {"train_loss": -23.81818389892578, "global_step": 156001, "epoch": 1879} {"train_loss": -23.23994255065918, "global_step": 156002, "epoch": 1879} {"train_loss": -23.25050163269043, "global_step": 156003, "epoch": 1879} {"train_loss": -23.082242965698242, "global_step": 156004, "epoch": 1879} {"train_loss": -23.32111167907715, "global_step": 156005, "epoch": 1879} {"train_loss": -23.344297409057617, "global_step": 156006, "epoch": 1879} {"train_loss": -23.607980728149414, "global_step": 156007, "epoch": 1879} {"train_loss": -23.39596939086914, "global_step": 156008, "epoch": 1879} {"train_loss": -23.615530014038086, "global_step": 156009, "epoch": 1879} {"train_loss": -22.94415855407715, "global_step": 156010, "epoch": 1879} {"train_loss": -23.4769287109375, "global_step": 156011, "epoch": 1879} {"train_loss": -23.300405502319336, "global_step": 156012, "epoch": 1879} {"train_loss": -23.18550682067871, "global_step": 156013, "epoch": 1879} {"train_loss": -23.331396102905273, "global_step": 156014, "epoch": 1879} {"train_loss": -23.453794479370117, "global_step": 156015, "epoch": 1879} {"train_loss": -23.834985733032227, "global_step": 156016, "epoch": 1879} {"train_loss": -23.577524185180664, "global_step": 156017, "epoch": 1879} {"train_loss": -23.168508529663086, "global_step": 156018, "epoch": 1879} {"train_loss": -23.535938262939453, "global_step": 156019, "epoch": 1879} {"train_loss": -22.91572380065918, "global_step": 156020, "epoch": 1879} {"train_loss": -23.53643798828125, "global_step": 156021, "epoch": 1879} {"train_loss": -23.58680534362793, "global_step": 156022, "epoch": 1879} {"train_loss": -23.86363410949707, "global_step": 156023, "epoch": 1879} {"train_loss": -23.636167526245117, "global_step": 156024, "epoch": 1879} {"train_loss": -23.318740844726562, "global_step": 156025, "epoch": 1879} {"train_loss": -23.578332901000977, "global_step": 156026, "epoch": 1879} {"train_loss": -23.814430236816406, "global_step": 156027, "epoch": 1879} {"train_loss": -23.526111602783203, "global_step": 156028, "epoch": 1879} {"train_loss": -23.36255645751953, "global_step": 156029, "epoch": 1879} {"train_loss": -23.51337242126465, "global_step": 156030, "epoch": 1879} {"train_loss": -23.9754695892334, "global_step": 156031, "epoch": 1879} {"train_loss": -23.483631134033203, "global_step": 156032, "epoch": 1879} {"train_loss": -23.42865562438965, "global_step": 156033, "epoch": 1879} {"train_loss": -23.81336784362793, "global_step": 156034, "epoch": 1879} {"train_loss": -23.92535972595215, "global_step": 156035, "epoch": 1879} {"train_loss": -23.788429260253906, "global_step": 156036, "epoch": 1879} {"train_loss": -23.07977294921875, "global_step": 156037, "epoch": 1879} {"train_loss": -23.56805992126465, "global_step": 156038, "epoch": 1879} {"train_loss": -23.382930525814196, "global_step": 156039, "epoch": 1879, "val_loss": 6376451.0} {"train_loss": -23.564123153686523, "global_step": 156040, "epoch": 1880} {"train_loss": -23.411121368408203, "global_step": 156041, "epoch": 1880} {"train_loss": -22.95127296447754, "global_step": 156042, "epoch": 1880} {"train_loss": -23.702768325805664, "global_step": 156043, "epoch": 1880} {"train_loss": -23.2072696685791, "global_step": 156044, "epoch": 1880} {"train_loss": -23.282312393188477, "global_step": 156045, "epoch": 1880} {"train_loss": -23.16953468322754, "global_step": 156046, "epoch": 1880} {"train_loss": -22.846899032592773, "global_step": 156047, "epoch": 1880} {"train_loss": -23.58632469177246, "global_step": 156048, "epoch": 1880} {"train_loss": -23.364843368530273, "global_step": 156049, "epoch": 1880} {"train_loss": -23.346548080444336, "global_step": 156050, "epoch": 1880} {"train_loss": -23.772216796875, "global_step": 156051, "epoch": 1880} {"train_loss": -23.459474563598633, "global_step": 156052, "epoch": 1880} {"train_loss": -23.118057250976562, "global_step": 156053, "epoch": 1880} {"train_loss": -23.596826553344727, "global_step": 156054, "epoch": 1880} {"train_loss": -23.18613052368164, "global_step": 156055, "epoch": 1880} {"train_loss": -23.392688751220703, "global_step": 156056, "epoch": 1880} {"train_loss": -23.199819564819336, "global_step": 156057, "epoch": 1880} {"train_loss": -23.498796463012695, "global_step": 156058, "epoch": 1880} {"train_loss": -23.32453727722168, "global_step": 156059, "epoch": 1880} {"train_loss": -23.658279418945312, "global_step": 156060, "epoch": 1880} {"train_loss": -23.469289779663086, "global_step": 156061, "epoch": 1880} {"train_loss": -23.068281173706055, "global_step": 156062, "epoch": 1880} {"train_loss": -23.378955841064453, "global_step": 156063, "epoch": 1880} {"train_loss": -23.708831787109375, "global_step": 156064, "epoch": 1880} {"train_loss": -23.18437957763672, "global_step": 156065, "epoch": 1880} {"train_loss": -22.74287223815918, "global_step": 156066, "epoch": 1880} {"train_loss": -23.717634201049805, "global_step": 156067, "epoch": 1880} {"train_loss": -23.232248306274414, "global_step": 156068, "epoch": 1880} {"train_loss": -22.957048416137695, "global_step": 156069, "epoch": 1880} {"train_loss": -22.934537887573242, "global_step": 156070, "epoch": 1880} {"train_loss": -23.317575454711914, "global_step": 156071, "epoch": 1880} {"train_loss": -23.457494735717773, "global_step": 156072, "epoch": 1880} {"train_loss": -23.274642944335938, "global_step": 156073, "epoch": 1880} {"train_loss": -23.606348037719727, "global_step": 156074, "epoch": 1880} {"train_loss": -23.5544490814209, "global_step": 156075, "epoch": 1880} {"train_loss": -23.77508544921875, "global_step": 156076, "epoch": 1880} {"train_loss": -23.528297424316406, "global_step": 156077, "epoch": 1880} {"train_loss": -23.195186614990234, "global_step": 156078, "epoch": 1880} {"train_loss": -23.57826042175293, "global_step": 156079, "epoch": 1880} {"train_loss": -23.425207138061523, "global_step": 156080, "epoch": 1880} {"train_loss": -23.41942024230957, "global_step": 156081, "epoch": 1880} {"train_loss": -23.468093872070312, "global_step": 156082, "epoch": 1880} {"train_loss": -22.960416793823242, "global_step": 156083, "epoch": 1880} {"train_loss": -23.245466232299805, "global_step": 156084, "epoch": 1880} {"train_loss": -23.390933990478516, "global_step": 156085, "epoch": 1880} {"train_loss": -23.989267349243164, "global_step": 156086, "epoch": 1880} {"train_loss": -23.388639450073242, "global_step": 156087, "epoch": 1880} {"train_loss": -23.702917098999023, "global_step": 156088, "epoch": 1880} {"train_loss": -23.5107479095459, "global_step": 156089, "epoch": 1880} {"train_loss": -23.384809494018555, "global_step": 156090, "epoch": 1880} {"train_loss": -23.595561981201172, "global_step": 156091, "epoch": 1880} {"train_loss": -23.55350112915039, "global_step": 156092, "epoch": 1880} {"train_loss": -23.368030548095703, "global_step": 156093, "epoch": 1880} {"train_loss": -23.603727340698242, "global_step": 156094, "epoch": 1880} {"train_loss": -23.499618530273438, "global_step": 156095, "epoch": 1880} {"train_loss": -23.274372100830078, "global_step": 156096, "epoch": 1880} {"train_loss": -23.2231502532959, "global_step": 156097, "epoch": 1880} {"train_loss": -23.408166885375977, "global_step": 156098, "epoch": 1880} {"train_loss": -23.897682189941406, "global_step": 156099, "epoch": 1880} {"train_loss": -23.356040954589844, "global_step": 156100, "epoch": 1880} {"train_loss": -23.468713760375977, "global_step": 156101, "epoch": 1880} {"train_loss": -23.528850555419922, "global_step": 156102, "epoch": 1880} {"train_loss": -23.56001853942871, "global_step": 156103, "epoch": 1880} {"train_loss": -23.101247787475586, "global_step": 156104, "epoch": 1880} {"train_loss": -23.010055541992188, "global_step": 156105, "epoch": 1880} {"train_loss": -23.303802490234375, "global_step": 156106, "epoch": 1880} {"train_loss": -23.701330184936523, "global_step": 156107, "epoch": 1880} {"train_loss": -23.692096710205078, "global_step": 156108, "epoch": 1880} {"train_loss": -23.339340209960938, "global_step": 156109, "epoch": 1880} {"train_loss": -23.282119750976562, "global_step": 156110, "epoch": 1880} {"train_loss": -23.369497299194336, "global_step": 156111, "epoch": 1880} {"train_loss": -23.312393188476562, "global_step": 156112, "epoch": 1880} {"train_loss": -23.27711296081543, "global_step": 156113, "epoch": 1880} {"train_loss": -23.27956771850586, "global_step": 156114, "epoch": 1880} {"train_loss": -23.39876937866211, "global_step": 156115, "epoch": 1880} {"train_loss": -23.315160751342773, "global_step": 156116, "epoch": 1880} {"train_loss": -23.451581954956055, "global_step": 156117, "epoch": 1880} {"train_loss": -23.84425926208496, "global_step": 156118, "epoch": 1880} {"train_loss": -23.51130485534668, "global_step": 156119, "epoch": 1880} {"train_loss": -23.84943199157715, "global_step": 156120, "epoch": 1880} {"train_loss": -23.037588119506836, "global_step": 156121, "epoch": 1880} {"train_loss": -23.371978484004376, "global_step": 156122, "epoch": 1880, "val_loss": 6390516.0} {"train_loss": -23.54741859436035, "global_step": 156123, "epoch": 1881} {"train_loss": -22.391693115234375, "global_step": 156124, "epoch": 1881} {"train_loss": -23.221826553344727, "global_step": 156125, "epoch": 1881} {"train_loss": -22.95741081237793, "global_step": 156126, "epoch": 1881} {"train_loss": -23.015323638916016, "global_step": 156127, "epoch": 1881} {"train_loss": -23.14166831970215, "global_step": 156128, "epoch": 1881} {"train_loss": -23.072599411010742, "global_step": 156129, "epoch": 1881} {"train_loss": -23.244354248046875, "global_step": 156130, "epoch": 1881} {"train_loss": -22.833744049072266, "global_step": 156131, "epoch": 1881} {"train_loss": -23.188953399658203, "global_step": 156132, "epoch": 1881} {"train_loss": -23.32529640197754, "global_step": 156133, "epoch": 1881} {"train_loss": -23.266387939453125, "global_step": 156134, "epoch": 1881} {"train_loss": -23.119266510009766, "global_step": 156135, "epoch": 1881} {"train_loss": -23.028242111206055, "global_step": 156136, "epoch": 1881} {"train_loss": -23.362730026245117, "global_step": 156137, "epoch": 1881} {"train_loss": -23.3563289642334, "global_step": 156138, "epoch": 1881} {"train_loss": -23.070262908935547, "global_step": 156139, "epoch": 1881} {"train_loss": -23.145004272460938, "global_step": 156140, "epoch": 1881} {"train_loss": -23.186111450195312, "global_step": 156141, "epoch": 1881} {"train_loss": -22.921804428100586, "global_step": 156142, "epoch": 1881} {"train_loss": -23.371915817260742, "global_step": 156143, "epoch": 1881} {"train_loss": -23.929718017578125, "global_step": 156144, "epoch": 1881} {"train_loss": -23.608057022094727, "global_step": 156145, "epoch": 1881} {"train_loss": -23.23248291015625, "global_step": 156146, "epoch": 1881} {"train_loss": -23.314346313476562, "global_step": 156147, "epoch": 1881} {"train_loss": -23.443490982055664, "global_step": 156148, "epoch": 1881} {"train_loss": -23.426956176757812, "global_step": 156149, "epoch": 1881} {"train_loss": -23.58477783203125, "global_step": 156150, "epoch": 1881} {"train_loss": -23.29598045349121, "global_step": 156151, "epoch": 1881} {"train_loss": -23.547941207885742, "global_step": 156152, "epoch": 1881} {"train_loss": -23.716846466064453, "global_step": 156153, "epoch": 1881} {"train_loss": -23.298124313354492, "global_step": 156154, "epoch": 1881} {"train_loss": -23.165193557739258, "global_step": 156155, "epoch": 1881} {"train_loss": -23.316659927368164, "global_step": 156156, "epoch": 1881} {"train_loss": -23.51362419128418, "global_step": 156157, "epoch": 1881} {"train_loss": -23.49777603149414, "global_step": 156158, "epoch": 1881} {"train_loss": -23.135971069335938, "global_step": 156159, "epoch": 1881} {"train_loss": -23.36332130432129, "global_step": 156160, "epoch": 1881} {"train_loss": -23.50139045715332, "global_step": 156161, "epoch": 1881} {"train_loss": -23.699146270751953, "global_step": 156162, "epoch": 1881} {"train_loss": -23.128639221191406, "global_step": 156163, "epoch": 1881} {"train_loss": -23.349023818969727, "global_step": 156164, "epoch": 1881} {"train_loss": -23.58240509033203, "global_step": 156165, "epoch": 1881} {"train_loss": -23.366880416870117, "global_step": 156166, "epoch": 1881} {"train_loss": -23.29091453552246, "global_step": 156167, "epoch": 1881} {"train_loss": -23.20320701599121, "global_step": 156168, "epoch": 1881} {"train_loss": -23.256397247314453, "global_step": 156169, "epoch": 1881} {"train_loss": -23.36412239074707, "global_step": 156170, "epoch": 1881} {"train_loss": -23.569385528564453, "global_step": 156171, "epoch": 1881} {"train_loss": -23.585363388061523, "global_step": 156172, "epoch": 1881} {"train_loss": -22.967086791992188, "global_step": 156173, "epoch": 1881} {"train_loss": -23.447084426879883, "global_step": 156174, "epoch": 1881} {"train_loss": -23.380897521972656, "global_step": 156175, "epoch": 1881} {"train_loss": -23.289594650268555, "global_step": 156176, "epoch": 1881} {"train_loss": -23.422000885009766, "global_step": 156177, "epoch": 1881} {"train_loss": -23.662893295288086, "global_step": 156178, "epoch": 1881} {"train_loss": -23.490629196166992, "global_step": 156179, "epoch": 1881} {"train_loss": -23.692106246948242, "global_step": 156180, "epoch": 1881} {"train_loss": -23.334980010986328, "global_step": 156181, "epoch": 1881} {"train_loss": -23.18306541442871, "global_step": 156182, "epoch": 1881} {"train_loss": -23.64032554626465, "global_step": 156183, "epoch": 1881} {"train_loss": -23.322147369384766, "global_step": 156184, "epoch": 1881} {"train_loss": -22.915096282958984, "global_step": 156185, "epoch": 1881} {"train_loss": -23.11479949951172, "global_step": 156186, "epoch": 1881} {"train_loss": -23.640775680541992, "global_step": 156187, "epoch": 1881} {"train_loss": -23.268247604370117, "global_step": 156188, "epoch": 1881} {"train_loss": -23.44428253173828, "global_step": 156189, "epoch": 1881} {"train_loss": -23.00518226623535, "global_step": 156190, "epoch": 1881} {"train_loss": -23.29249382019043, "global_step": 156191, "epoch": 1881} {"train_loss": -23.578367233276367, "global_step": 156192, "epoch": 1881} {"train_loss": -23.82343101501465, "global_step": 156193, "epoch": 1881} {"train_loss": -23.12114906311035, "global_step": 156194, "epoch": 1881} {"train_loss": -23.57606315612793, "global_step": 156195, "epoch": 1881} {"train_loss": -23.574689865112305, "global_step": 156196, "epoch": 1881} {"train_loss": -23.64521598815918, "global_step": 156197, "epoch": 1881} {"train_loss": -23.30328369140625, "global_step": 156198, "epoch": 1881} {"train_loss": -23.103404998779297, "global_step": 156199, "epoch": 1881} {"train_loss": -23.443397521972656, "global_step": 156200, "epoch": 1881} {"train_loss": -23.486059188842773, "global_step": 156201, "epoch": 1881} {"train_loss": -23.75974464416504, "global_step": 156202, "epoch": 1881} {"train_loss": -23.84505271911621, "global_step": 156203, "epoch": 1881} {"train_loss": -23.324745178222656, "global_step": 156204, "epoch": 1881} {"train_loss": -23.32555534178952, "global_step": 156205, "epoch": 1881, "val_loss": 6358943.0} {"train_loss": -22.41377067565918, "global_step": 156206, "epoch": 1882} {"train_loss": -23.169513702392578, "global_step": 156207, "epoch": 1882} {"train_loss": -21.742368698120117, "global_step": 156208, "epoch": 1882} {"train_loss": -22.553485870361328, "global_step": 156209, "epoch": 1882} {"train_loss": -22.634950637817383, "global_step": 156210, "epoch": 1882} {"train_loss": -22.715009689331055, "global_step": 156211, "epoch": 1882} {"train_loss": -22.548288345336914, "global_step": 156212, "epoch": 1882} {"train_loss": -22.84505844116211, "global_step": 156213, "epoch": 1882} {"train_loss": -22.38132095336914, "global_step": 156214, "epoch": 1882} {"train_loss": -23.046762466430664, "global_step": 156215, "epoch": 1882} {"train_loss": -22.47919273376465, "global_step": 156216, "epoch": 1882} {"train_loss": -22.847274780273438, "global_step": 156217, "epoch": 1882} {"train_loss": -22.83639907836914, "global_step": 156218, "epoch": 1882} {"train_loss": -23.190359115600586, "global_step": 156219, "epoch": 1882} {"train_loss": -22.787288665771484, "global_step": 156220, "epoch": 1882} {"train_loss": -23.222257614135742, "global_step": 156221, "epoch": 1882} {"train_loss": -23.54976463317871, "global_step": 156222, "epoch": 1882} {"train_loss": -22.827564239501953, "global_step": 156223, "epoch": 1882} {"train_loss": -23.216636657714844, "global_step": 156224, "epoch": 1882} {"train_loss": -23.35218620300293, "global_step": 156225, "epoch": 1882} {"train_loss": -22.901519775390625, "global_step": 156226, "epoch": 1882} {"train_loss": -22.718942642211914, "global_step": 156227, "epoch": 1882} {"train_loss": -23.32293128967285, "global_step": 156228, "epoch": 1882} {"train_loss": -23.231779098510742, "global_step": 156229, "epoch": 1882} {"train_loss": -22.97040367126465, "global_step": 156230, "epoch": 1882} {"train_loss": -23.00006675720215, "global_step": 156231, "epoch": 1882} {"train_loss": -23.317237854003906, "global_step": 156232, "epoch": 1882} {"train_loss": -23.234487533569336, "global_step": 156233, "epoch": 1882} {"train_loss": -23.43982696533203, "global_step": 156234, "epoch": 1882} {"train_loss": -23.459117889404297, "global_step": 156235, "epoch": 1882} {"train_loss": -23.37203598022461, "global_step": 156236, "epoch": 1882} {"train_loss": -23.29420280456543, "global_step": 156237, "epoch": 1882} {"train_loss": -23.179420471191406, "global_step": 156238, "epoch": 1882} {"train_loss": -23.26736068725586, "global_step": 156239, "epoch": 1882} {"train_loss": -23.112579345703125, "global_step": 156240, "epoch": 1882} {"train_loss": -23.45197105407715, "global_step": 156241, "epoch": 1882} {"train_loss": -23.510873794555664, "global_step": 156242, "epoch": 1882} {"train_loss": -23.32461166381836, "global_step": 156243, "epoch": 1882} {"train_loss": -23.165403366088867, "global_step": 156244, "epoch": 1882} {"train_loss": -23.455957412719727, "global_step": 156245, "epoch": 1882} {"train_loss": -23.402585983276367, "global_step": 156246, "epoch": 1882} {"train_loss": -23.19684600830078, "global_step": 156247, "epoch": 1882} {"train_loss": -23.640371322631836, "global_step": 156248, "epoch": 1882} {"train_loss": -23.560964584350586, "global_step": 156249, "epoch": 1882} {"train_loss": -23.572858810424805, "global_step": 156250, "epoch": 1882} {"train_loss": -23.351184844970703, "global_step": 156251, "epoch": 1882} {"train_loss": -23.61768913269043, "global_step": 156252, "epoch": 1882} {"train_loss": -23.253679275512695, "global_step": 156253, "epoch": 1882} {"train_loss": -23.402740478515625, "global_step": 156254, "epoch": 1882} {"train_loss": -23.690338134765625, "global_step": 156255, "epoch": 1882} {"train_loss": -23.661842346191406, "global_step": 156256, "epoch": 1882} {"train_loss": -23.50313949584961, "global_step": 156257, "epoch": 1882} {"train_loss": -23.4128360748291, "global_step": 156258, "epoch": 1882} {"train_loss": -23.585630416870117, "global_step": 156259, "epoch": 1882} {"train_loss": -23.538288116455078, "global_step": 156260, "epoch": 1882} {"train_loss": -23.22987174987793, "global_step": 156261, "epoch": 1882} {"train_loss": -23.68144989013672, "global_step": 156262, "epoch": 1882} {"train_loss": -23.21822166442871, "global_step": 156263, "epoch": 1882} {"train_loss": -23.5362491607666, "global_step": 156264, "epoch": 1882} {"train_loss": -23.57185173034668, "global_step": 156265, "epoch": 1882} {"train_loss": -23.413312911987305, "global_step": 156266, "epoch": 1882} {"train_loss": -23.428970336914062, "global_step": 156267, "epoch": 1882} {"train_loss": -23.377471923828125, "global_step": 156268, "epoch": 1882} {"train_loss": -23.3101806640625, "global_step": 156269, "epoch": 1882} {"train_loss": -23.545028686523438, "global_step": 156270, "epoch": 1882} {"train_loss": -23.423959732055664, "global_step": 156271, "epoch": 1882} {"train_loss": -23.677640914916992, "global_step": 156272, "epoch": 1882} {"train_loss": -23.399169921875, "global_step": 156273, "epoch": 1882} {"train_loss": -23.088144302368164, "global_step": 156274, "epoch": 1882} {"train_loss": -23.42304229736328, "global_step": 156275, "epoch": 1882} {"train_loss": -23.56591796875, "global_step": 156276, "epoch": 1882} {"train_loss": -23.556264877319336, "global_step": 156277, "epoch": 1882} {"train_loss": -23.698030471801758, "global_step": 156278, "epoch": 1882} {"train_loss": -23.505292892456055, "global_step": 156279, "epoch": 1882} {"train_loss": -23.844327926635742, "global_step": 156280, "epoch": 1882} {"train_loss": -23.728458404541016, "global_step": 156281, "epoch": 1882} {"train_loss": -23.453657150268555, "global_step": 156282, "epoch": 1882} {"train_loss": -23.632238388061523, "global_step": 156283, "epoch": 1882} {"train_loss": -23.336956024169922, "global_step": 156284, "epoch": 1882} {"train_loss": -23.55657958984375, "global_step": 156285, "epoch": 1882} {"train_loss": -23.438535690307617, "global_step": 156286, "epoch": 1882} {"train_loss": -23.66181755065918, "global_step": 156287, "epoch": 1882} {"train_loss": -23.276093977043427, "global_step": 156288, "epoch": 1882, "val_loss": 6418967.5} {"train_loss": -22.6606388092041, "global_step": 156289, "epoch": 1883} {"train_loss": -22.064687728881836, "global_step": 156290, "epoch": 1883} {"train_loss": -23.769468307495117, "global_step": 156291, "epoch": 1883} {"train_loss": -22.07480239868164, "global_step": 156292, "epoch": 1883} {"train_loss": -22.826618194580078, "global_step": 156293, "epoch": 1883} {"train_loss": -22.173809051513672, "global_step": 156294, "epoch": 1883} {"train_loss": -22.865150451660156, "global_step": 156295, "epoch": 1883} {"train_loss": -22.810270309448242, "global_step": 156296, "epoch": 1883} {"train_loss": -22.599288940429688, "global_step": 156297, "epoch": 1883} {"train_loss": -22.77783203125, "global_step": 156298, "epoch": 1883} {"train_loss": -23.180150985717773, "global_step": 156299, "epoch": 1883} {"train_loss": -22.925107955932617, "global_step": 156300, "epoch": 1883} {"train_loss": -22.744876861572266, "global_step": 156301, "epoch": 1883} {"train_loss": -23.00257110595703, "global_step": 156302, "epoch": 1883} {"train_loss": -23.301584243774414, "global_step": 156303, "epoch": 1883} {"train_loss": -23.23945426940918, "global_step": 156304, "epoch": 1883} {"train_loss": -23.137968063354492, "global_step": 156305, "epoch": 1883} {"train_loss": -22.99468994140625, "global_step": 156306, "epoch": 1883} {"train_loss": -23.140451431274414, "global_step": 156307, "epoch": 1883} {"train_loss": -23.169992446899414, "global_step": 156308, "epoch": 1883} {"train_loss": -23.445491790771484, "global_step": 156309, "epoch": 1883} {"train_loss": -23.274368286132812, "global_step": 156310, "epoch": 1883} {"train_loss": -23.2894229888916, "global_step": 156311, "epoch": 1883} {"train_loss": -23.235580444335938, "global_step": 156312, "epoch": 1883} {"train_loss": -23.263837814331055, "global_step": 156313, "epoch": 1883} {"train_loss": -23.254518508911133, "global_step": 156314, "epoch": 1883} {"train_loss": -23.09669303894043, "global_step": 156315, "epoch": 1883} {"train_loss": -23.349618911743164, "global_step": 156316, "epoch": 1883} {"train_loss": -23.188810348510742, "global_step": 156317, "epoch": 1883} {"train_loss": -23.233549118041992, "global_step": 156318, "epoch": 1883} {"train_loss": -23.10186195373535, "global_step": 156319, "epoch": 1883} {"train_loss": -23.693571090698242, "global_step": 156320, "epoch": 1883} {"train_loss": -23.28510093688965, "global_step": 156321, "epoch": 1883} {"train_loss": -23.618057250976562, "global_step": 156322, "epoch": 1883} {"train_loss": -23.605356216430664, "global_step": 156323, "epoch": 1883} {"train_loss": -23.225400924682617, "global_step": 156324, "epoch": 1883} {"train_loss": -23.533048629760742, "global_step": 156325, "epoch": 1883} {"train_loss": -23.1248722076416, "global_step": 156326, "epoch": 1883} {"train_loss": -23.194684982299805, "global_step": 156327, "epoch": 1883} {"train_loss": -23.302627563476562, "global_step": 156328, "epoch": 1883} {"train_loss": -23.416967391967773, "global_step": 156329, "epoch": 1883} {"train_loss": -23.30269432067871, "global_step": 156330, "epoch": 1883} {"train_loss": -23.286542892456055, "global_step": 156331, "epoch": 1883} {"train_loss": -23.420461654663086, "global_step": 156332, "epoch": 1883} {"train_loss": -23.421079635620117, "global_step": 156333, "epoch": 1883} {"train_loss": -23.75972557067871, "global_step": 156334, "epoch": 1883} {"train_loss": -23.750524520874023, "global_step": 156335, "epoch": 1883} {"train_loss": -23.696592330932617, "global_step": 156336, "epoch": 1883} {"train_loss": -23.773130416870117, "global_step": 156337, "epoch": 1883} {"train_loss": -23.395212173461914, "global_step": 156338, "epoch": 1883} {"train_loss": -23.05176544189453, "global_step": 156339, "epoch": 1883} {"train_loss": -23.30657386779785, "global_step": 156340, "epoch": 1883} {"train_loss": -23.493406295776367, "global_step": 156341, "epoch": 1883} {"train_loss": -23.537250518798828, "global_step": 156342, "epoch": 1883} {"train_loss": -23.55853843688965, "global_step": 156343, "epoch": 1883} {"train_loss": -23.379825592041016, "global_step": 156344, "epoch": 1883} {"train_loss": -23.698535919189453, "global_step": 156345, "epoch": 1883} {"train_loss": -23.52034568786621, "global_step": 156346, "epoch": 1883} {"train_loss": -23.4106502532959, "global_step": 156347, "epoch": 1883} {"train_loss": -23.482419967651367, "global_step": 156348, "epoch": 1883} {"train_loss": -23.571115493774414, "global_step": 156349, "epoch": 1883} {"train_loss": -23.36421775817871, "global_step": 156350, "epoch": 1883} {"train_loss": -23.372953414916992, "global_step": 156351, "epoch": 1883} {"train_loss": -23.661787033081055, "global_step": 156352, "epoch": 1883} {"train_loss": -23.426250457763672, "global_step": 156353, "epoch": 1883} {"train_loss": -23.02315330505371, "global_step": 156354, "epoch": 1883} {"train_loss": -23.584747314453125, "global_step": 156355, "epoch": 1883} {"train_loss": -23.594987869262695, "global_step": 156356, "epoch": 1883} {"train_loss": -23.559268951416016, "global_step": 156357, "epoch": 1883} {"train_loss": -23.2934627532959, "global_step": 156358, "epoch": 1883} {"train_loss": -23.47958755493164, "global_step": 156359, "epoch": 1883} {"train_loss": -23.75471305847168, "global_step": 156360, "epoch": 1883} {"train_loss": -23.440441131591797, "global_step": 156361, "epoch": 1883} {"train_loss": -23.773508071899414, "global_step": 156362, "epoch": 1883} {"train_loss": -23.54575538635254, "global_step": 156363, "epoch": 1883} {"train_loss": -23.57875633239746, "global_step": 156364, "epoch": 1883} {"train_loss": -23.407270431518555, "global_step": 156365, "epoch": 1883} {"train_loss": -23.948495864868164, "global_step": 156366, "epoch": 1883} {"train_loss": -23.7597713470459, "global_step": 156367, "epoch": 1883} {"train_loss": -23.82257652282715, "global_step": 156368, "epoch": 1883} {"train_loss": -23.462844848632812, "global_step": 156369, "epoch": 1883} {"train_loss": -23.902572631835938, "global_step": 156370, "epoch": 1883} {"train_loss": -23.329999418143768, "global_step": 156371, "epoch": 1883, "val_loss": 6329927.0} {"train_loss": -22.986328125, "global_step": 156372, "epoch": 1884} {"train_loss": -22.38258171081543, "global_step": 156373, "epoch": 1884} {"train_loss": -20.822986602783203, "global_step": 156374, "epoch": 1884} {"train_loss": -22.258588790893555, "global_step": 156375, "epoch": 1884} {"train_loss": -22.69088363647461, "global_step": 156376, "epoch": 1884} {"train_loss": -22.531335830688477, "global_step": 156377, "epoch": 1884} {"train_loss": -22.8370361328125, "global_step": 156378, "epoch": 1884} {"train_loss": -22.59058952331543, "global_step": 156379, "epoch": 1884} {"train_loss": -22.863569259643555, "global_step": 156380, "epoch": 1884} {"train_loss": -23.243335723876953, "global_step": 156381, "epoch": 1884} {"train_loss": -23.012104034423828, "global_step": 156382, "epoch": 1884} {"train_loss": -22.855297088623047, "global_step": 156383, "epoch": 1884} {"train_loss": -23.262144088745117, "global_step": 156384, "epoch": 1884} {"train_loss": -23.363632202148438, "global_step": 156385, "epoch": 1884} {"train_loss": -23.070497512817383, "global_step": 156386, "epoch": 1884} {"train_loss": -22.755483627319336, "global_step": 156387, "epoch": 1884} {"train_loss": -23.345062255859375, "global_step": 156388, "epoch": 1884} {"train_loss": -22.73006248474121, "global_step": 156389, "epoch": 1884} {"train_loss": -23.3365421295166, "global_step": 156390, "epoch": 1884} {"train_loss": -22.932727813720703, "global_step": 156391, "epoch": 1884} {"train_loss": -22.980117797851562, "global_step": 156392, "epoch": 1884} {"train_loss": -23.28360939025879, "global_step": 156393, "epoch": 1884} {"train_loss": -23.426193237304688, "global_step": 156394, "epoch": 1884} {"train_loss": -23.155803680419922, "global_step": 156395, "epoch": 1884} {"train_loss": -23.470800399780273, "global_step": 156396, "epoch": 1884} {"train_loss": -22.928083419799805, "global_step": 156397, "epoch": 1884} {"train_loss": -23.296161651611328, "global_step": 156398, "epoch": 1884} {"train_loss": -23.75992774963379, "global_step": 156399, "epoch": 1884} {"train_loss": -23.428462982177734, "global_step": 156400, "epoch": 1884} {"train_loss": -23.14866828918457, "global_step": 156401, "epoch": 1884} {"train_loss": -23.342771530151367, "global_step": 156402, "epoch": 1884} {"train_loss": -23.311391830444336, "global_step": 156403, "epoch": 1884} {"train_loss": -23.177967071533203, "global_step": 156404, "epoch": 1884} {"train_loss": -23.48358154296875, "global_step": 156405, "epoch": 1884} {"train_loss": -23.594711303710938, "global_step": 156406, "epoch": 1884} {"train_loss": -23.413650512695312, "global_step": 156407, "epoch": 1884} {"train_loss": -23.433046340942383, "global_step": 156408, "epoch": 1884} {"train_loss": -23.3890380859375, "global_step": 156409, "epoch": 1884} {"train_loss": -23.430517196655273, "global_step": 156410, "epoch": 1884} {"train_loss": -23.197912216186523, "global_step": 156411, "epoch": 1884} {"train_loss": -23.50284194946289, "global_step": 156412, "epoch": 1884} {"train_loss": -23.353384017944336, "global_step": 156413, "epoch": 1884} {"train_loss": -23.562318801879883, "global_step": 156414, "epoch": 1884} {"train_loss": -23.342470169067383, "global_step": 156415, "epoch": 1884} {"train_loss": -23.5382022857666, "global_step": 156416, "epoch": 1884} {"train_loss": -23.3324031829834, "global_step": 156417, "epoch": 1884} {"train_loss": -23.254554748535156, "global_step": 156418, "epoch": 1884} {"train_loss": -23.583267211914062, "global_step": 156419, "epoch": 1884} {"train_loss": -23.632389068603516, "global_step": 156420, "epoch": 1884} {"train_loss": -23.38300323486328, "global_step": 156421, "epoch": 1884} {"train_loss": -23.6157169342041, "global_step": 156422, "epoch": 1884} {"train_loss": -23.24281883239746, "global_step": 156423, "epoch": 1884} {"train_loss": -23.29298210144043, "global_step": 156424, "epoch": 1884} {"train_loss": -23.529268264770508, "global_step": 156425, "epoch": 1884} {"train_loss": -23.591842651367188, "global_step": 156426, "epoch": 1884} {"train_loss": -23.350679397583008, "global_step": 156427, "epoch": 1884} {"train_loss": -23.59702491760254, "global_step": 156428, "epoch": 1884} {"train_loss": -23.44908905029297, "global_step": 156429, "epoch": 1884} {"train_loss": -23.518665313720703, "global_step": 156430, "epoch": 1884} {"train_loss": -23.450441360473633, "global_step": 156431, "epoch": 1884} {"train_loss": -23.476505279541016, "global_step": 156432, "epoch": 1884} {"train_loss": -23.4240779876709, "global_step": 156433, "epoch": 1884} {"train_loss": -23.756149291992188, "global_step": 156434, "epoch": 1884} {"train_loss": -23.42094612121582, "global_step": 156435, "epoch": 1884} {"train_loss": -23.323896408081055, "global_step": 156436, "epoch": 1884} {"train_loss": -23.55376625061035, "global_step": 156437, "epoch": 1884} {"train_loss": -22.740009307861328, "global_step": 156438, "epoch": 1884} {"train_loss": -23.412015914916992, "global_step": 156439, "epoch": 1884} {"train_loss": -23.647172927856445, "global_step": 156440, "epoch": 1884} {"train_loss": -23.462373733520508, "global_step": 156441, "epoch": 1884} {"train_loss": -23.45417022705078, "global_step": 156442, "epoch": 1884} {"train_loss": -23.72516632080078, "global_step": 156443, "epoch": 1884} {"train_loss": -23.2708683013916, "global_step": 156444, "epoch": 1884} {"train_loss": -23.434879302978516, "global_step": 156445, "epoch": 1884} {"train_loss": -23.48317527770996, "global_step": 156446, "epoch": 1884} {"train_loss": -23.272436141967773, "global_step": 156447, "epoch": 1884} {"train_loss": -23.28476905822754, "global_step": 156448, "epoch": 1884} {"train_loss": -23.75771141052246, "global_step": 156449, "epoch": 1884} {"train_loss": -23.099885940551758, "global_step": 156450, "epoch": 1884} {"train_loss": -23.12239646911621, "global_step": 156451, "epoch": 1884} {"train_loss": -23.658071517944336, "global_step": 156452, "epoch": 1884} {"train_loss": -23.43294334411621, "global_step": 156453, "epoch": 1884} {"train_loss": -23.261178349874104, "global_step": 156454, "epoch": 1884, "val_loss": 6461779.0} {"train_loss": -22.88199234008789, "global_step": 156455, "epoch": 1885} {"train_loss": -22.983718872070312, "global_step": 156456, "epoch": 1885} {"train_loss": -23.08461570739746, "global_step": 156457, "epoch": 1885} {"train_loss": -22.412572860717773, "global_step": 156458, "epoch": 1885} {"train_loss": -22.806926727294922, "global_step": 156459, "epoch": 1885} {"train_loss": -22.93182945251465, "global_step": 156460, "epoch": 1885} {"train_loss": -22.84430503845215, "global_step": 156461, "epoch": 1885} {"train_loss": -23.073261260986328, "global_step": 156462, "epoch": 1885} {"train_loss": -23.134857177734375, "global_step": 156463, "epoch": 1885} {"train_loss": -23.129480361938477, "global_step": 156464, "epoch": 1885} {"train_loss": -22.94632911682129, "global_step": 156465, "epoch": 1885} {"train_loss": -23.117631912231445, "global_step": 156466, "epoch": 1885} {"train_loss": -23.169023513793945, "global_step": 156467, "epoch": 1885} {"train_loss": -23.138797760009766, "global_step": 156468, "epoch": 1885} {"train_loss": -23.0048828125, "global_step": 156469, "epoch": 1885} {"train_loss": -23.440567016601562, "global_step": 156470, "epoch": 1885} {"train_loss": -23.055044174194336, "global_step": 156471, "epoch": 1885} {"train_loss": -22.919559478759766, "global_step": 156472, "epoch": 1885} {"train_loss": -23.336252212524414, "global_step": 156473, "epoch": 1885} {"train_loss": -23.089509963989258, "global_step": 156474, "epoch": 1885} {"train_loss": -23.393712997436523, "global_step": 156475, "epoch": 1885} {"train_loss": -23.33164405822754, "global_step": 156476, "epoch": 1885} {"train_loss": -23.410261154174805, "global_step": 156477, "epoch": 1885} {"train_loss": -23.301605224609375, "global_step": 156478, "epoch": 1885} {"train_loss": -23.018789291381836, "global_step": 156479, "epoch": 1885} {"train_loss": -23.15534782409668, "global_step": 156480, "epoch": 1885} {"train_loss": -23.725814819335938, "global_step": 156481, "epoch": 1885} {"train_loss": -23.41063117980957, "global_step": 156482, "epoch": 1885} {"train_loss": -23.296396255493164, "global_step": 156483, "epoch": 1885} {"train_loss": -23.06539535522461, "global_step": 156484, "epoch": 1885} {"train_loss": -23.904552459716797, "global_step": 156485, "epoch": 1885} {"train_loss": -23.12116241455078, "global_step": 156486, "epoch": 1885} {"train_loss": -23.715063095092773, "global_step": 156487, "epoch": 1885} {"train_loss": -23.458524703979492, "global_step": 156488, "epoch": 1885} {"train_loss": -23.285079956054688, "global_step": 156489, "epoch": 1885} {"train_loss": -23.262113571166992, "global_step": 156490, "epoch": 1885} {"train_loss": -23.278427124023438, "global_step": 156491, "epoch": 1885} {"train_loss": -23.601747512817383, "global_step": 156492, "epoch": 1885} {"train_loss": -23.353696823120117, "global_step": 156493, "epoch": 1885} {"train_loss": -23.249013900756836, "global_step": 156494, "epoch": 1885} {"train_loss": -23.35457992553711, "global_step": 156495, "epoch": 1885} {"train_loss": -23.714750289916992, "global_step": 156496, "epoch": 1885} {"train_loss": -23.7720947265625, "global_step": 156497, "epoch": 1885} {"train_loss": -23.36734962463379, "global_step": 156498, "epoch": 1885} {"train_loss": -23.432279586791992, "global_step": 156499, "epoch": 1885} {"train_loss": -23.408971786499023, "global_step": 156500, "epoch": 1885} {"train_loss": -23.64335060119629, "global_step": 156501, "epoch": 1885} {"train_loss": -23.476789474487305, "global_step": 156502, "epoch": 1885} {"train_loss": -23.47015953063965, "global_step": 156503, "epoch": 1885} {"train_loss": -23.39699363708496, "global_step": 156504, "epoch": 1885} {"train_loss": -23.523706436157227, "global_step": 156505, "epoch": 1885} {"train_loss": -23.471811294555664, "global_step": 156506, "epoch": 1885} {"train_loss": -23.22336769104004, "global_step": 156507, "epoch": 1885} {"train_loss": -23.461523056030273, "global_step": 156508, "epoch": 1885} {"train_loss": -23.41876220703125, "global_step": 156509, "epoch": 1885} {"train_loss": -23.29524803161621, "global_step": 156510, "epoch": 1885} {"train_loss": -23.54839324951172, "global_step": 156511, "epoch": 1885} {"train_loss": -23.410173416137695, "global_step": 156512, "epoch": 1885} {"train_loss": -23.325056076049805, "global_step": 156513, "epoch": 1885} {"train_loss": -23.644716262817383, "global_step": 156514, "epoch": 1885} {"train_loss": -23.132444381713867, "global_step": 156515, "epoch": 1885} {"train_loss": -23.554584503173828, "global_step": 156516, "epoch": 1885} {"train_loss": -23.48712921142578, "global_step": 156517, "epoch": 1885} {"train_loss": -23.28208351135254, "global_step": 156518, "epoch": 1885} {"train_loss": -23.611791610717773, "global_step": 156519, "epoch": 1885} {"train_loss": -23.288009643554688, "global_step": 156520, "epoch": 1885} {"train_loss": -23.144994735717773, "global_step": 156521, "epoch": 1885} {"train_loss": -23.708520889282227, "global_step": 156522, "epoch": 1885} {"train_loss": -23.63233757019043, "global_step": 156523, "epoch": 1885} {"train_loss": -23.317115783691406, "global_step": 156524, "epoch": 1885} {"train_loss": -23.52621841430664, "global_step": 156525, "epoch": 1885} {"train_loss": -23.777639389038086, "global_step": 156526, "epoch": 1885} {"train_loss": -23.58350372314453, "global_step": 156527, "epoch": 1885} {"train_loss": -23.473432540893555, "global_step": 156528, "epoch": 1885} {"train_loss": -23.371198654174805, "global_step": 156529, "epoch": 1885} {"train_loss": -23.53672218322754, "global_step": 156530, "epoch": 1885} {"train_loss": -23.834524154663086, "global_step": 156531, "epoch": 1885} {"train_loss": -23.619810104370117, "global_step": 156532, "epoch": 1885} {"train_loss": -23.251720428466797, "global_step": 156533, "epoch": 1885} {"train_loss": -23.409748077392578, "global_step": 156534, "epoch": 1885} {"train_loss": -23.384794235229492, "global_step": 156535, "epoch": 1885} {"train_loss": -23.513940811157227, "global_step": 156536, "epoch": 1885} {"train_loss": -23.352117446531732, "global_step": 156537, "epoch": 1885, "val_loss": 6425916.0} {"train_loss": -23.03223419189453, "global_step": 156538, "epoch": 1886} {"train_loss": -23.031431198120117, "global_step": 156539, "epoch": 1886} {"train_loss": -23.252567291259766, "global_step": 156540, "epoch": 1886} {"train_loss": -23.0195369720459, "global_step": 156541, "epoch": 1886} {"train_loss": -23.023590087890625, "global_step": 156542, "epoch": 1886} {"train_loss": -23.311315536499023, "global_step": 156543, "epoch": 1886} {"train_loss": -22.968246459960938, "global_step": 156544, "epoch": 1886} {"train_loss": -23.175251007080078, "global_step": 156545, "epoch": 1886} {"train_loss": -23.09142303466797, "global_step": 156546, "epoch": 1886} {"train_loss": -22.974767684936523, "global_step": 156547, "epoch": 1886} {"train_loss": -23.327415466308594, "global_step": 156548, "epoch": 1886} {"train_loss": -23.27187156677246, "global_step": 156549, "epoch": 1886} {"train_loss": -23.360395431518555, "global_step": 156550, "epoch": 1886} {"train_loss": -23.563344955444336, "global_step": 156551, "epoch": 1886} {"train_loss": -23.535146713256836, "global_step": 156552, "epoch": 1886} {"train_loss": -23.140708923339844, "global_step": 156553, "epoch": 1886} {"train_loss": -22.769027709960938, "global_step": 156554, "epoch": 1886} {"train_loss": -23.429380416870117, "global_step": 156555, "epoch": 1886} {"train_loss": -23.210208892822266, "global_step": 156556, "epoch": 1886} {"train_loss": -23.202335357666016, "global_step": 156557, "epoch": 1886} {"train_loss": -23.384666442871094, "global_step": 156558, "epoch": 1886} {"train_loss": -23.34604835510254, "global_step": 156559, "epoch": 1886} {"train_loss": -23.326519012451172, "global_step": 156560, "epoch": 1886} {"train_loss": -23.45835304260254, "global_step": 156561, "epoch": 1886} {"train_loss": -23.205106735229492, "global_step": 156562, "epoch": 1886} {"train_loss": -23.777297973632812, "global_step": 156563, "epoch": 1886} {"train_loss": -23.33786392211914, "global_step": 156564, "epoch": 1886} {"train_loss": -23.269296646118164, "global_step": 156565, "epoch": 1886} {"train_loss": -23.20975112915039, "global_step": 156566, "epoch": 1886} {"train_loss": -23.551986694335938, "global_step": 156567, "epoch": 1886} {"train_loss": -23.18461799621582, "global_step": 156568, "epoch": 1886} {"train_loss": -23.389137268066406, "global_step": 156569, "epoch": 1886} {"train_loss": -23.418176651000977, "global_step": 156570, "epoch": 1886} {"train_loss": -23.022886276245117, "global_step": 156571, "epoch": 1886} {"train_loss": -23.39850425720215, "global_step": 156572, "epoch": 1886} {"train_loss": -23.785005569458008, "global_step": 156573, "epoch": 1886} {"train_loss": -23.348102569580078, "global_step": 156574, "epoch": 1886} {"train_loss": -23.4548282623291, "global_step": 156575, "epoch": 1886} {"train_loss": -23.569318771362305, "global_step": 156576, "epoch": 1886} {"train_loss": -23.35208511352539, "global_step": 156577, "epoch": 1886} {"train_loss": -23.743118286132812, "global_step": 156578, "epoch": 1886} {"train_loss": -23.402956008911133, "global_step": 156579, "epoch": 1886} {"train_loss": -23.842390060424805, "global_step": 156580, "epoch": 1886} {"train_loss": -23.67276954650879, "global_step": 156581, "epoch": 1886} {"train_loss": -23.591373443603516, "global_step": 156582, "epoch": 1886} {"train_loss": -23.450519561767578, "global_step": 156583, "epoch": 1886} {"train_loss": -23.096424102783203, "global_step": 156584, "epoch": 1886} {"train_loss": -23.43028450012207, "global_step": 156585, "epoch": 1886} {"train_loss": -23.380237579345703, "global_step": 156586, "epoch": 1886} {"train_loss": -23.673460006713867, "global_step": 156587, "epoch": 1886} {"train_loss": -23.604040145874023, "global_step": 156588, "epoch": 1886} {"train_loss": -23.546293258666992, "global_step": 156589, "epoch": 1886} {"train_loss": -23.495880126953125, "global_step": 156590, "epoch": 1886} {"train_loss": -23.684106826782227, "global_step": 156591, "epoch": 1886} {"train_loss": -23.597929000854492, "global_step": 156592, "epoch": 1886} {"train_loss": -23.489004135131836, "global_step": 156593, "epoch": 1886} {"train_loss": -23.723608016967773, "global_step": 156594, "epoch": 1886} {"train_loss": -23.303403854370117, "global_step": 156595, "epoch": 1886} {"train_loss": -23.502639770507812, "global_step": 156596, "epoch": 1886} {"train_loss": -23.244592666625977, "global_step": 156597, "epoch": 1886} {"train_loss": -23.5689754486084, "global_step": 156598, "epoch": 1886} {"train_loss": -23.616445541381836, "global_step": 156599, "epoch": 1886} {"train_loss": -23.26473045349121, "global_step": 156600, "epoch": 1886} {"train_loss": -23.1726016998291, "global_step": 156601, "epoch": 1886} {"train_loss": -23.73830795288086, "global_step": 156602, "epoch": 1886} {"train_loss": -23.58515739440918, "global_step": 156603, "epoch": 1886} {"train_loss": -23.583763122558594, "global_step": 156604, "epoch": 1886} {"train_loss": -23.877887725830078, "global_step": 156605, "epoch": 1886} {"train_loss": -23.819499969482422, "global_step": 156606, "epoch": 1886} {"train_loss": -23.352527618408203, "global_step": 156607, "epoch": 1886} {"train_loss": -23.49458885192871, "global_step": 156608, "epoch": 1886} {"train_loss": -23.22368812561035, "global_step": 156609, "epoch": 1886} {"train_loss": -23.02687644958496, "global_step": 156610, "epoch": 1886} {"train_loss": -23.559537887573242, "global_step": 156611, "epoch": 1886} {"train_loss": -23.686325073242188, "global_step": 156612, "epoch": 1886} {"train_loss": -23.036727905273438, "global_step": 156613, "epoch": 1886} {"train_loss": -23.594154357910156, "global_step": 156614, "epoch": 1886} {"train_loss": -23.649106979370117, "global_step": 156615, "epoch": 1886} {"train_loss": -23.19875717163086, "global_step": 156616, "epoch": 1886} {"train_loss": -23.065664291381836, "global_step": 156617, "epoch": 1886} {"train_loss": -23.28635025024414, "global_step": 156618, "epoch": 1886} {"train_loss": -23.339155197143555, "global_step": 156619, "epoch": 1886} {"train_loss": -23.38437735316265, "global_step": 156620, "epoch": 1886, "val_loss": 6342737.0} {"train_loss": -23.563383102416992, "global_step": 156621, "epoch": 1887} {"train_loss": -23.229633331298828, "global_step": 156622, "epoch": 1887} {"train_loss": -23.208005905151367, "global_step": 156623, "epoch": 1887} {"train_loss": -23.220924377441406, "global_step": 156624, "epoch": 1887} {"train_loss": -22.929758071899414, "global_step": 156625, "epoch": 1887} {"train_loss": -23.079906463623047, "global_step": 156626, "epoch": 1887} {"train_loss": -23.458663940429688, "global_step": 156627, "epoch": 1887} {"train_loss": -23.0648250579834, "global_step": 156628, "epoch": 1887} {"train_loss": -23.21608543395996, "global_step": 156629, "epoch": 1887} {"train_loss": -23.216463088989258, "global_step": 156630, "epoch": 1887} {"train_loss": -23.180618286132812, "global_step": 156631, "epoch": 1887} {"train_loss": -23.399930953979492, "global_step": 156632, "epoch": 1887} {"train_loss": -23.299530029296875, "global_step": 156633, "epoch": 1887} {"train_loss": -23.19647216796875, "global_step": 156634, "epoch": 1887} {"train_loss": -23.06201171875, "global_step": 156635, "epoch": 1887} {"train_loss": -23.62252426147461, "global_step": 156636, "epoch": 1887} {"train_loss": -23.653121948242188, "global_step": 156637, "epoch": 1887} {"train_loss": -23.24994468688965, "global_step": 156638, "epoch": 1887} {"train_loss": -23.158658981323242, "global_step": 156639, "epoch": 1887} {"train_loss": -23.27284812927246, "global_step": 156640, "epoch": 1887} {"train_loss": -23.37015151977539, "global_step": 156641, "epoch": 1887} {"train_loss": -23.76735496520996, "global_step": 156642, "epoch": 1887} {"train_loss": -23.245250701904297, "global_step": 156643, "epoch": 1887} {"train_loss": -23.218015670776367, "global_step": 156644, "epoch": 1887} {"train_loss": -23.237314224243164, "global_step": 156645, "epoch": 1887} {"train_loss": -23.257360458374023, "global_step": 156646, "epoch": 1887} {"train_loss": -23.60274314880371, "global_step": 156647, "epoch": 1887} {"train_loss": -23.451345443725586, "global_step": 156648, "epoch": 1887} {"train_loss": -23.631061553955078, "global_step": 156649, "epoch": 1887} {"train_loss": -23.602134704589844, "global_step": 156650, "epoch": 1887} {"train_loss": -23.168298721313477, "global_step": 156651, "epoch": 1887} {"train_loss": -23.022485733032227, "global_step": 156652, "epoch": 1887} {"train_loss": -22.869897842407227, "global_step": 156653, "epoch": 1887} {"train_loss": -23.52483558654785, "global_step": 156654, "epoch": 1887} {"train_loss": -23.299406051635742, "global_step": 156655, "epoch": 1887} {"train_loss": -23.521635055541992, "global_step": 156656, "epoch": 1887} {"train_loss": -23.553714752197266, "global_step": 156657, "epoch": 1887} {"train_loss": -23.41256332397461, "global_step": 156658, "epoch": 1887} {"train_loss": -23.24310302734375, "global_step": 156659, "epoch": 1887} {"train_loss": -23.71572494506836, "global_step": 156660, "epoch": 1887} {"train_loss": -23.501699447631836, "global_step": 156661, "epoch": 1887} {"train_loss": -23.407337188720703, "global_step": 156662, "epoch": 1887} {"train_loss": -23.91473960876465, "global_step": 156663, "epoch": 1887} {"train_loss": -23.605497360229492, "global_step": 156664, "epoch": 1887} {"train_loss": -23.740604400634766, "global_step": 156665, "epoch": 1887} {"train_loss": -23.339597702026367, "global_step": 156666, "epoch": 1887} {"train_loss": -23.443201065063477, "global_step": 156667, "epoch": 1887} {"train_loss": -23.653310775756836, "global_step": 156668, "epoch": 1887} {"train_loss": -23.05963897705078, "global_step": 156669, "epoch": 1887} {"train_loss": -23.02585220336914, "global_step": 156670, "epoch": 1887} {"train_loss": -23.579992294311523, "global_step": 156671, "epoch": 1887} {"train_loss": -23.506711959838867, "global_step": 156672, "epoch": 1887} {"train_loss": -23.617509841918945, "global_step": 156673, "epoch": 1887} {"train_loss": -23.356109619140625, "global_step": 156674, "epoch": 1887} {"train_loss": -23.638751983642578, "global_step": 156675, "epoch": 1887} {"train_loss": -23.512989044189453, "global_step": 156676, "epoch": 1887} {"train_loss": -22.996023178100586, "global_step": 156677, "epoch": 1887} {"train_loss": -23.351669311523438, "global_step": 156678, "epoch": 1887} {"train_loss": -23.180078506469727, "global_step": 156679, "epoch": 1887} {"train_loss": -23.234325408935547, "global_step": 156680, "epoch": 1887} {"train_loss": -23.01144027709961, "global_step": 156681, "epoch": 1887} {"train_loss": -23.557659149169922, "global_step": 156682, "epoch": 1887} {"train_loss": -23.340970993041992, "global_step": 156683, "epoch": 1887} {"train_loss": -24.073410034179688, "global_step": 156684, "epoch": 1887} {"train_loss": -23.71255874633789, "global_step": 156685, "epoch": 1887} {"train_loss": -23.675418853759766, "global_step": 156686, "epoch": 1887} {"train_loss": -23.818708419799805, "global_step": 156687, "epoch": 1887} {"train_loss": -23.73714256286621, "global_step": 156688, "epoch": 1887} {"train_loss": -23.455392837524414, "global_step": 156689, "epoch": 1887} {"train_loss": -23.626026153564453, "global_step": 156690, "epoch": 1887} {"train_loss": -23.59235954284668, "global_step": 156691, "epoch": 1887} {"train_loss": -23.26617431640625, "global_step": 156692, "epoch": 1887} {"train_loss": -23.191579818725586, "global_step": 156693, "epoch": 1887} {"train_loss": -23.472951889038086, "global_step": 156694, "epoch": 1887} {"train_loss": -23.696943283081055, "global_step": 156695, "epoch": 1887} {"train_loss": -23.499656677246094, "global_step": 156696, "epoch": 1887} {"train_loss": -23.406320571899414, "global_step": 156697, "epoch": 1887} {"train_loss": -23.506210327148438, "global_step": 156698, "epoch": 1887} {"train_loss": -23.77894401550293, "global_step": 156699, "epoch": 1887} {"train_loss": -23.467405319213867, "global_step": 156700, "epoch": 1887} {"train_loss": -23.305143356323242, "global_step": 156701, "epoch": 1887} {"train_loss": -23.543888092041016, "global_step": 156702, "epoch": 1887} {"train_loss": -23.415627950645355, "global_step": 156703, "epoch": 1887, "val_loss": 6197339.0} {"train_loss": -23.112943649291992, "global_step": 156704, "epoch": 1888} {"train_loss": -23.317174911499023, "global_step": 156705, "epoch": 1888} {"train_loss": -22.712766647338867, "global_step": 156706, "epoch": 1888} {"train_loss": -23.451454162597656, "global_step": 156707, "epoch": 1888} {"train_loss": -22.977863311767578, "global_step": 156708, "epoch": 1888} {"train_loss": -23.274505615234375, "global_step": 156709, "epoch": 1888} {"train_loss": -23.329755783081055, "global_step": 156710, "epoch": 1888} {"train_loss": -22.78399658203125, "global_step": 156711, "epoch": 1888} {"train_loss": -23.150165557861328, "global_step": 156712, "epoch": 1888} {"train_loss": -23.484891891479492, "global_step": 156713, "epoch": 1888} {"train_loss": -23.267906188964844, "global_step": 156714, "epoch": 1888} {"train_loss": -23.23780059814453, "global_step": 156715, "epoch": 1888} {"train_loss": -23.335691452026367, "global_step": 156716, "epoch": 1888} {"train_loss": -23.267282485961914, "global_step": 156717, "epoch": 1888} {"train_loss": -22.957231521606445, "global_step": 156718, "epoch": 1888} {"train_loss": -23.425809860229492, "global_step": 156719, "epoch": 1888} {"train_loss": -23.407560348510742, "global_step": 156720, "epoch": 1888} {"train_loss": -23.32721519470215, "global_step": 156721, "epoch": 1888} {"train_loss": -23.35774040222168, "global_step": 156722, "epoch": 1888} {"train_loss": -23.445676803588867, "global_step": 156723, "epoch": 1888} {"train_loss": -23.43462371826172, "global_step": 156724, "epoch": 1888} {"train_loss": -23.247438430786133, "global_step": 156725, "epoch": 1888} {"train_loss": -23.172937393188477, "global_step": 156726, "epoch": 1888} {"train_loss": -23.335391998291016, "global_step": 156727, "epoch": 1888} {"train_loss": -23.579248428344727, "global_step": 156728, "epoch": 1888} {"train_loss": -23.640796661376953, "global_step": 156729, "epoch": 1888} {"train_loss": -23.31459617614746, "global_step": 156730, "epoch": 1888} {"train_loss": -23.72272300720215, "global_step": 156731, "epoch": 1888} {"train_loss": -23.262914657592773, "global_step": 156732, "epoch": 1888} {"train_loss": -22.879011154174805, "global_step": 156733, "epoch": 1888} {"train_loss": -23.234439849853516, "global_step": 156734, "epoch": 1888} {"train_loss": -23.35446548461914, "global_step": 156735, "epoch": 1888} {"train_loss": -23.094730377197266, "global_step": 156736, "epoch": 1888} {"train_loss": -23.394468307495117, "global_step": 156737, "epoch": 1888} {"train_loss": -23.28339958190918, "global_step": 156738, "epoch": 1888} {"train_loss": -23.23177146911621, "global_step": 156739, "epoch": 1888} {"train_loss": -23.67681884765625, "global_step": 156740, "epoch": 1888} {"train_loss": -23.467573165893555, "global_step": 156741, "epoch": 1888} {"train_loss": -23.339393615722656, "global_step": 156742, "epoch": 1888} {"train_loss": -23.45281982421875, "global_step": 156743, "epoch": 1888} {"train_loss": -22.78712272644043, "global_step": 156744, "epoch": 1888} {"train_loss": -23.279678344726562, "global_step": 156745, "epoch": 1888} {"train_loss": -23.381744384765625, "global_step": 156746, "epoch": 1888} {"train_loss": -23.575284957885742, "global_step": 156747, "epoch": 1888} {"train_loss": -23.119306564331055, "global_step": 156748, "epoch": 1888} {"train_loss": -23.271705627441406, "global_step": 156749, "epoch": 1888} {"train_loss": -23.45218849182129, "global_step": 156750, "epoch": 1888} {"train_loss": -23.288421630859375, "global_step": 156751, "epoch": 1888} {"train_loss": -23.136484146118164, "global_step": 156752, "epoch": 1888} {"train_loss": -23.151201248168945, "global_step": 156753, "epoch": 1888} {"train_loss": -23.582944869995117, "global_step": 156754, "epoch": 1888} {"train_loss": -23.74507713317871, "global_step": 156755, "epoch": 1888} {"train_loss": -23.57357406616211, "global_step": 156756, "epoch": 1888} {"train_loss": -23.449825286865234, "global_step": 156757, "epoch": 1888} {"train_loss": -23.248687744140625, "global_step": 156758, "epoch": 1888} {"train_loss": -23.678388595581055, "global_step": 156759, "epoch": 1888} {"train_loss": -23.46135711669922, "global_step": 156760, "epoch": 1888} {"train_loss": -23.544946670532227, "global_step": 156761, "epoch": 1888} {"train_loss": -23.195234298706055, "global_step": 156762, "epoch": 1888} {"train_loss": -23.862266540527344, "global_step": 156763, "epoch": 1888} {"train_loss": -23.40229034423828, "global_step": 156764, "epoch": 1888} {"train_loss": -23.365848541259766, "global_step": 156765, "epoch": 1888} {"train_loss": -23.572092056274414, "global_step": 156766, "epoch": 1888} {"train_loss": -23.08076286315918, "global_step": 156767, "epoch": 1888} {"train_loss": -23.226064682006836, "global_step": 156768, "epoch": 1888} {"train_loss": -23.84821891784668, "global_step": 156769, "epoch": 1888} {"train_loss": -23.38164520263672, "global_step": 156770, "epoch": 1888} {"train_loss": -23.376333236694336, "global_step": 156771, "epoch": 1888} {"train_loss": -23.284305572509766, "global_step": 156772, "epoch": 1888} {"train_loss": -23.50398826599121, "global_step": 156773, "epoch": 1888} {"train_loss": -23.385557174682617, "global_step": 156774, "epoch": 1888} {"train_loss": -23.600440979003906, "global_step": 156775, "epoch": 1888} {"train_loss": -23.243717193603516, "global_step": 156776, "epoch": 1888} {"train_loss": -23.772422790527344, "global_step": 156777, "epoch": 1888} {"train_loss": -23.374120712280273, "global_step": 156778, "epoch": 1888} {"train_loss": -23.847562789916992, "global_step": 156779, "epoch": 1888} {"train_loss": -23.262603759765625, "global_step": 156780, "epoch": 1888} {"train_loss": -23.114225387573242, "global_step": 156781, "epoch": 1888} {"train_loss": -23.41779899597168, "global_step": 156782, "epoch": 1888} {"train_loss": -23.614118576049805, "global_step": 156783, "epoch": 1888} {"train_loss": -23.551036834716797, "global_step": 156784, "epoch": 1888} {"train_loss": -23.310745239257812, "global_step": 156785, "epoch": 1888} {"train_loss": -23.366533210478632, "global_step": 156786, "epoch": 1888, "val_loss": 6297607.0} {"train_loss": -22.640716552734375, "global_step": 156787, "epoch": 1889} {"train_loss": -22.87687873840332, "global_step": 156788, "epoch": 1889} {"train_loss": -22.212400436401367, "global_step": 156789, "epoch": 1889} {"train_loss": -22.510774612426758, "global_step": 156790, "epoch": 1889} {"train_loss": -22.728567123413086, "global_step": 156791, "epoch": 1889} {"train_loss": -22.89605712890625, "global_step": 156792, "epoch": 1889} {"train_loss": -22.537126541137695, "global_step": 156793, "epoch": 1889} {"train_loss": -22.81000518798828, "global_step": 156794, "epoch": 1889} {"train_loss": -22.626514434814453, "global_step": 156795, "epoch": 1889} {"train_loss": -23.000986099243164, "global_step": 156796, "epoch": 1889} {"train_loss": -22.51511001586914, "global_step": 156797, "epoch": 1889} {"train_loss": -23.45694351196289, "global_step": 156798, "epoch": 1889} {"train_loss": -22.65382194519043, "global_step": 156799, "epoch": 1889} {"train_loss": -22.776025772094727, "global_step": 156800, "epoch": 1889} {"train_loss": -23.00075340270996, "global_step": 156801, "epoch": 1889} {"train_loss": -22.90391731262207, "global_step": 156802, "epoch": 1889} {"train_loss": -23.06357765197754, "global_step": 156803, "epoch": 1889} {"train_loss": -23.019939422607422, "global_step": 156804, "epoch": 1889} {"train_loss": -23.236642837524414, "global_step": 156805, "epoch": 1889} {"train_loss": -23.221054077148438, "global_step": 156806, "epoch": 1889} {"train_loss": -23.318439483642578, "global_step": 156807, "epoch": 1889} {"train_loss": -22.743574142456055, "global_step": 156808, "epoch": 1889} {"train_loss": -23.564334869384766, "global_step": 156809, "epoch": 1889} {"train_loss": -23.20807456970215, "global_step": 156810, "epoch": 1889} {"train_loss": -23.2653751373291, "global_step": 156811, "epoch": 1889} {"train_loss": -23.409305572509766, "global_step": 156812, "epoch": 1889} {"train_loss": -23.41851234436035, "global_step": 156813, "epoch": 1889} {"train_loss": -23.048460006713867, "global_step": 156814, "epoch": 1889} {"train_loss": -23.444299697875977, "global_step": 156815, "epoch": 1889} {"train_loss": -23.344045639038086, "global_step": 156816, "epoch": 1889} {"train_loss": -23.26090431213379, "global_step": 156817, "epoch": 1889} {"train_loss": -23.00152587890625, "global_step": 156818, "epoch": 1889} {"train_loss": -23.585250854492188, "global_step": 156819, "epoch": 1889} {"train_loss": -23.07982063293457, "global_step": 156820, "epoch": 1889} {"train_loss": -23.606319427490234, "global_step": 156821, "epoch": 1889} {"train_loss": -23.128747940063477, "global_step": 156822, "epoch": 1889} {"train_loss": -23.49532127380371, "global_step": 156823, "epoch": 1889} {"train_loss": -23.224159240722656, "global_step": 156824, "epoch": 1889} {"train_loss": -23.53369140625, "global_step": 156825, "epoch": 1889} {"train_loss": -23.395658493041992, "global_step": 156826, "epoch": 1889} {"train_loss": -23.43903923034668, "global_step": 156827, "epoch": 1889} {"train_loss": -23.641206741333008, "global_step": 156828, "epoch": 1889} {"train_loss": -23.574071884155273, "global_step": 156829, "epoch": 1889} {"train_loss": -23.31308364868164, "global_step": 156830, "epoch": 1889} {"train_loss": -23.532894134521484, "global_step": 156831, "epoch": 1889} {"train_loss": -23.278810501098633, "global_step": 156832, "epoch": 1889} {"train_loss": -23.301748275756836, "global_step": 156833, "epoch": 1889} {"train_loss": -23.351919174194336, "global_step": 156834, "epoch": 1889} {"train_loss": -23.563766479492188, "global_step": 156835, "epoch": 1889} {"train_loss": -23.391061782836914, "global_step": 156836, "epoch": 1889} {"train_loss": -23.508115768432617, "global_step": 156837, "epoch": 1889} {"train_loss": -23.429948806762695, "global_step": 156838, "epoch": 1889} {"train_loss": -23.41172218322754, "global_step": 156839, "epoch": 1889} {"train_loss": -23.514745712280273, "global_step": 156840, "epoch": 1889} {"train_loss": -23.42840003967285, "global_step": 156841, "epoch": 1889} {"train_loss": -23.449739456176758, "global_step": 156842, "epoch": 1889} {"train_loss": -23.44854164123535, "global_step": 156843, "epoch": 1889} {"train_loss": -23.25287437438965, "global_step": 156844, "epoch": 1889} {"train_loss": -23.19866371154785, "global_step": 156845, "epoch": 1889} {"train_loss": -23.52003288269043, "global_step": 156846, "epoch": 1889} {"train_loss": -23.345487594604492, "global_step": 156847, "epoch": 1889} {"train_loss": -23.161630630493164, "global_step": 156848, "epoch": 1889} {"train_loss": -22.806859970092773, "global_step": 156849, "epoch": 1889} {"train_loss": -23.30836296081543, "global_step": 156850, "epoch": 1889} {"train_loss": -23.35758399963379, "global_step": 156851, "epoch": 1889} {"train_loss": -23.410324096679688, "global_step": 156852, "epoch": 1889} {"train_loss": -23.094484329223633, "global_step": 156853, "epoch": 1889} {"train_loss": -23.303504943847656, "global_step": 156854, "epoch": 1889} {"train_loss": -23.660017013549805, "global_step": 156855, "epoch": 1889} {"train_loss": -23.2674617767334, "global_step": 156856, "epoch": 1889} {"train_loss": -23.331754684448242, "global_step": 156857, "epoch": 1889} {"train_loss": -23.14037322998047, "global_step": 156858, "epoch": 1889} {"train_loss": -23.395862579345703, "global_step": 156859, "epoch": 1889} {"train_loss": -23.54804801940918, "global_step": 156860, "epoch": 1889} {"train_loss": -23.62452507019043, "global_step": 156861, "epoch": 1889} {"train_loss": -23.401153564453125, "global_step": 156862, "epoch": 1889} {"train_loss": -23.6957950592041, "global_step": 156863, "epoch": 1889} {"train_loss": -23.534391403198242, "global_step": 156864, "epoch": 1889} {"train_loss": -23.804258346557617, "global_step": 156865, "epoch": 1889} {"train_loss": -23.463071823120117, "global_step": 156866, "epoch": 1889} {"train_loss": -23.37822723388672, "global_step": 156867, "epoch": 1889} {"train_loss": -22.971250534057617, "global_step": 156868, "epoch": 1889} {"train_loss": -23.22854129377618, "global_step": 156869, "epoch": 1889, "val_loss": 6274240.0} {"train_loss": -23.414175033569336, "global_step": 156870, "epoch": 1890} {"train_loss": -23.206838607788086, "global_step": 156871, "epoch": 1890} {"train_loss": -22.854707717895508, "global_step": 156872, "epoch": 1890} {"train_loss": -23.36199951171875, "global_step": 156873, "epoch": 1890} {"train_loss": -23.345510482788086, "global_step": 156874, "epoch": 1890} {"train_loss": -23.45429801940918, "global_step": 156875, "epoch": 1890} {"train_loss": -22.964216232299805, "global_step": 156876, "epoch": 1890} {"train_loss": -23.210338592529297, "global_step": 156877, "epoch": 1890} {"train_loss": -23.46784210205078, "global_step": 156878, "epoch": 1890} {"train_loss": -23.418582916259766, "global_step": 156879, "epoch": 1890} {"train_loss": -23.3287410736084, "global_step": 156880, "epoch": 1890} {"train_loss": -23.268163681030273, "global_step": 156881, "epoch": 1890} {"train_loss": -23.19927978515625, "global_step": 156882, "epoch": 1890} {"train_loss": -23.749685287475586, "global_step": 156883, "epoch": 1890} {"train_loss": -23.206369400024414, "global_step": 156884, "epoch": 1890} {"train_loss": -23.200382232666016, "global_step": 156885, "epoch": 1890} {"train_loss": -23.154518127441406, "global_step": 156886, "epoch": 1890} {"train_loss": -23.417320251464844, "global_step": 156887, "epoch": 1890} {"train_loss": -23.304147720336914, "global_step": 156888, "epoch": 1890} {"train_loss": -23.26377296447754, "global_step": 156889, "epoch": 1890} {"train_loss": -23.403818130493164, "global_step": 156890, "epoch": 1890} {"train_loss": -23.175140380859375, "global_step": 156891, "epoch": 1890} {"train_loss": -23.353776931762695, "global_step": 156892, "epoch": 1890} {"train_loss": -23.421323776245117, "global_step": 156893, "epoch": 1890} {"train_loss": -23.61521339416504, "global_step": 156894, "epoch": 1890} {"train_loss": -23.63467025756836, "global_step": 156895, "epoch": 1890} {"train_loss": -23.204885482788086, "global_step": 156896, "epoch": 1890} {"train_loss": -23.410802841186523, "global_step": 156897, "epoch": 1890} {"train_loss": -23.62017250061035, "global_step": 156898, "epoch": 1890} {"train_loss": -23.255277633666992, "global_step": 156899, "epoch": 1890} {"train_loss": -23.576831817626953, "global_step": 156900, "epoch": 1890} {"train_loss": -23.392621994018555, "global_step": 156901, "epoch": 1890} {"train_loss": -23.398244857788086, "global_step": 156902, "epoch": 1890} {"train_loss": -23.176050186157227, "global_step": 156903, "epoch": 1890} {"train_loss": -23.408063888549805, "global_step": 156904, "epoch": 1890} {"train_loss": -23.055049896240234, "global_step": 156905, "epoch": 1890} {"train_loss": -23.627851486206055, "global_step": 156906, "epoch": 1890} {"train_loss": -23.586790084838867, "global_step": 156907, "epoch": 1890} {"train_loss": -23.68364906311035, "global_step": 156908, "epoch": 1890} {"train_loss": -23.358137130737305, "global_step": 156909, "epoch": 1890} {"train_loss": -23.463430404663086, "global_step": 156910, "epoch": 1890} {"train_loss": -23.66608428955078, "global_step": 156911, "epoch": 1890} {"train_loss": -23.266788482666016, "global_step": 156912, "epoch": 1890} {"train_loss": -23.655933380126953, "global_step": 156913, "epoch": 1890} {"train_loss": -23.398529052734375, "global_step": 156914, "epoch": 1890} {"train_loss": -23.262645721435547, "global_step": 156915, "epoch": 1890} {"train_loss": -23.83395767211914, "global_step": 156916, "epoch": 1890} {"train_loss": -23.620121002197266, "global_step": 156917, "epoch": 1890} {"train_loss": -23.60164451599121, "global_step": 156918, "epoch": 1890} {"train_loss": -23.57147216796875, "global_step": 156919, "epoch": 1890} {"train_loss": -22.961454391479492, "global_step": 156920, "epoch": 1890} {"train_loss": -23.483827590942383, "global_step": 156921, "epoch": 1890} {"train_loss": -23.63237953186035, "global_step": 156922, "epoch": 1890} {"train_loss": -23.37141990661621, "global_step": 156923, "epoch": 1890} {"train_loss": -23.85430335998535, "global_step": 156924, "epoch": 1890} {"train_loss": -23.485849380493164, "global_step": 156925, "epoch": 1890} {"train_loss": -23.602951049804688, "global_step": 156926, "epoch": 1890} {"train_loss": -23.15157127380371, "global_step": 156927, "epoch": 1890} {"train_loss": -23.291706085205078, "global_step": 156928, "epoch": 1890} {"train_loss": -23.15503692626953, "global_step": 156929, "epoch": 1890} {"train_loss": -23.617172241210938, "global_step": 156930, "epoch": 1890} {"train_loss": -23.380496978759766, "global_step": 156931, "epoch": 1890} {"train_loss": -23.142230987548828, "global_step": 156932, "epoch": 1890} {"train_loss": -23.016735076904297, "global_step": 156933, "epoch": 1890} {"train_loss": -22.982074737548828, "global_step": 156934, "epoch": 1890} {"train_loss": -23.524518966674805, "global_step": 156935, "epoch": 1890} {"train_loss": -23.587858200073242, "global_step": 156936, "epoch": 1890} {"train_loss": -22.96845054626465, "global_step": 156937, "epoch": 1890} {"train_loss": -23.157629013061523, "global_step": 156938, "epoch": 1890} {"train_loss": -23.21061134338379, "global_step": 156939, "epoch": 1890} {"train_loss": -23.177824020385742, "global_step": 156940, "epoch": 1890} {"train_loss": -23.312986373901367, "global_step": 156941, "epoch": 1890} {"train_loss": -23.376493453979492, "global_step": 156942, "epoch": 1890} {"train_loss": -23.615345001220703, "global_step": 156943, "epoch": 1890} {"train_loss": -23.61153793334961, "global_step": 156944, "epoch": 1890} {"train_loss": -23.937870025634766, "global_step": 156945, "epoch": 1890} {"train_loss": -23.45979118347168, "global_step": 156946, "epoch": 1890} {"train_loss": -23.678266525268555, "global_step": 156947, "epoch": 1890} {"train_loss": -23.105567932128906, "global_step": 156948, "epoch": 1890} {"train_loss": -23.18963050842285, "global_step": 156949, "epoch": 1890} {"train_loss": -23.235214233398438, "global_step": 156950, "epoch": 1890} {"train_loss": -23.3377628326416, "global_step": 156951, "epoch": 1890} {"train_loss": -23.37178597967309, "global_step": 156952, "epoch": 1890, "val_loss": 6452735.5} {"train_loss": -22.69546890258789, "global_step": 156953, "epoch": 1891} {"train_loss": -23.03688621520996, "global_step": 156954, "epoch": 1891} {"train_loss": -23.527494430541992, "global_step": 156955, "epoch": 1891} {"train_loss": -23.061389923095703, "global_step": 156956, "epoch": 1891} {"train_loss": -23.00057601928711, "global_step": 156957, "epoch": 1891} {"train_loss": -23.181711196899414, "global_step": 156958, "epoch": 1891} {"train_loss": -23.246274948120117, "global_step": 156959, "epoch": 1891} {"train_loss": -23.281055450439453, "global_step": 156960, "epoch": 1891} {"train_loss": -23.21369743347168, "global_step": 156961, "epoch": 1891} {"train_loss": -23.45755958557129, "global_step": 156962, "epoch": 1891} {"train_loss": -23.291397094726562, "global_step": 156963, "epoch": 1891} {"train_loss": -23.41045570373535, "global_step": 156964, "epoch": 1891} {"train_loss": -23.119413375854492, "global_step": 156965, "epoch": 1891} {"train_loss": -23.53894805908203, "global_step": 156966, "epoch": 1891} {"train_loss": -23.59882926940918, "global_step": 156967, "epoch": 1891} {"train_loss": -23.492643356323242, "global_step": 156968, "epoch": 1891} {"train_loss": -23.50372314453125, "global_step": 156969, "epoch": 1891} {"train_loss": -23.450082778930664, "global_step": 156970, "epoch": 1891} {"train_loss": -23.382709503173828, "global_step": 156971, "epoch": 1891} {"train_loss": -23.376615524291992, "global_step": 156972, "epoch": 1891} {"train_loss": -23.29163932800293, "global_step": 156973, "epoch": 1891} {"train_loss": -23.391393661499023, "global_step": 156974, "epoch": 1891} {"train_loss": -23.503637313842773, "global_step": 156975, "epoch": 1891} {"train_loss": -23.18206214904785, "global_step": 156976, "epoch": 1891} {"train_loss": -23.27168846130371, "global_step": 156977, "epoch": 1891} {"train_loss": -23.4948787689209, "global_step": 156978, "epoch": 1891} {"train_loss": -23.30782699584961, "global_step": 156979, "epoch": 1891} {"train_loss": -23.59383201599121, "global_step": 156980, "epoch": 1891} {"train_loss": -23.55954933166504, "global_step": 156981, "epoch": 1891} {"train_loss": -23.686384201049805, "global_step": 156982, "epoch": 1891} {"train_loss": -23.583585739135742, "global_step": 156983, "epoch": 1891} {"train_loss": -23.33544921875, "global_step": 156984, "epoch": 1891} {"train_loss": -23.510852813720703, "global_step": 156985, "epoch": 1891} {"train_loss": -23.711410522460938, "global_step": 156986, "epoch": 1891} {"train_loss": -23.47736167907715, "global_step": 156987, "epoch": 1891} {"train_loss": -23.212146759033203, "global_step": 156988, "epoch": 1891} {"train_loss": -23.374364852905273, "global_step": 156989, "epoch": 1891} {"train_loss": -23.456626892089844, "global_step": 156990, "epoch": 1891} {"train_loss": -23.15746307373047, "global_step": 156991, "epoch": 1891} {"train_loss": -23.14204216003418, "global_step": 156992, "epoch": 1891} {"train_loss": -23.52016258239746, "global_step": 156993, "epoch": 1891} {"train_loss": -23.4848690032959, "global_step": 156994, "epoch": 1891} {"train_loss": -23.2542781829834, "global_step": 156995, "epoch": 1891} {"train_loss": -23.59212303161621, "global_step": 156996, "epoch": 1891} {"train_loss": -23.598581314086914, "global_step": 156997, "epoch": 1891} {"train_loss": -23.35371208190918, "global_step": 156998, "epoch": 1891} {"train_loss": -23.286579132080078, "global_step": 156999, "epoch": 1891} {"train_loss": -23.62514305114746, "global_step": 157000, "epoch": 1891} {"train_loss": -23.322628021240234, "global_step": 157001, "epoch": 1891} {"train_loss": -23.60979652404785, "global_step": 157002, "epoch": 1891} {"train_loss": -23.63899040222168, "global_step": 157003, "epoch": 1891} {"train_loss": -23.428632736206055, "global_step": 157004, "epoch": 1891} {"train_loss": -23.300382614135742, "global_step": 157005, "epoch": 1891} {"train_loss": -23.349140167236328, "global_step": 157006, "epoch": 1891} {"train_loss": -23.49148941040039, "global_step": 157007, "epoch": 1891} {"train_loss": -23.20179557800293, "global_step": 157008, "epoch": 1891} {"train_loss": -23.56672477722168, "global_step": 157009, "epoch": 1891} {"train_loss": -23.451833724975586, "global_step": 157010, "epoch": 1891} {"train_loss": -23.26181411743164, "global_step": 157011, "epoch": 1891} {"train_loss": -23.347082138061523, "global_step": 157012, "epoch": 1891} {"train_loss": -23.8436279296875, "global_step": 157013, "epoch": 1891} {"train_loss": -23.402517318725586, "global_step": 157014, "epoch": 1891} {"train_loss": -23.544883728027344, "global_step": 157015, "epoch": 1891} {"train_loss": -23.74476432800293, "global_step": 157016, "epoch": 1891} {"train_loss": -23.58188247680664, "global_step": 157017, "epoch": 1891} {"train_loss": -23.313079833984375, "global_step": 157018, "epoch": 1891} {"train_loss": -23.213623046875, "global_step": 157019, "epoch": 1891} {"train_loss": -23.517271041870117, "global_step": 157020, "epoch": 1891} {"train_loss": -23.681655883789062, "global_step": 157021, "epoch": 1891} {"train_loss": -23.634008407592773, "global_step": 157022, "epoch": 1891} {"train_loss": -23.468463897705078, "global_step": 157023, "epoch": 1891} {"train_loss": -23.837261199951172, "global_step": 157024, "epoch": 1891} {"train_loss": -23.345529556274414, "global_step": 157025, "epoch": 1891} {"train_loss": -23.190765380859375, "global_step": 157026, "epoch": 1891} {"train_loss": -23.64471435546875, "global_step": 157027, "epoch": 1891} {"train_loss": -23.36488914489746, "global_step": 157028, "epoch": 1891} {"train_loss": -23.306177139282227, "global_step": 157029, "epoch": 1891} {"train_loss": -23.211301803588867, "global_step": 157030, "epoch": 1891} {"train_loss": -23.29561996459961, "global_step": 157031, "epoch": 1891} {"train_loss": -23.415847778320312, "global_step": 157032, "epoch": 1891} {"train_loss": -23.25985336303711, "global_step": 157033, "epoch": 1891} {"train_loss": -23.604740142822266, "global_step": 157034, "epoch": 1891} {"train_loss": -23.397898984242634, "global_step": 157035, "epoch": 1891, "val_loss": 6421189.0} {"train_loss": -22.45306968688965, "global_step": 157036, "epoch": 1892} {"train_loss": -21.80830192565918, "global_step": 157037, "epoch": 1892} {"train_loss": -21.371183395385742, "global_step": 157038, "epoch": 1892} {"train_loss": -22.68743133544922, "global_step": 157039, "epoch": 1892} {"train_loss": -22.735538482666016, "global_step": 157040, "epoch": 1892} {"train_loss": -22.127103805541992, "global_step": 157041, "epoch": 1892} {"train_loss": -22.760955810546875, "global_step": 157042, "epoch": 1892} {"train_loss": -22.57106590270996, "global_step": 157043, "epoch": 1892} {"train_loss": -23.146020889282227, "global_step": 157044, "epoch": 1892} {"train_loss": -22.680068969726562, "global_step": 157045, "epoch": 1892} {"train_loss": -22.871686935424805, "global_step": 157046, "epoch": 1892} {"train_loss": -22.69621467590332, "global_step": 157047, "epoch": 1892} {"train_loss": -22.885852813720703, "global_step": 157048, "epoch": 1892} {"train_loss": -22.668100357055664, "global_step": 157049, "epoch": 1892} {"train_loss": -23.21225929260254, "global_step": 157050, "epoch": 1892} {"train_loss": -22.948978424072266, "global_step": 157051, "epoch": 1892} {"train_loss": -22.94232749938965, "global_step": 157052, "epoch": 1892} {"train_loss": -23.057071685791016, "global_step": 157053, "epoch": 1892} {"train_loss": -22.843238830566406, "global_step": 157054, "epoch": 1892} {"train_loss": -23.137292861938477, "global_step": 157055, "epoch": 1892} {"train_loss": -23.35691261291504, "global_step": 157056, "epoch": 1892} {"train_loss": -23.048200607299805, "global_step": 157057, "epoch": 1892} {"train_loss": -23.6153507232666, "global_step": 157058, "epoch": 1892} {"train_loss": -22.837858200073242, "global_step": 157059, "epoch": 1892} {"train_loss": -23.08320426940918, "global_step": 157060, "epoch": 1892} {"train_loss": -23.123640060424805, "global_step": 157061, "epoch": 1892} {"train_loss": -23.115432739257812, "global_step": 157062, "epoch": 1892} {"train_loss": -23.36693000793457, "global_step": 157063, "epoch": 1892} {"train_loss": -23.20781898498535, "global_step": 157064, "epoch": 1892} {"train_loss": -23.210269927978516, "global_step": 157065, "epoch": 1892} {"train_loss": -23.277170181274414, "global_step": 157066, "epoch": 1892} {"train_loss": -23.5018253326416, "global_step": 157067, "epoch": 1892} {"train_loss": -23.396703720092773, "global_step": 157068, "epoch": 1892} {"train_loss": -23.25691795349121, "global_step": 157069, "epoch": 1892} {"train_loss": -23.42336082458496, "global_step": 157070, "epoch": 1892} {"train_loss": -23.39219856262207, "global_step": 157071, "epoch": 1892} {"train_loss": -23.57695960998535, "global_step": 157072, "epoch": 1892} {"train_loss": -23.476682662963867, "global_step": 157073, "epoch": 1892} {"train_loss": -23.25200653076172, "global_step": 157074, "epoch": 1892} {"train_loss": -23.448041915893555, "global_step": 157075, "epoch": 1892} {"train_loss": -23.59016990661621, "global_step": 157076, "epoch": 1892} {"train_loss": -23.40546989440918, "global_step": 157077, "epoch": 1892} {"train_loss": -23.413002014160156, "global_step": 157078, "epoch": 1892} {"train_loss": -23.854137420654297, "global_step": 157079, "epoch": 1892} {"train_loss": -23.5150146484375, "global_step": 157080, "epoch": 1892} {"train_loss": -23.695032119750977, "global_step": 157081, "epoch": 1892} {"train_loss": -23.534473419189453, "global_step": 157082, "epoch": 1892} {"train_loss": -23.23421287536621, "global_step": 157083, "epoch": 1892} {"train_loss": -23.66473960876465, "global_step": 157084, "epoch": 1892} {"train_loss": -23.048521041870117, "global_step": 157085, "epoch": 1892} {"train_loss": -22.83864402770996, "global_step": 157086, "epoch": 1892} {"train_loss": -23.57339859008789, "global_step": 157087, "epoch": 1892} {"train_loss": -22.895856857299805, "global_step": 157088, "epoch": 1892} {"train_loss": -22.82688331604004, "global_step": 157089, "epoch": 1892} {"train_loss": -23.189029693603516, "global_step": 157090, "epoch": 1892} {"train_loss": -23.43242645263672, "global_step": 157091, "epoch": 1892} {"train_loss": -23.70584487915039, "global_step": 157092, "epoch": 1892} {"train_loss": -23.010345458984375, "global_step": 157093, "epoch": 1892} {"train_loss": -23.322965621948242, "global_step": 157094, "epoch": 1892} {"train_loss": -23.412353515625, "global_step": 157095, "epoch": 1892} {"train_loss": -23.30255699157715, "global_step": 157096, "epoch": 1892} {"train_loss": -23.65616226196289, "global_step": 157097, "epoch": 1892} {"train_loss": -23.540592193603516, "global_step": 157098, "epoch": 1892} {"train_loss": -23.18497657775879, "global_step": 157099, "epoch": 1892} {"train_loss": -24.020660400390625, "global_step": 157100, "epoch": 1892} {"train_loss": -23.40889549255371, "global_step": 157101, "epoch": 1892} {"train_loss": -23.396568298339844, "global_step": 157102, "epoch": 1892} {"train_loss": -23.447080612182617, "global_step": 157103, "epoch": 1892} {"train_loss": -23.223936080932617, "global_step": 157104, "epoch": 1892} {"train_loss": -23.853818893432617, "global_step": 157105, "epoch": 1892} {"train_loss": -23.53702163696289, "global_step": 157106, "epoch": 1892} {"train_loss": -23.51643943786621, "global_step": 157107, "epoch": 1892} {"train_loss": -23.619943618774414, "global_step": 157108, "epoch": 1892} {"train_loss": -23.535186767578125, "global_step": 157109, "epoch": 1892} {"train_loss": -23.289697647094727, "global_step": 157110, "epoch": 1892} {"train_loss": -23.517370223999023, "global_step": 157111, "epoch": 1892} {"train_loss": -23.511962890625, "global_step": 157112, "epoch": 1892} {"train_loss": -23.465423583984375, "global_step": 157113, "epoch": 1892} {"train_loss": -23.638525009155273, "global_step": 157114, "epoch": 1892} {"train_loss": -23.88751792907715, "global_step": 157115, "epoch": 1892} {"train_loss": -23.509958267211914, "global_step": 157116, "epoch": 1892} {"train_loss": -23.474407196044922, "global_step": 157117, "epoch": 1892} {"train_loss": -23.235661012580596, "global_step": 157118, "epoch": 1892, "val_loss": 6429011.0} {"train_loss": -23.374990463256836, "global_step": 157119, "epoch": 1893} {"train_loss": -23.42090606689453, "global_step": 157120, "epoch": 1893} {"train_loss": -23.068090438842773, "global_step": 157121, "epoch": 1893} {"train_loss": -23.11109733581543, "global_step": 157122, "epoch": 1893} {"train_loss": -23.10210418701172, "global_step": 157123, "epoch": 1893} {"train_loss": -23.630388259887695, "global_step": 157124, "epoch": 1893} {"train_loss": -23.349477767944336, "global_step": 157125, "epoch": 1893} {"train_loss": -23.700098037719727, "global_step": 157126, "epoch": 1893} {"train_loss": -22.777414321899414, "global_step": 157127, "epoch": 1893} {"train_loss": -23.069805145263672, "global_step": 157128, "epoch": 1893} {"train_loss": -23.363317489624023, "global_step": 157129, "epoch": 1893} {"train_loss": -23.533405303955078, "global_step": 157130, "epoch": 1893} {"train_loss": -23.23381805419922, "global_step": 157131, "epoch": 1893} {"train_loss": -23.059125900268555, "global_step": 157132, "epoch": 1893} {"train_loss": -23.052034378051758, "global_step": 157133, "epoch": 1893} {"train_loss": -23.435791015625, "global_step": 157134, "epoch": 1893} {"train_loss": -23.553054809570312, "global_step": 157135, "epoch": 1893} {"train_loss": -23.43671989440918, "global_step": 157136, "epoch": 1893} {"train_loss": -23.18875503540039, "global_step": 157137, "epoch": 1893} {"train_loss": -23.758115768432617, "global_step": 157138, "epoch": 1893} {"train_loss": -23.391738891601562, "global_step": 157139, "epoch": 1893} {"train_loss": -23.447036743164062, "global_step": 157140, "epoch": 1893} {"train_loss": -23.577043533325195, "global_step": 157141, "epoch": 1893} {"train_loss": -23.330459594726562, "global_step": 157142, "epoch": 1893} {"train_loss": -23.70911979675293, "global_step": 157143, "epoch": 1893} {"train_loss": -23.777509689331055, "global_step": 157144, "epoch": 1893} {"train_loss": -23.147846221923828, "global_step": 157145, "epoch": 1893} {"train_loss": -23.915630340576172, "global_step": 157146, "epoch": 1893} {"train_loss": -23.952661514282227, "global_step": 157147, "epoch": 1893} {"train_loss": -23.696027755737305, "global_step": 157148, "epoch": 1893} {"train_loss": -23.38422966003418, "global_step": 157149, "epoch": 1893} {"train_loss": -23.64875602722168, "global_step": 157150, "epoch": 1893} {"train_loss": -23.5357666015625, "global_step": 157151, "epoch": 1893} {"train_loss": -23.398006439208984, "global_step": 157152, "epoch": 1893} {"train_loss": -23.567380905151367, "global_step": 157153, "epoch": 1893} {"train_loss": -23.52495765686035, "global_step": 157154, "epoch": 1893} {"train_loss": -23.288684844970703, "global_step": 157155, "epoch": 1893} {"train_loss": -23.715904235839844, "global_step": 157156, "epoch": 1893} {"train_loss": -23.897090911865234, "global_step": 157157, "epoch": 1893} {"train_loss": -23.586288452148438, "global_step": 157158, "epoch": 1893} {"train_loss": -23.452482223510742, "global_step": 157159, "epoch": 1893} {"train_loss": -23.318578720092773, "global_step": 157160, "epoch": 1893} {"train_loss": -23.391925811767578, "global_step": 157161, "epoch": 1893} {"train_loss": -23.243968963623047, "global_step": 157162, "epoch": 1893} {"train_loss": -23.536849975585938, "global_step": 157163, "epoch": 1893} {"train_loss": -23.210922241210938, "global_step": 157164, "epoch": 1893} {"train_loss": -23.123123168945312, "global_step": 157165, "epoch": 1893} {"train_loss": -23.433305740356445, "global_step": 157166, "epoch": 1893} {"train_loss": -22.84518814086914, "global_step": 157167, "epoch": 1893} {"train_loss": -23.556171417236328, "global_step": 157168, "epoch": 1893} {"train_loss": -23.186079025268555, "global_step": 157169, "epoch": 1893} {"train_loss": -23.041706085205078, "global_step": 157170, "epoch": 1893} {"train_loss": -23.117979049682617, "global_step": 157171, "epoch": 1893} {"train_loss": -23.21834945678711, "global_step": 157172, "epoch": 1893} {"train_loss": -23.15846061706543, "global_step": 157173, "epoch": 1893} {"train_loss": -23.207630157470703, "global_step": 157174, "epoch": 1893} {"train_loss": -23.48182487487793, "global_step": 157175, "epoch": 1893} {"train_loss": -23.346097946166992, "global_step": 157176, "epoch": 1893} {"train_loss": -23.006122589111328, "global_step": 157177, "epoch": 1893} {"train_loss": -23.524503707885742, "global_step": 157178, "epoch": 1893} {"train_loss": -23.226770401000977, "global_step": 157179, "epoch": 1893} {"train_loss": -23.31009292602539, "global_step": 157180, "epoch": 1893} {"train_loss": -23.114307403564453, "global_step": 157181, "epoch": 1893} {"train_loss": -23.369720458984375, "global_step": 157182, "epoch": 1893} {"train_loss": -23.283960342407227, "global_step": 157183, "epoch": 1893} {"train_loss": -23.375537872314453, "global_step": 157184, "epoch": 1893} {"train_loss": -23.539600372314453, "global_step": 157185, "epoch": 1893} {"train_loss": -23.467710494995117, "global_step": 157186, "epoch": 1893} {"train_loss": -23.10710906982422, "global_step": 157187, "epoch": 1893} {"train_loss": -23.45037078857422, "global_step": 157188, "epoch": 1893} {"train_loss": -23.48101234436035, "global_step": 157189, "epoch": 1893} {"train_loss": -23.484941482543945, "global_step": 157190, "epoch": 1893} {"train_loss": -23.38569450378418, "global_step": 157191, "epoch": 1893} {"train_loss": -23.22623062133789, "global_step": 157192, "epoch": 1893} {"train_loss": -23.396520614624023, "global_step": 157193, "epoch": 1893} {"train_loss": -23.5667667388916, "global_step": 157194, "epoch": 1893} {"train_loss": -23.35450553894043, "global_step": 157195, "epoch": 1893} {"train_loss": -23.273603439331055, "global_step": 157196, "epoch": 1893} {"train_loss": -23.638696670532227, "global_step": 157197, "epoch": 1893} {"train_loss": -23.777647018432617, "global_step": 157198, "epoch": 1893} {"train_loss": -23.426145553588867, "global_step": 157199, "epoch": 1893} {"train_loss": -23.4251708984375, "global_step": 157200, "epoch": 1893} {"train_loss": -23.401533517492823, "global_step": 157201, "epoch": 1893, "val_loss": 6394432.0} {"train_loss": -22.45210838317871, "global_step": 157202, "epoch": 1894} {"train_loss": -22.192928314208984, "global_step": 157203, "epoch": 1894} {"train_loss": -23.304454803466797, "global_step": 157204, "epoch": 1894} {"train_loss": -23.145751953125, "global_step": 157205, "epoch": 1894} {"train_loss": -23.02010726928711, "global_step": 157206, "epoch": 1894} {"train_loss": -23.146533966064453, "global_step": 157207, "epoch": 1894} {"train_loss": -22.998502731323242, "global_step": 157208, "epoch": 1894} {"train_loss": -22.965791702270508, "global_step": 157209, "epoch": 1894} {"train_loss": -22.673696517944336, "global_step": 157210, "epoch": 1894} {"train_loss": -23.057941436767578, "global_step": 157211, "epoch": 1894} {"train_loss": -22.805776596069336, "global_step": 157212, "epoch": 1894} {"train_loss": -23.12771987915039, "global_step": 157213, "epoch": 1894} {"train_loss": -23.089401245117188, "global_step": 157214, "epoch": 1894} {"train_loss": -22.99742317199707, "global_step": 157215, "epoch": 1894} {"train_loss": -23.287622451782227, "global_step": 157216, "epoch": 1894} {"train_loss": -22.92038917541504, "global_step": 157217, "epoch": 1894} {"train_loss": -23.14451026916504, "global_step": 157218, "epoch": 1894} {"train_loss": -23.46380043029785, "global_step": 157219, "epoch": 1894} {"train_loss": -23.175539016723633, "global_step": 157220, "epoch": 1894} {"train_loss": -22.998451232910156, "global_step": 157221, "epoch": 1894} {"train_loss": -23.38720703125, "global_step": 157222, "epoch": 1894} {"train_loss": -23.016176223754883, "global_step": 157223, "epoch": 1894} {"train_loss": -23.44366455078125, "global_step": 157224, "epoch": 1894} {"train_loss": -23.0793514251709, "global_step": 157225, "epoch": 1894} {"train_loss": -23.102935791015625, "global_step": 157226, "epoch": 1894} {"train_loss": -23.124298095703125, "global_step": 157227, "epoch": 1894} {"train_loss": -23.29422378540039, "global_step": 157228, "epoch": 1894} {"train_loss": -23.956640243530273, "global_step": 157229, "epoch": 1894} {"train_loss": -23.23865509033203, "global_step": 157230, "epoch": 1894} {"train_loss": -23.238195419311523, "global_step": 157231, "epoch": 1894} {"train_loss": -22.956960678100586, "global_step": 157232, "epoch": 1894} {"train_loss": -23.490234375, "global_step": 157233, "epoch": 1894} {"train_loss": -23.63084602355957, "global_step": 157234, "epoch": 1894} {"train_loss": -23.358352661132812, "global_step": 157235, "epoch": 1894} {"train_loss": -23.497724533081055, "global_step": 157236, "epoch": 1894} {"train_loss": -23.35570526123047, "global_step": 157237, "epoch": 1894} {"train_loss": -23.396177291870117, "global_step": 157238, "epoch": 1894} {"train_loss": -23.526411056518555, "global_step": 157239, "epoch": 1894} {"train_loss": -23.580656051635742, "global_step": 157240, "epoch": 1894} {"train_loss": -23.615976333618164, "global_step": 157241, "epoch": 1894} {"train_loss": -23.47004508972168, "global_step": 157242, "epoch": 1894} {"train_loss": -23.747533798217773, "global_step": 157243, "epoch": 1894} {"train_loss": -23.425445556640625, "global_step": 157244, "epoch": 1894} {"train_loss": -23.278141021728516, "global_step": 157245, "epoch": 1894} {"train_loss": -23.64328384399414, "global_step": 157246, "epoch": 1894} {"train_loss": -23.545164108276367, "global_step": 157247, "epoch": 1894} {"train_loss": -23.546655654907227, "global_step": 157248, "epoch": 1894} {"train_loss": -23.30365562438965, "global_step": 157249, "epoch": 1894} {"train_loss": -23.66047477722168, "global_step": 157250, "epoch": 1894} {"train_loss": -23.565963745117188, "global_step": 157251, "epoch": 1894} {"train_loss": -23.9003963470459, "global_step": 157252, "epoch": 1894} {"train_loss": -23.7266788482666, "global_step": 157253, "epoch": 1894} {"train_loss": -23.825117111206055, "global_step": 157254, "epoch": 1894} {"train_loss": -23.453903198242188, "global_step": 157255, "epoch": 1894} {"train_loss": -23.752300262451172, "global_step": 157256, "epoch": 1894} {"train_loss": -23.3237247467041, "global_step": 157257, "epoch": 1894} {"train_loss": -23.269866943359375, "global_step": 157258, "epoch": 1894} {"train_loss": -22.917118072509766, "global_step": 157259, "epoch": 1894} {"train_loss": -23.09793472290039, "global_step": 157260, "epoch": 1894} {"train_loss": -23.35683250427246, "global_step": 157261, "epoch": 1894} {"train_loss": -23.662988662719727, "global_step": 157262, "epoch": 1894} {"train_loss": -23.267419815063477, "global_step": 157263, "epoch": 1894} {"train_loss": -23.537019729614258, "global_step": 157264, "epoch": 1894} {"train_loss": -23.47171974182129, "global_step": 157265, "epoch": 1894} {"train_loss": -23.392553329467773, "global_step": 157266, "epoch": 1894} {"train_loss": -23.361576080322266, "global_step": 157267, "epoch": 1894} {"train_loss": -23.727941513061523, "global_step": 157268, "epoch": 1894} {"train_loss": -23.585622787475586, "global_step": 157269, "epoch": 1894} {"train_loss": -23.594730377197266, "global_step": 157270, "epoch": 1894} {"train_loss": -23.463394165039062, "global_step": 157271, "epoch": 1894} {"train_loss": -23.30465316772461, "global_step": 157272, "epoch": 1894} {"train_loss": -23.615970611572266, "global_step": 157273, "epoch": 1894} {"train_loss": -23.075702667236328, "global_step": 157274, "epoch": 1894} {"train_loss": -23.149921417236328, "global_step": 157275, "epoch": 1894} {"train_loss": -23.342599868774414, "global_step": 157276, "epoch": 1894} {"train_loss": -23.576364517211914, "global_step": 157277, "epoch": 1894} {"train_loss": -23.453540802001953, "global_step": 157278, "epoch": 1894} {"train_loss": -23.837514877319336, "global_step": 157279, "epoch": 1894} {"train_loss": -23.76529312133789, "global_step": 157280, "epoch": 1894} {"train_loss": -23.740076065063477, "global_step": 157281, "epoch": 1894} {"train_loss": -23.5899658203125, "global_step": 157282, "epoch": 1894} {"train_loss": -23.285137176513672, "global_step": 157283, "epoch": 1894} {"train_loss": -23.355708455464924, "global_step": 157284, "epoch": 1894, "val_loss": 6384924.0} {"train_loss": -23.16700553894043, "global_step": 157285, "epoch": 1895} {"train_loss": -23.41523551940918, "global_step": 157286, "epoch": 1895} {"train_loss": -23.11067771911621, "global_step": 157287, "epoch": 1895} {"train_loss": -23.123388290405273, "global_step": 157288, "epoch": 1895} {"train_loss": -23.118911743164062, "global_step": 157289, "epoch": 1895} {"train_loss": -23.303529739379883, "global_step": 157290, "epoch": 1895} {"train_loss": -23.11962890625, "global_step": 157291, "epoch": 1895} {"train_loss": -22.909793853759766, "global_step": 157292, "epoch": 1895} {"train_loss": -23.39853286743164, "global_step": 157293, "epoch": 1895} {"train_loss": -23.604904174804688, "global_step": 157294, "epoch": 1895} {"train_loss": -23.351383209228516, "global_step": 157295, "epoch": 1895} {"train_loss": -23.0208683013916, "global_step": 157296, "epoch": 1895} {"train_loss": -23.36191177368164, "global_step": 157297, "epoch": 1895} {"train_loss": -23.280864715576172, "global_step": 157298, "epoch": 1895} {"train_loss": -23.287656784057617, "global_step": 157299, "epoch": 1895} {"train_loss": -23.201684951782227, "global_step": 157300, "epoch": 1895} {"train_loss": -23.370071411132812, "global_step": 157301, "epoch": 1895} {"train_loss": -23.06960678100586, "global_step": 157302, "epoch": 1895} {"train_loss": -23.016876220703125, "global_step": 157303, "epoch": 1895} {"train_loss": -23.0989933013916, "global_step": 157304, "epoch": 1895} {"train_loss": -23.08351707458496, "global_step": 157305, "epoch": 1895} {"train_loss": -23.338300704956055, "global_step": 157306, "epoch": 1895} {"train_loss": -23.351991653442383, "global_step": 157307, "epoch": 1895} {"train_loss": -23.18117904663086, "global_step": 157308, "epoch": 1895} {"train_loss": -23.37587547302246, "global_step": 157309, "epoch": 1895} {"train_loss": -23.17047119140625, "global_step": 157310, "epoch": 1895} {"train_loss": -23.44849967956543, "global_step": 157311, "epoch": 1895} {"train_loss": -23.260229110717773, "global_step": 157312, "epoch": 1895} {"train_loss": -23.5831298828125, "global_step": 157313, "epoch": 1895} {"train_loss": -23.600820541381836, "global_step": 157314, "epoch": 1895} {"train_loss": -23.472158432006836, "global_step": 157315, "epoch": 1895} {"train_loss": -23.26482391357422, "global_step": 157316, "epoch": 1895} {"train_loss": -23.3138484954834, "global_step": 157317, "epoch": 1895} {"train_loss": -23.279539108276367, "global_step": 157318, "epoch": 1895} {"train_loss": -23.52100944519043, "global_step": 157319, "epoch": 1895} {"train_loss": -23.666975021362305, "global_step": 157320, "epoch": 1895} {"train_loss": -23.095857620239258, "global_step": 157321, "epoch": 1895} {"train_loss": -23.405813217163086, "global_step": 157322, "epoch": 1895} {"train_loss": -23.010150909423828, "global_step": 157323, "epoch": 1895} {"train_loss": -23.074533462524414, "global_step": 157324, "epoch": 1895} {"train_loss": -23.546070098876953, "global_step": 157325, "epoch": 1895} {"train_loss": -23.26527976989746, "global_step": 157326, "epoch": 1895} {"train_loss": -23.18523597717285, "global_step": 157327, "epoch": 1895} {"train_loss": -23.199918746948242, "global_step": 157328, "epoch": 1895} {"train_loss": -23.692907333374023, "global_step": 157329, "epoch": 1895} {"train_loss": -23.373117446899414, "global_step": 157330, "epoch": 1895} {"train_loss": -23.647323608398438, "global_step": 157331, "epoch": 1895} {"train_loss": -23.631019592285156, "global_step": 157332, "epoch": 1895} {"train_loss": -23.330036163330078, "global_step": 157333, "epoch": 1895} {"train_loss": -23.41166877746582, "global_step": 157334, "epoch": 1895} {"train_loss": -23.30796241760254, "global_step": 157335, "epoch": 1895} {"train_loss": -23.407285690307617, "global_step": 157336, "epoch": 1895} {"train_loss": -23.33685874938965, "global_step": 157337, "epoch": 1895} {"train_loss": -23.36263656616211, "global_step": 157338, "epoch": 1895} {"train_loss": -23.016830444335938, "global_step": 157339, "epoch": 1895} {"train_loss": -23.26852035522461, "global_step": 157340, "epoch": 1895} {"train_loss": -23.38572120666504, "global_step": 157341, "epoch": 1895} {"train_loss": -23.689420700073242, "global_step": 157342, "epoch": 1895} {"train_loss": -23.58853530883789, "global_step": 157343, "epoch": 1895} {"train_loss": -23.39691734313965, "global_step": 157344, "epoch": 1895} {"train_loss": -23.44301414489746, "global_step": 157345, "epoch": 1895} {"train_loss": -23.630355834960938, "global_step": 157346, "epoch": 1895} {"train_loss": -23.33976173400879, "global_step": 157347, "epoch": 1895} {"train_loss": -23.125654220581055, "global_step": 157348, "epoch": 1895} {"train_loss": -23.545928955078125, "global_step": 157349, "epoch": 1895} {"train_loss": -23.586877822875977, "global_step": 157350, "epoch": 1895} {"train_loss": -23.481731414794922, "global_step": 157351, "epoch": 1895} {"train_loss": -23.583206176757812, "global_step": 157352, "epoch": 1895} {"train_loss": -23.478984832763672, "global_step": 157353, "epoch": 1895} {"train_loss": -23.8073787689209, "global_step": 157354, "epoch": 1895} {"train_loss": -23.24615478515625, "global_step": 157355, "epoch": 1895} {"train_loss": -23.746152877807617, "global_step": 157356, "epoch": 1895} {"train_loss": -23.724233627319336, "global_step": 157357, "epoch": 1895} {"train_loss": -23.1802921295166, "global_step": 157358, "epoch": 1895} {"train_loss": -23.412057876586914, "global_step": 157359, "epoch": 1895} {"train_loss": -23.157581329345703, "global_step": 157360, "epoch": 1895} {"train_loss": -23.205307006835938, "global_step": 157361, "epoch": 1895} {"train_loss": -23.46915626525879, "global_step": 157362, "epoch": 1895} {"train_loss": -23.376890182495117, "global_step": 157363, "epoch": 1895} {"train_loss": -23.482938766479492, "global_step": 157364, "epoch": 1895} {"train_loss": -23.52983283996582, "global_step": 157365, "epoch": 1895} {"train_loss": -23.860702514648438, "global_step": 157366, "epoch": 1895} {"train_loss": -23.353448017534003, "global_step": 157367, "epoch": 1895, "val_loss": 6306563.0} {"train_loss": -23.35297966003418, "global_step": 157368, "epoch": 1896} {"train_loss": -22.746170043945312, "global_step": 157369, "epoch": 1896} {"train_loss": -23.218130111694336, "global_step": 157370, "epoch": 1896} {"train_loss": -23.0828800201416, "global_step": 157371, "epoch": 1896} {"train_loss": -22.8990535736084, "global_step": 157372, "epoch": 1896} {"train_loss": -23.0546932220459, "global_step": 157373, "epoch": 1896} {"train_loss": -23.05557632446289, "global_step": 157374, "epoch": 1896} {"train_loss": -23.249549865722656, "global_step": 157375, "epoch": 1896} {"train_loss": -23.025678634643555, "global_step": 157376, "epoch": 1896} {"train_loss": -23.504301071166992, "global_step": 157377, "epoch": 1896} {"train_loss": -23.316818237304688, "global_step": 157378, "epoch": 1896} {"train_loss": -23.187055587768555, "global_step": 157379, "epoch": 1896} {"train_loss": -23.215303421020508, "global_step": 157380, "epoch": 1896} {"train_loss": -23.265235900878906, "global_step": 157381, "epoch": 1896} {"train_loss": -23.123876571655273, "global_step": 157382, "epoch": 1896} {"train_loss": -23.182174682617188, "global_step": 157383, "epoch": 1896} {"train_loss": -23.74203872680664, "global_step": 157384, "epoch": 1896} {"train_loss": -23.463829040527344, "global_step": 157385, "epoch": 1896} {"train_loss": -23.380048751831055, "global_step": 157386, "epoch": 1896} {"train_loss": -23.265249252319336, "global_step": 157387, "epoch": 1896} {"train_loss": -23.518701553344727, "global_step": 157388, "epoch": 1896} {"train_loss": -23.539684295654297, "global_step": 157389, "epoch": 1896} {"train_loss": -23.29866600036621, "global_step": 157390, "epoch": 1896} {"train_loss": -23.211462020874023, "global_step": 157391, "epoch": 1896} {"train_loss": -23.950529098510742, "global_step": 157392, "epoch": 1896} {"train_loss": -23.575162887573242, "global_step": 157393, "epoch": 1896} {"train_loss": -23.37482452392578, "global_step": 157394, "epoch": 1896} {"train_loss": -23.279518127441406, "global_step": 157395, "epoch": 1896} {"train_loss": -23.324594497680664, "global_step": 157396, "epoch": 1896} {"train_loss": -23.380613327026367, "global_step": 157397, "epoch": 1896} {"train_loss": -23.389699935913086, "global_step": 157398, "epoch": 1896} {"train_loss": -23.536365509033203, "global_step": 157399, "epoch": 1896} {"train_loss": -23.26152801513672, "global_step": 157400, "epoch": 1896} {"train_loss": -23.746854782104492, "global_step": 157401, "epoch": 1896} {"train_loss": -23.869705200195312, "global_step": 157402, "epoch": 1896} {"train_loss": -23.76326560974121, "global_step": 157403, "epoch": 1896} {"train_loss": -23.283987045288086, "global_step": 157404, "epoch": 1896} {"train_loss": -23.11475944519043, "global_step": 157405, "epoch": 1896} {"train_loss": -23.29615020751953, "global_step": 157406, "epoch": 1896} {"train_loss": -23.393117904663086, "global_step": 157407, "epoch": 1896} {"train_loss": -23.19318199157715, "global_step": 157408, "epoch": 1896} {"train_loss": -23.2686767578125, "global_step": 157409, "epoch": 1896} {"train_loss": -23.609506607055664, "global_step": 157410, "epoch": 1896} {"train_loss": -23.19437599182129, "global_step": 157411, "epoch": 1896} {"train_loss": -23.316789627075195, "global_step": 157412, "epoch": 1896} {"train_loss": -23.51499366760254, "global_step": 157413, "epoch": 1896} {"train_loss": -23.594058990478516, "global_step": 157414, "epoch": 1896} {"train_loss": -23.363264083862305, "global_step": 157415, "epoch": 1896} {"train_loss": -23.82828712463379, "global_step": 157416, "epoch": 1896} {"train_loss": -23.138662338256836, "global_step": 157417, "epoch": 1896} {"train_loss": -23.349573135375977, "global_step": 157418, "epoch": 1896} {"train_loss": -23.698461532592773, "global_step": 157419, "epoch": 1896} {"train_loss": -23.715349197387695, "global_step": 157420, "epoch": 1896} {"train_loss": -23.797433853149414, "global_step": 157421, "epoch": 1896} {"train_loss": -23.505714416503906, "global_step": 157422, "epoch": 1896} {"train_loss": -23.449045181274414, "global_step": 157423, "epoch": 1896} {"train_loss": -23.480274200439453, "global_step": 157424, "epoch": 1896} {"train_loss": -23.518917083740234, "global_step": 157425, "epoch": 1896} {"train_loss": -23.367420196533203, "global_step": 157426, "epoch": 1896} {"train_loss": -23.443883895874023, "global_step": 157427, "epoch": 1896} {"train_loss": -23.736770629882812, "global_step": 157428, "epoch": 1896} {"train_loss": -23.64099884033203, "global_step": 157429, "epoch": 1896} {"train_loss": -23.177799224853516, "global_step": 157430, "epoch": 1896} {"train_loss": -23.928823471069336, "global_step": 157431, "epoch": 1896} {"train_loss": -23.6843318939209, "global_step": 157432, "epoch": 1896} {"train_loss": -23.705646514892578, "global_step": 157433, "epoch": 1896} {"train_loss": -23.84449005126953, "global_step": 157434, "epoch": 1896} {"train_loss": -23.758020401000977, "global_step": 157435, "epoch": 1896} {"train_loss": -23.635801315307617, "global_step": 157436, "epoch": 1896} {"train_loss": -23.744596481323242, "global_step": 157437, "epoch": 1896} {"train_loss": -23.723670959472656, "global_step": 157438, "epoch": 1896} {"train_loss": -23.698240280151367, "global_step": 157439, "epoch": 1896} {"train_loss": -23.22865867614746, "global_step": 157440, "epoch": 1896} {"train_loss": -23.40873146057129, "global_step": 157441, "epoch": 1896} {"train_loss": -23.51021385192871, "global_step": 157442, "epoch": 1896} {"train_loss": -23.640222549438477, "global_step": 157443, "epoch": 1896} {"train_loss": -23.655813217163086, "global_step": 157444, "epoch": 1896} {"train_loss": -23.78696060180664, "global_step": 157445, "epoch": 1896} {"train_loss": -23.620426177978516, "global_step": 157446, "epoch": 1896} {"train_loss": -23.037220001220703, "global_step": 157447, "epoch": 1896} {"train_loss": -23.716794967651367, "global_step": 157448, "epoch": 1896} {"train_loss": -23.673681259155273, "global_step": 157449, "epoch": 1896} {"train_loss": -23.440490538815418, "global_step": 157450, "epoch": 1896, "val_loss": 6531929.0} {"train_loss": -23.256244659423828, "global_step": 157451, "epoch": 1897} {"train_loss": -22.835466384887695, "global_step": 157452, "epoch": 1897} {"train_loss": -23.228010177612305, "global_step": 157453, "epoch": 1897} {"train_loss": -23.260282516479492, "global_step": 157454, "epoch": 1897} {"train_loss": -22.448034286499023, "global_step": 157455, "epoch": 1897} {"train_loss": -23.017236709594727, "global_step": 157456, "epoch": 1897} {"train_loss": -23.03801918029785, "global_step": 157457, "epoch": 1897} {"train_loss": -23.15264320373535, "global_step": 157458, "epoch": 1897} {"train_loss": -23.173879623413086, "global_step": 157459, "epoch": 1897} {"train_loss": -22.774328231811523, "global_step": 157460, "epoch": 1897} {"train_loss": -22.786245346069336, "global_step": 157461, "epoch": 1897} {"train_loss": -23.35267448425293, "global_step": 157462, "epoch": 1897} {"train_loss": -22.760019302368164, "global_step": 157463, "epoch": 1897} {"train_loss": -22.78687286376953, "global_step": 157464, "epoch": 1897} {"train_loss": -23.20509147644043, "global_step": 157465, "epoch": 1897} {"train_loss": -22.999544143676758, "global_step": 157466, "epoch": 1897} {"train_loss": -23.00975799560547, "global_step": 157467, "epoch": 1897} {"train_loss": -22.917640686035156, "global_step": 157468, "epoch": 1897} {"train_loss": -22.9288330078125, "global_step": 157469, "epoch": 1897} {"train_loss": -23.170345306396484, "global_step": 157470, "epoch": 1897} {"train_loss": -23.027061462402344, "global_step": 157471, "epoch": 1897} {"train_loss": -22.837934494018555, "global_step": 157472, "epoch": 1897} {"train_loss": -22.781095504760742, "global_step": 157473, "epoch": 1897} {"train_loss": -23.14881706237793, "global_step": 157474, "epoch": 1897} {"train_loss": -23.30805778503418, "global_step": 157475, "epoch": 1897} {"train_loss": -23.09134292602539, "global_step": 157476, "epoch": 1897} {"train_loss": -23.63362693786621, "global_step": 157477, "epoch": 1897} {"train_loss": -23.317718505859375, "global_step": 157478, "epoch": 1897} {"train_loss": -23.16627311706543, "global_step": 157479, "epoch": 1897} {"train_loss": -23.457630157470703, "global_step": 157480, "epoch": 1897} {"train_loss": -23.475379943847656, "global_step": 157481, "epoch": 1897} {"train_loss": -23.4014835357666, "global_step": 157482, "epoch": 1897} {"train_loss": -23.372282028198242, "global_step": 157483, "epoch": 1897} {"train_loss": -23.259950637817383, "global_step": 157484, "epoch": 1897} {"train_loss": -23.740116119384766, "global_step": 157485, "epoch": 1897} {"train_loss": -23.2233943939209, "global_step": 157486, "epoch": 1897} {"train_loss": -23.49161148071289, "global_step": 157487, "epoch": 1897} {"train_loss": -23.531049728393555, "global_step": 157488, "epoch": 1897} {"train_loss": -23.381240844726562, "global_step": 157489, "epoch": 1897} {"train_loss": -23.3272705078125, "global_step": 157490, "epoch": 1897} {"train_loss": -23.224220275878906, "global_step": 157491, "epoch": 1897} {"train_loss": -23.17146873474121, "global_step": 157492, "epoch": 1897} {"train_loss": -23.27727699279785, "global_step": 157493, "epoch": 1897} {"train_loss": -23.2774600982666, "global_step": 157494, "epoch": 1897} {"train_loss": -23.695871353149414, "global_step": 157495, "epoch": 1897} {"train_loss": -23.448415756225586, "global_step": 157496, "epoch": 1897} {"train_loss": -23.932676315307617, "global_step": 157497, "epoch": 1897} {"train_loss": -23.395627975463867, "global_step": 157498, "epoch": 1897} {"train_loss": -23.400339126586914, "global_step": 157499, "epoch": 1897} {"train_loss": -23.394874572753906, "global_step": 157500, "epoch": 1897} {"train_loss": -23.54425621032715, "global_step": 157501, "epoch": 1897} {"train_loss": -23.820974349975586, "global_step": 157502, "epoch": 1897} {"train_loss": -23.537626266479492, "global_step": 157503, "epoch": 1897} {"train_loss": -23.277212142944336, "global_step": 157504, "epoch": 1897} {"train_loss": -23.162473678588867, "global_step": 157505, "epoch": 1897} {"train_loss": -23.458295822143555, "global_step": 157506, "epoch": 1897} {"train_loss": -23.553510665893555, "global_step": 157507, "epoch": 1897} {"train_loss": -23.560375213623047, "global_step": 157508, "epoch": 1897} {"train_loss": -23.083209991455078, "global_step": 157509, "epoch": 1897} {"train_loss": -23.225666046142578, "global_step": 157510, "epoch": 1897} {"train_loss": -23.318744659423828, "global_step": 157511, "epoch": 1897} {"train_loss": -23.346845626831055, "global_step": 157512, "epoch": 1897} {"train_loss": -23.512170791625977, "global_step": 157513, "epoch": 1897} {"train_loss": -23.723798751831055, "global_step": 157514, "epoch": 1897} {"train_loss": -24.0916690826416, "global_step": 157515, "epoch": 1897} {"train_loss": -23.3577823638916, "global_step": 157516, "epoch": 1897} {"train_loss": -23.244415283203125, "global_step": 157517, "epoch": 1897} {"train_loss": -23.735803604125977, "global_step": 157518, "epoch": 1897} {"train_loss": -23.908933639526367, "global_step": 157519, "epoch": 1897} {"train_loss": -23.592496871948242, "global_step": 157520, "epoch": 1897} {"train_loss": -23.607513427734375, "global_step": 157521, "epoch": 1897} {"train_loss": -23.590835571289062, "global_step": 157522, "epoch": 1897} {"train_loss": -23.1411190032959, "global_step": 157523, "epoch": 1897} {"train_loss": -23.485204696655273, "global_step": 157524, "epoch": 1897} {"train_loss": -23.56987953186035, "global_step": 157525, "epoch": 1897} {"train_loss": -23.580169677734375, "global_step": 157526, "epoch": 1897} {"train_loss": -23.48555564880371, "global_step": 157527, "epoch": 1897} {"train_loss": -23.617874145507812, "global_step": 157528, "epoch": 1897} {"train_loss": -23.796329498291016, "global_step": 157529, "epoch": 1897} {"train_loss": -23.278432846069336, "global_step": 157530, "epoch": 1897} {"train_loss": -23.555509567260742, "global_step": 157531, "epoch": 1897} {"train_loss": -23.129600524902344, "global_step": 157532, "epoch": 1897} {"train_loss": -23.310029363057698, "global_step": 157533, "epoch": 1897, "val_loss": 6424275.0} {"train_loss": -23.261667251586914, "global_step": 157534, "epoch": 1898} {"train_loss": -23.165494918823242, "global_step": 157535, "epoch": 1898} {"train_loss": -22.9017276763916, "global_step": 157536, "epoch": 1898} {"train_loss": -23.197484970092773, "global_step": 157537, "epoch": 1898} {"train_loss": -23.05394172668457, "global_step": 157538, "epoch": 1898} {"train_loss": -23.162038803100586, "global_step": 157539, "epoch": 1898} {"train_loss": -23.334070205688477, "global_step": 157540, "epoch": 1898} {"train_loss": -23.469480514526367, "global_step": 157541, "epoch": 1898} {"train_loss": -23.119216918945312, "global_step": 157542, "epoch": 1898} {"train_loss": -23.4626522064209, "global_step": 157543, "epoch": 1898} {"train_loss": -23.260160446166992, "global_step": 157544, "epoch": 1898} {"train_loss": -23.63439178466797, "global_step": 157545, "epoch": 1898} {"train_loss": -23.108861923217773, "global_step": 157546, "epoch": 1898} {"train_loss": -23.132564544677734, "global_step": 157547, "epoch": 1898} {"train_loss": -23.368993759155273, "global_step": 157548, "epoch": 1898} {"train_loss": -23.194692611694336, "global_step": 157549, "epoch": 1898} {"train_loss": -23.17462730407715, "global_step": 157550, "epoch": 1898} {"train_loss": -23.732934951782227, "global_step": 157551, "epoch": 1898} {"train_loss": -23.51679039001465, "global_step": 157552, "epoch": 1898} {"train_loss": -23.45159339904785, "global_step": 157553, "epoch": 1898} {"train_loss": -23.337116241455078, "global_step": 157554, "epoch": 1898} {"train_loss": -23.844337463378906, "global_step": 157555, "epoch": 1898} {"train_loss": -23.345571517944336, "global_step": 157556, "epoch": 1898} {"train_loss": -23.22934341430664, "global_step": 157557, "epoch": 1898} {"train_loss": -23.42996597290039, "global_step": 157558, "epoch": 1898} {"train_loss": -23.122421264648438, "global_step": 157559, "epoch": 1898} {"train_loss": -23.033737182617188, "global_step": 157560, "epoch": 1898} {"train_loss": -23.1856689453125, "global_step": 157561, "epoch": 1898} {"train_loss": -23.603214263916016, "global_step": 157562, "epoch": 1898} {"train_loss": -23.158353805541992, "global_step": 157563, "epoch": 1898} {"train_loss": -23.173315048217773, "global_step": 157564, "epoch": 1898} {"train_loss": -23.271390914916992, "global_step": 157565, "epoch": 1898} {"train_loss": -23.484012603759766, "global_step": 157566, "epoch": 1898} {"train_loss": -23.624359130859375, "global_step": 157567, "epoch": 1898} {"train_loss": -23.405860900878906, "global_step": 157568, "epoch": 1898} {"train_loss": -23.362407684326172, "global_step": 157569, "epoch": 1898} {"train_loss": -23.253469467163086, "global_step": 157570, "epoch": 1898} {"train_loss": -23.428823471069336, "global_step": 157571, "epoch": 1898} {"train_loss": -23.428226470947266, "global_step": 157572, "epoch": 1898} {"train_loss": -23.307025909423828, "global_step": 157573, "epoch": 1898} {"train_loss": -23.564619064331055, "global_step": 157574, "epoch": 1898} {"train_loss": -23.197935104370117, "global_step": 157575, "epoch": 1898} {"train_loss": -23.40955924987793, "global_step": 157576, "epoch": 1898} {"train_loss": -23.380435943603516, "global_step": 157577, "epoch": 1898} {"train_loss": -23.23984718322754, "global_step": 157578, "epoch": 1898} {"train_loss": -23.877609252929688, "global_step": 157579, "epoch": 1898} {"train_loss": -23.363571166992188, "global_step": 157580, "epoch": 1898} {"train_loss": -23.239261627197266, "global_step": 157581, "epoch": 1898} {"train_loss": -23.238710403442383, "global_step": 157582, "epoch": 1898} {"train_loss": -23.48567771911621, "global_step": 157583, "epoch": 1898} {"train_loss": -23.46684455871582, "global_step": 157584, "epoch": 1898} {"train_loss": -23.568740844726562, "global_step": 157585, "epoch": 1898} {"train_loss": -23.17173194885254, "global_step": 157586, "epoch": 1898} {"train_loss": -23.395246505737305, "global_step": 157587, "epoch": 1898} {"train_loss": -23.2932186126709, "global_step": 157588, "epoch": 1898} {"train_loss": -23.605573654174805, "global_step": 157589, "epoch": 1898} {"train_loss": -23.531131744384766, "global_step": 157590, "epoch": 1898} {"train_loss": -23.474393844604492, "global_step": 157591, "epoch": 1898} {"train_loss": -23.366392135620117, "global_step": 157592, "epoch": 1898} {"train_loss": -23.612974166870117, "global_step": 157593, "epoch": 1898} {"train_loss": -23.583234786987305, "global_step": 157594, "epoch": 1898} {"train_loss": -23.499513626098633, "global_step": 157595, "epoch": 1898} {"train_loss": -23.103857040405273, "global_step": 157596, "epoch": 1898} {"train_loss": -23.7133731842041, "global_step": 157597, "epoch": 1898} {"train_loss": -23.395366668701172, "global_step": 157598, "epoch": 1898} {"train_loss": -23.27808380126953, "global_step": 157599, "epoch": 1898} {"train_loss": -22.846290588378906, "global_step": 157600, "epoch": 1898} {"train_loss": -23.63176155090332, "global_step": 157601, "epoch": 1898} {"train_loss": -23.360708236694336, "global_step": 157602, "epoch": 1898} {"train_loss": -22.955123901367188, "global_step": 157603, "epoch": 1898} {"train_loss": -23.348709106445312, "global_step": 157604, "epoch": 1898} {"train_loss": -23.418943405151367, "global_step": 157605, "epoch": 1898} {"train_loss": -23.424402236938477, "global_step": 157606, "epoch": 1898} {"train_loss": -23.17658042907715, "global_step": 157607, "epoch": 1898} {"train_loss": -23.625324249267578, "global_step": 157608, "epoch": 1898} {"train_loss": -23.385496139526367, "global_step": 157609, "epoch": 1898} {"train_loss": -23.399330139160156, "global_step": 157610, "epoch": 1898} {"train_loss": -23.480161666870117, "global_step": 157611, "epoch": 1898} {"train_loss": -23.17642593383789, "global_step": 157612, "epoch": 1898} {"train_loss": -23.16238021850586, "global_step": 157613, "epoch": 1898} {"train_loss": -23.269887924194336, "global_step": 157614, "epoch": 1898} {"train_loss": -23.33603858947754, "global_step": 157615, "epoch": 1898} {"train_loss": -23.369415627904687, "global_step": 157616, "epoch": 1898, "val_loss": 6260225.0} {"train_loss": -22.322986602783203, "global_step": 157617, "epoch": 1899} {"train_loss": -22.917007446289062, "global_step": 157618, "epoch": 1899} {"train_loss": -22.427656173706055, "global_step": 157619, "epoch": 1899} {"train_loss": -23.24691390991211, "global_step": 157620, "epoch": 1899} {"train_loss": -22.924766540527344, "global_step": 157621, "epoch": 1899} {"train_loss": -22.78045082092285, "global_step": 157622, "epoch": 1899} {"train_loss": -22.86464500427246, "global_step": 157623, "epoch": 1899} {"train_loss": -23.02182960510254, "global_step": 157624, "epoch": 1899} {"train_loss": -22.93278694152832, "global_step": 157625, "epoch": 1899} {"train_loss": -22.806142807006836, "global_step": 157626, "epoch": 1899} {"train_loss": -23.004173278808594, "global_step": 157627, "epoch": 1899} {"train_loss": -23.054519653320312, "global_step": 157628, "epoch": 1899} {"train_loss": -23.247793197631836, "global_step": 157629, "epoch": 1899} {"train_loss": -22.86886978149414, "global_step": 157630, "epoch": 1899} {"train_loss": -23.059289932250977, "global_step": 157631, "epoch": 1899} {"train_loss": -23.074859619140625, "global_step": 157632, "epoch": 1899} {"train_loss": -23.19061851501465, "global_step": 157633, "epoch": 1899} {"train_loss": -23.239885330200195, "global_step": 157634, "epoch": 1899} {"train_loss": -23.391660690307617, "global_step": 157635, "epoch": 1899} {"train_loss": -23.408100128173828, "global_step": 157636, "epoch": 1899} {"train_loss": -23.375213623046875, "global_step": 157637, "epoch": 1899} {"train_loss": -23.460983276367188, "global_step": 157638, "epoch": 1899} {"train_loss": -23.504175186157227, "global_step": 157639, "epoch": 1899} {"train_loss": -22.855623245239258, "global_step": 157640, "epoch": 1899} {"train_loss": -23.261219024658203, "global_step": 157641, "epoch": 1899} {"train_loss": -23.177526473999023, "global_step": 157642, "epoch": 1899} {"train_loss": -23.474964141845703, "global_step": 157643, "epoch": 1899} {"train_loss": -23.65662956237793, "global_step": 157644, "epoch": 1899} {"train_loss": -23.586362838745117, "global_step": 157645, "epoch": 1899} {"train_loss": -23.475072860717773, "global_step": 157646, "epoch": 1899} {"train_loss": -23.21510887145996, "global_step": 157647, "epoch": 1899} {"train_loss": -23.34490394592285, "global_step": 157648, "epoch": 1899} {"train_loss": -23.451047897338867, "global_step": 157649, "epoch": 1899} {"train_loss": -23.452320098876953, "global_step": 157650, "epoch": 1899} {"train_loss": -23.296672821044922, "global_step": 157651, "epoch": 1899} {"train_loss": -23.317533493041992, "global_step": 157652, "epoch": 1899} {"train_loss": -23.023876190185547, "global_step": 157653, "epoch": 1899} {"train_loss": -23.624225616455078, "global_step": 157654, "epoch": 1899} {"train_loss": -23.5886173248291, "global_step": 157655, "epoch": 1899} {"train_loss": -23.237258911132812, "global_step": 157656, "epoch": 1899} {"train_loss": -23.11732292175293, "global_step": 157657, "epoch": 1899} {"train_loss": -23.57979393005371, "global_step": 157658, "epoch": 1899} {"train_loss": -23.534564971923828, "global_step": 157659, "epoch": 1899} {"train_loss": -23.227827072143555, "global_step": 157660, "epoch": 1899} {"train_loss": -23.390111923217773, "global_step": 157661, "epoch": 1899} {"train_loss": -23.496885299682617, "global_step": 157662, "epoch": 1899} {"train_loss": -23.42252540588379, "global_step": 157663, "epoch": 1899} {"train_loss": -23.347745895385742, "global_step": 157664, "epoch": 1899} {"train_loss": -23.022905349731445, "global_step": 157665, "epoch": 1899} {"train_loss": -23.243078231811523, "global_step": 157666, "epoch": 1899} {"train_loss": -23.46489906311035, "global_step": 157667, "epoch": 1899} {"train_loss": -23.5216121673584, "global_step": 157668, "epoch": 1899} {"train_loss": -23.58298683166504, "global_step": 157669, "epoch": 1899} {"train_loss": -23.44497299194336, "global_step": 157670, "epoch": 1899} {"train_loss": -23.870004653930664, "global_step": 157671, "epoch": 1899} {"train_loss": -23.30038833618164, "global_step": 157672, "epoch": 1899} {"train_loss": -23.69226837158203, "global_step": 157673, "epoch": 1899} {"train_loss": -23.082515716552734, "global_step": 157674, "epoch": 1899} {"train_loss": -23.220840454101562, "global_step": 157675, "epoch": 1899} {"train_loss": -23.380178451538086, "global_step": 157676, "epoch": 1899} {"train_loss": -23.38910484313965, "global_step": 157677, "epoch": 1899} {"train_loss": -23.60611915588379, "global_step": 157678, "epoch": 1899} {"train_loss": -23.764755249023438, "global_step": 157679, "epoch": 1899} {"train_loss": -23.716463088989258, "global_step": 157680, "epoch": 1899} {"train_loss": -23.38372230529785, "global_step": 157681, "epoch": 1899} {"train_loss": -23.8897647857666, "global_step": 157682, "epoch": 1899} {"train_loss": -23.872549057006836, "global_step": 157683, "epoch": 1899} {"train_loss": -23.3215274810791, "global_step": 157684, "epoch": 1899} {"train_loss": -23.480670928955078, "global_step": 157685, "epoch": 1899} {"train_loss": -23.126436233520508, "global_step": 157686, "epoch": 1899} {"train_loss": -23.417905807495117, "global_step": 157687, "epoch": 1899} {"train_loss": -23.549320220947266, "global_step": 157688, "epoch": 1899} {"train_loss": -23.340286254882812, "global_step": 157689, "epoch": 1899} {"train_loss": -23.722227096557617, "global_step": 157690, "epoch": 1899} {"train_loss": -23.62095832824707, "global_step": 157691, "epoch": 1899} {"train_loss": -23.501577377319336, "global_step": 157692, "epoch": 1899} {"train_loss": -23.489595413208008, "global_step": 157693, "epoch": 1899} {"train_loss": -23.08578872680664, "global_step": 157694, "epoch": 1899} {"train_loss": -23.4375, "global_step": 157695, "epoch": 1899} {"train_loss": -23.34665870666504, "global_step": 157696, "epoch": 1899} {"train_loss": -23.343046188354492, "global_step": 157697, "epoch": 1899} {"train_loss": -23.2174072265625, "global_step": 157698, "epoch": 1899} {"train_loss": -23.326018092143965, "global_step": 157699, "epoch": 1899, "val_loss": 6362952.0} {"train_loss": -22.779539108276367, "global_step": 157700, "epoch": 1900} {"train_loss": -22.120407104492188, "global_step": 157701, "epoch": 1900} {"train_loss": -23.131498336791992, "global_step": 157702, "epoch": 1900} {"train_loss": -22.707717895507812, "global_step": 157703, "epoch": 1900} {"train_loss": -22.75543785095215, "global_step": 157704, "epoch": 1900} {"train_loss": -23.134984970092773, "global_step": 157705, "epoch": 1900} {"train_loss": -23.014728546142578, "global_step": 157706, "epoch": 1900} {"train_loss": -23.01769256591797, "global_step": 157707, "epoch": 1900} {"train_loss": -23.229480743408203, "global_step": 157708, "epoch": 1900} {"train_loss": -22.79606819152832, "global_step": 157709, "epoch": 1900} {"train_loss": -23.317724227905273, "global_step": 157710, "epoch": 1900} {"train_loss": -23.45562744140625, "global_step": 157711, "epoch": 1900} {"train_loss": -23.208417892456055, "global_step": 157712, "epoch": 1900} {"train_loss": -23.405759811401367, "global_step": 157713, "epoch": 1900} {"train_loss": -23.197879791259766, "global_step": 157714, "epoch": 1900} {"train_loss": -23.240154266357422, "global_step": 157715, "epoch": 1900} {"train_loss": -23.434364318847656, "global_step": 157716, "epoch": 1900} {"train_loss": -23.49554443359375, "global_step": 157717, "epoch": 1900} {"train_loss": -23.161901473999023, "global_step": 157718, "epoch": 1900} {"train_loss": -23.131423950195312, "global_step": 157719, "epoch": 1900} {"train_loss": -23.620132446289062, "global_step": 157720, "epoch": 1900} {"train_loss": -23.439254760742188, "global_step": 157721, "epoch": 1900} {"train_loss": -23.345233917236328, "global_step": 157722, "epoch": 1900} {"train_loss": -23.113096237182617, "global_step": 157723, "epoch": 1900} {"train_loss": -23.211753845214844, "global_step": 157724, "epoch": 1900} {"train_loss": -23.500532150268555, "global_step": 157725, "epoch": 1900} {"train_loss": -23.230194091796875, "global_step": 157726, "epoch": 1900} {"train_loss": -23.333311080932617, "global_step": 157727, "epoch": 1900} {"train_loss": -23.567302703857422, "global_step": 157728, "epoch": 1900} {"train_loss": -23.413959503173828, "global_step": 157729, "epoch": 1900} {"train_loss": -23.434566497802734, "global_step": 157730, "epoch": 1900} {"train_loss": -23.615285873413086, "global_step": 157731, "epoch": 1900} {"train_loss": -23.26580238342285, "global_step": 157732, "epoch": 1900} {"train_loss": -23.844528198242188, "global_step": 157733, "epoch": 1900} {"train_loss": -23.425138473510742, "global_step": 157734, "epoch": 1900} {"train_loss": -23.533363342285156, "global_step": 157735, "epoch": 1900} {"train_loss": -23.200733184814453, "global_step": 157736, "epoch": 1900} {"train_loss": -23.251890182495117, "global_step": 157737, "epoch": 1900} {"train_loss": -23.399709701538086, "global_step": 157738, "epoch": 1900} {"train_loss": -23.386587142944336, "global_step": 157739, "epoch": 1900} {"train_loss": -23.197650909423828, "global_step": 157740, "epoch": 1900} {"train_loss": -23.497364044189453, "global_step": 157741, "epoch": 1900} {"train_loss": -23.44919776916504, "global_step": 157742, "epoch": 1900} {"train_loss": -23.505582809448242, "global_step": 157743, "epoch": 1900} {"train_loss": -23.130491256713867, "global_step": 157744, "epoch": 1900} {"train_loss": -23.147872924804688, "global_step": 157745, "epoch": 1900} {"train_loss": -23.86322784423828, "global_step": 157746, "epoch": 1900} {"train_loss": -23.400537490844727, "global_step": 157747, "epoch": 1900} {"train_loss": -23.058759689331055, "global_step": 157748, "epoch": 1900} {"train_loss": -23.518333435058594, "global_step": 157749, "epoch": 1900} {"train_loss": -23.525564193725586, "global_step": 157750, "epoch": 1900} {"train_loss": -23.083938598632812, "global_step": 157751, "epoch": 1900} {"train_loss": -23.425207138061523, "global_step": 157752, "epoch": 1900} {"train_loss": -23.365535736083984, "global_step": 157753, "epoch": 1900} {"train_loss": -23.43494987487793, "global_step": 157754, "epoch": 1900} {"train_loss": -23.578144073486328, "global_step": 157755, "epoch": 1900} {"train_loss": -23.5645751953125, "global_step": 157756, "epoch": 1900} {"train_loss": -23.39920425415039, "global_step": 157757, "epoch": 1900} {"train_loss": -23.242877960205078, "global_step": 157758, "epoch": 1900} {"train_loss": -23.550350189208984, "global_step": 157759, "epoch": 1900} {"train_loss": -23.452112197875977, "global_step": 157760, "epoch": 1900} {"train_loss": -23.634140014648438, "global_step": 157761, "epoch": 1900} {"train_loss": -23.70792007446289, "global_step": 157762, "epoch": 1900} {"train_loss": -23.343236923217773, "global_step": 157763, "epoch": 1900} {"train_loss": -23.250585556030273, "global_step": 157764, "epoch": 1900} {"train_loss": -23.45004653930664, "global_step": 157765, "epoch": 1900} {"train_loss": -23.68348503112793, "global_step": 157766, "epoch": 1900} {"train_loss": -23.366004943847656, "global_step": 157767, "epoch": 1900} {"train_loss": -23.609783172607422, "global_step": 157768, "epoch": 1900} {"train_loss": -23.52854347229004, "global_step": 157769, "epoch": 1900} {"train_loss": -23.742578506469727, "global_step": 157770, "epoch": 1900} {"train_loss": -23.895273208618164, "global_step": 157771, "epoch": 1900} {"train_loss": -23.11812400817871, "global_step": 157772, "epoch": 1900} {"train_loss": -23.164745330810547, "global_step": 157773, "epoch": 1900} {"train_loss": -23.024457931518555, "global_step": 157774, "epoch": 1900} {"train_loss": -23.62504005432129, "global_step": 157775, "epoch": 1900} {"train_loss": -23.29203987121582, "global_step": 157776, "epoch": 1900} {"train_loss": -23.414846420288086, "global_step": 157777, "epoch": 1900} {"train_loss": -23.592947006225586, "global_step": 157778, "epoch": 1900} {"train_loss": -23.341217041015625, "global_step": 157779, "epoch": 1900} {"train_loss": -23.57927703857422, "global_step": 157780, "epoch": 1900} {"train_loss": -23.4663143157959, "global_step": 157781, "epoch": 1900} {"train_loss": -23.341418530567584, "global_step": 157782, "epoch": 1900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6369826.5} {"train_loss": -21.73260498046875, "global_step": 157783, "epoch": 1901} {"train_loss": -22.251596450805664, "global_step": 157784, "epoch": 1901} {"train_loss": -22.49070167541504, "global_step": 157785, "epoch": 1901} {"train_loss": -22.43097496032715, "global_step": 157786, "epoch": 1901} {"train_loss": -22.686986923217773, "global_step": 157787, "epoch": 1901} {"train_loss": -23.070104598999023, "global_step": 157788, "epoch": 1901} {"train_loss": -22.60888671875, "global_step": 157789, "epoch": 1901} {"train_loss": -22.78510856628418, "global_step": 157790, "epoch": 1901} {"train_loss": -22.395429611206055, "global_step": 157791, "epoch": 1901} {"train_loss": -22.7355899810791, "global_step": 157792, "epoch": 1901} {"train_loss": -22.654951095581055, "global_step": 157793, "epoch": 1901} {"train_loss": -22.72296905517578, "global_step": 157794, "epoch": 1901} {"train_loss": -23.0211238861084, "global_step": 157795, "epoch": 1901} {"train_loss": -23.159109115600586, "global_step": 157796, "epoch": 1901} {"train_loss": -22.97831153869629, "global_step": 157797, "epoch": 1901} {"train_loss": -22.59305191040039, "global_step": 157798, "epoch": 1901} {"train_loss": -23.383777618408203, "global_step": 157799, "epoch": 1901} {"train_loss": -23.181640625, "global_step": 157800, "epoch": 1901} {"train_loss": -22.814271926879883, "global_step": 157801, "epoch": 1901} {"train_loss": -23.0665340423584, "global_step": 157802, "epoch": 1901} {"train_loss": -23.124876022338867, "global_step": 157803, "epoch": 1901} {"train_loss": -23.32529067993164, "global_step": 157804, "epoch": 1901} {"train_loss": -23.11764907836914, "global_step": 157805, "epoch": 1901} {"train_loss": -23.108030319213867, "global_step": 157806, "epoch": 1901} {"train_loss": -23.301258087158203, "global_step": 157807, "epoch": 1901} {"train_loss": -23.459400177001953, "global_step": 157808, "epoch": 1901} {"train_loss": -23.402372360229492, "global_step": 157809, "epoch": 1901} {"train_loss": -23.15675163269043, "global_step": 157810, "epoch": 1901} {"train_loss": -23.745269775390625, "global_step": 157811, "epoch": 1901} {"train_loss": -23.047666549682617, "global_step": 157812, "epoch": 1901} {"train_loss": -23.478973388671875, "global_step": 157813, "epoch": 1901} {"train_loss": -23.37404441833496, "global_step": 157814, "epoch": 1901} {"train_loss": -23.352754592895508, "global_step": 157815, "epoch": 1901} {"train_loss": -23.39328384399414, "global_step": 157816, "epoch": 1901} {"train_loss": -23.202381134033203, "global_step": 157817, "epoch": 1901} {"train_loss": -23.3686580657959, "global_step": 157818, "epoch": 1901} {"train_loss": -23.193052291870117, "global_step": 157819, "epoch": 1901} {"train_loss": -23.24103355407715, "global_step": 157820, "epoch": 1901} {"train_loss": -23.10202980041504, "global_step": 157821, "epoch": 1901} {"train_loss": -23.217649459838867, "global_step": 157822, "epoch": 1901} {"train_loss": -23.43192481994629, "global_step": 157823, "epoch": 1901} {"train_loss": -23.382474899291992, "global_step": 157824, "epoch": 1901} {"train_loss": -23.228567123413086, "global_step": 157825, "epoch": 1901} {"train_loss": -23.23577117919922, "global_step": 157826, "epoch": 1901} {"train_loss": -23.260765075683594, "global_step": 157827, "epoch": 1901} {"train_loss": -23.270429611206055, "global_step": 157828, "epoch": 1901} {"train_loss": -23.57794761657715, "global_step": 157829, "epoch": 1901} {"train_loss": -23.60256004333496, "global_step": 157830, "epoch": 1901} {"train_loss": -23.4022274017334, "global_step": 157831, "epoch": 1901} {"train_loss": -23.33888816833496, "global_step": 157832, "epoch": 1901} {"train_loss": -23.36784553527832, "global_step": 157833, "epoch": 1901} {"train_loss": -23.165098190307617, "global_step": 157834, "epoch": 1901} {"train_loss": -23.563444137573242, "global_step": 157835, "epoch": 1901} {"train_loss": -22.915645599365234, "global_step": 157836, "epoch": 1901} {"train_loss": -23.211210250854492, "global_step": 157837, "epoch": 1901} {"train_loss": -23.545515060424805, "global_step": 157838, "epoch": 1901} {"train_loss": -22.917938232421875, "global_step": 157839, "epoch": 1901} {"train_loss": -23.29787826538086, "global_step": 157840, "epoch": 1901} {"train_loss": -23.355670928955078, "global_step": 157841, "epoch": 1901} {"train_loss": -23.873672485351562, "global_step": 157842, "epoch": 1901} {"train_loss": -23.260602951049805, "global_step": 157843, "epoch": 1901} {"train_loss": -23.709299087524414, "global_step": 157844, "epoch": 1901} {"train_loss": -23.23225212097168, "global_step": 157845, "epoch": 1901} {"train_loss": -23.105031967163086, "global_step": 157846, "epoch": 1901} {"train_loss": -23.525943756103516, "global_step": 157847, "epoch": 1901} {"train_loss": -23.47235679626465, "global_step": 157848, "epoch": 1901} {"train_loss": -23.72176170349121, "global_step": 157849, "epoch": 1901} {"train_loss": -23.453983306884766, "global_step": 157850, "epoch": 1901} {"train_loss": -23.736820220947266, "global_step": 157851, "epoch": 1901} {"train_loss": -23.49957275390625, "global_step": 157852, "epoch": 1901} {"train_loss": -23.370288848876953, "global_step": 157853, "epoch": 1901} {"train_loss": -23.16315269470215, "global_step": 157854, "epoch": 1901} {"train_loss": -23.763010025024414, "global_step": 157855, "epoch": 1901} {"train_loss": -23.33766746520996, "global_step": 157856, "epoch": 1901} {"train_loss": -23.314359664916992, "global_step": 157857, "epoch": 1901} {"train_loss": -23.194719314575195, "global_step": 157858, "epoch": 1901} {"train_loss": -23.356210708618164, "global_step": 157859, "epoch": 1901} {"train_loss": -23.445556640625, "global_step": 157860, "epoch": 1901} {"train_loss": -23.36678123474121, "global_step": 157861, "epoch": 1901} {"train_loss": -23.463651657104492, "global_step": 157862, "epoch": 1901} {"train_loss": -23.47084617614746, "global_step": 157863, "epoch": 1901} {"train_loss": -23.642623901367188, "global_step": 157864, "epoch": 1901} {"train_loss": -23.190085928124116, "global_step": 157865, "epoch": 1901, "val_loss": 6380117.0} {"train_loss": -23.425268173217773, "global_step": 157866, "epoch": 1902} {"train_loss": -23.373275756835938, "global_step": 157867, "epoch": 1902} {"train_loss": -23.351842880249023, "global_step": 157868, "epoch": 1902} {"train_loss": -23.55813217163086, "global_step": 157869, "epoch": 1902} {"train_loss": -23.497827529907227, "global_step": 157870, "epoch": 1902} {"train_loss": -23.209375381469727, "global_step": 157871, "epoch": 1902} {"train_loss": -23.35367774963379, "global_step": 157872, "epoch": 1902} {"train_loss": -23.194873809814453, "global_step": 157873, "epoch": 1902} {"train_loss": -23.473493576049805, "global_step": 157874, "epoch": 1902} {"train_loss": -23.789710998535156, "global_step": 157875, "epoch": 1902} {"train_loss": -23.617929458618164, "global_step": 157876, "epoch": 1902} {"train_loss": -23.505842208862305, "global_step": 157877, "epoch": 1902} {"train_loss": -23.51416015625, "global_step": 157878, "epoch": 1902} {"train_loss": -23.50428581237793, "global_step": 157879, "epoch": 1902} {"train_loss": -23.646570205688477, "global_step": 157880, "epoch": 1902} {"train_loss": -23.56281852722168, "global_step": 157881, "epoch": 1902} {"train_loss": -23.42763328552246, "global_step": 157882, "epoch": 1902} {"train_loss": -23.313520431518555, "global_step": 157883, "epoch": 1902} {"train_loss": -23.48468017578125, "global_step": 157884, "epoch": 1902} {"train_loss": -23.57950210571289, "global_step": 157885, "epoch": 1902} {"train_loss": -23.274473190307617, "global_step": 157886, "epoch": 1902} {"train_loss": -23.70037269592285, "global_step": 157887, "epoch": 1902} {"train_loss": -23.615509033203125, "global_step": 157888, "epoch": 1902} {"train_loss": -23.40229606628418, "global_step": 157889, "epoch": 1902} {"train_loss": -23.961753845214844, "global_step": 157890, "epoch": 1902} {"train_loss": -23.823062896728516, "global_step": 157891, "epoch": 1902} {"train_loss": -23.479318618774414, "global_step": 157892, "epoch": 1902} {"train_loss": -23.42714500427246, "global_step": 157893, "epoch": 1902} {"train_loss": -23.53142547607422, "global_step": 157894, "epoch": 1902} {"train_loss": -23.511470794677734, "global_step": 157895, "epoch": 1902} {"train_loss": -23.63247299194336, "global_step": 157896, "epoch": 1902} {"train_loss": -23.546615600585938, "global_step": 157897, "epoch": 1902} {"train_loss": -23.273176193237305, "global_step": 157898, "epoch": 1902} {"train_loss": -23.13087272644043, "global_step": 157899, "epoch": 1902} {"train_loss": -23.32466697692871, "global_step": 157900, "epoch": 1902} {"train_loss": -23.4057674407959, "global_step": 157901, "epoch": 1902} {"train_loss": -23.371503829956055, "global_step": 157902, "epoch": 1902} {"train_loss": -23.52961540222168, "global_step": 157903, "epoch": 1902} {"train_loss": -23.435468673706055, "global_step": 157904, "epoch": 1902} {"train_loss": -23.160430908203125, "global_step": 157905, "epoch": 1902} {"train_loss": -23.664838790893555, "global_step": 157906, "epoch": 1902} {"train_loss": -23.34836196899414, "global_step": 157907, "epoch": 1902} {"train_loss": -23.5644474029541, "global_step": 157908, "epoch": 1902} {"train_loss": -23.004297256469727, "global_step": 157909, "epoch": 1902} {"train_loss": -22.946247100830078, "global_step": 157910, "epoch": 1902} {"train_loss": -23.34258460998535, "global_step": 157911, "epoch": 1902} {"train_loss": -23.39885139465332, "global_step": 157912, "epoch": 1902} {"train_loss": -23.73058319091797, "global_step": 157913, "epoch": 1902} {"train_loss": -23.138792037963867, "global_step": 157914, "epoch": 1902} {"train_loss": -23.130002975463867, "global_step": 157915, "epoch": 1902} {"train_loss": -23.47164535522461, "global_step": 157916, "epoch": 1902} {"train_loss": -22.636228561401367, "global_step": 157917, "epoch": 1902} {"train_loss": -23.09820556640625, "global_step": 157918, "epoch": 1902} {"train_loss": -23.267770767211914, "global_step": 157919, "epoch": 1902} {"train_loss": -23.252819061279297, "global_step": 157920, "epoch": 1902} {"train_loss": -23.30820083618164, "global_step": 157921, "epoch": 1902} {"train_loss": -23.584760665893555, "global_step": 157922, "epoch": 1902} {"train_loss": -23.3707332611084, "global_step": 157923, "epoch": 1902} {"train_loss": -23.69923973083496, "global_step": 157924, "epoch": 1902} {"train_loss": -23.37549591064453, "global_step": 157925, "epoch": 1902} {"train_loss": -23.392803192138672, "global_step": 157926, "epoch": 1902} {"train_loss": -23.101316452026367, "global_step": 157927, "epoch": 1902} {"train_loss": -23.128963470458984, "global_step": 157928, "epoch": 1902} {"train_loss": -23.59697914123535, "global_step": 157929, "epoch": 1902} {"train_loss": -23.480823516845703, "global_step": 157930, "epoch": 1902} {"train_loss": -23.05000877380371, "global_step": 157931, "epoch": 1902} {"train_loss": -23.29257583618164, "global_step": 157932, "epoch": 1902} {"train_loss": -23.313867568969727, "global_step": 157933, "epoch": 1902} {"train_loss": -23.412160873413086, "global_step": 157934, "epoch": 1902} {"train_loss": -23.59784507751465, "global_step": 157935, "epoch": 1902} {"train_loss": -22.909143447875977, "global_step": 157936, "epoch": 1902} {"train_loss": -23.72802734375, "global_step": 157937, "epoch": 1902} {"train_loss": -23.312458038330078, "global_step": 157938, "epoch": 1902} {"train_loss": -23.49900245666504, "global_step": 157939, "epoch": 1902} {"train_loss": -23.58483123779297, "global_step": 157940, "epoch": 1902} {"train_loss": -23.3231143951416, "global_step": 157941, "epoch": 1902} {"train_loss": -23.900461196899414, "global_step": 157942, "epoch": 1902} {"train_loss": -23.5065975189209, "global_step": 157943, "epoch": 1902} {"train_loss": -23.722949981689453, "global_step": 157944, "epoch": 1902} {"train_loss": -23.441375732421875, "global_step": 157945, "epoch": 1902} {"train_loss": -23.58501625061035, "global_step": 157946, "epoch": 1902} {"train_loss": -23.617599487304688, "global_step": 157947, "epoch": 1902} {"train_loss": -23.424736804272754, "global_step": 157948, "epoch": 1902, "val_loss": 6281567.0} {"train_loss": -22.383813858032227, "global_step": 157949, "epoch": 1903} {"train_loss": -23.17067527770996, "global_step": 157950, "epoch": 1903} {"train_loss": -22.934619903564453, "global_step": 157951, "epoch": 1903} {"train_loss": -23.02976417541504, "global_step": 157952, "epoch": 1903} {"train_loss": -22.991901397705078, "global_step": 157953, "epoch": 1903} {"train_loss": -23.140151977539062, "global_step": 157954, "epoch": 1903} {"train_loss": -23.08687400817871, "global_step": 157955, "epoch": 1903} {"train_loss": -22.899072647094727, "global_step": 157956, "epoch": 1903} {"train_loss": -22.986114501953125, "global_step": 157957, "epoch": 1903} {"train_loss": -23.28516960144043, "global_step": 157958, "epoch": 1903} {"train_loss": -23.109052658081055, "global_step": 157959, "epoch": 1903} {"train_loss": -23.17066764831543, "global_step": 157960, "epoch": 1903} {"train_loss": -23.523244857788086, "global_step": 157961, "epoch": 1903} {"train_loss": -23.235912322998047, "global_step": 157962, "epoch": 1903} {"train_loss": -23.00147819519043, "global_step": 157963, "epoch": 1903} {"train_loss": -23.22101402282715, "global_step": 157964, "epoch": 1903} {"train_loss": -23.398900985717773, "global_step": 157965, "epoch": 1903} {"train_loss": -23.02559471130371, "global_step": 157966, "epoch": 1903} {"train_loss": -23.072269439697266, "global_step": 157967, "epoch": 1903} {"train_loss": -23.27291488647461, "global_step": 157968, "epoch": 1903} {"train_loss": -23.01554298400879, "global_step": 157969, "epoch": 1903} {"train_loss": -23.250102996826172, "global_step": 157970, "epoch": 1903} {"train_loss": -23.045087814331055, "global_step": 157971, "epoch": 1903} {"train_loss": -23.598411560058594, "global_step": 157972, "epoch": 1903} {"train_loss": -23.499988555908203, "global_step": 157973, "epoch": 1903} {"train_loss": -23.65714454650879, "global_step": 157974, "epoch": 1903} {"train_loss": -23.42213249206543, "global_step": 157975, "epoch": 1903} {"train_loss": -23.396732330322266, "global_step": 157976, "epoch": 1903} {"train_loss": -23.007625579833984, "global_step": 157977, "epoch": 1903} {"train_loss": -23.314697265625, "global_step": 157978, "epoch": 1903} {"train_loss": -23.423070907592773, "global_step": 157979, "epoch": 1903} {"train_loss": -23.985137939453125, "global_step": 157980, "epoch": 1903} {"train_loss": -23.498823165893555, "global_step": 157981, "epoch": 1903} {"train_loss": -23.63213348388672, "global_step": 157982, "epoch": 1903} {"train_loss": -23.326040267944336, "global_step": 157983, "epoch": 1903} {"train_loss": -23.746896743774414, "global_step": 157984, "epoch": 1903} {"train_loss": -23.543067932128906, "global_step": 157985, "epoch": 1903} {"train_loss": -23.619844436645508, "global_step": 157986, "epoch": 1903} {"train_loss": -23.25885581970215, "global_step": 157987, "epoch": 1903} {"train_loss": -23.613452911376953, "global_step": 157988, "epoch": 1903} {"train_loss": -23.604618072509766, "global_step": 157989, "epoch": 1903} {"train_loss": -23.728025436401367, "global_step": 157990, "epoch": 1903} {"train_loss": -23.174039840698242, "global_step": 157991, "epoch": 1903} {"train_loss": -23.714933395385742, "global_step": 157992, "epoch": 1903} {"train_loss": -23.713605880737305, "global_step": 157993, "epoch": 1903} {"train_loss": -23.525882720947266, "global_step": 157994, "epoch": 1903} {"train_loss": -23.901269912719727, "global_step": 157995, "epoch": 1903} {"train_loss": -24.062116622924805, "global_step": 157996, "epoch": 1903} {"train_loss": -23.369192123413086, "global_step": 157997, "epoch": 1903} {"train_loss": -23.364660263061523, "global_step": 157998, "epoch": 1903} {"train_loss": -23.73813819885254, "global_step": 157999, "epoch": 1903} {"train_loss": -23.344148635864258, "global_step": 158000, "epoch": 1903} {"train_loss": -23.36995506286621, "global_step": 158001, "epoch": 1903} {"train_loss": -23.534475326538086, "global_step": 158002, "epoch": 1903} {"train_loss": -23.40006446838379, "global_step": 158003, "epoch": 1903} {"train_loss": -23.542339324951172, "global_step": 158004, "epoch": 1903} {"train_loss": -23.354686737060547, "global_step": 158005, "epoch": 1903} {"train_loss": -23.44649314880371, "global_step": 158006, "epoch": 1903} {"train_loss": -23.535526275634766, "global_step": 158007, "epoch": 1903} {"train_loss": -23.17612075805664, "global_step": 158008, "epoch": 1903} {"train_loss": -23.066946029663086, "global_step": 158009, "epoch": 1903} {"train_loss": -23.39481544494629, "global_step": 158010, "epoch": 1903} {"train_loss": -23.737394332885742, "global_step": 158011, "epoch": 1903} {"train_loss": -23.311532974243164, "global_step": 158012, "epoch": 1903} {"train_loss": -23.373008728027344, "global_step": 158013, "epoch": 1903} {"train_loss": -23.470245361328125, "global_step": 158014, "epoch": 1903} {"train_loss": -23.609210968017578, "global_step": 158015, "epoch": 1903} {"train_loss": -23.212493896484375, "global_step": 158016, "epoch": 1903} {"train_loss": -23.33788299560547, "global_step": 158017, "epoch": 1903} {"train_loss": -23.17305564880371, "global_step": 158018, "epoch": 1903} {"train_loss": -23.28539276123047, "global_step": 158019, "epoch": 1903} {"train_loss": -23.73537254333496, "global_step": 158020, "epoch": 1903} {"train_loss": -23.560409545898438, "global_step": 158021, "epoch": 1903} {"train_loss": -23.657638549804688, "global_step": 158022, "epoch": 1903} {"train_loss": -23.569257736206055, "global_step": 158023, "epoch": 1903} {"train_loss": -23.54962730407715, "global_step": 158024, "epoch": 1903} {"train_loss": -23.833730697631836, "global_step": 158025, "epoch": 1903} {"train_loss": -23.202322006225586, "global_step": 158026, "epoch": 1903} {"train_loss": -23.465429306030273, "global_step": 158027, "epoch": 1903} {"train_loss": -23.575910568237305, "global_step": 158028, "epoch": 1903} {"train_loss": -23.41206932067871, "global_step": 158029, "epoch": 1903} {"train_loss": -23.30979347229004, "global_step": 158030, "epoch": 1903} {"train_loss": -23.375232236931122, "global_step": 158031, "epoch": 1903, "val_loss": 6386900.0} {"train_loss": -22.40929412841797, "global_step": 158032, "epoch": 1904} {"train_loss": -22.546186447143555, "global_step": 158033, "epoch": 1904} {"train_loss": -22.82208251953125, "global_step": 158034, "epoch": 1904} {"train_loss": -22.619426727294922, "global_step": 158035, "epoch": 1904} {"train_loss": -22.6189022064209, "global_step": 158036, "epoch": 1904} {"train_loss": -22.593412399291992, "global_step": 158037, "epoch": 1904} {"train_loss": -22.703325271606445, "global_step": 158038, "epoch": 1904} {"train_loss": -22.661087036132812, "global_step": 158039, "epoch": 1904} {"train_loss": -22.575363159179688, "global_step": 158040, "epoch": 1904} {"train_loss": -22.62662696838379, "global_step": 158041, "epoch": 1904} {"train_loss": -23.05893898010254, "global_step": 158042, "epoch": 1904} {"train_loss": -22.852298736572266, "global_step": 158043, "epoch": 1904} {"train_loss": -23.178062438964844, "global_step": 158044, "epoch": 1904} {"train_loss": -23.111047744750977, "global_step": 158045, "epoch": 1904} {"train_loss": -23.079992294311523, "global_step": 158046, "epoch": 1904} {"train_loss": -23.38594627380371, "global_step": 158047, "epoch": 1904} {"train_loss": -23.0314884185791, "global_step": 158048, "epoch": 1904} {"train_loss": -23.235750198364258, "global_step": 158049, "epoch": 1904} {"train_loss": -23.156225204467773, "global_step": 158050, "epoch": 1904} {"train_loss": -23.09510612487793, "global_step": 158051, "epoch": 1904} {"train_loss": -23.037017822265625, "global_step": 158052, "epoch": 1904} {"train_loss": -23.297353744506836, "global_step": 158053, "epoch": 1904} {"train_loss": -22.965381622314453, "global_step": 158054, "epoch": 1904} {"train_loss": -23.120288848876953, "global_step": 158055, "epoch": 1904} {"train_loss": -23.599950790405273, "global_step": 158056, "epoch": 1904} {"train_loss": -23.238815307617188, "global_step": 158057, "epoch": 1904} {"train_loss": -23.443811416625977, "global_step": 158058, "epoch": 1904} {"train_loss": -23.4580135345459, "global_step": 158059, "epoch": 1904} {"train_loss": -23.31314468383789, "global_step": 158060, "epoch": 1904} {"train_loss": -23.375635147094727, "global_step": 158061, "epoch": 1904} {"train_loss": -23.176151275634766, "global_step": 158062, "epoch": 1904} {"train_loss": -23.403030395507812, "global_step": 158063, "epoch": 1904} {"train_loss": -23.463876724243164, "global_step": 158064, "epoch": 1904} {"train_loss": -23.19757652282715, "global_step": 158065, "epoch": 1904} {"train_loss": -23.32245445251465, "global_step": 158066, "epoch": 1904} {"train_loss": -23.43773078918457, "global_step": 158067, "epoch": 1904} {"train_loss": -23.169843673706055, "global_step": 158068, "epoch": 1904} {"train_loss": -23.382949829101562, "global_step": 158069, "epoch": 1904} {"train_loss": -23.49555015563965, "global_step": 158070, "epoch": 1904} {"train_loss": -23.378719329833984, "global_step": 158071, "epoch": 1904} {"train_loss": -23.563383102416992, "global_step": 158072, "epoch": 1904} {"train_loss": -23.663164138793945, "global_step": 158073, "epoch": 1904} {"train_loss": -23.53361701965332, "global_step": 158074, "epoch": 1904} {"train_loss": -23.450647354125977, "global_step": 158075, "epoch": 1904} {"train_loss": -23.239492416381836, "global_step": 158076, "epoch": 1904} {"train_loss": -23.588735580444336, "global_step": 158077, "epoch": 1904} {"train_loss": -23.472900390625, "global_step": 158078, "epoch": 1904} {"train_loss": -23.72258949279785, "global_step": 158079, "epoch": 1904} {"train_loss": -23.447858810424805, "global_step": 158080, "epoch": 1904} {"train_loss": -23.493661880493164, "global_step": 158081, "epoch": 1904} {"train_loss": -23.41523551940918, "global_step": 158082, "epoch": 1904} {"train_loss": -23.492795944213867, "global_step": 158083, "epoch": 1904} {"train_loss": -23.470853805541992, "global_step": 158084, "epoch": 1904} {"train_loss": -23.567190170288086, "global_step": 158085, "epoch": 1904} {"train_loss": -23.458730697631836, "global_step": 158086, "epoch": 1904} {"train_loss": -23.547636032104492, "global_step": 158087, "epoch": 1904} {"train_loss": -23.62358856201172, "global_step": 158088, "epoch": 1904} {"train_loss": -23.46864891052246, "global_step": 158089, "epoch": 1904} {"train_loss": -23.603958129882812, "global_step": 158090, "epoch": 1904} {"train_loss": -23.31441879272461, "global_step": 158091, "epoch": 1904} {"train_loss": -22.689241409301758, "global_step": 158092, "epoch": 1904} {"train_loss": -23.17583656311035, "global_step": 158093, "epoch": 1904} {"train_loss": -23.444059371948242, "global_step": 158094, "epoch": 1904} {"train_loss": -23.30103874206543, "global_step": 158095, "epoch": 1904} {"train_loss": -23.17587661743164, "global_step": 158096, "epoch": 1904} {"train_loss": -23.087156295776367, "global_step": 158097, "epoch": 1904} {"train_loss": -23.539148330688477, "global_step": 158098, "epoch": 1904} {"train_loss": -23.21125030517578, "global_step": 158099, "epoch": 1904} {"train_loss": -23.22245979309082, "global_step": 158100, "epoch": 1904} {"train_loss": -23.520992279052734, "global_step": 158101, "epoch": 1904} {"train_loss": -23.8060359954834, "global_step": 158102, "epoch": 1904} {"train_loss": -23.495609283447266, "global_step": 158103, "epoch": 1904} {"train_loss": -23.654300689697266, "global_step": 158104, "epoch": 1904} {"train_loss": -23.26839828491211, "global_step": 158105, "epoch": 1904} {"train_loss": -23.556089401245117, "global_step": 158106, "epoch": 1904} {"train_loss": -23.29416847229004, "global_step": 158107, "epoch": 1904} {"train_loss": -23.310956954956055, "global_step": 158108, "epoch": 1904} {"train_loss": -23.33345603942871, "global_step": 158109, "epoch": 1904} {"train_loss": -23.484516143798828, "global_step": 158110, "epoch": 1904} {"train_loss": -23.70294189453125, "global_step": 158111, "epoch": 1904} {"train_loss": -23.753950119018555, "global_step": 158112, "epoch": 1904} {"train_loss": -23.912626266479492, "global_step": 158113, "epoch": 1904} {"train_loss": -23.30991572644337, "global_step": 158114, "epoch": 1904, "val_loss": 6284285.0} {"train_loss": -21.832595825195312, "global_step": 158115, "epoch": 1905} {"train_loss": -22.82147216796875, "global_step": 158116, "epoch": 1905} {"train_loss": -22.590282440185547, "global_step": 158117, "epoch": 1905} {"train_loss": -22.412206649780273, "global_step": 158118, "epoch": 1905} {"train_loss": -23.003896713256836, "global_step": 158119, "epoch": 1905} {"train_loss": -22.891925811767578, "global_step": 158120, "epoch": 1905} {"train_loss": -22.793760299682617, "global_step": 158121, "epoch": 1905} {"train_loss": -22.83977699279785, "global_step": 158122, "epoch": 1905} {"train_loss": -23.22835350036621, "global_step": 158123, "epoch": 1905} {"train_loss": -22.69708824157715, "global_step": 158124, "epoch": 1905} {"train_loss": -23.13524055480957, "global_step": 158125, "epoch": 1905} {"train_loss": -22.979976654052734, "global_step": 158126, "epoch": 1905} {"train_loss": -23.091796875, "global_step": 158127, "epoch": 1905} {"train_loss": -23.18057632446289, "global_step": 158128, "epoch": 1905} {"train_loss": -23.0408992767334, "global_step": 158129, "epoch": 1905} {"train_loss": -23.43227767944336, "global_step": 158130, "epoch": 1905} {"train_loss": -22.99020004272461, "global_step": 158131, "epoch": 1905} {"train_loss": -23.265308380126953, "global_step": 158132, "epoch": 1905} {"train_loss": -23.42524528503418, "global_step": 158133, "epoch": 1905} {"train_loss": -23.423446655273438, "global_step": 158134, "epoch": 1905} {"train_loss": -23.157943725585938, "global_step": 158135, "epoch": 1905} {"train_loss": -23.425947189331055, "global_step": 158136, "epoch": 1905} {"train_loss": -22.86341667175293, "global_step": 158137, "epoch": 1905} {"train_loss": -23.373647689819336, "global_step": 158138, "epoch": 1905} {"train_loss": -23.28133773803711, "global_step": 158139, "epoch": 1905} {"train_loss": -22.93674659729004, "global_step": 158140, "epoch": 1905} {"train_loss": -23.477298736572266, "global_step": 158141, "epoch": 1905} {"train_loss": -23.38692283630371, "global_step": 158142, "epoch": 1905} {"train_loss": -23.015518188476562, "global_step": 158143, "epoch": 1905} {"train_loss": -23.39985466003418, "global_step": 158144, "epoch": 1905} {"train_loss": -23.3692684173584, "global_step": 158145, "epoch": 1905} {"train_loss": -23.18680763244629, "global_step": 158146, "epoch": 1905} {"train_loss": -23.218542098999023, "global_step": 158147, "epoch": 1905} {"train_loss": -23.20304298400879, "global_step": 158148, "epoch": 1905} {"train_loss": -23.625883102416992, "global_step": 158149, "epoch": 1905} {"train_loss": -23.36166763305664, "global_step": 158150, "epoch": 1905} {"train_loss": -23.4956111907959, "global_step": 158151, "epoch": 1905} {"train_loss": -23.525739669799805, "global_step": 158152, "epoch": 1905} {"train_loss": -23.421613693237305, "global_step": 158153, "epoch": 1905} {"train_loss": -23.45570182800293, "global_step": 158154, "epoch": 1905} {"train_loss": -23.394662857055664, "global_step": 158155, "epoch": 1905} {"train_loss": -23.20230484008789, "global_step": 158156, "epoch": 1905} {"train_loss": -23.360536575317383, "global_step": 158157, "epoch": 1905} {"train_loss": -23.647855758666992, "global_step": 158158, "epoch": 1905} {"train_loss": -23.2178897857666, "global_step": 158159, "epoch": 1905} {"train_loss": -23.665311813354492, "global_step": 158160, "epoch": 1905} {"train_loss": -23.287521362304688, "global_step": 158161, "epoch": 1905} {"train_loss": -23.323102951049805, "global_step": 158162, "epoch": 1905} {"train_loss": -23.411012649536133, "global_step": 158163, "epoch": 1905} {"train_loss": -23.710065841674805, "global_step": 158164, "epoch": 1905} {"train_loss": -23.350494384765625, "global_step": 158165, "epoch": 1905} {"train_loss": -23.456233978271484, "global_step": 158166, "epoch": 1905} {"train_loss": -23.284564971923828, "global_step": 158167, "epoch": 1905} {"train_loss": -23.385953903198242, "global_step": 158168, "epoch": 1905} {"train_loss": -23.222084045410156, "global_step": 158169, "epoch": 1905} {"train_loss": -23.510290145874023, "global_step": 158170, "epoch": 1905} {"train_loss": -23.396591186523438, "global_step": 158171, "epoch": 1905} {"train_loss": -23.666479110717773, "global_step": 158172, "epoch": 1905} {"train_loss": -23.265138626098633, "global_step": 158173, "epoch": 1905} {"train_loss": -23.739728927612305, "global_step": 158174, "epoch": 1905} {"train_loss": -23.685495376586914, "global_step": 158175, "epoch": 1905} {"train_loss": -23.12952995300293, "global_step": 158176, "epoch": 1905} {"train_loss": -23.237991333007812, "global_step": 158177, "epoch": 1905} {"train_loss": -23.109067916870117, "global_step": 158178, "epoch": 1905} {"train_loss": -23.410364151000977, "global_step": 158179, "epoch": 1905} {"train_loss": -23.542173385620117, "global_step": 158180, "epoch": 1905} {"train_loss": -23.489492416381836, "global_step": 158181, "epoch": 1905} {"train_loss": -23.64402198791504, "global_step": 158182, "epoch": 1905} {"train_loss": -23.836606979370117, "global_step": 158183, "epoch": 1905} {"train_loss": -23.18345069885254, "global_step": 158184, "epoch": 1905} {"train_loss": -23.7032527923584, "global_step": 158185, "epoch": 1905} {"train_loss": -23.586450576782227, "global_step": 158186, "epoch": 1905} {"train_loss": -23.44087028503418, "global_step": 158187, "epoch": 1905} {"train_loss": -23.135671615600586, "global_step": 158188, "epoch": 1905} {"train_loss": -23.686120986938477, "global_step": 158189, "epoch": 1905} {"train_loss": -23.516010284423828, "global_step": 158190, "epoch": 1905} {"train_loss": -23.504880905151367, "global_step": 158191, "epoch": 1905} {"train_loss": -23.48126220703125, "global_step": 158192, "epoch": 1905} {"train_loss": -23.544981002807617, "global_step": 158193, "epoch": 1905} {"train_loss": -23.664112091064453, "global_step": 158194, "epoch": 1905} {"train_loss": -23.58880043029785, "global_step": 158195, "epoch": 1905} {"train_loss": -23.38888168334961, "global_step": 158196, "epoch": 1905} {"train_loss": -23.304826115987385, "global_step": 158197, "epoch": 1905, "val_loss": 6381402.0} {"train_loss": -22.786819458007812, "global_step": 158198, "epoch": 1906} {"train_loss": -22.755544662475586, "global_step": 158199, "epoch": 1906} {"train_loss": -22.9670467376709, "global_step": 158200, "epoch": 1906} {"train_loss": -22.937374114990234, "global_step": 158201, "epoch": 1906} {"train_loss": -23.02426528930664, "global_step": 158202, "epoch": 1906} {"train_loss": -23.223121643066406, "global_step": 158203, "epoch": 1906} {"train_loss": -23.20050621032715, "global_step": 158204, "epoch": 1906} {"train_loss": -23.225231170654297, "global_step": 158205, "epoch": 1906} {"train_loss": -22.986860275268555, "global_step": 158206, "epoch": 1906} {"train_loss": -23.37026596069336, "global_step": 158207, "epoch": 1906} {"train_loss": -22.731773376464844, "global_step": 158208, "epoch": 1906} {"train_loss": -22.518383026123047, "global_step": 158209, "epoch": 1906} {"train_loss": -23.02255630493164, "global_step": 158210, "epoch": 1906} {"train_loss": -23.057275772094727, "global_step": 158211, "epoch": 1906} {"train_loss": -23.126251220703125, "global_step": 158212, "epoch": 1906} {"train_loss": -23.132444381713867, "global_step": 158213, "epoch": 1906} {"train_loss": -22.95163345336914, "global_step": 158214, "epoch": 1906} {"train_loss": -23.247623443603516, "global_step": 158215, "epoch": 1906} {"train_loss": -23.117170333862305, "global_step": 158216, "epoch": 1906} {"train_loss": -23.09323501586914, "global_step": 158217, "epoch": 1906} {"train_loss": -23.125133514404297, "global_step": 158218, "epoch": 1906} {"train_loss": -23.81125259399414, "global_step": 158219, "epoch": 1906} {"train_loss": -23.150928497314453, "global_step": 158220, "epoch": 1906} {"train_loss": -23.429534912109375, "global_step": 158221, "epoch": 1906} {"train_loss": -23.250614166259766, "global_step": 158222, "epoch": 1906} {"train_loss": -23.554018020629883, "global_step": 158223, "epoch": 1906} {"train_loss": -23.2402286529541, "global_step": 158224, "epoch": 1906} {"train_loss": -23.281782150268555, "global_step": 158225, "epoch": 1906} {"train_loss": -23.60331153869629, "global_step": 158226, "epoch": 1906} {"train_loss": -23.5529842376709, "global_step": 158227, "epoch": 1906} {"train_loss": -23.490386962890625, "global_step": 158228, "epoch": 1906} {"train_loss": -23.320968627929688, "global_step": 158229, "epoch": 1906} {"train_loss": -23.589008331298828, "global_step": 158230, "epoch": 1906} {"train_loss": -23.679670333862305, "global_step": 158231, "epoch": 1906} {"train_loss": -23.26593589782715, "global_step": 158232, "epoch": 1906} {"train_loss": -23.50398063659668, "global_step": 158233, "epoch": 1906} {"train_loss": -23.650747299194336, "global_step": 158234, "epoch": 1906} {"train_loss": -23.33722496032715, "global_step": 158235, "epoch": 1906} {"train_loss": -23.44049644470215, "global_step": 158236, "epoch": 1906} {"train_loss": -23.423099517822266, "global_step": 158237, "epoch": 1906} {"train_loss": -23.361221313476562, "global_step": 158238, "epoch": 1906} {"train_loss": -23.621124267578125, "global_step": 158239, "epoch": 1906} {"train_loss": -23.7825927734375, "global_step": 158240, "epoch": 1906} {"train_loss": -23.570390701293945, "global_step": 158241, "epoch": 1906} {"train_loss": -23.635793685913086, "global_step": 158242, "epoch": 1906} {"train_loss": -23.345115661621094, "global_step": 158243, "epoch": 1906} {"train_loss": -23.72049903869629, "global_step": 158244, "epoch": 1906} {"train_loss": -23.261348724365234, "global_step": 158245, "epoch": 1906} {"train_loss": -23.0567626953125, "global_step": 158246, "epoch": 1906} {"train_loss": -23.105865478515625, "global_step": 158247, "epoch": 1906} {"train_loss": -23.392135620117188, "global_step": 158248, "epoch": 1906} {"train_loss": -23.484609603881836, "global_step": 158249, "epoch": 1906} {"train_loss": -23.40308952331543, "global_step": 158250, "epoch": 1906} {"train_loss": -23.536746978759766, "global_step": 158251, "epoch": 1906} {"train_loss": -23.702550888061523, "global_step": 158252, "epoch": 1906} {"train_loss": -23.6467227935791, "global_step": 158253, "epoch": 1906} {"train_loss": -23.329071044921875, "global_step": 158254, "epoch": 1906} {"train_loss": -22.788604736328125, "global_step": 158255, "epoch": 1906} {"train_loss": -23.672094345092773, "global_step": 158256, "epoch": 1906} {"train_loss": -23.645666122436523, "global_step": 158257, "epoch": 1906} {"train_loss": -23.078523635864258, "global_step": 158258, "epoch": 1906} {"train_loss": -23.355390548706055, "global_step": 158259, "epoch": 1906} {"train_loss": -23.326894760131836, "global_step": 158260, "epoch": 1906} {"train_loss": -23.121549606323242, "global_step": 158261, "epoch": 1906} {"train_loss": -23.568603515625, "global_step": 158262, "epoch": 1906} {"train_loss": -23.65488052368164, "global_step": 158263, "epoch": 1906} {"train_loss": -23.537572860717773, "global_step": 158264, "epoch": 1906} {"train_loss": -23.35590362548828, "global_step": 158265, "epoch": 1906} {"train_loss": -23.63583755493164, "global_step": 158266, "epoch": 1906} {"train_loss": -23.148731231689453, "global_step": 158267, "epoch": 1906} {"train_loss": -23.066396713256836, "global_step": 158268, "epoch": 1906} {"train_loss": -23.823537826538086, "global_step": 158269, "epoch": 1906} {"train_loss": -23.50503158569336, "global_step": 158270, "epoch": 1906} {"train_loss": -23.63129997253418, "global_step": 158271, "epoch": 1906} {"train_loss": -23.71609115600586, "global_step": 158272, "epoch": 1906} {"train_loss": -23.664249420166016, "global_step": 158273, "epoch": 1906} {"train_loss": -23.026020050048828, "global_step": 158274, "epoch": 1906} {"train_loss": -23.468870162963867, "global_step": 158275, "epoch": 1906} {"train_loss": -23.457433700561523, "global_step": 158276, "epoch": 1906} {"train_loss": -23.700597763061523, "global_step": 158277, "epoch": 1906} {"train_loss": -23.318326950073242, "global_step": 158278, "epoch": 1906} {"train_loss": -23.612751007080078, "global_step": 158279, "epoch": 1906} {"train_loss": -23.350277705364917, "global_step": 158280, "epoch": 1906, "val_loss": 6304635.0} {"train_loss": -23.243244171142578, "global_step": 158281, "epoch": 1907} {"train_loss": -23.40511131286621, "global_step": 158282, "epoch": 1907} {"train_loss": -23.41267204284668, "global_step": 158283, "epoch": 1907} {"train_loss": -23.350065231323242, "global_step": 158284, "epoch": 1907} {"train_loss": -23.590097427368164, "global_step": 158285, "epoch": 1907} {"train_loss": -23.806142807006836, "global_step": 158286, "epoch": 1907} {"train_loss": -23.5306453704834, "global_step": 158287, "epoch": 1907} {"train_loss": -23.367572784423828, "global_step": 158288, "epoch": 1907} {"train_loss": -23.277624130249023, "global_step": 158289, "epoch": 1907} {"train_loss": -23.5039119720459, "global_step": 158290, "epoch": 1907} {"train_loss": -23.264272689819336, "global_step": 158291, "epoch": 1907} {"train_loss": -23.509525299072266, "global_step": 158292, "epoch": 1907} {"train_loss": -23.33041000366211, "global_step": 158293, "epoch": 1907} {"train_loss": -23.1428279876709, "global_step": 158294, "epoch": 1907} {"train_loss": -23.04291343688965, "global_step": 158295, "epoch": 1907} {"train_loss": -23.387027740478516, "global_step": 158296, "epoch": 1907} {"train_loss": -23.394031524658203, "global_step": 158297, "epoch": 1907} {"train_loss": -23.401540756225586, "global_step": 158298, "epoch": 1907} {"train_loss": -23.404767990112305, "global_step": 158299, "epoch": 1907} {"train_loss": -23.34705924987793, "global_step": 158300, "epoch": 1907} {"train_loss": -23.182905197143555, "global_step": 158301, "epoch": 1907} {"train_loss": -23.287199020385742, "global_step": 158302, "epoch": 1907} {"train_loss": -23.4526424407959, "global_step": 158303, "epoch": 1907} {"train_loss": -23.583389282226562, "global_step": 158304, "epoch": 1907} {"train_loss": -23.49627685546875, "global_step": 158305, "epoch": 1907} {"train_loss": -23.481616973876953, "global_step": 158306, "epoch": 1907} {"train_loss": -23.219236373901367, "global_step": 158307, "epoch": 1907} {"train_loss": -23.326356887817383, "global_step": 158308, "epoch": 1907} {"train_loss": -23.606367111206055, "global_step": 158309, "epoch": 1907} {"train_loss": -23.536405563354492, "global_step": 158310, "epoch": 1907} {"train_loss": -23.456199645996094, "global_step": 158311, "epoch": 1907} {"train_loss": -23.423669815063477, "global_step": 158312, "epoch": 1907} {"train_loss": -23.2248477935791, "global_step": 158313, "epoch": 1907} {"train_loss": -23.546918869018555, "global_step": 158314, "epoch": 1907} {"train_loss": -23.49875259399414, "global_step": 158315, "epoch": 1907} {"train_loss": -23.582059860229492, "global_step": 158316, "epoch": 1907} {"train_loss": -23.759553909301758, "global_step": 158317, "epoch": 1907} {"train_loss": -23.512163162231445, "global_step": 158318, "epoch": 1907} {"train_loss": -23.833881378173828, "global_step": 158319, "epoch": 1907} {"train_loss": -23.21775245666504, "global_step": 158320, "epoch": 1907} {"train_loss": -23.12554359436035, "global_step": 158321, "epoch": 1907} {"train_loss": -23.162761688232422, "global_step": 158322, "epoch": 1907} {"train_loss": -23.52631187438965, "global_step": 158323, "epoch": 1907} {"train_loss": -23.447803497314453, "global_step": 158324, "epoch": 1907} {"train_loss": -23.05006980895996, "global_step": 158325, "epoch": 1907} {"train_loss": -23.328413009643555, "global_step": 158326, "epoch": 1907} {"train_loss": -23.683759689331055, "global_step": 158327, "epoch": 1907} {"train_loss": -23.5040225982666, "global_step": 158328, "epoch": 1907} {"train_loss": -23.961368560791016, "global_step": 158329, "epoch": 1907} {"train_loss": -23.562353134155273, "global_step": 158330, "epoch": 1907} {"train_loss": -23.384553909301758, "global_step": 158331, "epoch": 1907} {"train_loss": -23.903841018676758, "global_step": 158332, "epoch": 1907} {"train_loss": -22.978912353515625, "global_step": 158333, "epoch": 1907} {"train_loss": -23.43702507019043, "global_step": 158334, "epoch": 1907} {"train_loss": -23.4565372467041, "global_step": 158335, "epoch": 1907} {"train_loss": -23.387325286865234, "global_step": 158336, "epoch": 1907} {"train_loss": -23.75946807861328, "global_step": 158337, "epoch": 1907} {"train_loss": -23.35517692565918, "global_step": 158338, "epoch": 1907} {"train_loss": -23.6135311126709, "global_step": 158339, "epoch": 1907} {"train_loss": -23.75590705871582, "global_step": 158340, "epoch": 1907} {"train_loss": -23.564382553100586, "global_step": 158341, "epoch": 1907} {"train_loss": -23.60074234008789, "global_step": 158342, "epoch": 1907} {"train_loss": -23.330015182495117, "global_step": 158343, "epoch": 1907} {"train_loss": -23.661951065063477, "global_step": 158344, "epoch": 1907} {"train_loss": -23.776996612548828, "global_step": 158345, "epoch": 1907} {"train_loss": -23.80881118774414, "global_step": 158346, "epoch": 1907} {"train_loss": -23.426733016967773, "global_step": 158347, "epoch": 1907} {"train_loss": -23.7359561920166, "global_step": 158348, "epoch": 1907} {"train_loss": -23.632293701171875, "global_step": 158349, "epoch": 1907} {"train_loss": -23.598159790039062, "global_step": 158350, "epoch": 1907} {"train_loss": -23.455533981323242, "global_step": 158351, "epoch": 1907} {"train_loss": -23.566158294677734, "global_step": 158352, "epoch": 1907} {"train_loss": -23.4375057220459, "global_step": 158353, "epoch": 1907} {"train_loss": -23.2788028717041, "global_step": 158354, "epoch": 1907} {"train_loss": -23.79622459411621, "global_step": 158355, "epoch": 1907} {"train_loss": -23.60565757751465, "global_step": 158356, "epoch": 1907} {"train_loss": -23.315500259399414, "global_step": 158357, "epoch": 1907} {"train_loss": -23.702266693115234, "global_step": 158358, "epoch": 1907} {"train_loss": -23.21858024597168, "global_step": 158359, "epoch": 1907} {"train_loss": -23.262388229370117, "global_step": 158360, "epoch": 1907} {"train_loss": -23.53315544128418, "global_step": 158361, "epoch": 1907} {"train_loss": -23.520490646362305, "global_step": 158362, "epoch": 1907} {"train_loss": -23.44822058620223, "global_step": 158363, "epoch": 1907, "val_loss": 6354052.5} {"train_loss": -23.34519386291504, "global_step": 158364, "epoch": 1908} {"train_loss": -22.538503646850586, "global_step": 158365, "epoch": 1908} {"train_loss": -22.413251876831055, "global_step": 158366, "epoch": 1908} {"train_loss": -22.86305046081543, "global_step": 158367, "epoch": 1908} {"train_loss": -23.171905517578125, "global_step": 158368, "epoch": 1908} {"train_loss": -22.788959503173828, "global_step": 158369, "epoch": 1908} {"train_loss": -23.279266357421875, "global_step": 158370, "epoch": 1908} {"train_loss": -23.251245498657227, "global_step": 158371, "epoch": 1908} {"train_loss": -23.21993064880371, "global_step": 158372, "epoch": 1908} {"train_loss": -23.38728141784668, "global_step": 158373, "epoch": 1908} {"train_loss": -23.235876083374023, "global_step": 158374, "epoch": 1908} {"train_loss": -22.91096305847168, "global_step": 158375, "epoch": 1908} {"train_loss": -23.209829330444336, "global_step": 158376, "epoch": 1908} {"train_loss": -23.382959365844727, "global_step": 158377, "epoch": 1908} {"train_loss": -23.564374923706055, "global_step": 158378, "epoch": 1908} {"train_loss": -23.28731346130371, "global_step": 158379, "epoch": 1908} {"train_loss": -23.227432250976562, "global_step": 158380, "epoch": 1908} {"train_loss": -23.460073471069336, "global_step": 158381, "epoch": 1908} {"train_loss": -23.773786544799805, "global_step": 158382, "epoch": 1908} {"train_loss": -23.3536376953125, "global_step": 158383, "epoch": 1908} {"train_loss": -23.315921783447266, "global_step": 158384, "epoch": 1908} {"train_loss": -23.260644912719727, "global_step": 158385, "epoch": 1908} {"train_loss": -23.46206283569336, "global_step": 158386, "epoch": 1908} {"train_loss": -23.305116653442383, "global_step": 158387, "epoch": 1908} {"train_loss": -23.436067581176758, "global_step": 158388, "epoch": 1908} {"train_loss": -23.582876205444336, "global_step": 158389, "epoch": 1908} {"train_loss": -23.392932891845703, "global_step": 158390, "epoch": 1908} {"train_loss": -23.633363723754883, "global_step": 158391, "epoch": 1908} {"train_loss": -23.68259620666504, "global_step": 158392, "epoch": 1908} {"train_loss": -23.411741256713867, "global_step": 158393, "epoch": 1908} {"train_loss": -23.444639205932617, "global_step": 158394, "epoch": 1908} {"train_loss": -23.660934448242188, "global_step": 158395, "epoch": 1908} {"train_loss": -23.54364585876465, "global_step": 158396, "epoch": 1908} {"train_loss": -23.7902774810791, "global_step": 158397, "epoch": 1908} {"train_loss": -23.444429397583008, "global_step": 158398, "epoch": 1908} {"train_loss": -23.547338485717773, "global_step": 158399, "epoch": 1908} {"train_loss": -23.521324157714844, "global_step": 158400, "epoch": 1908} {"train_loss": -23.216447830200195, "global_step": 158401, "epoch": 1908} {"train_loss": -23.364994049072266, "global_step": 158402, "epoch": 1908} {"train_loss": -23.607519149780273, "global_step": 158403, "epoch": 1908} {"train_loss": -23.37649917602539, "global_step": 158404, "epoch": 1908} {"train_loss": -23.408496856689453, "global_step": 158405, "epoch": 1908} {"train_loss": -23.414039611816406, "global_step": 158406, "epoch": 1908} {"train_loss": -23.497257232666016, "global_step": 158407, "epoch": 1908} {"train_loss": -23.395904541015625, "global_step": 158408, "epoch": 1908} {"train_loss": -23.211584091186523, "global_step": 158409, "epoch": 1908} {"train_loss": -23.43733787536621, "global_step": 158410, "epoch": 1908} {"train_loss": -23.244796752929688, "global_step": 158411, "epoch": 1908} {"train_loss": -23.40218162536621, "global_step": 158412, "epoch": 1908} {"train_loss": -23.47308921813965, "global_step": 158413, "epoch": 1908} {"train_loss": -23.584508895874023, "global_step": 158414, "epoch": 1908} {"train_loss": -23.321487426757812, "global_step": 158415, "epoch": 1908} {"train_loss": -23.213748931884766, "global_step": 158416, "epoch": 1908} {"train_loss": -23.50333023071289, "global_step": 158417, "epoch": 1908} {"train_loss": -23.582136154174805, "global_step": 158418, "epoch": 1908} {"train_loss": -23.365798950195312, "global_step": 158419, "epoch": 1908} {"train_loss": -23.578943252563477, "global_step": 158420, "epoch": 1908} {"train_loss": -24.069599151611328, "global_step": 158421, "epoch": 1908} {"train_loss": -23.33015251159668, "global_step": 158422, "epoch": 1908} {"train_loss": -23.53727149963379, "global_step": 158423, "epoch": 1908} {"train_loss": -23.707731246948242, "global_step": 158424, "epoch": 1908} {"train_loss": -23.71933364868164, "global_step": 158425, "epoch": 1908} {"train_loss": -23.299457550048828, "global_step": 158426, "epoch": 1908} {"train_loss": -23.374418258666992, "global_step": 158427, "epoch": 1908} {"train_loss": -23.728836059570312, "global_step": 158428, "epoch": 1908} {"train_loss": -23.360864639282227, "global_step": 158429, "epoch": 1908} {"train_loss": -23.14787483215332, "global_step": 158430, "epoch": 1908} {"train_loss": -23.570707321166992, "global_step": 158431, "epoch": 1908} {"train_loss": -23.476736068725586, "global_step": 158432, "epoch": 1908} {"train_loss": -23.566566467285156, "global_step": 158433, "epoch": 1908} {"train_loss": -23.641864776611328, "global_step": 158434, "epoch": 1908} {"train_loss": -23.3791446685791, "global_step": 158435, "epoch": 1908} {"train_loss": -23.5544490814209, "global_step": 158436, "epoch": 1908} {"train_loss": -23.283254623413086, "global_step": 158437, "epoch": 1908} {"train_loss": -23.614662170410156, "global_step": 158438, "epoch": 1908} {"train_loss": -23.23481559753418, "global_step": 158439, "epoch": 1908} {"train_loss": -23.32803726196289, "global_step": 158440, "epoch": 1908} {"train_loss": -23.095529556274414, "global_step": 158441, "epoch": 1908} {"train_loss": -23.56139373779297, "global_step": 158442, "epoch": 1908} {"train_loss": -23.391599655151367, "global_step": 158443, "epoch": 1908} {"train_loss": -23.319738388061523, "global_step": 158444, "epoch": 1908} {"train_loss": -23.73984718322754, "global_step": 158445, "epoch": 1908} {"train_loss": -23.39930998560894, "global_step": 158446, "epoch": 1908, "val_loss": 6330867.5} {"train_loss": -23.1903018951416, "global_step": 158447, "epoch": 1909} {"train_loss": -23.258005142211914, "global_step": 158448, "epoch": 1909} {"train_loss": -23.609289169311523, "global_step": 158449, "epoch": 1909} {"train_loss": -23.524877548217773, "global_step": 158450, "epoch": 1909} {"train_loss": -22.89125633239746, "global_step": 158451, "epoch": 1909} {"train_loss": -23.07668113708496, "global_step": 158452, "epoch": 1909} {"train_loss": -22.759464263916016, "global_step": 158453, "epoch": 1909} {"train_loss": -23.20111083984375, "global_step": 158454, "epoch": 1909} {"train_loss": -23.089462280273438, "global_step": 158455, "epoch": 1909} {"train_loss": -23.071149826049805, "global_step": 158456, "epoch": 1909} {"train_loss": -22.951539993286133, "global_step": 158457, "epoch": 1909} {"train_loss": -23.115896224975586, "global_step": 158458, "epoch": 1909} {"train_loss": -23.123197555541992, "global_step": 158459, "epoch": 1909} {"train_loss": -23.404739379882812, "global_step": 158460, "epoch": 1909} {"train_loss": -23.5585994720459, "global_step": 158461, "epoch": 1909} {"train_loss": -22.88971519470215, "global_step": 158462, "epoch": 1909} {"train_loss": -23.4487361907959, "global_step": 158463, "epoch": 1909} {"train_loss": -23.34431266784668, "global_step": 158464, "epoch": 1909} {"train_loss": -23.399295806884766, "global_step": 158465, "epoch": 1909} {"train_loss": -23.412418365478516, "global_step": 158466, "epoch": 1909} {"train_loss": -23.413663864135742, "global_step": 158467, "epoch": 1909} {"train_loss": -23.83905029296875, "global_step": 158468, "epoch": 1909} {"train_loss": -23.522308349609375, "global_step": 158469, "epoch": 1909} {"train_loss": -23.681915283203125, "global_step": 158470, "epoch": 1909} {"train_loss": -23.57124137878418, "global_step": 158471, "epoch": 1909} {"train_loss": -23.279617309570312, "global_step": 158472, "epoch": 1909} {"train_loss": -23.234853744506836, "global_step": 158473, "epoch": 1909} {"train_loss": -23.49610710144043, "global_step": 158474, "epoch": 1909} {"train_loss": -23.796525955200195, "global_step": 158475, "epoch": 1909} {"train_loss": -23.345693588256836, "global_step": 158476, "epoch": 1909} {"train_loss": -23.339326858520508, "global_step": 158477, "epoch": 1909} {"train_loss": -23.70003890991211, "global_step": 158478, "epoch": 1909} {"train_loss": -23.739221572875977, "global_step": 158479, "epoch": 1909} {"train_loss": -23.277835845947266, "global_step": 158480, "epoch": 1909} {"train_loss": -23.450057983398438, "global_step": 158481, "epoch": 1909} {"train_loss": -23.45277976989746, "global_step": 158482, "epoch": 1909} {"train_loss": -23.52695083618164, "global_step": 158483, "epoch": 1909} {"train_loss": -23.339115142822266, "global_step": 158484, "epoch": 1909} {"train_loss": -23.59668731689453, "global_step": 158485, "epoch": 1909} {"train_loss": -23.235126495361328, "global_step": 158486, "epoch": 1909} {"train_loss": -23.35829734802246, "global_step": 158487, "epoch": 1909} {"train_loss": -23.751022338867188, "global_step": 158488, "epoch": 1909} {"train_loss": -23.180572509765625, "global_step": 158489, "epoch": 1909} {"train_loss": -23.79481315612793, "global_step": 158490, "epoch": 1909} {"train_loss": -23.866058349609375, "global_step": 158491, "epoch": 1909} {"train_loss": -23.110136032104492, "global_step": 158492, "epoch": 1909} {"train_loss": -23.37843894958496, "global_step": 158493, "epoch": 1909} {"train_loss": -22.891063690185547, "global_step": 158494, "epoch": 1909} {"train_loss": -22.8164119720459, "global_step": 158495, "epoch": 1909} {"train_loss": -23.142677307128906, "global_step": 158496, "epoch": 1909} {"train_loss": -22.605100631713867, "global_step": 158497, "epoch": 1909} {"train_loss": -23.549482345581055, "global_step": 158498, "epoch": 1909} {"train_loss": -22.91437339782715, "global_step": 158499, "epoch": 1909} {"train_loss": -22.708227157592773, "global_step": 158500, "epoch": 1909} {"train_loss": -23.137048721313477, "global_step": 158501, "epoch": 1909} {"train_loss": -23.195615768432617, "global_step": 158502, "epoch": 1909} {"train_loss": -23.201745986938477, "global_step": 158503, "epoch": 1909} {"train_loss": -23.330202102661133, "global_step": 158504, "epoch": 1909} {"train_loss": -23.333908081054688, "global_step": 158505, "epoch": 1909} {"train_loss": -23.455066680908203, "global_step": 158506, "epoch": 1909} {"train_loss": -23.542804718017578, "global_step": 158507, "epoch": 1909} {"train_loss": -23.337736129760742, "global_step": 158508, "epoch": 1909} {"train_loss": -23.19488525390625, "global_step": 158509, "epoch": 1909} {"train_loss": -23.622669219970703, "global_step": 158510, "epoch": 1909} {"train_loss": -23.654769897460938, "global_step": 158511, "epoch": 1909} {"train_loss": -23.40689468383789, "global_step": 158512, "epoch": 1909} {"train_loss": -23.770057678222656, "global_step": 158513, "epoch": 1909} {"train_loss": -23.352170944213867, "global_step": 158514, "epoch": 1909} {"train_loss": -23.422149658203125, "global_step": 158515, "epoch": 1909} {"train_loss": -23.45160675048828, "global_step": 158516, "epoch": 1909} {"train_loss": -23.597593307495117, "global_step": 158517, "epoch": 1909} {"train_loss": -23.15851593017578, "global_step": 158518, "epoch": 1909} {"train_loss": -23.52475929260254, "global_step": 158519, "epoch": 1909} {"train_loss": -23.79366111755371, "global_step": 158520, "epoch": 1909} {"train_loss": -23.467065811157227, "global_step": 158521, "epoch": 1909} {"train_loss": -23.701841354370117, "global_step": 158522, "epoch": 1909} {"train_loss": -23.588037490844727, "global_step": 158523, "epoch": 1909} {"train_loss": -23.19874382019043, "global_step": 158524, "epoch": 1909} {"train_loss": -23.60628318786621, "global_step": 158525, "epoch": 1909} {"train_loss": -23.945096969604492, "global_step": 158526, "epoch": 1909} {"train_loss": -23.526533126831055, "global_step": 158527, "epoch": 1909} {"train_loss": -23.42070770263672, "global_step": 158528, "epoch": 1909} {"train_loss": -23.363728580704656, "global_step": 158529, "epoch": 1909, "val_loss": 6339808.0} {"train_loss": -21.606721878051758, "global_step": 158530, "epoch": 1910} {"train_loss": -22.93100929260254, "global_step": 158531, "epoch": 1910} {"train_loss": -22.209096908569336, "global_step": 158532, "epoch": 1910} {"train_loss": -22.442424774169922, "global_step": 158533, "epoch": 1910} {"train_loss": -22.508893966674805, "global_step": 158534, "epoch": 1910} {"train_loss": -22.4873046875, "global_step": 158535, "epoch": 1910} {"train_loss": -22.557998657226562, "global_step": 158536, "epoch": 1910} {"train_loss": -22.844646453857422, "global_step": 158537, "epoch": 1910} {"train_loss": -22.462295532226562, "global_step": 158538, "epoch": 1910} {"train_loss": -22.726520538330078, "global_step": 158539, "epoch": 1910} {"train_loss": -22.7171688079834, "global_step": 158540, "epoch": 1910} {"train_loss": -22.563575744628906, "global_step": 158541, "epoch": 1910} {"train_loss": -22.7275390625, "global_step": 158542, "epoch": 1910} {"train_loss": -22.7666072845459, "global_step": 158543, "epoch": 1910} {"train_loss": -22.5488224029541, "global_step": 158544, "epoch": 1910} {"train_loss": -23.20440101623535, "global_step": 158545, "epoch": 1910} {"train_loss": -22.759611129760742, "global_step": 158546, "epoch": 1910} {"train_loss": -23.050100326538086, "global_step": 158547, "epoch": 1910} {"train_loss": -22.950828552246094, "global_step": 158548, "epoch": 1910} {"train_loss": -22.983102798461914, "global_step": 158549, "epoch": 1910} {"train_loss": -23.021379470825195, "global_step": 158550, "epoch": 1910} {"train_loss": -23.372417449951172, "global_step": 158551, "epoch": 1910} {"train_loss": -23.07352066040039, "global_step": 158552, "epoch": 1910} {"train_loss": -23.000202178955078, "global_step": 158553, "epoch": 1910} {"train_loss": -23.198379516601562, "global_step": 158554, "epoch": 1910} {"train_loss": -22.761526107788086, "global_step": 158555, "epoch": 1910} {"train_loss": -23.226173400878906, "global_step": 158556, "epoch": 1910} {"train_loss": -22.93130874633789, "global_step": 158557, "epoch": 1910} {"train_loss": -23.492395401000977, "global_step": 158558, "epoch": 1910} {"train_loss": -23.39507484436035, "global_step": 158559, "epoch": 1910} {"train_loss": -23.497644424438477, "global_step": 158560, "epoch": 1910} {"train_loss": -23.345922470092773, "global_step": 158561, "epoch": 1910} {"train_loss": -23.204742431640625, "global_step": 158562, "epoch": 1910} {"train_loss": -23.153907775878906, "global_step": 158563, "epoch": 1910} {"train_loss": -23.442853927612305, "global_step": 158564, "epoch": 1910} {"train_loss": -23.47348403930664, "global_step": 158565, "epoch": 1910} {"train_loss": -23.599706649780273, "global_step": 158566, "epoch": 1910} {"train_loss": -23.260313034057617, "global_step": 158567, "epoch": 1910} {"train_loss": -23.25032615661621, "global_step": 158568, "epoch": 1910} {"train_loss": -23.48357391357422, "global_step": 158569, "epoch": 1910} {"train_loss": -23.30191421508789, "global_step": 158570, "epoch": 1910} {"train_loss": -23.532459259033203, "global_step": 158571, "epoch": 1910} {"train_loss": -23.498605728149414, "global_step": 158572, "epoch": 1910} {"train_loss": -23.253705978393555, "global_step": 158573, "epoch": 1910} {"train_loss": -23.384765625, "global_step": 158574, "epoch": 1910} {"train_loss": -23.414644241333008, "global_step": 158575, "epoch": 1910} {"train_loss": -23.054737091064453, "global_step": 158576, "epoch": 1910} {"train_loss": -23.278337478637695, "global_step": 158577, "epoch": 1910} {"train_loss": -23.496829986572266, "global_step": 158578, "epoch": 1910} {"train_loss": -23.579832077026367, "global_step": 158579, "epoch": 1910} {"train_loss": -23.596847534179688, "global_step": 158580, "epoch": 1910} {"train_loss": -23.2088565826416, "global_step": 158581, "epoch": 1910} {"train_loss": -23.5642147064209, "global_step": 158582, "epoch": 1910} {"train_loss": -23.433963775634766, "global_step": 158583, "epoch": 1910} {"train_loss": -23.750102996826172, "global_step": 158584, "epoch": 1910} {"train_loss": -23.461660385131836, "global_step": 158585, "epoch": 1910} {"train_loss": -23.462181091308594, "global_step": 158586, "epoch": 1910} {"train_loss": -23.55976676940918, "global_step": 158587, "epoch": 1910} {"train_loss": -23.653575897216797, "global_step": 158588, "epoch": 1910} {"train_loss": -23.578083038330078, "global_step": 158589, "epoch": 1910} {"train_loss": -23.656553268432617, "global_step": 158590, "epoch": 1910} {"train_loss": -23.671289443969727, "global_step": 158591, "epoch": 1910} {"train_loss": -23.589656829833984, "global_step": 158592, "epoch": 1910} {"train_loss": -23.6099796295166, "global_step": 158593, "epoch": 1910} {"train_loss": -23.71408462524414, "global_step": 158594, "epoch": 1910} {"train_loss": -23.321563720703125, "global_step": 158595, "epoch": 1910} {"train_loss": -23.374067306518555, "global_step": 158596, "epoch": 1910} {"train_loss": -23.609577178955078, "global_step": 158597, "epoch": 1910} {"train_loss": -23.689138412475586, "global_step": 158598, "epoch": 1910} {"train_loss": -23.526519775390625, "global_step": 158599, "epoch": 1910} {"train_loss": -23.74443244934082, "global_step": 158600, "epoch": 1910} {"train_loss": -23.271839141845703, "global_step": 158601, "epoch": 1910} {"train_loss": -23.440404891967773, "global_step": 158602, "epoch": 1910} {"train_loss": -23.33582878112793, "global_step": 158603, "epoch": 1910} {"train_loss": -23.70488929748535, "global_step": 158604, "epoch": 1910} {"train_loss": -23.648483276367188, "global_step": 158605, "epoch": 1910} {"train_loss": -23.61732292175293, "global_step": 158606, "epoch": 1910} {"train_loss": -23.73352813720703, "global_step": 158607, "epoch": 1910} {"train_loss": -23.065048217773438, "global_step": 158608, "epoch": 1910} {"train_loss": -23.511293411254883, "global_step": 158609, "epoch": 1910} {"train_loss": -23.30303382873535, "global_step": 158610, "epoch": 1910} {"train_loss": -23.169294357299805, "global_step": 158611, "epoch": 1910} {"train_loss": -23.234761984951525, "global_step": 158612, "epoch": 1910, "val_loss": 6353145.5} {"train_loss": -22.332773208618164, "global_step": 158613, "epoch": 1911} {"train_loss": -22.271451950073242, "global_step": 158614, "epoch": 1911} {"train_loss": -23.008316040039062, "global_step": 158615, "epoch": 1911} {"train_loss": -22.743579864501953, "global_step": 158616, "epoch": 1911} {"train_loss": -23.060489654541016, "global_step": 158617, "epoch": 1911} {"train_loss": -22.99690818786621, "global_step": 158618, "epoch": 1911} {"train_loss": -22.932462692260742, "global_step": 158619, "epoch": 1911} {"train_loss": -23.115196228027344, "global_step": 158620, "epoch": 1911} {"train_loss": -23.15645980834961, "global_step": 158621, "epoch": 1911} {"train_loss": -23.07892608642578, "global_step": 158622, "epoch": 1911} {"train_loss": -23.453136444091797, "global_step": 158623, "epoch": 1911} {"train_loss": -23.201828002929688, "global_step": 158624, "epoch": 1911} {"train_loss": -23.318979263305664, "global_step": 158625, "epoch": 1911} {"train_loss": -23.214040756225586, "global_step": 158626, "epoch": 1911} {"train_loss": -23.45724105834961, "global_step": 158627, "epoch": 1911} {"train_loss": -22.92038345336914, "global_step": 158628, "epoch": 1911} {"train_loss": -23.121870040893555, "global_step": 158629, "epoch": 1911} {"train_loss": -23.51283073425293, "global_step": 158630, "epoch": 1911} {"train_loss": -23.311960220336914, "global_step": 158631, "epoch": 1911} {"train_loss": -23.203577041625977, "global_step": 158632, "epoch": 1911} {"train_loss": -23.655759811401367, "global_step": 158633, "epoch": 1911} {"train_loss": -23.632587432861328, "global_step": 158634, "epoch": 1911} {"train_loss": -23.590885162353516, "global_step": 158635, "epoch": 1911} {"train_loss": -23.368486404418945, "global_step": 158636, "epoch": 1911} {"train_loss": -23.347875595092773, "global_step": 158637, "epoch": 1911} {"train_loss": -23.162389755249023, "global_step": 158638, "epoch": 1911} {"train_loss": -23.37381935119629, "global_step": 158639, "epoch": 1911} {"train_loss": -23.6823787689209, "global_step": 158640, "epoch": 1911} {"train_loss": -23.611745834350586, "global_step": 158641, "epoch": 1911} {"train_loss": -23.66788101196289, "global_step": 158642, "epoch": 1911} {"train_loss": -23.51217269897461, "global_step": 158643, "epoch": 1911} {"train_loss": -23.772733688354492, "global_step": 158644, "epoch": 1911} {"train_loss": -23.769702911376953, "global_step": 158645, "epoch": 1911} {"train_loss": -23.335519790649414, "global_step": 158646, "epoch": 1911} {"train_loss": -23.502975463867188, "global_step": 158647, "epoch": 1911} {"train_loss": -23.335378646850586, "global_step": 158648, "epoch": 1911} {"train_loss": -23.560827255249023, "global_step": 158649, "epoch": 1911} {"train_loss": -23.221038818359375, "global_step": 158650, "epoch": 1911} {"train_loss": -23.38001251220703, "global_step": 158651, "epoch": 1911} {"train_loss": -23.580093383789062, "global_step": 158652, "epoch": 1911} {"train_loss": -23.242273330688477, "global_step": 158653, "epoch": 1911} {"train_loss": -23.353046417236328, "global_step": 158654, "epoch": 1911} {"train_loss": -23.7174015045166, "global_step": 158655, "epoch": 1911} {"train_loss": -23.5790958404541, "global_step": 158656, "epoch": 1911} {"train_loss": -23.086017608642578, "global_step": 158657, "epoch": 1911} {"train_loss": -23.50686264038086, "global_step": 158658, "epoch": 1911} {"train_loss": -23.241621017456055, "global_step": 158659, "epoch": 1911} {"train_loss": -23.7576961517334, "global_step": 158660, "epoch": 1911} {"train_loss": -23.61469268798828, "global_step": 158661, "epoch": 1911} {"train_loss": -23.52997398376465, "global_step": 158662, "epoch": 1911} {"train_loss": -23.392072677612305, "global_step": 158663, "epoch": 1911} {"train_loss": -23.62710189819336, "global_step": 158664, "epoch": 1911} {"train_loss": -23.662494659423828, "global_step": 158665, "epoch": 1911} {"train_loss": -23.308032989501953, "global_step": 158666, "epoch": 1911} {"train_loss": -23.523086547851562, "global_step": 158667, "epoch": 1911} {"train_loss": -23.789838790893555, "global_step": 158668, "epoch": 1911} {"train_loss": -23.729206085205078, "global_step": 158669, "epoch": 1911} {"train_loss": -23.45990562438965, "global_step": 158670, "epoch": 1911} {"train_loss": -23.57387924194336, "global_step": 158671, "epoch": 1911} {"train_loss": -23.23893165588379, "global_step": 158672, "epoch": 1911} {"train_loss": -23.69402503967285, "global_step": 158673, "epoch": 1911} {"train_loss": -23.62306022644043, "global_step": 158674, "epoch": 1911} {"train_loss": -23.636167526245117, "global_step": 158675, "epoch": 1911} {"train_loss": -23.543567657470703, "global_step": 158676, "epoch": 1911} {"train_loss": -23.372163772583008, "global_step": 158677, "epoch": 1911} {"train_loss": -23.687259674072266, "global_step": 158678, "epoch": 1911} {"train_loss": -23.467121124267578, "global_step": 158679, "epoch": 1911} {"train_loss": -23.44597053527832, "global_step": 158680, "epoch": 1911} {"train_loss": -23.27095603942871, "global_step": 158681, "epoch": 1911} {"train_loss": -23.142627716064453, "global_step": 158682, "epoch": 1911} {"train_loss": -23.16816520690918, "global_step": 158683, "epoch": 1911} {"train_loss": -23.191370010375977, "global_step": 158684, "epoch": 1911} {"train_loss": -23.448278427124023, "global_step": 158685, "epoch": 1911} {"train_loss": -23.49234962463379, "global_step": 158686, "epoch": 1911} {"train_loss": -23.557287216186523, "global_step": 158687, "epoch": 1911} {"train_loss": -23.076993942260742, "global_step": 158688, "epoch": 1911} {"train_loss": -23.873323440551758, "global_step": 158689, "epoch": 1911} {"train_loss": -23.183488845825195, "global_step": 158690, "epoch": 1911} {"train_loss": -23.495641708374023, "global_step": 158691, "epoch": 1911} {"train_loss": -23.332962036132812, "global_step": 158692, "epoch": 1911} {"train_loss": -23.209543228149414, "global_step": 158693, "epoch": 1911} {"train_loss": -23.0047664642334, "global_step": 158694, "epoch": 1911} {"train_loss": -23.391653750316205, "global_step": 158695, "epoch": 1911, "val_loss": 6370718.0} {"train_loss": -22.24501609802246, "global_step": 158696, "epoch": 1912} {"train_loss": -22.639671325683594, "global_step": 158697, "epoch": 1912} {"train_loss": -22.313480377197266, "global_step": 158698, "epoch": 1912} {"train_loss": -23.18366813659668, "global_step": 158699, "epoch": 1912} {"train_loss": -22.430133819580078, "global_step": 158700, "epoch": 1912} {"train_loss": -22.84586524963379, "global_step": 158701, "epoch": 1912} {"train_loss": -22.976282119750977, "global_step": 158702, "epoch": 1912} {"train_loss": -22.904184341430664, "global_step": 158703, "epoch": 1912} {"train_loss": -22.555784225463867, "global_step": 158704, "epoch": 1912} {"train_loss": -23.097095489501953, "global_step": 158705, "epoch": 1912} {"train_loss": -23.28464126586914, "global_step": 158706, "epoch": 1912} {"train_loss": -22.567819595336914, "global_step": 158707, "epoch": 1912} {"train_loss": -23.223493576049805, "global_step": 158708, "epoch": 1912} {"train_loss": -23.2587890625, "global_step": 158709, "epoch": 1912} {"train_loss": -23.214658737182617, "global_step": 158710, "epoch": 1912} {"train_loss": -22.928632736206055, "global_step": 158711, "epoch": 1912} {"train_loss": -22.959562301635742, "global_step": 158712, "epoch": 1912} {"train_loss": -23.251102447509766, "global_step": 158713, "epoch": 1912} {"train_loss": -23.11991310119629, "global_step": 158714, "epoch": 1912} {"train_loss": -23.249914169311523, "global_step": 158715, "epoch": 1912} {"train_loss": -23.274991989135742, "global_step": 158716, "epoch": 1912} {"train_loss": -23.45585060119629, "global_step": 158717, "epoch": 1912} {"train_loss": -23.84139060974121, "global_step": 158718, "epoch": 1912} {"train_loss": -23.451738357543945, "global_step": 158719, "epoch": 1912} {"train_loss": -23.42782974243164, "global_step": 158720, "epoch": 1912} {"train_loss": -23.084821701049805, "global_step": 158721, "epoch": 1912} {"train_loss": -23.087202072143555, "global_step": 158722, "epoch": 1912} {"train_loss": -23.197362899780273, "global_step": 158723, "epoch": 1912} {"train_loss": -23.17535400390625, "global_step": 158724, "epoch": 1912} {"train_loss": -23.329694747924805, "global_step": 158725, "epoch": 1912} {"train_loss": -23.526288986206055, "global_step": 158726, "epoch": 1912} {"train_loss": -23.389678955078125, "global_step": 158727, "epoch": 1912} {"train_loss": -23.506244659423828, "global_step": 158728, "epoch": 1912} {"train_loss": -23.520227432250977, "global_step": 158729, "epoch": 1912} {"train_loss": -23.59261703491211, "global_step": 158730, "epoch": 1912} {"train_loss": -23.3254451751709, "global_step": 158731, "epoch": 1912} {"train_loss": -23.52641487121582, "global_step": 158732, "epoch": 1912} {"train_loss": -23.672468185424805, "global_step": 158733, "epoch": 1912} {"train_loss": -23.508386611938477, "global_step": 158734, "epoch": 1912} {"train_loss": -23.494909286499023, "global_step": 158735, "epoch": 1912} {"train_loss": -23.230310440063477, "global_step": 158736, "epoch": 1912} {"train_loss": -23.211530685424805, "global_step": 158737, "epoch": 1912} {"train_loss": -23.614486694335938, "global_step": 158738, "epoch": 1912} {"train_loss": -23.96376609802246, "global_step": 158739, "epoch": 1912} {"train_loss": -23.581815719604492, "global_step": 158740, "epoch": 1912} {"train_loss": -23.428030014038086, "global_step": 158741, "epoch": 1912} {"train_loss": -23.619070053100586, "global_step": 158742, "epoch": 1912} {"train_loss": -23.576759338378906, "global_step": 158743, "epoch": 1912} {"train_loss": -23.64044952392578, "global_step": 158744, "epoch": 1912} {"train_loss": -23.760488510131836, "global_step": 158745, "epoch": 1912} {"train_loss": -23.2470703125, "global_step": 158746, "epoch": 1912} {"train_loss": -23.26484489440918, "global_step": 158747, "epoch": 1912} {"train_loss": -23.517528533935547, "global_step": 158748, "epoch": 1912} {"train_loss": -23.542400360107422, "global_step": 158749, "epoch": 1912} {"train_loss": -23.870441436767578, "global_step": 158750, "epoch": 1912} {"train_loss": -23.387481689453125, "global_step": 158751, "epoch": 1912} {"train_loss": -23.659631729125977, "global_step": 158752, "epoch": 1912} {"train_loss": -23.687650680541992, "global_step": 158753, "epoch": 1912} {"train_loss": -23.616792678833008, "global_step": 158754, "epoch": 1912} {"train_loss": -23.804275512695312, "global_step": 158755, "epoch": 1912} {"train_loss": -23.773141860961914, "global_step": 158756, "epoch": 1912} {"train_loss": -23.239957809448242, "global_step": 158757, "epoch": 1912} {"train_loss": -23.289764404296875, "global_step": 158758, "epoch": 1912} {"train_loss": -23.082197189331055, "global_step": 158759, "epoch": 1912} {"train_loss": -23.22205924987793, "global_step": 158760, "epoch": 1912} {"train_loss": -22.71583366394043, "global_step": 158761, "epoch": 1912} {"train_loss": -22.7448787689209, "global_step": 158762, "epoch": 1912} {"train_loss": -23.386564254760742, "global_step": 158763, "epoch": 1912} {"train_loss": -23.30912208557129, "global_step": 158764, "epoch": 1912} {"train_loss": -23.583372116088867, "global_step": 158765, "epoch": 1912} {"train_loss": -23.32493019104004, "global_step": 158766, "epoch": 1912} {"train_loss": -23.50945472717285, "global_step": 158767, "epoch": 1912} {"train_loss": -23.010229110717773, "global_step": 158768, "epoch": 1912} {"train_loss": -22.74191665649414, "global_step": 158769, "epoch": 1912} {"train_loss": -23.198375701904297, "global_step": 158770, "epoch": 1912} {"train_loss": -23.119413375854492, "global_step": 158771, "epoch": 1912} {"train_loss": -23.166641235351562, "global_step": 158772, "epoch": 1912} {"train_loss": -23.302019119262695, "global_step": 158773, "epoch": 1912} {"train_loss": -23.109098434448242, "global_step": 158774, "epoch": 1912} {"train_loss": -23.645803451538086, "global_step": 158775, "epoch": 1912} {"train_loss": -23.068174362182617, "global_step": 158776, "epoch": 1912} {"train_loss": -23.45756721496582, "global_step": 158777, "epoch": 1912} {"train_loss": -23.27457372826266, "global_step": 158778, "epoch": 1912, "val_loss": 6239151.0} {"train_loss": -22.79096794128418, "global_step": 158779, "epoch": 1913} {"train_loss": -22.772306442260742, "global_step": 158780, "epoch": 1913} {"train_loss": -22.873889923095703, "global_step": 158781, "epoch": 1913} {"train_loss": -22.584848403930664, "global_step": 158782, "epoch": 1913} {"train_loss": -23.215641021728516, "global_step": 158783, "epoch": 1913} {"train_loss": -22.809864044189453, "global_step": 158784, "epoch": 1913} {"train_loss": -22.750293731689453, "global_step": 158785, "epoch": 1913} {"train_loss": -22.965225219726562, "global_step": 158786, "epoch": 1913} {"train_loss": -22.943944931030273, "global_step": 158787, "epoch": 1913} {"train_loss": -23.1862850189209, "global_step": 158788, "epoch": 1913} {"train_loss": -22.848562240600586, "global_step": 158789, "epoch": 1913} {"train_loss": -23.237442016601562, "global_step": 158790, "epoch": 1913} {"train_loss": -23.552703857421875, "global_step": 158791, "epoch": 1913} {"train_loss": -23.407928466796875, "global_step": 158792, "epoch": 1913} {"train_loss": -23.290069580078125, "global_step": 158793, "epoch": 1913} {"train_loss": -23.338224411010742, "global_step": 158794, "epoch": 1913} {"train_loss": -23.2156982421875, "global_step": 158795, "epoch": 1913} {"train_loss": -23.13596534729004, "global_step": 158796, "epoch": 1913} {"train_loss": -23.5614070892334, "global_step": 158797, "epoch": 1913} {"train_loss": -23.04430389404297, "global_step": 158798, "epoch": 1913} {"train_loss": -23.460874557495117, "global_step": 158799, "epoch": 1913} {"train_loss": -23.34385108947754, "global_step": 158800, "epoch": 1913} {"train_loss": -23.66041374206543, "global_step": 158801, "epoch": 1913} {"train_loss": -23.22617530822754, "global_step": 158802, "epoch": 1913} {"train_loss": -23.284317016601562, "global_step": 158803, "epoch": 1913} {"train_loss": -23.704593658447266, "global_step": 158804, "epoch": 1913} {"train_loss": -23.641841888427734, "global_step": 158805, "epoch": 1913} {"train_loss": -23.470592498779297, "global_step": 158806, "epoch": 1913} {"train_loss": -23.676015853881836, "global_step": 158807, "epoch": 1913} {"train_loss": -23.582965850830078, "global_step": 158808, "epoch": 1913} {"train_loss": -23.669546127319336, "global_step": 158809, "epoch": 1913} {"train_loss": -23.73438835144043, "global_step": 158810, "epoch": 1913} {"train_loss": -23.420406341552734, "global_step": 158811, "epoch": 1913} {"train_loss": -23.5042724609375, "global_step": 158812, "epoch": 1913} {"train_loss": -23.364927291870117, "global_step": 158813, "epoch": 1913} {"train_loss": -23.817182540893555, "global_step": 158814, "epoch": 1913} {"train_loss": -23.618635177612305, "global_step": 158815, "epoch": 1913} {"train_loss": -23.235260009765625, "global_step": 158816, "epoch": 1913} {"train_loss": -23.326566696166992, "global_step": 158817, "epoch": 1913} {"train_loss": -23.429792404174805, "global_step": 158818, "epoch": 1913} {"train_loss": -23.826339721679688, "global_step": 158819, "epoch": 1913} {"train_loss": -23.372739791870117, "global_step": 158820, "epoch": 1913} {"train_loss": -23.331012725830078, "global_step": 158821, "epoch": 1913} {"train_loss": -22.97822380065918, "global_step": 158822, "epoch": 1913} {"train_loss": -23.537700653076172, "global_step": 158823, "epoch": 1913} {"train_loss": -23.265554428100586, "global_step": 158824, "epoch": 1913} {"train_loss": -23.23402976989746, "global_step": 158825, "epoch": 1913} {"train_loss": -23.074560165405273, "global_step": 158826, "epoch": 1913} {"train_loss": -23.129348754882812, "global_step": 158827, "epoch": 1913} {"train_loss": -23.678319931030273, "global_step": 158828, "epoch": 1913} {"train_loss": -23.390966415405273, "global_step": 158829, "epoch": 1913} {"train_loss": -23.364398956298828, "global_step": 158830, "epoch": 1913} {"train_loss": -23.69757652282715, "global_step": 158831, "epoch": 1913} {"train_loss": -23.263471603393555, "global_step": 158832, "epoch": 1913} {"train_loss": -23.219970703125, "global_step": 158833, "epoch": 1913} {"train_loss": -23.486818313598633, "global_step": 158834, "epoch": 1913} {"train_loss": -23.24278450012207, "global_step": 158835, "epoch": 1913} {"train_loss": -23.66645622253418, "global_step": 158836, "epoch": 1913} {"train_loss": -23.183198928833008, "global_step": 158837, "epoch": 1913} {"train_loss": -23.640880584716797, "global_step": 158838, "epoch": 1913} {"train_loss": -23.419097900390625, "global_step": 158839, "epoch": 1913} {"train_loss": -24.040414810180664, "global_step": 158840, "epoch": 1913} {"train_loss": -23.312604904174805, "global_step": 158841, "epoch": 1913} {"train_loss": -23.589338302612305, "global_step": 158842, "epoch": 1913} {"train_loss": -23.50324821472168, "global_step": 158843, "epoch": 1913} {"train_loss": -23.717103958129883, "global_step": 158844, "epoch": 1913} {"train_loss": -23.49350357055664, "global_step": 158845, "epoch": 1913} {"train_loss": -23.349332809448242, "global_step": 158846, "epoch": 1913} {"train_loss": -23.535085678100586, "global_step": 158847, "epoch": 1913} {"train_loss": -23.363401412963867, "global_step": 158848, "epoch": 1913} {"train_loss": -23.370943069458008, "global_step": 158849, "epoch": 1913} {"train_loss": -23.969396591186523, "global_step": 158850, "epoch": 1913} {"train_loss": -23.645204544067383, "global_step": 158851, "epoch": 1913} {"train_loss": -23.361814498901367, "global_step": 158852, "epoch": 1913} {"train_loss": -23.60773277282715, "global_step": 158853, "epoch": 1913} {"train_loss": -23.74947166442871, "global_step": 158854, "epoch": 1913} {"train_loss": -23.354028701782227, "global_step": 158855, "epoch": 1913} {"train_loss": -22.8017578125, "global_step": 158856, "epoch": 1913} {"train_loss": -23.252168655395508, "global_step": 158857, "epoch": 1913} {"train_loss": -23.643457412719727, "global_step": 158858, "epoch": 1913} {"train_loss": -23.412555694580078, "global_step": 158859, "epoch": 1913} {"train_loss": -23.30067253112793, "global_step": 158860, "epoch": 1913} {"train_loss": -23.3803705192474, "global_step": 158861, "epoch": 1913, "val_loss": 6380843.5} {"train_loss": -22.91397476196289, "global_step": 158862, "epoch": 1914} {"train_loss": -23.22919273376465, "global_step": 158863, "epoch": 1914} {"train_loss": -23.438053131103516, "global_step": 158864, "epoch": 1914} {"train_loss": -22.922815322875977, "global_step": 158865, "epoch": 1914} {"train_loss": -22.982566833496094, "global_step": 158866, "epoch": 1914} {"train_loss": -23.158496856689453, "global_step": 158867, "epoch": 1914} {"train_loss": -22.9644832611084, "global_step": 158868, "epoch": 1914} {"train_loss": -23.01393699645996, "global_step": 158869, "epoch": 1914} {"train_loss": -23.373029708862305, "global_step": 158870, "epoch": 1914} {"train_loss": -23.337053298950195, "global_step": 158871, "epoch": 1914} {"train_loss": -23.113452911376953, "global_step": 158872, "epoch": 1914} {"train_loss": -23.233016967773438, "global_step": 158873, "epoch": 1914} {"train_loss": -23.593778610229492, "global_step": 158874, "epoch": 1914} {"train_loss": -23.13435173034668, "global_step": 158875, "epoch": 1914} {"train_loss": -23.08547019958496, "global_step": 158876, "epoch": 1914} {"train_loss": -23.181127548217773, "global_step": 158877, "epoch": 1914} {"train_loss": -23.193294525146484, "global_step": 158878, "epoch": 1914} {"train_loss": -23.360332489013672, "global_step": 158879, "epoch": 1914} {"train_loss": -23.375991821289062, "global_step": 158880, "epoch": 1914} {"train_loss": -23.58991813659668, "global_step": 158881, "epoch": 1914} {"train_loss": -23.55194664001465, "global_step": 158882, "epoch": 1914} {"train_loss": -23.3950138092041, "global_step": 158883, "epoch": 1914} {"train_loss": -23.446613311767578, "global_step": 158884, "epoch": 1914} {"train_loss": -23.45585060119629, "global_step": 158885, "epoch": 1914} {"train_loss": -23.637670516967773, "global_step": 158886, "epoch": 1914} {"train_loss": -23.459491729736328, "global_step": 158887, "epoch": 1914} {"train_loss": -23.482948303222656, "global_step": 158888, "epoch": 1914} {"train_loss": -23.536386489868164, "global_step": 158889, "epoch": 1914} {"train_loss": -23.635032653808594, "global_step": 158890, "epoch": 1914} {"train_loss": -23.894065856933594, "global_step": 158891, "epoch": 1914} {"train_loss": -23.442625045776367, "global_step": 158892, "epoch": 1914} {"train_loss": -23.485414505004883, "global_step": 158893, "epoch": 1914} {"train_loss": -23.92658042907715, "global_step": 158894, "epoch": 1914} {"train_loss": -23.51177978515625, "global_step": 158895, "epoch": 1914} {"train_loss": -23.315954208374023, "global_step": 158896, "epoch": 1914} {"train_loss": -23.76990509033203, "global_step": 158897, "epoch": 1914} {"train_loss": -23.434837341308594, "global_step": 158898, "epoch": 1914} {"train_loss": -23.470731735229492, "global_step": 158899, "epoch": 1914} {"train_loss": -22.850248336791992, "global_step": 158900, "epoch": 1914} {"train_loss": -23.021406173706055, "global_step": 158901, "epoch": 1914} {"train_loss": -23.189311981201172, "global_step": 158902, "epoch": 1914} {"train_loss": -23.77326011657715, "global_step": 158903, "epoch": 1914} {"train_loss": -23.58739471435547, "global_step": 158904, "epoch": 1914} {"train_loss": -23.179433822631836, "global_step": 158905, "epoch": 1914} {"train_loss": -23.341665267944336, "global_step": 158906, "epoch": 1914} {"train_loss": -23.427597045898438, "global_step": 158907, "epoch": 1914} {"train_loss": -22.69785499572754, "global_step": 158908, "epoch": 1914} {"train_loss": -23.556299209594727, "global_step": 158909, "epoch": 1914} {"train_loss": -23.282638549804688, "global_step": 158910, "epoch": 1914} {"train_loss": -23.339208602905273, "global_step": 158911, "epoch": 1914} {"train_loss": -23.644424438476562, "global_step": 158912, "epoch": 1914} {"train_loss": -23.066457748413086, "global_step": 158913, "epoch": 1914} {"train_loss": -23.51692771911621, "global_step": 158914, "epoch": 1914} {"train_loss": -23.44598960876465, "global_step": 158915, "epoch": 1914} {"train_loss": -23.604074478149414, "global_step": 158916, "epoch": 1914} {"train_loss": -23.257572174072266, "global_step": 158917, "epoch": 1914} {"train_loss": -23.566532135009766, "global_step": 158918, "epoch": 1914} {"train_loss": -23.5078067779541, "global_step": 158919, "epoch": 1914} {"train_loss": -23.43047332763672, "global_step": 158920, "epoch": 1914} {"train_loss": -24.013463973999023, "global_step": 158921, "epoch": 1914} {"train_loss": -23.461172103881836, "global_step": 158922, "epoch": 1914} {"train_loss": -23.252317428588867, "global_step": 158923, "epoch": 1914} {"train_loss": -23.439495086669922, "global_step": 158924, "epoch": 1914} {"train_loss": -23.645601272583008, "global_step": 158925, "epoch": 1914} {"train_loss": -23.313491821289062, "global_step": 158926, "epoch": 1914} {"train_loss": -23.506711959838867, "global_step": 158927, "epoch": 1914} {"train_loss": -23.33627700805664, "global_step": 158928, "epoch": 1914} {"train_loss": -23.40996742248535, "global_step": 158929, "epoch": 1914} {"train_loss": -23.201480865478516, "global_step": 158930, "epoch": 1914} {"train_loss": -23.752729415893555, "global_step": 158931, "epoch": 1914} {"train_loss": -23.610797882080078, "global_step": 158932, "epoch": 1914} {"train_loss": -23.799732208251953, "global_step": 158933, "epoch": 1914} {"train_loss": -23.427276611328125, "global_step": 158934, "epoch": 1914} {"train_loss": -23.039541244506836, "global_step": 158935, "epoch": 1914} {"train_loss": -23.311182022094727, "global_step": 158936, "epoch": 1914} {"train_loss": -23.51711654663086, "global_step": 158937, "epoch": 1914} {"train_loss": -23.593124389648438, "global_step": 158938, "epoch": 1914} {"train_loss": -23.829504013061523, "global_step": 158939, "epoch": 1914} {"train_loss": -23.443504333496094, "global_step": 158940, "epoch": 1914} {"train_loss": -23.425556182861328, "global_step": 158941, "epoch": 1914} {"train_loss": -23.640451431274414, "global_step": 158942, "epoch": 1914} {"train_loss": -23.876209259033203, "global_step": 158943, "epoch": 1914} {"train_loss": -23.39613742138966, "global_step": 158944, "epoch": 1914, "val_loss": 6399710.5} {"train_loss": -22.895788192749023, "global_step": 158945, "epoch": 1915} {"train_loss": -23.214691162109375, "global_step": 158946, "epoch": 1915} {"train_loss": -22.849266052246094, "global_step": 158947, "epoch": 1915} {"train_loss": -22.989439010620117, "global_step": 158948, "epoch": 1915} {"train_loss": -23.288986206054688, "global_step": 158949, "epoch": 1915} {"train_loss": -23.22365379333496, "global_step": 158950, "epoch": 1915} {"train_loss": -23.085599899291992, "global_step": 158951, "epoch": 1915} {"train_loss": -23.567138671875, "global_step": 158952, "epoch": 1915} {"train_loss": -23.332853317260742, "global_step": 158953, "epoch": 1915} {"train_loss": -23.49736213684082, "global_step": 158954, "epoch": 1915} {"train_loss": -22.882509231567383, "global_step": 158955, "epoch": 1915} {"train_loss": -23.003110885620117, "global_step": 158956, "epoch": 1915} {"train_loss": -23.409332275390625, "global_step": 158957, "epoch": 1915} {"train_loss": -23.334932327270508, "global_step": 158958, "epoch": 1915} {"train_loss": -23.07862663269043, "global_step": 158959, "epoch": 1915} {"train_loss": -23.05659294128418, "global_step": 158960, "epoch": 1915} {"train_loss": -23.45064353942871, "global_step": 158961, "epoch": 1915} {"train_loss": -23.228872299194336, "global_step": 158962, "epoch": 1915} {"train_loss": -23.287851333618164, "global_step": 158963, "epoch": 1915} {"train_loss": -23.340978622436523, "global_step": 158964, "epoch": 1915} {"train_loss": -23.506683349609375, "global_step": 158965, "epoch": 1915} {"train_loss": -23.453205108642578, "global_step": 158966, "epoch": 1915} {"train_loss": -22.998510360717773, "global_step": 158967, "epoch": 1915} {"train_loss": -23.320899963378906, "global_step": 158968, "epoch": 1915} {"train_loss": -23.496253967285156, "global_step": 158969, "epoch": 1915} {"train_loss": -23.29805564880371, "global_step": 158970, "epoch": 1915} {"train_loss": -23.86736488342285, "global_step": 158971, "epoch": 1915} {"train_loss": -23.350006103515625, "global_step": 158972, "epoch": 1915} {"train_loss": -23.227283477783203, "global_step": 158973, "epoch": 1915} {"train_loss": -23.478900909423828, "global_step": 158974, "epoch": 1915} {"train_loss": -23.393110275268555, "global_step": 158975, "epoch": 1915} {"train_loss": -23.51723289489746, "global_step": 158976, "epoch": 1915} {"train_loss": -23.557994842529297, "global_step": 158977, "epoch": 1915} {"train_loss": -23.393901824951172, "global_step": 158978, "epoch": 1915} {"train_loss": -23.6118106842041, "global_step": 158979, "epoch": 1915} {"train_loss": -23.409961700439453, "global_step": 158980, "epoch": 1915} {"train_loss": -23.54804801940918, "global_step": 158981, "epoch": 1915} {"train_loss": -23.700971603393555, "global_step": 158982, "epoch": 1915} {"train_loss": -23.596683502197266, "global_step": 158983, "epoch": 1915} {"train_loss": -23.55765724182129, "global_step": 158984, "epoch": 1915} {"train_loss": -23.42530632019043, "global_step": 158985, "epoch": 1915} {"train_loss": -23.400754928588867, "global_step": 158986, "epoch": 1915} {"train_loss": -23.408815383911133, "global_step": 158987, "epoch": 1915} {"train_loss": -23.36216926574707, "global_step": 158988, "epoch": 1915} {"train_loss": -23.692625045776367, "global_step": 158989, "epoch": 1915} {"train_loss": -23.28443717956543, "global_step": 158990, "epoch": 1915} {"train_loss": -23.534008026123047, "global_step": 158991, "epoch": 1915} {"train_loss": -23.23898696899414, "global_step": 158992, "epoch": 1915} {"train_loss": -23.599956512451172, "global_step": 158993, "epoch": 1915} {"train_loss": -23.6650333404541, "global_step": 158994, "epoch": 1915} {"train_loss": -23.277057647705078, "global_step": 158995, "epoch": 1915} {"train_loss": -23.601551055908203, "global_step": 158996, "epoch": 1915} {"train_loss": -23.262678146362305, "global_step": 158997, "epoch": 1915} {"train_loss": -23.32638931274414, "global_step": 158998, "epoch": 1915} {"train_loss": -23.56648063659668, "global_step": 158999, "epoch": 1915} {"train_loss": -23.354198455810547, "global_step": 159000, "epoch": 1915} {"train_loss": -23.58882713317871, "global_step": 159001, "epoch": 1915} {"train_loss": -23.389989852905273, "global_step": 159002, "epoch": 1915} {"train_loss": -23.26132583618164, "global_step": 159003, "epoch": 1915} {"train_loss": -23.80267906188965, "global_step": 159004, "epoch": 1915} {"train_loss": -23.22724723815918, "global_step": 159005, "epoch": 1915} {"train_loss": -23.660703659057617, "global_step": 159006, "epoch": 1915} {"train_loss": -23.174673080444336, "global_step": 159007, "epoch": 1915} {"train_loss": -24.12811279296875, "global_step": 159008, "epoch": 1915} {"train_loss": -23.44419288635254, "global_step": 159009, "epoch": 1915} {"train_loss": -23.598005294799805, "global_step": 159010, "epoch": 1915} {"train_loss": -23.46260643005371, "global_step": 159011, "epoch": 1915} {"train_loss": -23.521596908569336, "global_step": 159012, "epoch": 1915} {"train_loss": -23.449514389038086, "global_step": 159013, "epoch": 1915} {"train_loss": -23.618732452392578, "global_step": 159014, "epoch": 1915} {"train_loss": -23.529661178588867, "global_step": 159015, "epoch": 1915} {"train_loss": -23.255064010620117, "global_step": 159016, "epoch": 1915} {"train_loss": -23.74519157409668, "global_step": 159017, "epoch": 1915} {"train_loss": -23.801694869995117, "global_step": 159018, "epoch": 1915} {"train_loss": -23.389734268188477, "global_step": 159019, "epoch": 1915} {"train_loss": -23.552631378173828, "global_step": 159020, "epoch": 1915} {"train_loss": -23.22083854675293, "global_step": 159021, "epoch": 1915} {"train_loss": -23.762014389038086, "global_step": 159022, "epoch": 1915} {"train_loss": -23.306203842163086, "global_step": 159023, "epoch": 1915} {"train_loss": -23.385332107543945, "global_step": 159024, "epoch": 1915} {"train_loss": -23.55990982055664, "global_step": 159025, "epoch": 1915} {"train_loss": -23.802322387695312, "global_step": 159026, "epoch": 1915} {"train_loss": -23.4005848987993, "global_step": 159027, "epoch": 1915, "val_loss": 6339599.0} {"train_loss": -21.586713790893555, "global_step": 159028, "epoch": 1916} {"train_loss": -22.555936813354492, "global_step": 159029, "epoch": 1916} {"train_loss": -22.94184684753418, "global_step": 159030, "epoch": 1916} {"train_loss": -22.478622436523438, "global_step": 159031, "epoch": 1916} {"train_loss": -22.444753646850586, "global_step": 159032, "epoch": 1916} {"train_loss": -22.781627655029297, "global_step": 159033, "epoch": 1916} {"train_loss": -22.745637893676758, "global_step": 159034, "epoch": 1916} {"train_loss": -22.634071350097656, "global_step": 159035, "epoch": 1916} {"train_loss": -22.357406616210938, "global_step": 159036, "epoch": 1916} {"train_loss": -23.31978416442871, "global_step": 159037, "epoch": 1916} {"train_loss": -22.870695114135742, "global_step": 159038, "epoch": 1916} {"train_loss": -23.284957885742188, "global_step": 159039, "epoch": 1916} {"train_loss": -23.185041427612305, "global_step": 159040, "epoch": 1916} {"train_loss": -23.19584083557129, "global_step": 159041, "epoch": 1916} {"train_loss": -23.02910614013672, "global_step": 159042, "epoch": 1916} {"train_loss": -23.172948837280273, "global_step": 159043, "epoch": 1916} {"train_loss": -23.149791717529297, "global_step": 159044, "epoch": 1916} {"train_loss": -23.069887161254883, "global_step": 159045, "epoch": 1916} {"train_loss": -23.044902801513672, "global_step": 159046, "epoch": 1916} {"train_loss": -23.470582962036133, "global_step": 159047, "epoch": 1916} {"train_loss": -23.329389572143555, "global_step": 159048, "epoch": 1916} {"train_loss": -23.331512451171875, "global_step": 159049, "epoch": 1916} {"train_loss": -23.07453155517578, "global_step": 159050, "epoch": 1916} {"train_loss": -23.611234664916992, "global_step": 159051, "epoch": 1916} {"train_loss": -23.506261825561523, "global_step": 159052, "epoch": 1916} {"train_loss": -23.692956924438477, "global_step": 159053, "epoch": 1916} {"train_loss": -23.10969352722168, "global_step": 159054, "epoch": 1916} {"train_loss": -23.530385971069336, "global_step": 159055, "epoch": 1916} {"train_loss": -23.765897750854492, "global_step": 159056, "epoch": 1916} {"train_loss": -23.49521255493164, "global_step": 159057, "epoch": 1916} {"train_loss": -23.496929168701172, "global_step": 159058, "epoch": 1916} {"train_loss": -23.743167877197266, "global_step": 159059, "epoch": 1916} {"train_loss": -23.545913696289062, "global_step": 159060, "epoch": 1916} {"train_loss": -23.590675354003906, "global_step": 159061, "epoch": 1916} {"train_loss": -23.555917739868164, "global_step": 159062, "epoch": 1916} {"train_loss": -23.687164306640625, "global_step": 159063, "epoch": 1916} {"train_loss": -23.378273010253906, "global_step": 159064, "epoch": 1916} {"train_loss": -23.863981246948242, "global_step": 159065, "epoch": 1916} {"train_loss": -23.883420944213867, "global_step": 159066, "epoch": 1916} {"train_loss": -23.353256225585938, "global_step": 159067, "epoch": 1916} {"train_loss": -23.556745529174805, "global_step": 159068, "epoch": 1916} {"train_loss": -23.019941329956055, "global_step": 159069, "epoch": 1916} {"train_loss": -23.666772842407227, "global_step": 159070, "epoch": 1916} {"train_loss": -23.38886070251465, "global_step": 159071, "epoch": 1916} {"train_loss": -23.691221237182617, "global_step": 159072, "epoch": 1916} {"train_loss": -23.425161361694336, "global_step": 159073, "epoch": 1916} {"train_loss": -23.340490341186523, "global_step": 159074, "epoch": 1916} {"train_loss": -23.72950553894043, "global_step": 159075, "epoch": 1916} {"train_loss": -23.289058685302734, "global_step": 159076, "epoch": 1916} {"train_loss": -23.341129302978516, "global_step": 159077, "epoch": 1916} {"train_loss": -23.566387176513672, "global_step": 159078, "epoch": 1916} {"train_loss": -23.26811408996582, "global_step": 159079, "epoch": 1916} {"train_loss": -23.915761947631836, "global_step": 159080, "epoch": 1916} {"train_loss": -23.202993392944336, "global_step": 159081, "epoch": 1916} {"train_loss": -23.65970230102539, "global_step": 159082, "epoch": 1916} {"train_loss": -23.72478675842285, "global_step": 159083, "epoch": 1916} {"train_loss": -23.480566024780273, "global_step": 159084, "epoch": 1916} {"train_loss": -23.574630737304688, "global_step": 159085, "epoch": 1916} {"train_loss": -23.33479881286621, "global_step": 159086, "epoch": 1916} {"train_loss": -24.098045349121094, "global_step": 159087, "epoch": 1916} {"train_loss": -23.149816513061523, "global_step": 159088, "epoch": 1916} {"train_loss": -23.321149826049805, "global_step": 159089, "epoch": 1916} {"train_loss": -23.42008399963379, "global_step": 159090, "epoch": 1916} {"train_loss": -23.559192657470703, "global_step": 159091, "epoch": 1916} {"train_loss": -23.257553100585938, "global_step": 159092, "epoch": 1916} {"train_loss": -23.496105194091797, "global_step": 159093, "epoch": 1916} {"train_loss": -23.565610885620117, "global_step": 159094, "epoch": 1916} {"train_loss": -23.805768966674805, "global_step": 159095, "epoch": 1916} {"train_loss": -23.804655075073242, "global_step": 159096, "epoch": 1916} {"train_loss": -23.63543128967285, "global_step": 159097, "epoch": 1916} {"train_loss": -23.300085067749023, "global_step": 159098, "epoch": 1916} {"train_loss": -23.377859115600586, "global_step": 159099, "epoch": 1916} {"train_loss": -23.153532028198242, "global_step": 159100, "epoch": 1916} {"train_loss": -23.85820960998535, "global_step": 159101, "epoch": 1916} {"train_loss": -23.145755767822266, "global_step": 159102, "epoch": 1916} {"train_loss": -23.28502082824707, "global_step": 159103, "epoch": 1916} {"train_loss": -23.474878311157227, "global_step": 159104, "epoch": 1916} {"train_loss": -23.550647735595703, "global_step": 159105, "epoch": 1916} {"train_loss": -23.193389892578125, "global_step": 159106, "epoch": 1916} {"train_loss": -23.57210350036621, "global_step": 159107, "epoch": 1916} {"train_loss": -23.735626220703125, "global_step": 159108, "epoch": 1916} {"train_loss": -23.56251335144043, "global_step": 159109, "epoch": 1916} {"train_loss": -23.336882097175323, "global_step": 159110, "epoch": 1916, "val_loss": 6401819.0} {"train_loss": -23.5527400970459, "global_step": 159111, "epoch": 1917} {"train_loss": -23.354806900024414, "global_step": 159112, "epoch": 1917} {"train_loss": -23.367719650268555, "global_step": 159113, "epoch": 1917} {"train_loss": -23.391050338745117, "global_step": 159114, "epoch": 1917} {"train_loss": -23.334556579589844, "global_step": 159115, "epoch": 1917} {"train_loss": -23.19571304321289, "global_step": 159116, "epoch": 1917} {"train_loss": -23.431303024291992, "global_step": 159117, "epoch": 1917} {"train_loss": -23.27320671081543, "global_step": 159118, "epoch": 1917} {"train_loss": -23.162527084350586, "global_step": 159119, "epoch": 1917} {"train_loss": -23.213525772094727, "global_step": 159120, "epoch": 1917} {"train_loss": -23.16776466369629, "global_step": 159121, "epoch": 1917} {"train_loss": -23.355131149291992, "global_step": 159122, "epoch": 1917} {"train_loss": -23.58522605895996, "global_step": 159123, "epoch": 1917} {"train_loss": -23.325363159179688, "global_step": 159124, "epoch": 1917} {"train_loss": -23.59821128845215, "global_step": 159125, "epoch": 1917} {"train_loss": -23.069929122924805, "global_step": 159126, "epoch": 1917} {"train_loss": -23.458728790283203, "global_step": 159127, "epoch": 1917} {"train_loss": -23.36411476135254, "global_step": 159128, "epoch": 1917} {"train_loss": -23.7063045501709, "global_step": 159129, "epoch": 1917} {"train_loss": -23.612041473388672, "global_step": 159130, "epoch": 1917} {"train_loss": -23.408329010009766, "global_step": 159131, "epoch": 1917} {"train_loss": -23.513906478881836, "global_step": 159132, "epoch": 1917} {"train_loss": -23.60316276550293, "global_step": 159133, "epoch": 1917} {"train_loss": -23.26310157775879, "global_step": 159134, "epoch": 1917} {"train_loss": -23.527645111083984, "global_step": 159135, "epoch": 1917} {"train_loss": -23.514558792114258, "global_step": 159136, "epoch": 1917} {"train_loss": -23.885391235351562, "global_step": 159137, "epoch": 1917} {"train_loss": -23.10365104675293, "global_step": 159138, "epoch": 1917} {"train_loss": -23.193161010742188, "global_step": 159139, "epoch": 1917} {"train_loss": -23.422718048095703, "global_step": 159140, "epoch": 1917} {"train_loss": -23.70632553100586, "global_step": 159141, "epoch": 1917} {"train_loss": -23.57107162475586, "global_step": 159142, "epoch": 1917} {"train_loss": -23.79355812072754, "global_step": 159143, "epoch": 1917} {"train_loss": -23.295467376708984, "global_step": 159144, "epoch": 1917} {"train_loss": -23.4105281829834, "global_step": 159145, "epoch": 1917} {"train_loss": -23.481252670288086, "global_step": 159146, "epoch": 1917} {"train_loss": -23.814224243164062, "global_step": 159147, "epoch": 1917} {"train_loss": -23.793563842773438, "global_step": 159148, "epoch": 1917} {"train_loss": -23.64154624938965, "global_step": 159149, "epoch": 1917} {"train_loss": -23.466299057006836, "global_step": 159150, "epoch": 1917} {"train_loss": -24.057058334350586, "global_step": 159151, "epoch": 1917} {"train_loss": -23.364795684814453, "global_step": 159152, "epoch": 1917} {"train_loss": -23.77933692932129, "global_step": 159153, "epoch": 1917} {"train_loss": -23.73354148864746, "global_step": 159154, "epoch": 1917} {"train_loss": -23.880521774291992, "global_step": 159155, "epoch": 1917} {"train_loss": -23.683338165283203, "global_step": 159156, "epoch": 1917} {"train_loss": -23.657028198242188, "global_step": 159157, "epoch": 1917} {"train_loss": -23.793594360351562, "global_step": 159158, "epoch": 1917} {"train_loss": -23.79172706604004, "global_step": 159159, "epoch": 1917} {"train_loss": -23.27915382385254, "global_step": 159160, "epoch": 1917} {"train_loss": -23.767805099487305, "global_step": 159161, "epoch": 1917} {"train_loss": -23.347721099853516, "global_step": 159162, "epoch": 1917} {"train_loss": -23.006406784057617, "global_step": 159163, "epoch": 1917} {"train_loss": -22.800247192382812, "global_step": 159164, "epoch": 1917} {"train_loss": -23.35218620300293, "global_step": 159165, "epoch": 1917} {"train_loss": -23.519607543945312, "global_step": 159166, "epoch": 1917} {"train_loss": -23.07570457458496, "global_step": 159167, "epoch": 1917} {"train_loss": -23.23874855041504, "global_step": 159168, "epoch": 1917} {"train_loss": -23.61482810974121, "global_step": 159169, "epoch": 1917} {"train_loss": -23.263839721679688, "global_step": 159170, "epoch": 1917} {"train_loss": -23.165006637573242, "global_step": 159171, "epoch": 1917} {"train_loss": -23.295166015625, "global_step": 159172, "epoch": 1917} {"train_loss": -23.612220764160156, "global_step": 159173, "epoch": 1917} {"train_loss": -23.48067855834961, "global_step": 159174, "epoch": 1917} {"train_loss": -22.878835678100586, "global_step": 159175, "epoch": 1917} {"train_loss": -23.501972198486328, "global_step": 159176, "epoch": 1917} {"train_loss": -23.0447998046875, "global_step": 159177, "epoch": 1917} {"train_loss": -23.889366149902344, "global_step": 159178, "epoch": 1917} {"train_loss": -23.486940383911133, "global_step": 159179, "epoch": 1917} {"train_loss": -23.531787872314453, "global_step": 159180, "epoch": 1917} {"train_loss": -22.999277114868164, "global_step": 159181, "epoch": 1917} {"train_loss": -23.560754776000977, "global_step": 159182, "epoch": 1917} {"train_loss": -23.300565719604492, "global_step": 159183, "epoch": 1917} {"train_loss": -23.606576919555664, "global_step": 159184, "epoch": 1917} {"train_loss": -23.3603515625, "global_step": 159185, "epoch": 1917} {"train_loss": -23.791521072387695, "global_step": 159186, "epoch": 1917} {"train_loss": -23.44631004333496, "global_step": 159187, "epoch": 1917} {"train_loss": -23.311511993408203, "global_step": 159188, "epoch": 1917} {"train_loss": -23.2890682220459, "global_step": 159189, "epoch": 1917} {"train_loss": -23.782197952270508, "global_step": 159190, "epoch": 1917} {"train_loss": -23.36370849609375, "global_step": 159191, "epoch": 1917} {"train_loss": -23.409460067749023, "global_step": 159192, "epoch": 1917} {"train_loss": -23.457340125577996, "global_step": 159193, "epoch": 1917, "val_loss": 6228426.0} {"train_loss": -22.720365524291992, "global_step": 159194, "epoch": 1918} {"train_loss": -22.640674591064453, "global_step": 159195, "epoch": 1918} {"train_loss": -23.527719497680664, "global_step": 159196, "epoch": 1918} {"train_loss": -23.01370620727539, "global_step": 159197, "epoch": 1918} {"train_loss": -23.009366989135742, "global_step": 159198, "epoch": 1918} {"train_loss": -23.467435836791992, "global_step": 159199, "epoch": 1918} {"train_loss": -23.311809539794922, "global_step": 159200, "epoch": 1918} {"train_loss": -23.04183006286621, "global_step": 159201, "epoch": 1918} {"train_loss": -23.04974937438965, "global_step": 159202, "epoch": 1918} {"train_loss": -23.284910202026367, "global_step": 159203, "epoch": 1918} {"train_loss": -23.685495376586914, "global_step": 159204, "epoch": 1918} {"train_loss": -23.299293518066406, "global_step": 159205, "epoch": 1918} {"train_loss": -23.17275047302246, "global_step": 159206, "epoch": 1918} {"train_loss": -23.61471939086914, "global_step": 159207, "epoch": 1918} {"train_loss": -23.262720108032227, "global_step": 159208, "epoch": 1918} {"train_loss": -23.56787872314453, "global_step": 159209, "epoch": 1918} {"train_loss": -23.22503662109375, "global_step": 159210, "epoch": 1918} {"train_loss": -23.2784481048584, "global_step": 159211, "epoch": 1918} {"train_loss": -23.053264617919922, "global_step": 159212, "epoch": 1918} {"train_loss": -23.382038116455078, "global_step": 159213, "epoch": 1918} {"train_loss": -23.16226577758789, "global_step": 159214, "epoch": 1918} {"train_loss": -23.10035514831543, "global_step": 159215, "epoch": 1918} {"train_loss": -23.430463790893555, "global_step": 159216, "epoch": 1918} {"train_loss": -23.289947509765625, "global_step": 159217, "epoch": 1918} {"train_loss": -23.57798194885254, "global_step": 159218, "epoch": 1918} {"train_loss": -23.46208381652832, "global_step": 159219, "epoch": 1918} {"train_loss": -23.301502227783203, "global_step": 159220, "epoch": 1918} {"train_loss": -23.543981552124023, "global_step": 159221, "epoch": 1918} {"train_loss": -23.66876792907715, "global_step": 159222, "epoch": 1918} {"train_loss": -23.528066635131836, "global_step": 159223, "epoch": 1918} {"train_loss": -23.61672019958496, "global_step": 159224, "epoch": 1918} {"train_loss": -23.331640243530273, "global_step": 159225, "epoch": 1918} {"train_loss": -23.728641510009766, "global_step": 159226, "epoch": 1918} {"train_loss": -23.76591682434082, "global_step": 159227, "epoch": 1918} {"train_loss": -23.493961334228516, "global_step": 159228, "epoch": 1918} {"train_loss": -23.678152084350586, "global_step": 159229, "epoch": 1918} {"train_loss": -23.75203514099121, "global_step": 159230, "epoch": 1918} {"train_loss": -23.889999389648438, "global_step": 159231, "epoch": 1918} {"train_loss": -23.408344268798828, "global_step": 159232, "epoch": 1918} {"train_loss": -23.512678146362305, "global_step": 159233, "epoch": 1918} {"train_loss": -23.78061866760254, "global_step": 159234, "epoch": 1918} {"train_loss": -23.28769874572754, "global_step": 159235, "epoch": 1918} {"train_loss": -23.279287338256836, "global_step": 159236, "epoch": 1918} {"train_loss": -23.599088668823242, "global_step": 159237, "epoch": 1918} {"train_loss": -23.321752548217773, "global_step": 159238, "epoch": 1918} {"train_loss": -23.342592239379883, "global_step": 159239, "epoch": 1918} {"train_loss": -23.486515045166016, "global_step": 159240, "epoch": 1918} {"train_loss": -23.55585479736328, "global_step": 159241, "epoch": 1918} {"train_loss": -23.45098304748535, "global_step": 159242, "epoch": 1918} {"train_loss": -23.02943992614746, "global_step": 159243, "epoch": 1918} {"train_loss": -23.236082077026367, "global_step": 159244, "epoch": 1918} {"train_loss": -23.556015014648438, "global_step": 159245, "epoch": 1918} {"train_loss": -22.99663734436035, "global_step": 159246, "epoch": 1918} {"train_loss": -23.30461883544922, "global_step": 159247, "epoch": 1918} {"train_loss": -23.370807647705078, "global_step": 159248, "epoch": 1918} {"train_loss": -23.477359771728516, "global_step": 159249, "epoch": 1918} {"train_loss": -23.593332290649414, "global_step": 159250, "epoch": 1918} {"train_loss": -24.077585220336914, "global_step": 159251, "epoch": 1918} {"train_loss": -23.402585983276367, "global_step": 159252, "epoch": 1918} {"train_loss": -23.34535026550293, "global_step": 159253, "epoch": 1918} {"train_loss": -23.475683212280273, "global_step": 159254, "epoch": 1918} {"train_loss": -23.48373794555664, "global_step": 159255, "epoch": 1918} {"train_loss": -23.274616241455078, "global_step": 159256, "epoch": 1918} {"train_loss": -23.162832260131836, "global_step": 159257, "epoch": 1918} {"train_loss": -23.597522735595703, "global_step": 159258, "epoch": 1918} {"train_loss": -23.522136688232422, "global_step": 159259, "epoch": 1918} {"train_loss": -23.642179489135742, "global_step": 159260, "epoch": 1918} {"train_loss": -23.395639419555664, "global_step": 159261, "epoch": 1918} {"train_loss": -23.69614601135254, "global_step": 159262, "epoch": 1918} {"train_loss": -23.294546127319336, "global_step": 159263, "epoch": 1918} {"train_loss": -23.44059181213379, "global_step": 159264, "epoch": 1918} {"train_loss": -23.865060806274414, "global_step": 159265, "epoch": 1918} {"train_loss": -23.415067672729492, "global_step": 159266, "epoch": 1918} {"train_loss": -23.16484832763672, "global_step": 159267, "epoch": 1918} {"train_loss": -23.34722328186035, "global_step": 159268, "epoch": 1918} {"train_loss": -23.611412048339844, "global_step": 159269, "epoch": 1918} {"train_loss": -23.534189224243164, "global_step": 159270, "epoch": 1918} {"train_loss": -23.427003860473633, "global_step": 159271, "epoch": 1918} {"train_loss": -23.7303466796875, "global_step": 159272, "epoch": 1918} {"train_loss": -23.388919830322266, "global_step": 159273, "epoch": 1918} {"train_loss": -23.496601104736328, "global_step": 159274, "epoch": 1918} {"train_loss": -23.602384567260742, "global_step": 159275, "epoch": 1918} {"train_loss": -23.409335653465913, "global_step": 159276, "epoch": 1918, "val_loss": 6328005.0} {"train_loss": -22.985361099243164, "global_step": 159277, "epoch": 1919} {"train_loss": -23.295454025268555, "global_step": 159278, "epoch": 1919} {"train_loss": -23.255348205566406, "global_step": 159279, "epoch": 1919} {"train_loss": -23.407400131225586, "global_step": 159280, "epoch": 1919} {"train_loss": -23.074722290039062, "global_step": 159281, "epoch": 1919} {"train_loss": -23.44192886352539, "global_step": 159282, "epoch": 1919} {"train_loss": -23.013690948486328, "global_step": 159283, "epoch": 1919} {"train_loss": -23.308364868164062, "global_step": 159284, "epoch": 1919} {"train_loss": -23.39969825744629, "global_step": 159285, "epoch": 1919} {"train_loss": -23.440279006958008, "global_step": 159286, "epoch": 1919} {"train_loss": -23.35653305053711, "global_step": 159287, "epoch": 1919} {"train_loss": -22.93622398376465, "global_step": 159288, "epoch": 1919} {"train_loss": -23.013320922851562, "global_step": 159289, "epoch": 1919} {"train_loss": -23.565765380859375, "global_step": 159290, "epoch": 1919} {"train_loss": -23.66586685180664, "global_step": 159291, "epoch": 1919} {"train_loss": -23.112314224243164, "global_step": 159292, "epoch": 1919} {"train_loss": -23.25795555114746, "global_step": 159293, "epoch": 1919} {"train_loss": -23.803775787353516, "global_step": 159294, "epoch": 1919} {"train_loss": -23.488431930541992, "global_step": 159295, "epoch": 1919} {"train_loss": -23.60065269470215, "global_step": 159296, "epoch": 1919} {"train_loss": -23.201879501342773, "global_step": 159297, "epoch": 1919} {"train_loss": -23.518484115600586, "global_step": 159298, "epoch": 1919} {"train_loss": -23.646549224853516, "global_step": 159299, "epoch": 1919} {"train_loss": -23.361806869506836, "global_step": 159300, "epoch": 1919} {"train_loss": -23.460721969604492, "global_step": 159301, "epoch": 1919} {"train_loss": -23.265409469604492, "global_step": 159302, "epoch": 1919} {"train_loss": -23.611669540405273, "global_step": 159303, "epoch": 1919} {"train_loss": -23.541839599609375, "global_step": 159304, "epoch": 1919} {"train_loss": -23.681827545166016, "global_step": 159305, "epoch": 1919} {"train_loss": -23.445295333862305, "global_step": 159306, "epoch": 1919} {"train_loss": -23.641231536865234, "global_step": 159307, "epoch": 1919} {"train_loss": -23.419090270996094, "global_step": 159308, "epoch": 1919} {"train_loss": -23.65736961364746, "global_step": 159309, "epoch": 1919} {"train_loss": -23.472827911376953, "global_step": 159310, "epoch": 1919} {"train_loss": -23.662216186523438, "global_step": 159311, "epoch": 1919} {"train_loss": -23.69166374206543, "global_step": 159312, "epoch": 1919} {"train_loss": -23.9509334564209, "global_step": 159313, "epoch": 1919} {"train_loss": -23.82269859313965, "global_step": 159314, "epoch": 1919} {"train_loss": -23.583576202392578, "global_step": 159315, "epoch": 1919} {"train_loss": -23.203474044799805, "global_step": 159316, "epoch": 1919} {"train_loss": -23.6239070892334, "global_step": 159317, "epoch": 1919} {"train_loss": -23.548715591430664, "global_step": 159318, "epoch": 1919} {"train_loss": -23.624786376953125, "global_step": 159319, "epoch": 1919} {"train_loss": -23.414262771606445, "global_step": 159320, "epoch": 1919} {"train_loss": -23.244382858276367, "global_step": 159321, "epoch": 1919} {"train_loss": -23.292423248291016, "global_step": 159322, "epoch": 1919} {"train_loss": -23.635116577148438, "global_step": 159323, "epoch": 1919} {"train_loss": -23.491804122924805, "global_step": 159324, "epoch": 1919} {"train_loss": -23.372648239135742, "global_step": 159325, "epoch": 1919} {"train_loss": -23.347387313842773, "global_step": 159326, "epoch": 1919} {"train_loss": -23.23879051208496, "global_step": 159327, "epoch": 1919} {"train_loss": -23.529327392578125, "global_step": 159328, "epoch": 1919} {"train_loss": -23.756498336791992, "global_step": 159329, "epoch": 1919} {"train_loss": -23.499067306518555, "global_step": 159330, "epoch": 1919} {"train_loss": -23.43225860595703, "global_step": 159331, "epoch": 1919} {"train_loss": -23.718088150024414, "global_step": 159332, "epoch": 1919} {"train_loss": -23.7268123626709, "global_step": 159333, "epoch": 1919} {"train_loss": -23.559234619140625, "global_step": 159334, "epoch": 1919} {"train_loss": -23.723346710205078, "global_step": 159335, "epoch": 1919} {"train_loss": -23.44761085510254, "global_step": 159336, "epoch": 1919} {"train_loss": -23.591466903686523, "global_step": 159337, "epoch": 1919} {"train_loss": -23.577260971069336, "global_step": 159338, "epoch": 1919} {"train_loss": -23.709272384643555, "global_step": 159339, "epoch": 1919} {"train_loss": -23.63396644592285, "global_step": 159340, "epoch": 1919} {"train_loss": -23.346439361572266, "global_step": 159341, "epoch": 1919} {"train_loss": -23.667926788330078, "global_step": 159342, "epoch": 1919} {"train_loss": -23.45656394958496, "global_step": 159343, "epoch": 1919} {"train_loss": -23.757802963256836, "global_step": 159344, "epoch": 1919} {"train_loss": -23.894149780273438, "global_step": 159345, "epoch": 1919} {"train_loss": -23.476882934570312, "global_step": 159346, "epoch": 1919} {"train_loss": -23.838542938232422, "global_step": 159347, "epoch": 1919} {"train_loss": -23.7213191986084, "global_step": 159348, "epoch": 1919} {"train_loss": -23.98508644104004, "global_step": 159349, "epoch": 1919} {"train_loss": -23.155820846557617, "global_step": 159350, "epoch": 1919} {"train_loss": -23.257455825805664, "global_step": 159351, "epoch": 1919} {"train_loss": -23.87349510192871, "global_step": 159352, "epoch": 1919} {"train_loss": -23.647443771362305, "global_step": 159353, "epoch": 1919} {"train_loss": -23.3803768157959, "global_step": 159354, "epoch": 1919} {"train_loss": -24.06342887878418, "global_step": 159355, "epoch": 1919} {"train_loss": -23.43492317199707, "global_step": 159356, "epoch": 1919} {"train_loss": -23.34377098083496, "global_step": 159357, "epoch": 1919} {"train_loss": -24.042722702026367, "global_step": 159358, "epoch": 1919} {"train_loss": -23.49033036289445, "global_step": 159359, "epoch": 1919, "val_loss": 6355030.0} {"train_loss": -22.558584213256836, "global_step": 159360, "epoch": 1920} {"train_loss": -22.406055450439453, "global_step": 159361, "epoch": 1920} {"train_loss": -23.195880889892578, "global_step": 159362, "epoch": 1920} {"train_loss": -22.757810592651367, "global_step": 159363, "epoch": 1920} {"train_loss": -23.430997848510742, "global_step": 159364, "epoch": 1920} {"train_loss": -22.985240936279297, "global_step": 159365, "epoch": 1920} {"train_loss": -23.467273712158203, "global_step": 159366, "epoch": 1920} {"train_loss": -23.220827102661133, "global_step": 159367, "epoch": 1920} {"train_loss": -22.99702262878418, "global_step": 159368, "epoch": 1920} {"train_loss": -22.621763229370117, "global_step": 159369, "epoch": 1920} {"train_loss": -23.37712860107422, "global_step": 159370, "epoch": 1920} {"train_loss": -22.761091232299805, "global_step": 159371, "epoch": 1920} {"train_loss": -23.146652221679688, "global_step": 159372, "epoch": 1920} {"train_loss": -23.364917755126953, "global_step": 159373, "epoch": 1920} {"train_loss": -23.26934814453125, "global_step": 159374, "epoch": 1920} {"train_loss": -23.460758209228516, "global_step": 159375, "epoch": 1920} {"train_loss": -23.276874542236328, "global_step": 159376, "epoch": 1920} {"train_loss": -23.07484245300293, "global_step": 159377, "epoch": 1920} {"train_loss": -23.393831253051758, "global_step": 159378, "epoch": 1920} {"train_loss": -23.393354415893555, "global_step": 159379, "epoch": 1920} {"train_loss": -23.20216178894043, "global_step": 159380, "epoch": 1920} {"train_loss": -23.207578659057617, "global_step": 159381, "epoch": 1920} {"train_loss": -23.53290367126465, "global_step": 159382, "epoch": 1920} {"train_loss": -22.87989616394043, "global_step": 159383, "epoch": 1920} {"train_loss": -23.27032470703125, "global_step": 159384, "epoch": 1920} {"train_loss": -23.294200897216797, "global_step": 159385, "epoch": 1920} {"train_loss": -23.318010330200195, "global_step": 159386, "epoch": 1920} {"train_loss": -23.541776657104492, "global_step": 159387, "epoch": 1920} {"train_loss": -23.44215202331543, "global_step": 159388, "epoch": 1920} {"train_loss": -23.1424503326416, "global_step": 159389, "epoch": 1920} {"train_loss": -23.414457321166992, "global_step": 159390, "epoch": 1920} {"train_loss": -23.345733642578125, "global_step": 159391, "epoch": 1920} {"train_loss": -23.412155151367188, "global_step": 159392, "epoch": 1920} {"train_loss": -23.374361038208008, "global_step": 159393, "epoch": 1920} {"train_loss": -23.181180953979492, "global_step": 159394, "epoch": 1920} {"train_loss": -23.428709030151367, "global_step": 159395, "epoch": 1920} {"train_loss": -23.46048355102539, "global_step": 159396, "epoch": 1920} {"train_loss": -23.232620239257812, "global_step": 159397, "epoch": 1920} {"train_loss": -23.512720108032227, "global_step": 159398, "epoch": 1920} {"train_loss": -23.75850486755371, "global_step": 159399, "epoch": 1920} {"train_loss": -23.603092193603516, "global_step": 159400, "epoch": 1920} {"train_loss": -23.436384201049805, "global_step": 159401, "epoch": 1920} {"train_loss": -23.41033935546875, "global_step": 159402, "epoch": 1920} {"train_loss": -23.933443069458008, "global_step": 159403, "epoch": 1920} {"train_loss": -23.76661491394043, "global_step": 159404, "epoch": 1920} {"train_loss": -23.597606658935547, "global_step": 159405, "epoch": 1920} {"train_loss": -23.304502487182617, "global_step": 159406, "epoch": 1920} {"train_loss": -23.21354103088379, "global_step": 159407, "epoch": 1920} {"train_loss": -23.50568962097168, "global_step": 159408, "epoch": 1920} {"train_loss": -23.233963012695312, "global_step": 159409, "epoch": 1920} {"train_loss": -23.58418846130371, "global_step": 159410, "epoch": 1920} {"train_loss": -23.857988357543945, "global_step": 159411, "epoch": 1920} {"train_loss": -23.67624855041504, "global_step": 159412, "epoch": 1920} {"train_loss": -23.606782913208008, "global_step": 159413, "epoch": 1920} {"train_loss": -23.534055709838867, "global_step": 159414, "epoch": 1920} {"train_loss": -23.605125427246094, "global_step": 159415, "epoch": 1920} {"train_loss": -23.375354766845703, "global_step": 159416, "epoch": 1920} {"train_loss": -23.547346115112305, "global_step": 159417, "epoch": 1920} {"train_loss": -23.13873291015625, "global_step": 159418, "epoch": 1920} {"train_loss": -23.62180519104004, "global_step": 159419, "epoch": 1920} {"train_loss": -23.455106735229492, "global_step": 159420, "epoch": 1920} {"train_loss": -23.628952026367188, "global_step": 159421, "epoch": 1920} {"train_loss": -23.504714965820312, "global_step": 159422, "epoch": 1920} {"train_loss": -23.52859115600586, "global_step": 159423, "epoch": 1920} {"train_loss": -23.489843368530273, "global_step": 159424, "epoch": 1920} {"train_loss": -23.95668601989746, "global_step": 159425, "epoch": 1920} {"train_loss": -23.291858673095703, "global_step": 159426, "epoch": 1920} {"train_loss": -23.389644622802734, "global_step": 159427, "epoch": 1920} {"train_loss": -23.362384796142578, "global_step": 159428, "epoch": 1920} {"train_loss": -23.4553279876709, "global_step": 159429, "epoch": 1920} {"train_loss": -23.36213493347168, "global_step": 159430, "epoch": 1920} {"train_loss": -23.473791122436523, "global_step": 159431, "epoch": 1920} {"train_loss": -23.682188034057617, "global_step": 159432, "epoch": 1920} {"train_loss": -23.36866569519043, "global_step": 159433, "epoch": 1920} {"train_loss": -23.676382064819336, "global_step": 159434, "epoch": 1920} {"train_loss": -23.34465980529785, "global_step": 159435, "epoch": 1920} {"train_loss": -23.216894149780273, "global_step": 159436, "epoch": 1920} {"train_loss": -23.257831573486328, "global_step": 159437, "epoch": 1920} {"train_loss": -23.389169692993164, "global_step": 159438, "epoch": 1920} {"train_loss": -23.168277740478516, "global_step": 159439, "epoch": 1920} {"train_loss": -23.158811569213867, "global_step": 159440, "epoch": 1920} {"train_loss": -23.439292907714844, "global_step": 159441, "epoch": 1920} {"train_loss": -23.358372378062054, "global_step": 159442, "epoch": 1920, "val_loss": 6283359.0} {"train_loss": -22.809743881225586, "global_step": 159443, "epoch": 1921} {"train_loss": -23.208044052124023, "global_step": 159444, "epoch": 1921} {"train_loss": -23.126731872558594, "global_step": 159445, "epoch": 1921} {"train_loss": -23.27515983581543, "global_step": 159446, "epoch": 1921} {"train_loss": -22.87424087524414, "global_step": 159447, "epoch": 1921} {"train_loss": -23.639371871948242, "global_step": 159448, "epoch": 1921} {"train_loss": -23.015975952148438, "global_step": 159449, "epoch": 1921} {"train_loss": -23.039831161499023, "global_step": 159450, "epoch": 1921} {"train_loss": -23.4179630279541, "global_step": 159451, "epoch": 1921} {"train_loss": -23.546844482421875, "global_step": 159452, "epoch": 1921} {"train_loss": -23.22987937927246, "global_step": 159453, "epoch": 1921} {"train_loss": -23.27264976501465, "global_step": 159454, "epoch": 1921} {"train_loss": -23.459232330322266, "global_step": 159455, "epoch": 1921} {"train_loss": -23.624656677246094, "global_step": 159456, "epoch": 1921} {"train_loss": -23.74555015563965, "global_step": 159457, "epoch": 1921} {"train_loss": -23.632659912109375, "global_step": 159458, "epoch": 1921} {"train_loss": -23.36945915222168, "global_step": 159459, "epoch": 1921} {"train_loss": -23.619054794311523, "global_step": 159460, "epoch": 1921} {"train_loss": -23.305341720581055, "global_step": 159461, "epoch": 1921} {"train_loss": -23.738325119018555, "global_step": 159462, "epoch": 1921} {"train_loss": -23.7203369140625, "global_step": 159463, "epoch": 1921} {"train_loss": -23.56379508972168, "global_step": 159464, "epoch": 1921} {"train_loss": -23.53204917907715, "global_step": 159465, "epoch": 1921} {"train_loss": -23.576879501342773, "global_step": 159466, "epoch": 1921} {"train_loss": -23.326627731323242, "global_step": 159467, "epoch": 1921} {"train_loss": -23.67416763305664, "global_step": 159468, "epoch": 1921} {"train_loss": -23.45328712463379, "global_step": 159469, "epoch": 1921} {"train_loss": -23.81935691833496, "global_step": 159470, "epoch": 1921} {"train_loss": -23.781949996948242, "global_step": 159471, "epoch": 1921} {"train_loss": -23.601682662963867, "global_step": 159472, "epoch": 1921} {"train_loss": -23.0753231048584, "global_step": 159473, "epoch": 1921} {"train_loss": -23.238910675048828, "global_step": 159474, "epoch": 1921} {"train_loss": -23.606700897216797, "global_step": 159475, "epoch": 1921} {"train_loss": -23.501585006713867, "global_step": 159476, "epoch": 1921} {"train_loss": -23.379261016845703, "global_step": 159477, "epoch": 1921} {"train_loss": -23.48752212524414, "global_step": 159478, "epoch": 1921} {"train_loss": -23.377395629882812, "global_step": 159479, "epoch": 1921} {"train_loss": -23.453622817993164, "global_step": 159480, "epoch": 1921} {"train_loss": -23.619674682617188, "global_step": 159481, "epoch": 1921} {"train_loss": -23.130847930908203, "global_step": 159482, "epoch": 1921} {"train_loss": -23.105859756469727, "global_step": 159483, "epoch": 1921} {"train_loss": -23.903919219970703, "global_step": 159484, "epoch": 1921} {"train_loss": -23.3424129486084, "global_step": 159485, "epoch": 1921} {"train_loss": -23.18057632446289, "global_step": 159486, "epoch": 1921} {"train_loss": -23.88238525390625, "global_step": 159487, "epoch": 1921} {"train_loss": -23.231006622314453, "global_step": 159488, "epoch": 1921} {"train_loss": -23.475685119628906, "global_step": 159489, "epoch": 1921} {"train_loss": -23.454391479492188, "global_step": 159490, "epoch": 1921} {"train_loss": -23.623798370361328, "global_step": 159491, "epoch": 1921} {"train_loss": -23.463932037353516, "global_step": 159492, "epoch": 1921} {"train_loss": -23.427480697631836, "global_step": 159493, "epoch": 1921} {"train_loss": -23.333898544311523, "global_step": 159494, "epoch": 1921} {"train_loss": -23.512203216552734, "global_step": 159495, "epoch": 1921} {"train_loss": -23.5405216217041, "global_step": 159496, "epoch": 1921} {"train_loss": -23.363611221313477, "global_step": 159497, "epoch": 1921} {"train_loss": -23.687009811401367, "global_step": 159498, "epoch": 1921} {"train_loss": -23.324052810668945, "global_step": 159499, "epoch": 1921} {"train_loss": -23.553913116455078, "global_step": 159500, "epoch": 1921} {"train_loss": -23.4899959564209, "global_step": 159501, "epoch": 1921} {"train_loss": -23.34773063659668, "global_step": 159502, "epoch": 1921} {"train_loss": -23.79285430908203, "global_step": 159503, "epoch": 1921} {"train_loss": -23.25947380065918, "global_step": 159504, "epoch": 1921} {"train_loss": -23.411409378051758, "global_step": 159505, "epoch": 1921} {"train_loss": -23.53053855895996, "global_step": 159506, "epoch": 1921} {"train_loss": -23.02134132385254, "global_step": 159507, "epoch": 1921} {"train_loss": -23.4709529876709, "global_step": 159508, "epoch": 1921} {"train_loss": -23.422222137451172, "global_step": 159509, "epoch": 1921} {"train_loss": -23.327390670776367, "global_step": 159510, "epoch": 1921} {"train_loss": -23.33957862854004, "global_step": 159511, "epoch": 1921} {"train_loss": -23.269987106323242, "global_step": 159512, "epoch": 1921} {"train_loss": -23.218482971191406, "global_step": 159513, "epoch": 1921} {"train_loss": -23.612762451171875, "global_step": 159514, "epoch": 1921} {"train_loss": -23.26991844177246, "global_step": 159515, "epoch": 1921} {"train_loss": -23.13387107849121, "global_step": 159516, "epoch": 1921} {"train_loss": -23.832937240600586, "global_step": 159517, "epoch": 1921} {"train_loss": -23.069059371948242, "global_step": 159518, "epoch": 1921} {"train_loss": -23.590436935424805, "global_step": 159519, "epoch": 1921} {"train_loss": -23.952865600585938, "global_step": 159520, "epoch": 1921} {"train_loss": -23.61591911315918, "global_step": 159521, "epoch": 1921} {"train_loss": -23.474212646484375, "global_step": 159522, "epoch": 1921} {"train_loss": -23.202733993530273, "global_step": 159523, "epoch": 1921} {"train_loss": -23.62627410888672, "global_step": 159524, "epoch": 1921} {"train_loss": -23.454294158751708, "global_step": 159525, "epoch": 1921, "val_loss": 6332715.0} {"train_loss": -23.076452255249023, "global_step": 159526, "epoch": 1922} {"train_loss": -23.090553283691406, "global_step": 159527, "epoch": 1922} {"train_loss": -23.45842933654785, "global_step": 159528, "epoch": 1922} {"train_loss": -22.933805465698242, "global_step": 159529, "epoch": 1922} {"train_loss": -23.33284568786621, "global_step": 159530, "epoch": 1922} {"train_loss": -23.20430564880371, "global_step": 159531, "epoch": 1922} {"train_loss": -23.168378829956055, "global_step": 159532, "epoch": 1922} {"train_loss": -23.13458824157715, "global_step": 159533, "epoch": 1922} {"train_loss": -23.068872451782227, "global_step": 159534, "epoch": 1922} {"train_loss": -22.988239288330078, "global_step": 159535, "epoch": 1922} {"train_loss": -23.18891716003418, "global_step": 159536, "epoch": 1922} {"train_loss": -23.131357192993164, "global_step": 159537, "epoch": 1922} {"train_loss": -23.183652877807617, "global_step": 159538, "epoch": 1922} {"train_loss": -23.3245906829834, "global_step": 159539, "epoch": 1922} {"train_loss": -23.484149932861328, "global_step": 159540, "epoch": 1922} {"train_loss": -23.39025115966797, "global_step": 159541, "epoch": 1922} {"train_loss": -23.349355697631836, "global_step": 159542, "epoch": 1922} {"train_loss": -23.149282455444336, "global_step": 159543, "epoch": 1922} {"train_loss": -23.503568649291992, "global_step": 159544, "epoch": 1922} {"train_loss": -23.108036041259766, "global_step": 159545, "epoch": 1922} {"train_loss": -23.58570671081543, "global_step": 159546, "epoch": 1922} {"train_loss": -23.102771759033203, "global_step": 159547, "epoch": 1922} {"train_loss": -23.44776725769043, "global_step": 159548, "epoch": 1922} {"train_loss": -23.323179244995117, "global_step": 159549, "epoch": 1922} {"train_loss": -23.893898010253906, "global_step": 159550, "epoch": 1922} {"train_loss": -23.370187759399414, "global_step": 159551, "epoch": 1922} {"train_loss": -23.623456954956055, "global_step": 159552, "epoch": 1922} {"train_loss": -23.440967559814453, "global_step": 159553, "epoch": 1922} {"train_loss": -23.695940017700195, "global_step": 159554, "epoch": 1922} {"train_loss": -23.391691207885742, "global_step": 159555, "epoch": 1922} {"train_loss": -23.422086715698242, "global_step": 159556, "epoch": 1922} {"train_loss": -23.398147583007812, "global_step": 159557, "epoch": 1922} {"train_loss": -23.562294006347656, "global_step": 159558, "epoch": 1922} {"train_loss": -23.449172973632812, "global_step": 159559, "epoch": 1922} {"train_loss": -23.54596519470215, "global_step": 159560, "epoch": 1922} {"train_loss": -23.72577667236328, "global_step": 159561, "epoch": 1922} {"train_loss": -23.885122299194336, "global_step": 159562, "epoch": 1922} {"train_loss": -23.786794662475586, "global_step": 159563, "epoch": 1922} {"train_loss": -23.340343475341797, "global_step": 159564, "epoch": 1922} {"train_loss": -23.910680770874023, "global_step": 159565, "epoch": 1922} {"train_loss": -23.589378356933594, "global_step": 159566, "epoch": 1922} {"train_loss": -23.387964248657227, "global_step": 159567, "epoch": 1922} {"train_loss": -23.271530151367188, "global_step": 159568, "epoch": 1922} {"train_loss": -23.58574867248535, "global_step": 159569, "epoch": 1922} {"train_loss": -23.6822452545166, "global_step": 159570, "epoch": 1922} {"train_loss": -24.126977920532227, "global_step": 159571, "epoch": 1922} {"train_loss": -23.850452423095703, "global_step": 159572, "epoch": 1922} {"train_loss": -23.536231994628906, "global_step": 159573, "epoch": 1922} {"train_loss": -23.677467346191406, "global_step": 159574, "epoch": 1922} {"train_loss": -23.21771812438965, "global_step": 159575, "epoch": 1922} {"train_loss": -23.615375518798828, "global_step": 159576, "epoch": 1922} {"train_loss": -23.73898696899414, "global_step": 159577, "epoch": 1922} {"train_loss": -23.345489501953125, "global_step": 159578, "epoch": 1922} {"train_loss": -23.059249877929688, "global_step": 159579, "epoch": 1922} {"train_loss": -23.68259620666504, "global_step": 159580, "epoch": 1922} {"train_loss": -23.699661254882812, "global_step": 159581, "epoch": 1922} {"train_loss": -23.250425338745117, "global_step": 159582, "epoch": 1922} {"train_loss": -23.731367111206055, "global_step": 159583, "epoch": 1922} {"train_loss": -23.809980392456055, "global_step": 159584, "epoch": 1922} {"train_loss": -23.754676818847656, "global_step": 159585, "epoch": 1922} {"train_loss": -23.56819725036621, "global_step": 159586, "epoch": 1922} {"train_loss": -23.258390426635742, "global_step": 159587, "epoch": 1922} {"train_loss": -23.099740982055664, "global_step": 159588, "epoch": 1922} {"train_loss": -23.529067993164062, "global_step": 159589, "epoch": 1922} {"train_loss": -23.036710739135742, "global_step": 159590, "epoch": 1922} {"train_loss": -23.538700103759766, "global_step": 159591, "epoch": 1922} {"train_loss": -23.37282943725586, "global_step": 159592, "epoch": 1922} {"train_loss": -23.29957389831543, "global_step": 159593, "epoch": 1922} {"train_loss": -23.407400131225586, "global_step": 159594, "epoch": 1922} {"train_loss": -23.43360710144043, "global_step": 159595, "epoch": 1922} {"train_loss": -23.538053512573242, "global_step": 159596, "epoch": 1922} {"train_loss": -23.069124221801758, "global_step": 159597, "epoch": 1922} {"train_loss": -23.75326156616211, "global_step": 159598, "epoch": 1922} {"train_loss": -23.244911193847656, "global_step": 159599, "epoch": 1922} {"train_loss": -23.236440658569336, "global_step": 159600, "epoch": 1922} {"train_loss": -23.60093116760254, "global_step": 159601, "epoch": 1922} {"train_loss": -23.474143981933594, "global_step": 159602, "epoch": 1922} {"train_loss": -23.241159439086914, "global_step": 159603, "epoch": 1922} {"train_loss": -23.387907028198242, "global_step": 159604, "epoch": 1922} {"train_loss": -23.5207576751709, "global_step": 159605, "epoch": 1922} {"train_loss": -23.534503936767578, "global_step": 159606, "epoch": 1922} {"train_loss": -23.271982192993164, "global_step": 159607, "epoch": 1922} {"train_loss": -23.42207237611334, "global_step": 159608, "epoch": 1922, "val_loss": 6246540.0} {"train_loss": -23.45465660095215, "global_step": 159609, "epoch": 1923} {"train_loss": -23.233795166015625, "global_step": 159610, "epoch": 1923} {"train_loss": -23.031543731689453, "global_step": 159611, "epoch": 1923} {"train_loss": -22.954580307006836, "global_step": 159612, "epoch": 1923} {"train_loss": -23.54084587097168, "global_step": 159613, "epoch": 1923} {"train_loss": -23.124130249023438, "global_step": 159614, "epoch": 1923} {"train_loss": -23.00693702697754, "global_step": 159615, "epoch": 1923} {"train_loss": -23.51091957092285, "global_step": 159616, "epoch": 1923} {"train_loss": -23.474369049072266, "global_step": 159617, "epoch": 1923} {"train_loss": -23.43233299255371, "global_step": 159618, "epoch": 1923} {"train_loss": -23.341201782226562, "global_step": 159619, "epoch": 1923} {"train_loss": -23.68782615661621, "global_step": 159620, "epoch": 1923} {"train_loss": -23.34046745300293, "global_step": 159621, "epoch": 1923} {"train_loss": -23.446882247924805, "global_step": 159622, "epoch": 1923} {"train_loss": -23.43878173828125, "global_step": 159623, "epoch": 1923} {"train_loss": -23.587644577026367, "global_step": 159624, "epoch": 1923} {"train_loss": -23.685216903686523, "global_step": 159625, "epoch": 1923} {"train_loss": -23.4884090423584, "global_step": 159626, "epoch": 1923} {"train_loss": -23.633962631225586, "global_step": 159627, "epoch": 1923} {"train_loss": -23.37925910949707, "global_step": 159628, "epoch": 1923} {"train_loss": -23.4039306640625, "global_step": 159629, "epoch": 1923} {"train_loss": -23.245620727539062, "global_step": 159630, "epoch": 1923} {"train_loss": -23.668476104736328, "global_step": 159631, "epoch": 1923} {"train_loss": -23.53061294555664, "global_step": 159632, "epoch": 1923} {"train_loss": -23.357622146606445, "global_step": 159633, "epoch": 1923} {"train_loss": -23.497804641723633, "global_step": 159634, "epoch": 1923} {"train_loss": -23.514799118041992, "global_step": 159635, "epoch": 1923} {"train_loss": -23.14115333557129, "global_step": 159636, "epoch": 1923} {"train_loss": -23.69948959350586, "global_step": 159637, "epoch": 1923} {"train_loss": -23.395496368408203, "global_step": 159638, "epoch": 1923} {"train_loss": -23.1058292388916, "global_step": 159639, "epoch": 1923} {"train_loss": -23.325885772705078, "global_step": 159640, "epoch": 1923} {"train_loss": -23.771316528320312, "global_step": 159641, "epoch": 1923} {"train_loss": -23.526039123535156, "global_step": 159642, "epoch": 1923} {"train_loss": -23.213285446166992, "global_step": 159643, "epoch": 1923} {"train_loss": -23.575336456298828, "global_step": 159644, "epoch": 1923} {"train_loss": -23.271909713745117, "global_step": 159645, "epoch": 1923} {"train_loss": -23.179840087890625, "global_step": 159646, "epoch": 1923} {"train_loss": -23.502307891845703, "global_step": 159647, "epoch": 1923} {"train_loss": -23.554624557495117, "global_step": 159648, "epoch": 1923} {"train_loss": -23.170337677001953, "global_step": 159649, "epoch": 1923} {"train_loss": -23.555545806884766, "global_step": 159650, "epoch": 1923} {"train_loss": -23.576663970947266, "global_step": 159651, "epoch": 1923} {"train_loss": -23.822765350341797, "global_step": 159652, "epoch": 1923} {"train_loss": -23.407546997070312, "global_step": 159653, "epoch": 1923} {"train_loss": -23.790842056274414, "global_step": 159654, "epoch": 1923} {"train_loss": -23.52657127380371, "global_step": 159655, "epoch": 1923} {"train_loss": -23.635517120361328, "global_step": 159656, "epoch": 1923} {"train_loss": -23.428203582763672, "global_step": 159657, "epoch": 1923} {"train_loss": -23.60881805419922, "global_step": 159658, "epoch": 1923} {"train_loss": -23.369474411010742, "global_step": 159659, "epoch": 1923} {"train_loss": -23.65096092224121, "global_step": 159660, "epoch": 1923} {"train_loss": -23.681135177612305, "global_step": 159661, "epoch": 1923} {"train_loss": -23.826353073120117, "global_step": 159662, "epoch": 1923} {"train_loss": -23.56781768798828, "global_step": 159663, "epoch": 1923} {"train_loss": -23.505395889282227, "global_step": 159664, "epoch": 1923} {"train_loss": -23.875722885131836, "global_step": 159665, "epoch": 1923} {"train_loss": -23.221527099609375, "global_step": 159666, "epoch": 1923} {"train_loss": -23.234668731689453, "global_step": 159667, "epoch": 1923} {"train_loss": -23.45287322998047, "global_step": 159668, "epoch": 1923} {"train_loss": -23.543134689331055, "global_step": 159669, "epoch": 1923} {"train_loss": -23.717975616455078, "global_step": 159670, "epoch": 1923} {"train_loss": -23.24518585205078, "global_step": 159671, "epoch": 1923} {"train_loss": -23.574121475219727, "global_step": 159672, "epoch": 1923} {"train_loss": -23.187021255493164, "global_step": 159673, "epoch": 1923} {"train_loss": -24.006132125854492, "global_step": 159674, "epoch": 1923} {"train_loss": -23.28177261352539, "global_step": 159675, "epoch": 1923} {"train_loss": -23.886554718017578, "global_step": 159676, "epoch": 1923} {"train_loss": -23.368938446044922, "global_step": 159677, "epoch": 1923} {"train_loss": -23.541038513183594, "global_step": 159678, "epoch": 1923} {"train_loss": -23.490869522094727, "global_step": 159679, "epoch": 1923} {"train_loss": -23.17974281311035, "global_step": 159680, "epoch": 1923} {"train_loss": -23.723407745361328, "global_step": 159681, "epoch": 1923} {"train_loss": -23.799936294555664, "global_step": 159682, "epoch": 1923} {"train_loss": -23.51726722717285, "global_step": 159683, "epoch": 1923} {"train_loss": -23.745752334594727, "global_step": 159684, "epoch": 1923} {"train_loss": -23.258010864257812, "global_step": 159685, "epoch": 1923} {"train_loss": -23.667757034301758, "global_step": 159686, "epoch": 1923} {"train_loss": -23.50040626525879, "global_step": 159687, "epoch": 1923} {"train_loss": -23.682605743408203, "global_step": 159688, "epoch": 1923} {"train_loss": -22.998018264770508, "global_step": 159689, "epoch": 1923} {"train_loss": -23.610977172851562, "global_step": 159690, "epoch": 1923} {"train_loss": -23.463093746139343, "global_step": 159691, "epoch": 1923, "val_loss": 6478447.5} {"train_loss": -23.330429077148438, "global_step": 159692, "epoch": 1924} {"train_loss": -22.747446060180664, "global_step": 159693, "epoch": 1924} {"train_loss": -23.305490493774414, "global_step": 159694, "epoch": 1924} {"train_loss": -23.289432525634766, "global_step": 159695, "epoch": 1924} {"train_loss": -23.549243927001953, "global_step": 159696, "epoch": 1924} {"train_loss": -23.159711837768555, "global_step": 159697, "epoch": 1924} {"train_loss": -23.390871047973633, "global_step": 159698, "epoch": 1924} {"train_loss": -23.330625534057617, "global_step": 159699, "epoch": 1924} {"train_loss": -23.3704891204834, "global_step": 159700, "epoch": 1924} {"train_loss": -23.326887130737305, "global_step": 159701, "epoch": 1924} {"train_loss": -23.506622314453125, "global_step": 159702, "epoch": 1924} {"train_loss": -23.277549743652344, "global_step": 159703, "epoch": 1924} {"train_loss": -23.178747177124023, "global_step": 159704, "epoch": 1924} {"train_loss": -23.547746658325195, "global_step": 159705, "epoch": 1924} {"train_loss": -22.657901763916016, "global_step": 159706, "epoch": 1924} {"train_loss": -22.945810317993164, "global_step": 159707, "epoch": 1924} {"train_loss": -23.6701717376709, "global_step": 159708, "epoch": 1924} {"train_loss": -22.973478317260742, "global_step": 159709, "epoch": 1924} {"train_loss": -23.288137435913086, "global_step": 159710, "epoch": 1924} {"train_loss": -23.297439575195312, "global_step": 159711, "epoch": 1924} {"train_loss": -23.929601669311523, "global_step": 159712, "epoch": 1924} {"train_loss": -23.350072860717773, "global_step": 159713, "epoch": 1924} {"train_loss": -23.27500343322754, "global_step": 159714, "epoch": 1924} {"train_loss": -23.332067489624023, "global_step": 159715, "epoch": 1924} {"train_loss": -23.768939971923828, "global_step": 159716, "epoch": 1924} {"train_loss": -23.383502960205078, "global_step": 159717, "epoch": 1924} {"train_loss": -23.497312545776367, "global_step": 159718, "epoch": 1924} {"train_loss": -23.29559326171875, "global_step": 159719, "epoch": 1924} {"train_loss": -23.48957633972168, "global_step": 159720, "epoch": 1924} {"train_loss": -23.432294845581055, "global_step": 159721, "epoch": 1924} {"train_loss": -23.835763931274414, "global_step": 159722, "epoch": 1924} {"train_loss": -23.58648681640625, "global_step": 159723, "epoch": 1924} {"train_loss": -23.730812072753906, "global_step": 159724, "epoch": 1924} {"train_loss": -23.05519676208496, "global_step": 159725, "epoch": 1924} {"train_loss": -23.530298233032227, "global_step": 159726, "epoch": 1924} {"train_loss": -23.315841674804688, "global_step": 159727, "epoch": 1924} {"train_loss": -23.64301109313965, "global_step": 159728, "epoch": 1924} {"train_loss": -23.488338470458984, "global_step": 159729, "epoch": 1924} {"train_loss": -23.234785079956055, "global_step": 159730, "epoch": 1924} {"train_loss": -23.279911041259766, "global_step": 159731, "epoch": 1924} {"train_loss": -23.35755729675293, "global_step": 159732, "epoch": 1924} {"train_loss": -23.515411376953125, "global_step": 159733, "epoch": 1924} {"train_loss": -23.498167037963867, "global_step": 159734, "epoch": 1924} {"train_loss": -23.483083724975586, "global_step": 159735, "epoch": 1924} {"train_loss": -23.347705841064453, "global_step": 159736, "epoch": 1924} {"train_loss": -23.325138092041016, "global_step": 159737, "epoch": 1924} {"train_loss": -23.592731475830078, "global_step": 159738, "epoch": 1924} {"train_loss": -23.384788513183594, "global_step": 159739, "epoch": 1924} {"train_loss": -23.345251083374023, "global_step": 159740, "epoch": 1924} {"train_loss": -23.80573844909668, "global_step": 159741, "epoch": 1924} {"train_loss": -23.552936553955078, "global_step": 159742, "epoch": 1924} {"train_loss": -23.55754852294922, "global_step": 159743, "epoch": 1924} {"train_loss": -23.5489559173584, "global_step": 159744, "epoch": 1924} {"train_loss": -23.329896926879883, "global_step": 159745, "epoch": 1924} {"train_loss": -23.391820907592773, "global_step": 159746, "epoch": 1924} {"train_loss": -23.502944946289062, "global_step": 159747, "epoch": 1924} {"train_loss": -23.399747848510742, "global_step": 159748, "epoch": 1924} {"train_loss": -23.59919548034668, "global_step": 159749, "epoch": 1924} {"train_loss": -23.280136108398438, "global_step": 159750, "epoch": 1924} {"train_loss": -23.46527671813965, "global_step": 159751, "epoch": 1924} {"train_loss": -23.268325805664062, "global_step": 159752, "epoch": 1924} {"train_loss": -23.328723907470703, "global_step": 159753, "epoch": 1924} {"train_loss": -23.439006805419922, "global_step": 159754, "epoch": 1924} {"train_loss": -23.23917579650879, "global_step": 159755, "epoch": 1924} {"train_loss": -23.486845016479492, "global_step": 159756, "epoch": 1924} {"train_loss": -23.67557716369629, "global_step": 159757, "epoch": 1924} {"train_loss": -23.458541870117188, "global_step": 159758, "epoch": 1924} {"train_loss": -23.67722511291504, "global_step": 159759, "epoch": 1924} {"train_loss": -23.136281967163086, "global_step": 159760, "epoch": 1924} {"train_loss": -23.491546630859375, "global_step": 159761, "epoch": 1924} {"train_loss": -23.6508846282959, "global_step": 159762, "epoch": 1924} {"train_loss": -23.4063777923584, "global_step": 159763, "epoch": 1924} {"train_loss": -23.307727813720703, "global_step": 159764, "epoch": 1924} {"train_loss": -23.337467193603516, "global_step": 159765, "epoch": 1924} {"train_loss": -23.845176696777344, "global_step": 159766, "epoch": 1924} {"train_loss": -23.567401885986328, "global_step": 159767, "epoch": 1924} {"train_loss": -23.736433029174805, "global_step": 159768, "epoch": 1924} {"train_loss": -23.376731872558594, "global_step": 159769, "epoch": 1924} {"train_loss": -23.62753677368164, "global_step": 159770, "epoch": 1924} {"train_loss": -23.760581970214844, "global_step": 159771, "epoch": 1924} {"train_loss": -23.432361602783203, "global_step": 159772, "epoch": 1924} {"train_loss": -23.628400802612305, "global_step": 159773, "epoch": 1924} {"train_loss": -23.42791904311582, "global_step": 159774, "epoch": 1924, "val_loss": 6391831.0} {"train_loss": -22.553884506225586, "global_step": 159775, "epoch": 1925} {"train_loss": -23.242496490478516, "global_step": 159776, "epoch": 1925} {"train_loss": -22.569711685180664, "global_step": 159777, "epoch": 1925} {"train_loss": -23.48261070251465, "global_step": 159778, "epoch": 1925} {"train_loss": -22.83784294128418, "global_step": 159779, "epoch": 1925} {"train_loss": -22.830114364624023, "global_step": 159780, "epoch": 1925} {"train_loss": -22.845535278320312, "global_step": 159781, "epoch": 1925} {"train_loss": -23.210067749023438, "global_step": 159782, "epoch": 1925} {"train_loss": -23.221220016479492, "global_step": 159783, "epoch": 1925} {"train_loss": -22.6203670501709, "global_step": 159784, "epoch": 1925} {"train_loss": -22.94040870666504, "global_step": 159785, "epoch": 1925} {"train_loss": -23.12074851989746, "global_step": 159786, "epoch": 1925} {"train_loss": -23.09501075744629, "global_step": 159787, "epoch": 1925} {"train_loss": -23.55419921875, "global_step": 159788, "epoch": 1925} {"train_loss": -22.84918212890625, "global_step": 159789, "epoch": 1925} {"train_loss": -23.31321144104004, "global_step": 159790, "epoch": 1925} {"train_loss": -22.94916534423828, "global_step": 159791, "epoch": 1925} {"train_loss": -23.418596267700195, "global_step": 159792, "epoch": 1925} {"train_loss": -23.580533981323242, "global_step": 159793, "epoch": 1925} {"train_loss": -23.608123779296875, "global_step": 159794, "epoch": 1925} {"train_loss": -23.020986557006836, "global_step": 159795, "epoch": 1925} {"train_loss": -23.117773056030273, "global_step": 159796, "epoch": 1925} {"train_loss": -23.10706901550293, "global_step": 159797, "epoch": 1925} {"train_loss": -23.43892478942871, "global_step": 159798, "epoch": 1925} {"train_loss": -23.37464141845703, "global_step": 159799, "epoch": 1925} {"train_loss": -23.338937759399414, "global_step": 159800, "epoch": 1925} {"train_loss": -23.521961212158203, "global_step": 159801, "epoch": 1925} {"train_loss": -23.3322696685791, "global_step": 159802, "epoch": 1925} {"train_loss": -23.35426139831543, "global_step": 159803, "epoch": 1925} {"train_loss": -23.35999870300293, "global_step": 159804, "epoch": 1925} {"train_loss": -23.249296188354492, "global_step": 159805, "epoch": 1925} {"train_loss": -23.31117820739746, "global_step": 159806, "epoch": 1925} {"train_loss": -23.418066024780273, "global_step": 159807, "epoch": 1925} {"train_loss": -23.279315948486328, "global_step": 159808, "epoch": 1925} {"train_loss": -23.679630279541016, "global_step": 159809, "epoch": 1925} {"train_loss": -23.264801025390625, "global_step": 159810, "epoch": 1925} {"train_loss": -23.47819709777832, "global_step": 159811, "epoch": 1925} {"train_loss": -23.868473052978516, "global_step": 159812, "epoch": 1925} {"train_loss": -23.6108455657959, "global_step": 159813, "epoch": 1925} {"train_loss": -23.486038208007812, "global_step": 159814, "epoch": 1925} {"train_loss": -23.315067291259766, "global_step": 159815, "epoch": 1925} {"train_loss": -23.388355255126953, "global_step": 159816, "epoch": 1925} {"train_loss": -23.287673950195312, "global_step": 159817, "epoch": 1925} {"train_loss": -23.204938888549805, "global_step": 159818, "epoch": 1925} {"train_loss": -23.259605407714844, "global_step": 159819, "epoch": 1925} {"train_loss": -23.15884780883789, "global_step": 159820, "epoch": 1925} {"train_loss": -23.721586227416992, "global_step": 159821, "epoch": 1925} {"train_loss": -23.544418334960938, "global_step": 159822, "epoch": 1925} {"train_loss": -23.68906021118164, "global_step": 159823, "epoch": 1925} {"train_loss": -23.523681640625, "global_step": 159824, "epoch": 1925} {"train_loss": -23.3488826751709, "global_step": 159825, "epoch": 1925} {"train_loss": -23.49380874633789, "global_step": 159826, "epoch": 1925} {"train_loss": -23.492250442504883, "global_step": 159827, "epoch": 1925} {"train_loss": -23.1690616607666, "global_step": 159828, "epoch": 1925} {"train_loss": -23.525394439697266, "global_step": 159829, "epoch": 1925} {"train_loss": -23.65212059020996, "global_step": 159830, "epoch": 1925} {"train_loss": -23.35157585144043, "global_step": 159831, "epoch": 1925} {"train_loss": -23.490482330322266, "global_step": 159832, "epoch": 1925} {"train_loss": -23.257062911987305, "global_step": 159833, "epoch": 1925} {"train_loss": -23.677776336669922, "global_step": 159834, "epoch": 1925} {"train_loss": -23.157541275024414, "global_step": 159835, "epoch": 1925} {"train_loss": -23.4991455078125, "global_step": 159836, "epoch": 1925} {"train_loss": -23.2808780670166, "global_step": 159837, "epoch": 1925} {"train_loss": -23.28715705871582, "global_step": 159838, "epoch": 1925} {"train_loss": -23.437698364257812, "global_step": 159839, "epoch": 1925} {"train_loss": -23.4091739654541, "global_step": 159840, "epoch": 1925} {"train_loss": -23.261829376220703, "global_step": 159841, "epoch": 1925} {"train_loss": -23.193477630615234, "global_step": 159842, "epoch": 1925} {"train_loss": -23.03189468383789, "global_step": 159843, "epoch": 1925} {"train_loss": -23.302030563354492, "global_step": 159844, "epoch": 1925} {"train_loss": -23.472801208496094, "global_step": 159845, "epoch": 1925} {"train_loss": -23.194555282592773, "global_step": 159846, "epoch": 1925} {"train_loss": -23.275009155273438, "global_step": 159847, "epoch": 1925} {"train_loss": -23.175884246826172, "global_step": 159848, "epoch": 1925} {"train_loss": -23.47321128845215, "global_step": 159849, "epoch": 1925} {"train_loss": -23.09904670715332, "global_step": 159850, "epoch": 1925} {"train_loss": -23.24452018737793, "global_step": 159851, "epoch": 1925} {"train_loss": -23.380399703979492, "global_step": 159852, "epoch": 1925} {"train_loss": -23.246686935424805, "global_step": 159853, "epoch": 1925} {"train_loss": -23.230819702148438, "global_step": 159854, "epoch": 1925} {"train_loss": -22.70888328552246, "global_step": 159855, "epoch": 1925} {"train_loss": -23.541183471679688, "global_step": 159856, "epoch": 1925} {"train_loss": -23.29543095324413, "global_step": 159857, "epoch": 1925, "val_loss": 6321055.0} {"train_loss": -22.588815689086914, "global_step": 159858, "epoch": 1926} {"train_loss": -23.007427215576172, "global_step": 159859, "epoch": 1926} {"train_loss": -23.215850830078125, "global_step": 159860, "epoch": 1926} {"train_loss": -23.10077476501465, "global_step": 159861, "epoch": 1926} {"train_loss": -22.866065979003906, "global_step": 159862, "epoch": 1926} {"train_loss": -23.19544792175293, "global_step": 159863, "epoch": 1926} {"train_loss": -22.937864303588867, "global_step": 159864, "epoch": 1926} {"train_loss": -23.10874366760254, "global_step": 159865, "epoch": 1926} {"train_loss": -23.406787872314453, "global_step": 159866, "epoch": 1926} {"train_loss": -23.26564598083496, "global_step": 159867, "epoch": 1926} {"train_loss": -23.351913452148438, "global_step": 159868, "epoch": 1926} {"train_loss": -23.391403198242188, "global_step": 159869, "epoch": 1926} {"train_loss": -23.172941207885742, "global_step": 159870, "epoch": 1926} {"train_loss": -23.312170028686523, "global_step": 159871, "epoch": 1926} {"train_loss": -23.626741409301758, "global_step": 159872, "epoch": 1926} {"train_loss": -23.57906723022461, "global_step": 159873, "epoch": 1926} {"train_loss": -23.4116268157959, "global_step": 159874, "epoch": 1926} {"train_loss": -23.258451461791992, "global_step": 159875, "epoch": 1926} {"train_loss": -23.32750701904297, "global_step": 159876, "epoch": 1926} {"train_loss": -23.764097213745117, "global_step": 159877, "epoch": 1926} {"train_loss": -23.518495559692383, "global_step": 159878, "epoch": 1926} {"train_loss": -23.545358657836914, "global_step": 159879, "epoch": 1926} {"train_loss": -23.610673904418945, "global_step": 159880, "epoch": 1926} {"train_loss": -23.594579696655273, "global_step": 159881, "epoch": 1926} {"train_loss": -23.436168670654297, "global_step": 159882, "epoch": 1926} {"train_loss": -23.454692840576172, "global_step": 159883, "epoch": 1926} {"train_loss": -23.57927894592285, "global_step": 159884, "epoch": 1926} {"train_loss": -23.805688858032227, "global_step": 159885, "epoch": 1926} {"train_loss": -23.935026168823242, "global_step": 159886, "epoch": 1926} {"train_loss": -23.87918472290039, "global_step": 159887, "epoch": 1926} {"train_loss": -23.80592155456543, "global_step": 159888, "epoch": 1926} {"train_loss": -23.608978271484375, "global_step": 159889, "epoch": 1926} {"train_loss": -23.255741119384766, "global_step": 159890, "epoch": 1926} {"train_loss": -23.511579513549805, "global_step": 159891, "epoch": 1926} {"train_loss": -23.359622955322266, "global_step": 159892, "epoch": 1926} {"train_loss": -23.35783576965332, "global_step": 159893, "epoch": 1926} {"train_loss": -23.798816680908203, "global_step": 159894, "epoch": 1926} {"train_loss": -23.35470199584961, "global_step": 159895, "epoch": 1926} {"train_loss": -23.28960609436035, "global_step": 159896, "epoch": 1926} {"train_loss": -23.4102840423584, "global_step": 159897, "epoch": 1926} {"train_loss": -23.017711639404297, "global_step": 159898, "epoch": 1926} {"train_loss": -22.913408279418945, "global_step": 159899, "epoch": 1926} {"train_loss": -23.26639175415039, "global_step": 159900, "epoch": 1926} {"train_loss": -23.557828903198242, "global_step": 159901, "epoch": 1926} {"train_loss": -23.424707412719727, "global_step": 159902, "epoch": 1926} {"train_loss": -23.80033302307129, "global_step": 159903, "epoch": 1926} {"train_loss": -23.406097412109375, "global_step": 159904, "epoch": 1926} {"train_loss": -23.263940811157227, "global_step": 159905, "epoch": 1926} {"train_loss": -23.23907470703125, "global_step": 159906, "epoch": 1926} {"train_loss": -23.419246673583984, "global_step": 159907, "epoch": 1926} {"train_loss": -23.674619674682617, "global_step": 159908, "epoch": 1926} {"train_loss": -23.341190338134766, "global_step": 159909, "epoch": 1926} {"train_loss": -23.629871368408203, "global_step": 159910, "epoch": 1926} {"train_loss": -23.792896270751953, "global_step": 159911, "epoch": 1926} {"train_loss": -23.40102195739746, "global_step": 159912, "epoch": 1926} {"train_loss": -23.44965934753418, "global_step": 159913, "epoch": 1926} {"train_loss": -23.545856475830078, "global_step": 159914, "epoch": 1926} {"train_loss": -23.577512741088867, "global_step": 159915, "epoch": 1926} {"train_loss": -23.764814376831055, "global_step": 159916, "epoch": 1926} {"train_loss": -23.54642677307129, "global_step": 159917, "epoch": 1926} {"train_loss": -23.540075302124023, "global_step": 159918, "epoch": 1926} {"train_loss": -23.534574508666992, "global_step": 159919, "epoch": 1926} {"train_loss": -23.414121627807617, "global_step": 159920, "epoch": 1926} {"train_loss": -23.691055297851562, "global_step": 159921, "epoch": 1926} {"train_loss": -23.645917892456055, "global_step": 159922, "epoch": 1926} {"train_loss": -23.66351318359375, "global_step": 159923, "epoch": 1926} {"train_loss": -23.43218231201172, "global_step": 159924, "epoch": 1926} {"train_loss": -23.467315673828125, "global_step": 159925, "epoch": 1926} {"train_loss": -23.131200790405273, "global_step": 159926, "epoch": 1926} {"train_loss": -23.36241912841797, "global_step": 159927, "epoch": 1926} {"train_loss": -23.269968032836914, "global_step": 159928, "epoch": 1926} {"train_loss": -23.64668846130371, "global_step": 159929, "epoch": 1926} {"train_loss": -23.303251266479492, "global_step": 159930, "epoch": 1926} {"train_loss": -23.377120971679688, "global_step": 159931, "epoch": 1926} {"train_loss": -23.55188751220703, "global_step": 159932, "epoch": 1926} {"train_loss": -23.28689956665039, "global_step": 159933, "epoch": 1926} {"train_loss": -23.062620162963867, "global_step": 159934, "epoch": 1926} {"train_loss": -23.61004066467285, "global_step": 159935, "epoch": 1926} {"train_loss": -23.83292007446289, "global_step": 159936, "epoch": 1926} {"train_loss": -23.309179306030273, "global_step": 159937, "epoch": 1926} {"train_loss": -23.585233688354492, "global_step": 159938, "epoch": 1926} {"train_loss": -23.562856674194336, "global_step": 159939, "epoch": 1926} {"train_loss": -23.440891817391638, "global_step": 159940, "epoch": 1926, "val_loss": 6501778.0} {"train_loss": -22.829442977905273, "global_step": 159941, "epoch": 1927} {"train_loss": -23.250158309936523, "global_step": 159942, "epoch": 1927} {"train_loss": -23.322202682495117, "global_step": 159943, "epoch": 1927} {"train_loss": -23.575042724609375, "global_step": 159944, "epoch": 1927} {"train_loss": -23.048063278198242, "global_step": 159945, "epoch": 1927} {"train_loss": -23.427677154541016, "global_step": 159946, "epoch": 1927} {"train_loss": -23.016212463378906, "global_step": 159947, "epoch": 1927} {"train_loss": -23.14198875427246, "global_step": 159948, "epoch": 1927} {"train_loss": -23.291587829589844, "global_step": 159949, "epoch": 1927} {"train_loss": -23.306955337524414, "global_step": 159950, "epoch": 1927} {"train_loss": -23.85011863708496, "global_step": 159951, "epoch": 1927} {"train_loss": -23.161457061767578, "global_step": 159952, "epoch": 1927} {"train_loss": -23.290990829467773, "global_step": 159953, "epoch": 1927} {"train_loss": -23.71138572692871, "global_step": 159954, "epoch": 1927} {"train_loss": -23.464771270751953, "global_step": 159955, "epoch": 1927} {"train_loss": -23.523006439208984, "global_step": 159956, "epoch": 1927} {"train_loss": -23.40048599243164, "global_step": 159957, "epoch": 1927} {"train_loss": -23.57501220703125, "global_step": 159958, "epoch": 1927} {"train_loss": -23.247970581054688, "global_step": 159959, "epoch": 1927} {"train_loss": -23.669513702392578, "global_step": 159960, "epoch": 1927} {"train_loss": -23.240169525146484, "global_step": 159961, "epoch": 1927} {"train_loss": -23.559234619140625, "global_step": 159962, "epoch": 1927} {"train_loss": -23.464860916137695, "global_step": 159963, "epoch": 1927} {"train_loss": -23.333894729614258, "global_step": 159964, "epoch": 1927} {"train_loss": -23.458541870117188, "global_step": 159965, "epoch": 1927} {"train_loss": -23.348257064819336, "global_step": 159966, "epoch": 1927} {"train_loss": -23.721349716186523, "global_step": 159967, "epoch": 1927} {"train_loss": -23.056055068969727, "global_step": 159968, "epoch": 1927} {"train_loss": -23.08478355407715, "global_step": 159969, "epoch": 1927} {"train_loss": -23.470556259155273, "global_step": 159970, "epoch": 1927} {"train_loss": -23.534910202026367, "global_step": 159971, "epoch": 1927} {"train_loss": -23.427885055541992, "global_step": 159972, "epoch": 1927} {"train_loss": -23.726394653320312, "global_step": 159973, "epoch": 1927} {"train_loss": -23.518564224243164, "global_step": 159974, "epoch": 1927} {"train_loss": -23.584836959838867, "global_step": 159975, "epoch": 1927} {"train_loss": -23.814537048339844, "global_step": 159976, "epoch": 1927} {"train_loss": -23.759187698364258, "global_step": 159977, "epoch": 1927} {"train_loss": -23.580270767211914, "global_step": 159978, "epoch": 1927} {"train_loss": -23.682992935180664, "global_step": 159979, "epoch": 1927} {"train_loss": -23.656763076782227, "global_step": 159980, "epoch": 1927} {"train_loss": -23.419052124023438, "global_step": 159981, "epoch": 1927} {"train_loss": -23.491910934448242, "global_step": 159982, "epoch": 1927} {"train_loss": -23.71268653869629, "global_step": 159983, "epoch": 1927} {"train_loss": -23.579496383666992, "global_step": 159984, "epoch": 1927} {"train_loss": -23.349864959716797, "global_step": 159985, "epoch": 1927} {"train_loss": -23.667978286743164, "global_step": 159986, "epoch": 1927} {"train_loss": -23.55622673034668, "global_step": 159987, "epoch": 1927} {"train_loss": -23.51893424987793, "global_step": 159988, "epoch": 1927} {"train_loss": -23.562536239624023, "global_step": 159989, "epoch": 1927} {"train_loss": -23.452558517456055, "global_step": 159990, "epoch": 1927} {"train_loss": -23.533220291137695, "global_step": 159991, "epoch": 1927} {"train_loss": -23.21178436279297, "global_step": 159992, "epoch": 1927} {"train_loss": -23.467519760131836, "global_step": 159993, "epoch": 1927} {"train_loss": -23.538671493530273, "global_step": 159994, "epoch": 1927} {"train_loss": -23.56373405456543, "global_step": 159995, "epoch": 1927} {"train_loss": -23.54150390625, "global_step": 159996, "epoch": 1927} {"train_loss": -23.225805282592773, "global_step": 159997, "epoch": 1927} {"train_loss": -23.529325485229492, "global_step": 159998, "epoch": 1927} {"train_loss": -23.445802688598633, "global_step": 159999, "epoch": 1927} {"train_loss": -23.062667846679688, "global_step": 160000, "epoch": 1927} {"train_loss": -23.718021392822266, "global_step": 160001, "epoch": 1927} {"train_loss": -23.52849006652832, "global_step": 160002, "epoch": 1927} {"train_loss": -23.362539291381836, "global_step": 160003, "epoch": 1927} {"train_loss": -23.47785758972168, "global_step": 160004, "epoch": 1927} {"train_loss": -23.67268943786621, "global_step": 160005, "epoch": 1927} {"train_loss": -23.53841209411621, "global_step": 160006, "epoch": 1927} {"train_loss": -23.998136520385742, "global_step": 160007, "epoch": 1927} {"train_loss": -23.51727867126465, "global_step": 160008, "epoch": 1927} {"train_loss": -23.72056770324707, "global_step": 160009, "epoch": 1927} {"train_loss": -23.767160415649414, "global_step": 160010, "epoch": 1927} {"train_loss": -23.363590240478516, "global_step": 160011, "epoch": 1927} {"train_loss": -23.421161651611328, "global_step": 160012, "epoch": 1927} {"train_loss": -23.714841842651367, "global_step": 160013, "epoch": 1927} {"train_loss": -23.818593978881836, "global_step": 160014, "epoch": 1927} {"train_loss": -23.490392684936523, "global_step": 160015, "epoch": 1927} {"train_loss": -23.502588272094727, "global_step": 160016, "epoch": 1927} {"train_loss": -23.959331512451172, "global_step": 160017, "epoch": 1927} {"train_loss": -23.581953048706055, "global_step": 160018, "epoch": 1927} {"train_loss": -23.229068756103516, "global_step": 160019, "epoch": 1927} {"train_loss": -23.815418243408203, "global_step": 160020, "epoch": 1927} {"train_loss": -23.315811157226562, "global_step": 160021, "epoch": 1927} {"train_loss": -23.45191764831543, "global_step": 160022, "epoch": 1927} {"train_loss": -23.493397517376636, "global_step": 160023, "epoch": 1927, "val_loss": 6331875.0} {"train_loss": -21.449140548706055, "global_step": 160024, "epoch": 1928} {"train_loss": -20.967060089111328, "global_step": 160025, "epoch": 1928} {"train_loss": -21.598970413208008, "global_step": 160026, "epoch": 1928} {"train_loss": -22.446979522705078, "global_step": 160027, "epoch": 1928} {"train_loss": -21.407976150512695, "global_step": 160028, "epoch": 1928} {"train_loss": -22.525842666625977, "global_step": 160029, "epoch": 1928} {"train_loss": -21.85247039794922, "global_step": 160030, "epoch": 1928} {"train_loss": -22.489288330078125, "global_step": 160031, "epoch": 1928} {"train_loss": -22.573476791381836, "global_step": 160032, "epoch": 1928} {"train_loss": -22.728715896606445, "global_step": 160033, "epoch": 1928} {"train_loss": -22.422080993652344, "global_step": 160034, "epoch": 1928} {"train_loss": -22.793825149536133, "global_step": 160035, "epoch": 1928} {"train_loss": -22.09878921508789, "global_step": 160036, "epoch": 1928} {"train_loss": -22.471662521362305, "global_step": 160037, "epoch": 1928} {"train_loss": -22.580827713012695, "global_step": 160038, "epoch": 1928} {"train_loss": -22.3575382232666, "global_step": 160039, "epoch": 1928} {"train_loss": -22.824758529663086, "global_step": 160040, "epoch": 1928} {"train_loss": -22.89613914489746, "global_step": 160041, "epoch": 1928} {"train_loss": -22.79376792907715, "global_step": 160042, "epoch": 1928} {"train_loss": -22.4322566986084, "global_step": 160043, "epoch": 1928} {"train_loss": -22.836549758911133, "global_step": 160044, "epoch": 1928} {"train_loss": -22.937917709350586, "global_step": 160045, "epoch": 1928} {"train_loss": -22.80680274963379, "global_step": 160046, "epoch": 1928} {"train_loss": -23.247859954833984, "global_step": 160047, "epoch": 1928} {"train_loss": -23.306251525878906, "global_step": 160048, "epoch": 1928} {"train_loss": -23.153499603271484, "global_step": 160049, "epoch": 1928} {"train_loss": -23.463041305541992, "global_step": 160050, "epoch": 1928} {"train_loss": -23.345632553100586, "global_step": 160051, "epoch": 1928} {"train_loss": -23.34657096862793, "global_step": 160052, "epoch": 1928} {"train_loss": -23.147558212280273, "global_step": 160053, "epoch": 1928} {"train_loss": -23.457950592041016, "global_step": 160054, "epoch": 1928} {"train_loss": -23.25555992126465, "global_step": 160055, "epoch": 1928} {"train_loss": -23.489181518554688, "global_step": 160056, "epoch": 1928} {"train_loss": -23.459627151489258, "global_step": 160057, "epoch": 1928} {"train_loss": -23.154800415039062, "global_step": 160058, "epoch": 1928} {"train_loss": -23.220922470092773, "global_step": 160059, "epoch": 1928} {"train_loss": -23.154809951782227, "global_step": 160060, "epoch": 1928} {"train_loss": -23.59597396850586, "global_step": 160061, "epoch": 1928} {"train_loss": -23.4315185546875, "global_step": 160062, "epoch": 1928} {"train_loss": -23.42569351196289, "global_step": 160063, "epoch": 1928} {"train_loss": -23.299436569213867, "global_step": 160064, "epoch": 1928} {"train_loss": -23.392820358276367, "global_step": 160065, "epoch": 1928} {"train_loss": -23.425128936767578, "global_step": 160066, "epoch": 1928} {"train_loss": -23.33784294128418, "global_step": 160067, "epoch": 1928} {"train_loss": -23.222549438476562, "global_step": 160068, "epoch": 1928} {"train_loss": -23.545331954956055, "global_step": 160069, "epoch": 1928} {"train_loss": -23.4088191986084, "global_step": 160070, "epoch": 1928} {"train_loss": -22.968955993652344, "global_step": 160071, "epoch": 1928} {"train_loss": -23.31870460510254, "global_step": 160072, "epoch": 1928} {"train_loss": -23.546445846557617, "global_step": 160073, "epoch": 1928} {"train_loss": -23.808103561401367, "global_step": 160074, "epoch": 1928} {"train_loss": -23.532032012939453, "global_step": 160075, "epoch": 1928} {"train_loss": -23.542156219482422, "global_step": 160076, "epoch": 1928} {"train_loss": -23.7865047454834, "global_step": 160077, "epoch": 1928} {"train_loss": -23.78364372253418, "global_step": 160078, "epoch": 1928} {"train_loss": -23.781972885131836, "global_step": 160079, "epoch": 1928} {"train_loss": -23.5592098236084, "global_step": 160080, "epoch": 1928} {"train_loss": -23.50164794921875, "global_step": 160081, "epoch": 1928} {"train_loss": -23.393320083618164, "global_step": 160082, "epoch": 1928} {"train_loss": -23.36441993713379, "global_step": 160083, "epoch": 1928} {"train_loss": -23.62934684753418, "global_step": 160084, "epoch": 1928} {"train_loss": -23.669347763061523, "global_step": 160085, "epoch": 1928} {"train_loss": -23.782278060913086, "global_step": 160086, "epoch": 1928} {"train_loss": -23.443161010742188, "global_step": 160087, "epoch": 1928} {"train_loss": -23.783401489257812, "global_step": 160088, "epoch": 1928} {"train_loss": -23.73341178894043, "global_step": 160089, "epoch": 1928} {"train_loss": -23.895681381225586, "global_step": 160090, "epoch": 1928} {"train_loss": -23.79326629638672, "global_step": 160091, "epoch": 1928} {"train_loss": -23.540733337402344, "global_step": 160092, "epoch": 1928} {"train_loss": -23.654077529907227, "global_step": 160093, "epoch": 1928} {"train_loss": -23.75298309326172, "global_step": 160094, "epoch": 1928} {"train_loss": -23.342090606689453, "global_step": 160095, "epoch": 1928} {"train_loss": -23.449506759643555, "global_step": 160096, "epoch": 1928} {"train_loss": -23.340551376342773, "global_step": 160097, "epoch": 1928} {"train_loss": -23.28499412536621, "global_step": 160098, "epoch": 1928} {"train_loss": -23.45157814025879, "global_step": 160099, "epoch": 1928} {"train_loss": -23.51521873474121, "global_step": 160100, "epoch": 1928} {"train_loss": -23.626312255859375, "global_step": 160101, "epoch": 1928} {"train_loss": -23.165313720703125, "global_step": 160102, "epoch": 1928} {"train_loss": -23.606243133544922, "global_step": 160103, "epoch": 1928} {"train_loss": -23.629209518432617, "global_step": 160104, "epoch": 1928} {"train_loss": -23.769468307495117, "global_step": 160105, "epoch": 1928} {"train_loss": -23.171829131712396, "global_step": 160106, "epoch": 1928, "val_loss": 6307636.0} {"train_loss": -22.838520050048828, "global_step": 160107, "epoch": 1929} {"train_loss": -22.735843658447266, "global_step": 160108, "epoch": 1929} {"train_loss": -22.780241012573242, "global_step": 160109, "epoch": 1929} {"train_loss": -23.01957130432129, "global_step": 160110, "epoch": 1929} {"train_loss": -22.75010108947754, "global_step": 160111, "epoch": 1929} {"train_loss": -22.939468383789062, "global_step": 160112, "epoch": 1929} {"train_loss": -23.148067474365234, "global_step": 160113, "epoch": 1929} {"train_loss": -23.356332778930664, "global_step": 160114, "epoch": 1929} {"train_loss": -23.27420997619629, "global_step": 160115, "epoch": 1929} {"train_loss": -23.135072708129883, "global_step": 160116, "epoch": 1929} {"train_loss": -22.995208740234375, "global_step": 160117, "epoch": 1929} {"train_loss": -23.13408851623535, "global_step": 160118, "epoch": 1929} {"train_loss": -23.16357421875, "global_step": 160119, "epoch": 1929} {"train_loss": -23.35579490661621, "global_step": 160120, "epoch": 1929} {"train_loss": -23.243520736694336, "global_step": 160121, "epoch": 1929} {"train_loss": -22.94414710998535, "global_step": 160122, "epoch": 1929} {"train_loss": -23.31067657470703, "global_step": 160123, "epoch": 1929} {"train_loss": -23.532499313354492, "global_step": 160124, "epoch": 1929} {"train_loss": -23.30234718322754, "global_step": 160125, "epoch": 1929} {"train_loss": -23.108129501342773, "global_step": 160126, "epoch": 1929} {"train_loss": -23.098865509033203, "global_step": 160127, "epoch": 1929} {"train_loss": -23.5841121673584, "global_step": 160128, "epoch": 1929} {"train_loss": -23.136367797851562, "global_step": 160129, "epoch": 1929} {"train_loss": -23.201101303100586, "global_step": 160130, "epoch": 1929} {"train_loss": -23.521160125732422, "global_step": 160131, "epoch": 1929} {"train_loss": -23.339994430541992, "global_step": 160132, "epoch": 1929} {"train_loss": -23.137922286987305, "global_step": 160133, "epoch": 1929} {"train_loss": -23.448041915893555, "global_step": 160134, "epoch": 1929} {"train_loss": -23.54630470275879, "global_step": 160135, "epoch": 1929} {"train_loss": -23.04353904724121, "global_step": 160136, "epoch": 1929} {"train_loss": -23.434616088867188, "global_step": 160137, "epoch": 1929} {"train_loss": -23.19156837463379, "global_step": 160138, "epoch": 1929} {"train_loss": -23.433265686035156, "global_step": 160139, "epoch": 1929} {"train_loss": -23.702810287475586, "global_step": 160140, "epoch": 1929} {"train_loss": -23.116596221923828, "global_step": 160141, "epoch": 1929} {"train_loss": -23.524892807006836, "global_step": 160142, "epoch": 1929} {"train_loss": -23.25113868713379, "global_step": 160143, "epoch": 1929} {"train_loss": -23.43027114868164, "global_step": 160144, "epoch": 1929} {"train_loss": -23.6951847076416, "global_step": 160145, "epoch": 1929} {"train_loss": -23.89420509338379, "global_step": 160146, "epoch": 1929} {"train_loss": -23.360034942626953, "global_step": 160147, "epoch": 1929} {"train_loss": -23.562414169311523, "global_step": 160148, "epoch": 1929} {"train_loss": -23.171367645263672, "global_step": 160149, "epoch": 1929} {"train_loss": -23.480152130126953, "global_step": 160150, "epoch": 1929} {"train_loss": -23.60213279724121, "global_step": 160151, "epoch": 1929} {"train_loss": -23.436429977416992, "global_step": 160152, "epoch": 1929} {"train_loss": -23.28131103515625, "global_step": 160153, "epoch": 1929} {"train_loss": -23.559999465942383, "global_step": 160154, "epoch": 1929} {"train_loss": -23.804738998413086, "global_step": 160155, "epoch": 1929} {"train_loss": -23.36019515991211, "global_step": 160156, "epoch": 1929} {"train_loss": -23.266414642333984, "global_step": 160157, "epoch": 1929} {"train_loss": -23.507450103759766, "global_step": 160158, "epoch": 1929} {"train_loss": -23.633779525756836, "global_step": 160159, "epoch": 1929} {"train_loss": -23.340375900268555, "global_step": 160160, "epoch": 1929} {"train_loss": -23.113737106323242, "global_step": 160161, "epoch": 1929} {"train_loss": -22.978900909423828, "global_step": 160162, "epoch": 1929} {"train_loss": -23.23855972290039, "global_step": 160163, "epoch": 1929} {"train_loss": -23.30915641784668, "global_step": 160164, "epoch": 1929} {"train_loss": -23.441694259643555, "global_step": 160165, "epoch": 1929} {"train_loss": -23.3192138671875, "global_step": 160166, "epoch": 1929} {"train_loss": -23.773258209228516, "global_step": 160167, "epoch": 1929} {"train_loss": -23.453237533569336, "global_step": 160168, "epoch": 1929} {"train_loss": -23.322656631469727, "global_step": 160169, "epoch": 1929} {"train_loss": -23.107534408569336, "global_step": 160170, "epoch": 1929} {"train_loss": -23.452611923217773, "global_step": 160171, "epoch": 1929} {"train_loss": -23.31599998474121, "global_step": 160172, "epoch": 1929} {"train_loss": -23.56854820251465, "global_step": 160173, "epoch": 1929} {"train_loss": -23.9224910736084, "global_step": 160174, "epoch": 1929} {"train_loss": -23.630430221557617, "global_step": 160175, "epoch": 1929} {"train_loss": -23.443557739257812, "global_step": 160176, "epoch": 1929} {"train_loss": -23.584321975708008, "global_step": 160177, "epoch": 1929} {"train_loss": -23.688751220703125, "global_step": 160178, "epoch": 1929} {"train_loss": -23.40558433532715, "global_step": 160179, "epoch": 1929} {"train_loss": -23.661609649658203, "global_step": 160180, "epoch": 1929} {"train_loss": -23.22110939025879, "global_step": 160181, "epoch": 1929} {"train_loss": -23.763748168945312, "global_step": 160182, "epoch": 1929} {"train_loss": -23.50106430053711, "global_step": 160183, "epoch": 1929} {"train_loss": -23.55156707763672, "global_step": 160184, "epoch": 1929} {"train_loss": -23.857694625854492, "global_step": 160185, "epoch": 1929} {"train_loss": -23.511856079101562, "global_step": 160186, "epoch": 1929} {"train_loss": -23.43556785583496, "global_step": 160187, "epoch": 1929} {"train_loss": -23.468259811401367, "global_step": 160188, "epoch": 1929} {"train_loss": -23.355523006025567, "global_step": 160189, "epoch": 1929, "val_loss": 6406992.0} {"train_loss": -23.030426025390625, "global_step": 160190, "epoch": 1930} {"train_loss": -23.470947265625, "global_step": 160191, "epoch": 1930} {"train_loss": -23.203245162963867, "global_step": 160192, "epoch": 1930} {"train_loss": -22.94615364074707, "global_step": 160193, "epoch": 1930} {"train_loss": -23.09775161743164, "global_step": 160194, "epoch": 1930} {"train_loss": -23.212921142578125, "global_step": 160195, "epoch": 1930} {"train_loss": -22.535297393798828, "global_step": 160196, "epoch": 1930} {"train_loss": -22.866779327392578, "global_step": 160197, "epoch": 1930} {"train_loss": -22.878210067749023, "global_step": 160198, "epoch": 1930} {"train_loss": -23.227895736694336, "global_step": 160199, "epoch": 1930} {"train_loss": -22.631534576416016, "global_step": 160200, "epoch": 1930} {"train_loss": -23.1718807220459, "global_step": 160201, "epoch": 1930} {"train_loss": -23.109811782836914, "global_step": 160202, "epoch": 1930} {"train_loss": -23.597721099853516, "global_step": 160203, "epoch": 1930} {"train_loss": -23.157041549682617, "global_step": 160204, "epoch": 1930} {"train_loss": -23.39067840576172, "global_step": 160205, "epoch": 1930} {"train_loss": -23.69148063659668, "global_step": 160206, "epoch": 1930} {"train_loss": -23.158218383789062, "global_step": 160207, "epoch": 1930} {"train_loss": -23.49875259399414, "global_step": 160208, "epoch": 1930} {"train_loss": -23.22620964050293, "global_step": 160209, "epoch": 1930} {"train_loss": -23.535009384155273, "global_step": 160210, "epoch": 1930} {"train_loss": -23.083988189697266, "global_step": 160211, "epoch": 1930} {"train_loss": -23.558645248413086, "global_step": 160212, "epoch": 1930} {"train_loss": -23.439695358276367, "global_step": 160213, "epoch": 1930} {"train_loss": -23.424421310424805, "global_step": 160214, "epoch": 1930} {"train_loss": -23.286636352539062, "global_step": 160215, "epoch": 1930} {"train_loss": -23.491565704345703, "global_step": 160216, "epoch": 1930} {"train_loss": -23.714250564575195, "global_step": 160217, "epoch": 1930} {"train_loss": -23.519254684448242, "global_step": 160218, "epoch": 1930} {"train_loss": -23.580961227416992, "global_step": 160219, "epoch": 1930} {"train_loss": -23.78290367126465, "global_step": 160220, "epoch": 1930} {"train_loss": -23.289106369018555, "global_step": 160221, "epoch": 1930} {"train_loss": -23.596532821655273, "global_step": 160222, "epoch": 1930} {"train_loss": -23.42547607421875, "global_step": 160223, "epoch": 1930} {"train_loss": -23.751569747924805, "global_step": 160224, "epoch": 1930} {"train_loss": -23.20387840270996, "global_step": 160225, "epoch": 1930} {"train_loss": -23.66876792907715, "global_step": 160226, "epoch": 1930} {"train_loss": -23.33199119567871, "global_step": 160227, "epoch": 1930} {"train_loss": -23.43733024597168, "global_step": 160228, "epoch": 1930} {"train_loss": -23.423818588256836, "global_step": 160229, "epoch": 1930} {"train_loss": -23.67786979675293, "global_step": 160230, "epoch": 1930} {"train_loss": -23.238927841186523, "global_step": 160231, "epoch": 1930} {"train_loss": -23.208375930786133, "global_step": 160232, "epoch": 1930} {"train_loss": -23.427627563476562, "global_step": 160233, "epoch": 1930} {"train_loss": -23.565317153930664, "global_step": 160234, "epoch": 1930} {"train_loss": -23.6485652923584, "global_step": 160235, "epoch": 1930} {"train_loss": -23.00837516784668, "global_step": 160236, "epoch": 1930} {"train_loss": -23.631832122802734, "global_step": 160237, "epoch": 1930} {"train_loss": -23.617462158203125, "global_step": 160238, "epoch": 1930} {"train_loss": -23.612449645996094, "global_step": 160239, "epoch": 1930} {"train_loss": -23.107038497924805, "global_step": 160240, "epoch": 1930} {"train_loss": -23.74675941467285, "global_step": 160241, "epoch": 1930} {"train_loss": -23.644685745239258, "global_step": 160242, "epoch": 1930} {"train_loss": -23.522737503051758, "global_step": 160243, "epoch": 1930} {"train_loss": -23.501144409179688, "global_step": 160244, "epoch": 1930} {"train_loss": -23.537771224975586, "global_step": 160245, "epoch": 1930} {"train_loss": -23.18931007385254, "global_step": 160246, "epoch": 1930} {"train_loss": -23.53313636779785, "global_step": 160247, "epoch": 1930} {"train_loss": -23.594186782836914, "global_step": 160248, "epoch": 1930} {"train_loss": -23.71083641052246, "global_step": 160249, "epoch": 1930} {"train_loss": -23.661361694335938, "global_step": 160250, "epoch": 1930} {"train_loss": -23.48293113708496, "global_step": 160251, "epoch": 1930} {"train_loss": -23.531112670898438, "global_step": 160252, "epoch": 1930} {"train_loss": -23.591081619262695, "global_step": 160253, "epoch": 1930} {"train_loss": -23.41303825378418, "global_step": 160254, "epoch": 1930} {"train_loss": -23.59169578552246, "global_step": 160255, "epoch": 1930} {"train_loss": -23.530847549438477, "global_step": 160256, "epoch": 1930} {"train_loss": -23.534818649291992, "global_step": 160257, "epoch": 1930} {"train_loss": -23.55231285095215, "global_step": 160258, "epoch": 1930} {"train_loss": -23.51622200012207, "global_step": 160259, "epoch": 1930} {"train_loss": -23.444608688354492, "global_step": 160260, "epoch": 1930} {"train_loss": -23.14728355407715, "global_step": 160261, "epoch": 1930} {"train_loss": -23.43485450744629, "global_step": 160262, "epoch": 1930} {"train_loss": -23.287883758544922, "global_step": 160263, "epoch": 1930} {"train_loss": -23.618635177612305, "global_step": 160264, "epoch": 1930} {"train_loss": -23.43145179748535, "global_step": 160265, "epoch": 1930} {"train_loss": -23.436166763305664, "global_step": 160266, "epoch": 1930} {"train_loss": -23.470596313476562, "global_step": 160267, "epoch": 1930} {"train_loss": -23.554889678955078, "global_step": 160268, "epoch": 1930} {"train_loss": -23.422666549682617, "global_step": 160269, "epoch": 1930} {"train_loss": -23.499570846557617, "global_step": 160270, "epoch": 1930} {"train_loss": -23.6174259185791, "global_step": 160271, "epoch": 1930} {"train_loss": -23.38590387551181, "global_step": 160272, "epoch": 1930, "val_loss": 6383975.0} {"train_loss": -23.28577423095703, "global_step": 160273, "epoch": 1931} {"train_loss": -23.039743423461914, "global_step": 160274, "epoch": 1931} {"train_loss": -23.200376510620117, "global_step": 160275, "epoch": 1931} {"train_loss": -23.03139305114746, "global_step": 160276, "epoch": 1931} {"train_loss": -23.106054306030273, "global_step": 160277, "epoch": 1931} {"train_loss": -23.400447845458984, "global_step": 160278, "epoch": 1931} {"train_loss": -23.124582290649414, "global_step": 160279, "epoch": 1931} {"train_loss": -23.391494750976562, "global_step": 160280, "epoch": 1931} {"train_loss": -23.224462509155273, "global_step": 160281, "epoch": 1931} {"train_loss": -23.356231689453125, "global_step": 160282, "epoch": 1931} {"train_loss": -23.33605194091797, "global_step": 160283, "epoch": 1931} {"train_loss": -23.406469345092773, "global_step": 160284, "epoch": 1931} {"train_loss": -23.478071212768555, "global_step": 160285, "epoch": 1931} {"train_loss": -23.726911544799805, "global_step": 160286, "epoch": 1931} {"train_loss": -23.426191329956055, "global_step": 160287, "epoch": 1931} {"train_loss": -23.720596313476562, "global_step": 160288, "epoch": 1931} {"train_loss": -23.30245018005371, "global_step": 160289, "epoch": 1931} {"train_loss": -23.591840744018555, "global_step": 160290, "epoch": 1931} {"train_loss": -23.386327743530273, "global_step": 160291, "epoch": 1931} {"train_loss": -23.774017333984375, "global_step": 160292, "epoch": 1931} {"train_loss": -23.259288787841797, "global_step": 160293, "epoch": 1931} {"train_loss": -23.521940231323242, "global_step": 160294, "epoch": 1931} {"train_loss": -23.55544090270996, "global_step": 160295, "epoch": 1931} {"train_loss": -23.577857971191406, "global_step": 160296, "epoch": 1931} {"train_loss": -23.490652084350586, "global_step": 160297, "epoch": 1931} {"train_loss": -23.272127151489258, "global_step": 160298, "epoch": 1931} {"train_loss": -23.500316619873047, "global_step": 160299, "epoch": 1931} {"train_loss": -23.493412017822266, "global_step": 160300, "epoch": 1931} {"train_loss": -23.317129135131836, "global_step": 160301, "epoch": 1931} {"train_loss": -23.60145378112793, "global_step": 160302, "epoch": 1931} {"train_loss": -23.24139976501465, "global_step": 160303, "epoch": 1931} {"train_loss": -23.763446807861328, "global_step": 160304, "epoch": 1931} {"train_loss": -23.767011642456055, "global_step": 160305, "epoch": 1931} {"train_loss": -23.22173500061035, "global_step": 160306, "epoch": 1931} {"train_loss": -23.45071792602539, "global_step": 160307, "epoch": 1931} {"train_loss": -23.617717742919922, "global_step": 160308, "epoch": 1931} {"train_loss": -23.804285049438477, "global_step": 160309, "epoch": 1931} {"train_loss": -23.71700096130371, "global_step": 160310, "epoch": 1931} {"train_loss": -23.42307472229004, "global_step": 160311, "epoch": 1931} {"train_loss": -23.61616325378418, "global_step": 160312, "epoch": 1931} {"train_loss": -23.974271774291992, "global_step": 160313, "epoch": 1931} {"train_loss": -23.65846061706543, "global_step": 160314, "epoch": 1931} {"train_loss": -23.38182830810547, "global_step": 160315, "epoch": 1931} {"train_loss": -23.409189224243164, "global_step": 160316, "epoch": 1931} {"train_loss": -23.227750778198242, "global_step": 160317, "epoch": 1931} {"train_loss": -23.305850982666016, "global_step": 160318, "epoch": 1931} {"train_loss": -23.373003005981445, "global_step": 160319, "epoch": 1931} {"train_loss": -23.50482749938965, "global_step": 160320, "epoch": 1931} {"train_loss": -23.51896095275879, "global_step": 160321, "epoch": 1931} {"train_loss": -23.807443618774414, "global_step": 160322, "epoch": 1931} {"train_loss": -23.546772003173828, "global_step": 160323, "epoch": 1931} {"train_loss": -23.48909568786621, "global_step": 160324, "epoch": 1931} {"train_loss": -23.034683227539062, "global_step": 160325, "epoch": 1931} {"train_loss": -23.52155876159668, "global_step": 160326, "epoch": 1931} {"train_loss": -23.550832748413086, "global_step": 160327, "epoch": 1931} {"train_loss": -23.228904724121094, "global_step": 160328, "epoch": 1931} {"train_loss": -23.48045539855957, "global_step": 160329, "epoch": 1931} {"train_loss": -23.255599975585938, "global_step": 160330, "epoch": 1931} {"train_loss": -23.278099060058594, "global_step": 160331, "epoch": 1931} {"train_loss": -23.2901554107666, "global_step": 160332, "epoch": 1931} {"train_loss": -23.0595703125, "global_step": 160333, "epoch": 1931} {"train_loss": -23.34950065612793, "global_step": 160334, "epoch": 1931} {"train_loss": -23.280107498168945, "global_step": 160335, "epoch": 1931} {"train_loss": -23.925527572631836, "global_step": 160336, "epoch": 1931} {"train_loss": -23.24317741394043, "global_step": 160337, "epoch": 1931} {"train_loss": -23.43623161315918, "global_step": 160338, "epoch": 1931} {"train_loss": -23.213315963745117, "global_step": 160339, "epoch": 1931} {"train_loss": -23.35439682006836, "global_step": 160340, "epoch": 1931} {"train_loss": -23.54778480529785, "global_step": 160341, "epoch": 1931} {"train_loss": -23.43243980407715, "global_step": 160342, "epoch": 1931} {"train_loss": -23.36648941040039, "global_step": 160343, "epoch": 1931} {"train_loss": -23.384336471557617, "global_step": 160344, "epoch": 1931} {"train_loss": -23.78705596923828, "global_step": 160345, "epoch": 1931} {"train_loss": -23.43861198425293, "global_step": 160346, "epoch": 1931} {"train_loss": -23.692983627319336, "global_step": 160347, "epoch": 1931} {"train_loss": -23.844694137573242, "global_step": 160348, "epoch": 1931} {"train_loss": -23.40287971496582, "global_step": 160349, "epoch": 1931} {"train_loss": -23.329435348510742, "global_step": 160350, "epoch": 1931} {"train_loss": -23.5441951751709, "global_step": 160351, "epoch": 1931} {"train_loss": -23.182703018188477, "global_step": 160352, "epoch": 1931} {"train_loss": -23.593992233276367, "global_step": 160353, "epoch": 1931} {"train_loss": -23.707550048828125, "global_step": 160354, "epoch": 1931} {"train_loss": -23.437752827104315, "global_step": 160355, "epoch": 1931, "val_loss": 6226429.0} {"train_loss": -23.258346557617188, "global_step": 160356, "epoch": 1932} {"train_loss": -23.19742774963379, "global_step": 160357, "epoch": 1932} {"train_loss": -23.0092830657959, "global_step": 160358, "epoch": 1932} {"train_loss": -23.09071159362793, "global_step": 160359, "epoch": 1932} {"train_loss": -22.952051162719727, "global_step": 160360, "epoch": 1932} {"train_loss": -22.939767837524414, "global_step": 160361, "epoch": 1932} {"train_loss": -23.276151657104492, "global_step": 160362, "epoch": 1932} {"train_loss": -23.186582565307617, "global_step": 160363, "epoch": 1932} {"train_loss": -23.465490341186523, "global_step": 160364, "epoch": 1932} {"train_loss": -23.061330795288086, "global_step": 160365, "epoch": 1932} {"train_loss": -22.665298461914062, "global_step": 160366, "epoch": 1932} {"train_loss": -23.32651138305664, "global_step": 160367, "epoch": 1932} {"train_loss": -23.2807674407959, "global_step": 160368, "epoch": 1932} {"train_loss": -23.120779037475586, "global_step": 160369, "epoch": 1932} {"train_loss": -23.460886001586914, "global_step": 160370, "epoch": 1932} {"train_loss": -23.472869873046875, "global_step": 160371, "epoch": 1932} {"train_loss": -23.228273391723633, "global_step": 160372, "epoch": 1932} {"train_loss": -23.205217361450195, "global_step": 160373, "epoch": 1932} {"train_loss": -22.94553565979004, "global_step": 160374, "epoch": 1932} {"train_loss": -23.355613708496094, "global_step": 160375, "epoch": 1932} {"train_loss": -23.140018463134766, "global_step": 160376, "epoch": 1932} {"train_loss": -23.59333610534668, "global_step": 160377, "epoch": 1932} {"train_loss": -23.364959716796875, "global_step": 160378, "epoch": 1932} {"train_loss": -23.501619338989258, "global_step": 160379, "epoch": 1932} {"train_loss": -23.450307846069336, "global_step": 160380, "epoch": 1932} {"train_loss": -23.753019332885742, "global_step": 160381, "epoch": 1932} {"train_loss": -23.323352813720703, "global_step": 160382, "epoch": 1932} {"train_loss": -23.6058292388916, "global_step": 160383, "epoch": 1932} {"train_loss": -23.5235538482666, "global_step": 160384, "epoch": 1932} {"train_loss": -23.236770629882812, "global_step": 160385, "epoch": 1932} {"train_loss": -23.62571144104004, "global_step": 160386, "epoch": 1932} {"train_loss": -22.99910545349121, "global_step": 160387, "epoch": 1932} {"train_loss": -23.720340728759766, "global_step": 160388, "epoch": 1932} {"train_loss": -23.265522003173828, "global_step": 160389, "epoch": 1932} {"train_loss": -23.3136043548584, "global_step": 160390, "epoch": 1932} {"train_loss": -22.994564056396484, "global_step": 160391, "epoch": 1932} {"train_loss": -23.410491943359375, "global_step": 160392, "epoch": 1932} {"train_loss": -23.369165420532227, "global_step": 160393, "epoch": 1932} {"train_loss": -23.37628746032715, "global_step": 160394, "epoch": 1932} {"train_loss": -23.269298553466797, "global_step": 160395, "epoch": 1932} {"train_loss": -23.79473114013672, "global_step": 160396, "epoch": 1932} {"train_loss": -23.624509811401367, "global_step": 160397, "epoch": 1932} {"train_loss": -23.61848258972168, "global_step": 160398, "epoch": 1932} {"train_loss": -23.972562789916992, "global_step": 160399, "epoch": 1932} {"train_loss": -23.496952056884766, "global_step": 160400, "epoch": 1932} {"train_loss": -23.27202796936035, "global_step": 160401, "epoch": 1932} {"train_loss": -23.85129737854004, "global_step": 160402, "epoch": 1932} {"train_loss": -23.286794662475586, "global_step": 160403, "epoch": 1932} {"train_loss": -23.5200138092041, "global_step": 160404, "epoch": 1932} {"train_loss": -23.067493438720703, "global_step": 160405, "epoch": 1932} {"train_loss": -23.023813247680664, "global_step": 160406, "epoch": 1932} {"train_loss": -22.718093872070312, "global_step": 160407, "epoch": 1932} {"train_loss": -23.604339599609375, "global_step": 160408, "epoch": 1932} {"train_loss": -22.884458541870117, "global_step": 160409, "epoch": 1932} {"train_loss": -22.747732162475586, "global_step": 160410, "epoch": 1932} {"train_loss": -23.351898193359375, "global_step": 160411, "epoch": 1932} {"train_loss": -23.444557189941406, "global_step": 160412, "epoch": 1932} {"train_loss": -23.647977828979492, "global_step": 160413, "epoch": 1932} {"train_loss": -23.10089683532715, "global_step": 160414, "epoch": 1932} {"train_loss": -23.553457260131836, "global_step": 160415, "epoch": 1932} {"train_loss": -23.558454513549805, "global_step": 160416, "epoch": 1932} {"train_loss": -23.36440086364746, "global_step": 160417, "epoch": 1932} {"train_loss": -23.930377960205078, "global_step": 160418, "epoch": 1932} {"train_loss": -23.2914981842041, "global_step": 160419, "epoch": 1932} {"train_loss": -23.44257164001465, "global_step": 160420, "epoch": 1932} {"train_loss": -23.43372344970703, "global_step": 160421, "epoch": 1932} {"train_loss": -23.171010971069336, "global_step": 160422, "epoch": 1932} {"train_loss": -23.4725399017334, "global_step": 160423, "epoch": 1932} {"train_loss": -23.338956832885742, "global_step": 160424, "epoch": 1932} {"train_loss": -23.418354034423828, "global_step": 160425, "epoch": 1932} {"train_loss": -23.181419372558594, "global_step": 160426, "epoch": 1932} {"train_loss": -23.962072372436523, "global_step": 160427, "epoch": 1932} {"train_loss": -23.08904457092285, "global_step": 160428, "epoch": 1932} {"train_loss": -23.669984817504883, "global_step": 160429, "epoch": 1932} {"train_loss": -23.59915542602539, "global_step": 160430, "epoch": 1932} {"train_loss": -23.68735694885254, "global_step": 160431, "epoch": 1932} {"train_loss": -23.751995086669922, "global_step": 160432, "epoch": 1932} {"train_loss": -23.574020385742188, "global_step": 160433, "epoch": 1932} {"train_loss": -23.269887924194336, "global_step": 160434, "epoch": 1932} {"train_loss": -23.69589614868164, "global_step": 160435, "epoch": 1932} {"train_loss": -23.307241439819336, "global_step": 160436, "epoch": 1932} {"train_loss": -23.651865005493164, "global_step": 160437, "epoch": 1932} {"train_loss": -23.37266542825354, "global_step": 160438, "epoch": 1932, "val_loss": 6392859.0} {"train_loss": -23.377763748168945, "global_step": 160439, "epoch": 1933} {"train_loss": -22.666183471679688, "global_step": 160440, "epoch": 1933} {"train_loss": -22.612730026245117, "global_step": 160441, "epoch": 1933} {"train_loss": -23.04833221435547, "global_step": 160442, "epoch": 1933} {"train_loss": -23.062353134155273, "global_step": 160443, "epoch": 1933} {"train_loss": -23.193477630615234, "global_step": 160444, "epoch": 1933} {"train_loss": -23.276193618774414, "global_step": 160445, "epoch": 1933} {"train_loss": -23.47759437561035, "global_step": 160446, "epoch": 1933} {"train_loss": -23.386627197265625, "global_step": 160447, "epoch": 1933} {"train_loss": -23.0184326171875, "global_step": 160448, "epoch": 1933} {"train_loss": -23.292787551879883, "global_step": 160449, "epoch": 1933} {"train_loss": -23.1927490234375, "global_step": 160450, "epoch": 1933} {"train_loss": -23.179061889648438, "global_step": 160451, "epoch": 1933} {"train_loss": -22.975732803344727, "global_step": 160452, "epoch": 1933} {"train_loss": -23.147308349609375, "global_step": 160453, "epoch": 1933} {"train_loss": -23.47193717956543, "global_step": 160454, "epoch": 1933} {"train_loss": -23.405385971069336, "global_step": 160455, "epoch": 1933} {"train_loss": -23.493539810180664, "global_step": 160456, "epoch": 1933} {"train_loss": -23.55055809020996, "global_step": 160457, "epoch": 1933} {"train_loss": -23.78273582458496, "global_step": 160458, "epoch": 1933} {"train_loss": -23.22547149658203, "global_step": 160459, "epoch": 1933} {"train_loss": -23.487966537475586, "global_step": 160460, "epoch": 1933} {"train_loss": -23.336034774780273, "global_step": 160461, "epoch": 1933} {"train_loss": -23.559085845947266, "global_step": 160462, "epoch": 1933} {"train_loss": -23.383588790893555, "global_step": 160463, "epoch": 1933} {"train_loss": -23.432762145996094, "global_step": 160464, "epoch": 1933} {"train_loss": -23.66164207458496, "global_step": 160465, "epoch": 1933} {"train_loss": -23.48649024963379, "global_step": 160466, "epoch": 1933} {"train_loss": -23.607404708862305, "global_step": 160467, "epoch": 1933} {"train_loss": -23.487417221069336, "global_step": 160468, "epoch": 1933} {"train_loss": -23.396968841552734, "global_step": 160469, "epoch": 1933} {"train_loss": -23.884729385375977, "global_step": 160470, "epoch": 1933} {"train_loss": -23.592288970947266, "global_step": 160471, "epoch": 1933} {"train_loss": -23.48892593383789, "global_step": 160472, "epoch": 1933} {"train_loss": -23.26020622253418, "global_step": 160473, "epoch": 1933} {"train_loss": -23.369352340698242, "global_step": 160474, "epoch": 1933} {"train_loss": -23.095693588256836, "global_step": 160475, "epoch": 1933} {"train_loss": -23.170547485351562, "global_step": 160476, "epoch": 1933} {"train_loss": -23.44525718688965, "global_step": 160477, "epoch": 1933} {"train_loss": -23.81409454345703, "global_step": 160478, "epoch": 1933} {"train_loss": -22.956151962280273, "global_step": 160479, "epoch": 1933} {"train_loss": -23.187828063964844, "global_step": 160480, "epoch": 1933} {"train_loss": -24.033044815063477, "global_step": 160481, "epoch": 1933} {"train_loss": -23.463607788085938, "global_step": 160482, "epoch": 1933} {"train_loss": -23.237443923950195, "global_step": 160483, "epoch": 1933} {"train_loss": -23.89459991455078, "global_step": 160484, "epoch": 1933} {"train_loss": -23.572437286376953, "global_step": 160485, "epoch": 1933} {"train_loss": -23.351226806640625, "global_step": 160486, "epoch": 1933} {"train_loss": -23.22165298461914, "global_step": 160487, "epoch": 1933} {"train_loss": -23.73092269897461, "global_step": 160488, "epoch": 1933} {"train_loss": -23.51762580871582, "global_step": 160489, "epoch": 1933} {"train_loss": -23.25618553161621, "global_step": 160490, "epoch": 1933} {"train_loss": -23.771678924560547, "global_step": 160491, "epoch": 1933} {"train_loss": -23.27559471130371, "global_step": 160492, "epoch": 1933} {"train_loss": -23.184003829956055, "global_step": 160493, "epoch": 1933} {"train_loss": -23.327787399291992, "global_step": 160494, "epoch": 1933} {"train_loss": -23.775829315185547, "global_step": 160495, "epoch": 1933} {"train_loss": -23.496898651123047, "global_step": 160496, "epoch": 1933} {"train_loss": -23.279338836669922, "global_step": 160497, "epoch": 1933} {"train_loss": -23.57859992980957, "global_step": 160498, "epoch": 1933} {"train_loss": -23.34037208557129, "global_step": 160499, "epoch": 1933} {"train_loss": -23.578140258789062, "global_step": 160500, "epoch": 1933} {"train_loss": -23.48459243774414, "global_step": 160501, "epoch": 1933} {"train_loss": -23.820693969726562, "global_step": 160502, "epoch": 1933} {"train_loss": -23.655542373657227, "global_step": 160503, "epoch": 1933} {"train_loss": -23.60759925842285, "global_step": 160504, "epoch": 1933} {"train_loss": -23.582876205444336, "global_step": 160505, "epoch": 1933} {"train_loss": -23.420856475830078, "global_step": 160506, "epoch": 1933} {"train_loss": -23.878494262695312, "global_step": 160507, "epoch": 1933} {"train_loss": -23.441869735717773, "global_step": 160508, "epoch": 1933} {"train_loss": -23.46235466003418, "global_step": 160509, "epoch": 1933} {"train_loss": -23.56174087524414, "global_step": 160510, "epoch": 1933} {"train_loss": -23.588232040405273, "global_step": 160511, "epoch": 1933} {"train_loss": -23.123586654663086, "global_step": 160512, "epoch": 1933} {"train_loss": -23.766326904296875, "global_step": 160513, "epoch": 1933} {"train_loss": -23.51531982421875, "global_step": 160514, "epoch": 1933} {"train_loss": -23.347360610961914, "global_step": 160515, "epoch": 1933} {"train_loss": -23.394460678100586, "global_step": 160516, "epoch": 1933} {"train_loss": -23.458072662353516, "global_step": 160517, "epoch": 1933} {"train_loss": -23.285741806030273, "global_step": 160518, "epoch": 1933} {"train_loss": -23.49654197692871, "global_step": 160519, "epoch": 1933} {"train_loss": -23.834064483642578, "global_step": 160520, "epoch": 1933} {"train_loss": -23.42926604489246, "global_step": 160521, "epoch": 1933, "val_loss": 6379583.0} {"train_loss": -23.336942672729492, "global_step": 160522, "epoch": 1934} {"train_loss": -23.20680809020996, "global_step": 160523, "epoch": 1934} {"train_loss": -23.179441452026367, "global_step": 160524, "epoch": 1934} {"train_loss": -23.08827781677246, "global_step": 160525, "epoch": 1934} {"train_loss": -23.28412437438965, "global_step": 160526, "epoch": 1934} {"train_loss": -23.586864471435547, "global_step": 160527, "epoch": 1934} {"train_loss": -23.367361068725586, "global_step": 160528, "epoch": 1934} {"train_loss": -23.437057495117188, "global_step": 160529, "epoch": 1934} {"train_loss": -23.36589813232422, "global_step": 160530, "epoch": 1934} {"train_loss": -23.912384033203125, "global_step": 160531, "epoch": 1934} {"train_loss": -23.3167724609375, "global_step": 160532, "epoch": 1934} {"train_loss": -23.190893173217773, "global_step": 160533, "epoch": 1934} {"train_loss": -23.51564598083496, "global_step": 160534, "epoch": 1934} {"train_loss": -23.613454818725586, "global_step": 160535, "epoch": 1934} {"train_loss": -23.112092971801758, "global_step": 160536, "epoch": 1934} {"train_loss": -23.408571243286133, "global_step": 160537, "epoch": 1934} {"train_loss": -23.65150260925293, "global_step": 160538, "epoch": 1934} {"train_loss": -23.60564613342285, "global_step": 160539, "epoch": 1934} {"train_loss": -23.186798095703125, "global_step": 160540, "epoch": 1934} {"train_loss": -23.81551170349121, "global_step": 160541, "epoch": 1934} {"train_loss": -23.60065460205078, "global_step": 160542, "epoch": 1934} {"train_loss": -23.68128776550293, "global_step": 160543, "epoch": 1934} {"train_loss": -23.70033836364746, "global_step": 160544, "epoch": 1934} {"train_loss": -23.228200912475586, "global_step": 160545, "epoch": 1934} {"train_loss": -23.796897888183594, "global_step": 160546, "epoch": 1934} {"train_loss": -23.83796501159668, "global_step": 160547, "epoch": 1934} {"train_loss": -23.986286163330078, "global_step": 160548, "epoch": 1934} {"train_loss": -23.5853328704834, "global_step": 160549, "epoch": 1934} {"train_loss": -23.55836296081543, "global_step": 160550, "epoch": 1934} {"train_loss": -23.76041603088379, "global_step": 160551, "epoch": 1934} {"train_loss": -23.447265625, "global_step": 160552, "epoch": 1934} {"train_loss": -23.2862548828125, "global_step": 160553, "epoch": 1934} {"train_loss": -23.584962844848633, "global_step": 160554, "epoch": 1934} {"train_loss": -23.442066192626953, "global_step": 160555, "epoch": 1934} {"train_loss": -23.990074157714844, "global_step": 160556, "epoch": 1934} {"train_loss": -23.75843048095703, "global_step": 160557, "epoch": 1934} {"train_loss": -23.605573654174805, "global_step": 160558, "epoch": 1934} {"train_loss": -23.47071647644043, "global_step": 160559, "epoch": 1934} {"train_loss": -24.115835189819336, "global_step": 160560, "epoch": 1934} {"train_loss": -23.933734893798828, "global_step": 160561, "epoch": 1934} {"train_loss": -23.7460994720459, "global_step": 160562, "epoch": 1934} {"train_loss": -23.650449752807617, "global_step": 160563, "epoch": 1934} {"train_loss": -22.716894149780273, "global_step": 160564, "epoch": 1934} {"train_loss": -22.60855484008789, "global_step": 160565, "epoch": 1934} {"train_loss": -22.519269943237305, "global_step": 160566, "epoch": 1934} {"train_loss": -23.178218841552734, "global_step": 160567, "epoch": 1934} {"train_loss": -23.376691818237305, "global_step": 160568, "epoch": 1934} {"train_loss": -23.194374084472656, "global_step": 160569, "epoch": 1934} {"train_loss": -23.10880470275879, "global_step": 160570, "epoch": 1934} {"train_loss": -23.299335479736328, "global_step": 160571, "epoch": 1934} {"train_loss": -23.610260009765625, "global_step": 160572, "epoch": 1934} {"train_loss": -23.25847625732422, "global_step": 160573, "epoch": 1934} {"train_loss": -23.207347869873047, "global_step": 160574, "epoch": 1934} {"train_loss": -23.479440689086914, "global_step": 160575, "epoch": 1934} {"train_loss": -23.231185913085938, "global_step": 160576, "epoch": 1934} {"train_loss": -23.670270919799805, "global_step": 160577, "epoch": 1934} {"train_loss": -23.521318435668945, "global_step": 160578, "epoch": 1934} {"train_loss": -23.665206909179688, "global_step": 160579, "epoch": 1934} {"train_loss": -23.206832885742188, "global_step": 160580, "epoch": 1934} {"train_loss": -23.620813369750977, "global_step": 160581, "epoch": 1934} {"train_loss": -23.645233154296875, "global_step": 160582, "epoch": 1934} {"train_loss": -23.613988876342773, "global_step": 160583, "epoch": 1934} {"train_loss": -23.261404037475586, "global_step": 160584, "epoch": 1934} {"train_loss": -23.3934326171875, "global_step": 160585, "epoch": 1934} {"train_loss": -23.13088035583496, "global_step": 160586, "epoch": 1934} {"train_loss": -23.452133178710938, "global_step": 160587, "epoch": 1934} {"train_loss": -23.212739944458008, "global_step": 160588, "epoch": 1934} {"train_loss": -23.37129783630371, "global_step": 160589, "epoch": 1934} {"train_loss": -23.550405502319336, "global_step": 160590, "epoch": 1934} {"train_loss": -24.06736183166504, "global_step": 160591, "epoch": 1934} {"train_loss": -22.936538696289062, "global_step": 160592, "epoch": 1934} {"train_loss": -23.295473098754883, "global_step": 160593, "epoch": 1934} {"train_loss": -23.77619743347168, "global_step": 160594, "epoch": 1934} {"train_loss": -23.042016983032227, "global_step": 160595, "epoch": 1934} {"train_loss": -23.286174774169922, "global_step": 160596, "epoch": 1934} {"train_loss": -23.59014320373535, "global_step": 160597, "epoch": 1934} {"train_loss": -23.166032791137695, "global_step": 160598, "epoch": 1934} {"train_loss": -23.979570388793945, "global_step": 160599, "epoch": 1934} {"train_loss": -23.34231948852539, "global_step": 160600, "epoch": 1934} {"train_loss": -23.630035400390625, "global_step": 160601, "epoch": 1934} {"train_loss": -23.160367965698242, "global_step": 160602, "epoch": 1934} {"train_loss": -23.608200073242188, "global_step": 160603, "epoch": 1934} {"train_loss": -23.449450642229564, "global_step": 160604, "epoch": 1934, "val_loss": 6419723.0} {"train_loss": -22.768085479736328, "global_step": 160605, "epoch": 1935} {"train_loss": -22.34383201599121, "global_step": 160606, "epoch": 1935} {"train_loss": -23.094684600830078, "global_step": 160607, "epoch": 1935} {"train_loss": -22.496793746948242, "global_step": 160608, "epoch": 1935} {"train_loss": -22.721324920654297, "global_step": 160609, "epoch": 1935} {"train_loss": -23.237890243530273, "global_step": 160610, "epoch": 1935} {"train_loss": -23.217329025268555, "global_step": 160611, "epoch": 1935} {"train_loss": -23.170108795166016, "global_step": 160612, "epoch": 1935} {"train_loss": -22.911380767822266, "global_step": 160613, "epoch": 1935} {"train_loss": -23.448902130126953, "global_step": 160614, "epoch": 1935} {"train_loss": -23.041391372680664, "global_step": 160615, "epoch": 1935} {"train_loss": -23.033926010131836, "global_step": 160616, "epoch": 1935} {"train_loss": -23.1595458984375, "global_step": 160617, "epoch": 1935} {"train_loss": -22.987329483032227, "global_step": 160618, "epoch": 1935} {"train_loss": -23.41675567626953, "global_step": 160619, "epoch": 1935} {"train_loss": -23.0831241607666, "global_step": 160620, "epoch": 1935} {"train_loss": -23.547239303588867, "global_step": 160621, "epoch": 1935} {"train_loss": -23.159719467163086, "global_step": 160622, "epoch": 1935} {"train_loss": -23.20200538635254, "global_step": 160623, "epoch": 1935} {"train_loss": -22.995344161987305, "global_step": 160624, "epoch": 1935} {"train_loss": -23.007905960083008, "global_step": 160625, "epoch": 1935} {"train_loss": -23.133094787597656, "global_step": 160626, "epoch": 1935} {"train_loss": -23.12187957763672, "global_step": 160627, "epoch": 1935} {"train_loss": -23.664411544799805, "global_step": 160628, "epoch": 1935} {"train_loss": -23.230148315429688, "global_step": 160629, "epoch": 1935} {"train_loss": -23.404611587524414, "global_step": 160630, "epoch": 1935} {"train_loss": -23.741666793823242, "global_step": 160631, "epoch": 1935} {"train_loss": -23.366735458374023, "global_step": 160632, "epoch": 1935} {"train_loss": -23.6450138092041, "global_step": 160633, "epoch": 1935} {"train_loss": -23.795684814453125, "global_step": 160634, "epoch": 1935} {"train_loss": -23.671422958374023, "global_step": 160635, "epoch": 1935} {"train_loss": -23.681882858276367, "global_step": 160636, "epoch": 1935} {"train_loss": -23.521244049072266, "global_step": 160637, "epoch": 1935} {"train_loss": -23.585556030273438, "global_step": 160638, "epoch": 1935} {"train_loss": -23.91921043395996, "global_step": 160639, "epoch": 1935} {"train_loss": -23.43146324157715, "global_step": 160640, "epoch": 1935} {"train_loss": -23.681747436523438, "global_step": 160641, "epoch": 1935} {"train_loss": -23.651288986206055, "global_step": 160642, "epoch": 1935} {"train_loss": -23.44752311706543, "global_step": 160643, "epoch": 1935} {"train_loss": -23.47125244140625, "global_step": 160644, "epoch": 1935} {"train_loss": -23.44515037536621, "global_step": 160645, "epoch": 1935} {"train_loss": -23.29147720336914, "global_step": 160646, "epoch": 1935} {"train_loss": -23.700942993164062, "global_step": 160647, "epoch": 1935} {"train_loss": -22.999210357666016, "global_step": 160648, "epoch": 1935} {"train_loss": -23.672744750976562, "global_step": 160649, "epoch": 1935} {"train_loss": -23.433765411376953, "global_step": 160650, "epoch": 1935} {"train_loss": -23.64585304260254, "global_step": 160651, "epoch": 1935} {"train_loss": -23.784833908081055, "global_step": 160652, "epoch": 1935} {"train_loss": -23.5230770111084, "global_step": 160653, "epoch": 1935} {"train_loss": -23.49367332458496, "global_step": 160654, "epoch": 1935} {"train_loss": -23.658599853515625, "global_step": 160655, "epoch": 1935} {"train_loss": -23.453935623168945, "global_step": 160656, "epoch": 1935} {"train_loss": -23.527196884155273, "global_step": 160657, "epoch": 1935} {"train_loss": -23.619443893432617, "global_step": 160658, "epoch": 1935} {"train_loss": -23.09714126586914, "global_step": 160659, "epoch": 1935} {"train_loss": -23.38467788696289, "global_step": 160660, "epoch": 1935} {"train_loss": -23.076154708862305, "global_step": 160661, "epoch": 1935} {"train_loss": -23.169048309326172, "global_step": 160662, "epoch": 1935} {"train_loss": -23.112926483154297, "global_step": 160663, "epoch": 1935} {"train_loss": -23.821691513061523, "global_step": 160664, "epoch": 1935} {"train_loss": -23.241159439086914, "global_step": 160665, "epoch": 1935} {"train_loss": -23.7031307220459, "global_step": 160666, "epoch": 1935} {"train_loss": -23.121959686279297, "global_step": 160667, "epoch": 1935} {"train_loss": -23.312597274780273, "global_step": 160668, "epoch": 1935} {"train_loss": -23.87578773498535, "global_step": 160669, "epoch": 1935} {"train_loss": -23.255308151245117, "global_step": 160670, "epoch": 1935} {"train_loss": -23.24546241760254, "global_step": 160671, "epoch": 1935} {"train_loss": -23.552902221679688, "global_step": 160672, "epoch": 1935} {"train_loss": -23.340356826782227, "global_step": 160673, "epoch": 1935} {"train_loss": -23.639368057250977, "global_step": 160674, "epoch": 1935} {"train_loss": -23.55902862548828, "global_step": 160675, "epoch": 1935} {"train_loss": -23.58611488342285, "global_step": 160676, "epoch": 1935} {"train_loss": -23.687686920166016, "global_step": 160677, "epoch": 1935} {"train_loss": -23.414735794067383, "global_step": 160678, "epoch": 1935} {"train_loss": -23.266586303710938, "global_step": 160679, "epoch": 1935} {"train_loss": -24.082828521728516, "global_step": 160680, "epoch": 1935} {"train_loss": -23.579504013061523, "global_step": 160681, "epoch": 1935} {"train_loss": -23.508085250854492, "global_step": 160682, "epoch": 1935} {"train_loss": -23.48511505126953, "global_step": 160683, "epoch": 1935} {"train_loss": -23.893693923950195, "global_step": 160684, "epoch": 1935} {"train_loss": -23.581811904907227, "global_step": 160685, "epoch": 1935} {"train_loss": -23.61970329284668, "global_step": 160686, "epoch": 1935} {"train_loss": -23.382695967892566, "global_step": 160687, "epoch": 1935, "val_loss": 6466125.0} {"train_loss": -23.214008331298828, "global_step": 160688, "epoch": 1936} {"train_loss": -23.20173454284668, "global_step": 160689, "epoch": 1936} {"train_loss": -23.578956604003906, "global_step": 160690, "epoch": 1936} {"train_loss": -22.840425491333008, "global_step": 160691, "epoch": 1936} {"train_loss": -23.336450576782227, "global_step": 160692, "epoch": 1936} {"train_loss": -23.30314064025879, "global_step": 160693, "epoch": 1936} {"train_loss": -23.508283615112305, "global_step": 160694, "epoch": 1936} {"train_loss": -23.55400276184082, "global_step": 160695, "epoch": 1936} {"train_loss": -23.52428436279297, "global_step": 160696, "epoch": 1936} {"train_loss": -23.297754287719727, "global_step": 160697, "epoch": 1936} {"train_loss": -23.555028915405273, "global_step": 160698, "epoch": 1936} {"train_loss": -23.45440673828125, "global_step": 160699, "epoch": 1936} {"train_loss": -23.51905632019043, "global_step": 160700, "epoch": 1936} {"train_loss": -23.55522346496582, "global_step": 160701, "epoch": 1936} {"train_loss": -23.344749450683594, "global_step": 160702, "epoch": 1936} {"train_loss": -23.943571090698242, "global_step": 160703, "epoch": 1936} {"train_loss": -23.586332321166992, "global_step": 160704, "epoch": 1936} {"train_loss": -23.55377769470215, "global_step": 160705, "epoch": 1936} {"train_loss": -23.667444229125977, "global_step": 160706, "epoch": 1936} {"train_loss": -23.384763717651367, "global_step": 160707, "epoch": 1936} {"train_loss": -23.55080223083496, "global_step": 160708, "epoch": 1936} {"train_loss": -23.52659034729004, "global_step": 160709, "epoch": 1936} {"train_loss": -23.457754135131836, "global_step": 160710, "epoch": 1936} {"train_loss": -23.41937255859375, "global_step": 160711, "epoch": 1936} {"train_loss": -23.36495590209961, "global_step": 160712, "epoch": 1936} {"train_loss": -23.354015350341797, "global_step": 160713, "epoch": 1936} {"train_loss": -23.276159286499023, "global_step": 160714, "epoch": 1936} {"train_loss": -23.699918746948242, "global_step": 160715, "epoch": 1936} {"train_loss": -23.332935333251953, "global_step": 160716, "epoch": 1936} {"train_loss": -23.538480758666992, "global_step": 160717, "epoch": 1936} {"train_loss": -23.649444580078125, "global_step": 160718, "epoch": 1936} {"train_loss": -23.714557647705078, "global_step": 160719, "epoch": 1936} {"train_loss": -23.832382202148438, "global_step": 160720, "epoch": 1936} {"train_loss": -23.659727096557617, "global_step": 160721, "epoch": 1936} {"train_loss": -23.253223419189453, "global_step": 160722, "epoch": 1936} {"train_loss": -23.678173065185547, "global_step": 160723, "epoch": 1936} {"train_loss": -23.16901969909668, "global_step": 160724, "epoch": 1936} {"train_loss": -23.400970458984375, "global_step": 160725, "epoch": 1936} {"train_loss": -23.323034286499023, "global_step": 160726, "epoch": 1936} {"train_loss": -23.78120231628418, "global_step": 160727, "epoch": 1936} {"train_loss": -23.652772903442383, "global_step": 160728, "epoch": 1936} {"train_loss": -23.71319580078125, "global_step": 160729, "epoch": 1936} {"train_loss": -23.56087303161621, "global_step": 160730, "epoch": 1936} {"train_loss": -23.548616409301758, "global_step": 160731, "epoch": 1936} {"train_loss": -23.807912826538086, "global_step": 160732, "epoch": 1936} {"train_loss": -23.71942138671875, "global_step": 160733, "epoch": 1936} {"train_loss": -23.086074829101562, "global_step": 160734, "epoch": 1936} {"train_loss": -23.54009437561035, "global_step": 160735, "epoch": 1936} {"train_loss": -23.556320190429688, "global_step": 160736, "epoch": 1936} {"train_loss": -23.798288345336914, "global_step": 160737, "epoch": 1936} {"train_loss": -23.514867782592773, "global_step": 160738, "epoch": 1936} {"train_loss": -23.763492584228516, "global_step": 160739, "epoch": 1936} {"train_loss": -23.89887046813965, "global_step": 160740, "epoch": 1936} {"train_loss": -23.530527114868164, "global_step": 160741, "epoch": 1936} {"train_loss": -23.683795928955078, "global_step": 160742, "epoch": 1936} {"train_loss": -23.435415267944336, "global_step": 160743, "epoch": 1936} {"train_loss": -23.34657096862793, "global_step": 160744, "epoch": 1936} {"train_loss": -23.44964027404785, "global_step": 160745, "epoch": 1936} {"train_loss": -23.049808502197266, "global_step": 160746, "epoch": 1936} {"train_loss": -23.72040367126465, "global_step": 160747, "epoch": 1936} {"train_loss": -23.637126922607422, "global_step": 160748, "epoch": 1936} {"train_loss": -23.57168960571289, "global_step": 160749, "epoch": 1936} {"train_loss": -23.513214111328125, "global_step": 160750, "epoch": 1936} {"train_loss": -23.584917068481445, "global_step": 160751, "epoch": 1936} {"train_loss": -23.112211227416992, "global_step": 160752, "epoch": 1936} {"train_loss": -23.516754150390625, "global_step": 160753, "epoch": 1936} {"train_loss": -23.469684600830078, "global_step": 160754, "epoch": 1936} {"train_loss": -23.771228790283203, "global_step": 160755, "epoch": 1936} {"train_loss": -23.723180770874023, "global_step": 160756, "epoch": 1936} {"train_loss": -23.311080932617188, "global_step": 160757, "epoch": 1936} {"train_loss": -23.603336334228516, "global_step": 160758, "epoch": 1936} {"train_loss": -23.536386489868164, "global_step": 160759, "epoch": 1936} {"train_loss": -23.407442092895508, "global_step": 160760, "epoch": 1936} {"train_loss": -23.142379760742188, "global_step": 160761, "epoch": 1936} {"train_loss": -23.314634323120117, "global_step": 160762, "epoch": 1936} {"train_loss": -23.488859176635742, "global_step": 160763, "epoch": 1936} {"train_loss": -23.105411529541016, "global_step": 160764, "epoch": 1936} {"train_loss": -23.571929931640625, "global_step": 160765, "epoch": 1936} {"train_loss": -23.625835418701172, "global_step": 160766, "epoch": 1936} {"train_loss": -23.45564079284668, "global_step": 160767, "epoch": 1936} {"train_loss": -23.405981063842773, "global_step": 160768, "epoch": 1936} {"train_loss": -23.431407928466797, "global_step": 160769, "epoch": 1936} {"train_loss": -23.490280725869788, "global_step": 160770, "epoch": 1936, "val_loss": 6352447.0} {"train_loss": -23.109760284423828, "global_step": 160771, "epoch": 1937} {"train_loss": -22.781553268432617, "global_step": 160772, "epoch": 1937} {"train_loss": -22.872766494750977, "global_step": 160773, "epoch": 1937} {"train_loss": -23.19980239868164, "global_step": 160774, "epoch": 1937} {"train_loss": -22.699493408203125, "global_step": 160775, "epoch": 1937} {"train_loss": -23.14319610595703, "global_step": 160776, "epoch": 1937} {"train_loss": -22.83931541442871, "global_step": 160777, "epoch": 1937} {"train_loss": -23.09329605102539, "global_step": 160778, "epoch": 1937} {"train_loss": -23.171945571899414, "global_step": 160779, "epoch": 1937} {"train_loss": -23.269580841064453, "global_step": 160780, "epoch": 1937} {"train_loss": -22.94570541381836, "global_step": 160781, "epoch": 1937} {"train_loss": -23.56757354736328, "global_step": 160782, "epoch": 1937} {"train_loss": -23.321598052978516, "global_step": 160783, "epoch": 1937} {"train_loss": -23.322052001953125, "global_step": 160784, "epoch": 1937} {"train_loss": -23.276138305664062, "global_step": 160785, "epoch": 1937} {"train_loss": -22.826642990112305, "global_step": 160786, "epoch": 1937} {"train_loss": -23.28046417236328, "global_step": 160787, "epoch": 1937} {"train_loss": -23.43182373046875, "global_step": 160788, "epoch": 1937} {"train_loss": -23.322919845581055, "global_step": 160789, "epoch": 1937} {"train_loss": -23.399585723876953, "global_step": 160790, "epoch": 1937} {"train_loss": -23.415103912353516, "global_step": 160791, "epoch": 1937} {"train_loss": -23.529916763305664, "global_step": 160792, "epoch": 1937} {"train_loss": -23.086095809936523, "global_step": 160793, "epoch": 1937} {"train_loss": -23.557214736938477, "global_step": 160794, "epoch": 1937} {"train_loss": -23.162540435791016, "global_step": 160795, "epoch": 1937} {"train_loss": -23.34133529663086, "global_step": 160796, "epoch": 1937} {"train_loss": -23.33024024963379, "global_step": 160797, "epoch": 1937} {"train_loss": -23.496259689331055, "global_step": 160798, "epoch": 1937} {"train_loss": -22.99616050720215, "global_step": 160799, "epoch": 1937} {"train_loss": -23.47783851623535, "global_step": 160800, "epoch": 1937} {"train_loss": -23.74494743347168, "global_step": 160801, "epoch": 1937} {"train_loss": -23.21327018737793, "global_step": 160802, "epoch": 1937} {"train_loss": -22.953908920288086, "global_step": 160803, "epoch": 1937} {"train_loss": -23.807416915893555, "global_step": 160804, "epoch": 1937} {"train_loss": -23.613086700439453, "global_step": 160805, "epoch": 1937} {"train_loss": -23.5328311920166, "global_step": 160806, "epoch": 1937} {"train_loss": -23.889827728271484, "global_step": 160807, "epoch": 1937} {"train_loss": -23.91126823425293, "global_step": 160808, "epoch": 1937} {"train_loss": -23.25412368774414, "global_step": 160809, "epoch": 1937} {"train_loss": -23.638107299804688, "global_step": 160810, "epoch": 1937} {"train_loss": -23.718780517578125, "global_step": 160811, "epoch": 1937} {"train_loss": -23.718719482421875, "global_step": 160812, "epoch": 1937} {"train_loss": -23.431982040405273, "global_step": 160813, "epoch": 1937} {"train_loss": -22.9896297454834, "global_step": 160814, "epoch": 1937} {"train_loss": -23.533126831054688, "global_step": 160815, "epoch": 1937} {"train_loss": -23.571256637573242, "global_step": 160816, "epoch": 1937} {"train_loss": -23.65591049194336, "global_step": 160817, "epoch": 1937} {"train_loss": -23.33429527282715, "global_step": 160818, "epoch": 1937} {"train_loss": -23.70879554748535, "global_step": 160819, "epoch": 1937} {"train_loss": -23.18332290649414, "global_step": 160820, "epoch": 1937} {"train_loss": -23.182035446166992, "global_step": 160821, "epoch": 1937} {"train_loss": -23.855941772460938, "global_step": 160822, "epoch": 1937} {"train_loss": -23.324081420898438, "global_step": 160823, "epoch": 1937} {"train_loss": -23.408803939819336, "global_step": 160824, "epoch": 1937} {"train_loss": -23.3254451751709, "global_step": 160825, "epoch": 1937} {"train_loss": -23.797407150268555, "global_step": 160826, "epoch": 1937} {"train_loss": -23.519062042236328, "global_step": 160827, "epoch": 1937} {"train_loss": -23.372304916381836, "global_step": 160828, "epoch": 1937} {"train_loss": -23.39324951171875, "global_step": 160829, "epoch": 1937} {"train_loss": -23.887859344482422, "global_step": 160830, "epoch": 1937} {"train_loss": -24.00008201599121, "global_step": 160831, "epoch": 1937} {"train_loss": -23.42286491394043, "global_step": 160832, "epoch": 1937} {"train_loss": -23.5228271484375, "global_step": 160833, "epoch": 1937} {"train_loss": -23.70195960998535, "global_step": 160834, "epoch": 1937} {"train_loss": -23.74397087097168, "global_step": 160835, "epoch": 1937} {"train_loss": -23.37885856628418, "global_step": 160836, "epoch": 1937} {"train_loss": -23.633684158325195, "global_step": 160837, "epoch": 1937} {"train_loss": -23.690927505493164, "global_step": 160838, "epoch": 1937} {"train_loss": -23.2925968170166, "global_step": 160839, "epoch": 1937} {"train_loss": -23.489734649658203, "global_step": 160840, "epoch": 1937} {"train_loss": -23.58502769470215, "global_step": 160841, "epoch": 1937} {"train_loss": -23.7847900390625, "global_step": 160842, "epoch": 1937} {"train_loss": -23.70778465270996, "global_step": 160843, "epoch": 1937} {"train_loss": -23.4571590423584, "global_step": 160844, "epoch": 1937} {"train_loss": -23.649194717407227, "global_step": 160845, "epoch": 1937} {"train_loss": -23.23601722717285, "global_step": 160846, "epoch": 1937} {"train_loss": -23.712188720703125, "global_step": 160847, "epoch": 1937} {"train_loss": -23.667997360229492, "global_step": 160848, "epoch": 1937} {"train_loss": -23.665590286254883, "global_step": 160849, "epoch": 1937} {"train_loss": -23.579336166381836, "global_step": 160850, "epoch": 1937} {"train_loss": -23.8321533203125, "global_step": 160851, "epoch": 1937} {"train_loss": -23.73402976989746, "global_step": 160852, "epoch": 1937} {"train_loss": -23.438737869262695, "global_step": 160853, "epoch": 1937, "val_loss": 6380383.0} {"train_loss": -22.670495986938477, "global_step": 160854, "epoch": 1938} {"train_loss": -22.580949783325195, "global_step": 160855, "epoch": 1938} {"train_loss": -22.854827880859375, "global_step": 160856, "epoch": 1938} {"train_loss": -23.033096313476562, "global_step": 160857, "epoch": 1938} {"train_loss": -22.983238220214844, "global_step": 160858, "epoch": 1938} {"train_loss": -22.545589447021484, "global_step": 160859, "epoch": 1938} {"train_loss": -22.992279052734375, "global_step": 160860, "epoch": 1938} {"train_loss": -22.902576446533203, "global_step": 160861, "epoch": 1938} {"train_loss": -23.134756088256836, "global_step": 160862, "epoch": 1938} {"train_loss": -23.048667907714844, "global_step": 160863, "epoch": 1938} {"train_loss": -22.90053367614746, "global_step": 160864, "epoch": 1938} {"train_loss": -23.21858024597168, "global_step": 160865, "epoch": 1938} {"train_loss": -22.947677612304688, "global_step": 160866, "epoch": 1938} {"train_loss": -22.72830581665039, "global_step": 160867, "epoch": 1938} {"train_loss": -22.973669052124023, "global_step": 160868, "epoch": 1938} {"train_loss": -23.356760025024414, "global_step": 160869, "epoch": 1938} {"train_loss": -23.078256607055664, "global_step": 160870, "epoch": 1938} {"train_loss": -23.22818374633789, "global_step": 160871, "epoch": 1938} {"train_loss": -23.376028060913086, "global_step": 160872, "epoch": 1938} {"train_loss": -23.702238082885742, "global_step": 160873, "epoch": 1938} {"train_loss": -23.4085636138916, "global_step": 160874, "epoch": 1938} {"train_loss": -23.480323791503906, "global_step": 160875, "epoch": 1938} {"train_loss": -23.104555130004883, "global_step": 160876, "epoch": 1938} {"train_loss": -23.33576011657715, "global_step": 160877, "epoch": 1938} {"train_loss": -23.24627113342285, "global_step": 160878, "epoch": 1938} {"train_loss": -23.47256851196289, "global_step": 160879, "epoch": 1938} {"train_loss": -23.175186157226562, "global_step": 160880, "epoch": 1938} {"train_loss": -23.281423568725586, "global_step": 160881, "epoch": 1938} {"train_loss": -23.659692764282227, "global_step": 160882, "epoch": 1938} {"train_loss": -23.0384578704834, "global_step": 160883, "epoch": 1938} {"train_loss": -23.299697875976562, "global_step": 160884, "epoch": 1938} {"train_loss": -23.765424728393555, "global_step": 160885, "epoch": 1938} {"train_loss": -23.432559967041016, "global_step": 160886, "epoch": 1938} {"train_loss": -23.506994247436523, "global_step": 160887, "epoch": 1938} {"train_loss": -23.580341339111328, "global_step": 160888, "epoch": 1938} {"train_loss": -23.531200408935547, "global_step": 160889, "epoch": 1938} {"train_loss": -23.38779067993164, "global_step": 160890, "epoch": 1938} {"train_loss": -23.925222396850586, "global_step": 160891, "epoch": 1938} {"train_loss": -23.413114547729492, "global_step": 160892, "epoch": 1938} {"train_loss": -23.172992706298828, "global_step": 160893, "epoch": 1938} {"train_loss": -23.562089920043945, "global_step": 160894, "epoch": 1938} {"train_loss": -23.49346923828125, "global_step": 160895, "epoch": 1938} {"train_loss": -23.211780548095703, "global_step": 160896, "epoch": 1938} {"train_loss": -23.622739791870117, "global_step": 160897, "epoch": 1938} {"train_loss": -23.69044303894043, "global_step": 160898, "epoch": 1938} {"train_loss": -23.112640380859375, "global_step": 160899, "epoch": 1938} {"train_loss": -23.58165740966797, "global_step": 160900, "epoch": 1938} {"train_loss": -23.381805419921875, "global_step": 160901, "epoch": 1938} {"train_loss": -23.56367301940918, "global_step": 160902, "epoch": 1938} {"train_loss": -23.471824645996094, "global_step": 160903, "epoch": 1938} {"train_loss": -23.356168746948242, "global_step": 160904, "epoch": 1938} {"train_loss": -23.261667251586914, "global_step": 160905, "epoch": 1938} {"train_loss": -23.631101608276367, "global_step": 160906, "epoch": 1938} {"train_loss": -23.131786346435547, "global_step": 160907, "epoch": 1938} {"train_loss": -23.65424156188965, "global_step": 160908, "epoch": 1938} {"train_loss": -23.425935745239258, "global_step": 160909, "epoch": 1938} {"train_loss": -24.07997703552246, "global_step": 160910, "epoch": 1938} {"train_loss": -23.718616485595703, "global_step": 160911, "epoch": 1938} {"train_loss": -23.50370216369629, "global_step": 160912, "epoch": 1938} {"train_loss": -23.51985740661621, "global_step": 160913, "epoch": 1938} {"train_loss": -23.532255172729492, "global_step": 160914, "epoch": 1938} {"train_loss": -23.589603424072266, "global_step": 160915, "epoch": 1938} {"train_loss": -23.987668991088867, "global_step": 160916, "epoch": 1938} {"train_loss": -23.70423698425293, "global_step": 160917, "epoch": 1938} {"train_loss": -23.717178344726562, "global_step": 160918, "epoch": 1938} {"train_loss": -23.765995025634766, "global_step": 160919, "epoch": 1938} {"train_loss": -23.431396484375, "global_step": 160920, "epoch": 1938} {"train_loss": -23.27198028564453, "global_step": 160921, "epoch": 1938} {"train_loss": -23.74416732788086, "global_step": 160922, "epoch": 1938} {"train_loss": -23.403104782104492, "global_step": 160923, "epoch": 1938} {"train_loss": -23.268192291259766, "global_step": 160924, "epoch": 1938} {"train_loss": -23.46903419494629, "global_step": 160925, "epoch": 1938} {"train_loss": -23.38848876953125, "global_step": 160926, "epoch": 1938} {"train_loss": -24.028121948242188, "global_step": 160927, "epoch": 1938} {"train_loss": -23.384763717651367, "global_step": 160928, "epoch": 1938} {"train_loss": -23.694875717163086, "global_step": 160929, "epoch": 1938} {"train_loss": -23.708059310913086, "global_step": 160930, "epoch": 1938} {"train_loss": -23.3459529876709, "global_step": 160931, "epoch": 1938} {"train_loss": -23.577625274658203, "global_step": 160932, "epoch": 1938} {"train_loss": -23.45775604248047, "global_step": 160933, "epoch": 1938} {"train_loss": -23.765914916992188, "global_step": 160934, "epoch": 1938} {"train_loss": -23.55191993713379, "global_step": 160935, "epoch": 1938} {"train_loss": -23.370228135442158, "global_step": 160936, "epoch": 1938, "val_loss": 6328626.0} {"train_loss": -23.392587661743164, "global_step": 160937, "epoch": 1939} {"train_loss": -23.303442001342773, "global_step": 160938, "epoch": 1939} {"train_loss": -23.20790672302246, "global_step": 160939, "epoch": 1939} {"train_loss": -23.11347007751465, "global_step": 160940, "epoch": 1939} {"train_loss": -23.24497413635254, "global_step": 160941, "epoch": 1939} {"train_loss": -23.262889862060547, "global_step": 160942, "epoch": 1939} {"train_loss": -23.271203994750977, "global_step": 160943, "epoch": 1939} {"train_loss": -23.06285858154297, "global_step": 160944, "epoch": 1939} {"train_loss": -23.0681209564209, "global_step": 160945, "epoch": 1939} {"train_loss": -23.243942260742188, "global_step": 160946, "epoch": 1939} {"train_loss": -23.040510177612305, "global_step": 160947, "epoch": 1939} {"train_loss": -23.194726943969727, "global_step": 160948, "epoch": 1939} {"train_loss": -23.153593063354492, "global_step": 160949, "epoch": 1939} {"train_loss": -23.297622680664062, "global_step": 160950, "epoch": 1939} {"train_loss": -22.925642013549805, "global_step": 160951, "epoch": 1939} {"train_loss": -23.317039489746094, "global_step": 160952, "epoch": 1939} {"train_loss": -23.068283081054688, "global_step": 160953, "epoch": 1939} {"train_loss": -23.148366928100586, "global_step": 160954, "epoch": 1939} {"train_loss": -23.263826370239258, "global_step": 160955, "epoch": 1939} {"train_loss": -23.5352725982666, "global_step": 160956, "epoch": 1939} {"train_loss": -23.000829696655273, "global_step": 160957, "epoch": 1939} {"train_loss": -23.277938842773438, "global_step": 160958, "epoch": 1939} {"train_loss": -23.342151641845703, "global_step": 160959, "epoch": 1939} {"train_loss": -23.085737228393555, "global_step": 160960, "epoch": 1939} {"train_loss": -23.366893768310547, "global_step": 160961, "epoch": 1939} {"train_loss": -23.386259078979492, "global_step": 160962, "epoch": 1939} {"train_loss": -23.347089767456055, "global_step": 160963, "epoch": 1939} {"train_loss": -23.543426513671875, "global_step": 160964, "epoch": 1939} {"train_loss": -23.297882080078125, "global_step": 160965, "epoch": 1939} {"train_loss": -23.581457138061523, "global_step": 160966, "epoch": 1939} {"train_loss": -23.361242294311523, "global_step": 160967, "epoch": 1939} {"train_loss": -23.156457901000977, "global_step": 160968, "epoch": 1939} {"train_loss": -23.278722763061523, "global_step": 160969, "epoch": 1939} {"train_loss": -23.48272705078125, "global_step": 160970, "epoch": 1939} {"train_loss": -23.332700729370117, "global_step": 160971, "epoch": 1939} {"train_loss": -23.36117172241211, "global_step": 160972, "epoch": 1939} {"train_loss": -23.818836212158203, "global_step": 160973, "epoch": 1939} {"train_loss": -23.44287872314453, "global_step": 160974, "epoch": 1939} {"train_loss": -23.73575210571289, "global_step": 160975, "epoch": 1939} {"train_loss": -23.344512939453125, "global_step": 160976, "epoch": 1939} {"train_loss": -23.67868423461914, "global_step": 160977, "epoch": 1939} {"train_loss": -23.701980590820312, "global_step": 160978, "epoch": 1939} {"train_loss": -23.6721248626709, "global_step": 160979, "epoch": 1939} {"train_loss": -23.5997257232666, "global_step": 160980, "epoch": 1939} {"train_loss": -23.663911819458008, "global_step": 160981, "epoch": 1939} {"train_loss": -23.59833335876465, "global_step": 160982, "epoch": 1939} {"train_loss": -23.845474243164062, "global_step": 160983, "epoch": 1939} {"train_loss": -24.03669548034668, "global_step": 160984, "epoch": 1939} {"train_loss": -23.64988136291504, "global_step": 160985, "epoch": 1939} {"train_loss": -23.14640235900879, "global_step": 160986, "epoch": 1939} {"train_loss": -24.202795028686523, "global_step": 160987, "epoch": 1939} {"train_loss": -23.655624389648438, "global_step": 160988, "epoch": 1939} {"train_loss": -23.651416778564453, "global_step": 160989, "epoch": 1939} {"train_loss": -23.577598571777344, "global_step": 160990, "epoch": 1939} {"train_loss": -23.336002349853516, "global_step": 160991, "epoch": 1939} {"train_loss": -23.526586532592773, "global_step": 160992, "epoch": 1939} {"train_loss": -23.7145938873291, "global_step": 160993, "epoch": 1939} {"train_loss": -23.726837158203125, "global_step": 160994, "epoch": 1939} {"train_loss": -23.350727081298828, "global_step": 160995, "epoch": 1939} {"train_loss": -23.677885055541992, "global_step": 160996, "epoch": 1939} {"train_loss": -23.208045959472656, "global_step": 160997, "epoch": 1939} {"train_loss": -23.592010498046875, "global_step": 160998, "epoch": 1939} {"train_loss": -23.163818359375, "global_step": 160999, "epoch": 1939} {"train_loss": -23.752954483032227, "global_step": 161000, "epoch": 1939} {"train_loss": -23.345117568969727, "global_step": 161001, "epoch": 1939} {"train_loss": -23.640539169311523, "global_step": 161002, "epoch": 1939} {"train_loss": -23.60426139831543, "global_step": 161003, "epoch": 1939} {"train_loss": -23.6478328704834, "global_step": 161004, "epoch": 1939} {"train_loss": -23.6916561126709, "global_step": 161005, "epoch": 1939} {"train_loss": -23.49134635925293, "global_step": 161006, "epoch": 1939} {"train_loss": -23.478452682495117, "global_step": 161007, "epoch": 1939} {"train_loss": -23.103897094726562, "global_step": 161008, "epoch": 1939} {"train_loss": -23.28831672668457, "global_step": 161009, "epoch": 1939} {"train_loss": -23.671499252319336, "global_step": 161010, "epoch": 1939} {"train_loss": -23.66707420349121, "global_step": 161011, "epoch": 1939} {"train_loss": -23.48198890686035, "global_step": 161012, "epoch": 1939} {"train_loss": -23.478504180908203, "global_step": 161013, "epoch": 1939} {"train_loss": -23.11622428894043, "global_step": 161014, "epoch": 1939} {"train_loss": -23.84042739868164, "global_step": 161015, "epoch": 1939} {"train_loss": -23.330902099609375, "global_step": 161016, "epoch": 1939} {"train_loss": -23.458166122436523, "global_step": 161017, "epoch": 1939} {"train_loss": -23.832538604736328, "global_step": 161018, "epoch": 1939} {"train_loss": -23.437541846769403, "global_step": 161019, "epoch": 1939, "val_loss": 6366747.0} {"train_loss": -23.438156127929688, "global_step": 161020, "epoch": 1940} {"train_loss": -23.3308162689209, "global_step": 161021, "epoch": 1940} {"train_loss": -23.529993057250977, "global_step": 161022, "epoch": 1940} {"train_loss": -23.311840057373047, "global_step": 161023, "epoch": 1940} {"train_loss": -23.716140747070312, "global_step": 161024, "epoch": 1940} {"train_loss": -23.54530906677246, "global_step": 161025, "epoch": 1940} {"train_loss": -23.39301109313965, "global_step": 161026, "epoch": 1940} {"train_loss": -23.47647476196289, "global_step": 161027, "epoch": 1940} {"train_loss": -23.101167678833008, "global_step": 161028, "epoch": 1940} {"train_loss": -23.400434494018555, "global_step": 161029, "epoch": 1940} {"train_loss": -23.12471580505371, "global_step": 161030, "epoch": 1940} {"train_loss": -23.194944381713867, "global_step": 161031, "epoch": 1940} {"train_loss": -23.43377685546875, "global_step": 161032, "epoch": 1940} {"train_loss": -23.928089141845703, "global_step": 161033, "epoch": 1940} {"train_loss": -23.31711196899414, "global_step": 161034, "epoch": 1940} {"train_loss": -23.371952056884766, "global_step": 161035, "epoch": 1940} {"train_loss": -23.427854537963867, "global_step": 161036, "epoch": 1940} {"train_loss": -23.493480682373047, "global_step": 161037, "epoch": 1940} {"train_loss": -23.809003829956055, "global_step": 161038, "epoch": 1940} {"train_loss": -23.469594955444336, "global_step": 161039, "epoch": 1940} {"train_loss": -23.629497528076172, "global_step": 161040, "epoch": 1940} {"train_loss": -23.291828155517578, "global_step": 161041, "epoch": 1940} {"train_loss": -23.17012596130371, "global_step": 161042, "epoch": 1940} {"train_loss": -23.420225143432617, "global_step": 161043, "epoch": 1940} {"train_loss": -23.37496566772461, "global_step": 161044, "epoch": 1940} {"train_loss": -23.71950340270996, "global_step": 161045, "epoch": 1940} {"train_loss": -23.415311813354492, "global_step": 161046, "epoch": 1940} {"train_loss": -23.347583770751953, "global_step": 161047, "epoch": 1940} {"train_loss": -23.759063720703125, "global_step": 161048, "epoch": 1940} {"train_loss": -23.701770782470703, "global_step": 161049, "epoch": 1940} {"train_loss": -23.951284408569336, "global_step": 161050, "epoch": 1940} {"train_loss": -23.535139083862305, "global_step": 161051, "epoch": 1940} {"train_loss": -23.326271057128906, "global_step": 161052, "epoch": 1940} {"train_loss": -23.341886520385742, "global_step": 161053, "epoch": 1940} {"train_loss": -23.95949363708496, "global_step": 161054, "epoch": 1940} {"train_loss": -23.739789962768555, "global_step": 161055, "epoch": 1940} {"train_loss": -23.64299201965332, "global_step": 161056, "epoch": 1940} {"train_loss": -23.92227554321289, "global_step": 161057, "epoch": 1940} {"train_loss": -23.571165084838867, "global_step": 161058, "epoch": 1940} {"train_loss": -23.968517303466797, "global_step": 161059, "epoch": 1940} {"train_loss": -23.49128532409668, "global_step": 161060, "epoch": 1940} {"train_loss": -23.644201278686523, "global_step": 161061, "epoch": 1940} {"train_loss": -23.805471420288086, "global_step": 161062, "epoch": 1940} {"train_loss": -23.923538208007812, "global_step": 161063, "epoch": 1940} {"train_loss": -23.511363983154297, "global_step": 161064, "epoch": 1940} {"train_loss": -23.780200958251953, "global_step": 161065, "epoch": 1940} {"train_loss": -23.89630126953125, "global_step": 161066, "epoch": 1940} {"train_loss": -23.758644104003906, "global_step": 161067, "epoch": 1940} {"train_loss": -23.716293334960938, "global_step": 161068, "epoch": 1940} {"train_loss": -23.436199188232422, "global_step": 161069, "epoch": 1940} {"train_loss": -22.9835205078125, "global_step": 161070, "epoch": 1940} {"train_loss": -22.495019912719727, "global_step": 161071, "epoch": 1940} {"train_loss": -21.727941513061523, "global_step": 161072, "epoch": 1940} {"train_loss": -22.507545471191406, "global_step": 161073, "epoch": 1940} {"train_loss": -23.174793243408203, "global_step": 161074, "epoch": 1940} {"train_loss": -22.666397094726562, "global_step": 161075, "epoch": 1940} {"train_loss": -22.785110473632812, "global_step": 161076, "epoch": 1940} {"train_loss": -23.014541625976562, "global_step": 161077, "epoch": 1940} {"train_loss": -22.97600746154785, "global_step": 161078, "epoch": 1940} {"train_loss": -23.054100036621094, "global_step": 161079, "epoch": 1940} {"train_loss": -23.003427505493164, "global_step": 161080, "epoch": 1940} {"train_loss": -22.95889663696289, "global_step": 161081, "epoch": 1940} {"train_loss": -23.02600860595703, "global_step": 161082, "epoch": 1940} {"train_loss": -23.159250259399414, "global_step": 161083, "epoch": 1940} {"train_loss": -23.020893096923828, "global_step": 161084, "epoch": 1940} {"train_loss": -22.888513565063477, "global_step": 161085, "epoch": 1940} {"train_loss": -23.325119018554688, "global_step": 161086, "epoch": 1940} {"train_loss": -23.398130416870117, "global_step": 161087, "epoch": 1940} {"train_loss": -22.865238189697266, "global_step": 161088, "epoch": 1940} {"train_loss": -23.213293075561523, "global_step": 161089, "epoch": 1940} {"train_loss": -23.029476165771484, "global_step": 161090, "epoch": 1940} {"train_loss": -23.335172653198242, "global_step": 161091, "epoch": 1940} {"train_loss": -23.43407440185547, "global_step": 161092, "epoch": 1940} {"train_loss": -23.12591552734375, "global_step": 161093, "epoch": 1940} {"train_loss": -23.68093490600586, "global_step": 161094, "epoch": 1940} {"train_loss": -23.38630485534668, "global_step": 161095, "epoch": 1940} {"train_loss": -23.34929847717285, "global_step": 161096, "epoch": 1940} {"train_loss": -23.59901237487793, "global_step": 161097, "epoch": 1940} {"train_loss": -23.406494140625, "global_step": 161098, "epoch": 1940} {"train_loss": -23.40729331970215, "global_step": 161099, "epoch": 1940} {"train_loss": -23.545894622802734, "global_step": 161100, "epoch": 1940} {"train_loss": -23.457603454589844, "global_step": 161101, "epoch": 1940} {"train_loss": -23.37007338742176, "global_step": 161102, "epoch": 1940, "val_loss": 6362663.5} {"train_loss": -23.30666160583496, "global_step": 161103, "epoch": 1941} {"train_loss": -23.33038330078125, "global_step": 161104, "epoch": 1941} {"train_loss": -23.283756256103516, "global_step": 161105, "epoch": 1941} {"train_loss": -23.102890014648438, "global_step": 161106, "epoch": 1941} {"train_loss": -23.767383575439453, "global_step": 161107, "epoch": 1941} {"train_loss": -23.30954933166504, "global_step": 161108, "epoch": 1941} {"train_loss": -23.52492332458496, "global_step": 161109, "epoch": 1941} {"train_loss": -23.461271286010742, "global_step": 161110, "epoch": 1941} {"train_loss": -23.42951774597168, "global_step": 161111, "epoch": 1941} {"train_loss": -23.25861167907715, "global_step": 161112, "epoch": 1941} {"train_loss": -23.32154655456543, "global_step": 161113, "epoch": 1941} {"train_loss": -23.419353485107422, "global_step": 161114, "epoch": 1941} {"train_loss": -23.369369506835938, "global_step": 161115, "epoch": 1941} {"train_loss": -23.922754287719727, "global_step": 161116, "epoch": 1941} {"train_loss": -23.233396530151367, "global_step": 161117, "epoch": 1941} {"train_loss": -23.333749771118164, "global_step": 161118, "epoch": 1941} {"train_loss": -23.35362434387207, "global_step": 161119, "epoch": 1941} {"train_loss": -23.64223861694336, "global_step": 161120, "epoch": 1941} {"train_loss": -23.311214447021484, "global_step": 161121, "epoch": 1941} {"train_loss": -23.303632736206055, "global_step": 161122, "epoch": 1941} {"train_loss": -23.589305877685547, "global_step": 161123, "epoch": 1941} {"train_loss": -23.355436325073242, "global_step": 161124, "epoch": 1941} {"train_loss": -23.717985153198242, "global_step": 161125, "epoch": 1941} {"train_loss": -23.502552032470703, "global_step": 161126, "epoch": 1941} {"train_loss": -23.305465698242188, "global_step": 161127, "epoch": 1941} {"train_loss": -23.142133712768555, "global_step": 161128, "epoch": 1941} {"train_loss": -23.465864181518555, "global_step": 161129, "epoch": 1941} {"train_loss": -23.506515502929688, "global_step": 161130, "epoch": 1941} {"train_loss": -23.620473861694336, "global_step": 161131, "epoch": 1941} {"train_loss": -23.57199478149414, "global_step": 161132, "epoch": 1941} {"train_loss": -23.877145767211914, "global_step": 161133, "epoch": 1941} {"train_loss": -23.26439666748047, "global_step": 161134, "epoch": 1941} {"train_loss": -23.43268394470215, "global_step": 161135, "epoch": 1941} {"train_loss": -23.87726402282715, "global_step": 161136, "epoch": 1941} {"train_loss": -23.49312400817871, "global_step": 161137, "epoch": 1941} {"train_loss": -23.66316032409668, "global_step": 161138, "epoch": 1941} {"train_loss": -23.60268211364746, "global_step": 161139, "epoch": 1941} {"train_loss": -23.61248779296875, "global_step": 161140, "epoch": 1941} {"train_loss": -23.61103057861328, "global_step": 161141, "epoch": 1941} {"train_loss": -23.74106216430664, "global_step": 161142, "epoch": 1941} {"train_loss": -23.866979598999023, "global_step": 161143, "epoch": 1941} {"train_loss": -23.410198211669922, "global_step": 161144, "epoch": 1941} {"train_loss": -23.442951202392578, "global_step": 161145, "epoch": 1941} {"train_loss": -23.366073608398438, "global_step": 161146, "epoch": 1941} {"train_loss": -24.118671417236328, "global_step": 161147, "epoch": 1941} {"train_loss": -23.243534088134766, "global_step": 161148, "epoch": 1941} {"train_loss": -24.009246826171875, "global_step": 161149, "epoch": 1941} {"train_loss": -23.649513244628906, "global_step": 161150, "epoch": 1941} {"train_loss": -23.962268829345703, "global_step": 161151, "epoch": 1941} {"train_loss": -23.82172203063965, "global_step": 161152, "epoch": 1941} {"train_loss": -23.623397827148438, "global_step": 161153, "epoch": 1941} {"train_loss": -23.680831909179688, "global_step": 161154, "epoch": 1941} {"train_loss": -23.544147491455078, "global_step": 161155, "epoch": 1941} {"train_loss": -23.92887306213379, "global_step": 161156, "epoch": 1941} {"train_loss": -23.201732635498047, "global_step": 161157, "epoch": 1941} {"train_loss": -23.418935775756836, "global_step": 161158, "epoch": 1941} {"train_loss": -23.279056549072266, "global_step": 161159, "epoch": 1941} {"train_loss": -23.2487850189209, "global_step": 161160, "epoch": 1941} {"train_loss": -23.293075561523438, "global_step": 161161, "epoch": 1941} {"train_loss": -23.23265838623047, "global_step": 161162, "epoch": 1941} {"train_loss": -23.701173782348633, "global_step": 161163, "epoch": 1941} {"train_loss": -23.65859031677246, "global_step": 161164, "epoch": 1941} {"train_loss": -23.304059982299805, "global_step": 161165, "epoch": 1941} {"train_loss": -23.20001792907715, "global_step": 161166, "epoch": 1941} {"train_loss": -23.413618087768555, "global_step": 161167, "epoch": 1941} {"train_loss": -23.444921493530273, "global_step": 161168, "epoch": 1941} {"train_loss": -23.49565315246582, "global_step": 161169, "epoch": 1941} {"train_loss": -23.274673461914062, "global_step": 161170, "epoch": 1941} {"train_loss": -23.290481567382812, "global_step": 161171, "epoch": 1941} {"train_loss": -22.912630081176758, "global_step": 161172, "epoch": 1941} {"train_loss": -23.557247161865234, "global_step": 161173, "epoch": 1941} {"train_loss": -23.393171310424805, "global_step": 161174, "epoch": 1941} {"train_loss": -23.451908111572266, "global_step": 161175, "epoch": 1941} {"train_loss": -23.425006866455078, "global_step": 161176, "epoch": 1941} {"train_loss": -23.13473892211914, "global_step": 161177, "epoch": 1941} {"train_loss": -23.3336181640625, "global_step": 161178, "epoch": 1941} {"train_loss": -23.290136337280273, "global_step": 161179, "epoch": 1941} {"train_loss": -23.333396911621094, "global_step": 161180, "epoch": 1941} {"train_loss": -23.173181533813477, "global_step": 161181, "epoch": 1941} {"train_loss": -23.61786460876465, "global_step": 161182, "epoch": 1941} {"train_loss": -23.185806274414062, "global_step": 161183, "epoch": 1941} {"train_loss": -23.864805221557617, "global_step": 161184, "epoch": 1941} {"train_loss": -23.472992402961456, "global_step": 161185, "epoch": 1941, "val_loss": 6394038.0} {"train_loss": -23.56849479675293, "global_step": 161186, "epoch": 1942} {"train_loss": -23.295347213745117, "global_step": 161187, "epoch": 1942} {"train_loss": -23.53737449645996, "global_step": 161188, "epoch": 1942} {"train_loss": -23.706920623779297, "global_step": 161189, "epoch": 1942} {"train_loss": -22.8158016204834, "global_step": 161190, "epoch": 1942} {"train_loss": -23.532567977905273, "global_step": 161191, "epoch": 1942} {"train_loss": -23.16509246826172, "global_step": 161192, "epoch": 1942} {"train_loss": -23.41347312927246, "global_step": 161193, "epoch": 1942} {"train_loss": -23.3249568939209, "global_step": 161194, "epoch": 1942} {"train_loss": -23.624929428100586, "global_step": 161195, "epoch": 1942} {"train_loss": -23.36396598815918, "global_step": 161196, "epoch": 1942} {"train_loss": -23.564939498901367, "global_step": 161197, "epoch": 1942} {"train_loss": -23.513078689575195, "global_step": 161198, "epoch": 1942} {"train_loss": -23.585783004760742, "global_step": 161199, "epoch": 1942} {"train_loss": -23.14919090270996, "global_step": 161200, "epoch": 1942} {"train_loss": -23.56143569946289, "global_step": 161201, "epoch": 1942} {"train_loss": -23.34566879272461, "global_step": 161202, "epoch": 1942} {"train_loss": -23.358789443969727, "global_step": 161203, "epoch": 1942} {"train_loss": -23.459211349487305, "global_step": 161204, "epoch": 1942} {"train_loss": -23.102636337280273, "global_step": 161205, "epoch": 1942} {"train_loss": -23.178932189941406, "global_step": 161206, "epoch": 1942} {"train_loss": -23.431739807128906, "global_step": 161207, "epoch": 1942} {"train_loss": -23.314014434814453, "global_step": 161208, "epoch": 1942} {"train_loss": -23.39076805114746, "global_step": 161209, "epoch": 1942} {"train_loss": -23.72870445251465, "global_step": 161210, "epoch": 1942} {"train_loss": -23.45979118347168, "global_step": 161211, "epoch": 1942} {"train_loss": -23.44879722595215, "global_step": 161212, "epoch": 1942} {"train_loss": -23.26199722290039, "global_step": 161213, "epoch": 1942} {"train_loss": -23.41810417175293, "global_step": 161214, "epoch": 1942} {"train_loss": -23.6737117767334, "global_step": 161215, "epoch": 1942} {"train_loss": -23.578901290893555, "global_step": 161216, "epoch": 1942} {"train_loss": -23.37582778930664, "global_step": 161217, "epoch": 1942} {"train_loss": -23.6749324798584, "global_step": 161218, "epoch": 1942} {"train_loss": -23.591249465942383, "global_step": 161219, "epoch": 1942} {"train_loss": -23.362977981567383, "global_step": 161220, "epoch": 1942} {"train_loss": -23.696247100830078, "global_step": 161221, "epoch": 1942} {"train_loss": -23.588632583618164, "global_step": 161222, "epoch": 1942} {"train_loss": -23.603567123413086, "global_step": 161223, "epoch": 1942} {"train_loss": -23.609071731567383, "global_step": 161224, "epoch": 1942} {"train_loss": -23.710012435913086, "global_step": 161225, "epoch": 1942} {"train_loss": -23.788434982299805, "global_step": 161226, "epoch": 1942} {"train_loss": -23.797025680541992, "global_step": 161227, "epoch": 1942} {"train_loss": -23.604589462280273, "global_step": 161228, "epoch": 1942} {"train_loss": -23.695798873901367, "global_step": 161229, "epoch": 1942} {"train_loss": -23.39021873474121, "global_step": 161230, "epoch": 1942} {"train_loss": -23.978017807006836, "global_step": 161231, "epoch": 1942} {"train_loss": -23.698471069335938, "global_step": 161232, "epoch": 1942} {"train_loss": -24.10175132751465, "global_step": 161233, "epoch": 1942} {"train_loss": -23.306257247924805, "global_step": 161234, "epoch": 1942} {"train_loss": -23.282306671142578, "global_step": 161235, "epoch": 1942} {"train_loss": -23.323911666870117, "global_step": 161236, "epoch": 1942} {"train_loss": -23.4898738861084, "global_step": 161237, "epoch": 1942} {"train_loss": -23.615400314331055, "global_step": 161238, "epoch": 1942} {"train_loss": -23.059967041015625, "global_step": 161239, "epoch": 1942} {"train_loss": -23.176925659179688, "global_step": 161240, "epoch": 1942} {"train_loss": -23.80409049987793, "global_step": 161241, "epoch": 1942} {"train_loss": -23.093290328979492, "global_step": 161242, "epoch": 1942} {"train_loss": -23.299915313720703, "global_step": 161243, "epoch": 1942} {"train_loss": -23.431947708129883, "global_step": 161244, "epoch": 1942} {"train_loss": -23.62957763671875, "global_step": 161245, "epoch": 1942} {"train_loss": -23.633615493774414, "global_step": 161246, "epoch": 1942} {"train_loss": -23.682661056518555, "global_step": 161247, "epoch": 1942} {"train_loss": -23.817459106445312, "global_step": 161248, "epoch": 1942} {"train_loss": -23.291513442993164, "global_step": 161249, "epoch": 1942} {"train_loss": -23.37140464782715, "global_step": 161250, "epoch": 1942} {"train_loss": -23.514892578125, "global_step": 161251, "epoch": 1942} {"train_loss": -23.339736938476562, "global_step": 161252, "epoch": 1942} {"train_loss": -23.559736251831055, "global_step": 161253, "epoch": 1942} {"train_loss": -23.513364791870117, "global_step": 161254, "epoch": 1942} {"train_loss": -23.468210220336914, "global_step": 161255, "epoch": 1942} {"train_loss": -23.629806518554688, "global_step": 161256, "epoch": 1942} {"train_loss": -23.845623016357422, "global_step": 161257, "epoch": 1942} {"train_loss": -23.649812698364258, "global_step": 161258, "epoch": 1942} {"train_loss": -23.22989845275879, "global_step": 161259, "epoch": 1942} {"train_loss": -23.156997680664062, "global_step": 161260, "epoch": 1942} {"train_loss": -23.096445083618164, "global_step": 161261, "epoch": 1942} {"train_loss": -23.70323944091797, "global_step": 161262, "epoch": 1942} {"train_loss": -23.991764068603516, "global_step": 161263, "epoch": 1942} {"train_loss": -23.853740692138672, "global_step": 161264, "epoch": 1942} {"train_loss": -24.043750762939453, "global_step": 161265, "epoch": 1942} {"train_loss": -23.740097045898438, "global_step": 161266, "epoch": 1942} {"train_loss": -23.289356231689453, "global_step": 161267, "epoch": 1942} {"train_loss": -23.505721586296357, "global_step": 161268, "epoch": 1942, "val_loss": 6374121.0} {"train_loss": -22.938886642456055, "global_step": 161269, "epoch": 1943} {"train_loss": -23.609159469604492, "global_step": 161270, "epoch": 1943} {"train_loss": -23.131656646728516, "global_step": 161271, "epoch": 1943} {"train_loss": -23.555646896362305, "global_step": 161272, "epoch": 1943} {"train_loss": -23.2636775970459, "global_step": 161273, "epoch": 1943} {"train_loss": -23.49448585510254, "global_step": 161274, "epoch": 1943} {"train_loss": -23.266403198242188, "global_step": 161275, "epoch": 1943} {"train_loss": -23.720685958862305, "global_step": 161276, "epoch": 1943} {"train_loss": -23.35769271850586, "global_step": 161277, "epoch": 1943} {"train_loss": -23.650390625, "global_step": 161278, "epoch": 1943} {"train_loss": -23.46900749206543, "global_step": 161279, "epoch": 1943} {"train_loss": -23.54965591430664, "global_step": 161280, "epoch": 1943} {"train_loss": -23.436798095703125, "global_step": 161281, "epoch": 1943} {"train_loss": -23.401029586791992, "global_step": 161282, "epoch": 1943} {"train_loss": -23.373823165893555, "global_step": 161283, "epoch": 1943} {"train_loss": -23.81917381286621, "global_step": 161284, "epoch": 1943} {"train_loss": -23.47437858581543, "global_step": 161285, "epoch": 1943} {"train_loss": -23.45501708984375, "global_step": 161286, "epoch": 1943} {"train_loss": -23.170568466186523, "global_step": 161287, "epoch": 1943} {"train_loss": -23.181737899780273, "global_step": 161288, "epoch": 1943} {"train_loss": -23.713794708251953, "global_step": 161289, "epoch": 1943} {"train_loss": -23.343982696533203, "global_step": 161290, "epoch": 1943} {"train_loss": -23.17943572998047, "global_step": 161291, "epoch": 1943} {"train_loss": -23.280675888061523, "global_step": 161292, "epoch": 1943} {"train_loss": -23.521177291870117, "global_step": 161293, "epoch": 1943} {"train_loss": -23.550878524780273, "global_step": 161294, "epoch": 1943} {"train_loss": -23.3427791595459, "global_step": 161295, "epoch": 1943} {"train_loss": -23.71900749206543, "global_step": 161296, "epoch": 1943} {"train_loss": -23.67706298828125, "global_step": 161297, "epoch": 1943} {"train_loss": -23.681705474853516, "global_step": 161298, "epoch": 1943} {"train_loss": -23.645309448242188, "global_step": 161299, "epoch": 1943} {"train_loss": -23.428544998168945, "global_step": 161300, "epoch": 1943} {"train_loss": -23.328407287597656, "global_step": 161301, "epoch": 1943} {"train_loss": -23.47406005859375, "global_step": 161302, "epoch": 1943} {"train_loss": -23.483373641967773, "global_step": 161303, "epoch": 1943} {"train_loss": -23.288816452026367, "global_step": 161304, "epoch": 1943} {"train_loss": -23.86378288269043, "global_step": 161305, "epoch": 1943} {"train_loss": -23.2085018157959, "global_step": 161306, "epoch": 1943} {"train_loss": -23.557510375976562, "global_step": 161307, "epoch": 1943} {"train_loss": -23.517492294311523, "global_step": 161308, "epoch": 1943} {"train_loss": -23.505653381347656, "global_step": 161309, "epoch": 1943} {"train_loss": -23.344924926757812, "global_step": 161310, "epoch": 1943} {"train_loss": -23.57176971435547, "global_step": 161311, "epoch": 1943} {"train_loss": -23.546730041503906, "global_step": 161312, "epoch": 1943} {"train_loss": -23.508291244506836, "global_step": 161313, "epoch": 1943} {"train_loss": -23.394062042236328, "global_step": 161314, "epoch": 1943} {"train_loss": -23.240346908569336, "global_step": 161315, "epoch": 1943} {"train_loss": -23.72149658203125, "global_step": 161316, "epoch": 1943} {"train_loss": -23.484155654907227, "global_step": 161317, "epoch": 1943} {"train_loss": -23.33917236328125, "global_step": 161318, "epoch": 1943} {"train_loss": -23.27838134765625, "global_step": 161319, "epoch": 1943} {"train_loss": -23.53803062438965, "global_step": 161320, "epoch": 1943} {"train_loss": -23.115638732910156, "global_step": 161321, "epoch": 1943} {"train_loss": -23.4982967376709, "global_step": 161322, "epoch": 1943} {"train_loss": -23.407991409301758, "global_step": 161323, "epoch": 1943} {"train_loss": -23.740320205688477, "global_step": 161324, "epoch": 1943} {"train_loss": -23.230527877807617, "global_step": 161325, "epoch": 1943} {"train_loss": -23.353923797607422, "global_step": 161326, "epoch": 1943} {"train_loss": -23.343433380126953, "global_step": 161327, "epoch": 1943} {"train_loss": -23.1157169342041, "global_step": 161328, "epoch": 1943} {"train_loss": -23.411657333374023, "global_step": 161329, "epoch": 1943} {"train_loss": -23.376550674438477, "global_step": 161330, "epoch": 1943} {"train_loss": -23.4899959564209, "global_step": 161331, "epoch": 1943} {"train_loss": -23.93596839904785, "global_step": 161332, "epoch": 1943} {"train_loss": -23.734533309936523, "global_step": 161333, "epoch": 1943} {"train_loss": -23.66132164001465, "global_step": 161334, "epoch": 1943} {"train_loss": -23.537372589111328, "global_step": 161335, "epoch": 1943} {"train_loss": -23.54506492614746, "global_step": 161336, "epoch": 1943} {"train_loss": -23.81641960144043, "global_step": 161337, "epoch": 1943} {"train_loss": -23.61671257019043, "global_step": 161338, "epoch": 1943} {"train_loss": -23.582752227783203, "global_step": 161339, "epoch": 1943} {"train_loss": -23.35332679748535, "global_step": 161340, "epoch": 1943} {"train_loss": -23.59164047241211, "global_step": 161341, "epoch": 1943} {"train_loss": -23.52070426940918, "global_step": 161342, "epoch": 1943} {"train_loss": -23.676074981689453, "global_step": 161343, "epoch": 1943} {"train_loss": -23.42267417907715, "global_step": 161344, "epoch": 1943} {"train_loss": -23.82006072998047, "global_step": 161345, "epoch": 1943} {"train_loss": -23.484304428100586, "global_step": 161346, "epoch": 1943} {"train_loss": -23.31863784790039, "global_step": 161347, "epoch": 1943} {"train_loss": -23.674034118652344, "global_step": 161348, "epoch": 1943} {"train_loss": -23.780099868774414, "global_step": 161349, "epoch": 1943} {"train_loss": -23.714380264282227, "global_step": 161350, "epoch": 1943} {"train_loss": -23.482542290745013, "global_step": 161351, "epoch": 1943, "val_loss": 6346939.0} {"train_loss": -23.59341049194336, "global_step": 161352, "epoch": 1944} {"train_loss": -22.72059440612793, "global_step": 161353, "epoch": 1944} {"train_loss": -23.014326095581055, "global_step": 161354, "epoch": 1944} {"train_loss": -23.033857345581055, "global_step": 161355, "epoch": 1944} {"train_loss": -23.6552677154541, "global_step": 161356, "epoch": 1944} {"train_loss": -23.570297241210938, "global_step": 161357, "epoch": 1944} {"train_loss": -23.471416473388672, "global_step": 161358, "epoch": 1944} {"train_loss": -23.191587448120117, "global_step": 161359, "epoch": 1944} {"train_loss": -23.4603271484375, "global_step": 161360, "epoch": 1944} {"train_loss": -23.388851165771484, "global_step": 161361, "epoch": 1944} {"train_loss": -23.46347999572754, "global_step": 161362, "epoch": 1944} {"train_loss": -23.450220108032227, "global_step": 161363, "epoch": 1944} {"train_loss": -23.33119773864746, "global_step": 161364, "epoch": 1944} {"train_loss": -23.431320190429688, "global_step": 161365, "epoch": 1944} {"train_loss": -23.65138053894043, "global_step": 161366, "epoch": 1944} {"train_loss": -23.388925552368164, "global_step": 161367, "epoch": 1944} {"train_loss": -23.5003719329834, "global_step": 161368, "epoch": 1944} {"train_loss": -23.523984909057617, "global_step": 161369, "epoch": 1944} {"train_loss": -23.41768455505371, "global_step": 161370, "epoch": 1944} {"train_loss": -23.676023483276367, "global_step": 161371, "epoch": 1944} {"train_loss": -23.493200302124023, "global_step": 161372, "epoch": 1944} {"train_loss": -23.51070213317871, "global_step": 161373, "epoch": 1944} {"train_loss": -23.42864418029785, "global_step": 161374, "epoch": 1944} {"train_loss": -23.42093849182129, "global_step": 161375, "epoch": 1944} {"train_loss": -23.725858688354492, "global_step": 161376, "epoch": 1944} {"train_loss": -23.835529327392578, "global_step": 161377, "epoch": 1944} {"train_loss": -23.560182571411133, "global_step": 161378, "epoch": 1944} {"train_loss": -23.653573989868164, "global_step": 161379, "epoch": 1944} {"train_loss": -23.37108612060547, "global_step": 161380, "epoch": 1944} {"train_loss": -23.435562133789062, "global_step": 161381, "epoch": 1944} {"train_loss": -23.800100326538086, "global_step": 161382, "epoch": 1944} {"train_loss": -23.523771286010742, "global_step": 161383, "epoch": 1944} {"train_loss": -23.367734909057617, "global_step": 161384, "epoch": 1944} {"train_loss": -23.47256851196289, "global_step": 161385, "epoch": 1944} {"train_loss": -23.199914932250977, "global_step": 161386, "epoch": 1944} {"train_loss": -23.686330795288086, "global_step": 161387, "epoch": 1944} {"train_loss": -23.66777992248535, "global_step": 161388, "epoch": 1944} {"train_loss": -23.045822143554688, "global_step": 161389, "epoch": 1944} {"train_loss": -23.688983917236328, "global_step": 161390, "epoch": 1944} {"train_loss": -23.64693260192871, "global_step": 161391, "epoch": 1944} {"train_loss": -23.50752067565918, "global_step": 161392, "epoch": 1944} {"train_loss": -23.451580047607422, "global_step": 161393, "epoch": 1944} {"train_loss": -22.88161277770996, "global_step": 161394, "epoch": 1944} {"train_loss": -23.566146850585938, "global_step": 161395, "epoch": 1944} {"train_loss": -23.722806930541992, "global_step": 161396, "epoch": 1944} {"train_loss": -23.55618667602539, "global_step": 161397, "epoch": 1944} {"train_loss": -23.543188095092773, "global_step": 161398, "epoch": 1944} {"train_loss": -23.194360733032227, "global_step": 161399, "epoch": 1944} {"train_loss": -23.428388595581055, "global_step": 161400, "epoch": 1944} {"train_loss": -23.169641494750977, "global_step": 161401, "epoch": 1944} {"train_loss": -23.179548263549805, "global_step": 161402, "epoch": 1944} {"train_loss": -23.34259605407715, "global_step": 161403, "epoch": 1944} {"train_loss": -23.33036994934082, "global_step": 161404, "epoch": 1944} {"train_loss": -23.455488204956055, "global_step": 161405, "epoch": 1944} {"train_loss": -23.310415267944336, "global_step": 161406, "epoch": 1944} {"train_loss": -23.442564010620117, "global_step": 161407, "epoch": 1944} {"train_loss": -23.622817993164062, "global_step": 161408, "epoch": 1944} {"train_loss": -22.992177963256836, "global_step": 161409, "epoch": 1944} {"train_loss": -23.3426456451416, "global_step": 161410, "epoch": 1944} {"train_loss": -23.289194107055664, "global_step": 161411, "epoch": 1944} {"train_loss": -23.528982162475586, "global_step": 161412, "epoch": 1944} {"train_loss": -22.965925216674805, "global_step": 161413, "epoch": 1944} {"train_loss": -23.627967834472656, "global_step": 161414, "epoch": 1944} {"train_loss": -23.296995162963867, "global_step": 161415, "epoch": 1944} {"train_loss": -23.184053421020508, "global_step": 161416, "epoch": 1944} {"train_loss": -23.708362579345703, "global_step": 161417, "epoch": 1944} {"train_loss": -23.681564331054688, "global_step": 161418, "epoch": 1944} {"train_loss": -23.528106689453125, "global_step": 161419, "epoch": 1944} {"train_loss": -23.83518409729004, "global_step": 161420, "epoch": 1944} {"train_loss": -23.27880096435547, "global_step": 161421, "epoch": 1944} {"train_loss": -23.71472930908203, "global_step": 161422, "epoch": 1944} {"train_loss": -23.33701515197754, "global_step": 161423, "epoch": 1944} {"train_loss": -23.34661865234375, "global_step": 161424, "epoch": 1944} {"train_loss": -23.707717895507812, "global_step": 161425, "epoch": 1944} {"train_loss": -23.36182975769043, "global_step": 161426, "epoch": 1944} {"train_loss": -23.522245407104492, "global_step": 161427, "epoch": 1944} {"train_loss": -23.855133056640625, "global_step": 161428, "epoch": 1944} {"train_loss": -23.240442276000977, "global_step": 161429, "epoch": 1944} {"train_loss": -23.814611434936523, "global_step": 161430, "epoch": 1944} {"train_loss": -23.38690757751465, "global_step": 161431, "epoch": 1944} {"train_loss": -23.13947105407715, "global_step": 161432, "epoch": 1944} {"train_loss": -23.3956356048584, "global_step": 161433, "epoch": 1944} {"train_loss": -23.439101276627508, "global_step": 161434, "epoch": 1944, "val_loss": 6353997.5} {"train_loss": -23.09283447265625, "global_step": 161435, "epoch": 1945} {"train_loss": -22.655744552612305, "global_step": 161436, "epoch": 1945} {"train_loss": -23.33005714416504, "global_step": 161437, "epoch": 1945} {"train_loss": -23.477445602416992, "global_step": 161438, "epoch": 1945} {"train_loss": -23.265958786010742, "global_step": 161439, "epoch": 1945} {"train_loss": -23.571352005004883, "global_step": 161440, "epoch": 1945} {"train_loss": -23.09734535217285, "global_step": 161441, "epoch": 1945} {"train_loss": -23.18985366821289, "global_step": 161442, "epoch": 1945} {"train_loss": -23.53602409362793, "global_step": 161443, "epoch": 1945} {"train_loss": -23.284208297729492, "global_step": 161444, "epoch": 1945} {"train_loss": -23.214048385620117, "global_step": 161445, "epoch": 1945} {"train_loss": -23.65459442138672, "global_step": 161446, "epoch": 1945} {"train_loss": -23.069700241088867, "global_step": 161447, "epoch": 1945} {"train_loss": -23.741891860961914, "global_step": 161448, "epoch": 1945} {"train_loss": -23.540742874145508, "global_step": 161449, "epoch": 1945} {"train_loss": -23.013046264648438, "global_step": 161450, "epoch": 1945} {"train_loss": -23.692550659179688, "global_step": 161451, "epoch": 1945} {"train_loss": -23.195634841918945, "global_step": 161452, "epoch": 1945} {"train_loss": -23.51959991455078, "global_step": 161453, "epoch": 1945} {"train_loss": -23.60133934020996, "global_step": 161454, "epoch": 1945} {"train_loss": -23.598981857299805, "global_step": 161455, "epoch": 1945} {"train_loss": -23.394094467163086, "global_step": 161456, "epoch": 1945} {"train_loss": -23.76283836364746, "global_step": 161457, "epoch": 1945} {"train_loss": -23.652441024780273, "global_step": 161458, "epoch": 1945} {"train_loss": -23.449752807617188, "global_step": 161459, "epoch": 1945} {"train_loss": -23.466325759887695, "global_step": 161460, "epoch": 1945} {"train_loss": -23.759740829467773, "global_step": 161461, "epoch": 1945} {"train_loss": -23.929931640625, "global_step": 161462, "epoch": 1945} {"train_loss": -23.39182472229004, "global_step": 161463, "epoch": 1945} {"train_loss": -23.76656150817871, "global_step": 161464, "epoch": 1945} {"train_loss": -23.263629913330078, "global_step": 161465, "epoch": 1945} {"train_loss": -23.548965454101562, "global_step": 161466, "epoch": 1945} {"train_loss": -23.591794967651367, "global_step": 161467, "epoch": 1945} {"train_loss": -23.679641723632812, "global_step": 161468, "epoch": 1945} {"train_loss": -23.92890739440918, "global_step": 161469, "epoch": 1945} {"train_loss": -23.919036865234375, "global_step": 161470, "epoch": 1945} {"train_loss": -23.449106216430664, "global_step": 161471, "epoch": 1945} {"train_loss": -23.536849975585938, "global_step": 161472, "epoch": 1945} {"train_loss": -23.590375900268555, "global_step": 161473, "epoch": 1945} {"train_loss": -23.720701217651367, "global_step": 161474, "epoch": 1945} {"train_loss": -23.58620834350586, "global_step": 161475, "epoch": 1945} {"train_loss": -23.68414306640625, "global_step": 161476, "epoch": 1945} {"train_loss": -23.56084632873535, "global_step": 161477, "epoch": 1945} {"train_loss": -23.69602394104004, "global_step": 161478, "epoch": 1945} {"train_loss": -23.49064826965332, "global_step": 161479, "epoch": 1945} {"train_loss": -23.214120864868164, "global_step": 161480, "epoch": 1945} {"train_loss": -23.167104721069336, "global_step": 161481, "epoch": 1945} {"train_loss": -23.168699264526367, "global_step": 161482, "epoch": 1945} {"train_loss": -23.14089584350586, "global_step": 161483, "epoch": 1945} {"train_loss": -23.521595001220703, "global_step": 161484, "epoch": 1945} {"train_loss": -23.51030921936035, "global_step": 161485, "epoch": 1945} {"train_loss": -23.519651412963867, "global_step": 161486, "epoch": 1945} {"train_loss": -23.374513626098633, "global_step": 161487, "epoch": 1945} {"train_loss": -23.477155685424805, "global_step": 161488, "epoch": 1945} {"train_loss": -23.254953384399414, "global_step": 161489, "epoch": 1945} {"train_loss": -23.586698532104492, "global_step": 161490, "epoch": 1945} {"train_loss": -23.828907012939453, "global_step": 161491, "epoch": 1945} {"train_loss": -23.71164321899414, "global_step": 161492, "epoch": 1945} {"train_loss": -23.377798080444336, "global_step": 161493, "epoch": 1945} {"train_loss": -23.492748260498047, "global_step": 161494, "epoch": 1945} {"train_loss": -23.454748153686523, "global_step": 161495, "epoch": 1945} {"train_loss": -23.679981231689453, "global_step": 161496, "epoch": 1945} {"train_loss": -23.726842880249023, "global_step": 161497, "epoch": 1945} {"train_loss": -23.564666748046875, "global_step": 161498, "epoch": 1945} {"train_loss": -23.504539489746094, "global_step": 161499, "epoch": 1945} {"train_loss": -23.601003646850586, "global_step": 161500, "epoch": 1945} {"train_loss": -23.288833618164062, "global_step": 161501, "epoch": 1945} {"train_loss": -23.689285278320312, "global_step": 161502, "epoch": 1945} {"train_loss": -23.4249210357666, "global_step": 161503, "epoch": 1945} {"train_loss": -23.675128936767578, "global_step": 161504, "epoch": 1945} {"train_loss": -23.258520126342773, "global_step": 161505, "epoch": 1945} {"train_loss": -24.0024356842041, "global_step": 161506, "epoch": 1945} {"train_loss": -23.314542770385742, "global_step": 161507, "epoch": 1945} {"train_loss": -23.80263328552246, "global_step": 161508, "epoch": 1945} {"train_loss": -23.671096801757812, "global_step": 161509, "epoch": 1945} {"train_loss": -23.177696228027344, "global_step": 161510, "epoch": 1945} {"train_loss": -23.493305206298828, "global_step": 161511, "epoch": 1945} {"train_loss": -23.7656307220459, "global_step": 161512, "epoch": 1945} {"train_loss": -23.622228622436523, "global_step": 161513, "epoch": 1945} {"train_loss": -23.802587509155273, "global_step": 161514, "epoch": 1945} {"train_loss": -23.690017700195312, "global_step": 161515, "epoch": 1945} {"train_loss": -23.271631240844727, "global_step": 161516, "epoch": 1945} {"train_loss": -23.50553682626012, "global_step": 161517, "epoch": 1945, "val_loss": 6282640.0} {"train_loss": -20.117990493774414, "global_step": 161518, "epoch": 1946} {"train_loss": -21.796213150024414, "global_step": 161519, "epoch": 1946} {"train_loss": -21.08443260192871, "global_step": 161520, "epoch": 1946} {"train_loss": -22.31254005432129, "global_step": 161521, "epoch": 1946} {"train_loss": -21.469881057739258, "global_step": 161522, "epoch": 1946} {"train_loss": -22.459936141967773, "global_step": 161523, "epoch": 1946} {"train_loss": -22.341083526611328, "global_step": 161524, "epoch": 1946} {"train_loss": -22.44837760925293, "global_step": 161525, "epoch": 1946} {"train_loss": -22.472976684570312, "global_step": 161526, "epoch": 1946} {"train_loss": -22.390439987182617, "global_step": 161527, "epoch": 1946} {"train_loss": -22.669599533081055, "global_step": 161528, "epoch": 1946} {"train_loss": -22.745153427124023, "global_step": 161529, "epoch": 1946} {"train_loss": -22.550321578979492, "global_step": 161530, "epoch": 1946} {"train_loss": -22.78571891784668, "global_step": 161531, "epoch": 1946} {"train_loss": -22.564680099487305, "global_step": 161532, "epoch": 1946} {"train_loss": -22.86176872253418, "global_step": 161533, "epoch": 1946} {"train_loss": -23.088687896728516, "global_step": 161534, "epoch": 1946} {"train_loss": -22.80250358581543, "global_step": 161535, "epoch": 1946} {"train_loss": -22.634654998779297, "global_step": 161536, "epoch": 1946} {"train_loss": -22.730712890625, "global_step": 161537, "epoch": 1946} {"train_loss": -22.856534957885742, "global_step": 161538, "epoch": 1946} {"train_loss": -22.766357421875, "global_step": 161539, "epoch": 1946} {"train_loss": -22.621198654174805, "global_step": 161540, "epoch": 1946} {"train_loss": -23.28302574157715, "global_step": 161541, "epoch": 1946} {"train_loss": -23.045551300048828, "global_step": 161542, "epoch": 1946} {"train_loss": -23.092302322387695, "global_step": 161543, "epoch": 1946} {"train_loss": -23.206695556640625, "global_step": 161544, "epoch": 1946} {"train_loss": -23.151594161987305, "global_step": 161545, "epoch": 1946} {"train_loss": -23.185062408447266, "global_step": 161546, "epoch": 1946} {"train_loss": -23.251710891723633, "global_step": 161547, "epoch": 1946} {"train_loss": -23.547887802124023, "global_step": 161548, "epoch": 1946} {"train_loss": -23.506389617919922, "global_step": 161549, "epoch": 1946} {"train_loss": -22.92955780029297, "global_step": 161550, "epoch": 1946} {"train_loss": -23.33273696899414, "global_step": 161551, "epoch": 1946} {"train_loss": -23.32487678527832, "global_step": 161552, "epoch": 1946} {"train_loss": -23.233774185180664, "global_step": 161553, "epoch": 1946} {"train_loss": -23.5043888092041, "global_step": 161554, "epoch": 1946} {"train_loss": -23.183820724487305, "global_step": 161555, "epoch": 1946} {"train_loss": -23.546297073364258, "global_step": 161556, "epoch": 1946} {"train_loss": -23.936437606811523, "global_step": 161557, "epoch": 1946} {"train_loss": -23.674274444580078, "global_step": 161558, "epoch": 1946} {"train_loss": -23.467016220092773, "global_step": 161559, "epoch": 1946} {"train_loss": -23.519723892211914, "global_step": 161560, "epoch": 1946} {"train_loss": -23.447813034057617, "global_step": 161561, "epoch": 1946} {"train_loss": -23.456653594970703, "global_step": 161562, "epoch": 1946} {"train_loss": -23.578428268432617, "global_step": 161563, "epoch": 1946} {"train_loss": -23.32358741760254, "global_step": 161564, "epoch": 1946} {"train_loss": -23.439300537109375, "global_step": 161565, "epoch": 1946} {"train_loss": -23.761911392211914, "global_step": 161566, "epoch": 1946} {"train_loss": -23.26186180114746, "global_step": 161567, "epoch": 1946} {"train_loss": -23.737733840942383, "global_step": 161568, "epoch": 1946} {"train_loss": -23.60074806213379, "global_step": 161569, "epoch": 1946} {"train_loss": -23.139446258544922, "global_step": 161570, "epoch": 1946} {"train_loss": -23.571117401123047, "global_step": 161571, "epoch": 1946} {"train_loss": -23.18105697631836, "global_step": 161572, "epoch": 1946} {"train_loss": -23.37819480895996, "global_step": 161573, "epoch": 1946} {"train_loss": -23.716140747070312, "global_step": 161574, "epoch": 1946} {"train_loss": -23.46689224243164, "global_step": 161575, "epoch": 1946} {"train_loss": -23.732450485229492, "global_step": 161576, "epoch": 1946} {"train_loss": -23.857418060302734, "global_step": 161577, "epoch": 1946} {"train_loss": -23.638614654541016, "global_step": 161578, "epoch": 1946} {"train_loss": -23.5789852142334, "global_step": 161579, "epoch": 1946} {"train_loss": -23.534353256225586, "global_step": 161580, "epoch": 1946} {"train_loss": -23.631521224975586, "global_step": 161581, "epoch": 1946} {"train_loss": -23.81761360168457, "global_step": 161582, "epoch": 1946} {"train_loss": -23.683650970458984, "global_step": 161583, "epoch": 1946} {"train_loss": -23.534116744995117, "global_step": 161584, "epoch": 1946} {"train_loss": -23.365829467773438, "global_step": 161585, "epoch": 1946} {"train_loss": -23.739105224609375, "global_step": 161586, "epoch": 1946} {"train_loss": -23.523832321166992, "global_step": 161587, "epoch": 1946} {"train_loss": -23.72941017150879, "global_step": 161588, "epoch": 1946} {"train_loss": -23.00050163269043, "global_step": 161589, "epoch": 1946} {"train_loss": -23.759532928466797, "global_step": 161590, "epoch": 1946} {"train_loss": -23.618606567382812, "global_step": 161591, "epoch": 1946} {"train_loss": -23.739599227905273, "global_step": 161592, "epoch": 1946} {"train_loss": -23.792089462280273, "global_step": 161593, "epoch": 1946} {"train_loss": -23.667692184448242, "global_step": 161594, "epoch": 1946} {"train_loss": -23.597919464111328, "global_step": 161595, "epoch": 1946} {"train_loss": -23.829647064208984, "global_step": 161596, "epoch": 1946} {"train_loss": -23.882333755493164, "global_step": 161597, "epoch": 1946} {"train_loss": -23.72426414489746, "global_step": 161598, "epoch": 1946} {"train_loss": -23.652570724487305, "global_step": 161599, "epoch": 1946} {"train_loss": -23.186370298086878, "global_step": 161600, "epoch": 1946, "val_loss": 6445421.5} {"train_loss": -21.718778610229492, "global_step": 161601, "epoch": 1947} {"train_loss": -22.927392959594727, "global_step": 161602, "epoch": 1947} {"train_loss": -22.240121841430664, "global_step": 161603, "epoch": 1947} {"train_loss": -23.14456558227539, "global_step": 161604, "epoch": 1947} {"train_loss": -22.707685470581055, "global_step": 161605, "epoch": 1947} {"train_loss": -22.881763458251953, "global_step": 161606, "epoch": 1947} {"train_loss": -22.38317108154297, "global_step": 161607, "epoch": 1947} {"train_loss": -22.132387161254883, "global_step": 161608, "epoch": 1947} {"train_loss": -22.381986618041992, "global_step": 161609, "epoch": 1947} {"train_loss": -22.8742733001709, "global_step": 161610, "epoch": 1947} {"train_loss": -23.036806106567383, "global_step": 161611, "epoch": 1947} {"train_loss": -22.641950607299805, "global_step": 161612, "epoch": 1947} {"train_loss": -22.81247329711914, "global_step": 161613, "epoch": 1947} {"train_loss": -23.01423454284668, "global_step": 161614, "epoch": 1947} {"train_loss": -22.829959869384766, "global_step": 161615, "epoch": 1947} {"train_loss": -23.213773727416992, "global_step": 161616, "epoch": 1947} {"train_loss": -23.145244598388672, "global_step": 161617, "epoch": 1947} {"train_loss": -22.833003997802734, "global_step": 161618, "epoch": 1947} {"train_loss": -23.0234317779541, "global_step": 161619, "epoch": 1947} {"train_loss": -23.281217575073242, "global_step": 161620, "epoch": 1947} {"train_loss": -23.162092208862305, "global_step": 161621, "epoch": 1947} {"train_loss": -23.252609252929688, "global_step": 161622, "epoch": 1947} {"train_loss": -23.094385147094727, "global_step": 161623, "epoch": 1947} {"train_loss": -23.340059280395508, "global_step": 161624, "epoch": 1947} {"train_loss": -23.54006576538086, "global_step": 161625, "epoch": 1947} {"train_loss": -23.20892906188965, "global_step": 161626, "epoch": 1947} {"train_loss": -23.05313491821289, "global_step": 161627, "epoch": 1947} {"train_loss": -23.046842575073242, "global_step": 161628, "epoch": 1947} {"train_loss": -23.54819107055664, "global_step": 161629, "epoch": 1947} {"train_loss": -23.030975341796875, "global_step": 161630, "epoch": 1947} {"train_loss": -23.563405990600586, "global_step": 161631, "epoch": 1947} {"train_loss": -23.44733238220215, "global_step": 161632, "epoch": 1947} {"train_loss": -23.376861572265625, "global_step": 161633, "epoch": 1947} {"train_loss": -23.62373161315918, "global_step": 161634, "epoch": 1947} {"train_loss": -23.104476928710938, "global_step": 161635, "epoch": 1947} {"train_loss": -23.35538673400879, "global_step": 161636, "epoch": 1947} {"train_loss": -23.49363136291504, "global_step": 161637, "epoch": 1947} {"train_loss": -23.3439884185791, "global_step": 161638, "epoch": 1947} {"train_loss": -23.315643310546875, "global_step": 161639, "epoch": 1947} {"train_loss": -23.704404830932617, "global_step": 161640, "epoch": 1947} {"train_loss": -23.56598663330078, "global_step": 161641, "epoch": 1947} {"train_loss": -23.436071395874023, "global_step": 161642, "epoch": 1947} {"train_loss": -23.325786590576172, "global_step": 161643, "epoch": 1947} {"train_loss": -24.16242790222168, "global_step": 161644, "epoch": 1947} {"train_loss": -23.17522621154785, "global_step": 161645, "epoch": 1947} {"train_loss": -23.297744750976562, "global_step": 161646, "epoch": 1947} {"train_loss": -24.117597579956055, "global_step": 161647, "epoch": 1947} {"train_loss": -23.57606315612793, "global_step": 161648, "epoch": 1947} {"train_loss": -23.368200302124023, "global_step": 161649, "epoch": 1947} {"train_loss": -23.43934440612793, "global_step": 161650, "epoch": 1947} {"train_loss": -23.319215774536133, "global_step": 161651, "epoch": 1947} {"train_loss": -23.56021499633789, "global_step": 161652, "epoch": 1947} {"train_loss": -23.465362548828125, "global_step": 161653, "epoch": 1947} {"train_loss": -23.686290740966797, "global_step": 161654, "epoch": 1947} {"train_loss": -24.009828567504883, "global_step": 161655, "epoch": 1947} {"train_loss": -23.629365921020508, "global_step": 161656, "epoch": 1947} {"train_loss": -23.50153160095215, "global_step": 161657, "epoch": 1947} {"train_loss": -23.541263580322266, "global_step": 161658, "epoch": 1947} {"train_loss": -23.566402435302734, "global_step": 161659, "epoch": 1947} {"train_loss": -23.758272171020508, "global_step": 161660, "epoch": 1947} {"train_loss": -23.464859008789062, "global_step": 161661, "epoch": 1947} {"train_loss": -23.721927642822266, "global_step": 161662, "epoch": 1947} {"train_loss": -23.42963981628418, "global_step": 161663, "epoch": 1947} {"train_loss": -23.51552391052246, "global_step": 161664, "epoch": 1947} {"train_loss": -23.152565002441406, "global_step": 161665, "epoch": 1947} {"train_loss": -23.731660842895508, "global_step": 161666, "epoch": 1947} {"train_loss": -23.24915885925293, "global_step": 161667, "epoch": 1947} {"train_loss": -23.38092803955078, "global_step": 161668, "epoch": 1947} {"train_loss": -23.587453842163086, "global_step": 161669, "epoch": 1947} {"train_loss": -23.413681030273438, "global_step": 161670, "epoch": 1947} {"train_loss": -23.683271408081055, "global_step": 161671, "epoch": 1947} {"train_loss": -23.497989654541016, "global_step": 161672, "epoch": 1947} {"train_loss": -23.604022979736328, "global_step": 161673, "epoch": 1947} {"train_loss": -23.751352310180664, "global_step": 161674, "epoch": 1947} {"train_loss": -23.567075729370117, "global_step": 161675, "epoch": 1947} {"train_loss": -23.221494674682617, "global_step": 161676, "epoch": 1947} {"train_loss": -23.811861038208008, "global_step": 161677, "epoch": 1947} {"train_loss": -23.52737808227539, "global_step": 161678, "epoch": 1947} {"train_loss": -23.531530380249023, "global_step": 161679, "epoch": 1947} {"train_loss": -23.362625122070312, "global_step": 161680, "epoch": 1947} {"train_loss": -23.908233642578125, "global_step": 161681, "epoch": 1947} {"train_loss": -23.58344078063965, "global_step": 161682, "epoch": 1947} {"train_loss": -23.31094879701913, "global_step": 161683, "epoch": 1947, "val_loss": 6456663.0} {"train_loss": -22.909931182861328, "global_step": 161684, "epoch": 1948} {"train_loss": -23.020977020263672, "global_step": 161685, "epoch": 1948} {"train_loss": -22.54157257080078, "global_step": 161686, "epoch": 1948} {"train_loss": -22.771238327026367, "global_step": 161687, "epoch": 1948} {"train_loss": -22.950910568237305, "global_step": 161688, "epoch": 1948} {"train_loss": -23.00103187561035, "global_step": 161689, "epoch": 1948} {"train_loss": -22.391939163208008, "global_step": 161690, "epoch": 1948} {"train_loss": -23.203439712524414, "global_step": 161691, "epoch": 1948} {"train_loss": -23.09851837158203, "global_step": 161692, "epoch": 1948} {"train_loss": -22.621423721313477, "global_step": 161693, "epoch": 1948} {"train_loss": -22.96531105041504, "global_step": 161694, "epoch": 1948} {"train_loss": -22.66320037841797, "global_step": 161695, "epoch": 1948} {"train_loss": -23.431339263916016, "global_step": 161696, "epoch": 1948} {"train_loss": -23.069570541381836, "global_step": 161697, "epoch": 1948} {"train_loss": -23.436460494995117, "global_step": 161698, "epoch": 1948} {"train_loss": -23.209226608276367, "global_step": 161699, "epoch": 1948} {"train_loss": -23.023786544799805, "global_step": 161700, "epoch": 1948} {"train_loss": -23.518875122070312, "global_step": 161701, "epoch": 1948} {"train_loss": -23.493656158447266, "global_step": 161702, "epoch": 1948} {"train_loss": -23.410778045654297, "global_step": 161703, "epoch": 1948} {"train_loss": -23.331565856933594, "global_step": 161704, "epoch": 1948} {"train_loss": -23.495033264160156, "global_step": 161705, "epoch": 1948} {"train_loss": -23.432592391967773, "global_step": 161706, "epoch": 1948} {"train_loss": -23.547576904296875, "global_step": 161707, "epoch": 1948} {"train_loss": -23.535146713256836, "global_step": 161708, "epoch": 1948} {"train_loss": -23.705047607421875, "global_step": 161709, "epoch": 1948} {"train_loss": -23.637744903564453, "global_step": 161710, "epoch": 1948} {"train_loss": -23.569183349609375, "global_step": 161711, "epoch": 1948} {"train_loss": -23.787002563476562, "global_step": 161712, "epoch": 1948} {"train_loss": -23.530048370361328, "global_step": 161713, "epoch": 1948} {"train_loss": -23.8480224609375, "global_step": 161714, "epoch": 1948} {"train_loss": -23.74654197692871, "global_step": 161715, "epoch": 1948} {"train_loss": -23.808300018310547, "global_step": 161716, "epoch": 1948} {"train_loss": -23.923730850219727, "global_step": 161717, "epoch": 1948} {"train_loss": -23.391178131103516, "global_step": 161718, "epoch": 1948} {"train_loss": -23.464811325073242, "global_step": 161719, "epoch": 1948} {"train_loss": -23.573034286499023, "global_step": 161720, "epoch": 1948} {"train_loss": -23.922983169555664, "global_step": 161721, "epoch": 1948} {"train_loss": -23.48927879333496, "global_step": 161722, "epoch": 1948} {"train_loss": -23.603839874267578, "global_step": 161723, "epoch": 1948} {"train_loss": -23.484922409057617, "global_step": 161724, "epoch": 1948} {"train_loss": -23.512493133544922, "global_step": 161725, "epoch": 1948} {"train_loss": -23.21552085876465, "global_step": 161726, "epoch": 1948} {"train_loss": -23.4338436126709, "global_step": 161727, "epoch": 1948} {"train_loss": -23.3703556060791, "global_step": 161728, "epoch": 1948} {"train_loss": -23.602859497070312, "global_step": 161729, "epoch": 1948} {"train_loss": -23.64451026916504, "global_step": 161730, "epoch": 1948} {"train_loss": -23.401111602783203, "global_step": 161731, "epoch": 1948} {"train_loss": -23.697351455688477, "global_step": 161732, "epoch": 1948} {"train_loss": -23.926671981811523, "global_step": 161733, "epoch": 1948} {"train_loss": -23.21181297302246, "global_step": 161734, "epoch": 1948} {"train_loss": -23.49243927001953, "global_step": 161735, "epoch": 1948} {"train_loss": -23.953977584838867, "global_step": 161736, "epoch": 1948} {"train_loss": -23.15686798095703, "global_step": 161737, "epoch": 1948} {"train_loss": -23.356678009033203, "global_step": 161738, "epoch": 1948} {"train_loss": -23.619218826293945, "global_step": 161739, "epoch": 1948} {"train_loss": -23.750268936157227, "global_step": 161740, "epoch": 1948} {"train_loss": -23.897581100463867, "global_step": 161741, "epoch": 1948} {"train_loss": -23.47176170349121, "global_step": 161742, "epoch": 1948} {"train_loss": -23.676488876342773, "global_step": 161743, "epoch": 1948} {"train_loss": -23.591596603393555, "global_step": 161744, "epoch": 1948} {"train_loss": -23.621511459350586, "global_step": 161745, "epoch": 1948} {"train_loss": -23.31538200378418, "global_step": 161746, "epoch": 1948} {"train_loss": -23.56129264831543, "global_step": 161747, "epoch": 1948} {"train_loss": -23.616308212280273, "global_step": 161748, "epoch": 1948} {"train_loss": -23.737272262573242, "global_step": 161749, "epoch": 1948} {"train_loss": -23.442480087280273, "global_step": 161750, "epoch": 1948} {"train_loss": -23.54679298400879, "global_step": 161751, "epoch": 1948} {"train_loss": -23.448564529418945, "global_step": 161752, "epoch": 1948} {"train_loss": -23.725299835205078, "global_step": 161753, "epoch": 1948} {"train_loss": -23.398685455322266, "global_step": 161754, "epoch": 1948} {"train_loss": -23.508947372436523, "global_step": 161755, "epoch": 1948} {"train_loss": -23.9752140045166, "global_step": 161756, "epoch": 1948} {"train_loss": -23.455062866210938, "global_step": 161757, "epoch": 1948} {"train_loss": -23.414005279541016, "global_step": 161758, "epoch": 1948} {"train_loss": -23.35561752319336, "global_step": 161759, "epoch": 1948} {"train_loss": -23.4510498046875, "global_step": 161760, "epoch": 1948} {"train_loss": -23.55367088317871, "global_step": 161761, "epoch": 1948} {"train_loss": -23.3366756439209, "global_step": 161762, "epoch": 1948} {"train_loss": -23.614761352539062, "global_step": 161763, "epoch": 1948} {"train_loss": -23.66009521484375, "global_step": 161764, "epoch": 1948} {"train_loss": -23.784093856811523, "global_step": 161765, "epoch": 1948} {"train_loss": -23.451297369347998, "global_step": 161766, "epoch": 1948, "val_loss": 6420925.0} {"train_loss": -23.2453556060791, "global_step": 161767, "epoch": 1949} {"train_loss": -23.082929611206055, "global_step": 161768, "epoch": 1949} {"train_loss": -23.214094161987305, "global_step": 161769, "epoch": 1949} {"train_loss": -23.418941497802734, "global_step": 161770, "epoch": 1949} {"train_loss": -23.498762130737305, "global_step": 161771, "epoch": 1949} {"train_loss": -23.286441802978516, "global_step": 161772, "epoch": 1949} {"train_loss": -23.142810821533203, "global_step": 161773, "epoch": 1949} {"train_loss": -23.42705726623535, "global_step": 161774, "epoch": 1949} {"train_loss": -23.676616668701172, "global_step": 161775, "epoch": 1949} {"train_loss": -23.445465087890625, "global_step": 161776, "epoch": 1949} {"train_loss": -23.373926162719727, "global_step": 161777, "epoch": 1949} {"train_loss": -23.0853271484375, "global_step": 161778, "epoch": 1949} {"train_loss": -23.356143951416016, "global_step": 161779, "epoch": 1949} {"train_loss": -23.156166076660156, "global_step": 161780, "epoch": 1949} {"train_loss": -23.506147384643555, "global_step": 161781, "epoch": 1949} {"train_loss": -23.6104736328125, "global_step": 161782, "epoch": 1949} {"train_loss": -23.565343856811523, "global_step": 161783, "epoch": 1949} {"train_loss": -23.58475685119629, "global_step": 161784, "epoch": 1949} {"train_loss": -23.324962615966797, "global_step": 161785, "epoch": 1949} {"train_loss": -23.54063606262207, "global_step": 161786, "epoch": 1949} {"train_loss": -23.417524337768555, "global_step": 161787, "epoch": 1949} {"train_loss": -23.576007843017578, "global_step": 161788, "epoch": 1949} {"train_loss": -23.382436752319336, "global_step": 161789, "epoch": 1949} {"train_loss": -23.560440063476562, "global_step": 161790, "epoch": 1949} {"train_loss": -23.56001853942871, "global_step": 161791, "epoch": 1949} {"train_loss": -23.454727172851562, "global_step": 161792, "epoch": 1949} {"train_loss": -23.124343872070312, "global_step": 161793, "epoch": 1949} {"train_loss": -23.455997467041016, "global_step": 161794, "epoch": 1949} {"train_loss": -23.48495864868164, "global_step": 161795, "epoch": 1949} {"train_loss": -23.67062759399414, "global_step": 161796, "epoch": 1949} {"train_loss": -22.96548843383789, "global_step": 161797, "epoch": 1949} {"train_loss": -23.49762725830078, "global_step": 161798, "epoch": 1949} {"train_loss": -23.699100494384766, "global_step": 161799, "epoch": 1949} {"train_loss": -23.404268264770508, "global_step": 161800, "epoch": 1949} {"train_loss": -23.409442901611328, "global_step": 161801, "epoch": 1949} {"train_loss": -23.68453025817871, "global_step": 161802, "epoch": 1949} {"train_loss": -23.740371704101562, "global_step": 161803, "epoch": 1949} {"train_loss": -23.84146499633789, "global_step": 161804, "epoch": 1949} {"train_loss": -23.805570602416992, "global_step": 161805, "epoch": 1949} {"train_loss": -23.636505126953125, "global_step": 161806, "epoch": 1949} {"train_loss": -23.572938919067383, "global_step": 161807, "epoch": 1949} {"train_loss": -23.532072067260742, "global_step": 161808, "epoch": 1949} {"train_loss": -23.69662094116211, "global_step": 161809, "epoch": 1949} {"train_loss": -23.636154174804688, "global_step": 161810, "epoch": 1949} {"train_loss": -23.58573341369629, "global_step": 161811, "epoch": 1949} {"train_loss": -23.86087989807129, "global_step": 161812, "epoch": 1949} {"train_loss": -23.62906837463379, "global_step": 161813, "epoch": 1949} {"train_loss": -23.819822311401367, "global_step": 161814, "epoch": 1949} {"train_loss": -23.440963745117188, "global_step": 161815, "epoch": 1949} {"train_loss": -23.898319244384766, "global_step": 161816, "epoch": 1949} {"train_loss": -23.330055236816406, "global_step": 161817, "epoch": 1949} {"train_loss": -23.22287368774414, "global_step": 161818, "epoch": 1949} {"train_loss": -23.646272659301758, "global_step": 161819, "epoch": 1949} {"train_loss": -23.354429244995117, "global_step": 161820, "epoch": 1949} {"train_loss": -23.70196533203125, "global_step": 161821, "epoch": 1949} {"train_loss": -23.36067771911621, "global_step": 161822, "epoch": 1949} {"train_loss": -23.709577560424805, "global_step": 161823, "epoch": 1949} {"train_loss": -23.671239852905273, "global_step": 161824, "epoch": 1949} {"train_loss": -23.593868255615234, "global_step": 161825, "epoch": 1949} {"train_loss": -23.097238540649414, "global_step": 161826, "epoch": 1949} {"train_loss": -23.00937843322754, "global_step": 161827, "epoch": 1949} {"train_loss": -23.559324264526367, "global_step": 161828, "epoch": 1949} {"train_loss": -23.76615333557129, "global_step": 161829, "epoch": 1949} {"train_loss": -24.11429214477539, "global_step": 161830, "epoch": 1949} {"train_loss": -23.88882827758789, "global_step": 161831, "epoch": 1949} {"train_loss": -23.469297409057617, "global_step": 161832, "epoch": 1949} {"train_loss": -23.736392974853516, "global_step": 161833, "epoch": 1949} {"train_loss": -23.851573944091797, "global_step": 161834, "epoch": 1949} {"train_loss": -23.607269287109375, "global_step": 161835, "epoch": 1949} {"train_loss": -23.358978271484375, "global_step": 161836, "epoch": 1949} {"train_loss": -23.581707000732422, "global_step": 161837, "epoch": 1949} {"train_loss": -23.149917602539062, "global_step": 161838, "epoch": 1949} {"train_loss": -23.161909103393555, "global_step": 161839, "epoch": 1949} {"train_loss": -23.11078453063965, "global_step": 161840, "epoch": 1949} {"train_loss": -23.451812744140625, "global_step": 161841, "epoch": 1949} {"train_loss": -23.432044982910156, "global_step": 161842, "epoch": 1949} {"train_loss": -23.432010650634766, "global_step": 161843, "epoch": 1949} {"train_loss": -23.594215393066406, "global_step": 161844, "epoch": 1949} {"train_loss": -23.98826026916504, "global_step": 161845, "epoch": 1949} {"train_loss": -23.60834312438965, "global_step": 161846, "epoch": 1949} {"train_loss": -23.6192684173584, "global_step": 161847, "epoch": 1949} {"train_loss": -23.739648818969727, "global_step": 161848, "epoch": 1949} {"train_loss": -23.519238483474915, "global_step": 161849, "epoch": 1949, "val_loss": 6398961.5} {"train_loss": -23.553327560424805, "global_step": 161850, "epoch": 1950} {"train_loss": -23.15987205505371, "global_step": 161851, "epoch": 1950} {"train_loss": -23.557327270507812, "global_step": 161852, "epoch": 1950} {"train_loss": -23.444454193115234, "global_step": 161853, "epoch": 1950} {"train_loss": -23.3679256439209, "global_step": 161854, "epoch": 1950} {"train_loss": -23.608076095581055, "global_step": 161855, "epoch": 1950} {"train_loss": -23.527963638305664, "global_step": 161856, "epoch": 1950} {"train_loss": -23.314420700073242, "global_step": 161857, "epoch": 1950} {"train_loss": -23.59947967529297, "global_step": 161858, "epoch": 1950} {"train_loss": -23.159337997436523, "global_step": 161859, "epoch": 1950} {"train_loss": -23.4831485748291, "global_step": 161860, "epoch": 1950} {"train_loss": -23.504301071166992, "global_step": 161861, "epoch": 1950} {"train_loss": -23.51726531982422, "global_step": 161862, "epoch": 1950} {"train_loss": -23.34514808654785, "global_step": 161863, "epoch": 1950} {"train_loss": -23.6638240814209, "global_step": 161864, "epoch": 1950} {"train_loss": -23.3750057220459, "global_step": 161865, "epoch": 1950} {"train_loss": -23.15898895263672, "global_step": 161866, "epoch": 1950} {"train_loss": -22.962642669677734, "global_step": 161867, "epoch": 1950} {"train_loss": -23.431610107421875, "global_step": 161868, "epoch": 1950} {"train_loss": -23.525609970092773, "global_step": 161869, "epoch": 1950} {"train_loss": -23.742446899414062, "global_step": 161870, "epoch": 1950} {"train_loss": -23.342397689819336, "global_step": 161871, "epoch": 1950} {"train_loss": -23.431028366088867, "global_step": 161872, "epoch": 1950} {"train_loss": -23.459747314453125, "global_step": 161873, "epoch": 1950} {"train_loss": -23.820526123046875, "global_step": 161874, "epoch": 1950} {"train_loss": -23.439489364624023, "global_step": 161875, "epoch": 1950} {"train_loss": -23.419588088989258, "global_step": 161876, "epoch": 1950} {"train_loss": -23.797651290893555, "global_step": 161877, "epoch": 1950} {"train_loss": -23.761310577392578, "global_step": 161878, "epoch": 1950} {"train_loss": -23.534263610839844, "global_step": 161879, "epoch": 1950} {"train_loss": -23.414352416992188, "global_step": 161880, "epoch": 1950} {"train_loss": -23.956825256347656, "global_step": 161881, "epoch": 1950} {"train_loss": -23.774572372436523, "global_step": 161882, "epoch": 1950} {"train_loss": -23.596416473388672, "global_step": 161883, "epoch": 1950} {"train_loss": -23.890520095825195, "global_step": 161884, "epoch": 1950} {"train_loss": -23.481460571289062, "global_step": 161885, "epoch": 1950} {"train_loss": -23.73708152770996, "global_step": 161886, "epoch": 1950} {"train_loss": -23.172510147094727, "global_step": 161887, "epoch": 1950} {"train_loss": -23.989850997924805, "global_step": 161888, "epoch": 1950} {"train_loss": -23.95387840270996, "global_step": 161889, "epoch": 1950} {"train_loss": -23.79208755493164, "global_step": 161890, "epoch": 1950} {"train_loss": -23.624141693115234, "global_step": 161891, "epoch": 1950} {"train_loss": -23.87120246887207, "global_step": 161892, "epoch": 1950} {"train_loss": -23.21766471862793, "global_step": 161893, "epoch": 1950} {"train_loss": -23.253543853759766, "global_step": 161894, "epoch": 1950} {"train_loss": -22.910749435424805, "global_step": 161895, "epoch": 1950} {"train_loss": -23.21773338317871, "global_step": 161896, "epoch": 1950} {"train_loss": -23.225645065307617, "global_step": 161897, "epoch": 1950} {"train_loss": -23.530847549438477, "global_step": 161898, "epoch": 1950} {"train_loss": -23.61423110961914, "global_step": 161899, "epoch": 1950} {"train_loss": -23.45454216003418, "global_step": 161900, "epoch": 1950} {"train_loss": -23.63034439086914, "global_step": 161901, "epoch": 1950} {"train_loss": -23.080657958984375, "global_step": 161902, "epoch": 1950} {"train_loss": -23.373640060424805, "global_step": 161903, "epoch": 1950} {"train_loss": -23.620487213134766, "global_step": 161904, "epoch": 1950} {"train_loss": -23.72339630126953, "global_step": 161905, "epoch": 1950} {"train_loss": -23.89695167541504, "global_step": 161906, "epoch": 1950} {"train_loss": -23.542644500732422, "global_step": 161907, "epoch": 1950} {"train_loss": -23.875211715698242, "global_step": 161908, "epoch": 1950} {"train_loss": -23.36907958984375, "global_step": 161909, "epoch": 1950} {"train_loss": -23.55811882019043, "global_step": 161910, "epoch": 1950} {"train_loss": -23.636428833007812, "global_step": 161911, "epoch": 1950} {"train_loss": -23.339115142822266, "global_step": 161912, "epoch": 1950} {"train_loss": -23.41731834411621, "global_step": 161913, "epoch": 1950} {"train_loss": -23.760068893432617, "global_step": 161914, "epoch": 1950} {"train_loss": -23.769012451171875, "global_step": 161915, "epoch": 1950} {"train_loss": -23.546676635742188, "global_step": 161916, "epoch": 1950} {"train_loss": -23.32358169555664, "global_step": 161917, "epoch": 1950} {"train_loss": -23.90595817565918, "global_step": 161918, "epoch": 1950} {"train_loss": -23.578798294067383, "global_step": 161919, "epoch": 1950} {"train_loss": -23.578598022460938, "global_step": 161920, "epoch": 1950} {"train_loss": -23.503314971923828, "global_step": 161921, "epoch": 1950} {"train_loss": -23.441312789916992, "global_step": 161922, "epoch": 1950} {"train_loss": -23.59763526916504, "global_step": 161923, "epoch": 1950} {"train_loss": -23.37703514099121, "global_step": 161924, "epoch": 1950} {"train_loss": -23.459196090698242, "global_step": 161925, "epoch": 1950} {"train_loss": -23.57107925415039, "global_step": 161926, "epoch": 1950} {"train_loss": -23.630477905273438, "global_step": 161927, "epoch": 1950} {"train_loss": -23.45288848876953, "global_step": 161928, "epoch": 1950} {"train_loss": -23.545896530151367, "global_step": 161929, "epoch": 1950} {"train_loss": -23.939546585083008, "global_step": 161930, "epoch": 1950} {"train_loss": -23.716108322143555, "global_step": 161931, "epoch": 1950} {"train_loss": -23.528649824211396, "global_step": 161932, "epoch": 1950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6357493.5} {"train_loss": -23.005483627319336, "global_step": 161933, "epoch": 1951} {"train_loss": -22.889652252197266, "global_step": 161934, "epoch": 1951} {"train_loss": -22.299535751342773, "global_step": 161935, "epoch": 1951} {"train_loss": -22.932065963745117, "global_step": 161936, "epoch": 1951} {"train_loss": -22.788846969604492, "global_step": 161937, "epoch": 1951} {"train_loss": -23.14826774597168, "global_step": 161938, "epoch": 1951} {"train_loss": -23.114973068237305, "global_step": 161939, "epoch": 1951} {"train_loss": -22.910070419311523, "global_step": 161940, "epoch": 1951} {"train_loss": -23.499622344970703, "global_step": 161941, "epoch": 1951} {"train_loss": -22.934537887573242, "global_step": 161942, "epoch": 1951} {"train_loss": -22.926448822021484, "global_step": 161943, "epoch": 1951} {"train_loss": -22.895353317260742, "global_step": 161944, "epoch": 1951} {"train_loss": -23.132978439331055, "global_step": 161945, "epoch": 1951} {"train_loss": -23.10711669921875, "global_step": 161946, "epoch": 1951} {"train_loss": -23.102741241455078, "global_step": 161947, "epoch": 1951} {"train_loss": -23.131967544555664, "global_step": 161948, "epoch": 1951} {"train_loss": -23.134138107299805, "global_step": 161949, "epoch": 1951} {"train_loss": -23.25481605529785, "global_step": 161950, "epoch": 1951} {"train_loss": -22.887853622436523, "global_step": 161951, "epoch": 1951} {"train_loss": -23.152219772338867, "global_step": 161952, "epoch": 1951} {"train_loss": -23.631778717041016, "global_step": 161953, "epoch": 1951} {"train_loss": -23.35512924194336, "global_step": 161954, "epoch": 1951} {"train_loss": -23.43125343322754, "global_step": 161955, "epoch": 1951} {"train_loss": -23.65740203857422, "global_step": 161956, "epoch": 1951} {"train_loss": -23.38431739807129, "global_step": 161957, "epoch": 1951} {"train_loss": -23.309335708618164, "global_step": 161958, "epoch": 1951} {"train_loss": -23.534912109375, "global_step": 161959, "epoch": 1951} {"train_loss": -23.32795524597168, "global_step": 161960, "epoch": 1951} {"train_loss": -23.10080337524414, "global_step": 161961, "epoch": 1951} {"train_loss": -23.08373260498047, "global_step": 161962, "epoch": 1951} {"train_loss": -23.271703720092773, "global_step": 161963, "epoch": 1951} {"train_loss": -23.276775360107422, "global_step": 161964, "epoch": 1951} {"train_loss": -23.30950164794922, "global_step": 161965, "epoch": 1951} {"train_loss": -23.36988067626953, "global_step": 161966, "epoch": 1951} {"train_loss": -23.329734802246094, "global_step": 161967, "epoch": 1951} {"train_loss": -23.711994171142578, "global_step": 161968, "epoch": 1951} {"train_loss": -23.68891716003418, "global_step": 161969, "epoch": 1951} {"train_loss": -23.64841651916504, "global_step": 161970, "epoch": 1951} {"train_loss": -23.54178810119629, "global_step": 161971, "epoch": 1951} {"train_loss": -23.596349716186523, "global_step": 161972, "epoch": 1951} {"train_loss": -23.71530532836914, "global_step": 161973, "epoch": 1951} {"train_loss": -23.19144630432129, "global_step": 161974, "epoch": 1951} {"train_loss": -23.305158615112305, "global_step": 161975, "epoch": 1951} {"train_loss": -23.2912540435791, "global_step": 161976, "epoch": 1951} {"train_loss": -23.27863311767578, "global_step": 161977, "epoch": 1951} {"train_loss": -23.1483154296875, "global_step": 161978, "epoch": 1951} {"train_loss": -23.01239585876465, "global_step": 161979, "epoch": 1951} {"train_loss": -23.623090744018555, "global_step": 161980, "epoch": 1951} {"train_loss": -23.489818572998047, "global_step": 161981, "epoch": 1951} {"train_loss": -23.394302368164062, "global_step": 161982, "epoch": 1951} {"train_loss": -23.6178035736084, "global_step": 161983, "epoch": 1951} {"train_loss": -23.868316650390625, "global_step": 161984, "epoch": 1951} {"train_loss": -24.059539794921875, "global_step": 161985, "epoch": 1951} {"train_loss": -23.611282348632812, "global_step": 161986, "epoch": 1951} {"train_loss": -23.93116569519043, "global_step": 161987, "epoch": 1951} {"train_loss": -23.361154556274414, "global_step": 161988, "epoch": 1951} {"train_loss": -23.51422691345215, "global_step": 161989, "epoch": 1951} {"train_loss": -23.01333999633789, "global_step": 161990, "epoch": 1951} {"train_loss": -23.577625274658203, "global_step": 161991, "epoch": 1951} {"train_loss": -23.55543327331543, "global_step": 161992, "epoch": 1951} {"train_loss": -23.21868133544922, "global_step": 161993, "epoch": 1951} {"train_loss": -23.50081443786621, "global_step": 161994, "epoch": 1951} {"train_loss": -23.751996994018555, "global_step": 161995, "epoch": 1951} {"train_loss": -23.8124942779541, "global_step": 161996, "epoch": 1951} {"train_loss": -23.501909255981445, "global_step": 161997, "epoch": 1951} {"train_loss": -23.71143913269043, "global_step": 161998, "epoch": 1951} {"train_loss": -23.485258102416992, "global_step": 161999, "epoch": 1951} {"train_loss": -23.93512725830078, "global_step": 162000, "epoch": 1951} {"train_loss": -23.908878326416016, "global_step": 162001, "epoch": 1951} {"train_loss": -23.603139877319336, "global_step": 162002, "epoch": 1951} {"train_loss": -23.32033348083496, "global_step": 162003, "epoch": 1951} {"train_loss": -23.334125518798828, "global_step": 162004, "epoch": 1951} {"train_loss": -23.12061882019043, "global_step": 162005, "epoch": 1951} {"train_loss": -23.572607040405273, "global_step": 162006, "epoch": 1951} {"train_loss": -23.0258846282959, "global_step": 162007, "epoch": 1951} {"train_loss": -23.460739135742188, "global_step": 162008, "epoch": 1951} {"train_loss": -23.38361167907715, "global_step": 162009, "epoch": 1951} {"train_loss": -23.658428192138672, "global_step": 162010, "epoch": 1951} {"train_loss": -23.47010612487793, "global_step": 162011, "epoch": 1951} {"train_loss": -23.562286376953125, "global_step": 162012, "epoch": 1951} {"train_loss": -23.83746910095215, "global_step": 162013, "epoch": 1951} {"train_loss": -23.56171417236328, "global_step": 162014, "epoch": 1951} {"train_loss": -23.37001775258995, "global_step": 162015, "epoch": 1951, "val_loss": 6320433.0} {"train_loss": -22.355518341064453, "global_step": 162016, "epoch": 1952} {"train_loss": -22.945192337036133, "global_step": 162017, "epoch": 1952} {"train_loss": -22.71292495727539, "global_step": 162018, "epoch": 1952} {"train_loss": -23.223440170288086, "global_step": 162019, "epoch": 1952} {"train_loss": -22.223020553588867, "global_step": 162020, "epoch": 1952} {"train_loss": -22.696863174438477, "global_step": 162021, "epoch": 1952} {"train_loss": -23.021055221557617, "global_step": 162022, "epoch": 1952} {"train_loss": -22.9790096282959, "global_step": 162023, "epoch": 1952} {"train_loss": -23.099363327026367, "global_step": 162024, "epoch": 1952} {"train_loss": -22.902158737182617, "global_step": 162025, "epoch": 1952} {"train_loss": -22.838369369506836, "global_step": 162026, "epoch": 1952} {"train_loss": -23.07239532470703, "global_step": 162027, "epoch": 1952} {"train_loss": -23.11874771118164, "global_step": 162028, "epoch": 1952} {"train_loss": -22.793838500976562, "global_step": 162029, "epoch": 1952} {"train_loss": -22.946125030517578, "global_step": 162030, "epoch": 1952} {"train_loss": -22.95015525817871, "global_step": 162031, "epoch": 1952} {"train_loss": -23.410812377929688, "global_step": 162032, "epoch": 1952} {"train_loss": -22.887422561645508, "global_step": 162033, "epoch": 1952} {"train_loss": -22.974172592163086, "global_step": 162034, "epoch": 1952} {"train_loss": -22.956783294677734, "global_step": 162035, "epoch": 1952} {"train_loss": -23.081247329711914, "global_step": 162036, "epoch": 1952} {"train_loss": -22.904541015625, "global_step": 162037, "epoch": 1952} {"train_loss": -23.281721115112305, "global_step": 162038, "epoch": 1952} {"train_loss": -23.707860946655273, "global_step": 162039, "epoch": 1952} {"train_loss": -23.415746688842773, "global_step": 162040, "epoch": 1952} {"train_loss": -23.569063186645508, "global_step": 162041, "epoch": 1952} {"train_loss": -23.0885066986084, "global_step": 162042, "epoch": 1952} {"train_loss": -23.386144638061523, "global_step": 162043, "epoch": 1952} {"train_loss": -23.775745391845703, "global_step": 162044, "epoch": 1952} {"train_loss": -23.563138961791992, "global_step": 162045, "epoch": 1952} {"train_loss": -23.785856246948242, "global_step": 162046, "epoch": 1952} {"train_loss": -23.436521530151367, "global_step": 162047, "epoch": 1952} {"train_loss": -23.622465133666992, "global_step": 162048, "epoch": 1952} {"train_loss": -23.363821029663086, "global_step": 162049, "epoch": 1952} {"train_loss": -23.708269119262695, "global_step": 162050, "epoch": 1952} {"train_loss": -23.393253326416016, "global_step": 162051, "epoch": 1952} {"train_loss": -23.454992294311523, "global_step": 162052, "epoch": 1952} {"train_loss": -23.891979217529297, "global_step": 162053, "epoch": 1952} {"train_loss": -23.58228874206543, "global_step": 162054, "epoch": 1952} {"train_loss": -23.469554901123047, "global_step": 162055, "epoch": 1952} {"train_loss": -23.715316772460938, "global_step": 162056, "epoch": 1952} {"train_loss": -23.393383026123047, "global_step": 162057, "epoch": 1952} {"train_loss": -23.65155029296875, "global_step": 162058, "epoch": 1952} {"train_loss": -23.751243591308594, "global_step": 162059, "epoch": 1952} {"train_loss": -23.88821792602539, "global_step": 162060, "epoch": 1952} {"train_loss": -23.527616500854492, "global_step": 162061, "epoch": 1952} {"train_loss": -23.395769119262695, "global_step": 162062, "epoch": 1952} {"train_loss": -23.88498878479004, "global_step": 162063, "epoch": 1952} {"train_loss": -23.594358444213867, "global_step": 162064, "epoch": 1952} {"train_loss": -23.355056762695312, "global_step": 162065, "epoch": 1952} {"train_loss": -23.90598487854004, "global_step": 162066, "epoch": 1952} {"train_loss": -23.346845626831055, "global_step": 162067, "epoch": 1952} {"train_loss": -23.566701889038086, "global_step": 162068, "epoch": 1952} {"train_loss": -23.818706512451172, "global_step": 162069, "epoch": 1952} {"train_loss": -23.524789810180664, "global_step": 162070, "epoch": 1952} {"train_loss": -23.567596435546875, "global_step": 162071, "epoch": 1952} {"train_loss": -23.45253562927246, "global_step": 162072, "epoch": 1952} {"train_loss": -23.38374900817871, "global_step": 162073, "epoch": 1952} {"train_loss": -23.662485122680664, "global_step": 162074, "epoch": 1952} {"train_loss": -23.68830680847168, "global_step": 162075, "epoch": 1952} {"train_loss": -23.614425659179688, "global_step": 162076, "epoch": 1952} {"train_loss": -23.587125778198242, "global_step": 162077, "epoch": 1952} {"train_loss": -23.087854385375977, "global_step": 162078, "epoch": 1952} {"train_loss": -23.268888473510742, "global_step": 162079, "epoch": 1952} {"train_loss": -23.721939086914062, "global_step": 162080, "epoch": 1952} {"train_loss": -23.410751342773438, "global_step": 162081, "epoch": 1952} {"train_loss": -23.578378677368164, "global_step": 162082, "epoch": 1952} {"train_loss": -23.121685028076172, "global_step": 162083, "epoch": 1952} {"train_loss": -23.41473960876465, "global_step": 162084, "epoch": 1952} {"train_loss": -23.243589401245117, "global_step": 162085, "epoch": 1952} {"train_loss": -23.315937042236328, "global_step": 162086, "epoch": 1952} {"train_loss": -23.347095489501953, "global_step": 162087, "epoch": 1952} {"train_loss": -23.652883529663086, "global_step": 162088, "epoch": 1952} {"train_loss": -23.567323684692383, "global_step": 162089, "epoch": 1952} {"train_loss": -23.627737045288086, "global_step": 162090, "epoch": 1952} {"train_loss": -23.385629653930664, "global_step": 162091, "epoch": 1952} {"train_loss": -23.75493049621582, "global_step": 162092, "epoch": 1952} {"train_loss": -23.8439884185791, "global_step": 162093, "epoch": 1952} {"train_loss": -23.72198486328125, "global_step": 162094, "epoch": 1952} {"train_loss": -23.37445068359375, "global_step": 162095, "epoch": 1952} {"train_loss": -23.991931915283203, "global_step": 162096, "epoch": 1952} {"train_loss": -23.674453735351562, "global_step": 162097, "epoch": 1952} {"train_loss": -23.389919143125237, "global_step": 162098, "epoch": 1952, "val_loss": 6363978.5} {"train_loss": -22.019681930541992, "global_step": 162099, "epoch": 1953} {"train_loss": -22.44053077697754, "global_step": 162100, "epoch": 1953} {"train_loss": -23.42246437072754, "global_step": 162101, "epoch": 1953} {"train_loss": -23.217313766479492, "global_step": 162102, "epoch": 1953} {"train_loss": -23.058252334594727, "global_step": 162103, "epoch": 1953} {"train_loss": -23.163715362548828, "global_step": 162104, "epoch": 1953} {"train_loss": -22.57087516784668, "global_step": 162105, "epoch": 1953} {"train_loss": -23.043386459350586, "global_step": 162106, "epoch": 1953} {"train_loss": -23.311254501342773, "global_step": 162107, "epoch": 1953} {"train_loss": -22.840517044067383, "global_step": 162108, "epoch": 1953} {"train_loss": -23.134252548217773, "global_step": 162109, "epoch": 1953} {"train_loss": -23.158201217651367, "global_step": 162110, "epoch": 1953} {"train_loss": -23.200504302978516, "global_step": 162111, "epoch": 1953} {"train_loss": -23.055143356323242, "global_step": 162112, "epoch": 1953} {"train_loss": -22.857074737548828, "global_step": 162113, "epoch": 1953} {"train_loss": -23.568872451782227, "global_step": 162114, "epoch": 1953} {"train_loss": -23.47658348083496, "global_step": 162115, "epoch": 1953} {"train_loss": -23.24503517150879, "global_step": 162116, "epoch": 1953} {"train_loss": -23.556360244750977, "global_step": 162117, "epoch": 1953} {"train_loss": -23.223838806152344, "global_step": 162118, "epoch": 1953} {"train_loss": -23.376296997070312, "global_step": 162119, "epoch": 1953} {"train_loss": -23.286930084228516, "global_step": 162120, "epoch": 1953} {"train_loss": -23.39361572265625, "global_step": 162121, "epoch": 1953} {"train_loss": -23.67946434020996, "global_step": 162122, "epoch": 1953} {"train_loss": -23.60019874572754, "global_step": 162123, "epoch": 1953} {"train_loss": -23.72397232055664, "global_step": 162124, "epoch": 1953} {"train_loss": -23.522069931030273, "global_step": 162125, "epoch": 1953} {"train_loss": -23.33065414428711, "global_step": 162126, "epoch": 1953} {"train_loss": -23.38154411315918, "global_step": 162127, "epoch": 1953} {"train_loss": -23.48202896118164, "global_step": 162128, "epoch": 1953} {"train_loss": -23.793615341186523, "global_step": 162129, "epoch": 1953} {"train_loss": -23.408422470092773, "global_step": 162130, "epoch": 1953} {"train_loss": -23.516897201538086, "global_step": 162131, "epoch": 1953} {"train_loss": -23.507787704467773, "global_step": 162132, "epoch": 1953} {"train_loss": -23.616535186767578, "global_step": 162133, "epoch": 1953} {"train_loss": -23.870468139648438, "global_step": 162134, "epoch": 1953} {"train_loss": -23.83829689025879, "global_step": 162135, "epoch": 1953} {"train_loss": -23.72113609313965, "global_step": 162136, "epoch": 1953} {"train_loss": -23.568906784057617, "global_step": 162137, "epoch": 1953} {"train_loss": -23.917098999023438, "global_step": 162138, "epoch": 1953} {"train_loss": -23.775999069213867, "global_step": 162139, "epoch": 1953} {"train_loss": -23.4610652923584, "global_step": 162140, "epoch": 1953} {"train_loss": -23.77486228942871, "global_step": 162141, "epoch": 1953} {"train_loss": -23.663251876831055, "global_step": 162142, "epoch": 1953} {"train_loss": -23.33957862854004, "global_step": 162143, "epoch": 1953} {"train_loss": -23.7838134765625, "global_step": 162144, "epoch": 1953} {"train_loss": -23.448375701904297, "global_step": 162145, "epoch": 1953} {"train_loss": -23.635757446289062, "global_step": 162146, "epoch": 1953} {"train_loss": -23.193490982055664, "global_step": 162147, "epoch": 1953} {"train_loss": -23.823698043823242, "global_step": 162148, "epoch": 1953} {"train_loss": -23.721765518188477, "global_step": 162149, "epoch": 1953} {"train_loss": -23.888038635253906, "global_step": 162150, "epoch": 1953} {"train_loss": -23.414968490600586, "global_step": 162151, "epoch": 1953} {"train_loss": -23.958349227905273, "global_step": 162152, "epoch": 1953} {"train_loss": -23.737194061279297, "global_step": 162153, "epoch": 1953} {"train_loss": -23.58290672302246, "global_step": 162154, "epoch": 1953} {"train_loss": -23.367555618286133, "global_step": 162155, "epoch": 1953} {"train_loss": -23.5299072265625, "global_step": 162156, "epoch": 1953} {"train_loss": -23.127748489379883, "global_step": 162157, "epoch": 1953} {"train_loss": -23.772104263305664, "global_step": 162158, "epoch": 1953} {"train_loss": -23.432260513305664, "global_step": 162159, "epoch": 1953} {"train_loss": -23.768468856811523, "global_step": 162160, "epoch": 1953} {"train_loss": -23.092243194580078, "global_step": 162161, "epoch": 1953} {"train_loss": -23.76936912536621, "global_step": 162162, "epoch": 1953} {"train_loss": -23.707584381103516, "global_step": 162163, "epoch": 1953} {"train_loss": -23.59079360961914, "global_step": 162164, "epoch": 1953} {"train_loss": -23.69750213623047, "global_step": 162165, "epoch": 1953} {"train_loss": -23.65622901916504, "global_step": 162166, "epoch": 1953} {"train_loss": -23.806997299194336, "global_step": 162167, "epoch": 1953} {"train_loss": -23.3978271484375, "global_step": 162168, "epoch": 1953} {"train_loss": -23.25629997253418, "global_step": 162169, "epoch": 1953} {"train_loss": -23.436016082763672, "global_step": 162170, "epoch": 1953} {"train_loss": -23.335172653198242, "global_step": 162171, "epoch": 1953} {"train_loss": -23.739606857299805, "global_step": 162172, "epoch": 1953} {"train_loss": -23.562524795532227, "global_step": 162173, "epoch": 1953} {"train_loss": -23.753721237182617, "global_step": 162174, "epoch": 1953} {"train_loss": -23.323095321655273, "global_step": 162175, "epoch": 1953} {"train_loss": -23.517929077148438, "global_step": 162176, "epoch": 1953} {"train_loss": -23.816072463989258, "global_step": 162177, "epoch": 1953} {"train_loss": -23.351591110229492, "global_step": 162178, "epoch": 1953} {"train_loss": -23.797780990600586, "global_step": 162179, "epoch": 1953} {"train_loss": -23.55116844177246, "global_step": 162180, "epoch": 1953} {"train_loss": -23.46221735391272, "global_step": 162181, "epoch": 1953, "val_loss": 6324672.5} {"train_loss": -22.346372604370117, "global_step": 162182, "epoch": 1954} {"train_loss": -22.28951072692871, "global_step": 162183, "epoch": 1954} {"train_loss": -23.467227935791016, "global_step": 162184, "epoch": 1954} {"train_loss": -22.82929039001465, "global_step": 162185, "epoch": 1954} {"train_loss": -22.58307647705078, "global_step": 162186, "epoch": 1954} {"train_loss": -23.031442642211914, "global_step": 162187, "epoch": 1954} {"train_loss": -23.147172927856445, "global_step": 162188, "epoch": 1954} {"train_loss": -23.285892486572266, "global_step": 162189, "epoch": 1954} {"train_loss": -22.97317886352539, "global_step": 162190, "epoch": 1954} {"train_loss": -23.35042381286621, "global_step": 162191, "epoch": 1954} {"train_loss": -23.070743560791016, "global_step": 162192, "epoch": 1954} {"train_loss": -22.905698776245117, "global_step": 162193, "epoch": 1954} {"train_loss": -23.41771697998047, "global_step": 162194, "epoch": 1954} {"train_loss": -22.926305770874023, "global_step": 162195, "epoch": 1954} {"train_loss": -23.16094970703125, "global_step": 162196, "epoch": 1954} {"train_loss": -23.22968101501465, "global_step": 162197, "epoch": 1954} {"train_loss": -23.826038360595703, "global_step": 162198, "epoch": 1954} {"train_loss": -23.6621150970459, "global_step": 162199, "epoch": 1954} {"train_loss": -23.2734317779541, "global_step": 162200, "epoch": 1954} {"train_loss": -23.350299835205078, "global_step": 162201, "epoch": 1954} {"train_loss": -23.534950256347656, "global_step": 162202, "epoch": 1954} {"train_loss": -23.7934627532959, "global_step": 162203, "epoch": 1954} {"train_loss": -23.442461013793945, "global_step": 162204, "epoch": 1954} {"train_loss": -23.357654571533203, "global_step": 162205, "epoch": 1954} {"train_loss": -23.431299209594727, "global_step": 162206, "epoch": 1954} {"train_loss": -23.109159469604492, "global_step": 162207, "epoch": 1954} {"train_loss": -23.340330123901367, "global_step": 162208, "epoch": 1954} {"train_loss": -23.600271224975586, "global_step": 162209, "epoch": 1954} {"train_loss": -23.580780029296875, "global_step": 162210, "epoch": 1954} {"train_loss": -23.586816787719727, "global_step": 162211, "epoch": 1954} {"train_loss": -23.439495086669922, "global_step": 162212, "epoch": 1954} {"train_loss": -23.56328773498535, "global_step": 162213, "epoch": 1954} {"train_loss": -23.59872817993164, "global_step": 162214, "epoch": 1954} {"train_loss": -23.563024520874023, "global_step": 162215, "epoch": 1954} {"train_loss": -23.174095153808594, "global_step": 162216, "epoch": 1954} {"train_loss": -23.483129501342773, "global_step": 162217, "epoch": 1954} {"train_loss": -23.68203353881836, "global_step": 162218, "epoch": 1954} {"train_loss": -23.501388549804688, "global_step": 162219, "epoch": 1954} {"train_loss": -23.779613494873047, "global_step": 162220, "epoch": 1954} {"train_loss": -23.24964141845703, "global_step": 162221, "epoch": 1954} {"train_loss": -24.012493133544922, "global_step": 162222, "epoch": 1954} {"train_loss": -23.74703025817871, "global_step": 162223, "epoch": 1954} {"train_loss": -23.3393611907959, "global_step": 162224, "epoch": 1954} {"train_loss": -23.581602096557617, "global_step": 162225, "epoch": 1954} {"train_loss": -23.507509231567383, "global_step": 162226, "epoch": 1954} {"train_loss": -23.534746170043945, "global_step": 162227, "epoch": 1954} {"train_loss": -23.40325355529785, "global_step": 162228, "epoch": 1954} {"train_loss": -23.71277618408203, "global_step": 162229, "epoch": 1954} {"train_loss": -23.07942008972168, "global_step": 162230, "epoch": 1954} {"train_loss": -23.707565307617188, "global_step": 162231, "epoch": 1954} {"train_loss": -23.658002853393555, "global_step": 162232, "epoch": 1954} {"train_loss": -23.12531852722168, "global_step": 162233, "epoch": 1954} {"train_loss": -23.54296875, "global_step": 162234, "epoch": 1954} {"train_loss": -23.52823829650879, "global_step": 162235, "epoch": 1954} {"train_loss": -23.736841201782227, "global_step": 162236, "epoch": 1954} {"train_loss": -23.01433563232422, "global_step": 162237, "epoch": 1954} {"train_loss": -23.486364364624023, "global_step": 162238, "epoch": 1954} {"train_loss": -23.573749542236328, "global_step": 162239, "epoch": 1954} {"train_loss": -23.801576614379883, "global_step": 162240, "epoch": 1954} {"train_loss": -23.107847213745117, "global_step": 162241, "epoch": 1954} {"train_loss": -23.158933639526367, "global_step": 162242, "epoch": 1954} {"train_loss": -23.364423751831055, "global_step": 162243, "epoch": 1954} {"train_loss": -23.467565536499023, "global_step": 162244, "epoch": 1954} {"train_loss": -23.715532302856445, "global_step": 162245, "epoch": 1954} {"train_loss": -23.534915924072266, "global_step": 162246, "epoch": 1954} {"train_loss": -23.438810348510742, "global_step": 162247, "epoch": 1954} {"train_loss": -23.49574089050293, "global_step": 162248, "epoch": 1954} {"train_loss": -23.564870834350586, "global_step": 162249, "epoch": 1954} {"train_loss": -23.576519012451172, "global_step": 162250, "epoch": 1954} {"train_loss": -23.436410903930664, "global_step": 162251, "epoch": 1954} {"train_loss": -23.435415267944336, "global_step": 162252, "epoch": 1954} {"train_loss": -23.6157169342041, "global_step": 162253, "epoch": 1954} {"train_loss": -23.862707138061523, "global_step": 162254, "epoch": 1954} {"train_loss": -23.639198303222656, "global_step": 162255, "epoch": 1954} {"train_loss": -23.670698165893555, "global_step": 162256, "epoch": 1954} {"train_loss": -23.948911666870117, "global_step": 162257, "epoch": 1954} {"train_loss": -23.821521759033203, "global_step": 162258, "epoch": 1954} {"train_loss": -23.674346923828125, "global_step": 162259, "epoch": 1954} {"train_loss": -23.172870635986328, "global_step": 162260, "epoch": 1954} {"train_loss": -22.784048080444336, "global_step": 162261, "epoch": 1954} {"train_loss": -23.26179313659668, "global_step": 162262, "epoch": 1954} {"train_loss": -23.467336654663086, "global_step": 162263, "epoch": 1954} {"train_loss": -23.406102697533296, "global_step": 162264, "epoch": 1954, "val_loss": 6279540.0} {"train_loss": -21.959402084350586, "global_step": 162265, "epoch": 1955} {"train_loss": -22.934171676635742, "global_step": 162266, "epoch": 1955} {"train_loss": -22.701229095458984, "global_step": 162267, "epoch": 1955} {"train_loss": -23.020477294921875, "global_step": 162268, "epoch": 1955} {"train_loss": -22.663253784179688, "global_step": 162269, "epoch": 1955} {"train_loss": -23.29783058166504, "global_step": 162270, "epoch": 1955} {"train_loss": -22.53388786315918, "global_step": 162271, "epoch": 1955} {"train_loss": -22.96742057800293, "global_step": 162272, "epoch": 1955} {"train_loss": -22.619632720947266, "global_step": 162273, "epoch": 1955} {"train_loss": -23.25950813293457, "global_step": 162274, "epoch": 1955} {"train_loss": -22.872838973999023, "global_step": 162275, "epoch": 1955} {"train_loss": -22.9655818939209, "global_step": 162276, "epoch": 1955} {"train_loss": -23.428049087524414, "global_step": 162277, "epoch": 1955} {"train_loss": -23.15498924255371, "global_step": 162278, "epoch": 1955} {"train_loss": -23.2225399017334, "global_step": 162279, "epoch": 1955} {"train_loss": -23.381582260131836, "global_step": 162280, "epoch": 1955} {"train_loss": -23.155197143554688, "global_step": 162281, "epoch": 1955} {"train_loss": -23.29729652404785, "global_step": 162282, "epoch": 1955} {"train_loss": -22.849857330322266, "global_step": 162283, "epoch": 1955} {"train_loss": -23.332950592041016, "global_step": 162284, "epoch": 1955} {"train_loss": -23.15839958190918, "global_step": 162285, "epoch": 1955} {"train_loss": -23.34197235107422, "global_step": 162286, "epoch": 1955} {"train_loss": -23.879972457885742, "global_step": 162287, "epoch": 1955} {"train_loss": -23.243436813354492, "global_step": 162288, "epoch": 1955} {"train_loss": -23.461170196533203, "global_step": 162289, "epoch": 1955} {"train_loss": -23.1545467376709, "global_step": 162290, "epoch": 1955} {"train_loss": -23.475248336791992, "global_step": 162291, "epoch": 1955} {"train_loss": -23.371551513671875, "global_step": 162292, "epoch": 1955} {"train_loss": -23.4925479888916, "global_step": 162293, "epoch": 1955} {"train_loss": -23.59670066833496, "global_step": 162294, "epoch": 1955} {"train_loss": -23.13623046875, "global_step": 162295, "epoch": 1955} {"train_loss": -23.714801788330078, "global_step": 162296, "epoch": 1955} {"train_loss": -23.360107421875, "global_step": 162297, "epoch": 1955} {"train_loss": -23.655590057373047, "global_step": 162298, "epoch": 1955} {"train_loss": -23.78053855895996, "global_step": 162299, "epoch": 1955} {"train_loss": -23.549293518066406, "global_step": 162300, "epoch": 1955} {"train_loss": -23.880281448364258, "global_step": 162301, "epoch": 1955} {"train_loss": -23.46297264099121, "global_step": 162302, "epoch": 1955} {"train_loss": -23.678991317749023, "global_step": 162303, "epoch": 1955} {"train_loss": -23.806570053100586, "global_step": 162304, "epoch": 1955} {"train_loss": -23.613981246948242, "global_step": 162305, "epoch": 1955} {"train_loss": -23.727811813354492, "global_step": 162306, "epoch": 1955} {"train_loss": -23.859167098999023, "global_step": 162307, "epoch": 1955} {"train_loss": -23.226825714111328, "global_step": 162308, "epoch": 1955} {"train_loss": -23.26706314086914, "global_step": 162309, "epoch": 1955} {"train_loss": -23.474729537963867, "global_step": 162310, "epoch": 1955} {"train_loss": -23.399845123291016, "global_step": 162311, "epoch": 1955} {"train_loss": -23.49030113220215, "global_step": 162312, "epoch": 1955} {"train_loss": -23.517898559570312, "global_step": 162313, "epoch": 1955} {"train_loss": -23.568466186523438, "global_step": 162314, "epoch": 1955} {"train_loss": -23.134031295776367, "global_step": 162315, "epoch": 1955} {"train_loss": -23.33228874206543, "global_step": 162316, "epoch": 1955} {"train_loss": -23.402000427246094, "global_step": 162317, "epoch": 1955} {"train_loss": -23.352033615112305, "global_step": 162318, "epoch": 1955} {"train_loss": -23.545873641967773, "global_step": 162319, "epoch": 1955} {"train_loss": -23.684972763061523, "global_step": 162320, "epoch": 1955} {"train_loss": -23.74112319946289, "global_step": 162321, "epoch": 1955} {"train_loss": -23.67500114440918, "global_step": 162322, "epoch": 1955} {"train_loss": -23.335128784179688, "global_step": 162323, "epoch": 1955} {"train_loss": -23.556913375854492, "global_step": 162324, "epoch": 1955} {"train_loss": -23.719337463378906, "global_step": 162325, "epoch": 1955} {"train_loss": -23.741132736206055, "global_step": 162326, "epoch": 1955} {"train_loss": -23.726112365722656, "global_step": 162327, "epoch": 1955} {"train_loss": -23.69968032836914, "global_step": 162328, "epoch": 1955} {"train_loss": -23.72543716430664, "global_step": 162329, "epoch": 1955} {"train_loss": -23.74494171142578, "global_step": 162330, "epoch": 1955} {"train_loss": -23.58594512939453, "global_step": 162331, "epoch": 1955} {"train_loss": -24.08133316040039, "global_step": 162332, "epoch": 1955} {"train_loss": -23.635129928588867, "global_step": 162333, "epoch": 1955} {"train_loss": -23.810728073120117, "global_step": 162334, "epoch": 1955} {"train_loss": -24.147571563720703, "global_step": 162335, "epoch": 1955} {"train_loss": -23.70969009399414, "global_step": 162336, "epoch": 1955} {"train_loss": -23.84569549560547, "global_step": 162337, "epoch": 1955} {"train_loss": -23.3005313873291, "global_step": 162338, "epoch": 1955} {"train_loss": -23.867027282714844, "global_step": 162339, "epoch": 1955} {"train_loss": -23.892553329467773, "global_step": 162340, "epoch": 1955} {"train_loss": -23.63410758972168, "global_step": 162341, "epoch": 1955} {"train_loss": -23.84926414489746, "global_step": 162342, "epoch": 1955} {"train_loss": -23.31532096862793, "global_step": 162343, "epoch": 1955} {"train_loss": -23.50342559814453, "global_step": 162344, "epoch": 1955} {"train_loss": -23.437484741210938, "global_step": 162345, "epoch": 1955} {"train_loss": -23.79865074157715, "global_step": 162346, "epoch": 1955} {"train_loss": -23.42627670104245, "global_step": 162347, "epoch": 1955, "val_loss": 6295405.5} {"train_loss": -22.791208267211914, "global_step": 162348, "epoch": 1956} {"train_loss": -22.54237937927246, "global_step": 162349, "epoch": 1956} {"train_loss": -22.872657775878906, "global_step": 162350, "epoch": 1956} {"train_loss": -22.755447387695312, "global_step": 162351, "epoch": 1956} {"train_loss": -22.807945251464844, "global_step": 162352, "epoch": 1956} {"train_loss": -23.109516143798828, "global_step": 162353, "epoch": 1956} {"train_loss": -22.737049102783203, "global_step": 162354, "epoch": 1956} {"train_loss": -23.175981521606445, "global_step": 162355, "epoch": 1956} {"train_loss": -23.47260093688965, "global_step": 162356, "epoch": 1956} {"train_loss": -23.0194034576416, "global_step": 162357, "epoch": 1956} {"train_loss": -23.043222427368164, "global_step": 162358, "epoch": 1956} {"train_loss": -23.614255905151367, "global_step": 162359, "epoch": 1956} {"train_loss": -22.83278465270996, "global_step": 162360, "epoch": 1956} {"train_loss": -23.168298721313477, "global_step": 162361, "epoch": 1956} {"train_loss": -23.043498992919922, "global_step": 162362, "epoch": 1956} {"train_loss": -23.32344627380371, "global_step": 162363, "epoch": 1956} {"train_loss": -23.311357498168945, "global_step": 162364, "epoch": 1956} {"train_loss": -23.49715232849121, "global_step": 162365, "epoch": 1956} {"train_loss": -23.472965240478516, "global_step": 162366, "epoch": 1956} {"train_loss": -23.510648727416992, "global_step": 162367, "epoch": 1956} {"train_loss": -23.140790939331055, "global_step": 162368, "epoch": 1956} {"train_loss": -23.81852149963379, "global_step": 162369, "epoch": 1956} {"train_loss": -23.659242630004883, "global_step": 162370, "epoch": 1956} {"train_loss": -23.491954803466797, "global_step": 162371, "epoch": 1956} {"train_loss": -23.53961181640625, "global_step": 162372, "epoch": 1956} {"train_loss": -23.748199462890625, "global_step": 162373, "epoch": 1956} {"train_loss": -23.59394645690918, "global_step": 162374, "epoch": 1956} {"train_loss": -23.581737518310547, "global_step": 162375, "epoch": 1956} {"train_loss": -23.235809326171875, "global_step": 162376, "epoch": 1956} {"train_loss": -23.511035919189453, "global_step": 162377, "epoch": 1956} {"train_loss": -23.73714828491211, "global_step": 162378, "epoch": 1956} {"train_loss": -23.763839721679688, "global_step": 162379, "epoch": 1956} {"train_loss": -23.72900390625, "global_step": 162380, "epoch": 1956} {"train_loss": -23.770809173583984, "global_step": 162381, "epoch": 1956} {"train_loss": -23.586551666259766, "global_step": 162382, "epoch": 1956} {"train_loss": -23.646093368530273, "global_step": 162383, "epoch": 1956} {"train_loss": -23.357328414916992, "global_step": 162384, "epoch": 1956} {"train_loss": -23.6392765045166, "global_step": 162385, "epoch": 1956} {"train_loss": -23.408174514770508, "global_step": 162386, "epoch": 1956} {"train_loss": -23.634057998657227, "global_step": 162387, "epoch": 1956} {"train_loss": -23.65937614440918, "global_step": 162388, "epoch": 1956} {"train_loss": -23.42986488342285, "global_step": 162389, "epoch": 1956} {"train_loss": -23.711334228515625, "global_step": 162390, "epoch": 1956} {"train_loss": -23.76226043701172, "global_step": 162391, "epoch": 1956} {"train_loss": -23.642154693603516, "global_step": 162392, "epoch": 1956} {"train_loss": -23.846899032592773, "global_step": 162393, "epoch": 1956} {"train_loss": -23.50596809387207, "global_step": 162394, "epoch": 1956} {"train_loss": -23.075199127197266, "global_step": 162395, "epoch": 1956} {"train_loss": -23.143308639526367, "global_step": 162396, "epoch": 1956} {"train_loss": -23.77406120300293, "global_step": 162397, "epoch": 1956} {"train_loss": -23.74043846130371, "global_step": 162398, "epoch": 1956} {"train_loss": -23.422576904296875, "global_step": 162399, "epoch": 1956} {"train_loss": -23.510910034179688, "global_step": 162400, "epoch": 1956} {"train_loss": -23.333465576171875, "global_step": 162401, "epoch": 1956} {"train_loss": -23.345645904541016, "global_step": 162402, "epoch": 1956} {"train_loss": -23.8155517578125, "global_step": 162403, "epoch": 1956} {"train_loss": -23.656421661376953, "global_step": 162404, "epoch": 1956} {"train_loss": -23.564855575561523, "global_step": 162405, "epoch": 1956} {"train_loss": -23.70900535583496, "global_step": 162406, "epoch": 1956} {"train_loss": -23.72379493713379, "global_step": 162407, "epoch": 1956} {"train_loss": -23.54457664489746, "global_step": 162408, "epoch": 1956} {"train_loss": -23.518451690673828, "global_step": 162409, "epoch": 1956} {"train_loss": -23.668216705322266, "global_step": 162410, "epoch": 1956} {"train_loss": -23.5888671875, "global_step": 162411, "epoch": 1956} {"train_loss": -23.643949508666992, "global_step": 162412, "epoch": 1956} {"train_loss": -23.500600814819336, "global_step": 162413, "epoch": 1956} {"train_loss": -23.432008743286133, "global_step": 162414, "epoch": 1956} {"train_loss": -23.646286010742188, "global_step": 162415, "epoch": 1956} {"train_loss": -23.616491317749023, "global_step": 162416, "epoch": 1956} {"train_loss": -23.80152702331543, "global_step": 162417, "epoch": 1956} {"train_loss": -23.440866470336914, "global_step": 162418, "epoch": 1956} {"train_loss": -23.616811752319336, "global_step": 162419, "epoch": 1956} {"train_loss": -23.635955810546875, "global_step": 162420, "epoch": 1956} {"train_loss": -23.649866104125977, "global_step": 162421, "epoch": 1956} {"train_loss": -23.559097290039062, "global_step": 162422, "epoch": 1956} {"train_loss": -23.39904022216797, "global_step": 162423, "epoch": 1956} {"train_loss": -24.140104293823242, "global_step": 162424, "epoch": 1956} {"train_loss": -23.525617599487305, "global_step": 162425, "epoch": 1956} {"train_loss": -23.806013107299805, "global_step": 162426, "epoch": 1956} {"train_loss": -23.8539981842041, "global_step": 162427, "epoch": 1956} {"train_loss": -23.68988609313965, "global_step": 162428, "epoch": 1956} {"train_loss": -23.451461791992188, "global_step": 162429, "epoch": 1956} {"train_loss": -23.480110490178486, "global_step": 162430, "epoch": 1956, "val_loss": 6223922.0} {"train_loss": -23.30441665649414, "global_step": 162431, "epoch": 1957} {"train_loss": -22.374725341796875, "global_step": 162432, "epoch": 1957} {"train_loss": -22.741119384765625, "global_step": 162433, "epoch": 1957} {"train_loss": -22.820096969604492, "global_step": 162434, "epoch": 1957} {"train_loss": -23.00066375732422, "global_step": 162435, "epoch": 1957} {"train_loss": -22.801860809326172, "global_step": 162436, "epoch": 1957} {"train_loss": -22.937015533447266, "global_step": 162437, "epoch": 1957} {"train_loss": -23.1814022064209, "global_step": 162438, "epoch": 1957} {"train_loss": -22.835481643676758, "global_step": 162439, "epoch": 1957} {"train_loss": -23.329227447509766, "global_step": 162440, "epoch": 1957} {"train_loss": -22.979764938354492, "global_step": 162441, "epoch": 1957} {"train_loss": -23.370685577392578, "global_step": 162442, "epoch": 1957} {"train_loss": -23.590038299560547, "global_step": 162443, "epoch": 1957} {"train_loss": -22.915159225463867, "global_step": 162444, "epoch": 1957} {"train_loss": -23.229251861572266, "global_step": 162445, "epoch": 1957} {"train_loss": -23.34269142150879, "global_step": 162446, "epoch": 1957} {"train_loss": -23.166900634765625, "global_step": 162447, "epoch": 1957} {"train_loss": -23.285924911499023, "global_step": 162448, "epoch": 1957} {"train_loss": -22.960556030273438, "global_step": 162449, "epoch": 1957} {"train_loss": -23.18086814880371, "global_step": 162450, "epoch": 1957} {"train_loss": -23.3092041015625, "global_step": 162451, "epoch": 1957} {"train_loss": -23.240530014038086, "global_step": 162452, "epoch": 1957} {"train_loss": -23.37181282043457, "global_step": 162453, "epoch": 1957} {"train_loss": -23.12225914001465, "global_step": 162454, "epoch": 1957} {"train_loss": -23.08133888244629, "global_step": 162455, "epoch": 1957} {"train_loss": -23.5946102142334, "global_step": 162456, "epoch": 1957} {"train_loss": -23.247888565063477, "global_step": 162457, "epoch": 1957} {"train_loss": -23.093347549438477, "global_step": 162458, "epoch": 1957} {"train_loss": -23.202335357666016, "global_step": 162459, "epoch": 1957} {"train_loss": -23.193185806274414, "global_step": 162460, "epoch": 1957} {"train_loss": -23.358936309814453, "global_step": 162461, "epoch": 1957} {"train_loss": -23.0943546295166, "global_step": 162462, "epoch": 1957} {"train_loss": -23.26792335510254, "global_step": 162463, "epoch": 1957} {"train_loss": -23.703397750854492, "global_step": 162464, "epoch": 1957} {"train_loss": -23.233835220336914, "global_step": 162465, "epoch": 1957} {"train_loss": -23.61214256286621, "global_step": 162466, "epoch": 1957} {"train_loss": -23.55988883972168, "global_step": 162467, "epoch": 1957} {"train_loss": -23.417354583740234, "global_step": 162468, "epoch": 1957} {"train_loss": -23.375001907348633, "global_step": 162469, "epoch": 1957} {"train_loss": -23.45665168762207, "global_step": 162470, "epoch": 1957} {"train_loss": -23.393095016479492, "global_step": 162471, "epoch": 1957} {"train_loss": -23.356361389160156, "global_step": 162472, "epoch": 1957} {"train_loss": -23.397369384765625, "global_step": 162473, "epoch": 1957} {"train_loss": -23.78726577758789, "global_step": 162474, "epoch": 1957} {"train_loss": -23.672582626342773, "global_step": 162475, "epoch": 1957} {"train_loss": -23.390838623046875, "global_step": 162476, "epoch": 1957} {"train_loss": -23.566312789916992, "global_step": 162477, "epoch": 1957} {"train_loss": -23.48999786376953, "global_step": 162478, "epoch": 1957} {"train_loss": -23.82135009765625, "global_step": 162479, "epoch": 1957} {"train_loss": -23.482458114624023, "global_step": 162480, "epoch": 1957} {"train_loss": -23.473657608032227, "global_step": 162481, "epoch": 1957} {"train_loss": -23.578706741333008, "global_step": 162482, "epoch": 1957} {"train_loss": -23.82771873474121, "global_step": 162483, "epoch": 1957} {"train_loss": -23.77541160583496, "global_step": 162484, "epoch": 1957} {"train_loss": -23.29935646057129, "global_step": 162485, "epoch": 1957} {"train_loss": -23.259672164916992, "global_step": 162486, "epoch": 1957} {"train_loss": -23.7285099029541, "global_step": 162487, "epoch": 1957} {"train_loss": -23.709518432617188, "global_step": 162488, "epoch": 1957} {"train_loss": -23.353635787963867, "global_step": 162489, "epoch": 1957} {"train_loss": -23.149429321289062, "global_step": 162490, "epoch": 1957} {"train_loss": -23.275381088256836, "global_step": 162491, "epoch": 1957} {"train_loss": -23.370288848876953, "global_step": 162492, "epoch": 1957} {"train_loss": -23.10984992980957, "global_step": 162493, "epoch": 1957} {"train_loss": -23.183626174926758, "global_step": 162494, "epoch": 1957} {"train_loss": -23.45301628112793, "global_step": 162495, "epoch": 1957} {"train_loss": -23.20387077331543, "global_step": 162496, "epoch": 1957} {"train_loss": -23.517972946166992, "global_step": 162497, "epoch": 1957} {"train_loss": -23.200532913208008, "global_step": 162498, "epoch": 1957} {"train_loss": -23.09281349182129, "global_step": 162499, "epoch": 1957} {"train_loss": -23.759580612182617, "global_step": 162500, "epoch": 1957} {"train_loss": -23.403879165649414, "global_step": 162501, "epoch": 1957} {"train_loss": -23.367753982543945, "global_step": 162502, "epoch": 1957} {"train_loss": -23.038312911987305, "global_step": 162503, "epoch": 1957} {"train_loss": -22.958539962768555, "global_step": 162504, "epoch": 1957} {"train_loss": -23.826610565185547, "global_step": 162505, "epoch": 1957} {"train_loss": -23.655332565307617, "global_step": 162506, "epoch": 1957} {"train_loss": -23.320362091064453, "global_step": 162507, "epoch": 1957} {"train_loss": -23.79022216796875, "global_step": 162508, "epoch": 1957} {"train_loss": -23.515195846557617, "global_step": 162509, "epoch": 1957} {"train_loss": -23.68580436706543, "global_step": 162510, "epoch": 1957} {"train_loss": -23.268146514892578, "global_step": 162511, "epoch": 1957} {"train_loss": -23.665430068969727, "global_step": 162512, "epoch": 1957} {"train_loss": -23.320885623794005, "global_step": 162513, "epoch": 1957, "val_loss": 6349084.5} {"train_loss": -23.032291412353516, "global_step": 162514, "epoch": 1958} {"train_loss": -23.26215934753418, "global_step": 162515, "epoch": 1958} {"train_loss": -23.242733001708984, "global_step": 162516, "epoch": 1958} {"train_loss": -23.23281478881836, "global_step": 162517, "epoch": 1958} {"train_loss": -22.97254180908203, "global_step": 162518, "epoch": 1958} {"train_loss": -23.529190063476562, "global_step": 162519, "epoch": 1958} {"train_loss": -23.269968032836914, "global_step": 162520, "epoch": 1958} {"train_loss": -23.27349853515625, "global_step": 162521, "epoch": 1958} {"train_loss": -23.35651397705078, "global_step": 162522, "epoch": 1958} {"train_loss": -23.683252334594727, "global_step": 162523, "epoch": 1958} {"train_loss": -23.34659194946289, "global_step": 162524, "epoch": 1958} {"train_loss": -23.37860679626465, "global_step": 162525, "epoch": 1958} {"train_loss": -23.57107925415039, "global_step": 162526, "epoch": 1958} {"train_loss": -23.75352668762207, "global_step": 162527, "epoch": 1958} {"train_loss": -23.284543991088867, "global_step": 162528, "epoch": 1958} {"train_loss": -23.134693145751953, "global_step": 162529, "epoch": 1958} {"train_loss": -23.40724754333496, "global_step": 162530, "epoch": 1958} {"train_loss": -23.426605224609375, "global_step": 162531, "epoch": 1958} {"train_loss": -23.819416046142578, "global_step": 162532, "epoch": 1958} {"train_loss": -23.334701538085938, "global_step": 162533, "epoch": 1958} {"train_loss": -23.48952293395996, "global_step": 162534, "epoch": 1958} {"train_loss": -23.261926651000977, "global_step": 162535, "epoch": 1958} {"train_loss": -23.493131637573242, "global_step": 162536, "epoch": 1958} {"train_loss": -23.660608291625977, "global_step": 162537, "epoch": 1958} {"train_loss": -23.645706176757812, "global_step": 162538, "epoch": 1958} {"train_loss": -23.33115005493164, "global_step": 162539, "epoch": 1958} {"train_loss": -23.723876953125, "global_step": 162540, "epoch": 1958} {"train_loss": -23.229127883911133, "global_step": 162541, "epoch": 1958} {"train_loss": -23.222326278686523, "global_step": 162542, "epoch": 1958} {"train_loss": -23.827978134155273, "global_step": 162543, "epoch": 1958} {"train_loss": -23.509885787963867, "global_step": 162544, "epoch": 1958} {"train_loss": -23.95147132873535, "global_step": 162545, "epoch": 1958} {"train_loss": -23.704736709594727, "global_step": 162546, "epoch": 1958} {"train_loss": -23.490964889526367, "global_step": 162547, "epoch": 1958} {"train_loss": -23.74271011352539, "global_step": 162548, "epoch": 1958} {"train_loss": -23.226490020751953, "global_step": 162549, "epoch": 1958} {"train_loss": -23.555143356323242, "global_step": 162550, "epoch": 1958} {"train_loss": -23.46708106994629, "global_step": 162551, "epoch": 1958} {"train_loss": -23.677942276000977, "global_step": 162552, "epoch": 1958} {"train_loss": -23.572589874267578, "global_step": 162553, "epoch": 1958} {"train_loss": -23.734460830688477, "global_step": 162554, "epoch": 1958} {"train_loss": -23.94386863708496, "global_step": 162555, "epoch": 1958} {"train_loss": -23.56589126586914, "global_step": 162556, "epoch": 1958} {"train_loss": -23.305408477783203, "global_step": 162557, "epoch": 1958} {"train_loss": -23.46222496032715, "global_step": 162558, "epoch": 1958} {"train_loss": -23.475162506103516, "global_step": 162559, "epoch": 1958} {"train_loss": -23.49064826965332, "global_step": 162560, "epoch": 1958} {"train_loss": -24.021799087524414, "global_step": 162561, "epoch": 1958} {"train_loss": -23.64020347595215, "global_step": 162562, "epoch": 1958} {"train_loss": -23.715944290161133, "global_step": 162563, "epoch": 1958} {"train_loss": -23.719898223876953, "global_step": 162564, "epoch": 1958} {"train_loss": -23.306039810180664, "global_step": 162565, "epoch": 1958} {"train_loss": -23.87505531311035, "global_step": 162566, "epoch": 1958} {"train_loss": -23.754764556884766, "global_step": 162567, "epoch": 1958} {"train_loss": -23.69407844543457, "global_step": 162568, "epoch": 1958} {"train_loss": -23.762691497802734, "global_step": 162569, "epoch": 1958} {"train_loss": -23.508216857910156, "global_step": 162570, "epoch": 1958} {"train_loss": -23.581207275390625, "global_step": 162571, "epoch": 1958} {"train_loss": -23.47991371154785, "global_step": 162572, "epoch": 1958} {"train_loss": -23.74432945251465, "global_step": 162573, "epoch": 1958} {"train_loss": -23.61695671081543, "global_step": 162574, "epoch": 1958} {"train_loss": -23.16636085510254, "global_step": 162575, "epoch": 1958} {"train_loss": -23.22761344909668, "global_step": 162576, "epoch": 1958} {"train_loss": -23.134611129760742, "global_step": 162577, "epoch": 1958} {"train_loss": -23.273630142211914, "global_step": 162578, "epoch": 1958} {"train_loss": -23.36203384399414, "global_step": 162579, "epoch": 1958} {"train_loss": -23.92594337463379, "global_step": 162580, "epoch": 1958} {"train_loss": -23.509384155273438, "global_step": 162581, "epoch": 1958} {"train_loss": -23.085447311401367, "global_step": 162582, "epoch": 1958} {"train_loss": -23.461008071899414, "global_step": 162583, "epoch": 1958} {"train_loss": -23.555866241455078, "global_step": 162584, "epoch": 1958} {"train_loss": -23.845794677734375, "global_step": 162585, "epoch": 1958} {"train_loss": -23.616544723510742, "global_step": 162586, "epoch": 1958} {"train_loss": -23.95474624633789, "global_step": 162587, "epoch": 1958} {"train_loss": -23.611642837524414, "global_step": 162588, "epoch": 1958} {"train_loss": -23.687166213989258, "global_step": 162589, "epoch": 1958} {"train_loss": -23.980295181274414, "global_step": 162590, "epoch": 1958} {"train_loss": -23.3610897064209, "global_step": 162591, "epoch": 1958} {"train_loss": -23.54909324645996, "global_step": 162592, "epoch": 1958} {"train_loss": -23.203384399414062, "global_step": 162593, "epoch": 1958} {"train_loss": -23.226356506347656, "global_step": 162594, "epoch": 1958} {"train_loss": -23.4779052734375, "global_step": 162595, "epoch": 1958} {"train_loss": -23.51925741908062, "global_step": 162596, "epoch": 1958, "val_loss": 6392831.0} {"train_loss": -23.187103271484375, "global_step": 162597, "epoch": 1959} {"train_loss": -23.4683895111084, "global_step": 162598, "epoch": 1959} {"train_loss": -23.25873374938965, "global_step": 162599, "epoch": 1959} {"train_loss": -23.20937156677246, "global_step": 162600, "epoch": 1959} {"train_loss": -23.09321403503418, "global_step": 162601, "epoch": 1959} {"train_loss": -23.29973793029785, "global_step": 162602, "epoch": 1959} {"train_loss": -23.258005142211914, "global_step": 162603, "epoch": 1959} {"train_loss": -23.091697692871094, "global_step": 162604, "epoch": 1959} {"train_loss": -23.391355514526367, "global_step": 162605, "epoch": 1959} {"train_loss": -23.557580947875977, "global_step": 162606, "epoch": 1959} {"train_loss": -23.13273048400879, "global_step": 162607, "epoch": 1959} {"train_loss": -23.758161544799805, "global_step": 162608, "epoch": 1959} {"train_loss": -22.934219360351562, "global_step": 162609, "epoch": 1959} {"train_loss": -23.119089126586914, "global_step": 162610, "epoch": 1959} {"train_loss": -23.141624450683594, "global_step": 162611, "epoch": 1959} {"train_loss": -23.37879753112793, "global_step": 162612, "epoch": 1959} {"train_loss": -23.39128875732422, "global_step": 162613, "epoch": 1959} {"train_loss": -23.530868530273438, "global_step": 162614, "epoch": 1959} {"train_loss": -23.54878807067871, "global_step": 162615, "epoch": 1959} {"train_loss": -24.03887176513672, "global_step": 162616, "epoch": 1959} {"train_loss": -23.819046020507812, "global_step": 162617, "epoch": 1959} {"train_loss": -23.700481414794922, "global_step": 162618, "epoch": 1959} {"train_loss": -23.166101455688477, "global_step": 162619, "epoch": 1959} {"train_loss": -23.690139770507812, "global_step": 162620, "epoch": 1959} {"train_loss": -23.546499252319336, "global_step": 162621, "epoch": 1959} {"train_loss": -23.4390869140625, "global_step": 162622, "epoch": 1959} {"train_loss": -23.89822769165039, "global_step": 162623, "epoch": 1959} {"train_loss": -23.44379997253418, "global_step": 162624, "epoch": 1959} {"train_loss": -23.372312545776367, "global_step": 162625, "epoch": 1959} {"train_loss": -23.392210006713867, "global_step": 162626, "epoch": 1959} {"train_loss": -23.54547691345215, "global_step": 162627, "epoch": 1959} {"train_loss": -23.69453239440918, "global_step": 162628, "epoch": 1959} {"train_loss": -23.425405502319336, "global_step": 162629, "epoch": 1959} {"train_loss": -23.301883697509766, "global_step": 162630, "epoch": 1959} {"train_loss": -23.70941162109375, "global_step": 162631, "epoch": 1959} {"train_loss": -23.46018409729004, "global_step": 162632, "epoch": 1959} {"train_loss": -23.748868942260742, "global_step": 162633, "epoch": 1959} {"train_loss": -23.439590454101562, "global_step": 162634, "epoch": 1959} {"train_loss": -23.803356170654297, "global_step": 162635, "epoch": 1959} {"train_loss": -23.442487716674805, "global_step": 162636, "epoch": 1959} {"train_loss": -23.351999282836914, "global_step": 162637, "epoch": 1959} {"train_loss": -23.556386947631836, "global_step": 162638, "epoch": 1959} {"train_loss": -23.535663604736328, "global_step": 162639, "epoch": 1959} {"train_loss": -23.819660186767578, "global_step": 162640, "epoch": 1959} {"train_loss": -24.00359535217285, "global_step": 162641, "epoch": 1959} {"train_loss": -23.0223445892334, "global_step": 162642, "epoch": 1959} {"train_loss": -22.893190383911133, "global_step": 162643, "epoch": 1959} {"train_loss": -23.153465270996094, "global_step": 162644, "epoch": 1959} {"train_loss": -23.548364639282227, "global_step": 162645, "epoch": 1959} {"train_loss": -23.070465087890625, "global_step": 162646, "epoch": 1959} {"train_loss": -23.717985153198242, "global_step": 162647, "epoch": 1959} {"train_loss": -23.3372859954834, "global_step": 162648, "epoch": 1959} {"train_loss": -23.452558517456055, "global_step": 162649, "epoch": 1959} {"train_loss": -23.329328536987305, "global_step": 162650, "epoch": 1959} {"train_loss": -23.406110763549805, "global_step": 162651, "epoch": 1959} {"train_loss": -23.079771041870117, "global_step": 162652, "epoch": 1959} {"train_loss": -23.4830265045166, "global_step": 162653, "epoch": 1959} {"train_loss": -23.387481689453125, "global_step": 162654, "epoch": 1959} {"train_loss": -23.174911499023438, "global_step": 162655, "epoch": 1959} {"train_loss": -23.722272872924805, "global_step": 162656, "epoch": 1959} {"train_loss": -23.17045783996582, "global_step": 162657, "epoch": 1959} {"train_loss": -23.481327056884766, "global_step": 162658, "epoch": 1959} {"train_loss": -23.79683494567871, "global_step": 162659, "epoch": 1959} {"train_loss": -23.602325439453125, "global_step": 162660, "epoch": 1959} {"train_loss": -23.44063377380371, "global_step": 162661, "epoch": 1959} {"train_loss": -23.692197799682617, "global_step": 162662, "epoch": 1959} {"train_loss": -23.52388572692871, "global_step": 162663, "epoch": 1959} {"train_loss": -23.866180419921875, "global_step": 162664, "epoch": 1959} {"train_loss": -23.96637535095215, "global_step": 162665, "epoch": 1959} {"train_loss": -23.580547332763672, "global_step": 162666, "epoch": 1959} {"train_loss": -23.745468139648438, "global_step": 162667, "epoch": 1959} {"train_loss": -23.4622859954834, "global_step": 162668, "epoch": 1959} {"train_loss": -23.722631454467773, "global_step": 162669, "epoch": 1959} {"train_loss": -23.57553482055664, "global_step": 162670, "epoch": 1959} {"train_loss": -23.721797943115234, "global_step": 162671, "epoch": 1959} {"train_loss": -23.609128952026367, "global_step": 162672, "epoch": 1959} {"train_loss": -23.950225830078125, "global_step": 162673, "epoch": 1959} {"train_loss": -23.357954025268555, "global_step": 162674, "epoch": 1959} {"train_loss": -23.55893898010254, "global_step": 162675, "epoch": 1959} {"train_loss": -23.40650749206543, "global_step": 162676, "epoch": 1959} {"train_loss": -23.700103759765625, "global_step": 162677, "epoch": 1959} {"train_loss": -23.773344039916992, "global_step": 162678, "epoch": 1959} {"train_loss": -23.487440316073865, "global_step": 162679, "epoch": 1959, "val_loss": 6387932.0} {"train_loss": -23.048261642456055, "global_step": 162680, "epoch": 1960} {"train_loss": -22.62257957458496, "global_step": 162681, "epoch": 1960} {"train_loss": -22.880308151245117, "global_step": 162682, "epoch": 1960} {"train_loss": -23.25382423400879, "global_step": 162683, "epoch": 1960} {"train_loss": -22.978748321533203, "global_step": 162684, "epoch": 1960} {"train_loss": -23.208932876586914, "global_step": 162685, "epoch": 1960} {"train_loss": -23.425987243652344, "global_step": 162686, "epoch": 1960} {"train_loss": -23.482547760009766, "global_step": 162687, "epoch": 1960} {"train_loss": -23.380762100219727, "global_step": 162688, "epoch": 1960} {"train_loss": -23.091623306274414, "global_step": 162689, "epoch": 1960} {"train_loss": -23.16737174987793, "global_step": 162690, "epoch": 1960} {"train_loss": -23.75699806213379, "global_step": 162691, "epoch": 1960} {"train_loss": -23.51409339904785, "global_step": 162692, "epoch": 1960} {"train_loss": -23.375532150268555, "global_step": 162693, "epoch": 1960} {"train_loss": -23.123228073120117, "global_step": 162694, "epoch": 1960} {"train_loss": -23.33222007751465, "global_step": 162695, "epoch": 1960} {"train_loss": -23.526399612426758, "global_step": 162696, "epoch": 1960} {"train_loss": -23.286014556884766, "global_step": 162697, "epoch": 1960} {"train_loss": -23.25092315673828, "global_step": 162698, "epoch": 1960} {"train_loss": -23.60463523864746, "global_step": 162699, "epoch": 1960} {"train_loss": -23.518659591674805, "global_step": 162700, "epoch": 1960} {"train_loss": -23.02667808532715, "global_step": 162701, "epoch": 1960} {"train_loss": -23.49994468688965, "global_step": 162702, "epoch": 1960} {"train_loss": -23.50272560119629, "global_step": 162703, "epoch": 1960} {"train_loss": -23.643070220947266, "global_step": 162704, "epoch": 1960} {"train_loss": -23.634687423706055, "global_step": 162705, "epoch": 1960} {"train_loss": -23.201358795166016, "global_step": 162706, "epoch": 1960} {"train_loss": -23.782384872436523, "global_step": 162707, "epoch": 1960} {"train_loss": -23.52740478515625, "global_step": 162708, "epoch": 1960} {"train_loss": -23.355270385742188, "global_step": 162709, "epoch": 1960} {"train_loss": -23.50383949279785, "global_step": 162710, "epoch": 1960} {"train_loss": -24.05181312561035, "global_step": 162711, "epoch": 1960} {"train_loss": -23.441564559936523, "global_step": 162712, "epoch": 1960} {"train_loss": -23.204294204711914, "global_step": 162713, "epoch": 1960} {"train_loss": -23.849441528320312, "global_step": 162714, "epoch": 1960} {"train_loss": -23.37270736694336, "global_step": 162715, "epoch": 1960} {"train_loss": -23.47836685180664, "global_step": 162716, "epoch": 1960} {"train_loss": -23.66408348083496, "global_step": 162717, "epoch": 1960} {"train_loss": -23.795820236206055, "global_step": 162718, "epoch": 1960} {"train_loss": -23.3955020904541, "global_step": 162719, "epoch": 1960} {"train_loss": -23.726455688476562, "global_step": 162720, "epoch": 1960} {"train_loss": -23.597225189208984, "global_step": 162721, "epoch": 1960} {"train_loss": -23.834413528442383, "global_step": 162722, "epoch": 1960} {"train_loss": -23.462804794311523, "global_step": 162723, "epoch": 1960} {"train_loss": -23.666330337524414, "global_step": 162724, "epoch": 1960} {"train_loss": -23.994922637939453, "global_step": 162725, "epoch": 1960} {"train_loss": -23.721603393554688, "global_step": 162726, "epoch": 1960} {"train_loss": -23.65179443359375, "global_step": 162727, "epoch": 1960} {"train_loss": -23.547727584838867, "global_step": 162728, "epoch": 1960} {"train_loss": -23.30928611755371, "global_step": 162729, "epoch": 1960} {"train_loss": -23.554733276367188, "global_step": 162730, "epoch": 1960} {"train_loss": -23.75791358947754, "global_step": 162731, "epoch": 1960} {"train_loss": -23.400407791137695, "global_step": 162732, "epoch": 1960} {"train_loss": -23.66877555847168, "global_step": 162733, "epoch": 1960} {"train_loss": -23.272323608398438, "global_step": 162734, "epoch": 1960} {"train_loss": -23.788692474365234, "global_step": 162735, "epoch": 1960} {"train_loss": -23.344709396362305, "global_step": 162736, "epoch": 1960} {"train_loss": -23.586774826049805, "global_step": 162737, "epoch": 1960} {"train_loss": -23.523529052734375, "global_step": 162738, "epoch": 1960} {"train_loss": -23.574750900268555, "global_step": 162739, "epoch": 1960} {"train_loss": -23.93195915222168, "global_step": 162740, "epoch": 1960} {"train_loss": -23.79103660583496, "global_step": 162741, "epoch": 1960} {"train_loss": -23.241119384765625, "global_step": 162742, "epoch": 1960} {"train_loss": -23.465757369995117, "global_step": 162743, "epoch": 1960} {"train_loss": -23.692054748535156, "global_step": 162744, "epoch": 1960} {"train_loss": -23.527685165405273, "global_step": 162745, "epoch": 1960} {"train_loss": -23.536720275878906, "global_step": 162746, "epoch": 1960} {"train_loss": -23.310461044311523, "global_step": 162747, "epoch": 1960} {"train_loss": -23.782367706298828, "global_step": 162748, "epoch": 1960} {"train_loss": -23.57172966003418, "global_step": 162749, "epoch": 1960} {"train_loss": -23.38030433654785, "global_step": 162750, "epoch": 1960} {"train_loss": -23.78030776977539, "global_step": 162751, "epoch": 1960} {"train_loss": -23.276525497436523, "global_step": 162752, "epoch": 1960} {"train_loss": -23.746479034423828, "global_step": 162753, "epoch": 1960} {"train_loss": -23.515316009521484, "global_step": 162754, "epoch": 1960} {"train_loss": -23.914316177368164, "global_step": 162755, "epoch": 1960} {"train_loss": -23.492292404174805, "global_step": 162756, "epoch": 1960} {"train_loss": -23.539047241210938, "global_step": 162757, "epoch": 1960} {"train_loss": -23.80438804626465, "global_step": 162758, "epoch": 1960} {"train_loss": -23.454912185668945, "global_step": 162759, "epoch": 1960} {"train_loss": -24.022642135620117, "global_step": 162760, "epoch": 1960} {"train_loss": -23.47475814819336, "global_step": 162761, "epoch": 1960} {"train_loss": -23.499135810208607, "global_step": 162762, "epoch": 1960, "val_loss": 6400058.0} {"train_loss": -23.484407424926758, "global_step": 162763, "epoch": 1961} {"train_loss": -23.15070152282715, "global_step": 162764, "epoch": 1961} {"train_loss": -23.477895736694336, "global_step": 162765, "epoch": 1961} {"train_loss": -23.223844528198242, "global_step": 162766, "epoch": 1961} {"train_loss": -23.42682647705078, "global_step": 162767, "epoch": 1961} {"train_loss": -23.233501434326172, "global_step": 162768, "epoch": 1961} {"train_loss": -23.50831413269043, "global_step": 162769, "epoch": 1961} {"train_loss": -23.710853576660156, "global_step": 162770, "epoch": 1961} {"train_loss": -23.244789123535156, "global_step": 162771, "epoch": 1961} {"train_loss": -23.297088623046875, "global_step": 162772, "epoch": 1961} {"train_loss": -22.827085494995117, "global_step": 162773, "epoch": 1961} {"train_loss": -23.345630645751953, "global_step": 162774, "epoch": 1961} {"train_loss": -23.39609146118164, "global_step": 162775, "epoch": 1961} {"train_loss": -23.278656005859375, "global_step": 162776, "epoch": 1961} {"train_loss": -23.42970085144043, "global_step": 162777, "epoch": 1961} {"train_loss": -23.594655990600586, "global_step": 162778, "epoch": 1961} {"train_loss": -23.545602798461914, "global_step": 162779, "epoch": 1961} {"train_loss": -23.64359474182129, "global_step": 162780, "epoch": 1961} {"train_loss": -23.217851638793945, "global_step": 162781, "epoch": 1961} {"train_loss": -23.90613555908203, "global_step": 162782, "epoch": 1961} {"train_loss": -23.41338539123535, "global_step": 162783, "epoch": 1961} {"train_loss": -23.375263214111328, "global_step": 162784, "epoch": 1961} {"train_loss": -23.055896759033203, "global_step": 162785, "epoch": 1961} {"train_loss": -23.46832847595215, "global_step": 162786, "epoch": 1961} {"train_loss": -23.461414337158203, "global_step": 162787, "epoch": 1961} {"train_loss": -23.37271499633789, "global_step": 162788, "epoch": 1961} {"train_loss": -23.262414932250977, "global_step": 162789, "epoch": 1961} {"train_loss": -23.500228881835938, "global_step": 162790, "epoch": 1961} {"train_loss": -23.288175582885742, "global_step": 162791, "epoch": 1961} {"train_loss": -23.263431549072266, "global_step": 162792, "epoch": 1961} {"train_loss": -23.8027400970459, "global_step": 162793, "epoch": 1961} {"train_loss": -23.53135108947754, "global_step": 162794, "epoch": 1961} {"train_loss": -23.468854904174805, "global_step": 162795, "epoch": 1961} {"train_loss": -23.7409725189209, "global_step": 162796, "epoch": 1961} {"train_loss": -23.61680793762207, "global_step": 162797, "epoch": 1961} {"train_loss": -23.72315788269043, "global_step": 162798, "epoch": 1961} {"train_loss": -23.908334732055664, "global_step": 162799, "epoch": 1961} {"train_loss": -23.61702537536621, "global_step": 162800, "epoch": 1961} {"train_loss": -23.497907638549805, "global_step": 162801, "epoch": 1961} {"train_loss": -23.546939849853516, "global_step": 162802, "epoch": 1961} {"train_loss": -23.54581069946289, "global_step": 162803, "epoch": 1961} {"train_loss": -23.75958251953125, "global_step": 162804, "epoch": 1961} {"train_loss": -23.170392990112305, "global_step": 162805, "epoch": 1961} {"train_loss": -23.63629913330078, "global_step": 162806, "epoch": 1961} {"train_loss": -23.74997901916504, "global_step": 162807, "epoch": 1961} {"train_loss": -23.428464889526367, "global_step": 162808, "epoch": 1961} {"train_loss": -23.58686637878418, "global_step": 162809, "epoch": 1961} {"train_loss": -23.584712982177734, "global_step": 162810, "epoch": 1961} {"train_loss": -23.48284149169922, "global_step": 162811, "epoch": 1961} {"train_loss": -23.65412139892578, "global_step": 162812, "epoch": 1961} {"train_loss": -23.466821670532227, "global_step": 162813, "epoch": 1961} {"train_loss": -23.421640396118164, "global_step": 162814, "epoch": 1961} {"train_loss": -23.847278594970703, "global_step": 162815, "epoch": 1961} {"train_loss": -23.74649429321289, "global_step": 162816, "epoch": 1961} {"train_loss": -23.569869995117188, "global_step": 162817, "epoch": 1961} {"train_loss": -24.095308303833008, "global_step": 162818, "epoch": 1961} {"train_loss": -23.534269332885742, "global_step": 162819, "epoch": 1961} {"train_loss": -23.67948341369629, "global_step": 162820, "epoch": 1961} {"train_loss": -23.29197120666504, "global_step": 162821, "epoch": 1961} {"train_loss": -24.080209732055664, "global_step": 162822, "epoch": 1961} {"train_loss": -23.372102737426758, "global_step": 162823, "epoch": 1961} {"train_loss": -23.32942008972168, "global_step": 162824, "epoch": 1961} {"train_loss": -23.472261428833008, "global_step": 162825, "epoch": 1961} {"train_loss": -23.516830444335938, "global_step": 162826, "epoch": 1961} {"train_loss": -23.532155990600586, "global_step": 162827, "epoch": 1961} {"train_loss": -23.567564010620117, "global_step": 162828, "epoch": 1961} {"train_loss": -23.256872177124023, "global_step": 162829, "epoch": 1961} {"train_loss": -23.69890785217285, "global_step": 162830, "epoch": 1961} {"train_loss": -23.51677703857422, "global_step": 162831, "epoch": 1961} {"train_loss": -23.4361515045166, "global_step": 162832, "epoch": 1961} {"train_loss": -23.538053512573242, "global_step": 162833, "epoch": 1961} {"train_loss": -23.850839614868164, "global_step": 162834, "epoch": 1961} {"train_loss": -23.62346076965332, "global_step": 162835, "epoch": 1961} {"train_loss": -23.631956100463867, "global_step": 162836, "epoch": 1961} {"train_loss": -23.165977478027344, "global_step": 162837, "epoch": 1961} {"train_loss": -23.626630783081055, "global_step": 162838, "epoch": 1961} {"train_loss": -23.7645206451416, "global_step": 162839, "epoch": 1961} {"train_loss": -23.322694778442383, "global_step": 162840, "epoch": 1961} {"train_loss": -23.757108688354492, "global_step": 162841, "epoch": 1961} {"train_loss": -23.852453231811523, "global_step": 162842, "epoch": 1961} {"train_loss": -23.361865997314453, "global_step": 162843, "epoch": 1961} {"train_loss": -23.552001953125, "global_step": 162844, "epoch": 1961} {"train_loss": -23.536346090845313, "global_step": 162845, "epoch": 1961, "val_loss": 6385593.0} {"train_loss": -23.061553955078125, "global_step": 162846, "epoch": 1962} {"train_loss": -22.979372024536133, "global_step": 162847, "epoch": 1962} {"train_loss": -23.29450798034668, "global_step": 162848, "epoch": 1962} {"train_loss": -23.64093589782715, "global_step": 162849, "epoch": 1962} {"train_loss": -23.3565731048584, "global_step": 162850, "epoch": 1962} {"train_loss": -23.098310470581055, "global_step": 162851, "epoch": 1962} {"train_loss": -23.698820114135742, "global_step": 162852, "epoch": 1962} {"train_loss": -23.345943450927734, "global_step": 162853, "epoch": 1962} {"train_loss": -22.810972213745117, "global_step": 162854, "epoch": 1962} {"train_loss": -23.586666107177734, "global_step": 162855, "epoch": 1962} {"train_loss": -23.18638038635254, "global_step": 162856, "epoch": 1962} {"train_loss": -23.459352493286133, "global_step": 162857, "epoch": 1962} {"train_loss": -23.073902130126953, "global_step": 162858, "epoch": 1962} {"train_loss": -23.10047721862793, "global_step": 162859, "epoch": 1962} {"train_loss": -23.02322769165039, "global_step": 162860, "epoch": 1962} {"train_loss": -22.99435806274414, "global_step": 162861, "epoch": 1962} {"train_loss": -23.419689178466797, "global_step": 162862, "epoch": 1962} {"train_loss": -23.414112091064453, "global_step": 162863, "epoch": 1962} {"train_loss": -23.433958053588867, "global_step": 162864, "epoch": 1962} {"train_loss": -23.346088409423828, "global_step": 162865, "epoch": 1962} {"train_loss": -23.474515914916992, "global_step": 162866, "epoch": 1962} {"train_loss": -23.453750610351562, "global_step": 162867, "epoch": 1962} {"train_loss": -23.268461227416992, "global_step": 162868, "epoch": 1962} {"train_loss": -23.501768112182617, "global_step": 162869, "epoch": 1962} {"train_loss": -23.48646354675293, "global_step": 162870, "epoch": 1962} {"train_loss": -23.490402221679688, "global_step": 162871, "epoch": 1962} {"train_loss": -23.4945011138916, "global_step": 162872, "epoch": 1962} {"train_loss": -23.50898551940918, "global_step": 162873, "epoch": 1962} {"train_loss": -23.538267135620117, "global_step": 162874, "epoch": 1962} {"train_loss": -23.437795639038086, "global_step": 162875, "epoch": 1962} {"train_loss": -23.25555419921875, "global_step": 162876, "epoch": 1962} {"train_loss": -23.58905601501465, "global_step": 162877, "epoch": 1962} {"train_loss": -23.517221450805664, "global_step": 162878, "epoch": 1962} {"train_loss": -23.620065689086914, "global_step": 162879, "epoch": 1962} {"train_loss": -23.469297409057617, "global_step": 162880, "epoch": 1962} {"train_loss": -23.517587661743164, "global_step": 162881, "epoch": 1962} {"train_loss": -23.4591121673584, "global_step": 162882, "epoch": 1962} {"train_loss": -23.38251304626465, "global_step": 162883, "epoch": 1962} {"train_loss": -23.55561637878418, "global_step": 162884, "epoch": 1962} {"train_loss": -24.073556900024414, "global_step": 162885, "epoch": 1962} {"train_loss": -23.46931266784668, "global_step": 162886, "epoch": 1962} {"train_loss": -23.536087036132812, "global_step": 162887, "epoch": 1962} {"train_loss": -23.583209991455078, "global_step": 162888, "epoch": 1962} {"train_loss": -23.61049461364746, "global_step": 162889, "epoch": 1962} {"train_loss": -23.4953670501709, "global_step": 162890, "epoch": 1962} {"train_loss": -23.343393325805664, "global_step": 162891, "epoch": 1962} {"train_loss": -23.870712280273438, "global_step": 162892, "epoch": 1962} {"train_loss": -23.2102108001709, "global_step": 162893, "epoch": 1962} {"train_loss": -23.82381248474121, "global_step": 162894, "epoch": 1962} {"train_loss": -23.686084747314453, "global_step": 162895, "epoch": 1962} {"train_loss": -23.762062072753906, "global_step": 162896, "epoch": 1962} {"train_loss": -23.76624870300293, "global_step": 162897, "epoch": 1962} {"train_loss": -23.70318603515625, "global_step": 162898, "epoch": 1962} {"train_loss": -23.675588607788086, "global_step": 162899, "epoch": 1962} {"train_loss": -23.825407028198242, "global_step": 162900, "epoch": 1962} {"train_loss": -23.52186393737793, "global_step": 162901, "epoch": 1962} {"train_loss": -23.47629165649414, "global_step": 162902, "epoch": 1962} {"train_loss": -23.42502784729004, "global_step": 162903, "epoch": 1962} {"train_loss": -23.123037338256836, "global_step": 162904, "epoch": 1962} {"train_loss": -23.57294273376465, "global_step": 162905, "epoch": 1962} {"train_loss": -23.928794860839844, "global_step": 162906, "epoch": 1962} {"train_loss": -23.546920776367188, "global_step": 162907, "epoch": 1962} {"train_loss": -23.56614875793457, "global_step": 162908, "epoch": 1962} {"train_loss": -23.48503875732422, "global_step": 162909, "epoch": 1962} {"train_loss": -23.68329429626465, "global_step": 162910, "epoch": 1962} {"train_loss": -23.4132137298584, "global_step": 162911, "epoch": 1962} {"train_loss": -23.451705932617188, "global_step": 162912, "epoch": 1962} {"train_loss": -23.347585678100586, "global_step": 162913, "epoch": 1962} {"train_loss": -23.78126335144043, "global_step": 162914, "epoch": 1962} {"train_loss": -23.377283096313477, "global_step": 162915, "epoch": 1962} {"train_loss": -23.873294830322266, "global_step": 162916, "epoch": 1962} {"train_loss": -23.137277603149414, "global_step": 162917, "epoch": 1962} {"train_loss": -23.624576568603516, "global_step": 162918, "epoch": 1962} {"train_loss": -23.50360679626465, "global_step": 162919, "epoch": 1962} {"train_loss": -23.654926300048828, "global_step": 162920, "epoch": 1962} {"train_loss": -23.255895614624023, "global_step": 162921, "epoch": 1962} {"train_loss": -23.543781280517578, "global_step": 162922, "epoch": 1962} {"train_loss": -23.437917709350586, "global_step": 162923, "epoch": 1962} {"train_loss": -23.796070098876953, "global_step": 162924, "epoch": 1962} {"train_loss": -23.937170028686523, "global_step": 162925, "epoch": 1962} {"train_loss": -23.895238876342773, "global_step": 162926, "epoch": 1962} {"train_loss": -23.66128158569336, "global_step": 162927, "epoch": 1962} {"train_loss": -23.475457134017024, "global_step": 162928, "epoch": 1962, "val_loss": 6270383.0} {"train_loss": -22.902631759643555, "global_step": 162929, "epoch": 1963} {"train_loss": -22.79766082763672, "global_step": 162930, "epoch": 1963} {"train_loss": -23.36382293701172, "global_step": 162931, "epoch": 1963} {"train_loss": -23.159297943115234, "global_step": 162932, "epoch": 1963} {"train_loss": -23.348356246948242, "global_step": 162933, "epoch": 1963} {"train_loss": -23.582090377807617, "global_step": 162934, "epoch": 1963} {"train_loss": -23.343198776245117, "global_step": 162935, "epoch": 1963} {"train_loss": -23.319482803344727, "global_step": 162936, "epoch": 1963} {"train_loss": -23.440969467163086, "global_step": 162937, "epoch": 1963} {"train_loss": -23.24033546447754, "global_step": 162938, "epoch": 1963} {"train_loss": -23.350072860717773, "global_step": 162939, "epoch": 1963} {"train_loss": -23.308395385742188, "global_step": 162940, "epoch": 1963} {"train_loss": -23.60926628112793, "global_step": 162941, "epoch": 1963} {"train_loss": -23.296606063842773, "global_step": 162942, "epoch": 1963} {"train_loss": -23.530609130859375, "global_step": 162943, "epoch": 1963} {"train_loss": -23.28289031982422, "global_step": 162944, "epoch": 1963} {"train_loss": -23.328519821166992, "global_step": 162945, "epoch": 1963} {"train_loss": -23.433874130249023, "global_step": 162946, "epoch": 1963} {"train_loss": -23.323394775390625, "global_step": 162947, "epoch": 1963} {"train_loss": -23.050756454467773, "global_step": 162948, "epoch": 1963} {"train_loss": -23.61036491394043, "global_step": 162949, "epoch": 1963} {"train_loss": -23.282215118408203, "global_step": 162950, "epoch": 1963} {"train_loss": -23.377134323120117, "global_step": 162951, "epoch": 1963} {"train_loss": -23.458120346069336, "global_step": 162952, "epoch": 1963} {"train_loss": -23.495193481445312, "global_step": 162953, "epoch": 1963} {"train_loss": -23.25386619567871, "global_step": 162954, "epoch": 1963} {"train_loss": -23.76702308654785, "global_step": 162955, "epoch": 1963} {"train_loss": -23.540077209472656, "global_step": 162956, "epoch": 1963} {"train_loss": -23.40582847595215, "global_step": 162957, "epoch": 1963} {"train_loss": -23.584299087524414, "global_step": 162958, "epoch": 1963} {"train_loss": -23.4984073638916, "global_step": 162959, "epoch": 1963} {"train_loss": -23.689626693725586, "global_step": 162960, "epoch": 1963} {"train_loss": -23.596202850341797, "global_step": 162961, "epoch": 1963} {"train_loss": -23.5852108001709, "global_step": 162962, "epoch": 1963} {"train_loss": -23.538246154785156, "global_step": 162963, "epoch": 1963} {"train_loss": -23.4005184173584, "global_step": 162964, "epoch": 1963} {"train_loss": -23.607574462890625, "global_step": 162965, "epoch": 1963} {"train_loss": -23.42795181274414, "global_step": 162966, "epoch": 1963} {"train_loss": -23.4301815032959, "global_step": 162967, "epoch": 1963} {"train_loss": -23.72701072692871, "global_step": 162968, "epoch": 1963} {"train_loss": -23.708372116088867, "global_step": 162969, "epoch": 1963} {"train_loss": -23.510663986206055, "global_step": 162970, "epoch": 1963} {"train_loss": -23.648672103881836, "global_step": 162971, "epoch": 1963} {"train_loss": -23.99538803100586, "global_step": 162972, "epoch": 1963} {"train_loss": -23.612213134765625, "global_step": 162973, "epoch": 1963} {"train_loss": -23.3983211517334, "global_step": 162974, "epoch": 1963} {"train_loss": -23.140830993652344, "global_step": 162975, "epoch": 1963} {"train_loss": -23.26947021484375, "global_step": 162976, "epoch": 1963} {"train_loss": -23.031347274780273, "global_step": 162977, "epoch": 1963} {"train_loss": -23.7521915435791, "global_step": 162978, "epoch": 1963} {"train_loss": -23.574148178100586, "global_step": 162979, "epoch": 1963} {"train_loss": -23.87605094909668, "global_step": 162980, "epoch": 1963} {"train_loss": -23.282760620117188, "global_step": 162981, "epoch": 1963} {"train_loss": -23.86493492126465, "global_step": 162982, "epoch": 1963} {"train_loss": -23.4940242767334, "global_step": 162983, "epoch": 1963} {"train_loss": -23.56201934814453, "global_step": 162984, "epoch": 1963} {"train_loss": -23.622211456298828, "global_step": 162985, "epoch": 1963} {"train_loss": -23.622121810913086, "global_step": 162986, "epoch": 1963} {"train_loss": -23.783348083496094, "global_step": 162987, "epoch": 1963} {"train_loss": -23.5291690826416, "global_step": 162988, "epoch": 1963} {"train_loss": -23.19544792175293, "global_step": 162989, "epoch": 1963} {"train_loss": -23.554401397705078, "global_step": 162990, "epoch": 1963} {"train_loss": -23.11882209777832, "global_step": 162991, "epoch": 1963} {"train_loss": -23.366403579711914, "global_step": 162992, "epoch": 1963} {"train_loss": -23.243549346923828, "global_step": 162993, "epoch": 1963} {"train_loss": -23.345178604125977, "global_step": 162994, "epoch": 1963} {"train_loss": -23.315082550048828, "global_step": 162995, "epoch": 1963} {"train_loss": -23.45216178894043, "global_step": 162996, "epoch": 1963} {"train_loss": -23.647945404052734, "global_step": 162997, "epoch": 1963} {"train_loss": -23.156095504760742, "global_step": 162998, "epoch": 1963} {"train_loss": -23.751243591308594, "global_step": 162999, "epoch": 1963} {"train_loss": -23.6993408203125, "global_step": 163000, "epoch": 1963} {"train_loss": -23.839008331298828, "global_step": 163001, "epoch": 1963} {"train_loss": -23.669193267822266, "global_step": 163002, "epoch": 1963} {"train_loss": -23.437864303588867, "global_step": 163003, "epoch": 1963} {"train_loss": -24.04810333251953, "global_step": 163004, "epoch": 1963} {"train_loss": -24.001388549804688, "global_step": 163005, "epoch": 1963} {"train_loss": -23.38472557067871, "global_step": 163006, "epoch": 1963} {"train_loss": -23.7800350189209, "global_step": 163007, "epoch": 1963} {"train_loss": -23.62470817565918, "global_step": 163008, "epoch": 1963} {"train_loss": -23.642139434814453, "global_step": 163009, "epoch": 1963} {"train_loss": -23.763874053955078, "global_step": 163010, "epoch": 1963} {"train_loss": -23.497707229062737, "global_step": 163011, "epoch": 1963, "val_loss": 6230390.0} {"train_loss": -23.23448371887207, "global_step": 163012, "epoch": 1964} {"train_loss": -23.3725528717041, "global_step": 163013, "epoch": 1964} {"train_loss": -23.409605026245117, "global_step": 163014, "epoch": 1964} {"train_loss": -23.484472274780273, "global_step": 163015, "epoch": 1964} {"train_loss": -23.198074340820312, "global_step": 163016, "epoch": 1964} {"train_loss": -23.492351531982422, "global_step": 163017, "epoch": 1964} {"train_loss": -23.39272117614746, "global_step": 163018, "epoch": 1964} {"train_loss": -23.78461265563965, "global_step": 163019, "epoch": 1964} {"train_loss": -23.587724685668945, "global_step": 163020, "epoch": 1964} {"train_loss": -23.310842514038086, "global_step": 163021, "epoch": 1964} {"train_loss": -23.433876037597656, "global_step": 163022, "epoch": 1964} {"train_loss": -23.47047996520996, "global_step": 163023, "epoch": 1964} {"train_loss": -23.8030948638916, "global_step": 163024, "epoch": 1964} {"train_loss": -23.463592529296875, "global_step": 163025, "epoch": 1964} {"train_loss": -23.23082733154297, "global_step": 163026, "epoch": 1964} {"train_loss": -23.372175216674805, "global_step": 163027, "epoch": 1964} {"train_loss": -23.29083824157715, "global_step": 163028, "epoch": 1964} {"train_loss": -23.412212371826172, "global_step": 163029, "epoch": 1964} {"train_loss": -23.442312240600586, "global_step": 163030, "epoch": 1964} {"train_loss": -23.635334014892578, "global_step": 163031, "epoch": 1964} {"train_loss": -23.519750595092773, "global_step": 163032, "epoch": 1964} {"train_loss": -23.61151695251465, "global_step": 163033, "epoch": 1964} {"train_loss": -23.62212371826172, "global_step": 163034, "epoch": 1964} {"train_loss": -23.343027114868164, "global_step": 163035, "epoch": 1964} {"train_loss": -23.642759323120117, "global_step": 163036, "epoch": 1964} {"train_loss": -23.611278533935547, "global_step": 163037, "epoch": 1964} {"train_loss": -23.874767303466797, "global_step": 163038, "epoch": 1964} {"train_loss": -23.945547103881836, "global_step": 163039, "epoch": 1964} {"train_loss": -23.30821418762207, "global_step": 163040, "epoch": 1964} {"train_loss": -23.890186309814453, "global_step": 163041, "epoch": 1964} {"train_loss": -23.558279037475586, "global_step": 163042, "epoch": 1964} {"train_loss": -23.612577438354492, "global_step": 163043, "epoch": 1964} {"train_loss": -23.57390594482422, "global_step": 163044, "epoch": 1964} {"train_loss": -23.5071964263916, "global_step": 163045, "epoch": 1964} {"train_loss": -23.544084548950195, "global_step": 163046, "epoch": 1964} {"train_loss": -23.398183822631836, "global_step": 163047, "epoch": 1964} {"train_loss": -23.852706909179688, "global_step": 163048, "epoch": 1964} {"train_loss": -23.672697067260742, "global_step": 163049, "epoch": 1964} {"train_loss": -23.283681869506836, "global_step": 163050, "epoch": 1964} {"train_loss": -23.223169326782227, "global_step": 163051, "epoch": 1964} {"train_loss": -23.94814109802246, "global_step": 163052, "epoch": 1964} {"train_loss": -23.569992065429688, "global_step": 163053, "epoch": 1964} {"train_loss": -23.257102966308594, "global_step": 163054, "epoch": 1964} {"train_loss": -23.79707145690918, "global_step": 163055, "epoch": 1964} {"train_loss": -23.24532127380371, "global_step": 163056, "epoch": 1964} {"train_loss": -23.748525619506836, "global_step": 163057, "epoch": 1964} {"train_loss": -23.083534240722656, "global_step": 163058, "epoch": 1964} {"train_loss": -23.731420516967773, "global_step": 163059, "epoch": 1964} {"train_loss": -23.134967803955078, "global_step": 163060, "epoch": 1964} {"train_loss": -23.405057907104492, "global_step": 163061, "epoch": 1964} {"train_loss": -23.4487361907959, "global_step": 163062, "epoch": 1964} {"train_loss": -23.735761642456055, "global_step": 163063, "epoch": 1964} {"train_loss": -23.4824275970459, "global_step": 163064, "epoch": 1964} {"train_loss": -23.529624938964844, "global_step": 163065, "epoch": 1964} {"train_loss": -23.294370651245117, "global_step": 163066, "epoch": 1964} {"train_loss": -23.520381927490234, "global_step": 163067, "epoch": 1964} {"train_loss": -23.557235717773438, "global_step": 163068, "epoch": 1964} {"train_loss": -23.835948944091797, "global_step": 163069, "epoch": 1964} {"train_loss": -23.721439361572266, "global_step": 163070, "epoch": 1964} {"train_loss": -23.537351608276367, "global_step": 163071, "epoch": 1964} {"train_loss": -23.430479049682617, "global_step": 163072, "epoch": 1964} {"train_loss": -23.594221115112305, "global_step": 163073, "epoch": 1964} {"train_loss": -23.363977432250977, "global_step": 163074, "epoch": 1964} {"train_loss": -23.576932907104492, "global_step": 163075, "epoch": 1964} {"train_loss": -23.737743377685547, "global_step": 163076, "epoch": 1964} {"train_loss": -23.402372360229492, "global_step": 163077, "epoch": 1964} {"train_loss": -23.93389892578125, "global_step": 163078, "epoch": 1964} {"train_loss": -23.33352279663086, "global_step": 163079, "epoch": 1964} {"train_loss": -23.804386138916016, "global_step": 163080, "epoch": 1964} {"train_loss": -23.842702865600586, "global_step": 163081, "epoch": 1964} {"train_loss": -23.502277374267578, "global_step": 163082, "epoch": 1964} {"train_loss": -23.901700973510742, "global_step": 163083, "epoch": 1964} {"train_loss": -23.478233337402344, "global_step": 163084, "epoch": 1964} {"train_loss": -23.511199951171875, "global_step": 163085, "epoch": 1964} {"train_loss": -23.54863929748535, "global_step": 163086, "epoch": 1964} {"train_loss": -23.1611385345459, "global_step": 163087, "epoch": 1964} {"train_loss": -23.480798721313477, "global_step": 163088, "epoch": 1964} {"train_loss": -23.808935165405273, "global_step": 163089, "epoch": 1964} {"train_loss": -23.382535934448242, "global_step": 163090, "epoch": 1964} {"train_loss": -23.570337295532227, "global_step": 163091, "epoch": 1964} {"train_loss": -23.72479820251465, "global_step": 163092, "epoch": 1964} {"train_loss": -23.34503173828125, "global_step": 163093, "epoch": 1964} {"train_loss": -23.55114946020655, "global_step": 163094, "epoch": 1964, "val_loss": 6347597.0} {"train_loss": -22.560300827026367, "global_step": 163095, "epoch": 1965} {"train_loss": -22.685964584350586, "global_step": 163096, "epoch": 1965} {"train_loss": -23.051050186157227, "global_step": 163097, "epoch": 1965} {"train_loss": -22.584980010986328, "global_step": 163098, "epoch": 1965} {"train_loss": -22.506317138671875, "global_step": 163099, "epoch": 1965} {"train_loss": -22.960498809814453, "global_step": 163100, "epoch": 1965} {"train_loss": -22.982934951782227, "global_step": 163101, "epoch": 1965} {"train_loss": -23.082761764526367, "global_step": 163102, "epoch": 1965} {"train_loss": -22.767093658447266, "global_step": 163103, "epoch": 1965} {"train_loss": -23.37532615661621, "global_step": 163104, "epoch": 1965} {"train_loss": -22.849140167236328, "global_step": 163105, "epoch": 1965} {"train_loss": -23.121789932250977, "global_step": 163106, "epoch": 1965} {"train_loss": -23.440038681030273, "global_step": 163107, "epoch": 1965} {"train_loss": -22.9211483001709, "global_step": 163108, "epoch": 1965} {"train_loss": -23.153793334960938, "global_step": 163109, "epoch": 1965} {"train_loss": -23.48061180114746, "global_step": 163110, "epoch": 1965} {"train_loss": -23.533206939697266, "global_step": 163111, "epoch": 1965} {"train_loss": -23.524343490600586, "global_step": 163112, "epoch": 1965} {"train_loss": -23.65497398376465, "global_step": 163113, "epoch": 1965} {"train_loss": -23.530668258666992, "global_step": 163114, "epoch": 1965} {"train_loss": -23.297475814819336, "global_step": 163115, "epoch": 1965} {"train_loss": -23.422710418701172, "global_step": 163116, "epoch": 1965} {"train_loss": -23.47305679321289, "global_step": 163117, "epoch": 1965} {"train_loss": -23.449405670166016, "global_step": 163118, "epoch": 1965} {"train_loss": -23.455093383789062, "global_step": 163119, "epoch": 1965} {"train_loss": -23.52312660217285, "global_step": 163120, "epoch": 1965} {"train_loss": -23.5601749420166, "global_step": 163121, "epoch": 1965} {"train_loss": -23.580488204956055, "global_step": 163122, "epoch": 1965} {"train_loss": -23.326704025268555, "global_step": 163123, "epoch": 1965} {"train_loss": -23.60151481628418, "global_step": 163124, "epoch": 1965} {"train_loss": -23.953388214111328, "global_step": 163125, "epoch": 1965} {"train_loss": -23.291044235229492, "global_step": 163126, "epoch": 1965} {"train_loss": -23.62862205505371, "global_step": 163127, "epoch": 1965} {"train_loss": -23.72760581970215, "global_step": 163128, "epoch": 1965} {"train_loss": -23.24427604675293, "global_step": 163129, "epoch": 1965} {"train_loss": -23.448575973510742, "global_step": 163130, "epoch": 1965} {"train_loss": -23.61907958984375, "global_step": 163131, "epoch": 1965} {"train_loss": -23.777700424194336, "global_step": 163132, "epoch": 1965} {"train_loss": -23.55458641052246, "global_step": 163133, "epoch": 1965} {"train_loss": -23.669801712036133, "global_step": 163134, "epoch": 1965} {"train_loss": -23.813373565673828, "global_step": 163135, "epoch": 1965} {"train_loss": -23.71834373474121, "global_step": 163136, "epoch": 1965} {"train_loss": -23.446752548217773, "global_step": 163137, "epoch": 1965} {"train_loss": -23.59882926940918, "global_step": 163138, "epoch": 1965} {"train_loss": -23.49688148498535, "global_step": 163139, "epoch": 1965} {"train_loss": -23.5709171295166, "global_step": 163140, "epoch": 1965} {"train_loss": -23.546167373657227, "global_step": 163141, "epoch": 1965} {"train_loss": -23.631328582763672, "global_step": 163142, "epoch": 1965} {"train_loss": -23.822769165039062, "global_step": 163143, "epoch": 1965} {"train_loss": -23.775869369506836, "global_step": 163144, "epoch": 1965} {"train_loss": -23.279245376586914, "global_step": 163145, "epoch": 1965} {"train_loss": -23.7293701171875, "global_step": 163146, "epoch": 1965} {"train_loss": -23.596147537231445, "global_step": 163147, "epoch": 1965} {"train_loss": -23.70975112915039, "global_step": 163148, "epoch": 1965} {"train_loss": -23.274049758911133, "global_step": 163149, "epoch": 1965} {"train_loss": -23.9612979888916, "global_step": 163150, "epoch": 1965} {"train_loss": -23.499649047851562, "global_step": 163151, "epoch": 1965} {"train_loss": -23.620664596557617, "global_step": 163152, "epoch": 1965} {"train_loss": -23.615633010864258, "global_step": 163153, "epoch": 1965} {"train_loss": -23.311609268188477, "global_step": 163154, "epoch": 1965} {"train_loss": -23.898208618164062, "global_step": 163155, "epoch": 1965} {"train_loss": -23.51009178161621, "global_step": 163156, "epoch": 1965} {"train_loss": -23.602514266967773, "global_step": 163157, "epoch": 1965} {"train_loss": -23.325992584228516, "global_step": 163158, "epoch": 1965} {"train_loss": -23.713207244873047, "global_step": 163159, "epoch": 1965} {"train_loss": -23.281036376953125, "global_step": 163160, "epoch": 1965} {"train_loss": -23.510738372802734, "global_step": 163161, "epoch": 1965} {"train_loss": -23.148374557495117, "global_step": 163162, "epoch": 1965} {"train_loss": -23.77616310119629, "global_step": 163163, "epoch": 1965} {"train_loss": -23.38081932067871, "global_step": 163164, "epoch": 1965} {"train_loss": -23.189117431640625, "global_step": 163165, "epoch": 1965} {"train_loss": -22.650760650634766, "global_step": 163166, "epoch": 1965} {"train_loss": -23.298444747924805, "global_step": 163167, "epoch": 1965} {"train_loss": -23.869674682617188, "global_step": 163168, "epoch": 1965} {"train_loss": -23.62174415588379, "global_step": 163169, "epoch": 1965} {"train_loss": -23.247943878173828, "global_step": 163170, "epoch": 1965} {"train_loss": -23.936155319213867, "global_step": 163171, "epoch": 1965} {"train_loss": -23.64043426513672, "global_step": 163172, "epoch": 1965} {"train_loss": -23.604995727539062, "global_step": 163173, "epoch": 1965} {"train_loss": -23.687314987182617, "global_step": 163174, "epoch": 1965} {"train_loss": -23.718149185180664, "global_step": 163175, "epoch": 1965} {"train_loss": -23.939237594604492, "global_step": 163176, "epoch": 1965} {"train_loss": -23.4337628146252, "global_step": 163177, "epoch": 1965, "val_loss": 6360225.0} {"train_loss": -23.43280601501465, "global_step": 163178, "epoch": 1966} {"train_loss": -23.489768981933594, "global_step": 163179, "epoch": 1966} {"train_loss": -23.653696060180664, "global_step": 163180, "epoch": 1966} {"train_loss": -23.379648208618164, "global_step": 163181, "epoch": 1966} {"train_loss": -23.723907470703125, "global_step": 163182, "epoch": 1966} {"train_loss": -23.161117553710938, "global_step": 163183, "epoch": 1966} {"train_loss": -23.257871627807617, "global_step": 163184, "epoch": 1966} {"train_loss": -23.59110450744629, "global_step": 163185, "epoch": 1966} {"train_loss": -23.440942764282227, "global_step": 163186, "epoch": 1966} {"train_loss": -23.617176055908203, "global_step": 163187, "epoch": 1966} {"train_loss": -23.77505874633789, "global_step": 163188, "epoch": 1966} {"train_loss": -23.668670654296875, "global_step": 163189, "epoch": 1966} {"train_loss": -23.414045333862305, "global_step": 163190, "epoch": 1966} {"train_loss": -23.66763687133789, "global_step": 163191, "epoch": 1966} {"train_loss": -23.803302764892578, "global_step": 163192, "epoch": 1966} {"train_loss": -23.36518669128418, "global_step": 163193, "epoch": 1966} {"train_loss": -23.809938430786133, "global_step": 163194, "epoch": 1966} {"train_loss": -23.3115234375, "global_step": 163195, "epoch": 1966} {"train_loss": -23.61603355407715, "global_step": 163196, "epoch": 1966} {"train_loss": -23.3101749420166, "global_step": 163197, "epoch": 1966} {"train_loss": -23.651052474975586, "global_step": 163198, "epoch": 1966} {"train_loss": -23.36174964904785, "global_step": 163199, "epoch": 1966} {"train_loss": -23.731781005859375, "global_step": 163200, "epoch": 1966} {"train_loss": -23.74907684326172, "global_step": 163201, "epoch": 1966} {"train_loss": -23.924354553222656, "global_step": 163202, "epoch": 1966} {"train_loss": -23.612812042236328, "global_step": 163203, "epoch": 1966} {"train_loss": -23.70770263671875, "global_step": 163204, "epoch": 1966} {"train_loss": -23.145051956176758, "global_step": 163205, "epoch": 1966} {"train_loss": -23.91460609436035, "global_step": 163206, "epoch": 1966} {"train_loss": -23.3144588470459, "global_step": 163207, "epoch": 1966} {"train_loss": -22.854045867919922, "global_step": 163208, "epoch": 1966} {"train_loss": -23.613019943237305, "global_step": 163209, "epoch": 1966} {"train_loss": -23.470691680908203, "global_step": 163210, "epoch": 1966} {"train_loss": -23.895673751831055, "global_step": 163211, "epoch": 1966} {"train_loss": -23.48563003540039, "global_step": 163212, "epoch": 1966} {"train_loss": -23.771818161010742, "global_step": 163213, "epoch": 1966} {"train_loss": -23.050556182861328, "global_step": 163214, "epoch": 1966} {"train_loss": -23.74273109436035, "global_step": 163215, "epoch": 1966} {"train_loss": -23.492578506469727, "global_step": 163216, "epoch": 1966} {"train_loss": -23.414173126220703, "global_step": 163217, "epoch": 1966} {"train_loss": -23.651655197143555, "global_step": 163218, "epoch": 1966} {"train_loss": -23.775114059448242, "global_step": 163219, "epoch": 1966} {"train_loss": -23.504133224487305, "global_step": 163220, "epoch": 1966} {"train_loss": -23.71186637878418, "global_step": 163221, "epoch": 1966} {"train_loss": -23.42960548400879, "global_step": 163222, "epoch": 1966} {"train_loss": -23.967885971069336, "global_step": 163223, "epoch": 1966} {"train_loss": -23.515522003173828, "global_step": 163224, "epoch": 1966} {"train_loss": -23.44105339050293, "global_step": 163225, "epoch": 1966} {"train_loss": -23.651498794555664, "global_step": 163226, "epoch": 1966} {"train_loss": -23.29654884338379, "global_step": 163227, "epoch": 1966} {"train_loss": -23.293563842773438, "global_step": 163228, "epoch": 1966} {"train_loss": -23.336658477783203, "global_step": 163229, "epoch": 1966} {"train_loss": -23.416975021362305, "global_step": 163230, "epoch": 1966} {"train_loss": -23.516956329345703, "global_step": 163231, "epoch": 1966} {"train_loss": -23.529787063598633, "global_step": 163232, "epoch": 1966} {"train_loss": -23.864721298217773, "global_step": 163233, "epoch": 1966} {"train_loss": -23.401756286621094, "global_step": 163234, "epoch": 1966} {"train_loss": -23.367008209228516, "global_step": 163235, "epoch": 1966} {"train_loss": -23.682958602905273, "global_step": 163236, "epoch": 1966} {"train_loss": -23.48036003112793, "global_step": 163237, "epoch": 1966} {"train_loss": -23.478660583496094, "global_step": 163238, "epoch": 1966} {"train_loss": -23.365121841430664, "global_step": 163239, "epoch": 1966} {"train_loss": -23.325407028198242, "global_step": 163240, "epoch": 1966} {"train_loss": -23.33295249938965, "global_step": 163241, "epoch": 1966} {"train_loss": -23.42641258239746, "global_step": 163242, "epoch": 1966} {"train_loss": -23.78183937072754, "global_step": 163243, "epoch": 1966} {"train_loss": -23.727697372436523, "global_step": 163244, "epoch": 1966} {"train_loss": -23.512975692749023, "global_step": 163245, "epoch": 1966} {"train_loss": -23.161392211914062, "global_step": 163246, "epoch": 1966} {"train_loss": -23.669950485229492, "global_step": 163247, "epoch": 1966} {"train_loss": -23.660531997680664, "global_step": 163248, "epoch": 1966} {"train_loss": -23.675371170043945, "global_step": 163249, "epoch": 1966} {"train_loss": -23.23331642150879, "global_step": 163250, "epoch": 1966} {"train_loss": -23.684717178344727, "global_step": 163251, "epoch": 1966} {"train_loss": -23.95613670349121, "global_step": 163252, "epoch": 1966} {"train_loss": -23.30514907836914, "global_step": 163253, "epoch": 1966} {"train_loss": -23.14338493347168, "global_step": 163254, "epoch": 1966} {"train_loss": -23.29136085510254, "global_step": 163255, "epoch": 1966} {"train_loss": -23.32944107055664, "global_step": 163256, "epoch": 1966} {"train_loss": -23.389318466186523, "global_step": 163257, "epoch": 1966} {"train_loss": -23.596586227416992, "global_step": 163258, "epoch": 1966} {"train_loss": -23.418777465820312, "global_step": 163259, "epoch": 1966} {"train_loss": -23.522294722407697, "global_step": 163260, "epoch": 1966, "val_loss": 6415520.5} {"train_loss": -22.20710563659668, "global_step": 163261, "epoch": 1967} {"train_loss": -22.222614288330078, "global_step": 163262, "epoch": 1967} {"train_loss": -22.770156860351562, "global_step": 163263, "epoch": 1967} {"train_loss": -23.051929473876953, "global_step": 163264, "epoch": 1967} {"train_loss": -22.85743522644043, "global_step": 163265, "epoch": 1967} {"train_loss": -22.686635971069336, "global_step": 163266, "epoch": 1967} {"train_loss": -23.187925338745117, "global_step": 163267, "epoch": 1967} {"train_loss": -22.857084274291992, "global_step": 163268, "epoch": 1967} {"train_loss": -23.117856979370117, "global_step": 163269, "epoch": 1967} {"train_loss": -22.897375106811523, "global_step": 163270, "epoch": 1967} {"train_loss": -23.023189544677734, "global_step": 163271, "epoch": 1967} {"train_loss": -23.04819107055664, "global_step": 163272, "epoch": 1967} {"train_loss": -23.095579147338867, "global_step": 163273, "epoch": 1967} {"train_loss": -23.493940353393555, "global_step": 163274, "epoch": 1967} {"train_loss": -23.085296630859375, "global_step": 163275, "epoch": 1967} {"train_loss": -23.153308868408203, "global_step": 163276, "epoch": 1967} {"train_loss": -23.26247215270996, "global_step": 163277, "epoch": 1967} {"train_loss": -23.210187911987305, "global_step": 163278, "epoch": 1967} {"train_loss": -23.3983211517334, "global_step": 163279, "epoch": 1967} {"train_loss": -23.16947364807129, "global_step": 163280, "epoch": 1967} {"train_loss": -23.1464900970459, "global_step": 163281, "epoch": 1967} {"train_loss": -23.13623046875, "global_step": 163282, "epoch": 1967} {"train_loss": -23.253433227539062, "global_step": 163283, "epoch": 1967} {"train_loss": -23.363405227661133, "global_step": 163284, "epoch": 1967} {"train_loss": -23.145923614501953, "global_step": 163285, "epoch": 1967} {"train_loss": -23.59800148010254, "global_step": 163286, "epoch": 1967} {"train_loss": -23.55946922302246, "global_step": 163287, "epoch": 1967} {"train_loss": -23.0813045501709, "global_step": 163288, "epoch": 1967} {"train_loss": -23.544103622436523, "global_step": 163289, "epoch": 1967} {"train_loss": -23.55159568786621, "global_step": 163290, "epoch": 1967} {"train_loss": -23.50131607055664, "global_step": 163291, "epoch": 1967} {"train_loss": -23.496728897094727, "global_step": 163292, "epoch": 1967} {"train_loss": -23.82695198059082, "global_step": 163293, "epoch": 1967} {"train_loss": -23.769540786743164, "global_step": 163294, "epoch": 1967} {"train_loss": -23.462026596069336, "global_step": 163295, "epoch": 1967} {"train_loss": -23.511598587036133, "global_step": 163296, "epoch": 1967} {"train_loss": -23.2829647064209, "global_step": 163297, "epoch": 1967} {"train_loss": -23.419239044189453, "global_step": 163298, "epoch": 1967} {"train_loss": -23.674489974975586, "global_step": 163299, "epoch": 1967} {"train_loss": -23.498977661132812, "global_step": 163300, "epoch": 1967} {"train_loss": -23.7091064453125, "global_step": 163301, "epoch": 1967} {"train_loss": -23.587539672851562, "global_step": 163302, "epoch": 1967} {"train_loss": -23.842504501342773, "global_step": 163303, "epoch": 1967} {"train_loss": -23.589603424072266, "global_step": 163304, "epoch": 1967} {"train_loss": -23.491323471069336, "global_step": 163305, "epoch": 1967} {"train_loss": -23.76784324645996, "global_step": 163306, "epoch": 1967} {"train_loss": -23.7380428314209, "global_step": 163307, "epoch": 1967} {"train_loss": -23.670934677124023, "global_step": 163308, "epoch": 1967} {"train_loss": -23.64566421508789, "global_step": 163309, "epoch": 1967} {"train_loss": -23.564104080200195, "global_step": 163310, "epoch": 1967} {"train_loss": -23.845840454101562, "global_step": 163311, "epoch": 1967} {"train_loss": -23.59774398803711, "global_step": 163312, "epoch": 1967} {"train_loss": -23.49231719970703, "global_step": 163313, "epoch": 1967} {"train_loss": -23.902708053588867, "global_step": 163314, "epoch": 1967} {"train_loss": -23.714895248413086, "global_step": 163315, "epoch": 1967} {"train_loss": -23.58856773376465, "global_step": 163316, "epoch": 1967} {"train_loss": -23.275894165039062, "global_step": 163317, "epoch": 1967} {"train_loss": -23.58820152282715, "global_step": 163318, "epoch": 1967} {"train_loss": -23.405759811401367, "global_step": 163319, "epoch": 1967} {"train_loss": -23.74680519104004, "global_step": 163320, "epoch": 1967} {"train_loss": -23.575254440307617, "global_step": 163321, "epoch": 1967} {"train_loss": -23.83668327331543, "global_step": 163322, "epoch": 1967} {"train_loss": -23.47635841369629, "global_step": 163323, "epoch": 1967} {"train_loss": -23.832427978515625, "global_step": 163324, "epoch": 1967} {"train_loss": -23.7105770111084, "global_step": 163325, "epoch": 1967} {"train_loss": -23.52474021911621, "global_step": 163326, "epoch": 1967} {"train_loss": -23.4166316986084, "global_step": 163327, "epoch": 1967} {"train_loss": -23.47991371154785, "global_step": 163328, "epoch": 1967} {"train_loss": -23.416868209838867, "global_step": 163329, "epoch": 1967} {"train_loss": -23.816556930541992, "global_step": 163330, "epoch": 1967} {"train_loss": -23.691268920898438, "global_step": 163331, "epoch": 1967} {"train_loss": -23.721988677978516, "global_step": 163332, "epoch": 1967} {"train_loss": -23.677778244018555, "global_step": 163333, "epoch": 1967} {"train_loss": -23.81432342529297, "global_step": 163334, "epoch": 1967} {"train_loss": -23.169357299804688, "global_step": 163335, "epoch": 1967} {"train_loss": -23.719079971313477, "global_step": 163336, "epoch": 1967} {"train_loss": -23.50703239440918, "global_step": 163337, "epoch": 1967} {"train_loss": -23.309232711791992, "global_step": 163338, "epoch": 1967} {"train_loss": -23.898733139038086, "global_step": 163339, "epoch": 1967} {"train_loss": -23.776517868041992, "global_step": 163340, "epoch": 1967} {"train_loss": -23.775144577026367, "global_step": 163341, "epoch": 1967} {"train_loss": -23.4310302734375, "global_step": 163342, "epoch": 1967} {"train_loss": -23.427245840968855, "global_step": 163343, "epoch": 1967, "val_loss": 6270406.0} {"train_loss": -23.56839942932129, "global_step": 163344, "epoch": 1968} {"train_loss": -23.28365135192871, "global_step": 163345, "epoch": 1968} {"train_loss": -23.140422821044922, "global_step": 163346, "epoch": 1968} {"train_loss": -23.3841552734375, "global_step": 163347, "epoch": 1968} {"train_loss": -23.20564079284668, "global_step": 163348, "epoch": 1968} {"train_loss": -22.762582778930664, "global_step": 163349, "epoch": 1968} {"train_loss": -23.183095932006836, "global_step": 163350, "epoch": 1968} {"train_loss": -23.206932067871094, "global_step": 163351, "epoch": 1968} {"train_loss": -23.237510681152344, "global_step": 163352, "epoch": 1968} {"train_loss": -23.494192123413086, "global_step": 163353, "epoch": 1968} {"train_loss": -23.358991622924805, "global_step": 163354, "epoch": 1968} {"train_loss": -23.226882934570312, "global_step": 163355, "epoch": 1968} {"train_loss": -23.542694091796875, "global_step": 163356, "epoch": 1968} {"train_loss": -23.644943237304688, "global_step": 163357, "epoch": 1968} {"train_loss": -23.293363571166992, "global_step": 163358, "epoch": 1968} {"train_loss": -23.370471954345703, "global_step": 163359, "epoch": 1968} {"train_loss": -23.93403434753418, "global_step": 163360, "epoch": 1968} {"train_loss": -23.439544677734375, "global_step": 163361, "epoch": 1968} {"train_loss": -23.707910537719727, "global_step": 163362, "epoch": 1968} {"train_loss": -23.697519302368164, "global_step": 163363, "epoch": 1968} {"train_loss": -23.115772247314453, "global_step": 163364, "epoch": 1968} {"train_loss": -23.771848678588867, "global_step": 163365, "epoch": 1968} {"train_loss": -23.52465057373047, "global_step": 163366, "epoch": 1968} {"train_loss": -23.67821502685547, "global_step": 163367, "epoch": 1968} {"train_loss": -23.729467391967773, "global_step": 163368, "epoch": 1968} {"train_loss": -23.435901641845703, "global_step": 163369, "epoch": 1968} {"train_loss": -23.430959701538086, "global_step": 163370, "epoch": 1968} {"train_loss": -23.385723114013672, "global_step": 163371, "epoch": 1968} {"train_loss": -23.59442710876465, "global_step": 163372, "epoch": 1968} {"train_loss": -23.26206398010254, "global_step": 163373, "epoch": 1968} {"train_loss": -23.33000373840332, "global_step": 163374, "epoch": 1968} {"train_loss": -23.55140495300293, "global_step": 163375, "epoch": 1968} {"train_loss": -23.504440307617188, "global_step": 163376, "epoch": 1968} {"train_loss": -23.367677688598633, "global_step": 163377, "epoch": 1968} {"train_loss": -23.493635177612305, "global_step": 163378, "epoch": 1968} {"train_loss": -23.43377113342285, "global_step": 163379, "epoch": 1968} {"train_loss": -23.684791564941406, "global_step": 163380, "epoch": 1968} {"train_loss": -23.417970657348633, "global_step": 163381, "epoch": 1968} {"train_loss": -23.403085708618164, "global_step": 163382, "epoch": 1968} {"train_loss": -23.644371032714844, "global_step": 163383, "epoch": 1968} {"train_loss": -23.36285972595215, "global_step": 163384, "epoch": 1968} {"train_loss": -23.520736694335938, "global_step": 163385, "epoch": 1968} {"train_loss": -23.955352783203125, "global_step": 163386, "epoch": 1968} {"train_loss": -23.169696807861328, "global_step": 163387, "epoch": 1968} {"train_loss": -23.366382598876953, "global_step": 163388, "epoch": 1968} {"train_loss": -23.915973663330078, "global_step": 163389, "epoch": 1968} {"train_loss": -23.679664611816406, "global_step": 163390, "epoch": 1968} {"train_loss": -23.551904678344727, "global_step": 163391, "epoch": 1968} {"train_loss": -23.641109466552734, "global_step": 163392, "epoch": 1968} {"train_loss": -23.575769424438477, "global_step": 163393, "epoch": 1968} {"train_loss": -23.482168197631836, "global_step": 163394, "epoch": 1968} {"train_loss": -23.75492286682129, "global_step": 163395, "epoch": 1968} {"train_loss": -23.485326766967773, "global_step": 163396, "epoch": 1968} {"train_loss": -23.534805297851562, "global_step": 163397, "epoch": 1968} {"train_loss": -23.579788208007812, "global_step": 163398, "epoch": 1968} {"train_loss": -23.29457664489746, "global_step": 163399, "epoch": 1968} {"train_loss": -23.60564613342285, "global_step": 163400, "epoch": 1968} {"train_loss": -23.546669006347656, "global_step": 163401, "epoch": 1968} {"train_loss": -23.75865364074707, "global_step": 163402, "epoch": 1968} {"train_loss": -23.47031021118164, "global_step": 163403, "epoch": 1968} {"train_loss": -23.567270278930664, "global_step": 163404, "epoch": 1968} {"train_loss": -23.86275291442871, "global_step": 163405, "epoch": 1968} {"train_loss": -23.318265914916992, "global_step": 163406, "epoch": 1968} {"train_loss": -23.642597198486328, "global_step": 163407, "epoch": 1968} {"train_loss": -23.72073745727539, "global_step": 163408, "epoch": 1968} {"train_loss": -23.57432746887207, "global_step": 163409, "epoch": 1968} {"train_loss": -23.609636306762695, "global_step": 163410, "epoch": 1968} {"train_loss": -23.613588333129883, "global_step": 163411, "epoch": 1968} {"train_loss": -23.702104568481445, "global_step": 163412, "epoch": 1968} {"train_loss": -23.910812377929688, "global_step": 163413, "epoch": 1968} {"train_loss": -23.731170654296875, "global_step": 163414, "epoch": 1968} {"train_loss": -24.029281616210938, "global_step": 163415, "epoch": 1968} {"train_loss": -23.529949188232422, "global_step": 163416, "epoch": 1968} {"train_loss": -23.403980255126953, "global_step": 163417, "epoch": 1968} {"train_loss": -23.435861587524414, "global_step": 163418, "epoch": 1968} {"train_loss": -23.848852157592773, "global_step": 163419, "epoch": 1968} {"train_loss": -23.602659225463867, "global_step": 163420, "epoch": 1968} {"train_loss": -23.46864128112793, "global_step": 163421, "epoch": 1968} {"train_loss": -23.81938934326172, "global_step": 163422, "epoch": 1968} {"train_loss": -23.40651512145996, "global_step": 163423, "epoch": 1968} {"train_loss": -23.850778579711914, "global_step": 163424, "epoch": 1968} {"train_loss": -23.43428611755371, "global_step": 163425, "epoch": 1968} {"train_loss": -23.51481888093144, "global_step": 163426, "epoch": 1968, "val_loss": 6324529.0} {"train_loss": -23.136014938354492, "global_step": 163427, "epoch": 1969} {"train_loss": -22.74570655822754, "global_step": 163428, "epoch": 1969} {"train_loss": -22.370092391967773, "global_step": 163429, "epoch": 1969} {"train_loss": -23.398197174072266, "global_step": 163430, "epoch": 1969} {"train_loss": -22.654935836791992, "global_step": 163431, "epoch": 1969} {"train_loss": -23.316301345825195, "global_step": 163432, "epoch": 1969} {"train_loss": -23.065526962280273, "global_step": 163433, "epoch": 1969} {"train_loss": -23.356184005737305, "global_step": 163434, "epoch": 1969} {"train_loss": -22.739023208618164, "global_step": 163435, "epoch": 1969} {"train_loss": -23.03730583190918, "global_step": 163436, "epoch": 1969} {"train_loss": -23.270793914794922, "global_step": 163437, "epoch": 1969} {"train_loss": -22.794347763061523, "global_step": 163438, "epoch": 1969} {"train_loss": -23.469148635864258, "global_step": 163439, "epoch": 1969} {"train_loss": -23.524839401245117, "global_step": 163440, "epoch": 1969} {"train_loss": -23.45558738708496, "global_step": 163441, "epoch": 1969} {"train_loss": -22.844547271728516, "global_step": 163442, "epoch": 1969} {"train_loss": -23.316720962524414, "global_step": 163443, "epoch": 1969} {"train_loss": -23.22750473022461, "global_step": 163444, "epoch": 1969} {"train_loss": -23.214387893676758, "global_step": 163445, "epoch": 1969} {"train_loss": -23.41935157775879, "global_step": 163446, "epoch": 1969} {"train_loss": -23.401458740234375, "global_step": 163447, "epoch": 1969} {"train_loss": -23.179643630981445, "global_step": 163448, "epoch": 1969} {"train_loss": -23.359716415405273, "global_step": 163449, "epoch": 1969} {"train_loss": -23.104541778564453, "global_step": 163450, "epoch": 1969} {"train_loss": -23.393461227416992, "global_step": 163451, "epoch": 1969} {"train_loss": -23.34293556213379, "global_step": 163452, "epoch": 1969} {"train_loss": -23.086414337158203, "global_step": 163453, "epoch": 1969} {"train_loss": -23.333341598510742, "global_step": 163454, "epoch": 1969} {"train_loss": -23.43165397644043, "global_step": 163455, "epoch": 1969} {"train_loss": -23.58442497253418, "global_step": 163456, "epoch": 1969} {"train_loss": -23.61835479736328, "global_step": 163457, "epoch": 1969} {"train_loss": -23.681093215942383, "global_step": 163458, "epoch": 1969} {"train_loss": -23.369077682495117, "global_step": 163459, "epoch": 1969} {"train_loss": -23.42000961303711, "global_step": 163460, "epoch": 1969} {"train_loss": -23.3846492767334, "global_step": 163461, "epoch": 1969} {"train_loss": -23.458391189575195, "global_step": 163462, "epoch": 1969} {"train_loss": -23.570459365844727, "global_step": 163463, "epoch": 1969} {"train_loss": -23.29311752319336, "global_step": 163464, "epoch": 1969} {"train_loss": -23.909393310546875, "global_step": 163465, "epoch": 1969} {"train_loss": -23.73979377746582, "global_step": 163466, "epoch": 1969} {"train_loss": -23.467573165893555, "global_step": 163467, "epoch": 1969} {"train_loss": -23.619985580444336, "global_step": 163468, "epoch": 1969} {"train_loss": -23.37989616394043, "global_step": 163469, "epoch": 1969} {"train_loss": -23.853458404541016, "global_step": 163470, "epoch": 1969} {"train_loss": -23.6131649017334, "global_step": 163471, "epoch": 1969} {"train_loss": -23.602155685424805, "global_step": 163472, "epoch": 1969} {"train_loss": -23.3034610748291, "global_step": 163473, "epoch": 1969} {"train_loss": -23.348896026611328, "global_step": 163474, "epoch": 1969} {"train_loss": -23.528017044067383, "global_step": 163475, "epoch": 1969} {"train_loss": -23.499435424804688, "global_step": 163476, "epoch": 1969} {"train_loss": -23.57554054260254, "global_step": 163477, "epoch": 1969} {"train_loss": -23.52991485595703, "global_step": 163478, "epoch": 1969} {"train_loss": -23.96355628967285, "global_step": 163479, "epoch": 1969} {"train_loss": -23.477338790893555, "global_step": 163480, "epoch": 1969} {"train_loss": -23.2987117767334, "global_step": 163481, "epoch": 1969} {"train_loss": -23.667285919189453, "global_step": 163482, "epoch": 1969} {"train_loss": -23.6163272857666, "global_step": 163483, "epoch": 1969} {"train_loss": -23.603519439697266, "global_step": 163484, "epoch": 1969} {"train_loss": -23.940908432006836, "global_step": 163485, "epoch": 1969} {"train_loss": -23.647855758666992, "global_step": 163486, "epoch": 1969} {"train_loss": -23.544252395629883, "global_step": 163487, "epoch": 1969} {"train_loss": -23.711231231689453, "global_step": 163488, "epoch": 1969} {"train_loss": -23.569211959838867, "global_step": 163489, "epoch": 1969} {"train_loss": -23.96565055847168, "global_step": 163490, "epoch": 1969} {"train_loss": -23.672393798828125, "global_step": 163491, "epoch": 1969} {"train_loss": -23.74397850036621, "global_step": 163492, "epoch": 1969} {"train_loss": -23.1998348236084, "global_step": 163493, "epoch": 1969} {"train_loss": -23.88483238220215, "global_step": 163494, "epoch": 1969} {"train_loss": -23.628265380859375, "global_step": 163495, "epoch": 1969} {"train_loss": -24.05010414123535, "global_step": 163496, "epoch": 1969} {"train_loss": -23.644384384155273, "global_step": 163497, "epoch": 1969} {"train_loss": -23.507740020751953, "global_step": 163498, "epoch": 1969} {"train_loss": -23.698152542114258, "global_step": 163499, "epoch": 1969} {"train_loss": -23.646886825561523, "global_step": 163500, "epoch": 1969} {"train_loss": -23.79254150390625, "global_step": 163501, "epoch": 1969} {"train_loss": -23.575284957885742, "global_step": 163502, "epoch": 1969} {"train_loss": -23.860702514648438, "global_step": 163503, "epoch": 1969} {"train_loss": -23.613021850585938, "global_step": 163504, "epoch": 1969} {"train_loss": -23.598535537719727, "global_step": 163505, "epoch": 1969} {"train_loss": -23.658639907836914, "global_step": 163506, "epoch": 1969} {"train_loss": -23.496797561645508, "global_step": 163507, "epoch": 1969} {"train_loss": -23.521337509155273, "global_step": 163508, "epoch": 1969} {"train_loss": -23.44738075532109, "global_step": 163509, "epoch": 1969, "val_loss": 6418962.0} {"train_loss": -23.20924949645996, "global_step": 163510, "epoch": 1970} {"train_loss": -23.39700698852539, "global_step": 163511, "epoch": 1970} {"train_loss": -23.265893936157227, "global_step": 163512, "epoch": 1970} {"train_loss": -23.302295684814453, "global_step": 163513, "epoch": 1970} {"train_loss": -23.28021812438965, "global_step": 163514, "epoch": 1970} {"train_loss": -23.453065872192383, "global_step": 163515, "epoch": 1970} {"train_loss": -23.426708221435547, "global_step": 163516, "epoch": 1970} {"train_loss": -23.37708854675293, "global_step": 163517, "epoch": 1970} {"train_loss": -23.51215362548828, "global_step": 163518, "epoch": 1970} {"train_loss": -23.435853958129883, "global_step": 163519, "epoch": 1970} {"train_loss": -23.14349937438965, "global_step": 163520, "epoch": 1970} {"train_loss": -23.41813087463379, "global_step": 163521, "epoch": 1970} {"train_loss": -23.54251480102539, "global_step": 163522, "epoch": 1970} {"train_loss": -23.473840713500977, "global_step": 163523, "epoch": 1970} {"train_loss": -23.532148361206055, "global_step": 163524, "epoch": 1970} {"train_loss": -23.729427337646484, "global_step": 163525, "epoch": 1970} {"train_loss": -23.54169273376465, "global_step": 163526, "epoch": 1970} {"train_loss": -22.93490982055664, "global_step": 163527, "epoch": 1970} {"train_loss": -23.623111724853516, "global_step": 163528, "epoch": 1970} {"train_loss": -23.503660202026367, "global_step": 163529, "epoch": 1970} {"train_loss": -23.795902252197266, "global_step": 163530, "epoch": 1970} {"train_loss": -23.91042137145996, "global_step": 163531, "epoch": 1970} {"train_loss": -23.6181697845459, "global_step": 163532, "epoch": 1970} {"train_loss": -23.336164474487305, "global_step": 163533, "epoch": 1970} {"train_loss": -23.8142147064209, "global_step": 163534, "epoch": 1970} {"train_loss": -23.932249069213867, "global_step": 163535, "epoch": 1970} {"train_loss": -23.703359603881836, "global_step": 163536, "epoch": 1970} {"train_loss": -23.569456100463867, "global_step": 163537, "epoch": 1970} {"train_loss": -23.479740142822266, "global_step": 163538, "epoch": 1970} {"train_loss": -23.86862564086914, "global_step": 163539, "epoch": 1970} {"train_loss": -23.52349090576172, "global_step": 163540, "epoch": 1970} {"train_loss": -23.509323120117188, "global_step": 163541, "epoch": 1970} {"train_loss": -23.39340591430664, "global_step": 163542, "epoch": 1970} {"train_loss": -23.65951919555664, "global_step": 163543, "epoch": 1970} {"train_loss": -23.50872802734375, "global_step": 163544, "epoch": 1970} {"train_loss": -23.529630661010742, "global_step": 163545, "epoch": 1970} {"train_loss": -23.74835205078125, "global_step": 163546, "epoch": 1970} {"train_loss": -23.2634220123291, "global_step": 163547, "epoch": 1970} {"train_loss": -23.323476791381836, "global_step": 163548, "epoch": 1970} {"train_loss": -23.526330947875977, "global_step": 163549, "epoch": 1970} {"train_loss": -23.868179321289062, "global_step": 163550, "epoch": 1970} {"train_loss": -23.544336318969727, "global_step": 163551, "epoch": 1970} {"train_loss": -23.690204620361328, "global_step": 163552, "epoch": 1970} {"train_loss": -23.413724899291992, "global_step": 163553, "epoch": 1970} {"train_loss": -23.77128791809082, "global_step": 163554, "epoch": 1970} {"train_loss": -23.652568817138672, "global_step": 163555, "epoch": 1970} {"train_loss": -23.457178115844727, "global_step": 163556, "epoch": 1970} {"train_loss": -23.451950073242188, "global_step": 163557, "epoch": 1970} {"train_loss": -23.501768112182617, "global_step": 163558, "epoch": 1970} {"train_loss": -23.68123435974121, "global_step": 163559, "epoch": 1970} {"train_loss": -23.372512817382812, "global_step": 163560, "epoch": 1970} {"train_loss": -23.978612899780273, "global_step": 163561, "epoch": 1970} {"train_loss": -23.596113204956055, "global_step": 163562, "epoch": 1970} {"train_loss": -23.455190658569336, "global_step": 163563, "epoch": 1970} {"train_loss": -23.718658447265625, "global_step": 163564, "epoch": 1970} {"train_loss": -23.568008422851562, "global_step": 163565, "epoch": 1970} {"train_loss": -23.799108505249023, "global_step": 163566, "epoch": 1970} {"train_loss": -23.486066818237305, "global_step": 163567, "epoch": 1970} {"train_loss": -23.72696304321289, "global_step": 163568, "epoch": 1970} {"train_loss": -23.794965744018555, "global_step": 163569, "epoch": 1970} {"train_loss": -23.99317169189453, "global_step": 163570, "epoch": 1970} {"train_loss": -23.60499382019043, "global_step": 163571, "epoch": 1970} {"train_loss": -23.611438751220703, "global_step": 163572, "epoch": 1970} {"train_loss": -23.62489128112793, "global_step": 163573, "epoch": 1970} {"train_loss": -23.370553970336914, "global_step": 163574, "epoch": 1970} {"train_loss": -23.705488204956055, "global_step": 163575, "epoch": 1970} {"train_loss": -23.39836883544922, "global_step": 163576, "epoch": 1970} {"train_loss": -22.50545310974121, "global_step": 163577, "epoch": 1970} {"train_loss": -21.94571876525879, "global_step": 163578, "epoch": 1970} {"train_loss": -23.272960662841797, "global_step": 163579, "epoch": 1970} {"train_loss": -23.106945037841797, "global_step": 163580, "epoch": 1970} {"train_loss": -22.54062271118164, "global_step": 163581, "epoch": 1970} {"train_loss": -23.12771987915039, "global_step": 163582, "epoch": 1970} {"train_loss": -23.143224716186523, "global_step": 163583, "epoch": 1970} {"train_loss": -23.229135513305664, "global_step": 163584, "epoch": 1970} {"train_loss": -23.21510124206543, "global_step": 163585, "epoch": 1970} {"train_loss": -22.867595672607422, "global_step": 163586, "epoch": 1970} {"train_loss": -23.448211669921875, "global_step": 163587, "epoch": 1970} {"train_loss": -23.15085220336914, "global_step": 163588, "epoch": 1970} {"train_loss": -23.399749755859375, "global_step": 163589, "epoch": 1970} {"train_loss": -23.128889083862305, "global_step": 163590, "epoch": 1970} {"train_loss": -23.413179397583008, "global_step": 163591, "epoch": 1970} {"train_loss": -23.444965730230493, "global_step": 163592, "epoch": 1970, "val_loss": 6476598.0} {"train_loss": -23.278217315673828, "global_step": 163593, "epoch": 1971} {"train_loss": -23.242109298706055, "global_step": 163594, "epoch": 1971} {"train_loss": -22.804309844970703, "global_step": 163595, "epoch": 1971} {"train_loss": -23.036949157714844, "global_step": 163596, "epoch": 1971} {"train_loss": -22.902631759643555, "global_step": 163597, "epoch": 1971} {"train_loss": -23.050573348999023, "global_step": 163598, "epoch": 1971} {"train_loss": -23.159915924072266, "global_step": 163599, "epoch": 1971} {"train_loss": -22.763946533203125, "global_step": 163600, "epoch": 1971} {"train_loss": -23.06931495666504, "global_step": 163601, "epoch": 1971} {"train_loss": -22.646032333374023, "global_step": 163602, "epoch": 1971} {"train_loss": -23.091758728027344, "global_step": 163603, "epoch": 1971} {"train_loss": -23.351667404174805, "global_step": 163604, "epoch": 1971} {"train_loss": -23.479711532592773, "global_step": 163605, "epoch": 1971} {"train_loss": -23.732437133789062, "global_step": 163606, "epoch": 1971} {"train_loss": -23.274518966674805, "global_step": 163607, "epoch": 1971} {"train_loss": -23.390838623046875, "global_step": 163608, "epoch": 1971} {"train_loss": -23.598737716674805, "global_step": 163609, "epoch": 1971} {"train_loss": -23.45118522644043, "global_step": 163610, "epoch": 1971} {"train_loss": -23.4727840423584, "global_step": 163611, "epoch": 1971} {"train_loss": -23.048233032226562, "global_step": 163612, "epoch": 1971} {"train_loss": -23.29904556274414, "global_step": 163613, "epoch": 1971} {"train_loss": -23.702207565307617, "global_step": 163614, "epoch": 1971} {"train_loss": -23.79749298095703, "global_step": 163615, "epoch": 1971} {"train_loss": -23.47136878967285, "global_step": 163616, "epoch": 1971} {"train_loss": -23.62794303894043, "global_step": 163617, "epoch": 1971} {"train_loss": -23.77522850036621, "global_step": 163618, "epoch": 1971} {"train_loss": -23.588428497314453, "global_step": 163619, "epoch": 1971} {"train_loss": -23.787031173706055, "global_step": 163620, "epoch": 1971} {"train_loss": -23.79056167602539, "global_step": 163621, "epoch": 1971} {"train_loss": -23.827451705932617, "global_step": 163622, "epoch": 1971} {"train_loss": -23.51250648498535, "global_step": 163623, "epoch": 1971} {"train_loss": -23.739469528198242, "global_step": 163624, "epoch": 1971} {"train_loss": -23.83705711364746, "global_step": 163625, "epoch": 1971} {"train_loss": -23.62436294555664, "global_step": 163626, "epoch": 1971} {"train_loss": -23.769357681274414, "global_step": 163627, "epoch": 1971} {"train_loss": -23.54305076599121, "global_step": 163628, "epoch": 1971} {"train_loss": -23.808881759643555, "global_step": 163629, "epoch": 1971} {"train_loss": -23.287734985351562, "global_step": 163630, "epoch": 1971} {"train_loss": -24.22601318359375, "global_step": 163631, "epoch": 1971} {"train_loss": -23.808364868164062, "global_step": 163632, "epoch": 1971} {"train_loss": -23.929731369018555, "global_step": 163633, "epoch": 1971} {"train_loss": -23.53687858581543, "global_step": 163634, "epoch": 1971} {"train_loss": -23.498472213745117, "global_step": 163635, "epoch": 1971} {"train_loss": -23.467369079589844, "global_step": 163636, "epoch": 1971} {"train_loss": -23.97311782836914, "global_step": 163637, "epoch": 1971} {"train_loss": -23.58930206298828, "global_step": 163638, "epoch": 1971} {"train_loss": -23.549428939819336, "global_step": 163639, "epoch": 1971} {"train_loss": -23.51786994934082, "global_step": 163640, "epoch": 1971} {"train_loss": -23.48672103881836, "global_step": 163641, "epoch": 1971} {"train_loss": -23.674468994140625, "global_step": 163642, "epoch": 1971} {"train_loss": -23.798721313476562, "global_step": 163643, "epoch": 1971} {"train_loss": -23.606168746948242, "global_step": 163644, "epoch": 1971} {"train_loss": -23.642932891845703, "global_step": 163645, "epoch": 1971} {"train_loss": -23.679372787475586, "global_step": 163646, "epoch": 1971} {"train_loss": -23.871145248413086, "global_step": 163647, "epoch": 1971} {"train_loss": -23.429784774780273, "global_step": 163648, "epoch": 1971} {"train_loss": -23.65431785583496, "global_step": 163649, "epoch": 1971} {"train_loss": -23.74444007873535, "global_step": 163650, "epoch": 1971} {"train_loss": -23.81671714782715, "global_step": 163651, "epoch": 1971} {"train_loss": -23.530691146850586, "global_step": 163652, "epoch": 1971} {"train_loss": -23.862844467163086, "global_step": 163653, "epoch": 1971} {"train_loss": -23.704116821289062, "global_step": 163654, "epoch": 1971} {"train_loss": -23.816776275634766, "global_step": 163655, "epoch": 1971} {"train_loss": -23.943603515625, "global_step": 163656, "epoch": 1971} {"train_loss": -23.737911224365234, "global_step": 163657, "epoch": 1971} {"train_loss": -23.693708419799805, "global_step": 163658, "epoch": 1971} {"train_loss": -23.71648597717285, "global_step": 163659, "epoch": 1971} {"train_loss": -24.010177612304688, "global_step": 163660, "epoch": 1971} {"train_loss": -23.84619140625, "global_step": 163661, "epoch": 1971} {"train_loss": -23.658679962158203, "global_step": 163662, "epoch": 1971} {"train_loss": -23.782236099243164, "global_step": 163663, "epoch": 1971} {"train_loss": -23.45703125, "global_step": 163664, "epoch": 1971} {"train_loss": -23.673131942749023, "global_step": 163665, "epoch": 1971} {"train_loss": -23.540719985961914, "global_step": 163666, "epoch": 1971} {"train_loss": -23.3514347076416, "global_step": 163667, "epoch": 1971} {"train_loss": -23.469823837280273, "global_step": 163668, "epoch": 1971} {"train_loss": -23.8347110748291, "global_step": 163669, "epoch": 1971} {"train_loss": -23.712541580200195, "global_step": 163670, "epoch": 1971} {"train_loss": -23.845077514648438, "global_step": 163671, "epoch": 1971} {"train_loss": -23.623186111450195, "global_step": 163672, "epoch": 1971} {"train_loss": -23.266305923461914, "global_step": 163673, "epoch": 1971} {"train_loss": -23.619184494018555, "global_step": 163674, "epoch": 1971} {"train_loss": -23.553022568484387, "global_step": 163675, "epoch": 1971, "val_loss": 6453795.0} {"train_loss": -23.548213958740234, "global_step": 163676, "epoch": 1972} {"train_loss": -23.259485244750977, "global_step": 163677, "epoch": 1972} {"train_loss": -23.34107780456543, "global_step": 163678, "epoch": 1972} {"train_loss": -23.57547378540039, "global_step": 163679, "epoch": 1972} {"train_loss": -23.46722984313965, "global_step": 163680, "epoch": 1972} {"train_loss": -23.17502784729004, "global_step": 163681, "epoch": 1972} {"train_loss": -23.397138595581055, "global_step": 163682, "epoch": 1972} {"train_loss": -23.30368423461914, "global_step": 163683, "epoch": 1972} {"train_loss": -23.38187599182129, "global_step": 163684, "epoch": 1972} {"train_loss": -23.079252243041992, "global_step": 163685, "epoch": 1972} {"train_loss": -23.213146209716797, "global_step": 163686, "epoch": 1972} {"train_loss": -23.41995620727539, "global_step": 163687, "epoch": 1972} {"train_loss": -23.40754508972168, "global_step": 163688, "epoch": 1972} {"train_loss": -23.306766510009766, "global_step": 163689, "epoch": 1972} {"train_loss": -23.386075973510742, "global_step": 163690, "epoch": 1972} {"train_loss": -23.567594528198242, "global_step": 163691, "epoch": 1972} {"train_loss": -23.17142677307129, "global_step": 163692, "epoch": 1972} {"train_loss": -23.760469436645508, "global_step": 163693, "epoch": 1972} {"train_loss": -23.51122283935547, "global_step": 163694, "epoch": 1972} {"train_loss": -23.7386417388916, "global_step": 163695, "epoch": 1972} {"train_loss": -23.71472930908203, "global_step": 163696, "epoch": 1972} {"train_loss": -23.412809371948242, "global_step": 163697, "epoch": 1972} {"train_loss": -23.436113357543945, "global_step": 163698, "epoch": 1972} {"train_loss": -23.503671646118164, "global_step": 163699, "epoch": 1972} {"train_loss": -23.672012329101562, "global_step": 163700, "epoch": 1972} {"train_loss": -23.569902420043945, "global_step": 163701, "epoch": 1972} {"train_loss": -23.635168075561523, "global_step": 163702, "epoch": 1972} {"train_loss": -23.50394058227539, "global_step": 163703, "epoch": 1972} {"train_loss": -23.61408233642578, "global_step": 163704, "epoch": 1972} {"train_loss": -23.59432029724121, "global_step": 163705, "epoch": 1972} {"train_loss": -23.4495906829834, "global_step": 163706, "epoch": 1972} {"train_loss": -23.513065338134766, "global_step": 163707, "epoch": 1972} {"train_loss": -23.398046493530273, "global_step": 163708, "epoch": 1972} {"train_loss": -23.471878051757812, "global_step": 163709, "epoch": 1972} {"train_loss": -23.561243057250977, "global_step": 163710, "epoch": 1972} {"train_loss": -23.69562339782715, "global_step": 163711, "epoch": 1972} {"train_loss": -23.8751277923584, "global_step": 163712, "epoch": 1972} {"train_loss": -23.586156845092773, "global_step": 163713, "epoch": 1972} {"train_loss": -23.508237838745117, "global_step": 163714, "epoch": 1972} {"train_loss": -23.343984603881836, "global_step": 163715, "epoch": 1972} {"train_loss": -23.7927303314209, "global_step": 163716, "epoch": 1972} {"train_loss": -23.271902084350586, "global_step": 163717, "epoch": 1972} {"train_loss": -23.424697875976562, "global_step": 163718, "epoch": 1972} {"train_loss": -23.65475082397461, "global_step": 163719, "epoch": 1972} {"train_loss": -23.356388092041016, "global_step": 163720, "epoch": 1972} {"train_loss": -23.558515548706055, "global_step": 163721, "epoch": 1972} {"train_loss": -23.87689971923828, "global_step": 163722, "epoch": 1972} {"train_loss": -23.601346969604492, "global_step": 163723, "epoch": 1972} {"train_loss": -23.562177658081055, "global_step": 163724, "epoch": 1972} {"train_loss": -23.3829402923584, "global_step": 163725, "epoch": 1972} {"train_loss": -23.692779541015625, "global_step": 163726, "epoch": 1972} {"train_loss": -23.68544578552246, "global_step": 163727, "epoch": 1972} {"train_loss": -23.849327087402344, "global_step": 163728, "epoch": 1972} {"train_loss": -23.7740535736084, "global_step": 163729, "epoch": 1972} {"train_loss": -23.826871871948242, "global_step": 163730, "epoch": 1972} {"train_loss": -23.773008346557617, "global_step": 163731, "epoch": 1972} {"train_loss": -23.65505599975586, "global_step": 163732, "epoch": 1972} {"train_loss": -23.51563835144043, "global_step": 163733, "epoch": 1972} {"train_loss": -23.943872451782227, "global_step": 163734, "epoch": 1972} {"train_loss": -23.585880279541016, "global_step": 163735, "epoch": 1972} {"train_loss": -23.72313117980957, "global_step": 163736, "epoch": 1972} {"train_loss": -23.314844131469727, "global_step": 163737, "epoch": 1972} {"train_loss": -23.512418746948242, "global_step": 163738, "epoch": 1972} {"train_loss": -23.4989013671875, "global_step": 163739, "epoch": 1972} {"train_loss": -23.666040420532227, "global_step": 163740, "epoch": 1972} {"train_loss": -23.492874145507812, "global_step": 163741, "epoch": 1972} {"train_loss": -23.533369064331055, "global_step": 163742, "epoch": 1972} {"train_loss": -23.80508804321289, "global_step": 163743, "epoch": 1972} {"train_loss": -23.596786499023438, "global_step": 163744, "epoch": 1972} {"train_loss": -23.386112213134766, "global_step": 163745, "epoch": 1972} {"train_loss": -23.687101364135742, "global_step": 163746, "epoch": 1972} {"train_loss": -23.283742904663086, "global_step": 163747, "epoch": 1972} {"train_loss": -23.537023544311523, "global_step": 163748, "epoch": 1972} {"train_loss": -23.66477394104004, "global_step": 163749, "epoch": 1972} {"train_loss": -23.52821922302246, "global_step": 163750, "epoch": 1972} {"train_loss": -23.570789337158203, "global_step": 163751, "epoch": 1972} {"train_loss": -23.591447830200195, "global_step": 163752, "epoch": 1972} {"train_loss": -24.042821884155273, "global_step": 163753, "epoch": 1972} {"train_loss": -23.71583366394043, "global_step": 163754, "epoch": 1972} {"train_loss": -23.821826934814453, "global_step": 163755, "epoch": 1972} {"train_loss": -23.74287986755371, "global_step": 163756, "epoch": 1972} {"train_loss": -23.747053146362305, "global_step": 163757, "epoch": 1972} {"train_loss": -23.557568860341267, "global_step": 163758, "epoch": 1972, "val_loss": 6344088.0} {"train_loss": -22.948476791381836, "global_step": 163759, "epoch": 1973} {"train_loss": -22.26456642150879, "global_step": 163760, "epoch": 1973} {"train_loss": -22.027280807495117, "global_step": 163761, "epoch": 1973} {"train_loss": -22.42585563659668, "global_step": 163762, "epoch": 1973} {"train_loss": -22.690603256225586, "global_step": 163763, "epoch": 1973} {"train_loss": -22.20638084411621, "global_step": 163764, "epoch": 1973} {"train_loss": -22.678762435913086, "global_step": 163765, "epoch": 1973} {"train_loss": -23.203189849853516, "global_step": 163766, "epoch": 1973} {"train_loss": -22.767229080200195, "global_step": 163767, "epoch": 1973} {"train_loss": -23.26934242248535, "global_step": 163768, "epoch": 1973} {"train_loss": -22.503341674804688, "global_step": 163769, "epoch": 1973} {"train_loss": -23.20216941833496, "global_step": 163770, "epoch": 1973} {"train_loss": -23.08681297302246, "global_step": 163771, "epoch": 1973} {"train_loss": -23.128477096557617, "global_step": 163772, "epoch": 1973} {"train_loss": -22.870948791503906, "global_step": 163773, "epoch": 1973} {"train_loss": -23.327558517456055, "global_step": 163774, "epoch": 1973} {"train_loss": -23.363208770751953, "global_step": 163775, "epoch": 1973} {"train_loss": -22.779037475585938, "global_step": 163776, "epoch": 1973} {"train_loss": -22.973751068115234, "global_step": 163777, "epoch": 1973} {"train_loss": -23.206205368041992, "global_step": 163778, "epoch": 1973} {"train_loss": -23.235200881958008, "global_step": 163779, "epoch": 1973} {"train_loss": -23.24687957763672, "global_step": 163780, "epoch": 1973} {"train_loss": -23.297163009643555, "global_step": 163781, "epoch": 1973} {"train_loss": -23.310392379760742, "global_step": 163782, "epoch": 1973} {"train_loss": -23.324338912963867, "global_step": 163783, "epoch": 1973} {"train_loss": -23.11150550842285, "global_step": 163784, "epoch": 1973} {"train_loss": -23.1103572845459, "global_step": 163785, "epoch": 1973} {"train_loss": -23.492053985595703, "global_step": 163786, "epoch": 1973} {"train_loss": -23.419055938720703, "global_step": 163787, "epoch": 1973} {"train_loss": -23.526473999023438, "global_step": 163788, "epoch": 1973} {"train_loss": -23.31513786315918, "global_step": 163789, "epoch": 1973} {"train_loss": -23.59665870666504, "global_step": 163790, "epoch": 1973} {"train_loss": -23.64750099182129, "global_step": 163791, "epoch": 1973} {"train_loss": -23.628067016601562, "global_step": 163792, "epoch": 1973} {"train_loss": -23.250776290893555, "global_step": 163793, "epoch": 1973} {"train_loss": -23.926786422729492, "global_step": 163794, "epoch": 1973} {"train_loss": -23.685239791870117, "global_step": 163795, "epoch": 1973} {"train_loss": -23.778615951538086, "global_step": 163796, "epoch": 1973} {"train_loss": -23.453357696533203, "global_step": 163797, "epoch": 1973} {"train_loss": -23.710603713989258, "global_step": 163798, "epoch": 1973} {"train_loss": -23.886625289916992, "global_step": 163799, "epoch": 1973} {"train_loss": -23.535512924194336, "global_step": 163800, "epoch": 1973} {"train_loss": -23.660385131835938, "global_step": 163801, "epoch": 1973} {"train_loss": -23.594396591186523, "global_step": 163802, "epoch": 1973} {"train_loss": -23.60194206237793, "global_step": 163803, "epoch": 1973} {"train_loss": -23.591087341308594, "global_step": 163804, "epoch": 1973} {"train_loss": -23.583681106567383, "global_step": 163805, "epoch": 1973} {"train_loss": -23.735002517700195, "global_step": 163806, "epoch": 1973} {"train_loss": -23.721372604370117, "global_step": 163807, "epoch": 1973} {"train_loss": -23.865493774414062, "global_step": 163808, "epoch": 1973} {"train_loss": -24.05096435546875, "global_step": 163809, "epoch": 1973} {"train_loss": -23.578388214111328, "global_step": 163810, "epoch": 1973} {"train_loss": -23.341753005981445, "global_step": 163811, "epoch": 1973} {"train_loss": -23.075674057006836, "global_step": 163812, "epoch": 1973} {"train_loss": -23.041797637939453, "global_step": 163813, "epoch": 1973} {"train_loss": -23.239667892456055, "global_step": 163814, "epoch": 1973} {"train_loss": -22.627042770385742, "global_step": 163815, "epoch": 1973} {"train_loss": -22.683805465698242, "global_step": 163816, "epoch": 1973} {"train_loss": -22.889087677001953, "global_step": 163817, "epoch": 1973} {"train_loss": -23.21196174621582, "global_step": 163818, "epoch": 1973} {"train_loss": -22.93630027770996, "global_step": 163819, "epoch": 1973} {"train_loss": -22.801055908203125, "global_step": 163820, "epoch": 1973} {"train_loss": -23.16996192932129, "global_step": 163821, "epoch": 1973} {"train_loss": -23.272626876831055, "global_step": 163822, "epoch": 1973} {"train_loss": -23.10904884338379, "global_step": 163823, "epoch": 1973} {"train_loss": -23.115812301635742, "global_step": 163824, "epoch": 1973} {"train_loss": -23.374082565307617, "global_step": 163825, "epoch": 1973} {"train_loss": -23.178091049194336, "global_step": 163826, "epoch": 1973} {"train_loss": -23.109594345092773, "global_step": 163827, "epoch": 1973} {"train_loss": -23.35791778564453, "global_step": 163828, "epoch": 1973} {"train_loss": -23.127042770385742, "global_step": 163829, "epoch": 1973} {"train_loss": -23.07118797302246, "global_step": 163830, "epoch": 1973} {"train_loss": -23.43311882019043, "global_step": 163831, "epoch": 1973} {"train_loss": -23.36372947692871, "global_step": 163832, "epoch": 1973} {"train_loss": -23.495960235595703, "global_step": 163833, "epoch": 1973} {"train_loss": -23.287649154663086, "global_step": 163834, "epoch": 1973} {"train_loss": -23.692323684692383, "global_step": 163835, "epoch": 1973} {"train_loss": -23.81734275817871, "global_step": 163836, "epoch": 1973} {"train_loss": -23.502063751220703, "global_step": 163837, "epoch": 1973} {"train_loss": -23.541748046875, "global_step": 163838, "epoch": 1973} {"train_loss": -23.367530822753906, "global_step": 163839, "epoch": 1973} {"train_loss": -23.433549880981445, "global_step": 163840, "epoch": 1973} {"train_loss": -23.261969003332666, "global_step": 163841, "epoch": 1973, "val_loss": 6296563.5} {"train_loss": -23.024356842041016, "global_step": 163842, "epoch": 1974} {"train_loss": -23.522653579711914, "global_step": 163843, "epoch": 1974} {"train_loss": -23.306930541992188, "global_step": 163844, "epoch": 1974} {"train_loss": -23.69038963317871, "global_step": 163845, "epoch": 1974} {"train_loss": -23.74129295349121, "global_step": 163846, "epoch": 1974} {"train_loss": -23.201873779296875, "global_step": 163847, "epoch": 1974} {"train_loss": -23.245145797729492, "global_step": 163848, "epoch": 1974} {"train_loss": -23.419151306152344, "global_step": 163849, "epoch": 1974} {"train_loss": -23.27617073059082, "global_step": 163850, "epoch": 1974} {"train_loss": -22.88296127319336, "global_step": 163851, "epoch": 1974} {"train_loss": -23.341123580932617, "global_step": 163852, "epoch": 1974} {"train_loss": -23.42575454711914, "global_step": 163853, "epoch": 1974} {"train_loss": -23.120681762695312, "global_step": 163854, "epoch": 1974} {"train_loss": -23.85343360900879, "global_step": 163855, "epoch": 1974} {"train_loss": -23.54115104675293, "global_step": 163856, "epoch": 1974} {"train_loss": -23.551916122436523, "global_step": 163857, "epoch": 1974} {"train_loss": -23.30291175842285, "global_step": 163858, "epoch": 1974} {"train_loss": -24.03902244567871, "global_step": 163859, "epoch": 1974} {"train_loss": -23.286588668823242, "global_step": 163860, "epoch": 1974} {"train_loss": -23.19455909729004, "global_step": 163861, "epoch": 1974} {"train_loss": -23.93320655822754, "global_step": 163862, "epoch": 1974} {"train_loss": -23.42930030822754, "global_step": 163863, "epoch": 1974} {"train_loss": -23.70461082458496, "global_step": 163864, "epoch": 1974} {"train_loss": -23.43269157409668, "global_step": 163865, "epoch": 1974} {"train_loss": -23.1158447265625, "global_step": 163866, "epoch": 1974} {"train_loss": -23.202423095703125, "global_step": 163867, "epoch": 1974} {"train_loss": -23.59565544128418, "global_step": 163868, "epoch": 1974} {"train_loss": -23.743011474609375, "global_step": 163869, "epoch": 1974} {"train_loss": -23.393766403198242, "global_step": 163870, "epoch": 1974} {"train_loss": -23.398508071899414, "global_step": 163871, "epoch": 1974} {"train_loss": -23.790477752685547, "global_step": 163872, "epoch": 1974} {"train_loss": -23.563922882080078, "global_step": 163873, "epoch": 1974} {"train_loss": -23.193456649780273, "global_step": 163874, "epoch": 1974} {"train_loss": -23.48756217956543, "global_step": 163875, "epoch": 1974} {"train_loss": -23.55997657775879, "global_step": 163876, "epoch": 1974} {"train_loss": -23.9141902923584, "global_step": 163877, "epoch": 1974} {"train_loss": -23.87773895263672, "global_step": 163878, "epoch": 1974} {"train_loss": -23.67616081237793, "global_step": 163879, "epoch": 1974} {"train_loss": -23.36452293395996, "global_step": 163880, "epoch": 1974} {"train_loss": -23.884647369384766, "global_step": 163881, "epoch": 1974} {"train_loss": -23.878732681274414, "global_step": 163882, "epoch": 1974} {"train_loss": -23.436986923217773, "global_step": 163883, "epoch": 1974} {"train_loss": -23.40955924987793, "global_step": 163884, "epoch": 1974} {"train_loss": -23.69732666015625, "global_step": 163885, "epoch": 1974} {"train_loss": -23.727880477905273, "global_step": 163886, "epoch": 1974} {"train_loss": -23.3341064453125, "global_step": 163887, "epoch": 1974} {"train_loss": -23.595693588256836, "global_step": 163888, "epoch": 1974} {"train_loss": -23.654142379760742, "global_step": 163889, "epoch": 1974} {"train_loss": -23.410429000854492, "global_step": 163890, "epoch": 1974} {"train_loss": -23.385229110717773, "global_step": 163891, "epoch": 1974} {"train_loss": -23.85921859741211, "global_step": 163892, "epoch": 1974} {"train_loss": -23.57034683227539, "global_step": 163893, "epoch": 1974} {"train_loss": -23.320241928100586, "global_step": 163894, "epoch": 1974} {"train_loss": -23.751455307006836, "global_step": 163895, "epoch": 1974} {"train_loss": -23.748525619506836, "global_step": 163896, "epoch": 1974} {"train_loss": -23.584407806396484, "global_step": 163897, "epoch": 1974} {"train_loss": -23.522098541259766, "global_step": 163898, "epoch": 1974} {"train_loss": -23.635465621948242, "global_step": 163899, "epoch": 1974} {"train_loss": -23.6628360748291, "global_step": 163900, "epoch": 1974} {"train_loss": -23.668127059936523, "global_step": 163901, "epoch": 1974} {"train_loss": -23.805524826049805, "global_step": 163902, "epoch": 1974} {"train_loss": -23.53876304626465, "global_step": 163903, "epoch": 1974} {"train_loss": -23.859540939331055, "global_step": 163904, "epoch": 1974} {"train_loss": -23.503381729125977, "global_step": 163905, "epoch": 1974} {"train_loss": -23.4046688079834, "global_step": 163906, "epoch": 1974} {"train_loss": -23.76190185546875, "global_step": 163907, "epoch": 1974} {"train_loss": -23.910545349121094, "global_step": 163908, "epoch": 1974} {"train_loss": -23.609331130981445, "global_step": 163909, "epoch": 1974} {"train_loss": -23.806856155395508, "global_step": 163910, "epoch": 1974} {"train_loss": -23.217370986938477, "global_step": 163911, "epoch": 1974} {"train_loss": -23.644397735595703, "global_step": 163912, "epoch": 1974} {"train_loss": -23.596513748168945, "global_step": 163913, "epoch": 1974} {"train_loss": -23.51321792602539, "global_step": 163914, "epoch": 1974} {"train_loss": -23.775360107421875, "global_step": 163915, "epoch": 1974} {"train_loss": -23.64620018005371, "global_step": 163916, "epoch": 1974} {"train_loss": -23.428646087646484, "global_step": 163917, "epoch": 1974} {"train_loss": -23.335250854492188, "global_step": 163918, "epoch": 1974} {"train_loss": -23.398221969604492, "global_step": 163919, "epoch": 1974} {"train_loss": -23.880613327026367, "global_step": 163920, "epoch": 1974} {"train_loss": -23.601774215698242, "global_step": 163921, "epoch": 1974} {"train_loss": -23.31294059753418, "global_step": 163922, "epoch": 1974} {"train_loss": -23.39846420288086, "global_step": 163923, "epoch": 1974} {"train_loss": -23.52187140591173, "global_step": 163924, "epoch": 1974, "val_loss": 6412575.0} {"train_loss": -23.3328914642334, "global_step": 163925, "epoch": 1975} {"train_loss": -22.99106216430664, "global_step": 163926, "epoch": 1975} {"train_loss": -22.603517532348633, "global_step": 163927, "epoch": 1975} {"train_loss": -23.19717025756836, "global_step": 163928, "epoch": 1975} {"train_loss": -22.728466033935547, "global_step": 163929, "epoch": 1975} {"train_loss": -23.435928344726562, "global_step": 163930, "epoch": 1975} {"train_loss": -22.668031692504883, "global_step": 163931, "epoch": 1975} {"train_loss": -22.419557571411133, "global_step": 163932, "epoch": 1975} {"train_loss": -23.3117733001709, "global_step": 163933, "epoch": 1975} {"train_loss": -22.40927505493164, "global_step": 163934, "epoch": 1975} {"train_loss": -22.95130729675293, "global_step": 163935, "epoch": 1975} {"train_loss": -22.773818969726562, "global_step": 163936, "epoch": 1975} {"train_loss": -23.456893920898438, "global_step": 163937, "epoch": 1975} {"train_loss": -23.247873306274414, "global_step": 163938, "epoch": 1975} {"train_loss": -23.65968894958496, "global_step": 163939, "epoch": 1975} {"train_loss": -23.121585845947266, "global_step": 163940, "epoch": 1975} {"train_loss": -23.1060848236084, "global_step": 163941, "epoch": 1975} {"train_loss": -22.987319946289062, "global_step": 163942, "epoch": 1975} {"train_loss": -23.446165084838867, "global_step": 163943, "epoch": 1975} {"train_loss": -23.099353790283203, "global_step": 163944, "epoch": 1975} {"train_loss": -23.44357681274414, "global_step": 163945, "epoch": 1975} {"train_loss": -23.06178855895996, "global_step": 163946, "epoch": 1975} {"train_loss": -23.333646774291992, "global_step": 163947, "epoch": 1975} {"train_loss": -23.381803512573242, "global_step": 163948, "epoch": 1975} {"train_loss": -23.2604923248291, "global_step": 163949, "epoch": 1975} {"train_loss": -23.370397567749023, "global_step": 163950, "epoch": 1975} {"train_loss": -23.776599884033203, "global_step": 163951, "epoch": 1975} {"train_loss": -23.108537673950195, "global_step": 163952, "epoch": 1975} {"train_loss": -23.626867294311523, "global_step": 163953, "epoch": 1975} {"train_loss": -23.059446334838867, "global_step": 163954, "epoch": 1975} {"train_loss": -23.15163230895996, "global_step": 163955, "epoch": 1975} {"train_loss": -23.511829376220703, "global_step": 163956, "epoch": 1975} {"train_loss": -23.46156120300293, "global_step": 163957, "epoch": 1975} {"train_loss": -23.314573287963867, "global_step": 163958, "epoch": 1975} {"train_loss": -23.25126075744629, "global_step": 163959, "epoch": 1975} {"train_loss": -23.28327751159668, "global_step": 163960, "epoch": 1975} {"train_loss": -23.47463035583496, "global_step": 163961, "epoch": 1975} {"train_loss": -23.678504943847656, "global_step": 163962, "epoch": 1975} {"train_loss": -23.21370506286621, "global_step": 163963, "epoch": 1975} {"train_loss": -23.659822463989258, "global_step": 163964, "epoch": 1975} {"train_loss": -23.201269149780273, "global_step": 163965, "epoch": 1975} {"train_loss": -23.57069969177246, "global_step": 163966, "epoch": 1975} {"train_loss": -23.687597274780273, "global_step": 163967, "epoch": 1975} {"train_loss": -23.6728458404541, "global_step": 163968, "epoch": 1975} {"train_loss": -23.696884155273438, "global_step": 163969, "epoch": 1975} {"train_loss": -23.83662986755371, "global_step": 163970, "epoch": 1975} {"train_loss": -23.42307472229004, "global_step": 163971, "epoch": 1975} {"train_loss": -23.969379425048828, "global_step": 163972, "epoch": 1975} {"train_loss": -24.060087203979492, "global_step": 163973, "epoch": 1975} {"train_loss": -23.259456634521484, "global_step": 163974, "epoch": 1975} {"train_loss": -23.65187644958496, "global_step": 163975, "epoch": 1975} {"train_loss": -23.79201316833496, "global_step": 163976, "epoch": 1975} {"train_loss": -23.559513092041016, "global_step": 163977, "epoch": 1975} {"train_loss": -23.180212020874023, "global_step": 163978, "epoch": 1975} {"train_loss": -23.2935848236084, "global_step": 163979, "epoch": 1975} {"train_loss": -23.563703536987305, "global_step": 163980, "epoch": 1975} {"train_loss": -23.434158325195312, "global_step": 163981, "epoch": 1975} {"train_loss": -24.05742073059082, "global_step": 163982, "epoch": 1975} {"train_loss": -23.832082748413086, "global_step": 163983, "epoch": 1975} {"train_loss": -23.784616470336914, "global_step": 163984, "epoch": 1975} {"train_loss": -23.368356704711914, "global_step": 163985, "epoch": 1975} {"train_loss": -23.46854591369629, "global_step": 163986, "epoch": 1975} {"train_loss": -23.307113647460938, "global_step": 163987, "epoch": 1975} {"train_loss": -23.697101593017578, "global_step": 163988, "epoch": 1975} {"train_loss": -23.798192977905273, "global_step": 163989, "epoch": 1975} {"train_loss": -23.62725257873535, "global_step": 163990, "epoch": 1975} {"train_loss": -23.732805252075195, "global_step": 163991, "epoch": 1975} {"train_loss": -23.52000617980957, "global_step": 163992, "epoch": 1975} {"train_loss": -23.86341094970703, "global_step": 163993, "epoch": 1975} {"train_loss": -23.415674209594727, "global_step": 163994, "epoch": 1975} {"train_loss": -23.73841667175293, "global_step": 163995, "epoch": 1975} {"train_loss": -23.48048210144043, "global_step": 163996, "epoch": 1975} {"train_loss": -23.672800064086914, "global_step": 163997, "epoch": 1975} {"train_loss": -23.746641159057617, "global_step": 163998, "epoch": 1975} {"train_loss": -23.667984008789062, "global_step": 163999, "epoch": 1975} {"train_loss": -23.64206886291504, "global_step": 164000, "epoch": 1975} {"train_loss": -23.6021785736084, "global_step": 164001, "epoch": 1975} {"train_loss": -23.632282257080078, "global_step": 164002, "epoch": 1975} {"train_loss": -23.45989990234375, "global_step": 164003, "epoch": 1975} {"train_loss": -23.430517196655273, "global_step": 164004, "epoch": 1975} {"train_loss": -23.61545181274414, "global_step": 164005, "epoch": 1975} {"train_loss": -23.774457931518555, "global_step": 164006, "epoch": 1975} {"train_loss": -23.414100532072137, "global_step": 164007, "epoch": 1975, "val_loss": 6399225.0} {"train_loss": -23.309310913085938, "global_step": 164008, "epoch": 1976} {"train_loss": -23.623441696166992, "global_step": 164009, "epoch": 1976} {"train_loss": -23.63032341003418, "global_step": 164010, "epoch": 1976} {"train_loss": -23.23248291015625, "global_step": 164011, "epoch": 1976} {"train_loss": -23.67642593383789, "global_step": 164012, "epoch": 1976} {"train_loss": -23.532150268554688, "global_step": 164013, "epoch": 1976} {"train_loss": -23.782522201538086, "global_step": 164014, "epoch": 1976} {"train_loss": -23.326053619384766, "global_step": 164015, "epoch": 1976} {"train_loss": -23.22624969482422, "global_step": 164016, "epoch": 1976} {"train_loss": -23.458053588867188, "global_step": 164017, "epoch": 1976} {"train_loss": -23.41621971130371, "global_step": 164018, "epoch": 1976} {"train_loss": -23.626096725463867, "global_step": 164019, "epoch": 1976} {"train_loss": -22.894115447998047, "global_step": 164020, "epoch": 1976} {"train_loss": -23.148910522460938, "global_step": 164021, "epoch": 1976} {"train_loss": -23.300914764404297, "global_step": 164022, "epoch": 1976} {"train_loss": -23.513898849487305, "global_step": 164023, "epoch": 1976} {"train_loss": -23.394765853881836, "global_step": 164024, "epoch": 1976} {"train_loss": -23.44302749633789, "global_step": 164025, "epoch": 1976} {"train_loss": -23.559783935546875, "global_step": 164026, "epoch": 1976} {"train_loss": -23.819353103637695, "global_step": 164027, "epoch": 1976} {"train_loss": -23.85318946838379, "global_step": 164028, "epoch": 1976} {"train_loss": -23.712583541870117, "global_step": 164029, "epoch": 1976} {"train_loss": -23.705827713012695, "global_step": 164030, "epoch": 1976} {"train_loss": -23.69424819946289, "global_step": 164031, "epoch": 1976} {"train_loss": -23.79740333557129, "global_step": 164032, "epoch": 1976} {"train_loss": -23.662273406982422, "global_step": 164033, "epoch": 1976} {"train_loss": -23.453475952148438, "global_step": 164034, "epoch": 1976} {"train_loss": -23.4570255279541, "global_step": 164035, "epoch": 1976} {"train_loss": -23.5610294342041, "global_step": 164036, "epoch": 1976} {"train_loss": -23.64898681640625, "global_step": 164037, "epoch": 1976} {"train_loss": -23.497060775756836, "global_step": 164038, "epoch": 1976} {"train_loss": -23.51724624633789, "global_step": 164039, "epoch": 1976} {"train_loss": -23.601572036743164, "global_step": 164040, "epoch": 1976} {"train_loss": -23.69856071472168, "global_step": 164041, "epoch": 1976} {"train_loss": -23.178495407104492, "global_step": 164042, "epoch": 1976} {"train_loss": -23.789783477783203, "global_step": 164043, "epoch": 1976} {"train_loss": -23.55122184753418, "global_step": 164044, "epoch": 1976} {"train_loss": -23.906726837158203, "global_step": 164045, "epoch": 1976} {"train_loss": -23.791379928588867, "global_step": 164046, "epoch": 1976} {"train_loss": -23.352773666381836, "global_step": 164047, "epoch": 1976} {"train_loss": -23.490169525146484, "global_step": 164048, "epoch": 1976} {"train_loss": -23.504064559936523, "global_step": 164049, "epoch": 1976} {"train_loss": -23.432851791381836, "global_step": 164050, "epoch": 1976} {"train_loss": -23.76105499267578, "global_step": 164051, "epoch": 1976} {"train_loss": -23.365346908569336, "global_step": 164052, "epoch": 1976} {"train_loss": -23.51607894897461, "global_step": 164053, "epoch": 1976} {"train_loss": -23.62067222595215, "global_step": 164054, "epoch": 1976} {"train_loss": -23.683820724487305, "global_step": 164055, "epoch": 1976} {"train_loss": -23.53274917602539, "global_step": 164056, "epoch": 1976} {"train_loss": -23.96140480041504, "global_step": 164057, "epoch": 1976} {"train_loss": -23.41958999633789, "global_step": 164058, "epoch": 1976} {"train_loss": -23.42170524597168, "global_step": 164059, "epoch": 1976} {"train_loss": -23.43855857849121, "global_step": 164060, "epoch": 1976} {"train_loss": -23.05535888671875, "global_step": 164061, "epoch": 1976} {"train_loss": -23.345577239990234, "global_step": 164062, "epoch": 1976} {"train_loss": -24.004743576049805, "global_step": 164063, "epoch": 1976} {"train_loss": -23.25653076171875, "global_step": 164064, "epoch": 1976} {"train_loss": -23.395544052124023, "global_step": 164065, "epoch": 1976} {"train_loss": -23.6334285736084, "global_step": 164066, "epoch": 1976} {"train_loss": -23.353849411010742, "global_step": 164067, "epoch": 1976} {"train_loss": -23.46417236328125, "global_step": 164068, "epoch": 1976} {"train_loss": -23.757291793823242, "global_step": 164069, "epoch": 1976} {"train_loss": -23.516080856323242, "global_step": 164070, "epoch": 1976} {"train_loss": -23.51618003845215, "global_step": 164071, "epoch": 1976} {"train_loss": -23.829242706298828, "global_step": 164072, "epoch": 1976} {"train_loss": -23.617137908935547, "global_step": 164073, "epoch": 1976} {"train_loss": -23.462387084960938, "global_step": 164074, "epoch": 1976} {"train_loss": -23.63471031188965, "global_step": 164075, "epoch": 1976} {"train_loss": -23.725177764892578, "global_step": 164076, "epoch": 1976} {"train_loss": -23.1795711517334, "global_step": 164077, "epoch": 1976} {"train_loss": -23.674850463867188, "global_step": 164078, "epoch": 1976} {"train_loss": -23.609310150146484, "global_step": 164079, "epoch": 1976} {"train_loss": -23.81244468688965, "global_step": 164080, "epoch": 1976} {"train_loss": -23.74056625366211, "global_step": 164081, "epoch": 1976} {"train_loss": -23.743968963623047, "global_step": 164082, "epoch": 1976} {"train_loss": -23.68488121032715, "global_step": 164083, "epoch": 1976} {"train_loss": -23.8101806640625, "global_step": 164084, "epoch": 1976} {"train_loss": -23.618289947509766, "global_step": 164085, "epoch": 1976} {"train_loss": -23.80198097229004, "global_step": 164086, "epoch": 1976} {"train_loss": -23.87939453125, "global_step": 164087, "epoch": 1976} {"train_loss": -23.76602554321289, "global_step": 164088, "epoch": 1976} {"train_loss": -23.744253158569336, "global_step": 164089, "epoch": 1976} {"train_loss": -23.56112273342638, "global_step": 164090, "epoch": 1976, "val_loss": 6242481.5} {"train_loss": -23.277185440063477, "global_step": 164091, "epoch": 1977} {"train_loss": -23.288761138916016, "global_step": 164092, "epoch": 1977} {"train_loss": -22.961254119873047, "global_step": 164093, "epoch": 1977} {"train_loss": -23.307039260864258, "global_step": 164094, "epoch": 1977} {"train_loss": -23.2574520111084, "global_step": 164095, "epoch": 1977} {"train_loss": -23.135404586791992, "global_step": 164096, "epoch": 1977} {"train_loss": -23.23581314086914, "global_step": 164097, "epoch": 1977} {"train_loss": -23.312286376953125, "global_step": 164098, "epoch": 1977} {"train_loss": -22.722875595092773, "global_step": 164099, "epoch": 1977} {"train_loss": -22.955169677734375, "global_step": 164100, "epoch": 1977} {"train_loss": -23.43941879272461, "global_step": 164101, "epoch": 1977} {"train_loss": -22.9211483001709, "global_step": 164102, "epoch": 1977} {"train_loss": -23.35446548461914, "global_step": 164103, "epoch": 1977} {"train_loss": -23.064367294311523, "global_step": 164104, "epoch": 1977} {"train_loss": -23.721906661987305, "global_step": 164105, "epoch": 1977} {"train_loss": -23.355796813964844, "global_step": 164106, "epoch": 1977} {"train_loss": -23.28278160095215, "global_step": 164107, "epoch": 1977} {"train_loss": -23.249563217163086, "global_step": 164108, "epoch": 1977} {"train_loss": -23.511295318603516, "global_step": 164109, "epoch": 1977} {"train_loss": -23.367284774780273, "global_step": 164110, "epoch": 1977} {"train_loss": -23.44669532775879, "global_step": 164111, "epoch": 1977} {"train_loss": -23.61847496032715, "global_step": 164112, "epoch": 1977} {"train_loss": -23.404024124145508, "global_step": 164113, "epoch": 1977} {"train_loss": -23.544780731201172, "global_step": 164114, "epoch": 1977} {"train_loss": -23.40547752380371, "global_step": 164115, "epoch": 1977} {"train_loss": -23.776809692382812, "global_step": 164116, "epoch": 1977} {"train_loss": -23.611806869506836, "global_step": 164117, "epoch": 1977} {"train_loss": -23.51238441467285, "global_step": 164118, "epoch": 1977} {"train_loss": -23.70003890991211, "global_step": 164119, "epoch": 1977} {"train_loss": -23.690948486328125, "global_step": 164120, "epoch": 1977} {"train_loss": -23.40903091430664, "global_step": 164121, "epoch": 1977} {"train_loss": -23.69748306274414, "global_step": 164122, "epoch": 1977} {"train_loss": -23.461151123046875, "global_step": 164123, "epoch": 1977} {"train_loss": -23.655668258666992, "global_step": 164124, "epoch": 1977} {"train_loss": -23.522356033325195, "global_step": 164125, "epoch": 1977} {"train_loss": -23.380964279174805, "global_step": 164126, "epoch": 1977} {"train_loss": -23.6861629486084, "global_step": 164127, "epoch": 1977} {"train_loss": -23.65321159362793, "global_step": 164128, "epoch": 1977} {"train_loss": -23.759572982788086, "global_step": 164129, "epoch": 1977} {"train_loss": -23.51838493347168, "global_step": 164130, "epoch": 1977} {"train_loss": -23.90964698791504, "global_step": 164131, "epoch": 1977} {"train_loss": -23.9466609954834, "global_step": 164132, "epoch": 1977} {"train_loss": -23.40382194519043, "global_step": 164133, "epoch": 1977} {"train_loss": -23.666601181030273, "global_step": 164134, "epoch": 1977} {"train_loss": -23.524822235107422, "global_step": 164135, "epoch": 1977} {"train_loss": -23.772733688354492, "global_step": 164136, "epoch": 1977} {"train_loss": -23.769956588745117, "global_step": 164137, "epoch": 1977} {"train_loss": -23.7174015045166, "global_step": 164138, "epoch": 1977} {"train_loss": -23.811511993408203, "global_step": 164139, "epoch": 1977} {"train_loss": -23.599498748779297, "global_step": 164140, "epoch": 1977} {"train_loss": -23.75111961364746, "global_step": 164141, "epoch": 1977} {"train_loss": -23.753761291503906, "global_step": 164142, "epoch": 1977} {"train_loss": -23.458084106445312, "global_step": 164143, "epoch": 1977} {"train_loss": -23.4374942779541, "global_step": 164144, "epoch": 1977} {"train_loss": -23.492645263671875, "global_step": 164145, "epoch": 1977} {"train_loss": -23.776229858398438, "global_step": 164146, "epoch": 1977} {"train_loss": -23.394968032836914, "global_step": 164147, "epoch": 1977} {"train_loss": -23.67532730102539, "global_step": 164148, "epoch": 1977} {"train_loss": -23.30508804321289, "global_step": 164149, "epoch": 1977} {"train_loss": -23.44599723815918, "global_step": 164150, "epoch": 1977} {"train_loss": -23.53007698059082, "global_step": 164151, "epoch": 1977} {"train_loss": -23.719202041625977, "global_step": 164152, "epoch": 1977} {"train_loss": -23.54287338256836, "global_step": 164153, "epoch": 1977} {"train_loss": -23.574644088745117, "global_step": 164154, "epoch": 1977} {"train_loss": -23.7856502532959, "global_step": 164155, "epoch": 1977} {"train_loss": -23.606922149658203, "global_step": 164156, "epoch": 1977} {"train_loss": -23.51426124572754, "global_step": 164157, "epoch": 1977} {"train_loss": -23.416362762451172, "global_step": 164158, "epoch": 1977} {"train_loss": -23.87158966064453, "global_step": 164159, "epoch": 1977} {"train_loss": -23.266605377197266, "global_step": 164160, "epoch": 1977} {"train_loss": -23.797269821166992, "global_step": 164161, "epoch": 1977} {"train_loss": -23.928119659423828, "global_step": 164162, "epoch": 1977} {"train_loss": -23.780973434448242, "global_step": 164163, "epoch": 1977} {"train_loss": -23.764968872070312, "global_step": 164164, "epoch": 1977} {"train_loss": -23.59075927734375, "global_step": 164165, "epoch": 1977} {"train_loss": -23.513334274291992, "global_step": 164166, "epoch": 1977} {"train_loss": -23.314332962036133, "global_step": 164167, "epoch": 1977} {"train_loss": -23.790128707885742, "global_step": 164168, "epoch": 1977} {"train_loss": -23.533857345581055, "global_step": 164169, "epoch": 1977} {"train_loss": -23.459674835205078, "global_step": 164170, "epoch": 1977} {"train_loss": -23.299741744995117, "global_step": 164171, "epoch": 1977} {"train_loss": -23.401880264282227, "global_step": 164172, "epoch": 1977} {"train_loss": -23.520383719938348, "global_step": 164173, "epoch": 1977, "val_loss": 6338205.5} {"train_loss": -23.221635818481445, "global_step": 164174, "epoch": 1978} {"train_loss": -23.665075302124023, "global_step": 164175, "epoch": 1978} {"train_loss": -23.245311737060547, "global_step": 164176, "epoch": 1978} {"train_loss": -23.064468383789062, "global_step": 164177, "epoch": 1978} {"train_loss": -22.49544334411621, "global_step": 164178, "epoch": 1978} {"train_loss": -22.625873565673828, "global_step": 164179, "epoch": 1978} {"train_loss": -23.206769943237305, "global_step": 164180, "epoch": 1978} {"train_loss": -23.083118438720703, "global_step": 164181, "epoch": 1978} {"train_loss": -22.871854782104492, "global_step": 164182, "epoch": 1978} {"train_loss": -23.587247848510742, "global_step": 164183, "epoch": 1978} {"train_loss": -22.97132682800293, "global_step": 164184, "epoch": 1978} {"train_loss": -23.697933197021484, "global_step": 164185, "epoch": 1978} {"train_loss": -23.085050582885742, "global_step": 164186, "epoch": 1978} {"train_loss": -23.68010902404785, "global_step": 164187, "epoch": 1978} {"train_loss": -22.96354103088379, "global_step": 164188, "epoch": 1978} {"train_loss": -23.54754638671875, "global_step": 164189, "epoch": 1978} {"train_loss": -23.077497482299805, "global_step": 164190, "epoch": 1978} {"train_loss": -23.2679500579834, "global_step": 164191, "epoch": 1978} {"train_loss": -23.320697784423828, "global_step": 164192, "epoch": 1978} {"train_loss": -22.83416175842285, "global_step": 164193, "epoch": 1978} {"train_loss": -23.389917373657227, "global_step": 164194, "epoch": 1978} {"train_loss": -23.479591369628906, "global_step": 164195, "epoch": 1978} {"train_loss": -23.07562828063965, "global_step": 164196, "epoch": 1978} {"train_loss": -23.272964477539062, "global_step": 164197, "epoch": 1978} {"train_loss": -23.812467575073242, "global_step": 164198, "epoch": 1978} {"train_loss": -23.371784210205078, "global_step": 164199, "epoch": 1978} {"train_loss": -23.52528953552246, "global_step": 164200, "epoch": 1978} {"train_loss": -23.844223022460938, "global_step": 164201, "epoch": 1978} {"train_loss": -23.35295867919922, "global_step": 164202, "epoch": 1978} {"train_loss": -23.3053035736084, "global_step": 164203, "epoch": 1978} {"train_loss": -23.644855499267578, "global_step": 164204, "epoch": 1978} {"train_loss": -23.44007682800293, "global_step": 164205, "epoch": 1978} {"train_loss": -23.224164962768555, "global_step": 164206, "epoch": 1978} {"train_loss": -23.543994903564453, "global_step": 164207, "epoch": 1978} {"train_loss": -23.679759979248047, "global_step": 164208, "epoch": 1978} {"train_loss": -23.858097076416016, "global_step": 164209, "epoch": 1978} {"train_loss": -23.77640724182129, "global_step": 164210, "epoch": 1978} {"train_loss": -23.6284122467041, "global_step": 164211, "epoch": 1978} {"train_loss": -23.7728328704834, "global_step": 164212, "epoch": 1978} {"train_loss": -23.6472110748291, "global_step": 164213, "epoch": 1978} {"train_loss": -23.735103607177734, "global_step": 164214, "epoch": 1978} {"train_loss": -23.71210289001465, "global_step": 164215, "epoch": 1978} {"train_loss": -23.70767593383789, "global_step": 164216, "epoch": 1978} {"train_loss": -23.31855583190918, "global_step": 164217, "epoch": 1978} {"train_loss": -23.634057998657227, "global_step": 164218, "epoch": 1978} {"train_loss": -23.527376174926758, "global_step": 164219, "epoch": 1978} {"train_loss": -23.94905662536621, "global_step": 164220, "epoch": 1978} {"train_loss": -23.767166137695312, "global_step": 164221, "epoch": 1978} {"train_loss": -23.951684951782227, "global_step": 164222, "epoch": 1978} {"train_loss": -23.380844116210938, "global_step": 164223, "epoch": 1978} {"train_loss": -23.510671615600586, "global_step": 164224, "epoch": 1978} {"train_loss": -23.069950103759766, "global_step": 164225, "epoch": 1978} {"train_loss": -23.058368682861328, "global_step": 164226, "epoch": 1978} {"train_loss": -23.35008430480957, "global_step": 164227, "epoch": 1978} {"train_loss": -23.582265853881836, "global_step": 164228, "epoch": 1978} {"train_loss": -23.60288429260254, "global_step": 164229, "epoch": 1978} {"train_loss": -23.64399528503418, "global_step": 164230, "epoch": 1978} {"train_loss": -23.713659286499023, "global_step": 164231, "epoch": 1978} {"train_loss": -23.445110321044922, "global_step": 164232, "epoch": 1978} {"train_loss": -23.47940444946289, "global_step": 164233, "epoch": 1978} {"train_loss": -23.857563018798828, "global_step": 164234, "epoch": 1978} {"train_loss": -23.06195640563965, "global_step": 164235, "epoch": 1978} {"train_loss": -23.638174057006836, "global_step": 164236, "epoch": 1978} {"train_loss": -23.5832462310791, "global_step": 164237, "epoch": 1978} {"train_loss": -23.55198860168457, "global_step": 164238, "epoch": 1978} {"train_loss": -23.514707565307617, "global_step": 164239, "epoch": 1978} {"train_loss": -23.391307830810547, "global_step": 164240, "epoch": 1978} {"train_loss": -23.598608016967773, "global_step": 164241, "epoch": 1978} {"train_loss": -23.707866668701172, "global_step": 164242, "epoch": 1978} {"train_loss": -23.7188777923584, "global_step": 164243, "epoch": 1978} {"train_loss": -24.025127410888672, "global_step": 164244, "epoch": 1978} {"train_loss": -23.626922607421875, "global_step": 164245, "epoch": 1978} {"train_loss": -23.83072280883789, "global_step": 164246, "epoch": 1978} {"train_loss": -23.34469985961914, "global_step": 164247, "epoch": 1978} {"train_loss": -24.00955581665039, "global_step": 164248, "epoch": 1978} {"train_loss": -23.482696533203125, "global_step": 164249, "epoch": 1978} {"train_loss": -23.50107192993164, "global_step": 164250, "epoch": 1978} {"train_loss": -23.603269577026367, "global_step": 164251, "epoch": 1978} {"train_loss": -23.87660026550293, "global_step": 164252, "epoch": 1978} {"train_loss": -23.5107479095459, "global_step": 164253, "epoch": 1978} {"train_loss": -23.740121841430664, "global_step": 164254, "epoch": 1978} {"train_loss": -23.683935165405273, "global_step": 164255, "epoch": 1978} {"train_loss": -23.469048373670464, "global_step": 164256, "epoch": 1978, "val_loss": 6447491.0} {"train_loss": -22.473356246948242, "global_step": 164257, "epoch": 1979} {"train_loss": -22.0533504486084, "global_step": 164258, "epoch": 1979} {"train_loss": -22.84284782409668, "global_step": 164259, "epoch": 1979} {"train_loss": -22.68337059020996, "global_step": 164260, "epoch": 1979} {"train_loss": -23.082605361938477, "global_step": 164261, "epoch": 1979} {"train_loss": -22.80781364440918, "global_step": 164262, "epoch": 1979} {"train_loss": -23.52952003479004, "global_step": 164263, "epoch": 1979} {"train_loss": -23.33326530456543, "global_step": 164264, "epoch": 1979} {"train_loss": -23.29368019104004, "global_step": 164265, "epoch": 1979} {"train_loss": -22.876310348510742, "global_step": 164266, "epoch": 1979} {"train_loss": -23.07459831237793, "global_step": 164267, "epoch": 1979} {"train_loss": -22.912565231323242, "global_step": 164268, "epoch": 1979} {"train_loss": -23.237279891967773, "global_step": 164269, "epoch": 1979} {"train_loss": -23.24249839782715, "global_step": 164270, "epoch": 1979} {"train_loss": -23.570222854614258, "global_step": 164271, "epoch": 1979} {"train_loss": -22.924419403076172, "global_step": 164272, "epoch": 1979} {"train_loss": -23.40046501159668, "global_step": 164273, "epoch": 1979} {"train_loss": -23.127431869506836, "global_step": 164274, "epoch": 1979} {"train_loss": -23.222564697265625, "global_step": 164275, "epoch": 1979} {"train_loss": -23.383398056030273, "global_step": 164276, "epoch": 1979} {"train_loss": -22.984411239624023, "global_step": 164277, "epoch": 1979} {"train_loss": -23.030160903930664, "global_step": 164278, "epoch": 1979} {"train_loss": -23.153928756713867, "global_step": 164279, "epoch": 1979} {"train_loss": -23.20755958557129, "global_step": 164280, "epoch": 1979} {"train_loss": -23.253860473632812, "global_step": 164281, "epoch": 1979} {"train_loss": -23.410810470581055, "global_step": 164282, "epoch": 1979} {"train_loss": -23.67034339904785, "global_step": 164283, "epoch": 1979} {"train_loss": -23.34111976623535, "global_step": 164284, "epoch": 1979} {"train_loss": -23.4051513671875, "global_step": 164285, "epoch": 1979} {"train_loss": -23.507301330566406, "global_step": 164286, "epoch": 1979} {"train_loss": -23.41008949279785, "global_step": 164287, "epoch": 1979} {"train_loss": -23.665660858154297, "global_step": 164288, "epoch": 1979} {"train_loss": -23.57552146911621, "global_step": 164289, "epoch": 1979} {"train_loss": -23.547773361206055, "global_step": 164290, "epoch": 1979} {"train_loss": -23.66585350036621, "global_step": 164291, "epoch": 1979} {"train_loss": -23.666654586791992, "global_step": 164292, "epoch": 1979} {"train_loss": -23.504215240478516, "global_step": 164293, "epoch": 1979} {"train_loss": -23.09849739074707, "global_step": 164294, "epoch": 1979} {"train_loss": -23.545063018798828, "global_step": 164295, "epoch": 1979} {"train_loss": -23.37491226196289, "global_step": 164296, "epoch": 1979} {"train_loss": -23.570459365844727, "global_step": 164297, "epoch": 1979} {"train_loss": -23.393190383911133, "global_step": 164298, "epoch": 1979} {"train_loss": -23.531763076782227, "global_step": 164299, "epoch": 1979} {"train_loss": -23.330488204956055, "global_step": 164300, "epoch": 1979} {"train_loss": -23.578065872192383, "global_step": 164301, "epoch": 1979} {"train_loss": -23.492116928100586, "global_step": 164302, "epoch": 1979} {"train_loss": -23.854476928710938, "global_step": 164303, "epoch": 1979} {"train_loss": -23.604808807373047, "global_step": 164304, "epoch": 1979} {"train_loss": -23.569625854492188, "global_step": 164305, "epoch": 1979} {"train_loss": -23.39034080505371, "global_step": 164306, "epoch": 1979} {"train_loss": -23.84486198425293, "global_step": 164307, "epoch": 1979} {"train_loss": -23.76422691345215, "global_step": 164308, "epoch": 1979} {"train_loss": -23.711217880249023, "global_step": 164309, "epoch": 1979} {"train_loss": -23.70061683654785, "global_step": 164310, "epoch": 1979} {"train_loss": -23.447336196899414, "global_step": 164311, "epoch": 1979} {"train_loss": -23.827306747436523, "global_step": 164312, "epoch": 1979} {"train_loss": -23.37041664123535, "global_step": 164313, "epoch": 1979} {"train_loss": -23.165678024291992, "global_step": 164314, "epoch": 1979} {"train_loss": -23.93781852722168, "global_step": 164315, "epoch": 1979} {"train_loss": -23.340478897094727, "global_step": 164316, "epoch": 1979} {"train_loss": -23.514694213867188, "global_step": 164317, "epoch": 1979} {"train_loss": -23.904449462890625, "global_step": 164318, "epoch": 1979} {"train_loss": -23.796024322509766, "global_step": 164319, "epoch": 1979} {"train_loss": -24.118484497070312, "global_step": 164320, "epoch": 1979} {"train_loss": -23.818727493286133, "global_step": 164321, "epoch": 1979} {"train_loss": -23.751157760620117, "global_step": 164322, "epoch": 1979} {"train_loss": -24.018400192260742, "global_step": 164323, "epoch": 1979} {"train_loss": -23.337059020996094, "global_step": 164324, "epoch": 1979} {"train_loss": -23.694856643676758, "global_step": 164325, "epoch": 1979} {"train_loss": -23.539579391479492, "global_step": 164326, "epoch": 1979} {"train_loss": -23.25453758239746, "global_step": 164327, "epoch": 1979} {"train_loss": -23.327781677246094, "global_step": 164328, "epoch": 1979} {"train_loss": -23.5838680267334, "global_step": 164329, "epoch": 1979} {"train_loss": -23.699188232421875, "global_step": 164330, "epoch": 1979} {"train_loss": -23.431442260742188, "global_step": 164331, "epoch": 1979} {"train_loss": -23.3817138671875, "global_step": 164332, "epoch": 1979} {"train_loss": -23.433517456054688, "global_step": 164333, "epoch": 1979} {"train_loss": -23.576356887817383, "global_step": 164334, "epoch": 1979} {"train_loss": -23.702016830444336, "global_step": 164335, "epoch": 1979} {"train_loss": -23.54478645324707, "global_step": 164336, "epoch": 1979} {"train_loss": -23.727705001831055, "global_step": 164337, "epoch": 1979} {"train_loss": -23.556983947753906, "global_step": 164338, "epoch": 1979} {"train_loss": -23.425628478268543, "global_step": 164339, "epoch": 1979, "val_loss": 6435822.0} {"train_loss": -22.82771110534668, "global_step": 164340, "epoch": 1980} {"train_loss": -23.20542335510254, "global_step": 164341, "epoch": 1980} {"train_loss": -23.003496170043945, "global_step": 164342, "epoch": 1980} {"train_loss": -23.254201889038086, "global_step": 164343, "epoch": 1980} {"train_loss": -23.19074058532715, "global_step": 164344, "epoch": 1980} {"train_loss": -23.267921447753906, "global_step": 164345, "epoch": 1980} {"train_loss": -23.03496742248535, "global_step": 164346, "epoch": 1980} {"train_loss": -23.435165405273438, "global_step": 164347, "epoch": 1980} {"train_loss": -23.075763702392578, "global_step": 164348, "epoch": 1980} {"train_loss": -23.174076080322266, "global_step": 164349, "epoch": 1980} {"train_loss": -23.504789352416992, "global_step": 164350, "epoch": 1980} {"train_loss": -23.138029098510742, "global_step": 164351, "epoch": 1980} {"train_loss": -23.23603630065918, "global_step": 164352, "epoch": 1980} {"train_loss": -23.398603439331055, "global_step": 164353, "epoch": 1980} {"train_loss": -23.502487182617188, "global_step": 164354, "epoch": 1980} {"train_loss": -23.10163116455078, "global_step": 164355, "epoch": 1980} {"train_loss": -23.435911178588867, "global_step": 164356, "epoch": 1980} {"train_loss": -23.496164321899414, "global_step": 164357, "epoch": 1980} {"train_loss": -23.746530532836914, "global_step": 164358, "epoch": 1980} {"train_loss": -23.2409610748291, "global_step": 164359, "epoch": 1980} {"train_loss": -23.38189125061035, "global_step": 164360, "epoch": 1980} {"train_loss": -23.290952682495117, "global_step": 164361, "epoch": 1980} {"train_loss": -23.998788833618164, "global_step": 164362, "epoch": 1980} {"train_loss": -23.599729537963867, "global_step": 164363, "epoch": 1980} {"train_loss": -23.499908447265625, "global_step": 164364, "epoch": 1980} {"train_loss": -23.872316360473633, "global_step": 164365, "epoch": 1980} {"train_loss": -23.440092086791992, "global_step": 164366, "epoch": 1980} {"train_loss": -23.801023483276367, "global_step": 164367, "epoch": 1980} {"train_loss": -23.777542114257812, "global_step": 164368, "epoch": 1980} {"train_loss": -23.52107048034668, "global_step": 164369, "epoch": 1980} {"train_loss": -23.451505661010742, "global_step": 164370, "epoch": 1980} {"train_loss": -23.72846794128418, "global_step": 164371, "epoch": 1980} {"train_loss": -23.82391357421875, "global_step": 164372, "epoch": 1980} {"train_loss": -23.398733139038086, "global_step": 164373, "epoch": 1980} {"train_loss": -23.722986221313477, "global_step": 164374, "epoch": 1980} {"train_loss": -23.404067993164062, "global_step": 164375, "epoch": 1980} {"train_loss": -23.361278533935547, "global_step": 164376, "epoch": 1980} {"train_loss": -23.788105010986328, "global_step": 164377, "epoch": 1980} {"train_loss": -23.50443458557129, "global_step": 164378, "epoch": 1980} {"train_loss": -23.69369888305664, "global_step": 164379, "epoch": 1980} {"train_loss": -23.52988052368164, "global_step": 164380, "epoch": 1980} {"train_loss": -23.585020065307617, "global_step": 164381, "epoch": 1980} {"train_loss": -23.6643123626709, "global_step": 164382, "epoch": 1980} {"train_loss": -23.79098892211914, "global_step": 164383, "epoch": 1980} {"train_loss": -23.517681121826172, "global_step": 164384, "epoch": 1980} {"train_loss": -23.550357818603516, "global_step": 164385, "epoch": 1980} {"train_loss": -23.586570739746094, "global_step": 164386, "epoch": 1980} {"train_loss": -23.620746612548828, "global_step": 164387, "epoch": 1980} {"train_loss": -23.62834930419922, "global_step": 164388, "epoch": 1980} {"train_loss": -23.865680694580078, "global_step": 164389, "epoch": 1980} {"train_loss": -23.418071746826172, "global_step": 164390, "epoch": 1980} {"train_loss": -23.149320602416992, "global_step": 164391, "epoch": 1980} {"train_loss": -23.623044967651367, "global_step": 164392, "epoch": 1980} {"train_loss": -23.678329467773438, "global_step": 164393, "epoch": 1980} {"train_loss": -23.388347625732422, "global_step": 164394, "epoch": 1980} {"train_loss": -23.714523315429688, "global_step": 164395, "epoch": 1980} {"train_loss": -23.38649559020996, "global_step": 164396, "epoch": 1980} {"train_loss": -23.44678497314453, "global_step": 164397, "epoch": 1980} {"train_loss": -23.59174156188965, "global_step": 164398, "epoch": 1980} {"train_loss": -23.693174362182617, "global_step": 164399, "epoch": 1980} {"train_loss": -23.52853012084961, "global_step": 164400, "epoch": 1980} {"train_loss": -23.67669677734375, "global_step": 164401, "epoch": 1980} {"train_loss": -23.330398559570312, "global_step": 164402, "epoch": 1980} {"train_loss": -24.254249572753906, "global_step": 164403, "epoch": 1980} {"train_loss": -23.560230255126953, "global_step": 164404, "epoch": 1980} {"train_loss": -23.633831024169922, "global_step": 164405, "epoch": 1980} {"train_loss": -24.221723556518555, "global_step": 164406, "epoch": 1980} {"train_loss": -23.494497299194336, "global_step": 164407, "epoch": 1980} {"train_loss": -23.454360961914062, "global_step": 164408, "epoch": 1980} {"train_loss": -23.431432723999023, "global_step": 164409, "epoch": 1980} {"train_loss": -23.522897720336914, "global_step": 164410, "epoch": 1980} {"train_loss": -23.8898868560791, "global_step": 164411, "epoch": 1980} {"train_loss": -23.465938568115234, "global_step": 164412, "epoch": 1980} {"train_loss": -23.4075927734375, "global_step": 164413, "epoch": 1980} {"train_loss": -23.550445556640625, "global_step": 164414, "epoch": 1980} {"train_loss": -23.789066314697266, "global_step": 164415, "epoch": 1980} {"train_loss": -23.667724609375, "global_step": 164416, "epoch": 1980} {"train_loss": -23.80720329284668, "global_step": 164417, "epoch": 1980} {"train_loss": -23.736066818237305, "global_step": 164418, "epoch": 1980} {"train_loss": -23.774681091308594, "global_step": 164419, "epoch": 1980} {"train_loss": -23.794721603393555, "global_step": 164420, "epoch": 1980} {"train_loss": -23.851011276245117, "global_step": 164421, "epoch": 1980} {"train_loss": -23.521765053990375, "global_step": 164422, "epoch": 1980, "val_loss": 6354022.0} {"train_loss": -23.606698989868164, "global_step": 164423, "epoch": 1981} {"train_loss": -22.95595359802246, "global_step": 164424, "epoch": 1981} {"train_loss": -22.94549560546875, "global_step": 164425, "epoch": 1981} {"train_loss": -22.449949264526367, "global_step": 164426, "epoch": 1981} {"train_loss": -22.876028060913086, "global_step": 164427, "epoch": 1981} {"train_loss": -23.12269401550293, "global_step": 164428, "epoch": 1981} {"train_loss": -22.907236099243164, "global_step": 164429, "epoch": 1981} {"train_loss": -23.121381759643555, "global_step": 164430, "epoch": 1981} {"train_loss": -23.1638240814209, "global_step": 164431, "epoch": 1981} {"train_loss": -23.290210723876953, "global_step": 164432, "epoch": 1981} {"train_loss": -23.47170066833496, "global_step": 164433, "epoch": 1981} {"train_loss": -23.03708839416504, "global_step": 164434, "epoch": 1981} {"train_loss": -23.069339752197266, "global_step": 164435, "epoch": 1981} {"train_loss": -23.1282901763916, "global_step": 164436, "epoch": 1981} {"train_loss": -23.17683982849121, "global_step": 164437, "epoch": 1981} {"train_loss": -23.428211212158203, "global_step": 164438, "epoch": 1981} {"train_loss": -23.275217056274414, "global_step": 164439, "epoch": 1981} {"train_loss": -23.284292221069336, "global_step": 164440, "epoch": 1981} {"train_loss": -23.288105010986328, "global_step": 164441, "epoch": 1981} {"train_loss": -23.122034072875977, "global_step": 164442, "epoch": 1981} {"train_loss": -23.228321075439453, "global_step": 164443, "epoch": 1981} {"train_loss": -23.112424850463867, "global_step": 164444, "epoch": 1981} {"train_loss": -23.02141761779785, "global_step": 164445, "epoch": 1981} {"train_loss": -23.499622344970703, "global_step": 164446, "epoch": 1981} {"train_loss": -23.45757484436035, "global_step": 164447, "epoch": 1981} {"train_loss": -23.654804229736328, "global_step": 164448, "epoch": 1981} {"train_loss": -23.581289291381836, "global_step": 164449, "epoch": 1981} {"train_loss": -23.278146743774414, "global_step": 164450, "epoch": 1981} {"train_loss": -23.376436233520508, "global_step": 164451, "epoch": 1981} {"train_loss": -23.473770141601562, "global_step": 164452, "epoch": 1981} {"train_loss": -23.890378952026367, "global_step": 164453, "epoch": 1981} {"train_loss": -23.919225692749023, "global_step": 164454, "epoch": 1981} {"train_loss": -23.807708740234375, "global_step": 164455, "epoch": 1981} {"train_loss": -23.585285186767578, "global_step": 164456, "epoch": 1981} {"train_loss": -24.347745895385742, "global_step": 164457, "epoch": 1981} {"train_loss": -23.61838150024414, "global_step": 164458, "epoch": 1981} {"train_loss": -23.79164695739746, "global_step": 164459, "epoch": 1981} {"train_loss": -23.616024017333984, "global_step": 164460, "epoch": 1981} {"train_loss": -23.840587615966797, "global_step": 164461, "epoch": 1981} {"train_loss": -23.492233276367188, "global_step": 164462, "epoch": 1981} {"train_loss": -23.378644943237305, "global_step": 164463, "epoch": 1981} {"train_loss": -23.924209594726562, "global_step": 164464, "epoch": 1981} {"train_loss": -24.028100967407227, "global_step": 164465, "epoch": 1981} {"train_loss": -23.68031883239746, "global_step": 164466, "epoch": 1981} {"train_loss": -23.49711036682129, "global_step": 164467, "epoch": 1981} {"train_loss": -24.028966903686523, "global_step": 164468, "epoch": 1981} {"train_loss": -23.62582778930664, "global_step": 164469, "epoch": 1981} {"train_loss": -23.812597274780273, "global_step": 164470, "epoch": 1981} {"train_loss": -23.46222686767578, "global_step": 164471, "epoch": 1981} {"train_loss": -23.680370330810547, "global_step": 164472, "epoch": 1981} {"train_loss": -23.919370651245117, "global_step": 164473, "epoch": 1981} {"train_loss": -23.762792587280273, "global_step": 164474, "epoch": 1981} {"train_loss": -24.089048385620117, "global_step": 164475, "epoch": 1981} {"train_loss": -23.51328468322754, "global_step": 164476, "epoch": 1981} {"train_loss": -23.799304962158203, "global_step": 164477, "epoch": 1981} {"train_loss": -23.832443237304688, "global_step": 164478, "epoch": 1981} {"train_loss": -23.40347671508789, "global_step": 164479, "epoch": 1981} {"train_loss": -23.604673385620117, "global_step": 164480, "epoch": 1981} {"train_loss": -23.72787857055664, "global_step": 164481, "epoch": 1981} {"train_loss": -23.673254013061523, "global_step": 164482, "epoch": 1981} {"train_loss": -23.617795944213867, "global_step": 164483, "epoch": 1981} {"train_loss": -23.839059829711914, "global_step": 164484, "epoch": 1981} {"train_loss": -23.417816162109375, "global_step": 164485, "epoch": 1981} {"train_loss": -23.72617530822754, "global_step": 164486, "epoch": 1981} {"train_loss": -23.402435302734375, "global_step": 164487, "epoch": 1981} {"train_loss": -23.63338279724121, "global_step": 164488, "epoch": 1981} {"train_loss": -23.725942611694336, "global_step": 164489, "epoch": 1981} {"train_loss": -23.81328010559082, "global_step": 164490, "epoch": 1981} {"train_loss": -23.895910263061523, "global_step": 164491, "epoch": 1981} {"train_loss": -23.54715347290039, "global_step": 164492, "epoch": 1981} {"train_loss": -22.796613693237305, "global_step": 164493, "epoch": 1981} {"train_loss": -22.44175148010254, "global_step": 164494, "epoch": 1981} {"train_loss": -22.8990535736084, "global_step": 164495, "epoch": 1981} {"train_loss": -23.554908752441406, "global_step": 164496, "epoch": 1981} {"train_loss": -23.67920684814453, "global_step": 164497, "epoch": 1981} {"train_loss": -23.735769271850586, "global_step": 164498, "epoch": 1981} {"train_loss": -23.290180206298828, "global_step": 164499, "epoch": 1981} {"train_loss": -23.6488094329834, "global_step": 164500, "epoch": 1981} {"train_loss": -23.48174476623535, "global_step": 164501, "epoch": 1981} {"train_loss": -23.527610778808594, "global_step": 164502, "epoch": 1981} {"train_loss": -23.476078033447266, "global_step": 164503, "epoch": 1981} {"train_loss": -23.587207794189453, "global_step": 164504, "epoch": 1981} {"train_loss": -23.491789737379694, "global_step": 164505, "epoch": 1981, "val_loss": 6432455.5} {"train_loss": -23.16803550720215, "global_step": 164506, "epoch": 1982} {"train_loss": -22.93626594543457, "global_step": 164507, "epoch": 1982} {"train_loss": -23.49739646911621, "global_step": 164508, "epoch": 1982} {"train_loss": -23.047561645507812, "global_step": 164509, "epoch": 1982} {"train_loss": -22.680036544799805, "global_step": 164510, "epoch": 1982} {"train_loss": -23.30811882019043, "global_step": 164511, "epoch": 1982} {"train_loss": -23.080366134643555, "global_step": 164512, "epoch": 1982} {"train_loss": -23.001697540283203, "global_step": 164513, "epoch": 1982} {"train_loss": -23.01169776916504, "global_step": 164514, "epoch": 1982} {"train_loss": -22.950603485107422, "global_step": 164515, "epoch": 1982} {"train_loss": -23.147703170776367, "global_step": 164516, "epoch": 1982} {"train_loss": -23.5362491607666, "global_step": 164517, "epoch": 1982} {"train_loss": -23.207643508911133, "global_step": 164518, "epoch": 1982} {"train_loss": -23.088245391845703, "global_step": 164519, "epoch": 1982} {"train_loss": -23.431806564331055, "global_step": 164520, "epoch": 1982} {"train_loss": -23.738235473632812, "global_step": 164521, "epoch": 1982} {"train_loss": -23.1541748046875, "global_step": 164522, "epoch": 1982} {"train_loss": -23.32735252380371, "global_step": 164523, "epoch": 1982} {"train_loss": -23.62422752380371, "global_step": 164524, "epoch": 1982} {"train_loss": -23.405170440673828, "global_step": 164525, "epoch": 1982} {"train_loss": -23.53617286682129, "global_step": 164526, "epoch": 1982} {"train_loss": -23.662826538085938, "global_step": 164527, "epoch": 1982} {"train_loss": -23.571374893188477, "global_step": 164528, "epoch": 1982} {"train_loss": -23.598615646362305, "global_step": 164529, "epoch": 1982} {"train_loss": -23.25250816345215, "global_step": 164530, "epoch": 1982} {"train_loss": -23.151952743530273, "global_step": 164531, "epoch": 1982} {"train_loss": -23.331396102905273, "global_step": 164532, "epoch": 1982} {"train_loss": -23.58075523376465, "global_step": 164533, "epoch": 1982} {"train_loss": -23.2523250579834, "global_step": 164534, "epoch": 1982} {"train_loss": -23.923023223876953, "global_step": 164535, "epoch": 1982} {"train_loss": -23.6445255279541, "global_step": 164536, "epoch": 1982} {"train_loss": -23.852479934692383, "global_step": 164537, "epoch": 1982} {"train_loss": -23.567535400390625, "global_step": 164538, "epoch": 1982} {"train_loss": -23.403553009033203, "global_step": 164539, "epoch": 1982} {"train_loss": -23.700428009033203, "global_step": 164540, "epoch": 1982} {"train_loss": -23.737979888916016, "global_step": 164541, "epoch": 1982} {"train_loss": -23.598360061645508, "global_step": 164542, "epoch": 1982} {"train_loss": -23.842517852783203, "global_step": 164543, "epoch": 1982} {"train_loss": -23.985445022583008, "global_step": 164544, "epoch": 1982} {"train_loss": -23.433897018432617, "global_step": 164545, "epoch": 1982} {"train_loss": -23.339170455932617, "global_step": 164546, "epoch": 1982} {"train_loss": -23.652868270874023, "global_step": 164547, "epoch": 1982} {"train_loss": -23.435514450073242, "global_step": 164548, "epoch": 1982} {"train_loss": -23.481904983520508, "global_step": 164549, "epoch": 1982} {"train_loss": -23.39876937866211, "global_step": 164550, "epoch": 1982} {"train_loss": -23.421125411987305, "global_step": 164551, "epoch": 1982} {"train_loss": -23.278656005859375, "global_step": 164552, "epoch": 1982} {"train_loss": -23.372106552124023, "global_step": 164553, "epoch": 1982} {"train_loss": -23.868925094604492, "global_step": 164554, "epoch": 1982} {"train_loss": -23.71671485900879, "global_step": 164555, "epoch": 1982} {"train_loss": -23.788362503051758, "global_step": 164556, "epoch": 1982} {"train_loss": -23.449268341064453, "global_step": 164557, "epoch": 1982} {"train_loss": -23.730670928955078, "global_step": 164558, "epoch": 1982} {"train_loss": -23.611536026000977, "global_step": 164559, "epoch": 1982} {"train_loss": -23.873104095458984, "global_step": 164560, "epoch": 1982} {"train_loss": -23.574926376342773, "global_step": 164561, "epoch": 1982} {"train_loss": -23.552663803100586, "global_step": 164562, "epoch": 1982} {"train_loss": -23.767507553100586, "global_step": 164563, "epoch": 1982} {"train_loss": -23.63576316833496, "global_step": 164564, "epoch": 1982} {"train_loss": -23.87013053894043, "global_step": 164565, "epoch": 1982} {"train_loss": -23.713443756103516, "global_step": 164566, "epoch": 1982} {"train_loss": -23.484220504760742, "global_step": 164567, "epoch": 1982} {"train_loss": -23.62486457824707, "global_step": 164568, "epoch": 1982} {"train_loss": -23.96946144104004, "global_step": 164569, "epoch": 1982} {"train_loss": -23.842269897460938, "global_step": 164570, "epoch": 1982} {"train_loss": -23.458358764648438, "global_step": 164571, "epoch": 1982} {"train_loss": -23.927371978759766, "global_step": 164572, "epoch": 1982} {"train_loss": -23.90790367126465, "global_step": 164573, "epoch": 1982} {"train_loss": -23.61610984802246, "global_step": 164574, "epoch": 1982} {"train_loss": -23.429838180541992, "global_step": 164575, "epoch": 1982} {"train_loss": -23.612117767333984, "global_step": 164576, "epoch": 1982} {"train_loss": -23.411863327026367, "global_step": 164577, "epoch": 1982} {"train_loss": -23.49086570739746, "global_step": 164578, "epoch": 1982} {"train_loss": -23.829153060913086, "global_step": 164579, "epoch": 1982} {"train_loss": -23.584524154663086, "global_step": 164580, "epoch": 1982} {"train_loss": -23.467330932617188, "global_step": 164581, "epoch": 1982} {"train_loss": -23.85077476501465, "global_step": 164582, "epoch": 1982} {"train_loss": -23.589962005615234, "global_step": 164583, "epoch": 1982} {"train_loss": -24.22871208190918, "global_step": 164584, "epoch": 1982} {"train_loss": -23.579666137695312, "global_step": 164585, "epoch": 1982} {"train_loss": -23.688798904418945, "global_step": 164586, "epoch": 1982} {"train_loss": -23.814044952392578, "global_step": 164587, "epoch": 1982} {"train_loss": -23.538097059870342, "global_step": 164588, "epoch": 1982, "val_loss": 6393482.0} {"train_loss": -23.601171493530273, "global_step": 164589, "epoch": 1983} {"train_loss": -23.567733764648438, "global_step": 164590, "epoch": 1983} {"train_loss": -23.023700714111328, "global_step": 164591, "epoch": 1983} {"train_loss": -23.09515953063965, "global_step": 164592, "epoch": 1983} {"train_loss": -23.004018783569336, "global_step": 164593, "epoch": 1983} {"train_loss": -23.658910751342773, "global_step": 164594, "epoch": 1983} {"train_loss": -23.099660873413086, "global_step": 164595, "epoch": 1983} {"train_loss": -22.923696517944336, "global_step": 164596, "epoch": 1983} {"train_loss": -23.4791316986084, "global_step": 164597, "epoch": 1983} {"train_loss": -23.397388458251953, "global_step": 164598, "epoch": 1983} {"train_loss": -23.05400276184082, "global_step": 164599, "epoch": 1983} {"train_loss": -23.125730514526367, "global_step": 164600, "epoch": 1983} {"train_loss": -23.06302833557129, "global_step": 164601, "epoch": 1983} {"train_loss": -23.48415184020996, "global_step": 164602, "epoch": 1983} {"train_loss": -22.979122161865234, "global_step": 164603, "epoch": 1983} {"train_loss": -23.223997116088867, "global_step": 164604, "epoch": 1983} {"train_loss": -23.023618698120117, "global_step": 164605, "epoch": 1983} {"train_loss": -23.540884017944336, "global_step": 164606, "epoch": 1983} {"train_loss": -23.541107177734375, "global_step": 164607, "epoch": 1983} {"train_loss": -23.216323852539062, "global_step": 164608, "epoch": 1983} {"train_loss": -23.495595932006836, "global_step": 164609, "epoch": 1983} {"train_loss": -23.400089263916016, "global_step": 164610, "epoch": 1983} {"train_loss": -23.091938018798828, "global_step": 164611, "epoch": 1983} {"train_loss": -23.500181198120117, "global_step": 164612, "epoch": 1983} {"train_loss": -23.307580947875977, "global_step": 164613, "epoch": 1983} {"train_loss": -23.195493698120117, "global_step": 164614, "epoch": 1983} {"train_loss": -23.203052520751953, "global_step": 164615, "epoch": 1983} {"train_loss": -23.34024429321289, "global_step": 164616, "epoch": 1983} {"train_loss": -23.497879028320312, "global_step": 164617, "epoch": 1983} {"train_loss": -23.6396541595459, "global_step": 164618, "epoch": 1983} {"train_loss": -23.46590232849121, "global_step": 164619, "epoch": 1983} {"train_loss": -23.905893325805664, "global_step": 164620, "epoch": 1983} {"train_loss": -23.659191131591797, "global_step": 164621, "epoch": 1983} {"train_loss": -23.280668258666992, "global_step": 164622, "epoch": 1983} {"train_loss": -23.154434204101562, "global_step": 164623, "epoch": 1983} {"train_loss": -23.384145736694336, "global_step": 164624, "epoch": 1983} {"train_loss": -23.475194931030273, "global_step": 164625, "epoch": 1983} {"train_loss": -23.80792808532715, "global_step": 164626, "epoch": 1983} {"train_loss": -23.48116111755371, "global_step": 164627, "epoch": 1983} {"train_loss": -23.874374389648438, "global_step": 164628, "epoch": 1983} {"train_loss": -23.549564361572266, "global_step": 164629, "epoch": 1983} {"train_loss": -23.199464797973633, "global_step": 164630, "epoch": 1983} {"train_loss": -23.592548370361328, "global_step": 164631, "epoch": 1983} {"train_loss": -23.857967376708984, "global_step": 164632, "epoch": 1983} {"train_loss": -23.442062377929688, "global_step": 164633, "epoch": 1983} {"train_loss": -23.5780086517334, "global_step": 164634, "epoch": 1983} {"train_loss": -23.68848991394043, "global_step": 164635, "epoch": 1983} {"train_loss": -23.844482421875, "global_step": 164636, "epoch": 1983} {"train_loss": -23.617231369018555, "global_step": 164637, "epoch": 1983} {"train_loss": -24.109426498413086, "global_step": 164638, "epoch": 1983} {"train_loss": -23.248620986938477, "global_step": 164639, "epoch": 1983} {"train_loss": -23.318899154663086, "global_step": 164640, "epoch": 1983} {"train_loss": -23.693737030029297, "global_step": 164641, "epoch": 1983} {"train_loss": -23.80875587463379, "global_step": 164642, "epoch": 1983} {"train_loss": -23.35880470275879, "global_step": 164643, "epoch": 1983} {"train_loss": -23.96942710876465, "global_step": 164644, "epoch": 1983} {"train_loss": -23.644704818725586, "global_step": 164645, "epoch": 1983} {"train_loss": -23.61306381225586, "global_step": 164646, "epoch": 1983} {"train_loss": -23.45624351501465, "global_step": 164647, "epoch": 1983} {"train_loss": -23.656116485595703, "global_step": 164648, "epoch": 1983} {"train_loss": -23.85394287109375, "global_step": 164649, "epoch": 1983} {"train_loss": -23.571115493774414, "global_step": 164650, "epoch": 1983} {"train_loss": -23.78188133239746, "global_step": 164651, "epoch": 1983} {"train_loss": -23.570648193359375, "global_step": 164652, "epoch": 1983} {"train_loss": -23.63519287109375, "global_step": 164653, "epoch": 1983} {"train_loss": -23.442663192749023, "global_step": 164654, "epoch": 1983} {"train_loss": -23.737329483032227, "global_step": 164655, "epoch": 1983} {"train_loss": -23.518583297729492, "global_step": 164656, "epoch": 1983} {"train_loss": -23.93816566467285, "global_step": 164657, "epoch": 1983} {"train_loss": -23.487560272216797, "global_step": 164658, "epoch": 1983} {"train_loss": -23.746089935302734, "global_step": 164659, "epoch": 1983} {"train_loss": -23.922433853149414, "global_step": 164660, "epoch": 1983} {"train_loss": -23.788373947143555, "global_step": 164661, "epoch": 1983} {"train_loss": -23.45635986328125, "global_step": 164662, "epoch": 1983} {"train_loss": -23.37795066833496, "global_step": 164663, "epoch": 1983} {"train_loss": -23.770462036132812, "global_step": 164664, "epoch": 1983} {"train_loss": -23.95631980895996, "global_step": 164665, "epoch": 1983} {"train_loss": -23.787126541137695, "global_step": 164666, "epoch": 1983} {"train_loss": -23.880416870117188, "global_step": 164667, "epoch": 1983} {"train_loss": -23.543302536010742, "global_step": 164668, "epoch": 1983} {"train_loss": -23.601341247558594, "global_step": 164669, "epoch": 1983} {"train_loss": -23.593032836914062, "global_step": 164670, "epoch": 1983} {"train_loss": -23.50487380429923, "global_step": 164671, "epoch": 1983, "val_loss": 6386943.0} {"train_loss": -23.20661735534668, "global_step": 164672, "epoch": 1984} {"train_loss": -23.175512313842773, "global_step": 164673, "epoch": 1984} {"train_loss": -23.225706100463867, "global_step": 164674, "epoch": 1984} {"train_loss": -23.264755249023438, "global_step": 164675, "epoch": 1984} {"train_loss": -23.19014549255371, "global_step": 164676, "epoch": 1984} {"train_loss": -23.221864700317383, "global_step": 164677, "epoch": 1984} {"train_loss": -23.3616886138916, "global_step": 164678, "epoch": 1984} {"train_loss": -23.22243309020996, "global_step": 164679, "epoch": 1984} {"train_loss": -23.51607894897461, "global_step": 164680, "epoch": 1984} {"train_loss": -22.880720138549805, "global_step": 164681, "epoch": 1984} {"train_loss": -23.388492584228516, "global_step": 164682, "epoch": 1984} {"train_loss": -23.5533504486084, "global_step": 164683, "epoch": 1984} {"train_loss": -23.53191375732422, "global_step": 164684, "epoch": 1984} {"train_loss": -23.470108032226562, "global_step": 164685, "epoch": 1984} {"train_loss": -23.725482940673828, "global_step": 164686, "epoch": 1984} {"train_loss": -23.099685668945312, "global_step": 164687, "epoch": 1984} {"train_loss": -23.48195457458496, "global_step": 164688, "epoch": 1984} {"train_loss": -23.605710983276367, "global_step": 164689, "epoch": 1984} {"train_loss": -23.525035858154297, "global_step": 164690, "epoch": 1984} {"train_loss": -23.471298217773438, "global_step": 164691, "epoch": 1984} {"train_loss": -23.24622917175293, "global_step": 164692, "epoch": 1984} {"train_loss": -23.34907341003418, "global_step": 164693, "epoch": 1984} {"train_loss": -23.11833381652832, "global_step": 164694, "epoch": 1984} {"train_loss": -23.61092185974121, "global_step": 164695, "epoch": 1984} {"train_loss": -23.191701889038086, "global_step": 164696, "epoch": 1984} {"train_loss": -23.651460647583008, "global_step": 164697, "epoch": 1984} {"train_loss": -23.344146728515625, "global_step": 164698, "epoch": 1984} {"train_loss": -23.711118698120117, "global_step": 164699, "epoch": 1984} {"train_loss": -23.519733428955078, "global_step": 164700, "epoch": 1984} {"train_loss": -23.730085372924805, "global_step": 164701, "epoch": 1984} {"train_loss": -23.56464195251465, "global_step": 164702, "epoch": 1984} {"train_loss": -23.532278060913086, "global_step": 164703, "epoch": 1984} {"train_loss": -23.504377365112305, "global_step": 164704, "epoch": 1984} {"train_loss": -23.74222183227539, "global_step": 164705, "epoch": 1984} {"train_loss": -23.95290184020996, "global_step": 164706, "epoch": 1984} {"train_loss": -23.773752212524414, "global_step": 164707, "epoch": 1984} {"train_loss": -23.938140869140625, "global_step": 164708, "epoch": 1984} {"train_loss": -23.658559799194336, "global_step": 164709, "epoch": 1984} {"train_loss": -23.321714401245117, "global_step": 164710, "epoch": 1984} {"train_loss": -23.624317169189453, "global_step": 164711, "epoch": 1984} {"train_loss": -23.905231475830078, "global_step": 164712, "epoch": 1984} {"train_loss": -23.512939453125, "global_step": 164713, "epoch": 1984} {"train_loss": -23.770099639892578, "global_step": 164714, "epoch": 1984} {"train_loss": -23.395116806030273, "global_step": 164715, "epoch": 1984} {"train_loss": -23.60814666748047, "global_step": 164716, "epoch": 1984} {"train_loss": -23.952741622924805, "global_step": 164717, "epoch": 1984} {"train_loss": -23.94779396057129, "global_step": 164718, "epoch": 1984} {"train_loss": -23.567550659179688, "global_step": 164719, "epoch": 1984} {"train_loss": -23.425586700439453, "global_step": 164720, "epoch": 1984} {"train_loss": -23.555362701416016, "global_step": 164721, "epoch": 1984} {"train_loss": -23.614816665649414, "global_step": 164722, "epoch": 1984} {"train_loss": -23.78249168395996, "global_step": 164723, "epoch": 1984} {"train_loss": -23.55934715270996, "global_step": 164724, "epoch": 1984} {"train_loss": -23.6857967376709, "global_step": 164725, "epoch": 1984} {"train_loss": -23.61134147644043, "global_step": 164726, "epoch": 1984} {"train_loss": -23.686738967895508, "global_step": 164727, "epoch": 1984} {"train_loss": -23.600187301635742, "global_step": 164728, "epoch": 1984} {"train_loss": -23.57216453552246, "global_step": 164729, "epoch": 1984} {"train_loss": -24.000213623046875, "global_step": 164730, "epoch": 1984} {"train_loss": -23.77604103088379, "global_step": 164731, "epoch": 1984} {"train_loss": -23.592529296875, "global_step": 164732, "epoch": 1984} {"train_loss": -23.869741439819336, "global_step": 164733, "epoch": 1984} {"train_loss": -23.411136627197266, "global_step": 164734, "epoch": 1984} {"train_loss": -23.82944679260254, "global_step": 164735, "epoch": 1984} {"train_loss": -23.27277946472168, "global_step": 164736, "epoch": 1984} {"train_loss": -24.17020606994629, "global_step": 164737, "epoch": 1984} {"train_loss": -23.43186378479004, "global_step": 164738, "epoch": 1984} {"train_loss": -23.86378288269043, "global_step": 164739, "epoch": 1984} {"train_loss": -23.82390022277832, "global_step": 164740, "epoch": 1984} {"train_loss": -23.801145553588867, "global_step": 164741, "epoch": 1984} {"train_loss": -23.850820541381836, "global_step": 164742, "epoch": 1984} {"train_loss": -23.616497039794922, "global_step": 164743, "epoch": 1984} {"train_loss": -23.578466415405273, "global_step": 164744, "epoch": 1984} {"train_loss": -23.80739402770996, "global_step": 164745, "epoch": 1984} {"train_loss": -23.468753814697266, "global_step": 164746, "epoch": 1984} {"train_loss": -23.758956909179688, "global_step": 164747, "epoch": 1984} {"train_loss": -23.702468872070312, "global_step": 164748, "epoch": 1984} {"train_loss": -23.614215850830078, "global_step": 164749, "epoch": 1984} {"train_loss": -22.880762100219727, "global_step": 164750, "epoch": 1984} {"train_loss": -23.28889274597168, "global_step": 164751, "epoch": 1984} {"train_loss": -23.311246871948242, "global_step": 164752, "epoch": 1984} {"train_loss": -23.70308494567871, "global_step": 164753, "epoch": 1984} {"train_loss": -23.55116311038833, "global_step": 164754, "epoch": 1984, "val_loss": 6315743.0} {"train_loss": -23.269489288330078, "global_step": 164755, "epoch": 1985} {"train_loss": -23.0955867767334, "global_step": 164756, "epoch": 1985} {"train_loss": -23.24177360534668, "global_step": 164757, "epoch": 1985} {"train_loss": -22.99251365661621, "global_step": 164758, "epoch": 1985} {"train_loss": -23.40472984313965, "global_step": 164759, "epoch": 1985} {"train_loss": -23.10584831237793, "global_step": 164760, "epoch": 1985} {"train_loss": -23.457983016967773, "global_step": 164761, "epoch": 1985} {"train_loss": -23.37113380432129, "global_step": 164762, "epoch": 1985} {"train_loss": -23.16331672668457, "global_step": 164763, "epoch": 1985} {"train_loss": -23.174304962158203, "global_step": 164764, "epoch": 1985} {"train_loss": -22.96943473815918, "global_step": 164765, "epoch": 1985} {"train_loss": -22.95912742614746, "global_step": 164766, "epoch": 1985} {"train_loss": -23.327783584594727, "global_step": 164767, "epoch": 1985} {"train_loss": -23.16798973083496, "global_step": 164768, "epoch": 1985} {"train_loss": -23.284578323364258, "global_step": 164769, "epoch": 1985} {"train_loss": -23.336999893188477, "global_step": 164770, "epoch": 1985} {"train_loss": -23.47697639465332, "global_step": 164771, "epoch": 1985} {"train_loss": -23.228567123413086, "global_step": 164772, "epoch": 1985} {"train_loss": -23.300312042236328, "global_step": 164773, "epoch": 1985} {"train_loss": -23.4531192779541, "global_step": 164774, "epoch": 1985} {"train_loss": -22.906232833862305, "global_step": 164775, "epoch": 1985} {"train_loss": -23.522676467895508, "global_step": 164776, "epoch": 1985} {"train_loss": -23.36730194091797, "global_step": 164777, "epoch": 1985} {"train_loss": -23.317609786987305, "global_step": 164778, "epoch": 1985} {"train_loss": -23.359888076782227, "global_step": 164779, "epoch": 1985} {"train_loss": -23.39349937438965, "global_step": 164780, "epoch": 1985} {"train_loss": -23.90089225769043, "global_step": 164781, "epoch": 1985} {"train_loss": -23.750335693359375, "global_step": 164782, "epoch": 1985} {"train_loss": -23.341962814331055, "global_step": 164783, "epoch": 1985} {"train_loss": -23.35480308532715, "global_step": 164784, "epoch": 1985} {"train_loss": -23.60359764099121, "global_step": 164785, "epoch": 1985} {"train_loss": -23.45186424255371, "global_step": 164786, "epoch": 1985} {"train_loss": -23.411636352539062, "global_step": 164787, "epoch": 1985} {"train_loss": -23.427501678466797, "global_step": 164788, "epoch": 1985} {"train_loss": -23.612573623657227, "global_step": 164789, "epoch": 1985} {"train_loss": -23.667200088500977, "global_step": 164790, "epoch": 1985} {"train_loss": -23.453229904174805, "global_step": 164791, "epoch": 1985} {"train_loss": -23.430118560791016, "global_step": 164792, "epoch": 1985} {"train_loss": -23.451221466064453, "global_step": 164793, "epoch": 1985} {"train_loss": -23.91107940673828, "global_step": 164794, "epoch": 1985} {"train_loss": -23.91802978515625, "global_step": 164795, "epoch": 1985} {"train_loss": -23.44247817993164, "global_step": 164796, "epoch": 1985} {"train_loss": -23.46138572692871, "global_step": 164797, "epoch": 1985} {"train_loss": -23.47361946105957, "global_step": 164798, "epoch": 1985} {"train_loss": -23.43231773376465, "global_step": 164799, "epoch": 1985} {"train_loss": -23.489795684814453, "global_step": 164800, "epoch": 1985} {"train_loss": -23.520612716674805, "global_step": 164801, "epoch": 1985} {"train_loss": -23.85694694519043, "global_step": 164802, "epoch": 1985} {"train_loss": -23.591524124145508, "global_step": 164803, "epoch": 1985} {"train_loss": -23.643207550048828, "global_step": 164804, "epoch": 1985} {"train_loss": -23.799264907836914, "global_step": 164805, "epoch": 1985} {"train_loss": -24.079021453857422, "global_step": 164806, "epoch": 1985} {"train_loss": -23.71946144104004, "global_step": 164807, "epoch": 1985} {"train_loss": -23.39297103881836, "global_step": 164808, "epoch": 1985} {"train_loss": -23.887182235717773, "global_step": 164809, "epoch": 1985} {"train_loss": -23.65704345703125, "global_step": 164810, "epoch": 1985} {"train_loss": -24.057838439941406, "global_step": 164811, "epoch": 1985} {"train_loss": -23.688995361328125, "global_step": 164812, "epoch": 1985} {"train_loss": -23.77700424194336, "global_step": 164813, "epoch": 1985} {"train_loss": -23.842065811157227, "global_step": 164814, "epoch": 1985} {"train_loss": -23.528478622436523, "global_step": 164815, "epoch": 1985} {"train_loss": -23.639450073242188, "global_step": 164816, "epoch": 1985} {"train_loss": -23.431045532226562, "global_step": 164817, "epoch": 1985} {"train_loss": -23.69015884399414, "global_step": 164818, "epoch": 1985} {"train_loss": -23.970365524291992, "global_step": 164819, "epoch": 1985} {"train_loss": -23.697668075561523, "global_step": 164820, "epoch": 1985} {"train_loss": -23.637401580810547, "global_step": 164821, "epoch": 1985} {"train_loss": -23.809255599975586, "global_step": 164822, "epoch": 1985} {"train_loss": -23.501815795898438, "global_step": 164823, "epoch": 1985} {"train_loss": -23.860916137695312, "global_step": 164824, "epoch": 1985} {"train_loss": -23.9088077545166, "global_step": 164825, "epoch": 1985} {"train_loss": -23.630775451660156, "global_step": 164826, "epoch": 1985} {"train_loss": -23.629053115844727, "global_step": 164827, "epoch": 1985} {"train_loss": -23.236291885375977, "global_step": 164828, "epoch": 1985} {"train_loss": -24.02361488342285, "global_step": 164829, "epoch": 1985} {"train_loss": -23.500410079956055, "global_step": 164830, "epoch": 1985} {"train_loss": -23.43655776977539, "global_step": 164831, "epoch": 1985} {"train_loss": -23.67853355407715, "global_step": 164832, "epoch": 1985} {"train_loss": -23.694028854370117, "global_step": 164833, "epoch": 1985} {"train_loss": -23.3867244720459, "global_step": 164834, "epoch": 1985} {"train_loss": -23.807584762573242, "global_step": 164835, "epoch": 1985} {"train_loss": -23.61006736755371, "global_step": 164836, "epoch": 1985} {"train_loss": -23.517106159623847, "global_step": 164837, "epoch": 1985, "val_loss": 6280733.0} {"train_loss": -23.362747192382812, "global_step": 164838, "epoch": 1986} {"train_loss": -22.945985794067383, "global_step": 164839, "epoch": 1986} {"train_loss": -22.795066833496094, "global_step": 164840, "epoch": 1986} {"train_loss": -22.987201690673828, "global_step": 164841, "epoch": 1986} {"train_loss": -23.81252098083496, "global_step": 164842, "epoch": 1986} {"train_loss": -23.48309326171875, "global_step": 164843, "epoch": 1986} {"train_loss": -23.489049911499023, "global_step": 164844, "epoch": 1986} {"train_loss": -23.3188533782959, "global_step": 164845, "epoch": 1986} {"train_loss": -23.52829360961914, "global_step": 164846, "epoch": 1986} {"train_loss": -23.29278564453125, "global_step": 164847, "epoch": 1986} {"train_loss": -23.30145263671875, "global_step": 164848, "epoch": 1986} {"train_loss": -23.267148971557617, "global_step": 164849, "epoch": 1986} {"train_loss": -23.31110191345215, "global_step": 164850, "epoch": 1986} {"train_loss": -23.441425323486328, "global_step": 164851, "epoch": 1986} {"train_loss": -23.290067672729492, "global_step": 164852, "epoch": 1986} {"train_loss": -23.526153564453125, "global_step": 164853, "epoch": 1986} {"train_loss": -23.49725914001465, "global_step": 164854, "epoch": 1986} {"train_loss": -23.509265899658203, "global_step": 164855, "epoch": 1986} {"train_loss": -23.428680419921875, "global_step": 164856, "epoch": 1986} {"train_loss": -23.51798439025879, "global_step": 164857, "epoch": 1986} {"train_loss": -23.406085968017578, "global_step": 164858, "epoch": 1986} {"train_loss": -23.49622917175293, "global_step": 164859, "epoch": 1986} {"train_loss": -23.796823501586914, "global_step": 164860, "epoch": 1986} {"train_loss": -23.52018165588379, "global_step": 164861, "epoch": 1986} {"train_loss": -23.50410270690918, "global_step": 164862, "epoch": 1986} {"train_loss": -23.351648330688477, "global_step": 164863, "epoch": 1986} {"train_loss": -23.738920211791992, "global_step": 164864, "epoch": 1986} {"train_loss": -23.73990821838379, "global_step": 164865, "epoch": 1986} {"train_loss": -23.683059692382812, "global_step": 164866, "epoch": 1986} {"train_loss": -23.823957443237305, "global_step": 164867, "epoch": 1986} {"train_loss": -23.686094284057617, "global_step": 164868, "epoch": 1986} {"train_loss": -23.729148864746094, "global_step": 164869, "epoch": 1986} {"train_loss": -23.7215576171875, "global_step": 164870, "epoch": 1986} {"train_loss": -23.66126823425293, "global_step": 164871, "epoch": 1986} {"train_loss": -23.222457885742188, "global_step": 164872, "epoch": 1986} {"train_loss": -23.791440963745117, "global_step": 164873, "epoch": 1986} {"train_loss": -23.680810928344727, "global_step": 164874, "epoch": 1986} {"train_loss": -23.216949462890625, "global_step": 164875, "epoch": 1986} {"train_loss": -23.590181350708008, "global_step": 164876, "epoch": 1986} {"train_loss": -23.931411743164062, "global_step": 164877, "epoch": 1986} {"train_loss": -23.853866577148438, "global_step": 164878, "epoch": 1986} {"train_loss": -23.786035537719727, "global_step": 164879, "epoch": 1986} {"train_loss": -23.579851150512695, "global_step": 164880, "epoch": 1986} {"train_loss": -23.84116554260254, "global_step": 164881, "epoch": 1986} {"train_loss": -23.627838134765625, "global_step": 164882, "epoch": 1986} {"train_loss": -23.200586318969727, "global_step": 164883, "epoch": 1986} {"train_loss": -23.4858455657959, "global_step": 164884, "epoch": 1986} {"train_loss": -23.81631851196289, "global_step": 164885, "epoch": 1986} {"train_loss": -23.61301612854004, "global_step": 164886, "epoch": 1986} {"train_loss": -23.566083908081055, "global_step": 164887, "epoch": 1986} {"train_loss": -23.36176109313965, "global_step": 164888, "epoch": 1986} {"train_loss": -23.686431884765625, "global_step": 164889, "epoch": 1986} {"train_loss": -23.66994285583496, "global_step": 164890, "epoch": 1986} {"train_loss": -23.66969871520996, "global_step": 164891, "epoch": 1986} {"train_loss": -23.586400985717773, "global_step": 164892, "epoch": 1986} {"train_loss": -23.80499267578125, "global_step": 164893, "epoch": 1986} {"train_loss": -23.847633361816406, "global_step": 164894, "epoch": 1986} {"train_loss": -23.54140281677246, "global_step": 164895, "epoch": 1986} {"train_loss": -23.821699142456055, "global_step": 164896, "epoch": 1986} {"train_loss": -23.56369400024414, "global_step": 164897, "epoch": 1986} {"train_loss": -23.878454208374023, "global_step": 164898, "epoch": 1986} {"train_loss": -23.47281265258789, "global_step": 164899, "epoch": 1986} {"train_loss": -23.65201759338379, "global_step": 164900, "epoch": 1986} {"train_loss": -23.854394912719727, "global_step": 164901, "epoch": 1986} {"train_loss": -23.68403434753418, "global_step": 164902, "epoch": 1986} {"train_loss": -23.98093032836914, "global_step": 164903, "epoch": 1986} {"train_loss": -23.5465087890625, "global_step": 164904, "epoch": 1986} {"train_loss": -23.411033630371094, "global_step": 164905, "epoch": 1986} {"train_loss": -23.463775634765625, "global_step": 164906, "epoch": 1986} {"train_loss": -23.05144691467285, "global_step": 164907, "epoch": 1986} {"train_loss": -23.305654525756836, "global_step": 164908, "epoch": 1986} {"train_loss": -23.4729061126709, "global_step": 164909, "epoch": 1986} {"train_loss": -23.534578323364258, "global_step": 164910, "epoch": 1986} {"train_loss": -23.47511863708496, "global_step": 164911, "epoch": 1986} {"train_loss": -23.45482635498047, "global_step": 164912, "epoch": 1986} {"train_loss": -23.59751319885254, "global_step": 164913, "epoch": 1986} {"train_loss": -23.64918327331543, "global_step": 164914, "epoch": 1986} {"train_loss": -23.494298934936523, "global_step": 164915, "epoch": 1986} {"train_loss": -23.931135177612305, "global_step": 164916, "epoch": 1986} {"train_loss": -23.394668579101562, "global_step": 164917, "epoch": 1986} {"train_loss": -23.766986846923828, "global_step": 164918, "epoch": 1986} {"train_loss": -23.808250427246094, "global_step": 164919, "epoch": 1986} {"train_loss": -23.548197849687323, "global_step": 164920, "epoch": 1986, "val_loss": 6307129.5} {"train_loss": -22.506412506103516, "global_step": 164921, "epoch": 1987} {"train_loss": -22.701866149902344, "global_step": 164922, "epoch": 1987} {"train_loss": -23.25263023376465, "global_step": 164923, "epoch": 1987} {"train_loss": -22.643003463745117, "global_step": 164924, "epoch": 1987} {"train_loss": -22.35077476501465, "global_step": 164925, "epoch": 1987} {"train_loss": -22.994861602783203, "global_step": 164926, "epoch": 1987} {"train_loss": -23.02225112915039, "global_step": 164927, "epoch": 1987} {"train_loss": -22.928619384765625, "global_step": 164928, "epoch": 1987} {"train_loss": -22.75672721862793, "global_step": 164929, "epoch": 1987} {"train_loss": -22.763628005981445, "global_step": 164930, "epoch": 1987} {"train_loss": -22.786535263061523, "global_step": 164931, "epoch": 1987} {"train_loss": -23.29215431213379, "global_step": 164932, "epoch": 1987} {"train_loss": -22.897220611572266, "global_step": 164933, "epoch": 1987} {"train_loss": -22.809385299682617, "global_step": 164934, "epoch": 1987} {"train_loss": -22.981155395507812, "global_step": 164935, "epoch": 1987} {"train_loss": -23.194311141967773, "global_step": 164936, "epoch": 1987} {"train_loss": -23.15330696105957, "global_step": 164937, "epoch": 1987} {"train_loss": -23.046171188354492, "global_step": 164938, "epoch": 1987} {"train_loss": -23.340200424194336, "global_step": 164939, "epoch": 1987} {"train_loss": -23.19850730895996, "global_step": 164940, "epoch": 1987} {"train_loss": -23.486387252807617, "global_step": 164941, "epoch": 1987} {"train_loss": -23.038761138916016, "global_step": 164942, "epoch": 1987} {"train_loss": -23.758630752563477, "global_step": 164943, "epoch": 1987} {"train_loss": -23.47826385498047, "global_step": 164944, "epoch": 1987} {"train_loss": -23.170740127563477, "global_step": 164945, "epoch": 1987} {"train_loss": -23.65662384033203, "global_step": 164946, "epoch": 1987} {"train_loss": -23.18155860900879, "global_step": 164947, "epoch": 1987} {"train_loss": -23.628713607788086, "global_step": 164948, "epoch": 1987} {"train_loss": -23.28250503540039, "global_step": 164949, "epoch": 1987} {"train_loss": -23.489561080932617, "global_step": 164950, "epoch": 1987} {"train_loss": -23.668033599853516, "global_step": 164951, "epoch": 1987} {"train_loss": -23.623544692993164, "global_step": 164952, "epoch": 1987} {"train_loss": -23.70060157775879, "global_step": 164953, "epoch": 1987} {"train_loss": -23.15644073486328, "global_step": 164954, "epoch": 1987} {"train_loss": -23.2541561126709, "global_step": 164955, "epoch": 1987} {"train_loss": -23.324832916259766, "global_step": 164956, "epoch": 1987} {"train_loss": -23.49845314025879, "global_step": 164957, "epoch": 1987} {"train_loss": -23.433120727539062, "global_step": 164958, "epoch": 1987} {"train_loss": -23.884550094604492, "global_step": 164959, "epoch": 1987} {"train_loss": -23.594730377197266, "global_step": 164960, "epoch": 1987} {"train_loss": -23.221845626831055, "global_step": 164961, "epoch": 1987} {"train_loss": -23.79072380065918, "global_step": 164962, "epoch": 1987} {"train_loss": -23.758329391479492, "global_step": 164963, "epoch": 1987} {"train_loss": -23.785856246948242, "global_step": 164964, "epoch": 1987} {"train_loss": -23.92701530456543, "global_step": 164965, "epoch": 1987} {"train_loss": -23.78946304321289, "global_step": 164966, "epoch": 1987} {"train_loss": -23.65757179260254, "global_step": 164967, "epoch": 1987} {"train_loss": -23.76865005493164, "global_step": 164968, "epoch": 1987} {"train_loss": -23.585153579711914, "global_step": 164969, "epoch": 1987} {"train_loss": -23.544422149658203, "global_step": 164970, "epoch": 1987} {"train_loss": -23.82967758178711, "global_step": 164971, "epoch": 1987} {"train_loss": -23.811094284057617, "global_step": 164972, "epoch": 1987} {"train_loss": -23.558496475219727, "global_step": 164973, "epoch": 1987} {"train_loss": -23.727209091186523, "global_step": 164974, "epoch": 1987} {"train_loss": -23.82316017150879, "global_step": 164975, "epoch": 1987} {"train_loss": -23.79807472229004, "global_step": 164976, "epoch": 1987} {"train_loss": -23.56717300415039, "global_step": 164977, "epoch": 1987} {"train_loss": -23.421831130981445, "global_step": 164978, "epoch": 1987} {"train_loss": -23.16791343688965, "global_step": 164979, "epoch": 1987} {"train_loss": -23.293684005737305, "global_step": 164980, "epoch": 1987} {"train_loss": -22.59779167175293, "global_step": 164981, "epoch": 1987} {"train_loss": -23.396833419799805, "global_step": 164982, "epoch": 1987} {"train_loss": -23.700029373168945, "global_step": 164983, "epoch": 1987} {"train_loss": -23.17987060546875, "global_step": 164984, "epoch": 1987} {"train_loss": -23.53289794921875, "global_step": 164985, "epoch": 1987} {"train_loss": -23.542200088500977, "global_step": 164986, "epoch": 1987} {"train_loss": -23.219257354736328, "global_step": 164987, "epoch": 1987} {"train_loss": -23.36724281311035, "global_step": 164988, "epoch": 1987} {"train_loss": -23.30031394958496, "global_step": 164989, "epoch": 1987} {"train_loss": -23.44361686706543, "global_step": 164990, "epoch": 1987} {"train_loss": -23.318235397338867, "global_step": 164991, "epoch": 1987} {"train_loss": -23.528547286987305, "global_step": 164992, "epoch": 1987} {"train_loss": -23.853500366210938, "global_step": 164993, "epoch": 1987} {"train_loss": -23.24178123474121, "global_step": 164994, "epoch": 1987} {"train_loss": -23.398672103881836, "global_step": 164995, "epoch": 1987} {"train_loss": -23.45606803894043, "global_step": 164996, "epoch": 1987} {"train_loss": -23.45318031311035, "global_step": 164997, "epoch": 1987} {"train_loss": -23.099706649780273, "global_step": 164998, "epoch": 1987} {"train_loss": -23.963293075561523, "global_step": 164999, "epoch": 1987} {"train_loss": -23.328397750854492, "global_step": 165000, "epoch": 1987} {"train_loss": -23.788101196289062, "global_step": 165001, "epoch": 1987} {"train_loss": -23.71330451965332, "global_step": 165002, "epoch": 1987} {"train_loss": -23.38684773732381, "global_step": 165003, "epoch": 1987, "val_loss": 6350261.0} {"train_loss": -23.271604537963867, "global_step": 165004, "epoch": 1988} {"train_loss": -23.60516357421875, "global_step": 165005, "epoch": 1988} {"train_loss": -23.282381057739258, "global_step": 165006, "epoch": 1988} {"train_loss": -23.546649932861328, "global_step": 165007, "epoch": 1988} {"train_loss": -23.415388107299805, "global_step": 165008, "epoch": 1988} {"train_loss": -23.445026397705078, "global_step": 165009, "epoch": 1988} {"train_loss": -23.317441940307617, "global_step": 165010, "epoch": 1988} {"train_loss": -23.796567916870117, "global_step": 165011, "epoch": 1988} {"train_loss": -23.515295028686523, "global_step": 165012, "epoch": 1988} {"train_loss": -23.50782012939453, "global_step": 165013, "epoch": 1988} {"train_loss": -23.371429443359375, "global_step": 165014, "epoch": 1988} {"train_loss": -23.327377319335938, "global_step": 165015, "epoch": 1988} {"train_loss": -23.60858154296875, "global_step": 165016, "epoch": 1988} {"train_loss": -23.46027946472168, "global_step": 165017, "epoch": 1988} {"train_loss": -23.791770935058594, "global_step": 165018, "epoch": 1988} {"train_loss": -23.478666305541992, "global_step": 165019, "epoch": 1988} {"train_loss": -23.445175170898438, "global_step": 165020, "epoch": 1988} {"train_loss": -23.622783660888672, "global_step": 165021, "epoch": 1988} {"train_loss": -23.7924861907959, "global_step": 165022, "epoch": 1988} {"train_loss": -23.631868362426758, "global_step": 165023, "epoch": 1988} {"train_loss": -23.361713409423828, "global_step": 165024, "epoch": 1988} {"train_loss": -23.734052658081055, "global_step": 165025, "epoch": 1988} {"train_loss": -23.51224708557129, "global_step": 165026, "epoch": 1988} {"train_loss": -23.75789451599121, "global_step": 165027, "epoch": 1988} {"train_loss": -23.358861923217773, "global_step": 165028, "epoch": 1988} {"train_loss": -23.669042587280273, "global_step": 165029, "epoch": 1988} {"train_loss": -24.059736251831055, "global_step": 165030, "epoch": 1988} {"train_loss": -23.73793601989746, "global_step": 165031, "epoch": 1988} {"train_loss": -23.6859188079834, "global_step": 165032, "epoch": 1988} {"train_loss": -23.346769332885742, "global_step": 165033, "epoch": 1988} {"train_loss": -23.834993362426758, "global_step": 165034, "epoch": 1988} {"train_loss": -23.619693756103516, "global_step": 165035, "epoch": 1988} {"train_loss": -23.514204025268555, "global_step": 165036, "epoch": 1988} {"train_loss": -23.895273208618164, "global_step": 165037, "epoch": 1988} {"train_loss": -23.653520584106445, "global_step": 165038, "epoch": 1988} {"train_loss": -23.837862014770508, "global_step": 165039, "epoch": 1988} {"train_loss": -23.6004695892334, "global_step": 165040, "epoch": 1988} {"train_loss": -23.692655563354492, "global_step": 165041, "epoch": 1988} {"train_loss": -23.720365524291992, "global_step": 165042, "epoch": 1988} {"train_loss": -23.735567092895508, "global_step": 165043, "epoch": 1988} {"train_loss": -23.73275375366211, "global_step": 165044, "epoch": 1988} {"train_loss": -23.69244956970215, "global_step": 165045, "epoch": 1988} {"train_loss": -23.554319381713867, "global_step": 165046, "epoch": 1988} {"train_loss": -23.76875877380371, "global_step": 165047, "epoch": 1988} {"train_loss": -24.006977081298828, "global_step": 165048, "epoch": 1988} {"train_loss": -23.61754035949707, "global_step": 165049, "epoch": 1988} {"train_loss": -23.843280792236328, "global_step": 165050, "epoch": 1988} {"train_loss": -23.706714630126953, "global_step": 165051, "epoch": 1988} {"train_loss": -23.86553382873535, "global_step": 165052, "epoch": 1988} {"train_loss": -23.559980392456055, "global_step": 165053, "epoch": 1988} {"train_loss": -23.666168212890625, "global_step": 165054, "epoch": 1988} {"train_loss": -23.57417106628418, "global_step": 165055, "epoch": 1988} {"train_loss": -23.42197608947754, "global_step": 165056, "epoch": 1988} {"train_loss": -23.29286003112793, "global_step": 165057, "epoch": 1988} {"train_loss": -23.677839279174805, "global_step": 165058, "epoch": 1988} {"train_loss": -22.881864547729492, "global_step": 165059, "epoch": 1988} {"train_loss": -23.077177047729492, "global_step": 165060, "epoch": 1988} {"train_loss": -23.378507614135742, "global_step": 165061, "epoch": 1988} {"train_loss": -23.52509880065918, "global_step": 165062, "epoch": 1988} {"train_loss": -23.77566909790039, "global_step": 165063, "epoch": 1988} {"train_loss": -23.413129806518555, "global_step": 165064, "epoch": 1988} {"train_loss": -23.023460388183594, "global_step": 165065, "epoch": 1988} {"train_loss": -23.361713409423828, "global_step": 165066, "epoch": 1988} {"train_loss": -23.610580444335938, "global_step": 165067, "epoch": 1988} {"train_loss": -24.123525619506836, "global_step": 165068, "epoch": 1988} {"train_loss": -23.44803810119629, "global_step": 165069, "epoch": 1988} {"train_loss": -22.965723037719727, "global_step": 165070, "epoch": 1988} {"train_loss": -23.896238327026367, "global_step": 165071, "epoch": 1988} {"train_loss": -23.165990829467773, "global_step": 165072, "epoch": 1988} {"train_loss": -23.85274314880371, "global_step": 165073, "epoch": 1988} {"train_loss": -23.317174911499023, "global_step": 165074, "epoch": 1988} {"train_loss": -23.402448654174805, "global_step": 165075, "epoch": 1988} {"train_loss": -23.70779037475586, "global_step": 165076, "epoch": 1988} {"train_loss": -23.746383666992188, "global_step": 165077, "epoch": 1988} {"train_loss": -23.703916549682617, "global_step": 165078, "epoch": 1988} {"train_loss": -23.777097702026367, "global_step": 165079, "epoch": 1988} {"train_loss": -23.47754669189453, "global_step": 165080, "epoch": 1988} {"train_loss": -23.502653121948242, "global_step": 165081, "epoch": 1988} {"train_loss": -23.52931022644043, "global_step": 165082, "epoch": 1988} {"train_loss": -23.570791244506836, "global_step": 165083, "epoch": 1988} {"train_loss": -23.727426528930664, "global_step": 165084, "epoch": 1988} {"train_loss": -23.349016189575195, "global_step": 165085, "epoch": 1988} {"train_loss": -23.56158488629812, "global_step": 165086, "epoch": 1988, "val_loss": 6380357.5} {"train_loss": -23.199989318847656, "global_step": 165087, "epoch": 1989} {"train_loss": -23.107074737548828, "global_step": 165088, "epoch": 1989} {"train_loss": -23.194185256958008, "global_step": 165089, "epoch": 1989} {"train_loss": -23.84235954284668, "global_step": 165090, "epoch": 1989} {"train_loss": -22.982221603393555, "global_step": 165091, "epoch": 1989} {"train_loss": -23.173736572265625, "global_step": 165092, "epoch": 1989} {"train_loss": -23.030115127563477, "global_step": 165093, "epoch": 1989} {"train_loss": -23.16180992126465, "global_step": 165094, "epoch": 1989} {"train_loss": -23.116724014282227, "global_step": 165095, "epoch": 1989} {"train_loss": -23.208351135253906, "global_step": 165096, "epoch": 1989} {"train_loss": -23.124897003173828, "global_step": 165097, "epoch": 1989} {"train_loss": -23.08249855041504, "global_step": 165098, "epoch": 1989} {"train_loss": -23.391292572021484, "global_step": 165099, "epoch": 1989} {"train_loss": -23.46895980834961, "global_step": 165100, "epoch": 1989} {"train_loss": -23.425256729125977, "global_step": 165101, "epoch": 1989} {"train_loss": -23.257429122924805, "global_step": 165102, "epoch": 1989} {"train_loss": -23.355743408203125, "global_step": 165103, "epoch": 1989} {"train_loss": -23.55313491821289, "global_step": 165104, "epoch": 1989} {"train_loss": -23.62529945373535, "global_step": 165105, "epoch": 1989} {"train_loss": -23.562124252319336, "global_step": 165106, "epoch": 1989} {"train_loss": -23.998096466064453, "global_step": 165107, "epoch": 1989} {"train_loss": -23.279756546020508, "global_step": 165108, "epoch": 1989} {"train_loss": -23.674053192138672, "global_step": 165109, "epoch": 1989} {"train_loss": -23.466060638427734, "global_step": 165110, "epoch": 1989} {"train_loss": -23.209800720214844, "global_step": 165111, "epoch": 1989} {"train_loss": -23.486230850219727, "global_step": 165112, "epoch": 1989} {"train_loss": -22.916156768798828, "global_step": 165113, "epoch": 1989} {"train_loss": -23.29612922668457, "global_step": 165114, "epoch": 1989} {"train_loss": -23.60051155090332, "global_step": 165115, "epoch": 1989} {"train_loss": -23.470998764038086, "global_step": 165116, "epoch": 1989} {"train_loss": -23.75246238708496, "global_step": 165117, "epoch": 1989} {"train_loss": -23.421201705932617, "global_step": 165118, "epoch": 1989} {"train_loss": -23.891204833984375, "global_step": 165119, "epoch": 1989} {"train_loss": -23.691829681396484, "global_step": 165120, "epoch": 1989} {"train_loss": -23.42727279663086, "global_step": 165121, "epoch": 1989} {"train_loss": -23.48859977722168, "global_step": 165122, "epoch": 1989} {"train_loss": -23.84742546081543, "global_step": 165123, "epoch": 1989} {"train_loss": -23.874643325805664, "global_step": 165124, "epoch": 1989} {"train_loss": -23.421308517456055, "global_step": 165125, "epoch": 1989} {"train_loss": -23.494775772094727, "global_step": 165126, "epoch": 1989} {"train_loss": -23.589784622192383, "global_step": 165127, "epoch": 1989} {"train_loss": -23.721399307250977, "global_step": 165128, "epoch": 1989} {"train_loss": -23.64821434020996, "global_step": 165129, "epoch": 1989} {"train_loss": -23.588943481445312, "global_step": 165130, "epoch": 1989} {"train_loss": -23.42702293395996, "global_step": 165131, "epoch": 1989} {"train_loss": -23.368240356445312, "global_step": 165132, "epoch": 1989} {"train_loss": -23.153091430664062, "global_step": 165133, "epoch": 1989} {"train_loss": -23.40298843383789, "global_step": 165134, "epoch": 1989} {"train_loss": -23.631864547729492, "global_step": 165135, "epoch": 1989} {"train_loss": -23.55513572692871, "global_step": 165136, "epoch": 1989} {"train_loss": -23.270233154296875, "global_step": 165137, "epoch": 1989} {"train_loss": -23.525623321533203, "global_step": 165138, "epoch": 1989} {"train_loss": -23.67243194580078, "global_step": 165139, "epoch": 1989} {"train_loss": -23.569913864135742, "global_step": 165140, "epoch": 1989} {"train_loss": -23.188562393188477, "global_step": 165141, "epoch": 1989} {"train_loss": -23.770532608032227, "global_step": 165142, "epoch": 1989} {"train_loss": -23.323875427246094, "global_step": 165143, "epoch": 1989} {"train_loss": -23.484580993652344, "global_step": 165144, "epoch": 1989} {"train_loss": -23.692808151245117, "global_step": 165145, "epoch": 1989} {"train_loss": -23.637298583984375, "global_step": 165146, "epoch": 1989} {"train_loss": -23.659269332885742, "global_step": 165147, "epoch": 1989} {"train_loss": -23.709720611572266, "global_step": 165148, "epoch": 1989} {"train_loss": -23.495162963867188, "global_step": 165149, "epoch": 1989} {"train_loss": -23.6312255859375, "global_step": 165150, "epoch": 1989} {"train_loss": -23.72963523864746, "global_step": 165151, "epoch": 1989} {"train_loss": -23.231374740600586, "global_step": 165152, "epoch": 1989} {"train_loss": -23.346004486083984, "global_step": 165153, "epoch": 1989} {"train_loss": -23.410215377807617, "global_step": 165154, "epoch": 1989} {"train_loss": -23.2106990814209, "global_step": 165155, "epoch": 1989} {"train_loss": -23.194766998291016, "global_step": 165156, "epoch": 1989} {"train_loss": -23.24592399597168, "global_step": 165157, "epoch": 1989} {"train_loss": -23.56062889099121, "global_step": 165158, "epoch": 1989} {"train_loss": -23.124950408935547, "global_step": 165159, "epoch": 1989} {"train_loss": -23.56498146057129, "global_step": 165160, "epoch": 1989} {"train_loss": -23.76729393005371, "global_step": 165161, "epoch": 1989} {"train_loss": -23.7633056640625, "global_step": 165162, "epoch": 1989} {"train_loss": -23.804309844970703, "global_step": 165163, "epoch": 1989} {"train_loss": -23.432743072509766, "global_step": 165164, "epoch": 1989} {"train_loss": -23.587987899780273, "global_step": 165165, "epoch": 1989} {"train_loss": -23.76614761352539, "global_step": 165166, "epoch": 1989} {"train_loss": -23.528568267822266, "global_step": 165167, "epoch": 1989} {"train_loss": -23.922677993774414, "global_step": 165168, "epoch": 1989} {"train_loss": -23.48406908885542, "global_step": 165169, "epoch": 1989, "val_loss": 6377428.0} {"train_loss": -22.904462814331055, "global_step": 165170, "epoch": 1990} {"train_loss": -22.76055335998535, "global_step": 165171, "epoch": 1990} {"train_loss": -22.864320755004883, "global_step": 165172, "epoch": 1990} {"train_loss": -22.921918869018555, "global_step": 165173, "epoch": 1990} {"train_loss": -23.338144302368164, "global_step": 165174, "epoch": 1990} {"train_loss": -23.084278106689453, "global_step": 165175, "epoch": 1990} {"train_loss": -23.377822875976562, "global_step": 165176, "epoch": 1990} {"train_loss": -23.037607192993164, "global_step": 165177, "epoch": 1990} {"train_loss": -23.674114227294922, "global_step": 165178, "epoch": 1990} {"train_loss": -23.284473419189453, "global_step": 165179, "epoch": 1990} {"train_loss": -23.280670166015625, "global_step": 165180, "epoch": 1990} {"train_loss": -23.173364639282227, "global_step": 165181, "epoch": 1990} {"train_loss": -23.61262321472168, "global_step": 165182, "epoch": 1990} {"train_loss": -23.195514678955078, "global_step": 165183, "epoch": 1990} {"train_loss": -23.274991989135742, "global_step": 165184, "epoch": 1990} {"train_loss": -23.33504295349121, "global_step": 165185, "epoch": 1990} {"train_loss": -23.288848876953125, "global_step": 165186, "epoch": 1990} {"train_loss": -23.787691116333008, "global_step": 165187, "epoch": 1990} {"train_loss": -23.7194881439209, "global_step": 165188, "epoch": 1990} {"train_loss": -23.371917724609375, "global_step": 165189, "epoch": 1990} {"train_loss": -23.451492309570312, "global_step": 165190, "epoch": 1990} {"train_loss": -23.48834991455078, "global_step": 165191, "epoch": 1990} {"train_loss": -23.21332359313965, "global_step": 165192, "epoch": 1990} {"train_loss": -23.443387985229492, "global_step": 165193, "epoch": 1990} {"train_loss": -23.659605026245117, "global_step": 165194, "epoch": 1990} {"train_loss": -23.79557228088379, "global_step": 165195, "epoch": 1990} {"train_loss": -23.331850051879883, "global_step": 165196, "epoch": 1990} {"train_loss": -23.629430770874023, "global_step": 165197, "epoch": 1990} {"train_loss": -23.340011596679688, "global_step": 165198, "epoch": 1990} {"train_loss": -23.308073043823242, "global_step": 165199, "epoch": 1990} {"train_loss": -23.499967575073242, "global_step": 165200, "epoch": 1990} {"train_loss": -23.817514419555664, "global_step": 165201, "epoch": 1990} {"train_loss": -23.799489974975586, "global_step": 165202, "epoch": 1990} {"train_loss": -23.67232322692871, "global_step": 165203, "epoch": 1990} {"train_loss": -23.487133026123047, "global_step": 165204, "epoch": 1990} {"train_loss": -23.367856979370117, "global_step": 165205, "epoch": 1990} {"train_loss": -23.651010513305664, "global_step": 165206, "epoch": 1990} {"train_loss": -23.433340072631836, "global_step": 165207, "epoch": 1990} {"train_loss": -23.377567291259766, "global_step": 165208, "epoch": 1990} {"train_loss": -23.907567977905273, "global_step": 165209, "epoch": 1990} {"train_loss": -23.765655517578125, "global_step": 165210, "epoch": 1990} {"train_loss": -23.450054168701172, "global_step": 165211, "epoch": 1990} {"train_loss": -23.517160415649414, "global_step": 165212, "epoch": 1990} {"train_loss": -23.92205810546875, "global_step": 165213, "epoch": 1990} {"train_loss": -23.509069442749023, "global_step": 165214, "epoch": 1990} {"train_loss": -23.277042388916016, "global_step": 165215, "epoch": 1990} {"train_loss": -23.302000045776367, "global_step": 165216, "epoch": 1990} {"train_loss": -23.356992721557617, "global_step": 165217, "epoch": 1990} {"train_loss": -23.129966735839844, "global_step": 165218, "epoch": 1990} {"train_loss": -23.518075942993164, "global_step": 165219, "epoch": 1990} {"train_loss": -23.551015853881836, "global_step": 165220, "epoch": 1990} {"train_loss": -23.632314682006836, "global_step": 165221, "epoch": 1990} {"train_loss": -23.843908309936523, "global_step": 165222, "epoch": 1990} {"train_loss": -23.368404388427734, "global_step": 165223, "epoch": 1990} {"train_loss": -23.629976272583008, "global_step": 165224, "epoch": 1990} {"train_loss": -23.543033599853516, "global_step": 165225, "epoch": 1990} {"train_loss": -23.731796264648438, "global_step": 165226, "epoch": 1990} {"train_loss": -23.571239471435547, "global_step": 165227, "epoch": 1990} {"train_loss": -23.346723556518555, "global_step": 165228, "epoch": 1990} {"train_loss": -23.509845733642578, "global_step": 165229, "epoch": 1990} {"train_loss": -23.930822372436523, "global_step": 165230, "epoch": 1990} {"train_loss": -23.553604125976562, "global_step": 165231, "epoch": 1990} {"train_loss": -23.47962760925293, "global_step": 165232, "epoch": 1990} {"train_loss": -23.985891342163086, "global_step": 165233, "epoch": 1990} {"train_loss": -23.21859359741211, "global_step": 165234, "epoch": 1990} {"train_loss": -23.22344970703125, "global_step": 165235, "epoch": 1990} {"train_loss": -23.505298614501953, "global_step": 165236, "epoch": 1990} {"train_loss": -23.594003677368164, "global_step": 165237, "epoch": 1990} {"train_loss": -23.180822372436523, "global_step": 165238, "epoch": 1990} {"train_loss": -23.553220748901367, "global_step": 165239, "epoch": 1990} {"train_loss": -23.25563621520996, "global_step": 165240, "epoch": 1990} {"train_loss": -23.595449447631836, "global_step": 165241, "epoch": 1990} {"train_loss": -23.612218856811523, "global_step": 165242, "epoch": 1990} {"train_loss": -23.735097885131836, "global_step": 165243, "epoch": 1990} {"train_loss": -23.563257217407227, "global_step": 165244, "epoch": 1990} {"train_loss": -23.411964416503906, "global_step": 165245, "epoch": 1990} {"train_loss": -23.352811813354492, "global_step": 165246, "epoch": 1990} {"train_loss": -23.958209991455078, "global_step": 165247, "epoch": 1990} {"train_loss": -23.795032501220703, "global_step": 165248, "epoch": 1990} {"train_loss": -23.72871208190918, "global_step": 165249, "epoch": 1990} {"train_loss": -23.355220794677734, "global_step": 165250, "epoch": 1990} {"train_loss": -23.224956512451172, "global_step": 165251, "epoch": 1990} {"train_loss": -23.47412945850786, "global_step": 165252, "epoch": 1990, "val_loss": 6351948.5} {"train_loss": -22.64166259765625, "global_step": 165253, "epoch": 1991} {"train_loss": -23.19512939453125, "global_step": 165254, "epoch": 1991} {"train_loss": -23.099567413330078, "global_step": 165255, "epoch": 1991} {"train_loss": -23.17158317565918, "global_step": 165256, "epoch": 1991} {"train_loss": -23.205554962158203, "global_step": 165257, "epoch": 1991} {"train_loss": -23.232736587524414, "global_step": 165258, "epoch": 1991} {"train_loss": -23.1763858795166, "global_step": 165259, "epoch": 1991} {"train_loss": -23.24799346923828, "global_step": 165260, "epoch": 1991} {"train_loss": -23.164793014526367, "global_step": 165261, "epoch": 1991} {"train_loss": -23.482879638671875, "global_step": 165262, "epoch": 1991} {"train_loss": -23.354175567626953, "global_step": 165263, "epoch": 1991} {"train_loss": -23.59061050415039, "global_step": 165264, "epoch": 1991} {"train_loss": -23.517141342163086, "global_step": 165265, "epoch": 1991} {"train_loss": -23.262958526611328, "global_step": 165266, "epoch": 1991} {"train_loss": -23.5234432220459, "global_step": 165267, "epoch": 1991} {"train_loss": -23.506757736206055, "global_step": 165268, "epoch": 1991} {"train_loss": -23.58127212524414, "global_step": 165269, "epoch": 1991} {"train_loss": -23.338560104370117, "global_step": 165270, "epoch": 1991} {"train_loss": -23.46657371520996, "global_step": 165271, "epoch": 1991} {"train_loss": -23.15570831298828, "global_step": 165272, "epoch": 1991} {"train_loss": -23.511201858520508, "global_step": 165273, "epoch": 1991} {"train_loss": -23.721702575683594, "global_step": 165274, "epoch": 1991} {"train_loss": -23.576984405517578, "global_step": 165275, "epoch": 1991} {"train_loss": -23.69595718383789, "global_step": 165276, "epoch": 1991} {"train_loss": -23.780675888061523, "global_step": 165277, "epoch": 1991} {"train_loss": -23.570024490356445, "global_step": 165278, "epoch": 1991} {"train_loss": -23.670669555664062, "global_step": 165279, "epoch": 1991} {"train_loss": -23.769798278808594, "global_step": 165280, "epoch": 1991} {"train_loss": -23.64055061340332, "global_step": 165281, "epoch": 1991} {"train_loss": -23.544790267944336, "global_step": 165282, "epoch": 1991} {"train_loss": -23.91025161743164, "global_step": 165283, "epoch": 1991} {"train_loss": -23.381580352783203, "global_step": 165284, "epoch": 1991} {"train_loss": -23.241683959960938, "global_step": 165285, "epoch": 1991} {"train_loss": -23.58125877380371, "global_step": 165286, "epoch": 1991} {"train_loss": -23.78339958190918, "global_step": 165287, "epoch": 1991} {"train_loss": -24.10112190246582, "global_step": 165288, "epoch": 1991} {"train_loss": -23.89524269104004, "global_step": 165289, "epoch": 1991} {"train_loss": -23.613292694091797, "global_step": 165290, "epoch": 1991} {"train_loss": -23.813798904418945, "global_step": 165291, "epoch": 1991} {"train_loss": -23.948993682861328, "global_step": 165292, "epoch": 1991} {"train_loss": -23.464826583862305, "global_step": 165293, "epoch": 1991} {"train_loss": -23.89605712890625, "global_step": 165294, "epoch": 1991} {"train_loss": -23.782089233398438, "global_step": 165295, "epoch": 1991} {"train_loss": -23.295690536499023, "global_step": 165296, "epoch": 1991} {"train_loss": -24.209985733032227, "global_step": 165297, "epoch": 1991} {"train_loss": -23.57073974609375, "global_step": 165298, "epoch": 1991} {"train_loss": -24.13819694519043, "global_step": 165299, "epoch": 1991} {"train_loss": -23.639480590820312, "global_step": 165300, "epoch": 1991} {"train_loss": -23.611989974975586, "global_step": 165301, "epoch": 1991} {"train_loss": -23.940982818603516, "global_step": 165302, "epoch": 1991} {"train_loss": -23.89899253845215, "global_step": 165303, "epoch": 1991} {"train_loss": -23.461490631103516, "global_step": 165304, "epoch": 1991} {"train_loss": -23.860477447509766, "global_step": 165305, "epoch": 1991} {"train_loss": -23.62160301208496, "global_step": 165306, "epoch": 1991} {"train_loss": -23.835880279541016, "global_step": 165307, "epoch": 1991} {"train_loss": -23.932415008544922, "global_step": 165308, "epoch": 1991} {"train_loss": -24.07952880859375, "global_step": 165309, "epoch": 1991} {"train_loss": -23.851999282836914, "global_step": 165310, "epoch": 1991} {"train_loss": -23.625595092773438, "global_step": 165311, "epoch": 1991} {"train_loss": -23.457218170166016, "global_step": 165312, "epoch": 1991} {"train_loss": -23.683725357055664, "global_step": 165313, "epoch": 1991} {"train_loss": -23.935850143432617, "global_step": 165314, "epoch": 1991} {"train_loss": -23.716272354125977, "global_step": 165315, "epoch": 1991} {"train_loss": -23.426916122436523, "global_step": 165316, "epoch": 1991} {"train_loss": -23.50174903869629, "global_step": 165317, "epoch": 1991} {"train_loss": -24.04218101501465, "global_step": 165318, "epoch": 1991} {"train_loss": -23.4544620513916, "global_step": 165319, "epoch": 1991} {"train_loss": -23.923439025878906, "global_step": 165320, "epoch": 1991} {"train_loss": -24.03656005859375, "global_step": 165321, "epoch": 1991} {"train_loss": -23.81900405883789, "global_step": 165322, "epoch": 1991} {"train_loss": -23.51605224609375, "global_step": 165323, "epoch": 1991} {"train_loss": -23.720138549804688, "global_step": 165324, "epoch": 1991} {"train_loss": -23.325597763061523, "global_step": 165325, "epoch": 1991} {"train_loss": -23.650175094604492, "global_step": 165326, "epoch": 1991} {"train_loss": -23.289274215698242, "global_step": 165327, "epoch": 1991} {"train_loss": -23.542627334594727, "global_step": 165328, "epoch": 1991} {"train_loss": -23.70992088317871, "global_step": 165329, "epoch": 1991} {"train_loss": -23.34684181213379, "global_step": 165330, "epoch": 1991} {"train_loss": -23.68871307373047, "global_step": 165331, "epoch": 1991} {"train_loss": -23.18096923828125, "global_step": 165332, "epoch": 1991} {"train_loss": -23.499671936035156, "global_step": 165333, "epoch": 1991} {"train_loss": -23.641820907592773, "global_step": 165334, "epoch": 1991} {"train_loss": -23.58754911767431, "global_step": 165335, "epoch": 1991, "val_loss": 6355304.5} {"train_loss": -23.474716186523438, "global_step": 165336, "epoch": 1992} {"train_loss": -23.339393615722656, "global_step": 165337, "epoch": 1992} {"train_loss": -23.30487060546875, "global_step": 165338, "epoch": 1992} {"train_loss": -23.401865005493164, "global_step": 165339, "epoch": 1992} {"train_loss": -22.943185806274414, "global_step": 165340, "epoch": 1992} {"train_loss": -23.452260971069336, "global_step": 165341, "epoch": 1992} {"train_loss": -23.229162216186523, "global_step": 165342, "epoch": 1992} {"train_loss": -23.619550704956055, "global_step": 165343, "epoch": 1992} {"train_loss": -23.082489013671875, "global_step": 165344, "epoch": 1992} {"train_loss": -23.50198745727539, "global_step": 165345, "epoch": 1992} {"train_loss": -23.497148513793945, "global_step": 165346, "epoch": 1992} {"train_loss": -23.6447811126709, "global_step": 165347, "epoch": 1992} {"train_loss": -23.307748794555664, "global_step": 165348, "epoch": 1992} {"train_loss": -23.513916015625, "global_step": 165349, "epoch": 1992} {"train_loss": -23.508403778076172, "global_step": 165350, "epoch": 1992} {"train_loss": -23.462804794311523, "global_step": 165351, "epoch": 1992} {"train_loss": -23.805112838745117, "global_step": 165352, "epoch": 1992} {"train_loss": -23.252065658569336, "global_step": 165353, "epoch": 1992} {"train_loss": -23.46558952331543, "global_step": 165354, "epoch": 1992} {"train_loss": -23.4622802734375, "global_step": 165355, "epoch": 1992} {"train_loss": -23.31852149963379, "global_step": 165356, "epoch": 1992} {"train_loss": -23.822738647460938, "global_step": 165357, "epoch": 1992} {"train_loss": -23.42558479309082, "global_step": 165358, "epoch": 1992} {"train_loss": -23.89631462097168, "global_step": 165359, "epoch": 1992} {"train_loss": -23.594074249267578, "global_step": 165360, "epoch": 1992} {"train_loss": -23.585865020751953, "global_step": 165361, "epoch": 1992} {"train_loss": -23.749008178710938, "global_step": 165362, "epoch": 1992} {"train_loss": -23.714452743530273, "global_step": 165363, "epoch": 1992} {"train_loss": -23.718069076538086, "global_step": 165364, "epoch": 1992} {"train_loss": -23.69721031188965, "global_step": 165365, "epoch": 1992} {"train_loss": -23.76227569580078, "global_step": 165366, "epoch": 1992} {"train_loss": -23.67327880859375, "global_step": 165367, "epoch": 1992} {"train_loss": -23.298978805541992, "global_step": 165368, "epoch": 1992} {"train_loss": -23.73765754699707, "global_step": 165369, "epoch": 1992} {"train_loss": -23.974088668823242, "global_step": 165370, "epoch": 1992} {"train_loss": -23.67003059387207, "global_step": 165371, "epoch": 1992} {"train_loss": -23.784664154052734, "global_step": 165372, "epoch": 1992} {"train_loss": -23.832168579101562, "global_step": 165373, "epoch": 1992} {"train_loss": -24.07173728942871, "global_step": 165374, "epoch": 1992} {"train_loss": -23.620145797729492, "global_step": 165375, "epoch": 1992} {"train_loss": -23.434112548828125, "global_step": 165376, "epoch": 1992} {"train_loss": -23.859539031982422, "global_step": 165377, "epoch": 1992} {"train_loss": -23.521291732788086, "global_step": 165378, "epoch": 1992} {"train_loss": -23.213733673095703, "global_step": 165379, "epoch": 1992} {"train_loss": -23.394365310668945, "global_step": 165380, "epoch": 1992} {"train_loss": -23.245502471923828, "global_step": 165381, "epoch": 1992} {"train_loss": -23.770883560180664, "global_step": 165382, "epoch": 1992} {"train_loss": -23.735044479370117, "global_step": 165383, "epoch": 1992} {"train_loss": -23.398435592651367, "global_step": 165384, "epoch": 1992} {"train_loss": -23.35514259338379, "global_step": 165385, "epoch": 1992} {"train_loss": -23.89066505432129, "global_step": 165386, "epoch": 1992} {"train_loss": -23.81090545654297, "global_step": 165387, "epoch": 1992} {"train_loss": -23.303251266479492, "global_step": 165388, "epoch": 1992} {"train_loss": -24.019573211669922, "global_step": 165389, "epoch": 1992} {"train_loss": -23.73944854736328, "global_step": 165390, "epoch": 1992} {"train_loss": -23.611356735229492, "global_step": 165391, "epoch": 1992} {"train_loss": -23.616453170776367, "global_step": 165392, "epoch": 1992} {"train_loss": -23.548755645751953, "global_step": 165393, "epoch": 1992} {"train_loss": -23.667503356933594, "global_step": 165394, "epoch": 1992} {"train_loss": -23.471328735351562, "global_step": 165395, "epoch": 1992} {"train_loss": -23.525876998901367, "global_step": 165396, "epoch": 1992} {"train_loss": -23.721691131591797, "global_step": 165397, "epoch": 1992} {"train_loss": -23.889429092407227, "global_step": 165398, "epoch": 1992} {"train_loss": -23.498098373413086, "global_step": 165399, "epoch": 1992} {"train_loss": -23.46940040588379, "global_step": 165400, "epoch": 1992} {"train_loss": -23.636728286743164, "global_step": 165401, "epoch": 1992} {"train_loss": -23.98554039001465, "global_step": 165402, "epoch": 1992} {"train_loss": -23.72069549560547, "global_step": 165403, "epoch": 1992} {"train_loss": -23.415128707885742, "global_step": 165404, "epoch": 1992} {"train_loss": -23.597753524780273, "global_step": 165405, "epoch": 1992} {"train_loss": -23.701303482055664, "global_step": 165406, "epoch": 1992} {"train_loss": -23.62080955505371, "global_step": 165407, "epoch": 1992} {"train_loss": -23.73990249633789, "global_step": 165408, "epoch": 1992} {"train_loss": -23.636219024658203, "global_step": 165409, "epoch": 1992} {"train_loss": -23.653684616088867, "global_step": 165410, "epoch": 1992} {"train_loss": -23.743391036987305, "global_step": 165411, "epoch": 1992} {"train_loss": -23.6328067779541, "global_step": 165412, "epoch": 1992} {"train_loss": -23.716121673583984, "global_step": 165413, "epoch": 1992} {"train_loss": -23.377220153808594, "global_step": 165414, "epoch": 1992} {"train_loss": -23.43459701538086, "global_step": 165415, "epoch": 1992} {"train_loss": -23.43260955810547, "global_step": 165416, "epoch": 1992} {"train_loss": -23.535856246948242, "global_step": 165417, "epoch": 1992} {"train_loss": -23.58267632449966, "global_step": 165418, "epoch": 1992, "val_loss": 6449763.0} {"train_loss": -23.250240325927734, "global_step": 165419, "epoch": 1993} {"train_loss": -22.514822006225586, "global_step": 165420, "epoch": 1993} {"train_loss": -22.48555564880371, "global_step": 165421, "epoch": 1993} {"train_loss": -22.295616149902344, "global_step": 165422, "epoch": 1993} {"train_loss": -23.041349411010742, "global_step": 165423, "epoch": 1993} {"train_loss": -22.37025260925293, "global_step": 165424, "epoch": 1993} {"train_loss": -22.824304580688477, "global_step": 165425, "epoch": 1993} {"train_loss": -23.134572982788086, "global_step": 165426, "epoch": 1993} {"train_loss": -23.32747459411621, "global_step": 165427, "epoch": 1993} {"train_loss": -23.195819854736328, "global_step": 165428, "epoch": 1993} {"train_loss": -22.98654556274414, "global_step": 165429, "epoch": 1993} {"train_loss": -23.21927261352539, "global_step": 165430, "epoch": 1993} {"train_loss": -23.240524291992188, "global_step": 165431, "epoch": 1993} {"train_loss": -23.13751220703125, "global_step": 165432, "epoch": 1993} {"train_loss": -23.11109733581543, "global_step": 165433, "epoch": 1993} {"train_loss": -23.20694923400879, "global_step": 165434, "epoch": 1993} {"train_loss": -23.14560317993164, "global_step": 165435, "epoch": 1993} {"train_loss": -23.68605613708496, "global_step": 165436, "epoch": 1993} {"train_loss": -23.515094757080078, "global_step": 165437, "epoch": 1993} {"train_loss": -23.345264434814453, "global_step": 165438, "epoch": 1993} {"train_loss": -23.460630416870117, "global_step": 165439, "epoch": 1993} {"train_loss": -23.24436378479004, "global_step": 165440, "epoch": 1993} {"train_loss": -23.558393478393555, "global_step": 165441, "epoch": 1993} {"train_loss": -23.36322021484375, "global_step": 165442, "epoch": 1993} {"train_loss": -23.400035858154297, "global_step": 165443, "epoch": 1993} {"train_loss": -23.249652862548828, "global_step": 165444, "epoch": 1993} {"train_loss": -23.372018814086914, "global_step": 165445, "epoch": 1993} {"train_loss": -23.324657440185547, "global_step": 165446, "epoch": 1993} {"train_loss": -23.85676383972168, "global_step": 165447, "epoch": 1993} {"train_loss": -23.200746536254883, "global_step": 165448, "epoch": 1993} {"train_loss": -23.622589111328125, "global_step": 165449, "epoch": 1993} {"train_loss": -23.614273071289062, "global_step": 165450, "epoch": 1993} {"train_loss": -23.268442153930664, "global_step": 165451, "epoch": 1993} {"train_loss": -23.891143798828125, "global_step": 165452, "epoch": 1993} {"train_loss": -23.540435791015625, "global_step": 165453, "epoch": 1993} {"train_loss": -23.412221908569336, "global_step": 165454, "epoch": 1993} {"train_loss": -23.425613403320312, "global_step": 165455, "epoch": 1993} {"train_loss": -23.40015983581543, "global_step": 165456, "epoch": 1993} {"train_loss": -23.381519317626953, "global_step": 165457, "epoch": 1993} {"train_loss": -23.451988220214844, "global_step": 165458, "epoch": 1993} {"train_loss": -23.04361343383789, "global_step": 165459, "epoch": 1993} {"train_loss": -23.67072296142578, "global_step": 165460, "epoch": 1993} {"train_loss": -23.520437240600586, "global_step": 165461, "epoch": 1993} {"train_loss": -23.82244110107422, "global_step": 165462, "epoch": 1993} {"train_loss": -23.538862228393555, "global_step": 165463, "epoch": 1993} {"train_loss": -23.740283966064453, "global_step": 165464, "epoch": 1993} {"train_loss": -23.840635299682617, "global_step": 165465, "epoch": 1993} {"train_loss": -23.680418014526367, "global_step": 165466, "epoch": 1993} {"train_loss": -23.542484283447266, "global_step": 165467, "epoch": 1993} {"train_loss": -23.34092140197754, "global_step": 165468, "epoch": 1993} {"train_loss": -23.557994842529297, "global_step": 165469, "epoch": 1993} {"train_loss": -23.47816276550293, "global_step": 165470, "epoch": 1993} {"train_loss": -23.742788314819336, "global_step": 165471, "epoch": 1993} {"train_loss": -23.42805290222168, "global_step": 165472, "epoch": 1993} {"train_loss": -23.796674728393555, "global_step": 165473, "epoch": 1993} {"train_loss": -23.838275909423828, "global_step": 165474, "epoch": 1993} {"train_loss": -22.97124481201172, "global_step": 165475, "epoch": 1993} {"train_loss": -23.320194244384766, "global_step": 165476, "epoch": 1993} {"train_loss": -23.685338973999023, "global_step": 165477, "epoch": 1993} {"train_loss": -23.587570190429688, "global_step": 165478, "epoch": 1993} {"train_loss": -23.70039939880371, "global_step": 165479, "epoch": 1993} {"train_loss": -23.666112899780273, "global_step": 165480, "epoch": 1993} {"train_loss": -23.94740104675293, "global_step": 165481, "epoch": 1993} {"train_loss": -23.585071563720703, "global_step": 165482, "epoch": 1993} {"train_loss": -23.338932037353516, "global_step": 165483, "epoch": 1993} {"train_loss": -23.949356079101562, "global_step": 165484, "epoch": 1993} {"train_loss": -24.05948257446289, "global_step": 165485, "epoch": 1993} {"train_loss": -23.67464828491211, "global_step": 165486, "epoch": 1993} {"train_loss": -23.884227752685547, "global_step": 165487, "epoch": 1993} {"train_loss": -23.566455841064453, "global_step": 165488, "epoch": 1993} {"train_loss": -23.983304977416992, "global_step": 165489, "epoch": 1993} {"train_loss": -23.608718872070312, "global_step": 165490, "epoch": 1993} {"train_loss": -23.736303329467773, "global_step": 165491, "epoch": 1993} {"train_loss": -23.648908615112305, "global_step": 165492, "epoch": 1993} {"train_loss": -23.41537094116211, "global_step": 165493, "epoch": 1993} {"train_loss": -23.70955467224121, "global_step": 165494, "epoch": 1993} {"train_loss": -23.445741653442383, "global_step": 165495, "epoch": 1993} {"train_loss": -23.600662231445312, "global_step": 165496, "epoch": 1993} {"train_loss": -23.690832138061523, "global_step": 165497, "epoch": 1993} {"train_loss": -23.430295944213867, "global_step": 165498, "epoch": 1993} {"train_loss": -23.2441463470459, "global_step": 165499, "epoch": 1993} {"train_loss": -23.836545944213867, "global_step": 165500, "epoch": 1993} {"train_loss": -23.435301102787616, "global_step": 165501, "epoch": 1993, "val_loss": 6327099.5} {"train_loss": -22.91706657409668, "global_step": 165502, "epoch": 1994} {"train_loss": -23.388288497924805, "global_step": 165503, "epoch": 1994} {"train_loss": -23.315532684326172, "global_step": 165504, "epoch": 1994} {"train_loss": -22.82523536682129, "global_step": 165505, "epoch": 1994} {"train_loss": -23.267881393432617, "global_step": 165506, "epoch": 1994} {"train_loss": -23.265018463134766, "global_step": 165507, "epoch": 1994} {"train_loss": -23.65375518798828, "global_step": 165508, "epoch": 1994} {"train_loss": -23.013748168945312, "global_step": 165509, "epoch": 1994} {"train_loss": -23.546974182128906, "global_step": 165510, "epoch": 1994} {"train_loss": -23.532194137573242, "global_step": 165511, "epoch": 1994} {"train_loss": -23.088171005249023, "global_step": 165512, "epoch": 1994} {"train_loss": -23.31251335144043, "global_step": 165513, "epoch": 1994} {"train_loss": -23.459409713745117, "global_step": 165514, "epoch": 1994} {"train_loss": -23.601856231689453, "global_step": 165515, "epoch": 1994} {"train_loss": -23.388452529907227, "global_step": 165516, "epoch": 1994} {"train_loss": -23.61216163635254, "global_step": 165517, "epoch": 1994} {"train_loss": -23.464624404907227, "global_step": 165518, "epoch": 1994} {"train_loss": -23.399011611938477, "global_step": 165519, "epoch": 1994} {"train_loss": -23.947128295898438, "global_step": 165520, "epoch": 1994} {"train_loss": -22.983591079711914, "global_step": 165521, "epoch": 1994} {"train_loss": -23.71702003479004, "global_step": 165522, "epoch": 1994} {"train_loss": -23.424434661865234, "global_step": 165523, "epoch": 1994} {"train_loss": -23.635534286499023, "global_step": 165524, "epoch": 1994} {"train_loss": -23.374094009399414, "global_step": 165525, "epoch": 1994} {"train_loss": -23.491971969604492, "global_step": 165526, "epoch": 1994} {"train_loss": -23.53925895690918, "global_step": 165527, "epoch": 1994} {"train_loss": -23.584651947021484, "global_step": 165528, "epoch": 1994} {"train_loss": -23.377355575561523, "global_step": 165529, "epoch": 1994} {"train_loss": -23.52190589904785, "global_step": 165530, "epoch": 1994} {"train_loss": -23.6683349609375, "global_step": 165531, "epoch": 1994} {"train_loss": -23.32853889465332, "global_step": 165532, "epoch": 1994} {"train_loss": -23.62005043029785, "global_step": 165533, "epoch": 1994} {"train_loss": -23.34749412536621, "global_step": 165534, "epoch": 1994} {"train_loss": -23.803874969482422, "global_step": 165535, "epoch": 1994} {"train_loss": -23.65053367614746, "global_step": 165536, "epoch": 1994} {"train_loss": -23.437198638916016, "global_step": 165537, "epoch": 1994} {"train_loss": -23.54603385925293, "global_step": 165538, "epoch": 1994} {"train_loss": -23.412153244018555, "global_step": 165539, "epoch": 1994} {"train_loss": -23.5142822265625, "global_step": 165540, "epoch": 1994} {"train_loss": -23.47583770751953, "global_step": 165541, "epoch": 1994} {"train_loss": -23.33700942993164, "global_step": 165542, "epoch": 1994} {"train_loss": -23.75628089904785, "global_step": 165543, "epoch": 1994} {"train_loss": -23.676328659057617, "global_step": 165544, "epoch": 1994} {"train_loss": -23.634265899658203, "global_step": 165545, "epoch": 1994} {"train_loss": -23.765274047851562, "global_step": 165546, "epoch": 1994} {"train_loss": -23.3605899810791, "global_step": 165547, "epoch": 1994} {"train_loss": -23.506834030151367, "global_step": 165548, "epoch": 1994} {"train_loss": -23.83350944519043, "global_step": 165549, "epoch": 1994} {"train_loss": -23.894346237182617, "global_step": 165550, "epoch": 1994} {"train_loss": -23.8718204498291, "global_step": 165551, "epoch": 1994} {"train_loss": -23.520130157470703, "global_step": 165552, "epoch": 1994} {"train_loss": -23.335966110229492, "global_step": 165553, "epoch": 1994} {"train_loss": -23.75637435913086, "global_step": 165554, "epoch": 1994} {"train_loss": -23.494312286376953, "global_step": 165555, "epoch": 1994} {"train_loss": -23.542814254760742, "global_step": 165556, "epoch": 1994} {"train_loss": -23.26581382751465, "global_step": 165557, "epoch": 1994} {"train_loss": -23.68996238708496, "global_step": 165558, "epoch": 1994} {"train_loss": -23.610042572021484, "global_step": 165559, "epoch": 1994} {"train_loss": -23.379989624023438, "global_step": 165560, "epoch": 1994} {"train_loss": -23.939640045166016, "global_step": 165561, "epoch": 1994} {"train_loss": -23.424591064453125, "global_step": 165562, "epoch": 1994} {"train_loss": -24.047531127929688, "global_step": 165563, "epoch": 1994} {"train_loss": -23.86849594116211, "global_step": 165564, "epoch": 1994} {"train_loss": -23.728790283203125, "global_step": 165565, "epoch": 1994} {"train_loss": -23.189836502075195, "global_step": 165566, "epoch": 1994} {"train_loss": -23.80841827392578, "global_step": 165567, "epoch": 1994} {"train_loss": -23.740341186523438, "global_step": 165568, "epoch": 1994} {"train_loss": -23.245437622070312, "global_step": 165569, "epoch": 1994} {"train_loss": -23.50033187866211, "global_step": 165570, "epoch": 1994} {"train_loss": -23.498685836791992, "global_step": 165571, "epoch": 1994} {"train_loss": -23.6477108001709, "global_step": 165572, "epoch": 1994} {"train_loss": -23.74073600769043, "global_step": 165573, "epoch": 1994} {"train_loss": -23.46143913269043, "global_step": 165574, "epoch": 1994} {"train_loss": -23.342971801757812, "global_step": 165575, "epoch": 1994} {"train_loss": -23.43429946899414, "global_step": 165576, "epoch": 1994} {"train_loss": -23.77198028564453, "global_step": 165577, "epoch": 1994} {"train_loss": -23.377872467041016, "global_step": 165578, "epoch": 1994} {"train_loss": -23.41947364807129, "global_step": 165579, "epoch": 1994} {"train_loss": -23.371551513671875, "global_step": 165580, "epoch": 1994} {"train_loss": -24.113183975219727, "global_step": 165581, "epoch": 1994} {"train_loss": -23.321142196655273, "global_step": 165582, "epoch": 1994} {"train_loss": -23.41112518310547, "global_step": 165583, "epoch": 1994} {"train_loss": -23.498418853943605, "global_step": 165584, "epoch": 1994, "val_loss": 6361386.0} {"train_loss": -23.222158432006836, "global_step": 165585, "epoch": 1995} {"train_loss": -23.35291862487793, "global_step": 165586, "epoch": 1995} {"train_loss": -23.375038146972656, "global_step": 165587, "epoch": 1995} {"train_loss": -23.13316535949707, "global_step": 165588, "epoch": 1995} {"train_loss": -23.25556755065918, "global_step": 165589, "epoch": 1995} {"train_loss": -23.340576171875, "global_step": 165590, "epoch": 1995} {"train_loss": -23.037879943847656, "global_step": 165591, "epoch": 1995} {"train_loss": -23.06704330444336, "global_step": 165592, "epoch": 1995} {"train_loss": -23.489336013793945, "global_step": 165593, "epoch": 1995} {"train_loss": -23.335142135620117, "global_step": 165594, "epoch": 1995} {"train_loss": -23.31401824951172, "global_step": 165595, "epoch": 1995} {"train_loss": -23.1152286529541, "global_step": 165596, "epoch": 1995} {"train_loss": -23.346097946166992, "global_step": 165597, "epoch": 1995} {"train_loss": -23.609140396118164, "global_step": 165598, "epoch": 1995} {"train_loss": -23.604948043823242, "global_step": 165599, "epoch": 1995} {"train_loss": -23.364734649658203, "global_step": 165600, "epoch": 1995} {"train_loss": -23.733036041259766, "global_step": 165601, "epoch": 1995} {"train_loss": -23.32404899597168, "global_step": 165602, "epoch": 1995} {"train_loss": -23.365903854370117, "global_step": 165603, "epoch": 1995} {"train_loss": -23.47682762145996, "global_step": 165604, "epoch": 1995} {"train_loss": -23.197072982788086, "global_step": 165605, "epoch": 1995} {"train_loss": -23.255659103393555, "global_step": 165606, "epoch": 1995} {"train_loss": -23.226463317871094, "global_step": 165607, "epoch": 1995} {"train_loss": -23.45853042602539, "global_step": 165608, "epoch": 1995} {"train_loss": -23.633586883544922, "global_step": 165609, "epoch": 1995} {"train_loss": -23.3762264251709, "global_step": 165610, "epoch": 1995} {"train_loss": -23.332460403442383, "global_step": 165611, "epoch": 1995} {"train_loss": -23.49048614501953, "global_step": 165612, "epoch": 1995} {"train_loss": -23.25519371032715, "global_step": 165613, "epoch": 1995} {"train_loss": -23.379898071289062, "global_step": 165614, "epoch": 1995} {"train_loss": -23.789093017578125, "global_step": 165615, "epoch": 1995} {"train_loss": -23.38630485534668, "global_step": 165616, "epoch": 1995} {"train_loss": -23.89535140991211, "global_step": 165617, "epoch": 1995} {"train_loss": -23.74388885498047, "global_step": 165618, "epoch": 1995} {"train_loss": -23.26102638244629, "global_step": 165619, "epoch": 1995} {"train_loss": -23.446378707885742, "global_step": 165620, "epoch": 1995} {"train_loss": -23.555959701538086, "global_step": 165621, "epoch": 1995} {"train_loss": -23.78718376159668, "global_step": 165622, "epoch": 1995} {"train_loss": -23.879165649414062, "global_step": 165623, "epoch": 1995} {"train_loss": -23.634628295898438, "global_step": 165624, "epoch": 1995} {"train_loss": -23.838918685913086, "global_step": 165625, "epoch": 1995} {"train_loss": -23.702075958251953, "global_step": 165626, "epoch": 1995} {"train_loss": -23.760915756225586, "global_step": 165627, "epoch": 1995} {"train_loss": -23.659772872924805, "global_step": 165628, "epoch": 1995} {"train_loss": -23.607511520385742, "global_step": 165629, "epoch": 1995} {"train_loss": -23.392292022705078, "global_step": 165630, "epoch": 1995} {"train_loss": -23.82925796508789, "global_step": 165631, "epoch": 1995} {"train_loss": -23.9561824798584, "global_step": 165632, "epoch": 1995} {"train_loss": -23.483325958251953, "global_step": 165633, "epoch": 1995} {"train_loss": -23.669998168945312, "global_step": 165634, "epoch": 1995} {"train_loss": -23.061140060424805, "global_step": 165635, "epoch": 1995} {"train_loss": -23.472341537475586, "global_step": 165636, "epoch": 1995} {"train_loss": -23.542213439941406, "global_step": 165637, "epoch": 1995} {"train_loss": -23.473766326904297, "global_step": 165638, "epoch": 1995} {"train_loss": -23.262969970703125, "global_step": 165639, "epoch": 1995} {"train_loss": -23.114402770996094, "global_step": 165640, "epoch": 1995} {"train_loss": -23.68500328063965, "global_step": 165641, "epoch": 1995} {"train_loss": -23.627050399780273, "global_step": 165642, "epoch": 1995} {"train_loss": -23.337827682495117, "global_step": 165643, "epoch": 1995} {"train_loss": -23.48993682861328, "global_step": 165644, "epoch": 1995} {"train_loss": -23.91615104675293, "global_step": 165645, "epoch": 1995} {"train_loss": -23.67226791381836, "global_step": 165646, "epoch": 1995} {"train_loss": -23.550146102905273, "global_step": 165647, "epoch": 1995} {"train_loss": -23.640684127807617, "global_step": 165648, "epoch": 1995} {"train_loss": -23.76708221435547, "global_step": 165649, "epoch": 1995} {"train_loss": -23.642520904541016, "global_step": 165650, "epoch": 1995} {"train_loss": -23.273527145385742, "global_step": 165651, "epoch": 1995} {"train_loss": -23.44992446899414, "global_step": 165652, "epoch": 1995} {"train_loss": -23.550390243530273, "global_step": 165653, "epoch": 1995} {"train_loss": -23.658798217773438, "global_step": 165654, "epoch": 1995} {"train_loss": -23.80633544921875, "global_step": 165655, "epoch": 1995} {"train_loss": -23.706226348876953, "global_step": 165656, "epoch": 1995} {"train_loss": -23.446136474609375, "global_step": 165657, "epoch": 1995} {"train_loss": -23.51313591003418, "global_step": 165658, "epoch": 1995} {"train_loss": -23.770816802978516, "global_step": 165659, "epoch": 1995} {"train_loss": -23.502439498901367, "global_step": 165660, "epoch": 1995} {"train_loss": -23.614431381225586, "global_step": 165661, "epoch": 1995} {"train_loss": -23.71480369567871, "global_step": 165662, "epoch": 1995} {"train_loss": -23.482572555541992, "global_step": 165663, "epoch": 1995} {"train_loss": -23.453350067138672, "global_step": 165664, "epoch": 1995} {"train_loss": -23.331106185913086, "global_step": 165665, "epoch": 1995} {"train_loss": -23.394502639770508, "global_step": 165666, "epoch": 1995} {"train_loss": -23.499608556908296, "global_step": 165667, "epoch": 1995, "val_loss": 6360613.0} {"train_loss": -23.302616119384766, "global_step": 165668, "epoch": 1996} {"train_loss": -22.79645347595215, "global_step": 165669, "epoch": 1996} {"train_loss": -23.074155807495117, "global_step": 165670, "epoch": 1996} {"train_loss": -23.934545516967773, "global_step": 165671, "epoch": 1996} {"train_loss": -23.139644622802734, "global_step": 165672, "epoch": 1996} {"train_loss": -23.167476654052734, "global_step": 165673, "epoch": 1996} {"train_loss": -23.33155632019043, "global_step": 165674, "epoch": 1996} {"train_loss": -23.43523406982422, "global_step": 165675, "epoch": 1996} {"train_loss": -23.367828369140625, "global_step": 165676, "epoch": 1996} {"train_loss": -23.37534523010254, "global_step": 165677, "epoch": 1996} {"train_loss": -23.170982360839844, "global_step": 165678, "epoch": 1996} {"train_loss": -23.47574806213379, "global_step": 165679, "epoch": 1996} {"train_loss": -23.43460464477539, "global_step": 165680, "epoch": 1996} {"train_loss": -23.469268798828125, "global_step": 165681, "epoch": 1996} {"train_loss": -23.591306686401367, "global_step": 165682, "epoch": 1996} {"train_loss": -23.618825912475586, "global_step": 165683, "epoch": 1996} {"train_loss": -23.136850357055664, "global_step": 165684, "epoch": 1996} {"train_loss": -23.4377498626709, "global_step": 165685, "epoch": 1996} {"train_loss": -23.498748779296875, "global_step": 165686, "epoch": 1996} {"train_loss": -23.859468460083008, "global_step": 165687, "epoch": 1996} {"train_loss": -23.39065933227539, "global_step": 165688, "epoch": 1996} {"train_loss": -23.98708724975586, "global_step": 165689, "epoch": 1996} {"train_loss": -23.799341201782227, "global_step": 165690, "epoch": 1996} {"train_loss": -23.57941246032715, "global_step": 165691, "epoch": 1996} {"train_loss": -23.880056381225586, "global_step": 165692, "epoch": 1996} {"train_loss": -23.98703384399414, "global_step": 165693, "epoch": 1996} {"train_loss": -23.510927200317383, "global_step": 165694, "epoch": 1996} {"train_loss": -23.56758689880371, "global_step": 165695, "epoch": 1996} {"train_loss": -23.594837188720703, "global_step": 165696, "epoch": 1996} {"train_loss": -23.479116439819336, "global_step": 165697, "epoch": 1996} {"train_loss": -23.759084701538086, "global_step": 165698, "epoch": 1996} {"train_loss": -23.43353843688965, "global_step": 165699, "epoch": 1996} {"train_loss": -23.528039932250977, "global_step": 165700, "epoch": 1996} {"train_loss": -23.834217071533203, "global_step": 165701, "epoch": 1996} {"train_loss": -23.535802841186523, "global_step": 165702, "epoch": 1996} {"train_loss": -24.174293518066406, "global_step": 165703, "epoch": 1996} {"train_loss": -23.885780334472656, "global_step": 165704, "epoch": 1996} {"train_loss": -23.445714950561523, "global_step": 165705, "epoch": 1996} {"train_loss": -23.57208824157715, "global_step": 165706, "epoch": 1996} {"train_loss": -23.58060646057129, "global_step": 165707, "epoch": 1996} {"train_loss": -23.07723617553711, "global_step": 165708, "epoch": 1996} {"train_loss": -23.734317779541016, "global_step": 165709, "epoch": 1996} {"train_loss": -23.574810028076172, "global_step": 165710, "epoch": 1996} {"train_loss": -23.4079532623291, "global_step": 165711, "epoch": 1996} {"train_loss": -23.49371910095215, "global_step": 165712, "epoch": 1996} {"train_loss": -23.528715133666992, "global_step": 165713, "epoch": 1996} {"train_loss": -23.52907371520996, "global_step": 165714, "epoch": 1996} {"train_loss": -23.575796127319336, "global_step": 165715, "epoch": 1996} {"train_loss": -23.30312156677246, "global_step": 165716, "epoch": 1996} {"train_loss": -23.58118438720703, "global_step": 165717, "epoch": 1996} {"train_loss": -24.017627716064453, "global_step": 165718, "epoch": 1996} {"train_loss": -23.440011978149414, "global_step": 165719, "epoch": 1996} {"train_loss": -23.595611572265625, "global_step": 165720, "epoch": 1996} {"train_loss": -23.61320686340332, "global_step": 165721, "epoch": 1996} {"train_loss": -23.626129150390625, "global_step": 165722, "epoch": 1996} {"train_loss": -23.545682907104492, "global_step": 165723, "epoch": 1996} {"train_loss": -23.927698135375977, "global_step": 165724, "epoch": 1996} {"train_loss": -23.77615737915039, "global_step": 165725, "epoch": 1996} {"train_loss": -23.8990535736084, "global_step": 165726, "epoch": 1996} {"train_loss": -23.774799346923828, "global_step": 165727, "epoch": 1996} {"train_loss": -23.8749942779541, "global_step": 165728, "epoch": 1996} {"train_loss": -23.58589744567871, "global_step": 165729, "epoch": 1996} {"train_loss": -23.71229362487793, "global_step": 165730, "epoch": 1996} {"train_loss": -23.49086570739746, "global_step": 165731, "epoch": 1996} {"train_loss": -23.649965286254883, "global_step": 165732, "epoch": 1996} {"train_loss": -23.656705856323242, "global_step": 165733, "epoch": 1996} {"train_loss": -23.77228355407715, "global_step": 165734, "epoch": 1996} {"train_loss": -23.878705978393555, "global_step": 165735, "epoch": 1996} {"train_loss": -23.616943359375, "global_step": 165736, "epoch": 1996} {"train_loss": -23.894582748413086, "global_step": 165737, "epoch": 1996} {"train_loss": -23.93985366821289, "global_step": 165738, "epoch": 1996} {"train_loss": -24.154869079589844, "global_step": 165739, "epoch": 1996} {"train_loss": -23.861440658569336, "global_step": 165740, "epoch": 1996} {"train_loss": -23.831357955932617, "global_step": 165741, "epoch": 1996} {"train_loss": -23.667804718017578, "global_step": 165742, "epoch": 1996} {"train_loss": -23.604764938354492, "global_step": 165743, "epoch": 1996} {"train_loss": -23.33246421813965, "global_step": 165744, "epoch": 1996} {"train_loss": -23.584819793701172, "global_step": 165745, "epoch": 1996} {"train_loss": -24.115318298339844, "global_step": 165746, "epoch": 1996} {"train_loss": -24.137109756469727, "global_step": 165747, "epoch": 1996} {"train_loss": -23.359270095825195, "global_step": 165748, "epoch": 1996} {"train_loss": -24.123640060424805, "global_step": 165749, "epoch": 1996} {"train_loss": -23.620880816356244, "global_step": 165750, "epoch": 1996, "val_loss": 6368340.0} {"train_loss": -23.36575698852539, "global_step": 165751, "epoch": 1997} {"train_loss": -23.640344619750977, "global_step": 165752, "epoch": 1997} {"train_loss": -23.09793472290039, "global_step": 165753, "epoch": 1997} {"train_loss": -23.17616081237793, "global_step": 165754, "epoch": 1997} {"train_loss": -23.249711990356445, "global_step": 165755, "epoch": 1997} {"train_loss": -23.38446617126465, "global_step": 165756, "epoch": 1997} {"train_loss": -23.109394073486328, "global_step": 165757, "epoch": 1997} {"train_loss": -23.432403564453125, "global_step": 165758, "epoch": 1997} {"train_loss": -23.671092987060547, "global_step": 165759, "epoch": 1997} {"train_loss": -23.171361923217773, "global_step": 165760, "epoch": 1997} {"train_loss": -23.124603271484375, "global_step": 165761, "epoch": 1997} {"train_loss": -23.2503604888916, "global_step": 165762, "epoch": 1997} {"train_loss": -23.265817642211914, "global_step": 165763, "epoch": 1997} {"train_loss": -23.205917358398438, "global_step": 165764, "epoch": 1997} {"train_loss": -23.454416275024414, "global_step": 165765, "epoch": 1997} {"train_loss": -23.13218116760254, "global_step": 165766, "epoch": 1997} {"train_loss": -23.357852935791016, "global_step": 165767, "epoch": 1997} {"train_loss": -23.053735733032227, "global_step": 165768, "epoch": 1997} {"train_loss": -23.69105339050293, "global_step": 165769, "epoch": 1997} {"train_loss": -23.15757179260254, "global_step": 165770, "epoch": 1997} {"train_loss": -23.447784423828125, "global_step": 165771, "epoch": 1997} {"train_loss": -23.63092803955078, "global_step": 165772, "epoch": 1997} {"train_loss": -23.444995880126953, "global_step": 165773, "epoch": 1997} {"train_loss": -23.554468154907227, "global_step": 165774, "epoch": 1997} {"train_loss": -23.62322998046875, "global_step": 165775, "epoch": 1997} {"train_loss": -23.706586837768555, "global_step": 165776, "epoch": 1997} {"train_loss": -23.30140495300293, "global_step": 165777, "epoch": 1997} {"train_loss": -23.594316482543945, "global_step": 165778, "epoch": 1997} {"train_loss": -23.64082145690918, "global_step": 165779, "epoch": 1997} {"train_loss": -23.49051856994629, "global_step": 165780, "epoch": 1997} {"train_loss": -23.332637786865234, "global_step": 165781, "epoch": 1997} {"train_loss": -23.589902877807617, "global_step": 165782, "epoch": 1997} {"train_loss": -23.763839721679688, "global_step": 165783, "epoch": 1997} {"train_loss": -23.700790405273438, "global_step": 165784, "epoch": 1997} {"train_loss": -23.881732940673828, "global_step": 165785, "epoch": 1997} {"train_loss": -23.826345443725586, "global_step": 165786, "epoch": 1997} {"train_loss": -23.78563690185547, "global_step": 165787, "epoch": 1997} {"train_loss": -23.633264541625977, "global_step": 165788, "epoch": 1997} {"train_loss": -23.43035316467285, "global_step": 165789, "epoch": 1997} {"train_loss": -23.700239181518555, "global_step": 165790, "epoch": 1997} {"train_loss": -23.772184371948242, "global_step": 165791, "epoch": 1997} {"train_loss": -23.990468978881836, "global_step": 165792, "epoch": 1997} {"train_loss": -23.56777572631836, "global_step": 165793, "epoch": 1997} {"train_loss": -23.842472076416016, "global_step": 165794, "epoch": 1997} {"train_loss": -23.780607223510742, "global_step": 165795, "epoch": 1997} {"train_loss": -23.341577529907227, "global_step": 165796, "epoch": 1997} {"train_loss": -23.390869140625, "global_step": 165797, "epoch": 1997} {"train_loss": -23.576770782470703, "global_step": 165798, "epoch": 1997} {"train_loss": -23.121644973754883, "global_step": 165799, "epoch": 1997} {"train_loss": -23.713476181030273, "global_step": 165800, "epoch": 1997} {"train_loss": -23.73554039001465, "global_step": 165801, "epoch": 1997} {"train_loss": -23.473045349121094, "global_step": 165802, "epoch": 1997} {"train_loss": -23.89949607849121, "global_step": 165803, "epoch": 1997} {"train_loss": -23.93659210205078, "global_step": 165804, "epoch": 1997} {"train_loss": -23.444881439208984, "global_step": 165805, "epoch": 1997} {"train_loss": -23.70411491394043, "global_step": 165806, "epoch": 1997} {"train_loss": -23.495718002319336, "global_step": 165807, "epoch": 1997} {"train_loss": -23.345735549926758, "global_step": 165808, "epoch": 1997} {"train_loss": -23.433813095092773, "global_step": 165809, "epoch": 1997} {"train_loss": -23.482250213623047, "global_step": 165810, "epoch": 1997} {"train_loss": -23.56404685974121, "global_step": 165811, "epoch": 1997} {"train_loss": -23.55618667602539, "global_step": 165812, "epoch": 1997} {"train_loss": -23.51881217956543, "global_step": 165813, "epoch": 1997} {"train_loss": -23.70941162109375, "global_step": 165814, "epoch": 1997} {"train_loss": -23.573440551757812, "global_step": 165815, "epoch": 1997} {"train_loss": -23.547550201416016, "global_step": 165816, "epoch": 1997} {"train_loss": -23.52210807800293, "global_step": 165817, "epoch": 1997} {"train_loss": -23.73100471496582, "global_step": 165818, "epoch": 1997} {"train_loss": -23.503372192382812, "global_step": 165819, "epoch": 1997} {"train_loss": -23.798917770385742, "global_step": 165820, "epoch": 1997} {"train_loss": -23.537588119506836, "global_step": 165821, "epoch": 1997} {"train_loss": -23.774188995361328, "global_step": 165822, "epoch": 1997} {"train_loss": -23.980871200561523, "global_step": 165823, "epoch": 1997} {"train_loss": -23.332515716552734, "global_step": 165824, "epoch": 1997} {"train_loss": -23.523361206054688, "global_step": 165825, "epoch": 1997} {"train_loss": -23.483938217163086, "global_step": 165826, "epoch": 1997} {"train_loss": -23.33330726623535, "global_step": 165827, "epoch": 1997} {"train_loss": -23.56033706665039, "global_step": 165828, "epoch": 1997} {"train_loss": -23.38986587524414, "global_step": 165829, "epoch": 1997} {"train_loss": -23.52652359008789, "global_step": 165830, "epoch": 1997} {"train_loss": -23.817533493041992, "global_step": 165831, "epoch": 1997} {"train_loss": -23.4832706451416, "global_step": 165832, "epoch": 1997} {"train_loss": -23.527407565748835, "global_step": 165833, "epoch": 1997, "val_loss": 6429052.0} {"train_loss": -22.003828048706055, "global_step": 165834, "epoch": 1998} {"train_loss": -22.76283073425293, "global_step": 165835, "epoch": 1998} {"train_loss": -21.505582809448242, "global_step": 165836, "epoch": 1998} {"train_loss": -22.335927963256836, "global_step": 165837, "epoch": 1998} {"train_loss": -22.244159698486328, "global_step": 165838, "epoch": 1998} {"train_loss": -22.009368896484375, "global_step": 165839, "epoch": 1998} {"train_loss": -22.94569969177246, "global_step": 165840, "epoch": 1998} {"train_loss": -22.917932510375977, "global_step": 165841, "epoch": 1998} {"train_loss": -22.64164161682129, "global_step": 165842, "epoch": 1998} {"train_loss": -22.775259017944336, "global_step": 165843, "epoch": 1998} {"train_loss": -23.070148468017578, "global_step": 165844, "epoch": 1998} {"train_loss": -22.43901824951172, "global_step": 165845, "epoch": 1998} {"train_loss": -23.084692001342773, "global_step": 165846, "epoch": 1998} {"train_loss": -22.8852596282959, "global_step": 165847, "epoch": 1998} {"train_loss": -23.03810691833496, "global_step": 165848, "epoch": 1998} {"train_loss": -22.936017990112305, "global_step": 165849, "epoch": 1998} {"train_loss": -22.965402603149414, "global_step": 165850, "epoch": 1998} {"train_loss": -23.089405059814453, "global_step": 165851, "epoch": 1998} {"train_loss": -22.467727661132812, "global_step": 165852, "epoch": 1998} {"train_loss": -23.034208297729492, "global_step": 165853, "epoch": 1998} {"train_loss": -23.07394790649414, "global_step": 165854, "epoch": 1998} {"train_loss": -23.14320182800293, "global_step": 165855, "epoch": 1998} {"train_loss": -23.13616371154785, "global_step": 165856, "epoch": 1998} {"train_loss": -23.310684204101562, "global_step": 165857, "epoch": 1998} {"train_loss": -23.34912872314453, "global_step": 165858, "epoch": 1998} {"train_loss": -23.066978454589844, "global_step": 165859, "epoch": 1998} {"train_loss": -23.04966926574707, "global_step": 165860, "epoch": 1998} {"train_loss": -23.23902130126953, "global_step": 165861, "epoch": 1998} {"train_loss": -23.546186447143555, "global_step": 165862, "epoch": 1998} {"train_loss": -23.619625091552734, "global_step": 165863, "epoch": 1998} {"train_loss": -23.321842193603516, "global_step": 165864, "epoch": 1998} {"train_loss": -23.298025131225586, "global_step": 165865, "epoch": 1998} {"train_loss": -23.497222900390625, "global_step": 165866, "epoch": 1998} {"train_loss": -23.315664291381836, "global_step": 165867, "epoch": 1998} {"train_loss": -23.463266372680664, "global_step": 165868, "epoch": 1998} {"train_loss": -23.433130264282227, "global_step": 165869, "epoch": 1998} {"train_loss": -23.475767135620117, "global_step": 165870, "epoch": 1998} {"train_loss": -23.700517654418945, "global_step": 165871, "epoch": 1998} {"train_loss": -23.62055778503418, "global_step": 165872, "epoch": 1998} {"train_loss": -23.788131713867188, "global_step": 165873, "epoch": 1998} {"train_loss": -23.608083724975586, "global_step": 165874, "epoch": 1998} {"train_loss": -23.72748374938965, "global_step": 165875, "epoch": 1998} {"train_loss": -23.646692276000977, "global_step": 165876, "epoch": 1998} {"train_loss": -23.44788932800293, "global_step": 165877, "epoch": 1998} {"train_loss": -23.986997604370117, "global_step": 165878, "epoch": 1998} {"train_loss": -23.285844802856445, "global_step": 165879, "epoch": 1998} {"train_loss": -23.72291374206543, "global_step": 165880, "epoch": 1998} {"train_loss": -24.054967880249023, "global_step": 165881, "epoch": 1998} {"train_loss": -23.47563934326172, "global_step": 165882, "epoch": 1998} {"train_loss": -23.890518188476562, "global_step": 165883, "epoch": 1998} {"train_loss": -24.155466079711914, "global_step": 165884, "epoch": 1998} {"train_loss": -23.3082332611084, "global_step": 165885, "epoch": 1998} {"train_loss": -23.464088439941406, "global_step": 165886, "epoch": 1998} {"train_loss": -23.565113067626953, "global_step": 165887, "epoch": 1998} {"train_loss": -24.18367576599121, "global_step": 165888, "epoch": 1998} {"train_loss": -23.533824920654297, "global_step": 165889, "epoch": 1998} {"train_loss": -23.52437400817871, "global_step": 165890, "epoch": 1998} {"train_loss": -23.73453140258789, "global_step": 165891, "epoch": 1998} {"train_loss": -23.243621826171875, "global_step": 165892, "epoch": 1998} {"train_loss": -23.70423698425293, "global_step": 165893, "epoch": 1998} {"train_loss": -23.60420036315918, "global_step": 165894, "epoch": 1998} {"train_loss": -23.82480812072754, "global_step": 165895, "epoch": 1998} {"train_loss": -23.6137752532959, "global_step": 165896, "epoch": 1998} {"train_loss": -23.602310180664062, "global_step": 165897, "epoch": 1998} {"train_loss": -23.47723388671875, "global_step": 165898, "epoch": 1998} {"train_loss": -23.48896598815918, "global_step": 165899, "epoch": 1998} {"train_loss": -23.859649658203125, "global_step": 165900, "epoch": 1998} {"train_loss": -23.702678680419922, "global_step": 165901, "epoch": 1998} {"train_loss": -23.61853790283203, "global_step": 165902, "epoch": 1998} {"train_loss": -23.568851470947266, "global_step": 165903, "epoch": 1998} {"train_loss": -23.739974975585938, "global_step": 165904, "epoch": 1998} {"train_loss": -23.464435577392578, "global_step": 165905, "epoch": 1998} {"train_loss": -23.26810073852539, "global_step": 165906, "epoch": 1998} {"train_loss": -22.96687889099121, "global_step": 165907, "epoch": 1998} {"train_loss": -23.39716148376465, "global_step": 165908, "epoch": 1998} {"train_loss": -23.487146377563477, "global_step": 165909, "epoch": 1998} {"train_loss": -23.679183959960938, "global_step": 165910, "epoch": 1998} {"train_loss": -23.760290145874023, "global_step": 165911, "epoch": 1998} {"train_loss": -23.603099822998047, "global_step": 165912, "epoch": 1998} {"train_loss": -23.62671661376953, "global_step": 165913, "epoch": 1998} {"train_loss": -23.304330825805664, "global_step": 165914, "epoch": 1998} {"train_loss": -23.830223083496094, "global_step": 165915, "epoch": 1998} {"train_loss": -23.333039019481244, "global_step": 165916, "epoch": 1998, "val_loss": 6326928.0} {"train_loss": -23.317197799682617, "global_step": 165917, "epoch": 1999} {"train_loss": -23.144681930541992, "global_step": 165918, "epoch": 1999} {"train_loss": -23.294309616088867, "global_step": 165919, "epoch": 1999} {"train_loss": -23.157041549682617, "global_step": 165920, "epoch": 1999} {"train_loss": -23.307340621948242, "global_step": 165921, "epoch": 1999} {"train_loss": -23.288650512695312, "global_step": 165922, "epoch": 1999} {"train_loss": -23.216413497924805, "global_step": 165923, "epoch": 1999} {"train_loss": -23.102270126342773, "global_step": 165924, "epoch": 1999} {"train_loss": -23.200387954711914, "global_step": 165925, "epoch": 1999} {"train_loss": -23.05748748779297, "global_step": 165926, "epoch": 1999} {"train_loss": -23.097213745117188, "global_step": 165927, "epoch": 1999} {"train_loss": -23.350889205932617, "global_step": 165928, "epoch": 1999} {"train_loss": -23.270034790039062, "global_step": 165929, "epoch": 1999} {"train_loss": -23.42597007751465, "global_step": 165930, "epoch": 1999} {"train_loss": -23.52716064453125, "global_step": 165931, "epoch": 1999} {"train_loss": -23.769346237182617, "global_step": 165932, "epoch": 1999} {"train_loss": -23.255329132080078, "global_step": 165933, "epoch": 1999} {"train_loss": -23.864505767822266, "global_step": 165934, "epoch": 1999} {"train_loss": -23.397369384765625, "global_step": 165935, "epoch": 1999} {"train_loss": -23.083715438842773, "global_step": 165936, "epoch": 1999} {"train_loss": -23.52094078063965, "global_step": 165937, "epoch": 1999} {"train_loss": -23.44086265563965, "global_step": 165938, "epoch": 1999} {"train_loss": -23.50409507751465, "global_step": 165939, "epoch": 1999} {"train_loss": -23.733787536621094, "global_step": 165940, "epoch": 1999} {"train_loss": -23.711334228515625, "global_step": 165941, "epoch": 1999} {"train_loss": -23.511999130249023, "global_step": 165942, "epoch": 1999} {"train_loss": -23.820682525634766, "global_step": 165943, "epoch": 1999} {"train_loss": -23.49796485900879, "global_step": 165944, "epoch": 1999} {"train_loss": -23.498863220214844, "global_step": 165945, "epoch": 1999} {"train_loss": -23.607501983642578, "global_step": 165946, "epoch": 1999} {"train_loss": -23.654096603393555, "global_step": 165947, "epoch": 1999} {"train_loss": -23.677227020263672, "global_step": 165948, "epoch": 1999} {"train_loss": -23.49700355529785, "global_step": 165949, "epoch": 1999} {"train_loss": -23.27898597717285, "global_step": 165950, "epoch": 1999} {"train_loss": -23.495737075805664, "global_step": 165951, "epoch": 1999} {"train_loss": -23.433395385742188, "global_step": 165952, "epoch": 1999} {"train_loss": -23.5563907623291, "global_step": 165953, "epoch": 1999} {"train_loss": -23.303068161010742, "global_step": 165954, "epoch": 1999} {"train_loss": -24.34412956237793, "global_step": 165955, "epoch": 1999} {"train_loss": -23.407495498657227, "global_step": 165956, "epoch": 1999} {"train_loss": -23.74202537536621, "global_step": 165957, "epoch": 1999} {"train_loss": -23.668161392211914, "global_step": 165958, "epoch": 1999} {"train_loss": -23.41701316833496, "global_step": 165959, "epoch": 1999} {"train_loss": -23.594152450561523, "global_step": 165960, "epoch": 1999} {"train_loss": -23.784048080444336, "global_step": 165961, "epoch": 1999} {"train_loss": -23.436717987060547, "global_step": 165962, "epoch": 1999} {"train_loss": -23.886905670166016, "global_step": 165963, "epoch": 1999} {"train_loss": -23.366260528564453, "global_step": 165964, "epoch": 1999} {"train_loss": -23.642160415649414, "global_step": 165965, "epoch": 1999} {"train_loss": -24.056396484375, "global_step": 165966, "epoch": 1999} {"train_loss": -23.52695083618164, "global_step": 165967, "epoch": 1999} {"train_loss": -23.525922775268555, "global_step": 165968, "epoch": 1999} {"train_loss": -23.777524948120117, "global_step": 165969, "epoch": 1999} {"train_loss": -24.083105087280273, "global_step": 165970, "epoch": 1999} {"train_loss": -23.91816520690918, "global_step": 165971, "epoch": 1999} {"train_loss": -23.591188430786133, "global_step": 165972, "epoch": 1999} {"train_loss": -23.465011596679688, "global_step": 165973, "epoch": 1999} {"train_loss": -23.845609664916992, "global_step": 165974, "epoch": 1999} {"train_loss": -23.881938934326172, "global_step": 165975, "epoch": 1999} {"train_loss": -23.901283264160156, "global_step": 165976, "epoch": 1999} {"train_loss": -23.62056541442871, "global_step": 165977, "epoch": 1999} {"train_loss": -23.5783748626709, "global_step": 165978, "epoch": 1999} {"train_loss": -23.743179321289062, "global_step": 165979, "epoch": 1999} {"train_loss": -23.71446418762207, "global_step": 165980, "epoch": 1999} {"train_loss": -23.698347091674805, "global_step": 165981, "epoch": 1999} {"train_loss": -23.51708984375, "global_step": 165982, "epoch": 1999} {"train_loss": -23.7938175201416, "global_step": 165983, "epoch": 1999} {"train_loss": -23.83485221862793, "global_step": 165984, "epoch": 1999} {"train_loss": -23.888334274291992, "global_step": 165985, "epoch": 1999} {"train_loss": -24.017240524291992, "global_step": 165986, "epoch": 1999} {"train_loss": -23.50411605834961, "global_step": 165987, "epoch": 1999} {"train_loss": -23.474672317504883, "global_step": 165988, "epoch": 1999} {"train_loss": -23.744810104370117, "global_step": 165989, "epoch": 1999} {"train_loss": -23.74593162536621, "global_step": 165990, "epoch": 1999} {"train_loss": -23.440818786621094, "global_step": 165991, "epoch": 1999} {"train_loss": -22.9716854095459, "global_step": 165992, "epoch": 1999} {"train_loss": -23.218191146850586, "global_step": 165993, "epoch": 1999} {"train_loss": -23.576780319213867, "global_step": 165994, "epoch": 1999} {"train_loss": -23.1191349029541, "global_step": 165995, "epoch": 1999} {"train_loss": -23.700117111206055, "global_step": 165996, "epoch": 1999} {"train_loss": -23.29262351989746, "global_step": 165997, "epoch": 1999} {"train_loss": -23.618057250976562, "global_step": 165998, "epoch": 1999} {"train_loss": -23.529725063278015, "global_step": 165999, "epoch": 1999, "val_loss": 6406062.0} {"train_loss": -23.235797882080078, "global_step": 166000, "epoch": 2000} {"train_loss": -22.91193962097168, "global_step": 166001, "epoch": 2000} {"train_loss": -22.66774559020996, "global_step": 166002, "epoch": 2000} {"train_loss": -23.4063663482666, "global_step": 166003, "epoch": 2000} {"train_loss": -22.7095947265625, "global_step": 166004, "epoch": 2000} {"train_loss": -23.03303337097168, "global_step": 166005, "epoch": 2000} {"train_loss": -23.14203453063965, "global_step": 166006, "epoch": 2000} {"train_loss": -22.73270606994629, "global_step": 166007, "epoch": 2000} {"train_loss": -23.206785202026367, "global_step": 166008, "epoch": 2000} {"train_loss": -23.241657257080078, "global_step": 166009, "epoch": 2000} {"train_loss": -23.474746704101562, "global_step": 166010, "epoch": 2000} {"train_loss": -23.088598251342773, "global_step": 166011, "epoch": 2000} {"train_loss": -23.064956665039062, "global_step": 166012, "epoch": 2000} {"train_loss": -23.424118041992188, "global_step": 166013, "epoch": 2000} {"train_loss": -23.359540939331055, "global_step": 166014, "epoch": 2000} {"train_loss": -22.97883415222168, "global_step": 166015, "epoch": 2000} {"train_loss": -23.726896286010742, "global_step": 166016, "epoch": 2000} {"train_loss": -23.330699920654297, "global_step": 166017, "epoch": 2000} {"train_loss": -23.691282272338867, "global_step": 166018, "epoch": 2000} {"train_loss": -23.420194625854492, "global_step": 166019, "epoch": 2000} {"train_loss": -23.413949966430664, "global_step": 166020, "epoch": 2000} {"train_loss": -23.740297317504883, "global_step": 166021, "epoch": 2000} {"train_loss": -23.689146041870117, "global_step": 166022, "epoch": 2000} {"train_loss": -23.584272384643555, "global_step": 166023, "epoch": 2000} {"train_loss": -23.404985427856445, "global_step": 166024, "epoch": 2000} {"train_loss": -23.695878982543945, "global_step": 166025, "epoch": 2000} {"train_loss": -23.657581329345703, "global_step": 166026, "epoch": 2000} {"train_loss": -23.806421279907227, "global_step": 166027, "epoch": 2000} {"train_loss": -23.658985137939453, "global_step": 166028, "epoch": 2000} {"train_loss": -24.042593002319336, "global_step": 166029, "epoch": 2000} {"train_loss": -23.67875099182129, "global_step": 166030, "epoch": 2000} {"train_loss": -23.5504207611084, "global_step": 166031, "epoch": 2000} {"train_loss": -23.78692054748535, "global_step": 166032, "epoch": 2000} {"train_loss": -23.809282302856445, "global_step": 166033, "epoch": 2000} {"train_loss": -23.421598434448242, "global_step": 166034, "epoch": 2000} {"train_loss": -23.810819625854492, "global_step": 166035, "epoch": 2000} {"train_loss": -23.647754669189453, "global_step": 166036, "epoch": 2000} {"train_loss": -23.483869552612305, "global_step": 166037, "epoch": 2000} {"train_loss": -23.75087547302246, "global_step": 166038, "epoch": 2000} {"train_loss": -23.839553833007812, "global_step": 166039, "epoch": 2000} {"train_loss": -23.841455459594727, "global_step": 166040, "epoch": 2000} {"train_loss": -23.710973739624023, "global_step": 166041, "epoch": 2000} {"train_loss": -23.640914916992188, "global_step": 166042, "epoch": 2000} {"train_loss": -23.583486557006836, "global_step": 166043, "epoch": 2000} {"train_loss": -23.987131118774414, "global_step": 166044, "epoch": 2000} {"train_loss": -23.733139038085938, "global_step": 166045, "epoch": 2000} {"train_loss": -23.7706298828125, "global_step": 166046, "epoch": 2000} {"train_loss": -23.550024032592773, "global_step": 166047, "epoch": 2000} {"train_loss": -23.335264205932617, "global_step": 166048, "epoch": 2000} {"train_loss": -23.221485137939453, "global_step": 166049, "epoch": 2000} {"train_loss": -23.349096298217773, "global_step": 166050, "epoch": 2000} {"train_loss": -23.740110397338867, "global_step": 166051, "epoch": 2000} {"train_loss": -23.539182662963867, "global_step": 166052, "epoch": 2000} {"train_loss": -23.236600875854492, "global_step": 166053, "epoch": 2000} {"train_loss": -23.652690887451172, "global_step": 166054, "epoch": 2000} {"train_loss": -23.983572006225586, "global_step": 166055, "epoch": 2000} {"train_loss": -23.57094383239746, "global_step": 166056, "epoch": 2000} {"train_loss": -23.25252342224121, "global_step": 166057, "epoch": 2000} {"train_loss": -23.262168884277344, "global_step": 166058, "epoch": 2000} {"train_loss": -23.278623580932617, "global_step": 166059, "epoch": 2000} {"train_loss": -23.415882110595703, "global_step": 166060, "epoch": 2000} {"train_loss": -23.748014450073242, "global_step": 166061, "epoch": 2000} {"train_loss": -23.718088150024414, "global_step": 166062, "epoch": 2000} {"train_loss": -23.209339141845703, "global_step": 166063, "epoch": 2000} {"train_loss": -23.64664077758789, "global_step": 166064, "epoch": 2000} {"train_loss": -23.785053253173828, "global_step": 166065, "epoch": 2000} {"train_loss": -23.975820541381836, "global_step": 166066, "epoch": 2000} {"train_loss": -23.774906158447266, "global_step": 166067, "epoch": 2000} {"train_loss": -23.681055068969727, "global_step": 166068, "epoch": 2000} {"train_loss": -23.723474502563477, "global_step": 166069, "epoch": 2000} {"train_loss": -23.826631546020508, "global_step": 166070, "epoch": 2000} {"train_loss": -23.620527267456055, "global_step": 166071, "epoch": 2000} {"train_loss": -23.850719451904297, "global_step": 166072, "epoch": 2000} {"train_loss": -23.702444076538086, "global_step": 166073, "epoch": 2000} {"train_loss": -23.972848892211914, "global_step": 166074, "epoch": 2000} {"train_loss": -23.957950592041016, "global_step": 166075, "epoch": 2000} {"train_loss": -23.54680824279785, "global_step": 166076, "epoch": 2000} {"train_loss": -23.946931838989258, "global_step": 166077, "epoch": 2000} {"train_loss": -23.543903350830078, "global_step": 166078, "epoch": 2000} {"train_loss": -23.748321533203125, "global_step": 166079, "epoch": 2000} {"train_loss": -23.365924835205078, "global_step": 166080, "epoch": 2000} {"train_loss": -23.64986228942871, "global_step": 166081, "epoch": 2000} {"train_loss": -23.537641594208868, "global_step": 166082, "epoch": 2000, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6487546.5} {"train_loss": -23.112924575805664, "global_step": 166083, "epoch": 2001} {"train_loss": -22.943593978881836, "global_step": 166084, "epoch": 2001} {"train_loss": -22.94160270690918, "global_step": 166085, "epoch": 2001} {"train_loss": -23.09557342529297, "global_step": 166086, "epoch": 2001} {"train_loss": -23.615476608276367, "global_step": 166087, "epoch": 2001} {"train_loss": -23.353271484375, "global_step": 166088, "epoch": 2001} {"train_loss": -22.848299026489258, "global_step": 166089, "epoch": 2001} {"train_loss": -22.715158462524414, "global_step": 166090, "epoch": 2001} {"train_loss": -22.997129440307617, "global_step": 166091, "epoch": 2001} {"train_loss": -23.058462142944336, "global_step": 166092, "epoch": 2001} {"train_loss": -23.303909301757812, "global_step": 166093, "epoch": 2001} {"train_loss": -23.276905059814453, "global_step": 166094, "epoch": 2001} {"train_loss": -23.382471084594727, "global_step": 166095, "epoch": 2001} {"train_loss": -23.291532516479492, "global_step": 166096, "epoch": 2001} {"train_loss": -23.222030639648438, "global_step": 166097, "epoch": 2001} {"train_loss": -23.53899574279785, "global_step": 166098, "epoch": 2001} {"train_loss": -23.134958267211914, "global_step": 166099, "epoch": 2001} {"train_loss": -23.547306060791016, "global_step": 166100, "epoch": 2001} {"train_loss": -23.287067413330078, "global_step": 166101, "epoch": 2001} {"train_loss": -23.22748374938965, "global_step": 166102, "epoch": 2001} {"train_loss": -23.40740966796875, "global_step": 166103, "epoch": 2001} {"train_loss": -23.475887298583984, "global_step": 166104, "epoch": 2001} {"train_loss": -23.645299911499023, "global_step": 166105, "epoch": 2001} {"train_loss": -23.630260467529297, "global_step": 166106, "epoch": 2001} {"train_loss": -23.429548263549805, "global_step": 166107, "epoch": 2001} {"train_loss": -23.57040023803711, "global_step": 166108, "epoch": 2001} {"train_loss": -23.396841049194336, "global_step": 166109, "epoch": 2001} {"train_loss": -23.70024871826172, "global_step": 166110, "epoch": 2001} {"train_loss": -23.449865341186523, "global_step": 166111, "epoch": 2001} {"train_loss": -23.740798950195312, "global_step": 166112, "epoch": 2001} {"train_loss": -23.6931095123291, "global_step": 166113, "epoch": 2001} {"train_loss": -23.340635299682617, "global_step": 166114, "epoch": 2001} {"train_loss": -23.406435012817383, "global_step": 166115, "epoch": 2001} {"train_loss": -23.604801177978516, "global_step": 166116, "epoch": 2001} {"train_loss": -23.692991256713867, "global_step": 166117, "epoch": 2001} {"train_loss": -23.560522079467773, "global_step": 166118, "epoch": 2001} {"train_loss": -23.596729278564453, "global_step": 166119, "epoch": 2001} {"train_loss": -23.80258560180664, "global_step": 166120, "epoch": 2001} {"train_loss": -23.475229263305664, "global_step": 166121, "epoch": 2001} {"train_loss": -23.363433837890625, "global_step": 166122, "epoch": 2001} {"train_loss": -23.465787887573242, "global_step": 166123, "epoch": 2001} {"train_loss": -23.617849349975586, "global_step": 166124, "epoch": 2001} {"train_loss": -23.624170303344727, "global_step": 166125, "epoch": 2001} {"train_loss": -23.964569091796875, "global_step": 166126, "epoch": 2001} {"train_loss": -23.643905639648438, "global_step": 166127, "epoch": 2001} {"train_loss": -23.696537017822266, "global_step": 166128, "epoch": 2001} {"train_loss": -23.41503143310547, "global_step": 166129, "epoch": 2001} {"train_loss": -23.79835319519043, "global_step": 166130, "epoch": 2001} {"train_loss": -23.64523696899414, "global_step": 166131, "epoch": 2001} {"train_loss": -23.57789421081543, "global_step": 166132, "epoch": 2001} {"train_loss": -23.848798751831055, "global_step": 166133, "epoch": 2001} {"train_loss": -23.935041427612305, "global_step": 166134, "epoch": 2001} {"train_loss": -23.467370986938477, "global_step": 166135, "epoch": 2001} {"train_loss": -23.861785888671875, "global_step": 166136, "epoch": 2001} {"train_loss": -23.77968406677246, "global_step": 166137, "epoch": 2001} {"train_loss": -23.895917892456055, "global_step": 166138, "epoch": 2001} {"train_loss": -23.8358211517334, "global_step": 166139, "epoch": 2001} {"train_loss": -23.738752365112305, "global_step": 166140, "epoch": 2001} {"train_loss": -23.842859268188477, "global_step": 166141, "epoch": 2001} {"train_loss": -23.579086303710938, "global_step": 166142, "epoch": 2001} {"train_loss": -23.880531311035156, "global_step": 166143, "epoch": 2001} {"train_loss": -23.948633193969727, "global_step": 166144, "epoch": 2001} {"train_loss": -23.69955062866211, "global_step": 166145, "epoch": 2001} {"train_loss": -23.352102279663086, "global_step": 166146, "epoch": 2001} {"train_loss": -23.8667049407959, "global_step": 166147, "epoch": 2001} {"train_loss": -24.033811569213867, "global_step": 166148, "epoch": 2001} {"train_loss": -23.74071502685547, "global_step": 166149, "epoch": 2001} {"train_loss": -23.791292190551758, "global_step": 166150, "epoch": 2001} {"train_loss": -23.692358016967773, "global_step": 166151, "epoch": 2001} {"train_loss": -23.2796688079834, "global_step": 166152, "epoch": 2001} {"train_loss": -23.751386642456055, "global_step": 166153, "epoch": 2001} {"train_loss": -23.91956901550293, "global_step": 166154, "epoch": 2001} {"train_loss": -23.8797664642334, "global_step": 166155, "epoch": 2001} {"train_loss": -23.46138572692871, "global_step": 166156, "epoch": 2001} {"train_loss": -23.45183753967285, "global_step": 166157, "epoch": 2001} {"train_loss": -23.721952438354492, "global_step": 166158, "epoch": 2001} {"train_loss": -24.19631004333496, "global_step": 166159, "epoch": 2001} {"train_loss": -23.87638282775879, "global_step": 166160, "epoch": 2001} {"train_loss": -23.947904586791992, "global_step": 166161, "epoch": 2001} {"train_loss": -23.500669479370117, "global_step": 166162, "epoch": 2001} {"train_loss": -23.64839744567871, "global_step": 166163, "epoch": 2001} {"train_loss": -23.523405075073242, "global_step": 166164, "epoch": 2001} {"train_loss": -23.55165143759854, "global_step": 166165, "epoch": 2001, "val_loss": 6442525.0} {"train_loss": -22.96919822692871, "global_step": 166166, "epoch": 2002} {"train_loss": -22.23472785949707, "global_step": 166167, "epoch": 2002} {"train_loss": -22.927427291870117, "global_step": 166168, "epoch": 2002} {"train_loss": -23.334516525268555, "global_step": 166169, "epoch": 2002} {"train_loss": -23.00022315979004, "global_step": 166170, "epoch": 2002} {"train_loss": -23.093591690063477, "global_step": 166171, "epoch": 2002} {"train_loss": -22.793989181518555, "global_step": 166172, "epoch": 2002} {"train_loss": -23.057336807250977, "global_step": 166173, "epoch": 2002} {"train_loss": -23.253210067749023, "global_step": 166174, "epoch": 2002} {"train_loss": -23.34122657775879, "global_step": 166175, "epoch": 2002} {"train_loss": -23.224794387817383, "global_step": 166176, "epoch": 2002} {"train_loss": -23.12944984436035, "global_step": 166177, "epoch": 2002} {"train_loss": -23.37169647216797, "global_step": 166178, "epoch": 2002} {"train_loss": -22.98097038269043, "global_step": 166179, "epoch": 2002} {"train_loss": -23.136993408203125, "global_step": 166180, "epoch": 2002} {"train_loss": -23.064062118530273, "global_step": 166181, "epoch": 2002} {"train_loss": -23.114259719848633, "global_step": 166182, "epoch": 2002} {"train_loss": -23.3924503326416, "global_step": 166183, "epoch": 2002} {"train_loss": -23.144514083862305, "global_step": 166184, "epoch": 2002} {"train_loss": -23.403278350830078, "global_step": 166185, "epoch": 2002} {"train_loss": -23.304134368896484, "global_step": 166186, "epoch": 2002} {"train_loss": -23.494291305541992, "global_step": 166187, "epoch": 2002} {"train_loss": -23.47761344909668, "global_step": 166188, "epoch": 2002} {"train_loss": -23.286123275756836, "global_step": 166189, "epoch": 2002} {"train_loss": -23.637842178344727, "global_step": 166190, "epoch": 2002} {"train_loss": -23.467453002929688, "global_step": 166191, "epoch": 2002} {"train_loss": -23.2229061126709, "global_step": 166192, "epoch": 2002} {"train_loss": -23.297212600708008, "global_step": 166193, "epoch": 2002} {"train_loss": -23.597766876220703, "global_step": 166194, "epoch": 2002} {"train_loss": -23.438953399658203, "global_step": 166195, "epoch": 2002} {"train_loss": -23.747699737548828, "global_step": 166196, "epoch": 2002} {"train_loss": -23.552047729492188, "global_step": 166197, "epoch": 2002} {"train_loss": -23.355127334594727, "global_step": 166198, "epoch": 2002} {"train_loss": -23.339317321777344, "global_step": 166199, "epoch": 2002} {"train_loss": -23.455875396728516, "global_step": 166200, "epoch": 2002} {"train_loss": -23.626087188720703, "global_step": 166201, "epoch": 2002} {"train_loss": -23.46954917907715, "global_step": 166202, "epoch": 2002} {"train_loss": -23.516050338745117, "global_step": 166203, "epoch": 2002} {"train_loss": -23.6403865814209, "global_step": 166204, "epoch": 2002} {"train_loss": -23.772375106811523, "global_step": 166205, "epoch": 2002} {"train_loss": -23.569808959960938, "global_step": 166206, "epoch": 2002} {"train_loss": -23.669240951538086, "global_step": 166207, "epoch": 2002} {"train_loss": -23.57513427734375, "global_step": 166208, "epoch": 2002} {"train_loss": -23.71943473815918, "global_step": 166209, "epoch": 2002} {"train_loss": -23.75949478149414, "global_step": 166210, "epoch": 2002} {"train_loss": -23.630538940429688, "global_step": 166211, "epoch": 2002} {"train_loss": -23.861391067504883, "global_step": 166212, "epoch": 2002} {"train_loss": -23.756406784057617, "global_step": 166213, "epoch": 2002} {"train_loss": -23.477279663085938, "global_step": 166214, "epoch": 2002} {"train_loss": -23.688785552978516, "global_step": 166215, "epoch": 2002} {"train_loss": -23.64082145690918, "global_step": 166216, "epoch": 2002} {"train_loss": -23.597692489624023, "global_step": 166217, "epoch": 2002} {"train_loss": -23.858320236206055, "global_step": 166218, "epoch": 2002} {"train_loss": -23.28436851501465, "global_step": 166219, "epoch": 2002} {"train_loss": -23.12336540222168, "global_step": 166220, "epoch": 2002} {"train_loss": -23.361936569213867, "global_step": 166221, "epoch": 2002} {"train_loss": -23.47321128845215, "global_step": 166222, "epoch": 2002} {"train_loss": -23.671903610229492, "global_step": 166223, "epoch": 2002} {"train_loss": -23.447643280029297, "global_step": 166224, "epoch": 2002} {"train_loss": -24.075666427612305, "global_step": 166225, "epoch": 2002} {"train_loss": -23.856863021850586, "global_step": 166226, "epoch": 2002} {"train_loss": -23.494747161865234, "global_step": 166227, "epoch": 2002} {"train_loss": -23.611858367919922, "global_step": 166228, "epoch": 2002} {"train_loss": -23.41670799255371, "global_step": 166229, "epoch": 2002} {"train_loss": -23.6307373046875, "global_step": 166230, "epoch": 2002} {"train_loss": -23.756816864013672, "global_step": 166231, "epoch": 2002} {"train_loss": -23.3725643157959, "global_step": 166232, "epoch": 2002} {"train_loss": -23.34688377380371, "global_step": 166233, "epoch": 2002} {"train_loss": -23.612133026123047, "global_step": 166234, "epoch": 2002} {"train_loss": -24.092863082885742, "global_step": 166235, "epoch": 2002} {"train_loss": -23.620441436767578, "global_step": 166236, "epoch": 2002} {"train_loss": -23.939146041870117, "global_step": 166237, "epoch": 2002} {"train_loss": -23.75721549987793, "global_step": 166238, "epoch": 2002} {"train_loss": -23.685287475585938, "global_step": 166239, "epoch": 2002} {"train_loss": -23.813806533813477, "global_step": 166240, "epoch": 2002} {"train_loss": -23.38551139831543, "global_step": 166241, "epoch": 2002} {"train_loss": -23.65278434753418, "global_step": 166242, "epoch": 2002} {"train_loss": -23.61638832092285, "global_step": 166243, "epoch": 2002} {"train_loss": -23.74413299560547, "global_step": 166244, "epoch": 2002} {"train_loss": -23.485261917114258, "global_step": 166245, "epoch": 2002} {"train_loss": -23.726825714111328, "global_step": 166246, "epoch": 2002} {"train_loss": -23.74285316467285, "global_step": 166247, "epoch": 2002} {"train_loss": -23.499780126364833, "global_step": 166248, "epoch": 2002, "val_loss": 6374307.0} {"train_loss": -22.59551429748535, "global_step": 166249, "epoch": 2003} {"train_loss": -23.01626205444336, "global_step": 166250, "epoch": 2003} {"train_loss": -22.647668838500977, "global_step": 166251, "epoch": 2003} {"train_loss": -22.534780502319336, "global_step": 166252, "epoch": 2003} {"train_loss": -22.190832138061523, "global_step": 166253, "epoch": 2003} {"train_loss": -23.032785415649414, "global_step": 166254, "epoch": 2003} {"train_loss": -22.657852172851562, "global_step": 166255, "epoch": 2003} {"train_loss": -22.842756271362305, "global_step": 166256, "epoch": 2003} {"train_loss": -23.280759811401367, "global_step": 166257, "epoch": 2003} {"train_loss": -23.04506492614746, "global_step": 166258, "epoch": 2003} {"train_loss": -22.976011276245117, "global_step": 166259, "epoch": 2003} {"train_loss": -22.923280715942383, "global_step": 166260, "epoch": 2003} {"train_loss": -23.092269897460938, "global_step": 166261, "epoch": 2003} {"train_loss": -23.22549057006836, "global_step": 166262, "epoch": 2003} {"train_loss": -22.985048294067383, "global_step": 166263, "epoch": 2003} {"train_loss": -23.470951080322266, "global_step": 166264, "epoch": 2003} {"train_loss": -23.35194969177246, "global_step": 166265, "epoch": 2003} {"train_loss": -22.924034118652344, "global_step": 166266, "epoch": 2003} {"train_loss": -23.213064193725586, "global_step": 166267, "epoch": 2003} {"train_loss": -23.003332138061523, "global_step": 166268, "epoch": 2003} {"train_loss": -22.92103385925293, "global_step": 166269, "epoch": 2003} {"train_loss": -23.254053115844727, "global_step": 166270, "epoch": 2003} {"train_loss": -23.605382919311523, "global_step": 166271, "epoch": 2003} {"train_loss": -23.083011627197266, "global_step": 166272, "epoch": 2003} {"train_loss": -23.36281967163086, "global_step": 166273, "epoch": 2003} {"train_loss": -23.192731857299805, "global_step": 166274, "epoch": 2003} {"train_loss": -23.09300994873047, "global_step": 166275, "epoch": 2003} {"train_loss": -23.374584197998047, "global_step": 166276, "epoch": 2003} {"train_loss": -23.35611343383789, "global_step": 166277, "epoch": 2003} {"train_loss": -23.690330505371094, "global_step": 166278, "epoch": 2003} {"train_loss": -23.280216217041016, "global_step": 166279, "epoch": 2003} {"train_loss": -23.405014038085938, "global_step": 166280, "epoch": 2003} {"train_loss": -23.5999698638916, "global_step": 166281, "epoch": 2003} {"train_loss": -23.948535919189453, "global_step": 166282, "epoch": 2003} {"train_loss": -23.71372413635254, "global_step": 166283, "epoch": 2003} {"train_loss": -23.532901763916016, "global_step": 166284, "epoch": 2003} {"train_loss": -23.635984420776367, "global_step": 166285, "epoch": 2003} {"train_loss": -23.59354019165039, "global_step": 166286, "epoch": 2003} {"train_loss": -23.54438018798828, "global_step": 166287, "epoch": 2003} {"train_loss": -23.533353805541992, "global_step": 166288, "epoch": 2003} {"train_loss": -23.556964874267578, "global_step": 166289, "epoch": 2003} {"train_loss": -23.672895431518555, "global_step": 166290, "epoch": 2003} {"train_loss": -23.752548217773438, "global_step": 166291, "epoch": 2003} {"train_loss": -23.858274459838867, "global_step": 166292, "epoch": 2003} {"train_loss": -23.929662704467773, "global_step": 166293, "epoch": 2003} {"train_loss": -23.802106857299805, "global_step": 166294, "epoch": 2003} {"train_loss": -23.77033805847168, "global_step": 166295, "epoch": 2003} {"train_loss": -23.213459014892578, "global_step": 166296, "epoch": 2003} {"train_loss": -23.623416900634766, "global_step": 166297, "epoch": 2003} {"train_loss": -23.86411476135254, "global_step": 166298, "epoch": 2003} {"train_loss": -23.8381290435791, "global_step": 166299, "epoch": 2003} {"train_loss": -23.837005615234375, "global_step": 166300, "epoch": 2003} {"train_loss": -23.16832160949707, "global_step": 166301, "epoch": 2003} {"train_loss": -23.890031814575195, "global_step": 166302, "epoch": 2003} {"train_loss": -23.643430709838867, "global_step": 166303, "epoch": 2003} {"train_loss": -23.224714279174805, "global_step": 166304, "epoch": 2003} {"train_loss": -23.865880966186523, "global_step": 166305, "epoch": 2003} {"train_loss": -23.469465255737305, "global_step": 166306, "epoch": 2003} {"train_loss": -23.824588775634766, "global_step": 166307, "epoch": 2003} {"train_loss": -23.414602279663086, "global_step": 166308, "epoch": 2003} {"train_loss": -23.558914184570312, "global_step": 166309, "epoch": 2003} {"train_loss": -23.864011764526367, "global_step": 166310, "epoch": 2003} {"train_loss": -23.39203643798828, "global_step": 166311, "epoch": 2003} {"train_loss": -23.6861515045166, "global_step": 166312, "epoch": 2003} {"train_loss": -23.724119186401367, "global_step": 166313, "epoch": 2003} {"train_loss": -23.62064552307129, "global_step": 166314, "epoch": 2003} {"train_loss": -23.336885452270508, "global_step": 166315, "epoch": 2003} {"train_loss": -23.609731674194336, "global_step": 166316, "epoch": 2003} {"train_loss": -23.495941162109375, "global_step": 166317, "epoch": 2003} {"train_loss": -23.57200813293457, "global_step": 166318, "epoch": 2003} {"train_loss": -23.490177154541016, "global_step": 166319, "epoch": 2003} {"train_loss": -23.664823532104492, "global_step": 166320, "epoch": 2003} {"train_loss": -23.94948959350586, "global_step": 166321, "epoch": 2003} {"train_loss": -23.663339614868164, "global_step": 166322, "epoch": 2003} {"train_loss": -23.55495262145996, "global_step": 166323, "epoch": 2003} {"train_loss": -23.438552856445312, "global_step": 166324, "epoch": 2003} {"train_loss": -23.11995506286621, "global_step": 166325, "epoch": 2003} {"train_loss": -23.66935157775879, "global_step": 166326, "epoch": 2003} {"train_loss": -23.579729080200195, "global_step": 166327, "epoch": 2003} {"train_loss": -23.534072875976562, "global_step": 166328, "epoch": 2003} {"train_loss": -23.67237663269043, "global_step": 166329, "epoch": 2003} {"train_loss": -23.839447021484375, "global_step": 166330, "epoch": 2003} {"train_loss": -23.406104811702868, "global_step": 166331, "epoch": 2003, "val_loss": 6337013.5} {"train_loss": -22.168210983276367, "global_step": 166332, "epoch": 2004} {"train_loss": -23.113412857055664, "global_step": 166333, "epoch": 2004} {"train_loss": -22.87186050415039, "global_step": 166334, "epoch": 2004} {"train_loss": -22.60435676574707, "global_step": 166335, "epoch": 2004} {"train_loss": -22.736434936523438, "global_step": 166336, "epoch": 2004} {"train_loss": -23.29014778137207, "global_step": 166337, "epoch": 2004} {"train_loss": -22.73935317993164, "global_step": 166338, "epoch": 2004} {"train_loss": -23.147781372070312, "global_step": 166339, "epoch": 2004} {"train_loss": -23.05828285217285, "global_step": 166340, "epoch": 2004} {"train_loss": -22.988645553588867, "global_step": 166341, "epoch": 2004} {"train_loss": -23.475378036499023, "global_step": 166342, "epoch": 2004} {"train_loss": -23.308490753173828, "global_step": 166343, "epoch": 2004} {"train_loss": -23.465057373046875, "global_step": 166344, "epoch": 2004} {"train_loss": -23.0660343170166, "global_step": 166345, "epoch": 2004} {"train_loss": -23.150880813598633, "global_step": 166346, "epoch": 2004} {"train_loss": -23.51485252380371, "global_step": 166347, "epoch": 2004} {"train_loss": -23.27302360534668, "global_step": 166348, "epoch": 2004} {"train_loss": -23.306119918823242, "global_step": 166349, "epoch": 2004} {"train_loss": -23.21056365966797, "global_step": 166350, "epoch": 2004} {"train_loss": -23.00160026550293, "global_step": 166351, "epoch": 2004} {"train_loss": -23.1389102935791, "global_step": 166352, "epoch": 2004} {"train_loss": -23.38153648376465, "global_step": 166353, "epoch": 2004} {"train_loss": -23.329463958740234, "global_step": 166354, "epoch": 2004} {"train_loss": -23.5998592376709, "global_step": 166355, "epoch": 2004} {"train_loss": -23.52029800415039, "global_step": 166356, "epoch": 2004} {"train_loss": -23.532339096069336, "global_step": 166357, "epoch": 2004} {"train_loss": -23.41813850402832, "global_step": 166358, "epoch": 2004} {"train_loss": -23.781225204467773, "global_step": 166359, "epoch": 2004} {"train_loss": -23.55858039855957, "global_step": 166360, "epoch": 2004} {"train_loss": -23.77273941040039, "global_step": 166361, "epoch": 2004} {"train_loss": -23.667774200439453, "global_step": 166362, "epoch": 2004} {"train_loss": -23.813156127929688, "global_step": 166363, "epoch": 2004} {"train_loss": -23.328678131103516, "global_step": 166364, "epoch": 2004} {"train_loss": -23.776742935180664, "global_step": 166365, "epoch": 2004} {"train_loss": -23.434844970703125, "global_step": 166366, "epoch": 2004} {"train_loss": -23.547977447509766, "global_step": 166367, "epoch": 2004} {"train_loss": -23.83723258972168, "global_step": 166368, "epoch": 2004} {"train_loss": -24.044658660888672, "global_step": 166369, "epoch": 2004} {"train_loss": -23.613420486450195, "global_step": 166370, "epoch": 2004} {"train_loss": -23.829275131225586, "global_step": 166371, "epoch": 2004} {"train_loss": -23.392866134643555, "global_step": 166372, "epoch": 2004} {"train_loss": -23.816978454589844, "global_step": 166373, "epoch": 2004} {"train_loss": -23.497671127319336, "global_step": 166374, "epoch": 2004} {"train_loss": -24.026365280151367, "global_step": 166375, "epoch": 2004} {"train_loss": -23.852008819580078, "global_step": 166376, "epoch": 2004} {"train_loss": -23.599628448486328, "global_step": 166377, "epoch": 2004} {"train_loss": -23.94287109375, "global_step": 166378, "epoch": 2004} {"train_loss": -23.726064682006836, "global_step": 166379, "epoch": 2004} {"train_loss": -23.933889389038086, "global_step": 166380, "epoch": 2004} {"train_loss": -23.4090518951416, "global_step": 166381, "epoch": 2004} {"train_loss": -23.600522994995117, "global_step": 166382, "epoch": 2004} {"train_loss": -23.575876235961914, "global_step": 166383, "epoch": 2004} {"train_loss": -23.68068504333496, "global_step": 166384, "epoch": 2004} {"train_loss": -23.627958297729492, "global_step": 166385, "epoch": 2004} {"train_loss": -23.512784957885742, "global_step": 166386, "epoch": 2004} {"train_loss": -23.345687866210938, "global_step": 166387, "epoch": 2004} {"train_loss": -22.840089797973633, "global_step": 166388, "epoch": 2004} {"train_loss": -23.1989688873291, "global_step": 166389, "epoch": 2004} {"train_loss": -23.256961822509766, "global_step": 166390, "epoch": 2004} {"train_loss": -23.58182144165039, "global_step": 166391, "epoch": 2004} {"train_loss": -23.42166519165039, "global_step": 166392, "epoch": 2004} {"train_loss": -23.432756423950195, "global_step": 166393, "epoch": 2004} {"train_loss": -23.23679542541504, "global_step": 166394, "epoch": 2004} {"train_loss": -23.636930465698242, "global_step": 166395, "epoch": 2004} {"train_loss": -23.77791404724121, "global_step": 166396, "epoch": 2004} {"train_loss": -23.39922332763672, "global_step": 166397, "epoch": 2004} {"train_loss": -23.406917572021484, "global_step": 166398, "epoch": 2004} {"train_loss": -23.183820724487305, "global_step": 166399, "epoch": 2004} {"train_loss": -23.685911178588867, "global_step": 166400, "epoch": 2004} {"train_loss": -23.47150421142578, "global_step": 166401, "epoch": 2004} {"train_loss": -23.70501136779785, "global_step": 166402, "epoch": 2004} {"train_loss": -23.5596981048584, "global_step": 166403, "epoch": 2004} {"train_loss": -24.02141571044922, "global_step": 166404, "epoch": 2004} {"train_loss": -23.521617889404297, "global_step": 166405, "epoch": 2004} {"train_loss": -23.48553466796875, "global_step": 166406, "epoch": 2004} {"train_loss": -23.537433624267578, "global_step": 166407, "epoch": 2004} {"train_loss": -23.760175704956055, "global_step": 166408, "epoch": 2004} {"train_loss": -23.65660858154297, "global_step": 166409, "epoch": 2004} {"train_loss": -23.75213623046875, "global_step": 166410, "epoch": 2004} {"train_loss": -23.610267639160156, "global_step": 166411, "epoch": 2004} {"train_loss": -23.443700790405273, "global_step": 166412, "epoch": 2004} {"train_loss": -23.425222396850586, "global_step": 166413, "epoch": 2004} {"train_loss": -23.460047894213574, "global_step": 166414, "epoch": 2004, "val_loss": 6417523.5} {"train_loss": -23.009748458862305, "global_step": 166415, "epoch": 2005} {"train_loss": -23.102994918823242, "global_step": 166416, "epoch": 2005} {"train_loss": -23.624929428100586, "global_step": 166417, "epoch": 2005} {"train_loss": -23.378175735473633, "global_step": 166418, "epoch": 2005} {"train_loss": -23.45285987854004, "global_step": 166419, "epoch": 2005} {"train_loss": -23.598834991455078, "global_step": 166420, "epoch": 2005} {"train_loss": -23.721837997436523, "global_step": 166421, "epoch": 2005} {"train_loss": -23.430810928344727, "global_step": 166422, "epoch": 2005} {"train_loss": -23.467613220214844, "global_step": 166423, "epoch": 2005} {"train_loss": -23.706396102905273, "global_step": 166424, "epoch": 2005} {"train_loss": -23.716665267944336, "global_step": 166425, "epoch": 2005} {"train_loss": -24.01118278503418, "global_step": 166426, "epoch": 2005} {"train_loss": -23.7033748626709, "global_step": 166427, "epoch": 2005} {"train_loss": -23.876708984375, "global_step": 166428, "epoch": 2005} {"train_loss": -23.756275177001953, "global_step": 166429, "epoch": 2005} {"train_loss": -23.417476654052734, "global_step": 166430, "epoch": 2005} {"train_loss": -23.8362979888916, "global_step": 166431, "epoch": 2005} {"train_loss": -23.751087188720703, "global_step": 166432, "epoch": 2005} {"train_loss": -23.457822799682617, "global_step": 166433, "epoch": 2005} {"train_loss": -23.536575317382812, "global_step": 166434, "epoch": 2005} {"train_loss": -23.555469512939453, "global_step": 166435, "epoch": 2005} {"train_loss": -23.86519432067871, "global_step": 166436, "epoch": 2005} {"train_loss": -23.675573348999023, "global_step": 166437, "epoch": 2005} {"train_loss": -23.84720802307129, "global_step": 166438, "epoch": 2005} {"train_loss": -23.80685806274414, "global_step": 166439, "epoch": 2005} {"train_loss": -23.627593994140625, "global_step": 166440, "epoch": 2005} {"train_loss": -23.93805503845215, "global_step": 166441, "epoch": 2005} {"train_loss": -23.612089157104492, "global_step": 166442, "epoch": 2005} {"train_loss": -23.67404556274414, "global_step": 166443, "epoch": 2005} {"train_loss": -23.73902702331543, "global_step": 166444, "epoch": 2005} {"train_loss": -23.549219131469727, "global_step": 166445, "epoch": 2005} {"train_loss": -23.692283630371094, "global_step": 166446, "epoch": 2005} {"train_loss": -23.618837356567383, "global_step": 166447, "epoch": 2005} {"train_loss": -23.708337783813477, "global_step": 166448, "epoch": 2005} {"train_loss": -23.550437927246094, "global_step": 166449, "epoch": 2005} {"train_loss": -23.08176040649414, "global_step": 166450, "epoch": 2005} {"train_loss": -23.840717315673828, "global_step": 166451, "epoch": 2005} {"train_loss": -23.704212188720703, "global_step": 166452, "epoch": 2005} {"train_loss": -23.803091049194336, "global_step": 166453, "epoch": 2005} {"train_loss": -23.446378707885742, "global_step": 166454, "epoch": 2005} {"train_loss": -23.712011337280273, "global_step": 166455, "epoch": 2005} {"train_loss": -23.388458251953125, "global_step": 166456, "epoch": 2005} {"train_loss": -23.568147659301758, "global_step": 166457, "epoch": 2005} {"train_loss": -23.46888542175293, "global_step": 166458, "epoch": 2005} {"train_loss": -23.978286743164062, "global_step": 166459, "epoch": 2005} {"train_loss": -23.750516891479492, "global_step": 166460, "epoch": 2005} {"train_loss": -23.78993797302246, "global_step": 166461, "epoch": 2005} {"train_loss": -23.3404541015625, "global_step": 166462, "epoch": 2005} {"train_loss": -23.52921485900879, "global_step": 166463, "epoch": 2005} {"train_loss": -23.245548248291016, "global_step": 166464, "epoch": 2005} {"train_loss": -23.706632614135742, "global_step": 166465, "epoch": 2005} {"train_loss": -23.724838256835938, "global_step": 166466, "epoch": 2005} {"train_loss": -23.584367752075195, "global_step": 166467, "epoch": 2005} {"train_loss": -23.93405532836914, "global_step": 166468, "epoch": 2005} {"train_loss": -23.582523345947266, "global_step": 166469, "epoch": 2005} {"train_loss": -23.68638038635254, "global_step": 166470, "epoch": 2005} {"train_loss": -23.86634063720703, "global_step": 166471, "epoch": 2005} {"train_loss": -23.53426170349121, "global_step": 166472, "epoch": 2005} {"train_loss": -23.853103637695312, "global_step": 166473, "epoch": 2005} {"train_loss": -24.004858016967773, "global_step": 166474, "epoch": 2005} {"train_loss": -23.68692398071289, "global_step": 166475, "epoch": 2005} {"train_loss": -23.524898529052734, "global_step": 166476, "epoch": 2005} {"train_loss": -23.60467529296875, "global_step": 166477, "epoch": 2005} {"train_loss": -23.58587074279785, "global_step": 166478, "epoch": 2005} {"train_loss": -23.641666412353516, "global_step": 166479, "epoch": 2005} {"train_loss": -24.00973892211914, "global_step": 166480, "epoch": 2005} {"train_loss": -23.695545196533203, "global_step": 166481, "epoch": 2005} {"train_loss": -23.66412925720215, "global_step": 166482, "epoch": 2005} {"train_loss": -23.61349868774414, "global_step": 166483, "epoch": 2005} {"train_loss": -23.82134437561035, "global_step": 166484, "epoch": 2005} {"train_loss": -23.850446701049805, "global_step": 166485, "epoch": 2005} {"train_loss": -23.692380905151367, "global_step": 166486, "epoch": 2005} {"train_loss": -24.004230499267578, "global_step": 166487, "epoch": 2005} {"train_loss": -23.50519371032715, "global_step": 166488, "epoch": 2005} {"train_loss": -23.698415756225586, "global_step": 166489, "epoch": 2005} {"train_loss": -23.566680908203125, "global_step": 166490, "epoch": 2005} {"train_loss": -23.628332138061523, "global_step": 166491, "epoch": 2005} {"train_loss": -23.746082305908203, "global_step": 166492, "epoch": 2005} {"train_loss": -23.471694946289062, "global_step": 166493, "epoch": 2005} {"train_loss": -23.986064910888672, "global_step": 166494, "epoch": 2005} {"train_loss": -23.72859001159668, "global_step": 166495, "epoch": 2005} {"train_loss": -23.720062255859375, "global_step": 166496, "epoch": 2005} {"train_loss": -23.66112736621535, "global_step": 166497, "epoch": 2005, "val_loss": 6391504.0} {"train_loss": -23.35179901123047, "global_step": 166498, "epoch": 2006} {"train_loss": -23.533374786376953, "global_step": 166499, "epoch": 2006} {"train_loss": -23.629993438720703, "global_step": 166500, "epoch": 2006} {"train_loss": -23.127357482910156, "global_step": 166501, "epoch": 2006} {"train_loss": -23.640186309814453, "global_step": 166502, "epoch": 2006} {"train_loss": -23.69342613220215, "global_step": 166503, "epoch": 2006} {"train_loss": -23.50263023376465, "global_step": 166504, "epoch": 2006} {"train_loss": -23.659894943237305, "global_step": 166505, "epoch": 2006} {"train_loss": -23.37544822692871, "global_step": 166506, "epoch": 2006} {"train_loss": -23.870464324951172, "global_step": 166507, "epoch": 2006} {"train_loss": -23.460439682006836, "global_step": 166508, "epoch": 2006} {"train_loss": -23.929410934448242, "global_step": 166509, "epoch": 2006} {"train_loss": -23.423276901245117, "global_step": 166510, "epoch": 2006} {"train_loss": -23.829349517822266, "global_step": 166511, "epoch": 2006} {"train_loss": -23.424928665161133, "global_step": 166512, "epoch": 2006} {"train_loss": -23.544525146484375, "global_step": 166513, "epoch": 2006} {"train_loss": -23.63935661315918, "global_step": 166514, "epoch": 2006} {"train_loss": -23.867582321166992, "global_step": 166515, "epoch": 2006} {"train_loss": -23.757461547851562, "global_step": 166516, "epoch": 2006} {"train_loss": -23.67011833190918, "global_step": 166517, "epoch": 2006} {"train_loss": -23.857351303100586, "global_step": 166518, "epoch": 2006} {"train_loss": -23.821670532226562, "global_step": 166519, "epoch": 2006} {"train_loss": -24.192304611206055, "global_step": 166520, "epoch": 2006} {"train_loss": -23.88728904724121, "global_step": 166521, "epoch": 2006} {"train_loss": -23.450021743774414, "global_step": 166522, "epoch": 2006} {"train_loss": -23.542659759521484, "global_step": 166523, "epoch": 2006} {"train_loss": -23.580062866210938, "global_step": 166524, "epoch": 2006} {"train_loss": -23.741514205932617, "global_step": 166525, "epoch": 2006} {"train_loss": -23.465137481689453, "global_step": 166526, "epoch": 2006} {"train_loss": -23.382272720336914, "global_step": 166527, "epoch": 2006} {"train_loss": -23.437597274780273, "global_step": 166528, "epoch": 2006} {"train_loss": -23.93017578125, "global_step": 166529, "epoch": 2006} {"train_loss": -23.5579833984375, "global_step": 166530, "epoch": 2006} {"train_loss": -23.98587417602539, "global_step": 166531, "epoch": 2006} {"train_loss": -23.67343521118164, "global_step": 166532, "epoch": 2006} {"train_loss": -23.868528366088867, "global_step": 166533, "epoch": 2006} {"train_loss": -23.73667335510254, "global_step": 166534, "epoch": 2006} {"train_loss": -23.745779037475586, "global_step": 166535, "epoch": 2006} {"train_loss": -23.759204864501953, "global_step": 166536, "epoch": 2006} {"train_loss": -23.7431583404541, "global_step": 166537, "epoch": 2006} {"train_loss": -23.842565536499023, "global_step": 166538, "epoch": 2006} {"train_loss": -23.465314865112305, "global_step": 166539, "epoch": 2006} {"train_loss": -23.766815185546875, "global_step": 166540, "epoch": 2006} {"train_loss": -23.592023849487305, "global_step": 166541, "epoch": 2006} {"train_loss": -23.655912399291992, "global_step": 166542, "epoch": 2006} {"train_loss": -23.528274536132812, "global_step": 166543, "epoch": 2006} {"train_loss": -23.608755111694336, "global_step": 166544, "epoch": 2006} {"train_loss": -23.485248565673828, "global_step": 166545, "epoch": 2006} {"train_loss": -23.462726593017578, "global_step": 166546, "epoch": 2006} {"train_loss": -24.11749839782715, "global_step": 166547, "epoch": 2006} {"train_loss": -23.594024658203125, "global_step": 166548, "epoch": 2006} {"train_loss": -23.24531364440918, "global_step": 166549, "epoch": 2006} {"train_loss": -23.314899444580078, "global_step": 166550, "epoch": 2006} {"train_loss": -23.392602920532227, "global_step": 166551, "epoch": 2006} {"train_loss": -23.614797592163086, "global_step": 166552, "epoch": 2006} {"train_loss": -23.104429244995117, "global_step": 166553, "epoch": 2006} {"train_loss": -23.274024963378906, "global_step": 166554, "epoch": 2006} {"train_loss": -23.441082000732422, "global_step": 166555, "epoch": 2006} {"train_loss": -23.536039352416992, "global_step": 166556, "epoch": 2006} {"train_loss": -23.861522674560547, "global_step": 166557, "epoch": 2006} {"train_loss": -23.337308883666992, "global_step": 166558, "epoch": 2006} {"train_loss": -23.538894653320312, "global_step": 166559, "epoch": 2006} {"train_loss": -23.602209091186523, "global_step": 166560, "epoch": 2006} {"train_loss": -23.843740463256836, "global_step": 166561, "epoch": 2006} {"train_loss": -23.33597183227539, "global_step": 166562, "epoch": 2006} {"train_loss": -23.892305374145508, "global_step": 166563, "epoch": 2006} {"train_loss": -23.515625, "global_step": 166564, "epoch": 2006} {"train_loss": -23.337127685546875, "global_step": 166565, "epoch": 2006} {"train_loss": -23.676401138305664, "global_step": 166566, "epoch": 2006} {"train_loss": -23.80730628967285, "global_step": 166567, "epoch": 2006} {"train_loss": -23.468374252319336, "global_step": 166568, "epoch": 2006} {"train_loss": -23.491371154785156, "global_step": 166569, "epoch": 2006} {"train_loss": -23.38985824584961, "global_step": 166570, "epoch": 2006} {"train_loss": -23.48613739013672, "global_step": 166571, "epoch": 2006} {"train_loss": -23.53293800354004, "global_step": 166572, "epoch": 2006} {"train_loss": -23.83904457092285, "global_step": 166573, "epoch": 2006} {"train_loss": -23.568805694580078, "global_step": 166574, "epoch": 2006} {"train_loss": -23.624725341796875, "global_step": 166575, "epoch": 2006} {"train_loss": -23.58016014099121, "global_step": 166576, "epoch": 2006} {"train_loss": -23.839384078979492, "global_step": 166577, "epoch": 2006} {"train_loss": -23.87782096862793, "global_step": 166578, "epoch": 2006} {"train_loss": -23.786352157592773, "global_step": 166579, "epoch": 2006} {"train_loss": -23.611326608313135, "global_step": 166580, "epoch": 2006, "val_loss": 6407291.0} {"train_loss": -23.157590866088867, "global_step": 166581, "epoch": 2007} {"train_loss": -23.063243865966797, "global_step": 166582, "epoch": 2007} {"train_loss": -22.877748489379883, "global_step": 166583, "epoch": 2007} {"train_loss": -22.57109832763672, "global_step": 166584, "epoch": 2007} {"train_loss": -22.69615936279297, "global_step": 166585, "epoch": 2007} {"train_loss": -22.97455406188965, "global_step": 166586, "epoch": 2007} {"train_loss": -22.86846351623535, "global_step": 166587, "epoch": 2007} {"train_loss": -23.538896560668945, "global_step": 166588, "epoch": 2007} {"train_loss": -23.08925437927246, "global_step": 166589, "epoch": 2007} {"train_loss": -23.157438278198242, "global_step": 166590, "epoch": 2007} {"train_loss": -22.997556686401367, "global_step": 166591, "epoch": 2007} {"train_loss": -23.282363891601562, "global_step": 166592, "epoch": 2007} {"train_loss": -23.284381866455078, "global_step": 166593, "epoch": 2007} {"train_loss": -23.076190948486328, "global_step": 166594, "epoch": 2007} {"train_loss": -23.150421142578125, "global_step": 166595, "epoch": 2007} {"train_loss": -23.067914962768555, "global_step": 166596, "epoch": 2007} {"train_loss": -23.01355743408203, "global_step": 166597, "epoch": 2007} {"train_loss": -23.43854522705078, "global_step": 166598, "epoch": 2007} {"train_loss": -23.202880859375, "global_step": 166599, "epoch": 2007} {"train_loss": -23.5060977935791, "global_step": 166600, "epoch": 2007} {"train_loss": -23.21523094177246, "global_step": 166601, "epoch": 2007} {"train_loss": -23.095884323120117, "global_step": 166602, "epoch": 2007} {"train_loss": -23.457653045654297, "global_step": 166603, "epoch": 2007} {"train_loss": -23.58057975769043, "global_step": 166604, "epoch": 2007} {"train_loss": -23.57916259765625, "global_step": 166605, "epoch": 2007} {"train_loss": -23.51948356628418, "global_step": 166606, "epoch": 2007} {"train_loss": -23.387311935424805, "global_step": 166607, "epoch": 2007} {"train_loss": -23.53594970703125, "global_step": 166608, "epoch": 2007} {"train_loss": -23.732946395874023, "global_step": 166609, "epoch": 2007} {"train_loss": -23.267227172851562, "global_step": 166610, "epoch": 2007} {"train_loss": -23.577024459838867, "global_step": 166611, "epoch": 2007} {"train_loss": -24.018224716186523, "global_step": 166612, "epoch": 2007} {"train_loss": -23.954059600830078, "global_step": 166613, "epoch": 2007} {"train_loss": -23.9792423248291, "global_step": 166614, "epoch": 2007} {"train_loss": -23.780912399291992, "global_step": 166615, "epoch": 2007} {"train_loss": -23.621540069580078, "global_step": 166616, "epoch": 2007} {"train_loss": -23.849699020385742, "global_step": 166617, "epoch": 2007} {"train_loss": -23.69799041748047, "global_step": 166618, "epoch": 2007} {"train_loss": -23.55671501159668, "global_step": 166619, "epoch": 2007} {"train_loss": -23.865896224975586, "global_step": 166620, "epoch": 2007} {"train_loss": -23.809741973876953, "global_step": 166621, "epoch": 2007} {"train_loss": -23.759689331054688, "global_step": 166622, "epoch": 2007} {"train_loss": -23.51462173461914, "global_step": 166623, "epoch": 2007} {"train_loss": -23.510705947875977, "global_step": 166624, "epoch": 2007} {"train_loss": -23.79096031188965, "global_step": 166625, "epoch": 2007} {"train_loss": -23.84722900390625, "global_step": 166626, "epoch": 2007} {"train_loss": -23.815855026245117, "global_step": 166627, "epoch": 2007} {"train_loss": -23.91255760192871, "global_step": 166628, "epoch": 2007} {"train_loss": -23.88768768310547, "global_step": 166629, "epoch": 2007} {"train_loss": -23.68451499938965, "global_step": 166630, "epoch": 2007} {"train_loss": -23.672658920288086, "global_step": 166631, "epoch": 2007} {"train_loss": -23.58739471435547, "global_step": 166632, "epoch": 2007} {"train_loss": -23.86382484436035, "global_step": 166633, "epoch": 2007} {"train_loss": -23.535388946533203, "global_step": 166634, "epoch": 2007} {"train_loss": -23.745498657226562, "global_step": 166635, "epoch": 2007} {"train_loss": -23.71912956237793, "global_step": 166636, "epoch": 2007} {"train_loss": -23.5106201171875, "global_step": 166637, "epoch": 2007} {"train_loss": -23.90053367614746, "global_step": 166638, "epoch": 2007} {"train_loss": -23.724931716918945, "global_step": 166639, "epoch": 2007} {"train_loss": -23.895795822143555, "global_step": 166640, "epoch": 2007} {"train_loss": -23.887556076049805, "global_step": 166641, "epoch": 2007} {"train_loss": -23.487600326538086, "global_step": 166642, "epoch": 2007} {"train_loss": -23.587217330932617, "global_step": 166643, "epoch": 2007} {"train_loss": -23.543354034423828, "global_step": 166644, "epoch": 2007} {"train_loss": -23.668052673339844, "global_step": 166645, "epoch": 2007} {"train_loss": -23.531452178955078, "global_step": 166646, "epoch": 2007} {"train_loss": -23.56063461303711, "global_step": 166647, "epoch": 2007} {"train_loss": -23.75855827331543, "global_step": 166648, "epoch": 2007} {"train_loss": -23.89349937438965, "global_step": 166649, "epoch": 2007} {"train_loss": -23.72284507751465, "global_step": 166650, "epoch": 2007} {"train_loss": -23.707189559936523, "global_step": 166651, "epoch": 2007} {"train_loss": -23.939767837524414, "global_step": 166652, "epoch": 2007} {"train_loss": -23.325708389282227, "global_step": 166653, "epoch": 2007} {"train_loss": -23.40605926513672, "global_step": 166654, "epoch": 2007} {"train_loss": -23.676498413085938, "global_step": 166655, "epoch": 2007} {"train_loss": -23.511350631713867, "global_step": 166656, "epoch": 2007} {"train_loss": -23.571626663208008, "global_step": 166657, "epoch": 2007} {"train_loss": -23.410856246948242, "global_step": 166658, "epoch": 2007} {"train_loss": -23.870264053344727, "global_step": 166659, "epoch": 2007} {"train_loss": -23.44813346862793, "global_step": 166660, "epoch": 2007} {"train_loss": -23.759185791015625, "global_step": 166661, "epoch": 2007} {"train_loss": -23.40542984008789, "global_step": 166662, "epoch": 2007} {"train_loss": -23.524249249194042, "global_step": 166663, "epoch": 2007, "val_loss": 6586036.0} {"train_loss": -23.06302833557129, "global_step": 166664, "epoch": 2008} {"train_loss": -23.219982147216797, "global_step": 166665, "epoch": 2008} {"train_loss": -23.288862228393555, "global_step": 166666, "epoch": 2008} {"train_loss": -22.90147590637207, "global_step": 166667, "epoch": 2008} {"train_loss": -23.335145950317383, "global_step": 166668, "epoch": 2008} {"train_loss": -23.105480194091797, "global_step": 166669, "epoch": 2008} {"train_loss": -22.93517303466797, "global_step": 166670, "epoch": 2008} {"train_loss": -23.394210815429688, "global_step": 166671, "epoch": 2008} {"train_loss": -22.9458065032959, "global_step": 166672, "epoch": 2008} {"train_loss": -23.26673126220703, "global_step": 166673, "epoch": 2008} {"train_loss": -22.818851470947266, "global_step": 166674, "epoch": 2008} {"train_loss": -23.201183319091797, "global_step": 166675, "epoch": 2008} {"train_loss": -23.19586181640625, "global_step": 166676, "epoch": 2008} {"train_loss": -23.250638961791992, "global_step": 166677, "epoch": 2008} {"train_loss": -23.48475456237793, "global_step": 166678, "epoch": 2008} {"train_loss": -23.381576538085938, "global_step": 166679, "epoch": 2008} {"train_loss": -23.57227897644043, "global_step": 166680, "epoch": 2008} {"train_loss": -23.548913955688477, "global_step": 166681, "epoch": 2008} {"train_loss": -23.69178009033203, "global_step": 166682, "epoch": 2008} {"train_loss": -23.70745277404785, "global_step": 166683, "epoch": 2008} {"train_loss": -23.553176879882812, "global_step": 166684, "epoch": 2008} {"train_loss": -23.307910919189453, "global_step": 166685, "epoch": 2008} {"train_loss": -23.77532958984375, "global_step": 166686, "epoch": 2008} {"train_loss": -23.337039947509766, "global_step": 166687, "epoch": 2008} {"train_loss": -23.663660049438477, "global_step": 166688, "epoch": 2008} {"train_loss": -23.594280242919922, "global_step": 166689, "epoch": 2008} {"train_loss": -23.615283966064453, "global_step": 166690, "epoch": 2008} {"train_loss": -23.327375411987305, "global_step": 166691, "epoch": 2008} {"train_loss": -23.520700454711914, "global_step": 166692, "epoch": 2008} {"train_loss": -23.517154693603516, "global_step": 166693, "epoch": 2008} {"train_loss": -23.593128204345703, "global_step": 166694, "epoch": 2008} {"train_loss": -24.021595001220703, "global_step": 166695, "epoch": 2008} {"train_loss": -23.61690330505371, "global_step": 166696, "epoch": 2008} {"train_loss": -23.698205947875977, "global_step": 166697, "epoch": 2008} {"train_loss": -23.887331008911133, "global_step": 166698, "epoch": 2008} {"train_loss": -23.781911849975586, "global_step": 166699, "epoch": 2008} {"train_loss": -23.792158126831055, "global_step": 166700, "epoch": 2008} {"train_loss": -23.640033721923828, "global_step": 166701, "epoch": 2008} {"train_loss": -23.566152572631836, "global_step": 166702, "epoch": 2008} {"train_loss": -23.80253028869629, "global_step": 166703, "epoch": 2008} {"train_loss": -23.821002960205078, "global_step": 166704, "epoch": 2008} {"train_loss": -23.824769973754883, "global_step": 166705, "epoch": 2008} {"train_loss": -23.4366512298584, "global_step": 166706, "epoch": 2008} {"train_loss": -23.704057693481445, "global_step": 166707, "epoch": 2008} {"train_loss": -24.116247177124023, "global_step": 166708, "epoch": 2008} {"train_loss": -23.479225158691406, "global_step": 166709, "epoch": 2008} {"train_loss": -23.68349266052246, "global_step": 166710, "epoch": 2008} {"train_loss": -23.965452194213867, "global_step": 166711, "epoch": 2008} {"train_loss": -24.01380157470703, "global_step": 166712, "epoch": 2008} {"train_loss": -23.694477081298828, "global_step": 166713, "epoch": 2008} {"train_loss": -23.686614990234375, "global_step": 166714, "epoch": 2008} {"train_loss": -23.083524703979492, "global_step": 166715, "epoch": 2008} {"train_loss": -22.637807846069336, "global_step": 166716, "epoch": 2008} {"train_loss": -23.348798751831055, "global_step": 166717, "epoch": 2008} {"train_loss": -23.168251037597656, "global_step": 166718, "epoch": 2008} {"train_loss": -23.165626525878906, "global_step": 166719, "epoch": 2008} {"train_loss": -23.31974220275879, "global_step": 166720, "epoch": 2008} {"train_loss": -23.5653133392334, "global_step": 166721, "epoch": 2008} {"train_loss": -23.22391700744629, "global_step": 166722, "epoch": 2008} {"train_loss": -23.295087814331055, "global_step": 166723, "epoch": 2008} {"train_loss": -23.497499465942383, "global_step": 166724, "epoch": 2008} {"train_loss": -23.066181182861328, "global_step": 166725, "epoch": 2008} {"train_loss": -23.298315048217773, "global_step": 166726, "epoch": 2008} {"train_loss": -23.587726593017578, "global_step": 166727, "epoch": 2008} {"train_loss": -23.406721115112305, "global_step": 166728, "epoch": 2008} {"train_loss": -23.657896041870117, "global_step": 166729, "epoch": 2008} {"train_loss": -23.184934616088867, "global_step": 166730, "epoch": 2008} {"train_loss": -23.281726837158203, "global_step": 166731, "epoch": 2008} {"train_loss": -23.57082748413086, "global_step": 166732, "epoch": 2008} {"train_loss": -23.19928550720215, "global_step": 166733, "epoch": 2008} {"train_loss": -23.24022102355957, "global_step": 166734, "epoch": 2008} {"train_loss": -23.51161003112793, "global_step": 166735, "epoch": 2008} {"train_loss": -23.306623458862305, "global_step": 166736, "epoch": 2008} {"train_loss": -24.04535484313965, "global_step": 166737, "epoch": 2008} {"train_loss": -23.62192153930664, "global_step": 166738, "epoch": 2008} {"train_loss": -23.76495933532715, "global_step": 166739, "epoch": 2008} {"train_loss": -23.389169692993164, "global_step": 166740, "epoch": 2008} {"train_loss": -23.261810302734375, "global_step": 166741, "epoch": 2008} {"train_loss": -23.773330688476562, "global_step": 166742, "epoch": 2008} {"train_loss": -23.598318099975586, "global_step": 166743, "epoch": 2008} {"train_loss": -23.62880516052246, "global_step": 166744, "epoch": 2008} {"train_loss": -23.279695510864258, "global_step": 166745, "epoch": 2008} {"train_loss": -23.471423068678522, "global_step": 166746, "epoch": 2008, "val_loss": 6438091.0} {"train_loss": -23.40974235534668, "global_step": 166747, "epoch": 2009} {"train_loss": -23.10294532775879, "global_step": 166748, "epoch": 2009} {"train_loss": -23.53615951538086, "global_step": 166749, "epoch": 2009} {"train_loss": -23.24416160583496, "global_step": 166750, "epoch": 2009} {"train_loss": -23.485605239868164, "global_step": 166751, "epoch": 2009} {"train_loss": -23.391704559326172, "global_step": 166752, "epoch": 2009} {"train_loss": -23.705646514892578, "global_step": 166753, "epoch": 2009} {"train_loss": -23.869009017944336, "global_step": 166754, "epoch": 2009} {"train_loss": -23.614980697631836, "global_step": 166755, "epoch": 2009} {"train_loss": -23.551780700683594, "global_step": 166756, "epoch": 2009} {"train_loss": -23.574247360229492, "global_step": 166757, "epoch": 2009} {"train_loss": -23.517539978027344, "global_step": 166758, "epoch": 2009} {"train_loss": -23.57509422302246, "global_step": 166759, "epoch": 2009} {"train_loss": -23.823928833007812, "global_step": 166760, "epoch": 2009} {"train_loss": -23.560823440551758, "global_step": 166761, "epoch": 2009} {"train_loss": -23.353824615478516, "global_step": 166762, "epoch": 2009} {"train_loss": -23.227331161499023, "global_step": 166763, "epoch": 2009} {"train_loss": -23.61315155029297, "global_step": 166764, "epoch": 2009} {"train_loss": -23.577350616455078, "global_step": 166765, "epoch": 2009} {"train_loss": -23.2921085357666, "global_step": 166766, "epoch": 2009} {"train_loss": -23.610841751098633, "global_step": 166767, "epoch": 2009} {"train_loss": -23.499248504638672, "global_step": 166768, "epoch": 2009} {"train_loss": -23.406789779663086, "global_step": 166769, "epoch": 2009} {"train_loss": -23.615192413330078, "global_step": 166770, "epoch": 2009} {"train_loss": -23.426624298095703, "global_step": 166771, "epoch": 2009} {"train_loss": -23.560110092163086, "global_step": 166772, "epoch": 2009} {"train_loss": -23.720300674438477, "global_step": 166773, "epoch": 2009} {"train_loss": -23.4100399017334, "global_step": 166774, "epoch": 2009} {"train_loss": -23.808744430541992, "global_step": 166775, "epoch": 2009} {"train_loss": -23.656057357788086, "global_step": 166776, "epoch": 2009} {"train_loss": -23.709976196289062, "global_step": 166777, "epoch": 2009} {"train_loss": -23.594894409179688, "global_step": 166778, "epoch": 2009} {"train_loss": -23.4526309967041, "global_step": 166779, "epoch": 2009} {"train_loss": -23.937549591064453, "global_step": 166780, "epoch": 2009} {"train_loss": -23.52249526977539, "global_step": 166781, "epoch": 2009} {"train_loss": -23.469181060791016, "global_step": 166782, "epoch": 2009} {"train_loss": -22.970340728759766, "global_step": 166783, "epoch": 2009} {"train_loss": -23.670536041259766, "global_step": 166784, "epoch": 2009} {"train_loss": -23.290443420410156, "global_step": 166785, "epoch": 2009} {"train_loss": -23.205322265625, "global_step": 166786, "epoch": 2009} {"train_loss": -23.34329605102539, "global_step": 166787, "epoch": 2009} {"train_loss": -23.51351547241211, "global_step": 166788, "epoch": 2009} {"train_loss": -23.223012924194336, "global_step": 166789, "epoch": 2009} {"train_loss": -23.60198974609375, "global_step": 166790, "epoch": 2009} {"train_loss": -23.358922958374023, "global_step": 166791, "epoch": 2009} {"train_loss": -23.83969497680664, "global_step": 166792, "epoch": 2009} {"train_loss": -23.151296615600586, "global_step": 166793, "epoch": 2009} {"train_loss": -23.455705642700195, "global_step": 166794, "epoch": 2009} {"train_loss": -23.302661895751953, "global_step": 166795, "epoch": 2009} {"train_loss": -23.681203842163086, "global_step": 166796, "epoch": 2009} {"train_loss": -23.201885223388672, "global_step": 166797, "epoch": 2009} {"train_loss": -23.809110641479492, "global_step": 166798, "epoch": 2009} {"train_loss": -23.423748016357422, "global_step": 166799, "epoch": 2009} {"train_loss": -23.713491439819336, "global_step": 166800, "epoch": 2009} {"train_loss": -23.247512817382812, "global_step": 166801, "epoch": 2009} {"train_loss": -23.486589431762695, "global_step": 166802, "epoch": 2009} {"train_loss": -23.6965389251709, "global_step": 166803, "epoch": 2009} {"train_loss": -23.725229263305664, "global_step": 166804, "epoch": 2009} {"train_loss": -23.702722549438477, "global_step": 166805, "epoch": 2009} {"train_loss": -23.732608795166016, "global_step": 166806, "epoch": 2009} {"train_loss": -24.27532386779785, "global_step": 166807, "epoch": 2009} {"train_loss": -23.626638412475586, "global_step": 166808, "epoch": 2009} {"train_loss": -23.4039306640625, "global_step": 166809, "epoch": 2009} {"train_loss": -23.69557762145996, "global_step": 166810, "epoch": 2009} {"train_loss": -23.535566329956055, "global_step": 166811, "epoch": 2009} {"train_loss": -23.91767692565918, "global_step": 166812, "epoch": 2009} {"train_loss": -23.43191909790039, "global_step": 166813, "epoch": 2009} {"train_loss": -23.8059139251709, "global_step": 166814, "epoch": 2009} {"train_loss": -23.243074417114258, "global_step": 166815, "epoch": 2009} {"train_loss": -23.922143936157227, "global_step": 166816, "epoch": 2009} {"train_loss": -23.39955711364746, "global_step": 166817, "epoch": 2009} {"train_loss": -23.38356590270996, "global_step": 166818, "epoch": 2009} {"train_loss": -23.82984733581543, "global_step": 166819, "epoch": 2009} {"train_loss": -23.700204849243164, "global_step": 166820, "epoch": 2009} {"train_loss": -23.85746192932129, "global_step": 166821, "epoch": 2009} {"train_loss": -23.78183364868164, "global_step": 166822, "epoch": 2009} {"train_loss": -23.886402130126953, "global_step": 166823, "epoch": 2009} {"train_loss": -23.62372589111328, "global_step": 166824, "epoch": 2009} {"train_loss": -24.06400489807129, "global_step": 166825, "epoch": 2009} {"train_loss": -23.44749641418457, "global_step": 166826, "epoch": 2009} {"train_loss": -23.752779006958008, "global_step": 166827, "epoch": 2009} {"train_loss": -23.910207748413086, "global_step": 166828, "epoch": 2009} {"train_loss": -23.561722835862493, "global_step": 166829, "epoch": 2009, "val_loss": 6507235.0} {"train_loss": -23.06452751159668, "global_step": 166830, "epoch": 2010} {"train_loss": -23.12636947631836, "global_step": 166831, "epoch": 2010} {"train_loss": -23.486770629882812, "global_step": 166832, "epoch": 2010} {"train_loss": -23.367834091186523, "global_step": 166833, "epoch": 2010} {"train_loss": -23.548254013061523, "global_step": 166834, "epoch": 2010} {"train_loss": -23.618709564208984, "global_step": 166835, "epoch": 2010} {"train_loss": -23.212928771972656, "global_step": 166836, "epoch": 2010} {"train_loss": -23.844717025756836, "global_step": 166837, "epoch": 2010} {"train_loss": -23.194040298461914, "global_step": 166838, "epoch": 2010} {"train_loss": -23.575380325317383, "global_step": 166839, "epoch": 2010} {"train_loss": -23.40370750427246, "global_step": 166840, "epoch": 2010} {"train_loss": -22.98101806640625, "global_step": 166841, "epoch": 2010} {"train_loss": -23.33887481689453, "global_step": 166842, "epoch": 2010} {"train_loss": -23.4422664642334, "global_step": 166843, "epoch": 2010} {"train_loss": -23.296117782592773, "global_step": 166844, "epoch": 2010} {"train_loss": -23.935001373291016, "global_step": 166845, "epoch": 2010} {"train_loss": -24.065967559814453, "global_step": 166846, "epoch": 2010} {"train_loss": -23.853431701660156, "global_step": 166847, "epoch": 2010} {"train_loss": -23.579797744750977, "global_step": 166848, "epoch": 2010} {"train_loss": -23.428634643554688, "global_step": 166849, "epoch": 2010} {"train_loss": -23.51268196105957, "global_step": 166850, "epoch": 2010} {"train_loss": -23.36450958251953, "global_step": 166851, "epoch": 2010} {"train_loss": -23.336233139038086, "global_step": 166852, "epoch": 2010} {"train_loss": -23.47165870666504, "global_step": 166853, "epoch": 2010} {"train_loss": -23.476194381713867, "global_step": 166854, "epoch": 2010} {"train_loss": -23.495397567749023, "global_step": 166855, "epoch": 2010} {"train_loss": -23.660200119018555, "global_step": 166856, "epoch": 2010} {"train_loss": -23.418333053588867, "global_step": 166857, "epoch": 2010} {"train_loss": -23.654237747192383, "global_step": 166858, "epoch": 2010} {"train_loss": -23.124475479125977, "global_step": 166859, "epoch": 2010} {"train_loss": -23.415056228637695, "global_step": 166860, "epoch": 2010} {"train_loss": -23.762296676635742, "global_step": 166861, "epoch": 2010} {"train_loss": -23.90754508972168, "global_step": 166862, "epoch": 2010} {"train_loss": -23.52174949645996, "global_step": 166863, "epoch": 2010} {"train_loss": -23.43088722229004, "global_step": 166864, "epoch": 2010} {"train_loss": -23.778730392456055, "global_step": 166865, "epoch": 2010} {"train_loss": -23.670942306518555, "global_step": 166866, "epoch": 2010} {"train_loss": -23.54522132873535, "global_step": 166867, "epoch": 2010} {"train_loss": -23.944351196289062, "global_step": 166868, "epoch": 2010} {"train_loss": -23.854337692260742, "global_step": 166869, "epoch": 2010} {"train_loss": -23.108491897583008, "global_step": 166870, "epoch": 2010} {"train_loss": -23.772184371948242, "global_step": 166871, "epoch": 2010} {"train_loss": -23.560434341430664, "global_step": 166872, "epoch": 2010} {"train_loss": -23.977710723876953, "global_step": 166873, "epoch": 2010} {"train_loss": -23.300222396850586, "global_step": 166874, "epoch": 2010} {"train_loss": -23.651533126831055, "global_step": 166875, "epoch": 2010} {"train_loss": -23.7924861907959, "global_step": 166876, "epoch": 2010} {"train_loss": -23.806299209594727, "global_step": 166877, "epoch": 2010} {"train_loss": -23.904691696166992, "global_step": 166878, "epoch": 2010} {"train_loss": -23.564041137695312, "global_step": 166879, "epoch": 2010} {"train_loss": -23.34671974182129, "global_step": 166880, "epoch": 2010} {"train_loss": -23.396493911743164, "global_step": 166881, "epoch": 2010} {"train_loss": -23.540077209472656, "global_step": 166882, "epoch": 2010} {"train_loss": -23.35639190673828, "global_step": 166883, "epoch": 2010} {"train_loss": -23.61289405822754, "global_step": 166884, "epoch": 2010} {"train_loss": -23.712385177612305, "global_step": 166885, "epoch": 2010} {"train_loss": -23.60767936706543, "global_step": 166886, "epoch": 2010} {"train_loss": -24.038915634155273, "global_step": 166887, "epoch": 2010} {"train_loss": -23.74549674987793, "global_step": 166888, "epoch": 2010} {"train_loss": -23.4502010345459, "global_step": 166889, "epoch": 2010} {"train_loss": -23.280128479003906, "global_step": 166890, "epoch": 2010} {"train_loss": -23.608341217041016, "global_step": 166891, "epoch": 2010} {"train_loss": -23.853809356689453, "global_step": 166892, "epoch": 2010} {"train_loss": -23.76382827758789, "global_step": 166893, "epoch": 2010} {"train_loss": -23.444934844970703, "global_step": 166894, "epoch": 2010} {"train_loss": -23.49889373779297, "global_step": 166895, "epoch": 2010} {"train_loss": -23.494476318359375, "global_step": 166896, "epoch": 2010} {"train_loss": -23.845901489257812, "global_step": 166897, "epoch": 2010} {"train_loss": -23.524824142456055, "global_step": 166898, "epoch": 2010} {"train_loss": -23.844999313354492, "global_step": 166899, "epoch": 2010} {"train_loss": -23.386112213134766, "global_step": 166900, "epoch": 2010} {"train_loss": -23.599037170410156, "global_step": 166901, "epoch": 2010} {"train_loss": -23.79315185546875, "global_step": 166902, "epoch": 2010} {"train_loss": -23.734556198120117, "global_step": 166903, "epoch": 2010} {"train_loss": -23.5631103515625, "global_step": 166904, "epoch": 2010} {"train_loss": -23.746809005737305, "global_step": 166905, "epoch": 2010} {"train_loss": -23.47315788269043, "global_step": 166906, "epoch": 2010} {"train_loss": -23.20684814453125, "global_step": 166907, "epoch": 2010} {"train_loss": -23.41714859008789, "global_step": 166908, "epoch": 2010} {"train_loss": -23.420856475830078, "global_step": 166909, "epoch": 2010} {"train_loss": -23.757572174072266, "global_step": 166910, "epoch": 2010} {"train_loss": -23.761255264282227, "global_step": 166911, "epoch": 2010} {"train_loss": -23.57734765202166, "global_step": 166912, "epoch": 2010, "val_loss": 6312359.5} {"train_loss": -23.66495132446289, "global_step": 166913, "epoch": 2011} {"train_loss": -23.172122955322266, "global_step": 166914, "epoch": 2011} {"train_loss": -23.403038024902344, "global_step": 166915, "epoch": 2011} {"train_loss": -23.40934181213379, "global_step": 166916, "epoch": 2011} {"train_loss": -23.439382553100586, "global_step": 166917, "epoch": 2011} {"train_loss": -23.180240631103516, "global_step": 166918, "epoch": 2011} {"train_loss": -23.550216674804688, "global_step": 166919, "epoch": 2011} {"train_loss": -23.06863784790039, "global_step": 166920, "epoch": 2011} {"train_loss": -23.504831314086914, "global_step": 166921, "epoch": 2011} {"train_loss": -23.3944149017334, "global_step": 166922, "epoch": 2011} {"train_loss": -23.281864166259766, "global_step": 166923, "epoch": 2011} {"train_loss": -23.262821197509766, "global_step": 166924, "epoch": 2011} {"train_loss": -23.713119506835938, "global_step": 166925, "epoch": 2011} {"train_loss": -23.437307357788086, "global_step": 166926, "epoch": 2011} {"train_loss": -23.422910690307617, "global_step": 166927, "epoch": 2011} {"train_loss": -23.035078048706055, "global_step": 166928, "epoch": 2011} {"train_loss": -23.743337631225586, "global_step": 166929, "epoch": 2011} {"train_loss": -23.416749954223633, "global_step": 166930, "epoch": 2011} {"train_loss": -23.408428192138672, "global_step": 166931, "epoch": 2011} {"train_loss": -23.505481719970703, "global_step": 166932, "epoch": 2011} {"train_loss": -23.328201293945312, "global_step": 166933, "epoch": 2011} {"train_loss": -23.478870391845703, "global_step": 166934, "epoch": 2011} {"train_loss": -23.228235244750977, "global_step": 166935, "epoch": 2011} {"train_loss": -23.667343139648438, "global_step": 166936, "epoch": 2011} {"train_loss": -23.52850341796875, "global_step": 166937, "epoch": 2011} {"train_loss": -23.35371971130371, "global_step": 166938, "epoch": 2011} {"train_loss": -23.48120880126953, "global_step": 166939, "epoch": 2011} {"train_loss": -23.551998138427734, "global_step": 166940, "epoch": 2011} {"train_loss": -23.780380249023438, "global_step": 166941, "epoch": 2011} {"train_loss": -23.115060806274414, "global_step": 166942, "epoch": 2011} {"train_loss": -23.202695846557617, "global_step": 166943, "epoch": 2011} {"train_loss": -23.632617950439453, "global_step": 166944, "epoch": 2011} {"train_loss": -23.620580673217773, "global_step": 166945, "epoch": 2011} {"train_loss": -23.192060470581055, "global_step": 166946, "epoch": 2011} {"train_loss": -23.768692016601562, "global_step": 166947, "epoch": 2011} {"train_loss": -23.4964656829834, "global_step": 166948, "epoch": 2011} {"train_loss": -23.752304077148438, "global_step": 166949, "epoch": 2011} {"train_loss": -23.786376953125, "global_step": 166950, "epoch": 2011} {"train_loss": -23.327239990234375, "global_step": 166951, "epoch": 2011} {"train_loss": -24.012310028076172, "global_step": 166952, "epoch": 2011} {"train_loss": -23.9614200592041, "global_step": 166953, "epoch": 2011} {"train_loss": -24.045156478881836, "global_step": 166954, "epoch": 2011} {"train_loss": -23.59222412109375, "global_step": 166955, "epoch": 2011} {"train_loss": -23.46044158935547, "global_step": 166956, "epoch": 2011} {"train_loss": -23.461271286010742, "global_step": 166957, "epoch": 2011} {"train_loss": -23.370527267456055, "global_step": 166958, "epoch": 2011} {"train_loss": -23.119070053100586, "global_step": 166959, "epoch": 2011} {"train_loss": -23.211591720581055, "global_step": 166960, "epoch": 2011} {"train_loss": -22.87247657775879, "global_step": 166961, "epoch": 2011} {"train_loss": -23.626972198486328, "global_step": 166962, "epoch": 2011} {"train_loss": -23.517425537109375, "global_step": 166963, "epoch": 2011} {"train_loss": -23.227096557617188, "global_step": 166964, "epoch": 2011} {"train_loss": -23.180418014526367, "global_step": 166965, "epoch": 2011} {"train_loss": -23.12428855895996, "global_step": 166966, "epoch": 2011} {"train_loss": -23.616191864013672, "global_step": 166967, "epoch": 2011} {"train_loss": -23.43743896484375, "global_step": 166968, "epoch": 2011} {"train_loss": -23.869491577148438, "global_step": 166969, "epoch": 2011} {"train_loss": -23.41805076599121, "global_step": 166970, "epoch": 2011} {"train_loss": -23.532846450805664, "global_step": 166971, "epoch": 2011} {"train_loss": -23.352357864379883, "global_step": 166972, "epoch": 2011} {"train_loss": -23.33009910583496, "global_step": 166973, "epoch": 2011} {"train_loss": -23.709686279296875, "global_step": 166974, "epoch": 2011} {"train_loss": -23.227445602416992, "global_step": 166975, "epoch": 2011} {"train_loss": -23.736604690551758, "global_step": 166976, "epoch": 2011} {"train_loss": -23.296430587768555, "global_step": 166977, "epoch": 2011} {"train_loss": -23.620065689086914, "global_step": 166978, "epoch": 2011} {"train_loss": -23.99161720275879, "global_step": 166979, "epoch": 2011} {"train_loss": -23.720914840698242, "global_step": 166980, "epoch": 2011} {"train_loss": -23.846878051757812, "global_step": 166981, "epoch": 2011} {"train_loss": -23.425302505493164, "global_step": 166982, "epoch": 2011} {"train_loss": -23.990154266357422, "global_step": 166983, "epoch": 2011} {"train_loss": -23.657514572143555, "global_step": 166984, "epoch": 2011} {"train_loss": -23.819440841674805, "global_step": 166985, "epoch": 2011} {"train_loss": -23.934572219848633, "global_step": 166986, "epoch": 2011} {"train_loss": -23.224210739135742, "global_step": 166987, "epoch": 2011} {"train_loss": -23.46282386779785, "global_step": 166988, "epoch": 2011} {"train_loss": -23.89836311340332, "global_step": 166989, "epoch": 2011} {"train_loss": -23.530677795410156, "global_step": 166990, "epoch": 2011} {"train_loss": -23.7795467376709, "global_step": 166991, "epoch": 2011} {"train_loss": -24.038925170898438, "global_step": 166992, "epoch": 2011} {"train_loss": -23.643369674682617, "global_step": 166993, "epoch": 2011} {"train_loss": -23.908849716186523, "global_step": 166994, "epoch": 2011} {"train_loss": -23.527016926960773, "global_step": 166995, "epoch": 2011, "val_loss": 6294112.0} {"train_loss": -22.300281524658203, "global_step": 166996, "epoch": 2012} {"train_loss": -22.786832809448242, "global_step": 166997, "epoch": 2012} {"train_loss": -22.325658798217773, "global_step": 166998, "epoch": 2012} {"train_loss": -22.53499412536621, "global_step": 166999, "epoch": 2012} {"train_loss": -22.310733795166016, "global_step": 167000, "epoch": 2012} {"train_loss": -22.923723220825195, "global_step": 167001, "epoch": 2012} {"train_loss": -22.66065788269043, "global_step": 167002, "epoch": 2012} {"train_loss": -23.0668888092041, "global_step": 167003, "epoch": 2012} {"train_loss": -22.962209701538086, "global_step": 167004, "epoch": 2012} {"train_loss": -22.88585662841797, "global_step": 167005, "epoch": 2012} {"train_loss": -23.122756958007812, "global_step": 167006, "epoch": 2012} {"train_loss": -23.030872344970703, "global_step": 167007, "epoch": 2012} {"train_loss": -22.715957641601562, "global_step": 167008, "epoch": 2012} {"train_loss": -23.15812110900879, "global_step": 167009, "epoch": 2012} {"train_loss": -22.94400978088379, "global_step": 167010, "epoch": 2012} {"train_loss": -22.91004753112793, "global_step": 167011, "epoch": 2012} {"train_loss": -23.22045135498047, "global_step": 167012, "epoch": 2012} {"train_loss": -23.18243980407715, "global_step": 167013, "epoch": 2012} {"train_loss": -23.384986877441406, "global_step": 167014, "epoch": 2012} {"train_loss": -23.50953483581543, "global_step": 167015, "epoch": 2012} {"train_loss": -23.473939895629883, "global_step": 167016, "epoch": 2012} {"train_loss": -23.309154510498047, "global_step": 167017, "epoch": 2012} {"train_loss": -23.481050491333008, "global_step": 167018, "epoch": 2012} {"train_loss": -23.46845817565918, "global_step": 167019, "epoch": 2012} {"train_loss": -22.95634651184082, "global_step": 167020, "epoch": 2012} {"train_loss": -23.600528717041016, "global_step": 167021, "epoch": 2012} {"train_loss": -23.512130737304688, "global_step": 167022, "epoch": 2012} {"train_loss": -23.55204200744629, "global_step": 167023, "epoch": 2012} {"train_loss": -23.43883514404297, "global_step": 167024, "epoch": 2012} {"train_loss": -23.645273208618164, "global_step": 167025, "epoch": 2012} {"train_loss": -23.434919357299805, "global_step": 167026, "epoch": 2012} {"train_loss": -23.690038681030273, "global_step": 167027, "epoch": 2012} {"train_loss": -23.6214542388916, "global_step": 167028, "epoch": 2012} {"train_loss": -23.50203514099121, "global_step": 167029, "epoch": 2012} {"train_loss": -23.611425399780273, "global_step": 167030, "epoch": 2012} {"train_loss": -23.577423095703125, "global_step": 167031, "epoch": 2012} {"train_loss": -23.418668746948242, "global_step": 167032, "epoch": 2012} {"train_loss": -23.651182174682617, "global_step": 167033, "epoch": 2012} {"train_loss": -23.970184326171875, "global_step": 167034, "epoch": 2012} {"train_loss": -23.594690322875977, "global_step": 167035, "epoch": 2012} {"train_loss": -24.01272201538086, "global_step": 167036, "epoch": 2012} {"train_loss": -23.849313735961914, "global_step": 167037, "epoch": 2012} {"train_loss": -23.695676803588867, "global_step": 167038, "epoch": 2012} {"train_loss": -23.519777297973633, "global_step": 167039, "epoch": 2012} {"train_loss": -23.59602928161621, "global_step": 167040, "epoch": 2012} {"train_loss": -23.46921730041504, "global_step": 167041, "epoch": 2012} {"train_loss": -23.857725143432617, "global_step": 167042, "epoch": 2012} {"train_loss": -23.65940284729004, "global_step": 167043, "epoch": 2012} {"train_loss": -23.65937042236328, "global_step": 167044, "epoch": 2012} {"train_loss": -23.712663650512695, "global_step": 167045, "epoch": 2012} {"train_loss": -23.771066665649414, "global_step": 167046, "epoch": 2012} {"train_loss": -23.629440307617188, "global_step": 167047, "epoch": 2012} {"train_loss": -23.65606117248535, "global_step": 167048, "epoch": 2012} {"train_loss": -23.655826568603516, "global_step": 167049, "epoch": 2012} {"train_loss": -24.128482818603516, "global_step": 167050, "epoch": 2012} {"train_loss": -23.466938018798828, "global_step": 167051, "epoch": 2012} {"train_loss": -23.70413589477539, "global_step": 167052, "epoch": 2012} {"train_loss": -23.39589500427246, "global_step": 167053, "epoch": 2012} {"train_loss": -23.34876823425293, "global_step": 167054, "epoch": 2012} {"train_loss": -23.438369750976562, "global_step": 167055, "epoch": 2012} {"train_loss": -23.60399627685547, "global_step": 167056, "epoch": 2012} {"train_loss": -24.005512237548828, "global_step": 167057, "epoch": 2012} {"train_loss": -24.113046646118164, "global_step": 167058, "epoch": 2012} {"train_loss": -23.808509826660156, "global_step": 167059, "epoch": 2012} {"train_loss": -23.743553161621094, "global_step": 167060, "epoch": 2012} {"train_loss": -23.45223617553711, "global_step": 167061, "epoch": 2012} {"train_loss": -23.38054847717285, "global_step": 167062, "epoch": 2012} {"train_loss": -23.90829849243164, "global_step": 167063, "epoch": 2012} {"train_loss": -23.472858428955078, "global_step": 167064, "epoch": 2012} {"train_loss": -23.473119735717773, "global_step": 167065, "epoch": 2012} {"train_loss": -23.75581169128418, "global_step": 167066, "epoch": 2012} {"train_loss": -23.479124069213867, "global_step": 167067, "epoch": 2012} {"train_loss": -23.61935806274414, "global_step": 167068, "epoch": 2012} {"train_loss": -23.91320037841797, "global_step": 167069, "epoch": 2012} {"train_loss": -23.643095016479492, "global_step": 167070, "epoch": 2012} {"train_loss": -23.53400230407715, "global_step": 167071, "epoch": 2012} {"train_loss": -23.683433532714844, "global_step": 167072, "epoch": 2012} {"train_loss": -23.511188507080078, "global_step": 167073, "epoch": 2012} {"train_loss": -23.474721908569336, "global_step": 167074, "epoch": 2012} {"train_loss": -23.70379066467285, "global_step": 167075, "epoch": 2012} {"train_loss": -24.33502960205078, "global_step": 167076, "epoch": 2012} {"train_loss": -23.52806282043457, "global_step": 167077, "epoch": 2012} {"train_loss": -23.45713394808482, "global_step": 167078, "epoch": 2012, "val_loss": 6338510.0} {"train_loss": -23.32306480407715, "global_step": 167079, "epoch": 2013} {"train_loss": -23.502920150756836, "global_step": 167080, "epoch": 2013} {"train_loss": -23.60402488708496, "global_step": 167081, "epoch": 2013} {"train_loss": -23.62367057800293, "global_step": 167082, "epoch": 2013} {"train_loss": -23.73130989074707, "global_step": 167083, "epoch": 2013} {"train_loss": -23.6845645904541, "global_step": 167084, "epoch": 2013} {"train_loss": -23.887941360473633, "global_step": 167085, "epoch": 2013} {"train_loss": -23.915407180786133, "global_step": 167086, "epoch": 2013} {"train_loss": -23.323293685913086, "global_step": 167087, "epoch": 2013} {"train_loss": -23.510913848876953, "global_step": 167088, "epoch": 2013} {"train_loss": -23.140888214111328, "global_step": 167089, "epoch": 2013} {"train_loss": -23.400259017944336, "global_step": 167090, "epoch": 2013} {"train_loss": -23.76758575439453, "global_step": 167091, "epoch": 2013} {"train_loss": -23.631399154663086, "global_step": 167092, "epoch": 2013} {"train_loss": -23.35177993774414, "global_step": 167093, "epoch": 2013} {"train_loss": -23.701536178588867, "global_step": 167094, "epoch": 2013} {"train_loss": -23.582427978515625, "global_step": 167095, "epoch": 2013} {"train_loss": -23.647140502929688, "global_step": 167096, "epoch": 2013} {"train_loss": -23.988637924194336, "global_step": 167097, "epoch": 2013} {"train_loss": -23.935766220092773, "global_step": 167098, "epoch": 2013} {"train_loss": -23.655385971069336, "global_step": 167099, "epoch": 2013} {"train_loss": -23.631549835205078, "global_step": 167100, "epoch": 2013} {"train_loss": -23.500226974487305, "global_step": 167101, "epoch": 2013} {"train_loss": -23.608570098876953, "global_step": 167102, "epoch": 2013} {"train_loss": -23.82386016845703, "global_step": 167103, "epoch": 2013} {"train_loss": -24.05741310119629, "global_step": 167104, "epoch": 2013} {"train_loss": -23.255308151245117, "global_step": 167105, "epoch": 2013} {"train_loss": -23.676992416381836, "global_step": 167106, "epoch": 2013} {"train_loss": -23.908605575561523, "global_step": 167107, "epoch": 2013} {"train_loss": -23.79859161376953, "global_step": 167108, "epoch": 2013} {"train_loss": -23.864526748657227, "global_step": 167109, "epoch": 2013} {"train_loss": -23.511173248291016, "global_step": 167110, "epoch": 2013} {"train_loss": -23.602975845336914, "global_step": 167111, "epoch": 2013} {"train_loss": -23.661624908447266, "global_step": 167112, "epoch": 2013} {"train_loss": -23.6038875579834, "global_step": 167113, "epoch": 2013} {"train_loss": -23.552297592163086, "global_step": 167114, "epoch": 2013} {"train_loss": -23.62969970703125, "global_step": 167115, "epoch": 2013} {"train_loss": -23.866132736206055, "global_step": 167116, "epoch": 2013} {"train_loss": -23.925758361816406, "global_step": 167117, "epoch": 2013} {"train_loss": -23.697824478149414, "global_step": 167118, "epoch": 2013} {"train_loss": -23.827566146850586, "global_step": 167119, "epoch": 2013} {"train_loss": -23.61602783203125, "global_step": 167120, "epoch": 2013} {"train_loss": -23.93120765686035, "global_step": 167121, "epoch": 2013} {"train_loss": -24.002065658569336, "global_step": 167122, "epoch": 2013} {"train_loss": -23.531875610351562, "global_step": 167123, "epoch": 2013} {"train_loss": -23.730228424072266, "global_step": 167124, "epoch": 2013} {"train_loss": -24.127792358398438, "global_step": 167125, "epoch": 2013} {"train_loss": -23.376741409301758, "global_step": 167126, "epoch": 2013} {"train_loss": -23.914264678955078, "global_step": 167127, "epoch": 2013} {"train_loss": -23.495849609375, "global_step": 167128, "epoch": 2013} {"train_loss": -23.520164489746094, "global_step": 167129, "epoch": 2013} {"train_loss": -23.816219329833984, "global_step": 167130, "epoch": 2013} {"train_loss": -23.846105575561523, "global_step": 167131, "epoch": 2013} {"train_loss": -23.084861755371094, "global_step": 167132, "epoch": 2013} {"train_loss": -23.661115646362305, "global_step": 167133, "epoch": 2013} {"train_loss": -23.930543899536133, "global_step": 167134, "epoch": 2013} {"train_loss": -23.273590087890625, "global_step": 167135, "epoch": 2013} {"train_loss": -23.752132415771484, "global_step": 167136, "epoch": 2013} {"train_loss": -23.8267765045166, "global_step": 167137, "epoch": 2013} {"train_loss": -23.911802291870117, "global_step": 167138, "epoch": 2013} {"train_loss": -23.827882766723633, "global_step": 167139, "epoch": 2013} {"train_loss": -24.12483787536621, "global_step": 167140, "epoch": 2013} {"train_loss": -23.65806007385254, "global_step": 167141, "epoch": 2013} {"train_loss": -23.525054931640625, "global_step": 167142, "epoch": 2013} {"train_loss": -23.730083465576172, "global_step": 167143, "epoch": 2013} {"train_loss": -23.897565841674805, "global_step": 167144, "epoch": 2013} {"train_loss": -23.764677047729492, "global_step": 167145, "epoch": 2013} {"train_loss": -23.782011032104492, "global_step": 167146, "epoch": 2013} {"train_loss": -23.716262817382812, "global_step": 167147, "epoch": 2013} {"train_loss": -24.0048885345459, "global_step": 167148, "epoch": 2013} {"train_loss": -23.81500816345215, "global_step": 167149, "epoch": 2013} {"train_loss": -23.784297943115234, "global_step": 167150, "epoch": 2013} {"train_loss": -23.82551383972168, "global_step": 167151, "epoch": 2013} {"train_loss": -23.710708618164062, "global_step": 167152, "epoch": 2013} {"train_loss": -23.45838165283203, "global_step": 167153, "epoch": 2013} {"train_loss": -23.7833251953125, "global_step": 167154, "epoch": 2013} {"train_loss": -23.8819522857666, "global_step": 167155, "epoch": 2013} {"train_loss": -23.626081466674805, "global_step": 167156, "epoch": 2013} {"train_loss": -23.60502052307129, "global_step": 167157, "epoch": 2013} {"train_loss": -23.500476837158203, "global_step": 167158, "epoch": 2013} {"train_loss": -23.461074829101562, "global_step": 167159, "epoch": 2013} {"train_loss": -23.545804977416992, "global_step": 167160, "epoch": 2013} {"train_loss": -23.667735570884613, "global_step": 167161, "epoch": 2013, "val_loss": 6364890.0} {"train_loss": -23.27690887451172, "global_step": 167162, "epoch": 2014} {"train_loss": -23.21959686279297, "global_step": 167163, "epoch": 2014} {"train_loss": -23.55600357055664, "global_step": 167164, "epoch": 2014} {"train_loss": -22.751487731933594, "global_step": 167165, "epoch": 2014} {"train_loss": -23.27602195739746, "global_step": 167166, "epoch": 2014} {"train_loss": -23.171735763549805, "global_step": 167167, "epoch": 2014} {"train_loss": -23.378299713134766, "global_step": 167168, "epoch": 2014} {"train_loss": -23.308500289916992, "global_step": 167169, "epoch": 2014} {"train_loss": -23.00113868713379, "global_step": 167170, "epoch": 2014} {"train_loss": -23.065221786499023, "global_step": 167171, "epoch": 2014} {"train_loss": -23.372175216674805, "global_step": 167172, "epoch": 2014} {"train_loss": -23.50211524963379, "global_step": 167173, "epoch": 2014} {"train_loss": -23.41485595703125, "global_step": 167174, "epoch": 2014} {"train_loss": -23.23468017578125, "global_step": 167175, "epoch": 2014} {"train_loss": -23.46473503112793, "global_step": 167176, "epoch": 2014} {"train_loss": -23.238632202148438, "global_step": 167177, "epoch": 2014} {"train_loss": -23.224536895751953, "global_step": 167178, "epoch": 2014} {"train_loss": -23.616926193237305, "global_step": 167179, "epoch": 2014} {"train_loss": -23.4365291595459, "global_step": 167180, "epoch": 2014} {"train_loss": -23.21622085571289, "global_step": 167181, "epoch": 2014} {"train_loss": -23.378908157348633, "global_step": 167182, "epoch": 2014} {"train_loss": -23.474485397338867, "global_step": 167183, "epoch": 2014} {"train_loss": -23.298147201538086, "global_step": 167184, "epoch": 2014} {"train_loss": -23.497516632080078, "global_step": 167185, "epoch": 2014} {"train_loss": -23.60474395751953, "global_step": 167186, "epoch": 2014} {"train_loss": -23.459978103637695, "global_step": 167187, "epoch": 2014} {"train_loss": -23.871261596679688, "global_step": 167188, "epoch": 2014} {"train_loss": -23.591928482055664, "global_step": 167189, "epoch": 2014} {"train_loss": -23.40721893310547, "global_step": 167190, "epoch": 2014} {"train_loss": -23.774442672729492, "global_step": 167191, "epoch": 2014} {"train_loss": -23.72187042236328, "global_step": 167192, "epoch": 2014} {"train_loss": -23.377601623535156, "global_step": 167193, "epoch": 2014} {"train_loss": -23.54572105407715, "global_step": 167194, "epoch": 2014} {"train_loss": -23.53306007385254, "global_step": 167195, "epoch": 2014} {"train_loss": -23.843843460083008, "global_step": 167196, "epoch": 2014} {"train_loss": -23.532495498657227, "global_step": 167197, "epoch": 2014} {"train_loss": -23.41014289855957, "global_step": 167198, "epoch": 2014} {"train_loss": -23.636959075927734, "global_step": 167199, "epoch": 2014} {"train_loss": -23.947736740112305, "global_step": 167200, "epoch": 2014} {"train_loss": -23.370132446289062, "global_step": 167201, "epoch": 2014} {"train_loss": -23.80190086364746, "global_step": 167202, "epoch": 2014} {"train_loss": -23.599185943603516, "global_step": 167203, "epoch": 2014} {"train_loss": -23.70766258239746, "global_step": 167204, "epoch": 2014} {"train_loss": -23.393924713134766, "global_step": 167205, "epoch": 2014} {"train_loss": -23.577913284301758, "global_step": 167206, "epoch": 2014} {"train_loss": -23.796550750732422, "global_step": 167207, "epoch": 2014} {"train_loss": -24.069419860839844, "global_step": 167208, "epoch": 2014} {"train_loss": -23.886545181274414, "global_step": 167209, "epoch": 2014} {"train_loss": -23.416324615478516, "global_step": 167210, "epoch": 2014} {"train_loss": -23.529245376586914, "global_step": 167211, "epoch": 2014} {"train_loss": -23.717905044555664, "global_step": 167212, "epoch": 2014} {"train_loss": -23.216501235961914, "global_step": 167213, "epoch": 2014} {"train_loss": -24.0231990814209, "global_step": 167214, "epoch": 2014} {"train_loss": -23.58841896057129, "global_step": 167215, "epoch": 2014} {"train_loss": -23.521289825439453, "global_step": 167216, "epoch": 2014} {"train_loss": -23.671890258789062, "global_step": 167217, "epoch": 2014} {"train_loss": -23.625513076782227, "global_step": 167218, "epoch": 2014} {"train_loss": -23.363819122314453, "global_step": 167219, "epoch": 2014} {"train_loss": -23.485689163208008, "global_step": 167220, "epoch": 2014} {"train_loss": -24.05473518371582, "global_step": 167221, "epoch": 2014} {"train_loss": -23.709468841552734, "global_step": 167222, "epoch": 2014} {"train_loss": -24.132097244262695, "global_step": 167223, "epoch": 2014} {"train_loss": -23.910795211791992, "global_step": 167224, "epoch": 2014} {"train_loss": -23.570537567138672, "global_step": 167225, "epoch": 2014} {"train_loss": -23.640291213989258, "global_step": 167226, "epoch": 2014} {"train_loss": -23.91929054260254, "global_step": 167227, "epoch": 2014} {"train_loss": -23.548765182495117, "global_step": 167228, "epoch": 2014} {"train_loss": -23.846927642822266, "global_step": 167229, "epoch": 2014} {"train_loss": -24.13679313659668, "global_step": 167230, "epoch": 2014} {"train_loss": -23.977060317993164, "global_step": 167231, "epoch": 2014} {"train_loss": -23.543537139892578, "global_step": 167232, "epoch": 2014} {"train_loss": -23.375669479370117, "global_step": 167233, "epoch": 2014} {"train_loss": -23.872873306274414, "global_step": 167234, "epoch": 2014} {"train_loss": -23.952363967895508, "global_step": 167235, "epoch": 2014} {"train_loss": -23.796213150024414, "global_step": 167236, "epoch": 2014} {"train_loss": -23.90838050842285, "global_step": 167237, "epoch": 2014} {"train_loss": -23.919233322143555, "global_step": 167238, "epoch": 2014} {"train_loss": -23.7393856048584, "global_step": 167239, "epoch": 2014} {"train_loss": -23.722270965576172, "global_step": 167240, "epoch": 2014} {"train_loss": -23.758289337158203, "global_step": 167241, "epoch": 2014} {"train_loss": -23.37980842590332, "global_step": 167242, "epoch": 2014} {"train_loss": -23.882980346679688, "global_step": 167243, "epoch": 2014} {"train_loss": -23.586113228855364, "global_step": 167244, "epoch": 2014, "val_loss": 6505030.0} {"train_loss": -22.845706939697266, "global_step": 167245, "epoch": 2015} {"train_loss": -23.154409408569336, "global_step": 167246, "epoch": 2015} {"train_loss": -22.912918090820312, "global_step": 167247, "epoch": 2015} {"train_loss": -22.651857376098633, "global_step": 167248, "epoch": 2015} {"train_loss": -22.832571029663086, "global_step": 167249, "epoch": 2015} {"train_loss": -22.94976806640625, "global_step": 167250, "epoch": 2015} {"train_loss": -23.19046974182129, "global_step": 167251, "epoch": 2015} {"train_loss": -23.067625045776367, "global_step": 167252, "epoch": 2015} {"train_loss": -22.999189376831055, "global_step": 167253, "epoch": 2015} {"train_loss": -23.38312339782715, "global_step": 167254, "epoch": 2015} {"train_loss": -23.692947387695312, "global_step": 167255, "epoch": 2015} {"train_loss": -23.21494483947754, "global_step": 167256, "epoch": 2015} {"train_loss": -23.31509780883789, "global_step": 167257, "epoch": 2015} {"train_loss": -23.55796241760254, "global_step": 167258, "epoch": 2015} {"train_loss": -23.39627456665039, "global_step": 167259, "epoch": 2015} {"train_loss": -23.346389770507812, "global_step": 167260, "epoch": 2015} {"train_loss": -23.45881462097168, "global_step": 167261, "epoch": 2015} {"train_loss": -23.328670501708984, "global_step": 167262, "epoch": 2015} {"train_loss": -23.869850158691406, "global_step": 167263, "epoch": 2015} {"train_loss": -23.31612205505371, "global_step": 167264, "epoch": 2015} {"train_loss": -23.612682342529297, "global_step": 167265, "epoch": 2015} {"train_loss": -23.597753524780273, "global_step": 167266, "epoch": 2015} {"train_loss": -23.474960327148438, "global_step": 167267, "epoch": 2015} {"train_loss": -23.67759895324707, "global_step": 167268, "epoch": 2015} {"train_loss": -23.766050338745117, "global_step": 167269, "epoch": 2015} {"train_loss": -23.805967330932617, "global_step": 167270, "epoch": 2015} {"train_loss": -23.709228515625, "global_step": 167271, "epoch": 2015} {"train_loss": -23.592687606811523, "global_step": 167272, "epoch": 2015} {"train_loss": -23.83426856994629, "global_step": 167273, "epoch": 2015} {"train_loss": -23.52463150024414, "global_step": 167274, "epoch": 2015} {"train_loss": -23.440956115722656, "global_step": 167275, "epoch": 2015} {"train_loss": -23.675636291503906, "global_step": 167276, "epoch": 2015} {"train_loss": -23.817609786987305, "global_step": 167277, "epoch": 2015} {"train_loss": -23.588729858398438, "global_step": 167278, "epoch": 2015} {"train_loss": -23.740243911743164, "global_step": 167279, "epoch": 2015} {"train_loss": -23.7106990814209, "global_step": 167280, "epoch": 2015} {"train_loss": -23.983049392700195, "global_step": 167281, "epoch": 2015} {"train_loss": -23.440526962280273, "global_step": 167282, "epoch": 2015} {"train_loss": -23.75902557373047, "global_step": 167283, "epoch": 2015} {"train_loss": -24.040973663330078, "global_step": 167284, "epoch": 2015} {"train_loss": -24.00581932067871, "global_step": 167285, "epoch": 2015} {"train_loss": -23.748035430908203, "global_step": 167286, "epoch": 2015} {"train_loss": -23.511568069458008, "global_step": 167287, "epoch": 2015} {"train_loss": -23.28899574279785, "global_step": 167288, "epoch": 2015} {"train_loss": -23.585378646850586, "global_step": 167289, "epoch": 2015} {"train_loss": -23.840208053588867, "global_step": 167290, "epoch": 2015} {"train_loss": -23.41200065612793, "global_step": 167291, "epoch": 2015} {"train_loss": -23.432785034179688, "global_step": 167292, "epoch": 2015} {"train_loss": -23.4720458984375, "global_step": 167293, "epoch": 2015} {"train_loss": -23.550281524658203, "global_step": 167294, "epoch": 2015} {"train_loss": -23.654821395874023, "global_step": 167295, "epoch": 2015} {"train_loss": -23.54812240600586, "global_step": 167296, "epoch": 2015} {"train_loss": -23.656091690063477, "global_step": 167297, "epoch": 2015} {"train_loss": -23.66071128845215, "global_step": 167298, "epoch": 2015} {"train_loss": -23.23223876953125, "global_step": 167299, "epoch": 2015} {"train_loss": -23.570545196533203, "global_step": 167300, "epoch": 2015} {"train_loss": -23.817760467529297, "global_step": 167301, "epoch": 2015} {"train_loss": -23.49867057800293, "global_step": 167302, "epoch": 2015} {"train_loss": -23.744930267333984, "global_step": 167303, "epoch": 2015} {"train_loss": -23.654661178588867, "global_step": 167304, "epoch": 2015} {"train_loss": -23.61421012878418, "global_step": 167305, "epoch": 2015} {"train_loss": -23.16840171813965, "global_step": 167306, "epoch": 2015} {"train_loss": -23.47035789489746, "global_step": 167307, "epoch": 2015} {"train_loss": -23.95977783203125, "global_step": 167308, "epoch": 2015} {"train_loss": -23.953176498413086, "global_step": 167309, "epoch": 2015} {"train_loss": -23.48725700378418, "global_step": 167310, "epoch": 2015} {"train_loss": -23.700149536132812, "global_step": 167311, "epoch": 2015} {"train_loss": -23.593408584594727, "global_step": 167312, "epoch": 2015} {"train_loss": -23.41657829284668, "global_step": 167313, "epoch": 2015} {"train_loss": -23.638683319091797, "global_step": 167314, "epoch": 2015} {"train_loss": -23.676013946533203, "global_step": 167315, "epoch": 2015} {"train_loss": -23.59945297241211, "global_step": 167316, "epoch": 2015} {"train_loss": -23.64325714111328, "global_step": 167317, "epoch": 2015} {"train_loss": -23.475576400756836, "global_step": 167318, "epoch": 2015} {"train_loss": -23.48169708251953, "global_step": 167319, "epoch": 2015} {"train_loss": -23.647485733032227, "global_step": 167320, "epoch": 2015} {"train_loss": -23.735443115234375, "global_step": 167321, "epoch": 2015} {"train_loss": -23.173980712890625, "global_step": 167322, "epoch": 2015} {"train_loss": -23.858015060424805, "global_step": 167323, "epoch": 2015} {"train_loss": -23.662240982055664, "global_step": 167324, "epoch": 2015} {"train_loss": -23.93965721130371, "global_step": 167325, "epoch": 2015} {"train_loss": -23.805700302124023, "global_step": 167326, "epoch": 2015} {"train_loss": -23.5396894891578, "global_step": 167327, "epoch": 2015, "val_loss": 6357139.0} {"train_loss": -22.933629989624023, "global_step": 167328, "epoch": 2016} {"train_loss": -22.4691219329834, "global_step": 167329, "epoch": 2016} {"train_loss": -23.912513732910156, "global_step": 167330, "epoch": 2016} {"train_loss": -23.289775848388672, "global_step": 167331, "epoch": 2016} {"train_loss": -23.143217086791992, "global_step": 167332, "epoch": 2016} {"train_loss": -23.15015983581543, "global_step": 167333, "epoch": 2016} {"train_loss": -23.067045211791992, "global_step": 167334, "epoch": 2016} {"train_loss": -23.38495445251465, "global_step": 167335, "epoch": 2016} {"train_loss": -23.46843147277832, "global_step": 167336, "epoch": 2016} {"train_loss": -23.6173152923584, "global_step": 167337, "epoch": 2016} {"train_loss": -23.45002555847168, "global_step": 167338, "epoch": 2016} {"train_loss": -23.708576202392578, "global_step": 167339, "epoch": 2016} {"train_loss": -23.500568389892578, "global_step": 167340, "epoch": 2016} {"train_loss": -23.463529586791992, "global_step": 167341, "epoch": 2016} {"train_loss": -23.76328468322754, "global_step": 167342, "epoch": 2016} {"train_loss": -23.399106979370117, "global_step": 167343, "epoch": 2016} {"train_loss": -23.45068359375, "global_step": 167344, "epoch": 2016} {"train_loss": -23.439348220825195, "global_step": 167345, "epoch": 2016} {"train_loss": -23.880373001098633, "global_step": 167346, "epoch": 2016} {"train_loss": -24.138235092163086, "global_step": 167347, "epoch": 2016} {"train_loss": -23.39363670349121, "global_step": 167348, "epoch": 2016} {"train_loss": -23.26885223388672, "global_step": 167349, "epoch": 2016} {"train_loss": -23.82157325744629, "global_step": 167350, "epoch": 2016} {"train_loss": -23.634227752685547, "global_step": 167351, "epoch": 2016} {"train_loss": -23.60328483581543, "global_step": 167352, "epoch": 2016} {"train_loss": -23.811328887939453, "global_step": 167353, "epoch": 2016} {"train_loss": -23.720428466796875, "global_step": 167354, "epoch": 2016} {"train_loss": -23.65899085998535, "global_step": 167355, "epoch": 2016} {"train_loss": -23.640954971313477, "global_step": 167356, "epoch": 2016} {"train_loss": -23.695293426513672, "global_step": 167357, "epoch": 2016} {"train_loss": -23.6990966796875, "global_step": 167358, "epoch": 2016} {"train_loss": -23.556493759155273, "global_step": 167359, "epoch": 2016} {"train_loss": -23.09427833557129, "global_step": 167360, "epoch": 2016} {"train_loss": -23.471586227416992, "global_step": 167361, "epoch": 2016} {"train_loss": -23.96536636352539, "global_step": 167362, "epoch": 2016} {"train_loss": -24.039316177368164, "global_step": 167363, "epoch": 2016} {"train_loss": -23.53642463684082, "global_step": 167364, "epoch": 2016} {"train_loss": -23.53885841369629, "global_step": 167365, "epoch": 2016} {"train_loss": -23.70137596130371, "global_step": 167366, "epoch": 2016} {"train_loss": -23.760343551635742, "global_step": 167367, "epoch": 2016} {"train_loss": -23.583463668823242, "global_step": 167368, "epoch": 2016} {"train_loss": -23.400487899780273, "global_step": 167369, "epoch": 2016} {"train_loss": -23.52337646484375, "global_step": 167370, "epoch": 2016} {"train_loss": -23.642126083374023, "global_step": 167371, "epoch": 2016} {"train_loss": -23.477277755737305, "global_step": 167372, "epoch": 2016} {"train_loss": -23.583158493041992, "global_step": 167373, "epoch": 2016} {"train_loss": -23.623714447021484, "global_step": 167374, "epoch": 2016} {"train_loss": -24.09444236755371, "global_step": 167375, "epoch": 2016} {"train_loss": -23.57686424255371, "global_step": 167376, "epoch": 2016} {"train_loss": -23.58917236328125, "global_step": 167377, "epoch": 2016} {"train_loss": -23.784887313842773, "global_step": 167378, "epoch": 2016} {"train_loss": -24.12099266052246, "global_step": 167379, "epoch": 2016} {"train_loss": -23.6724853515625, "global_step": 167380, "epoch": 2016} {"train_loss": -23.21331787109375, "global_step": 167381, "epoch": 2016} {"train_loss": -23.684425354003906, "global_step": 167382, "epoch": 2016} {"train_loss": -23.764944076538086, "global_step": 167383, "epoch": 2016} {"train_loss": -23.671619415283203, "global_step": 167384, "epoch": 2016} {"train_loss": -23.987455368041992, "global_step": 167385, "epoch": 2016} {"train_loss": -23.714094161987305, "global_step": 167386, "epoch": 2016} {"train_loss": -23.597572326660156, "global_step": 167387, "epoch": 2016} {"train_loss": -23.41602897644043, "global_step": 167388, "epoch": 2016} {"train_loss": -23.234556198120117, "global_step": 167389, "epoch": 2016} {"train_loss": -23.185468673706055, "global_step": 167390, "epoch": 2016} {"train_loss": -23.725431442260742, "global_step": 167391, "epoch": 2016} {"train_loss": -23.699695587158203, "global_step": 167392, "epoch": 2016} {"train_loss": -23.81410789489746, "global_step": 167393, "epoch": 2016} {"train_loss": -23.805118560791016, "global_step": 167394, "epoch": 2016} {"train_loss": -23.8441104888916, "global_step": 167395, "epoch": 2016} {"train_loss": -23.686573028564453, "global_step": 167396, "epoch": 2016} {"train_loss": -23.43501853942871, "global_step": 167397, "epoch": 2016} {"train_loss": -23.7149715423584, "global_step": 167398, "epoch": 2016} {"train_loss": -23.82875633239746, "global_step": 167399, "epoch": 2016} {"train_loss": -23.48940658569336, "global_step": 167400, "epoch": 2016} {"train_loss": -23.933156967163086, "global_step": 167401, "epoch": 2016} {"train_loss": -23.853363037109375, "global_step": 167402, "epoch": 2016} {"train_loss": -23.653345108032227, "global_step": 167403, "epoch": 2016} {"train_loss": -23.4877872467041, "global_step": 167404, "epoch": 2016} {"train_loss": -23.892242431640625, "global_step": 167405, "epoch": 2016} {"train_loss": -23.430734634399414, "global_step": 167406, "epoch": 2016} {"train_loss": -23.669950485229492, "global_step": 167407, "epoch": 2016} {"train_loss": -23.630077362060547, "global_step": 167408, "epoch": 2016} {"train_loss": -23.876195907592773, "global_step": 167409, "epoch": 2016} {"train_loss": -23.616032565932677, "global_step": 167410, "epoch": 2016, "val_loss": 6360908.0} {"train_loss": -23.508895874023438, "global_step": 167411, "epoch": 2017} {"train_loss": -23.037933349609375, "global_step": 167412, "epoch": 2017} {"train_loss": -23.60342788696289, "global_step": 167413, "epoch": 2017} {"train_loss": -23.487159729003906, "global_step": 167414, "epoch": 2017} {"train_loss": -23.4299373626709, "global_step": 167415, "epoch": 2017} {"train_loss": -23.233844757080078, "global_step": 167416, "epoch": 2017} {"train_loss": -23.537307739257812, "global_step": 167417, "epoch": 2017} {"train_loss": -23.769699096679688, "global_step": 167418, "epoch": 2017} {"train_loss": -23.851327896118164, "global_step": 167419, "epoch": 2017} {"train_loss": -24.060564041137695, "global_step": 167420, "epoch": 2017} {"train_loss": -23.235523223876953, "global_step": 167421, "epoch": 2017} {"train_loss": -23.579450607299805, "global_step": 167422, "epoch": 2017} {"train_loss": -23.53118896484375, "global_step": 167423, "epoch": 2017} {"train_loss": -23.779037475585938, "global_step": 167424, "epoch": 2017} {"train_loss": -23.350772857666016, "global_step": 167425, "epoch": 2017} {"train_loss": -23.58261489868164, "global_step": 167426, "epoch": 2017} {"train_loss": -24.05374526977539, "global_step": 167427, "epoch": 2017} {"train_loss": -23.19476890563965, "global_step": 167428, "epoch": 2017} {"train_loss": -23.459653854370117, "global_step": 167429, "epoch": 2017} {"train_loss": -23.538862228393555, "global_step": 167430, "epoch": 2017} {"train_loss": -23.576101303100586, "global_step": 167431, "epoch": 2017} {"train_loss": -23.45857048034668, "global_step": 167432, "epoch": 2017} {"train_loss": -23.30984115600586, "global_step": 167433, "epoch": 2017} {"train_loss": -23.648160934448242, "global_step": 167434, "epoch": 2017} {"train_loss": -23.717063903808594, "global_step": 167435, "epoch": 2017} {"train_loss": -23.490949630737305, "global_step": 167436, "epoch": 2017} {"train_loss": -23.67410659790039, "global_step": 167437, "epoch": 2017} {"train_loss": -23.689977645874023, "global_step": 167438, "epoch": 2017} {"train_loss": -23.51422882080078, "global_step": 167439, "epoch": 2017} {"train_loss": -23.86626625061035, "global_step": 167440, "epoch": 2017} {"train_loss": -23.657014846801758, "global_step": 167441, "epoch": 2017} {"train_loss": -23.69942283630371, "global_step": 167442, "epoch": 2017} {"train_loss": -23.573495864868164, "global_step": 167443, "epoch": 2017} {"train_loss": -23.71697998046875, "global_step": 167444, "epoch": 2017} {"train_loss": -23.718290328979492, "global_step": 167445, "epoch": 2017} {"train_loss": -23.554895401000977, "global_step": 167446, "epoch": 2017} {"train_loss": -23.344730377197266, "global_step": 167447, "epoch": 2017} {"train_loss": -23.98479652404785, "global_step": 167448, "epoch": 2017} {"train_loss": -23.436002731323242, "global_step": 167449, "epoch": 2017} {"train_loss": -23.29050636291504, "global_step": 167450, "epoch": 2017} {"train_loss": -23.518386840820312, "global_step": 167451, "epoch": 2017} {"train_loss": -23.58432960510254, "global_step": 167452, "epoch": 2017} {"train_loss": -23.512283325195312, "global_step": 167453, "epoch": 2017} {"train_loss": -23.748233795166016, "global_step": 167454, "epoch": 2017} {"train_loss": -23.724002838134766, "global_step": 167455, "epoch": 2017} {"train_loss": -23.765897750854492, "global_step": 167456, "epoch": 2017} {"train_loss": -24.01823616027832, "global_step": 167457, "epoch": 2017} {"train_loss": -23.378076553344727, "global_step": 167458, "epoch": 2017} {"train_loss": -23.9502010345459, "global_step": 167459, "epoch": 2017} {"train_loss": -23.703351974487305, "global_step": 167460, "epoch": 2017} {"train_loss": -23.641326904296875, "global_step": 167461, "epoch": 2017} {"train_loss": -23.5380802154541, "global_step": 167462, "epoch": 2017} {"train_loss": -23.690275192260742, "global_step": 167463, "epoch": 2017} {"train_loss": -23.77259063720703, "global_step": 167464, "epoch": 2017} {"train_loss": -23.821317672729492, "global_step": 167465, "epoch": 2017} {"train_loss": -24.126108169555664, "global_step": 167466, "epoch": 2017} {"train_loss": -23.27370262145996, "global_step": 167467, "epoch": 2017} {"train_loss": -23.857044219970703, "global_step": 167468, "epoch": 2017} {"train_loss": -23.48740577697754, "global_step": 167469, "epoch": 2017} {"train_loss": -23.90266990661621, "global_step": 167470, "epoch": 2017} {"train_loss": -23.773727416992188, "global_step": 167471, "epoch": 2017} {"train_loss": -23.746309280395508, "global_step": 167472, "epoch": 2017} {"train_loss": -23.582443237304688, "global_step": 167473, "epoch": 2017} {"train_loss": -23.566329956054688, "global_step": 167474, "epoch": 2017} {"train_loss": -23.786808013916016, "global_step": 167475, "epoch": 2017} {"train_loss": -23.754732131958008, "global_step": 167476, "epoch": 2017} {"train_loss": -23.75788688659668, "global_step": 167477, "epoch": 2017} {"train_loss": -23.412118911743164, "global_step": 167478, "epoch": 2017} {"train_loss": -23.71198844909668, "global_step": 167479, "epoch": 2017} {"train_loss": -23.30319595336914, "global_step": 167480, "epoch": 2017} {"train_loss": -23.436613082885742, "global_step": 167481, "epoch": 2017} {"train_loss": -23.25792121887207, "global_step": 167482, "epoch": 2017} {"train_loss": -23.338287353515625, "global_step": 167483, "epoch": 2017} {"train_loss": -23.78396987915039, "global_step": 167484, "epoch": 2017} {"train_loss": -23.987009048461914, "global_step": 167485, "epoch": 2017} {"train_loss": -23.803010940551758, "global_step": 167486, "epoch": 2017} {"train_loss": -23.791427612304688, "global_step": 167487, "epoch": 2017} {"train_loss": -23.734346389770508, "global_step": 167488, "epoch": 2017} {"train_loss": -23.995859146118164, "global_step": 167489, "epoch": 2017} {"train_loss": -23.784475326538086, "global_step": 167490, "epoch": 2017} {"train_loss": -23.869291305541992, "global_step": 167491, "epoch": 2017} {"train_loss": -23.456892013549805, "global_step": 167492, "epoch": 2017} {"train_loss": -23.63092672968485, "global_step": 167493, "epoch": 2017, "val_loss": 6317434.5} {"train_loss": -23.077655792236328, "global_step": 167494, "epoch": 2018} {"train_loss": -22.92183494567871, "global_step": 167495, "epoch": 2018} {"train_loss": -23.42909812927246, "global_step": 167496, "epoch": 2018} {"train_loss": -23.017349243164062, "global_step": 167497, "epoch": 2018} {"train_loss": -23.4689884185791, "global_step": 167498, "epoch": 2018} {"train_loss": -23.107831954956055, "global_step": 167499, "epoch": 2018} {"train_loss": -23.120182037353516, "global_step": 167500, "epoch": 2018} {"train_loss": -23.39822769165039, "global_step": 167501, "epoch": 2018} {"train_loss": -23.157690048217773, "global_step": 167502, "epoch": 2018} {"train_loss": -23.61836051940918, "global_step": 167503, "epoch": 2018} {"train_loss": -23.550790786743164, "global_step": 167504, "epoch": 2018} {"train_loss": -23.44049835205078, "global_step": 167505, "epoch": 2018} {"train_loss": -23.305540084838867, "global_step": 167506, "epoch": 2018} {"train_loss": -23.399625778198242, "global_step": 167507, "epoch": 2018} {"train_loss": -23.576292037963867, "global_step": 167508, "epoch": 2018} {"train_loss": -23.734617233276367, "global_step": 167509, "epoch": 2018} {"train_loss": -24.213979721069336, "global_step": 167510, "epoch": 2018} {"train_loss": -23.62062644958496, "global_step": 167511, "epoch": 2018} {"train_loss": -23.756866455078125, "global_step": 167512, "epoch": 2018} {"train_loss": -23.56790542602539, "global_step": 167513, "epoch": 2018} {"train_loss": -23.664377212524414, "global_step": 167514, "epoch": 2018} {"train_loss": -23.55988121032715, "global_step": 167515, "epoch": 2018} {"train_loss": -23.506383895874023, "global_step": 167516, "epoch": 2018} {"train_loss": -23.18645668029785, "global_step": 167517, "epoch": 2018} {"train_loss": -23.587352752685547, "global_step": 167518, "epoch": 2018} {"train_loss": -23.7874813079834, "global_step": 167519, "epoch": 2018} {"train_loss": -23.580476760864258, "global_step": 167520, "epoch": 2018} {"train_loss": -23.325345993041992, "global_step": 167521, "epoch": 2018} {"train_loss": -23.875761032104492, "global_step": 167522, "epoch": 2018} {"train_loss": -23.59855079650879, "global_step": 167523, "epoch": 2018} {"train_loss": -23.702688217163086, "global_step": 167524, "epoch": 2018} {"train_loss": -23.32588768005371, "global_step": 167525, "epoch": 2018} {"train_loss": -23.842199325561523, "global_step": 167526, "epoch": 2018} {"train_loss": -23.540616989135742, "global_step": 167527, "epoch": 2018} {"train_loss": -23.420852661132812, "global_step": 167528, "epoch": 2018} {"train_loss": -23.4451847076416, "global_step": 167529, "epoch": 2018} {"train_loss": -23.83979606628418, "global_step": 167530, "epoch": 2018} {"train_loss": -23.22688865661621, "global_step": 167531, "epoch": 2018} {"train_loss": -23.35961151123047, "global_step": 167532, "epoch": 2018} {"train_loss": -23.826396942138672, "global_step": 167533, "epoch": 2018} {"train_loss": -22.92096519470215, "global_step": 167534, "epoch": 2018} {"train_loss": -23.052093505859375, "global_step": 167535, "epoch": 2018} {"train_loss": -23.17460823059082, "global_step": 167536, "epoch": 2018} {"train_loss": -23.629552841186523, "global_step": 167537, "epoch": 2018} {"train_loss": -23.84817886352539, "global_step": 167538, "epoch": 2018} {"train_loss": -23.824247360229492, "global_step": 167539, "epoch": 2018} {"train_loss": -23.655858993530273, "global_step": 167540, "epoch": 2018} {"train_loss": -23.567453384399414, "global_step": 167541, "epoch": 2018} {"train_loss": -23.635656356811523, "global_step": 167542, "epoch": 2018} {"train_loss": -23.872037887573242, "global_step": 167543, "epoch": 2018} {"train_loss": -23.48201560974121, "global_step": 167544, "epoch": 2018} {"train_loss": -23.85963249206543, "global_step": 167545, "epoch": 2018} {"train_loss": -23.279626846313477, "global_step": 167546, "epoch": 2018} {"train_loss": -23.70062255859375, "global_step": 167547, "epoch": 2018} {"train_loss": -23.2542724609375, "global_step": 167548, "epoch": 2018} {"train_loss": -23.52252960205078, "global_step": 167549, "epoch": 2018} {"train_loss": -23.64581298828125, "global_step": 167550, "epoch": 2018} {"train_loss": -23.861783981323242, "global_step": 167551, "epoch": 2018} {"train_loss": -23.885770797729492, "global_step": 167552, "epoch": 2018} {"train_loss": -23.498809814453125, "global_step": 167553, "epoch": 2018} {"train_loss": -23.284008026123047, "global_step": 167554, "epoch": 2018} {"train_loss": -23.429061889648438, "global_step": 167555, "epoch": 2018} {"train_loss": -23.821470260620117, "global_step": 167556, "epoch": 2018} {"train_loss": -23.3479061126709, "global_step": 167557, "epoch": 2018} {"train_loss": -23.741165161132812, "global_step": 167558, "epoch": 2018} {"train_loss": -23.891773223876953, "global_step": 167559, "epoch": 2018} {"train_loss": -23.841815948486328, "global_step": 167560, "epoch": 2018} {"train_loss": -23.540470123291016, "global_step": 167561, "epoch": 2018} {"train_loss": -23.44832420349121, "global_step": 167562, "epoch": 2018} {"train_loss": -23.710969924926758, "global_step": 167563, "epoch": 2018} {"train_loss": -23.778583526611328, "global_step": 167564, "epoch": 2018} {"train_loss": -23.56982421875, "global_step": 167565, "epoch": 2018} {"train_loss": -23.847919464111328, "global_step": 167566, "epoch": 2018} {"train_loss": -23.618412017822266, "global_step": 167567, "epoch": 2018} {"train_loss": -23.449222564697266, "global_step": 167568, "epoch": 2018} {"train_loss": -23.976787567138672, "global_step": 167569, "epoch": 2018} {"train_loss": -23.79213523864746, "global_step": 167570, "epoch": 2018} {"train_loss": -23.772024154663086, "global_step": 167571, "epoch": 2018} {"train_loss": -23.46109390258789, "global_step": 167572, "epoch": 2018} {"train_loss": -23.413389205932617, "global_step": 167573, "epoch": 2018} {"train_loss": -23.474287033081055, "global_step": 167574, "epoch": 2018} {"train_loss": -23.044452667236328, "global_step": 167575, "epoch": 2018} {"train_loss": -23.53016648809594, "global_step": 167576, "epoch": 2018, "val_loss": 6408331.0} {"train_loss": -23.643381118774414, "global_step": 167577, "epoch": 2019} {"train_loss": -22.764986038208008, "global_step": 167578, "epoch": 2019} {"train_loss": -23.38136863708496, "global_step": 167579, "epoch": 2019} {"train_loss": -23.213167190551758, "global_step": 167580, "epoch": 2019} {"train_loss": -23.192806243896484, "global_step": 167581, "epoch": 2019} {"train_loss": -22.836454391479492, "global_step": 167582, "epoch": 2019} {"train_loss": -23.339969635009766, "global_step": 167583, "epoch": 2019} {"train_loss": -23.597137451171875, "global_step": 167584, "epoch": 2019} {"train_loss": -23.851364135742188, "global_step": 167585, "epoch": 2019} {"train_loss": -23.8178768157959, "global_step": 167586, "epoch": 2019} {"train_loss": -23.648576736450195, "global_step": 167587, "epoch": 2019} {"train_loss": -23.678190231323242, "global_step": 167588, "epoch": 2019} {"train_loss": -23.7199764251709, "global_step": 167589, "epoch": 2019} {"train_loss": -23.197465896606445, "global_step": 167590, "epoch": 2019} {"train_loss": -23.677961349487305, "global_step": 167591, "epoch": 2019} {"train_loss": -23.24976921081543, "global_step": 167592, "epoch": 2019} {"train_loss": -23.409460067749023, "global_step": 167593, "epoch": 2019} {"train_loss": -23.46895408630371, "global_step": 167594, "epoch": 2019} {"train_loss": -23.768217086791992, "global_step": 167595, "epoch": 2019} {"train_loss": -23.37942886352539, "global_step": 167596, "epoch": 2019} {"train_loss": -23.67025375366211, "global_step": 167597, "epoch": 2019} {"train_loss": -23.541473388671875, "global_step": 167598, "epoch": 2019} {"train_loss": -23.448394775390625, "global_step": 167599, "epoch": 2019} {"train_loss": -23.58648109436035, "global_step": 167600, "epoch": 2019} {"train_loss": -23.7320613861084, "global_step": 167601, "epoch": 2019} {"train_loss": -23.752653121948242, "global_step": 167602, "epoch": 2019} {"train_loss": -23.629335403442383, "global_step": 167603, "epoch": 2019} {"train_loss": -23.419790267944336, "global_step": 167604, "epoch": 2019} {"train_loss": -23.601953506469727, "global_step": 167605, "epoch": 2019} {"train_loss": -23.50083351135254, "global_step": 167606, "epoch": 2019} {"train_loss": -23.56705665588379, "global_step": 167607, "epoch": 2019} {"train_loss": -23.4661865234375, "global_step": 167608, "epoch": 2019} {"train_loss": -23.56444549560547, "global_step": 167609, "epoch": 2019} {"train_loss": -23.430898666381836, "global_step": 167610, "epoch": 2019} {"train_loss": -23.81585121154785, "global_step": 167611, "epoch": 2019} {"train_loss": -23.47603416442871, "global_step": 167612, "epoch": 2019} {"train_loss": -23.4709415435791, "global_step": 167613, "epoch": 2019} {"train_loss": -23.898677825927734, "global_step": 167614, "epoch": 2019} {"train_loss": -24.06036376953125, "global_step": 167615, "epoch": 2019} {"train_loss": -23.72564697265625, "global_step": 167616, "epoch": 2019} {"train_loss": -23.6663818359375, "global_step": 167617, "epoch": 2019} {"train_loss": -23.599367141723633, "global_step": 167618, "epoch": 2019} {"train_loss": -23.255939483642578, "global_step": 167619, "epoch": 2019} {"train_loss": -23.562931060791016, "global_step": 167620, "epoch": 2019} {"train_loss": -23.72952651977539, "global_step": 167621, "epoch": 2019} {"train_loss": -23.762723922729492, "global_step": 167622, "epoch": 2019} {"train_loss": -23.654556274414062, "global_step": 167623, "epoch": 2019} {"train_loss": -23.637609481811523, "global_step": 167624, "epoch": 2019} {"train_loss": -23.765186309814453, "global_step": 167625, "epoch": 2019} {"train_loss": -23.890745162963867, "global_step": 167626, "epoch": 2019} {"train_loss": -23.3079776763916, "global_step": 167627, "epoch": 2019} {"train_loss": -23.80504608154297, "global_step": 167628, "epoch": 2019} {"train_loss": -23.513051986694336, "global_step": 167629, "epoch": 2019} {"train_loss": -24.06907081604004, "global_step": 167630, "epoch": 2019} {"train_loss": -23.46095085144043, "global_step": 167631, "epoch": 2019} {"train_loss": -23.7177791595459, "global_step": 167632, "epoch": 2019} {"train_loss": -23.67719841003418, "global_step": 167633, "epoch": 2019} {"train_loss": -23.94257164001465, "global_step": 167634, "epoch": 2019} {"train_loss": -23.612201690673828, "global_step": 167635, "epoch": 2019} {"train_loss": -24.016998291015625, "global_step": 167636, "epoch": 2019} {"train_loss": -23.821048736572266, "global_step": 167637, "epoch": 2019} {"train_loss": -23.10092544555664, "global_step": 167638, "epoch": 2019} {"train_loss": -23.496841430664062, "global_step": 167639, "epoch": 2019} {"train_loss": -23.994245529174805, "global_step": 167640, "epoch": 2019} {"train_loss": -23.422067642211914, "global_step": 167641, "epoch": 2019} {"train_loss": -23.464426040649414, "global_step": 167642, "epoch": 2019} {"train_loss": -23.264019012451172, "global_step": 167643, "epoch": 2019} {"train_loss": -23.076465606689453, "global_step": 167644, "epoch": 2019} {"train_loss": -23.779394149780273, "global_step": 167645, "epoch": 2019} {"train_loss": -23.557437896728516, "global_step": 167646, "epoch": 2019} {"train_loss": -23.776626586914062, "global_step": 167647, "epoch": 2019} {"train_loss": -23.664688110351562, "global_step": 167648, "epoch": 2019} {"train_loss": -23.638004302978516, "global_step": 167649, "epoch": 2019} {"train_loss": -23.674945831298828, "global_step": 167650, "epoch": 2019} {"train_loss": -23.640607833862305, "global_step": 167651, "epoch": 2019} {"train_loss": -24.0736083984375, "global_step": 167652, "epoch": 2019} {"train_loss": -23.517255783081055, "global_step": 167653, "epoch": 2019} {"train_loss": -23.76589012145996, "global_step": 167654, "epoch": 2019} {"train_loss": -23.657108306884766, "global_step": 167655, "epoch": 2019} {"train_loss": -23.813562393188477, "global_step": 167656, "epoch": 2019} {"train_loss": -23.170930862426758, "global_step": 167657, "epoch": 2019} {"train_loss": -23.66977310180664, "global_step": 167658, "epoch": 2019} {"train_loss": -23.580827414271344, "global_step": 167659, "epoch": 2019, "val_loss": 6325773.0} {"train_loss": -23.808195114135742, "global_step": 167660, "epoch": 2020} {"train_loss": -23.53388023376465, "global_step": 167661, "epoch": 2020} {"train_loss": -23.313674926757812, "global_step": 167662, "epoch": 2020} {"train_loss": -23.1577091217041, "global_step": 167663, "epoch": 2020} {"train_loss": -23.100248336791992, "global_step": 167664, "epoch": 2020} {"train_loss": -23.310266494750977, "global_step": 167665, "epoch": 2020} {"train_loss": -23.699947357177734, "global_step": 167666, "epoch": 2020} {"train_loss": -23.605758666992188, "global_step": 167667, "epoch": 2020} {"train_loss": -23.47867202758789, "global_step": 167668, "epoch": 2020} {"train_loss": -23.449106216430664, "global_step": 167669, "epoch": 2020} {"train_loss": -23.185945510864258, "global_step": 167670, "epoch": 2020} {"train_loss": -23.144094467163086, "global_step": 167671, "epoch": 2020} {"train_loss": -23.510879516601562, "global_step": 167672, "epoch": 2020} {"train_loss": -23.554224014282227, "global_step": 167673, "epoch": 2020} {"train_loss": -23.801250457763672, "global_step": 167674, "epoch": 2020} {"train_loss": -23.404470443725586, "global_step": 167675, "epoch": 2020} {"train_loss": -23.656835556030273, "global_step": 167676, "epoch": 2020} {"train_loss": -23.653839111328125, "global_step": 167677, "epoch": 2020} {"train_loss": -23.952741622924805, "global_step": 167678, "epoch": 2020} {"train_loss": -23.775766372680664, "global_step": 167679, "epoch": 2020} {"train_loss": -24.012786865234375, "global_step": 167680, "epoch": 2020} {"train_loss": -23.91876220703125, "global_step": 167681, "epoch": 2020} {"train_loss": -23.391376495361328, "global_step": 167682, "epoch": 2020} {"train_loss": -23.944875717163086, "global_step": 167683, "epoch": 2020} {"train_loss": -23.452735900878906, "global_step": 167684, "epoch": 2020} {"train_loss": -23.827587127685547, "global_step": 167685, "epoch": 2020} {"train_loss": -23.711862564086914, "global_step": 167686, "epoch": 2020} {"train_loss": -23.751516342163086, "global_step": 167687, "epoch": 2020} {"train_loss": -23.60991859436035, "global_step": 167688, "epoch": 2020} {"train_loss": -23.917530059814453, "global_step": 167689, "epoch": 2020} {"train_loss": -23.905832290649414, "global_step": 167690, "epoch": 2020} {"train_loss": -23.46558952331543, "global_step": 167691, "epoch": 2020} {"train_loss": -23.837318420410156, "global_step": 167692, "epoch": 2020} {"train_loss": -23.684415817260742, "global_step": 167693, "epoch": 2020} {"train_loss": -23.543405532836914, "global_step": 167694, "epoch": 2020} {"train_loss": -23.973833084106445, "global_step": 167695, "epoch": 2020} {"train_loss": -23.67259407043457, "global_step": 167696, "epoch": 2020} {"train_loss": -23.528335571289062, "global_step": 167697, "epoch": 2020} {"train_loss": -23.393461227416992, "global_step": 167698, "epoch": 2020} {"train_loss": -23.66023826599121, "global_step": 167699, "epoch": 2020} {"train_loss": -23.534870147705078, "global_step": 167700, "epoch": 2020} {"train_loss": -23.847482681274414, "global_step": 167701, "epoch": 2020} {"train_loss": -23.307804107666016, "global_step": 167702, "epoch": 2020} {"train_loss": -23.72917938232422, "global_step": 167703, "epoch": 2020} {"train_loss": -23.069517135620117, "global_step": 167704, "epoch": 2020} {"train_loss": -23.945526123046875, "global_step": 167705, "epoch": 2020} {"train_loss": -23.653362274169922, "global_step": 167706, "epoch": 2020} {"train_loss": -23.542890548706055, "global_step": 167707, "epoch": 2020} {"train_loss": -23.40094566345215, "global_step": 167708, "epoch": 2020} {"train_loss": -23.17442512512207, "global_step": 167709, "epoch": 2020} {"train_loss": -23.39436149597168, "global_step": 167710, "epoch": 2020} {"train_loss": -23.371057510375977, "global_step": 167711, "epoch": 2020} {"train_loss": -23.475765228271484, "global_step": 167712, "epoch": 2020} {"train_loss": -23.056676864624023, "global_step": 167713, "epoch": 2020} {"train_loss": -23.409664154052734, "global_step": 167714, "epoch": 2020} {"train_loss": -23.337560653686523, "global_step": 167715, "epoch": 2020} {"train_loss": -23.17738914489746, "global_step": 167716, "epoch": 2020} {"train_loss": -23.52359390258789, "global_step": 167717, "epoch": 2020} {"train_loss": -23.386096954345703, "global_step": 167718, "epoch": 2020} {"train_loss": -23.372451782226562, "global_step": 167719, "epoch": 2020} {"train_loss": -22.941608428955078, "global_step": 167720, "epoch": 2020} {"train_loss": -23.36637306213379, "global_step": 167721, "epoch": 2020} {"train_loss": -23.78291130065918, "global_step": 167722, "epoch": 2020} {"train_loss": -23.338056564331055, "global_step": 167723, "epoch": 2020} {"train_loss": -23.840965270996094, "global_step": 167724, "epoch": 2020} {"train_loss": -23.391040802001953, "global_step": 167725, "epoch": 2020} {"train_loss": -23.528127670288086, "global_step": 167726, "epoch": 2020} {"train_loss": -23.385906219482422, "global_step": 167727, "epoch": 2020} {"train_loss": -23.225004196166992, "global_step": 167728, "epoch": 2020} {"train_loss": -23.401357650756836, "global_step": 167729, "epoch": 2020} {"train_loss": -23.36200714111328, "global_step": 167730, "epoch": 2020} {"train_loss": -23.78333282470703, "global_step": 167731, "epoch": 2020} {"train_loss": -23.353166580200195, "global_step": 167732, "epoch": 2020} {"train_loss": -23.496706008911133, "global_step": 167733, "epoch": 2020} {"train_loss": -23.529342651367188, "global_step": 167734, "epoch": 2020} {"train_loss": -23.775285720825195, "global_step": 167735, "epoch": 2020} {"train_loss": -23.768783569335938, "global_step": 167736, "epoch": 2020} {"train_loss": -23.65379524230957, "global_step": 167737, "epoch": 2020} {"train_loss": -23.81654930114746, "global_step": 167738, "epoch": 2020} {"train_loss": -23.70534324645996, "global_step": 167739, "epoch": 2020} {"train_loss": -24.26383399963379, "global_step": 167740, "epoch": 2020} {"train_loss": -24.084293365478516, "global_step": 167741, "epoch": 2020} {"train_loss": -23.559496408485504, "global_step": 167742, "epoch": 2020, "val_loss": 6365289.0} {"train_loss": -23.2203369140625, "global_step": 167743, "epoch": 2021} {"train_loss": -22.538833618164062, "global_step": 167744, "epoch": 2021} {"train_loss": -23.521652221679688, "global_step": 167745, "epoch": 2021} {"train_loss": -23.018423080444336, "global_step": 167746, "epoch": 2021} {"train_loss": -23.041921615600586, "global_step": 167747, "epoch": 2021} {"train_loss": -23.391996383666992, "global_step": 167748, "epoch": 2021} {"train_loss": -23.26934814453125, "global_step": 167749, "epoch": 2021} {"train_loss": -23.06094741821289, "global_step": 167750, "epoch": 2021} {"train_loss": -23.755125045776367, "global_step": 167751, "epoch": 2021} {"train_loss": -23.251934051513672, "global_step": 167752, "epoch": 2021} {"train_loss": -23.676498413085938, "global_step": 167753, "epoch": 2021} {"train_loss": -23.400564193725586, "global_step": 167754, "epoch": 2021} {"train_loss": -23.746816635131836, "global_step": 167755, "epoch": 2021} {"train_loss": -23.426467895507812, "global_step": 167756, "epoch": 2021} {"train_loss": -23.563968658447266, "global_step": 167757, "epoch": 2021} {"train_loss": -23.299072265625, "global_step": 167758, "epoch": 2021} {"train_loss": -23.455175399780273, "global_step": 167759, "epoch": 2021} {"train_loss": -23.4440975189209, "global_step": 167760, "epoch": 2021} {"train_loss": -23.631853103637695, "global_step": 167761, "epoch": 2021} {"train_loss": -23.778907775878906, "global_step": 167762, "epoch": 2021} {"train_loss": -23.512653350830078, "global_step": 167763, "epoch": 2021} {"train_loss": -23.527179718017578, "global_step": 167764, "epoch": 2021} {"train_loss": -23.93517303466797, "global_step": 167765, "epoch": 2021} {"train_loss": -23.67548179626465, "global_step": 167766, "epoch": 2021} {"train_loss": -23.683277130126953, "global_step": 167767, "epoch": 2021} {"train_loss": -23.68716049194336, "global_step": 167768, "epoch": 2021} {"train_loss": -23.811979293823242, "global_step": 167769, "epoch": 2021} {"train_loss": -23.712379455566406, "global_step": 167770, "epoch": 2021} {"train_loss": -23.600976943969727, "global_step": 167771, "epoch": 2021} {"train_loss": -23.733312606811523, "global_step": 167772, "epoch": 2021} {"train_loss": -23.804960250854492, "global_step": 167773, "epoch": 2021} {"train_loss": -23.387557983398438, "global_step": 167774, "epoch": 2021} {"train_loss": -23.227157592773438, "global_step": 167775, "epoch": 2021} {"train_loss": -23.456817626953125, "global_step": 167776, "epoch": 2021} {"train_loss": -23.906198501586914, "global_step": 167777, "epoch": 2021} {"train_loss": -23.77803611755371, "global_step": 167778, "epoch": 2021} {"train_loss": -23.690954208374023, "global_step": 167779, "epoch": 2021} {"train_loss": -23.661222457885742, "global_step": 167780, "epoch": 2021} {"train_loss": -23.740018844604492, "global_step": 167781, "epoch": 2021} {"train_loss": -23.925180435180664, "global_step": 167782, "epoch": 2021} {"train_loss": -23.614439010620117, "global_step": 167783, "epoch": 2021} {"train_loss": -24.096704483032227, "global_step": 167784, "epoch": 2021} {"train_loss": -23.70775032043457, "global_step": 167785, "epoch": 2021} {"train_loss": -24.027820587158203, "global_step": 167786, "epoch": 2021} {"train_loss": -23.58424949645996, "global_step": 167787, "epoch": 2021} {"train_loss": -24.237735748291016, "global_step": 167788, "epoch": 2021} {"train_loss": -23.75721549987793, "global_step": 167789, "epoch": 2021} {"train_loss": -24.076709747314453, "global_step": 167790, "epoch": 2021} {"train_loss": -24.06403923034668, "global_step": 167791, "epoch": 2021} {"train_loss": -23.85105323791504, "global_step": 167792, "epoch": 2021} {"train_loss": -23.321094512939453, "global_step": 167793, "epoch": 2021} {"train_loss": -23.47810935974121, "global_step": 167794, "epoch": 2021} {"train_loss": -23.674758911132812, "global_step": 167795, "epoch": 2021} {"train_loss": -23.728633880615234, "global_step": 167796, "epoch": 2021} {"train_loss": -23.561702728271484, "global_step": 167797, "epoch": 2021} {"train_loss": -23.371681213378906, "global_step": 167798, "epoch": 2021} {"train_loss": -23.73422622680664, "global_step": 167799, "epoch": 2021} {"train_loss": -24.087963104248047, "global_step": 167800, "epoch": 2021} {"train_loss": -23.43296241760254, "global_step": 167801, "epoch": 2021} {"train_loss": -23.358718872070312, "global_step": 167802, "epoch": 2021} {"train_loss": -23.688871383666992, "global_step": 167803, "epoch": 2021} {"train_loss": -23.326162338256836, "global_step": 167804, "epoch": 2021} {"train_loss": -23.925695419311523, "global_step": 167805, "epoch": 2021} {"train_loss": -23.521848678588867, "global_step": 167806, "epoch": 2021} {"train_loss": -23.82986068725586, "global_step": 167807, "epoch": 2021} {"train_loss": -23.53339385986328, "global_step": 167808, "epoch": 2021} {"train_loss": -23.33388328552246, "global_step": 167809, "epoch": 2021} {"train_loss": -23.657085418701172, "global_step": 167810, "epoch": 2021} {"train_loss": -23.744110107421875, "global_step": 167811, "epoch": 2021} {"train_loss": -23.654727935791016, "global_step": 167812, "epoch": 2021} {"train_loss": -23.377416610717773, "global_step": 167813, "epoch": 2021} {"train_loss": -23.643165588378906, "global_step": 167814, "epoch": 2021} {"train_loss": -23.689510345458984, "global_step": 167815, "epoch": 2021} {"train_loss": -24.04054832458496, "global_step": 167816, "epoch": 2021} {"train_loss": -22.94074058532715, "global_step": 167817, "epoch": 2021} {"train_loss": -23.751230239868164, "global_step": 167818, "epoch": 2021} {"train_loss": -23.48134422302246, "global_step": 167819, "epoch": 2021} {"train_loss": -23.522062301635742, "global_step": 167820, "epoch": 2021} {"train_loss": -23.353979110717773, "global_step": 167821, "epoch": 2021} {"train_loss": -23.23967742919922, "global_step": 167822, "epoch": 2021} {"train_loss": -23.435623168945312, "global_step": 167823, "epoch": 2021} {"train_loss": -23.467533111572266, "global_step": 167824, "epoch": 2021} {"train_loss": -23.571637096175227, "global_step": 167825, "epoch": 2021, "val_loss": 6419268.0} {"train_loss": -22.768762588500977, "global_step": 167826, "epoch": 2022} {"train_loss": -23.02939796447754, "global_step": 167827, "epoch": 2022} {"train_loss": -23.10342788696289, "global_step": 167828, "epoch": 2022} {"train_loss": -23.48515510559082, "global_step": 167829, "epoch": 2022} {"train_loss": -23.246362686157227, "global_step": 167830, "epoch": 2022} {"train_loss": -23.513933181762695, "global_step": 167831, "epoch": 2022} {"train_loss": -23.5651798248291, "global_step": 167832, "epoch": 2022} {"train_loss": -23.2231388092041, "global_step": 167833, "epoch": 2022} {"train_loss": -23.302593231201172, "global_step": 167834, "epoch": 2022} {"train_loss": -22.904991149902344, "global_step": 167835, "epoch": 2022} {"train_loss": -23.448171615600586, "global_step": 167836, "epoch": 2022} {"train_loss": -23.41060447692871, "global_step": 167837, "epoch": 2022} {"train_loss": -23.747730255126953, "global_step": 167838, "epoch": 2022} {"train_loss": -23.652530670166016, "global_step": 167839, "epoch": 2022} {"train_loss": -23.40732765197754, "global_step": 167840, "epoch": 2022} {"train_loss": -23.322223663330078, "global_step": 167841, "epoch": 2022} {"train_loss": -23.288793563842773, "global_step": 167842, "epoch": 2022} {"train_loss": -23.668176651000977, "global_step": 167843, "epoch": 2022} {"train_loss": -23.72123146057129, "global_step": 167844, "epoch": 2022} {"train_loss": -23.235492706298828, "global_step": 167845, "epoch": 2022} {"train_loss": -23.429155349731445, "global_step": 167846, "epoch": 2022} {"train_loss": -23.22450828552246, "global_step": 167847, "epoch": 2022} {"train_loss": -23.788822174072266, "global_step": 167848, "epoch": 2022} {"train_loss": -23.434480667114258, "global_step": 167849, "epoch": 2022} {"train_loss": -23.982542037963867, "global_step": 167850, "epoch": 2022} {"train_loss": -23.912433624267578, "global_step": 167851, "epoch": 2022} {"train_loss": -23.536163330078125, "global_step": 167852, "epoch": 2022} {"train_loss": -23.517986297607422, "global_step": 167853, "epoch": 2022} {"train_loss": -23.773021697998047, "global_step": 167854, "epoch": 2022} {"train_loss": -23.669574737548828, "global_step": 167855, "epoch": 2022} {"train_loss": -23.853532791137695, "global_step": 167856, "epoch": 2022} {"train_loss": -23.87567138671875, "global_step": 167857, "epoch": 2022} {"train_loss": -24.048246383666992, "global_step": 167858, "epoch": 2022} {"train_loss": -23.969608306884766, "global_step": 167859, "epoch": 2022} {"train_loss": -23.471105575561523, "global_step": 167860, "epoch": 2022} {"train_loss": -23.94040298461914, "global_step": 167861, "epoch": 2022} {"train_loss": -23.429540634155273, "global_step": 167862, "epoch": 2022} {"train_loss": -23.766096115112305, "global_step": 167863, "epoch": 2022} {"train_loss": -23.860689163208008, "global_step": 167864, "epoch": 2022} {"train_loss": -23.48017692565918, "global_step": 167865, "epoch": 2022} {"train_loss": -23.94692611694336, "global_step": 167866, "epoch": 2022} {"train_loss": -23.590152740478516, "global_step": 167867, "epoch": 2022} {"train_loss": -23.448030471801758, "global_step": 167868, "epoch": 2022} {"train_loss": -23.887962341308594, "global_step": 167869, "epoch": 2022} {"train_loss": -23.913806915283203, "global_step": 167870, "epoch": 2022} {"train_loss": -23.446897506713867, "global_step": 167871, "epoch": 2022} {"train_loss": -23.742353439331055, "global_step": 167872, "epoch": 2022} {"train_loss": -23.776798248291016, "global_step": 167873, "epoch": 2022} {"train_loss": -23.94080924987793, "global_step": 167874, "epoch": 2022} {"train_loss": -23.858234405517578, "global_step": 167875, "epoch": 2022} {"train_loss": -23.55122947692871, "global_step": 167876, "epoch": 2022} {"train_loss": -23.331745147705078, "global_step": 167877, "epoch": 2022} {"train_loss": -23.994531631469727, "global_step": 167878, "epoch": 2022} {"train_loss": -23.934389114379883, "global_step": 167879, "epoch": 2022} {"train_loss": -23.273649215698242, "global_step": 167880, "epoch": 2022} {"train_loss": -23.186248779296875, "global_step": 167881, "epoch": 2022} {"train_loss": -23.331151962280273, "global_step": 167882, "epoch": 2022} {"train_loss": -23.568693161010742, "global_step": 167883, "epoch": 2022} {"train_loss": -23.37792205810547, "global_step": 167884, "epoch": 2022} {"train_loss": -23.739948272705078, "global_step": 167885, "epoch": 2022} {"train_loss": -23.505382537841797, "global_step": 167886, "epoch": 2022} {"train_loss": -23.3907413482666, "global_step": 167887, "epoch": 2022} {"train_loss": -23.49885368347168, "global_step": 167888, "epoch": 2022} {"train_loss": -23.519357681274414, "global_step": 167889, "epoch": 2022} {"train_loss": -23.525863647460938, "global_step": 167890, "epoch": 2022} {"train_loss": -24.07284927368164, "global_step": 167891, "epoch": 2022} {"train_loss": -23.597206115722656, "global_step": 167892, "epoch": 2022} {"train_loss": -23.638017654418945, "global_step": 167893, "epoch": 2022} {"train_loss": -23.748159408569336, "global_step": 167894, "epoch": 2022} {"train_loss": -23.664268493652344, "global_step": 167895, "epoch": 2022} {"train_loss": -23.768474578857422, "global_step": 167896, "epoch": 2022} {"train_loss": -24.07358741760254, "global_step": 167897, "epoch": 2022} {"train_loss": -23.32293128967285, "global_step": 167898, "epoch": 2022} {"train_loss": -23.774301528930664, "global_step": 167899, "epoch": 2022} {"train_loss": -23.447463989257812, "global_step": 167900, "epoch": 2022} {"train_loss": -23.96554183959961, "global_step": 167901, "epoch": 2022} {"train_loss": -23.45345115661621, "global_step": 167902, "epoch": 2022} {"train_loss": -23.405765533447266, "global_step": 167903, "epoch": 2022} {"train_loss": -23.682886123657227, "global_step": 167904, "epoch": 2022} {"train_loss": -23.768707275390625, "global_step": 167905, "epoch": 2022} {"train_loss": -23.907102584838867, "global_step": 167906, "epoch": 2022} {"train_loss": -23.515295028686523, "global_step": 167907, "epoch": 2022} {"train_loss": -23.583486671907355, "global_step": 167908, "epoch": 2022, "val_loss": 6423086.0} {"train_loss": -23.049179077148438, "global_step": 167909, "epoch": 2023} {"train_loss": -22.839183807373047, "global_step": 167910, "epoch": 2023} {"train_loss": -23.258779525756836, "global_step": 167911, "epoch": 2023} {"train_loss": -23.306861877441406, "global_step": 167912, "epoch": 2023} {"train_loss": -23.29434585571289, "global_step": 167913, "epoch": 2023} {"train_loss": -23.198400497436523, "global_step": 167914, "epoch": 2023} {"train_loss": -23.229833602905273, "global_step": 167915, "epoch": 2023} {"train_loss": -23.460607528686523, "global_step": 167916, "epoch": 2023} {"train_loss": -23.095670700073242, "global_step": 167917, "epoch": 2023} {"train_loss": -22.978620529174805, "global_step": 167918, "epoch": 2023} {"train_loss": -23.390335083007812, "global_step": 167919, "epoch": 2023} {"train_loss": -23.32496452331543, "global_step": 167920, "epoch": 2023} {"train_loss": -23.100372314453125, "global_step": 167921, "epoch": 2023} {"train_loss": -23.35494613647461, "global_step": 167922, "epoch": 2023} {"train_loss": -22.953590393066406, "global_step": 167923, "epoch": 2023} {"train_loss": -23.52549171447754, "global_step": 167924, "epoch": 2023} {"train_loss": -23.386560440063477, "global_step": 167925, "epoch": 2023} {"train_loss": -23.46962547302246, "global_step": 167926, "epoch": 2023} {"train_loss": -22.916858673095703, "global_step": 167927, "epoch": 2023} {"train_loss": -23.744421005249023, "global_step": 167928, "epoch": 2023} {"train_loss": -23.237417221069336, "global_step": 167929, "epoch": 2023} {"train_loss": -23.20769691467285, "global_step": 167930, "epoch": 2023} {"train_loss": -23.881074905395508, "global_step": 167931, "epoch": 2023} {"train_loss": -23.28326988220215, "global_step": 167932, "epoch": 2023} {"train_loss": -23.6297664642334, "global_step": 167933, "epoch": 2023} {"train_loss": -23.373239517211914, "global_step": 167934, "epoch": 2023} {"train_loss": -23.261484146118164, "global_step": 167935, "epoch": 2023} {"train_loss": -23.8612117767334, "global_step": 167936, "epoch": 2023} {"train_loss": -23.383512496948242, "global_step": 167937, "epoch": 2023} {"train_loss": -23.481861114501953, "global_step": 167938, "epoch": 2023} {"train_loss": -23.814655303955078, "global_step": 167939, "epoch": 2023} {"train_loss": -23.31220054626465, "global_step": 167940, "epoch": 2023} {"train_loss": -23.63629722595215, "global_step": 167941, "epoch": 2023} {"train_loss": -23.389698028564453, "global_step": 167942, "epoch": 2023} {"train_loss": -23.690052032470703, "global_step": 167943, "epoch": 2023} {"train_loss": -23.889305114746094, "global_step": 167944, "epoch": 2023} {"train_loss": -23.35569190979004, "global_step": 167945, "epoch": 2023} {"train_loss": -23.7475528717041, "global_step": 167946, "epoch": 2023} {"train_loss": -24.068368911743164, "global_step": 167947, "epoch": 2023} {"train_loss": -23.96291160583496, "global_step": 167948, "epoch": 2023} {"train_loss": -23.63027572631836, "global_step": 167949, "epoch": 2023} {"train_loss": -23.847122192382812, "global_step": 167950, "epoch": 2023} {"train_loss": -23.57923698425293, "global_step": 167951, "epoch": 2023} {"train_loss": -23.810810089111328, "global_step": 167952, "epoch": 2023} {"train_loss": -23.758859634399414, "global_step": 167953, "epoch": 2023} {"train_loss": -23.599666595458984, "global_step": 167954, "epoch": 2023} {"train_loss": -23.769521713256836, "global_step": 167955, "epoch": 2023} {"train_loss": -23.71992301940918, "global_step": 167956, "epoch": 2023} {"train_loss": -23.599855422973633, "global_step": 167957, "epoch": 2023} {"train_loss": -23.92225456237793, "global_step": 167958, "epoch": 2023} {"train_loss": -23.646337509155273, "global_step": 167959, "epoch": 2023} {"train_loss": -23.859294891357422, "global_step": 167960, "epoch": 2023} {"train_loss": -23.575576782226562, "global_step": 167961, "epoch": 2023} {"train_loss": -23.616605758666992, "global_step": 167962, "epoch": 2023} {"train_loss": -23.76374626159668, "global_step": 167963, "epoch": 2023} {"train_loss": -23.900753021240234, "global_step": 167964, "epoch": 2023} {"train_loss": -23.851016998291016, "global_step": 167965, "epoch": 2023} {"train_loss": -23.971765518188477, "global_step": 167966, "epoch": 2023} {"train_loss": -23.584299087524414, "global_step": 167967, "epoch": 2023} {"train_loss": -23.673852920532227, "global_step": 167968, "epoch": 2023} {"train_loss": -23.791454315185547, "global_step": 167969, "epoch": 2023} {"train_loss": -23.73833465576172, "global_step": 167970, "epoch": 2023} {"train_loss": -23.524463653564453, "global_step": 167971, "epoch": 2023} {"train_loss": -23.831361770629883, "global_step": 167972, "epoch": 2023} {"train_loss": -23.68600845336914, "global_step": 167973, "epoch": 2023} {"train_loss": -24.218433380126953, "global_step": 167974, "epoch": 2023} {"train_loss": -23.375913619995117, "global_step": 167975, "epoch": 2023} {"train_loss": -23.49741554260254, "global_step": 167976, "epoch": 2023} {"train_loss": -24.175098419189453, "global_step": 167977, "epoch": 2023} {"train_loss": -23.828821182250977, "global_step": 167978, "epoch": 2023} {"train_loss": -23.492788314819336, "global_step": 167979, "epoch": 2023} {"train_loss": -23.66603660583496, "global_step": 167980, "epoch": 2023} {"train_loss": -23.66316795349121, "global_step": 167981, "epoch": 2023} {"train_loss": -23.35637664794922, "global_step": 167982, "epoch": 2023} {"train_loss": -23.823795318603516, "global_step": 167983, "epoch": 2023} {"train_loss": -23.509984970092773, "global_step": 167984, "epoch": 2023} {"train_loss": -23.6162052154541, "global_step": 167985, "epoch": 2023} {"train_loss": -24.165311813354492, "global_step": 167986, "epoch": 2023} {"train_loss": -23.575664520263672, "global_step": 167987, "epoch": 2023} {"train_loss": -23.733858108520508, "global_step": 167988, "epoch": 2023} {"train_loss": -23.81983757019043, "global_step": 167989, "epoch": 2023} {"train_loss": -23.876842498779297, "global_step": 167990, "epoch": 2023} {"train_loss": -23.57818569045469, "global_step": 167991, "epoch": 2023, "val_loss": 6459089.0} {"train_loss": -22.880857467651367, "global_step": 167992, "epoch": 2024} {"train_loss": -22.955265045166016, "global_step": 167993, "epoch": 2024} {"train_loss": -22.03394889831543, "global_step": 167994, "epoch": 2024} {"train_loss": -23.61551284790039, "global_step": 167995, "epoch": 2024} {"train_loss": -22.562402725219727, "global_step": 167996, "epoch": 2024} {"train_loss": -22.677961349487305, "global_step": 167997, "epoch": 2024} {"train_loss": -23.250598907470703, "global_step": 167998, "epoch": 2024} {"train_loss": -22.5494327545166, "global_step": 167999, "epoch": 2024} {"train_loss": -23.140625, "global_step": 168000, "epoch": 2024} {"train_loss": -23.112573623657227, "global_step": 168001, "epoch": 2024} {"train_loss": -23.038766860961914, "global_step": 168002, "epoch": 2024} {"train_loss": -23.24582290649414, "global_step": 168003, "epoch": 2024} {"train_loss": -23.272438049316406, "global_step": 168004, "epoch": 2024} {"train_loss": -23.137300491333008, "global_step": 168005, "epoch": 2024} {"train_loss": -23.04450798034668, "global_step": 168006, "epoch": 2024} {"train_loss": -23.221111297607422, "global_step": 168007, "epoch": 2024} {"train_loss": -23.33966636657715, "global_step": 168008, "epoch": 2024} {"train_loss": -23.161718368530273, "global_step": 168009, "epoch": 2024} {"train_loss": -23.14499282836914, "global_step": 168010, "epoch": 2024} {"train_loss": -22.910892486572266, "global_step": 168011, "epoch": 2024} {"train_loss": -23.374835968017578, "global_step": 168012, "epoch": 2024} {"train_loss": -23.047880172729492, "global_step": 168013, "epoch": 2024} {"train_loss": -23.20130157470703, "global_step": 168014, "epoch": 2024} {"train_loss": -23.194154739379883, "global_step": 168015, "epoch": 2024} {"train_loss": -23.29996681213379, "global_step": 168016, "epoch": 2024} {"train_loss": -23.481138229370117, "global_step": 168017, "epoch": 2024} {"train_loss": -23.41539764404297, "global_step": 168018, "epoch": 2024} {"train_loss": -23.229406356811523, "global_step": 168019, "epoch": 2024} {"train_loss": -23.66792869567871, "global_step": 168020, "epoch": 2024} {"train_loss": -23.558828353881836, "global_step": 168021, "epoch": 2024} {"train_loss": -23.327110290527344, "global_step": 168022, "epoch": 2024} {"train_loss": -23.819990158081055, "global_step": 168023, "epoch": 2024} {"train_loss": -23.15549659729004, "global_step": 168024, "epoch": 2024} {"train_loss": -23.40819549560547, "global_step": 168025, "epoch": 2024} {"train_loss": -23.68697738647461, "global_step": 168026, "epoch": 2024} {"train_loss": -23.733966827392578, "global_step": 168027, "epoch": 2024} {"train_loss": -23.505285263061523, "global_step": 168028, "epoch": 2024} {"train_loss": -23.68246078491211, "global_step": 168029, "epoch": 2024} {"train_loss": -23.758268356323242, "global_step": 168030, "epoch": 2024} {"train_loss": -23.73004150390625, "global_step": 168031, "epoch": 2024} {"train_loss": -23.874032974243164, "global_step": 168032, "epoch": 2024} {"train_loss": -24.077789306640625, "global_step": 168033, "epoch": 2024} {"train_loss": -23.831640243530273, "global_step": 168034, "epoch": 2024} {"train_loss": -23.525436401367188, "global_step": 168035, "epoch": 2024} {"train_loss": -23.99503517150879, "global_step": 168036, "epoch": 2024} {"train_loss": -23.587013244628906, "global_step": 168037, "epoch": 2024} {"train_loss": -24.0184326171875, "global_step": 168038, "epoch": 2024} {"train_loss": -23.639368057250977, "global_step": 168039, "epoch": 2024} {"train_loss": -23.597204208374023, "global_step": 168040, "epoch": 2024} {"train_loss": -23.4813175201416, "global_step": 168041, "epoch": 2024} {"train_loss": -23.960783004760742, "global_step": 168042, "epoch": 2024} {"train_loss": -23.572725296020508, "global_step": 168043, "epoch": 2024} {"train_loss": -23.908309936523438, "global_step": 168044, "epoch": 2024} {"train_loss": -23.347248077392578, "global_step": 168045, "epoch": 2024} {"train_loss": -23.91261863708496, "global_step": 168046, "epoch": 2024} {"train_loss": -23.51908302307129, "global_step": 168047, "epoch": 2024} {"train_loss": -23.935888290405273, "global_step": 168048, "epoch": 2024} {"train_loss": -23.595754623413086, "global_step": 168049, "epoch": 2024} {"train_loss": -23.422910690307617, "global_step": 168050, "epoch": 2024} {"train_loss": -23.3931827545166, "global_step": 168051, "epoch": 2024} {"train_loss": -23.754417419433594, "global_step": 168052, "epoch": 2024} {"train_loss": -23.77496910095215, "global_step": 168053, "epoch": 2024} {"train_loss": -23.94005584716797, "global_step": 168054, "epoch": 2024} {"train_loss": -23.6613826751709, "global_step": 168055, "epoch": 2024} {"train_loss": -23.742963790893555, "global_step": 168056, "epoch": 2024} {"train_loss": -23.510812759399414, "global_step": 168057, "epoch": 2024} {"train_loss": -23.82530975341797, "global_step": 168058, "epoch": 2024} {"train_loss": -23.66335105895996, "global_step": 168059, "epoch": 2024} {"train_loss": -23.585285186767578, "global_step": 168060, "epoch": 2024} {"train_loss": -23.27178382873535, "global_step": 168061, "epoch": 2024} {"train_loss": -24.0656681060791, "global_step": 168062, "epoch": 2024} {"train_loss": -23.369352340698242, "global_step": 168063, "epoch": 2024} {"train_loss": -23.03276824951172, "global_step": 168064, "epoch": 2024} {"train_loss": -23.733217239379883, "global_step": 168065, "epoch": 2024} {"train_loss": -23.53082275390625, "global_step": 168066, "epoch": 2024} {"train_loss": -23.61842155456543, "global_step": 168067, "epoch": 2024} {"train_loss": -23.457660675048828, "global_step": 168068, "epoch": 2024} {"train_loss": -23.99942970275879, "global_step": 168069, "epoch": 2024} {"train_loss": -23.525548934936523, "global_step": 168070, "epoch": 2024} {"train_loss": -23.622255325317383, "global_step": 168071, "epoch": 2024} {"train_loss": -23.607694625854492, "global_step": 168072, "epoch": 2024} {"train_loss": -23.68055534362793, "global_step": 168073, "epoch": 2024} {"train_loss": -23.453513984220574, "global_step": 168074, "epoch": 2024, "val_loss": 6639649.0} {"train_loss": -21.703771591186523, "global_step": 168075, "epoch": 2025} {"train_loss": -22.797163009643555, "global_step": 168076, "epoch": 2025} {"train_loss": -22.67640495300293, "global_step": 168077, "epoch": 2025} {"train_loss": -22.88197898864746, "global_step": 168078, "epoch": 2025} {"train_loss": -23.191884994506836, "global_step": 168079, "epoch": 2025} {"train_loss": -22.585092544555664, "global_step": 168080, "epoch": 2025} {"train_loss": -23.16119956970215, "global_step": 168081, "epoch": 2025} {"train_loss": -23.090831756591797, "global_step": 168082, "epoch": 2025} {"train_loss": -22.9249324798584, "global_step": 168083, "epoch": 2025} {"train_loss": -22.735939025878906, "global_step": 168084, "epoch": 2025} {"train_loss": -23.094528198242188, "global_step": 168085, "epoch": 2025} {"train_loss": -23.5775089263916, "global_step": 168086, "epoch": 2025} {"train_loss": -22.922109603881836, "global_step": 168087, "epoch": 2025} {"train_loss": -23.349857330322266, "global_step": 168088, "epoch": 2025} {"train_loss": -23.484922409057617, "global_step": 168089, "epoch": 2025} {"train_loss": -22.854015350341797, "global_step": 168090, "epoch": 2025} {"train_loss": -23.005300521850586, "global_step": 168091, "epoch": 2025} {"train_loss": -23.506057739257812, "global_step": 168092, "epoch": 2025} {"train_loss": -23.304615020751953, "global_step": 168093, "epoch": 2025} {"train_loss": -23.65192985534668, "global_step": 168094, "epoch": 2025} {"train_loss": -23.334928512573242, "global_step": 168095, "epoch": 2025} {"train_loss": -23.79652976989746, "global_step": 168096, "epoch": 2025} {"train_loss": -23.23723793029785, "global_step": 168097, "epoch": 2025} {"train_loss": -23.683441162109375, "global_step": 168098, "epoch": 2025} {"train_loss": -23.496658325195312, "global_step": 168099, "epoch": 2025} {"train_loss": -23.663312911987305, "global_step": 168100, "epoch": 2025} {"train_loss": -23.49923324584961, "global_step": 168101, "epoch": 2025} {"train_loss": -23.339658737182617, "global_step": 168102, "epoch": 2025} {"train_loss": -23.373382568359375, "global_step": 168103, "epoch": 2025} {"train_loss": -23.076744079589844, "global_step": 168104, "epoch": 2025} {"train_loss": -23.459516525268555, "global_step": 168105, "epoch": 2025} {"train_loss": -23.574628829956055, "global_step": 168106, "epoch": 2025} {"train_loss": -23.55898094177246, "global_step": 168107, "epoch": 2025} {"train_loss": -23.888137817382812, "global_step": 168108, "epoch": 2025} {"train_loss": -23.408950805664062, "global_step": 168109, "epoch": 2025} {"train_loss": -23.73436164855957, "global_step": 168110, "epoch": 2025} {"train_loss": -23.416946411132812, "global_step": 168111, "epoch": 2025} {"train_loss": -23.743986129760742, "global_step": 168112, "epoch": 2025} {"train_loss": -23.790502548217773, "global_step": 168113, "epoch": 2025} {"train_loss": -23.468740463256836, "global_step": 168114, "epoch": 2025} {"train_loss": -23.812414169311523, "global_step": 168115, "epoch": 2025} {"train_loss": -23.831073760986328, "global_step": 168116, "epoch": 2025} {"train_loss": -23.60520362854004, "global_step": 168117, "epoch": 2025} {"train_loss": -23.84612464904785, "global_step": 168118, "epoch": 2025} {"train_loss": -23.801265716552734, "global_step": 168119, "epoch": 2025} {"train_loss": -23.938997268676758, "global_step": 168120, "epoch": 2025} {"train_loss": -24.01333236694336, "global_step": 168121, "epoch": 2025} {"train_loss": -23.742399215698242, "global_step": 168122, "epoch": 2025} {"train_loss": -23.633821487426758, "global_step": 168123, "epoch": 2025} {"train_loss": -23.851743698120117, "global_step": 168124, "epoch": 2025} {"train_loss": -23.910741806030273, "global_step": 168125, "epoch": 2025} {"train_loss": -23.657262802124023, "global_step": 168126, "epoch": 2025} {"train_loss": -23.81781768798828, "global_step": 168127, "epoch": 2025} {"train_loss": -23.344263076782227, "global_step": 168128, "epoch": 2025} {"train_loss": -23.969778060913086, "global_step": 168129, "epoch": 2025} {"train_loss": -23.725162506103516, "global_step": 168130, "epoch": 2025} {"train_loss": -23.940519332885742, "global_step": 168131, "epoch": 2025} {"train_loss": -23.366689682006836, "global_step": 168132, "epoch": 2025} {"train_loss": -23.695655822753906, "global_step": 168133, "epoch": 2025} {"train_loss": -23.614269256591797, "global_step": 168134, "epoch": 2025} {"train_loss": -23.720947265625, "global_step": 168135, "epoch": 2025} {"train_loss": -23.58934211730957, "global_step": 168136, "epoch": 2025} {"train_loss": -24.054494857788086, "global_step": 168137, "epoch": 2025} {"train_loss": -23.60197639465332, "global_step": 168138, "epoch": 2025} {"train_loss": -23.725406646728516, "global_step": 168139, "epoch": 2025} {"train_loss": -24.04849624633789, "global_step": 168140, "epoch": 2025} {"train_loss": -23.63780975341797, "global_step": 168141, "epoch": 2025} {"train_loss": -23.45554542541504, "global_step": 168142, "epoch": 2025} {"train_loss": -23.311216354370117, "global_step": 168143, "epoch": 2025} {"train_loss": -23.654651641845703, "global_step": 168144, "epoch": 2025} {"train_loss": -23.933338165283203, "global_step": 168145, "epoch": 2025} {"train_loss": -23.67311668395996, "global_step": 168146, "epoch": 2025} {"train_loss": -23.58744239807129, "global_step": 168147, "epoch": 2025} {"train_loss": -23.671171188354492, "global_step": 168148, "epoch": 2025} {"train_loss": -23.706907272338867, "global_step": 168149, "epoch": 2025} {"train_loss": -23.77640151977539, "global_step": 168150, "epoch": 2025} {"train_loss": -23.821516036987305, "global_step": 168151, "epoch": 2025} {"train_loss": -23.884384155273438, "global_step": 168152, "epoch": 2025} {"train_loss": -23.938554763793945, "global_step": 168153, "epoch": 2025} {"train_loss": -23.759504318237305, "global_step": 168154, "epoch": 2025} {"train_loss": -23.54599952697754, "global_step": 168155, "epoch": 2025} {"train_loss": -23.6553955078125, "global_step": 168156, "epoch": 2025} {"train_loss": -23.5188217622688, "global_step": 168157, "epoch": 2025, "val_loss": 6334283.0} {"train_loss": -23.09285545349121, "global_step": 168158, "epoch": 2026} {"train_loss": -23.4305477142334, "global_step": 168159, "epoch": 2026} {"train_loss": -23.28312110900879, "global_step": 168160, "epoch": 2026} {"train_loss": -23.28106117248535, "global_step": 168161, "epoch": 2026} {"train_loss": -23.251510620117188, "global_step": 168162, "epoch": 2026} {"train_loss": -23.131818771362305, "global_step": 168163, "epoch": 2026} {"train_loss": -23.81611442565918, "global_step": 168164, "epoch": 2026} {"train_loss": -23.18494987487793, "global_step": 168165, "epoch": 2026} {"train_loss": -23.339500427246094, "global_step": 168166, "epoch": 2026} {"train_loss": -22.993520736694336, "global_step": 168167, "epoch": 2026} {"train_loss": -23.39266014099121, "global_step": 168168, "epoch": 2026} {"train_loss": -23.013839721679688, "global_step": 168169, "epoch": 2026} {"train_loss": -23.216121673583984, "global_step": 168170, "epoch": 2026} {"train_loss": -23.423757553100586, "global_step": 168171, "epoch": 2026} {"train_loss": -23.40470314025879, "global_step": 168172, "epoch": 2026} {"train_loss": -23.167068481445312, "global_step": 168173, "epoch": 2026} {"train_loss": -23.368112564086914, "global_step": 168174, "epoch": 2026} {"train_loss": -23.612916946411133, "global_step": 168175, "epoch": 2026} {"train_loss": -23.611642837524414, "global_step": 168176, "epoch": 2026} {"train_loss": -23.17513084411621, "global_step": 168177, "epoch": 2026} {"train_loss": -23.634765625, "global_step": 168178, "epoch": 2026} {"train_loss": -23.166288375854492, "global_step": 168179, "epoch": 2026} {"train_loss": -23.801319122314453, "global_step": 168180, "epoch": 2026} {"train_loss": -23.383386611938477, "global_step": 168181, "epoch": 2026} {"train_loss": -23.747873306274414, "global_step": 168182, "epoch": 2026} {"train_loss": -23.459060668945312, "global_step": 168183, "epoch": 2026} {"train_loss": -23.76165199279785, "global_step": 168184, "epoch": 2026} {"train_loss": -23.73566246032715, "global_step": 168185, "epoch": 2026} {"train_loss": -23.936628341674805, "global_step": 168186, "epoch": 2026} {"train_loss": -24.080358505249023, "global_step": 168187, "epoch": 2026} {"train_loss": -23.301206588745117, "global_step": 168188, "epoch": 2026} {"train_loss": -23.638517379760742, "global_step": 168189, "epoch": 2026} {"train_loss": -23.983915328979492, "global_step": 168190, "epoch": 2026} {"train_loss": -23.76927375793457, "global_step": 168191, "epoch": 2026} {"train_loss": -23.086414337158203, "global_step": 168192, "epoch": 2026} {"train_loss": -23.443044662475586, "global_step": 168193, "epoch": 2026} {"train_loss": -23.790220260620117, "global_step": 168194, "epoch": 2026} {"train_loss": -23.588424682617188, "global_step": 168195, "epoch": 2026} {"train_loss": -23.690706253051758, "global_step": 168196, "epoch": 2026} {"train_loss": -23.697240829467773, "global_step": 168197, "epoch": 2026} {"train_loss": -23.641983032226562, "global_step": 168198, "epoch": 2026} {"train_loss": -23.374685287475586, "global_step": 168199, "epoch": 2026} {"train_loss": -23.58625030517578, "global_step": 168200, "epoch": 2026} {"train_loss": -23.623830795288086, "global_step": 168201, "epoch": 2026} {"train_loss": -23.406496047973633, "global_step": 168202, "epoch": 2026} {"train_loss": -23.982208251953125, "global_step": 168203, "epoch": 2026} {"train_loss": -23.66996192932129, "global_step": 168204, "epoch": 2026} {"train_loss": -23.82485580444336, "global_step": 168205, "epoch": 2026} {"train_loss": -23.29121971130371, "global_step": 168206, "epoch": 2026} {"train_loss": -23.137807846069336, "global_step": 168207, "epoch": 2026} {"train_loss": -23.43128776550293, "global_step": 168208, "epoch": 2026} {"train_loss": -22.878271102905273, "global_step": 168209, "epoch": 2026} {"train_loss": -23.56732749938965, "global_step": 168210, "epoch": 2026} {"train_loss": -23.715208053588867, "global_step": 168211, "epoch": 2026} {"train_loss": -23.474180221557617, "global_step": 168212, "epoch": 2026} {"train_loss": -23.424970626831055, "global_step": 168213, "epoch": 2026} {"train_loss": -23.208337783813477, "global_step": 168214, "epoch": 2026} {"train_loss": -23.31355857849121, "global_step": 168215, "epoch": 2026} {"train_loss": -23.706348419189453, "global_step": 168216, "epoch": 2026} {"train_loss": -23.698192596435547, "global_step": 168217, "epoch": 2026} {"train_loss": -23.747411727905273, "global_step": 168218, "epoch": 2026} {"train_loss": -23.756919860839844, "global_step": 168219, "epoch": 2026} {"train_loss": -23.84071159362793, "global_step": 168220, "epoch": 2026} {"train_loss": -23.710411071777344, "global_step": 168221, "epoch": 2026} {"train_loss": -23.568824768066406, "global_step": 168222, "epoch": 2026} {"train_loss": -23.726318359375, "global_step": 168223, "epoch": 2026} {"train_loss": -23.76938247680664, "global_step": 168224, "epoch": 2026} {"train_loss": -23.49314308166504, "global_step": 168225, "epoch": 2026} {"train_loss": -23.377960205078125, "global_step": 168226, "epoch": 2026} {"train_loss": -23.65285301208496, "global_step": 168227, "epoch": 2026} {"train_loss": -23.703872680664062, "global_step": 168228, "epoch": 2026} {"train_loss": -23.977005004882812, "global_step": 168229, "epoch": 2026} {"train_loss": -23.498046875, "global_step": 168230, "epoch": 2026} {"train_loss": -23.644248962402344, "global_step": 168231, "epoch": 2026} {"train_loss": -24.02626609802246, "global_step": 168232, "epoch": 2026} {"train_loss": -23.705219268798828, "global_step": 168233, "epoch": 2026} {"train_loss": -23.72710418701172, "global_step": 168234, "epoch": 2026} {"train_loss": -23.80612564086914, "global_step": 168235, "epoch": 2026} {"train_loss": -24.195703506469727, "global_step": 168236, "epoch": 2026} {"train_loss": -23.494535446166992, "global_step": 168237, "epoch": 2026} {"train_loss": -23.667346954345703, "global_step": 168238, "epoch": 2026} {"train_loss": -23.531829833984375, "global_step": 168239, "epoch": 2026} {"train_loss": -23.54050351338214, "global_step": 168240, "epoch": 2026, "val_loss": 6446274.0} {"train_loss": -23.712848663330078, "global_step": 168241, "epoch": 2027} {"train_loss": -23.475976943969727, "global_step": 168242, "epoch": 2027} {"train_loss": -23.867801666259766, "global_step": 168243, "epoch": 2027} {"train_loss": -23.74153709411621, "global_step": 168244, "epoch": 2027} {"train_loss": -23.847593307495117, "global_step": 168245, "epoch": 2027} {"train_loss": -23.77985191345215, "global_step": 168246, "epoch": 2027} {"train_loss": -23.736286163330078, "global_step": 168247, "epoch": 2027} {"train_loss": -23.767398834228516, "global_step": 168248, "epoch": 2027} {"train_loss": -23.758975982666016, "global_step": 168249, "epoch": 2027} {"train_loss": -23.610944747924805, "global_step": 168250, "epoch": 2027} {"train_loss": -23.624176025390625, "global_step": 168251, "epoch": 2027} {"train_loss": -23.49139404296875, "global_step": 168252, "epoch": 2027} {"train_loss": -23.37989616394043, "global_step": 168253, "epoch": 2027} {"train_loss": -23.769550323486328, "global_step": 168254, "epoch": 2027} {"train_loss": -23.693880081176758, "global_step": 168255, "epoch": 2027} {"train_loss": -23.944843292236328, "global_step": 168256, "epoch": 2027} {"train_loss": -23.623537063598633, "global_step": 168257, "epoch": 2027} {"train_loss": -23.558002471923828, "global_step": 168258, "epoch": 2027} {"train_loss": -23.829206466674805, "global_step": 168259, "epoch": 2027} {"train_loss": -23.60143280029297, "global_step": 168260, "epoch": 2027} {"train_loss": -23.77389144897461, "global_step": 168261, "epoch": 2027} {"train_loss": -23.3117618560791, "global_step": 168262, "epoch": 2027} {"train_loss": -24.081754684448242, "global_step": 168263, "epoch": 2027} {"train_loss": -23.616518020629883, "global_step": 168264, "epoch": 2027} {"train_loss": -23.685073852539062, "global_step": 168265, "epoch": 2027} {"train_loss": -23.495723724365234, "global_step": 168266, "epoch": 2027} {"train_loss": -23.420101165771484, "global_step": 168267, "epoch": 2027} {"train_loss": -23.522871017456055, "global_step": 168268, "epoch": 2027} {"train_loss": -23.46776580810547, "global_step": 168269, "epoch": 2027} {"train_loss": -24.137235641479492, "global_step": 168270, "epoch": 2027} {"train_loss": -23.315580368041992, "global_step": 168271, "epoch": 2027} {"train_loss": -23.660459518432617, "global_step": 168272, "epoch": 2027} {"train_loss": -23.633907318115234, "global_step": 168273, "epoch": 2027} {"train_loss": -23.60951042175293, "global_step": 168274, "epoch": 2027} {"train_loss": -23.671527862548828, "global_step": 168275, "epoch": 2027} {"train_loss": -23.698341369628906, "global_step": 168276, "epoch": 2027} {"train_loss": -23.76427459716797, "global_step": 168277, "epoch": 2027} {"train_loss": -23.786657333374023, "global_step": 168278, "epoch": 2027} {"train_loss": -24.092313766479492, "global_step": 168279, "epoch": 2027} {"train_loss": -23.924448013305664, "global_step": 168280, "epoch": 2027} {"train_loss": -23.80315589904785, "global_step": 168281, "epoch": 2027} {"train_loss": -23.568634033203125, "global_step": 168282, "epoch": 2027} {"train_loss": -23.358617782592773, "global_step": 168283, "epoch": 2027} {"train_loss": -23.593393325805664, "global_step": 168284, "epoch": 2027} {"train_loss": -23.746549606323242, "global_step": 168285, "epoch": 2027} {"train_loss": -24.12693977355957, "global_step": 168286, "epoch": 2027} {"train_loss": -23.68849754333496, "global_step": 168287, "epoch": 2027} {"train_loss": -23.99091911315918, "global_step": 168288, "epoch": 2027} {"train_loss": -23.53560447692871, "global_step": 168289, "epoch": 2027} {"train_loss": -23.551939010620117, "global_step": 168290, "epoch": 2027} {"train_loss": -23.925189971923828, "global_step": 168291, "epoch": 2027} {"train_loss": -23.94462776184082, "global_step": 168292, "epoch": 2027} {"train_loss": -23.87997817993164, "global_step": 168293, "epoch": 2027} {"train_loss": -23.84237289428711, "global_step": 168294, "epoch": 2027} {"train_loss": -23.794967651367188, "global_step": 168295, "epoch": 2027} {"train_loss": -23.906335830688477, "global_step": 168296, "epoch": 2027} {"train_loss": -23.51506233215332, "global_step": 168297, "epoch": 2027} {"train_loss": -23.471057891845703, "global_step": 168298, "epoch": 2027} {"train_loss": -23.61658477783203, "global_step": 168299, "epoch": 2027} {"train_loss": -23.91493034362793, "global_step": 168300, "epoch": 2027} {"train_loss": -23.73797607421875, "global_step": 168301, "epoch": 2027} {"train_loss": -23.861839294433594, "global_step": 168302, "epoch": 2027} {"train_loss": -23.979293823242188, "global_step": 168303, "epoch": 2027} {"train_loss": -23.55411720275879, "global_step": 168304, "epoch": 2027} {"train_loss": -23.870223999023438, "global_step": 168305, "epoch": 2027} {"train_loss": -23.662574768066406, "global_step": 168306, "epoch": 2027} {"train_loss": -23.78409767150879, "global_step": 168307, "epoch": 2027} {"train_loss": -23.96392822265625, "global_step": 168308, "epoch": 2027} {"train_loss": -23.5960750579834, "global_step": 168309, "epoch": 2027} {"train_loss": -23.74674415588379, "global_step": 168310, "epoch": 2027} {"train_loss": -23.92108726501465, "global_step": 168311, "epoch": 2027} {"train_loss": -23.465312957763672, "global_step": 168312, "epoch": 2027} {"train_loss": -23.763919830322266, "global_step": 168313, "epoch": 2027} {"train_loss": -23.795011520385742, "global_step": 168314, "epoch": 2027} {"train_loss": -23.740753173828125, "global_step": 168315, "epoch": 2027} {"train_loss": -23.911298751831055, "global_step": 168316, "epoch": 2027} {"train_loss": -24.162282943725586, "global_step": 168317, "epoch": 2027} {"train_loss": -23.82684326171875, "global_step": 168318, "epoch": 2027} {"train_loss": -23.626489639282227, "global_step": 168319, "epoch": 2027} {"train_loss": -23.653135299682617, "global_step": 168320, "epoch": 2027} {"train_loss": -23.793651580810547, "global_step": 168321, "epoch": 2027} {"train_loss": -23.734336853027344, "global_step": 168322, "epoch": 2027} {"train_loss": -23.708231983414617, "global_step": 168323, "epoch": 2027, "val_loss": 6567787.0} {"train_loss": -23.55084800720215, "global_step": 168324, "epoch": 2028} {"train_loss": -22.78626823425293, "global_step": 168325, "epoch": 2028} {"train_loss": -21.99987030029297, "global_step": 168326, "epoch": 2028} {"train_loss": -22.389062881469727, "global_step": 168327, "epoch": 2028} {"train_loss": -23.38544273376465, "global_step": 168328, "epoch": 2028} {"train_loss": -22.86224365234375, "global_step": 168329, "epoch": 2028} {"train_loss": -22.97157859802246, "global_step": 168330, "epoch": 2028} {"train_loss": -23.473669052124023, "global_step": 168331, "epoch": 2028} {"train_loss": -23.51545524597168, "global_step": 168332, "epoch": 2028} {"train_loss": -23.460712432861328, "global_step": 168333, "epoch": 2028} {"train_loss": -23.40069580078125, "global_step": 168334, "epoch": 2028} {"train_loss": -23.19921112060547, "global_step": 168335, "epoch": 2028} {"train_loss": -23.3895320892334, "global_step": 168336, "epoch": 2028} {"train_loss": -23.3458309173584, "global_step": 168337, "epoch": 2028} {"train_loss": -23.612394332885742, "global_step": 168338, "epoch": 2028} {"train_loss": -23.119354248046875, "global_step": 168339, "epoch": 2028} {"train_loss": -23.605024337768555, "global_step": 168340, "epoch": 2028} {"train_loss": -23.587976455688477, "global_step": 168341, "epoch": 2028} {"train_loss": -23.43680763244629, "global_step": 168342, "epoch": 2028} {"train_loss": -23.5034236907959, "global_step": 168343, "epoch": 2028} {"train_loss": -23.48593521118164, "global_step": 168344, "epoch": 2028} {"train_loss": -23.272340774536133, "global_step": 168345, "epoch": 2028} {"train_loss": -23.282697677612305, "global_step": 168346, "epoch": 2028} {"train_loss": -23.67391014099121, "global_step": 168347, "epoch": 2028} {"train_loss": -22.995752334594727, "global_step": 168348, "epoch": 2028} {"train_loss": -23.528594970703125, "global_step": 168349, "epoch": 2028} {"train_loss": -23.390844345092773, "global_step": 168350, "epoch": 2028} {"train_loss": -23.46484375, "global_step": 168351, "epoch": 2028} {"train_loss": -23.210498809814453, "global_step": 168352, "epoch": 2028} {"train_loss": -23.64480972290039, "global_step": 168353, "epoch": 2028} {"train_loss": -23.540014266967773, "global_step": 168354, "epoch": 2028} {"train_loss": -23.51607322692871, "global_step": 168355, "epoch": 2028} {"train_loss": -23.59372901916504, "global_step": 168356, "epoch": 2028} {"train_loss": -23.30763816833496, "global_step": 168357, "epoch": 2028} {"train_loss": -23.95398712158203, "global_step": 168358, "epoch": 2028} {"train_loss": -23.83174705505371, "global_step": 168359, "epoch": 2028} {"train_loss": -23.773557662963867, "global_step": 168360, "epoch": 2028} {"train_loss": -23.827468872070312, "global_step": 168361, "epoch": 2028} {"train_loss": -23.689977645874023, "global_step": 168362, "epoch": 2028} {"train_loss": -23.596599578857422, "global_step": 168363, "epoch": 2028} {"train_loss": -23.685115814208984, "global_step": 168364, "epoch": 2028} {"train_loss": -24.33478355407715, "global_step": 168365, "epoch": 2028} {"train_loss": -23.823959350585938, "global_step": 168366, "epoch": 2028} {"train_loss": -23.933441162109375, "global_step": 168367, "epoch": 2028} {"train_loss": -23.211254119873047, "global_step": 168368, "epoch": 2028} {"train_loss": -23.57369041442871, "global_step": 168369, "epoch": 2028} {"train_loss": -23.801130294799805, "global_step": 168370, "epoch": 2028} {"train_loss": -23.672733306884766, "global_step": 168371, "epoch": 2028} {"train_loss": -23.745786666870117, "global_step": 168372, "epoch": 2028} {"train_loss": -23.704763412475586, "global_step": 168373, "epoch": 2028} {"train_loss": -23.6495361328125, "global_step": 168374, "epoch": 2028} {"train_loss": -23.66900062561035, "global_step": 168375, "epoch": 2028} {"train_loss": -23.2641658782959, "global_step": 168376, "epoch": 2028} {"train_loss": -23.41494369506836, "global_step": 168377, "epoch": 2028} {"train_loss": -24.058208465576172, "global_step": 168378, "epoch": 2028} {"train_loss": -23.865097045898438, "global_step": 168379, "epoch": 2028} {"train_loss": -23.41180992126465, "global_step": 168380, "epoch": 2028} {"train_loss": -23.307453155517578, "global_step": 168381, "epoch": 2028} {"train_loss": -23.56314468383789, "global_step": 168382, "epoch": 2028} {"train_loss": -23.88218116760254, "global_step": 168383, "epoch": 2028} {"train_loss": -23.466999053955078, "global_step": 168384, "epoch": 2028} {"train_loss": -23.66529655456543, "global_step": 168385, "epoch": 2028} {"train_loss": -23.539052963256836, "global_step": 168386, "epoch": 2028} {"train_loss": -23.72112464904785, "global_step": 168387, "epoch": 2028} {"train_loss": -23.847455978393555, "global_step": 168388, "epoch": 2028} {"train_loss": -23.546663284301758, "global_step": 168389, "epoch": 2028} {"train_loss": -23.59408950805664, "global_step": 168390, "epoch": 2028} {"train_loss": -23.562570571899414, "global_step": 168391, "epoch": 2028} {"train_loss": -23.578588485717773, "global_step": 168392, "epoch": 2028} {"train_loss": -23.504322052001953, "global_step": 168393, "epoch": 2028} {"train_loss": -23.54664421081543, "global_step": 168394, "epoch": 2028} {"train_loss": -23.78005599975586, "global_step": 168395, "epoch": 2028} {"train_loss": -23.534439086914062, "global_step": 168396, "epoch": 2028} {"train_loss": -23.756437301635742, "global_step": 168397, "epoch": 2028} {"train_loss": -23.657241821289062, "global_step": 168398, "epoch": 2028} {"train_loss": -23.92466163635254, "global_step": 168399, "epoch": 2028} {"train_loss": -23.515758514404297, "global_step": 168400, "epoch": 2028} {"train_loss": -23.895904541015625, "global_step": 168401, "epoch": 2028} {"train_loss": -23.407108306884766, "global_step": 168402, "epoch": 2028} {"train_loss": -23.67085075378418, "global_step": 168403, "epoch": 2028} {"train_loss": -23.87596321105957, "global_step": 168404, "epoch": 2028} {"train_loss": -23.34269142150879, "global_step": 168405, "epoch": 2028} {"train_loss": -23.524272757840443, "global_step": 168406, "epoch": 2028, "val_loss": 6302472.5} {"train_loss": -23.8703556060791, "global_step": 168407, "epoch": 2029} {"train_loss": -23.324874877929688, "global_step": 168408, "epoch": 2029} {"train_loss": -23.603347778320312, "global_step": 168409, "epoch": 2029} {"train_loss": -23.03242301940918, "global_step": 168410, "epoch": 2029} {"train_loss": -23.60560417175293, "global_step": 168411, "epoch": 2029} {"train_loss": -23.151342391967773, "global_step": 168412, "epoch": 2029} {"train_loss": -23.55341339111328, "global_step": 168413, "epoch": 2029} {"train_loss": -23.1630859375, "global_step": 168414, "epoch": 2029} {"train_loss": -23.137489318847656, "global_step": 168415, "epoch": 2029} {"train_loss": -23.63572120666504, "global_step": 168416, "epoch": 2029} {"train_loss": -23.405445098876953, "global_step": 168417, "epoch": 2029} {"train_loss": -23.376596450805664, "global_step": 168418, "epoch": 2029} {"train_loss": -23.842443466186523, "global_step": 168419, "epoch": 2029} {"train_loss": -23.409334182739258, "global_step": 168420, "epoch": 2029} {"train_loss": -23.578453063964844, "global_step": 168421, "epoch": 2029} {"train_loss": -23.6425838470459, "global_step": 168422, "epoch": 2029} {"train_loss": -23.635465621948242, "global_step": 168423, "epoch": 2029} {"train_loss": -23.639902114868164, "global_step": 168424, "epoch": 2029} {"train_loss": -23.766355514526367, "global_step": 168425, "epoch": 2029} {"train_loss": -23.260482788085938, "global_step": 168426, "epoch": 2029} {"train_loss": -23.639986038208008, "global_step": 168427, "epoch": 2029} {"train_loss": -23.7723445892334, "global_step": 168428, "epoch": 2029} {"train_loss": -23.750537872314453, "global_step": 168429, "epoch": 2029} {"train_loss": -23.85597038269043, "global_step": 168430, "epoch": 2029} {"train_loss": -23.869199752807617, "global_step": 168431, "epoch": 2029} {"train_loss": -23.944223403930664, "global_step": 168432, "epoch": 2029} {"train_loss": -23.713668823242188, "global_step": 168433, "epoch": 2029} {"train_loss": -23.814437866210938, "global_step": 168434, "epoch": 2029} {"train_loss": -23.820701599121094, "global_step": 168435, "epoch": 2029} {"train_loss": -23.38995361328125, "global_step": 168436, "epoch": 2029} {"train_loss": -23.57440757751465, "global_step": 168437, "epoch": 2029} {"train_loss": -23.610435485839844, "global_step": 168438, "epoch": 2029} {"train_loss": -23.522172927856445, "global_step": 168439, "epoch": 2029} {"train_loss": -23.777057647705078, "global_step": 168440, "epoch": 2029} {"train_loss": -23.692472457885742, "global_step": 168441, "epoch": 2029} {"train_loss": -23.35055160522461, "global_step": 168442, "epoch": 2029} {"train_loss": -23.815942764282227, "global_step": 168443, "epoch": 2029} {"train_loss": -23.58146095275879, "global_step": 168444, "epoch": 2029} {"train_loss": -23.387672424316406, "global_step": 168445, "epoch": 2029} {"train_loss": -23.789281845092773, "global_step": 168446, "epoch": 2029} {"train_loss": -23.89813232421875, "global_step": 168447, "epoch": 2029} {"train_loss": -23.68403434753418, "global_step": 168448, "epoch": 2029} {"train_loss": -23.60426139831543, "global_step": 168449, "epoch": 2029} {"train_loss": -23.643569946289062, "global_step": 168450, "epoch": 2029} {"train_loss": -23.619489669799805, "global_step": 168451, "epoch": 2029} {"train_loss": -23.6082706451416, "global_step": 168452, "epoch": 2029} {"train_loss": -23.655574798583984, "global_step": 168453, "epoch": 2029} {"train_loss": -23.39069175720215, "global_step": 168454, "epoch": 2029} {"train_loss": -23.225921630859375, "global_step": 168455, "epoch": 2029} {"train_loss": -23.7022705078125, "global_step": 168456, "epoch": 2029} {"train_loss": -23.93285369873047, "global_step": 168457, "epoch": 2029} {"train_loss": -24.173240661621094, "global_step": 168458, "epoch": 2029} {"train_loss": -23.76667594909668, "global_step": 168459, "epoch": 2029} {"train_loss": -23.532346725463867, "global_step": 168460, "epoch": 2029} {"train_loss": -23.82811164855957, "global_step": 168461, "epoch": 2029} {"train_loss": -23.53285026550293, "global_step": 168462, "epoch": 2029} {"train_loss": -24.056324005126953, "global_step": 168463, "epoch": 2029} {"train_loss": -23.768325805664062, "global_step": 168464, "epoch": 2029} {"train_loss": -23.72547721862793, "global_step": 168465, "epoch": 2029} {"train_loss": -23.87531852722168, "global_step": 168466, "epoch": 2029} {"train_loss": -23.606212615966797, "global_step": 168467, "epoch": 2029} {"train_loss": -24.067068099975586, "global_step": 168468, "epoch": 2029} {"train_loss": -23.97901153564453, "global_step": 168469, "epoch": 2029} {"train_loss": -23.54633331298828, "global_step": 168470, "epoch": 2029} {"train_loss": -23.652273178100586, "global_step": 168471, "epoch": 2029} {"train_loss": -23.8425350189209, "global_step": 168472, "epoch": 2029} {"train_loss": -23.753829956054688, "global_step": 168473, "epoch": 2029} {"train_loss": -23.870834350585938, "global_step": 168474, "epoch": 2029} {"train_loss": -23.813621520996094, "global_step": 168475, "epoch": 2029} {"train_loss": -23.827682495117188, "global_step": 168476, "epoch": 2029} {"train_loss": -23.730710983276367, "global_step": 168477, "epoch": 2029} {"train_loss": -23.819997787475586, "global_step": 168478, "epoch": 2029} {"train_loss": -23.747907638549805, "global_step": 168479, "epoch": 2029} {"train_loss": -23.27223777770996, "global_step": 168480, "epoch": 2029} {"train_loss": -23.73658561706543, "global_step": 168481, "epoch": 2029} {"train_loss": -23.355093002319336, "global_step": 168482, "epoch": 2029} {"train_loss": -23.466167449951172, "global_step": 168483, "epoch": 2029} {"train_loss": -23.85232925415039, "global_step": 168484, "epoch": 2029} {"train_loss": -23.832242965698242, "global_step": 168485, "epoch": 2029} {"train_loss": -23.321624755859375, "global_step": 168486, "epoch": 2029} {"train_loss": -23.857091903686523, "global_step": 168487, "epoch": 2029} {"train_loss": -23.745832443237305, "global_step": 168488, "epoch": 2029} {"train_loss": -23.635308966579206, "global_step": 168489, "epoch": 2029, "val_loss": 6398497.0} {"train_loss": -22.67006492614746, "global_step": 168490, "epoch": 2030} {"train_loss": -23.46807289123535, "global_step": 168491, "epoch": 2030} {"train_loss": -23.39045524597168, "global_step": 168492, "epoch": 2030} {"train_loss": -22.825101852416992, "global_step": 168493, "epoch": 2030} {"train_loss": -23.909439086914062, "global_step": 168494, "epoch": 2030} {"train_loss": -22.97589111328125, "global_step": 168495, "epoch": 2030} {"train_loss": -23.16380500793457, "global_step": 168496, "epoch": 2030} {"train_loss": -23.326454162597656, "global_step": 168497, "epoch": 2030} {"train_loss": -23.01044273376465, "global_step": 168498, "epoch": 2030} {"train_loss": -23.325117111206055, "global_step": 168499, "epoch": 2030} {"train_loss": -23.139436721801758, "global_step": 168500, "epoch": 2030} {"train_loss": -23.340042114257812, "global_step": 168501, "epoch": 2030} {"train_loss": -23.57598114013672, "global_step": 168502, "epoch": 2030} {"train_loss": -23.58940887451172, "global_step": 168503, "epoch": 2030} {"train_loss": -23.27117919921875, "global_step": 168504, "epoch": 2030} {"train_loss": -23.27052116394043, "global_step": 168505, "epoch": 2030} {"train_loss": -23.53389549255371, "global_step": 168506, "epoch": 2030} {"train_loss": -23.628705978393555, "global_step": 168507, "epoch": 2030} {"train_loss": -23.390005111694336, "global_step": 168508, "epoch": 2030} {"train_loss": -23.80319595336914, "global_step": 168509, "epoch": 2030} {"train_loss": -23.587610244750977, "global_step": 168510, "epoch": 2030} {"train_loss": -23.21602439880371, "global_step": 168511, "epoch": 2030} {"train_loss": -23.516578674316406, "global_step": 168512, "epoch": 2030} {"train_loss": -23.602962493896484, "global_step": 168513, "epoch": 2030} {"train_loss": -23.518321990966797, "global_step": 168514, "epoch": 2030} {"train_loss": -23.450359344482422, "global_step": 168515, "epoch": 2030} {"train_loss": -23.84339714050293, "global_step": 168516, "epoch": 2030} {"train_loss": -23.576847076416016, "global_step": 168517, "epoch": 2030} {"train_loss": -23.652341842651367, "global_step": 168518, "epoch": 2030} {"train_loss": -23.450471878051758, "global_step": 168519, "epoch": 2030} {"train_loss": -23.49549674987793, "global_step": 168520, "epoch": 2030} {"train_loss": -23.61311149597168, "global_step": 168521, "epoch": 2030} {"train_loss": -23.688779830932617, "global_step": 168522, "epoch": 2030} {"train_loss": -23.658687591552734, "global_step": 168523, "epoch": 2030} {"train_loss": -23.80035972595215, "global_step": 168524, "epoch": 2030} {"train_loss": -23.7218074798584, "global_step": 168525, "epoch": 2030} {"train_loss": -23.769601821899414, "global_step": 168526, "epoch": 2030} {"train_loss": -23.727628707885742, "global_step": 168527, "epoch": 2030} {"train_loss": -23.85666275024414, "global_step": 168528, "epoch": 2030} {"train_loss": -24.023563385009766, "global_step": 168529, "epoch": 2030} {"train_loss": -23.84903907775879, "global_step": 168530, "epoch": 2030} {"train_loss": -23.94234848022461, "global_step": 168531, "epoch": 2030} {"train_loss": -23.858903884887695, "global_step": 168532, "epoch": 2030} {"train_loss": -23.836414337158203, "global_step": 168533, "epoch": 2030} {"train_loss": -23.754552841186523, "global_step": 168534, "epoch": 2030} {"train_loss": -23.963712692260742, "global_step": 168535, "epoch": 2030} {"train_loss": -23.684385299682617, "global_step": 168536, "epoch": 2030} {"train_loss": -23.44495964050293, "global_step": 168537, "epoch": 2030} {"train_loss": -23.67879295349121, "global_step": 168538, "epoch": 2030} {"train_loss": -23.2282772064209, "global_step": 168539, "epoch": 2030} {"train_loss": -23.880964279174805, "global_step": 168540, "epoch": 2030} {"train_loss": -23.73164939880371, "global_step": 168541, "epoch": 2030} {"train_loss": -23.90590476989746, "global_step": 168542, "epoch": 2030} {"train_loss": -23.845989227294922, "global_step": 168543, "epoch": 2030} {"train_loss": -23.259920120239258, "global_step": 168544, "epoch": 2030} {"train_loss": -23.905349731445312, "global_step": 168545, "epoch": 2030} {"train_loss": -23.910634994506836, "global_step": 168546, "epoch": 2030} {"train_loss": -23.87961196899414, "global_step": 168547, "epoch": 2030} {"train_loss": -23.780187606811523, "global_step": 168548, "epoch": 2030} {"train_loss": -23.558788299560547, "global_step": 168549, "epoch": 2030} {"train_loss": -23.669424057006836, "global_step": 168550, "epoch": 2030} {"train_loss": -23.783145904541016, "global_step": 168551, "epoch": 2030} {"train_loss": -23.910066604614258, "global_step": 168552, "epoch": 2030} {"train_loss": -23.779369354248047, "global_step": 168553, "epoch": 2030} {"train_loss": -23.56879234313965, "global_step": 168554, "epoch": 2030} {"train_loss": -23.919233322143555, "global_step": 168555, "epoch": 2030} {"train_loss": -23.913358688354492, "global_step": 168556, "epoch": 2030} {"train_loss": -23.70827293395996, "global_step": 168557, "epoch": 2030} {"train_loss": -23.644441604614258, "global_step": 168558, "epoch": 2030} {"train_loss": -23.695602416992188, "global_step": 168559, "epoch": 2030} {"train_loss": -22.99301528930664, "global_step": 168560, "epoch": 2030} {"train_loss": -23.474302291870117, "global_step": 168561, "epoch": 2030} {"train_loss": -23.83163833618164, "global_step": 168562, "epoch": 2030} {"train_loss": -23.796680450439453, "global_step": 168563, "epoch": 2030} {"train_loss": -23.23410415649414, "global_step": 168564, "epoch": 2030} {"train_loss": -23.785558700561523, "global_step": 168565, "epoch": 2030} {"train_loss": -23.712066650390625, "global_step": 168566, "epoch": 2030} {"train_loss": -24.056264877319336, "global_step": 168567, "epoch": 2030} {"train_loss": -24.0969181060791, "global_step": 168568, "epoch": 2030} {"train_loss": -23.394025802612305, "global_step": 168569, "epoch": 2030} {"train_loss": -23.609792709350586, "global_step": 168570, "epoch": 2030} {"train_loss": -23.533817291259766, "global_step": 168571, "epoch": 2030} {"train_loss": -23.618274688720703, "global_step": 168572, "epoch": 2030, "val_loss": 6389686.0} {"train_loss": -22.867633819580078, "global_step": 168573, "epoch": 2031} {"train_loss": -23.291860580444336, "global_step": 168574, "epoch": 2031} {"train_loss": -23.138713836669922, "global_step": 168575, "epoch": 2031} {"train_loss": -22.844741821289062, "global_step": 168576, "epoch": 2031} {"train_loss": -22.879138946533203, "global_step": 168577, "epoch": 2031} {"train_loss": -23.090024948120117, "global_step": 168578, "epoch": 2031} {"train_loss": -23.101552963256836, "global_step": 168579, "epoch": 2031} {"train_loss": -22.992673873901367, "global_step": 168580, "epoch": 2031} {"train_loss": -23.199077606201172, "global_step": 168581, "epoch": 2031} {"train_loss": -23.432180404663086, "global_step": 168582, "epoch": 2031} {"train_loss": -23.193876266479492, "global_step": 168583, "epoch": 2031} {"train_loss": -23.354663848876953, "global_step": 168584, "epoch": 2031} {"train_loss": -23.493408203125, "global_step": 168585, "epoch": 2031} {"train_loss": -23.407608032226562, "global_step": 168586, "epoch": 2031} {"train_loss": -23.42642593383789, "global_step": 168587, "epoch": 2031} {"train_loss": -23.39493179321289, "global_step": 168588, "epoch": 2031} {"train_loss": -23.569616317749023, "global_step": 168589, "epoch": 2031} {"train_loss": -23.56201934814453, "global_step": 168590, "epoch": 2031} {"train_loss": -23.047086715698242, "global_step": 168591, "epoch": 2031} {"train_loss": -23.449438095092773, "global_step": 168592, "epoch": 2031} {"train_loss": -23.564481735229492, "global_step": 168593, "epoch": 2031} {"train_loss": -23.619169235229492, "global_step": 168594, "epoch": 2031} {"train_loss": -23.59295082092285, "global_step": 168595, "epoch": 2031} {"train_loss": -23.602346420288086, "global_step": 168596, "epoch": 2031} {"train_loss": -23.17508316040039, "global_step": 168597, "epoch": 2031} {"train_loss": -23.687732696533203, "global_step": 168598, "epoch": 2031} {"train_loss": -23.48438835144043, "global_step": 168599, "epoch": 2031} {"train_loss": -23.829086303710938, "global_step": 168600, "epoch": 2031} {"train_loss": -23.573604583740234, "global_step": 168601, "epoch": 2031} {"train_loss": -23.494489669799805, "global_step": 168602, "epoch": 2031} {"train_loss": -23.607423782348633, "global_step": 168603, "epoch": 2031} {"train_loss": -23.875289916992188, "global_step": 168604, "epoch": 2031} {"train_loss": -23.75040054321289, "global_step": 168605, "epoch": 2031} {"train_loss": -23.89412498474121, "global_step": 168606, "epoch": 2031} {"train_loss": -23.785154342651367, "global_step": 168607, "epoch": 2031} {"train_loss": -23.885284423828125, "global_step": 168608, "epoch": 2031} {"train_loss": -23.522302627563477, "global_step": 168609, "epoch": 2031} {"train_loss": -23.887374877929688, "global_step": 168610, "epoch": 2031} {"train_loss": -23.67311668395996, "global_step": 168611, "epoch": 2031} {"train_loss": -23.929868698120117, "global_step": 168612, "epoch": 2031} {"train_loss": -23.861759185791016, "global_step": 168613, "epoch": 2031} {"train_loss": -23.821447372436523, "global_step": 168614, "epoch": 2031} {"train_loss": -23.716970443725586, "global_step": 168615, "epoch": 2031} {"train_loss": -23.63874053955078, "global_step": 168616, "epoch": 2031} {"train_loss": -23.76932144165039, "global_step": 168617, "epoch": 2031} {"train_loss": -23.636001586914062, "global_step": 168618, "epoch": 2031} {"train_loss": -23.992258071899414, "global_step": 168619, "epoch": 2031} {"train_loss": -23.822660446166992, "global_step": 168620, "epoch": 2031} {"train_loss": -23.794498443603516, "global_step": 168621, "epoch": 2031} {"train_loss": -23.882028579711914, "global_step": 168622, "epoch": 2031} {"train_loss": -23.816268920898438, "global_step": 168623, "epoch": 2031} {"train_loss": -23.63306427001953, "global_step": 168624, "epoch": 2031} {"train_loss": -23.768268585205078, "global_step": 168625, "epoch": 2031} {"train_loss": -23.948793411254883, "global_step": 168626, "epoch": 2031} {"train_loss": -23.832447052001953, "global_step": 168627, "epoch": 2031} {"train_loss": -23.63380241394043, "global_step": 168628, "epoch": 2031} {"train_loss": -23.616518020629883, "global_step": 168629, "epoch": 2031} {"train_loss": -24.08896255493164, "global_step": 168630, "epoch": 2031} {"train_loss": -23.938650131225586, "global_step": 168631, "epoch": 2031} {"train_loss": -23.794267654418945, "global_step": 168632, "epoch": 2031} {"train_loss": -23.922225952148438, "global_step": 168633, "epoch": 2031} {"train_loss": -23.32819938659668, "global_step": 168634, "epoch": 2031} {"train_loss": -23.727527618408203, "global_step": 168635, "epoch": 2031} {"train_loss": -23.70477294921875, "global_step": 168636, "epoch": 2031} {"train_loss": -23.77370262145996, "global_step": 168637, "epoch": 2031} {"train_loss": -23.84013557434082, "global_step": 168638, "epoch": 2031} {"train_loss": -23.81424331665039, "global_step": 168639, "epoch": 2031} {"train_loss": -23.566659927368164, "global_step": 168640, "epoch": 2031} {"train_loss": -23.549850463867188, "global_step": 168641, "epoch": 2031} {"train_loss": -23.761178970336914, "global_step": 168642, "epoch": 2031} {"train_loss": -23.473834991455078, "global_step": 168643, "epoch": 2031} {"train_loss": -23.39198875427246, "global_step": 168644, "epoch": 2031} {"train_loss": -23.819440841674805, "global_step": 168645, "epoch": 2031} {"train_loss": -23.376052856445312, "global_step": 168646, "epoch": 2031} {"train_loss": -23.839948654174805, "global_step": 168647, "epoch": 2031} {"train_loss": -23.635570526123047, "global_step": 168648, "epoch": 2031} {"train_loss": -23.187990188598633, "global_step": 168649, "epoch": 2031} {"train_loss": -23.94509506225586, "global_step": 168650, "epoch": 2031} {"train_loss": -23.6875, "global_step": 168651, "epoch": 2031} {"train_loss": -23.879531860351562, "global_step": 168652, "epoch": 2031} {"train_loss": -23.938344955444336, "global_step": 168653, "epoch": 2031} {"train_loss": -23.498586654663086, "global_step": 168654, "epoch": 2031} {"train_loss": -23.57974505137248, "global_step": 168655, "epoch": 2031, "val_loss": 6262499.0} {"train_loss": -23.232702255249023, "global_step": 168656, "epoch": 2032} {"train_loss": -23.298019409179688, "global_step": 168657, "epoch": 2032} {"train_loss": -23.31513786315918, "global_step": 168658, "epoch": 2032} {"train_loss": -23.41963768005371, "global_step": 168659, "epoch": 2032} {"train_loss": -23.240455627441406, "global_step": 168660, "epoch": 2032} {"train_loss": -23.088054656982422, "global_step": 168661, "epoch": 2032} {"train_loss": -23.6383113861084, "global_step": 168662, "epoch": 2032} {"train_loss": -23.365034103393555, "global_step": 168663, "epoch": 2032} {"train_loss": -23.622907638549805, "global_step": 168664, "epoch": 2032} {"train_loss": -23.61879539489746, "global_step": 168665, "epoch": 2032} {"train_loss": -23.583728790283203, "global_step": 168666, "epoch": 2032} {"train_loss": -23.55879020690918, "global_step": 168667, "epoch": 2032} {"train_loss": -23.665189743041992, "global_step": 168668, "epoch": 2032} {"train_loss": -23.563770294189453, "global_step": 168669, "epoch": 2032} {"train_loss": -23.574310302734375, "global_step": 168670, "epoch": 2032} {"train_loss": -23.252988815307617, "global_step": 168671, "epoch": 2032} {"train_loss": -23.586957931518555, "global_step": 168672, "epoch": 2032} {"train_loss": -23.512271881103516, "global_step": 168673, "epoch": 2032} {"train_loss": -23.867189407348633, "global_step": 168674, "epoch": 2032} {"train_loss": -23.801761627197266, "global_step": 168675, "epoch": 2032} {"train_loss": -23.577695846557617, "global_step": 168676, "epoch": 2032} {"train_loss": -23.63044548034668, "global_step": 168677, "epoch": 2032} {"train_loss": -23.51658058166504, "global_step": 168678, "epoch": 2032} {"train_loss": -23.833515167236328, "global_step": 168679, "epoch": 2032} {"train_loss": -23.59664535522461, "global_step": 168680, "epoch": 2032} {"train_loss": -23.276819229125977, "global_step": 168681, "epoch": 2032} {"train_loss": -23.663358688354492, "global_step": 168682, "epoch": 2032} {"train_loss": -23.27707290649414, "global_step": 168683, "epoch": 2032} {"train_loss": -23.602537155151367, "global_step": 168684, "epoch": 2032} {"train_loss": -23.64760971069336, "global_step": 168685, "epoch": 2032} {"train_loss": -23.744747161865234, "global_step": 168686, "epoch": 2032} {"train_loss": -23.93073844909668, "global_step": 168687, "epoch": 2032} {"train_loss": -23.409330368041992, "global_step": 168688, "epoch": 2032} {"train_loss": -23.536941528320312, "global_step": 168689, "epoch": 2032} {"train_loss": -23.803918838500977, "global_step": 168690, "epoch": 2032} {"train_loss": -24.084857940673828, "global_step": 168691, "epoch": 2032} {"train_loss": -23.771635055541992, "global_step": 168692, "epoch": 2032} {"train_loss": -23.77748680114746, "global_step": 168693, "epoch": 2032} {"train_loss": -23.485733032226562, "global_step": 168694, "epoch": 2032} {"train_loss": -23.356077194213867, "global_step": 168695, "epoch": 2032} {"train_loss": -23.44676971435547, "global_step": 168696, "epoch": 2032} {"train_loss": -23.89261817932129, "global_step": 168697, "epoch": 2032} {"train_loss": -23.43450164794922, "global_step": 168698, "epoch": 2032} {"train_loss": -23.54273796081543, "global_step": 168699, "epoch": 2032} {"train_loss": -23.65641212463379, "global_step": 168700, "epoch": 2032} {"train_loss": -23.847444534301758, "global_step": 168701, "epoch": 2032} {"train_loss": -23.52748680114746, "global_step": 168702, "epoch": 2032} {"train_loss": -23.346576690673828, "global_step": 168703, "epoch": 2032} {"train_loss": -23.8459529876709, "global_step": 168704, "epoch": 2032} {"train_loss": -23.697595596313477, "global_step": 168705, "epoch": 2032} {"train_loss": -23.52456283569336, "global_step": 168706, "epoch": 2032} {"train_loss": -23.252119064331055, "global_step": 168707, "epoch": 2032} {"train_loss": -23.59547996520996, "global_step": 168708, "epoch": 2032} {"train_loss": -23.70940589904785, "global_step": 168709, "epoch": 2032} {"train_loss": -23.78499412536621, "global_step": 168710, "epoch": 2032} {"train_loss": -23.696088790893555, "global_step": 168711, "epoch": 2032} {"train_loss": -23.7961483001709, "global_step": 168712, "epoch": 2032} {"train_loss": -23.843963623046875, "global_step": 168713, "epoch": 2032} {"train_loss": -23.80928611755371, "global_step": 168714, "epoch": 2032} {"train_loss": -23.897323608398438, "global_step": 168715, "epoch": 2032} {"train_loss": -23.604259490966797, "global_step": 168716, "epoch": 2032} {"train_loss": -23.419424057006836, "global_step": 168717, "epoch": 2032} {"train_loss": -23.594266891479492, "global_step": 168718, "epoch": 2032} {"train_loss": -23.967905044555664, "global_step": 168719, "epoch": 2032} {"train_loss": -23.64483642578125, "global_step": 168720, "epoch": 2032} {"train_loss": -23.748083114624023, "global_step": 168721, "epoch": 2032} {"train_loss": -24.199567794799805, "global_step": 168722, "epoch": 2032} {"train_loss": -23.891923904418945, "global_step": 168723, "epoch": 2032} {"train_loss": -23.63641929626465, "global_step": 168724, "epoch": 2032} {"train_loss": -23.687326431274414, "global_step": 168725, "epoch": 2032} {"train_loss": -23.8115291595459, "global_step": 168726, "epoch": 2032} {"train_loss": -23.718111038208008, "global_step": 168727, "epoch": 2032} {"train_loss": -23.891950607299805, "global_step": 168728, "epoch": 2032} {"train_loss": -23.872127532958984, "global_step": 168729, "epoch": 2032} {"train_loss": -24.1256046295166, "global_step": 168730, "epoch": 2032} {"train_loss": -23.60755729675293, "global_step": 168731, "epoch": 2032} {"train_loss": -23.7418155670166, "global_step": 168732, "epoch": 2032} {"train_loss": -24.007740020751953, "global_step": 168733, "epoch": 2032} {"train_loss": -23.74342155456543, "global_step": 168734, "epoch": 2032} {"train_loss": -24.01978302001953, "global_step": 168735, "epoch": 2032} {"train_loss": -23.688724517822266, "global_step": 168736, "epoch": 2032} {"train_loss": -23.41763687133789, "global_step": 168737, "epoch": 2032} {"train_loss": -23.6482019539339, "global_step": 168738, "epoch": 2032, "val_loss": 6410855.0} {"train_loss": -22.69949722290039, "global_step": 168739, "epoch": 2033} {"train_loss": -22.433425903320312, "global_step": 168740, "epoch": 2033} {"train_loss": -23.019378662109375, "global_step": 168741, "epoch": 2033} {"train_loss": -22.682836532592773, "global_step": 168742, "epoch": 2033} {"train_loss": -22.917097091674805, "global_step": 168743, "epoch": 2033} {"train_loss": -22.670398712158203, "global_step": 168744, "epoch": 2033} {"train_loss": -23.192296981811523, "global_step": 168745, "epoch": 2033} {"train_loss": -23.197132110595703, "global_step": 168746, "epoch": 2033} {"train_loss": -22.910531997680664, "global_step": 168747, "epoch": 2033} {"train_loss": -23.34207534790039, "global_step": 168748, "epoch": 2033} {"train_loss": -23.177778244018555, "global_step": 168749, "epoch": 2033} {"train_loss": -23.17398452758789, "global_step": 168750, "epoch": 2033} {"train_loss": -23.079986572265625, "global_step": 168751, "epoch": 2033} {"train_loss": -23.25135612487793, "global_step": 168752, "epoch": 2033} {"train_loss": -23.38629722595215, "global_step": 168753, "epoch": 2033} {"train_loss": -23.615863800048828, "global_step": 168754, "epoch": 2033} {"train_loss": -23.312068939208984, "global_step": 168755, "epoch": 2033} {"train_loss": -23.227155685424805, "global_step": 168756, "epoch": 2033} {"train_loss": -23.366357803344727, "global_step": 168757, "epoch": 2033} {"train_loss": -23.635793685913086, "global_step": 168758, "epoch": 2033} {"train_loss": -23.2644100189209, "global_step": 168759, "epoch": 2033} {"train_loss": -23.690372467041016, "global_step": 168760, "epoch": 2033} {"train_loss": -23.3090763092041, "global_step": 168761, "epoch": 2033} {"train_loss": -23.23098373413086, "global_step": 168762, "epoch": 2033} {"train_loss": -23.455350875854492, "global_step": 168763, "epoch": 2033} {"train_loss": -23.54228401184082, "global_step": 168764, "epoch": 2033} {"train_loss": -23.679624557495117, "global_step": 168765, "epoch": 2033} {"train_loss": -23.3028621673584, "global_step": 168766, "epoch": 2033} {"train_loss": -23.973865509033203, "global_step": 168767, "epoch": 2033} {"train_loss": -23.58186149597168, "global_step": 168768, "epoch": 2033} {"train_loss": -23.6722354888916, "global_step": 168769, "epoch": 2033} {"train_loss": -23.429716110229492, "global_step": 168770, "epoch": 2033} {"train_loss": -23.484582901000977, "global_step": 168771, "epoch": 2033} {"train_loss": -23.958078384399414, "global_step": 168772, "epoch": 2033} {"train_loss": -23.57954978942871, "global_step": 168773, "epoch": 2033} {"train_loss": -23.327730178833008, "global_step": 168774, "epoch": 2033} {"train_loss": -23.631818771362305, "global_step": 168775, "epoch": 2033} {"train_loss": -23.63968849182129, "global_step": 168776, "epoch": 2033} {"train_loss": -23.521955490112305, "global_step": 168777, "epoch": 2033} {"train_loss": -23.43574333190918, "global_step": 168778, "epoch": 2033} {"train_loss": -23.737171173095703, "global_step": 168779, "epoch": 2033} {"train_loss": -24.09739112854004, "global_step": 168780, "epoch": 2033} {"train_loss": -23.452512741088867, "global_step": 168781, "epoch": 2033} {"train_loss": -23.54385757446289, "global_step": 168782, "epoch": 2033} {"train_loss": -23.447059631347656, "global_step": 168783, "epoch": 2033} {"train_loss": -23.86642074584961, "global_step": 168784, "epoch": 2033} {"train_loss": -23.49826431274414, "global_step": 168785, "epoch": 2033} {"train_loss": -23.536428451538086, "global_step": 168786, "epoch": 2033} {"train_loss": -23.495615005493164, "global_step": 168787, "epoch": 2033} {"train_loss": -23.217798233032227, "global_step": 168788, "epoch": 2033} {"train_loss": -23.214025497436523, "global_step": 168789, "epoch": 2033} {"train_loss": -23.486515045166016, "global_step": 168790, "epoch": 2033} {"train_loss": -23.732572555541992, "global_step": 168791, "epoch": 2033} {"train_loss": -23.34624671936035, "global_step": 168792, "epoch": 2033} {"train_loss": -23.076549530029297, "global_step": 168793, "epoch": 2033} {"train_loss": -23.59666633605957, "global_step": 168794, "epoch": 2033} {"train_loss": -23.6257381439209, "global_step": 168795, "epoch": 2033} {"train_loss": -23.67466163635254, "global_step": 168796, "epoch": 2033} {"train_loss": -23.507116317749023, "global_step": 168797, "epoch": 2033} {"train_loss": -23.52692985534668, "global_step": 168798, "epoch": 2033} {"train_loss": -24.007415771484375, "global_step": 168799, "epoch": 2033} {"train_loss": -23.666303634643555, "global_step": 168800, "epoch": 2033} {"train_loss": -23.82461929321289, "global_step": 168801, "epoch": 2033} {"train_loss": -24.027681350708008, "global_step": 168802, "epoch": 2033} {"train_loss": -23.483192443847656, "global_step": 168803, "epoch": 2033} {"train_loss": -23.814071655273438, "global_step": 168804, "epoch": 2033} {"train_loss": -23.909032821655273, "global_step": 168805, "epoch": 2033} {"train_loss": -23.94525146484375, "global_step": 168806, "epoch": 2033} {"train_loss": -23.31161880493164, "global_step": 168807, "epoch": 2033} {"train_loss": -23.959211349487305, "global_step": 168808, "epoch": 2033} {"train_loss": -23.13714599609375, "global_step": 168809, "epoch": 2033} {"train_loss": -23.862228393554688, "global_step": 168810, "epoch": 2033} {"train_loss": -23.877355575561523, "global_step": 168811, "epoch": 2033} {"train_loss": -23.5223331451416, "global_step": 168812, "epoch": 2033} {"train_loss": -24.10465431213379, "global_step": 168813, "epoch": 2033} {"train_loss": -23.541250228881836, "global_step": 168814, "epoch": 2033} {"train_loss": -23.26832389831543, "global_step": 168815, "epoch": 2033} {"train_loss": -23.56464195251465, "global_step": 168816, "epoch": 2033} {"train_loss": -23.631589889526367, "global_step": 168817, "epoch": 2033} {"train_loss": -23.60849952697754, "global_step": 168818, "epoch": 2033} {"train_loss": -23.687788009643555, "global_step": 168819, "epoch": 2033} {"train_loss": -23.7689208984375, "global_step": 168820, "epoch": 2033} {"train_loss": -23.480722036706396, "global_step": 168821, "epoch": 2033, "val_loss": 6468024.5} {"train_loss": -23.116010665893555, "global_step": 168822, "epoch": 2034} {"train_loss": -22.896411895751953, "global_step": 168823, "epoch": 2034} {"train_loss": -23.1986083984375, "global_step": 168824, "epoch": 2034} {"train_loss": -23.015798568725586, "global_step": 168825, "epoch": 2034} {"train_loss": -23.701990127563477, "global_step": 168826, "epoch": 2034} {"train_loss": -23.26699447631836, "global_step": 168827, "epoch": 2034} {"train_loss": -23.608129501342773, "global_step": 168828, "epoch": 2034} {"train_loss": -23.11090850830078, "global_step": 168829, "epoch": 2034} {"train_loss": -23.023162841796875, "global_step": 168830, "epoch": 2034} {"train_loss": -23.256505966186523, "global_step": 168831, "epoch": 2034} {"train_loss": -23.83222770690918, "global_step": 168832, "epoch": 2034} {"train_loss": -23.24932289123535, "global_step": 168833, "epoch": 2034} {"train_loss": -23.71259880065918, "global_step": 168834, "epoch": 2034} {"train_loss": -23.29937744140625, "global_step": 168835, "epoch": 2034} {"train_loss": -23.532142639160156, "global_step": 168836, "epoch": 2034} {"train_loss": -23.53774070739746, "global_step": 168837, "epoch": 2034} {"train_loss": -23.559606552124023, "global_step": 168838, "epoch": 2034} {"train_loss": -23.695444107055664, "global_step": 168839, "epoch": 2034} {"train_loss": -23.695219039916992, "global_step": 168840, "epoch": 2034} {"train_loss": -23.721643447875977, "global_step": 168841, "epoch": 2034} {"train_loss": -23.562875747680664, "global_step": 168842, "epoch": 2034} {"train_loss": -23.271085739135742, "global_step": 168843, "epoch": 2034} {"train_loss": -23.494958877563477, "global_step": 168844, "epoch": 2034} {"train_loss": -23.577199935913086, "global_step": 168845, "epoch": 2034} {"train_loss": -23.8170166015625, "global_step": 168846, "epoch": 2034} {"train_loss": -23.85011100769043, "global_step": 168847, "epoch": 2034} {"train_loss": -23.91063117980957, "global_step": 168848, "epoch": 2034} {"train_loss": -24.12689781188965, "global_step": 168849, "epoch": 2034} {"train_loss": -23.117589950561523, "global_step": 168850, "epoch": 2034} {"train_loss": -23.69016456604004, "global_step": 168851, "epoch": 2034} {"train_loss": -23.465103149414062, "global_step": 168852, "epoch": 2034} {"train_loss": -23.58334732055664, "global_step": 168853, "epoch": 2034} {"train_loss": -23.609167098999023, "global_step": 168854, "epoch": 2034} {"train_loss": -23.778467178344727, "global_step": 168855, "epoch": 2034} {"train_loss": -23.717235565185547, "global_step": 168856, "epoch": 2034} {"train_loss": -23.79933738708496, "global_step": 168857, "epoch": 2034} {"train_loss": -23.79426383972168, "global_step": 168858, "epoch": 2034} {"train_loss": -23.82972526550293, "global_step": 168859, "epoch": 2034} {"train_loss": -23.48797607421875, "global_step": 168860, "epoch": 2034} {"train_loss": -23.92682456970215, "global_step": 168861, "epoch": 2034} {"train_loss": -23.995227813720703, "global_step": 168862, "epoch": 2034} {"train_loss": -23.951322555541992, "global_step": 168863, "epoch": 2034} {"train_loss": -23.61964988708496, "global_step": 168864, "epoch": 2034} {"train_loss": -23.650897979736328, "global_step": 168865, "epoch": 2034} {"train_loss": -23.9113826751709, "global_step": 168866, "epoch": 2034} {"train_loss": -23.810117721557617, "global_step": 168867, "epoch": 2034} {"train_loss": -23.459386825561523, "global_step": 168868, "epoch": 2034} {"train_loss": -23.94730567932129, "global_step": 168869, "epoch": 2034} {"train_loss": -23.323379516601562, "global_step": 168870, "epoch": 2034} {"train_loss": -23.564603805541992, "global_step": 168871, "epoch": 2034} {"train_loss": -23.786352157592773, "global_step": 168872, "epoch": 2034} {"train_loss": -23.864717483520508, "global_step": 168873, "epoch": 2034} {"train_loss": -23.826139450073242, "global_step": 168874, "epoch": 2034} {"train_loss": -23.81486701965332, "global_step": 168875, "epoch": 2034} {"train_loss": -23.512062072753906, "global_step": 168876, "epoch": 2034} {"train_loss": -23.813810348510742, "global_step": 168877, "epoch": 2034} {"train_loss": -23.74727439880371, "global_step": 168878, "epoch": 2034} {"train_loss": -23.423376083374023, "global_step": 168879, "epoch": 2034} {"train_loss": -23.652420043945312, "global_step": 168880, "epoch": 2034} {"train_loss": -23.610647201538086, "global_step": 168881, "epoch": 2034} {"train_loss": -23.995471954345703, "global_step": 168882, "epoch": 2034} {"train_loss": -23.984973907470703, "global_step": 168883, "epoch": 2034} {"train_loss": -23.674489974975586, "global_step": 168884, "epoch": 2034} {"train_loss": -23.968137741088867, "global_step": 168885, "epoch": 2034} {"train_loss": -23.930438995361328, "global_step": 168886, "epoch": 2034} {"train_loss": -23.550769805908203, "global_step": 168887, "epoch": 2034} {"train_loss": -23.656782150268555, "global_step": 168888, "epoch": 2034} {"train_loss": -23.678144454956055, "global_step": 168889, "epoch": 2034} {"train_loss": -23.47969627380371, "global_step": 168890, "epoch": 2034} {"train_loss": -23.522611618041992, "global_step": 168891, "epoch": 2034} {"train_loss": -23.687833786010742, "global_step": 168892, "epoch": 2034} {"train_loss": -23.674163818359375, "global_step": 168893, "epoch": 2034} {"train_loss": -23.83892250061035, "global_step": 168894, "epoch": 2034} {"train_loss": -23.439302444458008, "global_step": 168895, "epoch": 2034} {"train_loss": -23.92938232421875, "global_step": 168896, "epoch": 2034} {"train_loss": -23.761856079101562, "global_step": 168897, "epoch": 2034} {"train_loss": -23.868452072143555, "global_step": 168898, "epoch": 2034} {"train_loss": -23.713590621948242, "global_step": 168899, "epoch": 2034} {"train_loss": -23.726245880126953, "global_step": 168900, "epoch": 2034} {"train_loss": -23.6333065032959, "global_step": 168901, "epoch": 2034} {"train_loss": -23.474451065063477, "global_step": 168902, "epoch": 2034} {"train_loss": -23.80413246154785, "global_step": 168903, "epoch": 2034} {"train_loss": -23.62996103677405, "global_step": 168904, "epoch": 2034, "val_loss": 6396964.0} {"train_loss": -23.7497615814209, "global_step": 168905, "epoch": 2035} {"train_loss": -22.956823348999023, "global_step": 168906, "epoch": 2035} {"train_loss": -23.354665756225586, "global_step": 168907, "epoch": 2035} {"train_loss": -23.62067222595215, "global_step": 168908, "epoch": 2035} {"train_loss": -23.116804122924805, "global_step": 168909, "epoch": 2035} {"train_loss": -23.71691131591797, "global_step": 168910, "epoch": 2035} {"train_loss": -23.29616928100586, "global_step": 168911, "epoch": 2035} {"train_loss": -23.38624382019043, "global_step": 168912, "epoch": 2035} {"train_loss": -23.603727340698242, "global_step": 168913, "epoch": 2035} {"train_loss": -23.552425384521484, "global_step": 168914, "epoch": 2035} {"train_loss": -23.177387237548828, "global_step": 168915, "epoch": 2035} {"train_loss": -23.77572250366211, "global_step": 168916, "epoch": 2035} {"train_loss": -23.566484451293945, "global_step": 168917, "epoch": 2035} {"train_loss": -23.485620498657227, "global_step": 168918, "epoch": 2035} {"train_loss": -23.68474769592285, "global_step": 168919, "epoch": 2035} {"train_loss": -23.593374252319336, "global_step": 168920, "epoch": 2035} {"train_loss": -23.367475509643555, "global_step": 168921, "epoch": 2035} {"train_loss": -23.771543502807617, "global_step": 168922, "epoch": 2035} {"train_loss": -23.424840927124023, "global_step": 168923, "epoch": 2035} {"train_loss": -23.485206604003906, "global_step": 168924, "epoch": 2035} {"train_loss": -23.94770622253418, "global_step": 168925, "epoch": 2035} {"train_loss": -23.562299728393555, "global_step": 168926, "epoch": 2035} {"train_loss": -23.65451431274414, "global_step": 168927, "epoch": 2035} {"train_loss": -23.707014083862305, "global_step": 168928, "epoch": 2035} {"train_loss": -23.736177444458008, "global_step": 168929, "epoch": 2035} {"train_loss": -23.695751190185547, "global_step": 168930, "epoch": 2035} {"train_loss": -23.856449127197266, "global_step": 168931, "epoch": 2035} {"train_loss": -23.707862854003906, "global_step": 168932, "epoch": 2035} {"train_loss": -23.750558853149414, "global_step": 168933, "epoch": 2035} {"train_loss": -23.656726837158203, "global_step": 168934, "epoch": 2035} {"train_loss": -23.593061447143555, "global_step": 168935, "epoch": 2035} {"train_loss": -23.633460998535156, "global_step": 168936, "epoch": 2035} {"train_loss": -24.087675094604492, "global_step": 168937, "epoch": 2035} {"train_loss": -23.890029907226562, "global_step": 168938, "epoch": 2035} {"train_loss": -23.749788284301758, "global_step": 168939, "epoch": 2035} {"train_loss": -23.79988670349121, "global_step": 168940, "epoch": 2035} {"train_loss": -23.82444190979004, "global_step": 168941, "epoch": 2035} {"train_loss": -23.710651397705078, "global_step": 168942, "epoch": 2035} {"train_loss": -23.796337127685547, "global_step": 168943, "epoch": 2035} {"train_loss": -24.122684478759766, "global_step": 168944, "epoch": 2035} {"train_loss": -23.637601852416992, "global_step": 168945, "epoch": 2035} {"train_loss": -23.38905143737793, "global_step": 168946, "epoch": 2035} {"train_loss": -23.245349884033203, "global_step": 168947, "epoch": 2035} {"train_loss": -23.433177947998047, "global_step": 168948, "epoch": 2035} {"train_loss": -23.65791893005371, "global_step": 168949, "epoch": 2035} {"train_loss": -23.497459411621094, "global_step": 168950, "epoch": 2035} {"train_loss": -23.725011825561523, "global_step": 168951, "epoch": 2035} {"train_loss": -23.55231475830078, "global_step": 168952, "epoch": 2035} {"train_loss": -23.511917114257812, "global_step": 168953, "epoch": 2035} {"train_loss": -23.46333885192871, "global_step": 168954, "epoch": 2035} {"train_loss": -23.963651657104492, "global_step": 168955, "epoch": 2035} {"train_loss": -23.55316162109375, "global_step": 168956, "epoch": 2035} {"train_loss": -23.557004928588867, "global_step": 168957, "epoch": 2035} {"train_loss": -23.915597915649414, "global_step": 168958, "epoch": 2035} {"train_loss": -24.068359375, "global_step": 168959, "epoch": 2035} {"train_loss": -23.85726547241211, "global_step": 168960, "epoch": 2035} {"train_loss": -23.226709365844727, "global_step": 168961, "epoch": 2035} {"train_loss": -23.614545822143555, "global_step": 168962, "epoch": 2035} {"train_loss": -23.598712921142578, "global_step": 168963, "epoch": 2035} {"train_loss": -23.603544235229492, "global_step": 168964, "epoch": 2035} {"train_loss": -23.59014320373535, "global_step": 168965, "epoch": 2035} {"train_loss": -23.47507095336914, "global_step": 168966, "epoch": 2035} {"train_loss": -23.85736083984375, "global_step": 168967, "epoch": 2035} {"train_loss": -23.48554801940918, "global_step": 168968, "epoch": 2035} {"train_loss": -23.633947372436523, "global_step": 168969, "epoch": 2035} {"train_loss": -23.71563720703125, "global_step": 168970, "epoch": 2035} {"train_loss": -23.6497802734375, "global_step": 168971, "epoch": 2035} {"train_loss": -23.96366310119629, "global_step": 168972, "epoch": 2035} {"train_loss": -23.571748733520508, "global_step": 168973, "epoch": 2035} {"train_loss": -23.731626510620117, "global_step": 168974, "epoch": 2035} {"train_loss": -23.77467918395996, "global_step": 168975, "epoch": 2035} {"train_loss": -23.711462020874023, "global_step": 168976, "epoch": 2035} {"train_loss": -24.079313278198242, "global_step": 168977, "epoch": 2035} {"train_loss": -23.281719207763672, "global_step": 168978, "epoch": 2035} {"train_loss": -23.857221603393555, "global_step": 168979, "epoch": 2035} {"train_loss": -24.188034057617188, "global_step": 168980, "epoch": 2035} {"train_loss": -23.69512176513672, "global_step": 168981, "epoch": 2035} {"train_loss": -23.784278869628906, "global_step": 168982, "epoch": 2035} {"train_loss": -23.872594833374023, "global_step": 168983, "epoch": 2035} {"train_loss": -23.46139144897461, "global_step": 168984, "epoch": 2035} {"train_loss": -23.306562423706055, "global_step": 168985, "epoch": 2035} {"train_loss": -23.57830810546875, "global_step": 168986, "epoch": 2035} {"train_loss": -23.64459416952478, "global_step": 168987, "epoch": 2035, "val_loss": 6461062.0} {"train_loss": -22.83173942565918, "global_step": 168988, "epoch": 2036} {"train_loss": -22.60851287841797, "global_step": 168989, "epoch": 2036} {"train_loss": -22.44413185119629, "global_step": 168990, "epoch": 2036} {"train_loss": -22.634618759155273, "global_step": 168991, "epoch": 2036} {"train_loss": -23.194076538085938, "global_step": 168992, "epoch": 2036} {"train_loss": -22.959970474243164, "global_step": 168993, "epoch": 2036} {"train_loss": -22.913190841674805, "global_step": 168994, "epoch": 2036} {"train_loss": -23.1064453125, "global_step": 168995, "epoch": 2036} {"train_loss": -23.009021759033203, "global_step": 168996, "epoch": 2036} {"train_loss": -23.002267837524414, "global_step": 168997, "epoch": 2036} {"train_loss": -23.421815872192383, "global_step": 168998, "epoch": 2036} {"train_loss": -23.015405654907227, "global_step": 168999, "epoch": 2036} {"train_loss": -23.14868927001953, "global_step": 169000, "epoch": 2036} {"train_loss": -23.243764877319336, "global_step": 169001, "epoch": 2036} {"train_loss": -23.198644638061523, "global_step": 169002, "epoch": 2036} {"train_loss": -23.610937118530273, "global_step": 169003, "epoch": 2036} {"train_loss": -23.086185455322266, "global_step": 169004, "epoch": 2036} {"train_loss": -23.24688148498535, "global_step": 169005, "epoch": 2036} {"train_loss": -23.045364379882812, "global_step": 169006, "epoch": 2036} {"train_loss": -22.793521881103516, "global_step": 169007, "epoch": 2036} {"train_loss": -23.18716812133789, "global_step": 169008, "epoch": 2036} {"train_loss": -23.1451473236084, "global_step": 169009, "epoch": 2036} {"train_loss": -23.5135555267334, "global_step": 169010, "epoch": 2036} {"train_loss": -23.10286521911621, "global_step": 169011, "epoch": 2036} {"train_loss": -23.55350112915039, "global_step": 169012, "epoch": 2036} {"train_loss": -23.54543113708496, "global_step": 169013, "epoch": 2036} {"train_loss": -23.514469146728516, "global_step": 169014, "epoch": 2036} {"train_loss": -23.798080444335938, "global_step": 169015, "epoch": 2036} {"train_loss": -23.545089721679688, "global_step": 169016, "epoch": 2036} {"train_loss": -23.604734420776367, "global_step": 169017, "epoch": 2036} {"train_loss": -23.32697868347168, "global_step": 169018, "epoch": 2036} {"train_loss": -23.854595184326172, "global_step": 169019, "epoch": 2036} {"train_loss": -23.883756637573242, "global_step": 169020, "epoch": 2036} {"train_loss": -23.914278030395508, "global_step": 169021, "epoch": 2036} {"train_loss": -23.477476119995117, "global_step": 169022, "epoch": 2036} {"train_loss": -23.69158935546875, "global_step": 169023, "epoch": 2036} {"train_loss": -23.80504608154297, "global_step": 169024, "epoch": 2036} {"train_loss": -23.382823944091797, "global_step": 169025, "epoch": 2036} {"train_loss": -23.840871810913086, "global_step": 169026, "epoch": 2036} {"train_loss": -23.593530654907227, "global_step": 169027, "epoch": 2036} {"train_loss": -23.947586059570312, "global_step": 169028, "epoch": 2036} {"train_loss": -23.542203903198242, "global_step": 169029, "epoch": 2036} {"train_loss": -23.7397518157959, "global_step": 169030, "epoch": 2036} {"train_loss": -23.832332611083984, "global_step": 169031, "epoch": 2036} {"train_loss": -23.452369689941406, "global_step": 169032, "epoch": 2036} {"train_loss": -23.45255470275879, "global_step": 169033, "epoch": 2036} {"train_loss": -23.612903594970703, "global_step": 169034, "epoch": 2036} {"train_loss": -23.64021110534668, "global_step": 169035, "epoch": 2036} {"train_loss": -23.56255531311035, "global_step": 169036, "epoch": 2036} {"train_loss": -23.92059326171875, "global_step": 169037, "epoch": 2036} {"train_loss": -23.854406356811523, "global_step": 169038, "epoch": 2036} {"train_loss": -23.89459800720215, "global_step": 169039, "epoch": 2036} {"train_loss": -24.04184913635254, "global_step": 169040, "epoch": 2036} {"train_loss": -23.525653839111328, "global_step": 169041, "epoch": 2036} {"train_loss": -23.78420066833496, "global_step": 169042, "epoch": 2036} {"train_loss": -23.929990768432617, "global_step": 169043, "epoch": 2036} {"train_loss": -23.458154678344727, "global_step": 169044, "epoch": 2036} {"train_loss": -23.465787887573242, "global_step": 169045, "epoch": 2036} {"train_loss": -23.705907821655273, "global_step": 169046, "epoch": 2036} {"train_loss": -23.358291625976562, "global_step": 169047, "epoch": 2036} {"train_loss": -24.212244033813477, "global_step": 169048, "epoch": 2036} {"train_loss": -23.66102409362793, "global_step": 169049, "epoch": 2036} {"train_loss": -23.65146255493164, "global_step": 169050, "epoch": 2036} {"train_loss": -23.57402992248535, "global_step": 169051, "epoch": 2036} {"train_loss": -23.843435287475586, "global_step": 169052, "epoch": 2036} {"train_loss": -23.78228187561035, "global_step": 169053, "epoch": 2036} {"train_loss": -23.426584243774414, "global_step": 169054, "epoch": 2036} {"train_loss": -24.078901290893555, "global_step": 169055, "epoch": 2036} {"train_loss": -23.90366554260254, "global_step": 169056, "epoch": 2036} {"train_loss": -23.631500244140625, "global_step": 169057, "epoch": 2036} {"train_loss": -23.552724838256836, "global_step": 169058, "epoch": 2036} {"train_loss": -23.50142478942871, "global_step": 169059, "epoch": 2036} {"train_loss": -23.800779342651367, "global_step": 169060, "epoch": 2036} {"train_loss": -23.636531829833984, "global_step": 169061, "epoch": 2036} {"train_loss": -23.49968719482422, "global_step": 169062, "epoch": 2036} {"train_loss": -23.403860092163086, "global_step": 169063, "epoch": 2036} {"train_loss": -23.645116806030273, "global_step": 169064, "epoch": 2036} {"train_loss": -23.56885528564453, "global_step": 169065, "epoch": 2036} {"train_loss": -23.58693504333496, "global_step": 169066, "epoch": 2036} {"train_loss": -23.880836486816406, "global_step": 169067, "epoch": 2036} {"train_loss": -24.026948928833008, "global_step": 169068, "epoch": 2036} {"train_loss": -23.97142791748047, "global_step": 169069, "epoch": 2036} {"train_loss": -23.50011363661433, "global_step": 169070, "epoch": 2036, "val_loss": 6372968.0} {"train_loss": -23.017873764038086, "global_step": 169071, "epoch": 2037} {"train_loss": -23.13743019104004, "global_step": 169072, "epoch": 2037} {"train_loss": -23.335081100463867, "global_step": 169073, "epoch": 2037} {"train_loss": -23.47319984436035, "global_step": 169074, "epoch": 2037} {"train_loss": -23.330068588256836, "global_step": 169075, "epoch": 2037} {"train_loss": -23.32818603515625, "global_step": 169076, "epoch": 2037} {"train_loss": -23.292123794555664, "global_step": 169077, "epoch": 2037} {"train_loss": -23.47034454345703, "global_step": 169078, "epoch": 2037} {"train_loss": -23.745615005493164, "global_step": 169079, "epoch": 2037} {"train_loss": -23.355239868164062, "global_step": 169080, "epoch": 2037} {"train_loss": -22.84380531311035, "global_step": 169081, "epoch": 2037} {"train_loss": -23.358020782470703, "global_step": 169082, "epoch": 2037} {"train_loss": -23.293636322021484, "global_step": 169083, "epoch": 2037} {"train_loss": -23.220468521118164, "global_step": 169084, "epoch": 2037} {"train_loss": -23.42661476135254, "global_step": 169085, "epoch": 2037} {"train_loss": -23.817678451538086, "global_step": 169086, "epoch": 2037} {"train_loss": -23.342344284057617, "global_step": 169087, "epoch": 2037} {"train_loss": -23.12819480895996, "global_step": 169088, "epoch": 2037} {"train_loss": -23.515108108520508, "global_step": 169089, "epoch": 2037} {"train_loss": -23.812360763549805, "global_step": 169090, "epoch": 2037} {"train_loss": -23.694812774658203, "global_step": 169091, "epoch": 2037} {"train_loss": -23.75193977355957, "global_step": 169092, "epoch": 2037} {"train_loss": -23.48874855041504, "global_step": 169093, "epoch": 2037} {"train_loss": -23.510051727294922, "global_step": 169094, "epoch": 2037} {"train_loss": -23.77754783630371, "global_step": 169095, "epoch": 2037} {"train_loss": -23.800933837890625, "global_step": 169096, "epoch": 2037} {"train_loss": -23.63936424255371, "global_step": 169097, "epoch": 2037} {"train_loss": -23.72416877746582, "global_step": 169098, "epoch": 2037} {"train_loss": -23.53212547302246, "global_step": 169099, "epoch": 2037} {"train_loss": -23.5605411529541, "global_step": 169100, "epoch": 2037} {"train_loss": -23.655017852783203, "global_step": 169101, "epoch": 2037} {"train_loss": -24.015792846679688, "global_step": 169102, "epoch": 2037} {"train_loss": -23.788827896118164, "global_step": 169103, "epoch": 2037} {"train_loss": -23.697980880737305, "global_step": 169104, "epoch": 2037} {"train_loss": -23.602975845336914, "global_step": 169105, "epoch": 2037} {"train_loss": -23.341333389282227, "global_step": 169106, "epoch": 2037} {"train_loss": -23.60006332397461, "global_step": 169107, "epoch": 2037} {"train_loss": -23.695632934570312, "global_step": 169108, "epoch": 2037} {"train_loss": -23.55547332763672, "global_step": 169109, "epoch": 2037} {"train_loss": -23.380109786987305, "global_step": 169110, "epoch": 2037} {"train_loss": -23.81374740600586, "global_step": 169111, "epoch": 2037} {"train_loss": -23.589487075805664, "global_step": 169112, "epoch": 2037} {"train_loss": -23.239017486572266, "global_step": 169113, "epoch": 2037} {"train_loss": -23.829309463500977, "global_step": 169114, "epoch": 2037} {"train_loss": -23.687633514404297, "global_step": 169115, "epoch": 2037} {"train_loss": -23.637937545776367, "global_step": 169116, "epoch": 2037} {"train_loss": -23.892921447753906, "global_step": 169117, "epoch": 2037} {"train_loss": -23.48116683959961, "global_step": 169118, "epoch": 2037} {"train_loss": -23.63159942626953, "global_step": 169119, "epoch": 2037} {"train_loss": -23.5156307220459, "global_step": 169120, "epoch": 2037} {"train_loss": -23.80830192565918, "global_step": 169121, "epoch": 2037} {"train_loss": -23.816783905029297, "global_step": 169122, "epoch": 2037} {"train_loss": -24.255910873413086, "global_step": 169123, "epoch": 2037} {"train_loss": -23.664918899536133, "global_step": 169124, "epoch": 2037} {"train_loss": -23.8778018951416, "global_step": 169125, "epoch": 2037} {"train_loss": -24.099151611328125, "global_step": 169126, "epoch": 2037} {"train_loss": -23.869972229003906, "global_step": 169127, "epoch": 2037} {"train_loss": -23.62779426574707, "global_step": 169128, "epoch": 2037} {"train_loss": -23.90687370300293, "global_step": 169129, "epoch": 2037} {"train_loss": -23.931970596313477, "global_step": 169130, "epoch": 2037} {"train_loss": -23.913503646850586, "global_step": 169131, "epoch": 2037} {"train_loss": -23.85624885559082, "global_step": 169132, "epoch": 2037} {"train_loss": -23.527179718017578, "global_step": 169133, "epoch": 2037} {"train_loss": -23.41843605041504, "global_step": 169134, "epoch": 2037} {"train_loss": -23.28224754333496, "global_step": 169135, "epoch": 2037} {"train_loss": -22.89003562927246, "global_step": 169136, "epoch": 2037} {"train_loss": -23.181243896484375, "global_step": 169137, "epoch": 2037} {"train_loss": -23.272258758544922, "global_step": 169138, "epoch": 2037} {"train_loss": -23.481204986572266, "global_step": 169139, "epoch": 2037} {"train_loss": -23.384017944335938, "global_step": 169140, "epoch": 2037} {"train_loss": -23.446083068847656, "global_step": 169141, "epoch": 2037} {"train_loss": -23.969696044921875, "global_step": 169142, "epoch": 2037} {"train_loss": -23.887027740478516, "global_step": 169143, "epoch": 2037} {"train_loss": -23.352025985717773, "global_step": 169144, "epoch": 2037} {"train_loss": -23.685884475708008, "global_step": 169145, "epoch": 2037} {"train_loss": -23.622867584228516, "global_step": 169146, "epoch": 2037} {"train_loss": -23.635374069213867, "global_step": 169147, "epoch": 2037} {"train_loss": -23.453269958496094, "global_step": 169148, "epoch": 2037} {"train_loss": -23.793773651123047, "global_step": 169149, "epoch": 2037} {"train_loss": -23.84410285949707, "global_step": 169150, "epoch": 2037} {"train_loss": -23.171234130859375, "global_step": 169151, "epoch": 2037} {"train_loss": -23.717514038085938, "global_step": 169152, "epoch": 2037} {"train_loss": -23.559975543654108, "global_step": 169153, "epoch": 2037, "val_loss": 6522317.0} {"train_loss": -22.8099365234375, "global_step": 169154, "epoch": 2038} {"train_loss": -23.527585983276367, "global_step": 169155, "epoch": 2038} {"train_loss": -22.95503044128418, "global_step": 169156, "epoch": 2038} {"train_loss": -23.193035125732422, "global_step": 169157, "epoch": 2038} {"train_loss": -23.364715576171875, "global_step": 169158, "epoch": 2038} {"train_loss": -23.25004005432129, "global_step": 169159, "epoch": 2038} {"train_loss": -23.04616355895996, "global_step": 169160, "epoch": 2038} {"train_loss": -23.611263275146484, "global_step": 169161, "epoch": 2038} {"train_loss": -23.272111892700195, "global_step": 169162, "epoch": 2038} {"train_loss": -23.52077293395996, "global_step": 169163, "epoch": 2038} {"train_loss": -23.54473876953125, "global_step": 169164, "epoch": 2038} {"train_loss": -23.458141326904297, "global_step": 169165, "epoch": 2038} {"train_loss": -23.58663558959961, "global_step": 169166, "epoch": 2038} {"train_loss": -23.81808853149414, "global_step": 169167, "epoch": 2038} {"train_loss": -23.966447830200195, "global_step": 169168, "epoch": 2038} {"train_loss": -23.773435592651367, "global_step": 169169, "epoch": 2038} {"train_loss": -23.5737361907959, "global_step": 169170, "epoch": 2038} {"train_loss": -23.793603897094727, "global_step": 169171, "epoch": 2038} {"train_loss": -23.68511390686035, "global_step": 169172, "epoch": 2038} {"train_loss": -23.77311897277832, "global_step": 169173, "epoch": 2038} {"train_loss": -23.809354782104492, "global_step": 169174, "epoch": 2038} {"train_loss": -23.421512603759766, "global_step": 169175, "epoch": 2038} {"train_loss": -23.582937240600586, "global_step": 169176, "epoch": 2038} {"train_loss": -23.934589385986328, "global_step": 169177, "epoch": 2038} {"train_loss": -23.789077758789062, "global_step": 169178, "epoch": 2038} {"train_loss": -24.010122299194336, "global_step": 169179, "epoch": 2038} {"train_loss": -23.396745681762695, "global_step": 169180, "epoch": 2038} {"train_loss": -23.52558708190918, "global_step": 169181, "epoch": 2038} {"train_loss": -23.931865692138672, "global_step": 169182, "epoch": 2038} {"train_loss": -23.53519630432129, "global_step": 169183, "epoch": 2038} {"train_loss": -23.803817749023438, "global_step": 169184, "epoch": 2038} {"train_loss": -23.757526397705078, "global_step": 169185, "epoch": 2038} {"train_loss": -23.43763542175293, "global_step": 169186, "epoch": 2038} {"train_loss": -23.939350128173828, "global_step": 169187, "epoch": 2038} {"train_loss": -23.225650787353516, "global_step": 169188, "epoch": 2038} {"train_loss": -23.566028594970703, "global_step": 169189, "epoch": 2038} {"train_loss": -23.98641014099121, "global_step": 169190, "epoch": 2038} {"train_loss": -23.394460678100586, "global_step": 169191, "epoch": 2038} {"train_loss": -23.912954330444336, "global_step": 169192, "epoch": 2038} {"train_loss": -23.562440872192383, "global_step": 169193, "epoch": 2038} {"train_loss": -23.644527435302734, "global_step": 169194, "epoch": 2038} {"train_loss": -23.819442749023438, "global_step": 169195, "epoch": 2038} {"train_loss": -23.46414566040039, "global_step": 169196, "epoch": 2038} {"train_loss": -23.982206344604492, "global_step": 169197, "epoch": 2038} {"train_loss": -24.110300064086914, "global_step": 169198, "epoch": 2038} {"train_loss": -23.5772647857666, "global_step": 169199, "epoch": 2038} {"train_loss": -23.543127059936523, "global_step": 169200, "epoch": 2038} {"train_loss": -23.653905868530273, "global_step": 169201, "epoch": 2038} {"train_loss": -23.648029327392578, "global_step": 169202, "epoch": 2038} {"train_loss": -23.69181251525879, "global_step": 169203, "epoch": 2038} {"train_loss": -23.90567398071289, "global_step": 169204, "epoch": 2038} {"train_loss": -23.950420379638672, "global_step": 169205, "epoch": 2038} {"train_loss": -24.066810607910156, "global_step": 169206, "epoch": 2038} {"train_loss": -23.710874557495117, "global_step": 169207, "epoch": 2038} {"train_loss": -23.42024803161621, "global_step": 169208, "epoch": 2038} {"train_loss": -24.052417755126953, "global_step": 169209, "epoch": 2038} {"train_loss": -23.682876586914062, "global_step": 169210, "epoch": 2038} {"train_loss": -23.747425079345703, "global_step": 169211, "epoch": 2038} {"train_loss": -23.77253532409668, "global_step": 169212, "epoch": 2038} {"train_loss": -23.59023094177246, "global_step": 169213, "epoch": 2038} {"train_loss": -24.018388748168945, "global_step": 169214, "epoch": 2038} {"train_loss": -24.179643630981445, "global_step": 169215, "epoch": 2038} {"train_loss": -23.915666580200195, "global_step": 169216, "epoch": 2038} {"train_loss": -23.64798355102539, "global_step": 169217, "epoch": 2038} {"train_loss": -23.708066940307617, "global_step": 169218, "epoch": 2038} {"train_loss": -23.53334617614746, "global_step": 169219, "epoch": 2038} {"train_loss": -23.671899795532227, "global_step": 169220, "epoch": 2038} {"train_loss": -23.492416381835938, "global_step": 169221, "epoch": 2038} {"train_loss": -23.68035888671875, "global_step": 169222, "epoch": 2038} {"train_loss": -23.704330444335938, "global_step": 169223, "epoch": 2038} {"train_loss": -23.77166175842285, "global_step": 169224, "epoch": 2038} {"train_loss": -23.47260856628418, "global_step": 169225, "epoch": 2038} {"train_loss": -23.67485809326172, "global_step": 169226, "epoch": 2038} {"train_loss": -23.120914459228516, "global_step": 169227, "epoch": 2038} {"train_loss": -23.2691650390625, "global_step": 169228, "epoch": 2038} {"train_loss": -23.10181999206543, "global_step": 169229, "epoch": 2038} {"train_loss": -23.38841438293457, "global_step": 169230, "epoch": 2038} {"train_loss": -23.493350982666016, "global_step": 169231, "epoch": 2038} {"train_loss": -23.548358917236328, "global_step": 169232, "epoch": 2038} {"train_loss": -23.287368774414062, "global_step": 169233, "epoch": 2038} {"train_loss": -23.391599655151367, "global_step": 169234, "epoch": 2038} {"train_loss": -23.842222213745117, "global_step": 169235, "epoch": 2038} {"train_loss": -23.617461859461773, "global_step": 169236, "epoch": 2038, "val_loss": 6386134.5} {"train_loss": -23.499526977539062, "global_step": 169237, "epoch": 2039} {"train_loss": -23.270492553710938, "global_step": 169238, "epoch": 2039} {"train_loss": -22.956586837768555, "global_step": 169239, "epoch": 2039} {"train_loss": -23.346271514892578, "global_step": 169240, "epoch": 2039} {"train_loss": -23.42349624633789, "global_step": 169241, "epoch": 2039} {"train_loss": -23.361665725708008, "global_step": 169242, "epoch": 2039} {"train_loss": -23.249755859375, "global_step": 169243, "epoch": 2039} {"train_loss": -23.094026565551758, "global_step": 169244, "epoch": 2039} {"train_loss": -23.46840476989746, "global_step": 169245, "epoch": 2039} {"train_loss": -23.810317993164062, "global_step": 169246, "epoch": 2039} {"train_loss": -23.65688133239746, "global_step": 169247, "epoch": 2039} {"train_loss": -23.944852828979492, "global_step": 169248, "epoch": 2039} {"train_loss": -23.645936965942383, "global_step": 169249, "epoch": 2039} {"train_loss": -23.140199661254883, "global_step": 169250, "epoch": 2039} {"train_loss": -23.739835739135742, "global_step": 169251, "epoch": 2039} {"train_loss": -23.411273956298828, "global_step": 169252, "epoch": 2039} {"train_loss": -23.631315231323242, "global_step": 169253, "epoch": 2039} {"train_loss": -23.477109909057617, "global_step": 169254, "epoch": 2039} {"train_loss": -23.71195411682129, "global_step": 169255, "epoch": 2039} {"train_loss": -23.728662490844727, "global_step": 169256, "epoch": 2039} {"train_loss": -23.78436851501465, "global_step": 169257, "epoch": 2039} {"train_loss": -23.686813354492188, "global_step": 169258, "epoch": 2039} {"train_loss": -23.35215187072754, "global_step": 169259, "epoch": 2039} {"train_loss": -23.5389461517334, "global_step": 169260, "epoch": 2039} {"train_loss": -23.256032943725586, "global_step": 169261, "epoch": 2039} {"train_loss": -23.40432357788086, "global_step": 169262, "epoch": 2039} {"train_loss": -23.895048141479492, "global_step": 169263, "epoch": 2039} {"train_loss": -23.074504852294922, "global_step": 169264, "epoch": 2039} {"train_loss": -23.2804012298584, "global_step": 169265, "epoch": 2039} {"train_loss": -24.020475387573242, "global_step": 169266, "epoch": 2039} {"train_loss": -23.70979881286621, "global_step": 169267, "epoch": 2039} {"train_loss": -23.607606887817383, "global_step": 169268, "epoch": 2039} {"train_loss": -23.65437126159668, "global_step": 169269, "epoch": 2039} {"train_loss": -23.683080673217773, "global_step": 169270, "epoch": 2039} {"train_loss": -23.586238861083984, "global_step": 169271, "epoch": 2039} {"train_loss": -23.56953239440918, "global_step": 169272, "epoch": 2039} {"train_loss": -23.39478302001953, "global_step": 169273, "epoch": 2039} {"train_loss": -23.281774520874023, "global_step": 169274, "epoch": 2039} {"train_loss": -23.377445220947266, "global_step": 169275, "epoch": 2039} {"train_loss": -23.583669662475586, "global_step": 169276, "epoch": 2039} {"train_loss": -23.723337173461914, "global_step": 169277, "epoch": 2039} {"train_loss": -23.27711296081543, "global_step": 169278, "epoch": 2039} {"train_loss": -23.7261962890625, "global_step": 169279, "epoch": 2039} {"train_loss": -23.306232452392578, "global_step": 169280, "epoch": 2039} {"train_loss": -23.69862937927246, "global_step": 169281, "epoch": 2039} {"train_loss": -23.593542098999023, "global_step": 169282, "epoch": 2039} {"train_loss": -23.841083526611328, "global_step": 169283, "epoch": 2039} {"train_loss": -23.878049850463867, "global_step": 169284, "epoch": 2039} {"train_loss": -23.503515243530273, "global_step": 169285, "epoch": 2039} {"train_loss": -23.77828025817871, "global_step": 169286, "epoch": 2039} {"train_loss": -23.805570602416992, "global_step": 169287, "epoch": 2039} {"train_loss": -23.59561538696289, "global_step": 169288, "epoch": 2039} {"train_loss": -23.513578414916992, "global_step": 169289, "epoch": 2039} {"train_loss": -23.739248275756836, "global_step": 169290, "epoch": 2039} {"train_loss": -23.718244552612305, "global_step": 169291, "epoch": 2039} {"train_loss": -23.52029037475586, "global_step": 169292, "epoch": 2039} {"train_loss": -23.423744201660156, "global_step": 169293, "epoch": 2039} {"train_loss": -23.9137020111084, "global_step": 169294, "epoch": 2039} {"train_loss": -23.86671257019043, "global_step": 169295, "epoch": 2039} {"train_loss": -23.63057518005371, "global_step": 169296, "epoch": 2039} {"train_loss": -23.8194580078125, "global_step": 169297, "epoch": 2039} {"train_loss": -24.16473388671875, "global_step": 169298, "epoch": 2039} {"train_loss": -23.591184616088867, "global_step": 169299, "epoch": 2039} {"train_loss": -23.821985244750977, "global_step": 169300, "epoch": 2039} {"train_loss": -23.671533584594727, "global_step": 169301, "epoch": 2039} {"train_loss": -23.708402633666992, "global_step": 169302, "epoch": 2039} {"train_loss": -23.57767105102539, "global_step": 169303, "epoch": 2039} {"train_loss": -23.70900535583496, "global_step": 169304, "epoch": 2039} {"train_loss": -23.686548233032227, "global_step": 169305, "epoch": 2039} {"train_loss": -23.663902282714844, "global_step": 169306, "epoch": 2039} {"train_loss": -23.593128204345703, "global_step": 169307, "epoch": 2039} {"train_loss": -23.87940788269043, "global_step": 169308, "epoch": 2039} {"train_loss": -23.650915145874023, "global_step": 169309, "epoch": 2039} {"train_loss": -23.84111785888672, "global_step": 169310, "epoch": 2039} {"train_loss": -23.784093856811523, "global_step": 169311, "epoch": 2039} {"train_loss": -23.796049118041992, "global_step": 169312, "epoch": 2039} {"train_loss": -23.729568481445312, "global_step": 169313, "epoch": 2039} {"train_loss": -23.339746475219727, "global_step": 169314, "epoch": 2039} {"train_loss": -23.592077255249023, "global_step": 169315, "epoch": 2039} {"train_loss": -23.757694244384766, "global_step": 169316, "epoch": 2039} {"train_loss": -23.335229873657227, "global_step": 169317, "epoch": 2039} {"train_loss": -23.896604537963867, "global_step": 169318, "epoch": 2039} {"train_loss": -23.597371526511317, "global_step": 169319, "epoch": 2039, "val_loss": 6390251.0} {"train_loss": -23.77798843383789, "global_step": 169320, "epoch": 2040} {"train_loss": -23.789045333862305, "global_step": 169321, "epoch": 2040} {"train_loss": -23.61552619934082, "global_step": 169322, "epoch": 2040} {"train_loss": -23.617366790771484, "global_step": 169323, "epoch": 2040} {"train_loss": -23.396970748901367, "global_step": 169324, "epoch": 2040} {"train_loss": -23.840314865112305, "global_step": 169325, "epoch": 2040} {"train_loss": -23.620046615600586, "global_step": 169326, "epoch": 2040} {"train_loss": -23.829130172729492, "global_step": 169327, "epoch": 2040} {"train_loss": -23.772642135620117, "global_step": 169328, "epoch": 2040} {"train_loss": -23.974288940429688, "global_step": 169329, "epoch": 2040} {"train_loss": -23.782087326049805, "global_step": 169330, "epoch": 2040} {"train_loss": -23.739450454711914, "global_step": 169331, "epoch": 2040} {"train_loss": -23.772733688354492, "global_step": 169332, "epoch": 2040} {"train_loss": -23.927946090698242, "global_step": 169333, "epoch": 2040} {"train_loss": -23.415342330932617, "global_step": 169334, "epoch": 2040} {"train_loss": -23.48487663269043, "global_step": 169335, "epoch": 2040} {"train_loss": -23.532621383666992, "global_step": 169336, "epoch": 2040} {"train_loss": -23.412845611572266, "global_step": 169337, "epoch": 2040} {"train_loss": -23.8456974029541, "global_step": 169338, "epoch": 2040} {"train_loss": -23.794095993041992, "global_step": 169339, "epoch": 2040} {"train_loss": -23.908409118652344, "global_step": 169340, "epoch": 2040} {"train_loss": -23.7161865234375, "global_step": 169341, "epoch": 2040} {"train_loss": -23.854501724243164, "global_step": 169342, "epoch": 2040} {"train_loss": -23.990461349487305, "global_step": 169343, "epoch": 2040} {"train_loss": -23.856231689453125, "global_step": 169344, "epoch": 2040} {"train_loss": -23.922840118408203, "global_step": 169345, "epoch": 2040} {"train_loss": -23.614736557006836, "global_step": 169346, "epoch": 2040} {"train_loss": -23.630718231201172, "global_step": 169347, "epoch": 2040} {"train_loss": -23.514379501342773, "global_step": 169348, "epoch": 2040} {"train_loss": -23.63652992248535, "global_step": 169349, "epoch": 2040} {"train_loss": -23.70454978942871, "global_step": 169350, "epoch": 2040} {"train_loss": -23.627534866333008, "global_step": 169351, "epoch": 2040} {"train_loss": -23.831125259399414, "global_step": 169352, "epoch": 2040} {"train_loss": -23.59919548034668, "global_step": 169353, "epoch": 2040} {"train_loss": -23.657732009887695, "global_step": 169354, "epoch": 2040} {"train_loss": -23.57907485961914, "global_step": 169355, "epoch": 2040} {"train_loss": -23.589662551879883, "global_step": 169356, "epoch": 2040} {"train_loss": -23.63583755493164, "global_step": 169357, "epoch": 2040} {"train_loss": -23.64491081237793, "global_step": 169358, "epoch": 2040} {"train_loss": -23.773883819580078, "global_step": 169359, "epoch": 2040} {"train_loss": -23.747539520263672, "global_step": 169360, "epoch": 2040} {"train_loss": -23.379621505737305, "global_step": 169361, "epoch": 2040} {"train_loss": -24.159555435180664, "global_step": 169362, "epoch": 2040} {"train_loss": -24.27595329284668, "global_step": 169363, "epoch": 2040} {"train_loss": -23.960468292236328, "global_step": 169364, "epoch": 2040} {"train_loss": -24.1297607421875, "global_step": 169365, "epoch": 2040} {"train_loss": -23.774169921875, "global_step": 169366, "epoch": 2040} {"train_loss": -23.87880516052246, "global_step": 169367, "epoch": 2040} {"train_loss": -23.907855987548828, "global_step": 169368, "epoch": 2040} {"train_loss": -23.863779067993164, "global_step": 169369, "epoch": 2040} {"train_loss": -23.559247970581055, "global_step": 169370, "epoch": 2040} {"train_loss": -23.646211624145508, "global_step": 169371, "epoch": 2040} {"train_loss": -23.503183364868164, "global_step": 169372, "epoch": 2040} {"train_loss": -24.08436393737793, "global_step": 169373, "epoch": 2040} {"train_loss": -23.853193283081055, "global_step": 169374, "epoch": 2040} {"train_loss": -23.770265579223633, "global_step": 169375, "epoch": 2040} {"train_loss": -23.55902099609375, "global_step": 169376, "epoch": 2040} {"train_loss": -23.740367889404297, "global_step": 169377, "epoch": 2040} {"train_loss": -24.07159423828125, "global_step": 169378, "epoch": 2040} {"train_loss": -23.67690086364746, "global_step": 169379, "epoch": 2040} {"train_loss": -23.588333129882812, "global_step": 169380, "epoch": 2040} {"train_loss": -23.797815322875977, "global_step": 169381, "epoch": 2040} {"train_loss": -23.37489891052246, "global_step": 169382, "epoch": 2040} {"train_loss": -23.478370666503906, "global_step": 169383, "epoch": 2040} {"train_loss": -23.572790145874023, "global_step": 169384, "epoch": 2040} {"train_loss": -23.8684024810791, "global_step": 169385, "epoch": 2040} {"train_loss": -23.81488609313965, "global_step": 169386, "epoch": 2040} {"train_loss": -24.072574615478516, "global_step": 169387, "epoch": 2040} {"train_loss": -23.667583465576172, "global_step": 169388, "epoch": 2040} {"train_loss": -23.6555233001709, "global_step": 169389, "epoch": 2040} {"train_loss": -23.47242546081543, "global_step": 169390, "epoch": 2040} {"train_loss": -23.819843292236328, "global_step": 169391, "epoch": 2040} {"train_loss": -23.860687255859375, "global_step": 169392, "epoch": 2040} {"train_loss": -23.874441146850586, "global_step": 169393, "epoch": 2040} {"train_loss": -23.89573097229004, "global_step": 169394, "epoch": 2040} {"train_loss": -23.738866806030273, "global_step": 169395, "epoch": 2040} {"train_loss": -23.952980041503906, "global_step": 169396, "epoch": 2040} {"train_loss": -23.473413467407227, "global_step": 169397, "epoch": 2040} {"train_loss": -23.4730224609375, "global_step": 169398, "epoch": 2040} {"train_loss": -23.780990600585938, "global_step": 169399, "epoch": 2040} {"train_loss": -23.738264083862305, "global_step": 169400, "epoch": 2040} {"train_loss": -23.637075424194336, "global_step": 169401, "epoch": 2040} {"train_loss": -23.732432721609094, "global_step": 169402, "epoch": 2040, "val_loss": 6438830.0} {"train_loss": -22.444433212280273, "global_step": 169403, "epoch": 2041} {"train_loss": -22.855459213256836, "global_step": 169404, "epoch": 2041} {"train_loss": -22.806116104125977, "global_step": 169405, "epoch": 2041} {"train_loss": -22.643089294433594, "global_step": 169406, "epoch": 2041} {"train_loss": -23.333051681518555, "global_step": 169407, "epoch": 2041} {"train_loss": -22.361989974975586, "global_step": 169408, "epoch": 2041} {"train_loss": -22.777437210083008, "global_step": 169409, "epoch": 2041} {"train_loss": -23.220998764038086, "global_step": 169410, "epoch": 2041} {"train_loss": -23.229185104370117, "global_step": 169411, "epoch": 2041} {"train_loss": -23.59828758239746, "global_step": 169412, "epoch": 2041} {"train_loss": -23.242408752441406, "global_step": 169413, "epoch": 2041} {"train_loss": -23.63147735595703, "global_step": 169414, "epoch": 2041} {"train_loss": -23.49656867980957, "global_step": 169415, "epoch": 2041} {"train_loss": -23.166051864624023, "global_step": 169416, "epoch": 2041} {"train_loss": -23.29719352722168, "global_step": 169417, "epoch": 2041} {"train_loss": -23.3475341796875, "global_step": 169418, "epoch": 2041} {"train_loss": -23.408205032348633, "global_step": 169419, "epoch": 2041} {"train_loss": -23.115774154663086, "global_step": 169420, "epoch": 2041} {"train_loss": -23.85658073425293, "global_step": 169421, "epoch": 2041} {"train_loss": -23.62268829345703, "global_step": 169422, "epoch": 2041} {"train_loss": -23.38006591796875, "global_step": 169423, "epoch": 2041} {"train_loss": -23.1651668548584, "global_step": 169424, "epoch": 2041} {"train_loss": -23.762828826904297, "global_step": 169425, "epoch": 2041} {"train_loss": -23.948862075805664, "global_step": 169426, "epoch": 2041} {"train_loss": -23.82508087158203, "global_step": 169427, "epoch": 2041} {"train_loss": -23.790454864501953, "global_step": 169428, "epoch": 2041} {"train_loss": -23.74992561340332, "global_step": 169429, "epoch": 2041} {"train_loss": -23.70256233215332, "global_step": 169430, "epoch": 2041} {"train_loss": -23.5057373046875, "global_step": 169431, "epoch": 2041} {"train_loss": -23.817089080810547, "global_step": 169432, "epoch": 2041} {"train_loss": -23.571590423583984, "global_step": 169433, "epoch": 2041} {"train_loss": -23.823034286499023, "global_step": 169434, "epoch": 2041} {"train_loss": -23.560287475585938, "global_step": 169435, "epoch": 2041} {"train_loss": -23.72812271118164, "global_step": 169436, "epoch": 2041} {"train_loss": -23.506858825683594, "global_step": 169437, "epoch": 2041} {"train_loss": -23.71422004699707, "global_step": 169438, "epoch": 2041} {"train_loss": -23.67234230041504, "global_step": 169439, "epoch": 2041} {"train_loss": -23.443164825439453, "global_step": 169440, "epoch": 2041} {"train_loss": -23.75682258605957, "global_step": 169441, "epoch": 2041} {"train_loss": -23.562522888183594, "global_step": 169442, "epoch": 2041} {"train_loss": -23.43299674987793, "global_step": 169443, "epoch": 2041} {"train_loss": -23.945974349975586, "global_step": 169444, "epoch": 2041} {"train_loss": -23.623563766479492, "global_step": 169445, "epoch": 2041} {"train_loss": -23.83887481689453, "global_step": 169446, "epoch": 2041} {"train_loss": -23.689220428466797, "global_step": 169447, "epoch": 2041} {"train_loss": -23.857587814331055, "global_step": 169448, "epoch": 2041} {"train_loss": -24.178617477416992, "global_step": 169449, "epoch": 2041} {"train_loss": -23.819568634033203, "global_step": 169450, "epoch": 2041} {"train_loss": -23.655813217163086, "global_step": 169451, "epoch": 2041} {"train_loss": -23.90961265563965, "global_step": 169452, "epoch": 2041} {"train_loss": -23.87563705444336, "global_step": 169453, "epoch": 2041} {"train_loss": -23.76993751525879, "global_step": 169454, "epoch": 2041} {"train_loss": -23.72303581237793, "global_step": 169455, "epoch": 2041} {"train_loss": -24.107938766479492, "global_step": 169456, "epoch": 2041} {"train_loss": -23.501840591430664, "global_step": 169457, "epoch": 2041} {"train_loss": -23.567594528198242, "global_step": 169458, "epoch": 2041} {"train_loss": -23.917325973510742, "global_step": 169459, "epoch": 2041} {"train_loss": -23.571054458618164, "global_step": 169460, "epoch": 2041} {"train_loss": -23.698328018188477, "global_step": 169461, "epoch": 2041} {"train_loss": -23.855182647705078, "global_step": 169462, "epoch": 2041} {"train_loss": -23.76144790649414, "global_step": 169463, "epoch": 2041} {"train_loss": -23.539548873901367, "global_step": 169464, "epoch": 2041} {"train_loss": -23.523046493530273, "global_step": 169465, "epoch": 2041} {"train_loss": -23.879764556884766, "global_step": 169466, "epoch": 2041} {"train_loss": -23.575603485107422, "global_step": 169467, "epoch": 2041} {"train_loss": -23.5611572265625, "global_step": 169468, "epoch": 2041} {"train_loss": -23.634920120239258, "global_step": 169469, "epoch": 2041} {"train_loss": -23.62101936340332, "global_step": 169470, "epoch": 2041} {"train_loss": -24.025426864624023, "global_step": 169471, "epoch": 2041} {"train_loss": -23.46236228942871, "global_step": 169472, "epoch": 2041} {"train_loss": -23.300369262695312, "global_step": 169473, "epoch": 2041} {"train_loss": -23.59078025817871, "global_step": 169474, "epoch": 2041} {"train_loss": -23.251188278198242, "global_step": 169475, "epoch": 2041} {"train_loss": -23.48280906677246, "global_step": 169476, "epoch": 2041} {"train_loss": -23.2482967376709, "global_step": 169477, "epoch": 2041} {"train_loss": -22.9426326751709, "global_step": 169478, "epoch": 2041} {"train_loss": -23.788902282714844, "global_step": 169479, "epoch": 2041} {"train_loss": -23.342649459838867, "global_step": 169480, "epoch": 2041} {"train_loss": -23.53925895690918, "global_step": 169481, "epoch": 2041} {"train_loss": -23.309629440307617, "global_step": 169482, "epoch": 2041} {"train_loss": -23.363622665405273, "global_step": 169483, "epoch": 2041} {"train_loss": -23.721054077148438, "global_step": 169484, "epoch": 2041} {"train_loss": -23.514318259365588, "global_step": 169485, "epoch": 2041, "val_loss": 6448867.5} {"train_loss": -23.15496253967285, "global_step": 169486, "epoch": 2042} {"train_loss": -23.014440536499023, "global_step": 169487, "epoch": 2042} {"train_loss": -23.144611358642578, "global_step": 169488, "epoch": 2042} {"train_loss": -22.715070724487305, "global_step": 169489, "epoch": 2042} {"train_loss": -22.849712371826172, "global_step": 169490, "epoch": 2042} {"train_loss": -22.879379272460938, "global_step": 169491, "epoch": 2042} {"train_loss": -23.41118812561035, "global_step": 169492, "epoch": 2042} {"train_loss": -22.865205764770508, "global_step": 169493, "epoch": 2042} {"train_loss": -23.340707778930664, "global_step": 169494, "epoch": 2042} {"train_loss": -23.2207088470459, "global_step": 169495, "epoch": 2042} {"train_loss": -23.395933151245117, "global_step": 169496, "epoch": 2042} {"train_loss": -23.3232364654541, "global_step": 169497, "epoch": 2042} {"train_loss": -22.83039665222168, "global_step": 169498, "epoch": 2042} {"train_loss": -23.386173248291016, "global_step": 169499, "epoch": 2042} {"train_loss": -23.121442794799805, "global_step": 169500, "epoch": 2042} {"train_loss": -23.106502532958984, "global_step": 169501, "epoch": 2042} {"train_loss": -23.277997970581055, "global_step": 169502, "epoch": 2042} {"train_loss": -23.620817184448242, "global_step": 169503, "epoch": 2042} {"train_loss": -23.171693801879883, "global_step": 169504, "epoch": 2042} {"train_loss": -23.41733741760254, "global_step": 169505, "epoch": 2042} {"train_loss": -23.32699966430664, "global_step": 169506, "epoch": 2042} {"train_loss": -23.12744140625, "global_step": 169507, "epoch": 2042} {"train_loss": -23.294811248779297, "global_step": 169508, "epoch": 2042} {"train_loss": -23.548707962036133, "global_step": 169509, "epoch": 2042} {"train_loss": -23.462852478027344, "global_step": 169510, "epoch": 2042} {"train_loss": -23.714513778686523, "global_step": 169511, "epoch": 2042} {"train_loss": -23.531415939331055, "global_step": 169512, "epoch": 2042} {"train_loss": -23.915998458862305, "global_step": 169513, "epoch": 2042} {"train_loss": -23.269939422607422, "global_step": 169514, "epoch": 2042} {"train_loss": -23.680843353271484, "global_step": 169515, "epoch": 2042} {"train_loss": -22.975156784057617, "global_step": 169516, "epoch": 2042} {"train_loss": -23.56616973876953, "global_step": 169517, "epoch": 2042} {"train_loss": -23.51763343811035, "global_step": 169518, "epoch": 2042} {"train_loss": -23.425765991210938, "global_step": 169519, "epoch": 2042} {"train_loss": -23.914247512817383, "global_step": 169520, "epoch": 2042} {"train_loss": -23.813552856445312, "global_step": 169521, "epoch": 2042} {"train_loss": -23.40327262878418, "global_step": 169522, "epoch": 2042} {"train_loss": -23.70267677307129, "global_step": 169523, "epoch": 2042} {"train_loss": -23.85516929626465, "global_step": 169524, "epoch": 2042} {"train_loss": -23.929433822631836, "global_step": 169525, "epoch": 2042} {"train_loss": -23.884756088256836, "global_step": 169526, "epoch": 2042} {"train_loss": -23.989519119262695, "global_step": 169527, "epoch": 2042} {"train_loss": -23.364822387695312, "global_step": 169528, "epoch": 2042} {"train_loss": -23.91059112548828, "global_step": 169529, "epoch": 2042} {"train_loss": -23.843812942504883, "global_step": 169530, "epoch": 2042} {"train_loss": -23.31031608581543, "global_step": 169531, "epoch": 2042} {"train_loss": -23.605920791625977, "global_step": 169532, "epoch": 2042} {"train_loss": -23.776432037353516, "global_step": 169533, "epoch": 2042} {"train_loss": -23.461257934570312, "global_step": 169534, "epoch": 2042} {"train_loss": -23.781919479370117, "global_step": 169535, "epoch": 2042} {"train_loss": -23.680761337280273, "global_step": 169536, "epoch": 2042} {"train_loss": -23.88619041442871, "global_step": 169537, "epoch": 2042} {"train_loss": -23.36638832092285, "global_step": 169538, "epoch": 2042} {"train_loss": -23.59185791015625, "global_step": 169539, "epoch": 2042} {"train_loss": -23.64258575439453, "global_step": 169540, "epoch": 2042} {"train_loss": -23.863954544067383, "global_step": 169541, "epoch": 2042} {"train_loss": -23.569204330444336, "global_step": 169542, "epoch": 2042} {"train_loss": -23.731103897094727, "global_step": 169543, "epoch": 2042} {"train_loss": -23.88384437561035, "global_step": 169544, "epoch": 2042} {"train_loss": -23.643985748291016, "global_step": 169545, "epoch": 2042} {"train_loss": -23.767629623413086, "global_step": 169546, "epoch": 2042} {"train_loss": -23.813405990600586, "global_step": 169547, "epoch": 2042} {"train_loss": -23.812726974487305, "global_step": 169548, "epoch": 2042} {"train_loss": -24.12017250061035, "global_step": 169549, "epoch": 2042} {"train_loss": -23.56496238708496, "global_step": 169550, "epoch": 2042} {"train_loss": -23.91193962097168, "global_step": 169551, "epoch": 2042} {"train_loss": -23.501035690307617, "global_step": 169552, "epoch": 2042} {"train_loss": -23.732192993164062, "global_step": 169553, "epoch": 2042} {"train_loss": -23.807851791381836, "global_step": 169554, "epoch": 2042} {"train_loss": -23.7938232421875, "global_step": 169555, "epoch": 2042} {"train_loss": -23.60743522644043, "global_step": 169556, "epoch": 2042} {"train_loss": -23.49318504333496, "global_step": 169557, "epoch": 2042} {"train_loss": -23.767568588256836, "global_step": 169558, "epoch": 2042} {"train_loss": -23.570302963256836, "global_step": 169559, "epoch": 2042} {"train_loss": -24.162450790405273, "global_step": 169560, "epoch": 2042} {"train_loss": -23.548933029174805, "global_step": 169561, "epoch": 2042} {"train_loss": -23.884857177734375, "global_step": 169562, "epoch": 2042} {"train_loss": -23.59430503845215, "global_step": 169563, "epoch": 2042} {"train_loss": -23.66531753540039, "global_step": 169564, "epoch": 2042} {"train_loss": -23.710134506225586, "global_step": 169565, "epoch": 2042} {"train_loss": -24.079429626464844, "global_step": 169566, "epoch": 2042} {"train_loss": -23.610021591186523, "global_step": 169567, "epoch": 2042} {"train_loss": -23.526994544339466, "global_step": 169568, "epoch": 2042, "val_loss": 6418675.0} {"train_loss": -23.420223236083984, "global_step": 169569, "epoch": 2043} {"train_loss": -23.421985626220703, "global_step": 169570, "epoch": 2043} {"train_loss": -23.41517448425293, "global_step": 169571, "epoch": 2043} {"train_loss": -23.1616153717041, "global_step": 169572, "epoch": 2043} {"train_loss": -22.927753448486328, "global_step": 169573, "epoch": 2043} {"train_loss": -22.949939727783203, "global_step": 169574, "epoch": 2043} {"train_loss": -23.703367233276367, "global_step": 169575, "epoch": 2043} {"train_loss": -23.456775665283203, "global_step": 169576, "epoch": 2043} {"train_loss": -23.58467674255371, "global_step": 169577, "epoch": 2043} {"train_loss": -23.853443145751953, "global_step": 169578, "epoch": 2043} {"train_loss": -23.374908447265625, "global_step": 169579, "epoch": 2043} {"train_loss": -23.335067749023438, "global_step": 169580, "epoch": 2043} {"train_loss": -23.582569122314453, "global_step": 169581, "epoch": 2043} {"train_loss": -23.09258460998535, "global_step": 169582, "epoch": 2043} {"train_loss": -22.865583419799805, "global_step": 169583, "epoch": 2043} {"train_loss": -23.197006225585938, "global_step": 169584, "epoch": 2043} {"train_loss": -22.915071487426758, "global_step": 169585, "epoch": 2043} {"train_loss": -23.45637321472168, "global_step": 169586, "epoch": 2043} {"train_loss": -23.25469207763672, "global_step": 169587, "epoch": 2043} {"train_loss": -23.46107292175293, "global_step": 169588, "epoch": 2043} {"train_loss": -23.551469802856445, "global_step": 169589, "epoch": 2043} {"train_loss": -23.428831100463867, "global_step": 169590, "epoch": 2043} {"train_loss": -23.44007682800293, "global_step": 169591, "epoch": 2043} {"train_loss": -23.163320541381836, "global_step": 169592, "epoch": 2043} {"train_loss": -23.472352981567383, "global_step": 169593, "epoch": 2043} {"train_loss": -23.571130752563477, "global_step": 169594, "epoch": 2043} {"train_loss": -23.55622673034668, "global_step": 169595, "epoch": 2043} {"train_loss": -23.83595085144043, "global_step": 169596, "epoch": 2043} {"train_loss": -23.37652587890625, "global_step": 169597, "epoch": 2043} {"train_loss": -23.201313018798828, "global_step": 169598, "epoch": 2043} {"train_loss": -23.103145599365234, "global_step": 169599, "epoch": 2043} {"train_loss": -23.839017868041992, "global_step": 169600, "epoch": 2043} {"train_loss": -23.607450485229492, "global_step": 169601, "epoch": 2043} {"train_loss": -23.657812118530273, "global_step": 169602, "epoch": 2043} {"train_loss": -23.81560516357422, "global_step": 169603, "epoch": 2043} {"train_loss": -23.375417709350586, "global_step": 169604, "epoch": 2043} {"train_loss": -24.26468849182129, "global_step": 169605, "epoch": 2043} {"train_loss": -23.42007827758789, "global_step": 169606, "epoch": 2043} {"train_loss": -23.589527130126953, "global_step": 169607, "epoch": 2043} {"train_loss": -23.905920028686523, "global_step": 169608, "epoch": 2043} {"train_loss": -23.62752342224121, "global_step": 169609, "epoch": 2043} {"train_loss": -23.978443145751953, "global_step": 169610, "epoch": 2043} {"train_loss": -23.561248779296875, "global_step": 169611, "epoch": 2043} {"train_loss": -23.625486373901367, "global_step": 169612, "epoch": 2043} {"train_loss": -23.54139518737793, "global_step": 169613, "epoch": 2043} {"train_loss": -24.06060028076172, "global_step": 169614, "epoch": 2043} {"train_loss": -23.55373191833496, "global_step": 169615, "epoch": 2043} {"train_loss": -23.60365867614746, "global_step": 169616, "epoch": 2043} {"train_loss": -23.380691528320312, "global_step": 169617, "epoch": 2043} {"train_loss": -24.154226303100586, "global_step": 169618, "epoch": 2043} {"train_loss": -23.712844848632812, "global_step": 169619, "epoch": 2043} {"train_loss": -23.36969566345215, "global_step": 169620, "epoch": 2043} {"train_loss": -23.825809478759766, "global_step": 169621, "epoch": 2043} {"train_loss": -23.960651397705078, "global_step": 169622, "epoch": 2043} {"train_loss": -23.7613582611084, "global_step": 169623, "epoch": 2043} {"train_loss": -23.96433448791504, "global_step": 169624, "epoch": 2043} {"train_loss": -23.56366539001465, "global_step": 169625, "epoch": 2043} {"train_loss": -23.853994369506836, "global_step": 169626, "epoch": 2043} {"train_loss": -23.463459014892578, "global_step": 169627, "epoch": 2043} {"train_loss": -23.684904098510742, "global_step": 169628, "epoch": 2043} {"train_loss": -23.59580421447754, "global_step": 169629, "epoch": 2043} {"train_loss": -23.693735122680664, "global_step": 169630, "epoch": 2043} {"train_loss": -24.04840660095215, "global_step": 169631, "epoch": 2043} {"train_loss": -23.86844253540039, "global_step": 169632, "epoch": 2043} {"train_loss": -23.76610565185547, "global_step": 169633, "epoch": 2043} {"train_loss": -23.74289321899414, "global_step": 169634, "epoch": 2043} {"train_loss": -23.805662155151367, "global_step": 169635, "epoch": 2043} {"train_loss": -23.777555465698242, "global_step": 169636, "epoch": 2043} {"train_loss": -23.9782657623291, "global_step": 169637, "epoch": 2043} {"train_loss": -23.91048240661621, "global_step": 169638, "epoch": 2043} {"train_loss": -23.85833168029785, "global_step": 169639, "epoch": 2043} {"train_loss": -23.82967185974121, "global_step": 169640, "epoch": 2043} {"train_loss": -23.604223251342773, "global_step": 169641, "epoch": 2043} {"train_loss": -23.708295822143555, "global_step": 169642, "epoch": 2043} {"train_loss": -23.975988388061523, "global_step": 169643, "epoch": 2043} {"train_loss": -23.41604995727539, "global_step": 169644, "epoch": 2043} {"train_loss": -23.66538429260254, "global_step": 169645, "epoch": 2043} {"train_loss": -23.545555114746094, "global_step": 169646, "epoch": 2043} {"train_loss": -23.33941078186035, "global_step": 169647, "epoch": 2043} {"train_loss": -23.51394271850586, "global_step": 169648, "epoch": 2043} {"train_loss": -23.43665885925293, "global_step": 169649, "epoch": 2043} {"train_loss": -23.38226318359375, "global_step": 169650, "epoch": 2043} {"train_loss": -23.562370805855256, "global_step": 169651, "epoch": 2043, "val_loss": 6496777.0} {"train_loss": -23.318382263183594, "global_step": 169652, "epoch": 2044} {"train_loss": -23.198759078979492, "global_step": 169653, "epoch": 2044} {"train_loss": -23.640670776367188, "global_step": 169654, "epoch": 2044} {"train_loss": -22.93608856201172, "global_step": 169655, "epoch": 2044} {"train_loss": -23.45075225830078, "global_step": 169656, "epoch": 2044} {"train_loss": -22.911602020263672, "global_step": 169657, "epoch": 2044} {"train_loss": -23.35788345336914, "global_step": 169658, "epoch": 2044} {"train_loss": -23.67066764831543, "global_step": 169659, "epoch": 2044} {"train_loss": -23.077539443969727, "global_step": 169660, "epoch": 2044} {"train_loss": -23.408536911010742, "global_step": 169661, "epoch": 2044} {"train_loss": -23.303674697875977, "global_step": 169662, "epoch": 2044} {"train_loss": -23.2370662689209, "global_step": 169663, "epoch": 2044} {"train_loss": -23.288145065307617, "global_step": 169664, "epoch": 2044} {"train_loss": -23.356918334960938, "global_step": 169665, "epoch": 2044} {"train_loss": -23.383459091186523, "global_step": 169666, "epoch": 2044} {"train_loss": -23.604907989501953, "global_step": 169667, "epoch": 2044} {"train_loss": -23.317529678344727, "global_step": 169668, "epoch": 2044} {"train_loss": -23.354476928710938, "global_step": 169669, "epoch": 2044} {"train_loss": -23.74947166442871, "global_step": 169670, "epoch": 2044} {"train_loss": -23.508081436157227, "global_step": 169671, "epoch": 2044} {"train_loss": -23.50347328186035, "global_step": 169672, "epoch": 2044} {"train_loss": -23.8367977142334, "global_step": 169673, "epoch": 2044} {"train_loss": -23.2503604888916, "global_step": 169674, "epoch": 2044} {"train_loss": -23.875160217285156, "global_step": 169675, "epoch": 2044} {"train_loss": -23.36606788635254, "global_step": 169676, "epoch": 2044} {"train_loss": -23.701032638549805, "global_step": 169677, "epoch": 2044} {"train_loss": -24.08342933654785, "global_step": 169678, "epoch": 2044} {"train_loss": -23.829544067382812, "global_step": 169679, "epoch": 2044} {"train_loss": -23.586917877197266, "global_step": 169680, "epoch": 2044} {"train_loss": -23.741769790649414, "global_step": 169681, "epoch": 2044} {"train_loss": -23.920093536376953, "global_step": 169682, "epoch": 2044} {"train_loss": -23.318212509155273, "global_step": 169683, "epoch": 2044} {"train_loss": -23.64939308166504, "global_step": 169684, "epoch": 2044} {"train_loss": -23.62420082092285, "global_step": 169685, "epoch": 2044} {"train_loss": -23.59927749633789, "global_step": 169686, "epoch": 2044} {"train_loss": -23.473892211914062, "global_step": 169687, "epoch": 2044} {"train_loss": -23.51039695739746, "global_step": 169688, "epoch": 2044} {"train_loss": -23.737524032592773, "global_step": 169689, "epoch": 2044} {"train_loss": -23.83907699584961, "global_step": 169690, "epoch": 2044} {"train_loss": -23.75106430053711, "global_step": 169691, "epoch": 2044} {"train_loss": -23.875829696655273, "global_step": 169692, "epoch": 2044} {"train_loss": -23.739038467407227, "global_step": 169693, "epoch": 2044} {"train_loss": -23.94830894470215, "global_step": 169694, "epoch": 2044} {"train_loss": -24.0091609954834, "global_step": 169695, "epoch": 2044} {"train_loss": -23.652137756347656, "global_step": 169696, "epoch": 2044} {"train_loss": -23.874950408935547, "global_step": 169697, "epoch": 2044} {"train_loss": -23.375919342041016, "global_step": 169698, "epoch": 2044} {"train_loss": -23.67809295654297, "global_step": 169699, "epoch": 2044} {"train_loss": -23.887554168701172, "global_step": 169700, "epoch": 2044} {"train_loss": -23.839874267578125, "global_step": 169701, "epoch": 2044} {"train_loss": -23.730321884155273, "global_step": 169702, "epoch": 2044} {"train_loss": -23.86097526550293, "global_step": 169703, "epoch": 2044} {"train_loss": -23.7933349609375, "global_step": 169704, "epoch": 2044} {"train_loss": -23.797494888305664, "global_step": 169705, "epoch": 2044} {"train_loss": -24.053491592407227, "global_step": 169706, "epoch": 2044} {"train_loss": -23.863862991333008, "global_step": 169707, "epoch": 2044} {"train_loss": -23.59370994567871, "global_step": 169708, "epoch": 2044} {"train_loss": -23.487024307250977, "global_step": 169709, "epoch": 2044} {"train_loss": -23.676013946533203, "global_step": 169710, "epoch": 2044} {"train_loss": -23.812376022338867, "global_step": 169711, "epoch": 2044} {"train_loss": -23.44936752319336, "global_step": 169712, "epoch": 2044} {"train_loss": -23.598539352416992, "global_step": 169713, "epoch": 2044} {"train_loss": -23.308515548706055, "global_step": 169714, "epoch": 2044} {"train_loss": -23.443220138549805, "global_step": 169715, "epoch": 2044} {"train_loss": -24.0489559173584, "global_step": 169716, "epoch": 2044} {"train_loss": -23.82708168029785, "global_step": 169717, "epoch": 2044} {"train_loss": -23.763442993164062, "global_step": 169718, "epoch": 2044} {"train_loss": -23.53474235534668, "global_step": 169719, "epoch": 2044} {"train_loss": -24.074174880981445, "global_step": 169720, "epoch": 2044} {"train_loss": -23.781957626342773, "global_step": 169721, "epoch": 2044} {"train_loss": -23.515478134155273, "global_step": 169722, "epoch": 2044} {"train_loss": -23.8196964263916, "global_step": 169723, "epoch": 2044} {"train_loss": -23.45074462890625, "global_step": 169724, "epoch": 2044} {"train_loss": -23.556472778320312, "global_step": 169725, "epoch": 2044} {"train_loss": -23.316139221191406, "global_step": 169726, "epoch": 2044} {"train_loss": -23.36995506286621, "global_step": 169727, "epoch": 2044} {"train_loss": -24.017663955688477, "global_step": 169728, "epoch": 2044} {"train_loss": -23.655380249023438, "global_step": 169729, "epoch": 2044} {"train_loss": -23.52540397644043, "global_step": 169730, "epoch": 2044} {"train_loss": -23.613807678222656, "global_step": 169731, "epoch": 2044} {"train_loss": -23.363325119018555, "global_step": 169732, "epoch": 2044} {"train_loss": -23.47890853881836, "global_step": 169733, "epoch": 2044} {"train_loss": -23.596356035715125, "global_step": 169734, "epoch": 2044, "val_loss": 6330551.0} {"train_loss": -22.748828887939453, "global_step": 169735, "epoch": 2045} {"train_loss": -22.918554306030273, "global_step": 169736, "epoch": 2045} {"train_loss": -23.27304458618164, "global_step": 169737, "epoch": 2045} {"train_loss": -22.561965942382812, "global_step": 169738, "epoch": 2045} {"train_loss": -23.5147647857666, "global_step": 169739, "epoch": 2045} {"train_loss": -23.025588989257812, "global_step": 169740, "epoch": 2045} {"train_loss": -22.90673828125, "global_step": 169741, "epoch": 2045} {"train_loss": -23.144384384155273, "global_step": 169742, "epoch": 2045} {"train_loss": -23.037277221679688, "global_step": 169743, "epoch": 2045} {"train_loss": -23.151777267456055, "global_step": 169744, "epoch": 2045} {"train_loss": -23.48529624938965, "global_step": 169745, "epoch": 2045} {"train_loss": -23.52753257751465, "global_step": 169746, "epoch": 2045} {"train_loss": -23.42060089111328, "global_step": 169747, "epoch": 2045} {"train_loss": -23.572711944580078, "global_step": 169748, "epoch": 2045} {"train_loss": -23.463205337524414, "global_step": 169749, "epoch": 2045} {"train_loss": -23.566822052001953, "global_step": 169750, "epoch": 2045} {"train_loss": -23.351957321166992, "global_step": 169751, "epoch": 2045} {"train_loss": -23.547216415405273, "global_step": 169752, "epoch": 2045} {"train_loss": -23.304977416992188, "global_step": 169753, "epoch": 2045} {"train_loss": -23.730527877807617, "global_step": 169754, "epoch": 2045} {"train_loss": -23.666484832763672, "global_step": 169755, "epoch": 2045} {"train_loss": -23.90010643005371, "global_step": 169756, "epoch": 2045} {"train_loss": -23.509883880615234, "global_step": 169757, "epoch": 2045} {"train_loss": -23.63041114807129, "global_step": 169758, "epoch": 2045} {"train_loss": -23.645557403564453, "global_step": 169759, "epoch": 2045} {"train_loss": -23.468788146972656, "global_step": 169760, "epoch": 2045} {"train_loss": -24.155736923217773, "global_step": 169761, "epoch": 2045} {"train_loss": -23.65041160583496, "global_step": 169762, "epoch": 2045} {"train_loss": -23.68381118774414, "global_step": 169763, "epoch": 2045} {"train_loss": -23.896244049072266, "global_step": 169764, "epoch": 2045} {"train_loss": -23.595495223999023, "global_step": 169765, "epoch": 2045} {"train_loss": -23.704233169555664, "global_step": 169766, "epoch": 2045} {"train_loss": -23.902301788330078, "global_step": 169767, "epoch": 2045} {"train_loss": -23.436513900756836, "global_step": 169768, "epoch": 2045} {"train_loss": -23.51944351196289, "global_step": 169769, "epoch": 2045} {"train_loss": -23.31403160095215, "global_step": 169770, "epoch": 2045} {"train_loss": -23.69402503967285, "global_step": 169771, "epoch": 2045} {"train_loss": -23.402334213256836, "global_step": 169772, "epoch": 2045} {"train_loss": -23.536380767822266, "global_step": 169773, "epoch": 2045} {"train_loss": -23.878662109375, "global_step": 169774, "epoch": 2045} {"train_loss": -23.7896785736084, "global_step": 169775, "epoch": 2045} {"train_loss": -23.817445755004883, "global_step": 169776, "epoch": 2045} {"train_loss": -23.683347702026367, "global_step": 169777, "epoch": 2045} {"train_loss": -23.87444496154785, "global_step": 169778, "epoch": 2045} {"train_loss": -23.6787166595459, "global_step": 169779, "epoch": 2045} {"train_loss": -23.677412033081055, "global_step": 169780, "epoch": 2045} {"train_loss": -23.975767135620117, "global_step": 169781, "epoch": 2045} {"train_loss": -23.57692527770996, "global_step": 169782, "epoch": 2045} {"train_loss": -23.967594146728516, "global_step": 169783, "epoch": 2045} {"train_loss": -23.967191696166992, "global_step": 169784, "epoch": 2045} {"train_loss": -23.85660171508789, "global_step": 169785, "epoch": 2045} {"train_loss": -23.645822525024414, "global_step": 169786, "epoch": 2045} {"train_loss": -23.55674171447754, "global_step": 169787, "epoch": 2045} {"train_loss": -24.006145477294922, "global_step": 169788, "epoch": 2045} {"train_loss": -23.628326416015625, "global_step": 169789, "epoch": 2045} {"train_loss": -23.784658432006836, "global_step": 169790, "epoch": 2045} {"train_loss": -23.86507797241211, "global_step": 169791, "epoch": 2045} {"train_loss": -23.908273696899414, "global_step": 169792, "epoch": 2045} {"train_loss": -23.915327072143555, "global_step": 169793, "epoch": 2045} {"train_loss": -24.030773162841797, "global_step": 169794, "epoch": 2045} {"train_loss": -24.056821823120117, "global_step": 169795, "epoch": 2045} {"train_loss": -23.839292526245117, "global_step": 169796, "epoch": 2045} {"train_loss": -24.186893463134766, "global_step": 169797, "epoch": 2045} {"train_loss": -24.151748657226562, "global_step": 169798, "epoch": 2045} {"train_loss": -23.68631935119629, "global_step": 169799, "epoch": 2045} {"train_loss": -23.557666778564453, "global_step": 169800, "epoch": 2045} {"train_loss": -23.8155460357666, "global_step": 169801, "epoch": 2045} {"train_loss": -23.393476486206055, "global_step": 169802, "epoch": 2045} {"train_loss": -23.54454231262207, "global_step": 169803, "epoch": 2045} {"train_loss": -23.050100326538086, "global_step": 169804, "epoch": 2045} {"train_loss": -23.17697525024414, "global_step": 169805, "epoch": 2045} {"train_loss": -23.519287109375, "global_step": 169806, "epoch": 2045} {"train_loss": -23.320585250854492, "global_step": 169807, "epoch": 2045} {"train_loss": -22.8953914642334, "global_step": 169808, "epoch": 2045} {"train_loss": -23.46558952331543, "global_step": 169809, "epoch": 2045} {"train_loss": -23.456995010375977, "global_step": 169810, "epoch": 2045} {"train_loss": -23.57954978942871, "global_step": 169811, "epoch": 2045} {"train_loss": -23.500001907348633, "global_step": 169812, "epoch": 2045} {"train_loss": -23.536314010620117, "global_step": 169813, "epoch": 2045} {"train_loss": -23.409730911254883, "global_step": 169814, "epoch": 2045} {"train_loss": -23.71641731262207, "global_step": 169815, "epoch": 2045} {"train_loss": -23.469650268554688, "global_step": 169816, "epoch": 2045} {"train_loss": -23.565515150506812, "global_step": 169817, "epoch": 2045, "val_loss": 6365014.0} {"train_loss": -22.983243942260742, "global_step": 169818, "epoch": 2046} {"train_loss": -22.45816993713379, "global_step": 169819, "epoch": 2046} {"train_loss": -23.37824058532715, "global_step": 169820, "epoch": 2046} {"train_loss": -22.9982967376709, "global_step": 169821, "epoch": 2046} {"train_loss": -22.948917388916016, "global_step": 169822, "epoch": 2046} {"train_loss": -23.20595359802246, "global_step": 169823, "epoch": 2046} {"train_loss": -23.04279327392578, "global_step": 169824, "epoch": 2046} {"train_loss": -23.172210693359375, "global_step": 169825, "epoch": 2046} {"train_loss": -23.320898056030273, "global_step": 169826, "epoch": 2046} {"train_loss": -23.478811264038086, "global_step": 169827, "epoch": 2046} {"train_loss": -23.424734115600586, "global_step": 169828, "epoch": 2046} {"train_loss": -23.721839904785156, "global_step": 169829, "epoch": 2046} {"train_loss": -23.394033432006836, "global_step": 169830, "epoch": 2046} {"train_loss": -23.295480728149414, "global_step": 169831, "epoch": 2046} {"train_loss": -23.397531509399414, "global_step": 169832, "epoch": 2046} {"train_loss": -23.574655532836914, "global_step": 169833, "epoch": 2046} {"train_loss": -23.282773971557617, "global_step": 169834, "epoch": 2046} {"train_loss": -23.653860092163086, "global_step": 169835, "epoch": 2046} {"train_loss": -23.187179565429688, "global_step": 169836, "epoch": 2046} {"train_loss": -23.8162899017334, "global_step": 169837, "epoch": 2046} {"train_loss": -23.74513053894043, "global_step": 169838, "epoch": 2046} {"train_loss": -23.330677032470703, "global_step": 169839, "epoch": 2046} {"train_loss": -23.49907112121582, "global_step": 169840, "epoch": 2046} {"train_loss": -23.681547164916992, "global_step": 169841, "epoch": 2046} {"train_loss": -23.57674789428711, "global_step": 169842, "epoch": 2046} {"train_loss": -23.55133819580078, "global_step": 169843, "epoch": 2046} {"train_loss": -23.696853637695312, "global_step": 169844, "epoch": 2046} {"train_loss": -23.85109519958496, "global_step": 169845, "epoch": 2046} {"train_loss": -23.67720603942871, "global_step": 169846, "epoch": 2046} {"train_loss": -24.03398323059082, "global_step": 169847, "epoch": 2046} {"train_loss": -23.34297752380371, "global_step": 169848, "epoch": 2046} {"train_loss": -23.850101470947266, "global_step": 169849, "epoch": 2046} {"train_loss": -23.83525276184082, "global_step": 169850, "epoch": 2046} {"train_loss": -23.748367309570312, "global_step": 169851, "epoch": 2046} {"train_loss": -23.71617317199707, "global_step": 169852, "epoch": 2046} {"train_loss": -23.675138473510742, "global_step": 169853, "epoch": 2046} {"train_loss": -23.86297607421875, "global_step": 169854, "epoch": 2046} {"train_loss": -23.709997177124023, "global_step": 169855, "epoch": 2046} {"train_loss": -23.603084564208984, "global_step": 169856, "epoch": 2046} {"train_loss": -23.54865264892578, "global_step": 169857, "epoch": 2046} {"train_loss": -23.60134506225586, "global_step": 169858, "epoch": 2046} {"train_loss": -23.88356590270996, "global_step": 169859, "epoch": 2046} {"train_loss": -23.730121612548828, "global_step": 169860, "epoch": 2046} {"train_loss": -23.85249137878418, "global_step": 169861, "epoch": 2046} {"train_loss": -23.7270565032959, "global_step": 169862, "epoch": 2046} {"train_loss": -23.806020736694336, "global_step": 169863, "epoch": 2046} {"train_loss": -24.228992462158203, "global_step": 169864, "epoch": 2046} {"train_loss": -23.970251083374023, "global_step": 169865, "epoch": 2046} {"train_loss": -24.001371383666992, "global_step": 169866, "epoch": 2046} {"train_loss": -23.593412399291992, "global_step": 169867, "epoch": 2046} {"train_loss": -23.907461166381836, "global_step": 169868, "epoch": 2046} {"train_loss": -23.5673828125, "global_step": 169869, "epoch": 2046} {"train_loss": -23.43013572692871, "global_step": 169870, "epoch": 2046} {"train_loss": -23.72548484802246, "global_step": 169871, "epoch": 2046} {"train_loss": -23.820659637451172, "global_step": 169872, "epoch": 2046} {"train_loss": -23.949722290039062, "global_step": 169873, "epoch": 2046} {"train_loss": -23.37665367126465, "global_step": 169874, "epoch": 2046} {"train_loss": -23.662586212158203, "global_step": 169875, "epoch": 2046} {"train_loss": -23.78592872619629, "global_step": 169876, "epoch": 2046} {"train_loss": -23.813751220703125, "global_step": 169877, "epoch": 2046} {"train_loss": -24.042871475219727, "global_step": 169878, "epoch": 2046} {"train_loss": -23.588401794433594, "global_step": 169879, "epoch": 2046} {"train_loss": -24.29396629333496, "global_step": 169880, "epoch": 2046} {"train_loss": -23.680578231811523, "global_step": 169881, "epoch": 2046} {"train_loss": -23.2257022857666, "global_step": 169882, "epoch": 2046} {"train_loss": -23.50904083251953, "global_step": 169883, "epoch": 2046} {"train_loss": -23.73504066467285, "global_step": 169884, "epoch": 2046} {"train_loss": -23.504606246948242, "global_step": 169885, "epoch": 2046} {"train_loss": -23.784570693969727, "global_step": 169886, "epoch": 2046} {"train_loss": -23.823165893554688, "global_step": 169887, "epoch": 2046} {"train_loss": -23.600744247436523, "global_step": 169888, "epoch": 2046} {"train_loss": -23.952795028686523, "global_step": 169889, "epoch": 2046} {"train_loss": -23.772998809814453, "global_step": 169890, "epoch": 2046} {"train_loss": -23.780887603759766, "global_step": 169891, "epoch": 2046} {"train_loss": -24.042057037353516, "global_step": 169892, "epoch": 2046} {"train_loss": -23.67266082763672, "global_step": 169893, "epoch": 2046} {"train_loss": -23.481277465820312, "global_step": 169894, "epoch": 2046} {"train_loss": -23.940370559692383, "global_step": 169895, "epoch": 2046} {"train_loss": -23.649524688720703, "global_step": 169896, "epoch": 2046} {"train_loss": -23.58855628967285, "global_step": 169897, "epoch": 2046} {"train_loss": -23.64667320251465, "global_step": 169898, "epoch": 2046} {"train_loss": -23.770902633666992, "global_step": 169899, "epoch": 2046} {"train_loss": -23.622717960771308, "global_step": 169900, "epoch": 2046, "val_loss": 6510065.0} {"train_loss": -22.79648780822754, "global_step": 169901, "epoch": 2047} {"train_loss": -22.91913414001465, "global_step": 169902, "epoch": 2047} {"train_loss": -23.19399070739746, "global_step": 169903, "epoch": 2047} {"train_loss": -23.021995544433594, "global_step": 169904, "epoch": 2047} {"train_loss": -23.617952346801758, "global_step": 169905, "epoch": 2047} {"train_loss": -23.70155143737793, "global_step": 169906, "epoch": 2047} {"train_loss": -23.119998931884766, "global_step": 169907, "epoch": 2047} {"train_loss": -23.18294334411621, "global_step": 169908, "epoch": 2047} {"train_loss": -23.42439079284668, "global_step": 169909, "epoch": 2047} {"train_loss": -23.075544357299805, "global_step": 169910, "epoch": 2047} {"train_loss": -23.54368019104004, "global_step": 169911, "epoch": 2047} {"train_loss": -23.188032150268555, "global_step": 169912, "epoch": 2047} {"train_loss": -23.38041877746582, "global_step": 169913, "epoch": 2047} {"train_loss": -23.26375961303711, "global_step": 169914, "epoch": 2047} {"train_loss": -23.10539436340332, "global_step": 169915, "epoch": 2047} {"train_loss": -23.442306518554688, "global_step": 169916, "epoch": 2047} {"train_loss": -23.285400390625, "global_step": 169917, "epoch": 2047} {"train_loss": -23.426889419555664, "global_step": 169918, "epoch": 2047} {"train_loss": -23.44411277770996, "global_step": 169919, "epoch": 2047} {"train_loss": -23.44866371154785, "global_step": 169920, "epoch": 2047} {"train_loss": -23.230548858642578, "global_step": 169921, "epoch": 2047} {"train_loss": -23.472518920898438, "global_step": 169922, "epoch": 2047} {"train_loss": -23.753122329711914, "global_step": 169923, "epoch": 2047} {"train_loss": -23.571575164794922, "global_step": 169924, "epoch": 2047} {"train_loss": -23.80322265625, "global_step": 169925, "epoch": 2047} {"train_loss": -23.788793563842773, "global_step": 169926, "epoch": 2047} {"train_loss": -24.240421295166016, "global_step": 169927, "epoch": 2047} {"train_loss": -23.226470947265625, "global_step": 169928, "epoch": 2047} {"train_loss": -23.5211181640625, "global_step": 169929, "epoch": 2047} {"train_loss": -23.52530860900879, "global_step": 169930, "epoch": 2047} {"train_loss": -24.01584243774414, "global_step": 169931, "epoch": 2047} {"train_loss": -23.732114791870117, "global_step": 169932, "epoch": 2047} {"train_loss": -23.512372970581055, "global_step": 169933, "epoch": 2047} {"train_loss": -23.490829467773438, "global_step": 169934, "epoch": 2047} {"train_loss": -23.695650100708008, "global_step": 169935, "epoch": 2047} {"train_loss": -23.889928817749023, "global_step": 169936, "epoch": 2047} {"train_loss": -23.529922485351562, "global_step": 169937, "epoch": 2047} {"train_loss": -23.6313533782959, "global_step": 169938, "epoch": 2047} {"train_loss": -23.930179595947266, "global_step": 169939, "epoch": 2047} {"train_loss": -23.90806007385254, "global_step": 169940, "epoch": 2047} {"train_loss": -23.684608459472656, "global_step": 169941, "epoch": 2047} {"train_loss": -23.858348846435547, "global_step": 169942, "epoch": 2047} {"train_loss": -23.855064392089844, "global_step": 169943, "epoch": 2047} {"train_loss": -23.677717208862305, "global_step": 169944, "epoch": 2047} {"train_loss": -23.7971248626709, "global_step": 169945, "epoch": 2047} {"train_loss": -23.724315643310547, "global_step": 169946, "epoch": 2047} {"train_loss": -23.652177810668945, "global_step": 169947, "epoch": 2047} {"train_loss": -24.002206802368164, "global_step": 169948, "epoch": 2047} {"train_loss": -23.9974365234375, "global_step": 169949, "epoch": 2047} {"train_loss": -23.872934341430664, "global_step": 169950, "epoch": 2047} {"train_loss": -23.715234756469727, "global_step": 169951, "epoch": 2047} {"train_loss": -24.40631103515625, "global_step": 169952, "epoch": 2047} {"train_loss": -23.80754280090332, "global_step": 169953, "epoch": 2047} {"train_loss": -23.695384979248047, "global_step": 169954, "epoch": 2047} {"train_loss": -23.92919921875, "global_step": 169955, "epoch": 2047} {"train_loss": -23.922496795654297, "global_step": 169956, "epoch": 2047} {"train_loss": -23.552608489990234, "global_step": 169957, "epoch": 2047} {"train_loss": -23.778425216674805, "global_step": 169958, "epoch": 2047} {"train_loss": -23.673063278198242, "global_step": 169959, "epoch": 2047} {"train_loss": -23.508136749267578, "global_step": 169960, "epoch": 2047} {"train_loss": -23.785863876342773, "global_step": 169961, "epoch": 2047} {"train_loss": -23.484241485595703, "global_step": 169962, "epoch": 2047} {"train_loss": -23.720815658569336, "global_step": 169963, "epoch": 2047} {"train_loss": -23.223852157592773, "global_step": 169964, "epoch": 2047} {"train_loss": -23.54707908630371, "global_step": 169965, "epoch": 2047} {"train_loss": -23.45663833618164, "global_step": 169966, "epoch": 2047} {"train_loss": -23.761640548706055, "global_step": 169967, "epoch": 2047} {"train_loss": -23.4991455078125, "global_step": 169968, "epoch": 2047} {"train_loss": -23.8052978515625, "global_step": 169969, "epoch": 2047} {"train_loss": -23.976591110229492, "global_step": 169970, "epoch": 2047} {"train_loss": -23.909440994262695, "global_step": 169971, "epoch": 2047} {"train_loss": -23.67144203186035, "global_step": 169972, "epoch": 2047} {"train_loss": -23.48422622680664, "global_step": 169973, "epoch": 2047} {"train_loss": -23.545780181884766, "global_step": 169974, "epoch": 2047} {"train_loss": -23.376325607299805, "global_step": 169975, "epoch": 2047} {"train_loss": -23.485376358032227, "global_step": 169976, "epoch": 2047} {"train_loss": -23.889968872070312, "global_step": 169977, "epoch": 2047} {"train_loss": -23.648426055908203, "global_step": 169978, "epoch": 2047} {"train_loss": -23.6790828704834, "global_step": 169979, "epoch": 2047} {"train_loss": -23.644580841064453, "global_step": 169980, "epoch": 2047} {"train_loss": -23.64069175720215, "global_step": 169981, "epoch": 2047} {"train_loss": -23.879850387573242, "global_step": 169982, "epoch": 2047} {"train_loss": -23.61808875669916, "global_step": 169983, "epoch": 2047, "val_loss": 6341330.5} {"train_loss": -23.08171272277832, "global_step": 169984, "epoch": 2048} {"train_loss": -23.486265182495117, "global_step": 169985, "epoch": 2048} {"train_loss": -23.296714782714844, "global_step": 169986, "epoch": 2048} {"train_loss": -23.719148635864258, "global_step": 169987, "epoch": 2048} {"train_loss": -23.227102279663086, "global_step": 169988, "epoch": 2048} {"train_loss": -23.529855728149414, "global_step": 169989, "epoch": 2048} {"train_loss": -23.369247436523438, "global_step": 169990, "epoch": 2048} {"train_loss": -23.04426383972168, "global_step": 169991, "epoch": 2048} {"train_loss": -23.188745498657227, "global_step": 169992, "epoch": 2048} {"train_loss": -22.83607292175293, "global_step": 169993, "epoch": 2048} {"train_loss": -23.289875030517578, "global_step": 169994, "epoch": 2048} {"train_loss": -23.186376571655273, "global_step": 169995, "epoch": 2048} {"train_loss": -23.477092742919922, "global_step": 169996, "epoch": 2048} {"train_loss": -23.43435287475586, "global_step": 169997, "epoch": 2048} {"train_loss": -23.23607635498047, "global_step": 169998, "epoch": 2048} {"train_loss": -23.56663703918457, "global_step": 169999, "epoch": 2048} {"train_loss": -23.349782943725586, "global_step": 170000, "epoch": 2048} {"train_loss": -23.44925880432129, "global_step": 170001, "epoch": 2048} {"train_loss": -23.491025924682617, "global_step": 170002, "epoch": 2048} {"train_loss": -23.62552261352539, "global_step": 170003, "epoch": 2048} {"train_loss": -23.268842697143555, "global_step": 170004, "epoch": 2048} {"train_loss": -23.520994186401367, "global_step": 170005, "epoch": 2048} {"train_loss": -23.733264923095703, "global_step": 170006, "epoch": 2048} {"train_loss": -23.647428512573242, "global_step": 170007, "epoch": 2048} {"train_loss": -23.37531280517578, "global_step": 170008, "epoch": 2048} {"train_loss": -24.05345344543457, "global_step": 170009, "epoch": 2048} {"train_loss": -23.93377113342285, "global_step": 170010, "epoch": 2048} {"train_loss": -23.746768951416016, "global_step": 170011, "epoch": 2048} {"train_loss": -23.42139434814453, "global_step": 170012, "epoch": 2048} {"train_loss": -23.9570369720459, "global_step": 170013, "epoch": 2048} {"train_loss": -23.76718521118164, "global_step": 170014, "epoch": 2048} {"train_loss": -23.87027359008789, "global_step": 170015, "epoch": 2048} {"train_loss": -24.08962059020996, "global_step": 170016, "epoch": 2048} {"train_loss": -23.652063369750977, "global_step": 170017, "epoch": 2048} {"train_loss": -23.687612533569336, "global_step": 170018, "epoch": 2048} {"train_loss": -23.37567710876465, "global_step": 170019, "epoch": 2048} {"train_loss": -24.029949188232422, "global_step": 170020, "epoch": 2048} {"train_loss": -23.792560577392578, "global_step": 170021, "epoch": 2048} {"train_loss": -23.4996395111084, "global_step": 170022, "epoch": 2048} {"train_loss": -23.948087692260742, "global_step": 170023, "epoch": 2048} {"train_loss": -24.058420181274414, "global_step": 170024, "epoch": 2048} {"train_loss": -23.777286529541016, "global_step": 170025, "epoch": 2048} {"train_loss": -23.672231674194336, "global_step": 170026, "epoch": 2048} {"train_loss": -23.499608993530273, "global_step": 170027, "epoch": 2048} {"train_loss": -23.813058853149414, "global_step": 170028, "epoch": 2048} {"train_loss": -23.892698287963867, "global_step": 170029, "epoch": 2048} {"train_loss": -23.736539840698242, "global_step": 170030, "epoch": 2048} {"train_loss": -23.02924346923828, "global_step": 170031, "epoch": 2048} {"train_loss": -23.419784545898438, "global_step": 170032, "epoch": 2048} {"train_loss": -23.282394409179688, "global_step": 170033, "epoch": 2048} {"train_loss": -23.951955795288086, "global_step": 170034, "epoch": 2048} {"train_loss": -23.55815887451172, "global_step": 170035, "epoch": 2048} {"train_loss": -23.494823455810547, "global_step": 170036, "epoch": 2048} {"train_loss": -23.57158851623535, "global_step": 170037, "epoch": 2048} {"train_loss": -23.623018264770508, "global_step": 170038, "epoch": 2048} {"train_loss": -23.506826400756836, "global_step": 170039, "epoch": 2048} {"train_loss": -23.809537887573242, "global_step": 170040, "epoch": 2048} {"train_loss": -23.391550064086914, "global_step": 170041, "epoch": 2048} {"train_loss": -23.72525405883789, "global_step": 170042, "epoch": 2048} {"train_loss": -23.463956832885742, "global_step": 170043, "epoch": 2048} {"train_loss": -23.76162338256836, "global_step": 170044, "epoch": 2048} {"train_loss": -23.909643173217773, "global_step": 170045, "epoch": 2048} {"train_loss": -23.82638931274414, "global_step": 170046, "epoch": 2048} {"train_loss": -23.706945419311523, "global_step": 170047, "epoch": 2048} {"train_loss": -23.899202346801758, "global_step": 170048, "epoch": 2048} {"train_loss": -23.772790908813477, "global_step": 170049, "epoch": 2048} {"train_loss": -23.780332565307617, "global_step": 170050, "epoch": 2048} {"train_loss": -23.595304489135742, "global_step": 170051, "epoch": 2048} {"train_loss": -23.64046287536621, "global_step": 170052, "epoch": 2048} {"train_loss": -23.733184814453125, "global_step": 170053, "epoch": 2048} {"train_loss": -23.856542587280273, "global_step": 170054, "epoch": 2048} {"train_loss": -23.975582122802734, "global_step": 170055, "epoch": 2048} {"train_loss": -23.716476440429688, "global_step": 170056, "epoch": 2048} {"train_loss": -23.82847023010254, "global_step": 170057, "epoch": 2048} {"train_loss": -23.689226150512695, "global_step": 170058, "epoch": 2048} {"train_loss": -23.919811248779297, "global_step": 170059, "epoch": 2048} {"train_loss": -23.86056900024414, "global_step": 170060, "epoch": 2048} {"train_loss": -23.41070556640625, "global_step": 170061, "epoch": 2048} {"train_loss": -23.053449630737305, "global_step": 170062, "epoch": 2048} {"train_loss": -23.820188522338867, "global_step": 170063, "epoch": 2048} {"train_loss": -24.2095947265625, "global_step": 170064, "epoch": 2048} {"train_loss": -23.343326568603516, "global_step": 170065, "epoch": 2048} {"train_loss": -23.58952251112605, "global_step": 170066, "epoch": 2048, "val_loss": 6437265.0} {"train_loss": -22.802204132080078, "global_step": 170067, "epoch": 2049} {"train_loss": -23.104272842407227, "global_step": 170068, "epoch": 2049} {"train_loss": -22.947772979736328, "global_step": 170069, "epoch": 2049} {"train_loss": -23.46722984313965, "global_step": 170070, "epoch": 2049} {"train_loss": -23.4162654876709, "global_step": 170071, "epoch": 2049} {"train_loss": -23.34271240234375, "global_step": 170072, "epoch": 2049} {"train_loss": -22.907917022705078, "global_step": 170073, "epoch": 2049} {"train_loss": -23.43658447265625, "global_step": 170074, "epoch": 2049} {"train_loss": -23.372329711914062, "global_step": 170075, "epoch": 2049} {"train_loss": -23.511564254760742, "global_step": 170076, "epoch": 2049} {"train_loss": -23.38829231262207, "global_step": 170077, "epoch": 2049} {"train_loss": -23.500375747680664, "global_step": 170078, "epoch": 2049} {"train_loss": -23.585668563842773, "global_step": 170079, "epoch": 2049} {"train_loss": -23.167150497436523, "global_step": 170080, "epoch": 2049} {"train_loss": -23.27557373046875, "global_step": 170081, "epoch": 2049} {"train_loss": -23.530941009521484, "global_step": 170082, "epoch": 2049} {"train_loss": -23.43587875366211, "global_step": 170083, "epoch": 2049} {"train_loss": -23.503238677978516, "global_step": 170084, "epoch": 2049} {"train_loss": -23.26520538330078, "global_step": 170085, "epoch": 2049} {"train_loss": -23.858186721801758, "global_step": 170086, "epoch": 2049} {"train_loss": -23.05623435974121, "global_step": 170087, "epoch": 2049} {"train_loss": -23.323959350585938, "global_step": 170088, "epoch": 2049} {"train_loss": -23.631086349487305, "global_step": 170089, "epoch": 2049} {"train_loss": -23.154403686523438, "global_step": 170090, "epoch": 2049} {"train_loss": -23.329723358154297, "global_step": 170091, "epoch": 2049} {"train_loss": -24.039119720458984, "global_step": 170092, "epoch": 2049} {"train_loss": -23.586538314819336, "global_step": 170093, "epoch": 2049} {"train_loss": -23.408878326416016, "global_step": 170094, "epoch": 2049} {"train_loss": -23.7626953125, "global_step": 170095, "epoch": 2049} {"train_loss": -23.647024154663086, "global_step": 170096, "epoch": 2049} {"train_loss": -23.404813766479492, "global_step": 170097, "epoch": 2049} {"train_loss": -23.370101928710938, "global_step": 170098, "epoch": 2049} {"train_loss": -23.306272506713867, "global_step": 170099, "epoch": 2049} {"train_loss": -23.66228675842285, "global_step": 170100, "epoch": 2049} {"train_loss": -23.7346134185791, "global_step": 170101, "epoch": 2049} {"train_loss": -23.861371994018555, "global_step": 170102, "epoch": 2049} {"train_loss": -23.803386688232422, "global_step": 170103, "epoch": 2049} {"train_loss": -23.77882957458496, "global_step": 170104, "epoch": 2049} {"train_loss": -23.84427833557129, "global_step": 170105, "epoch": 2049} {"train_loss": -23.487817764282227, "global_step": 170106, "epoch": 2049} {"train_loss": -23.815664291381836, "global_step": 170107, "epoch": 2049} {"train_loss": -23.963788986206055, "global_step": 170108, "epoch": 2049} {"train_loss": -23.49979591369629, "global_step": 170109, "epoch": 2049} {"train_loss": -23.926862716674805, "global_step": 170110, "epoch": 2049} {"train_loss": -23.519073486328125, "global_step": 170111, "epoch": 2049} {"train_loss": -23.562419891357422, "global_step": 170112, "epoch": 2049} {"train_loss": -24.014497756958008, "global_step": 170113, "epoch": 2049} {"train_loss": -23.639789581298828, "global_step": 170114, "epoch": 2049} {"train_loss": -23.609472274780273, "global_step": 170115, "epoch": 2049} {"train_loss": -23.746007919311523, "global_step": 170116, "epoch": 2049} {"train_loss": -23.826141357421875, "global_step": 170117, "epoch": 2049} {"train_loss": -23.519535064697266, "global_step": 170118, "epoch": 2049} {"train_loss": -23.599817276000977, "global_step": 170119, "epoch": 2049} {"train_loss": -23.98665428161621, "global_step": 170120, "epoch": 2049} {"train_loss": -23.781400680541992, "global_step": 170121, "epoch": 2049} {"train_loss": -23.88602066040039, "global_step": 170122, "epoch": 2049} {"train_loss": -23.44219398498535, "global_step": 170123, "epoch": 2049} {"train_loss": -23.7657413482666, "global_step": 170124, "epoch": 2049} {"train_loss": -23.169639587402344, "global_step": 170125, "epoch": 2049} {"train_loss": -23.833789825439453, "global_step": 170126, "epoch": 2049} {"train_loss": -23.94757080078125, "global_step": 170127, "epoch": 2049} {"train_loss": -23.720853805541992, "global_step": 170128, "epoch": 2049} {"train_loss": -24.114789962768555, "global_step": 170129, "epoch": 2049} {"train_loss": -23.729829788208008, "global_step": 170130, "epoch": 2049} {"train_loss": -23.94904136657715, "global_step": 170131, "epoch": 2049} {"train_loss": -23.58363914489746, "global_step": 170132, "epoch": 2049} {"train_loss": -24.096467971801758, "global_step": 170133, "epoch": 2049} {"train_loss": -23.489648818969727, "global_step": 170134, "epoch": 2049} {"train_loss": -24.220834732055664, "global_step": 170135, "epoch": 2049} {"train_loss": -24.024147033691406, "global_step": 170136, "epoch": 2049} {"train_loss": -23.614452362060547, "global_step": 170137, "epoch": 2049} {"train_loss": -23.722570419311523, "global_step": 170138, "epoch": 2049} {"train_loss": -23.85528564453125, "global_step": 170139, "epoch": 2049} {"train_loss": -23.524860382080078, "global_step": 170140, "epoch": 2049} {"train_loss": -23.66779136657715, "global_step": 170141, "epoch": 2049} {"train_loss": -23.69719886779785, "global_step": 170142, "epoch": 2049} {"train_loss": -23.971677780151367, "global_step": 170143, "epoch": 2049} {"train_loss": -23.817113876342773, "global_step": 170144, "epoch": 2049} {"train_loss": -23.109180450439453, "global_step": 170145, "epoch": 2049} {"train_loss": -23.315805435180664, "global_step": 170146, "epoch": 2049} {"train_loss": -23.822141647338867, "global_step": 170147, "epoch": 2049} {"train_loss": -23.88992691040039, "global_step": 170148, "epoch": 2049} {"train_loss": -23.61244130421834, "global_step": 170149, "epoch": 2049, "val_loss": 6406372.0} {"train_loss": -23.13134765625, "global_step": 170150, "epoch": 2050} {"train_loss": -23.582767486572266, "global_step": 170151, "epoch": 2050} {"train_loss": -23.14167594909668, "global_step": 170152, "epoch": 2050} {"train_loss": -23.3225154876709, "global_step": 170153, "epoch": 2050} {"train_loss": -23.529922485351562, "global_step": 170154, "epoch": 2050} {"train_loss": -23.18643569946289, "global_step": 170155, "epoch": 2050} {"train_loss": -23.197927474975586, "global_step": 170156, "epoch": 2050} {"train_loss": -23.737882614135742, "global_step": 170157, "epoch": 2050} {"train_loss": -23.74359893798828, "global_step": 170158, "epoch": 2050} {"train_loss": -23.555814743041992, "global_step": 170159, "epoch": 2050} {"train_loss": -23.53679847717285, "global_step": 170160, "epoch": 2050} {"train_loss": -23.653127670288086, "global_step": 170161, "epoch": 2050} {"train_loss": -23.851909637451172, "global_step": 170162, "epoch": 2050} {"train_loss": -23.107044219970703, "global_step": 170163, "epoch": 2050} {"train_loss": -23.337223052978516, "global_step": 170164, "epoch": 2050} {"train_loss": -23.027578353881836, "global_step": 170165, "epoch": 2050} {"train_loss": -23.412555694580078, "global_step": 170166, "epoch": 2050} {"train_loss": -23.625343322753906, "global_step": 170167, "epoch": 2050} {"train_loss": -23.36418342590332, "global_step": 170168, "epoch": 2050} {"train_loss": -23.290607452392578, "global_step": 170169, "epoch": 2050} {"train_loss": -23.75593376159668, "global_step": 170170, "epoch": 2050} {"train_loss": -23.483320236206055, "global_step": 170171, "epoch": 2050} {"train_loss": -23.73394775390625, "global_step": 170172, "epoch": 2050} {"train_loss": -23.916309356689453, "global_step": 170173, "epoch": 2050} {"train_loss": -23.543588638305664, "global_step": 170174, "epoch": 2050} {"train_loss": -23.624629974365234, "global_step": 170175, "epoch": 2050} {"train_loss": -23.704614639282227, "global_step": 170176, "epoch": 2050} {"train_loss": -23.419559478759766, "global_step": 170177, "epoch": 2050} {"train_loss": -23.55571746826172, "global_step": 170178, "epoch": 2050} {"train_loss": -23.85215187072754, "global_step": 170179, "epoch": 2050} {"train_loss": -23.766508102416992, "global_step": 170180, "epoch": 2050} {"train_loss": -23.628559112548828, "global_step": 170181, "epoch": 2050} {"train_loss": -23.958730697631836, "global_step": 170182, "epoch": 2050} {"train_loss": -23.9190731048584, "global_step": 170183, "epoch": 2050} {"train_loss": -23.578004837036133, "global_step": 170184, "epoch": 2050} {"train_loss": -23.768692016601562, "global_step": 170185, "epoch": 2050} {"train_loss": -23.289581298828125, "global_step": 170186, "epoch": 2050} {"train_loss": -23.73870849609375, "global_step": 170187, "epoch": 2050} {"train_loss": -23.497610092163086, "global_step": 170188, "epoch": 2050} {"train_loss": -23.697669982910156, "global_step": 170189, "epoch": 2050} {"train_loss": -24.12872314453125, "global_step": 170190, "epoch": 2050} {"train_loss": -23.879291534423828, "global_step": 170191, "epoch": 2050} {"train_loss": -23.373252868652344, "global_step": 170192, "epoch": 2050} {"train_loss": -23.97041893005371, "global_step": 170193, "epoch": 2050} {"train_loss": -23.765138626098633, "global_step": 170194, "epoch": 2050} {"train_loss": -23.827077865600586, "global_step": 170195, "epoch": 2050} {"train_loss": -24.045080184936523, "global_step": 170196, "epoch": 2050} {"train_loss": -23.792224884033203, "global_step": 170197, "epoch": 2050} {"train_loss": -23.634611129760742, "global_step": 170198, "epoch": 2050} {"train_loss": -24.008277893066406, "global_step": 170199, "epoch": 2050} {"train_loss": -23.678998947143555, "global_step": 170200, "epoch": 2050} {"train_loss": -23.486204147338867, "global_step": 170201, "epoch": 2050} {"train_loss": -24.125864028930664, "global_step": 170202, "epoch": 2050} {"train_loss": -23.70475959777832, "global_step": 170203, "epoch": 2050} {"train_loss": -23.77779197692871, "global_step": 170204, "epoch": 2050} {"train_loss": -23.42560386657715, "global_step": 170205, "epoch": 2050} {"train_loss": -24.149091720581055, "global_step": 170206, "epoch": 2050} {"train_loss": -24.1691837310791, "global_step": 170207, "epoch": 2050} {"train_loss": -23.587953567504883, "global_step": 170208, "epoch": 2050} {"train_loss": -23.596052169799805, "global_step": 170209, "epoch": 2050} {"train_loss": -23.79652214050293, "global_step": 170210, "epoch": 2050} {"train_loss": -23.701324462890625, "global_step": 170211, "epoch": 2050} {"train_loss": -23.93553352355957, "global_step": 170212, "epoch": 2050} {"train_loss": -23.779354095458984, "global_step": 170213, "epoch": 2050} {"train_loss": -23.35687828063965, "global_step": 170214, "epoch": 2050} {"train_loss": -23.65199851989746, "global_step": 170215, "epoch": 2050} {"train_loss": -23.493988037109375, "global_step": 170216, "epoch": 2050} {"train_loss": -23.829452514648438, "global_step": 170217, "epoch": 2050} {"train_loss": -24.13240623474121, "global_step": 170218, "epoch": 2050} {"train_loss": -23.7417049407959, "global_step": 170219, "epoch": 2050} {"train_loss": -23.80999183654785, "global_step": 170220, "epoch": 2050} {"train_loss": -23.834280014038086, "global_step": 170221, "epoch": 2050} {"train_loss": -23.631513595581055, "global_step": 170222, "epoch": 2050} {"train_loss": -23.610687255859375, "global_step": 170223, "epoch": 2050} {"train_loss": -23.52788734436035, "global_step": 170224, "epoch": 2050} {"train_loss": -23.704875946044922, "global_step": 170225, "epoch": 2050} {"train_loss": -23.63543701171875, "global_step": 170226, "epoch": 2050} {"train_loss": -23.477216720581055, "global_step": 170227, "epoch": 2050} {"train_loss": -24.004684448242188, "global_step": 170228, "epoch": 2050} {"train_loss": -23.2401123046875, "global_step": 170229, "epoch": 2050} {"train_loss": -23.734359741210938, "global_step": 170230, "epoch": 2050} {"train_loss": -23.52119255065918, "global_step": 170231, "epoch": 2050} {"train_loss": -23.654520678232952, "global_step": 170232, "epoch": 2050, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6391005.0} {"train_loss": -23.160430908203125, "global_step": 170233, "epoch": 2051} {"train_loss": -22.305553436279297, "global_step": 170234, "epoch": 2051} {"train_loss": -23.09955406188965, "global_step": 170235, "epoch": 2051} {"train_loss": -22.980958938598633, "global_step": 170236, "epoch": 2051} {"train_loss": -22.759992599487305, "global_step": 170237, "epoch": 2051} {"train_loss": -23.27308464050293, "global_step": 170238, "epoch": 2051} {"train_loss": -23.0145206451416, "global_step": 170239, "epoch": 2051} {"train_loss": -23.05824089050293, "global_step": 170240, "epoch": 2051} {"train_loss": -23.64578628540039, "global_step": 170241, "epoch": 2051} {"train_loss": -23.783920288085938, "global_step": 170242, "epoch": 2051} {"train_loss": -23.536951065063477, "global_step": 170243, "epoch": 2051} {"train_loss": -23.42388343811035, "global_step": 170244, "epoch": 2051} {"train_loss": -23.12989616394043, "global_step": 170245, "epoch": 2051} {"train_loss": -23.164228439331055, "global_step": 170246, "epoch": 2051} {"train_loss": -23.49608039855957, "global_step": 170247, "epoch": 2051} {"train_loss": -23.41840934753418, "global_step": 170248, "epoch": 2051} {"train_loss": -23.538612365722656, "global_step": 170249, "epoch": 2051} {"train_loss": -23.52167320251465, "global_step": 170250, "epoch": 2051} {"train_loss": -23.524267196655273, "global_step": 170251, "epoch": 2051} {"train_loss": -23.097570419311523, "global_step": 170252, "epoch": 2051} {"train_loss": -23.289474487304688, "global_step": 170253, "epoch": 2051} {"train_loss": -23.17245101928711, "global_step": 170254, "epoch": 2051} {"train_loss": -23.671768188476562, "global_step": 170255, "epoch": 2051} {"train_loss": -23.40157127380371, "global_step": 170256, "epoch": 2051} {"train_loss": -23.52592658996582, "global_step": 170257, "epoch": 2051} {"train_loss": -23.6075496673584, "global_step": 170258, "epoch": 2051} {"train_loss": -23.87299919128418, "global_step": 170259, "epoch": 2051} {"train_loss": -23.525001525878906, "global_step": 170260, "epoch": 2051} {"train_loss": -23.543331146240234, "global_step": 170261, "epoch": 2051} {"train_loss": -23.798480987548828, "global_step": 170262, "epoch": 2051} {"train_loss": -23.68170738220215, "global_step": 170263, "epoch": 2051} {"train_loss": -23.551467895507812, "global_step": 170264, "epoch": 2051} {"train_loss": -23.650836944580078, "global_step": 170265, "epoch": 2051} {"train_loss": -23.475461959838867, "global_step": 170266, "epoch": 2051} {"train_loss": -23.524560928344727, "global_step": 170267, "epoch": 2051} {"train_loss": -24.06654167175293, "global_step": 170268, "epoch": 2051} {"train_loss": -23.81290626525879, "global_step": 170269, "epoch": 2051} {"train_loss": -23.456533432006836, "global_step": 170270, "epoch": 2051} {"train_loss": -23.802764892578125, "global_step": 170271, "epoch": 2051} {"train_loss": -23.825220108032227, "global_step": 170272, "epoch": 2051} {"train_loss": -24.319107055664062, "global_step": 170273, "epoch": 2051} {"train_loss": -23.595029830932617, "global_step": 170274, "epoch": 2051} {"train_loss": -23.61200523376465, "global_step": 170275, "epoch": 2051} {"train_loss": -23.465402603149414, "global_step": 170276, "epoch": 2051} {"train_loss": -23.621601104736328, "global_step": 170277, "epoch": 2051} {"train_loss": -23.832014083862305, "global_step": 170278, "epoch": 2051} {"train_loss": -23.882036209106445, "global_step": 170279, "epoch": 2051} {"train_loss": -23.82074546813965, "global_step": 170280, "epoch": 2051} {"train_loss": -23.557483673095703, "global_step": 170281, "epoch": 2051} {"train_loss": -23.647714614868164, "global_step": 170282, "epoch": 2051} {"train_loss": -23.85608673095703, "global_step": 170283, "epoch": 2051} {"train_loss": -23.73750114440918, "global_step": 170284, "epoch": 2051} {"train_loss": -23.72678565979004, "global_step": 170285, "epoch": 2051} {"train_loss": -23.55379295349121, "global_step": 170286, "epoch": 2051} {"train_loss": -23.954025268554688, "global_step": 170287, "epoch": 2051} {"train_loss": -23.66499900817871, "global_step": 170288, "epoch": 2051} {"train_loss": -23.5964412689209, "global_step": 170289, "epoch": 2051} {"train_loss": -23.585113525390625, "global_step": 170290, "epoch": 2051} {"train_loss": -23.86543083190918, "global_step": 170291, "epoch": 2051} {"train_loss": -23.4932918548584, "global_step": 170292, "epoch": 2051} {"train_loss": -23.67026710510254, "global_step": 170293, "epoch": 2051} {"train_loss": -24.002525329589844, "global_step": 170294, "epoch": 2051} {"train_loss": -23.902347564697266, "global_step": 170295, "epoch": 2051} {"train_loss": -23.908527374267578, "global_step": 170296, "epoch": 2051} {"train_loss": -23.97426414489746, "global_step": 170297, "epoch": 2051} {"train_loss": -23.645978927612305, "global_step": 170298, "epoch": 2051} {"train_loss": -23.97113037109375, "global_step": 170299, "epoch": 2051} {"train_loss": -23.91261100769043, "global_step": 170300, "epoch": 2051} {"train_loss": -23.963796615600586, "global_step": 170301, "epoch": 2051} {"train_loss": -24.02976417541504, "global_step": 170302, "epoch": 2051} {"train_loss": -23.645645141601562, "global_step": 170303, "epoch": 2051} {"train_loss": -24.173460006713867, "global_step": 170304, "epoch": 2051} {"train_loss": -23.83188247680664, "global_step": 170305, "epoch": 2051} {"train_loss": -23.614057540893555, "global_step": 170306, "epoch": 2051} {"train_loss": -24.01171112060547, "global_step": 170307, "epoch": 2051} {"train_loss": -23.934654235839844, "global_step": 170308, "epoch": 2051} {"train_loss": -23.945816040039062, "global_step": 170309, "epoch": 2051} {"train_loss": -24.203393936157227, "global_step": 170310, "epoch": 2051} {"train_loss": -24.03350830078125, "global_step": 170311, "epoch": 2051} {"train_loss": -24.080791473388672, "global_step": 170312, "epoch": 2051} {"train_loss": -23.820377349853516, "global_step": 170313, "epoch": 2051} {"train_loss": -23.727802276611328, "global_step": 170314, "epoch": 2051} {"train_loss": -23.65128831978304, "global_step": 170315, "epoch": 2051, "val_loss": 6364651.0} {"train_loss": -23.727874755859375, "global_step": 170316, "epoch": 2052} {"train_loss": -23.0850887298584, "global_step": 170317, "epoch": 2052} {"train_loss": -23.706472396850586, "global_step": 170318, "epoch": 2052} {"train_loss": -23.329959869384766, "global_step": 170319, "epoch": 2052} {"train_loss": -22.918766021728516, "global_step": 170320, "epoch": 2052} {"train_loss": -23.060205459594727, "global_step": 170321, "epoch": 2052} {"train_loss": -22.96303367614746, "global_step": 170322, "epoch": 2052} {"train_loss": -23.625150680541992, "global_step": 170323, "epoch": 2052} {"train_loss": -23.312559127807617, "global_step": 170324, "epoch": 2052} {"train_loss": -23.44939613342285, "global_step": 170325, "epoch": 2052} {"train_loss": -23.643842697143555, "global_step": 170326, "epoch": 2052} {"train_loss": -23.825937271118164, "global_step": 170327, "epoch": 2052} {"train_loss": -23.871686935424805, "global_step": 170328, "epoch": 2052} {"train_loss": -23.63252830505371, "global_step": 170329, "epoch": 2052} {"train_loss": -23.78505516052246, "global_step": 170330, "epoch": 2052} {"train_loss": -23.18320083618164, "global_step": 170331, "epoch": 2052} {"train_loss": -23.64983558654785, "global_step": 170332, "epoch": 2052} {"train_loss": -24.064483642578125, "global_step": 170333, "epoch": 2052} {"train_loss": -23.904605865478516, "global_step": 170334, "epoch": 2052} {"train_loss": -23.683744430541992, "global_step": 170335, "epoch": 2052} {"train_loss": -23.406835556030273, "global_step": 170336, "epoch": 2052} {"train_loss": -23.726858139038086, "global_step": 170337, "epoch": 2052} {"train_loss": -23.84783935546875, "global_step": 170338, "epoch": 2052} {"train_loss": -23.560321807861328, "global_step": 170339, "epoch": 2052} {"train_loss": -23.55140495300293, "global_step": 170340, "epoch": 2052} {"train_loss": -24.11463737487793, "global_step": 170341, "epoch": 2052} {"train_loss": -24.040653228759766, "global_step": 170342, "epoch": 2052} {"train_loss": -23.85345458984375, "global_step": 170343, "epoch": 2052} {"train_loss": -23.547571182250977, "global_step": 170344, "epoch": 2052} {"train_loss": -23.802549362182617, "global_step": 170345, "epoch": 2052} {"train_loss": -23.934980392456055, "global_step": 170346, "epoch": 2052} {"train_loss": -23.59681510925293, "global_step": 170347, "epoch": 2052} {"train_loss": -24.0278377532959, "global_step": 170348, "epoch": 2052} {"train_loss": -23.84061050415039, "global_step": 170349, "epoch": 2052} {"train_loss": -23.830379486083984, "global_step": 170350, "epoch": 2052} {"train_loss": -23.863210678100586, "global_step": 170351, "epoch": 2052} {"train_loss": -23.497116088867188, "global_step": 170352, "epoch": 2052} {"train_loss": -24.24208641052246, "global_step": 170353, "epoch": 2052} {"train_loss": -23.599742889404297, "global_step": 170354, "epoch": 2052} {"train_loss": -24.177518844604492, "global_step": 170355, "epoch": 2052} {"train_loss": -23.630468368530273, "global_step": 170356, "epoch": 2052} {"train_loss": -23.555631637573242, "global_step": 170357, "epoch": 2052} {"train_loss": -23.409887313842773, "global_step": 170358, "epoch": 2052} {"train_loss": -23.43067741394043, "global_step": 170359, "epoch": 2052} {"train_loss": -23.09027099609375, "global_step": 170360, "epoch": 2052} {"train_loss": -23.77275848388672, "global_step": 170361, "epoch": 2052} {"train_loss": -23.849437713623047, "global_step": 170362, "epoch": 2052} {"train_loss": -23.43232536315918, "global_step": 170363, "epoch": 2052} {"train_loss": -23.441776275634766, "global_step": 170364, "epoch": 2052} {"train_loss": -23.486242294311523, "global_step": 170365, "epoch": 2052} {"train_loss": -23.610904693603516, "global_step": 170366, "epoch": 2052} {"train_loss": -23.626855850219727, "global_step": 170367, "epoch": 2052} {"train_loss": -23.2989559173584, "global_step": 170368, "epoch": 2052} {"train_loss": -23.409061431884766, "global_step": 170369, "epoch": 2052} {"train_loss": -23.991243362426758, "global_step": 170370, "epoch": 2052} {"train_loss": -23.43227195739746, "global_step": 170371, "epoch": 2052} {"train_loss": -23.808298110961914, "global_step": 170372, "epoch": 2052} {"train_loss": -23.41314125061035, "global_step": 170373, "epoch": 2052} {"train_loss": -23.35847282409668, "global_step": 170374, "epoch": 2052} {"train_loss": -23.454689025878906, "global_step": 170375, "epoch": 2052} {"train_loss": -23.8896541595459, "global_step": 170376, "epoch": 2052} {"train_loss": -23.628952026367188, "global_step": 170377, "epoch": 2052} {"train_loss": -23.462112426757812, "global_step": 170378, "epoch": 2052} {"train_loss": -23.701642990112305, "global_step": 170379, "epoch": 2052} {"train_loss": -23.256317138671875, "global_step": 170380, "epoch": 2052} {"train_loss": -23.657794952392578, "global_step": 170381, "epoch": 2052} {"train_loss": -23.233489990234375, "global_step": 170382, "epoch": 2052} {"train_loss": -23.465784072875977, "global_step": 170383, "epoch": 2052} {"train_loss": -23.46702003479004, "global_step": 170384, "epoch": 2052} {"train_loss": -23.654621124267578, "global_step": 170385, "epoch": 2052} {"train_loss": -23.542325973510742, "global_step": 170386, "epoch": 2052} {"train_loss": -23.5430850982666, "global_step": 170387, "epoch": 2052} {"train_loss": -23.448118209838867, "global_step": 170388, "epoch": 2052} {"train_loss": -23.3046817779541, "global_step": 170389, "epoch": 2052} {"train_loss": -23.71925926208496, "global_step": 170390, "epoch": 2052} {"train_loss": -23.219762802124023, "global_step": 170391, "epoch": 2052} {"train_loss": -23.53162384033203, "global_step": 170392, "epoch": 2052} {"train_loss": -23.794147491455078, "global_step": 170393, "epoch": 2052} {"train_loss": -23.494705200195312, "global_step": 170394, "epoch": 2052} {"train_loss": -23.56821060180664, "global_step": 170395, "epoch": 2052} {"train_loss": -23.298416137695312, "global_step": 170396, "epoch": 2052} {"train_loss": -23.686542510986328, "global_step": 170397, "epoch": 2052} {"train_loss": -23.57771857388048, "global_step": 170398, "epoch": 2052, "val_loss": 6427393.0} {"train_loss": -23.26980972290039, "global_step": 170399, "epoch": 2053} {"train_loss": -22.682737350463867, "global_step": 170400, "epoch": 2053} {"train_loss": -22.551815032958984, "global_step": 170401, "epoch": 2053} {"train_loss": -23.383413314819336, "global_step": 170402, "epoch": 2053} {"train_loss": -23.336170196533203, "global_step": 170403, "epoch": 2053} {"train_loss": -23.287437438964844, "global_step": 170404, "epoch": 2053} {"train_loss": -23.5811824798584, "global_step": 170405, "epoch": 2053} {"train_loss": -23.553730010986328, "global_step": 170406, "epoch": 2053} {"train_loss": -23.52048683166504, "global_step": 170407, "epoch": 2053} {"train_loss": -23.058475494384766, "global_step": 170408, "epoch": 2053} {"train_loss": -23.768756866455078, "global_step": 170409, "epoch": 2053} {"train_loss": -23.65813446044922, "global_step": 170410, "epoch": 2053} {"train_loss": -23.60822105407715, "global_step": 170411, "epoch": 2053} {"train_loss": -23.683557510375977, "global_step": 170412, "epoch": 2053} {"train_loss": -23.532730102539062, "global_step": 170413, "epoch": 2053} {"train_loss": -23.248525619506836, "global_step": 170414, "epoch": 2053} {"train_loss": -23.679000854492188, "global_step": 170415, "epoch": 2053} {"train_loss": -23.50168228149414, "global_step": 170416, "epoch": 2053} {"train_loss": -23.546810150146484, "global_step": 170417, "epoch": 2053} {"train_loss": -23.488195419311523, "global_step": 170418, "epoch": 2053} {"train_loss": -23.55733299255371, "global_step": 170419, "epoch": 2053} {"train_loss": -23.60858726501465, "global_step": 170420, "epoch": 2053} {"train_loss": -23.6500186920166, "global_step": 170421, "epoch": 2053} {"train_loss": -23.425586700439453, "global_step": 170422, "epoch": 2053} {"train_loss": -23.534732818603516, "global_step": 170423, "epoch": 2053} {"train_loss": -23.592702865600586, "global_step": 170424, "epoch": 2053} {"train_loss": -23.645437240600586, "global_step": 170425, "epoch": 2053} {"train_loss": -23.753524780273438, "global_step": 170426, "epoch": 2053} {"train_loss": -23.618900299072266, "global_step": 170427, "epoch": 2053} {"train_loss": -23.424503326416016, "global_step": 170428, "epoch": 2053} {"train_loss": -23.574064254760742, "global_step": 170429, "epoch": 2053} {"train_loss": -24.279403686523438, "global_step": 170430, "epoch": 2053} {"train_loss": -24.15545654296875, "global_step": 170431, "epoch": 2053} {"train_loss": -23.696680068969727, "global_step": 170432, "epoch": 2053} {"train_loss": -23.64118003845215, "global_step": 170433, "epoch": 2053} {"train_loss": -23.806076049804688, "global_step": 170434, "epoch": 2053} {"train_loss": -24.065702438354492, "global_step": 170435, "epoch": 2053} {"train_loss": -24.1319637298584, "global_step": 170436, "epoch": 2053} {"train_loss": -23.977033615112305, "global_step": 170437, "epoch": 2053} {"train_loss": -23.996015548706055, "global_step": 170438, "epoch": 2053} {"train_loss": -23.522544860839844, "global_step": 170439, "epoch": 2053} {"train_loss": -23.608905792236328, "global_step": 170440, "epoch": 2053} {"train_loss": -24.007802963256836, "global_step": 170441, "epoch": 2053} {"train_loss": -23.95004653930664, "global_step": 170442, "epoch": 2053} {"train_loss": -24.178516387939453, "global_step": 170443, "epoch": 2053} {"train_loss": -23.402376174926758, "global_step": 170444, "epoch": 2053} {"train_loss": -23.58527946472168, "global_step": 170445, "epoch": 2053} {"train_loss": -23.508115768432617, "global_step": 170446, "epoch": 2053} {"train_loss": -23.592775344848633, "global_step": 170447, "epoch": 2053} {"train_loss": -23.61171531677246, "global_step": 170448, "epoch": 2053} {"train_loss": -23.8541316986084, "global_step": 170449, "epoch": 2053} {"train_loss": -23.292877197265625, "global_step": 170450, "epoch": 2053} {"train_loss": -23.070920944213867, "global_step": 170451, "epoch": 2053} {"train_loss": -22.87380027770996, "global_step": 170452, "epoch": 2053} {"train_loss": -23.522897720336914, "global_step": 170453, "epoch": 2053} {"train_loss": -23.82283592224121, "global_step": 170454, "epoch": 2053} {"train_loss": -23.456439971923828, "global_step": 170455, "epoch": 2053} {"train_loss": -23.8786563873291, "global_step": 170456, "epoch": 2053} {"train_loss": -23.567630767822266, "global_step": 170457, "epoch": 2053} {"train_loss": -23.893945693969727, "global_step": 170458, "epoch": 2053} {"train_loss": -23.875980377197266, "global_step": 170459, "epoch": 2053} {"train_loss": -23.80940055847168, "global_step": 170460, "epoch": 2053} {"train_loss": -23.593252182006836, "global_step": 170461, "epoch": 2053} {"train_loss": -23.729049682617188, "global_step": 170462, "epoch": 2053} {"train_loss": -23.748828887939453, "global_step": 170463, "epoch": 2053} {"train_loss": -23.76897621154785, "global_step": 170464, "epoch": 2053} {"train_loss": -23.697216033935547, "global_step": 170465, "epoch": 2053} {"train_loss": -23.843679428100586, "global_step": 170466, "epoch": 2053} {"train_loss": -23.3171329498291, "global_step": 170467, "epoch": 2053} {"train_loss": -23.90315055847168, "global_step": 170468, "epoch": 2053} {"train_loss": -23.984786987304688, "global_step": 170469, "epoch": 2053} {"train_loss": -23.776138305664062, "global_step": 170470, "epoch": 2053} {"train_loss": -23.887792587280273, "global_step": 170471, "epoch": 2053} {"train_loss": -23.780445098876953, "global_step": 170472, "epoch": 2053} {"train_loss": -24.14442253112793, "global_step": 170473, "epoch": 2053} {"train_loss": -23.53340721130371, "global_step": 170474, "epoch": 2053} {"train_loss": -23.785615921020508, "global_step": 170475, "epoch": 2053} {"train_loss": -23.836292266845703, "global_step": 170476, "epoch": 2053} {"train_loss": -23.519853591918945, "global_step": 170477, "epoch": 2053} {"train_loss": -23.98602867126465, "global_step": 170478, "epoch": 2053} {"train_loss": -23.94855499267578, "global_step": 170479, "epoch": 2053} {"train_loss": -23.652088165283203, "global_step": 170480, "epoch": 2053} {"train_loss": -23.642770882112433, "global_step": 170481, "epoch": 2053, "val_loss": 6319595.0} {"train_loss": -22.834951400756836, "global_step": 170482, "epoch": 2054} {"train_loss": -23.257488250732422, "global_step": 170483, "epoch": 2054} {"train_loss": -23.42939567565918, "global_step": 170484, "epoch": 2054} {"train_loss": -22.866125106811523, "global_step": 170485, "epoch": 2054} {"train_loss": -23.24187660217285, "global_step": 170486, "epoch": 2054} {"train_loss": -23.208831787109375, "global_step": 170487, "epoch": 2054} {"train_loss": -23.333934783935547, "global_step": 170488, "epoch": 2054} {"train_loss": -23.23012351989746, "global_step": 170489, "epoch": 2054} {"train_loss": -23.424732208251953, "global_step": 170490, "epoch": 2054} {"train_loss": -22.829065322875977, "global_step": 170491, "epoch": 2054} {"train_loss": -23.650283813476562, "global_step": 170492, "epoch": 2054} {"train_loss": -23.297800064086914, "global_step": 170493, "epoch": 2054} {"train_loss": -23.471738815307617, "global_step": 170494, "epoch": 2054} {"train_loss": -23.305723190307617, "global_step": 170495, "epoch": 2054} {"train_loss": -23.429231643676758, "global_step": 170496, "epoch": 2054} {"train_loss": -23.685895919799805, "global_step": 170497, "epoch": 2054} {"train_loss": -23.312936782836914, "global_step": 170498, "epoch": 2054} {"train_loss": -23.654972076416016, "global_step": 170499, "epoch": 2054} {"train_loss": -23.519445419311523, "global_step": 170500, "epoch": 2054} {"train_loss": -23.839162826538086, "global_step": 170501, "epoch": 2054} {"train_loss": -23.684219360351562, "global_step": 170502, "epoch": 2054} {"train_loss": -23.498966217041016, "global_step": 170503, "epoch": 2054} {"train_loss": -23.372312545776367, "global_step": 170504, "epoch": 2054} {"train_loss": -23.710468292236328, "global_step": 170505, "epoch": 2054} {"train_loss": -23.936525344848633, "global_step": 170506, "epoch": 2054} {"train_loss": -23.74032211303711, "global_step": 170507, "epoch": 2054} {"train_loss": -23.561429977416992, "global_step": 170508, "epoch": 2054} {"train_loss": -23.748151779174805, "global_step": 170509, "epoch": 2054} {"train_loss": -23.831336975097656, "global_step": 170510, "epoch": 2054} {"train_loss": -23.499120712280273, "global_step": 170511, "epoch": 2054} {"train_loss": -23.512189865112305, "global_step": 170512, "epoch": 2054} {"train_loss": -23.63724136352539, "global_step": 170513, "epoch": 2054} {"train_loss": -23.734642028808594, "global_step": 170514, "epoch": 2054} {"train_loss": -23.564653396606445, "global_step": 170515, "epoch": 2054} {"train_loss": -23.576040267944336, "global_step": 170516, "epoch": 2054} {"train_loss": -24.1629638671875, "global_step": 170517, "epoch": 2054} {"train_loss": -24.015369415283203, "global_step": 170518, "epoch": 2054} {"train_loss": -23.5385799407959, "global_step": 170519, "epoch": 2054} {"train_loss": -23.841039657592773, "global_step": 170520, "epoch": 2054} {"train_loss": -23.650192260742188, "global_step": 170521, "epoch": 2054} {"train_loss": -23.935094833374023, "global_step": 170522, "epoch": 2054} {"train_loss": -23.77220916748047, "global_step": 170523, "epoch": 2054} {"train_loss": -23.99700164794922, "global_step": 170524, "epoch": 2054} {"train_loss": -23.71372413635254, "global_step": 170525, "epoch": 2054} {"train_loss": -23.951309204101562, "global_step": 170526, "epoch": 2054} {"train_loss": -23.81888198852539, "global_step": 170527, "epoch": 2054} {"train_loss": -23.87566566467285, "global_step": 170528, "epoch": 2054} {"train_loss": -23.518381118774414, "global_step": 170529, "epoch": 2054} {"train_loss": -24.083189010620117, "global_step": 170530, "epoch": 2054} {"train_loss": -23.684236526489258, "global_step": 170531, "epoch": 2054} {"train_loss": -23.810089111328125, "global_step": 170532, "epoch": 2054} {"train_loss": -23.841218948364258, "global_step": 170533, "epoch": 2054} {"train_loss": -24.02058982849121, "global_step": 170534, "epoch": 2054} {"train_loss": -23.645544052124023, "global_step": 170535, "epoch": 2054} {"train_loss": -23.78544044494629, "global_step": 170536, "epoch": 2054} {"train_loss": -23.596773147583008, "global_step": 170537, "epoch": 2054} {"train_loss": -23.660215377807617, "global_step": 170538, "epoch": 2054} {"train_loss": -23.526840209960938, "global_step": 170539, "epoch": 2054} {"train_loss": -23.160816192626953, "global_step": 170540, "epoch": 2054} {"train_loss": -23.84282684326172, "global_step": 170541, "epoch": 2054} {"train_loss": -23.77269172668457, "global_step": 170542, "epoch": 2054} {"train_loss": -23.644290924072266, "global_step": 170543, "epoch": 2054} {"train_loss": -23.441770553588867, "global_step": 170544, "epoch": 2054} {"train_loss": -23.481557846069336, "global_step": 170545, "epoch": 2054} {"train_loss": -23.415130615234375, "global_step": 170546, "epoch": 2054} {"train_loss": -23.443464279174805, "global_step": 170547, "epoch": 2054} {"train_loss": -23.604930877685547, "global_step": 170548, "epoch": 2054} {"train_loss": -23.179397583007812, "global_step": 170549, "epoch": 2054} {"train_loss": -23.434778213500977, "global_step": 170550, "epoch": 2054} {"train_loss": -22.881038665771484, "global_step": 170551, "epoch": 2054} {"train_loss": -24.01456069946289, "global_step": 170552, "epoch": 2054} {"train_loss": -22.948711395263672, "global_step": 170553, "epoch": 2054} {"train_loss": -23.41910171508789, "global_step": 170554, "epoch": 2054} {"train_loss": -23.513044357299805, "global_step": 170555, "epoch": 2054} {"train_loss": -23.387365341186523, "global_step": 170556, "epoch": 2054} {"train_loss": -23.387983322143555, "global_step": 170557, "epoch": 2054} {"train_loss": -23.6314754486084, "global_step": 170558, "epoch": 2054} {"train_loss": -23.73771095275879, "global_step": 170559, "epoch": 2054} {"train_loss": -23.393827438354492, "global_step": 170560, "epoch": 2054} {"train_loss": -23.631925582885742, "global_step": 170561, "epoch": 2054} {"train_loss": -23.65445327758789, "global_step": 170562, "epoch": 2054} {"train_loss": -23.27933692932129, "global_step": 170563, "epoch": 2054} {"train_loss": -23.560121283473737, "global_step": 170564, "epoch": 2054, "val_loss": 6439747.5} {"train_loss": -23.00164794921875, "global_step": 170565, "epoch": 2055} {"train_loss": -23.444747924804688, "global_step": 170566, "epoch": 2055} {"train_loss": -23.403669357299805, "global_step": 170567, "epoch": 2055} {"train_loss": -23.060564041137695, "global_step": 170568, "epoch": 2055} {"train_loss": -23.53000259399414, "global_step": 170569, "epoch": 2055} {"train_loss": -23.722789764404297, "global_step": 170570, "epoch": 2055} {"train_loss": -23.5704402923584, "global_step": 170571, "epoch": 2055} {"train_loss": -23.846059799194336, "global_step": 170572, "epoch": 2055} {"train_loss": -23.280698776245117, "global_step": 170573, "epoch": 2055} {"train_loss": -23.466493606567383, "global_step": 170574, "epoch": 2055} {"train_loss": -24.094749450683594, "global_step": 170575, "epoch": 2055} {"train_loss": -23.08500099182129, "global_step": 170576, "epoch": 2055} {"train_loss": -23.76258659362793, "global_step": 170577, "epoch": 2055} {"train_loss": -23.5380916595459, "global_step": 170578, "epoch": 2055} {"train_loss": -23.583463668823242, "global_step": 170579, "epoch": 2055} {"train_loss": -23.564401626586914, "global_step": 170580, "epoch": 2055} {"train_loss": -23.742406845092773, "global_step": 170581, "epoch": 2055} {"train_loss": -23.98464012145996, "global_step": 170582, "epoch": 2055} {"train_loss": -23.74818229675293, "global_step": 170583, "epoch": 2055} {"train_loss": -23.90704345703125, "global_step": 170584, "epoch": 2055} {"train_loss": -23.448320388793945, "global_step": 170585, "epoch": 2055} {"train_loss": -23.642902374267578, "global_step": 170586, "epoch": 2055} {"train_loss": -23.556884765625, "global_step": 170587, "epoch": 2055} {"train_loss": -23.952775955200195, "global_step": 170588, "epoch": 2055} {"train_loss": -23.585561752319336, "global_step": 170589, "epoch": 2055} {"train_loss": -23.407535552978516, "global_step": 170590, "epoch": 2055} {"train_loss": -24.249717712402344, "global_step": 170591, "epoch": 2055} {"train_loss": -23.650495529174805, "global_step": 170592, "epoch": 2055} {"train_loss": -23.821659088134766, "global_step": 170593, "epoch": 2055} {"train_loss": -23.583372116088867, "global_step": 170594, "epoch": 2055} {"train_loss": -23.779144287109375, "global_step": 170595, "epoch": 2055} {"train_loss": -23.737340927124023, "global_step": 170596, "epoch": 2055} {"train_loss": -23.750837326049805, "global_step": 170597, "epoch": 2055} {"train_loss": -23.225505828857422, "global_step": 170598, "epoch": 2055} {"train_loss": -23.917659759521484, "global_step": 170599, "epoch": 2055} {"train_loss": -24.017492294311523, "global_step": 170600, "epoch": 2055} {"train_loss": -23.629125595092773, "global_step": 170601, "epoch": 2055} {"train_loss": -23.617399215698242, "global_step": 170602, "epoch": 2055} {"train_loss": -23.551855087280273, "global_step": 170603, "epoch": 2055} {"train_loss": -23.25127410888672, "global_step": 170604, "epoch": 2055} {"train_loss": -23.943195343017578, "global_step": 170605, "epoch": 2055} {"train_loss": -23.483882904052734, "global_step": 170606, "epoch": 2055} {"train_loss": -23.388824462890625, "global_step": 170607, "epoch": 2055} {"train_loss": -23.669687271118164, "global_step": 170608, "epoch": 2055} {"train_loss": -24.071298599243164, "global_step": 170609, "epoch": 2055} {"train_loss": -23.06378173828125, "global_step": 170610, "epoch": 2055} {"train_loss": -23.88162612915039, "global_step": 170611, "epoch": 2055} {"train_loss": -23.62967872619629, "global_step": 170612, "epoch": 2055} {"train_loss": -23.362409591674805, "global_step": 170613, "epoch": 2055} {"train_loss": -23.79110336303711, "global_step": 170614, "epoch": 2055} {"train_loss": -23.63960075378418, "global_step": 170615, "epoch": 2055} {"train_loss": -23.809080123901367, "global_step": 170616, "epoch": 2055} {"train_loss": -23.42413330078125, "global_step": 170617, "epoch": 2055} {"train_loss": -23.557188034057617, "global_step": 170618, "epoch": 2055} {"train_loss": -23.925189971923828, "global_step": 170619, "epoch": 2055} {"train_loss": -24.085908889770508, "global_step": 170620, "epoch": 2055} {"train_loss": -23.44675636291504, "global_step": 170621, "epoch": 2055} {"train_loss": -23.953842163085938, "global_step": 170622, "epoch": 2055} {"train_loss": -23.91632652282715, "global_step": 170623, "epoch": 2055} {"train_loss": -23.909351348876953, "global_step": 170624, "epoch": 2055} {"train_loss": -23.839590072631836, "global_step": 170625, "epoch": 2055} {"train_loss": -23.61384391784668, "global_step": 170626, "epoch": 2055} {"train_loss": -23.768362045288086, "global_step": 170627, "epoch": 2055} {"train_loss": -23.754379272460938, "global_step": 170628, "epoch": 2055} {"train_loss": -23.851964950561523, "global_step": 170629, "epoch": 2055} {"train_loss": -23.66305923461914, "global_step": 170630, "epoch": 2055} {"train_loss": -23.696273803710938, "global_step": 170631, "epoch": 2055} {"train_loss": -23.5508975982666, "global_step": 170632, "epoch": 2055} {"train_loss": -23.6511287689209, "global_step": 170633, "epoch": 2055} {"train_loss": -23.5954647064209, "global_step": 170634, "epoch": 2055} {"train_loss": -23.37549591064453, "global_step": 170635, "epoch": 2055} {"train_loss": -23.403234481811523, "global_step": 170636, "epoch": 2055} {"train_loss": -23.506057739257812, "global_step": 170637, "epoch": 2055} {"train_loss": -23.708316802978516, "global_step": 170638, "epoch": 2055} {"train_loss": -23.896886825561523, "global_step": 170639, "epoch": 2055} {"train_loss": -23.93257713317871, "global_step": 170640, "epoch": 2055} {"train_loss": -23.852251052856445, "global_step": 170641, "epoch": 2055} {"train_loss": -23.582395553588867, "global_step": 170642, "epoch": 2055} {"train_loss": -24.073869705200195, "global_step": 170643, "epoch": 2055} {"train_loss": -23.380456924438477, "global_step": 170644, "epoch": 2055} {"train_loss": -23.97429656982422, "global_step": 170645, "epoch": 2055} {"train_loss": -23.494888305664062, "global_step": 170646, "epoch": 2055} {"train_loss": -23.644695994365645, "global_step": 170647, "epoch": 2055, "val_loss": 6440335.0} {"train_loss": -23.829984664916992, "global_step": 170648, "epoch": 2056} {"train_loss": -23.607044219970703, "global_step": 170649, "epoch": 2056} {"train_loss": -23.83310890197754, "global_step": 170650, "epoch": 2056} {"train_loss": -23.670272827148438, "global_step": 170651, "epoch": 2056} {"train_loss": -23.416889190673828, "global_step": 170652, "epoch": 2056} {"train_loss": -24.020702362060547, "global_step": 170653, "epoch": 2056} {"train_loss": -23.643888473510742, "global_step": 170654, "epoch": 2056} {"train_loss": -23.431955337524414, "global_step": 170655, "epoch": 2056} {"train_loss": -23.070425033569336, "global_step": 170656, "epoch": 2056} {"train_loss": -23.553279876708984, "global_step": 170657, "epoch": 2056} {"train_loss": -23.748340606689453, "global_step": 170658, "epoch": 2056} {"train_loss": -23.846887588500977, "global_step": 170659, "epoch": 2056} {"train_loss": -23.533884048461914, "global_step": 170660, "epoch": 2056} {"train_loss": -23.406328201293945, "global_step": 170661, "epoch": 2056} {"train_loss": -23.99009895324707, "global_step": 170662, "epoch": 2056} {"train_loss": -23.235918045043945, "global_step": 170663, "epoch": 2056} {"train_loss": -23.649751663208008, "global_step": 170664, "epoch": 2056} {"train_loss": -23.41048240661621, "global_step": 170665, "epoch": 2056} {"train_loss": -23.557485580444336, "global_step": 170666, "epoch": 2056} {"train_loss": -23.39605712890625, "global_step": 170667, "epoch": 2056} {"train_loss": -23.497060775756836, "global_step": 170668, "epoch": 2056} {"train_loss": -23.803062438964844, "global_step": 170669, "epoch": 2056} {"train_loss": -23.815643310546875, "global_step": 170670, "epoch": 2056} {"train_loss": -23.664703369140625, "global_step": 170671, "epoch": 2056} {"train_loss": -23.754398345947266, "global_step": 170672, "epoch": 2056} {"train_loss": -23.546966552734375, "global_step": 170673, "epoch": 2056} {"train_loss": -24.05291748046875, "global_step": 170674, "epoch": 2056} {"train_loss": -23.04303550720215, "global_step": 170675, "epoch": 2056} {"train_loss": -24.04352378845215, "global_step": 170676, "epoch": 2056} {"train_loss": -23.72551155090332, "global_step": 170677, "epoch": 2056} {"train_loss": -23.66472625732422, "global_step": 170678, "epoch": 2056} {"train_loss": -23.583908081054688, "global_step": 170679, "epoch": 2056} {"train_loss": -23.67870330810547, "global_step": 170680, "epoch": 2056} {"train_loss": -24.134077072143555, "global_step": 170681, "epoch": 2056} {"train_loss": -23.749866485595703, "global_step": 170682, "epoch": 2056} {"train_loss": -23.767778396606445, "global_step": 170683, "epoch": 2056} {"train_loss": -23.331134796142578, "global_step": 170684, "epoch": 2056} {"train_loss": -23.6838436126709, "global_step": 170685, "epoch": 2056} {"train_loss": -23.729557037353516, "global_step": 170686, "epoch": 2056} {"train_loss": -23.771644592285156, "global_step": 170687, "epoch": 2056} {"train_loss": -23.801923751831055, "global_step": 170688, "epoch": 2056} {"train_loss": -23.800989151000977, "global_step": 170689, "epoch": 2056} {"train_loss": -23.78306007385254, "global_step": 170690, "epoch": 2056} {"train_loss": -23.978300094604492, "global_step": 170691, "epoch": 2056} {"train_loss": -23.923824310302734, "global_step": 170692, "epoch": 2056} {"train_loss": -23.614622116088867, "global_step": 170693, "epoch": 2056} {"train_loss": -24.02493667602539, "global_step": 170694, "epoch": 2056} {"train_loss": -23.89790153503418, "global_step": 170695, "epoch": 2056} {"train_loss": -24.051626205444336, "global_step": 170696, "epoch": 2056} {"train_loss": -23.688283920288086, "global_step": 170697, "epoch": 2056} {"train_loss": -23.39814567565918, "global_step": 170698, "epoch": 2056} {"train_loss": -23.69644546508789, "global_step": 170699, "epoch": 2056} {"train_loss": -23.925397872924805, "global_step": 170700, "epoch": 2056} {"train_loss": -23.383033752441406, "global_step": 170701, "epoch": 2056} {"train_loss": -22.94082260131836, "global_step": 170702, "epoch": 2056} {"train_loss": -23.76150894165039, "global_step": 170703, "epoch": 2056} {"train_loss": -23.584569931030273, "global_step": 170704, "epoch": 2056} {"train_loss": -24.0633602142334, "global_step": 170705, "epoch": 2056} {"train_loss": -23.530134201049805, "global_step": 170706, "epoch": 2056} {"train_loss": -24.05193519592285, "global_step": 170707, "epoch": 2056} {"train_loss": -23.78352928161621, "global_step": 170708, "epoch": 2056} {"train_loss": -23.633119583129883, "global_step": 170709, "epoch": 2056} {"train_loss": -23.628568649291992, "global_step": 170710, "epoch": 2056} {"train_loss": -23.891830444335938, "global_step": 170711, "epoch": 2056} {"train_loss": -23.912050247192383, "global_step": 170712, "epoch": 2056} {"train_loss": -23.727407455444336, "global_step": 170713, "epoch": 2056} {"train_loss": -23.61316680908203, "global_step": 170714, "epoch": 2056} {"train_loss": -23.717594146728516, "global_step": 170715, "epoch": 2056} {"train_loss": -23.524972915649414, "global_step": 170716, "epoch": 2056} {"train_loss": -23.568954467773438, "global_step": 170717, "epoch": 2056} {"train_loss": -23.8051815032959, "global_step": 170718, "epoch": 2056} {"train_loss": -23.631338119506836, "global_step": 170719, "epoch": 2056} {"train_loss": -24.143163681030273, "global_step": 170720, "epoch": 2056} {"train_loss": -23.543704986572266, "global_step": 170721, "epoch": 2056} {"train_loss": -23.862268447875977, "global_step": 170722, "epoch": 2056} {"train_loss": -23.530170440673828, "global_step": 170723, "epoch": 2056} {"train_loss": -23.682571411132812, "global_step": 170724, "epoch": 2056} {"train_loss": -23.610057830810547, "global_step": 170725, "epoch": 2056} {"train_loss": -23.651578903198242, "global_step": 170726, "epoch": 2056} {"train_loss": -23.552507400512695, "global_step": 170727, "epoch": 2056} {"train_loss": -23.328153610229492, "global_step": 170728, "epoch": 2056} {"train_loss": -23.685199737548828, "global_step": 170729, "epoch": 2056} {"train_loss": -23.665743563548627, "global_step": 170730, "epoch": 2056, "val_loss": 6309577.0} {"train_loss": -23.08784294128418, "global_step": 170731, "epoch": 2057} {"train_loss": -23.294235229492188, "global_step": 170732, "epoch": 2057} {"train_loss": -23.137365341186523, "global_step": 170733, "epoch": 2057} {"train_loss": -23.49044418334961, "global_step": 170734, "epoch": 2057} {"train_loss": -23.281713485717773, "global_step": 170735, "epoch": 2057} {"train_loss": -23.22635269165039, "global_step": 170736, "epoch": 2057} {"train_loss": -22.997848510742188, "global_step": 170737, "epoch": 2057} {"train_loss": -23.686725616455078, "global_step": 170738, "epoch": 2057} {"train_loss": -23.5438289642334, "global_step": 170739, "epoch": 2057} {"train_loss": -23.76070213317871, "global_step": 170740, "epoch": 2057} {"train_loss": -23.483928680419922, "global_step": 170741, "epoch": 2057} {"train_loss": -23.314544677734375, "global_step": 170742, "epoch": 2057} {"train_loss": -23.813308715820312, "global_step": 170743, "epoch": 2057} {"train_loss": -23.58888053894043, "global_step": 170744, "epoch": 2057} {"train_loss": -23.74652671813965, "global_step": 170745, "epoch": 2057} {"train_loss": -23.889606475830078, "global_step": 170746, "epoch": 2057} {"train_loss": -23.973379135131836, "global_step": 170747, "epoch": 2057} {"train_loss": -23.735519409179688, "global_step": 170748, "epoch": 2057} {"train_loss": -23.648212432861328, "global_step": 170749, "epoch": 2057} {"train_loss": -23.56556510925293, "global_step": 170750, "epoch": 2057} {"train_loss": -23.754262924194336, "global_step": 170751, "epoch": 2057} {"train_loss": -23.93464469909668, "global_step": 170752, "epoch": 2057} {"train_loss": -23.523639678955078, "global_step": 170753, "epoch": 2057} {"train_loss": -23.427358627319336, "global_step": 170754, "epoch": 2057} {"train_loss": -23.555097579956055, "global_step": 170755, "epoch": 2057} {"train_loss": -23.74354362487793, "global_step": 170756, "epoch": 2057} {"train_loss": -23.62970542907715, "global_step": 170757, "epoch": 2057} {"train_loss": -23.701854705810547, "global_step": 170758, "epoch": 2057} {"train_loss": -23.858407974243164, "global_step": 170759, "epoch": 2057} {"train_loss": -23.654022216796875, "global_step": 170760, "epoch": 2057} {"train_loss": -23.543298721313477, "global_step": 170761, "epoch": 2057} {"train_loss": -23.828771591186523, "global_step": 170762, "epoch": 2057} {"train_loss": -23.620899200439453, "global_step": 170763, "epoch": 2057} {"train_loss": -23.70516014099121, "global_step": 170764, "epoch": 2057} {"train_loss": -23.76792335510254, "global_step": 170765, "epoch": 2057} {"train_loss": -23.347393035888672, "global_step": 170766, "epoch": 2057} {"train_loss": -23.670557022094727, "global_step": 170767, "epoch": 2057} {"train_loss": -23.7862606048584, "global_step": 170768, "epoch": 2057} {"train_loss": -23.856325149536133, "global_step": 170769, "epoch": 2057} {"train_loss": -23.485610961914062, "global_step": 170770, "epoch": 2057} {"train_loss": -24.060243606567383, "global_step": 170771, "epoch": 2057} {"train_loss": -23.78914451599121, "global_step": 170772, "epoch": 2057} {"train_loss": -23.881755828857422, "global_step": 170773, "epoch": 2057} {"train_loss": -23.81967544555664, "global_step": 170774, "epoch": 2057} {"train_loss": -23.64162254333496, "global_step": 170775, "epoch": 2057} {"train_loss": -24.23473358154297, "global_step": 170776, "epoch": 2057} {"train_loss": -23.600311279296875, "global_step": 170777, "epoch": 2057} {"train_loss": -23.63942527770996, "global_step": 170778, "epoch": 2057} {"train_loss": -23.799888610839844, "global_step": 170779, "epoch": 2057} {"train_loss": -23.899917602539062, "global_step": 170780, "epoch": 2057} {"train_loss": -23.77269172668457, "global_step": 170781, "epoch": 2057} {"train_loss": -24.355512619018555, "global_step": 170782, "epoch": 2057} {"train_loss": -23.805753707885742, "global_step": 170783, "epoch": 2057} {"train_loss": -23.768465042114258, "global_step": 170784, "epoch": 2057} {"train_loss": -23.157302856445312, "global_step": 170785, "epoch": 2057} {"train_loss": -23.76852798461914, "global_step": 170786, "epoch": 2057} {"train_loss": -23.761981964111328, "global_step": 170787, "epoch": 2057} {"train_loss": -23.472064971923828, "global_step": 170788, "epoch": 2057} {"train_loss": -23.452190399169922, "global_step": 170789, "epoch": 2057} {"train_loss": -23.77605628967285, "global_step": 170790, "epoch": 2057} {"train_loss": -23.70770263671875, "global_step": 170791, "epoch": 2057} {"train_loss": -23.033782958984375, "global_step": 170792, "epoch": 2057} {"train_loss": -23.168319702148438, "global_step": 170793, "epoch": 2057} {"train_loss": -23.435514450073242, "global_step": 170794, "epoch": 2057} {"train_loss": -23.826248168945312, "global_step": 170795, "epoch": 2057} {"train_loss": -23.658645629882812, "global_step": 170796, "epoch": 2057} {"train_loss": -23.97732925415039, "global_step": 170797, "epoch": 2057} {"train_loss": -23.677371978759766, "global_step": 170798, "epoch": 2057} {"train_loss": -23.805322647094727, "global_step": 170799, "epoch": 2057} {"train_loss": -23.539016723632812, "global_step": 170800, "epoch": 2057} {"train_loss": -23.737585067749023, "global_step": 170801, "epoch": 2057} {"train_loss": -23.4208927154541, "global_step": 170802, "epoch": 2057} {"train_loss": -23.762161254882812, "global_step": 170803, "epoch": 2057} {"train_loss": -23.56977653503418, "global_step": 170804, "epoch": 2057} {"train_loss": -23.621084213256836, "global_step": 170805, "epoch": 2057} {"train_loss": -23.504667282104492, "global_step": 170806, "epoch": 2057} {"train_loss": -23.522903442382812, "global_step": 170807, "epoch": 2057} {"train_loss": -24.001676559448242, "global_step": 170808, "epoch": 2057} {"train_loss": -23.532468795776367, "global_step": 170809, "epoch": 2057} {"train_loss": -23.71699333190918, "global_step": 170810, "epoch": 2057} {"train_loss": -23.713918685913086, "global_step": 170811, "epoch": 2057} {"train_loss": -23.33717918395996, "global_step": 170812, "epoch": 2057} {"train_loss": -23.628999066640095, "global_step": 170813, "epoch": 2057, "val_loss": 6309684.0} {"train_loss": -23.193593978881836, "global_step": 170814, "epoch": 2058} {"train_loss": -22.78213882446289, "global_step": 170815, "epoch": 2058} {"train_loss": -23.544008255004883, "global_step": 170816, "epoch": 2058} {"train_loss": -22.691068649291992, "global_step": 170817, "epoch": 2058} {"train_loss": -22.175914764404297, "global_step": 170818, "epoch": 2058} {"train_loss": -23.13149070739746, "global_step": 170819, "epoch": 2058} {"train_loss": -23.040119171142578, "global_step": 170820, "epoch": 2058} {"train_loss": -22.82511329650879, "global_step": 170821, "epoch": 2058} {"train_loss": -22.98353385925293, "global_step": 170822, "epoch": 2058} {"train_loss": -23.12104606628418, "global_step": 170823, "epoch": 2058} {"train_loss": -23.30852699279785, "global_step": 170824, "epoch": 2058} {"train_loss": -23.221397399902344, "global_step": 170825, "epoch": 2058} {"train_loss": -23.869855880737305, "global_step": 170826, "epoch": 2058} {"train_loss": -23.03877830505371, "global_step": 170827, "epoch": 2058} {"train_loss": -23.148834228515625, "global_step": 170828, "epoch": 2058} {"train_loss": -23.297502517700195, "global_step": 170829, "epoch": 2058} {"train_loss": -23.344152450561523, "global_step": 170830, "epoch": 2058} {"train_loss": -23.019113540649414, "global_step": 170831, "epoch": 2058} {"train_loss": -23.70767593383789, "global_step": 170832, "epoch": 2058} {"train_loss": -22.952743530273438, "global_step": 170833, "epoch": 2058} {"train_loss": -23.3878173828125, "global_step": 170834, "epoch": 2058} {"train_loss": -23.83175277709961, "global_step": 170835, "epoch": 2058} {"train_loss": -22.93927574157715, "global_step": 170836, "epoch": 2058} {"train_loss": -23.26705551147461, "global_step": 170837, "epoch": 2058} {"train_loss": -23.446063995361328, "global_step": 170838, "epoch": 2058} {"train_loss": -23.226858139038086, "global_step": 170839, "epoch": 2058} {"train_loss": -23.455638885498047, "global_step": 170840, "epoch": 2058} {"train_loss": -23.771284103393555, "global_step": 170841, "epoch": 2058} {"train_loss": -23.270263671875, "global_step": 170842, "epoch": 2058} {"train_loss": -23.96196174621582, "global_step": 170843, "epoch": 2058} {"train_loss": -23.241790771484375, "global_step": 170844, "epoch": 2058} {"train_loss": -23.949033737182617, "global_step": 170845, "epoch": 2058} {"train_loss": -23.593891143798828, "global_step": 170846, "epoch": 2058} {"train_loss": -23.76109504699707, "global_step": 170847, "epoch": 2058} {"train_loss": -24.086530685424805, "global_step": 170848, "epoch": 2058} {"train_loss": -23.979005813598633, "global_step": 170849, "epoch": 2058} {"train_loss": -23.75554656982422, "global_step": 170850, "epoch": 2058} {"train_loss": -23.771047592163086, "global_step": 170851, "epoch": 2058} {"train_loss": -23.870689392089844, "global_step": 170852, "epoch": 2058} {"train_loss": -23.807764053344727, "global_step": 170853, "epoch": 2058} {"train_loss": -23.7806396484375, "global_step": 170854, "epoch": 2058} {"train_loss": -23.973108291625977, "global_step": 170855, "epoch": 2058} {"train_loss": -23.530521392822266, "global_step": 170856, "epoch": 2058} {"train_loss": -23.420551300048828, "global_step": 170857, "epoch": 2058} {"train_loss": -23.68484115600586, "global_step": 170858, "epoch": 2058} {"train_loss": -23.836563110351562, "global_step": 170859, "epoch": 2058} {"train_loss": -23.632986068725586, "global_step": 170860, "epoch": 2058} {"train_loss": -23.51270866394043, "global_step": 170861, "epoch": 2058} {"train_loss": -23.796171188354492, "global_step": 170862, "epoch": 2058} {"train_loss": -23.584402084350586, "global_step": 170863, "epoch": 2058} {"train_loss": -23.630468368530273, "global_step": 170864, "epoch": 2058} {"train_loss": -23.44879722595215, "global_step": 170865, "epoch": 2058} {"train_loss": -24.154212951660156, "global_step": 170866, "epoch": 2058} {"train_loss": -23.841915130615234, "global_step": 170867, "epoch": 2058} {"train_loss": -23.7380313873291, "global_step": 170868, "epoch": 2058} {"train_loss": -23.506155014038086, "global_step": 170869, "epoch": 2058} {"train_loss": -23.725421905517578, "global_step": 170870, "epoch": 2058} {"train_loss": -23.727842330932617, "global_step": 170871, "epoch": 2058} {"train_loss": -23.905715942382812, "global_step": 170872, "epoch": 2058} {"train_loss": -23.826772689819336, "global_step": 170873, "epoch": 2058} {"train_loss": -23.643526077270508, "global_step": 170874, "epoch": 2058} {"train_loss": -23.723398208618164, "global_step": 170875, "epoch": 2058} {"train_loss": -23.63181495666504, "global_step": 170876, "epoch": 2058} {"train_loss": -23.726612091064453, "global_step": 170877, "epoch": 2058} {"train_loss": -23.920475006103516, "global_step": 170878, "epoch": 2058} {"train_loss": -23.770811080932617, "global_step": 170879, "epoch": 2058} {"train_loss": -23.902910232543945, "global_step": 170880, "epoch": 2058} {"train_loss": -23.834821701049805, "global_step": 170881, "epoch": 2058} {"train_loss": -23.976354598999023, "global_step": 170882, "epoch": 2058} {"train_loss": -23.864927291870117, "global_step": 170883, "epoch": 2058} {"train_loss": -23.87666130065918, "global_step": 170884, "epoch": 2058} {"train_loss": -23.6380672454834, "global_step": 170885, "epoch": 2058} {"train_loss": -23.894319534301758, "global_step": 170886, "epoch": 2058} {"train_loss": -23.972185134887695, "global_step": 170887, "epoch": 2058} {"train_loss": -23.983510971069336, "global_step": 170888, "epoch": 2058} {"train_loss": -23.778242111206055, "global_step": 170889, "epoch": 2058} {"train_loss": -23.913888931274414, "global_step": 170890, "epoch": 2058} {"train_loss": -23.82033920288086, "global_step": 170891, "epoch": 2058} {"train_loss": -23.956844329833984, "global_step": 170892, "epoch": 2058} {"train_loss": -23.84696388244629, "global_step": 170893, "epoch": 2058} {"train_loss": -24.001798629760742, "global_step": 170894, "epoch": 2058} {"train_loss": -23.63431739807129, "global_step": 170895, "epoch": 2058} {"train_loss": -23.58584029416004, "global_step": 170896, "epoch": 2058, "val_loss": 6441749.0} {"train_loss": -23.323822021484375, "global_step": 170897, "epoch": 2059} {"train_loss": -23.440021514892578, "global_step": 170898, "epoch": 2059} {"train_loss": -22.957944869995117, "global_step": 170899, "epoch": 2059} {"train_loss": -23.108144760131836, "global_step": 170900, "epoch": 2059} {"train_loss": -23.080060958862305, "global_step": 170901, "epoch": 2059} {"train_loss": -23.55161476135254, "global_step": 170902, "epoch": 2059} {"train_loss": -23.21963882446289, "global_step": 170903, "epoch": 2059} {"train_loss": -23.440458297729492, "global_step": 170904, "epoch": 2059} {"train_loss": -23.322267532348633, "global_step": 170905, "epoch": 2059} {"train_loss": -23.481237411499023, "global_step": 170906, "epoch": 2059} {"train_loss": -23.079313278198242, "global_step": 170907, "epoch": 2059} {"train_loss": -22.885286331176758, "global_step": 170908, "epoch": 2059} {"train_loss": -23.747678756713867, "global_step": 170909, "epoch": 2059} {"train_loss": -23.546855926513672, "global_step": 170910, "epoch": 2059} {"train_loss": -23.382526397705078, "global_step": 170911, "epoch": 2059} {"train_loss": -23.538251876831055, "global_step": 170912, "epoch": 2059} {"train_loss": -23.360097885131836, "global_step": 170913, "epoch": 2059} {"train_loss": -23.56770133972168, "global_step": 170914, "epoch": 2059} {"train_loss": -23.623544692993164, "global_step": 170915, "epoch": 2059} {"train_loss": -23.329998016357422, "global_step": 170916, "epoch": 2059} {"train_loss": -23.638362884521484, "global_step": 170917, "epoch": 2059} {"train_loss": -23.408010482788086, "global_step": 170918, "epoch": 2059} {"train_loss": -23.670597076416016, "global_step": 170919, "epoch": 2059} {"train_loss": -23.183462142944336, "global_step": 170920, "epoch": 2059} {"train_loss": -23.612003326416016, "global_step": 170921, "epoch": 2059} {"train_loss": -23.75950050354004, "global_step": 170922, "epoch": 2059} {"train_loss": -23.666372299194336, "global_step": 170923, "epoch": 2059} {"train_loss": -23.736135482788086, "global_step": 170924, "epoch": 2059} {"train_loss": -23.242822647094727, "global_step": 170925, "epoch": 2059} {"train_loss": -23.880752563476562, "global_step": 170926, "epoch": 2059} {"train_loss": -23.574447631835938, "global_step": 170927, "epoch": 2059} {"train_loss": -23.74458122253418, "global_step": 170928, "epoch": 2059} {"train_loss": -23.932729721069336, "global_step": 170929, "epoch": 2059} {"train_loss": -24.0023250579834, "global_step": 170930, "epoch": 2059} {"train_loss": -23.935928344726562, "global_step": 170931, "epoch": 2059} {"train_loss": -23.907230377197266, "global_step": 170932, "epoch": 2059} {"train_loss": -23.458683013916016, "global_step": 170933, "epoch": 2059} {"train_loss": -23.550695419311523, "global_step": 170934, "epoch": 2059} {"train_loss": -24.00575065612793, "global_step": 170935, "epoch": 2059} {"train_loss": -23.9116153717041, "global_step": 170936, "epoch": 2059} {"train_loss": -23.842906951904297, "global_step": 170937, "epoch": 2059} {"train_loss": -23.595523834228516, "global_step": 170938, "epoch": 2059} {"train_loss": -24.04091453552246, "global_step": 170939, "epoch": 2059} {"train_loss": -23.944578170776367, "global_step": 170940, "epoch": 2059} {"train_loss": -23.89469337463379, "global_step": 170941, "epoch": 2059} {"train_loss": -23.71979331970215, "global_step": 170942, "epoch": 2059} {"train_loss": -23.742233276367188, "global_step": 170943, "epoch": 2059} {"train_loss": -23.637861251831055, "global_step": 170944, "epoch": 2059} {"train_loss": -23.742212295532227, "global_step": 170945, "epoch": 2059} {"train_loss": -23.41851806640625, "global_step": 170946, "epoch": 2059} {"train_loss": -23.960981369018555, "global_step": 170947, "epoch": 2059} {"train_loss": -23.61939239501953, "global_step": 170948, "epoch": 2059} {"train_loss": -23.488386154174805, "global_step": 170949, "epoch": 2059} {"train_loss": -23.646198272705078, "global_step": 170950, "epoch": 2059} {"train_loss": -24.027517318725586, "global_step": 170951, "epoch": 2059} {"train_loss": -24.14644432067871, "global_step": 170952, "epoch": 2059} {"train_loss": -24.09897804260254, "global_step": 170953, "epoch": 2059} {"train_loss": -23.73961067199707, "global_step": 170954, "epoch": 2059} {"train_loss": -23.823659896850586, "global_step": 170955, "epoch": 2059} {"train_loss": -23.841720581054688, "global_step": 170956, "epoch": 2059} {"train_loss": -23.419843673706055, "global_step": 170957, "epoch": 2059} {"train_loss": -23.7623291015625, "global_step": 170958, "epoch": 2059} {"train_loss": -23.637649536132812, "global_step": 170959, "epoch": 2059} {"train_loss": -23.885786056518555, "global_step": 170960, "epoch": 2059} {"train_loss": -23.556476593017578, "global_step": 170961, "epoch": 2059} {"train_loss": -23.67706298828125, "global_step": 170962, "epoch": 2059} {"train_loss": -23.190433502197266, "global_step": 170963, "epoch": 2059} {"train_loss": -24.128873825073242, "global_step": 170964, "epoch": 2059} {"train_loss": -23.633413314819336, "global_step": 170965, "epoch": 2059} {"train_loss": -23.752729415893555, "global_step": 170966, "epoch": 2059} {"train_loss": -24.16903305053711, "global_step": 170967, "epoch": 2059} {"train_loss": -23.829347610473633, "global_step": 170968, "epoch": 2059} {"train_loss": -23.68691062927246, "global_step": 170969, "epoch": 2059} {"train_loss": -23.85441017150879, "global_step": 170970, "epoch": 2059} {"train_loss": -23.64554214477539, "global_step": 170971, "epoch": 2059} {"train_loss": -23.189289093017578, "global_step": 170972, "epoch": 2059} {"train_loss": -23.778884887695312, "global_step": 170973, "epoch": 2059} {"train_loss": -23.26543617248535, "global_step": 170974, "epoch": 2059} {"train_loss": -23.488033294677734, "global_step": 170975, "epoch": 2059} {"train_loss": -23.592273712158203, "global_step": 170976, "epoch": 2059} {"train_loss": -23.365943908691406, "global_step": 170977, "epoch": 2059} {"train_loss": -23.679706573486328, "global_step": 170978, "epoch": 2059} {"train_loss": -23.612788303788886, "global_step": 170979, "epoch": 2059, "val_loss": 6350089.0} {"train_loss": -22.927236557006836, "global_step": 170980, "epoch": 2060} {"train_loss": -23.370098114013672, "global_step": 170981, "epoch": 2060} {"train_loss": -23.466413497924805, "global_step": 170982, "epoch": 2060} {"train_loss": -23.308218002319336, "global_step": 170983, "epoch": 2060} {"train_loss": -23.141164779663086, "global_step": 170984, "epoch": 2060} {"train_loss": -23.247241973876953, "global_step": 170985, "epoch": 2060} {"train_loss": -22.974843978881836, "global_step": 170986, "epoch": 2060} {"train_loss": -23.3804874420166, "global_step": 170987, "epoch": 2060} {"train_loss": -23.327470779418945, "global_step": 170988, "epoch": 2060} {"train_loss": -23.575159072875977, "global_step": 170989, "epoch": 2060} {"train_loss": -23.638513565063477, "global_step": 170990, "epoch": 2060} {"train_loss": -23.325265884399414, "global_step": 170991, "epoch": 2060} {"train_loss": -23.553665161132812, "global_step": 170992, "epoch": 2060} {"train_loss": -23.87770652770996, "global_step": 170993, "epoch": 2060} {"train_loss": -23.489593505859375, "global_step": 170994, "epoch": 2060} {"train_loss": -23.477731704711914, "global_step": 170995, "epoch": 2060} {"train_loss": -23.279478073120117, "global_step": 170996, "epoch": 2060} {"train_loss": -23.316375732421875, "global_step": 170997, "epoch": 2060} {"train_loss": -23.352611541748047, "global_step": 170998, "epoch": 2060} {"train_loss": -23.843669891357422, "global_step": 170999, "epoch": 2060} {"train_loss": -23.360088348388672, "global_step": 171000, "epoch": 2060} {"train_loss": -23.83558464050293, "global_step": 171001, "epoch": 2060} {"train_loss": -24.129255294799805, "global_step": 171002, "epoch": 2060} {"train_loss": -23.529897689819336, "global_step": 171003, "epoch": 2060} {"train_loss": -23.834136962890625, "global_step": 171004, "epoch": 2060} {"train_loss": -23.493423461914062, "global_step": 171005, "epoch": 2060} {"train_loss": -23.82526969909668, "global_step": 171006, "epoch": 2060} {"train_loss": -24.00734519958496, "global_step": 171007, "epoch": 2060} {"train_loss": -23.72427749633789, "global_step": 171008, "epoch": 2060} {"train_loss": -23.508731842041016, "global_step": 171009, "epoch": 2060} {"train_loss": -23.516477584838867, "global_step": 171010, "epoch": 2060} {"train_loss": -23.642642974853516, "global_step": 171011, "epoch": 2060} {"train_loss": -23.7814998626709, "global_step": 171012, "epoch": 2060} {"train_loss": -23.5961856842041, "global_step": 171013, "epoch": 2060} {"train_loss": -23.730175018310547, "global_step": 171014, "epoch": 2060} {"train_loss": -23.6424560546875, "global_step": 171015, "epoch": 2060} {"train_loss": -23.81622314453125, "global_step": 171016, "epoch": 2060} {"train_loss": -23.9630126953125, "global_step": 171017, "epoch": 2060} {"train_loss": -23.913354873657227, "global_step": 171018, "epoch": 2060} {"train_loss": -23.532760620117188, "global_step": 171019, "epoch": 2060} {"train_loss": -23.9809513092041, "global_step": 171020, "epoch": 2060} {"train_loss": -23.605260848999023, "global_step": 171021, "epoch": 2060} {"train_loss": -23.389326095581055, "global_step": 171022, "epoch": 2060} {"train_loss": -23.740997314453125, "global_step": 171023, "epoch": 2060} {"train_loss": -24.031787872314453, "global_step": 171024, "epoch": 2060} {"train_loss": -23.827604293823242, "global_step": 171025, "epoch": 2060} {"train_loss": -23.703269958496094, "global_step": 171026, "epoch": 2060} {"train_loss": -23.433664321899414, "global_step": 171027, "epoch": 2060} {"train_loss": -23.902925491333008, "global_step": 171028, "epoch": 2060} {"train_loss": -23.6794490814209, "global_step": 171029, "epoch": 2060} {"train_loss": -23.662256240844727, "global_step": 171030, "epoch": 2060} {"train_loss": -23.438278198242188, "global_step": 171031, "epoch": 2060} {"train_loss": -23.824628829956055, "global_step": 171032, "epoch": 2060} {"train_loss": -23.05126953125, "global_step": 171033, "epoch": 2060} {"train_loss": -23.398340225219727, "global_step": 171034, "epoch": 2060} {"train_loss": -23.902524948120117, "global_step": 171035, "epoch": 2060} {"train_loss": -23.4375057220459, "global_step": 171036, "epoch": 2060} {"train_loss": -23.430709838867188, "global_step": 171037, "epoch": 2060} {"train_loss": -23.49485969543457, "global_step": 171038, "epoch": 2060} {"train_loss": -23.701265335083008, "global_step": 171039, "epoch": 2060} {"train_loss": -23.492740631103516, "global_step": 171040, "epoch": 2060} {"train_loss": -23.82596778869629, "global_step": 171041, "epoch": 2060} {"train_loss": -23.708696365356445, "global_step": 171042, "epoch": 2060} {"train_loss": -23.853206634521484, "global_step": 171043, "epoch": 2060} {"train_loss": -23.814844131469727, "global_step": 171044, "epoch": 2060} {"train_loss": -23.896718978881836, "global_step": 171045, "epoch": 2060} {"train_loss": -23.57828140258789, "global_step": 171046, "epoch": 2060} {"train_loss": -23.945592880249023, "global_step": 171047, "epoch": 2060} {"train_loss": -23.209970474243164, "global_step": 171048, "epoch": 2060} {"train_loss": -23.5625, "global_step": 171049, "epoch": 2060} {"train_loss": -23.5526123046875, "global_step": 171050, "epoch": 2060} {"train_loss": -23.494672775268555, "global_step": 171051, "epoch": 2060} {"train_loss": -23.427955627441406, "global_step": 171052, "epoch": 2060} {"train_loss": -23.783954620361328, "global_step": 171053, "epoch": 2060} {"train_loss": -23.84455108642578, "global_step": 171054, "epoch": 2060} {"train_loss": -23.636947631835938, "global_step": 171055, "epoch": 2060} {"train_loss": -23.49408531188965, "global_step": 171056, "epoch": 2060} {"train_loss": -23.84421157836914, "global_step": 171057, "epoch": 2060} {"train_loss": -23.34239387512207, "global_step": 171058, "epoch": 2060} {"train_loss": -23.60939598083496, "global_step": 171059, "epoch": 2060} {"train_loss": -23.71129035949707, "global_step": 171060, "epoch": 2060} {"train_loss": -23.484586715698242, "global_step": 171061, "epoch": 2060} {"train_loss": -23.60532887010689, "global_step": 171062, "epoch": 2060, "val_loss": 6292644.0} {"train_loss": -23.194753646850586, "global_step": 171063, "epoch": 2061} {"train_loss": -23.32599449157715, "global_step": 171064, "epoch": 2061} {"train_loss": -23.51076316833496, "global_step": 171065, "epoch": 2061} {"train_loss": -23.006765365600586, "global_step": 171066, "epoch": 2061} {"train_loss": -23.08371353149414, "global_step": 171067, "epoch": 2061} {"train_loss": -23.577707290649414, "global_step": 171068, "epoch": 2061} {"train_loss": -23.260900497436523, "global_step": 171069, "epoch": 2061} {"train_loss": -23.31840705871582, "global_step": 171070, "epoch": 2061} {"train_loss": -23.630828857421875, "global_step": 171071, "epoch": 2061} {"train_loss": -23.449115753173828, "global_step": 171072, "epoch": 2061} {"train_loss": -23.19159698486328, "global_step": 171073, "epoch": 2061} {"train_loss": -23.267303466796875, "global_step": 171074, "epoch": 2061} {"train_loss": -23.85834312438965, "global_step": 171075, "epoch": 2061} {"train_loss": -23.46661376953125, "global_step": 171076, "epoch": 2061} {"train_loss": -23.836957931518555, "global_step": 171077, "epoch": 2061} {"train_loss": -23.87923240661621, "global_step": 171078, "epoch": 2061} {"train_loss": -23.573850631713867, "global_step": 171079, "epoch": 2061} {"train_loss": -23.544052124023438, "global_step": 171080, "epoch": 2061} {"train_loss": -23.3695125579834, "global_step": 171081, "epoch": 2061} {"train_loss": -24.11665153503418, "global_step": 171082, "epoch": 2061} {"train_loss": -23.2934627532959, "global_step": 171083, "epoch": 2061} {"train_loss": -23.77582359313965, "global_step": 171084, "epoch": 2061} {"train_loss": -23.873916625976562, "global_step": 171085, "epoch": 2061} {"train_loss": -23.609928131103516, "global_step": 171086, "epoch": 2061} {"train_loss": -23.70068359375, "global_step": 171087, "epoch": 2061} {"train_loss": -23.795551300048828, "global_step": 171088, "epoch": 2061} {"train_loss": -23.578100204467773, "global_step": 171089, "epoch": 2061} {"train_loss": -23.780733108520508, "global_step": 171090, "epoch": 2061} {"train_loss": -24.06049156188965, "global_step": 171091, "epoch": 2061} {"train_loss": -23.780574798583984, "global_step": 171092, "epoch": 2061} {"train_loss": -23.766080856323242, "global_step": 171093, "epoch": 2061} {"train_loss": -23.653671264648438, "global_step": 171094, "epoch": 2061} {"train_loss": -23.919429779052734, "global_step": 171095, "epoch": 2061} {"train_loss": -23.489696502685547, "global_step": 171096, "epoch": 2061} {"train_loss": -23.630945205688477, "global_step": 171097, "epoch": 2061} {"train_loss": -23.511167526245117, "global_step": 171098, "epoch": 2061} {"train_loss": -24.094242095947266, "global_step": 171099, "epoch": 2061} {"train_loss": -23.712778091430664, "global_step": 171100, "epoch": 2061} {"train_loss": -23.811445236206055, "global_step": 171101, "epoch": 2061} {"train_loss": -23.65610694885254, "global_step": 171102, "epoch": 2061} {"train_loss": -23.98164176940918, "global_step": 171103, "epoch": 2061} {"train_loss": -23.88850975036621, "global_step": 171104, "epoch": 2061} {"train_loss": -23.7760066986084, "global_step": 171105, "epoch": 2061} {"train_loss": -23.212844848632812, "global_step": 171106, "epoch": 2061} {"train_loss": -23.65126609802246, "global_step": 171107, "epoch": 2061} {"train_loss": -23.559051513671875, "global_step": 171108, "epoch": 2061} {"train_loss": -23.649015426635742, "global_step": 171109, "epoch": 2061} {"train_loss": -23.768054962158203, "global_step": 171110, "epoch": 2061} {"train_loss": -23.788503646850586, "global_step": 171111, "epoch": 2061} {"train_loss": -23.40737533569336, "global_step": 171112, "epoch": 2061} {"train_loss": -23.991296768188477, "global_step": 171113, "epoch": 2061} {"train_loss": -23.706052780151367, "global_step": 171114, "epoch": 2061} {"train_loss": -23.55791664123535, "global_step": 171115, "epoch": 2061} {"train_loss": -24.062850952148438, "global_step": 171116, "epoch": 2061} {"train_loss": -23.78702735900879, "global_step": 171117, "epoch": 2061} {"train_loss": -23.68145751953125, "global_step": 171118, "epoch": 2061} {"train_loss": -24.088321685791016, "global_step": 171119, "epoch": 2061} {"train_loss": -23.8426513671875, "global_step": 171120, "epoch": 2061} {"train_loss": -23.728723526000977, "global_step": 171121, "epoch": 2061} {"train_loss": -23.689435958862305, "global_step": 171122, "epoch": 2061} {"train_loss": -23.516992568969727, "global_step": 171123, "epoch": 2061} {"train_loss": -23.74271011352539, "global_step": 171124, "epoch": 2061} {"train_loss": -24.050119400024414, "global_step": 171125, "epoch": 2061} {"train_loss": -24.00996971130371, "global_step": 171126, "epoch": 2061} {"train_loss": -23.795368194580078, "global_step": 171127, "epoch": 2061} {"train_loss": -23.91348648071289, "global_step": 171128, "epoch": 2061} {"train_loss": -23.861684799194336, "global_step": 171129, "epoch": 2061} {"train_loss": -23.951425552368164, "global_step": 171130, "epoch": 2061} {"train_loss": -23.819944381713867, "global_step": 171131, "epoch": 2061} {"train_loss": -24.126222610473633, "global_step": 171132, "epoch": 2061} {"train_loss": -23.92659568786621, "global_step": 171133, "epoch": 2061} {"train_loss": -23.620508193969727, "global_step": 171134, "epoch": 2061} {"train_loss": -23.714323043823242, "global_step": 171135, "epoch": 2061} {"train_loss": -23.514999389648438, "global_step": 171136, "epoch": 2061} {"train_loss": -23.706405639648438, "global_step": 171137, "epoch": 2061} {"train_loss": -23.2756290435791, "global_step": 171138, "epoch": 2061} {"train_loss": -23.726207733154297, "global_step": 171139, "epoch": 2061} {"train_loss": -23.653167724609375, "global_step": 171140, "epoch": 2061} {"train_loss": -23.73134422302246, "global_step": 171141, "epoch": 2061} {"train_loss": -23.916194915771484, "global_step": 171142, "epoch": 2061} {"train_loss": -23.50640869140625, "global_step": 171143, "epoch": 2061} {"train_loss": -23.347885131835938, "global_step": 171144, "epoch": 2061} {"train_loss": -23.653920139174865, "global_step": 171145, "epoch": 2061, "val_loss": 6331997.5} {"train_loss": -23.1258487701416, "global_step": 171146, "epoch": 2062} {"train_loss": -23.18633460998535, "global_step": 171147, "epoch": 2062} {"train_loss": -23.193002700805664, "global_step": 171148, "epoch": 2062} {"train_loss": -23.1085262298584, "global_step": 171149, "epoch": 2062} {"train_loss": -23.23346519470215, "global_step": 171150, "epoch": 2062} {"train_loss": -23.11573600769043, "global_step": 171151, "epoch": 2062} {"train_loss": -22.88502311706543, "global_step": 171152, "epoch": 2062} {"train_loss": -23.383573532104492, "global_step": 171153, "epoch": 2062} {"train_loss": -23.375871658325195, "global_step": 171154, "epoch": 2062} {"train_loss": -23.350528717041016, "global_step": 171155, "epoch": 2062} {"train_loss": -23.57474136352539, "global_step": 171156, "epoch": 2062} {"train_loss": -23.16178321838379, "global_step": 171157, "epoch": 2062} {"train_loss": -23.498687744140625, "global_step": 171158, "epoch": 2062} {"train_loss": -23.52556800842285, "global_step": 171159, "epoch": 2062} {"train_loss": -23.51749610900879, "global_step": 171160, "epoch": 2062} {"train_loss": -23.678014755249023, "global_step": 171161, "epoch": 2062} {"train_loss": -23.94086265563965, "global_step": 171162, "epoch": 2062} {"train_loss": -23.726526260375977, "global_step": 171163, "epoch": 2062} {"train_loss": -23.9750919342041, "global_step": 171164, "epoch": 2062} {"train_loss": -23.57390785217285, "global_step": 171165, "epoch": 2062} {"train_loss": -23.45871925354004, "global_step": 171166, "epoch": 2062} {"train_loss": -23.6204891204834, "global_step": 171167, "epoch": 2062} {"train_loss": -23.842931747436523, "global_step": 171168, "epoch": 2062} {"train_loss": -23.616086959838867, "global_step": 171169, "epoch": 2062} {"train_loss": -23.822799682617188, "global_step": 171170, "epoch": 2062} {"train_loss": -23.946836471557617, "global_step": 171171, "epoch": 2062} {"train_loss": -23.78726577758789, "global_step": 171172, "epoch": 2062} {"train_loss": -24.0045166015625, "global_step": 171173, "epoch": 2062} {"train_loss": -23.989166259765625, "global_step": 171174, "epoch": 2062} {"train_loss": -24.1451358795166, "global_step": 171175, "epoch": 2062} {"train_loss": -23.649150848388672, "global_step": 171176, "epoch": 2062} {"train_loss": -23.672250747680664, "global_step": 171177, "epoch": 2062} {"train_loss": -23.34857749938965, "global_step": 171178, "epoch": 2062} {"train_loss": -23.734045028686523, "global_step": 171179, "epoch": 2062} {"train_loss": -23.7026424407959, "global_step": 171180, "epoch": 2062} {"train_loss": -23.997163772583008, "global_step": 171181, "epoch": 2062} {"train_loss": -23.83819580078125, "global_step": 171182, "epoch": 2062} {"train_loss": -23.493040084838867, "global_step": 171183, "epoch": 2062} {"train_loss": -23.715970993041992, "global_step": 171184, "epoch": 2062} {"train_loss": -23.63851547241211, "global_step": 171185, "epoch": 2062} {"train_loss": -23.625715255737305, "global_step": 171186, "epoch": 2062} {"train_loss": -24.10243797302246, "global_step": 171187, "epoch": 2062} {"train_loss": -23.88578224182129, "global_step": 171188, "epoch": 2062} {"train_loss": -24.112834930419922, "global_step": 171189, "epoch": 2062} {"train_loss": -23.97930908203125, "global_step": 171190, "epoch": 2062} {"train_loss": -23.92865562438965, "global_step": 171191, "epoch": 2062} {"train_loss": -23.821569442749023, "global_step": 171192, "epoch": 2062} {"train_loss": -23.620193481445312, "global_step": 171193, "epoch": 2062} {"train_loss": -23.765872955322266, "global_step": 171194, "epoch": 2062} {"train_loss": -24.123498916625977, "global_step": 171195, "epoch": 2062} {"train_loss": -23.653671264648438, "global_step": 171196, "epoch": 2062} {"train_loss": -23.54751968383789, "global_step": 171197, "epoch": 2062} {"train_loss": -23.337007522583008, "global_step": 171198, "epoch": 2062} {"train_loss": -23.58785057067871, "global_step": 171199, "epoch": 2062} {"train_loss": -23.965478897094727, "global_step": 171200, "epoch": 2062} {"train_loss": -24.022058486938477, "global_step": 171201, "epoch": 2062} {"train_loss": -23.837610244750977, "global_step": 171202, "epoch": 2062} {"train_loss": -23.65303611755371, "global_step": 171203, "epoch": 2062} {"train_loss": -23.935453414916992, "global_step": 171204, "epoch": 2062} {"train_loss": -24.063703536987305, "global_step": 171205, "epoch": 2062} {"train_loss": -23.402950286865234, "global_step": 171206, "epoch": 2062} {"train_loss": -24.2440128326416, "global_step": 171207, "epoch": 2062} {"train_loss": -23.646284103393555, "global_step": 171208, "epoch": 2062} {"train_loss": -23.571149826049805, "global_step": 171209, "epoch": 2062} {"train_loss": -23.71657371520996, "global_step": 171210, "epoch": 2062} {"train_loss": -23.751239776611328, "global_step": 171211, "epoch": 2062} {"train_loss": -24.165130615234375, "global_step": 171212, "epoch": 2062} {"train_loss": -23.945697784423828, "global_step": 171213, "epoch": 2062} {"train_loss": -23.63030433654785, "global_step": 171214, "epoch": 2062} {"train_loss": -23.769845962524414, "global_step": 171215, "epoch": 2062} {"train_loss": -23.66790771484375, "global_step": 171216, "epoch": 2062} {"train_loss": -23.89051628112793, "global_step": 171217, "epoch": 2062} {"train_loss": -23.68686866760254, "global_step": 171218, "epoch": 2062} {"train_loss": -23.617712020874023, "global_step": 171219, "epoch": 2062} {"train_loss": -23.7625732421875, "global_step": 171220, "epoch": 2062} {"train_loss": -23.682628631591797, "global_step": 171221, "epoch": 2062} {"train_loss": -23.48872947692871, "global_step": 171222, "epoch": 2062} {"train_loss": -23.44207191467285, "global_step": 171223, "epoch": 2062} {"train_loss": -23.776952743530273, "global_step": 171224, "epoch": 2062} {"train_loss": -23.54408073425293, "global_step": 171225, "epoch": 2062} {"train_loss": -23.438486099243164, "global_step": 171226, "epoch": 2062} {"train_loss": -23.484893798828125, "global_step": 171227, "epoch": 2062} {"train_loss": -23.65650291902473, "global_step": 171228, "epoch": 2062, "val_loss": 6449261.0} {"train_loss": -23.45488739013672, "global_step": 171229, "epoch": 2063} {"train_loss": -23.222122192382812, "global_step": 171230, "epoch": 2063} {"train_loss": -23.576034545898438, "global_step": 171231, "epoch": 2063} {"train_loss": -23.775192260742188, "global_step": 171232, "epoch": 2063} {"train_loss": -23.209415435791016, "global_step": 171233, "epoch": 2063} {"train_loss": -23.60424041748047, "global_step": 171234, "epoch": 2063} {"train_loss": -23.74103546142578, "global_step": 171235, "epoch": 2063} {"train_loss": -23.721036911010742, "global_step": 171236, "epoch": 2063} {"train_loss": -24.08920669555664, "global_step": 171237, "epoch": 2063} {"train_loss": -23.731407165527344, "global_step": 171238, "epoch": 2063} {"train_loss": -23.65400505065918, "global_step": 171239, "epoch": 2063} {"train_loss": -23.456186294555664, "global_step": 171240, "epoch": 2063} {"train_loss": -23.90985107421875, "global_step": 171241, "epoch": 2063} {"train_loss": -23.848026275634766, "global_step": 171242, "epoch": 2063} {"train_loss": -23.654571533203125, "global_step": 171243, "epoch": 2063} {"train_loss": -23.82968521118164, "global_step": 171244, "epoch": 2063} {"train_loss": -23.960851669311523, "global_step": 171245, "epoch": 2063} {"train_loss": -23.7034969329834, "global_step": 171246, "epoch": 2063} {"train_loss": -23.581716537475586, "global_step": 171247, "epoch": 2063} {"train_loss": -23.568143844604492, "global_step": 171248, "epoch": 2063} {"train_loss": -23.456083297729492, "global_step": 171249, "epoch": 2063} {"train_loss": -23.833066940307617, "global_step": 171250, "epoch": 2063} {"train_loss": -23.481552124023438, "global_step": 171251, "epoch": 2063} {"train_loss": -23.387237548828125, "global_step": 171252, "epoch": 2063} {"train_loss": -23.81162452697754, "global_step": 171253, "epoch": 2063} {"train_loss": -23.600095748901367, "global_step": 171254, "epoch": 2063} {"train_loss": -23.586898803710938, "global_step": 171255, "epoch": 2063} {"train_loss": -23.282949447631836, "global_step": 171256, "epoch": 2063} {"train_loss": -24.022207260131836, "global_step": 171257, "epoch": 2063} {"train_loss": -23.717567443847656, "global_step": 171258, "epoch": 2063} {"train_loss": -23.71413803100586, "global_step": 171259, "epoch": 2063} {"train_loss": -24.04420280456543, "global_step": 171260, "epoch": 2063} {"train_loss": -23.531408309936523, "global_step": 171261, "epoch": 2063} {"train_loss": -23.654041290283203, "global_step": 171262, "epoch": 2063} {"train_loss": -23.903675079345703, "global_step": 171263, "epoch": 2063} {"train_loss": -23.360916137695312, "global_step": 171264, "epoch": 2063} {"train_loss": -23.655813217163086, "global_step": 171265, "epoch": 2063} {"train_loss": -23.639102935791016, "global_step": 171266, "epoch": 2063} {"train_loss": -23.51314353942871, "global_step": 171267, "epoch": 2063} {"train_loss": -24.074493408203125, "global_step": 171268, "epoch": 2063} {"train_loss": -23.80440330505371, "global_step": 171269, "epoch": 2063} {"train_loss": -23.934001922607422, "global_step": 171270, "epoch": 2063} {"train_loss": -23.575834274291992, "global_step": 171271, "epoch": 2063} {"train_loss": -24.243568420410156, "global_step": 171272, "epoch": 2063} {"train_loss": -23.371170043945312, "global_step": 171273, "epoch": 2063} {"train_loss": -23.9438533782959, "global_step": 171274, "epoch": 2063} {"train_loss": -23.704336166381836, "global_step": 171275, "epoch": 2063} {"train_loss": -23.7042236328125, "global_step": 171276, "epoch": 2063} {"train_loss": -23.331674575805664, "global_step": 171277, "epoch": 2063} {"train_loss": -23.35721778869629, "global_step": 171278, "epoch": 2063} {"train_loss": -23.504785537719727, "global_step": 171279, "epoch": 2063} {"train_loss": -23.883975982666016, "global_step": 171280, "epoch": 2063} {"train_loss": -23.93195915222168, "global_step": 171281, "epoch": 2063} {"train_loss": -23.54491424560547, "global_step": 171282, "epoch": 2063} {"train_loss": -23.970335006713867, "global_step": 171283, "epoch": 2063} {"train_loss": -23.79157066345215, "global_step": 171284, "epoch": 2063} {"train_loss": -23.97244644165039, "global_step": 171285, "epoch": 2063} {"train_loss": -23.978567123413086, "global_step": 171286, "epoch": 2063} {"train_loss": -23.851903915405273, "global_step": 171287, "epoch": 2063} {"train_loss": -23.671274185180664, "global_step": 171288, "epoch": 2063} {"train_loss": -23.81281089782715, "global_step": 171289, "epoch": 2063} {"train_loss": -23.850265502929688, "global_step": 171290, "epoch": 2063} {"train_loss": -23.894479751586914, "global_step": 171291, "epoch": 2063} {"train_loss": -23.98038673400879, "global_step": 171292, "epoch": 2063} {"train_loss": -23.881755828857422, "global_step": 171293, "epoch": 2063} {"train_loss": -24.069255828857422, "global_step": 171294, "epoch": 2063} {"train_loss": -23.958454132080078, "global_step": 171295, "epoch": 2063} {"train_loss": -23.995752334594727, "global_step": 171296, "epoch": 2063} {"train_loss": -23.932086944580078, "global_step": 171297, "epoch": 2063} {"train_loss": -23.909557342529297, "global_step": 171298, "epoch": 2063} {"train_loss": -23.778675079345703, "global_step": 171299, "epoch": 2063} {"train_loss": -23.719093322753906, "global_step": 171300, "epoch": 2063} {"train_loss": -24.05905532836914, "global_step": 171301, "epoch": 2063} {"train_loss": -23.089353561401367, "global_step": 171302, "epoch": 2063} {"train_loss": -23.384809494018555, "global_step": 171303, "epoch": 2063} {"train_loss": -23.26519203186035, "global_step": 171304, "epoch": 2063} {"train_loss": -23.05857276916504, "global_step": 171305, "epoch": 2063} {"train_loss": -23.692163467407227, "global_step": 171306, "epoch": 2063} {"train_loss": -23.942716598510742, "global_step": 171307, "epoch": 2063} {"train_loss": -23.25978660583496, "global_step": 171308, "epoch": 2063} {"train_loss": -23.52288818359375, "global_step": 171309, "epoch": 2063} {"train_loss": -23.924240112304688, "global_step": 171310, "epoch": 2063} {"train_loss": -23.69333405092538, "global_step": 171311, "epoch": 2063, "val_loss": 6394353.0} {"train_loss": -23.542043685913086, "global_step": 171312, "epoch": 2064} {"train_loss": -23.480710983276367, "global_step": 171313, "epoch": 2064} {"train_loss": -23.54971694946289, "global_step": 171314, "epoch": 2064} {"train_loss": -22.777578353881836, "global_step": 171315, "epoch": 2064} {"train_loss": -22.81749153137207, "global_step": 171316, "epoch": 2064} {"train_loss": -22.44361686706543, "global_step": 171317, "epoch": 2064} {"train_loss": -23.46368408203125, "global_step": 171318, "epoch": 2064} {"train_loss": -22.20163917541504, "global_step": 171319, "epoch": 2064} {"train_loss": -22.740856170654297, "global_step": 171320, "epoch": 2064} {"train_loss": -23.19243812561035, "global_step": 171321, "epoch": 2064} {"train_loss": -22.65814781188965, "global_step": 171322, "epoch": 2064} {"train_loss": -23.037765502929688, "global_step": 171323, "epoch": 2064} {"train_loss": -23.240015029907227, "global_step": 171324, "epoch": 2064} {"train_loss": -23.304655075073242, "global_step": 171325, "epoch": 2064} {"train_loss": -23.24340057373047, "global_step": 171326, "epoch": 2064} {"train_loss": -23.15287971496582, "global_step": 171327, "epoch": 2064} {"train_loss": -23.096220016479492, "global_step": 171328, "epoch": 2064} {"train_loss": -22.89581871032715, "global_step": 171329, "epoch": 2064} {"train_loss": -23.55982208251953, "global_step": 171330, "epoch": 2064} {"train_loss": -23.104772567749023, "global_step": 171331, "epoch": 2064} {"train_loss": -23.216054916381836, "global_step": 171332, "epoch": 2064} {"train_loss": -23.3605899810791, "global_step": 171333, "epoch": 2064} {"train_loss": -23.335657119750977, "global_step": 171334, "epoch": 2064} {"train_loss": -23.13968849182129, "global_step": 171335, "epoch": 2064} {"train_loss": -23.285776138305664, "global_step": 171336, "epoch": 2064} {"train_loss": -23.141080856323242, "global_step": 171337, "epoch": 2064} {"train_loss": -23.41414451599121, "global_step": 171338, "epoch": 2064} {"train_loss": -23.602245330810547, "global_step": 171339, "epoch": 2064} {"train_loss": -23.667789459228516, "global_step": 171340, "epoch": 2064} {"train_loss": -23.7965030670166, "global_step": 171341, "epoch": 2064} {"train_loss": -23.663772583007812, "global_step": 171342, "epoch": 2064} {"train_loss": -23.4434871673584, "global_step": 171343, "epoch": 2064} {"train_loss": -23.504362106323242, "global_step": 171344, "epoch": 2064} {"train_loss": -23.80847930908203, "global_step": 171345, "epoch": 2064} {"train_loss": -23.810089111328125, "global_step": 171346, "epoch": 2064} {"train_loss": -23.4989013671875, "global_step": 171347, "epoch": 2064} {"train_loss": -23.612953186035156, "global_step": 171348, "epoch": 2064} {"train_loss": -23.683637619018555, "global_step": 171349, "epoch": 2064} {"train_loss": -24.08228874206543, "global_step": 171350, "epoch": 2064} {"train_loss": -23.82178497314453, "global_step": 171351, "epoch": 2064} {"train_loss": -23.864486694335938, "global_step": 171352, "epoch": 2064} {"train_loss": -23.872610092163086, "global_step": 171353, "epoch": 2064} {"train_loss": -23.97894859313965, "global_step": 171354, "epoch": 2064} {"train_loss": -23.892194747924805, "global_step": 171355, "epoch": 2064} {"train_loss": -23.339887619018555, "global_step": 171356, "epoch": 2064} {"train_loss": -23.72383689880371, "global_step": 171357, "epoch": 2064} {"train_loss": -23.52923011779785, "global_step": 171358, "epoch": 2064} {"train_loss": -23.63608169555664, "global_step": 171359, "epoch": 2064} {"train_loss": -23.693634033203125, "global_step": 171360, "epoch": 2064} {"train_loss": -23.56365966796875, "global_step": 171361, "epoch": 2064} {"train_loss": -24.015228271484375, "global_step": 171362, "epoch": 2064} {"train_loss": -23.564167022705078, "global_step": 171363, "epoch": 2064} {"train_loss": -23.91317367553711, "global_step": 171364, "epoch": 2064} {"train_loss": -23.695749282836914, "global_step": 171365, "epoch": 2064} {"train_loss": -23.695756912231445, "global_step": 171366, "epoch": 2064} {"train_loss": -23.426694869995117, "global_step": 171367, "epoch": 2064} {"train_loss": -24.006315231323242, "global_step": 171368, "epoch": 2064} {"train_loss": -23.860570907592773, "global_step": 171369, "epoch": 2064} {"train_loss": -23.86140251159668, "global_step": 171370, "epoch": 2064} {"train_loss": -23.733434677124023, "global_step": 171371, "epoch": 2064} {"train_loss": -23.672739028930664, "global_step": 171372, "epoch": 2064} {"train_loss": -23.589599609375, "global_step": 171373, "epoch": 2064} {"train_loss": -23.45732879638672, "global_step": 171374, "epoch": 2064} {"train_loss": -23.905405044555664, "global_step": 171375, "epoch": 2064} {"train_loss": -23.458938598632812, "global_step": 171376, "epoch": 2064} {"train_loss": -23.503217697143555, "global_step": 171377, "epoch": 2064} {"train_loss": -23.73697853088379, "global_step": 171378, "epoch": 2064} {"train_loss": -23.6821231842041, "global_step": 171379, "epoch": 2064} {"train_loss": -23.602890014648438, "global_step": 171380, "epoch": 2064} {"train_loss": -23.562023162841797, "global_step": 171381, "epoch": 2064} {"train_loss": -23.999528884887695, "global_step": 171382, "epoch": 2064} {"train_loss": -23.652475357055664, "global_step": 171383, "epoch": 2064} {"train_loss": -23.27853775024414, "global_step": 171384, "epoch": 2064} {"train_loss": -23.72981071472168, "global_step": 171385, "epoch": 2064} {"train_loss": -23.42946434020996, "global_step": 171386, "epoch": 2064} {"train_loss": -23.39420509338379, "global_step": 171387, "epoch": 2064} {"train_loss": -23.089841842651367, "global_step": 171388, "epoch": 2064} {"train_loss": -23.794931411743164, "global_step": 171389, "epoch": 2064} {"train_loss": -23.702390670776367, "global_step": 171390, "epoch": 2064} {"train_loss": -23.61354637145996, "global_step": 171391, "epoch": 2064} {"train_loss": -23.611740112304688, "global_step": 171392, "epoch": 2064} {"train_loss": -23.814970016479492, "global_step": 171393, "epoch": 2064} {"train_loss": -23.48045356015125, "global_step": 171394, "epoch": 2064, "val_loss": 6386344.0} {"train_loss": -23.976398468017578, "global_step": 171395, "epoch": 2065} {"train_loss": -23.517593383789062, "global_step": 171396, "epoch": 2065} {"train_loss": -23.655582427978516, "global_step": 171397, "epoch": 2065} {"train_loss": -23.6854305267334, "global_step": 171398, "epoch": 2065} {"train_loss": -23.387537002563477, "global_step": 171399, "epoch": 2065} {"train_loss": -23.279834747314453, "global_step": 171400, "epoch": 2065} {"train_loss": -23.50295066833496, "global_step": 171401, "epoch": 2065} {"train_loss": -23.781986236572266, "global_step": 171402, "epoch": 2065} {"train_loss": -23.480037689208984, "global_step": 171403, "epoch": 2065} {"train_loss": -23.728803634643555, "global_step": 171404, "epoch": 2065} {"train_loss": -24.12550163269043, "global_step": 171405, "epoch": 2065} {"train_loss": -23.569997787475586, "global_step": 171406, "epoch": 2065} {"train_loss": -23.807064056396484, "global_step": 171407, "epoch": 2065} {"train_loss": -23.68953514099121, "global_step": 171408, "epoch": 2065} {"train_loss": -24.01934242248535, "global_step": 171409, "epoch": 2065} {"train_loss": -23.79791259765625, "global_step": 171410, "epoch": 2065} {"train_loss": -23.750308990478516, "global_step": 171411, "epoch": 2065} {"train_loss": -23.663087844848633, "global_step": 171412, "epoch": 2065} {"train_loss": -23.771329879760742, "global_step": 171413, "epoch": 2065} {"train_loss": -23.77607536315918, "global_step": 171414, "epoch": 2065} {"train_loss": -23.758438110351562, "global_step": 171415, "epoch": 2065} {"train_loss": -23.740453720092773, "global_step": 171416, "epoch": 2065} {"train_loss": -23.84654998779297, "global_step": 171417, "epoch": 2065} {"train_loss": -23.64008140563965, "global_step": 171418, "epoch": 2065} {"train_loss": -23.683759689331055, "global_step": 171419, "epoch": 2065} {"train_loss": -23.911231994628906, "global_step": 171420, "epoch": 2065} {"train_loss": -23.558603286743164, "global_step": 171421, "epoch": 2065} {"train_loss": -23.798633575439453, "global_step": 171422, "epoch": 2065} {"train_loss": -23.766836166381836, "global_step": 171423, "epoch": 2065} {"train_loss": -23.674352645874023, "global_step": 171424, "epoch": 2065} {"train_loss": -23.54604148864746, "global_step": 171425, "epoch": 2065} {"train_loss": -23.406469345092773, "global_step": 171426, "epoch": 2065} {"train_loss": -23.97103500366211, "global_step": 171427, "epoch": 2065} {"train_loss": -23.536760330200195, "global_step": 171428, "epoch": 2065} {"train_loss": -23.776037216186523, "global_step": 171429, "epoch": 2065} {"train_loss": -23.734121322631836, "global_step": 171430, "epoch": 2065} {"train_loss": -23.543216705322266, "global_step": 171431, "epoch": 2065} {"train_loss": -23.841520309448242, "global_step": 171432, "epoch": 2065} {"train_loss": -23.58437728881836, "global_step": 171433, "epoch": 2065} {"train_loss": -23.879478454589844, "global_step": 171434, "epoch": 2065} {"train_loss": -23.793777465820312, "global_step": 171435, "epoch": 2065} {"train_loss": -23.628955841064453, "global_step": 171436, "epoch": 2065} {"train_loss": -23.999235153198242, "global_step": 171437, "epoch": 2065} {"train_loss": -24.104511260986328, "global_step": 171438, "epoch": 2065} {"train_loss": -23.80621910095215, "global_step": 171439, "epoch": 2065} {"train_loss": -23.7203311920166, "global_step": 171440, "epoch": 2065} {"train_loss": -23.88921546936035, "global_step": 171441, "epoch": 2065} {"train_loss": -23.7506160736084, "global_step": 171442, "epoch": 2065} {"train_loss": -23.879108428955078, "global_step": 171443, "epoch": 2065} {"train_loss": -23.919925689697266, "global_step": 171444, "epoch": 2065} {"train_loss": -23.678943634033203, "global_step": 171445, "epoch": 2065} {"train_loss": -24.141691207885742, "global_step": 171446, "epoch": 2065} {"train_loss": -24.02968978881836, "global_step": 171447, "epoch": 2065} {"train_loss": -24.123512268066406, "global_step": 171448, "epoch": 2065} {"train_loss": -23.905834197998047, "global_step": 171449, "epoch": 2065} {"train_loss": -24.031715393066406, "global_step": 171450, "epoch": 2065} {"train_loss": -23.30942726135254, "global_step": 171451, "epoch": 2065} {"train_loss": -23.852508544921875, "global_step": 171452, "epoch": 2065} {"train_loss": -23.951637268066406, "global_step": 171453, "epoch": 2065} {"train_loss": -23.546613693237305, "global_step": 171454, "epoch": 2065} {"train_loss": -23.754629135131836, "global_step": 171455, "epoch": 2065} {"train_loss": -23.29247283935547, "global_step": 171456, "epoch": 2065} {"train_loss": -23.25604820251465, "global_step": 171457, "epoch": 2065} {"train_loss": -23.193233489990234, "global_step": 171458, "epoch": 2065} {"train_loss": -23.72545051574707, "global_step": 171459, "epoch": 2065} {"train_loss": -23.32903480529785, "global_step": 171460, "epoch": 2065} {"train_loss": -23.834226608276367, "global_step": 171461, "epoch": 2065} {"train_loss": -23.532394409179688, "global_step": 171462, "epoch": 2065} {"train_loss": -23.056808471679688, "global_step": 171463, "epoch": 2065} {"train_loss": -23.432859420776367, "global_step": 171464, "epoch": 2065} {"train_loss": -23.511587142944336, "global_step": 171465, "epoch": 2065} {"train_loss": -23.40155029296875, "global_step": 171466, "epoch": 2065} {"train_loss": -23.505643844604492, "global_step": 171467, "epoch": 2065} {"train_loss": -23.795764923095703, "global_step": 171468, "epoch": 2065} {"train_loss": -23.461729049682617, "global_step": 171469, "epoch": 2065} {"train_loss": -23.878068923950195, "global_step": 171470, "epoch": 2065} {"train_loss": -23.597129821777344, "global_step": 171471, "epoch": 2065} {"train_loss": -23.746126174926758, "global_step": 171472, "epoch": 2065} {"train_loss": -23.850988388061523, "global_step": 171473, "epoch": 2065} {"train_loss": -23.430007934570312, "global_step": 171474, "epoch": 2065} {"train_loss": -23.822040557861328, "global_step": 171475, "epoch": 2065} {"train_loss": -23.374738693237305, "global_step": 171476, "epoch": 2065} {"train_loss": -23.69493505179164, "global_step": 171477, "epoch": 2065, "val_loss": 6348040.0} {"train_loss": -22.87738609313965, "global_step": 171478, "epoch": 2066} {"train_loss": -23.226003646850586, "global_step": 171479, "epoch": 2066} {"train_loss": -23.313631057739258, "global_step": 171480, "epoch": 2066} {"train_loss": -22.99338150024414, "global_step": 171481, "epoch": 2066} {"train_loss": -23.001972198486328, "global_step": 171482, "epoch": 2066} {"train_loss": -22.978696823120117, "global_step": 171483, "epoch": 2066} {"train_loss": -22.83139991760254, "global_step": 171484, "epoch": 2066} {"train_loss": -23.235435485839844, "global_step": 171485, "epoch": 2066} {"train_loss": -23.4611873626709, "global_step": 171486, "epoch": 2066} {"train_loss": -23.240772247314453, "global_step": 171487, "epoch": 2066} {"train_loss": -23.50356101989746, "global_step": 171488, "epoch": 2066} {"train_loss": -23.323740005493164, "global_step": 171489, "epoch": 2066} {"train_loss": -23.42641258239746, "global_step": 171490, "epoch": 2066} {"train_loss": -23.709089279174805, "global_step": 171491, "epoch": 2066} {"train_loss": -23.3739013671875, "global_step": 171492, "epoch": 2066} {"train_loss": -23.162939071655273, "global_step": 171493, "epoch": 2066} {"train_loss": -23.73583984375, "global_step": 171494, "epoch": 2066} {"train_loss": -23.586631774902344, "global_step": 171495, "epoch": 2066} {"train_loss": -23.357343673706055, "global_step": 171496, "epoch": 2066} {"train_loss": -23.546844482421875, "global_step": 171497, "epoch": 2066} {"train_loss": -23.592466354370117, "global_step": 171498, "epoch": 2066} {"train_loss": -23.45850944519043, "global_step": 171499, "epoch": 2066} {"train_loss": -23.515207290649414, "global_step": 171500, "epoch": 2066} {"train_loss": -23.670751571655273, "global_step": 171501, "epoch": 2066} {"train_loss": -23.713720321655273, "global_step": 171502, "epoch": 2066} {"train_loss": -23.869253158569336, "global_step": 171503, "epoch": 2066} {"train_loss": -23.499866485595703, "global_step": 171504, "epoch": 2066} {"train_loss": -23.774845123291016, "global_step": 171505, "epoch": 2066} {"train_loss": -23.913814544677734, "global_step": 171506, "epoch": 2066} {"train_loss": -23.9234619140625, "global_step": 171507, "epoch": 2066} {"train_loss": -23.583965301513672, "global_step": 171508, "epoch": 2066} {"train_loss": -23.69624137878418, "global_step": 171509, "epoch": 2066} {"train_loss": -23.7105655670166, "global_step": 171510, "epoch": 2066} {"train_loss": -23.818862915039062, "global_step": 171511, "epoch": 2066} {"train_loss": -23.926910400390625, "global_step": 171512, "epoch": 2066} {"train_loss": -23.53070640563965, "global_step": 171513, "epoch": 2066} {"train_loss": -24.042028427124023, "global_step": 171514, "epoch": 2066} {"train_loss": -23.991601943969727, "global_step": 171515, "epoch": 2066} {"train_loss": -23.843778610229492, "global_step": 171516, "epoch": 2066} {"train_loss": -23.659832000732422, "global_step": 171517, "epoch": 2066} {"train_loss": -23.965463638305664, "global_step": 171518, "epoch": 2066} {"train_loss": -23.42945671081543, "global_step": 171519, "epoch": 2066} {"train_loss": -23.81908416748047, "global_step": 171520, "epoch": 2066} {"train_loss": -24.00758171081543, "global_step": 171521, "epoch": 2066} {"train_loss": -24.01954460144043, "global_step": 171522, "epoch": 2066} {"train_loss": -23.866252899169922, "global_step": 171523, "epoch": 2066} {"train_loss": -23.701629638671875, "global_step": 171524, "epoch": 2066} {"train_loss": -23.909690856933594, "global_step": 171525, "epoch": 2066} {"train_loss": -23.9529972076416, "global_step": 171526, "epoch": 2066} {"train_loss": -23.945384979248047, "global_step": 171527, "epoch": 2066} {"train_loss": -23.717395782470703, "global_step": 171528, "epoch": 2066} {"train_loss": -23.64381217956543, "global_step": 171529, "epoch": 2066} {"train_loss": -23.668046951293945, "global_step": 171530, "epoch": 2066} {"train_loss": -23.63236427307129, "global_step": 171531, "epoch": 2066} {"train_loss": -23.790693283081055, "global_step": 171532, "epoch": 2066} {"train_loss": -23.919946670532227, "global_step": 171533, "epoch": 2066} {"train_loss": -23.353769302368164, "global_step": 171534, "epoch": 2066} {"train_loss": -24.007068634033203, "global_step": 171535, "epoch": 2066} {"train_loss": -23.914600372314453, "global_step": 171536, "epoch": 2066} {"train_loss": -23.82083511352539, "global_step": 171537, "epoch": 2066} {"train_loss": -23.347970962524414, "global_step": 171538, "epoch": 2066} {"train_loss": -23.743722915649414, "global_step": 171539, "epoch": 2066} {"train_loss": -23.80629539489746, "global_step": 171540, "epoch": 2066} {"train_loss": -23.92441177368164, "global_step": 171541, "epoch": 2066} {"train_loss": -23.715362548828125, "global_step": 171542, "epoch": 2066} {"train_loss": -23.971635818481445, "global_step": 171543, "epoch": 2066} {"train_loss": -24.01923942565918, "global_step": 171544, "epoch": 2066} {"train_loss": -23.50069236755371, "global_step": 171545, "epoch": 2066} {"train_loss": -23.444366455078125, "global_step": 171546, "epoch": 2066} {"train_loss": -23.538145065307617, "global_step": 171547, "epoch": 2066} {"train_loss": -23.947660446166992, "global_step": 171548, "epoch": 2066} {"train_loss": -23.509471893310547, "global_step": 171549, "epoch": 2066} {"train_loss": -24.01277732849121, "global_step": 171550, "epoch": 2066} {"train_loss": -24.024181365966797, "global_step": 171551, "epoch": 2066} {"train_loss": -23.367109298706055, "global_step": 171552, "epoch": 2066} {"train_loss": -23.49930763244629, "global_step": 171553, "epoch": 2066} {"train_loss": -23.317520141601562, "global_step": 171554, "epoch": 2066} {"train_loss": -23.856576919555664, "global_step": 171555, "epoch": 2066} {"train_loss": -23.937177658081055, "global_step": 171556, "epoch": 2066} {"train_loss": -23.74983024597168, "global_step": 171557, "epoch": 2066} {"train_loss": -24.06744956970215, "global_step": 171558, "epoch": 2066} {"train_loss": -23.99488639831543, "global_step": 171559, "epoch": 2066} {"train_loss": -23.66052319630083, "global_step": 171560, "epoch": 2066, "val_loss": 6385191.5} {"train_loss": -23.1065731048584, "global_step": 171561, "epoch": 2067} {"train_loss": -22.634000778198242, "global_step": 171562, "epoch": 2067} {"train_loss": -22.91086769104004, "global_step": 171563, "epoch": 2067} {"train_loss": -22.742141723632812, "global_step": 171564, "epoch": 2067} {"train_loss": -23.08930015563965, "global_step": 171565, "epoch": 2067} {"train_loss": -23.34798240661621, "global_step": 171566, "epoch": 2067} {"train_loss": -23.14871597290039, "global_step": 171567, "epoch": 2067} {"train_loss": -23.34917449951172, "global_step": 171568, "epoch": 2067} {"train_loss": -23.19272804260254, "global_step": 171569, "epoch": 2067} {"train_loss": -23.455102920532227, "global_step": 171570, "epoch": 2067} {"train_loss": -23.377185821533203, "global_step": 171571, "epoch": 2067} {"train_loss": -23.437227249145508, "global_step": 171572, "epoch": 2067} {"train_loss": -23.5091495513916, "global_step": 171573, "epoch": 2067} {"train_loss": -23.5751895904541, "global_step": 171574, "epoch": 2067} {"train_loss": -23.58104705810547, "global_step": 171575, "epoch": 2067} {"train_loss": -23.36553382873535, "global_step": 171576, "epoch": 2067} {"train_loss": -23.829557418823242, "global_step": 171577, "epoch": 2067} {"train_loss": -23.74860191345215, "global_step": 171578, "epoch": 2067} {"train_loss": -23.62589454650879, "global_step": 171579, "epoch": 2067} {"train_loss": -23.665660858154297, "global_step": 171580, "epoch": 2067} {"train_loss": -23.57427978515625, "global_step": 171581, "epoch": 2067} {"train_loss": -23.98539924621582, "global_step": 171582, "epoch": 2067} {"train_loss": -23.691665649414062, "global_step": 171583, "epoch": 2067} {"train_loss": -23.80109214782715, "global_step": 171584, "epoch": 2067} {"train_loss": -23.92824363708496, "global_step": 171585, "epoch": 2067} {"train_loss": -23.697235107421875, "global_step": 171586, "epoch": 2067} {"train_loss": -23.875776290893555, "global_step": 171587, "epoch": 2067} {"train_loss": -23.69757843017578, "global_step": 171588, "epoch": 2067} {"train_loss": -23.623899459838867, "global_step": 171589, "epoch": 2067} {"train_loss": -23.66395378112793, "global_step": 171590, "epoch": 2067} {"train_loss": -23.982629776000977, "global_step": 171591, "epoch": 2067} {"train_loss": -23.862457275390625, "global_step": 171592, "epoch": 2067} {"train_loss": -23.711551666259766, "global_step": 171593, "epoch": 2067} {"train_loss": -23.628145217895508, "global_step": 171594, "epoch": 2067} {"train_loss": -23.40365219116211, "global_step": 171595, "epoch": 2067} {"train_loss": -23.77801513671875, "global_step": 171596, "epoch": 2067} {"train_loss": -23.783164978027344, "global_step": 171597, "epoch": 2067} {"train_loss": -23.852445602416992, "global_step": 171598, "epoch": 2067} {"train_loss": -23.665542602539062, "global_step": 171599, "epoch": 2067} {"train_loss": -23.611757278442383, "global_step": 171600, "epoch": 2067} {"train_loss": -23.511516571044922, "global_step": 171601, "epoch": 2067} {"train_loss": -23.827863693237305, "global_step": 171602, "epoch": 2067} {"train_loss": -23.806371688842773, "global_step": 171603, "epoch": 2067} {"train_loss": -23.55469512939453, "global_step": 171604, "epoch": 2067} {"train_loss": -23.637662887573242, "global_step": 171605, "epoch": 2067} {"train_loss": -23.66498374938965, "global_step": 171606, "epoch": 2067} {"train_loss": -23.67522621154785, "global_step": 171607, "epoch": 2067} {"train_loss": -23.94626808166504, "global_step": 171608, "epoch": 2067} {"train_loss": -23.963144302368164, "global_step": 171609, "epoch": 2067} {"train_loss": -23.78152084350586, "global_step": 171610, "epoch": 2067} {"train_loss": -23.702880859375, "global_step": 171611, "epoch": 2067} {"train_loss": -23.691221237182617, "global_step": 171612, "epoch": 2067} {"train_loss": -23.95826530456543, "global_step": 171613, "epoch": 2067} {"train_loss": -23.76603126525879, "global_step": 171614, "epoch": 2067} {"train_loss": -23.84538459777832, "global_step": 171615, "epoch": 2067} {"train_loss": -23.7274169921875, "global_step": 171616, "epoch": 2067} {"train_loss": -23.806154251098633, "global_step": 171617, "epoch": 2067} {"train_loss": -23.798551559448242, "global_step": 171618, "epoch": 2067} {"train_loss": -23.652587890625, "global_step": 171619, "epoch": 2067} {"train_loss": -23.625686645507812, "global_step": 171620, "epoch": 2067} {"train_loss": -23.654069900512695, "global_step": 171621, "epoch": 2067} {"train_loss": -23.567052841186523, "global_step": 171622, "epoch": 2067} {"train_loss": -24.116947174072266, "global_step": 171623, "epoch": 2067} {"train_loss": -23.228315353393555, "global_step": 171624, "epoch": 2067} {"train_loss": -23.390050888061523, "global_step": 171625, "epoch": 2067} {"train_loss": -23.93757438659668, "global_step": 171626, "epoch": 2067} {"train_loss": -23.369924545288086, "global_step": 171627, "epoch": 2067} {"train_loss": -23.312179565429688, "global_step": 171628, "epoch": 2067} {"train_loss": -23.535486221313477, "global_step": 171629, "epoch": 2067} {"train_loss": -23.938892364501953, "global_step": 171630, "epoch": 2067} {"train_loss": -23.512296676635742, "global_step": 171631, "epoch": 2067} {"train_loss": -23.880786895751953, "global_step": 171632, "epoch": 2067} {"train_loss": -23.8732852935791, "global_step": 171633, "epoch": 2067} {"train_loss": -23.62324333190918, "global_step": 171634, "epoch": 2067} {"train_loss": -23.912843704223633, "global_step": 171635, "epoch": 2067} {"train_loss": -23.97129249572754, "global_step": 171636, "epoch": 2067} {"train_loss": -23.781030654907227, "global_step": 171637, "epoch": 2067} {"train_loss": -23.541534423828125, "global_step": 171638, "epoch": 2067} {"train_loss": -23.680681228637695, "global_step": 171639, "epoch": 2067} {"train_loss": -23.629703521728516, "global_step": 171640, "epoch": 2067} {"train_loss": -23.93116569519043, "global_step": 171641, "epoch": 2067} {"train_loss": -23.726097106933594, "global_step": 171642, "epoch": 2067} {"train_loss": -23.62296187159527, "global_step": 171643, "epoch": 2067, "val_loss": 6477194.0} {"train_loss": -23.47735023498535, "global_step": 171644, "epoch": 2068} {"train_loss": -23.691343307495117, "global_step": 171645, "epoch": 2068} {"train_loss": -23.6071834564209, "global_step": 171646, "epoch": 2068} {"train_loss": -23.35465431213379, "global_step": 171647, "epoch": 2068} {"train_loss": -23.399124145507812, "global_step": 171648, "epoch": 2068} {"train_loss": -23.30133628845215, "global_step": 171649, "epoch": 2068} {"train_loss": -23.22432518005371, "global_step": 171650, "epoch": 2068} {"train_loss": -23.134870529174805, "global_step": 171651, "epoch": 2068} {"train_loss": -23.597238540649414, "global_step": 171652, "epoch": 2068} {"train_loss": -23.58209991455078, "global_step": 171653, "epoch": 2068} {"train_loss": -23.19358253479004, "global_step": 171654, "epoch": 2068} {"train_loss": -23.47138214111328, "global_step": 171655, "epoch": 2068} {"train_loss": -23.68947982788086, "global_step": 171656, "epoch": 2068} {"train_loss": -23.165550231933594, "global_step": 171657, "epoch": 2068} {"train_loss": -23.40420913696289, "global_step": 171658, "epoch": 2068} {"train_loss": -23.912588119506836, "global_step": 171659, "epoch": 2068} {"train_loss": -23.54349136352539, "global_step": 171660, "epoch": 2068} {"train_loss": -24.026573181152344, "global_step": 171661, "epoch": 2068} {"train_loss": -23.58742332458496, "global_step": 171662, "epoch": 2068} {"train_loss": -23.842370986938477, "global_step": 171663, "epoch": 2068} {"train_loss": -23.659067153930664, "global_step": 171664, "epoch": 2068} {"train_loss": -23.609617233276367, "global_step": 171665, "epoch": 2068} {"train_loss": -23.7811279296875, "global_step": 171666, "epoch": 2068} {"train_loss": -24.085811614990234, "global_step": 171667, "epoch": 2068} {"train_loss": -23.929471969604492, "global_step": 171668, "epoch": 2068} {"train_loss": -23.67154312133789, "global_step": 171669, "epoch": 2068} {"train_loss": -23.440500259399414, "global_step": 171670, "epoch": 2068} {"train_loss": -23.986419677734375, "global_step": 171671, "epoch": 2068} {"train_loss": -23.905784606933594, "global_step": 171672, "epoch": 2068} {"train_loss": -23.608633041381836, "global_step": 171673, "epoch": 2068} {"train_loss": -23.803695678710938, "global_step": 171674, "epoch": 2068} {"train_loss": -23.82929801940918, "global_step": 171675, "epoch": 2068} {"train_loss": -23.466787338256836, "global_step": 171676, "epoch": 2068} {"train_loss": -23.75830078125, "global_step": 171677, "epoch": 2068} {"train_loss": -23.828907012939453, "global_step": 171678, "epoch": 2068} {"train_loss": -23.796031951904297, "global_step": 171679, "epoch": 2068} {"train_loss": -24.025419235229492, "global_step": 171680, "epoch": 2068} {"train_loss": -23.375370025634766, "global_step": 171681, "epoch": 2068} {"train_loss": -23.505512237548828, "global_step": 171682, "epoch": 2068} {"train_loss": -23.4732666015625, "global_step": 171683, "epoch": 2068} {"train_loss": -23.82767105102539, "global_step": 171684, "epoch": 2068} {"train_loss": -23.89138412475586, "global_step": 171685, "epoch": 2068} {"train_loss": -24.155010223388672, "global_step": 171686, "epoch": 2068} {"train_loss": -23.561307907104492, "global_step": 171687, "epoch": 2068} {"train_loss": -23.434112548828125, "global_step": 171688, "epoch": 2068} {"train_loss": -23.720901489257812, "global_step": 171689, "epoch": 2068} {"train_loss": -24.0484619140625, "global_step": 171690, "epoch": 2068} {"train_loss": -23.633211135864258, "global_step": 171691, "epoch": 2068} {"train_loss": -23.804777145385742, "global_step": 171692, "epoch": 2068} {"train_loss": -23.6447811126709, "global_step": 171693, "epoch": 2068} {"train_loss": -23.866321563720703, "global_step": 171694, "epoch": 2068} {"train_loss": -23.853368759155273, "global_step": 171695, "epoch": 2068} {"train_loss": -24.137771606445312, "global_step": 171696, "epoch": 2068} {"train_loss": -23.577329635620117, "global_step": 171697, "epoch": 2068} {"train_loss": -23.716421127319336, "global_step": 171698, "epoch": 2068} {"train_loss": -23.849767684936523, "global_step": 171699, "epoch": 2068} {"train_loss": -23.940881729125977, "global_step": 171700, "epoch": 2068} {"train_loss": -23.863155364990234, "global_step": 171701, "epoch": 2068} {"train_loss": -24.003082275390625, "global_step": 171702, "epoch": 2068} {"train_loss": -24.00147247314453, "global_step": 171703, "epoch": 2068} {"train_loss": -23.561201095581055, "global_step": 171704, "epoch": 2068} {"train_loss": -23.61383056640625, "global_step": 171705, "epoch": 2068} {"train_loss": -23.53567886352539, "global_step": 171706, "epoch": 2068} {"train_loss": -23.579147338867188, "global_step": 171707, "epoch": 2068} {"train_loss": -23.858604431152344, "global_step": 171708, "epoch": 2068} {"train_loss": -23.865699768066406, "global_step": 171709, "epoch": 2068} {"train_loss": -23.84620475769043, "global_step": 171710, "epoch": 2068} {"train_loss": -23.861143112182617, "global_step": 171711, "epoch": 2068} {"train_loss": -23.45331382751465, "global_step": 171712, "epoch": 2068} {"train_loss": -23.535316467285156, "global_step": 171713, "epoch": 2068} {"train_loss": -23.80763053894043, "global_step": 171714, "epoch": 2068} {"train_loss": -23.467418670654297, "global_step": 171715, "epoch": 2068} {"train_loss": -23.63727378845215, "global_step": 171716, "epoch": 2068} {"train_loss": -23.6053466796875, "global_step": 171717, "epoch": 2068} {"train_loss": -23.601375579833984, "global_step": 171718, "epoch": 2068} {"train_loss": -23.709991455078125, "global_step": 171719, "epoch": 2068} {"train_loss": -23.467199325561523, "global_step": 171720, "epoch": 2068} {"train_loss": -23.48261260986328, "global_step": 171721, "epoch": 2068} {"train_loss": -23.867630004882812, "global_step": 171722, "epoch": 2068} {"train_loss": -23.65373992919922, "global_step": 171723, "epoch": 2068} {"train_loss": -23.78632926940918, "global_step": 171724, "epoch": 2068} {"train_loss": -23.734533309936523, "global_step": 171725, "epoch": 2068} {"train_loss": -23.67989804371294, "global_step": 171726, "epoch": 2068, "val_loss": 6494529.0} {"train_loss": -23.390653610229492, "global_step": 171727, "epoch": 2069} {"train_loss": -23.017047882080078, "global_step": 171728, "epoch": 2069} {"train_loss": -23.496383666992188, "global_step": 171729, "epoch": 2069} {"train_loss": -23.30206298828125, "global_step": 171730, "epoch": 2069} {"train_loss": -23.306921005249023, "global_step": 171731, "epoch": 2069} {"train_loss": -22.575286865234375, "global_step": 171732, "epoch": 2069} {"train_loss": -23.43161964416504, "global_step": 171733, "epoch": 2069} {"train_loss": -22.71344566345215, "global_step": 171734, "epoch": 2069} {"train_loss": -23.52474021911621, "global_step": 171735, "epoch": 2069} {"train_loss": -23.608240127563477, "global_step": 171736, "epoch": 2069} {"train_loss": -23.670520782470703, "global_step": 171737, "epoch": 2069} {"train_loss": -23.49675941467285, "global_step": 171738, "epoch": 2069} {"train_loss": -23.59539794921875, "global_step": 171739, "epoch": 2069} {"train_loss": -23.619754791259766, "global_step": 171740, "epoch": 2069} {"train_loss": -23.79656982421875, "global_step": 171741, "epoch": 2069} {"train_loss": -23.76902198791504, "global_step": 171742, "epoch": 2069} {"train_loss": -24.024141311645508, "global_step": 171743, "epoch": 2069} {"train_loss": -23.49126625061035, "global_step": 171744, "epoch": 2069} {"train_loss": -23.38443946838379, "global_step": 171745, "epoch": 2069} {"train_loss": -23.613235473632812, "global_step": 171746, "epoch": 2069} {"train_loss": -23.43856430053711, "global_step": 171747, "epoch": 2069} {"train_loss": -23.710275650024414, "global_step": 171748, "epoch": 2069} {"train_loss": -23.809574127197266, "global_step": 171749, "epoch": 2069} {"train_loss": -23.7651309967041, "global_step": 171750, "epoch": 2069} {"train_loss": -23.593271255493164, "global_step": 171751, "epoch": 2069} {"train_loss": -23.95995330810547, "global_step": 171752, "epoch": 2069} {"train_loss": -23.654775619506836, "global_step": 171753, "epoch": 2069} {"train_loss": -23.86530113220215, "global_step": 171754, "epoch": 2069} {"train_loss": -23.85371208190918, "global_step": 171755, "epoch": 2069} {"train_loss": -23.469839096069336, "global_step": 171756, "epoch": 2069} {"train_loss": -23.672332763671875, "global_step": 171757, "epoch": 2069} {"train_loss": -24.061384201049805, "global_step": 171758, "epoch": 2069} {"train_loss": -23.852645874023438, "global_step": 171759, "epoch": 2069} {"train_loss": -24.20058822631836, "global_step": 171760, "epoch": 2069} {"train_loss": -24.000795364379883, "global_step": 171761, "epoch": 2069} {"train_loss": -24.255640029907227, "global_step": 171762, "epoch": 2069} {"train_loss": -24.018402099609375, "global_step": 171763, "epoch": 2069} {"train_loss": -23.785310745239258, "global_step": 171764, "epoch": 2069} {"train_loss": -23.7435359954834, "global_step": 171765, "epoch": 2069} {"train_loss": -23.841663360595703, "global_step": 171766, "epoch": 2069} {"train_loss": -23.95134735107422, "global_step": 171767, "epoch": 2069} {"train_loss": -23.698013305664062, "global_step": 171768, "epoch": 2069} {"train_loss": -23.659055709838867, "global_step": 171769, "epoch": 2069} {"train_loss": -23.780744552612305, "global_step": 171770, "epoch": 2069} {"train_loss": -23.759408950805664, "global_step": 171771, "epoch": 2069} {"train_loss": -23.421051025390625, "global_step": 171772, "epoch": 2069} {"train_loss": -23.760757446289062, "global_step": 171773, "epoch": 2069} {"train_loss": -23.903242111206055, "global_step": 171774, "epoch": 2069} {"train_loss": -23.73748779296875, "global_step": 171775, "epoch": 2069} {"train_loss": -23.47111701965332, "global_step": 171776, "epoch": 2069} {"train_loss": -24.05195426940918, "global_step": 171777, "epoch": 2069} {"train_loss": -23.783203125, "global_step": 171778, "epoch": 2069} {"train_loss": -24.071088790893555, "global_step": 171779, "epoch": 2069} {"train_loss": -23.616819381713867, "global_step": 171780, "epoch": 2069} {"train_loss": -23.381025314331055, "global_step": 171781, "epoch": 2069} {"train_loss": -23.594823837280273, "global_step": 171782, "epoch": 2069} {"train_loss": -23.72759437561035, "global_step": 171783, "epoch": 2069} {"train_loss": -24.107105255126953, "global_step": 171784, "epoch": 2069} {"train_loss": -23.640798568725586, "global_step": 171785, "epoch": 2069} {"train_loss": -23.75539207458496, "global_step": 171786, "epoch": 2069} {"train_loss": -23.978620529174805, "global_step": 171787, "epoch": 2069} {"train_loss": -23.835813522338867, "global_step": 171788, "epoch": 2069} {"train_loss": -23.563764572143555, "global_step": 171789, "epoch": 2069} {"train_loss": -23.957767486572266, "global_step": 171790, "epoch": 2069} {"train_loss": -23.831457138061523, "global_step": 171791, "epoch": 2069} {"train_loss": -23.7716121673584, "global_step": 171792, "epoch": 2069} {"train_loss": -23.88838005065918, "global_step": 171793, "epoch": 2069} {"train_loss": -23.523574829101562, "global_step": 171794, "epoch": 2069} {"train_loss": -24.04636573791504, "global_step": 171795, "epoch": 2069} {"train_loss": -23.75816535949707, "global_step": 171796, "epoch": 2069} {"train_loss": -23.535329818725586, "global_step": 171797, "epoch": 2069} {"train_loss": -23.62342643737793, "global_step": 171798, "epoch": 2069} {"train_loss": -23.739641189575195, "global_step": 171799, "epoch": 2069} {"train_loss": -23.492788314819336, "global_step": 171800, "epoch": 2069} {"train_loss": -23.83074951171875, "global_step": 171801, "epoch": 2069} {"train_loss": -23.649465560913086, "global_step": 171802, "epoch": 2069} {"train_loss": -23.7286434173584, "global_step": 171803, "epoch": 2069} {"train_loss": -23.515888214111328, "global_step": 171804, "epoch": 2069} {"train_loss": -23.72178840637207, "global_step": 171805, "epoch": 2069} {"train_loss": -23.835538864135742, "global_step": 171806, "epoch": 2069} {"train_loss": -23.747039794921875, "global_step": 171807, "epoch": 2069} {"train_loss": -23.858386993408203, "global_step": 171808, "epoch": 2069} {"train_loss": -23.69278850325619, "global_step": 171809, "epoch": 2069, "val_loss": 6481299.0} {"train_loss": -23.857330322265625, "global_step": 171810, "epoch": 2070} {"train_loss": -23.46430015563965, "global_step": 171811, "epoch": 2070} {"train_loss": -23.66811180114746, "global_step": 171812, "epoch": 2070} {"train_loss": -23.600915908813477, "global_step": 171813, "epoch": 2070} {"train_loss": -23.834598541259766, "global_step": 171814, "epoch": 2070} {"train_loss": -23.882877349853516, "global_step": 171815, "epoch": 2070} {"train_loss": -23.92866325378418, "global_step": 171816, "epoch": 2070} {"train_loss": -23.626571655273438, "global_step": 171817, "epoch": 2070} {"train_loss": -23.840015411376953, "global_step": 171818, "epoch": 2070} {"train_loss": -23.78195571899414, "global_step": 171819, "epoch": 2070} {"train_loss": -24.02186393737793, "global_step": 171820, "epoch": 2070} {"train_loss": -23.71538734436035, "global_step": 171821, "epoch": 2070} {"train_loss": -23.828073501586914, "global_step": 171822, "epoch": 2070} {"train_loss": -23.614084243774414, "global_step": 171823, "epoch": 2070} {"train_loss": -24.08733367919922, "global_step": 171824, "epoch": 2070} {"train_loss": -23.674314498901367, "global_step": 171825, "epoch": 2070} {"train_loss": -24.249919891357422, "global_step": 171826, "epoch": 2070} {"train_loss": -23.761770248413086, "global_step": 171827, "epoch": 2070} {"train_loss": -23.879995346069336, "global_step": 171828, "epoch": 2070} {"train_loss": -23.871196746826172, "global_step": 171829, "epoch": 2070} {"train_loss": -23.408823013305664, "global_step": 171830, "epoch": 2070} {"train_loss": -23.975942611694336, "global_step": 171831, "epoch": 2070} {"train_loss": -23.7059383392334, "global_step": 171832, "epoch": 2070} {"train_loss": -23.45435905456543, "global_step": 171833, "epoch": 2070} {"train_loss": -23.572477340698242, "global_step": 171834, "epoch": 2070} {"train_loss": -23.782262802124023, "global_step": 171835, "epoch": 2070} {"train_loss": -23.8784236907959, "global_step": 171836, "epoch": 2070} {"train_loss": -23.832548141479492, "global_step": 171837, "epoch": 2070} {"train_loss": -23.622053146362305, "global_step": 171838, "epoch": 2070} {"train_loss": -23.73265266418457, "global_step": 171839, "epoch": 2070} {"train_loss": -24.07575798034668, "global_step": 171840, "epoch": 2070} {"train_loss": -23.560651779174805, "global_step": 171841, "epoch": 2070} {"train_loss": -23.589078903198242, "global_step": 171842, "epoch": 2070} {"train_loss": -23.682905197143555, "global_step": 171843, "epoch": 2070} {"train_loss": -23.33185386657715, "global_step": 171844, "epoch": 2070} {"train_loss": -23.518003463745117, "global_step": 171845, "epoch": 2070} {"train_loss": -23.95871353149414, "global_step": 171846, "epoch": 2070} {"train_loss": -23.32942771911621, "global_step": 171847, "epoch": 2070} {"train_loss": -23.653696060180664, "global_step": 171848, "epoch": 2070} {"train_loss": -23.473058700561523, "global_step": 171849, "epoch": 2070} {"train_loss": -23.878950119018555, "global_step": 171850, "epoch": 2070} {"train_loss": -24.057851791381836, "global_step": 171851, "epoch": 2070} {"train_loss": -23.695568084716797, "global_step": 171852, "epoch": 2070} {"train_loss": -23.72818374633789, "global_step": 171853, "epoch": 2070} {"train_loss": -23.428953170776367, "global_step": 171854, "epoch": 2070} {"train_loss": -24.414812088012695, "global_step": 171855, "epoch": 2070} {"train_loss": -23.720006942749023, "global_step": 171856, "epoch": 2070} {"train_loss": -23.460840225219727, "global_step": 171857, "epoch": 2070} {"train_loss": -23.548337936401367, "global_step": 171858, "epoch": 2070} {"train_loss": -23.784658432006836, "global_step": 171859, "epoch": 2070} {"train_loss": -23.38333511352539, "global_step": 171860, "epoch": 2070} {"train_loss": -23.70577049255371, "global_step": 171861, "epoch": 2070} {"train_loss": -23.676183700561523, "global_step": 171862, "epoch": 2070} {"train_loss": -23.94672966003418, "global_step": 171863, "epoch": 2070} {"train_loss": -23.572614669799805, "global_step": 171864, "epoch": 2070} {"train_loss": -24.144432067871094, "global_step": 171865, "epoch": 2070} {"train_loss": -23.475542068481445, "global_step": 171866, "epoch": 2070} {"train_loss": -23.884885787963867, "global_step": 171867, "epoch": 2070} {"train_loss": -23.501516342163086, "global_step": 171868, "epoch": 2070} {"train_loss": -24.078067779541016, "global_step": 171869, "epoch": 2070} {"train_loss": -23.563215255737305, "global_step": 171870, "epoch": 2070} {"train_loss": -23.38230323791504, "global_step": 171871, "epoch": 2070} {"train_loss": -23.70590591430664, "global_step": 171872, "epoch": 2070} {"train_loss": -23.593839645385742, "global_step": 171873, "epoch": 2070} {"train_loss": -23.3314208984375, "global_step": 171874, "epoch": 2070} {"train_loss": -23.738784790039062, "global_step": 171875, "epoch": 2070} {"train_loss": -23.53243064880371, "global_step": 171876, "epoch": 2070} {"train_loss": -23.589082717895508, "global_step": 171877, "epoch": 2070} {"train_loss": -23.561006546020508, "global_step": 171878, "epoch": 2070} {"train_loss": -23.573200225830078, "global_step": 171879, "epoch": 2070} {"train_loss": -23.5777645111084, "global_step": 171880, "epoch": 2070} {"train_loss": -23.576757431030273, "global_step": 171881, "epoch": 2070} {"train_loss": -23.756305694580078, "global_step": 171882, "epoch": 2070} {"train_loss": -23.726085662841797, "global_step": 171883, "epoch": 2070} {"train_loss": -23.67500877380371, "global_step": 171884, "epoch": 2070} {"train_loss": -23.739423751831055, "global_step": 171885, "epoch": 2070} {"train_loss": -23.737537384033203, "global_step": 171886, "epoch": 2070} {"train_loss": -23.838537216186523, "global_step": 171887, "epoch": 2070} {"train_loss": -23.57189178466797, "global_step": 171888, "epoch": 2070} {"train_loss": -23.96137046813965, "global_step": 171889, "epoch": 2070} {"train_loss": -23.754138946533203, "global_step": 171890, "epoch": 2070} {"train_loss": -23.875577926635742, "global_step": 171891, "epoch": 2070} {"train_loss": -23.730193907956043, "global_step": 171892, "epoch": 2070, "val_loss": 6324194.0} {"train_loss": -23.346487045288086, "global_step": 171893, "epoch": 2071} {"train_loss": -23.657079696655273, "global_step": 171894, "epoch": 2071} {"train_loss": -23.500831604003906, "global_step": 171895, "epoch": 2071} {"train_loss": -23.714292526245117, "global_step": 171896, "epoch": 2071} {"train_loss": -23.335824966430664, "global_step": 171897, "epoch": 2071} {"train_loss": -23.682270050048828, "global_step": 171898, "epoch": 2071} {"train_loss": -23.591337203979492, "global_step": 171899, "epoch": 2071} {"train_loss": -23.886714935302734, "global_step": 171900, "epoch": 2071} {"train_loss": -23.592945098876953, "global_step": 171901, "epoch": 2071} {"train_loss": -23.616470336914062, "global_step": 171902, "epoch": 2071} {"train_loss": -23.47044563293457, "global_step": 171903, "epoch": 2071} {"train_loss": -23.47767448425293, "global_step": 171904, "epoch": 2071} {"train_loss": -23.541046142578125, "global_step": 171905, "epoch": 2071} {"train_loss": -23.386991500854492, "global_step": 171906, "epoch": 2071} {"train_loss": -23.95230484008789, "global_step": 171907, "epoch": 2071} {"train_loss": -23.893503189086914, "global_step": 171908, "epoch": 2071} {"train_loss": -23.711406707763672, "global_step": 171909, "epoch": 2071} {"train_loss": -23.67169761657715, "global_step": 171910, "epoch": 2071} {"train_loss": -23.753204345703125, "global_step": 171911, "epoch": 2071} {"train_loss": -23.51906394958496, "global_step": 171912, "epoch": 2071} {"train_loss": -23.881961822509766, "global_step": 171913, "epoch": 2071} {"train_loss": -23.950525283813477, "global_step": 171914, "epoch": 2071} {"train_loss": -23.717374801635742, "global_step": 171915, "epoch": 2071} {"train_loss": -23.47511863708496, "global_step": 171916, "epoch": 2071} {"train_loss": -23.474660873413086, "global_step": 171917, "epoch": 2071} {"train_loss": -23.567035675048828, "global_step": 171918, "epoch": 2071} {"train_loss": -23.677392959594727, "global_step": 171919, "epoch": 2071} {"train_loss": -23.982030868530273, "global_step": 171920, "epoch": 2071} {"train_loss": -23.71925926208496, "global_step": 171921, "epoch": 2071} {"train_loss": -23.355459213256836, "global_step": 171922, "epoch": 2071} {"train_loss": -23.880786895751953, "global_step": 171923, "epoch": 2071} {"train_loss": -23.805448532104492, "global_step": 171924, "epoch": 2071} {"train_loss": -23.731721878051758, "global_step": 171925, "epoch": 2071} {"train_loss": -23.886510848999023, "global_step": 171926, "epoch": 2071} {"train_loss": -23.693824768066406, "global_step": 171927, "epoch": 2071} {"train_loss": -23.28151512145996, "global_step": 171928, "epoch": 2071} {"train_loss": -23.78303337097168, "global_step": 171929, "epoch": 2071} {"train_loss": -23.572179794311523, "global_step": 171930, "epoch": 2071} {"train_loss": -23.83140754699707, "global_step": 171931, "epoch": 2071} {"train_loss": -23.70724868774414, "global_step": 171932, "epoch": 2071} {"train_loss": -23.56932258605957, "global_step": 171933, "epoch": 2071} {"train_loss": -23.78839683532715, "global_step": 171934, "epoch": 2071} {"train_loss": -23.755970001220703, "global_step": 171935, "epoch": 2071} {"train_loss": -23.780651092529297, "global_step": 171936, "epoch": 2071} {"train_loss": -23.642988204956055, "global_step": 171937, "epoch": 2071} {"train_loss": -23.982019424438477, "global_step": 171938, "epoch": 2071} {"train_loss": -23.66474723815918, "global_step": 171939, "epoch": 2071} {"train_loss": -23.85358238220215, "global_step": 171940, "epoch": 2071} {"train_loss": -23.957067489624023, "global_step": 171941, "epoch": 2071} {"train_loss": -23.965316772460938, "global_step": 171942, "epoch": 2071} {"train_loss": -23.832162857055664, "global_step": 171943, "epoch": 2071} {"train_loss": -24.350095748901367, "global_step": 171944, "epoch": 2071} {"train_loss": -23.965181350708008, "global_step": 171945, "epoch": 2071} {"train_loss": -23.715925216674805, "global_step": 171946, "epoch": 2071} {"train_loss": -24.015602111816406, "global_step": 171947, "epoch": 2071} {"train_loss": -23.85089683532715, "global_step": 171948, "epoch": 2071} {"train_loss": -24.13966941833496, "global_step": 171949, "epoch": 2071} {"train_loss": -23.929651260375977, "global_step": 171950, "epoch": 2071} {"train_loss": -23.289682388305664, "global_step": 171951, "epoch": 2071} {"train_loss": -23.34588050842285, "global_step": 171952, "epoch": 2071} {"train_loss": -23.164888381958008, "global_step": 171953, "epoch": 2071} {"train_loss": -23.50838279724121, "global_step": 171954, "epoch": 2071} {"train_loss": -23.856164932250977, "global_step": 171955, "epoch": 2071} {"train_loss": -23.28622817993164, "global_step": 171956, "epoch": 2071} {"train_loss": -23.30097007751465, "global_step": 171957, "epoch": 2071} {"train_loss": -23.662351608276367, "global_step": 171958, "epoch": 2071} {"train_loss": -23.366731643676758, "global_step": 171959, "epoch": 2071} {"train_loss": -23.39176368713379, "global_step": 171960, "epoch": 2071} {"train_loss": -23.5395450592041, "global_step": 171961, "epoch": 2071} {"train_loss": -23.610698699951172, "global_step": 171962, "epoch": 2071} {"train_loss": -23.516368865966797, "global_step": 171963, "epoch": 2071} {"train_loss": -23.042606353759766, "global_step": 171964, "epoch": 2071} {"train_loss": -23.754257202148438, "global_step": 171965, "epoch": 2071} {"train_loss": -23.464595794677734, "global_step": 171966, "epoch": 2071} {"train_loss": -23.610809326171875, "global_step": 171967, "epoch": 2071} {"train_loss": -23.4395694732666, "global_step": 171968, "epoch": 2071} {"train_loss": -23.53500747680664, "global_step": 171969, "epoch": 2071} {"train_loss": -24.01633071899414, "global_step": 171970, "epoch": 2071} {"train_loss": -23.575580596923828, "global_step": 171971, "epoch": 2071} {"train_loss": -23.94698715209961, "global_step": 171972, "epoch": 2071} {"train_loss": -23.690519332885742, "global_step": 171973, "epoch": 2071} {"train_loss": -23.457590103149414, "global_step": 171974, "epoch": 2071} {"train_loss": -23.65996638838067, "global_step": 171975, "epoch": 2071, "val_loss": 6377036.0} {"train_loss": -23.279159545898438, "global_step": 171976, "epoch": 2072} {"train_loss": -23.701499938964844, "global_step": 171977, "epoch": 2072} {"train_loss": -23.447378158569336, "global_step": 171978, "epoch": 2072} {"train_loss": -23.67165184020996, "global_step": 171979, "epoch": 2072} {"train_loss": -23.678943634033203, "global_step": 171980, "epoch": 2072} {"train_loss": -23.294265747070312, "global_step": 171981, "epoch": 2072} {"train_loss": -23.084104537963867, "global_step": 171982, "epoch": 2072} {"train_loss": -23.282381057739258, "global_step": 171983, "epoch": 2072} {"train_loss": -23.512365341186523, "global_step": 171984, "epoch": 2072} {"train_loss": -22.975692749023438, "global_step": 171985, "epoch": 2072} {"train_loss": -23.69257926940918, "global_step": 171986, "epoch": 2072} {"train_loss": -23.761857986450195, "global_step": 171987, "epoch": 2072} {"train_loss": -23.77773094177246, "global_step": 171988, "epoch": 2072} {"train_loss": -23.385766983032227, "global_step": 171989, "epoch": 2072} {"train_loss": -23.909265518188477, "global_step": 171990, "epoch": 2072} {"train_loss": -23.720243453979492, "global_step": 171991, "epoch": 2072} {"train_loss": -23.477270126342773, "global_step": 171992, "epoch": 2072} {"train_loss": -23.73085594177246, "global_step": 171993, "epoch": 2072} {"train_loss": -23.373188018798828, "global_step": 171994, "epoch": 2072} {"train_loss": -23.7141056060791, "global_step": 171995, "epoch": 2072} {"train_loss": -23.3005428314209, "global_step": 171996, "epoch": 2072} {"train_loss": -23.38352394104004, "global_step": 171997, "epoch": 2072} {"train_loss": -23.52487564086914, "global_step": 171998, "epoch": 2072} {"train_loss": -23.475378036499023, "global_step": 171999, "epoch": 2072} {"train_loss": -23.293302536010742, "global_step": 172000, "epoch": 2072} {"train_loss": -23.59646224975586, "global_step": 172001, "epoch": 2072} {"train_loss": -23.433124542236328, "global_step": 172002, "epoch": 2072} {"train_loss": -23.640649795532227, "global_step": 172003, "epoch": 2072} {"train_loss": -23.6705265045166, "global_step": 172004, "epoch": 2072} {"train_loss": -23.912534713745117, "global_step": 172005, "epoch": 2072} {"train_loss": -23.490461349487305, "global_step": 172006, "epoch": 2072} {"train_loss": -23.793113708496094, "global_step": 172007, "epoch": 2072} {"train_loss": -23.61302947998047, "global_step": 172008, "epoch": 2072} {"train_loss": -23.571949005126953, "global_step": 172009, "epoch": 2072} {"train_loss": -23.989891052246094, "global_step": 172010, "epoch": 2072} {"train_loss": -23.416208267211914, "global_step": 172011, "epoch": 2072} {"train_loss": -23.761730194091797, "global_step": 172012, "epoch": 2072} {"train_loss": -23.550643920898438, "global_step": 172013, "epoch": 2072} {"train_loss": -23.89839744567871, "global_step": 172014, "epoch": 2072} {"train_loss": -23.973966598510742, "global_step": 172015, "epoch": 2072} {"train_loss": -23.760860443115234, "global_step": 172016, "epoch": 2072} {"train_loss": -23.711069107055664, "global_step": 172017, "epoch": 2072} {"train_loss": -23.423450469970703, "global_step": 172018, "epoch": 2072} {"train_loss": -23.691572189331055, "global_step": 172019, "epoch": 2072} {"train_loss": -24.0026798248291, "global_step": 172020, "epoch": 2072} {"train_loss": -23.897964477539062, "global_step": 172021, "epoch": 2072} {"train_loss": -23.6718692779541, "global_step": 172022, "epoch": 2072} {"train_loss": -23.6711483001709, "global_step": 172023, "epoch": 2072} {"train_loss": -24.107318878173828, "global_step": 172024, "epoch": 2072} {"train_loss": -23.647245407104492, "global_step": 172025, "epoch": 2072} {"train_loss": -23.769878387451172, "global_step": 172026, "epoch": 2072} {"train_loss": -23.318876266479492, "global_step": 172027, "epoch": 2072} {"train_loss": -23.8568172454834, "global_step": 172028, "epoch": 2072} {"train_loss": -23.620269775390625, "global_step": 172029, "epoch": 2072} {"train_loss": -23.760969161987305, "global_step": 172030, "epoch": 2072} {"train_loss": -23.270627975463867, "global_step": 172031, "epoch": 2072} {"train_loss": -23.30787467956543, "global_step": 172032, "epoch": 2072} {"train_loss": -23.76943016052246, "global_step": 172033, "epoch": 2072} {"train_loss": -23.859182357788086, "global_step": 172034, "epoch": 2072} {"train_loss": -23.653528213500977, "global_step": 172035, "epoch": 2072} {"train_loss": -23.869245529174805, "global_step": 172036, "epoch": 2072} {"train_loss": -23.23444938659668, "global_step": 172037, "epoch": 2072} {"train_loss": -23.73556900024414, "global_step": 172038, "epoch": 2072} {"train_loss": -23.9755802154541, "global_step": 172039, "epoch": 2072} {"train_loss": -23.622940063476562, "global_step": 172040, "epoch": 2072} {"train_loss": -23.619524002075195, "global_step": 172041, "epoch": 2072} {"train_loss": -23.822418212890625, "global_step": 172042, "epoch": 2072} {"train_loss": -23.737707138061523, "global_step": 172043, "epoch": 2072} {"train_loss": -23.740232467651367, "global_step": 172044, "epoch": 2072} {"train_loss": -23.46201515197754, "global_step": 172045, "epoch": 2072} {"train_loss": -23.696884155273438, "global_step": 172046, "epoch": 2072} {"train_loss": -23.549203872680664, "global_step": 172047, "epoch": 2072} {"train_loss": -23.78352165222168, "global_step": 172048, "epoch": 2072} {"train_loss": -23.369583129882812, "global_step": 172049, "epoch": 2072} {"train_loss": -23.334144592285156, "global_step": 172050, "epoch": 2072} {"train_loss": -23.36867904663086, "global_step": 172051, "epoch": 2072} {"train_loss": -23.915359497070312, "global_step": 172052, "epoch": 2072} {"train_loss": -23.84832763671875, "global_step": 172053, "epoch": 2072} {"train_loss": -23.475465774536133, "global_step": 172054, "epoch": 2072} {"train_loss": -23.4294490814209, "global_step": 172055, "epoch": 2072} {"train_loss": -23.9398136138916, "global_step": 172056, "epoch": 2072} {"train_loss": -23.48512077331543, "global_step": 172057, "epoch": 2072} {"train_loss": -23.613428368625872, "global_step": 172058, "epoch": 2072, "val_loss": 6539412.0} {"train_loss": -23.013212203979492, "global_step": 172059, "epoch": 2073} {"train_loss": -23.188678741455078, "global_step": 172060, "epoch": 2073} {"train_loss": -23.397214889526367, "global_step": 172061, "epoch": 2073} {"train_loss": -23.096349716186523, "global_step": 172062, "epoch": 2073} {"train_loss": -23.385032653808594, "global_step": 172063, "epoch": 2073} {"train_loss": -23.0822696685791, "global_step": 172064, "epoch": 2073} {"train_loss": -23.34938621520996, "global_step": 172065, "epoch": 2073} {"train_loss": -23.44309425354004, "global_step": 172066, "epoch": 2073} {"train_loss": -23.510711669921875, "global_step": 172067, "epoch": 2073} {"train_loss": -23.168264389038086, "global_step": 172068, "epoch": 2073} {"train_loss": -23.171894073486328, "global_step": 172069, "epoch": 2073} {"train_loss": -23.58283042907715, "global_step": 172070, "epoch": 2073} {"train_loss": -23.340835571289062, "global_step": 172071, "epoch": 2073} {"train_loss": -23.459070205688477, "global_step": 172072, "epoch": 2073} {"train_loss": -23.700525283813477, "global_step": 172073, "epoch": 2073} {"train_loss": -23.67844009399414, "global_step": 172074, "epoch": 2073} {"train_loss": -23.367725372314453, "global_step": 172075, "epoch": 2073} {"train_loss": -23.62156867980957, "global_step": 172076, "epoch": 2073} {"train_loss": -23.849435806274414, "global_step": 172077, "epoch": 2073} {"train_loss": -23.52054214477539, "global_step": 172078, "epoch": 2073} {"train_loss": -23.68256950378418, "global_step": 172079, "epoch": 2073} {"train_loss": -23.989864349365234, "global_step": 172080, "epoch": 2073} {"train_loss": -23.91580581665039, "global_step": 172081, "epoch": 2073} {"train_loss": -23.490407943725586, "global_step": 172082, "epoch": 2073} {"train_loss": -23.564498901367188, "global_step": 172083, "epoch": 2073} {"train_loss": -23.49271011352539, "global_step": 172084, "epoch": 2073} {"train_loss": -23.895410537719727, "global_step": 172085, "epoch": 2073} {"train_loss": -23.777671813964844, "global_step": 172086, "epoch": 2073} {"train_loss": -23.938236236572266, "global_step": 172087, "epoch": 2073} {"train_loss": -23.998769760131836, "global_step": 172088, "epoch": 2073} {"train_loss": -23.68341636657715, "global_step": 172089, "epoch": 2073} {"train_loss": -23.818021774291992, "global_step": 172090, "epoch": 2073} {"train_loss": -23.862497329711914, "global_step": 172091, "epoch": 2073} {"train_loss": -23.798036575317383, "global_step": 172092, "epoch": 2073} {"train_loss": -23.91792106628418, "global_step": 172093, "epoch": 2073} {"train_loss": -23.589649200439453, "global_step": 172094, "epoch": 2073} {"train_loss": -23.891874313354492, "global_step": 172095, "epoch": 2073} {"train_loss": -23.89875602722168, "global_step": 172096, "epoch": 2073} {"train_loss": -23.947704315185547, "global_step": 172097, "epoch": 2073} {"train_loss": -23.86805534362793, "global_step": 172098, "epoch": 2073} {"train_loss": -23.781763076782227, "global_step": 172099, "epoch": 2073} {"train_loss": -24.0677490234375, "global_step": 172100, "epoch": 2073} {"train_loss": -23.73456382751465, "global_step": 172101, "epoch": 2073} {"train_loss": -23.665830612182617, "global_step": 172102, "epoch": 2073} {"train_loss": -23.561824798583984, "global_step": 172103, "epoch": 2073} {"train_loss": -23.89603614807129, "global_step": 172104, "epoch": 2073} {"train_loss": -23.727933883666992, "global_step": 172105, "epoch": 2073} {"train_loss": -23.805923461914062, "global_step": 172106, "epoch": 2073} {"train_loss": -24.147563934326172, "global_step": 172107, "epoch": 2073} {"train_loss": -23.52039337158203, "global_step": 172108, "epoch": 2073} {"train_loss": -23.68466567993164, "global_step": 172109, "epoch": 2073} {"train_loss": -23.580158233642578, "global_step": 172110, "epoch": 2073} {"train_loss": -23.24302101135254, "global_step": 172111, "epoch": 2073} {"train_loss": -23.6181697845459, "global_step": 172112, "epoch": 2073} {"train_loss": -23.5422420501709, "global_step": 172113, "epoch": 2073} {"train_loss": -23.893617630004883, "global_step": 172114, "epoch": 2073} {"train_loss": -23.690967559814453, "global_step": 172115, "epoch": 2073} {"train_loss": -23.70782470703125, "global_step": 172116, "epoch": 2073} {"train_loss": -23.66297149658203, "global_step": 172117, "epoch": 2073} {"train_loss": -23.437963485717773, "global_step": 172118, "epoch": 2073} {"train_loss": -24.105804443359375, "global_step": 172119, "epoch": 2073} {"train_loss": -23.432144165039062, "global_step": 172120, "epoch": 2073} {"train_loss": -23.835546493530273, "global_step": 172121, "epoch": 2073} {"train_loss": -23.79032325744629, "global_step": 172122, "epoch": 2073} {"train_loss": -23.812875747680664, "global_step": 172123, "epoch": 2073} {"train_loss": -23.728107452392578, "global_step": 172124, "epoch": 2073} {"train_loss": -23.767271041870117, "global_step": 172125, "epoch": 2073} {"train_loss": -23.7774658203125, "global_step": 172126, "epoch": 2073} {"train_loss": -24.11860466003418, "global_step": 172127, "epoch": 2073} {"train_loss": -24.004383087158203, "global_step": 172128, "epoch": 2073} {"train_loss": -24.12868309020996, "global_step": 172129, "epoch": 2073} {"train_loss": -23.901290893554688, "global_step": 172130, "epoch": 2073} {"train_loss": -23.70826530456543, "global_step": 172131, "epoch": 2073} {"train_loss": -23.746353149414062, "global_step": 172132, "epoch": 2073} {"train_loss": -23.879989624023438, "global_step": 172133, "epoch": 2073} {"train_loss": -24.024580001831055, "global_step": 172134, "epoch": 2073} {"train_loss": -23.68039894104004, "global_step": 172135, "epoch": 2073} {"train_loss": -23.61001205444336, "global_step": 172136, "epoch": 2073} {"train_loss": -23.680200576782227, "global_step": 172137, "epoch": 2073} {"train_loss": -23.436471939086914, "global_step": 172138, "epoch": 2073} {"train_loss": -24.1438045501709, "global_step": 172139, "epoch": 2073} {"train_loss": -23.845518112182617, "global_step": 172140, "epoch": 2073} {"train_loss": -23.69369773405144, "global_step": 172141, "epoch": 2073, "val_loss": 6459333.0} {"train_loss": -23.28208351135254, "global_step": 172142, "epoch": 2074} {"train_loss": -23.36614990234375, "global_step": 172143, "epoch": 2074} {"train_loss": -23.67583465576172, "global_step": 172144, "epoch": 2074} {"train_loss": -22.6820068359375, "global_step": 172145, "epoch": 2074} {"train_loss": -23.457548141479492, "global_step": 172146, "epoch": 2074} {"train_loss": -22.701217651367188, "global_step": 172147, "epoch": 2074} {"train_loss": -23.36594009399414, "global_step": 172148, "epoch": 2074} {"train_loss": -23.374120712280273, "global_step": 172149, "epoch": 2074} {"train_loss": -23.429208755493164, "global_step": 172150, "epoch": 2074} {"train_loss": -23.214086532592773, "global_step": 172151, "epoch": 2074} {"train_loss": -23.256900787353516, "global_step": 172152, "epoch": 2074} {"train_loss": -23.346975326538086, "global_step": 172153, "epoch": 2074} {"train_loss": -23.61747169494629, "global_step": 172154, "epoch": 2074} {"train_loss": -23.12031364440918, "global_step": 172155, "epoch": 2074} {"train_loss": -23.349075317382812, "global_step": 172156, "epoch": 2074} {"train_loss": -23.711374282836914, "global_step": 172157, "epoch": 2074} {"train_loss": -23.430908203125, "global_step": 172158, "epoch": 2074} {"train_loss": -23.571537017822266, "global_step": 172159, "epoch": 2074} {"train_loss": -23.597089767456055, "global_step": 172160, "epoch": 2074} {"train_loss": -23.291101455688477, "global_step": 172161, "epoch": 2074} {"train_loss": -23.579919815063477, "global_step": 172162, "epoch": 2074} {"train_loss": -23.919340133666992, "global_step": 172163, "epoch": 2074} {"train_loss": -23.83475685119629, "global_step": 172164, "epoch": 2074} {"train_loss": -23.736289978027344, "global_step": 172165, "epoch": 2074} {"train_loss": -23.531099319458008, "global_step": 172166, "epoch": 2074} {"train_loss": -23.519973754882812, "global_step": 172167, "epoch": 2074} {"train_loss": -23.546655654907227, "global_step": 172168, "epoch": 2074} {"train_loss": -24.184951782226562, "global_step": 172169, "epoch": 2074} {"train_loss": -23.611557006835938, "global_step": 172170, "epoch": 2074} {"train_loss": -23.56159782409668, "global_step": 172171, "epoch": 2074} {"train_loss": -23.452665328979492, "global_step": 172172, "epoch": 2074} {"train_loss": -23.794275283813477, "global_step": 172173, "epoch": 2074} {"train_loss": -23.978134155273438, "global_step": 172174, "epoch": 2074} {"train_loss": -23.241378784179688, "global_step": 172175, "epoch": 2074} {"train_loss": -23.475788116455078, "global_step": 172176, "epoch": 2074} {"train_loss": -23.840923309326172, "global_step": 172177, "epoch": 2074} {"train_loss": -23.8902645111084, "global_step": 172178, "epoch": 2074} {"train_loss": -23.811508178710938, "global_step": 172179, "epoch": 2074} {"train_loss": -23.620864868164062, "global_step": 172180, "epoch": 2074} {"train_loss": -24.013460159301758, "global_step": 172181, "epoch": 2074} {"train_loss": -23.913145065307617, "global_step": 172182, "epoch": 2074} {"train_loss": -23.30535888671875, "global_step": 172183, "epoch": 2074} {"train_loss": -23.514230728149414, "global_step": 172184, "epoch": 2074} {"train_loss": -23.463115692138672, "global_step": 172185, "epoch": 2074} {"train_loss": -23.36577033996582, "global_step": 172186, "epoch": 2074} {"train_loss": -23.616491317749023, "global_step": 172187, "epoch": 2074} {"train_loss": -23.60797119140625, "global_step": 172188, "epoch": 2074} {"train_loss": -23.731063842773438, "global_step": 172189, "epoch": 2074} {"train_loss": -23.641769409179688, "global_step": 172190, "epoch": 2074} {"train_loss": -23.757078170776367, "global_step": 172191, "epoch": 2074} {"train_loss": -23.471847534179688, "global_step": 172192, "epoch": 2074} {"train_loss": -23.968215942382812, "global_step": 172193, "epoch": 2074} {"train_loss": -23.8159236907959, "global_step": 172194, "epoch": 2074} {"train_loss": -23.568546295166016, "global_step": 172195, "epoch": 2074} {"train_loss": -23.950334548950195, "global_step": 172196, "epoch": 2074} {"train_loss": -23.5401554107666, "global_step": 172197, "epoch": 2074} {"train_loss": -23.800886154174805, "global_step": 172198, "epoch": 2074} {"train_loss": -24.11175537109375, "global_step": 172199, "epoch": 2074} {"train_loss": -23.558347702026367, "global_step": 172200, "epoch": 2074} {"train_loss": -23.835676193237305, "global_step": 172201, "epoch": 2074} {"train_loss": -24.1379337310791, "global_step": 172202, "epoch": 2074} {"train_loss": -24.12921714782715, "global_step": 172203, "epoch": 2074} {"train_loss": -23.6822566986084, "global_step": 172204, "epoch": 2074} {"train_loss": -23.57773208618164, "global_step": 172205, "epoch": 2074} {"train_loss": -23.420530319213867, "global_step": 172206, "epoch": 2074} {"train_loss": -23.784696578979492, "global_step": 172207, "epoch": 2074} {"train_loss": -23.294113159179688, "global_step": 172208, "epoch": 2074} {"train_loss": -23.1934757232666, "global_step": 172209, "epoch": 2074} {"train_loss": -23.32455825805664, "global_step": 172210, "epoch": 2074} {"train_loss": -23.523056030273438, "global_step": 172211, "epoch": 2074} {"train_loss": -23.593137741088867, "global_step": 172212, "epoch": 2074} {"train_loss": -23.629430770874023, "global_step": 172213, "epoch": 2074} {"train_loss": -23.69666862487793, "global_step": 172214, "epoch": 2074} {"train_loss": -24.009153366088867, "global_step": 172215, "epoch": 2074} {"train_loss": -23.654569625854492, "global_step": 172216, "epoch": 2074} {"train_loss": -23.664979934692383, "global_step": 172217, "epoch": 2074} {"train_loss": -23.799734115600586, "global_step": 172218, "epoch": 2074} {"train_loss": -23.54380226135254, "global_step": 172219, "epoch": 2074} {"train_loss": -23.341474533081055, "global_step": 172220, "epoch": 2074} {"train_loss": -23.930179595947266, "global_step": 172221, "epoch": 2074} {"train_loss": -23.975706100463867, "global_step": 172222, "epoch": 2074} {"train_loss": -24.020713806152344, "global_step": 172223, "epoch": 2074} {"train_loss": -23.61443427671869, "global_step": 172224, "epoch": 2074, "val_loss": 6325410.0} {"train_loss": -23.060623168945312, "global_step": 172225, "epoch": 2075} {"train_loss": -23.715238571166992, "global_step": 172226, "epoch": 2075} {"train_loss": -24.02461051940918, "global_step": 172227, "epoch": 2075} {"train_loss": -23.23659324645996, "global_step": 172228, "epoch": 2075} {"train_loss": -23.469348907470703, "global_step": 172229, "epoch": 2075} {"train_loss": -23.699634552001953, "global_step": 172230, "epoch": 2075} {"train_loss": -23.2736873626709, "global_step": 172231, "epoch": 2075} {"train_loss": -23.5478458404541, "global_step": 172232, "epoch": 2075} {"train_loss": -23.878421783447266, "global_step": 172233, "epoch": 2075} {"train_loss": -23.45794105529785, "global_step": 172234, "epoch": 2075} {"train_loss": -23.668973922729492, "global_step": 172235, "epoch": 2075} {"train_loss": -23.700454711914062, "global_step": 172236, "epoch": 2075} {"train_loss": -23.813932418823242, "global_step": 172237, "epoch": 2075} {"train_loss": -23.52195167541504, "global_step": 172238, "epoch": 2075} {"train_loss": -23.266027450561523, "global_step": 172239, "epoch": 2075} {"train_loss": -23.39320182800293, "global_step": 172240, "epoch": 2075} {"train_loss": -23.84651756286621, "global_step": 172241, "epoch": 2075} {"train_loss": -23.640966415405273, "global_step": 172242, "epoch": 2075} {"train_loss": -23.804807662963867, "global_step": 172243, "epoch": 2075} {"train_loss": -23.60756492614746, "global_step": 172244, "epoch": 2075} {"train_loss": -23.88763427734375, "global_step": 172245, "epoch": 2075} {"train_loss": -23.67776107788086, "global_step": 172246, "epoch": 2075} {"train_loss": -23.547006607055664, "global_step": 172247, "epoch": 2075} {"train_loss": -24.13837432861328, "global_step": 172248, "epoch": 2075} {"train_loss": -23.7996768951416, "global_step": 172249, "epoch": 2075} {"train_loss": -23.586423873901367, "global_step": 172250, "epoch": 2075} {"train_loss": -23.578556060791016, "global_step": 172251, "epoch": 2075} {"train_loss": -23.428117752075195, "global_step": 172252, "epoch": 2075} {"train_loss": -23.484821319580078, "global_step": 172253, "epoch": 2075} {"train_loss": -23.4072322845459, "global_step": 172254, "epoch": 2075} {"train_loss": -23.910480499267578, "global_step": 172255, "epoch": 2075} {"train_loss": -24.095632553100586, "global_step": 172256, "epoch": 2075} {"train_loss": -23.679580688476562, "global_step": 172257, "epoch": 2075} {"train_loss": -23.635242462158203, "global_step": 172258, "epoch": 2075} {"train_loss": -24.05849266052246, "global_step": 172259, "epoch": 2075} {"train_loss": -23.9556827545166, "global_step": 172260, "epoch": 2075} {"train_loss": -23.6552791595459, "global_step": 172261, "epoch": 2075} {"train_loss": -23.80669403076172, "global_step": 172262, "epoch": 2075} {"train_loss": -24.17644691467285, "global_step": 172263, "epoch": 2075} {"train_loss": -23.902002334594727, "global_step": 172264, "epoch": 2075} {"train_loss": -23.705078125, "global_step": 172265, "epoch": 2075} {"train_loss": -23.719940185546875, "global_step": 172266, "epoch": 2075} {"train_loss": -23.81047248840332, "global_step": 172267, "epoch": 2075} {"train_loss": -24.089956283569336, "global_step": 172268, "epoch": 2075} {"train_loss": -23.620365142822266, "global_step": 172269, "epoch": 2075} {"train_loss": -23.806486129760742, "global_step": 172270, "epoch": 2075} {"train_loss": -23.718408584594727, "global_step": 172271, "epoch": 2075} {"train_loss": -23.760656356811523, "global_step": 172272, "epoch": 2075} {"train_loss": -23.4179744720459, "global_step": 172273, "epoch": 2075} {"train_loss": -23.935733795166016, "global_step": 172274, "epoch": 2075} {"train_loss": -23.8588924407959, "global_step": 172275, "epoch": 2075} {"train_loss": -23.950849533081055, "global_step": 172276, "epoch": 2075} {"train_loss": -23.62302017211914, "global_step": 172277, "epoch": 2075} {"train_loss": -23.810766220092773, "global_step": 172278, "epoch": 2075} {"train_loss": -23.68507194519043, "global_step": 172279, "epoch": 2075} {"train_loss": -23.790740966796875, "global_step": 172280, "epoch": 2075} {"train_loss": -23.705842971801758, "global_step": 172281, "epoch": 2075} {"train_loss": -23.258161544799805, "global_step": 172282, "epoch": 2075} {"train_loss": -23.79243278503418, "global_step": 172283, "epoch": 2075} {"train_loss": -23.511381149291992, "global_step": 172284, "epoch": 2075} {"train_loss": -23.508207321166992, "global_step": 172285, "epoch": 2075} {"train_loss": -23.08819007873535, "global_step": 172286, "epoch": 2075} {"train_loss": -23.697065353393555, "global_step": 172287, "epoch": 2075} {"train_loss": -23.80010986328125, "global_step": 172288, "epoch": 2075} {"train_loss": -23.164825439453125, "global_step": 172289, "epoch": 2075} {"train_loss": -24.214975357055664, "global_step": 172290, "epoch": 2075} {"train_loss": -23.407020568847656, "global_step": 172291, "epoch": 2075} {"train_loss": -23.463254928588867, "global_step": 172292, "epoch": 2075} {"train_loss": -23.610387802124023, "global_step": 172293, "epoch": 2075} {"train_loss": -23.81315040588379, "global_step": 172294, "epoch": 2075} {"train_loss": -23.528818130493164, "global_step": 172295, "epoch": 2075} {"train_loss": -23.56955909729004, "global_step": 172296, "epoch": 2075} {"train_loss": -23.65019416809082, "global_step": 172297, "epoch": 2075} {"train_loss": -24.06568717956543, "global_step": 172298, "epoch": 2075} {"train_loss": -23.75856590270996, "global_step": 172299, "epoch": 2075} {"train_loss": -23.93107795715332, "global_step": 172300, "epoch": 2075} {"train_loss": -23.49327278137207, "global_step": 172301, "epoch": 2075} {"train_loss": -23.55694580078125, "global_step": 172302, "epoch": 2075} {"train_loss": -23.328140258789062, "global_step": 172303, "epoch": 2075} {"train_loss": -23.902841567993164, "global_step": 172304, "epoch": 2075} {"train_loss": -23.916309356689453, "global_step": 172305, "epoch": 2075} {"train_loss": -23.451276779174805, "global_step": 172306, "epoch": 2075} {"train_loss": -23.665791936667567, "global_step": 172307, "epoch": 2075, "val_loss": 6523086.0} {"train_loss": -23.484378814697266, "global_step": 172308, "epoch": 2076} {"train_loss": -23.283056259155273, "global_step": 172309, "epoch": 2076} {"train_loss": -23.820812225341797, "global_step": 172310, "epoch": 2076} {"train_loss": -23.21721649169922, "global_step": 172311, "epoch": 2076} {"train_loss": -23.6009521484375, "global_step": 172312, "epoch": 2076} {"train_loss": -23.429655075073242, "global_step": 172313, "epoch": 2076} {"train_loss": -23.506467819213867, "global_step": 172314, "epoch": 2076} {"train_loss": -23.223560333251953, "global_step": 172315, "epoch": 2076} {"train_loss": -23.36087989807129, "global_step": 172316, "epoch": 2076} {"train_loss": -23.32974624633789, "global_step": 172317, "epoch": 2076} {"train_loss": -23.309810638427734, "global_step": 172318, "epoch": 2076} {"train_loss": -23.80657958984375, "global_step": 172319, "epoch": 2076} {"train_loss": -23.582563400268555, "global_step": 172320, "epoch": 2076} {"train_loss": -23.523237228393555, "global_step": 172321, "epoch": 2076} {"train_loss": -23.9033145904541, "global_step": 172322, "epoch": 2076} {"train_loss": -24.103971481323242, "global_step": 172323, "epoch": 2076} {"train_loss": -23.750186920166016, "global_step": 172324, "epoch": 2076} {"train_loss": -23.94871711730957, "global_step": 172325, "epoch": 2076} {"train_loss": -23.795703887939453, "global_step": 172326, "epoch": 2076} {"train_loss": -23.203580856323242, "global_step": 172327, "epoch": 2076} {"train_loss": -23.841657638549805, "global_step": 172328, "epoch": 2076} {"train_loss": -23.782337188720703, "global_step": 172329, "epoch": 2076} {"train_loss": -23.74497413635254, "global_step": 172330, "epoch": 2076} {"train_loss": -23.628116607666016, "global_step": 172331, "epoch": 2076} {"train_loss": -23.580738067626953, "global_step": 172332, "epoch": 2076} {"train_loss": -23.589975357055664, "global_step": 172333, "epoch": 2076} {"train_loss": -23.79947853088379, "global_step": 172334, "epoch": 2076} {"train_loss": -23.74640464782715, "global_step": 172335, "epoch": 2076} {"train_loss": -23.761581420898438, "global_step": 172336, "epoch": 2076} {"train_loss": -23.91071891784668, "global_step": 172337, "epoch": 2076} {"train_loss": -23.54071617126465, "global_step": 172338, "epoch": 2076} {"train_loss": -23.7821102142334, "global_step": 172339, "epoch": 2076} {"train_loss": -23.416622161865234, "global_step": 172340, "epoch": 2076} {"train_loss": -23.89776611328125, "global_step": 172341, "epoch": 2076} {"train_loss": -23.525392532348633, "global_step": 172342, "epoch": 2076} {"train_loss": -23.360107421875, "global_step": 172343, "epoch": 2076} {"train_loss": -23.647872924804688, "global_step": 172344, "epoch": 2076} {"train_loss": -23.52484703063965, "global_step": 172345, "epoch": 2076} {"train_loss": -23.781646728515625, "global_step": 172346, "epoch": 2076} {"train_loss": -23.576526641845703, "global_step": 172347, "epoch": 2076} {"train_loss": -24.03942108154297, "global_step": 172348, "epoch": 2076} {"train_loss": -23.92136001586914, "global_step": 172349, "epoch": 2076} {"train_loss": -23.439908981323242, "global_step": 172350, "epoch": 2076} {"train_loss": -24.331836700439453, "global_step": 172351, "epoch": 2076} {"train_loss": -23.5732479095459, "global_step": 172352, "epoch": 2076} {"train_loss": -23.909509658813477, "global_step": 172353, "epoch": 2076} {"train_loss": -24.00226402282715, "global_step": 172354, "epoch": 2076} {"train_loss": -23.8976993560791, "global_step": 172355, "epoch": 2076} {"train_loss": -24.077604293823242, "global_step": 172356, "epoch": 2076} {"train_loss": -23.723920822143555, "global_step": 172357, "epoch": 2076} {"train_loss": -24.174333572387695, "global_step": 172358, "epoch": 2076} {"train_loss": -23.789888381958008, "global_step": 172359, "epoch": 2076} {"train_loss": -23.638233184814453, "global_step": 172360, "epoch": 2076} {"train_loss": -23.830974578857422, "global_step": 172361, "epoch": 2076} {"train_loss": -23.619731903076172, "global_step": 172362, "epoch": 2076} {"train_loss": -23.867931365966797, "global_step": 172363, "epoch": 2076} {"train_loss": -23.749603271484375, "global_step": 172364, "epoch": 2076} {"train_loss": -23.831378936767578, "global_step": 172365, "epoch": 2076} {"train_loss": -23.61954689025879, "global_step": 172366, "epoch": 2076} {"train_loss": -23.63494110107422, "global_step": 172367, "epoch": 2076} {"train_loss": -23.4565486907959, "global_step": 172368, "epoch": 2076} {"train_loss": -23.437347412109375, "global_step": 172369, "epoch": 2076} {"train_loss": -23.212886810302734, "global_step": 172370, "epoch": 2076} {"train_loss": -23.63637924194336, "global_step": 172371, "epoch": 2076} {"train_loss": -23.586990356445312, "global_step": 172372, "epoch": 2076} {"train_loss": -23.791425704956055, "global_step": 172373, "epoch": 2076} {"train_loss": -23.423757553100586, "global_step": 172374, "epoch": 2076} {"train_loss": -23.271697998046875, "global_step": 172375, "epoch": 2076} {"train_loss": -23.79451560974121, "global_step": 172376, "epoch": 2076} {"train_loss": -23.64175796508789, "global_step": 172377, "epoch": 2076} {"train_loss": -23.354923248291016, "global_step": 172378, "epoch": 2076} {"train_loss": -23.32063865661621, "global_step": 172379, "epoch": 2076} {"train_loss": -23.672958374023438, "global_step": 172380, "epoch": 2076} {"train_loss": -23.47953224182129, "global_step": 172381, "epoch": 2076} {"train_loss": -23.759876251220703, "global_step": 172382, "epoch": 2076} {"train_loss": -23.972274780273438, "global_step": 172383, "epoch": 2076} {"train_loss": -23.92118263244629, "global_step": 172384, "epoch": 2076} {"train_loss": -23.93855857849121, "global_step": 172385, "epoch": 2076} {"train_loss": -23.716455459594727, "global_step": 172386, "epoch": 2076} {"train_loss": -23.93939781188965, "global_step": 172387, "epoch": 2076} {"train_loss": -23.844100952148438, "global_step": 172388, "epoch": 2076} {"train_loss": -23.986120223999023, "global_step": 172389, "epoch": 2076} {"train_loss": -23.680111230137836, "global_step": 172390, "epoch": 2076, "val_loss": 6550611.5} {"train_loss": -22.77517318725586, "global_step": 172391, "epoch": 2077} {"train_loss": -23.22035789489746, "global_step": 172392, "epoch": 2077} {"train_loss": -23.164106369018555, "global_step": 172393, "epoch": 2077} {"train_loss": -23.26136589050293, "global_step": 172394, "epoch": 2077} {"train_loss": -23.46626853942871, "global_step": 172395, "epoch": 2077} {"train_loss": -23.271020889282227, "global_step": 172396, "epoch": 2077} {"train_loss": -23.258678436279297, "global_step": 172397, "epoch": 2077} {"train_loss": -23.28964614868164, "global_step": 172398, "epoch": 2077} {"train_loss": -22.771360397338867, "global_step": 172399, "epoch": 2077} {"train_loss": -23.608396530151367, "global_step": 172400, "epoch": 2077} {"train_loss": -23.370037078857422, "global_step": 172401, "epoch": 2077} {"train_loss": -23.24219512939453, "global_step": 172402, "epoch": 2077} {"train_loss": -23.610681533813477, "global_step": 172403, "epoch": 2077} {"train_loss": -23.06100082397461, "global_step": 172404, "epoch": 2077} {"train_loss": -23.234128952026367, "global_step": 172405, "epoch": 2077} {"train_loss": -23.65620994567871, "global_step": 172406, "epoch": 2077} {"train_loss": -23.665409088134766, "global_step": 172407, "epoch": 2077} {"train_loss": -23.503034591674805, "global_step": 172408, "epoch": 2077} {"train_loss": -23.758941650390625, "global_step": 172409, "epoch": 2077} {"train_loss": -23.682289123535156, "global_step": 172410, "epoch": 2077} {"train_loss": -23.340116500854492, "global_step": 172411, "epoch": 2077} {"train_loss": -23.70499038696289, "global_step": 172412, "epoch": 2077} {"train_loss": -23.589588165283203, "global_step": 172413, "epoch": 2077} {"train_loss": -23.551427841186523, "global_step": 172414, "epoch": 2077} {"train_loss": -23.657621383666992, "global_step": 172415, "epoch": 2077} {"train_loss": -23.2104549407959, "global_step": 172416, "epoch": 2077} {"train_loss": -23.405630111694336, "global_step": 172417, "epoch": 2077} {"train_loss": -23.174707412719727, "global_step": 172418, "epoch": 2077} {"train_loss": -23.837675094604492, "global_step": 172419, "epoch": 2077} {"train_loss": -23.552003860473633, "global_step": 172420, "epoch": 2077} {"train_loss": -23.631380081176758, "global_step": 172421, "epoch": 2077} {"train_loss": -23.6986141204834, "global_step": 172422, "epoch": 2077} {"train_loss": -23.636579513549805, "global_step": 172423, "epoch": 2077} {"train_loss": -23.8504638671875, "global_step": 172424, "epoch": 2077} {"train_loss": -23.485273361206055, "global_step": 172425, "epoch": 2077} {"train_loss": -23.832380294799805, "global_step": 172426, "epoch": 2077} {"train_loss": -23.617856979370117, "global_step": 172427, "epoch": 2077} {"train_loss": -23.830873489379883, "global_step": 172428, "epoch": 2077} {"train_loss": -23.934743881225586, "global_step": 172429, "epoch": 2077} {"train_loss": -23.888381958007812, "global_step": 172430, "epoch": 2077} {"train_loss": -23.69802474975586, "global_step": 172431, "epoch": 2077} {"train_loss": -23.683027267456055, "global_step": 172432, "epoch": 2077} {"train_loss": -23.5323486328125, "global_step": 172433, "epoch": 2077} {"train_loss": -24.031187057495117, "global_step": 172434, "epoch": 2077} {"train_loss": -24.00445556640625, "global_step": 172435, "epoch": 2077} {"train_loss": -23.622568130493164, "global_step": 172436, "epoch": 2077} {"train_loss": -23.77519989013672, "global_step": 172437, "epoch": 2077} {"train_loss": -23.463010787963867, "global_step": 172438, "epoch": 2077} {"train_loss": -23.84628677368164, "global_step": 172439, "epoch": 2077} {"train_loss": -23.54636001586914, "global_step": 172440, "epoch": 2077} {"train_loss": -23.8482666015625, "global_step": 172441, "epoch": 2077} {"train_loss": -23.601905822753906, "global_step": 172442, "epoch": 2077} {"train_loss": -23.393762588500977, "global_step": 172443, "epoch": 2077} {"train_loss": -23.830129623413086, "global_step": 172444, "epoch": 2077} {"train_loss": -23.415428161621094, "global_step": 172445, "epoch": 2077} {"train_loss": -23.598464965820312, "global_step": 172446, "epoch": 2077} {"train_loss": -23.5985107421875, "global_step": 172447, "epoch": 2077} {"train_loss": -23.65317153930664, "global_step": 172448, "epoch": 2077} {"train_loss": -23.600439071655273, "global_step": 172449, "epoch": 2077} {"train_loss": -24.024988174438477, "global_step": 172450, "epoch": 2077} {"train_loss": -23.708637237548828, "global_step": 172451, "epoch": 2077} {"train_loss": -23.392545700073242, "global_step": 172452, "epoch": 2077} {"train_loss": -23.834716796875, "global_step": 172453, "epoch": 2077} {"train_loss": -23.556856155395508, "global_step": 172454, "epoch": 2077} {"train_loss": -23.561025619506836, "global_step": 172455, "epoch": 2077} {"train_loss": -23.155593872070312, "global_step": 172456, "epoch": 2077} {"train_loss": -23.276073455810547, "global_step": 172457, "epoch": 2077} {"train_loss": -23.87740135192871, "global_step": 172458, "epoch": 2077} {"train_loss": -23.90915298461914, "global_step": 172459, "epoch": 2077} {"train_loss": -23.853271484375, "global_step": 172460, "epoch": 2077} {"train_loss": -23.658126831054688, "global_step": 172461, "epoch": 2077} {"train_loss": -23.45954704284668, "global_step": 172462, "epoch": 2077} {"train_loss": -23.60852813720703, "global_step": 172463, "epoch": 2077} {"train_loss": -23.668079376220703, "global_step": 172464, "epoch": 2077} {"train_loss": -23.930648803710938, "global_step": 172465, "epoch": 2077} {"train_loss": -23.60114097595215, "global_step": 172466, "epoch": 2077} {"train_loss": -23.72947120666504, "global_step": 172467, "epoch": 2077} {"train_loss": -23.524641036987305, "global_step": 172468, "epoch": 2077} {"train_loss": -23.682775497436523, "global_step": 172469, "epoch": 2077} {"train_loss": -23.971670150756836, "global_step": 172470, "epoch": 2077} {"train_loss": -23.865325927734375, "global_step": 172471, "epoch": 2077} {"train_loss": -23.835458755493164, "global_step": 172472, "epoch": 2077} {"train_loss": -23.586912384952406, "global_step": 172473, "epoch": 2077, "val_loss": 6454507.0} {"train_loss": -23.80608558654785, "global_step": 172474, "epoch": 2078} {"train_loss": -23.725271224975586, "global_step": 172475, "epoch": 2078} {"train_loss": -23.47993278503418, "global_step": 172476, "epoch": 2078} {"train_loss": -23.85145378112793, "global_step": 172477, "epoch": 2078} {"train_loss": -23.799985885620117, "global_step": 172478, "epoch": 2078} {"train_loss": -23.884641647338867, "global_step": 172479, "epoch": 2078} {"train_loss": -23.349390029907227, "global_step": 172480, "epoch": 2078} {"train_loss": -23.81539535522461, "global_step": 172481, "epoch": 2078} {"train_loss": -23.43133544921875, "global_step": 172482, "epoch": 2078} {"train_loss": -23.8864803314209, "global_step": 172483, "epoch": 2078} {"train_loss": -23.66194725036621, "global_step": 172484, "epoch": 2078} {"train_loss": -23.48980712890625, "global_step": 172485, "epoch": 2078} {"train_loss": -23.639490127563477, "global_step": 172486, "epoch": 2078} {"train_loss": -23.408414840698242, "global_step": 172487, "epoch": 2078} {"train_loss": -24.108579635620117, "global_step": 172488, "epoch": 2078} {"train_loss": -23.638973236083984, "global_step": 172489, "epoch": 2078} {"train_loss": -23.521066665649414, "global_step": 172490, "epoch": 2078} {"train_loss": -23.72896385192871, "global_step": 172491, "epoch": 2078} {"train_loss": -23.230426788330078, "global_step": 172492, "epoch": 2078} {"train_loss": -23.774442672729492, "global_step": 172493, "epoch": 2078} {"train_loss": -23.649126052856445, "global_step": 172494, "epoch": 2078} {"train_loss": -23.489639282226562, "global_step": 172495, "epoch": 2078} {"train_loss": -23.893949508666992, "global_step": 172496, "epoch": 2078} {"train_loss": -23.670698165893555, "global_step": 172497, "epoch": 2078} {"train_loss": -23.519363403320312, "global_step": 172498, "epoch": 2078} {"train_loss": -23.914169311523438, "global_step": 172499, "epoch": 2078} {"train_loss": -23.909255981445312, "global_step": 172500, "epoch": 2078} {"train_loss": -23.780466079711914, "global_step": 172501, "epoch": 2078} {"train_loss": -23.674335479736328, "global_step": 172502, "epoch": 2078} {"train_loss": -23.591354370117188, "global_step": 172503, "epoch": 2078} {"train_loss": -23.577404022216797, "global_step": 172504, "epoch": 2078} {"train_loss": -23.46442413330078, "global_step": 172505, "epoch": 2078} {"train_loss": -23.939184188842773, "global_step": 172506, "epoch": 2078} {"train_loss": -23.76988410949707, "global_step": 172507, "epoch": 2078} {"train_loss": -23.640430450439453, "global_step": 172508, "epoch": 2078} {"train_loss": -24.254837036132812, "global_step": 172509, "epoch": 2078} {"train_loss": -23.89015769958496, "global_step": 172510, "epoch": 2078} {"train_loss": -23.641971588134766, "global_step": 172511, "epoch": 2078} {"train_loss": -23.656246185302734, "global_step": 172512, "epoch": 2078} {"train_loss": -23.88004493713379, "global_step": 172513, "epoch": 2078} {"train_loss": -23.859729766845703, "global_step": 172514, "epoch": 2078} {"train_loss": -23.77727699279785, "global_step": 172515, "epoch": 2078} {"train_loss": -23.54471778869629, "global_step": 172516, "epoch": 2078} {"train_loss": -23.87173080444336, "global_step": 172517, "epoch": 2078} {"train_loss": -23.67190170288086, "global_step": 172518, "epoch": 2078} {"train_loss": -24.002450942993164, "global_step": 172519, "epoch": 2078} {"train_loss": -23.713294982910156, "global_step": 172520, "epoch": 2078} {"train_loss": -23.871435165405273, "global_step": 172521, "epoch": 2078} {"train_loss": -23.28881072998047, "global_step": 172522, "epoch": 2078} {"train_loss": -23.53211784362793, "global_step": 172523, "epoch": 2078} {"train_loss": -23.74728012084961, "global_step": 172524, "epoch": 2078} {"train_loss": -23.63503074645996, "global_step": 172525, "epoch": 2078} {"train_loss": -23.579421997070312, "global_step": 172526, "epoch": 2078} {"train_loss": -23.536972045898438, "global_step": 172527, "epoch": 2078} {"train_loss": -23.800539016723633, "global_step": 172528, "epoch": 2078} {"train_loss": -23.690174102783203, "global_step": 172529, "epoch": 2078} {"train_loss": -23.661758422851562, "global_step": 172530, "epoch": 2078} {"train_loss": -23.682912826538086, "global_step": 172531, "epoch": 2078} {"train_loss": -23.744314193725586, "global_step": 172532, "epoch": 2078} {"train_loss": -23.770252227783203, "global_step": 172533, "epoch": 2078} {"train_loss": -23.337791442871094, "global_step": 172534, "epoch": 2078} {"train_loss": -23.210233688354492, "global_step": 172535, "epoch": 2078} {"train_loss": -23.579450607299805, "global_step": 172536, "epoch": 2078} {"train_loss": -23.64464569091797, "global_step": 172537, "epoch": 2078} {"train_loss": -23.883602142333984, "global_step": 172538, "epoch": 2078} {"train_loss": -23.68721580505371, "global_step": 172539, "epoch": 2078} {"train_loss": -23.865081787109375, "global_step": 172540, "epoch": 2078} {"train_loss": -24.022493362426758, "global_step": 172541, "epoch": 2078} {"train_loss": -23.878665924072266, "global_step": 172542, "epoch": 2078} {"train_loss": -23.72641372680664, "global_step": 172543, "epoch": 2078} {"train_loss": -23.555509567260742, "global_step": 172544, "epoch": 2078} {"train_loss": -23.30213737487793, "global_step": 172545, "epoch": 2078} {"train_loss": -23.875782012939453, "global_step": 172546, "epoch": 2078} {"train_loss": -23.44034194946289, "global_step": 172547, "epoch": 2078} {"train_loss": -23.812612533569336, "global_step": 172548, "epoch": 2078} {"train_loss": -23.63730239868164, "global_step": 172549, "epoch": 2078} {"train_loss": -23.97789764404297, "global_step": 172550, "epoch": 2078} {"train_loss": -23.785314559936523, "global_step": 172551, "epoch": 2078} {"train_loss": -23.861478805541992, "global_step": 172552, "epoch": 2078} {"train_loss": -23.944894790649414, "global_step": 172553, "epoch": 2078} {"train_loss": -23.8558292388916, "global_step": 172554, "epoch": 2078} {"train_loss": -23.747053146362305, "global_step": 172555, "epoch": 2078} {"train_loss": -23.700612332447466, "global_step": 172556, "epoch": 2078, "val_loss": 6416102.0} {"train_loss": -23.396812438964844, "global_step": 172557, "epoch": 2079} {"train_loss": -23.65120506286621, "global_step": 172558, "epoch": 2079} {"train_loss": -23.53034019470215, "global_step": 172559, "epoch": 2079} {"train_loss": -23.83551025390625, "global_step": 172560, "epoch": 2079} {"train_loss": -23.727005004882812, "global_step": 172561, "epoch": 2079} {"train_loss": -23.404632568359375, "global_step": 172562, "epoch": 2079} {"train_loss": -23.62677764892578, "global_step": 172563, "epoch": 2079} {"train_loss": -23.546146392822266, "global_step": 172564, "epoch": 2079} {"train_loss": -23.935338973999023, "global_step": 172565, "epoch": 2079} {"train_loss": -23.984638214111328, "global_step": 172566, "epoch": 2079} {"train_loss": -24.034879684448242, "global_step": 172567, "epoch": 2079} {"train_loss": -23.698209762573242, "global_step": 172568, "epoch": 2079} {"train_loss": -23.795650482177734, "global_step": 172569, "epoch": 2079} {"train_loss": -23.583248138427734, "global_step": 172570, "epoch": 2079} {"train_loss": -23.42108726501465, "global_step": 172571, "epoch": 2079} {"train_loss": -23.697561264038086, "global_step": 172572, "epoch": 2079} {"train_loss": -23.190937042236328, "global_step": 172573, "epoch": 2079} {"train_loss": -23.529325485229492, "global_step": 172574, "epoch": 2079} {"train_loss": -23.43566131591797, "global_step": 172575, "epoch": 2079} {"train_loss": -23.715110778808594, "global_step": 172576, "epoch": 2079} {"train_loss": -24.03265953063965, "global_step": 172577, "epoch": 2079} {"train_loss": -23.846946716308594, "global_step": 172578, "epoch": 2079} {"train_loss": -23.48414421081543, "global_step": 172579, "epoch": 2079} {"train_loss": -23.962467193603516, "global_step": 172580, "epoch": 2079} {"train_loss": -23.607816696166992, "global_step": 172581, "epoch": 2079} {"train_loss": -23.71253776550293, "global_step": 172582, "epoch": 2079} {"train_loss": -23.451154708862305, "global_step": 172583, "epoch": 2079} {"train_loss": -23.685932159423828, "global_step": 172584, "epoch": 2079} {"train_loss": -23.8385009765625, "global_step": 172585, "epoch": 2079} {"train_loss": -23.829740524291992, "global_step": 172586, "epoch": 2079} {"train_loss": -23.6031494140625, "global_step": 172587, "epoch": 2079} {"train_loss": -24.079931259155273, "global_step": 172588, "epoch": 2079} {"train_loss": -23.5841007232666, "global_step": 172589, "epoch": 2079} {"train_loss": -23.852888107299805, "global_step": 172590, "epoch": 2079} {"train_loss": -24.147802352905273, "global_step": 172591, "epoch": 2079} {"train_loss": -24.0660343170166, "global_step": 172592, "epoch": 2079} {"train_loss": -23.814680099487305, "global_step": 172593, "epoch": 2079} {"train_loss": -23.547666549682617, "global_step": 172594, "epoch": 2079} {"train_loss": -23.80728530883789, "global_step": 172595, "epoch": 2079} {"train_loss": -24.05893898010254, "global_step": 172596, "epoch": 2079} {"train_loss": -23.55905532836914, "global_step": 172597, "epoch": 2079} {"train_loss": -23.301523208618164, "global_step": 172598, "epoch": 2079} {"train_loss": -23.38141632080078, "global_step": 172599, "epoch": 2079} {"train_loss": -23.50394058227539, "global_step": 172600, "epoch": 2079} {"train_loss": -23.911746978759766, "global_step": 172601, "epoch": 2079} {"train_loss": -23.65540885925293, "global_step": 172602, "epoch": 2079} {"train_loss": -22.996280670166016, "global_step": 172603, "epoch": 2079} {"train_loss": -23.6600399017334, "global_step": 172604, "epoch": 2079} {"train_loss": -23.688749313354492, "global_step": 172605, "epoch": 2079} {"train_loss": -23.55466079711914, "global_step": 172606, "epoch": 2079} {"train_loss": -23.386852264404297, "global_step": 172607, "epoch": 2079} {"train_loss": -23.7110652923584, "global_step": 172608, "epoch": 2079} {"train_loss": -23.511390686035156, "global_step": 172609, "epoch": 2079} {"train_loss": -23.76355743408203, "global_step": 172610, "epoch": 2079} {"train_loss": -23.851587295532227, "global_step": 172611, "epoch": 2079} {"train_loss": -23.60951805114746, "global_step": 172612, "epoch": 2079} {"train_loss": -23.526777267456055, "global_step": 172613, "epoch": 2079} {"train_loss": -23.795246124267578, "global_step": 172614, "epoch": 2079} {"train_loss": -23.629674911499023, "global_step": 172615, "epoch": 2079} {"train_loss": -23.483509063720703, "global_step": 172616, "epoch": 2079} {"train_loss": -23.72808837890625, "global_step": 172617, "epoch": 2079} {"train_loss": -23.911481857299805, "global_step": 172618, "epoch": 2079} {"train_loss": -23.77902603149414, "global_step": 172619, "epoch": 2079} {"train_loss": -23.952932357788086, "global_step": 172620, "epoch": 2079} {"train_loss": -23.50270652770996, "global_step": 172621, "epoch": 2079} {"train_loss": -23.945388793945312, "global_step": 172622, "epoch": 2079} {"train_loss": -23.688016891479492, "global_step": 172623, "epoch": 2079} {"train_loss": -23.933238983154297, "global_step": 172624, "epoch": 2079} {"train_loss": -23.858110427856445, "global_step": 172625, "epoch": 2079} {"train_loss": -23.639326095581055, "global_step": 172626, "epoch": 2079} {"train_loss": -24.02521514892578, "global_step": 172627, "epoch": 2079} {"train_loss": -23.972017288208008, "global_step": 172628, "epoch": 2079} {"train_loss": -23.740209579467773, "global_step": 172629, "epoch": 2079} {"train_loss": -23.661706924438477, "global_step": 172630, "epoch": 2079} {"train_loss": -23.56355857849121, "global_step": 172631, "epoch": 2079} {"train_loss": -23.276296615600586, "global_step": 172632, "epoch": 2079} {"train_loss": -23.953413009643555, "global_step": 172633, "epoch": 2079} {"train_loss": -23.821659088134766, "global_step": 172634, "epoch": 2079} {"train_loss": -23.800817489624023, "global_step": 172635, "epoch": 2079} {"train_loss": -24.089035034179688, "global_step": 172636, "epoch": 2079} {"train_loss": -23.687271118164062, "global_step": 172637, "epoch": 2079} {"train_loss": -23.89447593688965, "global_step": 172638, "epoch": 2079} {"train_loss": -23.68976013918957, "global_step": 172639, "epoch": 2079, "val_loss": 6586799.5} {"train_loss": -23.105295181274414, "global_step": 172640, "epoch": 2080} {"train_loss": -22.924060821533203, "global_step": 172641, "epoch": 2080} {"train_loss": -23.119497299194336, "global_step": 172642, "epoch": 2080} {"train_loss": -23.382583618164062, "global_step": 172643, "epoch": 2080} {"train_loss": -23.136621475219727, "global_step": 172644, "epoch": 2080} {"train_loss": -23.261856079101562, "global_step": 172645, "epoch": 2080} {"train_loss": -23.51651954650879, "global_step": 172646, "epoch": 2080} {"train_loss": -23.190271377563477, "global_step": 172647, "epoch": 2080} {"train_loss": -23.273305892944336, "global_step": 172648, "epoch": 2080} {"train_loss": -23.917688369750977, "global_step": 172649, "epoch": 2080} {"train_loss": -23.532255172729492, "global_step": 172650, "epoch": 2080} {"train_loss": -23.311325073242188, "global_step": 172651, "epoch": 2080} {"train_loss": -23.519851684570312, "global_step": 172652, "epoch": 2080} {"train_loss": -23.34566879272461, "global_step": 172653, "epoch": 2080} {"train_loss": -23.446104049682617, "global_step": 172654, "epoch": 2080} {"train_loss": -23.68824005126953, "global_step": 172655, "epoch": 2080} {"train_loss": -23.664020538330078, "global_step": 172656, "epoch": 2080} {"train_loss": -23.39948081970215, "global_step": 172657, "epoch": 2080} {"train_loss": -23.557720184326172, "global_step": 172658, "epoch": 2080} {"train_loss": -24.008581161499023, "global_step": 172659, "epoch": 2080} {"train_loss": -23.775115966796875, "global_step": 172660, "epoch": 2080} {"train_loss": -23.558382034301758, "global_step": 172661, "epoch": 2080} {"train_loss": -23.488134384155273, "global_step": 172662, "epoch": 2080} {"train_loss": -23.480789184570312, "global_step": 172663, "epoch": 2080} {"train_loss": -23.80547332763672, "global_step": 172664, "epoch": 2080} {"train_loss": -23.59235191345215, "global_step": 172665, "epoch": 2080} {"train_loss": -23.493738174438477, "global_step": 172666, "epoch": 2080} {"train_loss": -23.51251220703125, "global_step": 172667, "epoch": 2080} {"train_loss": -23.63559913635254, "global_step": 172668, "epoch": 2080} {"train_loss": -23.939998626708984, "global_step": 172669, "epoch": 2080} {"train_loss": -23.67197608947754, "global_step": 172670, "epoch": 2080} {"train_loss": -23.78273582458496, "global_step": 172671, "epoch": 2080} {"train_loss": -23.77847671508789, "global_step": 172672, "epoch": 2080} {"train_loss": -23.889684677124023, "global_step": 172673, "epoch": 2080} {"train_loss": -23.82942771911621, "global_step": 172674, "epoch": 2080} {"train_loss": -24.054075241088867, "global_step": 172675, "epoch": 2080} {"train_loss": -23.581344604492188, "global_step": 172676, "epoch": 2080} {"train_loss": -23.889596939086914, "global_step": 172677, "epoch": 2080} {"train_loss": -23.884231567382812, "global_step": 172678, "epoch": 2080} {"train_loss": -23.722558975219727, "global_step": 172679, "epoch": 2080} {"train_loss": -23.896547317504883, "global_step": 172680, "epoch": 2080} {"train_loss": -23.971622467041016, "global_step": 172681, "epoch": 2080} {"train_loss": -23.827411651611328, "global_step": 172682, "epoch": 2080} {"train_loss": -23.64923667907715, "global_step": 172683, "epoch": 2080} {"train_loss": -23.702335357666016, "global_step": 172684, "epoch": 2080} {"train_loss": -23.954442977905273, "global_step": 172685, "epoch": 2080} {"train_loss": -23.84656524658203, "global_step": 172686, "epoch": 2080} {"train_loss": -24.152395248413086, "global_step": 172687, "epoch": 2080} {"train_loss": -24.00098991394043, "global_step": 172688, "epoch": 2080} {"train_loss": -23.66022300720215, "global_step": 172689, "epoch": 2080} {"train_loss": -23.85810661315918, "global_step": 172690, "epoch": 2080} {"train_loss": -23.79981231689453, "global_step": 172691, "epoch": 2080} {"train_loss": -23.863842010498047, "global_step": 172692, "epoch": 2080} {"train_loss": -23.806509017944336, "global_step": 172693, "epoch": 2080} {"train_loss": -23.578227996826172, "global_step": 172694, "epoch": 2080} {"train_loss": -23.946876525878906, "global_step": 172695, "epoch": 2080} {"train_loss": -23.71552276611328, "global_step": 172696, "epoch": 2080} {"train_loss": -23.979928970336914, "global_step": 172697, "epoch": 2080} {"train_loss": -23.682836532592773, "global_step": 172698, "epoch": 2080} {"train_loss": -23.882282257080078, "global_step": 172699, "epoch": 2080} {"train_loss": -23.86257553100586, "global_step": 172700, "epoch": 2080} {"train_loss": -23.580469131469727, "global_step": 172701, "epoch": 2080} {"train_loss": -23.64159393310547, "global_step": 172702, "epoch": 2080} {"train_loss": -23.949024200439453, "global_step": 172703, "epoch": 2080} {"train_loss": -23.971837997436523, "global_step": 172704, "epoch": 2080} {"train_loss": -24.04545021057129, "global_step": 172705, "epoch": 2080} {"train_loss": -23.94340705871582, "global_step": 172706, "epoch": 2080} {"train_loss": -23.799907684326172, "global_step": 172707, "epoch": 2080} {"train_loss": -23.976110458374023, "global_step": 172708, "epoch": 2080} {"train_loss": -23.81500244140625, "global_step": 172709, "epoch": 2080} {"train_loss": -23.608442306518555, "global_step": 172710, "epoch": 2080} {"train_loss": -23.797962188720703, "global_step": 172711, "epoch": 2080} {"train_loss": -23.74991226196289, "global_step": 172712, "epoch": 2080} {"train_loss": -23.781728744506836, "global_step": 172713, "epoch": 2080} {"train_loss": -24.20398712158203, "global_step": 172714, "epoch": 2080} {"train_loss": -24.117921829223633, "global_step": 172715, "epoch": 2080} {"train_loss": -23.788959503173828, "global_step": 172716, "epoch": 2080} {"train_loss": -23.676647186279297, "global_step": 172717, "epoch": 2080} {"train_loss": -23.708799362182617, "global_step": 172718, "epoch": 2080} {"train_loss": -23.58732795715332, "global_step": 172719, "epoch": 2080} {"train_loss": -23.579360961914062, "global_step": 172720, "epoch": 2080} {"train_loss": -23.353513717651367, "global_step": 172721, "epoch": 2080} {"train_loss": -23.70178496119488, "global_step": 172722, "epoch": 2080, "val_loss": 6350401.5} {"train_loss": -22.44486427307129, "global_step": 172723, "epoch": 2081} {"train_loss": -21.98278045654297, "global_step": 172724, "epoch": 2081} {"train_loss": -22.345746994018555, "global_step": 172725, "epoch": 2081} {"train_loss": -23.743173599243164, "global_step": 172726, "epoch": 2081} {"train_loss": -22.729522705078125, "global_step": 172727, "epoch": 2081} {"train_loss": -23.638090133666992, "global_step": 172728, "epoch": 2081} {"train_loss": -22.933683395385742, "global_step": 172729, "epoch": 2081} {"train_loss": -23.442659378051758, "global_step": 172730, "epoch": 2081} {"train_loss": -23.382137298583984, "global_step": 172731, "epoch": 2081} {"train_loss": -23.083593368530273, "global_step": 172732, "epoch": 2081} {"train_loss": -23.395862579345703, "global_step": 172733, "epoch": 2081} {"train_loss": -23.46658706665039, "global_step": 172734, "epoch": 2081} {"train_loss": -23.28879165649414, "global_step": 172735, "epoch": 2081} {"train_loss": -23.345333099365234, "global_step": 172736, "epoch": 2081} {"train_loss": -23.103124618530273, "global_step": 172737, "epoch": 2081} {"train_loss": -23.77474021911621, "global_step": 172738, "epoch": 2081} {"train_loss": -23.387115478515625, "global_step": 172739, "epoch": 2081} {"train_loss": -23.540470123291016, "global_step": 172740, "epoch": 2081} {"train_loss": -23.387964248657227, "global_step": 172741, "epoch": 2081} {"train_loss": -23.52818489074707, "global_step": 172742, "epoch": 2081} {"train_loss": -23.311010360717773, "global_step": 172743, "epoch": 2081} {"train_loss": -23.587526321411133, "global_step": 172744, "epoch": 2081} {"train_loss": -23.35222816467285, "global_step": 172745, "epoch": 2081} {"train_loss": -23.453393936157227, "global_step": 172746, "epoch": 2081} {"train_loss": -23.723968505859375, "global_step": 172747, "epoch": 2081} {"train_loss": -23.315841674804688, "global_step": 172748, "epoch": 2081} {"train_loss": -23.50044822692871, "global_step": 172749, "epoch": 2081} {"train_loss": -23.757699966430664, "global_step": 172750, "epoch": 2081} {"train_loss": -23.57008934020996, "global_step": 172751, "epoch": 2081} {"train_loss": -23.85628890991211, "global_step": 172752, "epoch": 2081} {"train_loss": -23.327207565307617, "global_step": 172753, "epoch": 2081} {"train_loss": -23.87497901916504, "global_step": 172754, "epoch": 2081} {"train_loss": -23.877201080322266, "global_step": 172755, "epoch": 2081} {"train_loss": -24.129945755004883, "global_step": 172756, "epoch": 2081} {"train_loss": -23.885408401489258, "global_step": 172757, "epoch": 2081} {"train_loss": -23.817289352416992, "global_step": 172758, "epoch": 2081} {"train_loss": -24.043563842773438, "global_step": 172759, "epoch": 2081} {"train_loss": -23.66172981262207, "global_step": 172760, "epoch": 2081} {"train_loss": -24.338544845581055, "global_step": 172761, "epoch": 2081} {"train_loss": -23.63431167602539, "global_step": 172762, "epoch": 2081} {"train_loss": -24.09869956970215, "global_step": 172763, "epoch": 2081} {"train_loss": -23.76111602783203, "global_step": 172764, "epoch": 2081} {"train_loss": -24.020734786987305, "global_step": 172765, "epoch": 2081} {"train_loss": -23.764617919921875, "global_step": 172766, "epoch": 2081} {"train_loss": -23.911340713500977, "global_step": 172767, "epoch": 2081} {"train_loss": -23.729206085205078, "global_step": 172768, "epoch": 2081} {"train_loss": -23.621112823486328, "global_step": 172769, "epoch": 2081} {"train_loss": -23.748458862304688, "global_step": 172770, "epoch": 2081} {"train_loss": -23.38263511657715, "global_step": 172771, "epoch": 2081} {"train_loss": -24.32145118713379, "global_step": 172772, "epoch": 2081} {"train_loss": -24.208280563354492, "global_step": 172773, "epoch": 2081} {"train_loss": -23.79249382019043, "global_step": 172774, "epoch": 2081} {"train_loss": -23.851377487182617, "global_step": 172775, "epoch": 2081} {"train_loss": -23.56031036376953, "global_step": 172776, "epoch": 2081} {"train_loss": -23.489553451538086, "global_step": 172777, "epoch": 2081} {"train_loss": -23.751859664916992, "global_step": 172778, "epoch": 2081} {"train_loss": -23.400312423706055, "global_step": 172779, "epoch": 2081} {"train_loss": -23.966176986694336, "global_step": 172780, "epoch": 2081} {"train_loss": -23.503646850585938, "global_step": 172781, "epoch": 2081} {"train_loss": -23.388952255249023, "global_step": 172782, "epoch": 2081} {"train_loss": -23.311922073364258, "global_step": 172783, "epoch": 2081} {"train_loss": -23.68800163269043, "global_step": 172784, "epoch": 2081} {"train_loss": -23.83402442932129, "global_step": 172785, "epoch": 2081} {"train_loss": -23.517271041870117, "global_step": 172786, "epoch": 2081} {"train_loss": -23.79581069946289, "global_step": 172787, "epoch": 2081} {"train_loss": -23.68868637084961, "global_step": 172788, "epoch": 2081} {"train_loss": -23.925495147705078, "global_step": 172789, "epoch": 2081} {"train_loss": -23.74070167541504, "global_step": 172790, "epoch": 2081} {"train_loss": -23.77667808532715, "global_step": 172791, "epoch": 2081} {"train_loss": -23.49989128112793, "global_step": 172792, "epoch": 2081} {"train_loss": -23.727041244506836, "global_step": 172793, "epoch": 2081} {"train_loss": -23.721426010131836, "global_step": 172794, "epoch": 2081} {"train_loss": -23.62006950378418, "global_step": 172795, "epoch": 2081} {"train_loss": -23.785629272460938, "global_step": 172796, "epoch": 2081} {"train_loss": -23.480493545532227, "global_step": 172797, "epoch": 2081} {"train_loss": -24.12154197692871, "global_step": 172798, "epoch": 2081} {"train_loss": -23.72559928894043, "global_step": 172799, "epoch": 2081} {"train_loss": -24.189544677734375, "global_step": 172800, "epoch": 2081} {"train_loss": -23.564529418945312, "global_step": 172801, "epoch": 2081} {"train_loss": -24.18561363220215, "global_step": 172802, "epoch": 2081} {"train_loss": -23.893537521362305, "global_step": 172803, "epoch": 2081} {"train_loss": -23.983556747436523, "global_step": 172804, "epoch": 2081} {"train_loss": -23.61549306203084, "global_step": 172805, "epoch": 2081, "val_loss": 6609107.0} {"train_loss": -23.254819869995117, "global_step": 172806, "epoch": 2082} {"train_loss": -22.378271102905273, "global_step": 172807, "epoch": 2082} {"train_loss": -22.87190818786621, "global_step": 172808, "epoch": 2082} {"train_loss": -23.190946578979492, "global_step": 172809, "epoch": 2082} {"train_loss": -23.595075607299805, "global_step": 172810, "epoch": 2082} {"train_loss": -23.326017379760742, "global_step": 172811, "epoch": 2082} {"train_loss": -23.519733428955078, "global_step": 172812, "epoch": 2082} {"train_loss": -23.551420211791992, "global_step": 172813, "epoch": 2082} {"train_loss": -23.412425994873047, "global_step": 172814, "epoch": 2082} {"train_loss": -23.51041030883789, "global_step": 172815, "epoch": 2082} {"train_loss": -23.240671157836914, "global_step": 172816, "epoch": 2082} {"train_loss": -22.86707878112793, "global_step": 172817, "epoch": 2082} {"train_loss": -23.355466842651367, "global_step": 172818, "epoch": 2082} {"train_loss": -23.397558212280273, "global_step": 172819, "epoch": 2082} {"train_loss": -23.75441551208496, "global_step": 172820, "epoch": 2082} {"train_loss": -23.153295516967773, "global_step": 172821, "epoch": 2082} {"train_loss": -23.928659439086914, "global_step": 172822, "epoch": 2082} {"train_loss": -23.495758056640625, "global_step": 172823, "epoch": 2082} {"train_loss": -23.392044067382812, "global_step": 172824, "epoch": 2082} {"train_loss": -23.37007713317871, "global_step": 172825, "epoch": 2082} {"train_loss": -23.41878318786621, "global_step": 172826, "epoch": 2082} {"train_loss": -23.410663604736328, "global_step": 172827, "epoch": 2082} {"train_loss": -23.349821090698242, "global_step": 172828, "epoch": 2082} {"train_loss": -23.523107528686523, "global_step": 172829, "epoch": 2082} {"train_loss": -23.819915771484375, "global_step": 172830, "epoch": 2082} {"train_loss": -23.241622924804688, "global_step": 172831, "epoch": 2082} {"train_loss": -23.62747573852539, "global_step": 172832, "epoch": 2082} {"train_loss": -23.71466827392578, "global_step": 172833, "epoch": 2082} {"train_loss": -23.60702896118164, "global_step": 172834, "epoch": 2082} {"train_loss": -24.090070724487305, "global_step": 172835, "epoch": 2082} {"train_loss": -23.729583740234375, "global_step": 172836, "epoch": 2082} {"train_loss": -23.7724666595459, "global_step": 172837, "epoch": 2082} {"train_loss": -23.703449249267578, "global_step": 172838, "epoch": 2082} {"train_loss": -24.013914108276367, "global_step": 172839, "epoch": 2082} {"train_loss": -23.903772354125977, "global_step": 172840, "epoch": 2082} {"train_loss": -24.170169830322266, "global_step": 172841, "epoch": 2082} {"train_loss": -23.77768325805664, "global_step": 172842, "epoch": 2082} {"train_loss": -23.892658233642578, "global_step": 172843, "epoch": 2082} {"train_loss": -23.807941436767578, "global_step": 172844, "epoch": 2082} {"train_loss": -23.983461380004883, "global_step": 172845, "epoch": 2082} {"train_loss": -23.4910831451416, "global_step": 172846, "epoch": 2082} {"train_loss": -23.852157592773438, "global_step": 172847, "epoch": 2082} {"train_loss": -23.51787757873535, "global_step": 172848, "epoch": 2082} {"train_loss": -23.686729431152344, "global_step": 172849, "epoch": 2082} {"train_loss": -23.727142333984375, "global_step": 172850, "epoch": 2082} {"train_loss": -24.0477352142334, "global_step": 172851, "epoch": 2082} {"train_loss": -23.917333602905273, "global_step": 172852, "epoch": 2082} {"train_loss": -23.510534286499023, "global_step": 172853, "epoch": 2082} {"train_loss": -23.43422508239746, "global_step": 172854, "epoch": 2082} {"train_loss": -23.969881057739258, "global_step": 172855, "epoch": 2082} {"train_loss": -24.317916870117188, "global_step": 172856, "epoch": 2082} {"train_loss": -23.556095123291016, "global_step": 172857, "epoch": 2082} {"train_loss": -23.71295166015625, "global_step": 172858, "epoch": 2082} {"train_loss": -23.61439323425293, "global_step": 172859, "epoch": 2082} {"train_loss": -23.239463806152344, "global_step": 172860, "epoch": 2082} {"train_loss": -23.332929611206055, "global_step": 172861, "epoch": 2082} {"train_loss": -23.809961318969727, "global_step": 172862, "epoch": 2082} {"train_loss": -24.019603729248047, "global_step": 172863, "epoch": 2082} {"train_loss": -23.314716339111328, "global_step": 172864, "epoch": 2082} {"train_loss": -23.572002410888672, "global_step": 172865, "epoch": 2082} {"train_loss": -23.870695114135742, "global_step": 172866, "epoch": 2082} {"train_loss": -23.95370864868164, "global_step": 172867, "epoch": 2082} {"train_loss": -23.42838478088379, "global_step": 172868, "epoch": 2082} {"train_loss": -23.844717025756836, "global_step": 172869, "epoch": 2082} {"train_loss": -23.560436248779297, "global_step": 172870, "epoch": 2082} {"train_loss": -23.438928604125977, "global_step": 172871, "epoch": 2082} {"train_loss": -23.804258346557617, "global_step": 172872, "epoch": 2082} {"train_loss": -23.28572654724121, "global_step": 172873, "epoch": 2082} {"train_loss": -23.77650260925293, "global_step": 172874, "epoch": 2082} {"train_loss": -23.509679794311523, "global_step": 172875, "epoch": 2082} {"train_loss": -23.655553817749023, "global_step": 172876, "epoch": 2082} {"train_loss": -23.283689498901367, "global_step": 172877, "epoch": 2082} {"train_loss": -23.614704132080078, "global_step": 172878, "epoch": 2082} {"train_loss": -23.725889205932617, "global_step": 172879, "epoch": 2082} {"train_loss": -23.271211624145508, "global_step": 172880, "epoch": 2082} {"train_loss": -23.776514053344727, "global_step": 172881, "epoch": 2082} {"train_loss": -23.704023361206055, "global_step": 172882, "epoch": 2082} {"train_loss": -23.655866622924805, "global_step": 172883, "epoch": 2082} {"train_loss": -23.93404197692871, "global_step": 172884, "epoch": 2082} {"train_loss": -23.66158103942871, "global_step": 172885, "epoch": 2082} {"train_loss": -23.880313873291016, "global_step": 172886, "epoch": 2082} {"train_loss": -23.74863052368164, "global_step": 172887, "epoch": 2082} {"train_loss": -23.591635646590266, "global_step": 172888, "epoch": 2082, "val_loss": 6409331.0} {"train_loss": -23.6971492767334, "global_step": 172889, "epoch": 2083} {"train_loss": -23.479236602783203, "global_step": 172890, "epoch": 2083} {"train_loss": -23.228208541870117, "global_step": 172891, "epoch": 2083} {"train_loss": -23.657262802124023, "global_step": 172892, "epoch": 2083} {"train_loss": -23.695575714111328, "global_step": 172893, "epoch": 2083} {"train_loss": -23.606468200683594, "global_step": 172894, "epoch": 2083} {"train_loss": -23.29378318786621, "global_step": 172895, "epoch": 2083} {"train_loss": -23.564207077026367, "global_step": 172896, "epoch": 2083} {"train_loss": -23.622262954711914, "global_step": 172897, "epoch": 2083} {"train_loss": -23.82037925720215, "global_step": 172898, "epoch": 2083} {"train_loss": -23.2884578704834, "global_step": 172899, "epoch": 2083} {"train_loss": -23.651779174804688, "global_step": 172900, "epoch": 2083} {"train_loss": -23.97414207458496, "global_step": 172901, "epoch": 2083} {"train_loss": -23.281631469726562, "global_step": 172902, "epoch": 2083} {"train_loss": -23.652902603149414, "global_step": 172903, "epoch": 2083} {"train_loss": -23.953327178955078, "global_step": 172904, "epoch": 2083} {"train_loss": -23.85209083557129, "global_step": 172905, "epoch": 2083} {"train_loss": -23.796615600585938, "global_step": 172906, "epoch": 2083} {"train_loss": -23.967247009277344, "global_step": 172907, "epoch": 2083} {"train_loss": -23.775991439819336, "global_step": 172908, "epoch": 2083} {"train_loss": -23.662267684936523, "global_step": 172909, "epoch": 2083} {"train_loss": -23.629045486450195, "global_step": 172910, "epoch": 2083} {"train_loss": -23.669599533081055, "global_step": 172911, "epoch": 2083} {"train_loss": -23.360828399658203, "global_step": 172912, "epoch": 2083} {"train_loss": -23.553539276123047, "global_step": 172913, "epoch": 2083} {"train_loss": -23.286346435546875, "global_step": 172914, "epoch": 2083} {"train_loss": -23.89658546447754, "global_step": 172915, "epoch": 2083} {"train_loss": -23.66078758239746, "global_step": 172916, "epoch": 2083} {"train_loss": -24.080718994140625, "global_step": 172917, "epoch": 2083} {"train_loss": -23.86664581298828, "global_step": 172918, "epoch": 2083} {"train_loss": -23.891910552978516, "global_step": 172919, "epoch": 2083} {"train_loss": -23.567100524902344, "global_step": 172920, "epoch": 2083} {"train_loss": -23.84769058227539, "global_step": 172921, "epoch": 2083} {"train_loss": -23.50667381286621, "global_step": 172922, "epoch": 2083} {"train_loss": -23.90419578552246, "global_step": 172923, "epoch": 2083} {"train_loss": -23.968992233276367, "global_step": 172924, "epoch": 2083} {"train_loss": -24.01173210144043, "global_step": 172925, "epoch": 2083} {"train_loss": -23.8673095703125, "global_step": 172926, "epoch": 2083} {"train_loss": -24.0533447265625, "global_step": 172927, "epoch": 2083} {"train_loss": -23.795757293701172, "global_step": 172928, "epoch": 2083} {"train_loss": -23.792499542236328, "global_step": 172929, "epoch": 2083} {"train_loss": -23.516056060791016, "global_step": 172930, "epoch": 2083} {"train_loss": -23.955123901367188, "global_step": 172931, "epoch": 2083} {"train_loss": -23.510818481445312, "global_step": 172932, "epoch": 2083} {"train_loss": -23.502933502197266, "global_step": 172933, "epoch": 2083} {"train_loss": -23.871627807617188, "global_step": 172934, "epoch": 2083} {"train_loss": -24.062284469604492, "global_step": 172935, "epoch": 2083} {"train_loss": -24.146438598632812, "global_step": 172936, "epoch": 2083} {"train_loss": -23.656991958618164, "global_step": 172937, "epoch": 2083} {"train_loss": -23.974241256713867, "global_step": 172938, "epoch": 2083} {"train_loss": -23.896787643432617, "global_step": 172939, "epoch": 2083} {"train_loss": -23.43308448791504, "global_step": 172940, "epoch": 2083} {"train_loss": -23.701126098632812, "global_step": 172941, "epoch": 2083} {"train_loss": -23.951391220092773, "global_step": 172942, "epoch": 2083} {"train_loss": -23.606403350830078, "global_step": 172943, "epoch": 2083} {"train_loss": -24.003660202026367, "global_step": 172944, "epoch": 2083} {"train_loss": -23.885051727294922, "global_step": 172945, "epoch": 2083} {"train_loss": -23.980154037475586, "global_step": 172946, "epoch": 2083} {"train_loss": -23.624034881591797, "global_step": 172947, "epoch": 2083} {"train_loss": -23.805301666259766, "global_step": 172948, "epoch": 2083} {"train_loss": -24.046850204467773, "global_step": 172949, "epoch": 2083} {"train_loss": -23.903200149536133, "global_step": 172950, "epoch": 2083} {"train_loss": -23.972549438476562, "global_step": 172951, "epoch": 2083} {"train_loss": -23.96668815612793, "global_step": 172952, "epoch": 2083} {"train_loss": -23.792041778564453, "global_step": 172953, "epoch": 2083} {"train_loss": -23.82027816772461, "global_step": 172954, "epoch": 2083} {"train_loss": -23.456214904785156, "global_step": 172955, "epoch": 2083} {"train_loss": -24.042327880859375, "global_step": 172956, "epoch": 2083} {"train_loss": -23.6225643157959, "global_step": 172957, "epoch": 2083} {"train_loss": -23.56280517578125, "global_step": 172958, "epoch": 2083} {"train_loss": -23.75635528564453, "global_step": 172959, "epoch": 2083} {"train_loss": -24.111852645874023, "global_step": 172960, "epoch": 2083} {"train_loss": -23.72892951965332, "global_step": 172961, "epoch": 2083} {"train_loss": -23.87444496154785, "global_step": 172962, "epoch": 2083} {"train_loss": -23.891496658325195, "global_step": 172963, "epoch": 2083} {"train_loss": -23.599905014038086, "global_step": 172964, "epoch": 2083} {"train_loss": -23.645105361938477, "global_step": 172965, "epoch": 2083} {"train_loss": -23.831817626953125, "global_step": 172966, "epoch": 2083} {"train_loss": -24.083044052124023, "global_step": 172967, "epoch": 2083} {"train_loss": -23.90723419189453, "global_step": 172968, "epoch": 2083} {"train_loss": -24.275659561157227, "global_step": 172969, "epoch": 2083} {"train_loss": -23.580575942993164, "global_step": 172970, "epoch": 2083} {"train_loss": -23.767903109630907, "global_step": 172971, "epoch": 2083, "val_loss": 6519676.0} {"train_loss": -23.417783737182617, "global_step": 172972, "epoch": 2084} {"train_loss": -23.082183837890625, "global_step": 172973, "epoch": 2084} {"train_loss": -23.079145431518555, "global_step": 172974, "epoch": 2084} {"train_loss": -23.983154296875, "global_step": 172975, "epoch": 2084} {"train_loss": -23.53143310546875, "global_step": 172976, "epoch": 2084} {"train_loss": -22.755905151367188, "global_step": 172977, "epoch": 2084} {"train_loss": -23.0572566986084, "global_step": 172978, "epoch": 2084} {"train_loss": -23.762226104736328, "global_step": 172979, "epoch": 2084} {"train_loss": -23.04377555847168, "global_step": 172980, "epoch": 2084} {"train_loss": -23.68315315246582, "global_step": 172981, "epoch": 2084} {"train_loss": -23.338457107543945, "global_step": 172982, "epoch": 2084} {"train_loss": -23.56022071838379, "global_step": 172983, "epoch": 2084} {"train_loss": -23.415130615234375, "global_step": 172984, "epoch": 2084} {"train_loss": -23.711828231811523, "global_step": 172985, "epoch": 2084} {"train_loss": -23.517213821411133, "global_step": 172986, "epoch": 2084} {"train_loss": -23.317890167236328, "global_step": 172987, "epoch": 2084} {"train_loss": -23.18983268737793, "global_step": 172988, "epoch": 2084} {"train_loss": -23.500486373901367, "global_step": 172989, "epoch": 2084} {"train_loss": -23.548582077026367, "global_step": 172990, "epoch": 2084} {"train_loss": -23.54576873779297, "global_step": 172991, "epoch": 2084} {"train_loss": -23.891769409179688, "global_step": 172992, "epoch": 2084} {"train_loss": -23.57309913635254, "global_step": 172993, "epoch": 2084} {"train_loss": -23.576297760009766, "global_step": 172994, "epoch": 2084} {"train_loss": -23.76694679260254, "global_step": 172995, "epoch": 2084} {"train_loss": -23.953388214111328, "global_step": 172996, "epoch": 2084} {"train_loss": -23.511037826538086, "global_step": 172997, "epoch": 2084} {"train_loss": -23.675830841064453, "global_step": 172998, "epoch": 2084} {"train_loss": -23.69771385192871, "global_step": 172999, "epoch": 2084} {"train_loss": -23.58829116821289, "global_step": 173000, "epoch": 2084} {"train_loss": -23.652708053588867, "global_step": 173001, "epoch": 2084} {"train_loss": -23.70643424987793, "global_step": 173002, "epoch": 2084} {"train_loss": -23.812007904052734, "global_step": 173003, "epoch": 2084} {"train_loss": -23.660491943359375, "global_step": 173004, "epoch": 2084} {"train_loss": -23.660385131835938, "global_step": 173005, "epoch": 2084} {"train_loss": -23.389934539794922, "global_step": 173006, "epoch": 2084} {"train_loss": -23.5859432220459, "global_step": 173007, "epoch": 2084} {"train_loss": -23.617334365844727, "global_step": 173008, "epoch": 2084} {"train_loss": -23.68659019470215, "global_step": 173009, "epoch": 2084} {"train_loss": -23.86159896850586, "global_step": 173010, "epoch": 2084} {"train_loss": -23.4945125579834, "global_step": 173011, "epoch": 2084} {"train_loss": -23.47100830078125, "global_step": 173012, "epoch": 2084} {"train_loss": -23.786672592163086, "global_step": 173013, "epoch": 2084} {"train_loss": -23.886762619018555, "global_step": 173014, "epoch": 2084} {"train_loss": -23.539548873901367, "global_step": 173015, "epoch": 2084} {"train_loss": -23.34427261352539, "global_step": 173016, "epoch": 2084} {"train_loss": -23.774150848388672, "global_step": 173017, "epoch": 2084} {"train_loss": -23.691238403320312, "global_step": 173018, "epoch": 2084} {"train_loss": -23.578594207763672, "global_step": 173019, "epoch": 2084} {"train_loss": -23.564977645874023, "global_step": 173020, "epoch": 2084} {"train_loss": -24.035865783691406, "global_step": 173021, "epoch": 2084} {"train_loss": -23.607990264892578, "global_step": 173022, "epoch": 2084} {"train_loss": -24.050365447998047, "global_step": 173023, "epoch": 2084} {"train_loss": -23.81937026977539, "global_step": 173024, "epoch": 2084} {"train_loss": -23.685827255249023, "global_step": 173025, "epoch": 2084} {"train_loss": -24.049673080444336, "global_step": 173026, "epoch": 2084} {"train_loss": -23.517127990722656, "global_step": 173027, "epoch": 2084} {"train_loss": -23.928220748901367, "global_step": 173028, "epoch": 2084} {"train_loss": -23.391626358032227, "global_step": 173029, "epoch": 2084} {"train_loss": -23.861873626708984, "global_step": 173030, "epoch": 2084} {"train_loss": -23.723691940307617, "global_step": 173031, "epoch": 2084} {"train_loss": -23.7613525390625, "global_step": 173032, "epoch": 2084} {"train_loss": -23.78578758239746, "global_step": 173033, "epoch": 2084} {"train_loss": -23.687469482421875, "global_step": 173034, "epoch": 2084} {"train_loss": -23.976232528686523, "global_step": 173035, "epoch": 2084} {"train_loss": -23.657331466674805, "global_step": 173036, "epoch": 2084} {"train_loss": -23.302589416503906, "global_step": 173037, "epoch": 2084} {"train_loss": -23.760698318481445, "global_step": 173038, "epoch": 2084} {"train_loss": -23.5135498046875, "global_step": 173039, "epoch": 2084} {"train_loss": -24.016233444213867, "global_step": 173040, "epoch": 2084} {"train_loss": -23.5664005279541, "global_step": 173041, "epoch": 2084} {"train_loss": -23.765073776245117, "global_step": 173042, "epoch": 2084} {"train_loss": -23.444137573242188, "global_step": 173043, "epoch": 2084} {"train_loss": -23.938806533813477, "global_step": 173044, "epoch": 2084} {"train_loss": -23.640426635742188, "global_step": 173045, "epoch": 2084} {"train_loss": -23.83941650390625, "global_step": 173046, "epoch": 2084} {"train_loss": -23.804996490478516, "global_step": 173047, "epoch": 2084} {"train_loss": -23.93600845336914, "global_step": 173048, "epoch": 2084} {"train_loss": -23.669660568237305, "global_step": 173049, "epoch": 2084} {"train_loss": -23.48638343811035, "global_step": 173050, "epoch": 2084} {"train_loss": -23.788612365722656, "global_step": 173051, "epoch": 2084} {"train_loss": -24.026416778564453, "global_step": 173052, "epoch": 2084} {"train_loss": -23.984891891479492, "global_step": 173053, "epoch": 2084} {"train_loss": -23.65539504821042, "global_step": 173054, "epoch": 2084, "val_loss": 6382507.0} {"train_loss": -23.46510124206543, "global_step": 173055, "epoch": 2085} {"train_loss": -23.251291275024414, "global_step": 173056, "epoch": 2085} {"train_loss": -23.087261199951172, "global_step": 173057, "epoch": 2085} {"train_loss": -23.669052124023438, "global_step": 173058, "epoch": 2085} {"train_loss": -23.46734619140625, "global_step": 173059, "epoch": 2085} {"train_loss": -23.30234718322754, "global_step": 173060, "epoch": 2085} {"train_loss": -23.107894897460938, "global_step": 173061, "epoch": 2085} {"train_loss": -23.94889259338379, "global_step": 173062, "epoch": 2085} {"train_loss": -23.01388931274414, "global_step": 173063, "epoch": 2085} {"train_loss": -23.338834762573242, "global_step": 173064, "epoch": 2085} {"train_loss": -23.207103729248047, "global_step": 173065, "epoch": 2085} {"train_loss": -23.953367233276367, "global_step": 173066, "epoch": 2085} {"train_loss": -23.346773147583008, "global_step": 173067, "epoch": 2085} {"train_loss": -23.49259376525879, "global_step": 173068, "epoch": 2085} {"train_loss": -23.161548614501953, "global_step": 173069, "epoch": 2085} {"train_loss": -23.5862979888916, "global_step": 173070, "epoch": 2085} {"train_loss": -23.85818099975586, "global_step": 173071, "epoch": 2085} {"train_loss": -23.219785690307617, "global_step": 173072, "epoch": 2085} {"train_loss": -23.791105270385742, "global_step": 173073, "epoch": 2085} {"train_loss": -23.56760597229004, "global_step": 173074, "epoch": 2085} {"train_loss": -23.656158447265625, "global_step": 173075, "epoch": 2085} {"train_loss": -23.53876495361328, "global_step": 173076, "epoch": 2085} {"train_loss": -23.615549087524414, "global_step": 173077, "epoch": 2085} {"train_loss": -23.788745880126953, "global_step": 173078, "epoch": 2085} {"train_loss": -23.74269676208496, "global_step": 173079, "epoch": 2085} {"train_loss": -23.122182846069336, "global_step": 173080, "epoch": 2085} {"train_loss": -23.580224990844727, "global_step": 173081, "epoch": 2085} {"train_loss": -23.76422691345215, "global_step": 173082, "epoch": 2085} {"train_loss": -23.48164939880371, "global_step": 173083, "epoch": 2085} {"train_loss": -23.724441528320312, "global_step": 173084, "epoch": 2085} {"train_loss": -23.854896545410156, "global_step": 173085, "epoch": 2085} {"train_loss": -23.607437133789062, "global_step": 173086, "epoch": 2085} {"train_loss": -23.584217071533203, "global_step": 173087, "epoch": 2085} {"train_loss": -23.53267478942871, "global_step": 173088, "epoch": 2085} {"train_loss": -23.806241989135742, "global_step": 173089, "epoch": 2085} {"train_loss": -23.430335998535156, "global_step": 173090, "epoch": 2085} {"train_loss": -23.93452262878418, "global_step": 173091, "epoch": 2085} {"train_loss": -23.886594772338867, "global_step": 173092, "epoch": 2085} {"train_loss": -23.384653091430664, "global_step": 173093, "epoch": 2085} {"train_loss": -23.802255630493164, "global_step": 173094, "epoch": 2085} {"train_loss": -23.751529693603516, "global_step": 173095, "epoch": 2085} {"train_loss": -23.7624454498291, "global_step": 173096, "epoch": 2085} {"train_loss": -23.950542449951172, "global_step": 173097, "epoch": 2085} {"train_loss": -23.811477661132812, "global_step": 173098, "epoch": 2085} {"train_loss": -24.02086067199707, "global_step": 173099, "epoch": 2085} {"train_loss": -23.816543579101562, "global_step": 173100, "epoch": 2085} {"train_loss": -24.028240203857422, "global_step": 173101, "epoch": 2085} {"train_loss": -24.046695709228516, "global_step": 173102, "epoch": 2085} {"train_loss": -23.82906150817871, "global_step": 173103, "epoch": 2085} {"train_loss": -23.803510665893555, "global_step": 173104, "epoch": 2085} {"train_loss": -23.897672653198242, "global_step": 173105, "epoch": 2085} {"train_loss": -23.685049057006836, "global_step": 173106, "epoch": 2085} {"train_loss": -24.003202438354492, "global_step": 173107, "epoch": 2085} {"train_loss": -24.040372848510742, "global_step": 173108, "epoch": 2085} {"train_loss": -23.92563819885254, "global_step": 173109, "epoch": 2085} {"train_loss": -24.037616729736328, "global_step": 173110, "epoch": 2085} {"train_loss": -23.82756805419922, "global_step": 173111, "epoch": 2085} {"train_loss": -24.041418075561523, "global_step": 173112, "epoch": 2085} {"train_loss": -24.153709411621094, "global_step": 173113, "epoch": 2085} {"train_loss": -23.701496124267578, "global_step": 173114, "epoch": 2085} {"train_loss": -24.350555419921875, "global_step": 173115, "epoch": 2085} {"train_loss": -23.724504470825195, "global_step": 173116, "epoch": 2085} {"train_loss": -23.73946189880371, "global_step": 173117, "epoch": 2085} {"train_loss": -23.849721908569336, "global_step": 173118, "epoch": 2085} {"train_loss": -23.658517837524414, "global_step": 173119, "epoch": 2085} {"train_loss": -23.29982566833496, "global_step": 173120, "epoch": 2085} {"train_loss": -23.968564987182617, "global_step": 173121, "epoch": 2085} {"train_loss": -23.957611083984375, "global_step": 173122, "epoch": 2085} {"train_loss": -23.828044891357422, "global_step": 173123, "epoch": 2085} {"train_loss": -23.608112335205078, "global_step": 173124, "epoch": 2085} {"train_loss": -23.76706886291504, "global_step": 173125, "epoch": 2085} {"train_loss": -24.029211044311523, "global_step": 173126, "epoch": 2085} {"train_loss": -23.549392700195312, "global_step": 173127, "epoch": 2085} {"train_loss": -23.820905685424805, "global_step": 173128, "epoch": 2085} {"train_loss": -23.878997802734375, "global_step": 173129, "epoch": 2085} {"train_loss": -23.913776397705078, "global_step": 173130, "epoch": 2085} {"train_loss": -23.758377075195312, "global_step": 173131, "epoch": 2085} {"train_loss": -24.171239852905273, "global_step": 173132, "epoch": 2085} {"train_loss": -23.694517135620117, "global_step": 173133, "epoch": 2085} {"train_loss": -24.10221290588379, "global_step": 173134, "epoch": 2085} {"train_loss": -24.03948211669922, "global_step": 173135, "epoch": 2085} {"train_loss": -24.02821922302246, "global_step": 173136, "epoch": 2085} {"train_loss": -23.723408136023096, "global_step": 173137, "epoch": 2085, "val_loss": 6304485.0} {"train_loss": -23.58195686340332, "global_step": 173138, "epoch": 2086} {"train_loss": -23.525501251220703, "global_step": 173139, "epoch": 2086} {"train_loss": -23.15989112854004, "global_step": 173140, "epoch": 2086} {"train_loss": -23.39883804321289, "global_step": 173141, "epoch": 2086} {"train_loss": -23.432209014892578, "global_step": 173142, "epoch": 2086} {"train_loss": -23.28580093383789, "global_step": 173143, "epoch": 2086} {"train_loss": -23.558053970336914, "global_step": 173144, "epoch": 2086} {"train_loss": -23.166786193847656, "global_step": 173145, "epoch": 2086} {"train_loss": -23.215084075927734, "global_step": 173146, "epoch": 2086} {"train_loss": -23.36385154724121, "global_step": 173147, "epoch": 2086} {"train_loss": -23.420923233032227, "global_step": 173148, "epoch": 2086} {"train_loss": -23.431095123291016, "global_step": 173149, "epoch": 2086} {"train_loss": -23.753719329833984, "global_step": 173150, "epoch": 2086} {"train_loss": -23.715896606445312, "global_step": 173151, "epoch": 2086} {"train_loss": -23.634275436401367, "global_step": 173152, "epoch": 2086} {"train_loss": -23.648008346557617, "global_step": 173153, "epoch": 2086} {"train_loss": -24.005569458007812, "global_step": 173154, "epoch": 2086} {"train_loss": -23.678791046142578, "global_step": 173155, "epoch": 2086} {"train_loss": -23.530508041381836, "global_step": 173156, "epoch": 2086} {"train_loss": -23.7177791595459, "global_step": 173157, "epoch": 2086} {"train_loss": -23.940656661987305, "global_step": 173158, "epoch": 2086} {"train_loss": -23.906522750854492, "global_step": 173159, "epoch": 2086} {"train_loss": -23.801624298095703, "global_step": 173160, "epoch": 2086} {"train_loss": -23.626508712768555, "global_step": 173161, "epoch": 2086} {"train_loss": -23.957883834838867, "global_step": 173162, "epoch": 2086} {"train_loss": -23.296483993530273, "global_step": 173163, "epoch": 2086} {"train_loss": -23.471057891845703, "global_step": 173164, "epoch": 2086} {"train_loss": -23.896657943725586, "global_step": 173165, "epoch": 2086} {"train_loss": -23.584692001342773, "global_step": 173166, "epoch": 2086} {"train_loss": -23.817054748535156, "global_step": 173167, "epoch": 2086} {"train_loss": -23.712797164916992, "global_step": 173168, "epoch": 2086} {"train_loss": -23.67301368713379, "global_step": 173169, "epoch": 2086} {"train_loss": -23.910682678222656, "global_step": 173170, "epoch": 2086} {"train_loss": -24.112897872924805, "global_step": 173171, "epoch": 2086} {"train_loss": -23.777799606323242, "global_step": 173172, "epoch": 2086} {"train_loss": -23.756778717041016, "global_step": 173173, "epoch": 2086} {"train_loss": -23.534893035888672, "global_step": 173174, "epoch": 2086} {"train_loss": -23.799701690673828, "global_step": 173175, "epoch": 2086} {"train_loss": -23.89874839782715, "global_step": 173176, "epoch": 2086} {"train_loss": -24.25583839416504, "global_step": 173177, "epoch": 2086} {"train_loss": -24.163679122924805, "global_step": 173178, "epoch": 2086} {"train_loss": -23.810962677001953, "global_step": 173179, "epoch": 2086} {"train_loss": -24.309051513671875, "global_step": 173180, "epoch": 2086} {"train_loss": -23.683927536010742, "global_step": 173181, "epoch": 2086} {"train_loss": -23.924577713012695, "global_step": 173182, "epoch": 2086} {"train_loss": -23.706344604492188, "global_step": 173183, "epoch": 2086} {"train_loss": -23.22572135925293, "global_step": 173184, "epoch": 2086} {"train_loss": -23.626567840576172, "global_step": 173185, "epoch": 2086} {"train_loss": -23.602575302124023, "global_step": 173186, "epoch": 2086} {"train_loss": -24.295989990234375, "global_step": 173187, "epoch": 2086} {"train_loss": -23.774757385253906, "global_step": 173188, "epoch": 2086} {"train_loss": -23.5457763671875, "global_step": 173189, "epoch": 2086} {"train_loss": -23.40620231628418, "global_step": 173190, "epoch": 2086} {"train_loss": -23.797719955444336, "global_step": 173191, "epoch": 2086} {"train_loss": -23.541336059570312, "global_step": 173192, "epoch": 2086} {"train_loss": -24.01849937438965, "global_step": 173193, "epoch": 2086} {"train_loss": -24.036977767944336, "global_step": 173194, "epoch": 2086} {"train_loss": -23.50775146484375, "global_step": 173195, "epoch": 2086} {"train_loss": -23.536962509155273, "global_step": 173196, "epoch": 2086} {"train_loss": -23.44757652282715, "global_step": 173197, "epoch": 2086} {"train_loss": -24.14403533935547, "global_step": 173198, "epoch": 2086} {"train_loss": -23.831314086914062, "global_step": 173199, "epoch": 2086} {"train_loss": -23.738080978393555, "global_step": 173200, "epoch": 2086} {"train_loss": -23.408742904663086, "global_step": 173201, "epoch": 2086} {"train_loss": -23.682722091674805, "global_step": 173202, "epoch": 2086} {"train_loss": -23.8061580657959, "global_step": 173203, "epoch": 2086} {"train_loss": -23.757556915283203, "global_step": 173204, "epoch": 2086} {"train_loss": -23.852752685546875, "global_step": 173205, "epoch": 2086} {"train_loss": -23.632755279541016, "global_step": 173206, "epoch": 2086} {"train_loss": -24.029273986816406, "global_step": 173207, "epoch": 2086} {"train_loss": -23.529394149780273, "global_step": 173208, "epoch": 2086} {"train_loss": -23.65740966796875, "global_step": 173209, "epoch": 2086} {"train_loss": -23.94868278503418, "global_step": 173210, "epoch": 2086} {"train_loss": -23.979177474975586, "global_step": 173211, "epoch": 2086} {"train_loss": -24.122854232788086, "global_step": 173212, "epoch": 2086} {"train_loss": -23.844141006469727, "global_step": 173213, "epoch": 2086} {"train_loss": -23.666229248046875, "global_step": 173214, "epoch": 2086} {"train_loss": -23.5366153717041, "global_step": 173215, "epoch": 2086} {"train_loss": -24.164947509765625, "global_step": 173216, "epoch": 2086} {"train_loss": -24.095516204833984, "global_step": 173217, "epoch": 2086} {"train_loss": -23.846240997314453, "global_step": 173218, "epoch": 2086} {"train_loss": -23.83724021911621, "global_step": 173219, "epoch": 2086} {"train_loss": -23.712642324976173, "global_step": 173220, "epoch": 2086, "val_loss": 6393660.5} {"train_loss": -23.415136337280273, "global_step": 173221, "epoch": 2087} {"train_loss": -23.31735610961914, "global_step": 173222, "epoch": 2087} {"train_loss": -23.72045135498047, "global_step": 173223, "epoch": 2087} {"train_loss": -23.187780380249023, "global_step": 173224, "epoch": 2087} {"train_loss": -23.443464279174805, "global_step": 173225, "epoch": 2087} {"train_loss": -23.44500160217285, "global_step": 173226, "epoch": 2087} {"train_loss": -23.839895248413086, "global_step": 173227, "epoch": 2087} {"train_loss": -23.29525375366211, "global_step": 173228, "epoch": 2087} {"train_loss": -23.701217651367188, "global_step": 173229, "epoch": 2087} {"train_loss": -23.393281936645508, "global_step": 173230, "epoch": 2087} {"train_loss": -23.463895797729492, "global_step": 173231, "epoch": 2087} {"train_loss": -23.42609977722168, "global_step": 173232, "epoch": 2087} {"train_loss": -23.690258026123047, "global_step": 173233, "epoch": 2087} {"train_loss": -23.849483489990234, "global_step": 173234, "epoch": 2087} {"train_loss": -23.59601593017578, "global_step": 173235, "epoch": 2087} {"train_loss": -23.741548538208008, "global_step": 173236, "epoch": 2087} {"train_loss": -23.580015182495117, "global_step": 173237, "epoch": 2087} {"train_loss": -23.894332885742188, "global_step": 173238, "epoch": 2087} {"train_loss": -24.014484405517578, "global_step": 173239, "epoch": 2087} {"train_loss": -23.43603515625, "global_step": 173240, "epoch": 2087} {"train_loss": -23.717304229736328, "global_step": 173241, "epoch": 2087} {"train_loss": -23.515600204467773, "global_step": 173242, "epoch": 2087} {"train_loss": -23.555898666381836, "global_step": 173243, "epoch": 2087} {"train_loss": -23.838518142700195, "global_step": 173244, "epoch": 2087} {"train_loss": -23.454666137695312, "global_step": 173245, "epoch": 2087} {"train_loss": -23.911457061767578, "global_step": 173246, "epoch": 2087} {"train_loss": -24.405380249023438, "global_step": 173247, "epoch": 2087} {"train_loss": -23.879505157470703, "global_step": 173248, "epoch": 2087} {"train_loss": -23.73477554321289, "global_step": 173249, "epoch": 2087} {"train_loss": -23.765037536621094, "global_step": 173250, "epoch": 2087} {"train_loss": -23.550870895385742, "global_step": 173251, "epoch": 2087} {"train_loss": -23.794347763061523, "global_step": 173252, "epoch": 2087} {"train_loss": -24.002769470214844, "global_step": 173253, "epoch": 2087} {"train_loss": -23.991968154907227, "global_step": 173254, "epoch": 2087} {"train_loss": -23.856069564819336, "global_step": 173255, "epoch": 2087} {"train_loss": -23.701053619384766, "global_step": 173256, "epoch": 2087} {"train_loss": -23.711713790893555, "global_step": 173257, "epoch": 2087} {"train_loss": -24.165937423706055, "global_step": 173258, "epoch": 2087} {"train_loss": -23.86376190185547, "global_step": 173259, "epoch": 2087} {"train_loss": -23.95353126525879, "global_step": 173260, "epoch": 2087} {"train_loss": -23.926977157592773, "global_step": 173261, "epoch": 2087} {"train_loss": -23.95046043395996, "global_step": 173262, "epoch": 2087} {"train_loss": -23.913785934448242, "global_step": 173263, "epoch": 2087} {"train_loss": -23.931270599365234, "global_step": 173264, "epoch": 2087} {"train_loss": -23.90359878540039, "global_step": 173265, "epoch": 2087} {"train_loss": -24.18348503112793, "global_step": 173266, "epoch": 2087} {"train_loss": -24.029569625854492, "global_step": 173267, "epoch": 2087} {"train_loss": -23.865049362182617, "global_step": 173268, "epoch": 2087} {"train_loss": -23.231006622314453, "global_step": 173269, "epoch": 2087} {"train_loss": -23.394454956054688, "global_step": 173270, "epoch": 2087} {"train_loss": -23.450965881347656, "global_step": 173271, "epoch": 2087} {"train_loss": -23.927875518798828, "global_step": 173272, "epoch": 2087} {"train_loss": -23.901187896728516, "global_step": 173273, "epoch": 2087} {"train_loss": -23.649019241333008, "global_step": 173274, "epoch": 2087} {"train_loss": -23.779054641723633, "global_step": 173275, "epoch": 2087} {"train_loss": -24.040225982666016, "global_step": 173276, "epoch": 2087} {"train_loss": -23.74114418029785, "global_step": 173277, "epoch": 2087} {"train_loss": -23.8471736907959, "global_step": 173278, "epoch": 2087} {"train_loss": -23.30393409729004, "global_step": 173279, "epoch": 2087} {"train_loss": -23.84519386291504, "global_step": 173280, "epoch": 2087} {"train_loss": -23.636585235595703, "global_step": 173281, "epoch": 2087} {"train_loss": -24.194290161132812, "global_step": 173282, "epoch": 2087} {"train_loss": -23.760705947875977, "global_step": 173283, "epoch": 2087} {"train_loss": -23.7548885345459, "global_step": 173284, "epoch": 2087} {"train_loss": -23.910816192626953, "global_step": 173285, "epoch": 2087} {"train_loss": -23.76175308227539, "global_step": 173286, "epoch": 2087} {"train_loss": -23.996519088745117, "global_step": 173287, "epoch": 2087} {"train_loss": -23.876407623291016, "global_step": 173288, "epoch": 2087} {"train_loss": -23.7823429107666, "global_step": 173289, "epoch": 2087} {"train_loss": -23.36934471130371, "global_step": 173290, "epoch": 2087} {"train_loss": -23.482181549072266, "global_step": 173291, "epoch": 2087} {"train_loss": -23.3117733001709, "global_step": 173292, "epoch": 2087} {"train_loss": -23.818023681640625, "global_step": 173293, "epoch": 2087} {"train_loss": -23.63610076904297, "global_step": 173294, "epoch": 2087} {"train_loss": -23.710805892944336, "global_step": 173295, "epoch": 2087} {"train_loss": -23.637033462524414, "global_step": 173296, "epoch": 2087} {"train_loss": -24.234643936157227, "global_step": 173297, "epoch": 2087} {"train_loss": -23.602575302124023, "global_step": 173298, "epoch": 2087} {"train_loss": -23.96961784362793, "global_step": 173299, "epoch": 2087} {"train_loss": -23.735761642456055, "global_step": 173300, "epoch": 2087} {"train_loss": -23.691802978515625, "global_step": 173301, "epoch": 2087} {"train_loss": -23.48641586303711, "global_step": 173302, "epoch": 2087} {"train_loss": -23.727319028004107, "global_step": 173303, "epoch": 2087, "val_loss": 6445346.0} {"train_loss": -23.27081871032715, "global_step": 173304, "epoch": 2088} {"train_loss": -22.826616287231445, "global_step": 173305, "epoch": 2088} {"train_loss": -22.8909969329834, "global_step": 173306, "epoch": 2088} {"train_loss": -23.752614974975586, "global_step": 173307, "epoch": 2088} {"train_loss": -23.461795806884766, "global_step": 173308, "epoch": 2088} {"train_loss": -23.477712631225586, "global_step": 173309, "epoch": 2088} {"train_loss": -23.61964988708496, "global_step": 173310, "epoch": 2088} {"train_loss": -23.814695358276367, "global_step": 173311, "epoch": 2088} {"train_loss": -23.464019775390625, "global_step": 173312, "epoch": 2088} {"train_loss": -23.639406204223633, "global_step": 173313, "epoch": 2088} {"train_loss": -23.569377899169922, "global_step": 173314, "epoch": 2088} {"train_loss": -23.540903091430664, "global_step": 173315, "epoch": 2088} {"train_loss": -23.141233444213867, "global_step": 173316, "epoch": 2088} {"train_loss": -23.45331382751465, "global_step": 173317, "epoch": 2088} {"train_loss": -23.569311141967773, "global_step": 173318, "epoch": 2088} {"train_loss": -23.458816528320312, "global_step": 173319, "epoch": 2088} {"train_loss": -23.670978546142578, "global_step": 173320, "epoch": 2088} {"train_loss": -23.58932113647461, "global_step": 173321, "epoch": 2088} {"train_loss": -23.46088981628418, "global_step": 173322, "epoch": 2088} {"train_loss": -23.50801658630371, "global_step": 173323, "epoch": 2088} {"train_loss": -23.76725196838379, "global_step": 173324, "epoch": 2088} {"train_loss": -24.005613327026367, "global_step": 173325, "epoch": 2088} {"train_loss": -23.587804794311523, "global_step": 173326, "epoch": 2088} {"train_loss": -23.546741485595703, "global_step": 173327, "epoch": 2088} {"train_loss": -23.860700607299805, "global_step": 173328, "epoch": 2088} {"train_loss": -23.741933822631836, "global_step": 173329, "epoch": 2088} {"train_loss": -23.965307235717773, "global_step": 173330, "epoch": 2088} {"train_loss": -23.69119644165039, "global_step": 173331, "epoch": 2088} {"train_loss": -24.151565551757812, "global_step": 173332, "epoch": 2088} {"train_loss": -23.945283889770508, "global_step": 173333, "epoch": 2088} {"train_loss": -23.466909408569336, "global_step": 173334, "epoch": 2088} {"train_loss": -23.588703155517578, "global_step": 173335, "epoch": 2088} {"train_loss": -23.5570068359375, "global_step": 173336, "epoch": 2088} {"train_loss": -23.655986785888672, "global_step": 173337, "epoch": 2088} {"train_loss": -23.80217933654785, "global_step": 173338, "epoch": 2088} {"train_loss": -23.51638412475586, "global_step": 173339, "epoch": 2088} {"train_loss": -23.996091842651367, "global_step": 173340, "epoch": 2088} {"train_loss": -23.58576774597168, "global_step": 173341, "epoch": 2088} {"train_loss": -24.096464157104492, "global_step": 173342, "epoch": 2088} {"train_loss": -23.782756805419922, "global_step": 173343, "epoch": 2088} {"train_loss": -24.183820724487305, "global_step": 173344, "epoch": 2088} {"train_loss": -23.894668579101562, "global_step": 173345, "epoch": 2088} {"train_loss": -23.914953231811523, "global_step": 173346, "epoch": 2088} {"train_loss": -23.961406707763672, "global_step": 173347, "epoch": 2088} {"train_loss": -24.04327392578125, "global_step": 173348, "epoch": 2088} {"train_loss": -23.434696197509766, "global_step": 173349, "epoch": 2088} {"train_loss": -23.871347427368164, "global_step": 173350, "epoch": 2088} {"train_loss": -24.068134307861328, "global_step": 173351, "epoch": 2088} {"train_loss": -23.95809555053711, "global_step": 173352, "epoch": 2088} {"train_loss": -23.918277740478516, "global_step": 173353, "epoch": 2088} {"train_loss": -23.919342041015625, "global_step": 173354, "epoch": 2088} {"train_loss": -23.330907821655273, "global_step": 173355, "epoch": 2088} {"train_loss": -23.969289779663086, "global_step": 173356, "epoch": 2088} {"train_loss": -23.57027244567871, "global_step": 173357, "epoch": 2088} {"train_loss": -23.545475006103516, "global_step": 173358, "epoch": 2088} {"train_loss": -23.6768856048584, "global_step": 173359, "epoch": 2088} {"train_loss": -23.646923065185547, "global_step": 173360, "epoch": 2088} {"train_loss": -23.69677734375, "global_step": 173361, "epoch": 2088} {"train_loss": -23.57473373413086, "global_step": 173362, "epoch": 2088} {"train_loss": -23.765119552612305, "global_step": 173363, "epoch": 2088} {"train_loss": -23.670745849609375, "global_step": 173364, "epoch": 2088} {"train_loss": -23.87830924987793, "global_step": 173365, "epoch": 2088} {"train_loss": -23.717527389526367, "global_step": 173366, "epoch": 2088} {"train_loss": -23.252592086791992, "global_step": 173367, "epoch": 2088} {"train_loss": -23.587326049804688, "global_step": 173368, "epoch": 2088} {"train_loss": -23.63539695739746, "global_step": 173369, "epoch": 2088} {"train_loss": -23.689861297607422, "global_step": 173370, "epoch": 2088} {"train_loss": -23.67799949645996, "global_step": 173371, "epoch": 2088} {"train_loss": -23.956674575805664, "global_step": 173372, "epoch": 2088} {"train_loss": -23.58340835571289, "global_step": 173373, "epoch": 2088} {"train_loss": -23.848186492919922, "global_step": 173374, "epoch": 2088} {"train_loss": -23.807950973510742, "global_step": 173375, "epoch": 2088} {"train_loss": -24.121002197265625, "global_step": 173376, "epoch": 2088} {"train_loss": -23.8848876953125, "global_step": 173377, "epoch": 2088} {"train_loss": -23.38759422302246, "global_step": 173378, "epoch": 2088} {"train_loss": -23.802703857421875, "global_step": 173379, "epoch": 2088} {"train_loss": -23.694272994995117, "global_step": 173380, "epoch": 2088} {"train_loss": -23.605613708496094, "global_step": 173381, "epoch": 2088} {"train_loss": -23.576841354370117, "global_step": 173382, "epoch": 2088} {"train_loss": -23.261005401611328, "global_step": 173383, "epoch": 2088} {"train_loss": -23.931427001953125, "global_step": 173384, "epoch": 2088} {"train_loss": -23.332727432250977, "global_step": 173385, "epoch": 2088} {"train_loss": -23.67658909257636, "global_step": 173386, "epoch": 2088, "val_loss": 6415581.5} {"train_loss": -22.008657455444336, "global_step": 173387, "epoch": 2089} {"train_loss": -22.877567291259766, "global_step": 173388, "epoch": 2089} {"train_loss": -23.686630249023438, "global_step": 173389, "epoch": 2089} {"train_loss": -23.036161422729492, "global_step": 173390, "epoch": 2089} {"train_loss": -23.694473266601562, "global_step": 173391, "epoch": 2089} {"train_loss": -22.933876037597656, "global_step": 173392, "epoch": 2089} {"train_loss": -23.41585350036621, "global_step": 173393, "epoch": 2089} {"train_loss": -23.232376098632812, "global_step": 173394, "epoch": 2089} {"train_loss": -23.791345596313477, "global_step": 173395, "epoch": 2089} {"train_loss": -23.085031509399414, "global_step": 173396, "epoch": 2089} {"train_loss": -23.893814086914062, "global_step": 173397, "epoch": 2089} {"train_loss": -23.566953659057617, "global_step": 173398, "epoch": 2089} {"train_loss": -23.276657104492188, "global_step": 173399, "epoch": 2089} {"train_loss": -23.559539794921875, "global_step": 173400, "epoch": 2089} {"train_loss": -23.141651153564453, "global_step": 173401, "epoch": 2089} {"train_loss": -23.39989471435547, "global_step": 173402, "epoch": 2089} {"train_loss": -23.366653442382812, "global_step": 173403, "epoch": 2089} {"train_loss": -23.73055648803711, "global_step": 173404, "epoch": 2089} {"train_loss": -23.563528060913086, "global_step": 173405, "epoch": 2089} {"train_loss": -23.81435203552246, "global_step": 173406, "epoch": 2089} {"train_loss": -23.727426528930664, "global_step": 173407, "epoch": 2089} {"train_loss": -23.68792152404785, "global_step": 173408, "epoch": 2089} {"train_loss": -23.66274070739746, "global_step": 173409, "epoch": 2089} {"train_loss": -23.62409782409668, "global_step": 173410, "epoch": 2089} {"train_loss": -23.423389434814453, "global_step": 173411, "epoch": 2089} {"train_loss": -23.204500198364258, "global_step": 173412, "epoch": 2089} {"train_loss": -23.615468978881836, "global_step": 173413, "epoch": 2089} {"train_loss": -23.5545711517334, "global_step": 173414, "epoch": 2089} {"train_loss": -23.183122634887695, "global_step": 173415, "epoch": 2089} {"train_loss": -23.76716423034668, "global_step": 173416, "epoch": 2089} {"train_loss": -23.443737030029297, "global_step": 173417, "epoch": 2089} {"train_loss": -23.886056900024414, "global_step": 173418, "epoch": 2089} {"train_loss": -23.674266815185547, "global_step": 173419, "epoch": 2089} {"train_loss": -23.879117965698242, "global_step": 173420, "epoch": 2089} {"train_loss": -23.830717086791992, "global_step": 173421, "epoch": 2089} {"train_loss": -23.747224807739258, "global_step": 173422, "epoch": 2089} {"train_loss": -23.563560485839844, "global_step": 173423, "epoch": 2089} {"train_loss": -23.953100204467773, "global_step": 173424, "epoch": 2089} {"train_loss": -23.75806999206543, "global_step": 173425, "epoch": 2089} {"train_loss": -23.97791862487793, "global_step": 173426, "epoch": 2089} {"train_loss": -23.37971305847168, "global_step": 173427, "epoch": 2089} {"train_loss": -23.711044311523438, "global_step": 173428, "epoch": 2089} {"train_loss": -24.161975860595703, "global_step": 173429, "epoch": 2089} {"train_loss": -23.914093017578125, "global_step": 173430, "epoch": 2089} {"train_loss": -23.54243278503418, "global_step": 173431, "epoch": 2089} {"train_loss": -23.72517204284668, "global_step": 173432, "epoch": 2089} {"train_loss": -24.014726638793945, "global_step": 173433, "epoch": 2089} {"train_loss": -23.781187057495117, "global_step": 173434, "epoch": 2089} {"train_loss": -23.765398025512695, "global_step": 173435, "epoch": 2089} {"train_loss": -24.144216537475586, "global_step": 173436, "epoch": 2089} {"train_loss": -23.83095359802246, "global_step": 173437, "epoch": 2089} {"train_loss": -23.653913497924805, "global_step": 173438, "epoch": 2089} {"train_loss": -23.651288986206055, "global_step": 173439, "epoch": 2089} {"train_loss": -23.740591049194336, "global_step": 173440, "epoch": 2089} {"train_loss": -24.05274772644043, "global_step": 173441, "epoch": 2089} {"train_loss": -23.978912353515625, "global_step": 173442, "epoch": 2089} {"train_loss": -23.523250579833984, "global_step": 173443, "epoch": 2089} {"train_loss": -24.013612747192383, "global_step": 173444, "epoch": 2089} {"train_loss": -23.96674919128418, "global_step": 173445, "epoch": 2089} {"train_loss": -23.56707191467285, "global_step": 173446, "epoch": 2089} {"train_loss": -23.95639419555664, "global_step": 173447, "epoch": 2089} {"train_loss": -23.921173095703125, "global_step": 173448, "epoch": 2089} {"train_loss": -23.93243980407715, "global_step": 173449, "epoch": 2089} {"train_loss": -24.4491024017334, "global_step": 173450, "epoch": 2089} {"train_loss": -23.583866119384766, "global_step": 173451, "epoch": 2089} {"train_loss": -24.33070945739746, "global_step": 173452, "epoch": 2089} {"train_loss": -23.94221305847168, "global_step": 173453, "epoch": 2089} {"train_loss": -23.86185646057129, "global_step": 173454, "epoch": 2089} {"train_loss": -23.698110580444336, "global_step": 173455, "epoch": 2089} {"train_loss": -23.7569522857666, "global_step": 173456, "epoch": 2089} {"train_loss": -23.806806564331055, "global_step": 173457, "epoch": 2089} {"train_loss": -23.891658782958984, "global_step": 173458, "epoch": 2089} {"train_loss": -23.514314651489258, "global_step": 173459, "epoch": 2089} {"train_loss": -23.072328567504883, "global_step": 173460, "epoch": 2089} {"train_loss": -23.82847023010254, "global_step": 173461, "epoch": 2089} {"train_loss": -23.821813583374023, "global_step": 173462, "epoch": 2089} {"train_loss": -23.638235092163086, "global_step": 173463, "epoch": 2089} {"train_loss": -23.602651596069336, "global_step": 173464, "epoch": 2089} {"train_loss": -23.95535659790039, "global_step": 173465, "epoch": 2089} {"train_loss": -23.552541732788086, "global_step": 173466, "epoch": 2089} {"train_loss": -23.587827682495117, "global_step": 173467, "epoch": 2089} {"train_loss": -23.20489501953125, "global_step": 173468, "epoch": 2089} {"train_loss": -23.65234191159168, "global_step": 173469, "epoch": 2089, "val_loss": 6491405.0} {"train_loss": -23.29799461364746, "global_step": 173470, "epoch": 2090} {"train_loss": -23.631818771362305, "global_step": 173471, "epoch": 2090} {"train_loss": -23.626379013061523, "global_step": 173472, "epoch": 2090} {"train_loss": -23.181371688842773, "global_step": 173473, "epoch": 2090} {"train_loss": -23.695571899414062, "global_step": 173474, "epoch": 2090} {"train_loss": -23.547012329101562, "global_step": 173475, "epoch": 2090} {"train_loss": -23.479751586914062, "global_step": 173476, "epoch": 2090} {"train_loss": -23.827787399291992, "global_step": 173477, "epoch": 2090} {"train_loss": -23.34330177307129, "global_step": 173478, "epoch": 2090} {"train_loss": -23.959218978881836, "global_step": 173479, "epoch": 2090} {"train_loss": -23.885211944580078, "global_step": 173480, "epoch": 2090} {"train_loss": -23.520343780517578, "global_step": 173481, "epoch": 2090} {"train_loss": -23.816205978393555, "global_step": 173482, "epoch": 2090} {"train_loss": -23.537702560424805, "global_step": 173483, "epoch": 2090} {"train_loss": -23.73163414001465, "global_step": 173484, "epoch": 2090} {"train_loss": -23.72984504699707, "global_step": 173485, "epoch": 2090} {"train_loss": -23.547119140625, "global_step": 173486, "epoch": 2090} {"train_loss": -23.367830276489258, "global_step": 173487, "epoch": 2090} {"train_loss": -23.723421096801758, "global_step": 173488, "epoch": 2090} {"train_loss": -23.679819107055664, "global_step": 173489, "epoch": 2090} {"train_loss": -23.634450912475586, "global_step": 173490, "epoch": 2090} {"train_loss": -23.337562561035156, "global_step": 173491, "epoch": 2090} {"train_loss": -23.832265853881836, "global_step": 173492, "epoch": 2090} {"train_loss": -23.373119354248047, "global_step": 173493, "epoch": 2090} {"train_loss": -23.719282150268555, "global_step": 173494, "epoch": 2090} {"train_loss": -23.942502975463867, "global_step": 173495, "epoch": 2090} {"train_loss": -23.385482788085938, "global_step": 173496, "epoch": 2090} {"train_loss": -23.66309928894043, "global_step": 173497, "epoch": 2090} {"train_loss": -23.76918601989746, "global_step": 173498, "epoch": 2090} {"train_loss": -24.29567527770996, "global_step": 173499, "epoch": 2090} {"train_loss": -24.024824142456055, "global_step": 173500, "epoch": 2090} {"train_loss": -23.76947593688965, "global_step": 173501, "epoch": 2090} {"train_loss": -23.991222381591797, "global_step": 173502, "epoch": 2090} {"train_loss": -23.717050552368164, "global_step": 173503, "epoch": 2090} {"train_loss": -23.7166748046875, "global_step": 173504, "epoch": 2090} {"train_loss": -23.880325317382812, "global_step": 173505, "epoch": 2090} {"train_loss": -23.924070358276367, "global_step": 173506, "epoch": 2090} {"train_loss": -23.968952178955078, "global_step": 173507, "epoch": 2090} {"train_loss": -23.903329849243164, "global_step": 173508, "epoch": 2090} {"train_loss": -24.232929229736328, "global_step": 173509, "epoch": 2090} {"train_loss": -23.760271072387695, "global_step": 173510, "epoch": 2090} {"train_loss": -24.208967208862305, "global_step": 173511, "epoch": 2090} {"train_loss": -23.677900314331055, "global_step": 173512, "epoch": 2090} {"train_loss": -23.72267723083496, "global_step": 173513, "epoch": 2090} {"train_loss": -23.76570701599121, "global_step": 173514, "epoch": 2090} {"train_loss": -23.852127075195312, "global_step": 173515, "epoch": 2090} {"train_loss": -23.79616355895996, "global_step": 173516, "epoch": 2090} {"train_loss": -23.42841911315918, "global_step": 173517, "epoch": 2090} {"train_loss": -23.601316452026367, "global_step": 173518, "epoch": 2090} {"train_loss": -23.92466926574707, "global_step": 173519, "epoch": 2090} {"train_loss": -24.076833724975586, "global_step": 173520, "epoch": 2090} {"train_loss": -23.8410587310791, "global_step": 173521, "epoch": 2090} {"train_loss": -23.779088973999023, "global_step": 173522, "epoch": 2090} {"train_loss": -23.74721336364746, "global_step": 173523, "epoch": 2090} {"train_loss": -23.871265411376953, "global_step": 173524, "epoch": 2090} {"train_loss": -23.976001739501953, "global_step": 173525, "epoch": 2090} {"train_loss": -23.82356834411621, "global_step": 173526, "epoch": 2090} {"train_loss": -24.228086471557617, "global_step": 173527, "epoch": 2090} {"train_loss": -23.583255767822266, "global_step": 173528, "epoch": 2090} {"train_loss": -23.483976364135742, "global_step": 173529, "epoch": 2090} {"train_loss": -23.748733520507812, "global_step": 173530, "epoch": 2090} {"train_loss": -24.05438804626465, "global_step": 173531, "epoch": 2090} {"train_loss": -23.749624252319336, "global_step": 173532, "epoch": 2090} {"train_loss": -23.64381980895996, "global_step": 173533, "epoch": 2090} {"train_loss": -23.7274112701416, "global_step": 173534, "epoch": 2090} {"train_loss": -23.92347526550293, "global_step": 173535, "epoch": 2090} {"train_loss": -23.719406127929688, "global_step": 173536, "epoch": 2090} {"train_loss": -23.648801803588867, "global_step": 173537, "epoch": 2090} {"train_loss": -23.817651748657227, "global_step": 173538, "epoch": 2090} {"train_loss": -24.014755249023438, "global_step": 173539, "epoch": 2090} {"train_loss": -23.62957000732422, "global_step": 173540, "epoch": 2090} {"train_loss": -23.684141159057617, "global_step": 173541, "epoch": 2090} {"train_loss": -23.886219024658203, "global_step": 173542, "epoch": 2090} {"train_loss": -23.924457550048828, "global_step": 173543, "epoch": 2090} {"train_loss": -23.637372970581055, "global_step": 173544, "epoch": 2090} {"train_loss": -24.18821144104004, "global_step": 173545, "epoch": 2090} {"train_loss": -23.955718994140625, "global_step": 173546, "epoch": 2090} {"train_loss": -23.985971450805664, "global_step": 173547, "epoch": 2090} {"train_loss": -23.942968368530273, "global_step": 173548, "epoch": 2090} {"train_loss": -23.910207748413086, "global_step": 173549, "epoch": 2090} {"train_loss": -23.881811141967773, "global_step": 173550, "epoch": 2090} {"train_loss": -24.166305541992188, "global_step": 173551, "epoch": 2090} {"train_loss": -23.75999181816377, "global_step": 173552, "epoch": 2090, "val_loss": 6413347.0} {"train_loss": -23.254667282104492, "global_step": 173553, "epoch": 2091} {"train_loss": -23.126401901245117, "global_step": 173554, "epoch": 2091} {"train_loss": -23.14624786376953, "global_step": 173555, "epoch": 2091} {"train_loss": -22.851652145385742, "global_step": 173556, "epoch": 2091} {"train_loss": -23.608531951904297, "global_step": 173557, "epoch": 2091} {"train_loss": -23.202234268188477, "global_step": 173558, "epoch": 2091} {"train_loss": -23.472671508789062, "global_step": 173559, "epoch": 2091} {"train_loss": -23.55860710144043, "global_step": 173560, "epoch": 2091} {"train_loss": -23.438678741455078, "global_step": 173561, "epoch": 2091} {"train_loss": -23.694780349731445, "global_step": 173562, "epoch": 2091} {"train_loss": -23.639122009277344, "global_step": 173563, "epoch": 2091} {"train_loss": -23.367027282714844, "global_step": 173564, "epoch": 2091} {"train_loss": -23.684341430664062, "global_step": 173565, "epoch": 2091} {"train_loss": -23.332901000976562, "global_step": 173566, "epoch": 2091} {"train_loss": -23.47430992126465, "global_step": 173567, "epoch": 2091} {"train_loss": -23.852252960205078, "global_step": 173568, "epoch": 2091} {"train_loss": -23.28188133239746, "global_step": 173569, "epoch": 2091} {"train_loss": -23.464595794677734, "global_step": 173570, "epoch": 2091} {"train_loss": -23.86907196044922, "global_step": 173571, "epoch": 2091} {"train_loss": -23.442235946655273, "global_step": 173572, "epoch": 2091} {"train_loss": -23.77273941040039, "global_step": 173573, "epoch": 2091} {"train_loss": -24.080350875854492, "global_step": 173574, "epoch": 2091} {"train_loss": -23.623580932617188, "global_step": 173575, "epoch": 2091} {"train_loss": -24.025545120239258, "global_step": 173576, "epoch": 2091} {"train_loss": -23.63994026184082, "global_step": 173577, "epoch": 2091} {"train_loss": -23.565502166748047, "global_step": 173578, "epoch": 2091} {"train_loss": -23.65114402770996, "global_step": 173579, "epoch": 2091} {"train_loss": -23.910940170288086, "global_step": 173580, "epoch": 2091} {"train_loss": -23.872089385986328, "global_step": 173581, "epoch": 2091} {"train_loss": -23.57527732849121, "global_step": 173582, "epoch": 2091} {"train_loss": -23.68177032470703, "global_step": 173583, "epoch": 2091} {"train_loss": -23.632638931274414, "global_step": 173584, "epoch": 2091} {"train_loss": -23.58475685119629, "global_step": 173585, "epoch": 2091} {"train_loss": -23.991256713867188, "global_step": 173586, "epoch": 2091} {"train_loss": -23.895429611206055, "global_step": 173587, "epoch": 2091} {"train_loss": -23.72220802307129, "global_step": 173588, "epoch": 2091} {"train_loss": -23.30866050720215, "global_step": 173589, "epoch": 2091} {"train_loss": -23.356252670288086, "global_step": 173590, "epoch": 2091} {"train_loss": -23.751422882080078, "global_step": 173591, "epoch": 2091} {"train_loss": -23.594921112060547, "global_step": 173592, "epoch": 2091} {"train_loss": -23.315683364868164, "global_step": 173593, "epoch": 2091} {"train_loss": -23.681310653686523, "global_step": 173594, "epoch": 2091} {"train_loss": -23.498376846313477, "global_step": 173595, "epoch": 2091} {"train_loss": -23.96060562133789, "global_step": 173596, "epoch": 2091} {"train_loss": -23.500370025634766, "global_step": 173597, "epoch": 2091} {"train_loss": -23.644283294677734, "global_step": 173598, "epoch": 2091} {"train_loss": -24.150100708007812, "global_step": 173599, "epoch": 2091} {"train_loss": -23.6130428314209, "global_step": 173600, "epoch": 2091} {"train_loss": -23.533971786499023, "global_step": 173601, "epoch": 2091} {"train_loss": -23.705183029174805, "global_step": 173602, "epoch": 2091} {"train_loss": -23.882905960083008, "global_step": 173603, "epoch": 2091} {"train_loss": -24.01149559020996, "global_step": 173604, "epoch": 2091} {"train_loss": -23.84463882446289, "global_step": 173605, "epoch": 2091} {"train_loss": -23.39159393310547, "global_step": 173606, "epoch": 2091} {"train_loss": -23.916494369506836, "global_step": 173607, "epoch": 2091} {"train_loss": -24.08571434020996, "global_step": 173608, "epoch": 2091} {"train_loss": -23.973302841186523, "global_step": 173609, "epoch": 2091} {"train_loss": -24.056848526000977, "global_step": 173610, "epoch": 2091} {"train_loss": -24.179182052612305, "global_step": 173611, "epoch": 2091} {"train_loss": -23.295883178710938, "global_step": 173612, "epoch": 2091} {"train_loss": -23.783567428588867, "global_step": 173613, "epoch": 2091} {"train_loss": -23.280017852783203, "global_step": 173614, "epoch": 2091} {"train_loss": -23.80322265625, "global_step": 173615, "epoch": 2091} {"train_loss": -23.723352432250977, "global_step": 173616, "epoch": 2091} {"train_loss": -23.392269134521484, "global_step": 173617, "epoch": 2091} {"train_loss": -24.152088165283203, "global_step": 173618, "epoch": 2091} {"train_loss": -24.029052734375, "global_step": 173619, "epoch": 2091} {"train_loss": -23.574560165405273, "global_step": 173620, "epoch": 2091} {"train_loss": -23.94288444519043, "global_step": 173621, "epoch": 2091} {"train_loss": -23.8018741607666, "global_step": 173622, "epoch": 2091} {"train_loss": -23.878376007080078, "global_step": 173623, "epoch": 2091} {"train_loss": -23.813385009765625, "global_step": 173624, "epoch": 2091} {"train_loss": -24.080812454223633, "global_step": 173625, "epoch": 2091} {"train_loss": -23.897266387939453, "global_step": 173626, "epoch": 2091} {"train_loss": -24.01967430114746, "global_step": 173627, "epoch": 2091} {"train_loss": -23.911334991455078, "global_step": 173628, "epoch": 2091} {"train_loss": -23.97252655029297, "global_step": 173629, "epoch": 2091} {"train_loss": -23.93400001525879, "global_step": 173630, "epoch": 2091} {"train_loss": -23.56654930114746, "global_step": 173631, "epoch": 2091} {"train_loss": -24.281667709350586, "global_step": 173632, "epoch": 2091} {"train_loss": -23.764087677001953, "global_step": 173633, "epoch": 2091} {"train_loss": -23.90424156188965, "global_step": 173634, "epoch": 2091} {"train_loss": -23.697830108274896, "global_step": 173635, "epoch": 2091, "val_loss": 6313788.0} {"train_loss": -23.194473266601562, "global_step": 173636, "epoch": 2092} {"train_loss": -22.87873649597168, "global_step": 173637, "epoch": 2092} {"train_loss": -23.138364791870117, "global_step": 173638, "epoch": 2092} {"train_loss": -22.870941162109375, "global_step": 173639, "epoch": 2092} {"train_loss": -23.3350772857666, "global_step": 173640, "epoch": 2092} {"train_loss": -23.611526489257812, "global_step": 173641, "epoch": 2092} {"train_loss": -23.299314498901367, "global_step": 173642, "epoch": 2092} {"train_loss": -23.802152633666992, "global_step": 173643, "epoch": 2092} {"train_loss": -23.573530197143555, "global_step": 173644, "epoch": 2092} {"train_loss": -23.409099578857422, "global_step": 173645, "epoch": 2092} {"train_loss": -23.421218872070312, "global_step": 173646, "epoch": 2092} {"train_loss": -23.387109756469727, "global_step": 173647, "epoch": 2092} {"train_loss": -23.52536964416504, "global_step": 173648, "epoch": 2092} {"train_loss": -23.7559871673584, "global_step": 173649, "epoch": 2092} {"train_loss": -23.427452087402344, "global_step": 173650, "epoch": 2092} {"train_loss": -23.45383071899414, "global_step": 173651, "epoch": 2092} {"train_loss": -23.331167221069336, "global_step": 173652, "epoch": 2092} {"train_loss": -23.773662567138672, "global_step": 173653, "epoch": 2092} {"train_loss": -23.6143798828125, "global_step": 173654, "epoch": 2092} {"train_loss": -23.9884033203125, "global_step": 173655, "epoch": 2092} {"train_loss": -23.2127628326416, "global_step": 173656, "epoch": 2092} {"train_loss": -23.824338912963867, "global_step": 173657, "epoch": 2092} {"train_loss": -23.372234344482422, "global_step": 173658, "epoch": 2092} {"train_loss": -23.550445556640625, "global_step": 173659, "epoch": 2092} {"train_loss": -23.67194175720215, "global_step": 173660, "epoch": 2092} {"train_loss": -23.407094955444336, "global_step": 173661, "epoch": 2092} {"train_loss": -23.73573875427246, "global_step": 173662, "epoch": 2092} {"train_loss": -24.0124454498291, "global_step": 173663, "epoch": 2092} {"train_loss": -23.826810836791992, "global_step": 173664, "epoch": 2092} {"train_loss": -24.101896286010742, "global_step": 173665, "epoch": 2092} {"train_loss": -23.646772384643555, "global_step": 173666, "epoch": 2092} {"train_loss": -23.729429244995117, "global_step": 173667, "epoch": 2092} {"train_loss": -23.880542755126953, "global_step": 173668, "epoch": 2092} {"train_loss": -23.745325088500977, "global_step": 173669, "epoch": 2092} {"train_loss": -23.755460739135742, "global_step": 173670, "epoch": 2092} {"train_loss": -23.853153228759766, "global_step": 173671, "epoch": 2092} {"train_loss": -24.072683334350586, "global_step": 173672, "epoch": 2092} {"train_loss": -23.75979995727539, "global_step": 173673, "epoch": 2092} {"train_loss": -23.735370635986328, "global_step": 173674, "epoch": 2092} {"train_loss": -24.343599319458008, "global_step": 173675, "epoch": 2092} {"train_loss": -23.478031158447266, "global_step": 173676, "epoch": 2092} {"train_loss": -23.7886905670166, "global_step": 173677, "epoch": 2092} {"train_loss": -23.527402877807617, "global_step": 173678, "epoch": 2092} {"train_loss": -23.605072021484375, "global_step": 173679, "epoch": 2092} {"train_loss": -23.646875381469727, "global_step": 173680, "epoch": 2092} {"train_loss": -23.78346824645996, "global_step": 173681, "epoch": 2092} {"train_loss": -24.107717514038086, "global_step": 173682, "epoch": 2092} {"train_loss": -23.404996871948242, "global_step": 173683, "epoch": 2092} {"train_loss": -23.706045150756836, "global_step": 173684, "epoch": 2092} {"train_loss": -24.088085174560547, "global_step": 173685, "epoch": 2092} {"train_loss": -23.594106674194336, "global_step": 173686, "epoch": 2092} {"train_loss": -23.819997787475586, "global_step": 173687, "epoch": 2092} {"train_loss": -24.233800888061523, "global_step": 173688, "epoch": 2092} {"train_loss": -23.732131958007812, "global_step": 173689, "epoch": 2092} {"train_loss": -23.844009399414062, "global_step": 173690, "epoch": 2092} {"train_loss": -24.100330352783203, "global_step": 173691, "epoch": 2092} {"train_loss": -24.03315544128418, "global_step": 173692, "epoch": 2092} {"train_loss": -23.898305892944336, "global_step": 173693, "epoch": 2092} {"train_loss": -23.88307762145996, "global_step": 173694, "epoch": 2092} {"train_loss": -23.788192749023438, "global_step": 173695, "epoch": 2092} {"train_loss": -23.90230369567871, "global_step": 173696, "epoch": 2092} {"train_loss": -23.890472412109375, "global_step": 173697, "epoch": 2092} {"train_loss": -23.965604782104492, "global_step": 173698, "epoch": 2092} {"train_loss": -23.74910545349121, "global_step": 173699, "epoch": 2092} {"train_loss": -23.50346565246582, "global_step": 173700, "epoch": 2092} {"train_loss": -23.447938919067383, "global_step": 173701, "epoch": 2092} {"train_loss": -23.514636993408203, "global_step": 173702, "epoch": 2092} {"train_loss": -23.82525062561035, "global_step": 173703, "epoch": 2092} {"train_loss": -23.3072452545166, "global_step": 173704, "epoch": 2092} {"train_loss": -23.650405883789062, "global_step": 173705, "epoch": 2092} {"train_loss": -22.980627059936523, "global_step": 173706, "epoch": 2092} {"train_loss": -23.878015518188477, "global_step": 173707, "epoch": 2092} {"train_loss": -23.522537231445312, "global_step": 173708, "epoch": 2092} {"train_loss": -23.353282928466797, "global_step": 173709, "epoch": 2092} {"train_loss": -24.082931518554688, "global_step": 173710, "epoch": 2092} {"train_loss": -23.683536529541016, "global_step": 173711, "epoch": 2092} {"train_loss": -23.317686080932617, "global_step": 173712, "epoch": 2092} {"train_loss": -23.664199829101562, "global_step": 173713, "epoch": 2092} {"train_loss": -23.312299728393555, "global_step": 173714, "epoch": 2092} {"train_loss": -23.542999267578125, "global_step": 173715, "epoch": 2092} {"train_loss": -23.694595336914062, "global_step": 173716, "epoch": 2092} {"train_loss": -23.657470703125, "global_step": 173717, "epoch": 2092} {"train_loss": -23.66366540380271, "global_step": 173718, "epoch": 2092, "val_loss": 6513140.0} {"train_loss": -23.380666732788086, "global_step": 173719, "epoch": 2093} {"train_loss": -23.254491806030273, "global_step": 173720, "epoch": 2093} {"train_loss": -23.41333770751953, "global_step": 173721, "epoch": 2093} {"train_loss": -23.74966049194336, "global_step": 173722, "epoch": 2093} {"train_loss": -23.59296989440918, "global_step": 173723, "epoch": 2093} {"train_loss": -23.822128295898438, "global_step": 173724, "epoch": 2093} {"train_loss": -23.57328987121582, "global_step": 173725, "epoch": 2093} {"train_loss": -23.83782958984375, "global_step": 173726, "epoch": 2093} {"train_loss": -23.596174240112305, "global_step": 173727, "epoch": 2093} {"train_loss": -24.061094284057617, "global_step": 173728, "epoch": 2093} {"train_loss": -23.5882625579834, "global_step": 173729, "epoch": 2093} {"train_loss": -23.8427791595459, "global_step": 173730, "epoch": 2093} {"train_loss": -24.02387046813965, "global_step": 173731, "epoch": 2093} {"train_loss": -23.73407554626465, "global_step": 173732, "epoch": 2093} {"train_loss": -23.49629783630371, "global_step": 173733, "epoch": 2093} {"train_loss": -23.662328720092773, "global_step": 173734, "epoch": 2093} {"train_loss": -23.694814682006836, "global_step": 173735, "epoch": 2093} {"train_loss": -23.369474411010742, "global_step": 173736, "epoch": 2093} {"train_loss": -23.54372215270996, "global_step": 173737, "epoch": 2093} {"train_loss": -23.666751861572266, "global_step": 173738, "epoch": 2093} {"train_loss": -23.861297607421875, "global_step": 173739, "epoch": 2093} {"train_loss": -24.12037467956543, "global_step": 173740, "epoch": 2093} {"train_loss": -24.001197814941406, "global_step": 173741, "epoch": 2093} {"train_loss": -23.646419525146484, "global_step": 173742, "epoch": 2093} {"train_loss": -24.0496883392334, "global_step": 173743, "epoch": 2093} {"train_loss": -24.061542510986328, "global_step": 173744, "epoch": 2093} {"train_loss": -23.809553146362305, "global_step": 173745, "epoch": 2093} {"train_loss": -23.801321029663086, "global_step": 173746, "epoch": 2093} {"train_loss": -23.764667510986328, "global_step": 173747, "epoch": 2093} {"train_loss": -23.659263610839844, "global_step": 173748, "epoch": 2093} {"train_loss": -23.714405059814453, "global_step": 173749, "epoch": 2093} {"train_loss": -23.694934844970703, "global_step": 173750, "epoch": 2093} {"train_loss": -23.881017684936523, "global_step": 173751, "epoch": 2093} {"train_loss": -24.18866729736328, "global_step": 173752, "epoch": 2093} {"train_loss": -24.010122299194336, "global_step": 173753, "epoch": 2093} {"train_loss": -23.7493896484375, "global_step": 173754, "epoch": 2093} {"train_loss": -24.009397506713867, "global_step": 173755, "epoch": 2093} {"train_loss": -23.645648956298828, "global_step": 173756, "epoch": 2093} {"train_loss": -23.998319625854492, "global_step": 173757, "epoch": 2093} {"train_loss": -23.422374725341797, "global_step": 173758, "epoch": 2093} {"train_loss": -23.760387420654297, "global_step": 173759, "epoch": 2093} {"train_loss": -23.43182373046875, "global_step": 173760, "epoch": 2093} {"train_loss": -23.520280838012695, "global_step": 173761, "epoch": 2093} {"train_loss": -23.996999740600586, "global_step": 173762, "epoch": 2093} {"train_loss": -23.313541412353516, "global_step": 173763, "epoch": 2093} {"train_loss": -24.10390853881836, "global_step": 173764, "epoch": 2093} {"train_loss": -23.875173568725586, "global_step": 173765, "epoch": 2093} {"train_loss": -23.964313507080078, "global_step": 173766, "epoch": 2093} {"train_loss": -23.344867706298828, "global_step": 173767, "epoch": 2093} {"train_loss": -23.52309226989746, "global_step": 173768, "epoch": 2093} {"train_loss": -23.728343963623047, "global_step": 173769, "epoch": 2093} {"train_loss": -23.3896541595459, "global_step": 173770, "epoch": 2093} {"train_loss": -23.874021530151367, "global_step": 173771, "epoch": 2093} {"train_loss": -23.558738708496094, "global_step": 173772, "epoch": 2093} {"train_loss": -24.016834259033203, "global_step": 173773, "epoch": 2093} {"train_loss": -24.098642349243164, "global_step": 173774, "epoch": 2093} {"train_loss": -23.597383499145508, "global_step": 173775, "epoch": 2093} {"train_loss": -23.986309051513672, "global_step": 173776, "epoch": 2093} {"train_loss": -23.924468994140625, "global_step": 173777, "epoch": 2093} {"train_loss": -23.668060302734375, "global_step": 173778, "epoch": 2093} {"train_loss": -24.037622451782227, "global_step": 173779, "epoch": 2093} {"train_loss": -24.06599235534668, "global_step": 173780, "epoch": 2093} {"train_loss": -23.990619659423828, "global_step": 173781, "epoch": 2093} {"train_loss": -23.465511322021484, "global_step": 173782, "epoch": 2093} {"train_loss": -23.548654556274414, "global_step": 173783, "epoch": 2093} {"train_loss": -23.48053550720215, "global_step": 173784, "epoch": 2093} {"train_loss": -23.643293380737305, "global_step": 173785, "epoch": 2093} {"train_loss": -23.85834312438965, "global_step": 173786, "epoch": 2093} {"train_loss": -23.36262321472168, "global_step": 173787, "epoch": 2093} {"train_loss": -23.86505699157715, "global_step": 173788, "epoch": 2093} {"train_loss": -23.960981369018555, "global_step": 173789, "epoch": 2093} {"train_loss": -23.36577796936035, "global_step": 173790, "epoch": 2093} {"train_loss": -23.741254806518555, "global_step": 173791, "epoch": 2093} {"train_loss": -23.604162216186523, "global_step": 173792, "epoch": 2093} {"train_loss": -23.6400146484375, "global_step": 173793, "epoch": 2093} {"train_loss": -23.612777709960938, "global_step": 173794, "epoch": 2093} {"train_loss": -23.45048713684082, "global_step": 173795, "epoch": 2093} {"train_loss": -23.73176383972168, "global_step": 173796, "epoch": 2093} {"train_loss": -23.852346420288086, "global_step": 173797, "epoch": 2093} {"train_loss": -23.949560165405273, "global_step": 173798, "epoch": 2093} {"train_loss": -23.144874572753906, "global_step": 173799, "epoch": 2093} {"train_loss": -23.689926147460938, "global_step": 173800, "epoch": 2093} {"train_loss": -23.73697676141578, "global_step": 173801, "epoch": 2093, "val_loss": 6347444.0} {"train_loss": -22.979679107666016, "global_step": 173802, "epoch": 2094} {"train_loss": -23.373859405517578, "global_step": 173803, "epoch": 2094} {"train_loss": -22.695219039916992, "global_step": 173804, "epoch": 2094} {"train_loss": -23.199865341186523, "global_step": 173805, "epoch": 2094} {"train_loss": -23.129661560058594, "global_step": 173806, "epoch": 2094} {"train_loss": -23.19435691833496, "global_step": 173807, "epoch": 2094} {"train_loss": -23.286911010742188, "global_step": 173808, "epoch": 2094} {"train_loss": -23.07729148864746, "global_step": 173809, "epoch": 2094} {"train_loss": -23.25629234313965, "global_step": 173810, "epoch": 2094} {"train_loss": -23.822948455810547, "global_step": 173811, "epoch": 2094} {"train_loss": -23.29057502746582, "global_step": 173812, "epoch": 2094} {"train_loss": -23.49248504638672, "global_step": 173813, "epoch": 2094} {"train_loss": -23.538057327270508, "global_step": 173814, "epoch": 2094} {"train_loss": -23.194238662719727, "global_step": 173815, "epoch": 2094} {"train_loss": -23.536405563354492, "global_step": 173816, "epoch": 2094} {"train_loss": -23.570411682128906, "global_step": 173817, "epoch": 2094} {"train_loss": -23.645389556884766, "global_step": 173818, "epoch": 2094} {"train_loss": -23.181501388549805, "global_step": 173819, "epoch": 2094} {"train_loss": -23.87745475769043, "global_step": 173820, "epoch": 2094} {"train_loss": -23.835397720336914, "global_step": 173821, "epoch": 2094} {"train_loss": -23.84992790222168, "global_step": 173822, "epoch": 2094} {"train_loss": -23.60181999206543, "global_step": 173823, "epoch": 2094} {"train_loss": -23.71143341064453, "global_step": 173824, "epoch": 2094} {"train_loss": -23.763391494750977, "global_step": 173825, "epoch": 2094} {"train_loss": -23.506763458251953, "global_step": 173826, "epoch": 2094} {"train_loss": -23.798019409179688, "global_step": 173827, "epoch": 2094} {"train_loss": -23.338687896728516, "global_step": 173828, "epoch": 2094} {"train_loss": -23.6676082611084, "global_step": 173829, "epoch": 2094} {"train_loss": -23.851804733276367, "global_step": 173830, "epoch": 2094} {"train_loss": -23.833698272705078, "global_step": 173831, "epoch": 2094} {"train_loss": -23.90113639831543, "global_step": 173832, "epoch": 2094} {"train_loss": -23.78729248046875, "global_step": 173833, "epoch": 2094} {"train_loss": -23.925928115844727, "global_step": 173834, "epoch": 2094} {"train_loss": -23.618925094604492, "global_step": 173835, "epoch": 2094} {"train_loss": -23.941274642944336, "global_step": 173836, "epoch": 2094} {"train_loss": -24.147062301635742, "global_step": 173837, "epoch": 2094} {"train_loss": -23.823278427124023, "global_step": 173838, "epoch": 2094} {"train_loss": -23.81891441345215, "global_step": 173839, "epoch": 2094} {"train_loss": -23.698375701904297, "global_step": 173840, "epoch": 2094} {"train_loss": -23.818265914916992, "global_step": 173841, "epoch": 2094} {"train_loss": -23.741628646850586, "global_step": 173842, "epoch": 2094} {"train_loss": -24.056446075439453, "global_step": 173843, "epoch": 2094} {"train_loss": -23.936838150024414, "global_step": 173844, "epoch": 2094} {"train_loss": -23.733182907104492, "global_step": 173845, "epoch": 2094} {"train_loss": -23.703994750976562, "global_step": 173846, "epoch": 2094} {"train_loss": -24.408849716186523, "global_step": 173847, "epoch": 2094} {"train_loss": -24.0030460357666, "global_step": 173848, "epoch": 2094} {"train_loss": -23.99933624267578, "global_step": 173849, "epoch": 2094} {"train_loss": -23.725248336791992, "global_step": 173850, "epoch": 2094} {"train_loss": -24.062105178833008, "global_step": 173851, "epoch": 2094} {"train_loss": -23.84388542175293, "global_step": 173852, "epoch": 2094} {"train_loss": -23.749969482421875, "global_step": 173853, "epoch": 2094} {"train_loss": -23.647396087646484, "global_step": 173854, "epoch": 2094} {"train_loss": -24.021116256713867, "global_step": 173855, "epoch": 2094} {"train_loss": -23.896635055541992, "global_step": 173856, "epoch": 2094} {"train_loss": -24.002578735351562, "global_step": 173857, "epoch": 2094} {"train_loss": -24.13162612915039, "global_step": 173858, "epoch": 2094} {"train_loss": -23.46548843383789, "global_step": 173859, "epoch": 2094} {"train_loss": -23.758203506469727, "global_step": 173860, "epoch": 2094} {"train_loss": -24.060104370117188, "global_step": 173861, "epoch": 2094} {"train_loss": -23.81873893737793, "global_step": 173862, "epoch": 2094} {"train_loss": -23.978805541992188, "global_step": 173863, "epoch": 2094} {"train_loss": -23.96010398864746, "global_step": 173864, "epoch": 2094} {"train_loss": -24.035064697265625, "global_step": 173865, "epoch": 2094} {"train_loss": -23.814119338989258, "global_step": 173866, "epoch": 2094} {"train_loss": -24.14396095275879, "global_step": 173867, "epoch": 2094} {"train_loss": -23.236066818237305, "global_step": 173868, "epoch": 2094} {"train_loss": -23.39790153503418, "global_step": 173869, "epoch": 2094} {"train_loss": -23.463611602783203, "global_step": 173870, "epoch": 2094} {"train_loss": -23.943510055541992, "global_step": 173871, "epoch": 2094} {"train_loss": -23.921905517578125, "global_step": 173872, "epoch": 2094} {"train_loss": -23.634784698486328, "global_step": 173873, "epoch": 2094} {"train_loss": -23.012887954711914, "global_step": 173874, "epoch": 2094} {"train_loss": -23.664518356323242, "global_step": 173875, "epoch": 2094} {"train_loss": -23.91937255859375, "global_step": 173876, "epoch": 2094} {"train_loss": -23.686281204223633, "global_step": 173877, "epoch": 2094} {"train_loss": -23.984603881835938, "global_step": 173878, "epoch": 2094} {"train_loss": -23.635772705078125, "global_step": 173879, "epoch": 2094} {"train_loss": -23.716144561767578, "global_step": 173880, "epoch": 2094} {"train_loss": -23.409595489501953, "global_step": 173881, "epoch": 2094} {"train_loss": -23.489038467407227, "global_step": 173882, "epoch": 2094} {"train_loss": -23.699092864990234, "global_step": 173883, "epoch": 2094} {"train_loss": -23.665362392563416, "global_step": 173884, "epoch": 2094, "val_loss": 6600861.0} {"train_loss": -23.11094093322754, "global_step": 173885, "epoch": 2095} {"train_loss": -23.586366653442383, "global_step": 173886, "epoch": 2095} {"train_loss": -23.13521385192871, "global_step": 173887, "epoch": 2095} {"train_loss": -23.07624626159668, "global_step": 173888, "epoch": 2095} {"train_loss": -23.53682518005371, "global_step": 173889, "epoch": 2095} {"train_loss": -23.60085105895996, "global_step": 173890, "epoch": 2095} {"train_loss": -23.256662368774414, "global_step": 173891, "epoch": 2095} {"train_loss": -23.61632537841797, "global_step": 173892, "epoch": 2095} {"train_loss": -23.151641845703125, "global_step": 173893, "epoch": 2095} {"train_loss": -23.39029312133789, "global_step": 173894, "epoch": 2095} {"train_loss": -23.219470977783203, "global_step": 173895, "epoch": 2095} {"train_loss": -23.432104110717773, "global_step": 173896, "epoch": 2095} {"train_loss": -23.684240341186523, "global_step": 173897, "epoch": 2095} {"train_loss": -23.191579818725586, "global_step": 173898, "epoch": 2095} {"train_loss": -23.75187110900879, "global_step": 173899, "epoch": 2095} {"train_loss": -23.29122543334961, "global_step": 173900, "epoch": 2095} {"train_loss": -23.767683029174805, "global_step": 173901, "epoch": 2095} {"train_loss": -24.024280548095703, "global_step": 173902, "epoch": 2095} {"train_loss": -23.71014976501465, "global_step": 173903, "epoch": 2095} {"train_loss": -23.526321411132812, "global_step": 173904, "epoch": 2095} {"train_loss": -23.464693069458008, "global_step": 173905, "epoch": 2095} {"train_loss": -24.014368057250977, "global_step": 173906, "epoch": 2095} {"train_loss": -23.689247131347656, "global_step": 173907, "epoch": 2095} {"train_loss": -23.604948043823242, "global_step": 173908, "epoch": 2095} {"train_loss": -23.568206787109375, "global_step": 173909, "epoch": 2095} {"train_loss": -23.663095474243164, "global_step": 173910, "epoch": 2095} {"train_loss": -23.706689834594727, "global_step": 173911, "epoch": 2095} {"train_loss": -23.429990768432617, "global_step": 173912, "epoch": 2095} {"train_loss": -24.500707626342773, "global_step": 173913, "epoch": 2095} {"train_loss": -23.833173751831055, "global_step": 173914, "epoch": 2095} {"train_loss": -23.808984756469727, "global_step": 173915, "epoch": 2095} {"train_loss": -23.8919620513916, "global_step": 173916, "epoch": 2095} {"train_loss": -23.629932403564453, "global_step": 173917, "epoch": 2095} {"train_loss": -23.666189193725586, "global_step": 173918, "epoch": 2095} {"train_loss": -23.615726470947266, "global_step": 173919, "epoch": 2095} {"train_loss": -23.676321029663086, "global_step": 173920, "epoch": 2095} {"train_loss": -24.0666561126709, "global_step": 173921, "epoch": 2095} {"train_loss": -24.011770248413086, "global_step": 173922, "epoch": 2095} {"train_loss": -23.96966552734375, "global_step": 173923, "epoch": 2095} {"train_loss": -23.69940185546875, "global_step": 173924, "epoch": 2095} {"train_loss": -24.130605697631836, "global_step": 173925, "epoch": 2095} {"train_loss": -23.73420524597168, "global_step": 173926, "epoch": 2095} {"train_loss": -23.947458267211914, "global_step": 173927, "epoch": 2095} {"train_loss": -23.787281036376953, "global_step": 173928, "epoch": 2095} {"train_loss": -23.63520622253418, "global_step": 173929, "epoch": 2095} {"train_loss": -23.811241149902344, "global_step": 173930, "epoch": 2095} {"train_loss": -23.95819664001465, "global_step": 173931, "epoch": 2095} {"train_loss": -23.57988739013672, "global_step": 173932, "epoch": 2095} {"train_loss": -23.67974090576172, "global_step": 173933, "epoch": 2095} {"train_loss": -23.635303497314453, "global_step": 173934, "epoch": 2095} {"train_loss": -23.62858772277832, "global_step": 173935, "epoch": 2095} {"train_loss": -24.096004486083984, "global_step": 173936, "epoch": 2095} {"train_loss": -23.79920768737793, "global_step": 173937, "epoch": 2095} {"train_loss": -24.003177642822266, "global_step": 173938, "epoch": 2095} {"train_loss": -23.908872604370117, "global_step": 173939, "epoch": 2095} {"train_loss": -23.76263427734375, "global_step": 173940, "epoch": 2095} {"train_loss": -23.488208770751953, "global_step": 173941, "epoch": 2095} {"train_loss": -23.66839027404785, "global_step": 173942, "epoch": 2095} {"train_loss": -23.9357967376709, "global_step": 173943, "epoch": 2095} {"train_loss": -23.587915420532227, "global_step": 173944, "epoch": 2095} {"train_loss": -23.674209594726562, "global_step": 173945, "epoch": 2095} {"train_loss": -23.800561904907227, "global_step": 173946, "epoch": 2095} {"train_loss": -23.843921661376953, "global_step": 173947, "epoch": 2095} {"train_loss": -23.329971313476562, "global_step": 173948, "epoch": 2095} {"train_loss": -24.15035057067871, "global_step": 173949, "epoch": 2095} {"train_loss": -23.504446029663086, "global_step": 173950, "epoch": 2095} {"train_loss": -23.786653518676758, "global_step": 173951, "epoch": 2095} {"train_loss": -23.80219078063965, "global_step": 173952, "epoch": 2095} {"train_loss": -23.66046714782715, "global_step": 173953, "epoch": 2095} {"train_loss": -23.771507263183594, "global_step": 173954, "epoch": 2095} {"train_loss": -24.104204177856445, "global_step": 173955, "epoch": 2095} {"train_loss": -23.855615615844727, "global_step": 173956, "epoch": 2095} {"train_loss": -23.53619384765625, "global_step": 173957, "epoch": 2095} {"train_loss": -24.02481460571289, "global_step": 173958, "epoch": 2095} {"train_loss": -23.562299728393555, "global_step": 173959, "epoch": 2095} {"train_loss": -23.849899291992188, "global_step": 173960, "epoch": 2095} {"train_loss": -23.90724754333496, "global_step": 173961, "epoch": 2095} {"train_loss": -24.040037155151367, "global_step": 173962, "epoch": 2095} {"train_loss": -24.006147384643555, "global_step": 173963, "epoch": 2095} {"train_loss": -24.024288177490234, "global_step": 173964, "epoch": 2095} {"train_loss": -23.99164581298828, "global_step": 173965, "epoch": 2095} {"train_loss": -24.1905574798584, "global_step": 173966, "epoch": 2095} {"train_loss": -23.71131292595921, "global_step": 173967, "epoch": 2095, "val_loss": 6399523.5} {"train_loss": -23.892934799194336, "global_step": 173968, "epoch": 2096} {"train_loss": -23.994565963745117, "global_step": 173969, "epoch": 2096} {"train_loss": -23.663345336914062, "global_step": 173970, "epoch": 2096} {"train_loss": -23.354515075683594, "global_step": 173971, "epoch": 2096} {"train_loss": -23.58717918395996, "global_step": 173972, "epoch": 2096} {"train_loss": -23.964658737182617, "global_step": 173973, "epoch": 2096} {"train_loss": -23.842172622680664, "global_step": 173974, "epoch": 2096} {"train_loss": -23.819250106811523, "global_step": 173975, "epoch": 2096} {"train_loss": -22.996662139892578, "global_step": 173976, "epoch": 2096} {"train_loss": -23.6751766204834, "global_step": 173977, "epoch": 2096} {"train_loss": -24.07096290588379, "global_step": 173978, "epoch": 2096} {"train_loss": -23.58922004699707, "global_step": 173979, "epoch": 2096} {"train_loss": -23.22942543029785, "global_step": 173980, "epoch": 2096} {"train_loss": -23.881423950195312, "global_step": 173981, "epoch": 2096} {"train_loss": -23.739181518554688, "global_step": 173982, "epoch": 2096} {"train_loss": -23.719223022460938, "global_step": 173983, "epoch": 2096} {"train_loss": -23.575010299682617, "global_step": 173984, "epoch": 2096} {"train_loss": -24.085365295410156, "global_step": 173985, "epoch": 2096} {"train_loss": -23.596933364868164, "global_step": 173986, "epoch": 2096} {"train_loss": -23.397397994995117, "global_step": 173987, "epoch": 2096} {"train_loss": -23.94944190979004, "global_step": 173988, "epoch": 2096} {"train_loss": -23.592512130737305, "global_step": 173989, "epoch": 2096} {"train_loss": -24.005136489868164, "global_step": 173990, "epoch": 2096} {"train_loss": -23.7298526763916, "global_step": 173991, "epoch": 2096} {"train_loss": -23.710195541381836, "global_step": 173992, "epoch": 2096} {"train_loss": -23.78848648071289, "global_step": 173993, "epoch": 2096} {"train_loss": -24.12278938293457, "global_step": 173994, "epoch": 2096} {"train_loss": -23.63312339782715, "global_step": 173995, "epoch": 2096} {"train_loss": -23.568866729736328, "global_step": 173996, "epoch": 2096} {"train_loss": -23.7908935546875, "global_step": 173997, "epoch": 2096} {"train_loss": -23.491607666015625, "global_step": 173998, "epoch": 2096} {"train_loss": -23.430160522460938, "global_step": 173999, "epoch": 2096} {"train_loss": -23.590164184570312, "global_step": 174000, "epoch": 2096} {"train_loss": -24.27583122253418, "global_step": 174001, "epoch": 2096} {"train_loss": -23.834165573120117, "global_step": 174002, "epoch": 2096} {"train_loss": -23.434873580932617, "global_step": 174003, "epoch": 2096} {"train_loss": -23.738601684570312, "global_step": 174004, "epoch": 2096} {"train_loss": -23.7168025970459, "global_step": 174005, "epoch": 2096} {"train_loss": -23.696990966796875, "global_step": 174006, "epoch": 2096} {"train_loss": -23.430578231811523, "global_step": 174007, "epoch": 2096} {"train_loss": -23.574567794799805, "global_step": 174008, "epoch": 2096} {"train_loss": -23.797149658203125, "global_step": 174009, "epoch": 2096} {"train_loss": -23.948766708374023, "global_step": 174010, "epoch": 2096} {"train_loss": -23.73933219909668, "global_step": 174011, "epoch": 2096} {"train_loss": -23.741722106933594, "global_step": 174012, "epoch": 2096} {"train_loss": -23.829269409179688, "global_step": 174013, "epoch": 2096} {"train_loss": -24.09521484375, "global_step": 174014, "epoch": 2096} {"train_loss": -23.48871421813965, "global_step": 174015, "epoch": 2096} {"train_loss": -23.608985900878906, "global_step": 174016, "epoch": 2096} {"train_loss": -23.834226608276367, "global_step": 174017, "epoch": 2096} {"train_loss": -24.085739135742188, "global_step": 174018, "epoch": 2096} {"train_loss": -23.690479278564453, "global_step": 174019, "epoch": 2096} {"train_loss": -23.743804931640625, "global_step": 174020, "epoch": 2096} {"train_loss": -23.54171371459961, "global_step": 174021, "epoch": 2096} {"train_loss": -23.841962814331055, "global_step": 174022, "epoch": 2096} {"train_loss": -23.76016616821289, "global_step": 174023, "epoch": 2096} {"train_loss": -23.760507583618164, "global_step": 174024, "epoch": 2096} {"train_loss": -24.146785736083984, "global_step": 174025, "epoch": 2096} {"train_loss": -23.821813583374023, "global_step": 174026, "epoch": 2096} {"train_loss": -23.931568145751953, "global_step": 174027, "epoch": 2096} {"train_loss": -23.804931640625, "global_step": 174028, "epoch": 2096} {"train_loss": -23.916179656982422, "global_step": 174029, "epoch": 2096} {"train_loss": -23.432785034179688, "global_step": 174030, "epoch": 2096} {"train_loss": -23.979032516479492, "global_step": 174031, "epoch": 2096} {"train_loss": -23.819604873657227, "global_step": 174032, "epoch": 2096} {"train_loss": -23.877695083618164, "global_step": 174033, "epoch": 2096} {"train_loss": -23.721372604370117, "global_step": 174034, "epoch": 2096} {"train_loss": -24.20672607421875, "global_step": 174035, "epoch": 2096} {"train_loss": -23.89963150024414, "global_step": 174036, "epoch": 2096} {"train_loss": -23.76331901550293, "global_step": 174037, "epoch": 2096} {"train_loss": -23.885364532470703, "global_step": 174038, "epoch": 2096} {"train_loss": -23.64117431640625, "global_step": 174039, "epoch": 2096} {"train_loss": -23.575239181518555, "global_step": 174040, "epoch": 2096} {"train_loss": -23.676267623901367, "global_step": 174041, "epoch": 2096} {"train_loss": -23.978628158569336, "global_step": 174042, "epoch": 2096} {"train_loss": -24.22077178955078, "global_step": 174043, "epoch": 2096} {"train_loss": -24.029560089111328, "global_step": 174044, "epoch": 2096} {"train_loss": -24.123525619506836, "global_step": 174045, "epoch": 2096} {"train_loss": -23.97769546508789, "global_step": 174046, "epoch": 2096} {"train_loss": -23.61308479309082, "global_step": 174047, "epoch": 2096} {"train_loss": -23.835622787475586, "global_step": 174048, "epoch": 2096} {"train_loss": -23.70819091796875, "global_step": 174049, "epoch": 2096} {"train_loss": -23.77239188228745, "global_step": 174050, "epoch": 2096, "val_loss": 6499516.5} {"train_loss": -22.763723373413086, "global_step": 174051, "epoch": 2097} {"train_loss": -22.43379783630371, "global_step": 174052, "epoch": 2097} {"train_loss": -23.65284538269043, "global_step": 174053, "epoch": 2097} {"train_loss": -22.869342803955078, "global_step": 174054, "epoch": 2097} {"train_loss": -22.717872619628906, "global_step": 174055, "epoch": 2097} {"train_loss": -23.107524871826172, "global_step": 174056, "epoch": 2097} {"train_loss": -22.854190826416016, "global_step": 174057, "epoch": 2097} {"train_loss": -23.914255142211914, "global_step": 174058, "epoch": 2097} {"train_loss": -23.070425033569336, "global_step": 174059, "epoch": 2097} {"train_loss": -23.140283584594727, "global_step": 174060, "epoch": 2097} {"train_loss": -23.635906219482422, "global_step": 174061, "epoch": 2097} {"train_loss": -23.048095703125, "global_step": 174062, "epoch": 2097} {"train_loss": -22.932497024536133, "global_step": 174063, "epoch": 2097} {"train_loss": -23.36086654663086, "global_step": 174064, "epoch": 2097} {"train_loss": -23.174972534179688, "global_step": 174065, "epoch": 2097} {"train_loss": -23.635602951049805, "global_step": 174066, "epoch": 2097} {"train_loss": -23.44729232788086, "global_step": 174067, "epoch": 2097} {"train_loss": -23.5811767578125, "global_step": 174068, "epoch": 2097} {"train_loss": -23.18025016784668, "global_step": 174069, "epoch": 2097} {"train_loss": -23.66253662109375, "global_step": 174070, "epoch": 2097} {"train_loss": -23.508153915405273, "global_step": 174071, "epoch": 2097} {"train_loss": -23.656599044799805, "global_step": 174072, "epoch": 2097} {"train_loss": -23.951309204101562, "global_step": 174073, "epoch": 2097} {"train_loss": -23.650360107421875, "global_step": 174074, "epoch": 2097} {"train_loss": -23.92477035522461, "global_step": 174075, "epoch": 2097} {"train_loss": -23.472644805908203, "global_step": 174076, "epoch": 2097} {"train_loss": -23.739913940429688, "global_step": 174077, "epoch": 2097} {"train_loss": -23.614517211914062, "global_step": 174078, "epoch": 2097} {"train_loss": -24.018186569213867, "global_step": 174079, "epoch": 2097} {"train_loss": -23.86004638671875, "global_step": 174080, "epoch": 2097} {"train_loss": -23.47972297668457, "global_step": 174081, "epoch": 2097} {"train_loss": -23.973108291625977, "global_step": 174082, "epoch": 2097} {"train_loss": -23.555761337280273, "global_step": 174083, "epoch": 2097} {"train_loss": -23.0869083404541, "global_step": 174084, "epoch": 2097} {"train_loss": -23.528873443603516, "global_step": 174085, "epoch": 2097} {"train_loss": -24.000656127929688, "global_step": 174086, "epoch": 2097} {"train_loss": -23.533710479736328, "global_step": 174087, "epoch": 2097} {"train_loss": -23.677291870117188, "global_step": 174088, "epoch": 2097} {"train_loss": -23.551305770874023, "global_step": 174089, "epoch": 2097} {"train_loss": -23.780942916870117, "global_step": 174090, "epoch": 2097} {"train_loss": -23.975900650024414, "global_step": 174091, "epoch": 2097} {"train_loss": -24.0726375579834, "global_step": 174092, "epoch": 2097} {"train_loss": -23.615177154541016, "global_step": 174093, "epoch": 2097} {"train_loss": -23.41568946838379, "global_step": 174094, "epoch": 2097} {"train_loss": -23.84272575378418, "global_step": 174095, "epoch": 2097} {"train_loss": -23.944570541381836, "global_step": 174096, "epoch": 2097} {"train_loss": -23.551542282104492, "global_step": 174097, "epoch": 2097} {"train_loss": -23.69435691833496, "global_step": 174098, "epoch": 2097} {"train_loss": -23.905635833740234, "global_step": 174099, "epoch": 2097} {"train_loss": -23.83277702331543, "global_step": 174100, "epoch": 2097} {"train_loss": -24.012863159179688, "global_step": 174101, "epoch": 2097} {"train_loss": -24.044050216674805, "global_step": 174102, "epoch": 2097} {"train_loss": -23.932767868041992, "global_step": 174103, "epoch": 2097} {"train_loss": -23.819334030151367, "global_step": 174104, "epoch": 2097} {"train_loss": -23.785337448120117, "global_step": 174105, "epoch": 2097} {"train_loss": -23.789268493652344, "global_step": 174106, "epoch": 2097} {"train_loss": -23.997968673706055, "global_step": 174107, "epoch": 2097} {"train_loss": -23.712465286254883, "global_step": 174108, "epoch": 2097} {"train_loss": -23.64759635925293, "global_step": 174109, "epoch": 2097} {"train_loss": -23.322053909301758, "global_step": 174110, "epoch": 2097} {"train_loss": -23.627145767211914, "global_step": 174111, "epoch": 2097} {"train_loss": -23.73139762878418, "global_step": 174112, "epoch": 2097} {"train_loss": -23.819782257080078, "global_step": 174113, "epoch": 2097} {"train_loss": -23.355955123901367, "global_step": 174114, "epoch": 2097} {"train_loss": -23.945117950439453, "global_step": 174115, "epoch": 2097} {"train_loss": -23.749061584472656, "global_step": 174116, "epoch": 2097} {"train_loss": -23.6148738861084, "global_step": 174117, "epoch": 2097} {"train_loss": -23.93230628967285, "global_step": 174118, "epoch": 2097} {"train_loss": -23.873613357543945, "global_step": 174119, "epoch": 2097} {"train_loss": -23.864736557006836, "global_step": 174120, "epoch": 2097} {"train_loss": -23.8337459564209, "global_step": 174121, "epoch": 2097} {"train_loss": -23.800180435180664, "global_step": 174122, "epoch": 2097} {"train_loss": -23.946672439575195, "global_step": 174123, "epoch": 2097} {"train_loss": -23.752073287963867, "global_step": 174124, "epoch": 2097} {"train_loss": -23.8192138671875, "global_step": 174125, "epoch": 2097} {"train_loss": -23.51364517211914, "global_step": 174126, "epoch": 2097} {"train_loss": -23.911304473876953, "global_step": 174127, "epoch": 2097} {"train_loss": -23.774621963500977, "global_step": 174128, "epoch": 2097} {"train_loss": -23.603511810302734, "global_step": 174129, "epoch": 2097} {"train_loss": -24.184001922607422, "global_step": 174130, "epoch": 2097} {"train_loss": -23.674833297729492, "global_step": 174131, "epoch": 2097} {"train_loss": -23.470449447631836, "global_step": 174132, "epoch": 2097} {"train_loss": -23.61659353325166, "global_step": 174133, "epoch": 2097, "val_loss": 6541979.0} {"train_loss": -23.400665283203125, "global_step": 174134, "epoch": 2098} {"train_loss": -23.532270431518555, "global_step": 174135, "epoch": 2098} {"train_loss": -23.75185775756836, "global_step": 174136, "epoch": 2098} {"train_loss": -22.901212692260742, "global_step": 174137, "epoch": 2098} {"train_loss": -23.380321502685547, "global_step": 174138, "epoch": 2098} {"train_loss": -23.716703414916992, "global_step": 174139, "epoch": 2098} {"train_loss": -23.512779235839844, "global_step": 174140, "epoch": 2098} {"train_loss": -23.72096061706543, "global_step": 174141, "epoch": 2098} {"train_loss": -23.376564025878906, "global_step": 174142, "epoch": 2098} {"train_loss": -23.523418426513672, "global_step": 174143, "epoch": 2098} {"train_loss": -23.75672721862793, "global_step": 174144, "epoch": 2098} {"train_loss": -23.358585357666016, "global_step": 174145, "epoch": 2098} {"train_loss": -23.573654174804688, "global_step": 174146, "epoch": 2098} {"train_loss": -23.74764060974121, "global_step": 174147, "epoch": 2098} {"train_loss": -23.204137802124023, "global_step": 174148, "epoch": 2098} {"train_loss": -23.425756454467773, "global_step": 174149, "epoch": 2098} {"train_loss": -23.729736328125, "global_step": 174150, "epoch": 2098} {"train_loss": -23.458959579467773, "global_step": 174151, "epoch": 2098} {"train_loss": -23.723770141601562, "global_step": 174152, "epoch": 2098} {"train_loss": -23.447660446166992, "global_step": 174153, "epoch": 2098} {"train_loss": -23.750213623046875, "global_step": 174154, "epoch": 2098} {"train_loss": -24.128416061401367, "global_step": 174155, "epoch": 2098} {"train_loss": -23.736656188964844, "global_step": 174156, "epoch": 2098} {"train_loss": -23.540050506591797, "global_step": 174157, "epoch": 2098} {"train_loss": -23.864635467529297, "global_step": 174158, "epoch": 2098} {"train_loss": -23.667999267578125, "global_step": 174159, "epoch": 2098} {"train_loss": -23.383026123046875, "global_step": 174160, "epoch": 2098} {"train_loss": -23.911876678466797, "global_step": 174161, "epoch": 2098} {"train_loss": -24.104047775268555, "global_step": 174162, "epoch": 2098} {"train_loss": -23.815521240234375, "global_step": 174163, "epoch": 2098} {"train_loss": -23.67787742614746, "global_step": 174164, "epoch": 2098} {"train_loss": -24.224002838134766, "global_step": 174165, "epoch": 2098} {"train_loss": -24.07306480407715, "global_step": 174166, "epoch": 2098} {"train_loss": -23.837976455688477, "global_step": 174167, "epoch": 2098} {"train_loss": -24.084367752075195, "global_step": 174168, "epoch": 2098} {"train_loss": -23.88273048400879, "global_step": 174169, "epoch": 2098} {"train_loss": -23.78596305847168, "global_step": 174170, "epoch": 2098} {"train_loss": -23.843711853027344, "global_step": 174171, "epoch": 2098} {"train_loss": -23.548242568969727, "global_step": 174172, "epoch": 2098} {"train_loss": -23.83478355407715, "global_step": 174173, "epoch": 2098} {"train_loss": -23.972618103027344, "global_step": 174174, "epoch": 2098} {"train_loss": -23.77444076538086, "global_step": 174175, "epoch": 2098} {"train_loss": -23.558456420898438, "global_step": 174176, "epoch": 2098} {"train_loss": -23.53817367553711, "global_step": 174177, "epoch": 2098} {"train_loss": -23.4119930267334, "global_step": 174178, "epoch": 2098} {"train_loss": -23.383466720581055, "global_step": 174179, "epoch": 2098} {"train_loss": -23.31280517578125, "global_step": 174180, "epoch": 2098} {"train_loss": -23.597726821899414, "global_step": 174181, "epoch": 2098} {"train_loss": -23.735227584838867, "global_step": 174182, "epoch": 2098} {"train_loss": -23.961946487426758, "global_step": 174183, "epoch": 2098} {"train_loss": -23.865694046020508, "global_step": 174184, "epoch": 2098} {"train_loss": -23.49917984008789, "global_step": 174185, "epoch": 2098} {"train_loss": -23.832523345947266, "global_step": 174186, "epoch": 2098} {"train_loss": -23.83159828186035, "global_step": 174187, "epoch": 2098} {"train_loss": -23.64984703063965, "global_step": 174188, "epoch": 2098} {"train_loss": -23.641698837280273, "global_step": 174189, "epoch": 2098} {"train_loss": -23.77667808532715, "global_step": 174190, "epoch": 2098} {"train_loss": -23.450439453125, "global_step": 174191, "epoch": 2098} {"train_loss": -23.54774284362793, "global_step": 174192, "epoch": 2098} {"train_loss": -23.735931396484375, "global_step": 174193, "epoch": 2098} {"train_loss": -23.623323440551758, "global_step": 174194, "epoch": 2098} {"train_loss": -23.704486846923828, "global_step": 174195, "epoch": 2098} {"train_loss": -23.447519302368164, "global_step": 174196, "epoch": 2098} {"train_loss": -24.372777938842773, "global_step": 174197, "epoch": 2098} {"train_loss": -24.035247802734375, "global_step": 174198, "epoch": 2098} {"train_loss": -23.750791549682617, "global_step": 174199, "epoch": 2098} {"train_loss": -24.021947860717773, "global_step": 174200, "epoch": 2098} {"train_loss": -23.84397315979004, "global_step": 174201, "epoch": 2098} {"train_loss": -23.93263816833496, "global_step": 174202, "epoch": 2098} {"train_loss": -24.018476486206055, "global_step": 174203, "epoch": 2098} {"train_loss": -23.92399024963379, "global_step": 174204, "epoch": 2098} {"train_loss": -24.017030715942383, "global_step": 174205, "epoch": 2098} {"train_loss": -23.908803939819336, "global_step": 174206, "epoch": 2098} {"train_loss": -23.622913360595703, "global_step": 174207, "epoch": 2098} {"train_loss": -24.277637481689453, "global_step": 174208, "epoch": 2098} {"train_loss": -24.067991256713867, "global_step": 174209, "epoch": 2098} {"train_loss": -23.780641555786133, "global_step": 174210, "epoch": 2098} {"train_loss": -23.696596145629883, "global_step": 174211, "epoch": 2098} {"train_loss": -23.86514663696289, "global_step": 174212, "epoch": 2098} {"train_loss": -23.655797958374023, "global_step": 174213, "epoch": 2098} {"train_loss": -23.858686447143555, "global_step": 174214, "epoch": 2098} {"train_loss": -23.908916473388672, "global_step": 174215, "epoch": 2098} {"train_loss": -23.704680362379694, "global_step": 174216, "epoch": 2098, "val_loss": 6251220.0} {"train_loss": -22.810529708862305, "global_step": 174217, "epoch": 2099} {"train_loss": -21.963855743408203, "global_step": 174218, "epoch": 2099} {"train_loss": -23.068639755249023, "global_step": 174219, "epoch": 2099} {"train_loss": -22.955520629882812, "global_step": 174220, "epoch": 2099} {"train_loss": -23.040998458862305, "global_step": 174221, "epoch": 2099} {"train_loss": -22.763153076171875, "global_step": 174222, "epoch": 2099} {"train_loss": -23.128957748413086, "global_step": 174223, "epoch": 2099} {"train_loss": -23.04231071472168, "global_step": 174224, "epoch": 2099} {"train_loss": -23.068456649780273, "global_step": 174225, "epoch": 2099} {"train_loss": -23.187667846679688, "global_step": 174226, "epoch": 2099} {"train_loss": -23.34910011291504, "global_step": 174227, "epoch": 2099} {"train_loss": -23.515159606933594, "global_step": 174228, "epoch": 2099} {"train_loss": -23.23902702331543, "global_step": 174229, "epoch": 2099} {"train_loss": -22.960453033447266, "global_step": 174230, "epoch": 2099} {"train_loss": -23.26374053955078, "global_step": 174231, "epoch": 2099} {"train_loss": -22.930402755737305, "global_step": 174232, "epoch": 2099} {"train_loss": -23.111398696899414, "global_step": 174233, "epoch": 2099} {"train_loss": -23.095340728759766, "global_step": 174234, "epoch": 2099} {"train_loss": -23.5555477142334, "global_step": 174235, "epoch": 2099} {"train_loss": -23.198894500732422, "global_step": 174236, "epoch": 2099} {"train_loss": -23.4400691986084, "global_step": 174237, "epoch": 2099} {"train_loss": -23.473236083984375, "global_step": 174238, "epoch": 2099} {"train_loss": -22.98048210144043, "global_step": 174239, "epoch": 2099} {"train_loss": -23.83498764038086, "global_step": 174240, "epoch": 2099} {"train_loss": -23.330034255981445, "global_step": 174241, "epoch": 2099} {"train_loss": -23.526575088500977, "global_step": 174242, "epoch": 2099} {"train_loss": -22.968183517456055, "global_step": 174243, "epoch": 2099} {"train_loss": -23.354162216186523, "global_step": 174244, "epoch": 2099} {"train_loss": -23.69766616821289, "global_step": 174245, "epoch": 2099} {"train_loss": -23.50626564025879, "global_step": 174246, "epoch": 2099} {"train_loss": -23.48408317565918, "global_step": 174247, "epoch": 2099} {"train_loss": -23.74895477294922, "global_step": 174248, "epoch": 2099} {"train_loss": -23.649511337280273, "global_step": 174249, "epoch": 2099} {"train_loss": -23.94583511352539, "global_step": 174250, "epoch": 2099} {"train_loss": -23.544925689697266, "global_step": 174251, "epoch": 2099} {"train_loss": -23.802732467651367, "global_step": 174252, "epoch": 2099} {"train_loss": -23.800527572631836, "global_step": 174253, "epoch": 2099} {"train_loss": -24.068979263305664, "global_step": 174254, "epoch": 2099} {"train_loss": -23.942636489868164, "global_step": 174255, "epoch": 2099} {"train_loss": -23.68807029724121, "global_step": 174256, "epoch": 2099} {"train_loss": -23.533527374267578, "global_step": 174257, "epoch": 2099} {"train_loss": -23.733436584472656, "global_step": 174258, "epoch": 2099} {"train_loss": -23.754501342773438, "global_step": 174259, "epoch": 2099} {"train_loss": -24.1424560546875, "global_step": 174260, "epoch": 2099} {"train_loss": -23.369525909423828, "global_step": 174261, "epoch": 2099} {"train_loss": -23.72303581237793, "global_step": 174262, "epoch": 2099} {"train_loss": -23.97658348083496, "global_step": 174263, "epoch": 2099} {"train_loss": -23.77662467956543, "global_step": 174264, "epoch": 2099} {"train_loss": -23.81939125061035, "global_step": 174265, "epoch": 2099} {"train_loss": -23.50874137878418, "global_step": 174266, "epoch": 2099} {"train_loss": -23.613935470581055, "global_step": 174267, "epoch": 2099} {"train_loss": -23.475147247314453, "global_step": 174268, "epoch": 2099} {"train_loss": -23.331844329833984, "global_step": 174269, "epoch": 2099} {"train_loss": -23.836078643798828, "global_step": 174270, "epoch": 2099} {"train_loss": -23.49469566345215, "global_step": 174271, "epoch": 2099} {"train_loss": -23.687360763549805, "global_step": 174272, "epoch": 2099} {"train_loss": -23.57217788696289, "global_step": 174273, "epoch": 2099} {"train_loss": -23.642011642456055, "global_step": 174274, "epoch": 2099} {"train_loss": -23.908924102783203, "global_step": 174275, "epoch": 2099} {"train_loss": -23.901165008544922, "global_step": 174276, "epoch": 2099} {"train_loss": -23.752685546875, "global_step": 174277, "epoch": 2099} {"train_loss": -23.763587951660156, "global_step": 174278, "epoch": 2099} {"train_loss": -23.63522720336914, "global_step": 174279, "epoch": 2099} {"train_loss": -23.552907943725586, "global_step": 174280, "epoch": 2099} {"train_loss": -23.875776290893555, "global_step": 174281, "epoch": 2099} {"train_loss": -23.39962387084961, "global_step": 174282, "epoch": 2099} {"train_loss": -23.42560386657715, "global_step": 174283, "epoch": 2099} {"train_loss": -23.645647048950195, "global_step": 174284, "epoch": 2099} {"train_loss": -24.028141021728516, "global_step": 174285, "epoch": 2099} {"train_loss": -23.643735885620117, "global_step": 174286, "epoch": 2099} {"train_loss": -23.57278060913086, "global_step": 174287, "epoch": 2099} {"train_loss": -23.85628318786621, "global_step": 174288, "epoch": 2099} {"train_loss": -23.808942794799805, "global_step": 174289, "epoch": 2099} {"train_loss": -23.975400924682617, "global_step": 174290, "epoch": 2099} {"train_loss": -23.702911376953125, "global_step": 174291, "epoch": 2099} {"train_loss": -23.554553985595703, "global_step": 174292, "epoch": 2099} {"train_loss": -23.85463523864746, "global_step": 174293, "epoch": 2099} {"train_loss": -23.86499786376953, "global_step": 174294, "epoch": 2099} {"train_loss": -23.65663719177246, "global_step": 174295, "epoch": 2099} {"train_loss": -23.47035026550293, "global_step": 174296, "epoch": 2099} {"train_loss": -23.59590721130371, "global_step": 174297, "epoch": 2099} {"train_loss": -23.91376304626465, "global_step": 174298, "epoch": 2099} {"train_loss": -23.542251931615624, "global_step": 174299, "epoch": 2099, "val_loss": 6517190.0} {"train_loss": -23.041166305541992, "global_step": 174300, "epoch": 2100} {"train_loss": -23.76531410217285, "global_step": 174301, "epoch": 2100} {"train_loss": -23.521984100341797, "global_step": 174302, "epoch": 2100} {"train_loss": -23.176191329956055, "global_step": 174303, "epoch": 2100} {"train_loss": -23.39088249206543, "global_step": 174304, "epoch": 2100} {"train_loss": -23.290699005126953, "global_step": 174305, "epoch": 2100} {"train_loss": -23.317590713500977, "global_step": 174306, "epoch": 2100} {"train_loss": -23.352319717407227, "global_step": 174307, "epoch": 2100} {"train_loss": -23.292964935302734, "global_step": 174308, "epoch": 2100} {"train_loss": -23.96803855895996, "global_step": 174309, "epoch": 2100} {"train_loss": -23.24911880493164, "global_step": 174310, "epoch": 2100} {"train_loss": -23.694183349609375, "global_step": 174311, "epoch": 2100} {"train_loss": -23.53571891784668, "global_step": 174312, "epoch": 2100} {"train_loss": -23.53963279724121, "global_step": 174313, "epoch": 2100} {"train_loss": -23.68992042541504, "global_step": 174314, "epoch": 2100} {"train_loss": -23.757373809814453, "global_step": 174315, "epoch": 2100} {"train_loss": -24.145498275756836, "global_step": 174316, "epoch": 2100} {"train_loss": -23.78242301940918, "global_step": 174317, "epoch": 2100} {"train_loss": -23.7609806060791, "global_step": 174318, "epoch": 2100} {"train_loss": -23.324655532836914, "global_step": 174319, "epoch": 2100} {"train_loss": -23.429838180541992, "global_step": 174320, "epoch": 2100} {"train_loss": -23.5915584564209, "global_step": 174321, "epoch": 2100} {"train_loss": -23.746898651123047, "global_step": 174322, "epoch": 2100} {"train_loss": -23.665740966796875, "global_step": 174323, "epoch": 2100} {"train_loss": -23.41583251953125, "global_step": 174324, "epoch": 2100} {"train_loss": -23.35564613342285, "global_step": 174325, "epoch": 2100} {"train_loss": -23.476123809814453, "global_step": 174326, "epoch": 2100} {"train_loss": -23.437700271606445, "global_step": 174327, "epoch": 2100} {"train_loss": -23.523550033569336, "global_step": 174328, "epoch": 2100} {"train_loss": -23.8591365814209, "global_step": 174329, "epoch": 2100} {"train_loss": -23.613431930541992, "global_step": 174330, "epoch": 2100} {"train_loss": -23.97466278076172, "global_step": 174331, "epoch": 2100} {"train_loss": -23.871978759765625, "global_step": 174332, "epoch": 2100} {"train_loss": -23.652484893798828, "global_step": 174333, "epoch": 2100} {"train_loss": -23.845380783081055, "global_step": 174334, "epoch": 2100} {"train_loss": -23.819503784179688, "global_step": 174335, "epoch": 2100} {"train_loss": -23.91750144958496, "global_step": 174336, "epoch": 2100} {"train_loss": -24.00809669494629, "global_step": 174337, "epoch": 2100} {"train_loss": -24.013214111328125, "global_step": 174338, "epoch": 2100} {"train_loss": -23.974111557006836, "global_step": 174339, "epoch": 2100} {"train_loss": -24.00115203857422, "global_step": 174340, "epoch": 2100} {"train_loss": -23.62226676940918, "global_step": 174341, "epoch": 2100} {"train_loss": -24.085220336914062, "global_step": 174342, "epoch": 2100} {"train_loss": -24.38581085205078, "global_step": 174343, "epoch": 2100} {"train_loss": -24.076398849487305, "global_step": 174344, "epoch": 2100} {"train_loss": -23.73922348022461, "global_step": 174345, "epoch": 2100} {"train_loss": -23.639331817626953, "global_step": 174346, "epoch": 2100} {"train_loss": -23.855243682861328, "global_step": 174347, "epoch": 2100} {"train_loss": -23.957807540893555, "global_step": 174348, "epoch": 2100} {"train_loss": -24.115453720092773, "global_step": 174349, "epoch": 2100} {"train_loss": -23.81247901916504, "global_step": 174350, "epoch": 2100} {"train_loss": -23.761655807495117, "global_step": 174351, "epoch": 2100} {"train_loss": -23.700963973999023, "global_step": 174352, "epoch": 2100} {"train_loss": -23.562759399414062, "global_step": 174353, "epoch": 2100} {"train_loss": -23.81513786315918, "global_step": 174354, "epoch": 2100} {"train_loss": -24.102773666381836, "global_step": 174355, "epoch": 2100} {"train_loss": -23.898529052734375, "global_step": 174356, "epoch": 2100} {"train_loss": -23.686559677124023, "global_step": 174357, "epoch": 2100} {"train_loss": -24.122344970703125, "global_step": 174358, "epoch": 2100} {"train_loss": -24.0310001373291, "global_step": 174359, "epoch": 2100} {"train_loss": -24.046335220336914, "global_step": 174360, "epoch": 2100} {"train_loss": -23.69495964050293, "global_step": 174361, "epoch": 2100} {"train_loss": -23.906232833862305, "global_step": 174362, "epoch": 2100} {"train_loss": -23.589597702026367, "global_step": 174363, "epoch": 2100} {"train_loss": -23.50048065185547, "global_step": 174364, "epoch": 2100} {"train_loss": -23.990970611572266, "global_step": 174365, "epoch": 2100} {"train_loss": -23.99199867248535, "global_step": 174366, "epoch": 2100} {"train_loss": -23.555715560913086, "global_step": 174367, "epoch": 2100} {"train_loss": -23.860271453857422, "global_step": 174368, "epoch": 2100} {"train_loss": -23.662050247192383, "global_step": 174369, "epoch": 2100} {"train_loss": -23.605680465698242, "global_step": 174370, "epoch": 2100} {"train_loss": -24.123952865600586, "global_step": 174371, "epoch": 2100} {"train_loss": -23.802330017089844, "global_step": 174372, "epoch": 2100} {"train_loss": -24.145605087280273, "global_step": 174373, "epoch": 2100} {"train_loss": -23.886978149414062, "global_step": 174374, "epoch": 2100} {"train_loss": -23.66355323791504, "global_step": 174375, "epoch": 2100} {"train_loss": -23.82197380065918, "global_step": 174376, "epoch": 2100} {"train_loss": -23.555051803588867, "global_step": 174377, "epoch": 2100} {"train_loss": -23.606201171875, "global_step": 174378, "epoch": 2100} {"train_loss": -23.954938888549805, "global_step": 174379, "epoch": 2100} {"train_loss": -23.701704025268555, "global_step": 174380, "epoch": 2100} {"train_loss": -23.27589988708496, "global_step": 174381, "epoch": 2100} {"train_loss": -23.75461224475539, "global_step": 174382, "epoch": 2100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6460526.5} {"train_loss": -23.142160415649414, "global_step": 174383, "epoch": 2101} {"train_loss": -23.556856155395508, "global_step": 174384, "epoch": 2101} {"train_loss": -23.410390853881836, "global_step": 174385, "epoch": 2101} {"train_loss": -23.097089767456055, "global_step": 174386, "epoch": 2101} {"train_loss": -23.52358055114746, "global_step": 174387, "epoch": 2101} {"train_loss": -23.140329360961914, "global_step": 174388, "epoch": 2101} {"train_loss": -23.287195205688477, "global_step": 174389, "epoch": 2101} {"train_loss": -23.495527267456055, "global_step": 174390, "epoch": 2101} {"train_loss": -23.083093643188477, "global_step": 174391, "epoch": 2101} {"train_loss": -23.24762725830078, "global_step": 174392, "epoch": 2101} {"train_loss": -23.57659339904785, "global_step": 174393, "epoch": 2101} {"train_loss": -23.360523223876953, "global_step": 174394, "epoch": 2101} {"train_loss": -23.113605499267578, "global_step": 174395, "epoch": 2101} {"train_loss": -23.366361618041992, "global_step": 174396, "epoch": 2101} {"train_loss": -23.357675552368164, "global_step": 174397, "epoch": 2101} {"train_loss": -23.4216251373291, "global_step": 174398, "epoch": 2101} {"train_loss": -24.017789840698242, "global_step": 174399, "epoch": 2101} {"train_loss": -23.250255584716797, "global_step": 174400, "epoch": 2101} {"train_loss": -23.902992248535156, "global_step": 174401, "epoch": 2101} {"train_loss": -23.772573471069336, "global_step": 174402, "epoch": 2101} {"train_loss": -23.424253463745117, "global_step": 174403, "epoch": 2101} {"train_loss": -23.657575607299805, "global_step": 174404, "epoch": 2101} {"train_loss": -23.647123336791992, "global_step": 174405, "epoch": 2101} {"train_loss": -23.45492172241211, "global_step": 174406, "epoch": 2101} {"train_loss": -23.4754581451416, "global_step": 174407, "epoch": 2101} {"train_loss": -23.75941276550293, "global_step": 174408, "epoch": 2101} {"train_loss": -23.785625457763672, "global_step": 174409, "epoch": 2101} {"train_loss": -23.9415283203125, "global_step": 174410, "epoch": 2101} {"train_loss": -23.898723602294922, "global_step": 174411, "epoch": 2101} {"train_loss": -23.702754974365234, "global_step": 174412, "epoch": 2101} {"train_loss": -23.664602279663086, "global_step": 174413, "epoch": 2101} {"train_loss": -23.73838233947754, "global_step": 174414, "epoch": 2101} {"train_loss": -23.808961868286133, "global_step": 174415, "epoch": 2101} {"train_loss": -23.716947555541992, "global_step": 174416, "epoch": 2101} {"train_loss": -23.87822151184082, "global_step": 174417, "epoch": 2101} {"train_loss": -23.801307678222656, "global_step": 174418, "epoch": 2101} {"train_loss": -24.016042709350586, "global_step": 174419, "epoch": 2101} {"train_loss": -23.748523712158203, "global_step": 174420, "epoch": 2101} {"train_loss": -23.90266990661621, "global_step": 174421, "epoch": 2101} {"train_loss": -24.260404586791992, "global_step": 174422, "epoch": 2101} {"train_loss": -23.98828125, "global_step": 174423, "epoch": 2101} {"train_loss": -23.918943405151367, "global_step": 174424, "epoch": 2101} {"train_loss": -23.828428268432617, "global_step": 174425, "epoch": 2101} {"train_loss": -24.01756477355957, "global_step": 174426, "epoch": 2101} {"train_loss": -23.718385696411133, "global_step": 174427, "epoch": 2101} {"train_loss": -23.876144409179688, "global_step": 174428, "epoch": 2101} {"train_loss": -23.99087905883789, "global_step": 174429, "epoch": 2101} {"train_loss": -23.55929946899414, "global_step": 174430, "epoch": 2101} {"train_loss": -23.50786018371582, "global_step": 174431, "epoch": 2101} {"train_loss": -23.640336990356445, "global_step": 174432, "epoch": 2101} {"train_loss": -23.702083587646484, "global_step": 174433, "epoch": 2101} {"train_loss": -23.761024475097656, "global_step": 174434, "epoch": 2101} {"train_loss": -24.089963912963867, "global_step": 174435, "epoch": 2101} {"train_loss": -23.671411514282227, "global_step": 174436, "epoch": 2101} {"train_loss": -23.579954147338867, "global_step": 174437, "epoch": 2101} {"train_loss": -23.785114288330078, "global_step": 174438, "epoch": 2101} {"train_loss": -23.926977157592773, "global_step": 174439, "epoch": 2101} {"train_loss": -23.756061553955078, "global_step": 174440, "epoch": 2101} {"train_loss": -23.32216453552246, "global_step": 174441, "epoch": 2101} {"train_loss": -23.41554069519043, "global_step": 174442, "epoch": 2101} {"train_loss": -24.208646774291992, "global_step": 174443, "epoch": 2101} {"train_loss": -24.016361236572266, "global_step": 174444, "epoch": 2101} {"train_loss": -23.79658317565918, "global_step": 174445, "epoch": 2101} {"train_loss": -23.778717041015625, "global_step": 174446, "epoch": 2101} {"train_loss": -23.45587730407715, "global_step": 174447, "epoch": 2101} {"train_loss": -24.157350540161133, "global_step": 174448, "epoch": 2101} {"train_loss": -23.7834415435791, "global_step": 174449, "epoch": 2101} {"train_loss": -23.78580093383789, "global_step": 174450, "epoch": 2101} {"train_loss": -23.839672088623047, "global_step": 174451, "epoch": 2101} {"train_loss": -23.833513259887695, "global_step": 174452, "epoch": 2101} {"train_loss": -23.9848575592041, "global_step": 174453, "epoch": 2101} {"train_loss": -24.00373649597168, "global_step": 174454, "epoch": 2101} {"train_loss": -23.612051010131836, "global_step": 174455, "epoch": 2101} {"train_loss": -23.82027244567871, "global_step": 174456, "epoch": 2101} {"train_loss": -23.96380043029785, "global_step": 174457, "epoch": 2101} {"train_loss": -23.9986572265625, "global_step": 174458, "epoch": 2101} {"train_loss": -23.9177303314209, "global_step": 174459, "epoch": 2101} {"train_loss": -23.631641387939453, "global_step": 174460, "epoch": 2101} {"train_loss": -24.059324264526367, "global_step": 174461, "epoch": 2101} {"train_loss": -23.74951171875, "global_step": 174462, "epoch": 2101} {"train_loss": -23.769615173339844, "global_step": 174463, "epoch": 2101} {"train_loss": -23.2999267578125, "global_step": 174464, "epoch": 2101} {"train_loss": -23.678927846701747, "global_step": 174465, "epoch": 2101, "val_loss": 6334792.5} {"train_loss": -22.750791549682617, "global_step": 174466, "epoch": 2102} {"train_loss": -23.520267486572266, "global_step": 174467, "epoch": 2102} {"train_loss": -23.530323028564453, "global_step": 174468, "epoch": 2102} {"train_loss": -23.25066566467285, "global_step": 174469, "epoch": 2102} {"train_loss": -23.630619049072266, "global_step": 174470, "epoch": 2102} {"train_loss": -23.45754051208496, "global_step": 174471, "epoch": 2102} {"train_loss": -23.137937545776367, "global_step": 174472, "epoch": 2102} {"train_loss": -23.71015739440918, "global_step": 174473, "epoch": 2102} {"train_loss": -23.833547592163086, "global_step": 174474, "epoch": 2102} {"train_loss": -23.518817901611328, "global_step": 174475, "epoch": 2102} {"train_loss": -23.268957138061523, "global_step": 174476, "epoch": 2102} {"train_loss": -23.8992862701416, "global_step": 174477, "epoch": 2102} {"train_loss": -23.673583984375, "global_step": 174478, "epoch": 2102} {"train_loss": -23.57718849182129, "global_step": 174479, "epoch": 2102} {"train_loss": -23.876100540161133, "global_step": 174480, "epoch": 2102} {"train_loss": -23.84187889099121, "global_step": 174481, "epoch": 2102} {"train_loss": -23.727161407470703, "global_step": 174482, "epoch": 2102} {"train_loss": -23.4842586517334, "global_step": 174483, "epoch": 2102} {"train_loss": -23.635019302368164, "global_step": 174484, "epoch": 2102} {"train_loss": -23.932655334472656, "global_step": 174485, "epoch": 2102} {"train_loss": -24.053617477416992, "global_step": 174486, "epoch": 2102} {"train_loss": -23.472244262695312, "global_step": 174487, "epoch": 2102} {"train_loss": -24.170095443725586, "global_step": 174488, "epoch": 2102} {"train_loss": -23.524749755859375, "global_step": 174489, "epoch": 2102} {"train_loss": -24.14949607849121, "global_step": 174490, "epoch": 2102} {"train_loss": -23.688032150268555, "global_step": 174491, "epoch": 2102} {"train_loss": -23.842288970947266, "global_step": 174492, "epoch": 2102} {"train_loss": -23.83257293701172, "global_step": 174493, "epoch": 2102} {"train_loss": -23.565536499023438, "global_step": 174494, "epoch": 2102} {"train_loss": -23.749732971191406, "global_step": 174495, "epoch": 2102} {"train_loss": -23.73431968688965, "global_step": 174496, "epoch": 2102} {"train_loss": -23.749359130859375, "global_step": 174497, "epoch": 2102} {"train_loss": -23.61674690246582, "global_step": 174498, "epoch": 2102} {"train_loss": -23.527685165405273, "global_step": 174499, "epoch": 2102} {"train_loss": -23.995468139648438, "global_step": 174500, "epoch": 2102} {"train_loss": -23.936683654785156, "global_step": 174501, "epoch": 2102} {"train_loss": -23.4753475189209, "global_step": 174502, "epoch": 2102} {"train_loss": -24.332321166992188, "global_step": 174503, "epoch": 2102} {"train_loss": -23.816722869873047, "global_step": 174504, "epoch": 2102} {"train_loss": -23.759428024291992, "global_step": 174505, "epoch": 2102} {"train_loss": -23.758207321166992, "global_step": 174506, "epoch": 2102} {"train_loss": -23.874040603637695, "global_step": 174507, "epoch": 2102} {"train_loss": -24.067779541015625, "global_step": 174508, "epoch": 2102} {"train_loss": -24.16857147216797, "global_step": 174509, "epoch": 2102} {"train_loss": -23.98200798034668, "global_step": 174510, "epoch": 2102} {"train_loss": -23.671018600463867, "global_step": 174511, "epoch": 2102} {"train_loss": -23.775455474853516, "global_step": 174512, "epoch": 2102} {"train_loss": -23.91704750061035, "global_step": 174513, "epoch": 2102} {"train_loss": -23.83505630493164, "global_step": 174514, "epoch": 2102} {"train_loss": -24.096845626831055, "global_step": 174515, "epoch": 2102} {"train_loss": -24.03110122680664, "global_step": 174516, "epoch": 2102} {"train_loss": -23.94765281677246, "global_step": 174517, "epoch": 2102} {"train_loss": -23.641338348388672, "global_step": 174518, "epoch": 2102} {"train_loss": -23.486434936523438, "global_step": 174519, "epoch": 2102} {"train_loss": -23.809818267822266, "global_step": 174520, "epoch": 2102} {"train_loss": -24.025009155273438, "global_step": 174521, "epoch": 2102} {"train_loss": -23.721261978149414, "global_step": 174522, "epoch": 2102} {"train_loss": -23.923803329467773, "global_step": 174523, "epoch": 2102} {"train_loss": -24.321569442749023, "global_step": 174524, "epoch": 2102} {"train_loss": -23.763525009155273, "global_step": 174525, "epoch": 2102} {"train_loss": -23.423099517822266, "global_step": 174526, "epoch": 2102} {"train_loss": -23.721500396728516, "global_step": 174527, "epoch": 2102} {"train_loss": -24.032569885253906, "global_step": 174528, "epoch": 2102} {"train_loss": -23.675676345825195, "global_step": 174529, "epoch": 2102} {"train_loss": -23.566274642944336, "global_step": 174530, "epoch": 2102} {"train_loss": -23.764577865600586, "global_step": 174531, "epoch": 2102} {"train_loss": -24.083223342895508, "global_step": 174532, "epoch": 2102} {"train_loss": -23.867267608642578, "global_step": 174533, "epoch": 2102} {"train_loss": -24.109411239624023, "global_step": 174534, "epoch": 2102} {"train_loss": -23.72645378112793, "global_step": 174535, "epoch": 2102} {"train_loss": -23.89322853088379, "global_step": 174536, "epoch": 2102} {"train_loss": -23.82235336303711, "global_step": 174537, "epoch": 2102} {"train_loss": -24.039047241210938, "global_step": 174538, "epoch": 2102} {"train_loss": -24.027721405029297, "global_step": 174539, "epoch": 2102} {"train_loss": -23.76019287109375, "global_step": 174540, "epoch": 2102} {"train_loss": -23.6588077545166, "global_step": 174541, "epoch": 2102} {"train_loss": -23.70329475402832, "global_step": 174542, "epoch": 2102} {"train_loss": -23.784696578979492, "global_step": 174543, "epoch": 2102} {"train_loss": -23.83710289001465, "global_step": 174544, "epoch": 2102} {"train_loss": -23.721288681030273, "global_step": 174545, "epoch": 2102} {"train_loss": -23.67962646484375, "global_step": 174546, "epoch": 2102} {"train_loss": -23.602109909057617, "global_step": 174547, "epoch": 2102} {"train_loss": -23.76918068851333, "global_step": 174548, "epoch": 2102, "val_loss": 6350299.0} {"train_loss": -22.410736083984375, "global_step": 174549, "epoch": 2103} {"train_loss": -22.405044555664062, "global_step": 174550, "epoch": 2103} {"train_loss": -22.436059951782227, "global_step": 174551, "epoch": 2103} {"train_loss": -22.648361206054688, "global_step": 174552, "epoch": 2103} {"train_loss": -23.20867919921875, "global_step": 174553, "epoch": 2103} {"train_loss": -23.122018814086914, "global_step": 174554, "epoch": 2103} {"train_loss": -23.64349937438965, "global_step": 174555, "epoch": 2103} {"train_loss": -23.34237289428711, "global_step": 174556, "epoch": 2103} {"train_loss": -23.322797775268555, "global_step": 174557, "epoch": 2103} {"train_loss": -23.237445831298828, "global_step": 174558, "epoch": 2103} {"train_loss": -23.29843521118164, "global_step": 174559, "epoch": 2103} {"train_loss": -23.442625045776367, "global_step": 174560, "epoch": 2103} {"train_loss": -23.54620933532715, "global_step": 174561, "epoch": 2103} {"train_loss": -23.479759216308594, "global_step": 174562, "epoch": 2103} {"train_loss": -23.495656967163086, "global_step": 174563, "epoch": 2103} {"train_loss": -23.436100006103516, "global_step": 174564, "epoch": 2103} {"train_loss": -23.33732032775879, "global_step": 174565, "epoch": 2103} {"train_loss": -23.02968978881836, "global_step": 174566, "epoch": 2103} {"train_loss": -23.275842666625977, "global_step": 174567, "epoch": 2103} {"train_loss": -23.145944595336914, "global_step": 174568, "epoch": 2103} {"train_loss": -23.482357025146484, "global_step": 174569, "epoch": 2103} {"train_loss": -23.356857299804688, "global_step": 174570, "epoch": 2103} {"train_loss": -23.028656005859375, "global_step": 174571, "epoch": 2103} {"train_loss": -23.114683151245117, "global_step": 174572, "epoch": 2103} {"train_loss": -23.360233306884766, "global_step": 174573, "epoch": 2103} {"train_loss": -23.36005401611328, "global_step": 174574, "epoch": 2103} {"train_loss": -23.172895431518555, "global_step": 174575, "epoch": 2103} {"train_loss": -23.219419479370117, "global_step": 174576, "epoch": 2103} {"train_loss": -23.462446212768555, "global_step": 174577, "epoch": 2103} {"train_loss": -23.275785446166992, "global_step": 174578, "epoch": 2103} {"train_loss": -23.508460998535156, "global_step": 174579, "epoch": 2103} {"train_loss": -23.754392623901367, "global_step": 174580, "epoch": 2103} {"train_loss": -23.918237686157227, "global_step": 174581, "epoch": 2103} {"train_loss": -23.76336669921875, "global_step": 174582, "epoch": 2103} {"train_loss": -23.64789581298828, "global_step": 174583, "epoch": 2103} {"train_loss": -23.721515655517578, "global_step": 174584, "epoch": 2103} {"train_loss": -23.847566604614258, "global_step": 174585, "epoch": 2103} {"train_loss": -23.80618667602539, "global_step": 174586, "epoch": 2103} {"train_loss": -23.274168014526367, "global_step": 174587, "epoch": 2103} {"train_loss": -23.75668716430664, "global_step": 174588, "epoch": 2103} {"train_loss": -23.963623046875, "global_step": 174589, "epoch": 2103} {"train_loss": -23.75965118408203, "global_step": 174590, "epoch": 2103} {"train_loss": -24.048343658447266, "global_step": 174591, "epoch": 2103} {"train_loss": -23.6221923828125, "global_step": 174592, "epoch": 2103} {"train_loss": -24.00899314880371, "global_step": 174593, "epoch": 2103} {"train_loss": -23.855833053588867, "global_step": 174594, "epoch": 2103} {"train_loss": -24.101459503173828, "global_step": 174595, "epoch": 2103} {"train_loss": -23.7990779876709, "global_step": 174596, "epoch": 2103} {"train_loss": -23.680801391601562, "global_step": 174597, "epoch": 2103} {"train_loss": -23.984060287475586, "global_step": 174598, "epoch": 2103} {"train_loss": -23.82264518737793, "global_step": 174599, "epoch": 2103} {"train_loss": -23.56050682067871, "global_step": 174600, "epoch": 2103} {"train_loss": -23.37718963623047, "global_step": 174601, "epoch": 2103} {"train_loss": -23.754552841186523, "global_step": 174602, "epoch": 2103} {"train_loss": -24.34466552734375, "global_step": 174603, "epoch": 2103} {"train_loss": -24.247060775756836, "global_step": 174604, "epoch": 2103} {"train_loss": -23.89509391784668, "global_step": 174605, "epoch": 2103} {"train_loss": -23.75661277770996, "global_step": 174606, "epoch": 2103} {"train_loss": -23.889925003051758, "global_step": 174607, "epoch": 2103} {"train_loss": -23.61627197265625, "global_step": 174608, "epoch": 2103} {"train_loss": -23.976072311401367, "global_step": 174609, "epoch": 2103} {"train_loss": -23.66283416748047, "global_step": 174610, "epoch": 2103} {"train_loss": -23.90827178955078, "global_step": 174611, "epoch": 2103} {"train_loss": -23.563434600830078, "global_step": 174612, "epoch": 2103} {"train_loss": -23.461185455322266, "global_step": 174613, "epoch": 2103} {"train_loss": -23.730005264282227, "global_step": 174614, "epoch": 2103} {"train_loss": -23.79328727722168, "global_step": 174615, "epoch": 2103} {"train_loss": -24.23282241821289, "global_step": 174616, "epoch": 2103} {"train_loss": -23.814849853515625, "global_step": 174617, "epoch": 2103} {"train_loss": -23.72971534729004, "global_step": 174618, "epoch": 2103} {"train_loss": -23.31769371032715, "global_step": 174619, "epoch": 2103} {"train_loss": -23.87225341796875, "global_step": 174620, "epoch": 2103} {"train_loss": -23.457687377929688, "global_step": 174621, "epoch": 2103} {"train_loss": -23.588653564453125, "global_step": 174622, "epoch": 2103} {"train_loss": -23.831069946289062, "global_step": 174623, "epoch": 2103} {"train_loss": -23.53313446044922, "global_step": 174624, "epoch": 2103} {"train_loss": -23.745849609375, "global_step": 174625, "epoch": 2103} {"train_loss": -24.091039657592773, "global_step": 174626, "epoch": 2103} {"train_loss": -23.719165802001953, "global_step": 174627, "epoch": 2103} {"train_loss": -23.838272094726562, "global_step": 174628, "epoch": 2103} {"train_loss": -23.9231014251709, "global_step": 174629, "epoch": 2103} {"train_loss": -24.200698852539062, "global_step": 174630, "epoch": 2103} {"train_loss": -23.573082728558276, "global_step": 174631, "epoch": 2103, "val_loss": 6444406.0} {"train_loss": -23.799888610839844, "global_step": 174632, "epoch": 2104} {"train_loss": -23.1958065032959, "global_step": 174633, "epoch": 2104} {"train_loss": -23.6412353515625, "global_step": 174634, "epoch": 2104} {"train_loss": -23.820850372314453, "global_step": 174635, "epoch": 2104} {"train_loss": -23.1490421295166, "global_step": 174636, "epoch": 2104} {"train_loss": -23.237781524658203, "global_step": 174637, "epoch": 2104} {"train_loss": -23.357397079467773, "global_step": 174638, "epoch": 2104} {"train_loss": -23.750030517578125, "global_step": 174639, "epoch": 2104} {"train_loss": -23.50394058227539, "global_step": 174640, "epoch": 2104} {"train_loss": -23.817001342773438, "global_step": 174641, "epoch": 2104} {"train_loss": -23.73430824279785, "global_step": 174642, "epoch": 2104} {"train_loss": -22.97408103942871, "global_step": 174643, "epoch": 2104} {"train_loss": -23.527082443237305, "global_step": 174644, "epoch": 2104} {"train_loss": -23.82264518737793, "global_step": 174645, "epoch": 2104} {"train_loss": -23.532459259033203, "global_step": 174646, "epoch": 2104} {"train_loss": -24.06119155883789, "global_step": 174647, "epoch": 2104} {"train_loss": -24.08864402770996, "global_step": 174648, "epoch": 2104} {"train_loss": -23.55431365966797, "global_step": 174649, "epoch": 2104} {"train_loss": -23.767637252807617, "global_step": 174650, "epoch": 2104} {"train_loss": -23.60615348815918, "global_step": 174651, "epoch": 2104} {"train_loss": -23.359609603881836, "global_step": 174652, "epoch": 2104} {"train_loss": -24.066747665405273, "global_step": 174653, "epoch": 2104} {"train_loss": -23.846576690673828, "global_step": 174654, "epoch": 2104} {"train_loss": -23.538991928100586, "global_step": 174655, "epoch": 2104} {"train_loss": -23.594684600830078, "global_step": 174656, "epoch": 2104} {"train_loss": -23.897871017456055, "global_step": 174657, "epoch": 2104} {"train_loss": -23.803232192993164, "global_step": 174658, "epoch": 2104} {"train_loss": -23.959354400634766, "global_step": 174659, "epoch": 2104} {"train_loss": -24.353363037109375, "global_step": 174660, "epoch": 2104} {"train_loss": -23.789819717407227, "global_step": 174661, "epoch": 2104} {"train_loss": -23.719776153564453, "global_step": 174662, "epoch": 2104} {"train_loss": -23.95911979675293, "global_step": 174663, "epoch": 2104} {"train_loss": -23.905147552490234, "global_step": 174664, "epoch": 2104} {"train_loss": -23.91090202331543, "global_step": 174665, "epoch": 2104} {"train_loss": -23.95229148864746, "global_step": 174666, "epoch": 2104} {"train_loss": -23.819921493530273, "global_step": 174667, "epoch": 2104} {"train_loss": -23.898193359375, "global_step": 174668, "epoch": 2104} {"train_loss": -24.13014030456543, "global_step": 174669, "epoch": 2104} {"train_loss": -23.714269638061523, "global_step": 174670, "epoch": 2104} {"train_loss": -23.730382919311523, "global_step": 174671, "epoch": 2104} {"train_loss": -23.791946411132812, "global_step": 174672, "epoch": 2104} {"train_loss": -23.442718505859375, "global_step": 174673, "epoch": 2104} {"train_loss": -23.631736755371094, "global_step": 174674, "epoch": 2104} {"train_loss": -23.488510131835938, "global_step": 174675, "epoch": 2104} {"train_loss": -23.814268112182617, "global_step": 174676, "epoch": 2104} {"train_loss": -23.60982322692871, "global_step": 174677, "epoch": 2104} {"train_loss": -23.728816986083984, "global_step": 174678, "epoch": 2104} {"train_loss": -23.436290740966797, "global_step": 174679, "epoch": 2104} {"train_loss": -23.883420944213867, "global_step": 174680, "epoch": 2104} {"train_loss": -23.824031829833984, "global_step": 174681, "epoch": 2104} {"train_loss": -23.828840255737305, "global_step": 174682, "epoch": 2104} {"train_loss": -23.976734161376953, "global_step": 174683, "epoch": 2104} {"train_loss": -23.69978141784668, "global_step": 174684, "epoch": 2104} {"train_loss": -23.154632568359375, "global_step": 174685, "epoch": 2104} {"train_loss": -23.662830352783203, "global_step": 174686, "epoch": 2104} {"train_loss": -23.949241638183594, "global_step": 174687, "epoch": 2104} {"train_loss": -23.68949317932129, "global_step": 174688, "epoch": 2104} {"train_loss": -23.70871353149414, "global_step": 174689, "epoch": 2104} {"train_loss": -23.60834312438965, "global_step": 174690, "epoch": 2104} {"train_loss": -23.646881103515625, "global_step": 174691, "epoch": 2104} {"train_loss": -23.67327880859375, "global_step": 174692, "epoch": 2104} {"train_loss": -23.743680953979492, "global_step": 174693, "epoch": 2104} {"train_loss": -23.642642974853516, "global_step": 174694, "epoch": 2104} {"train_loss": -23.708145141601562, "global_step": 174695, "epoch": 2104} {"train_loss": -23.4294490814209, "global_step": 174696, "epoch": 2104} {"train_loss": -23.84963035583496, "global_step": 174697, "epoch": 2104} {"train_loss": -23.897672653198242, "global_step": 174698, "epoch": 2104} {"train_loss": -23.344451904296875, "global_step": 174699, "epoch": 2104} {"train_loss": -23.91678237915039, "global_step": 174700, "epoch": 2104} {"train_loss": -23.722036361694336, "global_step": 174701, "epoch": 2104} {"train_loss": -23.634098052978516, "global_step": 174702, "epoch": 2104} {"train_loss": -24.064733505249023, "global_step": 174703, "epoch": 2104} {"train_loss": -23.721006393432617, "global_step": 174704, "epoch": 2104} {"train_loss": -23.89730453491211, "global_step": 174705, "epoch": 2104} {"train_loss": -23.821958541870117, "global_step": 174706, "epoch": 2104} {"train_loss": -23.87666893005371, "global_step": 174707, "epoch": 2104} {"train_loss": -23.587743759155273, "global_step": 174708, "epoch": 2104} {"train_loss": -23.927854537963867, "global_step": 174709, "epoch": 2104} {"train_loss": -24.10207176208496, "global_step": 174710, "epoch": 2104} {"train_loss": -23.571533203125, "global_step": 174711, "epoch": 2104} {"train_loss": -24.170215606689453, "global_step": 174712, "epoch": 2104} {"train_loss": -23.818235397338867, "global_step": 174713, "epoch": 2104} {"train_loss": -23.753050126225116, "global_step": 174714, "epoch": 2104, "val_loss": 6499720.0} {"train_loss": -23.23415184020996, "global_step": 174715, "epoch": 2105} {"train_loss": -22.987791061401367, "global_step": 174716, "epoch": 2105} {"train_loss": -23.315677642822266, "global_step": 174717, "epoch": 2105} {"train_loss": -22.886123657226562, "global_step": 174718, "epoch": 2105} {"train_loss": -23.406803131103516, "global_step": 174719, "epoch": 2105} {"train_loss": -23.171905517578125, "global_step": 174720, "epoch": 2105} {"train_loss": -23.427453994750977, "global_step": 174721, "epoch": 2105} {"train_loss": -23.241796493530273, "global_step": 174722, "epoch": 2105} {"train_loss": -23.374204635620117, "global_step": 174723, "epoch": 2105} {"train_loss": -23.446491241455078, "global_step": 174724, "epoch": 2105} {"train_loss": -23.315086364746094, "global_step": 174725, "epoch": 2105} {"train_loss": -23.414113998413086, "global_step": 174726, "epoch": 2105} {"train_loss": -23.56639289855957, "global_step": 174727, "epoch": 2105} {"train_loss": -23.59316062927246, "global_step": 174728, "epoch": 2105} {"train_loss": -23.62647819519043, "global_step": 174729, "epoch": 2105} {"train_loss": -23.495840072631836, "global_step": 174730, "epoch": 2105} {"train_loss": -23.428529739379883, "global_step": 174731, "epoch": 2105} {"train_loss": -23.00855255126953, "global_step": 174732, "epoch": 2105} {"train_loss": -23.631607055664062, "global_step": 174733, "epoch": 2105} {"train_loss": -23.44786262512207, "global_step": 174734, "epoch": 2105} {"train_loss": -23.52997589111328, "global_step": 174735, "epoch": 2105} {"train_loss": -23.27321434020996, "global_step": 174736, "epoch": 2105} {"train_loss": -23.78916358947754, "global_step": 174737, "epoch": 2105} {"train_loss": -23.437856674194336, "global_step": 174738, "epoch": 2105} {"train_loss": -23.5899600982666, "global_step": 174739, "epoch": 2105} {"train_loss": -23.511051177978516, "global_step": 174740, "epoch": 2105} {"train_loss": -23.62221336364746, "global_step": 174741, "epoch": 2105} {"train_loss": -23.99871253967285, "global_step": 174742, "epoch": 2105} {"train_loss": -23.50559425354004, "global_step": 174743, "epoch": 2105} {"train_loss": -23.85892105102539, "global_step": 174744, "epoch": 2105} {"train_loss": -23.660017013549805, "global_step": 174745, "epoch": 2105} {"train_loss": -23.756017684936523, "global_step": 174746, "epoch": 2105} {"train_loss": -23.510990142822266, "global_step": 174747, "epoch": 2105} {"train_loss": -24.109054565429688, "global_step": 174748, "epoch": 2105} {"train_loss": -24.028106689453125, "global_step": 174749, "epoch": 2105} {"train_loss": -24.08766746520996, "global_step": 174750, "epoch": 2105} {"train_loss": -23.79621696472168, "global_step": 174751, "epoch": 2105} {"train_loss": -23.77474021911621, "global_step": 174752, "epoch": 2105} {"train_loss": -23.821592330932617, "global_step": 174753, "epoch": 2105} {"train_loss": -23.798067092895508, "global_step": 174754, "epoch": 2105} {"train_loss": -24.260244369506836, "global_step": 174755, "epoch": 2105} {"train_loss": -23.644704818725586, "global_step": 174756, "epoch": 2105} {"train_loss": -23.824695587158203, "global_step": 174757, "epoch": 2105} {"train_loss": -23.718490600585938, "global_step": 174758, "epoch": 2105} {"train_loss": -23.912841796875, "global_step": 174759, "epoch": 2105} {"train_loss": -23.773101806640625, "global_step": 174760, "epoch": 2105} {"train_loss": -23.54225730895996, "global_step": 174761, "epoch": 2105} {"train_loss": -23.501876831054688, "global_step": 174762, "epoch": 2105} {"train_loss": -23.883846282958984, "global_step": 174763, "epoch": 2105} {"train_loss": -23.96381187438965, "global_step": 174764, "epoch": 2105} {"train_loss": -23.797197341918945, "global_step": 174765, "epoch": 2105} {"train_loss": -23.45607566833496, "global_step": 174766, "epoch": 2105} {"train_loss": -23.21024513244629, "global_step": 174767, "epoch": 2105} {"train_loss": -23.895654678344727, "global_step": 174768, "epoch": 2105} {"train_loss": -23.520498275756836, "global_step": 174769, "epoch": 2105} {"train_loss": -23.478578567504883, "global_step": 174770, "epoch": 2105} {"train_loss": -23.468748092651367, "global_step": 174771, "epoch": 2105} {"train_loss": -23.351139068603516, "global_step": 174772, "epoch": 2105} {"train_loss": -23.837987899780273, "global_step": 174773, "epoch": 2105} {"train_loss": -23.320722579956055, "global_step": 174774, "epoch": 2105} {"train_loss": -23.612478256225586, "global_step": 174775, "epoch": 2105} {"train_loss": -24.289627075195312, "global_step": 174776, "epoch": 2105} {"train_loss": -23.491235733032227, "global_step": 174777, "epoch": 2105} {"train_loss": -23.61079978942871, "global_step": 174778, "epoch": 2105} {"train_loss": -24.262624740600586, "global_step": 174779, "epoch": 2105} {"train_loss": -23.7183895111084, "global_step": 174780, "epoch": 2105} {"train_loss": -24.07291030883789, "global_step": 174781, "epoch": 2105} {"train_loss": -24.047821044921875, "global_step": 174782, "epoch": 2105} {"train_loss": -23.76506805419922, "global_step": 174783, "epoch": 2105} {"train_loss": -23.802465438842773, "global_step": 174784, "epoch": 2105} {"train_loss": -23.746641159057617, "global_step": 174785, "epoch": 2105} {"train_loss": -24.149112701416016, "global_step": 174786, "epoch": 2105} {"train_loss": -24.164457321166992, "global_step": 174787, "epoch": 2105} {"train_loss": -23.877477645874023, "global_step": 174788, "epoch": 2105} {"train_loss": -23.972457885742188, "global_step": 174789, "epoch": 2105} {"train_loss": -23.8702335357666, "global_step": 174790, "epoch": 2105} {"train_loss": -23.692337036132812, "global_step": 174791, "epoch": 2105} {"train_loss": -23.868494033813477, "global_step": 174792, "epoch": 2105} {"train_loss": -23.97563934326172, "global_step": 174793, "epoch": 2105} {"train_loss": -23.861921310424805, "global_step": 174794, "epoch": 2105} {"train_loss": -24.025419235229492, "global_step": 174795, "epoch": 2105} {"train_loss": -23.897825241088867, "global_step": 174796, "epoch": 2105} {"train_loss": -23.669299504843103, "global_step": 174797, "epoch": 2105, "val_loss": 6468853.0} {"train_loss": -23.905656814575195, "global_step": 174798, "epoch": 2106} {"train_loss": -23.441930770874023, "global_step": 174799, "epoch": 2106} {"train_loss": -23.366561889648438, "global_step": 174800, "epoch": 2106} {"train_loss": -23.664323806762695, "global_step": 174801, "epoch": 2106} {"train_loss": -23.467788696289062, "global_step": 174802, "epoch": 2106} {"train_loss": -23.375308990478516, "global_step": 174803, "epoch": 2106} {"train_loss": -23.68844985961914, "global_step": 174804, "epoch": 2106} {"train_loss": -23.836782455444336, "global_step": 174805, "epoch": 2106} {"train_loss": -23.63528060913086, "global_step": 174806, "epoch": 2106} {"train_loss": -23.479984283447266, "global_step": 174807, "epoch": 2106} {"train_loss": -23.977975845336914, "global_step": 174808, "epoch": 2106} {"train_loss": -23.278940200805664, "global_step": 174809, "epoch": 2106} {"train_loss": -23.53458023071289, "global_step": 174810, "epoch": 2106} {"train_loss": -23.904346466064453, "global_step": 174811, "epoch": 2106} {"train_loss": -23.598194122314453, "global_step": 174812, "epoch": 2106} {"train_loss": -23.699012756347656, "global_step": 174813, "epoch": 2106} {"train_loss": -23.541810989379883, "global_step": 174814, "epoch": 2106} {"train_loss": -23.682279586791992, "global_step": 174815, "epoch": 2106} {"train_loss": -23.382627487182617, "global_step": 174816, "epoch": 2106} {"train_loss": -23.743267059326172, "global_step": 174817, "epoch": 2106} {"train_loss": -23.937650680541992, "global_step": 174818, "epoch": 2106} {"train_loss": -23.622488021850586, "global_step": 174819, "epoch": 2106} {"train_loss": -23.85093116760254, "global_step": 174820, "epoch": 2106} {"train_loss": -23.807580947875977, "global_step": 174821, "epoch": 2106} {"train_loss": -23.80455207824707, "global_step": 174822, "epoch": 2106} {"train_loss": -23.83968162536621, "global_step": 174823, "epoch": 2106} {"train_loss": -23.812063217163086, "global_step": 174824, "epoch": 2106} {"train_loss": -23.76322364807129, "global_step": 174825, "epoch": 2106} {"train_loss": -23.809579849243164, "global_step": 174826, "epoch": 2106} {"train_loss": -23.79035186767578, "global_step": 174827, "epoch": 2106} {"train_loss": -23.852603912353516, "global_step": 174828, "epoch": 2106} {"train_loss": -24.023794174194336, "global_step": 174829, "epoch": 2106} {"train_loss": -23.841299057006836, "global_step": 174830, "epoch": 2106} {"train_loss": -23.9305477142334, "global_step": 174831, "epoch": 2106} {"train_loss": -23.605472564697266, "global_step": 174832, "epoch": 2106} {"train_loss": -24.016498565673828, "global_step": 174833, "epoch": 2106} {"train_loss": -23.813108444213867, "global_step": 174834, "epoch": 2106} {"train_loss": -23.87904930114746, "global_step": 174835, "epoch": 2106} {"train_loss": -23.867084503173828, "global_step": 174836, "epoch": 2106} {"train_loss": -24.12126350402832, "global_step": 174837, "epoch": 2106} {"train_loss": -23.78528594970703, "global_step": 174838, "epoch": 2106} {"train_loss": -23.587724685668945, "global_step": 174839, "epoch": 2106} {"train_loss": -23.641033172607422, "global_step": 174840, "epoch": 2106} {"train_loss": -23.858549118041992, "global_step": 174841, "epoch": 2106} {"train_loss": -24.269968032836914, "global_step": 174842, "epoch": 2106} {"train_loss": -23.991321563720703, "global_step": 174843, "epoch": 2106} {"train_loss": -23.808338165283203, "global_step": 174844, "epoch": 2106} {"train_loss": -24.10512351989746, "global_step": 174845, "epoch": 2106} {"train_loss": -24.0033016204834, "global_step": 174846, "epoch": 2106} {"train_loss": -23.858993530273438, "global_step": 174847, "epoch": 2106} {"train_loss": -23.994474411010742, "global_step": 174848, "epoch": 2106} {"train_loss": -23.67275619506836, "global_step": 174849, "epoch": 2106} {"train_loss": -23.8215274810791, "global_step": 174850, "epoch": 2106} {"train_loss": -23.804386138916016, "global_step": 174851, "epoch": 2106} {"train_loss": -23.779254913330078, "global_step": 174852, "epoch": 2106} {"train_loss": -23.774829864501953, "global_step": 174853, "epoch": 2106} {"train_loss": -24.056888580322266, "global_step": 174854, "epoch": 2106} {"train_loss": -23.654417037963867, "global_step": 174855, "epoch": 2106} {"train_loss": -24.0612735748291, "global_step": 174856, "epoch": 2106} {"train_loss": -23.530370712280273, "global_step": 174857, "epoch": 2106} {"train_loss": -23.823579788208008, "global_step": 174858, "epoch": 2106} {"train_loss": -24.03885269165039, "global_step": 174859, "epoch": 2106} {"train_loss": -23.79555320739746, "global_step": 174860, "epoch": 2106} {"train_loss": -23.99344253540039, "global_step": 174861, "epoch": 2106} {"train_loss": -23.818111419677734, "global_step": 174862, "epoch": 2106} {"train_loss": -23.71357536315918, "global_step": 174863, "epoch": 2106} {"train_loss": -23.588577270507812, "global_step": 174864, "epoch": 2106} {"train_loss": -24.130033493041992, "global_step": 174865, "epoch": 2106} {"train_loss": -23.980363845825195, "global_step": 174866, "epoch": 2106} {"train_loss": -23.777067184448242, "global_step": 174867, "epoch": 2106} {"train_loss": -23.45304298400879, "global_step": 174868, "epoch": 2106} {"train_loss": -23.37720489501953, "global_step": 174869, "epoch": 2106} {"train_loss": -24.17513656616211, "global_step": 174870, "epoch": 2106} {"train_loss": -23.498069763183594, "global_step": 174871, "epoch": 2106} {"train_loss": -23.80855941772461, "global_step": 174872, "epoch": 2106} {"train_loss": -23.884540557861328, "global_step": 174873, "epoch": 2106} {"train_loss": -23.679372787475586, "global_step": 174874, "epoch": 2106} {"train_loss": -23.528310775756836, "global_step": 174875, "epoch": 2106} {"train_loss": -23.590545654296875, "global_step": 174876, "epoch": 2106} {"train_loss": -24.051589965820312, "global_step": 174877, "epoch": 2106} {"train_loss": -23.689855575561523, "global_step": 174878, "epoch": 2106} {"train_loss": -23.626562118530273, "global_step": 174879, "epoch": 2106} {"train_loss": -23.779180480773192, "global_step": 174880, "epoch": 2106, "val_loss": 6350348.0} {"train_loss": -23.610265731811523, "global_step": 174881, "epoch": 2107} {"train_loss": -23.06555938720703, "global_step": 174882, "epoch": 2107} {"train_loss": -24.07941246032715, "global_step": 174883, "epoch": 2107} {"train_loss": -23.18427848815918, "global_step": 174884, "epoch": 2107} {"train_loss": -22.85968589782715, "global_step": 174885, "epoch": 2107} {"train_loss": -23.653833389282227, "global_step": 174886, "epoch": 2107} {"train_loss": -23.645549774169922, "global_step": 174887, "epoch": 2107} {"train_loss": -23.4494686126709, "global_step": 174888, "epoch": 2107} {"train_loss": -23.827383041381836, "global_step": 174889, "epoch": 2107} {"train_loss": -23.311851501464844, "global_step": 174890, "epoch": 2107} {"train_loss": -23.443220138549805, "global_step": 174891, "epoch": 2107} {"train_loss": -23.71062660217285, "global_step": 174892, "epoch": 2107} {"train_loss": -23.490678787231445, "global_step": 174893, "epoch": 2107} {"train_loss": -23.456506729125977, "global_step": 174894, "epoch": 2107} {"train_loss": -23.68594741821289, "global_step": 174895, "epoch": 2107} {"train_loss": -23.665693283081055, "global_step": 174896, "epoch": 2107} {"train_loss": -23.4373779296875, "global_step": 174897, "epoch": 2107} {"train_loss": -23.884323120117188, "global_step": 174898, "epoch": 2107} {"train_loss": -23.645612716674805, "global_step": 174899, "epoch": 2107} {"train_loss": -23.973560333251953, "global_step": 174900, "epoch": 2107} {"train_loss": -23.661075592041016, "global_step": 174901, "epoch": 2107} {"train_loss": -23.927366256713867, "global_step": 174902, "epoch": 2107} {"train_loss": -23.726972579956055, "global_step": 174903, "epoch": 2107} {"train_loss": -23.274778366088867, "global_step": 174904, "epoch": 2107} {"train_loss": -23.94800567626953, "global_step": 174905, "epoch": 2107} {"train_loss": -23.849950790405273, "global_step": 174906, "epoch": 2107} {"train_loss": -23.699491500854492, "global_step": 174907, "epoch": 2107} {"train_loss": -23.930578231811523, "global_step": 174908, "epoch": 2107} {"train_loss": -23.67486572265625, "global_step": 174909, "epoch": 2107} {"train_loss": -23.69073486328125, "global_step": 174910, "epoch": 2107} {"train_loss": -23.776166915893555, "global_step": 174911, "epoch": 2107} {"train_loss": -23.69870948791504, "global_step": 174912, "epoch": 2107} {"train_loss": -23.729665756225586, "global_step": 174913, "epoch": 2107} {"train_loss": -24.32207679748535, "global_step": 174914, "epoch": 2107} {"train_loss": -23.691801071166992, "global_step": 174915, "epoch": 2107} {"train_loss": -23.5402889251709, "global_step": 174916, "epoch": 2107} {"train_loss": -23.999187469482422, "global_step": 174917, "epoch": 2107} {"train_loss": -23.605749130249023, "global_step": 174918, "epoch": 2107} {"train_loss": -24.32138442993164, "global_step": 174919, "epoch": 2107} {"train_loss": -23.678159713745117, "global_step": 174920, "epoch": 2107} {"train_loss": -23.490644454956055, "global_step": 174921, "epoch": 2107} {"train_loss": -23.961599349975586, "global_step": 174922, "epoch": 2107} {"train_loss": -24.003498077392578, "global_step": 174923, "epoch": 2107} {"train_loss": -23.8372859954834, "global_step": 174924, "epoch": 2107} {"train_loss": -23.73990249633789, "global_step": 174925, "epoch": 2107} {"train_loss": -23.32496452331543, "global_step": 174926, "epoch": 2107} {"train_loss": -23.756986618041992, "global_step": 174927, "epoch": 2107} {"train_loss": -23.590578079223633, "global_step": 174928, "epoch": 2107} {"train_loss": -23.1496639251709, "global_step": 174929, "epoch": 2107} {"train_loss": -23.49519920349121, "global_step": 174930, "epoch": 2107} {"train_loss": -23.787433624267578, "global_step": 174931, "epoch": 2107} {"train_loss": -23.80764389038086, "global_step": 174932, "epoch": 2107} {"train_loss": -23.784788131713867, "global_step": 174933, "epoch": 2107} {"train_loss": -23.65572166442871, "global_step": 174934, "epoch": 2107} {"train_loss": -23.928165435791016, "global_step": 174935, "epoch": 2107} {"train_loss": -23.4641170501709, "global_step": 174936, "epoch": 2107} {"train_loss": -24.200538635253906, "global_step": 174937, "epoch": 2107} {"train_loss": -23.50653648376465, "global_step": 174938, "epoch": 2107} {"train_loss": -23.82179069519043, "global_step": 174939, "epoch": 2107} {"train_loss": -23.87691307067871, "global_step": 174940, "epoch": 2107} {"train_loss": -23.69103240966797, "global_step": 174941, "epoch": 2107} {"train_loss": -23.689939498901367, "global_step": 174942, "epoch": 2107} {"train_loss": -23.67011833190918, "global_step": 174943, "epoch": 2107} {"train_loss": -23.833805084228516, "global_step": 174944, "epoch": 2107} {"train_loss": -23.76050567626953, "global_step": 174945, "epoch": 2107} {"train_loss": -23.842519760131836, "global_step": 174946, "epoch": 2107} {"train_loss": -24.03682518005371, "global_step": 174947, "epoch": 2107} {"train_loss": -24.164060592651367, "global_step": 174948, "epoch": 2107} {"train_loss": -23.838071823120117, "global_step": 174949, "epoch": 2107} {"train_loss": -24.100982666015625, "global_step": 174950, "epoch": 2107} {"train_loss": -23.995182037353516, "global_step": 174951, "epoch": 2107} {"train_loss": -23.837106704711914, "global_step": 174952, "epoch": 2107} {"train_loss": -23.8521785736084, "global_step": 174953, "epoch": 2107} {"train_loss": -23.79097557067871, "global_step": 174954, "epoch": 2107} {"train_loss": -23.721519470214844, "global_step": 174955, "epoch": 2107} {"train_loss": -23.935699462890625, "global_step": 174956, "epoch": 2107} {"train_loss": -23.893238067626953, "global_step": 174957, "epoch": 2107} {"train_loss": -24.112773895263672, "global_step": 174958, "epoch": 2107} {"train_loss": -23.779653549194336, "global_step": 174959, "epoch": 2107} {"train_loss": -23.524261474609375, "global_step": 174960, "epoch": 2107} {"train_loss": -23.987764358520508, "global_step": 174961, "epoch": 2107} {"train_loss": -23.702604293823242, "global_step": 174962, "epoch": 2107} {"train_loss": -23.732292841715985, "global_step": 174963, "epoch": 2107, "val_loss": 6435123.5} {"train_loss": -23.534719467163086, "global_step": 174964, "epoch": 2108} {"train_loss": -23.78228759765625, "global_step": 174965, "epoch": 2108} {"train_loss": -23.491905212402344, "global_step": 174966, "epoch": 2108} {"train_loss": -23.201759338378906, "global_step": 174967, "epoch": 2108} {"train_loss": -23.889846801757812, "global_step": 174968, "epoch": 2108} {"train_loss": -23.861377716064453, "global_step": 174969, "epoch": 2108} {"train_loss": -23.776212692260742, "global_step": 174970, "epoch": 2108} {"train_loss": -23.65702247619629, "global_step": 174971, "epoch": 2108} {"train_loss": -23.930744171142578, "global_step": 174972, "epoch": 2108} {"train_loss": -23.97295570373535, "global_step": 174973, "epoch": 2108} {"train_loss": -23.960966110229492, "global_step": 174974, "epoch": 2108} {"train_loss": -23.88676643371582, "global_step": 174975, "epoch": 2108} {"train_loss": -23.4736385345459, "global_step": 174976, "epoch": 2108} {"train_loss": -24.088092803955078, "global_step": 174977, "epoch": 2108} {"train_loss": -23.874839782714844, "global_step": 174978, "epoch": 2108} {"train_loss": -23.922380447387695, "global_step": 174979, "epoch": 2108} {"train_loss": -24.015335083007812, "global_step": 174980, "epoch": 2108} {"train_loss": -23.691612243652344, "global_step": 174981, "epoch": 2108} {"train_loss": -23.596616744995117, "global_step": 174982, "epoch": 2108} {"train_loss": -23.908355712890625, "global_step": 174983, "epoch": 2108} {"train_loss": -24.04561996459961, "global_step": 174984, "epoch": 2108} {"train_loss": -24.01605224609375, "global_step": 174985, "epoch": 2108} {"train_loss": -23.47412872314453, "global_step": 174986, "epoch": 2108} {"train_loss": -23.830358505249023, "global_step": 174987, "epoch": 2108} {"train_loss": -24.03843879699707, "global_step": 174988, "epoch": 2108} {"train_loss": -23.674055099487305, "global_step": 174989, "epoch": 2108} {"train_loss": -23.893896102905273, "global_step": 174990, "epoch": 2108} {"train_loss": -23.760501861572266, "global_step": 174991, "epoch": 2108} {"train_loss": -23.766695022583008, "global_step": 174992, "epoch": 2108} {"train_loss": -23.853931427001953, "global_step": 174993, "epoch": 2108} {"train_loss": -23.770334243774414, "global_step": 174994, "epoch": 2108} {"train_loss": -23.614635467529297, "global_step": 174995, "epoch": 2108} {"train_loss": -23.81399917602539, "global_step": 174996, "epoch": 2108} {"train_loss": -23.564146041870117, "global_step": 174997, "epoch": 2108} {"train_loss": -23.89522933959961, "global_step": 174998, "epoch": 2108} {"train_loss": -23.837345123291016, "global_step": 174999, "epoch": 2108} {"train_loss": -23.76853370666504, "global_step": 175000, "epoch": 2108} {"train_loss": -23.552427291870117, "global_step": 175001, "epoch": 2108} {"train_loss": -23.896282196044922, "global_step": 175002, "epoch": 2108} {"train_loss": -23.670562744140625, "global_step": 175003, "epoch": 2108} {"train_loss": -23.439952850341797, "global_step": 175004, "epoch": 2108} {"train_loss": -23.758865356445312, "global_step": 175005, "epoch": 2108} {"train_loss": -23.69302749633789, "global_step": 175006, "epoch": 2108} {"train_loss": -23.540042877197266, "global_step": 175007, "epoch": 2108} {"train_loss": -24.00035858154297, "global_step": 175008, "epoch": 2108} {"train_loss": -23.8129940032959, "global_step": 175009, "epoch": 2108} {"train_loss": -23.887697219848633, "global_step": 175010, "epoch": 2108} {"train_loss": -24.133804321289062, "global_step": 175011, "epoch": 2108} {"train_loss": -23.9188232421875, "global_step": 175012, "epoch": 2108} {"train_loss": -23.816770553588867, "global_step": 175013, "epoch": 2108} {"train_loss": -23.847158432006836, "global_step": 175014, "epoch": 2108} {"train_loss": -24.005630493164062, "global_step": 175015, "epoch": 2108} {"train_loss": -23.82964515686035, "global_step": 175016, "epoch": 2108} {"train_loss": -23.600648880004883, "global_step": 175017, "epoch": 2108} {"train_loss": -23.97248649597168, "global_step": 175018, "epoch": 2108} {"train_loss": -24.0794620513916, "global_step": 175019, "epoch": 2108} {"train_loss": -23.866722106933594, "global_step": 175020, "epoch": 2108} {"train_loss": -23.55375862121582, "global_step": 175021, "epoch": 2108} {"train_loss": -23.943132400512695, "global_step": 175022, "epoch": 2108} {"train_loss": -23.45099449157715, "global_step": 175023, "epoch": 2108} {"train_loss": -23.557987213134766, "global_step": 175024, "epoch": 2108} {"train_loss": -23.764022827148438, "global_step": 175025, "epoch": 2108} {"train_loss": -23.930456161499023, "global_step": 175026, "epoch": 2108} {"train_loss": -23.756628036499023, "global_step": 175027, "epoch": 2108} {"train_loss": -23.729766845703125, "global_step": 175028, "epoch": 2108} {"train_loss": -24.092445373535156, "global_step": 175029, "epoch": 2108} {"train_loss": -24.010086059570312, "global_step": 175030, "epoch": 2108} {"train_loss": -23.857385635375977, "global_step": 175031, "epoch": 2108} {"train_loss": -23.676671981811523, "global_step": 175032, "epoch": 2108} {"train_loss": -23.84089469909668, "global_step": 175033, "epoch": 2108} {"train_loss": -23.937641143798828, "global_step": 175034, "epoch": 2108} {"train_loss": -24.310413360595703, "global_step": 175035, "epoch": 2108} {"train_loss": -23.8205509185791, "global_step": 175036, "epoch": 2108} {"train_loss": -24.30494499206543, "global_step": 175037, "epoch": 2108} {"train_loss": -23.49540901184082, "global_step": 175038, "epoch": 2108} {"train_loss": -23.75982093811035, "global_step": 175039, "epoch": 2108} {"train_loss": -24.09356117248535, "global_step": 175040, "epoch": 2108} {"train_loss": -23.66119956970215, "global_step": 175041, "epoch": 2108} {"train_loss": -24.058914184570312, "global_step": 175042, "epoch": 2108} {"train_loss": -24.333904266357422, "global_step": 175043, "epoch": 2108} {"train_loss": -23.744155883789062, "global_step": 175044, "epoch": 2108} {"train_loss": -23.74480628967285, "global_step": 175045, "epoch": 2108} {"train_loss": -23.839034436696984, "global_step": 175046, "epoch": 2108, "val_loss": 6291109.0} {"train_loss": -23.352590560913086, "global_step": 175047, "epoch": 2109} {"train_loss": -23.14470100402832, "global_step": 175048, "epoch": 2109} {"train_loss": -23.779163360595703, "global_step": 175049, "epoch": 2109} {"train_loss": -23.9940128326416, "global_step": 175050, "epoch": 2109} {"train_loss": -23.569297790527344, "global_step": 175051, "epoch": 2109} {"train_loss": -23.62164878845215, "global_step": 175052, "epoch": 2109} {"train_loss": -23.476423263549805, "global_step": 175053, "epoch": 2109} {"train_loss": -23.63579559326172, "global_step": 175054, "epoch": 2109} {"train_loss": -23.391355514526367, "global_step": 175055, "epoch": 2109} {"train_loss": -23.94011688232422, "global_step": 175056, "epoch": 2109} {"train_loss": -23.47243309020996, "global_step": 175057, "epoch": 2109} {"train_loss": -23.795635223388672, "global_step": 175058, "epoch": 2109} {"train_loss": -23.47437858581543, "global_step": 175059, "epoch": 2109} {"train_loss": -23.725744247436523, "global_step": 175060, "epoch": 2109} {"train_loss": -23.902143478393555, "global_step": 175061, "epoch": 2109} {"train_loss": -23.466163635253906, "global_step": 175062, "epoch": 2109} {"train_loss": -23.853105545043945, "global_step": 175063, "epoch": 2109} {"train_loss": -23.679956436157227, "global_step": 175064, "epoch": 2109} {"train_loss": -23.562986373901367, "global_step": 175065, "epoch": 2109} {"train_loss": -23.859928131103516, "global_step": 175066, "epoch": 2109} {"train_loss": -23.734342575073242, "global_step": 175067, "epoch": 2109} {"train_loss": -23.348140716552734, "global_step": 175068, "epoch": 2109} {"train_loss": -23.815095901489258, "global_step": 175069, "epoch": 2109} {"train_loss": -23.398298263549805, "global_step": 175070, "epoch": 2109} {"train_loss": -23.40236473083496, "global_step": 175071, "epoch": 2109} {"train_loss": -23.639596939086914, "global_step": 175072, "epoch": 2109} {"train_loss": -23.8404483795166, "global_step": 175073, "epoch": 2109} {"train_loss": -23.257017135620117, "global_step": 175074, "epoch": 2109} {"train_loss": -23.685598373413086, "global_step": 175075, "epoch": 2109} {"train_loss": -23.942115783691406, "global_step": 175076, "epoch": 2109} {"train_loss": -23.526350021362305, "global_step": 175077, "epoch": 2109} {"train_loss": -23.972558975219727, "global_step": 175078, "epoch": 2109} {"train_loss": -23.674570083618164, "global_step": 175079, "epoch": 2109} {"train_loss": -23.678878784179688, "global_step": 175080, "epoch": 2109} {"train_loss": -23.91020965576172, "global_step": 175081, "epoch": 2109} {"train_loss": -24.104995727539062, "global_step": 175082, "epoch": 2109} {"train_loss": -23.792722702026367, "global_step": 175083, "epoch": 2109} {"train_loss": -23.726381301879883, "global_step": 175084, "epoch": 2109} {"train_loss": -23.83192253112793, "global_step": 175085, "epoch": 2109} {"train_loss": -23.772281646728516, "global_step": 175086, "epoch": 2109} {"train_loss": -23.565509796142578, "global_step": 175087, "epoch": 2109} {"train_loss": -23.69232940673828, "global_step": 175088, "epoch": 2109} {"train_loss": -23.842056274414062, "global_step": 175089, "epoch": 2109} {"train_loss": -23.906415939331055, "global_step": 175090, "epoch": 2109} {"train_loss": -23.758899688720703, "global_step": 175091, "epoch": 2109} {"train_loss": -23.64871597290039, "global_step": 175092, "epoch": 2109} {"train_loss": -23.89919662475586, "global_step": 175093, "epoch": 2109} {"train_loss": -23.457637786865234, "global_step": 175094, "epoch": 2109} {"train_loss": -23.62721824645996, "global_step": 175095, "epoch": 2109} {"train_loss": -23.086454391479492, "global_step": 175096, "epoch": 2109} {"train_loss": -23.057424545288086, "global_step": 175097, "epoch": 2109} {"train_loss": -24.01472282409668, "global_step": 175098, "epoch": 2109} {"train_loss": -23.868318557739258, "global_step": 175099, "epoch": 2109} {"train_loss": -23.39497184753418, "global_step": 175100, "epoch": 2109} {"train_loss": -23.46907615661621, "global_step": 175101, "epoch": 2109} {"train_loss": -23.7698917388916, "global_step": 175102, "epoch": 2109} {"train_loss": -23.548542022705078, "global_step": 175103, "epoch": 2109} {"train_loss": -23.766416549682617, "global_step": 175104, "epoch": 2109} {"train_loss": -23.608417510986328, "global_step": 175105, "epoch": 2109} {"train_loss": -23.507278442382812, "global_step": 175106, "epoch": 2109} {"train_loss": -23.591447830200195, "global_step": 175107, "epoch": 2109} {"train_loss": -23.62818717956543, "global_step": 175108, "epoch": 2109} {"train_loss": -23.82647705078125, "global_step": 175109, "epoch": 2109} {"train_loss": -23.58319091796875, "global_step": 175110, "epoch": 2109} {"train_loss": -23.94207763671875, "global_step": 175111, "epoch": 2109} {"train_loss": -23.758495330810547, "global_step": 175112, "epoch": 2109} {"train_loss": -23.759931564331055, "global_step": 175113, "epoch": 2109} {"train_loss": -23.915990829467773, "global_step": 175114, "epoch": 2109} {"train_loss": -23.693424224853516, "global_step": 175115, "epoch": 2109} {"train_loss": -23.211885452270508, "global_step": 175116, "epoch": 2109} {"train_loss": -23.56339454650879, "global_step": 175117, "epoch": 2109} {"train_loss": -24.038909912109375, "global_step": 175118, "epoch": 2109} {"train_loss": -23.685165405273438, "global_step": 175119, "epoch": 2109} {"train_loss": -23.49127197265625, "global_step": 175120, "epoch": 2109} {"train_loss": -23.814455032348633, "global_step": 175121, "epoch": 2109} {"train_loss": -23.607929229736328, "global_step": 175122, "epoch": 2109} {"train_loss": -23.922868728637695, "global_step": 175123, "epoch": 2109} {"train_loss": -23.890830993652344, "global_step": 175124, "epoch": 2109} {"train_loss": -23.766700744628906, "global_step": 175125, "epoch": 2109} {"train_loss": -24.05133056640625, "global_step": 175126, "epoch": 2109} {"train_loss": -23.921340942382812, "global_step": 175127, "epoch": 2109} {"train_loss": -23.95533561706543, "global_step": 175128, "epoch": 2109} {"train_loss": -23.69738741955125, "global_step": 175129, "epoch": 2109, "val_loss": 6406035.0} {"train_loss": -23.279865264892578, "global_step": 175130, "epoch": 2110} {"train_loss": -23.046382904052734, "global_step": 175131, "epoch": 2110} {"train_loss": -23.597867965698242, "global_step": 175132, "epoch": 2110} {"train_loss": -23.06406021118164, "global_step": 175133, "epoch": 2110} {"train_loss": -23.79165267944336, "global_step": 175134, "epoch": 2110} {"train_loss": -23.463655471801758, "global_step": 175135, "epoch": 2110} {"train_loss": -23.65227508544922, "global_step": 175136, "epoch": 2110} {"train_loss": -23.304237365722656, "global_step": 175137, "epoch": 2110} {"train_loss": -23.766298294067383, "global_step": 175138, "epoch": 2110} {"train_loss": -23.754796981811523, "global_step": 175139, "epoch": 2110} {"train_loss": -23.483200073242188, "global_step": 175140, "epoch": 2110} {"train_loss": -23.798120498657227, "global_step": 175141, "epoch": 2110} {"train_loss": -23.2083740234375, "global_step": 175142, "epoch": 2110} {"train_loss": -23.211179733276367, "global_step": 175143, "epoch": 2110} {"train_loss": -23.632427215576172, "global_step": 175144, "epoch": 2110} {"train_loss": -23.601083755493164, "global_step": 175145, "epoch": 2110} {"train_loss": -23.31291389465332, "global_step": 175146, "epoch": 2110} {"train_loss": -23.99075698852539, "global_step": 175147, "epoch": 2110} {"train_loss": -23.52353858947754, "global_step": 175148, "epoch": 2110} {"train_loss": -23.628921508789062, "global_step": 175149, "epoch": 2110} {"train_loss": -23.545333862304688, "global_step": 175150, "epoch": 2110} {"train_loss": -23.814271926879883, "global_step": 175151, "epoch": 2110} {"train_loss": -23.676345825195312, "global_step": 175152, "epoch": 2110} {"train_loss": -23.552967071533203, "global_step": 175153, "epoch": 2110} {"train_loss": -23.81967544555664, "global_step": 175154, "epoch": 2110} {"train_loss": -23.920555114746094, "global_step": 175155, "epoch": 2110} {"train_loss": -23.749853134155273, "global_step": 175156, "epoch": 2110} {"train_loss": -23.831241607666016, "global_step": 175157, "epoch": 2110} {"train_loss": -23.827611923217773, "global_step": 175158, "epoch": 2110} {"train_loss": -23.83234214782715, "global_step": 175159, "epoch": 2110} {"train_loss": -23.79362678527832, "global_step": 175160, "epoch": 2110} {"train_loss": -24.092422485351562, "global_step": 175161, "epoch": 2110} {"train_loss": -23.64386558532715, "global_step": 175162, "epoch": 2110} {"train_loss": -23.57454490661621, "global_step": 175163, "epoch": 2110} {"train_loss": -23.840490341186523, "global_step": 175164, "epoch": 2110} {"train_loss": -24.064777374267578, "global_step": 175165, "epoch": 2110} {"train_loss": -24.05707550048828, "global_step": 175166, "epoch": 2110} {"train_loss": -23.686670303344727, "global_step": 175167, "epoch": 2110} {"train_loss": -23.8488712310791, "global_step": 175168, "epoch": 2110} {"train_loss": -24.128280639648438, "global_step": 175169, "epoch": 2110} {"train_loss": -24.397092819213867, "global_step": 175170, "epoch": 2110} {"train_loss": -24.0922794342041, "global_step": 175171, "epoch": 2110} {"train_loss": -24.023679733276367, "global_step": 175172, "epoch": 2110} {"train_loss": -24.19948959350586, "global_step": 175173, "epoch": 2110} {"train_loss": -23.711246490478516, "global_step": 175174, "epoch": 2110} {"train_loss": -23.800596237182617, "global_step": 175175, "epoch": 2110} {"train_loss": -23.800806045532227, "global_step": 175176, "epoch": 2110} {"train_loss": -23.918350219726562, "global_step": 175177, "epoch": 2110} {"train_loss": -23.709735870361328, "global_step": 175178, "epoch": 2110} {"train_loss": -24.081892013549805, "global_step": 175179, "epoch": 2110} {"train_loss": -23.681293487548828, "global_step": 175180, "epoch": 2110} {"train_loss": -23.807199478149414, "global_step": 175181, "epoch": 2110} {"train_loss": -23.962427139282227, "global_step": 175182, "epoch": 2110} {"train_loss": -23.88663673400879, "global_step": 175183, "epoch": 2110} {"train_loss": -23.817747116088867, "global_step": 175184, "epoch": 2110} {"train_loss": -23.81594467163086, "global_step": 175185, "epoch": 2110} {"train_loss": -23.621450424194336, "global_step": 175186, "epoch": 2110} {"train_loss": -23.846044540405273, "global_step": 175187, "epoch": 2110} {"train_loss": -23.79559898376465, "global_step": 175188, "epoch": 2110} {"train_loss": -23.559764862060547, "global_step": 175189, "epoch": 2110} {"train_loss": -23.682418823242188, "global_step": 175190, "epoch": 2110} {"train_loss": -23.79707145690918, "global_step": 175191, "epoch": 2110} {"train_loss": -23.850374221801758, "global_step": 175192, "epoch": 2110} {"train_loss": -23.759056091308594, "global_step": 175193, "epoch": 2110} {"train_loss": -23.81682777404785, "global_step": 175194, "epoch": 2110} {"train_loss": -23.56667137145996, "global_step": 175195, "epoch": 2110} {"train_loss": -23.957883834838867, "global_step": 175196, "epoch": 2110} {"train_loss": -23.78346061706543, "global_step": 175197, "epoch": 2110} {"train_loss": -24.049726486206055, "global_step": 175198, "epoch": 2110} {"train_loss": -23.835790634155273, "global_step": 175199, "epoch": 2110} {"train_loss": -23.647798538208008, "global_step": 175200, "epoch": 2110} {"train_loss": -24.141298294067383, "global_step": 175201, "epoch": 2110} {"train_loss": -23.73986053466797, "global_step": 175202, "epoch": 2110} {"train_loss": -23.805736541748047, "global_step": 175203, "epoch": 2110} {"train_loss": -24.08588981628418, "global_step": 175204, "epoch": 2110} {"train_loss": -23.531248092651367, "global_step": 175205, "epoch": 2110} {"train_loss": -23.685340881347656, "global_step": 175206, "epoch": 2110} {"train_loss": -24.075162887573242, "global_step": 175207, "epoch": 2110} {"train_loss": -23.751850128173828, "global_step": 175208, "epoch": 2110} {"train_loss": -24.06547737121582, "global_step": 175209, "epoch": 2110} {"train_loss": -23.305580139160156, "global_step": 175210, "epoch": 2110} {"train_loss": -24.07398796081543, "global_step": 175211, "epoch": 2110} {"train_loss": -23.753563731549733, "global_step": 175212, "epoch": 2110, "val_loss": 6484898.0} {"train_loss": -23.607776641845703, "global_step": 175213, "epoch": 2111} {"train_loss": -23.43497657775879, "global_step": 175214, "epoch": 2111} {"train_loss": -23.182695388793945, "global_step": 175215, "epoch": 2111} {"train_loss": -23.590286254882812, "global_step": 175216, "epoch": 2111} {"train_loss": -23.401235580444336, "global_step": 175217, "epoch": 2111} {"train_loss": -23.559019088745117, "global_step": 175218, "epoch": 2111} {"train_loss": -23.432767868041992, "global_step": 175219, "epoch": 2111} {"train_loss": -23.415321350097656, "global_step": 175220, "epoch": 2111} {"train_loss": -23.83807945251465, "global_step": 175221, "epoch": 2111} {"train_loss": -23.753536224365234, "global_step": 175222, "epoch": 2111} {"train_loss": -23.570819854736328, "global_step": 175223, "epoch": 2111} {"train_loss": -23.715473175048828, "global_step": 175224, "epoch": 2111} {"train_loss": -23.534122467041016, "global_step": 175225, "epoch": 2111} {"train_loss": -24.11821746826172, "global_step": 175226, "epoch": 2111} {"train_loss": -23.3083553314209, "global_step": 175227, "epoch": 2111} {"train_loss": -23.65215492248535, "global_step": 175228, "epoch": 2111} {"train_loss": -23.914718627929688, "global_step": 175229, "epoch": 2111} {"train_loss": -23.7374324798584, "global_step": 175230, "epoch": 2111} {"train_loss": -23.86800193786621, "global_step": 175231, "epoch": 2111} {"train_loss": -23.725435256958008, "global_step": 175232, "epoch": 2111} {"train_loss": -23.949115753173828, "global_step": 175233, "epoch": 2111} {"train_loss": -23.522579193115234, "global_step": 175234, "epoch": 2111} {"train_loss": -23.79819679260254, "global_step": 175235, "epoch": 2111} {"train_loss": -23.764118194580078, "global_step": 175236, "epoch": 2111} {"train_loss": -23.965051651000977, "global_step": 175237, "epoch": 2111} {"train_loss": -23.86650848388672, "global_step": 175238, "epoch": 2111} {"train_loss": -23.69272804260254, "global_step": 175239, "epoch": 2111} {"train_loss": -23.768814086914062, "global_step": 175240, "epoch": 2111} {"train_loss": -23.81913948059082, "global_step": 175241, "epoch": 2111} {"train_loss": -23.751815795898438, "global_step": 175242, "epoch": 2111} {"train_loss": -23.62908363342285, "global_step": 175243, "epoch": 2111} {"train_loss": -23.801925659179688, "global_step": 175244, "epoch": 2111} {"train_loss": -24.106658935546875, "global_step": 175245, "epoch": 2111} {"train_loss": -24.25641441345215, "global_step": 175246, "epoch": 2111} {"train_loss": -24.239553451538086, "global_step": 175247, "epoch": 2111} {"train_loss": -24.020627975463867, "global_step": 175248, "epoch": 2111} {"train_loss": -23.82883644104004, "global_step": 175249, "epoch": 2111} {"train_loss": -23.7152099609375, "global_step": 175250, "epoch": 2111} {"train_loss": -24.143678665161133, "global_step": 175251, "epoch": 2111} {"train_loss": -23.91591453552246, "global_step": 175252, "epoch": 2111} {"train_loss": -23.545013427734375, "global_step": 175253, "epoch": 2111} {"train_loss": -23.745267868041992, "global_step": 175254, "epoch": 2111} {"train_loss": -23.566822052001953, "global_step": 175255, "epoch": 2111} {"train_loss": -23.502779006958008, "global_step": 175256, "epoch": 2111} {"train_loss": -23.78376579284668, "global_step": 175257, "epoch": 2111} {"train_loss": -23.68324089050293, "global_step": 175258, "epoch": 2111} {"train_loss": -23.903383255004883, "global_step": 175259, "epoch": 2111} {"train_loss": -23.867237091064453, "global_step": 175260, "epoch": 2111} {"train_loss": -23.818517684936523, "global_step": 175261, "epoch": 2111} {"train_loss": -23.94423484802246, "global_step": 175262, "epoch": 2111} {"train_loss": -23.902658462524414, "global_step": 175263, "epoch": 2111} {"train_loss": -23.8167724609375, "global_step": 175264, "epoch": 2111} {"train_loss": -23.69053077697754, "global_step": 175265, "epoch": 2111} {"train_loss": -23.854948043823242, "global_step": 175266, "epoch": 2111} {"train_loss": -23.807722091674805, "global_step": 175267, "epoch": 2111} {"train_loss": -23.768571853637695, "global_step": 175268, "epoch": 2111} {"train_loss": -23.904165267944336, "global_step": 175269, "epoch": 2111} {"train_loss": -23.698999404907227, "global_step": 175270, "epoch": 2111} {"train_loss": -23.867778778076172, "global_step": 175271, "epoch": 2111} {"train_loss": -24.335508346557617, "global_step": 175272, "epoch": 2111} {"train_loss": -23.77034568786621, "global_step": 175273, "epoch": 2111} {"train_loss": -24.136253356933594, "global_step": 175274, "epoch": 2111} {"train_loss": -23.689619064331055, "global_step": 175275, "epoch": 2111} {"train_loss": -24.146617889404297, "global_step": 175276, "epoch": 2111} {"train_loss": -23.83912467956543, "global_step": 175277, "epoch": 2111} {"train_loss": -23.85464096069336, "global_step": 175278, "epoch": 2111} {"train_loss": -23.722753524780273, "global_step": 175279, "epoch": 2111} {"train_loss": -23.765178680419922, "global_step": 175280, "epoch": 2111} {"train_loss": -23.833866119384766, "global_step": 175281, "epoch": 2111} {"train_loss": -23.3956298828125, "global_step": 175282, "epoch": 2111} {"train_loss": -23.22015380859375, "global_step": 175283, "epoch": 2111} {"train_loss": -23.454862594604492, "global_step": 175284, "epoch": 2111} {"train_loss": -23.764774322509766, "global_step": 175285, "epoch": 2111} {"train_loss": -23.910795211791992, "global_step": 175286, "epoch": 2111} {"train_loss": -23.61020851135254, "global_step": 175287, "epoch": 2111} {"train_loss": -23.291532516479492, "global_step": 175288, "epoch": 2111} {"train_loss": -23.840303421020508, "global_step": 175289, "epoch": 2111} {"train_loss": -23.67763900756836, "global_step": 175290, "epoch": 2111} {"train_loss": -23.558887481689453, "global_step": 175291, "epoch": 2111} {"train_loss": -23.435009002685547, "global_step": 175292, "epoch": 2111} {"train_loss": -23.900693893432617, "global_step": 175293, "epoch": 2111} {"train_loss": -23.312576293945312, "global_step": 175294, "epoch": 2111} {"train_loss": -23.74590680685388, "global_step": 175295, "epoch": 2111, "val_loss": 6289672.0} {"train_loss": -23.036375045776367, "global_step": 175296, "epoch": 2112} {"train_loss": -23.456417083740234, "global_step": 175297, "epoch": 2112} {"train_loss": -23.545581817626953, "global_step": 175298, "epoch": 2112} {"train_loss": -23.643930435180664, "global_step": 175299, "epoch": 2112} {"train_loss": -23.692140579223633, "global_step": 175300, "epoch": 2112} {"train_loss": -23.512834548950195, "global_step": 175301, "epoch": 2112} {"train_loss": -23.510478973388672, "global_step": 175302, "epoch": 2112} {"train_loss": -23.81720733642578, "global_step": 175303, "epoch": 2112} {"train_loss": -23.51003074645996, "global_step": 175304, "epoch": 2112} {"train_loss": -23.59568214416504, "global_step": 175305, "epoch": 2112} {"train_loss": -23.839841842651367, "global_step": 175306, "epoch": 2112} {"train_loss": -23.5477237701416, "global_step": 175307, "epoch": 2112} {"train_loss": -23.66135025024414, "global_step": 175308, "epoch": 2112} {"train_loss": -23.833690643310547, "global_step": 175309, "epoch": 2112} {"train_loss": -23.38054656982422, "global_step": 175310, "epoch": 2112} {"train_loss": -23.606245040893555, "global_step": 175311, "epoch": 2112} {"train_loss": -23.628421783447266, "global_step": 175312, "epoch": 2112} {"train_loss": -23.735334396362305, "global_step": 175313, "epoch": 2112} {"train_loss": -23.65092658996582, "global_step": 175314, "epoch": 2112} {"train_loss": -23.6949462890625, "global_step": 175315, "epoch": 2112} {"train_loss": -23.848909378051758, "global_step": 175316, "epoch": 2112} {"train_loss": -23.99791145324707, "global_step": 175317, "epoch": 2112} {"train_loss": -23.792020797729492, "global_step": 175318, "epoch": 2112} {"train_loss": -23.740201950073242, "global_step": 175319, "epoch": 2112} {"train_loss": -23.640668869018555, "global_step": 175320, "epoch": 2112} {"train_loss": -24.033313751220703, "global_step": 175321, "epoch": 2112} {"train_loss": -23.772842407226562, "global_step": 175322, "epoch": 2112} {"train_loss": -23.7215633392334, "global_step": 175323, "epoch": 2112} {"train_loss": -23.528583526611328, "global_step": 175324, "epoch": 2112} {"train_loss": -23.75669288635254, "global_step": 175325, "epoch": 2112} {"train_loss": -24.116981506347656, "global_step": 175326, "epoch": 2112} {"train_loss": -23.51078224182129, "global_step": 175327, "epoch": 2112} {"train_loss": -23.334321975708008, "global_step": 175328, "epoch": 2112} {"train_loss": -24.13044548034668, "global_step": 175329, "epoch": 2112} {"train_loss": -23.643665313720703, "global_step": 175330, "epoch": 2112} {"train_loss": -23.59431266784668, "global_step": 175331, "epoch": 2112} {"train_loss": -23.77663230895996, "global_step": 175332, "epoch": 2112} {"train_loss": -23.845325469970703, "global_step": 175333, "epoch": 2112} {"train_loss": -23.77781867980957, "global_step": 175334, "epoch": 2112} {"train_loss": -23.97397232055664, "global_step": 175335, "epoch": 2112} {"train_loss": -23.706418991088867, "global_step": 175336, "epoch": 2112} {"train_loss": -23.089645385742188, "global_step": 175337, "epoch": 2112} {"train_loss": -23.79199981689453, "global_step": 175338, "epoch": 2112} {"train_loss": -23.91766357421875, "global_step": 175339, "epoch": 2112} {"train_loss": -23.52595329284668, "global_step": 175340, "epoch": 2112} {"train_loss": -23.638517379760742, "global_step": 175341, "epoch": 2112} {"train_loss": -23.597827911376953, "global_step": 175342, "epoch": 2112} {"train_loss": -23.80817985534668, "global_step": 175343, "epoch": 2112} {"train_loss": -23.541330337524414, "global_step": 175344, "epoch": 2112} {"train_loss": -23.755640029907227, "global_step": 175345, "epoch": 2112} {"train_loss": -23.459192276000977, "global_step": 175346, "epoch": 2112} {"train_loss": -23.90869140625, "global_step": 175347, "epoch": 2112} {"train_loss": -22.965879440307617, "global_step": 175348, "epoch": 2112} {"train_loss": -23.513202667236328, "global_step": 175349, "epoch": 2112} {"train_loss": -23.3640193939209, "global_step": 175350, "epoch": 2112} {"train_loss": -24.019495010375977, "global_step": 175351, "epoch": 2112} {"train_loss": -23.534414291381836, "global_step": 175352, "epoch": 2112} {"train_loss": -23.69144630432129, "global_step": 175353, "epoch": 2112} {"train_loss": -23.566770553588867, "global_step": 175354, "epoch": 2112} {"train_loss": -23.983060836791992, "global_step": 175355, "epoch": 2112} {"train_loss": -23.837793350219727, "global_step": 175356, "epoch": 2112} {"train_loss": -24.119497299194336, "global_step": 175357, "epoch": 2112} {"train_loss": -23.7672176361084, "global_step": 175358, "epoch": 2112} {"train_loss": -23.90207862854004, "global_step": 175359, "epoch": 2112} {"train_loss": -24.101764678955078, "global_step": 175360, "epoch": 2112} {"train_loss": -24.1416072845459, "global_step": 175361, "epoch": 2112} {"train_loss": -23.614225387573242, "global_step": 175362, "epoch": 2112} {"train_loss": -23.97174072265625, "global_step": 175363, "epoch": 2112} {"train_loss": -23.475574493408203, "global_step": 175364, "epoch": 2112} {"train_loss": -24.204072952270508, "global_step": 175365, "epoch": 2112} {"train_loss": -23.87430191040039, "global_step": 175366, "epoch": 2112} {"train_loss": -23.965574264526367, "global_step": 175367, "epoch": 2112} {"train_loss": -23.412887573242188, "global_step": 175368, "epoch": 2112} {"train_loss": -23.87217140197754, "global_step": 175369, "epoch": 2112} {"train_loss": -23.81788444519043, "global_step": 175370, "epoch": 2112} {"train_loss": -23.72328758239746, "global_step": 175371, "epoch": 2112} {"train_loss": -23.80765151977539, "global_step": 175372, "epoch": 2112} {"train_loss": -24.180866241455078, "global_step": 175373, "epoch": 2112} {"train_loss": -24.10040283203125, "global_step": 175374, "epoch": 2112} {"train_loss": -23.622135162353516, "global_step": 175375, "epoch": 2112} {"train_loss": -23.764616012573242, "global_step": 175376, "epoch": 2112} {"train_loss": -23.986515045166016, "global_step": 175377, "epoch": 2112} {"train_loss": -23.730958088334784, "global_step": 175378, "epoch": 2112, "val_loss": 6324303.0} {"train_loss": -23.40447235107422, "global_step": 175379, "epoch": 2113} {"train_loss": -23.765470504760742, "global_step": 175380, "epoch": 2113} {"train_loss": -23.32535171508789, "global_step": 175381, "epoch": 2113} {"train_loss": -23.723569869995117, "global_step": 175382, "epoch": 2113} {"train_loss": -23.457439422607422, "global_step": 175383, "epoch": 2113} {"train_loss": -23.479461669921875, "global_step": 175384, "epoch": 2113} {"train_loss": -23.148000717163086, "global_step": 175385, "epoch": 2113} {"train_loss": -23.798582077026367, "global_step": 175386, "epoch": 2113} {"train_loss": -23.56378173828125, "global_step": 175387, "epoch": 2113} {"train_loss": -23.173215866088867, "global_step": 175388, "epoch": 2113} {"train_loss": -23.44187355041504, "global_step": 175389, "epoch": 2113} {"train_loss": -23.41438865661621, "global_step": 175390, "epoch": 2113} {"train_loss": -23.392637252807617, "global_step": 175391, "epoch": 2113} {"train_loss": -23.849599838256836, "global_step": 175392, "epoch": 2113} {"train_loss": -23.36949920654297, "global_step": 175393, "epoch": 2113} {"train_loss": -23.579736709594727, "global_step": 175394, "epoch": 2113} {"train_loss": -23.41482925415039, "global_step": 175395, "epoch": 2113} {"train_loss": -23.548410415649414, "global_step": 175396, "epoch": 2113} {"train_loss": -23.44468116760254, "global_step": 175397, "epoch": 2113} {"train_loss": -23.861915588378906, "global_step": 175398, "epoch": 2113} {"train_loss": -23.19855308532715, "global_step": 175399, "epoch": 2113} {"train_loss": -23.517013549804688, "global_step": 175400, "epoch": 2113} {"train_loss": -23.799345016479492, "global_step": 175401, "epoch": 2113} {"train_loss": -23.30577850341797, "global_step": 175402, "epoch": 2113} {"train_loss": -23.79567527770996, "global_step": 175403, "epoch": 2113} {"train_loss": -23.3283748626709, "global_step": 175404, "epoch": 2113} {"train_loss": -23.667295455932617, "global_step": 175405, "epoch": 2113} {"train_loss": -23.1004638671875, "global_step": 175406, "epoch": 2113} {"train_loss": -23.886051177978516, "global_step": 175407, "epoch": 2113} {"train_loss": -23.707305908203125, "global_step": 175408, "epoch": 2113} {"train_loss": -23.71998405456543, "global_step": 175409, "epoch": 2113} {"train_loss": -23.74576759338379, "global_step": 175410, "epoch": 2113} {"train_loss": -23.761037826538086, "global_step": 175411, "epoch": 2113} {"train_loss": -23.77674674987793, "global_step": 175412, "epoch": 2113} {"train_loss": -23.722259521484375, "global_step": 175413, "epoch": 2113} {"train_loss": -23.686189651489258, "global_step": 175414, "epoch": 2113} {"train_loss": -23.733814239501953, "global_step": 175415, "epoch": 2113} {"train_loss": -23.92395782470703, "global_step": 175416, "epoch": 2113} {"train_loss": -23.327655792236328, "global_step": 175417, "epoch": 2113} {"train_loss": -24.020902633666992, "global_step": 175418, "epoch": 2113} {"train_loss": -23.72727394104004, "global_step": 175419, "epoch": 2113} {"train_loss": -23.701555252075195, "global_step": 175420, "epoch": 2113} {"train_loss": -23.699460983276367, "global_step": 175421, "epoch": 2113} {"train_loss": -24.060775756835938, "global_step": 175422, "epoch": 2113} {"train_loss": -23.645416259765625, "global_step": 175423, "epoch": 2113} {"train_loss": -23.951791763305664, "global_step": 175424, "epoch": 2113} {"train_loss": -23.792102813720703, "global_step": 175425, "epoch": 2113} {"train_loss": -23.733430862426758, "global_step": 175426, "epoch": 2113} {"train_loss": -23.790189743041992, "global_step": 175427, "epoch": 2113} {"train_loss": -23.631742477416992, "global_step": 175428, "epoch": 2113} {"train_loss": -23.659854888916016, "global_step": 175429, "epoch": 2113} {"train_loss": -23.75111961364746, "global_step": 175430, "epoch": 2113} {"train_loss": -24.061817169189453, "global_step": 175431, "epoch": 2113} {"train_loss": -24.178466796875, "global_step": 175432, "epoch": 2113} {"train_loss": -23.8295955657959, "global_step": 175433, "epoch": 2113} {"train_loss": -23.716909408569336, "global_step": 175434, "epoch": 2113} {"train_loss": -23.186811447143555, "global_step": 175435, "epoch": 2113} {"train_loss": -24.095951080322266, "global_step": 175436, "epoch": 2113} {"train_loss": -24.08713722229004, "global_step": 175437, "epoch": 2113} {"train_loss": -23.793195724487305, "global_step": 175438, "epoch": 2113} {"train_loss": -23.956628799438477, "global_step": 175439, "epoch": 2113} {"train_loss": -24.052595138549805, "global_step": 175440, "epoch": 2113} {"train_loss": -24.171445846557617, "global_step": 175441, "epoch": 2113} {"train_loss": -23.241884231567383, "global_step": 175442, "epoch": 2113} {"train_loss": -23.757272720336914, "global_step": 175443, "epoch": 2113} {"train_loss": -23.424232482910156, "global_step": 175444, "epoch": 2113} {"train_loss": -23.687223434448242, "global_step": 175445, "epoch": 2113} {"train_loss": -23.79401969909668, "global_step": 175446, "epoch": 2113} {"train_loss": -23.834684371948242, "global_step": 175447, "epoch": 2113} {"train_loss": -23.8531551361084, "global_step": 175448, "epoch": 2113} {"train_loss": -23.53883171081543, "global_step": 175449, "epoch": 2113} {"train_loss": -23.58527946472168, "global_step": 175450, "epoch": 2113} {"train_loss": -23.825592041015625, "global_step": 175451, "epoch": 2113} {"train_loss": -24.44758415222168, "global_step": 175452, "epoch": 2113} {"train_loss": -23.968713760375977, "global_step": 175453, "epoch": 2113} {"train_loss": -23.829376220703125, "global_step": 175454, "epoch": 2113} {"train_loss": -24.083585739135742, "global_step": 175455, "epoch": 2113} {"train_loss": -24.112411499023438, "global_step": 175456, "epoch": 2113} {"train_loss": -23.883956909179688, "global_step": 175457, "epoch": 2113} {"train_loss": -23.719675064086914, "global_step": 175458, "epoch": 2113} {"train_loss": -24.05718421936035, "global_step": 175459, "epoch": 2113} {"train_loss": -23.87647247314453, "global_step": 175460, "epoch": 2113} {"train_loss": -23.703451937939747, "global_step": 175461, "epoch": 2113, "val_loss": 6383425.0} {"train_loss": -23.28365135192871, "global_step": 175462, "epoch": 2114} {"train_loss": -23.29665184020996, "global_step": 175463, "epoch": 2114} {"train_loss": -23.2491512298584, "global_step": 175464, "epoch": 2114} {"train_loss": -23.289234161376953, "global_step": 175465, "epoch": 2114} {"train_loss": -23.664031982421875, "global_step": 175466, "epoch": 2114} {"train_loss": -23.6810359954834, "global_step": 175467, "epoch": 2114} {"train_loss": -23.659284591674805, "global_step": 175468, "epoch": 2114} {"train_loss": -23.502981185913086, "global_step": 175469, "epoch": 2114} {"train_loss": -23.873830795288086, "global_step": 175470, "epoch": 2114} {"train_loss": -23.346166610717773, "global_step": 175471, "epoch": 2114} {"train_loss": -23.708740234375, "global_step": 175472, "epoch": 2114} {"train_loss": -23.780202865600586, "global_step": 175473, "epoch": 2114} {"train_loss": -23.91562843322754, "global_step": 175474, "epoch": 2114} {"train_loss": -23.246381759643555, "global_step": 175475, "epoch": 2114} {"train_loss": -23.87734031677246, "global_step": 175476, "epoch": 2114} {"train_loss": -23.68617820739746, "global_step": 175477, "epoch": 2114} {"train_loss": -23.799564361572266, "global_step": 175478, "epoch": 2114} {"train_loss": -24.012935638427734, "global_step": 175479, "epoch": 2114} {"train_loss": -24.004425048828125, "global_step": 175480, "epoch": 2114} {"train_loss": -23.622528076171875, "global_step": 175481, "epoch": 2114} {"train_loss": -23.940412521362305, "global_step": 175482, "epoch": 2114} {"train_loss": -23.82815933227539, "global_step": 175483, "epoch": 2114} {"train_loss": -24.067411422729492, "global_step": 175484, "epoch": 2114} {"train_loss": -23.656240463256836, "global_step": 175485, "epoch": 2114} {"train_loss": -23.825902938842773, "global_step": 175486, "epoch": 2114} {"train_loss": -23.902257919311523, "global_step": 175487, "epoch": 2114} {"train_loss": -23.87265396118164, "global_step": 175488, "epoch": 2114} {"train_loss": -23.846363067626953, "global_step": 175489, "epoch": 2114} {"train_loss": -23.34498405456543, "global_step": 175490, "epoch": 2114} {"train_loss": -23.77904510498047, "global_step": 175491, "epoch": 2114} {"train_loss": -23.793149948120117, "global_step": 175492, "epoch": 2114} {"train_loss": -23.73402976989746, "global_step": 175493, "epoch": 2114} {"train_loss": -24.256837844848633, "global_step": 175494, "epoch": 2114} {"train_loss": -23.71819496154785, "global_step": 175495, "epoch": 2114} {"train_loss": -24.369831085205078, "global_step": 175496, "epoch": 2114} {"train_loss": -23.94321060180664, "global_step": 175497, "epoch": 2114} {"train_loss": -24.168869018554688, "global_step": 175498, "epoch": 2114} {"train_loss": -23.76544761657715, "global_step": 175499, "epoch": 2114} {"train_loss": -23.774993896484375, "global_step": 175500, "epoch": 2114} {"train_loss": -23.487974166870117, "global_step": 175501, "epoch": 2114} {"train_loss": -23.585134506225586, "global_step": 175502, "epoch": 2114} {"train_loss": -23.6483154296875, "global_step": 175503, "epoch": 2114} {"train_loss": -23.921422958374023, "global_step": 175504, "epoch": 2114} {"train_loss": -23.549592971801758, "global_step": 175505, "epoch": 2114} {"train_loss": -23.708791732788086, "global_step": 175506, "epoch": 2114} {"train_loss": -23.87774085998535, "global_step": 175507, "epoch": 2114} {"train_loss": -23.926206588745117, "global_step": 175508, "epoch": 2114} {"train_loss": -23.71949577331543, "global_step": 175509, "epoch": 2114} {"train_loss": -23.80365562438965, "global_step": 175510, "epoch": 2114} {"train_loss": -23.62609100341797, "global_step": 175511, "epoch": 2114} {"train_loss": -23.62518882751465, "global_step": 175512, "epoch": 2114} {"train_loss": -23.650299072265625, "global_step": 175513, "epoch": 2114} {"train_loss": -24.140151977539062, "global_step": 175514, "epoch": 2114} {"train_loss": -23.70291519165039, "global_step": 175515, "epoch": 2114} {"train_loss": -23.79718589782715, "global_step": 175516, "epoch": 2114} {"train_loss": -23.90070152282715, "global_step": 175517, "epoch": 2114} {"train_loss": -23.8245849609375, "global_step": 175518, "epoch": 2114} {"train_loss": -23.590497970581055, "global_step": 175519, "epoch": 2114} {"train_loss": -23.84727668762207, "global_step": 175520, "epoch": 2114} {"train_loss": -23.536945343017578, "global_step": 175521, "epoch": 2114} {"train_loss": -23.78443717956543, "global_step": 175522, "epoch": 2114} {"train_loss": -23.74146270751953, "global_step": 175523, "epoch": 2114} {"train_loss": -23.886940002441406, "global_step": 175524, "epoch": 2114} {"train_loss": -23.56645965576172, "global_step": 175525, "epoch": 2114} {"train_loss": -23.481332778930664, "global_step": 175526, "epoch": 2114} {"train_loss": -23.756502151489258, "global_step": 175527, "epoch": 2114} {"train_loss": -23.45986557006836, "global_step": 175528, "epoch": 2114} {"train_loss": -23.791738510131836, "global_step": 175529, "epoch": 2114} {"train_loss": -23.874176025390625, "global_step": 175530, "epoch": 2114} {"train_loss": -23.72633934020996, "global_step": 175531, "epoch": 2114} {"train_loss": -23.89937400817871, "global_step": 175532, "epoch": 2114} {"train_loss": -23.701589584350586, "global_step": 175533, "epoch": 2114} {"train_loss": -23.53594398498535, "global_step": 175534, "epoch": 2114} {"train_loss": -23.878225326538086, "global_step": 175535, "epoch": 2114} {"train_loss": -23.77630615234375, "global_step": 175536, "epoch": 2114} {"train_loss": -23.43987274169922, "global_step": 175537, "epoch": 2114} {"train_loss": -23.80548095703125, "global_step": 175538, "epoch": 2114} {"train_loss": -23.777671813964844, "global_step": 175539, "epoch": 2114} {"train_loss": -23.95347023010254, "global_step": 175540, "epoch": 2114} {"train_loss": -24.13142967224121, "global_step": 175541, "epoch": 2114} {"train_loss": -23.763444900512695, "global_step": 175542, "epoch": 2114} {"train_loss": -24.008649826049805, "global_step": 175543, "epoch": 2114} {"train_loss": -23.74029582379812, "global_step": 175544, "epoch": 2114, "val_loss": 6356364.0} {"train_loss": -23.385522842407227, "global_step": 175545, "epoch": 2115} {"train_loss": -23.48774528503418, "global_step": 175546, "epoch": 2115} {"train_loss": -23.291641235351562, "global_step": 175547, "epoch": 2115} {"train_loss": -22.882413864135742, "global_step": 175548, "epoch": 2115} {"train_loss": -23.236364364624023, "global_step": 175549, "epoch": 2115} {"train_loss": -23.377819061279297, "global_step": 175550, "epoch": 2115} {"train_loss": -22.903491973876953, "global_step": 175551, "epoch": 2115} {"train_loss": -23.279199600219727, "global_step": 175552, "epoch": 2115} {"train_loss": -23.39438247680664, "global_step": 175553, "epoch": 2115} {"train_loss": -23.30360221862793, "global_step": 175554, "epoch": 2115} {"train_loss": -23.439451217651367, "global_step": 175555, "epoch": 2115} {"train_loss": -23.471372604370117, "global_step": 175556, "epoch": 2115} {"train_loss": -23.695859909057617, "global_step": 175557, "epoch": 2115} {"train_loss": -22.948766708374023, "global_step": 175558, "epoch": 2115} {"train_loss": -23.147777557373047, "global_step": 175559, "epoch": 2115} {"train_loss": -23.38212013244629, "global_step": 175560, "epoch": 2115} {"train_loss": -23.505918502807617, "global_step": 175561, "epoch": 2115} {"train_loss": -23.50543212890625, "global_step": 175562, "epoch": 2115} {"train_loss": -23.572711944580078, "global_step": 175563, "epoch": 2115} {"train_loss": -23.5571346282959, "global_step": 175564, "epoch": 2115} {"train_loss": -23.494873046875, "global_step": 175565, "epoch": 2115} {"train_loss": -23.205533981323242, "global_step": 175566, "epoch": 2115} {"train_loss": -23.537946701049805, "global_step": 175567, "epoch": 2115} {"train_loss": -23.805267333984375, "global_step": 175568, "epoch": 2115} {"train_loss": -23.855005264282227, "global_step": 175569, "epoch": 2115} {"train_loss": -23.814664840698242, "global_step": 175570, "epoch": 2115} {"train_loss": -23.800174713134766, "global_step": 175571, "epoch": 2115} {"train_loss": -23.89316177368164, "global_step": 175572, "epoch": 2115} {"train_loss": -23.44427490234375, "global_step": 175573, "epoch": 2115} {"train_loss": -23.838825225830078, "global_step": 175574, "epoch": 2115} {"train_loss": -23.975664138793945, "global_step": 175575, "epoch": 2115} {"train_loss": -23.74369239807129, "global_step": 175576, "epoch": 2115} {"train_loss": -23.992387771606445, "global_step": 175577, "epoch": 2115} {"train_loss": -23.854490280151367, "global_step": 175578, "epoch": 2115} {"train_loss": -23.670759201049805, "global_step": 175579, "epoch": 2115} {"train_loss": -23.92148780822754, "global_step": 175580, "epoch": 2115} {"train_loss": -23.732446670532227, "global_step": 175581, "epoch": 2115} {"train_loss": -23.716676712036133, "global_step": 175582, "epoch": 2115} {"train_loss": -23.79789161682129, "global_step": 175583, "epoch": 2115} {"train_loss": -23.6685848236084, "global_step": 175584, "epoch": 2115} {"train_loss": -23.773725509643555, "global_step": 175585, "epoch": 2115} {"train_loss": -23.934085845947266, "global_step": 175586, "epoch": 2115} {"train_loss": -23.69662094116211, "global_step": 175587, "epoch": 2115} {"train_loss": -23.674020767211914, "global_step": 175588, "epoch": 2115} {"train_loss": -23.64029884338379, "global_step": 175589, "epoch": 2115} {"train_loss": -24.018962860107422, "global_step": 175590, "epoch": 2115} {"train_loss": -24.235021591186523, "global_step": 175591, "epoch": 2115} {"train_loss": -23.960886001586914, "global_step": 175592, "epoch": 2115} {"train_loss": -24.284271240234375, "global_step": 175593, "epoch": 2115} {"train_loss": -23.702301025390625, "global_step": 175594, "epoch": 2115} {"train_loss": -23.802507400512695, "global_step": 175595, "epoch": 2115} {"train_loss": -23.876684188842773, "global_step": 175596, "epoch": 2115} {"train_loss": -24.144657135009766, "global_step": 175597, "epoch": 2115} {"train_loss": -23.748960494995117, "global_step": 175598, "epoch": 2115} {"train_loss": -23.47699546813965, "global_step": 175599, "epoch": 2115} {"train_loss": -23.743621826171875, "global_step": 175600, "epoch": 2115} {"train_loss": -24.46742057800293, "global_step": 175601, "epoch": 2115} {"train_loss": -23.89317512512207, "global_step": 175602, "epoch": 2115} {"train_loss": -23.862226486206055, "global_step": 175603, "epoch": 2115} {"train_loss": -23.740581512451172, "global_step": 175604, "epoch": 2115} {"train_loss": -23.783355712890625, "global_step": 175605, "epoch": 2115} {"train_loss": -23.895105361938477, "global_step": 175606, "epoch": 2115} {"train_loss": -23.837432861328125, "global_step": 175607, "epoch": 2115} {"train_loss": -23.81693458557129, "global_step": 175608, "epoch": 2115} {"train_loss": -23.970800399780273, "global_step": 175609, "epoch": 2115} {"train_loss": -24.07086944580078, "global_step": 175610, "epoch": 2115} {"train_loss": -24.29290199279785, "global_step": 175611, "epoch": 2115} {"train_loss": -23.94779396057129, "global_step": 175612, "epoch": 2115} {"train_loss": -24.134048461914062, "global_step": 175613, "epoch": 2115} {"train_loss": -23.865373611450195, "global_step": 175614, "epoch": 2115} {"train_loss": -23.82807731628418, "global_step": 175615, "epoch": 2115} {"train_loss": -23.653928756713867, "global_step": 175616, "epoch": 2115} {"train_loss": -23.776273727416992, "global_step": 175617, "epoch": 2115} {"train_loss": -23.82904624938965, "global_step": 175618, "epoch": 2115} {"train_loss": -23.86487579345703, "global_step": 175619, "epoch": 2115} {"train_loss": -23.990097045898438, "global_step": 175620, "epoch": 2115} {"train_loss": -23.907087326049805, "global_step": 175621, "epoch": 2115} {"train_loss": -23.76780128479004, "global_step": 175622, "epoch": 2115} {"train_loss": -23.62775230407715, "global_step": 175623, "epoch": 2115} {"train_loss": -23.753238677978516, "global_step": 175624, "epoch": 2115} {"train_loss": -23.809865951538086, "global_step": 175625, "epoch": 2115} {"train_loss": -24.1309814453125, "global_step": 175626, "epoch": 2115} {"train_loss": -23.715034438903075, "global_step": 175627, "epoch": 2115, "val_loss": 6297224.0} {"train_loss": -23.47752571105957, "global_step": 175628, "epoch": 2116} {"train_loss": -23.420820236206055, "global_step": 175629, "epoch": 2116} {"train_loss": -23.76795768737793, "global_step": 175630, "epoch": 2116} {"train_loss": -23.611711502075195, "global_step": 175631, "epoch": 2116} {"train_loss": -23.443801879882812, "global_step": 175632, "epoch": 2116} {"train_loss": -23.503332138061523, "global_step": 175633, "epoch": 2116} {"train_loss": -23.65931510925293, "global_step": 175634, "epoch": 2116} {"train_loss": -23.557022094726562, "global_step": 175635, "epoch": 2116} {"train_loss": -23.411832809448242, "global_step": 175636, "epoch": 2116} {"train_loss": -23.453947067260742, "global_step": 175637, "epoch": 2116} {"train_loss": -23.564430236816406, "global_step": 175638, "epoch": 2116} {"train_loss": -23.442550659179688, "global_step": 175639, "epoch": 2116} {"train_loss": -23.717849731445312, "global_step": 175640, "epoch": 2116} {"train_loss": -23.852535247802734, "global_step": 175641, "epoch": 2116} {"train_loss": -23.227670669555664, "global_step": 175642, "epoch": 2116} {"train_loss": -23.58716583251953, "global_step": 175643, "epoch": 2116} {"train_loss": -23.830440521240234, "global_step": 175644, "epoch": 2116} {"train_loss": -23.517837524414062, "global_step": 175645, "epoch": 2116} {"train_loss": -23.664655685424805, "global_step": 175646, "epoch": 2116} {"train_loss": -23.531417846679688, "global_step": 175647, "epoch": 2116} {"train_loss": -24.114622116088867, "global_step": 175648, "epoch": 2116} {"train_loss": -23.79975700378418, "global_step": 175649, "epoch": 2116} {"train_loss": -23.479703903198242, "global_step": 175650, "epoch": 2116} {"train_loss": -23.790555953979492, "global_step": 175651, "epoch": 2116} {"train_loss": -23.667184829711914, "global_step": 175652, "epoch": 2116} {"train_loss": -23.89203453063965, "global_step": 175653, "epoch": 2116} {"train_loss": -23.510986328125, "global_step": 175654, "epoch": 2116} {"train_loss": -23.530384063720703, "global_step": 175655, "epoch": 2116} {"train_loss": -23.78375244140625, "global_step": 175656, "epoch": 2116} {"train_loss": -23.792156219482422, "global_step": 175657, "epoch": 2116} {"train_loss": -23.96315574645996, "global_step": 175658, "epoch": 2116} {"train_loss": -23.856868743896484, "global_step": 175659, "epoch": 2116} {"train_loss": -23.747426986694336, "global_step": 175660, "epoch": 2116} {"train_loss": -24.087919235229492, "global_step": 175661, "epoch": 2116} {"train_loss": -23.97511863708496, "global_step": 175662, "epoch": 2116} {"train_loss": -23.953754425048828, "global_step": 175663, "epoch": 2116} {"train_loss": -24.073801040649414, "global_step": 175664, "epoch": 2116} {"train_loss": -23.673416137695312, "global_step": 175665, "epoch": 2116} {"train_loss": -23.798355102539062, "global_step": 175666, "epoch": 2116} {"train_loss": -23.81197166442871, "global_step": 175667, "epoch": 2116} {"train_loss": -23.77973747253418, "global_step": 175668, "epoch": 2116} {"train_loss": -24.15696144104004, "global_step": 175669, "epoch": 2116} {"train_loss": -23.83295249938965, "global_step": 175670, "epoch": 2116} {"train_loss": -23.98382568359375, "global_step": 175671, "epoch": 2116} {"train_loss": -23.733163833618164, "global_step": 175672, "epoch": 2116} {"train_loss": -23.881864547729492, "global_step": 175673, "epoch": 2116} {"train_loss": -23.741819381713867, "global_step": 175674, "epoch": 2116} {"train_loss": -23.819406509399414, "global_step": 175675, "epoch": 2116} {"train_loss": -23.975460052490234, "global_step": 175676, "epoch": 2116} {"train_loss": -23.6649112701416, "global_step": 175677, "epoch": 2116} {"train_loss": -23.82304573059082, "global_step": 175678, "epoch": 2116} {"train_loss": -23.696033477783203, "global_step": 175679, "epoch": 2116} {"train_loss": -23.94712257385254, "global_step": 175680, "epoch": 2116} {"train_loss": -23.931747436523438, "global_step": 175681, "epoch": 2116} {"train_loss": -23.946697235107422, "global_step": 175682, "epoch": 2116} {"train_loss": -23.7099552154541, "global_step": 175683, "epoch": 2116} {"train_loss": -23.5838623046875, "global_step": 175684, "epoch": 2116} {"train_loss": -24.06174659729004, "global_step": 175685, "epoch": 2116} {"train_loss": -23.65842056274414, "global_step": 175686, "epoch": 2116} {"train_loss": -23.436227798461914, "global_step": 175687, "epoch": 2116} {"train_loss": -24.07964324951172, "global_step": 175688, "epoch": 2116} {"train_loss": -23.732940673828125, "global_step": 175689, "epoch": 2116} {"train_loss": -24.06743812561035, "global_step": 175690, "epoch": 2116} {"train_loss": -23.45321273803711, "global_step": 175691, "epoch": 2116} {"train_loss": -23.56937599182129, "global_step": 175692, "epoch": 2116} {"train_loss": -24.06125831604004, "global_step": 175693, "epoch": 2116} {"train_loss": -23.308012008666992, "global_step": 175694, "epoch": 2116} {"train_loss": -23.885440826416016, "global_step": 175695, "epoch": 2116} {"train_loss": -23.957876205444336, "global_step": 175696, "epoch": 2116} {"train_loss": -23.894376754760742, "global_step": 175697, "epoch": 2116} {"train_loss": -23.879756927490234, "global_step": 175698, "epoch": 2116} {"train_loss": -23.46623420715332, "global_step": 175699, "epoch": 2116} {"train_loss": -23.79735565185547, "global_step": 175700, "epoch": 2116} {"train_loss": -23.858625411987305, "global_step": 175701, "epoch": 2116} {"train_loss": -23.31409454345703, "global_step": 175702, "epoch": 2116} {"train_loss": -23.68585777282715, "global_step": 175703, "epoch": 2116} {"train_loss": -23.634851455688477, "global_step": 175704, "epoch": 2116} {"train_loss": -23.731468200683594, "global_step": 175705, "epoch": 2116} {"train_loss": -23.831859588623047, "global_step": 175706, "epoch": 2116} {"train_loss": -24.058931350708008, "global_step": 175707, "epoch": 2116} {"train_loss": -23.850509643554688, "global_step": 175708, "epoch": 2116} {"train_loss": -23.942785263061523, "global_step": 175709, "epoch": 2116} {"train_loss": -23.762745822768615, "global_step": 175710, "epoch": 2116, "val_loss": 6366198.0} {"train_loss": -22.880300521850586, "global_step": 175711, "epoch": 2117} {"train_loss": -23.595943450927734, "global_step": 175712, "epoch": 2117} {"train_loss": -23.512540817260742, "global_step": 175713, "epoch": 2117} {"train_loss": -23.638683319091797, "global_step": 175714, "epoch": 2117} {"train_loss": -23.36115264892578, "global_step": 175715, "epoch": 2117} {"train_loss": -23.535490036010742, "global_step": 175716, "epoch": 2117} {"train_loss": -23.406591415405273, "global_step": 175717, "epoch": 2117} {"train_loss": -23.373395919799805, "global_step": 175718, "epoch": 2117} {"train_loss": -23.092960357666016, "global_step": 175719, "epoch": 2117} {"train_loss": -23.893239974975586, "global_step": 175720, "epoch": 2117} {"train_loss": -23.25672721862793, "global_step": 175721, "epoch": 2117} {"train_loss": -23.854156494140625, "global_step": 175722, "epoch": 2117} {"train_loss": -23.079212188720703, "global_step": 175723, "epoch": 2117} {"train_loss": -23.739913940429688, "global_step": 175724, "epoch": 2117} {"train_loss": -23.585437774658203, "global_step": 175725, "epoch": 2117} {"train_loss": -23.276277542114258, "global_step": 175726, "epoch": 2117} {"train_loss": -23.33613395690918, "global_step": 175727, "epoch": 2117} {"train_loss": -23.215343475341797, "global_step": 175728, "epoch": 2117} {"train_loss": -23.421823501586914, "global_step": 175729, "epoch": 2117} {"train_loss": -23.415403366088867, "global_step": 175730, "epoch": 2117} {"train_loss": -23.68535041809082, "global_step": 175731, "epoch": 2117} {"train_loss": -23.849315643310547, "global_step": 175732, "epoch": 2117} {"train_loss": -23.642545700073242, "global_step": 175733, "epoch": 2117} {"train_loss": -23.664451599121094, "global_step": 175734, "epoch": 2117} {"train_loss": -23.86054801940918, "global_step": 175735, "epoch": 2117} {"train_loss": -23.59382438659668, "global_step": 175736, "epoch": 2117} {"train_loss": -23.9644718170166, "global_step": 175737, "epoch": 2117} {"train_loss": -24.097631454467773, "global_step": 175738, "epoch": 2117} {"train_loss": -23.437210083007812, "global_step": 175739, "epoch": 2117} {"train_loss": -23.750900268554688, "global_step": 175740, "epoch": 2117} {"train_loss": -23.687299728393555, "global_step": 175741, "epoch": 2117} {"train_loss": -23.433408737182617, "global_step": 175742, "epoch": 2117} {"train_loss": -23.627689361572266, "global_step": 175743, "epoch": 2117} {"train_loss": -23.925806045532227, "global_step": 175744, "epoch": 2117} {"train_loss": -23.605859756469727, "global_step": 175745, "epoch": 2117} {"train_loss": -24.148555755615234, "global_step": 175746, "epoch": 2117} {"train_loss": -23.864171981811523, "global_step": 175747, "epoch": 2117} {"train_loss": -23.71271514892578, "global_step": 175748, "epoch": 2117} {"train_loss": -24.024892807006836, "global_step": 175749, "epoch": 2117} {"train_loss": -24.24186897277832, "global_step": 175750, "epoch": 2117} {"train_loss": -23.776927947998047, "global_step": 175751, "epoch": 2117} {"train_loss": -23.530731201171875, "global_step": 175752, "epoch": 2117} {"train_loss": -24.075050354003906, "global_step": 175753, "epoch": 2117} {"train_loss": -23.827558517456055, "global_step": 175754, "epoch": 2117} {"train_loss": -23.75210952758789, "global_step": 175755, "epoch": 2117} {"train_loss": -24.62445068359375, "global_step": 175756, "epoch": 2117} {"train_loss": -23.373371124267578, "global_step": 175757, "epoch": 2117} {"train_loss": -23.680866241455078, "global_step": 175758, "epoch": 2117} {"train_loss": -23.42560386657715, "global_step": 175759, "epoch": 2117} {"train_loss": -23.474979400634766, "global_step": 175760, "epoch": 2117} {"train_loss": -24.08591651916504, "global_step": 175761, "epoch": 2117} {"train_loss": -24.25021743774414, "global_step": 175762, "epoch": 2117} {"train_loss": -23.670209884643555, "global_step": 175763, "epoch": 2117} {"train_loss": -23.2760066986084, "global_step": 175764, "epoch": 2117} {"train_loss": -24.009218215942383, "global_step": 175765, "epoch": 2117} {"train_loss": -23.522428512573242, "global_step": 175766, "epoch": 2117} {"train_loss": -23.863876342773438, "global_step": 175767, "epoch": 2117} {"train_loss": -23.982324600219727, "global_step": 175768, "epoch": 2117} {"train_loss": -23.79581069946289, "global_step": 175769, "epoch": 2117} {"train_loss": -23.834741592407227, "global_step": 175770, "epoch": 2117} {"train_loss": -23.53697967529297, "global_step": 175771, "epoch": 2117} {"train_loss": -23.7209415435791, "global_step": 175772, "epoch": 2117} {"train_loss": -23.73487663269043, "global_step": 175773, "epoch": 2117} {"train_loss": -23.54713249206543, "global_step": 175774, "epoch": 2117} {"train_loss": -24.018835067749023, "global_step": 175775, "epoch": 2117} {"train_loss": -23.873706817626953, "global_step": 175776, "epoch": 2117} {"train_loss": -23.781444549560547, "global_step": 175777, "epoch": 2117} {"train_loss": -23.642629623413086, "global_step": 175778, "epoch": 2117} {"train_loss": -24.337339401245117, "global_step": 175779, "epoch": 2117} {"train_loss": -23.95241355895996, "global_step": 175780, "epoch": 2117} {"train_loss": -23.848804473876953, "global_step": 175781, "epoch": 2117} {"train_loss": -23.75008201599121, "global_step": 175782, "epoch": 2117} {"train_loss": -23.952268600463867, "global_step": 175783, "epoch": 2117} {"train_loss": -24.169797897338867, "global_step": 175784, "epoch": 2117} {"train_loss": -23.742605209350586, "global_step": 175785, "epoch": 2117} {"train_loss": -23.822772979736328, "global_step": 175786, "epoch": 2117} {"train_loss": -23.944229125976562, "global_step": 175787, "epoch": 2117} {"train_loss": -23.854909896850586, "global_step": 175788, "epoch": 2117} {"train_loss": -23.844064712524414, "global_step": 175789, "epoch": 2117} {"train_loss": -23.26434898376465, "global_step": 175790, "epoch": 2117} {"train_loss": -23.554250717163086, "global_step": 175791, "epoch": 2117} {"train_loss": -23.70969009399414, "global_step": 175792, "epoch": 2117} {"train_loss": -23.715092164924346, "global_step": 175793, "epoch": 2117, "val_loss": 6557044.0} {"train_loss": -23.060474395751953, "global_step": 175794, "epoch": 2118} {"train_loss": -21.5800724029541, "global_step": 175795, "epoch": 2118} {"train_loss": -23.540830612182617, "global_step": 175796, "epoch": 2118} {"train_loss": -22.73625946044922, "global_step": 175797, "epoch": 2118} {"train_loss": -23.35620880126953, "global_step": 175798, "epoch": 2118} {"train_loss": -23.047780990600586, "global_step": 175799, "epoch": 2118} {"train_loss": -23.30454444885254, "global_step": 175800, "epoch": 2118} {"train_loss": -23.586917877197266, "global_step": 175801, "epoch": 2118} {"train_loss": -23.153335571289062, "global_step": 175802, "epoch": 2118} {"train_loss": -22.929975509643555, "global_step": 175803, "epoch": 2118} {"train_loss": -23.0970401763916, "global_step": 175804, "epoch": 2118} {"train_loss": -23.3530330657959, "global_step": 175805, "epoch": 2118} {"train_loss": -23.2563533782959, "global_step": 175806, "epoch": 2118} {"train_loss": -23.007736206054688, "global_step": 175807, "epoch": 2118} {"train_loss": -23.479537963867188, "global_step": 175808, "epoch": 2118} {"train_loss": -23.125415802001953, "global_step": 175809, "epoch": 2118} {"train_loss": -23.251840591430664, "global_step": 175810, "epoch": 2118} {"train_loss": -23.34987449645996, "global_step": 175811, "epoch": 2118} {"train_loss": -23.410266876220703, "global_step": 175812, "epoch": 2118} {"train_loss": -23.482370376586914, "global_step": 175813, "epoch": 2118} {"train_loss": -23.434804916381836, "global_step": 175814, "epoch": 2118} {"train_loss": -23.358442306518555, "global_step": 175815, "epoch": 2118} {"train_loss": -23.62998390197754, "global_step": 175816, "epoch": 2118} {"train_loss": -23.782377243041992, "global_step": 175817, "epoch": 2118} {"train_loss": -23.672534942626953, "global_step": 175818, "epoch": 2118} {"train_loss": -23.60651969909668, "global_step": 175819, "epoch": 2118} {"train_loss": -23.986597061157227, "global_step": 175820, "epoch": 2118} {"train_loss": -23.78603172302246, "global_step": 175821, "epoch": 2118} {"train_loss": -23.761444091796875, "global_step": 175822, "epoch": 2118} {"train_loss": -23.723575592041016, "global_step": 175823, "epoch": 2118} {"train_loss": -23.877010345458984, "global_step": 175824, "epoch": 2118} {"train_loss": -23.676727294921875, "global_step": 175825, "epoch": 2118} {"train_loss": -23.911666870117188, "global_step": 175826, "epoch": 2118} {"train_loss": -23.689062118530273, "global_step": 175827, "epoch": 2118} {"train_loss": -23.633777618408203, "global_step": 175828, "epoch": 2118} {"train_loss": -24.04183006286621, "global_step": 175829, "epoch": 2118} {"train_loss": -23.972408294677734, "global_step": 175830, "epoch": 2118} {"train_loss": -23.681102752685547, "global_step": 175831, "epoch": 2118} {"train_loss": -24.041128158569336, "global_step": 175832, "epoch": 2118} {"train_loss": -24.116464614868164, "global_step": 175833, "epoch": 2118} {"train_loss": -23.581035614013672, "global_step": 175834, "epoch": 2118} {"train_loss": -23.683698654174805, "global_step": 175835, "epoch": 2118} {"train_loss": -24.114604949951172, "global_step": 175836, "epoch": 2118} {"train_loss": -23.969621658325195, "global_step": 175837, "epoch": 2118} {"train_loss": -23.693361282348633, "global_step": 175838, "epoch": 2118} {"train_loss": -24.081268310546875, "global_step": 175839, "epoch": 2118} {"train_loss": -23.71870994567871, "global_step": 175840, "epoch": 2118} {"train_loss": -24.060354232788086, "global_step": 175841, "epoch": 2118} {"train_loss": -24.148895263671875, "global_step": 175842, "epoch": 2118} {"train_loss": -23.8861083984375, "global_step": 175843, "epoch": 2118} {"train_loss": -23.999814987182617, "global_step": 175844, "epoch": 2118} {"train_loss": -23.84536361694336, "global_step": 175845, "epoch": 2118} {"train_loss": -23.97933006286621, "global_step": 175846, "epoch": 2118} {"train_loss": -23.894582748413086, "global_step": 175847, "epoch": 2118} {"train_loss": -23.950031280517578, "global_step": 175848, "epoch": 2118} {"train_loss": -23.765621185302734, "global_step": 175849, "epoch": 2118} {"train_loss": -23.815921783447266, "global_step": 175850, "epoch": 2118} {"train_loss": -23.849414825439453, "global_step": 175851, "epoch": 2118} {"train_loss": -23.925378799438477, "global_step": 175852, "epoch": 2118} {"train_loss": -23.490636825561523, "global_step": 175853, "epoch": 2118} {"train_loss": -23.872682571411133, "global_step": 175854, "epoch": 2118} {"train_loss": -24.17664909362793, "global_step": 175855, "epoch": 2118} {"train_loss": -24.11481285095215, "global_step": 175856, "epoch": 2118} {"train_loss": -23.405088424682617, "global_step": 175857, "epoch": 2118} {"train_loss": -23.74180030822754, "global_step": 175858, "epoch": 2118} {"train_loss": -23.595380783081055, "global_step": 175859, "epoch": 2118} {"train_loss": -23.663244247436523, "global_step": 175860, "epoch": 2118} {"train_loss": -23.84456443786621, "global_step": 175861, "epoch": 2118} {"train_loss": -23.875608444213867, "global_step": 175862, "epoch": 2118} {"train_loss": -23.832778930664062, "global_step": 175863, "epoch": 2118} {"train_loss": -24.049245834350586, "global_step": 175864, "epoch": 2118} {"train_loss": -23.866331100463867, "global_step": 175865, "epoch": 2118} {"train_loss": -23.635723114013672, "global_step": 175866, "epoch": 2118} {"train_loss": -23.779882431030273, "global_step": 175867, "epoch": 2118} {"train_loss": -23.837188720703125, "global_step": 175868, "epoch": 2118} {"train_loss": -23.503076553344727, "global_step": 175869, "epoch": 2118} {"train_loss": -23.7359561920166, "global_step": 175870, "epoch": 2118} {"train_loss": -23.919355392456055, "global_step": 175871, "epoch": 2118} {"train_loss": -23.889081954956055, "global_step": 175872, "epoch": 2118} {"train_loss": -24.043519973754883, "global_step": 175873, "epoch": 2118} {"train_loss": -23.694639205932617, "global_step": 175874, "epoch": 2118} {"train_loss": -23.91315269470215, "global_step": 175875, "epoch": 2118} {"train_loss": -23.668590361813465, "global_step": 175876, "epoch": 2118, "val_loss": 6460628.0} {"train_loss": -23.490779876708984, "global_step": 175877, "epoch": 2119} {"train_loss": -23.531707763671875, "global_step": 175878, "epoch": 2119} {"train_loss": -23.299528121948242, "global_step": 175879, "epoch": 2119} {"train_loss": -23.046689987182617, "global_step": 175880, "epoch": 2119} {"train_loss": -23.339752197265625, "global_step": 175881, "epoch": 2119} {"train_loss": -23.256542205810547, "global_step": 175882, "epoch": 2119} {"train_loss": -23.197433471679688, "global_step": 175883, "epoch": 2119} {"train_loss": -23.401304244995117, "global_step": 175884, "epoch": 2119} {"train_loss": -23.60780906677246, "global_step": 175885, "epoch": 2119} {"train_loss": -23.74101448059082, "global_step": 175886, "epoch": 2119} {"train_loss": -23.495624542236328, "global_step": 175887, "epoch": 2119} {"train_loss": -23.689655303955078, "global_step": 175888, "epoch": 2119} {"train_loss": -23.77510643005371, "global_step": 175889, "epoch": 2119} {"train_loss": -23.60274314880371, "global_step": 175890, "epoch": 2119} {"train_loss": -23.463285446166992, "global_step": 175891, "epoch": 2119} {"train_loss": -24.112478256225586, "global_step": 175892, "epoch": 2119} {"train_loss": -23.577716827392578, "global_step": 175893, "epoch": 2119} {"train_loss": -23.415603637695312, "global_step": 175894, "epoch": 2119} {"train_loss": -23.998558044433594, "global_step": 175895, "epoch": 2119} {"train_loss": -23.89667510986328, "global_step": 175896, "epoch": 2119} {"train_loss": -23.744665145874023, "global_step": 175897, "epoch": 2119} {"train_loss": -23.809370040893555, "global_step": 175898, "epoch": 2119} {"train_loss": -23.506610870361328, "global_step": 175899, "epoch": 2119} {"train_loss": -23.43814468383789, "global_step": 175900, "epoch": 2119} {"train_loss": -23.663923263549805, "global_step": 175901, "epoch": 2119} {"train_loss": -23.540374755859375, "global_step": 175902, "epoch": 2119} {"train_loss": -23.866819381713867, "global_step": 175903, "epoch": 2119} {"train_loss": -23.984384536743164, "global_step": 175904, "epoch": 2119} {"train_loss": -24.09037971496582, "global_step": 175905, "epoch": 2119} {"train_loss": -23.827173233032227, "global_step": 175906, "epoch": 2119} {"train_loss": -23.205810546875, "global_step": 175907, "epoch": 2119} {"train_loss": -23.81694793701172, "global_step": 175908, "epoch": 2119} {"train_loss": -23.92182731628418, "global_step": 175909, "epoch": 2119} {"train_loss": -23.695199966430664, "global_step": 175910, "epoch": 2119} {"train_loss": -23.403005599975586, "global_step": 175911, "epoch": 2119} {"train_loss": -23.6182804107666, "global_step": 175912, "epoch": 2119} {"train_loss": -23.88801383972168, "global_step": 175913, "epoch": 2119} {"train_loss": -23.608306884765625, "global_step": 175914, "epoch": 2119} {"train_loss": -23.980884552001953, "global_step": 175915, "epoch": 2119} {"train_loss": -24.000558853149414, "global_step": 175916, "epoch": 2119} {"train_loss": -23.902910232543945, "global_step": 175917, "epoch": 2119} {"train_loss": -23.986135482788086, "global_step": 175918, "epoch": 2119} {"train_loss": -23.864295959472656, "global_step": 175919, "epoch": 2119} {"train_loss": -23.56089210510254, "global_step": 175920, "epoch": 2119} {"train_loss": -23.750001907348633, "global_step": 175921, "epoch": 2119} {"train_loss": -23.685779571533203, "global_step": 175922, "epoch": 2119} {"train_loss": -23.714752197265625, "global_step": 175923, "epoch": 2119} {"train_loss": -23.755077362060547, "global_step": 175924, "epoch": 2119} {"train_loss": -23.543027877807617, "global_step": 175925, "epoch": 2119} {"train_loss": -24.07929039001465, "global_step": 175926, "epoch": 2119} {"train_loss": -23.87493133544922, "global_step": 175927, "epoch": 2119} {"train_loss": -23.88699722290039, "global_step": 175928, "epoch": 2119} {"train_loss": -23.371810913085938, "global_step": 175929, "epoch": 2119} {"train_loss": -23.704191207885742, "global_step": 175930, "epoch": 2119} {"train_loss": -23.78314781188965, "global_step": 175931, "epoch": 2119} {"train_loss": -23.91005516052246, "global_step": 175932, "epoch": 2119} {"train_loss": -23.79014778137207, "global_step": 175933, "epoch": 2119} {"train_loss": -23.8843936920166, "global_step": 175934, "epoch": 2119} {"train_loss": -23.683624267578125, "global_step": 175935, "epoch": 2119} {"train_loss": -23.788896560668945, "global_step": 175936, "epoch": 2119} {"train_loss": -24.01479148864746, "global_step": 175937, "epoch": 2119} {"train_loss": -23.958768844604492, "global_step": 175938, "epoch": 2119} {"train_loss": -24.077350616455078, "global_step": 175939, "epoch": 2119} {"train_loss": -24.162519454956055, "global_step": 175940, "epoch": 2119} {"train_loss": -23.821378707885742, "global_step": 175941, "epoch": 2119} {"train_loss": -23.590927124023438, "global_step": 175942, "epoch": 2119} {"train_loss": -23.538692474365234, "global_step": 175943, "epoch": 2119} {"train_loss": -23.573776245117188, "global_step": 175944, "epoch": 2119} {"train_loss": -24.057065963745117, "global_step": 175945, "epoch": 2119} {"train_loss": -23.8880672454834, "global_step": 175946, "epoch": 2119} {"train_loss": -23.902902603149414, "global_step": 175947, "epoch": 2119} {"train_loss": -23.981504440307617, "global_step": 175948, "epoch": 2119} {"train_loss": -23.836410522460938, "global_step": 175949, "epoch": 2119} {"train_loss": -23.943668365478516, "global_step": 175950, "epoch": 2119} {"train_loss": -23.98904800415039, "global_step": 175951, "epoch": 2119} {"train_loss": -24.057878494262695, "global_step": 175952, "epoch": 2119} {"train_loss": -23.9456729888916, "global_step": 175953, "epoch": 2119} {"train_loss": -23.551651000976562, "global_step": 175954, "epoch": 2119} {"train_loss": -23.81673812866211, "global_step": 175955, "epoch": 2119} {"train_loss": -24.011625289916992, "global_step": 175956, "epoch": 2119} {"train_loss": -23.423860549926758, "global_step": 175957, "epoch": 2119} {"train_loss": -23.666650772094727, "global_step": 175958, "epoch": 2119} {"train_loss": -23.709465072815675, "global_step": 175959, "epoch": 2119, "val_loss": 6465268.0} {"train_loss": -22.078031539916992, "global_step": 175960, "epoch": 2120} {"train_loss": -21.228994369506836, "global_step": 175961, "epoch": 2120} {"train_loss": -22.574499130249023, "global_step": 175962, "epoch": 2120} {"train_loss": -23.086536407470703, "global_step": 175963, "epoch": 2120} {"train_loss": -22.176666259765625, "global_step": 175964, "epoch": 2120} {"train_loss": -22.810651779174805, "global_step": 175965, "epoch": 2120} {"train_loss": -22.60529327392578, "global_step": 175966, "epoch": 2120} {"train_loss": -22.8897762298584, "global_step": 175967, "epoch": 2120} {"train_loss": -22.98767852783203, "global_step": 175968, "epoch": 2120} {"train_loss": -23.006986618041992, "global_step": 175969, "epoch": 2120} {"train_loss": -23.160642623901367, "global_step": 175970, "epoch": 2120} {"train_loss": -22.957242965698242, "global_step": 175971, "epoch": 2120} {"train_loss": -23.22467613220215, "global_step": 175972, "epoch": 2120} {"train_loss": -23.431852340698242, "global_step": 175973, "epoch": 2120} {"train_loss": -23.19581413269043, "global_step": 175974, "epoch": 2120} {"train_loss": -23.51055145263672, "global_step": 175975, "epoch": 2120} {"train_loss": -23.203563690185547, "global_step": 175976, "epoch": 2120} {"train_loss": -23.221214294433594, "global_step": 175977, "epoch": 2120} {"train_loss": -23.460763931274414, "global_step": 175978, "epoch": 2120} {"train_loss": -23.583189010620117, "global_step": 175979, "epoch": 2120} {"train_loss": -23.403278350830078, "global_step": 175980, "epoch": 2120} {"train_loss": -23.784709930419922, "global_step": 175981, "epoch": 2120} {"train_loss": -23.377994537353516, "global_step": 175982, "epoch": 2120} {"train_loss": -23.519636154174805, "global_step": 175983, "epoch": 2120} {"train_loss": -23.326337814331055, "global_step": 175984, "epoch": 2120} {"train_loss": -23.443540573120117, "global_step": 175985, "epoch": 2120} {"train_loss": -23.361433029174805, "global_step": 175986, "epoch": 2120} {"train_loss": -23.433340072631836, "global_step": 175987, "epoch": 2120} {"train_loss": -23.704025268554688, "global_step": 175988, "epoch": 2120} {"train_loss": -23.834657669067383, "global_step": 175989, "epoch": 2120} {"train_loss": -23.620773315429688, "global_step": 175990, "epoch": 2120} {"train_loss": -23.65203285217285, "global_step": 175991, "epoch": 2120} {"train_loss": -23.683349609375, "global_step": 175992, "epoch": 2120} {"train_loss": -23.642059326171875, "global_step": 175993, "epoch": 2120} {"train_loss": -23.651296615600586, "global_step": 175994, "epoch": 2120} {"train_loss": -23.949085235595703, "global_step": 175995, "epoch": 2120} {"train_loss": -23.748937606811523, "global_step": 175996, "epoch": 2120} {"train_loss": -23.747089385986328, "global_step": 175997, "epoch": 2120} {"train_loss": -23.728145599365234, "global_step": 175998, "epoch": 2120} {"train_loss": -23.835657119750977, "global_step": 175999, "epoch": 2120} {"train_loss": -23.61524772644043, "global_step": 176000, "epoch": 2120} {"train_loss": -23.820514678955078, "global_step": 176001, "epoch": 2120} {"train_loss": -23.86606788635254, "global_step": 176002, "epoch": 2120} {"train_loss": -23.89729118347168, "global_step": 176003, "epoch": 2120} {"train_loss": -23.839981079101562, "global_step": 176004, "epoch": 2120} {"train_loss": -23.82508659362793, "global_step": 176005, "epoch": 2120} {"train_loss": -24.05502700805664, "global_step": 176006, "epoch": 2120} {"train_loss": -23.235239028930664, "global_step": 176007, "epoch": 2120} {"train_loss": -23.662708282470703, "global_step": 176008, "epoch": 2120} {"train_loss": -23.91958999633789, "global_step": 176009, "epoch": 2120} {"train_loss": -23.550413131713867, "global_step": 176010, "epoch": 2120} {"train_loss": -23.699874877929688, "global_step": 176011, "epoch": 2120} {"train_loss": -23.70625114440918, "global_step": 176012, "epoch": 2120} {"train_loss": -23.408458709716797, "global_step": 176013, "epoch": 2120} {"train_loss": -23.715564727783203, "global_step": 176014, "epoch": 2120} {"train_loss": -23.651386260986328, "global_step": 176015, "epoch": 2120} {"train_loss": -23.783443450927734, "global_step": 176016, "epoch": 2120} {"train_loss": -23.873031616210938, "global_step": 176017, "epoch": 2120} {"train_loss": -23.852798461914062, "global_step": 176018, "epoch": 2120} {"train_loss": -23.773435592651367, "global_step": 176019, "epoch": 2120} {"train_loss": -23.899991989135742, "global_step": 176020, "epoch": 2120} {"train_loss": -24.054119110107422, "global_step": 176021, "epoch": 2120} {"train_loss": -23.582101821899414, "global_step": 176022, "epoch": 2120} {"train_loss": -23.807287216186523, "global_step": 176023, "epoch": 2120} {"train_loss": -23.470844268798828, "global_step": 176024, "epoch": 2120} {"train_loss": -23.76722526550293, "global_step": 176025, "epoch": 2120} {"train_loss": -24.091623306274414, "global_step": 176026, "epoch": 2120} {"train_loss": -23.988983154296875, "global_step": 176027, "epoch": 2120} {"train_loss": -23.76284408569336, "global_step": 176028, "epoch": 2120} {"train_loss": -23.97734260559082, "global_step": 176029, "epoch": 2120} {"train_loss": -24.07616424560547, "global_step": 176030, "epoch": 2120} {"train_loss": -23.84906005859375, "global_step": 176031, "epoch": 2120} {"train_loss": -23.68260383605957, "global_step": 176032, "epoch": 2120} {"train_loss": -23.630023956298828, "global_step": 176033, "epoch": 2120} {"train_loss": -23.780033111572266, "global_step": 176034, "epoch": 2120} {"train_loss": -24.03993797302246, "global_step": 176035, "epoch": 2120} {"train_loss": -23.746416091918945, "global_step": 176036, "epoch": 2120} {"train_loss": -23.56392478942871, "global_step": 176037, "epoch": 2120} {"train_loss": -24.093841552734375, "global_step": 176038, "epoch": 2120} {"train_loss": -23.82895851135254, "global_step": 176039, "epoch": 2120} {"train_loss": -23.992835998535156, "global_step": 176040, "epoch": 2120} {"train_loss": -23.856307983398438, "global_step": 176041, "epoch": 2120} {"train_loss": -23.52510436184435, "global_step": 176042, "epoch": 2120, "val_loss": 6509658.0} {"train_loss": -23.758188247680664, "global_step": 176043, "epoch": 2121} {"train_loss": -23.755237579345703, "global_step": 176044, "epoch": 2121} {"train_loss": -23.861169815063477, "global_step": 176045, "epoch": 2121} {"train_loss": -23.24265480041504, "global_step": 176046, "epoch": 2121} {"train_loss": -23.460275650024414, "global_step": 176047, "epoch": 2121} {"train_loss": -23.81415367126465, "global_step": 176048, "epoch": 2121} {"train_loss": -23.624059677124023, "global_step": 176049, "epoch": 2121} {"train_loss": -23.939586639404297, "global_step": 176050, "epoch": 2121} {"train_loss": -23.405155181884766, "global_step": 176051, "epoch": 2121} {"train_loss": -23.730188369750977, "global_step": 176052, "epoch": 2121} {"train_loss": -23.870290756225586, "global_step": 176053, "epoch": 2121} {"train_loss": -23.574142456054688, "global_step": 176054, "epoch": 2121} {"train_loss": -23.914047241210938, "global_step": 176055, "epoch": 2121} {"train_loss": -23.927188873291016, "global_step": 176056, "epoch": 2121} {"train_loss": -23.935474395751953, "global_step": 176057, "epoch": 2121} {"train_loss": -23.888944625854492, "global_step": 176058, "epoch": 2121} {"train_loss": -23.96234703063965, "global_step": 176059, "epoch": 2121} {"train_loss": -23.768299102783203, "global_step": 176060, "epoch": 2121} {"train_loss": -23.796707153320312, "global_step": 176061, "epoch": 2121} {"train_loss": -24.160499572753906, "global_step": 176062, "epoch": 2121} {"train_loss": -23.858707427978516, "global_step": 176063, "epoch": 2121} {"train_loss": -24.004247665405273, "global_step": 176064, "epoch": 2121} {"train_loss": -23.91915512084961, "global_step": 176065, "epoch": 2121} {"train_loss": -23.790645599365234, "global_step": 176066, "epoch": 2121} {"train_loss": -23.92024040222168, "global_step": 176067, "epoch": 2121} {"train_loss": -23.6408634185791, "global_step": 176068, "epoch": 2121} {"train_loss": -24.052459716796875, "global_step": 176069, "epoch": 2121} {"train_loss": -24.03822898864746, "global_step": 176070, "epoch": 2121} {"train_loss": -24.072683334350586, "global_step": 176071, "epoch": 2121} {"train_loss": -23.591575622558594, "global_step": 176072, "epoch": 2121} {"train_loss": -23.575551986694336, "global_step": 176073, "epoch": 2121} {"train_loss": -23.94554901123047, "global_step": 176074, "epoch": 2121} {"train_loss": -24.008541107177734, "global_step": 176075, "epoch": 2121} {"train_loss": -23.800870895385742, "global_step": 176076, "epoch": 2121} {"train_loss": -24.13092803955078, "global_step": 176077, "epoch": 2121} {"train_loss": -23.757116317749023, "global_step": 176078, "epoch": 2121} {"train_loss": -23.793701171875, "global_step": 176079, "epoch": 2121} {"train_loss": -24.038965225219727, "global_step": 176080, "epoch": 2121} {"train_loss": -23.512176513671875, "global_step": 176081, "epoch": 2121} {"train_loss": -23.363744735717773, "global_step": 176082, "epoch": 2121} {"train_loss": -23.87175750732422, "global_step": 176083, "epoch": 2121} {"train_loss": -24.10186195373535, "global_step": 176084, "epoch": 2121} {"train_loss": -23.90765953063965, "global_step": 176085, "epoch": 2121} {"train_loss": -24.01032829284668, "global_step": 176086, "epoch": 2121} {"train_loss": -24.02216911315918, "global_step": 176087, "epoch": 2121} {"train_loss": -23.812620162963867, "global_step": 176088, "epoch": 2121} {"train_loss": -23.594518661499023, "global_step": 176089, "epoch": 2121} {"train_loss": -23.625125885009766, "global_step": 176090, "epoch": 2121} {"train_loss": -23.927677154541016, "global_step": 176091, "epoch": 2121} {"train_loss": -23.720901489257812, "global_step": 176092, "epoch": 2121} {"train_loss": -23.631284713745117, "global_step": 176093, "epoch": 2121} {"train_loss": -24.132749557495117, "global_step": 176094, "epoch": 2121} {"train_loss": -23.894750595092773, "global_step": 176095, "epoch": 2121} {"train_loss": -24.030670166015625, "global_step": 176096, "epoch": 2121} {"train_loss": -23.684955596923828, "global_step": 176097, "epoch": 2121} {"train_loss": -23.87077522277832, "global_step": 176098, "epoch": 2121} {"train_loss": -23.739023208618164, "global_step": 176099, "epoch": 2121} {"train_loss": -23.625843048095703, "global_step": 176100, "epoch": 2121} {"train_loss": -23.947998046875, "global_step": 176101, "epoch": 2121} {"train_loss": -23.781156539916992, "global_step": 176102, "epoch": 2121} {"train_loss": -23.6925106048584, "global_step": 176103, "epoch": 2121} {"train_loss": -23.774795532226562, "global_step": 176104, "epoch": 2121} {"train_loss": -24.01961898803711, "global_step": 176105, "epoch": 2121} {"train_loss": -23.839269638061523, "global_step": 176106, "epoch": 2121} {"train_loss": -24.04214859008789, "global_step": 176107, "epoch": 2121} {"train_loss": -24.03986930847168, "global_step": 176108, "epoch": 2121} {"train_loss": -24.112674713134766, "global_step": 176109, "epoch": 2121} {"train_loss": -24.04254722595215, "global_step": 176110, "epoch": 2121} {"train_loss": -23.942546844482422, "global_step": 176111, "epoch": 2121} {"train_loss": -23.760791778564453, "global_step": 176112, "epoch": 2121} {"train_loss": -23.764863967895508, "global_step": 176113, "epoch": 2121} {"train_loss": -23.797826766967773, "global_step": 176114, "epoch": 2121} {"train_loss": -23.98164939880371, "global_step": 176115, "epoch": 2121} {"train_loss": -23.288434982299805, "global_step": 176116, "epoch": 2121} {"train_loss": -22.75071907043457, "global_step": 176117, "epoch": 2121} {"train_loss": -23.291353225708008, "global_step": 176118, "epoch": 2121} {"train_loss": -23.798357009887695, "global_step": 176119, "epoch": 2121} {"train_loss": -23.88002586364746, "global_step": 176120, "epoch": 2121} {"train_loss": -23.418338775634766, "global_step": 176121, "epoch": 2121} {"train_loss": -23.823810577392578, "global_step": 176122, "epoch": 2121} {"train_loss": -23.82461166381836, "global_step": 176123, "epoch": 2121} {"train_loss": -23.44683265686035, "global_step": 176124, "epoch": 2121} {"train_loss": -23.799198242555182, "global_step": 176125, "epoch": 2121, "val_loss": 6419838.0} {"train_loss": -22.67282485961914, "global_step": 176126, "epoch": 2122} {"train_loss": -23.265399932861328, "global_step": 176127, "epoch": 2122} {"train_loss": -23.26627540588379, "global_step": 176128, "epoch": 2122} {"train_loss": -23.178421020507812, "global_step": 176129, "epoch": 2122} {"train_loss": -23.252582550048828, "global_step": 176130, "epoch": 2122} {"train_loss": -23.1149959564209, "global_step": 176131, "epoch": 2122} {"train_loss": -22.990562438964844, "global_step": 176132, "epoch": 2122} {"train_loss": -23.23297119140625, "global_step": 176133, "epoch": 2122} {"train_loss": -23.132383346557617, "global_step": 176134, "epoch": 2122} {"train_loss": -23.16232681274414, "global_step": 176135, "epoch": 2122} {"train_loss": -23.547931671142578, "global_step": 176136, "epoch": 2122} {"train_loss": -23.388986587524414, "global_step": 176137, "epoch": 2122} {"train_loss": -23.78729248046875, "global_step": 176138, "epoch": 2122} {"train_loss": -23.26311683654785, "global_step": 176139, "epoch": 2122} {"train_loss": -23.721742630004883, "global_step": 176140, "epoch": 2122} {"train_loss": -23.845428466796875, "global_step": 176141, "epoch": 2122} {"train_loss": -23.66685676574707, "global_step": 176142, "epoch": 2122} {"train_loss": -23.472238540649414, "global_step": 176143, "epoch": 2122} {"train_loss": -23.591176986694336, "global_step": 176144, "epoch": 2122} {"train_loss": -23.678699493408203, "global_step": 176145, "epoch": 2122} {"train_loss": -23.854616165161133, "global_step": 176146, "epoch": 2122} {"train_loss": -23.447912216186523, "global_step": 176147, "epoch": 2122} {"train_loss": -23.87485694885254, "global_step": 176148, "epoch": 2122} {"train_loss": -23.76320457458496, "global_step": 176149, "epoch": 2122} {"train_loss": -23.656097412109375, "global_step": 176150, "epoch": 2122} {"train_loss": -23.8232479095459, "global_step": 176151, "epoch": 2122} {"train_loss": -23.69111442565918, "global_step": 176152, "epoch": 2122} {"train_loss": -23.37078094482422, "global_step": 176153, "epoch": 2122} {"train_loss": -23.4326171875, "global_step": 176154, "epoch": 2122} {"train_loss": -23.778247833251953, "global_step": 176155, "epoch": 2122} {"train_loss": -23.473949432373047, "global_step": 176156, "epoch": 2122} {"train_loss": -23.790088653564453, "global_step": 176157, "epoch": 2122} {"train_loss": -23.88913345336914, "global_step": 176158, "epoch": 2122} {"train_loss": -24.26557731628418, "global_step": 176159, "epoch": 2122} {"train_loss": -23.499666213989258, "global_step": 176160, "epoch": 2122} {"train_loss": -23.917325973510742, "global_step": 176161, "epoch": 2122} {"train_loss": -23.86261558532715, "global_step": 176162, "epoch": 2122} {"train_loss": -23.961238861083984, "global_step": 176163, "epoch": 2122} {"train_loss": -23.76021957397461, "global_step": 176164, "epoch": 2122} {"train_loss": -23.96792221069336, "global_step": 176165, "epoch": 2122} {"train_loss": -23.921405792236328, "global_step": 176166, "epoch": 2122} {"train_loss": -24.12143325805664, "global_step": 176167, "epoch": 2122} {"train_loss": -23.666669845581055, "global_step": 176168, "epoch": 2122} {"train_loss": -23.86669921875, "global_step": 176169, "epoch": 2122} {"train_loss": -23.681045532226562, "global_step": 176170, "epoch": 2122} {"train_loss": -23.993452072143555, "global_step": 176171, "epoch": 2122} {"train_loss": -24.211214065551758, "global_step": 176172, "epoch": 2122} {"train_loss": -23.770462036132812, "global_step": 176173, "epoch": 2122} {"train_loss": -23.893665313720703, "global_step": 176174, "epoch": 2122} {"train_loss": -24.476415634155273, "global_step": 176175, "epoch": 2122} {"train_loss": -24.01106071472168, "global_step": 176176, "epoch": 2122} {"train_loss": -23.71600914001465, "global_step": 176177, "epoch": 2122} {"train_loss": -23.346908569335938, "global_step": 176178, "epoch": 2122} {"train_loss": -23.802955627441406, "global_step": 176179, "epoch": 2122} {"train_loss": -23.431623458862305, "global_step": 176180, "epoch": 2122} {"train_loss": -23.683223724365234, "global_step": 176181, "epoch": 2122} {"train_loss": -23.582046508789062, "global_step": 176182, "epoch": 2122} {"train_loss": -23.749486923217773, "global_step": 176183, "epoch": 2122} {"train_loss": -24.00721549987793, "global_step": 176184, "epoch": 2122} {"train_loss": -24.05933952331543, "global_step": 176185, "epoch": 2122} {"train_loss": -23.670927047729492, "global_step": 176186, "epoch": 2122} {"train_loss": -23.94456672668457, "global_step": 176187, "epoch": 2122} {"train_loss": -24.017120361328125, "global_step": 176188, "epoch": 2122} {"train_loss": -23.999740600585938, "global_step": 176189, "epoch": 2122} {"train_loss": -24.168537139892578, "global_step": 176190, "epoch": 2122} {"train_loss": -23.671966552734375, "global_step": 176191, "epoch": 2122} {"train_loss": -24.054304122924805, "global_step": 176192, "epoch": 2122} {"train_loss": -23.794906616210938, "global_step": 176193, "epoch": 2122} {"train_loss": -24.140893936157227, "global_step": 176194, "epoch": 2122} {"train_loss": -23.678152084350586, "global_step": 176195, "epoch": 2122} {"train_loss": -23.65704917907715, "global_step": 176196, "epoch": 2122} {"train_loss": -23.453266143798828, "global_step": 176197, "epoch": 2122} {"train_loss": -23.8139705657959, "global_step": 176198, "epoch": 2122} {"train_loss": -23.697834014892578, "global_step": 176199, "epoch": 2122} {"train_loss": -24.12015724182129, "global_step": 176200, "epoch": 2122} {"train_loss": -23.889041900634766, "global_step": 176201, "epoch": 2122} {"train_loss": -24.1008358001709, "global_step": 176202, "epoch": 2122} {"train_loss": -23.728759765625, "global_step": 176203, "epoch": 2122} {"train_loss": -23.741687774658203, "global_step": 176204, "epoch": 2122} {"train_loss": -23.839946746826172, "global_step": 176205, "epoch": 2122} {"train_loss": -23.613943099975586, "global_step": 176206, "epoch": 2122} {"train_loss": -23.756345748901367, "global_step": 176207, "epoch": 2122} {"train_loss": -23.72010005813047, "global_step": 176208, "epoch": 2122, "val_loss": 6519747.5} {"train_loss": -23.443252563476562, "global_step": 176209, "epoch": 2123} {"train_loss": -23.246625900268555, "global_step": 176210, "epoch": 2123} {"train_loss": -23.06272315979004, "global_step": 176211, "epoch": 2123} {"train_loss": -23.28067970275879, "global_step": 176212, "epoch": 2123} {"train_loss": -23.186368942260742, "global_step": 176213, "epoch": 2123} {"train_loss": -23.62789535522461, "global_step": 176214, "epoch": 2123} {"train_loss": -23.030813217163086, "global_step": 176215, "epoch": 2123} {"train_loss": -23.46192169189453, "global_step": 176216, "epoch": 2123} {"train_loss": -23.83440399169922, "global_step": 176217, "epoch": 2123} {"train_loss": -23.398202896118164, "global_step": 176218, "epoch": 2123} {"train_loss": -23.518293380737305, "global_step": 176219, "epoch": 2123} {"train_loss": -23.827789306640625, "global_step": 176220, "epoch": 2123} {"train_loss": -23.39434814453125, "global_step": 176221, "epoch": 2123} {"train_loss": -24.10825538635254, "global_step": 176222, "epoch": 2123} {"train_loss": -23.470355987548828, "global_step": 176223, "epoch": 2123} {"train_loss": -23.74941062927246, "global_step": 176224, "epoch": 2123} {"train_loss": -23.516080856323242, "global_step": 176225, "epoch": 2123} {"train_loss": -23.38654136657715, "global_step": 176226, "epoch": 2123} {"train_loss": -23.50080680847168, "global_step": 176227, "epoch": 2123} {"train_loss": -23.2133731842041, "global_step": 176228, "epoch": 2123} {"train_loss": -23.980527877807617, "global_step": 176229, "epoch": 2123} {"train_loss": -23.659698486328125, "global_step": 176230, "epoch": 2123} {"train_loss": -23.676223754882812, "global_step": 176231, "epoch": 2123} {"train_loss": -23.971969604492188, "global_step": 176232, "epoch": 2123} {"train_loss": -23.370845794677734, "global_step": 176233, "epoch": 2123} {"train_loss": -23.57557487487793, "global_step": 176234, "epoch": 2123} {"train_loss": -23.45015525817871, "global_step": 176235, "epoch": 2123} {"train_loss": -23.885393142700195, "global_step": 176236, "epoch": 2123} {"train_loss": -23.593656539916992, "global_step": 176237, "epoch": 2123} {"train_loss": -23.949607849121094, "global_step": 176238, "epoch": 2123} {"train_loss": -23.454620361328125, "global_step": 176239, "epoch": 2123} {"train_loss": -23.512447357177734, "global_step": 176240, "epoch": 2123} {"train_loss": -23.750150680541992, "global_step": 176241, "epoch": 2123} {"train_loss": -23.797910690307617, "global_step": 176242, "epoch": 2123} {"train_loss": -23.846424102783203, "global_step": 176243, "epoch": 2123} {"train_loss": -23.518850326538086, "global_step": 176244, "epoch": 2123} {"train_loss": -23.697006225585938, "global_step": 176245, "epoch": 2123} {"train_loss": -23.7004337310791, "global_step": 176246, "epoch": 2123} {"train_loss": -23.7882022857666, "global_step": 176247, "epoch": 2123} {"train_loss": -23.99934959411621, "global_step": 176248, "epoch": 2123} {"train_loss": -23.67922019958496, "global_step": 176249, "epoch": 2123} {"train_loss": -23.813213348388672, "global_step": 176250, "epoch": 2123} {"train_loss": -23.882007598876953, "global_step": 176251, "epoch": 2123} {"train_loss": -23.70442008972168, "global_step": 176252, "epoch": 2123} {"train_loss": -23.804107666015625, "global_step": 176253, "epoch": 2123} {"train_loss": -24.135406494140625, "global_step": 176254, "epoch": 2123} {"train_loss": -23.98612403869629, "global_step": 176255, "epoch": 2123} {"train_loss": -23.818035125732422, "global_step": 176256, "epoch": 2123} {"train_loss": -23.586956024169922, "global_step": 176257, "epoch": 2123} {"train_loss": -23.803979873657227, "global_step": 176258, "epoch": 2123} {"train_loss": -23.909839630126953, "global_step": 176259, "epoch": 2123} {"train_loss": -23.648313522338867, "global_step": 176260, "epoch": 2123} {"train_loss": -23.778886795043945, "global_step": 176261, "epoch": 2123} {"train_loss": -23.751895904541016, "global_step": 176262, "epoch": 2123} {"train_loss": -23.683584213256836, "global_step": 176263, "epoch": 2123} {"train_loss": -24.089611053466797, "global_step": 176264, "epoch": 2123} {"train_loss": -23.578393936157227, "global_step": 176265, "epoch": 2123} {"train_loss": -23.81397819519043, "global_step": 176266, "epoch": 2123} {"train_loss": -23.592737197875977, "global_step": 176267, "epoch": 2123} {"train_loss": -23.823923110961914, "global_step": 176268, "epoch": 2123} {"train_loss": -23.956270217895508, "global_step": 176269, "epoch": 2123} {"train_loss": -23.787750244140625, "global_step": 176270, "epoch": 2123} {"train_loss": -23.80634880065918, "global_step": 176271, "epoch": 2123} {"train_loss": -23.83253288269043, "global_step": 176272, "epoch": 2123} {"train_loss": -24.100004196166992, "global_step": 176273, "epoch": 2123} {"train_loss": -23.975727081298828, "global_step": 176274, "epoch": 2123} {"train_loss": -23.939838409423828, "global_step": 176275, "epoch": 2123} {"train_loss": -23.678726196289062, "global_step": 176276, "epoch": 2123} {"train_loss": -23.85313606262207, "global_step": 176277, "epoch": 2123} {"train_loss": -23.816905975341797, "global_step": 176278, "epoch": 2123} {"train_loss": -23.59783363342285, "global_step": 176279, "epoch": 2123} {"train_loss": -23.75396728515625, "global_step": 176280, "epoch": 2123} {"train_loss": -24.331228256225586, "global_step": 176281, "epoch": 2123} {"train_loss": -23.60115623474121, "global_step": 176282, "epoch": 2123} {"train_loss": -23.621063232421875, "global_step": 176283, "epoch": 2123} {"train_loss": -23.34073829650879, "global_step": 176284, "epoch": 2123} {"train_loss": -24.072622299194336, "global_step": 176285, "epoch": 2123} {"train_loss": -23.59988021850586, "global_step": 176286, "epoch": 2123} {"train_loss": -23.713367462158203, "global_step": 176287, "epoch": 2123} {"train_loss": -23.6538143157959, "global_step": 176288, "epoch": 2123} {"train_loss": -23.98374366760254, "global_step": 176289, "epoch": 2123} {"train_loss": -23.621095657348633, "global_step": 176290, "epoch": 2123} {"train_loss": -23.694756496383484, "global_step": 176291, "epoch": 2123, "val_loss": 6321490.0} {"train_loss": -23.27699851989746, "global_step": 176292, "epoch": 2124} {"train_loss": -23.22783851623535, "global_step": 176293, "epoch": 2124} {"train_loss": -23.66419792175293, "global_step": 176294, "epoch": 2124} {"train_loss": -23.407421112060547, "global_step": 176295, "epoch": 2124} {"train_loss": -23.782934188842773, "global_step": 176296, "epoch": 2124} {"train_loss": -23.575233459472656, "global_step": 176297, "epoch": 2124} {"train_loss": -23.552274703979492, "global_step": 176298, "epoch": 2124} {"train_loss": -23.231760025024414, "global_step": 176299, "epoch": 2124} {"train_loss": -23.580509185791016, "global_step": 176300, "epoch": 2124} {"train_loss": -23.844125747680664, "global_step": 176301, "epoch": 2124} {"train_loss": -23.79891014099121, "global_step": 176302, "epoch": 2124} {"train_loss": -23.19515037536621, "global_step": 176303, "epoch": 2124} {"train_loss": -23.462690353393555, "global_step": 176304, "epoch": 2124} {"train_loss": -23.604000091552734, "global_step": 176305, "epoch": 2124} {"train_loss": -23.577932357788086, "global_step": 176306, "epoch": 2124} {"train_loss": -23.744176864624023, "global_step": 176307, "epoch": 2124} {"train_loss": -23.677696228027344, "global_step": 176308, "epoch": 2124} {"train_loss": -23.494173049926758, "global_step": 176309, "epoch": 2124} {"train_loss": -23.542375564575195, "global_step": 176310, "epoch": 2124} {"train_loss": -23.605201721191406, "global_step": 176311, "epoch": 2124} {"train_loss": -23.467588424682617, "global_step": 176312, "epoch": 2124} {"train_loss": -23.8502197265625, "global_step": 176313, "epoch": 2124} {"train_loss": -23.53445816040039, "global_step": 176314, "epoch": 2124} {"train_loss": -23.846899032592773, "global_step": 176315, "epoch": 2124} {"train_loss": -23.525190353393555, "global_step": 176316, "epoch": 2124} {"train_loss": -23.640905380249023, "global_step": 176317, "epoch": 2124} {"train_loss": -23.686166763305664, "global_step": 176318, "epoch": 2124} {"train_loss": -23.7442626953125, "global_step": 176319, "epoch": 2124} {"train_loss": -23.80525016784668, "global_step": 176320, "epoch": 2124} {"train_loss": -24.136226654052734, "global_step": 176321, "epoch": 2124} {"train_loss": -23.427404403686523, "global_step": 176322, "epoch": 2124} {"train_loss": -23.99641227722168, "global_step": 176323, "epoch": 2124} {"train_loss": -24.1270751953125, "global_step": 176324, "epoch": 2124} {"train_loss": -23.921300888061523, "global_step": 176325, "epoch": 2124} {"train_loss": -23.618478775024414, "global_step": 176326, "epoch": 2124} {"train_loss": -24.009550094604492, "global_step": 176327, "epoch": 2124} {"train_loss": -24.361249923706055, "global_step": 176328, "epoch": 2124} {"train_loss": -23.74417495727539, "global_step": 176329, "epoch": 2124} {"train_loss": -23.727447509765625, "global_step": 176330, "epoch": 2124} {"train_loss": -24.179861068725586, "global_step": 176331, "epoch": 2124} {"train_loss": -24.192861557006836, "global_step": 176332, "epoch": 2124} {"train_loss": -24.038625717163086, "global_step": 176333, "epoch": 2124} {"train_loss": -24.1147518157959, "global_step": 176334, "epoch": 2124} {"train_loss": -24.243101119995117, "global_step": 176335, "epoch": 2124} {"train_loss": -24.171178817749023, "global_step": 176336, "epoch": 2124} {"train_loss": -24.023786544799805, "global_step": 176337, "epoch": 2124} {"train_loss": -23.802947998046875, "global_step": 176338, "epoch": 2124} {"train_loss": -23.940059661865234, "global_step": 176339, "epoch": 2124} {"train_loss": -23.606287002563477, "global_step": 176340, "epoch": 2124} {"train_loss": -23.466344833374023, "global_step": 176341, "epoch": 2124} {"train_loss": -23.68678855895996, "global_step": 176342, "epoch": 2124} {"train_loss": -23.72785758972168, "global_step": 176343, "epoch": 2124} {"train_loss": -24.038816452026367, "global_step": 176344, "epoch": 2124} {"train_loss": -23.816177368164062, "global_step": 176345, "epoch": 2124} {"train_loss": -23.447649002075195, "global_step": 176346, "epoch": 2124} {"train_loss": -23.59699058532715, "global_step": 176347, "epoch": 2124} {"train_loss": -23.048404693603516, "global_step": 176348, "epoch": 2124} {"train_loss": -23.68385124206543, "global_step": 176349, "epoch": 2124} {"train_loss": -23.389707565307617, "global_step": 176350, "epoch": 2124} {"train_loss": -23.89042091369629, "global_step": 176351, "epoch": 2124} {"train_loss": -23.76701545715332, "global_step": 176352, "epoch": 2124} {"train_loss": -23.54009246826172, "global_step": 176353, "epoch": 2124} {"train_loss": -23.620630264282227, "global_step": 176354, "epoch": 2124} {"train_loss": -23.72797203063965, "global_step": 176355, "epoch": 2124} {"train_loss": -23.4169979095459, "global_step": 176356, "epoch": 2124} {"train_loss": -23.85640525817871, "global_step": 176357, "epoch": 2124} {"train_loss": -23.932044982910156, "global_step": 176358, "epoch": 2124} {"train_loss": -23.90418243408203, "global_step": 176359, "epoch": 2124} {"train_loss": -24.0274600982666, "global_step": 176360, "epoch": 2124} {"train_loss": -23.829299926757812, "global_step": 176361, "epoch": 2124} {"train_loss": -23.421958923339844, "global_step": 176362, "epoch": 2124} {"train_loss": -23.73084831237793, "global_step": 176363, "epoch": 2124} {"train_loss": -24.149381637573242, "global_step": 176364, "epoch": 2124} {"train_loss": -23.996274948120117, "global_step": 176365, "epoch": 2124} {"train_loss": -23.63360023498535, "global_step": 176366, "epoch": 2124} {"train_loss": -24.008968353271484, "global_step": 176367, "epoch": 2124} {"train_loss": -23.925649642944336, "global_step": 176368, "epoch": 2124} {"train_loss": -24.022991180419922, "global_step": 176369, "epoch": 2124} {"train_loss": -23.943084716796875, "global_step": 176370, "epoch": 2124} {"train_loss": -23.69339942932129, "global_step": 176371, "epoch": 2124} {"train_loss": -23.76995086669922, "global_step": 176372, "epoch": 2124} {"train_loss": -24.01390266418457, "global_step": 176373, "epoch": 2124} {"train_loss": -23.74539320152926, "global_step": 176374, "epoch": 2124, "val_loss": 6401930.0} {"train_loss": -23.963470458984375, "global_step": 176375, "epoch": 2125} {"train_loss": -23.461706161499023, "global_step": 176376, "epoch": 2125} {"train_loss": -23.982412338256836, "global_step": 176377, "epoch": 2125} {"train_loss": -23.85116195678711, "global_step": 176378, "epoch": 2125} {"train_loss": -23.687820434570312, "global_step": 176379, "epoch": 2125} {"train_loss": -23.6044979095459, "global_step": 176380, "epoch": 2125} {"train_loss": -23.789878845214844, "global_step": 176381, "epoch": 2125} {"train_loss": -24.042858123779297, "global_step": 176382, "epoch": 2125} {"train_loss": -23.81168556213379, "global_step": 176383, "epoch": 2125} {"train_loss": -23.429208755493164, "global_step": 176384, "epoch": 2125} {"train_loss": -24.14631462097168, "global_step": 176385, "epoch": 2125} {"train_loss": -23.43971824645996, "global_step": 176386, "epoch": 2125} {"train_loss": -23.90242576599121, "global_step": 176387, "epoch": 2125} {"train_loss": -23.696725845336914, "global_step": 176388, "epoch": 2125} {"train_loss": -24.14249610900879, "global_step": 176389, "epoch": 2125} {"train_loss": -23.78804588317871, "global_step": 176390, "epoch": 2125} {"train_loss": -23.8387451171875, "global_step": 176391, "epoch": 2125} {"train_loss": -23.923852920532227, "global_step": 176392, "epoch": 2125} {"train_loss": -23.90216636657715, "global_step": 176393, "epoch": 2125} {"train_loss": -23.960647583007812, "global_step": 176394, "epoch": 2125} {"train_loss": -23.673416137695312, "global_step": 176395, "epoch": 2125} {"train_loss": -23.9830322265625, "global_step": 176396, "epoch": 2125} {"train_loss": -23.75130844116211, "global_step": 176397, "epoch": 2125} {"train_loss": -23.5234317779541, "global_step": 176398, "epoch": 2125} {"train_loss": -24.014278411865234, "global_step": 176399, "epoch": 2125} {"train_loss": -23.66604995727539, "global_step": 176400, "epoch": 2125} {"train_loss": -23.81988525390625, "global_step": 176401, "epoch": 2125} {"train_loss": -23.241374969482422, "global_step": 176402, "epoch": 2125} {"train_loss": -23.26409912109375, "global_step": 176403, "epoch": 2125} {"train_loss": -23.85032081604004, "global_step": 176404, "epoch": 2125} {"train_loss": -23.94081687927246, "global_step": 176405, "epoch": 2125} {"train_loss": -23.607786178588867, "global_step": 176406, "epoch": 2125} {"train_loss": -23.327316284179688, "global_step": 176407, "epoch": 2125} {"train_loss": -23.507736206054688, "global_step": 176408, "epoch": 2125} {"train_loss": -23.681486129760742, "global_step": 176409, "epoch": 2125} {"train_loss": -23.86249351501465, "global_step": 176410, "epoch": 2125} {"train_loss": -24.03181266784668, "global_step": 176411, "epoch": 2125} {"train_loss": -23.79547882080078, "global_step": 176412, "epoch": 2125} {"train_loss": -23.683530807495117, "global_step": 176413, "epoch": 2125} {"train_loss": -23.87775230407715, "global_step": 176414, "epoch": 2125} {"train_loss": -23.622032165527344, "global_step": 176415, "epoch": 2125} {"train_loss": -23.853239059448242, "global_step": 176416, "epoch": 2125} {"train_loss": -23.568082809448242, "global_step": 176417, "epoch": 2125} {"train_loss": -23.854257583618164, "global_step": 176418, "epoch": 2125} {"train_loss": -23.990354537963867, "global_step": 176419, "epoch": 2125} {"train_loss": -23.875152587890625, "global_step": 176420, "epoch": 2125} {"train_loss": -23.73590660095215, "global_step": 176421, "epoch": 2125} {"train_loss": -24.139575958251953, "global_step": 176422, "epoch": 2125} {"train_loss": -24.061681747436523, "global_step": 176423, "epoch": 2125} {"train_loss": -23.51350975036621, "global_step": 176424, "epoch": 2125} {"train_loss": -24.052621841430664, "global_step": 176425, "epoch": 2125} {"train_loss": -23.8515625, "global_step": 176426, "epoch": 2125} {"train_loss": -24.099342346191406, "global_step": 176427, "epoch": 2125} {"train_loss": -23.8974666595459, "global_step": 176428, "epoch": 2125} {"train_loss": -23.85690689086914, "global_step": 176429, "epoch": 2125} {"train_loss": -24.084209442138672, "global_step": 176430, "epoch": 2125} {"train_loss": -23.91470718383789, "global_step": 176431, "epoch": 2125} {"train_loss": -24.369508743286133, "global_step": 176432, "epoch": 2125} {"train_loss": -24.14156150817871, "global_step": 176433, "epoch": 2125} {"train_loss": -23.624826431274414, "global_step": 176434, "epoch": 2125} {"train_loss": -23.669126510620117, "global_step": 176435, "epoch": 2125} {"train_loss": -23.871246337890625, "global_step": 176436, "epoch": 2125} {"train_loss": -23.705488204956055, "global_step": 176437, "epoch": 2125} {"train_loss": -23.98870277404785, "global_step": 176438, "epoch": 2125} {"train_loss": -24.014209747314453, "global_step": 176439, "epoch": 2125} {"train_loss": -23.909692764282227, "global_step": 176440, "epoch": 2125} {"train_loss": -23.707592010498047, "global_step": 176441, "epoch": 2125} {"train_loss": -24.085660934448242, "global_step": 176442, "epoch": 2125} {"train_loss": -23.743032455444336, "global_step": 176443, "epoch": 2125} {"train_loss": -23.673871994018555, "global_step": 176444, "epoch": 2125} {"train_loss": -23.5676212310791, "global_step": 176445, "epoch": 2125} {"train_loss": -23.754728317260742, "global_step": 176446, "epoch": 2125} {"train_loss": -23.9299373626709, "global_step": 176447, "epoch": 2125} {"train_loss": -23.694869995117188, "global_step": 176448, "epoch": 2125} {"train_loss": -24.08115577697754, "global_step": 176449, "epoch": 2125} {"train_loss": -23.831113815307617, "global_step": 176450, "epoch": 2125} {"train_loss": -23.566585540771484, "global_step": 176451, "epoch": 2125} {"train_loss": -23.843929290771484, "global_step": 176452, "epoch": 2125} {"train_loss": -24.371185302734375, "global_step": 176453, "epoch": 2125} {"train_loss": -23.57993507385254, "global_step": 176454, "epoch": 2125} {"train_loss": -23.978322982788086, "global_step": 176455, "epoch": 2125} {"train_loss": -23.84206199645996, "global_step": 176456, "epoch": 2125} {"train_loss": -23.807817688907484, "global_step": 176457, "epoch": 2125, "val_loss": 6420934.0} {"train_loss": -23.42536735534668, "global_step": 176458, "epoch": 2126} {"train_loss": -22.867103576660156, "global_step": 176459, "epoch": 2126} {"train_loss": -23.619733810424805, "global_step": 176460, "epoch": 2126} {"train_loss": -22.785736083984375, "global_step": 176461, "epoch": 2126} {"train_loss": -23.41602897644043, "global_step": 176462, "epoch": 2126} {"train_loss": -23.106687545776367, "global_step": 176463, "epoch": 2126} {"train_loss": -23.256101608276367, "global_step": 176464, "epoch": 2126} {"train_loss": -23.542673110961914, "global_step": 176465, "epoch": 2126} {"train_loss": -23.66181755065918, "global_step": 176466, "epoch": 2126} {"train_loss": -23.590274810791016, "global_step": 176467, "epoch": 2126} {"train_loss": -23.366958618164062, "global_step": 176468, "epoch": 2126} {"train_loss": -23.539335250854492, "global_step": 176469, "epoch": 2126} {"train_loss": -23.58475685119629, "global_step": 176470, "epoch": 2126} {"train_loss": -22.913908004760742, "global_step": 176471, "epoch": 2126} {"train_loss": -23.684629440307617, "global_step": 176472, "epoch": 2126} {"train_loss": -23.562101364135742, "global_step": 176473, "epoch": 2126} {"train_loss": -23.556821823120117, "global_step": 176474, "epoch": 2126} {"train_loss": -23.19585418701172, "global_step": 176475, "epoch": 2126} {"train_loss": -23.492769241333008, "global_step": 176476, "epoch": 2126} {"train_loss": -23.699966430664062, "global_step": 176477, "epoch": 2126} {"train_loss": -24.116649627685547, "global_step": 176478, "epoch": 2126} {"train_loss": -23.936521530151367, "global_step": 176479, "epoch": 2126} {"train_loss": -23.685443878173828, "global_step": 176480, "epoch": 2126} {"train_loss": -23.974435806274414, "global_step": 176481, "epoch": 2126} {"train_loss": -24.258068084716797, "global_step": 176482, "epoch": 2126} {"train_loss": -23.921951293945312, "global_step": 176483, "epoch": 2126} {"train_loss": -23.72092056274414, "global_step": 176484, "epoch": 2126} {"train_loss": -24.09334373474121, "global_step": 176485, "epoch": 2126} {"train_loss": -23.82981300354004, "global_step": 176486, "epoch": 2126} {"train_loss": -23.72813606262207, "global_step": 176487, "epoch": 2126} {"train_loss": -23.72415542602539, "global_step": 176488, "epoch": 2126} {"train_loss": -23.840524673461914, "global_step": 176489, "epoch": 2126} {"train_loss": -23.9030704498291, "global_step": 176490, "epoch": 2126} {"train_loss": -23.736059188842773, "global_step": 176491, "epoch": 2126} {"train_loss": -23.69954490661621, "global_step": 176492, "epoch": 2126} {"train_loss": -24.163293838500977, "global_step": 176493, "epoch": 2126} {"train_loss": -23.79371452331543, "global_step": 176494, "epoch": 2126} {"train_loss": -23.772098541259766, "global_step": 176495, "epoch": 2126} {"train_loss": -23.78668212890625, "global_step": 176496, "epoch": 2126} {"train_loss": -23.828142166137695, "global_step": 176497, "epoch": 2126} {"train_loss": -24.05689811706543, "global_step": 176498, "epoch": 2126} {"train_loss": -23.958698272705078, "global_step": 176499, "epoch": 2126} {"train_loss": -23.950103759765625, "global_step": 176500, "epoch": 2126} {"train_loss": -24.243417739868164, "global_step": 176501, "epoch": 2126} {"train_loss": -23.89801597595215, "global_step": 176502, "epoch": 2126} {"train_loss": -23.694934844970703, "global_step": 176503, "epoch": 2126} {"train_loss": -23.81641960144043, "global_step": 176504, "epoch": 2126} {"train_loss": -23.58631706237793, "global_step": 176505, "epoch": 2126} {"train_loss": -24.06658363342285, "global_step": 176506, "epoch": 2126} {"train_loss": -23.739059448242188, "global_step": 176507, "epoch": 2126} {"train_loss": -23.942426681518555, "global_step": 176508, "epoch": 2126} {"train_loss": -24.161319732666016, "global_step": 176509, "epoch": 2126} {"train_loss": -23.703821182250977, "global_step": 176510, "epoch": 2126} {"train_loss": -23.777847290039062, "global_step": 176511, "epoch": 2126} {"train_loss": -24.043766021728516, "global_step": 176512, "epoch": 2126} {"train_loss": -24.085233688354492, "global_step": 176513, "epoch": 2126} {"train_loss": -24.02925682067871, "global_step": 176514, "epoch": 2126} {"train_loss": -24.07049560546875, "global_step": 176515, "epoch": 2126} {"train_loss": -24.06569480895996, "global_step": 176516, "epoch": 2126} {"train_loss": -23.78364372253418, "global_step": 176517, "epoch": 2126} {"train_loss": -24.01104164123535, "global_step": 176518, "epoch": 2126} {"train_loss": -23.93648338317871, "global_step": 176519, "epoch": 2126} {"train_loss": -23.94281768798828, "global_step": 176520, "epoch": 2126} {"train_loss": -23.49102210998535, "global_step": 176521, "epoch": 2126} {"train_loss": -23.887012481689453, "global_step": 176522, "epoch": 2126} {"train_loss": -24.159414291381836, "global_step": 176523, "epoch": 2126} {"train_loss": -23.36907386779785, "global_step": 176524, "epoch": 2126} {"train_loss": -23.98991584777832, "global_step": 176525, "epoch": 2126} {"train_loss": -24.023740768432617, "global_step": 176526, "epoch": 2126} {"train_loss": -23.649255752563477, "global_step": 176527, "epoch": 2126} {"train_loss": -24.094160079956055, "global_step": 176528, "epoch": 2126} {"train_loss": -24.118894577026367, "global_step": 176529, "epoch": 2126} {"train_loss": -24.208723068237305, "global_step": 176530, "epoch": 2126} {"train_loss": -23.689437866210938, "global_step": 176531, "epoch": 2126} {"train_loss": -23.84773063659668, "global_step": 176532, "epoch": 2126} {"train_loss": -23.677162170410156, "global_step": 176533, "epoch": 2126} {"train_loss": -23.829870223999023, "global_step": 176534, "epoch": 2126} {"train_loss": -23.196252822875977, "global_step": 176535, "epoch": 2126} {"train_loss": -23.630285263061523, "global_step": 176536, "epoch": 2126} {"train_loss": -23.431379318237305, "global_step": 176537, "epoch": 2126} {"train_loss": -23.581207275390625, "global_step": 176538, "epoch": 2126} {"train_loss": -23.78480339050293, "global_step": 176539, "epoch": 2126} {"train_loss": -23.741975186819054, "global_step": 176540, "epoch": 2126, "val_loss": 6505515.0} {"train_loss": -23.427061080932617, "global_step": 176541, "epoch": 2127} {"train_loss": -23.274728775024414, "global_step": 176542, "epoch": 2127} {"train_loss": -23.247207641601562, "global_step": 176543, "epoch": 2127} {"train_loss": -23.65956687927246, "global_step": 176544, "epoch": 2127} {"train_loss": -23.707990646362305, "global_step": 176545, "epoch": 2127} {"train_loss": -24.042173385620117, "global_step": 176546, "epoch": 2127} {"train_loss": -23.63324546813965, "global_step": 176547, "epoch": 2127} {"train_loss": -23.452194213867188, "global_step": 176548, "epoch": 2127} {"train_loss": -23.845657348632812, "global_step": 176549, "epoch": 2127} {"train_loss": -23.70292854309082, "global_step": 176550, "epoch": 2127} {"train_loss": -23.838077545166016, "global_step": 176551, "epoch": 2127} {"train_loss": -23.68524169921875, "global_step": 176552, "epoch": 2127} {"train_loss": -23.702775955200195, "global_step": 176553, "epoch": 2127} {"train_loss": -23.615232467651367, "global_step": 176554, "epoch": 2127} {"train_loss": -23.853229522705078, "global_step": 176555, "epoch": 2127} {"train_loss": -23.75201416015625, "global_step": 176556, "epoch": 2127} {"train_loss": -24.107606887817383, "global_step": 176557, "epoch": 2127} {"train_loss": -23.74660873413086, "global_step": 176558, "epoch": 2127} {"train_loss": -23.765365600585938, "global_step": 176559, "epoch": 2127} {"train_loss": -23.549713134765625, "global_step": 176560, "epoch": 2127} {"train_loss": -23.901355743408203, "global_step": 176561, "epoch": 2127} {"train_loss": -23.91669273376465, "global_step": 176562, "epoch": 2127} {"train_loss": -23.727643966674805, "global_step": 176563, "epoch": 2127} {"train_loss": -24.262693405151367, "global_step": 176564, "epoch": 2127} {"train_loss": -24.29794692993164, "global_step": 176565, "epoch": 2127} {"train_loss": -24.03203773498535, "global_step": 176566, "epoch": 2127} {"train_loss": -24.149751663208008, "global_step": 176567, "epoch": 2127} {"train_loss": -23.632143020629883, "global_step": 176568, "epoch": 2127} {"train_loss": -23.922452926635742, "global_step": 176569, "epoch": 2127} {"train_loss": -23.895015716552734, "global_step": 176570, "epoch": 2127} {"train_loss": -24.25214958190918, "global_step": 176571, "epoch": 2127} {"train_loss": -23.989957809448242, "global_step": 176572, "epoch": 2127} {"train_loss": -23.746631622314453, "global_step": 176573, "epoch": 2127} {"train_loss": -23.71346664428711, "global_step": 176574, "epoch": 2127} {"train_loss": -23.76350212097168, "global_step": 176575, "epoch": 2127} {"train_loss": -23.41156578063965, "global_step": 176576, "epoch": 2127} {"train_loss": -24.097074508666992, "global_step": 176577, "epoch": 2127} {"train_loss": -23.833959579467773, "global_step": 176578, "epoch": 2127} {"train_loss": -23.93060874938965, "global_step": 176579, "epoch": 2127} {"train_loss": -23.55921745300293, "global_step": 176580, "epoch": 2127} {"train_loss": -23.842044830322266, "global_step": 176581, "epoch": 2127} {"train_loss": -23.854726791381836, "global_step": 176582, "epoch": 2127} {"train_loss": -23.912439346313477, "global_step": 176583, "epoch": 2127} {"train_loss": -23.53386688232422, "global_step": 176584, "epoch": 2127} {"train_loss": -24.0023193359375, "global_step": 176585, "epoch": 2127} {"train_loss": -24.079076766967773, "global_step": 176586, "epoch": 2127} {"train_loss": -23.877321243286133, "global_step": 176587, "epoch": 2127} {"train_loss": -23.823110580444336, "global_step": 176588, "epoch": 2127} {"train_loss": -23.379247665405273, "global_step": 176589, "epoch": 2127} {"train_loss": -23.336929321289062, "global_step": 176590, "epoch": 2127} {"train_loss": -23.428625106811523, "global_step": 176591, "epoch": 2127} {"train_loss": -23.36943817138672, "global_step": 176592, "epoch": 2127} {"train_loss": -24.134445190429688, "global_step": 176593, "epoch": 2127} {"train_loss": -23.590770721435547, "global_step": 176594, "epoch": 2127} {"train_loss": -23.926380157470703, "global_step": 176595, "epoch": 2127} {"train_loss": -23.45674705505371, "global_step": 176596, "epoch": 2127} {"train_loss": -24.02618980407715, "global_step": 176597, "epoch": 2127} {"train_loss": -23.498640060424805, "global_step": 176598, "epoch": 2127} {"train_loss": -23.43071937561035, "global_step": 176599, "epoch": 2127} {"train_loss": -23.73802375793457, "global_step": 176600, "epoch": 2127} {"train_loss": -23.482934951782227, "global_step": 176601, "epoch": 2127} {"train_loss": -23.61589813232422, "global_step": 176602, "epoch": 2127} {"train_loss": -23.627431869506836, "global_step": 176603, "epoch": 2127} {"train_loss": -23.62932777404785, "global_step": 176604, "epoch": 2127} {"train_loss": -23.970748901367188, "global_step": 176605, "epoch": 2127} {"train_loss": -23.571271896362305, "global_step": 176606, "epoch": 2127} {"train_loss": -23.386951446533203, "global_step": 176607, "epoch": 2127} {"train_loss": -23.32997703552246, "global_step": 176608, "epoch": 2127} {"train_loss": -23.67734718322754, "global_step": 176609, "epoch": 2127} {"train_loss": -23.60938835144043, "global_step": 176610, "epoch": 2127} {"train_loss": -23.55597496032715, "global_step": 176611, "epoch": 2127} {"train_loss": -24.020063400268555, "global_step": 176612, "epoch": 2127} {"train_loss": -23.564258575439453, "global_step": 176613, "epoch": 2127} {"train_loss": -23.18264389038086, "global_step": 176614, "epoch": 2127} {"train_loss": -23.567142486572266, "global_step": 176615, "epoch": 2127} {"train_loss": -24.08327293395996, "global_step": 176616, "epoch": 2127} {"train_loss": -23.8404483795166, "global_step": 176617, "epoch": 2127} {"train_loss": -23.921878814697266, "global_step": 176618, "epoch": 2127} {"train_loss": -24.054861068725586, "global_step": 176619, "epoch": 2127} {"train_loss": -23.78961753845215, "global_step": 176620, "epoch": 2127} {"train_loss": -23.588035583496094, "global_step": 176621, "epoch": 2127} {"train_loss": -24.12918472290039, "global_step": 176622, "epoch": 2127} {"train_loss": -23.748701968825007, "global_step": 176623, "epoch": 2127, "val_loss": 6415930.5} {"train_loss": -23.058141708374023, "global_step": 176624, "epoch": 2128} {"train_loss": -21.947269439697266, "global_step": 176625, "epoch": 2128} {"train_loss": -22.732816696166992, "global_step": 176626, "epoch": 2128} {"train_loss": -23.544248580932617, "global_step": 176627, "epoch": 2128} {"train_loss": -23.22827911376953, "global_step": 176628, "epoch": 2128} {"train_loss": -23.335102081298828, "global_step": 176629, "epoch": 2128} {"train_loss": -23.577991485595703, "global_step": 176630, "epoch": 2128} {"train_loss": -23.730587005615234, "global_step": 176631, "epoch": 2128} {"train_loss": -23.427770614624023, "global_step": 176632, "epoch": 2128} {"train_loss": -23.60043716430664, "global_step": 176633, "epoch": 2128} {"train_loss": -23.770429611206055, "global_step": 176634, "epoch": 2128} {"train_loss": -23.241607666015625, "global_step": 176635, "epoch": 2128} {"train_loss": -23.384475708007812, "global_step": 176636, "epoch": 2128} {"train_loss": -22.973928451538086, "global_step": 176637, "epoch": 2128} {"train_loss": -23.80732536315918, "global_step": 176638, "epoch": 2128} {"train_loss": -23.602264404296875, "global_step": 176639, "epoch": 2128} {"train_loss": -23.358776092529297, "global_step": 176640, "epoch": 2128} {"train_loss": -23.615535736083984, "global_step": 176641, "epoch": 2128} {"train_loss": -23.73567008972168, "global_step": 176642, "epoch": 2128} {"train_loss": -24.026838302612305, "global_step": 176643, "epoch": 2128} {"train_loss": -23.722883224487305, "global_step": 176644, "epoch": 2128} {"train_loss": -23.69626235961914, "global_step": 176645, "epoch": 2128} {"train_loss": -23.72532081604004, "global_step": 176646, "epoch": 2128} {"train_loss": -23.582056045532227, "global_step": 176647, "epoch": 2128} {"train_loss": -23.820348739624023, "global_step": 176648, "epoch": 2128} {"train_loss": -23.858169555664062, "global_step": 176649, "epoch": 2128} {"train_loss": -23.8563232421875, "global_step": 176650, "epoch": 2128} {"train_loss": -23.817594528198242, "global_step": 176651, "epoch": 2128} {"train_loss": -24.041488647460938, "global_step": 176652, "epoch": 2128} {"train_loss": -23.69008445739746, "global_step": 176653, "epoch": 2128} {"train_loss": -23.583158493041992, "global_step": 176654, "epoch": 2128} {"train_loss": -23.347803115844727, "global_step": 176655, "epoch": 2128} {"train_loss": -23.953495025634766, "global_step": 176656, "epoch": 2128} {"train_loss": -23.848642349243164, "global_step": 176657, "epoch": 2128} {"train_loss": -23.905136108398438, "global_step": 176658, "epoch": 2128} {"train_loss": -23.911527633666992, "global_step": 176659, "epoch": 2128} {"train_loss": -24.17776870727539, "global_step": 176660, "epoch": 2128} {"train_loss": -24.02389907836914, "global_step": 176661, "epoch": 2128} {"train_loss": -24.00178337097168, "global_step": 176662, "epoch": 2128} {"train_loss": -23.986974716186523, "global_step": 176663, "epoch": 2128} {"train_loss": -23.951215744018555, "global_step": 176664, "epoch": 2128} {"train_loss": -23.974872589111328, "global_step": 176665, "epoch": 2128} {"train_loss": -24.02815818786621, "global_step": 176666, "epoch": 2128} {"train_loss": -23.782852172851562, "global_step": 176667, "epoch": 2128} {"train_loss": -23.483863830566406, "global_step": 176668, "epoch": 2128} {"train_loss": -23.470638275146484, "global_step": 176669, "epoch": 2128} {"train_loss": -23.867759704589844, "global_step": 176670, "epoch": 2128} {"train_loss": -23.570159912109375, "global_step": 176671, "epoch": 2128} {"train_loss": -24.547636032104492, "global_step": 176672, "epoch": 2128} {"train_loss": -24.192899703979492, "global_step": 176673, "epoch": 2128} {"train_loss": -23.622482299804688, "global_step": 176674, "epoch": 2128} {"train_loss": -24.226720809936523, "global_step": 176675, "epoch": 2128} {"train_loss": -24.12849998474121, "global_step": 176676, "epoch": 2128} {"train_loss": -23.941579818725586, "global_step": 176677, "epoch": 2128} {"train_loss": -23.94847869873047, "global_step": 176678, "epoch": 2128} {"train_loss": -23.906574249267578, "global_step": 176679, "epoch": 2128} {"train_loss": -24.275358200073242, "global_step": 176680, "epoch": 2128} {"train_loss": -24.18680191040039, "global_step": 176681, "epoch": 2128} {"train_loss": -23.679428100585938, "global_step": 176682, "epoch": 2128} {"train_loss": -23.786420822143555, "global_step": 176683, "epoch": 2128} {"train_loss": -24.027992248535156, "global_step": 176684, "epoch": 2128} {"train_loss": -23.494794845581055, "global_step": 176685, "epoch": 2128} {"train_loss": -24.012781143188477, "global_step": 176686, "epoch": 2128} {"train_loss": -23.849262237548828, "global_step": 176687, "epoch": 2128} {"train_loss": -24.368261337280273, "global_step": 176688, "epoch": 2128} {"train_loss": -23.74910545349121, "global_step": 176689, "epoch": 2128} {"train_loss": -24.06978988647461, "global_step": 176690, "epoch": 2128} {"train_loss": -23.76313591003418, "global_step": 176691, "epoch": 2128} {"train_loss": -23.791902542114258, "global_step": 176692, "epoch": 2128} {"train_loss": -23.590579986572266, "global_step": 176693, "epoch": 2128} {"train_loss": -23.907148361206055, "global_step": 176694, "epoch": 2128} {"train_loss": -23.965473175048828, "global_step": 176695, "epoch": 2128} {"train_loss": -23.586368560791016, "global_step": 176696, "epoch": 2128} {"train_loss": -23.976205825805664, "global_step": 176697, "epoch": 2128} {"train_loss": -23.9697208404541, "global_step": 176698, "epoch": 2128} {"train_loss": -23.496047973632812, "global_step": 176699, "epoch": 2128} {"train_loss": -23.99262046813965, "global_step": 176700, "epoch": 2128} {"train_loss": -23.58026695251465, "global_step": 176701, "epoch": 2128} {"train_loss": -23.896207809448242, "global_step": 176702, "epoch": 2128} {"train_loss": -23.8170223236084, "global_step": 176703, "epoch": 2128} {"train_loss": -23.759626388549805, "global_step": 176704, "epoch": 2128} {"train_loss": -23.66083335876465, "global_step": 176705, "epoch": 2128} {"train_loss": -23.7534632395549, "global_step": 176706, "epoch": 2128, "val_loss": 6545662.0} {"train_loss": -23.2833194732666, "global_step": 176707, "epoch": 2129} {"train_loss": -23.114316940307617, "global_step": 176708, "epoch": 2129} {"train_loss": -23.613725662231445, "global_step": 176709, "epoch": 2129} {"train_loss": -23.373504638671875, "global_step": 176710, "epoch": 2129} {"train_loss": -23.247821807861328, "global_step": 176711, "epoch": 2129} {"train_loss": -23.101850509643555, "global_step": 176712, "epoch": 2129} {"train_loss": -23.59585189819336, "global_step": 176713, "epoch": 2129} {"train_loss": -23.3790283203125, "global_step": 176714, "epoch": 2129} {"train_loss": -23.559967041015625, "global_step": 176715, "epoch": 2129} {"train_loss": -23.829147338867188, "global_step": 176716, "epoch": 2129} {"train_loss": -23.726816177368164, "global_step": 176717, "epoch": 2129} {"train_loss": -23.751245498657227, "global_step": 176718, "epoch": 2129} {"train_loss": -23.39044761657715, "global_step": 176719, "epoch": 2129} {"train_loss": -23.58674430847168, "global_step": 176720, "epoch": 2129} {"train_loss": -23.563962936401367, "global_step": 176721, "epoch": 2129} {"train_loss": -23.7235164642334, "global_step": 176722, "epoch": 2129} {"train_loss": -23.43344497680664, "global_step": 176723, "epoch": 2129} {"train_loss": -23.398298263549805, "global_step": 176724, "epoch": 2129} {"train_loss": -23.908681869506836, "global_step": 176725, "epoch": 2129} {"train_loss": -23.839847564697266, "global_step": 176726, "epoch": 2129} {"train_loss": -23.912294387817383, "global_step": 176727, "epoch": 2129} {"train_loss": -23.47021484375, "global_step": 176728, "epoch": 2129} {"train_loss": -23.542285919189453, "global_step": 176729, "epoch": 2129} {"train_loss": -23.975549697875977, "global_step": 176730, "epoch": 2129} {"train_loss": -23.353670120239258, "global_step": 176731, "epoch": 2129} {"train_loss": -23.406024932861328, "global_step": 176732, "epoch": 2129} {"train_loss": -23.84917640686035, "global_step": 176733, "epoch": 2129} {"train_loss": -23.636625289916992, "global_step": 176734, "epoch": 2129} {"train_loss": -23.733749389648438, "global_step": 176735, "epoch": 2129} {"train_loss": -23.93695068359375, "global_step": 176736, "epoch": 2129} {"train_loss": -23.838693618774414, "global_step": 176737, "epoch": 2129} {"train_loss": -23.57659149169922, "global_step": 176738, "epoch": 2129} {"train_loss": -23.975360870361328, "global_step": 176739, "epoch": 2129} {"train_loss": -23.922361373901367, "global_step": 176740, "epoch": 2129} {"train_loss": -23.519977569580078, "global_step": 176741, "epoch": 2129} {"train_loss": -23.4464168548584, "global_step": 176742, "epoch": 2129} {"train_loss": -23.58237075805664, "global_step": 176743, "epoch": 2129} {"train_loss": -23.66737937927246, "global_step": 176744, "epoch": 2129} {"train_loss": -23.43500328063965, "global_step": 176745, "epoch": 2129} {"train_loss": -24.19918441772461, "global_step": 176746, "epoch": 2129} {"train_loss": -23.855905532836914, "global_step": 176747, "epoch": 2129} {"train_loss": -23.605863571166992, "global_step": 176748, "epoch": 2129} {"train_loss": -23.710582733154297, "global_step": 176749, "epoch": 2129} {"train_loss": -23.559934616088867, "global_step": 176750, "epoch": 2129} {"train_loss": -23.549455642700195, "global_step": 176751, "epoch": 2129} {"train_loss": -23.829849243164062, "global_step": 176752, "epoch": 2129} {"train_loss": -23.60899543762207, "global_step": 176753, "epoch": 2129} {"train_loss": -23.59056282043457, "global_step": 176754, "epoch": 2129} {"train_loss": -23.89403533935547, "global_step": 176755, "epoch": 2129} {"train_loss": -23.750152587890625, "global_step": 176756, "epoch": 2129} {"train_loss": -23.97768211364746, "global_step": 176757, "epoch": 2129} {"train_loss": -23.922067642211914, "global_step": 176758, "epoch": 2129} {"train_loss": -23.731313705444336, "global_step": 176759, "epoch": 2129} {"train_loss": -23.60727310180664, "global_step": 176760, "epoch": 2129} {"train_loss": -23.50960922241211, "global_step": 176761, "epoch": 2129} {"train_loss": -23.82810401916504, "global_step": 176762, "epoch": 2129} {"train_loss": -24.209165573120117, "global_step": 176763, "epoch": 2129} {"train_loss": -23.469961166381836, "global_step": 176764, "epoch": 2129} {"train_loss": -23.627187728881836, "global_step": 176765, "epoch": 2129} {"train_loss": -23.62944984436035, "global_step": 176766, "epoch": 2129} {"train_loss": -23.669710159301758, "global_step": 176767, "epoch": 2129} {"train_loss": -23.767333984375, "global_step": 176768, "epoch": 2129} {"train_loss": -24.167343139648438, "global_step": 176769, "epoch": 2129} {"train_loss": -23.632219314575195, "global_step": 176770, "epoch": 2129} {"train_loss": -23.96608543395996, "global_step": 176771, "epoch": 2129} {"train_loss": -24.206073760986328, "global_step": 176772, "epoch": 2129} {"train_loss": -24.214561462402344, "global_step": 176773, "epoch": 2129} {"train_loss": -24.180234909057617, "global_step": 176774, "epoch": 2129} {"train_loss": -23.944814682006836, "global_step": 176775, "epoch": 2129} {"train_loss": -24.217302322387695, "global_step": 176776, "epoch": 2129} {"train_loss": -23.542011260986328, "global_step": 176777, "epoch": 2129} {"train_loss": -24.2007999420166, "global_step": 176778, "epoch": 2129} {"train_loss": -23.75482940673828, "global_step": 176779, "epoch": 2129} {"train_loss": -23.86517906188965, "global_step": 176780, "epoch": 2129} {"train_loss": -23.475934982299805, "global_step": 176781, "epoch": 2129} {"train_loss": -22.7838077545166, "global_step": 176782, "epoch": 2129} {"train_loss": -23.409311294555664, "global_step": 176783, "epoch": 2129} {"train_loss": -24.02185821533203, "global_step": 176784, "epoch": 2129} {"train_loss": -23.95222282409668, "global_step": 176785, "epoch": 2129} {"train_loss": -23.539127349853516, "global_step": 176786, "epoch": 2129} {"train_loss": -23.56449317932129, "global_step": 176787, "epoch": 2129} {"train_loss": -23.80901527404785, "global_step": 176788, "epoch": 2129} {"train_loss": -23.693204443138765, "global_step": 176789, "epoch": 2129, "val_loss": 6436226.0} {"train_loss": -23.013654708862305, "global_step": 176790, "epoch": 2130} {"train_loss": -23.12366485595703, "global_step": 176791, "epoch": 2130} {"train_loss": -22.918533325195312, "global_step": 176792, "epoch": 2130} {"train_loss": -23.52977752685547, "global_step": 176793, "epoch": 2130} {"train_loss": -23.170141220092773, "global_step": 176794, "epoch": 2130} {"train_loss": -23.59553337097168, "global_step": 176795, "epoch": 2130} {"train_loss": -23.329910278320312, "global_step": 176796, "epoch": 2130} {"train_loss": -23.364137649536133, "global_step": 176797, "epoch": 2130} {"train_loss": -23.541818618774414, "global_step": 176798, "epoch": 2130} {"train_loss": -23.012134552001953, "global_step": 176799, "epoch": 2130} {"train_loss": -23.544559478759766, "global_step": 176800, "epoch": 2130} {"train_loss": -23.523305892944336, "global_step": 176801, "epoch": 2130} {"train_loss": -23.717084884643555, "global_step": 176802, "epoch": 2130} {"train_loss": -23.50335693359375, "global_step": 176803, "epoch": 2130} {"train_loss": -23.748106002807617, "global_step": 176804, "epoch": 2130} {"train_loss": -23.498300552368164, "global_step": 176805, "epoch": 2130} {"train_loss": -23.754079818725586, "global_step": 176806, "epoch": 2130} {"train_loss": -23.758752822875977, "global_step": 176807, "epoch": 2130} {"train_loss": -23.86431121826172, "global_step": 176808, "epoch": 2130} {"train_loss": -23.62335205078125, "global_step": 176809, "epoch": 2130} {"train_loss": -23.676055908203125, "global_step": 176810, "epoch": 2130} {"train_loss": -23.86810302734375, "global_step": 176811, "epoch": 2130} {"train_loss": -23.660053253173828, "global_step": 176812, "epoch": 2130} {"train_loss": -23.603429794311523, "global_step": 176813, "epoch": 2130} {"train_loss": -23.9190673828125, "global_step": 176814, "epoch": 2130} {"train_loss": -23.785181045532227, "global_step": 176815, "epoch": 2130} {"train_loss": -23.64864730834961, "global_step": 176816, "epoch": 2130} {"train_loss": -24.10831642150879, "global_step": 176817, "epoch": 2130} {"train_loss": -23.6492862701416, "global_step": 176818, "epoch": 2130} {"train_loss": -24.1705379486084, "global_step": 176819, "epoch": 2130} {"train_loss": -23.64041519165039, "global_step": 176820, "epoch": 2130} {"train_loss": -23.89049530029297, "global_step": 176821, "epoch": 2130} {"train_loss": -23.862346649169922, "global_step": 176822, "epoch": 2130} {"train_loss": -23.56597137451172, "global_step": 176823, "epoch": 2130} {"train_loss": -23.729490280151367, "global_step": 176824, "epoch": 2130} {"train_loss": -23.948759078979492, "global_step": 176825, "epoch": 2130} {"train_loss": -23.74213981628418, "global_step": 176826, "epoch": 2130} {"train_loss": -23.569080352783203, "global_step": 176827, "epoch": 2130} {"train_loss": -23.7567195892334, "global_step": 176828, "epoch": 2130} {"train_loss": -23.9123592376709, "global_step": 176829, "epoch": 2130} {"train_loss": -23.812177658081055, "global_step": 176830, "epoch": 2130} {"train_loss": -23.801969528198242, "global_step": 176831, "epoch": 2130} {"train_loss": -23.45001792907715, "global_step": 176832, "epoch": 2130} {"train_loss": -24.02850341796875, "global_step": 176833, "epoch": 2130} {"train_loss": -23.538070678710938, "global_step": 176834, "epoch": 2130} {"train_loss": -23.71614646911621, "global_step": 176835, "epoch": 2130} {"train_loss": -23.345006942749023, "global_step": 176836, "epoch": 2130} {"train_loss": -23.568418502807617, "global_step": 176837, "epoch": 2130} {"train_loss": -23.846372604370117, "global_step": 176838, "epoch": 2130} {"train_loss": -24.053098678588867, "global_step": 176839, "epoch": 2130} {"train_loss": -24.089468002319336, "global_step": 176840, "epoch": 2130} {"train_loss": -23.624073028564453, "global_step": 176841, "epoch": 2130} {"train_loss": -23.780805587768555, "global_step": 176842, "epoch": 2130} {"train_loss": -24.127450942993164, "global_step": 176843, "epoch": 2130} {"train_loss": -23.66905403137207, "global_step": 176844, "epoch": 2130} {"train_loss": -24.065608978271484, "global_step": 176845, "epoch": 2130} {"train_loss": -23.9072265625, "global_step": 176846, "epoch": 2130} {"train_loss": -23.502920150756836, "global_step": 176847, "epoch": 2130} {"train_loss": -23.800336837768555, "global_step": 176848, "epoch": 2130} {"train_loss": -23.670713424682617, "global_step": 176849, "epoch": 2130} {"train_loss": -23.978368759155273, "global_step": 176850, "epoch": 2130} {"train_loss": -23.628345489501953, "global_step": 176851, "epoch": 2130} {"train_loss": -23.822086334228516, "global_step": 176852, "epoch": 2130} {"train_loss": -23.780868530273438, "global_step": 176853, "epoch": 2130} {"train_loss": -23.73494529724121, "global_step": 176854, "epoch": 2130} {"train_loss": -24.147729873657227, "global_step": 176855, "epoch": 2130} {"train_loss": -23.892019271850586, "global_step": 176856, "epoch": 2130} {"train_loss": -23.693143844604492, "global_step": 176857, "epoch": 2130} {"train_loss": -23.920499801635742, "global_step": 176858, "epoch": 2130} {"train_loss": -23.751235961914062, "global_step": 176859, "epoch": 2130} {"train_loss": -23.555313110351562, "global_step": 176860, "epoch": 2130} {"train_loss": -23.728147506713867, "global_step": 176861, "epoch": 2130} {"train_loss": -24.0877628326416, "global_step": 176862, "epoch": 2130} {"train_loss": -23.531538009643555, "global_step": 176863, "epoch": 2130} {"train_loss": -23.848684310913086, "global_step": 176864, "epoch": 2130} {"train_loss": -23.641889572143555, "global_step": 176865, "epoch": 2130} {"train_loss": -23.757307052612305, "global_step": 176866, "epoch": 2130} {"train_loss": -23.726797103881836, "global_step": 176867, "epoch": 2130} {"train_loss": -23.96668815612793, "global_step": 176868, "epoch": 2130} {"train_loss": -23.827884674072266, "global_step": 176869, "epoch": 2130} {"train_loss": -24.027820587158203, "global_step": 176870, "epoch": 2130} {"train_loss": -24.285192489624023, "global_step": 176871, "epoch": 2130} {"train_loss": -23.73183765181576, "global_step": 176872, "epoch": 2130, "val_loss": 6474958.5} {"train_loss": -23.6092472076416, "global_step": 176873, "epoch": 2131} {"train_loss": -23.72203826904297, "global_step": 176874, "epoch": 2131} {"train_loss": -23.327489852905273, "global_step": 176875, "epoch": 2131} {"train_loss": -23.5140380859375, "global_step": 176876, "epoch": 2131} {"train_loss": -23.776105880737305, "global_step": 176877, "epoch": 2131} {"train_loss": -23.60089111328125, "global_step": 176878, "epoch": 2131} {"train_loss": -23.559186935424805, "global_step": 176879, "epoch": 2131} {"train_loss": -24.026243209838867, "global_step": 176880, "epoch": 2131} {"train_loss": -23.706655502319336, "global_step": 176881, "epoch": 2131} {"train_loss": -23.84259605407715, "global_step": 176882, "epoch": 2131} {"train_loss": -23.47380828857422, "global_step": 176883, "epoch": 2131} {"train_loss": -23.57608413696289, "global_step": 176884, "epoch": 2131} {"train_loss": -23.538223266601562, "global_step": 176885, "epoch": 2131} {"train_loss": -23.896387100219727, "global_step": 176886, "epoch": 2131} {"train_loss": -23.813779830932617, "global_step": 176887, "epoch": 2131} {"train_loss": -23.984838485717773, "global_step": 176888, "epoch": 2131} {"train_loss": -23.60199546813965, "global_step": 176889, "epoch": 2131} {"train_loss": -23.345632553100586, "global_step": 176890, "epoch": 2131} {"train_loss": -23.858062744140625, "global_step": 176891, "epoch": 2131} {"train_loss": -23.486083984375, "global_step": 176892, "epoch": 2131} {"train_loss": -23.92038917541504, "global_step": 176893, "epoch": 2131} {"train_loss": -23.662538528442383, "global_step": 176894, "epoch": 2131} {"train_loss": -23.873550415039062, "global_step": 176895, "epoch": 2131} {"train_loss": -23.67745018005371, "global_step": 176896, "epoch": 2131} {"train_loss": -24.16084098815918, "global_step": 176897, "epoch": 2131} {"train_loss": -24.117340087890625, "global_step": 176898, "epoch": 2131} {"train_loss": -24.078935623168945, "global_step": 176899, "epoch": 2131} {"train_loss": -23.6489200592041, "global_step": 176900, "epoch": 2131} {"train_loss": -23.756763458251953, "global_step": 176901, "epoch": 2131} {"train_loss": -23.65280532836914, "global_step": 176902, "epoch": 2131} {"train_loss": -24.151166915893555, "global_step": 176903, "epoch": 2131} {"train_loss": -23.929738998413086, "global_step": 176904, "epoch": 2131} {"train_loss": -23.78382682800293, "global_step": 176905, "epoch": 2131} {"train_loss": -24.17354393005371, "global_step": 176906, "epoch": 2131} {"train_loss": -24.04257583618164, "global_step": 176907, "epoch": 2131} {"train_loss": -23.511503219604492, "global_step": 176908, "epoch": 2131} {"train_loss": -24.13191795349121, "global_step": 176909, "epoch": 2131} {"train_loss": -23.398319244384766, "global_step": 176910, "epoch": 2131} {"train_loss": -24.064455032348633, "global_step": 176911, "epoch": 2131} {"train_loss": -24.183149337768555, "global_step": 176912, "epoch": 2131} {"train_loss": -24.132261276245117, "global_step": 176913, "epoch": 2131} {"train_loss": -23.856643676757812, "global_step": 176914, "epoch": 2131} {"train_loss": -24.054229736328125, "global_step": 176915, "epoch": 2131} {"train_loss": -23.778594970703125, "global_step": 176916, "epoch": 2131} {"train_loss": -24.070823669433594, "global_step": 176917, "epoch": 2131} {"train_loss": -24.002429962158203, "global_step": 176918, "epoch": 2131} {"train_loss": -23.909984588623047, "global_step": 176919, "epoch": 2131} {"train_loss": -24.208646774291992, "global_step": 176920, "epoch": 2131} {"train_loss": -24.195173263549805, "global_step": 176921, "epoch": 2131} {"train_loss": -23.741119384765625, "global_step": 176922, "epoch": 2131} {"train_loss": -24.16107749938965, "global_step": 176923, "epoch": 2131} {"train_loss": -23.729583740234375, "global_step": 176924, "epoch": 2131} {"train_loss": -23.799907684326172, "global_step": 176925, "epoch": 2131} {"train_loss": -23.95427703857422, "global_step": 176926, "epoch": 2131} {"train_loss": -24.0544376373291, "global_step": 176927, "epoch": 2131} {"train_loss": -23.82034683227539, "global_step": 176928, "epoch": 2131} {"train_loss": -24.03497314453125, "global_step": 176929, "epoch": 2131} {"train_loss": -24.40341567993164, "global_step": 176930, "epoch": 2131} {"train_loss": -23.805601119995117, "global_step": 176931, "epoch": 2131} {"train_loss": -24.020437240600586, "global_step": 176932, "epoch": 2131} {"train_loss": -23.885679244995117, "global_step": 176933, "epoch": 2131} {"train_loss": -23.50192642211914, "global_step": 176934, "epoch": 2131} {"train_loss": -23.923627853393555, "global_step": 176935, "epoch": 2131} {"train_loss": -24.279464721679688, "global_step": 176936, "epoch": 2131} {"train_loss": -23.929880142211914, "global_step": 176937, "epoch": 2131} {"train_loss": -23.959436416625977, "global_step": 176938, "epoch": 2131} {"train_loss": -23.71923828125, "global_step": 176939, "epoch": 2131} {"train_loss": -23.575016021728516, "global_step": 176940, "epoch": 2131} {"train_loss": -23.886396408081055, "global_step": 176941, "epoch": 2131} {"train_loss": -24.062713623046875, "global_step": 176942, "epoch": 2131} {"train_loss": -24.017871856689453, "global_step": 176943, "epoch": 2131} {"train_loss": -24.0398006439209, "global_step": 176944, "epoch": 2131} {"train_loss": -23.895986557006836, "global_step": 176945, "epoch": 2131} {"train_loss": -23.663007736206055, "global_step": 176946, "epoch": 2131} {"train_loss": -23.96329116821289, "global_step": 176947, "epoch": 2131} {"train_loss": -23.634618759155273, "global_step": 176948, "epoch": 2131} {"train_loss": -23.962491989135742, "global_step": 176949, "epoch": 2131} {"train_loss": -23.759525299072266, "global_step": 176950, "epoch": 2131} {"train_loss": -23.84119987487793, "global_step": 176951, "epoch": 2131} {"train_loss": -23.560413360595703, "global_step": 176952, "epoch": 2131} {"train_loss": -24.128705978393555, "global_step": 176953, "epoch": 2131} {"train_loss": -23.976593017578125, "global_step": 176954, "epoch": 2131} {"train_loss": -23.85954590303352, "global_step": 176955, "epoch": 2131, "val_loss": 6384736.5} {"train_loss": -23.38079833984375, "global_step": 176956, "epoch": 2132} {"train_loss": -22.908559799194336, "global_step": 176957, "epoch": 2132} {"train_loss": -23.41206932067871, "global_step": 176958, "epoch": 2132} {"train_loss": -23.4588623046875, "global_step": 176959, "epoch": 2132} {"train_loss": -23.42205810546875, "global_step": 176960, "epoch": 2132} {"train_loss": -23.805112838745117, "global_step": 176961, "epoch": 2132} {"train_loss": -23.621213912963867, "global_step": 176962, "epoch": 2132} {"train_loss": -23.7428035736084, "global_step": 176963, "epoch": 2132} {"train_loss": -23.50617790222168, "global_step": 176964, "epoch": 2132} {"train_loss": -23.87546157836914, "global_step": 176965, "epoch": 2132} {"train_loss": -23.54412269592285, "global_step": 176966, "epoch": 2132} {"train_loss": -23.2281551361084, "global_step": 176967, "epoch": 2132} {"train_loss": -23.55389976501465, "global_step": 176968, "epoch": 2132} {"train_loss": -23.56043815612793, "global_step": 176969, "epoch": 2132} {"train_loss": -24.097986221313477, "global_step": 176970, "epoch": 2132} {"train_loss": -23.730636596679688, "global_step": 176971, "epoch": 2132} {"train_loss": -23.228647232055664, "global_step": 176972, "epoch": 2132} {"train_loss": -23.793216705322266, "global_step": 176973, "epoch": 2132} {"train_loss": -23.688018798828125, "global_step": 176974, "epoch": 2132} {"train_loss": -23.530736923217773, "global_step": 176975, "epoch": 2132} {"train_loss": -23.606191635131836, "global_step": 176976, "epoch": 2132} {"train_loss": -23.186298370361328, "global_step": 176977, "epoch": 2132} {"train_loss": -23.443883895874023, "global_step": 176978, "epoch": 2132} {"train_loss": -23.973669052124023, "global_step": 176979, "epoch": 2132} {"train_loss": -23.26319694519043, "global_step": 176980, "epoch": 2132} {"train_loss": -23.796920776367188, "global_step": 176981, "epoch": 2132} {"train_loss": -23.604536056518555, "global_step": 176982, "epoch": 2132} {"train_loss": -24.239887237548828, "global_step": 176983, "epoch": 2132} {"train_loss": -23.719146728515625, "global_step": 176984, "epoch": 2132} {"train_loss": -23.657367706298828, "global_step": 176985, "epoch": 2132} {"train_loss": -23.743072509765625, "global_step": 176986, "epoch": 2132} {"train_loss": -23.598621368408203, "global_step": 176987, "epoch": 2132} {"train_loss": -23.982786178588867, "global_step": 176988, "epoch": 2132} {"train_loss": -23.87465476989746, "global_step": 176989, "epoch": 2132} {"train_loss": -23.63228416442871, "global_step": 176990, "epoch": 2132} {"train_loss": -23.588287353515625, "global_step": 176991, "epoch": 2132} {"train_loss": -23.67525291442871, "global_step": 176992, "epoch": 2132} {"train_loss": -24.052173614501953, "global_step": 176993, "epoch": 2132} {"train_loss": -24.217206954956055, "global_step": 176994, "epoch": 2132} {"train_loss": -24.37685203552246, "global_step": 176995, "epoch": 2132} {"train_loss": -23.7169132232666, "global_step": 176996, "epoch": 2132} {"train_loss": -23.95330238342285, "global_step": 176997, "epoch": 2132} {"train_loss": -23.696884155273438, "global_step": 176998, "epoch": 2132} {"train_loss": -23.61716079711914, "global_step": 176999, "epoch": 2132} {"train_loss": -23.78055191040039, "global_step": 177000, "epoch": 2132} {"train_loss": -24.137826919555664, "global_step": 177001, "epoch": 2132} {"train_loss": -23.729270935058594, "global_step": 177002, "epoch": 2132} {"train_loss": -24.076539993286133, "global_step": 177003, "epoch": 2132} {"train_loss": -23.957143783569336, "global_step": 177004, "epoch": 2132} {"train_loss": -24.00240135192871, "global_step": 177005, "epoch": 2132} {"train_loss": -23.494810104370117, "global_step": 177006, "epoch": 2132} {"train_loss": -23.964031219482422, "global_step": 177007, "epoch": 2132} {"train_loss": -24.16350746154785, "global_step": 177008, "epoch": 2132} {"train_loss": -24.106115341186523, "global_step": 177009, "epoch": 2132} {"train_loss": -23.529773712158203, "global_step": 177010, "epoch": 2132} {"train_loss": -23.401166915893555, "global_step": 177011, "epoch": 2132} {"train_loss": -23.840639114379883, "global_step": 177012, "epoch": 2132} {"train_loss": -23.711627960205078, "global_step": 177013, "epoch": 2132} {"train_loss": -23.588632583618164, "global_step": 177014, "epoch": 2132} {"train_loss": -23.9234561920166, "global_step": 177015, "epoch": 2132} {"train_loss": -23.8477783203125, "global_step": 177016, "epoch": 2132} {"train_loss": -23.879037857055664, "global_step": 177017, "epoch": 2132} {"train_loss": -23.913236618041992, "global_step": 177018, "epoch": 2132} {"train_loss": -24.10837745666504, "global_step": 177019, "epoch": 2132} {"train_loss": -23.780597686767578, "global_step": 177020, "epoch": 2132} {"train_loss": -23.85002326965332, "global_step": 177021, "epoch": 2132} {"train_loss": -23.40964698791504, "global_step": 177022, "epoch": 2132} {"train_loss": -23.941253662109375, "global_step": 177023, "epoch": 2132} {"train_loss": -23.83868980407715, "global_step": 177024, "epoch": 2132} {"train_loss": -23.603164672851562, "global_step": 177025, "epoch": 2132} {"train_loss": -23.889814376831055, "global_step": 177026, "epoch": 2132} {"train_loss": -23.460721969604492, "global_step": 177027, "epoch": 2132} {"train_loss": -23.71111488342285, "global_step": 177028, "epoch": 2132} {"train_loss": -23.814701080322266, "global_step": 177029, "epoch": 2132} {"train_loss": -23.765209197998047, "global_step": 177030, "epoch": 2132} {"train_loss": -23.682401657104492, "global_step": 177031, "epoch": 2132} {"train_loss": -24.13729476928711, "global_step": 177032, "epoch": 2132} {"train_loss": -24.0153751373291, "global_step": 177033, "epoch": 2132} {"train_loss": -24.06477928161621, "global_step": 177034, "epoch": 2132} {"train_loss": -24.01642417907715, "global_step": 177035, "epoch": 2132} {"train_loss": -23.82369613647461, "global_step": 177036, "epoch": 2132} {"train_loss": -23.90424919128418, "global_step": 177037, "epoch": 2132} {"train_loss": -23.75863652056958, "global_step": 177038, "epoch": 2132, "val_loss": 6559540.0} {"train_loss": -22.882902145385742, "global_step": 177039, "epoch": 2133} {"train_loss": -22.994773864746094, "global_step": 177040, "epoch": 2133} {"train_loss": -22.8006534576416, "global_step": 177041, "epoch": 2133} {"train_loss": -23.163650512695312, "global_step": 177042, "epoch": 2133} {"train_loss": -23.256393432617188, "global_step": 177043, "epoch": 2133} {"train_loss": -23.25839614868164, "global_step": 177044, "epoch": 2133} {"train_loss": -23.067676544189453, "global_step": 177045, "epoch": 2133} {"train_loss": -23.681669235229492, "global_step": 177046, "epoch": 2133} {"train_loss": -23.476367950439453, "global_step": 177047, "epoch": 2133} {"train_loss": -23.536237716674805, "global_step": 177048, "epoch": 2133} {"train_loss": -23.79844093322754, "global_step": 177049, "epoch": 2133} {"train_loss": -23.37746238708496, "global_step": 177050, "epoch": 2133} {"train_loss": -23.091428756713867, "global_step": 177051, "epoch": 2133} {"train_loss": -23.294403076171875, "global_step": 177052, "epoch": 2133} {"train_loss": -23.54954719543457, "global_step": 177053, "epoch": 2133} {"train_loss": -23.487152099609375, "global_step": 177054, "epoch": 2133} {"train_loss": -23.757022857666016, "global_step": 177055, "epoch": 2133} {"train_loss": -23.504274368286133, "global_step": 177056, "epoch": 2133} {"train_loss": -23.942676544189453, "global_step": 177057, "epoch": 2133} {"train_loss": -23.42448616027832, "global_step": 177058, "epoch": 2133} {"train_loss": -23.814611434936523, "global_step": 177059, "epoch": 2133} {"train_loss": -23.804471969604492, "global_step": 177060, "epoch": 2133} {"train_loss": -23.703460693359375, "global_step": 177061, "epoch": 2133} {"train_loss": -23.572763442993164, "global_step": 177062, "epoch": 2133} {"train_loss": -23.332490921020508, "global_step": 177063, "epoch": 2133} {"train_loss": -23.68910026550293, "global_step": 177064, "epoch": 2133} {"train_loss": -23.78749656677246, "global_step": 177065, "epoch": 2133} {"train_loss": -24.018186569213867, "global_step": 177066, "epoch": 2133} {"train_loss": -23.920063018798828, "global_step": 177067, "epoch": 2133} {"train_loss": -23.633865356445312, "global_step": 177068, "epoch": 2133} {"train_loss": -23.770835876464844, "global_step": 177069, "epoch": 2133} {"train_loss": -23.636096954345703, "global_step": 177070, "epoch": 2133} {"train_loss": -23.735349655151367, "global_step": 177071, "epoch": 2133} {"train_loss": -24.030323028564453, "global_step": 177072, "epoch": 2133} {"train_loss": -23.723388671875, "global_step": 177073, "epoch": 2133} {"train_loss": -23.79267692565918, "global_step": 177074, "epoch": 2133} {"train_loss": -23.844329833984375, "global_step": 177075, "epoch": 2133} {"train_loss": -23.869766235351562, "global_step": 177076, "epoch": 2133} {"train_loss": -23.662649154663086, "global_step": 177077, "epoch": 2133} {"train_loss": -24.140647888183594, "global_step": 177078, "epoch": 2133} {"train_loss": -23.893630981445312, "global_step": 177079, "epoch": 2133} {"train_loss": -24.001108169555664, "global_step": 177080, "epoch": 2133} {"train_loss": -23.9892520904541, "global_step": 177081, "epoch": 2133} {"train_loss": -23.850065231323242, "global_step": 177082, "epoch": 2133} {"train_loss": -23.50057601928711, "global_step": 177083, "epoch": 2133} {"train_loss": -24.151905059814453, "global_step": 177084, "epoch": 2133} {"train_loss": -24.256162643432617, "global_step": 177085, "epoch": 2133} {"train_loss": -23.799785614013672, "global_step": 177086, "epoch": 2133} {"train_loss": -23.52317237854004, "global_step": 177087, "epoch": 2133} {"train_loss": -23.702831268310547, "global_step": 177088, "epoch": 2133} {"train_loss": -23.79133415222168, "global_step": 177089, "epoch": 2133} {"train_loss": -23.638118743896484, "global_step": 177090, "epoch": 2133} {"train_loss": -23.615558624267578, "global_step": 177091, "epoch": 2133} {"train_loss": -23.84075355529785, "global_step": 177092, "epoch": 2133} {"train_loss": -24.18580436706543, "global_step": 177093, "epoch": 2133} {"train_loss": -23.912443161010742, "global_step": 177094, "epoch": 2133} {"train_loss": -23.931867599487305, "global_step": 177095, "epoch": 2133} {"train_loss": -23.79334259033203, "global_step": 177096, "epoch": 2133} {"train_loss": -23.793569564819336, "global_step": 177097, "epoch": 2133} {"train_loss": -23.894472122192383, "global_step": 177098, "epoch": 2133} {"train_loss": -23.721174240112305, "global_step": 177099, "epoch": 2133} {"train_loss": -23.9371280670166, "global_step": 177100, "epoch": 2133} {"train_loss": -23.754547119140625, "global_step": 177101, "epoch": 2133} {"train_loss": -23.763408660888672, "global_step": 177102, "epoch": 2133} {"train_loss": -23.648590087890625, "global_step": 177103, "epoch": 2133} {"train_loss": -23.8842716217041, "global_step": 177104, "epoch": 2133} {"train_loss": -23.937288284301758, "global_step": 177105, "epoch": 2133} {"train_loss": -23.57004165649414, "global_step": 177106, "epoch": 2133} {"train_loss": -23.85623550415039, "global_step": 177107, "epoch": 2133} {"train_loss": -23.947731018066406, "global_step": 177108, "epoch": 2133} {"train_loss": -23.753568649291992, "global_step": 177109, "epoch": 2133} {"train_loss": -23.93584632873535, "global_step": 177110, "epoch": 2133} {"train_loss": -23.687253952026367, "global_step": 177111, "epoch": 2133} {"train_loss": -23.669830322265625, "global_step": 177112, "epoch": 2133} {"train_loss": -23.879404067993164, "global_step": 177113, "epoch": 2133} {"train_loss": -24.18704605102539, "global_step": 177114, "epoch": 2133} {"train_loss": -24.06586265563965, "global_step": 177115, "epoch": 2133} {"train_loss": -23.926740646362305, "global_step": 177116, "epoch": 2133} {"train_loss": -24.128040313720703, "global_step": 177117, "epoch": 2133} {"train_loss": -24.085363388061523, "global_step": 177118, "epoch": 2133} {"train_loss": -23.786046981811523, "global_step": 177119, "epoch": 2133} {"train_loss": -23.684497833251953, "global_step": 177120, "epoch": 2133} {"train_loss": -23.708478513970434, "global_step": 177121, "epoch": 2133, "val_loss": 6507024.0} {"train_loss": -23.563507080078125, "global_step": 177122, "epoch": 2134} {"train_loss": -23.44923210144043, "global_step": 177123, "epoch": 2134} {"train_loss": -23.379865646362305, "global_step": 177124, "epoch": 2134} {"train_loss": -23.645296096801758, "global_step": 177125, "epoch": 2134} {"train_loss": -23.444387435913086, "global_step": 177126, "epoch": 2134} {"train_loss": -23.118223190307617, "global_step": 177127, "epoch": 2134} {"train_loss": -23.493606567382812, "global_step": 177128, "epoch": 2134} {"train_loss": -23.476686477661133, "global_step": 177129, "epoch": 2134} {"train_loss": -23.63089370727539, "global_step": 177130, "epoch": 2134} {"train_loss": -23.87775230407715, "global_step": 177131, "epoch": 2134} {"train_loss": -23.541208267211914, "global_step": 177132, "epoch": 2134} {"train_loss": -23.625829696655273, "global_step": 177133, "epoch": 2134} {"train_loss": -23.47061538696289, "global_step": 177134, "epoch": 2134} {"train_loss": -23.686254501342773, "global_step": 177135, "epoch": 2134} {"train_loss": -23.41119384765625, "global_step": 177136, "epoch": 2134} {"train_loss": -23.909626007080078, "global_step": 177137, "epoch": 2134} {"train_loss": -23.64735984802246, "global_step": 177138, "epoch": 2134} {"train_loss": -23.963186264038086, "global_step": 177139, "epoch": 2134} {"train_loss": -23.760272979736328, "global_step": 177140, "epoch": 2134} {"train_loss": -23.714279174804688, "global_step": 177141, "epoch": 2134} {"train_loss": -23.285921096801758, "global_step": 177142, "epoch": 2134} {"train_loss": -23.584259033203125, "global_step": 177143, "epoch": 2134} {"train_loss": -23.874156951904297, "global_step": 177144, "epoch": 2134} {"train_loss": -23.72139549255371, "global_step": 177145, "epoch": 2134} {"train_loss": -23.927173614501953, "global_step": 177146, "epoch": 2134} {"train_loss": -23.620298385620117, "global_step": 177147, "epoch": 2134} {"train_loss": -23.541105270385742, "global_step": 177148, "epoch": 2134} {"train_loss": -23.642183303833008, "global_step": 177149, "epoch": 2134} {"train_loss": -23.753711700439453, "global_step": 177150, "epoch": 2134} {"train_loss": -23.73334312438965, "global_step": 177151, "epoch": 2134} {"train_loss": -23.806161880493164, "global_step": 177152, "epoch": 2134} {"train_loss": -23.485265731811523, "global_step": 177153, "epoch": 2134} {"train_loss": -23.700971603393555, "global_step": 177154, "epoch": 2134} {"train_loss": -23.84160804748535, "global_step": 177155, "epoch": 2134} {"train_loss": -23.673227310180664, "global_step": 177156, "epoch": 2134} {"train_loss": -23.9727725982666, "global_step": 177157, "epoch": 2134} {"train_loss": -23.409835815429688, "global_step": 177158, "epoch": 2134} {"train_loss": -23.69089698791504, "global_step": 177159, "epoch": 2134} {"train_loss": -23.645660400390625, "global_step": 177160, "epoch": 2134} {"train_loss": -24.234619140625, "global_step": 177161, "epoch": 2134} {"train_loss": -23.70441246032715, "global_step": 177162, "epoch": 2134} {"train_loss": -23.55306053161621, "global_step": 177163, "epoch": 2134} {"train_loss": -23.74856185913086, "global_step": 177164, "epoch": 2134} {"train_loss": -23.960905075073242, "global_step": 177165, "epoch": 2134} {"train_loss": -23.836034774780273, "global_step": 177166, "epoch": 2134} {"train_loss": -24.27387809753418, "global_step": 177167, "epoch": 2134} {"train_loss": -23.781991958618164, "global_step": 177168, "epoch": 2134} {"train_loss": -23.723541259765625, "global_step": 177169, "epoch": 2134} {"train_loss": -23.535917282104492, "global_step": 177170, "epoch": 2134} {"train_loss": -24.28305435180664, "global_step": 177171, "epoch": 2134} {"train_loss": -23.79690933227539, "global_step": 177172, "epoch": 2134} {"train_loss": -23.615766525268555, "global_step": 177173, "epoch": 2134} {"train_loss": -23.69776153564453, "global_step": 177174, "epoch": 2134} {"train_loss": -24.127016067504883, "global_step": 177175, "epoch": 2134} {"train_loss": -24.074081420898438, "global_step": 177176, "epoch": 2134} {"train_loss": -24.039411544799805, "global_step": 177177, "epoch": 2134} {"train_loss": -23.8039493560791, "global_step": 177178, "epoch": 2134} {"train_loss": -23.917905807495117, "global_step": 177179, "epoch": 2134} {"train_loss": -24.095252990722656, "global_step": 177180, "epoch": 2134} {"train_loss": -23.71345329284668, "global_step": 177181, "epoch": 2134} {"train_loss": -24.1654052734375, "global_step": 177182, "epoch": 2134} {"train_loss": -23.905982971191406, "global_step": 177183, "epoch": 2134} {"train_loss": -23.805662155151367, "global_step": 177184, "epoch": 2134} {"train_loss": -23.823017120361328, "global_step": 177185, "epoch": 2134} {"train_loss": -24.018747329711914, "global_step": 177186, "epoch": 2134} {"train_loss": -23.986326217651367, "global_step": 177187, "epoch": 2134} {"train_loss": -23.77326202392578, "global_step": 177188, "epoch": 2134} {"train_loss": -24.28822135925293, "global_step": 177189, "epoch": 2134} {"train_loss": -23.759584426879883, "global_step": 177190, "epoch": 2134} {"train_loss": -24.112262725830078, "global_step": 177191, "epoch": 2134} {"train_loss": -23.52073097229004, "global_step": 177192, "epoch": 2134} {"train_loss": -23.78925132751465, "global_step": 177193, "epoch": 2134} {"train_loss": -24.022539138793945, "global_step": 177194, "epoch": 2134} {"train_loss": -23.925004959106445, "global_step": 177195, "epoch": 2134} {"train_loss": -23.94129753112793, "global_step": 177196, "epoch": 2134} {"train_loss": -24.038108825683594, "global_step": 177197, "epoch": 2134} {"train_loss": -23.632986068725586, "global_step": 177198, "epoch": 2134} {"train_loss": -24.091358184814453, "global_step": 177199, "epoch": 2134} {"train_loss": -24.186674118041992, "global_step": 177200, "epoch": 2134} {"train_loss": -24.10675621032715, "global_step": 177201, "epoch": 2134} {"train_loss": -23.972455978393555, "global_step": 177202, "epoch": 2134} {"train_loss": -24.02948570251465, "global_step": 177203, "epoch": 2134} {"train_loss": -23.77937629423946, "global_step": 177204, "epoch": 2134, "val_loss": 6485265.0} {"train_loss": -22.974084854125977, "global_step": 177205, "epoch": 2135} {"train_loss": -22.06831169128418, "global_step": 177206, "epoch": 2135} {"train_loss": -22.610300064086914, "global_step": 177207, "epoch": 2135} {"train_loss": -22.125892639160156, "global_step": 177208, "epoch": 2135} {"train_loss": -22.781753540039062, "global_step": 177209, "epoch": 2135} {"train_loss": -23.33920669555664, "global_step": 177210, "epoch": 2135} {"train_loss": -23.03436851501465, "global_step": 177211, "epoch": 2135} {"train_loss": -22.95085334777832, "global_step": 177212, "epoch": 2135} {"train_loss": -23.232376098632812, "global_step": 177213, "epoch": 2135} {"train_loss": -23.111127853393555, "global_step": 177214, "epoch": 2135} {"train_loss": -23.322574615478516, "global_step": 177215, "epoch": 2135} {"train_loss": -23.016143798828125, "global_step": 177216, "epoch": 2135} {"train_loss": -23.288602828979492, "global_step": 177217, "epoch": 2135} {"train_loss": -23.064828872680664, "global_step": 177218, "epoch": 2135} {"train_loss": -23.579771041870117, "global_step": 177219, "epoch": 2135} {"train_loss": -23.242252349853516, "global_step": 177220, "epoch": 2135} {"train_loss": -23.276931762695312, "global_step": 177221, "epoch": 2135} {"train_loss": -23.845426559448242, "global_step": 177222, "epoch": 2135} {"train_loss": -23.483610153198242, "global_step": 177223, "epoch": 2135} {"train_loss": -23.53622817993164, "global_step": 177224, "epoch": 2135} {"train_loss": -23.271400451660156, "global_step": 177225, "epoch": 2135} {"train_loss": -23.591611862182617, "global_step": 177226, "epoch": 2135} {"train_loss": -23.23358726501465, "global_step": 177227, "epoch": 2135} {"train_loss": -23.375080108642578, "global_step": 177228, "epoch": 2135} {"train_loss": -23.7550048828125, "global_step": 177229, "epoch": 2135} {"train_loss": -23.65177345275879, "global_step": 177230, "epoch": 2135} {"train_loss": -23.92109489440918, "global_step": 177231, "epoch": 2135} {"train_loss": -23.771127700805664, "global_step": 177232, "epoch": 2135} {"train_loss": -23.5107479095459, "global_step": 177233, "epoch": 2135} {"train_loss": -23.64253807067871, "global_step": 177234, "epoch": 2135} {"train_loss": -23.56376075744629, "global_step": 177235, "epoch": 2135} {"train_loss": -23.959882736206055, "global_step": 177236, "epoch": 2135} {"train_loss": -24.00960350036621, "global_step": 177237, "epoch": 2135} {"train_loss": -24.225454330444336, "global_step": 177238, "epoch": 2135} {"train_loss": -23.93276023864746, "global_step": 177239, "epoch": 2135} {"train_loss": -23.635154724121094, "global_step": 177240, "epoch": 2135} {"train_loss": -23.8880672454834, "global_step": 177241, "epoch": 2135} {"train_loss": -24.18912696838379, "global_step": 177242, "epoch": 2135} {"train_loss": -24.097509384155273, "global_step": 177243, "epoch": 2135} {"train_loss": -23.8166446685791, "global_step": 177244, "epoch": 2135} {"train_loss": -23.74448013305664, "global_step": 177245, "epoch": 2135} {"train_loss": -23.627548217773438, "global_step": 177246, "epoch": 2135} {"train_loss": -23.87047576904297, "global_step": 177247, "epoch": 2135} {"train_loss": -24.07547378540039, "global_step": 177248, "epoch": 2135} {"train_loss": -24.109792709350586, "global_step": 177249, "epoch": 2135} {"train_loss": -23.9053897857666, "global_step": 177250, "epoch": 2135} {"train_loss": -23.454526901245117, "global_step": 177251, "epoch": 2135} {"train_loss": -23.666635513305664, "global_step": 177252, "epoch": 2135} {"train_loss": -23.5106258392334, "global_step": 177253, "epoch": 2135} {"train_loss": -23.64549446105957, "global_step": 177254, "epoch": 2135} {"train_loss": -23.608596801757812, "global_step": 177255, "epoch": 2135} {"train_loss": -23.843488693237305, "global_step": 177256, "epoch": 2135} {"train_loss": -23.868247985839844, "global_step": 177257, "epoch": 2135} {"train_loss": -23.837818145751953, "global_step": 177258, "epoch": 2135} {"train_loss": -23.835886001586914, "global_step": 177259, "epoch": 2135} {"train_loss": -23.819849014282227, "global_step": 177260, "epoch": 2135} {"train_loss": -24.043323516845703, "global_step": 177261, "epoch": 2135} {"train_loss": -24.1450138092041, "global_step": 177262, "epoch": 2135} {"train_loss": -23.954517364501953, "global_step": 177263, "epoch": 2135} {"train_loss": -24.004016876220703, "global_step": 177264, "epoch": 2135} {"train_loss": -23.56321144104004, "global_step": 177265, "epoch": 2135} {"train_loss": -23.91029167175293, "global_step": 177266, "epoch": 2135} {"train_loss": -23.743192672729492, "global_step": 177267, "epoch": 2135} {"train_loss": -23.642248153686523, "global_step": 177268, "epoch": 2135} {"train_loss": -23.97312355041504, "global_step": 177269, "epoch": 2135} {"train_loss": -23.824878692626953, "global_step": 177270, "epoch": 2135} {"train_loss": -23.83509635925293, "global_step": 177271, "epoch": 2135} {"train_loss": -23.601543426513672, "global_step": 177272, "epoch": 2135} {"train_loss": -23.998172760009766, "global_step": 177273, "epoch": 2135} {"train_loss": -24.271947860717773, "global_step": 177274, "epoch": 2135} {"train_loss": -23.57599639892578, "global_step": 177275, "epoch": 2135} {"train_loss": -24.213565826416016, "global_step": 177276, "epoch": 2135} {"train_loss": -24.104736328125, "global_step": 177277, "epoch": 2135} {"train_loss": -24.244197845458984, "global_step": 177278, "epoch": 2135} {"train_loss": -24.086193084716797, "global_step": 177279, "epoch": 2135} {"train_loss": -23.513486862182617, "global_step": 177280, "epoch": 2135} {"train_loss": -23.615354537963867, "global_step": 177281, "epoch": 2135} {"train_loss": -23.911691665649414, "global_step": 177282, "epoch": 2135} {"train_loss": -23.877273559570312, "global_step": 177283, "epoch": 2135} {"train_loss": -24.08025550842285, "global_step": 177284, "epoch": 2135} {"train_loss": -23.29637336730957, "global_step": 177285, "epoch": 2135} {"train_loss": -24.02290153503418, "global_step": 177286, "epoch": 2135} {"train_loss": -23.63442788641137, "global_step": 177287, "epoch": 2135, "val_loss": 6373580.0} {"train_loss": -23.219240188598633, "global_step": 177288, "epoch": 2136} {"train_loss": -22.70768165588379, "global_step": 177289, "epoch": 2136} {"train_loss": -22.9364013671875, "global_step": 177290, "epoch": 2136} {"train_loss": -22.9121150970459, "global_step": 177291, "epoch": 2136} {"train_loss": -22.93401527404785, "global_step": 177292, "epoch": 2136} {"train_loss": -23.09747886657715, "global_step": 177293, "epoch": 2136} {"train_loss": -23.30776596069336, "global_step": 177294, "epoch": 2136} {"train_loss": -23.061994552612305, "global_step": 177295, "epoch": 2136} {"train_loss": -23.250696182250977, "global_step": 177296, "epoch": 2136} {"train_loss": -22.972484588623047, "global_step": 177297, "epoch": 2136} {"train_loss": -23.212881088256836, "global_step": 177298, "epoch": 2136} {"train_loss": -23.688796997070312, "global_step": 177299, "epoch": 2136} {"train_loss": -23.31220817565918, "global_step": 177300, "epoch": 2136} {"train_loss": -23.658411026000977, "global_step": 177301, "epoch": 2136} {"train_loss": -23.672338485717773, "global_step": 177302, "epoch": 2136} {"train_loss": -23.273984909057617, "global_step": 177303, "epoch": 2136} {"train_loss": -23.369308471679688, "global_step": 177304, "epoch": 2136} {"train_loss": -23.585752487182617, "global_step": 177305, "epoch": 2136} {"train_loss": -23.850088119506836, "global_step": 177306, "epoch": 2136} {"train_loss": -23.407352447509766, "global_step": 177307, "epoch": 2136} {"train_loss": -23.26401138305664, "global_step": 177308, "epoch": 2136} {"train_loss": -23.59270668029785, "global_step": 177309, "epoch": 2136} {"train_loss": -23.510040283203125, "global_step": 177310, "epoch": 2136} {"train_loss": -23.835758209228516, "global_step": 177311, "epoch": 2136} {"train_loss": -24.027183532714844, "global_step": 177312, "epoch": 2136} {"train_loss": -23.640363693237305, "global_step": 177313, "epoch": 2136} {"train_loss": -23.929513931274414, "global_step": 177314, "epoch": 2136} {"train_loss": -23.94388198852539, "global_step": 177315, "epoch": 2136} {"train_loss": -23.7504825592041, "global_step": 177316, "epoch": 2136} {"train_loss": -23.9154052734375, "global_step": 177317, "epoch": 2136} {"train_loss": -23.696094512939453, "global_step": 177318, "epoch": 2136} {"train_loss": -24.023513793945312, "global_step": 177319, "epoch": 2136} {"train_loss": -23.921863555908203, "global_step": 177320, "epoch": 2136} {"train_loss": -24.189043045043945, "global_step": 177321, "epoch": 2136} {"train_loss": -23.87973976135254, "global_step": 177322, "epoch": 2136} {"train_loss": -23.96247673034668, "global_step": 177323, "epoch": 2136} {"train_loss": -24.15911102294922, "global_step": 177324, "epoch": 2136} {"train_loss": -24.006973266601562, "global_step": 177325, "epoch": 2136} {"train_loss": -23.730323791503906, "global_step": 177326, "epoch": 2136} {"train_loss": -23.731801986694336, "global_step": 177327, "epoch": 2136} {"train_loss": -23.768051147460938, "global_step": 177328, "epoch": 2136} {"train_loss": -24.242767333984375, "global_step": 177329, "epoch": 2136} {"train_loss": -23.943063735961914, "global_step": 177330, "epoch": 2136} {"train_loss": -24.039329528808594, "global_step": 177331, "epoch": 2136} {"train_loss": -23.759357452392578, "global_step": 177332, "epoch": 2136} {"train_loss": -23.868406295776367, "global_step": 177333, "epoch": 2136} {"train_loss": -23.86813735961914, "global_step": 177334, "epoch": 2136} {"train_loss": -23.866506576538086, "global_step": 177335, "epoch": 2136} {"train_loss": -24.09403419494629, "global_step": 177336, "epoch": 2136} {"train_loss": -23.69854164123535, "global_step": 177337, "epoch": 2136} {"train_loss": -23.784936904907227, "global_step": 177338, "epoch": 2136} {"train_loss": -23.9576416015625, "global_step": 177339, "epoch": 2136} {"train_loss": -24.15060806274414, "global_step": 177340, "epoch": 2136} {"train_loss": -23.994138717651367, "global_step": 177341, "epoch": 2136} {"train_loss": -23.88715934753418, "global_step": 177342, "epoch": 2136} {"train_loss": -23.978073120117188, "global_step": 177343, "epoch": 2136} {"train_loss": -23.779569625854492, "global_step": 177344, "epoch": 2136} {"train_loss": -23.855209350585938, "global_step": 177345, "epoch": 2136} {"train_loss": -24.182817459106445, "global_step": 177346, "epoch": 2136} {"train_loss": -23.741010665893555, "global_step": 177347, "epoch": 2136} {"train_loss": -23.760272979736328, "global_step": 177348, "epoch": 2136} {"train_loss": -23.725555419921875, "global_step": 177349, "epoch": 2136} {"train_loss": -23.826576232910156, "global_step": 177350, "epoch": 2136} {"train_loss": -24.10930061340332, "global_step": 177351, "epoch": 2136} {"train_loss": -24.08016014099121, "global_step": 177352, "epoch": 2136} {"train_loss": -24.004507064819336, "global_step": 177353, "epoch": 2136} {"train_loss": -23.55401611328125, "global_step": 177354, "epoch": 2136} {"train_loss": -23.969738006591797, "global_step": 177355, "epoch": 2136} {"train_loss": -23.9976749420166, "global_step": 177356, "epoch": 2136} {"train_loss": -23.62666130065918, "global_step": 177357, "epoch": 2136} {"train_loss": -23.58563232421875, "global_step": 177358, "epoch": 2136} {"train_loss": -23.90042495727539, "global_step": 177359, "epoch": 2136} {"train_loss": -24.015344619750977, "global_step": 177360, "epoch": 2136} {"train_loss": -23.896936416625977, "global_step": 177361, "epoch": 2136} {"train_loss": -24.334331512451172, "global_step": 177362, "epoch": 2136} {"train_loss": -24.04439926147461, "global_step": 177363, "epoch": 2136} {"train_loss": -23.799148559570312, "global_step": 177364, "epoch": 2136} {"train_loss": -23.88627052307129, "global_step": 177365, "epoch": 2136} {"train_loss": -23.97141456604004, "global_step": 177366, "epoch": 2136} {"train_loss": -24.279125213623047, "global_step": 177367, "epoch": 2136} {"train_loss": -23.84380531311035, "global_step": 177368, "epoch": 2136} {"train_loss": -24.22444725036621, "global_step": 177369, "epoch": 2136} {"train_loss": -23.75774413419057, "global_step": 177370, "epoch": 2136, "val_loss": 6470967.0} {"train_loss": -23.60578727722168, "global_step": 177371, "epoch": 2137} {"train_loss": -22.749135971069336, "global_step": 177372, "epoch": 2137} {"train_loss": -23.378026962280273, "global_step": 177373, "epoch": 2137} {"train_loss": -24.033267974853516, "global_step": 177374, "epoch": 2137} {"train_loss": -23.2520751953125, "global_step": 177375, "epoch": 2137} {"train_loss": -23.671039581298828, "global_step": 177376, "epoch": 2137} {"train_loss": -23.57835578918457, "global_step": 177377, "epoch": 2137} {"train_loss": -23.34894371032715, "global_step": 177378, "epoch": 2137} {"train_loss": -23.681821823120117, "global_step": 177379, "epoch": 2137} {"train_loss": -23.607908248901367, "global_step": 177380, "epoch": 2137} {"train_loss": -23.5971736907959, "global_step": 177381, "epoch": 2137} {"train_loss": -23.6729679107666, "global_step": 177382, "epoch": 2137} {"train_loss": -23.800155639648438, "global_step": 177383, "epoch": 2137} {"train_loss": -23.885696411132812, "global_step": 177384, "epoch": 2137} {"train_loss": -23.6641902923584, "global_step": 177385, "epoch": 2137} {"train_loss": -23.94537353515625, "global_step": 177386, "epoch": 2137} {"train_loss": -23.597557067871094, "global_step": 177387, "epoch": 2137} {"train_loss": -23.553281784057617, "global_step": 177388, "epoch": 2137} {"train_loss": -23.498319625854492, "global_step": 177389, "epoch": 2137} {"train_loss": -24.03327751159668, "global_step": 177390, "epoch": 2137} {"train_loss": -23.713911056518555, "global_step": 177391, "epoch": 2137} {"train_loss": -23.9392032623291, "global_step": 177392, "epoch": 2137} {"train_loss": -23.624696731567383, "global_step": 177393, "epoch": 2137} {"train_loss": -23.73360252380371, "global_step": 177394, "epoch": 2137} {"train_loss": -23.698322296142578, "global_step": 177395, "epoch": 2137} {"train_loss": -24.199359893798828, "global_step": 177396, "epoch": 2137} {"train_loss": -24.019485473632812, "global_step": 177397, "epoch": 2137} {"train_loss": -23.932540893554688, "global_step": 177398, "epoch": 2137} {"train_loss": -23.74049186706543, "global_step": 177399, "epoch": 2137} {"train_loss": -23.894485473632812, "global_step": 177400, "epoch": 2137} {"train_loss": -24.10433006286621, "global_step": 177401, "epoch": 2137} {"train_loss": -23.92108154296875, "global_step": 177402, "epoch": 2137} {"train_loss": -24.21113395690918, "global_step": 177403, "epoch": 2137} {"train_loss": -23.561649322509766, "global_step": 177404, "epoch": 2137} {"train_loss": -24.356632232666016, "global_step": 177405, "epoch": 2137} {"train_loss": -23.957242965698242, "global_step": 177406, "epoch": 2137} {"train_loss": -23.648380279541016, "global_step": 177407, "epoch": 2137} {"train_loss": -24.057498931884766, "global_step": 177408, "epoch": 2137} {"train_loss": -23.890384674072266, "global_step": 177409, "epoch": 2137} {"train_loss": -23.76810646057129, "global_step": 177410, "epoch": 2137} {"train_loss": -23.721481323242188, "global_step": 177411, "epoch": 2137} {"train_loss": -23.624095916748047, "global_step": 177412, "epoch": 2137} {"train_loss": -24.10873031616211, "global_step": 177413, "epoch": 2137} {"train_loss": -23.702951431274414, "global_step": 177414, "epoch": 2137} {"train_loss": -23.834630966186523, "global_step": 177415, "epoch": 2137} {"train_loss": -23.798429489135742, "global_step": 177416, "epoch": 2137} {"train_loss": -23.95435905456543, "global_step": 177417, "epoch": 2137} {"train_loss": -24.104589462280273, "global_step": 177418, "epoch": 2137} {"train_loss": -23.91477394104004, "global_step": 177419, "epoch": 2137} {"train_loss": -23.862899780273438, "global_step": 177420, "epoch": 2137} {"train_loss": -23.982696533203125, "global_step": 177421, "epoch": 2137} {"train_loss": -23.62420082092285, "global_step": 177422, "epoch": 2137} {"train_loss": -23.925466537475586, "global_step": 177423, "epoch": 2137} {"train_loss": -23.677921295166016, "global_step": 177424, "epoch": 2137} {"train_loss": -23.92235565185547, "global_step": 177425, "epoch": 2137} {"train_loss": -24.280363082885742, "global_step": 177426, "epoch": 2137} {"train_loss": -23.538236618041992, "global_step": 177427, "epoch": 2137} {"train_loss": -23.590246200561523, "global_step": 177428, "epoch": 2137} {"train_loss": -24.071420669555664, "global_step": 177429, "epoch": 2137} {"train_loss": -23.7525577545166, "global_step": 177430, "epoch": 2137} {"train_loss": -24.240097045898438, "global_step": 177431, "epoch": 2137} {"train_loss": -24.491287231445312, "global_step": 177432, "epoch": 2137} {"train_loss": -24.178531646728516, "global_step": 177433, "epoch": 2137} {"train_loss": -23.756078720092773, "global_step": 177434, "epoch": 2137} {"train_loss": -24.03875160217285, "global_step": 177435, "epoch": 2137} {"train_loss": -23.832578659057617, "global_step": 177436, "epoch": 2137} {"train_loss": -23.87486457824707, "global_step": 177437, "epoch": 2137} {"train_loss": -24.223424911499023, "global_step": 177438, "epoch": 2137} {"train_loss": -23.922353744506836, "global_step": 177439, "epoch": 2137} {"train_loss": -23.947124481201172, "global_step": 177440, "epoch": 2137} {"train_loss": -24.137964248657227, "global_step": 177441, "epoch": 2137} {"train_loss": -23.551660537719727, "global_step": 177442, "epoch": 2137} {"train_loss": -24.04767608642578, "global_step": 177443, "epoch": 2137} {"train_loss": -23.548871994018555, "global_step": 177444, "epoch": 2137} {"train_loss": -23.669086456298828, "global_step": 177445, "epoch": 2137} {"train_loss": -23.403913497924805, "global_step": 177446, "epoch": 2137} {"train_loss": -23.53710174560547, "global_step": 177447, "epoch": 2137} {"train_loss": -23.9973087310791, "global_step": 177448, "epoch": 2137} {"train_loss": -23.67159080505371, "global_step": 177449, "epoch": 2137} {"train_loss": -23.49412727355957, "global_step": 177450, "epoch": 2137} {"train_loss": -23.70244789123535, "global_step": 177451, "epoch": 2137} {"train_loss": -24.049583435058594, "global_step": 177452, "epoch": 2137} {"train_loss": -23.810750731502672, "global_step": 177453, "epoch": 2137, "val_loss": 6454465.5} {"train_loss": -23.109500885009766, "global_step": 177454, "epoch": 2138} {"train_loss": -23.335676193237305, "global_step": 177455, "epoch": 2138} {"train_loss": -23.743566513061523, "global_step": 177456, "epoch": 2138} {"train_loss": -23.40916633605957, "global_step": 177457, "epoch": 2138} {"train_loss": -23.584571838378906, "global_step": 177458, "epoch": 2138} {"train_loss": -23.022314071655273, "global_step": 177459, "epoch": 2138} {"train_loss": -23.85544776916504, "global_step": 177460, "epoch": 2138} {"train_loss": -23.3869686126709, "global_step": 177461, "epoch": 2138} {"train_loss": -23.698108673095703, "global_step": 177462, "epoch": 2138} {"train_loss": -23.672842025756836, "global_step": 177463, "epoch": 2138} {"train_loss": -23.727724075317383, "global_step": 177464, "epoch": 2138} {"train_loss": -23.325702667236328, "global_step": 177465, "epoch": 2138} {"train_loss": -23.379016876220703, "global_step": 177466, "epoch": 2138} {"train_loss": -23.329303741455078, "global_step": 177467, "epoch": 2138} {"train_loss": -23.522747039794922, "global_step": 177468, "epoch": 2138} {"train_loss": -23.968454360961914, "global_step": 177469, "epoch": 2138} {"train_loss": -23.394712448120117, "global_step": 177470, "epoch": 2138} {"train_loss": -23.62690544128418, "global_step": 177471, "epoch": 2138} {"train_loss": -23.81476402282715, "global_step": 177472, "epoch": 2138} {"train_loss": -23.64752960205078, "global_step": 177473, "epoch": 2138} {"train_loss": -23.597766876220703, "global_step": 177474, "epoch": 2138} {"train_loss": -23.418418884277344, "global_step": 177475, "epoch": 2138} {"train_loss": -23.971567153930664, "global_step": 177476, "epoch": 2138} {"train_loss": -23.56891441345215, "global_step": 177477, "epoch": 2138} {"train_loss": -24.256162643432617, "global_step": 177478, "epoch": 2138} {"train_loss": -23.822580337524414, "global_step": 177479, "epoch": 2138} {"train_loss": -24.090681076049805, "global_step": 177480, "epoch": 2138} {"train_loss": -23.891357421875, "global_step": 177481, "epoch": 2138} {"train_loss": -23.917360305786133, "global_step": 177482, "epoch": 2138} {"train_loss": -23.584863662719727, "global_step": 177483, "epoch": 2138} {"train_loss": -24.001447677612305, "global_step": 177484, "epoch": 2138} {"train_loss": -23.74542808532715, "global_step": 177485, "epoch": 2138} {"train_loss": -23.869327545166016, "global_step": 177486, "epoch": 2138} {"train_loss": -23.70320701599121, "global_step": 177487, "epoch": 2138} {"train_loss": -24.054107666015625, "global_step": 177488, "epoch": 2138} {"train_loss": -23.96375846862793, "global_step": 177489, "epoch": 2138} {"train_loss": -24.019189834594727, "global_step": 177490, "epoch": 2138} {"train_loss": -24.084897994995117, "global_step": 177491, "epoch": 2138} {"train_loss": -23.319263458251953, "global_step": 177492, "epoch": 2138} {"train_loss": -23.911849975585938, "global_step": 177493, "epoch": 2138} {"train_loss": -23.6278076171875, "global_step": 177494, "epoch": 2138} {"train_loss": -23.89826011657715, "global_step": 177495, "epoch": 2138} {"train_loss": -23.86086082458496, "global_step": 177496, "epoch": 2138} {"train_loss": -24.063352584838867, "global_step": 177497, "epoch": 2138} {"train_loss": -23.895187377929688, "global_step": 177498, "epoch": 2138} {"train_loss": -23.404504776000977, "global_step": 177499, "epoch": 2138} {"train_loss": -23.819345474243164, "global_step": 177500, "epoch": 2138} {"train_loss": -24.047225952148438, "global_step": 177501, "epoch": 2138} {"train_loss": -23.998001098632812, "global_step": 177502, "epoch": 2138} {"train_loss": -23.78363037109375, "global_step": 177503, "epoch": 2138} {"train_loss": -23.909133911132812, "global_step": 177504, "epoch": 2138} {"train_loss": -23.959863662719727, "global_step": 177505, "epoch": 2138} {"train_loss": -23.9019718170166, "global_step": 177506, "epoch": 2138} {"train_loss": -23.95755958557129, "global_step": 177507, "epoch": 2138} {"train_loss": -23.385833740234375, "global_step": 177508, "epoch": 2138} {"train_loss": -23.90070915222168, "global_step": 177509, "epoch": 2138} {"train_loss": -23.7120304107666, "global_step": 177510, "epoch": 2138} {"train_loss": -23.575422286987305, "global_step": 177511, "epoch": 2138} {"train_loss": -23.69501495361328, "global_step": 177512, "epoch": 2138} {"train_loss": -23.940786361694336, "global_step": 177513, "epoch": 2138} {"train_loss": -23.936796188354492, "global_step": 177514, "epoch": 2138} {"train_loss": -23.89518928527832, "global_step": 177515, "epoch": 2138} {"train_loss": -23.976865768432617, "global_step": 177516, "epoch": 2138} {"train_loss": -24.12987518310547, "global_step": 177517, "epoch": 2138} {"train_loss": -23.883859634399414, "global_step": 177518, "epoch": 2138} {"train_loss": -24.44342803955078, "global_step": 177519, "epoch": 2138} {"train_loss": -23.819807052612305, "global_step": 177520, "epoch": 2138} {"train_loss": -23.678808212280273, "global_step": 177521, "epoch": 2138} {"train_loss": -23.911762237548828, "global_step": 177522, "epoch": 2138} {"train_loss": -24.183794021606445, "global_step": 177523, "epoch": 2138} {"train_loss": -23.93358039855957, "global_step": 177524, "epoch": 2138} {"train_loss": -23.96489143371582, "global_step": 177525, "epoch": 2138} {"train_loss": -24.229520797729492, "global_step": 177526, "epoch": 2138} {"train_loss": -23.691129684448242, "global_step": 177527, "epoch": 2138} {"train_loss": -23.98042106628418, "global_step": 177528, "epoch": 2138} {"train_loss": -24.105438232421875, "global_step": 177529, "epoch": 2138} {"train_loss": -24.055871963500977, "global_step": 177530, "epoch": 2138} {"train_loss": -23.617321014404297, "global_step": 177531, "epoch": 2138} {"train_loss": -23.890050888061523, "global_step": 177532, "epoch": 2138} {"train_loss": -23.70479965209961, "global_step": 177533, "epoch": 2138} {"train_loss": -23.867406845092773, "global_step": 177534, "epoch": 2138} {"train_loss": -23.811796188354492, "global_step": 177535, "epoch": 2138} {"train_loss": -23.767626865800604, "global_step": 177536, "epoch": 2138, "val_loss": 6338487.5} {"train_loss": -21.780622482299805, "global_step": 177537, "epoch": 2139} {"train_loss": -22.358121871948242, "global_step": 177538, "epoch": 2139} {"train_loss": -23.16250991821289, "global_step": 177539, "epoch": 2139} {"train_loss": -22.841135025024414, "global_step": 177540, "epoch": 2139} {"train_loss": -23.10433006286621, "global_step": 177541, "epoch": 2139} {"train_loss": -23.40839195251465, "global_step": 177542, "epoch": 2139} {"train_loss": -23.131994247436523, "global_step": 177543, "epoch": 2139} {"train_loss": -23.570173263549805, "global_step": 177544, "epoch": 2139} {"train_loss": -23.087949752807617, "global_step": 177545, "epoch": 2139} {"train_loss": -23.490863800048828, "global_step": 177546, "epoch": 2139} {"train_loss": -23.578174591064453, "global_step": 177547, "epoch": 2139} {"train_loss": -23.33711814880371, "global_step": 177548, "epoch": 2139} {"train_loss": -23.5782413482666, "global_step": 177549, "epoch": 2139} {"train_loss": -22.925933837890625, "global_step": 177550, "epoch": 2139} {"train_loss": -23.524999618530273, "global_step": 177551, "epoch": 2139} {"train_loss": -23.8751163482666, "global_step": 177552, "epoch": 2139} {"train_loss": -23.669828414916992, "global_step": 177553, "epoch": 2139} {"train_loss": -23.98335075378418, "global_step": 177554, "epoch": 2139} {"train_loss": -23.797534942626953, "global_step": 177555, "epoch": 2139} {"train_loss": -23.496692657470703, "global_step": 177556, "epoch": 2139} {"train_loss": -23.6445255279541, "global_step": 177557, "epoch": 2139} {"train_loss": -23.677169799804688, "global_step": 177558, "epoch": 2139} {"train_loss": -23.826431274414062, "global_step": 177559, "epoch": 2139} {"train_loss": -23.524511337280273, "global_step": 177560, "epoch": 2139} {"train_loss": -23.66107749938965, "global_step": 177561, "epoch": 2139} {"train_loss": -24.2595272064209, "global_step": 177562, "epoch": 2139} {"train_loss": -24.09259605407715, "global_step": 177563, "epoch": 2139} {"train_loss": -24.09845542907715, "global_step": 177564, "epoch": 2139} {"train_loss": -23.702146530151367, "global_step": 177565, "epoch": 2139} {"train_loss": -23.80389404296875, "global_step": 177566, "epoch": 2139} {"train_loss": -23.5252685546875, "global_step": 177567, "epoch": 2139} {"train_loss": -23.86384391784668, "global_step": 177568, "epoch": 2139} {"train_loss": -23.98368263244629, "global_step": 177569, "epoch": 2139} {"train_loss": -23.91716766357422, "global_step": 177570, "epoch": 2139} {"train_loss": -23.839975357055664, "global_step": 177571, "epoch": 2139} {"train_loss": -24.022987365722656, "global_step": 177572, "epoch": 2139} {"train_loss": -23.540498733520508, "global_step": 177573, "epoch": 2139} {"train_loss": -24.31172752380371, "global_step": 177574, "epoch": 2139} {"train_loss": -24.165433883666992, "global_step": 177575, "epoch": 2139} {"train_loss": -23.843515396118164, "global_step": 177576, "epoch": 2139} {"train_loss": -23.705276489257812, "global_step": 177577, "epoch": 2139} {"train_loss": -23.96768569946289, "global_step": 177578, "epoch": 2139} {"train_loss": -23.89405632019043, "global_step": 177579, "epoch": 2139} {"train_loss": -23.967748641967773, "global_step": 177580, "epoch": 2139} {"train_loss": -23.765792846679688, "global_step": 177581, "epoch": 2139} {"train_loss": -24.031024932861328, "global_step": 177582, "epoch": 2139} {"train_loss": -23.71415901184082, "global_step": 177583, "epoch": 2139} {"train_loss": -23.88036346435547, "global_step": 177584, "epoch": 2139} {"train_loss": -23.81917381286621, "global_step": 177585, "epoch": 2139} {"train_loss": -23.617202758789062, "global_step": 177586, "epoch": 2139} {"train_loss": -23.71280288696289, "global_step": 177587, "epoch": 2139} {"train_loss": -23.970083236694336, "global_step": 177588, "epoch": 2139} {"train_loss": -24.029016494750977, "global_step": 177589, "epoch": 2139} {"train_loss": -23.765777587890625, "global_step": 177590, "epoch": 2139} {"train_loss": -23.3389949798584, "global_step": 177591, "epoch": 2139} {"train_loss": -22.908390045166016, "global_step": 177592, "epoch": 2139} {"train_loss": -23.6010799407959, "global_step": 177593, "epoch": 2139} {"train_loss": -22.655166625976562, "global_step": 177594, "epoch": 2139} {"train_loss": -23.406396865844727, "global_step": 177595, "epoch": 2139} {"train_loss": -23.221323013305664, "global_step": 177596, "epoch": 2139} {"train_loss": -23.573104858398438, "global_step": 177597, "epoch": 2139} {"train_loss": -23.519081115722656, "global_step": 177598, "epoch": 2139} {"train_loss": -23.489084243774414, "global_step": 177599, "epoch": 2139} {"train_loss": -23.56565284729004, "global_step": 177600, "epoch": 2139} {"train_loss": -23.641855239868164, "global_step": 177601, "epoch": 2139} {"train_loss": -23.724185943603516, "global_step": 177602, "epoch": 2139} {"train_loss": -23.614669799804688, "global_step": 177603, "epoch": 2139} {"train_loss": -23.639074325561523, "global_step": 177604, "epoch": 2139} {"train_loss": -23.849491119384766, "global_step": 177605, "epoch": 2139} {"train_loss": -23.623580932617188, "global_step": 177606, "epoch": 2139} {"train_loss": -23.41560173034668, "global_step": 177607, "epoch": 2139} {"train_loss": -23.998720169067383, "global_step": 177608, "epoch": 2139} {"train_loss": -23.34518814086914, "global_step": 177609, "epoch": 2139} {"train_loss": -23.368621826171875, "global_step": 177610, "epoch": 2139} {"train_loss": -23.726160049438477, "global_step": 177611, "epoch": 2139} {"train_loss": -23.849885940551758, "global_step": 177612, "epoch": 2139} {"train_loss": -23.771957397460938, "global_step": 177613, "epoch": 2139} {"train_loss": -23.998125076293945, "global_step": 177614, "epoch": 2139} {"train_loss": -23.866012573242188, "global_step": 177615, "epoch": 2139} {"train_loss": -23.90718650817871, "global_step": 177616, "epoch": 2139} {"train_loss": -23.97601890563965, "global_step": 177617, "epoch": 2139} {"train_loss": -23.87939453125, "global_step": 177618, "epoch": 2139} {"train_loss": -23.646917044398297, "global_step": 177619, "epoch": 2139, "val_loss": 6558756.0} {"train_loss": -23.33342933654785, "global_step": 177620, "epoch": 2140} {"train_loss": -23.487966537475586, "global_step": 177621, "epoch": 2140} {"train_loss": -23.5267391204834, "global_step": 177622, "epoch": 2140} {"train_loss": -23.773025512695312, "global_step": 177623, "epoch": 2140} {"train_loss": -23.746864318847656, "global_step": 177624, "epoch": 2140} {"train_loss": -23.891756057739258, "global_step": 177625, "epoch": 2140} {"train_loss": -23.755630493164062, "global_step": 177626, "epoch": 2140} {"train_loss": -23.86121940612793, "global_step": 177627, "epoch": 2140} {"train_loss": -23.660417556762695, "global_step": 177628, "epoch": 2140} {"train_loss": -24.008642196655273, "global_step": 177629, "epoch": 2140} {"train_loss": -23.666975021362305, "global_step": 177630, "epoch": 2140} {"train_loss": -23.717023849487305, "global_step": 177631, "epoch": 2140} {"train_loss": -23.938121795654297, "global_step": 177632, "epoch": 2140} {"train_loss": -24.076528549194336, "global_step": 177633, "epoch": 2140} {"train_loss": -24.00208282470703, "global_step": 177634, "epoch": 2140} {"train_loss": -23.63651466369629, "global_step": 177635, "epoch": 2140} {"train_loss": -24.035226821899414, "global_step": 177636, "epoch": 2140} {"train_loss": -24.066247940063477, "global_step": 177637, "epoch": 2140} {"train_loss": -23.81016731262207, "global_step": 177638, "epoch": 2140} {"train_loss": -23.75933265686035, "global_step": 177639, "epoch": 2140} {"train_loss": -23.262182235717773, "global_step": 177640, "epoch": 2140} {"train_loss": -23.823068618774414, "global_step": 177641, "epoch": 2140} {"train_loss": -23.69512367248535, "global_step": 177642, "epoch": 2140} {"train_loss": -24.1815242767334, "global_step": 177643, "epoch": 2140} {"train_loss": -23.692487716674805, "global_step": 177644, "epoch": 2140} {"train_loss": -24.01827621459961, "global_step": 177645, "epoch": 2140} {"train_loss": -23.95150375366211, "global_step": 177646, "epoch": 2140} {"train_loss": -23.97205924987793, "global_step": 177647, "epoch": 2140} {"train_loss": -23.566513061523438, "global_step": 177648, "epoch": 2140} {"train_loss": -24.125396728515625, "global_step": 177649, "epoch": 2140} {"train_loss": -23.40406608581543, "global_step": 177650, "epoch": 2140} {"train_loss": -23.931894302368164, "global_step": 177651, "epoch": 2140} {"train_loss": -23.774816513061523, "global_step": 177652, "epoch": 2140} {"train_loss": -23.848846435546875, "global_step": 177653, "epoch": 2140} {"train_loss": -23.714405059814453, "global_step": 177654, "epoch": 2140} {"train_loss": -24.012819290161133, "global_step": 177655, "epoch": 2140} {"train_loss": -24.063879013061523, "global_step": 177656, "epoch": 2140} {"train_loss": -23.816516876220703, "global_step": 177657, "epoch": 2140} {"train_loss": -23.57611656188965, "global_step": 177658, "epoch": 2140} {"train_loss": -23.951126098632812, "global_step": 177659, "epoch": 2140} {"train_loss": -23.7435359954834, "global_step": 177660, "epoch": 2140} {"train_loss": -23.77235221862793, "global_step": 177661, "epoch": 2140} {"train_loss": -24.147857666015625, "global_step": 177662, "epoch": 2140} {"train_loss": -23.613636016845703, "global_step": 177663, "epoch": 2140} {"train_loss": -23.966846466064453, "global_step": 177664, "epoch": 2140} {"train_loss": -24.107404708862305, "global_step": 177665, "epoch": 2140} {"train_loss": -23.873859405517578, "global_step": 177666, "epoch": 2140} {"train_loss": -23.664813995361328, "global_step": 177667, "epoch": 2140} {"train_loss": -24.13575553894043, "global_step": 177668, "epoch": 2140} {"train_loss": -23.94658851623535, "global_step": 177669, "epoch": 2140} {"train_loss": -24.21204376220703, "global_step": 177670, "epoch": 2140} {"train_loss": -24.084585189819336, "global_step": 177671, "epoch": 2140} {"train_loss": -23.788095474243164, "global_step": 177672, "epoch": 2140} {"train_loss": -24.087425231933594, "global_step": 177673, "epoch": 2140} {"train_loss": -23.571125030517578, "global_step": 177674, "epoch": 2140} {"train_loss": -24.228271484375, "global_step": 177675, "epoch": 2140} {"train_loss": -23.95449447631836, "global_step": 177676, "epoch": 2140} {"train_loss": -24.028583526611328, "global_step": 177677, "epoch": 2140} {"train_loss": -24.187942504882812, "global_step": 177678, "epoch": 2140} {"train_loss": -24.191869735717773, "global_step": 177679, "epoch": 2140} {"train_loss": -23.868642807006836, "global_step": 177680, "epoch": 2140} {"train_loss": -23.668649673461914, "global_step": 177681, "epoch": 2140} {"train_loss": -23.972135543823242, "global_step": 177682, "epoch": 2140} {"train_loss": -23.887561798095703, "global_step": 177683, "epoch": 2140} {"train_loss": -23.860898971557617, "global_step": 177684, "epoch": 2140} {"train_loss": -23.782360076904297, "global_step": 177685, "epoch": 2140} {"train_loss": -23.168516159057617, "global_step": 177686, "epoch": 2140} {"train_loss": -23.321441650390625, "global_step": 177687, "epoch": 2140} {"train_loss": -23.917930603027344, "global_step": 177688, "epoch": 2140} {"train_loss": -23.51584243774414, "global_step": 177689, "epoch": 2140} {"train_loss": -23.52690315246582, "global_step": 177690, "epoch": 2140} {"train_loss": -23.707509994506836, "global_step": 177691, "epoch": 2140} {"train_loss": -23.77976417541504, "global_step": 177692, "epoch": 2140} {"train_loss": -23.429203033447266, "global_step": 177693, "epoch": 2140} {"train_loss": -23.540603637695312, "global_step": 177694, "epoch": 2140} {"train_loss": -24.02919578552246, "global_step": 177695, "epoch": 2140} {"train_loss": -24.095983505249023, "global_step": 177696, "epoch": 2140} {"train_loss": -23.339746475219727, "global_step": 177697, "epoch": 2140} {"train_loss": -23.838247299194336, "global_step": 177698, "epoch": 2140} {"train_loss": -23.788188934326172, "global_step": 177699, "epoch": 2140} {"train_loss": -23.49960708618164, "global_step": 177700, "epoch": 2140} {"train_loss": -24.209035873413086, "global_step": 177701, "epoch": 2140} {"train_loss": -23.826471236814935, "global_step": 177702, "epoch": 2140, "val_loss": 6434125.0} {"train_loss": -23.31839942932129, "global_step": 177703, "epoch": 2141} {"train_loss": -23.72525405883789, "global_step": 177704, "epoch": 2141} {"train_loss": -23.20977783203125, "global_step": 177705, "epoch": 2141} {"train_loss": -23.387601852416992, "global_step": 177706, "epoch": 2141} {"train_loss": -23.17918586730957, "global_step": 177707, "epoch": 2141} {"train_loss": -23.55423927307129, "global_step": 177708, "epoch": 2141} {"train_loss": -23.34122657775879, "global_step": 177709, "epoch": 2141} {"train_loss": -23.542407989501953, "global_step": 177710, "epoch": 2141} {"train_loss": -23.43751335144043, "global_step": 177711, "epoch": 2141} {"train_loss": -23.38351821899414, "global_step": 177712, "epoch": 2141} {"train_loss": -23.865915298461914, "global_step": 177713, "epoch": 2141} {"train_loss": -23.557998657226562, "global_step": 177714, "epoch": 2141} {"train_loss": -23.785696029663086, "global_step": 177715, "epoch": 2141} {"train_loss": -23.576974868774414, "global_step": 177716, "epoch": 2141} {"train_loss": -23.672372817993164, "global_step": 177717, "epoch": 2141} {"train_loss": -23.6430721282959, "global_step": 177718, "epoch": 2141} {"train_loss": -23.451536178588867, "global_step": 177719, "epoch": 2141} {"train_loss": -23.862768173217773, "global_step": 177720, "epoch": 2141} {"train_loss": -23.7104549407959, "global_step": 177721, "epoch": 2141} {"train_loss": -23.591276168823242, "global_step": 177722, "epoch": 2141} {"train_loss": -23.451953887939453, "global_step": 177723, "epoch": 2141} {"train_loss": -23.421939849853516, "global_step": 177724, "epoch": 2141} {"train_loss": -23.507436752319336, "global_step": 177725, "epoch": 2141} {"train_loss": -23.756818771362305, "global_step": 177726, "epoch": 2141} {"train_loss": -23.596176147460938, "global_step": 177727, "epoch": 2141} {"train_loss": -23.6185359954834, "global_step": 177728, "epoch": 2141} {"train_loss": -23.791536331176758, "global_step": 177729, "epoch": 2141} {"train_loss": -24.004005432128906, "global_step": 177730, "epoch": 2141} {"train_loss": -23.887205123901367, "global_step": 177731, "epoch": 2141} {"train_loss": -23.898550033569336, "global_step": 177732, "epoch": 2141} {"train_loss": -24.103515625, "global_step": 177733, "epoch": 2141} {"train_loss": -23.585912704467773, "global_step": 177734, "epoch": 2141} {"train_loss": -24.1953067779541, "global_step": 177735, "epoch": 2141} {"train_loss": -23.903676986694336, "global_step": 177736, "epoch": 2141} {"train_loss": -23.423940658569336, "global_step": 177737, "epoch": 2141} {"train_loss": -23.905078887939453, "global_step": 177738, "epoch": 2141} {"train_loss": -24.005935668945312, "global_step": 177739, "epoch": 2141} {"train_loss": -24.056106567382812, "global_step": 177740, "epoch": 2141} {"train_loss": -23.95521354675293, "global_step": 177741, "epoch": 2141} {"train_loss": -23.778839111328125, "global_step": 177742, "epoch": 2141} {"train_loss": -23.849519729614258, "global_step": 177743, "epoch": 2141} {"train_loss": -23.740060806274414, "global_step": 177744, "epoch": 2141} {"train_loss": -23.5655574798584, "global_step": 177745, "epoch": 2141} {"train_loss": -23.758169174194336, "global_step": 177746, "epoch": 2141} {"train_loss": -24.09710121154785, "global_step": 177747, "epoch": 2141} {"train_loss": -23.70162010192871, "global_step": 177748, "epoch": 2141} {"train_loss": -24.240026473999023, "global_step": 177749, "epoch": 2141} {"train_loss": -24.016401290893555, "global_step": 177750, "epoch": 2141} {"train_loss": -23.848594665527344, "global_step": 177751, "epoch": 2141} {"train_loss": -23.413333892822266, "global_step": 177752, "epoch": 2141} {"train_loss": -23.956710815429688, "global_step": 177753, "epoch": 2141} {"train_loss": -23.973073959350586, "global_step": 177754, "epoch": 2141} {"train_loss": -23.729475021362305, "global_step": 177755, "epoch": 2141} {"train_loss": -23.821714401245117, "global_step": 177756, "epoch": 2141} {"train_loss": -23.880931854248047, "global_step": 177757, "epoch": 2141} {"train_loss": -23.462905883789062, "global_step": 177758, "epoch": 2141} {"train_loss": -23.537939071655273, "global_step": 177759, "epoch": 2141} {"train_loss": -23.315853118896484, "global_step": 177760, "epoch": 2141} {"train_loss": -24.170764923095703, "global_step": 177761, "epoch": 2141} {"train_loss": -23.724002838134766, "global_step": 177762, "epoch": 2141} {"train_loss": -23.550954818725586, "global_step": 177763, "epoch": 2141} {"train_loss": -23.815500259399414, "global_step": 177764, "epoch": 2141} {"train_loss": -23.928651809692383, "global_step": 177765, "epoch": 2141} {"train_loss": -23.813032150268555, "global_step": 177766, "epoch": 2141} {"train_loss": -23.165477752685547, "global_step": 177767, "epoch": 2141} {"train_loss": -23.929044723510742, "global_step": 177768, "epoch": 2141} {"train_loss": -23.544240951538086, "global_step": 177769, "epoch": 2141} {"train_loss": -23.94984245300293, "global_step": 177770, "epoch": 2141} {"train_loss": -23.774290084838867, "global_step": 177771, "epoch": 2141} {"train_loss": -23.84131622314453, "global_step": 177772, "epoch": 2141} {"train_loss": -23.631988525390625, "global_step": 177773, "epoch": 2141} {"train_loss": -23.6734676361084, "global_step": 177774, "epoch": 2141} {"train_loss": -23.84479522705078, "global_step": 177775, "epoch": 2141} {"train_loss": -24.100963592529297, "global_step": 177776, "epoch": 2141} {"train_loss": -23.975961685180664, "global_step": 177777, "epoch": 2141} {"train_loss": -24.259571075439453, "global_step": 177778, "epoch": 2141} {"train_loss": -23.926271438598633, "global_step": 177779, "epoch": 2141} {"train_loss": -23.8508243560791, "global_step": 177780, "epoch": 2141} {"train_loss": -23.542224884033203, "global_step": 177781, "epoch": 2141} {"train_loss": -23.612533569335938, "global_step": 177782, "epoch": 2141} {"train_loss": -23.57221031188965, "global_step": 177783, "epoch": 2141} {"train_loss": -23.855432510375977, "global_step": 177784, "epoch": 2141} {"train_loss": -23.721453999898518, "global_step": 177785, "epoch": 2141, "val_loss": 6470438.0} {"train_loss": -23.308807373046875, "global_step": 177786, "epoch": 2142} {"train_loss": -23.180097579956055, "global_step": 177787, "epoch": 2142} {"train_loss": -23.575916290283203, "global_step": 177788, "epoch": 2142} {"train_loss": -23.65956687927246, "global_step": 177789, "epoch": 2142} {"train_loss": -23.185672760009766, "global_step": 177790, "epoch": 2142} {"train_loss": -23.693593978881836, "global_step": 177791, "epoch": 2142} {"train_loss": -23.631433486938477, "global_step": 177792, "epoch": 2142} {"train_loss": -23.590225219726562, "global_step": 177793, "epoch": 2142} {"train_loss": -23.40937042236328, "global_step": 177794, "epoch": 2142} {"train_loss": -23.405942916870117, "global_step": 177795, "epoch": 2142} {"train_loss": -23.657291412353516, "global_step": 177796, "epoch": 2142} {"train_loss": -23.46262550354004, "global_step": 177797, "epoch": 2142} {"train_loss": -23.977766036987305, "global_step": 177798, "epoch": 2142} {"train_loss": -23.524747848510742, "global_step": 177799, "epoch": 2142} {"train_loss": -23.939136505126953, "global_step": 177800, "epoch": 2142} {"train_loss": -23.665668487548828, "global_step": 177801, "epoch": 2142} {"train_loss": -23.86626434326172, "global_step": 177802, "epoch": 2142} {"train_loss": -23.99041175842285, "global_step": 177803, "epoch": 2142} {"train_loss": -23.82610321044922, "global_step": 177804, "epoch": 2142} {"train_loss": -23.765207290649414, "global_step": 177805, "epoch": 2142} {"train_loss": -23.890348434448242, "global_step": 177806, "epoch": 2142} {"train_loss": -23.9204158782959, "global_step": 177807, "epoch": 2142} {"train_loss": -23.36954689025879, "global_step": 177808, "epoch": 2142} {"train_loss": -23.392175674438477, "global_step": 177809, "epoch": 2142} {"train_loss": -24.0049991607666, "global_step": 177810, "epoch": 2142} {"train_loss": -23.901159286499023, "global_step": 177811, "epoch": 2142} {"train_loss": -23.87537956237793, "global_step": 177812, "epoch": 2142} {"train_loss": -23.971681594848633, "global_step": 177813, "epoch": 2142} {"train_loss": -24.18686866760254, "global_step": 177814, "epoch": 2142} {"train_loss": -23.78608512878418, "global_step": 177815, "epoch": 2142} {"train_loss": -24.0650691986084, "global_step": 177816, "epoch": 2142} {"train_loss": -23.92568588256836, "global_step": 177817, "epoch": 2142} {"train_loss": -23.752635955810547, "global_step": 177818, "epoch": 2142} {"train_loss": -23.968931198120117, "global_step": 177819, "epoch": 2142} {"train_loss": -24.127883911132812, "global_step": 177820, "epoch": 2142} {"train_loss": -23.882856369018555, "global_step": 177821, "epoch": 2142} {"train_loss": -24.03923988342285, "global_step": 177822, "epoch": 2142} {"train_loss": -23.7563419342041, "global_step": 177823, "epoch": 2142} {"train_loss": -23.815902709960938, "global_step": 177824, "epoch": 2142} {"train_loss": -23.798908233642578, "global_step": 177825, "epoch": 2142} {"train_loss": -24.12386703491211, "global_step": 177826, "epoch": 2142} {"train_loss": -24.190099716186523, "global_step": 177827, "epoch": 2142} {"train_loss": -24.173437118530273, "global_step": 177828, "epoch": 2142} {"train_loss": -23.878250122070312, "global_step": 177829, "epoch": 2142} {"train_loss": -23.66670799255371, "global_step": 177830, "epoch": 2142} {"train_loss": -24.303054809570312, "global_step": 177831, "epoch": 2142} {"train_loss": -23.982994079589844, "global_step": 177832, "epoch": 2142} {"train_loss": -23.572813034057617, "global_step": 177833, "epoch": 2142} {"train_loss": -23.19399070739746, "global_step": 177834, "epoch": 2142} {"train_loss": -23.249881744384766, "global_step": 177835, "epoch": 2142} {"train_loss": -23.475200653076172, "global_step": 177836, "epoch": 2142} {"train_loss": -23.819738388061523, "global_step": 177837, "epoch": 2142} {"train_loss": -23.769493103027344, "global_step": 177838, "epoch": 2142} {"train_loss": -23.73902130126953, "global_step": 177839, "epoch": 2142} {"train_loss": -23.90205192565918, "global_step": 177840, "epoch": 2142} {"train_loss": -23.641664505004883, "global_step": 177841, "epoch": 2142} {"train_loss": -23.451860427856445, "global_step": 177842, "epoch": 2142} {"train_loss": -23.650909423828125, "global_step": 177843, "epoch": 2142} {"train_loss": -24.256994247436523, "global_step": 177844, "epoch": 2142} {"train_loss": -23.413623809814453, "global_step": 177845, "epoch": 2142} {"train_loss": -23.91084861755371, "global_step": 177846, "epoch": 2142} {"train_loss": -23.93293571472168, "global_step": 177847, "epoch": 2142} {"train_loss": -23.760009765625, "global_step": 177848, "epoch": 2142} {"train_loss": -23.648054122924805, "global_step": 177849, "epoch": 2142} {"train_loss": -24.007675170898438, "global_step": 177850, "epoch": 2142} {"train_loss": -23.699363708496094, "global_step": 177851, "epoch": 2142} {"train_loss": -23.72071647644043, "global_step": 177852, "epoch": 2142} {"train_loss": -23.630826950073242, "global_step": 177853, "epoch": 2142} {"train_loss": -23.610572814941406, "global_step": 177854, "epoch": 2142} {"train_loss": -23.930509567260742, "global_step": 177855, "epoch": 2142} {"train_loss": -23.694190979003906, "global_step": 177856, "epoch": 2142} {"train_loss": -23.610998153686523, "global_step": 177857, "epoch": 2142} {"train_loss": -24.317745208740234, "global_step": 177858, "epoch": 2142} {"train_loss": -23.76624870300293, "global_step": 177859, "epoch": 2142} {"train_loss": -23.600553512573242, "global_step": 177860, "epoch": 2142} {"train_loss": -23.91896629333496, "global_step": 177861, "epoch": 2142} {"train_loss": -24.016284942626953, "global_step": 177862, "epoch": 2142} {"train_loss": -24.12148094177246, "global_step": 177863, "epoch": 2142} {"train_loss": -23.855804443359375, "global_step": 177864, "epoch": 2142} {"train_loss": -24.089929580688477, "global_step": 177865, "epoch": 2142} {"train_loss": -23.898115158081055, "global_step": 177866, "epoch": 2142} {"train_loss": -24.005294799804688, "global_step": 177867, "epoch": 2142} {"train_loss": -23.78611957596009, "global_step": 177868, "epoch": 2142, "val_loss": 6420342.0} {"train_loss": -23.42520523071289, "global_step": 177869, "epoch": 2143} {"train_loss": -23.198585510253906, "global_step": 177870, "epoch": 2143} {"train_loss": -23.457035064697266, "global_step": 177871, "epoch": 2143} {"train_loss": -23.59847068786621, "global_step": 177872, "epoch": 2143} {"train_loss": -23.48383140563965, "global_step": 177873, "epoch": 2143} {"train_loss": -23.549848556518555, "global_step": 177874, "epoch": 2143} {"train_loss": -23.72292137145996, "global_step": 177875, "epoch": 2143} {"train_loss": -23.958343505859375, "global_step": 177876, "epoch": 2143} {"train_loss": -23.815885543823242, "global_step": 177877, "epoch": 2143} {"train_loss": -23.51105308532715, "global_step": 177878, "epoch": 2143} {"train_loss": -23.846878051757812, "global_step": 177879, "epoch": 2143} {"train_loss": -23.74015235900879, "global_step": 177880, "epoch": 2143} {"train_loss": -23.75278091430664, "global_step": 177881, "epoch": 2143} {"train_loss": -23.562652587890625, "global_step": 177882, "epoch": 2143} {"train_loss": -23.653213500976562, "global_step": 177883, "epoch": 2143} {"train_loss": -23.591466903686523, "global_step": 177884, "epoch": 2143} {"train_loss": -23.721670150756836, "global_step": 177885, "epoch": 2143} {"train_loss": -23.43701171875, "global_step": 177886, "epoch": 2143} {"train_loss": -23.787588119506836, "global_step": 177887, "epoch": 2143} {"train_loss": -23.450117111206055, "global_step": 177888, "epoch": 2143} {"train_loss": -23.588092803955078, "global_step": 177889, "epoch": 2143} {"train_loss": -23.77248764038086, "global_step": 177890, "epoch": 2143} {"train_loss": -23.668073654174805, "global_step": 177891, "epoch": 2143} {"train_loss": -23.983917236328125, "global_step": 177892, "epoch": 2143} {"train_loss": -23.98525047302246, "global_step": 177893, "epoch": 2143} {"train_loss": -23.745702743530273, "global_step": 177894, "epoch": 2143} {"train_loss": -23.990949630737305, "global_step": 177895, "epoch": 2143} {"train_loss": -23.923032760620117, "global_step": 177896, "epoch": 2143} {"train_loss": -23.652196884155273, "global_step": 177897, "epoch": 2143} {"train_loss": -23.762327194213867, "global_step": 177898, "epoch": 2143} {"train_loss": -23.58504295349121, "global_step": 177899, "epoch": 2143} {"train_loss": -23.4394588470459, "global_step": 177900, "epoch": 2143} {"train_loss": -23.7319393157959, "global_step": 177901, "epoch": 2143} {"train_loss": -24.014745712280273, "global_step": 177902, "epoch": 2143} {"train_loss": -23.713565826416016, "global_step": 177903, "epoch": 2143} {"train_loss": -23.789823532104492, "global_step": 177904, "epoch": 2143} {"train_loss": -23.892099380493164, "global_step": 177905, "epoch": 2143} {"train_loss": -24.10784339904785, "global_step": 177906, "epoch": 2143} {"train_loss": -23.546977996826172, "global_step": 177907, "epoch": 2143} {"train_loss": -23.806514739990234, "global_step": 177908, "epoch": 2143} {"train_loss": -23.98537254333496, "global_step": 177909, "epoch": 2143} {"train_loss": -23.937068939208984, "global_step": 177910, "epoch": 2143} {"train_loss": -23.96662712097168, "global_step": 177911, "epoch": 2143} {"train_loss": -23.923627853393555, "global_step": 177912, "epoch": 2143} {"train_loss": -23.9599666595459, "global_step": 177913, "epoch": 2143} {"train_loss": -23.976728439331055, "global_step": 177914, "epoch": 2143} {"train_loss": -24.01254653930664, "global_step": 177915, "epoch": 2143} {"train_loss": -23.938154220581055, "global_step": 177916, "epoch": 2143} {"train_loss": -23.965435028076172, "global_step": 177917, "epoch": 2143} {"train_loss": -23.979507446289062, "global_step": 177918, "epoch": 2143} {"train_loss": -23.706666946411133, "global_step": 177919, "epoch": 2143} {"train_loss": -23.91025733947754, "global_step": 177920, "epoch": 2143} {"train_loss": -23.83946418762207, "global_step": 177921, "epoch": 2143} {"train_loss": -23.89747428894043, "global_step": 177922, "epoch": 2143} {"train_loss": -23.792573928833008, "global_step": 177923, "epoch": 2143} {"train_loss": -23.58379554748535, "global_step": 177924, "epoch": 2143} {"train_loss": -24.041481018066406, "global_step": 177925, "epoch": 2143} {"train_loss": -23.775266647338867, "global_step": 177926, "epoch": 2143} {"train_loss": -23.60607147216797, "global_step": 177927, "epoch": 2143} {"train_loss": -23.933805465698242, "global_step": 177928, "epoch": 2143} {"train_loss": -23.61370086669922, "global_step": 177929, "epoch": 2143} {"train_loss": -23.95198631286621, "global_step": 177930, "epoch": 2143} {"train_loss": -23.748132705688477, "global_step": 177931, "epoch": 2143} {"train_loss": -23.789213180541992, "global_step": 177932, "epoch": 2143} {"train_loss": -23.998319625854492, "global_step": 177933, "epoch": 2143} {"train_loss": -23.68623924255371, "global_step": 177934, "epoch": 2143} {"train_loss": -24.000429153442383, "global_step": 177935, "epoch": 2143} {"train_loss": -24.079675674438477, "global_step": 177936, "epoch": 2143} {"train_loss": -23.877685546875, "global_step": 177937, "epoch": 2143} {"train_loss": -24.185274124145508, "global_step": 177938, "epoch": 2143} {"train_loss": -23.581937789916992, "global_step": 177939, "epoch": 2143} {"train_loss": -24.020322799682617, "global_step": 177940, "epoch": 2143} {"train_loss": -23.828201293945312, "global_step": 177941, "epoch": 2143} {"train_loss": -23.91614532470703, "global_step": 177942, "epoch": 2143} {"train_loss": -23.811370849609375, "global_step": 177943, "epoch": 2143} {"train_loss": -24.26219940185547, "global_step": 177944, "epoch": 2143} {"train_loss": -23.806259155273438, "global_step": 177945, "epoch": 2143} {"train_loss": -24.109708786010742, "global_step": 177946, "epoch": 2143} {"train_loss": -24.017684936523438, "global_step": 177947, "epoch": 2143} {"train_loss": -23.907821655273438, "global_step": 177948, "epoch": 2143} {"train_loss": -24.211620330810547, "global_step": 177949, "epoch": 2143} {"train_loss": -23.620574951171875, "global_step": 177950, "epoch": 2143} {"train_loss": -23.809010586106634, "global_step": 177951, "epoch": 2143, "val_loss": 6423335.0} {"train_loss": -23.389005661010742, "global_step": 177952, "epoch": 2144} {"train_loss": -22.348669052124023, "global_step": 177953, "epoch": 2144} {"train_loss": -22.335790634155273, "global_step": 177954, "epoch": 2144} {"train_loss": -23.417699813842773, "global_step": 177955, "epoch": 2144} {"train_loss": -23.594785690307617, "global_step": 177956, "epoch": 2144} {"train_loss": -23.059707641601562, "global_step": 177957, "epoch": 2144} {"train_loss": -23.300657272338867, "global_step": 177958, "epoch": 2144} {"train_loss": -23.326841354370117, "global_step": 177959, "epoch": 2144} {"train_loss": -23.092029571533203, "global_step": 177960, "epoch": 2144} {"train_loss": -23.540699005126953, "global_step": 177961, "epoch": 2144} {"train_loss": -23.274991989135742, "global_step": 177962, "epoch": 2144} {"train_loss": -23.755661010742188, "global_step": 177963, "epoch": 2144} {"train_loss": -23.539236068725586, "global_step": 177964, "epoch": 2144} {"train_loss": -23.793859481811523, "global_step": 177965, "epoch": 2144} {"train_loss": -23.365446090698242, "global_step": 177966, "epoch": 2144} {"train_loss": -23.826190948486328, "global_step": 177967, "epoch": 2144} {"train_loss": -23.503341674804688, "global_step": 177968, "epoch": 2144} {"train_loss": -23.724721908569336, "global_step": 177969, "epoch": 2144} {"train_loss": -23.688411712646484, "global_step": 177970, "epoch": 2144} {"train_loss": -23.69239616394043, "global_step": 177971, "epoch": 2144} {"train_loss": -23.767499923706055, "global_step": 177972, "epoch": 2144} {"train_loss": -23.80902671813965, "global_step": 177973, "epoch": 2144} {"train_loss": -24.03696060180664, "global_step": 177974, "epoch": 2144} {"train_loss": -23.613014221191406, "global_step": 177975, "epoch": 2144} {"train_loss": -23.97214698791504, "global_step": 177976, "epoch": 2144} {"train_loss": -23.681604385375977, "global_step": 177977, "epoch": 2144} {"train_loss": -23.78922462463379, "global_step": 177978, "epoch": 2144} {"train_loss": -23.830158233642578, "global_step": 177979, "epoch": 2144} {"train_loss": -24.26495361328125, "global_step": 177980, "epoch": 2144} {"train_loss": -24.147186279296875, "global_step": 177981, "epoch": 2144} {"train_loss": -23.78045082092285, "global_step": 177982, "epoch": 2144} {"train_loss": -24.269445419311523, "global_step": 177983, "epoch": 2144} {"train_loss": -24.0610408782959, "global_step": 177984, "epoch": 2144} {"train_loss": -24.150476455688477, "global_step": 177985, "epoch": 2144} {"train_loss": -23.68230628967285, "global_step": 177986, "epoch": 2144} {"train_loss": -24.344192504882812, "global_step": 177987, "epoch": 2144} {"train_loss": -23.701913833618164, "global_step": 177988, "epoch": 2144} {"train_loss": -24.147796630859375, "global_step": 177989, "epoch": 2144} {"train_loss": -24.096038818359375, "global_step": 177990, "epoch": 2144} {"train_loss": -23.83734703063965, "global_step": 177991, "epoch": 2144} {"train_loss": -23.92520523071289, "global_step": 177992, "epoch": 2144} {"train_loss": -24.191171646118164, "global_step": 177993, "epoch": 2144} {"train_loss": -23.71807289123535, "global_step": 177994, "epoch": 2144} {"train_loss": -23.665088653564453, "global_step": 177995, "epoch": 2144} {"train_loss": -23.625720977783203, "global_step": 177996, "epoch": 2144} {"train_loss": -23.968812942504883, "global_step": 177997, "epoch": 2144} {"train_loss": -23.676481246948242, "global_step": 177998, "epoch": 2144} {"train_loss": -23.5517578125, "global_step": 177999, "epoch": 2144} {"train_loss": -23.874420166015625, "global_step": 178000, "epoch": 2144} {"train_loss": -23.65884780883789, "global_step": 178001, "epoch": 2144} {"train_loss": -23.72898292541504, "global_step": 178002, "epoch": 2144} {"train_loss": -23.743253707885742, "global_step": 178003, "epoch": 2144} {"train_loss": -23.907270431518555, "global_step": 178004, "epoch": 2144} {"train_loss": -23.791845321655273, "global_step": 178005, "epoch": 2144} {"train_loss": -23.877805709838867, "global_step": 178006, "epoch": 2144} {"train_loss": -23.562911987304688, "global_step": 178007, "epoch": 2144} {"train_loss": -24.30843734741211, "global_step": 178008, "epoch": 2144} {"train_loss": -23.604658126831055, "global_step": 178009, "epoch": 2144} {"train_loss": -23.795047760009766, "global_step": 178010, "epoch": 2144} {"train_loss": -23.763303756713867, "global_step": 178011, "epoch": 2144} {"train_loss": -23.670896530151367, "global_step": 178012, "epoch": 2144} {"train_loss": -24.021650314331055, "global_step": 178013, "epoch": 2144} {"train_loss": -23.952356338500977, "global_step": 178014, "epoch": 2144} {"train_loss": -23.935415267944336, "global_step": 178015, "epoch": 2144} {"train_loss": -24.06563949584961, "global_step": 178016, "epoch": 2144} {"train_loss": -23.8018856048584, "global_step": 178017, "epoch": 2144} {"train_loss": -24.099533081054688, "global_step": 178018, "epoch": 2144} {"train_loss": -23.769792556762695, "global_step": 178019, "epoch": 2144} {"train_loss": -23.930219650268555, "global_step": 178020, "epoch": 2144} {"train_loss": -24.234426498413086, "global_step": 178021, "epoch": 2144} {"train_loss": -24.153013229370117, "global_step": 178022, "epoch": 2144} {"train_loss": -23.901288986206055, "global_step": 178023, "epoch": 2144} {"train_loss": -24.006765365600586, "global_step": 178024, "epoch": 2144} {"train_loss": -24.107711791992188, "global_step": 178025, "epoch": 2144} {"train_loss": -24.238855361938477, "global_step": 178026, "epoch": 2144} {"train_loss": -23.787723541259766, "global_step": 178027, "epoch": 2144} {"train_loss": -23.823938369750977, "global_step": 178028, "epoch": 2144} {"train_loss": -23.776586532592773, "global_step": 178029, "epoch": 2144} {"train_loss": -23.744977951049805, "global_step": 178030, "epoch": 2144} {"train_loss": -23.945112228393555, "global_step": 178031, "epoch": 2144} {"train_loss": -23.89576530456543, "global_step": 178032, "epoch": 2144} {"train_loss": -23.865346908569336, "global_step": 178033, "epoch": 2144} {"train_loss": -23.77310470213373, "global_step": 178034, "epoch": 2144, "val_loss": 6487598.0} {"train_loss": -23.013486862182617, "global_step": 178035, "epoch": 2145} {"train_loss": -22.983949661254883, "global_step": 178036, "epoch": 2145} {"train_loss": -22.67842674255371, "global_step": 178037, "epoch": 2145} {"train_loss": -23.367399215698242, "global_step": 178038, "epoch": 2145} {"train_loss": -22.849227905273438, "global_step": 178039, "epoch": 2145} {"train_loss": -22.959630966186523, "global_step": 178040, "epoch": 2145} {"train_loss": -23.20199966430664, "global_step": 178041, "epoch": 2145} {"train_loss": -23.632923126220703, "global_step": 178042, "epoch": 2145} {"train_loss": -23.39626121520996, "global_step": 178043, "epoch": 2145} {"train_loss": -23.552377700805664, "global_step": 178044, "epoch": 2145} {"train_loss": -23.271203994750977, "global_step": 178045, "epoch": 2145} {"train_loss": -23.596359252929688, "global_step": 178046, "epoch": 2145} {"train_loss": -23.711713790893555, "global_step": 178047, "epoch": 2145} {"train_loss": -23.45163345336914, "global_step": 178048, "epoch": 2145} {"train_loss": -23.632606506347656, "global_step": 178049, "epoch": 2145} {"train_loss": -23.33899688720703, "global_step": 178050, "epoch": 2145} {"train_loss": -23.59004783630371, "global_step": 178051, "epoch": 2145} {"train_loss": -23.78312110900879, "global_step": 178052, "epoch": 2145} {"train_loss": -23.598773956298828, "global_step": 178053, "epoch": 2145} {"train_loss": -23.572139739990234, "global_step": 178054, "epoch": 2145} {"train_loss": -23.80793571472168, "global_step": 178055, "epoch": 2145} {"train_loss": -23.728891372680664, "global_step": 178056, "epoch": 2145} {"train_loss": -23.57078742980957, "global_step": 178057, "epoch": 2145} {"train_loss": -23.973852157592773, "global_step": 178058, "epoch": 2145} {"train_loss": -23.806955337524414, "global_step": 178059, "epoch": 2145} {"train_loss": -23.956220626831055, "global_step": 178060, "epoch": 2145} {"train_loss": -23.658185958862305, "global_step": 178061, "epoch": 2145} {"train_loss": -23.889516830444336, "global_step": 178062, "epoch": 2145} {"train_loss": -24.040685653686523, "global_step": 178063, "epoch": 2145} {"train_loss": -24.012920379638672, "global_step": 178064, "epoch": 2145} {"train_loss": -23.88783073425293, "global_step": 178065, "epoch": 2145} {"train_loss": -23.599197387695312, "global_step": 178066, "epoch": 2145} {"train_loss": -23.67951774597168, "global_step": 178067, "epoch": 2145} {"train_loss": -24.060598373413086, "global_step": 178068, "epoch": 2145} {"train_loss": -24.240537643432617, "global_step": 178069, "epoch": 2145} {"train_loss": -23.57166862487793, "global_step": 178070, "epoch": 2145} {"train_loss": -24.113924026489258, "global_step": 178071, "epoch": 2145} {"train_loss": -23.699981689453125, "global_step": 178072, "epoch": 2145} {"train_loss": -23.749921798706055, "global_step": 178073, "epoch": 2145} {"train_loss": -23.984390258789062, "global_step": 178074, "epoch": 2145} {"train_loss": -24.082738876342773, "global_step": 178075, "epoch": 2145} {"train_loss": -23.954973220825195, "global_step": 178076, "epoch": 2145} {"train_loss": -24.030248641967773, "global_step": 178077, "epoch": 2145} {"train_loss": -23.73727035522461, "global_step": 178078, "epoch": 2145} {"train_loss": -23.910078048706055, "global_step": 178079, "epoch": 2145} {"train_loss": -23.45659828186035, "global_step": 178080, "epoch": 2145} {"train_loss": -23.341367721557617, "global_step": 178081, "epoch": 2145} {"train_loss": -23.56770896911621, "global_step": 178082, "epoch": 2145} {"train_loss": -23.816970825195312, "global_step": 178083, "epoch": 2145} {"train_loss": -23.679794311523438, "global_step": 178084, "epoch": 2145} {"train_loss": -23.74079132080078, "global_step": 178085, "epoch": 2145} {"train_loss": -23.909902572631836, "global_step": 178086, "epoch": 2145} {"train_loss": -23.62643051147461, "global_step": 178087, "epoch": 2145} {"train_loss": -24.0692138671875, "global_step": 178088, "epoch": 2145} {"train_loss": -24.244470596313477, "global_step": 178089, "epoch": 2145} {"train_loss": -23.785322189331055, "global_step": 178090, "epoch": 2145} {"train_loss": -23.94243812561035, "global_step": 178091, "epoch": 2145} {"train_loss": -23.491384506225586, "global_step": 178092, "epoch": 2145} {"train_loss": -23.683950424194336, "global_step": 178093, "epoch": 2145} {"train_loss": -23.90420150756836, "global_step": 178094, "epoch": 2145} {"train_loss": -23.404516220092773, "global_step": 178095, "epoch": 2145} {"train_loss": -24.005155563354492, "global_step": 178096, "epoch": 2145} {"train_loss": -23.78202247619629, "global_step": 178097, "epoch": 2145} {"train_loss": -23.966279983520508, "global_step": 178098, "epoch": 2145} {"train_loss": -23.569538116455078, "global_step": 178099, "epoch": 2145} {"train_loss": -23.18918800354004, "global_step": 178100, "epoch": 2145} {"train_loss": -23.846044540405273, "global_step": 178101, "epoch": 2145} {"train_loss": -23.78658676147461, "global_step": 178102, "epoch": 2145} {"train_loss": -23.040481567382812, "global_step": 178103, "epoch": 2145} {"train_loss": -23.601123809814453, "global_step": 178104, "epoch": 2145} {"train_loss": -23.252893447875977, "global_step": 178105, "epoch": 2145} {"train_loss": -23.663175582885742, "global_step": 178106, "epoch": 2145} {"train_loss": -23.706735610961914, "global_step": 178107, "epoch": 2145} {"train_loss": -23.19666862487793, "global_step": 178108, "epoch": 2145} {"train_loss": -23.931982040405273, "global_step": 178109, "epoch": 2145} {"train_loss": -23.689878463745117, "global_step": 178110, "epoch": 2145} {"train_loss": -23.65726661682129, "global_step": 178111, "epoch": 2145} {"train_loss": -23.671030044555664, "global_step": 178112, "epoch": 2145} {"train_loss": -23.621240615844727, "global_step": 178113, "epoch": 2145} {"train_loss": -23.595548629760742, "global_step": 178114, "epoch": 2145} {"train_loss": -23.407949447631836, "global_step": 178115, "epoch": 2145} {"train_loss": -23.812515258789062, "global_step": 178116, "epoch": 2145} {"train_loss": -23.65704952377871, "global_step": 178117, "epoch": 2145, "val_loss": 6490165.0} {"train_loss": -23.83639907836914, "global_step": 178118, "epoch": 2146} {"train_loss": -23.558286666870117, "global_step": 178119, "epoch": 2146} {"train_loss": -23.456937789916992, "global_step": 178120, "epoch": 2146} {"train_loss": -23.256128311157227, "global_step": 178121, "epoch": 2146} {"train_loss": -23.51392364501953, "global_step": 178122, "epoch": 2146} {"train_loss": -23.809253692626953, "global_step": 178123, "epoch": 2146} {"train_loss": -23.711597442626953, "global_step": 178124, "epoch": 2146} {"train_loss": -23.678409576416016, "global_step": 178125, "epoch": 2146} {"train_loss": -23.56315040588379, "global_step": 178126, "epoch": 2146} {"train_loss": -23.829910278320312, "global_step": 178127, "epoch": 2146} {"train_loss": -23.398954391479492, "global_step": 178128, "epoch": 2146} {"train_loss": -23.503692626953125, "global_step": 178129, "epoch": 2146} {"train_loss": -24.094785690307617, "global_step": 178130, "epoch": 2146} {"train_loss": -23.913925170898438, "global_step": 178131, "epoch": 2146} {"train_loss": -23.67019271850586, "global_step": 178132, "epoch": 2146} {"train_loss": -24.01163101196289, "global_step": 178133, "epoch": 2146} {"train_loss": -23.853199005126953, "global_step": 178134, "epoch": 2146} {"train_loss": -23.68621826171875, "global_step": 178135, "epoch": 2146} {"train_loss": -23.85966682434082, "global_step": 178136, "epoch": 2146} {"train_loss": -24.226627349853516, "global_step": 178137, "epoch": 2146} {"train_loss": -23.714651107788086, "global_step": 178138, "epoch": 2146} {"train_loss": -23.88302993774414, "global_step": 178139, "epoch": 2146} {"train_loss": -23.773359298706055, "global_step": 178140, "epoch": 2146} {"train_loss": -24.08600616455078, "global_step": 178141, "epoch": 2146} {"train_loss": -24.011486053466797, "global_step": 178142, "epoch": 2146} {"train_loss": -23.895038604736328, "global_step": 178143, "epoch": 2146} {"train_loss": -23.832555770874023, "global_step": 178144, "epoch": 2146} {"train_loss": -23.871328353881836, "global_step": 178145, "epoch": 2146} {"train_loss": -24.16744041442871, "global_step": 178146, "epoch": 2146} {"train_loss": -24.162702560424805, "global_step": 178147, "epoch": 2146} {"train_loss": -23.566431045532227, "global_step": 178148, "epoch": 2146} {"train_loss": -23.639511108398438, "global_step": 178149, "epoch": 2146} {"train_loss": -23.894498825073242, "global_step": 178150, "epoch": 2146} {"train_loss": -24.02606773376465, "global_step": 178151, "epoch": 2146} {"train_loss": -23.500682830810547, "global_step": 178152, "epoch": 2146} {"train_loss": -24.1650447845459, "global_step": 178153, "epoch": 2146} {"train_loss": -23.572650909423828, "global_step": 178154, "epoch": 2146} {"train_loss": -23.563339233398438, "global_step": 178155, "epoch": 2146} {"train_loss": -23.60411262512207, "global_step": 178156, "epoch": 2146} {"train_loss": -23.90186882019043, "global_step": 178157, "epoch": 2146} {"train_loss": -23.90407371520996, "global_step": 178158, "epoch": 2146} {"train_loss": -23.66238021850586, "global_step": 178159, "epoch": 2146} {"train_loss": -24.066030502319336, "global_step": 178160, "epoch": 2146} {"train_loss": -24.00213050842285, "global_step": 178161, "epoch": 2146} {"train_loss": -23.687753677368164, "global_step": 178162, "epoch": 2146} {"train_loss": -23.872270584106445, "global_step": 178163, "epoch": 2146} {"train_loss": -23.606985092163086, "global_step": 178164, "epoch": 2146} {"train_loss": -23.916269302368164, "global_step": 178165, "epoch": 2146} {"train_loss": -24.005422592163086, "global_step": 178166, "epoch": 2146} {"train_loss": -23.820837020874023, "global_step": 178167, "epoch": 2146} {"train_loss": -23.675317764282227, "global_step": 178168, "epoch": 2146} {"train_loss": -23.75674819946289, "global_step": 178169, "epoch": 2146} {"train_loss": -23.621610641479492, "global_step": 178170, "epoch": 2146} {"train_loss": -24.13556480407715, "global_step": 178171, "epoch": 2146} {"train_loss": -23.660633087158203, "global_step": 178172, "epoch": 2146} {"train_loss": -24.072664260864258, "global_step": 178173, "epoch": 2146} {"train_loss": -24.156095504760742, "global_step": 178174, "epoch": 2146} {"train_loss": -23.688764572143555, "global_step": 178175, "epoch": 2146} {"train_loss": -24.267166137695312, "global_step": 178176, "epoch": 2146} {"train_loss": -23.90591812133789, "global_step": 178177, "epoch": 2146} {"train_loss": -23.62660789489746, "global_step": 178178, "epoch": 2146} {"train_loss": -24.118946075439453, "global_step": 178179, "epoch": 2146} {"train_loss": -23.783601760864258, "global_step": 178180, "epoch": 2146} {"train_loss": -24.143360137939453, "global_step": 178181, "epoch": 2146} {"train_loss": -23.81590461730957, "global_step": 178182, "epoch": 2146} {"train_loss": -23.477230072021484, "global_step": 178183, "epoch": 2146} {"train_loss": -23.502599716186523, "global_step": 178184, "epoch": 2146} {"train_loss": -23.835580825805664, "global_step": 178185, "epoch": 2146} {"train_loss": -23.990537643432617, "global_step": 178186, "epoch": 2146} {"train_loss": -23.75115394592285, "global_step": 178187, "epoch": 2146} {"train_loss": -23.589101791381836, "global_step": 178188, "epoch": 2146} {"train_loss": -23.733631134033203, "global_step": 178189, "epoch": 2146} {"train_loss": -23.905166625976562, "global_step": 178190, "epoch": 2146} {"train_loss": -23.67107582092285, "global_step": 178191, "epoch": 2146} {"train_loss": -23.71921730041504, "global_step": 178192, "epoch": 2146} {"train_loss": -24.057832717895508, "global_step": 178193, "epoch": 2146} {"train_loss": -23.57136344909668, "global_step": 178194, "epoch": 2146} {"train_loss": -24.030553817749023, "global_step": 178195, "epoch": 2146} {"train_loss": -23.646610260009766, "global_step": 178196, "epoch": 2146} {"train_loss": -23.95212173461914, "global_step": 178197, "epoch": 2146} {"train_loss": -24.076276779174805, "global_step": 178198, "epoch": 2146} {"train_loss": -24.000810623168945, "global_step": 178199, "epoch": 2146} {"train_loss": -23.822979295110127, "global_step": 178200, "epoch": 2146, "val_loss": 6505108.0} {"train_loss": -23.523847579956055, "global_step": 178201, "epoch": 2147} {"train_loss": -23.796445846557617, "global_step": 178202, "epoch": 2147} {"train_loss": -23.974491119384766, "global_step": 178203, "epoch": 2147} {"train_loss": -23.807615280151367, "global_step": 178204, "epoch": 2147} {"train_loss": -23.52705192565918, "global_step": 178205, "epoch": 2147} {"train_loss": -23.817827224731445, "global_step": 178206, "epoch": 2147} {"train_loss": -23.693151473999023, "global_step": 178207, "epoch": 2147} {"train_loss": -23.703100204467773, "global_step": 178208, "epoch": 2147} {"train_loss": -23.35403060913086, "global_step": 178209, "epoch": 2147} {"train_loss": -23.447973251342773, "global_step": 178210, "epoch": 2147} {"train_loss": -23.777202606201172, "global_step": 178211, "epoch": 2147} {"train_loss": -23.668106079101562, "global_step": 178212, "epoch": 2147} {"train_loss": -23.642501831054688, "global_step": 178213, "epoch": 2147} {"train_loss": -23.805082321166992, "global_step": 178214, "epoch": 2147} {"train_loss": -24.106449127197266, "global_step": 178215, "epoch": 2147} {"train_loss": -23.76332664489746, "global_step": 178216, "epoch": 2147} {"train_loss": -24.25535011291504, "global_step": 178217, "epoch": 2147} {"train_loss": -23.916845321655273, "global_step": 178218, "epoch": 2147} {"train_loss": -24.438400268554688, "global_step": 178219, "epoch": 2147} {"train_loss": -24.047237396240234, "global_step": 178220, "epoch": 2147} {"train_loss": -23.88616943359375, "global_step": 178221, "epoch": 2147} {"train_loss": -24.1821346282959, "global_step": 178222, "epoch": 2147} {"train_loss": -23.473947525024414, "global_step": 178223, "epoch": 2147} {"train_loss": -23.606372833251953, "global_step": 178224, "epoch": 2147} {"train_loss": -24.03840446472168, "global_step": 178225, "epoch": 2147} {"train_loss": -23.6925106048584, "global_step": 178226, "epoch": 2147} {"train_loss": -23.97064208984375, "global_step": 178227, "epoch": 2147} {"train_loss": -24.10853385925293, "global_step": 178228, "epoch": 2147} {"train_loss": -24.012216567993164, "global_step": 178229, "epoch": 2147} {"train_loss": -23.809335708618164, "global_step": 178230, "epoch": 2147} {"train_loss": -23.765043258666992, "global_step": 178231, "epoch": 2147} {"train_loss": -24.063323974609375, "global_step": 178232, "epoch": 2147} {"train_loss": -24.002477645874023, "global_step": 178233, "epoch": 2147} {"train_loss": -23.981678009033203, "global_step": 178234, "epoch": 2147} {"train_loss": -23.913936614990234, "global_step": 178235, "epoch": 2147} {"train_loss": -24.109533309936523, "global_step": 178236, "epoch": 2147} {"train_loss": -23.87630271911621, "global_step": 178237, "epoch": 2147} {"train_loss": -23.63101577758789, "global_step": 178238, "epoch": 2147} {"train_loss": -23.903654098510742, "global_step": 178239, "epoch": 2147} {"train_loss": -23.690128326416016, "global_step": 178240, "epoch": 2147} {"train_loss": -24.225126266479492, "global_step": 178241, "epoch": 2147} {"train_loss": -23.931774139404297, "global_step": 178242, "epoch": 2147} {"train_loss": -23.65290641784668, "global_step": 178243, "epoch": 2147} {"train_loss": -24.07742691040039, "global_step": 178244, "epoch": 2147} {"train_loss": -24.06900978088379, "global_step": 178245, "epoch": 2147} {"train_loss": -23.852237701416016, "global_step": 178246, "epoch": 2147} {"train_loss": -23.861846923828125, "global_step": 178247, "epoch": 2147} {"train_loss": -24.32486915588379, "global_step": 178248, "epoch": 2147} {"train_loss": -23.909717559814453, "global_step": 178249, "epoch": 2147} {"train_loss": -24.108184814453125, "global_step": 178250, "epoch": 2147} {"train_loss": -23.915075302124023, "global_step": 178251, "epoch": 2147} {"train_loss": -23.970657348632812, "global_step": 178252, "epoch": 2147} {"train_loss": -23.74212646484375, "global_step": 178253, "epoch": 2147} {"train_loss": -24.284454345703125, "global_step": 178254, "epoch": 2147} {"train_loss": -23.981245040893555, "global_step": 178255, "epoch": 2147} {"train_loss": -23.65993309020996, "global_step": 178256, "epoch": 2147} {"train_loss": -23.50080680847168, "global_step": 178257, "epoch": 2147} {"train_loss": -24.163238525390625, "global_step": 178258, "epoch": 2147} {"train_loss": -23.984140396118164, "global_step": 178259, "epoch": 2147} {"train_loss": -24.076171875, "global_step": 178260, "epoch": 2147} {"train_loss": -23.85462760925293, "global_step": 178261, "epoch": 2147} {"train_loss": -23.69144630432129, "global_step": 178262, "epoch": 2147} {"train_loss": -23.793804168701172, "global_step": 178263, "epoch": 2147} {"train_loss": -23.8446044921875, "global_step": 178264, "epoch": 2147} {"train_loss": -23.692296981811523, "global_step": 178265, "epoch": 2147} {"train_loss": -23.728498458862305, "global_step": 178266, "epoch": 2147} {"train_loss": -24.134889602661133, "global_step": 178267, "epoch": 2147} {"train_loss": -23.890947341918945, "global_step": 178268, "epoch": 2147} {"train_loss": -23.751680374145508, "global_step": 178269, "epoch": 2147} {"train_loss": -23.685529708862305, "global_step": 178270, "epoch": 2147} {"train_loss": -23.6793270111084, "global_step": 178271, "epoch": 2147} {"train_loss": -23.73737335205078, "global_step": 178272, "epoch": 2147} {"train_loss": -23.732337951660156, "global_step": 178273, "epoch": 2147} {"train_loss": -23.664955139160156, "global_step": 178274, "epoch": 2147} {"train_loss": -23.5626277923584, "global_step": 178275, "epoch": 2147} {"train_loss": -23.954378128051758, "global_step": 178276, "epoch": 2147} {"train_loss": -23.66899299621582, "global_step": 178277, "epoch": 2147} {"train_loss": -23.64887046813965, "global_step": 178278, "epoch": 2147} {"train_loss": -24.033920288085938, "global_step": 178279, "epoch": 2147} {"train_loss": -23.71282386779785, "global_step": 178280, "epoch": 2147} {"train_loss": -23.859933853149414, "global_step": 178281, "epoch": 2147} {"train_loss": -23.821802139282227, "global_step": 178282, "epoch": 2147} {"train_loss": -23.84741050076772, "global_step": 178283, "epoch": 2147, "val_loss": 6435289.0} {"train_loss": -23.356931686401367, "global_step": 178284, "epoch": 2148} {"train_loss": -23.72468376159668, "global_step": 178285, "epoch": 2148} {"train_loss": -23.797407150268555, "global_step": 178286, "epoch": 2148} {"train_loss": -23.598657608032227, "global_step": 178287, "epoch": 2148} {"train_loss": -23.351070404052734, "global_step": 178288, "epoch": 2148} {"train_loss": -23.853595733642578, "global_step": 178289, "epoch": 2148} {"train_loss": -23.633886337280273, "global_step": 178290, "epoch": 2148} {"train_loss": -23.769269943237305, "global_step": 178291, "epoch": 2148} {"train_loss": -23.650968551635742, "global_step": 178292, "epoch": 2148} {"train_loss": -23.832109451293945, "global_step": 178293, "epoch": 2148} {"train_loss": -23.555078506469727, "global_step": 178294, "epoch": 2148} {"train_loss": -23.73612403869629, "global_step": 178295, "epoch": 2148} {"train_loss": -23.713159561157227, "global_step": 178296, "epoch": 2148} {"train_loss": -23.638471603393555, "global_step": 178297, "epoch": 2148} {"train_loss": -23.368127822875977, "global_step": 178298, "epoch": 2148} {"train_loss": -24.095306396484375, "global_step": 178299, "epoch": 2148} {"train_loss": -23.927684783935547, "global_step": 178300, "epoch": 2148} {"train_loss": -23.924558639526367, "global_step": 178301, "epoch": 2148} {"train_loss": -23.745309829711914, "global_step": 178302, "epoch": 2148} {"train_loss": -24.155956268310547, "global_step": 178303, "epoch": 2148} {"train_loss": -23.62122917175293, "global_step": 178304, "epoch": 2148} {"train_loss": -23.887800216674805, "global_step": 178305, "epoch": 2148} {"train_loss": -24.1317138671875, "global_step": 178306, "epoch": 2148} {"train_loss": -23.658506393432617, "global_step": 178307, "epoch": 2148} {"train_loss": -23.90266990661621, "global_step": 178308, "epoch": 2148} {"train_loss": -23.746856689453125, "global_step": 178309, "epoch": 2148} {"train_loss": -23.718107223510742, "global_step": 178310, "epoch": 2148} {"train_loss": -23.98554039001465, "global_step": 178311, "epoch": 2148} {"train_loss": -23.72731590270996, "global_step": 178312, "epoch": 2148} {"train_loss": -23.877729415893555, "global_step": 178313, "epoch": 2148} {"train_loss": -24.07785987854004, "global_step": 178314, "epoch": 2148} {"train_loss": -23.883975982666016, "global_step": 178315, "epoch": 2148} {"train_loss": -23.981779098510742, "global_step": 178316, "epoch": 2148} {"train_loss": -23.911487579345703, "global_step": 178317, "epoch": 2148} {"train_loss": -23.97688102722168, "global_step": 178318, "epoch": 2148} {"train_loss": -23.84706687927246, "global_step": 178319, "epoch": 2148} {"train_loss": -23.91818618774414, "global_step": 178320, "epoch": 2148} {"train_loss": -24.08538246154785, "global_step": 178321, "epoch": 2148} {"train_loss": -24.389421463012695, "global_step": 178322, "epoch": 2148} {"train_loss": -24.17890739440918, "global_step": 178323, "epoch": 2148} {"train_loss": -24.185794830322266, "global_step": 178324, "epoch": 2148} {"train_loss": -24.139278411865234, "global_step": 178325, "epoch": 2148} {"train_loss": -24.045400619506836, "global_step": 178326, "epoch": 2148} {"train_loss": -23.812211990356445, "global_step": 178327, "epoch": 2148} {"train_loss": -23.838285446166992, "global_step": 178328, "epoch": 2148} {"train_loss": -23.52273941040039, "global_step": 178329, "epoch": 2148} {"train_loss": -23.870622634887695, "global_step": 178330, "epoch": 2148} {"train_loss": -24.04192543029785, "global_step": 178331, "epoch": 2148} {"train_loss": -23.741796493530273, "global_step": 178332, "epoch": 2148} {"train_loss": -24.20021629333496, "global_step": 178333, "epoch": 2148} {"train_loss": -24.161251068115234, "global_step": 178334, "epoch": 2148} {"train_loss": -23.577329635620117, "global_step": 178335, "epoch": 2148} {"train_loss": -24.120946884155273, "global_step": 178336, "epoch": 2148} {"train_loss": -23.727027893066406, "global_step": 178337, "epoch": 2148} {"train_loss": -24.0365047454834, "global_step": 178338, "epoch": 2148} {"train_loss": -23.417993545532227, "global_step": 178339, "epoch": 2148} {"train_loss": -23.708723068237305, "global_step": 178340, "epoch": 2148} {"train_loss": -23.43699836730957, "global_step": 178341, "epoch": 2148} {"train_loss": -23.994346618652344, "global_step": 178342, "epoch": 2148} {"train_loss": -23.413143157958984, "global_step": 178343, "epoch": 2148} {"train_loss": -24.199857711791992, "global_step": 178344, "epoch": 2148} {"train_loss": -23.855314254760742, "global_step": 178345, "epoch": 2148} {"train_loss": -23.51555824279785, "global_step": 178346, "epoch": 2148} {"train_loss": -23.89286231994629, "global_step": 178347, "epoch": 2148} {"train_loss": -23.774917602539062, "global_step": 178348, "epoch": 2148} {"train_loss": -23.8507080078125, "global_step": 178349, "epoch": 2148} {"train_loss": -23.34446144104004, "global_step": 178350, "epoch": 2148} {"train_loss": -23.730960845947266, "global_step": 178351, "epoch": 2148} {"train_loss": -23.661596298217773, "global_step": 178352, "epoch": 2148} {"train_loss": -23.279067993164062, "global_step": 178353, "epoch": 2148} {"train_loss": -23.78915786743164, "global_step": 178354, "epoch": 2148} {"train_loss": -23.862258911132812, "global_step": 178355, "epoch": 2148} {"train_loss": -23.540834426879883, "global_step": 178356, "epoch": 2148} {"train_loss": -23.5334529876709, "global_step": 178357, "epoch": 2148} {"train_loss": -24.180639266967773, "global_step": 178358, "epoch": 2148} {"train_loss": -23.619924545288086, "global_step": 178359, "epoch": 2148} {"train_loss": -23.77495765686035, "global_step": 178360, "epoch": 2148} {"train_loss": -23.86895751953125, "global_step": 178361, "epoch": 2148} {"train_loss": -23.714351654052734, "global_step": 178362, "epoch": 2148} {"train_loss": -23.5470027923584, "global_step": 178363, "epoch": 2148} {"train_loss": -24.22416877746582, "global_step": 178364, "epoch": 2148} {"train_loss": -23.829532623291016, "global_step": 178365, "epoch": 2148} {"train_loss": -23.81579378426793, "global_step": 178366, "epoch": 2148, "val_loss": 6525278.0} {"train_loss": -23.627796173095703, "global_step": 178367, "epoch": 2149} {"train_loss": -22.983930587768555, "global_step": 178368, "epoch": 2149} {"train_loss": -23.477617263793945, "global_step": 178369, "epoch": 2149} {"train_loss": -23.566204071044922, "global_step": 178370, "epoch": 2149} {"train_loss": -23.299888610839844, "global_step": 178371, "epoch": 2149} {"train_loss": -23.808759689331055, "global_step": 178372, "epoch": 2149} {"train_loss": -23.15384292602539, "global_step": 178373, "epoch": 2149} {"train_loss": -23.85635757446289, "global_step": 178374, "epoch": 2149} {"train_loss": -23.435007095336914, "global_step": 178375, "epoch": 2149} {"train_loss": -23.71367645263672, "global_step": 178376, "epoch": 2149} {"train_loss": -23.469783782958984, "global_step": 178377, "epoch": 2149} {"train_loss": -24.184337615966797, "global_step": 178378, "epoch": 2149} {"train_loss": -23.58436393737793, "global_step": 178379, "epoch": 2149} {"train_loss": -23.480091094970703, "global_step": 178380, "epoch": 2149} {"train_loss": -23.661401748657227, "global_step": 178381, "epoch": 2149} {"train_loss": -23.686866760253906, "global_step": 178382, "epoch": 2149} {"train_loss": -23.9063663482666, "global_step": 178383, "epoch": 2149} {"train_loss": -23.808597564697266, "global_step": 178384, "epoch": 2149} {"train_loss": -23.850645065307617, "global_step": 178385, "epoch": 2149} {"train_loss": -23.91908073425293, "global_step": 178386, "epoch": 2149} {"train_loss": -23.98483657836914, "global_step": 178387, "epoch": 2149} {"train_loss": -23.97382164001465, "global_step": 178388, "epoch": 2149} {"train_loss": -24.198789596557617, "global_step": 178389, "epoch": 2149} {"train_loss": -23.74103355407715, "global_step": 178390, "epoch": 2149} {"train_loss": -23.865205764770508, "global_step": 178391, "epoch": 2149} {"train_loss": -23.85896110534668, "global_step": 178392, "epoch": 2149} {"train_loss": -23.928335189819336, "global_step": 178393, "epoch": 2149} {"train_loss": -24.00693130493164, "global_step": 178394, "epoch": 2149} {"train_loss": -23.45887565612793, "global_step": 178395, "epoch": 2149} {"train_loss": -23.78153419494629, "global_step": 178396, "epoch": 2149} {"train_loss": -24.14316177368164, "global_step": 178397, "epoch": 2149} {"train_loss": -23.740568161010742, "global_step": 178398, "epoch": 2149} {"train_loss": -24.096715927124023, "global_step": 178399, "epoch": 2149} {"train_loss": -24.03093910217285, "global_step": 178400, "epoch": 2149} {"train_loss": -24.015438079833984, "global_step": 178401, "epoch": 2149} {"train_loss": -24.128095626831055, "global_step": 178402, "epoch": 2149} {"train_loss": -24.13924217224121, "global_step": 178403, "epoch": 2149} {"train_loss": -24.21429443359375, "global_step": 178404, "epoch": 2149} {"train_loss": -24.265220642089844, "global_step": 178405, "epoch": 2149} {"train_loss": -23.689748764038086, "global_step": 178406, "epoch": 2149} {"train_loss": -23.85121726989746, "global_step": 178407, "epoch": 2149} {"train_loss": -23.485618591308594, "global_step": 178408, "epoch": 2149} {"train_loss": -23.997547149658203, "global_step": 178409, "epoch": 2149} {"train_loss": -24.38410186767578, "global_step": 178410, "epoch": 2149} {"train_loss": -23.98853874206543, "global_step": 178411, "epoch": 2149} {"train_loss": -24.15416145324707, "global_step": 178412, "epoch": 2149} {"train_loss": -24.276334762573242, "global_step": 178413, "epoch": 2149} {"train_loss": -23.884098052978516, "global_step": 178414, "epoch": 2149} {"train_loss": -24.18301773071289, "global_step": 178415, "epoch": 2149} {"train_loss": -23.94161605834961, "global_step": 178416, "epoch": 2149} {"train_loss": -23.736328125, "global_step": 178417, "epoch": 2149} {"train_loss": -24.03028106689453, "global_step": 178418, "epoch": 2149} {"train_loss": -24.02939224243164, "global_step": 178419, "epoch": 2149} {"train_loss": -24.252836227416992, "global_step": 178420, "epoch": 2149} {"train_loss": -23.71834373474121, "global_step": 178421, "epoch": 2149} {"train_loss": -24.16574478149414, "global_step": 178422, "epoch": 2149} {"train_loss": -23.644559860229492, "global_step": 178423, "epoch": 2149} {"train_loss": -23.907686233520508, "global_step": 178424, "epoch": 2149} {"train_loss": -24.193815231323242, "global_step": 178425, "epoch": 2149} {"train_loss": -23.47889518737793, "global_step": 178426, "epoch": 2149} {"train_loss": -24.012418746948242, "global_step": 178427, "epoch": 2149} {"train_loss": -23.802927017211914, "global_step": 178428, "epoch": 2149} {"train_loss": -24.248687744140625, "global_step": 178429, "epoch": 2149} {"train_loss": -23.76144790649414, "global_step": 178430, "epoch": 2149} {"train_loss": -24.18159294128418, "global_step": 178431, "epoch": 2149} {"train_loss": -24.139678955078125, "global_step": 178432, "epoch": 2149} {"train_loss": -24.1298885345459, "global_step": 178433, "epoch": 2149} {"train_loss": -23.803009033203125, "global_step": 178434, "epoch": 2149} {"train_loss": -23.94631004333496, "global_step": 178435, "epoch": 2149} {"train_loss": -24.126205444335938, "global_step": 178436, "epoch": 2149} {"train_loss": -23.73872184753418, "global_step": 178437, "epoch": 2149} {"train_loss": -24.44065284729004, "global_step": 178438, "epoch": 2149} {"train_loss": -23.746374130249023, "global_step": 178439, "epoch": 2149} {"train_loss": -23.694091796875, "global_step": 178440, "epoch": 2149} {"train_loss": -24.02431297302246, "global_step": 178441, "epoch": 2149} {"train_loss": -23.69746971130371, "global_step": 178442, "epoch": 2149} {"train_loss": -23.850690841674805, "global_step": 178443, "epoch": 2149} {"train_loss": -24.092763900756836, "global_step": 178444, "epoch": 2149} {"train_loss": -23.808597564697266, "global_step": 178445, "epoch": 2149} {"train_loss": -23.620534896850586, "global_step": 178446, "epoch": 2149} {"train_loss": -23.607397079467773, "global_step": 178447, "epoch": 2149} {"train_loss": -23.781143188476562, "global_step": 178448, "epoch": 2149} {"train_loss": -23.857967491609504, "global_step": 178449, "epoch": 2149, "val_loss": 6436173.0} {"train_loss": -23.0216064453125, "global_step": 178450, "epoch": 2150} {"train_loss": -22.6755313873291, "global_step": 178451, "epoch": 2150} {"train_loss": -22.759464263916016, "global_step": 178452, "epoch": 2150} {"train_loss": -22.937028884887695, "global_step": 178453, "epoch": 2150} {"train_loss": -22.546743392944336, "global_step": 178454, "epoch": 2150} {"train_loss": -22.865341186523438, "global_step": 178455, "epoch": 2150} {"train_loss": -23.159700393676758, "global_step": 178456, "epoch": 2150} {"train_loss": -23.153230667114258, "global_step": 178457, "epoch": 2150} {"train_loss": -23.113300323486328, "global_step": 178458, "epoch": 2150} {"train_loss": -23.182979583740234, "global_step": 178459, "epoch": 2150} {"train_loss": -23.09603500366211, "global_step": 178460, "epoch": 2150} {"train_loss": -22.979965209960938, "global_step": 178461, "epoch": 2150} {"train_loss": -23.075185775756836, "global_step": 178462, "epoch": 2150} {"train_loss": -23.440385818481445, "global_step": 178463, "epoch": 2150} {"train_loss": -23.667776107788086, "global_step": 178464, "epoch": 2150} {"train_loss": -23.19208335876465, "global_step": 178465, "epoch": 2150} {"train_loss": -23.325414657592773, "global_step": 178466, "epoch": 2150} {"train_loss": -23.388269424438477, "global_step": 178467, "epoch": 2150} {"train_loss": -23.249235153198242, "global_step": 178468, "epoch": 2150} {"train_loss": -23.44891929626465, "global_step": 178469, "epoch": 2150} {"train_loss": -23.38714599609375, "global_step": 178470, "epoch": 2150} {"train_loss": -23.98655128479004, "global_step": 178471, "epoch": 2150} {"train_loss": -23.927000045776367, "global_step": 178472, "epoch": 2150} {"train_loss": -23.63591957092285, "global_step": 178473, "epoch": 2150} {"train_loss": -23.75876235961914, "global_step": 178474, "epoch": 2150} {"train_loss": -23.559513092041016, "global_step": 178475, "epoch": 2150} {"train_loss": -23.746065139770508, "global_step": 178476, "epoch": 2150} {"train_loss": -23.77409553527832, "global_step": 178477, "epoch": 2150} {"train_loss": -24.05161476135254, "global_step": 178478, "epoch": 2150} {"train_loss": -24.056894302368164, "global_step": 178479, "epoch": 2150} {"train_loss": -23.536270141601562, "global_step": 178480, "epoch": 2150} {"train_loss": -24.050947189331055, "global_step": 178481, "epoch": 2150} {"train_loss": -23.67786979675293, "global_step": 178482, "epoch": 2150} {"train_loss": -24.102903366088867, "global_step": 178483, "epoch": 2150} {"train_loss": -23.91712760925293, "global_step": 178484, "epoch": 2150} {"train_loss": -24.009262084960938, "global_step": 178485, "epoch": 2150} {"train_loss": -23.56756019592285, "global_step": 178486, "epoch": 2150} {"train_loss": -23.688085556030273, "global_step": 178487, "epoch": 2150} {"train_loss": -23.978397369384766, "global_step": 178488, "epoch": 2150} {"train_loss": -23.82322120666504, "global_step": 178489, "epoch": 2150} {"train_loss": -23.831195831298828, "global_step": 178490, "epoch": 2150} {"train_loss": -23.897846221923828, "global_step": 178491, "epoch": 2150} {"train_loss": -23.578487396240234, "global_step": 178492, "epoch": 2150} {"train_loss": -24.029438018798828, "global_step": 178493, "epoch": 2150} {"train_loss": -24.121902465820312, "global_step": 178494, "epoch": 2150} {"train_loss": -24.057592391967773, "global_step": 178495, "epoch": 2150} {"train_loss": -23.824731826782227, "global_step": 178496, "epoch": 2150} {"train_loss": -24.03057289123535, "global_step": 178497, "epoch": 2150} {"train_loss": -24.1517276763916, "global_step": 178498, "epoch": 2150} {"train_loss": -23.808401107788086, "global_step": 178499, "epoch": 2150} {"train_loss": -24.2152042388916, "global_step": 178500, "epoch": 2150} {"train_loss": -24.092283248901367, "global_step": 178501, "epoch": 2150} {"train_loss": -24.334537506103516, "global_step": 178502, "epoch": 2150} {"train_loss": -24.101512908935547, "global_step": 178503, "epoch": 2150} {"train_loss": -24.175565719604492, "global_step": 178504, "epoch": 2150} {"train_loss": -23.776016235351562, "global_step": 178505, "epoch": 2150} {"train_loss": -24.06024742126465, "global_step": 178506, "epoch": 2150} {"train_loss": -23.76886558532715, "global_step": 178507, "epoch": 2150} {"train_loss": -24.499073028564453, "global_step": 178508, "epoch": 2150} {"train_loss": -23.862268447875977, "global_step": 178509, "epoch": 2150} {"train_loss": -23.896488189697266, "global_step": 178510, "epoch": 2150} {"train_loss": -24.030202865600586, "global_step": 178511, "epoch": 2150} {"train_loss": -23.762277603149414, "global_step": 178512, "epoch": 2150} {"train_loss": -24.203664779663086, "global_step": 178513, "epoch": 2150} {"train_loss": -23.6771183013916, "global_step": 178514, "epoch": 2150} {"train_loss": -23.899396896362305, "global_step": 178515, "epoch": 2150} {"train_loss": -23.704092025756836, "global_step": 178516, "epoch": 2150} {"train_loss": -23.940196990966797, "global_step": 178517, "epoch": 2150} {"train_loss": -24.075944900512695, "global_step": 178518, "epoch": 2150} {"train_loss": -23.944616317749023, "global_step": 178519, "epoch": 2150} {"train_loss": -23.43722915649414, "global_step": 178520, "epoch": 2150} {"train_loss": -23.89284324645996, "global_step": 178521, "epoch": 2150} {"train_loss": -24.04874038696289, "global_step": 178522, "epoch": 2150} {"train_loss": -23.79424476623535, "global_step": 178523, "epoch": 2150} {"train_loss": -23.7164306640625, "global_step": 178524, "epoch": 2150} {"train_loss": -23.89853286743164, "global_step": 178525, "epoch": 2150} {"train_loss": -23.48457908630371, "global_step": 178526, "epoch": 2150} {"train_loss": -23.679779052734375, "global_step": 178527, "epoch": 2150} {"train_loss": -23.376327514648438, "global_step": 178528, "epoch": 2150} {"train_loss": -23.99196434020996, "global_step": 178529, "epoch": 2150} {"train_loss": -23.708784103393555, "global_step": 178530, "epoch": 2150} {"train_loss": -23.933971405029297, "global_step": 178531, "epoch": 2150} {"train_loss": -23.685263806078808, "global_step": 178532, "epoch": 2150, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6525294.5} {"train_loss": -23.546863555908203, "global_step": 178533, "epoch": 2151} {"train_loss": -23.08798599243164, "global_step": 178534, "epoch": 2151} {"train_loss": -23.315439224243164, "global_step": 178535, "epoch": 2151} {"train_loss": -23.43343162536621, "global_step": 178536, "epoch": 2151} {"train_loss": -23.79404640197754, "global_step": 178537, "epoch": 2151} {"train_loss": -23.904592514038086, "global_step": 178538, "epoch": 2151} {"train_loss": -23.47279930114746, "global_step": 178539, "epoch": 2151} {"train_loss": -23.584012985229492, "global_step": 178540, "epoch": 2151} {"train_loss": -23.26731300354004, "global_step": 178541, "epoch": 2151} {"train_loss": -23.650997161865234, "global_step": 178542, "epoch": 2151} {"train_loss": -23.10432243347168, "global_step": 178543, "epoch": 2151} {"train_loss": -23.59115982055664, "global_step": 178544, "epoch": 2151} {"train_loss": -23.55556297302246, "global_step": 178545, "epoch": 2151} {"train_loss": -23.639936447143555, "global_step": 178546, "epoch": 2151} {"train_loss": -23.768171310424805, "global_step": 178547, "epoch": 2151} {"train_loss": -23.741636276245117, "global_step": 178548, "epoch": 2151} {"train_loss": -23.670326232910156, "global_step": 178549, "epoch": 2151} {"train_loss": -23.733139038085938, "global_step": 178550, "epoch": 2151} {"train_loss": -23.87291717529297, "global_step": 178551, "epoch": 2151} {"train_loss": -23.26404571533203, "global_step": 178552, "epoch": 2151} {"train_loss": -23.770238876342773, "global_step": 178553, "epoch": 2151} {"train_loss": -23.563562393188477, "global_step": 178554, "epoch": 2151} {"train_loss": -23.5789852142334, "global_step": 178555, "epoch": 2151} {"train_loss": -23.77493667602539, "global_step": 178556, "epoch": 2151} {"train_loss": -23.797460556030273, "global_step": 178557, "epoch": 2151} {"train_loss": -23.849994659423828, "global_step": 178558, "epoch": 2151} {"train_loss": -23.85016441345215, "global_step": 178559, "epoch": 2151} {"train_loss": -23.824766159057617, "global_step": 178560, "epoch": 2151} {"train_loss": -23.67722511291504, "global_step": 178561, "epoch": 2151} {"train_loss": -23.863637924194336, "global_step": 178562, "epoch": 2151} {"train_loss": -23.585657119750977, "global_step": 178563, "epoch": 2151} {"train_loss": -24.200693130493164, "global_step": 178564, "epoch": 2151} {"train_loss": -23.998920440673828, "global_step": 178565, "epoch": 2151} {"train_loss": -24.03497314453125, "global_step": 178566, "epoch": 2151} {"train_loss": -23.987716674804688, "global_step": 178567, "epoch": 2151} {"train_loss": -24.181827545166016, "global_step": 178568, "epoch": 2151} {"train_loss": -24.07089614868164, "global_step": 178569, "epoch": 2151} {"train_loss": -23.902292251586914, "global_step": 178570, "epoch": 2151} {"train_loss": -23.9822998046875, "global_step": 178571, "epoch": 2151} {"train_loss": -23.962047576904297, "global_step": 178572, "epoch": 2151} {"train_loss": -23.984254837036133, "global_step": 178573, "epoch": 2151} {"train_loss": -24.2740478515625, "global_step": 178574, "epoch": 2151} {"train_loss": -23.89914894104004, "global_step": 178575, "epoch": 2151} {"train_loss": -24.067276000976562, "global_step": 178576, "epoch": 2151} {"train_loss": -23.74607276916504, "global_step": 178577, "epoch": 2151} {"train_loss": -23.961027145385742, "global_step": 178578, "epoch": 2151} {"train_loss": -24.140766143798828, "global_step": 178579, "epoch": 2151} {"train_loss": -23.891923904418945, "global_step": 178580, "epoch": 2151} {"train_loss": -24.153778076171875, "global_step": 178581, "epoch": 2151} {"train_loss": -24.01165199279785, "global_step": 178582, "epoch": 2151} {"train_loss": -24.22394371032715, "global_step": 178583, "epoch": 2151} {"train_loss": -23.822519302368164, "global_step": 178584, "epoch": 2151} {"train_loss": -23.990888595581055, "global_step": 178585, "epoch": 2151} {"train_loss": -24.14240074157715, "global_step": 178586, "epoch": 2151} {"train_loss": -23.784696578979492, "global_step": 178587, "epoch": 2151} {"train_loss": -24.110685348510742, "global_step": 178588, "epoch": 2151} {"train_loss": -24.119876861572266, "global_step": 178589, "epoch": 2151} {"train_loss": -23.935699462890625, "global_step": 178590, "epoch": 2151} {"train_loss": -23.758068084716797, "global_step": 178591, "epoch": 2151} {"train_loss": -23.861906051635742, "global_step": 178592, "epoch": 2151} {"train_loss": -24.085975646972656, "global_step": 178593, "epoch": 2151} {"train_loss": -23.590940475463867, "global_step": 178594, "epoch": 2151} {"train_loss": -23.53434181213379, "global_step": 178595, "epoch": 2151} {"train_loss": -23.771484375, "global_step": 178596, "epoch": 2151} {"train_loss": -23.8206844329834, "global_step": 178597, "epoch": 2151} {"train_loss": -23.644107818603516, "global_step": 178598, "epoch": 2151} {"train_loss": -24.0960750579834, "global_step": 178599, "epoch": 2151} {"train_loss": -24.038236618041992, "global_step": 178600, "epoch": 2151} {"train_loss": -24.19378089904785, "global_step": 178601, "epoch": 2151} {"train_loss": -23.78218650817871, "global_step": 178602, "epoch": 2151} {"train_loss": -23.56077003479004, "global_step": 178603, "epoch": 2151} {"train_loss": -23.877500534057617, "global_step": 178604, "epoch": 2151} {"train_loss": -23.794286727905273, "global_step": 178605, "epoch": 2151} {"train_loss": -23.71255874633789, "global_step": 178606, "epoch": 2151} {"train_loss": -23.938627243041992, "global_step": 178607, "epoch": 2151} {"train_loss": -23.696022033691406, "global_step": 178608, "epoch": 2151} {"train_loss": -23.616907119750977, "global_step": 178609, "epoch": 2151} {"train_loss": -24.161575317382812, "global_step": 178610, "epoch": 2151} {"train_loss": -23.74915313720703, "global_step": 178611, "epoch": 2151} {"train_loss": -23.936508178710938, "global_step": 178612, "epoch": 2151} {"train_loss": -23.772546768188477, "global_step": 178613, "epoch": 2151} {"train_loss": -23.507558822631836, "global_step": 178614, "epoch": 2151} {"train_loss": -23.807580672114728, "global_step": 178615, "epoch": 2151, "val_loss": 6523262.0} {"train_loss": -23.283227920532227, "global_step": 178616, "epoch": 2152} {"train_loss": -23.37901496887207, "global_step": 178617, "epoch": 2152} {"train_loss": -23.723697662353516, "global_step": 178618, "epoch": 2152} {"train_loss": -23.593801498413086, "global_step": 178619, "epoch": 2152} {"train_loss": -23.64275360107422, "global_step": 178620, "epoch": 2152} {"train_loss": -23.22294044494629, "global_step": 178621, "epoch": 2152} {"train_loss": -23.655546188354492, "global_step": 178622, "epoch": 2152} {"train_loss": -23.54213523864746, "global_step": 178623, "epoch": 2152} {"train_loss": -23.281757354736328, "global_step": 178624, "epoch": 2152} {"train_loss": -23.639480590820312, "global_step": 178625, "epoch": 2152} {"train_loss": -23.471742630004883, "global_step": 178626, "epoch": 2152} {"train_loss": -23.751415252685547, "global_step": 178627, "epoch": 2152} {"train_loss": -23.47876739501953, "global_step": 178628, "epoch": 2152} {"train_loss": -23.75947380065918, "global_step": 178629, "epoch": 2152} {"train_loss": -23.394607543945312, "global_step": 178630, "epoch": 2152} {"train_loss": -23.509614944458008, "global_step": 178631, "epoch": 2152} {"train_loss": -23.780935287475586, "global_step": 178632, "epoch": 2152} {"train_loss": -23.414499282836914, "global_step": 178633, "epoch": 2152} {"train_loss": -24.08014678955078, "global_step": 178634, "epoch": 2152} {"train_loss": -23.28812599182129, "global_step": 178635, "epoch": 2152} {"train_loss": -23.874187469482422, "global_step": 178636, "epoch": 2152} {"train_loss": -23.8940486907959, "global_step": 178637, "epoch": 2152} {"train_loss": -24.04641342163086, "global_step": 178638, "epoch": 2152} {"train_loss": -23.685659408569336, "global_step": 178639, "epoch": 2152} {"train_loss": -24.327423095703125, "global_step": 178640, "epoch": 2152} {"train_loss": -23.827823638916016, "global_step": 178641, "epoch": 2152} {"train_loss": -23.913175582885742, "global_step": 178642, "epoch": 2152} {"train_loss": -23.8876895904541, "global_step": 178643, "epoch": 2152} {"train_loss": -23.91579246520996, "global_step": 178644, "epoch": 2152} {"train_loss": -24.053659439086914, "global_step": 178645, "epoch": 2152} {"train_loss": -23.79453468322754, "global_step": 178646, "epoch": 2152} {"train_loss": -23.795595169067383, "global_step": 178647, "epoch": 2152} {"train_loss": -23.596237182617188, "global_step": 178648, "epoch": 2152} {"train_loss": -23.7330265045166, "global_step": 178649, "epoch": 2152} {"train_loss": -23.498010635375977, "global_step": 178650, "epoch": 2152} {"train_loss": -24.145973205566406, "global_step": 178651, "epoch": 2152} {"train_loss": -23.953699111938477, "global_step": 178652, "epoch": 2152} {"train_loss": -24.01546287536621, "global_step": 178653, "epoch": 2152} {"train_loss": -23.576793670654297, "global_step": 178654, "epoch": 2152} {"train_loss": -23.594236373901367, "global_step": 178655, "epoch": 2152} {"train_loss": -23.617795944213867, "global_step": 178656, "epoch": 2152} {"train_loss": -23.74090003967285, "global_step": 178657, "epoch": 2152} {"train_loss": -24.004926681518555, "global_step": 178658, "epoch": 2152} {"train_loss": -23.980615615844727, "global_step": 178659, "epoch": 2152} {"train_loss": -23.997711181640625, "global_step": 178660, "epoch": 2152} {"train_loss": -23.98748016357422, "global_step": 178661, "epoch": 2152} {"train_loss": -23.986249923706055, "global_step": 178662, "epoch": 2152} {"train_loss": -23.877487182617188, "global_step": 178663, "epoch": 2152} {"train_loss": -23.546527862548828, "global_step": 178664, "epoch": 2152} {"train_loss": -23.608625411987305, "global_step": 178665, "epoch": 2152} {"train_loss": -24.18927574157715, "global_step": 178666, "epoch": 2152} {"train_loss": -23.947616577148438, "global_step": 178667, "epoch": 2152} {"train_loss": -23.560924530029297, "global_step": 178668, "epoch": 2152} {"train_loss": -23.64382553100586, "global_step": 178669, "epoch": 2152} {"train_loss": -24.15572166442871, "global_step": 178670, "epoch": 2152} {"train_loss": -24.23093032836914, "global_step": 178671, "epoch": 2152} {"train_loss": -23.608800888061523, "global_step": 178672, "epoch": 2152} {"train_loss": -23.907861709594727, "global_step": 178673, "epoch": 2152} {"train_loss": -23.933591842651367, "global_step": 178674, "epoch": 2152} {"train_loss": -24.05268096923828, "global_step": 178675, "epoch": 2152} {"train_loss": -24.137136459350586, "global_step": 178676, "epoch": 2152} {"train_loss": -23.897369384765625, "global_step": 178677, "epoch": 2152} {"train_loss": -23.872968673706055, "global_step": 178678, "epoch": 2152} {"train_loss": -23.63776969909668, "global_step": 178679, "epoch": 2152} {"train_loss": -23.9825496673584, "global_step": 178680, "epoch": 2152} {"train_loss": -24.131624221801758, "global_step": 178681, "epoch": 2152} {"train_loss": -24.094533920288086, "global_step": 178682, "epoch": 2152} {"train_loss": -23.97231101989746, "global_step": 178683, "epoch": 2152} {"train_loss": -24.05106544494629, "global_step": 178684, "epoch": 2152} {"train_loss": -23.5975399017334, "global_step": 178685, "epoch": 2152} {"train_loss": -23.913084030151367, "global_step": 178686, "epoch": 2152} {"train_loss": -23.577146530151367, "global_step": 178687, "epoch": 2152} {"train_loss": -24.14312744140625, "global_step": 178688, "epoch": 2152} {"train_loss": -24.20163345336914, "global_step": 178689, "epoch": 2152} {"train_loss": -24.082670211791992, "global_step": 178690, "epoch": 2152} {"train_loss": -23.911922454833984, "global_step": 178691, "epoch": 2152} {"train_loss": -23.95131492614746, "global_step": 178692, "epoch": 2152} {"train_loss": -23.869619369506836, "global_step": 178693, "epoch": 2152} {"train_loss": -23.343690872192383, "global_step": 178694, "epoch": 2152} {"train_loss": -23.629613876342773, "global_step": 178695, "epoch": 2152} {"train_loss": -23.539976119995117, "global_step": 178696, "epoch": 2152} {"train_loss": -23.541784286499023, "global_step": 178697, "epoch": 2152} {"train_loss": -23.821319740938854, "global_step": 178698, "epoch": 2152, "val_loss": 6535979.5} {"train_loss": -23.33038902282715, "global_step": 178699, "epoch": 2153} {"train_loss": -23.611988067626953, "global_step": 178700, "epoch": 2153} {"train_loss": -23.48050880432129, "global_step": 178701, "epoch": 2153} {"train_loss": -23.571157455444336, "global_step": 178702, "epoch": 2153} {"train_loss": -23.627765655517578, "global_step": 178703, "epoch": 2153} {"train_loss": -23.505186080932617, "global_step": 178704, "epoch": 2153} {"train_loss": -23.799238204956055, "global_step": 178705, "epoch": 2153} {"train_loss": -23.687332153320312, "global_step": 178706, "epoch": 2153} {"train_loss": -23.65985679626465, "global_step": 178707, "epoch": 2153} {"train_loss": -24.01161766052246, "global_step": 178708, "epoch": 2153} {"train_loss": -23.955602645874023, "global_step": 178709, "epoch": 2153} {"train_loss": -23.6394100189209, "global_step": 178710, "epoch": 2153} {"train_loss": -23.723371505737305, "global_step": 178711, "epoch": 2153} {"train_loss": -23.886892318725586, "global_step": 178712, "epoch": 2153} {"train_loss": -23.695905685424805, "global_step": 178713, "epoch": 2153} {"train_loss": -24.04360008239746, "global_step": 178714, "epoch": 2153} {"train_loss": -23.64131736755371, "global_step": 178715, "epoch": 2153} {"train_loss": -23.84798240661621, "global_step": 178716, "epoch": 2153} {"train_loss": -24.1667537689209, "global_step": 178717, "epoch": 2153} {"train_loss": -24.213199615478516, "global_step": 178718, "epoch": 2153} {"train_loss": -23.408405303955078, "global_step": 178719, "epoch": 2153} {"train_loss": -23.60314178466797, "global_step": 178720, "epoch": 2153} {"train_loss": -24.020071029663086, "global_step": 178721, "epoch": 2153} {"train_loss": -24.069700241088867, "global_step": 178722, "epoch": 2153} {"train_loss": -23.995512008666992, "global_step": 178723, "epoch": 2153} {"train_loss": -23.662988662719727, "global_step": 178724, "epoch": 2153} {"train_loss": -23.55402374267578, "global_step": 178725, "epoch": 2153} {"train_loss": -23.295246124267578, "global_step": 178726, "epoch": 2153} {"train_loss": -23.700387954711914, "global_step": 178727, "epoch": 2153} {"train_loss": -24.474782943725586, "global_step": 178728, "epoch": 2153} {"train_loss": -23.539670944213867, "global_step": 178729, "epoch": 2153} {"train_loss": -23.767311096191406, "global_step": 178730, "epoch": 2153} {"train_loss": -23.63572883605957, "global_step": 178731, "epoch": 2153} {"train_loss": -24.0129337310791, "global_step": 178732, "epoch": 2153} {"train_loss": -23.772125244140625, "global_step": 178733, "epoch": 2153} {"train_loss": -24.029508590698242, "global_step": 178734, "epoch": 2153} {"train_loss": -23.844789505004883, "global_step": 178735, "epoch": 2153} {"train_loss": -23.849157333374023, "global_step": 178736, "epoch": 2153} {"train_loss": -23.86748695373535, "global_step": 178737, "epoch": 2153} {"train_loss": -23.690902709960938, "global_step": 178738, "epoch": 2153} {"train_loss": -24.016027450561523, "global_step": 178739, "epoch": 2153} {"train_loss": -23.549468994140625, "global_step": 178740, "epoch": 2153} {"train_loss": -23.71748924255371, "global_step": 178741, "epoch": 2153} {"train_loss": -23.855131149291992, "global_step": 178742, "epoch": 2153} {"train_loss": -24.30116844177246, "global_step": 178743, "epoch": 2153} {"train_loss": -23.92030143737793, "global_step": 178744, "epoch": 2153} {"train_loss": -23.94390869140625, "global_step": 178745, "epoch": 2153} {"train_loss": -24.020431518554688, "global_step": 178746, "epoch": 2153} {"train_loss": -23.458133697509766, "global_step": 178747, "epoch": 2153} {"train_loss": -23.710437774658203, "global_step": 178748, "epoch": 2153} {"train_loss": -24.25338363647461, "global_step": 178749, "epoch": 2153} {"train_loss": -23.81848907470703, "global_step": 178750, "epoch": 2153} {"train_loss": -24.22715187072754, "global_step": 178751, "epoch": 2153} {"train_loss": -23.874420166015625, "global_step": 178752, "epoch": 2153} {"train_loss": -23.876813888549805, "global_step": 178753, "epoch": 2153} {"train_loss": -24.262680053710938, "global_step": 178754, "epoch": 2153} {"train_loss": -23.77760124206543, "global_step": 178755, "epoch": 2153} {"train_loss": -24.3206787109375, "global_step": 178756, "epoch": 2153} {"train_loss": -24.01123809814453, "global_step": 178757, "epoch": 2153} {"train_loss": -23.47264289855957, "global_step": 178758, "epoch": 2153} {"train_loss": -23.504348754882812, "global_step": 178759, "epoch": 2153} {"train_loss": -24.53019142150879, "global_step": 178760, "epoch": 2153} {"train_loss": -23.818204879760742, "global_step": 178761, "epoch": 2153} {"train_loss": -24.21242904663086, "global_step": 178762, "epoch": 2153} {"train_loss": -23.74366569519043, "global_step": 178763, "epoch": 2153} {"train_loss": -24.05413055419922, "global_step": 178764, "epoch": 2153} {"train_loss": -23.615530014038086, "global_step": 178765, "epoch": 2153} {"train_loss": -23.87969207763672, "global_step": 178766, "epoch": 2153} {"train_loss": -24.007099151611328, "global_step": 178767, "epoch": 2153} {"train_loss": -23.51051902770996, "global_step": 178768, "epoch": 2153} {"train_loss": -24.10756492614746, "global_step": 178769, "epoch": 2153} {"train_loss": -23.76987648010254, "global_step": 178770, "epoch": 2153} {"train_loss": -24.00306510925293, "global_step": 178771, "epoch": 2153} {"train_loss": -23.787553787231445, "global_step": 178772, "epoch": 2153} {"train_loss": -23.3830509185791, "global_step": 178773, "epoch": 2153} {"train_loss": -23.801836013793945, "global_step": 178774, "epoch": 2153} {"train_loss": -23.909011840820312, "global_step": 178775, "epoch": 2153} {"train_loss": -23.5447998046875, "global_step": 178776, "epoch": 2153} {"train_loss": -23.781158447265625, "global_step": 178777, "epoch": 2153} {"train_loss": -23.574874877929688, "global_step": 178778, "epoch": 2153} {"train_loss": -23.7139892578125, "global_step": 178779, "epoch": 2153} {"train_loss": -24.017471313476562, "global_step": 178780, "epoch": 2153} {"train_loss": -23.833033113594514, "global_step": 178781, "epoch": 2153, "val_loss": 6517554.0} {"train_loss": -23.851709365844727, "global_step": 178782, "epoch": 2154} {"train_loss": -23.73467445373535, "global_step": 178783, "epoch": 2154} {"train_loss": -23.61353874206543, "global_step": 178784, "epoch": 2154} {"train_loss": -23.695913314819336, "global_step": 178785, "epoch": 2154} {"train_loss": -23.647865295410156, "global_step": 178786, "epoch": 2154} {"train_loss": -23.79884910583496, "global_step": 178787, "epoch": 2154} {"train_loss": -23.912952423095703, "global_step": 178788, "epoch": 2154} {"train_loss": -23.919178009033203, "global_step": 178789, "epoch": 2154} {"train_loss": -23.510181427001953, "global_step": 178790, "epoch": 2154} {"train_loss": -24.013870239257812, "global_step": 178791, "epoch": 2154} {"train_loss": -23.192838668823242, "global_step": 178792, "epoch": 2154} {"train_loss": -23.914640426635742, "global_step": 178793, "epoch": 2154} {"train_loss": -23.753713607788086, "global_step": 178794, "epoch": 2154} {"train_loss": -23.73733139038086, "global_step": 178795, "epoch": 2154} {"train_loss": -23.86146354675293, "global_step": 178796, "epoch": 2154} {"train_loss": -23.877660751342773, "global_step": 178797, "epoch": 2154} {"train_loss": -23.894550323486328, "global_step": 178798, "epoch": 2154} {"train_loss": -23.652061462402344, "global_step": 178799, "epoch": 2154} {"train_loss": -23.76809310913086, "global_step": 178800, "epoch": 2154} {"train_loss": -23.602949142456055, "global_step": 178801, "epoch": 2154} {"train_loss": -24.06685447692871, "global_step": 178802, "epoch": 2154} {"train_loss": -23.199079513549805, "global_step": 178803, "epoch": 2154} {"train_loss": -23.793359756469727, "global_step": 178804, "epoch": 2154} {"train_loss": -23.637956619262695, "global_step": 178805, "epoch": 2154} {"train_loss": -23.857885360717773, "global_step": 178806, "epoch": 2154} {"train_loss": -23.926069259643555, "global_step": 178807, "epoch": 2154} {"train_loss": -23.841276168823242, "global_step": 178808, "epoch": 2154} {"train_loss": -23.565549850463867, "global_step": 178809, "epoch": 2154} {"train_loss": -23.74867820739746, "global_step": 178810, "epoch": 2154} {"train_loss": -23.938644409179688, "global_step": 178811, "epoch": 2154} {"train_loss": -23.777145385742188, "global_step": 178812, "epoch": 2154} {"train_loss": -23.9356689453125, "global_step": 178813, "epoch": 2154} {"train_loss": -23.763071060180664, "global_step": 178814, "epoch": 2154} {"train_loss": -23.891141891479492, "global_step": 178815, "epoch": 2154} {"train_loss": -23.77876853942871, "global_step": 178816, "epoch": 2154} {"train_loss": -23.768293380737305, "global_step": 178817, "epoch": 2154} {"train_loss": -23.809850692749023, "global_step": 178818, "epoch": 2154} {"train_loss": -23.825048446655273, "global_step": 178819, "epoch": 2154} {"train_loss": -24.001680374145508, "global_step": 178820, "epoch": 2154} {"train_loss": -24.107023239135742, "global_step": 178821, "epoch": 2154} {"train_loss": -24.15850830078125, "global_step": 178822, "epoch": 2154} {"train_loss": -23.766620635986328, "global_step": 178823, "epoch": 2154} {"train_loss": -23.9243221282959, "global_step": 178824, "epoch": 2154} {"train_loss": -23.89944839477539, "global_step": 178825, "epoch": 2154} {"train_loss": -23.588653564453125, "global_step": 178826, "epoch": 2154} {"train_loss": -23.978683471679688, "global_step": 178827, "epoch": 2154} {"train_loss": -24.1899356842041, "global_step": 178828, "epoch": 2154} {"train_loss": -24.094167709350586, "global_step": 178829, "epoch": 2154} {"train_loss": -23.644041061401367, "global_step": 178830, "epoch": 2154} {"train_loss": -23.86842918395996, "global_step": 178831, "epoch": 2154} {"train_loss": -23.889232635498047, "global_step": 178832, "epoch": 2154} {"train_loss": -23.736572265625, "global_step": 178833, "epoch": 2154} {"train_loss": -24.285934448242188, "global_step": 178834, "epoch": 2154} {"train_loss": -24.044340133666992, "global_step": 178835, "epoch": 2154} {"train_loss": -24.015350341796875, "global_step": 178836, "epoch": 2154} {"train_loss": -23.68897247314453, "global_step": 178837, "epoch": 2154} {"train_loss": -24.017940521240234, "global_step": 178838, "epoch": 2154} {"train_loss": -23.910388946533203, "global_step": 178839, "epoch": 2154} {"train_loss": -23.43338394165039, "global_step": 178840, "epoch": 2154} {"train_loss": -24.266408920288086, "global_step": 178841, "epoch": 2154} {"train_loss": -24.13608741760254, "global_step": 178842, "epoch": 2154} {"train_loss": -24.06728172302246, "global_step": 178843, "epoch": 2154} {"train_loss": -23.720304489135742, "global_step": 178844, "epoch": 2154} {"train_loss": -23.821760177612305, "global_step": 178845, "epoch": 2154} {"train_loss": -23.771127700805664, "global_step": 178846, "epoch": 2154} {"train_loss": -23.486642837524414, "global_step": 178847, "epoch": 2154} {"train_loss": -24.221240997314453, "global_step": 178848, "epoch": 2154} {"train_loss": -23.859724044799805, "global_step": 178849, "epoch": 2154} {"train_loss": -24.067251205444336, "global_step": 178850, "epoch": 2154} {"train_loss": -23.67227554321289, "global_step": 178851, "epoch": 2154} {"train_loss": -23.966800689697266, "global_step": 178852, "epoch": 2154} {"train_loss": -23.737539291381836, "global_step": 178853, "epoch": 2154} {"train_loss": -24.002540588378906, "global_step": 178854, "epoch": 2154} {"train_loss": -24.037015914916992, "global_step": 178855, "epoch": 2154} {"train_loss": -23.740880966186523, "global_step": 178856, "epoch": 2154} {"train_loss": -23.750993728637695, "global_step": 178857, "epoch": 2154} {"train_loss": -24.17707633972168, "global_step": 178858, "epoch": 2154} {"train_loss": -23.80550193786621, "global_step": 178859, "epoch": 2154} {"train_loss": -24.040908813476562, "global_step": 178860, "epoch": 2154} {"train_loss": -23.84248161315918, "global_step": 178861, "epoch": 2154} {"train_loss": -23.71725845336914, "global_step": 178862, "epoch": 2154} {"train_loss": -23.993284225463867, "global_step": 178863, "epoch": 2154} {"train_loss": -23.84834487179676, "global_step": 178864, "epoch": 2154, "val_loss": 6543584.0} {"train_loss": -23.84998893737793, "global_step": 178865, "epoch": 2155} {"train_loss": -23.10261344909668, "global_step": 178866, "epoch": 2155} {"train_loss": -23.517358779907227, "global_step": 178867, "epoch": 2155} {"train_loss": -23.611042022705078, "global_step": 178868, "epoch": 2155} {"train_loss": -23.47659683227539, "global_step": 178869, "epoch": 2155} {"train_loss": -23.022491455078125, "global_step": 178870, "epoch": 2155} {"train_loss": -23.52872657775879, "global_step": 178871, "epoch": 2155} {"train_loss": -23.04960060119629, "global_step": 178872, "epoch": 2155} {"train_loss": -23.877582550048828, "global_step": 178873, "epoch": 2155} {"train_loss": -23.496337890625, "global_step": 178874, "epoch": 2155} {"train_loss": -23.627164840698242, "global_step": 178875, "epoch": 2155} {"train_loss": -23.20840835571289, "global_step": 178876, "epoch": 2155} {"train_loss": -23.89130210876465, "global_step": 178877, "epoch": 2155} {"train_loss": -23.484760284423828, "global_step": 178878, "epoch": 2155} {"train_loss": -23.717132568359375, "global_step": 178879, "epoch": 2155} {"train_loss": -23.426908493041992, "global_step": 178880, "epoch": 2155} {"train_loss": -23.436908721923828, "global_step": 178881, "epoch": 2155} {"train_loss": -23.76004409790039, "global_step": 178882, "epoch": 2155} {"train_loss": -23.739137649536133, "global_step": 178883, "epoch": 2155} {"train_loss": -23.319833755493164, "global_step": 178884, "epoch": 2155} {"train_loss": -23.59711265563965, "global_step": 178885, "epoch": 2155} {"train_loss": -23.322290420532227, "global_step": 178886, "epoch": 2155} {"train_loss": -23.655887603759766, "global_step": 178887, "epoch": 2155} {"train_loss": -23.853384017944336, "global_step": 178888, "epoch": 2155} {"train_loss": -23.826295852661133, "global_step": 178889, "epoch": 2155} {"train_loss": -23.89906883239746, "global_step": 178890, "epoch": 2155} {"train_loss": -24.039770126342773, "global_step": 178891, "epoch": 2155} {"train_loss": -23.633747100830078, "global_step": 178892, "epoch": 2155} {"train_loss": -24.163137435913086, "global_step": 178893, "epoch": 2155} {"train_loss": -24.131078720092773, "global_step": 178894, "epoch": 2155} {"train_loss": -23.7742977142334, "global_step": 178895, "epoch": 2155} {"train_loss": -24.18537712097168, "global_step": 178896, "epoch": 2155} {"train_loss": -23.841642379760742, "global_step": 178897, "epoch": 2155} {"train_loss": -23.5360164642334, "global_step": 178898, "epoch": 2155} {"train_loss": -23.785247802734375, "global_step": 178899, "epoch": 2155} {"train_loss": -23.81155776977539, "global_step": 178900, "epoch": 2155} {"train_loss": -24.10431480407715, "global_step": 178901, "epoch": 2155} {"train_loss": -23.964262008666992, "global_step": 178902, "epoch": 2155} {"train_loss": -23.797460556030273, "global_step": 178903, "epoch": 2155} {"train_loss": -23.931360244750977, "global_step": 178904, "epoch": 2155} {"train_loss": -24.033676147460938, "global_step": 178905, "epoch": 2155} {"train_loss": -24.07415771484375, "global_step": 178906, "epoch": 2155} {"train_loss": -23.891986846923828, "global_step": 178907, "epoch": 2155} {"train_loss": -23.59578514099121, "global_step": 178908, "epoch": 2155} {"train_loss": -23.546499252319336, "global_step": 178909, "epoch": 2155} {"train_loss": -23.98247718811035, "global_step": 178910, "epoch": 2155} {"train_loss": -23.937082290649414, "global_step": 178911, "epoch": 2155} {"train_loss": -23.87978744506836, "global_step": 178912, "epoch": 2155} {"train_loss": -24.150962829589844, "global_step": 178913, "epoch": 2155} {"train_loss": -23.918142318725586, "global_step": 178914, "epoch": 2155} {"train_loss": -23.84882926940918, "global_step": 178915, "epoch": 2155} {"train_loss": -23.860605239868164, "global_step": 178916, "epoch": 2155} {"train_loss": -24.359981536865234, "global_step": 178917, "epoch": 2155} {"train_loss": -23.62005043029785, "global_step": 178918, "epoch": 2155} {"train_loss": -23.75453758239746, "global_step": 178919, "epoch": 2155} {"train_loss": -23.65188980102539, "global_step": 178920, "epoch": 2155} {"train_loss": -23.637826919555664, "global_step": 178921, "epoch": 2155} {"train_loss": -23.567102432250977, "global_step": 178922, "epoch": 2155} {"train_loss": -24.041860580444336, "global_step": 178923, "epoch": 2155} {"train_loss": -23.648466110229492, "global_step": 178924, "epoch": 2155} {"train_loss": -23.945531845092773, "global_step": 178925, "epoch": 2155} {"train_loss": -24.176984786987305, "global_step": 178926, "epoch": 2155} {"train_loss": -24.026899337768555, "global_step": 178927, "epoch": 2155} {"train_loss": -24.02936553955078, "global_step": 178928, "epoch": 2155} {"train_loss": -23.856609344482422, "global_step": 178929, "epoch": 2155} {"train_loss": -23.836576461791992, "global_step": 178930, "epoch": 2155} {"train_loss": -24.02821159362793, "global_step": 178931, "epoch": 2155} {"train_loss": -23.741912841796875, "global_step": 178932, "epoch": 2155} {"train_loss": -24.293697357177734, "global_step": 178933, "epoch": 2155} {"train_loss": -24.069318771362305, "global_step": 178934, "epoch": 2155} {"train_loss": -23.678293228149414, "global_step": 178935, "epoch": 2155} {"train_loss": -24.24355697631836, "global_step": 178936, "epoch": 2155} {"train_loss": -23.86025047302246, "global_step": 178937, "epoch": 2155} {"train_loss": -23.690208435058594, "global_step": 178938, "epoch": 2155} {"train_loss": -23.82765007019043, "global_step": 178939, "epoch": 2155} {"train_loss": -24.236021041870117, "global_step": 178940, "epoch": 2155} {"train_loss": -24.068073272705078, "global_step": 178941, "epoch": 2155} {"train_loss": -24.130664825439453, "global_step": 178942, "epoch": 2155} {"train_loss": -23.797012329101562, "global_step": 178943, "epoch": 2155} {"train_loss": -24.265127182006836, "global_step": 178944, "epoch": 2155} {"train_loss": -23.59571647644043, "global_step": 178945, "epoch": 2155} {"train_loss": -23.928186416625977, "global_step": 178946, "epoch": 2155} {"train_loss": -23.795999756778578, "global_step": 178947, "epoch": 2155, "val_loss": 6537412.0} {"train_loss": -23.633895874023438, "global_step": 178948, "epoch": 2156} {"train_loss": -23.32843589782715, "global_step": 178949, "epoch": 2156} {"train_loss": -23.68855094909668, "global_step": 178950, "epoch": 2156} {"train_loss": -23.31722640991211, "global_step": 178951, "epoch": 2156} {"train_loss": -23.244070053100586, "global_step": 178952, "epoch": 2156} {"train_loss": -23.553268432617188, "global_step": 178953, "epoch": 2156} {"train_loss": -23.49179458618164, "global_step": 178954, "epoch": 2156} {"train_loss": -23.521102905273438, "global_step": 178955, "epoch": 2156} {"train_loss": -23.921995162963867, "global_step": 178956, "epoch": 2156} {"train_loss": -23.707881927490234, "global_step": 178957, "epoch": 2156} {"train_loss": -23.431283950805664, "global_step": 178958, "epoch": 2156} {"train_loss": -23.836509704589844, "global_step": 178959, "epoch": 2156} {"train_loss": -23.54681968688965, "global_step": 178960, "epoch": 2156} {"train_loss": -23.521276473999023, "global_step": 178961, "epoch": 2156} {"train_loss": -23.422475814819336, "global_step": 178962, "epoch": 2156} {"train_loss": -23.896150588989258, "global_step": 178963, "epoch": 2156} {"train_loss": -23.413959503173828, "global_step": 178964, "epoch": 2156} {"train_loss": -24.098026275634766, "global_step": 178965, "epoch": 2156} {"train_loss": -23.659154891967773, "global_step": 178966, "epoch": 2156} {"train_loss": -23.46445083618164, "global_step": 178967, "epoch": 2156} {"train_loss": -23.653100967407227, "global_step": 178968, "epoch": 2156} {"train_loss": -23.967805862426758, "global_step": 178969, "epoch": 2156} {"train_loss": -24.16091537475586, "global_step": 178970, "epoch": 2156} {"train_loss": -23.791305541992188, "global_step": 178971, "epoch": 2156} {"train_loss": -23.685144424438477, "global_step": 178972, "epoch": 2156} {"train_loss": -24.079992294311523, "global_step": 178973, "epoch": 2156} {"train_loss": -23.683332443237305, "global_step": 178974, "epoch": 2156} {"train_loss": -23.985685348510742, "global_step": 178975, "epoch": 2156} {"train_loss": -23.79252052307129, "global_step": 178976, "epoch": 2156} {"train_loss": -23.74884033203125, "global_step": 178977, "epoch": 2156} {"train_loss": -23.685544967651367, "global_step": 178978, "epoch": 2156} {"train_loss": -24.32252311706543, "global_step": 178979, "epoch": 2156} {"train_loss": -24.115636825561523, "global_step": 178980, "epoch": 2156} {"train_loss": -24.089597702026367, "global_step": 178981, "epoch": 2156} {"train_loss": -23.582765579223633, "global_step": 178982, "epoch": 2156} {"train_loss": -23.971172332763672, "global_step": 178983, "epoch": 2156} {"train_loss": -23.944120407104492, "global_step": 178984, "epoch": 2156} {"train_loss": -23.942066192626953, "global_step": 178985, "epoch": 2156} {"train_loss": -23.77488899230957, "global_step": 178986, "epoch": 2156} {"train_loss": -23.9957218170166, "global_step": 178987, "epoch": 2156} {"train_loss": -24.074857711791992, "global_step": 178988, "epoch": 2156} {"train_loss": -23.328886032104492, "global_step": 178989, "epoch": 2156} {"train_loss": -23.658985137939453, "global_step": 178990, "epoch": 2156} {"train_loss": -23.55081558227539, "global_step": 178991, "epoch": 2156} {"train_loss": -23.716379165649414, "global_step": 178992, "epoch": 2156} {"train_loss": -23.816770553588867, "global_step": 178993, "epoch": 2156} {"train_loss": -24.014453887939453, "global_step": 178994, "epoch": 2156} {"train_loss": -23.635021209716797, "global_step": 178995, "epoch": 2156} {"train_loss": -23.869447708129883, "global_step": 178996, "epoch": 2156} {"train_loss": -23.80946922302246, "global_step": 178997, "epoch": 2156} {"train_loss": -23.849903106689453, "global_step": 178998, "epoch": 2156} {"train_loss": -23.72657585144043, "global_step": 178999, "epoch": 2156} {"train_loss": -23.61099624633789, "global_step": 179000, "epoch": 2156} {"train_loss": -23.76874542236328, "global_step": 179001, "epoch": 2156} {"train_loss": -23.485660552978516, "global_step": 179002, "epoch": 2156} {"train_loss": -24.016273498535156, "global_step": 179003, "epoch": 2156} {"train_loss": -23.786659240722656, "global_step": 179004, "epoch": 2156} {"train_loss": -24.035415649414062, "global_step": 179005, "epoch": 2156} {"train_loss": -23.900049209594727, "global_step": 179006, "epoch": 2156} {"train_loss": -23.997709274291992, "global_step": 179007, "epoch": 2156} {"train_loss": -23.962297439575195, "global_step": 179008, "epoch": 2156} {"train_loss": -23.987354278564453, "global_step": 179009, "epoch": 2156} {"train_loss": -23.96746063232422, "global_step": 179010, "epoch": 2156} {"train_loss": -23.7635440826416, "global_step": 179011, "epoch": 2156} {"train_loss": -23.786623001098633, "global_step": 179012, "epoch": 2156} {"train_loss": -23.73781394958496, "global_step": 179013, "epoch": 2156} {"train_loss": -23.77845573425293, "global_step": 179014, "epoch": 2156} {"train_loss": -24.16547203063965, "global_step": 179015, "epoch": 2156} {"train_loss": -23.94761085510254, "global_step": 179016, "epoch": 2156} {"train_loss": -23.827604293823242, "global_step": 179017, "epoch": 2156} {"train_loss": -23.82146453857422, "global_step": 179018, "epoch": 2156} {"train_loss": -23.9682559967041, "global_step": 179019, "epoch": 2156} {"train_loss": -23.932220458984375, "global_step": 179020, "epoch": 2156} {"train_loss": -23.749622344970703, "global_step": 179021, "epoch": 2156} {"train_loss": -24.035398483276367, "global_step": 179022, "epoch": 2156} {"train_loss": -23.89344024658203, "global_step": 179023, "epoch": 2156} {"train_loss": -23.966272354125977, "global_step": 179024, "epoch": 2156} {"train_loss": -23.962141036987305, "global_step": 179025, "epoch": 2156} {"train_loss": -24.062047958374023, "global_step": 179026, "epoch": 2156} {"train_loss": -24.31776237487793, "global_step": 179027, "epoch": 2156} {"train_loss": -23.73969841003418, "global_step": 179028, "epoch": 2156} {"train_loss": -23.84963035583496, "global_step": 179029, "epoch": 2156} {"train_loss": -23.801415408950255, "global_step": 179030, "epoch": 2156, "val_loss": 6341658.0} {"train_loss": -23.27197265625, "global_step": 179031, "epoch": 2157} {"train_loss": -22.734466552734375, "global_step": 179032, "epoch": 2157} {"train_loss": -23.21373748779297, "global_step": 179033, "epoch": 2157} {"train_loss": -23.34221649169922, "global_step": 179034, "epoch": 2157} {"train_loss": -23.861164093017578, "global_step": 179035, "epoch": 2157} {"train_loss": -23.548616409301758, "global_step": 179036, "epoch": 2157} {"train_loss": -23.42350196838379, "global_step": 179037, "epoch": 2157} {"train_loss": -24.126527786254883, "global_step": 179038, "epoch": 2157} {"train_loss": -23.872928619384766, "global_step": 179039, "epoch": 2157} {"train_loss": -23.78508758544922, "global_step": 179040, "epoch": 2157} {"train_loss": -23.77627944946289, "global_step": 179041, "epoch": 2157} {"train_loss": -23.948558807373047, "global_step": 179042, "epoch": 2157} {"train_loss": -23.80905532836914, "global_step": 179043, "epoch": 2157} {"train_loss": -23.941980361938477, "global_step": 179044, "epoch": 2157} {"train_loss": -23.94467544555664, "global_step": 179045, "epoch": 2157} {"train_loss": -23.939970016479492, "global_step": 179046, "epoch": 2157} {"train_loss": -23.968564987182617, "global_step": 179047, "epoch": 2157} {"train_loss": -23.781980514526367, "global_step": 179048, "epoch": 2157} {"train_loss": -23.756479263305664, "global_step": 179049, "epoch": 2157} {"train_loss": -24.003583908081055, "global_step": 179050, "epoch": 2157} {"train_loss": -23.813278198242188, "global_step": 179051, "epoch": 2157} {"train_loss": -23.814605712890625, "global_step": 179052, "epoch": 2157} {"train_loss": -23.564279556274414, "global_step": 179053, "epoch": 2157} {"train_loss": -24.145666122436523, "global_step": 179054, "epoch": 2157} {"train_loss": -24.12432289123535, "global_step": 179055, "epoch": 2157} {"train_loss": -23.68277359008789, "global_step": 179056, "epoch": 2157} {"train_loss": -23.698118209838867, "global_step": 179057, "epoch": 2157} {"train_loss": -23.45220947265625, "global_step": 179058, "epoch": 2157} {"train_loss": -23.70992088317871, "global_step": 179059, "epoch": 2157} {"train_loss": -23.811756134033203, "global_step": 179060, "epoch": 2157} {"train_loss": -23.858030319213867, "global_step": 179061, "epoch": 2157} {"train_loss": -23.425758361816406, "global_step": 179062, "epoch": 2157} {"train_loss": -23.9107608795166, "global_step": 179063, "epoch": 2157} {"train_loss": -23.765308380126953, "global_step": 179064, "epoch": 2157} {"train_loss": -23.9570369720459, "global_step": 179065, "epoch": 2157} {"train_loss": -23.789731979370117, "global_step": 179066, "epoch": 2157} {"train_loss": -23.93733024597168, "global_step": 179067, "epoch": 2157} {"train_loss": -24.10390281677246, "global_step": 179068, "epoch": 2157} {"train_loss": -24.051410675048828, "global_step": 179069, "epoch": 2157} {"train_loss": -24.091581344604492, "global_step": 179070, "epoch": 2157} {"train_loss": -23.828205108642578, "global_step": 179071, "epoch": 2157} {"train_loss": -24.120771408081055, "global_step": 179072, "epoch": 2157} {"train_loss": -23.94757652282715, "global_step": 179073, "epoch": 2157} {"train_loss": -24.04207992553711, "global_step": 179074, "epoch": 2157} {"train_loss": -23.650680541992188, "global_step": 179075, "epoch": 2157} {"train_loss": -23.92420768737793, "global_step": 179076, "epoch": 2157} {"train_loss": -23.869766235351562, "global_step": 179077, "epoch": 2157} {"train_loss": -23.96483039855957, "global_step": 179078, "epoch": 2157} {"train_loss": -23.91315269470215, "global_step": 179079, "epoch": 2157} {"train_loss": -24.008474349975586, "global_step": 179080, "epoch": 2157} {"train_loss": -23.776203155517578, "global_step": 179081, "epoch": 2157} {"train_loss": -24.103513717651367, "global_step": 179082, "epoch": 2157} {"train_loss": -23.663909912109375, "global_step": 179083, "epoch": 2157} {"train_loss": -24.126245498657227, "global_step": 179084, "epoch": 2157} {"train_loss": -23.249576568603516, "global_step": 179085, "epoch": 2157} {"train_loss": -24.164995193481445, "global_step": 179086, "epoch": 2157} {"train_loss": -23.771343231201172, "global_step": 179087, "epoch": 2157} {"train_loss": -23.347684860229492, "global_step": 179088, "epoch": 2157} {"train_loss": -23.662431716918945, "global_step": 179089, "epoch": 2157} {"train_loss": -24.126102447509766, "global_step": 179090, "epoch": 2157} {"train_loss": -24.193117141723633, "global_step": 179091, "epoch": 2157} {"train_loss": -23.907363891601562, "global_step": 179092, "epoch": 2157} {"train_loss": -24.061452865600586, "global_step": 179093, "epoch": 2157} {"train_loss": -24.009374618530273, "global_step": 179094, "epoch": 2157} {"train_loss": -23.84320831298828, "global_step": 179095, "epoch": 2157} {"train_loss": -23.92514991760254, "global_step": 179096, "epoch": 2157} {"train_loss": -23.978195190429688, "global_step": 179097, "epoch": 2157} {"train_loss": -24.065048217773438, "global_step": 179098, "epoch": 2157} {"train_loss": -23.987943649291992, "global_step": 179099, "epoch": 2157} {"train_loss": -24.040124893188477, "global_step": 179100, "epoch": 2157} {"train_loss": -24.021717071533203, "global_step": 179101, "epoch": 2157} {"train_loss": -23.6916561126709, "global_step": 179102, "epoch": 2157} {"train_loss": -23.428234100341797, "global_step": 179103, "epoch": 2157} {"train_loss": -23.706541061401367, "global_step": 179104, "epoch": 2157} {"train_loss": -23.624683380126953, "global_step": 179105, "epoch": 2157} {"train_loss": -23.721839904785156, "global_step": 179106, "epoch": 2157} {"train_loss": -24.01003074645996, "global_step": 179107, "epoch": 2157} {"train_loss": -23.725698471069336, "global_step": 179108, "epoch": 2157} {"train_loss": -23.91971206665039, "global_step": 179109, "epoch": 2157} {"train_loss": -24.006269454956055, "global_step": 179110, "epoch": 2157} {"train_loss": -23.8538761138916, "global_step": 179111, "epoch": 2157} {"train_loss": -23.786489486694336, "global_step": 179112, "epoch": 2157} {"train_loss": -23.825244076280708, "global_step": 179113, "epoch": 2157, "val_loss": 6417062.5} {"train_loss": -22.86726188659668, "global_step": 179114, "epoch": 2158} {"train_loss": -21.265155792236328, "global_step": 179115, "epoch": 2158} {"train_loss": -23.367874145507812, "global_step": 179116, "epoch": 2158} {"train_loss": -22.726675033569336, "global_step": 179117, "epoch": 2158} {"train_loss": -22.319921493530273, "global_step": 179118, "epoch": 2158} {"train_loss": -22.89349937438965, "global_step": 179119, "epoch": 2158} {"train_loss": -22.765676498413086, "global_step": 179120, "epoch": 2158} {"train_loss": -23.3814754486084, "global_step": 179121, "epoch": 2158} {"train_loss": -23.070791244506836, "global_step": 179122, "epoch": 2158} {"train_loss": -23.21448516845703, "global_step": 179123, "epoch": 2158} {"train_loss": -22.862224578857422, "global_step": 179124, "epoch": 2158} {"train_loss": -23.19923973083496, "global_step": 179125, "epoch": 2158} {"train_loss": -22.99379539489746, "global_step": 179126, "epoch": 2158} {"train_loss": -23.402847290039062, "global_step": 179127, "epoch": 2158} {"train_loss": -23.479785919189453, "global_step": 179128, "epoch": 2158} {"train_loss": -23.210264205932617, "global_step": 179129, "epoch": 2158} {"train_loss": -23.105329513549805, "global_step": 179130, "epoch": 2158} {"train_loss": -23.284446716308594, "global_step": 179131, "epoch": 2158} {"train_loss": -23.810298919677734, "global_step": 179132, "epoch": 2158} {"train_loss": -23.497976303100586, "global_step": 179133, "epoch": 2158} {"train_loss": -23.6618595123291, "global_step": 179134, "epoch": 2158} {"train_loss": -23.776947021484375, "global_step": 179135, "epoch": 2158} {"train_loss": -23.501182556152344, "global_step": 179136, "epoch": 2158} {"train_loss": -23.708402633666992, "global_step": 179137, "epoch": 2158} {"train_loss": -23.78154182434082, "global_step": 179138, "epoch": 2158} {"train_loss": -23.88491439819336, "global_step": 179139, "epoch": 2158} {"train_loss": -23.610937118530273, "global_step": 179140, "epoch": 2158} {"train_loss": -23.893756866455078, "global_step": 179141, "epoch": 2158} {"train_loss": -23.483795166015625, "global_step": 179142, "epoch": 2158} {"train_loss": -23.43336296081543, "global_step": 179143, "epoch": 2158} {"train_loss": -23.742040634155273, "global_step": 179144, "epoch": 2158} {"train_loss": -23.80328941345215, "global_step": 179145, "epoch": 2158} {"train_loss": -23.9754695892334, "global_step": 179146, "epoch": 2158} {"train_loss": -23.723573684692383, "global_step": 179147, "epoch": 2158} {"train_loss": -24.1425838470459, "global_step": 179148, "epoch": 2158} {"train_loss": -23.801467895507812, "global_step": 179149, "epoch": 2158} {"train_loss": -24.174957275390625, "global_step": 179150, "epoch": 2158} {"train_loss": -24.341062545776367, "global_step": 179151, "epoch": 2158} {"train_loss": -24.573068618774414, "global_step": 179152, "epoch": 2158} {"train_loss": -23.756275177001953, "global_step": 179153, "epoch": 2158} {"train_loss": -23.566415786743164, "global_step": 179154, "epoch": 2158} {"train_loss": -24.207490921020508, "global_step": 179155, "epoch": 2158} {"train_loss": -24.072797775268555, "global_step": 179156, "epoch": 2158} {"train_loss": -24.122772216796875, "global_step": 179157, "epoch": 2158} {"train_loss": -23.923858642578125, "global_step": 179158, "epoch": 2158} {"train_loss": -23.946237564086914, "global_step": 179159, "epoch": 2158} {"train_loss": -24.24574851989746, "global_step": 179160, "epoch": 2158} {"train_loss": -24.022092819213867, "global_step": 179161, "epoch": 2158} {"train_loss": -23.81136703491211, "global_step": 179162, "epoch": 2158} {"train_loss": -24.239561080932617, "global_step": 179163, "epoch": 2158} {"train_loss": -23.71415138244629, "global_step": 179164, "epoch": 2158} {"train_loss": -24.03944206237793, "global_step": 179165, "epoch": 2158} {"train_loss": -24.083890914916992, "global_step": 179166, "epoch": 2158} {"train_loss": -24.085956573486328, "global_step": 179167, "epoch": 2158} {"train_loss": -24.270769119262695, "global_step": 179168, "epoch": 2158} {"train_loss": -23.5916690826416, "global_step": 179169, "epoch": 2158} {"train_loss": -23.806743621826172, "global_step": 179170, "epoch": 2158} {"train_loss": -24.349870681762695, "global_step": 179171, "epoch": 2158} {"train_loss": -24.183202743530273, "global_step": 179172, "epoch": 2158} {"train_loss": -23.894977569580078, "global_step": 179173, "epoch": 2158} {"train_loss": -23.89556312561035, "global_step": 179174, "epoch": 2158} {"train_loss": -23.608552932739258, "global_step": 179175, "epoch": 2158} {"train_loss": -23.35390281677246, "global_step": 179176, "epoch": 2158} {"train_loss": -23.47443962097168, "global_step": 179177, "epoch": 2158} {"train_loss": -23.560001373291016, "global_step": 179178, "epoch": 2158} {"train_loss": -23.949905395507812, "global_step": 179179, "epoch": 2158} {"train_loss": -23.293088912963867, "global_step": 179180, "epoch": 2158} {"train_loss": -23.449621200561523, "global_step": 179181, "epoch": 2158} {"train_loss": -24.024200439453125, "global_step": 179182, "epoch": 2158} {"train_loss": -23.385604858398438, "global_step": 179183, "epoch": 2158} {"train_loss": -23.611852645874023, "global_step": 179184, "epoch": 2158} {"train_loss": -23.714920043945312, "global_step": 179185, "epoch": 2158} {"train_loss": -23.497793197631836, "global_step": 179186, "epoch": 2158} {"train_loss": -23.7117862701416, "global_step": 179187, "epoch": 2158} {"train_loss": -23.80768394470215, "global_step": 179188, "epoch": 2158} {"train_loss": -23.88275146484375, "global_step": 179189, "epoch": 2158} {"train_loss": -23.58395004272461, "global_step": 179190, "epoch": 2158} {"train_loss": -23.51167869567871, "global_step": 179191, "epoch": 2158} {"train_loss": -23.903881072998047, "global_step": 179192, "epoch": 2158} {"train_loss": -23.7196102142334, "global_step": 179193, "epoch": 2158} {"train_loss": -23.71599006652832, "global_step": 179194, "epoch": 2158} {"train_loss": -23.748106002807617, "global_step": 179195, "epoch": 2158} {"train_loss": -23.65251315932676, "global_step": 179196, "epoch": 2158, "val_loss": 6428282.0} {"train_loss": -23.495147705078125, "global_step": 179197, "epoch": 2159} {"train_loss": -23.2463321685791, "global_step": 179198, "epoch": 2159} {"train_loss": -23.8710994720459, "global_step": 179199, "epoch": 2159} {"train_loss": -23.28898811340332, "global_step": 179200, "epoch": 2159} {"train_loss": -23.508567810058594, "global_step": 179201, "epoch": 2159} {"train_loss": -23.854520797729492, "global_step": 179202, "epoch": 2159} {"train_loss": -23.711400985717773, "global_step": 179203, "epoch": 2159} {"train_loss": -23.807861328125, "global_step": 179204, "epoch": 2159} {"train_loss": -23.409048080444336, "global_step": 179205, "epoch": 2159} {"train_loss": -23.926603317260742, "global_step": 179206, "epoch": 2159} {"train_loss": -23.490270614624023, "global_step": 179207, "epoch": 2159} {"train_loss": -23.66286277770996, "global_step": 179208, "epoch": 2159} {"train_loss": -23.74513816833496, "global_step": 179209, "epoch": 2159} {"train_loss": -23.658489227294922, "global_step": 179210, "epoch": 2159} {"train_loss": -23.56793785095215, "global_step": 179211, "epoch": 2159} {"train_loss": -23.666685104370117, "global_step": 179212, "epoch": 2159} {"train_loss": -23.724796295166016, "global_step": 179213, "epoch": 2159} {"train_loss": -23.9294376373291, "global_step": 179214, "epoch": 2159} {"train_loss": -24.003355026245117, "global_step": 179215, "epoch": 2159} {"train_loss": -23.71617889404297, "global_step": 179216, "epoch": 2159} {"train_loss": -23.9406681060791, "global_step": 179217, "epoch": 2159} {"train_loss": -24.06100845336914, "global_step": 179218, "epoch": 2159} {"train_loss": -24.111661911010742, "global_step": 179219, "epoch": 2159} {"train_loss": -23.772581100463867, "global_step": 179220, "epoch": 2159} {"train_loss": -23.499738693237305, "global_step": 179221, "epoch": 2159} {"train_loss": -23.666669845581055, "global_step": 179222, "epoch": 2159} {"train_loss": -23.76213836669922, "global_step": 179223, "epoch": 2159} {"train_loss": -23.73270034790039, "global_step": 179224, "epoch": 2159} {"train_loss": -24.173643112182617, "global_step": 179225, "epoch": 2159} {"train_loss": -23.98187255859375, "global_step": 179226, "epoch": 2159} {"train_loss": -23.8397159576416, "global_step": 179227, "epoch": 2159} {"train_loss": -23.843955993652344, "global_step": 179228, "epoch": 2159} {"train_loss": -23.655973434448242, "global_step": 179229, "epoch": 2159} {"train_loss": -24.24445915222168, "global_step": 179230, "epoch": 2159} {"train_loss": -23.914024353027344, "global_step": 179231, "epoch": 2159} {"train_loss": -23.60701560974121, "global_step": 179232, "epoch": 2159} {"train_loss": -23.917999267578125, "global_step": 179233, "epoch": 2159} {"train_loss": -24.297256469726562, "global_step": 179234, "epoch": 2159} {"train_loss": -24.071653366088867, "global_step": 179235, "epoch": 2159} {"train_loss": -23.861892700195312, "global_step": 179236, "epoch": 2159} {"train_loss": -24.378158569335938, "global_step": 179237, "epoch": 2159} {"train_loss": -23.94784927368164, "global_step": 179238, "epoch": 2159} {"train_loss": -24.071937561035156, "global_step": 179239, "epoch": 2159} {"train_loss": -24.318151473999023, "global_step": 179240, "epoch": 2159} {"train_loss": -23.903547286987305, "global_step": 179241, "epoch": 2159} {"train_loss": -24.18670654296875, "global_step": 179242, "epoch": 2159} {"train_loss": -23.91657829284668, "global_step": 179243, "epoch": 2159} {"train_loss": -23.896724700927734, "global_step": 179244, "epoch": 2159} {"train_loss": -24.111042022705078, "global_step": 179245, "epoch": 2159} {"train_loss": -23.717016220092773, "global_step": 179246, "epoch": 2159} {"train_loss": -23.92243766784668, "global_step": 179247, "epoch": 2159} {"train_loss": -24.093576431274414, "global_step": 179248, "epoch": 2159} {"train_loss": -23.593931198120117, "global_step": 179249, "epoch": 2159} {"train_loss": -23.503936767578125, "global_step": 179250, "epoch": 2159} {"train_loss": -23.665664672851562, "global_step": 179251, "epoch": 2159} {"train_loss": -24.022863388061523, "global_step": 179252, "epoch": 2159} {"train_loss": -23.990182876586914, "global_step": 179253, "epoch": 2159} {"train_loss": -23.573318481445312, "global_step": 179254, "epoch": 2159} {"train_loss": -23.511932373046875, "global_step": 179255, "epoch": 2159} {"train_loss": -23.630435943603516, "global_step": 179256, "epoch": 2159} {"train_loss": -23.832029342651367, "global_step": 179257, "epoch": 2159} {"train_loss": -23.684926986694336, "global_step": 179258, "epoch": 2159} {"train_loss": -23.632801055908203, "global_step": 179259, "epoch": 2159} {"train_loss": -23.8123836517334, "global_step": 179260, "epoch": 2159} {"train_loss": -23.79684829711914, "global_step": 179261, "epoch": 2159} {"train_loss": -24.060218811035156, "global_step": 179262, "epoch": 2159} {"train_loss": -23.65778160095215, "global_step": 179263, "epoch": 2159} {"train_loss": -23.777185440063477, "global_step": 179264, "epoch": 2159} {"train_loss": -23.85738754272461, "global_step": 179265, "epoch": 2159} {"train_loss": -23.709609985351562, "global_step": 179266, "epoch": 2159} {"train_loss": -23.827495574951172, "global_step": 179267, "epoch": 2159} {"train_loss": -23.58034324645996, "global_step": 179268, "epoch": 2159} {"train_loss": -23.80495262145996, "global_step": 179269, "epoch": 2159} {"train_loss": -24.056217193603516, "global_step": 179270, "epoch": 2159} {"train_loss": -24.115751266479492, "global_step": 179271, "epoch": 2159} {"train_loss": -23.75636863708496, "global_step": 179272, "epoch": 2159} {"train_loss": -23.9226016998291, "global_step": 179273, "epoch": 2159} {"train_loss": -23.807294845581055, "global_step": 179274, "epoch": 2159} {"train_loss": -24.05555534362793, "global_step": 179275, "epoch": 2159} {"train_loss": -23.854169845581055, "global_step": 179276, "epoch": 2159} {"train_loss": -24.06403923034668, "global_step": 179277, "epoch": 2159} {"train_loss": -23.67136573791504, "global_step": 179278, "epoch": 2159} {"train_loss": -23.820121742156616, "global_step": 179279, "epoch": 2159, "val_loss": 6376854.5} {"train_loss": -23.87478256225586, "global_step": 179280, "epoch": 2160} {"train_loss": -23.650775909423828, "global_step": 179281, "epoch": 2160} {"train_loss": -23.819095611572266, "global_step": 179282, "epoch": 2160} {"train_loss": -23.686132431030273, "global_step": 179283, "epoch": 2160} {"train_loss": -23.878026962280273, "global_step": 179284, "epoch": 2160} {"train_loss": -23.762264251708984, "global_step": 179285, "epoch": 2160} {"train_loss": -23.447050094604492, "global_step": 179286, "epoch": 2160} {"train_loss": -23.74493980407715, "global_step": 179287, "epoch": 2160} {"train_loss": -23.6232967376709, "global_step": 179288, "epoch": 2160} {"train_loss": -23.808536529541016, "global_step": 179289, "epoch": 2160} {"train_loss": -23.678394317626953, "global_step": 179290, "epoch": 2160} {"train_loss": -23.868545532226562, "global_step": 179291, "epoch": 2160} {"train_loss": -23.74184226989746, "global_step": 179292, "epoch": 2160} {"train_loss": -23.816913604736328, "global_step": 179293, "epoch": 2160} {"train_loss": -23.22085189819336, "global_step": 179294, "epoch": 2160} {"train_loss": -23.783113479614258, "global_step": 179295, "epoch": 2160} {"train_loss": -23.659696578979492, "global_step": 179296, "epoch": 2160} {"train_loss": -23.6479549407959, "global_step": 179297, "epoch": 2160} {"train_loss": -23.587987899780273, "global_step": 179298, "epoch": 2160} {"train_loss": -23.734603881835938, "global_step": 179299, "epoch": 2160} {"train_loss": -23.223533630371094, "global_step": 179300, "epoch": 2160} {"train_loss": -23.91032600402832, "global_step": 179301, "epoch": 2160} {"train_loss": -23.666339874267578, "global_step": 179302, "epoch": 2160} {"train_loss": -23.503944396972656, "global_step": 179303, "epoch": 2160} {"train_loss": -24.03803062438965, "global_step": 179304, "epoch": 2160} {"train_loss": -23.757369995117188, "global_step": 179305, "epoch": 2160} {"train_loss": -23.381240844726562, "global_step": 179306, "epoch": 2160} {"train_loss": -23.817646026611328, "global_step": 179307, "epoch": 2160} {"train_loss": -23.953954696655273, "global_step": 179308, "epoch": 2160} {"train_loss": -23.828638076782227, "global_step": 179309, "epoch": 2160} {"train_loss": -23.94989585876465, "global_step": 179310, "epoch": 2160} {"train_loss": -24.063514709472656, "global_step": 179311, "epoch": 2160} {"train_loss": -23.894683837890625, "global_step": 179312, "epoch": 2160} {"train_loss": -23.693267822265625, "global_step": 179313, "epoch": 2160} {"train_loss": -23.958850860595703, "global_step": 179314, "epoch": 2160} {"train_loss": -23.781360626220703, "global_step": 179315, "epoch": 2160} {"train_loss": -23.70962142944336, "global_step": 179316, "epoch": 2160} {"train_loss": -24.186586380004883, "global_step": 179317, "epoch": 2160} {"train_loss": -23.773151397705078, "global_step": 179318, "epoch": 2160} {"train_loss": -23.883222579956055, "global_step": 179319, "epoch": 2160} {"train_loss": -24.139238357543945, "global_step": 179320, "epoch": 2160} {"train_loss": -23.854263305664062, "global_step": 179321, "epoch": 2160} {"train_loss": -23.91131591796875, "global_step": 179322, "epoch": 2160} {"train_loss": -24.03652000427246, "global_step": 179323, "epoch": 2160} {"train_loss": -24.339445114135742, "global_step": 179324, "epoch": 2160} {"train_loss": -24.074277877807617, "global_step": 179325, "epoch": 2160} {"train_loss": -23.844558715820312, "global_step": 179326, "epoch": 2160} {"train_loss": -24.22560691833496, "global_step": 179327, "epoch": 2160} {"train_loss": -23.70908546447754, "global_step": 179328, "epoch": 2160} {"train_loss": -23.848264694213867, "global_step": 179329, "epoch": 2160} {"train_loss": -23.613595962524414, "global_step": 179330, "epoch": 2160} {"train_loss": -23.778451919555664, "global_step": 179331, "epoch": 2160} {"train_loss": -23.82045555114746, "global_step": 179332, "epoch": 2160} {"train_loss": -23.86546516418457, "global_step": 179333, "epoch": 2160} {"train_loss": -23.895751953125, "global_step": 179334, "epoch": 2160} {"train_loss": -23.68843650817871, "global_step": 179335, "epoch": 2160} {"train_loss": -24.147445678710938, "global_step": 179336, "epoch": 2160} {"train_loss": -24.052064895629883, "global_step": 179337, "epoch": 2160} {"train_loss": -23.888986587524414, "global_step": 179338, "epoch": 2160} {"train_loss": -24.127954483032227, "global_step": 179339, "epoch": 2160} {"train_loss": -24.101716995239258, "global_step": 179340, "epoch": 2160} {"train_loss": -24.094390869140625, "global_step": 179341, "epoch": 2160} {"train_loss": -24.046619415283203, "global_step": 179342, "epoch": 2160} {"train_loss": -23.994550704956055, "global_step": 179343, "epoch": 2160} {"train_loss": -24.018394470214844, "global_step": 179344, "epoch": 2160} {"train_loss": -24.022031784057617, "global_step": 179345, "epoch": 2160} {"train_loss": -23.667369842529297, "global_step": 179346, "epoch": 2160} {"train_loss": -23.95533561706543, "global_step": 179347, "epoch": 2160} {"train_loss": -23.636438369750977, "global_step": 179348, "epoch": 2160} {"train_loss": -24.157623291015625, "global_step": 179349, "epoch": 2160} {"train_loss": -23.926177978515625, "global_step": 179350, "epoch": 2160} {"train_loss": -23.8134822845459, "global_step": 179351, "epoch": 2160} {"train_loss": -24.0140438079834, "global_step": 179352, "epoch": 2160} {"train_loss": -24.04548454284668, "global_step": 179353, "epoch": 2160} {"train_loss": -23.636396408081055, "global_step": 179354, "epoch": 2160} {"train_loss": -24.035898208618164, "global_step": 179355, "epoch": 2160} {"train_loss": -24.001543045043945, "global_step": 179356, "epoch": 2160} {"train_loss": -23.92426109313965, "global_step": 179357, "epoch": 2160} {"train_loss": -24.161392211914062, "global_step": 179358, "epoch": 2160} {"train_loss": -23.655410766601562, "global_step": 179359, "epoch": 2160} {"train_loss": -24.06293296813965, "global_step": 179360, "epoch": 2160} {"train_loss": -24.125078201293945, "global_step": 179361, "epoch": 2160} {"train_loss": -23.862867102565534, "global_step": 179362, "epoch": 2160, "val_loss": 6572369.5} {"train_loss": -23.384326934814453, "global_step": 179363, "epoch": 2161} {"train_loss": -22.905410766601562, "global_step": 179364, "epoch": 2161} {"train_loss": -22.980077743530273, "global_step": 179365, "epoch": 2161} {"train_loss": -23.364566802978516, "global_step": 179366, "epoch": 2161} {"train_loss": -22.852903366088867, "global_step": 179367, "epoch": 2161} {"train_loss": -22.89103889465332, "global_step": 179368, "epoch": 2161} {"train_loss": -23.501684188842773, "global_step": 179369, "epoch": 2161} {"train_loss": -23.032304763793945, "global_step": 179370, "epoch": 2161} {"train_loss": -23.312963485717773, "global_step": 179371, "epoch": 2161} {"train_loss": -23.4724063873291, "global_step": 179372, "epoch": 2161} {"train_loss": -23.150257110595703, "global_step": 179373, "epoch": 2161} {"train_loss": -23.677997589111328, "global_step": 179374, "epoch": 2161} {"train_loss": -23.638513565063477, "global_step": 179375, "epoch": 2161} {"train_loss": -23.56820297241211, "global_step": 179376, "epoch": 2161} {"train_loss": -23.616701126098633, "global_step": 179377, "epoch": 2161} {"train_loss": -23.31564712524414, "global_step": 179378, "epoch": 2161} {"train_loss": -23.565805435180664, "global_step": 179379, "epoch": 2161} {"train_loss": -23.52143669128418, "global_step": 179380, "epoch": 2161} {"train_loss": -23.57199478149414, "global_step": 179381, "epoch": 2161} {"train_loss": -23.443262100219727, "global_step": 179382, "epoch": 2161} {"train_loss": -23.328323364257812, "global_step": 179383, "epoch": 2161} {"train_loss": -23.666269302368164, "global_step": 179384, "epoch": 2161} {"train_loss": -23.79905891418457, "global_step": 179385, "epoch": 2161} {"train_loss": -23.43571662902832, "global_step": 179386, "epoch": 2161} {"train_loss": -23.77288818359375, "global_step": 179387, "epoch": 2161} {"train_loss": -23.676040649414062, "global_step": 179388, "epoch": 2161} {"train_loss": -23.94989585876465, "global_step": 179389, "epoch": 2161} {"train_loss": -23.93440818786621, "global_step": 179390, "epoch": 2161} {"train_loss": -23.73301887512207, "global_step": 179391, "epoch": 2161} {"train_loss": -23.56235694885254, "global_step": 179392, "epoch": 2161} {"train_loss": -23.736648559570312, "global_step": 179393, "epoch": 2161} {"train_loss": -23.829456329345703, "global_step": 179394, "epoch": 2161} {"train_loss": -23.972503662109375, "global_step": 179395, "epoch": 2161} {"train_loss": -23.90011978149414, "global_step": 179396, "epoch": 2161} {"train_loss": -23.70353126525879, "global_step": 179397, "epoch": 2161} {"train_loss": -23.8038387298584, "global_step": 179398, "epoch": 2161} {"train_loss": -23.794897079467773, "global_step": 179399, "epoch": 2161} {"train_loss": -23.80348777770996, "global_step": 179400, "epoch": 2161} {"train_loss": -23.822912216186523, "global_step": 179401, "epoch": 2161} {"train_loss": -23.731801986694336, "global_step": 179402, "epoch": 2161} {"train_loss": -23.816102981567383, "global_step": 179403, "epoch": 2161} {"train_loss": -23.7659854888916, "global_step": 179404, "epoch": 2161} {"train_loss": -23.768564224243164, "global_step": 179405, "epoch": 2161} {"train_loss": -23.80216407775879, "global_step": 179406, "epoch": 2161} {"train_loss": -23.66344451904297, "global_step": 179407, "epoch": 2161} {"train_loss": -23.963834762573242, "global_step": 179408, "epoch": 2161} {"train_loss": -23.903894424438477, "global_step": 179409, "epoch": 2161} {"train_loss": -23.488073348999023, "global_step": 179410, "epoch": 2161} {"train_loss": -23.59261131286621, "global_step": 179411, "epoch": 2161} {"train_loss": -23.622238159179688, "global_step": 179412, "epoch": 2161} {"train_loss": -24.11720085144043, "global_step": 179413, "epoch": 2161} {"train_loss": -23.683090209960938, "global_step": 179414, "epoch": 2161} {"train_loss": -23.83149528503418, "global_step": 179415, "epoch": 2161} {"train_loss": -23.878095626831055, "global_step": 179416, "epoch": 2161} {"train_loss": -23.798574447631836, "global_step": 179417, "epoch": 2161} {"train_loss": -23.792871475219727, "global_step": 179418, "epoch": 2161} {"train_loss": -23.879953384399414, "global_step": 179419, "epoch": 2161} {"train_loss": -23.80769157409668, "global_step": 179420, "epoch": 2161} {"train_loss": -23.998151779174805, "global_step": 179421, "epoch": 2161} {"train_loss": -23.830148696899414, "global_step": 179422, "epoch": 2161} {"train_loss": -24.043476104736328, "global_step": 179423, "epoch": 2161} {"train_loss": -23.71698570251465, "global_step": 179424, "epoch": 2161} {"train_loss": -24.078662872314453, "global_step": 179425, "epoch": 2161} {"train_loss": -23.9934024810791, "global_step": 179426, "epoch": 2161} {"train_loss": -23.76651382446289, "global_step": 179427, "epoch": 2161} {"train_loss": -23.961536407470703, "global_step": 179428, "epoch": 2161} {"train_loss": -24.143056869506836, "global_step": 179429, "epoch": 2161} {"train_loss": -23.85853385925293, "global_step": 179430, "epoch": 2161} {"train_loss": -23.689273834228516, "global_step": 179431, "epoch": 2161} {"train_loss": -24.097238540649414, "global_step": 179432, "epoch": 2161} {"train_loss": -24.112899780273438, "global_step": 179433, "epoch": 2161} {"train_loss": -23.79060935974121, "global_step": 179434, "epoch": 2161} {"train_loss": -24.410898208618164, "global_step": 179435, "epoch": 2161} {"train_loss": -23.861892700195312, "global_step": 179436, "epoch": 2161} {"train_loss": -24.17401123046875, "global_step": 179437, "epoch": 2161} {"train_loss": -23.789081573486328, "global_step": 179438, "epoch": 2161} {"train_loss": -24.499364852905273, "global_step": 179439, "epoch": 2161} {"train_loss": -23.75908660888672, "global_step": 179440, "epoch": 2161} {"train_loss": -24.311450958251953, "global_step": 179441, "epoch": 2161} {"train_loss": -24.256114959716797, "global_step": 179442, "epoch": 2161} {"train_loss": -24.03220558166504, "global_step": 179443, "epoch": 2161} {"train_loss": -24.048797607421875, "global_step": 179444, "epoch": 2161} {"train_loss": -23.75978311285915, "global_step": 179445, "epoch": 2161, "val_loss": 6445417.0} {"train_loss": -21.11850357055664, "global_step": 179446, "epoch": 2162} {"train_loss": -23.13081169128418, "global_step": 179447, "epoch": 2162} {"train_loss": -23.427433013916016, "global_step": 179448, "epoch": 2162} {"train_loss": -23.219778060913086, "global_step": 179449, "epoch": 2162} {"train_loss": -23.623306274414062, "global_step": 179450, "epoch": 2162} {"train_loss": -23.13294219970703, "global_step": 179451, "epoch": 2162} {"train_loss": -23.225841522216797, "global_step": 179452, "epoch": 2162} {"train_loss": -23.263072967529297, "global_step": 179453, "epoch": 2162} {"train_loss": -23.419933319091797, "global_step": 179454, "epoch": 2162} {"train_loss": -23.193918228149414, "global_step": 179455, "epoch": 2162} {"train_loss": -23.215381622314453, "global_step": 179456, "epoch": 2162} {"train_loss": -23.517597198486328, "global_step": 179457, "epoch": 2162} {"train_loss": -23.402734756469727, "global_step": 179458, "epoch": 2162} {"train_loss": -23.528736114501953, "global_step": 179459, "epoch": 2162} {"train_loss": -23.476072311401367, "global_step": 179460, "epoch": 2162} {"train_loss": -23.074182510375977, "global_step": 179461, "epoch": 2162} {"train_loss": -23.531110763549805, "global_step": 179462, "epoch": 2162} {"train_loss": -23.479755401611328, "global_step": 179463, "epoch": 2162} {"train_loss": -23.764217376708984, "global_step": 179464, "epoch": 2162} {"train_loss": -23.644866943359375, "global_step": 179465, "epoch": 2162} {"train_loss": -23.693071365356445, "global_step": 179466, "epoch": 2162} {"train_loss": -23.534162521362305, "global_step": 179467, "epoch": 2162} {"train_loss": -24.0295352935791, "global_step": 179468, "epoch": 2162} {"train_loss": -23.734127044677734, "global_step": 179469, "epoch": 2162} {"train_loss": -23.566864013671875, "global_step": 179470, "epoch": 2162} {"train_loss": -23.64365577697754, "global_step": 179471, "epoch": 2162} {"train_loss": -23.70674705505371, "global_step": 179472, "epoch": 2162} {"train_loss": -23.92133331298828, "global_step": 179473, "epoch": 2162} {"train_loss": -23.589887619018555, "global_step": 179474, "epoch": 2162} {"train_loss": -23.723560333251953, "global_step": 179475, "epoch": 2162} {"train_loss": -23.922109603881836, "global_step": 179476, "epoch": 2162} {"train_loss": -23.721059799194336, "global_step": 179477, "epoch": 2162} {"train_loss": -24.028562545776367, "global_step": 179478, "epoch": 2162} {"train_loss": -23.765567779541016, "global_step": 179479, "epoch": 2162} {"train_loss": -23.773574829101562, "global_step": 179480, "epoch": 2162} {"train_loss": -23.87031364440918, "global_step": 179481, "epoch": 2162} {"train_loss": -23.724956512451172, "global_step": 179482, "epoch": 2162} {"train_loss": -23.938199996948242, "global_step": 179483, "epoch": 2162} {"train_loss": -23.973554611206055, "global_step": 179484, "epoch": 2162} {"train_loss": -24.007564544677734, "global_step": 179485, "epoch": 2162} {"train_loss": -23.840930938720703, "global_step": 179486, "epoch": 2162} {"train_loss": -24.1291561126709, "global_step": 179487, "epoch": 2162} {"train_loss": -23.7222900390625, "global_step": 179488, "epoch": 2162} {"train_loss": -23.97360610961914, "global_step": 179489, "epoch": 2162} {"train_loss": -23.8020076751709, "global_step": 179490, "epoch": 2162} {"train_loss": -23.957639694213867, "global_step": 179491, "epoch": 2162} {"train_loss": -23.826059341430664, "global_step": 179492, "epoch": 2162} {"train_loss": -23.959516525268555, "global_step": 179493, "epoch": 2162} {"train_loss": -23.792957305908203, "global_step": 179494, "epoch": 2162} {"train_loss": -23.997671127319336, "global_step": 179495, "epoch": 2162} {"train_loss": -23.866132736206055, "global_step": 179496, "epoch": 2162} {"train_loss": -24.036291122436523, "global_step": 179497, "epoch": 2162} {"train_loss": -24.421056747436523, "global_step": 179498, "epoch": 2162} {"train_loss": -23.81125259399414, "global_step": 179499, "epoch": 2162} {"train_loss": -23.95551872253418, "global_step": 179500, "epoch": 2162} {"train_loss": -24.318328857421875, "global_step": 179501, "epoch": 2162} {"train_loss": -24.064666748046875, "global_step": 179502, "epoch": 2162} {"train_loss": -24.037677764892578, "global_step": 179503, "epoch": 2162} {"train_loss": -23.82196044921875, "global_step": 179504, "epoch": 2162} {"train_loss": -23.9424991607666, "global_step": 179505, "epoch": 2162} {"train_loss": -24.326269149780273, "global_step": 179506, "epoch": 2162} {"train_loss": -23.561079025268555, "global_step": 179507, "epoch": 2162} {"train_loss": -23.897232055664062, "global_step": 179508, "epoch": 2162} {"train_loss": -23.822647094726562, "global_step": 179509, "epoch": 2162} {"train_loss": -23.925296783447266, "global_step": 179510, "epoch": 2162} {"train_loss": -23.676916122436523, "global_step": 179511, "epoch": 2162} {"train_loss": -23.514413833618164, "global_step": 179512, "epoch": 2162} {"train_loss": -23.687108993530273, "global_step": 179513, "epoch": 2162} {"train_loss": -23.985000610351562, "global_step": 179514, "epoch": 2162} {"train_loss": -24.043506622314453, "global_step": 179515, "epoch": 2162} {"train_loss": -23.757898330688477, "global_step": 179516, "epoch": 2162} {"train_loss": -23.74979591369629, "global_step": 179517, "epoch": 2162} {"train_loss": -23.883583068847656, "global_step": 179518, "epoch": 2162} {"train_loss": -23.970876693725586, "global_step": 179519, "epoch": 2162} {"train_loss": -23.905994415283203, "global_step": 179520, "epoch": 2162} {"train_loss": -23.811176300048828, "global_step": 179521, "epoch": 2162} {"train_loss": -23.950788497924805, "global_step": 179522, "epoch": 2162} {"train_loss": -23.812646865844727, "global_step": 179523, "epoch": 2162} {"train_loss": -23.92902946472168, "global_step": 179524, "epoch": 2162} {"train_loss": -24.059738159179688, "global_step": 179525, "epoch": 2162} {"train_loss": -23.89693832397461, "global_step": 179526, "epoch": 2162} {"train_loss": -24.153051376342773, "global_step": 179527, "epoch": 2162} {"train_loss": -23.732795485530993, "global_step": 179528, "epoch": 2162, "val_loss": 6430949.0} {"train_loss": -22.844757080078125, "global_step": 179529, "epoch": 2163} {"train_loss": -22.907062530517578, "global_step": 179530, "epoch": 2163} {"train_loss": -23.4349422454834, "global_step": 179531, "epoch": 2163} {"train_loss": -23.088367462158203, "global_step": 179532, "epoch": 2163} {"train_loss": -22.857206344604492, "global_step": 179533, "epoch": 2163} {"train_loss": -23.370859146118164, "global_step": 179534, "epoch": 2163} {"train_loss": -23.394956588745117, "global_step": 179535, "epoch": 2163} {"train_loss": -23.667734146118164, "global_step": 179536, "epoch": 2163} {"train_loss": -23.8712100982666, "global_step": 179537, "epoch": 2163} {"train_loss": -23.448755264282227, "global_step": 179538, "epoch": 2163} {"train_loss": -23.552900314331055, "global_step": 179539, "epoch": 2163} {"train_loss": -23.05841636657715, "global_step": 179540, "epoch": 2163} {"train_loss": -23.607341766357422, "global_step": 179541, "epoch": 2163} {"train_loss": -23.747526168823242, "global_step": 179542, "epoch": 2163} {"train_loss": -23.65428352355957, "global_step": 179543, "epoch": 2163} {"train_loss": -23.780319213867188, "global_step": 179544, "epoch": 2163} {"train_loss": -23.443750381469727, "global_step": 179545, "epoch": 2163} {"train_loss": -23.88140296936035, "global_step": 179546, "epoch": 2163} {"train_loss": -23.514450073242188, "global_step": 179547, "epoch": 2163} {"train_loss": -23.56338119506836, "global_step": 179548, "epoch": 2163} {"train_loss": -23.881975173950195, "global_step": 179549, "epoch": 2163} {"train_loss": -23.407052993774414, "global_step": 179550, "epoch": 2163} {"train_loss": -23.543663024902344, "global_step": 179551, "epoch": 2163} {"train_loss": -23.877851486206055, "global_step": 179552, "epoch": 2163} {"train_loss": -23.724933624267578, "global_step": 179553, "epoch": 2163} {"train_loss": -23.98226547241211, "global_step": 179554, "epoch": 2163} {"train_loss": -23.81465721130371, "global_step": 179555, "epoch": 2163} {"train_loss": -23.68238639831543, "global_step": 179556, "epoch": 2163} {"train_loss": -23.776123046875, "global_step": 179557, "epoch": 2163} {"train_loss": -23.831815719604492, "global_step": 179558, "epoch": 2163} {"train_loss": -24.15450668334961, "global_step": 179559, "epoch": 2163} {"train_loss": -23.895402908325195, "global_step": 179560, "epoch": 2163} {"train_loss": -24.215967178344727, "global_step": 179561, "epoch": 2163} {"train_loss": -23.889890670776367, "global_step": 179562, "epoch": 2163} {"train_loss": -23.80783462524414, "global_step": 179563, "epoch": 2163} {"train_loss": -24.081865310668945, "global_step": 179564, "epoch": 2163} {"train_loss": -24.082956314086914, "global_step": 179565, "epoch": 2163} {"train_loss": -23.93794822692871, "global_step": 179566, "epoch": 2163} {"train_loss": -24.007177352905273, "global_step": 179567, "epoch": 2163} {"train_loss": -24.029312133789062, "global_step": 179568, "epoch": 2163} {"train_loss": -23.843305587768555, "global_step": 179569, "epoch": 2163} {"train_loss": -24.185312271118164, "global_step": 179570, "epoch": 2163} {"train_loss": -23.82640266418457, "global_step": 179571, "epoch": 2163} {"train_loss": -23.887535095214844, "global_step": 179572, "epoch": 2163} {"train_loss": -24.190706253051758, "global_step": 179573, "epoch": 2163} {"train_loss": -24.059141159057617, "global_step": 179574, "epoch": 2163} {"train_loss": -23.706058502197266, "global_step": 179575, "epoch": 2163} {"train_loss": -24.227256774902344, "global_step": 179576, "epoch": 2163} {"train_loss": -24.047693252563477, "global_step": 179577, "epoch": 2163} {"train_loss": -24.034912109375, "global_step": 179578, "epoch": 2163} {"train_loss": -24.327547073364258, "global_step": 179579, "epoch": 2163} {"train_loss": -23.884449005126953, "global_step": 179580, "epoch": 2163} {"train_loss": -23.672042846679688, "global_step": 179581, "epoch": 2163} {"train_loss": -23.839956283569336, "global_step": 179582, "epoch": 2163} {"train_loss": -24.35599708557129, "global_step": 179583, "epoch": 2163} {"train_loss": -23.81048011779785, "global_step": 179584, "epoch": 2163} {"train_loss": -23.994701385498047, "global_step": 179585, "epoch": 2163} {"train_loss": -23.70527458190918, "global_step": 179586, "epoch": 2163} {"train_loss": -23.34173011779785, "global_step": 179587, "epoch": 2163} {"train_loss": -23.595731735229492, "global_step": 179588, "epoch": 2163} {"train_loss": -23.757638931274414, "global_step": 179589, "epoch": 2163} {"train_loss": -23.829137802124023, "global_step": 179590, "epoch": 2163} {"train_loss": -23.805246353149414, "global_step": 179591, "epoch": 2163} {"train_loss": -24.034141540527344, "global_step": 179592, "epoch": 2163} {"train_loss": -24.201854705810547, "global_step": 179593, "epoch": 2163} {"train_loss": -24.03714942932129, "global_step": 179594, "epoch": 2163} {"train_loss": -24.38045310974121, "global_step": 179595, "epoch": 2163} {"train_loss": -24.0513973236084, "global_step": 179596, "epoch": 2163} {"train_loss": -23.92531394958496, "global_step": 179597, "epoch": 2163} {"train_loss": -23.82744026184082, "global_step": 179598, "epoch": 2163} {"train_loss": -23.765432357788086, "global_step": 179599, "epoch": 2163} {"train_loss": -23.7335147857666, "global_step": 179600, "epoch": 2163} {"train_loss": -23.74155044555664, "global_step": 179601, "epoch": 2163} {"train_loss": -23.713132858276367, "global_step": 179602, "epoch": 2163} {"train_loss": -23.827865600585938, "global_step": 179603, "epoch": 2163} {"train_loss": -23.31096839904785, "global_step": 179604, "epoch": 2163} {"train_loss": -23.69672966003418, "global_step": 179605, "epoch": 2163} {"train_loss": -23.791349411010742, "global_step": 179606, "epoch": 2163} {"train_loss": -23.808956146240234, "global_step": 179607, "epoch": 2163} {"train_loss": -23.949689865112305, "global_step": 179608, "epoch": 2163} {"train_loss": -23.712556838989258, "global_step": 179609, "epoch": 2163} {"train_loss": -23.856489181518555, "global_step": 179610, "epoch": 2163} {"train_loss": -23.774404985358917, "global_step": 179611, "epoch": 2163, "val_loss": 6470507.0} {"train_loss": -22.45746421813965, "global_step": 179612, "epoch": 2164} {"train_loss": -23.22623062133789, "global_step": 179613, "epoch": 2164} {"train_loss": -23.230375289916992, "global_step": 179614, "epoch": 2164} {"train_loss": -22.855579376220703, "global_step": 179615, "epoch": 2164} {"train_loss": -23.355010986328125, "global_step": 179616, "epoch": 2164} {"train_loss": -23.09881591796875, "global_step": 179617, "epoch": 2164} {"train_loss": -23.096952438354492, "global_step": 179618, "epoch": 2164} {"train_loss": -23.44719123840332, "global_step": 179619, "epoch": 2164} {"train_loss": -22.886035919189453, "global_step": 179620, "epoch": 2164} {"train_loss": -23.293819427490234, "global_step": 179621, "epoch": 2164} {"train_loss": -23.294952392578125, "global_step": 179622, "epoch": 2164} {"train_loss": -23.57447624206543, "global_step": 179623, "epoch": 2164} {"train_loss": -23.410507202148438, "global_step": 179624, "epoch": 2164} {"train_loss": -23.70479393005371, "global_step": 179625, "epoch": 2164} {"train_loss": -23.591506958007812, "global_step": 179626, "epoch": 2164} {"train_loss": -23.53484535217285, "global_step": 179627, "epoch": 2164} {"train_loss": -23.454179763793945, "global_step": 179628, "epoch": 2164} {"train_loss": -23.51579475402832, "global_step": 179629, "epoch": 2164} {"train_loss": -23.51838493347168, "global_step": 179630, "epoch": 2164} {"train_loss": -23.644025802612305, "global_step": 179631, "epoch": 2164} {"train_loss": -23.37603759765625, "global_step": 179632, "epoch": 2164} {"train_loss": -23.36464500427246, "global_step": 179633, "epoch": 2164} {"train_loss": -23.59982681274414, "global_step": 179634, "epoch": 2164} {"train_loss": -23.853647232055664, "global_step": 179635, "epoch": 2164} {"train_loss": -23.645009994506836, "global_step": 179636, "epoch": 2164} {"train_loss": -23.613481521606445, "global_step": 179637, "epoch": 2164} {"train_loss": -23.823078155517578, "global_step": 179638, "epoch": 2164} {"train_loss": -23.792163848876953, "global_step": 179639, "epoch": 2164} {"train_loss": -23.537343978881836, "global_step": 179640, "epoch": 2164} {"train_loss": -23.68365478515625, "global_step": 179641, "epoch": 2164} {"train_loss": -23.664823532104492, "global_step": 179642, "epoch": 2164} {"train_loss": -23.750699996948242, "global_step": 179643, "epoch": 2164} {"train_loss": -23.598451614379883, "global_step": 179644, "epoch": 2164} {"train_loss": -23.843647003173828, "global_step": 179645, "epoch": 2164} {"train_loss": -24.244863510131836, "global_step": 179646, "epoch": 2164} {"train_loss": -23.766874313354492, "global_step": 179647, "epoch": 2164} {"train_loss": -23.846242904663086, "global_step": 179648, "epoch": 2164} {"train_loss": -23.55373191833496, "global_step": 179649, "epoch": 2164} {"train_loss": -23.84126091003418, "global_step": 179650, "epoch": 2164} {"train_loss": -24.06729507446289, "global_step": 179651, "epoch": 2164} {"train_loss": -23.793554306030273, "global_step": 179652, "epoch": 2164} {"train_loss": -23.981815338134766, "global_step": 179653, "epoch": 2164} {"train_loss": -24.46549415588379, "global_step": 179654, "epoch": 2164} {"train_loss": -23.700763702392578, "global_step": 179655, "epoch": 2164} {"train_loss": -23.639684677124023, "global_step": 179656, "epoch": 2164} {"train_loss": -24.140087127685547, "global_step": 179657, "epoch": 2164} {"train_loss": -23.952110290527344, "global_step": 179658, "epoch": 2164} {"train_loss": -24.01816177368164, "global_step": 179659, "epoch": 2164} {"train_loss": -23.96643829345703, "global_step": 179660, "epoch": 2164} {"train_loss": -23.890064239501953, "global_step": 179661, "epoch": 2164} {"train_loss": -23.614957809448242, "global_step": 179662, "epoch": 2164} {"train_loss": -24.063697814941406, "global_step": 179663, "epoch": 2164} {"train_loss": -23.9955997467041, "global_step": 179664, "epoch": 2164} {"train_loss": -24.22645378112793, "global_step": 179665, "epoch": 2164} {"train_loss": -24.038705825805664, "global_step": 179666, "epoch": 2164} {"train_loss": -24.077680587768555, "global_step": 179667, "epoch": 2164} {"train_loss": -24.15643882751465, "global_step": 179668, "epoch": 2164} {"train_loss": -24.057836532592773, "global_step": 179669, "epoch": 2164} {"train_loss": -24.042699813842773, "global_step": 179670, "epoch": 2164} {"train_loss": -23.643686294555664, "global_step": 179671, "epoch": 2164} {"train_loss": -23.908157348632812, "global_step": 179672, "epoch": 2164} {"train_loss": -23.921504974365234, "global_step": 179673, "epoch": 2164} {"train_loss": -24.199817657470703, "global_step": 179674, "epoch": 2164} {"train_loss": -24.04656982421875, "global_step": 179675, "epoch": 2164} {"train_loss": -24.307476043701172, "global_step": 179676, "epoch": 2164} {"train_loss": -24.040937423706055, "global_step": 179677, "epoch": 2164} {"train_loss": -23.873870849609375, "global_step": 179678, "epoch": 2164} {"train_loss": -24.100574493408203, "global_step": 179679, "epoch": 2164} {"train_loss": -23.678274154663086, "global_step": 179680, "epoch": 2164} {"train_loss": -24.028005599975586, "global_step": 179681, "epoch": 2164} {"train_loss": -23.881818771362305, "global_step": 179682, "epoch": 2164} {"train_loss": -23.91792106628418, "global_step": 179683, "epoch": 2164} {"train_loss": -23.72878074645996, "global_step": 179684, "epoch": 2164} {"train_loss": -23.905046463012695, "global_step": 179685, "epoch": 2164} {"train_loss": -23.453649520874023, "global_step": 179686, "epoch": 2164} {"train_loss": -23.65298080444336, "global_step": 179687, "epoch": 2164} {"train_loss": -24.018346786499023, "global_step": 179688, "epoch": 2164} {"train_loss": -24.06389045715332, "global_step": 179689, "epoch": 2164} {"train_loss": -24.01326560974121, "global_step": 179690, "epoch": 2164} {"train_loss": -23.608522415161133, "global_step": 179691, "epoch": 2164} {"train_loss": -23.740264892578125, "global_step": 179692, "epoch": 2164} {"train_loss": -24.13348388671875, "global_step": 179693, "epoch": 2164} {"train_loss": -23.750551821237586, "global_step": 179694, "epoch": 2164, "val_loss": 6442233.5} {"train_loss": -23.437055587768555, "global_step": 179695, "epoch": 2165} {"train_loss": -23.714521408081055, "global_step": 179696, "epoch": 2165} {"train_loss": -23.269943237304688, "global_step": 179697, "epoch": 2165} {"train_loss": -23.861328125, "global_step": 179698, "epoch": 2165} {"train_loss": -23.48617935180664, "global_step": 179699, "epoch": 2165} {"train_loss": -23.63551139831543, "global_step": 179700, "epoch": 2165} {"train_loss": -23.446287155151367, "global_step": 179701, "epoch": 2165} {"train_loss": -23.949419021606445, "global_step": 179702, "epoch": 2165} {"train_loss": -23.78376579284668, "global_step": 179703, "epoch": 2165} {"train_loss": -23.567686080932617, "global_step": 179704, "epoch": 2165} {"train_loss": -23.655044555664062, "global_step": 179705, "epoch": 2165} {"train_loss": -23.751379013061523, "global_step": 179706, "epoch": 2165} {"train_loss": -23.862899780273438, "global_step": 179707, "epoch": 2165} {"train_loss": -23.44040298461914, "global_step": 179708, "epoch": 2165} {"train_loss": -23.72565269470215, "global_step": 179709, "epoch": 2165} {"train_loss": -24.128578186035156, "global_step": 179710, "epoch": 2165} {"train_loss": -24.117427825927734, "global_step": 179711, "epoch": 2165} {"train_loss": -23.886722564697266, "global_step": 179712, "epoch": 2165} {"train_loss": -24.056800842285156, "global_step": 179713, "epoch": 2165} {"train_loss": -23.4925594329834, "global_step": 179714, "epoch": 2165} {"train_loss": -23.739004135131836, "global_step": 179715, "epoch": 2165} {"train_loss": -23.950260162353516, "global_step": 179716, "epoch": 2165} {"train_loss": -24.122922897338867, "global_step": 179717, "epoch": 2165} {"train_loss": -24.052440643310547, "global_step": 179718, "epoch": 2165} {"train_loss": -24.010211944580078, "global_step": 179719, "epoch": 2165} {"train_loss": -24.09549331665039, "global_step": 179720, "epoch": 2165} {"train_loss": -24.514219284057617, "global_step": 179721, "epoch": 2165} {"train_loss": -24.27016258239746, "global_step": 179722, "epoch": 2165} {"train_loss": -23.860567092895508, "global_step": 179723, "epoch": 2165} {"train_loss": -23.625286102294922, "global_step": 179724, "epoch": 2165} {"train_loss": -23.988378524780273, "global_step": 179725, "epoch": 2165} {"train_loss": -24.002397537231445, "global_step": 179726, "epoch": 2165} {"train_loss": -23.683813095092773, "global_step": 179727, "epoch": 2165} {"train_loss": -23.810489654541016, "global_step": 179728, "epoch": 2165} {"train_loss": -24.04901695251465, "global_step": 179729, "epoch": 2165} {"train_loss": -24.027769088745117, "global_step": 179730, "epoch": 2165} {"train_loss": -23.896209716796875, "global_step": 179731, "epoch": 2165} {"train_loss": -24.290586471557617, "global_step": 179732, "epoch": 2165} {"train_loss": -23.816295623779297, "global_step": 179733, "epoch": 2165} {"train_loss": -24.246353149414062, "global_step": 179734, "epoch": 2165} {"train_loss": -23.939748764038086, "global_step": 179735, "epoch": 2165} {"train_loss": -23.99757194519043, "global_step": 179736, "epoch": 2165} {"train_loss": -24.12282371520996, "global_step": 179737, "epoch": 2165} {"train_loss": -23.546924591064453, "global_step": 179738, "epoch": 2165} {"train_loss": -23.458297729492188, "global_step": 179739, "epoch": 2165} {"train_loss": -23.741287231445312, "global_step": 179740, "epoch": 2165} {"train_loss": -24.18330192565918, "global_step": 179741, "epoch": 2165} {"train_loss": -23.836002349853516, "global_step": 179742, "epoch": 2165} {"train_loss": -23.96261215209961, "global_step": 179743, "epoch": 2165} {"train_loss": -23.63112449645996, "global_step": 179744, "epoch": 2165} {"train_loss": -24.138242721557617, "global_step": 179745, "epoch": 2165} {"train_loss": -24.216991424560547, "global_step": 179746, "epoch": 2165} {"train_loss": -24.34343910217285, "global_step": 179747, "epoch": 2165} {"train_loss": -24.013134002685547, "global_step": 179748, "epoch": 2165} {"train_loss": -24.188283920288086, "global_step": 179749, "epoch": 2165} {"train_loss": -23.815982818603516, "global_step": 179750, "epoch": 2165} {"train_loss": -23.91489028930664, "global_step": 179751, "epoch": 2165} {"train_loss": -24.265213012695312, "global_step": 179752, "epoch": 2165} {"train_loss": -23.67630958557129, "global_step": 179753, "epoch": 2165} {"train_loss": -24.272850036621094, "global_step": 179754, "epoch": 2165} {"train_loss": -23.994571685791016, "global_step": 179755, "epoch": 2165} {"train_loss": -23.72824478149414, "global_step": 179756, "epoch": 2165} {"train_loss": -24.079675674438477, "global_step": 179757, "epoch": 2165} {"train_loss": -23.864648818969727, "global_step": 179758, "epoch": 2165} {"train_loss": -23.77117347717285, "global_step": 179759, "epoch": 2165} {"train_loss": -23.881235122680664, "global_step": 179760, "epoch": 2165} {"train_loss": -23.756439208984375, "global_step": 179761, "epoch": 2165} {"train_loss": -23.772830963134766, "global_step": 179762, "epoch": 2165} {"train_loss": -23.650083541870117, "global_step": 179763, "epoch": 2165} {"train_loss": -23.778419494628906, "global_step": 179764, "epoch": 2165} {"train_loss": -23.693313598632812, "global_step": 179765, "epoch": 2165} {"train_loss": -23.949039459228516, "global_step": 179766, "epoch": 2165} {"train_loss": -23.72588348388672, "global_step": 179767, "epoch": 2165} {"train_loss": -23.777814865112305, "global_step": 179768, "epoch": 2165} {"train_loss": -23.993337631225586, "global_step": 179769, "epoch": 2165} {"train_loss": -23.733173370361328, "global_step": 179770, "epoch": 2165} {"train_loss": -23.842971801757812, "global_step": 179771, "epoch": 2165} {"train_loss": -23.9692440032959, "global_step": 179772, "epoch": 2165} {"train_loss": -24.08827018737793, "global_step": 179773, "epoch": 2165} {"train_loss": -23.726224899291992, "global_step": 179774, "epoch": 2165} {"train_loss": -23.88508415222168, "global_step": 179775, "epoch": 2165} {"train_loss": -23.640851974487305, "global_step": 179776, "epoch": 2165} {"train_loss": -23.8787005091288, "global_step": 179777, "epoch": 2165, "val_loss": 6355651.0} {"train_loss": -23.5685977935791, "global_step": 179778, "epoch": 2166} {"train_loss": -23.2471923828125, "global_step": 179779, "epoch": 2166} {"train_loss": -23.80392074584961, "global_step": 179780, "epoch": 2166} {"train_loss": -23.42218589782715, "global_step": 179781, "epoch": 2166} {"train_loss": -23.266454696655273, "global_step": 179782, "epoch": 2166} {"train_loss": -23.668333053588867, "global_step": 179783, "epoch": 2166} {"train_loss": -23.77204704284668, "global_step": 179784, "epoch": 2166} {"train_loss": -23.781766891479492, "global_step": 179785, "epoch": 2166} {"train_loss": -23.404733657836914, "global_step": 179786, "epoch": 2166} {"train_loss": -23.358108520507812, "global_step": 179787, "epoch": 2166} {"train_loss": -23.322053909301758, "global_step": 179788, "epoch": 2166} {"train_loss": -23.75662612915039, "global_step": 179789, "epoch": 2166} {"train_loss": -23.732587814331055, "global_step": 179790, "epoch": 2166} {"train_loss": -23.872678756713867, "global_step": 179791, "epoch": 2166} {"train_loss": -23.61785888671875, "global_step": 179792, "epoch": 2166} {"train_loss": -24.245641708374023, "global_step": 179793, "epoch": 2166} {"train_loss": -23.81135368347168, "global_step": 179794, "epoch": 2166} {"train_loss": -23.455533981323242, "global_step": 179795, "epoch": 2166} {"train_loss": -23.867189407348633, "global_step": 179796, "epoch": 2166} {"train_loss": -24.18302345275879, "global_step": 179797, "epoch": 2166} {"train_loss": -23.82218360900879, "global_step": 179798, "epoch": 2166} {"train_loss": -23.95491600036621, "global_step": 179799, "epoch": 2166} {"train_loss": -23.682252883911133, "global_step": 179800, "epoch": 2166} {"train_loss": -24.127765655517578, "global_step": 179801, "epoch": 2166} {"train_loss": -23.85471534729004, "global_step": 179802, "epoch": 2166} {"train_loss": -24.161975860595703, "global_step": 179803, "epoch": 2166} {"train_loss": -23.754440307617188, "global_step": 179804, "epoch": 2166} {"train_loss": -23.95392417907715, "global_step": 179805, "epoch": 2166} {"train_loss": -23.921411514282227, "global_step": 179806, "epoch": 2166} {"train_loss": -23.92792510986328, "global_step": 179807, "epoch": 2166} {"train_loss": -23.89626121520996, "global_step": 179808, "epoch": 2166} {"train_loss": -23.796695709228516, "global_step": 179809, "epoch": 2166} {"train_loss": -24.044469833374023, "global_step": 179810, "epoch": 2166} {"train_loss": -23.80525016784668, "global_step": 179811, "epoch": 2166} {"train_loss": -24.102994918823242, "global_step": 179812, "epoch": 2166} {"train_loss": -23.95765495300293, "global_step": 179813, "epoch": 2166} {"train_loss": -23.80268669128418, "global_step": 179814, "epoch": 2166} {"train_loss": -23.80122184753418, "global_step": 179815, "epoch": 2166} {"train_loss": -23.79017448425293, "global_step": 179816, "epoch": 2166} {"train_loss": -23.85161781311035, "global_step": 179817, "epoch": 2166} {"train_loss": -23.937898635864258, "global_step": 179818, "epoch": 2166} {"train_loss": -23.802936553955078, "global_step": 179819, "epoch": 2166} {"train_loss": -23.675552368164062, "global_step": 179820, "epoch": 2166} {"train_loss": -23.936569213867188, "global_step": 179821, "epoch": 2166} {"train_loss": -23.816946029663086, "global_step": 179822, "epoch": 2166} {"train_loss": -24.026203155517578, "global_step": 179823, "epoch": 2166} {"train_loss": -24.064687728881836, "global_step": 179824, "epoch": 2166} {"train_loss": -23.671289443969727, "global_step": 179825, "epoch": 2166} {"train_loss": -23.62040138244629, "global_step": 179826, "epoch": 2166} {"train_loss": -23.62233543395996, "global_step": 179827, "epoch": 2166} {"train_loss": -23.999662399291992, "global_step": 179828, "epoch": 2166} {"train_loss": -24.201929092407227, "global_step": 179829, "epoch": 2166} {"train_loss": -24.20277976989746, "global_step": 179830, "epoch": 2166} {"train_loss": -23.71571922302246, "global_step": 179831, "epoch": 2166} {"train_loss": -23.844284057617188, "global_step": 179832, "epoch": 2166} {"train_loss": -23.73249626159668, "global_step": 179833, "epoch": 2166} {"train_loss": -23.721755981445312, "global_step": 179834, "epoch": 2166} {"train_loss": -24.164579391479492, "global_step": 179835, "epoch": 2166} {"train_loss": -24.30110740661621, "global_step": 179836, "epoch": 2166} {"train_loss": -24.25200843811035, "global_step": 179837, "epoch": 2166} {"train_loss": -24.011472702026367, "global_step": 179838, "epoch": 2166} {"train_loss": -24.04167938232422, "global_step": 179839, "epoch": 2166} {"train_loss": -24.367725372314453, "global_step": 179840, "epoch": 2166} {"train_loss": -23.58797264099121, "global_step": 179841, "epoch": 2166} {"train_loss": -24.148954391479492, "global_step": 179842, "epoch": 2166} {"train_loss": -23.727092742919922, "global_step": 179843, "epoch": 2166} {"train_loss": -23.527151107788086, "global_step": 179844, "epoch": 2166} {"train_loss": -23.332246780395508, "global_step": 179845, "epoch": 2166} {"train_loss": -23.53412437438965, "global_step": 179846, "epoch": 2166} {"train_loss": -23.144397735595703, "global_step": 179847, "epoch": 2166} {"train_loss": -23.49444580078125, "global_step": 179848, "epoch": 2166} {"train_loss": -24.045129776000977, "global_step": 179849, "epoch": 2166} {"train_loss": -23.455041885375977, "global_step": 179850, "epoch": 2166} {"train_loss": -23.232736587524414, "global_step": 179851, "epoch": 2166} {"train_loss": -23.925451278686523, "global_step": 179852, "epoch": 2166} {"train_loss": -23.462862014770508, "global_step": 179853, "epoch": 2166} {"train_loss": -23.724411010742188, "global_step": 179854, "epoch": 2166} {"train_loss": -23.56276512145996, "global_step": 179855, "epoch": 2166} {"train_loss": -23.73343276977539, "global_step": 179856, "epoch": 2166} {"train_loss": -23.90253257751465, "global_step": 179857, "epoch": 2166} {"train_loss": -23.968305587768555, "global_step": 179858, "epoch": 2166} {"train_loss": -23.519529342651367, "global_step": 179859, "epoch": 2166} {"train_loss": -23.78562253929046, "global_step": 179860, "epoch": 2166, "val_loss": 6417983.0} {"train_loss": -23.24417495727539, "global_step": 179861, "epoch": 2167} {"train_loss": -23.2352352142334, "global_step": 179862, "epoch": 2167} {"train_loss": -23.300689697265625, "global_step": 179863, "epoch": 2167} {"train_loss": -22.960464477539062, "global_step": 179864, "epoch": 2167} {"train_loss": -23.69007682800293, "global_step": 179865, "epoch": 2167} {"train_loss": -23.27153205871582, "global_step": 179866, "epoch": 2167} {"train_loss": -23.23299789428711, "global_step": 179867, "epoch": 2167} {"train_loss": -23.67325782775879, "global_step": 179868, "epoch": 2167} {"train_loss": -23.345335006713867, "global_step": 179869, "epoch": 2167} {"train_loss": -23.34003448486328, "global_step": 179870, "epoch": 2167} {"train_loss": -23.368112564086914, "global_step": 179871, "epoch": 2167} {"train_loss": -23.483800888061523, "global_step": 179872, "epoch": 2167} {"train_loss": -23.303428649902344, "global_step": 179873, "epoch": 2167} {"train_loss": -23.481901168823242, "global_step": 179874, "epoch": 2167} {"train_loss": -23.56483268737793, "global_step": 179875, "epoch": 2167} {"train_loss": -23.224592208862305, "global_step": 179876, "epoch": 2167} {"train_loss": -23.542612075805664, "global_step": 179877, "epoch": 2167} {"train_loss": -23.558135986328125, "global_step": 179878, "epoch": 2167} {"train_loss": -23.710691452026367, "global_step": 179879, "epoch": 2167} {"train_loss": -23.91023063659668, "global_step": 179880, "epoch": 2167} {"train_loss": -23.648847579956055, "global_step": 179881, "epoch": 2167} {"train_loss": -23.69635772705078, "global_step": 179882, "epoch": 2167} {"train_loss": -23.123123168945312, "global_step": 179883, "epoch": 2167} {"train_loss": -23.513383865356445, "global_step": 179884, "epoch": 2167} {"train_loss": -23.80559539794922, "global_step": 179885, "epoch": 2167} {"train_loss": -23.568069458007812, "global_step": 179886, "epoch": 2167} {"train_loss": -23.706693649291992, "global_step": 179887, "epoch": 2167} {"train_loss": -23.693574905395508, "global_step": 179888, "epoch": 2167} {"train_loss": -23.831192016601562, "global_step": 179889, "epoch": 2167} {"train_loss": -23.80093765258789, "global_step": 179890, "epoch": 2167} {"train_loss": -23.844741821289062, "global_step": 179891, "epoch": 2167} {"train_loss": -23.744029998779297, "global_step": 179892, "epoch": 2167} {"train_loss": -23.93299674987793, "global_step": 179893, "epoch": 2167} {"train_loss": -23.95726203918457, "global_step": 179894, "epoch": 2167} {"train_loss": -24.08672523498535, "global_step": 179895, "epoch": 2167} {"train_loss": -23.89080238342285, "global_step": 179896, "epoch": 2167} {"train_loss": -23.923995971679688, "global_step": 179897, "epoch": 2167} {"train_loss": -23.86796760559082, "global_step": 179898, "epoch": 2167} {"train_loss": -23.692052841186523, "global_step": 179899, "epoch": 2167} {"train_loss": -23.808795928955078, "global_step": 179900, "epoch": 2167} {"train_loss": -23.864994049072266, "global_step": 179901, "epoch": 2167} {"train_loss": -23.716175079345703, "global_step": 179902, "epoch": 2167} {"train_loss": -24.06072425842285, "global_step": 179903, "epoch": 2167} {"train_loss": -24.06406021118164, "global_step": 179904, "epoch": 2167} {"train_loss": -24.01333999633789, "global_step": 179905, "epoch": 2167} {"train_loss": -24.293752670288086, "global_step": 179906, "epoch": 2167} {"train_loss": -24.152603149414062, "global_step": 179907, "epoch": 2167} {"train_loss": -23.96109390258789, "global_step": 179908, "epoch": 2167} {"train_loss": -24.247777938842773, "global_step": 179909, "epoch": 2167} {"train_loss": -23.70857810974121, "global_step": 179910, "epoch": 2167} {"train_loss": -24.19660758972168, "global_step": 179911, "epoch": 2167} {"train_loss": -23.938940048217773, "global_step": 179912, "epoch": 2167} {"train_loss": -23.768709182739258, "global_step": 179913, "epoch": 2167} {"train_loss": -23.8301944732666, "global_step": 179914, "epoch": 2167} {"train_loss": -23.99989128112793, "global_step": 179915, "epoch": 2167} {"train_loss": -23.888263702392578, "global_step": 179916, "epoch": 2167} {"train_loss": -23.86683464050293, "global_step": 179917, "epoch": 2167} {"train_loss": -24.153549194335938, "global_step": 179918, "epoch": 2167} {"train_loss": -23.759756088256836, "global_step": 179919, "epoch": 2167} {"train_loss": -24.008649826049805, "global_step": 179920, "epoch": 2167} {"train_loss": -23.908435821533203, "global_step": 179921, "epoch": 2167} {"train_loss": -24.017053604125977, "global_step": 179922, "epoch": 2167} {"train_loss": -23.858591079711914, "global_step": 179923, "epoch": 2167} {"train_loss": -23.794462203979492, "global_step": 179924, "epoch": 2167} {"train_loss": -23.53980827331543, "global_step": 179925, "epoch": 2167} {"train_loss": -23.854856491088867, "global_step": 179926, "epoch": 2167} {"train_loss": -23.693622589111328, "global_step": 179927, "epoch": 2167} {"train_loss": -24.073017120361328, "global_step": 179928, "epoch": 2167} {"train_loss": -23.798494338989258, "global_step": 179929, "epoch": 2167} {"train_loss": -23.83832550048828, "global_step": 179930, "epoch": 2167} {"train_loss": -24.17823600769043, "global_step": 179931, "epoch": 2167} {"train_loss": -23.633726119995117, "global_step": 179932, "epoch": 2167} {"train_loss": -23.92837905883789, "global_step": 179933, "epoch": 2167} {"train_loss": -23.991430282592773, "global_step": 179934, "epoch": 2167} {"train_loss": -24.030139923095703, "global_step": 179935, "epoch": 2167} {"train_loss": -23.957670211791992, "global_step": 179936, "epoch": 2167} {"train_loss": -23.98598289489746, "global_step": 179937, "epoch": 2167} {"train_loss": -23.877817153930664, "global_step": 179938, "epoch": 2167} {"train_loss": -23.572830200195312, "global_step": 179939, "epoch": 2167} {"train_loss": -23.903980255126953, "global_step": 179940, "epoch": 2167} {"train_loss": -23.859905242919922, "global_step": 179941, "epoch": 2167} {"train_loss": -23.8259334564209, "global_step": 179942, "epoch": 2167} {"train_loss": -23.75269444017525, "global_step": 179943, "epoch": 2167, "val_loss": 6459297.5} {"train_loss": -23.59718894958496, "global_step": 179944, "epoch": 2168} {"train_loss": -23.493932723999023, "global_step": 179945, "epoch": 2168} {"train_loss": -23.276168823242188, "global_step": 179946, "epoch": 2168} {"train_loss": -23.643566131591797, "global_step": 179947, "epoch": 2168} {"train_loss": -23.6523494720459, "global_step": 179948, "epoch": 2168} {"train_loss": -23.55848503112793, "global_step": 179949, "epoch": 2168} {"train_loss": -23.279447555541992, "global_step": 179950, "epoch": 2168} {"train_loss": -23.54884910583496, "global_step": 179951, "epoch": 2168} {"train_loss": -23.269155502319336, "global_step": 179952, "epoch": 2168} {"train_loss": -23.768844604492188, "global_step": 179953, "epoch": 2168} {"train_loss": -23.62698745727539, "global_step": 179954, "epoch": 2168} {"train_loss": -23.27808952331543, "global_step": 179955, "epoch": 2168} {"train_loss": -23.2680721282959, "global_step": 179956, "epoch": 2168} {"train_loss": -23.71296501159668, "global_step": 179957, "epoch": 2168} {"train_loss": -23.730016708374023, "global_step": 179958, "epoch": 2168} {"train_loss": -23.807636260986328, "global_step": 179959, "epoch": 2168} {"train_loss": -23.53928565979004, "global_step": 179960, "epoch": 2168} {"train_loss": -23.18796730041504, "global_step": 179961, "epoch": 2168} {"train_loss": -23.244035720825195, "global_step": 179962, "epoch": 2168} {"train_loss": -23.357879638671875, "global_step": 179963, "epoch": 2168} {"train_loss": -23.31675148010254, "global_step": 179964, "epoch": 2168} {"train_loss": -23.652820587158203, "global_step": 179965, "epoch": 2168} {"train_loss": -23.830739974975586, "global_step": 179966, "epoch": 2168} {"train_loss": -23.74431800842285, "global_step": 179967, "epoch": 2168} {"train_loss": -23.681608200073242, "global_step": 179968, "epoch": 2168} {"train_loss": -23.429840087890625, "global_step": 179969, "epoch": 2168} {"train_loss": -23.601957321166992, "global_step": 179970, "epoch": 2168} {"train_loss": -24.027143478393555, "global_step": 179971, "epoch": 2168} {"train_loss": -23.481718063354492, "global_step": 179972, "epoch": 2168} {"train_loss": -23.811859130859375, "global_step": 179973, "epoch": 2168} {"train_loss": -24.043119430541992, "global_step": 179974, "epoch": 2168} {"train_loss": -23.743986129760742, "global_step": 179975, "epoch": 2168} {"train_loss": -23.906423568725586, "global_step": 179976, "epoch": 2168} {"train_loss": -24.044742584228516, "global_step": 179977, "epoch": 2168} {"train_loss": -23.83045196533203, "global_step": 179978, "epoch": 2168} {"train_loss": -23.735380172729492, "global_step": 179979, "epoch": 2168} {"train_loss": -24.08349609375, "global_step": 179980, "epoch": 2168} {"train_loss": -23.939245223999023, "global_step": 179981, "epoch": 2168} {"train_loss": -23.7249698638916, "global_step": 179982, "epoch": 2168} {"train_loss": -23.975250244140625, "global_step": 179983, "epoch": 2168} {"train_loss": -24.498273849487305, "global_step": 179984, "epoch": 2168} {"train_loss": -23.915693283081055, "global_step": 179985, "epoch": 2168} {"train_loss": -23.80390739440918, "global_step": 179986, "epoch": 2168} {"train_loss": -23.798826217651367, "global_step": 179987, "epoch": 2168} {"train_loss": -23.98749542236328, "global_step": 179988, "epoch": 2168} {"train_loss": -23.93286895751953, "global_step": 179989, "epoch": 2168} {"train_loss": -24.02688980102539, "global_step": 179990, "epoch": 2168} {"train_loss": -24.049375534057617, "global_step": 179991, "epoch": 2168} {"train_loss": -23.851293563842773, "global_step": 179992, "epoch": 2168} {"train_loss": -24.126768112182617, "global_step": 179993, "epoch": 2168} {"train_loss": -23.908645629882812, "global_step": 179994, "epoch": 2168} {"train_loss": -23.882667541503906, "global_step": 179995, "epoch": 2168} {"train_loss": -24.261030197143555, "global_step": 179996, "epoch": 2168} {"train_loss": -24.122976303100586, "global_step": 179997, "epoch": 2168} {"train_loss": -23.82591438293457, "global_step": 179998, "epoch": 2168} {"train_loss": -23.886310577392578, "global_step": 179999, "epoch": 2168} {"train_loss": -23.554065704345703, "global_step": 180000, "epoch": 2168} {"train_loss": -24.118322372436523, "global_step": 180001, "epoch": 2168} {"train_loss": -23.751108169555664, "global_step": 180002, "epoch": 2168} {"train_loss": -24.178295135498047, "global_step": 180003, "epoch": 2168} {"train_loss": -23.888641357421875, "global_step": 180004, "epoch": 2168} {"train_loss": -23.846973419189453, "global_step": 180005, "epoch": 2168} {"train_loss": -23.984731674194336, "global_step": 180006, "epoch": 2168} {"train_loss": -23.95538330078125, "global_step": 180007, "epoch": 2168} {"train_loss": -24.171110153198242, "global_step": 180008, "epoch": 2168} {"train_loss": -24.27274513244629, "global_step": 180009, "epoch": 2168} {"train_loss": -23.636661529541016, "global_step": 180010, "epoch": 2168} {"train_loss": -24.122486114501953, "global_step": 180011, "epoch": 2168} {"train_loss": -24.005163192749023, "global_step": 180012, "epoch": 2168} {"train_loss": -24.058897018432617, "global_step": 180013, "epoch": 2168} {"train_loss": -23.986757278442383, "global_step": 180014, "epoch": 2168} {"train_loss": -24.014841079711914, "global_step": 180015, "epoch": 2168} {"train_loss": -24.206588745117188, "global_step": 180016, "epoch": 2168} {"train_loss": -23.85898208618164, "global_step": 180017, "epoch": 2168} {"train_loss": -24.073041915893555, "global_step": 180018, "epoch": 2168} {"train_loss": -23.37010955810547, "global_step": 180019, "epoch": 2168} {"train_loss": -23.985523223876953, "global_step": 180020, "epoch": 2168} {"train_loss": -23.390249252319336, "global_step": 180021, "epoch": 2168} {"train_loss": -23.280195236206055, "global_step": 180022, "epoch": 2168} {"train_loss": -22.96766471862793, "global_step": 180023, "epoch": 2168} {"train_loss": -23.53628158569336, "global_step": 180024, "epoch": 2168} {"train_loss": -24.165760040283203, "global_step": 180025, "epoch": 2168} {"train_loss": -23.78352227268449, "global_step": 180026, "epoch": 2168, "val_loss": 6360090.0} {"train_loss": -23.49568748474121, "global_step": 180027, "epoch": 2169} {"train_loss": -23.372987747192383, "global_step": 180028, "epoch": 2169} {"train_loss": -23.053163528442383, "global_step": 180029, "epoch": 2169} {"train_loss": -23.163049697875977, "global_step": 180030, "epoch": 2169} {"train_loss": -23.24330711364746, "global_step": 180031, "epoch": 2169} {"train_loss": -23.449295043945312, "global_step": 180032, "epoch": 2169} {"train_loss": -23.531503677368164, "global_step": 180033, "epoch": 2169} {"train_loss": -23.475183486938477, "global_step": 180034, "epoch": 2169} {"train_loss": -23.434940338134766, "global_step": 180035, "epoch": 2169} {"train_loss": -22.839344024658203, "global_step": 180036, "epoch": 2169} {"train_loss": -23.263046264648438, "global_step": 180037, "epoch": 2169} {"train_loss": -23.395370483398438, "global_step": 180038, "epoch": 2169} {"train_loss": -23.471359252929688, "global_step": 180039, "epoch": 2169} {"train_loss": -23.475675582885742, "global_step": 180040, "epoch": 2169} {"train_loss": -23.28733253479004, "global_step": 180041, "epoch": 2169} {"train_loss": -23.577285766601562, "global_step": 180042, "epoch": 2169} {"train_loss": -23.472938537597656, "global_step": 180043, "epoch": 2169} {"train_loss": -23.54888343811035, "global_step": 180044, "epoch": 2169} {"train_loss": -23.852632522583008, "global_step": 180045, "epoch": 2169} {"train_loss": -23.76375389099121, "global_step": 180046, "epoch": 2169} {"train_loss": -23.83455467224121, "global_step": 180047, "epoch": 2169} {"train_loss": -23.36109733581543, "global_step": 180048, "epoch": 2169} {"train_loss": -23.726224899291992, "global_step": 180049, "epoch": 2169} {"train_loss": -23.85784149169922, "global_step": 180050, "epoch": 2169} {"train_loss": -23.67865753173828, "global_step": 180051, "epoch": 2169} {"train_loss": -23.772626876831055, "global_step": 180052, "epoch": 2169} {"train_loss": -24.092451095581055, "global_step": 180053, "epoch": 2169} {"train_loss": -24.10414695739746, "global_step": 180054, "epoch": 2169} {"train_loss": -23.940109252929688, "global_step": 180055, "epoch": 2169} {"train_loss": -23.983627319335938, "global_step": 180056, "epoch": 2169} {"train_loss": -23.567609786987305, "global_step": 180057, "epoch": 2169} {"train_loss": -23.958576202392578, "global_step": 180058, "epoch": 2169} {"train_loss": -23.462766647338867, "global_step": 180059, "epoch": 2169} {"train_loss": -23.855188369750977, "global_step": 180060, "epoch": 2169} {"train_loss": -23.888669967651367, "global_step": 180061, "epoch": 2169} {"train_loss": -24.113264083862305, "global_step": 180062, "epoch": 2169} {"train_loss": -23.511737823486328, "global_step": 180063, "epoch": 2169} {"train_loss": -23.98788833618164, "global_step": 180064, "epoch": 2169} {"train_loss": -24.21010398864746, "global_step": 180065, "epoch": 2169} {"train_loss": -23.67980194091797, "global_step": 180066, "epoch": 2169} {"train_loss": -23.534860610961914, "global_step": 180067, "epoch": 2169} {"train_loss": -23.65915298461914, "global_step": 180068, "epoch": 2169} {"train_loss": -24.055660247802734, "global_step": 180069, "epoch": 2169} {"train_loss": -23.798938751220703, "global_step": 180070, "epoch": 2169} {"train_loss": -24.189138412475586, "global_step": 180071, "epoch": 2169} {"train_loss": -23.824907302856445, "global_step": 180072, "epoch": 2169} {"train_loss": -24.00375747680664, "global_step": 180073, "epoch": 2169} {"train_loss": -24.03985023498535, "global_step": 180074, "epoch": 2169} {"train_loss": -23.740541458129883, "global_step": 180075, "epoch": 2169} {"train_loss": -23.76905632019043, "global_step": 180076, "epoch": 2169} {"train_loss": -24.068593978881836, "global_step": 180077, "epoch": 2169} {"train_loss": -23.87429428100586, "global_step": 180078, "epoch": 2169} {"train_loss": -24.016712188720703, "global_step": 180079, "epoch": 2169} {"train_loss": -23.857057571411133, "global_step": 180080, "epoch": 2169} {"train_loss": -24.24139976501465, "global_step": 180081, "epoch": 2169} {"train_loss": -24.089155197143555, "global_step": 180082, "epoch": 2169} {"train_loss": -24.42603302001953, "global_step": 180083, "epoch": 2169} {"train_loss": -23.9997615814209, "global_step": 180084, "epoch": 2169} {"train_loss": -24.054031372070312, "global_step": 180085, "epoch": 2169} {"train_loss": -24.246826171875, "global_step": 180086, "epoch": 2169} {"train_loss": -23.884700775146484, "global_step": 180087, "epoch": 2169} {"train_loss": -24.15474510192871, "global_step": 180088, "epoch": 2169} {"train_loss": -24.579084396362305, "global_step": 180089, "epoch": 2169} {"train_loss": -23.961990356445312, "global_step": 180090, "epoch": 2169} {"train_loss": -24.188047409057617, "global_step": 180091, "epoch": 2169} {"train_loss": -24.22739028930664, "global_step": 180092, "epoch": 2169} {"train_loss": -24.009611129760742, "global_step": 180093, "epoch": 2169} {"train_loss": -24.122112274169922, "global_step": 180094, "epoch": 2169} {"train_loss": -23.954599380493164, "global_step": 180095, "epoch": 2169} {"train_loss": -23.94927978515625, "global_step": 180096, "epoch": 2169} {"train_loss": -24.201284408569336, "global_step": 180097, "epoch": 2169} {"train_loss": -24.06562042236328, "global_step": 180098, "epoch": 2169} {"train_loss": -24.074743270874023, "global_step": 180099, "epoch": 2169} {"train_loss": -23.798755645751953, "global_step": 180100, "epoch": 2169} {"train_loss": -23.84283447265625, "global_step": 180101, "epoch": 2169} {"train_loss": -23.982511520385742, "global_step": 180102, "epoch": 2169} {"train_loss": -24.083284378051758, "global_step": 180103, "epoch": 2169} {"train_loss": -23.72064781188965, "global_step": 180104, "epoch": 2169} {"train_loss": -23.89411735534668, "global_step": 180105, "epoch": 2169} {"train_loss": -23.794736862182617, "global_step": 180106, "epoch": 2169} {"train_loss": -24.06903076171875, "global_step": 180107, "epoch": 2169} {"train_loss": -23.94911766052246, "global_step": 180108, "epoch": 2169} {"train_loss": -23.811863726880176, "global_step": 180109, "epoch": 2169, "val_loss": 6391415.0} {"train_loss": -22.876623153686523, "global_step": 180110, "epoch": 2170} {"train_loss": -23.142791748046875, "global_step": 180111, "epoch": 2170} {"train_loss": -23.611408233642578, "global_step": 180112, "epoch": 2170} {"train_loss": -23.4840087890625, "global_step": 180113, "epoch": 2170} {"train_loss": -23.2790584564209, "global_step": 180114, "epoch": 2170} {"train_loss": -23.605941772460938, "global_step": 180115, "epoch": 2170} {"train_loss": -23.41828727722168, "global_step": 180116, "epoch": 2170} {"train_loss": -23.649169921875, "global_step": 180117, "epoch": 2170} {"train_loss": -23.7620906829834, "global_step": 180118, "epoch": 2170} {"train_loss": -23.707815170288086, "global_step": 180119, "epoch": 2170} {"train_loss": -23.654701232910156, "global_step": 180120, "epoch": 2170} {"train_loss": -23.75135612487793, "global_step": 180121, "epoch": 2170} {"train_loss": -23.665691375732422, "global_step": 180122, "epoch": 2170} {"train_loss": -23.69805908203125, "global_step": 180123, "epoch": 2170} {"train_loss": -23.87964630126953, "global_step": 180124, "epoch": 2170} {"train_loss": -23.926490783691406, "global_step": 180125, "epoch": 2170} {"train_loss": -23.763174057006836, "global_step": 180126, "epoch": 2170} {"train_loss": -23.546751022338867, "global_step": 180127, "epoch": 2170} {"train_loss": -24.058551788330078, "global_step": 180128, "epoch": 2170} {"train_loss": -23.741437911987305, "global_step": 180129, "epoch": 2170} {"train_loss": -23.787429809570312, "global_step": 180130, "epoch": 2170} {"train_loss": -23.97186851501465, "global_step": 180131, "epoch": 2170} {"train_loss": -23.72813606262207, "global_step": 180132, "epoch": 2170} {"train_loss": -23.522159576416016, "global_step": 180133, "epoch": 2170} {"train_loss": -23.961973190307617, "global_step": 180134, "epoch": 2170} {"train_loss": -23.960037231445312, "global_step": 180135, "epoch": 2170} {"train_loss": -23.98151206970215, "global_step": 180136, "epoch": 2170} {"train_loss": -23.93989372253418, "global_step": 180137, "epoch": 2170} {"train_loss": -23.751611709594727, "global_step": 180138, "epoch": 2170} {"train_loss": -23.65653419494629, "global_step": 180139, "epoch": 2170} {"train_loss": -24.006444931030273, "global_step": 180140, "epoch": 2170} {"train_loss": -23.963022232055664, "global_step": 180141, "epoch": 2170} {"train_loss": -24.169729232788086, "global_step": 180142, "epoch": 2170} {"train_loss": -24.12125015258789, "global_step": 180143, "epoch": 2170} {"train_loss": -24.159473419189453, "global_step": 180144, "epoch": 2170} {"train_loss": -24.176252365112305, "global_step": 180145, "epoch": 2170} {"train_loss": -24.009349822998047, "global_step": 180146, "epoch": 2170} {"train_loss": -23.94548988342285, "global_step": 180147, "epoch": 2170} {"train_loss": -23.820819854736328, "global_step": 180148, "epoch": 2170} {"train_loss": -24.03761100769043, "global_step": 180149, "epoch": 2170} {"train_loss": -23.8642635345459, "global_step": 180150, "epoch": 2170} {"train_loss": -23.78784942626953, "global_step": 180151, "epoch": 2170} {"train_loss": -23.78700065612793, "global_step": 180152, "epoch": 2170} {"train_loss": -24.07792091369629, "global_step": 180153, "epoch": 2170} {"train_loss": -24.093669891357422, "global_step": 180154, "epoch": 2170} {"train_loss": -24.15384292602539, "global_step": 180155, "epoch": 2170} {"train_loss": -23.97098731994629, "global_step": 180156, "epoch": 2170} {"train_loss": -24.383495330810547, "global_step": 180157, "epoch": 2170} {"train_loss": -24.02992820739746, "global_step": 180158, "epoch": 2170} {"train_loss": -24.127416610717773, "global_step": 180159, "epoch": 2170} {"train_loss": -23.963045120239258, "global_step": 180160, "epoch": 2170} {"train_loss": -23.917051315307617, "global_step": 180161, "epoch": 2170} {"train_loss": -24.025869369506836, "global_step": 180162, "epoch": 2170} {"train_loss": -24.1873779296875, "global_step": 180163, "epoch": 2170} {"train_loss": -23.756582260131836, "global_step": 180164, "epoch": 2170} {"train_loss": -24.084754943847656, "global_step": 180165, "epoch": 2170} {"train_loss": -23.603199005126953, "global_step": 180166, "epoch": 2170} {"train_loss": -24.220186233520508, "global_step": 180167, "epoch": 2170} {"train_loss": -23.877248764038086, "global_step": 180168, "epoch": 2170} {"train_loss": -23.834697723388672, "global_step": 180169, "epoch": 2170} {"train_loss": -23.129383087158203, "global_step": 180170, "epoch": 2170} {"train_loss": -22.782272338867188, "global_step": 180171, "epoch": 2170} {"train_loss": -23.664159774780273, "global_step": 180172, "epoch": 2170} {"train_loss": -23.840621948242188, "global_step": 180173, "epoch": 2170} {"train_loss": -23.06998062133789, "global_step": 180174, "epoch": 2170} {"train_loss": -23.753799438476562, "global_step": 180175, "epoch": 2170} {"train_loss": -23.64350700378418, "global_step": 180176, "epoch": 2170} {"train_loss": -23.937475204467773, "global_step": 180177, "epoch": 2170} {"train_loss": -23.52763557434082, "global_step": 180178, "epoch": 2170} {"train_loss": -23.963207244873047, "global_step": 180179, "epoch": 2170} {"train_loss": -23.93543815612793, "global_step": 180180, "epoch": 2170} {"train_loss": -23.265384674072266, "global_step": 180181, "epoch": 2170} {"train_loss": -23.657316207885742, "global_step": 180182, "epoch": 2170} {"train_loss": -24.096466064453125, "global_step": 180183, "epoch": 2170} {"train_loss": -23.77816390991211, "global_step": 180184, "epoch": 2170} {"train_loss": -23.887863159179688, "global_step": 180185, "epoch": 2170} {"train_loss": -23.60540199279785, "global_step": 180186, "epoch": 2170} {"train_loss": -23.752410888671875, "global_step": 180187, "epoch": 2170} {"train_loss": -23.321813583374023, "global_step": 180188, "epoch": 2170} {"train_loss": -23.977766036987305, "global_step": 180189, "epoch": 2170} {"train_loss": -23.817214965820312, "global_step": 180190, "epoch": 2170} {"train_loss": -23.792606353759766, "global_step": 180191, "epoch": 2170} {"train_loss": -23.798090164919934, "global_step": 180192, "epoch": 2170, "val_loss": 6525421.0} {"train_loss": -23.41924476623535, "global_step": 180193, "epoch": 2171} {"train_loss": -23.987035751342773, "global_step": 180194, "epoch": 2171} {"train_loss": -23.518781661987305, "global_step": 180195, "epoch": 2171} {"train_loss": -23.538827896118164, "global_step": 180196, "epoch": 2171} {"train_loss": -23.728681564331055, "global_step": 180197, "epoch": 2171} {"train_loss": -23.422210693359375, "global_step": 180198, "epoch": 2171} {"train_loss": -23.842655181884766, "global_step": 180199, "epoch": 2171} {"train_loss": -23.950620651245117, "global_step": 180200, "epoch": 2171} {"train_loss": -23.892393112182617, "global_step": 180201, "epoch": 2171} {"train_loss": -23.510879516601562, "global_step": 180202, "epoch": 2171} {"train_loss": -23.727401733398438, "global_step": 180203, "epoch": 2171} {"train_loss": -23.624513626098633, "global_step": 180204, "epoch": 2171} {"train_loss": -23.90056800842285, "global_step": 180205, "epoch": 2171} {"train_loss": -23.658132553100586, "global_step": 180206, "epoch": 2171} {"train_loss": -23.66411018371582, "global_step": 180207, "epoch": 2171} {"train_loss": -24.117895126342773, "global_step": 180208, "epoch": 2171} {"train_loss": -23.92341423034668, "global_step": 180209, "epoch": 2171} {"train_loss": -24.089523315429688, "global_step": 180210, "epoch": 2171} {"train_loss": -24.282169342041016, "global_step": 180211, "epoch": 2171} {"train_loss": -23.83096694946289, "global_step": 180212, "epoch": 2171} {"train_loss": -23.788721084594727, "global_step": 180213, "epoch": 2171} {"train_loss": -23.846561431884766, "global_step": 180214, "epoch": 2171} {"train_loss": -24.041532516479492, "global_step": 180215, "epoch": 2171} {"train_loss": -23.893911361694336, "global_step": 180216, "epoch": 2171} {"train_loss": -24.054922103881836, "global_step": 180217, "epoch": 2171} {"train_loss": -24.078006744384766, "global_step": 180218, "epoch": 2171} {"train_loss": -24.177595138549805, "global_step": 180219, "epoch": 2171} {"train_loss": -24.082462310791016, "global_step": 180220, "epoch": 2171} {"train_loss": -23.57041358947754, "global_step": 180221, "epoch": 2171} {"train_loss": -23.731252670288086, "global_step": 180222, "epoch": 2171} {"train_loss": -24.11785125732422, "global_step": 180223, "epoch": 2171} {"train_loss": -23.87098503112793, "global_step": 180224, "epoch": 2171} {"train_loss": -24.19308853149414, "global_step": 180225, "epoch": 2171} {"train_loss": -24.185453414916992, "global_step": 180226, "epoch": 2171} {"train_loss": -24.05759048461914, "global_step": 180227, "epoch": 2171} {"train_loss": -23.704557418823242, "global_step": 180228, "epoch": 2171} {"train_loss": -23.891395568847656, "global_step": 180229, "epoch": 2171} {"train_loss": -24.112411499023438, "global_step": 180230, "epoch": 2171} {"train_loss": -24.210744857788086, "global_step": 180231, "epoch": 2171} {"train_loss": -23.950769424438477, "global_step": 180232, "epoch": 2171} {"train_loss": -23.78656005859375, "global_step": 180233, "epoch": 2171} {"train_loss": -23.82392692565918, "global_step": 180234, "epoch": 2171} {"train_loss": -24.013931274414062, "global_step": 180235, "epoch": 2171} {"train_loss": -23.860387802124023, "global_step": 180236, "epoch": 2171} {"train_loss": -24.262462615966797, "global_step": 180237, "epoch": 2171} {"train_loss": -24.04150390625, "global_step": 180238, "epoch": 2171} {"train_loss": -23.915868759155273, "global_step": 180239, "epoch": 2171} {"train_loss": -24.069761276245117, "global_step": 180240, "epoch": 2171} {"train_loss": -24.378480911254883, "global_step": 180241, "epoch": 2171} {"train_loss": -23.525604248046875, "global_step": 180242, "epoch": 2171} {"train_loss": -23.86012840270996, "global_step": 180243, "epoch": 2171} {"train_loss": -23.780147552490234, "global_step": 180244, "epoch": 2171} {"train_loss": -23.629087448120117, "global_step": 180245, "epoch": 2171} {"train_loss": -23.734146118164062, "global_step": 180246, "epoch": 2171} {"train_loss": -24.168624877929688, "global_step": 180247, "epoch": 2171} {"train_loss": -23.816308975219727, "global_step": 180248, "epoch": 2171} {"train_loss": -23.78737449645996, "global_step": 180249, "epoch": 2171} {"train_loss": -23.958662033081055, "global_step": 180250, "epoch": 2171} {"train_loss": -23.749977111816406, "global_step": 180251, "epoch": 2171} {"train_loss": -24.070711135864258, "global_step": 180252, "epoch": 2171} {"train_loss": -24.511159896850586, "global_step": 180253, "epoch": 2171} {"train_loss": -23.540517807006836, "global_step": 180254, "epoch": 2171} {"train_loss": -23.682233810424805, "global_step": 180255, "epoch": 2171} {"train_loss": -23.652509689331055, "global_step": 180256, "epoch": 2171} {"train_loss": -23.894515991210938, "global_step": 180257, "epoch": 2171} {"train_loss": -24.310789108276367, "global_step": 180258, "epoch": 2171} {"train_loss": -23.944843292236328, "global_step": 180259, "epoch": 2171} {"train_loss": -23.601688385009766, "global_step": 180260, "epoch": 2171} {"train_loss": -24.005788803100586, "global_step": 180261, "epoch": 2171} {"train_loss": -24.12849998474121, "global_step": 180262, "epoch": 2171} {"train_loss": -24.39581298828125, "global_step": 180263, "epoch": 2171} {"train_loss": -24.07765769958496, "global_step": 180264, "epoch": 2171} {"train_loss": -23.842466354370117, "global_step": 180265, "epoch": 2171} {"train_loss": -24.189085006713867, "global_step": 180266, "epoch": 2171} {"train_loss": -23.920852661132812, "global_step": 180267, "epoch": 2171} {"train_loss": -24.19085121154785, "global_step": 180268, "epoch": 2171} {"train_loss": -23.489980697631836, "global_step": 180269, "epoch": 2171} {"train_loss": -23.716787338256836, "global_step": 180270, "epoch": 2171} {"train_loss": -24.127790451049805, "global_step": 180271, "epoch": 2171} {"train_loss": -24.186012268066406, "global_step": 180272, "epoch": 2171} {"train_loss": -23.329465866088867, "global_step": 180273, "epoch": 2171} {"train_loss": -23.32560920715332, "global_step": 180274, "epoch": 2171} {"train_loss": -23.919647952160204, "global_step": 180275, "epoch": 2171, "val_loss": 6430747.5} {"train_loss": -23.083755493164062, "global_step": 180276, "epoch": 2172} {"train_loss": -24.16355323791504, "global_step": 180277, "epoch": 2172} {"train_loss": -23.313451766967773, "global_step": 180278, "epoch": 2172} {"train_loss": -23.683292388916016, "global_step": 180279, "epoch": 2172} {"train_loss": -23.437610626220703, "global_step": 180280, "epoch": 2172} {"train_loss": -24.095884323120117, "global_step": 180281, "epoch": 2172} {"train_loss": -23.71208953857422, "global_step": 180282, "epoch": 2172} {"train_loss": -23.61684226989746, "global_step": 180283, "epoch": 2172} {"train_loss": -23.844358444213867, "global_step": 180284, "epoch": 2172} {"train_loss": -23.680566787719727, "global_step": 180285, "epoch": 2172} {"train_loss": -23.980377197265625, "global_step": 180286, "epoch": 2172} {"train_loss": -24.019567489624023, "global_step": 180287, "epoch": 2172} {"train_loss": -24.375539779663086, "global_step": 180288, "epoch": 2172} {"train_loss": -23.805925369262695, "global_step": 180289, "epoch": 2172} {"train_loss": -23.952085494995117, "global_step": 180290, "epoch": 2172} {"train_loss": -23.534666061401367, "global_step": 180291, "epoch": 2172} {"train_loss": -23.994531631469727, "global_step": 180292, "epoch": 2172} {"train_loss": -23.805194854736328, "global_step": 180293, "epoch": 2172} {"train_loss": -23.910507202148438, "global_step": 180294, "epoch": 2172} {"train_loss": -23.791868209838867, "global_step": 180295, "epoch": 2172} {"train_loss": -24.059171676635742, "global_step": 180296, "epoch": 2172} {"train_loss": -24.09567642211914, "global_step": 180297, "epoch": 2172} {"train_loss": -23.8483943939209, "global_step": 180298, "epoch": 2172} {"train_loss": -24.14609718322754, "global_step": 180299, "epoch": 2172} {"train_loss": -24.30611228942871, "global_step": 180300, "epoch": 2172} {"train_loss": -23.724313735961914, "global_step": 180301, "epoch": 2172} {"train_loss": -23.781940460205078, "global_step": 180302, "epoch": 2172} {"train_loss": -24.102502822875977, "global_step": 180303, "epoch": 2172} {"train_loss": -23.93890380859375, "global_step": 180304, "epoch": 2172} {"train_loss": -23.645248413085938, "global_step": 180305, "epoch": 2172} {"train_loss": -23.740467071533203, "global_step": 180306, "epoch": 2172} {"train_loss": -23.86794090270996, "global_step": 180307, "epoch": 2172} {"train_loss": -23.832143783569336, "global_step": 180308, "epoch": 2172} {"train_loss": -24.04680633544922, "global_step": 180309, "epoch": 2172} {"train_loss": -23.923620223999023, "global_step": 180310, "epoch": 2172} {"train_loss": -23.97735023498535, "global_step": 180311, "epoch": 2172} {"train_loss": -23.66322898864746, "global_step": 180312, "epoch": 2172} {"train_loss": -23.66742515563965, "global_step": 180313, "epoch": 2172} {"train_loss": -23.75827980041504, "global_step": 180314, "epoch": 2172} {"train_loss": -23.76520347595215, "global_step": 180315, "epoch": 2172} {"train_loss": -24.01972198486328, "global_step": 180316, "epoch": 2172} {"train_loss": -23.629779815673828, "global_step": 180317, "epoch": 2172} {"train_loss": -24.06007957458496, "global_step": 180318, "epoch": 2172} {"train_loss": -24.073884963989258, "global_step": 180319, "epoch": 2172} {"train_loss": -24.0201473236084, "global_step": 180320, "epoch": 2172} {"train_loss": -23.82489585876465, "global_step": 180321, "epoch": 2172} {"train_loss": -24.056385040283203, "global_step": 180322, "epoch": 2172} {"train_loss": -23.863101959228516, "global_step": 180323, "epoch": 2172} {"train_loss": -23.996145248413086, "global_step": 180324, "epoch": 2172} {"train_loss": -23.822315216064453, "global_step": 180325, "epoch": 2172} {"train_loss": -23.9856014251709, "global_step": 180326, "epoch": 2172} {"train_loss": -23.813135147094727, "global_step": 180327, "epoch": 2172} {"train_loss": -23.8391170501709, "global_step": 180328, "epoch": 2172} {"train_loss": -24.0519962310791, "global_step": 180329, "epoch": 2172} {"train_loss": -23.962289810180664, "global_step": 180330, "epoch": 2172} {"train_loss": -24.383493423461914, "global_step": 180331, "epoch": 2172} {"train_loss": -23.844636917114258, "global_step": 180332, "epoch": 2172} {"train_loss": -24.12997817993164, "global_step": 180333, "epoch": 2172} {"train_loss": -24.21282196044922, "global_step": 180334, "epoch": 2172} {"train_loss": -23.92928123474121, "global_step": 180335, "epoch": 2172} {"train_loss": -24.233243942260742, "global_step": 180336, "epoch": 2172} {"train_loss": -23.992828369140625, "global_step": 180337, "epoch": 2172} {"train_loss": -23.948410034179688, "global_step": 180338, "epoch": 2172} {"train_loss": -24.037954330444336, "global_step": 180339, "epoch": 2172} {"train_loss": -24.14462661743164, "global_step": 180340, "epoch": 2172} {"train_loss": -23.86458969116211, "global_step": 180341, "epoch": 2172} {"train_loss": -23.708770751953125, "global_step": 180342, "epoch": 2172} {"train_loss": -23.804157257080078, "global_step": 180343, "epoch": 2172} {"train_loss": -23.879474639892578, "global_step": 180344, "epoch": 2172} {"train_loss": -24.388381958007812, "global_step": 180345, "epoch": 2172} {"train_loss": -23.769031524658203, "global_step": 180346, "epoch": 2172} {"train_loss": -23.683805465698242, "global_step": 180347, "epoch": 2172} {"train_loss": -23.97559928894043, "global_step": 180348, "epoch": 2172} {"train_loss": -24.056901931762695, "global_step": 180349, "epoch": 2172} {"train_loss": -23.868619918823242, "global_step": 180350, "epoch": 2172} {"train_loss": -24.193084716796875, "global_step": 180351, "epoch": 2172} {"train_loss": -23.9830322265625, "global_step": 180352, "epoch": 2172} {"train_loss": -24.278949737548828, "global_step": 180353, "epoch": 2172} {"train_loss": -24.1782283782959, "global_step": 180354, "epoch": 2172} {"train_loss": -23.934858322143555, "global_step": 180355, "epoch": 2172} {"train_loss": -23.89757537841797, "global_step": 180356, "epoch": 2172} {"train_loss": -23.87837791442871, "global_step": 180357, "epoch": 2172} {"train_loss": -23.901746566037097, "global_step": 180358, "epoch": 2172, "val_loss": 6479126.0} {"train_loss": -22.589092254638672, "global_step": 180359, "epoch": 2173} {"train_loss": -22.14389419555664, "global_step": 180360, "epoch": 2173} {"train_loss": -22.771116256713867, "global_step": 180361, "epoch": 2173} {"train_loss": -23.01021957397461, "global_step": 180362, "epoch": 2173} {"train_loss": -22.715560913085938, "global_step": 180363, "epoch": 2173} {"train_loss": -23.285476684570312, "global_step": 180364, "epoch": 2173} {"train_loss": -23.59186363220215, "global_step": 180365, "epoch": 2173} {"train_loss": -23.308284759521484, "global_step": 180366, "epoch": 2173} {"train_loss": -23.369564056396484, "global_step": 180367, "epoch": 2173} {"train_loss": -23.649049758911133, "global_step": 180368, "epoch": 2173} {"train_loss": -23.708927154541016, "global_step": 180369, "epoch": 2173} {"train_loss": -23.306995391845703, "global_step": 180370, "epoch": 2173} {"train_loss": -23.457860946655273, "global_step": 180371, "epoch": 2173} {"train_loss": -23.223350524902344, "global_step": 180372, "epoch": 2173} {"train_loss": -23.89277458190918, "global_step": 180373, "epoch": 2173} {"train_loss": -23.51114273071289, "global_step": 180374, "epoch": 2173} {"train_loss": -23.41961669921875, "global_step": 180375, "epoch": 2173} {"train_loss": -23.699907302856445, "global_step": 180376, "epoch": 2173} {"train_loss": -23.410306930541992, "global_step": 180377, "epoch": 2173} {"train_loss": -23.9129581451416, "global_step": 180378, "epoch": 2173} {"train_loss": -23.658567428588867, "global_step": 180379, "epoch": 2173} {"train_loss": -23.528833389282227, "global_step": 180380, "epoch": 2173} {"train_loss": -23.586843490600586, "global_step": 180381, "epoch": 2173} {"train_loss": -23.5529842376709, "global_step": 180382, "epoch": 2173} {"train_loss": -23.42696189880371, "global_step": 180383, "epoch": 2173} {"train_loss": -24.193281173706055, "global_step": 180384, "epoch": 2173} {"train_loss": -23.516244888305664, "global_step": 180385, "epoch": 2173} {"train_loss": -23.677757263183594, "global_step": 180386, "epoch": 2173} {"train_loss": -23.9285888671875, "global_step": 180387, "epoch": 2173} {"train_loss": -24.118457794189453, "global_step": 180388, "epoch": 2173} {"train_loss": -23.832000732421875, "global_step": 180389, "epoch": 2173} {"train_loss": -23.97626304626465, "global_step": 180390, "epoch": 2173} {"train_loss": -24.265918731689453, "global_step": 180391, "epoch": 2173} {"train_loss": -23.66120719909668, "global_step": 180392, "epoch": 2173} {"train_loss": -23.931604385375977, "global_step": 180393, "epoch": 2173} {"train_loss": -23.80729103088379, "global_step": 180394, "epoch": 2173} {"train_loss": -23.729053497314453, "global_step": 180395, "epoch": 2173} {"train_loss": -23.978473663330078, "global_step": 180396, "epoch": 2173} {"train_loss": -24.160537719726562, "global_step": 180397, "epoch": 2173} {"train_loss": -24.408823013305664, "global_step": 180398, "epoch": 2173} {"train_loss": -23.835660934448242, "global_step": 180399, "epoch": 2173} {"train_loss": -23.864376068115234, "global_step": 180400, "epoch": 2173} {"train_loss": -23.955968856811523, "global_step": 180401, "epoch": 2173} {"train_loss": -23.84058952331543, "global_step": 180402, "epoch": 2173} {"train_loss": -23.71407127380371, "global_step": 180403, "epoch": 2173} {"train_loss": -23.342294692993164, "global_step": 180404, "epoch": 2173} {"train_loss": -23.8195743560791, "global_step": 180405, "epoch": 2173} {"train_loss": -23.613758087158203, "global_step": 180406, "epoch": 2173} {"train_loss": -23.325597763061523, "global_step": 180407, "epoch": 2173} {"train_loss": -23.69161033630371, "global_step": 180408, "epoch": 2173} {"train_loss": -23.523300170898438, "global_step": 180409, "epoch": 2173} {"train_loss": -23.50394630432129, "global_step": 180410, "epoch": 2173} {"train_loss": -23.882177352905273, "global_step": 180411, "epoch": 2173} {"train_loss": -24.138639450073242, "global_step": 180412, "epoch": 2173} {"train_loss": -23.785789489746094, "global_step": 180413, "epoch": 2173} {"train_loss": -23.783588409423828, "global_step": 180414, "epoch": 2173} {"train_loss": -23.636554718017578, "global_step": 180415, "epoch": 2173} {"train_loss": -23.758943557739258, "global_step": 180416, "epoch": 2173} {"train_loss": -23.729652404785156, "global_step": 180417, "epoch": 2173} {"train_loss": -23.886110305786133, "global_step": 180418, "epoch": 2173} {"train_loss": -23.69502067565918, "global_step": 180419, "epoch": 2173} {"train_loss": -23.679121017456055, "global_step": 180420, "epoch": 2173} {"train_loss": -23.865528106689453, "global_step": 180421, "epoch": 2173} {"train_loss": -24.047090530395508, "global_step": 180422, "epoch": 2173} {"train_loss": -23.9693660736084, "global_step": 180423, "epoch": 2173} {"train_loss": -24.05051040649414, "global_step": 180424, "epoch": 2173} {"train_loss": -24.239301681518555, "global_step": 180425, "epoch": 2173} {"train_loss": -24.091320037841797, "global_step": 180426, "epoch": 2173} {"train_loss": -23.974868774414062, "global_step": 180427, "epoch": 2173} {"train_loss": -23.8497257232666, "global_step": 180428, "epoch": 2173} {"train_loss": -24.11530113220215, "global_step": 180429, "epoch": 2173} {"train_loss": -23.923755645751953, "global_step": 180430, "epoch": 2173} {"train_loss": -24.04233169555664, "global_step": 180431, "epoch": 2173} {"train_loss": -23.556371688842773, "global_step": 180432, "epoch": 2173} {"train_loss": -24.204923629760742, "global_step": 180433, "epoch": 2173} {"train_loss": -24.041940689086914, "global_step": 180434, "epoch": 2173} {"train_loss": -23.916030883789062, "global_step": 180435, "epoch": 2173} {"train_loss": -23.876012802124023, "global_step": 180436, "epoch": 2173} {"train_loss": -24.023101806640625, "global_step": 180437, "epoch": 2173} {"train_loss": -24.041458129882812, "global_step": 180438, "epoch": 2173} {"train_loss": -23.874860763549805, "global_step": 180439, "epoch": 2173} {"train_loss": -24.140958786010742, "global_step": 180440, "epoch": 2173} {"train_loss": -23.718360303396203, "global_step": 180441, "epoch": 2173, "val_loss": 6499515.0} {"train_loss": -23.506433486938477, "global_step": 180442, "epoch": 2174} {"train_loss": -23.477033615112305, "global_step": 180443, "epoch": 2174} {"train_loss": -23.35255241394043, "global_step": 180444, "epoch": 2174} {"train_loss": -23.684663772583008, "global_step": 180445, "epoch": 2174} {"train_loss": -23.59737205505371, "global_step": 180446, "epoch": 2174} {"train_loss": -23.77469825744629, "global_step": 180447, "epoch": 2174} {"train_loss": -23.343421936035156, "global_step": 180448, "epoch": 2174} {"train_loss": -23.808584213256836, "global_step": 180449, "epoch": 2174} {"train_loss": -23.4580020904541, "global_step": 180450, "epoch": 2174} {"train_loss": -23.54374885559082, "global_step": 180451, "epoch": 2174} {"train_loss": -23.728139877319336, "global_step": 180452, "epoch": 2174} {"train_loss": -24.22187614440918, "global_step": 180453, "epoch": 2174} {"train_loss": -23.70241355895996, "global_step": 180454, "epoch": 2174} {"train_loss": -23.564321517944336, "global_step": 180455, "epoch": 2174} {"train_loss": -24.09488296508789, "global_step": 180456, "epoch": 2174} {"train_loss": -23.400598526000977, "global_step": 180457, "epoch": 2174} {"train_loss": -23.616727828979492, "global_step": 180458, "epoch": 2174} {"train_loss": -23.57565689086914, "global_step": 180459, "epoch": 2174} {"train_loss": -23.807069778442383, "global_step": 180460, "epoch": 2174} {"train_loss": -23.706466674804688, "global_step": 180461, "epoch": 2174} {"train_loss": -23.80073356628418, "global_step": 180462, "epoch": 2174} {"train_loss": -23.88593101501465, "global_step": 180463, "epoch": 2174} {"train_loss": -23.73602294921875, "global_step": 180464, "epoch": 2174} {"train_loss": -24.046606063842773, "global_step": 180465, "epoch": 2174} {"train_loss": -24.01191520690918, "global_step": 180466, "epoch": 2174} {"train_loss": -23.853673934936523, "global_step": 180467, "epoch": 2174} {"train_loss": -23.616657257080078, "global_step": 180468, "epoch": 2174} {"train_loss": -23.840707778930664, "global_step": 180469, "epoch": 2174} {"train_loss": -23.999967575073242, "global_step": 180470, "epoch": 2174} {"train_loss": -23.952871322631836, "global_step": 180471, "epoch": 2174} {"train_loss": -23.868762969970703, "global_step": 180472, "epoch": 2174} {"train_loss": -23.512413024902344, "global_step": 180473, "epoch": 2174} {"train_loss": -23.866931915283203, "global_step": 180474, "epoch": 2174} {"train_loss": -23.983890533447266, "global_step": 180475, "epoch": 2174} {"train_loss": -23.92154312133789, "global_step": 180476, "epoch": 2174} {"train_loss": -24.137861251831055, "global_step": 180477, "epoch": 2174} {"train_loss": -23.930099487304688, "global_step": 180478, "epoch": 2174} {"train_loss": -24.014616012573242, "global_step": 180479, "epoch": 2174} {"train_loss": -23.4140625, "global_step": 180480, "epoch": 2174} {"train_loss": -23.790191650390625, "global_step": 180481, "epoch": 2174} {"train_loss": -24.260269165039062, "global_step": 180482, "epoch": 2174} {"train_loss": -23.19887351989746, "global_step": 180483, "epoch": 2174} {"train_loss": -23.55079460144043, "global_step": 180484, "epoch": 2174} {"train_loss": -23.358051300048828, "global_step": 180485, "epoch": 2174} {"train_loss": -23.870573043823242, "global_step": 180486, "epoch": 2174} {"train_loss": -23.692697525024414, "global_step": 180487, "epoch": 2174} {"train_loss": -23.75027847290039, "global_step": 180488, "epoch": 2174} {"train_loss": -23.801176071166992, "global_step": 180489, "epoch": 2174} {"train_loss": -23.505826950073242, "global_step": 180490, "epoch": 2174} {"train_loss": -23.75946044921875, "global_step": 180491, "epoch": 2174} {"train_loss": -23.873334884643555, "global_step": 180492, "epoch": 2174} {"train_loss": -23.982297897338867, "global_step": 180493, "epoch": 2174} {"train_loss": -23.55856704711914, "global_step": 180494, "epoch": 2174} {"train_loss": -23.80665397644043, "global_step": 180495, "epoch": 2174} {"train_loss": -23.687803268432617, "global_step": 180496, "epoch": 2174} {"train_loss": -23.82169532775879, "global_step": 180497, "epoch": 2174} {"train_loss": -23.845224380493164, "global_step": 180498, "epoch": 2174} {"train_loss": -24.126331329345703, "global_step": 180499, "epoch": 2174} {"train_loss": -24.457509994506836, "global_step": 180500, "epoch": 2174} {"train_loss": -24.28700828552246, "global_step": 180501, "epoch": 2174} {"train_loss": -24.184661865234375, "global_step": 180502, "epoch": 2174} {"train_loss": -24.210418701171875, "global_step": 180503, "epoch": 2174} {"train_loss": -23.847736358642578, "global_step": 180504, "epoch": 2174} {"train_loss": -23.73591423034668, "global_step": 180505, "epoch": 2174} {"train_loss": -23.99420166015625, "global_step": 180506, "epoch": 2174} {"train_loss": -23.80469512939453, "global_step": 180507, "epoch": 2174} {"train_loss": -24.035280227661133, "global_step": 180508, "epoch": 2174} {"train_loss": -23.76136016845703, "global_step": 180509, "epoch": 2174} {"train_loss": -23.87986946105957, "global_step": 180510, "epoch": 2174} {"train_loss": -23.898969650268555, "global_step": 180511, "epoch": 2174} {"train_loss": -24.05147933959961, "global_step": 180512, "epoch": 2174} {"train_loss": -24.00837516784668, "global_step": 180513, "epoch": 2174} {"train_loss": -23.57245445251465, "global_step": 180514, "epoch": 2174} {"train_loss": -24.089895248413086, "global_step": 180515, "epoch": 2174} {"train_loss": -23.926673889160156, "global_step": 180516, "epoch": 2174} {"train_loss": -24.152334213256836, "global_step": 180517, "epoch": 2174} {"train_loss": -23.790924072265625, "global_step": 180518, "epoch": 2174} {"train_loss": -23.628442764282227, "global_step": 180519, "epoch": 2174} {"train_loss": -23.83635139465332, "global_step": 180520, "epoch": 2174} {"train_loss": -24.17803382873535, "global_step": 180521, "epoch": 2174} {"train_loss": -23.983835220336914, "global_step": 180522, "epoch": 2174} {"train_loss": -23.701894760131836, "global_step": 180523, "epoch": 2174} {"train_loss": -23.816984544317407, "global_step": 180524, "epoch": 2174, "val_loss": 6635115.0} {"train_loss": -22.951560974121094, "global_step": 180525, "epoch": 2175} {"train_loss": -23.796049118041992, "global_step": 180526, "epoch": 2175} {"train_loss": -23.16293716430664, "global_step": 180527, "epoch": 2175} {"train_loss": -23.01655387878418, "global_step": 180528, "epoch": 2175} {"train_loss": -22.885671615600586, "global_step": 180529, "epoch": 2175} {"train_loss": -23.336755752563477, "global_step": 180530, "epoch": 2175} {"train_loss": -23.421045303344727, "global_step": 180531, "epoch": 2175} {"train_loss": -23.553674697875977, "global_step": 180532, "epoch": 2175} {"train_loss": -23.811800003051758, "global_step": 180533, "epoch": 2175} {"train_loss": -23.282230377197266, "global_step": 180534, "epoch": 2175} {"train_loss": -23.548551559448242, "global_step": 180535, "epoch": 2175} {"train_loss": -23.5751953125, "global_step": 180536, "epoch": 2175} {"train_loss": -23.971681594848633, "global_step": 180537, "epoch": 2175} {"train_loss": -23.659427642822266, "global_step": 180538, "epoch": 2175} {"train_loss": -23.66628074645996, "global_step": 180539, "epoch": 2175} {"train_loss": -23.573833465576172, "global_step": 180540, "epoch": 2175} {"train_loss": -23.850339889526367, "global_step": 180541, "epoch": 2175} {"train_loss": -23.976076126098633, "global_step": 180542, "epoch": 2175} {"train_loss": -23.48063087463379, "global_step": 180543, "epoch": 2175} {"train_loss": -23.909223556518555, "global_step": 180544, "epoch": 2175} {"train_loss": -23.63201904296875, "global_step": 180545, "epoch": 2175} {"train_loss": -23.73824119567871, "global_step": 180546, "epoch": 2175} {"train_loss": -23.845458984375, "global_step": 180547, "epoch": 2175} {"train_loss": -23.64987564086914, "global_step": 180548, "epoch": 2175} {"train_loss": -24.16368865966797, "global_step": 180549, "epoch": 2175} {"train_loss": -23.92047691345215, "global_step": 180550, "epoch": 2175} {"train_loss": -23.846227645874023, "global_step": 180551, "epoch": 2175} {"train_loss": -23.956937789916992, "global_step": 180552, "epoch": 2175} {"train_loss": -24.009037017822266, "global_step": 180553, "epoch": 2175} {"train_loss": -23.97532081604004, "global_step": 180554, "epoch": 2175} {"train_loss": -24.088369369506836, "global_step": 180555, "epoch": 2175} {"train_loss": -24.084365844726562, "global_step": 180556, "epoch": 2175} {"train_loss": -24.194717407226562, "global_step": 180557, "epoch": 2175} {"train_loss": -23.940900802612305, "global_step": 180558, "epoch": 2175} {"train_loss": -23.885761260986328, "global_step": 180559, "epoch": 2175} {"train_loss": -24.045263290405273, "global_step": 180560, "epoch": 2175} {"train_loss": -24.006460189819336, "global_step": 180561, "epoch": 2175} {"train_loss": -24.16959571838379, "global_step": 180562, "epoch": 2175} {"train_loss": -23.86529541015625, "global_step": 180563, "epoch": 2175} {"train_loss": -23.940698623657227, "global_step": 180564, "epoch": 2175} {"train_loss": -23.614612579345703, "global_step": 180565, "epoch": 2175} {"train_loss": -24.166975021362305, "global_step": 180566, "epoch": 2175} {"train_loss": -23.849210739135742, "global_step": 180567, "epoch": 2175} {"train_loss": -23.807538986206055, "global_step": 180568, "epoch": 2175} {"train_loss": -23.87546730041504, "global_step": 180569, "epoch": 2175} {"train_loss": -23.715620040893555, "global_step": 180570, "epoch": 2175} {"train_loss": -23.940977096557617, "global_step": 180571, "epoch": 2175} {"train_loss": -23.520206451416016, "global_step": 180572, "epoch": 2175} {"train_loss": -23.992341995239258, "global_step": 180573, "epoch": 2175} {"train_loss": -24.35719108581543, "global_step": 180574, "epoch": 2175} {"train_loss": -24.29147720336914, "global_step": 180575, "epoch": 2175} {"train_loss": -23.69596290588379, "global_step": 180576, "epoch": 2175} {"train_loss": -23.62163734436035, "global_step": 180577, "epoch": 2175} {"train_loss": -23.787338256835938, "global_step": 180578, "epoch": 2175} {"train_loss": -24.32906150817871, "global_step": 180579, "epoch": 2175} {"train_loss": -23.95295524597168, "global_step": 180580, "epoch": 2175} {"train_loss": -24.006643295288086, "global_step": 180581, "epoch": 2175} {"train_loss": -24.069183349609375, "global_step": 180582, "epoch": 2175} {"train_loss": -24.219532012939453, "global_step": 180583, "epoch": 2175} {"train_loss": -23.957563400268555, "global_step": 180584, "epoch": 2175} {"train_loss": -24.103107452392578, "global_step": 180585, "epoch": 2175} {"train_loss": -23.648849487304688, "global_step": 180586, "epoch": 2175} {"train_loss": -24.151609420776367, "global_step": 180587, "epoch": 2175} {"train_loss": -23.72480583190918, "global_step": 180588, "epoch": 2175} {"train_loss": -23.84354019165039, "global_step": 180589, "epoch": 2175} {"train_loss": -24.057703018188477, "global_step": 180590, "epoch": 2175} {"train_loss": -23.897708892822266, "global_step": 180591, "epoch": 2175} {"train_loss": -23.727060317993164, "global_step": 180592, "epoch": 2175} {"train_loss": -23.83489418029785, "global_step": 180593, "epoch": 2175} {"train_loss": -23.866455078125, "global_step": 180594, "epoch": 2175} {"train_loss": -23.786067962646484, "global_step": 180595, "epoch": 2175} {"train_loss": -23.584936141967773, "global_step": 180596, "epoch": 2175} {"train_loss": -23.739168167114258, "global_step": 180597, "epoch": 2175} {"train_loss": -23.856725692749023, "global_step": 180598, "epoch": 2175} {"train_loss": -23.74076271057129, "global_step": 180599, "epoch": 2175} {"train_loss": -23.62856101989746, "global_step": 180600, "epoch": 2175} {"train_loss": -23.610376358032227, "global_step": 180601, "epoch": 2175} {"train_loss": -24.02630043029785, "global_step": 180602, "epoch": 2175} {"train_loss": -23.909765243530273, "global_step": 180603, "epoch": 2175} {"train_loss": -23.715612411499023, "global_step": 180604, "epoch": 2175} {"train_loss": -23.83229637145996, "global_step": 180605, "epoch": 2175} {"train_loss": -23.9785213470459, "global_step": 180606, "epoch": 2175} {"train_loss": -23.817864567400463, "global_step": 180607, "epoch": 2175, "val_loss": 6454011.0} {"train_loss": -23.396512985229492, "global_step": 180608, "epoch": 2176} {"train_loss": -22.974197387695312, "global_step": 180609, "epoch": 2176} {"train_loss": -23.09682846069336, "global_step": 180610, "epoch": 2176} {"train_loss": -23.616718292236328, "global_step": 180611, "epoch": 2176} {"train_loss": -23.05708885192871, "global_step": 180612, "epoch": 2176} {"train_loss": -23.738468170166016, "global_step": 180613, "epoch": 2176} {"train_loss": -23.114437103271484, "global_step": 180614, "epoch": 2176} {"train_loss": -23.441070556640625, "global_step": 180615, "epoch": 2176} {"train_loss": -23.734281539916992, "global_step": 180616, "epoch": 2176} {"train_loss": -23.48487663269043, "global_step": 180617, "epoch": 2176} {"train_loss": -23.2780704498291, "global_step": 180618, "epoch": 2176} {"train_loss": -23.800256729125977, "global_step": 180619, "epoch": 2176} {"train_loss": -23.275108337402344, "global_step": 180620, "epoch": 2176} {"train_loss": -23.750431060791016, "global_step": 180621, "epoch": 2176} {"train_loss": -23.526382446289062, "global_step": 180622, "epoch": 2176} {"train_loss": -23.56477165222168, "global_step": 180623, "epoch": 2176} {"train_loss": -23.787139892578125, "global_step": 180624, "epoch": 2176} {"train_loss": -23.49968719482422, "global_step": 180625, "epoch": 2176} {"train_loss": -23.794368743896484, "global_step": 180626, "epoch": 2176} {"train_loss": -23.88864517211914, "global_step": 180627, "epoch": 2176} {"train_loss": -23.498870849609375, "global_step": 180628, "epoch": 2176} {"train_loss": -23.841754913330078, "global_step": 180629, "epoch": 2176} {"train_loss": -23.83492660522461, "global_step": 180630, "epoch": 2176} {"train_loss": -23.700862884521484, "global_step": 180631, "epoch": 2176} {"train_loss": -24.020771026611328, "global_step": 180632, "epoch": 2176} {"train_loss": -23.747793197631836, "global_step": 180633, "epoch": 2176} {"train_loss": -23.799606323242188, "global_step": 180634, "epoch": 2176} {"train_loss": -23.638364791870117, "global_step": 180635, "epoch": 2176} {"train_loss": -23.792144775390625, "global_step": 180636, "epoch": 2176} {"train_loss": -23.72209930419922, "global_step": 180637, "epoch": 2176} {"train_loss": -24.249940872192383, "global_step": 180638, "epoch": 2176} {"train_loss": -23.823238372802734, "global_step": 180639, "epoch": 2176} {"train_loss": -23.782655715942383, "global_step": 180640, "epoch": 2176} {"train_loss": -23.935304641723633, "global_step": 180641, "epoch": 2176} {"train_loss": -23.918212890625, "global_step": 180642, "epoch": 2176} {"train_loss": -23.828062057495117, "global_step": 180643, "epoch": 2176} {"train_loss": -24.0500545501709, "global_step": 180644, "epoch": 2176} {"train_loss": -23.92878532409668, "global_step": 180645, "epoch": 2176} {"train_loss": -23.60127830505371, "global_step": 180646, "epoch": 2176} {"train_loss": -23.95278549194336, "global_step": 180647, "epoch": 2176} {"train_loss": -24.151620864868164, "global_step": 180648, "epoch": 2176} {"train_loss": -23.922903060913086, "global_step": 180649, "epoch": 2176} {"train_loss": -23.40096092224121, "global_step": 180650, "epoch": 2176} {"train_loss": -23.703876495361328, "global_step": 180651, "epoch": 2176} {"train_loss": -23.973234176635742, "global_step": 180652, "epoch": 2176} {"train_loss": -23.883243560791016, "global_step": 180653, "epoch": 2176} {"train_loss": -23.75661277770996, "global_step": 180654, "epoch": 2176} {"train_loss": -24.214214324951172, "global_step": 180655, "epoch": 2176} {"train_loss": -23.67535972595215, "global_step": 180656, "epoch": 2176} {"train_loss": -23.731592178344727, "global_step": 180657, "epoch": 2176} {"train_loss": -24.0554256439209, "global_step": 180658, "epoch": 2176} {"train_loss": -23.925273895263672, "global_step": 180659, "epoch": 2176} {"train_loss": -24.012693405151367, "global_step": 180660, "epoch": 2176} {"train_loss": -23.848344802856445, "global_step": 180661, "epoch": 2176} {"train_loss": -23.88323402404785, "global_step": 180662, "epoch": 2176} {"train_loss": -24.427621841430664, "global_step": 180663, "epoch": 2176} {"train_loss": -23.62979507446289, "global_step": 180664, "epoch": 2176} {"train_loss": -23.94183921813965, "global_step": 180665, "epoch": 2176} {"train_loss": -24.121164321899414, "global_step": 180666, "epoch": 2176} {"train_loss": -23.769731521606445, "global_step": 180667, "epoch": 2176} {"train_loss": -23.83846092224121, "global_step": 180668, "epoch": 2176} {"train_loss": -23.847930908203125, "global_step": 180669, "epoch": 2176} {"train_loss": -23.811737060546875, "global_step": 180670, "epoch": 2176} {"train_loss": -24.010168075561523, "global_step": 180671, "epoch": 2176} {"train_loss": -23.89862060546875, "global_step": 180672, "epoch": 2176} {"train_loss": -24.063688278198242, "global_step": 180673, "epoch": 2176} {"train_loss": -23.45833969116211, "global_step": 180674, "epoch": 2176} {"train_loss": -23.594409942626953, "global_step": 180675, "epoch": 2176} {"train_loss": -23.620229721069336, "global_step": 180676, "epoch": 2176} {"train_loss": -24.151708602905273, "global_step": 180677, "epoch": 2176} {"train_loss": -24.074111938476562, "global_step": 180678, "epoch": 2176} {"train_loss": -24.154754638671875, "global_step": 180679, "epoch": 2176} {"train_loss": -23.842824935913086, "global_step": 180680, "epoch": 2176} {"train_loss": -24.213300704956055, "global_step": 180681, "epoch": 2176} {"train_loss": -24.36200714111328, "global_step": 180682, "epoch": 2176} {"train_loss": -24.21424674987793, "global_step": 180683, "epoch": 2176} {"train_loss": -24.265775680541992, "global_step": 180684, "epoch": 2176} {"train_loss": -24.19179344177246, "global_step": 180685, "epoch": 2176} {"train_loss": -24.128799438476562, "global_step": 180686, "epoch": 2176} {"train_loss": -23.944839477539062, "global_step": 180687, "epoch": 2176} {"train_loss": -23.955129623413086, "global_step": 180688, "epoch": 2176} {"train_loss": -23.923343658447266, "global_step": 180689, "epoch": 2176} {"train_loss": -23.788756726736047, "global_step": 180690, "epoch": 2176, "val_loss": 6557196.0} {"train_loss": -23.76816749572754, "global_step": 180691, "epoch": 2177} {"train_loss": -23.324783325195312, "global_step": 180692, "epoch": 2177} {"train_loss": -23.17950439453125, "global_step": 180693, "epoch": 2177} {"train_loss": -23.379560470581055, "global_step": 180694, "epoch": 2177} {"train_loss": -23.43837547302246, "global_step": 180695, "epoch": 2177} {"train_loss": -23.738645553588867, "global_step": 180696, "epoch": 2177} {"train_loss": -23.595991134643555, "global_step": 180697, "epoch": 2177} {"train_loss": -23.729578018188477, "global_step": 180698, "epoch": 2177} {"train_loss": -23.95857810974121, "global_step": 180699, "epoch": 2177} {"train_loss": -23.276309967041016, "global_step": 180700, "epoch": 2177} {"train_loss": -23.496366500854492, "global_step": 180701, "epoch": 2177} {"train_loss": -23.39395523071289, "global_step": 180702, "epoch": 2177} {"train_loss": -23.75235939025879, "global_step": 180703, "epoch": 2177} {"train_loss": -23.778493881225586, "global_step": 180704, "epoch": 2177} {"train_loss": -23.639820098876953, "global_step": 180705, "epoch": 2177} {"train_loss": -23.51215171813965, "global_step": 180706, "epoch": 2177} {"train_loss": -23.46431541442871, "global_step": 180707, "epoch": 2177} {"train_loss": -23.356481552124023, "global_step": 180708, "epoch": 2177} {"train_loss": -23.54689598083496, "global_step": 180709, "epoch": 2177} {"train_loss": -23.56153678894043, "global_step": 180710, "epoch": 2177} {"train_loss": -23.87763786315918, "global_step": 180711, "epoch": 2177} {"train_loss": -23.825210571289062, "global_step": 180712, "epoch": 2177} {"train_loss": -23.599836349487305, "global_step": 180713, "epoch": 2177} {"train_loss": -23.923139572143555, "global_step": 180714, "epoch": 2177} {"train_loss": -23.754056930541992, "global_step": 180715, "epoch": 2177} {"train_loss": -24.073698043823242, "global_step": 180716, "epoch": 2177} {"train_loss": -23.563871383666992, "global_step": 180717, "epoch": 2177} {"train_loss": -23.908117294311523, "global_step": 180718, "epoch": 2177} {"train_loss": -23.982946395874023, "global_step": 180719, "epoch": 2177} {"train_loss": -24.148387908935547, "global_step": 180720, "epoch": 2177} {"train_loss": -23.81098747253418, "global_step": 180721, "epoch": 2177} {"train_loss": -23.706520080566406, "global_step": 180722, "epoch": 2177} {"train_loss": -23.872936248779297, "global_step": 180723, "epoch": 2177} {"train_loss": -24.360660552978516, "global_step": 180724, "epoch": 2177} {"train_loss": -24.110939025878906, "global_step": 180725, "epoch": 2177} {"train_loss": -23.89385414123535, "global_step": 180726, "epoch": 2177} {"train_loss": -23.861642837524414, "global_step": 180727, "epoch": 2177} {"train_loss": -23.855562210083008, "global_step": 180728, "epoch": 2177} {"train_loss": -24.247116088867188, "global_step": 180729, "epoch": 2177} {"train_loss": -24.10713005065918, "global_step": 180730, "epoch": 2177} {"train_loss": -23.725326538085938, "global_step": 180731, "epoch": 2177} {"train_loss": -23.947036743164062, "global_step": 180732, "epoch": 2177} {"train_loss": -24.078916549682617, "global_step": 180733, "epoch": 2177} {"train_loss": -23.813581466674805, "global_step": 180734, "epoch": 2177} {"train_loss": -23.929136276245117, "global_step": 180735, "epoch": 2177} {"train_loss": -24.095396041870117, "global_step": 180736, "epoch": 2177} {"train_loss": -24.100095748901367, "global_step": 180737, "epoch": 2177} {"train_loss": -24.016403198242188, "global_step": 180738, "epoch": 2177} {"train_loss": -24.179916381835938, "global_step": 180739, "epoch": 2177} {"train_loss": -24.033926010131836, "global_step": 180740, "epoch": 2177} {"train_loss": -23.791913986206055, "global_step": 180741, "epoch": 2177} {"train_loss": -24.153976440429688, "global_step": 180742, "epoch": 2177} {"train_loss": -23.704748153686523, "global_step": 180743, "epoch": 2177} {"train_loss": -23.704898834228516, "global_step": 180744, "epoch": 2177} {"train_loss": -23.652755737304688, "global_step": 180745, "epoch": 2177} {"train_loss": -23.804630279541016, "global_step": 180746, "epoch": 2177} {"train_loss": -23.543264389038086, "global_step": 180747, "epoch": 2177} {"train_loss": -23.999414443969727, "global_step": 180748, "epoch": 2177} {"train_loss": -24.049585342407227, "global_step": 180749, "epoch": 2177} {"train_loss": -24.199996948242188, "global_step": 180750, "epoch": 2177} {"train_loss": -23.825998306274414, "global_step": 180751, "epoch": 2177} {"train_loss": -24.117942810058594, "global_step": 180752, "epoch": 2177} {"train_loss": -23.96750259399414, "global_step": 180753, "epoch": 2177} {"train_loss": -23.63808250427246, "global_step": 180754, "epoch": 2177} {"train_loss": -24.247821807861328, "global_step": 180755, "epoch": 2177} {"train_loss": -23.16440773010254, "global_step": 180756, "epoch": 2177} {"train_loss": -24.083406448364258, "global_step": 180757, "epoch": 2177} {"train_loss": -23.768878936767578, "global_step": 180758, "epoch": 2177} {"train_loss": -23.606767654418945, "global_step": 180759, "epoch": 2177} {"train_loss": -23.24059295654297, "global_step": 180760, "epoch": 2177} {"train_loss": -23.841903686523438, "global_step": 180761, "epoch": 2177} {"train_loss": -23.37864875793457, "global_step": 180762, "epoch": 2177} {"train_loss": -23.62796401977539, "global_step": 180763, "epoch": 2177} {"train_loss": -24.127756118774414, "global_step": 180764, "epoch": 2177} {"train_loss": -23.853012084960938, "global_step": 180765, "epoch": 2177} {"train_loss": -23.409833908081055, "global_step": 180766, "epoch": 2177} {"train_loss": -24.0237979888916, "global_step": 180767, "epoch": 2177} {"train_loss": -23.618947982788086, "global_step": 180768, "epoch": 2177} {"train_loss": -23.54783058166504, "global_step": 180769, "epoch": 2177} {"train_loss": -24.132902145385742, "global_step": 180770, "epoch": 2177} {"train_loss": -23.830968856811523, "global_step": 180771, "epoch": 2177} {"train_loss": -23.83591651916504, "global_step": 180772, "epoch": 2177} {"train_loss": -23.788619512535004, "global_step": 180773, "epoch": 2177, "val_loss": 6496152.0} {"train_loss": -24.005088806152344, "global_step": 180774, "epoch": 2178} {"train_loss": -23.718263626098633, "global_step": 180775, "epoch": 2178} {"train_loss": -23.720083236694336, "global_step": 180776, "epoch": 2178} {"train_loss": -23.668485641479492, "global_step": 180777, "epoch": 2178} {"train_loss": -23.402780532836914, "global_step": 180778, "epoch": 2178} {"train_loss": -23.37504005432129, "global_step": 180779, "epoch": 2178} {"train_loss": -23.53450584411621, "global_step": 180780, "epoch": 2178} {"train_loss": -23.586050033569336, "global_step": 180781, "epoch": 2178} {"train_loss": -23.480249404907227, "global_step": 180782, "epoch": 2178} {"train_loss": -23.67763328552246, "global_step": 180783, "epoch": 2178} {"train_loss": -23.633529663085938, "global_step": 180784, "epoch": 2178} {"train_loss": -23.459226608276367, "global_step": 180785, "epoch": 2178} {"train_loss": -23.926319122314453, "global_step": 180786, "epoch": 2178} {"train_loss": -23.804065704345703, "global_step": 180787, "epoch": 2178} {"train_loss": -23.654911041259766, "global_step": 180788, "epoch": 2178} {"train_loss": -23.837615966796875, "global_step": 180789, "epoch": 2178} {"train_loss": -23.86085319519043, "global_step": 180790, "epoch": 2178} {"train_loss": -23.68534278869629, "global_step": 180791, "epoch": 2178} {"train_loss": -24.07822036743164, "global_step": 180792, "epoch": 2178} {"train_loss": -23.655431747436523, "global_step": 180793, "epoch": 2178} {"train_loss": -23.427289962768555, "global_step": 180794, "epoch": 2178} {"train_loss": -23.59919548034668, "global_step": 180795, "epoch": 2178} {"train_loss": -23.085859298706055, "global_step": 180796, "epoch": 2178} {"train_loss": -23.668989181518555, "global_step": 180797, "epoch": 2178} {"train_loss": -23.566226959228516, "global_step": 180798, "epoch": 2178} {"train_loss": -23.642704010009766, "global_step": 180799, "epoch": 2178} {"train_loss": -23.633649826049805, "global_step": 180800, "epoch": 2178} {"train_loss": -23.89887809753418, "global_step": 180801, "epoch": 2178} {"train_loss": -23.753080368041992, "global_step": 180802, "epoch": 2178} {"train_loss": -24.020004272460938, "global_step": 180803, "epoch": 2178} {"train_loss": -24.21187400817871, "global_step": 180804, "epoch": 2178} {"train_loss": -24.12870216369629, "global_step": 180805, "epoch": 2178} {"train_loss": -23.782590866088867, "global_step": 180806, "epoch": 2178} {"train_loss": -24.062259674072266, "global_step": 180807, "epoch": 2178} {"train_loss": -23.9816951751709, "global_step": 180808, "epoch": 2178} {"train_loss": -23.948041915893555, "global_step": 180809, "epoch": 2178} {"train_loss": -23.86348533630371, "global_step": 180810, "epoch": 2178} {"train_loss": -24.024871826171875, "global_step": 180811, "epoch": 2178} {"train_loss": -23.941648483276367, "global_step": 180812, "epoch": 2178} {"train_loss": -24.004650115966797, "global_step": 180813, "epoch": 2178} {"train_loss": -24.021333694458008, "global_step": 180814, "epoch": 2178} {"train_loss": -23.575769424438477, "global_step": 180815, "epoch": 2178} {"train_loss": -23.888940811157227, "global_step": 180816, "epoch": 2178} {"train_loss": -23.84661293029785, "global_step": 180817, "epoch": 2178} {"train_loss": -23.9440860748291, "global_step": 180818, "epoch": 2178} {"train_loss": -24.046682357788086, "global_step": 180819, "epoch": 2178} {"train_loss": -24.41179656982422, "global_step": 180820, "epoch": 2178} {"train_loss": -23.67527198791504, "global_step": 180821, "epoch": 2178} {"train_loss": -23.864126205444336, "global_step": 180822, "epoch": 2178} {"train_loss": -24.025081634521484, "global_step": 180823, "epoch": 2178} {"train_loss": -23.621572494506836, "global_step": 180824, "epoch": 2178} {"train_loss": -24.472074508666992, "global_step": 180825, "epoch": 2178} {"train_loss": -23.74830436706543, "global_step": 180826, "epoch": 2178} {"train_loss": -24.021289825439453, "global_step": 180827, "epoch": 2178} {"train_loss": -23.98404312133789, "global_step": 180828, "epoch": 2178} {"train_loss": -23.782209396362305, "global_step": 180829, "epoch": 2178} {"train_loss": -24.046871185302734, "global_step": 180830, "epoch": 2178} {"train_loss": -23.978126525878906, "global_step": 180831, "epoch": 2178} {"train_loss": -24.058292388916016, "global_step": 180832, "epoch": 2178} {"train_loss": -24.181978225708008, "global_step": 180833, "epoch": 2178} {"train_loss": -23.86861801147461, "global_step": 180834, "epoch": 2178} {"train_loss": -23.979787826538086, "global_step": 180835, "epoch": 2178} {"train_loss": -23.639755249023438, "global_step": 180836, "epoch": 2178} {"train_loss": -24.14644432067871, "global_step": 180837, "epoch": 2178} {"train_loss": -23.776996612548828, "global_step": 180838, "epoch": 2178} {"train_loss": -23.772798538208008, "global_step": 180839, "epoch": 2178} {"train_loss": -23.70286750793457, "global_step": 180840, "epoch": 2178} {"train_loss": -23.96558952331543, "global_step": 180841, "epoch": 2178} {"train_loss": -24.169384002685547, "global_step": 180842, "epoch": 2178} {"train_loss": -23.86131477355957, "global_step": 180843, "epoch": 2178} {"train_loss": -23.981199264526367, "global_step": 180844, "epoch": 2178} {"train_loss": -24.12993812561035, "global_step": 180845, "epoch": 2178} {"train_loss": -23.988056182861328, "global_step": 180846, "epoch": 2178} {"train_loss": -23.678739547729492, "global_step": 180847, "epoch": 2178} {"train_loss": -24.27687644958496, "global_step": 180848, "epoch": 2178} {"train_loss": -23.490402221679688, "global_step": 180849, "epoch": 2178} {"train_loss": -23.999937057495117, "global_step": 180850, "epoch": 2178} {"train_loss": -23.978525161743164, "global_step": 180851, "epoch": 2178} {"train_loss": -23.561182022094727, "global_step": 180852, "epoch": 2178} {"train_loss": -23.63165855407715, "global_step": 180853, "epoch": 2178} {"train_loss": -24.098716735839844, "global_step": 180854, "epoch": 2178} {"train_loss": -23.58955955505371, "global_step": 180855, "epoch": 2178} {"train_loss": -23.82657912840326, "global_step": 180856, "epoch": 2178, "val_loss": 6517583.0} {"train_loss": -20.20724105834961, "global_step": 180857, "epoch": 2179} {"train_loss": -23.08489990234375, "global_step": 180858, "epoch": 2179} {"train_loss": -21.88551902770996, "global_step": 180859, "epoch": 2179} {"train_loss": -22.91632080078125, "global_step": 180860, "epoch": 2179} {"train_loss": -22.18715476989746, "global_step": 180861, "epoch": 2179} {"train_loss": -22.96906852722168, "global_step": 180862, "epoch": 2179} {"train_loss": -23.03073501586914, "global_step": 180863, "epoch": 2179} {"train_loss": -23.0682315826416, "global_step": 180864, "epoch": 2179} {"train_loss": -23.214807510375977, "global_step": 180865, "epoch": 2179} {"train_loss": -23.037403106689453, "global_step": 180866, "epoch": 2179} {"train_loss": -22.979572296142578, "global_step": 180867, "epoch": 2179} {"train_loss": -23.301130294799805, "global_step": 180868, "epoch": 2179} {"train_loss": -23.383527755737305, "global_step": 180869, "epoch": 2179} {"train_loss": -23.276248931884766, "global_step": 180870, "epoch": 2179} {"train_loss": -23.280012130737305, "global_step": 180871, "epoch": 2179} {"train_loss": -23.564279556274414, "global_step": 180872, "epoch": 2179} {"train_loss": -23.648160934448242, "global_step": 180873, "epoch": 2179} {"train_loss": -22.9831600189209, "global_step": 180874, "epoch": 2179} {"train_loss": -23.03224754333496, "global_step": 180875, "epoch": 2179} {"train_loss": -23.589588165283203, "global_step": 180876, "epoch": 2179} {"train_loss": -23.915822982788086, "global_step": 180877, "epoch": 2179} {"train_loss": -23.232608795166016, "global_step": 180878, "epoch": 2179} {"train_loss": -23.580469131469727, "global_step": 180879, "epoch": 2179} {"train_loss": -23.65546226501465, "global_step": 180880, "epoch": 2179} {"train_loss": -23.627838134765625, "global_step": 180881, "epoch": 2179} {"train_loss": -23.9923095703125, "global_step": 180882, "epoch": 2179} {"train_loss": -23.820432662963867, "global_step": 180883, "epoch": 2179} {"train_loss": -23.208513259887695, "global_step": 180884, "epoch": 2179} {"train_loss": -23.622722625732422, "global_step": 180885, "epoch": 2179} {"train_loss": -23.596860885620117, "global_step": 180886, "epoch": 2179} {"train_loss": -23.556629180908203, "global_step": 180887, "epoch": 2179} {"train_loss": -23.555648803710938, "global_step": 180888, "epoch": 2179} {"train_loss": -23.879545211791992, "global_step": 180889, "epoch": 2179} {"train_loss": -23.65074348449707, "global_step": 180890, "epoch": 2179} {"train_loss": -23.663009643554688, "global_step": 180891, "epoch": 2179} {"train_loss": -24.17079734802246, "global_step": 180892, "epoch": 2179} {"train_loss": -23.666486740112305, "global_step": 180893, "epoch": 2179} {"train_loss": -23.86649513244629, "global_step": 180894, "epoch": 2179} {"train_loss": -23.47237777709961, "global_step": 180895, "epoch": 2179} {"train_loss": -23.742650985717773, "global_step": 180896, "epoch": 2179} {"train_loss": -23.98605728149414, "global_step": 180897, "epoch": 2179} {"train_loss": -24.08045196533203, "global_step": 180898, "epoch": 2179} {"train_loss": -23.858346939086914, "global_step": 180899, "epoch": 2179} {"train_loss": -24.181310653686523, "global_step": 180900, "epoch": 2179} {"train_loss": -23.584339141845703, "global_step": 180901, "epoch": 2179} {"train_loss": -24.137088775634766, "global_step": 180902, "epoch": 2179} {"train_loss": -23.82314109802246, "global_step": 180903, "epoch": 2179} {"train_loss": -23.9803466796875, "global_step": 180904, "epoch": 2179} {"train_loss": -23.941730499267578, "global_step": 180905, "epoch": 2179} {"train_loss": -23.96369743347168, "global_step": 180906, "epoch": 2179} {"train_loss": -24.05321502685547, "global_step": 180907, "epoch": 2179} {"train_loss": -24.05426788330078, "global_step": 180908, "epoch": 2179} {"train_loss": -23.83905601501465, "global_step": 180909, "epoch": 2179} {"train_loss": -24.08194923400879, "global_step": 180910, "epoch": 2179} {"train_loss": -23.844152450561523, "global_step": 180911, "epoch": 2179} {"train_loss": -23.72075080871582, "global_step": 180912, "epoch": 2179} {"train_loss": -23.753173828125, "global_step": 180913, "epoch": 2179} {"train_loss": -24.079212188720703, "global_step": 180914, "epoch": 2179} {"train_loss": -23.623510360717773, "global_step": 180915, "epoch": 2179} {"train_loss": -23.898998260498047, "global_step": 180916, "epoch": 2179} {"train_loss": -23.891672134399414, "global_step": 180917, "epoch": 2179} {"train_loss": -24.198888778686523, "global_step": 180918, "epoch": 2179} {"train_loss": -23.77985382080078, "global_step": 180919, "epoch": 2179} {"train_loss": -24.24477195739746, "global_step": 180920, "epoch": 2179} {"train_loss": -24.084741592407227, "global_step": 180921, "epoch": 2179} {"train_loss": -23.865150451660156, "global_step": 180922, "epoch": 2179} {"train_loss": -23.919021606445312, "global_step": 180923, "epoch": 2179} {"train_loss": -24.116985321044922, "global_step": 180924, "epoch": 2179} {"train_loss": -23.85354232788086, "global_step": 180925, "epoch": 2179} {"train_loss": -24.429227828979492, "global_step": 180926, "epoch": 2179} {"train_loss": -23.85470962524414, "global_step": 180927, "epoch": 2179} {"train_loss": -24.187185287475586, "global_step": 180928, "epoch": 2179} {"train_loss": -23.882184982299805, "global_step": 180929, "epoch": 2179} {"train_loss": -23.92494773864746, "global_step": 180930, "epoch": 2179} {"train_loss": -24.03765869140625, "global_step": 180931, "epoch": 2179} {"train_loss": -24.17974281311035, "global_step": 180932, "epoch": 2179} {"train_loss": -23.765779495239258, "global_step": 180933, "epoch": 2179} {"train_loss": -24.203683853149414, "global_step": 180934, "epoch": 2179} {"train_loss": -24.160179138183594, "global_step": 180935, "epoch": 2179} {"train_loss": -24.215604782104492, "global_step": 180936, "epoch": 2179} {"train_loss": -23.581314086914062, "global_step": 180937, "epoch": 2179} {"train_loss": -23.669832229614258, "global_step": 180938, "epoch": 2179} {"train_loss": -23.653219429843396, "global_step": 180939, "epoch": 2179, "val_loss": 6423705.0} {"train_loss": -20.924884796142578, "global_step": 180940, "epoch": 2180} {"train_loss": -22.192550659179688, "global_step": 180941, "epoch": 2180} {"train_loss": -22.864953994750977, "global_step": 180942, "epoch": 2180} {"train_loss": -22.401498794555664, "global_step": 180943, "epoch": 2180} {"train_loss": -22.367931365966797, "global_step": 180944, "epoch": 2180} {"train_loss": -22.465673446655273, "global_step": 180945, "epoch": 2180} {"train_loss": -22.771255493164062, "global_step": 180946, "epoch": 2180} {"train_loss": -22.805646896362305, "global_step": 180947, "epoch": 2180} {"train_loss": -23.08182716369629, "global_step": 180948, "epoch": 2180} {"train_loss": -23.13862419128418, "global_step": 180949, "epoch": 2180} {"train_loss": -23.03997039794922, "global_step": 180950, "epoch": 2180} {"train_loss": -23.006938934326172, "global_step": 180951, "epoch": 2180} {"train_loss": -23.53099822998047, "global_step": 180952, "epoch": 2180} {"train_loss": -23.495803833007812, "global_step": 180953, "epoch": 2180} {"train_loss": -23.401403427124023, "global_step": 180954, "epoch": 2180} {"train_loss": -22.879756927490234, "global_step": 180955, "epoch": 2180} {"train_loss": -23.1238956451416, "global_step": 180956, "epoch": 2180} {"train_loss": -23.30659294128418, "global_step": 180957, "epoch": 2180} {"train_loss": -23.049955368041992, "global_step": 180958, "epoch": 2180} {"train_loss": -23.2241268157959, "global_step": 180959, "epoch": 2180} {"train_loss": -23.610071182250977, "global_step": 180960, "epoch": 2180} {"train_loss": -23.821195602416992, "global_step": 180961, "epoch": 2180} {"train_loss": -23.700363159179688, "global_step": 180962, "epoch": 2180} {"train_loss": -23.129053115844727, "global_step": 180963, "epoch": 2180} {"train_loss": -24.033916473388672, "global_step": 180964, "epoch": 2180} {"train_loss": -23.26561164855957, "global_step": 180965, "epoch": 2180} {"train_loss": -23.73188018798828, "global_step": 180966, "epoch": 2180} {"train_loss": -23.68787956237793, "global_step": 180967, "epoch": 2180} {"train_loss": -23.569501876831055, "global_step": 180968, "epoch": 2180} {"train_loss": -23.775436401367188, "global_step": 180969, "epoch": 2180} {"train_loss": -24.10822105407715, "global_step": 180970, "epoch": 2180} {"train_loss": -23.4544620513916, "global_step": 180971, "epoch": 2180} {"train_loss": -23.555322647094727, "global_step": 180972, "epoch": 2180} {"train_loss": -23.54694938659668, "global_step": 180973, "epoch": 2180} {"train_loss": -23.814085006713867, "global_step": 180974, "epoch": 2180} {"train_loss": -23.655513763427734, "global_step": 180975, "epoch": 2180} {"train_loss": -23.62918472290039, "global_step": 180976, "epoch": 2180} {"train_loss": -23.625089645385742, "global_step": 180977, "epoch": 2180} {"train_loss": -23.8272762298584, "global_step": 180978, "epoch": 2180} {"train_loss": -23.647302627563477, "global_step": 180979, "epoch": 2180} {"train_loss": -23.83963394165039, "global_step": 180980, "epoch": 2180} {"train_loss": -23.708770751953125, "global_step": 180981, "epoch": 2180} {"train_loss": -23.731494903564453, "global_step": 180982, "epoch": 2180} {"train_loss": -24.046552658081055, "global_step": 180983, "epoch": 2180} {"train_loss": -23.988248825073242, "global_step": 180984, "epoch": 2180} {"train_loss": -24.25284767150879, "global_step": 180985, "epoch": 2180} {"train_loss": -24.042264938354492, "global_step": 180986, "epoch": 2180} {"train_loss": -24.11474609375, "global_step": 180987, "epoch": 2180} {"train_loss": -24.117450714111328, "global_step": 180988, "epoch": 2180} {"train_loss": -24.163114547729492, "global_step": 180989, "epoch": 2180} {"train_loss": -24.072769165039062, "global_step": 180990, "epoch": 2180} {"train_loss": -24.1721248626709, "global_step": 180991, "epoch": 2180} {"train_loss": -23.8873348236084, "global_step": 180992, "epoch": 2180} {"train_loss": -23.8912410736084, "global_step": 180993, "epoch": 2180} {"train_loss": -23.980051040649414, "global_step": 180994, "epoch": 2180} {"train_loss": -24.189865112304688, "global_step": 180995, "epoch": 2180} {"train_loss": -23.94662094116211, "global_step": 180996, "epoch": 2180} {"train_loss": -23.945194244384766, "global_step": 180997, "epoch": 2180} {"train_loss": -24.061872482299805, "global_step": 180998, "epoch": 2180} {"train_loss": -24.056066513061523, "global_step": 180999, "epoch": 2180} {"train_loss": -23.789417266845703, "global_step": 181000, "epoch": 2180} {"train_loss": -24.189666748046875, "global_step": 181001, "epoch": 2180} {"train_loss": -23.798166275024414, "global_step": 181002, "epoch": 2180} {"train_loss": -23.892139434814453, "global_step": 181003, "epoch": 2180} {"train_loss": -24.187667846679688, "global_step": 181004, "epoch": 2180} {"train_loss": -24.2807559967041, "global_step": 181005, "epoch": 2180} {"train_loss": -23.464683532714844, "global_step": 181006, "epoch": 2180} {"train_loss": -23.764572143554688, "global_step": 181007, "epoch": 2180} {"train_loss": -23.59803009033203, "global_step": 181008, "epoch": 2180} {"train_loss": -24.14777946472168, "global_step": 181009, "epoch": 2180} {"train_loss": -23.916038513183594, "global_step": 181010, "epoch": 2180} {"train_loss": -23.8350772857666, "global_step": 181011, "epoch": 2180} {"train_loss": -24.055774688720703, "global_step": 181012, "epoch": 2180} {"train_loss": -24.378305435180664, "global_step": 181013, "epoch": 2180} {"train_loss": -23.9804630279541, "global_step": 181014, "epoch": 2180} {"train_loss": -24.11774253845215, "global_step": 181015, "epoch": 2180} {"train_loss": -24.470670700073242, "global_step": 181016, "epoch": 2180} {"train_loss": -24.017335891723633, "global_step": 181017, "epoch": 2180} {"train_loss": -23.74799156188965, "global_step": 181018, "epoch": 2180} {"train_loss": -24.09765625, "global_step": 181019, "epoch": 2180} {"train_loss": -24.28314781188965, "global_step": 181020, "epoch": 2180} {"train_loss": -24.299436569213867, "global_step": 181021, "epoch": 2180} {"train_loss": -23.643146468932372, "global_step": 181022, "epoch": 2180, "val_loss": 6516205.0} {"train_loss": -22.686534881591797, "global_step": 181023, "epoch": 2181} {"train_loss": -23.70602798461914, "global_step": 181024, "epoch": 2181} {"train_loss": -23.27607536315918, "global_step": 181025, "epoch": 2181} {"train_loss": -22.721158981323242, "global_step": 181026, "epoch": 2181} {"train_loss": -23.532291412353516, "global_step": 181027, "epoch": 2181} {"train_loss": -23.218097686767578, "global_step": 181028, "epoch": 2181} {"train_loss": -23.820737838745117, "global_step": 181029, "epoch": 2181} {"train_loss": -23.356557846069336, "global_step": 181030, "epoch": 2181} {"train_loss": -23.69849967956543, "global_step": 181031, "epoch": 2181} {"train_loss": -23.771947860717773, "global_step": 181032, "epoch": 2181} {"train_loss": -23.63934898376465, "global_step": 181033, "epoch": 2181} {"train_loss": -23.750051498413086, "global_step": 181034, "epoch": 2181} {"train_loss": -23.94944190979004, "global_step": 181035, "epoch": 2181} {"train_loss": -23.72720718383789, "global_step": 181036, "epoch": 2181} {"train_loss": -23.6967716217041, "global_step": 181037, "epoch": 2181} {"train_loss": -24.014196395874023, "global_step": 181038, "epoch": 2181} {"train_loss": -23.521846771240234, "global_step": 181039, "epoch": 2181} {"train_loss": -23.46784782409668, "global_step": 181040, "epoch": 2181} {"train_loss": -23.698150634765625, "global_step": 181041, "epoch": 2181} {"train_loss": -23.76647186279297, "global_step": 181042, "epoch": 2181} {"train_loss": -23.866559982299805, "global_step": 181043, "epoch": 2181} {"train_loss": -23.866838455200195, "global_step": 181044, "epoch": 2181} {"train_loss": -23.659360885620117, "global_step": 181045, "epoch": 2181} {"train_loss": -23.629356384277344, "global_step": 181046, "epoch": 2181} {"train_loss": -23.7220458984375, "global_step": 181047, "epoch": 2181} {"train_loss": -24.193429946899414, "global_step": 181048, "epoch": 2181} {"train_loss": -23.448938369750977, "global_step": 181049, "epoch": 2181} {"train_loss": -24.19614028930664, "global_step": 181050, "epoch": 2181} {"train_loss": -23.815433502197266, "global_step": 181051, "epoch": 2181} {"train_loss": -24.038558959960938, "global_step": 181052, "epoch": 2181} {"train_loss": -23.692333221435547, "global_step": 181053, "epoch": 2181} {"train_loss": -23.911052703857422, "global_step": 181054, "epoch": 2181} {"train_loss": -23.775409698486328, "global_step": 181055, "epoch": 2181} {"train_loss": -23.831289291381836, "global_step": 181056, "epoch": 2181} {"train_loss": -23.97531509399414, "global_step": 181057, "epoch": 2181} {"train_loss": -24.268329620361328, "global_step": 181058, "epoch": 2181} {"train_loss": -24.098464965820312, "global_step": 181059, "epoch": 2181} {"train_loss": -23.594623565673828, "global_step": 181060, "epoch": 2181} {"train_loss": -23.764644622802734, "global_step": 181061, "epoch": 2181} {"train_loss": -24.144514083862305, "global_step": 181062, "epoch": 2181} {"train_loss": -24.02290916442871, "global_step": 181063, "epoch": 2181} {"train_loss": -24.143421173095703, "global_step": 181064, "epoch": 2181} {"train_loss": -23.90679359436035, "global_step": 181065, "epoch": 2181} {"train_loss": -24.139272689819336, "global_step": 181066, "epoch": 2181} {"train_loss": -24.03722381591797, "global_step": 181067, "epoch": 2181} {"train_loss": -24.350900650024414, "global_step": 181068, "epoch": 2181} {"train_loss": -23.829526901245117, "global_step": 181069, "epoch": 2181} {"train_loss": -23.9086971282959, "global_step": 181070, "epoch": 2181} {"train_loss": -24.13559341430664, "global_step": 181071, "epoch": 2181} {"train_loss": -23.52610206604004, "global_step": 181072, "epoch": 2181} {"train_loss": -24.088882446289062, "global_step": 181073, "epoch": 2181} {"train_loss": -23.904878616333008, "global_step": 181074, "epoch": 2181} {"train_loss": -23.488616943359375, "global_step": 181075, "epoch": 2181} {"train_loss": -23.919965744018555, "global_step": 181076, "epoch": 2181} {"train_loss": -23.907865524291992, "global_step": 181077, "epoch": 2181} {"train_loss": -23.9025936126709, "global_step": 181078, "epoch": 2181} {"train_loss": -23.701547622680664, "global_step": 181079, "epoch": 2181} {"train_loss": -24.030302047729492, "global_step": 181080, "epoch": 2181} {"train_loss": -23.937955856323242, "global_step": 181081, "epoch": 2181} {"train_loss": -23.7782039642334, "global_step": 181082, "epoch": 2181} {"train_loss": -23.796464920043945, "global_step": 181083, "epoch": 2181} {"train_loss": -23.43125343322754, "global_step": 181084, "epoch": 2181} {"train_loss": -24.210248947143555, "global_step": 181085, "epoch": 2181} {"train_loss": -23.85205078125, "global_step": 181086, "epoch": 2181} {"train_loss": -23.84030532836914, "global_step": 181087, "epoch": 2181} {"train_loss": -24.147464752197266, "global_step": 181088, "epoch": 2181} {"train_loss": -23.75472068786621, "global_step": 181089, "epoch": 2181} {"train_loss": -24.013240814208984, "global_step": 181090, "epoch": 2181} {"train_loss": -24.36403465270996, "global_step": 181091, "epoch": 2181} {"train_loss": -24.108369827270508, "global_step": 181092, "epoch": 2181} {"train_loss": -24.158950805664062, "global_step": 181093, "epoch": 2181} {"train_loss": -23.947734832763672, "global_step": 181094, "epoch": 2181} {"train_loss": -23.605188369750977, "global_step": 181095, "epoch": 2181} {"train_loss": -23.344070434570312, "global_step": 181096, "epoch": 2181} {"train_loss": -23.63776397705078, "global_step": 181097, "epoch": 2181} {"train_loss": -24.18533706665039, "global_step": 181098, "epoch": 2181} {"train_loss": -24.230539321899414, "global_step": 181099, "epoch": 2181} {"train_loss": -23.888080596923828, "global_step": 181100, "epoch": 2181} {"train_loss": -23.9597225189209, "global_step": 181101, "epoch": 2181} {"train_loss": -23.90145492553711, "global_step": 181102, "epoch": 2181} {"train_loss": -24.09296417236328, "global_step": 181103, "epoch": 2181} {"train_loss": -24.106016159057617, "global_step": 181104, "epoch": 2181} {"train_loss": -23.809783085283026, "global_step": 181105, "epoch": 2181, "val_loss": 6462615.5} {"train_loss": -23.79469108581543, "global_step": 181106, "epoch": 2182} {"train_loss": -23.41228485107422, "global_step": 181107, "epoch": 2182} {"train_loss": -23.623401641845703, "global_step": 181108, "epoch": 2182} {"train_loss": -24.13975715637207, "global_step": 181109, "epoch": 2182} {"train_loss": -23.671241760253906, "global_step": 181110, "epoch": 2182} {"train_loss": -23.81154441833496, "global_step": 181111, "epoch": 2182} {"train_loss": -23.898672103881836, "global_step": 181112, "epoch": 2182} {"train_loss": -23.980045318603516, "global_step": 181113, "epoch": 2182} {"train_loss": -23.317243576049805, "global_step": 181114, "epoch": 2182} {"train_loss": -24.34444236755371, "global_step": 181115, "epoch": 2182} {"train_loss": -23.683095932006836, "global_step": 181116, "epoch": 2182} {"train_loss": -23.728906631469727, "global_step": 181117, "epoch": 2182} {"train_loss": -24.025741577148438, "global_step": 181118, "epoch": 2182} {"train_loss": -23.850339889526367, "global_step": 181119, "epoch": 2182} {"train_loss": -23.977031707763672, "global_step": 181120, "epoch": 2182} {"train_loss": -23.799266815185547, "global_step": 181121, "epoch": 2182} {"train_loss": -23.77507209777832, "global_step": 181122, "epoch": 2182} {"train_loss": -23.792865753173828, "global_step": 181123, "epoch": 2182} {"train_loss": -23.824745178222656, "global_step": 181124, "epoch": 2182} {"train_loss": -23.853525161743164, "global_step": 181125, "epoch": 2182} {"train_loss": -24.086483001708984, "global_step": 181126, "epoch": 2182} {"train_loss": -23.87166976928711, "global_step": 181127, "epoch": 2182} {"train_loss": -24.14596939086914, "global_step": 181128, "epoch": 2182} {"train_loss": -24.29597282409668, "global_step": 181129, "epoch": 2182} {"train_loss": -24.128881454467773, "global_step": 181130, "epoch": 2182} {"train_loss": -24.259252548217773, "global_step": 181131, "epoch": 2182} {"train_loss": -23.68257713317871, "global_step": 181132, "epoch": 2182} {"train_loss": -23.955188751220703, "global_step": 181133, "epoch": 2182} {"train_loss": -24.172391891479492, "global_step": 181134, "epoch": 2182} {"train_loss": -23.76348304748535, "global_step": 181135, "epoch": 2182} {"train_loss": -23.828458786010742, "global_step": 181136, "epoch": 2182} {"train_loss": -24.267431259155273, "global_step": 181137, "epoch": 2182} {"train_loss": -23.863889694213867, "global_step": 181138, "epoch": 2182} {"train_loss": -24.494525909423828, "global_step": 181139, "epoch": 2182} {"train_loss": -23.939918518066406, "global_step": 181140, "epoch": 2182} {"train_loss": -23.81071662902832, "global_step": 181141, "epoch": 2182} {"train_loss": -23.783559799194336, "global_step": 181142, "epoch": 2182} {"train_loss": -23.84773063659668, "global_step": 181143, "epoch": 2182} {"train_loss": -23.960006713867188, "global_step": 181144, "epoch": 2182} {"train_loss": -23.776620864868164, "global_step": 181145, "epoch": 2182} {"train_loss": -23.549890518188477, "global_step": 181146, "epoch": 2182} {"train_loss": -23.670881271362305, "global_step": 181147, "epoch": 2182} {"train_loss": -23.76905632019043, "global_step": 181148, "epoch": 2182} {"train_loss": -23.58656120300293, "global_step": 181149, "epoch": 2182} {"train_loss": -23.921781539916992, "global_step": 181150, "epoch": 2182} {"train_loss": -22.958768844604492, "global_step": 181151, "epoch": 2182} {"train_loss": -23.528587341308594, "global_step": 181152, "epoch": 2182} {"train_loss": -24.038639068603516, "global_step": 181153, "epoch": 2182} {"train_loss": -23.535324096679688, "global_step": 181154, "epoch": 2182} {"train_loss": -23.695037841796875, "global_step": 181155, "epoch": 2182} {"train_loss": -23.9013671875, "global_step": 181156, "epoch": 2182} {"train_loss": -23.759328842163086, "global_step": 181157, "epoch": 2182} {"train_loss": -23.887155532836914, "global_step": 181158, "epoch": 2182} {"train_loss": -23.725126266479492, "global_step": 181159, "epoch": 2182} {"train_loss": -23.84354591369629, "global_step": 181160, "epoch": 2182} {"train_loss": -23.70374870300293, "global_step": 181161, "epoch": 2182} {"train_loss": -23.198623657226562, "global_step": 181162, "epoch": 2182} {"train_loss": -23.685928344726562, "global_step": 181163, "epoch": 2182} {"train_loss": -23.53663444519043, "global_step": 181164, "epoch": 2182} {"train_loss": -23.8228702545166, "global_step": 181165, "epoch": 2182} {"train_loss": -23.867334365844727, "global_step": 181166, "epoch": 2182} {"train_loss": -23.5922794342041, "global_step": 181167, "epoch": 2182} {"train_loss": -23.773229598999023, "global_step": 181168, "epoch": 2182} {"train_loss": -23.863462448120117, "global_step": 181169, "epoch": 2182} {"train_loss": -23.580078125, "global_step": 181170, "epoch": 2182} {"train_loss": -23.950407028198242, "global_step": 181171, "epoch": 2182} {"train_loss": -23.796905517578125, "global_step": 181172, "epoch": 2182} {"train_loss": -23.649507522583008, "global_step": 181173, "epoch": 2182} {"train_loss": -23.82145118713379, "global_step": 181174, "epoch": 2182} {"train_loss": -23.900415420532227, "global_step": 181175, "epoch": 2182} {"train_loss": -24.0241756439209, "global_step": 181176, "epoch": 2182} {"train_loss": -23.76657485961914, "global_step": 181177, "epoch": 2182} {"train_loss": -23.262277603149414, "global_step": 181178, "epoch": 2182} {"train_loss": -23.611255645751953, "global_step": 181179, "epoch": 2182} {"train_loss": -23.89754295349121, "global_step": 181180, "epoch": 2182} {"train_loss": -23.747343063354492, "global_step": 181181, "epoch": 2182} {"train_loss": -23.87322235107422, "global_step": 181182, "epoch": 2182} {"train_loss": -24.047473907470703, "global_step": 181183, "epoch": 2182} {"train_loss": -23.88445472717285, "global_step": 181184, "epoch": 2182} {"train_loss": -23.66058921813965, "global_step": 181185, "epoch": 2182} {"train_loss": -24.116891860961914, "global_step": 181186, "epoch": 2182} {"train_loss": -24.016101837158203, "global_step": 181187, "epoch": 2182} {"train_loss": -23.828534965055535, "global_step": 181188, "epoch": 2182, "val_loss": 6479037.5} {"train_loss": -23.472930908203125, "global_step": 181189, "epoch": 2183} {"train_loss": -23.75924301147461, "global_step": 181190, "epoch": 2183} {"train_loss": -23.34325408935547, "global_step": 181191, "epoch": 2183} {"train_loss": -23.657550811767578, "global_step": 181192, "epoch": 2183} {"train_loss": -23.31098747253418, "global_step": 181193, "epoch": 2183} {"train_loss": -23.24830436706543, "global_step": 181194, "epoch": 2183} {"train_loss": -23.237031936645508, "global_step": 181195, "epoch": 2183} {"train_loss": -23.809431076049805, "global_step": 181196, "epoch": 2183} {"train_loss": -23.243942260742188, "global_step": 181197, "epoch": 2183} {"train_loss": -23.31488037109375, "global_step": 181198, "epoch": 2183} {"train_loss": -23.519433975219727, "global_step": 181199, "epoch": 2183} {"train_loss": -23.390661239624023, "global_step": 181200, "epoch": 2183} {"train_loss": -23.302865982055664, "global_step": 181201, "epoch": 2183} {"train_loss": -23.76255989074707, "global_step": 181202, "epoch": 2183} {"train_loss": -24.055715560913086, "global_step": 181203, "epoch": 2183} {"train_loss": -24.20902442932129, "global_step": 181204, "epoch": 2183} {"train_loss": -23.804277420043945, "global_step": 181205, "epoch": 2183} {"train_loss": -23.589635848999023, "global_step": 181206, "epoch": 2183} {"train_loss": -23.852209091186523, "global_step": 181207, "epoch": 2183} {"train_loss": -24.081851959228516, "global_step": 181208, "epoch": 2183} {"train_loss": -23.36324119567871, "global_step": 181209, "epoch": 2183} {"train_loss": -23.851144790649414, "global_step": 181210, "epoch": 2183} {"train_loss": -23.739547729492188, "global_step": 181211, "epoch": 2183} {"train_loss": -24.19378662109375, "global_step": 181212, "epoch": 2183} {"train_loss": -24.120634078979492, "global_step": 181213, "epoch": 2183} {"train_loss": -23.7548828125, "global_step": 181214, "epoch": 2183} {"train_loss": -23.735965728759766, "global_step": 181215, "epoch": 2183} {"train_loss": -23.743854522705078, "global_step": 181216, "epoch": 2183} {"train_loss": -23.585346221923828, "global_step": 181217, "epoch": 2183} {"train_loss": -24.350168228149414, "global_step": 181218, "epoch": 2183} {"train_loss": -23.995012283325195, "global_step": 181219, "epoch": 2183} {"train_loss": -24.064428329467773, "global_step": 181220, "epoch": 2183} {"train_loss": -24.251802444458008, "global_step": 181221, "epoch": 2183} {"train_loss": -24.284414291381836, "global_step": 181222, "epoch": 2183} {"train_loss": -24.357242584228516, "global_step": 181223, "epoch": 2183} {"train_loss": -24.12578773498535, "global_step": 181224, "epoch": 2183} {"train_loss": -24.054645538330078, "global_step": 181225, "epoch": 2183} {"train_loss": -23.72568130493164, "global_step": 181226, "epoch": 2183} {"train_loss": -23.91497802734375, "global_step": 181227, "epoch": 2183} {"train_loss": -24.108421325683594, "global_step": 181228, "epoch": 2183} {"train_loss": -23.91228485107422, "global_step": 181229, "epoch": 2183} {"train_loss": -24.14777946472168, "global_step": 181230, "epoch": 2183} {"train_loss": -23.91283416748047, "global_step": 181231, "epoch": 2183} {"train_loss": -23.90447998046875, "global_step": 181232, "epoch": 2183} {"train_loss": -23.93049430847168, "global_step": 181233, "epoch": 2183} {"train_loss": -24.090633392333984, "global_step": 181234, "epoch": 2183} {"train_loss": -24.166595458984375, "global_step": 181235, "epoch": 2183} {"train_loss": -23.907642364501953, "global_step": 181236, "epoch": 2183} {"train_loss": -23.98516845703125, "global_step": 181237, "epoch": 2183} {"train_loss": -24.069217681884766, "global_step": 181238, "epoch": 2183} {"train_loss": -24.36961555480957, "global_step": 181239, "epoch": 2183} {"train_loss": -24.014423370361328, "global_step": 181240, "epoch": 2183} {"train_loss": -24.107757568359375, "global_step": 181241, "epoch": 2183} {"train_loss": -23.53389549255371, "global_step": 181242, "epoch": 2183} {"train_loss": -23.18304443359375, "global_step": 181243, "epoch": 2183} {"train_loss": -23.386442184448242, "global_step": 181244, "epoch": 2183} {"train_loss": -23.895126342773438, "global_step": 181245, "epoch": 2183} {"train_loss": -23.456174850463867, "global_step": 181246, "epoch": 2183} {"train_loss": -24.16065788269043, "global_step": 181247, "epoch": 2183} {"train_loss": -23.498422622680664, "global_step": 181248, "epoch": 2183} {"train_loss": -23.95377540588379, "global_step": 181249, "epoch": 2183} {"train_loss": -24.093643188476562, "global_step": 181250, "epoch": 2183} {"train_loss": -23.790422439575195, "global_step": 181251, "epoch": 2183} {"train_loss": -23.51312828063965, "global_step": 181252, "epoch": 2183} {"train_loss": -23.917633056640625, "global_step": 181253, "epoch": 2183} {"train_loss": -23.989013671875, "global_step": 181254, "epoch": 2183} {"train_loss": -23.677541732788086, "global_step": 181255, "epoch": 2183} {"train_loss": -23.961210250854492, "global_step": 181256, "epoch": 2183} {"train_loss": -24.174789428710938, "global_step": 181257, "epoch": 2183} {"train_loss": -23.776357650756836, "global_step": 181258, "epoch": 2183} {"train_loss": -23.769927978515625, "global_step": 181259, "epoch": 2183} {"train_loss": -23.77000617980957, "global_step": 181260, "epoch": 2183} {"train_loss": -23.685630798339844, "global_step": 181261, "epoch": 2183} {"train_loss": -23.708494186401367, "global_step": 181262, "epoch": 2183} {"train_loss": -24.197113037109375, "global_step": 181263, "epoch": 2183} {"train_loss": -23.968521118164062, "global_step": 181264, "epoch": 2183} {"train_loss": -24.26139259338379, "global_step": 181265, "epoch": 2183} {"train_loss": -24.204435348510742, "global_step": 181266, "epoch": 2183} {"train_loss": -23.756052017211914, "global_step": 181267, "epoch": 2183} {"train_loss": -24.05877685546875, "global_step": 181268, "epoch": 2183} {"train_loss": -24.31450843811035, "global_step": 181269, "epoch": 2183} {"train_loss": -24.156612396240234, "global_step": 181270, "epoch": 2183} {"train_loss": -23.860193344483893, "global_step": 181271, "epoch": 2183, "val_loss": 6486790.0} {"train_loss": -23.390838623046875, "global_step": 181272, "epoch": 2184} {"train_loss": -23.815046310424805, "global_step": 181273, "epoch": 2184} {"train_loss": -23.473514556884766, "global_step": 181274, "epoch": 2184} {"train_loss": -23.87204360961914, "global_step": 181275, "epoch": 2184} {"train_loss": -23.849775314331055, "global_step": 181276, "epoch": 2184} {"train_loss": -23.538410186767578, "global_step": 181277, "epoch": 2184} {"train_loss": -23.571191787719727, "global_step": 181278, "epoch": 2184} {"train_loss": -23.916553497314453, "global_step": 181279, "epoch": 2184} {"train_loss": -23.628122329711914, "global_step": 181280, "epoch": 2184} {"train_loss": -24.15879249572754, "global_step": 181281, "epoch": 2184} {"train_loss": -23.736642837524414, "global_step": 181282, "epoch": 2184} {"train_loss": -23.892343521118164, "global_step": 181283, "epoch": 2184} {"train_loss": -23.79155921936035, "global_step": 181284, "epoch": 2184} {"train_loss": -23.842737197875977, "global_step": 181285, "epoch": 2184} {"train_loss": -23.921255111694336, "global_step": 181286, "epoch": 2184} {"train_loss": -23.735525131225586, "global_step": 181287, "epoch": 2184} {"train_loss": -23.781391143798828, "global_step": 181288, "epoch": 2184} {"train_loss": -23.851621627807617, "global_step": 181289, "epoch": 2184} {"train_loss": -23.74030876159668, "global_step": 181290, "epoch": 2184} {"train_loss": -24.128936767578125, "global_step": 181291, "epoch": 2184} {"train_loss": -23.884923934936523, "global_step": 181292, "epoch": 2184} {"train_loss": -23.719499588012695, "global_step": 181293, "epoch": 2184} {"train_loss": -23.777721405029297, "global_step": 181294, "epoch": 2184} {"train_loss": -23.869298934936523, "global_step": 181295, "epoch": 2184} {"train_loss": -23.877384185791016, "global_step": 181296, "epoch": 2184} {"train_loss": -24.170654296875, "global_step": 181297, "epoch": 2184} {"train_loss": -23.89432716369629, "global_step": 181298, "epoch": 2184} {"train_loss": -24.139266967773438, "global_step": 181299, "epoch": 2184} {"train_loss": -23.982715606689453, "global_step": 181300, "epoch": 2184} {"train_loss": -23.954526901245117, "global_step": 181301, "epoch": 2184} {"train_loss": -23.831449508666992, "global_step": 181302, "epoch": 2184} {"train_loss": -24.040454864501953, "global_step": 181303, "epoch": 2184} {"train_loss": -23.802968978881836, "global_step": 181304, "epoch": 2184} {"train_loss": -23.55418586730957, "global_step": 181305, "epoch": 2184} {"train_loss": -23.940153121948242, "global_step": 181306, "epoch": 2184} {"train_loss": -24.214738845825195, "global_step": 181307, "epoch": 2184} {"train_loss": -23.915454864501953, "global_step": 181308, "epoch": 2184} {"train_loss": -24.072736740112305, "global_step": 181309, "epoch": 2184} {"train_loss": -24.322248458862305, "global_step": 181310, "epoch": 2184} {"train_loss": -23.767791748046875, "global_step": 181311, "epoch": 2184} {"train_loss": -24.058032989501953, "global_step": 181312, "epoch": 2184} {"train_loss": -24.049156188964844, "global_step": 181313, "epoch": 2184} {"train_loss": -23.618263244628906, "global_step": 181314, "epoch": 2184} {"train_loss": -23.647140502929688, "global_step": 181315, "epoch": 2184} {"train_loss": -23.76056480407715, "global_step": 181316, "epoch": 2184} {"train_loss": -23.873342514038086, "global_step": 181317, "epoch": 2184} {"train_loss": -24.05716896057129, "global_step": 181318, "epoch": 2184} {"train_loss": -23.94991111755371, "global_step": 181319, "epoch": 2184} {"train_loss": -24.21973991394043, "global_step": 181320, "epoch": 2184} {"train_loss": -23.998647689819336, "global_step": 181321, "epoch": 2184} {"train_loss": -24.111364364624023, "global_step": 181322, "epoch": 2184} {"train_loss": -23.87470817565918, "global_step": 181323, "epoch": 2184} {"train_loss": -24.1846981048584, "global_step": 181324, "epoch": 2184} {"train_loss": -23.78499984741211, "global_step": 181325, "epoch": 2184} {"train_loss": -23.803678512573242, "global_step": 181326, "epoch": 2184} {"train_loss": -24.047346115112305, "global_step": 181327, "epoch": 2184} {"train_loss": -23.74117088317871, "global_step": 181328, "epoch": 2184} {"train_loss": -23.694843292236328, "global_step": 181329, "epoch": 2184} {"train_loss": -24.018310546875, "global_step": 181330, "epoch": 2184} {"train_loss": -24.104169845581055, "global_step": 181331, "epoch": 2184} {"train_loss": -24.0034236907959, "global_step": 181332, "epoch": 2184} {"train_loss": -23.9600772857666, "global_step": 181333, "epoch": 2184} {"train_loss": -24.072172164916992, "global_step": 181334, "epoch": 2184} {"train_loss": -23.849912643432617, "global_step": 181335, "epoch": 2184} {"train_loss": -24.1561279296875, "global_step": 181336, "epoch": 2184} {"train_loss": -23.938329696655273, "global_step": 181337, "epoch": 2184} {"train_loss": -24.346384048461914, "global_step": 181338, "epoch": 2184} {"train_loss": -23.871259689331055, "global_step": 181339, "epoch": 2184} {"train_loss": -23.52768898010254, "global_step": 181340, "epoch": 2184} {"train_loss": -23.630666732788086, "global_step": 181341, "epoch": 2184} {"train_loss": -23.904016494750977, "global_step": 181342, "epoch": 2184} {"train_loss": -24.040416717529297, "global_step": 181343, "epoch": 2184} {"train_loss": -23.73870086669922, "global_step": 181344, "epoch": 2184} {"train_loss": -24.027746200561523, "global_step": 181345, "epoch": 2184} {"train_loss": -24.099456787109375, "global_step": 181346, "epoch": 2184} {"train_loss": -23.596689224243164, "global_step": 181347, "epoch": 2184} {"train_loss": -23.942739486694336, "global_step": 181348, "epoch": 2184} {"train_loss": -23.63798713684082, "global_step": 181349, "epoch": 2184} {"train_loss": -23.886262893676758, "global_step": 181350, "epoch": 2184} {"train_loss": -23.46552276611328, "global_step": 181351, "epoch": 2184} {"train_loss": -23.71847915649414, "global_step": 181352, "epoch": 2184} {"train_loss": -23.780780792236328, "global_step": 181353, "epoch": 2184} {"train_loss": -23.883225153727704, "global_step": 181354, "epoch": 2184, "val_loss": 6437051.5} {"train_loss": -23.214529037475586, "global_step": 181355, "epoch": 2185} {"train_loss": -23.386056900024414, "global_step": 181356, "epoch": 2185} {"train_loss": -23.34921646118164, "global_step": 181357, "epoch": 2185} {"train_loss": -23.419757843017578, "global_step": 181358, "epoch": 2185} {"train_loss": -23.287418365478516, "global_step": 181359, "epoch": 2185} {"train_loss": -23.495304107666016, "global_step": 181360, "epoch": 2185} {"train_loss": -23.43826675415039, "global_step": 181361, "epoch": 2185} {"train_loss": -23.509933471679688, "global_step": 181362, "epoch": 2185} {"train_loss": -23.220829010009766, "global_step": 181363, "epoch": 2185} {"train_loss": -23.508058547973633, "global_step": 181364, "epoch": 2185} {"train_loss": -23.776046752929688, "global_step": 181365, "epoch": 2185} {"train_loss": -23.823965072631836, "global_step": 181366, "epoch": 2185} {"train_loss": -23.360416412353516, "global_step": 181367, "epoch": 2185} {"train_loss": -23.595184326171875, "global_step": 181368, "epoch": 2185} {"train_loss": -23.677621841430664, "global_step": 181369, "epoch": 2185} {"train_loss": -23.591283798217773, "global_step": 181370, "epoch": 2185} {"train_loss": -23.539026260375977, "global_step": 181371, "epoch": 2185} {"train_loss": -23.96151351928711, "global_step": 181372, "epoch": 2185} {"train_loss": -23.726377487182617, "global_step": 181373, "epoch": 2185} {"train_loss": -24.155548095703125, "global_step": 181374, "epoch": 2185} {"train_loss": -23.715024948120117, "global_step": 181375, "epoch": 2185} {"train_loss": -23.635679244995117, "global_step": 181376, "epoch": 2185} {"train_loss": -23.983617782592773, "global_step": 181377, "epoch": 2185} {"train_loss": -23.84627342224121, "global_step": 181378, "epoch": 2185} {"train_loss": -23.66948890686035, "global_step": 181379, "epoch": 2185} {"train_loss": -23.551334381103516, "global_step": 181380, "epoch": 2185} {"train_loss": -24.14521598815918, "global_step": 181381, "epoch": 2185} {"train_loss": -24.098623275756836, "global_step": 181382, "epoch": 2185} {"train_loss": -24.032976150512695, "global_step": 181383, "epoch": 2185} {"train_loss": -23.857358932495117, "global_step": 181384, "epoch": 2185} {"train_loss": -23.982370376586914, "global_step": 181385, "epoch": 2185} {"train_loss": -24.03782844543457, "global_step": 181386, "epoch": 2185} {"train_loss": -23.852272033691406, "global_step": 181387, "epoch": 2185} {"train_loss": -24.26531219482422, "global_step": 181388, "epoch": 2185} {"train_loss": -23.970890045166016, "global_step": 181389, "epoch": 2185} {"train_loss": -23.631484985351562, "global_step": 181390, "epoch": 2185} {"train_loss": -23.72236442565918, "global_step": 181391, "epoch": 2185} {"train_loss": -23.70445442199707, "global_step": 181392, "epoch": 2185} {"train_loss": -23.958581924438477, "global_step": 181393, "epoch": 2185} {"train_loss": -23.850980758666992, "global_step": 181394, "epoch": 2185} {"train_loss": -23.980424880981445, "global_step": 181395, "epoch": 2185} {"train_loss": -23.748092651367188, "global_step": 181396, "epoch": 2185} {"train_loss": -23.625640869140625, "global_step": 181397, "epoch": 2185} {"train_loss": -23.94322395324707, "global_step": 181398, "epoch": 2185} {"train_loss": -23.917837142944336, "global_step": 181399, "epoch": 2185} {"train_loss": -24.183698654174805, "global_step": 181400, "epoch": 2185} {"train_loss": -24.290027618408203, "global_step": 181401, "epoch": 2185} {"train_loss": -23.84669303894043, "global_step": 181402, "epoch": 2185} {"train_loss": -24.29824447631836, "global_step": 181403, "epoch": 2185} {"train_loss": -23.930402755737305, "global_step": 181404, "epoch": 2185} {"train_loss": -23.951248168945312, "global_step": 181405, "epoch": 2185} {"train_loss": -23.88116455078125, "global_step": 181406, "epoch": 2185} {"train_loss": -24.046728134155273, "global_step": 181407, "epoch": 2185} {"train_loss": -24.087167739868164, "global_step": 181408, "epoch": 2185} {"train_loss": -23.72692108154297, "global_step": 181409, "epoch": 2185} {"train_loss": -23.214435577392578, "global_step": 181410, "epoch": 2185} {"train_loss": -23.535175323486328, "global_step": 181411, "epoch": 2185} {"train_loss": -23.67499351501465, "global_step": 181412, "epoch": 2185} {"train_loss": -23.739055633544922, "global_step": 181413, "epoch": 2185} {"train_loss": -23.914703369140625, "global_step": 181414, "epoch": 2185} {"train_loss": -23.3039608001709, "global_step": 181415, "epoch": 2185} {"train_loss": -24.131412506103516, "global_step": 181416, "epoch": 2185} {"train_loss": -23.529136657714844, "global_step": 181417, "epoch": 2185} {"train_loss": -24.066434860229492, "global_step": 181418, "epoch": 2185} {"train_loss": -23.7357177734375, "global_step": 181419, "epoch": 2185} {"train_loss": -23.84650993347168, "global_step": 181420, "epoch": 2185} {"train_loss": -23.886791229248047, "global_step": 181421, "epoch": 2185} {"train_loss": -23.541234970092773, "global_step": 181422, "epoch": 2185} {"train_loss": -24.178560256958008, "global_step": 181423, "epoch": 2185} {"train_loss": -23.398357391357422, "global_step": 181424, "epoch": 2185} {"train_loss": -23.811206817626953, "global_step": 181425, "epoch": 2185} {"train_loss": -23.81756019592285, "global_step": 181426, "epoch": 2185} {"train_loss": -23.957456588745117, "global_step": 181427, "epoch": 2185} {"train_loss": -23.850595474243164, "global_step": 181428, "epoch": 2185} {"train_loss": -23.82204246520996, "global_step": 181429, "epoch": 2185} {"train_loss": -23.812360763549805, "global_step": 181430, "epoch": 2185} {"train_loss": -23.67462730407715, "global_step": 181431, "epoch": 2185} {"train_loss": -23.571632385253906, "global_step": 181432, "epoch": 2185} {"train_loss": -23.42449188232422, "global_step": 181433, "epoch": 2185} {"train_loss": -23.90816307067871, "global_step": 181434, "epoch": 2185} {"train_loss": -23.889774322509766, "global_step": 181435, "epoch": 2185} {"train_loss": -23.32457160949707, "global_step": 181436, "epoch": 2185} {"train_loss": -23.76262092590332, "global_step": 181437, "epoch": 2185, "val_loss": 6511156.0} {"train_loss": -23.836383819580078, "global_step": 181438, "epoch": 2186} {"train_loss": -23.565282821655273, "global_step": 181439, "epoch": 2186} {"train_loss": -23.23210334777832, "global_step": 181440, "epoch": 2186} {"train_loss": -23.581632614135742, "global_step": 181441, "epoch": 2186} {"train_loss": -23.506973266601562, "global_step": 181442, "epoch": 2186} {"train_loss": -23.627273559570312, "global_step": 181443, "epoch": 2186} {"train_loss": -23.81644630432129, "global_step": 181444, "epoch": 2186} {"train_loss": -23.357763290405273, "global_step": 181445, "epoch": 2186} {"train_loss": -23.7934627532959, "global_step": 181446, "epoch": 2186} {"train_loss": -23.466934204101562, "global_step": 181447, "epoch": 2186} {"train_loss": -23.640365600585938, "global_step": 181448, "epoch": 2186} {"train_loss": -23.151174545288086, "global_step": 181449, "epoch": 2186} {"train_loss": -23.98969078063965, "global_step": 181450, "epoch": 2186} {"train_loss": -23.575088500976562, "global_step": 181451, "epoch": 2186} {"train_loss": -23.80403709411621, "global_step": 181452, "epoch": 2186} {"train_loss": -23.785181045532227, "global_step": 181453, "epoch": 2186} {"train_loss": -24.103710174560547, "global_step": 181454, "epoch": 2186} {"train_loss": -23.89911651611328, "global_step": 181455, "epoch": 2186} {"train_loss": -23.755647659301758, "global_step": 181456, "epoch": 2186} {"train_loss": -24.24295425415039, "global_step": 181457, "epoch": 2186} {"train_loss": -23.782697677612305, "global_step": 181458, "epoch": 2186} {"train_loss": -24.043140411376953, "global_step": 181459, "epoch": 2186} {"train_loss": -23.78207778930664, "global_step": 181460, "epoch": 2186} {"train_loss": -23.77923011779785, "global_step": 181461, "epoch": 2186} {"train_loss": -23.542531967163086, "global_step": 181462, "epoch": 2186} {"train_loss": -23.759220123291016, "global_step": 181463, "epoch": 2186} {"train_loss": -23.661828994750977, "global_step": 181464, "epoch": 2186} {"train_loss": -24.062978744506836, "global_step": 181465, "epoch": 2186} {"train_loss": -23.626049041748047, "global_step": 181466, "epoch": 2186} {"train_loss": -23.812545776367188, "global_step": 181467, "epoch": 2186} {"train_loss": -23.974454879760742, "global_step": 181468, "epoch": 2186} {"train_loss": -23.832223892211914, "global_step": 181469, "epoch": 2186} {"train_loss": -24.017026901245117, "global_step": 181470, "epoch": 2186} {"train_loss": -23.84521484375, "global_step": 181471, "epoch": 2186} {"train_loss": -23.988882064819336, "global_step": 181472, "epoch": 2186} {"train_loss": -23.79329490661621, "global_step": 181473, "epoch": 2186} {"train_loss": -24.093631744384766, "global_step": 181474, "epoch": 2186} {"train_loss": -23.582395553588867, "global_step": 181475, "epoch": 2186} {"train_loss": -24.264577865600586, "global_step": 181476, "epoch": 2186} {"train_loss": -24.22540855407715, "global_step": 181477, "epoch": 2186} {"train_loss": -24.20587158203125, "global_step": 181478, "epoch": 2186} {"train_loss": -24.166217803955078, "global_step": 181479, "epoch": 2186} {"train_loss": -24.124252319335938, "global_step": 181480, "epoch": 2186} {"train_loss": -24.014196395874023, "global_step": 181481, "epoch": 2186} {"train_loss": -24.03934669494629, "global_step": 181482, "epoch": 2186} {"train_loss": -24.055431365966797, "global_step": 181483, "epoch": 2186} {"train_loss": -24.135374069213867, "global_step": 181484, "epoch": 2186} {"train_loss": -23.998451232910156, "global_step": 181485, "epoch": 2186} {"train_loss": -23.9344482421875, "global_step": 181486, "epoch": 2186} {"train_loss": -23.869848251342773, "global_step": 181487, "epoch": 2186} {"train_loss": -23.606143951416016, "global_step": 181488, "epoch": 2186} {"train_loss": -24.0791015625, "global_step": 181489, "epoch": 2186} {"train_loss": -24.068552017211914, "global_step": 181490, "epoch": 2186} {"train_loss": -24.158658981323242, "global_step": 181491, "epoch": 2186} {"train_loss": -24.220075607299805, "global_step": 181492, "epoch": 2186} {"train_loss": -24.13820457458496, "global_step": 181493, "epoch": 2186} {"train_loss": -24.006452560424805, "global_step": 181494, "epoch": 2186} {"train_loss": -23.790639877319336, "global_step": 181495, "epoch": 2186} {"train_loss": -24.608718872070312, "global_step": 181496, "epoch": 2186} {"train_loss": -23.76998519897461, "global_step": 181497, "epoch": 2186} {"train_loss": -23.739070892333984, "global_step": 181498, "epoch": 2186} {"train_loss": -23.841144561767578, "global_step": 181499, "epoch": 2186} {"train_loss": -23.919137954711914, "global_step": 181500, "epoch": 2186} {"train_loss": -23.8989315032959, "global_step": 181501, "epoch": 2186} {"train_loss": -23.897798538208008, "global_step": 181502, "epoch": 2186} {"train_loss": -23.690412521362305, "global_step": 181503, "epoch": 2186} {"train_loss": -23.59516716003418, "global_step": 181504, "epoch": 2186} {"train_loss": -23.7220458984375, "global_step": 181505, "epoch": 2186} {"train_loss": -23.92952537536621, "global_step": 181506, "epoch": 2186} {"train_loss": -23.5456485748291, "global_step": 181507, "epoch": 2186} {"train_loss": -24.0771484375, "global_step": 181508, "epoch": 2186} {"train_loss": -23.953689575195312, "global_step": 181509, "epoch": 2186} {"train_loss": -23.42331314086914, "global_step": 181510, "epoch": 2186} {"train_loss": -23.85260581970215, "global_step": 181511, "epoch": 2186} {"train_loss": -24.11366081237793, "global_step": 181512, "epoch": 2186} {"train_loss": -23.444076538085938, "global_step": 181513, "epoch": 2186} {"train_loss": -23.670934677124023, "global_step": 181514, "epoch": 2186} {"train_loss": -23.828411102294922, "global_step": 181515, "epoch": 2186} {"train_loss": -23.731565475463867, "global_step": 181516, "epoch": 2186} {"train_loss": -23.758703231811523, "global_step": 181517, "epoch": 2186} {"train_loss": -23.633501052856445, "global_step": 181518, "epoch": 2186} {"train_loss": -23.8203125, "global_step": 181519, "epoch": 2186} {"train_loss": -23.868501824068737, "global_step": 181520, "epoch": 2186, "val_loss": 6344651.0} {"train_loss": -22.738351821899414, "global_step": 181521, "epoch": 2187} {"train_loss": -23.190433502197266, "global_step": 181522, "epoch": 2187} {"train_loss": -23.300291061401367, "global_step": 181523, "epoch": 2187} {"train_loss": -23.338104248046875, "global_step": 181524, "epoch": 2187} {"train_loss": -22.428678512573242, "global_step": 181525, "epoch": 2187} {"train_loss": -22.58272361755371, "global_step": 181526, "epoch": 2187} {"train_loss": -23.02765464782715, "global_step": 181527, "epoch": 2187} {"train_loss": -23.056875228881836, "global_step": 181528, "epoch": 2187} {"train_loss": -23.32162857055664, "global_step": 181529, "epoch": 2187} {"train_loss": -23.368806838989258, "global_step": 181530, "epoch": 2187} {"train_loss": -23.739639282226562, "global_step": 181531, "epoch": 2187} {"train_loss": -23.336538314819336, "global_step": 181532, "epoch": 2187} {"train_loss": -23.300811767578125, "global_step": 181533, "epoch": 2187} {"train_loss": -23.689851760864258, "global_step": 181534, "epoch": 2187} {"train_loss": -23.697546005249023, "global_step": 181535, "epoch": 2187} {"train_loss": -23.55865478515625, "global_step": 181536, "epoch": 2187} {"train_loss": -23.531673431396484, "global_step": 181537, "epoch": 2187} {"train_loss": -23.632999420166016, "global_step": 181538, "epoch": 2187} {"train_loss": -23.49773597717285, "global_step": 181539, "epoch": 2187} {"train_loss": -23.530969619750977, "global_step": 181540, "epoch": 2187} {"train_loss": -23.436491012573242, "global_step": 181541, "epoch": 2187} {"train_loss": -23.979902267456055, "global_step": 181542, "epoch": 2187} {"train_loss": -23.86688995361328, "global_step": 181543, "epoch": 2187} {"train_loss": -23.969459533691406, "global_step": 181544, "epoch": 2187} {"train_loss": -23.685043334960938, "global_step": 181545, "epoch": 2187} {"train_loss": -23.95911979675293, "global_step": 181546, "epoch": 2187} {"train_loss": -23.652326583862305, "global_step": 181547, "epoch": 2187} {"train_loss": -23.412433624267578, "global_step": 181548, "epoch": 2187} {"train_loss": -23.993925094604492, "global_step": 181549, "epoch": 2187} {"train_loss": -23.760526657104492, "global_step": 181550, "epoch": 2187} {"train_loss": -24.001636505126953, "global_step": 181551, "epoch": 2187} {"train_loss": -23.745397567749023, "global_step": 181552, "epoch": 2187} {"train_loss": -24.047361373901367, "global_step": 181553, "epoch": 2187} {"train_loss": -24.003881454467773, "global_step": 181554, "epoch": 2187} {"train_loss": -24.198856353759766, "global_step": 181555, "epoch": 2187} {"train_loss": -23.81072998046875, "global_step": 181556, "epoch": 2187} {"train_loss": -24.1811580657959, "global_step": 181557, "epoch": 2187} {"train_loss": -24.02976417541504, "global_step": 181558, "epoch": 2187} {"train_loss": -23.785947799682617, "global_step": 181559, "epoch": 2187} {"train_loss": -23.706350326538086, "global_step": 181560, "epoch": 2187} {"train_loss": -24.158218383789062, "global_step": 181561, "epoch": 2187} {"train_loss": -23.868915557861328, "global_step": 181562, "epoch": 2187} {"train_loss": -23.786157608032227, "global_step": 181563, "epoch": 2187} {"train_loss": -23.919570922851562, "global_step": 181564, "epoch": 2187} {"train_loss": -23.813528060913086, "global_step": 181565, "epoch": 2187} {"train_loss": -24.254072189331055, "global_step": 181566, "epoch": 2187} {"train_loss": -24.088462829589844, "global_step": 181567, "epoch": 2187} {"train_loss": -23.99876594543457, "global_step": 181568, "epoch": 2187} {"train_loss": -24.104562759399414, "global_step": 181569, "epoch": 2187} {"train_loss": -24.467864990234375, "global_step": 181570, "epoch": 2187} {"train_loss": -23.800676345825195, "global_step": 181571, "epoch": 2187} {"train_loss": -24.223154067993164, "global_step": 181572, "epoch": 2187} {"train_loss": -24.149309158325195, "global_step": 181573, "epoch": 2187} {"train_loss": -24.20830726623535, "global_step": 181574, "epoch": 2187} {"train_loss": -23.86012840270996, "global_step": 181575, "epoch": 2187} {"train_loss": -23.87430191040039, "global_step": 181576, "epoch": 2187} {"train_loss": -24.396038055419922, "global_step": 181577, "epoch": 2187} {"train_loss": -23.859756469726562, "global_step": 181578, "epoch": 2187} {"train_loss": -23.87004852294922, "global_step": 181579, "epoch": 2187} {"train_loss": -24.13225555419922, "global_step": 181580, "epoch": 2187} {"train_loss": -24.299589157104492, "global_step": 181581, "epoch": 2187} {"train_loss": -23.989978790283203, "global_step": 181582, "epoch": 2187} {"train_loss": -23.939130783081055, "global_step": 181583, "epoch": 2187} {"train_loss": -23.759817123413086, "global_step": 181584, "epoch": 2187} {"train_loss": -23.996009826660156, "global_step": 181585, "epoch": 2187} {"train_loss": -23.850574493408203, "global_step": 181586, "epoch": 2187} {"train_loss": -23.953216552734375, "global_step": 181587, "epoch": 2187} {"train_loss": -23.873987197875977, "global_step": 181588, "epoch": 2187} {"train_loss": -24.079755783081055, "global_step": 181589, "epoch": 2187} {"train_loss": -24.035945892333984, "global_step": 181590, "epoch": 2187} {"train_loss": -23.669017791748047, "global_step": 181591, "epoch": 2187} {"train_loss": -23.951745986938477, "global_step": 181592, "epoch": 2187} {"train_loss": -24.10675811767578, "global_step": 181593, "epoch": 2187} {"train_loss": -24.152780532836914, "global_step": 181594, "epoch": 2187} {"train_loss": -23.938247680664062, "global_step": 181595, "epoch": 2187} {"train_loss": -23.930389404296875, "global_step": 181596, "epoch": 2187} {"train_loss": -23.760419845581055, "global_step": 181597, "epoch": 2187} {"train_loss": -23.71363639831543, "global_step": 181598, "epoch": 2187} {"train_loss": -23.753128051757812, "global_step": 181599, "epoch": 2187} {"train_loss": -23.578950881958008, "global_step": 181600, "epoch": 2187} {"train_loss": -23.603784561157227, "global_step": 181601, "epoch": 2187} {"train_loss": -23.6087589263916, "global_step": 181602, "epoch": 2187} {"train_loss": -23.781202569065325, "global_step": 181603, "epoch": 2187, "val_loss": 6438734.0} {"train_loss": -23.919700622558594, "global_step": 181604, "epoch": 2188} {"train_loss": -23.568819046020508, "global_step": 181605, "epoch": 2188} {"train_loss": -23.28985023498535, "global_step": 181606, "epoch": 2188} {"train_loss": -23.554183959960938, "global_step": 181607, "epoch": 2188} {"train_loss": -23.512508392333984, "global_step": 181608, "epoch": 2188} {"train_loss": -23.509592056274414, "global_step": 181609, "epoch": 2188} {"train_loss": -23.184770584106445, "global_step": 181610, "epoch": 2188} {"train_loss": -23.41444969177246, "global_step": 181611, "epoch": 2188} {"train_loss": -23.402952194213867, "global_step": 181612, "epoch": 2188} {"train_loss": -24.004125595092773, "global_step": 181613, "epoch": 2188} {"train_loss": -23.91713523864746, "global_step": 181614, "epoch": 2188} {"train_loss": -23.711698532104492, "global_step": 181615, "epoch": 2188} {"train_loss": -23.678369522094727, "global_step": 181616, "epoch": 2188} {"train_loss": -23.46786117553711, "global_step": 181617, "epoch": 2188} {"train_loss": -23.95815086364746, "global_step": 181618, "epoch": 2188} {"train_loss": -23.58152198791504, "global_step": 181619, "epoch": 2188} {"train_loss": -23.41632652282715, "global_step": 181620, "epoch": 2188} {"train_loss": -23.738187789916992, "global_step": 181621, "epoch": 2188} {"train_loss": -23.710126876831055, "global_step": 181622, "epoch": 2188} {"train_loss": -23.655920028686523, "global_step": 181623, "epoch": 2188} {"train_loss": -23.809619903564453, "global_step": 181624, "epoch": 2188} {"train_loss": -23.65370750427246, "global_step": 181625, "epoch": 2188} {"train_loss": -23.766324996948242, "global_step": 181626, "epoch": 2188} {"train_loss": -23.334165573120117, "global_step": 181627, "epoch": 2188} {"train_loss": -23.880857467651367, "global_step": 181628, "epoch": 2188} {"train_loss": -23.724754333496094, "global_step": 181629, "epoch": 2188} {"train_loss": -23.724546432495117, "global_step": 181630, "epoch": 2188} {"train_loss": -23.893789291381836, "global_step": 181631, "epoch": 2188} {"train_loss": -23.47908592224121, "global_step": 181632, "epoch": 2188} {"train_loss": -23.938007354736328, "global_step": 181633, "epoch": 2188} {"train_loss": -23.573198318481445, "global_step": 181634, "epoch": 2188} {"train_loss": -23.618501663208008, "global_step": 181635, "epoch": 2188} {"train_loss": -23.877737045288086, "global_step": 181636, "epoch": 2188} {"train_loss": -23.70259666442871, "global_step": 181637, "epoch": 2188} {"train_loss": -23.81498908996582, "global_step": 181638, "epoch": 2188} {"train_loss": -24.0522403717041, "global_step": 181639, "epoch": 2188} {"train_loss": -24.15264320373535, "global_step": 181640, "epoch": 2188} {"train_loss": -23.781095504760742, "global_step": 181641, "epoch": 2188} {"train_loss": -23.88118553161621, "global_step": 181642, "epoch": 2188} {"train_loss": -23.788028717041016, "global_step": 181643, "epoch": 2188} {"train_loss": -24.015844345092773, "global_step": 181644, "epoch": 2188} {"train_loss": -23.861942291259766, "global_step": 181645, "epoch": 2188} {"train_loss": -23.76068687438965, "global_step": 181646, "epoch": 2188} {"train_loss": -24.092864990234375, "global_step": 181647, "epoch": 2188} {"train_loss": -24.02170753479004, "global_step": 181648, "epoch": 2188} {"train_loss": -23.77456283569336, "global_step": 181649, "epoch": 2188} {"train_loss": -23.745311737060547, "global_step": 181650, "epoch": 2188} {"train_loss": -24.00787353515625, "global_step": 181651, "epoch": 2188} {"train_loss": -23.840473175048828, "global_step": 181652, "epoch": 2188} {"train_loss": -24.25857925415039, "global_step": 181653, "epoch": 2188} {"train_loss": -24.026884078979492, "global_step": 181654, "epoch": 2188} {"train_loss": -23.973875045776367, "global_step": 181655, "epoch": 2188} {"train_loss": -24.210721969604492, "global_step": 181656, "epoch": 2188} {"train_loss": -24.041845321655273, "global_step": 181657, "epoch": 2188} {"train_loss": -23.690649032592773, "global_step": 181658, "epoch": 2188} {"train_loss": -23.872583389282227, "global_step": 181659, "epoch": 2188} {"train_loss": -24.26889991760254, "global_step": 181660, "epoch": 2188} {"train_loss": -24.022092819213867, "global_step": 181661, "epoch": 2188} {"train_loss": -24.167734146118164, "global_step": 181662, "epoch": 2188} {"train_loss": -24.141550064086914, "global_step": 181663, "epoch": 2188} {"train_loss": -23.756399154663086, "global_step": 181664, "epoch": 2188} {"train_loss": -23.614187240600586, "global_step": 181665, "epoch": 2188} {"train_loss": -24.01026725769043, "global_step": 181666, "epoch": 2188} {"train_loss": -24.112455368041992, "global_step": 181667, "epoch": 2188} {"train_loss": -24.123929977416992, "global_step": 181668, "epoch": 2188} {"train_loss": -24.051740646362305, "global_step": 181669, "epoch": 2188} {"train_loss": -24.327173233032227, "global_step": 181670, "epoch": 2188} {"train_loss": -23.88200569152832, "global_step": 181671, "epoch": 2188} {"train_loss": -24.070554733276367, "global_step": 181672, "epoch": 2188} {"train_loss": -24.058719635009766, "global_step": 181673, "epoch": 2188} {"train_loss": -23.859149932861328, "global_step": 181674, "epoch": 2188} {"train_loss": -23.964792251586914, "global_step": 181675, "epoch": 2188} {"train_loss": -23.670028686523438, "global_step": 181676, "epoch": 2188} {"train_loss": -24.23078727722168, "global_step": 181677, "epoch": 2188} {"train_loss": -24.13370132446289, "global_step": 181678, "epoch": 2188} {"train_loss": -24.22951316833496, "global_step": 181679, "epoch": 2188} {"train_loss": -23.90436363220215, "global_step": 181680, "epoch": 2188} {"train_loss": -24.051389694213867, "global_step": 181681, "epoch": 2188} {"train_loss": -24.020723342895508, "global_step": 181682, "epoch": 2188} {"train_loss": -23.982248306274414, "global_step": 181683, "epoch": 2188} {"train_loss": -24.110410690307617, "global_step": 181684, "epoch": 2188} {"train_loss": -23.915311813354492, "global_step": 181685, "epoch": 2188} {"train_loss": -23.855351298688404, "global_step": 181686, "epoch": 2188, "val_loss": 6436323.0} {"train_loss": -23.210420608520508, "global_step": 181687, "epoch": 2189} {"train_loss": -23.37762451171875, "global_step": 181688, "epoch": 2189} {"train_loss": -23.21240234375, "global_step": 181689, "epoch": 2189} {"train_loss": -23.69355583190918, "global_step": 181690, "epoch": 2189} {"train_loss": -23.553302764892578, "global_step": 181691, "epoch": 2189} {"train_loss": -23.197904586791992, "global_step": 181692, "epoch": 2189} {"train_loss": -24.032011032104492, "global_step": 181693, "epoch": 2189} {"train_loss": -23.353809356689453, "global_step": 181694, "epoch": 2189} {"train_loss": -23.174030303955078, "global_step": 181695, "epoch": 2189} {"train_loss": -23.574331283569336, "global_step": 181696, "epoch": 2189} {"train_loss": -23.784421920776367, "global_step": 181697, "epoch": 2189} {"train_loss": -23.903379440307617, "global_step": 181698, "epoch": 2189} {"train_loss": -23.644601821899414, "global_step": 181699, "epoch": 2189} {"train_loss": -23.723430633544922, "global_step": 181700, "epoch": 2189} {"train_loss": -23.97074317932129, "global_step": 181701, "epoch": 2189} {"train_loss": -24.146663665771484, "global_step": 181702, "epoch": 2189} {"train_loss": -24.034574508666992, "global_step": 181703, "epoch": 2189} {"train_loss": -24.03118324279785, "global_step": 181704, "epoch": 2189} {"train_loss": -23.86991310119629, "global_step": 181705, "epoch": 2189} {"train_loss": -23.938566207885742, "global_step": 181706, "epoch": 2189} {"train_loss": -23.969341278076172, "global_step": 181707, "epoch": 2189} {"train_loss": -24.0511531829834, "global_step": 181708, "epoch": 2189} {"train_loss": -24.048419952392578, "global_step": 181709, "epoch": 2189} {"train_loss": -23.64414405822754, "global_step": 181710, "epoch": 2189} {"train_loss": -24.133752822875977, "global_step": 181711, "epoch": 2189} {"train_loss": -23.698945999145508, "global_step": 181712, "epoch": 2189} {"train_loss": -23.543062210083008, "global_step": 181713, "epoch": 2189} {"train_loss": -23.939016342163086, "global_step": 181714, "epoch": 2189} {"train_loss": -24.24422264099121, "global_step": 181715, "epoch": 2189} {"train_loss": -24.075231552124023, "global_step": 181716, "epoch": 2189} {"train_loss": -24.403366088867188, "global_step": 181717, "epoch": 2189} {"train_loss": -23.640783309936523, "global_step": 181718, "epoch": 2189} {"train_loss": -24.070999145507812, "global_step": 181719, "epoch": 2189} {"train_loss": -23.699630737304688, "global_step": 181720, "epoch": 2189} {"train_loss": -23.788002014160156, "global_step": 181721, "epoch": 2189} {"train_loss": -23.550302505493164, "global_step": 181722, "epoch": 2189} {"train_loss": -23.834909439086914, "global_step": 181723, "epoch": 2189} {"train_loss": -23.901912689208984, "global_step": 181724, "epoch": 2189} {"train_loss": -23.825124740600586, "global_step": 181725, "epoch": 2189} {"train_loss": -23.505218505859375, "global_step": 181726, "epoch": 2189} {"train_loss": -23.327550888061523, "global_step": 181727, "epoch": 2189} {"train_loss": -23.793737411499023, "global_step": 181728, "epoch": 2189} {"train_loss": -23.576313018798828, "global_step": 181729, "epoch": 2189} {"train_loss": -23.68802833557129, "global_step": 181730, "epoch": 2189} {"train_loss": -23.829504013061523, "global_step": 181731, "epoch": 2189} {"train_loss": -23.56568145751953, "global_step": 181732, "epoch": 2189} {"train_loss": -23.514799118041992, "global_step": 181733, "epoch": 2189} {"train_loss": -23.809743881225586, "global_step": 181734, "epoch": 2189} {"train_loss": -23.86928367614746, "global_step": 181735, "epoch": 2189} {"train_loss": -23.41632080078125, "global_step": 181736, "epoch": 2189} {"train_loss": -23.814313888549805, "global_step": 181737, "epoch": 2189} {"train_loss": -23.64994239807129, "global_step": 181738, "epoch": 2189} {"train_loss": -23.833343505859375, "global_step": 181739, "epoch": 2189} {"train_loss": -23.816781997680664, "global_step": 181740, "epoch": 2189} {"train_loss": -23.61191749572754, "global_step": 181741, "epoch": 2189} {"train_loss": -24.361499786376953, "global_step": 181742, "epoch": 2189} {"train_loss": -23.730632781982422, "global_step": 181743, "epoch": 2189} {"train_loss": -23.889774322509766, "global_step": 181744, "epoch": 2189} {"train_loss": -23.55560302734375, "global_step": 181745, "epoch": 2189} {"train_loss": -24.322635650634766, "global_step": 181746, "epoch": 2189} {"train_loss": -23.889631271362305, "global_step": 181747, "epoch": 2189} {"train_loss": -23.864118576049805, "global_step": 181748, "epoch": 2189} {"train_loss": -23.985858917236328, "global_step": 181749, "epoch": 2189} {"train_loss": -24.0474796295166, "global_step": 181750, "epoch": 2189} {"train_loss": -23.92188262939453, "global_step": 181751, "epoch": 2189} {"train_loss": -23.956750869750977, "global_step": 181752, "epoch": 2189} {"train_loss": -24.107511520385742, "global_step": 181753, "epoch": 2189} {"train_loss": -24.1159725189209, "global_step": 181754, "epoch": 2189} {"train_loss": -23.77159309387207, "global_step": 181755, "epoch": 2189} {"train_loss": -23.762102127075195, "global_step": 181756, "epoch": 2189} {"train_loss": -24.109485626220703, "global_step": 181757, "epoch": 2189} {"train_loss": -24.076988220214844, "global_step": 181758, "epoch": 2189} {"train_loss": -23.76055908203125, "global_step": 181759, "epoch": 2189} {"train_loss": -23.80358123779297, "global_step": 181760, "epoch": 2189} {"train_loss": -23.64335060119629, "global_step": 181761, "epoch": 2189} {"train_loss": -23.4224796295166, "global_step": 181762, "epoch": 2189} {"train_loss": -23.864171981811523, "global_step": 181763, "epoch": 2189} {"train_loss": -24.229923248291016, "global_step": 181764, "epoch": 2189} {"train_loss": -23.421966552734375, "global_step": 181765, "epoch": 2189} {"train_loss": -23.88190269470215, "global_step": 181766, "epoch": 2189} {"train_loss": -23.701751708984375, "global_step": 181767, "epoch": 2189} {"train_loss": -23.456750869750977, "global_step": 181768, "epoch": 2189} {"train_loss": -23.79999186044716, "global_step": 181769, "epoch": 2189, "val_loss": 6441108.0} {"train_loss": -22.93667221069336, "global_step": 181770, "epoch": 2190} {"train_loss": -23.561281204223633, "global_step": 181771, "epoch": 2190} {"train_loss": -22.954633712768555, "global_step": 181772, "epoch": 2190} {"train_loss": -23.669998168945312, "global_step": 181773, "epoch": 2190} {"train_loss": -22.884719848632812, "global_step": 181774, "epoch": 2190} {"train_loss": -23.452367782592773, "global_step": 181775, "epoch": 2190} {"train_loss": -23.18459129333496, "global_step": 181776, "epoch": 2190} {"train_loss": -23.473142623901367, "global_step": 181777, "epoch": 2190} {"train_loss": -23.06297492980957, "global_step": 181778, "epoch": 2190} {"train_loss": -23.4082088470459, "global_step": 181779, "epoch": 2190} {"train_loss": -23.74641227722168, "global_step": 181780, "epoch": 2190} {"train_loss": -23.668853759765625, "global_step": 181781, "epoch": 2190} {"train_loss": -23.351232528686523, "global_step": 181782, "epoch": 2190} {"train_loss": -23.60186004638672, "global_step": 181783, "epoch": 2190} {"train_loss": -23.8293399810791, "global_step": 181784, "epoch": 2190} {"train_loss": -23.79715347290039, "global_step": 181785, "epoch": 2190} {"train_loss": -23.665512084960938, "global_step": 181786, "epoch": 2190} {"train_loss": -24.033838272094727, "global_step": 181787, "epoch": 2190} {"train_loss": -23.480316162109375, "global_step": 181788, "epoch": 2190} {"train_loss": -23.82192611694336, "global_step": 181789, "epoch": 2190} {"train_loss": -23.598154067993164, "global_step": 181790, "epoch": 2190} {"train_loss": -23.813024520874023, "global_step": 181791, "epoch": 2190} {"train_loss": -23.884611129760742, "global_step": 181792, "epoch": 2190} {"train_loss": -23.370267868041992, "global_step": 181793, "epoch": 2190} {"train_loss": -24.19758415222168, "global_step": 181794, "epoch": 2190} {"train_loss": -23.9495792388916, "global_step": 181795, "epoch": 2190} {"train_loss": -24.17717933654785, "global_step": 181796, "epoch": 2190} {"train_loss": -24.306127548217773, "global_step": 181797, "epoch": 2190} {"train_loss": -23.930965423583984, "global_step": 181798, "epoch": 2190} {"train_loss": -24.140914916992188, "global_step": 181799, "epoch": 2190} {"train_loss": -23.911346435546875, "global_step": 181800, "epoch": 2190} {"train_loss": -23.848634719848633, "global_step": 181801, "epoch": 2190} {"train_loss": -23.8806209564209, "global_step": 181802, "epoch": 2190} {"train_loss": -24.197477340698242, "global_step": 181803, "epoch": 2190} {"train_loss": -24.1428165435791, "global_step": 181804, "epoch": 2190} {"train_loss": -23.569866180419922, "global_step": 181805, "epoch": 2190} {"train_loss": -23.618398666381836, "global_step": 181806, "epoch": 2190} {"train_loss": -24.045669555664062, "global_step": 181807, "epoch": 2190} {"train_loss": -24.370038986206055, "global_step": 181808, "epoch": 2190} {"train_loss": -23.979284286499023, "global_step": 181809, "epoch": 2190} {"train_loss": -24.41973114013672, "global_step": 181810, "epoch": 2190} {"train_loss": -24.242511749267578, "global_step": 181811, "epoch": 2190} {"train_loss": -23.65700340270996, "global_step": 181812, "epoch": 2190} {"train_loss": -24.173643112182617, "global_step": 181813, "epoch": 2190} {"train_loss": -24.09939956665039, "global_step": 181814, "epoch": 2190} {"train_loss": -23.668283462524414, "global_step": 181815, "epoch": 2190} {"train_loss": -23.815282821655273, "global_step": 181816, "epoch": 2190} {"train_loss": -23.8177547454834, "global_step": 181817, "epoch": 2190} {"train_loss": -23.649961471557617, "global_step": 181818, "epoch": 2190} {"train_loss": -23.694076538085938, "global_step": 181819, "epoch": 2190} {"train_loss": -24.021774291992188, "global_step": 181820, "epoch": 2190} {"train_loss": -23.887714385986328, "global_step": 181821, "epoch": 2190} {"train_loss": -23.298755645751953, "global_step": 181822, "epoch": 2190} {"train_loss": -23.132314682006836, "global_step": 181823, "epoch": 2190} {"train_loss": -23.737585067749023, "global_step": 181824, "epoch": 2190} {"train_loss": -23.57821273803711, "global_step": 181825, "epoch": 2190} {"train_loss": -23.29166030883789, "global_step": 181826, "epoch": 2190} {"train_loss": -24.175384521484375, "global_step": 181827, "epoch": 2190} {"train_loss": -23.296695709228516, "global_step": 181828, "epoch": 2190} {"train_loss": -23.3468074798584, "global_step": 181829, "epoch": 2190} {"train_loss": -23.903474807739258, "global_step": 181830, "epoch": 2190} {"train_loss": -23.827619552612305, "global_step": 181831, "epoch": 2190} {"train_loss": -23.8419246673584, "global_step": 181832, "epoch": 2190} {"train_loss": -23.870084762573242, "global_step": 181833, "epoch": 2190} {"train_loss": -24.03287124633789, "global_step": 181834, "epoch": 2190} {"train_loss": -24.149179458618164, "global_step": 181835, "epoch": 2190} {"train_loss": -24.001882553100586, "global_step": 181836, "epoch": 2190} {"train_loss": -23.854143142700195, "global_step": 181837, "epoch": 2190} {"train_loss": -23.984830856323242, "global_step": 181838, "epoch": 2190} {"train_loss": -24.022062301635742, "global_step": 181839, "epoch": 2190} {"train_loss": -23.80671501159668, "global_step": 181840, "epoch": 2190} {"train_loss": -23.869972229003906, "global_step": 181841, "epoch": 2190} {"train_loss": -23.809375762939453, "global_step": 181842, "epoch": 2190} {"train_loss": -24.106082916259766, "global_step": 181843, "epoch": 2190} {"train_loss": -23.76348304748535, "global_step": 181844, "epoch": 2190} {"train_loss": -23.967409133911133, "global_step": 181845, "epoch": 2190} {"train_loss": -23.90834617614746, "global_step": 181846, "epoch": 2190} {"train_loss": -23.489362716674805, "global_step": 181847, "epoch": 2190} {"train_loss": -23.945398330688477, "global_step": 181848, "epoch": 2190} {"train_loss": -23.97402000427246, "global_step": 181849, "epoch": 2190} {"train_loss": -23.601821899414062, "global_step": 181850, "epoch": 2190} {"train_loss": -24.316862106323242, "global_step": 181851, "epoch": 2190} {"train_loss": -23.785063134618554, "global_step": 181852, "epoch": 2190, "val_loss": 6501973.0} {"train_loss": -23.78948402404785, "global_step": 181853, "epoch": 2191} {"train_loss": -24.132320404052734, "global_step": 181854, "epoch": 2191} {"train_loss": -23.705854415893555, "global_step": 181855, "epoch": 2191} {"train_loss": -23.943395614624023, "global_step": 181856, "epoch": 2191} {"train_loss": -23.892683029174805, "global_step": 181857, "epoch": 2191} {"train_loss": -23.735258102416992, "global_step": 181858, "epoch": 2191} {"train_loss": -23.860538482666016, "global_step": 181859, "epoch": 2191} {"train_loss": -23.39151382446289, "global_step": 181860, "epoch": 2191} {"train_loss": -23.252504348754883, "global_step": 181861, "epoch": 2191} {"train_loss": -23.546676635742188, "global_step": 181862, "epoch": 2191} {"train_loss": -23.720809936523438, "global_step": 181863, "epoch": 2191} {"train_loss": -23.834280014038086, "global_step": 181864, "epoch": 2191} {"train_loss": -23.874191284179688, "global_step": 181865, "epoch": 2191} {"train_loss": -24.144058227539062, "global_step": 181866, "epoch": 2191} {"train_loss": -23.72127342224121, "global_step": 181867, "epoch": 2191} {"train_loss": -24.134321212768555, "global_step": 181868, "epoch": 2191} {"train_loss": -23.732160568237305, "global_step": 181869, "epoch": 2191} {"train_loss": -23.932632446289062, "global_step": 181870, "epoch": 2191} {"train_loss": -23.530261993408203, "global_step": 181871, "epoch": 2191} {"train_loss": -24.222217559814453, "global_step": 181872, "epoch": 2191} {"train_loss": -23.69819450378418, "global_step": 181873, "epoch": 2191} {"train_loss": -24.036396026611328, "global_step": 181874, "epoch": 2191} {"train_loss": -23.613615036010742, "global_step": 181875, "epoch": 2191} {"train_loss": -23.998140335083008, "global_step": 181876, "epoch": 2191} {"train_loss": -23.82613754272461, "global_step": 181877, "epoch": 2191} {"train_loss": -23.704490661621094, "global_step": 181878, "epoch": 2191} {"train_loss": -24.23318099975586, "global_step": 181879, "epoch": 2191} {"train_loss": -24.042409896850586, "global_step": 181880, "epoch": 2191} {"train_loss": -23.657718658447266, "global_step": 181881, "epoch": 2191} {"train_loss": -23.82843589782715, "global_step": 181882, "epoch": 2191} {"train_loss": -23.520273208618164, "global_step": 181883, "epoch": 2191} {"train_loss": -23.859268188476562, "global_step": 181884, "epoch": 2191} {"train_loss": -23.4542293548584, "global_step": 181885, "epoch": 2191} {"train_loss": -23.709232330322266, "global_step": 181886, "epoch": 2191} {"train_loss": -23.625564575195312, "global_step": 181887, "epoch": 2191} {"train_loss": -24.083026885986328, "global_step": 181888, "epoch": 2191} {"train_loss": -23.91827392578125, "global_step": 181889, "epoch": 2191} {"train_loss": -23.70672607421875, "global_step": 181890, "epoch": 2191} {"train_loss": -23.931865692138672, "global_step": 181891, "epoch": 2191} {"train_loss": -23.748655319213867, "global_step": 181892, "epoch": 2191} {"train_loss": -23.83243751525879, "global_step": 181893, "epoch": 2191} {"train_loss": -24.095767974853516, "global_step": 181894, "epoch": 2191} {"train_loss": -23.957504272460938, "global_step": 181895, "epoch": 2191} {"train_loss": -23.942848205566406, "global_step": 181896, "epoch": 2191} {"train_loss": -23.835317611694336, "global_step": 181897, "epoch": 2191} {"train_loss": -24.19173240661621, "global_step": 181898, "epoch": 2191} {"train_loss": -23.9315128326416, "global_step": 181899, "epoch": 2191} {"train_loss": -23.681720733642578, "global_step": 181900, "epoch": 2191} {"train_loss": -24.147262573242188, "global_step": 181901, "epoch": 2191} {"train_loss": -23.729808807373047, "global_step": 181902, "epoch": 2191} {"train_loss": -23.592748641967773, "global_step": 181903, "epoch": 2191} {"train_loss": -24.12095069885254, "global_step": 181904, "epoch": 2191} {"train_loss": -23.87867546081543, "global_step": 181905, "epoch": 2191} {"train_loss": -23.794279098510742, "global_step": 181906, "epoch": 2191} {"train_loss": -24.000791549682617, "global_step": 181907, "epoch": 2191} {"train_loss": -23.792316436767578, "global_step": 181908, "epoch": 2191} {"train_loss": -23.90357208251953, "global_step": 181909, "epoch": 2191} {"train_loss": -23.591222763061523, "global_step": 181910, "epoch": 2191} {"train_loss": -23.595279693603516, "global_step": 181911, "epoch": 2191} {"train_loss": -24.021535873413086, "global_step": 181912, "epoch": 2191} {"train_loss": -23.87909507751465, "global_step": 181913, "epoch": 2191} {"train_loss": -23.73430633544922, "global_step": 181914, "epoch": 2191} {"train_loss": -23.87746238708496, "global_step": 181915, "epoch": 2191} {"train_loss": -23.9342041015625, "global_step": 181916, "epoch": 2191} {"train_loss": -23.646787643432617, "global_step": 181917, "epoch": 2191} {"train_loss": -24.13762855529785, "global_step": 181918, "epoch": 2191} {"train_loss": -23.835765838623047, "global_step": 181919, "epoch": 2191} {"train_loss": -23.755632400512695, "global_step": 181920, "epoch": 2191} {"train_loss": -24.03859519958496, "global_step": 181921, "epoch": 2191} {"train_loss": -23.943140029907227, "global_step": 181922, "epoch": 2191} {"train_loss": -23.914846420288086, "global_step": 181923, "epoch": 2191} {"train_loss": -23.996427536010742, "global_step": 181924, "epoch": 2191} {"train_loss": -23.6321964263916, "global_step": 181925, "epoch": 2191} {"train_loss": -24.386186599731445, "global_step": 181926, "epoch": 2191} {"train_loss": -23.903608322143555, "global_step": 181927, "epoch": 2191} {"train_loss": -23.57842445373535, "global_step": 181928, "epoch": 2191} {"train_loss": -24.18330192565918, "global_step": 181929, "epoch": 2191} {"train_loss": -23.9294376373291, "global_step": 181930, "epoch": 2191} {"train_loss": -23.905202865600586, "global_step": 181931, "epoch": 2191} {"train_loss": -23.940534591674805, "global_step": 181932, "epoch": 2191} {"train_loss": -23.804059982299805, "global_step": 181933, "epoch": 2191} {"train_loss": -23.821735382080078, "global_step": 181934, "epoch": 2191} {"train_loss": -23.850911289812572, "global_step": 181935, "epoch": 2191, "val_loss": 6455301.0} {"train_loss": -23.65117835998535, "global_step": 181936, "epoch": 2192} {"train_loss": -23.93902015686035, "global_step": 181937, "epoch": 2192} {"train_loss": -23.726123809814453, "global_step": 181938, "epoch": 2192} {"train_loss": -23.98292350769043, "global_step": 181939, "epoch": 2192} {"train_loss": -23.568632125854492, "global_step": 181940, "epoch": 2192} {"train_loss": -23.68868637084961, "global_step": 181941, "epoch": 2192} {"train_loss": -23.95311164855957, "global_step": 181942, "epoch": 2192} {"train_loss": -23.60743522644043, "global_step": 181943, "epoch": 2192} {"train_loss": -23.755615234375, "global_step": 181944, "epoch": 2192} {"train_loss": -24.137407302856445, "global_step": 181945, "epoch": 2192} {"train_loss": -23.292211532592773, "global_step": 181946, "epoch": 2192} {"train_loss": -23.695423126220703, "global_step": 181947, "epoch": 2192} {"train_loss": -24.018978118896484, "global_step": 181948, "epoch": 2192} {"train_loss": -23.516000747680664, "global_step": 181949, "epoch": 2192} {"train_loss": -24.405574798583984, "global_step": 181950, "epoch": 2192} {"train_loss": -23.72041130065918, "global_step": 181951, "epoch": 2192} {"train_loss": -23.979719161987305, "global_step": 181952, "epoch": 2192} {"train_loss": -24.001611709594727, "global_step": 181953, "epoch": 2192} {"train_loss": -24.022571563720703, "global_step": 181954, "epoch": 2192} {"train_loss": -24.058473587036133, "global_step": 181955, "epoch": 2192} {"train_loss": -24.0360164642334, "global_step": 181956, "epoch": 2192} {"train_loss": -24.228185653686523, "global_step": 181957, "epoch": 2192} {"train_loss": -23.72981071472168, "global_step": 181958, "epoch": 2192} {"train_loss": -24.022674560546875, "global_step": 181959, "epoch": 2192} {"train_loss": -23.902769088745117, "global_step": 181960, "epoch": 2192} {"train_loss": -23.442031860351562, "global_step": 181961, "epoch": 2192} {"train_loss": -23.63724708557129, "global_step": 181962, "epoch": 2192} {"train_loss": -24.0898494720459, "global_step": 181963, "epoch": 2192} {"train_loss": -23.99048614501953, "global_step": 181964, "epoch": 2192} {"train_loss": -23.789331436157227, "global_step": 181965, "epoch": 2192} {"train_loss": -24.534130096435547, "global_step": 181966, "epoch": 2192} {"train_loss": -23.975454330444336, "global_step": 181967, "epoch": 2192} {"train_loss": -24.008769989013672, "global_step": 181968, "epoch": 2192} {"train_loss": -23.993927001953125, "global_step": 181969, "epoch": 2192} {"train_loss": -24.104984283447266, "global_step": 181970, "epoch": 2192} {"train_loss": -24.13340187072754, "global_step": 181971, "epoch": 2192} {"train_loss": -23.52435302734375, "global_step": 181972, "epoch": 2192} {"train_loss": -24.45342445373535, "global_step": 181973, "epoch": 2192} {"train_loss": -24.1909236907959, "global_step": 181974, "epoch": 2192} {"train_loss": -23.931447982788086, "global_step": 181975, "epoch": 2192} {"train_loss": -23.854843139648438, "global_step": 181976, "epoch": 2192} {"train_loss": -23.718595504760742, "global_step": 181977, "epoch": 2192} {"train_loss": -24.327333450317383, "global_step": 181978, "epoch": 2192} {"train_loss": -24.213850021362305, "global_step": 181979, "epoch": 2192} {"train_loss": -23.968158721923828, "global_step": 181980, "epoch": 2192} {"train_loss": -23.876060485839844, "global_step": 181981, "epoch": 2192} {"train_loss": -24.08558464050293, "global_step": 181982, "epoch": 2192} {"train_loss": -23.93845558166504, "global_step": 181983, "epoch": 2192} {"train_loss": -24.123483657836914, "global_step": 181984, "epoch": 2192} {"train_loss": -23.73799705505371, "global_step": 181985, "epoch": 2192} {"train_loss": -23.87270164489746, "global_step": 181986, "epoch": 2192} {"train_loss": -24.135488510131836, "global_step": 181987, "epoch": 2192} {"train_loss": -23.624906539916992, "global_step": 181988, "epoch": 2192} {"train_loss": -23.611286163330078, "global_step": 181989, "epoch": 2192} {"train_loss": -23.870603561401367, "global_step": 181990, "epoch": 2192} {"train_loss": -24.119003295898438, "global_step": 181991, "epoch": 2192} {"train_loss": -24.051883697509766, "global_step": 181992, "epoch": 2192} {"train_loss": -23.862272262573242, "global_step": 181993, "epoch": 2192} {"train_loss": -23.759756088256836, "global_step": 181994, "epoch": 2192} {"train_loss": -24.239337921142578, "global_step": 181995, "epoch": 2192} {"train_loss": -24.109224319458008, "global_step": 181996, "epoch": 2192} {"train_loss": -23.819931030273438, "global_step": 181997, "epoch": 2192} {"train_loss": -24.13795280456543, "global_step": 181998, "epoch": 2192} {"train_loss": -24.072208404541016, "global_step": 181999, "epoch": 2192} {"train_loss": -24.180051803588867, "global_step": 182000, "epoch": 2192} {"train_loss": -24.16856575012207, "global_step": 182001, "epoch": 2192} {"train_loss": -24.057287216186523, "global_step": 182002, "epoch": 2192} {"train_loss": -23.95958137512207, "global_step": 182003, "epoch": 2192} {"train_loss": -24.044189453125, "global_step": 182004, "epoch": 2192} {"train_loss": -23.648794174194336, "global_step": 182005, "epoch": 2192} {"train_loss": -23.654138565063477, "global_step": 182006, "epoch": 2192} {"train_loss": -23.774612426757812, "global_step": 182007, "epoch": 2192} {"train_loss": -23.782245635986328, "global_step": 182008, "epoch": 2192} {"train_loss": -24.051803588867188, "global_step": 182009, "epoch": 2192} {"train_loss": -24.134464263916016, "global_step": 182010, "epoch": 2192} {"train_loss": -23.621122360229492, "global_step": 182011, "epoch": 2192} {"train_loss": -24.154382705688477, "global_step": 182012, "epoch": 2192} {"train_loss": -24.09521484375, "global_step": 182013, "epoch": 2192} {"train_loss": -23.821691513061523, "global_step": 182014, "epoch": 2192} {"train_loss": -23.681930541992188, "global_step": 182015, "epoch": 2192} {"train_loss": -23.60750389099121, "global_step": 182016, "epoch": 2192} {"train_loss": -23.813997268676758, "global_step": 182017, "epoch": 2192} {"train_loss": -23.921358614082795, "global_step": 182018, "epoch": 2192, "val_loss": 6526695.0} {"train_loss": -23.220685958862305, "global_step": 182019, "epoch": 2193} {"train_loss": -23.160093307495117, "global_step": 182020, "epoch": 2193} {"train_loss": -22.342103958129883, "global_step": 182021, "epoch": 2193} {"train_loss": -22.86920738220215, "global_step": 182022, "epoch": 2193} {"train_loss": -22.834918975830078, "global_step": 182023, "epoch": 2193} {"train_loss": -23.08936882019043, "global_step": 182024, "epoch": 2193} {"train_loss": -23.584070205688477, "global_step": 182025, "epoch": 2193} {"train_loss": -22.764389038085938, "global_step": 182026, "epoch": 2193} {"train_loss": -23.33611488342285, "global_step": 182027, "epoch": 2193} {"train_loss": -23.288320541381836, "global_step": 182028, "epoch": 2193} {"train_loss": -23.49992561340332, "global_step": 182029, "epoch": 2193} {"train_loss": -23.2899169921875, "global_step": 182030, "epoch": 2193} {"train_loss": -22.972049713134766, "global_step": 182031, "epoch": 2193} {"train_loss": -23.309234619140625, "global_step": 182032, "epoch": 2193} {"train_loss": -23.42074203491211, "global_step": 182033, "epoch": 2193} {"train_loss": -23.803125381469727, "global_step": 182034, "epoch": 2193} {"train_loss": -23.6402530670166, "global_step": 182035, "epoch": 2193} {"train_loss": -23.74241065979004, "global_step": 182036, "epoch": 2193} {"train_loss": -23.85596466064453, "global_step": 182037, "epoch": 2193} {"train_loss": -23.375898361206055, "global_step": 182038, "epoch": 2193} {"train_loss": -23.66260528564453, "global_step": 182039, "epoch": 2193} {"train_loss": -23.332021713256836, "global_step": 182040, "epoch": 2193} {"train_loss": -23.670501708984375, "global_step": 182041, "epoch": 2193} {"train_loss": -23.5393009185791, "global_step": 182042, "epoch": 2193} {"train_loss": -23.478836059570312, "global_step": 182043, "epoch": 2193} {"train_loss": -23.451871871948242, "global_step": 182044, "epoch": 2193} {"train_loss": -23.721904754638672, "global_step": 182045, "epoch": 2193} {"train_loss": -23.6081485748291, "global_step": 182046, "epoch": 2193} {"train_loss": -24.05672264099121, "global_step": 182047, "epoch": 2193} {"train_loss": -23.601776123046875, "global_step": 182048, "epoch": 2193} {"train_loss": -23.793180465698242, "global_step": 182049, "epoch": 2193} {"train_loss": -23.88728904724121, "global_step": 182050, "epoch": 2193} {"train_loss": -23.797832489013672, "global_step": 182051, "epoch": 2193} {"train_loss": -23.685232162475586, "global_step": 182052, "epoch": 2193} {"train_loss": -23.59103012084961, "global_step": 182053, "epoch": 2193} {"train_loss": -23.97966957092285, "global_step": 182054, "epoch": 2193} {"train_loss": -23.58345603942871, "global_step": 182055, "epoch": 2193} {"train_loss": -23.58461570739746, "global_step": 182056, "epoch": 2193} {"train_loss": -23.91424560546875, "global_step": 182057, "epoch": 2193} {"train_loss": -23.556638717651367, "global_step": 182058, "epoch": 2193} {"train_loss": -24.017044067382812, "global_step": 182059, "epoch": 2193} {"train_loss": -23.610532760620117, "global_step": 182060, "epoch": 2193} {"train_loss": -23.83243751525879, "global_step": 182061, "epoch": 2193} {"train_loss": -23.933835983276367, "global_step": 182062, "epoch": 2193} {"train_loss": -23.512985229492188, "global_step": 182063, "epoch": 2193} {"train_loss": -24.225866317749023, "global_step": 182064, "epoch": 2193} {"train_loss": -23.72244644165039, "global_step": 182065, "epoch": 2193} {"train_loss": -23.912649154663086, "global_step": 182066, "epoch": 2193} {"train_loss": -24.16424560546875, "global_step": 182067, "epoch": 2193} {"train_loss": -23.972253799438477, "global_step": 182068, "epoch": 2193} {"train_loss": -23.843061447143555, "global_step": 182069, "epoch": 2193} {"train_loss": -23.852815628051758, "global_step": 182070, "epoch": 2193} {"train_loss": -23.77516746520996, "global_step": 182071, "epoch": 2193} {"train_loss": -24.13214111328125, "global_step": 182072, "epoch": 2193} {"train_loss": -24.21925926208496, "global_step": 182073, "epoch": 2193} {"train_loss": -23.898733139038086, "global_step": 182074, "epoch": 2193} {"train_loss": -24.10867691040039, "global_step": 182075, "epoch": 2193} {"train_loss": -23.977821350097656, "global_step": 182076, "epoch": 2193} {"train_loss": -23.946081161499023, "global_step": 182077, "epoch": 2193} {"train_loss": -23.9248104095459, "global_step": 182078, "epoch": 2193} {"train_loss": -23.94400405883789, "global_step": 182079, "epoch": 2193} {"train_loss": -24.20153045654297, "global_step": 182080, "epoch": 2193} {"train_loss": -24.205678939819336, "global_step": 182081, "epoch": 2193} {"train_loss": -24.430889129638672, "global_step": 182082, "epoch": 2193} {"train_loss": -24.272357940673828, "global_step": 182083, "epoch": 2193} {"train_loss": -23.835607528686523, "global_step": 182084, "epoch": 2193} {"train_loss": -23.812618255615234, "global_step": 182085, "epoch": 2193} {"train_loss": -23.776227951049805, "global_step": 182086, "epoch": 2193} {"train_loss": -24.082321166992188, "global_step": 182087, "epoch": 2193} {"train_loss": -24.1916446685791, "global_step": 182088, "epoch": 2193} {"train_loss": -24.13511085510254, "global_step": 182089, "epoch": 2193} {"train_loss": -24.18983268737793, "global_step": 182090, "epoch": 2193} {"train_loss": -24.079803466796875, "global_step": 182091, "epoch": 2193} {"train_loss": -24.25240707397461, "global_step": 182092, "epoch": 2193} {"train_loss": -24.329801559448242, "global_step": 182093, "epoch": 2193} {"train_loss": -24.157962799072266, "global_step": 182094, "epoch": 2193} {"train_loss": -23.802480697631836, "global_step": 182095, "epoch": 2193} {"train_loss": -23.921823501586914, "global_step": 182096, "epoch": 2193} {"train_loss": -23.60780143737793, "global_step": 182097, "epoch": 2193} {"train_loss": -23.839435577392578, "global_step": 182098, "epoch": 2193} {"train_loss": -24.11433982849121, "global_step": 182099, "epoch": 2193} {"train_loss": -23.730222702026367, "global_step": 182100, "epoch": 2193} {"train_loss": -23.74767337936953, "global_step": 182101, "epoch": 2193, "val_loss": 6543636.0} {"train_loss": -21.683080673217773, "global_step": 182102, "epoch": 2194} {"train_loss": -22.078168869018555, "global_step": 182103, "epoch": 2194} {"train_loss": -22.828840255737305, "global_step": 182104, "epoch": 2194} {"train_loss": -22.42562484741211, "global_step": 182105, "epoch": 2194} {"train_loss": -22.760929107666016, "global_step": 182106, "epoch": 2194} {"train_loss": -22.912689208984375, "global_step": 182107, "epoch": 2194} {"train_loss": -22.927541732788086, "global_step": 182108, "epoch": 2194} {"train_loss": -22.74629020690918, "global_step": 182109, "epoch": 2194} {"train_loss": -22.840959548950195, "global_step": 182110, "epoch": 2194} {"train_loss": -22.77765655517578, "global_step": 182111, "epoch": 2194} {"train_loss": -22.912446975708008, "global_step": 182112, "epoch": 2194} {"train_loss": -22.829784393310547, "global_step": 182113, "epoch": 2194} {"train_loss": -22.87566375732422, "global_step": 182114, "epoch": 2194} {"train_loss": -23.774648666381836, "global_step": 182115, "epoch": 2194} {"train_loss": -22.731491088867188, "global_step": 182116, "epoch": 2194} {"train_loss": -23.43985939025879, "global_step": 182117, "epoch": 2194} {"train_loss": -23.024320602416992, "global_step": 182118, "epoch": 2194} {"train_loss": -23.10999870300293, "global_step": 182119, "epoch": 2194} {"train_loss": -22.922391891479492, "global_step": 182120, "epoch": 2194} {"train_loss": -22.95420265197754, "global_step": 182121, "epoch": 2194} {"train_loss": -23.361581802368164, "global_step": 182122, "epoch": 2194} {"train_loss": -22.92967414855957, "global_step": 182123, "epoch": 2194} {"train_loss": -23.165748596191406, "global_step": 182124, "epoch": 2194} {"train_loss": -23.486534118652344, "global_step": 182125, "epoch": 2194} {"train_loss": -23.649730682373047, "global_step": 182126, "epoch": 2194} {"train_loss": -23.53411102294922, "global_step": 182127, "epoch": 2194} {"train_loss": -23.42988395690918, "global_step": 182128, "epoch": 2194} {"train_loss": -23.49277687072754, "global_step": 182129, "epoch": 2194} {"train_loss": -23.463695526123047, "global_step": 182130, "epoch": 2194} {"train_loss": -23.569896697998047, "global_step": 182131, "epoch": 2194} {"train_loss": -23.747602462768555, "global_step": 182132, "epoch": 2194} {"train_loss": -23.563047409057617, "global_step": 182133, "epoch": 2194} {"train_loss": -23.89068603515625, "global_step": 182134, "epoch": 2194} {"train_loss": -23.573158264160156, "global_step": 182135, "epoch": 2194} {"train_loss": -23.82050323486328, "global_step": 182136, "epoch": 2194} {"train_loss": -23.83552360534668, "global_step": 182137, "epoch": 2194} {"train_loss": -23.4459285736084, "global_step": 182138, "epoch": 2194} {"train_loss": -23.77416229248047, "global_step": 182139, "epoch": 2194} {"train_loss": -23.763731002807617, "global_step": 182140, "epoch": 2194} {"train_loss": -24.02819061279297, "global_step": 182141, "epoch": 2194} {"train_loss": -23.879789352416992, "global_step": 182142, "epoch": 2194} {"train_loss": -24.227964401245117, "global_step": 182143, "epoch": 2194} {"train_loss": -24.2878360748291, "global_step": 182144, "epoch": 2194} {"train_loss": -23.82684898376465, "global_step": 182145, "epoch": 2194} {"train_loss": -24.04677391052246, "global_step": 182146, "epoch": 2194} {"train_loss": -23.84100914001465, "global_step": 182147, "epoch": 2194} {"train_loss": -24.416467666625977, "global_step": 182148, "epoch": 2194} {"train_loss": -23.892553329467773, "global_step": 182149, "epoch": 2194} {"train_loss": -23.7320499420166, "global_step": 182150, "epoch": 2194} {"train_loss": -23.9143009185791, "global_step": 182151, "epoch": 2194} {"train_loss": -23.984790802001953, "global_step": 182152, "epoch": 2194} {"train_loss": -24.16073226928711, "global_step": 182153, "epoch": 2194} {"train_loss": -23.94260597229004, "global_step": 182154, "epoch": 2194} {"train_loss": -23.91200828552246, "global_step": 182155, "epoch": 2194} {"train_loss": -24.008068084716797, "global_step": 182156, "epoch": 2194} {"train_loss": -24.28852653503418, "global_step": 182157, "epoch": 2194} {"train_loss": -23.90730094909668, "global_step": 182158, "epoch": 2194} {"train_loss": -24.300586700439453, "global_step": 182159, "epoch": 2194} {"train_loss": -23.895998001098633, "global_step": 182160, "epoch": 2194} {"train_loss": -24.032133102416992, "global_step": 182161, "epoch": 2194} {"train_loss": -24.147003173828125, "global_step": 182162, "epoch": 2194} {"train_loss": -24.43900489807129, "global_step": 182163, "epoch": 2194} {"train_loss": -23.758268356323242, "global_step": 182164, "epoch": 2194} {"train_loss": -24.30386734008789, "global_step": 182165, "epoch": 2194} {"train_loss": -23.777620315551758, "global_step": 182166, "epoch": 2194} {"train_loss": -24.217153549194336, "global_step": 182167, "epoch": 2194} {"train_loss": -23.835128784179688, "global_step": 182168, "epoch": 2194} {"train_loss": -23.92055320739746, "global_step": 182169, "epoch": 2194} {"train_loss": -23.490026473999023, "global_step": 182170, "epoch": 2194} {"train_loss": -23.451398849487305, "global_step": 182171, "epoch": 2194} {"train_loss": -23.430391311645508, "global_step": 182172, "epoch": 2194} {"train_loss": -23.6708984375, "global_step": 182173, "epoch": 2194} {"train_loss": -24.187339782714844, "global_step": 182174, "epoch": 2194} {"train_loss": -23.953123092651367, "global_step": 182175, "epoch": 2194} {"train_loss": -23.938074111938477, "global_step": 182176, "epoch": 2194} {"train_loss": -24.016944885253906, "global_step": 182177, "epoch": 2194} {"train_loss": -23.448951721191406, "global_step": 182178, "epoch": 2194} {"train_loss": -23.554197311401367, "global_step": 182179, "epoch": 2194} {"train_loss": -24.007272720336914, "global_step": 182180, "epoch": 2194} {"train_loss": -24.050092697143555, "global_step": 182181, "epoch": 2194} {"train_loss": -23.487146377563477, "global_step": 182182, "epoch": 2194} {"train_loss": -24.012205123901367, "global_step": 182183, "epoch": 2194} {"train_loss": -23.599393453942724, "global_step": 182184, "epoch": 2194, "val_loss": 6438960.0} {"train_loss": -22.879117965698242, "global_step": 182185, "epoch": 2195} {"train_loss": -23.663373947143555, "global_step": 182186, "epoch": 2195} {"train_loss": -23.546106338500977, "global_step": 182187, "epoch": 2195} {"train_loss": -23.64912223815918, "global_step": 182188, "epoch": 2195} {"train_loss": -23.794336318969727, "global_step": 182189, "epoch": 2195} {"train_loss": -23.65382194519043, "global_step": 182190, "epoch": 2195} {"train_loss": -23.805776596069336, "global_step": 182191, "epoch": 2195} {"train_loss": -23.883420944213867, "global_step": 182192, "epoch": 2195} {"train_loss": -23.431964874267578, "global_step": 182193, "epoch": 2195} {"train_loss": -23.588258743286133, "global_step": 182194, "epoch": 2195} {"train_loss": -23.312910079956055, "global_step": 182195, "epoch": 2195} {"train_loss": -23.8598690032959, "global_step": 182196, "epoch": 2195} {"train_loss": -23.624099731445312, "global_step": 182197, "epoch": 2195} {"train_loss": -23.4697322845459, "global_step": 182198, "epoch": 2195} {"train_loss": -23.468774795532227, "global_step": 182199, "epoch": 2195} {"train_loss": -23.382667541503906, "global_step": 182200, "epoch": 2195} {"train_loss": -23.718101501464844, "global_step": 182201, "epoch": 2195} {"train_loss": -23.754520416259766, "global_step": 182202, "epoch": 2195} {"train_loss": -23.78143882751465, "global_step": 182203, "epoch": 2195} {"train_loss": -23.66286277770996, "global_step": 182204, "epoch": 2195} {"train_loss": -23.892431259155273, "global_step": 182205, "epoch": 2195} {"train_loss": -23.54481315612793, "global_step": 182206, "epoch": 2195} {"train_loss": -23.84341812133789, "global_step": 182207, "epoch": 2195} {"train_loss": -23.571243286132812, "global_step": 182208, "epoch": 2195} {"train_loss": -23.51679039001465, "global_step": 182209, "epoch": 2195} {"train_loss": -23.64554214477539, "global_step": 182210, "epoch": 2195} {"train_loss": -23.868268966674805, "global_step": 182211, "epoch": 2195} {"train_loss": -24.05069923400879, "global_step": 182212, "epoch": 2195} {"train_loss": -24.12764549255371, "global_step": 182213, "epoch": 2195} {"train_loss": -23.90871810913086, "global_step": 182214, "epoch": 2195} {"train_loss": -24.004077911376953, "global_step": 182215, "epoch": 2195} {"train_loss": -23.781435012817383, "global_step": 182216, "epoch": 2195} {"train_loss": -23.976877212524414, "global_step": 182217, "epoch": 2195} {"train_loss": -24.2338924407959, "global_step": 182218, "epoch": 2195} {"train_loss": -23.765775680541992, "global_step": 182219, "epoch": 2195} {"train_loss": -24.1650447845459, "global_step": 182220, "epoch": 2195} {"train_loss": -24.05692481994629, "global_step": 182221, "epoch": 2195} {"train_loss": -24.06893539428711, "global_step": 182222, "epoch": 2195} {"train_loss": -23.779006958007812, "global_step": 182223, "epoch": 2195} {"train_loss": -24.481998443603516, "global_step": 182224, "epoch": 2195} {"train_loss": -23.981298446655273, "global_step": 182225, "epoch": 2195} {"train_loss": -23.763452529907227, "global_step": 182226, "epoch": 2195} {"train_loss": -24.02666664123535, "global_step": 182227, "epoch": 2195} {"train_loss": -23.61319351196289, "global_step": 182228, "epoch": 2195} {"train_loss": -23.69429588317871, "global_step": 182229, "epoch": 2195} {"train_loss": -23.641666412353516, "global_step": 182230, "epoch": 2195} {"train_loss": -24.363174438476562, "global_step": 182231, "epoch": 2195} {"train_loss": -23.972822189331055, "global_step": 182232, "epoch": 2195} {"train_loss": -23.54231071472168, "global_step": 182233, "epoch": 2195} {"train_loss": -23.853191375732422, "global_step": 182234, "epoch": 2195} {"train_loss": -24.062530517578125, "global_step": 182235, "epoch": 2195} {"train_loss": -24.221786499023438, "global_step": 182236, "epoch": 2195} {"train_loss": -24.279897689819336, "global_step": 182237, "epoch": 2195} {"train_loss": -23.890920639038086, "global_step": 182238, "epoch": 2195} {"train_loss": -23.792314529418945, "global_step": 182239, "epoch": 2195} {"train_loss": -24.094730377197266, "global_step": 182240, "epoch": 2195} {"train_loss": -24.20770263671875, "global_step": 182241, "epoch": 2195} {"train_loss": -23.787647247314453, "global_step": 182242, "epoch": 2195} {"train_loss": -24.454315185546875, "global_step": 182243, "epoch": 2195} {"train_loss": -24.010282516479492, "global_step": 182244, "epoch": 2195} {"train_loss": -23.61075782775879, "global_step": 182245, "epoch": 2195} {"train_loss": -24.14014434814453, "global_step": 182246, "epoch": 2195} {"train_loss": -24.30582618713379, "global_step": 182247, "epoch": 2195} {"train_loss": -23.988061904907227, "global_step": 182248, "epoch": 2195} {"train_loss": -24.169086456298828, "global_step": 182249, "epoch": 2195} {"train_loss": -24.145883560180664, "global_step": 182250, "epoch": 2195} {"train_loss": -24.23891258239746, "global_step": 182251, "epoch": 2195} {"train_loss": -24.03384780883789, "global_step": 182252, "epoch": 2195} {"train_loss": -23.792081832885742, "global_step": 182253, "epoch": 2195} {"train_loss": -23.801315307617188, "global_step": 182254, "epoch": 2195} {"train_loss": -23.845808029174805, "global_step": 182255, "epoch": 2195} {"train_loss": -24.034957885742188, "global_step": 182256, "epoch": 2195} {"train_loss": -24.182018280029297, "global_step": 182257, "epoch": 2195} {"train_loss": -23.96974754333496, "global_step": 182258, "epoch": 2195} {"train_loss": -24.267105102539062, "global_step": 182259, "epoch": 2195} {"train_loss": -24.292081832885742, "global_step": 182260, "epoch": 2195} {"train_loss": -24.005361557006836, "global_step": 182261, "epoch": 2195} {"train_loss": -24.014938354492188, "global_step": 182262, "epoch": 2195} {"train_loss": -24.147504806518555, "global_step": 182263, "epoch": 2195} {"train_loss": -23.86927032470703, "global_step": 182264, "epoch": 2195} {"train_loss": -24.09903335571289, "global_step": 182265, "epoch": 2195} {"train_loss": -24.29090690612793, "global_step": 182266, "epoch": 2195} {"train_loss": -23.899958300303265, "global_step": 182267, "epoch": 2195, "val_loss": 6476546.0} {"train_loss": -23.646493911743164, "global_step": 182268, "epoch": 2196} {"train_loss": -23.56776237487793, "global_step": 182269, "epoch": 2196} {"train_loss": -23.777496337890625, "global_step": 182270, "epoch": 2196} {"train_loss": -23.27945899963379, "global_step": 182271, "epoch": 2196} {"train_loss": -23.62031364440918, "global_step": 182272, "epoch": 2196} {"train_loss": -23.80792236328125, "global_step": 182273, "epoch": 2196} {"train_loss": -23.755672454833984, "global_step": 182274, "epoch": 2196} {"train_loss": -23.4826717376709, "global_step": 182275, "epoch": 2196} {"train_loss": -23.641027450561523, "global_step": 182276, "epoch": 2196} {"train_loss": -24.078824996948242, "global_step": 182277, "epoch": 2196} {"train_loss": -23.50193977355957, "global_step": 182278, "epoch": 2196} {"train_loss": -23.617908477783203, "global_step": 182279, "epoch": 2196} {"train_loss": -23.895490646362305, "global_step": 182280, "epoch": 2196} {"train_loss": -24.094541549682617, "global_step": 182281, "epoch": 2196} {"train_loss": -23.906801223754883, "global_step": 182282, "epoch": 2196} {"train_loss": -23.714927673339844, "global_step": 182283, "epoch": 2196} {"train_loss": -23.953306198120117, "global_step": 182284, "epoch": 2196} {"train_loss": -24.202077865600586, "global_step": 182285, "epoch": 2196} {"train_loss": -23.933650970458984, "global_step": 182286, "epoch": 2196} {"train_loss": -23.842082977294922, "global_step": 182287, "epoch": 2196} {"train_loss": -23.749425888061523, "global_step": 182288, "epoch": 2196} {"train_loss": -23.956872940063477, "global_step": 182289, "epoch": 2196} {"train_loss": -23.844924926757812, "global_step": 182290, "epoch": 2196} {"train_loss": -24.119609832763672, "global_step": 182291, "epoch": 2196} {"train_loss": -23.840408325195312, "global_step": 182292, "epoch": 2196} {"train_loss": -23.998647689819336, "global_step": 182293, "epoch": 2196} {"train_loss": -24.170690536499023, "global_step": 182294, "epoch": 2196} {"train_loss": -23.876571655273438, "global_step": 182295, "epoch": 2196} {"train_loss": -23.461389541625977, "global_step": 182296, "epoch": 2196} {"train_loss": -23.672876358032227, "global_step": 182297, "epoch": 2196} {"train_loss": -23.712644577026367, "global_step": 182298, "epoch": 2196} {"train_loss": -23.628664016723633, "global_step": 182299, "epoch": 2196} {"train_loss": -23.833484649658203, "global_step": 182300, "epoch": 2196} {"train_loss": -23.577146530151367, "global_step": 182301, "epoch": 2196} {"train_loss": -23.8691463470459, "global_step": 182302, "epoch": 2196} {"train_loss": -24.232831954956055, "global_step": 182303, "epoch": 2196} {"train_loss": -24.099218368530273, "global_step": 182304, "epoch": 2196} {"train_loss": -23.748802185058594, "global_step": 182305, "epoch": 2196} {"train_loss": -23.94624900817871, "global_step": 182306, "epoch": 2196} {"train_loss": -23.991092681884766, "global_step": 182307, "epoch": 2196} {"train_loss": -23.9435977935791, "global_step": 182308, "epoch": 2196} {"train_loss": -23.9537353515625, "global_step": 182309, "epoch": 2196} {"train_loss": -24.149682998657227, "global_step": 182310, "epoch": 2196} {"train_loss": -24.07282257080078, "global_step": 182311, "epoch": 2196} {"train_loss": -23.575708389282227, "global_step": 182312, "epoch": 2196} {"train_loss": -23.556106567382812, "global_step": 182313, "epoch": 2196} {"train_loss": -24.094362258911133, "global_step": 182314, "epoch": 2196} {"train_loss": -23.79319953918457, "global_step": 182315, "epoch": 2196} {"train_loss": -23.878137588500977, "global_step": 182316, "epoch": 2196} {"train_loss": -23.587799072265625, "global_step": 182317, "epoch": 2196} {"train_loss": -24.002010345458984, "global_step": 182318, "epoch": 2196} {"train_loss": -23.967031478881836, "global_step": 182319, "epoch": 2196} {"train_loss": -23.905052185058594, "global_step": 182320, "epoch": 2196} {"train_loss": -23.697341918945312, "global_step": 182321, "epoch": 2196} {"train_loss": -23.461023330688477, "global_step": 182322, "epoch": 2196} {"train_loss": -23.9216365814209, "global_step": 182323, "epoch": 2196} {"train_loss": -23.97560691833496, "global_step": 182324, "epoch": 2196} {"train_loss": -23.827449798583984, "global_step": 182325, "epoch": 2196} {"train_loss": -23.962806701660156, "global_step": 182326, "epoch": 2196} {"train_loss": -23.749631881713867, "global_step": 182327, "epoch": 2196} {"train_loss": -24.21234130859375, "global_step": 182328, "epoch": 2196} {"train_loss": -24.219364166259766, "global_step": 182329, "epoch": 2196} {"train_loss": -24.17877769470215, "global_step": 182330, "epoch": 2196} {"train_loss": -23.70372200012207, "global_step": 182331, "epoch": 2196} {"train_loss": -23.979265213012695, "global_step": 182332, "epoch": 2196} {"train_loss": -24.180620193481445, "global_step": 182333, "epoch": 2196} {"train_loss": -24.393064498901367, "global_step": 182334, "epoch": 2196} {"train_loss": -23.781734466552734, "global_step": 182335, "epoch": 2196} {"train_loss": -23.926530838012695, "global_step": 182336, "epoch": 2196} {"train_loss": -24.068864822387695, "global_step": 182337, "epoch": 2196} {"train_loss": -23.85274314880371, "global_step": 182338, "epoch": 2196} {"train_loss": -23.940296173095703, "global_step": 182339, "epoch": 2196} {"train_loss": -24.073463439941406, "global_step": 182340, "epoch": 2196} {"train_loss": -23.67980194091797, "global_step": 182341, "epoch": 2196} {"train_loss": -24.12386131286621, "global_step": 182342, "epoch": 2196} {"train_loss": -24.39005470275879, "global_step": 182343, "epoch": 2196} {"train_loss": -24.29447364807129, "global_step": 182344, "epoch": 2196} {"train_loss": -23.972436904907227, "global_step": 182345, "epoch": 2196} {"train_loss": -24.32337188720703, "global_step": 182346, "epoch": 2196} {"train_loss": -23.931615829467773, "global_step": 182347, "epoch": 2196} {"train_loss": -23.843515396118164, "global_step": 182348, "epoch": 2196} {"train_loss": -24.22429847717285, "global_step": 182349, "epoch": 2196} {"train_loss": -23.900562309357056, "global_step": 182350, "epoch": 2196, "val_loss": 6521618.0} {"train_loss": -22.98091697692871, "global_step": 182351, "epoch": 2197} {"train_loss": -23.53179168701172, "global_step": 182352, "epoch": 2197} {"train_loss": -22.97930335998535, "global_step": 182353, "epoch": 2197} {"train_loss": -23.078433990478516, "global_step": 182354, "epoch": 2197} {"train_loss": -23.54581069946289, "global_step": 182355, "epoch": 2197} {"train_loss": -23.570539474487305, "global_step": 182356, "epoch": 2197} {"train_loss": -23.110595703125, "global_step": 182357, "epoch": 2197} {"train_loss": -23.298276901245117, "global_step": 182358, "epoch": 2197} {"train_loss": -23.23506736755371, "global_step": 182359, "epoch": 2197} {"train_loss": -23.714658737182617, "global_step": 182360, "epoch": 2197} {"train_loss": -23.792165756225586, "global_step": 182361, "epoch": 2197} {"train_loss": -23.332015991210938, "global_step": 182362, "epoch": 2197} {"train_loss": -23.64900016784668, "global_step": 182363, "epoch": 2197} {"train_loss": -23.78525733947754, "global_step": 182364, "epoch": 2197} {"train_loss": -23.48693084716797, "global_step": 182365, "epoch": 2197} {"train_loss": -23.433401107788086, "global_step": 182366, "epoch": 2197} {"train_loss": -23.657001495361328, "global_step": 182367, "epoch": 2197} {"train_loss": -23.118337631225586, "global_step": 182368, "epoch": 2197} {"train_loss": -23.28824806213379, "global_step": 182369, "epoch": 2197} {"train_loss": -23.9400577545166, "global_step": 182370, "epoch": 2197} {"train_loss": -23.853572845458984, "global_step": 182371, "epoch": 2197} {"train_loss": -23.711238861083984, "global_step": 182372, "epoch": 2197} {"train_loss": -23.76710319519043, "global_step": 182373, "epoch": 2197} {"train_loss": -23.705615997314453, "global_step": 182374, "epoch": 2197} {"train_loss": -23.87102508544922, "global_step": 182375, "epoch": 2197} {"train_loss": -23.628376007080078, "global_step": 182376, "epoch": 2197} {"train_loss": -23.599023818969727, "global_step": 182377, "epoch": 2197} {"train_loss": -23.543643951416016, "global_step": 182378, "epoch": 2197} {"train_loss": -23.719213485717773, "global_step": 182379, "epoch": 2197} {"train_loss": -23.799104690551758, "global_step": 182380, "epoch": 2197} {"train_loss": -24.258440017700195, "global_step": 182381, "epoch": 2197} {"train_loss": -23.806949615478516, "global_step": 182382, "epoch": 2197} {"train_loss": -23.777379989624023, "global_step": 182383, "epoch": 2197} {"train_loss": -23.844467163085938, "global_step": 182384, "epoch": 2197} {"train_loss": -23.799869537353516, "global_step": 182385, "epoch": 2197} {"train_loss": -23.91219139099121, "global_step": 182386, "epoch": 2197} {"train_loss": -23.876819610595703, "global_step": 182387, "epoch": 2197} {"train_loss": -23.7584171295166, "global_step": 182388, "epoch": 2197} {"train_loss": -24.04227638244629, "global_step": 182389, "epoch": 2197} {"train_loss": -24.043094635009766, "global_step": 182390, "epoch": 2197} {"train_loss": -24.24167823791504, "global_step": 182391, "epoch": 2197} {"train_loss": -23.665563583374023, "global_step": 182392, "epoch": 2197} {"train_loss": -24.08931541442871, "global_step": 182393, "epoch": 2197} {"train_loss": -23.435606002807617, "global_step": 182394, "epoch": 2197} {"train_loss": -23.78102684020996, "global_step": 182395, "epoch": 2197} {"train_loss": -23.9888858795166, "global_step": 182396, "epoch": 2197} {"train_loss": -24.200641632080078, "global_step": 182397, "epoch": 2197} {"train_loss": -24.183086395263672, "global_step": 182398, "epoch": 2197} {"train_loss": -23.965606689453125, "global_step": 182399, "epoch": 2197} {"train_loss": -23.47952651977539, "global_step": 182400, "epoch": 2197} {"train_loss": -24.043638229370117, "global_step": 182401, "epoch": 2197} {"train_loss": -23.9583797454834, "global_step": 182402, "epoch": 2197} {"train_loss": -24.15500259399414, "global_step": 182403, "epoch": 2197} {"train_loss": -23.968786239624023, "global_step": 182404, "epoch": 2197} {"train_loss": -23.94883918762207, "global_step": 182405, "epoch": 2197} {"train_loss": -23.95204734802246, "global_step": 182406, "epoch": 2197} {"train_loss": -23.6680908203125, "global_step": 182407, "epoch": 2197} {"train_loss": -23.583295822143555, "global_step": 182408, "epoch": 2197} {"train_loss": -24.008859634399414, "global_step": 182409, "epoch": 2197} {"train_loss": -24.060211181640625, "global_step": 182410, "epoch": 2197} {"train_loss": -23.79813575744629, "global_step": 182411, "epoch": 2197} {"train_loss": -24.006540298461914, "global_step": 182412, "epoch": 2197} {"train_loss": -23.707563400268555, "global_step": 182413, "epoch": 2197} {"train_loss": -24.122509002685547, "global_step": 182414, "epoch": 2197} {"train_loss": -24.283309936523438, "global_step": 182415, "epoch": 2197} {"train_loss": -23.98026466369629, "global_step": 182416, "epoch": 2197} {"train_loss": -23.654098510742188, "global_step": 182417, "epoch": 2197} {"train_loss": -24.16538429260254, "global_step": 182418, "epoch": 2197} {"train_loss": -24.360837936401367, "global_step": 182419, "epoch": 2197} {"train_loss": -24.530075073242188, "global_step": 182420, "epoch": 2197} {"train_loss": -23.990880966186523, "global_step": 182421, "epoch": 2197} {"train_loss": -24.34318733215332, "global_step": 182422, "epoch": 2197} {"train_loss": -24.23317527770996, "global_step": 182423, "epoch": 2197} {"train_loss": -24.043790817260742, "global_step": 182424, "epoch": 2197} {"train_loss": -24.065683364868164, "global_step": 182425, "epoch": 2197} {"train_loss": -24.10845947265625, "global_step": 182426, "epoch": 2197} {"train_loss": -24.3363094329834, "global_step": 182427, "epoch": 2197} {"train_loss": -23.741865158081055, "global_step": 182428, "epoch": 2197} {"train_loss": -24.01943016052246, "global_step": 182429, "epoch": 2197} {"train_loss": -24.27545738220215, "global_step": 182430, "epoch": 2197} {"train_loss": -23.835956573486328, "global_step": 182431, "epoch": 2197} {"train_loss": -23.986570358276367, "global_step": 182432, "epoch": 2197} {"train_loss": -23.833305795508696, "global_step": 182433, "epoch": 2197, "val_loss": 6419477.0} {"train_loss": -23.645153045654297, "global_step": 182434, "epoch": 2198} {"train_loss": -23.932998657226562, "global_step": 182435, "epoch": 2198} {"train_loss": -23.419631958007812, "global_step": 182436, "epoch": 2198} {"train_loss": -23.733118057250977, "global_step": 182437, "epoch": 2198} {"train_loss": -23.28883934020996, "global_step": 182438, "epoch": 2198} {"train_loss": -23.92022705078125, "global_step": 182439, "epoch": 2198} {"train_loss": -23.993871688842773, "global_step": 182440, "epoch": 2198} {"train_loss": -24.098695755004883, "global_step": 182441, "epoch": 2198} {"train_loss": -23.787578582763672, "global_step": 182442, "epoch": 2198} {"train_loss": -23.43600845336914, "global_step": 182443, "epoch": 2198} {"train_loss": -23.80621337890625, "global_step": 182444, "epoch": 2198} {"train_loss": -24.063566207885742, "global_step": 182445, "epoch": 2198} {"train_loss": -23.70110511779785, "global_step": 182446, "epoch": 2198} {"train_loss": -23.737531661987305, "global_step": 182447, "epoch": 2198} {"train_loss": -24.226543426513672, "global_step": 182448, "epoch": 2198} {"train_loss": -23.9647159576416, "global_step": 182449, "epoch": 2198} {"train_loss": -23.647907257080078, "global_step": 182450, "epoch": 2198} {"train_loss": -24.187915802001953, "global_step": 182451, "epoch": 2198} {"train_loss": -23.970651626586914, "global_step": 182452, "epoch": 2198} {"train_loss": -24.06460952758789, "global_step": 182453, "epoch": 2198} {"train_loss": -23.831878662109375, "global_step": 182454, "epoch": 2198} {"train_loss": -23.925352096557617, "global_step": 182455, "epoch": 2198} {"train_loss": -23.729541778564453, "global_step": 182456, "epoch": 2198} {"train_loss": -24.124616622924805, "global_step": 182457, "epoch": 2198} {"train_loss": -23.869176864624023, "global_step": 182458, "epoch": 2198} {"train_loss": -23.98763656616211, "global_step": 182459, "epoch": 2198} {"train_loss": -23.870576858520508, "global_step": 182460, "epoch": 2198} {"train_loss": -23.90546226501465, "global_step": 182461, "epoch": 2198} {"train_loss": -23.883520126342773, "global_step": 182462, "epoch": 2198} {"train_loss": -23.7169189453125, "global_step": 182463, "epoch": 2198} {"train_loss": -24.231353759765625, "global_step": 182464, "epoch": 2198} {"train_loss": -24.072546005249023, "global_step": 182465, "epoch": 2198} {"train_loss": -24.19448471069336, "global_step": 182466, "epoch": 2198} {"train_loss": -23.76300048828125, "global_step": 182467, "epoch": 2198} {"train_loss": -23.97931480407715, "global_step": 182468, "epoch": 2198} {"train_loss": -24.15633201599121, "global_step": 182469, "epoch": 2198} {"train_loss": -24.15083885192871, "global_step": 182470, "epoch": 2198} {"train_loss": -23.585180282592773, "global_step": 182471, "epoch": 2198} {"train_loss": -23.83185577392578, "global_step": 182472, "epoch": 2198} {"train_loss": -23.9917049407959, "global_step": 182473, "epoch": 2198} {"train_loss": -24.369659423828125, "global_step": 182474, "epoch": 2198} {"train_loss": -24.122407913208008, "global_step": 182475, "epoch": 2198} {"train_loss": -24.200199127197266, "global_step": 182476, "epoch": 2198} {"train_loss": -23.525409698486328, "global_step": 182477, "epoch": 2198} {"train_loss": -23.57773780822754, "global_step": 182478, "epoch": 2198} {"train_loss": -23.8151798248291, "global_step": 182479, "epoch": 2198} {"train_loss": -23.88722038269043, "global_step": 182480, "epoch": 2198} {"train_loss": -23.819082260131836, "global_step": 182481, "epoch": 2198} {"train_loss": -23.981170654296875, "global_step": 182482, "epoch": 2198} {"train_loss": -23.907730102539062, "global_step": 182483, "epoch": 2198} {"train_loss": -23.8510799407959, "global_step": 182484, "epoch": 2198} {"train_loss": -24.284650802612305, "global_step": 182485, "epoch": 2198} {"train_loss": -24.07016944885254, "global_step": 182486, "epoch": 2198} {"train_loss": -24.111751556396484, "global_step": 182487, "epoch": 2198} {"train_loss": -23.786563873291016, "global_step": 182488, "epoch": 2198} {"train_loss": -24.24164390563965, "global_step": 182489, "epoch": 2198} {"train_loss": -23.83172607421875, "global_step": 182490, "epoch": 2198} {"train_loss": -23.959524154663086, "global_step": 182491, "epoch": 2198} {"train_loss": -24.34762954711914, "global_step": 182492, "epoch": 2198} {"train_loss": -24.368349075317383, "global_step": 182493, "epoch": 2198} {"train_loss": -23.90557289123535, "global_step": 182494, "epoch": 2198} {"train_loss": -23.858224868774414, "global_step": 182495, "epoch": 2198} {"train_loss": -23.98534393310547, "global_step": 182496, "epoch": 2198} {"train_loss": -23.96746826171875, "global_step": 182497, "epoch": 2198} {"train_loss": -24.209558486938477, "global_step": 182498, "epoch": 2198} {"train_loss": -23.742422103881836, "global_step": 182499, "epoch": 2198} {"train_loss": -23.64644432067871, "global_step": 182500, "epoch": 2198} {"train_loss": -24.020200729370117, "global_step": 182501, "epoch": 2198} {"train_loss": -23.783842086791992, "global_step": 182502, "epoch": 2198} {"train_loss": -24.007169723510742, "global_step": 182503, "epoch": 2198} {"train_loss": -24.21125030517578, "global_step": 182504, "epoch": 2198} {"train_loss": -23.863346099853516, "global_step": 182505, "epoch": 2198} {"train_loss": -24.025222778320312, "global_step": 182506, "epoch": 2198} {"train_loss": -23.89222526550293, "global_step": 182507, "epoch": 2198} {"train_loss": -23.629941940307617, "global_step": 182508, "epoch": 2198} {"train_loss": -24.045682907104492, "global_step": 182509, "epoch": 2198} {"train_loss": -23.86176109313965, "global_step": 182510, "epoch": 2198} {"train_loss": -23.985204696655273, "global_step": 182511, "epoch": 2198} {"train_loss": -23.535619735717773, "global_step": 182512, "epoch": 2198} {"train_loss": -24.044010162353516, "global_step": 182513, "epoch": 2198} {"train_loss": -23.576200485229492, "global_step": 182514, "epoch": 2198} {"train_loss": -24.588579177856445, "global_step": 182515, "epoch": 2198} {"train_loss": -23.945643712239093, "global_step": 182516, "epoch": 2198, "val_loss": 6566822.0} {"train_loss": -22.842458724975586, "global_step": 182517, "epoch": 2199} {"train_loss": -22.594650268554688, "global_step": 182518, "epoch": 2199} {"train_loss": -23.538433074951172, "global_step": 182519, "epoch": 2199} {"train_loss": -23.13262176513672, "global_step": 182520, "epoch": 2199} {"train_loss": -23.83625602722168, "global_step": 182521, "epoch": 2199} {"train_loss": -23.138402938842773, "global_step": 182522, "epoch": 2199} {"train_loss": -23.24678611755371, "global_step": 182523, "epoch": 2199} {"train_loss": -23.37725257873535, "global_step": 182524, "epoch": 2199} {"train_loss": -23.549123764038086, "global_step": 182525, "epoch": 2199} {"train_loss": -23.08223533630371, "global_step": 182526, "epoch": 2199} {"train_loss": -22.970205307006836, "global_step": 182527, "epoch": 2199} {"train_loss": -23.390960693359375, "global_step": 182528, "epoch": 2199} {"train_loss": -23.43120002746582, "global_step": 182529, "epoch": 2199} {"train_loss": -23.63982582092285, "global_step": 182530, "epoch": 2199} {"train_loss": -23.3870906829834, "global_step": 182531, "epoch": 2199} {"train_loss": -23.50653648376465, "global_step": 182532, "epoch": 2199} {"train_loss": -23.165433883666992, "global_step": 182533, "epoch": 2199} {"train_loss": -23.344623565673828, "global_step": 182534, "epoch": 2199} {"train_loss": -23.753538131713867, "global_step": 182535, "epoch": 2199} {"train_loss": -23.764068603515625, "global_step": 182536, "epoch": 2199} {"train_loss": -23.2806339263916, "global_step": 182537, "epoch": 2199} {"train_loss": -23.946605682373047, "global_step": 182538, "epoch": 2199} {"train_loss": -23.66798210144043, "global_step": 182539, "epoch": 2199} {"train_loss": -23.723596572875977, "global_step": 182540, "epoch": 2199} {"train_loss": -23.850971221923828, "global_step": 182541, "epoch": 2199} {"train_loss": -23.937572479248047, "global_step": 182542, "epoch": 2199} {"train_loss": -23.676267623901367, "global_step": 182543, "epoch": 2199} {"train_loss": -24.077468872070312, "global_step": 182544, "epoch": 2199} {"train_loss": -23.815786361694336, "global_step": 182545, "epoch": 2199} {"train_loss": -24.09806251525879, "global_step": 182546, "epoch": 2199} {"train_loss": -23.843847274780273, "global_step": 182547, "epoch": 2199} {"train_loss": -23.620655059814453, "global_step": 182548, "epoch": 2199} {"train_loss": -23.568655014038086, "global_step": 182549, "epoch": 2199} {"train_loss": -24.296422958374023, "global_step": 182550, "epoch": 2199} {"train_loss": -23.765052795410156, "global_step": 182551, "epoch": 2199} {"train_loss": -24.133737564086914, "global_step": 182552, "epoch": 2199} {"train_loss": -23.721969604492188, "global_step": 182553, "epoch": 2199} {"train_loss": -23.930418014526367, "global_step": 182554, "epoch": 2199} {"train_loss": -23.95697021484375, "global_step": 182555, "epoch": 2199} {"train_loss": -24.244266510009766, "global_step": 182556, "epoch": 2199} {"train_loss": -24.02988624572754, "global_step": 182557, "epoch": 2199} {"train_loss": -23.959714889526367, "global_step": 182558, "epoch": 2199} {"train_loss": -23.91303062438965, "global_step": 182559, "epoch": 2199} {"train_loss": -23.710678100585938, "global_step": 182560, "epoch": 2199} {"train_loss": -23.713796615600586, "global_step": 182561, "epoch": 2199} {"train_loss": -24.086162567138672, "global_step": 182562, "epoch": 2199} {"train_loss": -24.028705596923828, "global_step": 182563, "epoch": 2199} {"train_loss": -24.079730987548828, "global_step": 182564, "epoch": 2199} {"train_loss": -24.50204849243164, "global_step": 182565, "epoch": 2199} {"train_loss": -23.84381103515625, "global_step": 182566, "epoch": 2199} {"train_loss": -23.73567008972168, "global_step": 182567, "epoch": 2199} {"train_loss": -24.15631675720215, "global_step": 182568, "epoch": 2199} {"train_loss": -23.450178146362305, "global_step": 182569, "epoch": 2199} {"train_loss": -23.651697158813477, "global_step": 182570, "epoch": 2199} {"train_loss": -24.1838436126709, "global_step": 182571, "epoch": 2199} {"train_loss": -23.958377838134766, "global_step": 182572, "epoch": 2199} {"train_loss": -23.6906681060791, "global_step": 182573, "epoch": 2199} {"train_loss": -23.644638061523438, "global_step": 182574, "epoch": 2199} {"train_loss": -24.078596115112305, "global_step": 182575, "epoch": 2199} {"train_loss": -23.827306747436523, "global_step": 182576, "epoch": 2199} {"train_loss": -23.809661865234375, "global_step": 182577, "epoch": 2199} {"train_loss": -23.57413673400879, "global_step": 182578, "epoch": 2199} {"train_loss": -23.83760643005371, "global_step": 182579, "epoch": 2199} {"train_loss": -23.8070125579834, "global_step": 182580, "epoch": 2199} {"train_loss": -23.357070922851562, "global_step": 182581, "epoch": 2199} {"train_loss": -24.335006713867188, "global_step": 182582, "epoch": 2199} {"train_loss": -24.040185928344727, "global_step": 182583, "epoch": 2199} {"train_loss": -23.76667594909668, "global_step": 182584, "epoch": 2199} {"train_loss": -23.992725372314453, "global_step": 182585, "epoch": 2199} {"train_loss": -24.07162094116211, "global_step": 182586, "epoch": 2199} {"train_loss": -23.23980140686035, "global_step": 182587, "epoch": 2199} {"train_loss": -24.2451229095459, "global_step": 182588, "epoch": 2199} {"train_loss": -23.774045944213867, "global_step": 182589, "epoch": 2199} {"train_loss": -23.800153732299805, "global_step": 182590, "epoch": 2199} {"train_loss": -23.99502182006836, "global_step": 182591, "epoch": 2199} {"train_loss": -23.845300674438477, "global_step": 182592, "epoch": 2199} {"train_loss": -23.79683494567871, "global_step": 182593, "epoch": 2199} {"train_loss": -24.288122177124023, "global_step": 182594, "epoch": 2199} {"train_loss": -23.886629104614258, "global_step": 182595, "epoch": 2199} {"train_loss": -23.987546920776367, "global_step": 182596, "epoch": 2199} {"train_loss": -23.875858306884766, "global_step": 182597, "epoch": 2199} {"train_loss": -23.735692977905273, "global_step": 182598, "epoch": 2199} {"train_loss": -23.74774211286062, "global_step": 182599, "epoch": 2199, "val_loss": 6483802.0} {"train_loss": -23.13933753967285, "global_step": 182600, "epoch": 2200} {"train_loss": -23.646530151367188, "global_step": 182601, "epoch": 2200} {"train_loss": -23.55726432800293, "global_step": 182602, "epoch": 2200} {"train_loss": -23.468381881713867, "global_step": 182603, "epoch": 2200} {"train_loss": -23.364822387695312, "global_step": 182604, "epoch": 2200} {"train_loss": -23.350677490234375, "global_step": 182605, "epoch": 2200} {"train_loss": -23.438474655151367, "global_step": 182606, "epoch": 2200} {"train_loss": -23.7142391204834, "global_step": 182607, "epoch": 2200} {"train_loss": -23.77801513671875, "global_step": 182608, "epoch": 2200} {"train_loss": -23.54300880432129, "global_step": 182609, "epoch": 2200} {"train_loss": -23.600444793701172, "global_step": 182610, "epoch": 2200} {"train_loss": -23.533342361450195, "global_step": 182611, "epoch": 2200} {"train_loss": -23.421875, "global_step": 182612, "epoch": 2200} {"train_loss": -23.559680938720703, "global_step": 182613, "epoch": 2200} {"train_loss": -23.5457763671875, "global_step": 182614, "epoch": 2200} {"train_loss": -23.79412841796875, "global_step": 182615, "epoch": 2200} {"train_loss": -23.64605140686035, "global_step": 182616, "epoch": 2200} {"train_loss": -23.85713768005371, "global_step": 182617, "epoch": 2200} {"train_loss": -23.582677841186523, "global_step": 182618, "epoch": 2200} {"train_loss": -23.409347534179688, "global_step": 182619, "epoch": 2200} {"train_loss": -23.38602638244629, "global_step": 182620, "epoch": 2200} {"train_loss": -23.36799430847168, "global_step": 182621, "epoch": 2200} {"train_loss": -23.85178565979004, "global_step": 182622, "epoch": 2200} {"train_loss": -23.840879440307617, "global_step": 182623, "epoch": 2200} {"train_loss": -23.956045150756836, "global_step": 182624, "epoch": 2200} {"train_loss": -23.593271255493164, "global_step": 182625, "epoch": 2200} {"train_loss": -24.02247428894043, "global_step": 182626, "epoch": 2200} {"train_loss": -23.466205596923828, "global_step": 182627, "epoch": 2200} {"train_loss": -24.06636619567871, "global_step": 182628, "epoch": 2200} {"train_loss": -23.893136978149414, "global_step": 182629, "epoch": 2200} {"train_loss": -24.021942138671875, "global_step": 182630, "epoch": 2200} {"train_loss": -24.106813430786133, "global_step": 182631, "epoch": 2200} {"train_loss": -23.83322525024414, "global_step": 182632, "epoch": 2200} {"train_loss": -23.921009063720703, "global_step": 182633, "epoch": 2200} {"train_loss": -23.786773681640625, "global_step": 182634, "epoch": 2200} {"train_loss": -24.034229278564453, "global_step": 182635, "epoch": 2200} {"train_loss": -24.028379440307617, "global_step": 182636, "epoch": 2200} {"train_loss": -23.871566772460938, "global_step": 182637, "epoch": 2200} {"train_loss": -24.528860092163086, "global_step": 182638, "epoch": 2200} {"train_loss": -24.004281997680664, "global_step": 182639, "epoch": 2200} {"train_loss": -23.750225067138672, "global_step": 182640, "epoch": 2200} {"train_loss": -24.01092529296875, "global_step": 182641, "epoch": 2200} {"train_loss": -24.201047897338867, "global_step": 182642, "epoch": 2200} {"train_loss": -24.07386016845703, "global_step": 182643, "epoch": 2200} {"train_loss": -23.938302993774414, "global_step": 182644, "epoch": 2200} {"train_loss": -24.322635650634766, "global_step": 182645, "epoch": 2200} {"train_loss": -24.25389862060547, "global_step": 182646, "epoch": 2200} {"train_loss": -24.207056045532227, "global_step": 182647, "epoch": 2200} {"train_loss": -24.5029239654541, "global_step": 182648, "epoch": 2200} {"train_loss": -24.08785629272461, "global_step": 182649, "epoch": 2200} {"train_loss": -24.317035675048828, "global_step": 182650, "epoch": 2200} {"train_loss": -23.885196685791016, "global_step": 182651, "epoch": 2200} {"train_loss": -24.1577205657959, "global_step": 182652, "epoch": 2200} {"train_loss": -24.195783615112305, "global_step": 182653, "epoch": 2200} {"train_loss": -23.62710952758789, "global_step": 182654, "epoch": 2200} {"train_loss": -24.06943130493164, "global_step": 182655, "epoch": 2200} {"train_loss": -23.576662063598633, "global_step": 182656, "epoch": 2200} {"train_loss": -23.838743209838867, "global_step": 182657, "epoch": 2200} {"train_loss": -23.77077293395996, "global_step": 182658, "epoch": 2200} {"train_loss": -23.779155731201172, "global_step": 182659, "epoch": 2200} {"train_loss": -23.908405303955078, "global_step": 182660, "epoch": 2200} {"train_loss": -24.035614013671875, "global_step": 182661, "epoch": 2200} {"train_loss": -23.95094108581543, "global_step": 182662, "epoch": 2200} {"train_loss": -23.839181900024414, "global_step": 182663, "epoch": 2200} {"train_loss": -23.76580810546875, "global_step": 182664, "epoch": 2200} {"train_loss": -24.2550048828125, "global_step": 182665, "epoch": 2200} {"train_loss": -24.031946182250977, "global_step": 182666, "epoch": 2200} {"train_loss": -23.721921920776367, "global_step": 182667, "epoch": 2200} {"train_loss": -24.10475730895996, "global_step": 182668, "epoch": 2200} {"train_loss": -24.152524948120117, "global_step": 182669, "epoch": 2200} {"train_loss": -24.161401748657227, "global_step": 182670, "epoch": 2200} {"train_loss": -23.736282348632812, "global_step": 182671, "epoch": 2200} {"train_loss": -23.817279815673828, "global_step": 182672, "epoch": 2200} {"train_loss": -23.80791664123535, "global_step": 182673, "epoch": 2200} {"train_loss": -23.905948638916016, "global_step": 182674, "epoch": 2200} {"train_loss": -24.070383071899414, "global_step": 182675, "epoch": 2200} {"train_loss": -24.033761978149414, "global_step": 182676, "epoch": 2200} {"train_loss": -24.01460075378418, "global_step": 182677, "epoch": 2200} {"train_loss": -23.969003677368164, "global_step": 182678, "epoch": 2200} {"train_loss": -23.748579025268555, "global_step": 182679, "epoch": 2200} {"train_loss": -24.1634464263916, "global_step": 182680, "epoch": 2200} {"train_loss": -24.106586456298828, "global_step": 182681, "epoch": 2200} {"train_loss": -23.846656730376093, "global_step": 182682, "epoch": 2200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6429745.0} {"train_loss": -23.692564010620117, "global_step": 182683, "epoch": 2201} {"train_loss": -23.784528732299805, "global_step": 182684, "epoch": 2201} {"train_loss": -23.882360458374023, "global_step": 182685, "epoch": 2201} {"train_loss": -23.824066162109375, "global_step": 182686, "epoch": 2201} {"train_loss": -23.9110050201416, "global_step": 182687, "epoch": 2201} {"train_loss": -23.407255172729492, "global_step": 182688, "epoch": 2201} {"train_loss": -24.132150650024414, "global_step": 182689, "epoch": 2201} {"train_loss": -24.073993682861328, "global_step": 182690, "epoch": 2201} {"train_loss": -23.650650024414062, "global_step": 182691, "epoch": 2201} {"train_loss": -23.667011260986328, "global_step": 182692, "epoch": 2201} {"train_loss": -23.92644500732422, "global_step": 182693, "epoch": 2201} {"train_loss": -23.52559471130371, "global_step": 182694, "epoch": 2201} {"train_loss": -23.805831909179688, "global_step": 182695, "epoch": 2201} {"train_loss": -23.75492286682129, "global_step": 182696, "epoch": 2201} {"train_loss": -23.730138778686523, "global_step": 182697, "epoch": 2201} {"train_loss": -24.084184646606445, "global_step": 182698, "epoch": 2201} {"train_loss": -24.231321334838867, "global_step": 182699, "epoch": 2201} {"train_loss": -24.029565811157227, "global_step": 182700, "epoch": 2201} {"train_loss": -23.776758193969727, "global_step": 182701, "epoch": 2201} {"train_loss": -24.29656982421875, "global_step": 182702, "epoch": 2201} {"train_loss": -23.93630027770996, "global_step": 182703, "epoch": 2201} {"train_loss": -23.85634994506836, "global_step": 182704, "epoch": 2201} {"train_loss": -24.111692428588867, "global_step": 182705, "epoch": 2201} {"train_loss": -24.133054733276367, "global_step": 182706, "epoch": 2201} {"train_loss": -24.169849395751953, "global_step": 182707, "epoch": 2201} {"train_loss": -24.713775634765625, "global_step": 182708, "epoch": 2201} {"train_loss": -24.006593704223633, "global_step": 182709, "epoch": 2201} {"train_loss": -23.668798446655273, "global_step": 182710, "epoch": 2201} {"train_loss": -24.004240036010742, "global_step": 182711, "epoch": 2201} {"train_loss": -24.087629318237305, "global_step": 182712, "epoch": 2201} {"train_loss": -24.069040298461914, "global_step": 182713, "epoch": 2201} {"train_loss": -24.03242301940918, "global_step": 182714, "epoch": 2201} {"train_loss": -24.141361236572266, "global_step": 182715, "epoch": 2201} {"train_loss": -24.06769561767578, "global_step": 182716, "epoch": 2201} {"train_loss": -23.98285484313965, "global_step": 182717, "epoch": 2201} {"train_loss": -23.96925926208496, "global_step": 182718, "epoch": 2201} {"train_loss": -24.06905746459961, "global_step": 182719, "epoch": 2201} {"train_loss": -23.736188888549805, "global_step": 182720, "epoch": 2201} {"train_loss": -24.2363224029541, "global_step": 182721, "epoch": 2201} {"train_loss": -24.002248764038086, "global_step": 182722, "epoch": 2201} {"train_loss": -24.086849212646484, "global_step": 182723, "epoch": 2201} {"train_loss": -24.036239624023438, "global_step": 182724, "epoch": 2201} {"train_loss": -23.60298728942871, "global_step": 182725, "epoch": 2201} {"train_loss": -24.041545867919922, "global_step": 182726, "epoch": 2201} {"train_loss": -23.800678253173828, "global_step": 182727, "epoch": 2201} {"train_loss": -23.247753143310547, "global_step": 182728, "epoch": 2201} {"train_loss": -23.863555908203125, "global_step": 182729, "epoch": 2201} {"train_loss": -23.42817497253418, "global_step": 182730, "epoch": 2201} {"train_loss": -23.885400772094727, "global_step": 182731, "epoch": 2201} {"train_loss": -23.575225830078125, "global_step": 182732, "epoch": 2201} {"train_loss": -23.639795303344727, "global_step": 182733, "epoch": 2201} {"train_loss": -23.751049041748047, "global_step": 182734, "epoch": 2201} {"train_loss": -23.79163360595703, "global_step": 182735, "epoch": 2201} {"train_loss": -24.064666748046875, "global_step": 182736, "epoch": 2201} {"train_loss": -24.040014266967773, "global_step": 182737, "epoch": 2201} {"train_loss": -23.491405487060547, "global_step": 182738, "epoch": 2201} {"train_loss": -24.0590763092041, "global_step": 182739, "epoch": 2201} {"train_loss": -23.918888092041016, "global_step": 182740, "epoch": 2201} {"train_loss": -23.68457794189453, "global_step": 182741, "epoch": 2201} {"train_loss": -23.918262481689453, "global_step": 182742, "epoch": 2201} {"train_loss": -23.707151412963867, "global_step": 182743, "epoch": 2201} {"train_loss": -23.937726974487305, "global_step": 182744, "epoch": 2201} {"train_loss": -23.893129348754883, "global_step": 182745, "epoch": 2201} {"train_loss": -23.839136123657227, "global_step": 182746, "epoch": 2201} {"train_loss": -24.176931381225586, "global_step": 182747, "epoch": 2201} {"train_loss": -23.85896873474121, "global_step": 182748, "epoch": 2201} {"train_loss": -23.626203536987305, "global_step": 182749, "epoch": 2201} {"train_loss": -23.7401065826416, "global_step": 182750, "epoch": 2201} {"train_loss": -24.342714309692383, "global_step": 182751, "epoch": 2201} {"train_loss": -24.133237838745117, "global_step": 182752, "epoch": 2201} {"train_loss": -24.122472763061523, "global_step": 182753, "epoch": 2201} {"train_loss": -23.72015380859375, "global_step": 182754, "epoch": 2201} {"train_loss": -24.163375854492188, "global_step": 182755, "epoch": 2201} {"train_loss": -24.04856300354004, "global_step": 182756, "epoch": 2201} {"train_loss": -24.211082458496094, "global_step": 182757, "epoch": 2201} {"train_loss": -23.9819393157959, "global_step": 182758, "epoch": 2201} {"train_loss": -24.10548973083496, "global_step": 182759, "epoch": 2201} {"train_loss": -23.954071044921875, "global_step": 182760, "epoch": 2201} {"train_loss": -23.768529891967773, "global_step": 182761, "epoch": 2201} {"train_loss": -24.513547897338867, "global_step": 182762, "epoch": 2201} {"train_loss": -24.19512367248535, "global_step": 182763, "epoch": 2201} {"train_loss": -23.889118194580078, "global_step": 182764, "epoch": 2201} {"train_loss": -23.933041997702723, "global_step": 182765, "epoch": 2201, "val_loss": 6576962.0} {"train_loss": -22.95600700378418, "global_step": 182766, "epoch": 2202} {"train_loss": -21.64729881286621, "global_step": 182767, "epoch": 2202} {"train_loss": -23.47977638244629, "global_step": 182768, "epoch": 2202} {"train_loss": -23.172611236572266, "global_step": 182769, "epoch": 2202} {"train_loss": -22.82670021057129, "global_step": 182770, "epoch": 2202} {"train_loss": -23.116344451904297, "global_step": 182771, "epoch": 2202} {"train_loss": -23.689546585083008, "global_step": 182772, "epoch": 2202} {"train_loss": -23.407684326171875, "global_step": 182773, "epoch": 2202} {"train_loss": -23.679214477539062, "global_step": 182774, "epoch": 2202} {"train_loss": -23.2257022857666, "global_step": 182775, "epoch": 2202} {"train_loss": -23.839946746826172, "global_step": 182776, "epoch": 2202} {"train_loss": -23.281896591186523, "global_step": 182777, "epoch": 2202} {"train_loss": -23.535968780517578, "global_step": 182778, "epoch": 2202} {"train_loss": -23.736221313476562, "global_step": 182779, "epoch": 2202} {"train_loss": -23.835599899291992, "global_step": 182780, "epoch": 2202} {"train_loss": -23.632986068725586, "global_step": 182781, "epoch": 2202} {"train_loss": -23.68368911743164, "global_step": 182782, "epoch": 2202} {"train_loss": -23.944007873535156, "global_step": 182783, "epoch": 2202} {"train_loss": -23.8418025970459, "global_step": 182784, "epoch": 2202} {"train_loss": -23.630287170410156, "global_step": 182785, "epoch": 2202} {"train_loss": -23.8773136138916, "global_step": 182786, "epoch": 2202} {"train_loss": -23.7587890625, "global_step": 182787, "epoch": 2202} {"train_loss": -23.976932525634766, "global_step": 182788, "epoch": 2202} {"train_loss": -23.741470336914062, "global_step": 182789, "epoch": 2202} {"train_loss": -24.007722854614258, "global_step": 182790, "epoch": 2202} {"train_loss": -23.925992965698242, "global_step": 182791, "epoch": 2202} {"train_loss": -23.84333610534668, "global_step": 182792, "epoch": 2202} {"train_loss": -23.864347457885742, "global_step": 182793, "epoch": 2202} {"train_loss": -23.924894332885742, "global_step": 182794, "epoch": 2202} {"train_loss": -23.91394805908203, "global_step": 182795, "epoch": 2202} {"train_loss": -23.78177261352539, "global_step": 182796, "epoch": 2202} {"train_loss": -24.387104034423828, "global_step": 182797, "epoch": 2202} {"train_loss": -24.080474853515625, "global_step": 182798, "epoch": 2202} {"train_loss": -23.94379997253418, "global_step": 182799, "epoch": 2202} {"train_loss": -24.135766983032227, "global_step": 182800, "epoch": 2202} {"train_loss": -23.878681182861328, "global_step": 182801, "epoch": 2202} {"train_loss": -24.199838638305664, "global_step": 182802, "epoch": 2202} {"train_loss": -24.19167137145996, "global_step": 182803, "epoch": 2202} {"train_loss": -23.744033813476562, "global_step": 182804, "epoch": 2202} {"train_loss": -23.846593856811523, "global_step": 182805, "epoch": 2202} {"train_loss": -23.790119171142578, "global_step": 182806, "epoch": 2202} {"train_loss": -24.082435607910156, "global_step": 182807, "epoch": 2202} {"train_loss": -24.35329246520996, "global_step": 182808, "epoch": 2202} {"train_loss": -23.598814010620117, "global_step": 182809, "epoch": 2202} {"train_loss": -23.908376693725586, "global_step": 182810, "epoch": 2202} {"train_loss": -23.941226959228516, "global_step": 182811, "epoch": 2202} {"train_loss": -23.734495162963867, "global_step": 182812, "epoch": 2202} {"train_loss": -24.06190299987793, "global_step": 182813, "epoch": 2202} {"train_loss": -23.836294174194336, "global_step": 182814, "epoch": 2202} {"train_loss": -24.345481872558594, "global_step": 182815, "epoch": 2202} {"train_loss": -24.273473739624023, "global_step": 182816, "epoch": 2202} {"train_loss": -23.72589111328125, "global_step": 182817, "epoch": 2202} {"train_loss": -23.387826919555664, "global_step": 182818, "epoch": 2202} {"train_loss": -24.309295654296875, "global_step": 182819, "epoch": 2202} {"train_loss": -23.917417526245117, "global_step": 182820, "epoch": 2202} {"train_loss": -24.155364990234375, "global_step": 182821, "epoch": 2202} {"train_loss": -24.151121139526367, "global_step": 182822, "epoch": 2202} {"train_loss": -24.134809494018555, "global_step": 182823, "epoch": 2202} {"train_loss": -23.89751434326172, "global_step": 182824, "epoch": 2202} {"train_loss": -23.962371826171875, "global_step": 182825, "epoch": 2202} {"train_loss": -23.76020622253418, "global_step": 182826, "epoch": 2202} {"train_loss": -23.691001892089844, "global_step": 182827, "epoch": 2202} {"train_loss": -23.87138557434082, "global_step": 182828, "epoch": 2202} {"train_loss": -24.163362503051758, "global_step": 182829, "epoch": 2202} {"train_loss": -24.15223503112793, "global_step": 182830, "epoch": 2202} {"train_loss": -24.093698501586914, "global_step": 182831, "epoch": 2202} {"train_loss": -23.8897705078125, "global_step": 182832, "epoch": 2202} {"train_loss": -24.189062118530273, "global_step": 182833, "epoch": 2202} {"train_loss": -24.22469711303711, "global_step": 182834, "epoch": 2202} {"train_loss": -23.897336959838867, "global_step": 182835, "epoch": 2202} {"train_loss": -23.908782958984375, "global_step": 182836, "epoch": 2202} {"train_loss": -24.088926315307617, "global_step": 182837, "epoch": 2202} {"train_loss": -23.9344539642334, "global_step": 182838, "epoch": 2202} {"train_loss": -24.009782791137695, "global_step": 182839, "epoch": 2202} {"train_loss": -23.878385543823242, "global_step": 182840, "epoch": 2202} {"train_loss": -24.09100341796875, "global_step": 182841, "epoch": 2202} {"train_loss": -24.375669479370117, "global_step": 182842, "epoch": 2202} {"train_loss": -24.001066207885742, "global_step": 182843, "epoch": 2202} {"train_loss": -23.85259437561035, "global_step": 182844, "epoch": 2202} {"train_loss": -23.972131729125977, "global_step": 182845, "epoch": 2202} {"train_loss": -23.877511978149414, "global_step": 182846, "epoch": 2202} {"train_loss": -24.18013572692871, "global_step": 182847, "epoch": 2202} {"train_loss": -23.831616344222102, "global_step": 182848, "epoch": 2202, "val_loss": 6584537.0} {"train_loss": -23.30076789855957, "global_step": 182849, "epoch": 2203} {"train_loss": -23.038448333740234, "global_step": 182850, "epoch": 2203} {"train_loss": -23.734737396240234, "global_step": 182851, "epoch": 2203} {"train_loss": -23.52791404724121, "global_step": 182852, "epoch": 2203} {"train_loss": -22.878934860229492, "global_step": 182853, "epoch": 2203} {"train_loss": -23.716642379760742, "global_step": 182854, "epoch": 2203} {"train_loss": -23.20643424987793, "global_step": 182855, "epoch": 2203} {"train_loss": -23.444028854370117, "global_step": 182856, "epoch": 2203} {"train_loss": -23.5432186126709, "global_step": 182857, "epoch": 2203} {"train_loss": -23.697975158691406, "global_step": 182858, "epoch": 2203} {"train_loss": -23.785924911499023, "global_step": 182859, "epoch": 2203} {"train_loss": -23.376632690429688, "global_step": 182860, "epoch": 2203} {"train_loss": -23.51904296875, "global_step": 182861, "epoch": 2203} {"train_loss": -23.7574462890625, "global_step": 182862, "epoch": 2203} {"train_loss": -23.858001708984375, "global_step": 182863, "epoch": 2203} {"train_loss": -23.93165397644043, "global_step": 182864, "epoch": 2203} {"train_loss": -23.874465942382812, "global_step": 182865, "epoch": 2203} {"train_loss": -23.85345458984375, "global_step": 182866, "epoch": 2203} {"train_loss": -23.866920471191406, "global_step": 182867, "epoch": 2203} {"train_loss": -24.045276641845703, "global_step": 182868, "epoch": 2203} {"train_loss": -23.896413803100586, "global_step": 182869, "epoch": 2203} {"train_loss": -23.889774322509766, "global_step": 182870, "epoch": 2203} {"train_loss": -23.867401123046875, "global_step": 182871, "epoch": 2203} {"train_loss": -23.894420623779297, "global_step": 182872, "epoch": 2203} {"train_loss": -23.283597946166992, "global_step": 182873, "epoch": 2203} {"train_loss": -23.747812271118164, "global_step": 182874, "epoch": 2203} {"train_loss": -24.115406036376953, "global_step": 182875, "epoch": 2203} {"train_loss": -24.0933837890625, "global_step": 182876, "epoch": 2203} {"train_loss": -24.10870361328125, "global_step": 182877, "epoch": 2203} {"train_loss": -23.95331382751465, "global_step": 182878, "epoch": 2203} {"train_loss": -24.147817611694336, "global_step": 182879, "epoch": 2203} {"train_loss": -24.138402938842773, "global_step": 182880, "epoch": 2203} {"train_loss": -23.943601608276367, "global_step": 182881, "epoch": 2203} {"train_loss": -24.026159286499023, "global_step": 182882, "epoch": 2203} {"train_loss": -24.0908260345459, "global_step": 182883, "epoch": 2203} {"train_loss": -24.239381790161133, "global_step": 182884, "epoch": 2203} {"train_loss": -24.228946685791016, "global_step": 182885, "epoch": 2203} {"train_loss": -23.83823585510254, "global_step": 182886, "epoch": 2203} {"train_loss": -23.79736328125, "global_step": 182887, "epoch": 2203} {"train_loss": -24.250900268554688, "global_step": 182888, "epoch": 2203} {"train_loss": -24.02923583984375, "global_step": 182889, "epoch": 2203} {"train_loss": -23.905445098876953, "global_step": 182890, "epoch": 2203} {"train_loss": -23.811079025268555, "global_step": 182891, "epoch": 2203} {"train_loss": -24.172048568725586, "global_step": 182892, "epoch": 2203} {"train_loss": -24.04697036743164, "global_step": 182893, "epoch": 2203} {"train_loss": -24.34290885925293, "global_step": 182894, "epoch": 2203} {"train_loss": -23.791595458984375, "global_step": 182895, "epoch": 2203} {"train_loss": -24.343366622924805, "global_step": 182896, "epoch": 2203} {"train_loss": -24.04688262939453, "global_step": 182897, "epoch": 2203} {"train_loss": -23.91769790649414, "global_step": 182898, "epoch": 2203} {"train_loss": -23.79693031311035, "global_step": 182899, "epoch": 2203} {"train_loss": -24.1402530670166, "global_step": 182900, "epoch": 2203} {"train_loss": -23.709741592407227, "global_step": 182901, "epoch": 2203} {"train_loss": -24.090469360351562, "global_step": 182902, "epoch": 2203} {"train_loss": -24.265419006347656, "global_step": 182903, "epoch": 2203} {"train_loss": -24.021169662475586, "global_step": 182904, "epoch": 2203} {"train_loss": -23.666858673095703, "global_step": 182905, "epoch": 2203} {"train_loss": -23.8825626373291, "global_step": 182906, "epoch": 2203} {"train_loss": -24.1682186126709, "global_step": 182907, "epoch": 2203} {"train_loss": -23.514434814453125, "global_step": 182908, "epoch": 2203} {"train_loss": -23.82752227783203, "global_step": 182909, "epoch": 2203} {"train_loss": -23.669879913330078, "global_step": 182910, "epoch": 2203} {"train_loss": -23.617650985717773, "global_step": 182911, "epoch": 2203} {"train_loss": -23.70365333557129, "global_step": 182912, "epoch": 2203} {"train_loss": -24.068449020385742, "global_step": 182913, "epoch": 2203} {"train_loss": -24.000694274902344, "global_step": 182914, "epoch": 2203} {"train_loss": -23.882810592651367, "global_step": 182915, "epoch": 2203} {"train_loss": -24.1197509765625, "global_step": 182916, "epoch": 2203} {"train_loss": -23.833200454711914, "global_step": 182917, "epoch": 2203} {"train_loss": -23.91981315612793, "global_step": 182918, "epoch": 2203} {"train_loss": -24.23891258239746, "global_step": 182919, "epoch": 2203} {"train_loss": -24.5164794921875, "global_step": 182920, "epoch": 2203} {"train_loss": -24.05458641052246, "global_step": 182921, "epoch": 2203} {"train_loss": -24.401111602783203, "global_step": 182922, "epoch": 2203} {"train_loss": -23.824342727661133, "global_step": 182923, "epoch": 2203} {"train_loss": -24.136123657226562, "global_step": 182924, "epoch": 2203} {"train_loss": -23.8876895904541, "global_step": 182925, "epoch": 2203} {"train_loss": -24.021543502807617, "global_step": 182926, "epoch": 2203} {"train_loss": -24.295215606689453, "global_step": 182927, "epoch": 2203} {"train_loss": -23.69580078125, "global_step": 182928, "epoch": 2203} {"train_loss": -23.9212589263916, "global_step": 182929, "epoch": 2203} {"train_loss": -23.82265281677246, "global_step": 182930, "epoch": 2203} {"train_loss": -23.880761410816607, "global_step": 182931, "epoch": 2203, "val_loss": 6435514.5} {"train_loss": -23.372419357299805, "global_step": 182932, "epoch": 2204} {"train_loss": -23.909290313720703, "global_step": 182933, "epoch": 2204} {"train_loss": -23.719287872314453, "global_step": 182934, "epoch": 2204} {"train_loss": -23.718143463134766, "global_step": 182935, "epoch": 2204} {"train_loss": -22.934656143188477, "global_step": 182936, "epoch": 2204} {"train_loss": -23.56014060974121, "global_step": 182937, "epoch": 2204} {"train_loss": -23.299942016601562, "global_step": 182938, "epoch": 2204} {"train_loss": -24.00374412536621, "global_step": 182939, "epoch": 2204} {"train_loss": -23.6729793548584, "global_step": 182940, "epoch": 2204} {"train_loss": -23.181535720825195, "global_step": 182941, "epoch": 2204} {"train_loss": -23.629222869873047, "global_step": 182942, "epoch": 2204} {"train_loss": -23.53725242614746, "global_step": 182943, "epoch": 2204} {"train_loss": -23.494970321655273, "global_step": 182944, "epoch": 2204} {"train_loss": -23.614530563354492, "global_step": 182945, "epoch": 2204} {"train_loss": -23.599760055541992, "global_step": 182946, "epoch": 2204} {"train_loss": -24.341472625732422, "global_step": 182947, "epoch": 2204} {"train_loss": -23.47357177734375, "global_step": 182948, "epoch": 2204} {"train_loss": -23.99483299255371, "global_step": 182949, "epoch": 2204} {"train_loss": -23.678022384643555, "global_step": 182950, "epoch": 2204} {"train_loss": -23.904098510742188, "global_step": 182951, "epoch": 2204} {"train_loss": -23.95841407775879, "global_step": 182952, "epoch": 2204} {"train_loss": -23.6502685546875, "global_step": 182953, "epoch": 2204} {"train_loss": -23.88062858581543, "global_step": 182954, "epoch": 2204} {"train_loss": -23.632177352905273, "global_step": 182955, "epoch": 2204} {"train_loss": -23.216100692749023, "global_step": 182956, "epoch": 2204} {"train_loss": -23.981008529663086, "global_step": 182957, "epoch": 2204} {"train_loss": -24.0463809967041, "global_step": 182958, "epoch": 2204} {"train_loss": -24.28837013244629, "global_step": 182959, "epoch": 2204} {"train_loss": -23.725454330444336, "global_step": 182960, "epoch": 2204} {"train_loss": -24.06557273864746, "global_step": 182961, "epoch": 2204} {"train_loss": -23.72954559326172, "global_step": 182962, "epoch": 2204} {"train_loss": -23.869230270385742, "global_step": 182963, "epoch": 2204} {"train_loss": -24.11652374267578, "global_step": 182964, "epoch": 2204} {"train_loss": -23.608139038085938, "global_step": 182965, "epoch": 2204} {"train_loss": -24.011451721191406, "global_step": 182966, "epoch": 2204} {"train_loss": -23.7263240814209, "global_step": 182967, "epoch": 2204} {"train_loss": -23.953893661499023, "global_step": 182968, "epoch": 2204} {"train_loss": -23.768007278442383, "global_step": 182969, "epoch": 2204} {"train_loss": -24.114587783813477, "global_step": 182970, "epoch": 2204} {"train_loss": -24.062074661254883, "global_step": 182971, "epoch": 2204} {"train_loss": -23.88763999938965, "global_step": 182972, "epoch": 2204} {"train_loss": -23.7421817779541, "global_step": 182973, "epoch": 2204} {"train_loss": -24.027912139892578, "global_step": 182974, "epoch": 2204} {"train_loss": -24.06209373474121, "global_step": 182975, "epoch": 2204} {"train_loss": -24.05158805847168, "global_step": 182976, "epoch": 2204} {"train_loss": -23.687326431274414, "global_step": 182977, "epoch": 2204} {"train_loss": -24.150941848754883, "global_step": 182978, "epoch": 2204} {"train_loss": -24.048322677612305, "global_step": 182979, "epoch": 2204} {"train_loss": -24.033527374267578, "global_step": 182980, "epoch": 2204} {"train_loss": -23.932523727416992, "global_step": 182981, "epoch": 2204} {"train_loss": -24.05604362487793, "global_step": 182982, "epoch": 2204} {"train_loss": -23.977249145507812, "global_step": 182983, "epoch": 2204} {"train_loss": -24.11050033569336, "global_step": 182984, "epoch": 2204} {"train_loss": -24.084400177001953, "global_step": 182985, "epoch": 2204} {"train_loss": -23.522016525268555, "global_step": 182986, "epoch": 2204} {"train_loss": -23.476858139038086, "global_step": 182987, "epoch": 2204} {"train_loss": -23.686050415039062, "global_step": 182988, "epoch": 2204} {"train_loss": -23.78401756286621, "global_step": 182989, "epoch": 2204} {"train_loss": -23.83570671081543, "global_step": 182990, "epoch": 2204} {"train_loss": -23.907705307006836, "global_step": 182991, "epoch": 2204} {"train_loss": -24.235326766967773, "global_step": 182992, "epoch": 2204} {"train_loss": -23.890233993530273, "global_step": 182993, "epoch": 2204} {"train_loss": -24.08847999572754, "global_step": 182994, "epoch": 2204} {"train_loss": -23.98329734802246, "global_step": 182995, "epoch": 2204} {"train_loss": -24.1898136138916, "global_step": 182996, "epoch": 2204} {"train_loss": -24.174522399902344, "global_step": 182997, "epoch": 2204} {"train_loss": -23.97762107849121, "global_step": 182998, "epoch": 2204} {"train_loss": -23.870065689086914, "global_step": 182999, "epoch": 2204} {"train_loss": -24.10573959350586, "global_step": 183000, "epoch": 2204} {"train_loss": -24.197710037231445, "global_step": 183001, "epoch": 2204} {"train_loss": -24.22466468811035, "global_step": 183002, "epoch": 2204} {"train_loss": -23.686309814453125, "global_step": 183003, "epoch": 2204} {"train_loss": -23.95658302307129, "global_step": 183004, "epoch": 2204} {"train_loss": -23.931880950927734, "global_step": 183005, "epoch": 2204} {"train_loss": -24.1256046295166, "global_step": 183006, "epoch": 2204} {"train_loss": -24.094751358032227, "global_step": 183007, "epoch": 2204} {"train_loss": -23.760068893432617, "global_step": 183008, "epoch": 2204} {"train_loss": -23.854999542236328, "global_step": 183009, "epoch": 2204} {"train_loss": -24.393617630004883, "global_step": 183010, "epoch": 2204} {"train_loss": -24.305946350097656, "global_step": 183011, "epoch": 2204} {"train_loss": -24.046630859375, "global_step": 183012, "epoch": 2204} {"train_loss": -23.980443954467773, "global_step": 183013, "epoch": 2204} {"train_loss": -23.86900908688465, "global_step": 183014, "epoch": 2204, "val_loss": 6434371.0} {"train_loss": -22.715612411499023, "global_step": 183015, "epoch": 2205} {"train_loss": -21.613384246826172, "global_step": 183016, "epoch": 2205} {"train_loss": -22.6986026763916, "global_step": 183017, "epoch": 2205} {"train_loss": -23.242887496948242, "global_step": 183018, "epoch": 2205} {"train_loss": -22.684722900390625, "global_step": 183019, "epoch": 2205} {"train_loss": -23.06485366821289, "global_step": 183020, "epoch": 2205} {"train_loss": -22.86972999572754, "global_step": 183021, "epoch": 2205} {"train_loss": -22.53908348083496, "global_step": 183022, "epoch": 2205} {"train_loss": -23.697721481323242, "global_step": 183023, "epoch": 2205} {"train_loss": -22.82123374938965, "global_step": 183024, "epoch": 2205} {"train_loss": -23.43244743347168, "global_step": 183025, "epoch": 2205} {"train_loss": -23.113126754760742, "global_step": 183026, "epoch": 2205} {"train_loss": -23.24564552307129, "global_step": 183027, "epoch": 2205} {"train_loss": -23.65757942199707, "global_step": 183028, "epoch": 2205} {"train_loss": -23.72829246520996, "global_step": 183029, "epoch": 2205} {"train_loss": -23.198835372924805, "global_step": 183030, "epoch": 2205} {"train_loss": -23.616052627563477, "global_step": 183031, "epoch": 2205} {"train_loss": -23.562402725219727, "global_step": 183032, "epoch": 2205} {"train_loss": -23.293750762939453, "global_step": 183033, "epoch": 2205} {"train_loss": -23.475494384765625, "global_step": 183034, "epoch": 2205} {"train_loss": -23.229738235473633, "global_step": 183035, "epoch": 2205} {"train_loss": -23.838693618774414, "global_step": 183036, "epoch": 2205} {"train_loss": -23.635183334350586, "global_step": 183037, "epoch": 2205} {"train_loss": -23.690486907958984, "global_step": 183038, "epoch": 2205} {"train_loss": -23.510074615478516, "global_step": 183039, "epoch": 2205} {"train_loss": -23.717979431152344, "global_step": 183040, "epoch": 2205} {"train_loss": -24.004741668701172, "global_step": 183041, "epoch": 2205} {"train_loss": -23.586353302001953, "global_step": 183042, "epoch": 2205} {"train_loss": -23.845462799072266, "global_step": 183043, "epoch": 2205} {"train_loss": -23.71114158630371, "global_step": 183044, "epoch": 2205} {"train_loss": -23.855897903442383, "global_step": 183045, "epoch": 2205} {"train_loss": -24.081512451171875, "global_step": 183046, "epoch": 2205} {"train_loss": -24.06000328063965, "global_step": 183047, "epoch": 2205} {"train_loss": -24.037487030029297, "global_step": 183048, "epoch": 2205} {"train_loss": -23.97129249572754, "global_step": 183049, "epoch": 2205} {"train_loss": -23.877044677734375, "global_step": 183050, "epoch": 2205} {"train_loss": -24.04150390625, "global_step": 183051, "epoch": 2205} {"train_loss": -23.759017944335938, "global_step": 183052, "epoch": 2205} {"train_loss": -24.285139083862305, "global_step": 183053, "epoch": 2205} {"train_loss": -23.88861656188965, "global_step": 183054, "epoch": 2205} {"train_loss": -24.13313102722168, "global_step": 183055, "epoch": 2205} {"train_loss": -24.387474060058594, "global_step": 183056, "epoch": 2205} {"train_loss": -23.95084571838379, "global_step": 183057, "epoch": 2205} {"train_loss": -23.85235023498535, "global_step": 183058, "epoch": 2205} {"train_loss": -24.071340560913086, "global_step": 183059, "epoch": 2205} {"train_loss": -24.04494285583496, "global_step": 183060, "epoch": 2205} {"train_loss": -23.906360626220703, "global_step": 183061, "epoch": 2205} {"train_loss": -23.863018035888672, "global_step": 183062, "epoch": 2205} {"train_loss": -23.9084529876709, "global_step": 183063, "epoch": 2205} {"train_loss": -23.795324325561523, "global_step": 183064, "epoch": 2205} {"train_loss": -24.247386932373047, "global_step": 183065, "epoch": 2205} {"train_loss": -23.77168846130371, "global_step": 183066, "epoch": 2205} {"train_loss": -23.79559326171875, "global_step": 183067, "epoch": 2205} {"train_loss": -23.94655418395996, "global_step": 183068, "epoch": 2205} {"train_loss": -24.045446395874023, "global_step": 183069, "epoch": 2205} {"train_loss": -24.117111206054688, "global_step": 183070, "epoch": 2205} {"train_loss": -24.032278060913086, "global_step": 183071, "epoch": 2205} {"train_loss": -24.034448623657227, "global_step": 183072, "epoch": 2205} {"train_loss": -23.95906639099121, "global_step": 183073, "epoch": 2205} {"train_loss": -24.084779739379883, "global_step": 183074, "epoch": 2205} {"train_loss": -24.027523040771484, "global_step": 183075, "epoch": 2205} {"train_loss": -23.808917999267578, "global_step": 183076, "epoch": 2205} {"train_loss": -23.595094680786133, "global_step": 183077, "epoch": 2205} {"train_loss": -23.370059967041016, "global_step": 183078, "epoch": 2205} {"train_loss": -23.99251365661621, "global_step": 183079, "epoch": 2205} {"train_loss": -23.75673484802246, "global_step": 183080, "epoch": 2205} {"train_loss": -23.843515396118164, "global_step": 183081, "epoch": 2205} {"train_loss": -23.576871871948242, "global_step": 183082, "epoch": 2205} {"train_loss": -23.82185935974121, "global_step": 183083, "epoch": 2205} {"train_loss": -24.025053024291992, "global_step": 183084, "epoch": 2205} {"train_loss": -23.696130752563477, "global_step": 183085, "epoch": 2205} {"train_loss": -23.92830467224121, "global_step": 183086, "epoch": 2205} {"train_loss": -24.016477584838867, "global_step": 183087, "epoch": 2205} {"train_loss": -23.67317771911621, "global_step": 183088, "epoch": 2205} {"train_loss": -23.661516189575195, "global_step": 183089, "epoch": 2205} {"train_loss": -23.406572341918945, "global_step": 183090, "epoch": 2205} {"train_loss": -24.051223754882812, "global_step": 183091, "epoch": 2205} {"train_loss": -23.92903709411621, "global_step": 183092, "epoch": 2205} {"train_loss": -24.319873809814453, "global_step": 183093, "epoch": 2205} {"train_loss": -23.789804458618164, "global_step": 183094, "epoch": 2205} {"train_loss": -24.439294815063477, "global_step": 183095, "epoch": 2205} {"train_loss": -24.067676544189453, "global_step": 183096, "epoch": 2205} {"train_loss": -23.72635898819889, "global_step": 183097, "epoch": 2205, "val_loss": 6438645.0} {"train_loss": -23.989368438720703, "global_step": 183098, "epoch": 2206} {"train_loss": -24.102449417114258, "global_step": 183099, "epoch": 2206} {"train_loss": -23.80576515197754, "global_step": 183100, "epoch": 2206} {"train_loss": -24.026782989501953, "global_step": 183101, "epoch": 2206} {"train_loss": -23.54450225830078, "global_step": 183102, "epoch": 2206} {"train_loss": -23.98233413696289, "global_step": 183103, "epoch": 2206} {"train_loss": -23.99116325378418, "global_step": 183104, "epoch": 2206} {"train_loss": -23.925079345703125, "global_step": 183105, "epoch": 2206} {"train_loss": -23.87740707397461, "global_step": 183106, "epoch": 2206} {"train_loss": -24.11929702758789, "global_step": 183107, "epoch": 2206} {"train_loss": -23.922163009643555, "global_step": 183108, "epoch": 2206} {"train_loss": -24.22160530090332, "global_step": 183109, "epoch": 2206} {"train_loss": -23.830425262451172, "global_step": 183110, "epoch": 2206} {"train_loss": -23.97601890563965, "global_step": 183111, "epoch": 2206} {"train_loss": -24.15947914123535, "global_step": 183112, "epoch": 2206} {"train_loss": -23.77090835571289, "global_step": 183113, "epoch": 2206} {"train_loss": -24.17129898071289, "global_step": 183114, "epoch": 2206} {"train_loss": -23.885784149169922, "global_step": 183115, "epoch": 2206} {"train_loss": -23.82232093811035, "global_step": 183116, "epoch": 2206} {"train_loss": -24.15791893005371, "global_step": 183117, "epoch": 2206} {"train_loss": -23.6536865234375, "global_step": 183118, "epoch": 2206} {"train_loss": -23.801816940307617, "global_step": 183119, "epoch": 2206} {"train_loss": -24.12302017211914, "global_step": 183120, "epoch": 2206} {"train_loss": -24.210861206054688, "global_step": 183121, "epoch": 2206} {"train_loss": -24.100936889648438, "global_step": 183122, "epoch": 2206} {"train_loss": -23.892385482788086, "global_step": 183123, "epoch": 2206} {"train_loss": -23.737897872924805, "global_step": 183124, "epoch": 2206} {"train_loss": -24.142127990722656, "global_step": 183125, "epoch": 2206} {"train_loss": -24.081787109375, "global_step": 183126, "epoch": 2206} {"train_loss": -24.24236488342285, "global_step": 183127, "epoch": 2206} {"train_loss": -24.21004867553711, "global_step": 183128, "epoch": 2206} {"train_loss": -23.907520294189453, "global_step": 183129, "epoch": 2206} {"train_loss": -23.95045280456543, "global_step": 183130, "epoch": 2206} {"train_loss": -23.984113693237305, "global_step": 183131, "epoch": 2206} {"train_loss": -23.7412166595459, "global_step": 183132, "epoch": 2206} {"train_loss": -23.685821533203125, "global_step": 183133, "epoch": 2206} {"train_loss": -24.07904815673828, "global_step": 183134, "epoch": 2206} {"train_loss": -23.62599754333496, "global_step": 183135, "epoch": 2206} {"train_loss": -23.776243209838867, "global_step": 183136, "epoch": 2206} {"train_loss": -23.487241744995117, "global_step": 183137, "epoch": 2206} {"train_loss": -23.9935245513916, "global_step": 183138, "epoch": 2206} {"train_loss": -23.735891342163086, "global_step": 183139, "epoch": 2206} {"train_loss": -24.05143165588379, "global_step": 183140, "epoch": 2206} {"train_loss": -23.70724868774414, "global_step": 183141, "epoch": 2206} {"train_loss": -23.85164451599121, "global_step": 183142, "epoch": 2206} {"train_loss": -23.835369110107422, "global_step": 183143, "epoch": 2206} {"train_loss": -23.690237045288086, "global_step": 183144, "epoch": 2206} {"train_loss": -24.057706832885742, "global_step": 183145, "epoch": 2206} {"train_loss": -23.8721981048584, "global_step": 183146, "epoch": 2206} {"train_loss": -23.903921127319336, "global_step": 183147, "epoch": 2206} {"train_loss": -23.754703521728516, "global_step": 183148, "epoch": 2206} {"train_loss": -23.654447555541992, "global_step": 183149, "epoch": 2206} {"train_loss": -23.828901290893555, "global_step": 183150, "epoch": 2206} {"train_loss": -23.614465713500977, "global_step": 183151, "epoch": 2206} {"train_loss": -24.040807723999023, "global_step": 183152, "epoch": 2206} {"train_loss": -24.328750610351562, "global_step": 183153, "epoch": 2206} {"train_loss": -24.38778305053711, "global_step": 183154, "epoch": 2206} {"train_loss": -24.457128524780273, "global_step": 183155, "epoch": 2206} {"train_loss": -24.161184310913086, "global_step": 183156, "epoch": 2206} {"train_loss": -24.20546531677246, "global_step": 183157, "epoch": 2206} {"train_loss": -24.076679229736328, "global_step": 183158, "epoch": 2206} {"train_loss": -23.719791412353516, "global_step": 183159, "epoch": 2206} {"train_loss": -23.946157455444336, "global_step": 183160, "epoch": 2206} {"train_loss": -23.703550338745117, "global_step": 183161, "epoch": 2206} {"train_loss": -24.296531677246094, "global_step": 183162, "epoch": 2206} {"train_loss": -24.00507164001465, "global_step": 183163, "epoch": 2206} {"train_loss": -23.256271362304688, "global_step": 183164, "epoch": 2206} {"train_loss": -23.64687156677246, "global_step": 183165, "epoch": 2206} {"train_loss": -23.247167587280273, "global_step": 183166, "epoch": 2206} {"train_loss": -23.863449096679688, "global_step": 183167, "epoch": 2206} {"train_loss": -24.021509170532227, "global_step": 183168, "epoch": 2206} {"train_loss": -23.875341415405273, "global_step": 183169, "epoch": 2206} {"train_loss": -23.7203311920166, "global_step": 183170, "epoch": 2206} {"train_loss": -23.71307945251465, "global_step": 183171, "epoch": 2206} {"train_loss": -23.841794967651367, "global_step": 183172, "epoch": 2206} {"train_loss": -23.696945190429688, "global_step": 183173, "epoch": 2206} {"train_loss": -23.882978439331055, "global_step": 183174, "epoch": 2206} {"train_loss": -23.584558486938477, "global_step": 183175, "epoch": 2206} {"train_loss": -23.49643325805664, "global_step": 183176, "epoch": 2206} {"train_loss": -23.737354278564453, "global_step": 183177, "epoch": 2206} {"train_loss": -24.101821899414062, "global_step": 183178, "epoch": 2206} {"train_loss": -23.611316680908203, "global_step": 183179, "epoch": 2206} {"train_loss": -23.878259635833373, "global_step": 183180, "epoch": 2206, "val_loss": 6353669.0} {"train_loss": -23.091567993164062, "global_step": 183181, "epoch": 2207} {"train_loss": -23.54119300842285, "global_step": 183182, "epoch": 2207} {"train_loss": -22.676517486572266, "global_step": 183183, "epoch": 2207} {"train_loss": -23.29350471496582, "global_step": 183184, "epoch": 2207} {"train_loss": -23.22357940673828, "global_step": 183185, "epoch": 2207} {"train_loss": -23.46388053894043, "global_step": 183186, "epoch": 2207} {"train_loss": -23.191211700439453, "global_step": 183187, "epoch": 2207} {"train_loss": -23.730554580688477, "global_step": 183188, "epoch": 2207} {"train_loss": -23.491336822509766, "global_step": 183189, "epoch": 2207} {"train_loss": -23.334457397460938, "global_step": 183190, "epoch": 2207} {"train_loss": -23.475170135498047, "global_step": 183191, "epoch": 2207} {"train_loss": -23.346046447753906, "global_step": 183192, "epoch": 2207} {"train_loss": -23.993465423583984, "global_step": 183193, "epoch": 2207} {"train_loss": -23.20465087890625, "global_step": 183194, "epoch": 2207} {"train_loss": -23.799243927001953, "global_step": 183195, "epoch": 2207} {"train_loss": -23.269832611083984, "global_step": 183196, "epoch": 2207} {"train_loss": -24.034852981567383, "global_step": 183197, "epoch": 2207} {"train_loss": -23.142337799072266, "global_step": 183198, "epoch": 2207} {"train_loss": -24.03590965270996, "global_step": 183199, "epoch": 2207} {"train_loss": -23.86484718322754, "global_step": 183200, "epoch": 2207} {"train_loss": -23.750900268554688, "global_step": 183201, "epoch": 2207} {"train_loss": -24.03443717956543, "global_step": 183202, "epoch": 2207} {"train_loss": -24.179126739501953, "global_step": 183203, "epoch": 2207} {"train_loss": -23.441320419311523, "global_step": 183204, "epoch": 2207} {"train_loss": -23.714731216430664, "global_step": 183205, "epoch": 2207} {"train_loss": -24.023515701293945, "global_step": 183206, "epoch": 2207} {"train_loss": -23.848636627197266, "global_step": 183207, "epoch": 2207} {"train_loss": -23.62611198425293, "global_step": 183208, "epoch": 2207} {"train_loss": -23.660327911376953, "global_step": 183209, "epoch": 2207} {"train_loss": -23.587261199951172, "global_step": 183210, "epoch": 2207} {"train_loss": -23.770267486572266, "global_step": 183211, "epoch": 2207} {"train_loss": -24.005752563476562, "global_step": 183212, "epoch": 2207} {"train_loss": -23.923913955688477, "global_step": 183213, "epoch": 2207} {"train_loss": -24.000160217285156, "global_step": 183214, "epoch": 2207} {"train_loss": -23.839405059814453, "global_step": 183215, "epoch": 2207} {"train_loss": -23.81493377685547, "global_step": 183216, "epoch": 2207} {"train_loss": -24.11347007751465, "global_step": 183217, "epoch": 2207} {"train_loss": -23.922359466552734, "global_step": 183218, "epoch": 2207} {"train_loss": -23.843923568725586, "global_step": 183219, "epoch": 2207} {"train_loss": -23.661767959594727, "global_step": 183220, "epoch": 2207} {"train_loss": -24.268272399902344, "global_step": 183221, "epoch": 2207} {"train_loss": -23.752782821655273, "global_step": 183222, "epoch": 2207} {"train_loss": -23.812454223632812, "global_step": 183223, "epoch": 2207} {"train_loss": -24.02671241760254, "global_step": 183224, "epoch": 2207} {"train_loss": -24.023704528808594, "global_step": 183225, "epoch": 2207} {"train_loss": -23.785961151123047, "global_step": 183226, "epoch": 2207} {"train_loss": -23.945072174072266, "global_step": 183227, "epoch": 2207} {"train_loss": -23.369064331054688, "global_step": 183228, "epoch": 2207} {"train_loss": -23.96527099609375, "global_step": 183229, "epoch": 2207} {"train_loss": -23.81682014465332, "global_step": 183230, "epoch": 2207} {"train_loss": -23.755830764770508, "global_step": 183231, "epoch": 2207} {"train_loss": -24.589170455932617, "global_step": 183232, "epoch": 2207} {"train_loss": -23.780588150024414, "global_step": 183233, "epoch": 2207} {"train_loss": -24.26398277282715, "global_step": 183234, "epoch": 2207} {"train_loss": -24.137109756469727, "global_step": 183235, "epoch": 2207} {"train_loss": -23.977598190307617, "global_step": 183236, "epoch": 2207} {"train_loss": -23.907602310180664, "global_step": 183237, "epoch": 2207} {"train_loss": -23.86349868774414, "global_step": 183238, "epoch": 2207} {"train_loss": -23.73048210144043, "global_step": 183239, "epoch": 2207} {"train_loss": -24.070234298706055, "global_step": 183240, "epoch": 2207} {"train_loss": -24.088605880737305, "global_step": 183241, "epoch": 2207} {"train_loss": -24.100534439086914, "global_step": 183242, "epoch": 2207} {"train_loss": -23.753658294677734, "global_step": 183243, "epoch": 2207} {"train_loss": -23.814294815063477, "global_step": 183244, "epoch": 2207} {"train_loss": -24.221765518188477, "global_step": 183245, "epoch": 2207} {"train_loss": -23.971845626831055, "global_step": 183246, "epoch": 2207} {"train_loss": -23.410064697265625, "global_step": 183247, "epoch": 2207} {"train_loss": -24.015649795532227, "global_step": 183248, "epoch": 2207} {"train_loss": -24.099061965942383, "global_step": 183249, "epoch": 2207} {"train_loss": -23.459651947021484, "global_step": 183250, "epoch": 2207} {"train_loss": -23.30010414123535, "global_step": 183251, "epoch": 2207} {"train_loss": -24.008466720581055, "global_step": 183252, "epoch": 2207} {"train_loss": -23.804712295532227, "global_step": 183253, "epoch": 2207} {"train_loss": -23.933008193969727, "global_step": 183254, "epoch": 2207} {"train_loss": -23.809614181518555, "global_step": 183255, "epoch": 2207} {"train_loss": -23.97645378112793, "global_step": 183256, "epoch": 2207} {"train_loss": -24.089889526367188, "global_step": 183257, "epoch": 2207} {"train_loss": -24.142980575561523, "global_step": 183258, "epoch": 2207} {"train_loss": -23.700340270996094, "global_step": 183259, "epoch": 2207} {"train_loss": -23.932836532592773, "global_step": 183260, "epoch": 2207} {"train_loss": -24.142288208007812, "global_step": 183261, "epoch": 2207} {"train_loss": -23.559823989868164, "global_step": 183262, "epoch": 2207} {"train_loss": -23.780978191329773, "global_step": 183263, "epoch": 2207, "val_loss": 6448742.0} {"train_loss": -23.874404907226562, "global_step": 183264, "epoch": 2208} {"train_loss": -24.130207061767578, "global_step": 183265, "epoch": 2208} {"train_loss": -23.983001708984375, "global_step": 183266, "epoch": 2208} {"train_loss": -24.007349014282227, "global_step": 183267, "epoch": 2208} {"train_loss": -23.571151733398438, "global_step": 183268, "epoch": 2208} {"train_loss": -23.622934341430664, "global_step": 183269, "epoch": 2208} {"train_loss": -24.015554428100586, "global_step": 183270, "epoch": 2208} {"train_loss": -23.419584274291992, "global_step": 183271, "epoch": 2208} {"train_loss": -23.792348861694336, "global_step": 183272, "epoch": 2208} {"train_loss": -23.88986587524414, "global_step": 183273, "epoch": 2208} {"train_loss": -23.703784942626953, "global_step": 183274, "epoch": 2208} {"train_loss": -23.83675765991211, "global_step": 183275, "epoch": 2208} {"train_loss": -24.083362579345703, "global_step": 183276, "epoch": 2208} {"train_loss": -23.965784072875977, "global_step": 183277, "epoch": 2208} {"train_loss": -23.930479049682617, "global_step": 183278, "epoch": 2208} {"train_loss": -24.019643783569336, "global_step": 183279, "epoch": 2208} {"train_loss": -24.411367416381836, "global_step": 183280, "epoch": 2208} {"train_loss": -23.88044548034668, "global_step": 183281, "epoch": 2208} {"train_loss": -23.496625900268555, "global_step": 183282, "epoch": 2208} {"train_loss": -23.89023208618164, "global_step": 183283, "epoch": 2208} {"train_loss": -24.020124435424805, "global_step": 183284, "epoch": 2208} {"train_loss": -23.754989624023438, "global_step": 183285, "epoch": 2208} {"train_loss": -24.076459884643555, "global_step": 183286, "epoch": 2208} {"train_loss": -23.798828125, "global_step": 183287, "epoch": 2208} {"train_loss": -23.91304588317871, "global_step": 183288, "epoch": 2208} {"train_loss": -24.164785385131836, "global_step": 183289, "epoch": 2208} {"train_loss": -24.061307907104492, "global_step": 183290, "epoch": 2208} {"train_loss": -24.067981719970703, "global_step": 183291, "epoch": 2208} {"train_loss": -23.79598617553711, "global_step": 183292, "epoch": 2208} {"train_loss": -24.100366592407227, "global_step": 183293, "epoch": 2208} {"train_loss": -23.927621841430664, "global_step": 183294, "epoch": 2208} {"train_loss": -23.84833335876465, "global_step": 183295, "epoch": 2208} {"train_loss": -23.876760482788086, "global_step": 183296, "epoch": 2208} {"train_loss": -24.114887237548828, "global_step": 183297, "epoch": 2208} {"train_loss": -23.72454261779785, "global_step": 183298, "epoch": 2208} {"train_loss": -24.217430114746094, "global_step": 183299, "epoch": 2208} {"train_loss": -23.683378219604492, "global_step": 183300, "epoch": 2208} {"train_loss": -24.38875961303711, "global_step": 183301, "epoch": 2208} {"train_loss": -24.10073471069336, "global_step": 183302, "epoch": 2208} {"train_loss": -23.886991500854492, "global_step": 183303, "epoch": 2208} {"train_loss": -24.27100944519043, "global_step": 183304, "epoch": 2208} {"train_loss": -24.04469108581543, "global_step": 183305, "epoch": 2208} {"train_loss": -23.691110610961914, "global_step": 183306, "epoch": 2208} {"train_loss": -23.989389419555664, "global_step": 183307, "epoch": 2208} {"train_loss": -23.6534423828125, "global_step": 183308, "epoch": 2208} {"train_loss": -23.982236862182617, "global_step": 183309, "epoch": 2208} {"train_loss": -23.684720993041992, "global_step": 183310, "epoch": 2208} {"train_loss": -23.933897018432617, "global_step": 183311, "epoch": 2208} {"train_loss": -23.31546974182129, "global_step": 183312, "epoch": 2208} {"train_loss": -23.838930130004883, "global_step": 183313, "epoch": 2208} {"train_loss": -23.686697006225586, "global_step": 183314, "epoch": 2208} {"train_loss": -23.881406784057617, "global_step": 183315, "epoch": 2208} {"train_loss": -23.715421676635742, "global_step": 183316, "epoch": 2208} {"train_loss": -24.179458618164062, "global_step": 183317, "epoch": 2208} {"train_loss": -23.423866271972656, "global_step": 183318, "epoch": 2208} {"train_loss": -23.885671615600586, "global_step": 183319, "epoch": 2208} {"train_loss": -24.222625732421875, "global_step": 183320, "epoch": 2208} {"train_loss": -23.5731258392334, "global_step": 183321, "epoch": 2208} {"train_loss": -24.021711349487305, "global_step": 183322, "epoch": 2208} {"train_loss": -23.95186424255371, "global_step": 183323, "epoch": 2208} {"train_loss": -23.79523468017578, "global_step": 183324, "epoch": 2208} {"train_loss": -23.548294067382812, "global_step": 183325, "epoch": 2208} {"train_loss": -23.76365089416504, "global_step": 183326, "epoch": 2208} {"train_loss": -23.75465965270996, "global_step": 183327, "epoch": 2208} {"train_loss": -23.748779296875, "global_step": 183328, "epoch": 2208} {"train_loss": -23.754823684692383, "global_step": 183329, "epoch": 2208} {"train_loss": -24.14163589477539, "global_step": 183330, "epoch": 2208} {"train_loss": -24.12607192993164, "global_step": 183331, "epoch": 2208} {"train_loss": -23.92328453063965, "global_step": 183332, "epoch": 2208} {"train_loss": -23.904842376708984, "global_step": 183333, "epoch": 2208} {"train_loss": -23.8726863861084, "global_step": 183334, "epoch": 2208} {"train_loss": -23.54690170288086, "global_step": 183335, "epoch": 2208} {"train_loss": -24.16751480102539, "global_step": 183336, "epoch": 2208} {"train_loss": -23.855939865112305, "global_step": 183337, "epoch": 2208} {"train_loss": -24.0544490814209, "global_step": 183338, "epoch": 2208} {"train_loss": -23.992198944091797, "global_step": 183339, "epoch": 2208} {"train_loss": -24.12221908569336, "global_step": 183340, "epoch": 2208} {"train_loss": -23.830076217651367, "global_step": 183341, "epoch": 2208} {"train_loss": -23.450109481811523, "global_step": 183342, "epoch": 2208} {"train_loss": -23.99867057800293, "global_step": 183343, "epoch": 2208} {"train_loss": -23.998146057128906, "global_step": 183344, "epoch": 2208} {"train_loss": -23.88372802734375, "global_step": 183345, "epoch": 2208} {"train_loss": -23.87877496466579, "global_step": 183346, "epoch": 2208, "val_loss": 6610071.0} {"train_loss": -23.47890281677246, "global_step": 183347, "epoch": 2209} {"train_loss": -23.693532943725586, "global_step": 183348, "epoch": 2209} {"train_loss": -23.61899185180664, "global_step": 183349, "epoch": 2209} {"train_loss": -24.07733726501465, "global_step": 183350, "epoch": 2209} {"train_loss": -24.142240524291992, "global_step": 183351, "epoch": 2209} {"train_loss": -23.857519149780273, "global_step": 183352, "epoch": 2209} {"train_loss": -24.264318466186523, "global_step": 183353, "epoch": 2209} {"train_loss": -23.474288940429688, "global_step": 183354, "epoch": 2209} {"train_loss": -23.64961814880371, "global_step": 183355, "epoch": 2209} {"train_loss": -23.837158203125, "global_step": 183356, "epoch": 2209} {"train_loss": -24.131254196166992, "global_step": 183357, "epoch": 2209} {"train_loss": -23.081106185913086, "global_step": 183358, "epoch": 2209} {"train_loss": -23.381114959716797, "global_step": 183359, "epoch": 2209} {"train_loss": -24.039953231811523, "global_step": 183360, "epoch": 2209} {"train_loss": -23.556440353393555, "global_step": 183361, "epoch": 2209} {"train_loss": -24.11697006225586, "global_step": 183362, "epoch": 2209} {"train_loss": -24.011741638183594, "global_step": 183363, "epoch": 2209} {"train_loss": -23.863441467285156, "global_step": 183364, "epoch": 2209} {"train_loss": -24.22601890563965, "global_step": 183365, "epoch": 2209} {"train_loss": -23.553144454956055, "global_step": 183366, "epoch": 2209} {"train_loss": -23.872270584106445, "global_step": 183367, "epoch": 2209} {"train_loss": -23.738399505615234, "global_step": 183368, "epoch": 2209} {"train_loss": -23.9423885345459, "global_step": 183369, "epoch": 2209} {"train_loss": -23.88578987121582, "global_step": 183370, "epoch": 2209} {"train_loss": -24.16937828063965, "global_step": 183371, "epoch": 2209} {"train_loss": -23.799318313598633, "global_step": 183372, "epoch": 2209} {"train_loss": -24.05810546875, "global_step": 183373, "epoch": 2209} {"train_loss": -23.96082878112793, "global_step": 183374, "epoch": 2209} {"train_loss": -23.987228393554688, "global_step": 183375, "epoch": 2209} {"train_loss": -23.981882095336914, "global_step": 183376, "epoch": 2209} {"train_loss": -23.806198120117188, "global_step": 183377, "epoch": 2209} {"train_loss": -23.997488021850586, "global_step": 183378, "epoch": 2209} {"train_loss": -23.73409652709961, "global_step": 183379, "epoch": 2209} {"train_loss": -23.9874267578125, "global_step": 183380, "epoch": 2209} {"train_loss": -24.177003860473633, "global_step": 183381, "epoch": 2209} {"train_loss": -24.239896774291992, "global_step": 183382, "epoch": 2209} {"train_loss": -23.95851707458496, "global_step": 183383, "epoch": 2209} {"train_loss": -24.012542724609375, "global_step": 183384, "epoch": 2209} {"train_loss": -23.5769100189209, "global_step": 183385, "epoch": 2209} {"train_loss": -24.322158813476562, "global_step": 183386, "epoch": 2209} {"train_loss": -24.173973083496094, "global_step": 183387, "epoch": 2209} {"train_loss": -23.759456634521484, "global_step": 183388, "epoch": 2209} {"train_loss": -24.088735580444336, "global_step": 183389, "epoch": 2209} {"train_loss": -24.154956817626953, "global_step": 183390, "epoch": 2209} {"train_loss": -24.230785369873047, "global_step": 183391, "epoch": 2209} {"train_loss": -24.252660751342773, "global_step": 183392, "epoch": 2209} {"train_loss": -23.808860778808594, "global_step": 183393, "epoch": 2209} {"train_loss": -23.68123435974121, "global_step": 183394, "epoch": 2209} {"train_loss": -23.816892623901367, "global_step": 183395, "epoch": 2209} {"train_loss": -23.784584045410156, "global_step": 183396, "epoch": 2209} {"train_loss": -23.72930908203125, "global_step": 183397, "epoch": 2209} {"train_loss": -23.966203689575195, "global_step": 183398, "epoch": 2209} {"train_loss": -23.577260971069336, "global_step": 183399, "epoch": 2209} {"train_loss": -24.150327682495117, "global_step": 183400, "epoch": 2209} {"train_loss": -24.07340431213379, "global_step": 183401, "epoch": 2209} {"train_loss": -24.14716911315918, "global_step": 183402, "epoch": 2209} {"train_loss": -24.13104820251465, "global_step": 183403, "epoch": 2209} {"train_loss": -23.43122673034668, "global_step": 183404, "epoch": 2209} {"train_loss": -23.727497100830078, "global_step": 183405, "epoch": 2209} {"train_loss": -24.201297760009766, "global_step": 183406, "epoch": 2209} {"train_loss": -24.143518447875977, "global_step": 183407, "epoch": 2209} {"train_loss": -24.290353775024414, "global_step": 183408, "epoch": 2209} {"train_loss": -23.80795669555664, "global_step": 183409, "epoch": 2209} {"train_loss": -23.977426528930664, "global_step": 183410, "epoch": 2209} {"train_loss": -23.8420467376709, "global_step": 183411, "epoch": 2209} {"train_loss": -24.10187339782715, "global_step": 183412, "epoch": 2209} {"train_loss": -23.55378532409668, "global_step": 183413, "epoch": 2209} {"train_loss": -23.95913314819336, "global_step": 183414, "epoch": 2209} {"train_loss": -23.91818618774414, "global_step": 183415, "epoch": 2209} {"train_loss": -23.97909927368164, "global_step": 183416, "epoch": 2209} {"train_loss": -23.96370506286621, "global_step": 183417, "epoch": 2209} {"train_loss": -24.227060317993164, "global_step": 183418, "epoch": 2209} {"train_loss": -24.015527725219727, "global_step": 183419, "epoch": 2209} {"train_loss": -24.049802780151367, "global_step": 183420, "epoch": 2209} {"train_loss": -24.177888870239258, "global_step": 183421, "epoch": 2209} {"train_loss": -23.873098373413086, "global_step": 183422, "epoch": 2209} {"train_loss": -24.001962661743164, "global_step": 183423, "epoch": 2209} {"train_loss": -23.975234985351562, "global_step": 183424, "epoch": 2209} {"train_loss": -23.82097625732422, "global_step": 183425, "epoch": 2209} {"train_loss": -23.82098960876465, "global_step": 183426, "epoch": 2209} {"train_loss": -24.145750045776367, "global_step": 183427, "epoch": 2209} {"train_loss": -24.168928146362305, "global_step": 183428, "epoch": 2209} {"train_loss": -23.928419710641883, "global_step": 183429, "epoch": 2209, "val_loss": 6516080.0} {"train_loss": -23.396631240844727, "global_step": 183430, "epoch": 2210} {"train_loss": -23.735998153686523, "global_step": 183431, "epoch": 2210} {"train_loss": -23.936704635620117, "global_step": 183432, "epoch": 2210} {"train_loss": -23.723180770874023, "global_step": 183433, "epoch": 2210} {"train_loss": -23.664243698120117, "global_step": 183434, "epoch": 2210} {"train_loss": -23.65006446838379, "global_step": 183435, "epoch": 2210} {"train_loss": -23.54542350769043, "global_step": 183436, "epoch": 2210} {"train_loss": -23.921133041381836, "global_step": 183437, "epoch": 2210} {"train_loss": -24.03369140625, "global_step": 183438, "epoch": 2210} {"train_loss": -23.840991973876953, "global_step": 183439, "epoch": 2210} {"train_loss": -23.705097198486328, "global_step": 183440, "epoch": 2210} {"train_loss": -23.870534896850586, "global_step": 183441, "epoch": 2210} {"train_loss": -23.847599029541016, "global_step": 183442, "epoch": 2210} {"train_loss": -23.756704330444336, "global_step": 183443, "epoch": 2210} {"train_loss": -23.990198135375977, "global_step": 183444, "epoch": 2210} {"train_loss": -23.73953628540039, "global_step": 183445, "epoch": 2210} {"train_loss": -23.865713119506836, "global_step": 183446, "epoch": 2210} {"train_loss": -23.696035385131836, "global_step": 183447, "epoch": 2210} {"train_loss": -23.76513671875, "global_step": 183448, "epoch": 2210} {"train_loss": -23.8402042388916, "global_step": 183449, "epoch": 2210} {"train_loss": -24.16856575012207, "global_step": 183450, "epoch": 2210} {"train_loss": -24.10953712463379, "global_step": 183451, "epoch": 2210} {"train_loss": -23.706918716430664, "global_step": 183452, "epoch": 2210} {"train_loss": -24.252735137939453, "global_step": 183453, "epoch": 2210} {"train_loss": -24.03678321838379, "global_step": 183454, "epoch": 2210} {"train_loss": -24.059377670288086, "global_step": 183455, "epoch": 2210} {"train_loss": -24.12445831298828, "global_step": 183456, "epoch": 2210} {"train_loss": -23.779478073120117, "global_step": 183457, "epoch": 2210} {"train_loss": -23.584644317626953, "global_step": 183458, "epoch": 2210} {"train_loss": -24.10846710205078, "global_step": 183459, "epoch": 2210} {"train_loss": -24.225004196166992, "global_step": 183460, "epoch": 2210} {"train_loss": -23.560331344604492, "global_step": 183461, "epoch": 2210} {"train_loss": -23.920469284057617, "global_step": 183462, "epoch": 2210} {"train_loss": -24.1025333404541, "global_step": 183463, "epoch": 2210} {"train_loss": -24.228300094604492, "global_step": 183464, "epoch": 2210} {"train_loss": -24.55112648010254, "global_step": 183465, "epoch": 2210} {"train_loss": -23.918249130249023, "global_step": 183466, "epoch": 2210} {"train_loss": -23.876184463500977, "global_step": 183467, "epoch": 2210} {"train_loss": -23.93500328063965, "global_step": 183468, "epoch": 2210} {"train_loss": -24.036977767944336, "global_step": 183469, "epoch": 2210} {"train_loss": -24.28090476989746, "global_step": 183470, "epoch": 2210} {"train_loss": -23.835588455200195, "global_step": 183471, "epoch": 2210} {"train_loss": -24.0131893157959, "global_step": 183472, "epoch": 2210} {"train_loss": -23.489194869995117, "global_step": 183473, "epoch": 2210} {"train_loss": -23.960338592529297, "global_step": 183474, "epoch": 2210} {"train_loss": -24.102548599243164, "global_step": 183475, "epoch": 2210} {"train_loss": -24.102754592895508, "global_step": 183476, "epoch": 2210} {"train_loss": -24.333175659179688, "global_step": 183477, "epoch": 2210} {"train_loss": -23.94468116760254, "global_step": 183478, "epoch": 2210} {"train_loss": -23.752883911132812, "global_step": 183479, "epoch": 2210} {"train_loss": -23.77652359008789, "global_step": 183480, "epoch": 2210} {"train_loss": -24.253271102905273, "global_step": 183481, "epoch": 2210} {"train_loss": -24.417953491210938, "global_step": 183482, "epoch": 2210} {"train_loss": -24.400060653686523, "global_step": 183483, "epoch": 2210} {"train_loss": -24.088857650756836, "global_step": 183484, "epoch": 2210} {"train_loss": -24.034271240234375, "global_step": 183485, "epoch": 2210} {"train_loss": -24.14566421508789, "global_step": 183486, "epoch": 2210} {"train_loss": -23.69600486755371, "global_step": 183487, "epoch": 2210} {"train_loss": -24.131610870361328, "global_step": 183488, "epoch": 2210} {"train_loss": -23.964139938354492, "global_step": 183489, "epoch": 2210} {"train_loss": -23.81863784790039, "global_step": 183490, "epoch": 2210} {"train_loss": -24.203001022338867, "global_step": 183491, "epoch": 2210} {"train_loss": -24.44173240661621, "global_step": 183492, "epoch": 2210} {"train_loss": -23.98702621459961, "global_step": 183493, "epoch": 2210} {"train_loss": -24.067846298217773, "global_step": 183494, "epoch": 2210} {"train_loss": -24.252248764038086, "global_step": 183495, "epoch": 2210} {"train_loss": -24.23801040649414, "global_step": 183496, "epoch": 2210} {"train_loss": -24.074634552001953, "global_step": 183497, "epoch": 2210} {"train_loss": -24.09908103942871, "global_step": 183498, "epoch": 2210} {"train_loss": -24.00855827331543, "global_step": 183499, "epoch": 2210} {"train_loss": -24.05074119567871, "global_step": 183500, "epoch": 2210} {"train_loss": -24.234878540039062, "global_step": 183501, "epoch": 2210} {"train_loss": -23.892227172851562, "global_step": 183502, "epoch": 2210} {"train_loss": -24.397558212280273, "global_step": 183503, "epoch": 2210} {"train_loss": -23.89539337158203, "global_step": 183504, "epoch": 2210} {"train_loss": -24.183086395263672, "global_step": 183505, "epoch": 2210} {"train_loss": -23.708768844604492, "global_step": 183506, "epoch": 2210} {"train_loss": -24.111478805541992, "global_step": 183507, "epoch": 2210} {"train_loss": -24.131229400634766, "global_step": 183508, "epoch": 2210} {"train_loss": -24.106000900268555, "global_step": 183509, "epoch": 2210} {"train_loss": -23.55513572692871, "global_step": 183510, "epoch": 2210} {"train_loss": -24.086959838867188, "global_step": 183511, "epoch": 2210} {"train_loss": -23.97995891341244, "global_step": 183512, "epoch": 2210, "val_loss": 6629467.0} {"train_loss": -22.751615524291992, "global_step": 183513, "epoch": 2211} {"train_loss": -22.34100341796875, "global_step": 183514, "epoch": 2211} {"train_loss": -22.292827606201172, "global_step": 183515, "epoch": 2211} {"train_loss": -22.902692794799805, "global_step": 183516, "epoch": 2211} {"train_loss": -23.27663230895996, "global_step": 183517, "epoch": 2211} {"train_loss": -23.025842666625977, "global_step": 183518, "epoch": 2211} {"train_loss": -22.89627456665039, "global_step": 183519, "epoch": 2211} {"train_loss": -23.3156681060791, "global_step": 183520, "epoch": 2211} {"train_loss": -23.129806518554688, "global_step": 183521, "epoch": 2211} {"train_loss": -23.102720260620117, "global_step": 183522, "epoch": 2211} {"train_loss": -23.5073299407959, "global_step": 183523, "epoch": 2211} {"train_loss": -23.59459686279297, "global_step": 183524, "epoch": 2211} {"train_loss": -23.763673782348633, "global_step": 183525, "epoch": 2211} {"train_loss": -23.240575790405273, "global_step": 183526, "epoch": 2211} {"train_loss": -23.365419387817383, "global_step": 183527, "epoch": 2211} {"train_loss": -23.19768714904785, "global_step": 183528, "epoch": 2211} {"train_loss": -23.44854736328125, "global_step": 183529, "epoch": 2211} {"train_loss": -24.071470260620117, "global_step": 183530, "epoch": 2211} {"train_loss": -23.85279655456543, "global_step": 183531, "epoch": 2211} {"train_loss": -23.678251266479492, "global_step": 183532, "epoch": 2211} {"train_loss": -23.512313842773438, "global_step": 183533, "epoch": 2211} {"train_loss": -23.841699600219727, "global_step": 183534, "epoch": 2211} {"train_loss": -23.68701171875, "global_step": 183535, "epoch": 2211} {"train_loss": -23.862049102783203, "global_step": 183536, "epoch": 2211} {"train_loss": -23.857656478881836, "global_step": 183537, "epoch": 2211} {"train_loss": -23.944015502929688, "global_step": 183538, "epoch": 2211} {"train_loss": -23.576141357421875, "global_step": 183539, "epoch": 2211} {"train_loss": -23.73578643798828, "global_step": 183540, "epoch": 2211} {"train_loss": -23.846179962158203, "global_step": 183541, "epoch": 2211} {"train_loss": -23.953649520874023, "global_step": 183542, "epoch": 2211} {"train_loss": -23.9588680267334, "global_step": 183543, "epoch": 2211} {"train_loss": -23.911901473999023, "global_step": 183544, "epoch": 2211} {"train_loss": -24.304351806640625, "global_step": 183545, "epoch": 2211} {"train_loss": -23.86445426940918, "global_step": 183546, "epoch": 2211} {"train_loss": -23.68115997314453, "global_step": 183547, "epoch": 2211} {"train_loss": -23.79180908203125, "global_step": 183548, "epoch": 2211} {"train_loss": -23.875198364257812, "global_step": 183549, "epoch": 2211} {"train_loss": -23.99540138244629, "global_step": 183550, "epoch": 2211} {"train_loss": -24.005971908569336, "global_step": 183551, "epoch": 2211} {"train_loss": -23.837221145629883, "global_step": 183552, "epoch": 2211} {"train_loss": -24.442380905151367, "global_step": 183553, "epoch": 2211} {"train_loss": -24.101938247680664, "global_step": 183554, "epoch": 2211} {"train_loss": -24.10086441040039, "global_step": 183555, "epoch": 2211} {"train_loss": -24.453397750854492, "global_step": 183556, "epoch": 2211} {"train_loss": -24.500024795532227, "global_step": 183557, "epoch": 2211} {"train_loss": -24.181724548339844, "global_step": 183558, "epoch": 2211} {"train_loss": -23.92059898376465, "global_step": 183559, "epoch": 2211} {"train_loss": -24.126041412353516, "global_step": 183560, "epoch": 2211} {"train_loss": -23.977720260620117, "global_step": 183561, "epoch": 2211} {"train_loss": -24.156871795654297, "global_step": 183562, "epoch": 2211} {"train_loss": -24.19100570678711, "global_step": 183563, "epoch": 2211} {"train_loss": -24.05422019958496, "global_step": 183564, "epoch": 2211} {"train_loss": -23.961942672729492, "global_step": 183565, "epoch": 2211} {"train_loss": -24.169719696044922, "global_step": 183566, "epoch": 2211} {"train_loss": -24.30986213684082, "global_step": 183567, "epoch": 2211} {"train_loss": -23.869741439819336, "global_step": 183568, "epoch": 2211} {"train_loss": -23.620067596435547, "global_step": 183569, "epoch": 2211} {"train_loss": -23.982519149780273, "global_step": 183570, "epoch": 2211} {"train_loss": -24.21364402770996, "global_step": 183571, "epoch": 2211} {"train_loss": -23.43096351623535, "global_step": 183572, "epoch": 2211} {"train_loss": -24.06892204284668, "global_step": 183573, "epoch": 2211} {"train_loss": -23.86128044128418, "global_step": 183574, "epoch": 2211} {"train_loss": -24.080890655517578, "global_step": 183575, "epoch": 2211} {"train_loss": -23.935726165771484, "global_step": 183576, "epoch": 2211} {"train_loss": -24.108610153198242, "global_step": 183577, "epoch": 2211} {"train_loss": -23.66529655456543, "global_step": 183578, "epoch": 2211} {"train_loss": -23.943302154541016, "global_step": 183579, "epoch": 2211} {"train_loss": -24.400291442871094, "global_step": 183580, "epoch": 2211} {"train_loss": -23.979883193969727, "global_step": 183581, "epoch": 2211} {"train_loss": -23.865468978881836, "global_step": 183582, "epoch": 2211} {"train_loss": -24.002904891967773, "global_step": 183583, "epoch": 2211} {"train_loss": -24.01881980895996, "global_step": 183584, "epoch": 2211} {"train_loss": -24.066577911376953, "global_step": 183585, "epoch": 2211} {"train_loss": -23.76677894592285, "global_step": 183586, "epoch": 2211} {"train_loss": -23.973003387451172, "global_step": 183587, "epoch": 2211} {"train_loss": -23.944644927978516, "global_step": 183588, "epoch": 2211} {"train_loss": -24.17891502380371, "global_step": 183589, "epoch": 2211} {"train_loss": -23.893985748291016, "global_step": 183590, "epoch": 2211} {"train_loss": -23.67711639404297, "global_step": 183591, "epoch": 2211} {"train_loss": -24.000110626220703, "global_step": 183592, "epoch": 2211} {"train_loss": -24.418230056762695, "global_step": 183593, "epoch": 2211} {"train_loss": -24.311927795410156, "global_step": 183594, "epoch": 2211} {"train_loss": -23.811839299029614, "global_step": 183595, "epoch": 2211, "val_loss": 6543151.0} {"train_loss": -23.615283966064453, "global_step": 183596, "epoch": 2212} {"train_loss": -23.50496482849121, "global_step": 183597, "epoch": 2212} {"train_loss": -23.673871994018555, "global_step": 183598, "epoch": 2212} {"train_loss": -23.168357849121094, "global_step": 183599, "epoch": 2212} {"train_loss": -23.497772216796875, "global_step": 183600, "epoch": 2212} {"train_loss": -23.546823501586914, "global_step": 183601, "epoch": 2212} {"train_loss": -23.423337936401367, "global_step": 183602, "epoch": 2212} {"train_loss": -23.742368698120117, "global_step": 183603, "epoch": 2212} {"train_loss": -23.664936065673828, "global_step": 183604, "epoch": 2212} {"train_loss": -23.756895065307617, "global_step": 183605, "epoch": 2212} {"train_loss": -23.416372299194336, "global_step": 183606, "epoch": 2212} {"train_loss": -23.586328506469727, "global_step": 183607, "epoch": 2212} {"train_loss": -23.66905975341797, "global_step": 183608, "epoch": 2212} {"train_loss": -23.522794723510742, "global_step": 183609, "epoch": 2212} {"train_loss": -23.61384391784668, "global_step": 183610, "epoch": 2212} {"train_loss": -24.0104923248291, "global_step": 183611, "epoch": 2212} {"train_loss": -23.8350887298584, "global_step": 183612, "epoch": 2212} {"train_loss": -24.02906608581543, "global_step": 183613, "epoch": 2212} {"train_loss": -23.83699607849121, "global_step": 183614, "epoch": 2212} {"train_loss": -23.774938583374023, "global_step": 183615, "epoch": 2212} {"train_loss": -23.63457489013672, "global_step": 183616, "epoch": 2212} {"train_loss": -24.02832794189453, "global_step": 183617, "epoch": 2212} {"train_loss": -23.82649040222168, "global_step": 183618, "epoch": 2212} {"train_loss": -24.144834518432617, "global_step": 183619, "epoch": 2212} {"train_loss": -23.991979598999023, "global_step": 183620, "epoch": 2212} {"train_loss": -24.05194091796875, "global_step": 183621, "epoch": 2212} {"train_loss": -23.499923706054688, "global_step": 183622, "epoch": 2212} {"train_loss": -23.834278106689453, "global_step": 183623, "epoch": 2212} {"train_loss": -23.816965103149414, "global_step": 183624, "epoch": 2212} {"train_loss": -23.80948829650879, "global_step": 183625, "epoch": 2212} {"train_loss": -24.141019821166992, "global_step": 183626, "epoch": 2212} {"train_loss": -23.499380111694336, "global_step": 183627, "epoch": 2212} {"train_loss": -23.714780807495117, "global_step": 183628, "epoch": 2212} {"train_loss": -23.797809600830078, "global_step": 183629, "epoch": 2212} {"train_loss": -24.058353424072266, "global_step": 183630, "epoch": 2212} {"train_loss": -23.832815170288086, "global_step": 183631, "epoch": 2212} {"train_loss": -24.15215492248535, "global_step": 183632, "epoch": 2212} {"train_loss": -24.149887084960938, "global_step": 183633, "epoch": 2212} {"train_loss": -24.087568283081055, "global_step": 183634, "epoch": 2212} {"train_loss": -24.027400970458984, "global_step": 183635, "epoch": 2212} {"train_loss": -23.930492401123047, "global_step": 183636, "epoch": 2212} {"train_loss": -23.87733268737793, "global_step": 183637, "epoch": 2212} {"train_loss": -24.311342239379883, "global_step": 183638, "epoch": 2212} {"train_loss": -23.846057891845703, "global_step": 183639, "epoch": 2212} {"train_loss": -23.467500686645508, "global_step": 183640, "epoch": 2212} {"train_loss": -24.015642166137695, "global_step": 183641, "epoch": 2212} {"train_loss": -23.89832878112793, "global_step": 183642, "epoch": 2212} {"train_loss": -23.871503829956055, "global_step": 183643, "epoch": 2212} {"train_loss": -23.880910873413086, "global_step": 183644, "epoch": 2212} {"train_loss": -24.002609252929688, "global_step": 183645, "epoch": 2212} {"train_loss": -24.307600021362305, "global_step": 183646, "epoch": 2212} {"train_loss": -23.555051803588867, "global_step": 183647, "epoch": 2212} {"train_loss": -23.60899543762207, "global_step": 183648, "epoch": 2212} {"train_loss": -24.059345245361328, "global_step": 183649, "epoch": 2212} {"train_loss": -24.18720245361328, "global_step": 183650, "epoch": 2212} {"train_loss": -24.255661010742188, "global_step": 183651, "epoch": 2212} {"train_loss": -23.447853088378906, "global_step": 183652, "epoch": 2212} {"train_loss": -24.33587074279785, "global_step": 183653, "epoch": 2212} {"train_loss": -24.0041561126709, "global_step": 183654, "epoch": 2212} {"train_loss": -24.074804306030273, "global_step": 183655, "epoch": 2212} {"train_loss": -24.069746017456055, "global_step": 183656, "epoch": 2212} {"train_loss": -24.496179580688477, "global_step": 183657, "epoch": 2212} {"train_loss": -23.994606018066406, "global_step": 183658, "epoch": 2212} {"train_loss": -24.056453704833984, "global_step": 183659, "epoch": 2212} {"train_loss": -23.826358795166016, "global_step": 183660, "epoch": 2212} {"train_loss": -24.077579498291016, "global_step": 183661, "epoch": 2212} {"train_loss": -24.2834529876709, "global_step": 183662, "epoch": 2212} {"train_loss": -24.1757869720459, "global_step": 183663, "epoch": 2212} {"train_loss": -24.344472885131836, "global_step": 183664, "epoch": 2212} {"train_loss": -24.287721633911133, "global_step": 183665, "epoch": 2212} {"train_loss": -23.995716094970703, "global_step": 183666, "epoch": 2212} {"train_loss": -23.9231014251709, "global_step": 183667, "epoch": 2212} {"train_loss": -24.085447311401367, "global_step": 183668, "epoch": 2212} {"train_loss": -24.2801570892334, "global_step": 183669, "epoch": 2212} {"train_loss": -23.94559097290039, "global_step": 183670, "epoch": 2212} {"train_loss": -24.082822799682617, "global_step": 183671, "epoch": 2212} {"train_loss": -24.41493034362793, "global_step": 183672, "epoch": 2212} {"train_loss": -24.122385025024414, "global_step": 183673, "epoch": 2212} {"train_loss": -24.177379608154297, "global_step": 183674, "epoch": 2212} {"train_loss": -24.06429672241211, "global_step": 183675, "epoch": 2212} {"train_loss": -24.368274688720703, "global_step": 183676, "epoch": 2212} {"train_loss": -24.060361862182617, "global_step": 183677, "epoch": 2212} {"train_loss": -23.915784628994494, "global_step": 183678, "epoch": 2212, "val_loss": 6432243.0} {"train_loss": -23.370059967041016, "global_step": 183679, "epoch": 2213} {"train_loss": -23.485944747924805, "global_step": 183680, "epoch": 2213} {"train_loss": -23.665084838867188, "global_step": 183681, "epoch": 2213} {"train_loss": -23.430288314819336, "global_step": 183682, "epoch": 2213} {"train_loss": -23.60291290283203, "global_step": 183683, "epoch": 2213} {"train_loss": -23.409818649291992, "global_step": 183684, "epoch": 2213} {"train_loss": -23.568281173706055, "global_step": 183685, "epoch": 2213} {"train_loss": -23.815534591674805, "global_step": 183686, "epoch": 2213} {"train_loss": -23.673583984375, "global_step": 183687, "epoch": 2213} {"train_loss": -23.806726455688477, "global_step": 183688, "epoch": 2213} {"train_loss": -23.42304039001465, "global_step": 183689, "epoch": 2213} {"train_loss": -23.55013084411621, "global_step": 183690, "epoch": 2213} {"train_loss": -23.50429344177246, "global_step": 183691, "epoch": 2213} {"train_loss": -23.79656982421875, "global_step": 183692, "epoch": 2213} {"train_loss": -24.030399322509766, "global_step": 183693, "epoch": 2213} {"train_loss": -23.896488189697266, "global_step": 183694, "epoch": 2213} {"train_loss": -24.015432357788086, "global_step": 183695, "epoch": 2213} {"train_loss": -23.948148727416992, "global_step": 183696, "epoch": 2213} {"train_loss": -24.06812858581543, "global_step": 183697, "epoch": 2213} {"train_loss": -24.277917861938477, "global_step": 183698, "epoch": 2213} {"train_loss": -23.99239158630371, "global_step": 183699, "epoch": 2213} {"train_loss": -24.29158592224121, "global_step": 183700, "epoch": 2213} {"train_loss": -23.85312271118164, "global_step": 183701, "epoch": 2213} {"train_loss": -23.659162521362305, "global_step": 183702, "epoch": 2213} {"train_loss": -24.13381004333496, "global_step": 183703, "epoch": 2213} {"train_loss": -24.15719985961914, "global_step": 183704, "epoch": 2213} {"train_loss": -23.889850616455078, "global_step": 183705, "epoch": 2213} {"train_loss": -24.074838638305664, "global_step": 183706, "epoch": 2213} {"train_loss": -24.04385757446289, "global_step": 183707, "epoch": 2213} {"train_loss": -24.275047302246094, "global_step": 183708, "epoch": 2213} {"train_loss": -24.03892707824707, "global_step": 183709, "epoch": 2213} {"train_loss": -23.843881607055664, "global_step": 183710, "epoch": 2213} {"train_loss": -23.68263816833496, "global_step": 183711, "epoch": 2213} {"train_loss": -24.044904708862305, "global_step": 183712, "epoch": 2213} {"train_loss": -23.894550323486328, "global_step": 183713, "epoch": 2213} {"train_loss": -24.20998191833496, "global_step": 183714, "epoch": 2213} {"train_loss": -23.676223754882812, "global_step": 183715, "epoch": 2213} {"train_loss": -23.984853744506836, "global_step": 183716, "epoch": 2213} {"train_loss": -24.243515014648438, "global_step": 183717, "epoch": 2213} {"train_loss": -24.125268936157227, "global_step": 183718, "epoch": 2213} {"train_loss": -23.944211959838867, "global_step": 183719, "epoch": 2213} {"train_loss": -23.922040939331055, "global_step": 183720, "epoch": 2213} {"train_loss": -24.07570457458496, "global_step": 183721, "epoch": 2213} {"train_loss": -24.151655197143555, "global_step": 183722, "epoch": 2213} {"train_loss": -23.96225929260254, "global_step": 183723, "epoch": 2213} {"train_loss": -24.10343360900879, "global_step": 183724, "epoch": 2213} {"train_loss": -23.93086814880371, "global_step": 183725, "epoch": 2213} {"train_loss": -24.362659454345703, "global_step": 183726, "epoch": 2213} {"train_loss": -23.985437393188477, "global_step": 183727, "epoch": 2213} {"train_loss": -24.095439910888672, "global_step": 183728, "epoch": 2213} {"train_loss": -23.746660232543945, "global_step": 183729, "epoch": 2213} {"train_loss": -23.585250854492188, "global_step": 183730, "epoch": 2213} {"train_loss": -23.401329040527344, "global_step": 183731, "epoch": 2213} {"train_loss": -23.731704711914062, "global_step": 183732, "epoch": 2213} {"train_loss": -23.390134811401367, "global_step": 183733, "epoch": 2213} {"train_loss": -23.32889175415039, "global_step": 183734, "epoch": 2213} {"train_loss": -23.61557388305664, "global_step": 183735, "epoch": 2213} {"train_loss": -23.67551612854004, "global_step": 183736, "epoch": 2213} {"train_loss": -23.855762481689453, "global_step": 183737, "epoch": 2213} {"train_loss": -23.473052978515625, "global_step": 183738, "epoch": 2213} {"train_loss": -24.075302124023438, "global_step": 183739, "epoch": 2213} {"train_loss": -23.527408599853516, "global_step": 183740, "epoch": 2213} {"train_loss": -23.55879020690918, "global_step": 183741, "epoch": 2213} {"train_loss": -23.894010543823242, "global_step": 183742, "epoch": 2213} {"train_loss": -23.913705825805664, "global_step": 183743, "epoch": 2213} {"train_loss": -23.7838191986084, "global_step": 183744, "epoch": 2213} {"train_loss": -23.579580307006836, "global_step": 183745, "epoch": 2213} {"train_loss": -23.71760368347168, "global_step": 183746, "epoch": 2213} {"train_loss": -23.374113082885742, "global_step": 183747, "epoch": 2213} {"train_loss": -23.467496871948242, "global_step": 183748, "epoch": 2213} {"train_loss": -24.27640151977539, "global_step": 183749, "epoch": 2213} {"train_loss": -23.67597770690918, "global_step": 183750, "epoch": 2213} {"train_loss": -23.660297393798828, "global_step": 183751, "epoch": 2213} {"train_loss": -23.990814208984375, "global_step": 183752, "epoch": 2213} {"train_loss": -23.947479248046875, "global_step": 183753, "epoch": 2213} {"train_loss": -23.743818283081055, "global_step": 183754, "epoch": 2213} {"train_loss": -23.649036407470703, "global_step": 183755, "epoch": 2213} {"train_loss": -23.734769821166992, "global_step": 183756, "epoch": 2213} {"train_loss": -23.894081115722656, "global_step": 183757, "epoch": 2213} {"train_loss": -24.137744903564453, "global_step": 183758, "epoch": 2213} {"train_loss": -24.256479263305664, "global_step": 183759, "epoch": 2213} {"train_loss": -23.82328224182129, "global_step": 183760, "epoch": 2213} {"train_loss": -23.83158908981875, "global_step": 183761, "epoch": 2213, "val_loss": 6491596.0} {"train_loss": -23.78327751159668, "global_step": 183762, "epoch": 2214} {"train_loss": -23.021108627319336, "global_step": 183763, "epoch": 2214} {"train_loss": -24.299495697021484, "global_step": 183764, "epoch": 2214} {"train_loss": -23.59153938293457, "global_step": 183765, "epoch": 2214} {"train_loss": -23.678363800048828, "global_step": 183766, "epoch": 2214} {"train_loss": -23.424802780151367, "global_step": 183767, "epoch": 2214} {"train_loss": -23.67890739440918, "global_step": 183768, "epoch": 2214} {"train_loss": -23.978450775146484, "global_step": 183769, "epoch": 2214} {"train_loss": -23.798847198486328, "global_step": 183770, "epoch": 2214} {"train_loss": -24.054283142089844, "global_step": 183771, "epoch": 2214} {"train_loss": -24.042577743530273, "global_step": 183772, "epoch": 2214} {"train_loss": -23.71318817138672, "global_step": 183773, "epoch": 2214} {"train_loss": -23.91830825805664, "global_step": 183774, "epoch": 2214} {"train_loss": -23.902851104736328, "global_step": 183775, "epoch": 2214} {"train_loss": -24.00849723815918, "global_step": 183776, "epoch": 2214} {"train_loss": -24.00113296508789, "global_step": 183777, "epoch": 2214} {"train_loss": -23.6712646484375, "global_step": 183778, "epoch": 2214} {"train_loss": -24.11427879333496, "global_step": 183779, "epoch": 2214} {"train_loss": -24.331544876098633, "global_step": 183780, "epoch": 2214} {"train_loss": -24.05045509338379, "global_step": 183781, "epoch": 2214} {"train_loss": -23.756011962890625, "global_step": 183782, "epoch": 2214} {"train_loss": -23.726652145385742, "global_step": 183783, "epoch": 2214} {"train_loss": -23.586294174194336, "global_step": 183784, "epoch": 2214} {"train_loss": -24.224058151245117, "global_step": 183785, "epoch": 2214} {"train_loss": -23.797727584838867, "global_step": 183786, "epoch": 2214} {"train_loss": -24.133176803588867, "global_step": 183787, "epoch": 2214} {"train_loss": -23.95623779296875, "global_step": 183788, "epoch": 2214} {"train_loss": -23.842315673828125, "global_step": 183789, "epoch": 2214} {"train_loss": -24.047767639160156, "global_step": 183790, "epoch": 2214} {"train_loss": -23.793495178222656, "global_step": 183791, "epoch": 2214} {"train_loss": -24.0898380279541, "global_step": 183792, "epoch": 2214} {"train_loss": -23.979623794555664, "global_step": 183793, "epoch": 2214} {"train_loss": -24.00333023071289, "global_step": 183794, "epoch": 2214} {"train_loss": -24.008468627929688, "global_step": 183795, "epoch": 2214} {"train_loss": -24.088911056518555, "global_step": 183796, "epoch": 2214} {"train_loss": -24.031850814819336, "global_step": 183797, "epoch": 2214} {"train_loss": -24.343103408813477, "global_step": 183798, "epoch": 2214} {"train_loss": -24.026578903198242, "global_step": 183799, "epoch": 2214} {"train_loss": -24.123281478881836, "global_step": 183800, "epoch": 2214} {"train_loss": -24.14617156982422, "global_step": 183801, "epoch": 2214} {"train_loss": -23.862939834594727, "global_step": 183802, "epoch": 2214} {"train_loss": -24.108049392700195, "global_step": 183803, "epoch": 2214} {"train_loss": -24.31068229675293, "global_step": 183804, "epoch": 2214} {"train_loss": -24.015880584716797, "global_step": 183805, "epoch": 2214} {"train_loss": -24.17310905456543, "global_step": 183806, "epoch": 2214} {"train_loss": -23.975812911987305, "global_step": 183807, "epoch": 2214} {"train_loss": -23.961889266967773, "global_step": 183808, "epoch": 2214} {"train_loss": -24.110801696777344, "global_step": 183809, "epoch": 2214} {"train_loss": -24.337322235107422, "global_step": 183810, "epoch": 2214} {"train_loss": -24.436111450195312, "global_step": 183811, "epoch": 2214} {"train_loss": -23.782686233520508, "global_step": 183812, "epoch": 2214} {"train_loss": -24.06694221496582, "global_step": 183813, "epoch": 2214} {"train_loss": -24.076833724975586, "global_step": 183814, "epoch": 2214} {"train_loss": -24.257360458374023, "global_step": 183815, "epoch": 2214} {"train_loss": -23.77394676208496, "global_step": 183816, "epoch": 2214} {"train_loss": -24.42466163635254, "global_step": 183817, "epoch": 2214} {"train_loss": -23.922855377197266, "global_step": 183818, "epoch": 2214} {"train_loss": -23.639068603515625, "global_step": 183819, "epoch": 2214} {"train_loss": -24.06740379333496, "global_step": 183820, "epoch": 2214} {"train_loss": -23.47333526611328, "global_step": 183821, "epoch": 2214} {"train_loss": -23.56898307800293, "global_step": 183822, "epoch": 2214} {"train_loss": -24.073307037353516, "global_step": 183823, "epoch": 2214} {"train_loss": -23.763227462768555, "global_step": 183824, "epoch": 2214} {"train_loss": -24.213058471679688, "global_step": 183825, "epoch": 2214} {"train_loss": -23.91546630859375, "global_step": 183826, "epoch": 2214} {"train_loss": -24.096237182617188, "global_step": 183827, "epoch": 2214} {"train_loss": -23.81142807006836, "global_step": 183828, "epoch": 2214} {"train_loss": -23.934396743774414, "global_step": 183829, "epoch": 2214} {"train_loss": -23.983572006225586, "global_step": 183830, "epoch": 2214} {"train_loss": -23.840179443359375, "global_step": 183831, "epoch": 2214} {"train_loss": -23.909162521362305, "global_step": 183832, "epoch": 2214} {"train_loss": -24.345083236694336, "global_step": 183833, "epoch": 2214} {"train_loss": -23.81528663635254, "global_step": 183834, "epoch": 2214} {"train_loss": -23.61383819580078, "global_step": 183835, "epoch": 2214} {"train_loss": -24.199995040893555, "global_step": 183836, "epoch": 2214} {"train_loss": -23.95411491394043, "global_step": 183837, "epoch": 2214} {"train_loss": -24.17073631286621, "global_step": 183838, "epoch": 2214} {"train_loss": -24.135910034179688, "global_step": 183839, "epoch": 2214} {"train_loss": -23.523237228393555, "global_step": 183840, "epoch": 2214} {"train_loss": -23.901010513305664, "global_step": 183841, "epoch": 2214} {"train_loss": -23.942258834838867, "global_step": 183842, "epoch": 2214} {"train_loss": -23.892093658447266, "global_step": 183843, "epoch": 2214} {"train_loss": -23.94287343772061, "global_step": 183844, "epoch": 2214, "val_loss": 6568068.5} {"train_loss": -23.499855041503906, "global_step": 183845, "epoch": 2215} {"train_loss": -24.053009033203125, "global_step": 183846, "epoch": 2215} {"train_loss": -23.633686065673828, "global_step": 183847, "epoch": 2215} {"train_loss": -23.51137351989746, "global_step": 183848, "epoch": 2215} {"train_loss": -23.613052368164062, "global_step": 183849, "epoch": 2215} {"train_loss": -23.64336585998535, "global_step": 183850, "epoch": 2215} {"train_loss": -24.17363929748535, "global_step": 183851, "epoch": 2215} {"train_loss": -24.207956314086914, "global_step": 183852, "epoch": 2215} {"train_loss": -23.891611099243164, "global_step": 183853, "epoch": 2215} {"train_loss": -23.456958770751953, "global_step": 183854, "epoch": 2215} {"train_loss": -23.69295310974121, "global_step": 183855, "epoch": 2215} {"train_loss": -23.607297897338867, "global_step": 183856, "epoch": 2215} {"train_loss": -23.79434585571289, "global_step": 183857, "epoch": 2215} {"train_loss": -23.65758514404297, "global_step": 183858, "epoch": 2215} {"train_loss": -24.175256729125977, "global_step": 183859, "epoch": 2215} {"train_loss": -23.733007431030273, "global_step": 183860, "epoch": 2215} {"train_loss": -24.149646759033203, "global_step": 183861, "epoch": 2215} {"train_loss": -23.892648696899414, "global_step": 183862, "epoch": 2215} {"train_loss": -23.955839157104492, "global_step": 183863, "epoch": 2215} {"train_loss": -24.18650245666504, "global_step": 183864, "epoch": 2215} {"train_loss": -23.86090660095215, "global_step": 183865, "epoch": 2215} {"train_loss": -24.200069427490234, "global_step": 183866, "epoch": 2215} {"train_loss": -23.90281105041504, "global_step": 183867, "epoch": 2215} {"train_loss": -24.029287338256836, "global_step": 183868, "epoch": 2215} {"train_loss": -23.92995834350586, "global_step": 183869, "epoch": 2215} {"train_loss": -23.857765197753906, "global_step": 183870, "epoch": 2215} {"train_loss": -23.656766891479492, "global_step": 183871, "epoch": 2215} {"train_loss": -24.10088539123535, "global_step": 183872, "epoch": 2215} {"train_loss": -23.822189331054688, "global_step": 183873, "epoch": 2215} {"train_loss": -24.253564834594727, "global_step": 183874, "epoch": 2215} {"train_loss": -24.058752059936523, "global_step": 183875, "epoch": 2215} {"train_loss": -24.140636444091797, "global_step": 183876, "epoch": 2215} {"train_loss": -24.37156105041504, "global_step": 183877, "epoch": 2215} {"train_loss": -24.255403518676758, "global_step": 183878, "epoch": 2215} {"train_loss": -23.717361450195312, "global_step": 183879, "epoch": 2215} {"train_loss": -24.30771255493164, "global_step": 183880, "epoch": 2215} {"train_loss": -23.9636287689209, "global_step": 183881, "epoch": 2215} {"train_loss": -23.839757919311523, "global_step": 183882, "epoch": 2215} {"train_loss": -23.35172462463379, "global_step": 183883, "epoch": 2215} {"train_loss": -23.187746047973633, "global_step": 183884, "epoch": 2215} {"train_loss": -23.6590633392334, "global_step": 183885, "epoch": 2215} {"train_loss": -24.019559860229492, "global_step": 183886, "epoch": 2215} {"train_loss": -23.616376876831055, "global_step": 183887, "epoch": 2215} {"train_loss": -23.817466735839844, "global_step": 183888, "epoch": 2215} {"train_loss": -23.7583065032959, "global_step": 183889, "epoch": 2215} {"train_loss": -23.734235763549805, "global_step": 183890, "epoch": 2215} {"train_loss": -23.615434646606445, "global_step": 183891, "epoch": 2215} {"train_loss": -23.610599517822266, "global_step": 183892, "epoch": 2215} {"train_loss": -23.635244369506836, "global_step": 183893, "epoch": 2215} {"train_loss": -24.0933837890625, "global_step": 183894, "epoch": 2215} {"train_loss": -23.864410400390625, "global_step": 183895, "epoch": 2215} {"train_loss": -24.005924224853516, "global_step": 183896, "epoch": 2215} {"train_loss": -24.090566635131836, "global_step": 183897, "epoch": 2215} {"train_loss": -24.163177490234375, "global_step": 183898, "epoch": 2215} {"train_loss": -23.990659713745117, "global_step": 183899, "epoch": 2215} {"train_loss": -23.872190475463867, "global_step": 183900, "epoch": 2215} {"train_loss": -24.047348022460938, "global_step": 183901, "epoch": 2215} {"train_loss": -24.046171188354492, "global_step": 183902, "epoch": 2215} {"train_loss": -24.324491500854492, "global_step": 183903, "epoch": 2215} {"train_loss": -23.818326950073242, "global_step": 183904, "epoch": 2215} {"train_loss": -24.339534759521484, "global_step": 183905, "epoch": 2215} {"train_loss": -23.966968536376953, "global_step": 183906, "epoch": 2215} {"train_loss": -24.03057289123535, "global_step": 183907, "epoch": 2215} {"train_loss": -24.10489273071289, "global_step": 183908, "epoch": 2215} {"train_loss": -24.25452995300293, "global_step": 183909, "epoch": 2215} {"train_loss": -24.027868270874023, "global_step": 183910, "epoch": 2215} {"train_loss": -24.01508903503418, "global_step": 183911, "epoch": 2215} {"train_loss": -23.966419219970703, "global_step": 183912, "epoch": 2215} {"train_loss": -24.11567497253418, "global_step": 183913, "epoch": 2215} {"train_loss": -23.87880516052246, "global_step": 183914, "epoch": 2215} {"train_loss": -24.203977584838867, "global_step": 183915, "epoch": 2215} {"train_loss": -24.11603355407715, "global_step": 183916, "epoch": 2215} {"train_loss": -23.932003021240234, "global_step": 183917, "epoch": 2215} {"train_loss": -24.1177978515625, "global_step": 183918, "epoch": 2215} {"train_loss": -23.889883041381836, "global_step": 183919, "epoch": 2215} {"train_loss": -23.695981979370117, "global_step": 183920, "epoch": 2215} {"train_loss": -23.996057510375977, "global_step": 183921, "epoch": 2215} {"train_loss": -23.72735595703125, "global_step": 183922, "epoch": 2215} {"train_loss": -23.801774978637695, "global_step": 183923, "epoch": 2215} {"train_loss": -23.86703872680664, "global_step": 183924, "epoch": 2215} {"train_loss": -23.574636459350586, "global_step": 183925, "epoch": 2215} {"train_loss": -23.908544540405273, "global_step": 183926, "epoch": 2215} {"train_loss": -23.909447865313794, "global_step": 183927, "epoch": 2215, "val_loss": 6564943.0} {"train_loss": -23.958484649658203, "global_step": 183928, "epoch": 2216} {"train_loss": -23.938188552856445, "global_step": 183929, "epoch": 2216} {"train_loss": -23.883930206298828, "global_step": 183930, "epoch": 2216} {"train_loss": -23.901575088500977, "global_step": 183931, "epoch": 2216} {"train_loss": -23.86720848083496, "global_step": 183932, "epoch": 2216} {"train_loss": -24.02010154724121, "global_step": 183933, "epoch": 2216} {"train_loss": -23.994834899902344, "global_step": 183934, "epoch": 2216} {"train_loss": -24.229005813598633, "global_step": 183935, "epoch": 2216} {"train_loss": -23.85968589782715, "global_step": 183936, "epoch": 2216} {"train_loss": -23.978343963623047, "global_step": 183937, "epoch": 2216} {"train_loss": -24.228790283203125, "global_step": 183938, "epoch": 2216} {"train_loss": -23.921354293823242, "global_step": 183939, "epoch": 2216} {"train_loss": -23.996793746948242, "global_step": 183940, "epoch": 2216} {"train_loss": -24.28401756286621, "global_step": 183941, "epoch": 2216} {"train_loss": -23.68021011352539, "global_step": 183942, "epoch": 2216} {"train_loss": -24.03594207763672, "global_step": 183943, "epoch": 2216} {"train_loss": -24.00992774963379, "global_step": 183944, "epoch": 2216} {"train_loss": -23.643571853637695, "global_step": 183945, "epoch": 2216} {"train_loss": -23.93163299560547, "global_step": 183946, "epoch": 2216} {"train_loss": -24.01895523071289, "global_step": 183947, "epoch": 2216} {"train_loss": -24.136030197143555, "global_step": 183948, "epoch": 2216} {"train_loss": -23.736621856689453, "global_step": 183949, "epoch": 2216} {"train_loss": -23.979049682617188, "global_step": 183950, "epoch": 2216} {"train_loss": -24.20864486694336, "global_step": 183951, "epoch": 2216} {"train_loss": -23.80246925354004, "global_step": 183952, "epoch": 2216} {"train_loss": -23.998939514160156, "global_step": 183953, "epoch": 2216} {"train_loss": -24.1449031829834, "global_step": 183954, "epoch": 2216} {"train_loss": -23.75753402709961, "global_step": 183955, "epoch": 2216} {"train_loss": -23.6812744140625, "global_step": 183956, "epoch": 2216} {"train_loss": -24.3183536529541, "global_step": 183957, "epoch": 2216} {"train_loss": -23.9310245513916, "global_step": 183958, "epoch": 2216} {"train_loss": -23.51722526550293, "global_step": 183959, "epoch": 2216} {"train_loss": -23.863271713256836, "global_step": 183960, "epoch": 2216} {"train_loss": -24.1213436126709, "global_step": 183961, "epoch": 2216} {"train_loss": -23.951095581054688, "global_step": 183962, "epoch": 2216} {"train_loss": -24.17612648010254, "global_step": 183963, "epoch": 2216} {"train_loss": -24.188232421875, "global_step": 183964, "epoch": 2216} {"train_loss": -24.28317642211914, "global_step": 183965, "epoch": 2216} {"train_loss": -24.16254997253418, "global_step": 183966, "epoch": 2216} {"train_loss": -24.073627471923828, "global_step": 183967, "epoch": 2216} {"train_loss": -23.893091201782227, "global_step": 183968, "epoch": 2216} {"train_loss": -24.01846694946289, "global_step": 183969, "epoch": 2216} {"train_loss": -23.599002838134766, "global_step": 183970, "epoch": 2216} {"train_loss": -23.84354591369629, "global_step": 183971, "epoch": 2216} {"train_loss": -24.146934509277344, "global_step": 183972, "epoch": 2216} {"train_loss": -23.917938232421875, "global_step": 183973, "epoch": 2216} {"train_loss": -23.89287757873535, "global_step": 183974, "epoch": 2216} {"train_loss": -23.785202026367188, "global_step": 183975, "epoch": 2216} {"train_loss": -23.99066734313965, "global_step": 183976, "epoch": 2216} {"train_loss": -23.975181579589844, "global_step": 183977, "epoch": 2216} {"train_loss": -23.614606857299805, "global_step": 183978, "epoch": 2216} {"train_loss": -24.21241569519043, "global_step": 183979, "epoch": 2216} {"train_loss": -24.109058380126953, "global_step": 183980, "epoch": 2216} {"train_loss": -23.728086471557617, "global_step": 183981, "epoch": 2216} {"train_loss": -23.40452766418457, "global_step": 183982, "epoch": 2216} {"train_loss": -24.102317810058594, "global_step": 183983, "epoch": 2216} {"train_loss": -23.215234756469727, "global_step": 183984, "epoch": 2216} {"train_loss": -23.743528366088867, "global_step": 183985, "epoch": 2216} {"train_loss": -24.550769805908203, "global_step": 183986, "epoch": 2216} {"train_loss": -23.675355911254883, "global_step": 183987, "epoch": 2216} {"train_loss": -24.099380493164062, "global_step": 183988, "epoch": 2216} {"train_loss": -23.914716720581055, "global_step": 183989, "epoch": 2216} {"train_loss": -23.447046279907227, "global_step": 183990, "epoch": 2216} {"train_loss": -23.68802261352539, "global_step": 183991, "epoch": 2216} {"train_loss": -24.152084350585938, "global_step": 183992, "epoch": 2216} {"train_loss": -23.94173240661621, "global_step": 183993, "epoch": 2216} {"train_loss": -24.09352684020996, "global_step": 183994, "epoch": 2216} {"train_loss": -23.938026428222656, "global_step": 183995, "epoch": 2216} {"train_loss": -24.1682186126709, "global_step": 183996, "epoch": 2216} {"train_loss": -23.9945011138916, "global_step": 183997, "epoch": 2216} {"train_loss": -23.93507194519043, "global_step": 183998, "epoch": 2216} {"train_loss": -23.982707977294922, "global_step": 183999, "epoch": 2216} {"train_loss": -23.87643051147461, "global_step": 184000, "epoch": 2216} {"train_loss": -23.98040008544922, "global_step": 184001, "epoch": 2216} {"train_loss": -24.041555404663086, "global_step": 184002, "epoch": 2216} {"train_loss": -24.333505630493164, "global_step": 184003, "epoch": 2216} {"train_loss": -24.27646255493164, "global_step": 184004, "epoch": 2216} {"train_loss": -24.175397872924805, "global_step": 184005, "epoch": 2216} {"train_loss": -24.054412841796875, "global_step": 184006, "epoch": 2216} {"train_loss": -24.36600685119629, "global_step": 184007, "epoch": 2216} {"train_loss": -24.202768325805664, "global_step": 184008, "epoch": 2216} {"train_loss": -23.900907516479492, "global_step": 184009, "epoch": 2216} {"train_loss": -23.976230920079242, "global_step": 184010, "epoch": 2216, "val_loss": 6550543.5} {"train_loss": -23.001779556274414, "global_step": 184011, "epoch": 2217} {"train_loss": -23.125831604003906, "global_step": 184012, "epoch": 2217} {"train_loss": -22.901052474975586, "global_step": 184013, "epoch": 2217} {"train_loss": -22.99321937561035, "global_step": 184014, "epoch": 2217} {"train_loss": -23.06524085998535, "global_step": 184015, "epoch": 2217} {"train_loss": -23.298490524291992, "global_step": 184016, "epoch": 2217} {"train_loss": -23.345062255859375, "global_step": 184017, "epoch": 2217} {"train_loss": -23.04349708557129, "global_step": 184018, "epoch": 2217} {"train_loss": -23.304990768432617, "global_step": 184019, "epoch": 2217} {"train_loss": -23.287567138671875, "global_step": 184020, "epoch": 2217} {"train_loss": -23.3591365814209, "global_step": 184021, "epoch": 2217} {"train_loss": -23.55497932434082, "global_step": 184022, "epoch": 2217} {"train_loss": -23.212095260620117, "global_step": 184023, "epoch": 2217} {"train_loss": -23.445701599121094, "global_step": 184024, "epoch": 2217} {"train_loss": -23.582351684570312, "global_step": 184025, "epoch": 2217} {"train_loss": -23.78598403930664, "global_step": 184026, "epoch": 2217} {"train_loss": -23.703771591186523, "global_step": 184027, "epoch": 2217} {"train_loss": -23.651439666748047, "global_step": 184028, "epoch": 2217} {"train_loss": -23.41924476623535, "global_step": 184029, "epoch": 2217} {"train_loss": -23.71272087097168, "global_step": 184030, "epoch": 2217} {"train_loss": -23.369266510009766, "global_step": 184031, "epoch": 2217} {"train_loss": -23.808706283569336, "global_step": 184032, "epoch": 2217} {"train_loss": -23.822921752929688, "global_step": 184033, "epoch": 2217} {"train_loss": -23.860578536987305, "global_step": 184034, "epoch": 2217} {"train_loss": -23.71504783630371, "global_step": 184035, "epoch": 2217} {"train_loss": -23.790771484375, "global_step": 184036, "epoch": 2217} {"train_loss": -23.961719512939453, "global_step": 184037, "epoch": 2217} {"train_loss": -23.6301212310791, "global_step": 184038, "epoch": 2217} {"train_loss": -23.82307243347168, "global_step": 184039, "epoch": 2217} {"train_loss": -23.900562286376953, "global_step": 184040, "epoch": 2217} {"train_loss": -24.026803970336914, "global_step": 184041, "epoch": 2217} {"train_loss": -23.93608856201172, "global_step": 184042, "epoch": 2217} {"train_loss": -24.28570556640625, "global_step": 184043, "epoch": 2217} {"train_loss": -24.42235565185547, "global_step": 184044, "epoch": 2217} {"train_loss": -23.967254638671875, "global_step": 184045, "epoch": 2217} {"train_loss": -23.89329719543457, "global_step": 184046, "epoch": 2217} {"train_loss": -24.127668380737305, "global_step": 184047, "epoch": 2217} {"train_loss": -24.224939346313477, "global_step": 184048, "epoch": 2217} {"train_loss": -23.953149795532227, "global_step": 184049, "epoch": 2217} {"train_loss": -23.713163375854492, "global_step": 184050, "epoch": 2217} {"train_loss": -23.862646102905273, "global_step": 184051, "epoch": 2217} {"train_loss": -23.853214263916016, "global_step": 184052, "epoch": 2217} {"train_loss": -24.193634033203125, "global_step": 184053, "epoch": 2217} {"train_loss": -23.84038734436035, "global_step": 184054, "epoch": 2217} {"train_loss": -23.810895919799805, "global_step": 184055, "epoch": 2217} {"train_loss": -24.2963924407959, "global_step": 184056, "epoch": 2217} {"train_loss": -23.76087760925293, "global_step": 184057, "epoch": 2217} {"train_loss": -24.135635375976562, "global_step": 184058, "epoch": 2217} {"train_loss": -24.343826293945312, "global_step": 184059, "epoch": 2217} {"train_loss": -24.350391387939453, "global_step": 184060, "epoch": 2217} {"train_loss": -24.027423858642578, "global_step": 184061, "epoch": 2217} {"train_loss": -24.283287048339844, "global_step": 184062, "epoch": 2217} {"train_loss": -23.768848419189453, "global_step": 184063, "epoch": 2217} {"train_loss": -24.130714416503906, "global_step": 184064, "epoch": 2217} {"train_loss": -24.24976921081543, "global_step": 184065, "epoch": 2217} {"train_loss": -24.429128646850586, "global_step": 184066, "epoch": 2217} {"train_loss": -23.99915885925293, "global_step": 184067, "epoch": 2217} {"train_loss": -23.864513397216797, "global_step": 184068, "epoch": 2217} {"train_loss": -23.870817184448242, "global_step": 184069, "epoch": 2217} {"train_loss": -23.9021053314209, "global_step": 184070, "epoch": 2217} {"train_loss": -23.85523223876953, "global_step": 184071, "epoch": 2217} {"train_loss": -23.787660598754883, "global_step": 184072, "epoch": 2217} {"train_loss": -23.89296531677246, "global_step": 184073, "epoch": 2217} {"train_loss": -23.97342872619629, "global_step": 184074, "epoch": 2217} {"train_loss": -23.64613914489746, "global_step": 184075, "epoch": 2217} {"train_loss": -24.049165725708008, "global_step": 184076, "epoch": 2217} {"train_loss": -23.806982040405273, "global_step": 184077, "epoch": 2217} {"train_loss": -24.064380645751953, "global_step": 184078, "epoch": 2217} {"train_loss": -24.210412979125977, "global_step": 184079, "epoch": 2217} {"train_loss": -23.672292709350586, "global_step": 184080, "epoch": 2217} {"train_loss": -24.104211807250977, "global_step": 184081, "epoch": 2217} {"train_loss": -23.947904586791992, "global_step": 184082, "epoch": 2217} {"train_loss": -24.15863037109375, "global_step": 184083, "epoch": 2217} {"train_loss": -24.092824935913086, "global_step": 184084, "epoch": 2217} {"train_loss": -24.172042846679688, "global_step": 184085, "epoch": 2217} {"train_loss": -24.09285545349121, "global_step": 184086, "epoch": 2217} {"train_loss": -23.753803253173828, "global_step": 184087, "epoch": 2217} {"train_loss": -24.285913467407227, "global_step": 184088, "epoch": 2217} {"train_loss": -23.81978988647461, "global_step": 184089, "epoch": 2217} {"train_loss": -23.5455379486084, "global_step": 184090, "epoch": 2217} {"train_loss": -23.861997604370117, "global_step": 184091, "epoch": 2217} {"train_loss": -24.133502960205078, "global_step": 184092, "epoch": 2217} {"train_loss": -23.830154372985106, "global_step": 184093, "epoch": 2217, "val_loss": 6616853.0} {"train_loss": -23.928407669067383, "global_step": 184094, "epoch": 2218} {"train_loss": -23.313404083251953, "global_step": 184095, "epoch": 2218} {"train_loss": -23.341659545898438, "global_step": 184096, "epoch": 2218} {"train_loss": -23.187116622924805, "global_step": 184097, "epoch": 2218} {"train_loss": -23.00088882446289, "global_step": 184098, "epoch": 2218} {"train_loss": -23.657398223876953, "global_step": 184099, "epoch": 2218} {"train_loss": -23.703004837036133, "global_step": 184100, "epoch": 2218} {"train_loss": -23.2989559173584, "global_step": 184101, "epoch": 2218} {"train_loss": -23.81685447692871, "global_step": 184102, "epoch": 2218} {"train_loss": -23.561731338500977, "global_step": 184103, "epoch": 2218} {"train_loss": -23.50590705871582, "global_step": 184104, "epoch": 2218} {"train_loss": -24.159168243408203, "global_step": 184105, "epoch": 2218} {"train_loss": -23.49979591369629, "global_step": 184106, "epoch": 2218} {"train_loss": -23.915842056274414, "global_step": 184107, "epoch": 2218} {"train_loss": -23.905078887939453, "global_step": 184108, "epoch": 2218} {"train_loss": -23.777816772460938, "global_step": 184109, "epoch": 2218} {"train_loss": -23.63075065612793, "global_step": 184110, "epoch": 2218} {"train_loss": -23.87758445739746, "global_step": 184111, "epoch": 2218} {"train_loss": -23.786239624023438, "global_step": 184112, "epoch": 2218} {"train_loss": -23.57554054260254, "global_step": 184113, "epoch": 2218} {"train_loss": -24.154478073120117, "global_step": 184114, "epoch": 2218} {"train_loss": -24.19559669494629, "global_step": 184115, "epoch": 2218} {"train_loss": -24.18968963623047, "global_step": 184116, "epoch": 2218} {"train_loss": -23.79574966430664, "global_step": 184117, "epoch": 2218} {"train_loss": -23.86427879333496, "global_step": 184118, "epoch": 2218} {"train_loss": -23.98552703857422, "global_step": 184119, "epoch": 2218} {"train_loss": -23.881311416625977, "global_step": 184120, "epoch": 2218} {"train_loss": -24.086181640625, "global_step": 184121, "epoch": 2218} {"train_loss": -23.726057052612305, "global_step": 184122, "epoch": 2218} {"train_loss": -23.988107681274414, "global_step": 184123, "epoch": 2218} {"train_loss": -23.788667678833008, "global_step": 184124, "epoch": 2218} {"train_loss": -24.291906356811523, "global_step": 184125, "epoch": 2218} {"train_loss": -24.073755264282227, "global_step": 184126, "epoch": 2218} {"train_loss": -23.742433547973633, "global_step": 184127, "epoch": 2218} {"train_loss": -24.129484176635742, "global_step": 184128, "epoch": 2218} {"train_loss": -24.1036376953125, "global_step": 184129, "epoch": 2218} {"train_loss": -23.932998657226562, "global_step": 184130, "epoch": 2218} {"train_loss": -24.309314727783203, "global_step": 184131, "epoch": 2218} {"train_loss": -24.01410484313965, "global_step": 184132, "epoch": 2218} {"train_loss": -24.000181198120117, "global_step": 184133, "epoch": 2218} {"train_loss": -23.89594841003418, "global_step": 184134, "epoch": 2218} {"train_loss": -23.96962547302246, "global_step": 184135, "epoch": 2218} {"train_loss": -24.18942642211914, "global_step": 184136, "epoch": 2218} {"train_loss": -23.996662139892578, "global_step": 184137, "epoch": 2218} {"train_loss": -24.542776107788086, "global_step": 184138, "epoch": 2218} {"train_loss": -24.007665634155273, "global_step": 184139, "epoch": 2218} {"train_loss": -23.32639503479004, "global_step": 184140, "epoch": 2218} {"train_loss": -23.62285614013672, "global_step": 184141, "epoch": 2218} {"train_loss": -23.67698097229004, "global_step": 184142, "epoch": 2218} {"train_loss": -24.069271087646484, "global_step": 184143, "epoch": 2218} {"train_loss": -24.249570846557617, "global_step": 184144, "epoch": 2218} {"train_loss": -23.92620277404785, "global_step": 184145, "epoch": 2218} {"train_loss": -23.441654205322266, "global_step": 184146, "epoch": 2218} {"train_loss": -23.772350311279297, "global_step": 184147, "epoch": 2218} {"train_loss": -23.870573043823242, "global_step": 184148, "epoch": 2218} {"train_loss": -23.932363510131836, "global_step": 184149, "epoch": 2218} {"train_loss": -24.16067123413086, "global_step": 184150, "epoch": 2218} {"train_loss": -24.00668716430664, "global_step": 184151, "epoch": 2218} {"train_loss": -24.420852661132812, "global_step": 184152, "epoch": 2218} {"train_loss": -23.790382385253906, "global_step": 184153, "epoch": 2218} {"train_loss": -23.941526412963867, "global_step": 184154, "epoch": 2218} {"train_loss": -23.718368530273438, "global_step": 184155, "epoch": 2218} {"train_loss": -23.664350509643555, "global_step": 184156, "epoch": 2218} {"train_loss": -24.081541061401367, "global_step": 184157, "epoch": 2218} {"train_loss": -24.193649291992188, "global_step": 184158, "epoch": 2218} {"train_loss": -24.1612606048584, "global_step": 184159, "epoch": 2218} {"train_loss": -24.0919132232666, "global_step": 184160, "epoch": 2218} {"train_loss": -23.960187911987305, "global_step": 184161, "epoch": 2218} {"train_loss": -24.01841163635254, "global_step": 184162, "epoch": 2218} {"train_loss": -24.098987579345703, "global_step": 184163, "epoch": 2218} {"train_loss": -23.835779190063477, "global_step": 184164, "epoch": 2218} {"train_loss": -23.70157814025879, "global_step": 184165, "epoch": 2218} {"train_loss": -23.768829345703125, "global_step": 184166, "epoch": 2218} {"train_loss": -23.552663803100586, "global_step": 184167, "epoch": 2218} {"train_loss": -24.185121536254883, "global_step": 184168, "epoch": 2218} {"train_loss": -23.907825469970703, "global_step": 184169, "epoch": 2218} {"train_loss": -24.19745445251465, "global_step": 184170, "epoch": 2218} {"train_loss": -23.78724479675293, "global_step": 184171, "epoch": 2218} {"train_loss": -24.495996475219727, "global_step": 184172, "epoch": 2218} {"train_loss": -23.900678634643555, "global_step": 184173, "epoch": 2218} {"train_loss": -23.545087814331055, "global_step": 184174, "epoch": 2218} {"train_loss": -24.279829025268555, "global_step": 184175, "epoch": 2218} {"train_loss": -23.878788844648614, "global_step": 184176, "epoch": 2218, "val_loss": 6474548.5} {"train_loss": -23.47714614868164, "global_step": 184177, "epoch": 2219} {"train_loss": -23.594970703125, "global_step": 184178, "epoch": 2219} {"train_loss": -23.71425437927246, "global_step": 184179, "epoch": 2219} {"train_loss": -23.769676208496094, "global_step": 184180, "epoch": 2219} {"train_loss": -23.531997680664062, "global_step": 184181, "epoch": 2219} {"train_loss": -24.062429428100586, "global_step": 184182, "epoch": 2219} {"train_loss": -23.606372833251953, "global_step": 184183, "epoch": 2219} {"train_loss": -23.7840633392334, "global_step": 184184, "epoch": 2219} {"train_loss": -23.619531631469727, "global_step": 184185, "epoch": 2219} {"train_loss": -23.55476188659668, "global_step": 184186, "epoch": 2219} {"train_loss": -23.903982162475586, "global_step": 184187, "epoch": 2219} {"train_loss": -23.97208023071289, "global_step": 184188, "epoch": 2219} {"train_loss": -23.8745174407959, "global_step": 184189, "epoch": 2219} {"train_loss": -23.589767456054688, "global_step": 184190, "epoch": 2219} {"train_loss": -24.034997940063477, "global_step": 184191, "epoch": 2219} {"train_loss": -23.707855224609375, "global_step": 184192, "epoch": 2219} {"train_loss": -23.814743041992188, "global_step": 184193, "epoch": 2219} {"train_loss": -24.255218505859375, "global_step": 184194, "epoch": 2219} {"train_loss": -23.60662269592285, "global_step": 184195, "epoch": 2219} {"train_loss": -24.322900772094727, "global_step": 184196, "epoch": 2219} {"train_loss": -24.181394577026367, "global_step": 184197, "epoch": 2219} {"train_loss": -23.98194122314453, "global_step": 184198, "epoch": 2219} {"train_loss": -24.311071395874023, "global_step": 184199, "epoch": 2219} {"train_loss": -24.295345306396484, "global_step": 184200, "epoch": 2219} {"train_loss": -23.579938888549805, "global_step": 184201, "epoch": 2219} {"train_loss": -24.08030128479004, "global_step": 184202, "epoch": 2219} {"train_loss": -23.675796508789062, "global_step": 184203, "epoch": 2219} {"train_loss": -24.326993942260742, "global_step": 184204, "epoch": 2219} {"train_loss": -23.987226486206055, "global_step": 184205, "epoch": 2219} {"train_loss": -24.267780303955078, "global_step": 184206, "epoch": 2219} {"train_loss": -23.930299758911133, "global_step": 184207, "epoch": 2219} {"train_loss": -24.007293701171875, "global_step": 184208, "epoch": 2219} {"train_loss": -24.02907371520996, "global_step": 184209, "epoch": 2219} {"train_loss": -24.030954360961914, "global_step": 184210, "epoch": 2219} {"train_loss": -23.71733283996582, "global_step": 184211, "epoch": 2219} {"train_loss": -24.149927139282227, "global_step": 184212, "epoch": 2219} {"train_loss": -24.008541107177734, "global_step": 184213, "epoch": 2219} {"train_loss": -23.95612907409668, "global_step": 184214, "epoch": 2219} {"train_loss": -23.18319320678711, "global_step": 184215, "epoch": 2219} {"train_loss": -23.77806282043457, "global_step": 184216, "epoch": 2219} {"train_loss": -23.898040771484375, "global_step": 184217, "epoch": 2219} {"train_loss": -23.711210250854492, "global_step": 184218, "epoch": 2219} {"train_loss": -23.592254638671875, "global_step": 184219, "epoch": 2219} {"train_loss": -23.931699752807617, "global_step": 184220, "epoch": 2219} {"train_loss": -24.41762351989746, "global_step": 184221, "epoch": 2219} {"train_loss": -23.92840576171875, "global_step": 184222, "epoch": 2219} {"train_loss": -23.9129638671875, "global_step": 184223, "epoch": 2219} {"train_loss": -24.053037643432617, "global_step": 184224, "epoch": 2219} {"train_loss": -24.065868377685547, "global_step": 184225, "epoch": 2219} {"train_loss": -23.39168357849121, "global_step": 184226, "epoch": 2219} {"train_loss": -23.655521392822266, "global_step": 184227, "epoch": 2219} {"train_loss": -23.860660552978516, "global_step": 184228, "epoch": 2219} {"train_loss": -23.617368698120117, "global_step": 184229, "epoch": 2219} {"train_loss": -23.823627471923828, "global_step": 184230, "epoch": 2219} {"train_loss": -24.281339645385742, "global_step": 184231, "epoch": 2219} {"train_loss": -23.737051010131836, "global_step": 184232, "epoch": 2219} {"train_loss": -23.94840431213379, "global_step": 184233, "epoch": 2219} {"train_loss": -24.00140380859375, "global_step": 184234, "epoch": 2219} {"train_loss": -23.90333366394043, "global_step": 184235, "epoch": 2219} {"train_loss": -23.7377872467041, "global_step": 184236, "epoch": 2219} {"train_loss": -23.619970321655273, "global_step": 184237, "epoch": 2219} {"train_loss": -24.38612174987793, "global_step": 184238, "epoch": 2219} {"train_loss": -23.94295310974121, "global_step": 184239, "epoch": 2219} {"train_loss": -23.990467071533203, "global_step": 184240, "epoch": 2219} {"train_loss": -24.173452377319336, "global_step": 184241, "epoch": 2219} {"train_loss": -24.409460067749023, "global_step": 184242, "epoch": 2219} {"train_loss": -23.502609252929688, "global_step": 184243, "epoch": 2219} {"train_loss": -24.27243423461914, "global_step": 184244, "epoch": 2219} {"train_loss": -23.752182006835938, "global_step": 184245, "epoch": 2219} {"train_loss": -23.723474502563477, "global_step": 184246, "epoch": 2219} {"train_loss": -24.03389549255371, "global_step": 184247, "epoch": 2219} {"train_loss": -24.020246505737305, "global_step": 184248, "epoch": 2219} {"train_loss": -23.868223190307617, "global_step": 184249, "epoch": 2219} {"train_loss": -24.234432220458984, "global_step": 184250, "epoch": 2219} {"train_loss": -23.994548797607422, "global_step": 184251, "epoch": 2219} {"train_loss": -24.102231979370117, "global_step": 184252, "epoch": 2219} {"train_loss": -23.34638786315918, "global_step": 184253, "epoch": 2219} {"train_loss": -23.89807891845703, "global_step": 184254, "epoch": 2219} {"train_loss": -23.955400466918945, "global_step": 184255, "epoch": 2219} {"train_loss": -23.988019943237305, "global_step": 184256, "epoch": 2219} {"train_loss": -23.749181747436523, "global_step": 184257, "epoch": 2219} {"train_loss": -24.023120880126953, "global_step": 184258, "epoch": 2219} {"train_loss": -23.894337964345173, "global_step": 184259, "epoch": 2219, "val_loss": 6634073.0} {"train_loss": -23.255151748657227, "global_step": 184260, "epoch": 2220} {"train_loss": -23.561080932617188, "global_step": 184261, "epoch": 2220} {"train_loss": -23.5882511138916, "global_step": 184262, "epoch": 2220} {"train_loss": -23.555194854736328, "global_step": 184263, "epoch": 2220} {"train_loss": -23.468353271484375, "global_step": 184264, "epoch": 2220} {"train_loss": -23.154722213745117, "global_step": 184265, "epoch": 2220} {"train_loss": -24.124258041381836, "global_step": 184266, "epoch": 2220} {"train_loss": -23.273380279541016, "global_step": 184267, "epoch": 2220} {"train_loss": -23.243093490600586, "global_step": 184268, "epoch": 2220} {"train_loss": -23.64656639099121, "global_step": 184269, "epoch": 2220} {"train_loss": -23.32293128967285, "global_step": 184270, "epoch": 2220} {"train_loss": -23.583322525024414, "global_step": 184271, "epoch": 2220} {"train_loss": -23.8240966796875, "global_step": 184272, "epoch": 2220} {"train_loss": -23.28876495361328, "global_step": 184273, "epoch": 2220} {"train_loss": -23.692996978759766, "global_step": 184274, "epoch": 2220} {"train_loss": -24.176584243774414, "global_step": 184275, "epoch": 2220} {"train_loss": -23.685962677001953, "global_step": 184276, "epoch": 2220} {"train_loss": -23.52923011779785, "global_step": 184277, "epoch": 2220} {"train_loss": -23.612335205078125, "global_step": 184278, "epoch": 2220} {"train_loss": -23.613340377807617, "global_step": 184279, "epoch": 2220} {"train_loss": -23.72433090209961, "global_step": 184280, "epoch": 2220} {"train_loss": -23.50812339782715, "global_step": 184281, "epoch": 2220} {"train_loss": -23.919137954711914, "global_step": 184282, "epoch": 2220} {"train_loss": -23.666372299194336, "global_step": 184283, "epoch": 2220} {"train_loss": -23.70969581604004, "global_step": 184284, "epoch": 2220} {"train_loss": -23.944780349731445, "global_step": 184285, "epoch": 2220} {"train_loss": -23.94148826599121, "global_step": 184286, "epoch": 2220} {"train_loss": -23.989347457885742, "global_step": 184287, "epoch": 2220} {"train_loss": -23.723388671875, "global_step": 184288, "epoch": 2220} {"train_loss": -23.874664306640625, "global_step": 184289, "epoch": 2220} {"train_loss": -23.838281631469727, "global_step": 184290, "epoch": 2220} {"train_loss": -24.06429100036621, "global_step": 184291, "epoch": 2220} {"train_loss": -23.729637145996094, "global_step": 184292, "epoch": 2220} {"train_loss": -24.311674118041992, "global_step": 184293, "epoch": 2220} {"train_loss": -24.33020782470703, "global_step": 184294, "epoch": 2220} {"train_loss": -24.07529067993164, "global_step": 184295, "epoch": 2220} {"train_loss": -23.873022079467773, "global_step": 184296, "epoch": 2220} {"train_loss": -23.70144271850586, "global_step": 184297, "epoch": 2220} {"train_loss": -23.9460506439209, "global_step": 184298, "epoch": 2220} {"train_loss": -24.051258087158203, "global_step": 184299, "epoch": 2220} {"train_loss": -24.485397338867188, "global_step": 184300, "epoch": 2220} {"train_loss": -23.861265182495117, "global_step": 184301, "epoch": 2220} {"train_loss": -23.830102920532227, "global_step": 184302, "epoch": 2220} {"train_loss": -24.21232032775879, "global_step": 184303, "epoch": 2220} {"train_loss": -24.084409713745117, "global_step": 184304, "epoch": 2220} {"train_loss": -23.822101593017578, "global_step": 184305, "epoch": 2220} {"train_loss": -24.049909591674805, "global_step": 184306, "epoch": 2220} {"train_loss": -24.087289810180664, "global_step": 184307, "epoch": 2220} {"train_loss": -23.87821388244629, "global_step": 184308, "epoch": 2220} {"train_loss": -24.176023483276367, "global_step": 184309, "epoch": 2220} {"train_loss": -24.246719360351562, "global_step": 184310, "epoch": 2220} {"train_loss": -23.680753707885742, "global_step": 184311, "epoch": 2220} {"train_loss": -23.949071884155273, "global_step": 184312, "epoch": 2220} {"train_loss": -24.27829933166504, "global_step": 184313, "epoch": 2220} {"train_loss": -24.114212036132812, "global_step": 184314, "epoch": 2220} {"train_loss": -23.762332916259766, "global_step": 184315, "epoch": 2220} {"train_loss": -23.665332794189453, "global_step": 184316, "epoch": 2220} {"train_loss": -23.85854721069336, "global_step": 184317, "epoch": 2220} {"train_loss": -24.189218521118164, "global_step": 184318, "epoch": 2220} {"train_loss": -23.820280075073242, "global_step": 184319, "epoch": 2220} {"train_loss": -24.19670867919922, "global_step": 184320, "epoch": 2220} {"train_loss": -24.073997497558594, "global_step": 184321, "epoch": 2220} {"train_loss": -24.123090744018555, "global_step": 184322, "epoch": 2220} {"train_loss": -23.943103790283203, "global_step": 184323, "epoch": 2220} {"train_loss": -23.840606689453125, "global_step": 184324, "epoch": 2220} {"train_loss": -24.2356014251709, "global_step": 184325, "epoch": 2220} {"train_loss": -24.246702194213867, "global_step": 184326, "epoch": 2220} {"train_loss": -24.5357723236084, "global_step": 184327, "epoch": 2220} {"train_loss": -24.20577049255371, "global_step": 184328, "epoch": 2220} {"train_loss": -24.40201759338379, "global_step": 184329, "epoch": 2220} {"train_loss": -24.30225944519043, "global_step": 184330, "epoch": 2220} {"train_loss": -24.20136833190918, "global_step": 184331, "epoch": 2220} {"train_loss": -24.604907989501953, "global_step": 184332, "epoch": 2220} {"train_loss": -24.130172729492188, "global_step": 184333, "epoch": 2220} {"train_loss": -24.008333206176758, "global_step": 184334, "epoch": 2220} {"train_loss": -24.17144775390625, "global_step": 184335, "epoch": 2220} {"train_loss": -24.080204010009766, "global_step": 184336, "epoch": 2220} {"train_loss": -24.05996322631836, "global_step": 184337, "epoch": 2220} {"train_loss": -24.309404373168945, "global_step": 184338, "epoch": 2220} {"train_loss": -24.050146102905273, "global_step": 184339, "epoch": 2220} {"train_loss": -24.259031295776367, "global_step": 184340, "epoch": 2220} {"train_loss": -24.284603118896484, "global_step": 184341, "epoch": 2220} {"train_loss": -23.93111125532403, "global_step": 184342, "epoch": 2220, "val_loss": 6584515.5} {"train_loss": -23.950769424438477, "global_step": 184343, "epoch": 2221} {"train_loss": -23.405643463134766, "global_step": 184344, "epoch": 2221} {"train_loss": -23.3923282623291, "global_step": 184345, "epoch": 2221} {"train_loss": -23.82332992553711, "global_step": 184346, "epoch": 2221} {"train_loss": -23.623884201049805, "global_step": 184347, "epoch": 2221} {"train_loss": -24.012611389160156, "global_step": 184348, "epoch": 2221} {"train_loss": -23.584333419799805, "global_step": 184349, "epoch": 2221} {"train_loss": -23.927968978881836, "global_step": 184350, "epoch": 2221} {"train_loss": -23.658174514770508, "global_step": 184351, "epoch": 2221} {"train_loss": -24.203840255737305, "global_step": 184352, "epoch": 2221} {"train_loss": -23.733869552612305, "global_step": 184353, "epoch": 2221} {"train_loss": -23.708267211914062, "global_step": 184354, "epoch": 2221} {"train_loss": -24.114913940429688, "global_step": 184355, "epoch": 2221} {"train_loss": -23.727567672729492, "global_step": 184356, "epoch": 2221} {"train_loss": -23.932790756225586, "global_step": 184357, "epoch": 2221} {"train_loss": -23.602537155151367, "global_step": 184358, "epoch": 2221} {"train_loss": -23.997295379638672, "global_step": 184359, "epoch": 2221} {"train_loss": -23.78864860534668, "global_step": 184360, "epoch": 2221} {"train_loss": -23.899751663208008, "global_step": 184361, "epoch": 2221} {"train_loss": -23.669132232666016, "global_step": 184362, "epoch": 2221} {"train_loss": -24.009550094604492, "global_step": 184363, "epoch": 2221} {"train_loss": -23.82880973815918, "global_step": 184364, "epoch": 2221} {"train_loss": -23.90738868713379, "global_step": 184365, "epoch": 2221} {"train_loss": -24.567472457885742, "global_step": 184366, "epoch": 2221} {"train_loss": -23.729413986206055, "global_step": 184367, "epoch": 2221} {"train_loss": -23.842214584350586, "global_step": 184368, "epoch": 2221} {"train_loss": -23.994924545288086, "global_step": 184369, "epoch": 2221} {"train_loss": -23.94809341430664, "global_step": 184370, "epoch": 2221} {"train_loss": -23.910064697265625, "global_step": 184371, "epoch": 2221} {"train_loss": -24.028263092041016, "global_step": 184372, "epoch": 2221} {"train_loss": -23.8674259185791, "global_step": 184373, "epoch": 2221} {"train_loss": -23.914525985717773, "global_step": 184374, "epoch": 2221} {"train_loss": -23.975526809692383, "global_step": 184375, "epoch": 2221} {"train_loss": -23.991764068603516, "global_step": 184376, "epoch": 2221} {"train_loss": -24.42844581604004, "global_step": 184377, "epoch": 2221} {"train_loss": -23.995494842529297, "global_step": 184378, "epoch": 2221} {"train_loss": -23.762176513671875, "global_step": 184379, "epoch": 2221} {"train_loss": -23.682483673095703, "global_step": 184380, "epoch": 2221} {"train_loss": -23.715423583984375, "global_step": 184381, "epoch": 2221} {"train_loss": -24.04681396484375, "global_step": 184382, "epoch": 2221} {"train_loss": -24.110319137573242, "global_step": 184383, "epoch": 2221} {"train_loss": -23.49751091003418, "global_step": 184384, "epoch": 2221} {"train_loss": -24.141489028930664, "global_step": 184385, "epoch": 2221} {"train_loss": -23.9715518951416, "global_step": 184386, "epoch": 2221} {"train_loss": -24.012725830078125, "global_step": 184387, "epoch": 2221} {"train_loss": -24.206552505493164, "global_step": 184388, "epoch": 2221} {"train_loss": -24.10342788696289, "global_step": 184389, "epoch": 2221} {"train_loss": -24.22135353088379, "global_step": 184390, "epoch": 2221} {"train_loss": -23.739004135131836, "global_step": 184391, "epoch": 2221} {"train_loss": -24.098806381225586, "global_step": 184392, "epoch": 2221} {"train_loss": -24.26471710205078, "global_step": 184393, "epoch": 2221} {"train_loss": -24.376306533813477, "global_step": 184394, "epoch": 2221} {"train_loss": -24.132658004760742, "global_step": 184395, "epoch": 2221} {"train_loss": -24.0622615814209, "global_step": 184396, "epoch": 2221} {"train_loss": -23.67283058166504, "global_step": 184397, "epoch": 2221} {"train_loss": -24.222469329833984, "global_step": 184398, "epoch": 2221} {"train_loss": -24.002798080444336, "global_step": 184399, "epoch": 2221} {"train_loss": -24.351224899291992, "global_step": 184400, "epoch": 2221} {"train_loss": -24.30792236328125, "global_step": 184401, "epoch": 2221} {"train_loss": -24.420927047729492, "global_step": 184402, "epoch": 2221} {"train_loss": -24.372116088867188, "global_step": 184403, "epoch": 2221} {"train_loss": -24.548559188842773, "global_step": 184404, "epoch": 2221} {"train_loss": -24.01175308227539, "global_step": 184405, "epoch": 2221} {"train_loss": -24.187671661376953, "global_step": 184406, "epoch": 2221} {"train_loss": -23.732135772705078, "global_step": 184407, "epoch": 2221} {"train_loss": -23.842992782592773, "global_step": 184408, "epoch": 2221} {"train_loss": -24.121173858642578, "global_step": 184409, "epoch": 2221} {"train_loss": -24.341211318969727, "global_step": 184410, "epoch": 2221} {"train_loss": -24.480789184570312, "global_step": 184411, "epoch": 2221} {"train_loss": -23.99570083618164, "global_step": 184412, "epoch": 2221} {"train_loss": -23.575090408325195, "global_step": 184413, "epoch": 2221} {"train_loss": -23.804601669311523, "global_step": 184414, "epoch": 2221} {"train_loss": -23.977216720581055, "global_step": 184415, "epoch": 2221} {"train_loss": -24.138107299804688, "global_step": 184416, "epoch": 2221} {"train_loss": -24.411333084106445, "global_step": 184417, "epoch": 2221} {"train_loss": -24.404634475708008, "global_step": 184418, "epoch": 2221} {"train_loss": -24.046125411987305, "global_step": 184419, "epoch": 2221} {"train_loss": -23.79448699951172, "global_step": 184420, "epoch": 2221} {"train_loss": -24.16652488708496, "global_step": 184421, "epoch": 2221} {"train_loss": -24.07288932800293, "global_step": 184422, "epoch": 2221} {"train_loss": -23.879276275634766, "global_step": 184423, "epoch": 2221} {"train_loss": -23.951496124267578, "global_step": 184424, "epoch": 2221} {"train_loss": -23.986358757478644, "global_step": 184425, "epoch": 2221, "val_loss": 6431879.0} {"train_loss": -23.393665313720703, "global_step": 184426, "epoch": 2222} {"train_loss": -23.555362701416016, "global_step": 184427, "epoch": 2222} {"train_loss": -23.385345458984375, "global_step": 184428, "epoch": 2222} {"train_loss": -22.85236930847168, "global_step": 184429, "epoch": 2222} {"train_loss": -22.898666381835938, "global_step": 184430, "epoch": 2222} {"train_loss": -23.881549835205078, "global_step": 184431, "epoch": 2222} {"train_loss": -23.735334396362305, "global_step": 184432, "epoch": 2222} {"train_loss": -23.231779098510742, "global_step": 184433, "epoch": 2222} {"train_loss": -23.92713737487793, "global_step": 184434, "epoch": 2222} {"train_loss": -23.409231185913086, "global_step": 184435, "epoch": 2222} {"train_loss": -23.539541244506836, "global_step": 184436, "epoch": 2222} {"train_loss": -23.766408920288086, "global_step": 184437, "epoch": 2222} {"train_loss": -23.32978630065918, "global_step": 184438, "epoch": 2222} {"train_loss": -23.3359432220459, "global_step": 184439, "epoch": 2222} {"train_loss": -23.751611709594727, "global_step": 184440, "epoch": 2222} {"train_loss": -23.883865356445312, "global_step": 184441, "epoch": 2222} {"train_loss": -23.665802001953125, "global_step": 184442, "epoch": 2222} {"train_loss": -23.804956436157227, "global_step": 184443, "epoch": 2222} {"train_loss": -24.049245834350586, "global_step": 184444, "epoch": 2222} {"train_loss": -23.710412979125977, "global_step": 184445, "epoch": 2222} {"train_loss": -23.979061126708984, "global_step": 184446, "epoch": 2222} {"train_loss": -23.61847686767578, "global_step": 184447, "epoch": 2222} {"train_loss": -23.807851791381836, "global_step": 184448, "epoch": 2222} {"train_loss": -23.92194938659668, "global_step": 184449, "epoch": 2222} {"train_loss": -23.640302658081055, "global_step": 184450, "epoch": 2222} {"train_loss": -23.85960578918457, "global_step": 184451, "epoch": 2222} {"train_loss": -23.84999656677246, "global_step": 184452, "epoch": 2222} {"train_loss": -24.19148063659668, "global_step": 184453, "epoch": 2222} {"train_loss": -23.95002555847168, "global_step": 184454, "epoch": 2222} {"train_loss": -24.06507682800293, "global_step": 184455, "epoch": 2222} {"train_loss": -24.108417510986328, "global_step": 184456, "epoch": 2222} {"train_loss": -24.268646240234375, "global_step": 184457, "epoch": 2222} {"train_loss": -24.11890983581543, "global_step": 184458, "epoch": 2222} {"train_loss": -23.84864616394043, "global_step": 184459, "epoch": 2222} {"train_loss": -23.992420196533203, "global_step": 184460, "epoch": 2222} {"train_loss": -23.82132911682129, "global_step": 184461, "epoch": 2222} {"train_loss": -24.39222526550293, "global_step": 184462, "epoch": 2222} {"train_loss": -24.114151000976562, "global_step": 184463, "epoch": 2222} {"train_loss": -23.882970809936523, "global_step": 184464, "epoch": 2222} {"train_loss": -23.942907333374023, "global_step": 184465, "epoch": 2222} {"train_loss": -24.3494815826416, "global_step": 184466, "epoch": 2222} {"train_loss": -24.270835876464844, "global_step": 184467, "epoch": 2222} {"train_loss": -24.060720443725586, "global_step": 184468, "epoch": 2222} {"train_loss": -24.06318473815918, "global_step": 184469, "epoch": 2222} {"train_loss": -23.76376724243164, "global_step": 184470, "epoch": 2222} {"train_loss": -24.27571678161621, "global_step": 184471, "epoch": 2222} {"train_loss": -24.019407272338867, "global_step": 184472, "epoch": 2222} {"train_loss": -23.99782371520996, "global_step": 184473, "epoch": 2222} {"train_loss": -24.214597702026367, "global_step": 184474, "epoch": 2222} {"train_loss": -24.2867488861084, "global_step": 184475, "epoch": 2222} {"train_loss": -24.121471405029297, "global_step": 184476, "epoch": 2222} {"train_loss": -24.2740478515625, "global_step": 184477, "epoch": 2222} {"train_loss": -24.253419876098633, "global_step": 184478, "epoch": 2222} {"train_loss": -24.150663375854492, "global_step": 184479, "epoch": 2222} {"train_loss": -24.454975128173828, "global_step": 184480, "epoch": 2222} {"train_loss": -24.56378173828125, "global_step": 184481, "epoch": 2222} {"train_loss": -23.778318405151367, "global_step": 184482, "epoch": 2222} {"train_loss": -24.338895797729492, "global_step": 184483, "epoch": 2222} {"train_loss": -24.073806762695312, "global_step": 184484, "epoch": 2222} {"train_loss": -24.232397079467773, "global_step": 184485, "epoch": 2222} {"train_loss": -24.02570915222168, "global_step": 184486, "epoch": 2222} {"train_loss": -23.841949462890625, "global_step": 184487, "epoch": 2222} {"train_loss": -24.358245849609375, "global_step": 184488, "epoch": 2222} {"train_loss": -23.704172134399414, "global_step": 184489, "epoch": 2222} {"train_loss": -23.65033531188965, "global_step": 184490, "epoch": 2222} {"train_loss": -23.6585636138916, "global_step": 184491, "epoch": 2222} {"train_loss": -24.26084327697754, "global_step": 184492, "epoch": 2222} {"train_loss": -23.93438720703125, "global_step": 184493, "epoch": 2222} {"train_loss": -23.95457649230957, "global_step": 184494, "epoch": 2222} {"train_loss": -23.93136215209961, "global_step": 184495, "epoch": 2222} {"train_loss": -23.92124366760254, "global_step": 184496, "epoch": 2222} {"train_loss": -23.985559463500977, "global_step": 184497, "epoch": 2222} {"train_loss": -24.03030776977539, "global_step": 184498, "epoch": 2222} {"train_loss": -24.191831588745117, "global_step": 184499, "epoch": 2222} {"train_loss": -24.08523178100586, "global_step": 184500, "epoch": 2222} {"train_loss": -23.836515426635742, "global_step": 184501, "epoch": 2222} {"train_loss": -24.115055084228516, "global_step": 184502, "epoch": 2222} {"train_loss": -23.813405990600586, "global_step": 184503, "epoch": 2222} {"train_loss": -23.951732635498047, "global_step": 184504, "epoch": 2222} {"train_loss": -24.093189239501953, "global_step": 184505, "epoch": 2222} {"train_loss": -23.90199851989746, "global_step": 184506, "epoch": 2222} {"train_loss": -24.135345458984375, "global_step": 184507, "epoch": 2222} {"train_loss": -23.903401110545698, "global_step": 184508, "epoch": 2222, "val_loss": 6506810.5} {"train_loss": -23.18576431274414, "global_step": 184509, "epoch": 2223} {"train_loss": -23.52429962158203, "global_step": 184510, "epoch": 2223} {"train_loss": -23.727283477783203, "global_step": 184511, "epoch": 2223} {"train_loss": -23.49971580505371, "global_step": 184512, "epoch": 2223} {"train_loss": -23.35481071472168, "global_step": 184513, "epoch": 2223} {"train_loss": -23.400938034057617, "global_step": 184514, "epoch": 2223} {"train_loss": -23.888898849487305, "global_step": 184515, "epoch": 2223} {"train_loss": -23.449085235595703, "global_step": 184516, "epoch": 2223} {"train_loss": -23.82508659362793, "global_step": 184517, "epoch": 2223} {"train_loss": -23.719343185424805, "global_step": 184518, "epoch": 2223} {"train_loss": -23.88534927368164, "global_step": 184519, "epoch": 2223} {"train_loss": -23.43413734436035, "global_step": 184520, "epoch": 2223} {"train_loss": -23.988971710205078, "global_step": 184521, "epoch": 2223} {"train_loss": -23.77423858642578, "global_step": 184522, "epoch": 2223} {"train_loss": -23.519542694091797, "global_step": 184523, "epoch": 2223} {"train_loss": -23.85198402404785, "global_step": 184524, "epoch": 2223} {"train_loss": -23.590904235839844, "global_step": 184525, "epoch": 2223} {"train_loss": -24.123987197875977, "global_step": 184526, "epoch": 2223} {"train_loss": -24.045175552368164, "global_step": 184527, "epoch": 2223} {"train_loss": -24.15035057067871, "global_step": 184528, "epoch": 2223} {"train_loss": -24.016681671142578, "global_step": 184529, "epoch": 2223} {"train_loss": -24.02363395690918, "global_step": 184530, "epoch": 2223} {"train_loss": -24.007305145263672, "global_step": 184531, "epoch": 2223} {"train_loss": -23.624120712280273, "global_step": 184532, "epoch": 2223} {"train_loss": -23.98284912109375, "global_step": 184533, "epoch": 2223} {"train_loss": -23.79342269897461, "global_step": 184534, "epoch": 2223} {"train_loss": -23.942514419555664, "global_step": 184535, "epoch": 2223} {"train_loss": -24.336090087890625, "global_step": 184536, "epoch": 2223} {"train_loss": -24.132204055786133, "global_step": 184537, "epoch": 2223} {"train_loss": -24.11688804626465, "global_step": 184538, "epoch": 2223} {"train_loss": -24.303434371948242, "global_step": 184539, "epoch": 2223} {"train_loss": -24.086332321166992, "global_step": 184540, "epoch": 2223} {"train_loss": -24.147092819213867, "global_step": 184541, "epoch": 2223} {"train_loss": -24.021270751953125, "global_step": 184542, "epoch": 2223} {"train_loss": -24.186086654663086, "global_step": 184543, "epoch": 2223} {"train_loss": -24.155569076538086, "global_step": 184544, "epoch": 2223} {"train_loss": -24.127567291259766, "global_step": 184545, "epoch": 2223} {"train_loss": -24.201231002807617, "global_step": 184546, "epoch": 2223} {"train_loss": -23.926603317260742, "global_step": 184547, "epoch": 2223} {"train_loss": -24.027196884155273, "global_step": 184548, "epoch": 2223} {"train_loss": -24.325414657592773, "global_step": 184549, "epoch": 2223} {"train_loss": -24.236059188842773, "global_step": 184550, "epoch": 2223} {"train_loss": -24.128664016723633, "global_step": 184551, "epoch": 2223} {"train_loss": -23.9434814453125, "global_step": 184552, "epoch": 2223} {"train_loss": -24.556631088256836, "global_step": 184553, "epoch": 2223} {"train_loss": -24.173795700073242, "global_step": 184554, "epoch": 2223} {"train_loss": -24.007749557495117, "global_step": 184555, "epoch": 2223} {"train_loss": -23.848718643188477, "global_step": 184556, "epoch": 2223} {"train_loss": -23.823413848876953, "global_step": 184557, "epoch": 2223} {"train_loss": -23.884857177734375, "global_step": 184558, "epoch": 2223} {"train_loss": -22.90456199645996, "global_step": 184559, "epoch": 2223} {"train_loss": -22.323387145996094, "global_step": 184560, "epoch": 2223} {"train_loss": -22.880956649780273, "global_step": 184561, "epoch": 2223} {"train_loss": -23.839406967163086, "global_step": 184562, "epoch": 2223} {"train_loss": -23.95937156677246, "global_step": 184563, "epoch": 2223} {"train_loss": -23.12798500061035, "global_step": 184564, "epoch": 2223} {"train_loss": -23.760765075683594, "global_step": 184565, "epoch": 2223} {"train_loss": -23.567035675048828, "global_step": 184566, "epoch": 2223} {"train_loss": -23.76152992248535, "global_step": 184567, "epoch": 2223} {"train_loss": -23.43316650390625, "global_step": 184568, "epoch": 2223} {"train_loss": -23.761871337890625, "global_step": 184569, "epoch": 2223} {"train_loss": -23.705167770385742, "global_step": 184570, "epoch": 2223} {"train_loss": -23.882795333862305, "global_step": 184571, "epoch": 2223} {"train_loss": -23.838932037353516, "global_step": 184572, "epoch": 2223} {"train_loss": -23.74457359313965, "global_step": 184573, "epoch": 2223} {"train_loss": -23.96393394470215, "global_step": 184574, "epoch": 2223} {"train_loss": -23.80854606628418, "global_step": 184575, "epoch": 2223} {"train_loss": -23.93105125427246, "global_step": 184576, "epoch": 2223} {"train_loss": -23.56968116760254, "global_step": 184577, "epoch": 2223} {"train_loss": -23.986419677734375, "global_step": 184578, "epoch": 2223} {"train_loss": -23.870798110961914, "global_step": 184579, "epoch": 2223} {"train_loss": -23.778799057006836, "global_step": 184580, "epoch": 2223} {"train_loss": -23.656015396118164, "global_step": 184581, "epoch": 2223} {"train_loss": -24.047996520996094, "global_step": 184582, "epoch": 2223} {"train_loss": -23.902053833007812, "global_step": 184583, "epoch": 2223} {"train_loss": -23.602832794189453, "global_step": 184584, "epoch": 2223} {"train_loss": -24.091135025024414, "global_step": 184585, "epoch": 2223} {"train_loss": -23.893848419189453, "global_step": 184586, "epoch": 2223} {"train_loss": -23.795740127563477, "global_step": 184587, "epoch": 2223} {"train_loss": -24.057601928710938, "global_step": 184588, "epoch": 2223} {"train_loss": -24.15717887878418, "global_step": 184589, "epoch": 2223} {"train_loss": -24.436851501464844, "global_step": 184590, "epoch": 2223} {"train_loss": -23.83823601596327, "global_step": 184591, "epoch": 2223, "val_loss": 6415333.0} {"train_loss": -23.71786117553711, "global_step": 184592, "epoch": 2224} {"train_loss": -23.66684341430664, "global_step": 184593, "epoch": 2224} {"train_loss": -23.45868492126465, "global_step": 184594, "epoch": 2224} {"train_loss": -23.772916793823242, "global_step": 184595, "epoch": 2224} {"train_loss": -24.024829864501953, "global_step": 184596, "epoch": 2224} {"train_loss": -23.873971939086914, "global_step": 184597, "epoch": 2224} {"train_loss": -24.11298370361328, "global_step": 184598, "epoch": 2224} {"train_loss": -23.964611053466797, "global_step": 184599, "epoch": 2224} {"train_loss": -23.885271072387695, "global_step": 184600, "epoch": 2224} {"train_loss": -24.065122604370117, "global_step": 184601, "epoch": 2224} {"train_loss": -23.6667537689209, "global_step": 184602, "epoch": 2224} {"train_loss": -23.848859786987305, "global_step": 184603, "epoch": 2224} {"train_loss": -24.002222061157227, "global_step": 184604, "epoch": 2224} {"train_loss": -23.774621963500977, "global_step": 184605, "epoch": 2224} {"train_loss": -24.096729278564453, "global_step": 184606, "epoch": 2224} {"train_loss": -24.04102897644043, "global_step": 184607, "epoch": 2224} {"train_loss": -23.877511978149414, "global_step": 184608, "epoch": 2224} {"train_loss": -23.96360206604004, "global_step": 184609, "epoch": 2224} {"train_loss": -23.634428024291992, "global_step": 184610, "epoch": 2224} {"train_loss": -23.95099639892578, "global_step": 184611, "epoch": 2224} {"train_loss": -23.931446075439453, "global_step": 184612, "epoch": 2224} {"train_loss": -23.654251098632812, "global_step": 184613, "epoch": 2224} {"train_loss": -23.88544273376465, "global_step": 184614, "epoch": 2224} {"train_loss": -23.710920333862305, "global_step": 184615, "epoch": 2224} {"train_loss": -23.669973373413086, "global_step": 184616, "epoch": 2224} {"train_loss": -24.500690460205078, "global_step": 184617, "epoch": 2224} {"train_loss": -23.82450294494629, "global_step": 184618, "epoch": 2224} {"train_loss": -24.04815673828125, "global_step": 184619, "epoch": 2224} {"train_loss": -24.103618621826172, "global_step": 184620, "epoch": 2224} {"train_loss": -24.185653686523438, "global_step": 184621, "epoch": 2224} {"train_loss": -24.384096145629883, "global_step": 184622, "epoch": 2224} {"train_loss": -23.8421573638916, "global_step": 184623, "epoch": 2224} {"train_loss": -24.21644401550293, "global_step": 184624, "epoch": 2224} {"train_loss": -24.131423950195312, "global_step": 184625, "epoch": 2224} {"train_loss": -23.83346176147461, "global_step": 184626, "epoch": 2224} {"train_loss": -24.16015625, "global_step": 184627, "epoch": 2224} {"train_loss": -24.187211990356445, "global_step": 184628, "epoch": 2224} {"train_loss": -23.698532104492188, "global_step": 184629, "epoch": 2224} {"train_loss": -24.0234375, "global_step": 184630, "epoch": 2224} {"train_loss": -24.204565048217773, "global_step": 184631, "epoch": 2224} {"train_loss": -24.20735740661621, "global_step": 184632, "epoch": 2224} {"train_loss": -23.888816833496094, "global_step": 184633, "epoch": 2224} {"train_loss": -24.413755416870117, "global_step": 184634, "epoch": 2224} {"train_loss": -24.12529945373535, "global_step": 184635, "epoch": 2224} {"train_loss": -23.893753051757812, "global_step": 184636, "epoch": 2224} {"train_loss": -23.763198852539062, "global_step": 184637, "epoch": 2224} {"train_loss": -24.037921905517578, "global_step": 184638, "epoch": 2224} {"train_loss": -24.184598922729492, "global_step": 184639, "epoch": 2224} {"train_loss": -23.705005645751953, "global_step": 184640, "epoch": 2224} {"train_loss": -23.86093521118164, "global_step": 184641, "epoch": 2224} {"train_loss": -24.274869918823242, "global_step": 184642, "epoch": 2224} {"train_loss": -23.907194137573242, "global_step": 184643, "epoch": 2224} {"train_loss": -23.81876564025879, "global_step": 184644, "epoch": 2224} {"train_loss": -24.1003360748291, "global_step": 184645, "epoch": 2224} {"train_loss": -23.80044937133789, "global_step": 184646, "epoch": 2224} {"train_loss": -24.274961471557617, "global_step": 184647, "epoch": 2224} {"train_loss": -24.1099910736084, "global_step": 184648, "epoch": 2224} {"train_loss": -24.156156539916992, "global_step": 184649, "epoch": 2224} {"train_loss": -24.098648071289062, "global_step": 184650, "epoch": 2224} {"train_loss": -23.904508590698242, "global_step": 184651, "epoch": 2224} {"train_loss": -23.905845642089844, "global_step": 184652, "epoch": 2224} {"train_loss": -23.638111114501953, "global_step": 184653, "epoch": 2224} {"train_loss": -24.166105270385742, "global_step": 184654, "epoch": 2224} {"train_loss": -23.89776611328125, "global_step": 184655, "epoch": 2224} {"train_loss": -23.79740333557129, "global_step": 184656, "epoch": 2224} {"train_loss": -23.952682495117188, "global_step": 184657, "epoch": 2224} {"train_loss": -24.190763473510742, "global_step": 184658, "epoch": 2224} {"train_loss": -24.125991821289062, "global_step": 184659, "epoch": 2224} {"train_loss": -23.737829208374023, "global_step": 184660, "epoch": 2224} {"train_loss": -23.73639488220215, "global_step": 184661, "epoch": 2224} {"train_loss": -23.603857040405273, "global_step": 184662, "epoch": 2224} {"train_loss": -23.852371215820312, "global_step": 184663, "epoch": 2224} {"train_loss": -23.925565719604492, "global_step": 184664, "epoch": 2224} {"train_loss": -23.669729232788086, "global_step": 184665, "epoch": 2224} {"train_loss": -23.74539566040039, "global_step": 184666, "epoch": 2224} {"train_loss": -23.79789161682129, "global_step": 184667, "epoch": 2224} {"train_loss": -23.909610748291016, "global_step": 184668, "epoch": 2224} {"train_loss": -23.652217864990234, "global_step": 184669, "epoch": 2224} {"train_loss": -24.19215965270996, "global_step": 184670, "epoch": 2224} {"train_loss": -24.13873863220215, "global_step": 184671, "epoch": 2224} {"train_loss": -23.972787857055664, "global_step": 184672, "epoch": 2224} {"train_loss": -24.011510848999023, "global_step": 184673, "epoch": 2224} {"train_loss": -23.953084623957256, "global_step": 184674, "epoch": 2224, "val_loss": 6597304.0} {"train_loss": -22.896947860717773, "global_step": 184675, "epoch": 2225} {"train_loss": -22.587032318115234, "global_step": 184676, "epoch": 2225} {"train_loss": -23.23386001586914, "global_step": 184677, "epoch": 2225} {"train_loss": -23.177881240844727, "global_step": 184678, "epoch": 2225} {"train_loss": -23.236448287963867, "global_step": 184679, "epoch": 2225} {"train_loss": -23.19159507751465, "global_step": 184680, "epoch": 2225} {"train_loss": -23.183135986328125, "global_step": 184681, "epoch": 2225} {"train_loss": -23.412996292114258, "global_step": 184682, "epoch": 2225} {"train_loss": -23.51323890686035, "global_step": 184683, "epoch": 2225} {"train_loss": -23.31479835510254, "global_step": 184684, "epoch": 2225} {"train_loss": -23.37552261352539, "global_step": 184685, "epoch": 2225} {"train_loss": -23.23602867126465, "global_step": 184686, "epoch": 2225} {"train_loss": -23.344236373901367, "global_step": 184687, "epoch": 2225} {"train_loss": -23.297260284423828, "global_step": 184688, "epoch": 2225} {"train_loss": -23.538524627685547, "global_step": 184689, "epoch": 2225} {"train_loss": -23.559865951538086, "global_step": 184690, "epoch": 2225} {"train_loss": -24.22963523864746, "global_step": 184691, "epoch": 2225} {"train_loss": -23.59760856628418, "global_step": 184692, "epoch": 2225} {"train_loss": -23.553762435913086, "global_step": 184693, "epoch": 2225} {"train_loss": -24.136079788208008, "global_step": 184694, "epoch": 2225} {"train_loss": -23.642751693725586, "global_step": 184695, "epoch": 2225} {"train_loss": -23.86990737915039, "global_step": 184696, "epoch": 2225} {"train_loss": -23.678817749023438, "global_step": 184697, "epoch": 2225} {"train_loss": -24.192289352416992, "global_step": 184698, "epoch": 2225} {"train_loss": -24.065465927124023, "global_step": 184699, "epoch": 2225} {"train_loss": -23.706151962280273, "global_step": 184700, "epoch": 2225} {"train_loss": -23.88936996459961, "global_step": 184701, "epoch": 2225} {"train_loss": -23.608951568603516, "global_step": 184702, "epoch": 2225} {"train_loss": -23.83907127380371, "global_step": 184703, "epoch": 2225} {"train_loss": -23.95332145690918, "global_step": 184704, "epoch": 2225} {"train_loss": -24.166982650756836, "global_step": 184705, "epoch": 2225} {"train_loss": -23.941091537475586, "global_step": 184706, "epoch": 2225} {"train_loss": -24.19050407409668, "global_step": 184707, "epoch": 2225} {"train_loss": -23.759119033813477, "global_step": 184708, "epoch": 2225} {"train_loss": -23.74445152282715, "global_step": 184709, "epoch": 2225} {"train_loss": -23.699880599975586, "global_step": 184710, "epoch": 2225} {"train_loss": -24.03677749633789, "global_step": 184711, "epoch": 2225} {"train_loss": -23.535785675048828, "global_step": 184712, "epoch": 2225} {"train_loss": -24.137903213500977, "global_step": 184713, "epoch": 2225} {"train_loss": -24.087474822998047, "global_step": 184714, "epoch": 2225} {"train_loss": -24.242584228515625, "global_step": 184715, "epoch": 2225} {"train_loss": -23.826396942138672, "global_step": 184716, "epoch": 2225} {"train_loss": -24.089948654174805, "global_step": 184717, "epoch": 2225} {"train_loss": -24.478328704833984, "global_step": 184718, "epoch": 2225} {"train_loss": -24.559127807617188, "global_step": 184719, "epoch": 2225} {"train_loss": -23.921072006225586, "global_step": 184720, "epoch": 2225} {"train_loss": -24.166990280151367, "global_step": 184721, "epoch": 2225} {"train_loss": -23.901540756225586, "global_step": 184722, "epoch": 2225} {"train_loss": -24.08057975769043, "global_step": 184723, "epoch": 2225} {"train_loss": -23.858060836791992, "global_step": 184724, "epoch": 2225} {"train_loss": -23.914241790771484, "global_step": 184725, "epoch": 2225} {"train_loss": -23.857324600219727, "global_step": 184726, "epoch": 2225} {"train_loss": -24.066394805908203, "global_step": 184727, "epoch": 2225} {"train_loss": -23.598987579345703, "global_step": 184728, "epoch": 2225} {"train_loss": -24.2589111328125, "global_step": 184729, "epoch": 2225} {"train_loss": -23.884653091430664, "global_step": 184730, "epoch": 2225} {"train_loss": -24.079259872436523, "global_step": 184731, "epoch": 2225} {"train_loss": -23.882465362548828, "global_step": 184732, "epoch": 2225} {"train_loss": -24.265380859375, "global_step": 184733, "epoch": 2225} {"train_loss": -23.897443771362305, "global_step": 184734, "epoch": 2225} {"train_loss": -24.291662216186523, "global_step": 184735, "epoch": 2225} {"train_loss": -24.41196060180664, "global_step": 184736, "epoch": 2225} {"train_loss": -24.141759872436523, "global_step": 184737, "epoch": 2225} {"train_loss": -23.85385513305664, "global_step": 184738, "epoch": 2225} {"train_loss": -24.06271743774414, "global_step": 184739, "epoch": 2225} {"train_loss": -23.85450553894043, "global_step": 184740, "epoch": 2225} {"train_loss": -24.490827560424805, "global_step": 184741, "epoch": 2225} {"train_loss": -24.292442321777344, "global_step": 184742, "epoch": 2225} {"train_loss": -23.8513126373291, "global_step": 184743, "epoch": 2225} {"train_loss": -23.955673217773438, "global_step": 184744, "epoch": 2225} {"train_loss": -24.033552169799805, "global_step": 184745, "epoch": 2225} {"train_loss": -23.75393295288086, "global_step": 184746, "epoch": 2225} {"train_loss": -23.805936813354492, "global_step": 184747, "epoch": 2225} {"train_loss": -24.237272262573242, "global_step": 184748, "epoch": 2225} {"train_loss": -24.15382194519043, "global_step": 184749, "epoch": 2225} {"train_loss": -23.85243034362793, "global_step": 184750, "epoch": 2225} {"train_loss": -23.843286514282227, "global_step": 184751, "epoch": 2225} {"train_loss": -24.37439727783203, "global_step": 184752, "epoch": 2225} {"train_loss": -23.984012603759766, "global_step": 184753, "epoch": 2225} {"train_loss": -23.987417221069336, "global_step": 184754, "epoch": 2225} {"train_loss": -24.08145523071289, "global_step": 184755, "epoch": 2225} {"train_loss": -24.12491226196289, "global_step": 184756, "epoch": 2225} {"train_loss": -23.862200495708418, "global_step": 184757, "epoch": 2225, "val_loss": 6503320.0} {"train_loss": -23.655237197875977, "global_step": 184758, "epoch": 2226} {"train_loss": -23.743494033813477, "global_step": 184759, "epoch": 2226} {"train_loss": -23.89271354675293, "global_step": 184760, "epoch": 2226} {"train_loss": -23.7304744720459, "global_step": 184761, "epoch": 2226} {"train_loss": -23.631101608276367, "global_step": 184762, "epoch": 2226} {"train_loss": -23.568204879760742, "global_step": 184763, "epoch": 2226} {"train_loss": -23.93106460571289, "global_step": 184764, "epoch": 2226} {"train_loss": -23.62034797668457, "global_step": 184765, "epoch": 2226} {"train_loss": -23.78432273864746, "global_step": 184766, "epoch": 2226} {"train_loss": -24.08209991455078, "global_step": 184767, "epoch": 2226} {"train_loss": -23.509336471557617, "global_step": 184768, "epoch": 2226} {"train_loss": -23.58932876586914, "global_step": 184769, "epoch": 2226} {"train_loss": -24.157150268554688, "global_step": 184770, "epoch": 2226} {"train_loss": -24.36591148376465, "global_step": 184771, "epoch": 2226} {"train_loss": -23.591903686523438, "global_step": 184772, "epoch": 2226} {"train_loss": -24.127269744873047, "global_step": 184773, "epoch": 2226} {"train_loss": -23.721527099609375, "global_step": 184774, "epoch": 2226} {"train_loss": -24.057315826416016, "global_step": 184775, "epoch": 2226} {"train_loss": -23.992393493652344, "global_step": 184776, "epoch": 2226} {"train_loss": -24.05501365661621, "global_step": 184777, "epoch": 2226} {"train_loss": -23.700634002685547, "global_step": 184778, "epoch": 2226} {"train_loss": -24.113080978393555, "global_step": 184779, "epoch": 2226} {"train_loss": -23.6074161529541, "global_step": 184780, "epoch": 2226} {"train_loss": -24.266016006469727, "global_step": 184781, "epoch": 2226} {"train_loss": -23.737611770629883, "global_step": 184782, "epoch": 2226} {"train_loss": -23.848981857299805, "global_step": 184783, "epoch": 2226} {"train_loss": -24.06328010559082, "global_step": 184784, "epoch": 2226} {"train_loss": -24.21272087097168, "global_step": 184785, "epoch": 2226} {"train_loss": -24.114456176757812, "global_step": 184786, "epoch": 2226} {"train_loss": -23.861772537231445, "global_step": 184787, "epoch": 2226} {"train_loss": -24.395217895507812, "global_step": 184788, "epoch": 2226} {"train_loss": -24.251516342163086, "global_step": 184789, "epoch": 2226} {"train_loss": -24.171070098876953, "global_step": 184790, "epoch": 2226} {"train_loss": -23.91456413269043, "global_step": 184791, "epoch": 2226} {"train_loss": -24.472776412963867, "global_step": 184792, "epoch": 2226} {"train_loss": -24.248987197875977, "global_step": 184793, "epoch": 2226} {"train_loss": -23.84664535522461, "global_step": 184794, "epoch": 2226} {"train_loss": -23.972309112548828, "global_step": 184795, "epoch": 2226} {"train_loss": -23.80219078063965, "global_step": 184796, "epoch": 2226} {"train_loss": -23.735950469970703, "global_step": 184797, "epoch": 2226} {"train_loss": -24.09690284729004, "global_step": 184798, "epoch": 2226} {"train_loss": -24.05362319946289, "global_step": 184799, "epoch": 2226} {"train_loss": -23.876562118530273, "global_step": 184800, "epoch": 2226} {"train_loss": -23.688888549804688, "global_step": 184801, "epoch": 2226} {"train_loss": -23.96786880493164, "global_step": 184802, "epoch": 2226} {"train_loss": -23.98903465270996, "global_step": 184803, "epoch": 2226} {"train_loss": -23.865764617919922, "global_step": 184804, "epoch": 2226} {"train_loss": -24.198734283447266, "global_step": 184805, "epoch": 2226} {"train_loss": -24.327198028564453, "global_step": 184806, "epoch": 2226} {"train_loss": -23.501012802124023, "global_step": 184807, "epoch": 2226} {"train_loss": -23.951990127563477, "global_step": 184808, "epoch": 2226} {"train_loss": -24.12526512145996, "global_step": 184809, "epoch": 2226} {"train_loss": -24.18440818786621, "global_step": 184810, "epoch": 2226} {"train_loss": -23.954654693603516, "global_step": 184811, "epoch": 2226} {"train_loss": -24.159727096557617, "global_step": 184812, "epoch": 2226} {"train_loss": -24.18817710876465, "global_step": 184813, "epoch": 2226} {"train_loss": -23.86066246032715, "global_step": 184814, "epoch": 2226} {"train_loss": -24.11008644104004, "global_step": 184815, "epoch": 2226} {"train_loss": -24.099828720092773, "global_step": 184816, "epoch": 2226} {"train_loss": -23.971588134765625, "global_step": 184817, "epoch": 2226} {"train_loss": -24.267194747924805, "global_step": 184818, "epoch": 2226} {"train_loss": -23.9301700592041, "global_step": 184819, "epoch": 2226} {"train_loss": -23.82674789428711, "global_step": 184820, "epoch": 2226} {"train_loss": -24.317651748657227, "global_step": 184821, "epoch": 2226} {"train_loss": -24.142776489257812, "global_step": 184822, "epoch": 2226} {"train_loss": -24.150413513183594, "global_step": 184823, "epoch": 2226} {"train_loss": -24.015527725219727, "global_step": 184824, "epoch": 2226} {"train_loss": -24.399185180664062, "global_step": 184825, "epoch": 2226} {"train_loss": -23.98898696899414, "global_step": 184826, "epoch": 2226} {"train_loss": -24.169328689575195, "global_step": 184827, "epoch": 2226} {"train_loss": -24.192346572875977, "global_step": 184828, "epoch": 2226} {"train_loss": -24.121274948120117, "global_step": 184829, "epoch": 2226} {"train_loss": -23.756399154663086, "global_step": 184830, "epoch": 2226} {"train_loss": -23.931171417236328, "global_step": 184831, "epoch": 2226} {"train_loss": -24.073965072631836, "global_step": 184832, "epoch": 2226} {"train_loss": -24.290109634399414, "global_step": 184833, "epoch": 2226} {"train_loss": -23.95563316345215, "global_step": 184834, "epoch": 2226} {"train_loss": -23.35218620300293, "global_step": 184835, "epoch": 2226} {"train_loss": -23.688873291015625, "global_step": 184836, "epoch": 2226} {"train_loss": -24.034391403198242, "global_step": 184837, "epoch": 2226} {"train_loss": -23.869768142700195, "global_step": 184838, "epoch": 2226} {"train_loss": -24.026399612426758, "global_step": 184839, "epoch": 2226} {"train_loss": -23.9780892291701, "global_step": 184840, "epoch": 2226, "val_loss": 6449443.0} {"train_loss": -23.443540573120117, "global_step": 184841, "epoch": 2227} {"train_loss": -23.85064697265625, "global_step": 184842, "epoch": 2227} {"train_loss": -23.174724578857422, "global_step": 184843, "epoch": 2227} {"train_loss": -23.639841079711914, "global_step": 184844, "epoch": 2227} {"train_loss": -23.404922485351562, "global_step": 184845, "epoch": 2227} {"train_loss": -23.636322021484375, "global_step": 184846, "epoch": 2227} {"train_loss": -23.69488525390625, "global_step": 184847, "epoch": 2227} {"train_loss": -23.45631217956543, "global_step": 184848, "epoch": 2227} {"train_loss": -23.8343448638916, "global_step": 184849, "epoch": 2227} {"train_loss": -23.73250389099121, "global_step": 184850, "epoch": 2227} {"train_loss": -23.68484878540039, "global_step": 184851, "epoch": 2227} {"train_loss": -23.699081420898438, "global_step": 184852, "epoch": 2227} {"train_loss": -23.459476470947266, "global_step": 184853, "epoch": 2227} {"train_loss": -23.901004791259766, "global_step": 184854, "epoch": 2227} {"train_loss": -23.44074821472168, "global_step": 184855, "epoch": 2227} {"train_loss": -23.54044532775879, "global_step": 184856, "epoch": 2227} {"train_loss": -23.655019760131836, "global_step": 184857, "epoch": 2227} {"train_loss": -23.62425422668457, "global_step": 184858, "epoch": 2227} {"train_loss": -23.733915328979492, "global_step": 184859, "epoch": 2227} {"train_loss": -23.647932052612305, "global_step": 184860, "epoch": 2227} {"train_loss": -23.410844802856445, "global_step": 184861, "epoch": 2227} {"train_loss": -24.169950485229492, "global_step": 184862, "epoch": 2227} {"train_loss": -23.96026611328125, "global_step": 184863, "epoch": 2227} {"train_loss": -24.423654556274414, "global_step": 184864, "epoch": 2227} {"train_loss": -23.689899444580078, "global_step": 184865, "epoch": 2227} {"train_loss": -24.18926429748535, "global_step": 184866, "epoch": 2227} {"train_loss": -23.958539962768555, "global_step": 184867, "epoch": 2227} {"train_loss": -23.81707000732422, "global_step": 184868, "epoch": 2227} {"train_loss": -23.847148895263672, "global_step": 184869, "epoch": 2227} {"train_loss": -23.949735641479492, "global_step": 184870, "epoch": 2227} {"train_loss": -23.942262649536133, "global_step": 184871, "epoch": 2227} {"train_loss": -23.98473358154297, "global_step": 184872, "epoch": 2227} {"train_loss": -24.282197952270508, "global_step": 184873, "epoch": 2227} {"train_loss": -24.2804012298584, "global_step": 184874, "epoch": 2227} {"train_loss": -24.330101013183594, "global_step": 184875, "epoch": 2227} {"train_loss": -24.099082946777344, "global_step": 184876, "epoch": 2227} {"train_loss": -24.437732696533203, "global_step": 184877, "epoch": 2227} {"train_loss": -24.378177642822266, "global_step": 184878, "epoch": 2227} {"train_loss": -24.0795955657959, "global_step": 184879, "epoch": 2227} {"train_loss": -24.185211181640625, "global_step": 184880, "epoch": 2227} {"train_loss": -24.350473403930664, "global_step": 184881, "epoch": 2227} {"train_loss": -24.293487548828125, "global_step": 184882, "epoch": 2227} {"train_loss": -24.19413948059082, "global_step": 184883, "epoch": 2227} {"train_loss": -24.063724517822266, "global_step": 184884, "epoch": 2227} {"train_loss": -24.009336471557617, "global_step": 184885, "epoch": 2227} {"train_loss": -24.210813522338867, "global_step": 184886, "epoch": 2227} {"train_loss": -24.23702049255371, "global_step": 184887, "epoch": 2227} {"train_loss": -24.090057373046875, "global_step": 184888, "epoch": 2227} {"train_loss": -23.8361873626709, "global_step": 184889, "epoch": 2227} {"train_loss": -23.816028594970703, "global_step": 184890, "epoch": 2227} {"train_loss": -23.584333419799805, "global_step": 184891, "epoch": 2227} {"train_loss": -23.51271629333496, "global_step": 184892, "epoch": 2227} {"train_loss": -23.10127830505371, "global_step": 184893, "epoch": 2227} {"train_loss": -22.878726959228516, "global_step": 184894, "epoch": 2227} {"train_loss": -23.78579330444336, "global_step": 184895, "epoch": 2227} {"train_loss": -23.959400177001953, "global_step": 184896, "epoch": 2227} {"train_loss": -23.612308502197266, "global_step": 184897, "epoch": 2227} {"train_loss": -23.753633499145508, "global_step": 184898, "epoch": 2227} {"train_loss": -23.3353214263916, "global_step": 184899, "epoch": 2227} {"train_loss": -23.751300811767578, "global_step": 184900, "epoch": 2227} {"train_loss": -24.317092895507812, "global_step": 184901, "epoch": 2227} {"train_loss": -23.55002784729004, "global_step": 184902, "epoch": 2227} {"train_loss": -24.083173751831055, "global_step": 184903, "epoch": 2227} {"train_loss": -23.413236618041992, "global_step": 184904, "epoch": 2227} {"train_loss": -23.52431297302246, "global_step": 184905, "epoch": 2227} {"train_loss": -23.845203399658203, "global_step": 184906, "epoch": 2227} {"train_loss": -23.821672439575195, "global_step": 184907, "epoch": 2227} {"train_loss": -23.793636322021484, "global_step": 184908, "epoch": 2227} {"train_loss": -23.813217163085938, "global_step": 184909, "epoch": 2227} {"train_loss": -23.884319305419922, "global_step": 184910, "epoch": 2227} {"train_loss": -24.076644897460938, "global_step": 184911, "epoch": 2227} {"train_loss": -23.631479263305664, "global_step": 184912, "epoch": 2227} {"train_loss": -23.6828670501709, "global_step": 184913, "epoch": 2227} {"train_loss": -24.07606315612793, "global_step": 184914, "epoch": 2227} {"train_loss": -23.718551635742188, "global_step": 184915, "epoch": 2227} {"train_loss": -23.837961196899414, "global_step": 184916, "epoch": 2227} {"train_loss": -23.751081466674805, "global_step": 184917, "epoch": 2227} {"train_loss": -23.683786392211914, "global_step": 184918, "epoch": 2227} {"train_loss": -23.767004013061523, "global_step": 184919, "epoch": 2227} {"train_loss": -23.742616653442383, "global_step": 184920, "epoch": 2227} {"train_loss": -23.91263198852539, "global_step": 184921, "epoch": 2227} {"train_loss": -24.131916046142578, "global_step": 184922, "epoch": 2227} {"train_loss": -23.822691997849798, "global_step": 184923, "epoch": 2227, "val_loss": 6451059.0} {"train_loss": -24.13994598388672, "global_step": 184924, "epoch": 2228} {"train_loss": -23.801544189453125, "global_step": 184925, "epoch": 2228} {"train_loss": -23.734851837158203, "global_step": 184926, "epoch": 2228} {"train_loss": -23.81755256652832, "global_step": 184927, "epoch": 2228} {"train_loss": -23.7740478515625, "global_step": 184928, "epoch": 2228} {"train_loss": -23.66904067993164, "global_step": 184929, "epoch": 2228} {"train_loss": -23.87000846862793, "global_step": 184930, "epoch": 2228} {"train_loss": -24.033649444580078, "global_step": 184931, "epoch": 2228} {"train_loss": -24.01692771911621, "global_step": 184932, "epoch": 2228} {"train_loss": -23.746051788330078, "global_step": 184933, "epoch": 2228} {"train_loss": -23.710174560546875, "global_step": 184934, "epoch": 2228} {"train_loss": -23.75388526916504, "global_step": 184935, "epoch": 2228} {"train_loss": -23.688426971435547, "global_step": 184936, "epoch": 2228} {"train_loss": -23.549936294555664, "global_step": 184937, "epoch": 2228} {"train_loss": -23.678659439086914, "global_step": 184938, "epoch": 2228} {"train_loss": -24.2069034576416, "global_step": 184939, "epoch": 2228} {"train_loss": -23.945356369018555, "global_step": 184940, "epoch": 2228} {"train_loss": -23.989469528198242, "global_step": 184941, "epoch": 2228} {"train_loss": -24.014175415039062, "global_step": 184942, "epoch": 2228} {"train_loss": -24.117313385009766, "global_step": 184943, "epoch": 2228} {"train_loss": -23.632570266723633, "global_step": 184944, "epoch": 2228} {"train_loss": -24.163984298706055, "global_step": 184945, "epoch": 2228} {"train_loss": -23.959049224853516, "global_step": 184946, "epoch": 2228} {"train_loss": -23.999591827392578, "global_step": 184947, "epoch": 2228} {"train_loss": -23.862768173217773, "global_step": 184948, "epoch": 2228} {"train_loss": -23.998523712158203, "global_step": 184949, "epoch": 2228} {"train_loss": -24.019039154052734, "global_step": 184950, "epoch": 2228} {"train_loss": -23.789093017578125, "global_step": 184951, "epoch": 2228} {"train_loss": -24.459726333618164, "global_step": 184952, "epoch": 2228} {"train_loss": -23.8902645111084, "global_step": 184953, "epoch": 2228} {"train_loss": -24.134546279907227, "global_step": 184954, "epoch": 2228} {"train_loss": -24.21638298034668, "global_step": 184955, "epoch": 2228} {"train_loss": -24.000890731811523, "global_step": 184956, "epoch": 2228} {"train_loss": -24.28958511352539, "global_step": 184957, "epoch": 2228} {"train_loss": -24.334415435791016, "global_step": 184958, "epoch": 2228} {"train_loss": -23.738157272338867, "global_step": 184959, "epoch": 2228} {"train_loss": -23.63892936706543, "global_step": 184960, "epoch": 2228} {"train_loss": -23.801664352416992, "global_step": 184961, "epoch": 2228} {"train_loss": -23.670846939086914, "global_step": 184962, "epoch": 2228} {"train_loss": -24.08209800720215, "global_step": 184963, "epoch": 2228} {"train_loss": -23.871122360229492, "global_step": 184964, "epoch": 2228} {"train_loss": -24.23593521118164, "global_step": 184965, "epoch": 2228} {"train_loss": -24.24827766418457, "global_step": 184966, "epoch": 2228} {"train_loss": -23.511661529541016, "global_step": 184967, "epoch": 2228} {"train_loss": -24.198610305786133, "global_step": 184968, "epoch": 2228} {"train_loss": -23.86087989807129, "global_step": 184969, "epoch": 2228} {"train_loss": -23.956159591674805, "global_step": 184970, "epoch": 2228} {"train_loss": -23.571334838867188, "global_step": 184971, "epoch": 2228} {"train_loss": -24.028085708618164, "global_step": 184972, "epoch": 2228} {"train_loss": -24.07781982421875, "global_step": 184973, "epoch": 2228} {"train_loss": -23.687978744506836, "global_step": 184974, "epoch": 2228} {"train_loss": -23.9901180267334, "global_step": 184975, "epoch": 2228} {"train_loss": -23.984312057495117, "global_step": 184976, "epoch": 2228} {"train_loss": -23.91570472717285, "global_step": 184977, "epoch": 2228} {"train_loss": -23.791112899780273, "global_step": 184978, "epoch": 2228} {"train_loss": -23.83477783203125, "global_step": 184979, "epoch": 2228} {"train_loss": -23.472061157226562, "global_step": 184980, "epoch": 2228} {"train_loss": -24.013137817382812, "global_step": 184981, "epoch": 2228} {"train_loss": -23.467693328857422, "global_step": 184982, "epoch": 2228} {"train_loss": -23.580184936523438, "global_step": 184983, "epoch": 2228} {"train_loss": -24.0219783782959, "global_step": 184984, "epoch": 2228} {"train_loss": -23.7294864654541, "global_step": 184985, "epoch": 2228} {"train_loss": -24.04298210144043, "global_step": 184986, "epoch": 2228} {"train_loss": -24.09805679321289, "global_step": 184987, "epoch": 2228} {"train_loss": -24.14406394958496, "global_step": 184988, "epoch": 2228} {"train_loss": -24.28767967224121, "global_step": 184989, "epoch": 2228} {"train_loss": -23.931259155273438, "global_step": 184990, "epoch": 2228} {"train_loss": -23.90955924987793, "global_step": 184991, "epoch": 2228} {"train_loss": -24.122821807861328, "global_step": 184992, "epoch": 2228} {"train_loss": -24.18690299987793, "global_step": 184993, "epoch": 2228} {"train_loss": -24.537311553955078, "global_step": 184994, "epoch": 2228} {"train_loss": -23.86079216003418, "global_step": 184995, "epoch": 2228} {"train_loss": -24.50661277770996, "global_step": 184996, "epoch": 2228} {"train_loss": -24.006790161132812, "global_step": 184997, "epoch": 2228} {"train_loss": -23.993574142456055, "global_step": 184998, "epoch": 2228} {"train_loss": -24.39957618713379, "global_step": 184999, "epoch": 2228} {"train_loss": -24.08631706237793, "global_step": 185000, "epoch": 2228} {"train_loss": -24.303564071655273, "global_step": 185001, "epoch": 2228} {"train_loss": -24.286930084228516, "global_step": 185002, "epoch": 2228} {"train_loss": -24.391040802001953, "global_step": 185003, "epoch": 2228} {"train_loss": -24.201017379760742, "global_step": 185004, "epoch": 2228} {"train_loss": -24.22641372680664, "global_step": 185005, "epoch": 2228} {"train_loss": -23.951072003467974, "global_step": 185006, "epoch": 2228, "val_loss": 6407443.0} {"train_loss": -23.637067794799805, "global_step": 185007, "epoch": 2229} {"train_loss": -23.898221969604492, "global_step": 185008, "epoch": 2229} {"train_loss": -23.552391052246094, "global_step": 185009, "epoch": 2229} {"train_loss": -23.410673141479492, "global_step": 185010, "epoch": 2229} {"train_loss": -23.250600814819336, "global_step": 185011, "epoch": 2229} {"train_loss": -23.642362594604492, "global_step": 185012, "epoch": 2229} {"train_loss": -23.49772834777832, "global_step": 185013, "epoch": 2229} {"train_loss": -23.810863494873047, "global_step": 185014, "epoch": 2229} {"train_loss": -23.735387802124023, "global_step": 185015, "epoch": 2229} {"train_loss": -23.837982177734375, "global_step": 185016, "epoch": 2229} {"train_loss": -23.871217727661133, "global_step": 185017, "epoch": 2229} {"train_loss": -23.175064086914062, "global_step": 185018, "epoch": 2229} {"train_loss": -23.38922119140625, "global_step": 185019, "epoch": 2229} {"train_loss": -24.030010223388672, "global_step": 185020, "epoch": 2229} {"train_loss": -23.919828414916992, "global_step": 185021, "epoch": 2229} {"train_loss": -24.25186538696289, "global_step": 185022, "epoch": 2229} {"train_loss": -23.607385635375977, "global_step": 185023, "epoch": 2229} {"train_loss": -23.459726333618164, "global_step": 185024, "epoch": 2229} {"train_loss": -24.009597778320312, "global_step": 185025, "epoch": 2229} {"train_loss": -23.594654083251953, "global_step": 185026, "epoch": 2229} {"train_loss": -23.65239143371582, "global_step": 185027, "epoch": 2229} {"train_loss": -23.95182991027832, "global_step": 185028, "epoch": 2229} {"train_loss": -23.410953521728516, "global_step": 185029, "epoch": 2229} {"train_loss": -23.449722290039062, "global_step": 185030, "epoch": 2229} {"train_loss": -23.90228843688965, "global_step": 185031, "epoch": 2229} {"train_loss": -23.696470260620117, "global_step": 185032, "epoch": 2229} {"train_loss": -23.732501983642578, "global_step": 185033, "epoch": 2229} {"train_loss": -23.7391300201416, "global_step": 185034, "epoch": 2229} {"train_loss": -24.301618576049805, "global_step": 185035, "epoch": 2229} {"train_loss": -23.353757858276367, "global_step": 185036, "epoch": 2229} {"train_loss": -23.90046501159668, "global_step": 185037, "epoch": 2229} {"train_loss": -24.15338706970215, "global_step": 185038, "epoch": 2229} {"train_loss": -23.954574584960938, "global_step": 185039, "epoch": 2229} {"train_loss": -23.952810287475586, "global_step": 185040, "epoch": 2229} {"train_loss": -23.84995460510254, "global_step": 185041, "epoch": 2229} {"train_loss": -24.147674560546875, "global_step": 185042, "epoch": 2229} {"train_loss": -24.058820724487305, "global_step": 185043, "epoch": 2229} {"train_loss": -24.05353355407715, "global_step": 185044, "epoch": 2229} {"train_loss": -23.926477432250977, "global_step": 185045, "epoch": 2229} {"train_loss": -23.72665786743164, "global_step": 185046, "epoch": 2229} {"train_loss": -24.439393997192383, "global_step": 185047, "epoch": 2229} {"train_loss": -24.072832107543945, "global_step": 185048, "epoch": 2229} {"train_loss": -23.735794067382812, "global_step": 185049, "epoch": 2229} {"train_loss": -24.256467819213867, "global_step": 185050, "epoch": 2229} {"train_loss": -24.127634048461914, "global_step": 185051, "epoch": 2229} {"train_loss": -23.692846298217773, "global_step": 185052, "epoch": 2229} {"train_loss": -23.94862174987793, "global_step": 185053, "epoch": 2229} {"train_loss": -24.009140014648438, "global_step": 185054, "epoch": 2229} {"train_loss": -23.682828903198242, "global_step": 185055, "epoch": 2229} {"train_loss": -23.99367332458496, "global_step": 185056, "epoch": 2229} {"train_loss": -23.617431640625, "global_step": 185057, "epoch": 2229} {"train_loss": -23.97109031677246, "global_step": 185058, "epoch": 2229} {"train_loss": -23.974042892456055, "global_step": 185059, "epoch": 2229} {"train_loss": -24.18135643005371, "global_step": 185060, "epoch": 2229} {"train_loss": -23.977277755737305, "global_step": 185061, "epoch": 2229} {"train_loss": -23.919034957885742, "global_step": 185062, "epoch": 2229} {"train_loss": -24.212045669555664, "global_step": 185063, "epoch": 2229} {"train_loss": -24.03150749206543, "global_step": 185064, "epoch": 2229} {"train_loss": -24.134851455688477, "global_step": 185065, "epoch": 2229} {"train_loss": -23.763620376586914, "global_step": 185066, "epoch": 2229} {"train_loss": -23.943588256835938, "global_step": 185067, "epoch": 2229} {"train_loss": -24.100656509399414, "global_step": 185068, "epoch": 2229} {"train_loss": -23.690044403076172, "global_step": 185069, "epoch": 2229} {"train_loss": -23.747398376464844, "global_step": 185070, "epoch": 2229} {"train_loss": -23.777612686157227, "global_step": 185071, "epoch": 2229} {"train_loss": -23.992252349853516, "global_step": 185072, "epoch": 2229} {"train_loss": -23.636030197143555, "global_step": 185073, "epoch": 2229} {"train_loss": -23.79837417602539, "global_step": 185074, "epoch": 2229} {"train_loss": -24.348642349243164, "global_step": 185075, "epoch": 2229} {"train_loss": -24.202238082885742, "global_step": 185076, "epoch": 2229} {"train_loss": -24.068052291870117, "global_step": 185077, "epoch": 2229} {"train_loss": -24.220861434936523, "global_step": 185078, "epoch": 2229} {"train_loss": -23.989091873168945, "global_step": 185079, "epoch": 2229} {"train_loss": -24.0387020111084, "global_step": 185080, "epoch": 2229} {"train_loss": -23.80661392211914, "global_step": 185081, "epoch": 2229} {"train_loss": -23.691675186157227, "global_step": 185082, "epoch": 2229} {"train_loss": -24.03957748413086, "global_step": 185083, "epoch": 2229} {"train_loss": -23.807373046875, "global_step": 185084, "epoch": 2229} {"train_loss": -23.79887580871582, "global_step": 185085, "epoch": 2229} {"train_loss": -23.760269165039062, "global_step": 185086, "epoch": 2229} {"train_loss": -24.20014762878418, "global_step": 185087, "epoch": 2229} {"train_loss": -24.110700607299805, "global_step": 185088, "epoch": 2229} {"train_loss": -23.854553935039473, "global_step": 185089, "epoch": 2229, "val_loss": 6513468.0} {"train_loss": -24.156875610351562, "global_step": 185090, "epoch": 2230} {"train_loss": -23.694049835205078, "global_step": 185091, "epoch": 2230} {"train_loss": -24.036285400390625, "global_step": 185092, "epoch": 2230} {"train_loss": -23.956558227539062, "global_step": 185093, "epoch": 2230} {"train_loss": -23.263595581054688, "global_step": 185094, "epoch": 2230} {"train_loss": -24.01675796508789, "global_step": 185095, "epoch": 2230} {"train_loss": -24.1104679107666, "global_step": 185096, "epoch": 2230} {"train_loss": -24.1676025390625, "global_step": 185097, "epoch": 2230} {"train_loss": -23.459638595581055, "global_step": 185098, "epoch": 2230} {"train_loss": -24.200828552246094, "global_step": 185099, "epoch": 2230} {"train_loss": -23.841257095336914, "global_step": 185100, "epoch": 2230} {"train_loss": -23.784452438354492, "global_step": 185101, "epoch": 2230} {"train_loss": -24.01287841796875, "global_step": 185102, "epoch": 2230} {"train_loss": -23.838851928710938, "global_step": 185103, "epoch": 2230} {"train_loss": -24.355031967163086, "global_step": 185104, "epoch": 2230} {"train_loss": -23.939300537109375, "global_step": 185105, "epoch": 2230} {"train_loss": -24.116546630859375, "global_step": 185106, "epoch": 2230} {"train_loss": -23.945363998413086, "global_step": 185107, "epoch": 2230} {"train_loss": -23.906177520751953, "global_step": 185108, "epoch": 2230} {"train_loss": -24.092008590698242, "global_step": 185109, "epoch": 2230} {"train_loss": -23.77058219909668, "global_step": 185110, "epoch": 2230} {"train_loss": -24.0449275970459, "global_step": 185111, "epoch": 2230} {"train_loss": -23.6392879486084, "global_step": 185112, "epoch": 2230} {"train_loss": -23.945173263549805, "global_step": 185113, "epoch": 2230} {"train_loss": -24.182031631469727, "global_step": 185114, "epoch": 2230} {"train_loss": -23.705638885498047, "global_step": 185115, "epoch": 2230} {"train_loss": -24.14198112487793, "global_step": 185116, "epoch": 2230} {"train_loss": -23.964391708374023, "global_step": 185117, "epoch": 2230} {"train_loss": -24.33827018737793, "global_step": 185118, "epoch": 2230} {"train_loss": -24.19055938720703, "global_step": 185119, "epoch": 2230} {"train_loss": -24.387060165405273, "global_step": 185120, "epoch": 2230} {"train_loss": -23.950410842895508, "global_step": 185121, "epoch": 2230} {"train_loss": -23.892288208007812, "global_step": 185122, "epoch": 2230} {"train_loss": -24.031810760498047, "global_step": 185123, "epoch": 2230} {"train_loss": -24.514684677124023, "global_step": 185124, "epoch": 2230} {"train_loss": -24.142589569091797, "global_step": 185125, "epoch": 2230} {"train_loss": -24.08284568786621, "global_step": 185126, "epoch": 2230} {"train_loss": -23.824453353881836, "global_step": 185127, "epoch": 2230} {"train_loss": -24.127004623413086, "global_step": 185128, "epoch": 2230} {"train_loss": -23.699647903442383, "global_step": 185129, "epoch": 2230} {"train_loss": -23.956750869750977, "global_step": 185130, "epoch": 2230} {"train_loss": -24.25957679748535, "global_step": 185131, "epoch": 2230} {"train_loss": -23.965869903564453, "global_step": 185132, "epoch": 2230} {"train_loss": -23.65936851501465, "global_step": 185133, "epoch": 2230} {"train_loss": -24.05059814453125, "global_step": 185134, "epoch": 2230} {"train_loss": -23.841934204101562, "global_step": 185135, "epoch": 2230} {"train_loss": -23.478422164916992, "global_step": 185136, "epoch": 2230} {"train_loss": -23.689517974853516, "global_step": 185137, "epoch": 2230} {"train_loss": -24.005170822143555, "global_step": 185138, "epoch": 2230} {"train_loss": -24.0238037109375, "global_step": 185139, "epoch": 2230} {"train_loss": -23.808124542236328, "global_step": 185140, "epoch": 2230} {"train_loss": -24.02685546875, "global_step": 185141, "epoch": 2230} {"train_loss": -24.325695037841797, "global_step": 185142, "epoch": 2230} {"train_loss": -24.185834884643555, "global_step": 185143, "epoch": 2230} {"train_loss": -24.272123336791992, "global_step": 185144, "epoch": 2230} {"train_loss": -23.84232521057129, "global_step": 185145, "epoch": 2230} {"train_loss": -23.7966251373291, "global_step": 185146, "epoch": 2230} {"train_loss": -24.077238082885742, "global_step": 185147, "epoch": 2230} {"train_loss": -24.304731369018555, "global_step": 185148, "epoch": 2230} {"train_loss": -24.05666732788086, "global_step": 185149, "epoch": 2230} {"train_loss": -24.000837326049805, "global_step": 185150, "epoch": 2230} {"train_loss": -23.858171463012695, "global_step": 185151, "epoch": 2230} {"train_loss": -24.223852157592773, "global_step": 185152, "epoch": 2230} {"train_loss": -24.206592559814453, "global_step": 185153, "epoch": 2230} {"train_loss": -23.69854164123535, "global_step": 185154, "epoch": 2230} {"train_loss": -23.670095443725586, "global_step": 185155, "epoch": 2230} {"train_loss": -24.050750732421875, "global_step": 185156, "epoch": 2230} {"train_loss": -23.834550857543945, "global_step": 185157, "epoch": 2230} {"train_loss": -24.27247428894043, "global_step": 185158, "epoch": 2230} {"train_loss": -23.998498916625977, "global_step": 185159, "epoch": 2230} {"train_loss": -24.014881134033203, "global_step": 185160, "epoch": 2230} {"train_loss": -24.095441818237305, "global_step": 185161, "epoch": 2230} {"train_loss": -23.818771362304688, "global_step": 185162, "epoch": 2230} {"train_loss": -24.112476348876953, "global_step": 185163, "epoch": 2230} {"train_loss": -24.312070846557617, "global_step": 185164, "epoch": 2230} {"train_loss": -23.988563537597656, "global_step": 185165, "epoch": 2230} {"train_loss": -24.25929069519043, "global_step": 185166, "epoch": 2230} {"train_loss": -24.275541305541992, "global_step": 185167, "epoch": 2230} {"train_loss": -24.30280876159668, "global_step": 185168, "epoch": 2230} {"train_loss": -24.072574615478516, "global_step": 185169, "epoch": 2230} {"train_loss": -24.227712631225586, "global_step": 185170, "epoch": 2230} {"train_loss": -24.0050048828125, "global_step": 185171, "epoch": 2230} {"train_loss": -24.026085934007025, "global_step": 185172, "epoch": 2230, "val_loss": 6550560.0} {"train_loss": -23.151447296142578, "global_step": 185173, "epoch": 2231} {"train_loss": -23.7714900970459, "global_step": 185174, "epoch": 2231} {"train_loss": -23.149873733520508, "global_step": 185175, "epoch": 2231} {"train_loss": -23.602670669555664, "global_step": 185176, "epoch": 2231} {"train_loss": -23.68492889404297, "global_step": 185177, "epoch": 2231} {"train_loss": -23.461477279663086, "global_step": 185178, "epoch": 2231} {"train_loss": -23.547643661499023, "global_step": 185179, "epoch": 2231} {"train_loss": -23.44217872619629, "global_step": 185180, "epoch": 2231} {"train_loss": -24.128101348876953, "global_step": 185181, "epoch": 2231} {"train_loss": -23.312089920043945, "global_step": 185182, "epoch": 2231} {"train_loss": -23.776124954223633, "global_step": 185183, "epoch": 2231} {"train_loss": -24.195837020874023, "global_step": 185184, "epoch": 2231} {"train_loss": -24.028478622436523, "global_step": 185185, "epoch": 2231} {"train_loss": -23.633161544799805, "global_step": 185186, "epoch": 2231} {"train_loss": -23.727807998657227, "global_step": 185187, "epoch": 2231} {"train_loss": -24.0224666595459, "global_step": 185188, "epoch": 2231} {"train_loss": -23.396020889282227, "global_step": 185189, "epoch": 2231} {"train_loss": -23.753015518188477, "global_step": 185190, "epoch": 2231} {"train_loss": -23.778093338012695, "global_step": 185191, "epoch": 2231} {"train_loss": -23.269575119018555, "global_step": 185192, "epoch": 2231} {"train_loss": -23.645387649536133, "global_step": 185193, "epoch": 2231} {"train_loss": -23.959074020385742, "global_step": 185194, "epoch": 2231} {"train_loss": -23.643993377685547, "global_step": 185195, "epoch": 2231} {"train_loss": -23.881052017211914, "global_step": 185196, "epoch": 2231} {"train_loss": -24.27412986755371, "global_step": 185197, "epoch": 2231} {"train_loss": -24.172529220581055, "global_step": 185198, "epoch": 2231} {"train_loss": -23.961774826049805, "global_step": 185199, "epoch": 2231} {"train_loss": -23.87571907043457, "global_step": 185200, "epoch": 2231} {"train_loss": -23.885215759277344, "global_step": 185201, "epoch": 2231} {"train_loss": -24.05661964416504, "global_step": 185202, "epoch": 2231} {"train_loss": -24.03026008605957, "global_step": 185203, "epoch": 2231} {"train_loss": -23.57537269592285, "global_step": 185204, "epoch": 2231} {"train_loss": -23.790971755981445, "global_step": 185205, "epoch": 2231} {"train_loss": -23.883350372314453, "global_step": 185206, "epoch": 2231} {"train_loss": -24.230417251586914, "global_step": 185207, "epoch": 2231} {"train_loss": -24.200620651245117, "global_step": 185208, "epoch": 2231} {"train_loss": -23.82896614074707, "global_step": 185209, "epoch": 2231} {"train_loss": -24.02143669128418, "global_step": 185210, "epoch": 2231} {"train_loss": -24.126422882080078, "global_step": 185211, "epoch": 2231} {"train_loss": -24.223527908325195, "global_step": 185212, "epoch": 2231} {"train_loss": -23.867719650268555, "global_step": 185213, "epoch": 2231} {"train_loss": -24.143529891967773, "global_step": 185214, "epoch": 2231} {"train_loss": -23.918954849243164, "global_step": 185215, "epoch": 2231} {"train_loss": -23.50248908996582, "global_step": 185216, "epoch": 2231} {"train_loss": -23.974119186401367, "global_step": 185217, "epoch": 2231} {"train_loss": -23.935888290405273, "global_step": 185218, "epoch": 2231} {"train_loss": -23.429677963256836, "global_step": 185219, "epoch": 2231} {"train_loss": -24.05035400390625, "global_step": 185220, "epoch": 2231} {"train_loss": -23.786890029907227, "global_step": 185221, "epoch": 2231} {"train_loss": -24.148462295532227, "global_step": 185222, "epoch": 2231} {"train_loss": -23.57447052001953, "global_step": 185223, "epoch": 2231} {"train_loss": -23.87375259399414, "global_step": 185224, "epoch": 2231} {"train_loss": -24.02195930480957, "global_step": 185225, "epoch": 2231} {"train_loss": -24.006738662719727, "global_step": 185226, "epoch": 2231} {"train_loss": -23.874013900756836, "global_step": 185227, "epoch": 2231} {"train_loss": -23.919536590576172, "global_step": 185228, "epoch": 2231} {"train_loss": -23.508953094482422, "global_step": 185229, "epoch": 2231} {"train_loss": -23.820180892944336, "global_step": 185230, "epoch": 2231} {"train_loss": -23.979482650756836, "global_step": 185231, "epoch": 2231} {"train_loss": -24.28887939453125, "global_step": 185232, "epoch": 2231} {"train_loss": -24.33823585510254, "global_step": 185233, "epoch": 2231} {"train_loss": -23.89225959777832, "global_step": 185234, "epoch": 2231} {"train_loss": -23.94609832763672, "global_step": 185235, "epoch": 2231} {"train_loss": -23.939224243164062, "global_step": 185236, "epoch": 2231} {"train_loss": -23.968273162841797, "global_step": 185237, "epoch": 2231} {"train_loss": -24.053712844848633, "global_step": 185238, "epoch": 2231} {"train_loss": -24.194820404052734, "global_step": 185239, "epoch": 2231} {"train_loss": -24.255773544311523, "global_step": 185240, "epoch": 2231} {"train_loss": -24.08742332458496, "global_step": 185241, "epoch": 2231} {"train_loss": -24.114225387573242, "global_step": 185242, "epoch": 2231} {"train_loss": -23.74561882019043, "global_step": 185243, "epoch": 2231} {"train_loss": -23.557924270629883, "global_step": 185244, "epoch": 2231} {"train_loss": -23.699918746948242, "global_step": 185245, "epoch": 2231} {"train_loss": -23.73970603942871, "global_step": 185246, "epoch": 2231} {"train_loss": -24.2646427154541, "global_step": 185247, "epoch": 2231} {"train_loss": -23.97989273071289, "global_step": 185248, "epoch": 2231} {"train_loss": -24.292985916137695, "global_step": 185249, "epoch": 2231} {"train_loss": -24.390121459960938, "global_step": 185250, "epoch": 2231} {"train_loss": -23.99030876159668, "global_step": 185251, "epoch": 2231} {"train_loss": -23.8526554107666, "global_step": 185252, "epoch": 2231} {"train_loss": -24.386526107788086, "global_step": 185253, "epoch": 2231} {"train_loss": -23.980329513549805, "global_step": 185254, "epoch": 2231} {"train_loss": -23.880193963108294, "global_step": 185255, "epoch": 2231, "val_loss": 6545851.0} {"train_loss": -20.3513240814209, "global_step": 185256, "epoch": 2232} {"train_loss": -22.55555534362793, "global_step": 185257, "epoch": 2232} {"train_loss": -22.32657814025879, "global_step": 185258, "epoch": 2232} {"train_loss": -23.283655166625977, "global_step": 185259, "epoch": 2232} {"train_loss": -22.11248779296875, "global_step": 185260, "epoch": 2232} {"train_loss": -23.10502815246582, "global_step": 185261, "epoch": 2232} {"train_loss": -23.310428619384766, "global_step": 185262, "epoch": 2232} {"train_loss": -22.940019607543945, "global_step": 185263, "epoch": 2232} {"train_loss": -23.381444931030273, "global_step": 185264, "epoch": 2232} {"train_loss": -23.38360595703125, "global_step": 185265, "epoch": 2232} {"train_loss": -23.331701278686523, "global_step": 185266, "epoch": 2232} {"train_loss": -22.863290786743164, "global_step": 185267, "epoch": 2232} {"train_loss": -23.422029495239258, "global_step": 185268, "epoch": 2232} {"train_loss": -22.9210147857666, "global_step": 185269, "epoch": 2232} {"train_loss": -23.139240264892578, "global_step": 185270, "epoch": 2232} {"train_loss": -23.285572052001953, "global_step": 185271, "epoch": 2232} {"train_loss": -23.61048126220703, "global_step": 185272, "epoch": 2232} {"train_loss": -23.572851181030273, "global_step": 185273, "epoch": 2232} {"train_loss": -23.737634658813477, "global_step": 185274, "epoch": 2232} {"train_loss": -23.13019371032715, "global_step": 185275, "epoch": 2232} {"train_loss": -23.52176856994629, "global_step": 185276, "epoch": 2232} {"train_loss": -23.440109252929688, "global_step": 185277, "epoch": 2232} {"train_loss": -23.27699089050293, "global_step": 185278, "epoch": 2232} {"train_loss": -23.4184513092041, "global_step": 185279, "epoch": 2232} {"train_loss": -22.939905166625977, "global_step": 185280, "epoch": 2232} {"train_loss": -23.03850555419922, "global_step": 185281, "epoch": 2232} {"train_loss": -23.97798728942871, "global_step": 185282, "epoch": 2232} {"train_loss": -23.24322509765625, "global_step": 185283, "epoch": 2232} {"train_loss": -23.77811050415039, "global_step": 185284, "epoch": 2232} {"train_loss": -23.155929565429688, "global_step": 185285, "epoch": 2232} {"train_loss": -23.650943756103516, "global_step": 185286, "epoch": 2232} {"train_loss": -23.692068099975586, "global_step": 185287, "epoch": 2232} {"train_loss": -23.438278198242188, "global_step": 185288, "epoch": 2232} {"train_loss": -23.2954158782959, "global_step": 185289, "epoch": 2232} {"train_loss": -23.396631240844727, "global_step": 185290, "epoch": 2232} {"train_loss": -23.6536865234375, "global_step": 185291, "epoch": 2232} {"train_loss": -23.565052032470703, "global_step": 185292, "epoch": 2232} {"train_loss": -23.663888931274414, "global_step": 185293, "epoch": 2232} {"train_loss": -23.701261520385742, "global_step": 185294, "epoch": 2232} {"train_loss": -23.98025131225586, "global_step": 185295, "epoch": 2232} {"train_loss": -24.023853302001953, "global_step": 185296, "epoch": 2232} {"train_loss": -23.745101928710938, "global_step": 185297, "epoch": 2232} {"train_loss": -24.158159255981445, "global_step": 185298, "epoch": 2232} {"train_loss": -23.75624656677246, "global_step": 185299, "epoch": 2232} {"train_loss": -24.058629989624023, "global_step": 185300, "epoch": 2232} {"train_loss": -23.68768310546875, "global_step": 185301, "epoch": 2232} {"train_loss": -24.279220581054688, "global_step": 185302, "epoch": 2232} {"train_loss": -23.817384719848633, "global_step": 185303, "epoch": 2232} {"train_loss": -24.009077072143555, "global_step": 185304, "epoch": 2232} {"train_loss": -24.06842613220215, "global_step": 185305, "epoch": 2232} {"train_loss": -24.020254135131836, "global_step": 185306, "epoch": 2232} {"train_loss": -23.842456817626953, "global_step": 185307, "epoch": 2232} {"train_loss": -23.948503494262695, "global_step": 185308, "epoch": 2232} {"train_loss": -24.173175811767578, "global_step": 185309, "epoch": 2232} {"train_loss": -23.662395477294922, "global_step": 185310, "epoch": 2232} {"train_loss": -24.00315284729004, "global_step": 185311, "epoch": 2232} {"train_loss": -23.84242820739746, "global_step": 185312, "epoch": 2232} {"train_loss": -24.016935348510742, "global_step": 185313, "epoch": 2232} {"train_loss": -24.356874465942383, "global_step": 185314, "epoch": 2232} {"train_loss": -23.840620040893555, "global_step": 185315, "epoch": 2232} {"train_loss": -23.821989059448242, "global_step": 185316, "epoch": 2232} {"train_loss": -24.047351837158203, "global_step": 185317, "epoch": 2232} {"train_loss": -24.18845558166504, "global_step": 185318, "epoch": 2232} {"train_loss": -24.228248596191406, "global_step": 185319, "epoch": 2232} {"train_loss": -24.281742095947266, "global_step": 185320, "epoch": 2232} {"train_loss": -24.32438087463379, "global_step": 185321, "epoch": 2232} {"train_loss": -24.037784576416016, "global_step": 185322, "epoch": 2232} {"train_loss": -24.509546279907227, "global_step": 185323, "epoch": 2232} {"train_loss": -24.241052627563477, "global_step": 185324, "epoch": 2232} {"train_loss": -23.986194610595703, "global_step": 185325, "epoch": 2232} {"train_loss": -23.645099639892578, "global_step": 185326, "epoch": 2232} {"train_loss": -23.84954833984375, "global_step": 185327, "epoch": 2232} {"train_loss": -23.910842895507812, "global_step": 185328, "epoch": 2232} {"train_loss": -24.05858039855957, "global_step": 185329, "epoch": 2232} {"train_loss": -23.852643966674805, "global_step": 185330, "epoch": 2232} {"train_loss": -24.172252655029297, "global_step": 185331, "epoch": 2232} {"train_loss": -23.92313003540039, "global_step": 185332, "epoch": 2232} {"train_loss": -24.12688636779785, "global_step": 185333, "epoch": 2232} {"train_loss": -24.486129760742188, "global_step": 185334, "epoch": 2232} {"train_loss": -24.334896087646484, "global_step": 185335, "epoch": 2232} {"train_loss": -23.887338638305664, "global_step": 185336, "epoch": 2232} {"train_loss": -24.136415481567383, "global_step": 185337, "epoch": 2232} {"train_loss": -23.653015182678956, "global_step": 185338, "epoch": 2232, "val_loss": 6521417.0} {"train_loss": -23.14420509338379, "global_step": 185339, "epoch": 2233} {"train_loss": -23.135465621948242, "global_step": 185340, "epoch": 2233} {"train_loss": -23.71221923828125, "global_step": 185341, "epoch": 2233} {"train_loss": -23.646711349487305, "global_step": 185342, "epoch": 2233} {"train_loss": -23.360700607299805, "global_step": 185343, "epoch": 2233} {"train_loss": -23.596960067749023, "global_step": 185344, "epoch": 2233} {"train_loss": -23.848081588745117, "global_step": 185345, "epoch": 2233} {"train_loss": -23.858476638793945, "global_step": 185346, "epoch": 2233} {"train_loss": -23.694623947143555, "global_step": 185347, "epoch": 2233} {"train_loss": -23.973735809326172, "global_step": 185348, "epoch": 2233} {"train_loss": -23.653608322143555, "global_step": 185349, "epoch": 2233} {"train_loss": -23.662094116210938, "global_step": 185350, "epoch": 2233} {"train_loss": -24.03965187072754, "global_step": 185351, "epoch": 2233} {"train_loss": -23.90753173828125, "global_step": 185352, "epoch": 2233} {"train_loss": -23.93695068359375, "global_step": 185353, "epoch": 2233} {"train_loss": -24.11745262145996, "global_step": 185354, "epoch": 2233} {"train_loss": -23.701900482177734, "global_step": 185355, "epoch": 2233} {"train_loss": -24.2069149017334, "global_step": 185356, "epoch": 2233} {"train_loss": -24.10909080505371, "global_step": 185357, "epoch": 2233} {"train_loss": -23.712156295776367, "global_step": 185358, "epoch": 2233} {"train_loss": -24.02483558654785, "global_step": 185359, "epoch": 2233} {"train_loss": -23.84376335144043, "global_step": 185360, "epoch": 2233} {"train_loss": -24.164196014404297, "global_step": 185361, "epoch": 2233} {"train_loss": -23.91576385498047, "global_step": 185362, "epoch": 2233} {"train_loss": -23.954687118530273, "global_step": 185363, "epoch": 2233} {"train_loss": -23.724985122680664, "global_step": 185364, "epoch": 2233} {"train_loss": -23.933673858642578, "global_step": 185365, "epoch": 2233} {"train_loss": -23.905471801757812, "global_step": 185366, "epoch": 2233} {"train_loss": -23.929075241088867, "global_step": 185367, "epoch": 2233} {"train_loss": -24.128990173339844, "global_step": 185368, "epoch": 2233} {"train_loss": -23.971139907836914, "global_step": 185369, "epoch": 2233} {"train_loss": -24.15509605407715, "global_step": 185370, "epoch": 2233} {"train_loss": -23.905797958374023, "global_step": 185371, "epoch": 2233} {"train_loss": -23.849172592163086, "global_step": 185372, "epoch": 2233} {"train_loss": -23.8380184173584, "global_step": 185373, "epoch": 2233} {"train_loss": -23.953292846679688, "global_step": 185374, "epoch": 2233} {"train_loss": -23.877239227294922, "global_step": 185375, "epoch": 2233} {"train_loss": -23.82285499572754, "global_step": 185376, "epoch": 2233} {"train_loss": -23.974599838256836, "global_step": 185377, "epoch": 2233} {"train_loss": -24.145811080932617, "global_step": 185378, "epoch": 2233} {"train_loss": -24.0830078125, "global_step": 185379, "epoch": 2233} {"train_loss": -23.979848861694336, "global_step": 185380, "epoch": 2233} {"train_loss": -24.109088897705078, "global_step": 185381, "epoch": 2233} {"train_loss": -23.795984268188477, "global_step": 185382, "epoch": 2233} {"train_loss": -23.83890724182129, "global_step": 185383, "epoch": 2233} {"train_loss": -23.88791275024414, "global_step": 185384, "epoch": 2233} {"train_loss": -23.879077911376953, "global_step": 185385, "epoch": 2233} {"train_loss": -23.915925979614258, "global_step": 185386, "epoch": 2233} {"train_loss": -24.228567123413086, "global_step": 185387, "epoch": 2233} {"train_loss": -24.060596466064453, "global_step": 185388, "epoch": 2233} {"train_loss": -23.717267990112305, "global_step": 185389, "epoch": 2233} {"train_loss": -24.111679077148438, "global_step": 185390, "epoch": 2233} {"train_loss": -24.1132869720459, "global_step": 185391, "epoch": 2233} {"train_loss": -24.170766830444336, "global_step": 185392, "epoch": 2233} {"train_loss": -24.03409194946289, "global_step": 185393, "epoch": 2233} {"train_loss": -23.796249389648438, "global_step": 185394, "epoch": 2233} {"train_loss": -23.840087890625, "global_step": 185395, "epoch": 2233} {"train_loss": -23.951702117919922, "global_step": 185396, "epoch": 2233} {"train_loss": -24.35386085510254, "global_step": 185397, "epoch": 2233} {"train_loss": -23.939563751220703, "global_step": 185398, "epoch": 2233} {"train_loss": -23.900070190429688, "global_step": 185399, "epoch": 2233} {"train_loss": -24.199506759643555, "global_step": 185400, "epoch": 2233} {"train_loss": -24.045480728149414, "global_step": 185401, "epoch": 2233} {"train_loss": -24.133718490600586, "global_step": 185402, "epoch": 2233} {"train_loss": -23.851959228515625, "global_step": 185403, "epoch": 2233} {"train_loss": -24.209577560424805, "global_step": 185404, "epoch": 2233} {"train_loss": -24.06668472290039, "global_step": 185405, "epoch": 2233} {"train_loss": -23.74704360961914, "global_step": 185406, "epoch": 2233} {"train_loss": -24.166521072387695, "global_step": 185407, "epoch": 2233} {"train_loss": -24.059431076049805, "global_step": 185408, "epoch": 2233} {"train_loss": -23.848758697509766, "global_step": 185409, "epoch": 2233} {"train_loss": -24.19404411315918, "global_step": 185410, "epoch": 2233} {"train_loss": -24.097156524658203, "global_step": 185411, "epoch": 2233} {"train_loss": -24.035720825195312, "global_step": 185412, "epoch": 2233} {"train_loss": -24.013750076293945, "global_step": 185413, "epoch": 2233} {"train_loss": -23.83475685119629, "global_step": 185414, "epoch": 2233} {"train_loss": -23.85200309753418, "global_step": 185415, "epoch": 2233} {"train_loss": -24.15863609313965, "global_step": 185416, "epoch": 2233} {"train_loss": -24.0299072265625, "global_step": 185417, "epoch": 2233} {"train_loss": -23.945798873901367, "global_step": 185418, "epoch": 2233} {"train_loss": -23.887704849243164, "global_step": 185419, "epoch": 2233} {"train_loss": -23.60077667236328, "global_step": 185420, "epoch": 2233} {"train_loss": -23.912927512662957, "global_step": 185421, "epoch": 2233, "val_loss": 6587397.5} {"train_loss": -23.445819854736328, "global_step": 185422, "epoch": 2234} {"train_loss": -23.3247127532959, "global_step": 185423, "epoch": 2234} {"train_loss": -23.43116569519043, "global_step": 185424, "epoch": 2234} {"train_loss": -23.285036087036133, "global_step": 185425, "epoch": 2234} {"train_loss": -23.597715377807617, "global_step": 185426, "epoch": 2234} {"train_loss": -23.2991943359375, "global_step": 185427, "epoch": 2234} {"train_loss": -23.49806022644043, "global_step": 185428, "epoch": 2234} {"train_loss": -23.95540428161621, "global_step": 185429, "epoch": 2234} {"train_loss": -23.56934928894043, "global_step": 185430, "epoch": 2234} {"train_loss": -23.844053268432617, "global_step": 185431, "epoch": 2234} {"train_loss": -23.962921142578125, "global_step": 185432, "epoch": 2234} {"train_loss": -23.70318031311035, "global_step": 185433, "epoch": 2234} {"train_loss": -23.600622177124023, "global_step": 185434, "epoch": 2234} {"train_loss": -23.830930709838867, "global_step": 185435, "epoch": 2234} {"train_loss": -23.811267852783203, "global_step": 185436, "epoch": 2234} {"train_loss": -24.128543853759766, "global_step": 185437, "epoch": 2234} {"train_loss": -24.071195602416992, "global_step": 185438, "epoch": 2234} {"train_loss": -23.946659088134766, "global_step": 185439, "epoch": 2234} {"train_loss": -23.995140075683594, "global_step": 185440, "epoch": 2234} {"train_loss": -23.9082088470459, "global_step": 185441, "epoch": 2234} {"train_loss": -24.30078125, "global_step": 185442, "epoch": 2234} {"train_loss": -24.015024185180664, "global_step": 185443, "epoch": 2234} {"train_loss": -24.17732810974121, "global_step": 185444, "epoch": 2234} {"train_loss": -24.55269432067871, "global_step": 185445, "epoch": 2234} {"train_loss": -24.080785751342773, "global_step": 185446, "epoch": 2234} {"train_loss": -24.35645866394043, "global_step": 185447, "epoch": 2234} {"train_loss": -24.055679321289062, "global_step": 185448, "epoch": 2234} {"train_loss": -23.9586181640625, "global_step": 185449, "epoch": 2234} {"train_loss": -23.765146255493164, "global_step": 185450, "epoch": 2234} {"train_loss": -24.099925994873047, "global_step": 185451, "epoch": 2234} {"train_loss": -24.15863800048828, "global_step": 185452, "epoch": 2234} {"train_loss": -24.073575973510742, "global_step": 185453, "epoch": 2234} {"train_loss": -24.224864959716797, "global_step": 185454, "epoch": 2234} {"train_loss": -24.190885543823242, "global_step": 185455, "epoch": 2234} {"train_loss": -23.890304565429688, "global_step": 185456, "epoch": 2234} {"train_loss": -24.157058715820312, "global_step": 185457, "epoch": 2234} {"train_loss": -24.09064292907715, "global_step": 185458, "epoch": 2234} {"train_loss": -23.566320419311523, "global_step": 185459, "epoch": 2234} {"train_loss": -24.003015518188477, "global_step": 185460, "epoch": 2234} {"train_loss": -24.22336769104004, "global_step": 185461, "epoch": 2234} {"train_loss": -23.69959831237793, "global_step": 185462, "epoch": 2234} {"train_loss": -24.025192260742188, "global_step": 185463, "epoch": 2234} {"train_loss": -24.375669479370117, "global_step": 185464, "epoch": 2234} {"train_loss": -23.729764938354492, "global_step": 185465, "epoch": 2234} {"train_loss": -24.24647331237793, "global_step": 185466, "epoch": 2234} {"train_loss": -23.892179489135742, "global_step": 185467, "epoch": 2234} {"train_loss": -24.07912254333496, "global_step": 185468, "epoch": 2234} {"train_loss": -23.652677536010742, "global_step": 185469, "epoch": 2234} {"train_loss": -24.21675682067871, "global_step": 185470, "epoch": 2234} {"train_loss": -24.016355514526367, "global_step": 185471, "epoch": 2234} {"train_loss": -24.22544288635254, "global_step": 185472, "epoch": 2234} {"train_loss": -23.88031578063965, "global_step": 185473, "epoch": 2234} {"train_loss": -23.61110496520996, "global_step": 185474, "epoch": 2234} {"train_loss": -24.315378189086914, "global_step": 185475, "epoch": 2234} {"train_loss": -24.513431549072266, "global_step": 185476, "epoch": 2234} {"train_loss": -24.036468505859375, "global_step": 185477, "epoch": 2234} {"train_loss": -24.16144371032715, "global_step": 185478, "epoch": 2234} {"train_loss": -23.82868766784668, "global_step": 185479, "epoch": 2234} {"train_loss": -24.1732177734375, "global_step": 185480, "epoch": 2234} {"train_loss": -24.261598587036133, "global_step": 185481, "epoch": 2234} {"train_loss": -24.09321403503418, "global_step": 185482, "epoch": 2234} {"train_loss": -24.13388442993164, "global_step": 185483, "epoch": 2234} {"train_loss": -23.949861526489258, "global_step": 185484, "epoch": 2234} {"train_loss": -24.11432456970215, "global_step": 185485, "epoch": 2234} {"train_loss": -23.92519187927246, "global_step": 185486, "epoch": 2234} {"train_loss": -24.130638122558594, "global_step": 185487, "epoch": 2234} {"train_loss": -24.097715377807617, "global_step": 185488, "epoch": 2234} {"train_loss": -23.992740631103516, "global_step": 185489, "epoch": 2234} {"train_loss": -24.34370231628418, "global_step": 185490, "epoch": 2234} {"train_loss": -23.889591217041016, "global_step": 185491, "epoch": 2234} {"train_loss": -23.617061614990234, "global_step": 185492, "epoch": 2234} {"train_loss": -24.156333923339844, "global_step": 185493, "epoch": 2234} {"train_loss": -24.236675262451172, "global_step": 185494, "epoch": 2234} {"train_loss": -23.792341232299805, "global_step": 185495, "epoch": 2234} {"train_loss": -24.001874923706055, "global_step": 185496, "epoch": 2234} {"train_loss": -23.73647117614746, "global_step": 185497, "epoch": 2234} {"train_loss": -24.15423011779785, "global_step": 185498, "epoch": 2234} {"train_loss": -24.03036880493164, "global_step": 185499, "epoch": 2234} {"train_loss": -24.107458114624023, "global_step": 185500, "epoch": 2234} {"train_loss": -24.0638427734375, "global_step": 185501, "epoch": 2234} {"train_loss": -24.248201370239258, "global_step": 185502, "epoch": 2234} {"train_loss": -24.0084285736084, "global_step": 185503, "epoch": 2234} {"train_loss": -23.982247685811604, "global_step": 185504, "epoch": 2234, "val_loss": 6522169.5} {"train_loss": -23.13612174987793, "global_step": 185505, "epoch": 2235} {"train_loss": -23.68842887878418, "global_step": 185506, "epoch": 2235} {"train_loss": -23.34653663635254, "global_step": 185507, "epoch": 2235} {"train_loss": -23.55662727355957, "global_step": 185508, "epoch": 2235} {"train_loss": -23.44639015197754, "global_step": 185509, "epoch": 2235} {"train_loss": -23.6801815032959, "global_step": 185510, "epoch": 2235} {"train_loss": -23.577739715576172, "global_step": 185511, "epoch": 2235} {"train_loss": -23.591114044189453, "global_step": 185512, "epoch": 2235} {"train_loss": -24.024850845336914, "global_step": 185513, "epoch": 2235} {"train_loss": -23.365869522094727, "global_step": 185514, "epoch": 2235} {"train_loss": -23.77249526977539, "global_step": 185515, "epoch": 2235} {"train_loss": -23.48187255859375, "global_step": 185516, "epoch": 2235} {"train_loss": -23.801790237426758, "global_step": 185517, "epoch": 2235} {"train_loss": -23.896055221557617, "global_step": 185518, "epoch": 2235} {"train_loss": -23.72907829284668, "global_step": 185519, "epoch": 2235} {"train_loss": -23.83084487915039, "global_step": 185520, "epoch": 2235} {"train_loss": -23.87598991394043, "global_step": 185521, "epoch": 2235} {"train_loss": -23.372596740722656, "global_step": 185522, "epoch": 2235} {"train_loss": -23.538244247436523, "global_step": 185523, "epoch": 2235} {"train_loss": -23.98183250427246, "global_step": 185524, "epoch": 2235} {"train_loss": -23.923141479492188, "global_step": 185525, "epoch": 2235} {"train_loss": -23.671545028686523, "global_step": 185526, "epoch": 2235} {"train_loss": -23.89275550842285, "global_step": 185527, "epoch": 2235} {"train_loss": -24.273527145385742, "global_step": 185528, "epoch": 2235} {"train_loss": -23.736661911010742, "global_step": 185529, "epoch": 2235} {"train_loss": -23.876834869384766, "global_step": 185530, "epoch": 2235} {"train_loss": -24.073577880859375, "global_step": 185531, "epoch": 2235} {"train_loss": -23.956762313842773, "global_step": 185532, "epoch": 2235} {"train_loss": -23.987579345703125, "global_step": 185533, "epoch": 2235} {"train_loss": -23.949308395385742, "global_step": 185534, "epoch": 2235} {"train_loss": -24.1467342376709, "global_step": 185535, "epoch": 2235} {"train_loss": -23.618057250976562, "global_step": 185536, "epoch": 2235} {"train_loss": -23.828210830688477, "global_step": 185537, "epoch": 2235} {"train_loss": -23.866065979003906, "global_step": 185538, "epoch": 2235} {"train_loss": -23.944189071655273, "global_step": 185539, "epoch": 2235} {"train_loss": -24.117746353149414, "global_step": 185540, "epoch": 2235} {"train_loss": -24.252281188964844, "global_step": 185541, "epoch": 2235} {"train_loss": -23.965103149414062, "global_step": 185542, "epoch": 2235} {"train_loss": -24.169973373413086, "global_step": 185543, "epoch": 2235} {"train_loss": -23.76116180419922, "global_step": 185544, "epoch": 2235} {"train_loss": -24.272647857666016, "global_step": 185545, "epoch": 2235} {"train_loss": -23.929519653320312, "global_step": 185546, "epoch": 2235} {"train_loss": -24.154144287109375, "global_step": 185547, "epoch": 2235} {"train_loss": -23.915470123291016, "global_step": 185548, "epoch": 2235} {"train_loss": -24.165334701538086, "global_step": 185549, "epoch": 2235} {"train_loss": -23.811086654663086, "global_step": 185550, "epoch": 2235} {"train_loss": -23.96741485595703, "global_step": 185551, "epoch": 2235} {"train_loss": -23.9150333404541, "global_step": 185552, "epoch": 2235} {"train_loss": -24.295751571655273, "global_step": 185553, "epoch": 2235} {"train_loss": -24.58285903930664, "global_step": 185554, "epoch": 2235} {"train_loss": -23.854557037353516, "global_step": 185555, "epoch": 2235} {"train_loss": -24.454082489013672, "global_step": 185556, "epoch": 2235} {"train_loss": -23.908496856689453, "global_step": 185557, "epoch": 2235} {"train_loss": -24.23358726501465, "global_step": 185558, "epoch": 2235} {"train_loss": -23.972164154052734, "global_step": 185559, "epoch": 2235} {"train_loss": -24.10309410095215, "global_step": 185560, "epoch": 2235} {"train_loss": -24.308393478393555, "global_step": 185561, "epoch": 2235} {"train_loss": -24.004714965820312, "global_step": 185562, "epoch": 2235} {"train_loss": -23.986404418945312, "global_step": 185563, "epoch": 2235} {"train_loss": -24.01923179626465, "global_step": 185564, "epoch": 2235} {"train_loss": -23.959136962890625, "global_step": 185565, "epoch": 2235} {"train_loss": -24.343130111694336, "global_step": 185566, "epoch": 2235} {"train_loss": -23.996553421020508, "global_step": 185567, "epoch": 2235} {"train_loss": -23.94533348083496, "global_step": 185568, "epoch": 2235} {"train_loss": -24.1634464263916, "global_step": 185569, "epoch": 2235} {"train_loss": -23.669713973999023, "global_step": 185570, "epoch": 2235} {"train_loss": -23.860809326171875, "global_step": 185571, "epoch": 2235} {"train_loss": -24.16454315185547, "global_step": 185572, "epoch": 2235} {"train_loss": -23.968223571777344, "global_step": 185573, "epoch": 2235} {"train_loss": -23.457290649414062, "global_step": 185574, "epoch": 2235} {"train_loss": -23.721216201782227, "global_step": 185575, "epoch": 2235} {"train_loss": -23.523523330688477, "global_step": 185576, "epoch": 2235} {"train_loss": -23.43918228149414, "global_step": 185577, "epoch": 2235} {"train_loss": -23.582691192626953, "global_step": 185578, "epoch": 2235} {"train_loss": -24.046945571899414, "global_step": 185579, "epoch": 2235} {"train_loss": -23.468067169189453, "global_step": 185580, "epoch": 2235} {"train_loss": -23.605173110961914, "global_step": 185581, "epoch": 2235} {"train_loss": -23.671165466308594, "global_step": 185582, "epoch": 2235} {"train_loss": -24.038288116455078, "global_step": 185583, "epoch": 2235} {"train_loss": -23.638811111450195, "global_step": 185584, "epoch": 2235} {"train_loss": -23.848615646362305, "global_step": 185585, "epoch": 2235} {"train_loss": -23.912107467651367, "global_step": 185586, "epoch": 2235} {"train_loss": -23.872497650514166, "global_step": 185587, "epoch": 2235, "val_loss": 6510336.5} {"train_loss": -23.1859188079834, "global_step": 185588, "epoch": 2236} {"train_loss": -23.80295181274414, "global_step": 185589, "epoch": 2236} {"train_loss": -23.038904190063477, "global_step": 185590, "epoch": 2236} {"train_loss": -23.52656364440918, "global_step": 185591, "epoch": 2236} {"train_loss": -23.66666603088379, "global_step": 185592, "epoch": 2236} {"train_loss": -23.1532039642334, "global_step": 185593, "epoch": 2236} {"train_loss": -24.018461227416992, "global_step": 185594, "epoch": 2236} {"train_loss": -24.086278915405273, "global_step": 185595, "epoch": 2236} {"train_loss": -23.663360595703125, "global_step": 185596, "epoch": 2236} {"train_loss": -23.49983024597168, "global_step": 185597, "epoch": 2236} {"train_loss": -23.578510284423828, "global_step": 185598, "epoch": 2236} {"train_loss": -23.614892959594727, "global_step": 185599, "epoch": 2236} {"train_loss": -24.003767013549805, "global_step": 185600, "epoch": 2236} {"train_loss": -24.10603141784668, "global_step": 185601, "epoch": 2236} {"train_loss": -23.986032485961914, "global_step": 185602, "epoch": 2236} {"train_loss": -24.012842178344727, "global_step": 185603, "epoch": 2236} {"train_loss": -23.673635482788086, "global_step": 185604, "epoch": 2236} {"train_loss": -23.805387496948242, "global_step": 185605, "epoch": 2236} {"train_loss": -23.91047477722168, "global_step": 185606, "epoch": 2236} {"train_loss": -23.575912475585938, "global_step": 185607, "epoch": 2236} {"train_loss": -23.71539878845215, "global_step": 185608, "epoch": 2236} {"train_loss": -23.62163734436035, "global_step": 185609, "epoch": 2236} {"train_loss": -23.6790714263916, "global_step": 185610, "epoch": 2236} {"train_loss": -24.073495864868164, "global_step": 185611, "epoch": 2236} {"train_loss": -23.934057235717773, "global_step": 185612, "epoch": 2236} {"train_loss": -23.952268600463867, "global_step": 185613, "epoch": 2236} {"train_loss": -23.892751693725586, "global_step": 185614, "epoch": 2236} {"train_loss": -24.074478149414062, "global_step": 185615, "epoch": 2236} {"train_loss": -23.982908248901367, "global_step": 185616, "epoch": 2236} {"train_loss": -24.10464096069336, "global_step": 185617, "epoch": 2236} {"train_loss": -23.940927505493164, "global_step": 185618, "epoch": 2236} {"train_loss": -24.224340438842773, "global_step": 185619, "epoch": 2236} {"train_loss": -24.044170379638672, "global_step": 185620, "epoch": 2236} {"train_loss": -24.01136589050293, "global_step": 185621, "epoch": 2236} {"train_loss": -24.00239372253418, "global_step": 185622, "epoch": 2236} {"train_loss": -24.261707305908203, "global_step": 185623, "epoch": 2236} {"train_loss": -24.33147621154785, "global_step": 185624, "epoch": 2236} {"train_loss": -23.567794799804688, "global_step": 185625, "epoch": 2236} {"train_loss": -24.03404426574707, "global_step": 185626, "epoch": 2236} {"train_loss": -23.953245162963867, "global_step": 185627, "epoch": 2236} {"train_loss": -23.752126693725586, "global_step": 185628, "epoch": 2236} {"train_loss": -24.112417221069336, "global_step": 185629, "epoch": 2236} {"train_loss": -24.01698875427246, "global_step": 185630, "epoch": 2236} {"train_loss": -23.888925552368164, "global_step": 185631, "epoch": 2236} {"train_loss": -24.124143600463867, "global_step": 185632, "epoch": 2236} {"train_loss": -23.983976364135742, "global_step": 185633, "epoch": 2236} {"train_loss": -24.1859130859375, "global_step": 185634, "epoch": 2236} {"train_loss": -23.681896209716797, "global_step": 185635, "epoch": 2236} {"train_loss": -23.998872756958008, "global_step": 185636, "epoch": 2236} {"train_loss": -23.644920349121094, "global_step": 185637, "epoch": 2236} {"train_loss": -23.937297821044922, "global_step": 185638, "epoch": 2236} {"train_loss": -23.956342697143555, "global_step": 185639, "epoch": 2236} {"train_loss": -23.878461837768555, "global_step": 185640, "epoch": 2236} {"train_loss": -23.825040817260742, "global_step": 185641, "epoch": 2236} {"train_loss": -23.632429122924805, "global_step": 185642, "epoch": 2236} {"train_loss": -24.03478240966797, "global_step": 185643, "epoch": 2236} {"train_loss": -24.01807975769043, "global_step": 185644, "epoch": 2236} {"train_loss": -23.724538803100586, "global_step": 185645, "epoch": 2236} {"train_loss": -24.150129318237305, "global_step": 185646, "epoch": 2236} {"train_loss": -23.772520065307617, "global_step": 185647, "epoch": 2236} {"train_loss": -23.96294593811035, "global_step": 185648, "epoch": 2236} {"train_loss": -23.72820472717285, "global_step": 185649, "epoch": 2236} {"train_loss": -24.30328941345215, "global_step": 185650, "epoch": 2236} {"train_loss": -23.89613151550293, "global_step": 185651, "epoch": 2236} {"train_loss": -23.923303604125977, "global_step": 185652, "epoch": 2236} {"train_loss": -23.57107925415039, "global_step": 185653, "epoch": 2236} {"train_loss": -23.994049072265625, "global_step": 185654, "epoch": 2236} {"train_loss": -24.087377548217773, "global_step": 185655, "epoch": 2236} {"train_loss": -23.787660598754883, "global_step": 185656, "epoch": 2236} {"train_loss": -23.707265853881836, "global_step": 185657, "epoch": 2236} {"train_loss": -23.685047149658203, "global_step": 185658, "epoch": 2236} {"train_loss": -24.47196388244629, "global_step": 185659, "epoch": 2236} {"train_loss": -23.640562057495117, "global_step": 185660, "epoch": 2236} {"train_loss": -23.944684982299805, "global_step": 185661, "epoch": 2236} {"train_loss": -23.857995986938477, "global_step": 185662, "epoch": 2236} {"train_loss": -24.310945510864258, "global_step": 185663, "epoch": 2236} {"train_loss": -24.32025718688965, "global_step": 185664, "epoch": 2236} {"train_loss": -24.224563598632812, "global_step": 185665, "epoch": 2236} {"train_loss": -24.05922508239746, "global_step": 185666, "epoch": 2236} {"train_loss": -23.928756713867188, "global_step": 185667, "epoch": 2236} {"train_loss": -24.319339752197266, "global_step": 185668, "epoch": 2236} {"train_loss": -24.149555206298828, "global_step": 185669, "epoch": 2236} {"train_loss": -23.89085222726845, "global_step": 185670, "epoch": 2236, "val_loss": 6632516.0} {"train_loss": -23.813323974609375, "global_step": 185671, "epoch": 2237} {"train_loss": -23.40142250061035, "global_step": 185672, "epoch": 2237} {"train_loss": -23.91043472290039, "global_step": 185673, "epoch": 2237} {"train_loss": -23.307939529418945, "global_step": 185674, "epoch": 2237} {"train_loss": -23.33741569519043, "global_step": 185675, "epoch": 2237} {"train_loss": -24.33123207092285, "global_step": 185676, "epoch": 2237} {"train_loss": -23.73445701599121, "global_step": 185677, "epoch": 2237} {"train_loss": -23.948986053466797, "global_step": 185678, "epoch": 2237} {"train_loss": -23.575159072875977, "global_step": 185679, "epoch": 2237} {"train_loss": -23.708253860473633, "global_step": 185680, "epoch": 2237} {"train_loss": -23.781888961791992, "global_step": 185681, "epoch": 2237} {"train_loss": -23.810821533203125, "global_step": 185682, "epoch": 2237} {"train_loss": -23.730854034423828, "global_step": 185683, "epoch": 2237} {"train_loss": -23.90529441833496, "global_step": 185684, "epoch": 2237} {"train_loss": -23.799619674682617, "global_step": 185685, "epoch": 2237} {"train_loss": -24.16707420349121, "global_step": 185686, "epoch": 2237} {"train_loss": -23.694480895996094, "global_step": 185687, "epoch": 2237} {"train_loss": -23.84309959411621, "global_step": 185688, "epoch": 2237} {"train_loss": -23.99239158630371, "global_step": 185689, "epoch": 2237} {"train_loss": -23.944761276245117, "global_step": 185690, "epoch": 2237} {"train_loss": -24.028066635131836, "global_step": 185691, "epoch": 2237} {"train_loss": -24.13245391845703, "global_step": 185692, "epoch": 2237} {"train_loss": -23.745075225830078, "global_step": 185693, "epoch": 2237} {"train_loss": -23.871471405029297, "global_step": 185694, "epoch": 2237} {"train_loss": -24.18037986755371, "global_step": 185695, "epoch": 2237} {"train_loss": -23.79593276977539, "global_step": 185696, "epoch": 2237} {"train_loss": -23.825361251831055, "global_step": 185697, "epoch": 2237} {"train_loss": -23.91487693786621, "global_step": 185698, "epoch": 2237} {"train_loss": -24.3157958984375, "global_step": 185699, "epoch": 2237} {"train_loss": -23.931415557861328, "global_step": 185700, "epoch": 2237} {"train_loss": -24.16312026977539, "global_step": 185701, "epoch": 2237} {"train_loss": -24.059621810913086, "global_step": 185702, "epoch": 2237} {"train_loss": -24.104717254638672, "global_step": 185703, "epoch": 2237} {"train_loss": -24.2587890625, "global_step": 185704, "epoch": 2237} {"train_loss": -24.02351188659668, "global_step": 185705, "epoch": 2237} {"train_loss": -23.804107666015625, "global_step": 185706, "epoch": 2237} {"train_loss": -24.5130615234375, "global_step": 185707, "epoch": 2237} {"train_loss": -24.031442642211914, "global_step": 185708, "epoch": 2237} {"train_loss": -23.974136352539062, "global_step": 185709, "epoch": 2237} {"train_loss": -24.243703842163086, "global_step": 185710, "epoch": 2237} {"train_loss": -23.98085594177246, "global_step": 185711, "epoch": 2237} {"train_loss": -24.13374900817871, "global_step": 185712, "epoch": 2237} {"train_loss": -23.99361228942871, "global_step": 185713, "epoch": 2237} {"train_loss": -24.191131591796875, "global_step": 185714, "epoch": 2237} {"train_loss": -24.306333541870117, "global_step": 185715, "epoch": 2237} {"train_loss": -24.072927474975586, "global_step": 185716, "epoch": 2237} {"train_loss": -24.079376220703125, "global_step": 185717, "epoch": 2237} {"train_loss": -24.048744201660156, "global_step": 185718, "epoch": 2237} {"train_loss": -23.842655181884766, "global_step": 185719, "epoch": 2237} {"train_loss": -24.345212936401367, "global_step": 185720, "epoch": 2237} {"train_loss": -24.264371871948242, "global_step": 185721, "epoch": 2237} {"train_loss": -24.336456298828125, "global_step": 185722, "epoch": 2237} {"train_loss": -23.716527938842773, "global_step": 185723, "epoch": 2237} {"train_loss": -23.818592071533203, "global_step": 185724, "epoch": 2237} {"train_loss": -23.620014190673828, "global_step": 185725, "epoch": 2237} {"train_loss": -23.79075813293457, "global_step": 185726, "epoch": 2237} {"train_loss": -23.900680541992188, "global_step": 185727, "epoch": 2237} {"train_loss": -24.384916305541992, "global_step": 185728, "epoch": 2237} {"train_loss": -24.01979637145996, "global_step": 185729, "epoch": 2237} {"train_loss": -24.090723037719727, "global_step": 185730, "epoch": 2237} {"train_loss": -23.823537826538086, "global_step": 185731, "epoch": 2237} {"train_loss": -24.163442611694336, "global_step": 185732, "epoch": 2237} {"train_loss": -24.02520179748535, "global_step": 185733, "epoch": 2237} {"train_loss": -24.394540786743164, "global_step": 185734, "epoch": 2237} {"train_loss": -23.91200828552246, "global_step": 185735, "epoch": 2237} {"train_loss": -23.94237518310547, "global_step": 185736, "epoch": 2237} {"train_loss": -24.1778564453125, "global_step": 185737, "epoch": 2237} {"train_loss": -24.128934860229492, "global_step": 185738, "epoch": 2237} {"train_loss": -23.846820831298828, "global_step": 185739, "epoch": 2237} {"train_loss": -24.38442611694336, "global_step": 185740, "epoch": 2237} {"train_loss": -24.077733993530273, "global_step": 185741, "epoch": 2237} {"train_loss": -24.387115478515625, "global_step": 185742, "epoch": 2237} {"train_loss": -24.15397071838379, "global_step": 185743, "epoch": 2237} {"train_loss": -23.82855796813965, "global_step": 185744, "epoch": 2237} {"train_loss": -24.049104690551758, "global_step": 185745, "epoch": 2237} {"train_loss": -23.921894073486328, "global_step": 185746, "epoch": 2237} {"train_loss": -24.124897003173828, "global_step": 185747, "epoch": 2237} {"train_loss": -24.091354370117188, "global_step": 185748, "epoch": 2237} {"train_loss": -24.031007766723633, "global_step": 185749, "epoch": 2237} {"train_loss": -24.0330810546875, "global_step": 185750, "epoch": 2237} {"train_loss": -23.887907028198242, "global_step": 185751, "epoch": 2237} {"train_loss": -24.115049362182617, "global_step": 185752, "epoch": 2237} {"train_loss": -23.99642447965691, "global_step": 185753, "epoch": 2237, "val_loss": 6536397.0} {"train_loss": -24.014135360717773, "global_step": 185754, "epoch": 2238} {"train_loss": -23.064144134521484, "global_step": 185755, "epoch": 2238} {"train_loss": -22.29775047302246, "global_step": 185756, "epoch": 2238} {"train_loss": -22.214021682739258, "global_step": 185757, "epoch": 2238} {"train_loss": -23.933197021484375, "global_step": 185758, "epoch": 2238} {"train_loss": -22.11545181274414, "global_step": 185759, "epoch": 2238} {"train_loss": -22.447843551635742, "global_step": 185760, "epoch": 2238} {"train_loss": -23.44635009765625, "global_step": 185761, "epoch": 2238} {"train_loss": -22.965585708618164, "global_step": 185762, "epoch": 2238} {"train_loss": -23.578571319580078, "global_step": 185763, "epoch": 2238} {"train_loss": -23.700130462646484, "global_step": 185764, "epoch": 2238} {"train_loss": -23.554983139038086, "global_step": 185765, "epoch": 2238} {"train_loss": -23.451005935668945, "global_step": 185766, "epoch": 2238} {"train_loss": -23.69367790222168, "global_step": 185767, "epoch": 2238} {"train_loss": -23.044851303100586, "global_step": 185768, "epoch": 2238} {"train_loss": -23.50482749938965, "global_step": 185769, "epoch": 2238} {"train_loss": -23.76780128479004, "global_step": 185770, "epoch": 2238} {"train_loss": -23.743804931640625, "global_step": 185771, "epoch": 2238} {"train_loss": -24.096384048461914, "global_step": 185772, "epoch": 2238} {"train_loss": -23.518383026123047, "global_step": 185773, "epoch": 2238} {"train_loss": -23.258508682250977, "global_step": 185774, "epoch": 2238} {"train_loss": -23.71611976623535, "global_step": 185775, "epoch": 2238} {"train_loss": -23.58034324645996, "global_step": 185776, "epoch": 2238} {"train_loss": -23.812681198120117, "global_step": 185777, "epoch": 2238} {"train_loss": -23.6929988861084, "global_step": 185778, "epoch": 2238} {"train_loss": -23.52337074279785, "global_step": 185779, "epoch": 2238} {"train_loss": -23.920352935791016, "global_step": 185780, "epoch": 2238} {"train_loss": -23.741573333740234, "global_step": 185781, "epoch": 2238} {"train_loss": -23.913488388061523, "global_step": 185782, "epoch": 2238} {"train_loss": -24.104379653930664, "global_step": 185783, "epoch": 2238} {"train_loss": -23.739686965942383, "global_step": 185784, "epoch": 2238} {"train_loss": -23.73430824279785, "global_step": 185785, "epoch": 2238} {"train_loss": -23.87887954711914, "global_step": 185786, "epoch": 2238} {"train_loss": -23.987504959106445, "global_step": 185787, "epoch": 2238} {"train_loss": -23.850435256958008, "global_step": 185788, "epoch": 2238} {"train_loss": -24.129928588867188, "global_step": 185789, "epoch": 2238} {"train_loss": -23.853185653686523, "global_step": 185790, "epoch": 2238} {"train_loss": -24.27766990661621, "global_step": 185791, "epoch": 2238} {"train_loss": -23.436553955078125, "global_step": 185792, "epoch": 2238} {"train_loss": -24.09614372253418, "global_step": 185793, "epoch": 2238} {"train_loss": -24.175537109375, "global_step": 185794, "epoch": 2238} {"train_loss": -23.800230026245117, "global_step": 185795, "epoch": 2238} {"train_loss": -23.989057540893555, "global_step": 185796, "epoch": 2238} {"train_loss": -23.86554527282715, "global_step": 185797, "epoch": 2238} {"train_loss": -24.060039520263672, "global_step": 185798, "epoch": 2238} {"train_loss": -23.92325210571289, "global_step": 185799, "epoch": 2238} {"train_loss": -24.13437271118164, "global_step": 185800, "epoch": 2238} {"train_loss": -24.155363082885742, "global_step": 185801, "epoch": 2238} {"train_loss": -23.847864151000977, "global_step": 185802, "epoch": 2238} {"train_loss": -24.135211944580078, "global_step": 185803, "epoch": 2238} {"train_loss": -24.55537223815918, "global_step": 185804, "epoch": 2238} {"train_loss": -24.15956687927246, "global_step": 185805, "epoch": 2238} {"train_loss": -24.091089248657227, "global_step": 185806, "epoch": 2238} {"train_loss": -24.21730613708496, "global_step": 185807, "epoch": 2238} {"train_loss": -24.14645004272461, "global_step": 185808, "epoch": 2238} {"train_loss": -23.93385887145996, "global_step": 185809, "epoch": 2238} {"train_loss": -23.887805938720703, "global_step": 185810, "epoch": 2238} {"train_loss": -24.033447265625, "global_step": 185811, "epoch": 2238} {"train_loss": -24.04709815979004, "global_step": 185812, "epoch": 2238} {"train_loss": -24.20839500427246, "global_step": 185813, "epoch": 2238} {"train_loss": -24.1242618560791, "global_step": 185814, "epoch": 2238} {"train_loss": -23.998336791992188, "global_step": 185815, "epoch": 2238} {"train_loss": -23.9273624420166, "global_step": 185816, "epoch": 2238} {"train_loss": -24.167469024658203, "global_step": 185817, "epoch": 2238} {"train_loss": -23.8342342376709, "global_step": 185818, "epoch": 2238} {"train_loss": -23.94062614440918, "global_step": 185819, "epoch": 2238} {"train_loss": -23.86385154724121, "global_step": 185820, "epoch": 2238} {"train_loss": -24.053329467773438, "global_step": 185821, "epoch": 2238} {"train_loss": -23.85917854309082, "global_step": 185822, "epoch": 2238} {"train_loss": -23.964752197265625, "global_step": 185823, "epoch": 2238} {"train_loss": -23.841405868530273, "global_step": 185824, "epoch": 2238} {"train_loss": -23.966794967651367, "global_step": 185825, "epoch": 2238} {"train_loss": -24.259084701538086, "global_step": 185826, "epoch": 2238} {"train_loss": -23.966279983520508, "global_step": 185827, "epoch": 2238} {"train_loss": -23.71409034729004, "global_step": 185828, "epoch": 2238} {"train_loss": -24.16991424560547, "global_step": 185829, "epoch": 2238} {"train_loss": -24.016056060791016, "global_step": 185830, "epoch": 2238} {"train_loss": -24.08111572265625, "global_step": 185831, "epoch": 2238} {"train_loss": -23.928319931030273, "global_step": 185832, "epoch": 2238} {"train_loss": -24.43497085571289, "global_step": 185833, "epoch": 2238} {"train_loss": -23.975542068481445, "global_step": 185834, "epoch": 2238} {"train_loss": -23.779722213745117, "global_step": 185835, "epoch": 2238} {"train_loss": -23.813246439738446, "global_step": 185836, "epoch": 2238, "val_loss": 6386028.0} {"train_loss": -23.663488388061523, "global_step": 185837, "epoch": 2239} {"train_loss": -23.620967864990234, "global_step": 185838, "epoch": 2239} {"train_loss": -23.95290184020996, "global_step": 185839, "epoch": 2239} {"train_loss": -23.05179214477539, "global_step": 185840, "epoch": 2239} {"train_loss": -23.066879272460938, "global_step": 185841, "epoch": 2239} {"train_loss": -22.939395904541016, "global_step": 185842, "epoch": 2239} {"train_loss": -23.898025512695312, "global_step": 185843, "epoch": 2239} {"train_loss": -23.14592933654785, "global_step": 185844, "epoch": 2239} {"train_loss": -23.31601905822754, "global_step": 185845, "epoch": 2239} {"train_loss": -23.643787384033203, "global_step": 185846, "epoch": 2239} {"train_loss": -23.38927459716797, "global_step": 185847, "epoch": 2239} {"train_loss": -23.72711181640625, "global_step": 185848, "epoch": 2239} {"train_loss": -23.149763107299805, "global_step": 185849, "epoch": 2239} {"train_loss": -23.56900405883789, "global_step": 185850, "epoch": 2239} {"train_loss": -23.68408203125, "global_step": 185851, "epoch": 2239} {"train_loss": -23.37351417541504, "global_step": 185852, "epoch": 2239} {"train_loss": -23.894790649414062, "global_step": 185853, "epoch": 2239} {"train_loss": -23.762998580932617, "global_step": 185854, "epoch": 2239} {"train_loss": -23.78525733947754, "global_step": 185855, "epoch": 2239} {"train_loss": -24.070363998413086, "global_step": 185856, "epoch": 2239} {"train_loss": -23.704893112182617, "global_step": 185857, "epoch": 2239} {"train_loss": -23.65723991394043, "global_step": 185858, "epoch": 2239} {"train_loss": -23.7353515625, "global_step": 185859, "epoch": 2239} {"train_loss": -23.806421279907227, "global_step": 185860, "epoch": 2239} {"train_loss": -24.14595603942871, "global_step": 185861, "epoch": 2239} {"train_loss": -23.812423706054688, "global_step": 185862, "epoch": 2239} {"train_loss": -23.728626251220703, "global_step": 185863, "epoch": 2239} {"train_loss": -23.95139503479004, "global_step": 185864, "epoch": 2239} {"train_loss": -23.835805892944336, "global_step": 185865, "epoch": 2239} {"train_loss": -23.49598503112793, "global_step": 185866, "epoch": 2239} {"train_loss": -23.626094818115234, "global_step": 185867, "epoch": 2239} {"train_loss": -24.113027572631836, "global_step": 185868, "epoch": 2239} {"train_loss": -24.047565460205078, "global_step": 185869, "epoch": 2239} {"train_loss": -24.25221061706543, "global_step": 185870, "epoch": 2239} {"train_loss": -23.88655662536621, "global_step": 185871, "epoch": 2239} {"train_loss": -23.897397994995117, "global_step": 185872, "epoch": 2239} {"train_loss": -23.875892639160156, "global_step": 185873, "epoch": 2239} {"train_loss": -24.02398109436035, "global_step": 185874, "epoch": 2239} {"train_loss": -23.928112030029297, "global_step": 185875, "epoch": 2239} {"train_loss": -23.966825485229492, "global_step": 185876, "epoch": 2239} {"train_loss": -24.14723014831543, "global_step": 185877, "epoch": 2239} {"train_loss": -23.93183708190918, "global_step": 185878, "epoch": 2239} {"train_loss": -23.93337059020996, "global_step": 185879, "epoch": 2239} {"train_loss": -24.197036743164062, "global_step": 185880, "epoch": 2239} {"train_loss": -24.429861068725586, "global_step": 185881, "epoch": 2239} {"train_loss": -23.904682159423828, "global_step": 185882, "epoch": 2239} {"train_loss": -24.155609130859375, "global_step": 185883, "epoch": 2239} {"train_loss": -23.967069625854492, "global_step": 185884, "epoch": 2239} {"train_loss": -24.272497177124023, "global_step": 185885, "epoch": 2239} {"train_loss": -23.957378387451172, "global_step": 185886, "epoch": 2239} {"train_loss": -24.115493774414062, "global_step": 185887, "epoch": 2239} {"train_loss": -23.997838973999023, "global_step": 185888, "epoch": 2239} {"train_loss": -23.668352127075195, "global_step": 185889, "epoch": 2239} {"train_loss": -24.08473014831543, "global_step": 185890, "epoch": 2239} {"train_loss": -23.800275802612305, "global_step": 185891, "epoch": 2239} {"train_loss": -23.791961669921875, "global_step": 185892, "epoch": 2239} {"train_loss": -24.335784912109375, "global_step": 185893, "epoch": 2239} {"train_loss": -23.971534729003906, "global_step": 185894, "epoch": 2239} {"train_loss": -23.951684951782227, "global_step": 185895, "epoch": 2239} {"train_loss": -23.84781265258789, "global_step": 185896, "epoch": 2239} {"train_loss": -23.864151000976562, "global_step": 185897, "epoch": 2239} {"train_loss": -24.292478561401367, "global_step": 185898, "epoch": 2239} {"train_loss": -23.992618560791016, "global_step": 185899, "epoch": 2239} {"train_loss": -24.21196937561035, "global_step": 185900, "epoch": 2239} {"train_loss": -24.12262725830078, "global_step": 185901, "epoch": 2239} {"train_loss": -24.133481979370117, "global_step": 185902, "epoch": 2239} {"train_loss": -24.222415924072266, "global_step": 185903, "epoch": 2239} {"train_loss": -23.98062515258789, "global_step": 185904, "epoch": 2239} {"train_loss": -24.125755310058594, "global_step": 185905, "epoch": 2239} {"train_loss": -24.009387969970703, "global_step": 185906, "epoch": 2239} {"train_loss": -23.92537498474121, "global_step": 185907, "epoch": 2239} {"train_loss": -23.802230834960938, "global_step": 185908, "epoch": 2239} {"train_loss": -23.977218627929688, "global_step": 185909, "epoch": 2239} {"train_loss": -24.090024948120117, "global_step": 185910, "epoch": 2239} {"train_loss": -24.102384567260742, "global_step": 185911, "epoch": 2239} {"train_loss": -24.010726928710938, "global_step": 185912, "epoch": 2239} {"train_loss": -24.525724411010742, "global_step": 185913, "epoch": 2239} {"train_loss": -24.00360679626465, "global_step": 185914, "epoch": 2239} {"train_loss": -24.320724487304688, "global_step": 185915, "epoch": 2239} {"train_loss": -24.212800979614258, "global_step": 185916, "epoch": 2239} {"train_loss": -23.69709587097168, "global_step": 185917, "epoch": 2239} {"train_loss": -23.84881019592285, "global_step": 185918, "epoch": 2239} {"train_loss": -23.864341000476514, "global_step": 185919, "epoch": 2239, "val_loss": 6622199.5} {"train_loss": -23.357681274414062, "global_step": 185920, "epoch": 2240} {"train_loss": -23.958139419555664, "global_step": 185921, "epoch": 2240} {"train_loss": -23.329334259033203, "global_step": 185922, "epoch": 2240} {"train_loss": -23.763086318969727, "global_step": 185923, "epoch": 2240} {"train_loss": -24.04312515258789, "global_step": 185924, "epoch": 2240} {"train_loss": -24.102256774902344, "global_step": 185925, "epoch": 2240} {"train_loss": -23.398483276367188, "global_step": 185926, "epoch": 2240} {"train_loss": -23.4615421295166, "global_step": 185927, "epoch": 2240} {"train_loss": -23.913841247558594, "global_step": 185928, "epoch": 2240} {"train_loss": -23.642423629760742, "global_step": 185929, "epoch": 2240} {"train_loss": -23.175312042236328, "global_step": 185930, "epoch": 2240} {"train_loss": -23.57904624938965, "global_step": 185931, "epoch": 2240} {"train_loss": -23.8607234954834, "global_step": 185932, "epoch": 2240} {"train_loss": -23.729867935180664, "global_step": 185933, "epoch": 2240} {"train_loss": -23.55183982849121, "global_step": 185934, "epoch": 2240} {"train_loss": -23.7083740234375, "global_step": 185935, "epoch": 2240} {"train_loss": -23.864337921142578, "global_step": 185936, "epoch": 2240} {"train_loss": -23.827970504760742, "global_step": 185937, "epoch": 2240} {"train_loss": -23.620824813842773, "global_step": 185938, "epoch": 2240} {"train_loss": -24.29521942138672, "global_step": 185939, "epoch": 2240} {"train_loss": -23.572050094604492, "global_step": 185940, "epoch": 2240} {"train_loss": -24.118810653686523, "global_step": 185941, "epoch": 2240} {"train_loss": -23.87372398376465, "global_step": 185942, "epoch": 2240} {"train_loss": -23.911405563354492, "global_step": 185943, "epoch": 2240} {"train_loss": -23.883403778076172, "global_step": 185944, "epoch": 2240} {"train_loss": -23.908554077148438, "global_step": 185945, "epoch": 2240} {"train_loss": -23.78742790222168, "global_step": 185946, "epoch": 2240} {"train_loss": -23.8861083984375, "global_step": 185947, "epoch": 2240} {"train_loss": -23.7921199798584, "global_step": 185948, "epoch": 2240} {"train_loss": -24.37428092956543, "global_step": 185949, "epoch": 2240} {"train_loss": -23.81585121154785, "global_step": 185950, "epoch": 2240} {"train_loss": -23.81390953063965, "global_step": 185951, "epoch": 2240} {"train_loss": -23.856000900268555, "global_step": 185952, "epoch": 2240} {"train_loss": -23.909255981445312, "global_step": 185953, "epoch": 2240} {"train_loss": -23.79140281677246, "global_step": 185954, "epoch": 2240} {"train_loss": -24.095884323120117, "global_step": 185955, "epoch": 2240} {"train_loss": -24.223678588867188, "global_step": 185956, "epoch": 2240} {"train_loss": -24.11811637878418, "global_step": 185957, "epoch": 2240} {"train_loss": -23.91071319580078, "global_step": 185958, "epoch": 2240} {"train_loss": -23.9312686920166, "global_step": 185959, "epoch": 2240} {"train_loss": -24.0012149810791, "global_step": 185960, "epoch": 2240} {"train_loss": -23.886194229125977, "global_step": 185961, "epoch": 2240} {"train_loss": -24.156911849975586, "global_step": 185962, "epoch": 2240} {"train_loss": -23.48883628845215, "global_step": 185963, "epoch": 2240} {"train_loss": -24.20499038696289, "global_step": 185964, "epoch": 2240} {"train_loss": -24.028125762939453, "global_step": 185965, "epoch": 2240} {"train_loss": -23.90275764465332, "global_step": 185966, "epoch": 2240} {"train_loss": -23.998075485229492, "global_step": 185967, "epoch": 2240} {"train_loss": -23.87636375427246, "global_step": 185968, "epoch": 2240} {"train_loss": -23.772502899169922, "global_step": 185969, "epoch": 2240} {"train_loss": -24.05584716796875, "global_step": 185970, "epoch": 2240} {"train_loss": -23.887556076049805, "global_step": 185971, "epoch": 2240} {"train_loss": -24.02053451538086, "global_step": 185972, "epoch": 2240} {"train_loss": -23.704315185546875, "global_step": 185973, "epoch": 2240} {"train_loss": -24.07590103149414, "global_step": 185974, "epoch": 2240} {"train_loss": -23.861881256103516, "global_step": 185975, "epoch": 2240} {"train_loss": -23.568199157714844, "global_step": 185976, "epoch": 2240} {"train_loss": -23.749155044555664, "global_step": 185977, "epoch": 2240} {"train_loss": -23.96697998046875, "global_step": 185978, "epoch": 2240} {"train_loss": -23.81208610534668, "global_step": 185979, "epoch": 2240} {"train_loss": -23.83723258972168, "global_step": 185980, "epoch": 2240} {"train_loss": -24.228900909423828, "global_step": 185981, "epoch": 2240} {"train_loss": -23.945398330688477, "global_step": 185982, "epoch": 2240} {"train_loss": -23.699790954589844, "global_step": 185983, "epoch": 2240} {"train_loss": -23.8660888671875, "global_step": 185984, "epoch": 2240} {"train_loss": -23.992155075073242, "global_step": 185985, "epoch": 2240} {"train_loss": -24.136844635009766, "global_step": 185986, "epoch": 2240} {"train_loss": -24.11720085144043, "global_step": 185987, "epoch": 2240} {"train_loss": -23.974592208862305, "global_step": 185988, "epoch": 2240} {"train_loss": -23.780046463012695, "global_step": 185989, "epoch": 2240} {"train_loss": -23.83507537841797, "global_step": 185990, "epoch": 2240} {"train_loss": -23.659404754638672, "global_step": 185991, "epoch": 2240} {"train_loss": -24.23268699645996, "global_step": 185992, "epoch": 2240} {"train_loss": -23.91386604309082, "global_step": 185993, "epoch": 2240} {"train_loss": -24.134170532226562, "global_step": 185994, "epoch": 2240} {"train_loss": -23.923166275024414, "global_step": 185995, "epoch": 2240} {"train_loss": -24.19489097595215, "global_step": 185996, "epoch": 2240} {"train_loss": -24.151168823242188, "global_step": 185997, "epoch": 2240} {"train_loss": -24.244272232055664, "global_step": 185998, "epoch": 2240} {"train_loss": -23.684751510620117, "global_step": 185999, "epoch": 2240} {"train_loss": -24.119461059570312, "global_step": 186000, "epoch": 2240} {"train_loss": -24.101154327392578, "global_step": 186001, "epoch": 2240} {"train_loss": -23.904505051762225, "global_step": 186002, "epoch": 2240, "val_loss": 6451832.0} {"train_loss": -23.230321884155273, "global_step": 186003, "epoch": 2241} {"train_loss": -24.00725746154785, "global_step": 186004, "epoch": 2241} {"train_loss": -23.740432739257812, "global_step": 186005, "epoch": 2241} {"train_loss": -23.469120025634766, "global_step": 186006, "epoch": 2241} {"train_loss": -23.711393356323242, "global_step": 186007, "epoch": 2241} {"train_loss": -23.83770751953125, "global_step": 186008, "epoch": 2241} {"train_loss": -23.695798873901367, "global_step": 186009, "epoch": 2241} {"train_loss": -23.481809616088867, "global_step": 186010, "epoch": 2241} {"train_loss": -23.916534423828125, "global_step": 186011, "epoch": 2241} {"train_loss": -23.673301696777344, "global_step": 186012, "epoch": 2241} {"train_loss": -23.9920654296875, "global_step": 186013, "epoch": 2241} {"train_loss": -23.87615966796875, "global_step": 186014, "epoch": 2241} {"train_loss": -23.971433639526367, "global_step": 186015, "epoch": 2241} {"train_loss": -23.80610466003418, "global_step": 186016, "epoch": 2241} {"train_loss": -23.753253936767578, "global_step": 186017, "epoch": 2241} {"train_loss": -24.108051300048828, "global_step": 186018, "epoch": 2241} {"train_loss": -23.627653121948242, "global_step": 186019, "epoch": 2241} {"train_loss": -23.941137313842773, "global_step": 186020, "epoch": 2241} {"train_loss": -23.47217559814453, "global_step": 186021, "epoch": 2241} {"train_loss": -23.908517837524414, "global_step": 186022, "epoch": 2241} {"train_loss": -23.92323875427246, "global_step": 186023, "epoch": 2241} {"train_loss": -23.957748413085938, "global_step": 186024, "epoch": 2241} {"train_loss": -24.032278060913086, "global_step": 186025, "epoch": 2241} {"train_loss": -24.050382614135742, "global_step": 186026, "epoch": 2241} {"train_loss": -23.668701171875, "global_step": 186027, "epoch": 2241} {"train_loss": -23.555997848510742, "global_step": 186028, "epoch": 2241} {"train_loss": -23.938135147094727, "global_step": 186029, "epoch": 2241} {"train_loss": -23.985748291015625, "global_step": 186030, "epoch": 2241} {"train_loss": -24.10028648376465, "global_step": 186031, "epoch": 2241} {"train_loss": -23.895036697387695, "global_step": 186032, "epoch": 2241} {"train_loss": -23.545642852783203, "global_step": 186033, "epoch": 2241} {"train_loss": -23.78277015686035, "global_step": 186034, "epoch": 2241} {"train_loss": -23.991870880126953, "global_step": 186035, "epoch": 2241} {"train_loss": -24.048574447631836, "global_step": 186036, "epoch": 2241} {"train_loss": -23.691333770751953, "global_step": 186037, "epoch": 2241} {"train_loss": -24.159727096557617, "global_step": 186038, "epoch": 2241} {"train_loss": -24.467187881469727, "global_step": 186039, "epoch": 2241} {"train_loss": -23.93954849243164, "global_step": 186040, "epoch": 2241} {"train_loss": -24.10099220275879, "global_step": 186041, "epoch": 2241} {"train_loss": -24.136423110961914, "global_step": 186042, "epoch": 2241} {"train_loss": -23.849214553833008, "global_step": 186043, "epoch": 2241} {"train_loss": -24.071746826171875, "global_step": 186044, "epoch": 2241} {"train_loss": -24.0585994720459, "global_step": 186045, "epoch": 2241} {"train_loss": -24.277145385742188, "global_step": 186046, "epoch": 2241} {"train_loss": -24.261682510375977, "global_step": 186047, "epoch": 2241} {"train_loss": -24.19685935974121, "global_step": 186048, "epoch": 2241} {"train_loss": -24.166202545166016, "global_step": 186049, "epoch": 2241} {"train_loss": -24.25571632385254, "global_step": 186050, "epoch": 2241} {"train_loss": -24.263418197631836, "global_step": 186051, "epoch": 2241} {"train_loss": -24.113643646240234, "global_step": 186052, "epoch": 2241} {"train_loss": -24.17652702331543, "global_step": 186053, "epoch": 2241} {"train_loss": -24.148193359375, "global_step": 186054, "epoch": 2241} {"train_loss": -24.01531219482422, "global_step": 186055, "epoch": 2241} {"train_loss": -24.026504516601562, "global_step": 186056, "epoch": 2241} {"train_loss": -24.511577606201172, "global_step": 186057, "epoch": 2241} {"train_loss": -23.98318862915039, "global_step": 186058, "epoch": 2241} {"train_loss": -23.398977279663086, "global_step": 186059, "epoch": 2241} {"train_loss": -23.676618576049805, "global_step": 186060, "epoch": 2241} {"train_loss": -23.820743560791016, "global_step": 186061, "epoch": 2241} {"train_loss": -24.368078231811523, "global_step": 186062, "epoch": 2241} {"train_loss": -24.172826766967773, "global_step": 186063, "epoch": 2241} {"train_loss": -24.051801681518555, "global_step": 186064, "epoch": 2241} {"train_loss": -24.24290657043457, "global_step": 186065, "epoch": 2241} {"train_loss": -23.910022735595703, "global_step": 186066, "epoch": 2241} {"train_loss": -23.965822219848633, "global_step": 186067, "epoch": 2241} {"train_loss": -23.662607192993164, "global_step": 186068, "epoch": 2241} {"train_loss": -23.948169708251953, "global_step": 186069, "epoch": 2241} {"train_loss": -23.833511352539062, "global_step": 186070, "epoch": 2241} {"train_loss": -23.877721786499023, "global_step": 186071, "epoch": 2241} {"train_loss": -24.061277389526367, "global_step": 186072, "epoch": 2241} {"train_loss": -24.187414169311523, "global_step": 186073, "epoch": 2241} {"train_loss": -23.975772857666016, "global_step": 186074, "epoch": 2241} {"train_loss": -23.74722671508789, "global_step": 186075, "epoch": 2241} {"train_loss": -24.169775009155273, "global_step": 186076, "epoch": 2241} {"train_loss": -23.83681297302246, "global_step": 186077, "epoch": 2241} {"train_loss": -24.1102352142334, "global_step": 186078, "epoch": 2241} {"train_loss": -23.964160919189453, "global_step": 186079, "epoch": 2241} {"train_loss": -24.100736618041992, "global_step": 186080, "epoch": 2241} {"train_loss": -24.012466430664062, "global_step": 186081, "epoch": 2241} {"train_loss": -23.99010467529297, "global_step": 186082, "epoch": 2241} {"train_loss": -23.969270706176758, "global_step": 186083, "epoch": 2241} {"train_loss": -24.300678253173828, "global_step": 186084, "epoch": 2241} {"train_loss": -23.95470290586173, "global_step": 186085, "epoch": 2241, "val_loss": 6495131.0} {"train_loss": -23.345430374145508, "global_step": 186086, "epoch": 2242} {"train_loss": -24.030590057373047, "global_step": 186087, "epoch": 2242} {"train_loss": -23.85602569580078, "global_step": 186088, "epoch": 2242} {"train_loss": -23.12434196472168, "global_step": 186089, "epoch": 2242} {"train_loss": -23.519750595092773, "global_step": 186090, "epoch": 2242} {"train_loss": -23.66899299621582, "global_step": 186091, "epoch": 2242} {"train_loss": -23.57428741455078, "global_step": 186092, "epoch": 2242} {"train_loss": -23.86313819885254, "global_step": 186093, "epoch": 2242} {"train_loss": -23.53364372253418, "global_step": 186094, "epoch": 2242} {"train_loss": -23.744794845581055, "global_step": 186095, "epoch": 2242} {"train_loss": -23.945697784423828, "global_step": 186096, "epoch": 2242} {"train_loss": -23.92011833190918, "global_step": 186097, "epoch": 2242} {"train_loss": -23.39455223083496, "global_step": 186098, "epoch": 2242} {"train_loss": -23.66011619567871, "global_step": 186099, "epoch": 2242} {"train_loss": -23.752450942993164, "global_step": 186100, "epoch": 2242} {"train_loss": -23.53336524963379, "global_step": 186101, "epoch": 2242} {"train_loss": -23.897563934326172, "global_step": 186102, "epoch": 2242} {"train_loss": -23.60689353942871, "global_step": 186103, "epoch": 2242} {"train_loss": -23.811750411987305, "global_step": 186104, "epoch": 2242} {"train_loss": -24.306730270385742, "global_step": 186105, "epoch": 2242} {"train_loss": -24.125091552734375, "global_step": 186106, "epoch": 2242} {"train_loss": -24.136859893798828, "global_step": 186107, "epoch": 2242} {"train_loss": -24.2028865814209, "global_step": 186108, "epoch": 2242} {"train_loss": -23.710407257080078, "global_step": 186109, "epoch": 2242} {"train_loss": -24.18866539001465, "global_step": 186110, "epoch": 2242} {"train_loss": -23.852102279663086, "global_step": 186111, "epoch": 2242} {"train_loss": -24.29290008544922, "global_step": 186112, "epoch": 2242} {"train_loss": -23.922422409057617, "global_step": 186113, "epoch": 2242} {"train_loss": -23.75958824157715, "global_step": 186114, "epoch": 2242} {"train_loss": -23.669849395751953, "global_step": 186115, "epoch": 2242} {"train_loss": -23.7486515045166, "global_step": 186116, "epoch": 2242} {"train_loss": -24.155925750732422, "global_step": 186117, "epoch": 2242} {"train_loss": -24.09159278869629, "global_step": 186118, "epoch": 2242} {"train_loss": -23.682453155517578, "global_step": 186119, "epoch": 2242} {"train_loss": -24.215564727783203, "global_step": 186120, "epoch": 2242} {"train_loss": -23.809167861938477, "global_step": 186121, "epoch": 2242} {"train_loss": -23.77948760986328, "global_step": 186122, "epoch": 2242} {"train_loss": -24.20975112915039, "global_step": 186123, "epoch": 2242} {"train_loss": -24.091867446899414, "global_step": 186124, "epoch": 2242} {"train_loss": -24.0295352935791, "global_step": 186125, "epoch": 2242} {"train_loss": -24.285524368286133, "global_step": 186126, "epoch": 2242} {"train_loss": -23.753814697265625, "global_step": 186127, "epoch": 2242} {"train_loss": -24.340486526489258, "global_step": 186128, "epoch": 2242} {"train_loss": -23.835012435913086, "global_step": 186129, "epoch": 2242} {"train_loss": -23.719724655151367, "global_step": 186130, "epoch": 2242} {"train_loss": -24.012115478515625, "global_step": 186131, "epoch": 2242} {"train_loss": -24.119956970214844, "global_step": 186132, "epoch": 2242} {"train_loss": -23.634885787963867, "global_step": 186133, "epoch": 2242} {"train_loss": -24.132932662963867, "global_step": 186134, "epoch": 2242} {"train_loss": -23.88422966003418, "global_step": 186135, "epoch": 2242} {"train_loss": -23.88471031188965, "global_step": 186136, "epoch": 2242} {"train_loss": -24.207998275756836, "global_step": 186137, "epoch": 2242} {"train_loss": -24.111663818359375, "global_step": 186138, "epoch": 2242} {"train_loss": -24.11747169494629, "global_step": 186139, "epoch": 2242} {"train_loss": -23.706748962402344, "global_step": 186140, "epoch": 2242} {"train_loss": -23.80068588256836, "global_step": 186141, "epoch": 2242} {"train_loss": -24.06569480895996, "global_step": 186142, "epoch": 2242} {"train_loss": -24.117216110229492, "global_step": 186143, "epoch": 2242} {"train_loss": -23.892744064331055, "global_step": 186144, "epoch": 2242} {"train_loss": -24.336458206176758, "global_step": 186145, "epoch": 2242} {"train_loss": -24.035968780517578, "global_step": 186146, "epoch": 2242} {"train_loss": -24.06593894958496, "global_step": 186147, "epoch": 2242} {"train_loss": -24.012529373168945, "global_step": 186148, "epoch": 2242} {"train_loss": -24.07460594177246, "global_step": 186149, "epoch": 2242} {"train_loss": -23.74307632446289, "global_step": 186150, "epoch": 2242} {"train_loss": -23.79911231994629, "global_step": 186151, "epoch": 2242} {"train_loss": -23.607765197753906, "global_step": 186152, "epoch": 2242} {"train_loss": -23.782995223999023, "global_step": 186153, "epoch": 2242} {"train_loss": -23.912485122680664, "global_step": 186154, "epoch": 2242} {"train_loss": -23.940204620361328, "global_step": 186155, "epoch": 2242} {"train_loss": -23.687782287597656, "global_step": 186156, "epoch": 2242} {"train_loss": -23.493986129760742, "global_step": 186157, "epoch": 2242} {"train_loss": -23.816436767578125, "global_step": 186158, "epoch": 2242} {"train_loss": -24.155996322631836, "global_step": 186159, "epoch": 2242} {"train_loss": -23.969554901123047, "global_step": 186160, "epoch": 2242} {"train_loss": -23.631183624267578, "global_step": 186161, "epoch": 2242} {"train_loss": -23.515485763549805, "global_step": 186162, "epoch": 2242} {"train_loss": -23.873916625976562, "global_step": 186163, "epoch": 2242} {"train_loss": -23.918874740600586, "global_step": 186164, "epoch": 2242} {"train_loss": -23.77110481262207, "global_step": 186165, "epoch": 2242} {"train_loss": -24.24599266052246, "global_step": 186166, "epoch": 2242} {"train_loss": -23.838293075561523, "global_step": 186167, "epoch": 2242} {"train_loss": -23.87995129320995, "global_step": 186168, "epoch": 2242, "val_loss": 6441851.0} {"train_loss": -24.038976669311523, "global_step": 186169, "epoch": 2243} {"train_loss": -23.7957820892334, "global_step": 186170, "epoch": 2243} {"train_loss": -24.11716079711914, "global_step": 186171, "epoch": 2243} {"train_loss": -24.02019500732422, "global_step": 186172, "epoch": 2243} {"train_loss": -23.388273239135742, "global_step": 186173, "epoch": 2243} {"train_loss": -23.950550079345703, "global_step": 186174, "epoch": 2243} {"train_loss": -23.743085861206055, "global_step": 186175, "epoch": 2243} {"train_loss": -23.799474716186523, "global_step": 186176, "epoch": 2243} {"train_loss": -23.727434158325195, "global_step": 186177, "epoch": 2243} {"train_loss": -23.802330017089844, "global_step": 186178, "epoch": 2243} {"train_loss": -24.078258514404297, "global_step": 186179, "epoch": 2243} {"train_loss": -23.965145111083984, "global_step": 186180, "epoch": 2243} {"train_loss": -23.880582809448242, "global_step": 186181, "epoch": 2243} {"train_loss": -24.09175682067871, "global_step": 186182, "epoch": 2243} {"train_loss": -23.954687118530273, "global_step": 186183, "epoch": 2243} {"train_loss": -24.01413345336914, "global_step": 186184, "epoch": 2243} {"train_loss": -24.09638023376465, "global_step": 186185, "epoch": 2243} {"train_loss": -24.12870216369629, "global_step": 186186, "epoch": 2243} {"train_loss": -24.114646911621094, "global_step": 186187, "epoch": 2243} {"train_loss": -24.256895065307617, "global_step": 186188, "epoch": 2243} {"train_loss": -23.809860229492188, "global_step": 186189, "epoch": 2243} {"train_loss": -24.110280990600586, "global_step": 186190, "epoch": 2243} {"train_loss": -24.094823837280273, "global_step": 186191, "epoch": 2243} {"train_loss": -23.972288131713867, "global_step": 186192, "epoch": 2243} {"train_loss": -24.199357986450195, "global_step": 186193, "epoch": 2243} {"train_loss": -24.378238677978516, "global_step": 186194, "epoch": 2243} {"train_loss": -23.9415283203125, "global_step": 186195, "epoch": 2243} {"train_loss": -24.227441787719727, "global_step": 186196, "epoch": 2243} {"train_loss": -23.86750030517578, "global_step": 186197, "epoch": 2243} {"train_loss": -23.64362907409668, "global_step": 186198, "epoch": 2243} {"train_loss": -23.583372116088867, "global_step": 186199, "epoch": 2243} {"train_loss": -24.283233642578125, "global_step": 186200, "epoch": 2243} {"train_loss": -24.11494255065918, "global_step": 186201, "epoch": 2243} {"train_loss": -23.723390579223633, "global_step": 186202, "epoch": 2243} {"train_loss": -23.80684471130371, "global_step": 186203, "epoch": 2243} {"train_loss": -24.025754928588867, "global_step": 186204, "epoch": 2243} {"train_loss": -24.340925216674805, "global_step": 186205, "epoch": 2243} {"train_loss": -24.053558349609375, "global_step": 186206, "epoch": 2243} {"train_loss": -24.093847274780273, "global_step": 186207, "epoch": 2243} {"train_loss": -23.80714988708496, "global_step": 186208, "epoch": 2243} {"train_loss": -24.42964744567871, "global_step": 186209, "epoch": 2243} {"train_loss": -24.204498291015625, "global_step": 186210, "epoch": 2243} {"train_loss": -24.043291091918945, "global_step": 186211, "epoch": 2243} {"train_loss": -24.06976318359375, "global_step": 186212, "epoch": 2243} {"train_loss": -23.99367904663086, "global_step": 186213, "epoch": 2243} {"train_loss": -23.895811080932617, "global_step": 186214, "epoch": 2243} {"train_loss": -24.05660057067871, "global_step": 186215, "epoch": 2243} {"train_loss": -24.069501876831055, "global_step": 186216, "epoch": 2243} {"train_loss": -24.066452026367188, "global_step": 186217, "epoch": 2243} {"train_loss": -24.19638442993164, "global_step": 186218, "epoch": 2243} {"train_loss": -24.063642501831055, "global_step": 186219, "epoch": 2243} {"train_loss": -24.177167892456055, "global_step": 186220, "epoch": 2243} {"train_loss": -24.13483238220215, "global_step": 186221, "epoch": 2243} {"train_loss": -23.923246383666992, "global_step": 186222, "epoch": 2243} {"train_loss": -23.419174194335938, "global_step": 186223, "epoch": 2243} {"train_loss": -23.897174835205078, "global_step": 186224, "epoch": 2243} {"train_loss": -23.941877365112305, "global_step": 186225, "epoch": 2243} {"train_loss": -23.739416122436523, "global_step": 186226, "epoch": 2243} {"train_loss": -23.702863693237305, "global_step": 186227, "epoch": 2243} {"train_loss": -23.928434371948242, "global_step": 186228, "epoch": 2243} {"train_loss": -24.34661865234375, "global_step": 186229, "epoch": 2243} {"train_loss": -23.96238899230957, "global_step": 186230, "epoch": 2243} {"train_loss": -23.632896423339844, "global_step": 186231, "epoch": 2243} {"train_loss": -23.9749813079834, "global_step": 186232, "epoch": 2243} {"train_loss": -23.95404815673828, "global_step": 186233, "epoch": 2243} {"train_loss": -24.42399787902832, "global_step": 186234, "epoch": 2243} {"train_loss": -24.10400390625, "global_step": 186235, "epoch": 2243} {"train_loss": -24.394784927368164, "global_step": 186236, "epoch": 2243} {"train_loss": -24.12453842163086, "global_step": 186237, "epoch": 2243} {"train_loss": -24.400909423828125, "global_step": 186238, "epoch": 2243} {"train_loss": -24.033370971679688, "global_step": 186239, "epoch": 2243} {"train_loss": -23.984176635742188, "global_step": 186240, "epoch": 2243} {"train_loss": -24.372207641601562, "global_step": 186241, "epoch": 2243} {"train_loss": -24.32967185974121, "global_step": 186242, "epoch": 2243} {"train_loss": -24.04315185546875, "global_step": 186243, "epoch": 2243} {"train_loss": -24.254873275756836, "global_step": 186244, "epoch": 2243} {"train_loss": -24.03506088256836, "global_step": 186245, "epoch": 2243} {"train_loss": -23.971975326538086, "global_step": 186246, "epoch": 2243} {"train_loss": -23.913986206054688, "global_step": 186247, "epoch": 2243} {"train_loss": -23.88578224182129, "global_step": 186248, "epoch": 2243} {"train_loss": -24.05158042907715, "global_step": 186249, "epoch": 2243} {"train_loss": -23.879615783691406, "global_step": 186250, "epoch": 2243} {"train_loss": -23.99016646879265, "global_step": 186251, "epoch": 2243, "val_loss": 6487323.0} {"train_loss": -23.216506958007812, "global_step": 186252, "epoch": 2244} {"train_loss": -23.433210372924805, "global_step": 186253, "epoch": 2244} {"train_loss": -23.76197624206543, "global_step": 186254, "epoch": 2244} {"train_loss": -23.723241806030273, "global_step": 186255, "epoch": 2244} {"train_loss": -23.687570571899414, "global_step": 186256, "epoch": 2244} {"train_loss": -23.33660888671875, "global_step": 186257, "epoch": 2244} {"train_loss": -23.84834861755371, "global_step": 186258, "epoch": 2244} {"train_loss": -23.886571884155273, "global_step": 186259, "epoch": 2244} {"train_loss": -23.993289947509766, "global_step": 186260, "epoch": 2244} {"train_loss": -23.84185791015625, "global_step": 186261, "epoch": 2244} {"train_loss": -23.813138961791992, "global_step": 186262, "epoch": 2244} {"train_loss": -23.681758880615234, "global_step": 186263, "epoch": 2244} {"train_loss": -24.068538665771484, "global_step": 186264, "epoch": 2244} {"train_loss": -23.876340866088867, "global_step": 186265, "epoch": 2244} {"train_loss": -23.84078025817871, "global_step": 186266, "epoch": 2244} {"train_loss": -23.816823959350586, "global_step": 186267, "epoch": 2244} {"train_loss": -23.839759826660156, "global_step": 186268, "epoch": 2244} {"train_loss": -23.907047271728516, "global_step": 186269, "epoch": 2244} {"train_loss": -23.783479690551758, "global_step": 186270, "epoch": 2244} {"train_loss": -23.914997100830078, "global_step": 186271, "epoch": 2244} {"train_loss": -24.039196014404297, "global_step": 186272, "epoch": 2244} {"train_loss": -24.18221092224121, "global_step": 186273, "epoch": 2244} {"train_loss": -24.210033416748047, "global_step": 186274, "epoch": 2244} {"train_loss": -23.82367706298828, "global_step": 186275, "epoch": 2244} {"train_loss": -23.627857208251953, "global_step": 186276, "epoch": 2244} {"train_loss": -23.749542236328125, "global_step": 186277, "epoch": 2244} {"train_loss": -23.82845687866211, "global_step": 186278, "epoch": 2244} {"train_loss": -23.649646759033203, "global_step": 186279, "epoch": 2244} {"train_loss": -24.05735206604004, "global_step": 186280, "epoch": 2244} {"train_loss": -23.94319725036621, "global_step": 186281, "epoch": 2244} {"train_loss": -23.865041732788086, "global_step": 186282, "epoch": 2244} {"train_loss": -23.985055923461914, "global_step": 186283, "epoch": 2244} {"train_loss": -24.513456344604492, "global_step": 186284, "epoch": 2244} {"train_loss": -24.2639217376709, "global_step": 186285, "epoch": 2244} {"train_loss": -24.06059455871582, "global_step": 186286, "epoch": 2244} {"train_loss": -24.21323013305664, "global_step": 186287, "epoch": 2244} {"train_loss": -23.979841232299805, "global_step": 186288, "epoch": 2244} {"train_loss": -24.243810653686523, "global_step": 186289, "epoch": 2244} {"train_loss": -24.085617065429688, "global_step": 186290, "epoch": 2244} {"train_loss": -24.192279815673828, "global_step": 186291, "epoch": 2244} {"train_loss": -24.384353637695312, "global_step": 186292, "epoch": 2244} {"train_loss": -24.238265991210938, "global_step": 186293, "epoch": 2244} {"train_loss": -23.977712631225586, "global_step": 186294, "epoch": 2244} {"train_loss": -24.36155128479004, "global_step": 186295, "epoch": 2244} {"train_loss": -24.466068267822266, "global_step": 186296, "epoch": 2244} {"train_loss": -24.156099319458008, "global_step": 186297, "epoch": 2244} {"train_loss": -23.836170196533203, "global_step": 186298, "epoch": 2244} {"train_loss": -24.00116539001465, "global_step": 186299, "epoch": 2244} {"train_loss": -24.10149574279785, "global_step": 186300, "epoch": 2244} {"train_loss": -24.16786003112793, "global_step": 186301, "epoch": 2244} {"train_loss": -24.10846519470215, "global_step": 186302, "epoch": 2244} {"train_loss": -24.02125358581543, "global_step": 186303, "epoch": 2244} {"train_loss": -24.077255249023438, "global_step": 186304, "epoch": 2244} {"train_loss": -24.111055374145508, "global_step": 186305, "epoch": 2244} {"train_loss": -24.110549926757812, "global_step": 186306, "epoch": 2244} {"train_loss": -24.053787231445312, "global_step": 186307, "epoch": 2244} {"train_loss": -24.106826782226562, "global_step": 186308, "epoch": 2244} {"train_loss": -24.138425827026367, "global_step": 186309, "epoch": 2244} {"train_loss": -24.125152587890625, "global_step": 186310, "epoch": 2244} {"train_loss": -23.791276931762695, "global_step": 186311, "epoch": 2244} {"train_loss": -24.34098243713379, "global_step": 186312, "epoch": 2244} {"train_loss": -23.89238166809082, "global_step": 186313, "epoch": 2244} {"train_loss": -23.728179931640625, "global_step": 186314, "epoch": 2244} {"train_loss": -23.92534637451172, "global_step": 186315, "epoch": 2244} {"train_loss": -23.958919525146484, "global_step": 186316, "epoch": 2244} {"train_loss": -24.313806533813477, "global_step": 186317, "epoch": 2244} {"train_loss": -23.661884307861328, "global_step": 186318, "epoch": 2244} {"train_loss": -23.926856994628906, "global_step": 186319, "epoch": 2244} {"train_loss": -23.627925872802734, "global_step": 186320, "epoch": 2244} {"train_loss": -24.115201950073242, "global_step": 186321, "epoch": 2244} {"train_loss": -24.19770622253418, "global_step": 186322, "epoch": 2244} {"train_loss": -24.032718658447266, "global_step": 186323, "epoch": 2244} {"train_loss": -23.927326202392578, "global_step": 186324, "epoch": 2244} {"train_loss": -23.711639404296875, "global_step": 186325, "epoch": 2244} {"train_loss": -23.825197219848633, "global_step": 186326, "epoch": 2244} {"train_loss": -24.38509178161621, "global_step": 186327, "epoch": 2244} {"train_loss": -23.681419372558594, "global_step": 186328, "epoch": 2244} {"train_loss": -23.629037857055664, "global_step": 186329, "epoch": 2244} {"train_loss": -23.9251766204834, "global_step": 186330, "epoch": 2244} {"train_loss": -24.305509567260742, "global_step": 186331, "epoch": 2244} {"train_loss": -23.455841064453125, "global_step": 186332, "epoch": 2244} {"train_loss": -23.93695068359375, "global_step": 186333, "epoch": 2244} {"train_loss": -23.93693974506424, "global_step": 186334, "epoch": 2244, "val_loss": 6496292.0} {"train_loss": -23.24583625793457, "global_step": 186335, "epoch": 2245} {"train_loss": -23.03621482849121, "global_step": 186336, "epoch": 2245} {"train_loss": -23.618732452392578, "global_step": 186337, "epoch": 2245} {"train_loss": -22.800737380981445, "global_step": 186338, "epoch": 2245} {"train_loss": -23.607925415039062, "global_step": 186339, "epoch": 2245} {"train_loss": -23.36324119567871, "global_step": 186340, "epoch": 2245} {"train_loss": -23.1748046875, "global_step": 186341, "epoch": 2245} {"train_loss": -23.645971298217773, "global_step": 186342, "epoch": 2245} {"train_loss": -23.488752365112305, "global_step": 186343, "epoch": 2245} {"train_loss": -23.61345863342285, "global_step": 186344, "epoch": 2245} {"train_loss": -23.768526077270508, "global_step": 186345, "epoch": 2245} {"train_loss": -23.77471160888672, "global_step": 186346, "epoch": 2245} {"train_loss": -23.201025009155273, "global_step": 186347, "epoch": 2245} {"train_loss": -23.568748474121094, "global_step": 186348, "epoch": 2245} {"train_loss": -23.730300903320312, "global_step": 186349, "epoch": 2245} {"train_loss": -23.993274688720703, "global_step": 186350, "epoch": 2245} {"train_loss": -23.802734375, "global_step": 186351, "epoch": 2245} {"train_loss": -23.72127914428711, "global_step": 186352, "epoch": 2245} {"train_loss": -23.468002319335938, "global_step": 186353, "epoch": 2245} {"train_loss": -24.122215270996094, "global_step": 186354, "epoch": 2245} {"train_loss": -23.74945640563965, "global_step": 186355, "epoch": 2245} {"train_loss": -24.024938583374023, "global_step": 186356, "epoch": 2245} {"train_loss": -23.725515365600586, "global_step": 186357, "epoch": 2245} {"train_loss": -23.442245483398438, "global_step": 186358, "epoch": 2245} {"train_loss": -23.809898376464844, "global_step": 186359, "epoch": 2245} {"train_loss": -24.13926887512207, "global_step": 186360, "epoch": 2245} {"train_loss": -23.617101669311523, "global_step": 186361, "epoch": 2245} {"train_loss": -24.15481948852539, "global_step": 186362, "epoch": 2245} {"train_loss": -23.7021541595459, "global_step": 186363, "epoch": 2245} {"train_loss": -23.74115753173828, "global_step": 186364, "epoch": 2245} {"train_loss": -23.775501251220703, "global_step": 186365, "epoch": 2245} {"train_loss": -24.117856979370117, "global_step": 186366, "epoch": 2245} {"train_loss": -23.71613883972168, "global_step": 186367, "epoch": 2245} {"train_loss": -23.910585403442383, "global_step": 186368, "epoch": 2245} {"train_loss": -23.93260383605957, "global_step": 186369, "epoch": 2245} {"train_loss": -24.071399688720703, "global_step": 186370, "epoch": 2245} {"train_loss": -24.090240478515625, "global_step": 186371, "epoch": 2245} {"train_loss": -23.5952205657959, "global_step": 186372, "epoch": 2245} {"train_loss": -24.133777618408203, "global_step": 186373, "epoch": 2245} {"train_loss": -24.030643463134766, "global_step": 186374, "epoch": 2245} {"train_loss": -23.812589645385742, "global_step": 186375, "epoch": 2245} {"train_loss": -23.760150909423828, "global_step": 186376, "epoch": 2245} {"train_loss": -24.0450496673584, "global_step": 186377, "epoch": 2245} {"train_loss": -23.772296905517578, "global_step": 186378, "epoch": 2245} {"train_loss": -24.223142623901367, "global_step": 186379, "epoch": 2245} {"train_loss": -23.99095916748047, "global_step": 186380, "epoch": 2245} {"train_loss": -23.807804107666016, "global_step": 186381, "epoch": 2245} {"train_loss": -23.91265869140625, "global_step": 186382, "epoch": 2245} {"train_loss": -24.150075912475586, "global_step": 186383, "epoch": 2245} {"train_loss": -24.1181640625, "global_step": 186384, "epoch": 2245} {"train_loss": -24.01974868774414, "global_step": 186385, "epoch": 2245} {"train_loss": -23.733701705932617, "global_step": 186386, "epoch": 2245} {"train_loss": -24.077505111694336, "global_step": 186387, "epoch": 2245} {"train_loss": -23.65424156188965, "global_step": 186388, "epoch": 2245} {"train_loss": -24.215978622436523, "global_step": 186389, "epoch": 2245} {"train_loss": -24.267179489135742, "global_step": 186390, "epoch": 2245} {"train_loss": -23.745372772216797, "global_step": 186391, "epoch": 2245} {"train_loss": -24.06903648376465, "global_step": 186392, "epoch": 2245} {"train_loss": -24.541095733642578, "global_step": 186393, "epoch": 2245} {"train_loss": -24.062454223632812, "global_step": 186394, "epoch": 2245} {"train_loss": -23.98020362854004, "global_step": 186395, "epoch": 2245} {"train_loss": -23.87172508239746, "global_step": 186396, "epoch": 2245} {"train_loss": -24.20157814025879, "global_step": 186397, "epoch": 2245} {"train_loss": -24.016382217407227, "global_step": 186398, "epoch": 2245} {"train_loss": -24.189956665039062, "global_step": 186399, "epoch": 2245} {"train_loss": -24.05866241455078, "global_step": 186400, "epoch": 2245} {"train_loss": -23.972869873046875, "global_step": 186401, "epoch": 2245} {"train_loss": -24.191862106323242, "global_step": 186402, "epoch": 2245} {"train_loss": -24.228145599365234, "global_step": 186403, "epoch": 2245} {"train_loss": -24.23760414123535, "global_step": 186404, "epoch": 2245} {"train_loss": -24.031539916992188, "global_step": 186405, "epoch": 2245} {"train_loss": -24.301836013793945, "global_step": 186406, "epoch": 2245} {"train_loss": -24.519926071166992, "global_step": 186407, "epoch": 2245} {"train_loss": -23.92340660095215, "global_step": 186408, "epoch": 2245} {"train_loss": -24.1295166015625, "global_step": 186409, "epoch": 2245} {"train_loss": -23.95106315612793, "global_step": 186410, "epoch": 2245} {"train_loss": -24.20881462097168, "global_step": 186411, "epoch": 2245} {"train_loss": -24.088171005249023, "global_step": 186412, "epoch": 2245} {"train_loss": -24.011571884155273, "global_step": 186413, "epoch": 2245} {"train_loss": -24.300987243652344, "global_step": 186414, "epoch": 2245} {"train_loss": -24.082035064697266, "global_step": 186415, "epoch": 2245} {"train_loss": -24.41579246520996, "global_step": 186416, "epoch": 2245} {"train_loss": -23.90240117727992, "global_step": 186417, "epoch": 2245, "val_loss": 6404706.0} {"train_loss": -23.927148818969727, "global_step": 186418, "epoch": 2246} {"train_loss": -23.454212188720703, "global_step": 186419, "epoch": 2246} {"train_loss": -23.05006980895996, "global_step": 186420, "epoch": 2246} {"train_loss": -23.61106300354004, "global_step": 186421, "epoch": 2246} {"train_loss": -23.4929256439209, "global_step": 186422, "epoch": 2246} {"train_loss": -23.692398071289062, "global_step": 186423, "epoch": 2246} {"train_loss": -23.495227813720703, "global_step": 186424, "epoch": 2246} {"train_loss": -24.114866256713867, "global_step": 186425, "epoch": 2246} {"train_loss": -23.689550399780273, "global_step": 186426, "epoch": 2246} {"train_loss": -23.422164916992188, "global_step": 186427, "epoch": 2246} {"train_loss": -23.468530654907227, "global_step": 186428, "epoch": 2246} {"train_loss": -23.988855361938477, "global_step": 186429, "epoch": 2246} {"train_loss": -24.037046432495117, "global_step": 186430, "epoch": 2246} {"train_loss": -24.04448127746582, "global_step": 186431, "epoch": 2246} {"train_loss": -23.537466049194336, "global_step": 186432, "epoch": 2246} {"train_loss": -23.788061141967773, "global_step": 186433, "epoch": 2246} {"train_loss": -24.005285263061523, "global_step": 186434, "epoch": 2246} {"train_loss": -23.907861709594727, "global_step": 186435, "epoch": 2246} {"train_loss": -24.258480072021484, "global_step": 186436, "epoch": 2246} {"train_loss": -24.34060287475586, "global_step": 186437, "epoch": 2246} {"train_loss": -24.199487686157227, "global_step": 186438, "epoch": 2246} {"train_loss": -24.217212677001953, "global_step": 186439, "epoch": 2246} {"train_loss": -24.05027198791504, "global_step": 186440, "epoch": 2246} {"train_loss": -24.18057632446289, "global_step": 186441, "epoch": 2246} {"train_loss": -23.693683624267578, "global_step": 186442, "epoch": 2246} {"train_loss": -24.220396041870117, "global_step": 186443, "epoch": 2246} {"train_loss": -24.197463989257812, "global_step": 186444, "epoch": 2246} {"train_loss": -23.72769546508789, "global_step": 186445, "epoch": 2246} {"train_loss": -23.89569664001465, "global_step": 186446, "epoch": 2246} {"train_loss": -23.635513305664062, "global_step": 186447, "epoch": 2246} {"train_loss": -24.44057846069336, "global_step": 186448, "epoch": 2246} {"train_loss": -24.169958114624023, "global_step": 186449, "epoch": 2246} {"train_loss": -24.16364097595215, "global_step": 186450, "epoch": 2246} {"train_loss": -24.081024169921875, "global_step": 186451, "epoch": 2246} {"train_loss": -23.91082763671875, "global_step": 186452, "epoch": 2246} {"train_loss": -24.127323150634766, "global_step": 186453, "epoch": 2246} {"train_loss": -23.688434600830078, "global_step": 186454, "epoch": 2246} {"train_loss": -24.104093551635742, "global_step": 186455, "epoch": 2246} {"train_loss": -23.98541831970215, "global_step": 186456, "epoch": 2246} {"train_loss": -24.077030181884766, "global_step": 186457, "epoch": 2246} {"train_loss": -23.800769805908203, "global_step": 186458, "epoch": 2246} {"train_loss": -23.76242446899414, "global_step": 186459, "epoch": 2246} {"train_loss": -23.97440528869629, "global_step": 186460, "epoch": 2246} {"train_loss": -24.061262130737305, "global_step": 186461, "epoch": 2246} {"train_loss": -24.16756248474121, "global_step": 186462, "epoch": 2246} {"train_loss": -24.228084564208984, "global_step": 186463, "epoch": 2246} {"train_loss": -23.919057846069336, "global_step": 186464, "epoch": 2246} {"train_loss": -24.114089965820312, "global_step": 186465, "epoch": 2246} {"train_loss": -23.646642684936523, "global_step": 186466, "epoch": 2246} {"train_loss": -24.01590919494629, "global_step": 186467, "epoch": 2246} {"train_loss": -24.14295768737793, "global_step": 186468, "epoch": 2246} {"train_loss": -23.7995662689209, "global_step": 186469, "epoch": 2246} {"train_loss": -24.13494110107422, "global_step": 186470, "epoch": 2246} {"train_loss": -24.3546199798584, "global_step": 186471, "epoch": 2246} {"train_loss": -24.2185001373291, "global_step": 186472, "epoch": 2246} {"train_loss": -23.901517868041992, "global_step": 186473, "epoch": 2246} {"train_loss": -24.447216033935547, "global_step": 186474, "epoch": 2246} {"train_loss": -24.34919548034668, "global_step": 186475, "epoch": 2246} {"train_loss": -24.27435302734375, "global_step": 186476, "epoch": 2246} {"train_loss": -24.176557540893555, "global_step": 186477, "epoch": 2246} {"train_loss": -23.982765197753906, "global_step": 186478, "epoch": 2246} {"train_loss": -23.819747924804688, "global_step": 186479, "epoch": 2246} {"train_loss": -24.044044494628906, "global_step": 186480, "epoch": 2246} {"train_loss": -24.08791160583496, "global_step": 186481, "epoch": 2246} {"train_loss": -24.198333740234375, "global_step": 186482, "epoch": 2246} {"train_loss": -24.245731353759766, "global_step": 186483, "epoch": 2246} {"train_loss": -23.9506893157959, "global_step": 186484, "epoch": 2246} {"train_loss": -24.192197799682617, "global_step": 186485, "epoch": 2246} {"train_loss": -24.29535484313965, "global_step": 186486, "epoch": 2246} {"train_loss": -23.983816146850586, "global_step": 186487, "epoch": 2246} {"train_loss": -24.279508590698242, "global_step": 186488, "epoch": 2246} {"train_loss": -24.140762329101562, "global_step": 186489, "epoch": 2246} {"train_loss": -24.11859703063965, "global_step": 186490, "epoch": 2246} {"train_loss": -24.001012802124023, "global_step": 186491, "epoch": 2246} {"train_loss": -23.795127868652344, "global_step": 186492, "epoch": 2246} {"train_loss": -24.001554489135742, "global_step": 186493, "epoch": 2246} {"train_loss": -24.082136154174805, "global_step": 186494, "epoch": 2246} {"train_loss": -23.934619903564453, "global_step": 186495, "epoch": 2246} {"train_loss": -24.198299407958984, "global_step": 186496, "epoch": 2246} {"train_loss": -23.77313232421875, "global_step": 186497, "epoch": 2246} {"train_loss": -24.091053009033203, "global_step": 186498, "epoch": 2246} {"train_loss": -24.382850646972656, "global_step": 186499, "epoch": 2246} {"train_loss": -23.98309790369976, "global_step": 186500, "epoch": 2246, "val_loss": 6576375.5} {"train_loss": -24.194223403930664, "global_step": 186501, "epoch": 2247} {"train_loss": -23.696292877197266, "global_step": 186502, "epoch": 2247} {"train_loss": -23.65738296508789, "global_step": 186503, "epoch": 2247} {"train_loss": -23.803869247436523, "global_step": 186504, "epoch": 2247} {"train_loss": -24.091516494750977, "global_step": 186505, "epoch": 2247} {"train_loss": -23.89304542541504, "global_step": 186506, "epoch": 2247} {"train_loss": -23.685928344726562, "global_step": 186507, "epoch": 2247} {"train_loss": -24.282821655273438, "global_step": 186508, "epoch": 2247} {"train_loss": -23.82416343688965, "global_step": 186509, "epoch": 2247} {"train_loss": -23.437158584594727, "global_step": 186510, "epoch": 2247} {"train_loss": -23.682815551757812, "global_step": 186511, "epoch": 2247} {"train_loss": -23.749364852905273, "global_step": 186512, "epoch": 2247} {"train_loss": -23.886795043945312, "global_step": 186513, "epoch": 2247} {"train_loss": -23.545732498168945, "global_step": 186514, "epoch": 2247} {"train_loss": -23.74062156677246, "global_step": 186515, "epoch": 2247} {"train_loss": -24.05142593383789, "global_step": 186516, "epoch": 2247} {"train_loss": -23.805471420288086, "global_step": 186517, "epoch": 2247} {"train_loss": -23.5616512298584, "global_step": 186518, "epoch": 2247} {"train_loss": -24.09869384765625, "global_step": 186519, "epoch": 2247} {"train_loss": -24.16411781311035, "global_step": 186520, "epoch": 2247} {"train_loss": -23.920480728149414, "global_step": 186521, "epoch": 2247} {"train_loss": -23.960376739501953, "global_step": 186522, "epoch": 2247} {"train_loss": -24.114362716674805, "global_step": 186523, "epoch": 2247} {"train_loss": -23.985204696655273, "global_step": 186524, "epoch": 2247} {"train_loss": -24.245542526245117, "global_step": 186525, "epoch": 2247} {"train_loss": -23.859228134155273, "global_step": 186526, "epoch": 2247} {"train_loss": -24.269079208374023, "global_step": 186527, "epoch": 2247} {"train_loss": -24.368228912353516, "global_step": 186528, "epoch": 2247} {"train_loss": -24.053180694580078, "global_step": 186529, "epoch": 2247} {"train_loss": -24.258363723754883, "global_step": 186530, "epoch": 2247} {"train_loss": -24.324886322021484, "global_step": 186531, "epoch": 2247} {"train_loss": -24.22303009033203, "global_step": 186532, "epoch": 2247} {"train_loss": -24.353269577026367, "global_step": 186533, "epoch": 2247} {"train_loss": -24.20732879638672, "global_step": 186534, "epoch": 2247} {"train_loss": -24.100086212158203, "global_step": 186535, "epoch": 2247} {"train_loss": -24.116056442260742, "global_step": 186536, "epoch": 2247} {"train_loss": -23.969839096069336, "global_step": 186537, "epoch": 2247} {"train_loss": -23.84670066833496, "global_step": 186538, "epoch": 2247} {"train_loss": -24.25834083557129, "global_step": 186539, "epoch": 2247} {"train_loss": -24.03663444519043, "global_step": 186540, "epoch": 2247} {"train_loss": -23.810354232788086, "global_step": 186541, "epoch": 2247} {"train_loss": -23.92734146118164, "global_step": 186542, "epoch": 2247} {"train_loss": -24.269025802612305, "global_step": 186543, "epoch": 2247} {"train_loss": -23.956083297729492, "global_step": 186544, "epoch": 2247} {"train_loss": -23.458850860595703, "global_step": 186545, "epoch": 2247} {"train_loss": -23.698392868041992, "global_step": 186546, "epoch": 2247} {"train_loss": -23.90437126159668, "global_step": 186547, "epoch": 2247} {"train_loss": -23.15717124938965, "global_step": 186548, "epoch": 2247} {"train_loss": -23.871610641479492, "global_step": 186549, "epoch": 2247} {"train_loss": -23.804136276245117, "global_step": 186550, "epoch": 2247} {"train_loss": -24.068952560424805, "global_step": 186551, "epoch": 2247} {"train_loss": -24.039844512939453, "global_step": 186552, "epoch": 2247} {"train_loss": -23.86680030822754, "global_step": 186553, "epoch": 2247} {"train_loss": -24.108509063720703, "global_step": 186554, "epoch": 2247} {"train_loss": -23.86710548400879, "global_step": 186555, "epoch": 2247} {"train_loss": -23.632587432861328, "global_step": 186556, "epoch": 2247} {"train_loss": -23.92116928100586, "global_step": 186557, "epoch": 2247} {"train_loss": -23.911405563354492, "global_step": 186558, "epoch": 2247} {"train_loss": -23.826196670532227, "global_step": 186559, "epoch": 2247} {"train_loss": -23.766286849975586, "global_step": 186560, "epoch": 2247} {"train_loss": -23.73069953918457, "global_step": 186561, "epoch": 2247} {"train_loss": -24.183124542236328, "global_step": 186562, "epoch": 2247} {"train_loss": -23.99571418762207, "global_step": 186563, "epoch": 2247} {"train_loss": -24.041961669921875, "global_step": 186564, "epoch": 2247} {"train_loss": -23.962121963500977, "global_step": 186565, "epoch": 2247} {"train_loss": -24.088735580444336, "global_step": 186566, "epoch": 2247} {"train_loss": -23.962509155273438, "global_step": 186567, "epoch": 2247} {"train_loss": -23.94194984436035, "global_step": 186568, "epoch": 2247} {"train_loss": -23.961374282836914, "global_step": 186569, "epoch": 2247} {"train_loss": -24.313501358032227, "global_step": 186570, "epoch": 2247} {"train_loss": -24.095142364501953, "global_step": 186571, "epoch": 2247} {"train_loss": -23.99503517150879, "global_step": 186572, "epoch": 2247} {"train_loss": -24.188039779663086, "global_step": 186573, "epoch": 2247} {"train_loss": -24.04524803161621, "global_step": 186574, "epoch": 2247} {"train_loss": -24.369495391845703, "global_step": 186575, "epoch": 2247} {"train_loss": -23.823501586914062, "global_step": 186576, "epoch": 2247} {"train_loss": -23.96031951904297, "global_step": 186577, "epoch": 2247} {"train_loss": -24.005596160888672, "global_step": 186578, "epoch": 2247} {"train_loss": -24.00069808959961, "global_step": 186579, "epoch": 2247} {"train_loss": -24.298492431640625, "global_step": 186580, "epoch": 2247} {"train_loss": -24.002002716064453, "global_step": 186581, "epoch": 2247} {"train_loss": -24.302318572998047, "global_step": 186582, "epoch": 2247} {"train_loss": -23.961516368820007, "global_step": 186583, "epoch": 2247, "val_loss": 6582352.0} {"train_loss": -22.869049072265625, "global_step": 186584, "epoch": 2248} {"train_loss": -23.662906646728516, "global_step": 186585, "epoch": 2248} {"train_loss": -23.382192611694336, "global_step": 186586, "epoch": 2248} {"train_loss": -23.401145935058594, "global_step": 186587, "epoch": 2248} {"train_loss": -23.20586585998535, "global_step": 186588, "epoch": 2248} {"train_loss": -22.893762588500977, "global_step": 186589, "epoch": 2248} {"train_loss": -23.515958786010742, "global_step": 186590, "epoch": 2248} {"train_loss": -23.250530242919922, "global_step": 186591, "epoch": 2248} {"train_loss": -23.638364791870117, "global_step": 186592, "epoch": 2248} {"train_loss": -23.137800216674805, "global_step": 186593, "epoch": 2248} {"train_loss": -24.089025497436523, "global_step": 186594, "epoch": 2248} {"train_loss": -23.14288902282715, "global_step": 186595, "epoch": 2248} {"train_loss": -23.727807998657227, "global_step": 186596, "epoch": 2248} {"train_loss": -23.43429946899414, "global_step": 186597, "epoch": 2248} {"train_loss": -23.45210075378418, "global_step": 186598, "epoch": 2248} {"train_loss": -23.505645751953125, "global_step": 186599, "epoch": 2248} {"train_loss": -23.526403427124023, "global_step": 186600, "epoch": 2248} {"train_loss": -23.30840301513672, "global_step": 186601, "epoch": 2248} {"train_loss": -23.846006393432617, "global_step": 186602, "epoch": 2248} {"train_loss": -23.9272518157959, "global_step": 186603, "epoch": 2248} {"train_loss": -23.7977294921875, "global_step": 186604, "epoch": 2248} {"train_loss": -23.895627975463867, "global_step": 186605, "epoch": 2248} {"train_loss": -23.4736385345459, "global_step": 186606, "epoch": 2248} {"train_loss": -23.626760482788086, "global_step": 186607, "epoch": 2248} {"train_loss": -23.772520065307617, "global_step": 186608, "epoch": 2248} {"train_loss": -23.801847457885742, "global_step": 186609, "epoch": 2248} {"train_loss": -23.66953468322754, "global_step": 186610, "epoch": 2248} {"train_loss": -23.980905532836914, "global_step": 186611, "epoch": 2248} {"train_loss": -24.350313186645508, "global_step": 186612, "epoch": 2248} {"train_loss": -24.146142959594727, "global_step": 186613, "epoch": 2248} {"train_loss": -23.90659523010254, "global_step": 186614, "epoch": 2248} {"train_loss": -24.247968673706055, "global_step": 186615, "epoch": 2248} {"train_loss": -24.217458724975586, "global_step": 186616, "epoch": 2248} {"train_loss": -23.764739990234375, "global_step": 186617, "epoch": 2248} {"train_loss": -23.819732666015625, "global_step": 186618, "epoch": 2248} {"train_loss": -23.942285537719727, "global_step": 186619, "epoch": 2248} {"train_loss": -24.02778434753418, "global_step": 186620, "epoch": 2248} {"train_loss": -23.682035446166992, "global_step": 186621, "epoch": 2248} {"train_loss": -23.91379165649414, "global_step": 186622, "epoch": 2248} {"train_loss": -24.190366744995117, "global_step": 186623, "epoch": 2248} {"train_loss": -24.272789001464844, "global_step": 186624, "epoch": 2248} {"train_loss": -24.357328414916992, "global_step": 186625, "epoch": 2248} {"train_loss": -23.78631019592285, "global_step": 186626, "epoch": 2248} {"train_loss": -24.03934097290039, "global_step": 186627, "epoch": 2248} {"train_loss": -24.134714126586914, "global_step": 186628, "epoch": 2248} {"train_loss": -24.238187789916992, "global_step": 186629, "epoch": 2248} {"train_loss": -24.043977737426758, "global_step": 186630, "epoch": 2248} {"train_loss": -24.1112003326416, "global_step": 186631, "epoch": 2248} {"train_loss": -24.034318923950195, "global_step": 186632, "epoch": 2248} {"train_loss": -23.83574867248535, "global_step": 186633, "epoch": 2248} {"train_loss": -24.29766845703125, "global_step": 186634, "epoch": 2248} {"train_loss": -24.119403839111328, "global_step": 186635, "epoch": 2248} {"train_loss": -23.813520431518555, "global_step": 186636, "epoch": 2248} {"train_loss": -24.236743927001953, "global_step": 186637, "epoch": 2248} {"train_loss": -23.97454071044922, "global_step": 186638, "epoch": 2248} {"train_loss": -24.130325317382812, "global_step": 186639, "epoch": 2248} {"train_loss": -23.5142879486084, "global_step": 186640, "epoch": 2248} {"train_loss": -23.132604598999023, "global_step": 186641, "epoch": 2248} {"train_loss": -23.759000778198242, "global_step": 186642, "epoch": 2248} {"train_loss": -24.20568084716797, "global_step": 186643, "epoch": 2248} {"train_loss": -23.919620513916016, "global_step": 186644, "epoch": 2248} {"train_loss": -23.714094161987305, "global_step": 186645, "epoch": 2248} {"train_loss": -24.07712745666504, "global_step": 186646, "epoch": 2248} {"train_loss": -24.0780029296875, "global_step": 186647, "epoch": 2248} {"train_loss": -23.810434341430664, "global_step": 186648, "epoch": 2248} {"train_loss": -24.07717514038086, "global_step": 186649, "epoch": 2248} {"train_loss": -24.331893920898438, "global_step": 186650, "epoch": 2248} {"train_loss": -24.08441162109375, "global_step": 186651, "epoch": 2248} {"train_loss": -24.20465850830078, "global_step": 186652, "epoch": 2248} {"train_loss": -23.887357711791992, "global_step": 186653, "epoch": 2248} {"train_loss": -23.75356101989746, "global_step": 186654, "epoch": 2248} {"train_loss": -23.85505485534668, "global_step": 186655, "epoch": 2248} {"train_loss": -24.037904739379883, "global_step": 186656, "epoch": 2248} {"train_loss": -24.16681480407715, "global_step": 186657, "epoch": 2248} {"train_loss": -24.295944213867188, "global_step": 186658, "epoch": 2248} {"train_loss": -24.434823989868164, "global_step": 186659, "epoch": 2248} {"train_loss": -24.19907569885254, "global_step": 186660, "epoch": 2248} {"train_loss": -24.046140670776367, "global_step": 186661, "epoch": 2248} {"train_loss": -24.09169578552246, "global_step": 186662, "epoch": 2248} {"train_loss": -24.05574607849121, "global_step": 186663, "epoch": 2248} {"train_loss": -24.248411178588867, "global_step": 186664, "epoch": 2248} {"train_loss": -24.12726402282715, "global_step": 186665, "epoch": 2248} {"train_loss": -23.86496840327619, "global_step": 186666, "epoch": 2248, "val_loss": 6477227.0} {"train_loss": -23.582626342773438, "global_step": 186667, "epoch": 2249} {"train_loss": -23.96857261657715, "global_step": 186668, "epoch": 2249} {"train_loss": -23.926651000976562, "global_step": 186669, "epoch": 2249} {"train_loss": -23.9890193939209, "global_step": 186670, "epoch": 2249} {"train_loss": -23.946556091308594, "global_step": 186671, "epoch": 2249} {"train_loss": -24.14705467224121, "global_step": 186672, "epoch": 2249} {"train_loss": -23.829069137573242, "global_step": 186673, "epoch": 2249} {"train_loss": -24.03626823425293, "global_step": 186674, "epoch": 2249} {"train_loss": -23.879648208618164, "global_step": 186675, "epoch": 2249} {"train_loss": -23.888742446899414, "global_step": 186676, "epoch": 2249} {"train_loss": -24.03260612487793, "global_step": 186677, "epoch": 2249} {"train_loss": -24.02457618713379, "global_step": 186678, "epoch": 2249} {"train_loss": -23.730863571166992, "global_step": 186679, "epoch": 2249} {"train_loss": -23.507095336914062, "global_step": 186680, "epoch": 2249} {"train_loss": -23.9354305267334, "global_step": 186681, "epoch": 2249} {"train_loss": -23.558698654174805, "global_step": 186682, "epoch": 2249} {"train_loss": -24.07386589050293, "global_step": 186683, "epoch": 2249} {"train_loss": -24.15206527709961, "global_step": 186684, "epoch": 2249} {"train_loss": -23.842985153198242, "global_step": 186685, "epoch": 2249} {"train_loss": -24.038925170898438, "global_step": 186686, "epoch": 2249} {"train_loss": -24.01255226135254, "global_step": 186687, "epoch": 2249} {"train_loss": -24.147384643554688, "global_step": 186688, "epoch": 2249} {"train_loss": -23.96489715576172, "global_step": 186689, "epoch": 2249} {"train_loss": -23.92279052734375, "global_step": 186690, "epoch": 2249} {"train_loss": -23.85288429260254, "global_step": 186691, "epoch": 2249} {"train_loss": -24.46161460876465, "global_step": 186692, "epoch": 2249} {"train_loss": -24.276403427124023, "global_step": 186693, "epoch": 2249} {"train_loss": -24.29152488708496, "global_step": 186694, "epoch": 2249} {"train_loss": -24.17725944519043, "global_step": 186695, "epoch": 2249} {"train_loss": -23.850683212280273, "global_step": 186696, "epoch": 2249} {"train_loss": -23.849567413330078, "global_step": 186697, "epoch": 2249} {"train_loss": -23.785688400268555, "global_step": 186698, "epoch": 2249} {"train_loss": -23.904964447021484, "global_step": 186699, "epoch": 2249} {"train_loss": -24.703954696655273, "global_step": 186700, "epoch": 2249} {"train_loss": -23.812917709350586, "global_step": 186701, "epoch": 2249} {"train_loss": -24.151826858520508, "global_step": 186702, "epoch": 2249} {"train_loss": -24.02231216430664, "global_step": 186703, "epoch": 2249} {"train_loss": -24.13637351989746, "global_step": 186704, "epoch": 2249} {"train_loss": -24.165525436401367, "global_step": 186705, "epoch": 2249} {"train_loss": -24.486011505126953, "global_step": 186706, "epoch": 2249} {"train_loss": -24.193241119384766, "global_step": 186707, "epoch": 2249} {"train_loss": -24.355314254760742, "global_step": 186708, "epoch": 2249} {"train_loss": -24.149076461791992, "global_step": 186709, "epoch": 2249} {"train_loss": -23.892702102661133, "global_step": 186710, "epoch": 2249} {"train_loss": -23.949811935424805, "global_step": 186711, "epoch": 2249} {"train_loss": -24.144306182861328, "global_step": 186712, "epoch": 2249} {"train_loss": -23.851224899291992, "global_step": 186713, "epoch": 2249} {"train_loss": -24.242313385009766, "global_step": 186714, "epoch": 2249} {"train_loss": -23.753467559814453, "global_step": 186715, "epoch": 2249} {"train_loss": -24.07035255432129, "global_step": 186716, "epoch": 2249} {"train_loss": -24.203458786010742, "global_step": 186717, "epoch": 2249} {"train_loss": -24.214941024780273, "global_step": 186718, "epoch": 2249} {"train_loss": -23.767282485961914, "global_step": 186719, "epoch": 2249} {"train_loss": -23.88953971862793, "global_step": 186720, "epoch": 2249} {"train_loss": -24.07734489440918, "global_step": 186721, "epoch": 2249} {"train_loss": -23.969070434570312, "global_step": 186722, "epoch": 2249} {"train_loss": -24.162643432617188, "global_step": 186723, "epoch": 2249} {"train_loss": -24.004186630249023, "global_step": 186724, "epoch": 2249} {"train_loss": -23.891651153564453, "global_step": 186725, "epoch": 2249} {"train_loss": -23.73166847229004, "global_step": 186726, "epoch": 2249} {"train_loss": -23.819488525390625, "global_step": 186727, "epoch": 2249} {"train_loss": -23.65182876586914, "global_step": 186728, "epoch": 2249} {"train_loss": -23.886953353881836, "global_step": 186729, "epoch": 2249} {"train_loss": -23.570362091064453, "global_step": 186730, "epoch": 2249} {"train_loss": -23.851245880126953, "global_step": 186731, "epoch": 2249} {"train_loss": -24.226390838623047, "global_step": 186732, "epoch": 2249} {"train_loss": -23.9412899017334, "global_step": 186733, "epoch": 2249} {"train_loss": -24.019384384155273, "global_step": 186734, "epoch": 2249} {"train_loss": -24.200754165649414, "global_step": 186735, "epoch": 2249} {"train_loss": -24.179929733276367, "global_step": 186736, "epoch": 2249} {"train_loss": -23.986467361450195, "global_step": 186737, "epoch": 2249} {"train_loss": -24.2142391204834, "global_step": 186738, "epoch": 2249} {"train_loss": -23.766740798950195, "global_step": 186739, "epoch": 2249} {"train_loss": -24.10824966430664, "global_step": 186740, "epoch": 2249} {"train_loss": -24.04108428955078, "global_step": 186741, "epoch": 2249} {"train_loss": -23.85234832763672, "global_step": 186742, "epoch": 2249} {"train_loss": -23.903789520263672, "global_step": 186743, "epoch": 2249} {"train_loss": -23.566043853759766, "global_step": 186744, "epoch": 2249} {"train_loss": -23.713668823242188, "global_step": 186745, "epoch": 2249} {"train_loss": -24.066923141479492, "global_step": 186746, "epoch": 2249} {"train_loss": -23.580469131469727, "global_step": 186747, "epoch": 2249} {"train_loss": -23.186317443847656, "global_step": 186748, "epoch": 2249} {"train_loss": -23.95812845804605, "global_step": 186749, "epoch": 2249, "val_loss": 6507505.0} {"train_loss": -20.84852409362793, "global_step": 186750, "epoch": 2250} {"train_loss": -22.649608612060547, "global_step": 186751, "epoch": 2250} {"train_loss": -22.201154708862305, "global_step": 186752, "epoch": 2250} {"train_loss": -22.919416427612305, "global_step": 186753, "epoch": 2250} {"train_loss": -21.80078887939453, "global_step": 186754, "epoch": 2250} {"train_loss": -23.324127197265625, "global_step": 186755, "epoch": 2250} {"train_loss": -22.221399307250977, "global_step": 186756, "epoch": 2250} {"train_loss": -23.02467155456543, "global_step": 186757, "epoch": 2250} {"train_loss": -23.22616958618164, "global_step": 186758, "epoch": 2250} {"train_loss": -22.786300659179688, "global_step": 186759, "epoch": 2250} {"train_loss": -23.06610679626465, "global_step": 186760, "epoch": 2250} {"train_loss": -23.131484985351562, "global_step": 186761, "epoch": 2250} {"train_loss": -23.379941940307617, "global_step": 186762, "epoch": 2250} {"train_loss": -23.348960876464844, "global_step": 186763, "epoch": 2250} {"train_loss": -23.372848510742188, "global_step": 186764, "epoch": 2250} {"train_loss": -23.056310653686523, "global_step": 186765, "epoch": 2250} {"train_loss": -23.39577293395996, "global_step": 186766, "epoch": 2250} {"train_loss": -23.646146774291992, "global_step": 186767, "epoch": 2250} {"train_loss": -23.477331161499023, "global_step": 186768, "epoch": 2250} {"train_loss": -23.312599182128906, "global_step": 186769, "epoch": 2250} {"train_loss": -23.593385696411133, "global_step": 186770, "epoch": 2250} {"train_loss": -23.366987228393555, "global_step": 186771, "epoch": 2250} {"train_loss": -23.434423446655273, "global_step": 186772, "epoch": 2250} {"train_loss": -23.427488327026367, "global_step": 186773, "epoch": 2250} {"train_loss": -23.933685302734375, "global_step": 186774, "epoch": 2250} {"train_loss": -23.634632110595703, "global_step": 186775, "epoch": 2250} {"train_loss": -23.55946922302246, "global_step": 186776, "epoch": 2250} {"train_loss": -23.5955867767334, "global_step": 186777, "epoch": 2250} {"train_loss": -23.225934982299805, "global_step": 186778, "epoch": 2250} {"train_loss": -23.43059539794922, "global_step": 186779, "epoch": 2250} {"train_loss": -23.577056884765625, "global_step": 186780, "epoch": 2250} {"train_loss": -23.367483139038086, "global_step": 186781, "epoch": 2250} {"train_loss": -23.7066650390625, "global_step": 186782, "epoch": 2250} {"train_loss": -23.589832305908203, "global_step": 186783, "epoch": 2250} {"train_loss": -23.474075317382812, "global_step": 186784, "epoch": 2250} {"train_loss": -23.87397575378418, "global_step": 186785, "epoch": 2250} {"train_loss": -23.76705551147461, "global_step": 186786, "epoch": 2250} {"train_loss": -24.233884811401367, "global_step": 186787, "epoch": 2250} {"train_loss": -23.758686065673828, "global_step": 186788, "epoch": 2250} {"train_loss": -24.085662841796875, "global_step": 186789, "epoch": 2250} {"train_loss": -23.663597106933594, "global_step": 186790, "epoch": 2250} {"train_loss": -23.930288314819336, "global_step": 186791, "epoch": 2250} {"train_loss": -23.706573486328125, "global_step": 186792, "epoch": 2250} {"train_loss": -24.036951065063477, "global_step": 186793, "epoch": 2250} {"train_loss": -24.088693618774414, "global_step": 186794, "epoch": 2250} {"train_loss": -23.945661544799805, "global_step": 186795, "epoch": 2250} {"train_loss": -23.945066452026367, "global_step": 186796, "epoch": 2250} {"train_loss": -23.899816513061523, "global_step": 186797, "epoch": 2250} {"train_loss": -24.196094512939453, "global_step": 186798, "epoch": 2250} {"train_loss": -23.99640655517578, "global_step": 186799, "epoch": 2250} {"train_loss": -23.959264755249023, "global_step": 186800, "epoch": 2250} {"train_loss": -24.35967445373535, "global_step": 186801, "epoch": 2250} {"train_loss": -23.66971778869629, "global_step": 186802, "epoch": 2250} {"train_loss": -23.994718551635742, "global_step": 186803, "epoch": 2250} {"train_loss": -24.05232048034668, "global_step": 186804, "epoch": 2250} {"train_loss": -24.17328643798828, "global_step": 186805, "epoch": 2250} {"train_loss": -24.112043380737305, "global_step": 186806, "epoch": 2250} {"train_loss": -23.80596351623535, "global_step": 186807, "epoch": 2250} {"train_loss": -23.76207160949707, "global_step": 186808, "epoch": 2250} {"train_loss": -24.08247184753418, "global_step": 186809, "epoch": 2250} {"train_loss": -24.23763084411621, "global_step": 186810, "epoch": 2250} {"train_loss": -24.149320602416992, "global_step": 186811, "epoch": 2250} {"train_loss": -24.071918487548828, "global_step": 186812, "epoch": 2250} {"train_loss": -24.22843360900879, "global_step": 186813, "epoch": 2250} {"train_loss": -23.992910385131836, "global_step": 186814, "epoch": 2250} {"train_loss": -24.180362701416016, "global_step": 186815, "epoch": 2250} {"train_loss": -23.778772354125977, "global_step": 186816, "epoch": 2250} {"train_loss": -23.84026527404785, "global_step": 186817, "epoch": 2250} {"train_loss": -24.005386352539062, "global_step": 186818, "epoch": 2250} {"train_loss": -23.748746871948242, "global_step": 186819, "epoch": 2250} {"train_loss": -23.887258529663086, "global_step": 186820, "epoch": 2250} {"train_loss": -23.825801849365234, "global_step": 186821, "epoch": 2250} {"train_loss": -24.356916427612305, "global_step": 186822, "epoch": 2250} {"train_loss": -24.26259422302246, "global_step": 186823, "epoch": 2250} {"train_loss": -24.363679885864258, "global_step": 186824, "epoch": 2250} {"train_loss": -24.22507095336914, "global_step": 186825, "epoch": 2250} {"train_loss": -24.216754913330078, "global_step": 186826, "epoch": 2250} {"train_loss": -24.25168228149414, "global_step": 186827, "epoch": 2250} {"train_loss": -24.159940719604492, "global_step": 186828, "epoch": 2250} {"train_loss": -24.363323211669922, "global_step": 186829, "epoch": 2250} {"train_loss": -24.26228904724121, "global_step": 186830, "epoch": 2250} {"train_loss": -24.215059280395508, "global_step": 186831, "epoch": 2250} {"train_loss": -23.657452502882624, "global_step": 186832, "epoch": 2250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6517452.0} {"train_loss": -23.801488876342773, "global_step": 186833, "epoch": 2251} {"train_loss": -23.764225006103516, "global_step": 186834, "epoch": 2251} {"train_loss": -23.192886352539062, "global_step": 186835, "epoch": 2251} {"train_loss": -23.88926887512207, "global_step": 186836, "epoch": 2251} {"train_loss": -23.615436553955078, "global_step": 186837, "epoch": 2251} {"train_loss": -23.16290283203125, "global_step": 186838, "epoch": 2251} {"train_loss": -23.902875900268555, "global_step": 186839, "epoch": 2251} {"train_loss": -23.467496871948242, "global_step": 186840, "epoch": 2251} {"train_loss": -23.626399993896484, "global_step": 186841, "epoch": 2251} {"train_loss": -23.95372772216797, "global_step": 186842, "epoch": 2251} {"train_loss": -23.681005477905273, "global_step": 186843, "epoch": 2251} {"train_loss": -23.793642044067383, "global_step": 186844, "epoch": 2251} {"train_loss": -24.13679313659668, "global_step": 186845, "epoch": 2251} {"train_loss": -23.712671279907227, "global_step": 186846, "epoch": 2251} {"train_loss": -23.894575119018555, "global_step": 186847, "epoch": 2251} {"train_loss": -23.6226863861084, "global_step": 186848, "epoch": 2251} {"train_loss": -24.080366134643555, "global_step": 186849, "epoch": 2251} {"train_loss": -24.08090591430664, "global_step": 186850, "epoch": 2251} {"train_loss": -23.61360740661621, "global_step": 186851, "epoch": 2251} {"train_loss": -23.73678970336914, "global_step": 186852, "epoch": 2251} {"train_loss": -23.931062698364258, "global_step": 186853, "epoch": 2251} {"train_loss": -23.75666618347168, "global_step": 186854, "epoch": 2251} {"train_loss": -23.97902488708496, "global_step": 186855, "epoch": 2251} {"train_loss": -23.83267593383789, "global_step": 186856, "epoch": 2251} {"train_loss": -24.222766876220703, "global_step": 186857, "epoch": 2251} {"train_loss": -24.268871307373047, "global_step": 186858, "epoch": 2251} {"train_loss": -24.30971336364746, "global_step": 186859, "epoch": 2251} {"train_loss": -23.959365844726562, "global_step": 186860, "epoch": 2251} {"train_loss": -24.461915969848633, "global_step": 186861, "epoch": 2251} {"train_loss": -24.404794692993164, "global_step": 186862, "epoch": 2251} {"train_loss": -24.175537109375, "global_step": 186863, "epoch": 2251} {"train_loss": -24.112760543823242, "global_step": 186864, "epoch": 2251} {"train_loss": -24.120824813842773, "global_step": 186865, "epoch": 2251} {"train_loss": -23.975046157836914, "global_step": 186866, "epoch": 2251} {"train_loss": -23.937299728393555, "global_step": 186867, "epoch": 2251} {"train_loss": -24.31923484802246, "global_step": 186868, "epoch": 2251} {"train_loss": -24.05759048461914, "global_step": 186869, "epoch": 2251} {"train_loss": -24.157777786254883, "global_step": 186870, "epoch": 2251} {"train_loss": -23.982242584228516, "global_step": 186871, "epoch": 2251} {"train_loss": -24.231143951416016, "global_step": 186872, "epoch": 2251} {"train_loss": -24.379907608032227, "global_step": 186873, "epoch": 2251} {"train_loss": -24.048301696777344, "global_step": 186874, "epoch": 2251} {"train_loss": -23.93427085876465, "global_step": 186875, "epoch": 2251} {"train_loss": -24.164783477783203, "global_step": 186876, "epoch": 2251} {"train_loss": -23.96449851989746, "global_step": 186877, "epoch": 2251} {"train_loss": -24.34491729736328, "global_step": 186878, "epoch": 2251} {"train_loss": -24.088768005371094, "global_step": 186879, "epoch": 2251} {"train_loss": -24.164592742919922, "global_step": 186880, "epoch": 2251} {"train_loss": -23.98672866821289, "global_step": 186881, "epoch": 2251} {"train_loss": -24.037641525268555, "global_step": 186882, "epoch": 2251} {"train_loss": -23.792381286621094, "global_step": 186883, "epoch": 2251} {"train_loss": -23.957595825195312, "global_step": 186884, "epoch": 2251} {"train_loss": -24.022369384765625, "global_step": 186885, "epoch": 2251} {"train_loss": -24.210657119750977, "global_step": 186886, "epoch": 2251} {"train_loss": -24.149099349975586, "global_step": 186887, "epoch": 2251} {"train_loss": -23.94483757019043, "global_step": 186888, "epoch": 2251} {"train_loss": -24.35053062438965, "global_step": 186889, "epoch": 2251} {"train_loss": -24.337711334228516, "global_step": 186890, "epoch": 2251} {"train_loss": -24.133359909057617, "global_step": 186891, "epoch": 2251} {"train_loss": -23.97531509399414, "global_step": 186892, "epoch": 2251} {"train_loss": -24.11050033569336, "global_step": 186893, "epoch": 2251} {"train_loss": -23.98185157775879, "global_step": 186894, "epoch": 2251} {"train_loss": -23.915000915527344, "global_step": 186895, "epoch": 2251} {"train_loss": -24.065540313720703, "global_step": 186896, "epoch": 2251} {"train_loss": -23.88543128967285, "global_step": 186897, "epoch": 2251} {"train_loss": -24.18946647644043, "global_step": 186898, "epoch": 2251} {"train_loss": -24.417890548706055, "global_step": 186899, "epoch": 2251} {"train_loss": -24.02449607849121, "global_step": 186900, "epoch": 2251} {"train_loss": -23.975936889648438, "global_step": 186901, "epoch": 2251} {"train_loss": -24.354978561401367, "global_step": 186902, "epoch": 2251} {"train_loss": -23.849884033203125, "global_step": 186903, "epoch": 2251} {"train_loss": -23.955801010131836, "global_step": 186904, "epoch": 2251} {"train_loss": -23.66570472717285, "global_step": 186905, "epoch": 2251} {"train_loss": -24.339176177978516, "global_step": 186906, "epoch": 2251} {"train_loss": -23.932950973510742, "global_step": 186907, "epoch": 2251} {"train_loss": -23.90291404724121, "global_step": 186908, "epoch": 2251} {"train_loss": -24.278478622436523, "global_step": 186909, "epoch": 2251} {"train_loss": -24.0662784576416, "global_step": 186910, "epoch": 2251} {"train_loss": -24.200952529907227, "global_step": 186911, "epoch": 2251} {"train_loss": -24.484983444213867, "global_step": 186912, "epoch": 2251} {"train_loss": -23.72138786315918, "global_step": 186913, "epoch": 2251} {"train_loss": -24.031864166259766, "global_step": 186914, "epoch": 2251} {"train_loss": -24.01424090833549, "global_step": 186915, "epoch": 2251, "val_loss": 6398947.5} {"train_loss": -23.72138786315918, "global_step": 186916, "epoch": 2252} {"train_loss": -23.629796981811523, "global_step": 186917, "epoch": 2252} {"train_loss": -23.87560272216797, "global_step": 186918, "epoch": 2252} {"train_loss": -23.298999786376953, "global_step": 186919, "epoch": 2252} {"train_loss": -23.473814010620117, "global_step": 186920, "epoch": 2252} {"train_loss": -23.607988357543945, "global_step": 186921, "epoch": 2252} {"train_loss": -23.171483993530273, "global_step": 186922, "epoch": 2252} {"train_loss": -23.599267959594727, "global_step": 186923, "epoch": 2252} {"train_loss": -23.827123641967773, "global_step": 186924, "epoch": 2252} {"train_loss": -23.33555793762207, "global_step": 186925, "epoch": 2252} {"train_loss": -23.604923248291016, "global_step": 186926, "epoch": 2252} {"train_loss": -23.997087478637695, "global_step": 186927, "epoch": 2252} {"train_loss": -24.230009078979492, "global_step": 186928, "epoch": 2252} {"train_loss": -23.993040084838867, "global_step": 186929, "epoch": 2252} {"train_loss": -23.994543075561523, "global_step": 186930, "epoch": 2252} {"train_loss": -23.970138549804688, "global_step": 186931, "epoch": 2252} {"train_loss": -24.31290626525879, "global_step": 186932, "epoch": 2252} {"train_loss": -23.8865966796875, "global_step": 186933, "epoch": 2252} {"train_loss": -24.324121475219727, "global_step": 186934, "epoch": 2252} {"train_loss": -24.067670822143555, "global_step": 186935, "epoch": 2252} {"train_loss": -24.332866668701172, "global_step": 186936, "epoch": 2252} {"train_loss": -24.179513931274414, "global_step": 186937, "epoch": 2252} {"train_loss": -24.192821502685547, "global_step": 186938, "epoch": 2252} {"train_loss": -24.12757682800293, "global_step": 186939, "epoch": 2252} {"train_loss": -24.187387466430664, "global_step": 186940, "epoch": 2252} {"train_loss": -23.8654842376709, "global_step": 186941, "epoch": 2252} {"train_loss": -23.94617462158203, "global_step": 186942, "epoch": 2252} {"train_loss": -23.850255966186523, "global_step": 186943, "epoch": 2252} {"train_loss": -24.097705841064453, "global_step": 186944, "epoch": 2252} {"train_loss": -24.360065460205078, "global_step": 186945, "epoch": 2252} {"train_loss": -24.439987182617188, "global_step": 186946, "epoch": 2252} {"train_loss": -24.107744216918945, "global_step": 186947, "epoch": 2252} {"train_loss": -23.764530181884766, "global_step": 186948, "epoch": 2252} {"train_loss": -23.6854305267334, "global_step": 186949, "epoch": 2252} {"train_loss": -23.536026000976562, "global_step": 186950, "epoch": 2252} {"train_loss": -24.26961326599121, "global_step": 186951, "epoch": 2252} {"train_loss": -24.07101821899414, "global_step": 186952, "epoch": 2252} {"train_loss": -24.318227767944336, "global_step": 186953, "epoch": 2252} {"train_loss": -24.267175674438477, "global_step": 186954, "epoch": 2252} {"train_loss": -24.155902862548828, "global_step": 186955, "epoch": 2252} {"train_loss": -23.858800888061523, "global_step": 186956, "epoch": 2252} {"train_loss": -23.926044464111328, "global_step": 186957, "epoch": 2252} {"train_loss": -24.058374404907227, "global_step": 186958, "epoch": 2252} {"train_loss": -24.001895904541016, "global_step": 186959, "epoch": 2252} {"train_loss": -23.91465187072754, "global_step": 186960, "epoch": 2252} {"train_loss": -24.05547523498535, "global_step": 186961, "epoch": 2252} {"train_loss": -23.965665817260742, "global_step": 186962, "epoch": 2252} {"train_loss": -24.13334846496582, "global_step": 186963, "epoch": 2252} {"train_loss": -24.20018196105957, "global_step": 186964, "epoch": 2252} {"train_loss": -23.909351348876953, "global_step": 186965, "epoch": 2252} {"train_loss": -23.87396812438965, "global_step": 186966, "epoch": 2252} {"train_loss": -24.170766830444336, "global_step": 186967, "epoch": 2252} {"train_loss": -23.901159286499023, "global_step": 186968, "epoch": 2252} {"train_loss": -23.977148056030273, "global_step": 186969, "epoch": 2252} {"train_loss": -23.827054977416992, "global_step": 186970, "epoch": 2252} {"train_loss": -24.508207321166992, "global_step": 186971, "epoch": 2252} {"train_loss": -23.811548233032227, "global_step": 186972, "epoch": 2252} {"train_loss": -23.80103874206543, "global_step": 186973, "epoch": 2252} {"train_loss": -23.463285446166992, "global_step": 186974, "epoch": 2252} {"train_loss": -24.013423919677734, "global_step": 186975, "epoch": 2252} {"train_loss": -24.19515609741211, "global_step": 186976, "epoch": 2252} {"train_loss": -24.13669776916504, "global_step": 186977, "epoch": 2252} {"train_loss": -24.464263916015625, "global_step": 186978, "epoch": 2252} {"train_loss": -24.15117835998535, "global_step": 186979, "epoch": 2252} {"train_loss": -24.48206901550293, "global_step": 186980, "epoch": 2252} {"train_loss": -24.050146102905273, "global_step": 186981, "epoch": 2252} {"train_loss": -24.02921485900879, "global_step": 186982, "epoch": 2252} {"train_loss": -24.039644241333008, "global_step": 186983, "epoch": 2252} {"train_loss": -23.92612648010254, "global_step": 186984, "epoch": 2252} {"train_loss": -24.083229064941406, "global_step": 186985, "epoch": 2252} {"train_loss": -23.690977096557617, "global_step": 186986, "epoch": 2252} {"train_loss": -23.92752456665039, "global_step": 186987, "epoch": 2252} {"train_loss": -24.07576560974121, "global_step": 186988, "epoch": 2252} {"train_loss": -24.219192504882812, "global_step": 186989, "epoch": 2252} {"train_loss": -24.273761749267578, "global_step": 186990, "epoch": 2252} {"train_loss": -24.50324058532715, "global_step": 186991, "epoch": 2252} {"train_loss": -24.36738395690918, "global_step": 186992, "epoch": 2252} {"train_loss": -24.16632080078125, "global_step": 186993, "epoch": 2252} {"train_loss": -24.132492065429688, "global_step": 186994, "epoch": 2252} {"train_loss": -24.085947036743164, "global_step": 186995, "epoch": 2252} {"train_loss": -24.155508041381836, "global_step": 186996, "epoch": 2252} {"train_loss": -24.0184383392334, "global_step": 186997, "epoch": 2252} {"train_loss": -24.00593314113387, "global_step": 186998, "epoch": 2252, "val_loss": 6500494.0} {"train_loss": -23.642908096313477, "global_step": 186999, "epoch": 2253} {"train_loss": -22.992155075073242, "global_step": 187000, "epoch": 2253} {"train_loss": -23.6390323638916, "global_step": 187001, "epoch": 2253} {"train_loss": -23.207170486450195, "global_step": 187002, "epoch": 2253} {"train_loss": -23.39044189453125, "global_step": 187003, "epoch": 2253} {"train_loss": -23.423614501953125, "global_step": 187004, "epoch": 2253} {"train_loss": -23.635934829711914, "global_step": 187005, "epoch": 2253} {"train_loss": -23.860822677612305, "global_step": 187006, "epoch": 2253} {"train_loss": -23.97292137145996, "global_step": 187007, "epoch": 2253} {"train_loss": -24.017393112182617, "global_step": 187008, "epoch": 2253} {"train_loss": -23.76650619506836, "global_step": 187009, "epoch": 2253} {"train_loss": -23.706045150756836, "global_step": 187010, "epoch": 2253} {"train_loss": -23.711999893188477, "global_step": 187011, "epoch": 2253} {"train_loss": -23.634124755859375, "global_step": 187012, "epoch": 2253} {"train_loss": -23.85917091369629, "global_step": 187013, "epoch": 2253} {"train_loss": -24.104400634765625, "global_step": 187014, "epoch": 2253} {"train_loss": -23.826982498168945, "global_step": 187015, "epoch": 2253} {"train_loss": -23.920242309570312, "global_step": 187016, "epoch": 2253} {"train_loss": -24.046058654785156, "global_step": 187017, "epoch": 2253} {"train_loss": -24.272871017456055, "global_step": 187018, "epoch": 2253} {"train_loss": -24.09332275390625, "global_step": 187019, "epoch": 2253} {"train_loss": -24.069721221923828, "global_step": 187020, "epoch": 2253} {"train_loss": -24.236495971679688, "global_step": 187021, "epoch": 2253} {"train_loss": -23.887290954589844, "global_step": 187022, "epoch": 2253} {"train_loss": -23.8737850189209, "global_step": 187023, "epoch": 2253} {"train_loss": -23.677785873413086, "global_step": 187024, "epoch": 2253} {"train_loss": -24.13401222229004, "global_step": 187025, "epoch": 2253} {"train_loss": -24.139114379882812, "global_step": 187026, "epoch": 2253} {"train_loss": -24.14542007446289, "global_step": 187027, "epoch": 2253} {"train_loss": -23.75367546081543, "global_step": 187028, "epoch": 2253} {"train_loss": -24.132009506225586, "global_step": 187029, "epoch": 2253} {"train_loss": -23.910070419311523, "global_step": 187030, "epoch": 2253} {"train_loss": -24.04242515563965, "global_step": 187031, "epoch": 2253} {"train_loss": -23.94235610961914, "global_step": 187032, "epoch": 2253} {"train_loss": -23.950658798217773, "global_step": 187033, "epoch": 2253} {"train_loss": -24.381925582885742, "global_step": 187034, "epoch": 2253} {"train_loss": -24.161123275756836, "global_step": 187035, "epoch": 2253} {"train_loss": -24.36565589904785, "global_step": 187036, "epoch": 2253} {"train_loss": -24.041706085205078, "global_step": 187037, "epoch": 2253} {"train_loss": -23.9943904876709, "global_step": 187038, "epoch": 2253} {"train_loss": -23.794240951538086, "global_step": 187039, "epoch": 2253} {"train_loss": -23.906749725341797, "global_step": 187040, "epoch": 2253} {"train_loss": -24.005210876464844, "global_step": 187041, "epoch": 2253} {"train_loss": -24.038707733154297, "global_step": 187042, "epoch": 2253} {"train_loss": -24.026813507080078, "global_step": 187043, "epoch": 2253} {"train_loss": -24.1153621673584, "global_step": 187044, "epoch": 2253} {"train_loss": -24.247724533081055, "global_step": 187045, "epoch": 2253} {"train_loss": -24.040279388427734, "global_step": 187046, "epoch": 2253} {"train_loss": -23.907794952392578, "global_step": 187047, "epoch": 2253} {"train_loss": -23.81220817565918, "global_step": 187048, "epoch": 2253} {"train_loss": -24.174833297729492, "global_step": 187049, "epoch": 2253} {"train_loss": -23.89406394958496, "global_step": 187050, "epoch": 2253} {"train_loss": -24.300947189331055, "global_step": 187051, "epoch": 2253} {"train_loss": -24.19320297241211, "global_step": 187052, "epoch": 2253} {"train_loss": -24.13261604309082, "global_step": 187053, "epoch": 2253} {"train_loss": -24.32879066467285, "global_step": 187054, "epoch": 2253} {"train_loss": -24.20259666442871, "global_step": 187055, "epoch": 2253} {"train_loss": -24.58715057373047, "global_step": 187056, "epoch": 2253} {"train_loss": -24.04829978942871, "global_step": 187057, "epoch": 2253} {"train_loss": -24.163122177124023, "global_step": 187058, "epoch": 2253} {"train_loss": -24.342304229736328, "global_step": 187059, "epoch": 2253} {"train_loss": -24.062515258789062, "global_step": 187060, "epoch": 2253} {"train_loss": -23.78819465637207, "global_step": 187061, "epoch": 2253} {"train_loss": -23.773101806640625, "global_step": 187062, "epoch": 2253} {"train_loss": -23.769834518432617, "global_step": 187063, "epoch": 2253} {"train_loss": -23.84996795654297, "global_step": 187064, "epoch": 2253} {"train_loss": -23.98433494567871, "global_step": 187065, "epoch": 2253} {"train_loss": -23.855533599853516, "global_step": 187066, "epoch": 2253} {"train_loss": -24.058536529541016, "global_step": 187067, "epoch": 2253} {"train_loss": -23.981658935546875, "global_step": 187068, "epoch": 2253} {"train_loss": -24.15816879272461, "global_step": 187069, "epoch": 2253} {"train_loss": -23.745603561401367, "global_step": 187070, "epoch": 2253} {"train_loss": -23.971607208251953, "global_step": 187071, "epoch": 2253} {"train_loss": -23.465375900268555, "global_step": 187072, "epoch": 2253} {"train_loss": -24.128604888916016, "global_step": 187073, "epoch": 2253} {"train_loss": -24.228513717651367, "global_step": 187074, "epoch": 2253} {"train_loss": -23.90425682067871, "global_step": 187075, "epoch": 2253} {"train_loss": -23.932424545288086, "global_step": 187076, "epoch": 2253} {"train_loss": -24.249969482421875, "global_step": 187077, "epoch": 2253} {"train_loss": -23.87904167175293, "global_step": 187078, "epoch": 2253} {"train_loss": -23.75199317932129, "global_step": 187079, "epoch": 2253} {"train_loss": -23.93064308166504, "global_step": 187080, "epoch": 2253} {"train_loss": -23.949495936014568, "global_step": 187081, "epoch": 2253, "val_loss": 6449813.0} {"train_loss": -23.91798210144043, "global_step": 187082, "epoch": 2254} {"train_loss": -23.736616134643555, "global_step": 187083, "epoch": 2254} {"train_loss": -23.76059341430664, "global_step": 187084, "epoch": 2254} {"train_loss": -23.64583396911621, "global_step": 187085, "epoch": 2254} {"train_loss": -23.705291748046875, "global_step": 187086, "epoch": 2254} {"train_loss": -23.977981567382812, "global_step": 187087, "epoch": 2254} {"train_loss": -23.35638427734375, "global_step": 187088, "epoch": 2254} {"train_loss": -23.564077377319336, "global_step": 187089, "epoch": 2254} {"train_loss": -24.062498092651367, "global_step": 187090, "epoch": 2254} {"train_loss": -23.296239852905273, "global_step": 187091, "epoch": 2254} {"train_loss": -23.678617477416992, "global_step": 187092, "epoch": 2254} {"train_loss": -23.7816219329834, "global_step": 187093, "epoch": 2254} {"train_loss": -23.716793060302734, "global_step": 187094, "epoch": 2254} {"train_loss": -24.00462532043457, "global_step": 187095, "epoch": 2254} {"train_loss": -23.651464462280273, "global_step": 187096, "epoch": 2254} {"train_loss": -24.061132431030273, "global_step": 187097, "epoch": 2254} {"train_loss": -23.829959869384766, "global_step": 187098, "epoch": 2254} {"train_loss": -23.857160568237305, "global_step": 187099, "epoch": 2254} {"train_loss": -23.889049530029297, "global_step": 187100, "epoch": 2254} {"train_loss": -23.77267837524414, "global_step": 187101, "epoch": 2254} {"train_loss": -23.812530517578125, "global_step": 187102, "epoch": 2254} {"train_loss": -23.756593704223633, "global_step": 187103, "epoch": 2254} {"train_loss": -23.74184799194336, "global_step": 187104, "epoch": 2254} {"train_loss": -23.505590438842773, "global_step": 187105, "epoch": 2254} {"train_loss": -23.83282470703125, "global_step": 187106, "epoch": 2254} {"train_loss": -23.66573715209961, "global_step": 187107, "epoch": 2254} {"train_loss": -23.371139526367188, "global_step": 187108, "epoch": 2254} {"train_loss": -23.6470890045166, "global_step": 187109, "epoch": 2254} {"train_loss": -23.6529598236084, "global_step": 187110, "epoch": 2254} {"train_loss": -24.010549545288086, "global_step": 187111, "epoch": 2254} {"train_loss": -24.074392318725586, "global_step": 187112, "epoch": 2254} {"train_loss": -23.72480010986328, "global_step": 187113, "epoch": 2254} {"train_loss": -24.102231979370117, "global_step": 187114, "epoch": 2254} {"train_loss": -23.663549423217773, "global_step": 187115, "epoch": 2254} {"train_loss": -24.027313232421875, "global_step": 187116, "epoch": 2254} {"train_loss": -23.83161735534668, "global_step": 187117, "epoch": 2254} {"train_loss": -24.33210563659668, "global_step": 187118, "epoch": 2254} {"train_loss": -23.935394287109375, "global_step": 187119, "epoch": 2254} {"train_loss": -24.12255859375, "global_step": 187120, "epoch": 2254} {"train_loss": -24.02387809753418, "global_step": 187121, "epoch": 2254} {"train_loss": -24.042112350463867, "global_step": 187122, "epoch": 2254} {"train_loss": -24.112125396728516, "global_step": 187123, "epoch": 2254} {"train_loss": -23.876150131225586, "global_step": 187124, "epoch": 2254} {"train_loss": -23.719324111938477, "global_step": 187125, "epoch": 2254} {"train_loss": -23.666379928588867, "global_step": 187126, "epoch": 2254} {"train_loss": -24.171096801757812, "global_step": 187127, "epoch": 2254} {"train_loss": -24.425443649291992, "global_step": 187128, "epoch": 2254} {"train_loss": -24.46259117126465, "global_step": 187129, "epoch": 2254} {"train_loss": -23.930051803588867, "global_step": 187130, "epoch": 2254} {"train_loss": -24.115697860717773, "global_step": 187131, "epoch": 2254} {"train_loss": -23.89027976989746, "global_step": 187132, "epoch": 2254} {"train_loss": -24.142349243164062, "global_step": 187133, "epoch": 2254} {"train_loss": -24.276466369628906, "global_step": 187134, "epoch": 2254} {"train_loss": -24.138830184936523, "global_step": 187135, "epoch": 2254} {"train_loss": -23.935483932495117, "global_step": 187136, "epoch": 2254} {"train_loss": -24.090906143188477, "global_step": 187137, "epoch": 2254} {"train_loss": -24.456649780273438, "global_step": 187138, "epoch": 2254} {"train_loss": -24.150400161743164, "global_step": 187139, "epoch": 2254} {"train_loss": -24.05452537536621, "global_step": 187140, "epoch": 2254} {"train_loss": -24.567567825317383, "global_step": 187141, "epoch": 2254} {"train_loss": -24.01595115661621, "global_step": 187142, "epoch": 2254} {"train_loss": -24.30075454711914, "global_step": 187143, "epoch": 2254} {"train_loss": -24.312517166137695, "global_step": 187144, "epoch": 2254} {"train_loss": -24.18207359313965, "global_step": 187145, "epoch": 2254} {"train_loss": -24.18861198425293, "global_step": 187146, "epoch": 2254} {"train_loss": -23.896930694580078, "global_step": 187147, "epoch": 2254} {"train_loss": -23.939510345458984, "global_step": 187148, "epoch": 2254} {"train_loss": -24.062551498413086, "global_step": 187149, "epoch": 2254} {"train_loss": -24.291852951049805, "global_step": 187150, "epoch": 2254} {"train_loss": -23.991811752319336, "global_step": 187151, "epoch": 2254} {"train_loss": -24.08210563659668, "global_step": 187152, "epoch": 2254} {"train_loss": -24.105880737304688, "global_step": 187153, "epoch": 2254} {"train_loss": -24.050729751586914, "global_step": 187154, "epoch": 2254} {"train_loss": -23.999420166015625, "global_step": 187155, "epoch": 2254} {"train_loss": -23.9711971282959, "global_step": 187156, "epoch": 2254} {"train_loss": -24.03627586364746, "global_step": 187157, "epoch": 2254} {"train_loss": -24.17772674560547, "global_step": 187158, "epoch": 2254} {"train_loss": -24.324556350708008, "global_step": 187159, "epoch": 2254} {"train_loss": -24.207136154174805, "global_step": 187160, "epoch": 2254} {"train_loss": -23.947803497314453, "global_step": 187161, "epoch": 2254} {"train_loss": -23.893590927124023, "global_step": 187162, "epoch": 2254} {"train_loss": -23.295507431030273, "global_step": 187163, "epoch": 2254} {"train_loss": -23.932266648993433, "global_step": 187164, "epoch": 2254, "val_loss": 6476414.0} {"train_loss": -22.08612632751465, "global_step": 187165, "epoch": 2255} {"train_loss": -22.633865356445312, "global_step": 187166, "epoch": 2255} {"train_loss": -22.939794540405273, "global_step": 187167, "epoch": 2255} {"train_loss": -22.680139541625977, "global_step": 187168, "epoch": 2255} {"train_loss": -22.90778160095215, "global_step": 187169, "epoch": 2255} {"train_loss": -23.144071578979492, "global_step": 187170, "epoch": 2255} {"train_loss": -23.317319869995117, "global_step": 187171, "epoch": 2255} {"train_loss": -22.980310440063477, "global_step": 187172, "epoch": 2255} {"train_loss": -23.322858810424805, "global_step": 187173, "epoch": 2255} {"train_loss": -23.61366081237793, "global_step": 187174, "epoch": 2255} {"train_loss": -23.239810943603516, "global_step": 187175, "epoch": 2255} {"train_loss": -23.384851455688477, "global_step": 187176, "epoch": 2255} {"train_loss": -23.48716163635254, "global_step": 187177, "epoch": 2255} {"train_loss": -23.400938034057617, "global_step": 187178, "epoch": 2255} {"train_loss": -23.545730590820312, "global_step": 187179, "epoch": 2255} {"train_loss": -23.454099655151367, "global_step": 187180, "epoch": 2255} {"train_loss": -23.6757869720459, "global_step": 187181, "epoch": 2255} {"train_loss": -23.71515464782715, "global_step": 187182, "epoch": 2255} {"train_loss": -23.532337188720703, "global_step": 187183, "epoch": 2255} {"train_loss": -23.78697967529297, "global_step": 187184, "epoch": 2255} {"train_loss": -23.893049240112305, "global_step": 187185, "epoch": 2255} {"train_loss": -24.012842178344727, "global_step": 187186, "epoch": 2255} {"train_loss": -23.656179428100586, "global_step": 187187, "epoch": 2255} {"train_loss": -23.837291717529297, "global_step": 187188, "epoch": 2255} {"train_loss": -23.865509033203125, "global_step": 187189, "epoch": 2255} {"train_loss": -23.667333602905273, "global_step": 187190, "epoch": 2255} {"train_loss": -23.664724349975586, "global_step": 187191, "epoch": 2255} {"train_loss": -23.994688034057617, "global_step": 187192, "epoch": 2255} {"train_loss": -23.713661193847656, "global_step": 187193, "epoch": 2255} {"train_loss": -23.6402587890625, "global_step": 187194, "epoch": 2255} {"train_loss": -23.90899658203125, "global_step": 187195, "epoch": 2255} {"train_loss": -23.809547424316406, "global_step": 187196, "epoch": 2255} {"train_loss": -23.786352157592773, "global_step": 187197, "epoch": 2255} {"train_loss": -23.571256637573242, "global_step": 187198, "epoch": 2255} {"train_loss": -23.890228271484375, "global_step": 187199, "epoch": 2255} {"train_loss": -24.226730346679688, "global_step": 187200, "epoch": 2255} {"train_loss": -23.944561004638672, "global_step": 187201, "epoch": 2255} {"train_loss": -24.07573890686035, "global_step": 187202, "epoch": 2255} {"train_loss": -24.286441802978516, "global_step": 187203, "epoch": 2255} {"train_loss": -24.19097900390625, "global_step": 187204, "epoch": 2255} {"train_loss": -24.36368751525879, "global_step": 187205, "epoch": 2255} {"train_loss": -24.134042739868164, "global_step": 187206, "epoch": 2255} {"train_loss": -23.86790657043457, "global_step": 187207, "epoch": 2255} {"train_loss": -24.374082565307617, "global_step": 187208, "epoch": 2255} {"train_loss": -23.842790603637695, "global_step": 187209, "epoch": 2255} {"train_loss": -23.96466636657715, "global_step": 187210, "epoch": 2255} {"train_loss": -24.119123458862305, "global_step": 187211, "epoch": 2255} {"train_loss": -23.762514114379883, "global_step": 187212, "epoch": 2255} {"train_loss": -23.795434951782227, "global_step": 187213, "epoch": 2255} {"train_loss": -24.146390914916992, "global_step": 187214, "epoch": 2255} {"train_loss": -24.26956558227539, "global_step": 187215, "epoch": 2255} {"train_loss": -24.336668014526367, "global_step": 187216, "epoch": 2255} {"train_loss": -23.984113693237305, "global_step": 187217, "epoch": 2255} {"train_loss": -23.71143913269043, "global_step": 187218, "epoch": 2255} {"train_loss": -24.22564697265625, "global_step": 187219, "epoch": 2255} {"train_loss": -24.139617919921875, "global_step": 187220, "epoch": 2255} {"train_loss": -24.022918701171875, "global_step": 187221, "epoch": 2255} {"train_loss": -23.64432144165039, "global_step": 187222, "epoch": 2255} {"train_loss": -24.0678768157959, "global_step": 187223, "epoch": 2255} {"train_loss": -23.979772567749023, "global_step": 187224, "epoch": 2255} {"train_loss": -24.1939754486084, "global_step": 187225, "epoch": 2255} {"train_loss": -23.669513702392578, "global_step": 187226, "epoch": 2255} {"train_loss": -23.810739517211914, "global_step": 187227, "epoch": 2255} {"train_loss": -24.1883602142334, "global_step": 187228, "epoch": 2255} {"train_loss": -24.029449462890625, "global_step": 187229, "epoch": 2255} {"train_loss": -23.881229400634766, "global_step": 187230, "epoch": 2255} {"train_loss": -24.074737548828125, "global_step": 187231, "epoch": 2255} {"train_loss": -23.756914138793945, "global_step": 187232, "epoch": 2255} {"train_loss": -24.223766326904297, "global_step": 187233, "epoch": 2255} {"train_loss": -24.120664596557617, "global_step": 187234, "epoch": 2255} {"train_loss": -24.335933685302734, "global_step": 187235, "epoch": 2255} {"train_loss": -24.292104721069336, "global_step": 187236, "epoch": 2255} {"train_loss": -24.12513542175293, "global_step": 187237, "epoch": 2255} {"train_loss": -24.103086471557617, "global_step": 187238, "epoch": 2255} {"train_loss": -24.062658309936523, "global_step": 187239, "epoch": 2255} {"train_loss": -23.83737564086914, "global_step": 187240, "epoch": 2255} {"train_loss": -24.070158004760742, "global_step": 187241, "epoch": 2255} {"train_loss": -24.053632736206055, "global_step": 187242, "epoch": 2255} {"train_loss": -24.302539825439453, "global_step": 187243, "epoch": 2255} {"train_loss": -24.07834815979004, "global_step": 187244, "epoch": 2255} {"train_loss": -24.33397674560547, "global_step": 187245, "epoch": 2255} {"train_loss": -24.334108352661133, "global_step": 187246, "epoch": 2255} {"train_loss": -23.819699827446996, "global_step": 187247, "epoch": 2255, "val_loss": 6384726.0} {"train_loss": -23.31454086303711, "global_step": 187248, "epoch": 2256} {"train_loss": -24.261112213134766, "global_step": 187249, "epoch": 2256} {"train_loss": -23.683408737182617, "global_step": 187250, "epoch": 2256} {"train_loss": -23.60995864868164, "global_step": 187251, "epoch": 2256} {"train_loss": -24.195871353149414, "global_step": 187252, "epoch": 2256} {"train_loss": -23.068967819213867, "global_step": 187253, "epoch": 2256} {"train_loss": -23.63934898376465, "global_step": 187254, "epoch": 2256} {"train_loss": -23.891769409179688, "global_step": 187255, "epoch": 2256} {"train_loss": -23.718860626220703, "global_step": 187256, "epoch": 2256} {"train_loss": -23.560178756713867, "global_step": 187257, "epoch": 2256} {"train_loss": -23.624032974243164, "global_step": 187258, "epoch": 2256} {"train_loss": -23.656339645385742, "global_step": 187259, "epoch": 2256} {"train_loss": -23.93293571472168, "global_step": 187260, "epoch": 2256} {"train_loss": -23.53476333618164, "global_step": 187261, "epoch": 2256} {"train_loss": -23.607812881469727, "global_step": 187262, "epoch": 2256} {"train_loss": -23.680517196655273, "global_step": 187263, "epoch": 2256} {"train_loss": -24.018369674682617, "global_step": 187264, "epoch": 2256} {"train_loss": -23.765365600585938, "global_step": 187265, "epoch": 2256} {"train_loss": -24.189727783203125, "global_step": 187266, "epoch": 2256} {"train_loss": -23.51502799987793, "global_step": 187267, "epoch": 2256} {"train_loss": -23.724498748779297, "global_step": 187268, "epoch": 2256} {"train_loss": -23.708904266357422, "global_step": 187269, "epoch": 2256} {"train_loss": -23.662065505981445, "global_step": 187270, "epoch": 2256} {"train_loss": -24.166019439697266, "global_step": 187271, "epoch": 2256} {"train_loss": -24.009403228759766, "global_step": 187272, "epoch": 2256} {"train_loss": -24.117944717407227, "global_step": 187273, "epoch": 2256} {"train_loss": -23.763669967651367, "global_step": 187274, "epoch": 2256} {"train_loss": -23.75197410583496, "global_step": 187275, "epoch": 2256} {"train_loss": -23.808576583862305, "global_step": 187276, "epoch": 2256} {"train_loss": -23.94124984741211, "global_step": 187277, "epoch": 2256} {"train_loss": -23.68531608581543, "global_step": 187278, "epoch": 2256} {"train_loss": -23.970861434936523, "global_step": 187279, "epoch": 2256} {"train_loss": -24.08424949645996, "global_step": 187280, "epoch": 2256} {"train_loss": -23.94740104675293, "global_step": 187281, "epoch": 2256} {"train_loss": -23.70699119567871, "global_step": 187282, "epoch": 2256} {"train_loss": -24.220050811767578, "global_step": 187283, "epoch": 2256} {"train_loss": -23.66688346862793, "global_step": 187284, "epoch": 2256} {"train_loss": -24.0018367767334, "global_step": 187285, "epoch": 2256} {"train_loss": -23.92437171936035, "global_step": 187286, "epoch": 2256} {"train_loss": -23.95192527770996, "global_step": 187287, "epoch": 2256} {"train_loss": -23.7572021484375, "global_step": 187288, "epoch": 2256} {"train_loss": -24.070594787597656, "global_step": 187289, "epoch": 2256} {"train_loss": -23.922653198242188, "global_step": 187290, "epoch": 2256} {"train_loss": -23.721773147583008, "global_step": 187291, "epoch": 2256} {"train_loss": -24.103580474853516, "global_step": 187292, "epoch": 2256} {"train_loss": -24.12712287902832, "global_step": 187293, "epoch": 2256} {"train_loss": -24.000699996948242, "global_step": 187294, "epoch": 2256} {"train_loss": -24.029367446899414, "global_step": 187295, "epoch": 2256} {"train_loss": -24.029268264770508, "global_step": 187296, "epoch": 2256} {"train_loss": -23.768489837646484, "global_step": 187297, "epoch": 2256} {"train_loss": -24.17844581604004, "global_step": 187298, "epoch": 2256} {"train_loss": -24.071496963500977, "global_step": 187299, "epoch": 2256} {"train_loss": -24.1333065032959, "global_step": 187300, "epoch": 2256} {"train_loss": -23.783123016357422, "global_step": 187301, "epoch": 2256} {"train_loss": -23.77579116821289, "global_step": 187302, "epoch": 2256} {"train_loss": -24.092992782592773, "global_step": 187303, "epoch": 2256} {"train_loss": -23.747522354125977, "global_step": 187304, "epoch": 2256} {"train_loss": -23.725027084350586, "global_step": 187305, "epoch": 2256} {"train_loss": -24.071279525756836, "global_step": 187306, "epoch": 2256} {"train_loss": -23.479415893554688, "global_step": 187307, "epoch": 2256} {"train_loss": -23.768198013305664, "global_step": 187308, "epoch": 2256} {"train_loss": -23.7110652923584, "global_step": 187309, "epoch": 2256} {"train_loss": -24.160306930541992, "global_step": 187310, "epoch": 2256} {"train_loss": -23.72444725036621, "global_step": 187311, "epoch": 2256} {"train_loss": -23.604955673217773, "global_step": 187312, "epoch": 2256} {"train_loss": -24.041963577270508, "global_step": 187313, "epoch": 2256} {"train_loss": -23.714027404785156, "global_step": 187314, "epoch": 2256} {"train_loss": -24.06325340270996, "global_step": 187315, "epoch": 2256} {"train_loss": -23.867450714111328, "global_step": 187316, "epoch": 2256} {"train_loss": -24.016881942749023, "global_step": 187317, "epoch": 2256} {"train_loss": -23.996740341186523, "global_step": 187318, "epoch": 2256} {"train_loss": -23.851348876953125, "global_step": 187319, "epoch": 2256} {"train_loss": -23.745338439941406, "global_step": 187320, "epoch": 2256} {"train_loss": -24.078500747680664, "global_step": 187321, "epoch": 2256} {"train_loss": -23.74104118347168, "global_step": 187322, "epoch": 2256} {"train_loss": -24.263235092163086, "global_step": 187323, "epoch": 2256} {"train_loss": -24.232501983642578, "global_step": 187324, "epoch": 2256} {"train_loss": -23.999786376953125, "global_step": 187325, "epoch": 2256} {"train_loss": -23.791732788085938, "global_step": 187326, "epoch": 2256} {"train_loss": -24.152908325195312, "global_step": 187327, "epoch": 2256} {"train_loss": -24.505041122436523, "global_step": 187328, "epoch": 2256} {"train_loss": -23.896121978759766, "global_step": 187329, "epoch": 2256} {"train_loss": -23.883482186191053, "global_step": 187330, "epoch": 2256, "val_loss": 6416300.0} {"train_loss": -23.180768966674805, "global_step": 187331, "epoch": 2257} {"train_loss": -23.727705001831055, "global_step": 187332, "epoch": 2257} {"train_loss": -23.215946197509766, "global_step": 187333, "epoch": 2257} {"train_loss": -23.833499908447266, "global_step": 187334, "epoch": 2257} {"train_loss": -23.758089065551758, "global_step": 187335, "epoch": 2257} {"train_loss": -23.15643882751465, "global_step": 187336, "epoch": 2257} {"train_loss": -23.729223251342773, "global_step": 187337, "epoch": 2257} {"train_loss": -23.318559646606445, "global_step": 187338, "epoch": 2257} {"train_loss": -23.616987228393555, "global_step": 187339, "epoch": 2257} {"train_loss": -23.60989761352539, "global_step": 187340, "epoch": 2257} {"train_loss": -23.471487045288086, "global_step": 187341, "epoch": 2257} {"train_loss": -23.660070419311523, "global_step": 187342, "epoch": 2257} {"train_loss": -23.951915740966797, "global_step": 187343, "epoch": 2257} {"train_loss": -23.844316482543945, "global_step": 187344, "epoch": 2257} {"train_loss": -23.41937255859375, "global_step": 187345, "epoch": 2257} {"train_loss": -23.988792419433594, "global_step": 187346, "epoch": 2257} {"train_loss": -24.030763626098633, "global_step": 187347, "epoch": 2257} {"train_loss": -23.877347946166992, "global_step": 187348, "epoch": 2257} {"train_loss": -24.142351150512695, "global_step": 187349, "epoch": 2257} {"train_loss": -23.587961196899414, "global_step": 187350, "epoch": 2257} {"train_loss": -24.07895851135254, "global_step": 187351, "epoch": 2257} {"train_loss": -23.91532325744629, "global_step": 187352, "epoch": 2257} {"train_loss": -24.193286895751953, "global_step": 187353, "epoch": 2257} {"train_loss": -23.68573570251465, "global_step": 187354, "epoch": 2257} {"train_loss": -24.130340576171875, "global_step": 187355, "epoch": 2257} {"train_loss": -24.113004684448242, "global_step": 187356, "epoch": 2257} {"train_loss": -23.719627380371094, "global_step": 187357, "epoch": 2257} {"train_loss": -24.1654109954834, "global_step": 187358, "epoch": 2257} {"train_loss": -24.139602661132812, "global_step": 187359, "epoch": 2257} {"train_loss": -24.058523178100586, "global_step": 187360, "epoch": 2257} {"train_loss": -24.055585861206055, "global_step": 187361, "epoch": 2257} {"train_loss": -24.14046287536621, "global_step": 187362, "epoch": 2257} {"train_loss": -24.233739852905273, "global_step": 187363, "epoch": 2257} {"train_loss": -23.96241569519043, "global_step": 187364, "epoch": 2257} {"train_loss": -24.188745498657227, "global_step": 187365, "epoch": 2257} {"train_loss": -23.986379623413086, "global_step": 187366, "epoch": 2257} {"train_loss": -24.359453201293945, "global_step": 187367, "epoch": 2257} {"train_loss": -24.131528854370117, "global_step": 187368, "epoch": 2257} {"train_loss": -23.7033634185791, "global_step": 187369, "epoch": 2257} {"train_loss": -24.3255558013916, "global_step": 187370, "epoch": 2257} {"train_loss": -23.92804718017578, "global_step": 187371, "epoch": 2257} {"train_loss": -24.343055725097656, "global_step": 187372, "epoch": 2257} {"train_loss": -24.075529098510742, "global_step": 187373, "epoch": 2257} {"train_loss": -24.146604537963867, "global_step": 187374, "epoch": 2257} {"train_loss": -24.222219467163086, "global_step": 187375, "epoch": 2257} {"train_loss": -24.047887802124023, "global_step": 187376, "epoch": 2257} {"train_loss": -24.271621704101562, "global_step": 187377, "epoch": 2257} {"train_loss": -24.185272216796875, "global_step": 187378, "epoch": 2257} {"train_loss": -24.219457626342773, "global_step": 187379, "epoch": 2257} {"train_loss": -24.039274215698242, "global_step": 187380, "epoch": 2257} {"train_loss": -24.022092819213867, "global_step": 187381, "epoch": 2257} {"train_loss": -24.077619552612305, "global_step": 187382, "epoch": 2257} {"train_loss": -24.42043113708496, "global_step": 187383, "epoch": 2257} {"train_loss": -24.222883224487305, "global_step": 187384, "epoch": 2257} {"train_loss": -24.204986572265625, "global_step": 187385, "epoch": 2257} {"train_loss": -23.80464744567871, "global_step": 187386, "epoch": 2257} {"train_loss": -23.859825134277344, "global_step": 187387, "epoch": 2257} {"train_loss": -23.816448211669922, "global_step": 187388, "epoch": 2257} {"train_loss": -23.330991744995117, "global_step": 187389, "epoch": 2257} {"train_loss": -23.728723526000977, "global_step": 187390, "epoch": 2257} {"train_loss": -24.34084129333496, "global_step": 187391, "epoch": 2257} {"train_loss": -24.325666427612305, "global_step": 187392, "epoch": 2257} {"train_loss": -23.94606590270996, "global_step": 187393, "epoch": 2257} {"train_loss": -23.57615852355957, "global_step": 187394, "epoch": 2257} {"train_loss": -23.800270080566406, "global_step": 187395, "epoch": 2257} {"train_loss": -23.987201690673828, "global_step": 187396, "epoch": 2257} {"train_loss": -24.551105499267578, "global_step": 187397, "epoch": 2257} {"train_loss": -23.879867553710938, "global_step": 187398, "epoch": 2257} {"train_loss": -23.752187728881836, "global_step": 187399, "epoch": 2257} {"train_loss": -23.910337448120117, "global_step": 187400, "epoch": 2257} {"train_loss": -23.954580307006836, "global_step": 187401, "epoch": 2257} {"train_loss": -23.792606353759766, "global_step": 187402, "epoch": 2257} {"train_loss": -23.994064331054688, "global_step": 187403, "epoch": 2257} {"train_loss": -23.98988151550293, "global_step": 187404, "epoch": 2257} {"train_loss": -24.02520179748535, "global_step": 187405, "epoch": 2257} {"train_loss": -24.19131851196289, "global_step": 187406, "epoch": 2257} {"train_loss": -24.02969741821289, "global_step": 187407, "epoch": 2257} {"train_loss": -24.26848793029785, "global_step": 187408, "epoch": 2257} {"train_loss": -24.17243003845215, "global_step": 187409, "epoch": 2257} {"train_loss": -24.14520835876465, "global_step": 187410, "epoch": 2257} {"train_loss": -23.91751480102539, "global_step": 187411, "epoch": 2257} {"train_loss": -23.99150276184082, "global_step": 187412, "epoch": 2257} {"train_loss": -23.95946789936847, "global_step": 187413, "epoch": 2257, "val_loss": 6502761.5} {"train_loss": -23.911094665527344, "global_step": 187414, "epoch": 2258} {"train_loss": -24.176559448242188, "global_step": 187415, "epoch": 2258} {"train_loss": -24.109695434570312, "global_step": 187416, "epoch": 2258} {"train_loss": -24.424097061157227, "global_step": 187417, "epoch": 2258} {"train_loss": -23.86441993713379, "global_step": 187418, "epoch": 2258} {"train_loss": -23.826749801635742, "global_step": 187419, "epoch": 2258} {"train_loss": -23.74797821044922, "global_step": 187420, "epoch": 2258} {"train_loss": -24.013872146606445, "global_step": 187421, "epoch": 2258} {"train_loss": -23.899938583374023, "global_step": 187422, "epoch": 2258} {"train_loss": -23.957534790039062, "global_step": 187423, "epoch": 2258} {"train_loss": -23.812902450561523, "global_step": 187424, "epoch": 2258} {"train_loss": -23.7821102142334, "global_step": 187425, "epoch": 2258} {"train_loss": -23.77223014831543, "global_step": 187426, "epoch": 2258} {"train_loss": -24.121009826660156, "global_step": 187427, "epoch": 2258} {"train_loss": -24.090585708618164, "global_step": 187428, "epoch": 2258} {"train_loss": -24.012042999267578, "global_step": 187429, "epoch": 2258} {"train_loss": -23.734235763549805, "global_step": 187430, "epoch": 2258} {"train_loss": -24.050525665283203, "global_step": 187431, "epoch": 2258} {"train_loss": -23.71965217590332, "global_step": 187432, "epoch": 2258} {"train_loss": -24.127307891845703, "global_step": 187433, "epoch": 2258} {"train_loss": -23.921228408813477, "global_step": 187434, "epoch": 2258} {"train_loss": -23.587738037109375, "global_step": 187435, "epoch": 2258} {"train_loss": -23.797693252563477, "global_step": 187436, "epoch": 2258} {"train_loss": -23.929136276245117, "global_step": 187437, "epoch": 2258} {"train_loss": -23.79562759399414, "global_step": 187438, "epoch": 2258} {"train_loss": -24.092269897460938, "global_step": 187439, "epoch": 2258} {"train_loss": -24.52620506286621, "global_step": 187440, "epoch": 2258} {"train_loss": -23.945764541625977, "global_step": 187441, "epoch": 2258} {"train_loss": -24.22688865661621, "global_step": 187442, "epoch": 2258} {"train_loss": -23.876602172851562, "global_step": 187443, "epoch": 2258} {"train_loss": -24.174436569213867, "global_step": 187444, "epoch": 2258} {"train_loss": -24.040815353393555, "global_step": 187445, "epoch": 2258} {"train_loss": -23.908601760864258, "global_step": 187446, "epoch": 2258} {"train_loss": -24.03519630432129, "global_step": 187447, "epoch": 2258} {"train_loss": -23.851289749145508, "global_step": 187448, "epoch": 2258} {"train_loss": -23.486373901367188, "global_step": 187449, "epoch": 2258} {"train_loss": -24.187620162963867, "global_step": 187450, "epoch": 2258} {"train_loss": -24.217395782470703, "global_step": 187451, "epoch": 2258} {"train_loss": -24.05710792541504, "global_step": 187452, "epoch": 2258} {"train_loss": -23.96400260925293, "global_step": 187453, "epoch": 2258} {"train_loss": -23.977508544921875, "global_step": 187454, "epoch": 2258} {"train_loss": -23.79079246520996, "global_step": 187455, "epoch": 2258} {"train_loss": -23.803464889526367, "global_step": 187456, "epoch": 2258} {"train_loss": -23.896039962768555, "global_step": 187457, "epoch": 2258} {"train_loss": -24.441511154174805, "global_step": 187458, "epoch": 2258} {"train_loss": -24.072839736938477, "global_step": 187459, "epoch": 2258} {"train_loss": -23.946863174438477, "global_step": 187460, "epoch": 2258} {"train_loss": -24.465055465698242, "global_step": 187461, "epoch": 2258} {"train_loss": -24.197134017944336, "global_step": 187462, "epoch": 2258} {"train_loss": -24.252593994140625, "global_step": 187463, "epoch": 2258} {"train_loss": -24.071401596069336, "global_step": 187464, "epoch": 2258} {"train_loss": -23.90032196044922, "global_step": 187465, "epoch": 2258} {"train_loss": -24.179706573486328, "global_step": 187466, "epoch": 2258} {"train_loss": -24.35295295715332, "global_step": 187467, "epoch": 2258} {"train_loss": -24.185264587402344, "global_step": 187468, "epoch": 2258} {"train_loss": -23.967941284179688, "global_step": 187469, "epoch": 2258} {"train_loss": -24.039304733276367, "global_step": 187470, "epoch": 2258} {"train_loss": -23.741199493408203, "global_step": 187471, "epoch": 2258} {"train_loss": -23.84699821472168, "global_step": 187472, "epoch": 2258} {"train_loss": -23.96429443359375, "global_step": 187473, "epoch": 2258} {"train_loss": -23.863819122314453, "global_step": 187474, "epoch": 2258} {"train_loss": -24.158674240112305, "global_step": 187475, "epoch": 2258} {"train_loss": -24.103742599487305, "global_step": 187476, "epoch": 2258} {"train_loss": -24.481781005859375, "global_step": 187477, "epoch": 2258} {"train_loss": -24.099853515625, "global_step": 187478, "epoch": 2258} {"train_loss": -24.03973960876465, "global_step": 187479, "epoch": 2258} {"train_loss": -23.581079483032227, "global_step": 187480, "epoch": 2258} {"train_loss": -23.64970588684082, "global_step": 187481, "epoch": 2258} {"train_loss": -23.509952545166016, "global_step": 187482, "epoch": 2258} {"train_loss": -24.083433151245117, "global_step": 187483, "epoch": 2258} {"train_loss": -24.04120635986328, "global_step": 187484, "epoch": 2258} {"train_loss": -23.94803237915039, "global_step": 187485, "epoch": 2258} {"train_loss": -23.837116241455078, "global_step": 187486, "epoch": 2258} {"train_loss": -23.723600387573242, "global_step": 187487, "epoch": 2258} {"train_loss": -24.27162742614746, "global_step": 187488, "epoch": 2258} {"train_loss": -23.922353744506836, "global_step": 187489, "epoch": 2258} {"train_loss": -23.939985275268555, "global_step": 187490, "epoch": 2258} {"train_loss": -24.149953842163086, "global_step": 187491, "epoch": 2258} {"train_loss": -23.809402465820312, "global_step": 187492, "epoch": 2258} {"train_loss": -24.152746200561523, "global_step": 187493, "epoch": 2258} {"train_loss": -24.27023696899414, "global_step": 187494, "epoch": 2258} {"train_loss": -24.030248641967773, "global_step": 187495, "epoch": 2258} {"train_loss": -23.996139319546252, "global_step": 187496, "epoch": 2258, "val_loss": 6522827.0} {"train_loss": -23.45624351501465, "global_step": 187497, "epoch": 2259} {"train_loss": -23.66583251953125, "global_step": 187498, "epoch": 2259} {"train_loss": -23.88370132446289, "global_step": 187499, "epoch": 2259} {"train_loss": -23.262174606323242, "global_step": 187500, "epoch": 2259} {"train_loss": -23.689823150634766, "global_step": 187501, "epoch": 2259} {"train_loss": -23.842248916625977, "global_step": 187502, "epoch": 2259} {"train_loss": -24.12650489807129, "global_step": 187503, "epoch": 2259} {"train_loss": -24.224079132080078, "global_step": 187504, "epoch": 2259} {"train_loss": -24.29324722290039, "global_step": 187505, "epoch": 2259} {"train_loss": -23.94294548034668, "global_step": 187506, "epoch": 2259} {"train_loss": -23.9151611328125, "global_step": 187507, "epoch": 2259} {"train_loss": -23.940603256225586, "global_step": 187508, "epoch": 2259} {"train_loss": -23.640640258789062, "global_step": 187509, "epoch": 2259} {"train_loss": -24.133331298828125, "global_step": 187510, "epoch": 2259} {"train_loss": -24.115802764892578, "global_step": 187511, "epoch": 2259} {"train_loss": -24.02452278137207, "global_step": 187512, "epoch": 2259} {"train_loss": -23.772432327270508, "global_step": 187513, "epoch": 2259} {"train_loss": -23.997461318969727, "global_step": 187514, "epoch": 2259} {"train_loss": -24.11907386779785, "global_step": 187515, "epoch": 2259} {"train_loss": -24.065872192382812, "global_step": 187516, "epoch": 2259} {"train_loss": -23.622699737548828, "global_step": 187517, "epoch": 2259} {"train_loss": -24.09257698059082, "global_step": 187518, "epoch": 2259} {"train_loss": -24.239898681640625, "global_step": 187519, "epoch": 2259} {"train_loss": -23.896787643432617, "global_step": 187520, "epoch": 2259} {"train_loss": -23.9606990814209, "global_step": 187521, "epoch": 2259} {"train_loss": -23.821372985839844, "global_step": 187522, "epoch": 2259} {"train_loss": -24.011829376220703, "global_step": 187523, "epoch": 2259} {"train_loss": -23.717565536499023, "global_step": 187524, "epoch": 2259} {"train_loss": -24.11090660095215, "global_step": 187525, "epoch": 2259} {"train_loss": -23.82960319519043, "global_step": 187526, "epoch": 2259} {"train_loss": -24.1737117767334, "global_step": 187527, "epoch": 2259} {"train_loss": -24.414112091064453, "global_step": 187528, "epoch": 2259} {"train_loss": -23.907608032226562, "global_step": 187529, "epoch": 2259} {"train_loss": -23.898900985717773, "global_step": 187530, "epoch": 2259} {"train_loss": -23.881994247436523, "global_step": 187531, "epoch": 2259} {"train_loss": -24.541105270385742, "global_step": 187532, "epoch": 2259} {"train_loss": -23.879175186157227, "global_step": 187533, "epoch": 2259} {"train_loss": -24.311017990112305, "global_step": 187534, "epoch": 2259} {"train_loss": -23.950754165649414, "global_step": 187535, "epoch": 2259} {"train_loss": -24.359140396118164, "global_step": 187536, "epoch": 2259} {"train_loss": -24.1386661529541, "global_step": 187537, "epoch": 2259} {"train_loss": -24.1218318939209, "global_step": 187538, "epoch": 2259} {"train_loss": -23.518596649169922, "global_step": 187539, "epoch": 2259} {"train_loss": -24.067506790161133, "global_step": 187540, "epoch": 2259} {"train_loss": -24.106536865234375, "global_step": 187541, "epoch": 2259} {"train_loss": -23.523273468017578, "global_step": 187542, "epoch": 2259} {"train_loss": -23.54043197631836, "global_step": 187543, "epoch": 2259} {"train_loss": -23.816673278808594, "global_step": 187544, "epoch": 2259} {"train_loss": -23.903287887573242, "global_step": 187545, "epoch": 2259} {"train_loss": -23.58844566345215, "global_step": 187546, "epoch": 2259} {"train_loss": -23.880590438842773, "global_step": 187547, "epoch": 2259} {"train_loss": -24.06654930114746, "global_step": 187548, "epoch": 2259} {"train_loss": -24.043119430541992, "global_step": 187549, "epoch": 2259} {"train_loss": -23.667068481445312, "global_step": 187550, "epoch": 2259} {"train_loss": -23.917633056640625, "global_step": 187551, "epoch": 2259} {"train_loss": -24.210859298706055, "global_step": 187552, "epoch": 2259} {"train_loss": -24.170194625854492, "global_step": 187553, "epoch": 2259} {"train_loss": -24.2171688079834, "global_step": 187554, "epoch": 2259} {"train_loss": -23.9952449798584, "global_step": 187555, "epoch": 2259} {"train_loss": -23.617233276367188, "global_step": 187556, "epoch": 2259} {"train_loss": -24.091650009155273, "global_step": 187557, "epoch": 2259} {"train_loss": -23.84429359436035, "global_step": 187558, "epoch": 2259} {"train_loss": -24.481081008911133, "global_step": 187559, "epoch": 2259} {"train_loss": -24.091907501220703, "global_step": 187560, "epoch": 2259} {"train_loss": -23.94337272644043, "global_step": 187561, "epoch": 2259} {"train_loss": -24.03754997253418, "global_step": 187562, "epoch": 2259} {"train_loss": -23.903961181640625, "global_step": 187563, "epoch": 2259} {"train_loss": -23.967199325561523, "global_step": 187564, "epoch": 2259} {"train_loss": -24.028615951538086, "global_step": 187565, "epoch": 2259} {"train_loss": -24.219825744628906, "global_step": 187566, "epoch": 2259} {"train_loss": -23.868499755859375, "global_step": 187567, "epoch": 2259} {"train_loss": -23.923858642578125, "global_step": 187568, "epoch": 2259} {"train_loss": -24.411771774291992, "global_step": 187569, "epoch": 2259} {"train_loss": -24.475997924804688, "global_step": 187570, "epoch": 2259} {"train_loss": -23.934316635131836, "global_step": 187571, "epoch": 2259} {"train_loss": -24.0824031829834, "global_step": 187572, "epoch": 2259} {"train_loss": -23.938940048217773, "global_step": 187573, "epoch": 2259} {"train_loss": -23.984180450439453, "global_step": 187574, "epoch": 2259} {"train_loss": -24.256628036499023, "global_step": 187575, "epoch": 2259} {"train_loss": -24.066059112548828, "global_step": 187576, "epoch": 2259} {"train_loss": -24.150259017944336, "global_step": 187577, "epoch": 2259} {"train_loss": -24.029373168945312, "global_step": 187578, "epoch": 2259} {"train_loss": -23.98534407098609, "global_step": 187579, "epoch": 2259, "val_loss": 6479820.0} {"train_loss": -22.337854385375977, "global_step": 187580, "epoch": 2260} {"train_loss": -22.92498779296875, "global_step": 187581, "epoch": 2260} {"train_loss": -22.538833618164062, "global_step": 187582, "epoch": 2260} {"train_loss": -23.017189025878906, "global_step": 187583, "epoch": 2260} {"train_loss": -22.59893226623535, "global_step": 187584, "epoch": 2260} {"train_loss": -23.500782012939453, "global_step": 187585, "epoch": 2260} {"train_loss": -23.05158233642578, "global_step": 187586, "epoch": 2260} {"train_loss": -22.930654525756836, "global_step": 187587, "epoch": 2260} {"train_loss": -23.305150985717773, "global_step": 187588, "epoch": 2260} {"train_loss": -22.563936233520508, "global_step": 187589, "epoch": 2260} {"train_loss": -23.37439727783203, "global_step": 187590, "epoch": 2260} {"train_loss": -23.134647369384766, "global_step": 187591, "epoch": 2260} {"train_loss": -23.055957794189453, "global_step": 187592, "epoch": 2260} {"train_loss": -23.43939208984375, "global_step": 187593, "epoch": 2260} {"train_loss": -23.34027099609375, "global_step": 187594, "epoch": 2260} {"train_loss": -23.450292587280273, "global_step": 187595, "epoch": 2260} {"train_loss": -23.495603561401367, "global_step": 187596, "epoch": 2260} {"train_loss": -23.345300674438477, "global_step": 187597, "epoch": 2260} {"train_loss": -23.31887435913086, "global_step": 187598, "epoch": 2260} {"train_loss": -23.4605770111084, "global_step": 187599, "epoch": 2260} {"train_loss": -23.886234283447266, "global_step": 187600, "epoch": 2260} {"train_loss": -23.599241256713867, "global_step": 187601, "epoch": 2260} {"train_loss": -23.384498596191406, "global_step": 187602, "epoch": 2260} {"train_loss": -23.78431510925293, "global_step": 187603, "epoch": 2260} {"train_loss": -23.675718307495117, "global_step": 187604, "epoch": 2260} {"train_loss": -23.53528594970703, "global_step": 187605, "epoch": 2260} {"train_loss": -23.8012638092041, "global_step": 187606, "epoch": 2260} {"train_loss": -23.4870548248291, "global_step": 187607, "epoch": 2260} {"train_loss": -23.640605926513672, "global_step": 187608, "epoch": 2260} {"train_loss": -23.663894653320312, "global_step": 187609, "epoch": 2260} {"train_loss": -23.929309844970703, "global_step": 187610, "epoch": 2260} {"train_loss": -23.858863830566406, "global_step": 187611, "epoch": 2260} {"train_loss": -24.084196090698242, "global_step": 187612, "epoch": 2260} {"train_loss": -23.939903259277344, "global_step": 187613, "epoch": 2260} {"train_loss": -23.833850860595703, "global_step": 187614, "epoch": 2260} {"train_loss": -23.921262741088867, "global_step": 187615, "epoch": 2260} {"train_loss": -24.207082748413086, "global_step": 187616, "epoch": 2260} {"train_loss": -23.814863204956055, "global_step": 187617, "epoch": 2260} {"train_loss": -23.870338439941406, "global_step": 187618, "epoch": 2260} {"train_loss": -24.025211334228516, "global_step": 187619, "epoch": 2260} {"train_loss": -23.93019676208496, "global_step": 187620, "epoch": 2260} {"train_loss": -23.619413375854492, "global_step": 187621, "epoch": 2260} {"train_loss": -24.30702018737793, "global_step": 187622, "epoch": 2260} {"train_loss": -23.63275146484375, "global_step": 187623, "epoch": 2260} {"train_loss": -23.929977416992188, "global_step": 187624, "epoch": 2260} {"train_loss": -23.956497192382812, "global_step": 187625, "epoch": 2260} {"train_loss": -24.150259017944336, "global_step": 187626, "epoch": 2260} {"train_loss": -24.03805160522461, "global_step": 187627, "epoch": 2260} {"train_loss": -24.0959415435791, "global_step": 187628, "epoch": 2260} {"train_loss": -24.41070556640625, "global_step": 187629, "epoch": 2260} {"train_loss": -24.119504928588867, "global_step": 187630, "epoch": 2260} {"train_loss": -24.131515502929688, "global_step": 187631, "epoch": 2260} {"train_loss": -24.09249496459961, "global_step": 187632, "epoch": 2260} {"train_loss": -24.191797256469727, "global_step": 187633, "epoch": 2260} {"train_loss": -24.274484634399414, "global_step": 187634, "epoch": 2260} {"train_loss": -24.022476196289062, "global_step": 187635, "epoch": 2260} {"train_loss": -24.025659561157227, "global_step": 187636, "epoch": 2260} {"train_loss": -23.75129508972168, "global_step": 187637, "epoch": 2260} {"train_loss": -24.183523178100586, "global_step": 187638, "epoch": 2260} {"train_loss": -23.87593650817871, "global_step": 187639, "epoch": 2260} {"train_loss": -23.667814254760742, "global_step": 187640, "epoch": 2260} {"train_loss": -24.32722282409668, "global_step": 187641, "epoch": 2260} {"train_loss": -23.94748878479004, "global_step": 187642, "epoch": 2260} {"train_loss": -24.09048080444336, "global_step": 187643, "epoch": 2260} {"train_loss": -23.86736297607422, "global_step": 187644, "epoch": 2260} {"train_loss": -23.793128967285156, "global_step": 187645, "epoch": 2260} {"train_loss": -23.98148536682129, "global_step": 187646, "epoch": 2260} {"train_loss": -23.850156784057617, "global_step": 187647, "epoch": 2260} {"train_loss": -23.906009674072266, "global_step": 187648, "epoch": 2260} {"train_loss": -23.751737594604492, "global_step": 187649, "epoch": 2260} {"train_loss": -24.139738082885742, "global_step": 187650, "epoch": 2260} {"train_loss": -24.16531753540039, "global_step": 187651, "epoch": 2260} {"train_loss": -24.358821868896484, "global_step": 187652, "epoch": 2260} {"train_loss": -23.975662231445312, "global_step": 187653, "epoch": 2260} {"train_loss": -24.479827880859375, "global_step": 187654, "epoch": 2260} {"train_loss": -24.13379669189453, "global_step": 187655, "epoch": 2260} {"train_loss": -24.22359275817871, "global_step": 187656, "epoch": 2260} {"train_loss": -24.274015426635742, "global_step": 187657, "epoch": 2260} {"train_loss": -24.250333786010742, "global_step": 187658, "epoch": 2260} {"train_loss": -24.47220802307129, "global_step": 187659, "epoch": 2260} {"train_loss": -24.321460723876953, "global_step": 187660, "epoch": 2260} {"train_loss": -23.9553165435791, "global_step": 187661, "epoch": 2260} {"train_loss": -23.773645791662744, "global_step": 187662, "epoch": 2260, "val_loss": 6565926.0} {"train_loss": -22.93910026550293, "global_step": 187663, "epoch": 2261} {"train_loss": -22.568418502807617, "global_step": 187664, "epoch": 2261} {"train_loss": -23.10232925415039, "global_step": 187665, "epoch": 2261} {"train_loss": -23.652442932128906, "global_step": 187666, "epoch": 2261} {"train_loss": -22.872684478759766, "global_step": 187667, "epoch": 2261} {"train_loss": -23.964691162109375, "global_step": 187668, "epoch": 2261} {"train_loss": -23.241596221923828, "global_step": 187669, "epoch": 2261} {"train_loss": -23.80965232849121, "global_step": 187670, "epoch": 2261} {"train_loss": -23.440906524658203, "global_step": 187671, "epoch": 2261} {"train_loss": -23.42458152770996, "global_step": 187672, "epoch": 2261} {"train_loss": -23.896055221557617, "global_step": 187673, "epoch": 2261} {"train_loss": -23.205835342407227, "global_step": 187674, "epoch": 2261} {"train_loss": -23.900617599487305, "global_step": 187675, "epoch": 2261} {"train_loss": -24.122882843017578, "global_step": 187676, "epoch": 2261} {"train_loss": -23.45063591003418, "global_step": 187677, "epoch": 2261} {"train_loss": -23.70648765563965, "global_step": 187678, "epoch": 2261} {"train_loss": -23.609664916992188, "global_step": 187679, "epoch": 2261} {"train_loss": -23.598691940307617, "global_step": 187680, "epoch": 2261} {"train_loss": -23.5806941986084, "global_step": 187681, "epoch": 2261} {"train_loss": -23.9227352142334, "global_step": 187682, "epoch": 2261} {"train_loss": -23.867504119873047, "global_step": 187683, "epoch": 2261} {"train_loss": -23.7628231048584, "global_step": 187684, "epoch": 2261} {"train_loss": -23.917211532592773, "global_step": 187685, "epoch": 2261} {"train_loss": -24.100299835205078, "global_step": 187686, "epoch": 2261} {"train_loss": -23.9108943939209, "global_step": 187687, "epoch": 2261} {"train_loss": -24.018667221069336, "global_step": 187688, "epoch": 2261} {"train_loss": -23.910425186157227, "global_step": 187689, "epoch": 2261} {"train_loss": -24.06781005859375, "global_step": 187690, "epoch": 2261} {"train_loss": -24.044172286987305, "global_step": 187691, "epoch": 2261} {"train_loss": -24.143386840820312, "global_step": 187692, "epoch": 2261} {"train_loss": -24.314855575561523, "global_step": 187693, "epoch": 2261} {"train_loss": -24.16428565979004, "global_step": 187694, "epoch": 2261} {"train_loss": -24.23213768005371, "global_step": 187695, "epoch": 2261} {"train_loss": -24.28101921081543, "global_step": 187696, "epoch": 2261} {"train_loss": -24.045984268188477, "global_step": 187697, "epoch": 2261} {"train_loss": -23.86897087097168, "global_step": 187698, "epoch": 2261} {"train_loss": -24.215177536010742, "global_step": 187699, "epoch": 2261} {"train_loss": -23.96563720703125, "global_step": 187700, "epoch": 2261} {"train_loss": -24.339841842651367, "global_step": 187701, "epoch": 2261} {"train_loss": -24.029891967773438, "global_step": 187702, "epoch": 2261} {"train_loss": -23.75923728942871, "global_step": 187703, "epoch": 2261} {"train_loss": -24.15333366394043, "global_step": 187704, "epoch": 2261} {"train_loss": -23.79283905029297, "global_step": 187705, "epoch": 2261} {"train_loss": -24.17579460144043, "global_step": 187706, "epoch": 2261} {"train_loss": -24.14426040649414, "global_step": 187707, "epoch": 2261} {"train_loss": -23.699827194213867, "global_step": 187708, "epoch": 2261} {"train_loss": -24.185012817382812, "global_step": 187709, "epoch": 2261} {"train_loss": -24.181974411010742, "global_step": 187710, "epoch": 2261} {"train_loss": -24.16016960144043, "global_step": 187711, "epoch": 2261} {"train_loss": -24.4207820892334, "global_step": 187712, "epoch": 2261} {"train_loss": -23.912338256835938, "global_step": 187713, "epoch": 2261} {"train_loss": -23.806291580200195, "global_step": 187714, "epoch": 2261} {"train_loss": -24.00262451171875, "global_step": 187715, "epoch": 2261} {"train_loss": -24.158472061157227, "global_step": 187716, "epoch": 2261} {"train_loss": -23.59161949157715, "global_step": 187717, "epoch": 2261} {"train_loss": -24.00743293762207, "global_step": 187718, "epoch": 2261} {"train_loss": -23.982297897338867, "global_step": 187719, "epoch": 2261} {"train_loss": -24.232402801513672, "global_step": 187720, "epoch": 2261} {"train_loss": -24.21030616760254, "global_step": 187721, "epoch": 2261} {"train_loss": -24.309507369995117, "global_step": 187722, "epoch": 2261} {"train_loss": -24.174829483032227, "global_step": 187723, "epoch": 2261} {"train_loss": -23.928998947143555, "global_step": 187724, "epoch": 2261} {"train_loss": -24.050674438476562, "global_step": 187725, "epoch": 2261} {"train_loss": -24.287067413330078, "global_step": 187726, "epoch": 2261} {"train_loss": -23.9254207611084, "global_step": 187727, "epoch": 2261} {"train_loss": -24.260679244995117, "global_step": 187728, "epoch": 2261} {"train_loss": -24.105545043945312, "global_step": 187729, "epoch": 2261} {"train_loss": -24.254470825195312, "global_step": 187730, "epoch": 2261} {"train_loss": -24.071014404296875, "global_step": 187731, "epoch": 2261} {"train_loss": -23.845020294189453, "global_step": 187732, "epoch": 2261} {"train_loss": -23.95194435119629, "global_step": 187733, "epoch": 2261} {"train_loss": -23.977746963500977, "global_step": 187734, "epoch": 2261} {"train_loss": -24.221662521362305, "global_step": 187735, "epoch": 2261} {"train_loss": -24.197330474853516, "global_step": 187736, "epoch": 2261} {"train_loss": -23.92166519165039, "global_step": 187737, "epoch": 2261} {"train_loss": -24.17207145690918, "global_step": 187738, "epoch": 2261} {"train_loss": -23.545175552368164, "global_step": 187739, "epoch": 2261} {"train_loss": -23.928882598876953, "global_step": 187740, "epoch": 2261} {"train_loss": -24.01007080078125, "global_step": 187741, "epoch": 2261} {"train_loss": -23.850048065185547, "global_step": 187742, "epoch": 2261} {"train_loss": -23.87120819091797, "global_step": 187743, "epoch": 2261} {"train_loss": -24.0655460357666, "global_step": 187744, "epoch": 2261} {"train_loss": -23.90085746581296, "global_step": 187745, "epoch": 2261, "val_loss": 6507836.0} {"train_loss": -23.58932113647461, "global_step": 187746, "epoch": 2262} {"train_loss": -23.436325073242188, "global_step": 187747, "epoch": 2262} {"train_loss": -23.681161880493164, "global_step": 187748, "epoch": 2262} {"train_loss": -23.012836456298828, "global_step": 187749, "epoch": 2262} {"train_loss": -23.19947624206543, "global_step": 187750, "epoch": 2262} {"train_loss": -23.329029083251953, "global_step": 187751, "epoch": 2262} {"train_loss": -23.3750057220459, "global_step": 187752, "epoch": 2262} {"train_loss": -23.72519302368164, "global_step": 187753, "epoch": 2262} {"train_loss": -23.25431251525879, "global_step": 187754, "epoch": 2262} {"train_loss": -23.607816696166992, "global_step": 187755, "epoch": 2262} {"train_loss": -23.533742904663086, "global_step": 187756, "epoch": 2262} {"train_loss": -24.01841163635254, "global_step": 187757, "epoch": 2262} {"train_loss": -23.661495208740234, "global_step": 187758, "epoch": 2262} {"train_loss": -23.886703491210938, "global_step": 187759, "epoch": 2262} {"train_loss": -23.95804214477539, "global_step": 187760, "epoch": 2262} {"train_loss": -23.25115966796875, "global_step": 187761, "epoch": 2262} {"train_loss": -23.701574325561523, "global_step": 187762, "epoch": 2262} {"train_loss": -23.77408218383789, "global_step": 187763, "epoch": 2262} {"train_loss": -23.48583984375, "global_step": 187764, "epoch": 2262} {"train_loss": -23.777801513671875, "global_step": 187765, "epoch": 2262} {"train_loss": -23.920774459838867, "global_step": 187766, "epoch": 2262} {"train_loss": -24.069644927978516, "global_step": 187767, "epoch": 2262} {"train_loss": -23.910978317260742, "global_step": 187768, "epoch": 2262} {"train_loss": -23.80887794494629, "global_step": 187769, "epoch": 2262} {"train_loss": -24.29286766052246, "global_step": 187770, "epoch": 2262} {"train_loss": -23.975616455078125, "global_step": 187771, "epoch": 2262} {"train_loss": -23.930692672729492, "global_step": 187772, "epoch": 2262} {"train_loss": -24.056982040405273, "global_step": 187773, "epoch": 2262} {"train_loss": -24.164997100830078, "global_step": 187774, "epoch": 2262} {"train_loss": -23.75000762939453, "global_step": 187775, "epoch": 2262} {"train_loss": -24.01521110534668, "global_step": 187776, "epoch": 2262} {"train_loss": -24.15882682800293, "global_step": 187777, "epoch": 2262} {"train_loss": -24.06854820251465, "global_step": 187778, "epoch": 2262} {"train_loss": -23.963939666748047, "global_step": 187779, "epoch": 2262} {"train_loss": -24.113637924194336, "global_step": 187780, "epoch": 2262} {"train_loss": -23.998903274536133, "global_step": 187781, "epoch": 2262} {"train_loss": -24.177091598510742, "global_step": 187782, "epoch": 2262} {"train_loss": -24.18158531188965, "global_step": 187783, "epoch": 2262} {"train_loss": -23.989721298217773, "global_step": 187784, "epoch": 2262} {"train_loss": -24.051090240478516, "global_step": 187785, "epoch": 2262} {"train_loss": -24.056804656982422, "global_step": 187786, "epoch": 2262} {"train_loss": -23.91411781311035, "global_step": 187787, "epoch": 2262} {"train_loss": -23.85878562927246, "global_step": 187788, "epoch": 2262} {"train_loss": -24.178661346435547, "global_step": 187789, "epoch": 2262} {"train_loss": -24.12629508972168, "global_step": 187790, "epoch": 2262} {"train_loss": -24.564184188842773, "global_step": 187791, "epoch": 2262} {"train_loss": -24.267927169799805, "global_step": 187792, "epoch": 2262} {"train_loss": -23.900487899780273, "global_step": 187793, "epoch": 2262} {"train_loss": -23.90146255493164, "global_step": 187794, "epoch": 2262} {"train_loss": -24.073455810546875, "global_step": 187795, "epoch": 2262} {"train_loss": -23.74252700805664, "global_step": 187796, "epoch": 2262} {"train_loss": -24.067920684814453, "global_step": 187797, "epoch": 2262} {"train_loss": -24.252824783325195, "global_step": 187798, "epoch": 2262} {"train_loss": -23.96434211730957, "global_step": 187799, "epoch": 2262} {"train_loss": -24.230100631713867, "global_step": 187800, "epoch": 2262} {"train_loss": -24.19869041442871, "global_step": 187801, "epoch": 2262} {"train_loss": -24.032360076904297, "global_step": 187802, "epoch": 2262} {"train_loss": -24.533842086791992, "global_step": 187803, "epoch": 2262} {"train_loss": -23.71003532409668, "global_step": 187804, "epoch": 2262} {"train_loss": -24.08943748474121, "global_step": 187805, "epoch": 2262} {"train_loss": -23.782373428344727, "global_step": 187806, "epoch": 2262} {"train_loss": -23.857154846191406, "global_step": 187807, "epoch": 2262} {"train_loss": -23.823246002197266, "global_step": 187808, "epoch": 2262} {"train_loss": -24.023351669311523, "global_step": 187809, "epoch": 2262} {"train_loss": -23.81201171875, "global_step": 187810, "epoch": 2262} {"train_loss": -24.21394920349121, "global_step": 187811, "epoch": 2262} {"train_loss": -23.73499870300293, "global_step": 187812, "epoch": 2262} {"train_loss": -24.21603775024414, "global_step": 187813, "epoch": 2262} {"train_loss": -24.21201515197754, "global_step": 187814, "epoch": 2262} {"train_loss": -24.05808448791504, "global_step": 187815, "epoch": 2262} {"train_loss": -24.095924377441406, "global_step": 187816, "epoch": 2262} {"train_loss": -24.333593368530273, "global_step": 187817, "epoch": 2262} {"train_loss": -24.037073135375977, "global_step": 187818, "epoch": 2262} {"train_loss": -24.21465301513672, "global_step": 187819, "epoch": 2262} {"train_loss": -24.09522819519043, "global_step": 187820, "epoch": 2262} {"train_loss": -24.35365104675293, "global_step": 187821, "epoch": 2262} {"train_loss": -24.24129295349121, "global_step": 187822, "epoch": 2262} {"train_loss": -24.141056060791016, "global_step": 187823, "epoch": 2262} {"train_loss": -24.178680419921875, "global_step": 187824, "epoch": 2262} {"train_loss": -24.38112449645996, "global_step": 187825, "epoch": 2262} {"train_loss": -23.957029342651367, "global_step": 187826, "epoch": 2262} {"train_loss": -24.0150203704834, "global_step": 187827, "epoch": 2262} {"train_loss": -23.943396878529743, "global_step": 187828, "epoch": 2262, "val_loss": 6570081.0} {"train_loss": -23.466402053833008, "global_step": 187829, "epoch": 2263} {"train_loss": -23.49888801574707, "global_step": 187830, "epoch": 2263} {"train_loss": -23.44656753540039, "global_step": 187831, "epoch": 2263} {"train_loss": -23.34015464782715, "global_step": 187832, "epoch": 2263} {"train_loss": -23.18844985961914, "global_step": 187833, "epoch": 2263} {"train_loss": -23.574493408203125, "global_step": 187834, "epoch": 2263} {"train_loss": -22.933568954467773, "global_step": 187835, "epoch": 2263} {"train_loss": -23.628828048706055, "global_step": 187836, "epoch": 2263} {"train_loss": -23.30307960510254, "global_step": 187837, "epoch": 2263} {"train_loss": -23.197294235229492, "global_step": 187838, "epoch": 2263} {"train_loss": -23.670360565185547, "global_step": 187839, "epoch": 2263} {"train_loss": -23.601428985595703, "global_step": 187840, "epoch": 2263} {"train_loss": -23.652738571166992, "global_step": 187841, "epoch": 2263} {"train_loss": -23.49666976928711, "global_step": 187842, "epoch": 2263} {"train_loss": -23.631628036499023, "global_step": 187843, "epoch": 2263} {"train_loss": -23.773868560791016, "global_step": 187844, "epoch": 2263} {"train_loss": -23.886930465698242, "global_step": 187845, "epoch": 2263} {"train_loss": -23.624237060546875, "global_step": 187846, "epoch": 2263} {"train_loss": -23.647789001464844, "global_step": 187847, "epoch": 2263} {"train_loss": -24.000749588012695, "global_step": 187848, "epoch": 2263} {"train_loss": -24.01333236694336, "global_step": 187849, "epoch": 2263} {"train_loss": -24.066213607788086, "global_step": 187850, "epoch": 2263} {"train_loss": -23.922285079956055, "global_step": 187851, "epoch": 2263} {"train_loss": -23.819440841674805, "global_step": 187852, "epoch": 2263} {"train_loss": -23.74085235595703, "global_step": 187853, "epoch": 2263} {"train_loss": -24.201322555541992, "global_step": 187854, "epoch": 2263} {"train_loss": -23.770626068115234, "global_step": 187855, "epoch": 2263} {"train_loss": -24.226945877075195, "global_step": 187856, "epoch": 2263} {"train_loss": -24.283742904663086, "global_step": 187857, "epoch": 2263} {"train_loss": -23.78733253479004, "global_step": 187858, "epoch": 2263} {"train_loss": -23.954530715942383, "global_step": 187859, "epoch": 2263} {"train_loss": -23.992080688476562, "global_step": 187860, "epoch": 2263} {"train_loss": -24.109338760375977, "global_step": 187861, "epoch": 2263} {"train_loss": -24.323959350585938, "global_step": 187862, "epoch": 2263} {"train_loss": -23.665027618408203, "global_step": 187863, "epoch": 2263} {"train_loss": -24.01023292541504, "global_step": 187864, "epoch": 2263} {"train_loss": -24.312803268432617, "global_step": 187865, "epoch": 2263} {"train_loss": -23.562217712402344, "global_step": 187866, "epoch": 2263} {"train_loss": -23.892019271850586, "global_step": 187867, "epoch": 2263} {"train_loss": -23.962156295776367, "global_step": 187868, "epoch": 2263} {"train_loss": -23.61709976196289, "global_step": 187869, "epoch": 2263} {"train_loss": -24.048952102661133, "global_step": 187870, "epoch": 2263} {"train_loss": -24.118986129760742, "global_step": 187871, "epoch": 2263} {"train_loss": -24.02151870727539, "global_step": 187872, "epoch": 2263} {"train_loss": -23.851720809936523, "global_step": 187873, "epoch": 2263} {"train_loss": -24.152786254882812, "global_step": 187874, "epoch": 2263} {"train_loss": -23.849042892456055, "global_step": 187875, "epoch": 2263} {"train_loss": -24.1632137298584, "global_step": 187876, "epoch": 2263} {"train_loss": -24.209543228149414, "global_step": 187877, "epoch": 2263} {"train_loss": -24.202909469604492, "global_step": 187878, "epoch": 2263} {"train_loss": -24.172826766967773, "global_step": 187879, "epoch": 2263} {"train_loss": -23.990022659301758, "global_step": 187880, "epoch": 2263} {"train_loss": -24.097320556640625, "global_step": 187881, "epoch": 2263} {"train_loss": -24.06485366821289, "global_step": 187882, "epoch": 2263} {"train_loss": -24.164276123046875, "global_step": 187883, "epoch": 2263} {"train_loss": -24.065670013427734, "global_step": 187884, "epoch": 2263} {"train_loss": -24.030658721923828, "global_step": 187885, "epoch": 2263} {"train_loss": -24.048070907592773, "global_step": 187886, "epoch": 2263} {"train_loss": -24.4427547454834, "global_step": 187887, "epoch": 2263} {"train_loss": -24.240224838256836, "global_step": 187888, "epoch": 2263} {"train_loss": -24.5799560546875, "global_step": 187889, "epoch": 2263} {"train_loss": -24.271360397338867, "global_step": 187890, "epoch": 2263} {"train_loss": -24.094038009643555, "global_step": 187891, "epoch": 2263} {"train_loss": -24.159339904785156, "global_step": 187892, "epoch": 2263} {"train_loss": -24.01411247253418, "global_step": 187893, "epoch": 2263} {"train_loss": -24.197797775268555, "global_step": 187894, "epoch": 2263} {"train_loss": -23.7437801361084, "global_step": 187895, "epoch": 2263} {"train_loss": -23.98799705505371, "global_step": 187896, "epoch": 2263} {"train_loss": -24.02513313293457, "global_step": 187897, "epoch": 2263} {"train_loss": -24.68848991394043, "global_step": 187898, "epoch": 2263} {"train_loss": -23.662839889526367, "global_step": 187899, "epoch": 2263} {"train_loss": -23.738290786743164, "global_step": 187900, "epoch": 2263} {"train_loss": -24.046831130981445, "global_step": 187901, "epoch": 2263} {"train_loss": -23.726335525512695, "global_step": 187902, "epoch": 2263} {"train_loss": -23.741785049438477, "global_step": 187903, "epoch": 2263} {"train_loss": -23.59412956237793, "global_step": 187904, "epoch": 2263} {"train_loss": -24.23886489868164, "global_step": 187905, "epoch": 2263} {"train_loss": -23.684431076049805, "global_step": 187906, "epoch": 2263} {"train_loss": -24.03311538696289, "global_step": 187907, "epoch": 2263} {"train_loss": -24.207948684692383, "global_step": 187908, "epoch": 2263} {"train_loss": -24.201101303100586, "global_step": 187909, "epoch": 2263} {"train_loss": -23.536014556884766, "global_step": 187910, "epoch": 2263} {"train_loss": -23.898477876042744, "global_step": 187911, "epoch": 2263, "val_loss": 6452262.0} {"train_loss": -23.876771926879883, "global_step": 187912, "epoch": 2264} {"train_loss": -23.938627243041992, "global_step": 187913, "epoch": 2264} {"train_loss": -23.967517852783203, "global_step": 187914, "epoch": 2264} {"train_loss": -24.012781143188477, "global_step": 187915, "epoch": 2264} {"train_loss": -23.143068313598633, "global_step": 187916, "epoch": 2264} {"train_loss": -23.90506362915039, "global_step": 187917, "epoch": 2264} {"train_loss": -24.046035766601562, "global_step": 187918, "epoch": 2264} {"train_loss": -23.831438064575195, "global_step": 187919, "epoch": 2264} {"train_loss": -23.952733993530273, "global_step": 187920, "epoch": 2264} {"train_loss": -23.716367721557617, "global_step": 187921, "epoch": 2264} {"train_loss": -24.039047241210938, "global_step": 187922, "epoch": 2264} {"train_loss": -23.776662826538086, "global_step": 187923, "epoch": 2264} {"train_loss": -24.112995147705078, "global_step": 187924, "epoch": 2264} {"train_loss": -23.828327178955078, "global_step": 187925, "epoch": 2264} {"train_loss": -24.045400619506836, "global_step": 187926, "epoch": 2264} {"train_loss": -23.792654037475586, "global_step": 187927, "epoch": 2264} {"train_loss": -24.1046199798584, "global_step": 187928, "epoch": 2264} {"train_loss": -23.81387710571289, "global_step": 187929, "epoch": 2264} {"train_loss": -23.979019165039062, "global_step": 187930, "epoch": 2264} {"train_loss": -24.103591918945312, "global_step": 187931, "epoch": 2264} {"train_loss": -24.11621856689453, "global_step": 187932, "epoch": 2264} {"train_loss": -23.90443992614746, "global_step": 187933, "epoch": 2264} {"train_loss": -24.398082733154297, "global_step": 187934, "epoch": 2264} {"train_loss": -24.391645431518555, "global_step": 187935, "epoch": 2264} {"train_loss": -23.85713768005371, "global_step": 187936, "epoch": 2264} {"train_loss": -24.126708984375, "global_step": 187937, "epoch": 2264} {"train_loss": -23.73664665222168, "global_step": 187938, "epoch": 2264} {"train_loss": -24.54437828063965, "global_step": 187939, "epoch": 2264} {"train_loss": -24.052566528320312, "global_step": 187940, "epoch": 2264} {"train_loss": -24.409076690673828, "global_step": 187941, "epoch": 2264} {"train_loss": -24.1668758392334, "global_step": 187942, "epoch": 2264} {"train_loss": -24.209529876708984, "global_step": 187943, "epoch": 2264} {"train_loss": -23.9438419342041, "global_step": 187944, "epoch": 2264} {"train_loss": -24.096952438354492, "global_step": 187945, "epoch": 2264} {"train_loss": -24.29629898071289, "global_step": 187946, "epoch": 2264} {"train_loss": -24.400131225585938, "global_step": 187947, "epoch": 2264} {"train_loss": -24.14100456237793, "global_step": 187948, "epoch": 2264} {"train_loss": -24.08222770690918, "global_step": 187949, "epoch": 2264} {"train_loss": -24.192283630371094, "global_step": 187950, "epoch": 2264} {"train_loss": -23.953771591186523, "global_step": 187951, "epoch": 2264} {"train_loss": -24.032154083251953, "global_step": 187952, "epoch": 2264} {"train_loss": -24.112585067749023, "global_step": 187953, "epoch": 2264} {"train_loss": -24.23206901550293, "global_step": 187954, "epoch": 2264} {"train_loss": -24.30311393737793, "global_step": 187955, "epoch": 2264} {"train_loss": -23.784841537475586, "global_step": 187956, "epoch": 2264} {"train_loss": -23.998441696166992, "global_step": 187957, "epoch": 2264} {"train_loss": -24.04254150390625, "global_step": 187958, "epoch": 2264} {"train_loss": -24.247827529907227, "global_step": 187959, "epoch": 2264} {"train_loss": -24.01462173461914, "global_step": 187960, "epoch": 2264} {"train_loss": -23.96099090576172, "global_step": 187961, "epoch": 2264} {"train_loss": -23.992095947265625, "global_step": 187962, "epoch": 2264} {"train_loss": -23.771793365478516, "global_step": 187963, "epoch": 2264} {"train_loss": -24.26622200012207, "global_step": 187964, "epoch": 2264} {"train_loss": -24.187862396240234, "global_step": 187965, "epoch": 2264} {"train_loss": -24.242284774780273, "global_step": 187966, "epoch": 2264} {"train_loss": -24.05527687072754, "global_step": 187967, "epoch": 2264} {"train_loss": -24.026395797729492, "global_step": 187968, "epoch": 2264} {"train_loss": -24.262845993041992, "global_step": 187969, "epoch": 2264} {"train_loss": -24.053197860717773, "global_step": 187970, "epoch": 2264} {"train_loss": -23.633312225341797, "global_step": 187971, "epoch": 2264} {"train_loss": -23.755338668823242, "global_step": 187972, "epoch": 2264} {"train_loss": -24.05341339111328, "global_step": 187973, "epoch": 2264} {"train_loss": -24.22056007385254, "global_step": 187974, "epoch": 2264} {"train_loss": -23.72762680053711, "global_step": 187975, "epoch": 2264} {"train_loss": -23.81532859802246, "global_step": 187976, "epoch": 2264} {"train_loss": -23.6942081451416, "global_step": 187977, "epoch": 2264} {"train_loss": -23.8250732421875, "global_step": 187978, "epoch": 2264} {"train_loss": -23.986692428588867, "global_step": 187979, "epoch": 2264} {"train_loss": -23.779489517211914, "global_step": 187980, "epoch": 2264} {"train_loss": -24.190351486206055, "global_step": 187981, "epoch": 2264} {"train_loss": -24.051658630371094, "global_step": 187982, "epoch": 2264} {"train_loss": -23.858739852905273, "global_step": 187983, "epoch": 2264} {"train_loss": -23.848901748657227, "global_step": 187984, "epoch": 2264} {"train_loss": -24.108734130859375, "global_step": 187985, "epoch": 2264} {"train_loss": -24.202529907226562, "global_step": 187986, "epoch": 2264} {"train_loss": -24.185741424560547, "global_step": 187987, "epoch": 2264} {"train_loss": -24.196619033813477, "global_step": 187988, "epoch": 2264} {"train_loss": -24.112340927124023, "global_step": 187989, "epoch": 2264} {"train_loss": -24.162710189819336, "global_step": 187990, "epoch": 2264} {"train_loss": -23.94929313659668, "global_step": 187991, "epoch": 2264} {"train_loss": -24.524761199951172, "global_step": 187992, "epoch": 2264} {"train_loss": -23.889347076416016, "global_step": 187993, "epoch": 2264} {"train_loss": -24.023984380515223, "global_step": 187994, "epoch": 2264, "val_loss": 6475132.0} {"train_loss": -23.247220993041992, "global_step": 187995, "epoch": 2265} {"train_loss": -23.405908584594727, "global_step": 187996, "epoch": 2265} {"train_loss": -23.52518653869629, "global_step": 187997, "epoch": 2265} {"train_loss": -22.95011329650879, "global_step": 187998, "epoch": 2265} {"train_loss": -23.509811401367188, "global_step": 187999, "epoch": 2265} {"train_loss": -23.659826278686523, "global_step": 188000, "epoch": 2265} {"train_loss": -23.67217445373535, "global_step": 188001, "epoch": 2265} {"train_loss": -23.648040771484375, "global_step": 188002, "epoch": 2265} {"train_loss": -23.39240264892578, "global_step": 188003, "epoch": 2265} {"train_loss": -23.60260581970215, "global_step": 188004, "epoch": 2265} {"train_loss": -23.613805770874023, "global_step": 188005, "epoch": 2265} {"train_loss": -24.03582191467285, "global_step": 188006, "epoch": 2265} {"train_loss": -23.725635528564453, "global_step": 188007, "epoch": 2265} {"train_loss": -23.896833419799805, "global_step": 188008, "epoch": 2265} {"train_loss": -23.97869873046875, "global_step": 188009, "epoch": 2265} {"train_loss": -23.87702751159668, "global_step": 188010, "epoch": 2265} {"train_loss": -23.463544845581055, "global_step": 188011, "epoch": 2265} {"train_loss": -24.102354049682617, "global_step": 188012, "epoch": 2265} {"train_loss": -23.560495376586914, "global_step": 188013, "epoch": 2265} {"train_loss": -24.235198974609375, "global_step": 188014, "epoch": 2265} {"train_loss": -23.91144371032715, "global_step": 188015, "epoch": 2265} {"train_loss": -23.62880516052246, "global_step": 188016, "epoch": 2265} {"train_loss": -24.27950096130371, "global_step": 188017, "epoch": 2265} {"train_loss": -23.879131317138672, "global_step": 188018, "epoch": 2265} {"train_loss": -23.97109031677246, "global_step": 188019, "epoch": 2265} {"train_loss": -23.576566696166992, "global_step": 188020, "epoch": 2265} {"train_loss": -24.080646514892578, "global_step": 188021, "epoch": 2265} {"train_loss": -24.250768661499023, "global_step": 188022, "epoch": 2265} {"train_loss": -23.76612663269043, "global_step": 188023, "epoch": 2265} {"train_loss": -24.175947189331055, "global_step": 188024, "epoch": 2265} {"train_loss": -24.182029724121094, "global_step": 188025, "epoch": 2265} {"train_loss": -23.941747665405273, "global_step": 188026, "epoch": 2265} {"train_loss": -24.014387130737305, "global_step": 188027, "epoch": 2265} {"train_loss": -24.137418746948242, "global_step": 188028, "epoch": 2265} {"train_loss": -23.923974990844727, "global_step": 188029, "epoch": 2265} {"train_loss": -24.034713745117188, "global_step": 188030, "epoch": 2265} {"train_loss": -23.956106185913086, "global_step": 188031, "epoch": 2265} {"train_loss": -23.830810546875, "global_step": 188032, "epoch": 2265} {"train_loss": -24.26563835144043, "global_step": 188033, "epoch": 2265} {"train_loss": -24.203222274780273, "global_step": 188034, "epoch": 2265} {"train_loss": -23.969064712524414, "global_step": 188035, "epoch": 2265} {"train_loss": -23.94379234313965, "global_step": 188036, "epoch": 2265} {"train_loss": -24.192363739013672, "global_step": 188037, "epoch": 2265} {"train_loss": -24.10335350036621, "global_step": 188038, "epoch": 2265} {"train_loss": -24.22296142578125, "global_step": 188039, "epoch": 2265} {"train_loss": -23.902917861938477, "global_step": 188040, "epoch": 2265} {"train_loss": -24.241628646850586, "global_step": 188041, "epoch": 2265} {"train_loss": -23.981515884399414, "global_step": 188042, "epoch": 2265} {"train_loss": -24.299829483032227, "global_step": 188043, "epoch": 2265} {"train_loss": -23.9283447265625, "global_step": 188044, "epoch": 2265} {"train_loss": -24.046878814697266, "global_step": 188045, "epoch": 2265} {"train_loss": -24.163257598876953, "global_step": 188046, "epoch": 2265} {"train_loss": -24.00240135192871, "global_step": 188047, "epoch": 2265} {"train_loss": -23.776657104492188, "global_step": 188048, "epoch": 2265} {"train_loss": -24.24835777282715, "global_step": 188049, "epoch": 2265} {"train_loss": -24.049325942993164, "global_step": 188050, "epoch": 2265} {"train_loss": -23.97320556640625, "global_step": 188051, "epoch": 2265} {"train_loss": -23.983293533325195, "global_step": 188052, "epoch": 2265} {"train_loss": -23.757766723632812, "global_step": 188053, "epoch": 2265} {"train_loss": -23.71451759338379, "global_step": 188054, "epoch": 2265} {"train_loss": -24.035818099975586, "global_step": 188055, "epoch": 2265} {"train_loss": -24.11701774597168, "global_step": 188056, "epoch": 2265} {"train_loss": -24.025449752807617, "global_step": 188057, "epoch": 2265} {"train_loss": -23.947723388671875, "global_step": 188058, "epoch": 2265} {"train_loss": -23.8933048248291, "global_step": 188059, "epoch": 2265} {"train_loss": -24.26883316040039, "global_step": 188060, "epoch": 2265} {"train_loss": -24.372848510742188, "global_step": 188061, "epoch": 2265} {"train_loss": -24.00776481628418, "global_step": 188062, "epoch": 2265} {"train_loss": -24.403430938720703, "global_step": 188063, "epoch": 2265} {"train_loss": -24.151824951171875, "global_step": 188064, "epoch": 2265} {"train_loss": -24.303329467773438, "global_step": 188065, "epoch": 2265} {"train_loss": -24.09714698791504, "global_step": 188066, "epoch": 2265} {"train_loss": -24.05596160888672, "global_step": 188067, "epoch": 2265} {"train_loss": -24.442773818969727, "global_step": 188068, "epoch": 2265} {"train_loss": -24.29328155517578, "global_step": 188069, "epoch": 2265} {"train_loss": -23.95623016357422, "global_step": 188070, "epoch": 2265} {"train_loss": -24.315893173217773, "global_step": 188071, "epoch": 2265} {"train_loss": -24.400190353393555, "global_step": 188072, "epoch": 2265} {"train_loss": -24.438251495361328, "global_step": 188073, "epoch": 2265} {"train_loss": -24.042518615722656, "global_step": 188074, "epoch": 2265} {"train_loss": -24.173503875732422, "global_step": 188075, "epoch": 2265} {"train_loss": -24.129323959350586, "global_step": 188076, "epoch": 2265} {"train_loss": -23.98599422408874, "global_step": 188077, "epoch": 2265, "val_loss": 6588646.5} {"train_loss": -23.66633415222168, "global_step": 188078, "epoch": 2266} {"train_loss": -22.997879028320312, "global_step": 188079, "epoch": 2266} {"train_loss": -23.512985229492188, "global_step": 188080, "epoch": 2266} {"train_loss": -23.635435104370117, "global_step": 188081, "epoch": 2266} {"train_loss": -23.224729537963867, "global_step": 188082, "epoch": 2266} {"train_loss": -23.37618637084961, "global_step": 188083, "epoch": 2266} {"train_loss": -23.47755241394043, "global_step": 188084, "epoch": 2266} {"train_loss": -23.515302658081055, "global_step": 188085, "epoch": 2266} {"train_loss": -23.694576263427734, "global_step": 188086, "epoch": 2266} {"train_loss": -23.414134979248047, "global_step": 188087, "epoch": 2266} {"train_loss": -23.899015426635742, "global_step": 188088, "epoch": 2266} {"train_loss": -23.299480438232422, "global_step": 188089, "epoch": 2266} {"train_loss": -24.2323055267334, "global_step": 188090, "epoch": 2266} {"train_loss": -23.690698623657227, "global_step": 188091, "epoch": 2266} {"train_loss": -23.700956344604492, "global_step": 188092, "epoch": 2266} {"train_loss": -23.177778244018555, "global_step": 188093, "epoch": 2266} {"train_loss": -23.816083908081055, "global_step": 188094, "epoch": 2266} {"train_loss": -23.680437088012695, "global_step": 188095, "epoch": 2266} {"train_loss": -23.610458374023438, "global_step": 188096, "epoch": 2266} {"train_loss": -23.891422271728516, "global_step": 188097, "epoch": 2266} {"train_loss": -23.979778289794922, "global_step": 188098, "epoch": 2266} {"train_loss": -23.65178871154785, "global_step": 188099, "epoch": 2266} {"train_loss": -23.764026641845703, "global_step": 188100, "epoch": 2266} {"train_loss": -23.663618087768555, "global_step": 188101, "epoch": 2266} {"train_loss": -23.6937313079834, "global_step": 188102, "epoch": 2266} {"train_loss": -24.324054718017578, "global_step": 188103, "epoch": 2266} {"train_loss": -23.95575714111328, "global_step": 188104, "epoch": 2266} {"train_loss": -24.221328735351562, "global_step": 188105, "epoch": 2266} {"train_loss": -24.173789978027344, "global_step": 188106, "epoch": 2266} {"train_loss": -24.1020450592041, "global_step": 188107, "epoch": 2266} {"train_loss": -23.845373153686523, "global_step": 188108, "epoch": 2266} {"train_loss": -23.92041015625, "global_step": 188109, "epoch": 2266} {"train_loss": -23.731443405151367, "global_step": 188110, "epoch": 2266} {"train_loss": -24.148536682128906, "global_step": 188111, "epoch": 2266} {"train_loss": -23.955347061157227, "global_step": 188112, "epoch": 2266} {"train_loss": -23.938512802124023, "global_step": 188113, "epoch": 2266} {"train_loss": -24.092472076416016, "global_step": 188114, "epoch": 2266} {"train_loss": -23.97378921508789, "global_step": 188115, "epoch": 2266} {"train_loss": -24.17518424987793, "global_step": 188116, "epoch": 2266} {"train_loss": -24.457983016967773, "global_step": 188117, "epoch": 2266} {"train_loss": -23.924070358276367, "global_step": 188118, "epoch": 2266} {"train_loss": -23.809843063354492, "global_step": 188119, "epoch": 2266} {"train_loss": -23.85502052307129, "global_step": 188120, "epoch": 2266} {"train_loss": -24.158531188964844, "global_step": 188121, "epoch": 2266} {"train_loss": -24.09296417236328, "global_step": 188122, "epoch": 2266} {"train_loss": -24.059650421142578, "global_step": 188123, "epoch": 2266} {"train_loss": -24.229785919189453, "global_step": 188124, "epoch": 2266} {"train_loss": -24.076276779174805, "global_step": 188125, "epoch": 2266} {"train_loss": -24.41893196105957, "global_step": 188126, "epoch": 2266} {"train_loss": -24.236858367919922, "global_step": 188127, "epoch": 2266} {"train_loss": -23.93302345275879, "global_step": 188128, "epoch": 2266} {"train_loss": -24.120908737182617, "global_step": 188129, "epoch": 2266} {"train_loss": -23.954954147338867, "global_step": 188130, "epoch": 2266} {"train_loss": -24.158836364746094, "global_step": 188131, "epoch": 2266} {"train_loss": -24.219709396362305, "global_step": 188132, "epoch": 2266} {"train_loss": -24.20420265197754, "global_step": 188133, "epoch": 2266} {"train_loss": -23.985036849975586, "global_step": 188134, "epoch": 2266} {"train_loss": -24.009201049804688, "global_step": 188135, "epoch": 2266} {"train_loss": -24.071325302124023, "global_step": 188136, "epoch": 2266} {"train_loss": -24.26744270324707, "global_step": 188137, "epoch": 2266} {"train_loss": -23.956186294555664, "global_step": 188138, "epoch": 2266} {"train_loss": -24.336599349975586, "global_step": 188139, "epoch": 2266} {"train_loss": -23.972675323486328, "global_step": 188140, "epoch": 2266} {"train_loss": -24.168291091918945, "global_step": 188141, "epoch": 2266} {"train_loss": -23.98728370666504, "global_step": 188142, "epoch": 2266} {"train_loss": -24.124374389648438, "global_step": 188143, "epoch": 2266} {"train_loss": -24.08563232421875, "global_step": 188144, "epoch": 2266} {"train_loss": -24.30057144165039, "global_step": 188145, "epoch": 2266} {"train_loss": -24.29155921936035, "global_step": 188146, "epoch": 2266} {"train_loss": -24.167760848999023, "global_step": 188147, "epoch": 2266} {"train_loss": -24.069223403930664, "global_step": 188148, "epoch": 2266} {"train_loss": -24.116668701171875, "global_step": 188149, "epoch": 2266} {"train_loss": -24.2462158203125, "global_step": 188150, "epoch": 2266} {"train_loss": -23.93037223815918, "global_step": 188151, "epoch": 2266} {"train_loss": -23.987197875976562, "global_step": 188152, "epoch": 2266} {"train_loss": -24.319543838500977, "global_step": 188153, "epoch": 2266} {"train_loss": -24.318801879882812, "global_step": 188154, "epoch": 2266} {"train_loss": -24.57898712158203, "global_step": 188155, "epoch": 2266} {"train_loss": -24.091543197631836, "global_step": 188156, "epoch": 2266} {"train_loss": -24.04636001586914, "global_step": 188157, "epoch": 2266} {"train_loss": -23.85738182067871, "global_step": 188158, "epoch": 2266} {"train_loss": -23.99187660217285, "global_step": 188159, "epoch": 2266} {"train_loss": -23.966093982558654, "global_step": 188160, "epoch": 2266, "val_loss": 6484340.0} {"train_loss": -23.690162658691406, "global_step": 188161, "epoch": 2267} {"train_loss": -23.218549728393555, "global_step": 188162, "epoch": 2267} {"train_loss": -23.348031997680664, "global_step": 188163, "epoch": 2267} {"train_loss": -23.835620880126953, "global_step": 188164, "epoch": 2267} {"train_loss": -23.68758201599121, "global_step": 188165, "epoch": 2267} {"train_loss": -22.913257598876953, "global_step": 188166, "epoch": 2267} {"train_loss": -23.54927635192871, "global_step": 188167, "epoch": 2267} {"train_loss": -23.792173385620117, "global_step": 188168, "epoch": 2267} {"train_loss": -23.429533004760742, "global_step": 188169, "epoch": 2267} {"train_loss": -23.700029373168945, "global_step": 188170, "epoch": 2267} {"train_loss": -23.569995880126953, "global_step": 188171, "epoch": 2267} {"train_loss": -23.827377319335938, "global_step": 188172, "epoch": 2267} {"train_loss": -23.61318588256836, "global_step": 188173, "epoch": 2267} {"train_loss": -23.504159927368164, "global_step": 188174, "epoch": 2267} {"train_loss": -23.57183074951172, "global_step": 188175, "epoch": 2267} {"train_loss": -23.505855560302734, "global_step": 188176, "epoch": 2267} {"train_loss": -23.89163589477539, "global_step": 188177, "epoch": 2267} {"train_loss": -23.74175453186035, "global_step": 188178, "epoch": 2267} {"train_loss": -23.5117244720459, "global_step": 188179, "epoch": 2267} {"train_loss": -23.551321029663086, "global_step": 188180, "epoch": 2267} {"train_loss": -24.029638290405273, "global_step": 188181, "epoch": 2267} {"train_loss": -23.469680786132812, "global_step": 188182, "epoch": 2267} {"train_loss": -23.663820266723633, "global_step": 188183, "epoch": 2267} {"train_loss": -23.279531478881836, "global_step": 188184, "epoch": 2267} {"train_loss": -23.732574462890625, "global_step": 188185, "epoch": 2267} {"train_loss": -23.743696212768555, "global_step": 188186, "epoch": 2267} {"train_loss": -23.664501190185547, "global_step": 188187, "epoch": 2267} {"train_loss": -23.714868545532227, "global_step": 188188, "epoch": 2267} {"train_loss": -23.578662872314453, "global_step": 188189, "epoch": 2267} {"train_loss": -23.781131744384766, "global_step": 188190, "epoch": 2267} {"train_loss": -23.77529525756836, "global_step": 188191, "epoch": 2267} {"train_loss": -23.948331832885742, "global_step": 188192, "epoch": 2267} {"train_loss": -23.514894485473633, "global_step": 188193, "epoch": 2267} {"train_loss": -23.81336784362793, "global_step": 188194, "epoch": 2267} {"train_loss": -23.84221076965332, "global_step": 188195, "epoch": 2267} {"train_loss": -24.20615005493164, "global_step": 188196, "epoch": 2267} {"train_loss": -23.917387008666992, "global_step": 188197, "epoch": 2267} {"train_loss": -23.947301864624023, "global_step": 188198, "epoch": 2267} {"train_loss": -24.012422561645508, "global_step": 188199, "epoch": 2267} {"train_loss": -23.775583267211914, "global_step": 188200, "epoch": 2267} {"train_loss": -24.36854362487793, "global_step": 188201, "epoch": 2267} {"train_loss": -24.22663688659668, "global_step": 188202, "epoch": 2267} {"train_loss": -23.665813446044922, "global_step": 188203, "epoch": 2267} {"train_loss": -24.15370750427246, "global_step": 188204, "epoch": 2267} {"train_loss": -24.17426109313965, "global_step": 188205, "epoch": 2267} {"train_loss": -24.163808822631836, "global_step": 188206, "epoch": 2267} {"train_loss": -23.83738136291504, "global_step": 188207, "epoch": 2267} {"train_loss": -24.405378341674805, "global_step": 188208, "epoch": 2267} {"train_loss": -23.881086349487305, "global_step": 188209, "epoch": 2267} {"train_loss": -24.12738609313965, "global_step": 188210, "epoch": 2267} {"train_loss": -23.916696548461914, "global_step": 188211, "epoch": 2267} {"train_loss": -23.910261154174805, "global_step": 188212, "epoch": 2267} {"train_loss": -23.910202026367188, "global_step": 188213, "epoch": 2267} {"train_loss": -24.432674407958984, "global_step": 188214, "epoch": 2267} {"train_loss": -23.940494537353516, "global_step": 188215, "epoch": 2267} {"train_loss": -24.018985748291016, "global_step": 188216, "epoch": 2267} {"train_loss": -24.203861236572266, "global_step": 188217, "epoch": 2267} {"train_loss": -23.969358444213867, "global_step": 188218, "epoch": 2267} {"train_loss": -24.067670822143555, "global_step": 188219, "epoch": 2267} {"train_loss": -23.837247848510742, "global_step": 188220, "epoch": 2267} {"train_loss": -24.102807998657227, "global_step": 188221, "epoch": 2267} {"train_loss": -23.58063316345215, "global_step": 188222, "epoch": 2267} {"train_loss": -24.084436416625977, "global_step": 188223, "epoch": 2267} {"train_loss": -24.67359733581543, "global_step": 188224, "epoch": 2267} {"train_loss": -24.235340118408203, "global_step": 188225, "epoch": 2267} {"train_loss": -24.323444366455078, "global_step": 188226, "epoch": 2267} {"train_loss": -24.16750144958496, "global_step": 188227, "epoch": 2267} {"train_loss": -24.344987869262695, "global_step": 188228, "epoch": 2267} {"train_loss": -24.067705154418945, "global_step": 188229, "epoch": 2267} {"train_loss": -24.06862449645996, "global_step": 188230, "epoch": 2267} {"train_loss": -24.31330680847168, "global_step": 188231, "epoch": 2267} {"train_loss": -24.422870635986328, "global_step": 188232, "epoch": 2267} {"train_loss": -24.7098388671875, "global_step": 188233, "epoch": 2267} {"train_loss": -24.367597579956055, "global_step": 188234, "epoch": 2267} {"train_loss": -24.053726196289062, "global_step": 188235, "epoch": 2267} {"train_loss": -24.236906051635742, "global_step": 188236, "epoch": 2267} {"train_loss": -24.22467613220215, "global_step": 188237, "epoch": 2267} {"train_loss": -24.31100845336914, "global_step": 188238, "epoch": 2267} {"train_loss": -23.787506103515625, "global_step": 188239, "epoch": 2267} {"train_loss": -24.12485694885254, "global_step": 188240, "epoch": 2267} {"train_loss": -24.156269073486328, "global_step": 188241, "epoch": 2267} {"train_loss": -23.84907341003418, "global_step": 188242, "epoch": 2267} {"train_loss": -23.88824382460261, "global_step": 188243, "epoch": 2267, "val_loss": 6700830.0} {"train_loss": -22.706621170043945, "global_step": 188244, "epoch": 2268} {"train_loss": -21.13726806640625, "global_step": 188245, "epoch": 2268} {"train_loss": -22.825281143188477, "global_step": 188246, "epoch": 2268} {"train_loss": -21.824064254760742, "global_step": 188247, "epoch": 2268} {"train_loss": -22.116270065307617, "global_step": 188248, "epoch": 2268} {"train_loss": -23.22820472717285, "global_step": 188249, "epoch": 2268} {"train_loss": -22.716344833374023, "global_step": 188250, "epoch": 2268} {"train_loss": -22.794706344604492, "global_step": 188251, "epoch": 2268} {"train_loss": -22.834545135498047, "global_step": 188252, "epoch": 2268} {"train_loss": -22.89238929748535, "global_step": 188253, "epoch": 2268} {"train_loss": -23.197643280029297, "global_step": 188254, "epoch": 2268} {"train_loss": -22.974536895751953, "global_step": 188255, "epoch": 2268} {"train_loss": -23.043752670288086, "global_step": 188256, "epoch": 2268} {"train_loss": -23.12712860107422, "global_step": 188257, "epoch": 2268} {"train_loss": -23.374225616455078, "global_step": 188258, "epoch": 2268} {"train_loss": -23.35848045349121, "global_step": 188259, "epoch": 2268} {"train_loss": -22.803180694580078, "global_step": 188260, "epoch": 2268} {"train_loss": -22.86690902709961, "global_step": 188261, "epoch": 2268} {"train_loss": -23.383121490478516, "global_step": 188262, "epoch": 2268} {"train_loss": -23.081689834594727, "global_step": 188263, "epoch": 2268} {"train_loss": -23.451648712158203, "global_step": 188264, "epoch": 2268} {"train_loss": -23.31477165222168, "global_step": 188265, "epoch": 2268} {"train_loss": -23.4279727935791, "global_step": 188266, "epoch": 2268} {"train_loss": -23.83159828186035, "global_step": 188267, "epoch": 2268} {"train_loss": -23.434329986572266, "global_step": 188268, "epoch": 2268} {"train_loss": -23.281972885131836, "global_step": 188269, "epoch": 2268} {"train_loss": -23.248029708862305, "global_step": 188270, "epoch": 2268} {"train_loss": -24.028303146362305, "global_step": 188271, "epoch": 2268} {"train_loss": -23.628019332885742, "global_step": 188272, "epoch": 2268} {"train_loss": -23.699066162109375, "global_step": 188273, "epoch": 2268} {"train_loss": -23.568788528442383, "global_step": 188274, "epoch": 2268} {"train_loss": -23.96199607849121, "global_step": 188275, "epoch": 2268} {"train_loss": -23.753881454467773, "global_step": 188276, "epoch": 2268} {"train_loss": -23.731103897094727, "global_step": 188277, "epoch": 2268} {"train_loss": -23.49709701538086, "global_step": 188278, "epoch": 2268} {"train_loss": -23.90460777282715, "global_step": 188279, "epoch": 2268} {"train_loss": -24.192689895629883, "global_step": 188280, "epoch": 2268} {"train_loss": -24.04541015625, "global_step": 188281, "epoch": 2268} {"train_loss": -23.802078247070312, "global_step": 188282, "epoch": 2268} {"train_loss": -23.858701705932617, "global_step": 188283, "epoch": 2268} {"train_loss": -24.09054946899414, "global_step": 188284, "epoch": 2268} {"train_loss": -23.87507438659668, "global_step": 188285, "epoch": 2268} {"train_loss": -23.947843551635742, "global_step": 188286, "epoch": 2268} {"train_loss": -24.01435661315918, "global_step": 188287, "epoch": 2268} {"train_loss": -23.996122360229492, "global_step": 188288, "epoch": 2268} {"train_loss": -23.747936248779297, "global_step": 188289, "epoch": 2268} {"train_loss": -24.656599044799805, "global_step": 188290, "epoch": 2268} {"train_loss": -23.870500564575195, "global_step": 188291, "epoch": 2268} {"train_loss": -23.949567794799805, "global_step": 188292, "epoch": 2268} {"train_loss": -24.02412223815918, "global_step": 188293, "epoch": 2268} {"train_loss": -24.119112014770508, "global_step": 188294, "epoch": 2268} {"train_loss": -23.82175636291504, "global_step": 188295, "epoch": 2268} {"train_loss": -24.01173973083496, "global_step": 188296, "epoch": 2268} {"train_loss": -23.93583106994629, "global_step": 188297, "epoch": 2268} {"train_loss": -23.452898025512695, "global_step": 188298, "epoch": 2268} {"train_loss": -24.283859252929688, "global_step": 188299, "epoch": 2268} {"train_loss": -24.1570987701416, "global_step": 188300, "epoch": 2268} {"train_loss": -23.953948974609375, "global_step": 188301, "epoch": 2268} {"train_loss": -24.09656524658203, "global_step": 188302, "epoch": 2268} {"train_loss": -23.928146362304688, "global_step": 188303, "epoch": 2268} {"train_loss": -23.86979103088379, "global_step": 188304, "epoch": 2268} {"train_loss": -23.55170249938965, "global_step": 188305, "epoch": 2268} {"train_loss": -24.02735710144043, "global_step": 188306, "epoch": 2268} {"train_loss": -23.7104549407959, "global_step": 188307, "epoch": 2268} {"train_loss": -24.034753799438477, "global_step": 188308, "epoch": 2268} {"train_loss": -23.904577255249023, "global_step": 188309, "epoch": 2268} {"train_loss": -23.659658432006836, "global_step": 188310, "epoch": 2268} {"train_loss": -24.121267318725586, "global_step": 188311, "epoch": 2268} {"train_loss": -24.244356155395508, "global_step": 188312, "epoch": 2268} {"train_loss": -23.981321334838867, "global_step": 188313, "epoch": 2268} {"train_loss": -24.250276565551758, "global_step": 188314, "epoch": 2268} {"train_loss": -24.118789672851562, "global_step": 188315, "epoch": 2268} {"train_loss": -23.61980628967285, "global_step": 188316, "epoch": 2268} {"train_loss": -23.85495948791504, "global_step": 188317, "epoch": 2268} {"train_loss": -24.157743453979492, "global_step": 188318, "epoch": 2268} {"train_loss": -23.883926391601562, "global_step": 188319, "epoch": 2268} {"train_loss": -23.860013961791992, "global_step": 188320, "epoch": 2268} {"train_loss": -23.809066772460938, "global_step": 188321, "epoch": 2268} {"train_loss": -24.065847396850586, "global_step": 188322, "epoch": 2268} {"train_loss": -24.21712303161621, "global_step": 188323, "epoch": 2268} {"train_loss": -24.472274780273438, "global_step": 188324, "epoch": 2268} {"train_loss": -24.29066276550293, "global_step": 188325, "epoch": 2268} {"train_loss": -23.61689944439624, "global_step": 188326, "epoch": 2268, "val_loss": 6524318.5} {"train_loss": -23.817129135131836, "global_step": 188327, "epoch": 2269} {"train_loss": -23.71876335144043, "global_step": 188328, "epoch": 2269} {"train_loss": -23.489002227783203, "global_step": 188329, "epoch": 2269} {"train_loss": -23.145246505737305, "global_step": 188330, "epoch": 2269} {"train_loss": -23.78217124938965, "global_step": 188331, "epoch": 2269} {"train_loss": -23.25141716003418, "global_step": 188332, "epoch": 2269} {"train_loss": -23.709632873535156, "global_step": 188333, "epoch": 2269} {"train_loss": -24.09331703186035, "global_step": 188334, "epoch": 2269} {"train_loss": -23.481229782104492, "global_step": 188335, "epoch": 2269} {"train_loss": -23.22651481628418, "global_step": 188336, "epoch": 2269} {"train_loss": -23.85503578186035, "global_step": 188337, "epoch": 2269} {"train_loss": -23.588275909423828, "global_step": 188338, "epoch": 2269} {"train_loss": -23.78934097290039, "global_step": 188339, "epoch": 2269} {"train_loss": -23.419187545776367, "global_step": 188340, "epoch": 2269} {"train_loss": -23.55821990966797, "global_step": 188341, "epoch": 2269} {"train_loss": -23.324243545532227, "global_step": 188342, "epoch": 2269} {"train_loss": -23.99875831604004, "global_step": 188343, "epoch": 2269} {"train_loss": -23.765464782714844, "global_step": 188344, "epoch": 2269} {"train_loss": -24.10162353515625, "global_step": 188345, "epoch": 2269} {"train_loss": -24.154699325561523, "global_step": 188346, "epoch": 2269} {"train_loss": -23.35843849182129, "global_step": 188347, "epoch": 2269} {"train_loss": -23.774534225463867, "global_step": 188348, "epoch": 2269} {"train_loss": -24.267362594604492, "global_step": 188349, "epoch": 2269} {"train_loss": -23.793447494506836, "global_step": 188350, "epoch": 2269} {"train_loss": -24.40168571472168, "global_step": 188351, "epoch": 2269} {"train_loss": -23.74228858947754, "global_step": 188352, "epoch": 2269} {"train_loss": -24.146135330200195, "global_step": 188353, "epoch": 2269} {"train_loss": -23.806364059448242, "global_step": 188354, "epoch": 2269} {"train_loss": -23.952539443969727, "global_step": 188355, "epoch": 2269} {"train_loss": -24.22154998779297, "global_step": 188356, "epoch": 2269} {"train_loss": -24.092981338500977, "global_step": 188357, "epoch": 2269} {"train_loss": -24.075698852539062, "global_step": 188358, "epoch": 2269} {"train_loss": -24.269113540649414, "global_step": 188359, "epoch": 2269} {"train_loss": -23.958072662353516, "global_step": 188360, "epoch": 2269} {"train_loss": -24.18875503540039, "global_step": 188361, "epoch": 2269} {"train_loss": -24.285776138305664, "global_step": 188362, "epoch": 2269} {"train_loss": -24.46189308166504, "global_step": 188363, "epoch": 2269} {"train_loss": -24.118221282958984, "global_step": 188364, "epoch": 2269} {"train_loss": -24.17329216003418, "global_step": 188365, "epoch": 2269} {"train_loss": -24.38739013671875, "global_step": 188366, "epoch": 2269} {"train_loss": -24.31423568725586, "global_step": 188367, "epoch": 2269} {"train_loss": -24.121234893798828, "global_step": 188368, "epoch": 2269} {"train_loss": -24.218013763427734, "global_step": 188369, "epoch": 2269} {"train_loss": -24.381135940551758, "global_step": 188370, "epoch": 2269} {"train_loss": -24.16359519958496, "global_step": 188371, "epoch": 2269} {"train_loss": -24.083402633666992, "global_step": 188372, "epoch": 2269} {"train_loss": -24.008193969726562, "global_step": 188373, "epoch": 2269} {"train_loss": -23.552915573120117, "global_step": 188374, "epoch": 2269} {"train_loss": -23.819171905517578, "global_step": 188375, "epoch": 2269} {"train_loss": -23.939611434936523, "global_step": 188376, "epoch": 2269} {"train_loss": -24.10914421081543, "global_step": 188377, "epoch": 2269} {"train_loss": -23.89212989807129, "global_step": 188378, "epoch": 2269} {"train_loss": -23.821765899658203, "global_step": 188379, "epoch": 2269} {"train_loss": -24.05967140197754, "global_step": 188380, "epoch": 2269} {"train_loss": -23.857833862304688, "global_step": 188381, "epoch": 2269} {"train_loss": -24.320964813232422, "global_step": 188382, "epoch": 2269} {"train_loss": -23.663013458251953, "global_step": 188383, "epoch": 2269} {"train_loss": -24.087757110595703, "global_step": 188384, "epoch": 2269} {"train_loss": -23.885324478149414, "global_step": 188385, "epoch": 2269} {"train_loss": -23.924312591552734, "global_step": 188386, "epoch": 2269} {"train_loss": -24.008344650268555, "global_step": 188387, "epoch": 2269} {"train_loss": -23.664093017578125, "global_step": 188388, "epoch": 2269} {"train_loss": -24.34946632385254, "global_step": 188389, "epoch": 2269} {"train_loss": -24.26851463317871, "global_step": 188390, "epoch": 2269} {"train_loss": -23.917001724243164, "global_step": 188391, "epoch": 2269} {"train_loss": -24.18739891052246, "global_step": 188392, "epoch": 2269} {"train_loss": -24.065053939819336, "global_step": 188393, "epoch": 2269} {"train_loss": -24.19109535217285, "global_step": 188394, "epoch": 2269} {"train_loss": -23.855030059814453, "global_step": 188395, "epoch": 2269} {"train_loss": -24.07289695739746, "global_step": 188396, "epoch": 2269} {"train_loss": -24.250795364379883, "global_step": 188397, "epoch": 2269} {"train_loss": -24.0141544342041, "global_step": 188398, "epoch": 2269} {"train_loss": -24.64002799987793, "global_step": 188399, "epoch": 2269} {"train_loss": -24.210418701171875, "global_step": 188400, "epoch": 2269} {"train_loss": -24.084321975708008, "global_step": 188401, "epoch": 2269} {"train_loss": -24.158065795898438, "global_step": 188402, "epoch": 2269} {"train_loss": -23.980300903320312, "global_step": 188403, "epoch": 2269} {"train_loss": -24.158681869506836, "global_step": 188404, "epoch": 2269} {"train_loss": -24.201942443847656, "global_step": 188405, "epoch": 2269} {"train_loss": -24.085079193115234, "global_step": 188406, "epoch": 2269} {"train_loss": -24.105758666992188, "global_step": 188407, "epoch": 2269} {"train_loss": -23.991857528686523, "global_step": 188408, "epoch": 2269} {"train_loss": -23.963921604386297, "global_step": 188409, "epoch": 2269, "val_loss": 6588934.0} {"train_loss": -23.83666229248047, "global_step": 188410, "epoch": 2270} {"train_loss": -22.631677627563477, "global_step": 188411, "epoch": 2270} {"train_loss": -22.872440338134766, "global_step": 188412, "epoch": 2270} {"train_loss": -23.430692672729492, "global_step": 188413, "epoch": 2270} {"train_loss": -23.681732177734375, "global_step": 188414, "epoch": 2270} {"train_loss": -23.625080108642578, "global_step": 188415, "epoch": 2270} {"train_loss": -23.492292404174805, "global_step": 188416, "epoch": 2270} {"train_loss": -23.90094566345215, "global_step": 188417, "epoch": 2270} {"train_loss": -23.36770248413086, "global_step": 188418, "epoch": 2270} {"train_loss": -23.685800552368164, "global_step": 188419, "epoch": 2270} {"train_loss": -23.3512020111084, "global_step": 188420, "epoch": 2270} {"train_loss": -23.806867599487305, "global_step": 188421, "epoch": 2270} {"train_loss": -23.77117919921875, "global_step": 188422, "epoch": 2270} {"train_loss": -23.640335083007812, "global_step": 188423, "epoch": 2270} {"train_loss": -23.806499481201172, "global_step": 188424, "epoch": 2270} {"train_loss": -24.158994674682617, "global_step": 188425, "epoch": 2270} {"train_loss": -23.892141342163086, "global_step": 188426, "epoch": 2270} {"train_loss": -23.987396240234375, "global_step": 188427, "epoch": 2270} {"train_loss": -23.5954647064209, "global_step": 188428, "epoch": 2270} {"train_loss": -23.94454002380371, "global_step": 188429, "epoch": 2270} {"train_loss": -23.317493438720703, "global_step": 188430, "epoch": 2270} {"train_loss": -23.700885772705078, "global_step": 188431, "epoch": 2270} {"train_loss": -24.2405948638916, "global_step": 188432, "epoch": 2270} {"train_loss": -23.702701568603516, "global_step": 188433, "epoch": 2270} {"train_loss": -24.117345809936523, "global_step": 188434, "epoch": 2270} {"train_loss": -23.619693756103516, "global_step": 188435, "epoch": 2270} {"train_loss": -23.793704986572266, "global_step": 188436, "epoch": 2270} {"train_loss": -23.927749633789062, "global_step": 188437, "epoch": 2270} {"train_loss": -23.967308044433594, "global_step": 188438, "epoch": 2270} {"train_loss": -24.001554489135742, "global_step": 188439, "epoch": 2270} {"train_loss": -23.9422550201416, "global_step": 188440, "epoch": 2270} {"train_loss": -23.908666610717773, "global_step": 188441, "epoch": 2270} {"train_loss": -23.85920524597168, "global_step": 188442, "epoch": 2270} {"train_loss": -23.850133895874023, "global_step": 188443, "epoch": 2270} {"train_loss": -24.438596725463867, "global_step": 188444, "epoch": 2270} {"train_loss": -24.178058624267578, "global_step": 188445, "epoch": 2270} {"train_loss": -24.261743545532227, "global_step": 188446, "epoch": 2270} {"train_loss": -23.956750869750977, "global_step": 188447, "epoch": 2270} {"train_loss": -23.913665771484375, "global_step": 188448, "epoch": 2270} {"train_loss": -24.05257225036621, "global_step": 188449, "epoch": 2270} {"train_loss": -23.83070945739746, "global_step": 188450, "epoch": 2270} {"train_loss": -24.468950271606445, "global_step": 188451, "epoch": 2270} {"train_loss": -24.46920394897461, "global_step": 188452, "epoch": 2270} {"train_loss": -23.73508071899414, "global_step": 188453, "epoch": 2270} {"train_loss": -24.021535873413086, "global_step": 188454, "epoch": 2270} {"train_loss": -23.939950942993164, "global_step": 188455, "epoch": 2270} {"train_loss": -23.950824737548828, "global_step": 188456, "epoch": 2270} {"train_loss": -23.849599838256836, "global_step": 188457, "epoch": 2270} {"train_loss": -23.85861587524414, "global_step": 188458, "epoch": 2270} {"train_loss": -23.842960357666016, "global_step": 188459, "epoch": 2270} {"train_loss": -23.996843338012695, "global_step": 188460, "epoch": 2270} {"train_loss": -24.34333038330078, "global_step": 188461, "epoch": 2270} {"train_loss": -24.09931755065918, "global_step": 188462, "epoch": 2270} {"train_loss": -24.066162109375, "global_step": 188463, "epoch": 2270} {"train_loss": -23.90748405456543, "global_step": 188464, "epoch": 2270} {"train_loss": -24.3084716796875, "global_step": 188465, "epoch": 2270} {"train_loss": -24.106107711791992, "global_step": 188466, "epoch": 2270} {"train_loss": -24.127445220947266, "global_step": 188467, "epoch": 2270} {"train_loss": -24.209911346435547, "global_step": 188468, "epoch": 2270} {"train_loss": -24.29366111755371, "global_step": 188469, "epoch": 2270} {"train_loss": -24.31048583984375, "global_step": 188470, "epoch": 2270} {"train_loss": -23.94991111755371, "global_step": 188471, "epoch": 2270} {"train_loss": -24.037809371948242, "global_step": 188472, "epoch": 2270} {"train_loss": -24.238744735717773, "global_step": 188473, "epoch": 2270} {"train_loss": -24.33999252319336, "global_step": 188474, "epoch": 2270} {"train_loss": -24.370615005493164, "global_step": 188475, "epoch": 2270} {"train_loss": -24.14874839782715, "global_step": 188476, "epoch": 2270} {"train_loss": -24.373306274414062, "global_step": 188477, "epoch": 2270} {"train_loss": -24.0154972076416, "global_step": 188478, "epoch": 2270} {"train_loss": -24.5390682220459, "global_step": 188479, "epoch": 2270} {"train_loss": -24.35580825805664, "global_step": 188480, "epoch": 2270} {"train_loss": -24.474958419799805, "global_step": 188481, "epoch": 2270} {"train_loss": -24.149023056030273, "global_step": 188482, "epoch": 2270} {"train_loss": -24.196287155151367, "global_step": 188483, "epoch": 2270} {"train_loss": -24.408151626586914, "global_step": 188484, "epoch": 2270} {"train_loss": -24.09372329711914, "global_step": 188485, "epoch": 2270} {"train_loss": -24.48334312438965, "global_step": 188486, "epoch": 2270} {"train_loss": -24.189111709594727, "global_step": 188487, "epoch": 2270} {"train_loss": -23.65428352355957, "global_step": 188488, "epoch": 2270} {"train_loss": -24.430774688720703, "global_step": 188489, "epoch": 2270} {"train_loss": -24.19344711303711, "global_step": 188490, "epoch": 2270} {"train_loss": -24.00058364868164, "global_step": 188491, "epoch": 2270} {"train_loss": -23.989649807114198, "global_step": 188492, "epoch": 2270, "val_loss": 6565979.5} {"train_loss": -23.632095336914062, "global_step": 188493, "epoch": 2271} {"train_loss": -23.519824981689453, "global_step": 188494, "epoch": 2271} {"train_loss": -24.365686416625977, "global_step": 188495, "epoch": 2271} {"train_loss": -23.560440063476562, "global_step": 188496, "epoch": 2271} {"train_loss": -24.036062240600586, "global_step": 188497, "epoch": 2271} {"train_loss": -23.953256607055664, "global_step": 188498, "epoch": 2271} {"train_loss": -23.974576950073242, "global_step": 188499, "epoch": 2271} {"train_loss": -23.435400009155273, "global_step": 188500, "epoch": 2271} {"train_loss": -24.14711570739746, "global_step": 188501, "epoch": 2271} {"train_loss": -24.05282974243164, "global_step": 188502, "epoch": 2271} {"train_loss": -23.532058715820312, "global_step": 188503, "epoch": 2271} {"train_loss": -24.22365379333496, "global_step": 188504, "epoch": 2271} {"train_loss": -23.955570220947266, "global_step": 188505, "epoch": 2271} {"train_loss": -23.739839553833008, "global_step": 188506, "epoch": 2271} {"train_loss": -23.985387802124023, "global_step": 188507, "epoch": 2271} {"train_loss": -23.996679306030273, "global_step": 188508, "epoch": 2271} {"train_loss": -24.030515670776367, "global_step": 188509, "epoch": 2271} {"train_loss": -24.0307674407959, "global_step": 188510, "epoch": 2271} {"train_loss": -24.005399703979492, "global_step": 188511, "epoch": 2271} {"train_loss": -24.119577407836914, "global_step": 188512, "epoch": 2271} {"train_loss": -24.01090431213379, "global_step": 188513, "epoch": 2271} {"train_loss": -24.20672607421875, "global_step": 188514, "epoch": 2271} {"train_loss": -23.880170822143555, "global_step": 188515, "epoch": 2271} {"train_loss": -24.39143180847168, "global_step": 188516, "epoch": 2271} {"train_loss": -23.878313064575195, "global_step": 188517, "epoch": 2271} {"train_loss": -23.95313835144043, "global_step": 188518, "epoch": 2271} {"train_loss": -24.056310653686523, "global_step": 188519, "epoch": 2271} {"train_loss": -24.345998764038086, "global_step": 188520, "epoch": 2271} {"train_loss": -23.730878829956055, "global_step": 188521, "epoch": 2271} {"train_loss": -23.782323837280273, "global_step": 188522, "epoch": 2271} {"train_loss": -23.88360595703125, "global_step": 188523, "epoch": 2271} {"train_loss": -24.146854400634766, "global_step": 188524, "epoch": 2271} {"train_loss": -23.82904815673828, "global_step": 188525, "epoch": 2271} {"train_loss": -23.76729965209961, "global_step": 188526, "epoch": 2271} {"train_loss": -24.2034912109375, "global_step": 188527, "epoch": 2271} {"train_loss": -24.201841354370117, "global_step": 188528, "epoch": 2271} {"train_loss": -23.68584632873535, "global_step": 188529, "epoch": 2271} {"train_loss": -24.40618133544922, "global_step": 188530, "epoch": 2271} {"train_loss": -24.086050033569336, "global_step": 188531, "epoch": 2271} {"train_loss": -23.766878128051758, "global_step": 188532, "epoch": 2271} {"train_loss": -24.252506256103516, "global_step": 188533, "epoch": 2271} {"train_loss": -24.4187068939209, "global_step": 188534, "epoch": 2271} {"train_loss": -23.908939361572266, "global_step": 188535, "epoch": 2271} {"train_loss": -23.952152252197266, "global_step": 188536, "epoch": 2271} {"train_loss": -24.016864776611328, "global_step": 188537, "epoch": 2271} {"train_loss": -24.47304344177246, "global_step": 188538, "epoch": 2271} {"train_loss": -24.46150016784668, "global_step": 188539, "epoch": 2271} {"train_loss": -24.325992584228516, "global_step": 188540, "epoch": 2271} {"train_loss": -23.810972213745117, "global_step": 188541, "epoch": 2271} {"train_loss": -24.013580322265625, "global_step": 188542, "epoch": 2271} {"train_loss": -23.731948852539062, "global_step": 188543, "epoch": 2271} {"train_loss": -24.04447364807129, "global_step": 188544, "epoch": 2271} {"train_loss": -23.748920440673828, "global_step": 188545, "epoch": 2271} {"train_loss": -23.96491813659668, "global_step": 188546, "epoch": 2271} {"train_loss": -23.7277889251709, "global_step": 188547, "epoch": 2271} {"train_loss": -23.608234405517578, "global_step": 188548, "epoch": 2271} {"train_loss": -24.29347038269043, "global_step": 188549, "epoch": 2271} {"train_loss": -23.78090476989746, "global_step": 188550, "epoch": 2271} {"train_loss": -23.6945858001709, "global_step": 188551, "epoch": 2271} {"train_loss": -24.24563980102539, "global_step": 188552, "epoch": 2271} {"train_loss": -24.012226104736328, "global_step": 188553, "epoch": 2271} {"train_loss": -23.702713012695312, "global_step": 188554, "epoch": 2271} {"train_loss": -24.105497360229492, "global_step": 188555, "epoch": 2271} {"train_loss": -24.023927688598633, "global_step": 188556, "epoch": 2271} {"train_loss": -23.891355514526367, "global_step": 188557, "epoch": 2271} {"train_loss": -23.933374404907227, "global_step": 188558, "epoch": 2271} {"train_loss": -24.185346603393555, "global_step": 188559, "epoch": 2271} {"train_loss": -23.756086349487305, "global_step": 188560, "epoch": 2271} {"train_loss": -24.217750549316406, "global_step": 188561, "epoch": 2271} {"train_loss": -24.1287899017334, "global_step": 188562, "epoch": 2271} {"train_loss": -24.342309951782227, "global_step": 188563, "epoch": 2271} {"train_loss": -24.28590965270996, "global_step": 188564, "epoch": 2271} {"train_loss": -24.11793327331543, "global_step": 188565, "epoch": 2271} {"train_loss": -24.155302047729492, "global_step": 188566, "epoch": 2271} {"train_loss": -24.113988876342773, "global_step": 188567, "epoch": 2271} {"train_loss": -24.136274337768555, "global_step": 188568, "epoch": 2271} {"train_loss": -24.097455978393555, "global_step": 188569, "epoch": 2271} {"train_loss": -24.157867431640625, "global_step": 188570, "epoch": 2271} {"train_loss": -24.32423210144043, "global_step": 188571, "epoch": 2271} {"train_loss": -23.98902702331543, "global_step": 188572, "epoch": 2271} {"train_loss": -23.600814819335938, "global_step": 188573, "epoch": 2271} {"train_loss": -23.55367088317871, "global_step": 188574, "epoch": 2271} {"train_loss": -24.022559522146203, "global_step": 188575, "epoch": 2271, "val_loss": 6577064.0} {"train_loss": -23.40244483947754, "global_step": 188576, "epoch": 2272} {"train_loss": -23.915592193603516, "global_step": 188577, "epoch": 2272} {"train_loss": -23.585561752319336, "global_step": 188578, "epoch": 2272} {"train_loss": -23.525358200073242, "global_step": 188579, "epoch": 2272} {"train_loss": -23.252622604370117, "global_step": 188580, "epoch": 2272} {"train_loss": -23.82720947265625, "global_step": 188581, "epoch": 2272} {"train_loss": -23.64884376525879, "global_step": 188582, "epoch": 2272} {"train_loss": -23.763275146484375, "global_step": 188583, "epoch": 2272} {"train_loss": -22.995859146118164, "global_step": 188584, "epoch": 2272} {"train_loss": -23.826440811157227, "global_step": 188585, "epoch": 2272} {"train_loss": -23.364032745361328, "global_step": 188586, "epoch": 2272} {"train_loss": -23.401348114013672, "global_step": 188587, "epoch": 2272} {"train_loss": -24.160186767578125, "global_step": 188588, "epoch": 2272} {"train_loss": -23.61400032043457, "global_step": 188589, "epoch": 2272} {"train_loss": -23.9304256439209, "global_step": 188590, "epoch": 2272} {"train_loss": -23.65807342529297, "global_step": 188591, "epoch": 2272} {"train_loss": -23.494115829467773, "global_step": 188592, "epoch": 2272} {"train_loss": -23.779958724975586, "global_step": 188593, "epoch": 2272} {"train_loss": -23.755584716796875, "global_step": 188594, "epoch": 2272} {"train_loss": -23.428436279296875, "global_step": 188595, "epoch": 2272} {"train_loss": -23.9781551361084, "global_step": 188596, "epoch": 2272} {"train_loss": -23.627822875976562, "global_step": 188597, "epoch": 2272} {"train_loss": -23.41545295715332, "global_step": 188598, "epoch": 2272} {"train_loss": -24.31302261352539, "global_step": 188599, "epoch": 2272} {"train_loss": -24.109983444213867, "global_step": 188600, "epoch": 2272} {"train_loss": -23.92384147644043, "global_step": 188601, "epoch": 2272} {"train_loss": -24.069442749023438, "global_step": 188602, "epoch": 2272} {"train_loss": -23.929813385009766, "global_step": 188603, "epoch": 2272} {"train_loss": -24.057170867919922, "global_step": 188604, "epoch": 2272} {"train_loss": -23.697940826416016, "global_step": 188605, "epoch": 2272} {"train_loss": -23.883996963500977, "global_step": 188606, "epoch": 2272} {"train_loss": -24.296772003173828, "global_step": 188607, "epoch": 2272} {"train_loss": -24.11720848083496, "global_step": 188608, "epoch": 2272} {"train_loss": -23.80604362487793, "global_step": 188609, "epoch": 2272} {"train_loss": -23.9179744720459, "global_step": 188610, "epoch": 2272} {"train_loss": -24.14045524597168, "global_step": 188611, "epoch": 2272} {"train_loss": -24.453075408935547, "global_step": 188612, "epoch": 2272} {"train_loss": -24.2576904296875, "global_step": 188613, "epoch": 2272} {"train_loss": -23.908674240112305, "global_step": 188614, "epoch": 2272} {"train_loss": -23.928831100463867, "global_step": 188615, "epoch": 2272} {"train_loss": -23.862262725830078, "global_step": 188616, "epoch": 2272} {"train_loss": -24.46630096435547, "global_step": 188617, "epoch": 2272} {"train_loss": -23.698989868164062, "global_step": 188618, "epoch": 2272} {"train_loss": -24.096555709838867, "global_step": 188619, "epoch": 2272} {"train_loss": -24.015613555908203, "global_step": 188620, "epoch": 2272} {"train_loss": -24.2727108001709, "global_step": 188621, "epoch": 2272} {"train_loss": -24.171585083007812, "global_step": 188622, "epoch": 2272} {"train_loss": -24.042875289916992, "global_step": 188623, "epoch": 2272} {"train_loss": -24.164735794067383, "global_step": 188624, "epoch": 2272} {"train_loss": -23.378799438476562, "global_step": 188625, "epoch": 2272} {"train_loss": -24.378097534179688, "global_step": 188626, "epoch": 2272} {"train_loss": -23.977434158325195, "global_step": 188627, "epoch": 2272} {"train_loss": -23.467586517333984, "global_step": 188628, "epoch": 2272} {"train_loss": -23.9425106048584, "global_step": 188629, "epoch": 2272} {"train_loss": -24.162826538085938, "global_step": 188630, "epoch": 2272} {"train_loss": -24.059226989746094, "global_step": 188631, "epoch": 2272} {"train_loss": -23.99161720275879, "global_step": 188632, "epoch": 2272} {"train_loss": -23.865514755249023, "global_step": 188633, "epoch": 2272} {"train_loss": -24.07600212097168, "global_step": 188634, "epoch": 2272} {"train_loss": -23.854001998901367, "global_step": 188635, "epoch": 2272} {"train_loss": -24.192625045776367, "global_step": 188636, "epoch": 2272} {"train_loss": -24.4241943359375, "global_step": 188637, "epoch": 2272} {"train_loss": -23.983108520507812, "global_step": 188638, "epoch": 2272} {"train_loss": -24.325820922851562, "global_step": 188639, "epoch": 2272} {"train_loss": -24.014524459838867, "global_step": 188640, "epoch": 2272} {"train_loss": -24.352542877197266, "global_step": 188641, "epoch": 2272} {"train_loss": -24.15230369567871, "global_step": 188642, "epoch": 2272} {"train_loss": -24.127479553222656, "global_step": 188643, "epoch": 2272} {"train_loss": -24.210195541381836, "global_step": 188644, "epoch": 2272} {"train_loss": -24.015798568725586, "global_step": 188645, "epoch": 2272} {"train_loss": -24.236894607543945, "global_step": 188646, "epoch": 2272} {"train_loss": -24.322240829467773, "global_step": 188647, "epoch": 2272} {"train_loss": -23.577911376953125, "global_step": 188648, "epoch": 2272} {"train_loss": -23.9798583984375, "global_step": 188649, "epoch": 2272} {"train_loss": -24.3559513092041, "global_step": 188650, "epoch": 2272} {"train_loss": -24.19761085510254, "global_step": 188651, "epoch": 2272} {"train_loss": -24.184146881103516, "global_step": 188652, "epoch": 2272} {"train_loss": -24.300146102905273, "global_step": 188653, "epoch": 2272} {"train_loss": -24.355539321899414, "global_step": 188654, "epoch": 2272} {"train_loss": -24.145681381225586, "global_step": 188655, "epoch": 2272} {"train_loss": -23.94563865661621, "global_step": 188656, "epoch": 2272} {"train_loss": -23.910987854003906, "global_step": 188657, "epoch": 2272} {"train_loss": -23.97065585492605, "global_step": 188658, "epoch": 2272, "val_loss": 6617841.0} {"train_loss": -23.605243682861328, "global_step": 188659, "epoch": 2273} {"train_loss": -23.697280883789062, "global_step": 188660, "epoch": 2273} {"train_loss": -23.121503829956055, "global_step": 188661, "epoch": 2273} {"train_loss": -23.655210494995117, "global_step": 188662, "epoch": 2273} {"train_loss": -23.87531852722168, "global_step": 188663, "epoch": 2273} {"train_loss": -23.777135848999023, "global_step": 188664, "epoch": 2273} {"train_loss": -23.64576530456543, "global_step": 188665, "epoch": 2273} {"train_loss": -23.5203800201416, "global_step": 188666, "epoch": 2273} {"train_loss": -23.75531578063965, "global_step": 188667, "epoch": 2273} {"train_loss": -23.699565887451172, "global_step": 188668, "epoch": 2273} {"train_loss": -23.472681045532227, "global_step": 188669, "epoch": 2273} {"train_loss": -23.8944091796875, "global_step": 188670, "epoch": 2273} {"train_loss": -23.598011016845703, "global_step": 188671, "epoch": 2273} {"train_loss": -23.835546493530273, "global_step": 188672, "epoch": 2273} {"train_loss": -24.004060745239258, "global_step": 188673, "epoch": 2273} {"train_loss": -23.883411407470703, "global_step": 188674, "epoch": 2273} {"train_loss": -23.86411476135254, "global_step": 188675, "epoch": 2273} {"train_loss": -23.989118576049805, "global_step": 188676, "epoch": 2273} {"train_loss": -23.816099166870117, "global_step": 188677, "epoch": 2273} {"train_loss": -23.958148956298828, "global_step": 188678, "epoch": 2273} {"train_loss": -24.23154640197754, "global_step": 188679, "epoch": 2273} {"train_loss": -23.921091079711914, "global_step": 188680, "epoch": 2273} {"train_loss": -23.802846908569336, "global_step": 188681, "epoch": 2273} {"train_loss": -23.97125816345215, "global_step": 188682, "epoch": 2273} {"train_loss": -23.760608673095703, "global_step": 188683, "epoch": 2273} {"train_loss": -24.225692749023438, "global_step": 188684, "epoch": 2273} {"train_loss": -24.30840492248535, "global_step": 188685, "epoch": 2273} {"train_loss": -23.706954956054688, "global_step": 188686, "epoch": 2273} {"train_loss": -24.029630661010742, "global_step": 188687, "epoch": 2273} {"train_loss": -24.213422775268555, "global_step": 188688, "epoch": 2273} {"train_loss": -24.205810546875, "global_step": 188689, "epoch": 2273} {"train_loss": -24.17186164855957, "global_step": 188690, "epoch": 2273} {"train_loss": -23.876911163330078, "global_step": 188691, "epoch": 2273} {"train_loss": -24.348291397094727, "global_step": 188692, "epoch": 2273} {"train_loss": -23.82215690612793, "global_step": 188693, "epoch": 2273} {"train_loss": -24.133634567260742, "global_step": 188694, "epoch": 2273} {"train_loss": -24.0391902923584, "global_step": 188695, "epoch": 2273} {"train_loss": -24.172117233276367, "global_step": 188696, "epoch": 2273} {"train_loss": -23.957975387573242, "global_step": 188697, "epoch": 2273} {"train_loss": -24.229412078857422, "global_step": 188698, "epoch": 2273} {"train_loss": -24.061092376708984, "global_step": 188699, "epoch": 2273} {"train_loss": -24.143070220947266, "global_step": 188700, "epoch": 2273} {"train_loss": -24.487085342407227, "global_step": 188701, "epoch": 2273} {"train_loss": -23.953414916992188, "global_step": 188702, "epoch": 2273} {"train_loss": -24.1967716217041, "global_step": 188703, "epoch": 2273} {"train_loss": -24.232519149780273, "global_step": 188704, "epoch": 2273} {"train_loss": -24.343332290649414, "global_step": 188705, "epoch": 2273} {"train_loss": -24.47633171081543, "global_step": 188706, "epoch": 2273} {"train_loss": -24.312314987182617, "global_step": 188707, "epoch": 2273} {"train_loss": -24.005186080932617, "global_step": 188708, "epoch": 2273} {"train_loss": -24.036540985107422, "global_step": 188709, "epoch": 2273} {"train_loss": -24.47743034362793, "global_step": 188710, "epoch": 2273} {"train_loss": -24.002376556396484, "global_step": 188711, "epoch": 2273} {"train_loss": -24.51935386657715, "global_step": 188712, "epoch": 2273} {"train_loss": -24.0424861907959, "global_step": 188713, "epoch": 2273} {"train_loss": -23.816923141479492, "global_step": 188714, "epoch": 2273} {"train_loss": -23.958951950073242, "global_step": 188715, "epoch": 2273} {"train_loss": -24.198028564453125, "global_step": 188716, "epoch": 2273} {"train_loss": -24.48630714416504, "global_step": 188717, "epoch": 2273} {"train_loss": -24.2822322845459, "global_step": 188718, "epoch": 2273} {"train_loss": -24.231515884399414, "global_step": 188719, "epoch": 2273} {"train_loss": -24.365570068359375, "global_step": 188720, "epoch": 2273} {"train_loss": -24.014545440673828, "global_step": 188721, "epoch": 2273} {"train_loss": -24.063461303710938, "global_step": 188722, "epoch": 2273} {"train_loss": -24.080415725708008, "global_step": 188723, "epoch": 2273} {"train_loss": -24.11848258972168, "global_step": 188724, "epoch": 2273} {"train_loss": -24.47328758239746, "global_step": 188725, "epoch": 2273} {"train_loss": -24.207067489624023, "global_step": 188726, "epoch": 2273} {"train_loss": -24.309362411499023, "global_step": 188727, "epoch": 2273} {"train_loss": -24.02267074584961, "global_step": 188728, "epoch": 2273} {"train_loss": -23.069015502929688, "global_step": 188729, "epoch": 2273} {"train_loss": -23.093652725219727, "global_step": 188730, "epoch": 2273} {"train_loss": -23.29360008239746, "global_step": 188731, "epoch": 2273} {"train_loss": -24.068323135375977, "global_step": 188732, "epoch": 2273} {"train_loss": -23.4785099029541, "global_step": 188733, "epoch": 2273} {"train_loss": -23.612457275390625, "global_step": 188734, "epoch": 2273} {"train_loss": -23.92221450805664, "global_step": 188735, "epoch": 2273} {"train_loss": -24.03188133239746, "global_step": 188736, "epoch": 2273} {"train_loss": -23.737953186035156, "global_step": 188737, "epoch": 2273} {"train_loss": -23.630617141723633, "global_step": 188738, "epoch": 2273} {"train_loss": -24.16752052307129, "global_step": 188739, "epoch": 2273} {"train_loss": -23.859121322631836, "global_step": 188740, "epoch": 2273} {"train_loss": -23.963884169796863, "global_step": 188741, "epoch": 2273, "val_loss": 6533749.0} {"train_loss": -24.036449432373047, "global_step": 188742, "epoch": 2274} {"train_loss": -24.06800079345703, "global_step": 188743, "epoch": 2274} {"train_loss": -23.945358276367188, "global_step": 188744, "epoch": 2274} {"train_loss": -23.885164260864258, "global_step": 188745, "epoch": 2274} {"train_loss": -23.80433464050293, "global_step": 188746, "epoch": 2274} {"train_loss": -23.98546028137207, "global_step": 188747, "epoch": 2274} {"train_loss": -23.76220703125, "global_step": 188748, "epoch": 2274} {"train_loss": -23.3961181640625, "global_step": 188749, "epoch": 2274} {"train_loss": -24.135229110717773, "global_step": 188750, "epoch": 2274} {"train_loss": -23.96550941467285, "global_step": 188751, "epoch": 2274} {"train_loss": -23.788480758666992, "global_step": 188752, "epoch": 2274} {"train_loss": -24.41387367248535, "global_step": 188753, "epoch": 2274} {"train_loss": -24.086591720581055, "global_step": 188754, "epoch": 2274} {"train_loss": -24.420597076416016, "global_step": 188755, "epoch": 2274} {"train_loss": -24.0545597076416, "global_step": 188756, "epoch": 2274} {"train_loss": -24.24904441833496, "global_step": 188757, "epoch": 2274} {"train_loss": -24.203927993774414, "global_step": 188758, "epoch": 2274} {"train_loss": -23.93448829650879, "global_step": 188759, "epoch": 2274} {"train_loss": -24.26180076599121, "global_step": 188760, "epoch": 2274} {"train_loss": -24.333240509033203, "global_step": 188761, "epoch": 2274} {"train_loss": -24.024791717529297, "global_step": 188762, "epoch": 2274} {"train_loss": -24.30071449279785, "global_step": 188763, "epoch": 2274} {"train_loss": -24.05455780029297, "global_step": 188764, "epoch": 2274} {"train_loss": -24.247478485107422, "global_step": 188765, "epoch": 2274} {"train_loss": -24.13534927368164, "global_step": 188766, "epoch": 2274} {"train_loss": -23.6922664642334, "global_step": 188767, "epoch": 2274} {"train_loss": -24.17963218688965, "global_step": 188768, "epoch": 2274} {"train_loss": -23.984718322753906, "global_step": 188769, "epoch": 2274} {"train_loss": -24.063720703125, "global_step": 188770, "epoch": 2274} {"train_loss": -23.79631996154785, "global_step": 188771, "epoch": 2274} {"train_loss": -23.66478157043457, "global_step": 188772, "epoch": 2274} {"train_loss": -23.881973266601562, "global_step": 188773, "epoch": 2274} {"train_loss": -24.01215362548828, "global_step": 188774, "epoch": 2274} {"train_loss": -23.83245849609375, "global_step": 188775, "epoch": 2274} {"train_loss": -24.3170166015625, "global_step": 188776, "epoch": 2274} {"train_loss": -23.847837448120117, "global_step": 188777, "epoch": 2274} {"train_loss": -24.217817306518555, "global_step": 188778, "epoch": 2274} {"train_loss": -24.252836227416992, "global_step": 188779, "epoch": 2274} {"train_loss": -24.446718215942383, "global_step": 188780, "epoch": 2274} {"train_loss": -24.0575008392334, "global_step": 188781, "epoch": 2274} {"train_loss": -23.838571548461914, "global_step": 188782, "epoch": 2274} {"train_loss": -23.998804092407227, "global_step": 188783, "epoch": 2274} {"train_loss": -23.95490074157715, "global_step": 188784, "epoch": 2274} {"train_loss": -23.960046768188477, "global_step": 188785, "epoch": 2274} {"train_loss": -24.039155960083008, "global_step": 188786, "epoch": 2274} {"train_loss": -24.249479293823242, "global_step": 188787, "epoch": 2274} {"train_loss": -23.957120895385742, "global_step": 188788, "epoch": 2274} {"train_loss": -24.00740623474121, "global_step": 188789, "epoch": 2274} {"train_loss": -24.0185546875, "global_step": 188790, "epoch": 2274} {"train_loss": -24.3637752532959, "global_step": 188791, "epoch": 2274} {"train_loss": -23.89330291748047, "global_step": 188792, "epoch": 2274} {"train_loss": -24.01801109313965, "global_step": 188793, "epoch": 2274} {"train_loss": -24.463727951049805, "global_step": 188794, "epoch": 2274} {"train_loss": -24.412187576293945, "global_step": 188795, "epoch": 2274} {"train_loss": -24.101476669311523, "global_step": 188796, "epoch": 2274} {"train_loss": -23.9660701751709, "global_step": 188797, "epoch": 2274} {"train_loss": -24.22881507873535, "global_step": 188798, "epoch": 2274} {"train_loss": -24.09288787841797, "global_step": 188799, "epoch": 2274} {"train_loss": -24.198413848876953, "global_step": 188800, "epoch": 2274} {"train_loss": -24.18453025817871, "global_step": 188801, "epoch": 2274} {"train_loss": -23.89643669128418, "global_step": 188802, "epoch": 2274} {"train_loss": -23.914037704467773, "global_step": 188803, "epoch": 2274} {"train_loss": -24.055652618408203, "global_step": 188804, "epoch": 2274} {"train_loss": -24.145660400390625, "global_step": 188805, "epoch": 2274} {"train_loss": -23.15778160095215, "global_step": 188806, "epoch": 2274} {"train_loss": -22.79499626159668, "global_step": 188807, "epoch": 2274} {"train_loss": -23.691661834716797, "global_step": 188808, "epoch": 2274} {"train_loss": -23.838031768798828, "global_step": 188809, "epoch": 2274} {"train_loss": -23.79179573059082, "global_step": 188810, "epoch": 2274} {"train_loss": -23.514219284057617, "global_step": 188811, "epoch": 2274} {"train_loss": -23.757431030273438, "global_step": 188812, "epoch": 2274} {"train_loss": -24.406631469726562, "global_step": 188813, "epoch": 2274} {"train_loss": -23.78912925720215, "global_step": 188814, "epoch": 2274} {"train_loss": -22.91860008239746, "global_step": 188815, "epoch": 2274} {"train_loss": -24.367313385009766, "global_step": 188816, "epoch": 2274} {"train_loss": -23.38123321533203, "global_step": 188817, "epoch": 2274} {"train_loss": -24.014179229736328, "global_step": 188818, "epoch": 2274} {"train_loss": -24.072484970092773, "global_step": 188819, "epoch": 2274} {"train_loss": -24.46278190612793, "global_step": 188820, "epoch": 2274} {"train_loss": -23.83072280883789, "global_step": 188821, "epoch": 2274} {"train_loss": -23.800100326538086, "global_step": 188822, "epoch": 2274} {"train_loss": -23.59925079345703, "global_step": 188823, "epoch": 2274} {"train_loss": -23.999078061207232, "global_step": 188824, "epoch": 2274, "val_loss": 6504498.0} {"train_loss": -23.213993072509766, "global_step": 188825, "epoch": 2275} {"train_loss": -23.902023315429688, "global_step": 188826, "epoch": 2275} {"train_loss": -23.401765823364258, "global_step": 188827, "epoch": 2275} {"train_loss": -23.59752655029297, "global_step": 188828, "epoch": 2275} {"train_loss": -23.983552932739258, "global_step": 188829, "epoch": 2275} {"train_loss": -23.30122947692871, "global_step": 188830, "epoch": 2275} {"train_loss": -23.555870056152344, "global_step": 188831, "epoch": 2275} {"train_loss": -23.7630558013916, "global_step": 188832, "epoch": 2275} {"train_loss": -23.761783599853516, "global_step": 188833, "epoch": 2275} {"train_loss": -24.006853103637695, "global_step": 188834, "epoch": 2275} {"train_loss": -23.907079696655273, "global_step": 188835, "epoch": 2275} {"train_loss": -24.039478302001953, "global_step": 188836, "epoch": 2275} {"train_loss": -23.99843978881836, "global_step": 188837, "epoch": 2275} {"train_loss": -23.724088668823242, "global_step": 188838, "epoch": 2275} {"train_loss": -23.84566307067871, "global_step": 188839, "epoch": 2275} {"train_loss": -23.982168197631836, "global_step": 188840, "epoch": 2275} {"train_loss": -24.11313819885254, "global_step": 188841, "epoch": 2275} {"train_loss": -23.70645523071289, "global_step": 188842, "epoch": 2275} {"train_loss": -24.179244995117188, "global_step": 188843, "epoch": 2275} {"train_loss": -23.80696678161621, "global_step": 188844, "epoch": 2275} {"train_loss": -23.966842651367188, "global_step": 188845, "epoch": 2275} {"train_loss": -24.067502975463867, "global_step": 188846, "epoch": 2275} {"train_loss": -23.83661460876465, "global_step": 188847, "epoch": 2275} {"train_loss": -23.839496612548828, "global_step": 188848, "epoch": 2275} {"train_loss": -24.154584884643555, "global_step": 188849, "epoch": 2275} {"train_loss": -24.249271392822266, "global_step": 188850, "epoch": 2275} {"train_loss": -23.90582847595215, "global_step": 188851, "epoch": 2275} {"train_loss": -24.226795196533203, "global_step": 188852, "epoch": 2275} {"train_loss": -24.051895141601562, "global_step": 188853, "epoch": 2275} {"train_loss": -23.673423767089844, "global_step": 188854, "epoch": 2275} {"train_loss": -24.118404388427734, "global_step": 188855, "epoch": 2275} {"train_loss": -24.127227783203125, "global_step": 188856, "epoch": 2275} {"train_loss": -24.015579223632812, "global_step": 188857, "epoch": 2275} {"train_loss": -24.028640747070312, "global_step": 188858, "epoch": 2275} {"train_loss": -23.877714157104492, "global_step": 188859, "epoch": 2275} {"train_loss": -24.00563621520996, "global_step": 188860, "epoch": 2275} {"train_loss": -23.787630081176758, "global_step": 188861, "epoch": 2275} {"train_loss": -24.502798080444336, "global_step": 188862, "epoch": 2275} {"train_loss": -24.31005096435547, "global_step": 188863, "epoch": 2275} {"train_loss": -24.230953216552734, "global_step": 188864, "epoch": 2275} {"train_loss": -24.31098747253418, "global_step": 188865, "epoch": 2275} {"train_loss": -24.022602081298828, "global_step": 188866, "epoch": 2275} {"train_loss": -23.90671157836914, "global_step": 188867, "epoch": 2275} {"train_loss": -24.592741012573242, "global_step": 188868, "epoch": 2275} {"train_loss": -24.218732833862305, "global_step": 188869, "epoch": 2275} {"train_loss": -23.763168334960938, "global_step": 188870, "epoch": 2275} {"train_loss": -24.67466163635254, "global_step": 188871, "epoch": 2275} {"train_loss": -23.961273193359375, "global_step": 188872, "epoch": 2275} {"train_loss": -23.977018356323242, "global_step": 188873, "epoch": 2275} {"train_loss": -24.36236000061035, "global_step": 188874, "epoch": 2275} {"train_loss": -24.13010025024414, "global_step": 188875, "epoch": 2275} {"train_loss": -23.861997604370117, "global_step": 188876, "epoch": 2275} {"train_loss": -23.723936080932617, "global_step": 188877, "epoch": 2275} {"train_loss": -24.17574119567871, "global_step": 188878, "epoch": 2275} {"train_loss": -24.333715438842773, "global_step": 188879, "epoch": 2275} {"train_loss": -24.12993812561035, "global_step": 188880, "epoch": 2275} {"train_loss": -23.803377151489258, "global_step": 188881, "epoch": 2275} {"train_loss": -24.025876998901367, "global_step": 188882, "epoch": 2275} {"train_loss": -24.018796920776367, "global_step": 188883, "epoch": 2275} {"train_loss": -23.94272804260254, "global_step": 188884, "epoch": 2275} {"train_loss": -24.371164321899414, "global_step": 188885, "epoch": 2275} {"train_loss": -24.39243507385254, "global_step": 188886, "epoch": 2275} {"train_loss": -24.543094635009766, "global_step": 188887, "epoch": 2275} {"train_loss": -24.176273345947266, "global_step": 188888, "epoch": 2275} {"train_loss": -23.837299346923828, "global_step": 188889, "epoch": 2275} {"train_loss": -24.05777359008789, "global_step": 188890, "epoch": 2275} {"train_loss": -23.896963119506836, "global_step": 188891, "epoch": 2275} {"train_loss": -23.939579010009766, "global_step": 188892, "epoch": 2275} {"train_loss": -24.01170539855957, "global_step": 188893, "epoch": 2275} {"train_loss": -24.260595321655273, "global_step": 188894, "epoch": 2275} {"train_loss": -24.048547744750977, "global_step": 188895, "epoch": 2275} {"train_loss": -23.990665435791016, "global_step": 188896, "epoch": 2275} {"train_loss": -23.721914291381836, "global_step": 188897, "epoch": 2275} {"train_loss": -24.056055068969727, "global_step": 188898, "epoch": 2275} {"train_loss": -24.374197006225586, "global_step": 188899, "epoch": 2275} {"train_loss": -24.016332626342773, "global_step": 188900, "epoch": 2275} {"train_loss": -24.290464401245117, "global_step": 188901, "epoch": 2275} {"train_loss": -23.994436264038086, "global_step": 188902, "epoch": 2275} {"train_loss": -24.14346694946289, "global_step": 188903, "epoch": 2275} {"train_loss": -24.28719139099121, "global_step": 188904, "epoch": 2275} {"train_loss": -24.295042037963867, "global_step": 188905, "epoch": 2275} {"train_loss": -23.896879196166992, "global_step": 188906, "epoch": 2275} {"train_loss": -24.028635323765766, "global_step": 188907, "epoch": 2275, "val_loss": 6512473.5} {"train_loss": -22.979736328125, "global_step": 188908, "epoch": 2276} {"train_loss": -22.531217575073242, "global_step": 188909, "epoch": 2276} {"train_loss": -23.09833335876465, "global_step": 188910, "epoch": 2276} {"train_loss": -22.603778839111328, "global_step": 188911, "epoch": 2276} {"train_loss": -23.200237274169922, "global_step": 188912, "epoch": 2276} {"train_loss": -23.6401309967041, "global_step": 188913, "epoch": 2276} {"train_loss": -23.224395751953125, "global_step": 188914, "epoch": 2276} {"train_loss": -23.35013771057129, "global_step": 188915, "epoch": 2276} {"train_loss": -23.830162048339844, "global_step": 188916, "epoch": 2276} {"train_loss": -23.391448974609375, "global_step": 188917, "epoch": 2276} {"train_loss": -23.400758743286133, "global_step": 188918, "epoch": 2276} {"train_loss": -23.42799186706543, "global_step": 188919, "epoch": 2276} {"train_loss": -23.79326629638672, "global_step": 188920, "epoch": 2276} {"train_loss": -23.600481033325195, "global_step": 188921, "epoch": 2276} {"train_loss": -23.620628356933594, "global_step": 188922, "epoch": 2276} {"train_loss": -23.681854248046875, "global_step": 188923, "epoch": 2276} {"train_loss": -23.542068481445312, "global_step": 188924, "epoch": 2276} {"train_loss": -23.848676681518555, "global_step": 188925, "epoch": 2276} {"train_loss": -23.17974853515625, "global_step": 188926, "epoch": 2276} {"train_loss": -23.695280075073242, "global_step": 188927, "epoch": 2276} {"train_loss": -23.64216423034668, "global_step": 188928, "epoch": 2276} {"train_loss": -23.458187103271484, "global_step": 188929, "epoch": 2276} {"train_loss": -23.857990264892578, "global_step": 188930, "epoch": 2276} {"train_loss": -23.37616539001465, "global_step": 188931, "epoch": 2276} {"train_loss": -23.688688278198242, "global_step": 188932, "epoch": 2276} {"train_loss": -23.09903907775879, "global_step": 188933, "epoch": 2276} {"train_loss": -23.96986961364746, "global_step": 188934, "epoch": 2276} {"train_loss": -24.176054000854492, "global_step": 188935, "epoch": 2276} {"train_loss": -23.91995620727539, "global_step": 188936, "epoch": 2276} {"train_loss": -24.025014877319336, "global_step": 188937, "epoch": 2276} {"train_loss": -23.63570213317871, "global_step": 188938, "epoch": 2276} {"train_loss": -24.167293548583984, "global_step": 188939, "epoch": 2276} {"train_loss": -23.987285614013672, "global_step": 188940, "epoch": 2276} {"train_loss": -23.732494354248047, "global_step": 188941, "epoch": 2276} {"train_loss": -24.45710563659668, "global_step": 188942, "epoch": 2276} {"train_loss": -23.597034454345703, "global_step": 188943, "epoch": 2276} {"train_loss": -23.898038864135742, "global_step": 188944, "epoch": 2276} {"train_loss": -24.31879997253418, "global_step": 188945, "epoch": 2276} {"train_loss": -23.63010597229004, "global_step": 188946, "epoch": 2276} {"train_loss": -23.951112747192383, "global_step": 188947, "epoch": 2276} {"train_loss": -24.179105758666992, "global_step": 188948, "epoch": 2276} {"train_loss": -23.91878318786621, "global_step": 188949, "epoch": 2276} {"train_loss": -24.135251998901367, "global_step": 188950, "epoch": 2276} {"train_loss": -24.654844284057617, "global_step": 188951, "epoch": 2276} {"train_loss": -24.135602951049805, "global_step": 188952, "epoch": 2276} {"train_loss": -23.968124389648438, "global_step": 188953, "epoch": 2276} {"train_loss": -24.058828353881836, "global_step": 188954, "epoch": 2276} {"train_loss": -24.244873046875, "global_step": 188955, "epoch": 2276} {"train_loss": -24.20749855041504, "global_step": 188956, "epoch": 2276} {"train_loss": -23.856258392333984, "global_step": 188957, "epoch": 2276} {"train_loss": -23.923107147216797, "global_step": 188958, "epoch": 2276} {"train_loss": -24.291751861572266, "global_step": 188959, "epoch": 2276} {"train_loss": -23.996442794799805, "global_step": 188960, "epoch": 2276} {"train_loss": -24.232975006103516, "global_step": 188961, "epoch": 2276} {"train_loss": -24.125991821289062, "global_step": 188962, "epoch": 2276} {"train_loss": -23.94135093688965, "global_step": 188963, "epoch": 2276} {"train_loss": -24.07611846923828, "global_step": 188964, "epoch": 2276} {"train_loss": -24.383377075195312, "global_step": 188965, "epoch": 2276} {"train_loss": -24.054819107055664, "global_step": 188966, "epoch": 2276} {"train_loss": -24.67443084716797, "global_step": 188967, "epoch": 2276} {"train_loss": -23.803247451782227, "global_step": 188968, "epoch": 2276} {"train_loss": -23.94415855407715, "global_step": 188969, "epoch": 2276} {"train_loss": -24.27543067932129, "global_step": 188970, "epoch": 2276} {"train_loss": -24.020835876464844, "global_step": 188971, "epoch": 2276} {"train_loss": -24.14363670349121, "global_step": 188972, "epoch": 2276} {"train_loss": -23.644453048706055, "global_step": 188973, "epoch": 2276} {"train_loss": -23.42901611328125, "global_step": 188974, "epoch": 2276} {"train_loss": -23.98295783996582, "global_step": 188975, "epoch": 2276} {"train_loss": -23.877941131591797, "global_step": 188976, "epoch": 2276} {"train_loss": -23.808748245239258, "global_step": 188977, "epoch": 2276} {"train_loss": -23.732797622680664, "global_step": 188978, "epoch": 2276} {"train_loss": -23.462905883789062, "global_step": 188979, "epoch": 2276} {"train_loss": -24.154138565063477, "global_step": 188980, "epoch": 2276} {"train_loss": -24.231252670288086, "global_step": 188981, "epoch": 2276} {"train_loss": -24.035999298095703, "global_step": 188982, "epoch": 2276} {"train_loss": -24.375423431396484, "global_step": 188983, "epoch": 2276} {"train_loss": -24.111722946166992, "global_step": 188984, "epoch": 2276} {"train_loss": -23.957712173461914, "global_step": 188985, "epoch": 2276} {"train_loss": -24.23042869567871, "global_step": 188986, "epoch": 2276} {"train_loss": -24.433507919311523, "global_step": 188987, "epoch": 2276} {"train_loss": -24.34823989868164, "global_step": 188988, "epoch": 2276} {"train_loss": -24.138425827026367, "global_step": 188989, "epoch": 2276} {"train_loss": -23.848899795348387, "global_step": 188990, "epoch": 2276, "val_loss": 6446207.5} {"train_loss": -23.946613311767578, "global_step": 188991, "epoch": 2277} {"train_loss": -23.395065307617188, "global_step": 188992, "epoch": 2277} {"train_loss": -23.315820693969727, "global_step": 188993, "epoch": 2277} {"train_loss": -23.62440299987793, "global_step": 188994, "epoch": 2277} {"train_loss": -23.94959831237793, "global_step": 188995, "epoch": 2277} {"train_loss": -24.1064453125, "global_step": 188996, "epoch": 2277} {"train_loss": -23.89812660217285, "global_step": 188997, "epoch": 2277} {"train_loss": -23.964385986328125, "global_step": 188998, "epoch": 2277} {"train_loss": -23.20917320251465, "global_step": 188999, "epoch": 2277} {"train_loss": -23.61612892150879, "global_step": 189000, "epoch": 2277} {"train_loss": -23.405561447143555, "global_step": 189001, "epoch": 2277} {"train_loss": -23.648603439331055, "global_step": 189002, "epoch": 2277} {"train_loss": -23.869815826416016, "global_step": 189003, "epoch": 2277} {"train_loss": -23.93865966796875, "global_step": 189004, "epoch": 2277} {"train_loss": -23.762605667114258, "global_step": 189005, "epoch": 2277} {"train_loss": -24.1247615814209, "global_step": 189006, "epoch": 2277} {"train_loss": -23.65667724609375, "global_step": 189007, "epoch": 2277} {"train_loss": -23.874807357788086, "global_step": 189008, "epoch": 2277} {"train_loss": -23.66007423400879, "global_step": 189009, "epoch": 2277} {"train_loss": -23.847211837768555, "global_step": 189010, "epoch": 2277} {"train_loss": -23.682022094726562, "global_step": 189011, "epoch": 2277} {"train_loss": -23.866683959960938, "global_step": 189012, "epoch": 2277} {"train_loss": -24.08586883544922, "global_step": 189013, "epoch": 2277} {"train_loss": -23.760223388671875, "global_step": 189014, "epoch": 2277} {"train_loss": -24.091930389404297, "global_step": 189015, "epoch": 2277} {"train_loss": -23.70368766784668, "global_step": 189016, "epoch": 2277} {"train_loss": -24.329132080078125, "global_step": 189017, "epoch": 2277} {"train_loss": -24.064090728759766, "global_step": 189018, "epoch": 2277} {"train_loss": -24.00556755065918, "global_step": 189019, "epoch": 2277} {"train_loss": -23.9891300201416, "global_step": 189020, "epoch": 2277} {"train_loss": -24.412778854370117, "global_step": 189021, "epoch": 2277} {"train_loss": -24.082050323486328, "global_step": 189022, "epoch": 2277} {"train_loss": -24.0698299407959, "global_step": 189023, "epoch": 2277} {"train_loss": -24.013263702392578, "global_step": 189024, "epoch": 2277} {"train_loss": -24.13447380065918, "global_step": 189025, "epoch": 2277} {"train_loss": -24.74676513671875, "global_step": 189026, "epoch": 2277} {"train_loss": -24.069616317749023, "global_step": 189027, "epoch": 2277} {"train_loss": -24.224872589111328, "global_step": 189028, "epoch": 2277} {"train_loss": -24.074462890625, "global_step": 189029, "epoch": 2277} {"train_loss": -24.168428421020508, "global_step": 189030, "epoch": 2277} {"train_loss": -24.377103805541992, "global_step": 189031, "epoch": 2277} {"train_loss": -24.2624568939209, "global_step": 189032, "epoch": 2277} {"train_loss": -24.025741577148438, "global_step": 189033, "epoch": 2277} {"train_loss": -24.239627838134766, "global_step": 189034, "epoch": 2277} {"train_loss": -23.873661041259766, "global_step": 189035, "epoch": 2277} {"train_loss": -24.21634864807129, "global_step": 189036, "epoch": 2277} {"train_loss": -24.985610961914062, "global_step": 189037, "epoch": 2277} {"train_loss": -24.133365631103516, "global_step": 189038, "epoch": 2277} {"train_loss": -24.36921501159668, "global_step": 189039, "epoch": 2277} {"train_loss": -24.014728546142578, "global_step": 189040, "epoch": 2277} {"train_loss": -23.854339599609375, "global_step": 189041, "epoch": 2277} {"train_loss": -23.83499526977539, "global_step": 189042, "epoch": 2277} {"train_loss": -24.17446517944336, "global_step": 189043, "epoch": 2277} {"train_loss": -24.31717300415039, "global_step": 189044, "epoch": 2277} {"train_loss": -24.164052963256836, "global_step": 189045, "epoch": 2277} {"train_loss": -24.167098999023438, "global_step": 189046, "epoch": 2277} {"train_loss": -23.595380783081055, "global_step": 189047, "epoch": 2277} {"train_loss": -24.235387802124023, "global_step": 189048, "epoch": 2277} {"train_loss": -24.496217727661133, "global_step": 189049, "epoch": 2277} {"train_loss": -24.7030029296875, "global_step": 189050, "epoch": 2277} {"train_loss": -23.94837760925293, "global_step": 189051, "epoch": 2277} {"train_loss": -24.344715118408203, "global_step": 189052, "epoch": 2277} {"train_loss": -24.350162506103516, "global_step": 189053, "epoch": 2277} {"train_loss": -23.97538185119629, "global_step": 189054, "epoch": 2277} {"train_loss": -23.710737228393555, "global_step": 189055, "epoch": 2277} {"train_loss": -24.013639450073242, "global_step": 189056, "epoch": 2277} {"train_loss": -23.652990341186523, "global_step": 189057, "epoch": 2277} {"train_loss": -23.59520149230957, "global_step": 189058, "epoch": 2277} {"train_loss": -23.215682983398438, "global_step": 189059, "epoch": 2277} {"train_loss": -23.61775016784668, "global_step": 189060, "epoch": 2277} {"train_loss": -24.096010208129883, "global_step": 189061, "epoch": 2277} {"train_loss": -23.850086212158203, "global_step": 189062, "epoch": 2277} {"train_loss": -23.965585708618164, "global_step": 189063, "epoch": 2277} {"train_loss": -23.820714950561523, "global_step": 189064, "epoch": 2277} {"train_loss": -24.129135131835938, "global_step": 189065, "epoch": 2277} {"train_loss": -23.997404098510742, "global_step": 189066, "epoch": 2277} {"train_loss": -24.400169372558594, "global_step": 189067, "epoch": 2277} {"train_loss": -24.247074127197266, "global_step": 189068, "epoch": 2277} {"train_loss": -24.057621002197266, "global_step": 189069, "epoch": 2277} {"train_loss": -24.47014045715332, "global_step": 189070, "epoch": 2277} {"train_loss": -24.279756546020508, "global_step": 189071, "epoch": 2277} {"train_loss": -24.129995346069336, "global_step": 189072, "epoch": 2277} {"train_loss": -24.00851810409362, "global_step": 189073, "epoch": 2277, "val_loss": 6516989.0} {"train_loss": -24.279590606689453, "global_step": 189074, "epoch": 2278} {"train_loss": -24.10086441040039, "global_step": 189075, "epoch": 2278} {"train_loss": -23.798784255981445, "global_step": 189076, "epoch": 2278} {"train_loss": -23.88131332397461, "global_step": 189077, "epoch": 2278} {"train_loss": -23.800504684448242, "global_step": 189078, "epoch": 2278} {"train_loss": -23.905975341796875, "global_step": 189079, "epoch": 2278} {"train_loss": -24.468069076538086, "global_step": 189080, "epoch": 2278} {"train_loss": -24.092336654663086, "global_step": 189081, "epoch": 2278} {"train_loss": -24.188411712646484, "global_step": 189082, "epoch": 2278} {"train_loss": -24.331375122070312, "global_step": 189083, "epoch": 2278} {"train_loss": -24.174617767333984, "global_step": 189084, "epoch": 2278} {"train_loss": -23.846715927124023, "global_step": 189085, "epoch": 2278} {"train_loss": -24.58818244934082, "global_step": 189086, "epoch": 2278} {"train_loss": -24.34493064880371, "global_step": 189087, "epoch": 2278} {"train_loss": -24.056325912475586, "global_step": 189088, "epoch": 2278} {"train_loss": -24.0555477142334, "global_step": 189089, "epoch": 2278} {"train_loss": -23.807132720947266, "global_step": 189090, "epoch": 2278} {"train_loss": -24.259803771972656, "global_step": 189091, "epoch": 2278} {"train_loss": -24.360349655151367, "global_step": 189092, "epoch": 2278} {"train_loss": -24.12771987915039, "global_step": 189093, "epoch": 2278} {"train_loss": -23.927412033081055, "global_step": 189094, "epoch": 2278} {"train_loss": -24.12990951538086, "global_step": 189095, "epoch": 2278} {"train_loss": -24.150068283081055, "global_step": 189096, "epoch": 2278} {"train_loss": -23.921628952026367, "global_step": 189097, "epoch": 2278} {"train_loss": -23.77326011657715, "global_step": 189098, "epoch": 2278} {"train_loss": -24.030942916870117, "global_step": 189099, "epoch": 2278} {"train_loss": -23.639577865600586, "global_step": 189100, "epoch": 2278} {"train_loss": -24.038915634155273, "global_step": 189101, "epoch": 2278} {"train_loss": -24.171281814575195, "global_step": 189102, "epoch": 2278} {"train_loss": -24.085235595703125, "global_step": 189103, "epoch": 2278} {"train_loss": -24.059919357299805, "global_step": 189104, "epoch": 2278} {"train_loss": -23.832679748535156, "global_step": 189105, "epoch": 2278} {"train_loss": -23.936857223510742, "global_step": 189106, "epoch": 2278} {"train_loss": -24.100622177124023, "global_step": 189107, "epoch": 2278} {"train_loss": -24.111148834228516, "global_step": 189108, "epoch": 2278} {"train_loss": -24.05837059020996, "global_step": 189109, "epoch": 2278} {"train_loss": -24.458505630493164, "global_step": 189110, "epoch": 2278} {"train_loss": -24.230375289916992, "global_step": 189111, "epoch": 2278} {"train_loss": -24.067005157470703, "global_step": 189112, "epoch": 2278} {"train_loss": -23.71170997619629, "global_step": 189113, "epoch": 2278} {"train_loss": -24.343036651611328, "global_step": 189114, "epoch": 2278} {"train_loss": -24.021284103393555, "global_step": 189115, "epoch": 2278} {"train_loss": -23.482303619384766, "global_step": 189116, "epoch": 2278} {"train_loss": -24.280248641967773, "global_step": 189117, "epoch": 2278} {"train_loss": -24.080068588256836, "global_step": 189118, "epoch": 2278} {"train_loss": -23.933500289916992, "global_step": 189119, "epoch": 2278} {"train_loss": -24.260292053222656, "global_step": 189120, "epoch": 2278} {"train_loss": -23.770383834838867, "global_step": 189121, "epoch": 2278} {"train_loss": -23.86450958251953, "global_step": 189122, "epoch": 2278} {"train_loss": -24.00575065612793, "global_step": 189123, "epoch": 2278} {"train_loss": -24.061527252197266, "global_step": 189124, "epoch": 2278} {"train_loss": -23.87398338317871, "global_step": 189125, "epoch": 2278} {"train_loss": -23.87031364440918, "global_step": 189126, "epoch": 2278} {"train_loss": -23.846792221069336, "global_step": 189127, "epoch": 2278} {"train_loss": -24.205780029296875, "global_step": 189128, "epoch": 2278} {"train_loss": -24.080839157104492, "global_step": 189129, "epoch": 2278} {"train_loss": -24.254093170166016, "global_step": 189130, "epoch": 2278} {"train_loss": -23.935400009155273, "global_step": 189131, "epoch": 2278} {"train_loss": -23.94056510925293, "global_step": 189132, "epoch": 2278} {"train_loss": -24.029172897338867, "global_step": 189133, "epoch": 2278} {"train_loss": -24.163923263549805, "global_step": 189134, "epoch": 2278} {"train_loss": -23.805959701538086, "global_step": 189135, "epoch": 2278} {"train_loss": -23.698837280273438, "global_step": 189136, "epoch": 2278} {"train_loss": -23.220731735229492, "global_step": 189137, "epoch": 2278} {"train_loss": -22.95589256286621, "global_step": 189138, "epoch": 2278} {"train_loss": -23.048542022705078, "global_step": 189139, "epoch": 2278} {"train_loss": -24.045705795288086, "global_step": 189140, "epoch": 2278} {"train_loss": -23.822452545166016, "global_step": 189141, "epoch": 2278} {"train_loss": -24.05139923095703, "global_step": 189142, "epoch": 2278} {"train_loss": -23.978464126586914, "global_step": 189143, "epoch": 2278} {"train_loss": -23.95093536376953, "global_step": 189144, "epoch": 2278} {"train_loss": -23.72890281677246, "global_step": 189145, "epoch": 2278} {"train_loss": -23.61201286315918, "global_step": 189146, "epoch": 2278} {"train_loss": -24.002490997314453, "global_step": 189147, "epoch": 2278} {"train_loss": -23.950780868530273, "global_step": 189148, "epoch": 2278} {"train_loss": -23.70253562927246, "global_step": 189149, "epoch": 2278} {"train_loss": -23.954893112182617, "global_step": 189150, "epoch": 2278} {"train_loss": -23.786487579345703, "global_step": 189151, "epoch": 2278} {"train_loss": -24.215662002563477, "global_step": 189152, "epoch": 2278} {"train_loss": -23.980905532836914, "global_step": 189153, "epoch": 2278} {"train_loss": -23.93526268005371, "global_step": 189154, "epoch": 2278} {"train_loss": -24.22308921813965, "global_step": 189155, "epoch": 2278} {"train_loss": -24.003533076090985, "global_step": 189156, "epoch": 2278, "val_loss": 6371583.0} {"train_loss": -23.24954605102539, "global_step": 189157, "epoch": 2279} {"train_loss": -23.306238174438477, "global_step": 189158, "epoch": 2279} {"train_loss": -23.52286720275879, "global_step": 189159, "epoch": 2279} {"train_loss": -23.68055534362793, "global_step": 189160, "epoch": 2279} {"train_loss": -23.0260066986084, "global_step": 189161, "epoch": 2279} {"train_loss": -23.52778434753418, "global_step": 189162, "epoch": 2279} {"train_loss": -23.19354248046875, "global_step": 189163, "epoch": 2279} {"train_loss": -23.674739837646484, "global_step": 189164, "epoch": 2279} {"train_loss": -23.81793212890625, "global_step": 189165, "epoch": 2279} {"train_loss": -23.267683029174805, "global_step": 189166, "epoch": 2279} {"train_loss": -23.71538734436035, "global_step": 189167, "epoch": 2279} {"train_loss": -23.96661949157715, "global_step": 189168, "epoch": 2279} {"train_loss": -23.54994010925293, "global_step": 189169, "epoch": 2279} {"train_loss": -23.987773895263672, "global_step": 189170, "epoch": 2279} {"train_loss": -23.675140380859375, "global_step": 189171, "epoch": 2279} {"train_loss": -23.448974609375, "global_step": 189172, "epoch": 2279} {"train_loss": -23.511417388916016, "global_step": 189173, "epoch": 2279} {"train_loss": -23.681119918823242, "global_step": 189174, "epoch": 2279} {"train_loss": -23.686254501342773, "global_step": 189175, "epoch": 2279} {"train_loss": -24.158292770385742, "global_step": 189176, "epoch": 2279} {"train_loss": -23.9473819732666, "global_step": 189177, "epoch": 2279} {"train_loss": -24.18897819519043, "global_step": 189178, "epoch": 2279} {"train_loss": -24.113866806030273, "global_step": 189179, "epoch": 2279} {"train_loss": -24.1408748626709, "global_step": 189180, "epoch": 2279} {"train_loss": -23.886005401611328, "global_step": 189181, "epoch": 2279} {"train_loss": -24.092565536499023, "global_step": 189182, "epoch": 2279} {"train_loss": -24.14328384399414, "global_step": 189183, "epoch": 2279} {"train_loss": -24.17103385925293, "global_step": 189184, "epoch": 2279} {"train_loss": -24.118749618530273, "global_step": 189185, "epoch": 2279} {"train_loss": -23.752384185791016, "global_step": 189186, "epoch": 2279} {"train_loss": -24.340452194213867, "global_step": 189187, "epoch": 2279} {"train_loss": -24.0690860748291, "global_step": 189188, "epoch": 2279} {"train_loss": -23.84763526916504, "global_step": 189189, "epoch": 2279} {"train_loss": -24.028804779052734, "global_step": 189190, "epoch": 2279} {"train_loss": -24.007871627807617, "global_step": 189191, "epoch": 2279} {"train_loss": -24.23236656188965, "global_step": 189192, "epoch": 2279} {"train_loss": -23.793630599975586, "global_step": 189193, "epoch": 2279} {"train_loss": -24.197040557861328, "global_step": 189194, "epoch": 2279} {"train_loss": -24.539871215820312, "global_step": 189195, "epoch": 2279} {"train_loss": -23.931352615356445, "global_step": 189196, "epoch": 2279} {"train_loss": -24.348852157592773, "global_step": 189197, "epoch": 2279} {"train_loss": -23.95160675048828, "global_step": 189198, "epoch": 2279} {"train_loss": -24.165693283081055, "global_step": 189199, "epoch": 2279} {"train_loss": -24.420398712158203, "global_step": 189200, "epoch": 2279} {"train_loss": -24.19846534729004, "global_step": 189201, "epoch": 2279} {"train_loss": -24.084064483642578, "global_step": 189202, "epoch": 2279} {"train_loss": -24.273040771484375, "global_step": 189203, "epoch": 2279} {"train_loss": -24.43171501159668, "global_step": 189204, "epoch": 2279} {"train_loss": -24.05093765258789, "global_step": 189205, "epoch": 2279} {"train_loss": -24.093870162963867, "global_step": 189206, "epoch": 2279} {"train_loss": -24.167078018188477, "global_step": 189207, "epoch": 2279} {"train_loss": -24.030759811401367, "global_step": 189208, "epoch": 2279} {"train_loss": -24.00144386291504, "global_step": 189209, "epoch": 2279} {"train_loss": -24.26620101928711, "global_step": 189210, "epoch": 2279} {"train_loss": -24.326955795288086, "global_step": 189211, "epoch": 2279} {"train_loss": -24.167770385742188, "global_step": 189212, "epoch": 2279} {"train_loss": -23.718013763427734, "global_step": 189213, "epoch": 2279} {"train_loss": -24.091384887695312, "global_step": 189214, "epoch": 2279} {"train_loss": -24.03700828552246, "global_step": 189215, "epoch": 2279} {"train_loss": -24.027700424194336, "global_step": 189216, "epoch": 2279} {"train_loss": -23.924123764038086, "global_step": 189217, "epoch": 2279} {"train_loss": -24.303430557250977, "global_step": 189218, "epoch": 2279} {"train_loss": -24.262683868408203, "global_step": 189219, "epoch": 2279} {"train_loss": -23.95478630065918, "global_step": 189220, "epoch": 2279} {"train_loss": -24.25916862487793, "global_step": 189221, "epoch": 2279} {"train_loss": -24.22906494140625, "global_step": 189222, "epoch": 2279} {"train_loss": -24.080137252807617, "global_step": 189223, "epoch": 2279} {"train_loss": -23.744192123413086, "global_step": 189224, "epoch": 2279} {"train_loss": -24.085912704467773, "global_step": 189225, "epoch": 2279} {"train_loss": -24.25678825378418, "global_step": 189226, "epoch": 2279} {"train_loss": -24.20912742614746, "global_step": 189227, "epoch": 2279} {"train_loss": -23.762685775756836, "global_step": 189228, "epoch": 2279} {"train_loss": -23.897708892822266, "global_step": 189229, "epoch": 2279} {"train_loss": -23.93907928466797, "global_step": 189230, "epoch": 2279} {"train_loss": -23.70524024963379, "global_step": 189231, "epoch": 2279} {"train_loss": -23.966552734375, "global_step": 189232, "epoch": 2279} {"train_loss": -24.420894622802734, "global_step": 189233, "epoch": 2279} {"train_loss": -24.06721305847168, "global_step": 189234, "epoch": 2279} {"train_loss": -24.373489379882812, "global_step": 189235, "epoch": 2279} {"train_loss": -23.864547729492188, "global_step": 189236, "epoch": 2279} {"train_loss": -23.950153350830078, "global_step": 189237, "epoch": 2279} {"train_loss": -24.148513793945312, "global_step": 189238, "epoch": 2279} {"train_loss": -23.968242966985127, "global_step": 189239, "epoch": 2279, "val_loss": 6503425.5} {"train_loss": -23.413063049316406, "global_step": 189240, "epoch": 2280} {"train_loss": -23.67159080505371, "global_step": 189241, "epoch": 2280} {"train_loss": -23.391149520874023, "global_step": 189242, "epoch": 2280} {"train_loss": -23.406614303588867, "global_step": 189243, "epoch": 2280} {"train_loss": -23.469511032104492, "global_step": 189244, "epoch": 2280} {"train_loss": -23.8891544342041, "global_step": 189245, "epoch": 2280} {"train_loss": -23.90210723876953, "global_step": 189246, "epoch": 2280} {"train_loss": -23.596227645874023, "global_step": 189247, "epoch": 2280} {"train_loss": -23.422155380249023, "global_step": 189248, "epoch": 2280} {"train_loss": -23.529102325439453, "global_step": 189249, "epoch": 2280} {"train_loss": -23.67157554626465, "global_step": 189250, "epoch": 2280} {"train_loss": -23.965566635131836, "global_step": 189251, "epoch": 2280} {"train_loss": -23.62692642211914, "global_step": 189252, "epoch": 2280} {"train_loss": -23.72051429748535, "global_step": 189253, "epoch": 2280} {"train_loss": -23.751556396484375, "global_step": 189254, "epoch": 2280} {"train_loss": -24.113561630249023, "global_step": 189255, "epoch": 2280} {"train_loss": -24.482465744018555, "global_step": 189256, "epoch": 2280} {"train_loss": -23.997379302978516, "global_step": 189257, "epoch": 2280} {"train_loss": -23.926023483276367, "global_step": 189258, "epoch": 2280} {"train_loss": -23.99199867248535, "global_step": 189259, "epoch": 2280} {"train_loss": -23.85157585144043, "global_step": 189260, "epoch": 2280} {"train_loss": -24.000198364257812, "global_step": 189261, "epoch": 2280} {"train_loss": -24.154970169067383, "global_step": 189262, "epoch": 2280} {"train_loss": -24.182537078857422, "global_step": 189263, "epoch": 2280} {"train_loss": -24.11528968811035, "global_step": 189264, "epoch": 2280} {"train_loss": -23.65462303161621, "global_step": 189265, "epoch": 2280} {"train_loss": -23.94547462463379, "global_step": 189266, "epoch": 2280} {"train_loss": -23.786121368408203, "global_step": 189267, "epoch": 2280} {"train_loss": -24.112497329711914, "global_step": 189268, "epoch": 2280} {"train_loss": -24.346439361572266, "global_step": 189269, "epoch": 2280} {"train_loss": -24.251869201660156, "global_step": 189270, "epoch": 2280} {"train_loss": -24.14603614807129, "global_step": 189271, "epoch": 2280} {"train_loss": -24.21291160583496, "global_step": 189272, "epoch": 2280} {"train_loss": -24.090320587158203, "global_step": 189273, "epoch": 2280} {"train_loss": -24.20352554321289, "global_step": 189274, "epoch": 2280} {"train_loss": -24.25477409362793, "global_step": 189275, "epoch": 2280} {"train_loss": -24.441572189331055, "global_step": 189276, "epoch": 2280} {"train_loss": -24.194860458374023, "global_step": 189277, "epoch": 2280} {"train_loss": -24.297260284423828, "global_step": 189278, "epoch": 2280} {"train_loss": -24.20484733581543, "global_step": 189279, "epoch": 2280} {"train_loss": -24.175342559814453, "global_step": 189280, "epoch": 2280} {"train_loss": -24.25355339050293, "global_step": 189281, "epoch": 2280} {"train_loss": -23.943973541259766, "global_step": 189282, "epoch": 2280} {"train_loss": -23.85515022277832, "global_step": 189283, "epoch": 2280} {"train_loss": -23.931400299072266, "global_step": 189284, "epoch": 2280} {"train_loss": -24.288782119750977, "global_step": 189285, "epoch": 2280} {"train_loss": -24.381956100463867, "global_step": 189286, "epoch": 2280} {"train_loss": -24.131479263305664, "global_step": 189287, "epoch": 2280} {"train_loss": -24.066293716430664, "global_step": 189288, "epoch": 2280} {"train_loss": -23.974903106689453, "global_step": 189289, "epoch": 2280} {"train_loss": -24.278554916381836, "global_step": 189290, "epoch": 2280} {"train_loss": -24.147920608520508, "global_step": 189291, "epoch": 2280} {"train_loss": -23.86098289489746, "global_step": 189292, "epoch": 2280} {"train_loss": -23.852947235107422, "global_step": 189293, "epoch": 2280} {"train_loss": -24.02686882019043, "global_step": 189294, "epoch": 2280} {"train_loss": -23.673681259155273, "global_step": 189295, "epoch": 2280} {"train_loss": -23.947845458984375, "global_step": 189296, "epoch": 2280} {"train_loss": -24.251033782958984, "global_step": 189297, "epoch": 2280} {"train_loss": -24.053030014038086, "global_step": 189298, "epoch": 2280} {"train_loss": -24.170175552368164, "global_step": 189299, "epoch": 2280} {"train_loss": -23.684978485107422, "global_step": 189300, "epoch": 2280} {"train_loss": -24.02779197692871, "global_step": 189301, "epoch": 2280} {"train_loss": -24.05256462097168, "global_step": 189302, "epoch": 2280} {"train_loss": -24.168075561523438, "global_step": 189303, "epoch": 2280} {"train_loss": -24.478845596313477, "global_step": 189304, "epoch": 2280} {"train_loss": -23.83131217956543, "global_step": 189305, "epoch": 2280} {"train_loss": -24.229358673095703, "global_step": 189306, "epoch": 2280} {"train_loss": -24.245988845825195, "global_step": 189307, "epoch": 2280} {"train_loss": -24.087934494018555, "global_step": 189308, "epoch": 2280} {"train_loss": -24.18594741821289, "global_step": 189309, "epoch": 2280} {"train_loss": -23.898967742919922, "global_step": 189310, "epoch": 2280} {"train_loss": -24.021961212158203, "global_step": 189311, "epoch": 2280} {"train_loss": -24.049375534057617, "global_step": 189312, "epoch": 2280} {"train_loss": -23.71076202392578, "global_step": 189313, "epoch": 2280} {"train_loss": -23.76354217529297, "global_step": 189314, "epoch": 2280} {"train_loss": -24.109844207763672, "global_step": 189315, "epoch": 2280} {"train_loss": -24.228666305541992, "global_step": 189316, "epoch": 2280} {"train_loss": -24.200912475585938, "global_step": 189317, "epoch": 2280} {"train_loss": -23.993993759155273, "global_step": 189318, "epoch": 2280} {"train_loss": -23.7301025390625, "global_step": 189319, "epoch": 2280} {"train_loss": -24.274005889892578, "global_step": 189320, "epoch": 2280} {"train_loss": -24.402002334594727, "global_step": 189321, "epoch": 2280} {"train_loss": -24.015142233974963, "global_step": 189322, "epoch": 2280, "val_loss": 6669658.0} {"train_loss": -22.93416404724121, "global_step": 189323, "epoch": 2281} {"train_loss": -22.501888275146484, "global_step": 189324, "epoch": 2281} {"train_loss": -22.954191207885742, "global_step": 189325, "epoch": 2281} {"train_loss": -23.44095802307129, "global_step": 189326, "epoch": 2281} {"train_loss": -23.161319732666016, "global_step": 189327, "epoch": 2281} {"train_loss": -23.69794273376465, "global_step": 189328, "epoch": 2281} {"train_loss": -23.43645668029785, "global_step": 189329, "epoch": 2281} {"train_loss": -23.422956466674805, "global_step": 189330, "epoch": 2281} {"train_loss": -22.66971778869629, "global_step": 189331, "epoch": 2281} {"train_loss": -23.745223999023438, "global_step": 189332, "epoch": 2281} {"train_loss": -23.49323272705078, "global_step": 189333, "epoch": 2281} {"train_loss": -23.518890380859375, "global_step": 189334, "epoch": 2281} {"train_loss": -23.621225357055664, "global_step": 189335, "epoch": 2281} {"train_loss": -23.774072647094727, "global_step": 189336, "epoch": 2281} {"train_loss": -23.6951847076416, "global_step": 189337, "epoch": 2281} {"train_loss": -23.410247802734375, "global_step": 189338, "epoch": 2281} {"train_loss": -23.730649948120117, "global_step": 189339, "epoch": 2281} {"train_loss": -23.829145431518555, "global_step": 189340, "epoch": 2281} {"train_loss": -23.742246627807617, "global_step": 189341, "epoch": 2281} {"train_loss": -23.786766052246094, "global_step": 189342, "epoch": 2281} {"train_loss": -23.5593318939209, "global_step": 189343, "epoch": 2281} {"train_loss": -23.762052536010742, "global_step": 189344, "epoch": 2281} {"train_loss": -23.65191078186035, "global_step": 189345, "epoch": 2281} {"train_loss": -24.024723052978516, "global_step": 189346, "epoch": 2281} {"train_loss": -23.945667266845703, "global_step": 189347, "epoch": 2281} {"train_loss": -24.22636604309082, "global_step": 189348, "epoch": 2281} {"train_loss": -24.01825523376465, "global_step": 189349, "epoch": 2281} {"train_loss": -23.66907501220703, "global_step": 189350, "epoch": 2281} {"train_loss": -23.785289764404297, "global_step": 189351, "epoch": 2281} {"train_loss": -23.924453735351562, "global_step": 189352, "epoch": 2281} {"train_loss": -24.142065048217773, "global_step": 189353, "epoch": 2281} {"train_loss": -23.830429077148438, "global_step": 189354, "epoch": 2281} {"train_loss": -23.84844398498535, "global_step": 189355, "epoch": 2281} {"train_loss": -24.254379272460938, "global_step": 189356, "epoch": 2281} {"train_loss": -24.302785873413086, "global_step": 189357, "epoch": 2281} {"train_loss": -24.049123764038086, "global_step": 189358, "epoch": 2281} {"train_loss": -24.121543884277344, "global_step": 189359, "epoch": 2281} {"train_loss": -24.171768188476562, "global_step": 189360, "epoch": 2281} {"train_loss": -24.419513702392578, "global_step": 189361, "epoch": 2281} {"train_loss": -23.757343292236328, "global_step": 189362, "epoch": 2281} {"train_loss": -24.077152252197266, "global_step": 189363, "epoch": 2281} {"train_loss": -24.139095306396484, "global_step": 189364, "epoch": 2281} {"train_loss": -24.380512237548828, "global_step": 189365, "epoch": 2281} {"train_loss": -23.953784942626953, "global_step": 189366, "epoch": 2281} {"train_loss": -24.522127151489258, "global_step": 189367, "epoch": 2281} {"train_loss": -24.316593170166016, "global_step": 189368, "epoch": 2281} {"train_loss": -24.044723510742188, "global_step": 189369, "epoch": 2281} {"train_loss": -23.9678897857666, "global_step": 189370, "epoch": 2281} {"train_loss": -24.501720428466797, "global_step": 189371, "epoch": 2281} {"train_loss": -24.38172721862793, "global_step": 189372, "epoch": 2281} {"train_loss": -24.477495193481445, "global_step": 189373, "epoch": 2281} {"train_loss": -24.326194763183594, "global_step": 189374, "epoch": 2281} {"train_loss": -24.05976676940918, "global_step": 189375, "epoch": 2281} {"train_loss": -24.0250301361084, "global_step": 189376, "epoch": 2281} {"train_loss": -24.11529541015625, "global_step": 189377, "epoch": 2281} {"train_loss": -23.633520126342773, "global_step": 189378, "epoch": 2281} {"train_loss": -24.251373291015625, "global_step": 189379, "epoch": 2281} {"train_loss": -23.873098373413086, "global_step": 189380, "epoch": 2281} {"train_loss": -23.937026977539062, "global_step": 189381, "epoch": 2281} {"train_loss": -24.186599731445312, "global_step": 189382, "epoch": 2281} {"train_loss": -24.088830947875977, "global_step": 189383, "epoch": 2281} {"train_loss": -24.08057975769043, "global_step": 189384, "epoch": 2281} {"train_loss": -24.009489059448242, "global_step": 189385, "epoch": 2281} {"train_loss": -23.432029724121094, "global_step": 189386, "epoch": 2281} {"train_loss": -23.938417434692383, "global_step": 189387, "epoch": 2281} {"train_loss": -24.425254821777344, "global_step": 189388, "epoch": 2281} {"train_loss": -23.892927169799805, "global_step": 189389, "epoch": 2281} {"train_loss": -23.99933433532715, "global_step": 189390, "epoch": 2281} {"train_loss": -24.000835418701172, "global_step": 189391, "epoch": 2281} {"train_loss": -23.69182777404785, "global_step": 189392, "epoch": 2281} {"train_loss": -24.029672622680664, "global_step": 189393, "epoch": 2281} {"train_loss": -24.022396087646484, "global_step": 189394, "epoch": 2281} {"train_loss": -24.020315170288086, "global_step": 189395, "epoch": 2281} {"train_loss": -24.168188095092773, "global_step": 189396, "epoch": 2281} {"train_loss": -24.009746551513672, "global_step": 189397, "epoch": 2281} {"train_loss": -23.75553321838379, "global_step": 189398, "epoch": 2281} {"train_loss": -23.975955963134766, "global_step": 189399, "epoch": 2281} {"train_loss": -23.880329132080078, "global_step": 189400, "epoch": 2281} {"train_loss": -24.22768211364746, "global_step": 189401, "epoch": 2281} {"train_loss": -23.9959659576416, "global_step": 189402, "epoch": 2281} {"train_loss": -24.307321548461914, "global_step": 189403, "epoch": 2281} {"train_loss": -24.405282974243164, "global_step": 189404, "epoch": 2281} {"train_loss": -23.89783946577325, "global_step": 189405, "epoch": 2281, "val_loss": 6433073.0} {"train_loss": -23.905546188354492, "global_step": 189406, "epoch": 2282} {"train_loss": -23.83682632446289, "global_step": 189407, "epoch": 2282} {"train_loss": -23.534727096557617, "global_step": 189408, "epoch": 2282} {"train_loss": -23.76650619506836, "global_step": 189409, "epoch": 2282} {"train_loss": -23.62189292907715, "global_step": 189410, "epoch": 2282} {"train_loss": -23.934614181518555, "global_step": 189411, "epoch": 2282} {"train_loss": -23.887680053710938, "global_step": 189412, "epoch": 2282} {"train_loss": -23.558626174926758, "global_step": 189413, "epoch": 2282} {"train_loss": -24.136093139648438, "global_step": 189414, "epoch": 2282} {"train_loss": -23.828256607055664, "global_step": 189415, "epoch": 2282} {"train_loss": -23.831594467163086, "global_step": 189416, "epoch": 2282} {"train_loss": -23.561038970947266, "global_step": 189417, "epoch": 2282} {"train_loss": -23.50642967224121, "global_step": 189418, "epoch": 2282} {"train_loss": -23.803028106689453, "global_step": 189419, "epoch": 2282} {"train_loss": -23.89167594909668, "global_step": 189420, "epoch": 2282} {"train_loss": -23.691524505615234, "global_step": 189421, "epoch": 2282} {"train_loss": -24.03099822998047, "global_step": 189422, "epoch": 2282} {"train_loss": -24.229036331176758, "global_step": 189423, "epoch": 2282} {"train_loss": -23.91356086730957, "global_step": 189424, "epoch": 2282} {"train_loss": -23.54721450805664, "global_step": 189425, "epoch": 2282} {"train_loss": -24.19123649597168, "global_step": 189426, "epoch": 2282} {"train_loss": -23.570959091186523, "global_step": 189427, "epoch": 2282} {"train_loss": -23.797250747680664, "global_step": 189428, "epoch": 2282} {"train_loss": -23.65440559387207, "global_step": 189429, "epoch": 2282} {"train_loss": -24.24595832824707, "global_step": 189430, "epoch": 2282} {"train_loss": -23.804092407226562, "global_step": 189431, "epoch": 2282} {"train_loss": -23.96146011352539, "global_step": 189432, "epoch": 2282} {"train_loss": -23.779277801513672, "global_step": 189433, "epoch": 2282} {"train_loss": -24.1225643157959, "global_step": 189434, "epoch": 2282} {"train_loss": -24.082181930541992, "global_step": 189435, "epoch": 2282} {"train_loss": -24.023784637451172, "global_step": 189436, "epoch": 2282} {"train_loss": -24.02157974243164, "global_step": 189437, "epoch": 2282} {"train_loss": -24.095264434814453, "global_step": 189438, "epoch": 2282} {"train_loss": -24.1853084564209, "global_step": 189439, "epoch": 2282} {"train_loss": -24.256027221679688, "global_step": 189440, "epoch": 2282} {"train_loss": -24.166799545288086, "global_step": 189441, "epoch": 2282} {"train_loss": -24.178503036499023, "global_step": 189442, "epoch": 2282} {"train_loss": -23.841049194335938, "global_step": 189443, "epoch": 2282} {"train_loss": -24.30543327331543, "global_step": 189444, "epoch": 2282} {"train_loss": -24.17191505432129, "global_step": 189445, "epoch": 2282} {"train_loss": -24.30643653869629, "global_step": 189446, "epoch": 2282} {"train_loss": -24.0576171875, "global_step": 189447, "epoch": 2282} {"train_loss": -24.057140350341797, "global_step": 189448, "epoch": 2282} {"train_loss": -24.010700225830078, "global_step": 189449, "epoch": 2282} {"train_loss": -24.085439682006836, "global_step": 189450, "epoch": 2282} {"train_loss": -24.093496322631836, "global_step": 189451, "epoch": 2282} {"train_loss": -23.997163772583008, "global_step": 189452, "epoch": 2282} {"train_loss": -24.004037857055664, "global_step": 189453, "epoch": 2282} {"train_loss": -24.098127365112305, "global_step": 189454, "epoch": 2282} {"train_loss": -23.896230697631836, "global_step": 189455, "epoch": 2282} {"train_loss": -24.091154098510742, "global_step": 189456, "epoch": 2282} {"train_loss": -24.090429306030273, "global_step": 189457, "epoch": 2282} {"train_loss": -23.927072525024414, "global_step": 189458, "epoch": 2282} {"train_loss": -24.350914001464844, "global_step": 189459, "epoch": 2282} {"train_loss": -23.92972183227539, "global_step": 189460, "epoch": 2282} {"train_loss": -24.010583877563477, "global_step": 189461, "epoch": 2282} {"train_loss": -24.018510818481445, "global_step": 189462, "epoch": 2282} {"train_loss": -24.05832290649414, "global_step": 189463, "epoch": 2282} {"train_loss": -24.026643753051758, "global_step": 189464, "epoch": 2282} {"train_loss": -24.369749069213867, "global_step": 189465, "epoch": 2282} {"train_loss": -23.72846794128418, "global_step": 189466, "epoch": 2282} {"train_loss": -24.054471969604492, "global_step": 189467, "epoch": 2282} {"train_loss": -23.898256301879883, "global_step": 189468, "epoch": 2282} {"train_loss": -24.107282638549805, "global_step": 189469, "epoch": 2282} {"train_loss": -24.148208618164062, "global_step": 189470, "epoch": 2282} {"train_loss": -24.033212661743164, "global_step": 189471, "epoch": 2282} {"train_loss": -24.278745651245117, "global_step": 189472, "epoch": 2282} {"train_loss": -24.416738510131836, "global_step": 189473, "epoch": 2282} {"train_loss": -24.339359283447266, "global_step": 189474, "epoch": 2282} {"train_loss": -23.99176025390625, "global_step": 189475, "epoch": 2282} {"train_loss": -23.988056182861328, "global_step": 189476, "epoch": 2282} {"train_loss": -23.748258590698242, "global_step": 189477, "epoch": 2282} {"train_loss": -24.212682723999023, "global_step": 189478, "epoch": 2282} {"train_loss": -24.07602310180664, "global_step": 189479, "epoch": 2282} {"train_loss": -24.057600021362305, "global_step": 189480, "epoch": 2282} {"train_loss": -24.108972549438477, "global_step": 189481, "epoch": 2282} {"train_loss": -23.77796745300293, "global_step": 189482, "epoch": 2282} {"train_loss": -23.907577514648438, "global_step": 189483, "epoch": 2282} {"train_loss": -24.254493713378906, "global_step": 189484, "epoch": 2282} {"train_loss": -24.122854232788086, "global_step": 189485, "epoch": 2282} {"train_loss": -24.131868362426758, "global_step": 189486, "epoch": 2282} {"train_loss": -24.235361099243164, "global_step": 189487, "epoch": 2282} {"train_loss": -23.992066073130413, "global_step": 189488, "epoch": 2282, "val_loss": 6466553.0} {"train_loss": -22.810726165771484, "global_step": 189489, "epoch": 2283} {"train_loss": -22.031604766845703, "global_step": 189490, "epoch": 2283} {"train_loss": -22.793241500854492, "global_step": 189491, "epoch": 2283} {"train_loss": -23.003421783447266, "global_step": 189492, "epoch": 2283} {"train_loss": -23.37483024597168, "global_step": 189493, "epoch": 2283} {"train_loss": -23.41155433654785, "global_step": 189494, "epoch": 2283} {"train_loss": -23.203718185424805, "global_step": 189495, "epoch": 2283} {"train_loss": -23.03920555114746, "global_step": 189496, "epoch": 2283} {"train_loss": -23.3638973236084, "global_step": 189497, "epoch": 2283} {"train_loss": -23.30354881286621, "global_step": 189498, "epoch": 2283} {"train_loss": -23.6785831451416, "global_step": 189499, "epoch": 2283} {"train_loss": -23.489622116088867, "global_step": 189500, "epoch": 2283} {"train_loss": -23.395483016967773, "global_step": 189501, "epoch": 2283} {"train_loss": -23.626699447631836, "global_step": 189502, "epoch": 2283} {"train_loss": -23.458301544189453, "global_step": 189503, "epoch": 2283} {"train_loss": -23.568994522094727, "global_step": 189504, "epoch": 2283} {"train_loss": -23.61396598815918, "global_step": 189505, "epoch": 2283} {"train_loss": -23.510419845581055, "global_step": 189506, "epoch": 2283} {"train_loss": -23.676898956298828, "global_step": 189507, "epoch": 2283} {"train_loss": -23.883359909057617, "global_step": 189508, "epoch": 2283} {"train_loss": -23.869653701782227, "global_step": 189509, "epoch": 2283} {"train_loss": -23.928831100463867, "global_step": 189510, "epoch": 2283} {"train_loss": -23.87162208557129, "global_step": 189511, "epoch": 2283} {"train_loss": -23.953081130981445, "global_step": 189512, "epoch": 2283} {"train_loss": -23.672086715698242, "global_step": 189513, "epoch": 2283} {"train_loss": -24.204181671142578, "global_step": 189514, "epoch": 2283} {"train_loss": -23.78360939025879, "global_step": 189515, "epoch": 2283} {"train_loss": -23.740507125854492, "global_step": 189516, "epoch": 2283} {"train_loss": -24.02822494506836, "global_step": 189517, "epoch": 2283} {"train_loss": -23.871870040893555, "global_step": 189518, "epoch": 2283} {"train_loss": -23.98151397705078, "global_step": 189519, "epoch": 2283} {"train_loss": -23.828155517578125, "global_step": 189520, "epoch": 2283} {"train_loss": -24.164777755737305, "global_step": 189521, "epoch": 2283} {"train_loss": -23.761308670043945, "global_step": 189522, "epoch": 2283} {"train_loss": -23.853452682495117, "global_step": 189523, "epoch": 2283} {"train_loss": -23.903188705444336, "global_step": 189524, "epoch": 2283} {"train_loss": -23.758859634399414, "global_step": 189525, "epoch": 2283} {"train_loss": -23.864938735961914, "global_step": 189526, "epoch": 2283} {"train_loss": -24.418405532836914, "global_step": 189527, "epoch": 2283} {"train_loss": -24.0882568359375, "global_step": 189528, "epoch": 2283} {"train_loss": -24.296186447143555, "global_step": 189529, "epoch": 2283} {"train_loss": -24.04465103149414, "global_step": 189530, "epoch": 2283} {"train_loss": -24.041851043701172, "global_step": 189531, "epoch": 2283} {"train_loss": -23.90240478515625, "global_step": 189532, "epoch": 2283} {"train_loss": -24.09415054321289, "global_step": 189533, "epoch": 2283} {"train_loss": -24.292835235595703, "global_step": 189534, "epoch": 2283} {"train_loss": -23.928424835205078, "global_step": 189535, "epoch": 2283} {"train_loss": -24.204145431518555, "global_step": 189536, "epoch": 2283} {"train_loss": -24.148771286010742, "global_step": 189537, "epoch": 2283} {"train_loss": -24.295440673828125, "global_step": 189538, "epoch": 2283} {"train_loss": -24.342130661010742, "global_step": 189539, "epoch": 2283} {"train_loss": -24.295522689819336, "global_step": 189540, "epoch": 2283} {"train_loss": -24.19285011291504, "global_step": 189541, "epoch": 2283} {"train_loss": -24.31244468688965, "global_step": 189542, "epoch": 2283} {"train_loss": -24.72358512878418, "global_step": 189543, "epoch": 2283} {"train_loss": -23.953332901000977, "global_step": 189544, "epoch": 2283} {"train_loss": -24.46240234375, "global_step": 189545, "epoch": 2283} {"train_loss": -24.282278060913086, "global_step": 189546, "epoch": 2283} {"train_loss": -24.05826759338379, "global_step": 189547, "epoch": 2283} {"train_loss": -23.58249282836914, "global_step": 189548, "epoch": 2283} {"train_loss": -24.389469146728516, "global_step": 189549, "epoch": 2283} {"train_loss": -24.444807052612305, "global_step": 189550, "epoch": 2283} {"train_loss": -24.35849952697754, "global_step": 189551, "epoch": 2283} {"train_loss": -24.16591453552246, "global_step": 189552, "epoch": 2283} {"train_loss": -24.068296432495117, "global_step": 189553, "epoch": 2283} {"train_loss": -24.48552894592285, "global_step": 189554, "epoch": 2283} {"train_loss": -24.17316246032715, "global_step": 189555, "epoch": 2283} {"train_loss": -23.811609268188477, "global_step": 189556, "epoch": 2283} {"train_loss": -23.94141960144043, "global_step": 189557, "epoch": 2283} {"train_loss": -23.95038414001465, "global_step": 189558, "epoch": 2283} {"train_loss": -24.363496780395508, "global_step": 189559, "epoch": 2283} {"train_loss": -24.24583625793457, "global_step": 189560, "epoch": 2283} {"train_loss": -23.831266403198242, "global_step": 189561, "epoch": 2283} {"train_loss": -24.264341354370117, "global_step": 189562, "epoch": 2283} {"train_loss": -23.99741554260254, "global_step": 189563, "epoch": 2283} {"train_loss": -24.090524673461914, "global_step": 189564, "epoch": 2283} {"train_loss": -24.071550369262695, "global_step": 189565, "epoch": 2283} {"train_loss": -24.23023796081543, "global_step": 189566, "epoch": 2283} {"train_loss": -24.30756950378418, "global_step": 189567, "epoch": 2283} {"train_loss": -24.149925231933594, "global_step": 189568, "epoch": 2283} {"train_loss": -24.10625457763672, "global_step": 189569, "epoch": 2283} {"train_loss": -23.98907470703125, "global_step": 189570, "epoch": 2283} {"train_loss": -23.87823920652091, "global_step": 189571, "epoch": 2283, "val_loss": 6480597.0} {"train_loss": -23.978551864624023, "global_step": 189572, "epoch": 2284} {"train_loss": -23.612646102905273, "global_step": 189573, "epoch": 2284} {"train_loss": -23.922677993774414, "global_step": 189574, "epoch": 2284} {"train_loss": -24.084009170532227, "global_step": 189575, "epoch": 2284} {"train_loss": -24.26138687133789, "global_step": 189576, "epoch": 2284} {"train_loss": -23.93024444580078, "global_step": 189577, "epoch": 2284} {"train_loss": -23.9074649810791, "global_step": 189578, "epoch": 2284} {"train_loss": -24.14423942565918, "global_step": 189579, "epoch": 2284} {"train_loss": -23.84764289855957, "global_step": 189580, "epoch": 2284} {"train_loss": -23.853267669677734, "global_step": 189581, "epoch": 2284} {"train_loss": -23.909658432006836, "global_step": 189582, "epoch": 2284} {"train_loss": -24.27750015258789, "global_step": 189583, "epoch": 2284} {"train_loss": -24.0111141204834, "global_step": 189584, "epoch": 2284} {"train_loss": -24.00495719909668, "global_step": 189585, "epoch": 2284} {"train_loss": -23.627431869506836, "global_step": 189586, "epoch": 2284} {"train_loss": -24.092578887939453, "global_step": 189587, "epoch": 2284} {"train_loss": -24.315195083618164, "global_step": 189588, "epoch": 2284} {"train_loss": -24.334060668945312, "global_step": 189589, "epoch": 2284} {"train_loss": -23.72314453125, "global_step": 189590, "epoch": 2284} {"train_loss": -24.085697174072266, "global_step": 189591, "epoch": 2284} {"train_loss": -24.352340698242188, "global_step": 189592, "epoch": 2284} {"train_loss": -24.196622848510742, "global_step": 189593, "epoch": 2284} {"train_loss": -24.44874382019043, "global_step": 189594, "epoch": 2284} {"train_loss": -24.1825008392334, "global_step": 189595, "epoch": 2284} {"train_loss": -24.313512802124023, "global_step": 189596, "epoch": 2284} {"train_loss": -23.96906852722168, "global_step": 189597, "epoch": 2284} {"train_loss": -24.2309627532959, "global_step": 189598, "epoch": 2284} {"train_loss": -24.078027725219727, "global_step": 189599, "epoch": 2284} {"train_loss": -24.32805824279785, "global_step": 189600, "epoch": 2284} {"train_loss": -24.269638061523438, "global_step": 189601, "epoch": 2284} {"train_loss": -24.062650680541992, "global_step": 189602, "epoch": 2284} {"train_loss": -24.097206115722656, "global_step": 189603, "epoch": 2284} {"train_loss": -24.499536514282227, "global_step": 189604, "epoch": 2284} {"train_loss": -24.177492141723633, "global_step": 189605, "epoch": 2284} {"train_loss": -23.99561882019043, "global_step": 189606, "epoch": 2284} {"train_loss": -23.764623641967773, "global_step": 189607, "epoch": 2284} {"train_loss": -24.188024520874023, "global_step": 189608, "epoch": 2284} {"train_loss": -24.27840232849121, "global_step": 189609, "epoch": 2284} {"train_loss": -24.26649284362793, "global_step": 189610, "epoch": 2284} {"train_loss": -24.0432071685791, "global_step": 189611, "epoch": 2284} {"train_loss": -24.343189239501953, "global_step": 189612, "epoch": 2284} {"train_loss": -24.041784286499023, "global_step": 189613, "epoch": 2284} {"train_loss": -23.86117935180664, "global_step": 189614, "epoch": 2284} {"train_loss": -24.026094436645508, "global_step": 189615, "epoch": 2284} {"train_loss": -24.225671768188477, "global_step": 189616, "epoch": 2284} {"train_loss": -24.244874954223633, "global_step": 189617, "epoch": 2284} {"train_loss": -24.10477066040039, "global_step": 189618, "epoch": 2284} {"train_loss": -24.264875411987305, "global_step": 189619, "epoch": 2284} {"train_loss": -23.960763931274414, "global_step": 189620, "epoch": 2284} {"train_loss": -23.60259246826172, "global_step": 189621, "epoch": 2284} {"train_loss": -24.061914443969727, "global_step": 189622, "epoch": 2284} {"train_loss": -23.775983810424805, "global_step": 189623, "epoch": 2284} {"train_loss": -23.566640853881836, "global_step": 189624, "epoch": 2284} {"train_loss": -23.52144432067871, "global_step": 189625, "epoch": 2284} {"train_loss": -24.406225204467773, "global_step": 189626, "epoch": 2284} {"train_loss": -24.00455093383789, "global_step": 189627, "epoch": 2284} {"train_loss": -23.86670684814453, "global_step": 189628, "epoch": 2284} {"train_loss": -24.14908790588379, "global_step": 189629, "epoch": 2284} {"train_loss": -24.192148208618164, "global_step": 189630, "epoch": 2284} {"train_loss": -24.119827270507812, "global_step": 189631, "epoch": 2284} {"train_loss": -23.899124145507812, "global_step": 189632, "epoch": 2284} {"train_loss": -23.928024291992188, "global_step": 189633, "epoch": 2284} {"train_loss": -23.967519760131836, "global_step": 189634, "epoch": 2284} {"train_loss": -24.376144409179688, "global_step": 189635, "epoch": 2284} {"train_loss": -24.041152954101562, "global_step": 189636, "epoch": 2284} {"train_loss": -23.88504981994629, "global_step": 189637, "epoch": 2284} {"train_loss": -23.945941925048828, "global_step": 189638, "epoch": 2284} {"train_loss": -23.83157730102539, "global_step": 189639, "epoch": 2284} {"train_loss": -23.881336212158203, "global_step": 189640, "epoch": 2284} {"train_loss": -23.976675033569336, "global_step": 189641, "epoch": 2284} {"train_loss": -24.03529167175293, "global_step": 189642, "epoch": 2284} {"train_loss": -24.39082145690918, "global_step": 189643, "epoch": 2284} {"train_loss": -24.152231216430664, "global_step": 189644, "epoch": 2284} {"train_loss": -24.404760360717773, "global_step": 189645, "epoch": 2284} {"train_loss": -23.310178756713867, "global_step": 189646, "epoch": 2284} {"train_loss": -23.729900360107422, "global_step": 189647, "epoch": 2284} {"train_loss": -23.788938522338867, "global_step": 189648, "epoch": 2284} {"train_loss": -24.25006675720215, "global_step": 189649, "epoch": 2284} {"train_loss": -24.034360885620117, "global_step": 189650, "epoch": 2284} {"train_loss": -23.554227828979492, "global_step": 189651, "epoch": 2284} {"train_loss": -23.97163200378418, "global_step": 189652, "epoch": 2284} {"train_loss": -24.053485870361328, "global_step": 189653, "epoch": 2284} {"train_loss": -24.030473295464574, "global_step": 189654, "epoch": 2284, "val_loss": 6581944.0} {"train_loss": -22.963205337524414, "global_step": 189655, "epoch": 2285} {"train_loss": -23.90566062927246, "global_step": 189656, "epoch": 2285} {"train_loss": -23.430326461791992, "global_step": 189657, "epoch": 2285} {"train_loss": -23.56129264831543, "global_step": 189658, "epoch": 2285} {"train_loss": -23.174983978271484, "global_step": 189659, "epoch": 2285} {"train_loss": -23.425037384033203, "global_step": 189660, "epoch": 2285} {"train_loss": -23.25624656677246, "global_step": 189661, "epoch": 2285} {"train_loss": -23.919363021850586, "global_step": 189662, "epoch": 2285} {"train_loss": -23.59566307067871, "global_step": 189663, "epoch": 2285} {"train_loss": -23.079256057739258, "global_step": 189664, "epoch": 2285} {"train_loss": -23.894834518432617, "global_step": 189665, "epoch": 2285} {"train_loss": -23.55470848083496, "global_step": 189666, "epoch": 2285} {"train_loss": -23.577497482299805, "global_step": 189667, "epoch": 2285} {"train_loss": -23.929906845092773, "global_step": 189668, "epoch": 2285} {"train_loss": -24.042463302612305, "global_step": 189669, "epoch": 2285} {"train_loss": -23.945953369140625, "global_step": 189670, "epoch": 2285} {"train_loss": -24.11731719970703, "global_step": 189671, "epoch": 2285} {"train_loss": -23.674579620361328, "global_step": 189672, "epoch": 2285} {"train_loss": -23.9097957611084, "global_step": 189673, "epoch": 2285} {"train_loss": -24.08416748046875, "global_step": 189674, "epoch": 2285} {"train_loss": -23.76984977722168, "global_step": 189675, "epoch": 2285} {"train_loss": -23.888187408447266, "global_step": 189676, "epoch": 2285} {"train_loss": -24.068740844726562, "global_step": 189677, "epoch": 2285} {"train_loss": -23.727354049682617, "global_step": 189678, "epoch": 2285} {"train_loss": -23.9437313079834, "global_step": 189679, "epoch": 2285} {"train_loss": -24.36236572265625, "global_step": 189680, "epoch": 2285} {"train_loss": -23.999235153198242, "global_step": 189681, "epoch": 2285} {"train_loss": -23.959196090698242, "global_step": 189682, "epoch": 2285} {"train_loss": -23.939313888549805, "global_step": 189683, "epoch": 2285} {"train_loss": -24.089563369750977, "global_step": 189684, "epoch": 2285} {"train_loss": -23.92235565185547, "global_step": 189685, "epoch": 2285} {"train_loss": -23.776742935180664, "global_step": 189686, "epoch": 2285} {"train_loss": -23.690744400024414, "global_step": 189687, "epoch": 2285} {"train_loss": -24.07953453063965, "global_step": 189688, "epoch": 2285} {"train_loss": -23.82954216003418, "global_step": 189689, "epoch": 2285} {"train_loss": -23.970125198364258, "global_step": 189690, "epoch": 2285} {"train_loss": -24.104427337646484, "global_step": 189691, "epoch": 2285} {"train_loss": -24.141263961791992, "global_step": 189692, "epoch": 2285} {"train_loss": -24.45722007751465, "global_step": 189693, "epoch": 2285} {"train_loss": -24.069473266601562, "global_step": 189694, "epoch": 2285} {"train_loss": -24.041858673095703, "global_step": 189695, "epoch": 2285} {"train_loss": -23.83794593811035, "global_step": 189696, "epoch": 2285} {"train_loss": -23.850505828857422, "global_step": 189697, "epoch": 2285} {"train_loss": -24.263946533203125, "global_step": 189698, "epoch": 2285} {"train_loss": -23.971242904663086, "global_step": 189699, "epoch": 2285} {"train_loss": -23.89432144165039, "global_step": 189700, "epoch": 2285} {"train_loss": -24.108102798461914, "global_step": 189701, "epoch": 2285} {"train_loss": -23.975767135620117, "global_step": 189702, "epoch": 2285} {"train_loss": -24.143211364746094, "global_step": 189703, "epoch": 2285} {"train_loss": -24.41181755065918, "global_step": 189704, "epoch": 2285} {"train_loss": -24.012592315673828, "global_step": 189705, "epoch": 2285} {"train_loss": -24.17903709411621, "global_step": 189706, "epoch": 2285} {"train_loss": -24.318317413330078, "global_step": 189707, "epoch": 2285} {"train_loss": -24.143281936645508, "global_step": 189708, "epoch": 2285} {"train_loss": -24.116321563720703, "global_step": 189709, "epoch": 2285} {"train_loss": -23.888059616088867, "global_step": 189710, "epoch": 2285} {"train_loss": -24.05985450744629, "global_step": 189711, "epoch": 2285} {"train_loss": -24.2708683013916, "global_step": 189712, "epoch": 2285} {"train_loss": -24.47966194152832, "global_step": 189713, "epoch": 2285} {"train_loss": -24.328500747680664, "global_step": 189714, "epoch": 2285} {"train_loss": -24.11650848388672, "global_step": 189715, "epoch": 2285} {"train_loss": -24.2839412689209, "global_step": 189716, "epoch": 2285} {"train_loss": -24.07210350036621, "global_step": 189717, "epoch": 2285} {"train_loss": -23.98654556274414, "global_step": 189718, "epoch": 2285} {"train_loss": -24.40419578552246, "global_step": 189719, "epoch": 2285} {"train_loss": -24.1107177734375, "global_step": 189720, "epoch": 2285} {"train_loss": -24.199811935424805, "global_step": 189721, "epoch": 2285} {"train_loss": -24.23211669921875, "global_step": 189722, "epoch": 2285} {"train_loss": -24.275146484375, "global_step": 189723, "epoch": 2285} {"train_loss": -23.880460739135742, "global_step": 189724, "epoch": 2285} {"train_loss": -23.758037567138672, "global_step": 189725, "epoch": 2285} {"train_loss": -24.338422775268555, "global_step": 189726, "epoch": 2285} {"train_loss": -24.26253318786621, "global_step": 189727, "epoch": 2285} {"train_loss": -23.84685707092285, "global_step": 189728, "epoch": 2285} {"train_loss": -23.624679565429688, "global_step": 189729, "epoch": 2285} {"train_loss": -23.920486450195312, "global_step": 189730, "epoch": 2285} {"train_loss": -24.57209014892578, "global_step": 189731, "epoch": 2285} {"train_loss": -24.147308349609375, "global_step": 189732, "epoch": 2285} {"train_loss": -24.25623893737793, "global_step": 189733, "epoch": 2285} {"train_loss": -24.348987579345703, "global_step": 189734, "epoch": 2285} {"train_loss": -24.02266502380371, "global_step": 189735, "epoch": 2285} {"train_loss": -24.292268753051758, "global_step": 189736, "epoch": 2285} {"train_loss": -23.983356108148413, "global_step": 189737, "epoch": 2285, "val_loss": 6450445.0} {"train_loss": -23.722217559814453, "global_step": 189738, "epoch": 2286} {"train_loss": -23.296873092651367, "global_step": 189739, "epoch": 2286} {"train_loss": -23.8867244720459, "global_step": 189740, "epoch": 2286} {"train_loss": -23.18360710144043, "global_step": 189741, "epoch": 2286} {"train_loss": -22.96465301513672, "global_step": 189742, "epoch": 2286} {"train_loss": -23.108198165893555, "global_step": 189743, "epoch": 2286} {"train_loss": -23.535829544067383, "global_step": 189744, "epoch": 2286} {"train_loss": -23.404417037963867, "global_step": 189745, "epoch": 2286} {"train_loss": -23.52265739440918, "global_step": 189746, "epoch": 2286} {"train_loss": -23.56330108642578, "global_step": 189747, "epoch": 2286} {"train_loss": -23.563234329223633, "global_step": 189748, "epoch": 2286} {"train_loss": -23.997526168823242, "global_step": 189749, "epoch": 2286} {"train_loss": -23.705324172973633, "global_step": 189750, "epoch": 2286} {"train_loss": -23.530553817749023, "global_step": 189751, "epoch": 2286} {"train_loss": -23.88738250732422, "global_step": 189752, "epoch": 2286} {"train_loss": -23.484256744384766, "global_step": 189753, "epoch": 2286} {"train_loss": -23.676477432250977, "global_step": 189754, "epoch": 2286} {"train_loss": -23.550661087036133, "global_step": 189755, "epoch": 2286} {"train_loss": -23.647037506103516, "global_step": 189756, "epoch": 2286} {"train_loss": -24.05039405822754, "global_step": 189757, "epoch": 2286} {"train_loss": -23.906570434570312, "global_step": 189758, "epoch": 2286} {"train_loss": -23.59894371032715, "global_step": 189759, "epoch": 2286} {"train_loss": -24.020666122436523, "global_step": 189760, "epoch": 2286} {"train_loss": -23.737918853759766, "global_step": 189761, "epoch": 2286} {"train_loss": -24.066267013549805, "global_step": 189762, "epoch": 2286} {"train_loss": -23.702945709228516, "global_step": 189763, "epoch": 2286} {"train_loss": -24.22370719909668, "global_step": 189764, "epoch": 2286} {"train_loss": -24.052143096923828, "global_step": 189765, "epoch": 2286} {"train_loss": -23.775196075439453, "global_step": 189766, "epoch": 2286} {"train_loss": -24.1366024017334, "global_step": 189767, "epoch": 2286} {"train_loss": -24.141597747802734, "global_step": 189768, "epoch": 2286} {"train_loss": -23.787229537963867, "global_step": 189769, "epoch": 2286} {"train_loss": -23.806772232055664, "global_step": 189770, "epoch": 2286} {"train_loss": -24.30344581604004, "global_step": 189771, "epoch": 2286} {"train_loss": -24.082136154174805, "global_step": 189772, "epoch": 2286} {"train_loss": -24.01975440979004, "global_step": 189773, "epoch": 2286} {"train_loss": -24.296964645385742, "global_step": 189774, "epoch": 2286} {"train_loss": -24.145282745361328, "global_step": 189775, "epoch": 2286} {"train_loss": -23.968402862548828, "global_step": 189776, "epoch": 2286} {"train_loss": -24.193456649780273, "global_step": 189777, "epoch": 2286} {"train_loss": -23.932401657104492, "global_step": 189778, "epoch": 2286} {"train_loss": -24.207218170166016, "global_step": 189779, "epoch": 2286} {"train_loss": -24.374698638916016, "global_step": 189780, "epoch": 2286} {"train_loss": -24.219207763671875, "global_step": 189781, "epoch": 2286} {"train_loss": -24.373945236206055, "global_step": 189782, "epoch": 2286} {"train_loss": -23.88600730895996, "global_step": 189783, "epoch": 2286} {"train_loss": -24.243864059448242, "global_step": 189784, "epoch": 2286} {"train_loss": -24.255661010742188, "global_step": 189785, "epoch": 2286} {"train_loss": -24.288238525390625, "global_step": 189786, "epoch": 2286} {"train_loss": -24.399507522583008, "global_step": 189787, "epoch": 2286} {"train_loss": -24.015119552612305, "global_step": 189788, "epoch": 2286} {"train_loss": -24.194307327270508, "global_step": 189789, "epoch": 2286} {"train_loss": -24.064477920532227, "global_step": 189790, "epoch": 2286} {"train_loss": -24.0842227935791, "global_step": 189791, "epoch": 2286} {"train_loss": -23.878820419311523, "global_step": 189792, "epoch": 2286} {"train_loss": -24.0891170501709, "global_step": 189793, "epoch": 2286} {"train_loss": -23.846149444580078, "global_step": 189794, "epoch": 2286} {"train_loss": -23.25226402282715, "global_step": 189795, "epoch": 2286} {"train_loss": -23.491596221923828, "global_step": 189796, "epoch": 2286} {"train_loss": -23.917699813842773, "global_step": 189797, "epoch": 2286} {"train_loss": -23.880460739135742, "global_step": 189798, "epoch": 2286} {"train_loss": -23.542774200439453, "global_step": 189799, "epoch": 2286} {"train_loss": -23.630985260009766, "global_step": 189800, "epoch": 2286} {"train_loss": -24.061574935913086, "global_step": 189801, "epoch": 2286} {"train_loss": -24.185287475585938, "global_step": 189802, "epoch": 2286} {"train_loss": -23.50065040588379, "global_step": 189803, "epoch": 2286} {"train_loss": -23.907838821411133, "global_step": 189804, "epoch": 2286} {"train_loss": -24.023193359375, "global_step": 189805, "epoch": 2286} {"train_loss": -24.134443283081055, "global_step": 189806, "epoch": 2286} {"train_loss": -23.974254608154297, "global_step": 189807, "epoch": 2286} {"train_loss": -24.260419845581055, "global_step": 189808, "epoch": 2286} {"train_loss": -23.924253463745117, "global_step": 189809, "epoch": 2286} {"train_loss": -23.777647018432617, "global_step": 189810, "epoch": 2286} {"train_loss": -24.255102157592773, "global_step": 189811, "epoch": 2286} {"train_loss": -23.99088478088379, "global_step": 189812, "epoch": 2286} {"train_loss": -24.141096115112305, "global_step": 189813, "epoch": 2286} {"train_loss": -24.224416732788086, "global_step": 189814, "epoch": 2286} {"train_loss": -24.243274688720703, "global_step": 189815, "epoch": 2286} {"train_loss": -24.029769897460938, "global_step": 189816, "epoch": 2286} {"train_loss": -24.24684715270996, "global_step": 189817, "epoch": 2286} {"train_loss": -23.69784927368164, "global_step": 189818, "epoch": 2286} {"train_loss": -24.001501083374023, "global_step": 189819, "epoch": 2286} {"train_loss": -23.90721148755177, "global_step": 189820, "epoch": 2286, "val_loss": 6333034.0} {"train_loss": -23.814220428466797, "global_step": 189821, "epoch": 2287} {"train_loss": -23.97237205505371, "global_step": 189822, "epoch": 2287} {"train_loss": -23.48520278930664, "global_step": 189823, "epoch": 2287} {"train_loss": -23.744571685791016, "global_step": 189824, "epoch": 2287} {"train_loss": -24.016454696655273, "global_step": 189825, "epoch": 2287} {"train_loss": -23.967714309692383, "global_step": 189826, "epoch": 2287} {"train_loss": -23.82515525817871, "global_step": 189827, "epoch": 2287} {"train_loss": -23.931835174560547, "global_step": 189828, "epoch": 2287} {"train_loss": -24.06913948059082, "global_step": 189829, "epoch": 2287} {"train_loss": -24.073827743530273, "global_step": 189830, "epoch": 2287} {"train_loss": -24.03461265563965, "global_step": 189831, "epoch": 2287} {"train_loss": -24.108449935913086, "global_step": 189832, "epoch": 2287} {"train_loss": -24.220502853393555, "global_step": 189833, "epoch": 2287} {"train_loss": -23.99997329711914, "global_step": 189834, "epoch": 2287} {"train_loss": -24.295339584350586, "global_step": 189835, "epoch": 2287} {"train_loss": -24.71749496459961, "global_step": 189836, "epoch": 2287} {"train_loss": -23.755643844604492, "global_step": 189837, "epoch": 2287} {"train_loss": -24.396150588989258, "global_step": 189838, "epoch": 2287} {"train_loss": -24.239826202392578, "global_step": 189839, "epoch": 2287} {"train_loss": -24.281204223632812, "global_step": 189840, "epoch": 2287} {"train_loss": -23.945154190063477, "global_step": 189841, "epoch": 2287} {"train_loss": -24.04433822631836, "global_step": 189842, "epoch": 2287} {"train_loss": -23.940021514892578, "global_step": 189843, "epoch": 2287} {"train_loss": -24.291091918945312, "global_step": 189844, "epoch": 2287} {"train_loss": -24.54705047607422, "global_step": 189845, "epoch": 2287} {"train_loss": -24.600013732910156, "global_step": 189846, "epoch": 2287} {"train_loss": -24.50676918029785, "global_step": 189847, "epoch": 2287} {"train_loss": -24.470478057861328, "global_step": 189848, "epoch": 2287} {"train_loss": -24.242374420166016, "global_step": 189849, "epoch": 2287} {"train_loss": -24.41823959350586, "global_step": 189850, "epoch": 2287} {"train_loss": -24.286861419677734, "global_step": 189851, "epoch": 2287} {"train_loss": -24.171371459960938, "global_step": 189852, "epoch": 2287} {"train_loss": -24.331823348999023, "global_step": 189853, "epoch": 2287} {"train_loss": -23.953886032104492, "global_step": 189854, "epoch": 2287} {"train_loss": -23.90256118774414, "global_step": 189855, "epoch": 2287} {"train_loss": -23.894332885742188, "global_step": 189856, "epoch": 2287} {"train_loss": -24.203184127807617, "global_step": 189857, "epoch": 2287} {"train_loss": -24.030080795288086, "global_step": 189858, "epoch": 2287} {"train_loss": -23.937618255615234, "global_step": 189859, "epoch": 2287} {"train_loss": -24.1516170501709, "global_step": 189860, "epoch": 2287} {"train_loss": -23.973270416259766, "global_step": 189861, "epoch": 2287} {"train_loss": -24.014307022094727, "global_step": 189862, "epoch": 2287} {"train_loss": -24.012449264526367, "global_step": 189863, "epoch": 2287} {"train_loss": -24.236083984375, "global_step": 189864, "epoch": 2287} {"train_loss": -23.870712280273438, "global_step": 189865, "epoch": 2287} {"train_loss": -23.91444969177246, "global_step": 189866, "epoch": 2287} {"train_loss": -23.87564468383789, "global_step": 189867, "epoch": 2287} {"train_loss": -23.994617462158203, "global_step": 189868, "epoch": 2287} {"train_loss": -24.058475494384766, "global_step": 189869, "epoch": 2287} {"train_loss": -23.868404388427734, "global_step": 189870, "epoch": 2287} {"train_loss": -24.25442886352539, "global_step": 189871, "epoch": 2287} {"train_loss": -23.874914169311523, "global_step": 189872, "epoch": 2287} {"train_loss": -24.307493209838867, "global_step": 189873, "epoch": 2287} {"train_loss": -24.207361221313477, "global_step": 189874, "epoch": 2287} {"train_loss": -24.222158432006836, "global_step": 189875, "epoch": 2287} {"train_loss": -23.880273818969727, "global_step": 189876, "epoch": 2287} {"train_loss": -24.245986938476562, "global_step": 189877, "epoch": 2287} {"train_loss": -23.962812423706055, "global_step": 189878, "epoch": 2287} {"train_loss": -24.119335174560547, "global_step": 189879, "epoch": 2287} {"train_loss": -24.110414505004883, "global_step": 189880, "epoch": 2287} {"train_loss": -24.128469467163086, "global_step": 189881, "epoch": 2287} {"train_loss": -24.11470603942871, "global_step": 189882, "epoch": 2287} {"train_loss": -24.318626403808594, "global_step": 189883, "epoch": 2287} {"train_loss": -24.642545700073242, "global_step": 189884, "epoch": 2287} {"train_loss": -23.80682373046875, "global_step": 189885, "epoch": 2287} {"train_loss": -24.108015060424805, "global_step": 189886, "epoch": 2287} {"train_loss": -24.192474365234375, "global_step": 189887, "epoch": 2287} {"train_loss": -23.839570999145508, "global_step": 189888, "epoch": 2287} {"train_loss": -23.982725143432617, "global_step": 189889, "epoch": 2287} {"train_loss": -24.28053092956543, "global_step": 189890, "epoch": 2287} {"train_loss": -23.981475830078125, "global_step": 189891, "epoch": 2287} {"train_loss": -23.791486740112305, "global_step": 189892, "epoch": 2287} {"train_loss": -24.359663009643555, "global_step": 189893, "epoch": 2287} {"train_loss": -23.90673828125, "global_step": 189894, "epoch": 2287} {"train_loss": -24.226064682006836, "global_step": 189895, "epoch": 2287} {"train_loss": -24.21567153930664, "global_step": 189896, "epoch": 2287} {"train_loss": -23.927377700805664, "global_step": 189897, "epoch": 2287} {"train_loss": -24.153369903564453, "global_step": 189898, "epoch": 2287} {"train_loss": -23.8053035736084, "global_step": 189899, "epoch": 2287} {"train_loss": -24.214923858642578, "global_step": 189900, "epoch": 2287} {"train_loss": -24.19158935546875, "global_step": 189901, "epoch": 2287} {"train_loss": -23.849048614501953, "global_step": 189902, "epoch": 2287} {"train_loss": -24.08992588089173, "global_step": 189903, "epoch": 2287, "val_loss": 6616883.5} {"train_loss": -20.646831512451172, "global_step": 189904, "epoch": 2288} {"train_loss": -22.02803611755371, "global_step": 189905, "epoch": 2288} {"train_loss": -21.159902572631836, "global_step": 189906, "epoch": 2288} {"train_loss": -23.009767532348633, "global_step": 189907, "epoch": 2288} {"train_loss": -21.435503005981445, "global_step": 189908, "epoch": 2288} {"train_loss": -22.7861270904541, "global_step": 189909, "epoch": 2288} {"train_loss": -22.405271530151367, "global_step": 189910, "epoch": 2288} {"train_loss": -22.18247413635254, "global_step": 189911, "epoch": 2288} {"train_loss": -23.030282974243164, "global_step": 189912, "epoch": 2288} {"train_loss": -22.844833374023438, "global_step": 189913, "epoch": 2288} {"train_loss": -22.6910343170166, "global_step": 189914, "epoch": 2288} {"train_loss": -22.837804794311523, "global_step": 189915, "epoch": 2288} {"train_loss": -23.051013946533203, "global_step": 189916, "epoch": 2288} {"train_loss": -22.989593505859375, "global_step": 189917, "epoch": 2288} {"train_loss": -22.862445831298828, "global_step": 189918, "epoch": 2288} {"train_loss": -22.96990394592285, "global_step": 189919, "epoch": 2288} {"train_loss": -22.952510833740234, "global_step": 189920, "epoch": 2288} {"train_loss": -23.34435272216797, "global_step": 189921, "epoch": 2288} {"train_loss": -23.104862213134766, "global_step": 189922, "epoch": 2288} {"train_loss": -23.105438232421875, "global_step": 189923, "epoch": 2288} {"train_loss": -22.988739013671875, "global_step": 189924, "epoch": 2288} {"train_loss": -23.200910568237305, "global_step": 189925, "epoch": 2288} {"train_loss": -23.39179229736328, "global_step": 189926, "epoch": 2288} {"train_loss": -23.587602615356445, "global_step": 189927, "epoch": 2288} {"train_loss": -23.273353576660156, "global_step": 189928, "epoch": 2288} {"train_loss": -23.14752197265625, "global_step": 189929, "epoch": 2288} {"train_loss": -23.37796974182129, "global_step": 189930, "epoch": 2288} {"train_loss": -23.157499313354492, "global_step": 189931, "epoch": 2288} {"train_loss": -23.606374740600586, "global_step": 189932, "epoch": 2288} {"train_loss": -23.402929306030273, "global_step": 189933, "epoch": 2288} {"train_loss": -23.751649856567383, "global_step": 189934, "epoch": 2288} {"train_loss": -23.61661720275879, "global_step": 189935, "epoch": 2288} {"train_loss": -23.61969757080078, "global_step": 189936, "epoch": 2288} {"train_loss": -24.0638484954834, "global_step": 189937, "epoch": 2288} {"train_loss": -23.626935958862305, "global_step": 189938, "epoch": 2288} {"train_loss": -23.90756607055664, "global_step": 189939, "epoch": 2288} {"train_loss": -23.485107421875, "global_step": 189940, "epoch": 2288} {"train_loss": -23.521276473999023, "global_step": 189941, "epoch": 2288} {"train_loss": -23.81678581237793, "global_step": 189942, "epoch": 2288} {"train_loss": -23.612211227416992, "global_step": 189943, "epoch": 2288} {"train_loss": -23.544418334960938, "global_step": 189944, "epoch": 2288} {"train_loss": -23.919702529907227, "global_step": 189945, "epoch": 2288} {"train_loss": -23.489065170288086, "global_step": 189946, "epoch": 2288} {"train_loss": -24.17792320251465, "global_step": 189947, "epoch": 2288} {"train_loss": -23.72856330871582, "global_step": 189948, "epoch": 2288} {"train_loss": -23.885122299194336, "global_step": 189949, "epoch": 2288} {"train_loss": -23.994775772094727, "global_step": 189950, "epoch": 2288} {"train_loss": -24.037553787231445, "global_step": 189951, "epoch": 2288} {"train_loss": -24.153663635253906, "global_step": 189952, "epoch": 2288} {"train_loss": -23.86012077331543, "global_step": 189953, "epoch": 2288} {"train_loss": -23.4375057220459, "global_step": 189954, "epoch": 2288} {"train_loss": -24.345869064331055, "global_step": 189955, "epoch": 2288} {"train_loss": -23.6009464263916, "global_step": 189956, "epoch": 2288} {"train_loss": -24.09278678894043, "global_step": 189957, "epoch": 2288} {"train_loss": -23.97150993347168, "global_step": 189958, "epoch": 2288} {"train_loss": -24.10858726501465, "global_step": 189959, "epoch": 2288} {"train_loss": -24.33742332458496, "global_step": 189960, "epoch": 2288} {"train_loss": -24.80235481262207, "global_step": 189961, "epoch": 2288} {"train_loss": -24.132356643676758, "global_step": 189962, "epoch": 2288} {"train_loss": -24.06207847595215, "global_step": 189963, "epoch": 2288} {"train_loss": -24.14005470275879, "global_step": 189964, "epoch": 2288} {"train_loss": -24.03656005859375, "global_step": 189965, "epoch": 2288} {"train_loss": -23.792299270629883, "global_step": 189966, "epoch": 2288} {"train_loss": -24.13193130493164, "global_step": 189967, "epoch": 2288} {"train_loss": -24.381887435913086, "global_step": 189968, "epoch": 2288} {"train_loss": -24.511411666870117, "global_step": 189969, "epoch": 2288} {"train_loss": -24.202686309814453, "global_step": 189970, "epoch": 2288} {"train_loss": -23.876953125, "global_step": 189971, "epoch": 2288} {"train_loss": -24.111364364624023, "global_step": 189972, "epoch": 2288} {"train_loss": -24.532299041748047, "global_step": 189973, "epoch": 2288} {"train_loss": -24.18252944946289, "global_step": 189974, "epoch": 2288} {"train_loss": -23.85772132873535, "global_step": 189975, "epoch": 2288} {"train_loss": -24.263172149658203, "global_step": 189976, "epoch": 2288} {"train_loss": -23.93525505065918, "global_step": 189977, "epoch": 2288} {"train_loss": -24.37299156188965, "global_step": 189978, "epoch": 2288} {"train_loss": -24.24058723449707, "global_step": 189979, "epoch": 2288} {"train_loss": -24.327571868896484, "global_step": 189980, "epoch": 2288} {"train_loss": -24.076946258544922, "global_step": 189981, "epoch": 2288} {"train_loss": -24.1243896484375, "global_step": 189982, "epoch": 2288} {"train_loss": -24.253225326538086, "global_step": 189983, "epoch": 2288} {"train_loss": -24.03922462463379, "global_step": 189984, "epoch": 2288} {"train_loss": -23.96396255493164, "global_step": 189985, "epoch": 2288} {"train_loss": -23.574459144868047, "global_step": 189986, "epoch": 2288, "val_loss": 6490172.0} {"train_loss": -23.856386184692383, "global_step": 189987, "epoch": 2289} {"train_loss": -24.16633415222168, "global_step": 189988, "epoch": 2289} {"train_loss": -24.013986587524414, "global_step": 189989, "epoch": 2289} {"train_loss": -24.191978454589844, "global_step": 189990, "epoch": 2289} {"train_loss": -24.06593894958496, "global_step": 189991, "epoch": 2289} {"train_loss": -24.289081573486328, "global_step": 189992, "epoch": 2289} {"train_loss": -23.96702003479004, "global_step": 189993, "epoch": 2289} {"train_loss": -24.03999137878418, "global_step": 189994, "epoch": 2289} {"train_loss": -23.91692543029785, "global_step": 189995, "epoch": 2289} {"train_loss": -24.20446014404297, "global_step": 189996, "epoch": 2289} {"train_loss": -23.961137771606445, "global_step": 189997, "epoch": 2289} {"train_loss": -23.845134735107422, "global_step": 189998, "epoch": 2289} {"train_loss": -24.080108642578125, "global_step": 189999, "epoch": 2289} {"train_loss": -23.73602867126465, "global_step": 190000, "epoch": 2289} {"train_loss": -24.0289363861084, "global_step": 190001, "epoch": 2289} {"train_loss": -23.876073837280273, "global_step": 190002, "epoch": 2289} {"train_loss": -24.120412826538086, "global_step": 190003, "epoch": 2289} {"train_loss": -23.980365753173828, "global_step": 190004, "epoch": 2289} {"train_loss": -23.992040634155273, "global_step": 190005, "epoch": 2289} {"train_loss": -24.05911636352539, "global_step": 190006, "epoch": 2289} {"train_loss": -23.881357192993164, "global_step": 190007, "epoch": 2289} {"train_loss": -23.79096031188965, "global_step": 190008, "epoch": 2289} {"train_loss": -24.156850814819336, "global_step": 190009, "epoch": 2289} {"train_loss": -24.19729995727539, "global_step": 190010, "epoch": 2289} {"train_loss": -24.327253341674805, "global_step": 190011, "epoch": 2289} {"train_loss": -24.282554626464844, "global_step": 190012, "epoch": 2289} {"train_loss": -23.918521881103516, "global_step": 190013, "epoch": 2289} {"train_loss": -24.289762496948242, "global_step": 190014, "epoch": 2289} {"train_loss": -24.21530532836914, "global_step": 190015, "epoch": 2289} {"train_loss": -24.041751861572266, "global_step": 190016, "epoch": 2289} {"train_loss": -23.947656631469727, "global_step": 190017, "epoch": 2289} {"train_loss": -24.198957443237305, "global_step": 190018, "epoch": 2289} {"train_loss": -24.27326774597168, "global_step": 190019, "epoch": 2289} {"train_loss": -24.27362632751465, "global_step": 190020, "epoch": 2289} {"train_loss": -24.06938934326172, "global_step": 190021, "epoch": 2289} {"train_loss": -23.900327682495117, "global_step": 190022, "epoch": 2289} {"train_loss": -24.347597122192383, "global_step": 190023, "epoch": 2289} {"train_loss": -23.847501754760742, "global_step": 190024, "epoch": 2289} {"train_loss": -24.232492446899414, "global_step": 190025, "epoch": 2289} {"train_loss": -24.06456184387207, "global_step": 190026, "epoch": 2289} {"train_loss": -24.392560958862305, "global_step": 190027, "epoch": 2289} {"train_loss": -23.925222396850586, "global_step": 190028, "epoch": 2289} {"train_loss": -24.309831619262695, "global_step": 190029, "epoch": 2289} {"train_loss": -24.245101928710938, "global_step": 190030, "epoch": 2289} {"train_loss": -24.281274795532227, "global_step": 190031, "epoch": 2289} {"train_loss": -24.075428009033203, "global_step": 190032, "epoch": 2289} {"train_loss": -24.094228744506836, "global_step": 190033, "epoch": 2289} {"train_loss": -24.15366554260254, "global_step": 190034, "epoch": 2289} {"train_loss": -24.216995239257812, "global_step": 190035, "epoch": 2289} {"train_loss": -24.477468490600586, "global_step": 190036, "epoch": 2289} {"train_loss": -24.305744171142578, "global_step": 190037, "epoch": 2289} {"train_loss": -23.924543380737305, "global_step": 190038, "epoch": 2289} {"train_loss": -24.00927734375, "global_step": 190039, "epoch": 2289} {"train_loss": -24.01895523071289, "global_step": 190040, "epoch": 2289} {"train_loss": -24.152456283569336, "global_step": 190041, "epoch": 2289} {"train_loss": -23.925214767456055, "global_step": 190042, "epoch": 2289} {"train_loss": -24.18046760559082, "global_step": 190043, "epoch": 2289} {"train_loss": -24.08514404296875, "global_step": 190044, "epoch": 2289} {"train_loss": -24.174020767211914, "global_step": 190045, "epoch": 2289} {"train_loss": -24.251680374145508, "global_step": 190046, "epoch": 2289} {"train_loss": -24.27631187438965, "global_step": 190047, "epoch": 2289} {"train_loss": -23.9827938079834, "global_step": 190048, "epoch": 2289} {"train_loss": -23.988155364990234, "global_step": 190049, "epoch": 2289} {"train_loss": -23.88992691040039, "global_step": 190050, "epoch": 2289} {"train_loss": -24.14456558227539, "global_step": 190051, "epoch": 2289} {"train_loss": -24.019187927246094, "global_step": 190052, "epoch": 2289} {"train_loss": -24.349693298339844, "global_step": 190053, "epoch": 2289} {"train_loss": -23.876569747924805, "global_step": 190054, "epoch": 2289} {"train_loss": -23.85221290588379, "global_step": 190055, "epoch": 2289} {"train_loss": -23.91351890563965, "global_step": 190056, "epoch": 2289} {"train_loss": -24.009252548217773, "global_step": 190057, "epoch": 2289} {"train_loss": -24.28278160095215, "global_step": 190058, "epoch": 2289} {"train_loss": -24.525320053100586, "global_step": 190059, "epoch": 2289} {"train_loss": -24.087644577026367, "global_step": 190060, "epoch": 2289} {"train_loss": -24.206329345703125, "global_step": 190061, "epoch": 2289} {"train_loss": -24.119104385375977, "global_step": 190062, "epoch": 2289} {"train_loss": -24.109283447265625, "global_step": 190063, "epoch": 2289} {"train_loss": -23.91973876953125, "global_step": 190064, "epoch": 2289} {"train_loss": -23.836551666259766, "global_step": 190065, "epoch": 2289} {"train_loss": -23.80449867248535, "global_step": 190066, "epoch": 2289} {"train_loss": -23.91400718688965, "global_step": 190067, "epoch": 2289} {"train_loss": -23.943748474121094, "global_step": 190068, "epoch": 2289} {"train_loss": -24.065332964242224, "global_step": 190069, "epoch": 2289, "val_loss": 6424949.0} {"train_loss": -23.61349868774414, "global_step": 190070, "epoch": 2290} {"train_loss": -23.679731369018555, "global_step": 190071, "epoch": 2290} {"train_loss": -23.89558982849121, "global_step": 190072, "epoch": 2290} {"train_loss": -23.647201538085938, "global_step": 190073, "epoch": 2290} {"train_loss": -23.418813705444336, "global_step": 190074, "epoch": 2290} {"train_loss": -23.785449981689453, "global_step": 190075, "epoch": 2290} {"train_loss": -23.55478286743164, "global_step": 190076, "epoch": 2290} {"train_loss": -23.898590087890625, "global_step": 190077, "epoch": 2290} {"train_loss": -24.318809509277344, "global_step": 190078, "epoch": 2290} {"train_loss": -24.19523048400879, "global_step": 190079, "epoch": 2290} {"train_loss": -23.856779098510742, "global_step": 190080, "epoch": 2290} {"train_loss": -24.395362854003906, "global_step": 190081, "epoch": 2290} {"train_loss": -24.089189529418945, "global_step": 190082, "epoch": 2290} {"train_loss": -23.573915481567383, "global_step": 190083, "epoch": 2290} {"train_loss": -24.075515747070312, "global_step": 190084, "epoch": 2290} {"train_loss": -23.998937606811523, "global_step": 190085, "epoch": 2290} {"train_loss": -24.02115249633789, "global_step": 190086, "epoch": 2290} {"train_loss": -23.711429595947266, "global_step": 190087, "epoch": 2290} {"train_loss": -23.877517700195312, "global_step": 190088, "epoch": 2290} {"train_loss": -23.79315185546875, "global_step": 190089, "epoch": 2290} {"train_loss": -24.187360763549805, "global_step": 190090, "epoch": 2290} {"train_loss": -23.728553771972656, "global_step": 190091, "epoch": 2290} {"train_loss": -24.205707550048828, "global_step": 190092, "epoch": 2290} {"train_loss": -23.780866622924805, "global_step": 190093, "epoch": 2290} {"train_loss": -23.9205322265625, "global_step": 190094, "epoch": 2290} {"train_loss": -24.06056022644043, "global_step": 190095, "epoch": 2290} {"train_loss": -23.90744972229004, "global_step": 190096, "epoch": 2290} {"train_loss": -24.005544662475586, "global_step": 190097, "epoch": 2290} {"train_loss": -23.97835350036621, "global_step": 190098, "epoch": 2290} {"train_loss": -24.25374412536621, "global_step": 190099, "epoch": 2290} {"train_loss": -23.89116096496582, "global_step": 190100, "epoch": 2290} {"train_loss": -23.785438537597656, "global_step": 190101, "epoch": 2290} {"train_loss": -23.87550163269043, "global_step": 190102, "epoch": 2290} {"train_loss": -23.73060417175293, "global_step": 190103, "epoch": 2290} {"train_loss": -23.891080856323242, "global_step": 190104, "epoch": 2290} {"train_loss": -23.719547271728516, "global_step": 190105, "epoch": 2290} {"train_loss": -24.04119300842285, "global_step": 190106, "epoch": 2290} {"train_loss": -23.47294807434082, "global_step": 190107, "epoch": 2290} {"train_loss": -23.790454864501953, "global_step": 190108, "epoch": 2290} {"train_loss": -24.038894653320312, "global_step": 190109, "epoch": 2290} {"train_loss": -23.720783233642578, "global_step": 190110, "epoch": 2290} {"train_loss": -23.754384994506836, "global_step": 190111, "epoch": 2290} {"train_loss": -23.903228759765625, "global_step": 190112, "epoch": 2290} {"train_loss": -23.849332809448242, "global_step": 190113, "epoch": 2290} {"train_loss": -24.124027252197266, "global_step": 190114, "epoch": 2290} {"train_loss": -23.96811866760254, "global_step": 190115, "epoch": 2290} {"train_loss": -24.179410934448242, "global_step": 190116, "epoch": 2290} {"train_loss": -23.695850372314453, "global_step": 190117, "epoch": 2290} {"train_loss": -23.775283813476562, "global_step": 190118, "epoch": 2290} {"train_loss": -23.952789306640625, "global_step": 190119, "epoch": 2290} {"train_loss": -23.984756469726562, "global_step": 190120, "epoch": 2290} {"train_loss": -24.091440200805664, "global_step": 190121, "epoch": 2290} {"train_loss": -23.87665367126465, "global_step": 190122, "epoch": 2290} {"train_loss": -23.894704818725586, "global_step": 190123, "epoch": 2290} {"train_loss": -23.92941665649414, "global_step": 190124, "epoch": 2290} {"train_loss": -24.233015060424805, "global_step": 190125, "epoch": 2290} {"train_loss": -23.927244186401367, "global_step": 190126, "epoch": 2290} {"train_loss": -24.01277732849121, "global_step": 190127, "epoch": 2290} {"train_loss": -24.105871200561523, "global_step": 190128, "epoch": 2290} {"train_loss": -24.194833755493164, "global_step": 190129, "epoch": 2290} {"train_loss": -24.295602798461914, "global_step": 190130, "epoch": 2290} {"train_loss": -24.385908126831055, "global_step": 190131, "epoch": 2290} {"train_loss": -24.278514862060547, "global_step": 190132, "epoch": 2290} {"train_loss": -24.152496337890625, "global_step": 190133, "epoch": 2290} {"train_loss": -23.8282527923584, "global_step": 190134, "epoch": 2290} {"train_loss": -23.77839469909668, "global_step": 190135, "epoch": 2290} {"train_loss": -23.867956161499023, "global_step": 190136, "epoch": 2290} {"train_loss": -24.308029174804688, "global_step": 190137, "epoch": 2290} {"train_loss": -24.161834716796875, "global_step": 190138, "epoch": 2290} {"train_loss": -24.60513687133789, "global_step": 190139, "epoch": 2290} {"train_loss": -24.21200942993164, "global_step": 190140, "epoch": 2290} {"train_loss": -24.415523529052734, "global_step": 190141, "epoch": 2290} {"train_loss": -23.83474349975586, "global_step": 190142, "epoch": 2290} {"train_loss": -24.240222930908203, "global_step": 190143, "epoch": 2290} {"train_loss": -23.877552032470703, "global_step": 190144, "epoch": 2290} {"train_loss": -24.35584831237793, "global_step": 190145, "epoch": 2290} {"train_loss": -24.32662010192871, "global_step": 190146, "epoch": 2290} {"train_loss": -24.35053062438965, "global_step": 190147, "epoch": 2290} {"train_loss": -24.21044921875, "global_step": 190148, "epoch": 2290} {"train_loss": -24.360275268554688, "global_step": 190149, "epoch": 2290} {"train_loss": -24.47751808166504, "global_step": 190150, "epoch": 2290} {"train_loss": -24.19172477722168, "global_step": 190151, "epoch": 2290} {"train_loss": -24.004173876291297, "global_step": 190152, "epoch": 2290, "val_loss": 6525144.0} {"train_loss": -23.708585739135742, "global_step": 190153, "epoch": 2291} {"train_loss": -22.774906158447266, "global_step": 190154, "epoch": 2291} {"train_loss": -23.403348922729492, "global_step": 190155, "epoch": 2291} {"train_loss": -22.81873893737793, "global_step": 190156, "epoch": 2291} {"train_loss": -23.278993606567383, "global_step": 190157, "epoch": 2291} {"train_loss": -23.915557861328125, "global_step": 190158, "epoch": 2291} {"train_loss": -23.481149673461914, "global_step": 190159, "epoch": 2291} {"train_loss": -23.19327735900879, "global_step": 190160, "epoch": 2291} {"train_loss": -23.324878692626953, "global_step": 190161, "epoch": 2291} {"train_loss": -23.441801071166992, "global_step": 190162, "epoch": 2291} {"train_loss": -23.557279586791992, "global_step": 190163, "epoch": 2291} {"train_loss": -23.48567771911621, "global_step": 190164, "epoch": 2291} {"train_loss": -23.10732078552246, "global_step": 190165, "epoch": 2291} {"train_loss": -23.550859451293945, "global_step": 190166, "epoch": 2291} {"train_loss": -23.726911544799805, "global_step": 190167, "epoch": 2291} {"train_loss": -23.36623191833496, "global_step": 190168, "epoch": 2291} {"train_loss": -23.81180191040039, "global_step": 190169, "epoch": 2291} {"train_loss": -23.551733016967773, "global_step": 190170, "epoch": 2291} {"train_loss": -23.83662223815918, "global_step": 190171, "epoch": 2291} {"train_loss": -23.92072868347168, "global_step": 190172, "epoch": 2291} {"train_loss": -23.887311935424805, "global_step": 190173, "epoch": 2291} {"train_loss": -23.897199630737305, "global_step": 190174, "epoch": 2291} {"train_loss": -23.81475257873535, "global_step": 190175, "epoch": 2291} {"train_loss": -24.071866989135742, "global_step": 190176, "epoch": 2291} {"train_loss": -23.516984939575195, "global_step": 190177, "epoch": 2291} {"train_loss": -23.783475875854492, "global_step": 190178, "epoch": 2291} {"train_loss": -24.340801239013672, "global_step": 190179, "epoch": 2291} {"train_loss": -23.995222091674805, "global_step": 190180, "epoch": 2291} {"train_loss": -24.01715660095215, "global_step": 190181, "epoch": 2291} {"train_loss": -23.98856544494629, "global_step": 190182, "epoch": 2291} {"train_loss": -23.733091354370117, "global_step": 190183, "epoch": 2291} {"train_loss": -24.039297103881836, "global_step": 190184, "epoch": 2291} {"train_loss": -24.242841720581055, "global_step": 190185, "epoch": 2291} {"train_loss": -24.12848472595215, "global_step": 190186, "epoch": 2291} {"train_loss": -24.093997955322266, "global_step": 190187, "epoch": 2291} {"train_loss": -24.372608184814453, "global_step": 190188, "epoch": 2291} {"train_loss": -23.80971336364746, "global_step": 190189, "epoch": 2291} {"train_loss": -24.081268310546875, "global_step": 190190, "epoch": 2291} {"train_loss": -24.087661743164062, "global_step": 190191, "epoch": 2291} {"train_loss": -24.007381439208984, "global_step": 190192, "epoch": 2291} {"train_loss": -23.841659545898438, "global_step": 190193, "epoch": 2291} {"train_loss": -23.99418830871582, "global_step": 190194, "epoch": 2291} {"train_loss": -23.83193016052246, "global_step": 190195, "epoch": 2291} {"train_loss": -24.004501342773438, "global_step": 190196, "epoch": 2291} {"train_loss": -24.086376190185547, "global_step": 190197, "epoch": 2291} {"train_loss": -23.720041275024414, "global_step": 190198, "epoch": 2291} {"train_loss": -24.11748695373535, "global_step": 190199, "epoch": 2291} {"train_loss": -23.61368751525879, "global_step": 190200, "epoch": 2291} {"train_loss": -23.960607528686523, "global_step": 190201, "epoch": 2291} {"train_loss": -24.143146514892578, "global_step": 190202, "epoch": 2291} {"train_loss": -23.69056510925293, "global_step": 190203, "epoch": 2291} {"train_loss": -24.21453285217285, "global_step": 190204, "epoch": 2291} {"train_loss": -23.57213592529297, "global_step": 190205, "epoch": 2291} {"train_loss": -24.115217208862305, "global_step": 190206, "epoch": 2291} {"train_loss": -23.93643569946289, "global_step": 190207, "epoch": 2291} {"train_loss": -24.304563522338867, "global_step": 190208, "epoch": 2291} {"train_loss": -24.14632225036621, "global_step": 190209, "epoch": 2291} {"train_loss": -24.296321868896484, "global_step": 190210, "epoch": 2291} {"train_loss": -24.095256805419922, "global_step": 190211, "epoch": 2291} {"train_loss": -24.40152931213379, "global_step": 190212, "epoch": 2291} {"train_loss": -24.362375259399414, "global_step": 190213, "epoch": 2291} {"train_loss": -24.04305076599121, "global_step": 190214, "epoch": 2291} {"train_loss": -24.404926300048828, "global_step": 190215, "epoch": 2291} {"train_loss": -24.414512634277344, "global_step": 190216, "epoch": 2291} {"train_loss": -24.015317916870117, "global_step": 190217, "epoch": 2291} {"train_loss": -23.99277114868164, "global_step": 190218, "epoch": 2291} {"train_loss": -24.35062026977539, "global_step": 190219, "epoch": 2291} {"train_loss": -24.2866268157959, "global_step": 190220, "epoch": 2291} {"train_loss": -23.66718292236328, "global_step": 190221, "epoch": 2291} {"train_loss": -23.60700798034668, "global_step": 190222, "epoch": 2291} {"train_loss": -24.033187866210938, "global_step": 190223, "epoch": 2291} {"train_loss": -24.284746170043945, "global_step": 190224, "epoch": 2291} {"train_loss": -24.500577926635742, "global_step": 190225, "epoch": 2291} {"train_loss": -24.38894271850586, "global_step": 190226, "epoch": 2291} {"train_loss": -24.292814254760742, "global_step": 190227, "epoch": 2291} {"train_loss": -24.215742111206055, "global_step": 190228, "epoch": 2291} {"train_loss": -24.164709091186523, "global_step": 190229, "epoch": 2291} {"train_loss": -23.919660568237305, "global_step": 190230, "epoch": 2291} {"train_loss": -24.179868698120117, "global_step": 190231, "epoch": 2291} {"train_loss": -23.875289916992188, "global_step": 190232, "epoch": 2291} {"train_loss": -24.26204490661621, "global_step": 190233, "epoch": 2291} {"train_loss": -23.688146591186523, "global_step": 190234, "epoch": 2291} {"train_loss": -23.912004654666028, "global_step": 190235, "epoch": 2291, "val_loss": 6550498.0} {"train_loss": -24.110502243041992, "global_step": 190236, "epoch": 2292} {"train_loss": -24.178802490234375, "global_step": 190237, "epoch": 2292} {"train_loss": -23.803918838500977, "global_step": 190238, "epoch": 2292} {"train_loss": -24.027114868164062, "global_step": 190239, "epoch": 2292} {"train_loss": -23.518571853637695, "global_step": 190240, "epoch": 2292} {"train_loss": -24.08318519592285, "global_step": 190241, "epoch": 2292} {"train_loss": -23.939401626586914, "global_step": 190242, "epoch": 2292} {"train_loss": -24.219982147216797, "global_step": 190243, "epoch": 2292} {"train_loss": -23.878101348876953, "global_step": 190244, "epoch": 2292} {"train_loss": -23.82613182067871, "global_step": 190245, "epoch": 2292} {"train_loss": -23.51382064819336, "global_step": 190246, "epoch": 2292} {"train_loss": -24.14740562438965, "global_step": 190247, "epoch": 2292} {"train_loss": -24.072757720947266, "global_step": 190248, "epoch": 2292} {"train_loss": -24.013235092163086, "global_step": 190249, "epoch": 2292} {"train_loss": -24.608665466308594, "global_step": 190250, "epoch": 2292} {"train_loss": -24.146080017089844, "global_step": 190251, "epoch": 2292} {"train_loss": -23.492918014526367, "global_step": 190252, "epoch": 2292} {"train_loss": -24.077177047729492, "global_step": 190253, "epoch": 2292} {"train_loss": -24.236478805541992, "global_step": 190254, "epoch": 2292} {"train_loss": -24.29665756225586, "global_step": 190255, "epoch": 2292} {"train_loss": -23.64042091369629, "global_step": 190256, "epoch": 2292} {"train_loss": -24.041751861572266, "global_step": 190257, "epoch": 2292} {"train_loss": -24.11663055419922, "global_step": 190258, "epoch": 2292} {"train_loss": -23.8957576751709, "global_step": 190259, "epoch": 2292} {"train_loss": -23.9379825592041, "global_step": 190260, "epoch": 2292} {"train_loss": -24.14182472229004, "global_step": 190261, "epoch": 2292} {"train_loss": -24.126937866210938, "global_step": 190262, "epoch": 2292} {"train_loss": -23.926477432250977, "global_step": 190263, "epoch": 2292} {"train_loss": -24.206466674804688, "global_step": 190264, "epoch": 2292} {"train_loss": -24.103708267211914, "global_step": 190265, "epoch": 2292} {"train_loss": -23.7226619720459, "global_step": 190266, "epoch": 2292} {"train_loss": -24.18756675720215, "global_step": 190267, "epoch": 2292} {"train_loss": -23.973045349121094, "global_step": 190268, "epoch": 2292} {"train_loss": -23.938169479370117, "global_step": 190269, "epoch": 2292} {"train_loss": -24.005615234375, "global_step": 190270, "epoch": 2292} {"train_loss": -23.76080894470215, "global_step": 190271, "epoch": 2292} {"train_loss": -23.62212562561035, "global_step": 190272, "epoch": 2292} {"train_loss": -24.03057861328125, "global_step": 190273, "epoch": 2292} {"train_loss": -23.7669734954834, "global_step": 190274, "epoch": 2292} {"train_loss": -24.08217430114746, "global_step": 190275, "epoch": 2292} {"train_loss": -23.95142936706543, "global_step": 190276, "epoch": 2292} {"train_loss": -23.849750518798828, "global_step": 190277, "epoch": 2292} {"train_loss": -24.068681716918945, "global_step": 190278, "epoch": 2292} {"train_loss": -24.00136375427246, "global_step": 190279, "epoch": 2292} {"train_loss": -23.86868667602539, "global_step": 190280, "epoch": 2292} {"train_loss": -24.41733169555664, "global_step": 190281, "epoch": 2292} {"train_loss": -24.34193992614746, "global_step": 190282, "epoch": 2292} {"train_loss": -24.173709869384766, "global_step": 190283, "epoch": 2292} {"train_loss": -24.36630630493164, "global_step": 190284, "epoch": 2292} {"train_loss": -24.498870849609375, "global_step": 190285, "epoch": 2292} {"train_loss": -24.2246150970459, "global_step": 190286, "epoch": 2292} {"train_loss": -24.111562728881836, "global_step": 190287, "epoch": 2292} {"train_loss": -24.26815414428711, "global_step": 190288, "epoch": 2292} {"train_loss": -24.375858306884766, "global_step": 190289, "epoch": 2292} {"train_loss": -24.297388076782227, "global_step": 190290, "epoch": 2292} {"train_loss": -24.34508514404297, "global_step": 190291, "epoch": 2292} {"train_loss": -23.987302780151367, "global_step": 190292, "epoch": 2292} {"train_loss": -24.230728149414062, "global_step": 190293, "epoch": 2292} {"train_loss": -24.190353393554688, "global_step": 190294, "epoch": 2292} {"train_loss": -24.15604591369629, "global_step": 190295, "epoch": 2292} {"train_loss": -24.31781578063965, "global_step": 190296, "epoch": 2292} {"train_loss": -24.033369064331055, "global_step": 190297, "epoch": 2292} {"train_loss": -24.06707191467285, "global_step": 190298, "epoch": 2292} {"train_loss": -23.761905670166016, "global_step": 190299, "epoch": 2292} {"train_loss": -24.288043975830078, "global_step": 190300, "epoch": 2292} {"train_loss": -24.15179443359375, "global_step": 190301, "epoch": 2292} {"train_loss": -24.38551902770996, "global_step": 190302, "epoch": 2292} {"train_loss": -24.39420509338379, "global_step": 190303, "epoch": 2292} {"train_loss": -24.8160343170166, "global_step": 190304, "epoch": 2292} {"train_loss": -24.31389617919922, "global_step": 190305, "epoch": 2292} {"train_loss": -24.653459548950195, "global_step": 190306, "epoch": 2292} {"train_loss": -24.04343032836914, "global_step": 190307, "epoch": 2292} {"train_loss": -24.210784912109375, "global_step": 190308, "epoch": 2292} {"train_loss": -23.99909210205078, "global_step": 190309, "epoch": 2292} {"train_loss": -24.00141716003418, "global_step": 190310, "epoch": 2292} {"train_loss": -23.987462997436523, "global_step": 190311, "epoch": 2292} {"train_loss": -24.11547088623047, "global_step": 190312, "epoch": 2292} {"train_loss": -24.119962692260742, "global_step": 190313, "epoch": 2292} {"train_loss": -23.73969841003418, "global_step": 190314, "epoch": 2292} {"train_loss": -24.051679611206055, "global_step": 190315, "epoch": 2292} {"train_loss": -24.087486267089844, "global_step": 190316, "epoch": 2292} {"train_loss": -23.567310333251953, "global_step": 190317, "epoch": 2292} {"train_loss": -24.071665223822535, "global_step": 190318, "epoch": 2292, "val_loss": 6683238.0} {"train_loss": -19.635374069213867, "global_step": 190319, "epoch": 2293} {"train_loss": -22.7098331451416, "global_step": 190320, "epoch": 2293} {"train_loss": -21.416805267333984, "global_step": 190321, "epoch": 2293} {"train_loss": -22.47566032409668, "global_step": 190322, "epoch": 2293} {"train_loss": -22.481754302978516, "global_step": 190323, "epoch": 2293} {"train_loss": -22.2230224609375, "global_step": 190324, "epoch": 2293} {"train_loss": -22.800251007080078, "global_step": 190325, "epoch": 2293} {"train_loss": -22.784378051757812, "global_step": 190326, "epoch": 2293} {"train_loss": -23.685754776000977, "global_step": 190327, "epoch": 2293} {"train_loss": -22.919879913330078, "global_step": 190328, "epoch": 2293} {"train_loss": -22.816465377807617, "global_step": 190329, "epoch": 2293} {"train_loss": -22.701337814331055, "global_step": 190330, "epoch": 2293} {"train_loss": -23.021453857421875, "global_step": 190331, "epoch": 2293} {"train_loss": -23.222089767456055, "global_step": 190332, "epoch": 2293} {"train_loss": -23.051210403442383, "global_step": 190333, "epoch": 2293} {"train_loss": -23.44814682006836, "global_step": 190334, "epoch": 2293} {"train_loss": -23.495437622070312, "global_step": 190335, "epoch": 2293} {"train_loss": -23.298606872558594, "global_step": 190336, "epoch": 2293} {"train_loss": -23.286222457885742, "global_step": 190337, "epoch": 2293} {"train_loss": -23.545337677001953, "global_step": 190338, "epoch": 2293} {"train_loss": -23.30580711364746, "global_step": 190339, "epoch": 2293} {"train_loss": -23.4692325592041, "global_step": 190340, "epoch": 2293} {"train_loss": -23.636001586914062, "global_step": 190341, "epoch": 2293} {"train_loss": -23.361223220825195, "global_step": 190342, "epoch": 2293} {"train_loss": -23.494556427001953, "global_step": 190343, "epoch": 2293} {"train_loss": -23.731042861938477, "global_step": 190344, "epoch": 2293} {"train_loss": -23.661752700805664, "global_step": 190345, "epoch": 2293} {"train_loss": -23.87702178955078, "global_step": 190346, "epoch": 2293} {"train_loss": -23.42805290222168, "global_step": 190347, "epoch": 2293} {"train_loss": -23.818471908569336, "global_step": 190348, "epoch": 2293} {"train_loss": -23.614572525024414, "global_step": 190349, "epoch": 2293} {"train_loss": -23.674509048461914, "global_step": 190350, "epoch": 2293} {"train_loss": -23.833166122436523, "global_step": 190351, "epoch": 2293} {"train_loss": -24.077373504638672, "global_step": 190352, "epoch": 2293} {"train_loss": -23.610937118530273, "global_step": 190353, "epoch": 2293} {"train_loss": -23.823623657226562, "global_step": 190354, "epoch": 2293} {"train_loss": -23.784650802612305, "global_step": 190355, "epoch": 2293} {"train_loss": -23.871685028076172, "global_step": 190356, "epoch": 2293} {"train_loss": -23.837705612182617, "global_step": 190357, "epoch": 2293} {"train_loss": -23.833648681640625, "global_step": 190358, "epoch": 2293} {"train_loss": -24.186044692993164, "global_step": 190359, "epoch": 2293} {"train_loss": -24.1097412109375, "global_step": 190360, "epoch": 2293} {"train_loss": -23.77205467224121, "global_step": 190361, "epoch": 2293} {"train_loss": -23.87577247619629, "global_step": 190362, "epoch": 2293} {"train_loss": -23.760009765625, "global_step": 190363, "epoch": 2293} {"train_loss": -23.9239501953125, "global_step": 190364, "epoch": 2293} {"train_loss": -23.770946502685547, "global_step": 190365, "epoch": 2293} {"train_loss": -24.090229034423828, "global_step": 190366, "epoch": 2293} {"train_loss": -23.952484130859375, "global_step": 190367, "epoch": 2293} {"train_loss": -23.999425888061523, "global_step": 190368, "epoch": 2293} {"train_loss": -23.99042510986328, "global_step": 190369, "epoch": 2293} {"train_loss": -24.344934463500977, "global_step": 190370, "epoch": 2293} {"train_loss": -24.314565658569336, "global_step": 190371, "epoch": 2293} {"train_loss": -24.22535514831543, "global_step": 190372, "epoch": 2293} {"train_loss": -24.072107315063477, "global_step": 190373, "epoch": 2293} {"train_loss": -24.211292266845703, "global_step": 190374, "epoch": 2293} {"train_loss": -24.213905334472656, "global_step": 190375, "epoch": 2293} {"train_loss": -24.378549575805664, "global_step": 190376, "epoch": 2293} {"train_loss": -23.945907592773438, "global_step": 190377, "epoch": 2293} {"train_loss": -23.933622360229492, "global_step": 190378, "epoch": 2293} {"train_loss": -24.088464736938477, "global_step": 190379, "epoch": 2293} {"train_loss": -24.110042572021484, "global_step": 190380, "epoch": 2293} {"train_loss": -24.109392166137695, "global_step": 190381, "epoch": 2293} {"train_loss": -24.336973190307617, "global_step": 190382, "epoch": 2293} {"train_loss": -24.298980712890625, "global_step": 190383, "epoch": 2293} {"train_loss": -23.883481979370117, "global_step": 190384, "epoch": 2293} {"train_loss": -24.1294002532959, "global_step": 190385, "epoch": 2293} {"train_loss": -24.31136131286621, "global_step": 190386, "epoch": 2293} {"train_loss": -24.313817977905273, "global_step": 190387, "epoch": 2293} {"train_loss": -24.122068405151367, "global_step": 190388, "epoch": 2293} {"train_loss": -23.856943130493164, "global_step": 190389, "epoch": 2293} {"train_loss": -24.17770767211914, "global_step": 190390, "epoch": 2293} {"train_loss": -24.515344619750977, "global_step": 190391, "epoch": 2293} {"train_loss": -24.127113342285156, "global_step": 190392, "epoch": 2293} {"train_loss": -24.122234344482422, "global_step": 190393, "epoch": 2293} {"train_loss": -24.476022720336914, "global_step": 190394, "epoch": 2293} {"train_loss": -24.344541549682617, "global_step": 190395, "epoch": 2293} {"train_loss": -24.040103912353516, "global_step": 190396, "epoch": 2293} {"train_loss": -24.009000778198242, "global_step": 190397, "epoch": 2293} {"train_loss": -23.89151954650879, "global_step": 190398, "epoch": 2293} {"train_loss": -23.78036117553711, "global_step": 190399, "epoch": 2293} {"train_loss": -23.628835678100586, "global_step": 190400, "epoch": 2293} {"train_loss": -23.667697653712995, "global_step": 190401, "epoch": 2293, "val_loss": 6534018.0} {"train_loss": -24.207826614379883, "global_step": 190402, "epoch": 2294} {"train_loss": -23.44630241394043, "global_step": 190403, "epoch": 2294} {"train_loss": -23.953018188476562, "global_step": 190404, "epoch": 2294} {"train_loss": -23.68671989440918, "global_step": 190405, "epoch": 2294} {"train_loss": -23.9132137298584, "global_step": 190406, "epoch": 2294} {"train_loss": -23.881662368774414, "global_step": 190407, "epoch": 2294} {"train_loss": -23.590368270874023, "global_step": 190408, "epoch": 2294} {"train_loss": -23.68338394165039, "global_step": 190409, "epoch": 2294} {"train_loss": -23.730854034423828, "global_step": 190410, "epoch": 2294} {"train_loss": -23.36510467529297, "global_step": 190411, "epoch": 2294} {"train_loss": -23.837352752685547, "global_step": 190412, "epoch": 2294} {"train_loss": -23.84934425354004, "global_step": 190413, "epoch": 2294} {"train_loss": -23.891408920288086, "global_step": 190414, "epoch": 2294} {"train_loss": -23.807851791381836, "global_step": 190415, "epoch": 2294} {"train_loss": -23.760129928588867, "global_step": 190416, "epoch": 2294} {"train_loss": -23.868492126464844, "global_step": 190417, "epoch": 2294} {"train_loss": -23.5905818939209, "global_step": 190418, "epoch": 2294} {"train_loss": -24.169767379760742, "global_step": 190419, "epoch": 2294} {"train_loss": -23.9078369140625, "global_step": 190420, "epoch": 2294} {"train_loss": -24.172395706176758, "global_step": 190421, "epoch": 2294} {"train_loss": -23.772354125976562, "global_step": 190422, "epoch": 2294} {"train_loss": -23.894926071166992, "global_step": 190423, "epoch": 2294} {"train_loss": -24.241735458374023, "global_step": 190424, "epoch": 2294} {"train_loss": -23.955400466918945, "global_step": 190425, "epoch": 2294} {"train_loss": -24.146848678588867, "global_step": 190426, "epoch": 2294} {"train_loss": -23.905004501342773, "global_step": 190427, "epoch": 2294} {"train_loss": -23.91029167175293, "global_step": 190428, "epoch": 2294} {"train_loss": -24.046506881713867, "global_step": 190429, "epoch": 2294} {"train_loss": -24.340002059936523, "global_step": 190430, "epoch": 2294} {"train_loss": -24.132190704345703, "global_step": 190431, "epoch": 2294} {"train_loss": -24.151330947875977, "global_step": 190432, "epoch": 2294} {"train_loss": -23.976171493530273, "global_step": 190433, "epoch": 2294} {"train_loss": -24.050031661987305, "global_step": 190434, "epoch": 2294} {"train_loss": -24.421070098876953, "global_step": 190435, "epoch": 2294} {"train_loss": -23.951248168945312, "global_step": 190436, "epoch": 2294} {"train_loss": -24.06818199157715, "global_step": 190437, "epoch": 2294} {"train_loss": -23.59584617614746, "global_step": 190438, "epoch": 2294} {"train_loss": -23.772785186767578, "global_step": 190439, "epoch": 2294} {"train_loss": -23.863157272338867, "global_step": 190440, "epoch": 2294} {"train_loss": -24.170520782470703, "global_step": 190441, "epoch": 2294} {"train_loss": -24.04025650024414, "global_step": 190442, "epoch": 2294} {"train_loss": -24.570619583129883, "global_step": 190443, "epoch": 2294} {"train_loss": -24.386667251586914, "global_step": 190444, "epoch": 2294} {"train_loss": -23.926118850708008, "global_step": 190445, "epoch": 2294} {"train_loss": -23.87013816833496, "global_step": 190446, "epoch": 2294} {"train_loss": -24.098066329956055, "global_step": 190447, "epoch": 2294} {"train_loss": -24.366865158081055, "global_step": 190448, "epoch": 2294} {"train_loss": -23.953413009643555, "global_step": 190449, "epoch": 2294} {"train_loss": -24.035850524902344, "global_step": 190450, "epoch": 2294} {"train_loss": -24.004169464111328, "global_step": 190451, "epoch": 2294} {"train_loss": -24.236120223999023, "global_step": 190452, "epoch": 2294} {"train_loss": -24.118139266967773, "global_step": 190453, "epoch": 2294} {"train_loss": -24.171146392822266, "global_step": 190454, "epoch": 2294} {"train_loss": -24.57012939453125, "global_step": 190455, "epoch": 2294} {"train_loss": -24.432287216186523, "global_step": 190456, "epoch": 2294} {"train_loss": -23.818649291992188, "global_step": 190457, "epoch": 2294} {"train_loss": -24.44160270690918, "global_step": 190458, "epoch": 2294} {"train_loss": -23.97140121459961, "global_step": 190459, "epoch": 2294} {"train_loss": -24.276573181152344, "global_step": 190460, "epoch": 2294} {"train_loss": -23.723180770874023, "global_step": 190461, "epoch": 2294} {"train_loss": -24.1655330657959, "global_step": 190462, "epoch": 2294} {"train_loss": -24.219688415527344, "global_step": 190463, "epoch": 2294} {"train_loss": -24.123600006103516, "global_step": 190464, "epoch": 2294} {"train_loss": -24.351154327392578, "global_step": 190465, "epoch": 2294} {"train_loss": -24.504453659057617, "global_step": 190466, "epoch": 2294} {"train_loss": -24.72030258178711, "global_step": 190467, "epoch": 2294} {"train_loss": -24.185636520385742, "global_step": 190468, "epoch": 2294} {"train_loss": -23.920291900634766, "global_step": 190469, "epoch": 2294} {"train_loss": -24.14204978942871, "global_step": 190470, "epoch": 2294} {"train_loss": -24.468647003173828, "global_step": 190471, "epoch": 2294} {"train_loss": -24.039058685302734, "global_step": 190472, "epoch": 2294} {"train_loss": -24.274993896484375, "global_step": 190473, "epoch": 2294} {"train_loss": -24.0502986907959, "global_step": 190474, "epoch": 2294} {"train_loss": -24.50307846069336, "global_step": 190475, "epoch": 2294} {"train_loss": -23.994251251220703, "global_step": 190476, "epoch": 2294} {"train_loss": -24.225208282470703, "global_step": 190477, "epoch": 2294} {"train_loss": -23.98362159729004, "global_step": 190478, "epoch": 2294} {"train_loss": -24.177162170410156, "global_step": 190479, "epoch": 2294} {"train_loss": -24.19610595703125, "global_step": 190480, "epoch": 2294} {"train_loss": -24.09234046936035, "global_step": 190481, "epoch": 2294} {"train_loss": -24.393402099609375, "global_step": 190482, "epoch": 2294} {"train_loss": -24.02845001220703, "global_step": 190483, "epoch": 2294} {"train_loss": -24.060195693050524, "global_step": 190484, "epoch": 2294, "val_loss": 6526780.5} {"train_loss": -23.638994216918945, "global_step": 190485, "epoch": 2295} {"train_loss": -24.010671615600586, "global_step": 190486, "epoch": 2295} {"train_loss": -23.47230339050293, "global_step": 190487, "epoch": 2295} {"train_loss": -23.52280616760254, "global_step": 190488, "epoch": 2295} {"train_loss": -23.840194702148438, "global_step": 190489, "epoch": 2295} {"train_loss": -23.90359878540039, "global_step": 190490, "epoch": 2295} {"train_loss": -23.663244247436523, "global_step": 190491, "epoch": 2295} {"train_loss": -23.652006149291992, "global_step": 190492, "epoch": 2295} {"train_loss": -23.44496726989746, "global_step": 190493, "epoch": 2295} {"train_loss": -24.03485679626465, "global_step": 190494, "epoch": 2295} {"train_loss": -23.463533401489258, "global_step": 190495, "epoch": 2295} {"train_loss": -23.318958282470703, "global_step": 190496, "epoch": 2295} {"train_loss": -23.84309959411621, "global_step": 190497, "epoch": 2295} {"train_loss": -23.74999237060547, "global_step": 190498, "epoch": 2295} {"train_loss": -23.690073013305664, "global_step": 190499, "epoch": 2295} {"train_loss": -23.716867446899414, "global_step": 190500, "epoch": 2295} {"train_loss": -23.85890769958496, "global_step": 190501, "epoch": 2295} {"train_loss": -23.5122127532959, "global_step": 190502, "epoch": 2295} {"train_loss": -23.702539443969727, "global_step": 190503, "epoch": 2295} {"train_loss": -23.83294677734375, "global_step": 190504, "epoch": 2295} {"train_loss": -24.269132614135742, "global_step": 190505, "epoch": 2295} {"train_loss": -24.02364158630371, "global_step": 190506, "epoch": 2295} {"train_loss": -23.867155075073242, "global_step": 190507, "epoch": 2295} {"train_loss": -23.817731857299805, "global_step": 190508, "epoch": 2295} {"train_loss": -23.598852157592773, "global_step": 190509, "epoch": 2295} {"train_loss": -24.126407623291016, "global_step": 190510, "epoch": 2295} {"train_loss": -23.683622360229492, "global_step": 190511, "epoch": 2295} {"train_loss": -24.110395431518555, "global_step": 190512, "epoch": 2295} {"train_loss": -23.481124877929688, "global_step": 190513, "epoch": 2295} {"train_loss": -23.624235153198242, "global_step": 190514, "epoch": 2295} {"train_loss": -24.273717880249023, "global_step": 190515, "epoch": 2295} {"train_loss": -24.105356216430664, "global_step": 190516, "epoch": 2295} {"train_loss": -24.392972946166992, "global_step": 190517, "epoch": 2295} {"train_loss": -24.11948585510254, "global_step": 190518, "epoch": 2295} {"train_loss": -24.230628967285156, "global_step": 190519, "epoch": 2295} {"train_loss": -24.072019577026367, "global_step": 190520, "epoch": 2295} {"train_loss": -24.357450485229492, "global_step": 190521, "epoch": 2295} {"train_loss": -24.028303146362305, "global_step": 190522, "epoch": 2295} {"train_loss": -24.369173049926758, "global_step": 190523, "epoch": 2295} {"train_loss": -23.892894744873047, "global_step": 190524, "epoch": 2295} {"train_loss": -24.07537841796875, "global_step": 190525, "epoch": 2295} {"train_loss": -23.968708038330078, "global_step": 190526, "epoch": 2295} {"train_loss": -24.237592697143555, "global_step": 190527, "epoch": 2295} {"train_loss": -24.190372467041016, "global_step": 190528, "epoch": 2295} {"train_loss": -24.21657371520996, "global_step": 190529, "epoch": 2295} {"train_loss": -24.08861541748047, "global_step": 190530, "epoch": 2295} {"train_loss": -23.922266006469727, "global_step": 190531, "epoch": 2295} {"train_loss": -24.148204803466797, "global_step": 190532, "epoch": 2295} {"train_loss": -24.224985122680664, "global_step": 190533, "epoch": 2295} {"train_loss": -24.283151626586914, "global_step": 190534, "epoch": 2295} {"train_loss": -23.96204376220703, "global_step": 190535, "epoch": 2295} {"train_loss": -23.93121910095215, "global_step": 190536, "epoch": 2295} {"train_loss": -23.72515869140625, "global_step": 190537, "epoch": 2295} {"train_loss": -24.097578048706055, "global_step": 190538, "epoch": 2295} {"train_loss": -24.155744552612305, "global_step": 190539, "epoch": 2295} {"train_loss": -24.075963973999023, "global_step": 190540, "epoch": 2295} {"train_loss": -24.479900360107422, "global_step": 190541, "epoch": 2295} {"train_loss": -24.13095474243164, "global_step": 190542, "epoch": 2295} {"train_loss": -23.967554092407227, "global_step": 190543, "epoch": 2295} {"train_loss": -24.17030906677246, "global_step": 190544, "epoch": 2295} {"train_loss": -24.27484703063965, "global_step": 190545, "epoch": 2295} {"train_loss": -23.652639389038086, "global_step": 190546, "epoch": 2295} {"train_loss": -24.28098487854004, "global_step": 190547, "epoch": 2295} {"train_loss": -23.62369155883789, "global_step": 190548, "epoch": 2295} {"train_loss": -24.296401977539062, "global_step": 190549, "epoch": 2295} {"train_loss": -23.87932014465332, "global_step": 190550, "epoch": 2295} {"train_loss": -24.00306510925293, "global_step": 190551, "epoch": 2295} {"train_loss": -24.227462768554688, "global_step": 190552, "epoch": 2295} {"train_loss": -24.412540435791016, "global_step": 190553, "epoch": 2295} {"train_loss": -24.116252899169922, "global_step": 190554, "epoch": 2295} {"train_loss": -23.868322372436523, "global_step": 190555, "epoch": 2295} {"train_loss": -23.851980209350586, "global_step": 190556, "epoch": 2295} {"train_loss": -24.075057983398438, "global_step": 190557, "epoch": 2295} {"train_loss": -23.94554901123047, "global_step": 190558, "epoch": 2295} {"train_loss": -24.4552059173584, "global_step": 190559, "epoch": 2295} {"train_loss": -23.997154235839844, "global_step": 190560, "epoch": 2295} {"train_loss": -23.849563598632812, "global_step": 190561, "epoch": 2295} {"train_loss": -24.09765625, "global_step": 190562, "epoch": 2295} {"train_loss": -23.77323341369629, "global_step": 190563, "epoch": 2295} {"train_loss": -23.859827041625977, "global_step": 190564, "epoch": 2295} {"train_loss": -24.035322189331055, "global_step": 190565, "epoch": 2295} {"train_loss": -24.0104923248291, "global_step": 190566, "epoch": 2295} {"train_loss": -23.970400729811335, "global_step": 190567, "epoch": 2295, "val_loss": 6523963.0} {"train_loss": -23.805612564086914, "global_step": 190568, "epoch": 2296} {"train_loss": -24.214237213134766, "global_step": 190569, "epoch": 2296} {"train_loss": -23.914976119995117, "global_step": 190570, "epoch": 2296} {"train_loss": -24.0075740814209, "global_step": 190571, "epoch": 2296} {"train_loss": -23.900022506713867, "global_step": 190572, "epoch": 2296} {"train_loss": -23.819644927978516, "global_step": 190573, "epoch": 2296} {"train_loss": -23.65937614440918, "global_step": 190574, "epoch": 2296} {"train_loss": -24.122526168823242, "global_step": 190575, "epoch": 2296} {"train_loss": -23.771631240844727, "global_step": 190576, "epoch": 2296} {"train_loss": -23.990819931030273, "global_step": 190577, "epoch": 2296} {"train_loss": -23.90635108947754, "global_step": 190578, "epoch": 2296} {"train_loss": -23.961313247680664, "global_step": 190579, "epoch": 2296} {"train_loss": -23.812894821166992, "global_step": 190580, "epoch": 2296} {"train_loss": -24.098722457885742, "global_step": 190581, "epoch": 2296} {"train_loss": -23.74273681640625, "global_step": 190582, "epoch": 2296} {"train_loss": -24.41448974609375, "global_step": 190583, "epoch": 2296} {"train_loss": -23.893476486206055, "global_step": 190584, "epoch": 2296} {"train_loss": -24.282001495361328, "global_step": 190585, "epoch": 2296} {"train_loss": -24.001983642578125, "global_step": 190586, "epoch": 2296} {"train_loss": -24.057844161987305, "global_step": 190587, "epoch": 2296} {"train_loss": -23.924482345581055, "global_step": 190588, "epoch": 2296} {"train_loss": -24.315134048461914, "global_step": 190589, "epoch": 2296} {"train_loss": -23.85877799987793, "global_step": 190590, "epoch": 2296} {"train_loss": -24.197275161743164, "global_step": 190591, "epoch": 2296} {"train_loss": -23.911605834960938, "global_step": 190592, "epoch": 2296} {"train_loss": -24.110532760620117, "global_step": 190593, "epoch": 2296} {"train_loss": -24.4584903717041, "global_step": 190594, "epoch": 2296} {"train_loss": -23.98579978942871, "global_step": 190595, "epoch": 2296} {"train_loss": -24.195775985717773, "global_step": 190596, "epoch": 2296} {"train_loss": -24.175626754760742, "global_step": 190597, "epoch": 2296} {"train_loss": -23.528350830078125, "global_step": 190598, "epoch": 2296} {"train_loss": -24.2912540435791, "global_step": 190599, "epoch": 2296} {"train_loss": -23.987516403198242, "global_step": 190600, "epoch": 2296} {"train_loss": -24.33005714416504, "global_step": 190601, "epoch": 2296} {"train_loss": -23.6484432220459, "global_step": 190602, "epoch": 2296} {"train_loss": -23.74310874938965, "global_step": 190603, "epoch": 2296} {"train_loss": -24.482330322265625, "global_step": 190604, "epoch": 2296} {"train_loss": -24.10896110534668, "global_step": 190605, "epoch": 2296} {"train_loss": -24.042558670043945, "global_step": 190606, "epoch": 2296} {"train_loss": -24.034778594970703, "global_step": 190607, "epoch": 2296} {"train_loss": -24.178701400756836, "global_step": 190608, "epoch": 2296} {"train_loss": -24.031448364257812, "global_step": 190609, "epoch": 2296} {"train_loss": -24.2302303314209, "global_step": 190610, "epoch": 2296} {"train_loss": -24.05916404724121, "global_step": 190611, "epoch": 2296} {"train_loss": -24.221349716186523, "global_step": 190612, "epoch": 2296} {"train_loss": -24.154340744018555, "global_step": 190613, "epoch": 2296} {"train_loss": -23.941287994384766, "global_step": 190614, "epoch": 2296} {"train_loss": -24.140548706054688, "global_step": 190615, "epoch": 2296} {"train_loss": -23.882598876953125, "global_step": 190616, "epoch": 2296} {"train_loss": -24.34320068359375, "global_step": 190617, "epoch": 2296} {"train_loss": -24.050186157226562, "global_step": 190618, "epoch": 2296} {"train_loss": -23.99805450439453, "global_step": 190619, "epoch": 2296} {"train_loss": -23.993267059326172, "global_step": 190620, "epoch": 2296} {"train_loss": -24.12125587463379, "global_step": 190621, "epoch": 2296} {"train_loss": -23.81009292602539, "global_step": 190622, "epoch": 2296} {"train_loss": -24.337955474853516, "global_step": 190623, "epoch": 2296} {"train_loss": -24.3737850189209, "global_step": 190624, "epoch": 2296} {"train_loss": -23.960342407226562, "global_step": 190625, "epoch": 2296} {"train_loss": -23.650390625, "global_step": 190626, "epoch": 2296} {"train_loss": -24.165315628051758, "global_step": 190627, "epoch": 2296} {"train_loss": -23.99228286743164, "global_step": 190628, "epoch": 2296} {"train_loss": -23.920867919921875, "global_step": 190629, "epoch": 2296} {"train_loss": -24.15416145324707, "global_step": 190630, "epoch": 2296} {"train_loss": -23.879409790039062, "global_step": 190631, "epoch": 2296} {"train_loss": -24.104835510253906, "global_step": 190632, "epoch": 2296} {"train_loss": -24.18783950805664, "global_step": 190633, "epoch": 2296} {"train_loss": -24.206281661987305, "global_step": 190634, "epoch": 2296} {"train_loss": -23.904367446899414, "global_step": 190635, "epoch": 2296} {"train_loss": -24.289016723632812, "global_step": 190636, "epoch": 2296} {"train_loss": -23.825397491455078, "global_step": 190637, "epoch": 2296} {"train_loss": -23.55624771118164, "global_step": 190638, "epoch": 2296} {"train_loss": -24.028940200805664, "global_step": 190639, "epoch": 2296} {"train_loss": -24.33124351501465, "global_step": 190640, "epoch": 2296} {"train_loss": -24.580570220947266, "global_step": 190641, "epoch": 2296} {"train_loss": -24.267404556274414, "global_step": 190642, "epoch": 2296} {"train_loss": -24.24228286743164, "global_step": 190643, "epoch": 2296} {"train_loss": -24.750417709350586, "global_step": 190644, "epoch": 2296} {"train_loss": -24.29994773864746, "global_step": 190645, "epoch": 2296} {"train_loss": -24.09409523010254, "global_step": 190646, "epoch": 2296} {"train_loss": -24.369287490844727, "global_step": 190647, "epoch": 2296} {"train_loss": -24.34372901916504, "global_step": 190648, "epoch": 2296} {"train_loss": -23.915199279785156, "global_step": 190649, "epoch": 2296} {"train_loss": -24.08064796263913, "global_step": 190650, "epoch": 2296, "val_loss": 6384742.0} {"train_loss": -23.168914794921875, "global_step": 190651, "epoch": 2297} {"train_loss": -22.23166275024414, "global_step": 190652, "epoch": 2297} {"train_loss": -22.87615394592285, "global_step": 190653, "epoch": 2297} {"train_loss": -23.41287612915039, "global_step": 190654, "epoch": 2297} {"train_loss": -23.45306968688965, "global_step": 190655, "epoch": 2297} {"train_loss": -23.1523494720459, "global_step": 190656, "epoch": 2297} {"train_loss": -23.244131088256836, "global_step": 190657, "epoch": 2297} {"train_loss": -23.661359786987305, "global_step": 190658, "epoch": 2297} {"train_loss": -23.250337600708008, "global_step": 190659, "epoch": 2297} {"train_loss": -23.407516479492188, "global_step": 190660, "epoch": 2297} {"train_loss": -23.388586044311523, "global_step": 190661, "epoch": 2297} {"train_loss": -23.451993942260742, "global_step": 190662, "epoch": 2297} {"train_loss": -23.73810386657715, "global_step": 190663, "epoch": 2297} {"train_loss": -23.673877716064453, "global_step": 190664, "epoch": 2297} {"train_loss": -23.346607208251953, "global_step": 190665, "epoch": 2297} {"train_loss": -23.707109451293945, "global_step": 190666, "epoch": 2297} {"train_loss": -23.383331298828125, "global_step": 190667, "epoch": 2297} {"train_loss": -23.664968490600586, "global_step": 190668, "epoch": 2297} {"train_loss": -23.55527114868164, "global_step": 190669, "epoch": 2297} {"train_loss": -23.694433212280273, "global_step": 190670, "epoch": 2297} {"train_loss": -23.868030548095703, "global_step": 190671, "epoch": 2297} {"train_loss": -23.624059677124023, "global_step": 190672, "epoch": 2297} {"train_loss": -23.7467041015625, "global_step": 190673, "epoch": 2297} {"train_loss": -23.485692977905273, "global_step": 190674, "epoch": 2297} {"train_loss": -23.72681427001953, "global_step": 190675, "epoch": 2297} {"train_loss": -23.958465576171875, "global_step": 190676, "epoch": 2297} {"train_loss": -23.86600112915039, "global_step": 190677, "epoch": 2297} {"train_loss": -23.731325149536133, "global_step": 190678, "epoch": 2297} {"train_loss": -23.93458366394043, "global_step": 190679, "epoch": 2297} {"train_loss": -23.7706356048584, "global_step": 190680, "epoch": 2297} {"train_loss": -24.063608169555664, "global_step": 190681, "epoch": 2297} {"train_loss": -23.8150691986084, "global_step": 190682, "epoch": 2297} {"train_loss": -23.751789093017578, "global_step": 190683, "epoch": 2297} {"train_loss": -23.888919830322266, "global_step": 190684, "epoch": 2297} {"train_loss": -23.842533111572266, "global_step": 190685, "epoch": 2297} {"train_loss": -24.31072998046875, "global_step": 190686, "epoch": 2297} {"train_loss": -23.826522827148438, "global_step": 190687, "epoch": 2297} {"train_loss": -23.719331741333008, "global_step": 190688, "epoch": 2297} {"train_loss": -23.86545181274414, "global_step": 190689, "epoch": 2297} {"train_loss": -23.91744041442871, "global_step": 190690, "epoch": 2297} {"train_loss": -23.592451095581055, "global_step": 190691, "epoch": 2297} {"train_loss": -23.955533981323242, "global_step": 190692, "epoch": 2297} {"train_loss": -23.9632625579834, "global_step": 190693, "epoch": 2297} {"train_loss": -24.083084106445312, "global_step": 190694, "epoch": 2297} {"train_loss": -24.33164405822754, "global_step": 190695, "epoch": 2297} {"train_loss": -24.0856990814209, "global_step": 190696, "epoch": 2297} {"train_loss": -24.135549545288086, "global_step": 190697, "epoch": 2297} {"train_loss": -24.071949005126953, "global_step": 190698, "epoch": 2297} {"train_loss": -23.9414005279541, "global_step": 190699, "epoch": 2297} {"train_loss": -24.494199752807617, "global_step": 190700, "epoch": 2297} {"train_loss": -24.257726669311523, "global_step": 190701, "epoch": 2297} {"train_loss": -24.13735008239746, "global_step": 190702, "epoch": 2297} {"train_loss": -24.1409912109375, "global_step": 190703, "epoch": 2297} {"train_loss": -24.101560592651367, "global_step": 190704, "epoch": 2297} {"train_loss": -24.090436935424805, "global_step": 190705, "epoch": 2297} {"train_loss": -24.14750862121582, "global_step": 190706, "epoch": 2297} {"train_loss": -24.67058563232422, "global_step": 190707, "epoch": 2297} {"train_loss": -23.94965934753418, "global_step": 190708, "epoch": 2297} {"train_loss": -24.527780532836914, "global_step": 190709, "epoch": 2297} {"train_loss": -24.20208740234375, "global_step": 190710, "epoch": 2297} {"train_loss": -24.07178497314453, "global_step": 190711, "epoch": 2297} {"train_loss": -24.0094051361084, "global_step": 190712, "epoch": 2297} {"train_loss": -23.915714263916016, "global_step": 190713, "epoch": 2297} {"train_loss": -24.256607055664062, "global_step": 190714, "epoch": 2297} {"train_loss": -23.963712692260742, "global_step": 190715, "epoch": 2297} {"train_loss": -24.02275848388672, "global_step": 190716, "epoch": 2297} {"train_loss": -23.789222717285156, "global_step": 190717, "epoch": 2297} {"train_loss": -24.31339454650879, "global_step": 190718, "epoch": 2297} {"train_loss": -24.12338638305664, "global_step": 190719, "epoch": 2297} {"train_loss": -23.897682189941406, "global_step": 190720, "epoch": 2297} {"train_loss": -24.233442306518555, "global_step": 190721, "epoch": 2297} {"train_loss": -24.194631576538086, "global_step": 190722, "epoch": 2297} {"train_loss": -23.852689743041992, "global_step": 190723, "epoch": 2297} {"train_loss": -23.975339889526367, "global_step": 190724, "epoch": 2297} {"train_loss": -23.9138240814209, "global_step": 190725, "epoch": 2297} {"train_loss": -24.227994918823242, "global_step": 190726, "epoch": 2297} {"train_loss": -24.046781539916992, "global_step": 190727, "epoch": 2297} {"train_loss": -24.664581298828125, "global_step": 190728, "epoch": 2297} {"train_loss": -23.99448013305664, "global_step": 190729, "epoch": 2297} {"train_loss": -23.91968536376953, "global_step": 190730, "epoch": 2297} {"train_loss": -23.894357681274414, "global_step": 190731, "epoch": 2297} {"train_loss": -24.14646339416504, "global_step": 190732, "epoch": 2297} {"train_loss": -23.86410720089832, "global_step": 190733, "epoch": 2297, "val_loss": 6429709.0} {"train_loss": -22.783588409423828, "global_step": 190734, "epoch": 2298} {"train_loss": -23.19950294494629, "global_step": 190735, "epoch": 2298} {"train_loss": -23.71487808227539, "global_step": 190736, "epoch": 2298} {"train_loss": -23.54826545715332, "global_step": 190737, "epoch": 2298} {"train_loss": -23.21384620666504, "global_step": 190738, "epoch": 2298} {"train_loss": -23.986066818237305, "global_step": 190739, "epoch": 2298} {"train_loss": -23.258817672729492, "global_step": 190740, "epoch": 2298} {"train_loss": -23.639245986938477, "global_step": 190741, "epoch": 2298} {"train_loss": -23.81501579284668, "global_step": 190742, "epoch": 2298} {"train_loss": -23.881452560424805, "global_step": 190743, "epoch": 2298} {"train_loss": -23.565176010131836, "global_step": 190744, "epoch": 2298} {"train_loss": -23.478370666503906, "global_step": 190745, "epoch": 2298} {"train_loss": -24.000646591186523, "global_step": 190746, "epoch": 2298} {"train_loss": -23.911827087402344, "global_step": 190747, "epoch": 2298} {"train_loss": -23.726184844970703, "global_step": 190748, "epoch": 2298} {"train_loss": -23.75019645690918, "global_step": 190749, "epoch": 2298} {"train_loss": -23.679367065429688, "global_step": 190750, "epoch": 2298} {"train_loss": -23.731430053710938, "global_step": 190751, "epoch": 2298} {"train_loss": -23.577865600585938, "global_step": 190752, "epoch": 2298} {"train_loss": -23.809341430664062, "global_step": 190753, "epoch": 2298} {"train_loss": -23.701126098632812, "global_step": 190754, "epoch": 2298} {"train_loss": -23.93099021911621, "global_step": 190755, "epoch": 2298} {"train_loss": -23.62924575805664, "global_step": 190756, "epoch": 2298} {"train_loss": -23.795902252197266, "global_step": 190757, "epoch": 2298} {"train_loss": -23.977340698242188, "global_step": 190758, "epoch": 2298} {"train_loss": -24.035261154174805, "global_step": 190759, "epoch": 2298} {"train_loss": -23.952533721923828, "global_step": 190760, "epoch": 2298} {"train_loss": -23.95839500427246, "global_step": 190761, "epoch": 2298} {"train_loss": -24.001920700073242, "global_step": 190762, "epoch": 2298} {"train_loss": -24.09317398071289, "global_step": 190763, "epoch": 2298} {"train_loss": -23.801166534423828, "global_step": 190764, "epoch": 2298} {"train_loss": -24.338485717773438, "global_step": 190765, "epoch": 2298} {"train_loss": -24.440534591674805, "global_step": 190766, "epoch": 2298} {"train_loss": -23.919233322143555, "global_step": 190767, "epoch": 2298} {"train_loss": -24.172361373901367, "global_step": 190768, "epoch": 2298} {"train_loss": -24.22007942199707, "global_step": 190769, "epoch": 2298} {"train_loss": -24.020389556884766, "global_step": 190770, "epoch": 2298} {"train_loss": -24.436058044433594, "global_step": 190771, "epoch": 2298} {"train_loss": -23.97905158996582, "global_step": 190772, "epoch": 2298} {"train_loss": -24.076200485229492, "global_step": 190773, "epoch": 2298} {"train_loss": -23.858884811401367, "global_step": 190774, "epoch": 2298} {"train_loss": -24.026376724243164, "global_step": 190775, "epoch": 2298} {"train_loss": -24.23389434814453, "global_step": 190776, "epoch": 2298} {"train_loss": -23.790969848632812, "global_step": 190777, "epoch": 2298} {"train_loss": -24.350927352905273, "global_step": 190778, "epoch": 2298} {"train_loss": -23.934541702270508, "global_step": 190779, "epoch": 2298} {"train_loss": -23.67763328552246, "global_step": 190780, "epoch": 2298} {"train_loss": -24.185070037841797, "global_step": 190781, "epoch": 2298} {"train_loss": -23.826261520385742, "global_step": 190782, "epoch": 2298} {"train_loss": -23.952880859375, "global_step": 190783, "epoch": 2298} {"train_loss": -24.173154830932617, "global_step": 190784, "epoch": 2298} {"train_loss": -24.48225975036621, "global_step": 190785, "epoch": 2298} {"train_loss": -24.09335708618164, "global_step": 190786, "epoch": 2298} {"train_loss": -23.76291275024414, "global_step": 190787, "epoch": 2298} {"train_loss": -24.318572998046875, "global_step": 190788, "epoch": 2298} {"train_loss": -24.494367599487305, "global_step": 190789, "epoch": 2298} {"train_loss": -23.678062438964844, "global_step": 190790, "epoch": 2298} {"train_loss": -24.414602279663086, "global_step": 190791, "epoch": 2298} {"train_loss": -23.983427047729492, "global_step": 190792, "epoch": 2298} {"train_loss": -24.461776733398438, "global_step": 190793, "epoch": 2298} {"train_loss": -24.355546951293945, "global_step": 190794, "epoch": 2298} {"train_loss": -24.078140258789062, "global_step": 190795, "epoch": 2298} {"train_loss": -24.36820411682129, "global_step": 190796, "epoch": 2298} {"train_loss": -24.421669006347656, "global_step": 190797, "epoch": 2298} {"train_loss": -24.30498504638672, "global_step": 190798, "epoch": 2298} {"train_loss": -24.056133270263672, "global_step": 190799, "epoch": 2298} {"train_loss": -24.370386123657227, "global_step": 190800, "epoch": 2298} {"train_loss": -24.277204513549805, "global_step": 190801, "epoch": 2298} {"train_loss": -23.956527709960938, "global_step": 190802, "epoch": 2298} {"train_loss": -24.449787139892578, "global_step": 190803, "epoch": 2298} {"train_loss": -24.360315322875977, "global_step": 190804, "epoch": 2298} {"train_loss": -24.22260856628418, "global_step": 190805, "epoch": 2298} {"train_loss": -24.169891357421875, "global_step": 190806, "epoch": 2298} {"train_loss": -24.33169937133789, "global_step": 190807, "epoch": 2298} {"train_loss": -24.3746395111084, "global_step": 190808, "epoch": 2298} {"train_loss": -24.0904541015625, "global_step": 190809, "epoch": 2298} {"train_loss": -24.406265258789062, "global_step": 190810, "epoch": 2298} {"train_loss": -24.412986755371094, "global_step": 190811, "epoch": 2298} {"train_loss": -24.456327438354492, "global_step": 190812, "epoch": 2298} {"train_loss": -24.173477172851562, "global_step": 190813, "epoch": 2298} {"train_loss": -23.682647705078125, "global_step": 190814, "epoch": 2298} {"train_loss": -23.879432678222656, "global_step": 190815, "epoch": 2298} {"train_loss": -23.980973507984576, "global_step": 190816, "epoch": 2298, "val_loss": 6512656.0} {"train_loss": -21.549579620361328, "global_step": 190817, "epoch": 2299} {"train_loss": -21.868972778320312, "global_step": 190818, "epoch": 2299} {"train_loss": -21.3127384185791, "global_step": 190819, "epoch": 2299} {"train_loss": -22.089136123657227, "global_step": 190820, "epoch": 2299} {"train_loss": -22.040863037109375, "global_step": 190821, "epoch": 2299} {"train_loss": -22.302927017211914, "global_step": 190822, "epoch": 2299} {"train_loss": -21.927316665649414, "global_step": 190823, "epoch": 2299} {"train_loss": -23.159399032592773, "global_step": 190824, "epoch": 2299} {"train_loss": -22.498554229736328, "global_step": 190825, "epoch": 2299} {"train_loss": -22.644271850585938, "global_step": 190826, "epoch": 2299} {"train_loss": -22.59903907775879, "global_step": 190827, "epoch": 2299} {"train_loss": -22.812536239624023, "global_step": 190828, "epoch": 2299} {"train_loss": -23.00611686706543, "global_step": 190829, "epoch": 2299} {"train_loss": -22.690292358398438, "global_step": 190830, "epoch": 2299} {"train_loss": -23.012712478637695, "global_step": 190831, "epoch": 2299} {"train_loss": -22.914506912231445, "global_step": 190832, "epoch": 2299} {"train_loss": -23.069053649902344, "global_step": 190833, "epoch": 2299} {"train_loss": -22.768768310546875, "global_step": 190834, "epoch": 2299} {"train_loss": -23.16831398010254, "global_step": 190835, "epoch": 2299} {"train_loss": -23.062435150146484, "global_step": 190836, "epoch": 2299} {"train_loss": -23.211763381958008, "global_step": 190837, "epoch": 2299} {"train_loss": -23.60211753845215, "global_step": 190838, "epoch": 2299} {"train_loss": -23.49713897705078, "global_step": 190839, "epoch": 2299} {"train_loss": -23.720962524414062, "global_step": 190840, "epoch": 2299} {"train_loss": -23.307912826538086, "global_step": 190841, "epoch": 2299} {"train_loss": -23.519947052001953, "global_step": 190842, "epoch": 2299} {"train_loss": -23.488494873046875, "global_step": 190843, "epoch": 2299} {"train_loss": -23.668066024780273, "global_step": 190844, "epoch": 2299} {"train_loss": -23.773902893066406, "global_step": 190845, "epoch": 2299} {"train_loss": -23.760591506958008, "global_step": 190846, "epoch": 2299} {"train_loss": -23.443796157836914, "global_step": 190847, "epoch": 2299} {"train_loss": -23.924640655517578, "global_step": 190848, "epoch": 2299} {"train_loss": -23.690471649169922, "global_step": 190849, "epoch": 2299} {"train_loss": -23.567230224609375, "global_step": 190850, "epoch": 2299} {"train_loss": -23.776975631713867, "global_step": 190851, "epoch": 2299} {"train_loss": -23.769474029541016, "global_step": 190852, "epoch": 2299} {"train_loss": -23.682689666748047, "global_step": 190853, "epoch": 2299} {"train_loss": -23.765670776367188, "global_step": 190854, "epoch": 2299} {"train_loss": -23.97907829284668, "global_step": 190855, "epoch": 2299} {"train_loss": -24.06161880493164, "global_step": 190856, "epoch": 2299} {"train_loss": -23.86433982849121, "global_step": 190857, "epoch": 2299} {"train_loss": -24.011396408081055, "global_step": 190858, "epoch": 2299} {"train_loss": -24.527944564819336, "global_step": 190859, "epoch": 2299} {"train_loss": -24.297271728515625, "global_step": 190860, "epoch": 2299} {"train_loss": -23.860130310058594, "global_step": 190861, "epoch": 2299} {"train_loss": -24.002302169799805, "global_step": 190862, "epoch": 2299} {"train_loss": -24.302770614624023, "global_step": 190863, "epoch": 2299} {"train_loss": -23.977441787719727, "global_step": 190864, "epoch": 2299} {"train_loss": -24.306453704833984, "global_step": 190865, "epoch": 2299} {"train_loss": -24.220693588256836, "global_step": 190866, "epoch": 2299} {"train_loss": -24.270727157592773, "global_step": 190867, "epoch": 2299} {"train_loss": -24.185758590698242, "global_step": 190868, "epoch": 2299} {"train_loss": -24.345840454101562, "global_step": 190869, "epoch": 2299} {"train_loss": -23.9199161529541, "global_step": 190870, "epoch": 2299} {"train_loss": -24.022123336791992, "global_step": 190871, "epoch": 2299} {"train_loss": -23.87407875061035, "global_step": 190872, "epoch": 2299} {"train_loss": -24.019994735717773, "global_step": 190873, "epoch": 2299} {"train_loss": -24.164716720581055, "global_step": 190874, "epoch": 2299} {"train_loss": -24.054426193237305, "global_step": 190875, "epoch": 2299} {"train_loss": -23.971899032592773, "global_step": 190876, "epoch": 2299} {"train_loss": -24.195505142211914, "global_step": 190877, "epoch": 2299} {"train_loss": -24.138818740844727, "global_step": 190878, "epoch": 2299} {"train_loss": -24.354877471923828, "global_step": 190879, "epoch": 2299} {"train_loss": -23.761783599853516, "global_step": 190880, "epoch": 2299} {"train_loss": -23.992277145385742, "global_step": 190881, "epoch": 2299} {"train_loss": -24.100500106811523, "global_step": 190882, "epoch": 2299} {"train_loss": -24.510543823242188, "global_step": 190883, "epoch": 2299} {"train_loss": -24.468793869018555, "global_step": 190884, "epoch": 2299} {"train_loss": -24.17405891418457, "global_step": 190885, "epoch": 2299} {"train_loss": -24.32901382446289, "global_step": 190886, "epoch": 2299} {"train_loss": -24.163137435913086, "global_step": 190887, "epoch": 2299} {"train_loss": -24.077823638916016, "global_step": 190888, "epoch": 2299} {"train_loss": -24.369861602783203, "global_step": 190889, "epoch": 2299} {"train_loss": -24.06104850769043, "global_step": 190890, "epoch": 2299} {"train_loss": -23.714208602905273, "global_step": 190891, "epoch": 2299} {"train_loss": -24.097036361694336, "global_step": 190892, "epoch": 2299} {"train_loss": -24.294021606445312, "global_step": 190893, "epoch": 2299} {"train_loss": -23.985382080078125, "global_step": 190894, "epoch": 2299} {"train_loss": -24.342294692993164, "global_step": 190895, "epoch": 2299} {"train_loss": -24.160306930541992, "global_step": 190896, "epoch": 2299} {"train_loss": -24.23190689086914, "global_step": 190897, "epoch": 2299} {"train_loss": -24.266231536865234, "global_step": 190898, "epoch": 2299} {"train_loss": -23.640186792396637, "global_step": 190899, "epoch": 2299, "val_loss": 6540139.0} {"train_loss": -23.46982765197754, "global_step": 190900, "epoch": 2300} {"train_loss": -23.28938865661621, "global_step": 190901, "epoch": 2300} {"train_loss": -23.641660690307617, "global_step": 190902, "epoch": 2300} {"train_loss": -23.424762725830078, "global_step": 190903, "epoch": 2300} {"train_loss": -23.96091651916504, "global_step": 190904, "epoch": 2300} {"train_loss": -23.621740341186523, "global_step": 190905, "epoch": 2300} {"train_loss": -23.982105255126953, "global_step": 190906, "epoch": 2300} {"train_loss": -23.927677154541016, "global_step": 190907, "epoch": 2300} {"train_loss": -23.573638916015625, "global_step": 190908, "epoch": 2300} {"train_loss": -23.78505516052246, "global_step": 190909, "epoch": 2300} {"train_loss": -23.984224319458008, "global_step": 190910, "epoch": 2300} {"train_loss": -23.552871704101562, "global_step": 190911, "epoch": 2300} {"train_loss": -24.053756713867188, "global_step": 190912, "epoch": 2300} {"train_loss": -23.77448844909668, "global_step": 190913, "epoch": 2300} {"train_loss": -23.93256187438965, "global_step": 190914, "epoch": 2300} {"train_loss": -24.078882217407227, "global_step": 190915, "epoch": 2300} {"train_loss": -24.209394454956055, "global_step": 190916, "epoch": 2300} {"train_loss": -24.1618709564209, "global_step": 190917, "epoch": 2300} {"train_loss": -23.466413497924805, "global_step": 190918, "epoch": 2300} {"train_loss": -23.981672286987305, "global_step": 190919, "epoch": 2300} {"train_loss": -23.94369888305664, "global_step": 190920, "epoch": 2300} {"train_loss": -23.952856063842773, "global_step": 190921, "epoch": 2300} {"train_loss": -24.053556442260742, "global_step": 190922, "epoch": 2300} {"train_loss": -24.078128814697266, "global_step": 190923, "epoch": 2300} {"train_loss": -23.897741317749023, "global_step": 190924, "epoch": 2300} {"train_loss": -23.97167205810547, "global_step": 190925, "epoch": 2300} {"train_loss": -23.782583236694336, "global_step": 190926, "epoch": 2300} {"train_loss": -23.9558162689209, "global_step": 190927, "epoch": 2300} {"train_loss": -23.955076217651367, "global_step": 190928, "epoch": 2300} {"train_loss": -23.91912841796875, "global_step": 190929, "epoch": 2300} {"train_loss": -23.714786529541016, "global_step": 190930, "epoch": 2300} {"train_loss": -23.978992462158203, "global_step": 190931, "epoch": 2300} {"train_loss": -24.266225814819336, "global_step": 190932, "epoch": 2300} {"train_loss": -24.21000099182129, "global_step": 190933, "epoch": 2300} {"train_loss": -24.05591583251953, "global_step": 190934, "epoch": 2300} {"train_loss": -24.8358154296875, "global_step": 190935, "epoch": 2300} {"train_loss": -24.362722396850586, "global_step": 190936, "epoch": 2300} {"train_loss": -24.465742111206055, "global_step": 190937, "epoch": 2300} {"train_loss": -24.22464370727539, "global_step": 190938, "epoch": 2300} {"train_loss": -23.872678756713867, "global_step": 190939, "epoch": 2300} {"train_loss": -24.0172176361084, "global_step": 190940, "epoch": 2300} {"train_loss": -24.401517868041992, "global_step": 190941, "epoch": 2300} {"train_loss": -24.160924911499023, "global_step": 190942, "epoch": 2300} {"train_loss": -24.687244415283203, "global_step": 190943, "epoch": 2300} {"train_loss": -24.197729110717773, "global_step": 190944, "epoch": 2300} {"train_loss": -24.26449966430664, "global_step": 190945, "epoch": 2300} {"train_loss": -24.39177131652832, "global_step": 190946, "epoch": 2300} {"train_loss": -24.235427856445312, "global_step": 190947, "epoch": 2300} {"train_loss": -24.379898071289062, "global_step": 190948, "epoch": 2300} {"train_loss": -23.702503204345703, "global_step": 190949, "epoch": 2300} {"train_loss": -24.17195701599121, "global_step": 190950, "epoch": 2300} {"train_loss": -24.380155563354492, "global_step": 190951, "epoch": 2300} {"train_loss": -24.14918327331543, "global_step": 190952, "epoch": 2300} {"train_loss": -24.06630516052246, "global_step": 190953, "epoch": 2300} {"train_loss": -23.945974349975586, "global_step": 190954, "epoch": 2300} {"train_loss": -24.18318748474121, "global_step": 190955, "epoch": 2300} {"train_loss": -24.08075523376465, "global_step": 190956, "epoch": 2300} {"train_loss": -23.930423736572266, "global_step": 190957, "epoch": 2300} {"train_loss": -23.991010665893555, "global_step": 190958, "epoch": 2300} {"train_loss": -23.989439010620117, "global_step": 190959, "epoch": 2300} {"train_loss": -23.791616439819336, "global_step": 190960, "epoch": 2300} {"train_loss": -24.21152114868164, "global_step": 190961, "epoch": 2300} {"train_loss": -24.134611129760742, "global_step": 190962, "epoch": 2300} {"train_loss": -23.946266174316406, "global_step": 190963, "epoch": 2300} {"train_loss": -23.96192741394043, "global_step": 190964, "epoch": 2300} {"train_loss": -24.22321128845215, "global_step": 190965, "epoch": 2300} {"train_loss": -23.95156478881836, "global_step": 190966, "epoch": 2300} {"train_loss": -24.333030700683594, "global_step": 190967, "epoch": 2300} {"train_loss": -23.788522720336914, "global_step": 190968, "epoch": 2300} {"train_loss": -24.327856063842773, "global_step": 190969, "epoch": 2300} {"train_loss": -24.04904556274414, "global_step": 190970, "epoch": 2300} {"train_loss": -24.326379776000977, "global_step": 190971, "epoch": 2300} {"train_loss": -23.43206214904785, "global_step": 190972, "epoch": 2300} {"train_loss": -23.933881759643555, "global_step": 190973, "epoch": 2300} {"train_loss": -23.885482788085938, "global_step": 190974, "epoch": 2300} {"train_loss": -24.168058395385742, "global_step": 190975, "epoch": 2300} {"train_loss": -23.895933151245117, "global_step": 190976, "epoch": 2300} {"train_loss": -23.96693229675293, "global_step": 190977, "epoch": 2300} {"train_loss": -24.186080932617188, "global_step": 190978, "epoch": 2300} {"train_loss": -24.455068588256836, "global_step": 190979, "epoch": 2300} {"train_loss": -23.650136947631836, "global_step": 190980, "epoch": 2300} {"train_loss": -24.167118072509766, "global_step": 190981, "epoch": 2300} {"train_loss": -24.026632446840583, "global_step": 190982, "epoch": 2300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 1.0, "val_loss": 6378170.0} {"train_loss": -23.20318603515625, "global_step": 190983, "epoch": 2301} {"train_loss": -23.57981300354004, "global_step": 190984, "epoch": 2301} {"train_loss": -23.784727096557617, "global_step": 190985, "epoch": 2301} {"train_loss": -23.534513473510742, "global_step": 190986, "epoch": 2301} {"train_loss": -23.554523468017578, "global_step": 190987, "epoch": 2301} {"train_loss": -23.679515838623047, "global_step": 190988, "epoch": 2301} {"train_loss": -24.35929298400879, "global_step": 190989, "epoch": 2301} {"train_loss": -23.5894832611084, "global_step": 190990, "epoch": 2301} {"train_loss": -23.588529586791992, "global_step": 190991, "epoch": 2301} {"train_loss": -23.870376586914062, "global_step": 190992, "epoch": 2301} {"train_loss": -23.753114700317383, "global_step": 190993, "epoch": 2301} {"train_loss": -23.99281883239746, "global_step": 190994, "epoch": 2301} {"train_loss": -24.004676818847656, "global_step": 190995, "epoch": 2301} {"train_loss": -23.618499755859375, "global_step": 190996, "epoch": 2301} {"train_loss": -23.81611442565918, "global_step": 190997, "epoch": 2301} {"train_loss": -23.965709686279297, "global_step": 190998, "epoch": 2301} {"train_loss": -23.986059188842773, "global_step": 190999, "epoch": 2301} {"train_loss": -23.475690841674805, "global_step": 191000, "epoch": 2301} {"train_loss": -23.874082565307617, "global_step": 191001, "epoch": 2301} {"train_loss": -23.788618087768555, "global_step": 191002, "epoch": 2301} {"train_loss": -24.062728881835938, "global_step": 191003, "epoch": 2301} {"train_loss": -23.797910690307617, "global_step": 191004, "epoch": 2301} {"train_loss": -24.21146011352539, "global_step": 191005, "epoch": 2301} {"train_loss": -24.037860870361328, "global_step": 191006, "epoch": 2301} {"train_loss": -23.906143188476562, "global_step": 191007, "epoch": 2301} {"train_loss": -24.074493408203125, "global_step": 191008, "epoch": 2301} {"train_loss": -24.338340759277344, "global_step": 191009, "epoch": 2301} {"train_loss": -23.981698989868164, "global_step": 191010, "epoch": 2301} {"train_loss": -24.26988983154297, "global_step": 191011, "epoch": 2301} {"train_loss": -23.914857864379883, "global_step": 191012, "epoch": 2301} {"train_loss": -24.356653213500977, "global_step": 191013, "epoch": 2301} {"train_loss": -24.17720603942871, "global_step": 191014, "epoch": 2301} {"train_loss": -24.0307559967041, "global_step": 191015, "epoch": 2301} {"train_loss": -24.1014347076416, "global_step": 191016, "epoch": 2301} {"train_loss": -24.29087257385254, "global_step": 191017, "epoch": 2301} {"train_loss": -23.990217208862305, "global_step": 191018, "epoch": 2301} {"train_loss": -23.855682373046875, "global_step": 191019, "epoch": 2301} {"train_loss": -24.369428634643555, "global_step": 191020, "epoch": 2301} {"train_loss": -24.51274299621582, "global_step": 191021, "epoch": 2301} {"train_loss": -24.21771812438965, "global_step": 191022, "epoch": 2301} {"train_loss": -24.0128231048584, "global_step": 191023, "epoch": 2301} {"train_loss": -24.066823959350586, "global_step": 191024, "epoch": 2301} {"train_loss": -24.214038848876953, "global_step": 191025, "epoch": 2301} {"train_loss": -24.23710823059082, "global_step": 191026, "epoch": 2301} {"train_loss": -23.66507911682129, "global_step": 191027, "epoch": 2301} {"train_loss": -24.30829429626465, "global_step": 191028, "epoch": 2301} {"train_loss": -24.4066219329834, "global_step": 191029, "epoch": 2301} {"train_loss": -23.767948150634766, "global_step": 191030, "epoch": 2301} {"train_loss": -24.303571701049805, "global_step": 191031, "epoch": 2301} {"train_loss": -24.27587890625, "global_step": 191032, "epoch": 2301} {"train_loss": -23.7308349609375, "global_step": 191033, "epoch": 2301} {"train_loss": -24.142663955688477, "global_step": 191034, "epoch": 2301} {"train_loss": -24.4231014251709, "global_step": 191035, "epoch": 2301} {"train_loss": -24.51637840270996, "global_step": 191036, "epoch": 2301} {"train_loss": -24.154489517211914, "global_step": 191037, "epoch": 2301} {"train_loss": -24.207324981689453, "global_step": 191038, "epoch": 2301} {"train_loss": -24.201242446899414, "global_step": 191039, "epoch": 2301} {"train_loss": -24.482786178588867, "global_step": 191040, "epoch": 2301} {"train_loss": -24.46035385131836, "global_step": 191041, "epoch": 2301} {"train_loss": -24.471338272094727, "global_step": 191042, "epoch": 2301} {"train_loss": -24.221420288085938, "global_step": 191043, "epoch": 2301} {"train_loss": -24.093156814575195, "global_step": 191044, "epoch": 2301} {"train_loss": -24.15171241760254, "global_step": 191045, "epoch": 2301} {"train_loss": -24.576847076416016, "global_step": 191046, "epoch": 2301} {"train_loss": -24.068233489990234, "global_step": 191047, "epoch": 2301} {"train_loss": -24.186100006103516, "global_step": 191048, "epoch": 2301} {"train_loss": -24.10776710510254, "global_step": 191049, "epoch": 2301} {"train_loss": -24.163375854492188, "global_step": 191050, "epoch": 2301} {"train_loss": -24.112245559692383, "global_step": 191051, "epoch": 2301} {"train_loss": -24.204448699951172, "global_step": 191052, "epoch": 2301} {"train_loss": -24.471418380737305, "global_step": 191053, "epoch": 2301} {"train_loss": -24.385520935058594, "global_step": 191054, "epoch": 2301} {"train_loss": -24.128957748413086, "global_step": 191055, "epoch": 2301} {"train_loss": -24.09272575378418, "global_step": 191056, "epoch": 2301} {"train_loss": -23.914793014526367, "global_step": 191057, "epoch": 2301} {"train_loss": -23.776391983032227, "global_step": 191058, "epoch": 2301} {"train_loss": -24.133264541625977, "global_step": 191059, "epoch": 2301} {"train_loss": -23.845346450805664, "global_step": 191060, "epoch": 2301} {"train_loss": -24.426258087158203, "global_step": 191061, "epoch": 2301} {"train_loss": -24.120210647583008, "global_step": 191062, "epoch": 2301} {"train_loss": -24.16315269470215, "global_step": 191063, "epoch": 2301} {"train_loss": -23.943532943725586, "global_step": 191064, "epoch": 2301} {"train_loss": -24.061329485422156, "global_step": 191065, "epoch": 2301, "val_loss": 6540544.0} {"train_loss": -23.35968780517578, "global_step": 191066, "epoch": 2302} {"train_loss": -23.44148063659668, "global_step": 191067, "epoch": 2302} {"train_loss": -24.153013229370117, "global_step": 191068, "epoch": 2302} {"train_loss": -23.404251098632812, "global_step": 191069, "epoch": 2302} {"train_loss": -23.8692684173584, "global_step": 191070, "epoch": 2302} {"train_loss": -23.698322296142578, "global_step": 191071, "epoch": 2302} {"train_loss": -23.626068115234375, "global_step": 191072, "epoch": 2302} {"train_loss": -23.78530502319336, "global_step": 191073, "epoch": 2302} {"train_loss": -23.578332901000977, "global_step": 191074, "epoch": 2302} {"train_loss": -23.399539947509766, "global_step": 191075, "epoch": 2302} {"train_loss": -24.022886276245117, "global_step": 191076, "epoch": 2302} {"train_loss": -23.4019832611084, "global_step": 191077, "epoch": 2302} {"train_loss": -23.708471298217773, "global_step": 191078, "epoch": 2302} {"train_loss": -23.60544776916504, "global_step": 191079, "epoch": 2302} {"train_loss": -23.28838539123535, "global_step": 191080, "epoch": 2302} {"train_loss": -24.165996551513672, "global_step": 191081, "epoch": 2302} {"train_loss": -23.785547256469727, "global_step": 191082, "epoch": 2302} {"train_loss": -23.398550033569336, "global_step": 191083, "epoch": 2302} {"train_loss": -23.53731346130371, "global_step": 191084, "epoch": 2302} {"train_loss": -23.87799072265625, "global_step": 191085, "epoch": 2302} {"train_loss": -23.8275203704834, "global_step": 191086, "epoch": 2302} {"train_loss": -23.672590255737305, "global_step": 191087, "epoch": 2302} {"train_loss": -24.168344497680664, "global_step": 191088, "epoch": 2302} {"train_loss": -23.608219146728516, "global_step": 191089, "epoch": 2302} {"train_loss": -23.868988037109375, "global_step": 191090, "epoch": 2302} {"train_loss": -23.961448669433594, "global_step": 191091, "epoch": 2302} {"train_loss": -23.87714958190918, "global_step": 191092, "epoch": 2302} {"train_loss": -23.87145233154297, "global_step": 191093, "epoch": 2302} {"train_loss": -23.962406158447266, "global_step": 191094, "epoch": 2302} {"train_loss": -24.1340389251709, "global_step": 191095, "epoch": 2302} {"train_loss": -24.117231369018555, "global_step": 191096, "epoch": 2302} {"train_loss": -24.120891571044922, "global_step": 191097, "epoch": 2302} {"train_loss": -23.97020721435547, "global_step": 191098, "epoch": 2302} {"train_loss": -24.337305068969727, "global_step": 191099, "epoch": 2302} {"train_loss": -24.274070739746094, "global_step": 191100, "epoch": 2302} {"train_loss": -24.328519821166992, "global_step": 191101, "epoch": 2302} {"train_loss": -24.33403968811035, "global_step": 191102, "epoch": 2302} {"train_loss": -24.125646591186523, "global_step": 191103, "epoch": 2302} {"train_loss": -24.370290756225586, "global_step": 191104, "epoch": 2302} {"train_loss": -24.08038902282715, "global_step": 191105, "epoch": 2302} {"train_loss": -24.15279197692871, "global_step": 191106, "epoch": 2302} {"train_loss": -24.054759979248047, "global_step": 191107, "epoch": 2302} {"train_loss": -23.8592529296875, "global_step": 191108, "epoch": 2302} {"train_loss": -24.274612426757812, "global_step": 191109, "epoch": 2302} {"train_loss": -24.20363998413086, "global_step": 191110, "epoch": 2302} {"train_loss": -24.163402557373047, "global_step": 191111, "epoch": 2302} {"train_loss": -24.070236206054688, "global_step": 191112, "epoch": 2302} {"train_loss": -23.904895782470703, "global_step": 191113, "epoch": 2302} {"train_loss": -24.126728057861328, "global_step": 191114, "epoch": 2302} {"train_loss": -24.35447120666504, "global_step": 191115, "epoch": 2302} {"train_loss": -23.763769149780273, "global_step": 191116, "epoch": 2302} {"train_loss": -23.847440719604492, "global_step": 191117, "epoch": 2302} {"train_loss": -24.369314193725586, "global_step": 191118, "epoch": 2302} {"train_loss": -23.695377349853516, "global_step": 191119, "epoch": 2302} {"train_loss": -23.816640853881836, "global_step": 191120, "epoch": 2302} {"train_loss": -24.59747886657715, "global_step": 191121, "epoch": 2302} {"train_loss": -23.92597770690918, "global_step": 191122, "epoch": 2302} {"train_loss": -23.90252113342285, "global_step": 191123, "epoch": 2302} {"train_loss": -24.249591827392578, "global_step": 191124, "epoch": 2302} {"train_loss": -23.721277236938477, "global_step": 191125, "epoch": 2302} {"train_loss": -24.554285049438477, "global_step": 191126, "epoch": 2302} {"train_loss": -23.847640991210938, "global_step": 191127, "epoch": 2302} {"train_loss": -24.25465965270996, "global_step": 191128, "epoch": 2302} {"train_loss": -23.723037719726562, "global_step": 191129, "epoch": 2302} {"train_loss": -23.861167907714844, "global_step": 191130, "epoch": 2302} {"train_loss": -23.940532684326172, "global_step": 191131, "epoch": 2302} {"train_loss": -24.271507263183594, "global_step": 191132, "epoch": 2302} {"train_loss": -24.03997802734375, "global_step": 191133, "epoch": 2302} {"train_loss": -23.87519073486328, "global_step": 191134, "epoch": 2302} {"train_loss": -24.119653701782227, "global_step": 191135, "epoch": 2302} {"train_loss": -24.376237869262695, "global_step": 191136, "epoch": 2302} {"train_loss": -23.902938842773438, "global_step": 191137, "epoch": 2302} {"train_loss": -24.183805465698242, "global_step": 191138, "epoch": 2302} {"train_loss": -23.634870529174805, "global_step": 191139, "epoch": 2302} {"train_loss": -24.718717575073242, "global_step": 191140, "epoch": 2302} {"train_loss": -23.884906768798828, "global_step": 191141, "epoch": 2302} {"train_loss": -24.354578018188477, "global_step": 191142, "epoch": 2302} {"train_loss": -24.221603393554688, "global_step": 191143, "epoch": 2302} {"train_loss": -24.398178100585938, "global_step": 191144, "epoch": 2302} {"train_loss": -24.13178825378418, "global_step": 191145, "epoch": 2302} {"train_loss": -24.158750534057617, "global_step": 191146, "epoch": 2302} {"train_loss": -24.04530906677246, "global_step": 191147, "epoch": 2302} {"train_loss": -23.979616808604046, "global_step": 191148, "epoch": 2302, "val_loss": 6536011.0} {"train_loss": -23.1634578704834, "global_step": 191149, "epoch": 2303} {"train_loss": -23.76869010925293, "global_step": 191150, "epoch": 2303} {"train_loss": -23.17042350769043, "global_step": 191151, "epoch": 2303} {"train_loss": -23.81556510925293, "global_step": 191152, "epoch": 2303} {"train_loss": -23.60663414001465, "global_step": 191153, "epoch": 2303} {"train_loss": -23.696340560913086, "global_step": 191154, "epoch": 2303} {"train_loss": -23.682575225830078, "global_step": 191155, "epoch": 2303} {"train_loss": -23.848365783691406, "global_step": 191156, "epoch": 2303} {"train_loss": -23.990055084228516, "global_step": 191157, "epoch": 2303} {"train_loss": -23.41948890686035, "global_step": 191158, "epoch": 2303} {"train_loss": -23.81275749206543, "global_step": 191159, "epoch": 2303} {"train_loss": -23.965076446533203, "global_step": 191160, "epoch": 2303} {"train_loss": -23.738689422607422, "global_step": 191161, "epoch": 2303} {"train_loss": -23.9443302154541, "global_step": 191162, "epoch": 2303} {"train_loss": -23.783044815063477, "global_step": 191163, "epoch": 2303} {"train_loss": -23.72739028930664, "global_step": 191164, "epoch": 2303} {"train_loss": -23.739276885986328, "global_step": 191165, "epoch": 2303} {"train_loss": -23.929166793823242, "global_step": 191166, "epoch": 2303} {"train_loss": -24.05527687072754, "global_step": 191167, "epoch": 2303} {"train_loss": -23.94601821899414, "global_step": 191168, "epoch": 2303} {"train_loss": -23.829519271850586, "global_step": 191169, "epoch": 2303} {"train_loss": -23.86895751953125, "global_step": 191170, "epoch": 2303} {"train_loss": -23.673688888549805, "global_step": 191171, "epoch": 2303} {"train_loss": -23.82986068725586, "global_step": 191172, "epoch": 2303} {"train_loss": -24.005294799804688, "global_step": 191173, "epoch": 2303} {"train_loss": -24.012861251831055, "global_step": 191174, "epoch": 2303} {"train_loss": -23.799150466918945, "global_step": 191175, "epoch": 2303} {"train_loss": -24.053979873657227, "global_step": 191176, "epoch": 2303} {"train_loss": -24.01837158203125, "global_step": 191177, "epoch": 2303} {"train_loss": -24.140180587768555, "global_step": 191178, "epoch": 2303} {"train_loss": -24.15384292602539, "global_step": 191179, "epoch": 2303} {"train_loss": -24.117521286010742, "global_step": 191180, "epoch": 2303} {"train_loss": -23.77064323425293, "global_step": 191181, "epoch": 2303} {"train_loss": -24.293909072875977, "global_step": 191182, "epoch": 2303} {"train_loss": -23.733373641967773, "global_step": 191183, "epoch": 2303} {"train_loss": -24.005434036254883, "global_step": 191184, "epoch": 2303} {"train_loss": -24.379741668701172, "global_step": 191185, "epoch": 2303} {"train_loss": -24.300195693969727, "global_step": 191186, "epoch": 2303} {"train_loss": -24.140363693237305, "global_step": 191187, "epoch": 2303} {"train_loss": -24.308189392089844, "global_step": 191188, "epoch": 2303} {"train_loss": -24.177352905273438, "global_step": 191189, "epoch": 2303} {"train_loss": -24.628158569335938, "global_step": 191190, "epoch": 2303} {"train_loss": -24.268146514892578, "global_step": 191191, "epoch": 2303} {"train_loss": -23.999353408813477, "global_step": 191192, "epoch": 2303} {"train_loss": -23.92915916442871, "global_step": 191193, "epoch": 2303} {"train_loss": -24.290586471557617, "global_step": 191194, "epoch": 2303} {"train_loss": -24.426006317138672, "global_step": 191195, "epoch": 2303} {"train_loss": -24.343961715698242, "global_step": 191196, "epoch": 2303} {"train_loss": -24.16786003112793, "global_step": 191197, "epoch": 2303} {"train_loss": -24.315784454345703, "global_step": 191198, "epoch": 2303} {"train_loss": -24.156482696533203, "global_step": 191199, "epoch": 2303} {"train_loss": -24.10663414001465, "global_step": 191200, "epoch": 2303} {"train_loss": -23.9683837890625, "global_step": 191201, "epoch": 2303} {"train_loss": -23.585416793823242, "global_step": 191202, "epoch": 2303} {"train_loss": -23.90916633605957, "global_step": 191203, "epoch": 2303} {"train_loss": -24.004697799682617, "global_step": 191204, "epoch": 2303} {"train_loss": -23.97348403930664, "global_step": 191205, "epoch": 2303} {"train_loss": -24.416303634643555, "global_step": 191206, "epoch": 2303} {"train_loss": -24.36356544494629, "global_step": 191207, "epoch": 2303} {"train_loss": -23.94441032409668, "global_step": 191208, "epoch": 2303} {"train_loss": -24.408781051635742, "global_step": 191209, "epoch": 2303} {"train_loss": -24.25860023498535, "global_step": 191210, "epoch": 2303} {"train_loss": -24.011499404907227, "global_step": 191211, "epoch": 2303} {"train_loss": -23.669347763061523, "global_step": 191212, "epoch": 2303} {"train_loss": -24.498037338256836, "global_step": 191213, "epoch": 2303} {"train_loss": -23.82719612121582, "global_step": 191214, "epoch": 2303} {"train_loss": -24.1704158782959, "global_step": 191215, "epoch": 2303} {"train_loss": -24.028030395507812, "global_step": 191216, "epoch": 2303} {"train_loss": -24.059900283813477, "global_step": 191217, "epoch": 2303} {"train_loss": -24.289173126220703, "global_step": 191218, "epoch": 2303} {"train_loss": -24.155675888061523, "global_step": 191219, "epoch": 2303} {"train_loss": -24.220197677612305, "global_step": 191220, "epoch": 2303} {"train_loss": -24.03203773498535, "global_step": 191221, "epoch": 2303} {"train_loss": -24.291940689086914, "global_step": 191222, "epoch": 2303} {"train_loss": -24.287525177001953, "global_step": 191223, "epoch": 2303} {"train_loss": -24.086111068725586, "global_step": 191224, "epoch": 2303} {"train_loss": -24.21738624572754, "global_step": 191225, "epoch": 2303} {"train_loss": -24.13075828552246, "global_step": 191226, "epoch": 2303} {"train_loss": -23.516225814819336, "global_step": 191227, "epoch": 2303} {"train_loss": -24.198606491088867, "global_step": 191228, "epoch": 2303} {"train_loss": -24.230104446411133, "global_step": 191229, "epoch": 2303} {"train_loss": -24.119617462158203, "global_step": 191230, "epoch": 2303} {"train_loss": -24.0018482667854, "global_step": 191231, "epoch": 2303, "val_loss": 6545536.0} {"train_loss": -23.341552734375, "global_step": 191232, "epoch": 2304} {"train_loss": -24.019899368286133, "global_step": 191233, "epoch": 2304} {"train_loss": -23.646011352539062, "global_step": 191234, "epoch": 2304} {"train_loss": -24.12118148803711, "global_step": 191235, "epoch": 2304} {"train_loss": -23.82174301147461, "global_step": 191236, "epoch": 2304} {"train_loss": -23.653173446655273, "global_step": 191237, "epoch": 2304} {"train_loss": -23.799243927001953, "global_step": 191238, "epoch": 2304} {"train_loss": -23.8957462310791, "global_step": 191239, "epoch": 2304} {"train_loss": -24.147336959838867, "global_step": 191240, "epoch": 2304} {"train_loss": -23.418825149536133, "global_step": 191241, "epoch": 2304} {"train_loss": -23.529056549072266, "global_step": 191242, "epoch": 2304} {"train_loss": -23.61422348022461, "global_step": 191243, "epoch": 2304} {"train_loss": -23.864267349243164, "global_step": 191244, "epoch": 2304} {"train_loss": -24.105899810791016, "global_step": 191245, "epoch": 2304} {"train_loss": -23.66712188720703, "global_step": 191246, "epoch": 2304} {"train_loss": -24.0048828125, "global_step": 191247, "epoch": 2304} {"train_loss": -24.058670043945312, "global_step": 191248, "epoch": 2304} {"train_loss": -23.875503540039062, "global_step": 191249, "epoch": 2304} {"train_loss": -24.074167251586914, "global_step": 191250, "epoch": 2304} {"train_loss": -24.09906578063965, "global_step": 191251, "epoch": 2304} {"train_loss": -24.159339904785156, "global_step": 191252, "epoch": 2304} {"train_loss": -24.08808135986328, "global_step": 191253, "epoch": 2304} {"train_loss": -23.835325241088867, "global_step": 191254, "epoch": 2304} {"train_loss": -23.9829158782959, "global_step": 191255, "epoch": 2304} {"train_loss": -24.236425399780273, "global_step": 191256, "epoch": 2304} {"train_loss": -23.904691696166992, "global_step": 191257, "epoch": 2304} {"train_loss": -23.89320182800293, "global_step": 191258, "epoch": 2304} {"train_loss": -23.927213668823242, "global_step": 191259, "epoch": 2304} {"train_loss": -24.603836059570312, "global_step": 191260, "epoch": 2304} {"train_loss": -24.17236328125, "global_step": 191261, "epoch": 2304} {"train_loss": -24.164642333984375, "global_step": 191262, "epoch": 2304} {"train_loss": -24.20091438293457, "global_step": 191263, "epoch": 2304} {"train_loss": -23.98978614807129, "global_step": 191264, "epoch": 2304} {"train_loss": -24.048330307006836, "global_step": 191265, "epoch": 2304} {"train_loss": -23.843021392822266, "global_step": 191266, "epoch": 2304} {"train_loss": -24.06068992614746, "global_step": 191267, "epoch": 2304} {"train_loss": -24.063587188720703, "global_step": 191268, "epoch": 2304} {"train_loss": -24.00288200378418, "global_step": 191269, "epoch": 2304} {"train_loss": -24.011159896850586, "global_step": 191270, "epoch": 2304} {"train_loss": -23.947994232177734, "global_step": 191271, "epoch": 2304} {"train_loss": -24.319509506225586, "global_step": 191272, "epoch": 2304} {"train_loss": -23.968591690063477, "global_step": 191273, "epoch": 2304} {"train_loss": -23.886417388916016, "global_step": 191274, "epoch": 2304} {"train_loss": -24.032712936401367, "global_step": 191275, "epoch": 2304} {"train_loss": -24.258760452270508, "global_step": 191276, "epoch": 2304} {"train_loss": -23.91165542602539, "global_step": 191277, "epoch": 2304} {"train_loss": -24.053024291992188, "global_step": 191278, "epoch": 2304} {"train_loss": -24.154935836791992, "global_step": 191279, "epoch": 2304} {"train_loss": -23.93699836730957, "global_step": 191280, "epoch": 2304} {"train_loss": -24.153989791870117, "global_step": 191281, "epoch": 2304} {"train_loss": -23.846410751342773, "global_step": 191282, "epoch": 2304} {"train_loss": -23.755186080932617, "global_step": 191283, "epoch": 2304} {"train_loss": -24.447834014892578, "global_step": 191284, "epoch": 2304} {"train_loss": -24.129621505737305, "global_step": 191285, "epoch": 2304} {"train_loss": -23.97650146484375, "global_step": 191286, "epoch": 2304} {"train_loss": -24.40644645690918, "global_step": 191287, "epoch": 2304} {"train_loss": -24.03339195251465, "global_step": 191288, "epoch": 2304} {"train_loss": -24.083654403686523, "global_step": 191289, "epoch": 2304} {"train_loss": -24.087491989135742, "global_step": 191290, "epoch": 2304} {"train_loss": -24.19741439819336, "global_step": 191291, "epoch": 2304} {"train_loss": -24.399093627929688, "global_step": 191292, "epoch": 2304} {"train_loss": -23.8940486907959, "global_step": 191293, "epoch": 2304} {"train_loss": -23.927295684814453, "global_step": 191294, "epoch": 2304} {"train_loss": -24.176626205444336, "global_step": 191295, "epoch": 2304} {"train_loss": -23.930137634277344, "global_step": 191296, "epoch": 2304} {"train_loss": -23.38055992126465, "global_step": 191297, "epoch": 2304} {"train_loss": -23.801715850830078, "global_step": 191298, "epoch": 2304} {"train_loss": -23.9652156829834, "global_step": 191299, "epoch": 2304} {"train_loss": -23.672739028930664, "global_step": 191300, "epoch": 2304} {"train_loss": -23.775117874145508, "global_step": 191301, "epoch": 2304} {"train_loss": -23.901777267456055, "global_step": 191302, "epoch": 2304} {"train_loss": -24.383079528808594, "global_step": 191303, "epoch": 2304} {"train_loss": -24.10544776916504, "global_step": 191304, "epoch": 2304} {"train_loss": -23.964065551757812, "global_step": 191305, "epoch": 2304} {"train_loss": -23.55216407775879, "global_step": 191306, "epoch": 2304} {"train_loss": -24.13862419128418, "global_step": 191307, "epoch": 2304} {"train_loss": -24.20930290222168, "global_step": 191308, "epoch": 2304} {"train_loss": -24.16547966003418, "global_step": 191309, "epoch": 2304} {"train_loss": -24.4710636138916, "global_step": 191310, "epoch": 2304} {"train_loss": -24.193204879760742, "global_step": 191311, "epoch": 2304} {"train_loss": -23.803768157958984, "global_step": 191312, "epoch": 2304} {"train_loss": -24.20210838317871, "global_step": 191313, "epoch": 2304} {"train_loss": -24.006514882466877, "global_step": 191314, "epoch": 2304, "val_loss": 6521613.0} {"train_loss": -23.160802841186523, "global_step": 191315, "epoch": 2305} {"train_loss": -22.96268653869629, "global_step": 191316, "epoch": 2305} {"train_loss": -23.85964012145996, "global_step": 191317, "epoch": 2305} {"train_loss": -23.36879539489746, "global_step": 191318, "epoch": 2305} {"train_loss": -22.990304946899414, "global_step": 191319, "epoch": 2305} {"train_loss": -24.017797470092773, "global_step": 191320, "epoch": 2305} {"train_loss": -23.282175064086914, "global_step": 191321, "epoch": 2305} {"train_loss": -23.1802921295166, "global_step": 191322, "epoch": 2305} {"train_loss": -23.31465721130371, "global_step": 191323, "epoch": 2305} {"train_loss": -23.405017852783203, "global_step": 191324, "epoch": 2305} {"train_loss": -23.79205322265625, "global_step": 191325, "epoch": 2305} {"train_loss": -23.720678329467773, "global_step": 191326, "epoch": 2305} {"train_loss": -24.111820220947266, "global_step": 191327, "epoch": 2305} {"train_loss": -23.759449005126953, "global_step": 191328, "epoch": 2305} {"train_loss": -23.611915588378906, "global_step": 191329, "epoch": 2305} {"train_loss": -23.561548233032227, "global_step": 191330, "epoch": 2305} {"train_loss": -23.823699951171875, "global_step": 191331, "epoch": 2305} {"train_loss": -24.08108901977539, "global_step": 191332, "epoch": 2305} {"train_loss": -24.39269256591797, "global_step": 191333, "epoch": 2305} {"train_loss": -24.097692489624023, "global_step": 191334, "epoch": 2305} {"train_loss": -24.08275032043457, "global_step": 191335, "epoch": 2305} {"train_loss": -23.946149826049805, "global_step": 191336, "epoch": 2305} {"train_loss": -24.21194839477539, "global_step": 191337, "epoch": 2305} {"train_loss": -24.025815963745117, "global_step": 191338, "epoch": 2305} {"train_loss": -23.898847579956055, "global_step": 191339, "epoch": 2305} {"train_loss": -23.802183151245117, "global_step": 191340, "epoch": 2305} {"train_loss": -24.11053466796875, "global_step": 191341, "epoch": 2305} {"train_loss": -24.177066802978516, "global_step": 191342, "epoch": 2305} {"train_loss": -23.904991149902344, "global_step": 191343, "epoch": 2305} {"train_loss": -23.86482810974121, "global_step": 191344, "epoch": 2305} {"train_loss": -24.510549545288086, "global_step": 191345, "epoch": 2305} {"train_loss": -24.194509506225586, "global_step": 191346, "epoch": 2305} {"train_loss": -24.185758590698242, "global_step": 191347, "epoch": 2305} {"train_loss": -24.50958251953125, "global_step": 191348, "epoch": 2305} {"train_loss": -24.33237075805664, "global_step": 191349, "epoch": 2305} {"train_loss": -24.44771385192871, "global_step": 191350, "epoch": 2305} {"train_loss": -23.727130889892578, "global_step": 191351, "epoch": 2305} {"train_loss": -23.986570358276367, "global_step": 191352, "epoch": 2305} {"train_loss": -24.157787322998047, "global_step": 191353, "epoch": 2305} {"train_loss": -24.332189559936523, "global_step": 191354, "epoch": 2305} {"train_loss": -24.311222076416016, "global_step": 191355, "epoch": 2305} {"train_loss": -24.126832962036133, "global_step": 191356, "epoch": 2305} {"train_loss": -23.73066520690918, "global_step": 191357, "epoch": 2305} {"train_loss": -23.971460342407227, "global_step": 191358, "epoch": 2305} {"train_loss": -24.428781509399414, "global_step": 191359, "epoch": 2305} {"train_loss": -24.288305282592773, "global_step": 191360, "epoch": 2305} {"train_loss": -23.9388370513916, "global_step": 191361, "epoch": 2305} {"train_loss": -24.13136100769043, "global_step": 191362, "epoch": 2305} {"train_loss": -24.199132919311523, "global_step": 191363, "epoch": 2305} {"train_loss": -23.911828994750977, "global_step": 191364, "epoch": 2305} {"train_loss": -24.084909439086914, "global_step": 191365, "epoch": 2305} {"train_loss": -24.162946701049805, "global_step": 191366, "epoch": 2305} {"train_loss": -24.035663604736328, "global_step": 191367, "epoch": 2305} {"train_loss": -24.371213912963867, "global_step": 191368, "epoch": 2305} {"train_loss": -24.084487915039062, "global_step": 191369, "epoch": 2305} {"train_loss": -24.083759307861328, "global_step": 191370, "epoch": 2305} {"train_loss": -23.95947265625, "global_step": 191371, "epoch": 2305} {"train_loss": -24.167236328125, "global_step": 191372, "epoch": 2305} {"train_loss": -23.653200149536133, "global_step": 191373, "epoch": 2305} {"train_loss": -23.925432205200195, "global_step": 191374, "epoch": 2305} {"train_loss": -24.217727661132812, "global_step": 191375, "epoch": 2305} {"train_loss": -24.355449676513672, "global_step": 191376, "epoch": 2305} {"train_loss": -24.04596519470215, "global_step": 191377, "epoch": 2305} {"train_loss": -24.21576499938965, "global_step": 191378, "epoch": 2305} {"train_loss": -24.58807945251465, "global_step": 191379, "epoch": 2305} {"train_loss": -24.366601943969727, "global_step": 191380, "epoch": 2305} {"train_loss": -23.9566650390625, "global_step": 191381, "epoch": 2305} {"train_loss": -24.514699935913086, "global_step": 191382, "epoch": 2305} {"train_loss": -24.252567291259766, "global_step": 191383, "epoch": 2305} {"train_loss": -24.3127384185791, "global_step": 191384, "epoch": 2305} {"train_loss": -24.23762321472168, "global_step": 191385, "epoch": 2305} {"train_loss": -24.130517959594727, "global_step": 191386, "epoch": 2305} {"train_loss": -24.495302200317383, "global_step": 191387, "epoch": 2305} {"train_loss": -24.171802520751953, "global_step": 191388, "epoch": 2305} {"train_loss": -24.262659072875977, "global_step": 191389, "epoch": 2305} {"train_loss": -24.298139572143555, "global_step": 191390, "epoch": 2305} {"train_loss": -24.351119995117188, "global_step": 191391, "epoch": 2305} {"train_loss": -24.176939010620117, "global_step": 191392, "epoch": 2305} {"train_loss": -24.236574172973633, "global_step": 191393, "epoch": 2305} {"train_loss": -24.184860229492188, "global_step": 191394, "epoch": 2305} {"train_loss": -23.977285385131836, "global_step": 191395, "epoch": 2305} {"train_loss": -24.209430694580078, "global_step": 191396, "epoch": 2305} {"train_loss": -24.027606389608728, "global_step": 191397, "epoch": 2305, "val_loss": 6583370.0} {"train_loss": -23.857023239135742, "global_step": 191398, "epoch": 2306} {"train_loss": -23.88083839416504, "global_step": 191399, "epoch": 2306} {"train_loss": -23.933120727539062, "global_step": 191400, "epoch": 2306} {"train_loss": -24.181344985961914, "global_step": 191401, "epoch": 2306} {"train_loss": -24.034717559814453, "global_step": 191402, "epoch": 2306} {"train_loss": -23.759138107299805, "global_step": 191403, "epoch": 2306} {"train_loss": -23.989639282226562, "global_step": 191404, "epoch": 2306} {"train_loss": -23.5811824798584, "global_step": 191405, "epoch": 2306} {"train_loss": -23.878707885742188, "global_step": 191406, "epoch": 2306} {"train_loss": -23.9901180267334, "global_step": 191407, "epoch": 2306} {"train_loss": -23.67745590209961, "global_step": 191408, "epoch": 2306} {"train_loss": -23.94854164123535, "global_step": 191409, "epoch": 2306} {"train_loss": -24.065279006958008, "global_step": 191410, "epoch": 2306} {"train_loss": -23.35160255432129, "global_step": 191411, "epoch": 2306} {"train_loss": -24.311508178710938, "global_step": 191412, "epoch": 2306} {"train_loss": -23.716781616210938, "global_step": 191413, "epoch": 2306} {"train_loss": -23.864957809448242, "global_step": 191414, "epoch": 2306} {"train_loss": -23.633026123046875, "global_step": 191415, "epoch": 2306} {"train_loss": -24.001935958862305, "global_step": 191416, "epoch": 2306} {"train_loss": -23.995553970336914, "global_step": 191417, "epoch": 2306} {"train_loss": -24.099767684936523, "global_step": 191418, "epoch": 2306} {"train_loss": -23.95344352722168, "global_step": 191419, "epoch": 2306} {"train_loss": -24.02998161315918, "global_step": 191420, "epoch": 2306} {"train_loss": -24.24393653869629, "global_step": 191421, "epoch": 2306} {"train_loss": -23.6397647857666, "global_step": 191422, "epoch": 2306} {"train_loss": -23.99397850036621, "global_step": 191423, "epoch": 2306} {"train_loss": -24.179380416870117, "global_step": 191424, "epoch": 2306} {"train_loss": -23.886425018310547, "global_step": 191425, "epoch": 2306} {"train_loss": -23.787260055541992, "global_step": 191426, "epoch": 2306} {"train_loss": -23.774343490600586, "global_step": 191427, "epoch": 2306} {"train_loss": -24.079198837280273, "global_step": 191428, "epoch": 2306} {"train_loss": -23.97139549255371, "global_step": 191429, "epoch": 2306} {"train_loss": -24.355955123901367, "global_step": 191430, "epoch": 2306} {"train_loss": -24.162662506103516, "global_step": 191431, "epoch": 2306} {"train_loss": -23.92742919921875, "global_step": 191432, "epoch": 2306} {"train_loss": -24.29550552368164, "global_step": 191433, "epoch": 2306} {"train_loss": -24.12064552307129, "global_step": 191434, "epoch": 2306} {"train_loss": -23.84385108947754, "global_step": 191435, "epoch": 2306} {"train_loss": -24.1835994720459, "global_step": 191436, "epoch": 2306} {"train_loss": -24.152692794799805, "global_step": 191437, "epoch": 2306} {"train_loss": -24.0006160736084, "global_step": 191438, "epoch": 2306} {"train_loss": -24.43313217163086, "global_step": 191439, "epoch": 2306} {"train_loss": -23.97661018371582, "global_step": 191440, "epoch": 2306} {"train_loss": -24.352752685546875, "global_step": 191441, "epoch": 2306} {"train_loss": -24.015865325927734, "global_step": 191442, "epoch": 2306} {"train_loss": -23.818634033203125, "global_step": 191443, "epoch": 2306} {"train_loss": -24.088327407836914, "global_step": 191444, "epoch": 2306} {"train_loss": -24.300527572631836, "global_step": 191445, "epoch": 2306} {"train_loss": -23.88881492614746, "global_step": 191446, "epoch": 2306} {"train_loss": -24.316556930541992, "global_step": 191447, "epoch": 2306} {"train_loss": -24.060199737548828, "global_step": 191448, "epoch": 2306} {"train_loss": -24.041034698486328, "global_step": 191449, "epoch": 2306} {"train_loss": -24.01922607421875, "global_step": 191450, "epoch": 2306} {"train_loss": -23.79757308959961, "global_step": 191451, "epoch": 2306} {"train_loss": -24.3044376373291, "global_step": 191452, "epoch": 2306} {"train_loss": -23.93243980407715, "global_step": 191453, "epoch": 2306} {"train_loss": -24.158201217651367, "global_step": 191454, "epoch": 2306} {"train_loss": -24.15700340270996, "global_step": 191455, "epoch": 2306} {"train_loss": -24.349164962768555, "global_step": 191456, "epoch": 2306} {"train_loss": -24.35126304626465, "global_step": 191457, "epoch": 2306} {"train_loss": -23.838117599487305, "global_step": 191458, "epoch": 2306} {"train_loss": -24.197317123413086, "global_step": 191459, "epoch": 2306} {"train_loss": -24.410429000854492, "global_step": 191460, "epoch": 2306} {"train_loss": -24.336868286132812, "global_step": 191461, "epoch": 2306} {"train_loss": -23.882747650146484, "global_step": 191462, "epoch": 2306} {"train_loss": -24.065771102905273, "global_step": 191463, "epoch": 2306} {"train_loss": -24.16208839416504, "global_step": 191464, "epoch": 2306} {"train_loss": -24.048269271850586, "global_step": 191465, "epoch": 2306} {"train_loss": -24.281124114990234, "global_step": 191466, "epoch": 2306} {"train_loss": -23.80035972595215, "global_step": 191467, "epoch": 2306} {"train_loss": -24.165048599243164, "global_step": 191468, "epoch": 2306} {"train_loss": -23.992767333984375, "global_step": 191469, "epoch": 2306} {"train_loss": -24.25054359436035, "global_step": 191470, "epoch": 2306} {"train_loss": -24.3594970703125, "global_step": 191471, "epoch": 2306} {"train_loss": -24.436161041259766, "global_step": 191472, "epoch": 2306} {"train_loss": -24.032329559326172, "global_step": 191473, "epoch": 2306} {"train_loss": -24.01319694519043, "global_step": 191474, "epoch": 2306} {"train_loss": -24.248634338378906, "global_step": 191475, "epoch": 2306} {"train_loss": -24.02907371520996, "global_step": 191476, "epoch": 2306} {"train_loss": -24.185590744018555, "global_step": 191477, "epoch": 2306} {"train_loss": -24.143980026245117, "global_step": 191478, "epoch": 2306} {"train_loss": -23.974565505981445, "global_step": 191479, "epoch": 2306} {"train_loss": -24.03514209425593, "global_step": 191480, "epoch": 2306, "val_loss": 6586014.0} {"train_loss": -23.67774200439453, "global_step": 191481, "epoch": 2307} {"train_loss": -23.9870548248291, "global_step": 191482, "epoch": 2307} {"train_loss": -23.877676010131836, "global_step": 191483, "epoch": 2307} {"train_loss": -23.519466400146484, "global_step": 191484, "epoch": 2307} {"train_loss": -23.37141227722168, "global_step": 191485, "epoch": 2307} {"train_loss": -23.562719345092773, "global_step": 191486, "epoch": 2307} {"train_loss": -23.61174964904785, "global_step": 191487, "epoch": 2307} {"train_loss": -23.900869369506836, "global_step": 191488, "epoch": 2307} {"train_loss": -23.527448654174805, "global_step": 191489, "epoch": 2307} {"train_loss": -23.4804630279541, "global_step": 191490, "epoch": 2307} {"train_loss": -23.568174362182617, "global_step": 191491, "epoch": 2307} {"train_loss": -23.878250122070312, "global_step": 191492, "epoch": 2307} {"train_loss": -23.625455856323242, "global_step": 191493, "epoch": 2307} {"train_loss": -23.895557403564453, "global_step": 191494, "epoch": 2307} {"train_loss": -24.04560661315918, "global_step": 191495, "epoch": 2307} {"train_loss": -23.854124069213867, "global_step": 191496, "epoch": 2307} {"train_loss": -23.831525802612305, "global_step": 191497, "epoch": 2307} {"train_loss": -23.68641471862793, "global_step": 191498, "epoch": 2307} {"train_loss": -24.164342880249023, "global_step": 191499, "epoch": 2307} {"train_loss": -24.064247131347656, "global_step": 191500, "epoch": 2307} {"train_loss": -23.628402709960938, "global_step": 191501, "epoch": 2307} {"train_loss": -23.652896881103516, "global_step": 191502, "epoch": 2307} {"train_loss": -23.617464065551758, "global_step": 191503, "epoch": 2307} {"train_loss": -24.1217098236084, "global_step": 191504, "epoch": 2307} {"train_loss": -23.90158462524414, "global_step": 191505, "epoch": 2307} {"train_loss": -23.4521541595459, "global_step": 191506, "epoch": 2307} {"train_loss": -23.883108139038086, "global_step": 191507, "epoch": 2307} {"train_loss": -24.000469207763672, "global_step": 191508, "epoch": 2307} {"train_loss": -24.11952781677246, "global_step": 191509, "epoch": 2307} {"train_loss": -24.0915584564209, "global_step": 191510, "epoch": 2307} {"train_loss": -23.981914520263672, "global_step": 191511, "epoch": 2307} {"train_loss": -24.13813591003418, "global_step": 191512, "epoch": 2307} {"train_loss": -24.295352935791016, "global_step": 191513, "epoch": 2307} {"train_loss": -24.71317481994629, "global_step": 191514, "epoch": 2307} {"train_loss": -24.563526153564453, "global_step": 191515, "epoch": 2307} {"train_loss": -24.258642196655273, "global_step": 191516, "epoch": 2307} {"train_loss": -24.37696075439453, "global_step": 191517, "epoch": 2307} {"train_loss": -24.039438247680664, "global_step": 191518, "epoch": 2307} {"train_loss": -24.133283615112305, "global_step": 191519, "epoch": 2307} {"train_loss": -24.3681697845459, "global_step": 191520, "epoch": 2307} {"train_loss": -24.028594970703125, "global_step": 191521, "epoch": 2307} {"train_loss": -24.643606185913086, "global_step": 191522, "epoch": 2307} {"train_loss": -24.379562377929688, "global_step": 191523, "epoch": 2307} {"train_loss": -24.06810760498047, "global_step": 191524, "epoch": 2307} {"train_loss": -24.22393226623535, "global_step": 191525, "epoch": 2307} {"train_loss": -24.281625747680664, "global_step": 191526, "epoch": 2307} {"train_loss": -23.801860809326172, "global_step": 191527, "epoch": 2307} {"train_loss": -23.678115844726562, "global_step": 191528, "epoch": 2307} {"train_loss": -23.995447158813477, "global_step": 191529, "epoch": 2307} {"train_loss": -23.781347274780273, "global_step": 191530, "epoch": 2307} {"train_loss": -23.70366668701172, "global_step": 191531, "epoch": 2307} {"train_loss": -23.728376388549805, "global_step": 191532, "epoch": 2307} {"train_loss": -23.985578536987305, "global_step": 191533, "epoch": 2307} {"train_loss": -23.768835067749023, "global_step": 191534, "epoch": 2307} {"train_loss": -24.00000762939453, "global_step": 191535, "epoch": 2307} {"train_loss": -24.292173385620117, "global_step": 191536, "epoch": 2307} {"train_loss": -23.92754554748535, "global_step": 191537, "epoch": 2307} {"train_loss": -24.163740158081055, "global_step": 191538, "epoch": 2307} {"train_loss": -24.179363250732422, "global_step": 191539, "epoch": 2307} {"train_loss": -23.90237808227539, "global_step": 191540, "epoch": 2307} {"train_loss": -24.138790130615234, "global_step": 191541, "epoch": 2307} {"train_loss": -24.15248680114746, "global_step": 191542, "epoch": 2307} {"train_loss": -23.87394905090332, "global_step": 191543, "epoch": 2307} {"train_loss": -24.18509292602539, "global_step": 191544, "epoch": 2307} {"train_loss": -24.29572868347168, "global_step": 191545, "epoch": 2307} {"train_loss": -23.89993667602539, "global_step": 191546, "epoch": 2307} {"train_loss": -24.241226196289062, "global_step": 191547, "epoch": 2307} {"train_loss": -24.446550369262695, "global_step": 191548, "epoch": 2307} {"train_loss": -23.88116455078125, "global_step": 191549, "epoch": 2307} {"train_loss": -23.95964813232422, "global_step": 191550, "epoch": 2307} {"train_loss": -24.3066349029541, "global_step": 191551, "epoch": 2307} {"train_loss": -24.252416610717773, "global_step": 191552, "epoch": 2307} {"train_loss": -24.28133201599121, "global_step": 191553, "epoch": 2307} {"train_loss": -24.5059757232666, "global_step": 191554, "epoch": 2307} {"train_loss": -24.017698287963867, "global_step": 191555, "epoch": 2307} {"train_loss": -24.26833152770996, "global_step": 191556, "epoch": 2307} {"train_loss": -24.081256866455078, "global_step": 191557, "epoch": 2307} {"train_loss": -24.233936309814453, "global_step": 191558, "epoch": 2307} {"train_loss": -24.02849006652832, "global_step": 191559, "epoch": 2307} {"train_loss": -24.607925415039062, "global_step": 191560, "epoch": 2307} {"train_loss": -24.126394271850586, "global_step": 191561, "epoch": 2307} {"train_loss": -23.91288948059082, "global_step": 191562, "epoch": 2307} {"train_loss": -24.035896485110364, "global_step": 191563, "epoch": 2307, "val_loss": 6503455.0} {"train_loss": -23.708383560180664, "global_step": 191564, "epoch": 2308} {"train_loss": -23.21379852294922, "global_step": 191565, "epoch": 2308} {"train_loss": -23.540616989135742, "global_step": 191566, "epoch": 2308} {"train_loss": -24.04422378540039, "global_step": 191567, "epoch": 2308} {"train_loss": -22.854293823242188, "global_step": 191568, "epoch": 2308} {"train_loss": -23.55022621154785, "global_step": 191569, "epoch": 2308} {"train_loss": -23.16710090637207, "global_step": 191570, "epoch": 2308} {"train_loss": -23.531660079956055, "global_step": 191571, "epoch": 2308} {"train_loss": -23.408870697021484, "global_step": 191572, "epoch": 2308} {"train_loss": -23.989538192749023, "global_step": 191573, "epoch": 2308} {"train_loss": -23.34981346130371, "global_step": 191574, "epoch": 2308} {"train_loss": -23.984695434570312, "global_step": 191575, "epoch": 2308} {"train_loss": -23.680150985717773, "global_step": 191576, "epoch": 2308} {"train_loss": -23.6773681640625, "global_step": 191577, "epoch": 2308} {"train_loss": -23.82147789001465, "global_step": 191578, "epoch": 2308} {"train_loss": -23.4910831451416, "global_step": 191579, "epoch": 2308} {"train_loss": -24.065643310546875, "global_step": 191580, "epoch": 2308} {"train_loss": -23.821414947509766, "global_step": 191581, "epoch": 2308} {"train_loss": -23.605104446411133, "global_step": 191582, "epoch": 2308} {"train_loss": -23.873075485229492, "global_step": 191583, "epoch": 2308} {"train_loss": -23.636816024780273, "global_step": 191584, "epoch": 2308} {"train_loss": -23.505878448486328, "global_step": 191585, "epoch": 2308} {"train_loss": -23.964765548706055, "global_step": 191586, "epoch": 2308} {"train_loss": -24.047075271606445, "global_step": 191587, "epoch": 2308} {"train_loss": -23.7279052734375, "global_step": 191588, "epoch": 2308} {"train_loss": -23.934303283691406, "global_step": 191589, "epoch": 2308} {"train_loss": -23.3734188079834, "global_step": 191590, "epoch": 2308} {"train_loss": -23.547195434570312, "global_step": 191591, "epoch": 2308} {"train_loss": -24.132678985595703, "global_step": 191592, "epoch": 2308} {"train_loss": -23.568721771240234, "global_step": 191593, "epoch": 2308} {"train_loss": -23.558008193969727, "global_step": 191594, "epoch": 2308} {"train_loss": -23.85425567626953, "global_step": 191595, "epoch": 2308} {"train_loss": -23.83619499206543, "global_step": 191596, "epoch": 2308} {"train_loss": -24.05891990661621, "global_step": 191597, "epoch": 2308} {"train_loss": -24.189044952392578, "global_step": 191598, "epoch": 2308} {"train_loss": -23.877544403076172, "global_step": 191599, "epoch": 2308} {"train_loss": -23.9776611328125, "global_step": 191600, "epoch": 2308} {"train_loss": -24.132604598999023, "global_step": 191601, "epoch": 2308} {"train_loss": -24.13654899597168, "global_step": 191602, "epoch": 2308} {"train_loss": -24.169763565063477, "global_step": 191603, "epoch": 2308} {"train_loss": -24.28255271911621, "global_step": 191604, "epoch": 2308} {"train_loss": -24.130712509155273, "global_step": 191605, "epoch": 2308} {"train_loss": -24.321332931518555, "global_step": 191606, "epoch": 2308} {"train_loss": -24.25682830810547, "global_step": 191607, "epoch": 2308} {"train_loss": -24.512290954589844, "global_step": 191608, "epoch": 2308} {"train_loss": -24.03779411315918, "global_step": 191609, "epoch": 2308} {"train_loss": -23.980789184570312, "global_step": 191610, "epoch": 2308} {"train_loss": -24.140905380249023, "global_step": 191611, "epoch": 2308} {"train_loss": -24.340200424194336, "global_step": 191612, "epoch": 2308} {"train_loss": -23.714136123657227, "global_step": 191613, "epoch": 2308} {"train_loss": -24.37757110595703, "global_step": 191614, "epoch": 2308} {"train_loss": -23.94902992248535, "global_step": 191615, "epoch": 2308} {"train_loss": -24.17530632019043, "global_step": 191616, "epoch": 2308} {"train_loss": -24.411895751953125, "global_step": 191617, "epoch": 2308} {"train_loss": -24.027475357055664, "global_step": 191618, "epoch": 2308} {"train_loss": -24.05483627319336, "global_step": 191619, "epoch": 2308} {"train_loss": -24.575620651245117, "global_step": 191620, "epoch": 2308} {"train_loss": -24.35334587097168, "global_step": 191621, "epoch": 2308} {"train_loss": -24.12990951538086, "global_step": 191622, "epoch": 2308} {"train_loss": -24.409809112548828, "global_step": 191623, "epoch": 2308} {"train_loss": -24.52520751953125, "global_step": 191624, "epoch": 2308} {"train_loss": -24.116994857788086, "global_step": 191625, "epoch": 2308} {"train_loss": -24.163236618041992, "global_step": 191626, "epoch": 2308} {"train_loss": -24.400012969970703, "global_step": 191627, "epoch": 2308} {"train_loss": -24.546756744384766, "global_step": 191628, "epoch": 2308} {"train_loss": -24.260013580322266, "global_step": 191629, "epoch": 2308} {"train_loss": -24.28116798400879, "global_step": 191630, "epoch": 2308} {"train_loss": -24.102365493774414, "global_step": 191631, "epoch": 2308} {"train_loss": -24.624038696289062, "global_step": 191632, "epoch": 2308} {"train_loss": -24.408279418945312, "global_step": 191633, "epoch": 2308} {"train_loss": -24.616409301757812, "global_step": 191634, "epoch": 2308} {"train_loss": -24.16707420349121, "global_step": 191635, "epoch": 2308} {"train_loss": -24.721786499023438, "global_step": 191636, "epoch": 2308} {"train_loss": -24.614561080932617, "global_step": 191637, "epoch": 2308} {"train_loss": -24.31190299987793, "global_step": 191638, "epoch": 2308} {"train_loss": -24.3619384765625, "global_step": 191639, "epoch": 2308} {"train_loss": -24.091445922851562, "global_step": 191640, "epoch": 2308} {"train_loss": -24.12576675415039, "global_step": 191641, "epoch": 2308} {"train_loss": -23.533178329467773, "global_step": 191642, "epoch": 2308} {"train_loss": -24.305784225463867, "global_step": 191643, "epoch": 2308} {"train_loss": -23.933290481567383, "global_step": 191644, "epoch": 2308} {"train_loss": -23.945789337158203, "global_step": 191645, "epoch": 2308} {"train_loss": -23.995302728859777, "global_step": 191646, "epoch": 2308, "val_loss": 6493350.0} {"train_loss": -23.01234245300293, "global_step": 191647, "epoch": 2309} {"train_loss": -21.82573699951172, "global_step": 191648, "epoch": 2309} {"train_loss": -22.668533325195312, "global_step": 191649, "epoch": 2309} {"train_loss": -22.980539321899414, "global_step": 191650, "epoch": 2309} {"train_loss": -23.140602111816406, "global_step": 191651, "epoch": 2309} {"train_loss": -23.351245880126953, "global_step": 191652, "epoch": 2309} {"train_loss": -23.155954360961914, "global_step": 191653, "epoch": 2309} {"train_loss": -23.24717903137207, "global_step": 191654, "epoch": 2309} {"train_loss": -23.26282501220703, "global_step": 191655, "epoch": 2309} {"train_loss": -23.4259090423584, "global_step": 191656, "epoch": 2309} {"train_loss": -23.28165054321289, "global_step": 191657, "epoch": 2309} {"train_loss": -23.41333770751953, "global_step": 191658, "epoch": 2309} {"train_loss": -23.769428253173828, "global_step": 191659, "epoch": 2309} {"train_loss": -23.56644630432129, "global_step": 191660, "epoch": 2309} {"train_loss": -23.572683334350586, "global_step": 191661, "epoch": 2309} {"train_loss": -23.437488555908203, "global_step": 191662, "epoch": 2309} {"train_loss": -23.76016616821289, "global_step": 191663, "epoch": 2309} {"train_loss": -23.651718139648438, "global_step": 191664, "epoch": 2309} {"train_loss": -23.25754165649414, "global_step": 191665, "epoch": 2309} {"train_loss": -23.60553550720215, "global_step": 191666, "epoch": 2309} {"train_loss": -23.986722946166992, "global_step": 191667, "epoch": 2309} {"train_loss": -23.70050621032715, "global_step": 191668, "epoch": 2309} {"train_loss": -23.630788803100586, "global_step": 191669, "epoch": 2309} {"train_loss": -24.1366024017334, "global_step": 191670, "epoch": 2309} {"train_loss": -23.920639038085938, "global_step": 191671, "epoch": 2309} {"train_loss": -23.951786041259766, "global_step": 191672, "epoch": 2309} {"train_loss": -24.0721378326416, "global_step": 191673, "epoch": 2309} {"train_loss": -23.480932235717773, "global_step": 191674, "epoch": 2309} {"train_loss": -23.8515682220459, "global_step": 191675, "epoch": 2309} {"train_loss": -24.12200164794922, "global_step": 191676, "epoch": 2309} {"train_loss": -24.173538208007812, "global_step": 191677, "epoch": 2309} {"train_loss": -23.93782615661621, "global_step": 191678, "epoch": 2309} {"train_loss": -23.89655876159668, "global_step": 191679, "epoch": 2309} {"train_loss": -23.8345947265625, "global_step": 191680, "epoch": 2309} {"train_loss": -24.0142822265625, "global_step": 191681, "epoch": 2309} {"train_loss": -24.015790939331055, "global_step": 191682, "epoch": 2309} {"train_loss": -24.079776763916016, "global_step": 191683, "epoch": 2309} {"train_loss": -24.116056442260742, "global_step": 191684, "epoch": 2309} {"train_loss": -24.136066436767578, "global_step": 191685, "epoch": 2309} {"train_loss": -24.220182418823242, "global_step": 191686, "epoch": 2309} {"train_loss": -24.007551193237305, "global_step": 191687, "epoch": 2309} {"train_loss": -24.224252700805664, "global_step": 191688, "epoch": 2309} {"train_loss": -24.115808486938477, "global_step": 191689, "epoch": 2309} {"train_loss": -24.31447410583496, "global_step": 191690, "epoch": 2309} {"train_loss": -24.094755172729492, "global_step": 191691, "epoch": 2309} {"train_loss": -24.15274429321289, "global_step": 191692, "epoch": 2309} {"train_loss": -24.327892303466797, "global_step": 191693, "epoch": 2309} {"train_loss": -24.182861328125, "global_step": 191694, "epoch": 2309} {"train_loss": -24.296567916870117, "global_step": 191695, "epoch": 2309} {"train_loss": -24.118236541748047, "global_step": 191696, "epoch": 2309} {"train_loss": -24.039270401000977, "global_step": 191697, "epoch": 2309} {"train_loss": -24.177724838256836, "global_step": 191698, "epoch": 2309} {"train_loss": -24.196212768554688, "global_step": 191699, "epoch": 2309} {"train_loss": -24.147130966186523, "global_step": 191700, "epoch": 2309} {"train_loss": -24.264728546142578, "global_step": 191701, "epoch": 2309} {"train_loss": -24.256637573242188, "global_step": 191702, "epoch": 2309} {"train_loss": -24.622722625732422, "global_step": 191703, "epoch": 2309} {"train_loss": -23.796537399291992, "global_step": 191704, "epoch": 2309} {"train_loss": -24.045209884643555, "global_step": 191705, "epoch": 2309} {"train_loss": -24.595046997070312, "global_step": 191706, "epoch": 2309} {"train_loss": -24.295576095581055, "global_step": 191707, "epoch": 2309} {"train_loss": -24.418798446655273, "global_step": 191708, "epoch": 2309} {"train_loss": -24.21540641784668, "global_step": 191709, "epoch": 2309} {"train_loss": -24.202552795410156, "global_step": 191710, "epoch": 2309} {"train_loss": -24.3279972076416, "global_step": 191711, "epoch": 2309} {"train_loss": -24.32227325439453, "global_step": 191712, "epoch": 2309} {"train_loss": -24.43305015563965, "global_step": 191713, "epoch": 2309} {"train_loss": -24.336292266845703, "global_step": 191714, "epoch": 2309} {"train_loss": -23.88239097595215, "global_step": 191715, "epoch": 2309} {"train_loss": -23.90504264831543, "global_step": 191716, "epoch": 2309} {"train_loss": -24.206602096557617, "global_step": 191717, "epoch": 2309} {"train_loss": -24.134933471679688, "global_step": 191718, "epoch": 2309} {"train_loss": -24.049585342407227, "global_step": 191719, "epoch": 2309} {"train_loss": -23.95649528503418, "global_step": 191720, "epoch": 2309} {"train_loss": -23.92765235900879, "global_step": 191721, "epoch": 2309} {"train_loss": -24.16887855529785, "global_step": 191722, "epoch": 2309} {"train_loss": -23.883451461791992, "global_step": 191723, "epoch": 2309} {"train_loss": -24.161535263061523, "global_step": 191724, "epoch": 2309} {"train_loss": -24.00830841064453, "global_step": 191725, "epoch": 2309} {"train_loss": -24.228191375732422, "global_step": 191726, "epoch": 2309} {"train_loss": -24.326330184936523, "global_step": 191727, "epoch": 2309} {"train_loss": -24.166961669921875, "global_step": 191728, "epoch": 2309} {"train_loss": -23.915289154971937, "global_step": 191729, "epoch": 2309, "val_loss": 6483836.0} {"train_loss": -23.557538986206055, "global_step": 191730, "epoch": 2310} {"train_loss": -23.192014694213867, "global_step": 191731, "epoch": 2310} {"train_loss": -23.251432418823242, "global_step": 191732, "epoch": 2310} {"train_loss": -23.27716636657715, "global_step": 191733, "epoch": 2310} {"train_loss": -23.560285568237305, "global_step": 191734, "epoch": 2310} {"train_loss": -23.353652954101562, "global_step": 191735, "epoch": 2310} {"train_loss": -23.18181800842285, "global_step": 191736, "epoch": 2310} {"train_loss": -23.60703468322754, "global_step": 191737, "epoch": 2310} {"train_loss": -23.239540100097656, "global_step": 191738, "epoch": 2310} {"train_loss": -23.67884063720703, "global_step": 191739, "epoch": 2310} {"train_loss": -23.478818893432617, "global_step": 191740, "epoch": 2310} {"train_loss": -23.639554977416992, "global_step": 191741, "epoch": 2310} {"train_loss": -23.638378143310547, "global_step": 191742, "epoch": 2310} {"train_loss": -23.978151321411133, "global_step": 191743, "epoch": 2310} {"train_loss": -23.41368293762207, "global_step": 191744, "epoch": 2310} {"train_loss": -24.163320541381836, "global_step": 191745, "epoch": 2310} {"train_loss": -23.767929077148438, "global_step": 191746, "epoch": 2310} {"train_loss": -23.85963249206543, "global_step": 191747, "epoch": 2310} {"train_loss": -23.55610466003418, "global_step": 191748, "epoch": 2310} {"train_loss": -23.96485710144043, "global_step": 191749, "epoch": 2310} {"train_loss": -23.723405838012695, "global_step": 191750, "epoch": 2310} {"train_loss": -23.80245018005371, "global_step": 191751, "epoch": 2310} {"train_loss": -23.976062774658203, "global_step": 191752, "epoch": 2310} {"train_loss": -23.566673278808594, "global_step": 191753, "epoch": 2310} {"train_loss": -24.26609992980957, "global_step": 191754, "epoch": 2310} {"train_loss": -24.27068519592285, "global_step": 191755, "epoch": 2310} {"train_loss": -24.1285343170166, "global_step": 191756, "epoch": 2310} {"train_loss": -24.019323348999023, "global_step": 191757, "epoch": 2310} {"train_loss": -23.730865478515625, "global_step": 191758, "epoch": 2310} {"train_loss": -24.20876693725586, "global_step": 191759, "epoch": 2310} {"train_loss": -24.424571990966797, "global_step": 191760, "epoch": 2310} {"train_loss": -23.988798141479492, "global_step": 191761, "epoch": 2310} {"train_loss": -24.21791648864746, "global_step": 191762, "epoch": 2310} {"train_loss": -24.418354034423828, "global_step": 191763, "epoch": 2310} {"train_loss": -24.29829978942871, "global_step": 191764, "epoch": 2310} {"train_loss": -24.462543487548828, "global_step": 191765, "epoch": 2310} {"train_loss": -24.069839477539062, "global_step": 191766, "epoch": 2310} {"train_loss": -24.492446899414062, "global_step": 191767, "epoch": 2310} {"train_loss": -24.263195037841797, "global_step": 191768, "epoch": 2310} {"train_loss": -24.268766403198242, "global_step": 191769, "epoch": 2310} {"train_loss": -24.21222686767578, "global_step": 191770, "epoch": 2310} {"train_loss": -24.620527267456055, "global_step": 191771, "epoch": 2310} {"train_loss": -24.35353660583496, "global_step": 191772, "epoch": 2310} {"train_loss": -24.15468406677246, "global_step": 191773, "epoch": 2310} {"train_loss": -24.27512550354004, "global_step": 191774, "epoch": 2310} {"train_loss": -24.566381454467773, "global_step": 191775, "epoch": 2310} {"train_loss": -23.747785568237305, "global_step": 191776, "epoch": 2310} {"train_loss": -24.06166648864746, "global_step": 191777, "epoch": 2310} {"train_loss": -24.200031280517578, "global_step": 191778, "epoch": 2310} {"train_loss": -23.895450592041016, "global_step": 191779, "epoch": 2310} {"train_loss": -23.908985137939453, "global_step": 191780, "epoch": 2310} {"train_loss": -24.26456069946289, "global_step": 191781, "epoch": 2310} {"train_loss": -23.83517837524414, "global_step": 191782, "epoch": 2310} {"train_loss": -24.294843673706055, "global_step": 191783, "epoch": 2310} {"train_loss": -24.041940689086914, "global_step": 191784, "epoch": 2310} {"train_loss": -24.217071533203125, "global_step": 191785, "epoch": 2310} {"train_loss": -23.920265197753906, "global_step": 191786, "epoch": 2310} {"train_loss": -24.11534881591797, "global_step": 191787, "epoch": 2310} {"train_loss": -24.011873245239258, "global_step": 191788, "epoch": 2310} {"train_loss": -24.321447372436523, "global_step": 191789, "epoch": 2310} {"train_loss": -24.288442611694336, "global_step": 191790, "epoch": 2310} {"train_loss": -23.865692138671875, "global_step": 191791, "epoch": 2310} {"train_loss": -24.32284927368164, "global_step": 191792, "epoch": 2310} {"train_loss": -24.188636779785156, "global_step": 191793, "epoch": 2310} {"train_loss": -24.04707908630371, "global_step": 191794, "epoch": 2310} {"train_loss": -24.098506927490234, "global_step": 191795, "epoch": 2310} {"train_loss": -24.551706314086914, "global_step": 191796, "epoch": 2310} {"train_loss": -24.43531608581543, "global_step": 191797, "epoch": 2310} {"train_loss": -24.3521671295166, "global_step": 191798, "epoch": 2310} {"train_loss": -24.394622802734375, "global_step": 191799, "epoch": 2310} {"train_loss": -24.387100219726562, "global_step": 191800, "epoch": 2310} {"train_loss": -24.27980613708496, "global_step": 191801, "epoch": 2310} {"train_loss": -24.234899520874023, "global_step": 191802, "epoch": 2310} {"train_loss": -24.167770385742188, "global_step": 191803, "epoch": 2310} {"train_loss": -24.15703582763672, "global_step": 191804, "epoch": 2310} {"train_loss": -24.262298583984375, "global_step": 191805, "epoch": 2310} {"train_loss": -23.872777938842773, "global_step": 191806, "epoch": 2310} {"train_loss": -23.83712387084961, "global_step": 191807, "epoch": 2310} {"train_loss": -23.907100677490234, "global_step": 191808, "epoch": 2310} {"train_loss": -23.96748924255371, "global_step": 191809, "epoch": 2310} {"train_loss": -24.19961166381836, "global_step": 191810, "epoch": 2310} {"train_loss": -24.083093643188477, "global_step": 191811, "epoch": 2310} {"train_loss": -24.006295353533275, "global_step": 191812, "epoch": 2310, "val_loss": 6329771.0} {"train_loss": -23.383365631103516, "global_step": 191813, "epoch": 2311} {"train_loss": -23.6944522857666, "global_step": 191814, "epoch": 2311} {"train_loss": -23.70304298400879, "global_step": 191815, "epoch": 2311} {"train_loss": -22.99250602722168, "global_step": 191816, "epoch": 2311} {"train_loss": -23.66853904724121, "global_step": 191817, "epoch": 2311} {"train_loss": -23.739500045776367, "global_step": 191818, "epoch": 2311} {"train_loss": -23.735849380493164, "global_step": 191819, "epoch": 2311} {"train_loss": -23.50397300720215, "global_step": 191820, "epoch": 2311} {"train_loss": -23.728391647338867, "global_step": 191821, "epoch": 2311} {"train_loss": -23.748828887939453, "global_step": 191822, "epoch": 2311} {"train_loss": -24.016630172729492, "global_step": 191823, "epoch": 2311} {"train_loss": -23.654159545898438, "global_step": 191824, "epoch": 2311} {"train_loss": -23.92591667175293, "global_step": 191825, "epoch": 2311} {"train_loss": -23.522008895874023, "global_step": 191826, "epoch": 2311} {"train_loss": -23.88618278503418, "global_step": 191827, "epoch": 2311} {"train_loss": -23.764835357666016, "global_step": 191828, "epoch": 2311} {"train_loss": -23.800827026367188, "global_step": 191829, "epoch": 2311} {"train_loss": -23.762537002563477, "global_step": 191830, "epoch": 2311} {"train_loss": -23.939599990844727, "global_step": 191831, "epoch": 2311} {"train_loss": -24.0163631439209, "global_step": 191832, "epoch": 2311} {"train_loss": -23.535863876342773, "global_step": 191833, "epoch": 2311} {"train_loss": -23.717144012451172, "global_step": 191834, "epoch": 2311} {"train_loss": -24.007659912109375, "global_step": 191835, "epoch": 2311} {"train_loss": -24.17292594909668, "global_step": 191836, "epoch": 2311} {"train_loss": -23.98297119140625, "global_step": 191837, "epoch": 2311} {"train_loss": -24.238866806030273, "global_step": 191838, "epoch": 2311} {"train_loss": -24.144681930541992, "global_step": 191839, "epoch": 2311} {"train_loss": -24.052635192871094, "global_step": 191840, "epoch": 2311} {"train_loss": -24.20985984802246, "global_step": 191841, "epoch": 2311} {"train_loss": -23.894819259643555, "global_step": 191842, "epoch": 2311} {"train_loss": -24.149234771728516, "global_step": 191843, "epoch": 2311} {"train_loss": -24.486217498779297, "global_step": 191844, "epoch": 2311} {"train_loss": -23.898529052734375, "global_step": 191845, "epoch": 2311} {"train_loss": -24.010292053222656, "global_step": 191846, "epoch": 2311} {"train_loss": -23.935422897338867, "global_step": 191847, "epoch": 2311} {"train_loss": -24.289321899414062, "global_step": 191848, "epoch": 2311} {"train_loss": -24.315139770507812, "global_step": 191849, "epoch": 2311} {"train_loss": -24.106643676757812, "global_step": 191850, "epoch": 2311} {"train_loss": -24.05875587463379, "global_step": 191851, "epoch": 2311} {"train_loss": -24.196956634521484, "global_step": 191852, "epoch": 2311} {"train_loss": -24.132373809814453, "global_step": 191853, "epoch": 2311} {"train_loss": -23.872772216796875, "global_step": 191854, "epoch": 2311} {"train_loss": -24.41737174987793, "global_step": 191855, "epoch": 2311} {"train_loss": -24.272069931030273, "global_step": 191856, "epoch": 2311} {"train_loss": -24.10774040222168, "global_step": 191857, "epoch": 2311} {"train_loss": -23.90387725830078, "global_step": 191858, "epoch": 2311} {"train_loss": -24.285322189331055, "global_step": 191859, "epoch": 2311} {"train_loss": -24.088891983032227, "global_step": 191860, "epoch": 2311} {"train_loss": -24.141036987304688, "global_step": 191861, "epoch": 2311} {"train_loss": -24.351903915405273, "global_step": 191862, "epoch": 2311} {"train_loss": -24.247467041015625, "global_step": 191863, "epoch": 2311} {"train_loss": -24.14483642578125, "global_step": 191864, "epoch": 2311} {"train_loss": -24.500659942626953, "global_step": 191865, "epoch": 2311} {"train_loss": -24.22716522216797, "global_step": 191866, "epoch": 2311} {"train_loss": -24.35877799987793, "global_step": 191867, "epoch": 2311} {"train_loss": -24.017614364624023, "global_step": 191868, "epoch": 2311} {"train_loss": -24.2528133392334, "global_step": 191869, "epoch": 2311} {"train_loss": -24.18368911743164, "global_step": 191870, "epoch": 2311} {"train_loss": -24.194656372070312, "global_step": 191871, "epoch": 2311} {"train_loss": -24.0477352142334, "global_step": 191872, "epoch": 2311} {"train_loss": -24.033893585205078, "global_step": 191873, "epoch": 2311} {"train_loss": -24.33530616760254, "global_step": 191874, "epoch": 2311} {"train_loss": -23.95319175720215, "global_step": 191875, "epoch": 2311} {"train_loss": -24.779708862304688, "global_step": 191876, "epoch": 2311} {"train_loss": -24.320554733276367, "global_step": 191877, "epoch": 2311} {"train_loss": -24.349828720092773, "global_step": 191878, "epoch": 2311} {"train_loss": -24.121566772460938, "global_step": 191879, "epoch": 2311} {"train_loss": -24.063232421875, "global_step": 191880, "epoch": 2311} {"train_loss": -24.028430938720703, "global_step": 191881, "epoch": 2311} {"train_loss": -23.729215621948242, "global_step": 191882, "epoch": 2311} {"train_loss": -24.242326736450195, "global_step": 191883, "epoch": 2311} {"train_loss": -23.87173843383789, "global_step": 191884, "epoch": 2311} {"train_loss": -24.053253173828125, "global_step": 191885, "epoch": 2311} {"train_loss": -24.15167236328125, "global_step": 191886, "epoch": 2311} {"train_loss": -23.834718704223633, "global_step": 191887, "epoch": 2311} {"train_loss": -24.3706111907959, "global_step": 191888, "epoch": 2311} {"train_loss": -24.294647216796875, "global_step": 191889, "epoch": 2311} {"train_loss": -24.20650291442871, "global_step": 191890, "epoch": 2311} {"train_loss": -23.997241973876953, "global_step": 191891, "epoch": 2311} {"train_loss": -24.40570831298828, "global_step": 191892, "epoch": 2311} {"train_loss": -24.35151481628418, "global_step": 191893, "epoch": 2311} {"train_loss": -23.888351440429688, "global_step": 191894, "epoch": 2311} {"train_loss": -24.027731240513813, "global_step": 191895, "epoch": 2311, "val_loss": 6565590.0} {"train_loss": -23.581628799438477, "global_step": 191896, "epoch": 2312} {"train_loss": -23.494476318359375, "global_step": 191897, "epoch": 2312} {"train_loss": -23.54603385925293, "global_step": 191898, "epoch": 2312} {"train_loss": -23.7613525390625, "global_step": 191899, "epoch": 2312} {"train_loss": -23.635351181030273, "global_step": 191900, "epoch": 2312} {"train_loss": -23.70548439025879, "global_step": 191901, "epoch": 2312} {"train_loss": -23.7054443359375, "global_step": 191902, "epoch": 2312} {"train_loss": -24.044235229492188, "global_step": 191903, "epoch": 2312} {"train_loss": -23.664297103881836, "global_step": 191904, "epoch": 2312} {"train_loss": -24.033939361572266, "global_step": 191905, "epoch": 2312} {"train_loss": -24.08460235595703, "global_step": 191906, "epoch": 2312} {"train_loss": -23.71771812438965, "global_step": 191907, "epoch": 2312} {"train_loss": -23.624805450439453, "global_step": 191908, "epoch": 2312} {"train_loss": -23.7205753326416, "global_step": 191909, "epoch": 2312} {"train_loss": -23.28509521484375, "global_step": 191910, "epoch": 2312} {"train_loss": -23.825117111206055, "global_step": 191911, "epoch": 2312} {"train_loss": -23.906652450561523, "global_step": 191912, "epoch": 2312} {"train_loss": -24.01981544494629, "global_step": 191913, "epoch": 2312} {"train_loss": -23.8826847076416, "global_step": 191914, "epoch": 2312} {"train_loss": -24.302616119384766, "global_step": 191915, "epoch": 2312} {"train_loss": -24.265033721923828, "global_step": 191916, "epoch": 2312} {"train_loss": -24.18961524963379, "global_step": 191917, "epoch": 2312} {"train_loss": -24.141613006591797, "global_step": 191918, "epoch": 2312} {"train_loss": -24.1521053314209, "global_step": 191919, "epoch": 2312} {"train_loss": -23.952884674072266, "global_step": 191920, "epoch": 2312} {"train_loss": -23.99598503112793, "global_step": 191921, "epoch": 2312} {"train_loss": -23.789304733276367, "global_step": 191922, "epoch": 2312} {"train_loss": -24.378135681152344, "global_step": 191923, "epoch": 2312} {"train_loss": -23.91724967956543, "global_step": 191924, "epoch": 2312} {"train_loss": -24.246862411499023, "global_step": 191925, "epoch": 2312} {"train_loss": -24.211063385009766, "global_step": 191926, "epoch": 2312} {"train_loss": -23.758237838745117, "global_step": 191927, "epoch": 2312} {"train_loss": -23.838830947875977, "global_step": 191928, "epoch": 2312} {"train_loss": -24.31665802001953, "global_step": 191929, "epoch": 2312} {"train_loss": -24.285484313964844, "global_step": 191930, "epoch": 2312} {"train_loss": -23.994335174560547, "global_step": 191931, "epoch": 2312} {"train_loss": -23.99118995666504, "global_step": 191932, "epoch": 2312} {"train_loss": -24.194517135620117, "global_step": 191933, "epoch": 2312} {"train_loss": -24.2889347076416, "global_step": 191934, "epoch": 2312} {"train_loss": -24.16133689880371, "global_step": 191935, "epoch": 2312} {"train_loss": -24.126089096069336, "global_step": 191936, "epoch": 2312} {"train_loss": -24.337846755981445, "global_step": 191937, "epoch": 2312} {"train_loss": -23.963245391845703, "global_step": 191938, "epoch": 2312} {"train_loss": -24.13282585144043, "global_step": 191939, "epoch": 2312} {"train_loss": -23.742284774780273, "global_step": 191940, "epoch": 2312} {"train_loss": -24.194660186767578, "global_step": 191941, "epoch": 2312} {"train_loss": -24.405227661132812, "global_step": 191942, "epoch": 2312} {"train_loss": -24.140464782714844, "global_step": 191943, "epoch": 2312} {"train_loss": -24.367406845092773, "global_step": 191944, "epoch": 2312} {"train_loss": -23.877273559570312, "global_step": 191945, "epoch": 2312} {"train_loss": -24.36713409423828, "global_step": 191946, "epoch": 2312} {"train_loss": -24.33205795288086, "global_step": 191947, "epoch": 2312} {"train_loss": -24.096832275390625, "global_step": 191948, "epoch": 2312} {"train_loss": -24.20057487487793, "global_step": 191949, "epoch": 2312} {"train_loss": -24.240224838256836, "global_step": 191950, "epoch": 2312} {"train_loss": -24.18450927734375, "global_step": 191951, "epoch": 2312} {"train_loss": -24.317047119140625, "global_step": 191952, "epoch": 2312} {"train_loss": -23.86894989013672, "global_step": 191953, "epoch": 2312} {"train_loss": -24.219690322875977, "global_step": 191954, "epoch": 2312} {"train_loss": -23.98907470703125, "global_step": 191955, "epoch": 2312} {"train_loss": -24.043195724487305, "global_step": 191956, "epoch": 2312} {"train_loss": -23.618906021118164, "global_step": 191957, "epoch": 2312} {"train_loss": -23.95880699157715, "global_step": 191958, "epoch": 2312} {"train_loss": -23.99831199645996, "global_step": 191959, "epoch": 2312} {"train_loss": -23.501211166381836, "global_step": 191960, "epoch": 2312} {"train_loss": -24.03570556640625, "global_step": 191961, "epoch": 2312} {"train_loss": -23.62474250793457, "global_step": 191962, "epoch": 2312} {"train_loss": -24.095983505249023, "global_step": 191963, "epoch": 2312} {"train_loss": -23.826797485351562, "global_step": 191964, "epoch": 2312} {"train_loss": -24.171194076538086, "global_step": 191965, "epoch": 2312} {"train_loss": -24.206506729125977, "global_step": 191966, "epoch": 2312} {"train_loss": -24.058090209960938, "global_step": 191967, "epoch": 2312} {"train_loss": -23.70245933532715, "global_step": 191968, "epoch": 2312} {"train_loss": -24.17781639099121, "global_step": 191969, "epoch": 2312} {"train_loss": -23.545494079589844, "global_step": 191970, "epoch": 2312} {"train_loss": -23.826358795166016, "global_step": 191971, "epoch": 2312} {"train_loss": -24.370359420776367, "global_step": 191972, "epoch": 2312} {"train_loss": -23.89032554626465, "global_step": 191973, "epoch": 2312} {"train_loss": -24.02919578552246, "global_step": 191974, "epoch": 2312} {"train_loss": -24.079147338867188, "global_step": 191975, "epoch": 2312} {"train_loss": -24.025230407714844, "global_step": 191976, "epoch": 2312} {"train_loss": -23.971572875976562, "global_step": 191977, "epoch": 2312} {"train_loss": -23.998390979077442, "global_step": 191978, "epoch": 2312, "val_loss": 6659853.0} {"train_loss": -23.43849754333496, "global_step": 191979, "epoch": 2313} {"train_loss": -23.9215145111084, "global_step": 191980, "epoch": 2313} {"train_loss": -23.709943771362305, "global_step": 191981, "epoch": 2313} {"train_loss": -23.734943389892578, "global_step": 191982, "epoch": 2313} {"train_loss": -23.595182418823242, "global_step": 191983, "epoch": 2313} {"train_loss": -24.143478393554688, "global_step": 191984, "epoch": 2313} {"train_loss": -23.498552322387695, "global_step": 191985, "epoch": 2313} {"train_loss": -23.808088302612305, "global_step": 191986, "epoch": 2313} {"train_loss": -23.813005447387695, "global_step": 191987, "epoch": 2313} {"train_loss": -23.800460815429688, "global_step": 191988, "epoch": 2313} {"train_loss": -23.815845489501953, "global_step": 191989, "epoch": 2313} {"train_loss": -23.987150192260742, "global_step": 191990, "epoch": 2313} {"train_loss": -23.939361572265625, "global_step": 191991, "epoch": 2313} {"train_loss": -23.906551361083984, "global_step": 191992, "epoch": 2313} {"train_loss": -23.66320037841797, "global_step": 191993, "epoch": 2313} {"train_loss": -24.092676162719727, "global_step": 191994, "epoch": 2313} {"train_loss": -24.05605125427246, "global_step": 191995, "epoch": 2313} {"train_loss": -24.331769943237305, "global_step": 191996, "epoch": 2313} {"train_loss": -24.128482818603516, "global_step": 191997, "epoch": 2313} {"train_loss": -24.21120262145996, "global_step": 191998, "epoch": 2313} {"train_loss": -23.91643714904785, "global_step": 191999, "epoch": 2313} {"train_loss": -24.045719146728516, "global_step": 192000, "epoch": 2313} {"train_loss": -24.072248458862305, "global_step": 192001, "epoch": 2313} {"train_loss": -23.899333953857422, "global_step": 192002, "epoch": 2313} {"train_loss": -24.321374893188477, "global_step": 192003, "epoch": 2313} {"train_loss": -24.44318199157715, "global_step": 192004, "epoch": 2313} {"train_loss": -23.98432731628418, "global_step": 192005, "epoch": 2313} {"train_loss": -24.115373611450195, "global_step": 192006, "epoch": 2313} {"train_loss": -24.176456451416016, "global_step": 192007, "epoch": 2313} {"train_loss": -23.784406661987305, "global_step": 192008, "epoch": 2313} {"train_loss": -23.87391471862793, "global_step": 192009, "epoch": 2313} {"train_loss": -24.102087020874023, "global_step": 192010, "epoch": 2313} {"train_loss": -24.179479598999023, "global_step": 192011, "epoch": 2313} {"train_loss": -24.149555206298828, "global_step": 192012, "epoch": 2313} {"train_loss": -24.372455596923828, "global_step": 192013, "epoch": 2313} {"train_loss": -24.576126098632812, "global_step": 192014, "epoch": 2313} {"train_loss": -24.30502700805664, "global_step": 192015, "epoch": 2313} {"train_loss": -24.21917152404785, "global_step": 192016, "epoch": 2313} {"train_loss": -24.34173583984375, "global_step": 192017, "epoch": 2313} {"train_loss": -24.19148826599121, "global_step": 192018, "epoch": 2313} {"train_loss": -24.3886661529541, "global_step": 192019, "epoch": 2313} {"train_loss": -24.2740478515625, "global_step": 192020, "epoch": 2313} {"train_loss": -24.470853805541992, "global_step": 192021, "epoch": 2313} {"train_loss": -24.161954879760742, "global_step": 192022, "epoch": 2313} {"train_loss": -24.33855628967285, "global_step": 192023, "epoch": 2313} {"train_loss": -23.945384979248047, "global_step": 192024, "epoch": 2313} {"train_loss": -24.103498458862305, "global_step": 192025, "epoch": 2313} {"train_loss": -24.15289306640625, "global_step": 192026, "epoch": 2313} {"train_loss": -24.21603775024414, "global_step": 192027, "epoch": 2313} {"train_loss": -23.9852352142334, "global_step": 192028, "epoch": 2313} {"train_loss": -24.4062557220459, "global_step": 192029, "epoch": 2313} {"train_loss": -24.07417106628418, "global_step": 192030, "epoch": 2313} {"train_loss": -24.429569244384766, "global_step": 192031, "epoch": 2313} {"train_loss": -24.052417755126953, "global_step": 192032, "epoch": 2313} {"train_loss": -24.375980377197266, "global_step": 192033, "epoch": 2313} {"train_loss": -24.465017318725586, "global_step": 192034, "epoch": 2313} {"train_loss": -24.614221572875977, "global_step": 192035, "epoch": 2313} {"train_loss": -24.32093620300293, "global_step": 192036, "epoch": 2313} {"train_loss": -24.352476119995117, "global_step": 192037, "epoch": 2313} {"train_loss": -24.163896560668945, "global_step": 192038, "epoch": 2313} {"train_loss": -24.29987144470215, "global_step": 192039, "epoch": 2313} {"train_loss": -24.092975616455078, "global_step": 192040, "epoch": 2313} {"train_loss": -24.355382919311523, "global_step": 192041, "epoch": 2313} {"train_loss": -24.092702865600586, "global_step": 192042, "epoch": 2313} {"train_loss": -24.088363647460938, "global_step": 192043, "epoch": 2313} {"train_loss": -23.987112045288086, "global_step": 192044, "epoch": 2313} {"train_loss": -23.84384536743164, "global_step": 192045, "epoch": 2313} {"train_loss": -23.9575252532959, "global_step": 192046, "epoch": 2313} {"train_loss": -24.119766235351562, "global_step": 192047, "epoch": 2313} {"train_loss": -24.481945037841797, "global_step": 192048, "epoch": 2313} {"train_loss": -24.039365768432617, "global_step": 192049, "epoch": 2313} {"train_loss": -24.44283676147461, "global_step": 192050, "epoch": 2313} {"train_loss": -23.850826263427734, "global_step": 192051, "epoch": 2313} {"train_loss": -24.101430892944336, "global_step": 192052, "epoch": 2313} {"train_loss": -23.860828399658203, "global_step": 192053, "epoch": 2313} {"train_loss": -23.8732852935791, "global_step": 192054, "epoch": 2313} {"train_loss": -23.97554588317871, "global_step": 192055, "epoch": 2313} {"train_loss": -24.194517135620117, "global_step": 192056, "epoch": 2313} {"train_loss": -23.74336051940918, "global_step": 192057, "epoch": 2313} {"train_loss": -23.85178565979004, "global_step": 192058, "epoch": 2313} {"train_loss": -24.032773971557617, "global_step": 192059, "epoch": 2313} {"train_loss": -24.211421966552734, "global_step": 192060, "epoch": 2313} {"train_loss": -24.10270348514419, "global_step": 192061, "epoch": 2313, "val_loss": 6526250.0} {"train_loss": -22.698495864868164, "global_step": 192062, "epoch": 2314} {"train_loss": -23.034704208374023, "global_step": 192063, "epoch": 2314} {"train_loss": -23.03761863708496, "global_step": 192064, "epoch": 2314} {"train_loss": -23.45592498779297, "global_step": 192065, "epoch": 2314} {"train_loss": -23.26891326904297, "global_step": 192066, "epoch": 2314} {"train_loss": -23.17224884033203, "global_step": 192067, "epoch": 2314} {"train_loss": -23.648283004760742, "global_step": 192068, "epoch": 2314} {"train_loss": -22.980669021606445, "global_step": 192069, "epoch": 2314} {"train_loss": -23.715351104736328, "global_step": 192070, "epoch": 2314} {"train_loss": -23.179725646972656, "global_step": 192071, "epoch": 2314} {"train_loss": -23.246068954467773, "global_step": 192072, "epoch": 2314} {"train_loss": -23.572546005249023, "global_step": 192073, "epoch": 2314} {"train_loss": -23.56756591796875, "global_step": 192074, "epoch": 2314} {"train_loss": -23.726959228515625, "global_step": 192075, "epoch": 2314} {"train_loss": -23.563644409179688, "global_step": 192076, "epoch": 2314} {"train_loss": -23.574140548706055, "global_step": 192077, "epoch": 2314} {"train_loss": -23.838939666748047, "global_step": 192078, "epoch": 2314} {"train_loss": -23.831668853759766, "global_step": 192079, "epoch": 2314} {"train_loss": -23.858083724975586, "global_step": 192080, "epoch": 2314} {"train_loss": -23.987668991088867, "global_step": 192081, "epoch": 2314} {"train_loss": -23.638654708862305, "global_step": 192082, "epoch": 2314} {"train_loss": -24.209896087646484, "global_step": 192083, "epoch": 2314} {"train_loss": -24.121078491210938, "global_step": 192084, "epoch": 2314} {"train_loss": -24.176156997680664, "global_step": 192085, "epoch": 2314} {"train_loss": -24.023990631103516, "global_step": 192086, "epoch": 2314} {"train_loss": -24.051321029663086, "global_step": 192087, "epoch": 2314} {"train_loss": -23.596689224243164, "global_step": 192088, "epoch": 2314} {"train_loss": -23.57317543029785, "global_step": 192089, "epoch": 2314} {"train_loss": -23.882780075073242, "global_step": 192090, "epoch": 2314} {"train_loss": -23.80010986328125, "global_step": 192091, "epoch": 2314} {"train_loss": -23.963489532470703, "global_step": 192092, "epoch": 2314} {"train_loss": -24.115259170532227, "global_step": 192093, "epoch": 2314} {"train_loss": -23.700803756713867, "global_step": 192094, "epoch": 2314} {"train_loss": -24.268199920654297, "global_step": 192095, "epoch": 2314} {"train_loss": -23.98440933227539, "global_step": 192096, "epoch": 2314} {"train_loss": -24.046951293945312, "global_step": 192097, "epoch": 2314} {"train_loss": -24.277746200561523, "global_step": 192098, "epoch": 2314} {"train_loss": -24.064376831054688, "global_step": 192099, "epoch": 2314} {"train_loss": -24.010833740234375, "global_step": 192100, "epoch": 2314} {"train_loss": -23.861825942993164, "global_step": 192101, "epoch": 2314} {"train_loss": -24.248022079467773, "global_step": 192102, "epoch": 2314} {"train_loss": -23.823400497436523, "global_step": 192103, "epoch": 2314} {"train_loss": -23.89598846435547, "global_step": 192104, "epoch": 2314} {"train_loss": -23.92671012878418, "global_step": 192105, "epoch": 2314} {"train_loss": -24.05849266052246, "global_step": 192106, "epoch": 2314} {"train_loss": -23.926597595214844, "global_step": 192107, "epoch": 2314} {"train_loss": -24.115201950073242, "global_step": 192108, "epoch": 2314} {"train_loss": -23.997066497802734, "global_step": 192109, "epoch": 2314} {"train_loss": -24.31216812133789, "global_step": 192110, "epoch": 2314} {"train_loss": -24.214712142944336, "global_step": 192111, "epoch": 2314} {"train_loss": -24.054344177246094, "global_step": 192112, "epoch": 2314} {"train_loss": -24.03973960876465, "global_step": 192113, "epoch": 2314} {"train_loss": -24.231863021850586, "global_step": 192114, "epoch": 2314} {"train_loss": -24.4149169921875, "global_step": 192115, "epoch": 2314} {"train_loss": -24.00516700744629, "global_step": 192116, "epoch": 2314} {"train_loss": -24.100894927978516, "global_step": 192117, "epoch": 2314} {"train_loss": -24.375545501708984, "global_step": 192118, "epoch": 2314} {"train_loss": -24.045963287353516, "global_step": 192119, "epoch": 2314} {"train_loss": -24.29673194885254, "global_step": 192120, "epoch": 2314} {"train_loss": -24.287769317626953, "global_step": 192121, "epoch": 2314} {"train_loss": -24.09261131286621, "global_step": 192122, "epoch": 2314} {"train_loss": -23.830341339111328, "global_step": 192123, "epoch": 2314} {"train_loss": -24.317554473876953, "global_step": 192124, "epoch": 2314} {"train_loss": -24.482797622680664, "global_step": 192125, "epoch": 2314} {"train_loss": -24.240131378173828, "global_step": 192126, "epoch": 2314} {"train_loss": -24.1457462310791, "global_step": 192127, "epoch": 2314} {"train_loss": -24.281652450561523, "global_step": 192128, "epoch": 2314} {"train_loss": -24.105304718017578, "global_step": 192129, "epoch": 2314} {"train_loss": -23.900279998779297, "global_step": 192130, "epoch": 2314} {"train_loss": -24.17963981628418, "global_step": 192131, "epoch": 2314} {"train_loss": -24.098962783813477, "global_step": 192132, "epoch": 2314} {"train_loss": -23.976287841796875, "global_step": 192133, "epoch": 2314} {"train_loss": -23.91472816467285, "global_step": 192134, "epoch": 2314} {"train_loss": -24.045597076416016, "global_step": 192135, "epoch": 2314} {"train_loss": -23.99285316467285, "global_step": 192136, "epoch": 2314} {"train_loss": -24.098405838012695, "global_step": 192137, "epoch": 2314} {"train_loss": -24.323720932006836, "global_step": 192138, "epoch": 2314} {"train_loss": -23.8348445892334, "global_step": 192139, "epoch": 2314} {"train_loss": -23.623510360717773, "global_step": 192140, "epoch": 2314} {"train_loss": -24.007736206054688, "global_step": 192141, "epoch": 2314} {"train_loss": -23.995397567749023, "global_step": 192142, "epoch": 2314} {"train_loss": -24.264135360717773, "global_step": 192143, "epoch": 2314} {"train_loss": -23.919182788894837, "global_step": 192144, "epoch": 2314, "val_loss": 6482656.0} {"train_loss": -23.704065322875977, "global_step": 192145, "epoch": 2315} {"train_loss": -23.20835304260254, "global_step": 192146, "epoch": 2315} {"train_loss": -23.575193405151367, "global_step": 192147, "epoch": 2315} {"train_loss": -23.469146728515625, "global_step": 192148, "epoch": 2315} {"train_loss": -23.286142349243164, "global_step": 192149, "epoch": 2315} {"train_loss": -23.4263916015625, "global_step": 192150, "epoch": 2315} {"train_loss": -23.627655029296875, "global_step": 192151, "epoch": 2315} {"train_loss": -23.794065475463867, "global_step": 192152, "epoch": 2315} {"train_loss": -24.106517791748047, "global_step": 192153, "epoch": 2315} {"train_loss": -23.655887603759766, "global_step": 192154, "epoch": 2315} {"train_loss": -23.747406005859375, "global_step": 192155, "epoch": 2315} {"train_loss": -24.183311462402344, "global_step": 192156, "epoch": 2315} {"train_loss": -23.56198501586914, "global_step": 192157, "epoch": 2315} {"train_loss": -24.032691955566406, "global_step": 192158, "epoch": 2315} {"train_loss": -23.658414840698242, "global_step": 192159, "epoch": 2315} {"train_loss": -23.69582176208496, "global_step": 192160, "epoch": 2315} {"train_loss": -23.604019165039062, "global_step": 192161, "epoch": 2315} {"train_loss": -23.600465774536133, "global_step": 192162, "epoch": 2315} {"train_loss": -24.06012725830078, "global_step": 192163, "epoch": 2315} {"train_loss": -23.874147415161133, "global_step": 192164, "epoch": 2315} {"train_loss": -23.8089542388916, "global_step": 192165, "epoch": 2315} {"train_loss": -24.087308883666992, "global_step": 192166, "epoch": 2315} {"train_loss": -23.73884391784668, "global_step": 192167, "epoch": 2315} {"train_loss": -23.96095848083496, "global_step": 192168, "epoch": 2315} {"train_loss": -24.239362716674805, "global_step": 192169, "epoch": 2315} {"train_loss": -23.97818374633789, "global_step": 192170, "epoch": 2315} {"train_loss": -24.110816955566406, "global_step": 192171, "epoch": 2315} {"train_loss": -23.86041259765625, "global_step": 192172, "epoch": 2315} {"train_loss": -24.356815338134766, "global_step": 192173, "epoch": 2315} {"train_loss": -24.026901245117188, "global_step": 192174, "epoch": 2315} {"train_loss": -24.253887176513672, "global_step": 192175, "epoch": 2315} {"train_loss": -24.091934204101562, "global_step": 192176, "epoch": 2315} {"train_loss": -24.026323318481445, "global_step": 192177, "epoch": 2315} {"train_loss": -24.23421287536621, "global_step": 192178, "epoch": 2315} {"train_loss": -24.350820541381836, "global_step": 192179, "epoch": 2315} {"train_loss": -24.282453536987305, "global_step": 192180, "epoch": 2315} {"train_loss": -24.143125534057617, "global_step": 192181, "epoch": 2315} {"train_loss": -24.602956771850586, "global_step": 192182, "epoch": 2315} {"train_loss": -24.067296981811523, "global_step": 192183, "epoch": 2315} {"train_loss": -24.265987396240234, "global_step": 192184, "epoch": 2315} {"train_loss": -24.2161808013916, "global_step": 192185, "epoch": 2315} {"train_loss": -23.796527862548828, "global_step": 192186, "epoch": 2315} {"train_loss": -24.106603622436523, "global_step": 192187, "epoch": 2315} {"train_loss": -24.048315048217773, "global_step": 192188, "epoch": 2315} {"train_loss": -24.002944946289062, "global_step": 192189, "epoch": 2315} {"train_loss": -23.831844329833984, "global_step": 192190, "epoch": 2315} {"train_loss": -24.017324447631836, "global_step": 192191, "epoch": 2315} {"train_loss": -24.220718383789062, "global_step": 192192, "epoch": 2315} {"train_loss": -23.509031295776367, "global_step": 192193, "epoch": 2315} {"train_loss": -24.05228614807129, "global_step": 192194, "epoch": 2315} {"train_loss": -24.084980010986328, "global_step": 192195, "epoch": 2315} {"train_loss": -23.892669677734375, "global_step": 192196, "epoch": 2315} {"train_loss": -24.1005802154541, "global_step": 192197, "epoch": 2315} {"train_loss": -23.93779945373535, "global_step": 192198, "epoch": 2315} {"train_loss": -24.29426383972168, "global_step": 192199, "epoch": 2315} {"train_loss": -23.86094856262207, "global_step": 192200, "epoch": 2315} {"train_loss": -24.376182556152344, "global_step": 192201, "epoch": 2315} {"train_loss": -23.990339279174805, "global_step": 192202, "epoch": 2315} {"train_loss": -24.298419952392578, "global_step": 192203, "epoch": 2315} {"train_loss": -23.901626586914062, "global_step": 192204, "epoch": 2315} {"train_loss": -24.171192169189453, "global_step": 192205, "epoch": 2315} {"train_loss": -23.823755264282227, "global_step": 192206, "epoch": 2315} {"train_loss": -24.256418228149414, "global_step": 192207, "epoch": 2315} {"train_loss": -23.7255802154541, "global_step": 192208, "epoch": 2315} {"train_loss": -24.146451950073242, "global_step": 192209, "epoch": 2315} {"train_loss": -24.183696746826172, "global_step": 192210, "epoch": 2315} {"train_loss": -23.457117080688477, "global_step": 192211, "epoch": 2315} {"train_loss": -24.24692153930664, "global_step": 192212, "epoch": 2315} {"train_loss": -24.499141693115234, "global_step": 192213, "epoch": 2315} {"train_loss": -23.94990348815918, "global_step": 192214, "epoch": 2315} {"train_loss": -24.047466278076172, "global_step": 192215, "epoch": 2315} {"train_loss": -23.908374786376953, "global_step": 192216, "epoch": 2315} {"train_loss": -23.896610260009766, "global_step": 192217, "epoch": 2315} {"train_loss": -24.058300018310547, "global_step": 192218, "epoch": 2315} {"train_loss": -23.870519638061523, "global_step": 192219, "epoch": 2315} {"train_loss": -24.035593032836914, "global_step": 192220, "epoch": 2315} {"train_loss": -24.032730102539062, "global_step": 192221, "epoch": 2315} {"train_loss": -23.977746963500977, "global_step": 192222, "epoch": 2315} {"train_loss": -23.703048706054688, "global_step": 192223, "epoch": 2315} {"train_loss": -24.44287109375, "global_step": 192224, "epoch": 2315} {"train_loss": -23.929624557495117, "global_step": 192225, "epoch": 2315} {"train_loss": -24.031309127807617, "global_step": 192226, "epoch": 2315} {"train_loss": -23.963515660848962, "global_step": 192227, "epoch": 2315, "val_loss": 6514785.5} {"train_loss": -23.22566795349121, "global_step": 192228, "epoch": 2316} {"train_loss": -24.1216983795166, "global_step": 192229, "epoch": 2316} {"train_loss": -23.17218589782715, "global_step": 192230, "epoch": 2316} {"train_loss": -23.384689331054688, "global_step": 192231, "epoch": 2316} {"train_loss": -23.697946548461914, "global_step": 192232, "epoch": 2316} {"train_loss": -23.6811580657959, "global_step": 192233, "epoch": 2316} {"train_loss": -23.683908462524414, "global_step": 192234, "epoch": 2316} {"train_loss": -23.447534561157227, "global_step": 192235, "epoch": 2316} {"train_loss": -24.202375411987305, "global_step": 192236, "epoch": 2316} {"train_loss": -23.668975830078125, "global_step": 192237, "epoch": 2316} {"train_loss": -23.657228469848633, "global_step": 192238, "epoch": 2316} {"train_loss": -24.259613037109375, "global_step": 192239, "epoch": 2316} {"train_loss": -23.82234764099121, "global_step": 192240, "epoch": 2316} {"train_loss": -23.686071395874023, "global_step": 192241, "epoch": 2316} {"train_loss": -23.983413696289062, "global_step": 192242, "epoch": 2316} {"train_loss": -24.289899826049805, "global_step": 192243, "epoch": 2316} {"train_loss": -23.901103973388672, "global_step": 192244, "epoch": 2316} {"train_loss": -23.89767837524414, "global_step": 192245, "epoch": 2316} {"train_loss": -24.15557289123535, "global_step": 192246, "epoch": 2316} {"train_loss": -23.63655662536621, "global_step": 192247, "epoch": 2316} {"train_loss": -23.913698196411133, "global_step": 192248, "epoch": 2316} {"train_loss": -23.77723503112793, "global_step": 192249, "epoch": 2316} {"train_loss": -24.154504776000977, "global_step": 192250, "epoch": 2316} {"train_loss": -24.22589111328125, "global_step": 192251, "epoch": 2316} {"train_loss": -24.43641471862793, "global_step": 192252, "epoch": 2316} {"train_loss": -24.410078048706055, "global_step": 192253, "epoch": 2316} {"train_loss": -24.321979522705078, "global_step": 192254, "epoch": 2316} {"train_loss": -24.46902084350586, "global_step": 192255, "epoch": 2316} {"train_loss": -24.42521095275879, "global_step": 192256, "epoch": 2316} {"train_loss": -24.218076705932617, "global_step": 192257, "epoch": 2316} {"train_loss": -24.42351531982422, "global_step": 192258, "epoch": 2316} {"train_loss": -24.03716468811035, "global_step": 192259, "epoch": 2316} {"train_loss": -24.092758178710938, "global_step": 192260, "epoch": 2316} {"train_loss": -24.378049850463867, "global_step": 192261, "epoch": 2316} {"train_loss": -24.41860008239746, "global_step": 192262, "epoch": 2316} {"train_loss": -24.36042594909668, "global_step": 192263, "epoch": 2316} {"train_loss": -24.094806671142578, "global_step": 192264, "epoch": 2316} {"train_loss": -24.49729347229004, "global_step": 192265, "epoch": 2316} {"train_loss": -24.647146224975586, "global_step": 192266, "epoch": 2316} {"train_loss": -24.35514259338379, "global_step": 192267, "epoch": 2316} {"train_loss": -24.053293228149414, "global_step": 192268, "epoch": 2316} {"train_loss": -24.228849411010742, "global_step": 192269, "epoch": 2316} {"train_loss": -23.794906616210938, "global_step": 192270, "epoch": 2316} {"train_loss": -24.143695831298828, "global_step": 192271, "epoch": 2316} {"train_loss": -23.65250015258789, "global_step": 192272, "epoch": 2316} {"train_loss": -24.245464324951172, "global_step": 192273, "epoch": 2316} {"train_loss": -24.09564781188965, "global_step": 192274, "epoch": 2316} {"train_loss": -24.023895263671875, "global_step": 192275, "epoch": 2316} {"train_loss": -23.781705856323242, "global_step": 192276, "epoch": 2316} {"train_loss": -24.190574645996094, "global_step": 192277, "epoch": 2316} {"train_loss": -24.06959342956543, "global_step": 192278, "epoch": 2316} {"train_loss": -24.151411056518555, "global_step": 192279, "epoch": 2316} {"train_loss": -24.003816604614258, "global_step": 192280, "epoch": 2316} {"train_loss": -24.041080474853516, "global_step": 192281, "epoch": 2316} {"train_loss": -23.96978187561035, "global_step": 192282, "epoch": 2316} {"train_loss": -24.06553840637207, "global_step": 192283, "epoch": 2316} {"train_loss": -23.833576202392578, "global_step": 192284, "epoch": 2316} {"train_loss": -24.40780258178711, "global_step": 192285, "epoch": 2316} {"train_loss": -24.0572452545166, "global_step": 192286, "epoch": 2316} {"train_loss": -23.90016746520996, "global_step": 192287, "epoch": 2316} {"train_loss": -23.942398071289062, "global_step": 192288, "epoch": 2316} {"train_loss": -24.242551803588867, "global_step": 192289, "epoch": 2316} {"train_loss": -23.864871978759766, "global_step": 192290, "epoch": 2316} {"train_loss": -24.35292625427246, "global_step": 192291, "epoch": 2316} {"train_loss": -24.57305908203125, "global_step": 192292, "epoch": 2316} {"train_loss": -24.05426025390625, "global_step": 192293, "epoch": 2316} {"train_loss": -24.398868560791016, "global_step": 192294, "epoch": 2316} {"train_loss": -23.981168746948242, "global_step": 192295, "epoch": 2316} {"train_loss": -24.079269409179688, "global_step": 192296, "epoch": 2316} {"train_loss": -24.263092041015625, "global_step": 192297, "epoch": 2316} {"train_loss": -24.306806564331055, "global_step": 192298, "epoch": 2316} {"train_loss": -24.226728439331055, "global_step": 192299, "epoch": 2316} {"train_loss": -23.91653823852539, "global_step": 192300, "epoch": 2316} {"train_loss": -24.437744140625, "global_step": 192301, "epoch": 2316} {"train_loss": -24.240510940551758, "global_step": 192302, "epoch": 2316} {"train_loss": -24.331771850585938, "global_step": 192303, "epoch": 2316} {"train_loss": -23.998807907104492, "global_step": 192304, "epoch": 2316} {"train_loss": -24.109464645385742, "global_step": 192305, "epoch": 2316} {"train_loss": -24.424097061157227, "global_step": 192306, "epoch": 2316} {"train_loss": -24.165197372436523, "global_step": 192307, "epoch": 2316} {"train_loss": -24.255643844604492, "global_step": 192308, "epoch": 2316} {"train_loss": -24.058740615844727, "global_step": 192309, "epoch": 2316} {"train_loss": -24.066654894725385, "global_step": 192310, "epoch": 2316, "val_loss": 6382356.0} {"train_loss": -23.347667694091797, "global_step": 192311, "epoch": 2317} {"train_loss": -23.43193244934082, "global_step": 192312, "epoch": 2317} {"train_loss": -23.67608642578125, "global_step": 192313, "epoch": 2317} {"train_loss": -23.286052703857422, "global_step": 192314, "epoch": 2317} {"train_loss": -23.55860137939453, "global_step": 192315, "epoch": 2317} {"train_loss": -23.4554443359375, "global_step": 192316, "epoch": 2317} {"train_loss": -23.284183502197266, "global_step": 192317, "epoch": 2317} {"train_loss": -23.550291061401367, "global_step": 192318, "epoch": 2317} {"train_loss": -23.97359275817871, "global_step": 192319, "epoch": 2317} {"train_loss": -23.691495895385742, "global_step": 192320, "epoch": 2317} {"train_loss": -23.602956771850586, "global_step": 192321, "epoch": 2317} {"train_loss": -23.730024337768555, "global_step": 192322, "epoch": 2317} {"train_loss": -23.974760055541992, "global_step": 192323, "epoch": 2317} {"train_loss": -23.57570457458496, "global_step": 192324, "epoch": 2317} {"train_loss": -23.701276779174805, "global_step": 192325, "epoch": 2317} {"train_loss": -23.818754196166992, "global_step": 192326, "epoch": 2317} {"train_loss": -23.993215560913086, "global_step": 192327, "epoch": 2317} {"train_loss": -24.118566513061523, "global_step": 192328, "epoch": 2317} {"train_loss": -23.86520767211914, "global_step": 192329, "epoch": 2317} {"train_loss": -23.798721313476562, "global_step": 192330, "epoch": 2317} {"train_loss": -23.913726806640625, "global_step": 192331, "epoch": 2317} {"train_loss": -24.213354110717773, "global_step": 192332, "epoch": 2317} {"train_loss": -23.93729591369629, "global_step": 192333, "epoch": 2317} {"train_loss": -24.114633560180664, "global_step": 192334, "epoch": 2317} {"train_loss": -23.91751480102539, "global_step": 192335, "epoch": 2317} {"train_loss": -24.369749069213867, "global_step": 192336, "epoch": 2317} {"train_loss": -23.845151901245117, "global_step": 192337, "epoch": 2317} {"train_loss": -24.388635635375977, "global_step": 192338, "epoch": 2317} {"train_loss": -24.240564346313477, "global_step": 192339, "epoch": 2317} {"train_loss": -23.757871627807617, "global_step": 192340, "epoch": 2317} {"train_loss": -23.976627349853516, "global_step": 192341, "epoch": 2317} {"train_loss": -24.342864990234375, "global_step": 192342, "epoch": 2317} {"train_loss": -24.141098022460938, "global_step": 192343, "epoch": 2317} {"train_loss": -24.241596221923828, "global_step": 192344, "epoch": 2317} {"train_loss": -24.0117130279541, "global_step": 192345, "epoch": 2317} {"train_loss": -24.232994079589844, "global_step": 192346, "epoch": 2317} {"train_loss": -24.30671501159668, "global_step": 192347, "epoch": 2317} {"train_loss": -24.19865608215332, "global_step": 192348, "epoch": 2317} {"train_loss": -23.89140510559082, "global_step": 192349, "epoch": 2317} {"train_loss": -23.688968658447266, "global_step": 192350, "epoch": 2317} {"train_loss": -24.35784339904785, "global_step": 192351, "epoch": 2317} {"train_loss": -23.938947677612305, "global_step": 192352, "epoch": 2317} {"train_loss": -24.167551040649414, "global_step": 192353, "epoch": 2317} {"train_loss": -24.271390914916992, "global_step": 192354, "epoch": 2317} {"train_loss": -24.382177352905273, "global_step": 192355, "epoch": 2317} {"train_loss": -24.173181533813477, "global_step": 192356, "epoch": 2317} {"train_loss": -24.32162857055664, "global_step": 192357, "epoch": 2317} {"train_loss": -24.116308212280273, "global_step": 192358, "epoch": 2317} {"train_loss": -24.17877769470215, "global_step": 192359, "epoch": 2317} {"train_loss": -23.70558738708496, "global_step": 192360, "epoch": 2317} {"train_loss": -24.08631706237793, "global_step": 192361, "epoch": 2317} {"train_loss": -23.8815860748291, "global_step": 192362, "epoch": 2317} {"train_loss": -24.284194946289062, "global_step": 192363, "epoch": 2317} {"train_loss": -24.142433166503906, "global_step": 192364, "epoch": 2317} {"train_loss": -24.410436630249023, "global_step": 192365, "epoch": 2317} {"train_loss": -24.4488468170166, "global_step": 192366, "epoch": 2317} {"train_loss": -23.83791160583496, "global_step": 192367, "epoch": 2317} {"train_loss": -24.096973419189453, "global_step": 192368, "epoch": 2317} {"train_loss": -24.138208389282227, "global_step": 192369, "epoch": 2317} {"train_loss": -23.99300193786621, "global_step": 192370, "epoch": 2317} {"train_loss": -24.347309112548828, "global_step": 192371, "epoch": 2317} {"train_loss": -24.302978515625, "global_step": 192372, "epoch": 2317} {"train_loss": -24.39197540283203, "global_step": 192373, "epoch": 2317} {"train_loss": -24.532201766967773, "global_step": 192374, "epoch": 2317} {"train_loss": -24.21170425415039, "global_step": 192375, "epoch": 2317} {"train_loss": -24.247100830078125, "global_step": 192376, "epoch": 2317} {"train_loss": -24.540475845336914, "global_step": 192377, "epoch": 2317} {"train_loss": -24.11412811279297, "global_step": 192378, "epoch": 2317} {"train_loss": -24.152217864990234, "global_step": 192379, "epoch": 2317} {"train_loss": -24.473737716674805, "global_step": 192380, "epoch": 2317} {"train_loss": -24.095457077026367, "global_step": 192381, "epoch": 2317} {"train_loss": -24.172544479370117, "global_step": 192382, "epoch": 2317} {"train_loss": -24.22055435180664, "global_step": 192383, "epoch": 2317} {"train_loss": -24.436635971069336, "global_step": 192384, "epoch": 2317} {"train_loss": -24.47263526916504, "global_step": 192385, "epoch": 2317} {"train_loss": -24.351266860961914, "global_step": 192386, "epoch": 2317} {"train_loss": -24.175825119018555, "global_step": 192387, "epoch": 2317} {"train_loss": -24.244592666625977, "global_step": 192388, "epoch": 2317} {"train_loss": -24.360309600830078, "global_step": 192389, "epoch": 2317} {"train_loss": -24.392059326171875, "global_step": 192390, "epoch": 2317} {"train_loss": -24.45256805419922, "global_step": 192391, "epoch": 2317} {"train_loss": -24.131023406982422, "global_step": 192392, "epoch": 2317} {"train_loss": -24.060788143112, "global_step": 192393, "epoch": 2317, "val_loss": 6515804.5} {"train_loss": -23.873310089111328, "global_step": 192394, "epoch": 2318} {"train_loss": -23.963077545166016, "global_step": 192395, "epoch": 2318} {"train_loss": -23.858154296875, "global_step": 192396, "epoch": 2318} {"train_loss": -23.54226303100586, "global_step": 192397, "epoch": 2318} {"train_loss": -23.482913970947266, "global_step": 192398, "epoch": 2318} {"train_loss": -23.794586181640625, "global_step": 192399, "epoch": 2318} {"train_loss": -24.2312068939209, "global_step": 192400, "epoch": 2318} {"train_loss": -23.925189971923828, "global_step": 192401, "epoch": 2318} {"train_loss": -23.96624183654785, "global_step": 192402, "epoch": 2318} {"train_loss": -24.18951416015625, "global_step": 192403, "epoch": 2318} {"train_loss": -24.153358459472656, "global_step": 192404, "epoch": 2318} {"train_loss": -23.80470085144043, "global_step": 192405, "epoch": 2318} {"train_loss": -24.051910400390625, "global_step": 192406, "epoch": 2318} {"train_loss": -24.180587768554688, "global_step": 192407, "epoch": 2318} {"train_loss": -23.570863723754883, "global_step": 192408, "epoch": 2318} {"train_loss": -23.833086013793945, "global_step": 192409, "epoch": 2318} {"train_loss": -24.18001937866211, "global_step": 192410, "epoch": 2318} {"train_loss": -23.8403377532959, "global_step": 192411, "epoch": 2318} {"train_loss": -24.259363174438477, "global_step": 192412, "epoch": 2318} {"train_loss": -23.963973999023438, "global_step": 192413, "epoch": 2318} {"train_loss": -24.279661178588867, "global_step": 192414, "epoch": 2318} {"train_loss": -24.047515869140625, "global_step": 192415, "epoch": 2318} {"train_loss": -24.088459014892578, "global_step": 192416, "epoch": 2318} {"train_loss": -24.269489288330078, "global_step": 192417, "epoch": 2318} {"train_loss": -24.21159553527832, "global_step": 192418, "epoch": 2318} {"train_loss": -24.288022994995117, "global_step": 192419, "epoch": 2318} {"train_loss": -24.322296142578125, "global_step": 192420, "epoch": 2318} {"train_loss": -24.359743118286133, "global_step": 192421, "epoch": 2318} {"train_loss": -23.795103073120117, "global_step": 192422, "epoch": 2318} {"train_loss": -24.12348747253418, "global_step": 192423, "epoch": 2318} {"train_loss": -24.530656814575195, "global_step": 192424, "epoch": 2318} {"train_loss": -24.192039489746094, "global_step": 192425, "epoch": 2318} {"train_loss": -24.512388229370117, "global_step": 192426, "epoch": 2318} {"train_loss": -24.175907135009766, "global_step": 192427, "epoch": 2318} {"train_loss": -23.851259231567383, "global_step": 192428, "epoch": 2318} {"train_loss": -23.915082931518555, "global_step": 192429, "epoch": 2318} {"train_loss": -24.083044052124023, "global_step": 192430, "epoch": 2318} {"train_loss": -23.800537109375, "global_step": 192431, "epoch": 2318} {"train_loss": -23.838979721069336, "global_step": 192432, "epoch": 2318} {"train_loss": -23.473251342773438, "global_step": 192433, "epoch": 2318} {"train_loss": -23.82985496520996, "global_step": 192434, "epoch": 2318} {"train_loss": -23.608509063720703, "global_step": 192435, "epoch": 2318} {"train_loss": -23.959552764892578, "global_step": 192436, "epoch": 2318} {"train_loss": -23.76287078857422, "global_step": 192437, "epoch": 2318} {"train_loss": -24.326078414916992, "global_step": 192438, "epoch": 2318} {"train_loss": -23.829986572265625, "global_step": 192439, "epoch": 2318} {"train_loss": -23.820878982543945, "global_step": 192440, "epoch": 2318} {"train_loss": -23.71224021911621, "global_step": 192441, "epoch": 2318} {"train_loss": -24.17799949645996, "global_step": 192442, "epoch": 2318} {"train_loss": -24.189590454101562, "global_step": 192443, "epoch": 2318} {"train_loss": -24.17414665222168, "global_step": 192444, "epoch": 2318} {"train_loss": -23.766929626464844, "global_step": 192445, "epoch": 2318} {"train_loss": -24.181005477905273, "global_step": 192446, "epoch": 2318} {"train_loss": -23.90741539001465, "global_step": 192447, "epoch": 2318} {"train_loss": -23.926889419555664, "global_step": 192448, "epoch": 2318} {"train_loss": -24.221988677978516, "global_step": 192449, "epoch": 2318} {"train_loss": -23.740604400634766, "global_step": 192450, "epoch": 2318} {"train_loss": -24.29865074157715, "global_step": 192451, "epoch": 2318} {"train_loss": -23.821409225463867, "global_step": 192452, "epoch": 2318} {"train_loss": -24.490577697753906, "global_step": 192453, "epoch": 2318} {"train_loss": -23.895727157592773, "global_step": 192454, "epoch": 2318} {"train_loss": -24.235782623291016, "global_step": 192455, "epoch": 2318} {"train_loss": -23.854598999023438, "global_step": 192456, "epoch": 2318} {"train_loss": -24.060148239135742, "global_step": 192457, "epoch": 2318} {"train_loss": -24.31727409362793, "global_step": 192458, "epoch": 2318} {"train_loss": -24.31068992614746, "global_step": 192459, "epoch": 2318} {"train_loss": -24.072349548339844, "global_step": 192460, "epoch": 2318} {"train_loss": -24.354360580444336, "global_step": 192461, "epoch": 2318} {"train_loss": -24.32403564453125, "global_step": 192462, "epoch": 2318} {"train_loss": -24.22883415222168, "global_step": 192463, "epoch": 2318} {"train_loss": -24.334177017211914, "global_step": 192464, "epoch": 2318} {"train_loss": -24.058124542236328, "global_step": 192465, "epoch": 2318} {"train_loss": -24.346097946166992, "global_step": 192466, "epoch": 2318} {"train_loss": -24.18617057800293, "global_step": 192467, "epoch": 2318} {"train_loss": -24.089603424072266, "global_step": 192468, "epoch": 2318} {"train_loss": -24.681228637695312, "global_step": 192469, "epoch": 2318} {"train_loss": -24.077041625976562, "global_step": 192470, "epoch": 2318} {"train_loss": -23.673503875732422, "global_step": 192471, "epoch": 2318} {"train_loss": -24.174198150634766, "global_step": 192472, "epoch": 2318} {"train_loss": -23.807514190673828, "global_step": 192473, "epoch": 2318} {"train_loss": -23.791418075561523, "global_step": 192474, "epoch": 2318} {"train_loss": -23.93155288696289, "global_step": 192475, "epoch": 2318} {"train_loss": -24.054714065000237, "global_step": 192476, "epoch": 2318, "val_loss": 6616619.0} {"train_loss": -21.675342559814453, "global_step": 192477, "epoch": 2319} {"train_loss": -23.06015396118164, "global_step": 192478, "epoch": 2319} {"train_loss": -22.821897506713867, "global_step": 192479, "epoch": 2319} {"train_loss": -23.041114807128906, "global_step": 192480, "epoch": 2319} {"train_loss": -23.128538131713867, "global_step": 192481, "epoch": 2319} {"train_loss": -23.199148178100586, "global_step": 192482, "epoch": 2319} {"train_loss": -23.219783782958984, "global_step": 192483, "epoch": 2319} {"train_loss": -23.082250595092773, "global_step": 192484, "epoch": 2319} {"train_loss": -23.56979751586914, "global_step": 192485, "epoch": 2319} {"train_loss": -23.564661026000977, "global_step": 192486, "epoch": 2319} {"train_loss": -23.484766006469727, "global_step": 192487, "epoch": 2319} {"train_loss": -23.556543350219727, "global_step": 192488, "epoch": 2319} {"train_loss": -23.571067810058594, "global_step": 192489, "epoch": 2319} {"train_loss": -23.501699447631836, "global_step": 192490, "epoch": 2319} {"train_loss": -23.989944458007812, "global_step": 192491, "epoch": 2319} {"train_loss": -23.092933654785156, "global_step": 192492, "epoch": 2319} {"train_loss": -23.521575927734375, "global_step": 192493, "epoch": 2319} {"train_loss": -23.37909698486328, "global_step": 192494, "epoch": 2319} {"train_loss": -23.4610595703125, "global_step": 192495, "epoch": 2319} {"train_loss": -23.81300163269043, "global_step": 192496, "epoch": 2319} {"train_loss": -23.488483428955078, "global_step": 192497, "epoch": 2319} {"train_loss": -23.96124267578125, "global_step": 192498, "epoch": 2319} {"train_loss": -23.47712516784668, "global_step": 192499, "epoch": 2319} {"train_loss": -23.991174697875977, "global_step": 192500, "epoch": 2319} {"train_loss": -24.017154693603516, "global_step": 192501, "epoch": 2319} {"train_loss": -23.764463424682617, "global_step": 192502, "epoch": 2319} {"train_loss": -24.0072078704834, "global_step": 192503, "epoch": 2319} {"train_loss": -23.82317543029785, "global_step": 192504, "epoch": 2319} {"train_loss": -23.887413024902344, "global_step": 192505, "epoch": 2319} {"train_loss": -23.9785099029541, "global_step": 192506, "epoch": 2319} {"train_loss": -24.014982223510742, "global_step": 192507, "epoch": 2319} {"train_loss": -23.814176559448242, "global_step": 192508, "epoch": 2319} {"train_loss": -23.987995147705078, "global_step": 192509, "epoch": 2319} {"train_loss": -23.96184730529785, "global_step": 192510, "epoch": 2319} {"train_loss": -23.988998413085938, "global_step": 192511, "epoch": 2319} {"train_loss": -23.896440505981445, "global_step": 192512, "epoch": 2319} {"train_loss": -24.325849533081055, "global_step": 192513, "epoch": 2319} {"train_loss": -24.023681640625, "global_step": 192514, "epoch": 2319} {"train_loss": -24.227313995361328, "global_step": 192515, "epoch": 2319} {"train_loss": -24.206924438476562, "global_step": 192516, "epoch": 2319} {"train_loss": -24.2281494140625, "global_step": 192517, "epoch": 2319} {"train_loss": -23.931455612182617, "global_step": 192518, "epoch": 2319} {"train_loss": -23.706289291381836, "global_step": 192519, "epoch": 2319} {"train_loss": -24.02239990234375, "global_step": 192520, "epoch": 2319} {"train_loss": -24.226377487182617, "global_step": 192521, "epoch": 2319} {"train_loss": -24.3335018157959, "global_step": 192522, "epoch": 2319} {"train_loss": -24.163442611694336, "global_step": 192523, "epoch": 2319} {"train_loss": -24.135169982910156, "global_step": 192524, "epoch": 2319} {"train_loss": -24.000532150268555, "global_step": 192525, "epoch": 2319} {"train_loss": -24.245479583740234, "global_step": 192526, "epoch": 2319} {"train_loss": -24.035327911376953, "global_step": 192527, "epoch": 2319} {"train_loss": -24.304458618164062, "global_step": 192528, "epoch": 2319} {"train_loss": -24.435985565185547, "global_step": 192529, "epoch": 2319} {"train_loss": -24.225643157958984, "global_step": 192530, "epoch": 2319} {"train_loss": -24.3385009765625, "global_step": 192531, "epoch": 2319} {"train_loss": -23.838214874267578, "global_step": 192532, "epoch": 2319} {"train_loss": -24.155542373657227, "global_step": 192533, "epoch": 2319} {"train_loss": -24.206771850585938, "global_step": 192534, "epoch": 2319} {"train_loss": -24.757083892822266, "global_step": 192535, "epoch": 2319} {"train_loss": -23.81340980529785, "global_step": 192536, "epoch": 2319} {"train_loss": -24.282175064086914, "global_step": 192537, "epoch": 2319} {"train_loss": -24.0097713470459, "global_step": 192538, "epoch": 2319} {"train_loss": -23.630298614501953, "global_step": 192539, "epoch": 2319} {"train_loss": -23.897764205932617, "global_step": 192540, "epoch": 2319} {"train_loss": -24.024961471557617, "global_step": 192541, "epoch": 2319} {"train_loss": -24.22246742248535, "global_step": 192542, "epoch": 2319} {"train_loss": -24.146892547607422, "global_step": 192543, "epoch": 2319} {"train_loss": -24.089275360107422, "global_step": 192544, "epoch": 2319} {"train_loss": -24.213605880737305, "global_step": 192545, "epoch": 2319} {"train_loss": -23.981786727905273, "global_step": 192546, "epoch": 2319} {"train_loss": -24.050132751464844, "global_step": 192547, "epoch": 2319} {"train_loss": -24.212488174438477, "global_step": 192548, "epoch": 2319} {"train_loss": -24.279699325561523, "global_step": 192549, "epoch": 2319} {"train_loss": -23.698856353759766, "global_step": 192550, "epoch": 2319} {"train_loss": -24.311355590820312, "global_step": 192551, "epoch": 2319} {"train_loss": -24.40467643737793, "global_step": 192552, "epoch": 2319} {"train_loss": -23.957889556884766, "global_step": 192553, "epoch": 2319} {"train_loss": -24.478485107421875, "global_step": 192554, "epoch": 2319} {"train_loss": -24.120344161987305, "global_step": 192555, "epoch": 2319} {"train_loss": -24.1539249420166, "global_step": 192556, "epoch": 2319} {"train_loss": -24.452960968017578, "global_step": 192557, "epoch": 2319} {"train_loss": -24.037887573242188, "global_step": 192558, "epoch": 2319} {"train_loss": -23.892547216760107, "global_step": 192559, "epoch": 2319, "val_loss": 6440871.5} {"train_loss": -23.717060089111328, "global_step": 192560, "epoch": 2320} {"train_loss": -23.735553741455078, "global_step": 192561, "epoch": 2320} {"train_loss": -23.73845100402832, "global_step": 192562, "epoch": 2320} {"train_loss": -24.020980834960938, "global_step": 192563, "epoch": 2320} {"train_loss": -23.679533004760742, "global_step": 192564, "epoch": 2320} {"train_loss": -23.732196807861328, "global_step": 192565, "epoch": 2320} {"train_loss": -23.823650360107422, "global_step": 192566, "epoch": 2320} {"train_loss": -23.959516525268555, "global_step": 192567, "epoch": 2320} {"train_loss": -24.410680770874023, "global_step": 192568, "epoch": 2320} {"train_loss": -24.241613388061523, "global_step": 192569, "epoch": 2320} {"train_loss": -23.816646575927734, "global_step": 192570, "epoch": 2320} {"train_loss": -24.005460739135742, "global_step": 192571, "epoch": 2320} {"train_loss": -24.242780685424805, "global_step": 192572, "epoch": 2320} {"train_loss": -23.842201232910156, "global_step": 192573, "epoch": 2320} {"train_loss": -24.09809684753418, "global_step": 192574, "epoch": 2320} {"train_loss": -24.174009323120117, "global_step": 192575, "epoch": 2320} {"train_loss": -24.05958366394043, "global_step": 192576, "epoch": 2320} {"train_loss": -23.865829467773438, "global_step": 192577, "epoch": 2320} {"train_loss": -24.205183029174805, "global_step": 192578, "epoch": 2320} {"train_loss": -23.63359832763672, "global_step": 192579, "epoch": 2320} {"train_loss": -24.045835494995117, "global_step": 192580, "epoch": 2320} {"train_loss": -24.37687110900879, "global_step": 192581, "epoch": 2320} {"train_loss": -23.473499298095703, "global_step": 192582, "epoch": 2320} {"train_loss": -24.180654525756836, "global_step": 192583, "epoch": 2320} {"train_loss": -23.844308853149414, "global_step": 192584, "epoch": 2320} {"train_loss": -24.321699142456055, "global_step": 192585, "epoch": 2320} {"train_loss": -24.46761131286621, "global_step": 192586, "epoch": 2320} {"train_loss": -24.35739517211914, "global_step": 192587, "epoch": 2320} {"train_loss": -24.269126892089844, "global_step": 192588, "epoch": 2320} {"train_loss": -24.365148544311523, "global_step": 192589, "epoch": 2320} {"train_loss": -23.943586349487305, "global_step": 192590, "epoch": 2320} {"train_loss": -24.050968170166016, "global_step": 192591, "epoch": 2320} {"train_loss": -24.483922958374023, "global_step": 192592, "epoch": 2320} {"train_loss": -24.30266571044922, "global_step": 192593, "epoch": 2320} {"train_loss": -24.447757720947266, "global_step": 192594, "epoch": 2320} {"train_loss": -23.899354934692383, "global_step": 192595, "epoch": 2320} {"train_loss": -24.302154541015625, "global_step": 192596, "epoch": 2320} {"train_loss": -24.223636627197266, "global_step": 192597, "epoch": 2320} {"train_loss": -23.866714477539062, "global_step": 192598, "epoch": 2320} {"train_loss": -24.18665885925293, "global_step": 192599, "epoch": 2320} {"train_loss": -24.309289932250977, "global_step": 192600, "epoch": 2320} {"train_loss": -24.021121978759766, "global_step": 192601, "epoch": 2320} {"train_loss": -24.117507934570312, "global_step": 192602, "epoch": 2320} {"train_loss": -24.268131256103516, "global_step": 192603, "epoch": 2320} {"train_loss": -24.40907096862793, "global_step": 192604, "epoch": 2320} {"train_loss": -24.49217414855957, "global_step": 192605, "epoch": 2320} {"train_loss": -23.79950523376465, "global_step": 192606, "epoch": 2320} {"train_loss": -24.039148330688477, "global_step": 192607, "epoch": 2320} {"train_loss": -23.768213272094727, "global_step": 192608, "epoch": 2320} {"train_loss": -24.244632720947266, "global_step": 192609, "epoch": 2320} {"train_loss": -24.08085060119629, "global_step": 192610, "epoch": 2320} {"train_loss": -24.292598724365234, "global_step": 192611, "epoch": 2320} {"train_loss": -24.092161178588867, "global_step": 192612, "epoch": 2320} {"train_loss": -24.06978416442871, "global_step": 192613, "epoch": 2320} {"train_loss": -24.089231491088867, "global_step": 192614, "epoch": 2320} {"train_loss": -24.305192947387695, "global_step": 192615, "epoch": 2320} {"train_loss": -23.92652702331543, "global_step": 192616, "epoch": 2320} {"train_loss": -24.147262573242188, "global_step": 192617, "epoch": 2320} {"train_loss": -24.27948570251465, "global_step": 192618, "epoch": 2320} {"train_loss": -24.291799545288086, "global_step": 192619, "epoch": 2320} {"train_loss": -23.814437866210938, "global_step": 192620, "epoch": 2320} {"train_loss": -23.777673721313477, "global_step": 192621, "epoch": 2320} {"train_loss": -24.08965492248535, "global_step": 192622, "epoch": 2320} {"train_loss": -24.189496994018555, "global_step": 192623, "epoch": 2320} {"train_loss": -24.15382957458496, "global_step": 192624, "epoch": 2320} {"train_loss": -24.437978744506836, "global_step": 192625, "epoch": 2320} {"train_loss": -24.0498104095459, "global_step": 192626, "epoch": 2320} {"train_loss": -24.05824089050293, "global_step": 192627, "epoch": 2320} {"train_loss": -24.193696975708008, "global_step": 192628, "epoch": 2320} {"train_loss": -24.018766403198242, "global_step": 192629, "epoch": 2320} {"train_loss": -24.040143966674805, "global_step": 192630, "epoch": 2320} {"train_loss": -24.059192657470703, "global_step": 192631, "epoch": 2320} {"train_loss": -24.083066940307617, "global_step": 192632, "epoch": 2320} {"train_loss": -24.10304832458496, "global_step": 192633, "epoch": 2320} {"train_loss": -24.30154800415039, "global_step": 192634, "epoch": 2320} {"train_loss": -24.37184715270996, "global_step": 192635, "epoch": 2320} {"train_loss": -24.108558654785156, "global_step": 192636, "epoch": 2320} {"train_loss": -24.25543212890625, "global_step": 192637, "epoch": 2320} {"train_loss": -24.264066696166992, "global_step": 192638, "epoch": 2320} {"train_loss": -24.368967056274414, "global_step": 192639, "epoch": 2320} {"train_loss": -24.121679306030273, "global_step": 192640, "epoch": 2320} {"train_loss": -24.09827423095703, "global_step": 192641, "epoch": 2320} {"train_loss": -24.114958452891155, "global_step": 192642, "epoch": 2320, "val_loss": 6654925.0} {"train_loss": -23.828126907348633, "global_step": 192643, "epoch": 2321} {"train_loss": -23.813215255737305, "global_step": 192644, "epoch": 2321} {"train_loss": -24.0094051361084, "global_step": 192645, "epoch": 2321} {"train_loss": -23.45489501953125, "global_step": 192646, "epoch": 2321} {"train_loss": -23.865110397338867, "global_step": 192647, "epoch": 2321} {"train_loss": -24.02509117126465, "global_step": 192648, "epoch": 2321} {"train_loss": -24.129079818725586, "global_step": 192649, "epoch": 2321} {"train_loss": -23.896963119506836, "global_step": 192650, "epoch": 2321} {"train_loss": -24.57294273376465, "global_step": 192651, "epoch": 2321} {"train_loss": -23.85638999938965, "global_step": 192652, "epoch": 2321} {"train_loss": -23.72972869873047, "global_step": 192653, "epoch": 2321} {"train_loss": -23.959945678710938, "global_step": 192654, "epoch": 2321} {"train_loss": -24.093923568725586, "global_step": 192655, "epoch": 2321} {"train_loss": -24.055801391601562, "global_step": 192656, "epoch": 2321} {"train_loss": -24.042444229125977, "global_step": 192657, "epoch": 2321} {"train_loss": -23.721149444580078, "global_step": 192658, "epoch": 2321} {"train_loss": -24.330968856811523, "global_step": 192659, "epoch": 2321} {"train_loss": -24.058881759643555, "global_step": 192660, "epoch": 2321} {"train_loss": -23.97447395324707, "global_step": 192661, "epoch": 2321} {"train_loss": -24.167240142822266, "global_step": 192662, "epoch": 2321} {"train_loss": -23.649240493774414, "global_step": 192663, "epoch": 2321} {"train_loss": -23.983051300048828, "global_step": 192664, "epoch": 2321} {"train_loss": -23.84765625, "global_step": 192665, "epoch": 2321} {"train_loss": -23.714813232421875, "global_step": 192666, "epoch": 2321} {"train_loss": -24.08633804321289, "global_step": 192667, "epoch": 2321} {"train_loss": -24.212177276611328, "global_step": 192668, "epoch": 2321} {"train_loss": -23.82733726501465, "global_step": 192669, "epoch": 2321} {"train_loss": -23.979124069213867, "global_step": 192670, "epoch": 2321} {"train_loss": -23.66498374938965, "global_step": 192671, "epoch": 2321} {"train_loss": -24.215167999267578, "global_step": 192672, "epoch": 2321} {"train_loss": -23.952655792236328, "global_step": 192673, "epoch": 2321} {"train_loss": -24.46339988708496, "global_step": 192674, "epoch": 2321} {"train_loss": -24.079376220703125, "global_step": 192675, "epoch": 2321} {"train_loss": -23.887975692749023, "global_step": 192676, "epoch": 2321} {"train_loss": -24.24037742614746, "global_step": 192677, "epoch": 2321} {"train_loss": -23.830039978027344, "global_step": 192678, "epoch": 2321} {"train_loss": -24.369779586791992, "global_step": 192679, "epoch": 2321} {"train_loss": -23.739973068237305, "global_step": 192680, "epoch": 2321} {"train_loss": -24.120512008666992, "global_step": 192681, "epoch": 2321} {"train_loss": -24.151931762695312, "global_step": 192682, "epoch": 2321} {"train_loss": -24.154155731201172, "global_step": 192683, "epoch": 2321} {"train_loss": -24.1378173828125, "global_step": 192684, "epoch": 2321} {"train_loss": -24.047094345092773, "global_step": 192685, "epoch": 2321} {"train_loss": -24.45287322998047, "global_step": 192686, "epoch": 2321} {"train_loss": -24.263425827026367, "global_step": 192687, "epoch": 2321} {"train_loss": -24.481321334838867, "global_step": 192688, "epoch": 2321} {"train_loss": -24.2122859954834, "global_step": 192689, "epoch": 2321} {"train_loss": -24.526409149169922, "global_step": 192690, "epoch": 2321} {"train_loss": -24.569263458251953, "global_step": 192691, "epoch": 2321} {"train_loss": -24.09375762939453, "global_step": 192692, "epoch": 2321} {"train_loss": -24.235191345214844, "global_step": 192693, "epoch": 2321} {"train_loss": -24.469900131225586, "global_step": 192694, "epoch": 2321} {"train_loss": -24.510690689086914, "global_step": 192695, "epoch": 2321} {"train_loss": -24.460363388061523, "global_step": 192696, "epoch": 2321} {"train_loss": -24.22348403930664, "global_step": 192697, "epoch": 2321} {"train_loss": -24.187528610229492, "global_step": 192698, "epoch": 2321} {"train_loss": -23.939353942871094, "global_step": 192699, "epoch": 2321} {"train_loss": -24.34200096130371, "global_step": 192700, "epoch": 2321} {"train_loss": -24.45488929748535, "global_step": 192701, "epoch": 2321} {"train_loss": -24.082746505737305, "global_step": 192702, "epoch": 2321} {"train_loss": -24.12399673461914, "global_step": 192703, "epoch": 2321} {"train_loss": -24.268756866455078, "global_step": 192704, "epoch": 2321} {"train_loss": -24.107038497924805, "global_step": 192705, "epoch": 2321} {"train_loss": -24.557254791259766, "global_step": 192706, "epoch": 2321} {"train_loss": -24.37508773803711, "global_step": 192707, "epoch": 2321} {"train_loss": -24.337156295776367, "global_step": 192708, "epoch": 2321} {"train_loss": -24.17246437072754, "global_step": 192709, "epoch": 2321} {"train_loss": -24.456039428710938, "global_step": 192710, "epoch": 2321} {"train_loss": -23.79828453063965, "global_step": 192711, "epoch": 2321} {"train_loss": -23.8828125, "global_step": 192712, "epoch": 2321} {"train_loss": -24.0166072845459, "global_step": 192713, "epoch": 2321} {"train_loss": -23.546260833740234, "global_step": 192714, "epoch": 2321} {"train_loss": -23.693002700805664, "global_step": 192715, "epoch": 2321} {"train_loss": -23.9813175201416, "global_step": 192716, "epoch": 2321} {"train_loss": -24.17804527282715, "global_step": 192717, "epoch": 2321} {"train_loss": -23.8404598236084, "global_step": 192718, "epoch": 2321} {"train_loss": -24.035871505737305, "global_step": 192719, "epoch": 2321} {"train_loss": -24.132598876953125, "global_step": 192720, "epoch": 2321} {"train_loss": -24.186782836914062, "global_step": 192721, "epoch": 2321} {"train_loss": -24.04213523864746, "global_step": 192722, "epoch": 2321} {"train_loss": -23.92587661743164, "global_step": 192723, "epoch": 2321} {"train_loss": -23.998987197875977, "global_step": 192724, "epoch": 2321} {"train_loss": -24.10030776334096, "global_step": 192725, "epoch": 2321, "val_loss": 6497056.0} {"train_loss": -23.669164657592773, "global_step": 192726, "epoch": 2322} {"train_loss": -23.826553344726562, "global_step": 192727, "epoch": 2322} {"train_loss": -23.831478118896484, "global_step": 192728, "epoch": 2322} {"train_loss": -23.69032859802246, "global_step": 192729, "epoch": 2322} {"train_loss": -24.275999069213867, "global_step": 192730, "epoch": 2322} {"train_loss": -23.94296646118164, "global_step": 192731, "epoch": 2322} {"train_loss": -23.8572998046875, "global_step": 192732, "epoch": 2322} {"train_loss": -24.06519889831543, "global_step": 192733, "epoch": 2322} {"train_loss": -23.837451934814453, "global_step": 192734, "epoch": 2322} {"train_loss": -23.78603172302246, "global_step": 192735, "epoch": 2322} {"train_loss": -23.85171890258789, "global_step": 192736, "epoch": 2322} {"train_loss": -23.698087692260742, "global_step": 192737, "epoch": 2322} {"train_loss": -23.966384887695312, "global_step": 192738, "epoch": 2322} {"train_loss": -24.090551376342773, "global_step": 192739, "epoch": 2322} {"train_loss": -24.152889251708984, "global_step": 192740, "epoch": 2322} {"train_loss": -24.247297286987305, "global_step": 192741, "epoch": 2322} {"train_loss": -23.925756454467773, "global_step": 192742, "epoch": 2322} {"train_loss": -24.113391876220703, "global_step": 192743, "epoch": 2322} {"train_loss": -23.708507537841797, "global_step": 192744, "epoch": 2322} {"train_loss": -23.72317123413086, "global_step": 192745, "epoch": 2322} {"train_loss": -23.905805587768555, "global_step": 192746, "epoch": 2322} {"train_loss": -23.999942779541016, "global_step": 192747, "epoch": 2322} {"train_loss": -24.685272216796875, "global_step": 192748, "epoch": 2322} {"train_loss": -23.92486572265625, "global_step": 192749, "epoch": 2322} {"train_loss": -24.627946853637695, "global_step": 192750, "epoch": 2322} {"train_loss": -24.234643936157227, "global_step": 192751, "epoch": 2322} {"train_loss": -24.1772518157959, "global_step": 192752, "epoch": 2322} {"train_loss": -24.254453659057617, "global_step": 192753, "epoch": 2322} {"train_loss": -24.11748695373535, "global_step": 192754, "epoch": 2322} {"train_loss": -24.122953414916992, "global_step": 192755, "epoch": 2322} {"train_loss": -24.14971923828125, "global_step": 192756, "epoch": 2322} {"train_loss": -24.203702926635742, "global_step": 192757, "epoch": 2322} {"train_loss": -23.77424430847168, "global_step": 192758, "epoch": 2322} {"train_loss": -24.1219425201416, "global_step": 192759, "epoch": 2322} {"train_loss": -23.821237564086914, "global_step": 192760, "epoch": 2322} {"train_loss": -23.5134220123291, "global_step": 192761, "epoch": 2322} {"train_loss": -24.327259063720703, "global_step": 192762, "epoch": 2322} {"train_loss": -24.077919006347656, "global_step": 192763, "epoch": 2322} {"train_loss": -23.805265426635742, "global_step": 192764, "epoch": 2322} {"train_loss": -23.9921932220459, "global_step": 192765, "epoch": 2322} {"train_loss": -23.595754623413086, "global_step": 192766, "epoch": 2322} {"train_loss": -23.3358097076416, "global_step": 192767, "epoch": 2322} {"train_loss": -23.78336524963379, "global_step": 192768, "epoch": 2322} {"train_loss": -23.854352951049805, "global_step": 192769, "epoch": 2322} {"train_loss": -23.59242057800293, "global_step": 192770, "epoch": 2322} {"train_loss": -24.110898971557617, "global_step": 192771, "epoch": 2322} {"train_loss": -24.08050537109375, "global_step": 192772, "epoch": 2322} {"train_loss": -24.15919303894043, "global_step": 192773, "epoch": 2322} {"train_loss": -23.742263793945312, "global_step": 192774, "epoch": 2322} {"train_loss": -24.011089324951172, "global_step": 192775, "epoch": 2322} {"train_loss": -23.661678314208984, "global_step": 192776, "epoch": 2322} {"train_loss": -23.796178817749023, "global_step": 192777, "epoch": 2322} {"train_loss": -24.420276641845703, "global_step": 192778, "epoch": 2322} {"train_loss": -24.367219924926758, "global_step": 192779, "epoch": 2322} {"train_loss": -24.074588775634766, "global_step": 192780, "epoch": 2322} {"train_loss": -24.16111946105957, "global_step": 192781, "epoch": 2322} {"train_loss": -24.296239852905273, "global_step": 192782, "epoch": 2322} {"train_loss": -24.123355865478516, "global_step": 192783, "epoch": 2322} {"train_loss": -24.131799697875977, "global_step": 192784, "epoch": 2322} {"train_loss": -24.145587921142578, "global_step": 192785, "epoch": 2322} {"train_loss": -24.200769424438477, "global_step": 192786, "epoch": 2322} {"train_loss": -24.337263107299805, "global_step": 192787, "epoch": 2322} {"train_loss": -23.875782012939453, "global_step": 192788, "epoch": 2322} {"train_loss": -24.142675399780273, "global_step": 192789, "epoch": 2322} {"train_loss": -23.902847290039062, "global_step": 192790, "epoch": 2322} {"train_loss": -24.126367568969727, "global_step": 192791, "epoch": 2322} {"train_loss": -23.781835556030273, "global_step": 192792, "epoch": 2322} {"train_loss": -23.96910858154297, "global_step": 192793, "epoch": 2322} {"train_loss": -24.103591918945312, "global_step": 192794, "epoch": 2322} {"train_loss": -23.82377815246582, "global_step": 192795, "epoch": 2322} {"train_loss": -24.0982723236084, "global_step": 192796, "epoch": 2322} {"train_loss": -24.08802604675293, "global_step": 192797, "epoch": 2322} {"train_loss": -23.833507537841797, "global_step": 192798, "epoch": 2322} {"train_loss": -24.06766128540039, "global_step": 192799, "epoch": 2322} {"train_loss": -23.846479415893555, "global_step": 192800, "epoch": 2322} {"train_loss": -24.08135223388672, "global_step": 192801, "epoch": 2322} {"train_loss": -24.006444931030273, "global_step": 192802, "epoch": 2322} {"train_loss": -24.284494400024414, "global_step": 192803, "epoch": 2322} {"train_loss": -23.940866470336914, "global_step": 192804, "epoch": 2322} {"train_loss": -23.704357147216797, "global_step": 192805, "epoch": 2322} {"train_loss": -24.3181209564209, "global_step": 192806, "epoch": 2322} {"train_loss": -24.411344528198242, "global_step": 192807, "epoch": 2322} {"train_loss": -24.005446882133025, "global_step": 192808, "epoch": 2322, "val_loss": 6453626.0} {"train_loss": -23.778072357177734, "global_step": 192809, "epoch": 2323} {"train_loss": -23.723878860473633, "global_step": 192810, "epoch": 2323} {"train_loss": -23.624542236328125, "global_step": 192811, "epoch": 2323} {"train_loss": -23.359914779663086, "global_step": 192812, "epoch": 2323} {"train_loss": -23.422931671142578, "global_step": 192813, "epoch": 2323} {"train_loss": -23.815326690673828, "global_step": 192814, "epoch": 2323} {"train_loss": -23.659168243408203, "global_step": 192815, "epoch": 2323} {"train_loss": -23.357988357543945, "global_step": 192816, "epoch": 2323} {"train_loss": -23.9100341796875, "global_step": 192817, "epoch": 2323} {"train_loss": -23.501752853393555, "global_step": 192818, "epoch": 2323} {"train_loss": -23.79645538330078, "global_step": 192819, "epoch": 2323} {"train_loss": -23.840152740478516, "global_step": 192820, "epoch": 2323} {"train_loss": -23.459985733032227, "global_step": 192821, "epoch": 2323} {"train_loss": -23.83967399597168, "global_step": 192822, "epoch": 2323} {"train_loss": -24.035825729370117, "global_step": 192823, "epoch": 2323} {"train_loss": -24.106107711791992, "global_step": 192824, "epoch": 2323} {"train_loss": -23.992664337158203, "global_step": 192825, "epoch": 2323} {"train_loss": -24.054534912109375, "global_step": 192826, "epoch": 2323} {"train_loss": -24.006595611572266, "global_step": 192827, "epoch": 2323} {"train_loss": -23.759593963623047, "global_step": 192828, "epoch": 2323} {"train_loss": -24.171710968017578, "global_step": 192829, "epoch": 2323} {"train_loss": -24.195846557617188, "global_step": 192830, "epoch": 2323} {"train_loss": -24.243061065673828, "global_step": 192831, "epoch": 2323} {"train_loss": -23.725738525390625, "global_step": 192832, "epoch": 2323} {"train_loss": -24.158641815185547, "global_step": 192833, "epoch": 2323} {"train_loss": -24.191434860229492, "global_step": 192834, "epoch": 2323} {"train_loss": -23.8304443359375, "global_step": 192835, "epoch": 2323} {"train_loss": -23.894031524658203, "global_step": 192836, "epoch": 2323} {"train_loss": -24.192584991455078, "global_step": 192837, "epoch": 2323} {"train_loss": -24.05573844909668, "global_step": 192838, "epoch": 2323} {"train_loss": -24.0556640625, "global_step": 192839, "epoch": 2323} {"train_loss": -24.332590103149414, "global_step": 192840, "epoch": 2323} {"train_loss": -24.494827270507812, "global_step": 192841, "epoch": 2323} {"train_loss": -24.437610626220703, "global_step": 192842, "epoch": 2323} {"train_loss": -24.310068130493164, "global_step": 192843, "epoch": 2323} {"train_loss": -24.48429298400879, "global_step": 192844, "epoch": 2323} {"train_loss": -24.220617294311523, "global_step": 192845, "epoch": 2323} {"train_loss": -24.113798141479492, "global_step": 192846, "epoch": 2323} {"train_loss": -24.243345260620117, "global_step": 192847, "epoch": 2323} {"train_loss": -24.252973556518555, "global_step": 192848, "epoch": 2323} {"train_loss": -24.4654541015625, "global_step": 192849, "epoch": 2323} {"train_loss": -24.533498764038086, "global_step": 192850, "epoch": 2323} {"train_loss": -24.1529483795166, "global_step": 192851, "epoch": 2323} {"train_loss": -24.17509651184082, "global_step": 192852, "epoch": 2323} {"train_loss": -24.164623260498047, "global_step": 192853, "epoch": 2323} {"train_loss": -24.544816970825195, "global_step": 192854, "epoch": 2323} {"train_loss": -24.18739891052246, "global_step": 192855, "epoch": 2323} {"train_loss": -23.873876571655273, "global_step": 192856, "epoch": 2323} {"train_loss": -24.123144149780273, "global_step": 192857, "epoch": 2323} {"train_loss": -23.764389038085938, "global_step": 192858, "epoch": 2323} {"train_loss": -23.716842651367188, "global_step": 192859, "epoch": 2323} {"train_loss": -23.996479034423828, "global_step": 192860, "epoch": 2323} {"train_loss": -23.762771606445312, "global_step": 192861, "epoch": 2323} {"train_loss": -23.818418502807617, "global_step": 192862, "epoch": 2323} {"train_loss": -24.264867782592773, "global_step": 192863, "epoch": 2323} {"train_loss": -23.469757080078125, "global_step": 192864, "epoch": 2323} {"train_loss": -23.717758178710938, "global_step": 192865, "epoch": 2323} {"train_loss": -24.417724609375, "global_step": 192866, "epoch": 2323} {"train_loss": -23.98579978942871, "global_step": 192867, "epoch": 2323} {"train_loss": -23.98781394958496, "global_step": 192868, "epoch": 2323} {"train_loss": -24.280641555786133, "global_step": 192869, "epoch": 2323} {"train_loss": -23.939130783081055, "global_step": 192870, "epoch": 2323} {"train_loss": -23.83751678466797, "global_step": 192871, "epoch": 2323} {"train_loss": -23.918380737304688, "global_step": 192872, "epoch": 2323} {"train_loss": -23.918655395507812, "global_step": 192873, "epoch": 2323} {"train_loss": -24.23297119140625, "global_step": 192874, "epoch": 2323} {"train_loss": -24.26507568359375, "global_step": 192875, "epoch": 2323} {"train_loss": -24.056486129760742, "global_step": 192876, "epoch": 2323} {"train_loss": -24.018020629882812, "global_step": 192877, "epoch": 2323} {"train_loss": -23.912303924560547, "global_step": 192878, "epoch": 2323} {"train_loss": -24.016447067260742, "global_step": 192879, "epoch": 2323} {"train_loss": -24.179733276367188, "global_step": 192880, "epoch": 2323} {"train_loss": -24.228713989257812, "global_step": 192881, "epoch": 2323} {"train_loss": -23.85835075378418, "global_step": 192882, "epoch": 2323} {"train_loss": -24.10748291015625, "global_step": 192883, "epoch": 2323} {"train_loss": -23.864364624023438, "global_step": 192884, "epoch": 2323} {"train_loss": -24.425268173217773, "global_step": 192885, "epoch": 2323} {"train_loss": -23.802536010742188, "global_step": 192886, "epoch": 2323} {"train_loss": -23.99567413330078, "global_step": 192887, "epoch": 2323} {"train_loss": -24.46624183654785, "global_step": 192888, "epoch": 2323} {"train_loss": -23.74534034729004, "global_step": 192889, "epoch": 2323} {"train_loss": -23.969953536987305, "global_step": 192890, "epoch": 2323} {"train_loss": -24.01029729268637, "global_step": 192891, "epoch": 2323, "val_loss": 6589361.0} {"train_loss": -24.054792404174805, "global_step": 192892, "epoch": 2324} {"train_loss": -23.543174743652344, "global_step": 192893, "epoch": 2324} {"train_loss": -23.606611251831055, "global_step": 192894, "epoch": 2324} {"train_loss": -24.187292098999023, "global_step": 192895, "epoch": 2324} {"train_loss": -23.37299919128418, "global_step": 192896, "epoch": 2324} {"train_loss": -23.54555320739746, "global_step": 192897, "epoch": 2324} {"train_loss": -24.29290771484375, "global_step": 192898, "epoch": 2324} {"train_loss": -23.704601287841797, "global_step": 192899, "epoch": 2324} {"train_loss": -24.102203369140625, "global_step": 192900, "epoch": 2324} {"train_loss": -24.07411003112793, "global_step": 192901, "epoch": 2324} {"train_loss": -23.91546630859375, "global_step": 192902, "epoch": 2324} {"train_loss": -23.634403228759766, "global_step": 192903, "epoch": 2324} {"train_loss": -24.163259506225586, "global_step": 192904, "epoch": 2324} {"train_loss": -24.162643432617188, "global_step": 192905, "epoch": 2324} {"train_loss": -24.107166290283203, "global_step": 192906, "epoch": 2324} {"train_loss": -24.151931762695312, "global_step": 192907, "epoch": 2324} {"train_loss": -24.273412704467773, "global_step": 192908, "epoch": 2324} {"train_loss": -23.93939781188965, "global_step": 192909, "epoch": 2324} {"train_loss": -24.19723129272461, "global_step": 192910, "epoch": 2324} {"train_loss": -24.519886016845703, "global_step": 192911, "epoch": 2324} {"train_loss": -23.859743118286133, "global_step": 192912, "epoch": 2324} {"train_loss": -24.027359008789062, "global_step": 192913, "epoch": 2324} {"train_loss": -24.30511474609375, "global_step": 192914, "epoch": 2324} {"train_loss": -24.354990005493164, "global_step": 192915, "epoch": 2324} {"train_loss": -24.489301681518555, "global_step": 192916, "epoch": 2324} {"train_loss": -24.16806983947754, "global_step": 192917, "epoch": 2324} {"train_loss": -23.87308120727539, "global_step": 192918, "epoch": 2324} {"train_loss": -23.820175170898438, "global_step": 192919, "epoch": 2324} {"train_loss": -23.78814125061035, "global_step": 192920, "epoch": 2324} {"train_loss": -24.139484405517578, "global_step": 192921, "epoch": 2324} {"train_loss": -24.15604591369629, "global_step": 192922, "epoch": 2324} {"train_loss": -24.005842208862305, "global_step": 192923, "epoch": 2324} {"train_loss": -24.1170711517334, "global_step": 192924, "epoch": 2324} {"train_loss": -23.974872589111328, "global_step": 192925, "epoch": 2324} {"train_loss": -24.038610458374023, "global_step": 192926, "epoch": 2324} {"train_loss": -24.211017608642578, "global_step": 192927, "epoch": 2324} {"train_loss": -24.098623275756836, "global_step": 192928, "epoch": 2324} {"train_loss": -23.725858688354492, "global_step": 192929, "epoch": 2324} {"train_loss": -23.97269058227539, "global_step": 192930, "epoch": 2324} {"train_loss": -24.314990997314453, "global_step": 192931, "epoch": 2324} {"train_loss": -23.89244270324707, "global_step": 192932, "epoch": 2324} {"train_loss": -24.340749740600586, "global_step": 192933, "epoch": 2324} {"train_loss": -24.239320755004883, "global_step": 192934, "epoch": 2324} {"train_loss": -23.966459274291992, "global_step": 192935, "epoch": 2324} {"train_loss": -24.077667236328125, "global_step": 192936, "epoch": 2324} {"train_loss": -24.562543869018555, "global_step": 192937, "epoch": 2324} {"train_loss": -24.237361907958984, "global_step": 192938, "epoch": 2324} {"train_loss": -24.39676856994629, "global_step": 192939, "epoch": 2324} {"train_loss": -24.477758407592773, "global_step": 192940, "epoch": 2324} {"train_loss": -24.228771209716797, "global_step": 192941, "epoch": 2324} {"train_loss": -24.4356689453125, "global_step": 192942, "epoch": 2324} {"train_loss": -24.176685333251953, "global_step": 192943, "epoch": 2324} {"train_loss": -24.110952377319336, "global_step": 192944, "epoch": 2324} {"train_loss": -24.285776138305664, "global_step": 192945, "epoch": 2324} {"train_loss": -24.47178077697754, "global_step": 192946, "epoch": 2324} {"train_loss": -24.268537521362305, "global_step": 192947, "epoch": 2324} {"train_loss": -23.9773006439209, "global_step": 192948, "epoch": 2324} {"train_loss": -23.471712112426758, "global_step": 192949, "epoch": 2324} {"train_loss": -24.000707626342773, "global_step": 192950, "epoch": 2324} {"train_loss": -23.89468002319336, "global_step": 192951, "epoch": 2324} {"train_loss": -24.219348907470703, "global_step": 192952, "epoch": 2324} {"train_loss": -23.522842407226562, "global_step": 192953, "epoch": 2324} {"train_loss": -23.53029441833496, "global_step": 192954, "epoch": 2324} {"train_loss": -24.165987014770508, "global_step": 192955, "epoch": 2324} {"train_loss": -24.371065139770508, "global_step": 192956, "epoch": 2324} {"train_loss": -24.121387481689453, "global_step": 192957, "epoch": 2324} {"train_loss": -24.302946090698242, "global_step": 192958, "epoch": 2324} {"train_loss": -24.443342208862305, "global_step": 192959, "epoch": 2324} {"train_loss": -24.203039169311523, "global_step": 192960, "epoch": 2324} {"train_loss": -24.22148323059082, "global_step": 192961, "epoch": 2324} {"train_loss": -23.945693969726562, "global_step": 192962, "epoch": 2324} {"train_loss": -24.062301635742188, "global_step": 192963, "epoch": 2324} {"train_loss": -24.388877868652344, "global_step": 192964, "epoch": 2324} {"train_loss": -24.205148696899414, "global_step": 192965, "epoch": 2324} {"train_loss": -23.95216941833496, "global_step": 192966, "epoch": 2324} {"train_loss": -24.107999801635742, "global_step": 192967, "epoch": 2324} {"train_loss": -24.21929168701172, "global_step": 192968, "epoch": 2324} {"train_loss": -24.25088882446289, "global_step": 192969, "epoch": 2324} {"train_loss": -24.056344985961914, "global_step": 192970, "epoch": 2324} {"train_loss": -24.395179748535156, "global_step": 192971, "epoch": 2324} {"train_loss": -24.110309600830078, "global_step": 192972, "epoch": 2324} {"train_loss": -24.1993465423584, "global_step": 192973, "epoch": 2324} {"train_loss": -24.091134151780462, "global_step": 192974, "epoch": 2324, "val_loss": 6479381.0} {"train_loss": -24.082386016845703, "global_step": 192975, "epoch": 2325} {"train_loss": -24.337268829345703, "global_step": 192976, "epoch": 2325} {"train_loss": -23.95889663696289, "global_step": 192977, "epoch": 2325} {"train_loss": -23.755538940429688, "global_step": 192978, "epoch": 2325} {"train_loss": -23.879384994506836, "global_step": 192979, "epoch": 2325} {"train_loss": -24.055627822875977, "global_step": 192980, "epoch": 2325} {"train_loss": -23.963369369506836, "global_step": 192981, "epoch": 2325} {"train_loss": -23.99690055847168, "global_step": 192982, "epoch": 2325} {"train_loss": -24.152585983276367, "global_step": 192983, "epoch": 2325} {"train_loss": -24.04446792602539, "global_step": 192984, "epoch": 2325} {"train_loss": -24.43302345275879, "global_step": 192985, "epoch": 2325} {"train_loss": -23.83599281311035, "global_step": 192986, "epoch": 2325} {"train_loss": -23.880537033081055, "global_step": 192987, "epoch": 2325} {"train_loss": -23.819366455078125, "global_step": 192988, "epoch": 2325} {"train_loss": -24.1827335357666, "global_step": 192989, "epoch": 2325} {"train_loss": -24.15035057067871, "global_step": 192990, "epoch": 2325} {"train_loss": -24.12666130065918, "global_step": 192991, "epoch": 2325} {"train_loss": -24.313217163085938, "global_step": 192992, "epoch": 2325} {"train_loss": -23.73629379272461, "global_step": 192993, "epoch": 2325} {"train_loss": -23.902685165405273, "global_step": 192994, "epoch": 2325} {"train_loss": -24.066186904907227, "global_step": 192995, "epoch": 2325} {"train_loss": -24.36932945251465, "global_step": 192996, "epoch": 2325} {"train_loss": -24.108068466186523, "global_step": 192997, "epoch": 2325} {"train_loss": -23.816116333007812, "global_step": 192998, "epoch": 2325} {"train_loss": -24.06676483154297, "global_step": 192999, "epoch": 2325} {"train_loss": -24.139312744140625, "global_step": 193000, "epoch": 2325} {"train_loss": -24.005237579345703, "global_step": 193001, "epoch": 2325} {"train_loss": -24.407941818237305, "global_step": 193002, "epoch": 2325} {"train_loss": -23.816526412963867, "global_step": 193003, "epoch": 2325} {"train_loss": -24.269508361816406, "global_step": 193004, "epoch": 2325} {"train_loss": -24.21524429321289, "global_step": 193005, "epoch": 2325} {"train_loss": -24.403196334838867, "global_step": 193006, "epoch": 2325} {"train_loss": -24.60751724243164, "global_step": 193007, "epoch": 2325} {"train_loss": -23.984310150146484, "global_step": 193008, "epoch": 2325} {"train_loss": -24.309343338012695, "global_step": 193009, "epoch": 2325} {"train_loss": -24.04121208190918, "global_step": 193010, "epoch": 2325} {"train_loss": -24.0200252532959, "global_step": 193011, "epoch": 2325} {"train_loss": -24.491947174072266, "global_step": 193012, "epoch": 2325} {"train_loss": -24.37668228149414, "global_step": 193013, "epoch": 2325} {"train_loss": -24.11457061767578, "global_step": 193014, "epoch": 2325} {"train_loss": -24.28734588623047, "global_step": 193015, "epoch": 2325} {"train_loss": -24.39249610900879, "global_step": 193016, "epoch": 2325} {"train_loss": -24.161808013916016, "global_step": 193017, "epoch": 2325} {"train_loss": -24.36614418029785, "global_step": 193018, "epoch": 2325} {"train_loss": -24.15357780456543, "global_step": 193019, "epoch": 2325} {"train_loss": -24.050691604614258, "global_step": 193020, "epoch": 2325} {"train_loss": -24.225391387939453, "global_step": 193021, "epoch": 2325} {"train_loss": -24.426231384277344, "global_step": 193022, "epoch": 2325} {"train_loss": -24.072538375854492, "global_step": 193023, "epoch": 2325} {"train_loss": -24.113231658935547, "global_step": 193024, "epoch": 2325} {"train_loss": -24.081134796142578, "global_step": 193025, "epoch": 2325} {"train_loss": -24.341604232788086, "global_step": 193026, "epoch": 2325} {"train_loss": -23.89272117614746, "global_step": 193027, "epoch": 2325} {"train_loss": -23.807849884033203, "global_step": 193028, "epoch": 2325} {"train_loss": -23.491247177124023, "global_step": 193029, "epoch": 2325} {"train_loss": -23.940948486328125, "global_step": 193030, "epoch": 2325} {"train_loss": -23.592609405517578, "global_step": 193031, "epoch": 2325} {"train_loss": -23.938539505004883, "global_step": 193032, "epoch": 2325} {"train_loss": -23.622589111328125, "global_step": 193033, "epoch": 2325} {"train_loss": -23.84506607055664, "global_step": 193034, "epoch": 2325} {"train_loss": -23.67673110961914, "global_step": 193035, "epoch": 2325} {"train_loss": -24.176557540893555, "global_step": 193036, "epoch": 2325} {"train_loss": -24.11958885192871, "global_step": 193037, "epoch": 2325} {"train_loss": -23.786067962646484, "global_step": 193038, "epoch": 2325} {"train_loss": -24.119354248046875, "global_step": 193039, "epoch": 2325} {"train_loss": -23.950733184814453, "global_step": 193040, "epoch": 2325} {"train_loss": -23.992618560791016, "global_step": 193041, "epoch": 2325} {"train_loss": -24.224515914916992, "global_step": 193042, "epoch": 2325} {"train_loss": -24.326574325561523, "global_step": 193043, "epoch": 2325} {"train_loss": -23.988117218017578, "global_step": 193044, "epoch": 2325} {"train_loss": -24.062339782714844, "global_step": 193045, "epoch": 2325} {"train_loss": -24.273706436157227, "global_step": 193046, "epoch": 2325} {"train_loss": -23.929325103759766, "global_step": 193047, "epoch": 2325} {"train_loss": -24.08444595336914, "global_step": 193048, "epoch": 2325} {"train_loss": -24.207965850830078, "global_step": 193049, "epoch": 2325} {"train_loss": -23.800352096557617, "global_step": 193050, "epoch": 2325} {"train_loss": -24.188207626342773, "global_step": 193051, "epoch": 2325} {"train_loss": -24.28314781188965, "global_step": 193052, "epoch": 2325} {"train_loss": -24.350629806518555, "global_step": 193053, "epoch": 2325} {"train_loss": -23.986536026000977, "global_step": 193054, "epoch": 2325} {"train_loss": -23.73868179321289, "global_step": 193055, "epoch": 2325} {"train_loss": -23.758975982666016, "global_step": 193056, "epoch": 2325} {"train_loss": -24.088387983391083, "global_step": 193057, "epoch": 2325, "val_loss": 6565791.0} {"train_loss": -23.857492446899414, "global_step": 193058, "epoch": 2326} {"train_loss": -23.883121490478516, "global_step": 193059, "epoch": 2326} {"train_loss": -24.21870994567871, "global_step": 193060, "epoch": 2326} {"train_loss": -24.03009605407715, "global_step": 193061, "epoch": 2326} {"train_loss": -23.554258346557617, "global_step": 193062, "epoch": 2326} {"train_loss": -24.076454162597656, "global_step": 193063, "epoch": 2326} {"train_loss": -24.370540618896484, "global_step": 193064, "epoch": 2326} {"train_loss": -23.875965118408203, "global_step": 193065, "epoch": 2326} {"train_loss": -24.106252670288086, "global_step": 193066, "epoch": 2326} {"train_loss": -23.633874893188477, "global_step": 193067, "epoch": 2326} {"train_loss": -24.015554428100586, "global_step": 193068, "epoch": 2326} {"train_loss": -23.924266815185547, "global_step": 193069, "epoch": 2326} {"train_loss": -23.94209861755371, "global_step": 193070, "epoch": 2326} {"train_loss": -23.718158721923828, "global_step": 193071, "epoch": 2326} {"train_loss": -24.221120834350586, "global_step": 193072, "epoch": 2326} {"train_loss": -23.91414451599121, "global_step": 193073, "epoch": 2326} {"train_loss": -23.64161491394043, "global_step": 193074, "epoch": 2326} {"train_loss": -24.16016960144043, "global_step": 193075, "epoch": 2326} {"train_loss": -23.71547508239746, "global_step": 193076, "epoch": 2326} {"train_loss": -23.92024040222168, "global_step": 193077, "epoch": 2326} {"train_loss": -23.922786712646484, "global_step": 193078, "epoch": 2326} {"train_loss": -23.54939842224121, "global_step": 193079, "epoch": 2326} {"train_loss": -24.05384635925293, "global_step": 193080, "epoch": 2326} {"train_loss": -24.147886276245117, "global_step": 193081, "epoch": 2326} {"train_loss": -24.242416381835938, "global_step": 193082, "epoch": 2326} {"train_loss": -24.070005416870117, "global_step": 193083, "epoch": 2326} {"train_loss": -24.427078247070312, "global_step": 193084, "epoch": 2326} {"train_loss": -23.87922477722168, "global_step": 193085, "epoch": 2326} {"train_loss": -24.129230499267578, "global_step": 193086, "epoch": 2326} {"train_loss": -23.93783187866211, "global_step": 193087, "epoch": 2326} {"train_loss": -24.30556297302246, "global_step": 193088, "epoch": 2326} {"train_loss": -24.14136505126953, "global_step": 193089, "epoch": 2326} {"train_loss": -24.0688533782959, "global_step": 193090, "epoch": 2326} {"train_loss": -24.378707885742188, "global_step": 193091, "epoch": 2326} {"train_loss": -24.368070602416992, "global_step": 193092, "epoch": 2326} {"train_loss": -24.25516700744629, "global_step": 193093, "epoch": 2326} {"train_loss": -23.935758590698242, "global_step": 193094, "epoch": 2326} {"train_loss": -23.975940704345703, "global_step": 193095, "epoch": 2326} {"train_loss": -24.285829544067383, "global_step": 193096, "epoch": 2326} {"train_loss": -24.42988395690918, "global_step": 193097, "epoch": 2326} {"train_loss": -24.40802574157715, "global_step": 193098, "epoch": 2326} {"train_loss": -24.457935333251953, "global_step": 193099, "epoch": 2326} {"train_loss": -24.106441497802734, "global_step": 193100, "epoch": 2326} {"train_loss": -24.175474166870117, "global_step": 193101, "epoch": 2326} {"train_loss": -24.129592895507812, "global_step": 193102, "epoch": 2326} {"train_loss": -24.37213134765625, "global_step": 193103, "epoch": 2326} {"train_loss": -24.364852905273438, "global_step": 193104, "epoch": 2326} {"train_loss": -24.414321899414062, "global_step": 193105, "epoch": 2326} {"train_loss": -24.33911895751953, "global_step": 193106, "epoch": 2326} {"train_loss": -24.233192443847656, "global_step": 193107, "epoch": 2326} {"train_loss": -24.2586727142334, "global_step": 193108, "epoch": 2326} {"train_loss": -24.183929443359375, "global_step": 193109, "epoch": 2326} {"train_loss": -24.27899742126465, "global_step": 193110, "epoch": 2326} {"train_loss": -24.537519454956055, "global_step": 193111, "epoch": 2326} {"train_loss": -24.707738876342773, "global_step": 193112, "epoch": 2326} {"train_loss": -23.920047760009766, "global_step": 193113, "epoch": 2326} {"train_loss": -24.112716674804688, "global_step": 193114, "epoch": 2326} {"train_loss": -23.724729537963867, "global_step": 193115, "epoch": 2326} {"train_loss": -23.04836082458496, "global_step": 193116, "epoch": 2326} {"train_loss": -23.04140281677246, "global_step": 193117, "epoch": 2326} {"train_loss": -23.54520606994629, "global_step": 193118, "epoch": 2326} {"train_loss": -23.989866256713867, "global_step": 193119, "epoch": 2326} {"train_loss": -23.37681007385254, "global_step": 193120, "epoch": 2326} {"train_loss": -23.645742416381836, "global_step": 193121, "epoch": 2326} {"train_loss": -24.050371170043945, "global_step": 193122, "epoch": 2326} {"train_loss": -24.05588150024414, "global_step": 193123, "epoch": 2326} {"train_loss": -24.147214889526367, "global_step": 193124, "epoch": 2326} {"train_loss": -23.762784957885742, "global_step": 193125, "epoch": 2326} {"train_loss": -24.25363540649414, "global_step": 193126, "epoch": 2326} {"train_loss": -23.927270889282227, "global_step": 193127, "epoch": 2326} {"train_loss": -23.94887351989746, "global_step": 193128, "epoch": 2326} {"train_loss": -24.193449020385742, "global_step": 193129, "epoch": 2326} {"train_loss": -23.976858139038086, "global_step": 193130, "epoch": 2326} {"train_loss": -24.340110778808594, "global_step": 193131, "epoch": 2326} {"train_loss": -24.083572387695312, "global_step": 193132, "epoch": 2326} {"train_loss": -24.14101219177246, "global_step": 193133, "epoch": 2326} {"train_loss": -23.991979598999023, "global_step": 193134, "epoch": 2326} {"train_loss": -23.927520751953125, "global_step": 193135, "epoch": 2326} {"train_loss": -24.247961044311523, "global_step": 193136, "epoch": 2326} {"train_loss": -23.889434814453125, "global_step": 193137, "epoch": 2326} {"train_loss": -24.104047775268555, "global_step": 193138, "epoch": 2326} {"train_loss": -23.78556251525879, "global_step": 193139, "epoch": 2326} {"train_loss": -24.041086081998895, "global_step": 193140, "epoch": 2326, "val_loss": 6436992.0} {"train_loss": -23.87018585205078, "global_step": 193141, "epoch": 2327} {"train_loss": -23.036130905151367, "global_step": 193142, "epoch": 2327} {"train_loss": -23.652414321899414, "global_step": 193143, "epoch": 2327} {"train_loss": -23.6761417388916, "global_step": 193144, "epoch": 2327} {"train_loss": -23.853086471557617, "global_step": 193145, "epoch": 2327} {"train_loss": -23.80971336364746, "global_step": 193146, "epoch": 2327} {"train_loss": -23.54779624938965, "global_step": 193147, "epoch": 2327} {"train_loss": -23.827054977416992, "global_step": 193148, "epoch": 2327} {"train_loss": -23.445785522460938, "global_step": 193149, "epoch": 2327} {"train_loss": -23.5662899017334, "global_step": 193150, "epoch": 2327} {"train_loss": -23.649290084838867, "global_step": 193151, "epoch": 2327} {"train_loss": -23.90181541442871, "global_step": 193152, "epoch": 2327} {"train_loss": -23.83465003967285, "global_step": 193153, "epoch": 2327} {"train_loss": -23.992841720581055, "global_step": 193154, "epoch": 2327} {"train_loss": -23.890634536743164, "global_step": 193155, "epoch": 2327} {"train_loss": -24.03620719909668, "global_step": 193156, "epoch": 2327} {"train_loss": -23.819232940673828, "global_step": 193157, "epoch": 2327} {"train_loss": -24.1651668548584, "global_step": 193158, "epoch": 2327} {"train_loss": -23.887939453125, "global_step": 193159, "epoch": 2327} {"train_loss": -23.96598243713379, "global_step": 193160, "epoch": 2327} {"train_loss": -24.08090591430664, "global_step": 193161, "epoch": 2327} {"train_loss": -23.93534278869629, "global_step": 193162, "epoch": 2327} {"train_loss": -24.418867111206055, "global_step": 193163, "epoch": 2327} {"train_loss": -23.897125244140625, "global_step": 193164, "epoch": 2327} {"train_loss": -24.378238677978516, "global_step": 193165, "epoch": 2327} {"train_loss": -23.986186981201172, "global_step": 193166, "epoch": 2327} {"train_loss": -24.16078758239746, "global_step": 193167, "epoch": 2327} {"train_loss": -24.292123794555664, "global_step": 193168, "epoch": 2327} {"train_loss": -24.133586883544922, "global_step": 193169, "epoch": 2327} {"train_loss": -23.904314041137695, "global_step": 193170, "epoch": 2327} {"train_loss": -24.027013778686523, "global_step": 193171, "epoch": 2327} {"train_loss": -24.18568229675293, "global_step": 193172, "epoch": 2327} {"train_loss": -24.52086639404297, "global_step": 193173, "epoch": 2327} {"train_loss": -23.75033187866211, "global_step": 193174, "epoch": 2327} {"train_loss": -24.371795654296875, "global_step": 193175, "epoch": 2327} {"train_loss": -24.570158004760742, "global_step": 193176, "epoch": 2327} {"train_loss": -24.094327926635742, "global_step": 193177, "epoch": 2327} {"train_loss": -24.31553077697754, "global_step": 193178, "epoch": 2327} {"train_loss": -24.01509666442871, "global_step": 193179, "epoch": 2327} {"train_loss": -24.1630916595459, "global_step": 193180, "epoch": 2327} {"train_loss": -23.788328170776367, "global_step": 193181, "epoch": 2327} {"train_loss": -24.424518585205078, "global_step": 193182, "epoch": 2327} {"train_loss": -23.973398208618164, "global_step": 193183, "epoch": 2327} {"train_loss": -24.50255584716797, "global_step": 193184, "epoch": 2327} {"train_loss": -24.204294204711914, "global_step": 193185, "epoch": 2327} {"train_loss": -24.3294677734375, "global_step": 193186, "epoch": 2327} {"train_loss": -24.613481521606445, "global_step": 193187, "epoch": 2327} {"train_loss": -23.9952449798584, "global_step": 193188, "epoch": 2327} {"train_loss": -23.976560592651367, "global_step": 193189, "epoch": 2327} {"train_loss": -24.008426666259766, "global_step": 193190, "epoch": 2327} {"train_loss": -24.46310806274414, "global_step": 193191, "epoch": 2327} {"train_loss": -24.312381744384766, "global_step": 193192, "epoch": 2327} {"train_loss": -24.435440063476562, "global_step": 193193, "epoch": 2327} {"train_loss": -23.830053329467773, "global_step": 193194, "epoch": 2327} {"train_loss": -24.11293601989746, "global_step": 193195, "epoch": 2327} {"train_loss": -24.159841537475586, "global_step": 193196, "epoch": 2327} {"train_loss": -24.017484664916992, "global_step": 193197, "epoch": 2327} {"train_loss": -24.54664421081543, "global_step": 193198, "epoch": 2327} {"train_loss": -24.608518600463867, "global_step": 193199, "epoch": 2327} {"train_loss": -24.124330520629883, "global_step": 193200, "epoch": 2327} {"train_loss": -24.031278610229492, "global_step": 193201, "epoch": 2327} {"train_loss": -23.9696102142334, "global_step": 193202, "epoch": 2327} {"train_loss": -24.33184814453125, "global_step": 193203, "epoch": 2327} {"train_loss": -23.998233795166016, "global_step": 193204, "epoch": 2327} {"train_loss": -24.2586727142334, "global_step": 193205, "epoch": 2327} {"train_loss": -24.394058227539062, "global_step": 193206, "epoch": 2327} {"train_loss": -24.379865646362305, "global_step": 193207, "epoch": 2327} {"train_loss": -23.88346290588379, "global_step": 193208, "epoch": 2327} {"train_loss": -23.87870979309082, "global_step": 193209, "epoch": 2327} {"train_loss": -24.469406127929688, "global_step": 193210, "epoch": 2327} {"train_loss": -24.200576782226562, "global_step": 193211, "epoch": 2327} {"train_loss": -24.033018112182617, "global_step": 193212, "epoch": 2327} {"train_loss": -24.061904907226562, "global_step": 193213, "epoch": 2327} {"train_loss": -24.21272087097168, "global_step": 193214, "epoch": 2327} {"train_loss": -24.647174835205078, "global_step": 193215, "epoch": 2327} {"train_loss": -24.2142391204834, "global_step": 193216, "epoch": 2327} {"train_loss": -24.406110763549805, "global_step": 193217, "epoch": 2327} {"train_loss": -24.057676315307617, "global_step": 193218, "epoch": 2327} {"train_loss": -23.98607063293457, "global_step": 193219, "epoch": 2327} {"train_loss": -24.140613555908203, "global_step": 193220, "epoch": 2327} {"train_loss": -23.915042877197266, "global_step": 193221, "epoch": 2327} {"train_loss": -24.300634384155273, "global_step": 193222, "epoch": 2327} {"train_loss": -24.07842845227345, "global_step": 193223, "epoch": 2327, "val_loss": 6591630.0} {"train_loss": -23.7049560546875, "global_step": 193224, "epoch": 2328} {"train_loss": -23.494688034057617, "global_step": 193225, "epoch": 2328} {"train_loss": -24.070833206176758, "global_step": 193226, "epoch": 2328} {"train_loss": -23.766523361206055, "global_step": 193227, "epoch": 2328} {"train_loss": -23.332204818725586, "global_step": 193228, "epoch": 2328} {"train_loss": -23.877973556518555, "global_step": 193229, "epoch": 2328} {"train_loss": -23.679672241210938, "global_step": 193230, "epoch": 2328} {"train_loss": -23.915029525756836, "global_step": 193231, "epoch": 2328} {"train_loss": -24.09284019470215, "global_step": 193232, "epoch": 2328} {"train_loss": -23.728208541870117, "global_step": 193233, "epoch": 2328} {"train_loss": -23.859106063842773, "global_step": 193234, "epoch": 2328} {"train_loss": -23.828983306884766, "global_step": 193235, "epoch": 2328} {"train_loss": -23.803730010986328, "global_step": 193236, "epoch": 2328} {"train_loss": -23.582529067993164, "global_step": 193237, "epoch": 2328} {"train_loss": -23.704944610595703, "global_step": 193238, "epoch": 2328} {"train_loss": -24.233715057373047, "global_step": 193239, "epoch": 2328} {"train_loss": -23.72271728515625, "global_step": 193240, "epoch": 2328} {"train_loss": -24.058401107788086, "global_step": 193241, "epoch": 2328} {"train_loss": -23.979965209960938, "global_step": 193242, "epoch": 2328} {"train_loss": -23.961217880249023, "global_step": 193243, "epoch": 2328} {"train_loss": -24.270376205444336, "global_step": 193244, "epoch": 2328} {"train_loss": -24.142173767089844, "global_step": 193245, "epoch": 2328} {"train_loss": -24.025089263916016, "global_step": 193246, "epoch": 2328} {"train_loss": -23.73052978515625, "global_step": 193247, "epoch": 2328} {"train_loss": -23.9390811920166, "global_step": 193248, "epoch": 2328} {"train_loss": -24.23969078063965, "global_step": 193249, "epoch": 2328} {"train_loss": -24.16187858581543, "global_step": 193250, "epoch": 2328} {"train_loss": -24.122831344604492, "global_step": 193251, "epoch": 2328} {"train_loss": -23.73333740234375, "global_step": 193252, "epoch": 2328} {"train_loss": -24.17032814025879, "global_step": 193253, "epoch": 2328} {"train_loss": -24.053695678710938, "global_step": 193254, "epoch": 2328} {"train_loss": -24.166006088256836, "global_step": 193255, "epoch": 2328} {"train_loss": -24.179868698120117, "global_step": 193256, "epoch": 2328} {"train_loss": -23.986438751220703, "global_step": 193257, "epoch": 2328} {"train_loss": -24.528461456298828, "global_step": 193258, "epoch": 2328} {"train_loss": -24.39405632019043, "global_step": 193259, "epoch": 2328} {"train_loss": -23.863889694213867, "global_step": 193260, "epoch": 2328} {"train_loss": -24.078594207763672, "global_step": 193261, "epoch": 2328} {"train_loss": -24.163089752197266, "global_step": 193262, "epoch": 2328} {"train_loss": -24.370685577392578, "global_step": 193263, "epoch": 2328} {"train_loss": -24.46418571472168, "global_step": 193264, "epoch": 2328} {"train_loss": -24.268739700317383, "global_step": 193265, "epoch": 2328} {"train_loss": -24.396291732788086, "global_step": 193266, "epoch": 2328} {"train_loss": -24.187057495117188, "global_step": 193267, "epoch": 2328} {"train_loss": -24.268339157104492, "global_step": 193268, "epoch": 2328} {"train_loss": -24.392383575439453, "global_step": 193269, "epoch": 2328} {"train_loss": -24.489526748657227, "global_step": 193270, "epoch": 2328} {"train_loss": -24.28010368347168, "global_step": 193271, "epoch": 2328} {"train_loss": -24.360197067260742, "global_step": 193272, "epoch": 2328} {"train_loss": -24.27817726135254, "global_step": 193273, "epoch": 2328} {"train_loss": -24.442642211914062, "global_step": 193274, "epoch": 2328} {"train_loss": -24.368125915527344, "global_step": 193275, "epoch": 2328} {"train_loss": -24.358869552612305, "global_step": 193276, "epoch": 2328} {"train_loss": -24.666488647460938, "global_step": 193277, "epoch": 2328} {"train_loss": -24.26040267944336, "global_step": 193278, "epoch": 2328} {"train_loss": -24.060964584350586, "global_step": 193279, "epoch": 2328} {"train_loss": -24.083850860595703, "global_step": 193280, "epoch": 2328} {"train_loss": -23.77617835998535, "global_step": 193281, "epoch": 2328} {"train_loss": -24.216337203979492, "global_step": 193282, "epoch": 2328} {"train_loss": -23.63215446472168, "global_step": 193283, "epoch": 2328} {"train_loss": -24.264142990112305, "global_step": 193284, "epoch": 2328} {"train_loss": -24.115371704101562, "global_step": 193285, "epoch": 2328} {"train_loss": -23.96681022644043, "global_step": 193286, "epoch": 2328} {"train_loss": -24.29475975036621, "global_step": 193287, "epoch": 2328} {"train_loss": -23.946613311767578, "global_step": 193288, "epoch": 2328} {"train_loss": -24.521018981933594, "global_step": 193289, "epoch": 2328} {"train_loss": -23.87295913696289, "global_step": 193290, "epoch": 2328} {"train_loss": -24.37053680419922, "global_step": 193291, "epoch": 2328} {"train_loss": -24.14790916442871, "global_step": 193292, "epoch": 2328} {"train_loss": -24.286745071411133, "global_step": 193293, "epoch": 2328} {"train_loss": -24.244726181030273, "global_step": 193294, "epoch": 2328} {"train_loss": -24.254871368408203, "global_step": 193295, "epoch": 2328} {"train_loss": -24.140037536621094, "global_step": 193296, "epoch": 2328} {"train_loss": -24.259540557861328, "global_step": 193297, "epoch": 2328} {"train_loss": -24.137435913085938, "global_step": 193298, "epoch": 2328} {"train_loss": -23.911184310913086, "global_step": 193299, "epoch": 2328} {"train_loss": -24.044189453125, "global_step": 193300, "epoch": 2328} {"train_loss": -23.9907169342041, "global_step": 193301, "epoch": 2328} {"train_loss": -24.356002807617188, "global_step": 193302, "epoch": 2328} {"train_loss": -24.510663986206055, "global_step": 193303, "epoch": 2328} {"train_loss": -24.2297420501709, "global_step": 193304, "epoch": 2328} {"train_loss": -24.193071365356445, "global_step": 193305, "epoch": 2328} {"train_loss": -24.100271339876105, "global_step": 193306, "epoch": 2328, "val_loss": 6636233.0} {"train_loss": -22.030107498168945, "global_step": 193307, "epoch": 2329} {"train_loss": -20.885713577270508, "global_step": 193308, "epoch": 2329} {"train_loss": -23.124799728393555, "global_step": 193309, "epoch": 2329} {"train_loss": -23.044740676879883, "global_step": 193310, "epoch": 2329} {"train_loss": -22.23122215270996, "global_step": 193311, "epoch": 2329} {"train_loss": -23.661890029907227, "global_step": 193312, "epoch": 2329} {"train_loss": -22.96674919128418, "global_step": 193313, "epoch": 2329} {"train_loss": -22.893844604492188, "global_step": 193314, "epoch": 2329} {"train_loss": -22.880233764648438, "global_step": 193315, "epoch": 2329} {"train_loss": -22.676944732666016, "global_step": 193316, "epoch": 2329} {"train_loss": -22.9977970123291, "global_step": 193317, "epoch": 2329} {"train_loss": -23.018478393554688, "global_step": 193318, "epoch": 2329} {"train_loss": -22.935152053833008, "global_step": 193319, "epoch": 2329} {"train_loss": -23.303176879882812, "global_step": 193320, "epoch": 2329} {"train_loss": -23.04543113708496, "global_step": 193321, "epoch": 2329} {"train_loss": -23.371475219726562, "global_step": 193322, "epoch": 2329} {"train_loss": -23.389936447143555, "global_step": 193323, "epoch": 2329} {"train_loss": -23.305444717407227, "global_step": 193324, "epoch": 2329} {"train_loss": -23.522586822509766, "global_step": 193325, "epoch": 2329} {"train_loss": -23.58829116821289, "global_step": 193326, "epoch": 2329} {"train_loss": -23.73172950744629, "global_step": 193327, "epoch": 2329} {"train_loss": -23.681358337402344, "global_step": 193328, "epoch": 2329} {"train_loss": -23.187545776367188, "global_step": 193329, "epoch": 2329} {"train_loss": -23.458667755126953, "global_step": 193330, "epoch": 2329} {"train_loss": -23.51645278930664, "global_step": 193331, "epoch": 2329} {"train_loss": -23.552555084228516, "global_step": 193332, "epoch": 2329} {"train_loss": -23.301633834838867, "global_step": 193333, "epoch": 2329} {"train_loss": -23.875917434692383, "global_step": 193334, "epoch": 2329} {"train_loss": -23.733627319335938, "global_step": 193335, "epoch": 2329} {"train_loss": -23.598085403442383, "global_step": 193336, "epoch": 2329} {"train_loss": -23.783605575561523, "global_step": 193337, "epoch": 2329} {"train_loss": -23.779571533203125, "global_step": 193338, "epoch": 2329} {"train_loss": -23.99262809753418, "global_step": 193339, "epoch": 2329} {"train_loss": -23.919631958007812, "global_step": 193340, "epoch": 2329} {"train_loss": -24.290319442749023, "global_step": 193341, "epoch": 2329} {"train_loss": -23.95556640625, "global_step": 193342, "epoch": 2329} {"train_loss": -24.099645614624023, "global_step": 193343, "epoch": 2329} {"train_loss": -23.993757247924805, "global_step": 193344, "epoch": 2329} {"train_loss": -24.267629623413086, "global_step": 193345, "epoch": 2329} {"train_loss": -23.95674705505371, "global_step": 193346, "epoch": 2329} {"train_loss": -23.954898834228516, "global_step": 193347, "epoch": 2329} {"train_loss": -24.14110565185547, "global_step": 193348, "epoch": 2329} {"train_loss": -23.935474395751953, "global_step": 193349, "epoch": 2329} {"train_loss": -24.25290870666504, "global_step": 193350, "epoch": 2329} {"train_loss": -24.180374145507812, "global_step": 193351, "epoch": 2329} {"train_loss": -24.14499282836914, "global_step": 193352, "epoch": 2329} {"train_loss": -24.28394889831543, "global_step": 193353, "epoch": 2329} {"train_loss": -24.04175567626953, "global_step": 193354, "epoch": 2329} {"train_loss": -24.35274314880371, "global_step": 193355, "epoch": 2329} {"train_loss": -24.29706382751465, "global_step": 193356, "epoch": 2329} {"train_loss": -24.18642234802246, "global_step": 193357, "epoch": 2329} {"train_loss": -24.340320587158203, "global_step": 193358, "epoch": 2329} {"train_loss": -24.34237289428711, "global_step": 193359, "epoch": 2329} {"train_loss": -24.437938690185547, "global_step": 193360, "epoch": 2329} {"train_loss": -24.281024932861328, "global_step": 193361, "epoch": 2329} {"train_loss": -24.35821533203125, "global_step": 193362, "epoch": 2329} {"train_loss": -24.358600616455078, "global_step": 193363, "epoch": 2329} {"train_loss": -24.148422241210938, "global_step": 193364, "epoch": 2329} {"train_loss": -24.15228843688965, "global_step": 193365, "epoch": 2329} {"train_loss": -23.909666061401367, "global_step": 193366, "epoch": 2329} {"train_loss": -23.8756046295166, "global_step": 193367, "epoch": 2329} {"train_loss": -24.64874267578125, "global_step": 193368, "epoch": 2329} {"train_loss": -24.172204971313477, "global_step": 193369, "epoch": 2329} {"train_loss": -24.22295570373535, "global_step": 193370, "epoch": 2329} {"train_loss": -24.08119010925293, "global_step": 193371, "epoch": 2329} {"train_loss": -24.087995529174805, "global_step": 193372, "epoch": 2329} {"train_loss": -24.48455810546875, "global_step": 193373, "epoch": 2329} {"train_loss": -23.779470443725586, "global_step": 193374, "epoch": 2329} {"train_loss": -23.725400924682617, "global_step": 193375, "epoch": 2329} {"train_loss": -24.09545135498047, "global_step": 193376, "epoch": 2329} {"train_loss": -24.173259735107422, "global_step": 193377, "epoch": 2329} {"train_loss": -24.18878936767578, "global_step": 193378, "epoch": 2329} {"train_loss": -24.47318458557129, "global_step": 193379, "epoch": 2329} {"train_loss": -24.236190795898438, "global_step": 193380, "epoch": 2329} {"train_loss": -24.195905685424805, "global_step": 193381, "epoch": 2329} {"train_loss": -24.166229248046875, "global_step": 193382, "epoch": 2329} {"train_loss": -24.186100006103516, "global_step": 193383, "epoch": 2329} {"train_loss": -23.928184509277344, "global_step": 193384, "epoch": 2329} {"train_loss": -24.134084701538086, "global_step": 193385, "epoch": 2329} {"train_loss": -24.144412994384766, "global_step": 193386, "epoch": 2329} {"train_loss": -23.894790649414062, "global_step": 193387, "epoch": 2329} {"train_loss": -23.96907615661621, "global_step": 193388, "epoch": 2329} {"train_loss": -23.784584482032134, "global_step": 193389, "epoch": 2329, "val_loss": 6541867.5} {"train_loss": -24.145965576171875, "global_step": 193390, "epoch": 2330} {"train_loss": -24.157468795776367, "global_step": 193391, "epoch": 2330} {"train_loss": -24.057361602783203, "global_step": 193392, "epoch": 2330} {"train_loss": -23.903837203979492, "global_step": 193393, "epoch": 2330} {"train_loss": -24.03040885925293, "global_step": 193394, "epoch": 2330} {"train_loss": -24.000913619995117, "global_step": 193395, "epoch": 2330} {"train_loss": -23.799421310424805, "global_step": 193396, "epoch": 2330} {"train_loss": -23.796741485595703, "global_step": 193397, "epoch": 2330} {"train_loss": -23.51138687133789, "global_step": 193398, "epoch": 2330} {"train_loss": -24.04945182800293, "global_step": 193399, "epoch": 2330} {"train_loss": -24.101850509643555, "global_step": 193400, "epoch": 2330} {"train_loss": -23.944290161132812, "global_step": 193401, "epoch": 2330} {"train_loss": -23.85945701599121, "global_step": 193402, "epoch": 2330} {"train_loss": -23.84821891784668, "global_step": 193403, "epoch": 2330} {"train_loss": -24.331363677978516, "global_step": 193404, "epoch": 2330} {"train_loss": -23.99567413330078, "global_step": 193405, "epoch": 2330} {"train_loss": -24.311141967773438, "global_step": 193406, "epoch": 2330} {"train_loss": -23.946386337280273, "global_step": 193407, "epoch": 2330} {"train_loss": -23.995878219604492, "global_step": 193408, "epoch": 2330} {"train_loss": -24.209203720092773, "global_step": 193409, "epoch": 2330} {"train_loss": -24.08449363708496, "global_step": 193410, "epoch": 2330} {"train_loss": -24.246320724487305, "global_step": 193411, "epoch": 2330} {"train_loss": -24.39756965637207, "global_step": 193412, "epoch": 2330} {"train_loss": -24.181562423706055, "global_step": 193413, "epoch": 2330} {"train_loss": -24.19078826904297, "global_step": 193414, "epoch": 2330} {"train_loss": -24.064189910888672, "global_step": 193415, "epoch": 2330} {"train_loss": -24.044828414916992, "global_step": 193416, "epoch": 2330} {"train_loss": -24.640966415405273, "global_step": 193417, "epoch": 2330} {"train_loss": -24.04804801940918, "global_step": 193418, "epoch": 2330} {"train_loss": -24.290437698364258, "global_step": 193419, "epoch": 2330} {"train_loss": -24.144840240478516, "global_step": 193420, "epoch": 2330} {"train_loss": -24.211027145385742, "global_step": 193421, "epoch": 2330} {"train_loss": -24.391664505004883, "global_step": 193422, "epoch": 2330} {"train_loss": -24.103933334350586, "global_step": 193423, "epoch": 2330} {"train_loss": -24.278888702392578, "global_step": 193424, "epoch": 2330} {"train_loss": -24.210725784301758, "global_step": 193425, "epoch": 2330} {"train_loss": -24.0028018951416, "global_step": 193426, "epoch": 2330} {"train_loss": -24.012516021728516, "global_step": 193427, "epoch": 2330} {"train_loss": -24.194700241088867, "global_step": 193428, "epoch": 2330} {"train_loss": -24.359418869018555, "global_step": 193429, "epoch": 2330} {"train_loss": -24.509078979492188, "global_step": 193430, "epoch": 2330} {"train_loss": -24.44385528564453, "global_step": 193431, "epoch": 2330} {"train_loss": -24.077957153320312, "global_step": 193432, "epoch": 2330} {"train_loss": -24.14267349243164, "global_step": 193433, "epoch": 2330} {"train_loss": -24.146169662475586, "global_step": 193434, "epoch": 2330} {"train_loss": -24.725675582885742, "global_step": 193435, "epoch": 2330} {"train_loss": -24.306533813476562, "global_step": 193436, "epoch": 2330} {"train_loss": -24.471721649169922, "global_step": 193437, "epoch": 2330} {"train_loss": -24.31031608581543, "global_step": 193438, "epoch": 2330} {"train_loss": -24.460718154907227, "global_step": 193439, "epoch": 2330} {"train_loss": -23.944517135620117, "global_step": 193440, "epoch": 2330} {"train_loss": -23.97275161743164, "global_step": 193441, "epoch": 2330} {"train_loss": -24.06235122680664, "global_step": 193442, "epoch": 2330} {"train_loss": -23.953371047973633, "global_step": 193443, "epoch": 2330} {"train_loss": -23.977521896362305, "global_step": 193444, "epoch": 2330} {"train_loss": -24.0726318359375, "global_step": 193445, "epoch": 2330} {"train_loss": -24.141199111938477, "global_step": 193446, "epoch": 2330} {"train_loss": -24.390045166015625, "global_step": 193447, "epoch": 2330} {"train_loss": -24.053056716918945, "global_step": 193448, "epoch": 2330} {"train_loss": -24.014951705932617, "global_step": 193449, "epoch": 2330} {"train_loss": -24.10204315185547, "global_step": 193450, "epoch": 2330} {"train_loss": -24.3256893157959, "global_step": 193451, "epoch": 2330} {"train_loss": -24.293668746948242, "global_step": 193452, "epoch": 2330} {"train_loss": -23.86787986755371, "global_step": 193453, "epoch": 2330} {"train_loss": -24.356870651245117, "global_step": 193454, "epoch": 2330} {"train_loss": -24.08970069885254, "global_step": 193455, "epoch": 2330} {"train_loss": -23.865970611572266, "global_step": 193456, "epoch": 2330} {"train_loss": -24.027738571166992, "global_step": 193457, "epoch": 2330} {"train_loss": -24.29987144470215, "global_step": 193458, "epoch": 2330} {"train_loss": -23.968189239501953, "global_step": 193459, "epoch": 2330} {"train_loss": -24.149494171142578, "global_step": 193460, "epoch": 2330} {"train_loss": -24.061843872070312, "global_step": 193461, "epoch": 2330} {"train_loss": -23.98979377746582, "global_step": 193462, "epoch": 2330} {"train_loss": -24.245071411132812, "global_step": 193463, "epoch": 2330} {"train_loss": -24.169668197631836, "global_step": 193464, "epoch": 2330} {"train_loss": -24.013151168823242, "global_step": 193465, "epoch": 2330} {"train_loss": -24.084980010986328, "global_step": 193466, "epoch": 2330} {"train_loss": -24.446910858154297, "global_step": 193467, "epoch": 2330} {"train_loss": -24.044876098632812, "global_step": 193468, "epoch": 2330} {"train_loss": -24.346006393432617, "global_step": 193469, "epoch": 2330} {"train_loss": -24.641525268554688, "global_step": 193470, "epoch": 2330} {"train_loss": -23.993030548095703, "global_step": 193471, "epoch": 2330} {"train_loss": -24.154859450926264, "global_step": 193472, "epoch": 2330, "val_loss": 6511076.0} {"train_loss": -23.726154327392578, "global_step": 193473, "epoch": 2331} {"train_loss": -23.427690505981445, "global_step": 193474, "epoch": 2331} {"train_loss": -23.680830001831055, "global_step": 193475, "epoch": 2331} {"train_loss": -23.397268295288086, "global_step": 193476, "epoch": 2331} {"train_loss": -23.53309440612793, "global_step": 193477, "epoch": 2331} {"train_loss": -23.509174346923828, "global_step": 193478, "epoch": 2331} {"train_loss": -23.824583053588867, "global_step": 193479, "epoch": 2331} {"train_loss": -23.654712677001953, "global_step": 193480, "epoch": 2331} {"train_loss": -23.175630569458008, "global_step": 193481, "epoch": 2331} {"train_loss": -24.154203414916992, "global_step": 193482, "epoch": 2331} {"train_loss": -23.70868492126465, "global_step": 193483, "epoch": 2331} {"train_loss": -24.165512084960938, "global_step": 193484, "epoch": 2331} {"train_loss": -23.65496253967285, "global_step": 193485, "epoch": 2331} {"train_loss": -24.296154022216797, "global_step": 193486, "epoch": 2331} {"train_loss": -24.088659286499023, "global_step": 193487, "epoch": 2331} {"train_loss": -24.25996208190918, "global_step": 193488, "epoch": 2331} {"train_loss": -24.206159591674805, "global_step": 193489, "epoch": 2331} {"train_loss": -23.8046932220459, "global_step": 193490, "epoch": 2331} {"train_loss": -23.91895866394043, "global_step": 193491, "epoch": 2331} {"train_loss": -23.673755645751953, "global_step": 193492, "epoch": 2331} {"train_loss": -24.117813110351562, "global_step": 193493, "epoch": 2331} {"train_loss": -23.885013580322266, "global_step": 193494, "epoch": 2331} {"train_loss": -24.274612426757812, "global_step": 193495, "epoch": 2331} {"train_loss": -24.25127601623535, "global_step": 193496, "epoch": 2331} {"train_loss": -24.275524139404297, "global_step": 193497, "epoch": 2331} {"train_loss": -23.90506362915039, "global_step": 193498, "epoch": 2331} {"train_loss": -23.835783004760742, "global_step": 193499, "epoch": 2331} {"train_loss": -24.371854782104492, "global_step": 193500, "epoch": 2331} {"train_loss": -23.82002067565918, "global_step": 193501, "epoch": 2331} {"train_loss": -24.26869773864746, "global_step": 193502, "epoch": 2331} {"train_loss": -24.389127731323242, "global_step": 193503, "epoch": 2331} {"train_loss": -23.87347412109375, "global_step": 193504, "epoch": 2331} {"train_loss": -24.206069946289062, "global_step": 193505, "epoch": 2331} {"train_loss": -24.088409423828125, "global_step": 193506, "epoch": 2331} {"train_loss": -24.343107223510742, "global_step": 193507, "epoch": 2331} {"train_loss": -24.138423919677734, "global_step": 193508, "epoch": 2331} {"train_loss": -24.232139587402344, "global_step": 193509, "epoch": 2331} {"train_loss": -24.041051864624023, "global_step": 193510, "epoch": 2331} {"train_loss": -24.178131103515625, "global_step": 193511, "epoch": 2331} {"train_loss": -24.203847885131836, "global_step": 193512, "epoch": 2331} {"train_loss": -24.03977394104004, "global_step": 193513, "epoch": 2331} {"train_loss": -24.448434829711914, "global_step": 193514, "epoch": 2331} {"train_loss": -23.862701416015625, "global_step": 193515, "epoch": 2331} {"train_loss": -24.437891006469727, "global_step": 193516, "epoch": 2331} {"train_loss": -24.325641632080078, "global_step": 193517, "epoch": 2331} {"train_loss": -23.93558120727539, "global_step": 193518, "epoch": 2331} {"train_loss": -24.1533260345459, "global_step": 193519, "epoch": 2331} {"train_loss": -24.162874221801758, "global_step": 193520, "epoch": 2331} {"train_loss": -24.190570831298828, "global_step": 193521, "epoch": 2331} {"train_loss": -24.509506225585938, "global_step": 193522, "epoch": 2331} {"train_loss": -24.418556213378906, "global_step": 193523, "epoch": 2331} {"train_loss": -24.017833709716797, "global_step": 193524, "epoch": 2331} {"train_loss": -24.008134841918945, "global_step": 193525, "epoch": 2331} {"train_loss": -24.057025909423828, "global_step": 193526, "epoch": 2331} {"train_loss": -24.104034423828125, "global_step": 193527, "epoch": 2331} {"train_loss": -24.212507247924805, "global_step": 193528, "epoch": 2331} {"train_loss": -23.772253036499023, "global_step": 193529, "epoch": 2331} {"train_loss": -24.05510711669922, "global_step": 193530, "epoch": 2331} {"train_loss": -24.252920150756836, "global_step": 193531, "epoch": 2331} {"train_loss": -24.217771530151367, "global_step": 193532, "epoch": 2331} {"train_loss": -23.970062255859375, "global_step": 193533, "epoch": 2331} {"train_loss": -23.933639526367188, "global_step": 193534, "epoch": 2331} {"train_loss": -24.144813537597656, "global_step": 193535, "epoch": 2331} {"train_loss": -24.04720687866211, "global_step": 193536, "epoch": 2331} {"train_loss": -24.12989044189453, "global_step": 193537, "epoch": 2331} {"train_loss": -24.261255264282227, "global_step": 193538, "epoch": 2331} {"train_loss": -24.16361427307129, "global_step": 193539, "epoch": 2331} {"train_loss": -24.1458797454834, "global_step": 193540, "epoch": 2331} {"train_loss": -24.120630264282227, "global_step": 193541, "epoch": 2331} {"train_loss": -23.856689453125, "global_step": 193542, "epoch": 2331} {"train_loss": -24.060592651367188, "global_step": 193543, "epoch": 2331} {"train_loss": -23.959630966186523, "global_step": 193544, "epoch": 2331} {"train_loss": -23.981643676757812, "global_step": 193545, "epoch": 2331} {"train_loss": -24.00872802734375, "global_step": 193546, "epoch": 2331} {"train_loss": -24.053447723388672, "global_step": 193547, "epoch": 2331} {"train_loss": -23.80192756652832, "global_step": 193548, "epoch": 2331} {"train_loss": -24.196781158447266, "global_step": 193549, "epoch": 2331} {"train_loss": -24.29591178894043, "global_step": 193550, "epoch": 2331} {"train_loss": -24.090084075927734, "global_step": 193551, "epoch": 2331} {"train_loss": -24.265928268432617, "global_step": 193552, "epoch": 2331} {"train_loss": -24.137420654296875, "global_step": 193553, "epoch": 2331} {"train_loss": -24.13529396057129, "global_step": 193554, "epoch": 2331} {"train_loss": -24.042236236204584, "global_step": 193555, "epoch": 2331, "val_loss": 6651582.5} {"train_loss": -23.904722213745117, "global_step": 193556, "epoch": 2332} {"train_loss": -24.07765769958496, "global_step": 193557, "epoch": 2332} {"train_loss": -23.878225326538086, "global_step": 193558, "epoch": 2332} {"train_loss": -23.906421661376953, "global_step": 193559, "epoch": 2332} {"train_loss": -23.776823043823242, "global_step": 193560, "epoch": 2332} {"train_loss": -24.149606704711914, "global_step": 193561, "epoch": 2332} {"train_loss": -24.189178466796875, "global_step": 193562, "epoch": 2332} {"train_loss": -24.013111114501953, "global_step": 193563, "epoch": 2332} {"train_loss": -24.198644638061523, "global_step": 193564, "epoch": 2332} {"train_loss": -23.731382369995117, "global_step": 193565, "epoch": 2332} {"train_loss": -23.371265411376953, "global_step": 193566, "epoch": 2332} {"train_loss": -23.546457290649414, "global_step": 193567, "epoch": 2332} {"train_loss": -24.09130096435547, "global_step": 193568, "epoch": 2332} {"train_loss": -23.700172424316406, "global_step": 193569, "epoch": 2332} {"train_loss": -24.050329208374023, "global_step": 193570, "epoch": 2332} {"train_loss": -23.75553321838379, "global_step": 193571, "epoch": 2332} {"train_loss": -24.17989158630371, "global_step": 193572, "epoch": 2332} {"train_loss": -23.8968563079834, "global_step": 193573, "epoch": 2332} {"train_loss": -24.028427124023438, "global_step": 193574, "epoch": 2332} {"train_loss": -23.826658248901367, "global_step": 193575, "epoch": 2332} {"train_loss": -24.162921905517578, "global_step": 193576, "epoch": 2332} {"train_loss": -24.104352951049805, "global_step": 193577, "epoch": 2332} {"train_loss": -23.799707412719727, "global_step": 193578, "epoch": 2332} {"train_loss": -24.27118492126465, "global_step": 193579, "epoch": 2332} {"train_loss": -24.171152114868164, "global_step": 193580, "epoch": 2332} {"train_loss": -23.89183807373047, "global_step": 193581, "epoch": 2332} {"train_loss": -24.120758056640625, "global_step": 193582, "epoch": 2332} {"train_loss": -24.38961410522461, "global_step": 193583, "epoch": 2332} {"train_loss": -23.99838638305664, "global_step": 193584, "epoch": 2332} {"train_loss": -23.583791732788086, "global_step": 193585, "epoch": 2332} {"train_loss": -24.59507942199707, "global_step": 193586, "epoch": 2332} {"train_loss": -24.017637252807617, "global_step": 193587, "epoch": 2332} {"train_loss": -24.300113677978516, "global_step": 193588, "epoch": 2332} {"train_loss": -24.179576873779297, "global_step": 193589, "epoch": 2332} {"train_loss": -24.436670303344727, "global_step": 193590, "epoch": 2332} {"train_loss": -24.133411407470703, "global_step": 193591, "epoch": 2332} {"train_loss": -24.155189514160156, "global_step": 193592, "epoch": 2332} {"train_loss": -23.94854164123535, "global_step": 193593, "epoch": 2332} {"train_loss": -24.1064395904541, "global_step": 193594, "epoch": 2332} {"train_loss": -24.33466148376465, "global_step": 193595, "epoch": 2332} {"train_loss": -24.11574363708496, "global_step": 193596, "epoch": 2332} {"train_loss": -24.115930557250977, "global_step": 193597, "epoch": 2332} {"train_loss": -23.685440063476562, "global_step": 193598, "epoch": 2332} {"train_loss": -24.244518280029297, "global_step": 193599, "epoch": 2332} {"train_loss": -23.800321578979492, "global_step": 193600, "epoch": 2332} {"train_loss": -24.0120906829834, "global_step": 193601, "epoch": 2332} {"train_loss": -24.102798461914062, "global_step": 193602, "epoch": 2332} {"train_loss": -24.49262809753418, "global_step": 193603, "epoch": 2332} {"train_loss": -24.211652755737305, "global_step": 193604, "epoch": 2332} {"train_loss": -24.070348739624023, "global_step": 193605, "epoch": 2332} {"train_loss": -23.9509334564209, "global_step": 193606, "epoch": 2332} {"train_loss": -23.99775505065918, "global_step": 193607, "epoch": 2332} {"train_loss": -23.749229431152344, "global_step": 193608, "epoch": 2332} {"train_loss": -24.25977897644043, "global_step": 193609, "epoch": 2332} {"train_loss": -24.254194259643555, "global_step": 193610, "epoch": 2332} {"train_loss": -24.134546279907227, "global_step": 193611, "epoch": 2332} {"train_loss": -24.267419815063477, "global_step": 193612, "epoch": 2332} {"train_loss": -24.194486618041992, "global_step": 193613, "epoch": 2332} {"train_loss": -23.898483276367188, "global_step": 193614, "epoch": 2332} {"train_loss": -23.92024040222168, "global_step": 193615, "epoch": 2332} {"train_loss": -24.078580856323242, "global_step": 193616, "epoch": 2332} {"train_loss": -23.967594146728516, "global_step": 193617, "epoch": 2332} {"train_loss": -24.24001121520996, "global_step": 193618, "epoch": 2332} {"train_loss": -24.10883140563965, "global_step": 193619, "epoch": 2332} {"train_loss": -24.350048065185547, "global_step": 193620, "epoch": 2332} {"train_loss": -23.9921817779541, "global_step": 193621, "epoch": 2332} {"train_loss": -24.08698081970215, "global_step": 193622, "epoch": 2332} {"train_loss": -24.10931396484375, "global_step": 193623, "epoch": 2332} {"train_loss": -24.11191177368164, "global_step": 193624, "epoch": 2332} {"train_loss": -24.105512619018555, "global_step": 193625, "epoch": 2332} {"train_loss": -24.19870948791504, "global_step": 193626, "epoch": 2332} {"train_loss": -24.326221466064453, "global_step": 193627, "epoch": 2332} {"train_loss": -24.078903198242188, "global_step": 193628, "epoch": 2332} {"train_loss": -24.37052345275879, "global_step": 193629, "epoch": 2332} {"train_loss": -24.14931869506836, "global_step": 193630, "epoch": 2332} {"train_loss": -24.07871437072754, "global_step": 193631, "epoch": 2332} {"train_loss": -24.02996253967285, "global_step": 193632, "epoch": 2332} {"train_loss": -24.213850021362305, "global_step": 193633, "epoch": 2332} {"train_loss": -24.13946533203125, "global_step": 193634, "epoch": 2332} {"train_loss": -24.056106567382812, "global_step": 193635, "epoch": 2332} {"train_loss": -24.50606346130371, "global_step": 193636, "epoch": 2332} {"train_loss": -24.14703941345215, "global_step": 193637, "epoch": 2332} {"train_loss": -24.064831170691065, "global_step": 193638, "epoch": 2332, "val_loss": 6491365.0} {"train_loss": -22.593486785888672, "global_step": 193639, "epoch": 2333} {"train_loss": -23.216054916381836, "global_step": 193640, "epoch": 2333} {"train_loss": -23.6322021484375, "global_step": 193641, "epoch": 2333} {"train_loss": -22.911161422729492, "global_step": 193642, "epoch": 2333} {"train_loss": -23.790746688842773, "global_step": 193643, "epoch": 2333} {"train_loss": -23.833158493041992, "global_step": 193644, "epoch": 2333} {"train_loss": -23.58038330078125, "global_step": 193645, "epoch": 2333} {"train_loss": -23.597150802612305, "global_step": 193646, "epoch": 2333} {"train_loss": -23.63093376159668, "global_step": 193647, "epoch": 2333} {"train_loss": -24.282949447631836, "global_step": 193648, "epoch": 2333} {"train_loss": -23.24896240234375, "global_step": 193649, "epoch": 2333} {"train_loss": -23.9486026763916, "global_step": 193650, "epoch": 2333} {"train_loss": -23.608367919921875, "global_step": 193651, "epoch": 2333} {"train_loss": -23.409317016601562, "global_step": 193652, "epoch": 2333} {"train_loss": -23.88566017150879, "global_step": 193653, "epoch": 2333} {"train_loss": -24.047313690185547, "global_step": 193654, "epoch": 2333} {"train_loss": -23.95781898498535, "global_step": 193655, "epoch": 2333} {"train_loss": -23.872806549072266, "global_step": 193656, "epoch": 2333} {"train_loss": -23.91609001159668, "global_step": 193657, "epoch": 2333} {"train_loss": -24.030654907226562, "global_step": 193658, "epoch": 2333} {"train_loss": -24.056377410888672, "global_step": 193659, "epoch": 2333} {"train_loss": -24.2207088470459, "global_step": 193660, "epoch": 2333} {"train_loss": -23.93303871154785, "global_step": 193661, "epoch": 2333} {"train_loss": -24.291715621948242, "global_step": 193662, "epoch": 2333} {"train_loss": -24.05751609802246, "global_step": 193663, "epoch": 2333} {"train_loss": -23.863849639892578, "global_step": 193664, "epoch": 2333} {"train_loss": -23.841995239257812, "global_step": 193665, "epoch": 2333} {"train_loss": -23.929508209228516, "global_step": 193666, "epoch": 2333} {"train_loss": -24.049962997436523, "global_step": 193667, "epoch": 2333} {"train_loss": -24.294279098510742, "global_step": 193668, "epoch": 2333} {"train_loss": -23.942615509033203, "global_step": 193669, "epoch": 2333} {"train_loss": -24.38478660583496, "global_step": 193670, "epoch": 2333} {"train_loss": -24.14650535583496, "global_step": 193671, "epoch": 2333} {"train_loss": -24.27362632751465, "global_step": 193672, "epoch": 2333} {"train_loss": -24.05434226989746, "global_step": 193673, "epoch": 2333} {"train_loss": -24.37619972229004, "global_step": 193674, "epoch": 2333} {"train_loss": -24.167123794555664, "global_step": 193675, "epoch": 2333} {"train_loss": -24.15692710876465, "global_step": 193676, "epoch": 2333} {"train_loss": -24.05462074279785, "global_step": 193677, "epoch": 2333} {"train_loss": -24.218061447143555, "global_step": 193678, "epoch": 2333} {"train_loss": -24.35857582092285, "global_step": 193679, "epoch": 2333} {"train_loss": -23.904714584350586, "global_step": 193680, "epoch": 2333} {"train_loss": -24.30304527282715, "global_step": 193681, "epoch": 2333} {"train_loss": -24.06572914123535, "global_step": 193682, "epoch": 2333} {"train_loss": -23.9586238861084, "global_step": 193683, "epoch": 2333} {"train_loss": -24.424285888671875, "global_step": 193684, "epoch": 2333} {"train_loss": -23.917818069458008, "global_step": 193685, "epoch": 2333} {"train_loss": -24.057058334350586, "global_step": 193686, "epoch": 2333} {"train_loss": -24.244144439697266, "global_step": 193687, "epoch": 2333} {"train_loss": -24.15423583984375, "global_step": 193688, "epoch": 2333} {"train_loss": -24.15506935119629, "global_step": 193689, "epoch": 2333} {"train_loss": -24.053239822387695, "global_step": 193690, "epoch": 2333} {"train_loss": -24.411855697631836, "global_step": 193691, "epoch": 2333} {"train_loss": -23.813148498535156, "global_step": 193692, "epoch": 2333} {"train_loss": -23.776037216186523, "global_step": 193693, "epoch": 2333} {"train_loss": -23.9472713470459, "global_step": 193694, "epoch": 2333} {"train_loss": -24.394994735717773, "global_step": 193695, "epoch": 2333} {"train_loss": -24.353729248046875, "global_step": 193696, "epoch": 2333} {"train_loss": -24.450849533081055, "global_step": 193697, "epoch": 2333} {"train_loss": -24.235897064208984, "global_step": 193698, "epoch": 2333} {"train_loss": -24.259231567382812, "global_step": 193699, "epoch": 2333} {"train_loss": -24.249420166015625, "global_step": 193700, "epoch": 2333} {"train_loss": -24.27716827392578, "global_step": 193701, "epoch": 2333} {"train_loss": -24.078121185302734, "global_step": 193702, "epoch": 2333} {"train_loss": -24.008556365966797, "global_step": 193703, "epoch": 2333} {"train_loss": -24.26759147644043, "global_step": 193704, "epoch": 2333} {"train_loss": -24.185029983520508, "global_step": 193705, "epoch": 2333} {"train_loss": -24.10371971130371, "global_step": 193706, "epoch": 2333} {"train_loss": -24.160676956176758, "global_step": 193707, "epoch": 2333} {"train_loss": -24.080432891845703, "global_step": 193708, "epoch": 2333} {"train_loss": -24.124692916870117, "global_step": 193709, "epoch": 2333} {"train_loss": -24.58635711669922, "global_step": 193710, "epoch": 2333} {"train_loss": -24.18427848815918, "global_step": 193711, "epoch": 2333} {"train_loss": -24.535459518432617, "global_step": 193712, "epoch": 2333} {"train_loss": -24.143125534057617, "global_step": 193713, "epoch": 2333} {"train_loss": -24.342304229736328, "global_step": 193714, "epoch": 2333} {"train_loss": -24.036762237548828, "global_step": 193715, "epoch": 2333} {"train_loss": -24.437271118164062, "global_step": 193716, "epoch": 2333} {"train_loss": -24.207298278808594, "global_step": 193717, "epoch": 2333} {"train_loss": -24.18719482421875, "global_step": 193718, "epoch": 2333} {"train_loss": -23.898832321166992, "global_step": 193719, "epoch": 2333} {"train_loss": -24.145376205444336, "global_step": 193720, "epoch": 2333} {"train_loss": -24.02033445059535, "global_step": 193721, "epoch": 2333, "val_loss": 6412633.5} {"train_loss": -23.812406539916992, "global_step": 193722, "epoch": 2334} {"train_loss": -23.6505126953125, "global_step": 193723, "epoch": 2334} {"train_loss": -23.79593276977539, "global_step": 193724, "epoch": 2334} {"train_loss": -23.63338279724121, "global_step": 193725, "epoch": 2334} {"train_loss": -23.943655014038086, "global_step": 193726, "epoch": 2334} {"train_loss": -23.778600692749023, "global_step": 193727, "epoch": 2334} {"train_loss": -23.45512580871582, "global_step": 193728, "epoch": 2334} {"train_loss": -23.403675079345703, "global_step": 193729, "epoch": 2334} {"train_loss": -23.642948150634766, "global_step": 193730, "epoch": 2334} {"train_loss": -23.554763793945312, "global_step": 193731, "epoch": 2334} {"train_loss": -23.997726440429688, "global_step": 193732, "epoch": 2334} {"train_loss": -23.955198287963867, "global_step": 193733, "epoch": 2334} {"train_loss": -24.39365005493164, "global_step": 193734, "epoch": 2334} {"train_loss": -24.132347106933594, "global_step": 193735, "epoch": 2334} {"train_loss": -23.925745010375977, "global_step": 193736, "epoch": 2334} {"train_loss": -23.919677734375, "global_step": 193737, "epoch": 2334} {"train_loss": -23.87643814086914, "global_step": 193738, "epoch": 2334} {"train_loss": -24.324249267578125, "global_step": 193739, "epoch": 2334} {"train_loss": -23.768159866333008, "global_step": 193740, "epoch": 2334} {"train_loss": -24.088403701782227, "global_step": 193741, "epoch": 2334} {"train_loss": -24.176084518432617, "global_step": 193742, "epoch": 2334} {"train_loss": -23.514728546142578, "global_step": 193743, "epoch": 2334} {"train_loss": -24.273420333862305, "global_step": 193744, "epoch": 2334} {"train_loss": -23.898487091064453, "global_step": 193745, "epoch": 2334} {"train_loss": -23.896533966064453, "global_step": 193746, "epoch": 2334} {"train_loss": -24.074460983276367, "global_step": 193747, "epoch": 2334} {"train_loss": -23.969301223754883, "global_step": 193748, "epoch": 2334} {"train_loss": -24.043949127197266, "global_step": 193749, "epoch": 2334} {"train_loss": -24.00489616394043, "global_step": 193750, "epoch": 2334} {"train_loss": -23.867549896240234, "global_step": 193751, "epoch": 2334} {"train_loss": -23.86729621887207, "global_step": 193752, "epoch": 2334} {"train_loss": -23.84413719177246, "global_step": 193753, "epoch": 2334} {"train_loss": -24.25551414489746, "global_step": 193754, "epoch": 2334} {"train_loss": -24.394861221313477, "global_step": 193755, "epoch": 2334} {"train_loss": -24.475807189941406, "global_step": 193756, "epoch": 2334} {"train_loss": -24.208837509155273, "global_step": 193757, "epoch": 2334} {"train_loss": -24.25685691833496, "global_step": 193758, "epoch": 2334} {"train_loss": -24.32286834716797, "global_step": 193759, "epoch": 2334} {"train_loss": -24.289953231811523, "global_step": 193760, "epoch": 2334} {"train_loss": -24.011350631713867, "global_step": 193761, "epoch": 2334} {"train_loss": -24.144872665405273, "global_step": 193762, "epoch": 2334} {"train_loss": -24.13041114807129, "global_step": 193763, "epoch": 2334} {"train_loss": -24.56216812133789, "global_step": 193764, "epoch": 2334} {"train_loss": -24.264863967895508, "global_step": 193765, "epoch": 2334} {"train_loss": -24.05293083190918, "global_step": 193766, "epoch": 2334} {"train_loss": -24.152830123901367, "global_step": 193767, "epoch": 2334} {"train_loss": -24.23468017578125, "global_step": 193768, "epoch": 2334} {"train_loss": -24.10417938232422, "global_step": 193769, "epoch": 2334} {"train_loss": -23.73909568786621, "global_step": 193770, "epoch": 2334} {"train_loss": -24.014265060424805, "global_step": 193771, "epoch": 2334} {"train_loss": -24.425840377807617, "global_step": 193772, "epoch": 2334} {"train_loss": -24.238937377929688, "global_step": 193773, "epoch": 2334} {"train_loss": -24.355009078979492, "global_step": 193774, "epoch": 2334} {"train_loss": -23.68778419494629, "global_step": 193775, "epoch": 2334} {"train_loss": -24.200571060180664, "global_step": 193776, "epoch": 2334} {"train_loss": -24.201757431030273, "global_step": 193777, "epoch": 2334} {"train_loss": -24.253541946411133, "global_step": 193778, "epoch": 2334} {"train_loss": -24.00090980529785, "global_step": 193779, "epoch": 2334} {"train_loss": -24.289653778076172, "global_step": 193780, "epoch": 2334} {"train_loss": -24.0769100189209, "global_step": 193781, "epoch": 2334} {"train_loss": -24.072111129760742, "global_step": 193782, "epoch": 2334} {"train_loss": -24.504270553588867, "global_step": 193783, "epoch": 2334} {"train_loss": -24.25034523010254, "global_step": 193784, "epoch": 2334} {"train_loss": -24.482437133789062, "global_step": 193785, "epoch": 2334} {"train_loss": -24.131092071533203, "global_step": 193786, "epoch": 2334} {"train_loss": -24.466550827026367, "global_step": 193787, "epoch": 2334} {"train_loss": -24.401819229125977, "global_step": 193788, "epoch": 2334} {"train_loss": -24.062223434448242, "global_step": 193789, "epoch": 2334} {"train_loss": -24.37183952331543, "global_step": 193790, "epoch": 2334} {"train_loss": -24.067123413085938, "global_step": 193791, "epoch": 2334} {"train_loss": -24.18046760559082, "global_step": 193792, "epoch": 2334} {"train_loss": -24.259193420410156, "global_step": 193793, "epoch": 2334} {"train_loss": -24.027868270874023, "global_step": 193794, "epoch": 2334} {"train_loss": -23.9996395111084, "global_step": 193795, "epoch": 2334} {"train_loss": -24.545278549194336, "global_step": 193796, "epoch": 2334} {"train_loss": -23.97787857055664, "global_step": 193797, "epoch": 2334} {"train_loss": -24.238037109375, "global_step": 193798, "epoch": 2334} {"train_loss": -24.47908592224121, "global_step": 193799, "epoch": 2334} {"train_loss": -24.058364868164062, "global_step": 193800, "epoch": 2334} {"train_loss": -24.45768165588379, "global_step": 193801, "epoch": 2334} {"train_loss": -24.32891273498535, "global_step": 193802, "epoch": 2334} {"train_loss": -24.197751998901367, "global_step": 193803, "epoch": 2334} {"train_loss": -24.08719276520143, "global_step": 193804, "epoch": 2334, "val_loss": 6441992.5} {"train_loss": -23.605417251586914, "global_step": 193805, "epoch": 2335} {"train_loss": -22.37302017211914, "global_step": 193806, "epoch": 2335} {"train_loss": -21.555953979492188, "global_step": 193807, "epoch": 2335} {"train_loss": -23.086286544799805, "global_step": 193808, "epoch": 2335} {"train_loss": -22.9731502532959, "global_step": 193809, "epoch": 2335} {"train_loss": -23.345489501953125, "global_step": 193810, "epoch": 2335} {"train_loss": -23.184797286987305, "global_step": 193811, "epoch": 2335} {"train_loss": -22.972537994384766, "global_step": 193812, "epoch": 2335} {"train_loss": -23.70503807067871, "global_step": 193813, "epoch": 2335} {"train_loss": -23.039297103881836, "global_step": 193814, "epoch": 2335} {"train_loss": -23.5406551361084, "global_step": 193815, "epoch": 2335} {"train_loss": -23.20331573486328, "global_step": 193816, "epoch": 2335} {"train_loss": -23.133405685424805, "global_step": 193817, "epoch": 2335} {"train_loss": -23.749914169311523, "global_step": 193818, "epoch": 2335} {"train_loss": -23.638465881347656, "global_step": 193819, "epoch": 2335} {"train_loss": -23.263776779174805, "global_step": 193820, "epoch": 2335} {"train_loss": -23.78885269165039, "global_step": 193821, "epoch": 2335} {"train_loss": -23.55609130859375, "global_step": 193822, "epoch": 2335} {"train_loss": -23.608379364013672, "global_step": 193823, "epoch": 2335} {"train_loss": -23.495315551757812, "global_step": 193824, "epoch": 2335} {"train_loss": -23.6662654876709, "global_step": 193825, "epoch": 2335} {"train_loss": -23.645299911499023, "global_step": 193826, "epoch": 2335} {"train_loss": -23.891324996948242, "global_step": 193827, "epoch": 2335} {"train_loss": -23.88905906677246, "global_step": 193828, "epoch": 2335} {"train_loss": -23.7988338470459, "global_step": 193829, "epoch": 2335} {"train_loss": -23.480693817138672, "global_step": 193830, "epoch": 2335} {"train_loss": -23.265100479125977, "global_step": 193831, "epoch": 2335} {"train_loss": -24.268478393554688, "global_step": 193832, "epoch": 2335} {"train_loss": -24.030548095703125, "global_step": 193833, "epoch": 2335} {"train_loss": -24.061355590820312, "global_step": 193834, "epoch": 2335} {"train_loss": -23.530466079711914, "global_step": 193835, "epoch": 2335} {"train_loss": -23.966171264648438, "global_step": 193836, "epoch": 2335} {"train_loss": -23.7341251373291, "global_step": 193837, "epoch": 2335} {"train_loss": -24.03931999206543, "global_step": 193838, "epoch": 2335} {"train_loss": -23.95475196838379, "global_step": 193839, "epoch": 2335} {"train_loss": -24.219236373901367, "global_step": 193840, "epoch": 2335} {"train_loss": -24.328182220458984, "global_step": 193841, "epoch": 2335} {"train_loss": -24.1126708984375, "global_step": 193842, "epoch": 2335} {"train_loss": -23.8941707611084, "global_step": 193843, "epoch": 2335} {"train_loss": -23.90674591064453, "global_step": 193844, "epoch": 2335} {"train_loss": -24.347166061401367, "global_step": 193845, "epoch": 2335} {"train_loss": -23.9725341796875, "global_step": 193846, "epoch": 2335} {"train_loss": -23.731124877929688, "global_step": 193847, "epoch": 2335} {"train_loss": -23.947378158569336, "global_step": 193848, "epoch": 2335} {"train_loss": -24.2618350982666, "global_step": 193849, "epoch": 2335} {"train_loss": -24.252304077148438, "global_step": 193850, "epoch": 2335} {"train_loss": -24.29582405090332, "global_step": 193851, "epoch": 2335} {"train_loss": -23.884735107421875, "global_step": 193852, "epoch": 2335} {"train_loss": -24.214481353759766, "global_step": 193853, "epoch": 2335} {"train_loss": -24.109983444213867, "global_step": 193854, "epoch": 2335} {"train_loss": -24.124120712280273, "global_step": 193855, "epoch": 2335} {"train_loss": -24.434925079345703, "global_step": 193856, "epoch": 2335} {"train_loss": -24.241958618164062, "global_step": 193857, "epoch": 2335} {"train_loss": -24.14354133605957, "global_step": 193858, "epoch": 2335} {"train_loss": -24.077665328979492, "global_step": 193859, "epoch": 2335} {"train_loss": -24.48355484008789, "global_step": 193860, "epoch": 2335} {"train_loss": -24.027570724487305, "global_step": 193861, "epoch": 2335} {"train_loss": -24.10739517211914, "global_step": 193862, "epoch": 2335} {"train_loss": -24.083114624023438, "global_step": 193863, "epoch": 2335} {"train_loss": -24.187135696411133, "global_step": 193864, "epoch": 2335} {"train_loss": -24.1147518157959, "global_step": 193865, "epoch": 2335} {"train_loss": -24.462738037109375, "global_step": 193866, "epoch": 2335} {"train_loss": -24.139190673828125, "global_step": 193867, "epoch": 2335} {"train_loss": -24.35358238220215, "global_step": 193868, "epoch": 2335} {"train_loss": -24.076147079467773, "global_step": 193869, "epoch": 2335} {"train_loss": -24.650625228881836, "global_step": 193870, "epoch": 2335} {"train_loss": -24.06079864501953, "global_step": 193871, "epoch": 2335} {"train_loss": -24.488847732543945, "global_step": 193872, "epoch": 2335} {"train_loss": -24.1340274810791, "global_step": 193873, "epoch": 2335} {"train_loss": -24.3223934173584, "global_step": 193874, "epoch": 2335} {"train_loss": -24.53645896911621, "global_step": 193875, "epoch": 2335} {"train_loss": -24.22023582458496, "global_step": 193876, "epoch": 2335} {"train_loss": -23.9352970123291, "global_step": 193877, "epoch": 2335} {"train_loss": -24.662240982055664, "global_step": 193878, "epoch": 2335} {"train_loss": -24.146757125854492, "global_step": 193879, "epoch": 2335} {"train_loss": -24.163034439086914, "global_step": 193880, "epoch": 2335} {"train_loss": -23.94607925415039, "global_step": 193881, "epoch": 2335} {"train_loss": -24.4051513671875, "global_step": 193882, "epoch": 2335} {"train_loss": -24.5805721282959, "global_step": 193883, "epoch": 2335} {"train_loss": -24.18491554260254, "global_step": 193884, "epoch": 2335} {"train_loss": -23.962656021118164, "global_step": 193885, "epoch": 2335} {"train_loss": -24.424057006835938, "global_step": 193886, "epoch": 2335} {"train_loss": -23.91596559731357, "global_step": 193887, "epoch": 2335, "val_loss": 6572910.5} {"train_loss": -22.189970016479492, "global_step": 193888, "epoch": 2336} {"train_loss": -22.6416072845459, "global_step": 193889, "epoch": 2336} {"train_loss": -23.179088592529297, "global_step": 193890, "epoch": 2336} {"train_loss": -23.326704025268555, "global_step": 193891, "epoch": 2336} {"train_loss": -23.19746971130371, "global_step": 193892, "epoch": 2336} {"train_loss": -23.750404357910156, "global_step": 193893, "epoch": 2336} {"train_loss": -23.358993530273438, "global_step": 193894, "epoch": 2336} {"train_loss": -23.101076126098633, "global_step": 193895, "epoch": 2336} {"train_loss": -23.34883689880371, "global_step": 193896, "epoch": 2336} {"train_loss": -23.780681610107422, "global_step": 193897, "epoch": 2336} {"train_loss": -23.55189323425293, "global_step": 193898, "epoch": 2336} {"train_loss": -23.596460342407227, "global_step": 193899, "epoch": 2336} {"train_loss": -23.613252639770508, "global_step": 193900, "epoch": 2336} {"train_loss": -23.414798736572266, "global_step": 193901, "epoch": 2336} {"train_loss": -23.538419723510742, "global_step": 193902, "epoch": 2336} {"train_loss": -23.52164649963379, "global_step": 193903, "epoch": 2336} {"train_loss": -23.613386154174805, "global_step": 193904, "epoch": 2336} {"train_loss": -23.718769073486328, "global_step": 193905, "epoch": 2336} {"train_loss": -23.964372634887695, "global_step": 193906, "epoch": 2336} {"train_loss": -23.806564331054688, "global_step": 193907, "epoch": 2336} {"train_loss": -23.592992782592773, "global_step": 193908, "epoch": 2336} {"train_loss": -23.5511474609375, "global_step": 193909, "epoch": 2336} {"train_loss": -23.779129028320312, "global_step": 193910, "epoch": 2336} {"train_loss": -23.90384292602539, "global_step": 193911, "epoch": 2336} {"train_loss": -24.025924682617188, "global_step": 193912, "epoch": 2336} {"train_loss": -23.762258529663086, "global_step": 193913, "epoch": 2336} {"train_loss": -24.011354446411133, "global_step": 193914, "epoch": 2336} {"train_loss": -24.03255271911621, "global_step": 193915, "epoch": 2336} {"train_loss": -24.266206741333008, "global_step": 193916, "epoch": 2336} {"train_loss": -24.17188262939453, "global_step": 193917, "epoch": 2336} {"train_loss": -24.1212158203125, "global_step": 193918, "epoch": 2336} {"train_loss": -24.28915786743164, "global_step": 193919, "epoch": 2336} {"train_loss": -24.22061538696289, "global_step": 193920, "epoch": 2336} {"train_loss": -24.00913429260254, "global_step": 193921, "epoch": 2336} {"train_loss": -24.15498161315918, "global_step": 193922, "epoch": 2336} {"train_loss": -24.363929748535156, "global_step": 193923, "epoch": 2336} {"train_loss": -24.000600814819336, "global_step": 193924, "epoch": 2336} {"train_loss": -24.372724533081055, "global_step": 193925, "epoch": 2336} {"train_loss": -24.15104103088379, "global_step": 193926, "epoch": 2336} {"train_loss": -24.110811233520508, "global_step": 193927, "epoch": 2336} {"train_loss": -24.484848022460938, "global_step": 193928, "epoch": 2336} {"train_loss": -24.4175968170166, "global_step": 193929, "epoch": 2336} {"train_loss": -24.184499740600586, "global_step": 193930, "epoch": 2336} {"train_loss": -24.135456085205078, "global_step": 193931, "epoch": 2336} {"train_loss": -23.821088790893555, "global_step": 193932, "epoch": 2336} {"train_loss": -23.908185958862305, "global_step": 193933, "epoch": 2336} {"train_loss": -24.28265380859375, "global_step": 193934, "epoch": 2336} {"train_loss": -24.302379608154297, "global_step": 193935, "epoch": 2336} {"train_loss": -23.97352409362793, "global_step": 193936, "epoch": 2336} {"train_loss": -24.306011199951172, "global_step": 193937, "epoch": 2336} {"train_loss": -23.979711532592773, "global_step": 193938, "epoch": 2336} {"train_loss": -24.287723541259766, "global_step": 193939, "epoch": 2336} {"train_loss": -24.377017974853516, "global_step": 193940, "epoch": 2336} {"train_loss": -24.544811248779297, "global_step": 193941, "epoch": 2336} {"train_loss": -24.163406372070312, "global_step": 193942, "epoch": 2336} {"train_loss": -24.259693145751953, "global_step": 193943, "epoch": 2336} {"train_loss": -23.982341766357422, "global_step": 193944, "epoch": 2336} {"train_loss": -24.537443161010742, "global_step": 193945, "epoch": 2336} {"train_loss": -24.353281021118164, "global_step": 193946, "epoch": 2336} {"train_loss": -24.211313247680664, "global_step": 193947, "epoch": 2336} {"train_loss": -24.373416900634766, "global_step": 193948, "epoch": 2336} {"train_loss": -24.341876983642578, "global_step": 193949, "epoch": 2336} {"train_loss": -23.990873336791992, "global_step": 193950, "epoch": 2336} {"train_loss": -24.320032119750977, "global_step": 193951, "epoch": 2336} {"train_loss": -24.563308715820312, "global_step": 193952, "epoch": 2336} {"train_loss": -24.503467559814453, "global_step": 193953, "epoch": 2336} {"train_loss": -24.3214111328125, "global_step": 193954, "epoch": 2336} {"train_loss": -24.54245948791504, "global_step": 193955, "epoch": 2336} {"train_loss": -24.274150848388672, "global_step": 193956, "epoch": 2336} {"train_loss": -24.474294662475586, "global_step": 193957, "epoch": 2336} {"train_loss": -24.33445167541504, "global_step": 193958, "epoch": 2336} {"train_loss": -24.12369728088379, "global_step": 193959, "epoch": 2336} {"train_loss": -24.78732681274414, "global_step": 193960, "epoch": 2336} {"train_loss": -24.28891944885254, "global_step": 193961, "epoch": 2336} {"train_loss": -24.299341201782227, "global_step": 193962, "epoch": 2336} {"train_loss": -24.406478881835938, "global_step": 193963, "epoch": 2336} {"train_loss": -24.144689559936523, "global_step": 193964, "epoch": 2336} {"train_loss": -24.450979232788086, "global_step": 193965, "epoch": 2336} {"train_loss": -24.388545989990234, "global_step": 193966, "epoch": 2336} {"train_loss": -24.38289451599121, "global_step": 193967, "epoch": 2336} {"train_loss": -24.004837036132812, "global_step": 193968, "epoch": 2336} {"train_loss": -24.379135131835938, "global_step": 193969, "epoch": 2336} {"train_loss": -24.02504780780838, "global_step": 193970, "epoch": 2336, "val_loss": 6575668.0} {"train_loss": -24.3737735748291, "global_step": 193971, "epoch": 2337} {"train_loss": -23.32056999206543, "global_step": 193972, "epoch": 2337} {"train_loss": -21.95965576171875, "global_step": 193973, "epoch": 2337} {"train_loss": -21.790327072143555, "global_step": 193974, "epoch": 2337} {"train_loss": -23.18537712097168, "global_step": 193975, "epoch": 2337} {"train_loss": -23.088706970214844, "global_step": 193976, "epoch": 2337} {"train_loss": -23.39629554748535, "global_step": 193977, "epoch": 2337} {"train_loss": -23.205251693725586, "global_step": 193978, "epoch": 2337} {"train_loss": -23.245040893554688, "global_step": 193979, "epoch": 2337} {"train_loss": -23.748441696166992, "global_step": 193980, "epoch": 2337} {"train_loss": -23.049102783203125, "global_step": 193981, "epoch": 2337} {"train_loss": -23.279958724975586, "global_step": 193982, "epoch": 2337} {"train_loss": -23.694171905517578, "global_step": 193983, "epoch": 2337} {"train_loss": -23.575468063354492, "global_step": 193984, "epoch": 2337} {"train_loss": -23.40131950378418, "global_step": 193985, "epoch": 2337} {"train_loss": -23.67899513244629, "global_step": 193986, "epoch": 2337} {"train_loss": -23.59259033203125, "global_step": 193987, "epoch": 2337} {"train_loss": -23.662763595581055, "global_step": 193988, "epoch": 2337} {"train_loss": -23.90337371826172, "global_step": 193989, "epoch": 2337} {"train_loss": -23.948471069335938, "global_step": 193990, "epoch": 2337} {"train_loss": -23.59918212890625, "global_step": 193991, "epoch": 2337} {"train_loss": -24.082910537719727, "global_step": 193992, "epoch": 2337} {"train_loss": -23.799589157104492, "global_step": 193993, "epoch": 2337} {"train_loss": -23.847087860107422, "global_step": 193994, "epoch": 2337} {"train_loss": -23.986648559570312, "global_step": 193995, "epoch": 2337} {"train_loss": -23.851547241210938, "global_step": 193996, "epoch": 2337} {"train_loss": -24.071731567382812, "global_step": 193997, "epoch": 2337} {"train_loss": -23.885480880737305, "global_step": 193998, "epoch": 2337} {"train_loss": -24.08803367614746, "global_step": 193999, "epoch": 2337} {"train_loss": -23.90817642211914, "global_step": 194000, "epoch": 2337} {"train_loss": -24.323139190673828, "global_step": 194001, "epoch": 2337} {"train_loss": -23.948963165283203, "global_step": 194002, "epoch": 2337} {"train_loss": -23.76919937133789, "global_step": 194003, "epoch": 2337} {"train_loss": -24.115455627441406, "global_step": 194004, "epoch": 2337} {"train_loss": -23.782730102539062, "global_step": 194005, "epoch": 2337} {"train_loss": -24.354476928710938, "global_step": 194006, "epoch": 2337} {"train_loss": -23.853384017944336, "global_step": 194007, "epoch": 2337} {"train_loss": -24.18439292907715, "global_step": 194008, "epoch": 2337} {"train_loss": -24.0466251373291, "global_step": 194009, "epoch": 2337} {"train_loss": -24.221975326538086, "global_step": 194010, "epoch": 2337} {"train_loss": -24.52680015563965, "global_step": 194011, "epoch": 2337} {"train_loss": -24.24027442932129, "global_step": 194012, "epoch": 2337} {"train_loss": -23.8770694732666, "global_step": 194013, "epoch": 2337} {"train_loss": -24.414081573486328, "global_step": 194014, "epoch": 2337} {"train_loss": -24.327245712280273, "global_step": 194015, "epoch": 2337} {"train_loss": -24.054182052612305, "global_step": 194016, "epoch": 2337} {"train_loss": -24.293787002563477, "global_step": 194017, "epoch": 2337} {"train_loss": -24.393842697143555, "global_step": 194018, "epoch": 2337} {"train_loss": -24.444135665893555, "global_step": 194019, "epoch": 2337} {"train_loss": -24.05466651916504, "global_step": 194020, "epoch": 2337} {"train_loss": -24.365833282470703, "global_step": 194021, "epoch": 2337} {"train_loss": -24.07050895690918, "global_step": 194022, "epoch": 2337} {"train_loss": -24.571640014648438, "global_step": 194023, "epoch": 2337} {"train_loss": -24.14944076538086, "global_step": 194024, "epoch": 2337} {"train_loss": -24.12392234802246, "global_step": 194025, "epoch": 2337} {"train_loss": -24.402565002441406, "global_step": 194026, "epoch": 2337} {"train_loss": -24.080739974975586, "global_step": 194027, "epoch": 2337} {"train_loss": -23.896953582763672, "global_step": 194028, "epoch": 2337} {"train_loss": -24.110088348388672, "global_step": 194029, "epoch": 2337} {"train_loss": -24.314809799194336, "global_step": 194030, "epoch": 2337} {"train_loss": -23.778308868408203, "global_step": 194031, "epoch": 2337} {"train_loss": -24.013826370239258, "global_step": 194032, "epoch": 2337} {"train_loss": -24.19782066345215, "global_step": 194033, "epoch": 2337} {"train_loss": -24.163671493530273, "global_step": 194034, "epoch": 2337} {"train_loss": -24.103525161743164, "global_step": 194035, "epoch": 2337} {"train_loss": -23.88079071044922, "global_step": 194036, "epoch": 2337} {"train_loss": -24.346878051757812, "global_step": 194037, "epoch": 2337} {"train_loss": -24.117029190063477, "global_step": 194038, "epoch": 2337} {"train_loss": -24.234655380249023, "global_step": 194039, "epoch": 2337} {"train_loss": -24.143726348876953, "global_step": 194040, "epoch": 2337} {"train_loss": -23.789209365844727, "global_step": 194041, "epoch": 2337} {"train_loss": -24.193099975585938, "global_step": 194042, "epoch": 2337} {"train_loss": -23.938432693481445, "global_step": 194043, "epoch": 2337} {"train_loss": -24.198888778686523, "global_step": 194044, "epoch": 2337} {"train_loss": -24.25736427307129, "global_step": 194045, "epoch": 2337} {"train_loss": -24.249053955078125, "global_step": 194046, "epoch": 2337} {"train_loss": -24.174230575561523, "global_step": 194047, "epoch": 2337} {"train_loss": -24.273862838745117, "global_step": 194048, "epoch": 2337} {"train_loss": -24.346208572387695, "global_step": 194049, "epoch": 2337} {"train_loss": -23.757551193237305, "global_step": 194050, "epoch": 2337} {"train_loss": -23.798246383666992, "global_step": 194051, "epoch": 2337} {"train_loss": -24.126188278198242, "global_step": 194052, "epoch": 2337} {"train_loss": -23.925717204450123, "global_step": 194053, "epoch": 2337, "val_loss": 6570282.0} {"train_loss": -23.740711212158203, "global_step": 194054, "epoch": 2338} {"train_loss": -23.636754989624023, "global_step": 194055, "epoch": 2338} {"train_loss": -23.86654281616211, "global_step": 194056, "epoch": 2338} {"train_loss": -23.829010009765625, "global_step": 194057, "epoch": 2338} {"train_loss": -24.207334518432617, "global_step": 194058, "epoch": 2338} {"train_loss": -23.97657585144043, "global_step": 194059, "epoch": 2338} {"train_loss": -24.195859909057617, "global_step": 194060, "epoch": 2338} {"train_loss": -24.039236068725586, "global_step": 194061, "epoch": 2338} {"train_loss": -23.836084365844727, "global_step": 194062, "epoch": 2338} {"train_loss": -24.06154441833496, "global_step": 194063, "epoch": 2338} {"train_loss": -24.078393936157227, "global_step": 194064, "epoch": 2338} {"train_loss": -24.250797271728516, "global_step": 194065, "epoch": 2338} {"train_loss": -24.0814208984375, "global_step": 194066, "epoch": 2338} {"train_loss": -24.162216186523438, "global_step": 194067, "epoch": 2338} {"train_loss": -24.270048141479492, "global_step": 194068, "epoch": 2338} {"train_loss": -23.983810424804688, "global_step": 194069, "epoch": 2338} {"train_loss": -24.253921508789062, "global_step": 194070, "epoch": 2338} {"train_loss": -23.671003341674805, "global_step": 194071, "epoch": 2338} {"train_loss": -24.305255889892578, "global_step": 194072, "epoch": 2338} {"train_loss": -24.5317325592041, "global_step": 194073, "epoch": 2338} {"train_loss": -24.336503982543945, "global_step": 194074, "epoch": 2338} {"train_loss": -24.102928161621094, "global_step": 194075, "epoch": 2338} {"train_loss": -24.0550594329834, "global_step": 194076, "epoch": 2338} {"train_loss": -24.253589630126953, "global_step": 194077, "epoch": 2338} {"train_loss": -24.168710708618164, "global_step": 194078, "epoch": 2338} {"train_loss": -23.993988037109375, "global_step": 194079, "epoch": 2338} {"train_loss": -24.046615600585938, "global_step": 194080, "epoch": 2338} {"train_loss": -24.546140670776367, "global_step": 194081, "epoch": 2338} {"train_loss": -23.926809310913086, "global_step": 194082, "epoch": 2338} {"train_loss": -24.119844436645508, "global_step": 194083, "epoch": 2338} {"train_loss": -23.847936630249023, "global_step": 194084, "epoch": 2338} {"train_loss": -24.315319061279297, "global_step": 194085, "epoch": 2338} {"train_loss": -24.0618896484375, "global_step": 194086, "epoch": 2338} {"train_loss": -24.17154884338379, "global_step": 194087, "epoch": 2338} {"train_loss": -24.40611457824707, "global_step": 194088, "epoch": 2338} {"train_loss": -24.190353393554688, "global_step": 194089, "epoch": 2338} {"train_loss": -24.272642135620117, "global_step": 194090, "epoch": 2338} {"train_loss": -24.44281768798828, "global_step": 194091, "epoch": 2338} {"train_loss": -24.664020538330078, "global_step": 194092, "epoch": 2338} {"train_loss": -23.956815719604492, "global_step": 194093, "epoch": 2338} {"train_loss": -24.259174346923828, "global_step": 194094, "epoch": 2338} {"train_loss": -24.310684204101562, "global_step": 194095, "epoch": 2338} {"train_loss": -23.936452865600586, "global_step": 194096, "epoch": 2338} {"train_loss": -24.2498779296875, "global_step": 194097, "epoch": 2338} {"train_loss": -24.056812286376953, "global_step": 194098, "epoch": 2338} {"train_loss": -24.12210464477539, "global_step": 194099, "epoch": 2338} {"train_loss": -24.192440032958984, "global_step": 194100, "epoch": 2338} {"train_loss": -23.715757369995117, "global_step": 194101, "epoch": 2338} {"train_loss": -23.70663070678711, "global_step": 194102, "epoch": 2338} {"train_loss": -23.99078941345215, "global_step": 194103, "epoch": 2338} {"train_loss": -24.198728561401367, "global_step": 194104, "epoch": 2338} {"train_loss": -24.56049919128418, "global_step": 194105, "epoch": 2338} {"train_loss": -24.35744857788086, "global_step": 194106, "epoch": 2338} {"train_loss": -23.893468856811523, "global_step": 194107, "epoch": 2338} {"train_loss": -24.12437629699707, "global_step": 194108, "epoch": 2338} {"train_loss": -24.12827491760254, "global_step": 194109, "epoch": 2338} {"train_loss": -23.941450119018555, "global_step": 194110, "epoch": 2338} {"train_loss": -24.53288459777832, "global_step": 194111, "epoch": 2338} {"train_loss": -24.195499420166016, "global_step": 194112, "epoch": 2338} {"train_loss": -24.309768676757812, "global_step": 194113, "epoch": 2338} {"train_loss": -24.25733184814453, "global_step": 194114, "epoch": 2338} {"train_loss": -24.45612335205078, "global_step": 194115, "epoch": 2338} {"train_loss": -24.250337600708008, "global_step": 194116, "epoch": 2338} {"train_loss": -24.10365104675293, "global_step": 194117, "epoch": 2338} {"train_loss": -24.12953758239746, "global_step": 194118, "epoch": 2338} {"train_loss": -24.24802017211914, "global_step": 194119, "epoch": 2338} {"train_loss": -24.335786819458008, "global_step": 194120, "epoch": 2338} {"train_loss": -24.15180778503418, "global_step": 194121, "epoch": 2338} {"train_loss": -24.256322860717773, "global_step": 194122, "epoch": 2338} {"train_loss": -24.071104049682617, "global_step": 194123, "epoch": 2338} {"train_loss": -24.312557220458984, "global_step": 194124, "epoch": 2338} {"train_loss": -24.094135284423828, "global_step": 194125, "epoch": 2338} {"train_loss": -24.55513572692871, "global_step": 194126, "epoch": 2338} {"train_loss": -24.034543991088867, "global_step": 194127, "epoch": 2338} {"train_loss": -24.422697067260742, "global_step": 194128, "epoch": 2338} {"train_loss": -23.946231842041016, "global_step": 194129, "epoch": 2338} {"train_loss": -24.3488826751709, "global_step": 194130, "epoch": 2338} {"train_loss": -24.303770065307617, "global_step": 194131, "epoch": 2338} {"train_loss": -24.25385856628418, "global_step": 194132, "epoch": 2338} {"train_loss": -23.81723403930664, "global_step": 194133, "epoch": 2338} {"train_loss": -24.185287475585938, "global_step": 194134, "epoch": 2338} {"train_loss": -24.142297744750977, "global_step": 194135, "epoch": 2338} {"train_loss": -24.157682556703865, "global_step": 194136, "epoch": 2338, "val_loss": 6544395.0} {"train_loss": -23.8253116607666, "global_step": 194137, "epoch": 2339} {"train_loss": -24.238887786865234, "global_step": 194138, "epoch": 2339} {"train_loss": -23.5602970123291, "global_step": 194139, "epoch": 2339} {"train_loss": -23.720123291015625, "global_step": 194140, "epoch": 2339} {"train_loss": -24.093730926513672, "global_step": 194141, "epoch": 2339} {"train_loss": -24.218080520629883, "global_step": 194142, "epoch": 2339} {"train_loss": -23.447669982910156, "global_step": 194143, "epoch": 2339} {"train_loss": -23.917905807495117, "global_step": 194144, "epoch": 2339} {"train_loss": -23.79383659362793, "global_step": 194145, "epoch": 2339} {"train_loss": -23.882375717163086, "global_step": 194146, "epoch": 2339} {"train_loss": -23.927377700805664, "global_step": 194147, "epoch": 2339} {"train_loss": -23.730146408081055, "global_step": 194148, "epoch": 2339} {"train_loss": -23.82569694519043, "global_step": 194149, "epoch": 2339} {"train_loss": -23.835357666015625, "global_step": 194150, "epoch": 2339} {"train_loss": -23.539077758789062, "global_step": 194151, "epoch": 2339} {"train_loss": -23.660715103149414, "global_step": 194152, "epoch": 2339} {"train_loss": -24.068925857543945, "global_step": 194153, "epoch": 2339} {"train_loss": -23.886869430541992, "global_step": 194154, "epoch": 2339} {"train_loss": -24.42350196838379, "global_step": 194155, "epoch": 2339} {"train_loss": -23.497066497802734, "global_step": 194156, "epoch": 2339} {"train_loss": -23.930339813232422, "global_step": 194157, "epoch": 2339} {"train_loss": -24.435771942138672, "global_step": 194158, "epoch": 2339} {"train_loss": -24.176816940307617, "global_step": 194159, "epoch": 2339} {"train_loss": -24.062877655029297, "global_step": 194160, "epoch": 2339} {"train_loss": -24.13263702392578, "global_step": 194161, "epoch": 2339} {"train_loss": -24.195022583007812, "global_step": 194162, "epoch": 2339} {"train_loss": -24.21854019165039, "global_step": 194163, "epoch": 2339} {"train_loss": -24.22935676574707, "global_step": 194164, "epoch": 2339} {"train_loss": -24.185413360595703, "global_step": 194165, "epoch": 2339} {"train_loss": -24.134796142578125, "global_step": 194166, "epoch": 2339} {"train_loss": -24.254987716674805, "global_step": 194167, "epoch": 2339} {"train_loss": -24.367128372192383, "global_step": 194168, "epoch": 2339} {"train_loss": -24.387754440307617, "global_step": 194169, "epoch": 2339} {"train_loss": -24.15325355529785, "global_step": 194170, "epoch": 2339} {"train_loss": -23.98810386657715, "global_step": 194171, "epoch": 2339} {"train_loss": -24.03605079650879, "global_step": 194172, "epoch": 2339} {"train_loss": -24.348058700561523, "global_step": 194173, "epoch": 2339} {"train_loss": -24.283010482788086, "global_step": 194174, "epoch": 2339} {"train_loss": -24.028564453125, "global_step": 194175, "epoch": 2339} {"train_loss": -24.068681716918945, "global_step": 194176, "epoch": 2339} {"train_loss": -24.140361785888672, "global_step": 194177, "epoch": 2339} {"train_loss": -24.105255126953125, "global_step": 194178, "epoch": 2339} {"train_loss": -24.198719024658203, "global_step": 194179, "epoch": 2339} {"train_loss": -24.4345645904541, "global_step": 194180, "epoch": 2339} {"train_loss": -24.090436935424805, "global_step": 194181, "epoch": 2339} {"train_loss": -24.412240982055664, "global_step": 194182, "epoch": 2339} {"train_loss": -24.25013542175293, "global_step": 194183, "epoch": 2339} {"train_loss": -24.554433822631836, "global_step": 194184, "epoch": 2339} {"train_loss": -24.1874942779541, "global_step": 194185, "epoch": 2339} {"train_loss": -23.898347854614258, "global_step": 194186, "epoch": 2339} {"train_loss": -24.023487091064453, "global_step": 194187, "epoch": 2339} {"train_loss": -24.156885147094727, "global_step": 194188, "epoch": 2339} {"train_loss": -24.52686309814453, "global_step": 194189, "epoch": 2339} {"train_loss": -24.390417098999023, "global_step": 194190, "epoch": 2339} {"train_loss": -24.04438018798828, "global_step": 194191, "epoch": 2339} {"train_loss": -24.08043670654297, "global_step": 194192, "epoch": 2339} {"train_loss": -24.328895568847656, "global_step": 194193, "epoch": 2339} {"train_loss": -23.98031997680664, "global_step": 194194, "epoch": 2339} {"train_loss": -24.30702781677246, "global_step": 194195, "epoch": 2339} {"train_loss": -23.938119888305664, "global_step": 194196, "epoch": 2339} {"train_loss": -24.183338165283203, "global_step": 194197, "epoch": 2339} {"train_loss": -23.813879013061523, "global_step": 194198, "epoch": 2339} {"train_loss": -23.983295440673828, "global_step": 194199, "epoch": 2339} {"train_loss": -24.19495964050293, "global_step": 194200, "epoch": 2339} {"train_loss": -24.194618225097656, "global_step": 194201, "epoch": 2339} {"train_loss": -23.95501136779785, "global_step": 194202, "epoch": 2339} {"train_loss": -24.12015151977539, "global_step": 194203, "epoch": 2339} {"train_loss": -24.062515258789062, "global_step": 194204, "epoch": 2339} {"train_loss": -24.17283821105957, "global_step": 194205, "epoch": 2339} {"train_loss": -24.26503562927246, "global_step": 194206, "epoch": 2339} {"train_loss": -24.11090660095215, "global_step": 194207, "epoch": 2339} {"train_loss": -24.100528717041016, "global_step": 194208, "epoch": 2339} {"train_loss": -24.288862228393555, "global_step": 194209, "epoch": 2339} {"train_loss": -24.117773056030273, "global_step": 194210, "epoch": 2339} {"train_loss": -24.3377742767334, "global_step": 194211, "epoch": 2339} {"train_loss": -24.15633201599121, "global_step": 194212, "epoch": 2339} {"train_loss": -24.3991641998291, "global_step": 194213, "epoch": 2339} {"train_loss": -24.232633590698242, "global_step": 194214, "epoch": 2339} {"train_loss": -24.355213165283203, "global_step": 194215, "epoch": 2339} {"train_loss": -24.212350845336914, "global_step": 194216, "epoch": 2339} {"train_loss": -24.20722198486328, "global_step": 194217, "epoch": 2339} {"train_loss": -24.168548583984375, "global_step": 194218, "epoch": 2339} {"train_loss": -24.092926737773848, "global_step": 194219, "epoch": 2339, "val_loss": 6396846.5} {"train_loss": -24.07315444946289, "global_step": 194220, "epoch": 2340} {"train_loss": -23.756498336791992, "global_step": 194221, "epoch": 2340} {"train_loss": -23.469526290893555, "global_step": 194222, "epoch": 2340} {"train_loss": -23.597684860229492, "global_step": 194223, "epoch": 2340} {"train_loss": -24.005939483642578, "global_step": 194224, "epoch": 2340} {"train_loss": -24.04104995727539, "global_step": 194225, "epoch": 2340} {"train_loss": -23.755260467529297, "global_step": 194226, "epoch": 2340} {"train_loss": -23.70961570739746, "global_step": 194227, "epoch": 2340} {"train_loss": -24.03106117248535, "global_step": 194228, "epoch": 2340} {"train_loss": -24.014633178710938, "global_step": 194229, "epoch": 2340} {"train_loss": -23.885812759399414, "global_step": 194230, "epoch": 2340} {"train_loss": -24.27515983581543, "global_step": 194231, "epoch": 2340} {"train_loss": -23.958768844604492, "global_step": 194232, "epoch": 2340} {"train_loss": -23.660802841186523, "global_step": 194233, "epoch": 2340} {"train_loss": -23.981861114501953, "global_step": 194234, "epoch": 2340} {"train_loss": -23.76593589782715, "global_step": 194235, "epoch": 2340} {"train_loss": -24.290517807006836, "global_step": 194236, "epoch": 2340} {"train_loss": -23.99004554748535, "global_step": 194237, "epoch": 2340} {"train_loss": -24.265426635742188, "global_step": 194238, "epoch": 2340} {"train_loss": -24.068912506103516, "global_step": 194239, "epoch": 2340} {"train_loss": -24.245576858520508, "global_step": 194240, "epoch": 2340} {"train_loss": -23.94569969177246, "global_step": 194241, "epoch": 2340} {"train_loss": -24.220849990844727, "global_step": 194242, "epoch": 2340} {"train_loss": -23.956823348999023, "global_step": 194243, "epoch": 2340} {"train_loss": -24.094675064086914, "global_step": 194244, "epoch": 2340} {"train_loss": -24.053396224975586, "global_step": 194245, "epoch": 2340} {"train_loss": -23.798370361328125, "global_step": 194246, "epoch": 2340} {"train_loss": -24.244098663330078, "global_step": 194247, "epoch": 2340} {"train_loss": -24.09587860107422, "global_step": 194248, "epoch": 2340} {"train_loss": -24.5119571685791, "global_step": 194249, "epoch": 2340} {"train_loss": -24.321500778198242, "global_step": 194250, "epoch": 2340} {"train_loss": -24.124216079711914, "global_step": 194251, "epoch": 2340} {"train_loss": -23.969955444335938, "global_step": 194252, "epoch": 2340} {"train_loss": -24.106197357177734, "global_step": 194253, "epoch": 2340} {"train_loss": -24.06570816040039, "global_step": 194254, "epoch": 2340} {"train_loss": -24.202043533325195, "global_step": 194255, "epoch": 2340} {"train_loss": -24.164060592651367, "global_step": 194256, "epoch": 2340} {"train_loss": -24.363901138305664, "global_step": 194257, "epoch": 2340} {"train_loss": -23.96455955505371, "global_step": 194258, "epoch": 2340} {"train_loss": -24.35337257385254, "global_step": 194259, "epoch": 2340} {"train_loss": -24.106111526489258, "global_step": 194260, "epoch": 2340} {"train_loss": -24.161376953125, "global_step": 194261, "epoch": 2340} {"train_loss": -23.9620418548584, "global_step": 194262, "epoch": 2340} {"train_loss": -24.335790634155273, "global_step": 194263, "epoch": 2340} {"train_loss": -23.91828727722168, "global_step": 194264, "epoch": 2340} {"train_loss": -24.373525619506836, "global_step": 194265, "epoch": 2340} {"train_loss": -24.266035079956055, "global_step": 194266, "epoch": 2340} {"train_loss": -24.080907821655273, "global_step": 194267, "epoch": 2340} {"train_loss": -24.39862632751465, "global_step": 194268, "epoch": 2340} {"train_loss": -24.53952980041504, "global_step": 194269, "epoch": 2340} {"train_loss": -24.240127563476562, "global_step": 194270, "epoch": 2340} {"train_loss": -24.158920288085938, "global_step": 194271, "epoch": 2340} {"train_loss": -23.961633682250977, "global_step": 194272, "epoch": 2340} {"train_loss": -24.129592895507812, "global_step": 194273, "epoch": 2340} {"train_loss": -23.997638702392578, "global_step": 194274, "epoch": 2340} {"train_loss": -24.13541030883789, "global_step": 194275, "epoch": 2340} {"train_loss": -23.69293975830078, "global_step": 194276, "epoch": 2340} {"train_loss": -24.626483917236328, "global_step": 194277, "epoch": 2340} {"train_loss": -24.432157516479492, "global_step": 194278, "epoch": 2340} {"train_loss": -24.031713485717773, "global_step": 194279, "epoch": 2340} {"train_loss": -23.37795066833496, "global_step": 194280, "epoch": 2340} {"train_loss": -23.713542938232422, "global_step": 194281, "epoch": 2340} {"train_loss": -24.02370262145996, "global_step": 194282, "epoch": 2340} {"train_loss": -24.213041305541992, "global_step": 194283, "epoch": 2340} {"train_loss": -24.022031784057617, "global_step": 194284, "epoch": 2340} {"train_loss": -23.40152931213379, "global_step": 194285, "epoch": 2340} {"train_loss": -23.9532413482666, "global_step": 194286, "epoch": 2340} {"train_loss": -23.843427658081055, "global_step": 194287, "epoch": 2340} {"train_loss": -23.732229232788086, "global_step": 194288, "epoch": 2340} {"train_loss": -24.39666748046875, "global_step": 194289, "epoch": 2340} {"train_loss": -23.639265060424805, "global_step": 194290, "epoch": 2340} {"train_loss": -23.935420989990234, "global_step": 194291, "epoch": 2340} {"train_loss": -23.99241065979004, "global_step": 194292, "epoch": 2340} {"train_loss": -24.048385620117188, "global_step": 194293, "epoch": 2340} {"train_loss": -24.204456329345703, "global_step": 194294, "epoch": 2340} {"train_loss": -23.833282470703125, "global_step": 194295, "epoch": 2340} {"train_loss": -24.183820724487305, "global_step": 194296, "epoch": 2340} {"train_loss": -24.2512264251709, "global_step": 194297, "epoch": 2340} {"train_loss": -24.023330688476562, "global_step": 194298, "epoch": 2340} {"train_loss": -24.43281364440918, "global_step": 194299, "epoch": 2340} {"train_loss": -24.305835723876953, "global_step": 194300, "epoch": 2340} {"train_loss": -24.031505584716797, "global_step": 194301, "epoch": 2340} {"train_loss": -24.050509854971644, "global_step": 194302, "epoch": 2340, "val_loss": 6433684.0} {"train_loss": -23.916074752807617, "global_step": 194303, "epoch": 2341} {"train_loss": -23.798118591308594, "global_step": 194304, "epoch": 2341} {"train_loss": -23.792598724365234, "global_step": 194305, "epoch": 2341} {"train_loss": -23.757450103759766, "global_step": 194306, "epoch": 2341} {"train_loss": -23.69285011291504, "global_step": 194307, "epoch": 2341} {"train_loss": -23.81715202331543, "global_step": 194308, "epoch": 2341} {"train_loss": -23.64841651916504, "global_step": 194309, "epoch": 2341} {"train_loss": -23.683439254760742, "global_step": 194310, "epoch": 2341} {"train_loss": -23.707504272460938, "global_step": 194311, "epoch": 2341} {"train_loss": -24.095556259155273, "global_step": 194312, "epoch": 2341} {"train_loss": -23.48940086364746, "global_step": 194313, "epoch": 2341} {"train_loss": -24.10680389404297, "global_step": 194314, "epoch": 2341} {"train_loss": -23.772541046142578, "global_step": 194315, "epoch": 2341} {"train_loss": -23.830949783325195, "global_step": 194316, "epoch": 2341} {"train_loss": -23.87635040283203, "global_step": 194317, "epoch": 2341} {"train_loss": -24.145544052124023, "global_step": 194318, "epoch": 2341} {"train_loss": -23.941164016723633, "global_step": 194319, "epoch": 2341} {"train_loss": -23.86094093322754, "global_step": 194320, "epoch": 2341} {"train_loss": -24.042743682861328, "global_step": 194321, "epoch": 2341} {"train_loss": -24.045974731445312, "global_step": 194322, "epoch": 2341} {"train_loss": -23.614675521850586, "global_step": 194323, "epoch": 2341} {"train_loss": -24.21170997619629, "global_step": 194324, "epoch": 2341} {"train_loss": -23.97513198852539, "global_step": 194325, "epoch": 2341} {"train_loss": -23.964096069335938, "global_step": 194326, "epoch": 2341} {"train_loss": -23.91713523864746, "global_step": 194327, "epoch": 2341} {"train_loss": -24.18021583557129, "global_step": 194328, "epoch": 2341} {"train_loss": -23.98232650756836, "global_step": 194329, "epoch": 2341} {"train_loss": -24.05953598022461, "global_step": 194330, "epoch": 2341} {"train_loss": -23.96941566467285, "global_step": 194331, "epoch": 2341} {"train_loss": -24.060413360595703, "global_step": 194332, "epoch": 2341} {"train_loss": -24.267393112182617, "global_step": 194333, "epoch": 2341} {"train_loss": -24.267004013061523, "global_step": 194334, "epoch": 2341} {"train_loss": -24.114164352416992, "global_step": 194335, "epoch": 2341} {"train_loss": -24.389392852783203, "global_step": 194336, "epoch": 2341} {"train_loss": -24.431970596313477, "global_step": 194337, "epoch": 2341} {"train_loss": -24.36724853515625, "global_step": 194338, "epoch": 2341} {"train_loss": -24.341588973999023, "global_step": 194339, "epoch": 2341} {"train_loss": -24.38566017150879, "global_step": 194340, "epoch": 2341} {"train_loss": -23.901084899902344, "global_step": 194341, "epoch": 2341} {"train_loss": -24.274738311767578, "global_step": 194342, "epoch": 2341} {"train_loss": -24.050159454345703, "global_step": 194343, "epoch": 2341} {"train_loss": -24.233442306518555, "global_step": 194344, "epoch": 2341} {"train_loss": -24.215116500854492, "global_step": 194345, "epoch": 2341} {"train_loss": -24.109256744384766, "global_step": 194346, "epoch": 2341} {"train_loss": -23.694072723388672, "global_step": 194347, "epoch": 2341} {"train_loss": -24.138751983642578, "global_step": 194348, "epoch": 2341} {"train_loss": -23.811872482299805, "global_step": 194349, "epoch": 2341} {"train_loss": -24.124893188476562, "global_step": 194350, "epoch": 2341} {"train_loss": -24.158519744873047, "global_step": 194351, "epoch": 2341} {"train_loss": -24.46295928955078, "global_step": 194352, "epoch": 2341} {"train_loss": -24.273738861083984, "global_step": 194353, "epoch": 2341} {"train_loss": -24.003925323486328, "global_step": 194354, "epoch": 2341} {"train_loss": -23.941299438476562, "global_step": 194355, "epoch": 2341} {"train_loss": -24.19844627380371, "global_step": 194356, "epoch": 2341} {"train_loss": -24.09620475769043, "global_step": 194357, "epoch": 2341} {"train_loss": -23.971158981323242, "global_step": 194358, "epoch": 2341} {"train_loss": -24.35818862915039, "global_step": 194359, "epoch": 2341} {"train_loss": -24.172992706298828, "global_step": 194360, "epoch": 2341} {"train_loss": -24.149179458618164, "global_step": 194361, "epoch": 2341} {"train_loss": -24.09393310546875, "global_step": 194362, "epoch": 2341} {"train_loss": -24.281755447387695, "global_step": 194363, "epoch": 2341} {"train_loss": -24.02107810974121, "global_step": 194364, "epoch": 2341} {"train_loss": -24.72064208984375, "global_step": 194365, "epoch": 2341} {"train_loss": -23.915870666503906, "global_step": 194366, "epoch": 2341} {"train_loss": -24.334280014038086, "global_step": 194367, "epoch": 2341} {"train_loss": -23.92803955078125, "global_step": 194368, "epoch": 2341} {"train_loss": -24.076129913330078, "global_step": 194369, "epoch": 2341} {"train_loss": -24.108274459838867, "global_step": 194370, "epoch": 2341} {"train_loss": -23.85150718688965, "global_step": 194371, "epoch": 2341} {"train_loss": -24.327890396118164, "global_step": 194372, "epoch": 2341} {"train_loss": -23.900495529174805, "global_step": 194373, "epoch": 2341} {"train_loss": -23.43314552307129, "global_step": 194374, "epoch": 2341} {"train_loss": -24.168739318847656, "global_step": 194375, "epoch": 2341} {"train_loss": -23.751693725585938, "global_step": 194376, "epoch": 2341} {"train_loss": -24.091882705688477, "global_step": 194377, "epoch": 2341} {"train_loss": -24.48258399963379, "global_step": 194378, "epoch": 2341} {"train_loss": -24.150955200195312, "global_step": 194379, "epoch": 2341} {"train_loss": -24.528743743896484, "global_step": 194380, "epoch": 2341} {"train_loss": -24.30544090270996, "global_step": 194381, "epoch": 2341} {"train_loss": -24.199777603149414, "global_step": 194382, "epoch": 2341} {"train_loss": -24.514944076538086, "global_step": 194383, "epoch": 2341} {"train_loss": -24.429615020751953, "global_step": 194384, "epoch": 2341} {"train_loss": -24.079394512865917, "global_step": 194385, "epoch": 2341, "val_loss": 6462692.5} {"train_loss": -23.82185173034668, "global_step": 194386, "epoch": 2342} {"train_loss": -23.902875900268555, "global_step": 194387, "epoch": 2342} {"train_loss": -23.865503311157227, "global_step": 194388, "epoch": 2342} {"train_loss": -23.99141502380371, "global_step": 194389, "epoch": 2342} {"train_loss": -24.449237823486328, "global_step": 194390, "epoch": 2342} {"train_loss": -23.816347122192383, "global_step": 194391, "epoch": 2342} {"train_loss": -23.993337631225586, "global_step": 194392, "epoch": 2342} {"train_loss": -24.132532119750977, "global_step": 194393, "epoch": 2342} {"train_loss": -24.607297897338867, "global_step": 194394, "epoch": 2342} {"train_loss": -23.87002944946289, "global_step": 194395, "epoch": 2342} {"train_loss": -24.149911880493164, "global_step": 194396, "epoch": 2342} {"train_loss": -23.979785919189453, "global_step": 194397, "epoch": 2342} {"train_loss": -24.266225814819336, "global_step": 194398, "epoch": 2342} {"train_loss": -24.277345657348633, "global_step": 194399, "epoch": 2342} {"train_loss": -24.359907150268555, "global_step": 194400, "epoch": 2342} {"train_loss": -24.33280372619629, "global_step": 194401, "epoch": 2342} {"train_loss": -24.605100631713867, "global_step": 194402, "epoch": 2342} {"train_loss": -24.605365753173828, "global_step": 194403, "epoch": 2342} {"train_loss": -24.384977340698242, "global_step": 194404, "epoch": 2342} {"train_loss": -24.231002807617188, "global_step": 194405, "epoch": 2342} {"train_loss": -24.295082092285156, "global_step": 194406, "epoch": 2342} {"train_loss": -24.076156616210938, "global_step": 194407, "epoch": 2342} {"train_loss": -24.35672950744629, "global_step": 194408, "epoch": 2342} {"train_loss": -23.987031936645508, "global_step": 194409, "epoch": 2342} {"train_loss": -24.472867965698242, "global_step": 194410, "epoch": 2342} {"train_loss": -24.24244499206543, "global_step": 194411, "epoch": 2342} {"train_loss": -24.167760848999023, "global_step": 194412, "epoch": 2342} {"train_loss": -23.690420150756836, "global_step": 194413, "epoch": 2342} {"train_loss": -23.965147018432617, "global_step": 194414, "epoch": 2342} {"train_loss": -24.240100860595703, "global_step": 194415, "epoch": 2342} {"train_loss": -24.02845573425293, "global_step": 194416, "epoch": 2342} {"train_loss": -24.147014617919922, "global_step": 194417, "epoch": 2342} {"train_loss": -24.35297966003418, "global_step": 194418, "epoch": 2342} {"train_loss": -23.923978805541992, "global_step": 194419, "epoch": 2342} {"train_loss": -24.213624954223633, "global_step": 194420, "epoch": 2342} {"train_loss": -23.851648330688477, "global_step": 194421, "epoch": 2342} {"train_loss": -23.771989822387695, "global_step": 194422, "epoch": 2342} {"train_loss": -24.610471725463867, "global_step": 194423, "epoch": 2342} {"train_loss": -24.03010368347168, "global_step": 194424, "epoch": 2342} {"train_loss": -24.29859733581543, "global_step": 194425, "epoch": 2342} {"train_loss": -24.44820785522461, "global_step": 194426, "epoch": 2342} {"train_loss": -24.386159896850586, "global_step": 194427, "epoch": 2342} {"train_loss": -23.894515991210938, "global_step": 194428, "epoch": 2342} {"train_loss": -24.452014923095703, "global_step": 194429, "epoch": 2342} {"train_loss": -24.207868576049805, "global_step": 194430, "epoch": 2342} {"train_loss": -24.139856338500977, "global_step": 194431, "epoch": 2342} {"train_loss": -24.380538940429688, "global_step": 194432, "epoch": 2342} {"train_loss": -24.1865291595459, "global_step": 194433, "epoch": 2342} {"train_loss": -24.2355899810791, "global_step": 194434, "epoch": 2342} {"train_loss": -24.293502807617188, "global_step": 194435, "epoch": 2342} {"train_loss": -23.97919273376465, "global_step": 194436, "epoch": 2342} {"train_loss": -24.2584228515625, "global_step": 194437, "epoch": 2342} {"train_loss": -24.26502799987793, "global_step": 194438, "epoch": 2342} {"train_loss": -24.167743682861328, "global_step": 194439, "epoch": 2342} {"train_loss": -23.929357528686523, "global_step": 194440, "epoch": 2342} {"train_loss": -24.473365783691406, "global_step": 194441, "epoch": 2342} {"train_loss": -24.272029876708984, "global_step": 194442, "epoch": 2342} {"train_loss": -24.28192901611328, "global_step": 194443, "epoch": 2342} {"train_loss": -24.103593826293945, "global_step": 194444, "epoch": 2342} {"train_loss": -24.26542854309082, "global_step": 194445, "epoch": 2342} {"train_loss": -24.254566192626953, "global_step": 194446, "epoch": 2342} {"train_loss": -24.26980972290039, "global_step": 194447, "epoch": 2342} {"train_loss": -24.62139320373535, "global_step": 194448, "epoch": 2342} {"train_loss": -24.223600387573242, "global_step": 194449, "epoch": 2342} {"train_loss": -24.428802490234375, "global_step": 194450, "epoch": 2342} {"train_loss": -24.148502349853516, "global_step": 194451, "epoch": 2342} {"train_loss": -24.289587020874023, "global_step": 194452, "epoch": 2342} {"train_loss": -24.448535919189453, "global_step": 194453, "epoch": 2342} {"train_loss": -24.259626388549805, "global_step": 194454, "epoch": 2342} {"train_loss": -24.04066276550293, "global_step": 194455, "epoch": 2342} {"train_loss": -23.947174072265625, "global_step": 194456, "epoch": 2342} {"train_loss": -23.38336753845215, "global_step": 194457, "epoch": 2342} {"train_loss": -24.08317756652832, "global_step": 194458, "epoch": 2342} {"train_loss": -24.230833053588867, "global_step": 194459, "epoch": 2342} {"train_loss": -24.45751953125, "global_step": 194460, "epoch": 2342} {"train_loss": -24.350406646728516, "global_step": 194461, "epoch": 2342} {"train_loss": -24.26103973388672, "global_step": 194462, "epoch": 2342} {"train_loss": -24.011371612548828, "global_step": 194463, "epoch": 2342} {"train_loss": -24.38010597229004, "global_step": 194464, "epoch": 2342} {"train_loss": -24.558940887451172, "global_step": 194465, "epoch": 2342} {"train_loss": -24.107799530029297, "global_step": 194466, "epoch": 2342} {"train_loss": -24.908334732055664, "global_step": 194467, "epoch": 2342} {"train_loss": -24.202280228396496, "global_step": 194468, "epoch": 2342, "val_loss": 6549673.0} {"train_loss": -23.308120727539062, "global_step": 194469, "epoch": 2343} {"train_loss": -23.025060653686523, "global_step": 194470, "epoch": 2343} {"train_loss": -23.937870025634766, "global_step": 194471, "epoch": 2343} {"train_loss": -23.7722110748291, "global_step": 194472, "epoch": 2343} {"train_loss": -23.88002586364746, "global_step": 194473, "epoch": 2343} {"train_loss": -23.806577682495117, "global_step": 194474, "epoch": 2343} {"train_loss": -23.847959518432617, "global_step": 194475, "epoch": 2343} {"train_loss": -23.5255184173584, "global_step": 194476, "epoch": 2343} {"train_loss": -24.120208740234375, "global_step": 194477, "epoch": 2343} {"train_loss": -24.0131778717041, "global_step": 194478, "epoch": 2343} {"train_loss": -23.618640899658203, "global_step": 194479, "epoch": 2343} {"train_loss": -24.098981857299805, "global_step": 194480, "epoch": 2343} {"train_loss": -23.688329696655273, "global_step": 194481, "epoch": 2343} {"train_loss": -23.706708908081055, "global_step": 194482, "epoch": 2343} {"train_loss": -24.111284255981445, "global_step": 194483, "epoch": 2343} {"train_loss": -24.07076072692871, "global_step": 194484, "epoch": 2343} {"train_loss": -23.74688720703125, "global_step": 194485, "epoch": 2343} {"train_loss": -23.618139266967773, "global_step": 194486, "epoch": 2343} {"train_loss": -24.205041885375977, "global_step": 194487, "epoch": 2343} {"train_loss": -23.866676330566406, "global_step": 194488, "epoch": 2343} {"train_loss": -23.735736846923828, "global_step": 194489, "epoch": 2343} {"train_loss": -23.977807998657227, "global_step": 194490, "epoch": 2343} {"train_loss": -23.83272361755371, "global_step": 194491, "epoch": 2343} {"train_loss": -23.993431091308594, "global_step": 194492, "epoch": 2343} {"train_loss": -23.913116455078125, "global_step": 194493, "epoch": 2343} {"train_loss": -24.18524742126465, "global_step": 194494, "epoch": 2343} {"train_loss": -24.2648983001709, "global_step": 194495, "epoch": 2343} {"train_loss": -24.220001220703125, "global_step": 194496, "epoch": 2343} {"train_loss": -24.141191482543945, "global_step": 194497, "epoch": 2343} {"train_loss": -24.239791870117188, "global_step": 194498, "epoch": 2343} {"train_loss": -24.04494285583496, "global_step": 194499, "epoch": 2343} {"train_loss": -23.99806022644043, "global_step": 194500, "epoch": 2343} {"train_loss": -24.06233024597168, "global_step": 194501, "epoch": 2343} {"train_loss": -24.30671501159668, "global_step": 194502, "epoch": 2343} {"train_loss": -23.727157592773438, "global_step": 194503, "epoch": 2343} {"train_loss": -24.102949142456055, "global_step": 194504, "epoch": 2343} {"train_loss": -24.301485061645508, "global_step": 194505, "epoch": 2343} {"train_loss": -24.445356369018555, "global_step": 194506, "epoch": 2343} {"train_loss": -24.452356338500977, "global_step": 194507, "epoch": 2343} {"train_loss": -24.3835506439209, "global_step": 194508, "epoch": 2343} {"train_loss": -24.190519332885742, "global_step": 194509, "epoch": 2343} {"train_loss": -23.85587501525879, "global_step": 194510, "epoch": 2343} {"train_loss": -23.925933837890625, "global_step": 194511, "epoch": 2343} {"train_loss": -24.177553176879883, "global_step": 194512, "epoch": 2343} {"train_loss": -24.264753341674805, "global_step": 194513, "epoch": 2343} {"train_loss": -24.59431266784668, "global_step": 194514, "epoch": 2343} {"train_loss": -24.06261444091797, "global_step": 194515, "epoch": 2343} {"train_loss": -24.0678768157959, "global_step": 194516, "epoch": 2343} {"train_loss": -24.296934127807617, "global_step": 194517, "epoch": 2343} {"train_loss": -24.084400177001953, "global_step": 194518, "epoch": 2343} {"train_loss": -24.139768600463867, "global_step": 194519, "epoch": 2343} {"train_loss": -24.62495231628418, "global_step": 194520, "epoch": 2343} {"train_loss": -24.325546264648438, "global_step": 194521, "epoch": 2343} {"train_loss": -24.326231002807617, "global_step": 194522, "epoch": 2343} {"train_loss": -24.246456146240234, "global_step": 194523, "epoch": 2343} {"train_loss": -24.459138870239258, "global_step": 194524, "epoch": 2343} {"train_loss": -24.2069034576416, "global_step": 194525, "epoch": 2343} {"train_loss": -24.08428955078125, "global_step": 194526, "epoch": 2343} {"train_loss": -24.406564712524414, "global_step": 194527, "epoch": 2343} {"train_loss": -24.350997924804688, "global_step": 194528, "epoch": 2343} {"train_loss": -24.5118408203125, "global_step": 194529, "epoch": 2343} {"train_loss": -24.10788917541504, "global_step": 194530, "epoch": 2343} {"train_loss": -24.432973861694336, "global_step": 194531, "epoch": 2343} {"train_loss": -24.541309356689453, "global_step": 194532, "epoch": 2343} {"train_loss": -24.14203453063965, "global_step": 194533, "epoch": 2343} {"train_loss": -24.520116806030273, "global_step": 194534, "epoch": 2343} {"train_loss": -23.737882614135742, "global_step": 194535, "epoch": 2343} {"train_loss": -24.31037712097168, "global_step": 194536, "epoch": 2343} {"train_loss": -23.96442985534668, "global_step": 194537, "epoch": 2343} {"train_loss": -24.151168823242188, "global_step": 194538, "epoch": 2343} {"train_loss": -24.012388229370117, "global_step": 194539, "epoch": 2343} {"train_loss": -24.120229721069336, "global_step": 194540, "epoch": 2343} {"train_loss": -23.910818099975586, "global_step": 194541, "epoch": 2343} {"train_loss": -24.201271057128906, "global_step": 194542, "epoch": 2343} {"train_loss": -23.92633056640625, "global_step": 194543, "epoch": 2343} {"train_loss": -24.3588924407959, "global_step": 194544, "epoch": 2343} {"train_loss": -23.88385009765625, "global_step": 194545, "epoch": 2343} {"train_loss": -23.73926544189453, "global_step": 194546, "epoch": 2343} {"train_loss": -23.80214500427246, "global_step": 194547, "epoch": 2343} {"train_loss": -23.75114631652832, "global_step": 194548, "epoch": 2343} {"train_loss": -23.970748901367188, "global_step": 194549, "epoch": 2343} {"train_loss": -23.787353515625, "global_step": 194550, "epoch": 2343} {"train_loss": -24.063168996787933, "global_step": 194551, "epoch": 2343, "val_loss": 6491026.5} {"train_loss": -23.56839370727539, "global_step": 194552, "epoch": 2344} {"train_loss": -23.129812240600586, "global_step": 194553, "epoch": 2344} {"train_loss": -23.888519287109375, "global_step": 194554, "epoch": 2344} {"train_loss": -23.590312957763672, "global_step": 194555, "epoch": 2344} {"train_loss": -23.635751724243164, "global_step": 194556, "epoch": 2344} {"train_loss": -24.041549682617188, "global_step": 194557, "epoch": 2344} {"train_loss": -23.758747100830078, "global_step": 194558, "epoch": 2344} {"train_loss": -23.79985237121582, "global_step": 194559, "epoch": 2344} {"train_loss": -23.862836837768555, "global_step": 194560, "epoch": 2344} {"train_loss": -23.755605697631836, "global_step": 194561, "epoch": 2344} {"train_loss": -23.696300506591797, "global_step": 194562, "epoch": 2344} {"train_loss": -23.866779327392578, "global_step": 194563, "epoch": 2344} {"train_loss": -23.870559692382812, "global_step": 194564, "epoch": 2344} {"train_loss": -23.916746139526367, "global_step": 194565, "epoch": 2344} {"train_loss": -24.1269588470459, "global_step": 194566, "epoch": 2344} {"train_loss": -24.354761123657227, "global_step": 194567, "epoch": 2344} {"train_loss": -23.92460060119629, "global_step": 194568, "epoch": 2344} {"train_loss": -24.131067276000977, "global_step": 194569, "epoch": 2344} {"train_loss": -24.14141845703125, "global_step": 194570, "epoch": 2344} {"train_loss": -24.28569793701172, "global_step": 194571, "epoch": 2344} {"train_loss": -24.215839385986328, "global_step": 194572, "epoch": 2344} {"train_loss": -24.30767822265625, "global_step": 194573, "epoch": 2344} {"train_loss": -24.14551544189453, "global_step": 194574, "epoch": 2344} {"train_loss": -24.136518478393555, "global_step": 194575, "epoch": 2344} {"train_loss": -24.53230857849121, "global_step": 194576, "epoch": 2344} {"train_loss": -24.392446517944336, "global_step": 194577, "epoch": 2344} {"train_loss": -24.16022491455078, "global_step": 194578, "epoch": 2344} {"train_loss": -24.369617462158203, "global_step": 194579, "epoch": 2344} {"train_loss": -24.056081771850586, "global_step": 194580, "epoch": 2344} {"train_loss": -24.409143447875977, "global_step": 194581, "epoch": 2344} {"train_loss": -24.13123893737793, "global_step": 194582, "epoch": 2344} {"train_loss": -24.30598258972168, "global_step": 194583, "epoch": 2344} {"train_loss": -24.650510787963867, "global_step": 194584, "epoch": 2344} {"train_loss": -24.77692985534668, "global_step": 194585, "epoch": 2344} {"train_loss": -24.243661880493164, "global_step": 194586, "epoch": 2344} {"train_loss": -24.11188507080078, "global_step": 194587, "epoch": 2344} {"train_loss": -24.374170303344727, "global_step": 194588, "epoch": 2344} {"train_loss": -24.3676815032959, "global_step": 194589, "epoch": 2344} {"train_loss": -24.71865463256836, "global_step": 194590, "epoch": 2344} {"train_loss": -24.635271072387695, "global_step": 194591, "epoch": 2344} {"train_loss": -24.002906799316406, "global_step": 194592, "epoch": 2344} {"train_loss": -24.011764526367188, "global_step": 194593, "epoch": 2344} {"train_loss": -23.91641616821289, "global_step": 194594, "epoch": 2344} {"train_loss": -24.492300033569336, "global_step": 194595, "epoch": 2344} {"train_loss": -23.969552993774414, "global_step": 194596, "epoch": 2344} {"train_loss": -24.43199348449707, "global_step": 194597, "epoch": 2344} {"train_loss": -24.10856819152832, "global_step": 194598, "epoch": 2344} {"train_loss": -24.23976707458496, "global_step": 194599, "epoch": 2344} {"train_loss": -24.338254928588867, "global_step": 194600, "epoch": 2344} {"train_loss": -24.07894515991211, "global_step": 194601, "epoch": 2344} {"train_loss": -24.461856842041016, "global_step": 194602, "epoch": 2344} {"train_loss": -24.273263931274414, "global_step": 194603, "epoch": 2344} {"train_loss": -23.49796485900879, "global_step": 194604, "epoch": 2344} {"train_loss": -24.32349967956543, "global_step": 194605, "epoch": 2344} {"train_loss": -24.111494064331055, "global_step": 194606, "epoch": 2344} {"train_loss": -24.256139755249023, "global_step": 194607, "epoch": 2344} {"train_loss": -24.203794479370117, "global_step": 194608, "epoch": 2344} {"train_loss": -24.064538955688477, "global_step": 194609, "epoch": 2344} {"train_loss": -24.018672943115234, "global_step": 194610, "epoch": 2344} {"train_loss": -24.468048095703125, "global_step": 194611, "epoch": 2344} {"train_loss": -23.86736488342285, "global_step": 194612, "epoch": 2344} {"train_loss": -24.005813598632812, "global_step": 194613, "epoch": 2344} {"train_loss": -24.08367347717285, "global_step": 194614, "epoch": 2344} {"train_loss": -24.019798278808594, "global_step": 194615, "epoch": 2344} {"train_loss": -24.093172073364258, "global_step": 194616, "epoch": 2344} {"train_loss": -24.701961517333984, "global_step": 194617, "epoch": 2344} {"train_loss": -24.3657169342041, "global_step": 194618, "epoch": 2344} {"train_loss": -24.24934959411621, "global_step": 194619, "epoch": 2344} {"train_loss": -24.300207138061523, "global_step": 194620, "epoch": 2344} {"train_loss": -24.265409469604492, "global_step": 194621, "epoch": 2344} {"train_loss": -24.068288803100586, "global_step": 194622, "epoch": 2344} {"train_loss": -24.147300720214844, "global_step": 194623, "epoch": 2344} {"train_loss": -24.080190658569336, "global_step": 194624, "epoch": 2344} {"train_loss": -24.229249954223633, "global_step": 194625, "epoch": 2344} {"train_loss": -24.2940731048584, "global_step": 194626, "epoch": 2344} {"train_loss": -24.165170669555664, "global_step": 194627, "epoch": 2344} {"train_loss": -24.226551055908203, "global_step": 194628, "epoch": 2344} {"train_loss": -24.134092330932617, "global_step": 194629, "epoch": 2344} {"train_loss": -23.87728500366211, "global_step": 194630, "epoch": 2344} {"train_loss": -24.062837600708008, "global_step": 194631, "epoch": 2344} {"train_loss": -23.802396774291992, "global_step": 194632, "epoch": 2344} {"train_loss": -24.357498168945312, "global_step": 194633, "epoch": 2344} {"train_loss": -24.12751423019961, "global_step": 194634, "epoch": 2344, "val_loss": 6469529.0} {"train_loss": -23.12564468383789, "global_step": 194635, "epoch": 2345} {"train_loss": -23.25958824157715, "global_step": 194636, "epoch": 2345} {"train_loss": -22.909643173217773, "global_step": 194637, "epoch": 2345} {"train_loss": -23.754331588745117, "global_step": 194638, "epoch": 2345} {"train_loss": -24.01527976989746, "global_step": 194639, "epoch": 2345} {"train_loss": -23.65713882446289, "global_step": 194640, "epoch": 2345} {"train_loss": -23.2000675201416, "global_step": 194641, "epoch": 2345} {"train_loss": -23.857465744018555, "global_step": 194642, "epoch": 2345} {"train_loss": -23.519933700561523, "global_step": 194643, "epoch": 2345} {"train_loss": -23.40993309020996, "global_step": 194644, "epoch": 2345} {"train_loss": -23.723600387573242, "global_step": 194645, "epoch": 2345} {"train_loss": -23.36104393005371, "global_step": 194646, "epoch": 2345} {"train_loss": -24.05887222290039, "global_step": 194647, "epoch": 2345} {"train_loss": -24.003864288330078, "global_step": 194648, "epoch": 2345} {"train_loss": -23.923139572143555, "global_step": 194649, "epoch": 2345} {"train_loss": -23.806631088256836, "global_step": 194650, "epoch": 2345} {"train_loss": -24.047475814819336, "global_step": 194651, "epoch": 2345} {"train_loss": -23.8487548828125, "global_step": 194652, "epoch": 2345} {"train_loss": -23.97714614868164, "global_step": 194653, "epoch": 2345} {"train_loss": -23.835296630859375, "global_step": 194654, "epoch": 2345} {"train_loss": -24.2585391998291, "global_step": 194655, "epoch": 2345} {"train_loss": -24.192581176757812, "global_step": 194656, "epoch": 2345} {"train_loss": -24.211688995361328, "global_step": 194657, "epoch": 2345} {"train_loss": -24.10795021057129, "global_step": 194658, "epoch": 2345} {"train_loss": -23.98679542541504, "global_step": 194659, "epoch": 2345} {"train_loss": -24.260112762451172, "global_step": 194660, "epoch": 2345} {"train_loss": -23.988712310791016, "global_step": 194661, "epoch": 2345} {"train_loss": -23.81044578552246, "global_step": 194662, "epoch": 2345} {"train_loss": -24.02012825012207, "global_step": 194663, "epoch": 2345} {"train_loss": -24.13641929626465, "global_step": 194664, "epoch": 2345} {"train_loss": -24.06814956665039, "global_step": 194665, "epoch": 2345} {"train_loss": -24.134540557861328, "global_step": 194666, "epoch": 2345} {"train_loss": -24.596012115478516, "global_step": 194667, "epoch": 2345} {"train_loss": -23.91834831237793, "global_step": 194668, "epoch": 2345} {"train_loss": -24.10062026977539, "global_step": 194669, "epoch": 2345} {"train_loss": -24.02789306640625, "global_step": 194670, "epoch": 2345} {"train_loss": -24.433979034423828, "global_step": 194671, "epoch": 2345} {"train_loss": -24.238481521606445, "global_step": 194672, "epoch": 2345} {"train_loss": -24.53087043762207, "global_step": 194673, "epoch": 2345} {"train_loss": -24.607696533203125, "global_step": 194674, "epoch": 2345} {"train_loss": -24.22758674621582, "global_step": 194675, "epoch": 2345} {"train_loss": -24.537891387939453, "global_step": 194676, "epoch": 2345} {"train_loss": -24.269895553588867, "global_step": 194677, "epoch": 2345} {"train_loss": -24.10707664489746, "global_step": 194678, "epoch": 2345} {"train_loss": -23.880615234375, "global_step": 194679, "epoch": 2345} {"train_loss": -24.423969268798828, "global_step": 194680, "epoch": 2345} {"train_loss": -23.853574752807617, "global_step": 194681, "epoch": 2345} {"train_loss": -24.007596969604492, "global_step": 194682, "epoch": 2345} {"train_loss": -23.910999298095703, "global_step": 194683, "epoch": 2345} {"train_loss": -24.33103370666504, "global_step": 194684, "epoch": 2345} {"train_loss": -24.298494338989258, "global_step": 194685, "epoch": 2345} {"train_loss": -24.48027992248535, "global_step": 194686, "epoch": 2345} {"train_loss": -24.137676239013672, "global_step": 194687, "epoch": 2345} {"train_loss": -24.289752960205078, "global_step": 194688, "epoch": 2345} {"train_loss": -24.079233169555664, "global_step": 194689, "epoch": 2345} {"train_loss": -24.245561599731445, "global_step": 194690, "epoch": 2345} {"train_loss": -24.472442626953125, "global_step": 194691, "epoch": 2345} {"train_loss": -24.36903953552246, "global_step": 194692, "epoch": 2345} {"train_loss": -24.065580368041992, "global_step": 194693, "epoch": 2345} {"train_loss": -24.219005584716797, "global_step": 194694, "epoch": 2345} {"train_loss": -23.880308151245117, "global_step": 194695, "epoch": 2345} {"train_loss": -24.451589584350586, "global_step": 194696, "epoch": 2345} {"train_loss": -23.889856338500977, "global_step": 194697, "epoch": 2345} {"train_loss": -24.201215744018555, "global_step": 194698, "epoch": 2345} {"train_loss": -24.1954345703125, "global_step": 194699, "epoch": 2345} {"train_loss": -24.274877548217773, "global_step": 194700, "epoch": 2345} {"train_loss": -24.522939682006836, "global_step": 194701, "epoch": 2345} {"train_loss": -24.24625015258789, "global_step": 194702, "epoch": 2345} {"train_loss": -24.228666305541992, "global_step": 194703, "epoch": 2345} {"train_loss": -24.268878936767578, "global_step": 194704, "epoch": 2345} {"train_loss": -24.10969352722168, "global_step": 194705, "epoch": 2345} {"train_loss": -24.389678955078125, "global_step": 194706, "epoch": 2345} {"train_loss": -24.363683700561523, "global_step": 194707, "epoch": 2345} {"train_loss": -24.595718383789062, "global_step": 194708, "epoch": 2345} {"train_loss": -23.856555938720703, "global_step": 194709, "epoch": 2345} {"train_loss": -24.072710037231445, "global_step": 194710, "epoch": 2345} {"train_loss": -24.140357971191406, "global_step": 194711, "epoch": 2345} {"train_loss": -23.957088470458984, "global_step": 194712, "epoch": 2345} {"train_loss": -24.02735137939453, "global_step": 194713, "epoch": 2345} {"train_loss": -24.081809997558594, "global_step": 194714, "epoch": 2345} {"train_loss": -24.097869873046875, "global_step": 194715, "epoch": 2345} {"train_loss": -24.3414249420166, "global_step": 194716, "epoch": 2345} {"train_loss": -24.050743401768695, "global_step": 194717, "epoch": 2345, "val_loss": 6665331.0} {"train_loss": -23.535810470581055, "global_step": 194718, "epoch": 2346} {"train_loss": -23.480928421020508, "global_step": 194719, "epoch": 2346} {"train_loss": -23.376188278198242, "global_step": 194720, "epoch": 2346} {"train_loss": -23.710397720336914, "global_step": 194721, "epoch": 2346} {"train_loss": -23.679311752319336, "global_step": 194722, "epoch": 2346} {"train_loss": -23.583471298217773, "global_step": 194723, "epoch": 2346} {"train_loss": -23.789630889892578, "global_step": 194724, "epoch": 2346} {"train_loss": -23.826921463012695, "global_step": 194725, "epoch": 2346} {"train_loss": -23.66956329345703, "global_step": 194726, "epoch": 2346} {"train_loss": -24.09511375427246, "global_step": 194727, "epoch": 2346} {"train_loss": -24.151880264282227, "global_step": 194728, "epoch": 2346} {"train_loss": -23.69342803955078, "global_step": 194729, "epoch": 2346} {"train_loss": -23.595203399658203, "global_step": 194730, "epoch": 2346} {"train_loss": -23.426189422607422, "global_step": 194731, "epoch": 2346} {"train_loss": -23.89809226989746, "global_step": 194732, "epoch": 2346} {"train_loss": -24.022571563720703, "global_step": 194733, "epoch": 2346} {"train_loss": -23.95609474182129, "global_step": 194734, "epoch": 2346} {"train_loss": -23.803367614746094, "global_step": 194735, "epoch": 2346} {"train_loss": -24.039716720581055, "global_step": 194736, "epoch": 2346} {"train_loss": -24.041994094848633, "global_step": 194737, "epoch": 2346} {"train_loss": -23.927282333374023, "global_step": 194738, "epoch": 2346} {"train_loss": -24.25368309020996, "global_step": 194739, "epoch": 2346} {"train_loss": -24.184873580932617, "global_step": 194740, "epoch": 2346} {"train_loss": -23.90910530090332, "global_step": 194741, "epoch": 2346} {"train_loss": -24.101911544799805, "global_step": 194742, "epoch": 2346} {"train_loss": -23.96637535095215, "global_step": 194743, "epoch": 2346} {"train_loss": -24.103614807128906, "global_step": 194744, "epoch": 2346} {"train_loss": -24.387269973754883, "global_step": 194745, "epoch": 2346} {"train_loss": -23.996702194213867, "global_step": 194746, "epoch": 2346} {"train_loss": -24.063730239868164, "global_step": 194747, "epoch": 2346} {"train_loss": -24.210336685180664, "global_step": 194748, "epoch": 2346} {"train_loss": -23.80364990234375, "global_step": 194749, "epoch": 2346} {"train_loss": -24.282987594604492, "global_step": 194750, "epoch": 2346} {"train_loss": -24.044849395751953, "global_step": 194751, "epoch": 2346} {"train_loss": -23.81609344482422, "global_step": 194752, "epoch": 2346} {"train_loss": -24.542898178100586, "global_step": 194753, "epoch": 2346} {"train_loss": -24.28478240966797, "global_step": 194754, "epoch": 2346} {"train_loss": -23.959157943725586, "global_step": 194755, "epoch": 2346} {"train_loss": -24.152183532714844, "global_step": 194756, "epoch": 2346} {"train_loss": -24.15737533569336, "global_step": 194757, "epoch": 2346} {"train_loss": -24.16874122619629, "global_step": 194758, "epoch": 2346} {"train_loss": -23.9309139251709, "global_step": 194759, "epoch": 2346} {"train_loss": -24.27834129333496, "global_step": 194760, "epoch": 2346} {"train_loss": -24.127408981323242, "global_step": 194761, "epoch": 2346} {"train_loss": -24.463083267211914, "global_step": 194762, "epoch": 2346} {"train_loss": -23.890872955322266, "global_step": 194763, "epoch": 2346} {"train_loss": -24.127960205078125, "global_step": 194764, "epoch": 2346} {"train_loss": -24.201383590698242, "global_step": 194765, "epoch": 2346} {"train_loss": -24.517248153686523, "global_step": 194766, "epoch": 2346} {"train_loss": -24.065366744995117, "global_step": 194767, "epoch": 2346} {"train_loss": -24.24120330810547, "global_step": 194768, "epoch": 2346} {"train_loss": -24.118268966674805, "global_step": 194769, "epoch": 2346} {"train_loss": -24.203420639038086, "global_step": 194770, "epoch": 2346} {"train_loss": -24.29573631286621, "global_step": 194771, "epoch": 2346} {"train_loss": -24.22397804260254, "global_step": 194772, "epoch": 2346} {"train_loss": -24.246536254882812, "global_step": 194773, "epoch": 2346} {"train_loss": -23.977170944213867, "global_step": 194774, "epoch": 2346} {"train_loss": -24.087589263916016, "global_step": 194775, "epoch": 2346} {"train_loss": -24.174436569213867, "global_step": 194776, "epoch": 2346} {"train_loss": -24.461688995361328, "global_step": 194777, "epoch": 2346} {"train_loss": -24.12682342529297, "global_step": 194778, "epoch": 2346} {"train_loss": -24.281843185424805, "global_step": 194779, "epoch": 2346} {"train_loss": -24.002750396728516, "global_step": 194780, "epoch": 2346} {"train_loss": -24.74517822265625, "global_step": 194781, "epoch": 2346} {"train_loss": -24.318479537963867, "global_step": 194782, "epoch": 2346} {"train_loss": -24.400243759155273, "global_step": 194783, "epoch": 2346} {"train_loss": -24.446962356567383, "global_step": 194784, "epoch": 2346} {"train_loss": -24.368886947631836, "global_step": 194785, "epoch": 2346} {"train_loss": -24.109968185424805, "global_step": 194786, "epoch": 2346} {"train_loss": -24.003692626953125, "global_step": 194787, "epoch": 2346} {"train_loss": -24.496652603149414, "global_step": 194788, "epoch": 2346} {"train_loss": -24.40449333190918, "global_step": 194789, "epoch": 2346} {"train_loss": -24.43345069885254, "global_step": 194790, "epoch": 2346} {"train_loss": -24.076419830322266, "global_step": 194791, "epoch": 2346} {"train_loss": -23.508596420288086, "global_step": 194792, "epoch": 2346} {"train_loss": -24.011974334716797, "global_step": 194793, "epoch": 2346} {"train_loss": -23.663490295410156, "global_step": 194794, "epoch": 2346} {"train_loss": -24.209991455078125, "global_step": 194795, "epoch": 2346} {"train_loss": -23.69797706604004, "global_step": 194796, "epoch": 2346} {"train_loss": -23.55401039123535, "global_step": 194797, "epoch": 2346} {"train_loss": -24.3512020111084, "global_step": 194798, "epoch": 2346} {"train_loss": -24.019933700561523, "global_step": 194799, "epoch": 2346} {"train_loss": -24.051892108227833, "global_step": 194800, "epoch": 2346, "val_loss": 6610127.0} {"train_loss": -23.995779037475586, "global_step": 194801, "epoch": 2347} {"train_loss": -23.68051528930664, "global_step": 194802, "epoch": 2347} {"train_loss": -23.86237907409668, "global_step": 194803, "epoch": 2347} {"train_loss": -24.237680435180664, "global_step": 194804, "epoch": 2347} {"train_loss": -23.874038696289062, "global_step": 194805, "epoch": 2347} {"train_loss": -23.446081161499023, "global_step": 194806, "epoch": 2347} {"train_loss": -23.73065757751465, "global_step": 194807, "epoch": 2347} {"train_loss": -23.884113311767578, "global_step": 194808, "epoch": 2347} {"train_loss": -23.845428466796875, "global_step": 194809, "epoch": 2347} {"train_loss": -24.13947105407715, "global_step": 194810, "epoch": 2347} {"train_loss": -23.7923583984375, "global_step": 194811, "epoch": 2347} {"train_loss": -24.079294204711914, "global_step": 194812, "epoch": 2347} {"train_loss": -24.283193588256836, "global_step": 194813, "epoch": 2347} {"train_loss": -24.195829391479492, "global_step": 194814, "epoch": 2347} {"train_loss": -24.089237213134766, "global_step": 194815, "epoch": 2347} {"train_loss": -24.24738311767578, "global_step": 194816, "epoch": 2347} {"train_loss": -24.208829879760742, "global_step": 194817, "epoch": 2347} {"train_loss": -24.1521053314209, "global_step": 194818, "epoch": 2347} {"train_loss": -24.174854278564453, "global_step": 194819, "epoch": 2347} {"train_loss": -24.47151756286621, "global_step": 194820, "epoch": 2347} {"train_loss": -24.460376739501953, "global_step": 194821, "epoch": 2347} {"train_loss": -24.270187377929688, "global_step": 194822, "epoch": 2347} {"train_loss": -24.150455474853516, "global_step": 194823, "epoch": 2347} {"train_loss": -23.864316940307617, "global_step": 194824, "epoch": 2347} {"train_loss": -24.19681739807129, "global_step": 194825, "epoch": 2347} {"train_loss": -24.054697036743164, "global_step": 194826, "epoch": 2347} {"train_loss": -24.336027145385742, "global_step": 194827, "epoch": 2347} {"train_loss": -24.066190719604492, "global_step": 194828, "epoch": 2347} {"train_loss": -24.190778732299805, "global_step": 194829, "epoch": 2347} {"train_loss": -24.456363677978516, "global_step": 194830, "epoch": 2347} {"train_loss": -24.567707061767578, "global_step": 194831, "epoch": 2347} {"train_loss": -24.504545211791992, "global_step": 194832, "epoch": 2347} {"train_loss": -24.24080467224121, "global_step": 194833, "epoch": 2347} {"train_loss": -24.520877838134766, "global_step": 194834, "epoch": 2347} {"train_loss": -24.27956199645996, "global_step": 194835, "epoch": 2347} {"train_loss": -24.041961669921875, "global_step": 194836, "epoch": 2347} {"train_loss": -24.1820125579834, "global_step": 194837, "epoch": 2347} {"train_loss": -24.18235206604004, "global_step": 194838, "epoch": 2347} {"train_loss": -24.466222763061523, "global_step": 194839, "epoch": 2347} {"train_loss": -24.438888549804688, "global_step": 194840, "epoch": 2347} {"train_loss": -24.499805450439453, "global_step": 194841, "epoch": 2347} {"train_loss": -24.044668197631836, "global_step": 194842, "epoch": 2347} {"train_loss": -24.297584533691406, "global_step": 194843, "epoch": 2347} {"train_loss": -24.30609703063965, "global_step": 194844, "epoch": 2347} {"train_loss": -23.896060943603516, "global_step": 194845, "epoch": 2347} {"train_loss": -23.25689697265625, "global_step": 194846, "epoch": 2347} {"train_loss": -23.28863525390625, "global_step": 194847, "epoch": 2347} {"train_loss": -23.78248405456543, "global_step": 194848, "epoch": 2347} {"train_loss": -24.3551082611084, "global_step": 194849, "epoch": 2347} {"train_loss": -24.169919967651367, "global_step": 194850, "epoch": 2347} {"train_loss": -23.356237411499023, "global_step": 194851, "epoch": 2347} {"train_loss": -23.8991756439209, "global_step": 194852, "epoch": 2347} {"train_loss": -24.103967666625977, "global_step": 194853, "epoch": 2347} {"train_loss": -23.994430541992188, "global_step": 194854, "epoch": 2347} {"train_loss": -24.228605270385742, "global_step": 194855, "epoch": 2347} {"train_loss": -24.11092185974121, "global_step": 194856, "epoch": 2347} {"train_loss": -23.963735580444336, "global_step": 194857, "epoch": 2347} {"train_loss": -24.069917678833008, "global_step": 194858, "epoch": 2347} {"train_loss": -23.901386260986328, "global_step": 194859, "epoch": 2347} {"train_loss": -24.049732208251953, "global_step": 194860, "epoch": 2347} {"train_loss": -24.06928253173828, "global_step": 194861, "epoch": 2347} {"train_loss": -23.856094360351562, "global_step": 194862, "epoch": 2347} {"train_loss": -24.135334014892578, "global_step": 194863, "epoch": 2347} {"train_loss": -24.073715209960938, "global_step": 194864, "epoch": 2347} {"train_loss": -24.283544540405273, "global_step": 194865, "epoch": 2347} {"train_loss": -23.7420597076416, "global_step": 194866, "epoch": 2347} {"train_loss": -24.349523544311523, "global_step": 194867, "epoch": 2347} {"train_loss": -24.462345123291016, "global_step": 194868, "epoch": 2347} {"train_loss": -24.00618553161621, "global_step": 194869, "epoch": 2347} {"train_loss": -24.713651657104492, "global_step": 194870, "epoch": 2347} {"train_loss": -24.09588050842285, "global_step": 194871, "epoch": 2347} {"train_loss": -24.496761322021484, "global_step": 194872, "epoch": 2347} {"train_loss": -24.02930450439453, "global_step": 194873, "epoch": 2347} {"train_loss": -24.378110885620117, "global_step": 194874, "epoch": 2347} {"train_loss": -23.979246139526367, "global_step": 194875, "epoch": 2347} {"train_loss": -23.896509170532227, "global_step": 194876, "epoch": 2347} {"train_loss": -24.356786727905273, "global_step": 194877, "epoch": 2347} {"train_loss": -24.222341537475586, "global_step": 194878, "epoch": 2347} {"train_loss": -24.256336212158203, "global_step": 194879, "epoch": 2347} {"train_loss": -24.12153434753418, "global_step": 194880, "epoch": 2347} {"train_loss": -24.236642837524414, "global_step": 194881, "epoch": 2347} {"train_loss": -24.482379913330078, "global_step": 194882, "epoch": 2347} {"train_loss": -24.12804270365152, "global_step": 194883, "epoch": 2347, "val_loss": 6534655.0} {"train_loss": -24.3316650390625, "global_step": 194884, "epoch": 2348} {"train_loss": -23.670324325561523, "global_step": 194885, "epoch": 2348} {"train_loss": -23.15049171447754, "global_step": 194886, "epoch": 2348} {"train_loss": -23.570234298706055, "global_step": 194887, "epoch": 2348} {"train_loss": -24.087003707885742, "global_step": 194888, "epoch": 2348} {"train_loss": -23.60165786743164, "global_step": 194889, "epoch": 2348} {"train_loss": -23.259597778320312, "global_step": 194890, "epoch": 2348} {"train_loss": -22.223716735839844, "global_step": 194891, "epoch": 2348} {"train_loss": -22.867734909057617, "global_step": 194892, "epoch": 2348} {"train_loss": -23.149457931518555, "global_step": 194893, "epoch": 2348} {"train_loss": -23.64600944519043, "global_step": 194894, "epoch": 2348} {"train_loss": -23.300846099853516, "global_step": 194895, "epoch": 2348} {"train_loss": -23.7686824798584, "global_step": 194896, "epoch": 2348} {"train_loss": -23.764963150024414, "global_step": 194897, "epoch": 2348} {"train_loss": -23.674768447875977, "global_step": 194898, "epoch": 2348} {"train_loss": -23.154104232788086, "global_step": 194899, "epoch": 2348} {"train_loss": -23.293668746948242, "global_step": 194900, "epoch": 2348} {"train_loss": -23.740293502807617, "global_step": 194901, "epoch": 2348} {"train_loss": -23.84346580505371, "global_step": 194902, "epoch": 2348} {"train_loss": -23.84065818786621, "global_step": 194903, "epoch": 2348} {"train_loss": -23.93151092529297, "global_step": 194904, "epoch": 2348} {"train_loss": -23.520498275756836, "global_step": 194905, "epoch": 2348} {"train_loss": -23.97848892211914, "global_step": 194906, "epoch": 2348} {"train_loss": -23.760772705078125, "global_step": 194907, "epoch": 2348} {"train_loss": -23.888103485107422, "global_step": 194908, "epoch": 2348} {"train_loss": -23.880075454711914, "global_step": 194909, "epoch": 2348} {"train_loss": -23.939250946044922, "global_step": 194910, "epoch": 2348} {"train_loss": -23.979787826538086, "global_step": 194911, "epoch": 2348} {"train_loss": -24.27467155456543, "global_step": 194912, "epoch": 2348} {"train_loss": -24.18330192565918, "global_step": 194913, "epoch": 2348} {"train_loss": -23.950361251831055, "global_step": 194914, "epoch": 2348} {"train_loss": -24.128738403320312, "global_step": 194915, "epoch": 2348} {"train_loss": -24.210586547851562, "global_step": 194916, "epoch": 2348} {"train_loss": -24.20977210998535, "global_step": 194917, "epoch": 2348} {"train_loss": -24.597625732421875, "global_step": 194918, "epoch": 2348} {"train_loss": -24.48115348815918, "global_step": 194919, "epoch": 2348} {"train_loss": -24.174419403076172, "global_step": 194920, "epoch": 2348} {"train_loss": -24.35820960998535, "global_step": 194921, "epoch": 2348} {"train_loss": -23.852262496948242, "global_step": 194922, "epoch": 2348} {"train_loss": -24.13776206970215, "global_step": 194923, "epoch": 2348} {"train_loss": -24.169694900512695, "global_step": 194924, "epoch": 2348} {"train_loss": -24.189340591430664, "global_step": 194925, "epoch": 2348} {"train_loss": -24.158706665039062, "global_step": 194926, "epoch": 2348} {"train_loss": -24.07210350036621, "global_step": 194927, "epoch": 2348} {"train_loss": -24.2891845703125, "global_step": 194928, "epoch": 2348} {"train_loss": -24.27191734313965, "global_step": 194929, "epoch": 2348} {"train_loss": -24.33974266052246, "global_step": 194930, "epoch": 2348} {"train_loss": -24.232017517089844, "global_step": 194931, "epoch": 2348} {"train_loss": -24.21745491027832, "global_step": 194932, "epoch": 2348} {"train_loss": -24.448270797729492, "global_step": 194933, "epoch": 2348} {"train_loss": -24.181888580322266, "global_step": 194934, "epoch": 2348} {"train_loss": -24.479324340820312, "global_step": 194935, "epoch": 2348} {"train_loss": -24.161596298217773, "global_step": 194936, "epoch": 2348} {"train_loss": -24.85948944091797, "global_step": 194937, "epoch": 2348} {"train_loss": -24.171436309814453, "global_step": 194938, "epoch": 2348} {"train_loss": -24.34033203125, "global_step": 194939, "epoch": 2348} {"train_loss": -24.42815399169922, "global_step": 194940, "epoch": 2348} {"train_loss": -24.260351181030273, "global_step": 194941, "epoch": 2348} {"train_loss": -24.28517723083496, "global_step": 194942, "epoch": 2348} {"train_loss": -24.395357131958008, "global_step": 194943, "epoch": 2348} {"train_loss": -24.340566635131836, "global_step": 194944, "epoch": 2348} {"train_loss": -24.104589462280273, "global_step": 194945, "epoch": 2348} {"train_loss": -24.41774559020996, "global_step": 194946, "epoch": 2348} {"train_loss": -24.151796340942383, "global_step": 194947, "epoch": 2348} {"train_loss": -24.3582763671875, "global_step": 194948, "epoch": 2348} {"train_loss": -24.155569076538086, "global_step": 194949, "epoch": 2348} {"train_loss": -24.419921875, "global_step": 194950, "epoch": 2348} {"train_loss": -24.218708038330078, "global_step": 194951, "epoch": 2348} {"train_loss": -24.382980346679688, "global_step": 194952, "epoch": 2348} {"train_loss": -24.254486083984375, "global_step": 194953, "epoch": 2348} {"train_loss": -24.086050033569336, "global_step": 194954, "epoch": 2348} {"train_loss": -23.66344451904297, "global_step": 194955, "epoch": 2348} {"train_loss": -23.768295288085938, "global_step": 194956, "epoch": 2348} {"train_loss": -23.83340835571289, "global_step": 194957, "epoch": 2348} {"train_loss": -24.074127197265625, "global_step": 194958, "epoch": 2348} {"train_loss": -23.92450523376465, "global_step": 194959, "epoch": 2348} {"train_loss": -23.9202938079834, "global_step": 194960, "epoch": 2348} {"train_loss": -23.599504470825195, "global_step": 194961, "epoch": 2348} {"train_loss": -23.593730926513672, "global_step": 194962, "epoch": 2348} {"train_loss": -24.333724975585938, "global_step": 194963, "epoch": 2348} {"train_loss": -24.19207763671875, "global_step": 194964, "epoch": 2348} {"train_loss": -24.330726623535156, "global_step": 194965, "epoch": 2348} {"train_loss": -23.990904405892614, "global_step": 194966, "epoch": 2348, "val_loss": 6563455.0} {"train_loss": -23.532957077026367, "global_step": 194967, "epoch": 2349} {"train_loss": -23.589452743530273, "global_step": 194968, "epoch": 2349} {"train_loss": -23.82826042175293, "global_step": 194969, "epoch": 2349} {"train_loss": -24.039846420288086, "global_step": 194970, "epoch": 2349} {"train_loss": -23.46492576599121, "global_step": 194971, "epoch": 2349} {"train_loss": -23.76449966430664, "global_step": 194972, "epoch": 2349} {"train_loss": -23.935869216918945, "global_step": 194973, "epoch": 2349} {"train_loss": -23.95466423034668, "global_step": 194974, "epoch": 2349} {"train_loss": -24.027624130249023, "global_step": 194975, "epoch": 2349} {"train_loss": -23.587400436401367, "global_step": 194976, "epoch": 2349} {"train_loss": -24.038118362426758, "global_step": 194977, "epoch": 2349} {"train_loss": -23.665903091430664, "global_step": 194978, "epoch": 2349} {"train_loss": -24.261783599853516, "global_step": 194979, "epoch": 2349} {"train_loss": -24.06558609008789, "global_step": 194980, "epoch": 2349} {"train_loss": -23.992046356201172, "global_step": 194981, "epoch": 2349} {"train_loss": -24.248310089111328, "global_step": 194982, "epoch": 2349} {"train_loss": -24.161191940307617, "global_step": 194983, "epoch": 2349} {"train_loss": -24.019550323486328, "global_step": 194984, "epoch": 2349} {"train_loss": -24.014699935913086, "global_step": 194985, "epoch": 2349} {"train_loss": -24.028520584106445, "global_step": 194986, "epoch": 2349} {"train_loss": -24.113956451416016, "global_step": 194987, "epoch": 2349} {"train_loss": -24.444272994995117, "global_step": 194988, "epoch": 2349} {"train_loss": -24.072782516479492, "global_step": 194989, "epoch": 2349} {"train_loss": -24.098997116088867, "global_step": 194990, "epoch": 2349} {"train_loss": -24.170284271240234, "global_step": 194991, "epoch": 2349} {"train_loss": -24.06620216369629, "global_step": 194992, "epoch": 2349} {"train_loss": -24.223173141479492, "global_step": 194993, "epoch": 2349} {"train_loss": -24.051477432250977, "global_step": 194994, "epoch": 2349} {"train_loss": -24.25527000427246, "global_step": 194995, "epoch": 2349} {"train_loss": -24.6828556060791, "global_step": 194996, "epoch": 2349} {"train_loss": -24.70363426208496, "global_step": 194997, "epoch": 2349} {"train_loss": -24.212905883789062, "global_step": 194998, "epoch": 2349} {"train_loss": -24.08762550354004, "global_step": 194999, "epoch": 2349} {"train_loss": -24.60504722595215, "global_step": 195000, "epoch": 2349} {"train_loss": -24.393869400024414, "global_step": 195001, "epoch": 2349} {"train_loss": -24.161901473999023, "global_step": 195002, "epoch": 2349} {"train_loss": -24.329898834228516, "global_step": 195003, "epoch": 2349} {"train_loss": -24.17368507385254, "global_step": 195004, "epoch": 2349} {"train_loss": -24.1123046875, "global_step": 195005, "epoch": 2349} {"train_loss": -24.60651969909668, "global_step": 195006, "epoch": 2349} {"train_loss": -24.338468551635742, "global_step": 195007, "epoch": 2349} {"train_loss": -24.095661163330078, "global_step": 195008, "epoch": 2349} {"train_loss": -24.187108993530273, "global_step": 195009, "epoch": 2349} {"train_loss": -24.462522506713867, "global_step": 195010, "epoch": 2349} {"train_loss": -24.414623260498047, "global_step": 195011, "epoch": 2349} {"train_loss": -24.541305541992188, "global_step": 195012, "epoch": 2349} {"train_loss": -24.37977409362793, "global_step": 195013, "epoch": 2349} {"train_loss": -24.764602661132812, "global_step": 195014, "epoch": 2349} {"train_loss": -24.360517501831055, "global_step": 195015, "epoch": 2349} {"train_loss": -24.121763229370117, "global_step": 195016, "epoch": 2349} {"train_loss": -24.666906356811523, "global_step": 195017, "epoch": 2349} {"train_loss": -24.250478744506836, "global_step": 195018, "epoch": 2349} {"train_loss": -24.25380516052246, "global_step": 195019, "epoch": 2349} {"train_loss": -23.90773582458496, "global_step": 195020, "epoch": 2349} {"train_loss": -23.86130142211914, "global_step": 195021, "epoch": 2349} {"train_loss": -23.701452255249023, "global_step": 195022, "epoch": 2349} {"train_loss": -24.03057098388672, "global_step": 195023, "epoch": 2349} {"train_loss": -23.262977600097656, "global_step": 195024, "epoch": 2349} {"train_loss": -23.921607971191406, "global_step": 195025, "epoch": 2349} {"train_loss": -24.257123947143555, "global_step": 195026, "epoch": 2349} {"train_loss": -24.09657859802246, "global_step": 195027, "epoch": 2349} {"train_loss": -23.761730194091797, "global_step": 195028, "epoch": 2349} {"train_loss": -23.878807067871094, "global_step": 195029, "epoch": 2349} {"train_loss": -23.74239158630371, "global_step": 195030, "epoch": 2349} {"train_loss": -24.358930587768555, "global_step": 195031, "epoch": 2349} {"train_loss": -23.89156150817871, "global_step": 195032, "epoch": 2349} {"train_loss": -24.101703643798828, "global_step": 195033, "epoch": 2349} {"train_loss": -24.033430099487305, "global_step": 195034, "epoch": 2349} {"train_loss": -24.14729118347168, "global_step": 195035, "epoch": 2349} {"train_loss": -23.97565269470215, "global_step": 195036, "epoch": 2349} {"train_loss": -24.054441452026367, "global_step": 195037, "epoch": 2349} {"train_loss": -24.009885787963867, "global_step": 195038, "epoch": 2349} {"train_loss": -24.077529907226562, "global_step": 195039, "epoch": 2349} {"train_loss": -24.31010627746582, "global_step": 195040, "epoch": 2349} {"train_loss": -23.906259536743164, "global_step": 195041, "epoch": 2349} {"train_loss": -24.18442726135254, "global_step": 195042, "epoch": 2349} {"train_loss": -24.02425193786621, "global_step": 195043, "epoch": 2349} {"train_loss": -23.883811950683594, "global_step": 195044, "epoch": 2349} {"train_loss": -24.111921310424805, "global_step": 195045, "epoch": 2349} {"train_loss": -23.904804229736328, "global_step": 195046, "epoch": 2349} {"train_loss": -24.07027244567871, "global_step": 195047, "epoch": 2349} {"train_loss": -24.35262107849121, "global_step": 195048, "epoch": 2349} {"train_loss": -24.1060957161777, "global_step": 195049, "epoch": 2349, "val_loss": 6456370.0} {"train_loss": -23.837451934814453, "global_step": 195050, "epoch": 2350} {"train_loss": -23.567258834838867, "global_step": 195051, "epoch": 2350} {"train_loss": -23.998594284057617, "global_step": 195052, "epoch": 2350} {"train_loss": -23.59769630432129, "global_step": 195053, "epoch": 2350} {"train_loss": -23.757787704467773, "global_step": 195054, "epoch": 2350} {"train_loss": -23.58135414123535, "global_step": 195055, "epoch": 2350} {"train_loss": -23.92023277282715, "global_step": 195056, "epoch": 2350} {"train_loss": -24.120737075805664, "global_step": 195057, "epoch": 2350} {"train_loss": -23.657222747802734, "global_step": 195058, "epoch": 2350} {"train_loss": -23.62590980529785, "global_step": 195059, "epoch": 2350} {"train_loss": -24.140607833862305, "global_step": 195060, "epoch": 2350} {"train_loss": -24.255102157592773, "global_step": 195061, "epoch": 2350} {"train_loss": -24.004581451416016, "global_step": 195062, "epoch": 2350} {"train_loss": -24.423622131347656, "global_step": 195063, "epoch": 2350} {"train_loss": -24.161169052124023, "global_step": 195064, "epoch": 2350} {"train_loss": -24.028783798217773, "global_step": 195065, "epoch": 2350} {"train_loss": -24.06599998474121, "global_step": 195066, "epoch": 2350} {"train_loss": -24.108884811401367, "global_step": 195067, "epoch": 2350} {"train_loss": -24.101858139038086, "global_step": 195068, "epoch": 2350} {"train_loss": -24.373132705688477, "global_step": 195069, "epoch": 2350} {"train_loss": -24.21062469482422, "global_step": 195070, "epoch": 2350} {"train_loss": -24.003158569335938, "global_step": 195071, "epoch": 2350} {"train_loss": -24.245635986328125, "global_step": 195072, "epoch": 2350} {"train_loss": -24.32532501220703, "global_step": 195073, "epoch": 2350} {"train_loss": -24.224424362182617, "global_step": 195074, "epoch": 2350} {"train_loss": -24.2229061126709, "global_step": 195075, "epoch": 2350} {"train_loss": -24.078083038330078, "global_step": 195076, "epoch": 2350} {"train_loss": -24.329687118530273, "global_step": 195077, "epoch": 2350} {"train_loss": -24.156415939331055, "global_step": 195078, "epoch": 2350} {"train_loss": -24.132587432861328, "global_step": 195079, "epoch": 2350} {"train_loss": -23.993759155273438, "global_step": 195080, "epoch": 2350} {"train_loss": -24.151443481445312, "global_step": 195081, "epoch": 2350} {"train_loss": -24.429492950439453, "global_step": 195082, "epoch": 2350} {"train_loss": -24.123565673828125, "global_step": 195083, "epoch": 2350} {"train_loss": -24.18014907836914, "global_step": 195084, "epoch": 2350} {"train_loss": -24.310806274414062, "global_step": 195085, "epoch": 2350} {"train_loss": -23.896554946899414, "global_step": 195086, "epoch": 2350} {"train_loss": -24.161787033081055, "global_step": 195087, "epoch": 2350} {"train_loss": -23.92328643798828, "global_step": 195088, "epoch": 2350} {"train_loss": -24.012582778930664, "global_step": 195089, "epoch": 2350} {"train_loss": -24.207361221313477, "global_step": 195090, "epoch": 2350} {"train_loss": -23.63165283203125, "global_step": 195091, "epoch": 2350} {"train_loss": -24.112247467041016, "global_step": 195092, "epoch": 2350} {"train_loss": -24.020511627197266, "global_step": 195093, "epoch": 2350} {"train_loss": -24.34775733947754, "global_step": 195094, "epoch": 2350} {"train_loss": -24.039752960205078, "global_step": 195095, "epoch": 2350} {"train_loss": -24.046157836914062, "global_step": 195096, "epoch": 2350} {"train_loss": -24.009899139404297, "global_step": 195097, "epoch": 2350} {"train_loss": -24.314088821411133, "global_step": 195098, "epoch": 2350} {"train_loss": -24.245634078979492, "global_step": 195099, "epoch": 2350} {"train_loss": -24.077817916870117, "global_step": 195100, "epoch": 2350} {"train_loss": -24.3150634765625, "global_step": 195101, "epoch": 2350} {"train_loss": -24.080148696899414, "global_step": 195102, "epoch": 2350} {"train_loss": -23.729957580566406, "global_step": 195103, "epoch": 2350} {"train_loss": -24.204023361206055, "global_step": 195104, "epoch": 2350} {"train_loss": -24.755651473999023, "global_step": 195105, "epoch": 2350} {"train_loss": -24.36410903930664, "global_step": 195106, "epoch": 2350} {"train_loss": -24.422182083129883, "global_step": 195107, "epoch": 2350} {"train_loss": -24.327499389648438, "global_step": 195108, "epoch": 2350} {"train_loss": -24.123018264770508, "global_step": 195109, "epoch": 2350} {"train_loss": -24.240474700927734, "global_step": 195110, "epoch": 2350} {"train_loss": -24.083974838256836, "global_step": 195111, "epoch": 2350} {"train_loss": -24.155771255493164, "global_step": 195112, "epoch": 2350} {"train_loss": -24.45307731628418, "global_step": 195113, "epoch": 2350} {"train_loss": -24.36174964904785, "global_step": 195114, "epoch": 2350} {"train_loss": -24.372562408447266, "global_step": 195115, "epoch": 2350} {"train_loss": -24.222110748291016, "global_step": 195116, "epoch": 2350} {"train_loss": -24.154756546020508, "global_step": 195117, "epoch": 2350} {"train_loss": -24.157529830932617, "global_step": 195118, "epoch": 2350} {"train_loss": -24.043554306030273, "global_step": 195119, "epoch": 2350} {"train_loss": -24.323667526245117, "global_step": 195120, "epoch": 2350} {"train_loss": -24.16188621520996, "global_step": 195121, "epoch": 2350} {"train_loss": -23.80878257751465, "global_step": 195122, "epoch": 2350} {"train_loss": -23.63958168029785, "global_step": 195123, "epoch": 2350} {"train_loss": -23.69338035583496, "global_step": 195124, "epoch": 2350} {"train_loss": -24.151229858398438, "global_step": 195125, "epoch": 2350} {"train_loss": -23.87459945678711, "global_step": 195126, "epoch": 2350} {"train_loss": -23.8983211517334, "global_step": 195127, "epoch": 2350} {"train_loss": -24.38258171081543, "global_step": 195128, "epoch": 2350} {"train_loss": -24.157194137573242, "global_step": 195129, "epoch": 2350} {"train_loss": -23.934202194213867, "global_step": 195130, "epoch": 2350} {"train_loss": -23.870397567749023, "global_step": 195131, "epoch": 2350} {"train_loss": -24.097808194447712, "global_step": 195132, "epoch": 2350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 1.0, "val_loss": 6360632.0} {"train_loss": -21.254423141479492, "global_step": 195133, "epoch": 2351} {"train_loss": -21.885847091674805, "global_step": 195134, "epoch": 2351} {"train_loss": -22.75188636779785, "global_step": 195135, "epoch": 2351} {"train_loss": -22.447067260742188, "global_step": 195136, "epoch": 2351} {"train_loss": -22.176366806030273, "global_step": 195137, "epoch": 2351} {"train_loss": -23.370269775390625, "global_step": 195138, "epoch": 2351} {"train_loss": -23.1834659576416, "global_step": 195139, "epoch": 2351} {"train_loss": -23.28396987915039, "global_step": 195140, "epoch": 2351} {"train_loss": -23.35537338256836, "global_step": 195141, "epoch": 2351} {"train_loss": -23.080795288085938, "global_step": 195142, "epoch": 2351} {"train_loss": -23.477197647094727, "global_step": 195143, "epoch": 2351} {"train_loss": -23.03753662109375, "global_step": 195144, "epoch": 2351} {"train_loss": -23.044265747070312, "global_step": 195145, "epoch": 2351} {"train_loss": -23.35199737548828, "global_step": 195146, "epoch": 2351} {"train_loss": -23.582788467407227, "global_step": 195147, "epoch": 2351} {"train_loss": -23.991613388061523, "global_step": 195148, "epoch": 2351} {"train_loss": -23.232059478759766, "global_step": 195149, "epoch": 2351} {"train_loss": -23.865440368652344, "global_step": 195150, "epoch": 2351} {"train_loss": -23.3156795501709, "global_step": 195151, "epoch": 2351} {"train_loss": -23.632856369018555, "global_step": 195152, "epoch": 2351} {"train_loss": -23.801176071166992, "global_step": 195153, "epoch": 2351} {"train_loss": -24.04725456237793, "global_step": 195154, "epoch": 2351} {"train_loss": -23.909378051757812, "global_step": 195155, "epoch": 2351} {"train_loss": -23.676137924194336, "global_step": 195156, "epoch": 2351} {"train_loss": -23.811450958251953, "global_step": 195157, "epoch": 2351} {"train_loss": -23.69416618347168, "global_step": 195158, "epoch": 2351} {"train_loss": -23.610300064086914, "global_step": 195159, "epoch": 2351} {"train_loss": -23.729310989379883, "global_step": 195160, "epoch": 2351} {"train_loss": -23.732505798339844, "global_step": 195161, "epoch": 2351} {"train_loss": -23.494064331054688, "global_step": 195162, "epoch": 2351} {"train_loss": -23.925962448120117, "global_step": 195163, "epoch": 2351} {"train_loss": -23.872785568237305, "global_step": 195164, "epoch": 2351} {"train_loss": -24.34845542907715, "global_step": 195165, "epoch": 2351} {"train_loss": -24.089109420776367, "global_step": 195166, "epoch": 2351} {"train_loss": -24.38144302368164, "global_step": 195167, "epoch": 2351} {"train_loss": -23.789278030395508, "global_step": 195168, "epoch": 2351} {"train_loss": -24.24445915222168, "global_step": 195169, "epoch": 2351} {"train_loss": -23.975797653198242, "global_step": 195170, "epoch": 2351} {"train_loss": -24.072463989257812, "global_step": 195171, "epoch": 2351} {"train_loss": -24.2127628326416, "global_step": 195172, "epoch": 2351} {"train_loss": -24.291959762573242, "global_step": 195173, "epoch": 2351} {"train_loss": -24.33334732055664, "global_step": 195174, "epoch": 2351} {"train_loss": -24.119869232177734, "global_step": 195175, "epoch": 2351} {"train_loss": -24.227155685424805, "global_step": 195176, "epoch": 2351} {"train_loss": -24.4195613861084, "global_step": 195177, "epoch": 2351} {"train_loss": -24.04227066040039, "global_step": 195178, "epoch": 2351} {"train_loss": -24.090194702148438, "global_step": 195179, "epoch": 2351} {"train_loss": -24.23026466369629, "global_step": 195180, "epoch": 2351} {"train_loss": -24.37823486328125, "global_step": 195181, "epoch": 2351} {"train_loss": -24.101064682006836, "global_step": 195182, "epoch": 2351} {"train_loss": -24.12775993347168, "global_step": 195183, "epoch": 2351} {"train_loss": -24.636117935180664, "global_step": 195184, "epoch": 2351} {"train_loss": -24.086441040039062, "global_step": 195185, "epoch": 2351} {"train_loss": -24.144704818725586, "global_step": 195186, "epoch": 2351} {"train_loss": -23.813690185546875, "global_step": 195187, "epoch": 2351} {"train_loss": -24.2702579498291, "global_step": 195188, "epoch": 2351} {"train_loss": -24.393905639648438, "global_step": 195189, "epoch": 2351} {"train_loss": -24.34050941467285, "global_step": 195190, "epoch": 2351} {"train_loss": -24.111474990844727, "global_step": 195191, "epoch": 2351} {"train_loss": -24.627119064331055, "global_step": 195192, "epoch": 2351} {"train_loss": -24.00937271118164, "global_step": 195193, "epoch": 2351} {"train_loss": -24.461191177368164, "global_step": 195194, "epoch": 2351} {"train_loss": -24.420351028442383, "global_step": 195195, "epoch": 2351} {"train_loss": -24.505277633666992, "global_step": 195196, "epoch": 2351} {"train_loss": -24.060056686401367, "global_step": 195197, "epoch": 2351} {"train_loss": -24.33021354675293, "global_step": 195198, "epoch": 2351} {"train_loss": -24.061548233032227, "global_step": 195199, "epoch": 2351} {"train_loss": -23.885602951049805, "global_step": 195200, "epoch": 2351} {"train_loss": -24.129743576049805, "global_step": 195201, "epoch": 2351} {"train_loss": -24.480939865112305, "global_step": 195202, "epoch": 2351} {"train_loss": -24.221256256103516, "global_step": 195203, "epoch": 2351} {"train_loss": -23.999164581298828, "global_step": 195204, "epoch": 2351} {"train_loss": -24.054697036743164, "global_step": 195205, "epoch": 2351} {"train_loss": -24.154409408569336, "global_step": 195206, "epoch": 2351} {"train_loss": -24.148054122924805, "global_step": 195207, "epoch": 2351} {"train_loss": -24.063831329345703, "global_step": 195208, "epoch": 2351} {"train_loss": -24.58260726928711, "global_step": 195209, "epoch": 2351} {"train_loss": -24.205875396728516, "global_step": 195210, "epoch": 2351} {"train_loss": -24.41312026977539, "global_step": 195211, "epoch": 2351} {"train_loss": -24.381587982177734, "global_step": 195212, "epoch": 2351} {"train_loss": -24.307737350463867, "global_step": 195213, "epoch": 2351} {"train_loss": -24.18825340270996, "global_step": 195214, "epoch": 2351} {"train_loss": -23.870760354651026, "global_step": 195215, "epoch": 2351, "val_loss": 6512537.0} {"train_loss": -23.726398468017578, "global_step": 195216, "epoch": 2352} {"train_loss": -23.855838775634766, "global_step": 195217, "epoch": 2352} {"train_loss": -24.094074249267578, "global_step": 195218, "epoch": 2352} {"train_loss": -23.764528274536133, "global_step": 195219, "epoch": 2352} {"train_loss": -23.598224639892578, "global_step": 195220, "epoch": 2352} {"train_loss": -23.75031852722168, "global_step": 195221, "epoch": 2352} {"train_loss": -23.975711822509766, "global_step": 195222, "epoch": 2352} {"train_loss": -23.92059326171875, "global_step": 195223, "epoch": 2352} {"train_loss": -24.1468448638916, "global_step": 195224, "epoch": 2352} {"train_loss": -23.886295318603516, "global_step": 195225, "epoch": 2352} {"train_loss": -23.96050453186035, "global_step": 195226, "epoch": 2352} {"train_loss": -24.052406311035156, "global_step": 195227, "epoch": 2352} {"train_loss": -24.32368278503418, "global_step": 195228, "epoch": 2352} {"train_loss": -23.925260543823242, "global_step": 195229, "epoch": 2352} {"train_loss": -24.319921493530273, "global_step": 195230, "epoch": 2352} {"train_loss": -23.82730484008789, "global_step": 195231, "epoch": 2352} {"train_loss": -23.9710693359375, "global_step": 195232, "epoch": 2352} {"train_loss": -23.510778427124023, "global_step": 195233, "epoch": 2352} {"train_loss": -23.989334106445312, "global_step": 195234, "epoch": 2352} {"train_loss": -24.0408992767334, "global_step": 195235, "epoch": 2352} {"train_loss": -24.164188385009766, "global_step": 195236, "epoch": 2352} {"train_loss": -24.37994956970215, "global_step": 195237, "epoch": 2352} {"train_loss": -24.122282028198242, "global_step": 195238, "epoch": 2352} {"train_loss": -24.208026885986328, "global_step": 195239, "epoch": 2352} {"train_loss": -24.35919952392578, "global_step": 195240, "epoch": 2352} {"train_loss": -23.789798736572266, "global_step": 195241, "epoch": 2352} {"train_loss": -24.463993072509766, "global_step": 195242, "epoch": 2352} {"train_loss": -23.834619522094727, "global_step": 195243, "epoch": 2352} {"train_loss": -24.49233055114746, "global_step": 195244, "epoch": 2352} {"train_loss": -24.27583885192871, "global_step": 195245, "epoch": 2352} {"train_loss": -24.17779541015625, "global_step": 195246, "epoch": 2352} {"train_loss": -24.03439712524414, "global_step": 195247, "epoch": 2352} {"train_loss": -24.399621963500977, "global_step": 195248, "epoch": 2352} {"train_loss": -24.210430145263672, "global_step": 195249, "epoch": 2352} {"train_loss": -23.936471939086914, "global_step": 195250, "epoch": 2352} {"train_loss": -24.192947387695312, "global_step": 195251, "epoch": 2352} {"train_loss": -24.07197380065918, "global_step": 195252, "epoch": 2352} {"train_loss": -24.41512680053711, "global_step": 195253, "epoch": 2352} {"train_loss": -24.170974731445312, "global_step": 195254, "epoch": 2352} {"train_loss": -24.208511352539062, "global_step": 195255, "epoch": 2352} {"train_loss": -24.361141204833984, "global_step": 195256, "epoch": 2352} {"train_loss": -24.482234954833984, "global_step": 195257, "epoch": 2352} {"train_loss": -24.232927322387695, "global_step": 195258, "epoch": 2352} {"train_loss": -24.35199546813965, "global_step": 195259, "epoch": 2352} {"train_loss": -24.196762084960938, "global_step": 195260, "epoch": 2352} {"train_loss": -24.23719596862793, "global_step": 195261, "epoch": 2352} {"train_loss": -24.37833595275879, "global_step": 195262, "epoch": 2352} {"train_loss": -24.17347526550293, "global_step": 195263, "epoch": 2352} {"train_loss": -24.313507080078125, "global_step": 195264, "epoch": 2352} {"train_loss": -24.135862350463867, "global_step": 195265, "epoch": 2352} {"train_loss": -24.170379638671875, "global_step": 195266, "epoch": 2352} {"train_loss": -24.44683265686035, "global_step": 195267, "epoch": 2352} {"train_loss": -24.16473388671875, "global_step": 195268, "epoch": 2352} {"train_loss": -24.449359893798828, "global_step": 195269, "epoch": 2352} {"train_loss": -24.22441864013672, "global_step": 195270, "epoch": 2352} {"train_loss": -24.272558212280273, "global_step": 195271, "epoch": 2352} {"train_loss": -24.62001609802246, "global_step": 195272, "epoch": 2352} {"train_loss": -23.919767379760742, "global_step": 195273, "epoch": 2352} {"train_loss": -23.896512985229492, "global_step": 195274, "epoch": 2352} {"train_loss": -24.33613395690918, "global_step": 195275, "epoch": 2352} {"train_loss": -24.366086959838867, "global_step": 195276, "epoch": 2352} {"train_loss": -24.242801666259766, "global_step": 195277, "epoch": 2352} {"train_loss": -24.29432487487793, "global_step": 195278, "epoch": 2352} {"train_loss": -24.0938777923584, "global_step": 195279, "epoch": 2352} {"train_loss": -24.325345993041992, "global_step": 195280, "epoch": 2352} {"train_loss": -24.69264030456543, "global_step": 195281, "epoch": 2352} {"train_loss": -24.35525894165039, "global_step": 195282, "epoch": 2352} {"train_loss": -24.3740234375, "global_step": 195283, "epoch": 2352} {"train_loss": -24.191247940063477, "global_step": 195284, "epoch": 2352} {"train_loss": -24.474611282348633, "global_step": 195285, "epoch": 2352} {"train_loss": -24.119733810424805, "global_step": 195286, "epoch": 2352} {"train_loss": -24.475473403930664, "global_step": 195287, "epoch": 2352} {"train_loss": -24.2913875579834, "global_step": 195288, "epoch": 2352} {"train_loss": -24.209613800048828, "global_step": 195289, "epoch": 2352} {"train_loss": -23.900840759277344, "global_step": 195290, "epoch": 2352} {"train_loss": -24.51336097717285, "global_step": 195291, "epoch": 2352} {"train_loss": -24.15019989013672, "global_step": 195292, "epoch": 2352} {"train_loss": -24.010543823242188, "global_step": 195293, "epoch": 2352} {"train_loss": -23.836965560913086, "global_step": 195294, "epoch": 2352} {"train_loss": -23.924760818481445, "global_step": 195295, "epoch": 2352} {"train_loss": -24.49237060546875, "global_step": 195296, "epoch": 2352} {"train_loss": -24.07982063293457, "global_step": 195297, "epoch": 2352} {"train_loss": -24.163269226809582, "global_step": 195298, "epoch": 2352, "val_loss": 6538225.0} {"train_loss": -23.445966720581055, "global_step": 195299, "epoch": 2353} {"train_loss": -23.866872787475586, "global_step": 195300, "epoch": 2353} {"train_loss": -23.469390869140625, "global_step": 195301, "epoch": 2353} {"train_loss": -23.799713134765625, "global_step": 195302, "epoch": 2353} {"train_loss": -23.497854232788086, "global_step": 195303, "epoch": 2353} {"train_loss": -23.85417366027832, "global_step": 195304, "epoch": 2353} {"train_loss": -23.37894058227539, "global_step": 195305, "epoch": 2353} {"train_loss": -23.65909767150879, "global_step": 195306, "epoch": 2353} {"train_loss": -23.769384384155273, "global_step": 195307, "epoch": 2353} {"train_loss": -23.821104049682617, "global_step": 195308, "epoch": 2353} {"train_loss": -23.488142013549805, "global_step": 195309, "epoch": 2353} {"train_loss": -24.01412010192871, "global_step": 195310, "epoch": 2353} {"train_loss": -23.96872901916504, "global_step": 195311, "epoch": 2353} {"train_loss": -23.937299728393555, "global_step": 195312, "epoch": 2353} {"train_loss": -23.777448654174805, "global_step": 195313, "epoch": 2353} {"train_loss": -24.217426300048828, "global_step": 195314, "epoch": 2353} {"train_loss": -23.68363380432129, "global_step": 195315, "epoch": 2353} {"train_loss": -23.690032958984375, "global_step": 195316, "epoch": 2353} {"train_loss": -23.743328094482422, "global_step": 195317, "epoch": 2353} {"train_loss": -23.938343048095703, "global_step": 195318, "epoch": 2353} {"train_loss": -23.850936889648438, "global_step": 195319, "epoch": 2353} {"train_loss": -24.000654220581055, "global_step": 195320, "epoch": 2353} {"train_loss": -24.06080436706543, "global_step": 195321, "epoch": 2353} {"train_loss": -23.921371459960938, "global_step": 195322, "epoch": 2353} {"train_loss": -23.882125854492188, "global_step": 195323, "epoch": 2353} {"train_loss": -24.072891235351562, "global_step": 195324, "epoch": 2353} {"train_loss": -23.671693801879883, "global_step": 195325, "epoch": 2353} {"train_loss": -23.892929077148438, "global_step": 195326, "epoch": 2353} {"train_loss": -24.048858642578125, "global_step": 195327, "epoch": 2353} {"train_loss": -24.218496322631836, "global_step": 195328, "epoch": 2353} {"train_loss": -24.250751495361328, "global_step": 195329, "epoch": 2353} {"train_loss": -23.794879913330078, "global_step": 195330, "epoch": 2353} {"train_loss": -24.345136642456055, "global_step": 195331, "epoch": 2353} {"train_loss": -24.353458404541016, "global_step": 195332, "epoch": 2353} {"train_loss": -24.405981063842773, "global_step": 195333, "epoch": 2353} {"train_loss": -24.016550064086914, "global_step": 195334, "epoch": 2353} {"train_loss": -24.38897132873535, "global_step": 195335, "epoch": 2353} {"train_loss": -24.027793884277344, "global_step": 195336, "epoch": 2353} {"train_loss": -24.0018310546875, "global_step": 195337, "epoch": 2353} {"train_loss": -24.019662857055664, "global_step": 195338, "epoch": 2353} {"train_loss": -24.284177780151367, "global_step": 195339, "epoch": 2353} {"train_loss": -24.508934020996094, "global_step": 195340, "epoch": 2353} {"train_loss": -24.258852005004883, "global_step": 195341, "epoch": 2353} {"train_loss": -23.471576690673828, "global_step": 195342, "epoch": 2353} {"train_loss": -23.857702255249023, "global_step": 195343, "epoch": 2353} {"train_loss": -24.199392318725586, "global_step": 195344, "epoch": 2353} {"train_loss": -23.95033836364746, "global_step": 195345, "epoch": 2353} {"train_loss": -24.33131980895996, "global_step": 195346, "epoch": 2353} {"train_loss": -24.055679321289062, "global_step": 195347, "epoch": 2353} {"train_loss": -24.232559204101562, "global_step": 195348, "epoch": 2353} {"train_loss": -23.98789405822754, "global_step": 195349, "epoch": 2353} {"train_loss": -24.53898048400879, "global_step": 195350, "epoch": 2353} {"train_loss": -24.05600357055664, "global_step": 195351, "epoch": 2353} {"train_loss": -24.18608856201172, "global_step": 195352, "epoch": 2353} {"train_loss": -24.21843910217285, "global_step": 195353, "epoch": 2353} {"train_loss": -24.486896514892578, "global_step": 195354, "epoch": 2353} {"train_loss": -24.122119903564453, "global_step": 195355, "epoch": 2353} {"train_loss": -24.487852096557617, "global_step": 195356, "epoch": 2353} {"train_loss": -24.079730987548828, "global_step": 195357, "epoch": 2353} {"train_loss": -24.573911666870117, "global_step": 195358, "epoch": 2353} {"train_loss": -24.63795280456543, "global_step": 195359, "epoch": 2353} {"train_loss": -24.03664779663086, "global_step": 195360, "epoch": 2353} {"train_loss": -24.098636627197266, "global_step": 195361, "epoch": 2353} {"train_loss": -24.35479736328125, "global_step": 195362, "epoch": 2353} {"train_loss": -24.20001792907715, "global_step": 195363, "epoch": 2353} {"train_loss": -24.465015411376953, "global_step": 195364, "epoch": 2353} {"train_loss": -24.312986373901367, "global_step": 195365, "epoch": 2353} {"train_loss": -23.996429443359375, "global_step": 195366, "epoch": 2353} {"train_loss": -23.96718406677246, "global_step": 195367, "epoch": 2353} {"train_loss": -24.34097671508789, "global_step": 195368, "epoch": 2353} {"train_loss": -23.857542037963867, "global_step": 195369, "epoch": 2353} {"train_loss": -23.816556930541992, "global_step": 195370, "epoch": 2353} {"train_loss": -23.57506561279297, "global_step": 195371, "epoch": 2353} {"train_loss": -23.8782958984375, "global_step": 195372, "epoch": 2353} {"train_loss": -23.880006790161133, "global_step": 195373, "epoch": 2353} {"train_loss": -24.065692901611328, "global_step": 195374, "epoch": 2353} {"train_loss": -23.525562286376953, "global_step": 195375, "epoch": 2353} {"train_loss": -24.38692283630371, "global_step": 195376, "epoch": 2353} {"train_loss": -23.97852325439453, "global_step": 195377, "epoch": 2353} {"train_loss": -23.902128219604492, "global_step": 195378, "epoch": 2353} {"train_loss": -23.9737491607666, "global_step": 195379, "epoch": 2353} {"train_loss": -24.39194107055664, "global_step": 195380, "epoch": 2353} {"train_loss": -24.02162554177893, "global_step": 195381, "epoch": 2353, "val_loss": 6516976.0} {"train_loss": -23.467788696289062, "global_step": 195382, "epoch": 2354} {"train_loss": -22.43967628479004, "global_step": 195383, "epoch": 2354} {"train_loss": -22.929616928100586, "global_step": 195384, "epoch": 2354} {"train_loss": -23.370834350585938, "global_step": 195385, "epoch": 2354} {"train_loss": -23.035083770751953, "global_step": 195386, "epoch": 2354} {"train_loss": -23.41632652282715, "global_step": 195387, "epoch": 2354} {"train_loss": -23.6346435546875, "global_step": 195388, "epoch": 2354} {"train_loss": -23.04590606689453, "global_step": 195389, "epoch": 2354} {"train_loss": -23.491498947143555, "global_step": 195390, "epoch": 2354} {"train_loss": -23.50038719177246, "global_step": 195391, "epoch": 2354} {"train_loss": -23.322202682495117, "global_step": 195392, "epoch": 2354} {"train_loss": -23.38627052307129, "global_step": 195393, "epoch": 2354} {"train_loss": -23.207380294799805, "global_step": 195394, "epoch": 2354} {"train_loss": -23.345033645629883, "global_step": 195395, "epoch": 2354} {"train_loss": -23.570741653442383, "global_step": 195396, "epoch": 2354} {"train_loss": -23.56342887878418, "global_step": 195397, "epoch": 2354} {"train_loss": -23.574169158935547, "global_step": 195398, "epoch": 2354} {"train_loss": -23.520780563354492, "global_step": 195399, "epoch": 2354} {"train_loss": -23.703611373901367, "global_step": 195400, "epoch": 2354} {"train_loss": -23.801862716674805, "global_step": 195401, "epoch": 2354} {"train_loss": -23.500755310058594, "global_step": 195402, "epoch": 2354} {"train_loss": -23.544605255126953, "global_step": 195403, "epoch": 2354} {"train_loss": -23.822799682617188, "global_step": 195404, "epoch": 2354} {"train_loss": -23.445302963256836, "global_step": 195405, "epoch": 2354} {"train_loss": -23.681991577148438, "global_step": 195406, "epoch": 2354} {"train_loss": -24.021163940429688, "global_step": 195407, "epoch": 2354} {"train_loss": -23.71647071838379, "global_step": 195408, "epoch": 2354} {"train_loss": -23.78759765625, "global_step": 195409, "epoch": 2354} {"train_loss": -23.803770065307617, "global_step": 195410, "epoch": 2354} {"train_loss": -23.533475875854492, "global_step": 195411, "epoch": 2354} {"train_loss": -23.679824829101562, "global_step": 195412, "epoch": 2354} {"train_loss": -23.888748168945312, "global_step": 195413, "epoch": 2354} {"train_loss": -24.0682373046875, "global_step": 195414, "epoch": 2354} {"train_loss": -23.638526916503906, "global_step": 195415, "epoch": 2354} {"train_loss": -24.28485679626465, "global_step": 195416, "epoch": 2354} {"train_loss": -24.15835952758789, "global_step": 195417, "epoch": 2354} {"train_loss": -24.18503761291504, "global_step": 195418, "epoch": 2354} {"train_loss": -24.2372989654541, "global_step": 195419, "epoch": 2354} {"train_loss": -24.251169204711914, "global_step": 195420, "epoch": 2354} {"train_loss": -23.529775619506836, "global_step": 195421, "epoch": 2354} {"train_loss": -24.15252113342285, "global_step": 195422, "epoch": 2354} {"train_loss": -24.273099899291992, "global_step": 195423, "epoch": 2354} {"train_loss": -24.186176300048828, "global_step": 195424, "epoch": 2354} {"train_loss": -24.29237174987793, "global_step": 195425, "epoch": 2354} {"train_loss": -24.225881576538086, "global_step": 195426, "epoch": 2354} {"train_loss": -24.6384220123291, "global_step": 195427, "epoch": 2354} {"train_loss": -24.337255477905273, "global_step": 195428, "epoch": 2354} {"train_loss": -24.342723846435547, "global_step": 195429, "epoch": 2354} {"train_loss": -24.110063552856445, "global_step": 195430, "epoch": 2354} {"train_loss": -24.50996971130371, "global_step": 195431, "epoch": 2354} {"train_loss": -24.251615524291992, "global_step": 195432, "epoch": 2354} {"train_loss": -24.200407028198242, "global_step": 195433, "epoch": 2354} {"train_loss": -24.238298416137695, "global_step": 195434, "epoch": 2354} {"train_loss": -24.237844467163086, "global_step": 195435, "epoch": 2354} {"train_loss": -24.336063385009766, "global_step": 195436, "epoch": 2354} {"train_loss": -24.31981086730957, "global_step": 195437, "epoch": 2354} {"train_loss": -24.090681076049805, "global_step": 195438, "epoch": 2354} {"train_loss": -24.48929786682129, "global_step": 195439, "epoch": 2354} {"train_loss": -24.742841720581055, "global_step": 195440, "epoch": 2354} {"train_loss": -24.101774215698242, "global_step": 195441, "epoch": 2354} {"train_loss": -24.16596031188965, "global_step": 195442, "epoch": 2354} {"train_loss": -24.07720375061035, "global_step": 195443, "epoch": 2354} {"train_loss": -24.46959114074707, "global_step": 195444, "epoch": 2354} {"train_loss": -24.496145248413086, "global_step": 195445, "epoch": 2354} {"train_loss": -24.646541595458984, "global_step": 195446, "epoch": 2354} {"train_loss": -23.87746238708496, "global_step": 195447, "epoch": 2354} {"train_loss": -24.29412269592285, "global_step": 195448, "epoch": 2354} {"train_loss": -24.619108200073242, "global_step": 195449, "epoch": 2354} {"train_loss": -23.917543411254883, "global_step": 195450, "epoch": 2354} {"train_loss": -24.48240852355957, "global_step": 195451, "epoch": 2354} {"train_loss": -24.343236923217773, "global_step": 195452, "epoch": 2354} {"train_loss": -24.247726440429688, "global_step": 195453, "epoch": 2354} {"train_loss": -24.268213272094727, "global_step": 195454, "epoch": 2354} {"train_loss": -24.12027931213379, "global_step": 195455, "epoch": 2354} {"train_loss": -24.557817459106445, "global_step": 195456, "epoch": 2354} {"train_loss": -24.043115615844727, "global_step": 195457, "epoch": 2354} {"train_loss": -23.760038375854492, "global_step": 195458, "epoch": 2354} {"train_loss": -23.86761474609375, "global_step": 195459, "epoch": 2354} {"train_loss": -23.74266242980957, "global_step": 195460, "epoch": 2354} {"train_loss": -24.353717803955078, "global_step": 195461, "epoch": 2354} {"train_loss": -24.466840744018555, "global_step": 195462, "epoch": 2354} {"train_loss": -24.162734985351562, "global_step": 195463, "epoch": 2354} {"train_loss": -23.937998806137635, "global_step": 195464, "epoch": 2354, "val_loss": 6474153.5} {"train_loss": -24.062217712402344, "global_step": 195465, "epoch": 2355} {"train_loss": -23.66530418395996, "global_step": 195466, "epoch": 2355} {"train_loss": -23.579578399658203, "global_step": 195467, "epoch": 2355} {"train_loss": -24.373144149780273, "global_step": 195468, "epoch": 2355} {"train_loss": -24.03224754333496, "global_step": 195469, "epoch": 2355} {"train_loss": -24.19546890258789, "global_step": 195470, "epoch": 2355} {"train_loss": -23.936086654663086, "global_step": 195471, "epoch": 2355} {"train_loss": -23.736835479736328, "global_step": 195472, "epoch": 2355} {"train_loss": -24.1048526763916, "global_step": 195473, "epoch": 2355} {"train_loss": -24.534486770629883, "global_step": 195474, "epoch": 2355} {"train_loss": -23.80106544494629, "global_step": 195475, "epoch": 2355} {"train_loss": -24.011457443237305, "global_step": 195476, "epoch": 2355} {"train_loss": -24.112070083618164, "global_step": 195477, "epoch": 2355} {"train_loss": -24.449237823486328, "global_step": 195478, "epoch": 2355} {"train_loss": -24.036516189575195, "global_step": 195479, "epoch": 2355} {"train_loss": -24.273962020874023, "global_step": 195480, "epoch": 2355} {"train_loss": -23.9083194732666, "global_step": 195481, "epoch": 2355} {"train_loss": -24.25191307067871, "global_step": 195482, "epoch": 2355} {"train_loss": -24.064672470092773, "global_step": 195483, "epoch": 2355} {"train_loss": -24.019315719604492, "global_step": 195484, "epoch": 2355} {"train_loss": -24.166738510131836, "global_step": 195485, "epoch": 2355} {"train_loss": -24.6946964263916, "global_step": 195486, "epoch": 2355} {"train_loss": -24.49353790283203, "global_step": 195487, "epoch": 2355} {"train_loss": -24.227054595947266, "global_step": 195488, "epoch": 2355} {"train_loss": -24.687490463256836, "global_step": 195489, "epoch": 2355} {"train_loss": -24.610464096069336, "global_step": 195490, "epoch": 2355} {"train_loss": -24.31863021850586, "global_step": 195491, "epoch": 2355} {"train_loss": -24.270401000976562, "global_step": 195492, "epoch": 2355} {"train_loss": -24.35664176940918, "global_step": 195493, "epoch": 2355} {"train_loss": -24.090486526489258, "global_step": 195494, "epoch": 2355} {"train_loss": -24.05191993713379, "global_step": 195495, "epoch": 2355} {"train_loss": -24.271146774291992, "global_step": 195496, "epoch": 2355} {"train_loss": -24.082721710205078, "global_step": 195497, "epoch": 2355} {"train_loss": -24.210739135742188, "global_step": 195498, "epoch": 2355} {"train_loss": -24.08718490600586, "global_step": 195499, "epoch": 2355} {"train_loss": -24.114017486572266, "global_step": 195500, "epoch": 2355} {"train_loss": -24.460599899291992, "global_step": 195501, "epoch": 2355} {"train_loss": -24.26966667175293, "global_step": 195502, "epoch": 2355} {"train_loss": -24.479902267456055, "global_step": 195503, "epoch": 2355} {"train_loss": -24.407419204711914, "global_step": 195504, "epoch": 2355} {"train_loss": -24.082815170288086, "global_step": 195505, "epoch": 2355} {"train_loss": -23.85576820373535, "global_step": 195506, "epoch": 2355} {"train_loss": -24.06954002380371, "global_step": 195507, "epoch": 2355} {"train_loss": -23.923152923583984, "global_step": 195508, "epoch": 2355} {"train_loss": -24.283239364624023, "global_step": 195509, "epoch": 2355} {"train_loss": -24.11849021911621, "global_step": 195510, "epoch": 2355} {"train_loss": -24.270490646362305, "global_step": 195511, "epoch": 2355} {"train_loss": -24.213687896728516, "global_step": 195512, "epoch": 2355} {"train_loss": -23.744237899780273, "global_step": 195513, "epoch": 2355} {"train_loss": -24.424291610717773, "global_step": 195514, "epoch": 2355} {"train_loss": -24.278324127197266, "global_step": 195515, "epoch": 2355} {"train_loss": -24.207996368408203, "global_step": 195516, "epoch": 2355} {"train_loss": -24.060482025146484, "global_step": 195517, "epoch": 2355} {"train_loss": -24.1450252532959, "global_step": 195518, "epoch": 2355} {"train_loss": -24.50916862487793, "global_step": 195519, "epoch": 2355} {"train_loss": -24.111112594604492, "global_step": 195520, "epoch": 2355} {"train_loss": -23.903568267822266, "global_step": 195521, "epoch": 2355} {"train_loss": -24.09653663635254, "global_step": 195522, "epoch": 2355} {"train_loss": -24.336002349853516, "global_step": 195523, "epoch": 2355} {"train_loss": -24.284408569335938, "global_step": 195524, "epoch": 2355} {"train_loss": -24.28412437438965, "global_step": 195525, "epoch": 2355} {"train_loss": -24.078630447387695, "global_step": 195526, "epoch": 2355} {"train_loss": -23.970680236816406, "global_step": 195527, "epoch": 2355} {"train_loss": -24.185083389282227, "global_step": 195528, "epoch": 2355} {"train_loss": -24.42853355407715, "global_step": 195529, "epoch": 2355} {"train_loss": -24.049528121948242, "global_step": 195530, "epoch": 2355} {"train_loss": -24.255765914916992, "global_step": 195531, "epoch": 2355} {"train_loss": -24.242494583129883, "global_step": 195532, "epoch": 2355} {"train_loss": -24.53696632385254, "global_step": 195533, "epoch": 2355} {"train_loss": -24.479129791259766, "global_step": 195534, "epoch": 2355} {"train_loss": -24.358484268188477, "global_step": 195535, "epoch": 2355} {"train_loss": -24.19118881225586, "global_step": 195536, "epoch": 2355} {"train_loss": -24.17157554626465, "global_step": 195537, "epoch": 2355} {"train_loss": -24.072423934936523, "global_step": 195538, "epoch": 2355} {"train_loss": -24.282901763916016, "global_step": 195539, "epoch": 2355} {"train_loss": -23.984338760375977, "global_step": 195540, "epoch": 2355} {"train_loss": -24.469100952148438, "global_step": 195541, "epoch": 2355} {"train_loss": -23.905729293823242, "global_step": 195542, "epoch": 2355} {"train_loss": -24.05409812927246, "global_step": 195543, "epoch": 2355} {"train_loss": -24.27864646911621, "global_step": 195544, "epoch": 2355} {"train_loss": -23.828161239624023, "global_step": 195545, "epoch": 2355} {"train_loss": -24.22538185119629, "global_step": 195546, "epoch": 2355} {"train_loss": -24.1921197592494, "global_step": 195547, "epoch": 2355, "val_loss": 6554195.0} {"train_loss": -23.253808975219727, "global_step": 195548, "epoch": 2356} {"train_loss": -22.920867919921875, "global_step": 195549, "epoch": 2356} {"train_loss": -23.68990135192871, "global_step": 195550, "epoch": 2356} {"train_loss": -23.269941329956055, "global_step": 195551, "epoch": 2356} {"train_loss": -23.191417694091797, "global_step": 195552, "epoch": 2356} {"train_loss": -23.65265464782715, "global_step": 195553, "epoch": 2356} {"train_loss": -23.60670280456543, "global_step": 195554, "epoch": 2356} {"train_loss": -23.697032928466797, "global_step": 195555, "epoch": 2356} {"train_loss": -23.369237899780273, "global_step": 195556, "epoch": 2356} {"train_loss": -23.867246627807617, "global_step": 195557, "epoch": 2356} {"train_loss": -23.744199752807617, "global_step": 195558, "epoch": 2356} {"train_loss": -24.058643341064453, "global_step": 195559, "epoch": 2356} {"train_loss": -23.48464012145996, "global_step": 195560, "epoch": 2356} {"train_loss": -23.763622283935547, "global_step": 195561, "epoch": 2356} {"train_loss": -23.565336227416992, "global_step": 195562, "epoch": 2356} {"train_loss": -23.82151222229004, "global_step": 195563, "epoch": 2356} {"train_loss": -23.908905029296875, "global_step": 195564, "epoch": 2356} {"train_loss": -23.970687866210938, "global_step": 195565, "epoch": 2356} {"train_loss": -23.66484832763672, "global_step": 195566, "epoch": 2356} {"train_loss": -23.888376235961914, "global_step": 195567, "epoch": 2356} {"train_loss": -23.907833099365234, "global_step": 195568, "epoch": 2356} {"train_loss": -23.992908477783203, "global_step": 195569, "epoch": 2356} {"train_loss": -23.842876434326172, "global_step": 195570, "epoch": 2356} {"train_loss": -23.955358505249023, "global_step": 195571, "epoch": 2356} {"train_loss": -23.804555892944336, "global_step": 195572, "epoch": 2356} {"train_loss": -23.806928634643555, "global_step": 195573, "epoch": 2356} {"train_loss": -23.920135498046875, "global_step": 195574, "epoch": 2356} {"train_loss": -24.267215728759766, "global_step": 195575, "epoch": 2356} {"train_loss": -24.503589630126953, "global_step": 195576, "epoch": 2356} {"train_loss": -23.9671688079834, "global_step": 195577, "epoch": 2356} {"train_loss": -23.817365646362305, "global_step": 195578, "epoch": 2356} {"train_loss": -24.123279571533203, "global_step": 195579, "epoch": 2356} {"train_loss": -23.96492576599121, "global_step": 195580, "epoch": 2356} {"train_loss": -24.20851707458496, "global_step": 195581, "epoch": 2356} {"train_loss": -24.185794830322266, "global_step": 195582, "epoch": 2356} {"train_loss": -24.335424423217773, "global_step": 195583, "epoch": 2356} {"train_loss": -24.50780487060547, "global_step": 195584, "epoch": 2356} {"train_loss": -24.22588539123535, "global_step": 195585, "epoch": 2356} {"train_loss": -24.539112091064453, "global_step": 195586, "epoch": 2356} {"train_loss": -24.11576271057129, "global_step": 195587, "epoch": 2356} {"train_loss": -24.35440444946289, "global_step": 195588, "epoch": 2356} {"train_loss": -24.310596466064453, "global_step": 195589, "epoch": 2356} {"train_loss": -24.410276412963867, "global_step": 195590, "epoch": 2356} {"train_loss": -24.739242553710938, "global_step": 195591, "epoch": 2356} {"train_loss": -24.30194091796875, "global_step": 195592, "epoch": 2356} {"train_loss": -24.188947677612305, "global_step": 195593, "epoch": 2356} {"train_loss": -24.49532127380371, "global_step": 195594, "epoch": 2356} {"train_loss": -24.159360885620117, "global_step": 195595, "epoch": 2356} {"train_loss": -24.423912048339844, "global_step": 195596, "epoch": 2356} {"train_loss": -23.897563934326172, "global_step": 195597, "epoch": 2356} {"train_loss": -24.225269317626953, "global_step": 195598, "epoch": 2356} {"train_loss": -24.469579696655273, "global_step": 195599, "epoch": 2356} {"train_loss": -24.70515251159668, "global_step": 195600, "epoch": 2356} {"train_loss": -24.03864097595215, "global_step": 195601, "epoch": 2356} {"train_loss": -24.36478614807129, "global_step": 195602, "epoch": 2356} {"train_loss": -24.170740127563477, "global_step": 195603, "epoch": 2356} {"train_loss": -24.38077735900879, "global_step": 195604, "epoch": 2356} {"train_loss": -24.29391860961914, "global_step": 195605, "epoch": 2356} {"train_loss": -24.31418800354004, "global_step": 195606, "epoch": 2356} {"train_loss": -23.848682403564453, "global_step": 195607, "epoch": 2356} {"train_loss": -24.324337005615234, "global_step": 195608, "epoch": 2356} {"train_loss": -24.062501907348633, "global_step": 195609, "epoch": 2356} {"train_loss": -24.32333755493164, "global_step": 195610, "epoch": 2356} {"train_loss": -24.59712028503418, "global_step": 195611, "epoch": 2356} {"train_loss": -24.07370948791504, "global_step": 195612, "epoch": 2356} {"train_loss": -24.221698760986328, "global_step": 195613, "epoch": 2356} {"train_loss": -24.540729522705078, "global_step": 195614, "epoch": 2356} {"train_loss": -24.22583770751953, "global_step": 195615, "epoch": 2356} {"train_loss": -23.989276885986328, "global_step": 195616, "epoch": 2356} {"train_loss": -24.110294342041016, "global_step": 195617, "epoch": 2356} {"train_loss": -24.267316818237305, "global_step": 195618, "epoch": 2356} {"train_loss": -24.10727882385254, "global_step": 195619, "epoch": 2356} {"train_loss": -23.861913681030273, "global_step": 195620, "epoch": 2356} {"train_loss": -24.09971046447754, "global_step": 195621, "epoch": 2356} {"train_loss": -24.365888595581055, "global_step": 195622, "epoch": 2356} {"train_loss": -24.06142234802246, "global_step": 195623, "epoch": 2356} {"train_loss": -24.313621520996094, "global_step": 195624, "epoch": 2356} {"train_loss": -24.324216842651367, "global_step": 195625, "epoch": 2356} {"train_loss": -24.29451560974121, "global_step": 195626, "epoch": 2356} {"train_loss": -24.243959426879883, "global_step": 195627, "epoch": 2356} {"train_loss": -24.107364654541016, "global_step": 195628, "epoch": 2356} {"train_loss": -24.304105758666992, "global_step": 195629, "epoch": 2356} {"train_loss": -24.075003911213702, "global_step": 195630, "epoch": 2356, "val_loss": 6497278.0} {"train_loss": -24.037599563598633, "global_step": 195631, "epoch": 2357} {"train_loss": -23.592578887939453, "global_step": 195632, "epoch": 2357} {"train_loss": -23.864988327026367, "global_step": 195633, "epoch": 2357} {"train_loss": -23.9029541015625, "global_step": 195634, "epoch": 2357} {"train_loss": -24.151460647583008, "global_step": 195635, "epoch": 2357} {"train_loss": -23.850461959838867, "global_step": 195636, "epoch": 2357} {"train_loss": -24.12616539001465, "global_step": 195637, "epoch": 2357} {"train_loss": -24.268877029418945, "global_step": 195638, "epoch": 2357} {"train_loss": -23.604726791381836, "global_step": 195639, "epoch": 2357} {"train_loss": -24.211944580078125, "global_step": 195640, "epoch": 2357} {"train_loss": -23.567975997924805, "global_step": 195641, "epoch": 2357} {"train_loss": -24.08619499206543, "global_step": 195642, "epoch": 2357} {"train_loss": -24.160737991333008, "global_step": 195643, "epoch": 2357} {"train_loss": -24.07291603088379, "global_step": 195644, "epoch": 2357} {"train_loss": -23.98218536376953, "global_step": 195645, "epoch": 2357} {"train_loss": -24.324222564697266, "global_step": 195646, "epoch": 2357} {"train_loss": -24.149614334106445, "global_step": 195647, "epoch": 2357} {"train_loss": -23.58211326599121, "global_step": 195648, "epoch": 2357} {"train_loss": -24.106779098510742, "global_step": 195649, "epoch": 2357} {"train_loss": -24.537567138671875, "global_step": 195650, "epoch": 2357} {"train_loss": -24.088449478149414, "global_step": 195651, "epoch": 2357} {"train_loss": -24.386337280273438, "global_step": 195652, "epoch": 2357} {"train_loss": -24.3060302734375, "global_step": 195653, "epoch": 2357} {"train_loss": -24.040048599243164, "global_step": 195654, "epoch": 2357} {"train_loss": -23.941728591918945, "global_step": 195655, "epoch": 2357} {"train_loss": -24.137353897094727, "global_step": 195656, "epoch": 2357} {"train_loss": -24.298816680908203, "global_step": 195657, "epoch": 2357} {"train_loss": -23.942005157470703, "global_step": 195658, "epoch": 2357} {"train_loss": -24.20907974243164, "global_step": 195659, "epoch": 2357} {"train_loss": -24.09686279296875, "global_step": 195660, "epoch": 2357} {"train_loss": -24.34014129638672, "global_step": 195661, "epoch": 2357} {"train_loss": -24.51094627380371, "global_step": 195662, "epoch": 2357} {"train_loss": -24.177183151245117, "global_step": 195663, "epoch": 2357} {"train_loss": -24.47199058532715, "global_step": 195664, "epoch": 2357} {"train_loss": -24.373289108276367, "global_step": 195665, "epoch": 2357} {"train_loss": -23.876195907592773, "global_step": 195666, "epoch": 2357} {"train_loss": -23.96335792541504, "global_step": 195667, "epoch": 2357} {"train_loss": -24.5234375, "global_step": 195668, "epoch": 2357} {"train_loss": -24.180017471313477, "global_step": 195669, "epoch": 2357} {"train_loss": -24.248756408691406, "global_step": 195670, "epoch": 2357} {"train_loss": -24.132291793823242, "global_step": 195671, "epoch": 2357} {"train_loss": -24.19025993347168, "global_step": 195672, "epoch": 2357} {"train_loss": -24.108989715576172, "global_step": 195673, "epoch": 2357} {"train_loss": -24.100482940673828, "global_step": 195674, "epoch": 2357} {"train_loss": -24.285505294799805, "global_step": 195675, "epoch": 2357} {"train_loss": -24.30585289001465, "global_step": 195676, "epoch": 2357} {"train_loss": -23.995800018310547, "global_step": 195677, "epoch": 2357} {"train_loss": -24.01582908630371, "global_step": 195678, "epoch": 2357} {"train_loss": -24.093656539916992, "global_step": 195679, "epoch": 2357} {"train_loss": -22.975889205932617, "global_step": 195680, "epoch": 2357} {"train_loss": -23.154226303100586, "global_step": 195681, "epoch": 2357} {"train_loss": -23.437973022460938, "global_step": 195682, "epoch": 2357} {"train_loss": -23.925296783447266, "global_step": 195683, "epoch": 2357} {"train_loss": -22.850500106811523, "global_step": 195684, "epoch": 2357} {"train_loss": -24.10721778869629, "global_step": 195685, "epoch": 2357} {"train_loss": -23.64637565612793, "global_step": 195686, "epoch": 2357} {"train_loss": -23.466541290283203, "global_step": 195687, "epoch": 2357} {"train_loss": -23.968416213989258, "global_step": 195688, "epoch": 2357} {"train_loss": -23.299270629882812, "global_step": 195689, "epoch": 2357} {"train_loss": -24.195825576782227, "global_step": 195690, "epoch": 2357} {"train_loss": -23.728729248046875, "global_step": 195691, "epoch": 2357} {"train_loss": -24.055028915405273, "global_step": 195692, "epoch": 2357} {"train_loss": -23.86433219909668, "global_step": 195693, "epoch": 2357} {"train_loss": -24.198331832885742, "global_step": 195694, "epoch": 2357} {"train_loss": -23.950937271118164, "global_step": 195695, "epoch": 2357} {"train_loss": -24.240907669067383, "global_step": 195696, "epoch": 2357} {"train_loss": -24.10858726501465, "global_step": 195697, "epoch": 2357} {"train_loss": -23.89700698852539, "global_step": 195698, "epoch": 2357} {"train_loss": -24.146547317504883, "global_step": 195699, "epoch": 2357} {"train_loss": -23.71553611755371, "global_step": 195700, "epoch": 2357} {"train_loss": -23.956680297851562, "global_step": 195701, "epoch": 2357} {"train_loss": -23.958681106567383, "global_step": 195702, "epoch": 2357} {"train_loss": -23.983505249023438, "global_step": 195703, "epoch": 2357} {"train_loss": -24.23488426208496, "global_step": 195704, "epoch": 2357} {"train_loss": -24.17741584777832, "global_step": 195705, "epoch": 2357} {"train_loss": -24.324851989746094, "global_step": 195706, "epoch": 2357} {"train_loss": -24.35110092163086, "global_step": 195707, "epoch": 2357} {"train_loss": -23.989290237426758, "global_step": 195708, "epoch": 2357} {"train_loss": -23.708444595336914, "global_step": 195709, "epoch": 2357} {"train_loss": -24.07417106628418, "global_step": 195710, "epoch": 2357} {"train_loss": -24.151809692382812, "global_step": 195711, "epoch": 2357} {"train_loss": -24.024869918823242, "global_step": 195712, "epoch": 2357} {"train_loss": -24.014589677374047, "global_step": 195713, "epoch": 2357, "val_loss": 6454088.0} {"train_loss": -23.726232528686523, "global_step": 195714, "epoch": 2358} {"train_loss": -23.576208114624023, "global_step": 195715, "epoch": 2358} {"train_loss": -23.407644271850586, "global_step": 195716, "epoch": 2358} {"train_loss": -23.747610092163086, "global_step": 195717, "epoch": 2358} {"train_loss": -23.721269607543945, "global_step": 195718, "epoch": 2358} {"train_loss": -23.791656494140625, "global_step": 195719, "epoch": 2358} {"train_loss": -24.022939682006836, "global_step": 195720, "epoch": 2358} {"train_loss": -23.62926483154297, "global_step": 195721, "epoch": 2358} {"train_loss": -23.75922393798828, "global_step": 195722, "epoch": 2358} {"train_loss": -23.890140533447266, "global_step": 195723, "epoch": 2358} {"train_loss": -23.988656997680664, "global_step": 195724, "epoch": 2358} {"train_loss": -24.009729385375977, "global_step": 195725, "epoch": 2358} {"train_loss": -23.89653968811035, "global_step": 195726, "epoch": 2358} {"train_loss": -23.683874130249023, "global_step": 195727, "epoch": 2358} {"train_loss": -23.756929397583008, "global_step": 195728, "epoch": 2358} {"train_loss": -24.034948348999023, "global_step": 195729, "epoch": 2358} {"train_loss": -23.990203857421875, "global_step": 195730, "epoch": 2358} {"train_loss": -24.136920928955078, "global_step": 195731, "epoch": 2358} {"train_loss": -24.04714012145996, "global_step": 195732, "epoch": 2358} {"train_loss": -23.935619354248047, "global_step": 195733, "epoch": 2358} {"train_loss": -24.26116371154785, "global_step": 195734, "epoch": 2358} {"train_loss": -23.988727569580078, "global_step": 195735, "epoch": 2358} {"train_loss": -23.744579315185547, "global_step": 195736, "epoch": 2358} {"train_loss": -24.272550582885742, "global_step": 195737, "epoch": 2358} {"train_loss": -24.581449508666992, "global_step": 195738, "epoch": 2358} {"train_loss": -24.104909896850586, "global_step": 195739, "epoch": 2358} {"train_loss": -24.518741607666016, "global_step": 195740, "epoch": 2358} {"train_loss": -24.079681396484375, "global_step": 195741, "epoch": 2358} {"train_loss": -24.26042938232422, "global_step": 195742, "epoch": 2358} {"train_loss": -24.208288192749023, "global_step": 195743, "epoch": 2358} {"train_loss": -24.300207138061523, "global_step": 195744, "epoch": 2358} {"train_loss": -23.987897872924805, "global_step": 195745, "epoch": 2358} {"train_loss": -24.350595474243164, "global_step": 195746, "epoch": 2358} {"train_loss": -24.095149993896484, "global_step": 195747, "epoch": 2358} {"train_loss": -24.34797477722168, "global_step": 195748, "epoch": 2358} {"train_loss": -23.917688369750977, "global_step": 195749, "epoch": 2358} {"train_loss": -24.119049072265625, "global_step": 195750, "epoch": 2358} {"train_loss": -24.14527702331543, "global_step": 195751, "epoch": 2358} {"train_loss": -23.583404541015625, "global_step": 195752, "epoch": 2358} {"train_loss": -23.126998901367188, "global_step": 195753, "epoch": 2358} {"train_loss": -23.552274703979492, "global_step": 195754, "epoch": 2358} {"train_loss": -24.393800735473633, "global_step": 195755, "epoch": 2358} {"train_loss": -24.138381958007812, "global_step": 195756, "epoch": 2358} {"train_loss": -24.160400390625, "global_step": 195757, "epoch": 2358} {"train_loss": -23.876358032226562, "global_step": 195758, "epoch": 2358} {"train_loss": -24.059402465820312, "global_step": 195759, "epoch": 2358} {"train_loss": -24.012052536010742, "global_step": 195760, "epoch": 2358} {"train_loss": -23.986597061157227, "global_step": 195761, "epoch": 2358} {"train_loss": -24.4639949798584, "global_step": 195762, "epoch": 2358} {"train_loss": -24.449186325073242, "global_step": 195763, "epoch": 2358} {"train_loss": -24.564889907836914, "global_step": 195764, "epoch": 2358} {"train_loss": -24.220523834228516, "global_step": 195765, "epoch": 2358} {"train_loss": -24.170881271362305, "global_step": 195766, "epoch": 2358} {"train_loss": -24.161405563354492, "global_step": 195767, "epoch": 2358} {"train_loss": -24.0927677154541, "global_step": 195768, "epoch": 2358} {"train_loss": -23.90557289123535, "global_step": 195769, "epoch": 2358} {"train_loss": -24.27364730834961, "global_step": 195770, "epoch": 2358} {"train_loss": -24.01798439025879, "global_step": 195771, "epoch": 2358} {"train_loss": -24.39066505432129, "global_step": 195772, "epoch": 2358} {"train_loss": -24.44325065612793, "global_step": 195773, "epoch": 2358} {"train_loss": -24.029495239257812, "global_step": 195774, "epoch": 2358} {"train_loss": -24.091489791870117, "global_step": 195775, "epoch": 2358} {"train_loss": -24.11152458190918, "global_step": 195776, "epoch": 2358} {"train_loss": -23.955764770507812, "global_step": 195777, "epoch": 2358} {"train_loss": -23.991199493408203, "global_step": 195778, "epoch": 2358} {"train_loss": -24.52328872680664, "global_step": 195779, "epoch": 2358} {"train_loss": -24.171100616455078, "global_step": 195780, "epoch": 2358} {"train_loss": -24.223785400390625, "global_step": 195781, "epoch": 2358} {"train_loss": -24.2409725189209, "global_step": 195782, "epoch": 2358} {"train_loss": -24.335529327392578, "global_step": 195783, "epoch": 2358} {"train_loss": -24.46419334411621, "global_step": 195784, "epoch": 2358} {"train_loss": -23.907089233398438, "global_step": 195785, "epoch": 2358} {"train_loss": -24.682912826538086, "global_step": 195786, "epoch": 2358} {"train_loss": -24.50444984436035, "global_step": 195787, "epoch": 2358} {"train_loss": -24.10842514038086, "global_step": 195788, "epoch": 2358} {"train_loss": -24.616172790527344, "global_step": 195789, "epoch": 2358} {"train_loss": -24.56426429748535, "global_step": 195790, "epoch": 2358} {"train_loss": -24.35861587524414, "global_step": 195791, "epoch": 2358} {"train_loss": -24.18670082092285, "global_step": 195792, "epoch": 2358} {"train_loss": -24.18035316467285, "global_step": 195793, "epoch": 2358} {"train_loss": -24.34126853942871, "global_step": 195794, "epoch": 2358} {"train_loss": -24.27180290222168, "global_step": 195795, "epoch": 2358} {"train_loss": -24.089897270662238, "global_step": 195796, "epoch": 2358, "val_loss": 6575469.5} {"train_loss": -23.91120719909668, "global_step": 195797, "epoch": 2359} {"train_loss": -23.97810935974121, "global_step": 195798, "epoch": 2359} {"train_loss": -23.823041915893555, "global_step": 195799, "epoch": 2359} {"train_loss": -24.057138442993164, "global_step": 195800, "epoch": 2359} {"train_loss": -23.827421188354492, "global_step": 195801, "epoch": 2359} {"train_loss": -23.77228546142578, "global_step": 195802, "epoch": 2359} {"train_loss": -24.017637252807617, "global_step": 195803, "epoch": 2359} {"train_loss": -24.335437774658203, "global_step": 195804, "epoch": 2359} {"train_loss": -24.081323623657227, "global_step": 195805, "epoch": 2359} {"train_loss": -23.755407333374023, "global_step": 195806, "epoch": 2359} {"train_loss": -23.857572555541992, "global_step": 195807, "epoch": 2359} {"train_loss": -23.718233108520508, "global_step": 195808, "epoch": 2359} {"train_loss": -23.674280166625977, "global_step": 195809, "epoch": 2359} {"train_loss": -24.40804100036621, "global_step": 195810, "epoch": 2359} {"train_loss": -23.950946807861328, "global_step": 195811, "epoch": 2359} {"train_loss": -24.192707061767578, "global_step": 195812, "epoch": 2359} {"train_loss": -24.368919372558594, "global_step": 195813, "epoch": 2359} {"train_loss": -24.040414810180664, "global_step": 195814, "epoch": 2359} {"train_loss": -23.788787841796875, "global_step": 195815, "epoch": 2359} {"train_loss": -23.99355125427246, "global_step": 195816, "epoch": 2359} {"train_loss": -24.05434226989746, "global_step": 195817, "epoch": 2359} {"train_loss": -24.271120071411133, "global_step": 195818, "epoch": 2359} {"train_loss": -23.555252075195312, "global_step": 195819, "epoch": 2359} {"train_loss": -24.48998260498047, "global_step": 195820, "epoch": 2359} {"train_loss": -23.881391525268555, "global_step": 195821, "epoch": 2359} {"train_loss": -24.07513427734375, "global_step": 195822, "epoch": 2359} {"train_loss": -23.960742950439453, "global_step": 195823, "epoch": 2359} {"train_loss": -24.359600067138672, "global_step": 195824, "epoch": 2359} {"train_loss": -24.338348388671875, "global_step": 195825, "epoch": 2359} {"train_loss": -24.09646224975586, "global_step": 195826, "epoch": 2359} {"train_loss": -24.319204330444336, "global_step": 195827, "epoch": 2359} {"train_loss": -23.972200393676758, "global_step": 195828, "epoch": 2359} {"train_loss": -24.29080581665039, "global_step": 195829, "epoch": 2359} {"train_loss": -24.120542526245117, "global_step": 195830, "epoch": 2359} {"train_loss": -24.202701568603516, "global_step": 195831, "epoch": 2359} {"train_loss": -24.3721923828125, "global_step": 195832, "epoch": 2359} {"train_loss": -24.390920639038086, "global_step": 195833, "epoch": 2359} {"train_loss": -24.107812881469727, "global_step": 195834, "epoch": 2359} {"train_loss": -24.460872650146484, "global_step": 195835, "epoch": 2359} {"train_loss": -24.247617721557617, "global_step": 195836, "epoch": 2359} {"train_loss": -24.440773010253906, "global_step": 195837, "epoch": 2359} {"train_loss": -24.004806518554688, "global_step": 195838, "epoch": 2359} {"train_loss": -24.19843101501465, "global_step": 195839, "epoch": 2359} {"train_loss": -24.05293846130371, "global_step": 195840, "epoch": 2359} {"train_loss": -23.908628463745117, "global_step": 195841, "epoch": 2359} {"train_loss": -24.20711898803711, "global_step": 195842, "epoch": 2359} {"train_loss": -24.13650894165039, "global_step": 195843, "epoch": 2359} {"train_loss": -24.338214874267578, "global_step": 195844, "epoch": 2359} {"train_loss": -24.318601608276367, "global_step": 195845, "epoch": 2359} {"train_loss": -24.182981491088867, "global_step": 195846, "epoch": 2359} {"train_loss": -24.208866119384766, "global_step": 195847, "epoch": 2359} {"train_loss": -24.299169540405273, "global_step": 195848, "epoch": 2359} {"train_loss": -23.98480224609375, "global_step": 195849, "epoch": 2359} {"train_loss": -24.293039321899414, "global_step": 195850, "epoch": 2359} {"train_loss": -24.029911041259766, "global_step": 195851, "epoch": 2359} {"train_loss": -24.1295223236084, "global_step": 195852, "epoch": 2359} {"train_loss": -24.291181564331055, "global_step": 195853, "epoch": 2359} {"train_loss": -24.420642852783203, "global_step": 195854, "epoch": 2359} {"train_loss": -24.09437370300293, "global_step": 195855, "epoch": 2359} {"train_loss": -23.873659133911133, "global_step": 195856, "epoch": 2359} {"train_loss": -23.18353843688965, "global_step": 195857, "epoch": 2359} {"train_loss": -23.698484420776367, "global_step": 195858, "epoch": 2359} {"train_loss": -24.06296157836914, "global_step": 195859, "epoch": 2359} {"train_loss": -24.136804580688477, "global_step": 195860, "epoch": 2359} {"train_loss": -24.119199752807617, "global_step": 195861, "epoch": 2359} {"train_loss": -23.73929214477539, "global_step": 195862, "epoch": 2359} {"train_loss": -24.343311309814453, "global_step": 195863, "epoch": 2359} {"train_loss": -23.74506187438965, "global_step": 195864, "epoch": 2359} {"train_loss": -23.87998390197754, "global_step": 195865, "epoch": 2359} {"train_loss": -23.9283504486084, "global_step": 195866, "epoch": 2359} {"train_loss": -24.1925048828125, "global_step": 195867, "epoch": 2359} {"train_loss": -23.892719268798828, "global_step": 195868, "epoch": 2359} {"train_loss": -24.424596786499023, "global_step": 195869, "epoch": 2359} {"train_loss": -24.305286407470703, "global_step": 195870, "epoch": 2359} {"train_loss": -24.24338722229004, "global_step": 195871, "epoch": 2359} {"train_loss": -24.369436264038086, "global_step": 195872, "epoch": 2359} {"train_loss": -24.25958824157715, "global_step": 195873, "epoch": 2359} {"train_loss": -24.06964111328125, "global_step": 195874, "epoch": 2359} {"train_loss": -24.338634490966797, "global_step": 195875, "epoch": 2359} {"train_loss": -24.280004501342773, "global_step": 195876, "epoch": 2359} {"train_loss": -24.2338924407959, "global_step": 195877, "epoch": 2359} {"train_loss": -24.006454467773438, "global_step": 195878, "epoch": 2359} {"train_loss": -24.09977264863899, "global_step": 195879, "epoch": 2359, "val_loss": 6510937.0} {"train_loss": -24.172779083251953, "global_step": 195880, "epoch": 2360} {"train_loss": -24.252286911010742, "global_step": 195881, "epoch": 2360} {"train_loss": -24.112930297851562, "global_step": 195882, "epoch": 2360} {"train_loss": -24.307477951049805, "global_step": 195883, "epoch": 2360} {"train_loss": -24.133838653564453, "global_step": 195884, "epoch": 2360} {"train_loss": -24.181407928466797, "global_step": 195885, "epoch": 2360} {"train_loss": -24.06496238708496, "global_step": 195886, "epoch": 2360} {"train_loss": -23.954923629760742, "global_step": 195887, "epoch": 2360} {"train_loss": -23.85228729248047, "global_step": 195888, "epoch": 2360} {"train_loss": -23.991682052612305, "global_step": 195889, "epoch": 2360} {"train_loss": -23.59030532836914, "global_step": 195890, "epoch": 2360} {"train_loss": -23.86537742614746, "global_step": 195891, "epoch": 2360} {"train_loss": -23.60591697692871, "global_step": 195892, "epoch": 2360} {"train_loss": -23.858455657958984, "global_step": 195893, "epoch": 2360} {"train_loss": -23.88237190246582, "global_step": 195894, "epoch": 2360} {"train_loss": -24.230854034423828, "global_step": 195895, "epoch": 2360} {"train_loss": -23.982152938842773, "global_step": 195896, "epoch": 2360} {"train_loss": -23.860727310180664, "global_step": 195897, "epoch": 2360} {"train_loss": -23.977514266967773, "global_step": 195898, "epoch": 2360} {"train_loss": -23.805498123168945, "global_step": 195899, "epoch": 2360} {"train_loss": -24.248037338256836, "global_step": 195900, "epoch": 2360} {"train_loss": -23.79751205444336, "global_step": 195901, "epoch": 2360} {"train_loss": -23.997421264648438, "global_step": 195902, "epoch": 2360} {"train_loss": -24.427885055541992, "global_step": 195903, "epoch": 2360} {"train_loss": -23.825773239135742, "global_step": 195904, "epoch": 2360} {"train_loss": -24.1080379486084, "global_step": 195905, "epoch": 2360} {"train_loss": -24.2218074798584, "global_step": 195906, "epoch": 2360} {"train_loss": -24.35920524597168, "global_step": 195907, "epoch": 2360} {"train_loss": -23.762990951538086, "global_step": 195908, "epoch": 2360} {"train_loss": -23.71820068359375, "global_step": 195909, "epoch": 2360} {"train_loss": -24.304550170898438, "global_step": 195910, "epoch": 2360} {"train_loss": -24.04206657409668, "global_step": 195911, "epoch": 2360} {"train_loss": -24.504741668701172, "global_step": 195912, "epoch": 2360} {"train_loss": -24.51463508605957, "global_step": 195913, "epoch": 2360} {"train_loss": -24.209022521972656, "global_step": 195914, "epoch": 2360} {"train_loss": -24.158456802368164, "global_step": 195915, "epoch": 2360} {"train_loss": -23.848875045776367, "global_step": 195916, "epoch": 2360} {"train_loss": -24.20718765258789, "global_step": 195917, "epoch": 2360} {"train_loss": -24.292585372924805, "global_step": 195918, "epoch": 2360} {"train_loss": -24.165525436401367, "global_step": 195919, "epoch": 2360} {"train_loss": -24.479665756225586, "global_step": 195920, "epoch": 2360} {"train_loss": -24.25789451599121, "global_step": 195921, "epoch": 2360} {"train_loss": -24.345966339111328, "global_step": 195922, "epoch": 2360} {"train_loss": -24.158130645751953, "global_step": 195923, "epoch": 2360} {"train_loss": -24.128507614135742, "global_step": 195924, "epoch": 2360} {"train_loss": -24.43671226501465, "global_step": 195925, "epoch": 2360} {"train_loss": -24.40799331665039, "global_step": 195926, "epoch": 2360} {"train_loss": -24.129674911499023, "global_step": 195927, "epoch": 2360} {"train_loss": -24.06947135925293, "global_step": 195928, "epoch": 2360} {"train_loss": -23.863136291503906, "global_step": 195929, "epoch": 2360} {"train_loss": -23.985591888427734, "global_step": 195930, "epoch": 2360} {"train_loss": -24.260540008544922, "global_step": 195931, "epoch": 2360} {"train_loss": -24.14655303955078, "global_step": 195932, "epoch": 2360} {"train_loss": -24.073850631713867, "global_step": 195933, "epoch": 2360} {"train_loss": -24.062744140625, "global_step": 195934, "epoch": 2360} {"train_loss": -24.332393646240234, "global_step": 195935, "epoch": 2360} {"train_loss": -24.378694534301758, "global_step": 195936, "epoch": 2360} {"train_loss": -24.183032989501953, "global_step": 195937, "epoch": 2360} {"train_loss": -24.044010162353516, "global_step": 195938, "epoch": 2360} {"train_loss": -24.41901206970215, "global_step": 195939, "epoch": 2360} {"train_loss": -24.24614906311035, "global_step": 195940, "epoch": 2360} {"train_loss": -24.403076171875, "global_step": 195941, "epoch": 2360} {"train_loss": -24.03635025024414, "global_step": 195942, "epoch": 2360} {"train_loss": -23.904531478881836, "global_step": 195943, "epoch": 2360} {"train_loss": -24.117481231689453, "global_step": 195944, "epoch": 2360} {"train_loss": -24.257774353027344, "global_step": 195945, "epoch": 2360} {"train_loss": -23.880491256713867, "global_step": 195946, "epoch": 2360} {"train_loss": -24.54693603515625, "global_step": 195947, "epoch": 2360} {"train_loss": -24.297359466552734, "global_step": 195948, "epoch": 2360} {"train_loss": -24.01658058166504, "global_step": 195949, "epoch": 2360} {"train_loss": -24.499055862426758, "global_step": 195950, "epoch": 2360} {"train_loss": -24.15095329284668, "global_step": 195951, "epoch": 2360} {"train_loss": -23.938241958618164, "global_step": 195952, "epoch": 2360} {"train_loss": -24.55169677734375, "global_step": 195953, "epoch": 2360} {"train_loss": -24.16132926940918, "global_step": 195954, "epoch": 2360} {"train_loss": -24.445661544799805, "global_step": 195955, "epoch": 2360} {"train_loss": -24.247272491455078, "global_step": 195956, "epoch": 2360} {"train_loss": -24.64661407470703, "global_step": 195957, "epoch": 2360} {"train_loss": -24.461118698120117, "global_step": 195958, "epoch": 2360} {"train_loss": -24.083744049072266, "global_step": 195959, "epoch": 2360} {"train_loss": -24.59243392944336, "global_step": 195960, "epoch": 2360} {"train_loss": -24.346410751342773, "global_step": 195961, "epoch": 2360} {"train_loss": -24.17103971917945, "global_step": 195962, "epoch": 2360, "val_loss": 6772888.5} {"train_loss": -23.393692016601562, "global_step": 195963, "epoch": 2361} {"train_loss": -22.429645538330078, "global_step": 195964, "epoch": 2361} {"train_loss": -23.117107391357422, "global_step": 195965, "epoch": 2361} {"train_loss": -23.406448364257812, "global_step": 195966, "epoch": 2361} {"train_loss": -23.085678100585938, "global_step": 195967, "epoch": 2361} {"train_loss": -23.68880844116211, "global_step": 195968, "epoch": 2361} {"train_loss": -23.554773330688477, "global_step": 195969, "epoch": 2361} {"train_loss": -23.57594871520996, "global_step": 195970, "epoch": 2361} {"train_loss": -23.62100601196289, "global_step": 195971, "epoch": 2361} {"train_loss": -24.04682731628418, "global_step": 195972, "epoch": 2361} {"train_loss": -23.271381378173828, "global_step": 195973, "epoch": 2361} {"train_loss": -23.9510555267334, "global_step": 195974, "epoch": 2361} {"train_loss": -23.8242130279541, "global_step": 195975, "epoch": 2361} {"train_loss": -24.182355880737305, "global_step": 195976, "epoch": 2361} {"train_loss": -23.909711837768555, "global_step": 195977, "epoch": 2361} {"train_loss": -23.938196182250977, "global_step": 195978, "epoch": 2361} {"train_loss": -24.069433212280273, "global_step": 195979, "epoch": 2361} {"train_loss": -24.244108200073242, "global_step": 195980, "epoch": 2361} {"train_loss": -24.473176956176758, "global_step": 195981, "epoch": 2361} {"train_loss": -23.908872604370117, "global_step": 195982, "epoch": 2361} {"train_loss": -23.807838439941406, "global_step": 195983, "epoch": 2361} {"train_loss": -23.957929611206055, "global_step": 195984, "epoch": 2361} {"train_loss": -23.468685150146484, "global_step": 195985, "epoch": 2361} {"train_loss": -23.71763038635254, "global_step": 195986, "epoch": 2361} {"train_loss": -24.169897079467773, "global_step": 195987, "epoch": 2361} {"train_loss": -23.981779098510742, "global_step": 195988, "epoch": 2361} {"train_loss": -23.866792678833008, "global_step": 195989, "epoch": 2361} {"train_loss": -24.35675048828125, "global_step": 195990, "epoch": 2361} {"train_loss": -24.121980667114258, "global_step": 195991, "epoch": 2361} {"train_loss": -23.79184913635254, "global_step": 195992, "epoch": 2361} {"train_loss": -24.16513442993164, "global_step": 195993, "epoch": 2361} {"train_loss": -24.37898063659668, "global_step": 195994, "epoch": 2361} {"train_loss": -23.875125885009766, "global_step": 195995, "epoch": 2361} {"train_loss": -24.083986282348633, "global_step": 195996, "epoch": 2361} {"train_loss": -24.139328002929688, "global_step": 195997, "epoch": 2361} {"train_loss": -24.154478073120117, "global_step": 195998, "epoch": 2361} {"train_loss": -24.24070930480957, "global_step": 195999, "epoch": 2361} {"train_loss": -24.248031616210938, "global_step": 196000, "epoch": 2361} {"train_loss": -24.423776626586914, "global_step": 196001, "epoch": 2361} {"train_loss": -24.3651180267334, "global_step": 196002, "epoch": 2361} {"train_loss": -24.293928146362305, "global_step": 196003, "epoch": 2361} {"train_loss": -24.374855041503906, "global_step": 196004, "epoch": 2361} {"train_loss": -24.105619430541992, "global_step": 196005, "epoch": 2361} {"train_loss": -24.37733268737793, "global_step": 196006, "epoch": 2361} {"train_loss": -24.219785690307617, "global_step": 196007, "epoch": 2361} {"train_loss": -24.80885887145996, "global_step": 196008, "epoch": 2361} {"train_loss": -24.38950538635254, "global_step": 196009, "epoch": 2361} {"train_loss": -24.0633602142334, "global_step": 196010, "epoch": 2361} {"train_loss": -24.08729362487793, "global_step": 196011, "epoch": 2361} {"train_loss": -23.88078498840332, "global_step": 196012, "epoch": 2361} {"train_loss": -24.491918563842773, "global_step": 196013, "epoch": 2361} {"train_loss": -24.54764747619629, "global_step": 196014, "epoch": 2361} {"train_loss": -23.992034912109375, "global_step": 196015, "epoch": 2361} {"train_loss": -23.640216827392578, "global_step": 196016, "epoch": 2361} {"train_loss": -23.96680450439453, "global_step": 196017, "epoch": 2361} {"train_loss": -24.109033584594727, "global_step": 196018, "epoch": 2361} {"train_loss": -24.407550811767578, "global_step": 196019, "epoch": 2361} {"train_loss": -24.25445556640625, "global_step": 196020, "epoch": 2361} {"train_loss": -24.145919799804688, "global_step": 196021, "epoch": 2361} {"train_loss": -24.087459564208984, "global_step": 196022, "epoch": 2361} {"train_loss": -24.272926330566406, "global_step": 196023, "epoch": 2361} {"train_loss": -24.339651107788086, "global_step": 196024, "epoch": 2361} {"train_loss": -24.295223236083984, "global_step": 196025, "epoch": 2361} {"train_loss": -24.122509002685547, "global_step": 196026, "epoch": 2361} {"train_loss": -24.009963989257812, "global_step": 196027, "epoch": 2361} {"train_loss": -24.14171028137207, "global_step": 196028, "epoch": 2361} {"train_loss": -24.678068161010742, "global_step": 196029, "epoch": 2361} {"train_loss": -24.098730087280273, "global_step": 196030, "epoch": 2361} {"train_loss": -24.089393615722656, "global_step": 196031, "epoch": 2361} {"train_loss": -24.36587142944336, "global_step": 196032, "epoch": 2361} {"train_loss": -24.442590713500977, "global_step": 196033, "epoch": 2361} {"train_loss": -24.409841537475586, "global_step": 196034, "epoch": 2361} {"train_loss": -24.308134078979492, "global_step": 196035, "epoch": 2361} {"train_loss": -24.601110458374023, "global_step": 196036, "epoch": 2361} {"train_loss": -24.3731689453125, "global_step": 196037, "epoch": 2361} {"train_loss": -24.183900833129883, "global_step": 196038, "epoch": 2361} {"train_loss": -24.470251083374023, "global_step": 196039, "epoch": 2361} {"train_loss": -24.14208984375, "global_step": 196040, "epoch": 2361} {"train_loss": -24.322851181030273, "global_step": 196041, "epoch": 2361} {"train_loss": -24.329492568969727, "global_step": 196042, "epoch": 2361} {"train_loss": -24.357595443725586, "global_step": 196043, "epoch": 2361} {"train_loss": -24.390913009643555, "global_step": 196044, "epoch": 2361} {"train_loss": -24.091928619936287, "global_step": 196045, "epoch": 2361, "val_loss": 6418534.0} {"train_loss": -24.085119247436523, "global_step": 196046, "epoch": 2362} {"train_loss": -23.717126846313477, "global_step": 196047, "epoch": 2362} {"train_loss": -24.11427879333496, "global_step": 196048, "epoch": 2362} {"train_loss": -24.066364288330078, "global_step": 196049, "epoch": 2362} {"train_loss": -23.99501609802246, "global_step": 196050, "epoch": 2362} {"train_loss": -24.435483932495117, "global_step": 196051, "epoch": 2362} {"train_loss": -24.24811363220215, "global_step": 196052, "epoch": 2362} {"train_loss": -23.7337589263916, "global_step": 196053, "epoch": 2362} {"train_loss": -23.862503051757812, "global_step": 196054, "epoch": 2362} {"train_loss": -24.00617790222168, "global_step": 196055, "epoch": 2362} {"train_loss": -24.51746368408203, "global_step": 196056, "epoch": 2362} {"train_loss": -24.12640380859375, "global_step": 196057, "epoch": 2362} {"train_loss": -23.95368766784668, "global_step": 196058, "epoch": 2362} {"train_loss": -24.109146118164062, "global_step": 196059, "epoch": 2362} {"train_loss": -23.993223190307617, "global_step": 196060, "epoch": 2362} {"train_loss": -24.337665557861328, "global_step": 196061, "epoch": 2362} {"train_loss": -23.948312759399414, "global_step": 196062, "epoch": 2362} {"train_loss": -24.06402015686035, "global_step": 196063, "epoch": 2362} {"train_loss": -24.378860473632812, "global_step": 196064, "epoch": 2362} {"train_loss": -24.120389938354492, "global_step": 196065, "epoch": 2362} {"train_loss": -24.398906707763672, "global_step": 196066, "epoch": 2362} {"train_loss": -24.289953231811523, "global_step": 196067, "epoch": 2362} {"train_loss": -23.942350387573242, "global_step": 196068, "epoch": 2362} {"train_loss": -24.405868530273438, "global_step": 196069, "epoch": 2362} {"train_loss": -24.373952865600586, "global_step": 196070, "epoch": 2362} {"train_loss": -24.588512420654297, "global_step": 196071, "epoch": 2362} {"train_loss": -24.39478874206543, "global_step": 196072, "epoch": 2362} {"train_loss": -24.01999855041504, "global_step": 196073, "epoch": 2362} {"train_loss": -24.37394905090332, "global_step": 196074, "epoch": 2362} {"train_loss": -24.474714279174805, "global_step": 196075, "epoch": 2362} {"train_loss": -24.211933135986328, "global_step": 196076, "epoch": 2362} {"train_loss": -24.2105655670166, "global_step": 196077, "epoch": 2362} {"train_loss": -24.08384132385254, "global_step": 196078, "epoch": 2362} {"train_loss": -24.543798446655273, "global_step": 196079, "epoch": 2362} {"train_loss": -24.258638381958008, "global_step": 196080, "epoch": 2362} {"train_loss": -24.2501277923584, "global_step": 196081, "epoch": 2362} {"train_loss": -24.006633758544922, "global_step": 196082, "epoch": 2362} {"train_loss": -23.615346908569336, "global_step": 196083, "epoch": 2362} {"train_loss": -23.803815841674805, "global_step": 196084, "epoch": 2362} {"train_loss": -23.700529098510742, "global_step": 196085, "epoch": 2362} {"train_loss": -24.00726318359375, "global_step": 196086, "epoch": 2362} {"train_loss": -24.082199096679688, "global_step": 196087, "epoch": 2362} {"train_loss": -23.80192756652832, "global_step": 196088, "epoch": 2362} {"train_loss": -24.307104110717773, "global_step": 196089, "epoch": 2362} {"train_loss": -24.152896881103516, "global_step": 196090, "epoch": 2362} {"train_loss": -24.278060913085938, "global_step": 196091, "epoch": 2362} {"train_loss": -24.33665657043457, "global_step": 196092, "epoch": 2362} {"train_loss": -24.292312622070312, "global_step": 196093, "epoch": 2362} {"train_loss": -24.291898727416992, "global_step": 196094, "epoch": 2362} {"train_loss": -24.196931838989258, "global_step": 196095, "epoch": 2362} {"train_loss": -23.770193099975586, "global_step": 196096, "epoch": 2362} {"train_loss": -24.072084426879883, "global_step": 196097, "epoch": 2362} {"train_loss": -24.3637752532959, "global_step": 196098, "epoch": 2362} {"train_loss": -24.291213989257812, "global_step": 196099, "epoch": 2362} {"train_loss": -24.291460037231445, "global_step": 196100, "epoch": 2362} {"train_loss": -24.591480255126953, "global_step": 196101, "epoch": 2362} {"train_loss": -24.480579376220703, "global_step": 196102, "epoch": 2362} {"train_loss": -24.27145767211914, "global_step": 196103, "epoch": 2362} {"train_loss": -24.2539119720459, "global_step": 196104, "epoch": 2362} {"train_loss": -24.40155792236328, "global_step": 196105, "epoch": 2362} {"train_loss": -24.344167709350586, "global_step": 196106, "epoch": 2362} {"train_loss": -24.035776138305664, "global_step": 196107, "epoch": 2362} {"train_loss": -24.309017181396484, "global_step": 196108, "epoch": 2362} {"train_loss": -23.84658432006836, "global_step": 196109, "epoch": 2362} {"train_loss": -24.11519432067871, "global_step": 196110, "epoch": 2362} {"train_loss": -24.29966163635254, "global_step": 196111, "epoch": 2362} {"train_loss": -24.129486083984375, "global_step": 196112, "epoch": 2362} {"train_loss": -24.229957580566406, "global_step": 196113, "epoch": 2362} {"train_loss": -24.4179744720459, "global_step": 196114, "epoch": 2362} {"train_loss": -24.295198440551758, "global_step": 196115, "epoch": 2362} {"train_loss": -24.057804107666016, "global_step": 196116, "epoch": 2362} {"train_loss": -24.447433471679688, "global_step": 196117, "epoch": 2362} {"train_loss": -24.410404205322266, "global_step": 196118, "epoch": 2362} {"train_loss": -24.34535789489746, "global_step": 196119, "epoch": 2362} {"train_loss": -24.457555770874023, "global_step": 196120, "epoch": 2362} {"train_loss": -24.08873176574707, "global_step": 196121, "epoch": 2362} {"train_loss": -24.160654067993164, "global_step": 196122, "epoch": 2362} {"train_loss": -24.210094451904297, "global_step": 196123, "epoch": 2362} {"train_loss": -24.329687118530273, "global_step": 196124, "epoch": 2362} {"train_loss": -24.39092445373535, "global_step": 196125, "epoch": 2362} {"train_loss": -24.458410263061523, "global_step": 196126, "epoch": 2362} {"train_loss": -24.01828956604004, "global_step": 196127, "epoch": 2362} {"train_loss": -24.20710276408368, "global_step": 196128, "epoch": 2362, "val_loss": 6526424.0} {"train_loss": -23.694622039794922, "global_step": 196129, "epoch": 2363} {"train_loss": -23.661697387695312, "global_step": 196130, "epoch": 2363} {"train_loss": -23.32832908630371, "global_step": 196131, "epoch": 2363} {"train_loss": -22.95115089416504, "global_step": 196132, "epoch": 2363} {"train_loss": -23.772125244140625, "global_step": 196133, "epoch": 2363} {"train_loss": -23.885740280151367, "global_step": 196134, "epoch": 2363} {"train_loss": -23.52815818786621, "global_step": 196135, "epoch": 2363} {"train_loss": -23.775989532470703, "global_step": 196136, "epoch": 2363} {"train_loss": -23.875333786010742, "global_step": 196137, "epoch": 2363} {"train_loss": -23.5313777923584, "global_step": 196138, "epoch": 2363} {"train_loss": -24.162145614624023, "global_step": 196139, "epoch": 2363} {"train_loss": -23.596635818481445, "global_step": 196140, "epoch": 2363} {"train_loss": -23.538244247436523, "global_step": 196141, "epoch": 2363} {"train_loss": -23.907461166381836, "global_step": 196142, "epoch": 2363} {"train_loss": -24.090970993041992, "global_step": 196143, "epoch": 2363} {"train_loss": -23.91552734375, "global_step": 196144, "epoch": 2363} {"train_loss": -23.844345092773438, "global_step": 196145, "epoch": 2363} {"train_loss": -24.10420036315918, "global_step": 196146, "epoch": 2363} {"train_loss": -24.20009422302246, "global_step": 196147, "epoch": 2363} {"train_loss": -23.84505271911621, "global_step": 196148, "epoch": 2363} {"train_loss": -24.22861099243164, "global_step": 196149, "epoch": 2363} {"train_loss": -23.782556533813477, "global_step": 196150, "epoch": 2363} {"train_loss": -24.342525482177734, "global_step": 196151, "epoch": 2363} {"train_loss": -24.25187110900879, "global_step": 196152, "epoch": 2363} {"train_loss": -24.067712783813477, "global_step": 196153, "epoch": 2363} {"train_loss": -24.70255470275879, "global_step": 196154, "epoch": 2363} {"train_loss": -23.945148468017578, "global_step": 196155, "epoch": 2363} {"train_loss": -24.1759090423584, "global_step": 196156, "epoch": 2363} {"train_loss": -24.44132423400879, "global_step": 196157, "epoch": 2363} {"train_loss": -23.852169036865234, "global_step": 196158, "epoch": 2363} {"train_loss": -24.077289581298828, "global_step": 196159, "epoch": 2363} {"train_loss": -23.9012508392334, "global_step": 196160, "epoch": 2363} {"train_loss": -24.097522735595703, "global_step": 196161, "epoch": 2363} {"train_loss": -23.931392669677734, "global_step": 196162, "epoch": 2363} {"train_loss": -24.478647232055664, "global_step": 196163, "epoch": 2363} {"train_loss": -24.227039337158203, "global_step": 196164, "epoch": 2363} {"train_loss": -24.275455474853516, "global_step": 196165, "epoch": 2363} {"train_loss": -24.280981063842773, "global_step": 196166, "epoch": 2363} {"train_loss": -24.259035110473633, "global_step": 196167, "epoch": 2363} {"train_loss": -24.113100051879883, "global_step": 196168, "epoch": 2363} {"train_loss": -23.907209396362305, "global_step": 196169, "epoch": 2363} {"train_loss": -24.330711364746094, "global_step": 196170, "epoch": 2363} {"train_loss": -24.321887969970703, "global_step": 196171, "epoch": 2363} {"train_loss": -24.029338836669922, "global_step": 196172, "epoch": 2363} {"train_loss": -23.832273483276367, "global_step": 196173, "epoch": 2363} {"train_loss": -24.200176239013672, "global_step": 196174, "epoch": 2363} {"train_loss": -24.64607810974121, "global_step": 196175, "epoch": 2363} {"train_loss": -24.31431007385254, "global_step": 196176, "epoch": 2363} {"train_loss": -24.442607879638672, "global_step": 196177, "epoch": 2363} {"train_loss": -23.876989364624023, "global_step": 196178, "epoch": 2363} {"train_loss": -24.32025718688965, "global_step": 196179, "epoch": 2363} {"train_loss": -24.452348709106445, "global_step": 196180, "epoch": 2363} {"train_loss": -24.41229820251465, "global_step": 196181, "epoch": 2363} {"train_loss": -24.138019561767578, "global_step": 196182, "epoch": 2363} {"train_loss": -24.37810707092285, "global_step": 196183, "epoch": 2363} {"train_loss": -24.51022720336914, "global_step": 196184, "epoch": 2363} {"train_loss": -23.585622787475586, "global_step": 196185, "epoch": 2363} {"train_loss": -23.597604751586914, "global_step": 196186, "epoch": 2363} {"train_loss": -23.653806686401367, "global_step": 196187, "epoch": 2363} {"train_loss": -23.900094985961914, "global_step": 196188, "epoch": 2363} {"train_loss": -24.2023983001709, "global_step": 196189, "epoch": 2363} {"train_loss": -23.715301513671875, "global_step": 196190, "epoch": 2363} {"train_loss": -23.92133140563965, "global_step": 196191, "epoch": 2363} {"train_loss": -24.198484420776367, "global_step": 196192, "epoch": 2363} {"train_loss": -23.90970802307129, "global_step": 196193, "epoch": 2363} {"train_loss": -23.666749954223633, "global_step": 196194, "epoch": 2363} {"train_loss": -23.918996810913086, "global_step": 196195, "epoch": 2363} {"train_loss": -23.89986801147461, "global_step": 196196, "epoch": 2363} {"train_loss": -23.80939292907715, "global_step": 196197, "epoch": 2363} {"train_loss": -23.861719131469727, "global_step": 196198, "epoch": 2363} {"train_loss": -24.13392448425293, "global_step": 196199, "epoch": 2363} {"train_loss": -23.855192184448242, "global_step": 196200, "epoch": 2363} {"train_loss": -24.158369064331055, "global_step": 196201, "epoch": 2363} {"train_loss": -24.013078689575195, "global_step": 196202, "epoch": 2363} {"train_loss": -24.1368350982666, "global_step": 196203, "epoch": 2363} {"train_loss": -23.786283493041992, "global_step": 196204, "epoch": 2363} {"train_loss": -23.95717430114746, "global_step": 196205, "epoch": 2363} {"train_loss": -23.811203002929688, "global_step": 196206, "epoch": 2363} {"train_loss": -24.039636611938477, "global_step": 196207, "epoch": 2363} {"train_loss": -23.905576705932617, "global_step": 196208, "epoch": 2363} {"train_loss": -23.987760543823242, "global_step": 196209, "epoch": 2363} {"train_loss": -23.97493553161621, "global_step": 196210, "epoch": 2363} {"train_loss": -24.01819913933076, "global_step": 196211, "epoch": 2363, "val_loss": 6571877.0} {"train_loss": -23.587894439697266, "global_step": 196212, "epoch": 2364} {"train_loss": -23.614471435546875, "global_step": 196213, "epoch": 2364} {"train_loss": -23.795705795288086, "global_step": 196214, "epoch": 2364} {"train_loss": -23.847171783447266, "global_step": 196215, "epoch": 2364} {"train_loss": -24.005752563476562, "global_step": 196216, "epoch": 2364} {"train_loss": -24.025543212890625, "global_step": 196217, "epoch": 2364} {"train_loss": -23.919963836669922, "global_step": 196218, "epoch": 2364} {"train_loss": -24.093067169189453, "global_step": 196219, "epoch": 2364} {"train_loss": -23.954608917236328, "global_step": 196220, "epoch": 2364} {"train_loss": -24.30446434020996, "global_step": 196221, "epoch": 2364} {"train_loss": -23.837162017822266, "global_step": 196222, "epoch": 2364} {"train_loss": -24.22397232055664, "global_step": 196223, "epoch": 2364} {"train_loss": -23.90620231628418, "global_step": 196224, "epoch": 2364} {"train_loss": -23.749975204467773, "global_step": 196225, "epoch": 2364} {"train_loss": -24.03531265258789, "global_step": 196226, "epoch": 2364} {"train_loss": -24.230146408081055, "global_step": 196227, "epoch": 2364} {"train_loss": -24.07636260986328, "global_step": 196228, "epoch": 2364} {"train_loss": -24.387744903564453, "global_step": 196229, "epoch": 2364} {"train_loss": -23.998441696166992, "global_step": 196230, "epoch": 2364} {"train_loss": -24.039386749267578, "global_step": 196231, "epoch": 2364} {"train_loss": -23.93858528137207, "global_step": 196232, "epoch": 2364} {"train_loss": -23.938413619995117, "global_step": 196233, "epoch": 2364} {"train_loss": -24.375402450561523, "global_step": 196234, "epoch": 2364} {"train_loss": -24.23825454711914, "global_step": 196235, "epoch": 2364} {"train_loss": -24.040143966674805, "global_step": 196236, "epoch": 2364} {"train_loss": -24.41550064086914, "global_step": 196237, "epoch": 2364} {"train_loss": -23.99406623840332, "global_step": 196238, "epoch": 2364} {"train_loss": -24.299938201904297, "global_step": 196239, "epoch": 2364} {"train_loss": -23.899076461791992, "global_step": 196240, "epoch": 2364} {"train_loss": -24.387954711914062, "global_step": 196241, "epoch": 2364} {"train_loss": -24.625089645385742, "global_step": 196242, "epoch": 2364} {"train_loss": -24.2456111907959, "global_step": 196243, "epoch": 2364} {"train_loss": -24.05524253845215, "global_step": 196244, "epoch": 2364} {"train_loss": -24.096607208251953, "global_step": 196245, "epoch": 2364} {"train_loss": -24.422317504882812, "global_step": 196246, "epoch": 2364} {"train_loss": -24.472951889038086, "global_step": 196247, "epoch": 2364} {"train_loss": -24.020767211914062, "global_step": 196248, "epoch": 2364} {"train_loss": -24.428298950195312, "global_step": 196249, "epoch": 2364} {"train_loss": -23.943689346313477, "global_step": 196250, "epoch": 2364} {"train_loss": -23.927534103393555, "global_step": 196251, "epoch": 2364} {"train_loss": -24.242815017700195, "global_step": 196252, "epoch": 2364} {"train_loss": -24.573139190673828, "global_step": 196253, "epoch": 2364} {"train_loss": -23.997610092163086, "global_step": 196254, "epoch": 2364} {"train_loss": -24.38605499267578, "global_step": 196255, "epoch": 2364} {"train_loss": -24.00145149230957, "global_step": 196256, "epoch": 2364} {"train_loss": -24.319446563720703, "global_step": 196257, "epoch": 2364} {"train_loss": -24.4072322845459, "global_step": 196258, "epoch": 2364} {"train_loss": -24.027511596679688, "global_step": 196259, "epoch": 2364} {"train_loss": -24.379310607910156, "global_step": 196260, "epoch": 2364} {"train_loss": -24.29355239868164, "global_step": 196261, "epoch": 2364} {"train_loss": -23.706682205200195, "global_step": 196262, "epoch": 2364} {"train_loss": -24.88691520690918, "global_step": 196263, "epoch": 2364} {"train_loss": -24.707387924194336, "global_step": 196264, "epoch": 2364} {"train_loss": -24.517667770385742, "global_step": 196265, "epoch": 2364} {"train_loss": -24.14278221130371, "global_step": 196266, "epoch": 2364} {"train_loss": -24.017486572265625, "global_step": 196267, "epoch": 2364} {"train_loss": -24.201780319213867, "global_step": 196268, "epoch": 2364} {"train_loss": -24.455350875854492, "global_step": 196269, "epoch": 2364} {"train_loss": -23.929214477539062, "global_step": 196270, "epoch": 2364} {"train_loss": -24.135656356811523, "global_step": 196271, "epoch": 2364} {"train_loss": -23.9837703704834, "global_step": 196272, "epoch": 2364} {"train_loss": -23.964704513549805, "global_step": 196273, "epoch": 2364} {"train_loss": -24.085678100585938, "global_step": 196274, "epoch": 2364} {"train_loss": -24.04155731201172, "global_step": 196275, "epoch": 2364} {"train_loss": -23.889917373657227, "global_step": 196276, "epoch": 2364} {"train_loss": -23.939748764038086, "global_step": 196277, "epoch": 2364} {"train_loss": -24.08754539489746, "global_step": 196278, "epoch": 2364} {"train_loss": -23.829254150390625, "global_step": 196279, "epoch": 2364} {"train_loss": -23.573291778564453, "global_step": 196280, "epoch": 2364} {"train_loss": -24.172775268554688, "global_step": 196281, "epoch": 2364} {"train_loss": -23.79274559020996, "global_step": 196282, "epoch": 2364} {"train_loss": -24.016040802001953, "global_step": 196283, "epoch": 2364} {"train_loss": -23.864543914794922, "global_step": 196284, "epoch": 2364} {"train_loss": -23.849279403686523, "global_step": 196285, "epoch": 2364} {"train_loss": -24.1784725189209, "global_step": 196286, "epoch": 2364} {"train_loss": -23.82023048400879, "global_step": 196287, "epoch": 2364} {"train_loss": -24.191200256347656, "global_step": 196288, "epoch": 2364} {"train_loss": -24.20746612548828, "global_step": 196289, "epoch": 2364} {"train_loss": -23.908105850219727, "global_step": 196290, "epoch": 2364} {"train_loss": -24.123022079467773, "global_step": 196291, "epoch": 2364} {"train_loss": -24.2181396484375, "global_step": 196292, "epoch": 2364} {"train_loss": -24.376253128051758, "global_step": 196293, "epoch": 2364} {"train_loss": -24.085361526673097, "global_step": 196294, "epoch": 2364, "val_loss": 6530609.5} {"train_loss": -23.698394775390625, "global_step": 196295, "epoch": 2365} {"train_loss": -23.920019149780273, "global_step": 196296, "epoch": 2365} {"train_loss": -24.07250213623047, "global_step": 196297, "epoch": 2365} {"train_loss": -23.833250045776367, "global_step": 196298, "epoch": 2365} {"train_loss": -24.10822868347168, "global_step": 196299, "epoch": 2365} {"train_loss": -23.37330436706543, "global_step": 196300, "epoch": 2365} {"train_loss": -23.743560791015625, "global_step": 196301, "epoch": 2365} {"train_loss": -23.98461151123047, "global_step": 196302, "epoch": 2365} {"train_loss": -24.12507438659668, "global_step": 196303, "epoch": 2365} {"train_loss": -23.39217758178711, "global_step": 196304, "epoch": 2365} {"train_loss": -23.78669548034668, "global_step": 196305, "epoch": 2365} {"train_loss": -24.21669578552246, "global_step": 196306, "epoch": 2365} {"train_loss": -23.962873458862305, "global_step": 196307, "epoch": 2365} {"train_loss": -24.300296783447266, "global_step": 196308, "epoch": 2365} {"train_loss": -23.951581954956055, "global_step": 196309, "epoch": 2365} {"train_loss": -24.287134170532227, "global_step": 196310, "epoch": 2365} {"train_loss": -24.420007705688477, "global_step": 196311, "epoch": 2365} {"train_loss": -24.05563735961914, "global_step": 196312, "epoch": 2365} {"train_loss": -24.267284393310547, "global_step": 196313, "epoch": 2365} {"train_loss": -24.018774032592773, "global_step": 196314, "epoch": 2365} {"train_loss": -24.320693969726562, "global_step": 196315, "epoch": 2365} {"train_loss": -24.635469436645508, "global_step": 196316, "epoch": 2365} {"train_loss": -24.325162887573242, "global_step": 196317, "epoch": 2365} {"train_loss": -24.226367950439453, "global_step": 196318, "epoch": 2365} {"train_loss": -24.08881187438965, "global_step": 196319, "epoch": 2365} {"train_loss": -24.302738189697266, "global_step": 196320, "epoch": 2365} {"train_loss": -24.169452667236328, "global_step": 196321, "epoch": 2365} {"train_loss": -24.704469680786133, "global_step": 196322, "epoch": 2365} {"train_loss": -24.17987823486328, "global_step": 196323, "epoch": 2365} {"train_loss": -24.200456619262695, "global_step": 196324, "epoch": 2365} {"train_loss": -24.173185348510742, "global_step": 196325, "epoch": 2365} {"train_loss": -24.384695053100586, "global_step": 196326, "epoch": 2365} {"train_loss": -24.277257919311523, "global_step": 196327, "epoch": 2365} {"train_loss": -24.29138946533203, "global_step": 196328, "epoch": 2365} {"train_loss": -24.513601303100586, "global_step": 196329, "epoch": 2365} {"train_loss": -23.9312801361084, "global_step": 196330, "epoch": 2365} {"train_loss": -23.999265670776367, "global_step": 196331, "epoch": 2365} {"train_loss": -24.458202362060547, "global_step": 196332, "epoch": 2365} {"train_loss": -24.431861877441406, "global_step": 196333, "epoch": 2365} {"train_loss": -24.416162490844727, "global_step": 196334, "epoch": 2365} {"train_loss": -24.027517318725586, "global_step": 196335, "epoch": 2365} {"train_loss": -24.285057067871094, "global_step": 196336, "epoch": 2365} {"train_loss": -24.518041610717773, "global_step": 196337, "epoch": 2365} {"train_loss": -24.135129928588867, "global_step": 196338, "epoch": 2365} {"train_loss": -24.121002197265625, "global_step": 196339, "epoch": 2365} {"train_loss": -24.185333251953125, "global_step": 196340, "epoch": 2365} {"train_loss": -24.263151168823242, "global_step": 196341, "epoch": 2365} {"train_loss": -24.09541130065918, "global_step": 196342, "epoch": 2365} {"train_loss": -24.15666961669922, "global_step": 196343, "epoch": 2365} {"train_loss": -24.19191551208496, "global_step": 196344, "epoch": 2365} {"train_loss": -24.197067260742188, "global_step": 196345, "epoch": 2365} {"train_loss": -24.301162719726562, "global_step": 196346, "epoch": 2365} {"train_loss": -24.169082641601562, "global_step": 196347, "epoch": 2365} {"train_loss": -24.330591201782227, "global_step": 196348, "epoch": 2365} {"train_loss": -24.10712242126465, "global_step": 196349, "epoch": 2365} {"train_loss": -24.396543502807617, "global_step": 196350, "epoch": 2365} {"train_loss": -24.09808921813965, "global_step": 196351, "epoch": 2365} {"train_loss": -23.97345542907715, "global_step": 196352, "epoch": 2365} {"train_loss": -23.963388442993164, "global_step": 196353, "epoch": 2365} {"train_loss": -23.985782623291016, "global_step": 196354, "epoch": 2365} {"train_loss": -24.408737182617188, "global_step": 196355, "epoch": 2365} {"train_loss": -24.469343185424805, "global_step": 196356, "epoch": 2365} {"train_loss": -24.23428726196289, "global_step": 196357, "epoch": 2365} {"train_loss": -24.070999145507812, "global_step": 196358, "epoch": 2365} {"train_loss": -23.984914779663086, "global_step": 196359, "epoch": 2365} {"train_loss": -23.68608856201172, "global_step": 196360, "epoch": 2365} {"train_loss": -23.57474136352539, "global_step": 196361, "epoch": 2365} {"train_loss": -23.95490837097168, "global_step": 196362, "epoch": 2365} {"train_loss": -24.067174911499023, "global_step": 196363, "epoch": 2365} {"train_loss": -23.581634521484375, "global_step": 196364, "epoch": 2365} {"train_loss": -24.027233123779297, "global_step": 196365, "epoch": 2365} {"train_loss": -24.00162124633789, "global_step": 196366, "epoch": 2365} {"train_loss": -23.98027992248535, "global_step": 196367, "epoch": 2365} {"train_loss": -23.98849868774414, "global_step": 196368, "epoch": 2365} {"train_loss": -24.22654151916504, "global_step": 196369, "epoch": 2365} {"train_loss": -23.775938034057617, "global_step": 196370, "epoch": 2365} {"train_loss": -24.415090560913086, "global_step": 196371, "epoch": 2365} {"train_loss": -23.71631622314453, "global_step": 196372, "epoch": 2365} {"train_loss": -24.07520294189453, "global_step": 196373, "epoch": 2365} {"train_loss": -23.756025314331055, "global_step": 196374, "epoch": 2365} {"train_loss": -23.855894088745117, "global_step": 196375, "epoch": 2365} {"train_loss": -24.14497184753418, "global_step": 196376, "epoch": 2365} {"train_loss": -24.106791760548052, "global_step": 196377, "epoch": 2365, "val_loss": 6596039.0} {"train_loss": -23.628131866455078, "global_step": 196378, "epoch": 2366} {"train_loss": -23.86334800720215, "global_step": 196379, "epoch": 2366} {"train_loss": -24.023191452026367, "global_step": 196380, "epoch": 2366} {"train_loss": -23.914255142211914, "global_step": 196381, "epoch": 2366} {"train_loss": -23.99126434326172, "global_step": 196382, "epoch": 2366} {"train_loss": -24.174203872680664, "global_step": 196383, "epoch": 2366} {"train_loss": -24.195589065551758, "global_step": 196384, "epoch": 2366} {"train_loss": -23.730560302734375, "global_step": 196385, "epoch": 2366} {"train_loss": -24.033166885375977, "global_step": 196386, "epoch": 2366} {"train_loss": -24.12601089477539, "global_step": 196387, "epoch": 2366} {"train_loss": -23.436094284057617, "global_step": 196388, "epoch": 2366} {"train_loss": -23.662919998168945, "global_step": 196389, "epoch": 2366} {"train_loss": -23.57807731628418, "global_step": 196390, "epoch": 2366} {"train_loss": -24.242971420288086, "global_step": 196391, "epoch": 2366} {"train_loss": -23.888809204101562, "global_step": 196392, "epoch": 2366} {"train_loss": -24.18755340576172, "global_step": 196393, "epoch": 2366} {"train_loss": -24.219440460205078, "global_step": 196394, "epoch": 2366} {"train_loss": -24.303125381469727, "global_step": 196395, "epoch": 2366} {"train_loss": -24.06084632873535, "global_step": 196396, "epoch": 2366} {"train_loss": -24.25971031188965, "global_step": 196397, "epoch": 2366} {"train_loss": -24.154069900512695, "global_step": 196398, "epoch": 2366} {"train_loss": -24.10377311706543, "global_step": 196399, "epoch": 2366} {"train_loss": -24.014249801635742, "global_step": 196400, "epoch": 2366} {"train_loss": -24.27581787109375, "global_step": 196401, "epoch": 2366} {"train_loss": -24.317041397094727, "global_step": 196402, "epoch": 2366} {"train_loss": -23.591266632080078, "global_step": 196403, "epoch": 2366} {"train_loss": -24.055265426635742, "global_step": 196404, "epoch": 2366} {"train_loss": -24.1313533782959, "global_step": 196405, "epoch": 2366} {"train_loss": -24.03334617614746, "global_step": 196406, "epoch": 2366} {"train_loss": -24.084266662597656, "global_step": 196407, "epoch": 2366} {"train_loss": -24.635284423828125, "global_step": 196408, "epoch": 2366} {"train_loss": -24.37874412536621, "global_step": 196409, "epoch": 2366} {"train_loss": -24.350217819213867, "global_step": 196410, "epoch": 2366} {"train_loss": -24.24274253845215, "global_step": 196411, "epoch": 2366} {"train_loss": -24.327199935913086, "global_step": 196412, "epoch": 2366} {"train_loss": -23.92611312866211, "global_step": 196413, "epoch": 2366} {"train_loss": -24.656721115112305, "global_step": 196414, "epoch": 2366} {"train_loss": -24.38819694519043, "global_step": 196415, "epoch": 2366} {"train_loss": -24.716087341308594, "global_step": 196416, "epoch": 2366} {"train_loss": -24.00306510925293, "global_step": 196417, "epoch": 2366} {"train_loss": -24.265830993652344, "global_step": 196418, "epoch": 2366} {"train_loss": -24.11368751525879, "global_step": 196419, "epoch": 2366} {"train_loss": -24.72042465209961, "global_step": 196420, "epoch": 2366} {"train_loss": -24.54831886291504, "global_step": 196421, "epoch": 2366} {"train_loss": -24.544008255004883, "global_step": 196422, "epoch": 2366} {"train_loss": -24.47632598876953, "global_step": 196423, "epoch": 2366} {"train_loss": -24.249723434448242, "global_step": 196424, "epoch": 2366} {"train_loss": -23.890836715698242, "global_step": 196425, "epoch": 2366} {"train_loss": -24.09121322631836, "global_step": 196426, "epoch": 2366} {"train_loss": -24.346120834350586, "global_step": 196427, "epoch": 2366} {"train_loss": -24.137189865112305, "global_step": 196428, "epoch": 2366} {"train_loss": -24.081525802612305, "global_step": 196429, "epoch": 2366} {"train_loss": -24.55391502380371, "global_step": 196430, "epoch": 2366} {"train_loss": -24.311525344848633, "global_step": 196431, "epoch": 2366} {"train_loss": -24.41621208190918, "global_step": 196432, "epoch": 2366} {"train_loss": -24.252151489257812, "global_step": 196433, "epoch": 2366} {"train_loss": -24.10084342956543, "global_step": 196434, "epoch": 2366} {"train_loss": -24.23931121826172, "global_step": 196435, "epoch": 2366} {"train_loss": -24.10975456237793, "global_step": 196436, "epoch": 2366} {"train_loss": -24.082717895507812, "global_step": 196437, "epoch": 2366} {"train_loss": -23.972305297851562, "global_step": 196438, "epoch": 2366} {"train_loss": -24.418127059936523, "global_step": 196439, "epoch": 2366} {"train_loss": -24.632694244384766, "global_step": 196440, "epoch": 2366} {"train_loss": -24.281644821166992, "global_step": 196441, "epoch": 2366} {"train_loss": -24.313913345336914, "global_step": 196442, "epoch": 2366} {"train_loss": -24.24704933166504, "global_step": 196443, "epoch": 2366} {"train_loss": -24.321001052856445, "global_step": 196444, "epoch": 2366} {"train_loss": -24.298229217529297, "global_step": 196445, "epoch": 2366} {"train_loss": -24.207788467407227, "global_step": 196446, "epoch": 2366} {"train_loss": -24.770803451538086, "global_step": 196447, "epoch": 2366} {"train_loss": -23.955310821533203, "global_step": 196448, "epoch": 2366} {"train_loss": -24.08917808532715, "global_step": 196449, "epoch": 2366} {"train_loss": -24.141647338867188, "global_step": 196450, "epoch": 2366} {"train_loss": -24.191162109375, "global_step": 196451, "epoch": 2366} {"train_loss": -23.95196533203125, "global_step": 196452, "epoch": 2366} {"train_loss": -24.04294204711914, "global_step": 196453, "epoch": 2366} {"train_loss": -24.087238311767578, "global_step": 196454, "epoch": 2366} {"train_loss": -23.911054611206055, "global_step": 196455, "epoch": 2366} {"train_loss": -24.071598052978516, "global_step": 196456, "epoch": 2366} {"train_loss": -24.202062606811523, "global_step": 196457, "epoch": 2366} {"train_loss": -24.009485244750977, "global_step": 196458, "epoch": 2366} {"train_loss": -24.207326889038086, "global_step": 196459, "epoch": 2366} {"train_loss": -24.16916548487652, "global_step": 196460, "epoch": 2366, "val_loss": 6561373.5} {"train_loss": -23.510406494140625, "global_step": 196461, "epoch": 2367} {"train_loss": -23.517587661743164, "global_step": 196462, "epoch": 2367} {"train_loss": -23.65242576599121, "global_step": 196463, "epoch": 2367} {"train_loss": -23.829668045043945, "global_step": 196464, "epoch": 2367} {"train_loss": -24.00274658203125, "global_step": 196465, "epoch": 2367} {"train_loss": -23.88246726989746, "global_step": 196466, "epoch": 2367} {"train_loss": -23.644697189331055, "global_step": 196467, "epoch": 2367} {"train_loss": -23.803150177001953, "global_step": 196468, "epoch": 2367} {"train_loss": -23.58087158203125, "global_step": 196469, "epoch": 2367} {"train_loss": -23.94647216796875, "global_step": 196470, "epoch": 2367} {"train_loss": -23.650190353393555, "global_step": 196471, "epoch": 2367} {"train_loss": -23.977094650268555, "global_step": 196472, "epoch": 2367} {"train_loss": -23.790815353393555, "global_step": 196473, "epoch": 2367} {"train_loss": -23.551532745361328, "global_step": 196474, "epoch": 2367} {"train_loss": -23.956912994384766, "global_step": 196475, "epoch": 2367} {"train_loss": -24.27616310119629, "global_step": 196476, "epoch": 2367} {"train_loss": -23.901962280273438, "global_step": 196477, "epoch": 2367} {"train_loss": -23.78793716430664, "global_step": 196478, "epoch": 2367} {"train_loss": -23.797447204589844, "global_step": 196479, "epoch": 2367} {"train_loss": -24.4344482421875, "global_step": 196480, "epoch": 2367} {"train_loss": -24.435537338256836, "global_step": 196481, "epoch": 2367} {"train_loss": -24.44405174255371, "global_step": 196482, "epoch": 2367} {"train_loss": -23.765121459960938, "global_step": 196483, "epoch": 2367} {"train_loss": -24.292150497436523, "global_step": 196484, "epoch": 2367} {"train_loss": -23.840829849243164, "global_step": 196485, "epoch": 2367} {"train_loss": -23.906293869018555, "global_step": 196486, "epoch": 2367} {"train_loss": -24.4246768951416, "global_step": 196487, "epoch": 2367} {"train_loss": -24.278352737426758, "global_step": 196488, "epoch": 2367} {"train_loss": -24.305973052978516, "global_step": 196489, "epoch": 2367} {"train_loss": -24.497976303100586, "global_step": 196490, "epoch": 2367} {"train_loss": -24.326570510864258, "global_step": 196491, "epoch": 2367} {"train_loss": -24.287006378173828, "global_step": 196492, "epoch": 2367} {"train_loss": -24.192367553710938, "global_step": 196493, "epoch": 2367} {"train_loss": -24.087430953979492, "global_step": 196494, "epoch": 2367} {"train_loss": -24.24268913269043, "global_step": 196495, "epoch": 2367} {"train_loss": -24.513463973999023, "global_step": 196496, "epoch": 2367} {"train_loss": -24.1884822845459, "global_step": 196497, "epoch": 2367} {"train_loss": -24.531389236450195, "global_step": 196498, "epoch": 2367} {"train_loss": -24.402570724487305, "global_step": 196499, "epoch": 2367} {"train_loss": -24.70796012878418, "global_step": 196500, "epoch": 2367} {"train_loss": -24.27741050720215, "global_step": 196501, "epoch": 2367} {"train_loss": -24.02680015563965, "global_step": 196502, "epoch": 2367} {"train_loss": -24.43940544128418, "global_step": 196503, "epoch": 2367} {"train_loss": -24.370031356811523, "global_step": 196504, "epoch": 2367} {"train_loss": -24.533950805664062, "global_step": 196505, "epoch": 2367} {"train_loss": -23.781463623046875, "global_step": 196506, "epoch": 2367} {"train_loss": -23.859712600708008, "global_step": 196507, "epoch": 2367} {"train_loss": -24.462574005126953, "global_step": 196508, "epoch": 2367} {"train_loss": -24.28529930114746, "global_step": 196509, "epoch": 2367} {"train_loss": -23.893115997314453, "global_step": 196510, "epoch": 2367} {"train_loss": -24.324907302856445, "global_step": 196511, "epoch": 2367} {"train_loss": -24.58477210998535, "global_step": 196512, "epoch": 2367} {"train_loss": -24.280832290649414, "global_step": 196513, "epoch": 2367} {"train_loss": -24.338293075561523, "global_step": 196514, "epoch": 2367} {"train_loss": -24.30190086364746, "global_step": 196515, "epoch": 2367} {"train_loss": -23.939197540283203, "global_step": 196516, "epoch": 2367} {"train_loss": -24.14285659790039, "global_step": 196517, "epoch": 2367} {"train_loss": -24.105539321899414, "global_step": 196518, "epoch": 2367} {"train_loss": -24.227420806884766, "global_step": 196519, "epoch": 2367} {"train_loss": -23.961692810058594, "global_step": 196520, "epoch": 2367} {"train_loss": -23.88104820251465, "global_step": 196521, "epoch": 2367} {"train_loss": -23.68178367614746, "global_step": 196522, "epoch": 2367} {"train_loss": -24.269561767578125, "global_step": 196523, "epoch": 2367} {"train_loss": -24.27788734436035, "global_step": 196524, "epoch": 2367} {"train_loss": -24.380224227905273, "global_step": 196525, "epoch": 2367} {"train_loss": -24.105152130126953, "global_step": 196526, "epoch": 2367} {"train_loss": -24.399932861328125, "global_step": 196527, "epoch": 2367} {"train_loss": -24.06343650817871, "global_step": 196528, "epoch": 2367} {"train_loss": -24.319538116455078, "global_step": 196529, "epoch": 2367} {"train_loss": -24.145462036132812, "global_step": 196530, "epoch": 2367} {"train_loss": -24.127519607543945, "global_step": 196531, "epoch": 2367} {"train_loss": -24.031198501586914, "global_step": 196532, "epoch": 2367} {"train_loss": -23.894702911376953, "global_step": 196533, "epoch": 2367} {"train_loss": -24.275712966918945, "global_step": 196534, "epoch": 2367} {"train_loss": -24.065017700195312, "global_step": 196535, "epoch": 2367} {"train_loss": -23.99466896057129, "global_step": 196536, "epoch": 2367} {"train_loss": -24.24036979675293, "global_step": 196537, "epoch": 2367} {"train_loss": -23.990896224975586, "global_step": 196538, "epoch": 2367} {"train_loss": -24.19215202331543, "global_step": 196539, "epoch": 2367} {"train_loss": -24.205162048339844, "global_step": 196540, "epoch": 2367} {"train_loss": -23.9688720703125, "global_step": 196541, "epoch": 2367} {"train_loss": -24.20171356201172, "global_step": 196542, "epoch": 2367} {"train_loss": -24.103658630187255, "global_step": 196543, "epoch": 2367, "val_loss": 6535017.0} {"train_loss": -23.132522583007812, "global_step": 196544, "epoch": 2368} {"train_loss": -23.035064697265625, "global_step": 196545, "epoch": 2368} {"train_loss": -23.786619186401367, "global_step": 196546, "epoch": 2368} {"train_loss": -23.60677146911621, "global_step": 196547, "epoch": 2368} {"train_loss": -23.578397750854492, "global_step": 196548, "epoch": 2368} {"train_loss": -23.442493438720703, "global_step": 196549, "epoch": 2368} {"train_loss": -23.571313858032227, "global_step": 196550, "epoch": 2368} {"train_loss": -23.610857009887695, "global_step": 196551, "epoch": 2368} {"train_loss": -23.835708618164062, "global_step": 196552, "epoch": 2368} {"train_loss": -24.216184616088867, "global_step": 196553, "epoch": 2368} {"train_loss": -23.52303123474121, "global_step": 196554, "epoch": 2368} {"train_loss": -24.031591415405273, "global_step": 196555, "epoch": 2368} {"train_loss": -23.84037971496582, "global_step": 196556, "epoch": 2368} {"train_loss": -23.696395874023438, "global_step": 196557, "epoch": 2368} {"train_loss": -24.04817008972168, "global_step": 196558, "epoch": 2368} {"train_loss": -23.671676635742188, "global_step": 196559, "epoch": 2368} {"train_loss": -23.74603271484375, "global_step": 196560, "epoch": 2368} {"train_loss": -24.011022567749023, "global_step": 196561, "epoch": 2368} {"train_loss": -23.822477340698242, "global_step": 196562, "epoch": 2368} {"train_loss": -24.17909812927246, "global_step": 196563, "epoch": 2368} {"train_loss": -23.6340389251709, "global_step": 196564, "epoch": 2368} {"train_loss": -24.242618560791016, "global_step": 196565, "epoch": 2368} {"train_loss": -24.0985164642334, "global_step": 196566, "epoch": 2368} {"train_loss": -24.079437255859375, "global_step": 196567, "epoch": 2368} {"train_loss": -24.040943145751953, "global_step": 196568, "epoch": 2368} {"train_loss": -24.1861629486084, "global_step": 196569, "epoch": 2368} {"train_loss": -24.140094757080078, "global_step": 196570, "epoch": 2368} {"train_loss": -24.057897567749023, "global_step": 196571, "epoch": 2368} {"train_loss": -24.213918685913086, "global_step": 196572, "epoch": 2368} {"train_loss": -24.507097244262695, "global_step": 196573, "epoch": 2368} {"train_loss": -24.279394149780273, "global_step": 196574, "epoch": 2368} {"train_loss": -24.27796745300293, "global_step": 196575, "epoch": 2368} {"train_loss": -24.454442977905273, "global_step": 196576, "epoch": 2368} {"train_loss": -24.13987159729004, "global_step": 196577, "epoch": 2368} {"train_loss": -24.194747924804688, "global_step": 196578, "epoch": 2368} {"train_loss": -24.091156005859375, "global_step": 196579, "epoch": 2368} {"train_loss": -24.490188598632812, "global_step": 196580, "epoch": 2368} {"train_loss": -24.07164764404297, "global_step": 196581, "epoch": 2368} {"train_loss": -24.466205596923828, "global_step": 196582, "epoch": 2368} {"train_loss": -24.203927993774414, "global_step": 196583, "epoch": 2368} {"train_loss": -24.236494064331055, "global_step": 196584, "epoch": 2368} {"train_loss": -24.20945167541504, "global_step": 196585, "epoch": 2368} {"train_loss": -24.26595687866211, "global_step": 196586, "epoch": 2368} {"train_loss": -24.405948638916016, "global_step": 196587, "epoch": 2368} {"train_loss": -24.555416107177734, "global_step": 196588, "epoch": 2368} {"train_loss": -24.313180923461914, "global_step": 196589, "epoch": 2368} {"train_loss": -24.381378173828125, "global_step": 196590, "epoch": 2368} {"train_loss": -24.487401962280273, "global_step": 196591, "epoch": 2368} {"train_loss": -24.087350845336914, "global_step": 196592, "epoch": 2368} {"train_loss": -23.89118003845215, "global_step": 196593, "epoch": 2368} {"train_loss": -24.462482452392578, "global_step": 196594, "epoch": 2368} {"train_loss": -24.36952781677246, "global_step": 196595, "epoch": 2368} {"train_loss": -24.155309677124023, "global_step": 196596, "epoch": 2368} {"train_loss": -24.421287536621094, "global_step": 196597, "epoch": 2368} {"train_loss": -24.348194122314453, "global_step": 196598, "epoch": 2368} {"train_loss": -24.3021297454834, "global_step": 196599, "epoch": 2368} {"train_loss": -24.15581703186035, "global_step": 196600, "epoch": 2368} {"train_loss": -24.536483764648438, "global_step": 196601, "epoch": 2368} {"train_loss": -23.816837310791016, "global_step": 196602, "epoch": 2368} {"train_loss": -24.24539566040039, "global_step": 196603, "epoch": 2368} {"train_loss": -24.137922286987305, "global_step": 196604, "epoch": 2368} {"train_loss": -24.19399070739746, "global_step": 196605, "epoch": 2368} {"train_loss": -24.51316261291504, "global_step": 196606, "epoch": 2368} {"train_loss": -23.880382537841797, "global_step": 196607, "epoch": 2368} {"train_loss": -24.201566696166992, "global_step": 196608, "epoch": 2368} {"train_loss": -24.27046775817871, "global_step": 196609, "epoch": 2368} {"train_loss": -24.74507713317871, "global_step": 196610, "epoch": 2368} {"train_loss": -23.985300064086914, "global_step": 196611, "epoch": 2368} {"train_loss": -24.463294982910156, "global_step": 196612, "epoch": 2368} {"train_loss": -24.236278533935547, "global_step": 196613, "epoch": 2368} {"train_loss": -24.02094841003418, "global_step": 196614, "epoch": 2368} {"train_loss": -24.582168579101562, "global_step": 196615, "epoch": 2368} {"train_loss": -24.17146873474121, "global_step": 196616, "epoch": 2368} {"train_loss": -24.232290267944336, "global_step": 196617, "epoch": 2368} {"train_loss": -24.155292510986328, "global_step": 196618, "epoch": 2368} {"train_loss": -24.03413963317871, "global_step": 196619, "epoch": 2368} {"train_loss": -24.071048736572266, "global_step": 196620, "epoch": 2368} {"train_loss": -24.029043197631836, "global_step": 196621, "epoch": 2368} {"train_loss": -24.39426040649414, "global_step": 196622, "epoch": 2368} {"train_loss": -24.202590942382812, "global_step": 196623, "epoch": 2368} {"train_loss": -24.650205612182617, "global_step": 196624, "epoch": 2368} {"train_loss": -24.44024085998535, "global_step": 196625, "epoch": 2368} {"train_loss": -24.121105929455126, "global_step": 196626, "epoch": 2368, "val_loss": 6523610.0} {"train_loss": -23.6881046295166, "global_step": 196627, "epoch": 2369} {"train_loss": -24.407617568969727, "global_step": 196628, "epoch": 2369} {"train_loss": -24.11393165588379, "global_step": 196629, "epoch": 2369} {"train_loss": -24.12212562561035, "global_step": 196630, "epoch": 2369} {"train_loss": -24.2329158782959, "global_step": 196631, "epoch": 2369} {"train_loss": -24.505741119384766, "global_step": 196632, "epoch": 2369} {"train_loss": -24.319488525390625, "global_step": 196633, "epoch": 2369} {"train_loss": -24.102182388305664, "global_step": 196634, "epoch": 2369} {"train_loss": -24.18904685974121, "global_step": 196635, "epoch": 2369} {"train_loss": -24.481809616088867, "global_step": 196636, "epoch": 2369} {"train_loss": -23.910661697387695, "global_step": 196637, "epoch": 2369} {"train_loss": -23.914648056030273, "global_step": 196638, "epoch": 2369} {"train_loss": -24.060537338256836, "global_step": 196639, "epoch": 2369} {"train_loss": -23.860097885131836, "global_step": 196640, "epoch": 2369} {"train_loss": -23.91835594177246, "global_step": 196641, "epoch": 2369} {"train_loss": -23.874418258666992, "global_step": 196642, "epoch": 2369} {"train_loss": -24.38825035095215, "global_step": 196643, "epoch": 2369} {"train_loss": -24.258182525634766, "global_step": 196644, "epoch": 2369} {"train_loss": -24.075658798217773, "global_step": 196645, "epoch": 2369} {"train_loss": -24.19435691833496, "global_step": 196646, "epoch": 2369} {"train_loss": -24.142126083374023, "global_step": 196647, "epoch": 2369} {"train_loss": -23.694446563720703, "global_step": 196648, "epoch": 2369} {"train_loss": -24.292922973632812, "global_step": 196649, "epoch": 2369} {"train_loss": -23.94087028503418, "global_step": 196650, "epoch": 2369} {"train_loss": -24.710058212280273, "global_step": 196651, "epoch": 2369} {"train_loss": -23.787094116210938, "global_step": 196652, "epoch": 2369} {"train_loss": -24.058271408081055, "global_step": 196653, "epoch": 2369} {"train_loss": -24.188831329345703, "global_step": 196654, "epoch": 2369} {"train_loss": -23.6180362701416, "global_step": 196655, "epoch": 2369} {"train_loss": -24.177200317382812, "global_step": 196656, "epoch": 2369} {"train_loss": -24.28741455078125, "global_step": 196657, "epoch": 2369} {"train_loss": -24.205223083496094, "global_step": 196658, "epoch": 2369} {"train_loss": -24.16139793395996, "global_step": 196659, "epoch": 2369} {"train_loss": -24.113828659057617, "global_step": 196660, "epoch": 2369} {"train_loss": -24.43256187438965, "global_step": 196661, "epoch": 2369} {"train_loss": -23.884374618530273, "global_step": 196662, "epoch": 2369} {"train_loss": -24.052337646484375, "global_step": 196663, "epoch": 2369} {"train_loss": -24.03008270263672, "global_step": 196664, "epoch": 2369} {"train_loss": -24.010135650634766, "global_step": 196665, "epoch": 2369} {"train_loss": -23.94778823852539, "global_step": 196666, "epoch": 2369} {"train_loss": -24.404590606689453, "global_step": 196667, "epoch": 2369} {"train_loss": -24.156835556030273, "global_step": 196668, "epoch": 2369} {"train_loss": -24.3137264251709, "global_step": 196669, "epoch": 2369} {"train_loss": -24.36337661743164, "global_step": 196670, "epoch": 2369} {"train_loss": -24.05865478515625, "global_step": 196671, "epoch": 2369} {"train_loss": -24.724811553955078, "global_step": 196672, "epoch": 2369} {"train_loss": -23.89522361755371, "global_step": 196673, "epoch": 2369} {"train_loss": -24.197847366333008, "global_step": 196674, "epoch": 2369} {"train_loss": -24.47654151916504, "global_step": 196675, "epoch": 2369} {"train_loss": -24.03071403503418, "global_step": 196676, "epoch": 2369} {"train_loss": -24.283615112304688, "global_step": 196677, "epoch": 2369} {"train_loss": -24.2435302734375, "global_step": 196678, "epoch": 2369} {"train_loss": -24.298349380493164, "global_step": 196679, "epoch": 2369} {"train_loss": -24.288379669189453, "global_step": 196680, "epoch": 2369} {"train_loss": -24.148855209350586, "global_step": 196681, "epoch": 2369} {"train_loss": -23.748254776000977, "global_step": 196682, "epoch": 2369} {"train_loss": -23.147531509399414, "global_step": 196683, "epoch": 2369} {"train_loss": -23.831830978393555, "global_step": 196684, "epoch": 2369} {"train_loss": -24.132247924804688, "global_step": 196685, "epoch": 2369} {"train_loss": -23.906137466430664, "global_step": 196686, "epoch": 2369} {"train_loss": -24.0368709564209, "global_step": 196687, "epoch": 2369} {"train_loss": -24.55462074279785, "global_step": 196688, "epoch": 2369} {"train_loss": -23.805068969726562, "global_step": 196689, "epoch": 2369} {"train_loss": -24.319223403930664, "global_step": 196690, "epoch": 2369} {"train_loss": -24.08967399597168, "global_step": 196691, "epoch": 2369} {"train_loss": -24.038389205932617, "global_step": 196692, "epoch": 2369} {"train_loss": -23.85260009765625, "global_step": 196693, "epoch": 2369} {"train_loss": -24.08009910583496, "global_step": 196694, "epoch": 2369} {"train_loss": -23.977460861206055, "global_step": 196695, "epoch": 2369} {"train_loss": -23.42875099182129, "global_step": 196696, "epoch": 2369} {"train_loss": -23.580753326416016, "global_step": 196697, "epoch": 2369} {"train_loss": -23.91819190979004, "global_step": 196698, "epoch": 2369} {"train_loss": -24.238143920898438, "global_step": 196699, "epoch": 2369} {"train_loss": -24.043926239013672, "global_step": 196700, "epoch": 2369} {"train_loss": -24.061328887939453, "global_step": 196701, "epoch": 2369} {"train_loss": -24.160005569458008, "global_step": 196702, "epoch": 2369} {"train_loss": -24.082965850830078, "global_step": 196703, "epoch": 2369} {"train_loss": -24.621057510375977, "global_step": 196704, "epoch": 2369} {"train_loss": -24.008895874023438, "global_step": 196705, "epoch": 2369} {"train_loss": -24.050039291381836, "global_step": 196706, "epoch": 2369} {"train_loss": -23.824460983276367, "global_step": 196707, "epoch": 2369} {"train_loss": -24.30002212524414, "global_step": 196708, "epoch": 2369} {"train_loss": -24.108446213136236, "global_step": 196709, "epoch": 2369, "val_loss": 6452099.5} {"train_loss": -21.8716983795166, "global_step": 196710, "epoch": 2370} {"train_loss": -21.545927047729492, "global_step": 196711, "epoch": 2370} {"train_loss": -21.864423751831055, "global_step": 196712, "epoch": 2370} {"train_loss": -22.88445472717285, "global_step": 196713, "epoch": 2370} {"train_loss": -22.45583152770996, "global_step": 196714, "epoch": 2370} {"train_loss": -22.564804077148438, "global_step": 196715, "epoch": 2370} {"train_loss": -22.455564498901367, "global_step": 196716, "epoch": 2370} {"train_loss": -22.983572006225586, "global_step": 196717, "epoch": 2370} {"train_loss": -22.490028381347656, "global_step": 196718, "epoch": 2370} {"train_loss": -23.224172592163086, "global_step": 196719, "epoch": 2370} {"train_loss": -22.493213653564453, "global_step": 196720, "epoch": 2370} {"train_loss": -23.340890884399414, "global_step": 196721, "epoch": 2370} {"train_loss": -23.223485946655273, "global_step": 196722, "epoch": 2370} {"train_loss": -23.31215476989746, "global_step": 196723, "epoch": 2370} {"train_loss": -23.313135147094727, "global_step": 196724, "epoch": 2370} {"train_loss": -23.277982711791992, "global_step": 196725, "epoch": 2370} {"train_loss": -23.297449111938477, "global_step": 196726, "epoch": 2370} {"train_loss": -23.491058349609375, "global_step": 196727, "epoch": 2370} {"train_loss": -23.626087188720703, "global_step": 196728, "epoch": 2370} {"train_loss": -23.730443954467773, "global_step": 196729, "epoch": 2370} {"train_loss": -23.359027862548828, "global_step": 196730, "epoch": 2370} {"train_loss": -23.892839431762695, "global_step": 196731, "epoch": 2370} {"train_loss": -23.432832717895508, "global_step": 196732, "epoch": 2370} {"train_loss": -23.616491317749023, "global_step": 196733, "epoch": 2370} {"train_loss": -23.44650650024414, "global_step": 196734, "epoch": 2370} {"train_loss": -23.71534538269043, "global_step": 196735, "epoch": 2370} {"train_loss": -24.27030372619629, "global_step": 196736, "epoch": 2370} {"train_loss": -24.218603134155273, "global_step": 196737, "epoch": 2370} {"train_loss": -24.07189178466797, "global_step": 196738, "epoch": 2370} {"train_loss": -23.84659194946289, "global_step": 196739, "epoch": 2370} {"train_loss": -23.987333297729492, "global_step": 196740, "epoch": 2370} {"train_loss": -23.750247955322266, "global_step": 196741, "epoch": 2370} {"train_loss": -24.232351303100586, "global_step": 196742, "epoch": 2370} {"train_loss": -24.059553146362305, "global_step": 196743, "epoch": 2370} {"train_loss": -23.801410675048828, "global_step": 196744, "epoch": 2370} {"train_loss": -24.49911117553711, "global_step": 196745, "epoch": 2370} {"train_loss": -23.674489974975586, "global_step": 196746, "epoch": 2370} {"train_loss": -24.305509567260742, "global_step": 196747, "epoch": 2370} {"train_loss": -24.170780181884766, "global_step": 196748, "epoch": 2370} {"train_loss": -23.785903930664062, "global_step": 196749, "epoch": 2370} {"train_loss": -23.902719497680664, "global_step": 196750, "epoch": 2370} {"train_loss": -24.06302261352539, "global_step": 196751, "epoch": 2370} {"train_loss": -24.12031364440918, "global_step": 196752, "epoch": 2370} {"train_loss": -24.346694946289062, "global_step": 196753, "epoch": 2370} {"train_loss": -24.064315795898438, "global_step": 196754, "epoch": 2370} {"train_loss": -24.528024673461914, "global_step": 196755, "epoch": 2370} {"train_loss": -24.41902732849121, "global_step": 196756, "epoch": 2370} {"train_loss": -24.327680587768555, "global_step": 196757, "epoch": 2370} {"train_loss": -24.179182052612305, "global_step": 196758, "epoch": 2370} {"train_loss": -24.3055419921875, "global_step": 196759, "epoch": 2370} {"train_loss": -24.18927001953125, "global_step": 196760, "epoch": 2370} {"train_loss": -24.4078311920166, "global_step": 196761, "epoch": 2370} {"train_loss": -24.001785278320312, "global_step": 196762, "epoch": 2370} {"train_loss": -23.999982833862305, "global_step": 196763, "epoch": 2370} {"train_loss": -24.040029525756836, "global_step": 196764, "epoch": 2370} {"train_loss": -24.068241119384766, "global_step": 196765, "epoch": 2370} {"train_loss": -24.044652938842773, "global_step": 196766, "epoch": 2370} {"train_loss": -23.99256706237793, "global_step": 196767, "epoch": 2370} {"train_loss": -24.044370651245117, "global_step": 196768, "epoch": 2370} {"train_loss": -23.781715393066406, "global_step": 196769, "epoch": 2370} {"train_loss": -23.813457489013672, "global_step": 196770, "epoch": 2370} {"train_loss": -23.66261100769043, "global_step": 196771, "epoch": 2370} {"train_loss": -23.45932960510254, "global_step": 196772, "epoch": 2370} {"train_loss": -24.051273345947266, "global_step": 196773, "epoch": 2370} {"train_loss": -23.890846252441406, "global_step": 196774, "epoch": 2370} {"train_loss": -24.078689575195312, "global_step": 196775, "epoch": 2370} {"train_loss": -24.065990447998047, "global_step": 196776, "epoch": 2370} {"train_loss": -24.09284019470215, "global_step": 196777, "epoch": 2370} {"train_loss": -24.292936325073242, "global_step": 196778, "epoch": 2370} {"train_loss": -24.52157974243164, "global_step": 196779, "epoch": 2370} {"train_loss": -24.369474411010742, "global_step": 196780, "epoch": 2370} {"train_loss": -24.33583641052246, "global_step": 196781, "epoch": 2370} {"train_loss": -24.03574562072754, "global_step": 196782, "epoch": 2370} {"train_loss": -23.966127395629883, "global_step": 196783, "epoch": 2370} {"train_loss": -24.045230865478516, "global_step": 196784, "epoch": 2370} {"train_loss": -24.26877212524414, "global_step": 196785, "epoch": 2370} {"train_loss": -24.080392837524414, "global_step": 196786, "epoch": 2370} {"train_loss": -24.26395606994629, "global_step": 196787, "epoch": 2370} {"train_loss": -24.164684295654297, "global_step": 196788, "epoch": 2370} {"train_loss": -24.28513526916504, "global_step": 196789, "epoch": 2370} {"train_loss": -24.42951774597168, "global_step": 196790, "epoch": 2370} {"train_loss": -23.845609664916992, "global_step": 196791, "epoch": 2370} {"train_loss": -23.74716567993164, "global_step": 196792, "epoch": 2370, "val_loss": 6717291.0} {"train_loss": -23.869787216186523, "global_step": 196793, "epoch": 2371} {"train_loss": -22.58603858947754, "global_step": 196794, "epoch": 2371} {"train_loss": -22.32510757446289, "global_step": 196795, "epoch": 2371} {"train_loss": -22.810394287109375, "global_step": 196796, "epoch": 2371} {"train_loss": -23.49337387084961, "global_step": 196797, "epoch": 2371} {"train_loss": -23.325292587280273, "global_step": 196798, "epoch": 2371} {"train_loss": -23.45523452758789, "global_step": 196799, "epoch": 2371} {"train_loss": -23.4504451751709, "global_step": 196800, "epoch": 2371} {"train_loss": -23.566396713256836, "global_step": 196801, "epoch": 2371} {"train_loss": -23.6721248626709, "global_step": 196802, "epoch": 2371} {"train_loss": -23.5196590423584, "global_step": 196803, "epoch": 2371} {"train_loss": -23.65558433532715, "global_step": 196804, "epoch": 2371} {"train_loss": -23.737186431884766, "global_step": 196805, "epoch": 2371} {"train_loss": -23.820159912109375, "global_step": 196806, "epoch": 2371} {"train_loss": -23.905973434448242, "global_step": 196807, "epoch": 2371} {"train_loss": -23.882410049438477, "global_step": 196808, "epoch": 2371} {"train_loss": -23.598255157470703, "global_step": 196809, "epoch": 2371} {"train_loss": -23.883939743041992, "global_step": 196810, "epoch": 2371} {"train_loss": -23.54880714416504, "global_step": 196811, "epoch": 2371} {"train_loss": -24.214109420776367, "global_step": 196812, "epoch": 2371} {"train_loss": -23.795202255249023, "global_step": 196813, "epoch": 2371} {"train_loss": -23.696537017822266, "global_step": 196814, "epoch": 2371} {"train_loss": -24.03966522216797, "global_step": 196815, "epoch": 2371} {"train_loss": -23.684040069580078, "global_step": 196816, "epoch": 2371} {"train_loss": -24.073511123657227, "global_step": 196817, "epoch": 2371} {"train_loss": -24.06246566772461, "global_step": 196818, "epoch": 2371} {"train_loss": -24.1423397064209, "global_step": 196819, "epoch": 2371} {"train_loss": -23.838830947875977, "global_step": 196820, "epoch": 2371} {"train_loss": -24.38539695739746, "global_step": 196821, "epoch": 2371} {"train_loss": -23.89370346069336, "global_step": 196822, "epoch": 2371} {"train_loss": -23.890094757080078, "global_step": 196823, "epoch": 2371} {"train_loss": -24.268590927124023, "global_step": 196824, "epoch": 2371} {"train_loss": -23.91988754272461, "global_step": 196825, "epoch": 2371} {"train_loss": -24.133893966674805, "global_step": 196826, "epoch": 2371} {"train_loss": -24.467830657958984, "global_step": 196827, "epoch": 2371} {"train_loss": -24.120105743408203, "global_step": 196828, "epoch": 2371} {"train_loss": -24.17142677307129, "global_step": 196829, "epoch": 2371} {"train_loss": -24.767480850219727, "global_step": 196830, "epoch": 2371} {"train_loss": -23.92727279663086, "global_step": 196831, "epoch": 2371} {"train_loss": -24.157262802124023, "global_step": 196832, "epoch": 2371} {"train_loss": -24.312734603881836, "global_step": 196833, "epoch": 2371} {"train_loss": -24.384132385253906, "global_step": 196834, "epoch": 2371} {"train_loss": -24.219701766967773, "global_step": 196835, "epoch": 2371} {"train_loss": -24.544822692871094, "global_step": 196836, "epoch": 2371} {"train_loss": -24.210065841674805, "global_step": 196837, "epoch": 2371} {"train_loss": -24.19398307800293, "global_step": 196838, "epoch": 2371} {"train_loss": -24.19609832763672, "global_step": 196839, "epoch": 2371} {"train_loss": -24.24790382385254, "global_step": 196840, "epoch": 2371} {"train_loss": -24.209474563598633, "global_step": 196841, "epoch": 2371} {"train_loss": -24.40132713317871, "global_step": 196842, "epoch": 2371} {"train_loss": -24.633556365966797, "global_step": 196843, "epoch": 2371} {"train_loss": -24.253768920898438, "global_step": 196844, "epoch": 2371} {"train_loss": -24.29972267150879, "global_step": 196845, "epoch": 2371} {"train_loss": -24.3461856842041, "global_step": 196846, "epoch": 2371} {"train_loss": -23.736764907836914, "global_step": 196847, "epoch": 2371} {"train_loss": -24.281808853149414, "global_step": 196848, "epoch": 2371} {"train_loss": -24.1192569732666, "global_step": 196849, "epoch": 2371} {"train_loss": -24.373872756958008, "global_step": 196850, "epoch": 2371} {"train_loss": -24.17892074584961, "global_step": 196851, "epoch": 2371} {"train_loss": -24.52344512939453, "global_step": 196852, "epoch": 2371} {"train_loss": -24.171493530273438, "global_step": 196853, "epoch": 2371} {"train_loss": -24.497163772583008, "global_step": 196854, "epoch": 2371} {"train_loss": -24.286012649536133, "global_step": 196855, "epoch": 2371} {"train_loss": -24.405494689941406, "global_step": 196856, "epoch": 2371} {"train_loss": -24.22735595703125, "global_step": 196857, "epoch": 2371} {"train_loss": -23.525436401367188, "global_step": 196858, "epoch": 2371} {"train_loss": -24.233686447143555, "global_step": 196859, "epoch": 2371} {"train_loss": -24.458417892456055, "global_step": 196860, "epoch": 2371} {"train_loss": -24.02399444580078, "global_step": 196861, "epoch": 2371} {"train_loss": -24.546276092529297, "global_step": 196862, "epoch": 2371} {"train_loss": -24.252485275268555, "global_step": 196863, "epoch": 2371} {"train_loss": -24.201568603515625, "global_step": 196864, "epoch": 2371} {"train_loss": -24.279457092285156, "global_step": 196865, "epoch": 2371} {"train_loss": -24.453777313232422, "global_step": 196866, "epoch": 2371} {"train_loss": -23.959959030151367, "global_step": 196867, "epoch": 2371} {"train_loss": -24.142038345336914, "global_step": 196868, "epoch": 2371} {"train_loss": -23.91547966003418, "global_step": 196869, "epoch": 2371} {"train_loss": -24.258514404296875, "global_step": 196870, "epoch": 2371} {"train_loss": -24.100677490234375, "global_step": 196871, "epoch": 2371} {"train_loss": -24.186288833618164, "global_step": 196872, "epoch": 2371} {"train_loss": -24.32062339782715, "global_step": 196873, "epoch": 2371} {"train_loss": -24.45656394958496, "global_step": 196874, "epoch": 2371} {"train_loss": -24.023226266883942, "global_step": 196875, "epoch": 2371, "val_loss": 6600788.0} {"train_loss": -23.38511848449707, "global_step": 196876, "epoch": 2372} {"train_loss": -23.584165573120117, "global_step": 196877, "epoch": 2372} {"train_loss": -24.02291488647461, "global_step": 196878, "epoch": 2372} {"train_loss": -23.60943603515625, "global_step": 196879, "epoch": 2372} {"train_loss": -23.731393814086914, "global_step": 196880, "epoch": 2372} {"train_loss": -23.785314559936523, "global_step": 196881, "epoch": 2372} {"train_loss": -23.570890426635742, "global_step": 196882, "epoch": 2372} {"train_loss": -24.02800178527832, "global_step": 196883, "epoch": 2372} {"train_loss": -24.25196647644043, "global_step": 196884, "epoch": 2372} {"train_loss": -23.865690231323242, "global_step": 196885, "epoch": 2372} {"train_loss": -24.30204963684082, "global_step": 196886, "epoch": 2372} {"train_loss": -24.23040199279785, "global_step": 196887, "epoch": 2372} {"train_loss": -24.12325668334961, "global_step": 196888, "epoch": 2372} {"train_loss": -24.290822982788086, "global_step": 196889, "epoch": 2372} {"train_loss": -24.178546905517578, "global_step": 196890, "epoch": 2372} {"train_loss": -24.40558433532715, "global_step": 196891, "epoch": 2372} {"train_loss": -24.01448631286621, "global_step": 196892, "epoch": 2372} {"train_loss": -24.12427520751953, "global_step": 196893, "epoch": 2372} {"train_loss": -24.360029220581055, "global_step": 196894, "epoch": 2372} {"train_loss": -23.970413208007812, "global_step": 196895, "epoch": 2372} {"train_loss": -24.49967384338379, "global_step": 196896, "epoch": 2372} {"train_loss": -24.3579044342041, "global_step": 196897, "epoch": 2372} {"train_loss": -24.15727424621582, "global_step": 196898, "epoch": 2372} {"train_loss": -23.793716430664062, "global_step": 196899, "epoch": 2372} {"train_loss": -24.568359375, "global_step": 196900, "epoch": 2372} {"train_loss": -24.51529312133789, "global_step": 196901, "epoch": 2372} {"train_loss": -24.23166847229004, "global_step": 196902, "epoch": 2372} {"train_loss": -24.042200088500977, "global_step": 196903, "epoch": 2372} {"train_loss": -24.18944549560547, "global_step": 196904, "epoch": 2372} {"train_loss": -24.48302459716797, "global_step": 196905, "epoch": 2372} {"train_loss": -24.55836296081543, "global_step": 196906, "epoch": 2372} {"train_loss": -24.68194580078125, "global_step": 196907, "epoch": 2372} {"train_loss": -24.095123291015625, "global_step": 196908, "epoch": 2372} {"train_loss": -24.04876708984375, "global_step": 196909, "epoch": 2372} {"train_loss": -24.19209861755371, "global_step": 196910, "epoch": 2372} {"train_loss": -24.054004669189453, "global_step": 196911, "epoch": 2372} {"train_loss": -24.160017013549805, "global_step": 196912, "epoch": 2372} {"train_loss": -24.40282440185547, "global_step": 196913, "epoch": 2372} {"train_loss": -24.13887596130371, "global_step": 196914, "epoch": 2372} {"train_loss": -24.14044952392578, "global_step": 196915, "epoch": 2372} {"train_loss": -24.052095413208008, "global_step": 196916, "epoch": 2372} {"train_loss": -24.267532348632812, "global_step": 196917, "epoch": 2372} {"train_loss": -24.335092544555664, "global_step": 196918, "epoch": 2372} {"train_loss": -24.138731002807617, "global_step": 196919, "epoch": 2372} {"train_loss": -24.262664794921875, "global_step": 196920, "epoch": 2372} {"train_loss": -24.0400447845459, "global_step": 196921, "epoch": 2372} {"train_loss": -24.352319717407227, "global_step": 196922, "epoch": 2372} {"train_loss": -24.103376388549805, "global_step": 196923, "epoch": 2372} {"train_loss": -24.543819427490234, "global_step": 196924, "epoch": 2372} {"train_loss": -23.94110107421875, "global_step": 196925, "epoch": 2372} {"train_loss": -24.06166648864746, "global_step": 196926, "epoch": 2372} {"train_loss": -23.89491081237793, "global_step": 196927, "epoch": 2372} {"train_loss": -24.111061096191406, "global_step": 196928, "epoch": 2372} {"train_loss": -24.282888412475586, "global_step": 196929, "epoch": 2372} {"train_loss": -24.363540649414062, "global_step": 196930, "epoch": 2372} {"train_loss": -24.139057159423828, "global_step": 196931, "epoch": 2372} {"train_loss": -24.383432388305664, "global_step": 196932, "epoch": 2372} {"train_loss": -24.338150024414062, "global_step": 196933, "epoch": 2372} {"train_loss": -24.11698341369629, "global_step": 196934, "epoch": 2372} {"train_loss": -24.386310577392578, "global_step": 196935, "epoch": 2372} {"train_loss": -24.11130714416504, "global_step": 196936, "epoch": 2372} {"train_loss": -24.139759063720703, "global_step": 196937, "epoch": 2372} {"train_loss": -24.686355590820312, "global_step": 196938, "epoch": 2372} {"train_loss": -24.197616577148438, "global_step": 196939, "epoch": 2372} {"train_loss": -23.930023193359375, "global_step": 196940, "epoch": 2372} {"train_loss": -24.07946014404297, "global_step": 196941, "epoch": 2372} {"train_loss": -24.282957077026367, "global_step": 196942, "epoch": 2372} {"train_loss": -24.309368133544922, "global_step": 196943, "epoch": 2372} {"train_loss": -24.263507843017578, "global_step": 196944, "epoch": 2372} {"train_loss": -24.222620010375977, "global_step": 196945, "epoch": 2372} {"train_loss": -24.292043685913086, "global_step": 196946, "epoch": 2372} {"train_loss": -24.190673828125, "global_step": 196947, "epoch": 2372} {"train_loss": -24.02120018005371, "global_step": 196948, "epoch": 2372} {"train_loss": -24.51104164123535, "global_step": 196949, "epoch": 2372} {"train_loss": -24.56233787536621, "global_step": 196950, "epoch": 2372} {"train_loss": -24.020893096923828, "global_step": 196951, "epoch": 2372} {"train_loss": -24.06388282775879, "global_step": 196952, "epoch": 2372} {"train_loss": -24.242603302001953, "global_step": 196953, "epoch": 2372} {"train_loss": -23.996936798095703, "global_step": 196954, "epoch": 2372} {"train_loss": -24.39405632019043, "global_step": 196955, "epoch": 2372} {"train_loss": -23.96164321899414, "global_step": 196956, "epoch": 2372} {"train_loss": -24.09316062927246, "global_step": 196957, "epoch": 2372} {"train_loss": -24.1642648168357, "global_step": 196958, "epoch": 2372, "val_loss": 6476797.0} {"train_loss": -23.863317489624023, "global_step": 196959, "epoch": 2373} {"train_loss": -22.65643882751465, "global_step": 196960, "epoch": 2373} {"train_loss": -22.575862884521484, "global_step": 196961, "epoch": 2373} {"train_loss": -23.906112670898438, "global_step": 196962, "epoch": 2373} {"train_loss": -23.226049423217773, "global_step": 196963, "epoch": 2373} {"train_loss": -23.26601219177246, "global_step": 196964, "epoch": 2373} {"train_loss": -23.28829574584961, "global_step": 196965, "epoch": 2373} {"train_loss": -24.15479278564453, "global_step": 196966, "epoch": 2373} {"train_loss": -24.150503158569336, "global_step": 196967, "epoch": 2373} {"train_loss": -23.95722198486328, "global_step": 196968, "epoch": 2373} {"train_loss": -23.51983642578125, "global_step": 196969, "epoch": 2373} {"train_loss": -23.75909996032715, "global_step": 196970, "epoch": 2373} {"train_loss": -23.92557144165039, "global_step": 196971, "epoch": 2373} {"train_loss": -23.32215690612793, "global_step": 196972, "epoch": 2373} {"train_loss": -23.69908332824707, "global_step": 196973, "epoch": 2373} {"train_loss": -23.91510772705078, "global_step": 196974, "epoch": 2373} {"train_loss": -23.905057907104492, "global_step": 196975, "epoch": 2373} {"train_loss": -24.209293365478516, "global_step": 196976, "epoch": 2373} {"train_loss": -23.797256469726562, "global_step": 196977, "epoch": 2373} {"train_loss": -23.92892074584961, "global_step": 196978, "epoch": 2373} {"train_loss": -24.0178279876709, "global_step": 196979, "epoch": 2373} {"train_loss": -23.78616714477539, "global_step": 196980, "epoch": 2373} {"train_loss": -23.881750106811523, "global_step": 196981, "epoch": 2373} {"train_loss": -24.139156341552734, "global_step": 196982, "epoch": 2373} {"train_loss": -24.06256866455078, "global_step": 196983, "epoch": 2373} {"train_loss": -23.872556686401367, "global_step": 196984, "epoch": 2373} {"train_loss": -24.21991539001465, "global_step": 196985, "epoch": 2373} {"train_loss": -23.82277488708496, "global_step": 196986, "epoch": 2373} {"train_loss": -24.269596099853516, "global_step": 196987, "epoch": 2373} {"train_loss": -23.974964141845703, "global_step": 196988, "epoch": 2373} {"train_loss": -24.192340850830078, "global_step": 196989, "epoch": 2373} {"train_loss": -23.961410522460938, "global_step": 196990, "epoch": 2373} {"train_loss": -24.321149826049805, "global_step": 196991, "epoch": 2373} {"train_loss": -24.128711700439453, "global_step": 196992, "epoch": 2373} {"train_loss": -23.8283748626709, "global_step": 196993, "epoch": 2373} {"train_loss": -24.398290634155273, "global_step": 196994, "epoch": 2373} {"train_loss": -24.37810707092285, "global_step": 196995, "epoch": 2373} {"train_loss": -24.43218994140625, "global_step": 196996, "epoch": 2373} {"train_loss": -24.21912956237793, "global_step": 196997, "epoch": 2373} {"train_loss": -23.99396324157715, "global_step": 196998, "epoch": 2373} {"train_loss": -24.17519187927246, "global_step": 196999, "epoch": 2373} {"train_loss": -24.4340763092041, "global_step": 197000, "epoch": 2373} {"train_loss": -24.269397735595703, "global_step": 197001, "epoch": 2373} {"train_loss": -24.362770080566406, "global_step": 197002, "epoch": 2373} {"train_loss": -24.28664207458496, "global_step": 197003, "epoch": 2373} {"train_loss": -24.13117027282715, "global_step": 197004, "epoch": 2373} {"train_loss": -23.95676040649414, "global_step": 197005, "epoch": 2373} {"train_loss": -24.61697769165039, "global_step": 197006, "epoch": 2373} {"train_loss": -24.3064022064209, "global_step": 197007, "epoch": 2373} {"train_loss": -24.346120834350586, "global_step": 197008, "epoch": 2373} {"train_loss": -24.464420318603516, "global_step": 197009, "epoch": 2373} {"train_loss": -24.398473739624023, "global_step": 197010, "epoch": 2373} {"train_loss": -24.01980972290039, "global_step": 197011, "epoch": 2373} {"train_loss": -24.433286666870117, "global_step": 197012, "epoch": 2373} {"train_loss": -23.9693660736084, "global_step": 197013, "epoch": 2373} {"train_loss": -24.302034378051758, "global_step": 197014, "epoch": 2373} {"train_loss": -24.17049217224121, "global_step": 197015, "epoch": 2373} {"train_loss": -24.357837677001953, "global_step": 197016, "epoch": 2373} {"train_loss": -24.104074478149414, "global_step": 197017, "epoch": 2373} {"train_loss": -24.19712257385254, "global_step": 197018, "epoch": 2373} {"train_loss": -24.027753829956055, "global_step": 197019, "epoch": 2373} {"train_loss": -24.24445152282715, "global_step": 197020, "epoch": 2373} {"train_loss": -23.909221649169922, "global_step": 197021, "epoch": 2373} {"train_loss": -24.305688858032227, "global_step": 197022, "epoch": 2373} {"train_loss": -24.497821807861328, "global_step": 197023, "epoch": 2373} {"train_loss": -24.345548629760742, "global_step": 197024, "epoch": 2373} {"train_loss": -24.510902404785156, "global_step": 197025, "epoch": 2373} {"train_loss": -24.55732536315918, "global_step": 197026, "epoch": 2373} {"train_loss": -24.143159866333008, "global_step": 197027, "epoch": 2373} {"train_loss": -24.32352066040039, "global_step": 197028, "epoch": 2373} {"train_loss": -23.87281608581543, "global_step": 197029, "epoch": 2373} {"train_loss": -24.526687622070312, "global_step": 197030, "epoch": 2373} {"train_loss": -24.55414390563965, "global_step": 197031, "epoch": 2373} {"train_loss": -24.167957305908203, "global_step": 197032, "epoch": 2373} {"train_loss": -24.07499122619629, "global_step": 197033, "epoch": 2373} {"train_loss": -24.34071159362793, "global_step": 197034, "epoch": 2373} {"train_loss": -24.045835494995117, "global_step": 197035, "epoch": 2373} {"train_loss": -24.19701385498047, "global_step": 197036, "epoch": 2373} {"train_loss": -24.077131271362305, "global_step": 197037, "epoch": 2373} {"train_loss": -24.168622970581055, "global_step": 197038, "epoch": 2373} {"train_loss": -24.438596725463867, "global_step": 197039, "epoch": 2373} {"train_loss": -24.103012084960938, "global_step": 197040, "epoch": 2373} {"train_loss": -24.073700801435724, "global_step": 197041, "epoch": 2373, "val_loss": 6604105.0} {"train_loss": -24.021390914916992, "global_step": 197042, "epoch": 2374} {"train_loss": -24.127761840820312, "global_step": 197043, "epoch": 2374} {"train_loss": -24.14740562438965, "global_step": 197044, "epoch": 2374} {"train_loss": -24.272214889526367, "global_step": 197045, "epoch": 2374} {"train_loss": -24.164472579956055, "global_step": 197046, "epoch": 2374} {"train_loss": -24.25656509399414, "global_step": 197047, "epoch": 2374} {"train_loss": -24.271299362182617, "global_step": 197048, "epoch": 2374} {"train_loss": -24.248794555664062, "global_step": 197049, "epoch": 2374} {"train_loss": -24.108299255371094, "global_step": 197050, "epoch": 2374} {"train_loss": -24.388900756835938, "global_step": 197051, "epoch": 2374} {"train_loss": -24.410720825195312, "global_step": 197052, "epoch": 2374} {"train_loss": -24.49818229675293, "global_step": 197053, "epoch": 2374} {"train_loss": -24.258686065673828, "global_step": 197054, "epoch": 2374} {"train_loss": -24.199541091918945, "global_step": 197055, "epoch": 2374} {"train_loss": -24.087413787841797, "global_step": 197056, "epoch": 2374} {"train_loss": -24.40212059020996, "global_step": 197057, "epoch": 2374} {"train_loss": -24.014484405517578, "global_step": 197058, "epoch": 2374} {"train_loss": -24.15510368347168, "global_step": 197059, "epoch": 2374} {"train_loss": -24.10630226135254, "global_step": 197060, "epoch": 2374} {"train_loss": -24.067445755004883, "global_step": 197061, "epoch": 2374} {"train_loss": -24.10377311706543, "global_step": 197062, "epoch": 2374} {"train_loss": -24.294109344482422, "global_step": 197063, "epoch": 2374} {"train_loss": -24.05824851989746, "global_step": 197064, "epoch": 2374} {"train_loss": -24.0722599029541, "global_step": 197065, "epoch": 2374} {"train_loss": -24.485118865966797, "global_step": 197066, "epoch": 2374} {"train_loss": -24.133319854736328, "global_step": 197067, "epoch": 2374} {"train_loss": -24.2832088470459, "global_step": 197068, "epoch": 2374} {"train_loss": -24.30902671813965, "global_step": 197069, "epoch": 2374} {"train_loss": -24.30061912536621, "global_step": 197070, "epoch": 2374} {"train_loss": -24.263145446777344, "global_step": 197071, "epoch": 2374} {"train_loss": -24.016258239746094, "global_step": 197072, "epoch": 2374} {"train_loss": -24.404617309570312, "global_step": 197073, "epoch": 2374} {"train_loss": -24.067224502563477, "global_step": 197074, "epoch": 2374} {"train_loss": -24.716642379760742, "global_step": 197075, "epoch": 2374} {"train_loss": -24.7088680267334, "global_step": 197076, "epoch": 2374} {"train_loss": -24.24103355407715, "global_step": 197077, "epoch": 2374} {"train_loss": -24.40744972229004, "global_step": 197078, "epoch": 2374} {"train_loss": -23.827394485473633, "global_step": 197079, "epoch": 2374} {"train_loss": -24.423494338989258, "global_step": 197080, "epoch": 2374} {"train_loss": -24.70379638671875, "global_step": 197081, "epoch": 2374} {"train_loss": -24.322599411010742, "global_step": 197082, "epoch": 2374} {"train_loss": -24.11188316345215, "global_step": 197083, "epoch": 2374} {"train_loss": -24.22739028930664, "global_step": 197084, "epoch": 2374} {"train_loss": -24.398014068603516, "global_step": 197085, "epoch": 2374} {"train_loss": -24.811689376831055, "global_step": 197086, "epoch": 2374} {"train_loss": -24.37838363647461, "global_step": 197087, "epoch": 2374} {"train_loss": -24.056354522705078, "global_step": 197088, "epoch": 2374} {"train_loss": -24.40361785888672, "global_step": 197089, "epoch": 2374} {"train_loss": -24.139862060546875, "global_step": 197090, "epoch": 2374} {"train_loss": -24.072751998901367, "global_step": 197091, "epoch": 2374} {"train_loss": -24.064924240112305, "global_step": 197092, "epoch": 2374} {"train_loss": -24.22063636779785, "global_step": 197093, "epoch": 2374} {"train_loss": -24.09168815612793, "global_step": 197094, "epoch": 2374} {"train_loss": -24.57997703552246, "global_step": 197095, "epoch": 2374} {"train_loss": -24.442028045654297, "global_step": 197096, "epoch": 2374} {"train_loss": -24.34217643737793, "global_step": 197097, "epoch": 2374} {"train_loss": -24.026479721069336, "global_step": 197098, "epoch": 2374} {"train_loss": -24.355772018432617, "global_step": 197099, "epoch": 2374} {"train_loss": -24.50745964050293, "global_step": 197100, "epoch": 2374} {"train_loss": -24.119821548461914, "global_step": 197101, "epoch": 2374} {"train_loss": -23.630666732788086, "global_step": 197102, "epoch": 2374} {"train_loss": -23.9072322845459, "global_step": 197103, "epoch": 2374} {"train_loss": -24.006343841552734, "global_step": 197104, "epoch": 2374} {"train_loss": -24.355649948120117, "global_step": 197105, "epoch": 2374} {"train_loss": -23.966466903686523, "global_step": 197106, "epoch": 2374} {"train_loss": -24.21400260925293, "global_step": 197107, "epoch": 2374} {"train_loss": -24.232851028442383, "global_step": 197108, "epoch": 2374} {"train_loss": -24.401336669921875, "global_step": 197109, "epoch": 2374} {"train_loss": -24.652503967285156, "global_step": 197110, "epoch": 2374} {"train_loss": -24.145587921142578, "global_step": 197111, "epoch": 2374} {"train_loss": -24.117950439453125, "global_step": 197112, "epoch": 2374} {"train_loss": -24.281658172607422, "global_step": 197113, "epoch": 2374} {"train_loss": -23.79402732849121, "global_step": 197114, "epoch": 2374} {"train_loss": -24.4442138671875, "global_step": 197115, "epoch": 2374} {"train_loss": -24.228288650512695, "global_step": 197116, "epoch": 2374} {"train_loss": -24.127164840698242, "global_step": 197117, "epoch": 2374} {"train_loss": -24.322330474853516, "global_step": 197118, "epoch": 2374} {"train_loss": -24.15070152282715, "global_step": 197119, "epoch": 2374} {"train_loss": -24.277996063232422, "global_step": 197120, "epoch": 2374} {"train_loss": -24.34224510192871, "global_step": 197121, "epoch": 2374} {"train_loss": -23.67043113708496, "global_step": 197122, "epoch": 2374} {"train_loss": -24.11507225036621, "global_step": 197123, "epoch": 2374} {"train_loss": -24.237205987953278, "global_step": 197124, "epoch": 2374, "val_loss": 6567476.0} {"train_loss": -23.66869354248047, "global_step": 197125, "epoch": 2375} {"train_loss": -22.703649520874023, "global_step": 197126, "epoch": 2375} {"train_loss": -23.621414184570312, "global_step": 197127, "epoch": 2375} {"train_loss": -23.583751678466797, "global_step": 197128, "epoch": 2375} {"train_loss": -23.126781463623047, "global_step": 197129, "epoch": 2375} {"train_loss": -23.567630767822266, "global_step": 197130, "epoch": 2375} {"train_loss": -23.649085998535156, "global_step": 197131, "epoch": 2375} {"train_loss": -23.57679557800293, "global_step": 197132, "epoch": 2375} {"train_loss": -23.676048278808594, "global_step": 197133, "epoch": 2375} {"train_loss": -23.9499568939209, "global_step": 197134, "epoch": 2375} {"train_loss": -23.906164169311523, "global_step": 197135, "epoch": 2375} {"train_loss": -23.655776977539062, "global_step": 197136, "epoch": 2375} {"train_loss": -24.05107879638672, "global_step": 197137, "epoch": 2375} {"train_loss": -23.770509719848633, "global_step": 197138, "epoch": 2375} {"train_loss": -24.25802993774414, "global_step": 197139, "epoch": 2375} {"train_loss": -23.900815963745117, "global_step": 197140, "epoch": 2375} {"train_loss": -23.753604888916016, "global_step": 197141, "epoch": 2375} {"train_loss": -24.00916862487793, "global_step": 197142, "epoch": 2375} {"train_loss": -23.85101318359375, "global_step": 197143, "epoch": 2375} {"train_loss": -24.144174575805664, "global_step": 197144, "epoch": 2375} {"train_loss": -23.99222755432129, "global_step": 197145, "epoch": 2375} {"train_loss": -23.545652389526367, "global_step": 197146, "epoch": 2375} {"train_loss": -24.196958541870117, "global_step": 197147, "epoch": 2375} {"train_loss": -24.171314239501953, "global_step": 197148, "epoch": 2375} {"train_loss": -24.57636833190918, "global_step": 197149, "epoch": 2375} {"train_loss": -24.242525100708008, "global_step": 197150, "epoch": 2375} {"train_loss": -23.897449493408203, "global_step": 197151, "epoch": 2375} {"train_loss": -24.02544593811035, "global_step": 197152, "epoch": 2375} {"train_loss": -23.9848575592041, "global_step": 197153, "epoch": 2375} {"train_loss": -24.035621643066406, "global_step": 197154, "epoch": 2375} {"train_loss": -24.0888729095459, "global_step": 197155, "epoch": 2375} {"train_loss": -24.478506088256836, "global_step": 197156, "epoch": 2375} {"train_loss": -24.083173751831055, "global_step": 197157, "epoch": 2375} {"train_loss": -24.044960021972656, "global_step": 197158, "epoch": 2375} {"train_loss": -24.1560115814209, "global_step": 197159, "epoch": 2375} {"train_loss": -24.059499740600586, "global_step": 197160, "epoch": 2375} {"train_loss": -24.1074161529541, "global_step": 197161, "epoch": 2375} {"train_loss": -24.5587215423584, "global_step": 197162, "epoch": 2375} {"train_loss": -24.550207138061523, "global_step": 197163, "epoch": 2375} {"train_loss": -24.4826717376709, "global_step": 197164, "epoch": 2375} {"train_loss": -23.99916648864746, "global_step": 197165, "epoch": 2375} {"train_loss": -24.514732360839844, "global_step": 197166, "epoch": 2375} {"train_loss": -24.67498016357422, "global_step": 197167, "epoch": 2375} {"train_loss": -24.320676803588867, "global_step": 197168, "epoch": 2375} {"train_loss": -24.46363067626953, "global_step": 197169, "epoch": 2375} {"train_loss": -23.690048217773438, "global_step": 197170, "epoch": 2375} {"train_loss": -24.112741470336914, "global_step": 197171, "epoch": 2375} {"train_loss": -24.062864303588867, "global_step": 197172, "epoch": 2375} {"train_loss": -24.21468162536621, "global_step": 197173, "epoch": 2375} {"train_loss": -24.43177604675293, "global_step": 197174, "epoch": 2375} {"train_loss": -24.29422950744629, "global_step": 197175, "epoch": 2375} {"train_loss": -24.64409637451172, "global_step": 197176, "epoch": 2375} {"train_loss": -24.081892013549805, "global_step": 197177, "epoch": 2375} {"train_loss": -23.99201774597168, "global_step": 197178, "epoch": 2375} {"train_loss": -24.036884307861328, "global_step": 197179, "epoch": 2375} {"train_loss": -24.248952865600586, "global_step": 197180, "epoch": 2375} {"train_loss": -24.338638305664062, "global_step": 197181, "epoch": 2375} {"train_loss": -24.098291397094727, "global_step": 197182, "epoch": 2375} {"train_loss": -23.980947494506836, "global_step": 197183, "epoch": 2375} {"train_loss": -24.47802734375, "global_step": 197184, "epoch": 2375} {"train_loss": -24.198348999023438, "global_step": 197185, "epoch": 2375} {"train_loss": -24.18120765686035, "global_step": 197186, "epoch": 2375} {"train_loss": -24.4144287109375, "global_step": 197187, "epoch": 2375} {"train_loss": -24.39515495300293, "global_step": 197188, "epoch": 2375} {"train_loss": -24.2098445892334, "global_step": 197189, "epoch": 2375} {"train_loss": -24.45418930053711, "global_step": 197190, "epoch": 2375} {"train_loss": -24.253787994384766, "global_step": 197191, "epoch": 2375} {"train_loss": -24.173110961914062, "global_step": 197192, "epoch": 2375} {"train_loss": -24.32988929748535, "global_step": 197193, "epoch": 2375} {"train_loss": -24.15099334716797, "global_step": 197194, "epoch": 2375} {"train_loss": -24.521953582763672, "global_step": 197195, "epoch": 2375} {"train_loss": -24.31964111328125, "global_step": 197196, "epoch": 2375} {"train_loss": -24.19559669494629, "global_step": 197197, "epoch": 2375} {"train_loss": -24.153257369995117, "global_step": 197198, "epoch": 2375} {"train_loss": -24.27008628845215, "global_step": 197199, "epoch": 2375} {"train_loss": -24.132802963256836, "global_step": 197200, "epoch": 2375} {"train_loss": -24.310239791870117, "global_step": 197201, "epoch": 2375} {"train_loss": -24.29659080505371, "global_step": 197202, "epoch": 2375} {"train_loss": -24.23793601989746, "global_step": 197203, "epoch": 2375} {"train_loss": -24.221158981323242, "global_step": 197204, "epoch": 2375} {"train_loss": -24.215791702270508, "global_step": 197205, "epoch": 2375} {"train_loss": -24.4453182220459, "global_step": 197206, "epoch": 2375} {"train_loss": -24.13751186232969, "global_step": 197207, "epoch": 2375, "val_loss": 6603072.5} {"train_loss": -23.70955467224121, "global_step": 197208, "epoch": 2376} {"train_loss": -23.79364013671875, "global_step": 197209, "epoch": 2376} {"train_loss": -23.939041137695312, "global_step": 197210, "epoch": 2376} {"train_loss": -24.00361442565918, "global_step": 197211, "epoch": 2376} {"train_loss": -23.99403953552246, "global_step": 197212, "epoch": 2376} {"train_loss": -24.18208885192871, "global_step": 197213, "epoch": 2376} {"train_loss": -23.980422973632812, "global_step": 197214, "epoch": 2376} {"train_loss": -23.504179000854492, "global_step": 197215, "epoch": 2376} {"train_loss": -23.92082977294922, "global_step": 197216, "epoch": 2376} {"train_loss": -23.981569290161133, "global_step": 197217, "epoch": 2376} {"train_loss": -24.155048370361328, "global_step": 197218, "epoch": 2376} {"train_loss": -24.083175659179688, "global_step": 197219, "epoch": 2376} {"train_loss": -24.669174194335938, "global_step": 197220, "epoch": 2376} {"train_loss": -23.834497451782227, "global_step": 197221, "epoch": 2376} {"train_loss": -24.0888614654541, "global_step": 197222, "epoch": 2376} {"train_loss": -24.217103958129883, "global_step": 197223, "epoch": 2376} {"train_loss": -24.141246795654297, "global_step": 197224, "epoch": 2376} {"train_loss": -24.16651153564453, "global_step": 197225, "epoch": 2376} {"train_loss": -23.981977462768555, "global_step": 197226, "epoch": 2376} {"train_loss": -24.22651481628418, "global_step": 197227, "epoch": 2376} {"train_loss": -24.253522872924805, "global_step": 197228, "epoch": 2376} {"train_loss": -23.987234115600586, "global_step": 197229, "epoch": 2376} {"train_loss": -24.164365768432617, "global_step": 197230, "epoch": 2376} {"train_loss": -24.03383445739746, "global_step": 197231, "epoch": 2376} {"train_loss": -24.52011489868164, "global_step": 197232, "epoch": 2376} {"train_loss": -24.198612213134766, "global_step": 197233, "epoch": 2376} {"train_loss": -24.441579818725586, "global_step": 197234, "epoch": 2376} {"train_loss": -24.056230545043945, "global_step": 197235, "epoch": 2376} {"train_loss": -23.79661750793457, "global_step": 197236, "epoch": 2376} {"train_loss": -24.44688606262207, "global_step": 197237, "epoch": 2376} {"train_loss": -24.309402465820312, "global_step": 197238, "epoch": 2376} {"train_loss": -24.12514305114746, "global_step": 197239, "epoch": 2376} {"train_loss": -24.237430572509766, "global_step": 197240, "epoch": 2376} {"train_loss": -24.086151123046875, "global_step": 197241, "epoch": 2376} {"train_loss": -23.921003341674805, "global_step": 197242, "epoch": 2376} {"train_loss": -24.31215476989746, "global_step": 197243, "epoch": 2376} {"train_loss": -24.051069259643555, "global_step": 197244, "epoch": 2376} {"train_loss": -24.120697021484375, "global_step": 197245, "epoch": 2376} {"train_loss": -24.3673152923584, "global_step": 197246, "epoch": 2376} {"train_loss": -24.368206024169922, "global_step": 197247, "epoch": 2376} {"train_loss": -24.478988647460938, "global_step": 197248, "epoch": 2376} {"train_loss": -24.073183059692383, "global_step": 197249, "epoch": 2376} {"train_loss": -24.016157150268555, "global_step": 197250, "epoch": 2376} {"train_loss": -24.227888107299805, "global_step": 197251, "epoch": 2376} {"train_loss": -24.100011825561523, "global_step": 197252, "epoch": 2376} {"train_loss": -24.176359176635742, "global_step": 197253, "epoch": 2376} {"train_loss": -23.935789108276367, "global_step": 197254, "epoch": 2376} {"train_loss": -24.488975524902344, "global_step": 197255, "epoch": 2376} {"train_loss": -24.329904556274414, "global_step": 197256, "epoch": 2376} {"train_loss": -24.091825485229492, "global_step": 197257, "epoch": 2376} {"train_loss": -24.18199920654297, "global_step": 197258, "epoch": 2376} {"train_loss": -24.722036361694336, "global_step": 197259, "epoch": 2376} {"train_loss": -24.253726959228516, "global_step": 197260, "epoch": 2376} {"train_loss": -24.289655685424805, "global_step": 197261, "epoch": 2376} {"train_loss": -23.368602752685547, "global_step": 197262, "epoch": 2376} {"train_loss": -24.044897079467773, "global_step": 197263, "epoch": 2376} {"train_loss": -24.104145050048828, "global_step": 197264, "epoch": 2376} {"train_loss": -24.23824119567871, "global_step": 197265, "epoch": 2376} {"train_loss": -24.150978088378906, "global_step": 197266, "epoch": 2376} {"train_loss": -24.1950740814209, "global_step": 197267, "epoch": 2376} {"train_loss": -23.79767608642578, "global_step": 197268, "epoch": 2376} {"train_loss": -23.825899124145508, "global_step": 197269, "epoch": 2376} {"train_loss": -24.455774307250977, "global_step": 197270, "epoch": 2376} {"train_loss": -24.33148956298828, "global_step": 197271, "epoch": 2376} {"train_loss": -23.539766311645508, "global_step": 197272, "epoch": 2376} {"train_loss": -23.958711624145508, "global_step": 197273, "epoch": 2376} {"train_loss": -24.256393432617188, "global_step": 197274, "epoch": 2376} {"train_loss": -24.222492218017578, "global_step": 197275, "epoch": 2376} {"train_loss": -23.955068588256836, "global_step": 197276, "epoch": 2376} {"train_loss": -24.47696876525879, "global_step": 197277, "epoch": 2376} {"train_loss": -24.33805274963379, "global_step": 197278, "epoch": 2376} {"train_loss": -24.35175895690918, "global_step": 197279, "epoch": 2376} {"train_loss": -24.148670196533203, "global_step": 197280, "epoch": 2376} {"train_loss": -24.59673500061035, "global_step": 197281, "epoch": 2376} {"train_loss": -24.16251564025879, "global_step": 197282, "epoch": 2376} {"train_loss": -24.289499282836914, "global_step": 197283, "epoch": 2376} {"train_loss": -24.446290969848633, "global_step": 197284, "epoch": 2376} {"train_loss": -24.40312957763672, "global_step": 197285, "epoch": 2376} {"train_loss": -24.26912498474121, "global_step": 197286, "epoch": 2376} {"train_loss": -24.328161239624023, "global_step": 197287, "epoch": 2376} {"train_loss": -24.23839569091797, "global_step": 197288, "epoch": 2376} {"train_loss": -24.310503005981445, "global_step": 197289, "epoch": 2376} {"train_loss": -24.173807213105352, "global_step": 197290, "epoch": 2376, "val_loss": 6674394.0} {"train_loss": -24.095300674438477, "global_step": 197291, "epoch": 2377} {"train_loss": -23.80061149597168, "global_step": 197292, "epoch": 2377} {"train_loss": -23.874685287475586, "global_step": 197293, "epoch": 2377} {"train_loss": -23.726463317871094, "global_step": 197294, "epoch": 2377} {"train_loss": -23.659332275390625, "global_step": 197295, "epoch": 2377} {"train_loss": -24.002925872802734, "global_step": 197296, "epoch": 2377} {"train_loss": -23.99988555908203, "global_step": 197297, "epoch": 2377} {"train_loss": -23.758684158325195, "global_step": 197298, "epoch": 2377} {"train_loss": -24.2937068939209, "global_step": 197299, "epoch": 2377} {"train_loss": -24.028669357299805, "global_step": 197300, "epoch": 2377} {"train_loss": -24.30214500427246, "global_step": 197301, "epoch": 2377} {"train_loss": -24.124902725219727, "global_step": 197302, "epoch": 2377} {"train_loss": -24.086023330688477, "global_step": 197303, "epoch": 2377} {"train_loss": -24.107954025268555, "global_step": 197304, "epoch": 2377} {"train_loss": -23.856430053710938, "global_step": 197305, "epoch": 2377} {"train_loss": -23.609813690185547, "global_step": 197306, "epoch": 2377} {"train_loss": -24.243122100830078, "global_step": 197307, "epoch": 2377} {"train_loss": -24.092594146728516, "global_step": 197308, "epoch": 2377} {"train_loss": -23.998640060424805, "global_step": 197309, "epoch": 2377} {"train_loss": -24.16944694519043, "global_step": 197310, "epoch": 2377} {"train_loss": -24.059913635253906, "global_step": 197311, "epoch": 2377} {"train_loss": -24.595657348632812, "global_step": 197312, "epoch": 2377} {"train_loss": -23.98835563659668, "global_step": 197313, "epoch": 2377} {"train_loss": -24.02724266052246, "global_step": 197314, "epoch": 2377} {"train_loss": -23.73737144470215, "global_step": 197315, "epoch": 2377} {"train_loss": -24.443944931030273, "global_step": 197316, "epoch": 2377} {"train_loss": -23.92633056640625, "global_step": 197317, "epoch": 2377} {"train_loss": -24.04413414001465, "global_step": 197318, "epoch": 2377} {"train_loss": -24.124189376831055, "global_step": 197319, "epoch": 2377} {"train_loss": -24.237293243408203, "global_step": 197320, "epoch": 2377} {"train_loss": -24.173240661621094, "global_step": 197321, "epoch": 2377} {"train_loss": -24.182096481323242, "global_step": 197322, "epoch": 2377} {"train_loss": -24.27031135559082, "global_step": 197323, "epoch": 2377} {"train_loss": -24.43897819519043, "global_step": 197324, "epoch": 2377} {"train_loss": -24.384077072143555, "global_step": 197325, "epoch": 2377} {"train_loss": -24.342243194580078, "global_step": 197326, "epoch": 2377} {"train_loss": -24.394309997558594, "global_step": 197327, "epoch": 2377} {"train_loss": -24.147695541381836, "global_step": 197328, "epoch": 2377} {"train_loss": -24.08893394470215, "global_step": 197329, "epoch": 2377} {"train_loss": -24.251798629760742, "global_step": 197330, "epoch": 2377} {"train_loss": -24.205184936523438, "global_step": 197331, "epoch": 2377} {"train_loss": -24.027671813964844, "global_step": 197332, "epoch": 2377} {"train_loss": -24.20232582092285, "global_step": 197333, "epoch": 2377} {"train_loss": -24.164525985717773, "global_step": 197334, "epoch": 2377} {"train_loss": -24.42610740661621, "global_step": 197335, "epoch": 2377} {"train_loss": -24.050342559814453, "global_step": 197336, "epoch": 2377} {"train_loss": -24.446491241455078, "global_step": 197337, "epoch": 2377} {"train_loss": -24.151838302612305, "global_step": 197338, "epoch": 2377} {"train_loss": -24.48101806640625, "global_step": 197339, "epoch": 2377} {"train_loss": -24.462162017822266, "global_step": 197340, "epoch": 2377} {"train_loss": -24.082134246826172, "global_step": 197341, "epoch": 2377} {"train_loss": -24.016584396362305, "global_step": 197342, "epoch": 2377} {"train_loss": -24.16961669921875, "global_step": 197343, "epoch": 2377} {"train_loss": -24.52534294128418, "global_step": 197344, "epoch": 2377} {"train_loss": -24.439199447631836, "global_step": 197345, "epoch": 2377} {"train_loss": -24.592876434326172, "global_step": 197346, "epoch": 2377} {"train_loss": -24.493318557739258, "global_step": 197347, "epoch": 2377} {"train_loss": -24.328733444213867, "global_step": 197348, "epoch": 2377} {"train_loss": -24.092248916625977, "global_step": 197349, "epoch": 2377} {"train_loss": -24.221097946166992, "global_step": 197350, "epoch": 2377} {"train_loss": -23.7053279876709, "global_step": 197351, "epoch": 2377} {"train_loss": -23.70146942138672, "global_step": 197352, "epoch": 2377} {"train_loss": -23.524038314819336, "global_step": 197353, "epoch": 2377} {"train_loss": -24.172836303710938, "global_step": 197354, "epoch": 2377} {"train_loss": -23.940343856811523, "global_step": 197355, "epoch": 2377} {"train_loss": -23.85432243347168, "global_step": 197356, "epoch": 2377} {"train_loss": -24.01264762878418, "global_step": 197357, "epoch": 2377} {"train_loss": -24.1428279876709, "global_step": 197358, "epoch": 2377} {"train_loss": -24.089128494262695, "global_step": 197359, "epoch": 2377} {"train_loss": -24.0068416595459, "global_step": 197360, "epoch": 2377} {"train_loss": -23.876211166381836, "global_step": 197361, "epoch": 2377} {"train_loss": -24.14664649963379, "global_step": 197362, "epoch": 2377} {"train_loss": -24.19080924987793, "global_step": 197363, "epoch": 2377} {"train_loss": -24.224035263061523, "global_step": 197364, "epoch": 2377} {"train_loss": -23.849035263061523, "global_step": 197365, "epoch": 2377} {"train_loss": -24.33026695251465, "global_step": 197366, "epoch": 2377} {"train_loss": -24.068405151367188, "global_step": 197367, "epoch": 2377} {"train_loss": -23.974538803100586, "global_step": 197368, "epoch": 2377} {"train_loss": -24.102645874023438, "global_step": 197369, "epoch": 2377} {"train_loss": -24.14993667602539, "global_step": 197370, "epoch": 2377} {"train_loss": -24.08192253112793, "global_step": 197371, "epoch": 2377} {"train_loss": -24.241050720214844, "global_step": 197372, "epoch": 2377} {"train_loss": -24.11341965916645, "global_step": 197373, "epoch": 2377, "val_loss": 6587608.0} {"train_loss": -23.675527572631836, "global_step": 197374, "epoch": 2378} {"train_loss": -23.651060104370117, "global_step": 197375, "epoch": 2378} {"train_loss": -23.69715690612793, "global_step": 197376, "epoch": 2378} {"train_loss": -23.900501251220703, "global_step": 197377, "epoch": 2378} {"train_loss": -23.8863468170166, "global_step": 197378, "epoch": 2378} {"train_loss": -23.78394317626953, "global_step": 197379, "epoch": 2378} {"train_loss": -23.65226173400879, "global_step": 197380, "epoch": 2378} {"train_loss": -23.828819274902344, "global_step": 197381, "epoch": 2378} {"train_loss": -24.19002342224121, "global_step": 197382, "epoch": 2378} {"train_loss": -23.948192596435547, "global_step": 197383, "epoch": 2378} {"train_loss": -23.88437843322754, "global_step": 197384, "epoch": 2378} {"train_loss": -24.094356536865234, "global_step": 197385, "epoch": 2378} {"train_loss": -24.009052276611328, "global_step": 197386, "epoch": 2378} {"train_loss": -24.301971435546875, "global_step": 197387, "epoch": 2378} {"train_loss": -23.7937068939209, "global_step": 197388, "epoch": 2378} {"train_loss": -23.94746971130371, "global_step": 197389, "epoch": 2378} {"train_loss": -24.42220115661621, "global_step": 197390, "epoch": 2378} {"train_loss": -24.732755661010742, "global_step": 197391, "epoch": 2378} {"train_loss": -23.91190528869629, "global_step": 197392, "epoch": 2378} {"train_loss": -24.473072052001953, "global_step": 197393, "epoch": 2378} {"train_loss": -24.234312057495117, "global_step": 197394, "epoch": 2378} {"train_loss": -24.674592971801758, "global_step": 197395, "epoch": 2378} {"train_loss": -24.13017463684082, "global_step": 197396, "epoch": 2378} {"train_loss": -24.480735778808594, "global_step": 197397, "epoch": 2378} {"train_loss": -23.941617965698242, "global_step": 197398, "epoch": 2378} {"train_loss": -24.224912643432617, "global_step": 197399, "epoch": 2378} {"train_loss": -24.654521942138672, "global_step": 197400, "epoch": 2378} {"train_loss": -23.889118194580078, "global_step": 197401, "epoch": 2378} {"train_loss": -23.966691970825195, "global_step": 197402, "epoch": 2378} {"train_loss": -24.170108795166016, "global_step": 197403, "epoch": 2378} {"train_loss": -24.101476669311523, "global_step": 197404, "epoch": 2378} {"train_loss": -23.961181640625, "global_step": 197405, "epoch": 2378} {"train_loss": -24.63246726989746, "global_step": 197406, "epoch": 2378} {"train_loss": -24.46006202697754, "global_step": 197407, "epoch": 2378} {"train_loss": -24.201000213623047, "global_step": 197408, "epoch": 2378} {"train_loss": -24.36270523071289, "global_step": 197409, "epoch": 2378} {"train_loss": -23.85942268371582, "global_step": 197410, "epoch": 2378} {"train_loss": -24.539152145385742, "global_step": 197411, "epoch": 2378} {"train_loss": -24.56960105895996, "global_step": 197412, "epoch": 2378} {"train_loss": -24.261320114135742, "global_step": 197413, "epoch": 2378} {"train_loss": -24.092512130737305, "global_step": 197414, "epoch": 2378} {"train_loss": -24.01978874206543, "global_step": 197415, "epoch": 2378} {"train_loss": -24.56900978088379, "global_step": 197416, "epoch": 2378} {"train_loss": -24.089277267456055, "global_step": 197417, "epoch": 2378} {"train_loss": -24.22252082824707, "global_step": 197418, "epoch": 2378} {"train_loss": -24.03029441833496, "global_step": 197419, "epoch": 2378} {"train_loss": -24.339879989624023, "global_step": 197420, "epoch": 2378} {"train_loss": -23.9676456451416, "global_step": 197421, "epoch": 2378} {"train_loss": -24.090030670166016, "global_step": 197422, "epoch": 2378} {"train_loss": -24.28495979309082, "global_step": 197423, "epoch": 2378} {"train_loss": -24.390884399414062, "global_step": 197424, "epoch": 2378} {"train_loss": -24.485675811767578, "global_step": 197425, "epoch": 2378} {"train_loss": -24.150421142578125, "global_step": 197426, "epoch": 2378} {"train_loss": -24.05595588684082, "global_step": 197427, "epoch": 2378} {"train_loss": -24.420150756835938, "global_step": 197428, "epoch": 2378} {"train_loss": -24.14162254333496, "global_step": 197429, "epoch": 2378} {"train_loss": -24.477787017822266, "global_step": 197430, "epoch": 2378} {"train_loss": -24.2625789642334, "global_step": 197431, "epoch": 2378} {"train_loss": -24.250085830688477, "global_step": 197432, "epoch": 2378} {"train_loss": -24.206022262573242, "global_step": 197433, "epoch": 2378} {"train_loss": -24.47754669189453, "global_step": 197434, "epoch": 2378} {"train_loss": -23.98958396911621, "global_step": 197435, "epoch": 2378} {"train_loss": -24.46009063720703, "global_step": 197436, "epoch": 2378} {"train_loss": -24.27054214477539, "global_step": 197437, "epoch": 2378} {"train_loss": -24.395109176635742, "global_step": 197438, "epoch": 2378} {"train_loss": -24.181943893432617, "global_step": 197439, "epoch": 2378} {"train_loss": -24.43280601501465, "global_step": 197440, "epoch": 2378} {"train_loss": -24.148405075073242, "global_step": 197441, "epoch": 2378} {"train_loss": -24.398712158203125, "global_step": 197442, "epoch": 2378} {"train_loss": -24.3975772857666, "global_step": 197443, "epoch": 2378} {"train_loss": -24.50684928894043, "global_step": 197444, "epoch": 2378} {"train_loss": -24.277311325073242, "global_step": 197445, "epoch": 2378} {"train_loss": -24.409570693969727, "global_step": 197446, "epoch": 2378} {"train_loss": -24.240997314453125, "global_step": 197447, "epoch": 2378} {"train_loss": -24.187129974365234, "global_step": 197448, "epoch": 2378} {"train_loss": -24.352991104125977, "global_step": 197449, "epoch": 2378} {"train_loss": -24.32454490661621, "global_step": 197450, "epoch": 2378} {"train_loss": -24.382104873657227, "global_step": 197451, "epoch": 2378} {"train_loss": -23.978879928588867, "global_step": 197452, "epoch": 2378} {"train_loss": -23.884004592895508, "global_step": 197453, "epoch": 2378} {"train_loss": -24.097681045532227, "global_step": 197454, "epoch": 2378} {"train_loss": -24.582218170166016, "global_step": 197455, "epoch": 2378} {"train_loss": -24.190324714384882, "global_step": 197456, "epoch": 2378, "val_loss": 6597657.5} {"train_loss": -23.843759536743164, "global_step": 197457, "epoch": 2379} {"train_loss": -23.031930923461914, "global_step": 197458, "epoch": 2379} {"train_loss": -23.980024337768555, "global_step": 197459, "epoch": 2379} {"train_loss": -23.481338500976562, "global_step": 197460, "epoch": 2379} {"train_loss": -23.766036987304688, "global_step": 197461, "epoch": 2379} {"train_loss": -23.3203125, "global_step": 197462, "epoch": 2379} {"train_loss": -23.674924850463867, "global_step": 197463, "epoch": 2379} {"train_loss": -23.84415054321289, "global_step": 197464, "epoch": 2379} {"train_loss": -23.716886520385742, "global_step": 197465, "epoch": 2379} {"train_loss": -23.85477638244629, "global_step": 197466, "epoch": 2379} {"train_loss": -23.832599639892578, "global_step": 197467, "epoch": 2379} {"train_loss": -23.662771224975586, "global_step": 197468, "epoch": 2379} {"train_loss": -23.847028732299805, "global_step": 197469, "epoch": 2379} {"train_loss": -23.614168167114258, "global_step": 197470, "epoch": 2379} {"train_loss": -24.072093963623047, "global_step": 197471, "epoch": 2379} {"train_loss": -23.967687606811523, "global_step": 197472, "epoch": 2379} {"train_loss": -23.916873931884766, "global_step": 197473, "epoch": 2379} {"train_loss": -24.210744857788086, "global_step": 197474, "epoch": 2379} {"train_loss": -23.88057518005371, "global_step": 197475, "epoch": 2379} {"train_loss": -23.892581939697266, "global_step": 197476, "epoch": 2379} {"train_loss": -24.055709838867188, "global_step": 197477, "epoch": 2379} {"train_loss": -23.903615951538086, "global_step": 197478, "epoch": 2379} {"train_loss": -24.206893920898438, "global_step": 197479, "epoch": 2379} {"train_loss": -23.94434928894043, "global_step": 197480, "epoch": 2379} {"train_loss": -23.863401412963867, "global_step": 197481, "epoch": 2379} {"train_loss": -23.914133071899414, "global_step": 197482, "epoch": 2379} {"train_loss": -24.09291648864746, "global_step": 197483, "epoch": 2379} {"train_loss": -24.03101921081543, "global_step": 197484, "epoch": 2379} {"train_loss": -23.792905807495117, "global_step": 197485, "epoch": 2379} {"train_loss": -24.326696395874023, "global_step": 197486, "epoch": 2379} {"train_loss": -24.193552017211914, "global_step": 197487, "epoch": 2379} {"train_loss": -24.04315757751465, "global_step": 197488, "epoch": 2379} {"train_loss": -24.487380981445312, "global_step": 197489, "epoch": 2379} {"train_loss": -24.588842391967773, "global_step": 197490, "epoch": 2379} {"train_loss": -23.794431686401367, "global_step": 197491, "epoch": 2379} {"train_loss": -23.943017959594727, "global_step": 197492, "epoch": 2379} {"train_loss": -24.06496238708496, "global_step": 197493, "epoch": 2379} {"train_loss": -24.221071243286133, "global_step": 197494, "epoch": 2379} {"train_loss": -24.115005493164062, "global_step": 197495, "epoch": 2379} {"train_loss": -24.469839096069336, "global_step": 197496, "epoch": 2379} {"train_loss": -24.381547927856445, "global_step": 197497, "epoch": 2379} {"train_loss": -24.31161880493164, "global_step": 197498, "epoch": 2379} {"train_loss": -24.25593376159668, "global_step": 197499, "epoch": 2379} {"train_loss": -24.26206398010254, "global_step": 197500, "epoch": 2379} {"train_loss": -24.306438446044922, "global_step": 197501, "epoch": 2379} {"train_loss": -23.98988914489746, "global_step": 197502, "epoch": 2379} {"train_loss": -24.153722763061523, "global_step": 197503, "epoch": 2379} {"train_loss": -24.273595809936523, "global_step": 197504, "epoch": 2379} {"train_loss": -24.46525001525879, "global_step": 197505, "epoch": 2379} {"train_loss": -23.894250869750977, "global_step": 197506, "epoch": 2379} {"train_loss": -24.585830688476562, "global_step": 197507, "epoch": 2379} {"train_loss": -24.655445098876953, "global_step": 197508, "epoch": 2379} {"train_loss": -24.285531997680664, "global_step": 197509, "epoch": 2379} {"train_loss": -24.040571212768555, "global_step": 197510, "epoch": 2379} {"train_loss": -23.96531105041504, "global_step": 197511, "epoch": 2379} {"train_loss": -24.4165096282959, "global_step": 197512, "epoch": 2379} {"train_loss": -24.545499801635742, "global_step": 197513, "epoch": 2379} {"train_loss": -24.21548843383789, "global_step": 197514, "epoch": 2379} {"train_loss": -24.1859130859375, "global_step": 197515, "epoch": 2379} {"train_loss": -24.11789894104004, "global_step": 197516, "epoch": 2379} {"train_loss": -24.408193588256836, "global_step": 197517, "epoch": 2379} {"train_loss": -24.15752410888672, "global_step": 197518, "epoch": 2379} {"train_loss": -24.516651153564453, "global_step": 197519, "epoch": 2379} {"train_loss": -23.99432945251465, "global_step": 197520, "epoch": 2379} {"train_loss": -24.671354293823242, "global_step": 197521, "epoch": 2379} {"train_loss": -23.984867095947266, "global_step": 197522, "epoch": 2379} {"train_loss": -24.16107749938965, "global_step": 197523, "epoch": 2379} {"train_loss": -24.2279109954834, "global_step": 197524, "epoch": 2379} {"train_loss": -24.55304718017578, "global_step": 197525, "epoch": 2379} {"train_loss": -24.27949333190918, "global_step": 197526, "epoch": 2379} {"train_loss": -24.670637130737305, "global_step": 197527, "epoch": 2379} {"train_loss": -24.447744369506836, "global_step": 197528, "epoch": 2379} {"train_loss": -24.295936584472656, "global_step": 197529, "epoch": 2379} {"train_loss": -24.467519760131836, "global_step": 197530, "epoch": 2379} {"train_loss": -24.284711837768555, "global_step": 197531, "epoch": 2379} {"train_loss": -23.96106719970703, "global_step": 197532, "epoch": 2379} {"train_loss": -24.331192016601562, "global_step": 197533, "epoch": 2379} {"train_loss": -24.150859832763672, "global_step": 197534, "epoch": 2379} {"train_loss": -24.73438262939453, "global_step": 197535, "epoch": 2379} {"train_loss": -23.923913955688477, "global_step": 197536, "epoch": 2379} {"train_loss": -24.141162872314453, "global_step": 197537, "epoch": 2379} {"train_loss": -24.591123580932617, "global_step": 197538, "epoch": 2379} {"train_loss": -24.117214869303876, "global_step": 197539, "epoch": 2379, "val_loss": 6716908.5} {"train_loss": -23.74736213684082, "global_step": 197540, "epoch": 2380} {"train_loss": -24.0109806060791, "global_step": 197541, "epoch": 2380} {"train_loss": -23.909637451171875, "global_step": 197542, "epoch": 2380} {"train_loss": -23.979223251342773, "global_step": 197543, "epoch": 2380} {"train_loss": -23.813451766967773, "global_step": 197544, "epoch": 2380} {"train_loss": -24.101892471313477, "global_step": 197545, "epoch": 2380} {"train_loss": -23.906309127807617, "global_step": 197546, "epoch": 2380} {"train_loss": -23.90141487121582, "global_step": 197547, "epoch": 2380} {"train_loss": -23.937015533447266, "global_step": 197548, "epoch": 2380} {"train_loss": -24.232131958007812, "global_step": 197549, "epoch": 2380} {"train_loss": -24.08721351623535, "global_step": 197550, "epoch": 2380} {"train_loss": -23.83767318725586, "global_step": 197551, "epoch": 2380} {"train_loss": -23.964277267456055, "global_step": 197552, "epoch": 2380} {"train_loss": -24.256071090698242, "global_step": 197553, "epoch": 2380} {"train_loss": -23.706523895263672, "global_step": 197554, "epoch": 2380} {"train_loss": -24.562763214111328, "global_step": 197555, "epoch": 2380} {"train_loss": -23.77859878540039, "global_step": 197556, "epoch": 2380} {"train_loss": -23.558996200561523, "global_step": 197557, "epoch": 2380} {"train_loss": -24.44161033630371, "global_step": 197558, "epoch": 2380} {"train_loss": -23.993749618530273, "global_step": 197559, "epoch": 2380} {"train_loss": -24.20550537109375, "global_step": 197560, "epoch": 2380} {"train_loss": -24.303668975830078, "global_step": 197561, "epoch": 2380} {"train_loss": -24.023740768432617, "global_step": 197562, "epoch": 2380} {"train_loss": -24.24173927307129, "global_step": 197563, "epoch": 2380} {"train_loss": -23.908111572265625, "global_step": 197564, "epoch": 2380} {"train_loss": -24.15502166748047, "global_step": 197565, "epoch": 2380} {"train_loss": -23.878345489501953, "global_step": 197566, "epoch": 2380} {"train_loss": -23.715072631835938, "global_step": 197567, "epoch": 2380} {"train_loss": -23.96441650390625, "global_step": 197568, "epoch": 2380} {"train_loss": -24.057876586914062, "global_step": 197569, "epoch": 2380} {"train_loss": -24.1719970703125, "global_step": 197570, "epoch": 2380} {"train_loss": -23.909833908081055, "global_step": 197571, "epoch": 2380} {"train_loss": -24.066091537475586, "global_step": 197572, "epoch": 2380} {"train_loss": -24.187923431396484, "global_step": 197573, "epoch": 2380} {"train_loss": -24.546470642089844, "global_step": 197574, "epoch": 2380} {"train_loss": -24.01294708251953, "global_step": 197575, "epoch": 2380} {"train_loss": -24.40309715270996, "global_step": 197576, "epoch": 2380} {"train_loss": -23.984769821166992, "global_step": 197577, "epoch": 2380} {"train_loss": -24.18642234802246, "global_step": 197578, "epoch": 2380} {"train_loss": -24.053354263305664, "global_step": 197579, "epoch": 2380} {"train_loss": -24.055923461914062, "global_step": 197580, "epoch": 2380} {"train_loss": -24.250802993774414, "global_step": 197581, "epoch": 2380} {"train_loss": -23.970691680908203, "global_step": 197582, "epoch": 2380} {"train_loss": -24.19675064086914, "global_step": 197583, "epoch": 2380} {"train_loss": -24.33847427368164, "global_step": 197584, "epoch": 2380} {"train_loss": -24.23958396911621, "global_step": 197585, "epoch": 2380} {"train_loss": -23.910444259643555, "global_step": 197586, "epoch": 2380} {"train_loss": -23.864782333374023, "global_step": 197587, "epoch": 2380} {"train_loss": -23.996408462524414, "global_step": 197588, "epoch": 2380} {"train_loss": -24.307912826538086, "global_step": 197589, "epoch": 2380} {"train_loss": -23.657390594482422, "global_step": 197590, "epoch": 2380} {"train_loss": -24.29798698425293, "global_step": 197591, "epoch": 2380} {"train_loss": -24.49738883972168, "global_step": 197592, "epoch": 2380} {"train_loss": -24.23512077331543, "global_step": 197593, "epoch": 2380} {"train_loss": -24.057069778442383, "global_step": 197594, "epoch": 2380} {"train_loss": -24.009111404418945, "global_step": 197595, "epoch": 2380} {"train_loss": -23.829023361206055, "global_step": 197596, "epoch": 2380} {"train_loss": -24.25922966003418, "global_step": 197597, "epoch": 2380} {"train_loss": -24.243080139160156, "global_step": 197598, "epoch": 2380} {"train_loss": -24.067380905151367, "global_step": 197599, "epoch": 2380} {"train_loss": -24.30768394470215, "global_step": 197600, "epoch": 2380} {"train_loss": -23.90467643737793, "global_step": 197601, "epoch": 2380} {"train_loss": -24.086503982543945, "global_step": 197602, "epoch": 2380} {"train_loss": -24.258913040161133, "global_step": 197603, "epoch": 2380} {"train_loss": -24.364456176757812, "global_step": 197604, "epoch": 2380} {"train_loss": -24.03291130065918, "global_step": 197605, "epoch": 2380} {"train_loss": -24.535659790039062, "global_step": 197606, "epoch": 2380} {"train_loss": -24.203271865844727, "global_step": 197607, "epoch": 2380} {"train_loss": -24.48249626159668, "global_step": 197608, "epoch": 2380} {"train_loss": -24.495508193969727, "global_step": 197609, "epoch": 2380} {"train_loss": -24.728586196899414, "global_step": 197610, "epoch": 2380} {"train_loss": -24.618080139160156, "global_step": 197611, "epoch": 2380} {"train_loss": -24.167911529541016, "global_step": 197612, "epoch": 2380} {"train_loss": -24.363662719726562, "global_step": 197613, "epoch": 2380} {"train_loss": -24.296186447143555, "global_step": 197614, "epoch": 2380} {"train_loss": -23.912683486938477, "global_step": 197615, "epoch": 2380} {"train_loss": -23.80940055847168, "global_step": 197616, "epoch": 2380} {"train_loss": -24.297012329101562, "global_step": 197617, "epoch": 2380} {"train_loss": -24.071332931518555, "global_step": 197618, "epoch": 2380} {"train_loss": -23.759830474853516, "global_step": 197619, "epoch": 2380} {"train_loss": -23.43865203857422, "global_step": 197620, "epoch": 2380} {"train_loss": -24.191349029541016, "global_step": 197621, "epoch": 2380} {"train_loss": -24.108105142432525, "global_step": 197622, "epoch": 2380, "val_loss": 6692638.0} {"train_loss": -23.452802658081055, "global_step": 197623, "epoch": 2381} {"train_loss": -23.68155288696289, "global_step": 197624, "epoch": 2381} {"train_loss": -23.12233543395996, "global_step": 197625, "epoch": 2381} {"train_loss": -23.923559188842773, "global_step": 197626, "epoch": 2381} {"train_loss": -23.643285751342773, "global_step": 197627, "epoch": 2381} {"train_loss": -23.78174591064453, "global_step": 197628, "epoch": 2381} {"train_loss": -24.081710815429688, "global_step": 197629, "epoch": 2381} {"train_loss": -23.330841064453125, "global_step": 197630, "epoch": 2381} {"train_loss": -23.627538681030273, "global_step": 197631, "epoch": 2381} {"train_loss": -23.99948501586914, "global_step": 197632, "epoch": 2381} {"train_loss": -23.702796936035156, "global_step": 197633, "epoch": 2381} {"train_loss": -24.11328887939453, "global_step": 197634, "epoch": 2381} {"train_loss": -23.991352081298828, "global_step": 197635, "epoch": 2381} {"train_loss": -23.625246047973633, "global_step": 197636, "epoch": 2381} {"train_loss": -23.633380889892578, "global_step": 197637, "epoch": 2381} {"train_loss": -24.051237106323242, "global_step": 197638, "epoch": 2381} {"train_loss": -24.117694854736328, "global_step": 197639, "epoch": 2381} {"train_loss": -24.041950225830078, "global_step": 197640, "epoch": 2381} {"train_loss": -23.8292293548584, "global_step": 197641, "epoch": 2381} {"train_loss": -24.09942054748535, "global_step": 197642, "epoch": 2381} {"train_loss": -24.230186462402344, "global_step": 197643, "epoch": 2381} {"train_loss": -24.419601440429688, "global_step": 197644, "epoch": 2381} {"train_loss": -24.34946060180664, "global_step": 197645, "epoch": 2381} {"train_loss": -24.209068298339844, "global_step": 197646, "epoch": 2381} {"train_loss": -24.239486694335938, "global_step": 197647, "epoch": 2381} {"train_loss": -24.318044662475586, "global_step": 197648, "epoch": 2381} {"train_loss": -24.24537467956543, "global_step": 197649, "epoch": 2381} {"train_loss": -23.89400291442871, "global_step": 197650, "epoch": 2381} {"train_loss": -24.15834617614746, "global_step": 197651, "epoch": 2381} {"train_loss": -23.895193099975586, "global_step": 197652, "epoch": 2381} {"train_loss": -24.341703414916992, "global_step": 197653, "epoch": 2381} {"train_loss": -24.15458106994629, "global_step": 197654, "epoch": 2381} {"train_loss": -24.3258113861084, "global_step": 197655, "epoch": 2381} {"train_loss": -24.50084686279297, "global_step": 197656, "epoch": 2381} {"train_loss": -24.023656845092773, "global_step": 197657, "epoch": 2381} {"train_loss": -24.340585708618164, "global_step": 197658, "epoch": 2381} {"train_loss": -24.170331954956055, "global_step": 197659, "epoch": 2381} {"train_loss": -24.0862979888916, "global_step": 197660, "epoch": 2381} {"train_loss": -24.65413475036621, "global_step": 197661, "epoch": 2381} {"train_loss": -24.24818229675293, "global_step": 197662, "epoch": 2381} {"train_loss": -24.2348575592041, "global_step": 197663, "epoch": 2381} {"train_loss": -23.962560653686523, "global_step": 197664, "epoch": 2381} {"train_loss": -24.65361785888672, "global_step": 197665, "epoch": 2381} {"train_loss": -24.02686882019043, "global_step": 197666, "epoch": 2381} {"train_loss": -24.396474838256836, "global_step": 197667, "epoch": 2381} {"train_loss": -24.556339263916016, "global_step": 197668, "epoch": 2381} {"train_loss": -24.091337203979492, "global_step": 197669, "epoch": 2381} {"train_loss": -24.28237533569336, "global_step": 197670, "epoch": 2381} {"train_loss": -24.248538970947266, "global_step": 197671, "epoch": 2381} {"train_loss": -24.652156829833984, "global_step": 197672, "epoch": 2381} {"train_loss": -24.19650650024414, "global_step": 197673, "epoch": 2381} {"train_loss": -24.337133407592773, "global_step": 197674, "epoch": 2381} {"train_loss": -24.298616409301758, "global_step": 197675, "epoch": 2381} {"train_loss": -24.175947189331055, "global_step": 197676, "epoch": 2381} {"train_loss": -24.337987899780273, "global_step": 197677, "epoch": 2381} {"train_loss": -24.115764617919922, "global_step": 197678, "epoch": 2381} {"train_loss": -24.121109008789062, "global_step": 197679, "epoch": 2381} {"train_loss": -24.433080673217773, "global_step": 197680, "epoch": 2381} {"train_loss": -24.31019401550293, "global_step": 197681, "epoch": 2381} {"train_loss": -24.3867130279541, "global_step": 197682, "epoch": 2381} {"train_loss": -24.37354850769043, "global_step": 197683, "epoch": 2381} {"train_loss": -24.1947021484375, "global_step": 197684, "epoch": 2381} {"train_loss": -24.469961166381836, "global_step": 197685, "epoch": 2381} {"train_loss": -24.160919189453125, "global_step": 197686, "epoch": 2381} {"train_loss": -23.984107971191406, "global_step": 197687, "epoch": 2381} {"train_loss": -23.8848819732666, "global_step": 197688, "epoch": 2381} {"train_loss": -23.954517364501953, "global_step": 197689, "epoch": 2381} {"train_loss": -24.54612922668457, "global_step": 197690, "epoch": 2381} {"train_loss": -24.38277816772461, "global_step": 197691, "epoch": 2381} {"train_loss": -24.56731414794922, "global_step": 197692, "epoch": 2381} {"train_loss": -24.097715377807617, "global_step": 197693, "epoch": 2381} {"train_loss": -23.97286033630371, "global_step": 197694, "epoch": 2381} {"train_loss": -23.91608238220215, "global_step": 197695, "epoch": 2381} {"train_loss": -24.08261489868164, "global_step": 197696, "epoch": 2381} {"train_loss": -24.233182907104492, "global_step": 197697, "epoch": 2381} {"train_loss": -24.010181427001953, "global_step": 197698, "epoch": 2381} {"train_loss": -24.353242874145508, "global_step": 197699, "epoch": 2381} {"train_loss": -24.446630477905273, "global_step": 197700, "epoch": 2381} {"train_loss": -24.052309036254883, "global_step": 197701, "epoch": 2381} {"train_loss": -24.2119197845459, "global_step": 197702, "epoch": 2381} {"train_loss": -24.38216209411621, "global_step": 197703, "epoch": 2381} {"train_loss": -24.273971557617188, "global_step": 197704, "epoch": 2381} {"train_loss": -24.10866578803005, "global_step": 197705, "epoch": 2381, "val_loss": 6425351.0} {"train_loss": -23.723236083984375, "global_step": 197706, "epoch": 2382} {"train_loss": -24.13910484313965, "global_step": 197707, "epoch": 2382} {"train_loss": -23.72696304321289, "global_step": 197708, "epoch": 2382} {"train_loss": -23.85938262939453, "global_step": 197709, "epoch": 2382} {"train_loss": -23.92801856994629, "global_step": 197710, "epoch": 2382} {"train_loss": -23.96565055847168, "global_step": 197711, "epoch": 2382} {"train_loss": -23.784269332885742, "global_step": 197712, "epoch": 2382} {"train_loss": -23.494230270385742, "global_step": 197713, "epoch": 2382} {"train_loss": -23.920347213745117, "global_step": 197714, "epoch": 2382} {"train_loss": -24.12879180908203, "global_step": 197715, "epoch": 2382} {"train_loss": -23.779966354370117, "global_step": 197716, "epoch": 2382} {"train_loss": -23.618398666381836, "global_step": 197717, "epoch": 2382} {"train_loss": -24.014524459838867, "global_step": 197718, "epoch": 2382} {"train_loss": -23.965564727783203, "global_step": 197719, "epoch": 2382} {"train_loss": -23.590002059936523, "global_step": 197720, "epoch": 2382} {"train_loss": -24.203475952148438, "global_step": 197721, "epoch": 2382} {"train_loss": -23.73676109313965, "global_step": 197722, "epoch": 2382} {"train_loss": -23.866422653198242, "global_step": 197723, "epoch": 2382} {"train_loss": -24.164737701416016, "global_step": 197724, "epoch": 2382} {"train_loss": -24.09149742126465, "global_step": 197725, "epoch": 2382} {"train_loss": -24.08479881286621, "global_step": 197726, "epoch": 2382} {"train_loss": -24.05866241455078, "global_step": 197727, "epoch": 2382} {"train_loss": -24.3758544921875, "global_step": 197728, "epoch": 2382} {"train_loss": -24.13617515563965, "global_step": 197729, "epoch": 2382} {"train_loss": -24.018146514892578, "global_step": 197730, "epoch": 2382} {"train_loss": -24.412765502929688, "global_step": 197731, "epoch": 2382} {"train_loss": -24.173259735107422, "global_step": 197732, "epoch": 2382} {"train_loss": -24.03217887878418, "global_step": 197733, "epoch": 2382} {"train_loss": -23.976316452026367, "global_step": 197734, "epoch": 2382} {"train_loss": -24.145383834838867, "global_step": 197735, "epoch": 2382} {"train_loss": -24.229904174804688, "global_step": 197736, "epoch": 2382} {"train_loss": -24.331226348876953, "global_step": 197737, "epoch": 2382} {"train_loss": -23.88016128540039, "global_step": 197738, "epoch": 2382} {"train_loss": -24.157739639282227, "global_step": 197739, "epoch": 2382} {"train_loss": -24.63405418395996, "global_step": 197740, "epoch": 2382} {"train_loss": -24.489871978759766, "global_step": 197741, "epoch": 2382} {"train_loss": -24.485027313232422, "global_step": 197742, "epoch": 2382} {"train_loss": -23.97266960144043, "global_step": 197743, "epoch": 2382} {"train_loss": -24.540287017822266, "global_step": 197744, "epoch": 2382} {"train_loss": -24.403287887573242, "global_step": 197745, "epoch": 2382} {"train_loss": -24.19582176208496, "global_step": 197746, "epoch": 2382} {"train_loss": -24.54548454284668, "global_step": 197747, "epoch": 2382} {"train_loss": -24.423513412475586, "global_step": 197748, "epoch": 2382} {"train_loss": -24.316608428955078, "global_step": 197749, "epoch": 2382} {"train_loss": -24.084623336791992, "global_step": 197750, "epoch": 2382} {"train_loss": -24.452741622924805, "global_step": 197751, "epoch": 2382} {"train_loss": -24.07756805419922, "global_step": 197752, "epoch": 2382} {"train_loss": -24.173120498657227, "global_step": 197753, "epoch": 2382} {"train_loss": -24.707489013671875, "global_step": 197754, "epoch": 2382} {"train_loss": -24.76915168762207, "global_step": 197755, "epoch": 2382} {"train_loss": -24.80605125427246, "global_step": 197756, "epoch": 2382} {"train_loss": -24.46901512145996, "global_step": 197757, "epoch": 2382} {"train_loss": -24.131315231323242, "global_step": 197758, "epoch": 2382} {"train_loss": -24.676095962524414, "global_step": 197759, "epoch": 2382} {"train_loss": -24.2726993560791, "global_step": 197760, "epoch": 2382} {"train_loss": -24.22081184387207, "global_step": 197761, "epoch": 2382} {"train_loss": -24.211456298828125, "global_step": 197762, "epoch": 2382} {"train_loss": -24.467737197875977, "global_step": 197763, "epoch": 2382} {"train_loss": -24.200687408447266, "global_step": 197764, "epoch": 2382} {"train_loss": -24.063232421875, "global_step": 197765, "epoch": 2382} {"train_loss": -24.253332138061523, "global_step": 197766, "epoch": 2382} {"train_loss": -24.19095230102539, "global_step": 197767, "epoch": 2382} {"train_loss": -23.78603172302246, "global_step": 197768, "epoch": 2382} {"train_loss": -24.530216217041016, "global_step": 197769, "epoch": 2382} {"train_loss": -24.121326446533203, "global_step": 197770, "epoch": 2382} {"train_loss": -23.90572166442871, "global_step": 197771, "epoch": 2382} {"train_loss": -23.89462661743164, "global_step": 197772, "epoch": 2382} {"train_loss": -23.8603515625, "global_step": 197773, "epoch": 2382} {"train_loss": -24.192672729492188, "global_step": 197774, "epoch": 2382} {"train_loss": -24.132064819335938, "global_step": 197775, "epoch": 2382} {"train_loss": -24.168935775756836, "global_step": 197776, "epoch": 2382} {"train_loss": -24.094152450561523, "global_step": 197777, "epoch": 2382} {"train_loss": -24.220077514648438, "global_step": 197778, "epoch": 2382} {"train_loss": -24.30462074279785, "global_step": 197779, "epoch": 2382} {"train_loss": -23.962915420532227, "global_step": 197780, "epoch": 2382} {"train_loss": -24.018150329589844, "global_step": 197781, "epoch": 2382} {"train_loss": -24.08211326599121, "global_step": 197782, "epoch": 2382} {"train_loss": -24.3333683013916, "global_step": 197783, "epoch": 2382} {"train_loss": -24.025033950805664, "global_step": 197784, "epoch": 2382} {"train_loss": -24.220218658447266, "global_step": 197785, "epoch": 2382} {"train_loss": -24.11714744567871, "global_step": 197786, "epoch": 2382} {"train_loss": -24.189085006713867, "global_step": 197787, "epoch": 2382} {"train_loss": -24.148564074412885, "global_step": 197788, "epoch": 2382, "val_loss": 6513621.0} {"train_loss": -23.31410789489746, "global_step": 197789, "epoch": 2383} {"train_loss": -23.842151641845703, "global_step": 197790, "epoch": 2383} {"train_loss": -23.8695068359375, "global_step": 197791, "epoch": 2383} {"train_loss": -23.247541427612305, "global_step": 197792, "epoch": 2383} {"train_loss": -24.134437561035156, "global_step": 197793, "epoch": 2383} {"train_loss": -23.7742977142334, "global_step": 197794, "epoch": 2383} {"train_loss": -23.83856201171875, "global_step": 197795, "epoch": 2383} {"train_loss": -23.864511489868164, "global_step": 197796, "epoch": 2383} {"train_loss": -23.58100700378418, "global_step": 197797, "epoch": 2383} {"train_loss": -24.00360107421875, "global_step": 197798, "epoch": 2383} {"train_loss": -23.667062759399414, "global_step": 197799, "epoch": 2383} {"train_loss": -23.830951690673828, "global_step": 197800, "epoch": 2383} {"train_loss": -23.8212947845459, "global_step": 197801, "epoch": 2383} {"train_loss": -24.307720184326172, "global_step": 197802, "epoch": 2383} {"train_loss": -23.910398483276367, "global_step": 197803, "epoch": 2383} {"train_loss": -24.017562866210938, "global_step": 197804, "epoch": 2383} {"train_loss": -24.069826126098633, "global_step": 197805, "epoch": 2383} {"train_loss": -24.113121032714844, "global_step": 197806, "epoch": 2383} {"train_loss": -23.724506378173828, "global_step": 197807, "epoch": 2383} {"train_loss": -24.237035751342773, "global_step": 197808, "epoch": 2383} {"train_loss": -24.016427993774414, "global_step": 197809, "epoch": 2383} {"train_loss": -24.06908416748047, "global_step": 197810, "epoch": 2383} {"train_loss": -23.76666259765625, "global_step": 197811, "epoch": 2383} {"train_loss": -23.78042984008789, "global_step": 197812, "epoch": 2383} {"train_loss": -24.189773559570312, "global_step": 197813, "epoch": 2383} {"train_loss": -24.35573959350586, "global_step": 197814, "epoch": 2383} {"train_loss": -24.263757705688477, "global_step": 197815, "epoch": 2383} {"train_loss": -24.068317413330078, "global_step": 197816, "epoch": 2383} {"train_loss": -24.151952743530273, "global_step": 197817, "epoch": 2383} {"train_loss": -23.72864532470703, "global_step": 197818, "epoch": 2383} {"train_loss": -24.34360122680664, "global_step": 197819, "epoch": 2383} {"train_loss": -23.3336238861084, "global_step": 197820, "epoch": 2383} {"train_loss": -24.38262939453125, "global_step": 197821, "epoch": 2383} {"train_loss": -24.466766357421875, "global_step": 197822, "epoch": 2383} {"train_loss": -23.9226016998291, "global_step": 197823, "epoch": 2383} {"train_loss": -24.459949493408203, "global_step": 197824, "epoch": 2383} {"train_loss": -23.611454010009766, "global_step": 197825, "epoch": 2383} {"train_loss": -24.323532104492188, "global_step": 197826, "epoch": 2383} {"train_loss": -23.741117477416992, "global_step": 197827, "epoch": 2383} {"train_loss": -23.91346549987793, "global_step": 197828, "epoch": 2383} {"train_loss": -24.267929077148438, "global_step": 197829, "epoch": 2383} {"train_loss": -23.82978057861328, "global_step": 197830, "epoch": 2383} {"train_loss": -23.458486557006836, "global_step": 197831, "epoch": 2383} {"train_loss": -23.607419967651367, "global_step": 197832, "epoch": 2383} {"train_loss": -24.19070816040039, "global_step": 197833, "epoch": 2383} {"train_loss": -24.08208656311035, "global_step": 197834, "epoch": 2383} {"train_loss": -23.980022430419922, "global_step": 197835, "epoch": 2383} {"train_loss": -24.10938262939453, "global_step": 197836, "epoch": 2383} {"train_loss": -23.996835708618164, "global_step": 197837, "epoch": 2383} {"train_loss": -24.05525016784668, "global_step": 197838, "epoch": 2383} {"train_loss": -23.807086944580078, "global_step": 197839, "epoch": 2383} {"train_loss": -24.009267807006836, "global_step": 197840, "epoch": 2383} {"train_loss": -24.046728134155273, "global_step": 197841, "epoch": 2383} {"train_loss": -24.043045043945312, "global_step": 197842, "epoch": 2383} {"train_loss": -24.10410499572754, "global_step": 197843, "epoch": 2383} {"train_loss": -24.00042152404785, "global_step": 197844, "epoch": 2383} {"train_loss": -24.05104637145996, "global_step": 197845, "epoch": 2383} {"train_loss": -23.906314849853516, "global_step": 197846, "epoch": 2383} {"train_loss": -23.844762802124023, "global_step": 197847, "epoch": 2383} {"train_loss": -24.31220054626465, "global_step": 197848, "epoch": 2383} {"train_loss": -24.14101219177246, "global_step": 197849, "epoch": 2383} {"train_loss": -24.235395431518555, "global_step": 197850, "epoch": 2383} {"train_loss": -24.257553100585938, "global_step": 197851, "epoch": 2383} {"train_loss": -24.283344268798828, "global_step": 197852, "epoch": 2383} {"train_loss": -24.39873695373535, "global_step": 197853, "epoch": 2383} {"train_loss": -24.372802734375, "global_step": 197854, "epoch": 2383} {"train_loss": -24.313398361206055, "global_step": 197855, "epoch": 2383} {"train_loss": -24.42485809326172, "global_step": 197856, "epoch": 2383} {"train_loss": -24.287485122680664, "global_step": 197857, "epoch": 2383} {"train_loss": -24.202043533325195, "global_step": 197858, "epoch": 2383} {"train_loss": -24.55985450744629, "global_step": 197859, "epoch": 2383} {"train_loss": -24.452367782592773, "global_step": 197860, "epoch": 2383} {"train_loss": -24.710369110107422, "global_step": 197861, "epoch": 2383} {"train_loss": -24.512170791625977, "global_step": 197862, "epoch": 2383} {"train_loss": -24.0665340423584, "global_step": 197863, "epoch": 2383} {"train_loss": -23.80750274658203, "global_step": 197864, "epoch": 2383} {"train_loss": -24.354999542236328, "global_step": 197865, "epoch": 2383} {"train_loss": -24.182504653930664, "global_step": 197866, "epoch": 2383} {"train_loss": -24.807754516601562, "global_step": 197867, "epoch": 2383} {"train_loss": -24.286460876464844, "global_step": 197868, "epoch": 2383} {"train_loss": -24.467893600463867, "global_step": 197869, "epoch": 2383} {"train_loss": -24.44463539123535, "global_step": 197870, "epoch": 2383} {"train_loss": -24.074725346392896, "global_step": 197871, "epoch": 2383, "val_loss": 6520894.0} {"train_loss": -23.988309860229492, "global_step": 197872, "epoch": 2384} {"train_loss": -23.784854888916016, "global_step": 197873, "epoch": 2384} {"train_loss": -23.66419792175293, "global_step": 197874, "epoch": 2384} {"train_loss": -23.510496139526367, "global_step": 197875, "epoch": 2384} {"train_loss": -24.10785484313965, "global_step": 197876, "epoch": 2384} {"train_loss": -23.8663272857666, "global_step": 197877, "epoch": 2384} {"train_loss": -23.955625534057617, "global_step": 197878, "epoch": 2384} {"train_loss": -23.690784454345703, "global_step": 197879, "epoch": 2384} {"train_loss": -24.246702194213867, "global_step": 197880, "epoch": 2384} {"train_loss": -24.102087020874023, "global_step": 197881, "epoch": 2384} {"train_loss": -23.836572647094727, "global_step": 197882, "epoch": 2384} {"train_loss": -23.893814086914062, "global_step": 197883, "epoch": 2384} {"train_loss": -24.078615188598633, "global_step": 197884, "epoch": 2384} {"train_loss": -24.170181274414062, "global_step": 197885, "epoch": 2384} {"train_loss": -24.3018741607666, "global_step": 197886, "epoch": 2384} {"train_loss": -24.081518173217773, "global_step": 197887, "epoch": 2384} {"train_loss": -24.348512649536133, "global_step": 197888, "epoch": 2384} {"train_loss": -24.471946716308594, "global_step": 197889, "epoch": 2384} {"train_loss": -24.218994140625, "global_step": 197890, "epoch": 2384} {"train_loss": -24.18175506591797, "global_step": 197891, "epoch": 2384} {"train_loss": -24.14105796813965, "global_step": 197892, "epoch": 2384} {"train_loss": -24.19828224182129, "global_step": 197893, "epoch": 2384} {"train_loss": -23.944461822509766, "global_step": 197894, "epoch": 2384} {"train_loss": -24.269081115722656, "global_step": 197895, "epoch": 2384} {"train_loss": -24.42619514465332, "global_step": 197896, "epoch": 2384} {"train_loss": -24.23026466369629, "global_step": 197897, "epoch": 2384} {"train_loss": -24.1833553314209, "global_step": 197898, "epoch": 2384} {"train_loss": -24.293502807617188, "global_step": 197899, "epoch": 2384} {"train_loss": -24.478788375854492, "global_step": 197900, "epoch": 2384} {"train_loss": -23.97848129272461, "global_step": 197901, "epoch": 2384} {"train_loss": -24.0109920501709, "global_step": 197902, "epoch": 2384} {"train_loss": -24.275344848632812, "global_step": 197903, "epoch": 2384} {"train_loss": -23.955907821655273, "global_step": 197904, "epoch": 2384} {"train_loss": -24.23537254333496, "global_step": 197905, "epoch": 2384} {"train_loss": -24.313735961914062, "global_step": 197906, "epoch": 2384} {"train_loss": -24.19875144958496, "global_step": 197907, "epoch": 2384} {"train_loss": -24.23954200744629, "global_step": 197908, "epoch": 2384} {"train_loss": -24.65064811706543, "global_step": 197909, "epoch": 2384} {"train_loss": -24.50445556640625, "global_step": 197910, "epoch": 2384} {"train_loss": -24.329181671142578, "global_step": 197911, "epoch": 2384} {"train_loss": -23.659006118774414, "global_step": 197912, "epoch": 2384} {"train_loss": -24.434097290039062, "global_step": 197913, "epoch": 2384} {"train_loss": -24.158838272094727, "global_step": 197914, "epoch": 2384} {"train_loss": -23.687406539916992, "global_step": 197915, "epoch": 2384} {"train_loss": -24.329893112182617, "global_step": 197916, "epoch": 2384} {"train_loss": -24.031946182250977, "global_step": 197917, "epoch": 2384} {"train_loss": -24.16375160217285, "global_step": 197918, "epoch": 2384} {"train_loss": -24.178979873657227, "global_step": 197919, "epoch": 2384} {"train_loss": -24.120100021362305, "global_step": 197920, "epoch": 2384} {"train_loss": -24.002838134765625, "global_step": 197921, "epoch": 2384} {"train_loss": -24.19405746459961, "global_step": 197922, "epoch": 2384} {"train_loss": -24.100881576538086, "global_step": 197923, "epoch": 2384} {"train_loss": -24.192584991455078, "global_step": 197924, "epoch": 2384} {"train_loss": -24.15883445739746, "global_step": 197925, "epoch": 2384} {"train_loss": -24.093259811401367, "global_step": 197926, "epoch": 2384} {"train_loss": -24.2813663482666, "global_step": 197927, "epoch": 2384} {"train_loss": -24.13620948791504, "global_step": 197928, "epoch": 2384} {"train_loss": -24.4935302734375, "global_step": 197929, "epoch": 2384} {"train_loss": -24.41566276550293, "global_step": 197930, "epoch": 2384} {"train_loss": -24.223173141479492, "global_step": 197931, "epoch": 2384} {"train_loss": -24.042940139770508, "global_step": 197932, "epoch": 2384} {"train_loss": -24.303546905517578, "global_step": 197933, "epoch": 2384} {"train_loss": -24.193357467651367, "global_step": 197934, "epoch": 2384} {"train_loss": -24.545175552368164, "global_step": 197935, "epoch": 2384} {"train_loss": -24.306446075439453, "global_step": 197936, "epoch": 2384} {"train_loss": -24.24787712097168, "global_step": 197937, "epoch": 2384} {"train_loss": -24.606475830078125, "global_step": 197938, "epoch": 2384} {"train_loss": -24.16277503967285, "global_step": 197939, "epoch": 2384} {"train_loss": -24.27485466003418, "global_step": 197940, "epoch": 2384} {"train_loss": -24.478361129760742, "global_step": 197941, "epoch": 2384} {"train_loss": -24.11177635192871, "global_step": 197942, "epoch": 2384} {"train_loss": -24.132638931274414, "global_step": 197943, "epoch": 2384} {"train_loss": -24.64238929748535, "global_step": 197944, "epoch": 2384} {"train_loss": -24.33136558532715, "global_step": 197945, "epoch": 2384} {"train_loss": -24.260725021362305, "global_step": 197946, "epoch": 2384} {"train_loss": -24.08113670349121, "global_step": 197947, "epoch": 2384} {"train_loss": -24.18291664123535, "global_step": 197948, "epoch": 2384} {"train_loss": -23.97462272644043, "global_step": 197949, "epoch": 2384} {"train_loss": -24.05666160583496, "global_step": 197950, "epoch": 2384} {"train_loss": -24.34190559387207, "global_step": 197951, "epoch": 2384} {"train_loss": -24.255477905273438, "global_step": 197952, "epoch": 2384} {"train_loss": -24.418418884277344, "global_step": 197953, "epoch": 2384} {"train_loss": -24.177762318806476, "global_step": 197954, "epoch": 2384, "val_loss": 6673399.0} {"train_loss": -21.273725509643555, "global_step": 197955, "epoch": 2385} {"train_loss": -22.56130027770996, "global_step": 197956, "epoch": 2385} {"train_loss": -23.440935134887695, "global_step": 197957, "epoch": 2385} {"train_loss": -23.73467445373535, "global_step": 197958, "epoch": 2385} {"train_loss": -23.138282775878906, "global_step": 197959, "epoch": 2385} {"train_loss": -23.838083267211914, "global_step": 197960, "epoch": 2385} {"train_loss": -23.346288681030273, "global_step": 197961, "epoch": 2385} {"train_loss": -24.15010643005371, "global_step": 197962, "epoch": 2385} {"train_loss": -23.43238639831543, "global_step": 197963, "epoch": 2385} {"train_loss": -23.789369583129883, "global_step": 197964, "epoch": 2385} {"train_loss": -23.599519729614258, "global_step": 197965, "epoch": 2385} {"train_loss": -23.888179779052734, "global_step": 197966, "epoch": 2385} {"train_loss": -23.665729522705078, "global_step": 197967, "epoch": 2385} {"train_loss": -23.7065372467041, "global_step": 197968, "epoch": 2385} {"train_loss": -23.82817840576172, "global_step": 197969, "epoch": 2385} {"train_loss": -23.583547592163086, "global_step": 197970, "epoch": 2385} {"train_loss": -23.433822631835938, "global_step": 197971, "epoch": 2385} {"train_loss": -23.863265991210938, "global_step": 197972, "epoch": 2385} {"train_loss": -23.8692569732666, "global_step": 197973, "epoch": 2385} {"train_loss": -24.055747985839844, "global_step": 197974, "epoch": 2385} {"train_loss": -24.02901268005371, "global_step": 197975, "epoch": 2385} {"train_loss": -23.944774627685547, "global_step": 197976, "epoch": 2385} {"train_loss": -24.279504776000977, "global_step": 197977, "epoch": 2385} {"train_loss": -23.915164947509766, "global_step": 197978, "epoch": 2385} {"train_loss": -24.073400497436523, "global_step": 197979, "epoch": 2385} {"train_loss": -24.068674087524414, "global_step": 197980, "epoch": 2385} {"train_loss": -24.089569091796875, "global_step": 197981, "epoch": 2385} {"train_loss": -24.313642501831055, "global_step": 197982, "epoch": 2385} {"train_loss": -24.37136459350586, "global_step": 197983, "epoch": 2385} {"train_loss": -24.1644229888916, "global_step": 197984, "epoch": 2385} {"train_loss": -24.39682388305664, "global_step": 197985, "epoch": 2385} {"train_loss": -24.10361671447754, "global_step": 197986, "epoch": 2385} {"train_loss": -24.295530319213867, "global_step": 197987, "epoch": 2385} {"train_loss": -24.304410934448242, "global_step": 197988, "epoch": 2385} {"train_loss": -24.022842407226562, "global_step": 197989, "epoch": 2385} {"train_loss": -23.919937133789062, "global_step": 197990, "epoch": 2385} {"train_loss": -24.166305541992188, "global_step": 197991, "epoch": 2385} {"train_loss": -24.70552635192871, "global_step": 197992, "epoch": 2385} {"train_loss": -24.21439552307129, "global_step": 197993, "epoch": 2385} {"train_loss": -24.13547706604004, "global_step": 197994, "epoch": 2385} {"train_loss": -24.668867111206055, "global_step": 197995, "epoch": 2385} {"train_loss": -24.166501998901367, "global_step": 197996, "epoch": 2385} {"train_loss": -24.331424713134766, "global_step": 197997, "epoch": 2385} {"train_loss": -24.45131492614746, "global_step": 197998, "epoch": 2385} {"train_loss": -24.15447235107422, "global_step": 197999, "epoch": 2385} {"train_loss": -24.109481811523438, "global_step": 198000, "epoch": 2385} {"train_loss": -24.53968620300293, "global_step": 198001, "epoch": 2385} {"train_loss": -24.382694244384766, "global_step": 198002, "epoch": 2385} {"train_loss": -24.210220336914062, "global_step": 198003, "epoch": 2385} {"train_loss": -24.546995162963867, "global_step": 198004, "epoch": 2385} {"train_loss": -24.274566650390625, "global_step": 198005, "epoch": 2385} {"train_loss": -24.107257843017578, "global_step": 198006, "epoch": 2385} {"train_loss": -24.58957862854004, "global_step": 198007, "epoch": 2385} {"train_loss": -24.39470863342285, "global_step": 198008, "epoch": 2385} {"train_loss": -24.462055206298828, "global_step": 198009, "epoch": 2385} {"train_loss": -24.2548770904541, "global_step": 198010, "epoch": 2385} {"train_loss": -24.1666202545166, "global_step": 198011, "epoch": 2385} {"train_loss": -24.37641716003418, "global_step": 198012, "epoch": 2385} {"train_loss": -24.357168197631836, "global_step": 198013, "epoch": 2385} {"train_loss": -24.110858917236328, "global_step": 198014, "epoch": 2385} {"train_loss": -24.314226150512695, "global_step": 198015, "epoch": 2385} {"train_loss": -24.070512771606445, "global_step": 198016, "epoch": 2385} {"train_loss": -23.830875396728516, "global_step": 198017, "epoch": 2385} {"train_loss": -24.118173599243164, "global_step": 198018, "epoch": 2385} {"train_loss": -23.977502822875977, "global_step": 198019, "epoch": 2385} {"train_loss": -24.447904586791992, "global_step": 198020, "epoch": 2385} {"train_loss": -24.114866256713867, "global_step": 198021, "epoch": 2385} {"train_loss": -24.196447372436523, "global_step": 198022, "epoch": 2385} {"train_loss": -24.454648971557617, "global_step": 198023, "epoch": 2385} {"train_loss": -24.198884963989258, "global_step": 198024, "epoch": 2385} {"train_loss": -24.24732208251953, "global_step": 198025, "epoch": 2385} {"train_loss": -24.42213249206543, "global_step": 198026, "epoch": 2385} {"train_loss": -24.322967529296875, "global_step": 198027, "epoch": 2385} {"train_loss": -24.25432777404785, "global_step": 198028, "epoch": 2385} {"train_loss": -24.052488327026367, "global_step": 198029, "epoch": 2385} {"train_loss": -24.263513565063477, "global_step": 198030, "epoch": 2385} {"train_loss": -24.25568962097168, "global_step": 198031, "epoch": 2385} {"train_loss": -24.11918067932129, "global_step": 198032, "epoch": 2385} {"train_loss": -24.405874252319336, "global_step": 198033, "epoch": 2385} {"train_loss": -23.934722900390625, "global_step": 198034, "epoch": 2385} {"train_loss": -24.040220260620117, "global_step": 198035, "epoch": 2385} {"train_loss": -24.253477096557617, "global_step": 198036, "epoch": 2385} {"train_loss": -24.06071961644184, "global_step": 198037, "epoch": 2385, "val_loss": 6780072.0} {"train_loss": -23.09641456604004, "global_step": 198038, "epoch": 2386} {"train_loss": -22.942636489868164, "global_step": 198039, "epoch": 2386} {"train_loss": -23.471485137939453, "global_step": 198040, "epoch": 2386} {"train_loss": -23.44035530090332, "global_step": 198041, "epoch": 2386} {"train_loss": -23.593114852905273, "global_step": 198042, "epoch": 2386} {"train_loss": -23.659835815429688, "global_step": 198043, "epoch": 2386} {"train_loss": -23.73843002319336, "global_step": 198044, "epoch": 2386} {"train_loss": -23.43634605407715, "global_step": 198045, "epoch": 2386} {"train_loss": -23.743375778198242, "global_step": 198046, "epoch": 2386} {"train_loss": -23.653045654296875, "global_step": 198047, "epoch": 2386} {"train_loss": -23.819499969482422, "global_step": 198048, "epoch": 2386} {"train_loss": -23.96928596496582, "global_step": 198049, "epoch": 2386} {"train_loss": -23.932382583618164, "global_step": 198050, "epoch": 2386} {"train_loss": -24.028865814208984, "global_step": 198051, "epoch": 2386} {"train_loss": -24.025129318237305, "global_step": 198052, "epoch": 2386} {"train_loss": -24.12166976928711, "global_step": 198053, "epoch": 2386} {"train_loss": -23.936079025268555, "global_step": 198054, "epoch": 2386} {"train_loss": -24.408456802368164, "global_step": 198055, "epoch": 2386} {"train_loss": -24.13319969177246, "global_step": 198056, "epoch": 2386} {"train_loss": -23.961896896362305, "global_step": 198057, "epoch": 2386} {"train_loss": -23.998523712158203, "global_step": 198058, "epoch": 2386} {"train_loss": -24.045284271240234, "global_step": 198059, "epoch": 2386} {"train_loss": -24.238168716430664, "global_step": 198060, "epoch": 2386} {"train_loss": -24.141794204711914, "global_step": 198061, "epoch": 2386} {"train_loss": -24.269149780273438, "global_step": 198062, "epoch": 2386} {"train_loss": -24.036104202270508, "global_step": 198063, "epoch": 2386} {"train_loss": -24.261865615844727, "global_step": 198064, "epoch": 2386} {"train_loss": -23.98732566833496, "global_step": 198065, "epoch": 2386} {"train_loss": -24.19512939453125, "global_step": 198066, "epoch": 2386} {"train_loss": -24.476680755615234, "global_step": 198067, "epoch": 2386} {"train_loss": -23.990095138549805, "global_step": 198068, "epoch": 2386} {"train_loss": -24.211688995361328, "global_step": 198069, "epoch": 2386} {"train_loss": -24.38734245300293, "global_step": 198070, "epoch": 2386} {"train_loss": -23.895349502563477, "global_step": 198071, "epoch": 2386} {"train_loss": -24.036157608032227, "global_step": 198072, "epoch": 2386} {"train_loss": -24.091171264648438, "global_step": 198073, "epoch": 2386} {"train_loss": -24.392667770385742, "global_step": 198074, "epoch": 2386} {"train_loss": -24.297958374023438, "global_step": 198075, "epoch": 2386} {"train_loss": -24.112226486206055, "global_step": 198076, "epoch": 2386} {"train_loss": -24.349096298217773, "global_step": 198077, "epoch": 2386} {"train_loss": -24.364484786987305, "global_step": 198078, "epoch": 2386} {"train_loss": -24.4829158782959, "global_step": 198079, "epoch": 2386} {"train_loss": -24.36895751953125, "global_step": 198080, "epoch": 2386} {"train_loss": -24.286863327026367, "global_step": 198081, "epoch": 2386} {"train_loss": -24.237180709838867, "global_step": 198082, "epoch": 2386} {"train_loss": -24.225894927978516, "global_step": 198083, "epoch": 2386} {"train_loss": -24.16252326965332, "global_step": 198084, "epoch": 2386} {"train_loss": -24.423721313476562, "global_step": 198085, "epoch": 2386} {"train_loss": -24.333707809448242, "global_step": 198086, "epoch": 2386} {"train_loss": -24.278532028198242, "global_step": 198087, "epoch": 2386} {"train_loss": -23.56484031677246, "global_step": 198088, "epoch": 2386} {"train_loss": -23.827056884765625, "global_step": 198089, "epoch": 2386} {"train_loss": -24.077247619628906, "global_step": 198090, "epoch": 2386} {"train_loss": -24.15989112854004, "global_step": 198091, "epoch": 2386} {"train_loss": -23.952627182006836, "global_step": 198092, "epoch": 2386} {"train_loss": -23.941923141479492, "global_step": 198093, "epoch": 2386} {"train_loss": -24.292516708374023, "global_step": 198094, "epoch": 2386} {"train_loss": -24.334562301635742, "global_step": 198095, "epoch": 2386} {"train_loss": -23.739248275756836, "global_step": 198096, "epoch": 2386} {"train_loss": -24.130680084228516, "global_step": 198097, "epoch": 2386} {"train_loss": -23.88703727722168, "global_step": 198098, "epoch": 2386} {"train_loss": -23.914403915405273, "global_step": 198099, "epoch": 2386} {"train_loss": -24.188562393188477, "global_step": 198100, "epoch": 2386} {"train_loss": -24.39096450805664, "global_step": 198101, "epoch": 2386} {"train_loss": -24.48356056213379, "global_step": 198102, "epoch": 2386} {"train_loss": -24.43379783630371, "global_step": 198103, "epoch": 2386} {"train_loss": -24.150964736938477, "global_step": 198104, "epoch": 2386} {"train_loss": -24.15097427368164, "global_step": 198105, "epoch": 2386} {"train_loss": -24.277708053588867, "global_step": 198106, "epoch": 2386} {"train_loss": -23.97173309326172, "global_step": 198107, "epoch": 2386} {"train_loss": -23.985925674438477, "global_step": 198108, "epoch": 2386} {"train_loss": -24.08888816833496, "global_step": 198109, "epoch": 2386} {"train_loss": -24.137975692749023, "global_step": 198110, "epoch": 2386} {"train_loss": -24.388870239257812, "global_step": 198111, "epoch": 2386} {"train_loss": -24.286407470703125, "global_step": 198112, "epoch": 2386} {"train_loss": -24.07291030883789, "global_step": 198113, "epoch": 2386} {"train_loss": -24.386598587036133, "global_step": 198114, "epoch": 2386} {"train_loss": -24.27754020690918, "global_step": 198115, "epoch": 2386} {"train_loss": -24.220075607299805, "global_step": 198116, "epoch": 2386} {"train_loss": -24.25090789794922, "global_step": 198117, "epoch": 2386} {"train_loss": -24.126123428344727, "global_step": 198118, "epoch": 2386} {"train_loss": -24.67348289489746, "global_step": 198119, "epoch": 2386} {"train_loss": -24.082616231527673, "global_step": 198120, "epoch": 2386, "val_loss": 6543968.0} {"train_loss": -23.55068016052246, "global_step": 198121, "epoch": 2387} {"train_loss": -24.169828414916992, "global_step": 198122, "epoch": 2387} {"train_loss": -24.069334030151367, "global_step": 198123, "epoch": 2387} {"train_loss": -23.681875228881836, "global_step": 198124, "epoch": 2387} {"train_loss": -23.985776901245117, "global_step": 198125, "epoch": 2387} {"train_loss": -24.09292984008789, "global_step": 198126, "epoch": 2387} {"train_loss": -23.93155288696289, "global_step": 198127, "epoch": 2387} {"train_loss": -24.244693756103516, "global_step": 198128, "epoch": 2387} {"train_loss": -24.144287109375, "global_step": 198129, "epoch": 2387} {"train_loss": -24.028392791748047, "global_step": 198130, "epoch": 2387} {"train_loss": -23.853191375732422, "global_step": 198131, "epoch": 2387} {"train_loss": -24.18737030029297, "global_step": 198132, "epoch": 2387} {"train_loss": -23.9111270904541, "global_step": 198133, "epoch": 2387} {"train_loss": -24.04750633239746, "global_step": 198134, "epoch": 2387} {"train_loss": -23.978788375854492, "global_step": 198135, "epoch": 2387} {"train_loss": -24.073198318481445, "global_step": 198136, "epoch": 2387} {"train_loss": -24.071985244750977, "global_step": 198137, "epoch": 2387} {"train_loss": -24.63068962097168, "global_step": 198138, "epoch": 2387} {"train_loss": -23.96053123474121, "global_step": 198139, "epoch": 2387} {"train_loss": -24.149694442749023, "global_step": 198140, "epoch": 2387} {"train_loss": -24.06569480895996, "global_step": 198141, "epoch": 2387} {"train_loss": -24.20003318786621, "global_step": 198142, "epoch": 2387} {"train_loss": -24.285568237304688, "global_step": 198143, "epoch": 2387} {"train_loss": -24.009321212768555, "global_step": 198144, "epoch": 2387} {"train_loss": -24.29750633239746, "global_step": 198145, "epoch": 2387} {"train_loss": -24.229251861572266, "global_step": 198146, "epoch": 2387} {"train_loss": -23.471424102783203, "global_step": 198147, "epoch": 2387} {"train_loss": -24.14698028564453, "global_step": 198148, "epoch": 2387} {"train_loss": -24.69881820678711, "global_step": 198149, "epoch": 2387} {"train_loss": -24.077972412109375, "global_step": 198150, "epoch": 2387} {"train_loss": -24.451242446899414, "global_step": 198151, "epoch": 2387} {"train_loss": -24.2938175201416, "global_step": 198152, "epoch": 2387} {"train_loss": -24.30605125427246, "global_step": 198153, "epoch": 2387} {"train_loss": -24.297101974487305, "global_step": 198154, "epoch": 2387} {"train_loss": -24.355680465698242, "global_step": 198155, "epoch": 2387} {"train_loss": -23.95606231689453, "global_step": 198156, "epoch": 2387} {"train_loss": -23.79305076599121, "global_step": 198157, "epoch": 2387} {"train_loss": -24.126041412353516, "global_step": 198158, "epoch": 2387} {"train_loss": -24.328533172607422, "global_step": 198159, "epoch": 2387} {"train_loss": -24.416488647460938, "global_step": 198160, "epoch": 2387} {"train_loss": -24.131765365600586, "global_step": 198161, "epoch": 2387} {"train_loss": -24.4163818359375, "global_step": 198162, "epoch": 2387} {"train_loss": -24.134187698364258, "global_step": 198163, "epoch": 2387} {"train_loss": -23.965578079223633, "global_step": 198164, "epoch": 2387} {"train_loss": -24.460519790649414, "global_step": 198165, "epoch": 2387} {"train_loss": -24.25935935974121, "global_step": 198166, "epoch": 2387} {"train_loss": -24.2769718170166, "global_step": 198167, "epoch": 2387} {"train_loss": -23.97047996520996, "global_step": 198168, "epoch": 2387} {"train_loss": -23.869226455688477, "global_step": 198169, "epoch": 2387} {"train_loss": -24.059467315673828, "global_step": 198170, "epoch": 2387} {"train_loss": -24.471887588500977, "global_step": 198171, "epoch": 2387} {"train_loss": -24.170347213745117, "global_step": 198172, "epoch": 2387} {"train_loss": -24.391239166259766, "global_step": 198173, "epoch": 2387} {"train_loss": -24.51396369934082, "global_step": 198174, "epoch": 2387} {"train_loss": -24.41436195373535, "global_step": 198175, "epoch": 2387} {"train_loss": -24.291627883911133, "global_step": 198176, "epoch": 2387} {"train_loss": -24.15289878845215, "global_step": 198177, "epoch": 2387} {"train_loss": -23.830305099487305, "global_step": 198178, "epoch": 2387} {"train_loss": -23.87006950378418, "global_step": 198179, "epoch": 2387} {"train_loss": -24.30500602722168, "global_step": 198180, "epoch": 2387} {"train_loss": -24.236154556274414, "global_step": 198181, "epoch": 2387} {"train_loss": -23.696475982666016, "global_step": 198182, "epoch": 2387} {"train_loss": -24.18427085876465, "global_step": 198183, "epoch": 2387} {"train_loss": -23.987897872924805, "global_step": 198184, "epoch": 2387} {"train_loss": -24.152658462524414, "global_step": 198185, "epoch": 2387} {"train_loss": -24.313446044921875, "global_step": 198186, "epoch": 2387} {"train_loss": -24.265905380249023, "global_step": 198187, "epoch": 2387} {"train_loss": -24.126550674438477, "global_step": 198188, "epoch": 2387} {"train_loss": -24.25315284729004, "global_step": 198189, "epoch": 2387} {"train_loss": -24.497182846069336, "global_step": 198190, "epoch": 2387} {"train_loss": -24.045984268188477, "global_step": 198191, "epoch": 2387} {"train_loss": -24.374906539916992, "global_step": 198192, "epoch": 2387} {"train_loss": -24.32143211364746, "global_step": 198193, "epoch": 2387} {"train_loss": -24.3055419921875, "global_step": 198194, "epoch": 2387} {"train_loss": -24.451608657836914, "global_step": 198195, "epoch": 2387} {"train_loss": -24.223012924194336, "global_step": 198196, "epoch": 2387} {"train_loss": -23.954694747924805, "global_step": 198197, "epoch": 2387} {"train_loss": -24.6646785736084, "global_step": 198198, "epoch": 2387} {"train_loss": -24.306964874267578, "global_step": 198199, "epoch": 2387} {"train_loss": -24.5765380859375, "global_step": 198200, "epoch": 2387} {"train_loss": -24.263334274291992, "global_step": 198201, "epoch": 2387} {"train_loss": -24.316368103027344, "global_step": 198202, "epoch": 2387} {"train_loss": -24.174711411257825, "global_step": 198203, "epoch": 2387, "val_loss": 6510672.0} {"train_loss": -24.506183624267578, "global_step": 198204, "epoch": 2388} {"train_loss": -23.853490829467773, "global_step": 198205, "epoch": 2388} {"train_loss": -23.978370666503906, "global_step": 198206, "epoch": 2388} {"train_loss": -24.222003936767578, "global_step": 198207, "epoch": 2388} {"train_loss": -23.98549461364746, "global_step": 198208, "epoch": 2388} {"train_loss": -24.240829467773438, "global_step": 198209, "epoch": 2388} {"train_loss": -24.017993927001953, "global_step": 198210, "epoch": 2388} {"train_loss": -24.030309677124023, "global_step": 198211, "epoch": 2388} {"train_loss": -24.153305053710938, "global_step": 198212, "epoch": 2388} {"train_loss": -24.019872665405273, "global_step": 198213, "epoch": 2388} {"train_loss": -23.984256744384766, "global_step": 198214, "epoch": 2388} {"train_loss": -24.361526489257812, "global_step": 198215, "epoch": 2388} {"train_loss": -24.304983139038086, "global_step": 198216, "epoch": 2388} {"train_loss": -24.450544357299805, "global_step": 198217, "epoch": 2388} {"train_loss": -24.11358070373535, "global_step": 198218, "epoch": 2388} {"train_loss": -24.63434410095215, "global_step": 198219, "epoch": 2388} {"train_loss": -24.0336856842041, "global_step": 198220, "epoch": 2388} {"train_loss": -24.20808982849121, "global_step": 198221, "epoch": 2388} {"train_loss": -24.232791900634766, "global_step": 198222, "epoch": 2388} {"train_loss": -24.572345733642578, "global_step": 198223, "epoch": 2388} {"train_loss": -24.084447860717773, "global_step": 198224, "epoch": 2388} {"train_loss": -23.960243225097656, "global_step": 198225, "epoch": 2388} {"train_loss": -24.05219078063965, "global_step": 198226, "epoch": 2388} {"train_loss": -24.000425338745117, "global_step": 198227, "epoch": 2388} {"train_loss": -24.156538009643555, "global_step": 198228, "epoch": 2388} {"train_loss": -23.955923080444336, "global_step": 198229, "epoch": 2388} {"train_loss": -24.580917358398438, "global_step": 198230, "epoch": 2388} {"train_loss": -24.23261833190918, "global_step": 198231, "epoch": 2388} {"train_loss": -24.456357955932617, "global_step": 198232, "epoch": 2388} {"train_loss": -24.243392944335938, "global_step": 198233, "epoch": 2388} {"train_loss": -24.042997360229492, "global_step": 198234, "epoch": 2388} {"train_loss": -24.04866600036621, "global_step": 198235, "epoch": 2388} {"train_loss": -24.317712783813477, "global_step": 198236, "epoch": 2388} {"train_loss": -24.263208389282227, "global_step": 198237, "epoch": 2388} {"train_loss": -24.16773796081543, "global_step": 198238, "epoch": 2388} {"train_loss": -24.29751968383789, "global_step": 198239, "epoch": 2388} {"train_loss": -24.14948272705078, "global_step": 198240, "epoch": 2388} {"train_loss": -23.851064682006836, "global_step": 198241, "epoch": 2388} {"train_loss": -24.336444854736328, "global_step": 198242, "epoch": 2388} {"train_loss": -23.990421295166016, "global_step": 198243, "epoch": 2388} {"train_loss": -24.35906982421875, "global_step": 198244, "epoch": 2388} {"train_loss": -24.39217185974121, "global_step": 198245, "epoch": 2388} {"train_loss": -24.41080093383789, "global_step": 198246, "epoch": 2388} {"train_loss": -23.961328506469727, "global_step": 198247, "epoch": 2388} {"train_loss": -24.29456901550293, "global_step": 198248, "epoch": 2388} {"train_loss": -24.058841705322266, "global_step": 198249, "epoch": 2388} {"train_loss": -24.644681930541992, "global_step": 198250, "epoch": 2388} {"train_loss": -23.935869216918945, "global_step": 198251, "epoch": 2388} {"train_loss": -24.27987289428711, "global_step": 198252, "epoch": 2388} {"train_loss": -23.970502853393555, "global_step": 198253, "epoch": 2388} {"train_loss": -24.08721160888672, "global_step": 198254, "epoch": 2388} {"train_loss": -24.2431583404541, "global_step": 198255, "epoch": 2388} {"train_loss": -24.489112854003906, "global_step": 198256, "epoch": 2388} {"train_loss": -24.29248809814453, "global_step": 198257, "epoch": 2388} {"train_loss": -24.598512649536133, "global_step": 198258, "epoch": 2388} {"train_loss": -24.481687545776367, "global_step": 198259, "epoch": 2388} {"train_loss": -24.52213478088379, "global_step": 198260, "epoch": 2388} {"train_loss": -24.470579147338867, "global_step": 198261, "epoch": 2388} {"train_loss": -24.0361328125, "global_step": 198262, "epoch": 2388} {"train_loss": -24.215986251831055, "global_step": 198263, "epoch": 2388} {"train_loss": -24.333784103393555, "global_step": 198264, "epoch": 2388} {"train_loss": -24.37900161743164, "global_step": 198265, "epoch": 2388} {"train_loss": -24.37323570251465, "global_step": 198266, "epoch": 2388} {"train_loss": -24.101730346679688, "global_step": 198267, "epoch": 2388} {"train_loss": -24.4437313079834, "global_step": 198268, "epoch": 2388} {"train_loss": -24.23833656311035, "global_step": 198269, "epoch": 2388} {"train_loss": -24.47536277770996, "global_step": 198270, "epoch": 2388} {"train_loss": -24.540029525756836, "global_step": 198271, "epoch": 2388} {"train_loss": -24.179943084716797, "global_step": 198272, "epoch": 2388} {"train_loss": -24.414480209350586, "global_step": 198273, "epoch": 2388} {"train_loss": -24.164098739624023, "global_step": 198274, "epoch": 2388} {"train_loss": -24.28133201599121, "global_step": 198275, "epoch": 2388} {"train_loss": -24.801376342773438, "global_step": 198276, "epoch": 2388} {"train_loss": -24.00800132751465, "global_step": 198277, "epoch": 2388} {"train_loss": -24.426679611206055, "global_step": 198278, "epoch": 2388} {"train_loss": -24.07961082458496, "global_step": 198279, "epoch": 2388} {"train_loss": -24.45530128479004, "global_step": 198280, "epoch": 2388} {"train_loss": -24.24464988708496, "global_step": 198281, "epoch": 2388} {"train_loss": -24.672483444213867, "global_step": 198282, "epoch": 2388} {"train_loss": -24.162092208862305, "global_step": 198283, "epoch": 2388} {"train_loss": -24.37148666381836, "global_step": 198284, "epoch": 2388} {"train_loss": -24.110441207885742, "global_step": 198285, "epoch": 2388} {"train_loss": -24.23327425301793, "global_step": 198286, "epoch": 2388, "val_loss": 6571400.0} {"train_loss": -24.137130737304688, "global_step": 198287, "epoch": 2389} {"train_loss": -23.786161422729492, "global_step": 198288, "epoch": 2389} {"train_loss": -24.151824951171875, "global_step": 198289, "epoch": 2389} {"train_loss": -24.285003662109375, "global_step": 198290, "epoch": 2389} {"train_loss": -23.721981048583984, "global_step": 198291, "epoch": 2389} {"train_loss": -24.125104904174805, "global_step": 198292, "epoch": 2389} {"train_loss": -24.368335723876953, "global_step": 198293, "epoch": 2389} {"train_loss": -24.23909568786621, "global_step": 198294, "epoch": 2389} {"train_loss": -24.406049728393555, "global_step": 198295, "epoch": 2389} {"train_loss": -24.363025665283203, "global_step": 198296, "epoch": 2389} {"train_loss": -23.871938705444336, "global_step": 198297, "epoch": 2389} {"train_loss": -23.97605323791504, "global_step": 198298, "epoch": 2389} {"train_loss": -24.202547073364258, "global_step": 198299, "epoch": 2389} {"train_loss": -24.28606605529785, "global_step": 198300, "epoch": 2389} {"train_loss": -24.395544052124023, "global_step": 198301, "epoch": 2389} {"train_loss": -24.260162353515625, "global_step": 198302, "epoch": 2389} {"train_loss": -23.749860763549805, "global_step": 198303, "epoch": 2389} {"train_loss": -23.75147819519043, "global_step": 198304, "epoch": 2389} {"train_loss": -24.010540008544922, "global_step": 198305, "epoch": 2389} {"train_loss": -24.005935668945312, "global_step": 198306, "epoch": 2389} {"train_loss": -23.879043579101562, "global_step": 198307, "epoch": 2389} {"train_loss": -23.88611602783203, "global_step": 198308, "epoch": 2389} {"train_loss": -24.033788681030273, "global_step": 198309, "epoch": 2389} {"train_loss": -24.027185440063477, "global_step": 198310, "epoch": 2389} {"train_loss": -23.738672256469727, "global_step": 198311, "epoch": 2389} {"train_loss": -24.197647094726562, "global_step": 198312, "epoch": 2389} {"train_loss": -24.11983299255371, "global_step": 198313, "epoch": 2389} {"train_loss": -24.145294189453125, "global_step": 198314, "epoch": 2389} {"train_loss": -24.292667388916016, "global_step": 198315, "epoch": 2389} {"train_loss": -23.930198669433594, "global_step": 198316, "epoch": 2389} {"train_loss": -24.49619483947754, "global_step": 198317, "epoch": 2389} {"train_loss": -24.116247177124023, "global_step": 198318, "epoch": 2389} {"train_loss": -24.30251121520996, "global_step": 198319, "epoch": 2389} {"train_loss": -24.314151763916016, "global_step": 198320, "epoch": 2389} {"train_loss": -23.87049674987793, "global_step": 198321, "epoch": 2389} {"train_loss": -24.16412925720215, "global_step": 198322, "epoch": 2389} {"train_loss": -24.279272079467773, "global_step": 198323, "epoch": 2389} {"train_loss": -24.25908660888672, "global_step": 198324, "epoch": 2389} {"train_loss": -24.419370651245117, "global_step": 198325, "epoch": 2389} {"train_loss": -24.243486404418945, "global_step": 198326, "epoch": 2389} {"train_loss": -24.015522003173828, "global_step": 198327, "epoch": 2389} {"train_loss": -24.212331771850586, "global_step": 198328, "epoch": 2389} {"train_loss": -24.23261070251465, "global_step": 198329, "epoch": 2389} {"train_loss": -24.107070922851562, "global_step": 198330, "epoch": 2389} {"train_loss": -24.169179916381836, "global_step": 198331, "epoch": 2389} {"train_loss": -24.14129638671875, "global_step": 198332, "epoch": 2389} {"train_loss": -24.35847282409668, "global_step": 198333, "epoch": 2389} {"train_loss": -24.53395652770996, "global_step": 198334, "epoch": 2389} {"train_loss": -24.17548179626465, "global_step": 198335, "epoch": 2389} {"train_loss": -24.17531394958496, "global_step": 198336, "epoch": 2389} {"train_loss": -24.295827865600586, "global_step": 198337, "epoch": 2389} {"train_loss": -24.506315231323242, "global_step": 198338, "epoch": 2389} {"train_loss": -23.97857666015625, "global_step": 198339, "epoch": 2389} {"train_loss": -24.420263290405273, "global_step": 198340, "epoch": 2389} {"train_loss": -24.278379440307617, "global_step": 198341, "epoch": 2389} {"train_loss": -24.409912109375, "global_step": 198342, "epoch": 2389} {"train_loss": -24.4700984954834, "global_step": 198343, "epoch": 2389} {"train_loss": -24.08133888244629, "global_step": 198344, "epoch": 2389} {"train_loss": -23.95993423461914, "global_step": 198345, "epoch": 2389} {"train_loss": -23.87859535217285, "global_step": 198346, "epoch": 2389} {"train_loss": -24.27695655822754, "global_step": 198347, "epoch": 2389} {"train_loss": -24.36109161376953, "global_step": 198348, "epoch": 2389} {"train_loss": -24.081424713134766, "global_step": 198349, "epoch": 2389} {"train_loss": -23.80272674560547, "global_step": 198350, "epoch": 2389} {"train_loss": -23.994794845581055, "global_step": 198351, "epoch": 2389} {"train_loss": -24.245569229125977, "global_step": 198352, "epoch": 2389} {"train_loss": -24.126310348510742, "global_step": 198353, "epoch": 2389} {"train_loss": -24.169919967651367, "global_step": 198354, "epoch": 2389} {"train_loss": -24.30853271484375, "global_step": 198355, "epoch": 2389} {"train_loss": -24.460172653198242, "global_step": 198356, "epoch": 2389} {"train_loss": -24.429716110229492, "global_step": 198357, "epoch": 2389} {"train_loss": -23.904762268066406, "global_step": 198358, "epoch": 2389} {"train_loss": -24.036386489868164, "global_step": 198359, "epoch": 2389} {"train_loss": -23.882963180541992, "global_step": 198360, "epoch": 2389} {"train_loss": -24.18532371520996, "global_step": 198361, "epoch": 2389} {"train_loss": -24.118026733398438, "global_step": 198362, "epoch": 2389} {"train_loss": -24.51283073425293, "global_step": 198363, "epoch": 2389} {"train_loss": -24.800790786743164, "global_step": 198364, "epoch": 2389} {"train_loss": -24.40425682067871, "global_step": 198365, "epoch": 2389} {"train_loss": -24.445104598999023, "global_step": 198366, "epoch": 2389} {"train_loss": -24.241668701171875, "global_step": 198367, "epoch": 2389} {"train_loss": -24.390012741088867, "global_step": 198368, "epoch": 2389} {"train_loss": -24.179631980068713, "global_step": 198369, "epoch": 2389, "val_loss": 6641358.0} {"train_loss": -23.851341247558594, "global_step": 198370, "epoch": 2390} {"train_loss": -23.94428062438965, "global_step": 198371, "epoch": 2390} {"train_loss": -23.667753219604492, "global_step": 198372, "epoch": 2390} {"train_loss": -23.735605239868164, "global_step": 198373, "epoch": 2390} {"train_loss": -23.87483787536621, "global_step": 198374, "epoch": 2390} {"train_loss": -23.74582862854004, "global_step": 198375, "epoch": 2390} {"train_loss": -23.94875144958496, "global_step": 198376, "epoch": 2390} {"train_loss": -23.506561279296875, "global_step": 198377, "epoch": 2390} {"train_loss": -23.72352409362793, "global_step": 198378, "epoch": 2390} {"train_loss": -24.09256935119629, "global_step": 198379, "epoch": 2390} {"train_loss": -23.820011138916016, "global_step": 198380, "epoch": 2390} {"train_loss": -24.21253776550293, "global_step": 198381, "epoch": 2390} {"train_loss": -23.54119300842285, "global_step": 198382, "epoch": 2390} {"train_loss": -23.906293869018555, "global_step": 198383, "epoch": 2390} {"train_loss": -23.803747177124023, "global_step": 198384, "epoch": 2390} {"train_loss": -24.043304443359375, "global_step": 198385, "epoch": 2390} {"train_loss": -23.63372230529785, "global_step": 198386, "epoch": 2390} {"train_loss": -23.923908233642578, "global_step": 198387, "epoch": 2390} {"train_loss": -24.01789093017578, "global_step": 198388, "epoch": 2390} {"train_loss": -24.242074966430664, "global_step": 198389, "epoch": 2390} {"train_loss": -23.88871192932129, "global_step": 198390, "epoch": 2390} {"train_loss": -23.940156936645508, "global_step": 198391, "epoch": 2390} {"train_loss": -23.948537826538086, "global_step": 198392, "epoch": 2390} {"train_loss": -24.041309356689453, "global_step": 198393, "epoch": 2390} {"train_loss": -24.385522842407227, "global_step": 198394, "epoch": 2390} {"train_loss": -24.43100929260254, "global_step": 198395, "epoch": 2390} {"train_loss": -24.09720230102539, "global_step": 198396, "epoch": 2390} {"train_loss": -24.029006958007812, "global_step": 198397, "epoch": 2390} {"train_loss": -24.358060836791992, "global_step": 198398, "epoch": 2390} {"train_loss": -24.547754287719727, "global_step": 198399, "epoch": 2390} {"train_loss": -24.620059967041016, "global_step": 198400, "epoch": 2390} {"train_loss": -24.313886642456055, "global_step": 198401, "epoch": 2390} {"train_loss": -24.04136085510254, "global_step": 198402, "epoch": 2390} {"train_loss": -24.326923370361328, "global_step": 198403, "epoch": 2390} {"train_loss": -24.03989028930664, "global_step": 198404, "epoch": 2390} {"train_loss": -24.24196434020996, "global_step": 198405, "epoch": 2390} {"train_loss": -24.504663467407227, "global_step": 198406, "epoch": 2390} {"train_loss": -24.263620376586914, "global_step": 198407, "epoch": 2390} {"train_loss": -24.208898544311523, "global_step": 198408, "epoch": 2390} {"train_loss": -24.427061080932617, "global_step": 198409, "epoch": 2390} {"train_loss": -24.269948959350586, "global_step": 198410, "epoch": 2390} {"train_loss": -24.352895736694336, "global_step": 198411, "epoch": 2390} {"train_loss": -24.532089233398438, "global_step": 198412, "epoch": 2390} {"train_loss": -24.14817237854004, "global_step": 198413, "epoch": 2390} {"train_loss": -23.931276321411133, "global_step": 198414, "epoch": 2390} {"train_loss": -24.590423583984375, "global_step": 198415, "epoch": 2390} {"train_loss": -24.02372169494629, "global_step": 198416, "epoch": 2390} {"train_loss": -24.37114906311035, "global_step": 198417, "epoch": 2390} {"train_loss": -24.194705963134766, "global_step": 198418, "epoch": 2390} {"train_loss": -24.199115753173828, "global_step": 198419, "epoch": 2390} {"train_loss": -23.95583152770996, "global_step": 198420, "epoch": 2390} {"train_loss": -24.391040802001953, "global_step": 198421, "epoch": 2390} {"train_loss": -24.7554931640625, "global_step": 198422, "epoch": 2390} {"train_loss": -24.340002059936523, "global_step": 198423, "epoch": 2390} {"train_loss": -24.24907875061035, "global_step": 198424, "epoch": 2390} {"train_loss": -24.692983627319336, "global_step": 198425, "epoch": 2390} {"train_loss": -24.3614501953125, "global_step": 198426, "epoch": 2390} {"train_loss": -24.2376766204834, "global_step": 198427, "epoch": 2390} {"train_loss": -24.276350021362305, "global_step": 198428, "epoch": 2390} {"train_loss": -24.05793571472168, "global_step": 198429, "epoch": 2390} {"train_loss": -24.161739349365234, "global_step": 198430, "epoch": 2390} {"train_loss": -24.458158493041992, "global_step": 198431, "epoch": 2390} {"train_loss": -24.46327781677246, "global_step": 198432, "epoch": 2390} {"train_loss": -24.284194946289062, "global_step": 198433, "epoch": 2390} {"train_loss": -24.158180236816406, "global_step": 198434, "epoch": 2390} {"train_loss": -24.14734649658203, "global_step": 198435, "epoch": 2390} {"train_loss": -24.2435302734375, "global_step": 198436, "epoch": 2390} {"train_loss": -24.027692794799805, "global_step": 198437, "epoch": 2390} {"train_loss": -24.008024215698242, "global_step": 198438, "epoch": 2390} {"train_loss": -24.10529136657715, "global_step": 198439, "epoch": 2390} {"train_loss": -24.091833114624023, "global_step": 198440, "epoch": 2390} {"train_loss": -24.246753692626953, "global_step": 198441, "epoch": 2390} {"train_loss": -24.349233627319336, "global_step": 198442, "epoch": 2390} {"train_loss": -24.5022029876709, "global_step": 198443, "epoch": 2390} {"train_loss": -24.089460372924805, "global_step": 198444, "epoch": 2390} {"train_loss": -24.030973434448242, "global_step": 198445, "epoch": 2390} {"train_loss": -24.23396873474121, "global_step": 198446, "epoch": 2390} {"train_loss": -24.2027530670166, "global_step": 198447, "epoch": 2390} {"train_loss": -24.56669807434082, "global_step": 198448, "epoch": 2390} {"train_loss": -24.26261329650879, "global_step": 198449, "epoch": 2390} {"train_loss": -24.167570114135742, "global_step": 198450, "epoch": 2390} {"train_loss": -24.42278289794922, "global_step": 198451, "epoch": 2390} {"train_loss": -24.15765346389219, "global_step": 198452, "epoch": 2390, "val_loss": 6553280.0} {"train_loss": -24.122928619384766, "global_step": 198453, "epoch": 2391} {"train_loss": -23.863258361816406, "global_step": 198454, "epoch": 2391} {"train_loss": -24.39576530456543, "global_step": 198455, "epoch": 2391} {"train_loss": -23.7512149810791, "global_step": 198456, "epoch": 2391} {"train_loss": -24.102888107299805, "global_step": 198457, "epoch": 2391} {"train_loss": -23.93105125427246, "global_step": 198458, "epoch": 2391} {"train_loss": -23.715965270996094, "global_step": 198459, "epoch": 2391} {"train_loss": -23.794328689575195, "global_step": 198460, "epoch": 2391} {"train_loss": -23.834819793701172, "global_step": 198461, "epoch": 2391} {"train_loss": -24.120241165161133, "global_step": 198462, "epoch": 2391} {"train_loss": -24.18403434753418, "global_step": 198463, "epoch": 2391} {"train_loss": -23.99091911315918, "global_step": 198464, "epoch": 2391} {"train_loss": -23.763980865478516, "global_step": 198465, "epoch": 2391} {"train_loss": -24.44484519958496, "global_step": 198466, "epoch": 2391} {"train_loss": -24.2337589263916, "global_step": 198467, "epoch": 2391} {"train_loss": -23.89474868774414, "global_step": 198468, "epoch": 2391} {"train_loss": -24.402280807495117, "global_step": 198469, "epoch": 2391} {"train_loss": -24.36787986755371, "global_step": 198470, "epoch": 2391} {"train_loss": -24.050390243530273, "global_step": 198471, "epoch": 2391} {"train_loss": -23.992080688476562, "global_step": 198472, "epoch": 2391} {"train_loss": -24.135671615600586, "global_step": 198473, "epoch": 2391} {"train_loss": -24.458797454833984, "global_step": 198474, "epoch": 2391} {"train_loss": -24.284250259399414, "global_step": 198475, "epoch": 2391} {"train_loss": -24.293537139892578, "global_step": 198476, "epoch": 2391} {"train_loss": -24.121509552001953, "global_step": 198477, "epoch": 2391} {"train_loss": -24.209583282470703, "global_step": 198478, "epoch": 2391} {"train_loss": -24.514921188354492, "global_step": 198479, "epoch": 2391} {"train_loss": -24.508638381958008, "global_step": 198480, "epoch": 2391} {"train_loss": -24.33601951599121, "global_step": 198481, "epoch": 2391} {"train_loss": -24.268817901611328, "global_step": 198482, "epoch": 2391} {"train_loss": -24.695058822631836, "global_step": 198483, "epoch": 2391} {"train_loss": -24.26161003112793, "global_step": 198484, "epoch": 2391} {"train_loss": -24.238365173339844, "global_step": 198485, "epoch": 2391} {"train_loss": -23.911575317382812, "global_step": 198486, "epoch": 2391} {"train_loss": -24.233121871948242, "global_step": 198487, "epoch": 2391} {"train_loss": -24.329030990600586, "global_step": 198488, "epoch": 2391} {"train_loss": -24.06821060180664, "global_step": 198489, "epoch": 2391} {"train_loss": -24.476404190063477, "global_step": 198490, "epoch": 2391} {"train_loss": -24.66228485107422, "global_step": 198491, "epoch": 2391} {"train_loss": -24.52377700805664, "global_step": 198492, "epoch": 2391} {"train_loss": -24.713891983032227, "global_step": 198493, "epoch": 2391} {"train_loss": -24.33338737487793, "global_step": 198494, "epoch": 2391} {"train_loss": -24.635549545288086, "global_step": 198495, "epoch": 2391} {"train_loss": -24.455535888671875, "global_step": 198496, "epoch": 2391} {"train_loss": -24.518701553344727, "global_step": 198497, "epoch": 2391} {"train_loss": -24.28934669494629, "global_step": 198498, "epoch": 2391} {"train_loss": -24.308218002319336, "global_step": 198499, "epoch": 2391} {"train_loss": -24.216901779174805, "global_step": 198500, "epoch": 2391} {"train_loss": -24.258991241455078, "global_step": 198501, "epoch": 2391} {"train_loss": -24.527013778686523, "global_step": 198502, "epoch": 2391} {"train_loss": -24.292295455932617, "global_step": 198503, "epoch": 2391} {"train_loss": -24.70749855041504, "global_step": 198504, "epoch": 2391} {"train_loss": -24.264892578125, "global_step": 198505, "epoch": 2391} {"train_loss": -24.105527877807617, "global_step": 198506, "epoch": 2391} {"train_loss": -23.847482681274414, "global_step": 198507, "epoch": 2391} {"train_loss": -24.097803115844727, "global_step": 198508, "epoch": 2391} {"train_loss": -24.02422523498535, "global_step": 198509, "epoch": 2391} {"train_loss": -23.718090057373047, "global_step": 198510, "epoch": 2391} {"train_loss": -23.388547897338867, "global_step": 198511, "epoch": 2391} {"train_loss": -23.67190933227539, "global_step": 198512, "epoch": 2391} {"train_loss": -23.963380813598633, "global_step": 198513, "epoch": 2391} {"train_loss": -24.073974609375, "global_step": 198514, "epoch": 2391} {"train_loss": -23.58734703063965, "global_step": 198515, "epoch": 2391} {"train_loss": -24.04770851135254, "global_step": 198516, "epoch": 2391} {"train_loss": -24.34765625, "global_step": 198517, "epoch": 2391} {"train_loss": -24.063522338867188, "global_step": 198518, "epoch": 2391} {"train_loss": -23.87101173400879, "global_step": 198519, "epoch": 2391} {"train_loss": -24.333860397338867, "global_step": 198520, "epoch": 2391} {"train_loss": -23.987009048461914, "global_step": 198521, "epoch": 2391} {"train_loss": -23.961442947387695, "global_step": 198522, "epoch": 2391} {"train_loss": -24.013227462768555, "global_step": 198523, "epoch": 2391} {"train_loss": -24.35968589782715, "global_step": 198524, "epoch": 2391} {"train_loss": -23.85456657409668, "global_step": 198525, "epoch": 2391} {"train_loss": -24.32122039794922, "global_step": 198526, "epoch": 2391} {"train_loss": -24.081439971923828, "global_step": 198527, "epoch": 2391} {"train_loss": -23.758285522460938, "global_step": 198528, "epoch": 2391} {"train_loss": -24.116260528564453, "global_step": 198529, "epoch": 2391} {"train_loss": -24.386857986450195, "global_step": 198530, "epoch": 2391} {"train_loss": -24.31186866760254, "global_step": 198531, "epoch": 2391} {"train_loss": -24.283960342407227, "global_step": 198532, "epoch": 2391} {"train_loss": -24.08258628845215, "global_step": 198533, "epoch": 2391} {"train_loss": -24.554901123046875, "global_step": 198534, "epoch": 2391} {"train_loss": -24.16645050048828, "global_step": 198535, "epoch": 2391, "val_loss": 6423997.0} {"train_loss": -24.230512619018555, "global_step": 198536, "epoch": 2392} {"train_loss": -24.33046531677246, "global_step": 198537, "epoch": 2392} {"train_loss": -24.30605125427246, "global_step": 198538, "epoch": 2392} {"train_loss": -23.664756774902344, "global_step": 198539, "epoch": 2392} {"train_loss": -24.267820358276367, "global_step": 198540, "epoch": 2392} {"train_loss": -23.70725440979004, "global_step": 198541, "epoch": 2392} {"train_loss": -23.90069580078125, "global_step": 198542, "epoch": 2392} {"train_loss": -24.129880905151367, "global_step": 198543, "epoch": 2392} {"train_loss": -24.402496337890625, "global_step": 198544, "epoch": 2392} {"train_loss": -24.02703285217285, "global_step": 198545, "epoch": 2392} {"train_loss": -23.95411491394043, "global_step": 198546, "epoch": 2392} {"train_loss": -24.384517669677734, "global_step": 198547, "epoch": 2392} {"train_loss": -24.032737731933594, "global_step": 198548, "epoch": 2392} {"train_loss": -24.357749938964844, "global_step": 198549, "epoch": 2392} {"train_loss": -24.255353927612305, "global_step": 198550, "epoch": 2392} {"train_loss": -24.180463790893555, "global_step": 198551, "epoch": 2392} {"train_loss": -24.482778549194336, "global_step": 198552, "epoch": 2392} {"train_loss": -24.044095993041992, "global_step": 198553, "epoch": 2392} {"train_loss": -24.202045440673828, "global_step": 198554, "epoch": 2392} {"train_loss": -24.3665828704834, "global_step": 198555, "epoch": 2392} {"train_loss": -24.493932723999023, "global_step": 198556, "epoch": 2392} {"train_loss": -24.05120086669922, "global_step": 198557, "epoch": 2392} {"train_loss": -24.53607749938965, "global_step": 198558, "epoch": 2392} {"train_loss": -24.360525131225586, "global_step": 198559, "epoch": 2392} {"train_loss": -24.42922019958496, "global_step": 198560, "epoch": 2392} {"train_loss": -24.261886596679688, "global_step": 198561, "epoch": 2392} {"train_loss": -23.801502227783203, "global_step": 198562, "epoch": 2392} {"train_loss": -23.883995056152344, "global_step": 198563, "epoch": 2392} {"train_loss": -24.38144874572754, "global_step": 198564, "epoch": 2392} {"train_loss": -24.600976943969727, "global_step": 198565, "epoch": 2392} {"train_loss": -24.37099838256836, "global_step": 198566, "epoch": 2392} {"train_loss": -23.982839584350586, "global_step": 198567, "epoch": 2392} {"train_loss": -24.35846519470215, "global_step": 198568, "epoch": 2392} {"train_loss": -23.847761154174805, "global_step": 198569, "epoch": 2392} {"train_loss": -24.78257179260254, "global_step": 198570, "epoch": 2392} {"train_loss": -23.82691764831543, "global_step": 198571, "epoch": 2392} {"train_loss": -24.388334274291992, "global_step": 198572, "epoch": 2392} {"train_loss": -23.92698860168457, "global_step": 198573, "epoch": 2392} {"train_loss": -24.464887619018555, "global_step": 198574, "epoch": 2392} {"train_loss": -24.123838424682617, "global_step": 198575, "epoch": 2392} {"train_loss": -24.19430160522461, "global_step": 198576, "epoch": 2392} {"train_loss": -24.34926986694336, "global_step": 198577, "epoch": 2392} {"train_loss": -24.25556755065918, "global_step": 198578, "epoch": 2392} {"train_loss": -24.055538177490234, "global_step": 198579, "epoch": 2392} {"train_loss": -24.211978912353516, "global_step": 198580, "epoch": 2392} {"train_loss": -24.444931030273438, "global_step": 198581, "epoch": 2392} {"train_loss": -24.055715560913086, "global_step": 198582, "epoch": 2392} {"train_loss": -24.24122428894043, "global_step": 198583, "epoch": 2392} {"train_loss": -24.30338478088379, "global_step": 198584, "epoch": 2392} {"train_loss": -24.248178482055664, "global_step": 198585, "epoch": 2392} {"train_loss": -24.093088150024414, "global_step": 198586, "epoch": 2392} {"train_loss": -24.569028854370117, "global_step": 198587, "epoch": 2392} {"train_loss": -24.27246856689453, "global_step": 198588, "epoch": 2392} {"train_loss": -24.375364303588867, "global_step": 198589, "epoch": 2392} {"train_loss": -24.255796432495117, "global_step": 198590, "epoch": 2392} {"train_loss": -24.212560653686523, "global_step": 198591, "epoch": 2392} {"train_loss": -24.34097671508789, "global_step": 198592, "epoch": 2392} {"train_loss": -23.985837936401367, "global_step": 198593, "epoch": 2392} {"train_loss": -24.015472412109375, "global_step": 198594, "epoch": 2392} {"train_loss": -24.114946365356445, "global_step": 198595, "epoch": 2392} {"train_loss": -24.280105590820312, "global_step": 198596, "epoch": 2392} {"train_loss": -24.275562286376953, "global_step": 198597, "epoch": 2392} {"train_loss": -24.21639633178711, "global_step": 198598, "epoch": 2392} {"train_loss": -24.222339630126953, "global_step": 198599, "epoch": 2392} {"train_loss": -24.003324508666992, "global_step": 198600, "epoch": 2392} {"train_loss": -24.323610305786133, "global_step": 198601, "epoch": 2392} {"train_loss": -24.630672454833984, "global_step": 198602, "epoch": 2392} {"train_loss": -24.022680282592773, "global_step": 198603, "epoch": 2392} {"train_loss": -24.404306411743164, "global_step": 198604, "epoch": 2392} {"train_loss": -24.128515243530273, "global_step": 198605, "epoch": 2392} {"train_loss": -24.35529136657715, "global_step": 198606, "epoch": 2392} {"train_loss": -23.902236938476562, "global_step": 198607, "epoch": 2392} {"train_loss": -24.070022583007812, "global_step": 198608, "epoch": 2392} {"train_loss": -24.59004783630371, "global_step": 198609, "epoch": 2392} {"train_loss": -24.068744659423828, "global_step": 198610, "epoch": 2392} {"train_loss": -24.452285766601562, "global_step": 198611, "epoch": 2392} {"train_loss": -24.2402400970459, "global_step": 198612, "epoch": 2392} {"train_loss": -24.213804244995117, "global_step": 198613, "epoch": 2392} {"train_loss": -24.191808700561523, "global_step": 198614, "epoch": 2392} {"train_loss": -24.265666961669922, "global_step": 198615, "epoch": 2392} {"train_loss": -24.015981674194336, "global_step": 198616, "epoch": 2392} {"train_loss": -24.401700973510742, "global_step": 198617, "epoch": 2392} {"train_loss": -24.22984091057835, "global_step": 198618, "epoch": 2392, "val_loss": 6647691.5} {"train_loss": -24.04559326171875, "global_step": 198619, "epoch": 2393} {"train_loss": -23.617822647094727, "global_step": 198620, "epoch": 2393} {"train_loss": -23.769025802612305, "global_step": 198621, "epoch": 2393} {"train_loss": -23.94061851501465, "global_step": 198622, "epoch": 2393} {"train_loss": -24.12580680847168, "global_step": 198623, "epoch": 2393} {"train_loss": -24.001922607421875, "global_step": 198624, "epoch": 2393} {"train_loss": -24.291425704956055, "global_step": 198625, "epoch": 2393} {"train_loss": -23.969619750976562, "global_step": 198626, "epoch": 2393} {"train_loss": -24.221389770507812, "global_step": 198627, "epoch": 2393} {"train_loss": -23.659732818603516, "global_step": 198628, "epoch": 2393} {"train_loss": -24.34522819519043, "global_step": 198629, "epoch": 2393} {"train_loss": -23.667728424072266, "global_step": 198630, "epoch": 2393} {"train_loss": -23.664653778076172, "global_step": 198631, "epoch": 2393} {"train_loss": -23.806772232055664, "global_step": 198632, "epoch": 2393} {"train_loss": -24.185531616210938, "global_step": 198633, "epoch": 2393} {"train_loss": -24.274606704711914, "global_step": 198634, "epoch": 2393} {"train_loss": -23.886816024780273, "global_step": 198635, "epoch": 2393} {"train_loss": -24.03151512145996, "global_step": 198636, "epoch": 2393} {"train_loss": -24.06978416442871, "global_step": 198637, "epoch": 2393} {"train_loss": -24.33075714111328, "global_step": 198638, "epoch": 2393} {"train_loss": -24.332345962524414, "global_step": 198639, "epoch": 2393} {"train_loss": -23.782678604125977, "global_step": 198640, "epoch": 2393} {"train_loss": -24.265365600585938, "global_step": 198641, "epoch": 2393} {"train_loss": -24.251501083374023, "global_step": 198642, "epoch": 2393} {"train_loss": -24.06691551208496, "global_step": 198643, "epoch": 2393} {"train_loss": -24.154747009277344, "global_step": 198644, "epoch": 2393} {"train_loss": -24.199094772338867, "global_step": 198645, "epoch": 2393} {"train_loss": -24.011341094970703, "global_step": 198646, "epoch": 2393} {"train_loss": -24.42557144165039, "global_step": 198647, "epoch": 2393} {"train_loss": -24.50218963623047, "global_step": 198648, "epoch": 2393} {"train_loss": -23.924514770507812, "global_step": 198649, "epoch": 2393} {"train_loss": -24.111967086791992, "global_step": 198650, "epoch": 2393} {"train_loss": -24.165435791015625, "global_step": 198651, "epoch": 2393} {"train_loss": -23.671878814697266, "global_step": 198652, "epoch": 2393} {"train_loss": -24.45026969909668, "global_step": 198653, "epoch": 2393} {"train_loss": -24.065397262573242, "global_step": 198654, "epoch": 2393} {"train_loss": -24.183353424072266, "global_step": 198655, "epoch": 2393} {"train_loss": -24.272602081298828, "global_step": 198656, "epoch": 2393} {"train_loss": -24.85274314880371, "global_step": 198657, "epoch": 2393} {"train_loss": -23.982398986816406, "global_step": 198658, "epoch": 2393} {"train_loss": -24.427688598632812, "global_step": 198659, "epoch": 2393} {"train_loss": -24.01296043395996, "global_step": 198660, "epoch": 2393} {"train_loss": -24.517353057861328, "global_step": 198661, "epoch": 2393} {"train_loss": -24.212894439697266, "global_step": 198662, "epoch": 2393} {"train_loss": -23.874168395996094, "global_step": 198663, "epoch": 2393} {"train_loss": -24.604740142822266, "global_step": 198664, "epoch": 2393} {"train_loss": -24.2474308013916, "global_step": 198665, "epoch": 2393} {"train_loss": -24.63188362121582, "global_step": 198666, "epoch": 2393} {"train_loss": -24.228139877319336, "global_step": 198667, "epoch": 2393} {"train_loss": -24.175580978393555, "global_step": 198668, "epoch": 2393} {"train_loss": -24.325143814086914, "global_step": 198669, "epoch": 2393} {"train_loss": -24.039892196655273, "global_step": 198670, "epoch": 2393} {"train_loss": -24.55143165588379, "global_step": 198671, "epoch": 2393} {"train_loss": -23.781801223754883, "global_step": 198672, "epoch": 2393} {"train_loss": -23.978866577148438, "global_step": 198673, "epoch": 2393} {"train_loss": -24.29910659790039, "global_step": 198674, "epoch": 2393} {"train_loss": -24.26151466369629, "global_step": 198675, "epoch": 2393} {"train_loss": -24.273178100585938, "global_step": 198676, "epoch": 2393} {"train_loss": -24.5007381439209, "global_step": 198677, "epoch": 2393} {"train_loss": -24.404325485229492, "global_step": 198678, "epoch": 2393} {"train_loss": -23.766128540039062, "global_step": 198679, "epoch": 2393} {"train_loss": -24.678363800048828, "global_step": 198680, "epoch": 2393} {"train_loss": -24.21458625793457, "global_step": 198681, "epoch": 2393} {"train_loss": -24.166574478149414, "global_step": 198682, "epoch": 2393} {"train_loss": -24.10304832458496, "global_step": 198683, "epoch": 2393} {"train_loss": -24.279483795166016, "global_step": 198684, "epoch": 2393} {"train_loss": -24.1458740234375, "global_step": 198685, "epoch": 2393} {"train_loss": -23.9454288482666, "global_step": 198686, "epoch": 2393} {"train_loss": -24.132795333862305, "global_step": 198687, "epoch": 2393} {"train_loss": -24.21916961669922, "global_step": 198688, "epoch": 2393} {"train_loss": -24.648698806762695, "global_step": 198689, "epoch": 2393} {"train_loss": -24.494075775146484, "global_step": 198690, "epoch": 2393} {"train_loss": -24.02509117126465, "global_step": 198691, "epoch": 2393} {"train_loss": -24.07801628112793, "global_step": 198692, "epoch": 2393} {"train_loss": -24.4161376953125, "global_step": 198693, "epoch": 2393} {"train_loss": -24.330001831054688, "global_step": 198694, "epoch": 2393} {"train_loss": -24.278867721557617, "global_step": 198695, "epoch": 2393} {"train_loss": -24.16605567932129, "global_step": 198696, "epoch": 2393} {"train_loss": -24.621715545654297, "global_step": 198697, "epoch": 2393} {"train_loss": -24.260208129882812, "global_step": 198698, "epoch": 2393} {"train_loss": -23.996912002563477, "global_step": 198699, "epoch": 2393} {"train_loss": -24.241985321044922, "global_step": 198700, "epoch": 2393} {"train_loss": -24.155340746224645, "global_step": 198701, "epoch": 2393, "val_loss": 6626272.0} {"train_loss": -23.672792434692383, "global_step": 198702, "epoch": 2394} {"train_loss": -23.361997604370117, "global_step": 198703, "epoch": 2394} {"train_loss": -23.871061325073242, "global_step": 198704, "epoch": 2394} {"train_loss": -23.73072624206543, "global_step": 198705, "epoch": 2394} {"train_loss": -24.3365535736084, "global_step": 198706, "epoch": 2394} {"train_loss": -24.13167381286621, "global_step": 198707, "epoch": 2394} {"train_loss": -23.852920532226562, "global_step": 198708, "epoch": 2394} {"train_loss": -24.143918991088867, "global_step": 198709, "epoch": 2394} {"train_loss": -24.14161491394043, "global_step": 198710, "epoch": 2394} {"train_loss": -23.999536514282227, "global_step": 198711, "epoch": 2394} {"train_loss": -23.884611129760742, "global_step": 198712, "epoch": 2394} {"train_loss": -24.196853637695312, "global_step": 198713, "epoch": 2394} {"train_loss": -23.875959396362305, "global_step": 198714, "epoch": 2394} {"train_loss": -24.14844512939453, "global_step": 198715, "epoch": 2394} {"train_loss": -23.963314056396484, "global_step": 198716, "epoch": 2394} {"train_loss": -23.685949325561523, "global_step": 198717, "epoch": 2394} {"train_loss": -23.931060791015625, "global_step": 198718, "epoch": 2394} {"train_loss": -23.931522369384766, "global_step": 198719, "epoch": 2394} {"train_loss": -23.943607330322266, "global_step": 198720, "epoch": 2394} {"train_loss": -24.092370986938477, "global_step": 198721, "epoch": 2394} {"train_loss": -24.255849838256836, "global_step": 198722, "epoch": 2394} {"train_loss": -24.48777198791504, "global_step": 198723, "epoch": 2394} {"train_loss": -24.020681381225586, "global_step": 198724, "epoch": 2394} {"train_loss": -24.290616989135742, "global_step": 198725, "epoch": 2394} {"train_loss": -24.220687866210938, "global_step": 198726, "epoch": 2394} {"train_loss": -23.910572052001953, "global_step": 198727, "epoch": 2394} {"train_loss": -24.009418487548828, "global_step": 198728, "epoch": 2394} {"train_loss": -24.019062042236328, "global_step": 198729, "epoch": 2394} {"train_loss": -24.64225196838379, "global_step": 198730, "epoch": 2394} {"train_loss": -24.074132919311523, "global_step": 198731, "epoch": 2394} {"train_loss": -24.410337448120117, "global_step": 198732, "epoch": 2394} {"train_loss": -24.37572479248047, "global_step": 198733, "epoch": 2394} {"train_loss": -24.350500106811523, "global_step": 198734, "epoch": 2394} {"train_loss": -24.34820556640625, "global_step": 198735, "epoch": 2394} {"train_loss": -24.0892391204834, "global_step": 198736, "epoch": 2394} {"train_loss": -24.135526657104492, "global_step": 198737, "epoch": 2394} {"train_loss": -23.93800163269043, "global_step": 198738, "epoch": 2394} {"train_loss": -24.203205108642578, "global_step": 198739, "epoch": 2394} {"train_loss": -24.346729278564453, "global_step": 198740, "epoch": 2394} {"train_loss": -24.166919708251953, "global_step": 198741, "epoch": 2394} {"train_loss": -23.95939826965332, "global_step": 198742, "epoch": 2394} {"train_loss": -24.232519149780273, "global_step": 198743, "epoch": 2394} {"train_loss": -24.399511337280273, "global_step": 198744, "epoch": 2394} {"train_loss": -24.22663116455078, "global_step": 198745, "epoch": 2394} {"train_loss": -24.624557495117188, "global_step": 198746, "epoch": 2394} {"train_loss": -24.489912033081055, "global_step": 198747, "epoch": 2394} {"train_loss": -23.959827423095703, "global_step": 198748, "epoch": 2394} {"train_loss": -24.189468383789062, "global_step": 198749, "epoch": 2394} {"train_loss": -24.294281005859375, "global_step": 198750, "epoch": 2394} {"train_loss": -24.19391441345215, "global_step": 198751, "epoch": 2394} {"train_loss": -24.373579025268555, "global_step": 198752, "epoch": 2394} {"train_loss": -24.1898136138916, "global_step": 198753, "epoch": 2394} {"train_loss": -24.28751564025879, "global_step": 198754, "epoch": 2394} {"train_loss": -24.436767578125, "global_step": 198755, "epoch": 2394} {"train_loss": -24.151443481445312, "global_step": 198756, "epoch": 2394} {"train_loss": -24.25440788269043, "global_step": 198757, "epoch": 2394} {"train_loss": -24.3067684173584, "global_step": 198758, "epoch": 2394} {"train_loss": -24.52610206604004, "global_step": 198759, "epoch": 2394} {"train_loss": -24.041034698486328, "global_step": 198760, "epoch": 2394} {"train_loss": -24.280261993408203, "global_step": 198761, "epoch": 2394} {"train_loss": -24.294355392456055, "global_step": 198762, "epoch": 2394} {"train_loss": -24.70502281188965, "global_step": 198763, "epoch": 2394} {"train_loss": -24.594497680664062, "global_step": 198764, "epoch": 2394} {"train_loss": -24.850296020507812, "global_step": 198765, "epoch": 2394} {"train_loss": -24.2923526763916, "global_step": 198766, "epoch": 2394} {"train_loss": -24.637025833129883, "global_step": 198767, "epoch": 2394} {"train_loss": -24.6929931640625, "global_step": 198768, "epoch": 2394} {"train_loss": -24.421289443969727, "global_step": 198769, "epoch": 2394} {"train_loss": -24.455795288085938, "global_step": 198770, "epoch": 2394} {"train_loss": -24.11680030822754, "global_step": 198771, "epoch": 2394} {"train_loss": -24.470699310302734, "global_step": 198772, "epoch": 2394} {"train_loss": -24.2285213470459, "global_step": 198773, "epoch": 2394} {"train_loss": -24.10637855529785, "global_step": 198774, "epoch": 2394} {"train_loss": -24.24468994140625, "global_step": 198775, "epoch": 2394} {"train_loss": -24.418615341186523, "global_step": 198776, "epoch": 2394} {"train_loss": -24.17555809020996, "global_step": 198777, "epoch": 2394} {"train_loss": -23.893510818481445, "global_step": 198778, "epoch": 2394} {"train_loss": -24.374820709228516, "global_step": 198779, "epoch": 2394} {"train_loss": -24.035964965820312, "global_step": 198780, "epoch": 2394} {"train_loss": -24.603158950805664, "global_step": 198781, "epoch": 2394} {"train_loss": -24.37368392944336, "global_step": 198782, "epoch": 2394} {"train_loss": -24.297260284423828, "global_step": 198783, "epoch": 2394} {"train_loss": -24.19000170604292, "global_step": 198784, "epoch": 2394, "val_loss": 6575520.5} {"train_loss": -23.150461196899414, "global_step": 198785, "epoch": 2395} {"train_loss": -22.214618682861328, "global_step": 198786, "epoch": 2395} {"train_loss": -23.123355865478516, "global_step": 198787, "epoch": 2395} {"train_loss": -22.731733322143555, "global_step": 198788, "epoch": 2395} {"train_loss": -22.319656372070312, "global_step": 198789, "epoch": 2395} {"train_loss": -22.644561767578125, "global_step": 198790, "epoch": 2395} {"train_loss": -23.19374656677246, "global_step": 198791, "epoch": 2395} {"train_loss": -22.97498893737793, "global_step": 198792, "epoch": 2395} {"train_loss": -23.119619369506836, "global_step": 198793, "epoch": 2395} {"train_loss": -23.238332748413086, "global_step": 198794, "epoch": 2395} {"train_loss": -23.455127716064453, "global_step": 198795, "epoch": 2395} {"train_loss": -23.36838150024414, "global_step": 198796, "epoch": 2395} {"train_loss": -23.281757354736328, "global_step": 198797, "epoch": 2395} {"train_loss": -23.051280975341797, "global_step": 198798, "epoch": 2395} {"train_loss": -23.27000617980957, "global_step": 198799, "epoch": 2395} {"train_loss": -23.566211700439453, "global_step": 198800, "epoch": 2395} {"train_loss": -23.456592559814453, "global_step": 198801, "epoch": 2395} {"train_loss": -23.964384078979492, "global_step": 198802, "epoch": 2395} {"train_loss": -23.73975372314453, "global_step": 198803, "epoch": 2395} {"train_loss": -23.753416061401367, "global_step": 198804, "epoch": 2395} {"train_loss": -23.8172664642334, "global_step": 198805, "epoch": 2395} {"train_loss": -23.7023868560791, "global_step": 198806, "epoch": 2395} {"train_loss": -23.732702255249023, "global_step": 198807, "epoch": 2395} {"train_loss": -23.321636199951172, "global_step": 198808, "epoch": 2395} {"train_loss": -23.790771484375, "global_step": 198809, "epoch": 2395} {"train_loss": -23.739091873168945, "global_step": 198810, "epoch": 2395} {"train_loss": -23.716360092163086, "global_step": 198811, "epoch": 2395} {"train_loss": -23.79874038696289, "global_step": 198812, "epoch": 2395} {"train_loss": -23.94232749938965, "global_step": 198813, "epoch": 2395} {"train_loss": -23.631622314453125, "global_step": 198814, "epoch": 2395} {"train_loss": -24.019702911376953, "global_step": 198815, "epoch": 2395} {"train_loss": -23.65056800842285, "global_step": 198816, "epoch": 2395} {"train_loss": -23.766773223876953, "global_step": 198817, "epoch": 2395} {"train_loss": -24.147552490234375, "global_step": 198818, "epoch": 2395} {"train_loss": -24.230009078979492, "global_step": 198819, "epoch": 2395} {"train_loss": -23.778440475463867, "global_step": 198820, "epoch": 2395} {"train_loss": -24.249486923217773, "global_step": 198821, "epoch": 2395} {"train_loss": -23.90105438232422, "global_step": 198822, "epoch": 2395} {"train_loss": -24.127775192260742, "global_step": 198823, "epoch": 2395} {"train_loss": -24.081932067871094, "global_step": 198824, "epoch": 2395} {"train_loss": -24.180612564086914, "global_step": 198825, "epoch": 2395} {"train_loss": -24.02294921875, "global_step": 198826, "epoch": 2395} {"train_loss": -24.01766014099121, "global_step": 198827, "epoch": 2395} {"train_loss": -24.071992874145508, "global_step": 198828, "epoch": 2395} {"train_loss": -23.787189483642578, "global_step": 198829, "epoch": 2395} {"train_loss": -24.294776916503906, "global_step": 198830, "epoch": 2395} {"train_loss": -24.22364616394043, "global_step": 198831, "epoch": 2395} {"train_loss": -24.18356704711914, "global_step": 198832, "epoch": 2395} {"train_loss": -23.949628829956055, "global_step": 198833, "epoch": 2395} {"train_loss": -23.93593978881836, "global_step": 198834, "epoch": 2395} {"train_loss": -24.237762451171875, "global_step": 198835, "epoch": 2395} {"train_loss": -24.03005027770996, "global_step": 198836, "epoch": 2395} {"train_loss": -24.46670150756836, "global_step": 198837, "epoch": 2395} {"train_loss": -24.160310745239258, "global_step": 198838, "epoch": 2395} {"train_loss": -24.109113693237305, "global_step": 198839, "epoch": 2395} {"train_loss": -24.01570701599121, "global_step": 198840, "epoch": 2395} {"train_loss": -24.576553344726562, "global_step": 198841, "epoch": 2395} {"train_loss": -24.185527801513672, "global_step": 198842, "epoch": 2395} {"train_loss": -24.169355392456055, "global_step": 198843, "epoch": 2395} {"train_loss": -23.934412002563477, "global_step": 198844, "epoch": 2395} {"train_loss": -24.320261001586914, "global_step": 198845, "epoch": 2395} {"train_loss": -24.535024642944336, "global_step": 198846, "epoch": 2395} {"train_loss": -23.754993438720703, "global_step": 198847, "epoch": 2395} {"train_loss": -24.373836517333984, "global_step": 198848, "epoch": 2395} {"train_loss": -24.26824188232422, "global_step": 198849, "epoch": 2395} {"train_loss": -23.571659088134766, "global_step": 198850, "epoch": 2395} {"train_loss": -23.983091354370117, "global_step": 198851, "epoch": 2395} {"train_loss": -24.46511459350586, "global_step": 198852, "epoch": 2395} {"train_loss": -23.999509811401367, "global_step": 198853, "epoch": 2395} {"train_loss": -24.378448486328125, "global_step": 198854, "epoch": 2395} {"train_loss": -24.31693458557129, "global_step": 198855, "epoch": 2395} {"train_loss": -24.599040985107422, "global_step": 198856, "epoch": 2395} {"train_loss": -24.3123836517334, "global_step": 198857, "epoch": 2395} {"train_loss": -24.429353713989258, "global_step": 198858, "epoch": 2395} {"train_loss": -24.646759033203125, "global_step": 198859, "epoch": 2395} {"train_loss": -24.33890151977539, "global_step": 198860, "epoch": 2395} {"train_loss": -23.95699119567871, "global_step": 198861, "epoch": 2395} {"train_loss": -24.309709548950195, "global_step": 198862, "epoch": 2395} {"train_loss": -24.365509033203125, "global_step": 198863, "epoch": 2395} {"train_loss": -24.74091148376465, "global_step": 198864, "epoch": 2395} {"train_loss": -24.333606719970703, "global_step": 198865, "epoch": 2395} {"train_loss": -23.984867095947266, "global_step": 198866, "epoch": 2395} {"train_loss": -23.88042061587414, "global_step": 198867, "epoch": 2395, "val_loss": 6525220.0} {"train_loss": -23.785005569458008, "global_step": 198868, "epoch": 2396} {"train_loss": -23.434404373168945, "global_step": 198869, "epoch": 2396} {"train_loss": -23.126331329345703, "global_step": 198870, "epoch": 2396} {"train_loss": -22.967039108276367, "global_step": 198871, "epoch": 2396} {"train_loss": -23.563232421875, "global_step": 198872, "epoch": 2396} {"train_loss": -23.578227996826172, "global_step": 198873, "epoch": 2396} {"train_loss": -23.28896141052246, "global_step": 198874, "epoch": 2396} {"train_loss": -23.304906845092773, "global_step": 198875, "epoch": 2396} {"train_loss": -23.71471405029297, "global_step": 198876, "epoch": 2396} {"train_loss": -23.17560386657715, "global_step": 198877, "epoch": 2396} {"train_loss": -23.5674991607666, "global_step": 198878, "epoch": 2396} {"train_loss": -23.81167221069336, "global_step": 198879, "epoch": 2396} {"train_loss": -23.451618194580078, "global_step": 198880, "epoch": 2396} {"train_loss": -24.08841323852539, "global_step": 198881, "epoch": 2396} {"train_loss": -23.641983032226562, "global_step": 198882, "epoch": 2396} {"train_loss": -24.003232955932617, "global_step": 198883, "epoch": 2396} {"train_loss": -23.539825439453125, "global_step": 198884, "epoch": 2396} {"train_loss": -23.911832809448242, "global_step": 198885, "epoch": 2396} {"train_loss": -23.449148178100586, "global_step": 198886, "epoch": 2396} {"train_loss": -23.996309280395508, "global_step": 198887, "epoch": 2396} {"train_loss": -23.801467895507812, "global_step": 198888, "epoch": 2396} {"train_loss": -23.654701232910156, "global_step": 198889, "epoch": 2396} {"train_loss": -23.596694946289062, "global_step": 198890, "epoch": 2396} {"train_loss": -24.301631927490234, "global_step": 198891, "epoch": 2396} {"train_loss": -24.168176651000977, "global_step": 198892, "epoch": 2396} {"train_loss": -23.81717300415039, "global_step": 198893, "epoch": 2396} {"train_loss": -24.148212432861328, "global_step": 198894, "epoch": 2396} {"train_loss": -24.041288375854492, "global_step": 198895, "epoch": 2396} {"train_loss": -24.0615234375, "global_step": 198896, "epoch": 2396} {"train_loss": -24.310758590698242, "global_step": 198897, "epoch": 2396} {"train_loss": -24.243976593017578, "global_step": 198898, "epoch": 2396} {"train_loss": -24.248544692993164, "global_step": 198899, "epoch": 2396} {"train_loss": -23.945749282836914, "global_step": 198900, "epoch": 2396} {"train_loss": -24.050870895385742, "global_step": 198901, "epoch": 2396} {"train_loss": -24.20340347290039, "global_step": 198902, "epoch": 2396} {"train_loss": -24.17245101928711, "global_step": 198903, "epoch": 2396} {"train_loss": -23.74710464477539, "global_step": 198904, "epoch": 2396} {"train_loss": -23.87188148498535, "global_step": 198905, "epoch": 2396} {"train_loss": -23.92103385925293, "global_step": 198906, "epoch": 2396} {"train_loss": -24.1041202545166, "global_step": 198907, "epoch": 2396} {"train_loss": -24.139724731445312, "global_step": 198908, "epoch": 2396} {"train_loss": -23.90576171875, "global_step": 198909, "epoch": 2396} {"train_loss": -24.48180389404297, "global_step": 198910, "epoch": 2396} {"train_loss": -23.9739990234375, "global_step": 198911, "epoch": 2396} {"train_loss": -23.873294830322266, "global_step": 198912, "epoch": 2396} {"train_loss": -24.233734130859375, "global_step": 198913, "epoch": 2396} {"train_loss": -24.352060317993164, "global_step": 198914, "epoch": 2396} {"train_loss": -24.26161766052246, "global_step": 198915, "epoch": 2396} {"train_loss": -24.189008712768555, "global_step": 198916, "epoch": 2396} {"train_loss": -23.938222885131836, "global_step": 198917, "epoch": 2396} {"train_loss": -24.433399200439453, "global_step": 198918, "epoch": 2396} {"train_loss": -23.990182876586914, "global_step": 198919, "epoch": 2396} {"train_loss": -24.354516983032227, "global_step": 198920, "epoch": 2396} {"train_loss": -24.39540672302246, "global_step": 198921, "epoch": 2396} {"train_loss": -24.142650604248047, "global_step": 198922, "epoch": 2396} {"train_loss": -24.24581527709961, "global_step": 198923, "epoch": 2396} {"train_loss": -23.99787712097168, "global_step": 198924, "epoch": 2396} {"train_loss": -23.95069694519043, "global_step": 198925, "epoch": 2396} {"train_loss": -24.501754760742188, "global_step": 198926, "epoch": 2396} {"train_loss": -24.026424407958984, "global_step": 198927, "epoch": 2396} {"train_loss": -24.337369918823242, "global_step": 198928, "epoch": 2396} {"train_loss": -24.101526260375977, "global_step": 198929, "epoch": 2396} {"train_loss": -24.35401725769043, "global_step": 198930, "epoch": 2396} {"train_loss": -24.0227108001709, "global_step": 198931, "epoch": 2396} {"train_loss": -23.87087059020996, "global_step": 198932, "epoch": 2396} {"train_loss": -24.282779693603516, "global_step": 198933, "epoch": 2396} {"train_loss": -24.546422958374023, "global_step": 198934, "epoch": 2396} {"train_loss": -24.094934463500977, "global_step": 198935, "epoch": 2396} {"train_loss": -24.519601821899414, "global_step": 198936, "epoch": 2396} {"train_loss": -24.492509841918945, "global_step": 198937, "epoch": 2396} {"train_loss": -24.60312843322754, "global_step": 198938, "epoch": 2396} {"train_loss": -24.603313446044922, "global_step": 198939, "epoch": 2396} {"train_loss": -24.158767700195312, "global_step": 198940, "epoch": 2396} {"train_loss": -24.347593307495117, "global_step": 198941, "epoch": 2396} {"train_loss": -24.62928009033203, "global_step": 198942, "epoch": 2396} {"train_loss": -24.332468032836914, "global_step": 198943, "epoch": 2396} {"train_loss": -24.529769897460938, "global_step": 198944, "epoch": 2396} {"train_loss": -24.290136337280273, "global_step": 198945, "epoch": 2396} {"train_loss": -24.14302635192871, "global_step": 198946, "epoch": 2396} {"train_loss": -24.42876625061035, "global_step": 198947, "epoch": 2396} {"train_loss": -24.26767921447754, "global_step": 198948, "epoch": 2396} {"train_loss": -24.593669891357422, "global_step": 198949, "epoch": 2396} {"train_loss": -24.03850631254265, "global_step": 198950, "epoch": 2396, "val_loss": 6580227.5} {"train_loss": -23.28583335876465, "global_step": 198951, "epoch": 2397} {"train_loss": -23.601398468017578, "global_step": 198952, "epoch": 2397} {"train_loss": -23.913362503051758, "global_step": 198953, "epoch": 2397} {"train_loss": -23.498594284057617, "global_step": 198954, "epoch": 2397} {"train_loss": -23.955078125, "global_step": 198955, "epoch": 2397} {"train_loss": -23.67946434020996, "global_step": 198956, "epoch": 2397} {"train_loss": -23.721773147583008, "global_step": 198957, "epoch": 2397} {"train_loss": -24.193801879882812, "global_step": 198958, "epoch": 2397} {"train_loss": -23.787260055541992, "global_step": 198959, "epoch": 2397} {"train_loss": -24.20376968383789, "global_step": 198960, "epoch": 2397} {"train_loss": -24.273311614990234, "global_step": 198961, "epoch": 2397} {"train_loss": -24.229022979736328, "global_step": 198962, "epoch": 2397} {"train_loss": -24.133237838745117, "global_step": 198963, "epoch": 2397} {"train_loss": -24.251516342163086, "global_step": 198964, "epoch": 2397} {"train_loss": -24.20807456970215, "global_step": 198965, "epoch": 2397} {"train_loss": -24.03900909423828, "global_step": 198966, "epoch": 2397} {"train_loss": -24.34366226196289, "global_step": 198967, "epoch": 2397} {"train_loss": -24.037338256835938, "global_step": 198968, "epoch": 2397} {"train_loss": -24.139331817626953, "global_step": 198969, "epoch": 2397} {"train_loss": -24.237119674682617, "global_step": 198970, "epoch": 2397} {"train_loss": -24.623380661010742, "global_step": 198971, "epoch": 2397} {"train_loss": -24.574718475341797, "global_step": 198972, "epoch": 2397} {"train_loss": -24.18212127685547, "global_step": 198973, "epoch": 2397} {"train_loss": -24.766250610351562, "global_step": 198974, "epoch": 2397} {"train_loss": -24.320425033569336, "global_step": 198975, "epoch": 2397} {"train_loss": -23.994321823120117, "global_step": 198976, "epoch": 2397} {"train_loss": -24.1864070892334, "global_step": 198977, "epoch": 2397} {"train_loss": -24.407529830932617, "global_step": 198978, "epoch": 2397} {"train_loss": -24.203615188598633, "global_step": 198979, "epoch": 2397} {"train_loss": -24.173038482666016, "global_step": 198980, "epoch": 2397} {"train_loss": -24.29343605041504, "global_step": 198981, "epoch": 2397} {"train_loss": -24.141326904296875, "global_step": 198982, "epoch": 2397} {"train_loss": -24.102832794189453, "global_step": 198983, "epoch": 2397} {"train_loss": -24.435094833374023, "global_step": 198984, "epoch": 2397} {"train_loss": -23.931150436401367, "global_step": 198985, "epoch": 2397} {"train_loss": -24.0559139251709, "global_step": 198986, "epoch": 2397} {"train_loss": -24.10222816467285, "global_step": 198987, "epoch": 2397} {"train_loss": -23.946609497070312, "global_step": 198988, "epoch": 2397} {"train_loss": -24.342586517333984, "global_step": 198989, "epoch": 2397} {"train_loss": -24.02925682067871, "global_step": 198990, "epoch": 2397} {"train_loss": -24.26315689086914, "global_step": 198991, "epoch": 2397} {"train_loss": -24.173959732055664, "global_step": 198992, "epoch": 2397} {"train_loss": -24.483884811401367, "global_step": 198993, "epoch": 2397} {"train_loss": -24.134601593017578, "global_step": 198994, "epoch": 2397} {"train_loss": -23.93626594543457, "global_step": 198995, "epoch": 2397} {"train_loss": -24.519756317138672, "global_step": 198996, "epoch": 2397} {"train_loss": -24.589094161987305, "global_step": 198997, "epoch": 2397} {"train_loss": -24.198474884033203, "global_step": 198998, "epoch": 2397} {"train_loss": -24.138690948486328, "global_step": 198999, "epoch": 2397} {"train_loss": -24.148319244384766, "global_step": 199000, "epoch": 2397} {"train_loss": -24.58951759338379, "global_step": 199001, "epoch": 2397} {"train_loss": -24.329538345336914, "global_step": 199002, "epoch": 2397} {"train_loss": -24.30954360961914, "global_step": 199003, "epoch": 2397} {"train_loss": -24.202985763549805, "global_step": 199004, "epoch": 2397} {"train_loss": -24.43954086303711, "global_step": 199005, "epoch": 2397} {"train_loss": -24.150602340698242, "global_step": 199006, "epoch": 2397} {"train_loss": -24.3243465423584, "global_step": 199007, "epoch": 2397} {"train_loss": -24.13168716430664, "global_step": 199008, "epoch": 2397} {"train_loss": -24.25647735595703, "global_step": 199009, "epoch": 2397} {"train_loss": -24.42132568359375, "global_step": 199010, "epoch": 2397} {"train_loss": -23.79108238220215, "global_step": 199011, "epoch": 2397} {"train_loss": -24.23282241821289, "global_step": 199012, "epoch": 2397} {"train_loss": -23.720617294311523, "global_step": 199013, "epoch": 2397} {"train_loss": -24.23133087158203, "global_step": 199014, "epoch": 2397} {"train_loss": -24.332897186279297, "global_step": 199015, "epoch": 2397} {"train_loss": -24.178813934326172, "global_step": 199016, "epoch": 2397} {"train_loss": -23.471115112304688, "global_step": 199017, "epoch": 2397} {"train_loss": -24.271644592285156, "global_step": 199018, "epoch": 2397} {"train_loss": -24.15251922607422, "global_step": 199019, "epoch": 2397} {"train_loss": -24.021644592285156, "global_step": 199020, "epoch": 2397} {"train_loss": -23.910839080810547, "global_step": 199021, "epoch": 2397} {"train_loss": -24.478778839111328, "global_step": 199022, "epoch": 2397} {"train_loss": -23.887014389038086, "global_step": 199023, "epoch": 2397} {"train_loss": -24.463136672973633, "global_step": 199024, "epoch": 2397} {"train_loss": -24.245691299438477, "global_step": 199025, "epoch": 2397} {"train_loss": -23.583242416381836, "global_step": 199026, "epoch": 2397} {"train_loss": -24.219985961914062, "global_step": 199027, "epoch": 2397} {"train_loss": -24.385766983032227, "global_step": 199028, "epoch": 2397} {"train_loss": -24.301834106445312, "global_step": 199029, "epoch": 2397} {"train_loss": -24.244001388549805, "global_step": 199030, "epoch": 2397} {"train_loss": -24.26325798034668, "global_step": 199031, "epoch": 2397} {"train_loss": -24.02618980407715, "global_step": 199032, "epoch": 2397} {"train_loss": -24.175015575914497, "global_step": 199033, "epoch": 2397, "val_loss": 6560806.5} {"train_loss": -23.691205978393555, "global_step": 199034, "epoch": 2398} {"train_loss": -24.237035751342773, "global_step": 199035, "epoch": 2398} {"train_loss": -24.29764175415039, "global_step": 199036, "epoch": 2398} {"train_loss": -23.680572509765625, "global_step": 199037, "epoch": 2398} {"train_loss": -23.88897132873535, "global_step": 199038, "epoch": 2398} {"train_loss": -23.879947662353516, "global_step": 199039, "epoch": 2398} {"train_loss": -24.809860229492188, "global_step": 199040, "epoch": 2398} {"train_loss": -23.7187442779541, "global_step": 199041, "epoch": 2398} {"train_loss": -24.05638885498047, "global_step": 199042, "epoch": 2398} {"train_loss": -24.024648666381836, "global_step": 199043, "epoch": 2398} {"train_loss": -24.0056209564209, "global_step": 199044, "epoch": 2398} {"train_loss": -23.889535903930664, "global_step": 199045, "epoch": 2398} {"train_loss": -24.084232330322266, "global_step": 199046, "epoch": 2398} {"train_loss": -24.216594696044922, "global_step": 199047, "epoch": 2398} {"train_loss": -24.099225997924805, "global_step": 199048, "epoch": 2398} {"train_loss": -24.270429611206055, "global_step": 199049, "epoch": 2398} {"train_loss": -24.431676864624023, "global_step": 199050, "epoch": 2398} {"train_loss": -23.769027709960938, "global_step": 199051, "epoch": 2398} {"train_loss": -24.4176082611084, "global_step": 199052, "epoch": 2398} {"train_loss": -24.119258880615234, "global_step": 199053, "epoch": 2398} {"train_loss": -24.050939559936523, "global_step": 199054, "epoch": 2398} {"train_loss": -24.335296630859375, "global_step": 199055, "epoch": 2398} {"train_loss": -24.196439743041992, "global_step": 199056, "epoch": 2398} {"train_loss": -24.377487182617188, "global_step": 199057, "epoch": 2398} {"train_loss": -24.67197608947754, "global_step": 199058, "epoch": 2398} {"train_loss": -24.121109008789062, "global_step": 199059, "epoch": 2398} {"train_loss": -24.571325302124023, "global_step": 199060, "epoch": 2398} {"train_loss": -24.42853355407715, "global_step": 199061, "epoch": 2398} {"train_loss": -24.657535552978516, "global_step": 199062, "epoch": 2398} {"train_loss": -24.160545349121094, "global_step": 199063, "epoch": 2398} {"train_loss": -24.12409782409668, "global_step": 199064, "epoch": 2398} {"train_loss": -24.301626205444336, "global_step": 199065, "epoch": 2398} {"train_loss": -24.512046813964844, "global_step": 199066, "epoch": 2398} {"train_loss": -24.341373443603516, "global_step": 199067, "epoch": 2398} {"train_loss": -24.560110092163086, "global_step": 199068, "epoch": 2398} {"train_loss": -24.367069244384766, "global_step": 199069, "epoch": 2398} {"train_loss": -24.224143981933594, "global_step": 199070, "epoch": 2398} {"train_loss": -23.85753631591797, "global_step": 199071, "epoch": 2398} {"train_loss": -24.048551559448242, "global_step": 199072, "epoch": 2398} {"train_loss": -24.513029098510742, "global_step": 199073, "epoch": 2398} {"train_loss": -24.274545669555664, "global_step": 199074, "epoch": 2398} {"train_loss": -24.22285270690918, "global_step": 199075, "epoch": 2398} {"train_loss": -24.138044357299805, "global_step": 199076, "epoch": 2398} {"train_loss": -24.28853988647461, "global_step": 199077, "epoch": 2398} {"train_loss": -23.919221878051758, "global_step": 199078, "epoch": 2398} {"train_loss": -24.403005599975586, "global_step": 199079, "epoch": 2398} {"train_loss": -24.027135848999023, "global_step": 199080, "epoch": 2398} {"train_loss": -24.437612533569336, "global_step": 199081, "epoch": 2398} {"train_loss": -24.469898223876953, "global_step": 199082, "epoch": 2398} {"train_loss": -24.317564010620117, "global_step": 199083, "epoch": 2398} {"train_loss": -24.570903778076172, "global_step": 199084, "epoch": 2398} {"train_loss": -24.135114669799805, "global_step": 199085, "epoch": 2398} {"train_loss": -23.99288558959961, "global_step": 199086, "epoch": 2398} {"train_loss": -24.325450897216797, "global_step": 199087, "epoch": 2398} {"train_loss": -24.10296630859375, "global_step": 199088, "epoch": 2398} {"train_loss": -24.489532470703125, "global_step": 199089, "epoch": 2398} {"train_loss": -24.427040100097656, "global_step": 199090, "epoch": 2398} {"train_loss": -24.182973861694336, "global_step": 199091, "epoch": 2398} {"train_loss": -24.44297218322754, "global_step": 199092, "epoch": 2398} {"train_loss": -24.073057174682617, "global_step": 199093, "epoch": 2398} {"train_loss": -24.287912368774414, "global_step": 199094, "epoch": 2398} {"train_loss": -24.33790397644043, "global_step": 199095, "epoch": 2398} {"train_loss": -24.14004898071289, "global_step": 199096, "epoch": 2398} {"train_loss": -24.25079917907715, "global_step": 199097, "epoch": 2398} {"train_loss": -24.093490600585938, "global_step": 199098, "epoch": 2398} {"train_loss": -24.365459442138672, "global_step": 199099, "epoch": 2398} {"train_loss": -24.671192169189453, "global_step": 199100, "epoch": 2398} {"train_loss": -24.210329055786133, "global_step": 199101, "epoch": 2398} {"train_loss": -23.9869441986084, "global_step": 199102, "epoch": 2398} {"train_loss": -24.099063873291016, "global_step": 199103, "epoch": 2398} {"train_loss": -24.116880416870117, "global_step": 199104, "epoch": 2398} {"train_loss": -24.59752655029297, "global_step": 199105, "epoch": 2398} {"train_loss": -23.910507202148438, "global_step": 199106, "epoch": 2398} {"train_loss": -24.434476852416992, "global_step": 199107, "epoch": 2398} {"train_loss": -24.308256149291992, "global_step": 199108, "epoch": 2398} {"train_loss": -24.07179069519043, "global_step": 199109, "epoch": 2398} {"train_loss": -24.411375045776367, "global_step": 199110, "epoch": 2398} {"train_loss": -23.8018856048584, "global_step": 199111, "epoch": 2398} {"train_loss": -24.32140350341797, "global_step": 199112, "epoch": 2398} {"train_loss": -24.22071075439453, "global_step": 199113, "epoch": 2398} {"train_loss": -24.262012481689453, "global_step": 199114, "epoch": 2398} {"train_loss": -24.289066314697266, "global_step": 199115, "epoch": 2398} {"train_loss": -24.23353098673993, "global_step": 199116, "epoch": 2398, "val_loss": 6460729.0} {"train_loss": -23.480815887451172, "global_step": 199117, "epoch": 2399} {"train_loss": -23.5183048248291, "global_step": 199118, "epoch": 2399} {"train_loss": -23.861658096313477, "global_step": 199119, "epoch": 2399} {"train_loss": -23.62436866760254, "global_step": 199120, "epoch": 2399} {"train_loss": -23.742145538330078, "global_step": 199121, "epoch": 2399} {"train_loss": -23.90122413635254, "global_step": 199122, "epoch": 2399} {"train_loss": -23.701637268066406, "global_step": 199123, "epoch": 2399} {"train_loss": -24.0858097076416, "global_step": 199124, "epoch": 2399} {"train_loss": -23.96401023864746, "global_step": 199125, "epoch": 2399} {"train_loss": -23.85504722595215, "global_step": 199126, "epoch": 2399} {"train_loss": -24.369205474853516, "global_step": 199127, "epoch": 2399} {"train_loss": -24.254880905151367, "global_step": 199128, "epoch": 2399} {"train_loss": -23.943756103515625, "global_step": 199129, "epoch": 2399} {"train_loss": -24.14383316040039, "global_step": 199130, "epoch": 2399} {"train_loss": -24.172555923461914, "global_step": 199131, "epoch": 2399} {"train_loss": -24.148386001586914, "global_step": 199132, "epoch": 2399} {"train_loss": -24.331655502319336, "global_step": 199133, "epoch": 2399} {"train_loss": -24.096542358398438, "global_step": 199134, "epoch": 2399} {"train_loss": -24.127649307250977, "global_step": 199135, "epoch": 2399} {"train_loss": -24.082059860229492, "global_step": 199136, "epoch": 2399} {"train_loss": -24.762989044189453, "global_step": 199137, "epoch": 2399} {"train_loss": -24.392202377319336, "global_step": 199138, "epoch": 2399} {"train_loss": -23.66639518737793, "global_step": 199139, "epoch": 2399} {"train_loss": -24.224714279174805, "global_step": 199140, "epoch": 2399} {"train_loss": -24.07707977294922, "global_step": 199141, "epoch": 2399} {"train_loss": -24.2706356048584, "global_step": 199142, "epoch": 2399} {"train_loss": -24.25129508972168, "global_step": 199143, "epoch": 2399} {"train_loss": -24.106924057006836, "global_step": 199144, "epoch": 2399} {"train_loss": -24.319116592407227, "global_step": 199145, "epoch": 2399} {"train_loss": -24.1922550201416, "global_step": 199146, "epoch": 2399} {"train_loss": -24.2135066986084, "global_step": 199147, "epoch": 2399} {"train_loss": -24.314117431640625, "global_step": 199148, "epoch": 2399} {"train_loss": -24.19837760925293, "global_step": 199149, "epoch": 2399} {"train_loss": -24.526445388793945, "global_step": 199150, "epoch": 2399} {"train_loss": -24.219446182250977, "global_step": 199151, "epoch": 2399} {"train_loss": -23.9665470123291, "global_step": 199152, "epoch": 2399} {"train_loss": -24.62178611755371, "global_step": 199153, "epoch": 2399} {"train_loss": -23.725324630737305, "global_step": 199154, "epoch": 2399} {"train_loss": -23.965356826782227, "global_step": 199155, "epoch": 2399} {"train_loss": -24.173049926757812, "global_step": 199156, "epoch": 2399} {"train_loss": -24.109495162963867, "global_step": 199157, "epoch": 2399} {"train_loss": -24.369728088378906, "global_step": 199158, "epoch": 2399} {"train_loss": -24.42095947265625, "global_step": 199159, "epoch": 2399} {"train_loss": -24.476789474487305, "global_step": 199160, "epoch": 2399} {"train_loss": -24.39409065246582, "global_step": 199161, "epoch": 2399} {"train_loss": -24.389902114868164, "global_step": 199162, "epoch": 2399} {"train_loss": -24.297677993774414, "global_step": 199163, "epoch": 2399} {"train_loss": -24.201705932617188, "global_step": 199164, "epoch": 2399} {"train_loss": -24.163671493530273, "global_step": 199165, "epoch": 2399} {"train_loss": -23.768423080444336, "global_step": 199166, "epoch": 2399} {"train_loss": -24.0728816986084, "global_step": 199167, "epoch": 2399} {"train_loss": -24.600629806518555, "global_step": 199168, "epoch": 2399} {"train_loss": -24.536680221557617, "global_step": 199169, "epoch": 2399} {"train_loss": -23.936246871948242, "global_step": 199170, "epoch": 2399} {"train_loss": -23.696378707885742, "global_step": 199171, "epoch": 2399} {"train_loss": -24.163246154785156, "global_step": 199172, "epoch": 2399} {"train_loss": -24.416168212890625, "global_step": 199173, "epoch": 2399} {"train_loss": -23.94424819946289, "global_step": 199174, "epoch": 2399} {"train_loss": -23.78197479248047, "global_step": 199175, "epoch": 2399} {"train_loss": -24.12523651123047, "global_step": 199176, "epoch": 2399} {"train_loss": -24.374311447143555, "global_step": 199177, "epoch": 2399} {"train_loss": -24.21888542175293, "global_step": 199178, "epoch": 2399} {"train_loss": -24.212825775146484, "global_step": 199179, "epoch": 2399} {"train_loss": -24.07758331298828, "global_step": 199180, "epoch": 2399} {"train_loss": -24.41290855407715, "global_step": 199181, "epoch": 2399} {"train_loss": -24.048030853271484, "global_step": 199182, "epoch": 2399} {"train_loss": -24.547605514526367, "global_step": 199183, "epoch": 2399} {"train_loss": -23.825490951538086, "global_step": 199184, "epoch": 2399} {"train_loss": -24.277143478393555, "global_step": 199185, "epoch": 2399} {"train_loss": -24.13172721862793, "global_step": 199186, "epoch": 2399} {"train_loss": -24.166492462158203, "global_step": 199187, "epoch": 2399} {"train_loss": -23.89940643310547, "global_step": 199188, "epoch": 2399} {"train_loss": -24.394506454467773, "global_step": 199189, "epoch": 2399} {"train_loss": -24.193195343017578, "global_step": 199190, "epoch": 2399} {"train_loss": -24.696422576904297, "global_step": 199191, "epoch": 2399} {"train_loss": -23.93216896057129, "global_step": 199192, "epoch": 2399} {"train_loss": -24.35687255859375, "global_step": 199193, "epoch": 2399} {"train_loss": -24.047998428344727, "global_step": 199194, "epoch": 2399} {"train_loss": -24.324302673339844, "global_step": 199195, "epoch": 2399} {"train_loss": -24.330514907836914, "global_step": 199196, "epoch": 2399} {"train_loss": -24.11170768737793, "global_step": 199197, "epoch": 2399} {"train_loss": -24.23788070678711, "global_step": 199198, "epoch": 2399} {"train_loss": -24.175050758453736, "global_step": 199199, "epoch": 2399, "val_loss": 6541954.5} {"train_loss": -23.650854110717773, "global_step": 199200, "epoch": 2400} {"train_loss": -24.11868667602539, "global_step": 199201, "epoch": 2400} {"train_loss": -23.927270889282227, "global_step": 199202, "epoch": 2400} {"train_loss": -23.534528732299805, "global_step": 199203, "epoch": 2400} {"train_loss": -24.21059226989746, "global_step": 199204, "epoch": 2400} {"train_loss": -24.032503128051758, "global_step": 199205, "epoch": 2400} {"train_loss": -23.594043731689453, "global_step": 199206, "epoch": 2400} {"train_loss": -24.239391326904297, "global_step": 199207, "epoch": 2400} {"train_loss": -24.148366928100586, "global_step": 199208, "epoch": 2400} {"train_loss": -24.151411056518555, "global_step": 199209, "epoch": 2400} {"train_loss": -24.443679809570312, "global_step": 199210, "epoch": 2400} {"train_loss": -23.421606063842773, "global_step": 199211, "epoch": 2400} {"train_loss": -24.04471206665039, "global_step": 199212, "epoch": 2400} {"train_loss": -24.00697898864746, "global_step": 199213, "epoch": 2400} {"train_loss": -24.056100845336914, "global_step": 199214, "epoch": 2400} {"train_loss": -24.188711166381836, "global_step": 199215, "epoch": 2400} {"train_loss": -23.840200424194336, "global_step": 199216, "epoch": 2400} {"train_loss": -24.222900390625, "global_step": 199217, "epoch": 2400} {"train_loss": -23.90750503540039, "global_step": 199218, "epoch": 2400} {"train_loss": -24.151182174682617, "global_step": 199219, "epoch": 2400} {"train_loss": -23.812246322631836, "global_step": 199220, "epoch": 2400} {"train_loss": -24.061203002929688, "global_step": 199221, "epoch": 2400} {"train_loss": -23.84052848815918, "global_step": 199222, "epoch": 2400} {"train_loss": -24.312101364135742, "global_step": 199223, "epoch": 2400} {"train_loss": -24.114192962646484, "global_step": 199224, "epoch": 2400} {"train_loss": -24.07941246032715, "global_step": 199225, "epoch": 2400} {"train_loss": -24.106786727905273, "global_step": 199226, "epoch": 2400} {"train_loss": -24.13149070739746, "global_step": 199227, "epoch": 2400} {"train_loss": -24.18812370300293, "global_step": 199228, "epoch": 2400} {"train_loss": -24.069974899291992, "global_step": 199229, "epoch": 2400} {"train_loss": -23.9132137298584, "global_step": 199230, "epoch": 2400} {"train_loss": -24.098947525024414, "global_step": 199231, "epoch": 2400} {"train_loss": -24.422399520874023, "global_step": 199232, "epoch": 2400} {"train_loss": -24.22847557067871, "global_step": 199233, "epoch": 2400} {"train_loss": -24.10133171081543, "global_step": 199234, "epoch": 2400} {"train_loss": -24.155597686767578, "global_step": 199235, "epoch": 2400} {"train_loss": -24.73722267150879, "global_step": 199236, "epoch": 2400} {"train_loss": -24.14680290222168, "global_step": 199237, "epoch": 2400} {"train_loss": -24.05979347229004, "global_step": 199238, "epoch": 2400} {"train_loss": -24.36592674255371, "global_step": 199239, "epoch": 2400} {"train_loss": -24.06945037841797, "global_step": 199240, "epoch": 2400} {"train_loss": -24.255908966064453, "global_step": 199241, "epoch": 2400} {"train_loss": -24.49799919128418, "global_step": 199242, "epoch": 2400} {"train_loss": -24.398101806640625, "global_step": 199243, "epoch": 2400} {"train_loss": -24.118772506713867, "global_step": 199244, "epoch": 2400} {"train_loss": -24.575565338134766, "global_step": 199245, "epoch": 2400} {"train_loss": -24.254878997802734, "global_step": 199246, "epoch": 2400} {"train_loss": -23.724668502807617, "global_step": 199247, "epoch": 2400} {"train_loss": -24.196645736694336, "global_step": 199248, "epoch": 2400} {"train_loss": -24.148290634155273, "global_step": 199249, "epoch": 2400} {"train_loss": -23.83738136291504, "global_step": 199250, "epoch": 2400} {"train_loss": -23.879106521606445, "global_step": 199251, "epoch": 2400} {"train_loss": -24.443880081176758, "global_step": 199252, "epoch": 2400} {"train_loss": -24.322999954223633, "global_step": 199253, "epoch": 2400} {"train_loss": -24.628393173217773, "global_step": 199254, "epoch": 2400} {"train_loss": -24.464405059814453, "global_step": 199255, "epoch": 2400} {"train_loss": -24.148969650268555, "global_step": 199256, "epoch": 2400} {"train_loss": -24.480199813842773, "global_step": 199257, "epoch": 2400} {"train_loss": -23.953338623046875, "global_step": 199258, "epoch": 2400} {"train_loss": -24.140979766845703, "global_step": 199259, "epoch": 2400} {"train_loss": -24.196386337280273, "global_step": 199260, "epoch": 2400} {"train_loss": -24.599891662597656, "global_step": 199261, "epoch": 2400} {"train_loss": -24.06757164001465, "global_step": 199262, "epoch": 2400} {"train_loss": -24.180076599121094, "global_step": 199263, "epoch": 2400} {"train_loss": -24.278884887695312, "global_step": 199264, "epoch": 2400} {"train_loss": -24.428768157958984, "global_step": 199265, "epoch": 2400} {"train_loss": -24.241636276245117, "global_step": 199266, "epoch": 2400} {"train_loss": -24.33037567138672, "global_step": 199267, "epoch": 2400} {"train_loss": -24.469221115112305, "global_step": 199268, "epoch": 2400} {"train_loss": -24.1829891204834, "global_step": 199269, "epoch": 2400} {"train_loss": -24.503437042236328, "global_step": 199270, "epoch": 2400} {"train_loss": -24.249807357788086, "global_step": 199271, "epoch": 2400} {"train_loss": -23.914243698120117, "global_step": 199272, "epoch": 2400} {"train_loss": -24.918785095214844, "global_step": 199273, "epoch": 2400} {"train_loss": -24.322959899902344, "global_step": 199274, "epoch": 2400} {"train_loss": -24.270376205444336, "global_step": 199275, "epoch": 2400} {"train_loss": -24.194412231445312, "global_step": 199276, "epoch": 2400} {"train_loss": -24.330913543701172, "global_step": 199277, "epoch": 2400} {"train_loss": -24.40203285217285, "global_step": 199278, "epoch": 2400} {"train_loss": -24.006818771362305, "global_step": 199279, "epoch": 2400} {"train_loss": -23.913639068603516, "global_step": 199280, "epoch": 2400} {"train_loss": -24.027938842773438, "global_step": 199281, "epoch": 2400} {"train_loss": -24.197193467473408, "global_step": 199282, "epoch": 2400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6674143.0} {"train_loss": -24.0828857421875, "global_step": 199283, "epoch": 2401} {"train_loss": -23.756925582885742, "global_step": 199284, "epoch": 2401} {"train_loss": -23.93269157409668, "global_step": 199285, "epoch": 2401} {"train_loss": -23.862024307250977, "global_step": 199286, "epoch": 2401} {"train_loss": -24.27564811706543, "global_step": 199287, "epoch": 2401} {"train_loss": -23.715795516967773, "global_step": 199288, "epoch": 2401} {"train_loss": -23.374746322631836, "global_step": 199289, "epoch": 2401} {"train_loss": -23.948413848876953, "global_step": 199290, "epoch": 2401} {"train_loss": -23.964994430541992, "global_step": 199291, "epoch": 2401} {"train_loss": -24.26564598083496, "global_step": 199292, "epoch": 2401} {"train_loss": -23.89565086364746, "global_step": 199293, "epoch": 2401} {"train_loss": -23.902008056640625, "global_step": 199294, "epoch": 2401} {"train_loss": -24.03733253479004, "global_step": 199295, "epoch": 2401} {"train_loss": -24.33968162536621, "global_step": 199296, "epoch": 2401} {"train_loss": -23.780445098876953, "global_step": 199297, "epoch": 2401} {"train_loss": -24.129026412963867, "global_step": 199298, "epoch": 2401} {"train_loss": -23.79876136779785, "global_step": 199299, "epoch": 2401} {"train_loss": -24.08067512512207, "global_step": 199300, "epoch": 2401} {"train_loss": -24.17696762084961, "global_step": 199301, "epoch": 2401} {"train_loss": -23.85940933227539, "global_step": 199302, "epoch": 2401} {"train_loss": -24.09281349182129, "global_step": 199303, "epoch": 2401} {"train_loss": -24.15217399597168, "global_step": 199304, "epoch": 2401} {"train_loss": -24.30243682861328, "global_step": 199305, "epoch": 2401} {"train_loss": -24.062461853027344, "global_step": 199306, "epoch": 2401} {"train_loss": -24.22791862487793, "global_step": 199307, "epoch": 2401} {"train_loss": -23.92601776123047, "global_step": 199308, "epoch": 2401} {"train_loss": -24.276098251342773, "global_step": 199309, "epoch": 2401} {"train_loss": -24.421762466430664, "global_step": 199310, "epoch": 2401} {"train_loss": -24.237272262573242, "global_step": 199311, "epoch": 2401} {"train_loss": -24.262929916381836, "global_step": 199312, "epoch": 2401} {"train_loss": -24.42222785949707, "global_step": 199313, "epoch": 2401} {"train_loss": -24.118112564086914, "global_step": 199314, "epoch": 2401} {"train_loss": -24.21004295349121, "global_step": 199315, "epoch": 2401} {"train_loss": -24.392471313476562, "global_step": 199316, "epoch": 2401} {"train_loss": -24.201095581054688, "global_step": 199317, "epoch": 2401} {"train_loss": -24.439924240112305, "global_step": 199318, "epoch": 2401} {"train_loss": -24.222633361816406, "global_step": 199319, "epoch": 2401} {"train_loss": -24.022796630859375, "global_step": 199320, "epoch": 2401} {"train_loss": -24.292133331298828, "global_step": 199321, "epoch": 2401} {"train_loss": -24.462766647338867, "global_step": 199322, "epoch": 2401} {"train_loss": -24.140697479248047, "global_step": 199323, "epoch": 2401} {"train_loss": -24.258255004882812, "global_step": 199324, "epoch": 2401} {"train_loss": -24.105810165405273, "global_step": 199325, "epoch": 2401} {"train_loss": -24.406593322753906, "global_step": 199326, "epoch": 2401} {"train_loss": -23.967012405395508, "global_step": 199327, "epoch": 2401} {"train_loss": -24.097841262817383, "global_step": 199328, "epoch": 2401} {"train_loss": -24.252296447753906, "global_step": 199329, "epoch": 2401} {"train_loss": -24.35569190979004, "global_step": 199330, "epoch": 2401} {"train_loss": -23.916645050048828, "global_step": 199331, "epoch": 2401} {"train_loss": -24.139514923095703, "global_step": 199332, "epoch": 2401} {"train_loss": -24.456010818481445, "global_step": 199333, "epoch": 2401} {"train_loss": -24.459083557128906, "global_step": 199334, "epoch": 2401} {"train_loss": -24.278112411499023, "global_step": 199335, "epoch": 2401} {"train_loss": -24.666257858276367, "global_step": 199336, "epoch": 2401} {"train_loss": -24.39406967163086, "global_step": 199337, "epoch": 2401} {"train_loss": -24.763776779174805, "global_step": 199338, "epoch": 2401} {"train_loss": -24.542362213134766, "global_step": 199339, "epoch": 2401} {"train_loss": -24.1870174407959, "global_step": 199340, "epoch": 2401} {"train_loss": -24.169296264648438, "global_step": 199341, "epoch": 2401} {"train_loss": -24.770177841186523, "global_step": 199342, "epoch": 2401} {"train_loss": -24.015958786010742, "global_step": 199343, "epoch": 2401} {"train_loss": -24.06385040283203, "global_step": 199344, "epoch": 2401} {"train_loss": -24.2171630859375, "global_step": 199345, "epoch": 2401} {"train_loss": -24.124576568603516, "global_step": 199346, "epoch": 2401} {"train_loss": -24.049283981323242, "global_step": 199347, "epoch": 2401} {"train_loss": -24.51987075805664, "global_step": 199348, "epoch": 2401} {"train_loss": -24.425142288208008, "global_step": 199349, "epoch": 2401} {"train_loss": -23.964384078979492, "global_step": 199350, "epoch": 2401} {"train_loss": -24.28126335144043, "global_step": 199351, "epoch": 2401} {"train_loss": -24.265716552734375, "global_step": 199352, "epoch": 2401} {"train_loss": -24.14345359802246, "global_step": 199353, "epoch": 2401} {"train_loss": -24.39025115966797, "global_step": 199354, "epoch": 2401} {"train_loss": -24.256591796875, "global_step": 199355, "epoch": 2401} {"train_loss": -24.15331268310547, "global_step": 199356, "epoch": 2401} {"train_loss": -24.389461517333984, "global_step": 199357, "epoch": 2401} {"train_loss": -24.197708129882812, "global_step": 199358, "epoch": 2401} {"train_loss": -24.470203399658203, "global_step": 199359, "epoch": 2401} {"train_loss": -24.31681251525879, "global_step": 199360, "epoch": 2401} {"train_loss": -24.319005966186523, "global_step": 199361, "epoch": 2401} {"train_loss": -24.298864364624023, "global_step": 199362, "epoch": 2401} {"train_loss": -24.276060104370117, "global_step": 199363, "epoch": 2401} {"train_loss": -24.1901798248291, "global_step": 199364, "epoch": 2401} {"train_loss": -24.201313915022883, "global_step": 199365, "epoch": 2401, "val_loss": 6510514.5} {"train_loss": -24.01970863342285, "global_step": 199366, "epoch": 2402} {"train_loss": -23.77396583557129, "global_step": 199367, "epoch": 2402} {"train_loss": -24.057575225830078, "global_step": 199368, "epoch": 2402} {"train_loss": -24.142169952392578, "global_step": 199369, "epoch": 2402} {"train_loss": -23.779356002807617, "global_step": 199370, "epoch": 2402} {"train_loss": -23.92855453491211, "global_step": 199371, "epoch": 2402} {"train_loss": -23.824092864990234, "global_step": 199372, "epoch": 2402} {"train_loss": -23.92389678955078, "global_step": 199373, "epoch": 2402} {"train_loss": -23.88570213317871, "global_step": 199374, "epoch": 2402} {"train_loss": -24.157907485961914, "global_step": 199375, "epoch": 2402} {"train_loss": -23.809568405151367, "global_step": 199376, "epoch": 2402} {"train_loss": -23.7504825592041, "global_step": 199377, "epoch": 2402} {"train_loss": -24.033695220947266, "global_step": 199378, "epoch": 2402} {"train_loss": -24.24734878540039, "global_step": 199379, "epoch": 2402} {"train_loss": -24.36419105529785, "global_step": 199380, "epoch": 2402} {"train_loss": -23.84333610534668, "global_step": 199381, "epoch": 2402} {"train_loss": -24.160306930541992, "global_step": 199382, "epoch": 2402} {"train_loss": -24.556270599365234, "global_step": 199383, "epoch": 2402} {"train_loss": -23.982439041137695, "global_step": 199384, "epoch": 2402} {"train_loss": -24.120487213134766, "global_step": 199385, "epoch": 2402} {"train_loss": -24.153440475463867, "global_step": 199386, "epoch": 2402} {"train_loss": -24.17032814025879, "global_step": 199387, "epoch": 2402} {"train_loss": -24.21185302734375, "global_step": 199388, "epoch": 2402} {"train_loss": -23.829893112182617, "global_step": 199389, "epoch": 2402} {"train_loss": -24.35566520690918, "global_step": 199390, "epoch": 2402} {"train_loss": -24.33548927307129, "global_step": 199391, "epoch": 2402} {"train_loss": -24.31096649169922, "global_step": 199392, "epoch": 2402} {"train_loss": -24.192630767822266, "global_step": 199393, "epoch": 2402} {"train_loss": -24.116113662719727, "global_step": 199394, "epoch": 2402} {"train_loss": -24.183359146118164, "global_step": 199395, "epoch": 2402} {"train_loss": -24.187294006347656, "global_step": 199396, "epoch": 2402} {"train_loss": -24.410465240478516, "global_step": 199397, "epoch": 2402} {"train_loss": -24.360328674316406, "global_step": 199398, "epoch": 2402} {"train_loss": -24.142316818237305, "global_step": 199399, "epoch": 2402} {"train_loss": -24.22478675842285, "global_step": 199400, "epoch": 2402} {"train_loss": -24.224733352661133, "global_step": 199401, "epoch": 2402} {"train_loss": -24.11738395690918, "global_step": 199402, "epoch": 2402} {"train_loss": -23.732568740844727, "global_step": 199403, "epoch": 2402} {"train_loss": -24.287643432617188, "global_step": 199404, "epoch": 2402} {"train_loss": -24.346616744995117, "global_step": 199405, "epoch": 2402} {"train_loss": -24.45215606689453, "global_step": 199406, "epoch": 2402} {"train_loss": -24.403554916381836, "global_step": 199407, "epoch": 2402} {"train_loss": -24.254419326782227, "global_step": 199408, "epoch": 2402} {"train_loss": -24.1029052734375, "global_step": 199409, "epoch": 2402} {"train_loss": -24.23801612854004, "global_step": 199410, "epoch": 2402} {"train_loss": -23.90146255493164, "global_step": 199411, "epoch": 2402} {"train_loss": -24.39852523803711, "global_step": 199412, "epoch": 2402} {"train_loss": -24.203744888305664, "global_step": 199413, "epoch": 2402} {"train_loss": -24.31563377380371, "global_step": 199414, "epoch": 2402} {"train_loss": -24.350528717041016, "global_step": 199415, "epoch": 2402} {"train_loss": -24.158864974975586, "global_step": 199416, "epoch": 2402} {"train_loss": -24.30586051940918, "global_step": 199417, "epoch": 2402} {"train_loss": -24.53182601928711, "global_step": 199418, "epoch": 2402} {"train_loss": -24.59292221069336, "global_step": 199419, "epoch": 2402} {"train_loss": -24.381811141967773, "global_step": 199420, "epoch": 2402} {"train_loss": -24.492712020874023, "global_step": 199421, "epoch": 2402} {"train_loss": -24.5123233795166, "global_step": 199422, "epoch": 2402} {"train_loss": -24.28599739074707, "global_step": 199423, "epoch": 2402} {"train_loss": -24.520980834960938, "global_step": 199424, "epoch": 2402} {"train_loss": -24.631052017211914, "global_step": 199425, "epoch": 2402} {"train_loss": -24.506128311157227, "global_step": 199426, "epoch": 2402} {"train_loss": -24.26849937438965, "global_step": 199427, "epoch": 2402} {"train_loss": -24.268442153930664, "global_step": 199428, "epoch": 2402} {"train_loss": -24.02889633178711, "global_step": 199429, "epoch": 2402} {"train_loss": -24.589008331298828, "global_step": 199430, "epoch": 2402} {"train_loss": -24.462411880493164, "global_step": 199431, "epoch": 2402} {"train_loss": -24.454702377319336, "global_step": 199432, "epoch": 2402} {"train_loss": -24.043190002441406, "global_step": 199433, "epoch": 2402} {"train_loss": -24.65997886657715, "global_step": 199434, "epoch": 2402} {"train_loss": -24.17762565612793, "global_step": 199435, "epoch": 2402} {"train_loss": -24.37320327758789, "global_step": 199436, "epoch": 2402} {"train_loss": -24.07672691345215, "global_step": 199437, "epoch": 2402} {"train_loss": -24.4730167388916, "global_step": 199438, "epoch": 2402} {"train_loss": -24.487594604492188, "global_step": 199439, "epoch": 2402} {"train_loss": -24.48445701599121, "global_step": 199440, "epoch": 2402} {"train_loss": -24.365888595581055, "global_step": 199441, "epoch": 2402} {"train_loss": -23.483081817626953, "global_step": 199442, "epoch": 2402} {"train_loss": -24.44672966003418, "global_step": 199443, "epoch": 2402} {"train_loss": -24.07478904724121, "global_step": 199444, "epoch": 2402} {"train_loss": -24.255447387695312, "global_step": 199445, "epoch": 2402} {"train_loss": -24.232574462890625, "global_step": 199446, "epoch": 2402} {"train_loss": -24.061737060546875, "global_step": 199447, "epoch": 2402} {"train_loss": -24.21461698233363, "global_step": 199448, "epoch": 2402, "val_loss": 6519962.0} {"train_loss": -22.896774291992188, "global_step": 199449, "epoch": 2403} {"train_loss": -23.671947479248047, "global_step": 199450, "epoch": 2403} {"train_loss": -23.016204833984375, "global_step": 199451, "epoch": 2403} {"train_loss": -23.95058250427246, "global_step": 199452, "epoch": 2403} {"train_loss": -23.34759521484375, "global_step": 199453, "epoch": 2403} {"train_loss": -23.4709415435791, "global_step": 199454, "epoch": 2403} {"train_loss": -23.623022079467773, "global_step": 199455, "epoch": 2403} {"train_loss": -23.557113647460938, "global_step": 199456, "epoch": 2403} {"train_loss": -23.572851181030273, "global_step": 199457, "epoch": 2403} {"train_loss": -24.095186233520508, "global_step": 199458, "epoch": 2403} {"train_loss": -23.80180549621582, "global_step": 199459, "epoch": 2403} {"train_loss": -23.86775016784668, "global_step": 199460, "epoch": 2403} {"train_loss": -24.240079879760742, "global_step": 199461, "epoch": 2403} {"train_loss": -23.821311950683594, "global_step": 199462, "epoch": 2403} {"train_loss": -23.86695098876953, "global_step": 199463, "epoch": 2403} {"train_loss": -23.982288360595703, "global_step": 199464, "epoch": 2403} {"train_loss": -24.087203979492188, "global_step": 199465, "epoch": 2403} {"train_loss": -23.681116104125977, "global_step": 199466, "epoch": 2403} {"train_loss": -23.624189376831055, "global_step": 199467, "epoch": 2403} {"train_loss": -24.02773094177246, "global_step": 199468, "epoch": 2403} {"train_loss": -23.969404220581055, "global_step": 199469, "epoch": 2403} {"train_loss": -24.026212692260742, "global_step": 199470, "epoch": 2403} {"train_loss": -24.013212203979492, "global_step": 199471, "epoch": 2403} {"train_loss": -24.006664276123047, "global_step": 199472, "epoch": 2403} {"train_loss": -24.058393478393555, "global_step": 199473, "epoch": 2403} {"train_loss": -24.25640869140625, "global_step": 199474, "epoch": 2403} {"train_loss": -24.259675979614258, "global_step": 199475, "epoch": 2403} {"train_loss": -24.16952133178711, "global_step": 199476, "epoch": 2403} {"train_loss": -24.194629669189453, "global_step": 199477, "epoch": 2403} {"train_loss": -24.010221481323242, "global_step": 199478, "epoch": 2403} {"train_loss": -24.37948226928711, "global_step": 199479, "epoch": 2403} {"train_loss": -24.123510360717773, "global_step": 199480, "epoch": 2403} {"train_loss": -24.40675926208496, "global_step": 199481, "epoch": 2403} {"train_loss": -24.260526657104492, "global_step": 199482, "epoch": 2403} {"train_loss": -23.855066299438477, "global_step": 199483, "epoch": 2403} {"train_loss": -24.283538818359375, "global_step": 199484, "epoch": 2403} {"train_loss": -24.36775016784668, "global_step": 199485, "epoch": 2403} {"train_loss": -24.106752395629883, "global_step": 199486, "epoch": 2403} {"train_loss": -23.978994369506836, "global_step": 199487, "epoch": 2403} {"train_loss": -24.017318725585938, "global_step": 199488, "epoch": 2403} {"train_loss": -24.36543083190918, "global_step": 199489, "epoch": 2403} {"train_loss": -24.026578903198242, "global_step": 199490, "epoch": 2403} {"train_loss": -24.290023803710938, "global_step": 199491, "epoch": 2403} {"train_loss": -23.756664276123047, "global_step": 199492, "epoch": 2403} {"train_loss": -23.89338493347168, "global_step": 199493, "epoch": 2403} {"train_loss": -23.934036254882812, "global_step": 199494, "epoch": 2403} {"train_loss": -23.73807144165039, "global_step": 199495, "epoch": 2403} {"train_loss": -23.942676544189453, "global_step": 199496, "epoch": 2403} {"train_loss": -23.58260154724121, "global_step": 199497, "epoch": 2403} {"train_loss": -24.39141845703125, "global_step": 199498, "epoch": 2403} {"train_loss": -24.143699645996094, "global_step": 199499, "epoch": 2403} {"train_loss": -24.334684371948242, "global_step": 199500, "epoch": 2403} {"train_loss": -24.173131942749023, "global_step": 199501, "epoch": 2403} {"train_loss": -24.1289119720459, "global_step": 199502, "epoch": 2403} {"train_loss": -24.118499755859375, "global_step": 199503, "epoch": 2403} {"train_loss": -24.630489349365234, "global_step": 199504, "epoch": 2403} {"train_loss": -24.12726402282715, "global_step": 199505, "epoch": 2403} {"train_loss": -24.355710983276367, "global_step": 199506, "epoch": 2403} {"train_loss": -24.395837783813477, "global_step": 199507, "epoch": 2403} {"train_loss": -24.354787826538086, "global_step": 199508, "epoch": 2403} {"train_loss": -24.00656509399414, "global_step": 199509, "epoch": 2403} {"train_loss": -24.52894401550293, "global_step": 199510, "epoch": 2403} {"train_loss": -24.29957389831543, "global_step": 199511, "epoch": 2403} {"train_loss": -24.031166076660156, "global_step": 199512, "epoch": 2403} {"train_loss": -23.836009979248047, "global_step": 199513, "epoch": 2403} {"train_loss": -23.956655502319336, "global_step": 199514, "epoch": 2403} {"train_loss": -23.925119400024414, "global_step": 199515, "epoch": 2403} {"train_loss": -24.43332290649414, "global_step": 199516, "epoch": 2403} {"train_loss": -24.173124313354492, "global_step": 199517, "epoch": 2403} {"train_loss": -23.9647159576416, "global_step": 199518, "epoch": 2403} {"train_loss": -24.067163467407227, "global_step": 199519, "epoch": 2403} {"train_loss": -24.188308715820312, "global_step": 199520, "epoch": 2403} {"train_loss": -23.900314331054688, "global_step": 199521, "epoch": 2403} {"train_loss": -24.316009521484375, "global_step": 199522, "epoch": 2403} {"train_loss": -24.1818790435791, "global_step": 199523, "epoch": 2403} {"train_loss": -24.23309326171875, "global_step": 199524, "epoch": 2403} {"train_loss": -24.420175552368164, "global_step": 199525, "epoch": 2403} {"train_loss": -24.190311431884766, "global_step": 199526, "epoch": 2403} {"train_loss": -24.258344650268555, "global_step": 199527, "epoch": 2403} {"train_loss": -24.224393844604492, "global_step": 199528, "epoch": 2403} {"train_loss": -24.4282283782959, "global_step": 199529, "epoch": 2403} {"train_loss": -24.193532943725586, "global_step": 199530, "epoch": 2403} {"train_loss": -24.05206321808229, "global_step": 199531, "epoch": 2403, "val_loss": 6545814.0} {"train_loss": -23.975709915161133, "global_step": 199532, "epoch": 2404} {"train_loss": -23.920774459838867, "global_step": 199533, "epoch": 2404} {"train_loss": -24.06690788269043, "global_step": 199534, "epoch": 2404} {"train_loss": -23.470212936401367, "global_step": 199535, "epoch": 2404} {"train_loss": -24.18867301940918, "global_step": 199536, "epoch": 2404} {"train_loss": -23.977174758911133, "global_step": 199537, "epoch": 2404} {"train_loss": -23.972715377807617, "global_step": 199538, "epoch": 2404} {"train_loss": -23.806730270385742, "global_step": 199539, "epoch": 2404} {"train_loss": -23.674985885620117, "global_step": 199540, "epoch": 2404} {"train_loss": -23.895469665527344, "global_step": 199541, "epoch": 2404} {"train_loss": -23.868701934814453, "global_step": 199542, "epoch": 2404} {"train_loss": -24.161283493041992, "global_step": 199543, "epoch": 2404} {"train_loss": -24.330787658691406, "global_step": 199544, "epoch": 2404} {"train_loss": -23.964582443237305, "global_step": 199545, "epoch": 2404} {"train_loss": -24.288217544555664, "global_step": 199546, "epoch": 2404} {"train_loss": -24.3419189453125, "global_step": 199547, "epoch": 2404} {"train_loss": -23.862796783447266, "global_step": 199548, "epoch": 2404} {"train_loss": -24.25590705871582, "global_step": 199549, "epoch": 2404} {"train_loss": -24.077848434448242, "global_step": 199550, "epoch": 2404} {"train_loss": -24.106586456298828, "global_step": 199551, "epoch": 2404} {"train_loss": -24.018840789794922, "global_step": 199552, "epoch": 2404} {"train_loss": -24.290185928344727, "global_step": 199553, "epoch": 2404} {"train_loss": -24.36893653869629, "global_step": 199554, "epoch": 2404} {"train_loss": -24.081348419189453, "global_step": 199555, "epoch": 2404} {"train_loss": -24.378713607788086, "global_step": 199556, "epoch": 2404} {"train_loss": -24.2845401763916, "global_step": 199557, "epoch": 2404} {"train_loss": -24.352859497070312, "global_step": 199558, "epoch": 2404} {"train_loss": -23.72223472595215, "global_step": 199559, "epoch": 2404} {"train_loss": -23.83796501159668, "global_step": 199560, "epoch": 2404} {"train_loss": -24.197586059570312, "global_step": 199561, "epoch": 2404} {"train_loss": -24.714296340942383, "global_step": 199562, "epoch": 2404} {"train_loss": -24.409852981567383, "global_step": 199563, "epoch": 2404} {"train_loss": -24.302610397338867, "global_step": 199564, "epoch": 2404} {"train_loss": -24.470046997070312, "global_step": 199565, "epoch": 2404} {"train_loss": -24.16998291015625, "global_step": 199566, "epoch": 2404} {"train_loss": -24.31947898864746, "global_step": 199567, "epoch": 2404} {"train_loss": -24.374866485595703, "global_step": 199568, "epoch": 2404} {"train_loss": -24.175676345825195, "global_step": 199569, "epoch": 2404} {"train_loss": -24.58562660217285, "global_step": 199570, "epoch": 2404} {"train_loss": -24.227563858032227, "global_step": 199571, "epoch": 2404} {"train_loss": -24.194110870361328, "global_step": 199572, "epoch": 2404} {"train_loss": -24.251182556152344, "global_step": 199573, "epoch": 2404} {"train_loss": -24.19190788269043, "global_step": 199574, "epoch": 2404} {"train_loss": -24.42081069946289, "global_step": 199575, "epoch": 2404} {"train_loss": -24.259891510009766, "global_step": 199576, "epoch": 2404} {"train_loss": -24.2471923828125, "global_step": 199577, "epoch": 2404} {"train_loss": -23.890199661254883, "global_step": 199578, "epoch": 2404} {"train_loss": -24.195999145507812, "global_step": 199579, "epoch": 2404} {"train_loss": -23.870594024658203, "global_step": 199580, "epoch": 2404} {"train_loss": -24.25614356994629, "global_step": 199581, "epoch": 2404} {"train_loss": -24.05203628540039, "global_step": 199582, "epoch": 2404} {"train_loss": -23.878223419189453, "global_step": 199583, "epoch": 2404} {"train_loss": -24.2017879486084, "global_step": 199584, "epoch": 2404} {"train_loss": -24.139551162719727, "global_step": 199585, "epoch": 2404} {"train_loss": -24.22963523864746, "global_step": 199586, "epoch": 2404} {"train_loss": -24.244590759277344, "global_step": 199587, "epoch": 2404} {"train_loss": -24.226057052612305, "global_step": 199588, "epoch": 2404} {"train_loss": -24.194957733154297, "global_step": 199589, "epoch": 2404} {"train_loss": -24.64326286315918, "global_step": 199590, "epoch": 2404} {"train_loss": -24.635786056518555, "global_step": 199591, "epoch": 2404} {"train_loss": -24.18720817565918, "global_step": 199592, "epoch": 2404} {"train_loss": -24.326955795288086, "global_step": 199593, "epoch": 2404} {"train_loss": -24.31577491760254, "global_step": 199594, "epoch": 2404} {"train_loss": -24.293479919433594, "global_step": 199595, "epoch": 2404} {"train_loss": -24.30318260192871, "global_step": 199596, "epoch": 2404} {"train_loss": -24.413299560546875, "global_step": 199597, "epoch": 2404} {"train_loss": -24.291547775268555, "global_step": 199598, "epoch": 2404} {"train_loss": -24.309206008911133, "global_step": 199599, "epoch": 2404} {"train_loss": -24.318105697631836, "global_step": 199600, "epoch": 2404} {"train_loss": -24.039243698120117, "global_step": 199601, "epoch": 2404} {"train_loss": -24.795394897460938, "global_step": 199602, "epoch": 2404} {"train_loss": -24.394866943359375, "global_step": 199603, "epoch": 2404} {"train_loss": -24.549041748046875, "global_step": 199604, "epoch": 2404} {"train_loss": -24.331462860107422, "global_step": 199605, "epoch": 2404} {"train_loss": -24.3963680267334, "global_step": 199606, "epoch": 2404} {"train_loss": -24.72037696838379, "global_step": 199607, "epoch": 2404} {"train_loss": -24.566640853881836, "global_step": 199608, "epoch": 2404} {"train_loss": -24.572547912597656, "global_step": 199609, "epoch": 2404} {"train_loss": -24.088537216186523, "global_step": 199610, "epoch": 2404} {"train_loss": -24.4132137298584, "global_step": 199611, "epoch": 2404} {"train_loss": -24.449382781982422, "global_step": 199612, "epoch": 2404} {"train_loss": -24.589048385620117, "global_step": 199613, "epoch": 2404} {"train_loss": -24.22570037841797, "global_step": 199614, "epoch": 2404, "val_loss": 6532403.0} {"train_loss": -24.138654708862305, "global_step": 199615, "epoch": 2405} {"train_loss": -23.9881591796875, "global_step": 199616, "epoch": 2405} {"train_loss": -24.215147018432617, "global_step": 199617, "epoch": 2405} {"train_loss": -23.98409080505371, "global_step": 199618, "epoch": 2405} {"train_loss": -24.0745906829834, "global_step": 199619, "epoch": 2405} {"train_loss": -24.188413619995117, "global_step": 199620, "epoch": 2405} {"train_loss": -24.014631271362305, "global_step": 199621, "epoch": 2405} {"train_loss": -24.12039566040039, "global_step": 199622, "epoch": 2405} {"train_loss": -23.693164825439453, "global_step": 199623, "epoch": 2405} {"train_loss": -23.799497604370117, "global_step": 199624, "epoch": 2405} {"train_loss": -24.228435516357422, "global_step": 199625, "epoch": 2405} {"train_loss": -24.345998764038086, "global_step": 199626, "epoch": 2405} {"train_loss": -24.105243682861328, "global_step": 199627, "epoch": 2405} {"train_loss": -24.34894371032715, "global_step": 199628, "epoch": 2405} {"train_loss": -24.401412963867188, "global_step": 199629, "epoch": 2405} {"train_loss": -24.77041244506836, "global_step": 199630, "epoch": 2405} {"train_loss": -24.487558364868164, "global_step": 199631, "epoch": 2405} {"train_loss": -24.16042137145996, "global_step": 199632, "epoch": 2405} {"train_loss": -24.472379684448242, "global_step": 199633, "epoch": 2405} {"train_loss": -24.317583084106445, "global_step": 199634, "epoch": 2405} {"train_loss": -24.31959342956543, "global_step": 199635, "epoch": 2405} {"train_loss": -24.06296730041504, "global_step": 199636, "epoch": 2405} {"train_loss": -24.367834091186523, "global_step": 199637, "epoch": 2405} {"train_loss": -24.191984176635742, "global_step": 199638, "epoch": 2405} {"train_loss": -24.045894622802734, "global_step": 199639, "epoch": 2405} {"train_loss": -24.375516891479492, "global_step": 199640, "epoch": 2405} {"train_loss": -24.437265396118164, "global_step": 199641, "epoch": 2405} {"train_loss": -24.217090606689453, "global_step": 199642, "epoch": 2405} {"train_loss": -24.389307022094727, "global_step": 199643, "epoch": 2405} {"train_loss": -23.722719192504883, "global_step": 199644, "epoch": 2405} {"train_loss": -24.4085693359375, "global_step": 199645, "epoch": 2405} {"train_loss": -23.964879989624023, "global_step": 199646, "epoch": 2405} {"train_loss": -24.579858779907227, "global_step": 199647, "epoch": 2405} {"train_loss": -24.011571884155273, "global_step": 199648, "epoch": 2405} {"train_loss": -24.324621200561523, "global_step": 199649, "epoch": 2405} {"train_loss": -23.722400665283203, "global_step": 199650, "epoch": 2405} {"train_loss": -23.822193145751953, "global_step": 199651, "epoch": 2405} {"train_loss": -24.001195907592773, "global_step": 199652, "epoch": 2405} {"train_loss": -24.160703659057617, "global_step": 199653, "epoch": 2405} {"train_loss": -24.318050384521484, "global_step": 199654, "epoch": 2405} {"train_loss": -23.75029182434082, "global_step": 199655, "epoch": 2405} {"train_loss": -24.586530685424805, "global_step": 199656, "epoch": 2405} {"train_loss": -24.20379066467285, "global_step": 199657, "epoch": 2405} {"train_loss": -24.144031524658203, "global_step": 199658, "epoch": 2405} {"train_loss": -24.171218872070312, "global_step": 199659, "epoch": 2405} {"train_loss": -24.012983322143555, "global_step": 199660, "epoch": 2405} {"train_loss": -23.668319702148438, "global_step": 199661, "epoch": 2405} {"train_loss": -24.171173095703125, "global_step": 199662, "epoch": 2405} {"train_loss": -24.44569969177246, "global_step": 199663, "epoch": 2405} {"train_loss": -23.931665420532227, "global_step": 199664, "epoch": 2405} {"train_loss": -24.052244186401367, "global_step": 199665, "epoch": 2405} {"train_loss": -24.25540542602539, "global_step": 199666, "epoch": 2405} {"train_loss": -23.94457244873047, "global_step": 199667, "epoch": 2405} {"train_loss": -24.398313522338867, "global_step": 199668, "epoch": 2405} {"train_loss": -24.090431213378906, "global_step": 199669, "epoch": 2405} {"train_loss": -24.513320922851562, "global_step": 199670, "epoch": 2405} {"train_loss": -24.126895904541016, "global_step": 199671, "epoch": 2405} {"train_loss": -24.190128326416016, "global_step": 199672, "epoch": 2405} {"train_loss": -24.255603790283203, "global_step": 199673, "epoch": 2405} {"train_loss": -23.907146453857422, "global_step": 199674, "epoch": 2405} {"train_loss": -23.884868621826172, "global_step": 199675, "epoch": 2405} {"train_loss": -24.298866271972656, "global_step": 199676, "epoch": 2405} {"train_loss": -24.352882385253906, "global_step": 199677, "epoch": 2405} {"train_loss": -24.442642211914062, "global_step": 199678, "epoch": 2405} {"train_loss": -23.946014404296875, "global_step": 199679, "epoch": 2405} {"train_loss": -24.29427146911621, "global_step": 199680, "epoch": 2405} {"train_loss": -24.43744468688965, "global_step": 199681, "epoch": 2405} {"train_loss": -24.248580932617188, "global_step": 199682, "epoch": 2405} {"train_loss": -24.205591201782227, "global_step": 199683, "epoch": 2405} {"train_loss": -24.547311782836914, "global_step": 199684, "epoch": 2405} {"train_loss": -24.457300186157227, "global_step": 199685, "epoch": 2405} {"train_loss": -24.244592666625977, "global_step": 199686, "epoch": 2405} {"train_loss": -24.61284065246582, "global_step": 199687, "epoch": 2405} {"train_loss": -24.096364974975586, "global_step": 199688, "epoch": 2405} {"train_loss": -24.297687530517578, "global_step": 199689, "epoch": 2405} {"train_loss": -24.494659423828125, "global_step": 199690, "epoch": 2405} {"train_loss": -24.464811325073242, "global_step": 199691, "epoch": 2405} {"train_loss": -24.245187759399414, "global_step": 199692, "epoch": 2405} {"train_loss": -24.325489044189453, "global_step": 199693, "epoch": 2405} {"train_loss": -24.63779640197754, "global_step": 199694, "epoch": 2405} {"train_loss": -24.092432022094727, "global_step": 199695, "epoch": 2405} {"train_loss": -24.353984832763672, "global_step": 199696, "epoch": 2405} {"train_loss": -24.187641649361115, "global_step": 199697, "epoch": 2405, "val_loss": 6582512.0} {"train_loss": -21.564651489257812, "global_step": 199698, "epoch": 2406} {"train_loss": -21.93380355834961, "global_step": 199699, "epoch": 2406} {"train_loss": -23.124265670776367, "global_step": 199700, "epoch": 2406} {"train_loss": -22.857913970947266, "global_step": 199701, "epoch": 2406} {"train_loss": -23.202552795410156, "global_step": 199702, "epoch": 2406} {"train_loss": -23.20754051208496, "global_step": 199703, "epoch": 2406} {"train_loss": -23.617141723632812, "global_step": 199704, "epoch": 2406} {"train_loss": -23.553180694580078, "global_step": 199705, "epoch": 2406} {"train_loss": -23.703821182250977, "global_step": 199706, "epoch": 2406} {"train_loss": -23.51740074157715, "global_step": 199707, "epoch": 2406} {"train_loss": -23.2828369140625, "global_step": 199708, "epoch": 2406} {"train_loss": -23.76613998413086, "global_step": 199709, "epoch": 2406} {"train_loss": -23.740638732910156, "global_step": 199710, "epoch": 2406} {"train_loss": -23.56233024597168, "global_step": 199711, "epoch": 2406} {"train_loss": -23.767927169799805, "global_step": 199712, "epoch": 2406} {"train_loss": -23.644317626953125, "global_step": 199713, "epoch": 2406} {"train_loss": -23.611337661743164, "global_step": 199714, "epoch": 2406} {"train_loss": -23.943967819213867, "global_step": 199715, "epoch": 2406} {"train_loss": -23.59663963317871, "global_step": 199716, "epoch": 2406} {"train_loss": -23.48914909362793, "global_step": 199717, "epoch": 2406} {"train_loss": -23.763954162597656, "global_step": 199718, "epoch": 2406} {"train_loss": -23.911582946777344, "global_step": 199719, "epoch": 2406} {"train_loss": -23.51386833190918, "global_step": 199720, "epoch": 2406} {"train_loss": -23.896377563476562, "global_step": 199721, "epoch": 2406} {"train_loss": -23.884994506835938, "global_step": 199722, "epoch": 2406} {"train_loss": -24.2352294921875, "global_step": 199723, "epoch": 2406} {"train_loss": -24.458255767822266, "global_step": 199724, "epoch": 2406} {"train_loss": -24.044248580932617, "global_step": 199725, "epoch": 2406} {"train_loss": -24.25355339050293, "global_step": 199726, "epoch": 2406} {"train_loss": -24.271442413330078, "global_step": 199727, "epoch": 2406} {"train_loss": -23.95775032043457, "global_step": 199728, "epoch": 2406} {"train_loss": -24.45949363708496, "global_step": 199729, "epoch": 2406} {"train_loss": -24.43366050720215, "global_step": 199730, "epoch": 2406} {"train_loss": -24.410856246948242, "global_step": 199731, "epoch": 2406} {"train_loss": -24.642030715942383, "global_step": 199732, "epoch": 2406} {"train_loss": -24.122055053710938, "global_step": 199733, "epoch": 2406} {"train_loss": -24.122634887695312, "global_step": 199734, "epoch": 2406} {"train_loss": -24.5279541015625, "global_step": 199735, "epoch": 2406} {"train_loss": -23.92120361328125, "global_step": 199736, "epoch": 2406} {"train_loss": -24.075809478759766, "global_step": 199737, "epoch": 2406} {"train_loss": -24.3935489654541, "global_step": 199738, "epoch": 2406} {"train_loss": -24.591733932495117, "global_step": 199739, "epoch": 2406} {"train_loss": -24.195341110229492, "global_step": 199740, "epoch": 2406} {"train_loss": -24.26993179321289, "global_step": 199741, "epoch": 2406} {"train_loss": -24.368032455444336, "global_step": 199742, "epoch": 2406} {"train_loss": -24.312559127807617, "global_step": 199743, "epoch": 2406} {"train_loss": -24.494688034057617, "global_step": 199744, "epoch": 2406} {"train_loss": -24.48206901550293, "global_step": 199745, "epoch": 2406} {"train_loss": -24.513473510742188, "global_step": 199746, "epoch": 2406} {"train_loss": -24.416397094726562, "global_step": 199747, "epoch": 2406} {"train_loss": -24.390995025634766, "global_step": 199748, "epoch": 2406} {"train_loss": -24.31548309326172, "global_step": 199749, "epoch": 2406} {"train_loss": -24.40497398376465, "global_step": 199750, "epoch": 2406} {"train_loss": -23.9805965423584, "global_step": 199751, "epoch": 2406} {"train_loss": -24.25452423095703, "global_step": 199752, "epoch": 2406} {"train_loss": -24.265958786010742, "global_step": 199753, "epoch": 2406} {"train_loss": -24.402524948120117, "global_step": 199754, "epoch": 2406} {"train_loss": -24.38022232055664, "global_step": 199755, "epoch": 2406} {"train_loss": -24.194656372070312, "global_step": 199756, "epoch": 2406} {"train_loss": -24.092788696289062, "global_step": 199757, "epoch": 2406} {"train_loss": -24.166292190551758, "global_step": 199758, "epoch": 2406} {"train_loss": -23.984464645385742, "global_step": 199759, "epoch": 2406} {"train_loss": -24.486425399780273, "global_step": 199760, "epoch": 2406} {"train_loss": -24.016632080078125, "global_step": 199761, "epoch": 2406} {"train_loss": -24.34718894958496, "global_step": 199762, "epoch": 2406} {"train_loss": -24.1473388671875, "global_step": 199763, "epoch": 2406} {"train_loss": -24.2626953125, "global_step": 199764, "epoch": 2406} {"train_loss": -24.75860023498535, "global_step": 199765, "epoch": 2406} {"train_loss": -24.330101013183594, "global_step": 199766, "epoch": 2406} {"train_loss": -23.932004928588867, "global_step": 199767, "epoch": 2406} {"train_loss": -24.41013526916504, "global_step": 199768, "epoch": 2406} {"train_loss": -24.072046279907227, "global_step": 199769, "epoch": 2406} {"train_loss": -24.294849395751953, "global_step": 199770, "epoch": 2406} {"train_loss": -24.257658004760742, "global_step": 199771, "epoch": 2406} {"train_loss": -24.322145462036133, "global_step": 199772, "epoch": 2406} {"train_loss": -24.2674503326416, "global_step": 199773, "epoch": 2406} {"train_loss": -23.86884880065918, "global_step": 199774, "epoch": 2406} {"train_loss": -24.167449951171875, "global_step": 199775, "epoch": 2406} {"train_loss": -24.087085723876953, "global_step": 199776, "epoch": 2406} {"train_loss": -24.25941276550293, "global_step": 199777, "epoch": 2406} {"train_loss": -23.97671127319336, "global_step": 199778, "epoch": 2406} {"train_loss": -24.049585342407227, "global_step": 199779, "epoch": 2406} {"train_loss": -24.022183222943042, "global_step": 199780, "epoch": 2406, "val_loss": 6603861.0} {"train_loss": -24.25958824157715, "global_step": 199781, "epoch": 2407} {"train_loss": -23.27960968017578, "global_step": 199782, "epoch": 2407} {"train_loss": -23.6254940032959, "global_step": 199783, "epoch": 2407} {"train_loss": -23.512556076049805, "global_step": 199784, "epoch": 2407} {"train_loss": -23.006635665893555, "global_step": 199785, "epoch": 2407} {"train_loss": -23.805377960205078, "global_step": 199786, "epoch": 2407} {"train_loss": -23.733631134033203, "global_step": 199787, "epoch": 2407} {"train_loss": -23.781789779663086, "global_step": 199788, "epoch": 2407} {"train_loss": -23.54119300842285, "global_step": 199789, "epoch": 2407} {"train_loss": -24.024351119995117, "global_step": 199790, "epoch": 2407} {"train_loss": -23.690570831298828, "global_step": 199791, "epoch": 2407} {"train_loss": -23.748830795288086, "global_step": 199792, "epoch": 2407} {"train_loss": -23.9326229095459, "global_step": 199793, "epoch": 2407} {"train_loss": -23.693023681640625, "global_step": 199794, "epoch": 2407} {"train_loss": -23.744548797607422, "global_step": 199795, "epoch": 2407} {"train_loss": -23.95536231994629, "global_step": 199796, "epoch": 2407} {"train_loss": -23.74007225036621, "global_step": 199797, "epoch": 2407} {"train_loss": -24.018417358398438, "global_step": 199798, "epoch": 2407} {"train_loss": -23.622238159179688, "global_step": 199799, "epoch": 2407} {"train_loss": -24.060117721557617, "global_step": 199800, "epoch": 2407} {"train_loss": -24.098316192626953, "global_step": 199801, "epoch": 2407} {"train_loss": -23.676443099975586, "global_step": 199802, "epoch": 2407} {"train_loss": -24.21550750732422, "global_step": 199803, "epoch": 2407} {"train_loss": -23.87335205078125, "global_step": 199804, "epoch": 2407} {"train_loss": -24.151840209960938, "global_step": 199805, "epoch": 2407} {"train_loss": -24.09773063659668, "global_step": 199806, "epoch": 2407} {"train_loss": -24.415992736816406, "global_step": 199807, "epoch": 2407} {"train_loss": -24.36778450012207, "global_step": 199808, "epoch": 2407} {"train_loss": -23.77621841430664, "global_step": 199809, "epoch": 2407} {"train_loss": -24.012662887573242, "global_step": 199810, "epoch": 2407} {"train_loss": -24.360010147094727, "global_step": 199811, "epoch": 2407} {"train_loss": -23.837844848632812, "global_step": 199812, "epoch": 2407} {"train_loss": -24.355363845825195, "global_step": 199813, "epoch": 2407} {"train_loss": -24.014387130737305, "global_step": 199814, "epoch": 2407} {"train_loss": -24.026559829711914, "global_step": 199815, "epoch": 2407} {"train_loss": -24.02983283996582, "global_step": 199816, "epoch": 2407} {"train_loss": -24.45477867126465, "global_step": 199817, "epoch": 2407} {"train_loss": -24.337879180908203, "global_step": 199818, "epoch": 2407} {"train_loss": -24.40663719177246, "global_step": 199819, "epoch": 2407} {"train_loss": -24.176849365234375, "global_step": 199820, "epoch": 2407} {"train_loss": -24.220144271850586, "global_step": 199821, "epoch": 2407} {"train_loss": -24.511693954467773, "global_step": 199822, "epoch": 2407} {"train_loss": -24.303075790405273, "global_step": 199823, "epoch": 2407} {"train_loss": -23.964759826660156, "global_step": 199824, "epoch": 2407} {"train_loss": -24.225692749023438, "global_step": 199825, "epoch": 2407} {"train_loss": -24.43062400817871, "global_step": 199826, "epoch": 2407} {"train_loss": -24.479101181030273, "global_step": 199827, "epoch": 2407} {"train_loss": -24.190622329711914, "global_step": 199828, "epoch": 2407} {"train_loss": -24.378042221069336, "global_step": 199829, "epoch": 2407} {"train_loss": -24.186784744262695, "global_step": 199830, "epoch": 2407} {"train_loss": -24.394092559814453, "global_step": 199831, "epoch": 2407} {"train_loss": -24.452186584472656, "global_step": 199832, "epoch": 2407} {"train_loss": -24.12790870666504, "global_step": 199833, "epoch": 2407} {"train_loss": -23.719106674194336, "global_step": 199834, "epoch": 2407} {"train_loss": -23.70188331604004, "global_step": 199835, "epoch": 2407} {"train_loss": -24.39127540588379, "global_step": 199836, "epoch": 2407} {"train_loss": -24.317930221557617, "global_step": 199837, "epoch": 2407} {"train_loss": -23.784337997436523, "global_step": 199838, "epoch": 2407} {"train_loss": -24.21286964416504, "global_step": 199839, "epoch": 2407} {"train_loss": -23.99650001525879, "global_step": 199840, "epoch": 2407} {"train_loss": -24.589847564697266, "global_step": 199841, "epoch": 2407} {"train_loss": -24.154651641845703, "global_step": 199842, "epoch": 2407} {"train_loss": -23.934551239013672, "global_step": 199843, "epoch": 2407} {"train_loss": -24.399490356445312, "global_step": 199844, "epoch": 2407} {"train_loss": -24.59836769104004, "global_step": 199845, "epoch": 2407} {"train_loss": -23.871490478515625, "global_step": 199846, "epoch": 2407} {"train_loss": -24.196264266967773, "global_step": 199847, "epoch": 2407} {"train_loss": -24.63418197631836, "global_step": 199848, "epoch": 2407} {"train_loss": -24.461679458618164, "global_step": 199849, "epoch": 2407} {"train_loss": -24.13831901550293, "global_step": 199850, "epoch": 2407} {"train_loss": -24.039653778076172, "global_step": 199851, "epoch": 2407} {"train_loss": -24.826181411743164, "global_step": 199852, "epoch": 2407} {"train_loss": -24.286746978759766, "global_step": 199853, "epoch": 2407} {"train_loss": -24.6408634185791, "global_step": 199854, "epoch": 2407} {"train_loss": -24.662399291992188, "global_step": 199855, "epoch": 2407} {"train_loss": -24.542028427124023, "global_step": 199856, "epoch": 2407} {"train_loss": -24.347902297973633, "global_step": 199857, "epoch": 2407} {"train_loss": -24.498315811157227, "global_step": 199858, "epoch": 2407} {"train_loss": -24.422964096069336, "global_step": 199859, "epoch": 2407} {"train_loss": -24.48166847229004, "global_step": 199860, "epoch": 2407} {"train_loss": -24.427337646484375, "global_step": 199861, "epoch": 2407} {"train_loss": -24.825077056884766, "global_step": 199862, "epoch": 2407} {"train_loss": -24.1309757002865, "global_step": 199863, "epoch": 2407, "val_loss": 6498167.0} {"train_loss": -23.869152069091797, "global_step": 199864, "epoch": 2408} {"train_loss": -23.84228515625, "global_step": 199865, "epoch": 2408} {"train_loss": -24.136383056640625, "global_step": 199866, "epoch": 2408} {"train_loss": -23.44346046447754, "global_step": 199867, "epoch": 2408} {"train_loss": -23.728975296020508, "global_step": 199868, "epoch": 2408} {"train_loss": -24.141695022583008, "global_step": 199869, "epoch": 2408} {"train_loss": -23.881101608276367, "global_step": 199870, "epoch": 2408} {"train_loss": -23.894006729125977, "global_step": 199871, "epoch": 2408} {"train_loss": -24.15517234802246, "global_step": 199872, "epoch": 2408} {"train_loss": -23.94575309753418, "global_step": 199873, "epoch": 2408} {"train_loss": -24.19386100769043, "global_step": 199874, "epoch": 2408} {"train_loss": -24.259368896484375, "global_step": 199875, "epoch": 2408} {"train_loss": -23.950374603271484, "global_step": 199876, "epoch": 2408} {"train_loss": -24.268415451049805, "global_step": 199877, "epoch": 2408} {"train_loss": -23.938138961791992, "global_step": 199878, "epoch": 2408} {"train_loss": -24.169641494750977, "global_step": 199879, "epoch": 2408} {"train_loss": -23.887731552124023, "global_step": 199880, "epoch": 2408} {"train_loss": -24.153961181640625, "global_step": 199881, "epoch": 2408} {"train_loss": -24.43562126159668, "global_step": 199882, "epoch": 2408} {"train_loss": -23.927343368530273, "global_step": 199883, "epoch": 2408} {"train_loss": -24.10744857788086, "global_step": 199884, "epoch": 2408} {"train_loss": -24.37434196472168, "global_step": 199885, "epoch": 2408} {"train_loss": -24.31928253173828, "global_step": 199886, "epoch": 2408} {"train_loss": -24.325037002563477, "global_step": 199887, "epoch": 2408} {"train_loss": -24.198484420776367, "global_step": 199888, "epoch": 2408} {"train_loss": -24.01470947265625, "global_step": 199889, "epoch": 2408} {"train_loss": -23.835094451904297, "global_step": 199890, "epoch": 2408} {"train_loss": -24.462987899780273, "global_step": 199891, "epoch": 2408} {"train_loss": -24.3352108001709, "global_step": 199892, "epoch": 2408} {"train_loss": -24.50295066833496, "global_step": 199893, "epoch": 2408} {"train_loss": -24.125560760498047, "global_step": 199894, "epoch": 2408} {"train_loss": -24.521255493164062, "global_step": 199895, "epoch": 2408} {"train_loss": -24.348718643188477, "global_step": 199896, "epoch": 2408} {"train_loss": -24.18171501159668, "global_step": 199897, "epoch": 2408} {"train_loss": -24.461593627929688, "global_step": 199898, "epoch": 2408} {"train_loss": -24.33876609802246, "global_step": 199899, "epoch": 2408} {"train_loss": -24.51215171813965, "global_step": 199900, "epoch": 2408} {"train_loss": -24.403438568115234, "global_step": 199901, "epoch": 2408} {"train_loss": -24.361764907836914, "global_step": 199902, "epoch": 2408} {"train_loss": -24.24920082092285, "global_step": 199903, "epoch": 2408} {"train_loss": -24.396432876586914, "global_step": 199904, "epoch": 2408} {"train_loss": -24.2188663482666, "global_step": 199905, "epoch": 2408} {"train_loss": -24.267894744873047, "global_step": 199906, "epoch": 2408} {"train_loss": -24.421525955200195, "global_step": 199907, "epoch": 2408} {"train_loss": -24.072248458862305, "global_step": 199908, "epoch": 2408} {"train_loss": -24.148839950561523, "global_step": 199909, "epoch": 2408} {"train_loss": -24.306720733642578, "global_step": 199910, "epoch": 2408} {"train_loss": -24.54401206970215, "global_step": 199911, "epoch": 2408} {"train_loss": -23.893911361694336, "global_step": 199912, "epoch": 2408} {"train_loss": -24.31269645690918, "global_step": 199913, "epoch": 2408} {"train_loss": -24.373126983642578, "global_step": 199914, "epoch": 2408} {"train_loss": -23.9427547454834, "global_step": 199915, "epoch": 2408} {"train_loss": -24.290233612060547, "global_step": 199916, "epoch": 2408} {"train_loss": -24.69577407836914, "global_step": 199917, "epoch": 2408} {"train_loss": -24.51307487487793, "global_step": 199918, "epoch": 2408} {"train_loss": -24.28584861755371, "global_step": 199919, "epoch": 2408} {"train_loss": -24.22176170349121, "global_step": 199920, "epoch": 2408} {"train_loss": -24.093669891357422, "global_step": 199921, "epoch": 2408} {"train_loss": -24.41924285888672, "global_step": 199922, "epoch": 2408} {"train_loss": -24.28352165222168, "global_step": 199923, "epoch": 2408} {"train_loss": -24.758895874023438, "global_step": 199924, "epoch": 2408} {"train_loss": -24.29224967956543, "global_step": 199925, "epoch": 2408} {"train_loss": -23.98834800720215, "global_step": 199926, "epoch": 2408} {"train_loss": -24.278249740600586, "global_step": 199927, "epoch": 2408} {"train_loss": -24.15138816833496, "global_step": 199928, "epoch": 2408} {"train_loss": -24.649906158447266, "global_step": 199929, "epoch": 2408} {"train_loss": -24.05830955505371, "global_step": 199930, "epoch": 2408} {"train_loss": -24.18857765197754, "global_step": 199931, "epoch": 2408} {"train_loss": -24.259002685546875, "global_step": 199932, "epoch": 2408} {"train_loss": -24.056241989135742, "global_step": 199933, "epoch": 2408} {"train_loss": -24.190235137939453, "global_step": 199934, "epoch": 2408} {"train_loss": -24.066064834594727, "global_step": 199935, "epoch": 2408} {"train_loss": -24.592029571533203, "global_step": 199936, "epoch": 2408} {"train_loss": -23.995811462402344, "global_step": 199937, "epoch": 2408} {"train_loss": -24.56218147277832, "global_step": 199938, "epoch": 2408} {"train_loss": -24.826526641845703, "global_step": 199939, "epoch": 2408} {"train_loss": -24.296323776245117, "global_step": 199940, "epoch": 2408} {"train_loss": -24.387248992919922, "global_step": 199941, "epoch": 2408} {"train_loss": -24.117162704467773, "global_step": 199942, "epoch": 2408} {"train_loss": -23.897994995117188, "global_step": 199943, "epoch": 2408} {"train_loss": -24.352811813354492, "global_step": 199944, "epoch": 2408} {"train_loss": -24.11764907836914, "global_step": 199945, "epoch": 2408} {"train_loss": -24.207470032105963, "global_step": 199946, "epoch": 2408, "val_loss": 6549682.5} {"train_loss": -24.158872604370117, "global_step": 199947, "epoch": 2409} {"train_loss": -24.424880981445312, "global_step": 199948, "epoch": 2409} {"train_loss": -23.8057918548584, "global_step": 199949, "epoch": 2409} {"train_loss": -23.500690460205078, "global_step": 199950, "epoch": 2409} {"train_loss": -24.219680786132812, "global_step": 199951, "epoch": 2409} {"train_loss": -24.132272720336914, "global_step": 199952, "epoch": 2409} {"train_loss": -23.49542808532715, "global_step": 199953, "epoch": 2409} {"train_loss": -23.927005767822266, "global_step": 199954, "epoch": 2409} {"train_loss": -24.058319091796875, "global_step": 199955, "epoch": 2409} {"train_loss": -23.697853088378906, "global_step": 199956, "epoch": 2409} {"train_loss": -24.217451095581055, "global_step": 199957, "epoch": 2409} {"train_loss": -23.994556427001953, "global_step": 199958, "epoch": 2409} {"train_loss": -23.951566696166992, "global_step": 199959, "epoch": 2409} {"train_loss": -24.254247665405273, "global_step": 199960, "epoch": 2409} {"train_loss": -24.17947769165039, "global_step": 199961, "epoch": 2409} {"train_loss": -24.255685806274414, "global_step": 199962, "epoch": 2409} {"train_loss": -23.961606979370117, "global_step": 199963, "epoch": 2409} {"train_loss": -24.1534366607666, "global_step": 199964, "epoch": 2409} {"train_loss": -24.202417373657227, "global_step": 199965, "epoch": 2409} {"train_loss": -24.215845108032227, "global_step": 199966, "epoch": 2409} {"train_loss": -24.20902442932129, "global_step": 199967, "epoch": 2409} {"train_loss": -24.10309410095215, "global_step": 199968, "epoch": 2409} {"train_loss": -24.443811416625977, "global_step": 199969, "epoch": 2409} {"train_loss": -24.18140411376953, "global_step": 199970, "epoch": 2409} {"train_loss": -24.075746536254883, "global_step": 199971, "epoch": 2409} {"train_loss": -24.102752685546875, "global_step": 199972, "epoch": 2409} {"train_loss": -24.3371524810791, "global_step": 199973, "epoch": 2409} {"train_loss": -24.348892211914062, "global_step": 199974, "epoch": 2409} {"train_loss": -24.36858558654785, "global_step": 199975, "epoch": 2409} {"train_loss": -24.202415466308594, "global_step": 199976, "epoch": 2409} {"train_loss": -24.51243782043457, "global_step": 199977, "epoch": 2409} {"train_loss": -23.765254974365234, "global_step": 199978, "epoch": 2409} {"train_loss": -24.703136444091797, "global_step": 199979, "epoch": 2409} {"train_loss": -24.306562423706055, "global_step": 199980, "epoch": 2409} {"train_loss": -24.085302352905273, "global_step": 199981, "epoch": 2409} {"train_loss": -24.257007598876953, "global_step": 199982, "epoch": 2409} {"train_loss": -24.527170181274414, "global_step": 199983, "epoch": 2409} {"train_loss": -23.994564056396484, "global_step": 199984, "epoch": 2409} {"train_loss": -24.07175636291504, "global_step": 199985, "epoch": 2409} {"train_loss": -24.126174926757812, "global_step": 199986, "epoch": 2409} {"train_loss": -24.614303588867188, "global_step": 199987, "epoch": 2409} {"train_loss": -24.114700317382812, "global_step": 199988, "epoch": 2409} {"train_loss": -24.125463485717773, "global_step": 199989, "epoch": 2409} {"train_loss": -24.235734939575195, "global_step": 199990, "epoch": 2409} {"train_loss": -24.500511169433594, "global_step": 199991, "epoch": 2409} {"train_loss": -24.258665084838867, "global_step": 199992, "epoch": 2409} {"train_loss": -24.38157081604004, "global_step": 199993, "epoch": 2409} {"train_loss": -24.331859588623047, "global_step": 199994, "epoch": 2409} {"train_loss": -24.40989112854004, "global_step": 199995, "epoch": 2409} {"train_loss": -24.34842872619629, "global_step": 199996, "epoch": 2409} {"train_loss": -24.02791404724121, "global_step": 199997, "epoch": 2409} {"train_loss": -23.92307472229004, "global_step": 199998, "epoch": 2409} {"train_loss": -24.199420928955078, "global_step": 199999, "epoch": 2409} {"train_loss": -23.948949813842773, "global_step": 200000, "epoch": 2409} {"train_loss": -23.912378311157227, "global_step": 200001, "epoch": 2409} {"train_loss": -23.862173080444336, "global_step": 200002, "epoch": 2409} {"train_loss": -23.962080001831055, "global_step": 200003, "epoch": 2409} {"train_loss": -23.913774490356445, "global_step": 200004, "epoch": 2409} {"train_loss": -24.115642547607422, "global_step": 200005, "epoch": 2409} {"train_loss": -24.066862106323242, "global_step": 200006, "epoch": 2409} {"train_loss": -23.843387603759766, "global_step": 200007, "epoch": 2409} {"train_loss": -24.314756393432617, "global_step": 200008, "epoch": 2409} {"train_loss": -24.164472579956055, "global_step": 200009, "epoch": 2409} {"train_loss": -24.085519790649414, "global_step": 200010, "epoch": 2409} {"train_loss": -24.225540161132812, "global_step": 200011, "epoch": 2409} {"train_loss": -24.130779266357422, "global_step": 200012, "epoch": 2409} {"train_loss": -24.342853546142578, "global_step": 200013, "epoch": 2409} {"train_loss": -24.251245498657227, "global_step": 200014, "epoch": 2409} {"train_loss": -23.986379623413086, "global_step": 200015, "epoch": 2409} {"train_loss": -24.241230010986328, "global_step": 200016, "epoch": 2409} {"train_loss": -23.98236083984375, "global_step": 200017, "epoch": 2409} {"train_loss": -24.060943603515625, "global_step": 200018, "epoch": 2409} {"train_loss": -24.287012100219727, "global_step": 200019, "epoch": 2409} {"train_loss": -24.328449249267578, "global_step": 200020, "epoch": 2409} {"train_loss": -24.162683486938477, "global_step": 200021, "epoch": 2409} {"train_loss": -24.16156005859375, "global_step": 200022, "epoch": 2409} {"train_loss": -24.22144317626953, "global_step": 200023, "epoch": 2409} {"train_loss": -24.25697898864746, "global_step": 200024, "epoch": 2409} {"train_loss": -24.22637367248535, "global_step": 200025, "epoch": 2409} {"train_loss": -24.47542381286621, "global_step": 200026, "epoch": 2409} {"train_loss": -24.423730850219727, "global_step": 200027, "epoch": 2409} {"train_loss": -23.96280288696289, "global_step": 200028, "epoch": 2409} {"train_loss": -24.15264274413327, "global_step": 200029, "epoch": 2409, "val_loss": 6577420.0} {"train_loss": -23.643625259399414, "global_step": 200030, "epoch": 2410} {"train_loss": -23.585142135620117, "global_step": 200031, "epoch": 2410} {"train_loss": -23.73805809020996, "global_step": 200032, "epoch": 2410} {"train_loss": -23.935773849487305, "global_step": 200033, "epoch": 2410} {"train_loss": -23.56182861328125, "global_step": 200034, "epoch": 2410} {"train_loss": -24.231260299682617, "global_step": 200035, "epoch": 2410} {"train_loss": -24.216854095458984, "global_step": 200036, "epoch": 2410} {"train_loss": -24.00245475769043, "global_step": 200037, "epoch": 2410} {"train_loss": -24.001428604125977, "global_step": 200038, "epoch": 2410} {"train_loss": -23.887235641479492, "global_step": 200039, "epoch": 2410} {"train_loss": -24.269893646240234, "global_step": 200040, "epoch": 2410} {"train_loss": -23.592208862304688, "global_step": 200041, "epoch": 2410} {"train_loss": -24.26875114440918, "global_step": 200042, "epoch": 2410} {"train_loss": -23.977771759033203, "global_step": 200043, "epoch": 2410} {"train_loss": -23.99761390686035, "global_step": 200044, "epoch": 2410} {"train_loss": -23.7496395111084, "global_step": 200045, "epoch": 2410} {"train_loss": -24.09873390197754, "global_step": 200046, "epoch": 2410} {"train_loss": -24.014280319213867, "global_step": 200047, "epoch": 2410} {"train_loss": -24.135639190673828, "global_step": 200048, "epoch": 2410} {"train_loss": -24.048553466796875, "global_step": 200049, "epoch": 2410} {"train_loss": -23.957136154174805, "global_step": 200050, "epoch": 2410} {"train_loss": -23.857404708862305, "global_step": 200051, "epoch": 2410} {"train_loss": -23.631311416625977, "global_step": 200052, "epoch": 2410} {"train_loss": -24.046918869018555, "global_step": 200053, "epoch": 2410} {"train_loss": -24.427932739257812, "global_step": 200054, "epoch": 2410} {"train_loss": -24.067306518554688, "global_step": 200055, "epoch": 2410} {"train_loss": -24.132797241210938, "global_step": 200056, "epoch": 2410} {"train_loss": -23.934310913085938, "global_step": 200057, "epoch": 2410} {"train_loss": -24.328004837036133, "global_step": 200058, "epoch": 2410} {"train_loss": -23.688613891601562, "global_step": 200059, "epoch": 2410} {"train_loss": -23.913347244262695, "global_step": 200060, "epoch": 2410} {"train_loss": -24.125720977783203, "global_step": 200061, "epoch": 2410} {"train_loss": -24.269397735595703, "global_step": 200062, "epoch": 2410} {"train_loss": -24.29256248474121, "global_step": 200063, "epoch": 2410} {"train_loss": -24.408512115478516, "global_step": 200064, "epoch": 2410} {"train_loss": -24.08325958251953, "global_step": 200065, "epoch": 2410} {"train_loss": -24.022823333740234, "global_step": 200066, "epoch": 2410} {"train_loss": -24.146015167236328, "global_step": 200067, "epoch": 2410} {"train_loss": -23.99485206604004, "global_step": 200068, "epoch": 2410} {"train_loss": -24.167631149291992, "global_step": 200069, "epoch": 2410} {"train_loss": -24.356460571289062, "global_step": 200070, "epoch": 2410} {"train_loss": -24.412841796875, "global_step": 200071, "epoch": 2410} {"train_loss": -24.280597686767578, "global_step": 200072, "epoch": 2410} {"train_loss": -24.29183006286621, "global_step": 200073, "epoch": 2410} {"train_loss": -24.538043975830078, "global_step": 200074, "epoch": 2410} {"train_loss": -24.221668243408203, "global_step": 200075, "epoch": 2410} {"train_loss": -24.015060424804688, "global_step": 200076, "epoch": 2410} {"train_loss": -24.190292358398438, "global_step": 200077, "epoch": 2410} {"train_loss": -24.286258697509766, "global_step": 200078, "epoch": 2410} {"train_loss": -24.202489852905273, "global_step": 200079, "epoch": 2410} {"train_loss": -24.81146812438965, "global_step": 200080, "epoch": 2410} {"train_loss": -23.850624084472656, "global_step": 200081, "epoch": 2410} {"train_loss": -24.289236068725586, "global_step": 200082, "epoch": 2410} {"train_loss": -24.08744239807129, "global_step": 200083, "epoch": 2410} {"train_loss": -25.3138484954834, "global_step": 200084, "epoch": 2410} {"train_loss": -24.11713981628418, "global_step": 200085, "epoch": 2410} {"train_loss": -24.61971092224121, "global_step": 200086, "epoch": 2410} {"train_loss": -23.950977325439453, "global_step": 200087, "epoch": 2410} {"train_loss": -24.6094970703125, "global_step": 200088, "epoch": 2410} {"train_loss": -24.460803985595703, "global_step": 200089, "epoch": 2410} {"train_loss": -24.140104293823242, "global_step": 200090, "epoch": 2410} {"train_loss": -23.994924545288086, "global_step": 200091, "epoch": 2410} {"train_loss": -23.724401473999023, "global_step": 200092, "epoch": 2410} {"train_loss": -24.25296974182129, "global_step": 200093, "epoch": 2410} {"train_loss": -24.16298484802246, "global_step": 200094, "epoch": 2410} {"train_loss": -24.093427658081055, "global_step": 200095, "epoch": 2410} {"train_loss": -23.713415145874023, "global_step": 200096, "epoch": 2410} {"train_loss": -24.272010803222656, "global_step": 200097, "epoch": 2410} {"train_loss": -24.09116554260254, "global_step": 200098, "epoch": 2410} {"train_loss": -24.171051025390625, "global_step": 200099, "epoch": 2410} {"train_loss": -24.388872146606445, "global_step": 200100, "epoch": 2410} {"train_loss": -24.214962005615234, "global_step": 200101, "epoch": 2410} {"train_loss": -24.147218704223633, "global_step": 200102, "epoch": 2410} {"train_loss": -24.528175354003906, "global_step": 200103, "epoch": 2410} {"train_loss": -24.398229598999023, "global_step": 200104, "epoch": 2410} {"train_loss": -24.12497901916504, "global_step": 200105, "epoch": 2410} {"train_loss": -24.340251922607422, "global_step": 200106, "epoch": 2410} {"train_loss": -24.123092651367188, "global_step": 200107, "epoch": 2410} {"train_loss": -24.146167755126953, "global_step": 200108, "epoch": 2410} {"train_loss": -23.72715187072754, "global_step": 200109, "epoch": 2410} {"train_loss": -23.699176788330078, "global_step": 200110, "epoch": 2410} {"train_loss": -24.070301055908203, "global_step": 200111, "epoch": 2410} {"train_loss": -24.10621482205678, "global_step": 200112, "epoch": 2410, "val_loss": 6592503.0} {"train_loss": -23.577816009521484, "global_step": 200113, "epoch": 2411} {"train_loss": -23.996170043945312, "global_step": 200114, "epoch": 2411} {"train_loss": -23.885690689086914, "global_step": 200115, "epoch": 2411} {"train_loss": -23.805007934570312, "global_step": 200116, "epoch": 2411} {"train_loss": -23.293725967407227, "global_step": 200117, "epoch": 2411} {"train_loss": -23.776744842529297, "global_step": 200118, "epoch": 2411} {"train_loss": -23.381118774414062, "global_step": 200119, "epoch": 2411} {"train_loss": -23.22329330444336, "global_step": 200120, "epoch": 2411} {"train_loss": -23.685901641845703, "global_step": 200121, "epoch": 2411} {"train_loss": -23.646207809448242, "global_step": 200122, "epoch": 2411} {"train_loss": -23.95355796813965, "global_step": 200123, "epoch": 2411} {"train_loss": -23.53539276123047, "global_step": 200124, "epoch": 2411} {"train_loss": -23.849496841430664, "global_step": 200125, "epoch": 2411} {"train_loss": -23.84364128112793, "global_step": 200126, "epoch": 2411} {"train_loss": -23.40732192993164, "global_step": 200127, "epoch": 2411} {"train_loss": -23.66817283630371, "global_step": 200128, "epoch": 2411} {"train_loss": -23.99391746520996, "global_step": 200129, "epoch": 2411} {"train_loss": -23.79912757873535, "global_step": 200130, "epoch": 2411} {"train_loss": -23.5134220123291, "global_step": 200131, "epoch": 2411} {"train_loss": -23.552295684814453, "global_step": 200132, "epoch": 2411} {"train_loss": -24.129274368286133, "global_step": 200133, "epoch": 2411} {"train_loss": -23.92074203491211, "global_step": 200134, "epoch": 2411} {"train_loss": -24.113454818725586, "global_step": 200135, "epoch": 2411} {"train_loss": -23.891138076782227, "global_step": 200136, "epoch": 2411} {"train_loss": -23.55030632019043, "global_step": 200137, "epoch": 2411} {"train_loss": -24.510244369506836, "global_step": 200138, "epoch": 2411} {"train_loss": -23.69370460510254, "global_step": 200139, "epoch": 2411} {"train_loss": -24.449478149414062, "global_step": 200140, "epoch": 2411} {"train_loss": -23.916147232055664, "global_step": 200141, "epoch": 2411} {"train_loss": -24.3381404876709, "global_step": 200142, "epoch": 2411} {"train_loss": -24.046354293823242, "global_step": 200143, "epoch": 2411} {"train_loss": -23.93099021911621, "global_step": 200144, "epoch": 2411} {"train_loss": -24.314855575561523, "global_step": 200145, "epoch": 2411} {"train_loss": -24.361465454101562, "global_step": 200146, "epoch": 2411} {"train_loss": -24.331453323364258, "global_step": 200147, "epoch": 2411} {"train_loss": -24.634544372558594, "global_step": 200148, "epoch": 2411} {"train_loss": -24.164255142211914, "global_step": 200149, "epoch": 2411} {"train_loss": -24.30569839477539, "global_step": 200150, "epoch": 2411} {"train_loss": -24.058063507080078, "global_step": 200151, "epoch": 2411} {"train_loss": -24.270532608032227, "global_step": 200152, "epoch": 2411} {"train_loss": -24.179943084716797, "global_step": 200153, "epoch": 2411} {"train_loss": -24.694150924682617, "global_step": 200154, "epoch": 2411} {"train_loss": -24.40846061706543, "global_step": 200155, "epoch": 2411} {"train_loss": -24.223384857177734, "global_step": 200156, "epoch": 2411} {"train_loss": -24.597759246826172, "global_step": 200157, "epoch": 2411} {"train_loss": -24.206937789916992, "global_step": 200158, "epoch": 2411} {"train_loss": -24.03985595703125, "global_step": 200159, "epoch": 2411} {"train_loss": -24.10077476501465, "global_step": 200160, "epoch": 2411} {"train_loss": -24.51363754272461, "global_step": 200161, "epoch": 2411} {"train_loss": -24.4669246673584, "global_step": 200162, "epoch": 2411} {"train_loss": -24.068761825561523, "global_step": 200163, "epoch": 2411} {"train_loss": -24.08893394470215, "global_step": 200164, "epoch": 2411} {"train_loss": -24.32804298400879, "global_step": 200165, "epoch": 2411} {"train_loss": -23.953527450561523, "global_step": 200166, "epoch": 2411} {"train_loss": -24.378890991210938, "global_step": 200167, "epoch": 2411} {"train_loss": -24.62975311279297, "global_step": 200168, "epoch": 2411} {"train_loss": -24.525972366333008, "global_step": 200169, "epoch": 2411} {"train_loss": -24.29421615600586, "global_step": 200170, "epoch": 2411} {"train_loss": -24.210617065429688, "global_step": 200171, "epoch": 2411} {"train_loss": -24.223615646362305, "global_step": 200172, "epoch": 2411} {"train_loss": -24.503005981445312, "global_step": 200173, "epoch": 2411} {"train_loss": -24.280813217163086, "global_step": 200174, "epoch": 2411} {"train_loss": -24.68660545349121, "global_step": 200175, "epoch": 2411} {"train_loss": -24.56570816040039, "global_step": 200176, "epoch": 2411} {"train_loss": -24.24330711364746, "global_step": 200177, "epoch": 2411} {"train_loss": -24.535324096679688, "global_step": 200178, "epoch": 2411} {"train_loss": -24.406787872314453, "global_step": 200179, "epoch": 2411} {"train_loss": -24.451963424682617, "global_step": 200180, "epoch": 2411} {"train_loss": -24.431501388549805, "global_step": 200181, "epoch": 2411} {"train_loss": -24.486310958862305, "global_step": 200182, "epoch": 2411} {"train_loss": -24.126667022705078, "global_step": 200183, "epoch": 2411} {"train_loss": -24.68814468383789, "global_step": 200184, "epoch": 2411} {"train_loss": -24.026254653930664, "global_step": 200185, "epoch": 2411} {"train_loss": -24.162094116210938, "global_step": 200186, "epoch": 2411} {"train_loss": -24.07264518737793, "global_step": 200187, "epoch": 2411} {"train_loss": -24.09021759033203, "global_step": 200188, "epoch": 2411} {"train_loss": -24.23366928100586, "global_step": 200189, "epoch": 2411} {"train_loss": -24.426809310913086, "global_step": 200190, "epoch": 2411} {"train_loss": -24.2789363861084, "global_step": 200191, "epoch": 2411} {"train_loss": -24.337017059326172, "global_step": 200192, "epoch": 2411} {"train_loss": -24.848785400390625, "global_step": 200193, "epoch": 2411} {"train_loss": -24.071640014648438, "global_step": 200194, "epoch": 2411} {"train_loss": -24.138354427843208, "global_step": 200195, "epoch": 2411, "val_loss": 6445733.0} {"train_loss": -23.56235122680664, "global_step": 200196, "epoch": 2412} {"train_loss": -23.05655860900879, "global_step": 200197, "epoch": 2412} {"train_loss": -23.52813720703125, "global_step": 200198, "epoch": 2412} {"train_loss": -23.857215881347656, "global_step": 200199, "epoch": 2412} {"train_loss": -23.627609252929688, "global_step": 200200, "epoch": 2412} {"train_loss": -23.982450485229492, "global_step": 200201, "epoch": 2412} {"train_loss": -23.494474411010742, "global_step": 200202, "epoch": 2412} {"train_loss": -23.905630111694336, "global_step": 200203, "epoch": 2412} {"train_loss": -23.880796432495117, "global_step": 200204, "epoch": 2412} {"train_loss": -24.21973991394043, "global_step": 200205, "epoch": 2412} {"train_loss": -24.312021255493164, "global_step": 200206, "epoch": 2412} {"train_loss": -23.934423446655273, "global_step": 200207, "epoch": 2412} {"train_loss": -24.047876358032227, "global_step": 200208, "epoch": 2412} {"train_loss": -24.18885612487793, "global_step": 200209, "epoch": 2412} {"train_loss": -24.00272560119629, "global_step": 200210, "epoch": 2412} {"train_loss": -23.943204879760742, "global_step": 200211, "epoch": 2412} {"train_loss": -24.11146354675293, "global_step": 200212, "epoch": 2412} {"train_loss": -24.358966827392578, "global_step": 200213, "epoch": 2412} {"train_loss": -24.18157386779785, "global_step": 200214, "epoch": 2412} {"train_loss": -24.03006935119629, "global_step": 200215, "epoch": 2412} {"train_loss": -24.080076217651367, "global_step": 200216, "epoch": 2412} {"train_loss": -24.285436630249023, "global_step": 200217, "epoch": 2412} {"train_loss": -24.184072494506836, "global_step": 200218, "epoch": 2412} {"train_loss": -24.08255386352539, "global_step": 200219, "epoch": 2412} {"train_loss": -24.436925888061523, "global_step": 200220, "epoch": 2412} {"train_loss": -24.563928604125977, "global_step": 200221, "epoch": 2412} {"train_loss": -23.90607261657715, "global_step": 200222, "epoch": 2412} {"train_loss": -24.212203979492188, "global_step": 200223, "epoch": 2412} {"train_loss": -23.987886428833008, "global_step": 200224, "epoch": 2412} {"train_loss": -24.30928611755371, "global_step": 200225, "epoch": 2412} {"train_loss": -24.180330276489258, "global_step": 200226, "epoch": 2412} {"train_loss": -24.366291046142578, "global_step": 200227, "epoch": 2412} {"train_loss": -24.147075653076172, "global_step": 200228, "epoch": 2412} {"train_loss": -24.198083877563477, "global_step": 200229, "epoch": 2412} {"train_loss": -24.35795021057129, "global_step": 200230, "epoch": 2412} {"train_loss": -24.253173828125, "global_step": 200231, "epoch": 2412} {"train_loss": -24.51097869873047, "global_step": 200232, "epoch": 2412} {"train_loss": -24.121625900268555, "global_step": 200233, "epoch": 2412} {"train_loss": -24.129732131958008, "global_step": 200234, "epoch": 2412} {"train_loss": -23.898847579956055, "global_step": 200235, "epoch": 2412} {"train_loss": -24.228689193725586, "global_step": 200236, "epoch": 2412} {"train_loss": -24.580656051635742, "global_step": 200237, "epoch": 2412} {"train_loss": -24.306140899658203, "global_step": 200238, "epoch": 2412} {"train_loss": -24.355667114257812, "global_step": 200239, "epoch": 2412} {"train_loss": -24.803945541381836, "global_step": 200240, "epoch": 2412} {"train_loss": -24.25600242614746, "global_step": 200241, "epoch": 2412} {"train_loss": -24.176856994628906, "global_step": 200242, "epoch": 2412} {"train_loss": -24.621047973632812, "global_step": 200243, "epoch": 2412} {"train_loss": -24.2742919921875, "global_step": 200244, "epoch": 2412} {"train_loss": -24.625961303710938, "global_step": 200245, "epoch": 2412} {"train_loss": -24.12276268005371, "global_step": 200246, "epoch": 2412} {"train_loss": -24.344961166381836, "global_step": 200247, "epoch": 2412} {"train_loss": -24.517087936401367, "global_step": 200248, "epoch": 2412} {"train_loss": -24.475370407104492, "global_step": 200249, "epoch": 2412} {"train_loss": -23.936033248901367, "global_step": 200250, "epoch": 2412} {"train_loss": -24.187175750732422, "global_step": 200251, "epoch": 2412} {"train_loss": -23.9212589263916, "global_step": 200252, "epoch": 2412} {"train_loss": -23.962337493896484, "global_step": 200253, "epoch": 2412} {"train_loss": -23.949392318725586, "global_step": 200254, "epoch": 2412} {"train_loss": -24.307743072509766, "global_step": 200255, "epoch": 2412} {"train_loss": -23.41107940673828, "global_step": 200256, "epoch": 2412} {"train_loss": -23.100879669189453, "global_step": 200257, "epoch": 2412} {"train_loss": -24.694610595703125, "global_step": 200258, "epoch": 2412} {"train_loss": -23.676109313964844, "global_step": 200259, "epoch": 2412} {"train_loss": -23.95980453491211, "global_step": 200260, "epoch": 2412} {"train_loss": -23.959941864013672, "global_step": 200261, "epoch": 2412} {"train_loss": -24.029569625854492, "global_step": 200262, "epoch": 2412} {"train_loss": -23.9046573638916, "global_step": 200263, "epoch": 2412} {"train_loss": -24.018857955932617, "global_step": 200264, "epoch": 2412} {"train_loss": -23.612817764282227, "global_step": 200265, "epoch": 2412} {"train_loss": -23.976789474487305, "global_step": 200266, "epoch": 2412} {"train_loss": -24.15460777282715, "global_step": 200267, "epoch": 2412} {"train_loss": -23.65073013305664, "global_step": 200268, "epoch": 2412} {"train_loss": -24.133676528930664, "global_step": 200269, "epoch": 2412} {"train_loss": -23.915882110595703, "global_step": 200270, "epoch": 2412} {"train_loss": -24.014204025268555, "global_step": 200271, "epoch": 2412} {"train_loss": -24.368757247924805, "global_step": 200272, "epoch": 2412} {"train_loss": -24.171419143676758, "global_step": 200273, "epoch": 2412} {"train_loss": -24.02950096130371, "global_step": 200274, "epoch": 2412} {"train_loss": -24.409334182739258, "global_step": 200275, "epoch": 2412} {"train_loss": -23.94489097595215, "global_step": 200276, "epoch": 2412} {"train_loss": -24.164506912231445, "global_step": 200277, "epoch": 2412} {"train_loss": -24.112388197197973, "global_step": 200278, "epoch": 2412, "val_loss": 6549395.0} {"train_loss": -24.047321319580078, "global_step": 200279, "epoch": 2413} {"train_loss": -23.782093048095703, "global_step": 200280, "epoch": 2413} {"train_loss": -23.587257385253906, "global_step": 200281, "epoch": 2413} {"train_loss": -24.00642967224121, "global_step": 200282, "epoch": 2413} {"train_loss": -23.835493087768555, "global_step": 200283, "epoch": 2413} {"train_loss": -23.97600746154785, "global_step": 200284, "epoch": 2413} {"train_loss": -23.580493927001953, "global_step": 200285, "epoch": 2413} {"train_loss": -23.87135887145996, "global_step": 200286, "epoch": 2413} {"train_loss": -24.141376495361328, "global_step": 200287, "epoch": 2413} {"train_loss": -24.040542602539062, "global_step": 200288, "epoch": 2413} {"train_loss": -23.892969131469727, "global_step": 200289, "epoch": 2413} {"train_loss": -24.212881088256836, "global_step": 200290, "epoch": 2413} {"train_loss": -23.874425888061523, "global_step": 200291, "epoch": 2413} {"train_loss": -23.73567771911621, "global_step": 200292, "epoch": 2413} {"train_loss": -24.03567886352539, "global_step": 200293, "epoch": 2413} {"train_loss": -23.819461822509766, "global_step": 200294, "epoch": 2413} {"train_loss": -23.9444522857666, "global_step": 200295, "epoch": 2413} {"train_loss": -23.515493392944336, "global_step": 200296, "epoch": 2413} {"train_loss": -23.924468994140625, "global_step": 200297, "epoch": 2413} {"train_loss": -24.382278442382812, "global_step": 200298, "epoch": 2413} {"train_loss": -23.95926856994629, "global_step": 200299, "epoch": 2413} {"train_loss": -24.403432846069336, "global_step": 200300, "epoch": 2413} {"train_loss": -24.229951858520508, "global_step": 200301, "epoch": 2413} {"train_loss": -24.86105728149414, "global_step": 200302, "epoch": 2413} {"train_loss": -24.1536808013916, "global_step": 200303, "epoch": 2413} {"train_loss": -24.25404167175293, "global_step": 200304, "epoch": 2413} {"train_loss": -24.273550033569336, "global_step": 200305, "epoch": 2413} {"train_loss": -24.49614906311035, "global_step": 200306, "epoch": 2413} {"train_loss": -24.341245651245117, "global_step": 200307, "epoch": 2413} {"train_loss": -24.327598571777344, "global_step": 200308, "epoch": 2413} {"train_loss": -24.389822006225586, "global_step": 200309, "epoch": 2413} {"train_loss": -24.114736557006836, "global_step": 200310, "epoch": 2413} {"train_loss": -24.039026260375977, "global_step": 200311, "epoch": 2413} {"train_loss": -24.08405876159668, "global_step": 200312, "epoch": 2413} {"train_loss": -24.45893096923828, "global_step": 200313, "epoch": 2413} {"train_loss": -24.182706832885742, "global_step": 200314, "epoch": 2413} {"train_loss": -24.192777633666992, "global_step": 200315, "epoch": 2413} {"train_loss": -24.126066207885742, "global_step": 200316, "epoch": 2413} {"train_loss": -24.44768524169922, "global_step": 200317, "epoch": 2413} {"train_loss": -24.1566104888916, "global_step": 200318, "epoch": 2413} {"train_loss": -23.728271484375, "global_step": 200319, "epoch": 2413} {"train_loss": -24.403751373291016, "global_step": 200320, "epoch": 2413} {"train_loss": -24.01003646850586, "global_step": 200321, "epoch": 2413} {"train_loss": -24.157699584960938, "global_step": 200322, "epoch": 2413} {"train_loss": -24.54758071899414, "global_step": 200323, "epoch": 2413} {"train_loss": -23.85610008239746, "global_step": 200324, "epoch": 2413} {"train_loss": -24.41629409790039, "global_step": 200325, "epoch": 2413} {"train_loss": -24.64918327331543, "global_step": 200326, "epoch": 2413} {"train_loss": -24.469587326049805, "global_step": 200327, "epoch": 2413} {"train_loss": -24.5470027923584, "global_step": 200328, "epoch": 2413} {"train_loss": -24.76854705810547, "global_step": 200329, "epoch": 2413} {"train_loss": -24.260814666748047, "global_step": 200330, "epoch": 2413} {"train_loss": -24.629230499267578, "global_step": 200331, "epoch": 2413} {"train_loss": -24.484703063964844, "global_step": 200332, "epoch": 2413} {"train_loss": -24.479995727539062, "global_step": 200333, "epoch": 2413} {"train_loss": -24.528928756713867, "global_step": 200334, "epoch": 2413} {"train_loss": -24.381296157836914, "global_step": 200335, "epoch": 2413} {"train_loss": -24.484739303588867, "global_step": 200336, "epoch": 2413} {"train_loss": -24.712909698486328, "global_step": 200337, "epoch": 2413} {"train_loss": -24.409326553344727, "global_step": 200338, "epoch": 2413} {"train_loss": -24.732980728149414, "global_step": 200339, "epoch": 2413} {"train_loss": -24.66145896911621, "global_step": 200340, "epoch": 2413} {"train_loss": -24.091163635253906, "global_step": 200341, "epoch": 2413} {"train_loss": -24.012521743774414, "global_step": 200342, "epoch": 2413} {"train_loss": -24.50495719909668, "global_step": 200343, "epoch": 2413} {"train_loss": -24.187049865722656, "global_step": 200344, "epoch": 2413} {"train_loss": -24.14080238342285, "global_step": 200345, "epoch": 2413} {"train_loss": -23.985443115234375, "global_step": 200346, "epoch": 2413} {"train_loss": -24.032888412475586, "global_step": 200347, "epoch": 2413} {"train_loss": -24.50080680847168, "global_step": 200348, "epoch": 2413} {"train_loss": -24.42327117919922, "global_step": 200349, "epoch": 2413} {"train_loss": -24.427305221557617, "global_step": 200350, "epoch": 2413} {"train_loss": -24.207412719726562, "global_step": 200351, "epoch": 2413} {"train_loss": -24.40227699279785, "global_step": 200352, "epoch": 2413} {"train_loss": -24.240467071533203, "global_step": 200353, "epoch": 2413} {"train_loss": -24.49155044555664, "global_step": 200354, "epoch": 2413} {"train_loss": -24.4258975982666, "global_step": 200355, "epoch": 2413} {"train_loss": -24.63153839111328, "global_step": 200356, "epoch": 2413} {"train_loss": -24.546127319335938, "global_step": 200357, "epoch": 2413} {"train_loss": -24.078725814819336, "global_step": 200358, "epoch": 2413} {"train_loss": -24.492734909057617, "global_step": 200359, "epoch": 2413} {"train_loss": -24.371929168701172, "global_step": 200360, "epoch": 2413} {"train_loss": -24.239583716335066, "global_step": 200361, "epoch": 2413, "val_loss": 6554406.0} {"train_loss": -24.281234741210938, "global_step": 200362, "epoch": 2414} {"train_loss": -23.84098243713379, "global_step": 200363, "epoch": 2414} {"train_loss": -24.17205238342285, "global_step": 200364, "epoch": 2414} {"train_loss": -23.945297241210938, "global_step": 200365, "epoch": 2414} {"train_loss": -24.021286010742188, "global_step": 200366, "epoch": 2414} {"train_loss": -23.837200164794922, "global_step": 200367, "epoch": 2414} {"train_loss": -23.9541072845459, "global_step": 200368, "epoch": 2414} {"train_loss": -23.995922088623047, "global_step": 200369, "epoch": 2414} {"train_loss": -24.09031105041504, "global_step": 200370, "epoch": 2414} {"train_loss": -23.986000061035156, "global_step": 200371, "epoch": 2414} {"train_loss": -23.957571029663086, "global_step": 200372, "epoch": 2414} {"train_loss": -24.18341064453125, "global_step": 200373, "epoch": 2414} {"train_loss": -24.258930206298828, "global_step": 200374, "epoch": 2414} {"train_loss": -24.38382339477539, "global_step": 200375, "epoch": 2414} {"train_loss": -23.810697555541992, "global_step": 200376, "epoch": 2414} {"train_loss": -24.470787048339844, "global_step": 200377, "epoch": 2414} {"train_loss": -24.097766876220703, "global_step": 200378, "epoch": 2414} {"train_loss": -24.06759262084961, "global_step": 200379, "epoch": 2414} {"train_loss": -24.15070343017578, "global_step": 200380, "epoch": 2414} {"train_loss": -24.145666122436523, "global_step": 200381, "epoch": 2414} {"train_loss": -24.423789978027344, "global_step": 200382, "epoch": 2414} {"train_loss": -24.40903091430664, "global_step": 200383, "epoch": 2414} {"train_loss": -24.645816802978516, "global_step": 200384, "epoch": 2414} {"train_loss": -24.243925094604492, "global_step": 200385, "epoch": 2414} {"train_loss": -24.312992095947266, "global_step": 200386, "epoch": 2414} {"train_loss": -24.278696060180664, "global_step": 200387, "epoch": 2414} {"train_loss": -24.13630485534668, "global_step": 200388, "epoch": 2414} {"train_loss": -24.122854232788086, "global_step": 200389, "epoch": 2414} {"train_loss": -24.580570220947266, "global_step": 200390, "epoch": 2414} {"train_loss": -24.513776779174805, "global_step": 200391, "epoch": 2414} {"train_loss": -24.339000701904297, "global_step": 200392, "epoch": 2414} {"train_loss": -24.604154586791992, "global_step": 200393, "epoch": 2414} {"train_loss": -24.313034057617188, "global_step": 200394, "epoch": 2414} {"train_loss": -24.2252140045166, "global_step": 200395, "epoch": 2414} {"train_loss": -24.442825317382812, "global_step": 200396, "epoch": 2414} {"train_loss": -24.38444709777832, "global_step": 200397, "epoch": 2414} {"train_loss": -24.230987548828125, "global_step": 200398, "epoch": 2414} {"train_loss": -24.260133743286133, "global_step": 200399, "epoch": 2414} {"train_loss": -24.4356746673584, "global_step": 200400, "epoch": 2414} {"train_loss": -24.223037719726562, "global_step": 200401, "epoch": 2414} {"train_loss": -24.485509872436523, "global_step": 200402, "epoch": 2414} {"train_loss": -24.27655601501465, "global_step": 200403, "epoch": 2414} {"train_loss": -24.048145294189453, "global_step": 200404, "epoch": 2414} {"train_loss": -24.214946746826172, "global_step": 200405, "epoch": 2414} {"train_loss": -24.58555030822754, "global_step": 200406, "epoch": 2414} {"train_loss": -23.91633415222168, "global_step": 200407, "epoch": 2414} {"train_loss": -24.05938148498535, "global_step": 200408, "epoch": 2414} {"train_loss": -23.920135498046875, "global_step": 200409, "epoch": 2414} {"train_loss": -23.92526626586914, "global_step": 200410, "epoch": 2414} {"train_loss": -24.029905319213867, "global_step": 200411, "epoch": 2414} {"train_loss": -24.006732940673828, "global_step": 200412, "epoch": 2414} {"train_loss": -24.442340850830078, "global_step": 200413, "epoch": 2414} {"train_loss": -24.2687931060791, "global_step": 200414, "epoch": 2414} {"train_loss": -23.923131942749023, "global_step": 200415, "epoch": 2414} {"train_loss": -24.23301124572754, "global_step": 200416, "epoch": 2414} {"train_loss": -24.250520706176758, "global_step": 200417, "epoch": 2414} {"train_loss": -23.988651275634766, "global_step": 200418, "epoch": 2414} {"train_loss": -23.861658096313477, "global_step": 200419, "epoch": 2414} {"train_loss": -23.960119247436523, "global_step": 200420, "epoch": 2414} {"train_loss": -23.869543075561523, "global_step": 200421, "epoch": 2414} {"train_loss": -24.319372177124023, "global_step": 200422, "epoch": 2414} {"train_loss": -24.354782104492188, "global_step": 200423, "epoch": 2414} {"train_loss": -24.077909469604492, "global_step": 200424, "epoch": 2414} {"train_loss": -24.167762756347656, "global_step": 200425, "epoch": 2414} {"train_loss": -24.457975387573242, "global_step": 200426, "epoch": 2414} {"train_loss": -24.34673309326172, "global_step": 200427, "epoch": 2414} {"train_loss": -24.2835636138916, "global_step": 200428, "epoch": 2414} {"train_loss": -24.55514907836914, "global_step": 200429, "epoch": 2414} {"train_loss": -24.35077476501465, "global_step": 200430, "epoch": 2414} {"train_loss": -24.44209861755371, "global_step": 200431, "epoch": 2414} {"train_loss": -24.494400024414062, "global_step": 200432, "epoch": 2414} {"train_loss": -24.267166137695312, "global_step": 200433, "epoch": 2414} {"train_loss": -24.275524139404297, "global_step": 200434, "epoch": 2414} {"train_loss": -24.102210998535156, "global_step": 200435, "epoch": 2414} {"train_loss": -24.473987579345703, "global_step": 200436, "epoch": 2414} {"train_loss": -24.503150939941406, "global_step": 200437, "epoch": 2414} {"train_loss": -24.422536849975586, "global_step": 200438, "epoch": 2414} {"train_loss": -24.299449920654297, "global_step": 200439, "epoch": 2414} {"train_loss": -24.46412467956543, "global_step": 200440, "epoch": 2414} {"train_loss": -24.402475357055664, "global_step": 200441, "epoch": 2414} {"train_loss": -24.32581901550293, "global_step": 200442, "epoch": 2414} {"train_loss": -24.43711280822754, "global_step": 200443, "epoch": 2414} {"train_loss": -24.247948267373694, "global_step": 200444, "epoch": 2414, "val_loss": 6564599.0} {"train_loss": -21.170988082885742, "global_step": 200445, "epoch": 2415} {"train_loss": -21.959829330444336, "global_step": 200446, "epoch": 2415} {"train_loss": -22.025959014892578, "global_step": 200447, "epoch": 2415} {"train_loss": -23.223133087158203, "global_step": 200448, "epoch": 2415} {"train_loss": -22.60538101196289, "global_step": 200449, "epoch": 2415} {"train_loss": -23.14711570739746, "global_step": 200450, "epoch": 2415} {"train_loss": -23.467811584472656, "global_step": 200451, "epoch": 2415} {"train_loss": -23.02288246154785, "global_step": 200452, "epoch": 2415} {"train_loss": -23.381757736206055, "global_step": 200453, "epoch": 2415} {"train_loss": -23.476856231689453, "global_step": 200454, "epoch": 2415} {"train_loss": -23.10682487487793, "global_step": 200455, "epoch": 2415} {"train_loss": -23.733470916748047, "global_step": 200456, "epoch": 2415} {"train_loss": -23.66901969909668, "global_step": 200457, "epoch": 2415} {"train_loss": -23.328001022338867, "global_step": 200458, "epoch": 2415} {"train_loss": -23.475326538085938, "global_step": 200459, "epoch": 2415} {"train_loss": -23.360706329345703, "global_step": 200460, "epoch": 2415} {"train_loss": -23.88551902770996, "global_step": 200461, "epoch": 2415} {"train_loss": -23.384174346923828, "global_step": 200462, "epoch": 2415} {"train_loss": -23.456357955932617, "global_step": 200463, "epoch": 2415} {"train_loss": -24.1522274017334, "global_step": 200464, "epoch": 2415} {"train_loss": -23.297155380249023, "global_step": 200465, "epoch": 2415} {"train_loss": -23.529773712158203, "global_step": 200466, "epoch": 2415} {"train_loss": -23.86292839050293, "global_step": 200467, "epoch": 2415} {"train_loss": -23.711288452148438, "global_step": 200468, "epoch": 2415} {"train_loss": -24.164308547973633, "global_step": 200469, "epoch": 2415} {"train_loss": -24.097049713134766, "global_step": 200470, "epoch": 2415} {"train_loss": -24.117116928100586, "global_step": 200471, "epoch": 2415} {"train_loss": -24.092390060424805, "global_step": 200472, "epoch": 2415} {"train_loss": -24.218847274780273, "global_step": 200473, "epoch": 2415} {"train_loss": -24.096250534057617, "global_step": 200474, "epoch": 2415} {"train_loss": -24.13362693786621, "global_step": 200475, "epoch": 2415} {"train_loss": -23.90134620666504, "global_step": 200476, "epoch": 2415} {"train_loss": -24.386016845703125, "global_step": 200477, "epoch": 2415} {"train_loss": -24.093862533569336, "global_step": 200478, "epoch": 2415} {"train_loss": -23.97307777404785, "global_step": 200479, "epoch": 2415} {"train_loss": -24.373319625854492, "global_step": 200480, "epoch": 2415} {"train_loss": -24.07118034362793, "global_step": 200481, "epoch": 2415} {"train_loss": -23.839643478393555, "global_step": 200482, "epoch": 2415} {"train_loss": -24.003131866455078, "global_step": 200483, "epoch": 2415} {"train_loss": -24.39582633972168, "global_step": 200484, "epoch": 2415} {"train_loss": -24.090917587280273, "global_step": 200485, "epoch": 2415} {"train_loss": -24.298532485961914, "global_step": 200486, "epoch": 2415} {"train_loss": -24.37958335876465, "global_step": 200487, "epoch": 2415} {"train_loss": -24.108793258666992, "global_step": 200488, "epoch": 2415} {"train_loss": -24.54983901977539, "global_step": 200489, "epoch": 2415} {"train_loss": -24.258453369140625, "global_step": 200490, "epoch": 2415} {"train_loss": -24.437841415405273, "global_step": 200491, "epoch": 2415} {"train_loss": -24.193876266479492, "global_step": 200492, "epoch": 2415} {"train_loss": -24.48333168029785, "global_step": 200493, "epoch": 2415} {"train_loss": -24.470684051513672, "global_step": 200494, "epoch": 2415} {"train_loss": -24.223386764526367, "global_step": 200495, "epoch": 2415} {"train_loss": -24.42378807067871, "global_step": 200496, "epoch": 2415} {"train_loss": -24.08820152282715, "global_step": 200497, "epoch": 2415} {"train_loss": -24.37398338317871, "global_step": 200498, "epoch": 2415} {"train_loss": -24.38429832458496, "global_step": 200499, "epoch": 2415} {"train_loss": -24.032217025756836, "global_step": 200500, "epoch": 2415} {"train_loss": -24.17693328857422, "global_step": 200501, "epoch": 2415} {"train_loss": -24.56364631652832, "global_step": 200502, "epoch": 2415} {"train_loss": -24.02762794494629, "global_step": 200503, "epoch": 2415} {"train_loss": -23.959976196289062, "global_step": 200504, "epoch": 2415} {"train_loss": -24.218082427978516, "global_step": 200505, "epoch": 2415} {"train_loss": -24.11171531677246, "global_step": 200506, "epoch": 2415} {"train_loss": -24.00983238220215, "global_step": 200507, "epoch": 2415} {"train_loss": -24.24755859375, "global_step": 200508, "epoch": 2415} {"train_loss": -23.637985229492188, "global_step": 200509, "epoch": 2415} {"train_loss": -24.463991165161133, "global_step": 200510, "epoch": 2415} {"train_loss": -24.220945358276367, "global_step": 200511, "epoch": 2415} {"train_loss": -23.97821617126465, "global_step": 200512, "epoch": 2415} {"train_loss": -23.873971939086914, "global_step": 200513, "epoch": 2415} {"train_loss": -24.240833282470703, "global_step": 200514, "epoch": 2415} {"train_loss": -24.497404098510742, "global_step": 200515, "epoch": 2415} {"train_loss": -24.011051177978516, "global_step": 200516, "epoch": 2415} {"train_loss": -24.148792266845703, "global_step": 200517, "epoch": 2415} {"train_loss": -24.16566276550293, "global_step": 200518, "epoch": 2415} {"train_loss": -24.291173934936523, "global_step": 200519, "epoch": 2415} {"train_loss": -24.250715255737305, "global_step": 200520, "epoch": 2415} {"train_loss": -23.984941482543945, "global_step": 200521, "epoch": 2415} {"train_loss": -24.458873748779297, "global_step": 200522, "epoch": 2415} {"train_loss": -24.397851943969727, "global_step": 200523, "epoch": 2415} {"train_loss": -24.612218856811523, "global_step": 200524, "epoch": 2415} {"train_loss": -24.386627197265625, "global_step": 200525, "epoch": 2415} {"train_loss": -24.268218994140625, "global_step": 200526, "epoch": 2415} {"train_loss": -23.914065464433417, "global_step": 200527, "epoch": 2415, "val_loss": 6569228.0} {"train_loss": -23.429588317871094, "global_step": 200528, "epoch": 2416} {"train_loss": -24.072189331054688, "global_step": 200529, "epoch": 2416} {"train_loss": -23.47389030456543, "global_step": 200530, "epoch": 2416} {"train_loss": -24.2503719329834, "global_step": 200531, "epoch": 2416} {"train_loss": -23.3582763671875, "global_step": 200532, "epoch": 2416} {"train_loss": -23.804609298706055, "global_step": 200533, "epoch": 2416} {"train_loss": -24.188291549682617, "global_step": 200534, "epoch": 2416} {"train_loss": -24.219572067260742, "global_step": 200535, "epoch": 2416} {"train_loss": -24.171411514282227, "global_step": 200536, "epoch": 2416} {"train_loss": -24.033206939697266, "global_step": 200537, "epoch": 2416} {"train_loss": -24.05640411376953, "global_step": 200538, "epoch": 2416} {"train_loss": -24.11398696899414, "global_step": 200539, "epoch": 2416} {"train_loss": -23.968860626220703, "global_step": 200540, "epoch": 2416} {"train_loss": -24.18060302734375, "global_step": 200541, "epoch": 2416} {"train_loss": -24.071807861328125, "global_step": 200542, "epoch": 2416} {"train_loss": -24.500629425048828, "global_step": 200543, "epoch": 2416} {"train_loss": -24.532438278198242, "global_step": 200544, "epoch": 2416} {"train_loss": -24.280014038085938, "global_step": 200545, "epoch": 2416} {"train_loss": -24.083309173583984, "global_step": 200546, "epoch": 2416} {"train_loss": -24.196115493774414, "global_step": 200547, "epoch": 2416} {"train_loss": -24.54609489440918, "global_step": 200548, "epoch": 2416} {"train_loss": -24.29668617248535, "global_step": 200549, "epoch": 2416} {"train_loss": -24.509033203125, "global_step": 200550, "epoch": 2416} {"train_loss": -24.300779342651367, "global_step": 200551, "epoch": 2416} {"train_loss": -24.490095138549805, "global_step": 200552, "epoch": 2416} {"train_loss": -24.364953994750977, "global_step": 200553, "epoch": 2416} {"train_loss": -24.2606258392334, "global_step": 200554, "epoch": 2416} {"train_loss": -23.835018157958984, "global_step": 200555, "epoch": 2416} {"train_loss": -24.20549774169922, "global_step": 200556, "epoch": 2416} {"train_loss": -24.69243621826172, "global_step": 200557, "epoch": 2416} {"train_loss": -24.361263275146484, "global_step": 200558, "epoch": 2416} {"train_loss": -24.17909812927246, "global_step": 200559, "epoch": 2416} {"train_loss": -24.41139030456543, "global_step": 200560, "epoch": 2416} {"train_loss": -24.090471267700195, "global_step": 200561, "epoch": 2416} {"train_loss": -24.48992919921875, "global_step": 200562, "epoch": 2416} {"train_loss": -24.152734756469727, "global_step": 200563, "epoch": 2416} {"train_loss": -23.9544734954834, "global_step": 200564, "epoch": 2416} {"train_loss": -24.45329475402832, "global_step": 200565, "epoch": 2416} {"train_loss": -24.289066314697266, "global_step": 200566, "epoch": 2416} {"train_loss": -24.267730712890625, "global_step": 200567, "epoch": 2416} {"train_loss": -24.188947677612305, "global_step": 200568, "epoch": 2416} {"train_loss": -24.69029998779297, "global_step": 200569, "epoch": 2416} {"train_loss": -24.626678466796875, "global_step": 200570, "epoch": 2416} {"train_loss": -24.441396713256836, "global_step": 200571, "epoch": 2416} {"train_loss": -24.154165267944336, "global_step": 200572, "epoch": 2416} {"train_loss": -24.062734603881836, "global_step": 200573, "epoch": 2416} {"train_loss": -24.600568771362305, "global_step": 200574, "epoch": 2416} {"train_loss": -24.046035766601562, "global_step": 200575, "epoch": 2416} {"train_loss": -24.60935401916504, "global_step": 200576, "epoch": 2416} {"train_loss": -24.032499313354492, "global_step": 200577, "epoch": 2416} {"train_loss": -24.35382843017578, "global_step": 200578, "epoch": 2416} {"train_loss": -24.23662757873535, "global_step": 200579, "epoch": 2416} {"train_loss": -24.275949478149414, "global_step": 200580, "epoch": 2416} {"train_loss": -23.906606674194336, "global_step": 200581, "epoch": 2416} {"train_loss": -24.49794578552246, "global_step": 200582, "epoch": 2416} {"train_loss": -24.63941764831543, "global_step": 200583, "epoch": 2416} {"train_loss": -24.531646728515625, "global_step": 200584, "epoch": 2416} {"train_loss": -24.676542282104492, "global_step": 200585, "epoch": 2416} {"train_loss": -24.088943481445312, "global_step": 200586, "epoch": 2416} {"train_loss": -24.21286964416504, "global_step": 200587, "epoch": 2416} {"train_loss": -24.29097557067871, "global_step": 200588, "epoch": 2416} {"train_loss": -24.31788444519043, "global_step": 200589, "epoch": 2416} {"train_loss": -24.382244110107422, "global_step": 200590, "epoch": 2416} {"train_loss": -24.345901489257812, "global_step": 200591, "epoch": 2416} {"train_loss": -24.07167625427246, "global_step": 200592, "epoch": 2416} {"train_loss": -24.089725494384766, "global_step": 200593, "epoch": 2416} {"train_loss": -23.979360580444336, "global_step": 200594, "epoch": 2416} {"train_loss": -24.281415939331055, "global_step": 200595, "epoch": 2416} {"train_loss": -24.424436569213867, "global_step": 200596, "epoch": 2416} {"train_loss": -24.348163604736328, "global_step": 200597, "epoch": 2416} {"train_loss": -24.28822898864746, "global_step": 200598, "epoch": 2416} {"train_loss": -24.270599365234375, "global_step": 200599, "epoch": 2416} {"train_loss": -24.300565719604492, "global_step": 200600, "epoch": 2416} {"train_loss": -24.385305404663086, "global_step": 200601, "epoch": 2416} {"train_loss": -23.91119384765625, "global_step": 200602, "epoch": 2416} {"train_loss": -24.145584106445312, "global_step": 200603, "epoch": 2416} {"train_loss": -23.8155517578125, "global_step": 200604, "epoch": 2416} {"train_loss": -24.16111183166504, "global_step": 200605, "epoch": 2416} {"train_loss": -23.86591148376465, "global_step": 200606, "epoch": 2416} {"train_loss": -23.877883911132812, "global_step": 200607, "epoch": 2416} {"train_loss": -24.193450927734375, "global_step": 200608, "epoch": 2416} {"train_loss": -24.084375381469727, "global_step": 200609, "epoch": 2416} {"train_loss": -24.205681950212963, "global_step": 200610, "epoch": 2416, "val_loss": 6609501.0} {"train_loss": -23.33254051208496, "global_step": 200611, "epoch": 2417} {"train_loss": -23.839258193969727, "global_step": 200612, "epoch": 2417} {"train_loss": -24.094995498657227, "global_step": 200613, "epoch": 2417} {"train_loss": -23.724340438842773, "global_step": 200614, "epoch": 2417} {"train_loss": -23.76108741760254, "global_step": 200615, "epoch": 2417} {"train_loss": -23.624160766601562, "global_step": 200616, "epoch": 2417} {"train_loss": -23.97181510925293, "global_step": 200617, "epoch": 2417} {"train_loss": -23.35243034362793, "global_step": 200618, "epoch": 2417} {"train_loss": -23.911571502685547, "global_step": 200619, "epoch": 2417} {"train_loss": -23.93829917907715, "global_step": 200620, "epoch": 2417} {"train_loss": -24.354673385620117, "global_step": 200621, "epoch": 2417} {"train_loss": -24.093713760375977, "global_step": 200622, "epoch": 2417} {"train_loss": -24.207101821899414, "global_step": 200623, "epoch": 2417} {"train_loss": -23.95703125, "global_step": 200624, "epoch": 2417} {"train_loss": -24.056669235229492, "global_step": 200625, "epoch": 2417} {"train_loss": -24.19185447692871, "global_step": 200626, "epoch": 2417} {"train_loss": -24.012048721313477, "global_step": 200627, "epoch": 2417} {"train_loss": -24.001609802246094, "global_step": 200628, "epoch": 2417} {"train_loss": -24.150882720947266, "global_step": 200629, "epoch": 2417} {"train_loss": -24.084514617919922, "global_step": 200630, "epoch": 2417} {"train_loss": -24.109140396118164, "global_step": 200631, "epoch": 2417} {"train_loss": -24.177377700805664, "global_step": 200632, "epoch": 2417} {"train_loss": -24.288328170776367, "global_step": 200633, "epoch": 2417} {"train_loss": -24.175695419311523, "global_step": 200634, "epoch": 2417} {"train_loss": -24.152585983276367, "global_step": 200635, "epoch": 2417} {"train_loss": -24.23542594909668, "global_step": 200636, "epoch": 2417} {"train_loss": -24.087207794189453, "global_step": 200637, "epoch": 2417} {"train_loss": -24.2164363861084, "global_step": 200638, "epoch": 2417} {"train_loss": -24.168378829956055, "global_step": 200639, "epoch": 2417} {"train_loss": -24.262649536132812, "global_step": 200640, "epoch": 2417} {"train_loss": -24.090320587158203, "global_step": 200641, "epoch": 2417} {"train_loss": -24.050168991088867, "global_step": 200642, "epoch": 2417} {"train_loss": -24.108701705932617, "global_step": 200643, "epoch": 2417} {"train_loss": -24.234298706054688, "global_step": 200644, "epoch": 2417} {"train_loss": -24.172483444213867, "global_step": 200645, "epoch": 2417} {"train_loss": -24.529800415039062, "global_step": 200646, "epoch": 2417} {"train_loss": -24.483449935913086, "global_step": 200647, "epoch": 2417} {"train_loss": -24.40032386779785, "global_step": 200648, "epoch": 2417} {"train_loss": -24.482229232788086, "global_step": 200649, "epoch": 2417} {"train_loss": -23.987855911254883, "global_step": 200650, "epoch": 2417} {"train_loss": -24.314645767211914, "global_step": 200651, "epoch": 2417} {"train_loss": -24.426633834838867, "global_step": 200652, "epoch": 2417} {"train_loss": -24.58588981628418, "global_step": 200653, "epoch": 2417} {"train_loss": -24.42205047607422, "global_step": 200654, "epoch": 2417} {"train_loss": -24.050512313842773, "global_step": 200655, "epoch": 2417} {"train_loss": -24.248281478881836, "global_step": 200656, "epoch": 2417} {"train_loss": -24.615346908569336, "global_step": 200657, "epoch": 2417} {"train_loss": -24.07122039794922, "global_step": 200658, "epoch": 2417} {"train_loss": -24.380218505859375, "global_step": 200659, "epoch": 2417} {"train_loss": -24.334247589111328, "global_step": 200660, "epoch": 2417} {"train_loss": -24.33395004272461, "global_step": 200661, "epoch": 2417} {"train_loss": -24.601388931274414, "global_step": 200662, "epoch": 2417} {"train_loss": -24.354772567749023, "global_step": 200663, "epoch": 2417} {"train_loss": -24.43074607849121, "global_step": 200664, "epoch": 2417} {"train_loss": -23.793399810791016, "global_step": 200665, "epoch": 2417} {"train_loss": -24.34861183166504, "global_step": 200666, "epoch": 2417} {"train_loss": -24.24024772644043, "global_step": 200667, "epoch": 2417} {"train_loss": -24.340818405151367, "global_step": 200668, "epoch": 2417} {"train_loss": -24.26127052307129, "global_step": 200669, "epoch": 2417} {"train_loss": -24.03578758239746, "global_step": 200670, "epoch": 2417} {"train_loss": -24.38813591003418, "global_step": 200671, "epoch": 2417} {"train_loss": -24.139171600341797, "global_step": 200672, "epoch": 2417} {"train_loss": -24.286880493164062, "global_step": 200673, "epoch": 2417} {"train_loss": -24.160465240478516, "global_step": 200674, "epoch": 2417} {"train_loss": -24.425827026367188, "global_step": 200675, "epoch": 2417} {"train_loss": -24.734338760375977, "global_step": 200676, "epoch": 2417} {"train_loss": -24.29364776611328, "global_step": 200677, "epoch": 2417} {"train_loss": -24.19268226623535, "global_step": 200678, "epoch": 2417} {"train_loss": -24.654756546020508, "global_step": 200679, "epoch": 2417} {"train_loss": -24.21821403503418, "global_step": 200680, "epoch": 2417} {"train_loss": -24.476011276245117, "global_step": 200681, "epoch": 2417} {"train_loss": -24.283151626586914, "global_step": 200682, "epoch": 2417} {"train_loss": -24.6450252532959, "global_step": 200683, "epoch": 2417} {"train_loss": -24.233001708984375, "global_step": 200684, "epoch": 2417} {"train_loss": -24.02532386779785, "global_step": 200685, "epoch": 2417} {"train_loss": -24.551557540893555, "global_step": 200686, "epoch": 2417} {"train_loss": -24.407522201538086, "global_step": 200687, "epoch": 2417} {"train_loss": -24.21271514892578, "global_step": 200688, "epoch": 2417} {"train_loss": -24.356548309326172, "global_step": 200689, "epoch": 2417} {"train_loss": -24.155296325683594, "global_step": 200690, "epoch": 2417} {"train_loss": -24.122882843017578, "global_step": 200691, "epoch": 2417} {"train_loss": -24.400833129882812, "global_step": 200692, "epoch": 2417} {"train_loss": -24.190239550119422, "global_step": 200693, "epoch": 2417, "val_loss": 6404992.0} {"train_loss": -24.095373153686523, "global_step": 200694, "epoch": 2418} {"train_loss": -23.565134048461914, "global_step": 200695, "epoch": 2418} {"train_loss": -23.838729858398438, "global_step": 200696, "epoch": 2418} {"train_loss": -23.358373641967773, "global_step": 200697, "epoch": 2418} {"train_loss": -23.55341911315918, "global_step": 200698, "epoch": 2418} {"train_loss": -23.798154830932617, "global_step": 200699, "epoch": 2418} {"train_loss": -23.91864013671875, "global_step": 200700, "epoch": 2418} {"train_loss": -23.699325561523438, "global_step": 200701, "epoch": 2418} {"train_loss": -23.606863021850586, "global_step": 200702, "epoch": 2418} {"train_loss": -23.98358154296875, "global_step": 200703, "epoch": 2418} {"train_loss": -23.988285064697266, "global_step": 200704, "epoch": 2418} {"train_loss": -23.834714889526367, "global_step": 200705, "epoch": 2418} {"train_loss": -24.062274932861328, "global_step": 200706, "epoch": 2418} {"train_loss": -23.72138214111328, "global_step": 200707, "epoch": 2418} {"train_loss": -24.10814094543457, "global_step": 200708, "epoch": 2418} {"train_loss": -23.97454833984375, "global_step": 200709, "epoch": 2418} {"train_loss": -24.10271453857422, "global_step": 200710, "epoch": 2418} {"train_loss": -23.996814727783203, "global_step": 200711, "epoch": 2418} {"train_loss": -24.113609313964844, "global_step": 200712, "epoch": 2418} {"train_loss": -24.000732421875, "global_step": 200713, "epoch": 2418} {"train_loss": -24.461885452270508, "global_step": 200714, "epoch": 2418} {"train_loss": -24.021896362304688, "global_step": 200715, "epoch": 2418} {"train_loss": -23.849287033081055, "global_step": 200716, "epoch": 2418} {"train_loss": -23.890705108642578, "global_step": 200717, "epoch": 2418} {"train_loss": -23.985013961791992, "global_step": 200718, "epoch": 2418} {"train_loss": -24.124399185180664, "global_step": 200719, "epoch": 2418} {"train_loss": -23.957416534423828, "global_step": 200720, "epoch": 2418} {"train_loss": -24.092252731323242, "global_step": 200721, "epoch": 2418} {"train_loss": -24.252164840698242, "global_step": 200722, "epoch": 2418} {"train_loss": -24.337690353393555, "global_step": 200723, "epoch": 2418} {"train_loss": -24.194313049316406, "global_step": 200724, "epoch": 2418} {"train_loss": -24.0838565826416, "global_step": 200725, "epoch": 2418} {"train_loss": -24.022939682006836, "global_step": 200726, "epoch": 2418} {"train_loss": -24.265066146850586, "global_step": 200727, "epoch": 2418} {"train_loss": -24.173465728759766, "global_step": 200728, "epoch": 2418} {"train_loss": -24.162353515625, "global_step": 200729, "epoch": 2418} {"train_loss": -24.381994247436523, "global_step": 200730, "epoch": 2418} {"train_loss": -24.403348922729492, "global_step": 200731, "epoch": 2418} {"train_loss": -24.419645309448242, "global_step": 200732, "epoch": 2418} {"train_loss": -24.5628719329834, "global_step": 200733, "epoch": 2418} {"train_loss": -24.830581665039062, "global_step": 200734, "epoch": 2418} {"train_loss": -24.133047103881836, "global_step": 200735, "epoch": 2418} {"train_loss": -24.28696060180664, "global_step": 200736, "epoch": 2418} {"train_loss": -24.583784103393555, "global_step": 200737, "epoch": 2418} {"train_loss": -24.31245994567871, "global_step": 200738, "epoch": 2418} {"train_loss": -24.0451717376709, "global_step": 200739, "epoch": 2418} {"train_loss": -24.02812385559082, "global_step": 200740, "epoch": 2418} {"train_loss": -24.198078155517578, "global_step": 200741, "epoch": 2418} {"train_loss": -23.986886978149414, "global_step": 200742, "epoch": 2418} {"train_loss": -24.05287742614746, "global_step": 200743, "epoch": 2418} {"train_loss": -24.128034591674805, "global_step": 200744, "epoch": 2418} {"train_loss": -24.144302368164062, "global_step": 200745, "epoch": 2418} {"train_loss": -24.20273208618164, "global_step": 200746, "epoch": 2418} {"train_loss": -24.311471939086914, "global_step": 200747, "epoch": 2418} {"train_loss": -24.497167587280273, "global_step": 200748, "epoch": 2418} {"train_loss": -24.274545669555664, "global_step": 200749, "epoch": 2418} {"train_loss": -24.33526039123535, "global_step": 200750, "epoch": 2418} {"train_loss": -24.225814819335938, "global_step": 200751, "epoch": 2418} {"train_loss": -24.151254653930664, "global_step": 200752, "epoch": 2418} {"train_loss": -24.206039428710938, "global_step": 200753, "epoch": 2418} {"train_loss": -24.51263427734375, "global_step": 200754, "epoch": 2418} {"train_loss": -24.310550689697266, "global_step": 200755, "epoch": 2418} {"train_loss": -24.03830909729004, "global_step": 200756, "epoch": 2418} {"train_loss": -24.438993453979492, "global_step": 200757, "epoch": 2418} {"train_loss": -24.02294158935547, "global_step": 200758, "epoch": 2418} {"train_loss": -24.33515739440918, "global_step": 200759, "epoch": 2418} {"train_loss": -24.189847946166992, "global_step": 200760, "epoch": 2418} {"train_loss": -24.09842872619629, "global_step": 200761, "epoch": 2418} {"train_loss": -24.579193115234375, "global_step": 200762, "epoch": 2418} {"train_loss": -24.333547592163086, "global_step": 200763, "epoch": 2418} {"train_loss": -24.430028915405273, "global_step": 200764, "epoch": 2418} {"train_loss": -24.39307975769043, "global_step": 200765, "epoch": 2418} {"train_loss": -24.602828979492188, "global_step": 200766, "epoch": 2418} {"train_loss": -24.503576278686523, "global_step": 200767, "epoch": 2418} {"train_loss": -24.409255981445312, "global_step": 200768, "epoch": 2418} {"train_loss": -24.385456085205078, "global_step": 200769, "epoch": 2418} {"train_loss": -24.092090606689453, "global_step": 200770, "epoch": 2418} {"train_loss": -24.488754272460938, "global_step": 200771, "epoch": 2418} {"train_loss": -24.41039276123047, "global_step": 200772, "epoch": 2418} {"train_loss": -24.321744918823242, "global_step": 200773, "epoch": 2418} {"train_loss": -24.246885299682617, "global_step": 200774, "epoch": 2418} {"train_loss": -24.25834083557129, "global_step": 200775, "epoch": 2418} {"train_loss": -24.156195629073913, "global_step": 200776, "epoch": 2418, "val_loss": 6551651.0} {"train_loss": -23.97330665588379, "global_step": 200777, "epoch": 2419} {"train_loss": -23.592369079589844, "global_step": 200778, "epoch": 2419} {"train_loss": -23.35492515563965, "global_step": 200779, "epoch": 2419} {"train_loss": -23.856266021728516, "global_step": 200780, "epoch": 2419} {"train_loss": -23.87034034729004, "global_step": 200781, "epoch": 2419} {"train_loss": -23.898195266723633, "global_step": 200782, "epoch": 2419} {"train_loss": -24.204029083251953, "global_step": 200783, "epoch": 2419} {"train_loss": -24.44745445251465, "global_step": 200784, "epoch": 2419} {"train_loss": -23.966785430908203, "global_step": 200785, "epoch": 2419} {"train_loss": -24.030826568603516, "global_step": 200786, "epoch": 2419} {"train_loss": -23.670101165771484, "global_step": 200787, "epoch": 2419} {"train_loss": -24.31058692932129, "global_step": 200788, "epoch": 2419} {"train_loss": -24.296438217163086, "global_step": 200789, "epoch": 2419} {"train_loss": -23.877897262573242, "global_step": 200790, "epoch": 2419} {"train_loss": -24.143587112426758, "global_step": 200791, "epoch": 2419} {"train_loss": -23.800540924072266, "global_step": 200792, "epoch": 2419} {"train_loss": -24.648645401000977, "global_step": 200793, "epoch": 2419} {"train_loss": -24.11444091796875, "global_step": 200794, "epoch": 2419} {"train_loss": -24.361724853515625, "global_step": 200795, "epoch": 2419} {"train_loss": -24.48602867126465, "global_step": 200796, "epoch": 2419} {"train_loss": -24.049575805664062, "global_step": 200797, "epoch": 2419} {"train_loss": -24.112646102905273, "global_step": 200798, "epoch": 2419} {"train_loss": -24.547574996948242, "global_step": 200799, "epoch": 2419} {"train_loss": -23.87116813659668, "global_step": 200800, "epoch": 2419} {"train_loss": -24.174823760986328, "global_step": 200801, "epoch": 2419} {"train_loss": -24.097949981689453, "global_step": 200802, "epoch": 2419} {"train_loss": -24.528913497924805, "global_step": 200803, "epoch": 2419} {"train_loss": -24.121370315551758, "global_step": 200804, "epoch": 2419} {"train_loss": -24.078834533691406, "global_step": 200805, "epoch": 2419} {"train_loss": -24.122800827026367, "global_step": 200806, "epoch": 2419} {"train_loss": -24.1800537109375, "global_step": 200807, "epoch": 2419} {"train_loss": -24.214574813842773, "global_step": 200808, "epoch": 2419} {"train_loss": -24.390764236450195, "global_step": 200809, "epoch": 2419} {"train_loss": -24.148862838745117, "global_step": 200810, "epoch": 2419} {"train_loss": -24.186609268188477, "global_step": 200811, "epoch": 2419} {"train_loss": -24.24242401123047, "global_step": 200812, "epoch": 2419} {"train_loss": -23.925033569335938, "global_step": 200813, "epoch": 2419} {"train_loss": -24.348066329956055, "global_step": 200814, "epoch": 2419} {"train_loss": -24.179548263549805, "global_step": 200815, "epoch": 2419} {"train_loss": -24.229467391967773, "global_step": 200816, "epoch": 2419} {"train_loss": -24.018335342407227, "global_step": 200817, "epoch": 2419} {"train_loss": -24.847614288330078, "global_step": 200818, "epoch": 2419} {"train_loss": -24.456981658935547, "global_step": 200819, "epoch": 2419} {"train_loss": -24.37360191345215, "global_step": 200820, "epoch": 2419} {"train_loss": -24.172243118286133, "global_step": 200821, "epoch": 2419} {"train_loss": -24.163724899291992, "global_step": 200822, "epoch": 2419} {"train_loss": -24.086734771728516, "global_step": 200823, "epoch": 2419} {"train_loss": -23.95948600769043, "global_step": 200824, "epoch": 2419} {"train_loss": -24.202329635620117, "global_step": 200825, "epoch": 2419} {"train_loss": -24.346609115600586, "global_step": 200826, "epoch": 2419} {"train_loss": -24.227962493896484, "global_step": 200827, "epoch": 2419} {"train_loss": -23.86941909790039, "global_step": 200828, "epoch": 2419} {"train_loss": -24.229053497314453, "global_step": 200829, "epoch": 2419} {"train_loss": -24.266681671142578, "global_step": 200830, "epoch": 2419} {"train_loss": -24.234880447387695, "global_step": 200831, "epoch": 2419} {"train_loss": -24.295602798461914, "global_step": 200832, "epoch": 2419} {"train_loss": -24.51628875732422, "global_step": 200833, "epoch": 2419} {"train_loss": -24.256319046020508, "global_step": 200834, "epoch": 2419} {"train_loss": -23.929040908813477, "global_step": 200835, "epoch": 2419} {"train_loss": -24.50046730041504, "global_step": 200836, "epoch": 2419} {"train_loss": -24.067642211914062, "global_step": 200837, "epoch": 2419} {"train_loss": -24.401418685913086, "global_step": 200838, "epoch": 2419} {"train_loss": -23.95875358581543, "global_step": 200839, "epoch": 2419} {"train_loss": -24.27346420288086, "global_step": 200840, "epoch": 2419} {"train_loss": -24.438634872436523, "global_step": 200841, "epoch": 2419} {"train_loss": -23.90734100341797, "global_step": 200842, "epoch": 2419} {"train_loss": -24.227338790893555, "global_step": 200843, "epoch": 2419} {"train_loss": -24.130109786987305, "global_step": 200844, "epoch": 2419} {"train_loss": -24.24167823791504, "global_step": 200845, "epoch": 2419} {"train_loss": -23.95166778564453, "global_step": 200846, "epoch": 2419} {"train_loss": -24.20212173461914, "global_step": 200847, "epoch": 2419} {"train_loss": -24.368566513061523, "global_step": 200848, "epoch": 2419} {"train_loss": -24.01252555847168, "global_step": 200849, "epoch": 2419} {"train_loss": -24.166168212890625, "global_step": 200850, "epoch": 2419} {"train_loss": -24.1390438079834, "global_step": 200851, "epoch": 2419} {"train_loss": -24.41762351989746, "global_step": 200852, "epoch": 2419} {"train_loss": -24.019723892211914, "global_step": 200853, "epoch": 2419} {"train_loss": -24.531436920166016, "global_step": 200854, "epoch": 2419} {"train_loss": -24.441757202148438, "global_step": 200855, "epoch": 2419} {"train_loss": -23.989606857299805, "global_step": 200856, "epoch": 2419} {"train_loss": -24.6755428314209, "global_step": 200857, "epoch": 2419} {"train_loss": -24.3040771484375, "global_step": 200858, "epoch": 2419} {"train_loss": -24.188643122293865, "global_step": 200859, "epoch": 2419, "val_loss": 6519586.0} {"train_loss": -24.133390426635742, "global_step": 200860, "epoch": 2420} {"train_loss": -23.580963134765625, "global_step": 200861, "epoch": 2420} {"train_loss": -23.9056396484375, "global_step": 200862, "epoch": 2420} {"train_loss": -24.240644454956055, "global_step": 200863, "epoch": 2420} {"train_loss": -23.557313919067383, "global_step": 200864, "epoch": 2420} {"train_loss": -23.940156936645508, "global_step": 200865, "epoch": 2420} {"train_loss": -24.013471603393555, "global_step": 200866, "epoch": 2420} {"train_loss": -23.8640193939209, "global_step": 200867, "epoch": 2420} {"train_loss": -24.10772132873535, "global_step": 200868, "epoch": 2420} {"train_loss": -23.72251319885254, "global_step": 200869, "epoch": 2420} {"train_loss": -24.238924026489258, "global_step": 200870, "epoch": 2420} {"train_loss": -24.012561798095703, "global_step": 200871, "epoch": 2420} {"train_loss": -24.205947875976562, "global_step": 200872, "epoch": 2420} {"train_loss": -24.481260299682617, "global_step": 200873, "epoch": 2420} {"train_loss": -24.124425888061523, "global_step": 200874, "epoch": 2420} {"train_loss": -24.297143936157227, "global_step": 200875, "epoch": 2420} {"train_loss": -23.86124038696289, "global_step": 200876, "epoch": 2420} {"train_loss": -23.817020416259766, "global_step": 200877, "epoch": 2420} {"train_loss": -24.297391891479492, "global_step": 200878, "epoch": 2420} {"train_loss": -24.14374351501465, "global_step": 200879, "epoch": 2420} {"train_loss": -24.177061080932617, "global_step": 200880, "epoch": 2420} {"train_loss": -23.79047203063965, "global_step": 200881, "epoch": 2420} {"train_loss": -24.383291244506836, "global_step": 200882, "epoch": 2420} {"train_loss": -24.730329513549805, "global_step": 200883, "epoch": 2420} {"train_loss": -24.2529296875, "global_step": 200884, "epoch": 2420} {"train_loss": -24.24314308166504, "global_step": 200885, "epoch": 2420} {"train_loss": -24.04240608215332, "global_step": 200886, "epoch": 2420} {"train_loss": -24.269132614135742, "global_step": 200887, "epoch": 2420} {"train_loss": -24.24837875366211, "global_step": 200888, "epoch": 2420} {"train_loss": -24.208402633666992, "global_step": 200889, "epoch": 2420} {"train_loss": -24.229597091674805, "global_step": 200890, "epoch": 2420} {"train_loss": -24.240278244018555, "global_step": 200891, "epoch": 2420} {"train_loss": -24.40138053894043, "global_step": 200892, "epoch": 2420} {"train_loss": -24.39130210876465, "global_step": 200893, "epoch": 2420} {"train_loss": -24.58824920654297, "global_step": 200894, "epoch": 2420} {"train_loss": -24.38496971130371, "global_step": 200895, "epoch": 2420} {"train_loss": -24.60319709777832, "global_step": 200896, "epoch": 2420} {"train_loss": -24.12040138244629, "global_step": 200897, "epoch": 2420} {"train_loss": -24.479080200195312, "global_step": 200898, "epoch": 2420} {"train_loss": -24.69520378112793, "global_step": 200899, "epoch": 2420} {"train_loss": -24.443571090698242, "global_step": 200900, "epoch": 2420} {"train_loss": -24.352928161621094, "global_step": 200901, "epoch": 2420} {"train_loss": -23.901308059692383, "global_step": 200902, "epoch": 2420} {"train_loss": -24.154773712158203, "global_step": 200903, "epoch": 2420} {"train_loss": -24.23279571533203, "global_step": 200904, "epoch": 2420} {"train_loss": -24.13227653503418, "global_step": 200905, "epoch": 2420} {"train_loss": -24.23508071899414, "global_step": 200906, "epoch": 2420} {"train_loss": -24.423505783081055, "global_step": 200907, "epoch": 2420} {"train_loss": -24.476497650146484, "global_step": 200908, "epoch": 2420} {"train_loss": -24.531604766845703, "global_step": 200909, "epoch": 2420} {"train_loss": -23.6677303314209, "global_step": 200910, "epoch": 2420} {"train_loss": -23.711877822875977, "global_step": 200911, "epoch": 2420} {"train_loss": -23.17384147644043, "global_step": 200912, "epoch": 2420} {"train_loss": -23.200658798217773, "global_step": 200913, "epoch": 2420} {"train_loss": -23.73702049255371, "global_step": 200914, "epoch": 2420} {"train_loss": -24.74869728088379, "global_step": 200915, "epoch": 2420} {"train_loss": -23.74000358581543, "global_step": 200916, "epoch": 2420} {"train_loss": -23.992244720458984, "global_step": 200917, "epoch": 2420} {"train_loss": -24.474815368652344, "global_step": 200918, "epoch": 2420} {"train_loss": -24.103281021118164, "global_step": 200919, "epoch": 2420} {"train_loss": -23.56751823425293, "global_step": 200920, "epoch": 2420} {"train_loss": -24.212644577026367, "global_step": 200921, "epoch": 2420} {"train_loss": -24.03968048095703, "global_step": 200922, "epoch": 2420} {"train_loss": -24.17496109008789, "global_step": 200923, "epoch": 2420} {"train_loss": -23.977685928344727, "global_step": 200924, "epoch": 2420} {"train_loss": -24.18789291381836, "global_step": 200925, "epoch": 2420} {"train_loss": -24.02458953857422, "global_step": 200926, "epoch": 2420} {"train_loss": -23.99458122253418, "global_step": 200927, "epoch": 2420} {"train_loss": -24.23185920715332, "global_step": 200928, "epoch": 2420} {"train_loss": -23.944047927856445, "global_step": 200929, "epoch": 2420} {"train_loss": -24.261783599853516, "global_step": 200930, "epoch": 2420} {"train_loss": -23.961435317993164, "global_step": 200931, "epoch": 2420} {"train_loss": -24.02201271057129, "global_step": 200932, "epoch": 2420} {"train_loss": -24.286495208740234, "global_step": 200933, "epoch": 2420} {"train_loss": -24.242422103881836, "global_step": 200934, "epoch": 2420} {"train_loss": -24.325057983398438, "global_step": 200935, "epoch": 2420} {"train_loss": -24.12917137145996, "global_step": 200936, "epoch": 2420} {"train_loss": -24.624753952026367, "global_step": 200937, "epoch": 2420} {"train_loss": -24.35426139831543, "global_step": 200938, "epoch": 2420} {"train_loss": -24.277326583862305, "global_step": 200939, "epoch": 2420} {"train_loss": -24.336427688598633, "global_step": 200940, "epoch": 2420} {"train_loss": -24.643104553222656, "global_step": 200941, "epoch": 2420} {"train_loss": -24.147476196289062, "global_step": 200942, "epoch": 2420, "val_loss": 6589904.5} {"train_loss": -23.871479034423828, "global_step": 200943, "epoch": 2421} {"train_loss": -23.882247924804688, "global_step": 200944, "epoch": 2421} {"train_loss": -24.105804443359375, "global_step": 200945, "epoch": 2421} {"train_loss": -23.81488037109375, "global_step": 200946, "epoch": 2421} {"train_loss": -23.423704147338867, "global_step": 200947, "epoch": 2421} {"train_loss": -23.84433937072754, "global_step": 200948, "epoch": 2421} {"train_loss": -23.656726837158203, "global_step": 200949, "epoch": 2421} {"train_loss": -23.9429931640625, "global_step": 200950, "epoch": 2421} {"train_loss": -23.815210342407227, "global_step": 200951, "epoch": 2421} {"train_loss": -23.84649085998535, "global_step": 200952, "epoch": 2421} {"train_loss": -23.975996017456055, "global_step": 200953, "epoch": 2421} {"train_loss": -23.53489112854004, "global_step": 200954, "epoch": 2421} {"train_loss": -23.94822120666504, "global_step": 200955, "epoch": 2421} {"train_loss": -23.679157257080078, "global_step": 200956, "epoch": 2421} {"train_loss": -23.950180053710938, "global_step": 200957, "epoch": 2421} {"train_loss": -23.643491744995117, "global_step": 200958, "epoch": 2421} {"train_loss": -23.752290725708008, "global_step": 200959, "epoch": 2421} {"train_loss": -23.964609146118164, "global_step": 200960, "epoch": 2421} {"train_loss": -23.987003326416016, "global_step": 200961, "epoch": 2421} {"train_loss": -24.029085159301758, "global_step": 200962, "epoch": 2421} {"train_loss": -24.04483985900879, "global_step": 200963, "epoch": 2421} {"train_loss": -24.182085037231445, "global_step": 200964, "epoch": 2421} {"train_loss": -24.09355926513672, "global_step": 200965, "epoch": 2421} {"train_loss": -23.890295028686523, "global_step": 200966, "epoch": 2421} {"train_loss": -23.981901168823242, "global_step": 200967, "epoch": 2421} {"train_loss": -24.21363639831543, "global_step": 200968, "epoch": 2421} {"train_loss": -24.060401916503906, "global_step": 200969, "epoch": 2421} {"train_loss": -24.104419708251953, "global_step": 200970, "epoch": 2421} {"train_loss": -23.923734664916992, "global_step": 200971, "epoch": 2421} {"train_loss": -24.46905517578125, "global_step": 200972, "epoch": 2421} {"train_loss": -24.19074821472168, "global_step": 200973, "epoch": 2421} {"train_loss": -24.314340591430664, "global_step": 200974, "epoch": 2421} {"train_loss": -24.24196434020996, "global_step": 200975, "epoch": 2421} {"train_loss": -24.16518211364746, "global_step": 200976, "epoch": 2421} {"train_loss": -24.199722290039062, "global_step": 200977, "epoch": 2421} {"train_loss": -23.64939308166504, "global_step": 200978, "epoch": 2421} {"train_loss": -24.185699462890625, "global_step": 200979, "epoch": 2421} {"train_loss": -24.109445571899414, "global_step": 200980, "epoch": 2421} {"train_loss": -24.03249168395996, "global_step": 200981, "epoch": 2421} {"train_loss": -24.08185577392578, "global_step": 200982, "epoch": 2421} {"train_loss": -24.24070167541504, "global_step": 200983, "epoch": 2421} {"train_loss": -24.29190444946289, "global_step": 200984, "epoch": 2421} {"train_loss": -24.35746192932129, "global_step": 200985, "epoch": 2421} {"train_loss": -24.36147689819336, "global_step": 200986, "epoch": 2421} {"train_loss": -24.33492088317871, "global_step": 200987, "epoch": 2421} {"train_loss": -24.581466674804688, "global_step": 200988, "epoch": 2421} {"train_loss": -24.497684478759766, "global_step": 200989, "epoch": 2421} {"train_loss": -24.352441787719727, "global_step": 200990, "epoch": 2421} {"train_loss": -24.59136390686035, "global_step": 200991, "epoch": 2421} {"train_loss": -24.548450469970703, "global_step": 200992, "epoch": 2421} {"train_loss": -24.024063110351562, "global_step": 200993, "epoch": 2421} {"train_loss": -24.2791690826416, "global_step": 200994, "epoch": 2421} {"train_loss": -24.096389770507812, "global_step": 200995, "epoch": 2421} {"train_loss": -24.177326202392578, "global_step": 200996, "epoch": 2421} {"train_loss": -24.404069900512695, "global_step": 200997, "epoch": 2421} {"train_loss": -24.353586196899414, "global_step": 200998, "epoch": 2421} {"train_loss": -24.296316146850586, "global_step": 200999, "epoch": 2421} {"train_loss": -24.38814353942871, "global_step": 201000, "epoch": 2421} {"train_loss": -24.40827751159668, "global_step": 201001, "epoch": 2421} {"train_loss": -24.562192916870117, "global_step": 201002, "epoch": 2421} {"train_loss": -24.38427734375, "global_step": 201003, "epoch": 2421} {"train_loss": -24.28635597229004, "global_step": 201004, "epoch": 2421} {"train_loss": -24.13204574584961, "global_step": 201005, "epoch": 2421} {"train_loss": -24.475324630737305, "global_step": 201006, "epoch": 2421} {"train_loss": -24.46894645690918, "global_step": 201007, "epoch": 2421} {"train_loss": -24.381515502929688, "global_step": 201008, "epoch": 2421} {"train_loss": -24.64023780822754, "global_step": 201009, "epoch": 2421} {"train_loss": -24.240476608276367, "global_step": 201010, "epoch": 2421} {"train_loss": -24.643766403198242, "global_step": 201011, "epoch": 2421} {"train_loss": -24.17887306213379, "global_step": 201012, "epoch": 2421} {"train_loss": -24.422712326049805, "global_step": 201013, "epoch": 2421} {"train_loss": -24.476612091064453, "global_step": 201014, "epoch": 2421} {"train_loss": -24.39927101135254, "global_step": 201015, "epoch": 2421} {"train_loss": -24.36531639099121, "global_step": 201016, "epoch": 2421} {"train_loss": -24.607030868530273, "global_step": 201017, "epoch": 2421} {"train_loss": -24.476835250854492, "global_step": 201018, "epoch": 2421} {"train_loss": -24.66459083557129, "global_step": 201019, "epoch": 2421} {"train_loss": -24.2069034576416, "global_step": 201020, "epoch": 2421} {"train_loss": -24.779199600219727, "global_step": 201021, "epoch": 2421} {"train_loss": -23.949237823486328, "global_step": 201022, "epoch": 2421} {"train_loss": -24.504043579101562, "global_step": 201023, "epoch": 2421} {"train_loss": -24.878686904907227, "global_step": 201024, "epoch": 2421} {"train_loss": -24.179840777293744, "global_step": 201025, "epoch": 2421, "val_loss": 6562333.0} {"train_loss": -23.69737434387207, "global_step": 201026, "epoch": 2422} {"train_loss": -24.00613784790039, "global_step": 201027, "epoch": 2422} {"train_loss": -24.278913497924805, "global_step": 201028, "epoch": 2422} {"train_loss": -23.417686462402344, "global_step": 201029, "epoch": 2422} {"train_loss": -22.762409210205078, "global_step": 201030, "epoch": 2422} {"train_loss": -22.359512329101562, "global_step": 201031, "epoch": 2422} {"train_loss": -23.61298179626465, "global_step": 201032, "epoch": 2422} {"train_loss": -23.783132553100586, "global_step": 201033, "epoch": 2422} {"train_loss": -23.512792587280273, "global_step": 201034, "epoch": 2422} {"train_loss": -23.99812126159668, "global_step": 201035, "epoch": 2422} {"train_loss": -23.675552368164062, "global_step": 201036, "epoch": 2422} {"train_loss": -23.654020309448242, "global_step": 201037, "epoch": 2422} {"train_loss": -23.444536209106445, "global_step": 201038, "epoch": 2422} {"train_loss": -23.794118881225586, "global_step": 201039, "epoch": 2422} {"train_loss": -24.300573348999023, "global_step": 201040, "epoch": 2422} {"train_loss": -24.194013595581055, "global_step": 201041, "epoch": 2422} {"train_loss": -23.8635196685791, "global_step": 201042, "epoch": 2422} {"train_loss": -24.031394958496094, "global_step": 201043, "epoch": 2422} {"train_loss": -24.138044357299805, "global_step": 201044, "epoch": 2422} {"train_loss": -23.990745544433594, "global_step": 201045, "epoch": 2422} {"train_loss": -24.310623168945312, "global_step": 201046, "epoch": 2422} {"train_loss": -23.926883697509766, "global_step": 201047, "epoch": 2422} {"train_loss": -24.2971248626709, "global_step": 201048, "epoch": 2422} {"train_loss": -24.011892318725586, "global_step": 201049, "epoch": 2422} {"train_loss": -23.957324981689453, "global_step": 201050, "epoch": 2422} {"train_loss": -23.608783721923828, "global_step": 201051, "epoch": 2422} {"train_loss": -23.850635528564453, "global_step": 201052, "epoch": 2422} {"train_loss": -24.09885025024414, "global_step": 201053, "epoch": 2422} {"train_loss": -24.407630920410156, "global_step": 201054, "epoch": 2422} {"train_loss": -23.89170265197754, "global_step": 201055, "epoch": 2422} {"train_loss": -24.206459045410156, "global_step": 201056, "epoch": 2422} {"train_loss": -24.328725814819336, "global_step": 201057, "epoch": 2422} {"train_loss": -24.208805084228516, "global_step": 201058, "epoch": 2422} {"train_loss": -23.953094482421875, "global_step": 201059, "epoch": 2422} {"train_loss": -24.437524795532227, "global_step": 201060, "epoch": 2422} {"train_loss": -24.346195220947266, "global_step": 201061, "epoch": 2422} {"train_loss": -24.43572425842285, "global_step": 201062, "epoch": 2422} {"train_loss": -24.53424644470215, "global_step": 201063, "epoch": 2422} {"train_loss": -24.113967895507812, "global_step": 201064, "epoch": 2422} {"train_loss": -24.008502960205078, "global_step": 201065, "epoch": 2422} {"train_loss": -24.268230438232422, "global_step": 201066, "epoch": 2422} {"train_loss": -24.571935653686523, "global_step": 201067, "epoch": 2422} {"train_loss": -24.17586326599121, "global_step": 201068, "epoch": 2422} {"train_loss": -24.93722915649414, "global_step": 201069, "epoch": 2422} {"train_loss": -24.3383846282959, "global_step": 201070, "epoch": 2422} {"train_loss": -24.358600616455078, "global_step": 201071, "epoch": 2422} {"train_loss": -24.056175231933594, "global_step": 201072, "epoch": 2422} {"train_loss": -24.550016403198242, "global_step": 201073, "epoch": 2422} {"train_loss": -24.06036949157715, "global_step": 201074, "epoch": 2422} {"train_loss": -24.25351905822754, "global_step": 201075, "epoch": 2422} {"train_loss": -24.61332130432129, "global_step": 201076, "epoch": 2422} {"train_loss": -24.177661895751953, "global_step": 201077, "epoch": 2422} {"train_loss": -24.394710540771484, "global_step": 201078, "epoch": 2422} {"train_loss": -24.430423736572266, "global_step": 201079, "epoch": 2422} {"train_loss": -24.121397018432617, "global_step": 201080, "epoch": 2422} {"train_loss": -24.24550437927246, "global_step": 201081, "epoch": 2422} {"train_loss": -24.156726837158203, "global_step": 201082, "epoch": 2422} {"train_loss": -24.947065353393555, "global_step": 201083, "epoch": 2422} {"train_loss": -24.101795196533203, "global_step": 201084, "epoch": 2422} {"train_loss": -24.16181755065918, "global_step": 201085, "epoch": 2422} {"train_loss": -24.44626235961914, "global_step": 201086, "epoch": 2422} {"train_loss": -24.528623580932617, "global_step": 201087, "epoch": 2422} {"train_loss": -24.291553497314453, "global_step": 201088, "epoch": 2422} {"train_loss": -24.164777755737305, "global_step": 201089, "epoch": 2422} {"train_loss": -24.60355567932129, "global_step": 201090, "epoch": 2422} {"train_loss": -24.22041130065918, "global_step": 201091, "epoch": 2422} {"train_loss": -24.440414428710938, "global_step": 201092, "epoch": 2422} {"train_loss": -24.142541885375977, "global_step": 201093, "epoch": 2422} {"train_loss": -24.492843627929688, "global_step": 201094, "epoch": 2422} {"train_loss": -24.330350875854492, "global_step": 201095, "epoch": 2422} {"train_loss": -24.46182632446289, "global_step": 201096, "epoch": 2422} {"train_loss": -24.20413589477539, "global_step": 201097, "epoch": 2422} {"train_loss": -24.53511619567871, "global_step": 201098, "epoch": 2422} {"train_loss": -24.230501174926758, "global_step": 201099, "epoch": 2422} {"train_loss": -24.5030517578125, "global_step": 201100, "epoch": 2422} {"train_loss": -24.45517921447754, "global_step": 201101, "epoch": 2422} {"train_loss": -24.834766387939453, "global_step": 201102, "epoch": 2422} {"train_loss": -24.62737464904785, "global_step": 201103, "epoch": 2422} {"train_loss": -24.69808006286621, "global_step": 201104, "epoch": 2422} {"train_loss": -24.573139190673828, "global_step": 201105, "epoch": 2422} {"train_loss": -24.12521743774414, "global_step": 201106, "epoch": 2422} {"train_loss": -23.99137306213379, "global_step": 201107, "epoch": 2422} {"train_loss": -24.160551898450738, "global_step": 201108, "epoch": 2422, "val_loss": 6559627.0} {"train_loss": -23.27311134338379, "global_step": 201109, "epoch": 2423} {"train_loss": -23.077085494995117, "global_step": 201110, "epoch": 2423} {"train_loss": -23.366621017456055, "global_step": 201111, "epoch": 2423} {"train_loss": -23.232072830200195, "global_step": 201112, "epoch": 2423} {"train_loss": -23.90382194519043, "global_step": 201113, "epoch": 2423} {"train_loss": -23.27335548400879, "global_step": 201114, "epoch": 2423} {"train_loss": -23.54636001586914, "global_step": 201115, "epoch": 2423} {"train_loss": -23.73419189453125, "global_step": 201116, "epoch": 2423} {"train_loss": -23.796178817749023, "global_step": 201117, "epoch": 2423} {"train_loss": -23.8496150970459, "global_step": 201118, "epoch": 2423} {"train_loss": -23.7629337310791, "global_step": 201119, "epoch": 2423} {"train_loss": -23.49299430847168, "global_step": 201120, "epoch": 2423} {"train_loss": -23.632843017578125, "global_step": 201121, "epoch": 2423} {"train_loss": -24.15643882751465, "global_step": 201122, "epoch": 2423} {"train_loss": -23.494274139404297, "global_step": 201123, "epoch": 2423} {"train_loss": -23.852811813354492, "global_step": 201124, "epoch": 2423} {"train_loss": -23.748815536499023, "global_step": 201125, "epoch": 2423} {"train_loss": -23.758935928344727, "global_step": 201126, "epoch": 2423} {"train_loss": -24.006078720092773, "global_step": 201127, "epoch": 2423} {"train_loss": -24.122730255126953, "global_step": 201128, "epoch": 2423} {"train_loss": -24.053924560546875, "global_step": 201129, "epoch": 2423} {"train_loss": -23.851438522338867, "global_step": 201130, "epoch": 2423} {"train_loss": -23.989242553710938, "global_step": 201131, "epoch": 2423} {"train_loss": -23.875255584716797, "global_step": 201132, "epoch": 2423} {"train_loss": -24.31438636779785, "global_step": 201133, "epoch": 2423} {"train_loss": -24.06208038330078, "global_step": 201134, "epoch": 2423} {"train_loss": -24.213293075561523, "global_step": 201135, "epoch": 2423} {"train_loss": -23.95650291442871, "global_step": 201136, "epoch": 2423} {"train_loss": -24.43147850036621, "global_step": 201137, "epoch": 2423} {"train_loss": -24.459693908691406, "global_step": 201138, "epoch": 2423} {"train_loss": -24.05826187133789, "global_step": 201139, "epoch": 2423} {"train_loss": -23.869787216186523, "global_step": 201140, "epoch": 2423} {"train_loss": -24.7032470703125, "global_step": 201141, "epoch": 2423} {"train_loss": -24.45551872253418, "global_step": 201142, "epoch": 2423} {"train_loss": -24.283531188964844, "global_step": 201143, "epoch": 2423} {"train_loss": -23.978336334228516, "global_step": 201144, "epoch": 2423} {"train_loss": -24.33624267578125, "global_step": 201145, "epoch": 2423} {"train_loss": -24.43149757385254, "global_step": 201146, "epoch": 2423} {"train_loss": -24.203857421875, "global_step": 201147, "epoch": 2423} {"train_loss": -24.534805297851562, "global_step": 201148, "epoch": 2423} {"train_loss": -24.254833221435547, "global_step": 201149, "epoch": 2423} {"train_loss": -24.18263053894043, "global_step": 201150, "epoch": 2423} {"train_loss": -24.21425437927246, "global_step": 201151, "epoch": 2423} {"train_loss": -24.153600692749023, "global_step": 201152, "epoch": 2423} {"train_loss": -24.224761962890625, "global_step": 201153, "epoch": 2423} {"train_loss": -23.74798583984375, "global_step": 201154, "epoch": 2423} {"train_loss": -24.46922492980957, "global_step": 201155, "epoch": 2423} {"train_loss": -24.226774215698242, "global_step": 201156, "epoch": 2423} {"train_loss": -24.26358985900879, "global_step": 201157, "epoch": 2423} {"train_loss": -24.200271606445312, "global_step": 201158, "epoch": 2423} {"train_loss": -24.285888671875, "global_step": 201159, "epoch": 2423} {"train_loss": -24.347787857055664, "global_step": 201160, "epoch": 2423} {"train_loss": -24.399316787719727, "global_step": 201161, "epoch": 2423} {"train_loss": -24.66985511779785, "global_step": 201162, "epoch": 2423} {"train_loss": -24.37132453918457, "global_step": 201163, "epoch": 2423} {"train_loss": -24.126920700073242, "global_step": 201164, "epoch": 2423} {"train_loss": -24.150583267211914, "global_step": 201165, "epoch": 2423} {"train_loss": -24.217817306518555, "global_step": 201166, "epoch": 2423} {"train_loss": -24.386619567871094, "global_step": 201167, "epoch": 2423} {"train_loss": -24.21707534790039, "global_step": 201168, "epoch": 2423} {"train_loss": -24.434995651245117, "global_step": 201169, "epoch": 2423} {"train_loss": -24.620500564575195, "global_step": 201170, "epoch": 2423} {"train_loss": -24.22681999206543, "global_step": 201171, "epoch": 2423} {"train_loss": -23.529966354370117, "global_step": 201172, "epoch": 2423} {"train_loss": -23.578510284423828, "global_step": 201173, "epoch": 2423} {"train_loss": -23.205106735229492, "global_step": 201174, "epoch": 2423} {"train_loss": -24.239656448364258, "global_step": 201175, "epoch": 2423} {"train_loss": -23.88266944885254, "global_step": 201176, "epoch": 2423} {"train_loss": -23.911054611206055, "global_step": 201177, "epoch": 2423} {"train_loss": -23.655057907104492, "global_step": 201178, "epoch": 2423} {"train_loss": -24.17793083190918, "global_step": 201179, "epoch": 2423} {"train_loss": -23.7790584564209, "global_step": 201180, "epoch": 2423} {"train_loss": -24.255813598632812, "global_step": 201181, "epoch": 2423} {"train_loss": -23.944395065307617, "global_step": 201182, "epoch": 2423} {"train_loss": -24.003986358642578, "global_step": 201183, "epoch": 2423} {"train_loss": -23.845426559448242, "global_step": 201184, "epoch": 2423} {"train_loss": -24.352523803710938, "global_step": 201185, "epoch": 2423} {"train_loss": -23.93145179748535, "global_step": 201186, "epoch": 2423} {"train_loss": -24.1610050201416, "global_step": 201187, "epoch": 2423} {"train_loss": -23.8830623626709, "global_step": 201188, "epoch": 2423} {"train_loss": -23.91713523864746, "global_step": 201189, "epoch": 2423} {"train_loss": -24.057296752929688, "global_step": 201190, "epoch": 2423} {"train_loss": -24.036678452089607, "global_step": 201191, "epoch": 2423, "val_loss": 6516796.0} {"train_loss": -24.28076171875, "global_step": 201192, "epoch": 2424} {"train_loss": -24.067655563354492, "global_step": 201193, "epoch": 2424} {"train_loss": -23.79781150817871, "global_step": 201194, "epoch": 2424} {"train_loss": -24.04425048828125, "global_step": 201195, "epoch": 2424} {"train_loss": -24.333843231201172, "global_step": 201196, "epoch": 2424} {"train_loss": -24.564979553222656, "global_step": 201197, "epoch": 2424} {"train_loss": -23.914113998413086, "global_step": 201198, "epoch": 2424} {"train_loss": -24.566946029663086, "global_step": 201199, "epoch": 2424} {"train_loss": -24.06172752380371, "global_step": 201200, "epoch": 2424} {"train_loss": -24.199161529541016, "global_step": 201201, "epoch": 2424} {"train_loss": -24.327322006225586, "global_step": 201202, "epoch": 2424} {"train_loss": -24.271867752075195, "global_step": 201203, "epoch": 2424} {"train_loss": -24.49137306213379, "global_step": 201204, "epoch": 2424} {"train_loss": -24.59085464477539, "global_step": 201205, "epoch": 2424} {"train_loss": -24.21442985534668, "global_step": 201206, "epoch": 2424} {"train_loss": -24.434574127197266, "global_step": 201207, "epoch": 2424} {"train_loss": -24.29996109008789, "global_step": 201208, "epoch": 2424} {"train_loss": -24.460906982421875, "global_step": 201209, "epoch": 2424} {"train_loss": -24.476993560791016, "global_step": 201210, "epoch": 2424} {"train_loss": -24.50290870666504, "global_step": 201211, "epoch": 2424} {"train_loss": -24.332834243774414, "global_step": 201212, "epoch": 2424} {"train_loss": -24.128686904907227, "global_step": 201213, "epoch": 2424} {"train_loss": -24.36883544921875, "global_step": 201214, "epoch": 2424} {"train_loss": -24.105113983154297, "global_step": 201215, "epoch": 2424} {"train_loss": -24.346906661987305, "global_step": 201216, "epoch": 2424} {"train_loss": -24.435165405273438, "global_step": 201217, "epoch": 2424} {"train_loss": -24.55900764465332, "global_step": 201218, "epoch": 2424} {"train_loss": -24.29530143737793, "global_step": 201219, "epoch": 2424} {"train_loss": -24.24825096130371, "global_step": 201220, "epoch": 2424} {"train_loss": -24.279340744018555, "global_step": 201221, "epoch": 2424} {"train_loss": -24.059247970581055, "global_step": 201222, "epoch": 2424} {"train_loss": -24.527664184570312, "global_step": 201223, "epoch": 2424} {"train_loss": -24.311704635620117, "global_step": 201224, "epoch": 2424} {"train_loss": -24.673452377319336, "global_step": 201225, "epoch": 2424} {"train_loss": -24.257095336914062, "global_step": 201226, "epoch": 2424} {"train_loss": -24.154388427734375, "global_step": 201227, "epoch": 2424} {"train_loss": -24.278066635131836, "global_step": 201228, "epoch": 2424} {"train_loss": -24.155805587768555, "global_step": 201229, "epoch": 2424} {"train_loss": -24.36177635192871, "global_step": 201230, "epoch": 2424} {"train_loss": -24.416738510131836, "global_step": 201231, "epoch": 2424} {"train_loss": -24.357633590698242, "global_step": 201232, "epoch": 2424} {"train_loss": -24.23467254638672, "global_step": 201233, "epoch": 2424} {"train_loss": -24.339717864990234, "global_step": 201234, "epoch": 2424} {"train_loss": -24.038928985595703, "global_step": 201235, "epoch": 2424} {"train_loss": -24.104591369628906, "global_step": 201236, "epoch": 2424} {"train_loss": -23.801794052124023, "global_step": 201237, "epoch": 2424} {"train_loss": -24.208078384399414, "global_step": 201238, "epoch": 2424} {"train_loss": -24.21491813659668, "global_step": 201239, "epoch": 2424} {"train_loss": -24.09173011779785, "global_step": 201240, "epoch": 2424} {"train_loss": -24.159318923950195, "global_step": 201241, "epoch": 2424} {"train_loss": -24.317886352539062, "global_step": 201242, "epoch": 2424} {"train_loss": -24.367429733276367, "global_step": 201243, "epoch": 2424} {"train_loss": -24.34996223449707, "global_step": 201244, "epoch": 2424} {"train_loss": -24.076322555541992, "global_step": 201245, "epoch": 2424} {"train_loss": -24.513837814331055, "global_step": 201246, "epoch": 2424} {"train_loss": -24.146568298339844, "global_step": 201247, "epoch": 2424} {"train_loss": -23.843645095825195, "global_step": 201248, "epoch": 2424} {"train_loss": -24.208860397338867, "global_step": 201249, "epoch": 2424} {"train_loss": -24.394916534423828, "global_step": 201250, "epoch": 2424} {"train_loss": -23.53278160095215, "global_step": 201251, "epoch": 2424} {"train_loss": -24.16615104675293, "global_step": 201252, "epoch": 2424} {"train_loss": -24.17365837097168, "global_step": 201253, "epoch": 2424} {"train_loss": -24.093225479125977, "global_step": 201254, "epoch": 2424} {"train_loss": -24.0648136138916, "global_step": 201255, "epoch": 2424} {"train_loss": -24.65608787536621, "global_step": 201256, "epoch": 2424} {"train_loss": -24.368759155273438, "global_step": 201257, "epoch": 2424} {"train_loss": -24.44403648376465, "global_step": 201258, "epoch": 2424} {"train_loss": -24.368377685546875, "global_step": 201259, "epoch": 2424} {"train_loss": -24.457284927368164, "global_step": 201260, "epoch": 2424} {"train_loss": -24.234434127807617, "global_step": 201261, "epoch": 2424} {"train_loss": -24.724760055541992, "global_step": 201262, "epoch": 2424} {"train_loss": -24.191831588745117, "global_step": 201263, "epoch": 2424} {"train_loss": -24.294086456298828, "global_step": 201264, "epoch": 2424} {"train_loss": -24.2977237701416, "global_step": 201265, "epoch": 2424} {"train_loss": -24.637531280517578, "global_step": 201266, "epoch": 2424} {"train_loss": -24.45792007446289, "global_step": 201267, "epoch": 2424} {"train_loss": -24.272741317749023, "global_step": 201268, "epoch": 2424} {"train_loss": -24.43439292907715, "global_step": 201269, "epoch": 2424} {"train_loss": -24.19503402709961, "global_step": 201270, "epoch": 2424} {"train_loss": -24.445281982421875, "global_step": 201271, "epoch": 2424} {"train_loss": -24.312692642211914, "global_step": 201272, "epoch": 2424} {"train_loss": -24.57994270324707, "global_step": 201273, "epoch": 2424} {"train_loss": -24.29747634336173, "global_step": 201274, "epoch": 2424, "val_loss": 6472993.0} {"train_loss": -23.97165298461914, "global_step": 201275, "epoch": 2425} {"train_loss": -23.531625747680664, "global_step": 201276, "epoch": 2425} {"train_loss": -24.00253677368164, "global_step": 201277, "epoch": 2425} {"train_loss": -23.343046188354492, "global_step": 201278, "epoch": 2425} {"train_loss": -23.64389419555664, "global_step": 201279, "epoch": 2425} {"train_loss": -23.847524642944336, "global_step": 201280, "epoch": 2425} {"train_loss": -23.861555099487305, "global_step": 201281, "epoch": 2425} {"train_loss": -23.808069229125977, "global_step": 201282, "epoch": 2425} {"train_loss": -23.95145606994629, "global_step": 201283, "epoch": 2425} {"train_loss": -24.052587509155273, "global_step": 201284, "epoch": 2425} {"train_loss": -24.342893600463867, "global_step": 201285, "epoch": 2425} {"train_loss": -23.602659225463867, "global_step": 201286, "epoch": 2425} {"train_loss": -23.839136123657227, "global_step": 201287, "epoch": 2425} {"train_loss": -23.66016960144043, "global_step": 201288, "epoch": 2425} {"train_loss": -24.169357299804688, "global_step": 201289, "epoch": 2425} {"train_loss": -24.112619400024414, "global_step": 201290, "epoch": 2425} {"train_loss": -24.089975357055664, "global_step": 201291, "epoch": 2425} {"train_loss": -23.62190818786621, "global_step": 201292, "epoch": 2425} {"train_loss": -24.089553833007812, "global_step": 201293, "epoch": 2425} {"train_loss": -24.090673446655273, "global_step": 201294, "epoch": 2425} {"train_loss": -24.090070724487305, "global_step": 201295, "epoch": 2425} {"train_loss": -24.36890983581543, "global_step": 201296, "epoch": 2425} {"train_loss": -23.920764923095703, "global_step": 201297, "epoch": 2425} {"train_loss": -24.401288986206055, "global_step": 201298, "epoch": 2425} {"train_loss": -24.08707046508789, "global_step": 201299, "epoch": 2425} {"train_loss": -24.369951248168945, "global_step": 201300, "epoch": 2425} {"train_loss": -24.111204147338867, "global_step": 201301, "epoch": 2425} {"train_loss": -24.218765258789062, "global_step": 201302, "epoch": 2425} {"train_loss": -24.15167808532715, "global_step": 201303, "epoch": 2425} {"train_loss": -23.77162742614746, "global_step": 201304, "epoch": 2425} {"train_loss": -24.30206871032715, "global_step": 201305, "epoch": 2425} {"train_loss": -24.22802734375, "global_step": 201306, "epoch": 2425} {"train_loss": -24.46661949157715, "global_step": 201307, "epoch": 2425} {"train_loss": -24.101715087890625, "global_step": 201308, "epoch": 2425} {"train_loss": -24.255849838256836, "global_step": 201309, "epoch": 2425} {"train_loss": -23.733556747436523, "global_step": 201310, "epoch": 2425} {"train_loss": -24.403371810913086, "global_step": 201311, "epoch": 2425} {"train_loss": -24.784345626831055, "global_step": 201312, "epoch": 2425} {"train_loss": -24.314794540405273, "global_step": 201313, "epoch": 2425} {"train_loss": -24.25790786743164, "global_step": 201314, "epoch": 2425} {"train_loss": -24.6652889251709, "global_step": 201315, "epoch": 2425} {"train_loss": -24.620634078979492, "global_step": 201316, "epoch": 2425} {"train_loss": -24.349170684814453, "global_step": 201317, "epoch": 2425} {"train_loss": -24.246356964111328, "global_step": 201318, "epoch": 2425} {"train_loss": -24.32301902770996, "global_step": 201319, "epoch": 2425} {"train_loss": -24.114736557006836, "global_step": 201320, "epoch": 2425} {"train_loss": -24.380746841430664, "global_step": 201321, "epoch": 2425} {"train_loss": -24.422861099243164, "global_step": 201322, "epoch": 2425} {"train_loss": -24.88600730895996, "global_step": 201323, "epoch": 2425} {"train_loss": -24.582571029663086, "global_step": 201324, "epoch": 2425} {"train_loss": -24.431257247924805, "global_step": 201325, "epoch": 2425} {"train_loss": -24.092498779296875, "global_step": 201326, "epoch": 2425} {"train_loss": -24.36531639099121, "global_step": 201327, "epoch": 2425} {"train_loss": -24.235023498535156, "global_step": 201328, "epoch": 2425} {"train_loss": -23.872709274291992, "global_step": 201329, "epoch": 2425} {"train_loss": -24.10919761657715, "global_step": 201330, "epoch": 2425} {"train_loss": -24.122724533081055, "global_step": 201331, "epoch": 2425} {"train_loss": -24.442068099975586, "global_step": 201332, "epoch": 2425} {"train_loss": -24.352697372436523, "global_step": 201333, "epoch": 2425} {"train_loss": -24.387025833129883, "global_step": 201334, "epoch": 2425} {"train_loss": -24.419336318969727, "global_step": 201335, "epoch": 2425} {"train_loss": -24.53000259399414, "global_step": 201336, "epoch": 2425} {"train_loss": -24.28646469116211, "global_step": 201337, "epoch": 2425} {"train_loss": -24.291854858398438, "global_step": 201338, "epoch": 2425} {"train_loss": -24.70191192626953, "global_step": 201339, "epoch": 2425} {"train_loss": -24.282066345214844, "global_step": 201340, "epoch": 2425} {"train_loss": -24.37725257873535, "global_step": 201341, "epoch": 2425} {"train_loss": -24.190820693969727, "global_step": 201342, "epoch": 2425} {"train_loss": -24.735815048217773, "global_step": 201343, "epoch": 2425} {"train_loss": -24.474027633666992, "global_step": 201344, "epoch": 2425} {"train_loss": -24.246702194213867, "global_step": 201345, "epoch": 2425} {"train_loss": -24.571388244628906, "global_step": 201346, "epoch": 2425} {"train_loss": -24.17665672302246, "global_step": 201347, "epoch": 2425} {"train_loss": -24.474491119384766, "global_step": 201348, "epoch": 2425} {"train_loss": -24.050588607788086, "global_step": 201349, "epoch": 2425} {"train_loss": -24.36705780029297, "global_step": 201350, "epoch": 2425} {"train_loss": -24.32686424255371, "global_step": 201351, "epoch": 2425} {"train_loss": -24.302051544189453, "global_step": 201352, "epoch": 2425} {"train_loss": -24.2985897064209, "global_step": 201353, "epoch": 2425} {"train_loss": -24.415679931640625, "global_step": 201354, "epoch": 2425} {"train_loss": -24.51718521118164, "global_step": 201355, "epoch": 2425} {"train_loss": -24.097930908203125, "global_step": 201356, "epoch": 2425} {"train_loss": -24.20334094403738, "global_step": 201357, "epoch": 2425, "val_loss": 6730824.5} {"train_loss": -20.73177146911621, "global_step": 201358, "epoch": 2426} {"train_loss": -20.902545928955078, "global_step": 201359, "epoch": 2426} {"train_loss": -21.64234161376953, "global_step": 201360, "epoch": 2426} {"train_loss": -21.557069778442383, "global_step": 201361, "epoch": 2426} {"train_loss": -21.935062408447266, "global_step": 201362, "epoch": 2426} {"train_loss": -22.34075927734375, "global_step": 201363, "epoch": 2426} {"train_loss": -21.906909942626953, "global_step": 201364, "epoch": 2426} {"train_loss": -22.11033058166504, "global_step": 201365, "epoch": 2426} {"train_loss": -22.65909767150879, "global_step": 201366, "epoch": 2426} {"train_loss": -22.5920467376709, "global_step": 201367, "epoch": 2426} {"train_loss": -22.487226486206055, "global_step": 201368, "epoch": 2426} {"train_loss": -22.67449951171875, "global_step": 201369, "epoch": 2426} {"train_loss": -22.59311294555664, "global_step": 201370, "epoch": 2426} {"train_loss": -22.612890243530273, "global_step": 201371, "epoch": 2426} {"train_loss": -23.103893280029297, "global_step": 201372, "epoch": 2426} {"train_loss": -22.709678649902344, "global_step": 201373, "epoch": 2426} {"train_loss": -23.035032272338867, "global_step": 201374, "epoch": 2426} {"train_loss": -22.964515686035156, "global_step": 201375, "epoch": 2426} {"train_loss": -23.447620391845703, "global_step": 201376, "epoch": 2426} {"train_loss": -22.99163246154785, "global_step": 201377, "epoch": 2426} {"train_loss": -23.174787521362305, "global_step": 201378, "epoch": 2426} {"train_loss": -23.018310546875, "global_step": 201379, "epoch": 2426} {"train_loss": -23.4312801361084, "global_step": 201380, "epoch": 2426} {"train_loss": -23.279638290405273, "global_step": 201381, "epoch": 2426} {"train_loss": -23.505064010620117, "global_step": 201382, "epoch": 2426} {"train_loss": -23.204458236694336, "global_step": 201383, "epoch": 2426} {"train_loss": -23.530624389648438, "global_step": 201384, "epoch": 2426} {"train_loss": -23.540708541870117, "global_step": 201385, "epoch": 2426} {"train_loss": -23.62462043762207, "global_step": 201386, "epoch": 2426} {"train_loss": -23.315195083618164, "global_step": 201387, "epoch": 2426} {"train_loss": -23.589624404907227, "global_step": 201388, "epoch": 2426} {"train_loss": -23.710132598876953, "global_step": 201389, "epoch": 2426} {"train_loss": -23.74094581604004, "global_step": 201390, "epoch": 2426} {"train_loss": -23.744680404663086, "global_step": 201391, "epoch": 2426} {"train_loss": -23.884790420532227, "global_step": 201392, "epoch": 2426} {"train_loss": -23.95660972595215, "global_step": 201393, "epoch": 2426} {"train_loss": -23.83734893798828, "global_step": 201394, "epoch": 2426} {"train_loss": -24.17342185974121, "global_step": 201395, "epoch": 2426} {"train_loss": -24.254776000976562, "global_step": 201396, "epoch": 2426} {"train_loss": -24.047183990478516, "global_step": 201397, "epoch": 2426} {"train_loss": -24.091949462890625, "global_step": 201398, "epoch": 2426} {"train_loss": -23.970218658447266, "global_step": 201399, "epoch": 2426} {"train_loss": -24.119709014892578, "global_step": 201400, "epoch": 2426} {"train_loss": -23.9337100982666, "global_step": 201401, "epoch": 2426} {"train_loss": -24.461156845092773, "global_step": 201402, "epoch": 2426} {"train_loss": -24.143884658813477, "global_step": 201403, "epoch": 2426} {"train_loss": -24.447046279907227, "global_step": 201404, "epoch": 2426} {"train_loss": -24.32163429260254, "global_step": 201405, "epoch": 2426} {"train_loss": -24.177841186523438, "global_step": 201406, "epoch": 2426} {"train_loss": -24.486080169677734, "global_step": 201407, "epoch": 2426} {"train_loss": -24.343050003051758, "global_step": 201408, "epoch": 2426} {"train_loss": -24.42451286315918, "global_step": 201409, "epoch": 2426} {"train_loss": -24.001747131347656, "global_step": 201410, "epoch": 2426} {"train_loss": -23.990161895751953, "global_step": 201411, "epoch": 2426} {"train_loss": -24.171241760253906, "global_step": 201412, "epoch": 2426} {"train_loss": -24.189441680908203, "global_step": 201413, "epoch": 2426} {"train_loss": -24.095678329467773, "global_step": 201414, "epoch": 2426} {"train_loss": -24.028074264526367, "global_step": 201415, "epoch": 2426} {"train_loss": -24.23126220703125, "global_step": 201416, "epoch": 2426} {"train_loss": -24.362348556518555, "global_step": 201417, "epoch": 2426} {"train_loss": -24.539810180664062, "global_step": 201418, "epoch": 2426} {"train_loss": -24.15363311767578, "global_step": 201419, "epoch": 2426} {"train_loss": -24.11275291442871, "global_step": 201420, "epoch": 2426} {"train_loss": -24.582605361938477, "global_step": 201421, "epoch": 2426} {"train_loss": -24.346601486206055, "global_step": 201422, "epoch": 2426} {"train_loss": -24.15958595275879, "global_step": 201423, "epoch": 2426} {"train_loss": -24.106143951416016, "global_step": 201424, "epoch": 2426} {"train_loss": -24.672212600708008, "global_step": 201425, "epoch": 2426} {"train_loss": -24.43877601623535, "global_step": 201426, "epoch": 2426} {"train_loss": -24.9096736907959, "global_step": 201427, "epoch": 2426} {"train_loss": -24.149459838867188, "global_step": 201428, "epoch": 2426} {"train_loss": -24.312673568725586, "global_step": 201429, "epoch": 2426} {"train_loss": -24.438434600830078, "global_step": 201430, "epoch": 2426} {"train_loss": -24.555103302001953, "global_step": 201431, "epoch": 2426} {"train_loss": -24.23507308959961, "global_step": 201432, "epoch": 2426} {"train_loss": -24.175460815429688, "global_step": 201433, "epoch": 2426} {"train_loss": -24.254262924194336, "global_step": 201434, "epoch": 2426} {"train_loss": -24.308332443237305, "global_step": 201435, "epoch": 2426} {"train_loss": -24.75178337097168, "global_step": 201436, "epoch": 2426} {"train_loss": -24.444473266601562, "global_step": 201437, "epoch": 2426} {"train_loss": -24.89636993408203, "global_step": 201438, "epoch": 2426} {"train_loss": -24.30218505859375, "global_step": 201439, "epoch": 2426} {"train_loss": -23.67419403719615, "global_step": 201440, "epoch": 2426, "val_loss": 6611183.0} {"train_loss": -23.853422164916992, "global_step": 201441, "epoch": 2427} {"train_loss": -24.39557456970215, "global_step": 201442, "epoch": 2427} {"train_loss": -23.624008178710938, "global_step": 201443, "epoch": 2427} {"train_loss": -23.931211471557617, "global_step": 201444, "epoch": 2427} {"train_loss": -23.892688751220703, "global_step": 201445, "epoch": 2427} {"train_loss": -23.963144302368164, "global_step": 201446, "epoch": 2427} {"train_loss": -24.101720809936523, "global_step": 201447, "epoch": 2427} {"train_loss": -24.01670265197754, "global_step": 201448, "epoch": 2427} {"train_loss": -23.991313934326172, "global_step": 201449, "epoch": 2427} {"train_loss": -23.961782455444336, "global_step": 201450, "epoch": 2427} {"train_loss": -24.220279693603516, "global_step": 201451, "epoch": 2427} {"train_loss": -24.148269653320312, "global_step": 201452, "epoch": 2427} {"train_loss": -24.617918014526367, "global_step": 201453, "epoch": 2427} {"train_loss": -24.124755859375, "global_step": 201454, "epoch": 2427} {"train_loss": -23.748960494995117, "global_step": 201455, "epoch": 2427} {"train_loss": -24.18984031677246, "global_step": 201456, "epoch": 2427} {"train_loss": -24.074594497680664, "global_step": 201457, "epoch": 2427} {"train_loss": -24.425687789916992, "global_step": 201458, "epoch": 2427} {"train_loss": -24.25543212890625, "global_step": 201459, "epoch": 2427} {"train_loss": -24.416431427001953, "global_step": 201460, "epoch": 2427} {"train_loss": -24.76679801940918, "global_step": 201461, "epoch": 2427} {"train_loss": -24.154701232910156, "global_step": 201462, "epoch": 2427} {"train_loss": -24.261322021484375, "global_step": 201463, "epoch": 2427} {"train_loss": -23.829885482788086, "global_step": 201464, "epoch": 2427} {"train_loss": -24.107011795043945, "global_step": 201465, "epoch": 2427} {"train_loss": -24.28521156311035, "global_step": 201466, "epoch": 2427} {"train_loss": -24.200836181640625, "global_step": 201467, "epoch": 2427} {"train_loss": -23.271564483642578, "global_step": 201468, "epoch": 2427} {"train_loss": -24.224950790405273, "global_step": 201469, "epoch": 2427} {"train_loss": -24.376693725585938, "global_step": 201470, "epoch": 2427} {"train_loss": -23.99177360534668, "global_step": 201471, "epoch": 2427} {"train_loss": -24.1258487701416, "global_step": 201472, "epoch": 2427} {"train_loss": -24.107746124267578, "global_step": 201473, "epoch": 2427} {"train_loss": -24.33498191833496, "global_step": 201474, "epoch": 2427} {"train_loss": -24.538326263427734, "global_step": 201475, "epoch": 2427} {"train_loss": -23.982568740844727, "global_step": 201476, "epoch": 2427} {"train_loss": -24.18581771850586, "global_step": 201477, "epoch": 2427} {"train_loss": -24.049131393432617, "global_step": 201478, "epoch": 2427} {"train_loss": -24.067365646362305, "global_step": 201479, "epoch": 2427} {"train_loss": -24.643497467041016, "global_step": 201480, "epoch": 2427} {"train_loss": -24.021780014038086, "global_step": 201481, "epoch": 2427} {"train_loss": -24.097761154174805, "global_step": 201482, "epoch": 2427} {"train_loss": -24.663135528564453, "global_step": 201483, "epoch": 2427} {"train_loss": -24.052438735961914, "global_step": 201484, "epoch": 2427} {"train_loss": -24.403438568115234, "global_step": 201485, "epoch": 2427} {"train_loss": -24.511568069458008, "global_step": 201486, "epoch": 2427} {"train_loss": -24.336027145385742, "global_step": 201487, "epoch": 2427} {"train_loss": -24.27129554748535, "global_step": 201488, "epoch": 2427} {"train_loss": -24.091955184936523, "global_step": 201489, "epoch": 2427} {"train_loss": -24.148944854736328, "global_step": 201490, "epoch": 2427} {"train_loss": -24.20935821533203, "global_step": 201491, "epoch": 2427} {"train_loss": -24.520105361938477, "global_step": 201492, "epoch": 2427} {"train_loss": -24.32274627685547, "global_step": 201493, "epoch": 2427} {"train_loss": -24.590970993041992, "global_step": 201494, "epoch": 2427} {"train_loss": -24.337236404418945, "global_step": 201495, "epoch": 2427} {"train_loss": -24.164688110351562, "global_step": 201496, "epoch": 2427} {"train_loss": -24.003585815429688, "global_step": 201497, "epoch": 2427} {"train_loss": -24.529417037963867, "global_step": 201498, "epoch": 2427} {"train_loss": -24.192535400390625, "global_step": 201499, "epoch": 2427} {"train_loss": -24.561059951782227, "global_step": 201500, "epoch": 2427} {"train_loss": -24.467710494995117, "global_step": 201501, "epoch": 2427} {"train_loss": -24.252182006835938, "global_step": 201502, "epoch": 2427} {"train_loss": -24.27200698852539, "global_step": 201503, "epoch": 2427} {"train_loss": -24.35344886779785, "global_step": 201504, "epoch": 2427} {"train_loss": -24.545122146606445, "global_step": 201505, "epoch": 2427} {"train_loss": -24.41326904296875, "global_step": 201506, "epoch": 2427} {"train_loss": -24.499591827392578, "global_step": 201507, "epoch": 2427} {"train_loss": -24.502910614013672, "global_step": 201508, "epoch": 2427} {"train_loss": -24.179189682006836, "global_step": 201509, "epoch": 2427} {"train_loss": -24.977828979492188, "global_step": 201510, "epoch": 2427} {"train_loss": -24.38678550720215, "global_step": 201511, "epoch": 2427} {"train_loss": -24.317678451538086, "global_step": 201512, "epoch": 2427} {"train_loss": -23.73235511779785, "global_step": 201513, "epoch": 2427} {"train_loss": -23.73957061767578, "global_step": 201514, "epoch": 2427} {"train_loss": -23.723947525024414, "global_step": 201515, "epoch": 2427} {"train_loss": -24.373056411743164, "global_step": 201516, "epoch": 2427} {"train_loss": -24.72608757019043, "global_step": 201517, "epoch": 2427} {"train_loss": -24.437238693237305, "global_step": 201518, "epoch": 2427} {"train_loss": -24.052919387817383, "global_step": 201519, "epoch": 2427} {"train_loss": -24.386178970336914, "global_step": 201520, "epoch": 2427} {"train_loss": -24.372364044189453, "global_step": 201521, "epoch": 2427} {"train_loss": -23.738628387451172, "global_step": 201522, "epoch": 2427} {"train_loss": -24.209468680692005, "global_step": 201523, "epoch": 2427, "val_loss": 6677343.0} {"train_loss": -24.234350204467773, "global_step": 201524, "epoch": 2428} {"train_loss": -24.196975708007812, "global_step": 201525, "epoch": 2428} {"train_loss": -23.90260124206543, "global_step": 201526, "epoch": 2428} {"train_loss": -24.041852951049805, "global_step": 201527, "epoch": 2428} {"train_loss": -23.974451065063477, "global_step": 201528, "epoch": 2428} {"train_loss": -24.218048095703125, "global_step": 201529, "epoch": 2428} {"train_loss": -24.256357192993164, "global_step": 201530, "epoch": 2428} {"train_loss": -23.9285945892334, "global_step": 201531, "epoch": 2428} {"train_loss": -24.44382667541504, "global_step": 201532, "epoch": 2428} {"train_loss": -23.821369171142578, "global_step": 201533, "epoch": 2428} {"train_loss": -23.78462791442871, "global_step": 201534, "epoch": 2428} {"train_loss": -24.461503982543945, "global_step": 201535, "epoch": 2428} {"train_loss": -23.8616943359375, "global_step": 201536, "epoch": 2428} {"train_loss": -24.24786376953125, "global_step": 201537, "epoch": 2428} {"train_loss": -24.525848388671875, "global_step": 201538, "epoch": 2428} {"train_loss": -24.326885223388672, "global_step": 201539, "epoch": 2428} {"train_loss": -24.39345359802246, "global_step": 201540, "epoch": 2428} {"train_loss": -24.489709854125977, "global_step": 201541, "epoch": 2428} {"train_loss": -24.066755294799805, "global_step": 201542, "epoch": 2428} {"train_loss": -24.14939308166504, "global_step": 201543, "epoch": 2428} {"train_loss": -23.957881927490234, "global_step": 201544, "epoch": 2428} {"train_loss": -24.5866641998291, "global_step": 201545, "epoch": 2428} {"train_loss": -24.381778717041016, "global_step": 201546, "epoch": 2428} {"train_loss": -24.55815887451172, "global_step": 201547, "epoch": 2428} {"train_loss": -24.629735946655273, "global_step": 201548, "epoch": 2428} {"train_loss": -24.51586151123047, "global_step": 201549, "epoch": 2428} {"train_loss": -24.44270133972168, "global_step": 201550, "epoch": 2428} {"train_loss": -23.937789916992188, "global_step": 201551, "epoch": 2428} {"train_loss": -24.15790367126465, "global_step": 201552, "epoch": 2428} {"train_loss": -24.388702392578125, "global_step": 201553, "epoch": 2428} {"train_loss": -23.82839012145996, "global_step": 201554, "epoch": 2428} {"train_loss": -24.586502075195312, "global_step": 201555, "epoch": 2428} {"train_loss": -24.322694778442383, "global_step": 201556, "epoch": 2428} {"train_loss": -23.551794052124023, "global_step": 201557, "epoch": 2428} {"train_loss": -24.42585563659668, "global_step": 201558, "epoch": 2428} {"train_loss": -24.07571792602539, "global_step": 201559, "epoch": 2428} {"train_loss": -24.216644287109375, "global_step": 201560, "epoch": 2428} {"train_loss": -23.928224563598633, "global_step": 201561, "epoch": 2428} {"train_loss": -24.060773849487305, "global_step": 201562, "epoch": 2428} {"train_loss": -24.3250732421875, "global_step": 201563, "epoch": 2428} {"train_loss": -24.117904663085938, "global_step": 201564, "epoch": 2428} {"train_loss": -24.295795440673828, "global_step": 201565, "epoch": 2428} {"train_loss": -24.151338577270508, "global_step": 201566, "epoch": 2428} {"train_loss": -24.667285919189453, "global_step": 201567, "epoch": 2428} {"train_loss": -24.059568405151367, "global_step": 201568, "epoch": 2428} {"train_loss": -24.362905502319336, "global_step": 201569, "epoch": 2428} {"train_loss": -24.593740463256836, "global_step": 201570, "epoch": 2428} {"train_loss": -24.472116470336914, "global_step": 201571, "epoch": 2428} {"train_loss": -24.57089614868164, "global_step": 201572, "epoch": 2428} {"train_loss": -23.9644718170166, "global_step": 201573, "epoch": 2428} {"train_loss": -24.12793731689453, "global_step": 201574, "epoch": 2428} {"train_loss": -24.48151397705078, "global_step": 201575, "epoch": 2428} {"train_loss": -24.839460372924805, "global_step": 201576, "epoch": 2428} {"train_loss": -24.126083374023438, "global_step": 201577, "epoch": 2428} {"train_loss": -24.464529037475586, "global_step": 201578, "epoch": 2428} {"train_loss": -24.261844635009766, "global_step": 201579, "epoch": 2428} {"train_loss": -24.35959243774414, "global_step": 201580, "epoch": 2428} {"train_loss": -24.113994598388672, "global_step": 201581, "epoch": 2428} {"train_loss": -24.54094696044922, "global_step": 201582, "epoch": 2428} {"train_loss": -24.5476016998291, "global_step": 201583, "epoch": 2428} {"train_loss": -24.657583236694336, "global_step": 201584, "epoch": 2428} {"train_loss": -24.468019485473633, "global_step": 201585, "epoch": 2428} {"train_loss": -24.546979904174805, "global_step": 201586, "epoch": 2428} {"train_loss": -24.013776779174805, "global_step": 201587, "epoch": 2428} {"train_loss": -24.147462844848633, "global_step": 201588, "epoch": 2428} {"train_loss": -24.4534854888916, "global_step": 201589, "epoch": 2428} {"train_loss": -23.963035583496094, "global_step": 201590, "epoch": 2428} {"train_loss": -24.35956382751465, "global_step": 201591, "epoch": 2428} {"train_loss": -24.332067489624023, "global_step": 201592, "epoch": 2428} {"train_loss": -24.230083465576172, "global_step": 201593, "epoch": 2428} {"train_loss": -24.314573287963867, "global_step": 201594, "epoch": 2428} {"train_loss": -23.75978660583496, "global_step": 201595, "epoch": 2428} {"train_loss": -23.926767349243164, "global_step": 201596, "epoch": 2428} {"train_loss": -24.326126098632812, "global_step": 201597, "epoch": 2428} {"train_loss": -24.249122619628906, "global_step": 201598, "epoch": 2428} {"train_loss": -24.179916381835938, "global_step": 201599, "epoch": 2428} {"train_loss": -24.184804916381836, "global_step": 201600, "epoch": 2428} {"train_loss": -24.41276741027832, "global_step": 201601, "epoch": 2428} {"train_loss": -24.352407455444336, "global_step": 201602, "epoch": 2428} {"train_loss": -24.59956169128418, "global_step": 201603, "epoch": 2428} {"train_loss": -24.207365036010742, "global_step": 201604, "epoch": 2428} {"train_loss": -24.249143600463867, "global_step": 201605, "epoch": 2428} {"train_loss": -24.27839554936053, "global_step": 201606, "epoch": 2428, "val_loss": 6541077.5} {"train_loss": -23.540334701538086, "global_step": 201607, "epoch": 2429} {"train_loss": -23.51067543029785, "global_step": 201608, "epoch": 2429} {"train_loss": -24.184797286987305, "global_step": 201609, "epoch": 2429} {"train_loss": -23.65670394897461, "global_step": 201610, "epoch": 2429} {"train_loss": -23.935373306274414, "global_step": 201611, "epoch": 2429} {"train_loss": -24.020627975463867, "global_step": 201612, "epoch": 2429} {"train_loss": -23.95064926147461, "global_step": 201613, "epoch": 2429} {"train_loss": -23.90883445739746, "global_step": 201614, "epoch": 2429} {"train_loss": -24.171178817749023, "global_step": 201615, "epoch": 2429} {"train_loss": -24.037357330322266, "global_step": 201616, "epoch": 2429} {"train_loss": -24.4245662689209, "global_step": 201617, "epoch": 2429} {"train_loss": -23.634065628051758, "global_step": 201618, "epoch": 2429} {"train_loss": -24.174821853637695, "global_step": 201619, "epoch": 2429} {"train_loss": -24.1058349609375, "global_step": 201620, "epoch": 2429} {"train_loss": -24.176115036010742, "global_step": 201621, "epoch": 2429} {"train_loss": -24.075895309448242, "global_step": 201622, "epoch": 2429} {"train_loss": -24.287826538085938, "global_step": 201623, "epoch": 2429} {"train_loss": -24.14318084716797, "global_step": 201624, "epoch": 2429} {"train_loss": -24.271961212158203, "global_step": 201625, "epoch": 2429} {"train_loss": -24.07801055908203, "global_step": 201626, "epoch": 2429} {"train_loss": -24.0097713470459, "global_step": 201627, "epoch": 2429} {"train_loss": -24.3006591796875, "global_step": 201628, "epoch": 2429} {"train_loss": -24.05413246154785, "global_step": 201629, "epoch": 2429} {"train_loss": -24.534475326538086, "global_step": 201630, "epoch": 2429} {"train_loss": -24.57303810119629, "global_step": 201631, "epoch": 2429} {"train_loss": -24.366971969604492, "global_step": 201632, "epoch": 2429} {"train_loss": -24.134855270385742, "global_step": 201633, "epoch": 2429} {"train_loss": -24.535991668701172, "global_step": 201634, "epoch": 2429} {"train_loss": -24.395769119262695, "global_step": 201635, "epoch": 2429} {"train_loss": -24.86676025390625, "global_step": 201636, "epoch": 2429} {"train_loss": -24.02882957458496, "global_step": 201637, "epoch": 2429} {"train_loss": -24.48729705810547, "global_step": 201638, "epoch": 2429} {"train_loss": -24.307004928588867, "global_step": 201639, "epoch": 2429} {"train_loss": -24.042577743530273, "global_step": 201640, "epoch": 2429} {"train_loss": -24.099225997924805, "global_step": 201641, "epoch": 2429} {"train_loss": -24.202573776245117, "global_step": 201642, "epoch": 2429} {"train_loss": -24.01434326171875, "global_step": 201643, "epoch": 2429} {"train_loss": -24.45941734313965, "global_step": 201644, "epoch": 2429} {"train_loss": -24.406843185424805, "global_step": 201645, "epoch": 2429} {"train_loss": -24.384246826171875, "global_step": 201646, "epoch": 2429} {"train_loss": -24.497106552124023, "global_step": 201647, "epoch": 2429} {"train_loss": -24.23813819885254, "global_step": 201648, "epoch": 2429} {"train_loss": -24.44317626953125, "global_step": 201649, "epoch": 2429} {"train_loss": -24.073087692260742, "global_step": 201650, "epoch": 2429} {"train_loss": -23.993488311767578, "global_step": 201651, "epoch": 2429} {"train_loss": -24.67205238342285, "global_step": 201652, "epoch": 2429} {"train_loss": -24.58887481689453, "global_step": 201653, "epoch": 2429} {"train_loss": -24.069076538085938, "global_step": 201654, "epoch": 2429} {"train_loss": -24.0966854095459, "global_step": 201655, "epoch": 2429} {"train_loss": -24.528417587280273, "global_step": 201656, "epoch": 2429} {"train_loss": -23.854999542236328, "global_step": 201657, "epoch": 2429} {"train_loss": -24.462182998657227, "global_step": 201658, "epoch": 2429} {"train_loss": -24.386510848999023, "global_step": 201659, "epoch": 2429} {"train_loss": -24.127399444580078, "global_step": 201660, "epoch": 2429} {"train_loss": -24.251245498657227, "global_step": 201661, "epoch": 2429} {"train_loss": -24.00016975402832, "global_step": 201662, "epoch": 2429} {"train_loss": -24.078685760498047, "global_step": 201663, "epoch": 2429} {"train_loss": -24.405929565429688, "global_step": 201664, "epoch": 2429} {"train_loss": -24.25876235961914, "global_step": 201665, "epoch": 2429} {"train_loss": -24.319395065307617, "global_step": 201666, "epoch": 2429} {"train_loss": -23.89545249938965, "global_step": 201667, "epoch": 2429} {"train_loss": -24.30963706970215, "global_step": 201668, "epoch": 2429} {"train_loss": -24.22464942932129, "global_step": 201669, "epoch": 2429} {"train_loss": -24.394575119018555, "global_step": 201670, "epoch": 2429} {"train_loss": -24.096210479736328, "global_step": 201671, "epoch": 2429} {"train_loss": -24.155231475830078, "global_step": 201672, "epoch": 2429} {"train_loss": -23.9464111328125, "global_step": 201673, "epoch": 2429} {"train_loss": -24.13054847717285, "global_step": 201674, "epoch": 2429} {"train_loss": -24.335111618041992, "global_step": 201675, "epoch": 2429} {"train_loss": -24.31690788269043, "global_step": 201676, "epoch": 2429} {"train_loss": -24.186908721923828, "global_step": 201677, "epoch": 2429} {"train_loss": -24.07859230041504, "global_step": 201678, "epoch": 2429} {"train_loss": -24.56243896484375, "global_step": 201679, "epoch": 2429} {"train_loss": -24.046016693115234, "global_step": 201680, "epoch": 2429} {"train_loss": -24.477127075195312, "global_step": 201681, "epoch": 2429} {"train_loss": -23.964651107788086, "global_step": 201682, "epoch": 2429} {"train_loss": -24.360502243041992, "global_step": 201683, "epoch": 2429} {"train_loss": -24.014286041259766, "global_step": 201684, "epoch": 2429} {"train_loss": -24.371185302734375, "global_step": 201685, "epoch": 2429} {"train_loss": -23.938888549804688, "global_step": 201686, "epoch": 2429} {"train_loss": -24.30422019958496, "global_step": 201687, "epoch": 2429} {"train_loss": -24.089391708374023, "global_step": 201688, "epoch": 2429} {"train_loss": -24.184339776096575, "global_step": 201689, "epoch": 2429, "val_loss": 6647664.0} {"train_loss": -24.054407119750977, "global_step": 201690, "epoch": 2430} {"train_loss": -24.483091354370117, "global_step": 201691, "epoch": 2430} {"train_loss": -24.429180145263672, "global_step": 201692, "epoch": 2430} {"train_loss": -24.45575523376465, "global_step": 201693, "epoch": 2430} {"train_loss": -24.374807357788086, "global_step": 201694, "epoch": 2430} {"train_loss": -24.260549545288086, "global_step": 201695, "epoch": 2430} {"train_loss": -24.02583885192871, "global_step": 201696, "epoch": 2430} {"train_loss": -23.956979751586914, "global_step": 201697, "epoch": 2430} {"train_loss": -24.06197166442871, "global_step": 201698, "epoch": 2430} {"train_loss": -24.526784896850586, "global_step": 201699, "epoch": 2430} {"train_loss": -24.299419403076172, "global_step": 201700, "epoch": 2430} {"train_loss": -24.23158836364746, "global_step": 201701, "epoch": 2430} {"train_loss": -24.352054595947266, "global_step": 201702, "epoch": 2430} {"train_loss": -24.291852951049805, "global_step": 201703, "epoch": 2430} {"train_loss": -24.328123092651367, "global_step": 201704, "epoch": 2430} {"train_loss": -24.80194664001465, "global_step": 201705, "epoch": 2430} {"train_loss": -24.097187042236328, "global_step": 201706, "epoch": 2430} {"train_loss": -24.320449829101562, "global_step": 201707, "epoch": 2430} {"train_loss": -24.0620059967041, "global_step": 201708, "epoch": 2430} {"train_loss": -24.078916549682617, "global_step": 201709, "epoch": 2430} {"train_loss": -24.291433334350586, "global_step": 201710, "epoch": 2430} {"train_loss": -24.482511520385742, "global_step": 201711, "epoch": 2430} {"train_loss": -24.27802085876465, "global_step": 201712, "epoch": 2430} {"train_loss": -23.82037925720215, "global_step": 201713, "epoch": 2430} {"train_loss": -24.84429931640625, "global_step": 201714, "epoch": 2430} {"train_loss": -24.4014949798584, "global_step": 201715, "epoch": 2430} {"train_loss": -24.181440353393555, "global_step": 201716, "epoch": 2430} {"train_loss": -23.886051177978516, "global_step": 201717, "epoch": 2430} {"train_loss": -24.31831932067871, "global_step": 201718, "epoch": 2430} {"train_loss": -24.198171615600586, "global_step": 201719, "epoch": 2430} {"train_loss": -23.817514419555664, "global_step": 201720, "epoch": 2430} {"train_loss": -24.538692474365234, "global_step": 201721, "epoch": 2430} {"train_loss": -23.851898193359375, "global_step": 201722, "epoch": 2430} {"train_loss": -24.36124610900879, "global_step": 201723, "epoch": 2430} {"train_loss": -24.468278884887695, "global_step": 201724, "epoch": 2430} {"train_loss": -24.16673469543457, "global_step": 201725, "epoch": 2430} {"train_loss": -24.355344772338867, "global_step": 201726, "epoch": 2430} {"train_loss": -24.18964958190918, "global_step": 201727, "epoch": 2430} {"train_loss": -24.708845138549805, "global_step": 201728, "epoch": 2430} {"train_loss": -24.454389572143555, "global_step": 201729, "epoch": 2430} {"train_loss": -24.219562530517578, "global_step": 201730, "epoch": 2430} {"train_loss": -24.505638122558594, "global_step": 201731, "epoch": 2430} {"train_loss": -24.55325698852539, "global_step": 201732, "epoch": 2430} {"train_loss": -24.03853416442871, "global_step": 201733, "epoch": 2430} {"train_loss": -24.575885772705078, "global_step": 201734, "epoch": 2430} {"train_loss": -24.243770599365234, "global_step": 201735, "epoch": 2430} {"train_loss": -24.43661117553711, "global_step": 201736, "epoch": 2430} {"train_loss": -24.389545440673828, "global_step": 201737, "epoch": 2430} {"train_loss": -24.12135124206543, "global_step": 201738, "epoch": 2430} {"train_loss": -24.161134719848633, "global_step": 201739, "epoch": 2430} {"train_loss": -24.27798843383789, "global_step": 201740, "epoch": 2430} {"train_loss": -24.71478271484375, "global_step": 201741, "epoch": 2430} {"train_loss": -24.347578048706055, "global_step": 201742, "epoch": 2430} {"train_loss": -24.16487693786621, "global_step": 201743, "epoch": 2430} {"train_loss": -24.594032287597656, "global_step": 201744, "epoch": 2430} {"train_loss": -24.54829978942871, "global_step": 201745, "epoch": 2430} {"train_loss": -24.116653442382812, "global_step": 201746, "epoch": 2430} {"train_loss": -24.528995513916016, "global_step": 201747, "epoch": 2430} {"train_loss": -24.611547470092773, "global_step": 201748, "epoch": 2430} {"train_loss": -24.121013641357422, "global_step": 201749, "epoch": 2430} {"train_loss": -24.28217124938965, "global_step": 201750, "epoch": 2430} {"train_loss": -24.122236251831055, "global_step": 201751, "epoch": 2430} {"train_loss": -23.965240478515625, "global_step": 201752, "epoch": 2430} {"train_loss": -23.378108978271484, "global_step": 201753, "epoch": 2430} {"train_loss": -23.458444595336914, "global_step": 201754, "epoch": 2430} {"train_loss": -24.3732967376709, "global_step": 201755, "epoch": 2430} {"train_loss": -24.04783058166504, "global_step": 201756, "epoch": 2430} {"train_loss": -24.06695556640625, "global_step": 201757, "epoch": 2430} {"train_loss": -23.98096466064453, "global_step": 201758, "epoch": 2430} {"train_loss": -23.942157745361328, "global_step": 201759, "epoch": 2430} {"train_loss": -24.64377212524414, "global_step": 201760, "epoch": 2430} {"train_loss": -23.924997329711914, "global_step": 201761, "epoch": 2430} {"train_loss": -24.223552703857422, "global_step": 201762, "epoch": 2430} {"train_loss": -24.37123680114746, "global_step": 201763, "epoch": 2430} {"train_loss": -24.47124671936035, "global_step": 201764, "epoch": 2430} {"train_loss": -24.185606002807617, "global_step": 201765, "epoch": 2430} {"train_loss": -24.427310943603516, "global_step": 201766, "epoch": 2430} {"train_loss": -24.074710845947266, "global_step": 201767, "epoch": 2430} {"train_loss": -24.142925262451172, "global_step": 201768, "epoch": 2430} {"train_loss": -24.157228469848633, "global_step": 201769, "epoch": 2430} {"train_loss": -24.00032615661621, "global_step": 201770, "epoch": 2430} {"train_loss": -24.221757888793945, "global_step": 201771, "epoch": 2430} {"train_loss": -24.26127298194242, "global_step": 201772, "epoch": 2430, "val_loss": 6386270.5} {"train_loss": -24.032611846923828, "global_step": 201773, "epoch": 2431} {"train_loss": -23.927900314331055, "global_step": 201774, "epoch": 2431} {"train_loss": -24.027828216552734, "global_step": 201775, "epoch": 2431} {"train_loss": -24.07429313659668, "global_step": 201776, "epoch": 2431} {"train_loss": -24.071941375732422, "global_step": 201777, "epoch": 2431} {"train_loss": -24.116743087768555, "global_step": 201778, "epoch": 2431} {"train_loss": -24.136112213134766, "global_step": 201779, "epoch": 2431} {"train_loss": -24.003326416015625, "global_step": 201780, "epoch": 2431} {"train_loss": -24.401737213134766, "global_step": 201781, "epoch": 2431} {"train_loss": -24.2454891204834, "global_step": 201782, "epoch": 2431} {"train_loss": -24.20857810974121, "global_step": 201783, "epoch": 2431} {"train_loss": -24.278013229370117, "global_step": 201784, "epoch": 2431} {"train_loss": -23.9553165435791, "global_step": 201785, "epoch": 2431} {"train_loss": -24.36927604675293, "global_step": 201786, "epoch": 2431} {"train_loss": -24.741506576538086, "global_step": 201787, "epoch": 2431} {"train_loss": -24.01270866394043, "global_step": 201788, "epoch": 2431} {"train_loss": -24.53046226501465, "global_step": 201789, "epoch": 2431} {"train_loss": -24.629901885986328, "global_step": 201790, "epoch": 2431} {"train_loss": -24.541296005249023, "global_step": 201791, "epoch": 2431} {"train_loss": -24.168041229248047, "global_step": 201792, "epoch": 2431} {"train_loss": -24.369672775268555, "global_step": 201793, "epoch": 2431} {"train_loss": -24.21959686279297, "global_step": 201794, "epoch": 2431} {"train_loss": -24.46700096130371, "global_step": 201795, "epoch": 2431} {"train_loss": -24.6273136138916, "global_step": 201796, "epoch": 2431} {"train_loss": -24.080673217773438, "global_step": 201797, "epoch": 2431} {"train_loss": -24.501737594604492, "global_step": 201798, "epoch": 2431} {"train_loss": -24.085620880126953, "global_step": 201799, "epoch": 2431} {"train_loss": -24.39887046813965, "global_step": 201800, "epoch": 2431} {"train_loss": -24.411720275878906, "global_step": 201801, "epoch": 2431} {"train_loss": -24.422348022460938, "global_step": 201802, "epoch": 2431} {"train_loss": -24.57718276977539, "global_step": 201803, "epoch": 2431} {"train_loss": -24.4213924407959, "global_step": 201804, "epoch": 2431} {"train_loss": -24.214859008789062, "global_step": 201805, "epoch": 2431} {"train_loss": -24.50994110107422, "global_step": 201806, "epoch": 2431} {"train_loss": -24.341005325317383, "global_step": 201807, "epoch": 2431} {"train_loss": -24.19767951965332, "global_step": 201808, "epoch": 2431} {"train_loss": -24.110624313354492, "global_step": 201809, "epoch": 2431} {"train_loss": -23.94378662109375, "global_step": 201810, "epoch": 2431} {"train_loss": -24.636377334594727, "global_step": 201811, "epoch": 2431} {"train_loss": -24.392765045166016, "global_step": 201812, "epoch": 2431} {"train_loss": -24.450489044189453, "global_step": 201813, "epoch": 2431} {"train_loss": -24.209718704223633, "global_step": 201814, "epoch": 2431} {"train_loss": -23.761377334594727, "global_step": 201815, "epoch": 2431} {"train_loss": -24.29166030883789, "global_step": 201816, "epoch": 2431} {"train_loss": -24.298620223999023, "global_step": 201817, "epoch": 2431} {"train_loss": -24.338953018188477, "global_step": 201818, "epoch": 2431} {"train_loss": -24.38313865661621, "global_step": 201819, "epoch": 2431} {"train_loss": -24.02326774597168, "global_step": 201820, "epoch": 2431} {"train_loss": -24.286300659179688, "global_step": 201821, "epoch": 2431} {"train_loss": -24.283506393432617, "global_step": 201822, "epoch": 2431} {"train_loss": -24.280838012695312, "global_step": 201823, "epoch": 2431} {"train_loss": -24.3551025390625, "global_step": 201824, "epoch": 2431} {"train_loss": -24.262319564819336, "global_step": 201825, "epoch": 2431} {"train_loss": -24.155134201049805, "global_step": 201826, "epoch": 2431} {"train_loss": -23.88538932800293, "global_step": 201827, "epoch": 2431} {"train_loss": -23.993898391723633, "global_step": 201828, "epoch": 2431} {"train_loss": -24.37606430053711, "global_step": 201829, "epoch": 2431} {"train_loss": -23.93332290649414, "global_step": 201830, "epoch": 2431} {"train_loss": -23.93806266784668, "global_step": 201831, "epoch": 2431} {"train_loss": -24.025022506713867, "global_step": 201832, "epoch": 2431} {"train_loss": -24.05586051940918, "global_step": 201833, "epoch": 2431} {"train_loss": -24.070161819458008, "global_step": 201834, "epoch": 2431} {"train_loss": -23.71634864807129, "global_step": 201835, "epoch": 2431} {"train_loss": -24.236501693725586, "global_step": 201836, "epoch": 2431} {"train_loss": -24.021224975585938, "global_step": 201837, "epoch": 2431} {"train_loss": -24.11537742614746, "global_step": 201838, "epoch": 2431} {"train_loss": -24.206205368041992, "global_step": 201839, "epoch": 2431} {"train_loss": -24.320863723754883, "global_step": 201840, "epoch": 2431} {"train_loss": -24.173242568969727, "global_step": 201841, "epoch": 2431} {"train_loss": -24.195968627929688, "global_step": 201842, "epoch": 2431} {"train_loss": -24.290164947509766, "global_step": 201843, "epoch": 2431} {"train_loss": -23.909093856811523, "global_step": 201844, "epoch": 2431} {"train_loss": -24.714324951171875, "global_step": 201845, "epoch": 2431} {"train_loss": -24.048139572143555, "global_step": 201846, "epoch": 2431} {"train_loss": -24.524621963500977, "global_step": 201847, "epoch": 2431} {"train_loss": -24.2745361328125, "global_step": 201848, "epoch": 2431} {"train_loss": -24.452573776245117, "global_step": 201849, "epoch": 2431} {"train_loss": -24.471860885620117, "global_step": 201850, "epoch": 2431} {"train_loss": -23.963211059570312, "global_step": 201851, "epoch": 2431} {"train_loss": -24.308914184570312, "global_step": 201852, "epoch": 2431} {"train_loss": -24.024120330810547, "global_step": 201853, "epoch": 2431} {"train_loss": -24.369592666625977, "global_step": 201854, "epoch": 2431} {"train_loss": -24.2517153039036, "global_step": 201855, "epoch": 2431, "val_loss": 6516823.0} {"train_loss": -23.537044525146484, "global_step": 201856, "epoch": 2432} {"train_loss": -23.81546974182129, "global_step": 201857, "epoch": 2432} {"train_loss": -23.10709571838379, "global_step": 201858, "epoch": 2432} {"train_loss": -23.848966598510742, "global_step": 201859, "epoch": 2432} {"train_loss": -23.75823402404785, "global_step": 201860, "epoch": 2432} {"train_loss": -23.335620880126953, "global_step": 201861, "epoch": 2432} {"train_loss": -23.935287475585938, "global_step": 201862, "epoch": 2432} {"train_loss": -23.683080673217773, "global_step": 201863, "epoch": 2432} {"train_loss": -23.912309646606445, "global_step": 201864, "epoch": 2432} {"train_loss": -23.91419792175293, "global_step": 201865, "epoch": 2432} {"train_loss": -23.999149322509766, "global_step": 201866, "epoch": 2432} {"train_loss": -23.68467903137207, "global_step": 201867, "epoch": 2432} {"train_loss": -23.929655075073242, "global_step": 201868, "epoch": 2432} {"train_loss": -23.920656204223633, "global_step": 201869, "epoch": 2432} {"train_loss": -24.1376895904541, "global_step": 201870, "epoch": 2432} {"train_loss": -24.170024871826172, "global_step": 201871, "epoch": 2432} {"train_loss": -24.282485961914062, "global_step": 201872, "epoch": 2432} {"train_loss": -24.100902557373047, "global_step": 201873, "epoch": 2432} {"train_loss": -23.859107971191406, "global_step": 201874, "epoch": 2432} {"train_loss": -24.312131881713867, "global_step": 201875, "epoch": 2432} {"train_loss": -24.215930938720703, "global_step": 201876, "epoch": 2432} {"train_loss": -23.893199920654297, "global_step": 201877, "epoch": 2432} {"train_loss": -24.34644889831543, "global_step": 201878, "epoch": 2432} {"train_loss": -24.495431900024414, "global_step": 201879, "epoch": 2432} {"train_loss": -24.300046920776367, "global_step": 201880, "epoch": 2432} {"train_loss": -24.174659729003906, "global_step": 201881, "epoch": 2432} {"train_loss": -24.093671798706055, "global_step": 201882, "epoch": 2432} {"train_loss": -24.626953125, "global_step": 201883, "epoch": 2432} {"train_loss": -24.350942611694336, "global_step": 201884, "epoch": 2432} {"train_loss": -24.428510665893555, "global_step": 201885, "epoch": 2432} {"train_loss": -24.28632354736328, "global_step": 201886, "epoch": 2432} {"train_loss": -24.263626098632812, "global_step": 201887, "epoch": 2432} {"train_loss": -24.342782974243164, "global_step": 201888, "epoch": 2432} {"train_loss": -24.3862247467041, "global_step": 201889, "epoch": 2432} {"train_loss": -24.531492233276367, "global_step": 201890, "epoch": 2432} {"train_loss": -24.288747787475586, "global_step": 201891, "epoch": 2432} {"train_loss": -24.426361083984375, "global_step": 201892, "epoch": 2432} {"train_loss": -24.620052337646484, "global_step": 201893, "epoch": 2432} {"train_loss": -24.109806060791016, "global_step": 201894, "epoch": 2432} {"train_loss": -24.134647369384766, "global_step": 201895, "epoch": 2432} {"train_loss": -24.520742416381836, "global_step": 201896, "epoch": 2432} {"train_loss": -24.427106857299805, "global_step": 201897, "epoch": 2432} {"train_loss": -24.576868057250977, "global_step": 201898, "epoch": 2432} {"train_loss": -24.510175704956055, "global_step": 201899, "epoch": 2432} {"train_loss": -24.855009078979492, "global_step": 201900, "epoch": 2432} {"train_loss": -24.502225875854492, "global_step": 201901, "epoch": 2432} {"train_loss": -24.568571090698242, "global_step": 201902, "epoch": 2432} {"train_loss": -24.375276565551758, "global_step": 201903, "epoch": 2432} {"train_loss": -24.385116577148438, "global_step": 201904, "epoch": 2432} {"train_loss": -24.17984390258789, "global_step": 201905, "epoch": 2432} {"train_loss": -24.365150451660156, "global_step": 201906, "epoch": 2432} {"train_loss": -24.47970962524414, "global_step": 201907, "epoch": 2432} {"train_loss": -24.396259307861328, "global_step": 201908, "epoch": 2432} {"train_loss": -24.288177490234375, "global_step": 201909, "epoch": 2432} {"train_loss": -24.255931854248047, "global_step": 201910, "epoch": 2432} {"train_loss": -24.31354331970215, "global_step": 201911, "epoch": 2432} {"train_loss": -24.497276306152344, "global_step": 201912, "epoch": 2432} {"train_loss": -24.229808807373047, "global_step": 201913, "epoch": 2432} {"train_loss": -24.3400936126709, "global_step": 201914, "epoch": 2432} {"train_loss": -24.508344650268555, "global_step": 201915, "epoch": 2432} {"train_loss": -24.663284301757812, "global_step": 201916, "epoch": 2432} {"train_loss": -24.39702033996582, "global_step": 201917, "epoch": 2432} {"train_loss": -24.38678550720215, "global_step": 201918, "epoch": 2432} {"train_loss": -24.2589168548584, "global_step": 201919, "epoch": 2432} {"train_loss": -24.768980026245117, "global_step": 201920, "epoch": 2432} {"train_loss": -24.489206314086914, "global_step": 201921, "epoch": 2432} {"train_loss": -24.588939666748047, "global_step": 201922, "epoch": 2432} {"train_loss": -24.217313766479492, "global_step": 201923, "epoch": 2432} {"train_loss": -24.45697593688965, "global_step": 201924, "epoch": 2432} {"train_loss": -24.251697540283203, "global_step": 201925, "epoch": 2432} {"train_loss": -23.845932006835938, "global_step": 201926, "epoch": 2432} {"train_loss": -24.326675415039062, "global_step": 201927, "epoch": 2432} {"train_loss": -24.39398193359375, "global_step": 201928, "epoch": 2432} {"train_loss": -24.332561492919922, "global_step": 201929, "epoch": 2432} {"train_loss": -24.6046142578125, "global_step": 201930, "epoch": 2432} {"train_loss": -24.16303062438965, "global_step": 201931, "epoch": 2432} {"train_loss": -24.0754337310791, "global_step": 201932, "epoch": 2432} {"train_loss": -24.088254928588867, "global_step": 201933, "epoch": 2432} {"train_loss": -24.72795295715332, "global_step": 201934, "epoch": 2432} {"train_loss": -24.0706787109375, "global_step": 201935, "epoch": 2432} {"train_loss": -23.94829750061035, "global_step": 201936, "epoch": 2432} {"train_loss": -24.04018211364746, "global_step": 201937, "epoch": 2432} {"train_loss": -24.235261664333112, "global_step": 201938, "epoch": 2432, "val_loss": 6716102.0} {"train_loss": -23.50270652770996, "global_step": 201939, "epoch": 2433} {"train_loss": -23.335235595703125, "global_step": 201940, "epoch": 2433} {"train_loss": -23.590850830078125, "global_step": 201941, "epoch": 2433} {"train_loss": -24.188812255859375, "global_step": 201942, "epoch": 2433} {"train_loss": -23.620519638061523, "global_step": 201943, "epoch": 2433} {"train_loss": -23.86167335510254, "global_step": 201944, "epoch": 2433} {"train_loss": -23.787490844726562, "global_step": 201945, "epoch": 2433} {"train_loss": -24.014923095703125, "global_step": 201946, "epoch": 2433} {"train_loss": -23.705350875854492, "global_step": 201947, "epoch": 2433} {"train_loss": -23.858469009399414, "global_step": 201948, "epoch": 2433} {"train_loss": -23.791339874267578, "global_step": 201949, "epoch": 2433} {"train_loss": -24.011728286743164, "global_step": 201950, "epoch": 2433} {"train_loss": -23.642227172851562, "global_step": 201951, "epoch": 2433} {"train_loss": -23.868146896362305, "global_step": 201952, "epoch": 2433} {"train_loss": -23.901254653930664, "global_step": 201953, "epoch": 2433} {"train_loss": -24.17279052734375, "global_step": 201954, "epoch": 2433} {"train_loss": -23.96693992614746, "global_step": 201955, "epoch": 2433} {"train_loss": -23.804462432861328, "global_step": 201956, "epoch": 2433} {"train_loss": -24.015419006347656, "global_step": 201957, "epoch": 2433} {"train_loss": -24.31369972229004, "global_step": 201958, "epoch": 2433} {"train_loss": -23.94681739807129, "global_step": 201959, "epoch": 2433} {"train_loss": -24.339370727539062, "global_step": 201960, "epoch": 2433} {"train_loss": -24.11970329284668, "global_step": 201961, "epoch": 2433} {"train_loss": -24.297164916992188, "global_step": 201962, "epoch": 2433} {"train_loss": -23.978395462036133, "global_step": 201963, "epoch": 2433} {"train_loss": -24.373332977294922, "global_step": 201964, "epoch": 2433} {"train_loss": -24.6149845123291, "global_step": 201965, "epoch": 2433} {"train_loss": -24.013656616210938, "global_step": 201966, "epoch": 2433} {"train_loss": -24.78388786315918, "global_step": 201967, "epoch": 2433} {"train_loss": -23.754322052001953, "global_step": 201968, "epoch": 2433} {"train_loss": -24.18825340270996, "global_step": 201969, "epoch": 2433} {"train_loss": -24.429868698120117, "global_step": 201970, "epoch": 2433} {"train_loss": -23.924728393554688, "global_step": 201971, "epoch": 2433} {"train_loss": -24.095638275146484, "global_step": 201972, "epoch": 2433} {"train_loss": -24.228673934936523, "global_step": 201973, "epoch": 2433} {"train_loss": -24.24527931213379, "global_step": 201974, "epoch": 2433} {"train_loss": -24.01259422302246, "global_step": 201975, "epoch": 2433} {"train_loss": -24.39992332458496, "global_step": 201976, "epoch": 2433} {"train_loss": -24.476516723632812, "global_step": 201977, "epoch": 2433} {"train_loss": -24.320659637451172, "global_step": 201978, "epoch": 2433} {"train_loss": -24.236867904663086, "global_step": 201979, "epoch": 2433} {"train_loss": -24.68121910095215, "global_step": 201980, "epoch": 2433} {"train_loss": -24.783859252929688, "global_step": 201981, "epoch": 2433} {"train_loss": -24.124784469604492, "global_step": 201982, "epoch": 2433} {"train_loss": -24.526962280273438, "global_step": 201983, "epoch": 2433} {"train_loss": -24.33930015563965, "global_step": 201984, "epoch": 2433} {"train_loss": -24.42837142944336, "global_step": 201985, "epoch": 2433} {"train_loss": -24.236373901367188, "global_step": 201986, "epoch": 2433} {"train_loss": -24.143718719482422, "global_step": 201987, "epoch": 2433} {"train_loss": -23.815458297729492, "global_step": 201988, "epoch": 2433} {"train_loss": -23.851871490478516, "global_step": 201989, "epoch": 2433} {"train_loss": -24.306564331054688, "global_step": 201990, "epoch": 2433} {"train_loss": -24.54775047302246, "global_step": 201991, "epoch": 2433} {"train_loss": -24.212308883666992, "global_step": 201992, "epoch": 2433} {"train_loss": -24.327791213989258, "global_step": 201993, "epoch": 2433} {"train_loss": -24.31496810913086, "global_step": 201994, "epoch": 2433} {"train_loss": -24.21678352355957, "global_step": 201995, "epoch": 2433} {"train_loss": -24.528594970703125, "global_step": 201996, "epoch": 2433} {"train_loss": -24.218730926513672, "global_step": 201997, "epoch": 2433} {"train_loss": -24.228933334350586, "global_step": 201998, "epoch": 2433} {"train_loss": -24.055883407592773, "global_step": 201999, "epoch": 2433} {"train_loss": -24.238901138305664, "global_step": 202000, "epoch": 2433} {"train_loss": -24.393529891967773, "global_step": 202001, "epoch": 2433} {"train_loss": -24.47835350036621, "global_step": 202002, "epoch": 2433} {"train_loss": -24.28802490234375, "global_step": 202003, "epoch": 2433} {"train_loss": -24.499006271362305, "global_step": 202004, "epoch": 2433} {"train_loss": -24.221176147460938, "global_step": 202005, "epoch": 2433} {"train_loss": -24.443458557128906, "global_step": 202006, "epoch": 2433} {"train_loss": -24.37412452697754, "global_step": 202007, "epoch": 2433} {"train_loss": -24.281824111938477, "global_step": 202008, "epoch": 2433} {"train_loss": -24.478139877319336, "global_step": 202009, "epoch": 2433} {"train_loss": -24.218015670776367, "global_step": 202010, "epoch": 2433} {"train_loss": -24.454069137573242, "global_step": 202011, "epoch": 2433} {"train_loss": -24.62674331665039, "global_step": 202012, "epoch": 2433} {"train_loss": -24.361406326293945, "global_step": 202013, "epoch": 2433} {"train_loss": -24.989225387573242, "global_step": 202014, "epoch": 2433} {"train_loss": -24.21335792541504, "global_step": 202015, "epoch": 2433} {"train_loss": -24.775815963745117, "global_step": 202016, "epoch": 2433} {"train_loss": -24.42635154724121, "global_step": 202017, "epoch": 2433} {"train_loss": -24.31793785095215, "global_step": 202018, "epoch": 2433} {"train_loss": -24.706823348999023, "global_step": 202019, "epoch": 2433} {"train_loss": -24.37448501586914, "global_step": 202020, "epoch": 2433} {"train_loss": -24.21718537663839, "global_step": 202021, "epoch": 2433, "val_loss": 6613406.5} {"train_loss": -22.947858810424805, "global_step": 202022, "epoch": 2434} {"train_loss": -21.554458618164062, "global_step": 202023, "epoch": 2434} {"train_loss": -21.860815048217773, "global_step": 202024, "epoch": 2434} {"train_loss": -23.32032585144043, "global_step": 202025, "epoch": 2434} {"train_loss": -22.9075870513916, "global_step": 202026, "epoch": 2434} {"train_loss": -22.894916534423828, "global_step": 202027, "epoch": 2434} {"train_loss": -23.10426902770996, "global_step": 202028, "epoch": 2434} {"train_loss": -23.339038848876953, "global_step": 202029, "epoch": 2434} {"train_loss": -22.824857711791992, "global_step": 202030, "epoch": 2434} {"train_loss": -23.195512771606445, "global_step": 202031, "epoch": 2434} {"train_loss": -23.288536071777344, "global_step": 202032, "epoch": 2434} {"train_loss": -23.335006713867188, "global_step": 202033, "epoch": 2434} {"train_loss": -23.377172470092773, "global_step": 202034, "epoch": 2434} {"train_loss": -23.24026107788086, "global_step": 202035, "epoch": 2434} {"train_loss": -23.51152992248535, "global_step": 202036, "epoch": 2434} {"train_loss": -23.743091583251953, "global_step": 202037, "epoch": 2434} {"train_loss": -23.58480453491211, "global_step": 202038, "epoch": 2434} {"train_loss": -23.444171905517578, "global_step": 202039, "epoch": 2434} {"train_loss": -23.718183517456055, "global_step": 202040, "epoch": 2434} {"train_loss": -23.23297691345215, "global_step": 202041, "epoch": 2434} {"train_loss": -23.622676849365234, "global_step": 202042, "epoch": 2434} {"train_loss": -23.71418571472168, "global_step": 202043, "epoch": 2434} {"train_loss": -23.8523006439209, "global_step": 202044, "epoch": 2434} {"train_loss": -23.61716651916504, "global_step": 202045, "epoch": 2434} {"train_loss": -24.057796478271484, "global_step": 202046, "epoch": 2434} {"train_loss": -23.75807762145996, "global_step": 202047, "epoch": 2434} {"train_loss": -24.02436637878418, "global_step": 202048, "epoch": 2434} {"train_loss": -24.101572036743164, "global_step": 202049, "epoch": 2434} {"train_loss": -23.96116065979004, "global_step": 202050, "epoch": 2434} {"train_loss": -23.89015007019043, "global_step": 202051, "epoch": 2434} {"train_loss": -24.19704246520996, "global_step": 202052, "epoch": 2434} {"train_loss": -24.284299850463867, "global_step": 202053, "epoch": 2434} {"train_loss": -23.90281105041504, "global_step": 202054, "epoch": 2434} {"train_loss": -23.92880630493164, "global_step": 202055, "epoch": 2434} {"train_loss": -24.002193450927734, "global_step": 202056, "epoch": 2434} {"train_loss": -24.003570556640625, "global_step": 202057, "epoch": 2434} {"train_loss": -24.295318603515625, "global_step": 202058, "epoch": 2434} {"train_loss": -24.402633666992188, "global_step": 202059, "epoch": 2434} {"train_loss": -24.23120880126953, "global_step": 202060, "epoch": 2434} {"train_loss": -24.207305908203125, "global_step": 202061, "epoch": 2434} {"train_loss": -24.077960968017578, "global_step": 202062, "epoch": 2434} {"train_loss": -24.456409454345703, "global_step": 202063, "epoch": 2434} {"train_loss": -24.086923599243164, "global_step": 202064, "epoch": 2434} {"train_loss": -24.507654190063477, "global_step": 202065, "epoch": 2434} {"train_loss": -24.5358943939209, "global_step": 202066, "epoch": 2434} {"train_loss": -24.31842041015625, "global_step": 202067, "epoch": 2434} {"train_loss": -24.508066177368164, "global_step": 202068, "epoch": 2434} {"train_loss": -24.22711181640625, "global_step": 202069, "epoch": 2434} {"train_loss": -24.232486724853516, "global_step": 202070, "epoch": 2434} {"train_loss": -24.363431930541992, "global_step": 202071, "epoch": 2434} {"train_loss": -24.20619010925293, "global_step": 202072, "epoch": 2434} {"train_loss": -23.95328140258789, "global_step": 202073, "epoch": 2434} {"train_loss": -24.433704376220703, "global_step": 202074, "epoch": 2434} {"train_loss": -24.025802612304688, "global_step": 202075, "epoch": 2434} {"train_loss": -24.318286895751953, "global_step": 202076, "epoch": 2434} {"train_loss": -24.140243530273438, "global_step": 202077, "epoch": 2434} {"train_loss": -24.33864974975586, "global_step": 202078, "epoch": 2434} {"train_loss": -24.354345321655273, "global_step": 202079, "epoch": 2434} {"train_loss": -24.16034507751465, "global_step": 202080, "epoch": 2434} {"train_loss": -24.08160400390625, "global_step": 202081, "epoch": 2434} {"train_loss": -24.65595817565918, "global_step": 202082, "epoch": 2434} {"train_loss": -23.77815818786621, "global_step": 202083, "epoch": 2434} {"train_loss": -24.29685401916504, "global_step": 202084, "epoch": 2434} {"train_loss": -24.35982322692871, "global_step": 202085, "epoch": 2434} {"train_loss": -24.167234420776367, "global_step": 202086, "epoch": 2434} {"train_loss": -24.7877197265625, "global_step": 202087, "epoch": 2434} {"train_loss": -24.28786277770996, "global_step": 202088, "epoch": 2434} {"train_loss": -24.262767791748047, "global_step": 202089, "epoch": 2434} {"train_loss": -24.445926666259766, "global_step": 202090, "epoch": 2434} {"train_loss": -24.442729949951172, "global_step": 202091, "epoch": 2434} {"train_loss": -24.839210510253906, "global_step": 202092, "epoch": 2434} {"train_loss": -24.316682815551758, "global_step": 202093, "epoch": 2434} {"train_loss": -24.043746948242188, "global_step": 202094, "epoch": 2434} {"train_loss": -24.232650756835938, "global_step": 202095, "epoch": 2434} {"train_loss": -24.078067779541016, "global_step": 202096, "epoch": 2434} {"train_loss": -24.65418815612793, "global_step": 202097, "epoch": 2434} {"train_loss": -23.97227668762207, "global_step": 202098, "epoch": 2434} {"train_loss": -23.936012268066406, "global_step": 202099, "epoch": 2434} {"train_loss": -24.403640747070312, "global_step": 202100, "epoch": 2434} {"train_loss": -23.992557525634766, "global_step": 202101, "epoch": 2434} {"train_loss": -24.29072380065918, "global_step": 202102, "epoch": 2434} {"train_loss": -24.35386848449707, "global_step": 202103, "epoch": 2434} {"train_loss": -23.93997642792851, "global_step": 202104, "epoch": 2434, "val_loss": 6520681.0} {"train_loss": -23.669818878173828, "global_step": 202105, "epoch": 2435} {"train_loss": -23.65875244140625, "global_step": 202106, "epoch": 2435} {"train_loss": -23.56325340270996, "global_step": 202107, "epoch": 2435} {"train_loss": -23.276174545288086, "global_step": 202108, "epoch": 2435} {"train_loss": -23.441373825073242, "global_step": 202109, "epoch": 2435} {"train_loss": -23.583833694458008, "global_step": 202110, "epoch": 2435} {"train_loss": -23.723487854003906, "global_step": 202111, "epoch": 2435} {"train_loss": -24.18312644958496, "global_step": 202112, "epoch": 2435} {"train_loss": -24.05183219909668, "global_step": 202113, "epoch": 2435} {"train_loss": -23.78483009338379, "global_step": 202114, "epoch": 2435} {"train_loss": -23.488245010375977, "global_step": 202115, "epoch": 2435} {"train_loss": -23.655813217163086, "global_step": 202116, "epoch": 2435} {"train_loss": -23.870107650756836, "global_step": 202117, "epoch": 2435} {"train_loss": -23.69234275817871, "global_step": 202118, "epoch": 2435} {"train_loss": -23.72848892211914, "global_step": 202119, "epoch": 2435} {"train_loss": -23.83994483947754, "global_step": 202120, "epoch": 2435} {"train_loss": -24.066984176635742, "global_step": 202121, "epoch": 2435} {"train_loss": -23.95546531677246, "global_step": 202122, "epoch": 2435} {"train_loss": -23.846643447875977, "global_step": 202123, "epoch": 2435} {"train_loss": -24.033018112182617, "global_step": 202124, "epoch": 2435} {"train_loss": -24.028486251831055, "global_step": 202125, "epoch": 2435} {"train_loss": -24.26163101196289, "global_step": 202126, "epoch": 2435} {"train_loss": -24.09125328063965, "global_step": 202127, "epoch": 2435} {"train_loss": -24.245519638061523, "global_step": 202128, "epoch": 2435} {"train_loss": -24.272886276245117, "global_step": 202129, "epoch": 2435} {"train_loss": -24.181848526000977, "global_step": 202130, "epoch": 2435} {"train_loss": -24.184009552001953, "global_step": 202131, "epoch": 2435} {"train_loss": -24.3443660736084, "global_step": 202132, "epoch": 2435} {"train_loss": -24.230854034423828, "global_step": 202133, "epoch": 2435} {"train_loss": -24.092803955078125, "global_step": 202134, "epoch": 2435} {"train_loss": -24.5545654296875, "global_step": 202135, "epoch": 2435} {"train_loss": -24.483030319213867, "global_step": 202136, "epoch": 2435} {"train_loss": -24.277450561523438, "global_step": 202137, "epoch": 2435} {"train_loss": -24.358545303344727, "global_step": 202138, "epoch": 2435} {"train_loss": -24.340667724609375, "global_step": 202139, "epoch": 2435} {"train_loss": -24.021358489990234, "global_step": 202140, "epoch": 2435} {"train_loss": -24.51991081237793, "global_step": 202141, "epoch": 2435} {"train_loss": -23.941635131835938, "global_step": 202142, "epoch": 2435} {"train_loss": -24.101665496826172, "global_step": 202143, "epoch": 2435} {"train_loss": -24.324026107788086, "global_step": 202144, "epoch": 2435} {"train_loss": -24.393840789794922, "global_step": 202145, "epoch": 2435} {"train_loss": -24.569318771362305, "global_step": 202146, "epoch": 2435} {"train_loss": -24.62586212158203, "global_step": 202147, "epoch": 2435} {"train_loss": -24.343963623046875, "global_step": 202148, "epoch": 2435} {"train_loss": -24.575815200805664, "global_step": 202149, "epoch": 2435} {"train_loss": -24.564313888549805, "global_step": 202150, "epoch": 2435} {"train_loss": -24.296220779418945, "global_step": 202151, "epoch": 2435} {"train_loss": -24.37808609008789, "global_step": 202152, "epoch": 2435} {"train_loss": -24.463748931884766, "global_step": 202153, "epoch": 2435} {"train_loss": -24.504079818725586, "global_step": 202154, "epoch": 2435} {"train_loss": -24.383502960205078, "global_step": 202155, "epoch": 2435} {"train_loss": -24.44051170349121, "global_step": 202156, "epoch": 2435} {"train_loss": -24.259552001953125, "global_step": 202157, "epoch": 2435} {"train_loss": -24.06171226501465, "global_step": 202158, "epoch": 2435} {"train_loss": -24.060516357421875, "global_step": 202159, "epoch": 2435} {"train_loss": -24.412996292114258, "global_step": 202160, "epoch": 2435} {"train_loss": -23.983179092407227, "global_step": 202161, "epoch": 2435} {"train_loss": -23.61067771911621, "global_step": 202162, "epoch": 2435} {"train_loss": -23.832536697387695, "global_step": 202163, "epoch": 2435} {"train_loss": -24.001373291015625, "global_step": 202164, "epoch": 2435} {"train_loss": -23.98671531677246, "global_step": 202165, "epoch": 2435} {"train_loss": -24.183317184448242, "global_step": 202166, "epoch": 2435} {"train_loss": -24.613187789916992, "global_step": 202167, "epoch": 2435} {"train_loss": -24.119447708129883, "global_step": 202168, "epoch": 2435} {"train_loss": -24.649770736694336, "global_step": 202169, "epoch": 2435} {"train_loss": -24.192123413085938, "global_step": 202170, "epoch": 2435} {"train_loss": -24.15306854248047, "global_step": 202171, "epoch": 2435} {"train_loss": -24.226043701171875, "global_step": 202172, "epoch": 2435} {"train_loss": -23.96018409729004, "global_step": 202173, "epoch": 2435} {"train_loss": -24.429407119750977, "global_step": 202174, "epoch": 2435} {"train_loss": -24.217309951782227, "global_step": 202175, "epoch": 2435} {"train_loss": -24.24688720703125, "global_step": 202176, "epoch": 2435} {"train_loss": -24.52956199645996, "global_step": 202177, "epoch": 2435} {"train_loss": -24.351537704467773, "global_step": 202178, "epoch": 2435} {"train_loss": -24.003158569335938, "global_step": 202179, "epoch": 2435} {"train_loss": -24.20690155029297, "global_step": 202180, "epoch": 2435} {"train_loss": -23.872861862182617, "global_step": 202181, "epoch": 2435} {"train_loss": -24.38936996459961, "global_step": 202182, "epoch": 2435} {"train_loss": -24.032073974609375, "global_step": 202183, "epoch": 2435} {"train_loss": -24.3786678314209, "global_step": 202184, "epoch": 2435} {"train_loss": -23.92487144470215, "global_step": 202185, "epoch": 2435} {"train_loss": -24.361896514892578, "global_step": 202186, "epoch": 2435} {"train_loss": -24.1367238975433, "global_step": 202187, "epoch": 2435, "val_loss": 6476855.0} {"train_loss": -23.480562210083008, "global_step": 202188, "epoch": 2436} {"train_loss": -23.478620529174805, "global_step": 202189, "epoch": 2436} {"train_loss": -24.41354751586914, "global_step": 202190, "epoch": 2436} {"train_loss": -24.00021743774414, "global_step": 202191, "epoch": 2436} {"train_loss": -23.692441940307617, "global_step": 202192, "epoch": 2436} {"train_loss": -23.833066940307617, "global_step": 202193, "epoch": 2436} {"train_loss": -24.043704986572266, "global_step": 202194, "epoch": 2436} {"train_loss": -23.792692184448242, "global_step": 202195, "epoch": 2436} {"train_loss": -23.995264053344727, "global_step": 202196, "epoch": 2436} {"train_loss": -24.027511596679688, "global_step": 202197, "epoch": 2436} {"train_loss": -23.719018936157227, "global_step": 202198, "epoch": 2436} {"train_loss": -24.154020309448242, "global_step": 202199, "epoch": 2436} {"train_loss": -24.030532836914062, "global_step": 202200, "epoch": 2436} {"train_loss": -24.397705078125, "global_step": 202201, "epoch": 2436} {"train_loss": -24.27644920349121, "global_step": 202202, "epoch": 2436} {"train_loss": -23.990222930908203, "global_step": 202203, "epoch": 2436} {"train_loss": -24.580167770385742, "global_step": 202204, "epoch": 2436} {"train_loss": -24.389799118041992, "global_step": 202205, "epoch": 2436} {"train_loss": -24.234344482421875, "global_step": 202206, "epoch": 2436} {"train_loss": -24.534305572509766, "global_step": 202207, "epoch": 2436} {"train_loss": -24.244752883911133, "global_step": 202208, "epoch": 2436} {"train_loss": -24.254520416259766, "global_step": 202209, "epoch": 2436} {"train_loss": -24.49091911315918, "global_step": 202210, "epoch": 2436} {"train_loss": -24.13677406311035, "global_step": 202211, "epoch": 2436} {"train_loss": -24.223249435424805, "global_step": 202212, "epoch": 2436} {"train_loss": -24.58226776123047, "global_step": 202213, "epoch": 2436} {"train_loss": -24.4455509185791, "global_step": 202214, "epoch": 2436} {"train_loss": -24.46006965637207, "global_step": 202215, "epoch": 2436} {"train_loss": -24.125280380249023, "global_step": 202216, "epoch": 2436} {"train_loss": -24.020822525024414, "global_step": 202217, "epoch": 2436} {"train_loss": -24.161056518554688, "global_step": 202218, "epoch": 2436} {"train_loss": -24.26594352722168, "global_step": 202219, "epoch": 2436} {"train_loss": -24.472915649414062, "global_step": 202220, "epoch": 2436} {"train_loss": -24.179824829101562, "global_step": 202221, "epoch": 2436} {"train_loss": -24.779821395874023, "global_step": 202222, "epoch": 2436} {"train_loss": -24.65092658996582, "global_step": 202223, "epoch": 2436} {"train_loss": -24.421646118164062, "global_step": 202224, "epoch": 2436} {"train_loss": -24.32076072692871, "global_step": 202225, "epoch": 2436} {"train_loss": -24.250272750854492, "global_step": 202226, "epoch": 2436} {"train_loss": -24.823102951049805, "global_step": 202227, "epoch": 2436} {"train_loss": -24.55279541015625, "global_step": 202228, "epoch": 2436} {"train_loss": -24.48756217956543, "global_step": 202229, "epoch": 2436} {"train_loss": -24.492874145507812, "global_step": 202230, "epoch": 2436} {"train_loss": -24.294479370117188, "global_step": 202231, "epoch": 2436} {"train_loss": -24.344085693359375, "global_step": 202232, "epoch": 2436} {"train_loss": -24.535106658935547, "global_step": 202233, "epoch": 2436} {"train_loss": -24.2390079498291, "global_step": 202234, "epoch": 2436} {"train_loss": -24.400407791137695, "global_step": 202235, "epoch": 2436} {"train_loss": -24.2257080078125, "global_step": 202236, "epoch": 2436} {"train_loss": -24.450721740722656, "global_step": 202237, "epoch": 2436} {"train_loss": -24.263639450073242, "global_step": 202238, "epoch": 2436} {"train_loss": -24.413253784179688, "global_step": 202239, "epoch": 2436} {"train_loss": -24.483097076416016, "global_step": 202240, "epoch": 2436} {"train_loss": -24.44343376159668, "global_step": 202241, "epoch": 2436} {"train_loss": -24.097429275512695, "global_step": 202242, "epoch": 2436} {"train_loss": -24.235258102416992, "global_step": 202243, "epoch": 2436} {"train_loss": -24.450162887573242, "global_step": 202244, "epoch": 2436} {"train_loss": -24.457386016845703, "global_step": 202245, "epoch": 2436} {"train_loss": -24.256649017333984, "global_step": 202246, "epoch": 2436} {"train_loss": -24.346515655517578, "global_step": 202247, "epoch": 2436} {"train_loss": -24.532398223876953, "global_step": 202248, "epoch": 2436} {"train_loss": -24.532434463500977, "global_step": 202249, "epoch": 2436} {"train_loss": -24.435434341430664, "global_step": 202250, "epoch": 2436} {"train_loss": -24.052148818969727, "global_step": 202251, "epoch": 2436} {"train_loss": -24.22214126586914, "global_step": 202252, "epoch": 2436} {"train_loss": -24.393390655517578, "global_step": 202253, "epoch": 2436} {"train_loss": -24.188404083251953, "global_step": 202254, "epoch": 2436} {"train_loss": -24.292800903320312, "global_step": 202255, "epoch": 2436} {"train_loss": -24.48493003845215, "global_step": 202256, "epoch": 2436} {"train_loss": -24.364704132080078, "global_step": 202257, "epoch": 2436} {"train_loss": -24.045591354370117, "global_step": 202258, "epoch": 2436} {"train_loss": -24.627729415893555, "global_step": 202259, "epoch": 2436} {"train_loss": -24.483003616333008, "global_step": 202260, "epoch": 2436} {"train_loss": -24.248098373413086, "global_step": 202261, "epoch": 2436} {"train_loss": -24.411794662475586, "global_step": 202262, "epoch": 2436} {"train_loss": -24.717979431152344, "global_step": 202263, "epoch": 2436} {"train_loss": -23.85092544555664, "global_step": 202264, "epoch": 2436} {"train_loss": -24.160268783569336, "global_step": 202265, "epoch": 2436} {"train_loss": -24.508493423461914, "global_step": 202266, "epoch": 2436} {"train_loss": -24.341047286987305, "global_step": 202267, "epoch": 2436} {"train_loss": -24.087987899780273, "global_step": 202268, "epoch": 2436} {"train_loss": -24.373075485229492, "global_step": 202269, "epoch": 2436} {"train_loss": -24.28632170895496, "global_step": 202270, "epoch": 2436, "val_loss": 6673645.0} {"train_loss": -23.378612518310547, "global_step": 202271, "epoch": 2437} {"train_loss": -24.073139190673828, "global_step": 202272, "epoch": 2437} {"train_loss": -23.65060806274414, "global_step": 202273, "epoch": 2437} {"train_loss": -23.78449821472168, "global_step": 202274, "epoch": 2437} {"train_loss": -23.83072853088379, "global_step": 202275, "epoch": 2437} {"train_loss": -23.832935333251953, "global_step": 202276, "epoch": 2437} {"train_loss": -23.673715591430664, "global_step": 202277, "epoch": 2437} {"train_loss": -23.95759391784668, "global_step": 202278, "epoch": 2437} {"train_loss": -23.809528350830078, "global_step": 202279, "epoch": 2437} {"train_loss": -24.113632202148438, "global_step": 202280, "epoch": 2437} {"train_loss": -23.636695861816406, "global_step": 202281, "epoch": 2437} {"train_loss": -23.897581100463867, "global_step": 202282, "epoch": 2437} {"train_loss": -24.07976722717285, "global_step": 202283, "epoch": 2437} {"train_loss": -24.194599151611328, "global_step": 202284, "epoch": 2437} {"train_loss": -24.107004165649414, "global_step": 202285, "epoch": 2437} {"train_loss": -24.247310638427734, "global_step": 202286, "epoch": 2437} {"train_loss": -23.857223510742188, "global_step": 202287, "epoch": 2437} {"train_loss": -24.06032371520996, "global_step": 202288, "epoch": 2437} {"train_loss": -24.32651138305664, "global_step": 202289, "epoch": 2437} {"train_loss": -24.423383712768555, "global_step": 202290, "epoch": 2437} {"train_loss": -23.725324630737305, "global_step": 202291, "epoch": 2437} {"train_loss": -24.018320083618164, "global_step": 202292, "epoch": 2437} {"train_loss": -24.027000427246094, "global_step": 202293, "epoch": 2437} {"train_loss": -24.165035247802734, "global_step": 202294, "epoch": 2437} {"train_loss": -24.37837791442871, "global_step": 202295, "epoch": 2437} {"train_loss": -23.944902420043945, "global_step": 202296, "epoch": 2437} {"train_loss": -23.84368896484375, "global_step": 202297, "epoch": 2437} {"train_loss": -24.24391746520996, "global_step": 202298, "epoch": 2437} {"train_loss": -24.230199813842773, "global_step": 202299, "epoch": 2437} {"train_loss": -24.206937789916992, "global_step": 202300, "epoch": 2437} {"train_loss": -24.135150909423828, "global_step": 202301, "epoch": 2437} {"train_loss": -24.02627182006836, "global_step": 202302, "epoch": 2437} {"train_loss": -24.399749755859375, "global_step": 202303, "epoch": 2437} {"train_loss": -24.261960983276367, "global_step": 202304, "epoch": 2437} {"train_loss": -24.165903091430664, "global_step": 202305, "epoch": 2437} {"train_loss": -24.16030502319336, "global_step": 202306, "epoch": 2437} {"train_loss": -24.58402442932129, "global_step": 202307, "epoch": 2437} {"train_loss": -24.234586715698242, "global_step": 202308, "epoch": 2437} {"train_loss": -24.26302146911621, "global_step": 202309, "epoch": 2437} {"train_loss": -24.35794448852539, "global_step": 202310, "epoch": 2437} {"train_loss": -24.416086196899414, "global_step": 202311, "epoch": 2437} {"train_loss": -24.08684730529785, "global_step": 202312, "epoch": 2437} {"train_loss": -24.260700225830078, "global_step": 202313, "epoch": 2437} {"train_loss": -24.16106605529785, "global_step": 202314, "epoch": 2437} {"train_loss": -24.01053810119629, "global_step": 202315, "epoch": 2437} {"train_loss": -24.088184356689453, "global_step": 202316, "epoch": 2437} {"train_loss": -24.35991859436035, "global_step": 202317, "epoch": 2437} {"train_loss": -24.390796661376953, "global_step": 202318, "epoch": 2437} {"train_loss": -24.658720016479492, "global_step": 202319, "epoch": 2437} {"train_loss": -24.018367767333984, "global_step": 202320, "epoch": 2437} {"train_loss": -24.545331954956055, "global_step": 202321, "epoch": 2437} {"train_loss": -24.388463973999023, "global_step": 202322, "epoch": 2437} {"train_loss": -24.552343368530273, "global_step": 202323, "epoch": 2437} {"train_loss": -24.46485137939453, "global_step": 202324, "epoch": 2437} {"train_loss": -24.327774047851562, "global_step": 202325, "epoch": 2437} {"train_loss": -24.661945343017578, "global_step": 202326, "epoch": 2437} {"train_loss": -24.179641723632812, "global_step": 202327, "epoch": 2437} {"train_loss": -24.300662994384766, "global_step": 202328, "epoch": 2437} {"train_loss": -24.183837890625, "global_step": 202329, "epoch": 2437} {"train_loss": -24.504281997680664, "global_step": 202330, "epoch": 2437} {"train_loss": -24.493789672851562, "global_step": 202331, "epoch": 2437} {"train_loss": -24.7730770111084, "global_step": 202332, "epoch": 2437} {"train_loss": -24.144027709960938, "global_step": 202333, "epoch": 2437} {"train_loss": -24.17447853088379, "global_step": 202334, "epoch": 2437} {"train_loss": -24.479969024658203, "global_step": 202335, "epoch": 2437} {"train_loss": -24.499713897705078, "global_step": 202336, "epoch": 2437} {"train_loss": -24.089948654174805, "global_step": 202337, "epoch": 2437} {"train_loss": -24.49867820739746, "global_step": 202338, "epoch": 2437} {"train_loss": -24.51569938659668, "global_step": 202339, "epoch": 2437} {"train_loss": -24.37911033630371, "global_step": 202340, "epoch": 2437} {"train_loss": -24.3767147064209, "global_step": 202341, "epoch": 2437} {"train_loss": -24.696996688842773, "global_step": 202342, "epoch": 2437} {"train_loss": -24.55605125427246, "global_step": 202343, "epoch": 2437} {"train_loss": -24.38401222229004, "global_step": 202344, "epoch": 2437} {"train_loss": -24.33544921875, "global_step": 202345, "epoch": 2437} {"train_loss": -24.06916618347168, "global_step": 202346, "epoch": 2437} {"train_loss": -24.366750717163086, "global_step": 202347, "epoch": 2437} {"train_loss": -23.97389030456543, "global_step": 202348, "epoch": 2437} {"train_loss": -24.319250106811523, "global_step": 202349, "epoch": 2437} {"train_loss": -24.442768096923828, "global_step": 202350, "epoch": 2437} {"train_loss": -24.19270896911621, "global_step": 202351, "epoch": 2437} {"train_loss": -24.15012550354004, "global_step": 202352, "epoch": 2437} {"train_loss": -24.210829746292298, "global_step": 202353, "epoch": 2437, "val_loss": 6647376.0} {"train_loss": -24.1223201751709, "global_step": 202354, "epoch": 2438} {"train_loss": -23.973217010498047, "global_step": 202355, "epoch": 2438} {"train_loss": -23.73828125, "global_step": 202356, "epoch": 2438} {"train_loss": -23.486181259155273, "global_step": 202357, "epoch": 2438} {"train_loss": -24.04780387878418, "global_step": 202358, "epoch": 2438} {"train_loss": -24.21556854248047, "global_step": 202359, "epoch": 2438} {"train_loss": -23.703779220581055, "global_step": 202360, "epoch": 2438} {"train_loss": -23.918842315673828, "global_step": 202361, "epoch": 2438} {"train_loss": -23.904251098632812, "global_step": 202362, "epoch": 2438} {"train_loss": -23.484548568725586, "global_step": 202363, "epoch": 2438} {"train_loss": -23.412948608398438, "global_step": 202364, "epoch": 2438} {"train_loss": -23.808713912963867, "global_step": 202365, "epoch": 2438} {"train_loss": -23.62801170349121, "global_step": 202366, "epoch": 2438} {"train_loss": -23.548686981201172, "global_step": 202367, "epoch": 2438} {"train_loss": -23.885669708251953, "global_step": 202368, "epoch": 2438} {"train_loss": -23.50107765197754, "global_step": 202369, "epoch": 2438} {"train_loss": -23.54449462890625, "global_step": 202370, "epoch": 2438} {"train_loss": -23.786029815673828, "global_step": 202371, "epoch": 2438} {"train_loss": -23.685733795166016, "global_step": 202372, "epoch": 2438} {"train_loss": -23.719322204589844, "global_step": 202373, "epoch": 2438} {"train_loss": -24.363996505737305, "global_step": 202374, "epoch": 2438} {"train_loss": -23.836585998535156, "global_step": 202375, "epoch": 2438} {"train_loss": -24.037250518798828, "global_step": 202376, "epoch": 2438} {"train_loss": -23.94980812072754, "global_step": 202377, "epoch": 2438} {"train_loss": -24.299373626708984, "global_step": 202378, "epoch": 2438} {"train_loss": -24.07594108581543, "global_step": 202379, "epoch": 2438} {"train_loss": -23.64543342590332, "global_step": 202380, "epoch": 2438} {"train_loss": -23.93633270263672, "global_step": 202381, "epoch": 2438} {"train_loss": -24.0023193359375, "global_step": 202382, "epoch": 2438} {"train_loss": -24.210186004638672, "global_step": 202383, "epoch": 2438} {"train_loss": -23.89348030090332, "global_step": 202384, "epoch": 2438} {"train_loss": -24.181676864624023, "global_step": 202385, "epoch": 2438} {"train_loss": -24.581262588500977, "global_step": 202386, "epoch": 2438} {"train_loss": -24.32123374938965, "global_step": 202387, "epoch": 2438} {"train_loss": -24.27079200744629, "global_step": 202388, "epoch": 2438} {"train_loss": -24.188413619995117, "global_step": 202389, "epoch": 2438} {"train_loss": -24.43849754333496, "global_step": 202390, "epoch": 2438} {"train_loss": -24.248079299926758, "global_step": 202391, "epoch": 2438} {"train_loss": -24.648433685302734, "global_step": 202392, "epoch": 2438} {"train_loss": -24.294097900390625, "global_step": 202393, "epoch": 2438} {"train_loss": -23.97504234313965, "global_step": 202394, "epoch": 2438} {"train_loss": -24.579914093017578, "global_step": 202395, "epoch": 2438} {"train_loss": -24.09291648864746, "global_step": 202396, "epoch": 2438} {"train_loss": -24.73126220703125, "global_step": 202397, "epoch": 2438} {"train_loss": -24.07894515991211, "global_step": 202398, "epoch": 2438} {"train_loss": -24.323591232299805, "global_step": 202399, "epoch": 2438} {"train_loss": -24.446699142456055, "global_step": 202400, "epoch": 2438} {"train_loss": -24.47011947631836, "global_step": 202401, "epoch": 2438} {"train_loss": -24.14206314086914, "global_step": 202402, "epoch": 2438} {"train_loss": -24.2484073638916, "global_step": 202403, "epoch": 2438} {"train_loss": -24.453176498413086, "global_step": 202404, "epoch": 2438} {"train_loss": -24.524717330932617, "global_step": 202405, "epoch": 2438} {"train_loss": -24.474918365478516, "global_step": 202406, "epoch": 2438} {"train_loss": -24.125349044799805, "global_step": 202407, "epoch": 2438} {"train_loss": -24.533205032348633, "global_step": 202408, "epoch": 2438} {"train_loss": -24.12580680847168, "global_step": 202409, "epoch": 2438} {"train_loss": -24.396528244018555, "global_step": 202410, "epoch": 2438} {"train_loss": -24.514318466186523, "global_step": 202411, "epoch": 2438} {"train_loss": -24.045419692993164, "global_step": 202412, "epoch": 2438} {"train_loss": -23.91670036315918, "global_step": 202413, "epoch": 2438} {"train_loss": -24.245893478393555, "global_step": 202414, "epoch": 2438} {"train_loss": -24.162967681884766, "global_step": 202415, "epoch": 2438} {"train_loss": -24.08156967163086, "global_step": 202416, "epoch": 2438} {"train_loss": -24.181163787841797, "global_step": 202417, "epoch": 2438} {"train_loss": -24.149423599243164, "global_step": 202418, "epoch": 2438} {"train_loss": -24.476062774658203, "global_step": 202419, "epoch": 2438} {"train_loss": -24.326797485351562, "global_step": 202420, "epoch": 2438} {"train_loss": -24.22062110900879, "global_step": 202421, "epoch": 2438} {"train_loss": -23.922155380249023, "global_step": 202422, "epoch": 2438} {"train_loss": -24.392911911010742, "global_step": 202423, "epoch": 2438} {"train_loss": -24.22085952758789, "global_step": 202424, "epoch": 2438} {"train_loss": -24.21296501159668, "global_step": 202425, "epoch": 2438} {"train_loss": -24.088760375976562, "global_step": 202426, "epoch": 2438} {"train_loss": -24.365032196044922, "global_step": 202427, "epoch": 2438} {"train_loss": -24.637540817260742, "global_step": 202428, "epoch": 2438} {"train_loss": -24.248565673828125, "global_step": 202429, "epoch": 2438} {"train_loss": -24.214645385742188, "global_step": 202430, "epoch": 2438} {"train_loss": -24.363550186157227, "global_step": 202431, "epoch": 2438} {"train_loss": -23.732816696166992, "global_step": 202432, "epoch": 2438} {"train_loss": -24.18625259399414, "global_step": 202433, "epoch": 2438} {"train_loss": -24.250743865966797, "global_step": 202434, "epoch": 2438} {"train_loss": -24.353992462158203, "global_step": 202435, "epoch": 2438} {"train_loss": -24.120900625205902, "global_step": 202436, "epoch": 2438, "val_loss": 6448216.5} {"train_loss": -23.779829025268555, "global_step": 202437, "epoch": 2439} {"train_loss": -23.43829917907715, "global_step": 202438, "epoch": 2439} {"train_loss": -23.875228881835938, "global_step": 202439, "epoch": 2439} {"train_loss": -24.07132339477539, "global_step": 202440, "epoch": 2439} {"train_loss": -23.83600425720215, "global_step": 202441, "epoch": 2439} {"train_loss": -24.249357223510742, "global_step": 202442, "epoch": 2439} {"train_loss": -23.642074584960938, "global_step": 202443, "epoch": 2439} {"train_loss": -24.135210037231445, "global_step": 202444, "epoch": 2439} {"train_loss": -23.677648544311523, "global_step": 202445, "epoch": 2439} {"train_loss": -23.63509178161621, "global_step": 202446, "epoch": 2439} {"train_loss": -24.08600425720215, "global_step": 202447, "epoch": 2439} {"train_loss": -23.52358055114746, "global_step": 202448, "epoch": 2439} {"train_loss": -23.861209869384766, "global_step": 202449, "epoch": 2439} {"train_loss": -24.28741455078125, "global_step": 202450, "epoch": 2439} {"train_loss": -23.63345718383789, "global_step": 202451, "epoch": 2439} {"train_loss": -24.027814865112305, "global_step": 202452, "epoch": 2439} {"train_loss": -24.06834602355957, "global_step": 202453, "epoch": 2439} {"train_loss": -23.903003692626953, "global_step": 202454, "epoch": 2439} {"train_loss": -23.717741012573242, "global_step": 202455, "epoch": 2439} {"train_loss": -23.805204391479492, "global_step": 202456, "epoch": 2439} {"train_loss": -24.218963623046875, "global_step": 202457, "epoch": 2439} {"train_loss": -23.99234390258789, "global_step": 202458, "epoch": 2439} {"train_loss": -23.889636993408203, "global_step": 202459, "epoch": 2439} {"train_loss": -23.88343048095703, "global_step": 202460, "epoch": 2439} {"train_loss": -24.331972122192383, "global_step": 202461, "epoch": 2439} {"train_loss": -23.860443115234375, "global_step": 202462, "epoch": 2439} {"train_loss": -24.223941802978516, "global_step": 202463, "epoch": 2439} {"train_loss": -24.038610458374023, "global_step": 202464, "epoch": 2439} {"train_loss": -24.297319412231445, "global_step": 202465, "epoch": 2439} {"train_loss": -24.264623641967773, "global_step": 202466, "epoch": 2439} {"train_loss": -24.06695556640625, "global_step": 202467, "epoch": 2439} {"train_loss": -24.15622329711914, "global_step": 202468, "epoch": 2439} {"train_loss": -24.128507614135742, "global_step": 202469, "epoch": 2439} {"train_loss": -24.414953231811523, "global_step": 202470, "epoch": 2439} {"train_loss": -24.400074005126953, "global_step": 202471, "epoch": 2439} {"train_loss": -24.71144676208496, "global_step": 202472, "epoch": 2439} {"train_loss": -24.389442443847656, "global_step": 202473, "epoch": 2439} {"train_loss": -24.251632690429688, "global_step": 202474, "epoch": 2439} {"train_loss": -24.075637817382812, "global_step": 202475, "epoch": 2439} {"train_loss": -24.046619415283203, "global_step": 202476, "epoch": 2439} {"train_loss": -24.34286117553711, "global_step": 202477, "epoch": 2439} {"train_loss": -24.269323348999023, "global_step": 202478, "epoch": 2439} {"train_loss": -24.34653663635254, "global_step": 202479, "epoch": 2439} {"train_loss": -24.314376831054688, "global_step": 202480, "epoch": 2439} {"train_loss": -24.022130966186523, "global_step": 202481, "epoch": 2439} {"train_loss": -24.30279541015625, "global_step": 202482, "epoch": 2439} {"train_loss": -24.375080108642578, "global_step": 202483, "epoch": 2439} {"train_loss": -24.361286163330078, "global_step": 202484, "epoch": 2439} {"train_loss": -24.131887435913086, "global_step": 202485, "epoch": 2439} {"train_loss": -24.409154891967773, "global_step": 202486, "epoch": 2439} {"train_loss": -24.045148849487305, "global_step": 202487, "epoch": 2439} {"train_loss": -23.76686668395996, "global_step": 202488, "epoch": 2439} {"train_loss": -24.740955352783203, "global_step": 202489, "epoch": 2439} {"train_loss": -24.468215942382812, "global_step": 202490, "epoch": 2439} {"train_loss": -24.030250549316406, "global_step": 202491, "epoch": 2439} {"train_loss": -24.100971221923828, "global_step": 202492, "epoch": 2439} {"train_loss": -24.20701026916504, "global_step": 202493, "epoch": 2439} {"train_loss": -24.628023147583008, "global_step": 202494, "epoch": 2439} {"train_loss": -24.237340927124023, "global_step": 202495, "epoch": 2439} {"train_loss": -24.29466438293457, "global_step": 202496, "epoch": 2439} {"train_loss": -24.608116149902344, "global_step": 202497, "epoch": 2439} {"train_loss": -24.224462509155273, "global_step": 202498, "epoch": 2439} {"train_loss": -24.316085815429688, "global_step": 202499, "epoch": 2439} {"train_loss": -24.20549964904785, "global_step": 202500, "epoch": 2439} {"train_loss": -24.109146118164062, "global_step": 202501, "epoch": 2439} {"train_loss": -24.39139175415039, "global_step": 202502, "epoch": 2439} {"train_loss": -23.979393005371094, "global_step": 202503, "epoch": 2439} {"train_loss": -24.475934982299805, "global_step": 202504, "epoch": 2439} {"train_loss": -24.132644653320312, "global_step": 202505, "epoch": 2439} {"train_loss": -24.61112403869629, "global_step": 202506, "epoch": 2439} {"train_loss": -24.239561080932617, "global_step": 202507, "epoch": 2439} {"train_loss": -24.696531295776367, "global_step": 202508, "epoch": 2439} {"train_loss": -23.915843963623047, "global_step": 202509, "epoch": 2439} {"train_loss": -24.102447509765625, "global_step": 202510, "epoch": 2439} {"train_loss": -24.022329330444336, "global_step": 202511, "epoch": 2439} {"train_loss": -24.407615661621094, "global_step": 202512, "epoch": 2439} {"train_loss": -24.263671875, "global_step": 202513, "epoch": 2439} {"train_loss": -24.504743576049805, "global_step": 202514, "epoch": 2439} {"train_loss": -24.774845123291016, "global_step": 202515, "epoch": 2439} {"train_loss": -24.230398178100586, "global_step": 202516, "epoch": 2439} {"train_loss": -24.356155395507812, "global_step": 202517, "epoch": 2439} {"train_loss": -24.439586639404297, "global_step": 202518, "epoch": 2439} {"train_loss": -24.16680942673281, "global_step": 202519, "epoch": 2439, "val_loss": 6637890.0} {"train_loss": -23.786771774291992, "global_step": 202520, "epoch": 2440} {"train_loss": -23.636398315429688, "global_step": 202521, "epoch": 2440} {"train_loss": -23.53356170654297, "global_step": 202522, "epoch": 2440} {"train_loss": -23.498544692993164, "global_step": 202523, "epoch": 2440} {"train_loss": -23.487333297729492, "global_step": 202524, "epoch": 2440} {"train_loss": -23.926374435424805, "global_step": 202525, "epoch": 2440} {"train_loss": -23.81399917602539, "global_step": 202526, "epoch": 2440} {"train_loss": -24.327314376831055, "global_step": 202527, "epoch": 2440} {"train_loss": -23.705488204956055, "global_step": 202528, "epoch": 2440} {"train_loss": -23.90130615234375, "global_step": 202529, "epoch": 2440} {"train_loss": -23.953907012939453, "global_step": 202530, "epoch": 2440} {"train_loss": -23.714773178100586, "global_step": 202531, "epoch": 2440} {"train_loss": -24.492656707763672, "global_step": 202532, "epoch": 2440} {"train_loss": -24.037466049194336, "global_step": 202533, "epoch": 2440} {"train_loss": -24.12311363220215, "global_step": 202534, "epoch": 2440} {"train_loss": -24.15754508972168, "global_step": 202535, "epoch": 2440} {"train_loss": -23.997438430786133, "global_step": 202536, "epoch": 2440} {"train_loss": -24.245105743408203, "global_step": 202537, "epoch": 2440} {"train_loss": -23.955913543701172, "global_step": 202538, "epoch": 2440} {"train_loss": -24.001623153686523, "global_step": 202539, "epoch": 2440} {"train_loss": -24.282617568969727, "global_step": 202540, "epoch": 2440} {"train_loss": -24.146570205688477, "global_step": 202541, "epoch": 2440} {"train_loss": -23.990766525268555, "global_step": 202542, "epoch": 2440} {"train_loss": -24.562292098999023, "global_step": 202543, "epoch": 2440} {"train_loss": -23.903608322143555, "global_step": 202544, "epoch": 2440} {"train_loss": -24.189300537109375, "global_step": 202545, "epoch": 2440} {"train_loss": -24.105335235595703, "global_step": 202546, "epoch": 2440} {"train_loss": -24.082368850708008, "global_step": 202547, "epoch": 2440} {"train_loss": -24.397207260131836, "global_step": 202548, "epoch": 2440} {"train_loss": -24.190500259399414, "global_step": 202549, "epoch": 2440} {"train_loss": -24.28742027282715, "global_step": 202550, "epoch": 2440} {"train_loss": -24.331518173217773, "global_step": 202551, "epoch": 2440} {"train_loss": -24.303897857666016, "global_step": 202552, "epoch": 2440} {"train_loss": -24.458898544311523, "global_step": 202553, "epoch": 2440} {"train_loss": -24.153966903686523, "global_step": 202554, "epoch": 2440} {"train_loss": -23.85294532775879, "global_step": 202555, "epoch": 2440} {"train_loss": -24.13161277770996, "global_step": 202556, "epoch": 2440} {"train_loss": -24.717905044555664, "global_step": 202557, "epoch": 2440} {"train_loss": -24.098388671875, "global_step": 202558, "epoch": 2440} {"train_loss": -24.684823989868164, "global_step": 202559, "epoch": 2440} {"train_loss": -24.339599609375, "global_step": 202560, "epoch": 2440} {"train_loss": -24.504770278930664, "global_step": 202561, "epoch": 2440} {"train_loss": -24.153160095214844, "global_step": 202562, "epoch": 2440} {"train_loss": -24.62819480895996, "global_step": 202563, "epoch": 2440} {"train_loss": -24.50452423095703, "global_step": 202564, "epoch": 2440} {"train_loss": -24.194740295410156, "global_step": 202565, "epoch": 2440} {"train_loss": -24.190732955932617, "global_step": 202566, "epoch": 2440} {"train_loss": -24.540468215942383, "global_step": 202567, "epoch": 2440} {"train_loss": -24.374557495117188, "global_step": 202568, "epoch": 2440} {"train_loss": -24.15104866027832, "global_step": 202569, "epoch": 2440} {"train_loss": -24.31073760986328, "global_step": 202570, "epoch": 2440} {"train_loss": -24.240793228149414, "global_step": 202571, "epoch": 2440} {"train_loss": -24.0482234954834, "global_step": 202572, "epoch": 2440} {"train_loss": -24.379108428955078, "global_step": 202573, "epoch": 2440} {"train_loss": -24.54792022705078, "global_step": 202574, "epoch": 2440} {"train_loss": -24.25396156311035, "global_step": 202575, "epoch": 2440} {"train_loss": -24.346633911132812, "global_step": 202576, "epoch": 2440} {"train_loss": -24.323379516601562, "global_step": 202577, "epoch": 2440} {"train_loss": -24.315587997436523, "global_step": 202578, "epoch": 2440} {"train_loss": -24.57022476196289, "global_step": 202579, "epoch": 2440} {"train_loss": -24.52375602722168, "global_step": 202580, "epoch": 2440} {"train_loss": -24.463476181030273, "global_step": 202581, "epoch": 2440} {"train_loss": -24.723957061767578, "global_step": 202582, "epoch": 2440} {"train_loss": -24.271520614624023, "global_step": 202583, "epoch": 2440} {"train_loss": -24.44561195373535, "global_step": 202584, "epoch": 2440} {"train_loss": -23.98105812072754, "global_step": 202585, "epoch": 2440} {"train_loss": -24.07732391357422, "global_step": 202586, "epoch": 2440} {"train_loss": -24.2208309173584, "global_step": 202587, "epoch": 2440} {"train_loss": -24.153467178344727, "global_step": 202588, "epoch": 2440} {"train_loss": -24.09784698486328, "global_step": 202589, "epoch": 2440} {"train_loss": -24.340953826904297, "global_step": 202590, "epoch": 2440} {"train_loss": -24.233673095703125, "global_step": 202591, "epoch": 2440} {"train_loss": -24.256986618041992, "global_step": 202592, "epoch": 2440} {"train_loss": -24.461057662963867, "global_step": 202593, "epoch": 2440} {"train_loss": -24.465129852294922, "global_step": 202594, "epoch": 2440} {"train_loss": -24.384111404418945, "global_step": 202595, "epoch": 2440} {"train_loss": -24.447513580322266, "global_step": 202596, "epoch": 2440} {"train_loss": -24.31324577331543, "global_step": 202597, "epoch": 2440} {"train_loss": -24.58795166015625, "global_step": 202598, "epoch": 2440} {"train_loss": -24.292373657226562, "global_step": 202599, "epoch": 2440} {"train_loss": -24.234817504882812, "global_step": 202600, "epoch": 2440} {"train_loss": -24.770580291748047, "global_step": 202601, "epoch": 2440} {"train_loss": -24.221218017210443, "global_step": 202602, "epoch": 2440, "val_loss": 6670451.0} {"train_loss": -23.784069061279297, "global_step": 202603, "epoch": 2441} {"train_loss": -23.66157341003418, "global_step": 202604, "epoch": 2441} {"train_loss": -23.447233200073242, "global_step": 202605, "epoch": 2441} {"train_loss": -24.219757080078125, "global_step": 202606, "epoch": 2441} {"train_loss": -23.967105865478516, "global_step": 202607, "epoch": 2441} {"train_loss": -23.82796287536621, "global_step": 202608, "epoch": 2441} {"train_loss": -23.838590621948242, "global_step": 202609, "epoch": 2441} {"train_loss": -23.758792877197266, "global_step": 202610, "epoch": 2441} {"train_loss": -24.249713897705078, "global_step": 202611, "epoch": 2441} {"train_loss": -23.654253005981445, "global_step": 202612, "epoch": 2441} {"train_loss": -24.226993560791016, "global_step": 202613, "epoch": 2441} {"train_loss": -24.067432403564453, "global_step": 202614, "epoch": 2441} {"train_loss": -23.611377716064453, "global_step": 202615, "epoch": 2441} {"train_loss": -24.116291046142578, "global_step": 202616, "epoch": 2441} {"train_loss": -23.570730209350586, "global_step": 202617, "epoch": 2441} {"train_loss": -23.91185188293457, "global_step": 202618, "epoch": 2441} {"train_loss": -23.656965255737305, "global_step": 202619, "epoch": 2441} {"train_loss": -23.701099395751953, "global_step": 202620, "epoch": 2441} {"train_loss": -23.95589256286621, "global_step": 202621, "epoch": 2441} {"train_loss": -24.148517608642578, "global_step": 202622, "epoch": 2441} {"train_loss": -23.75065040588379, "global_step": 202623, "epoch": 2441} {"train_loss": -24.311262130737305, "global_step": 202624, "epoch": 2441} {"train_loss": -23.806915283203125, "global_step": 202625, "epoch": 2441} {"train_loss": -23.609779357910156, "global_step": 202626, "epoch": 2441} {"train_loss": -23.996097564697266, "global_step": 202627, "epoch": 2441} {"train_loss": -24.133224487304688, "global_step": 202628, "epoch": 2441} {"train_loss": -24.119796752929688, "global_step": 202629, "epoch": 2441} {"train_loss": -24.217561721801758, "global_step": 202630, "epoch": 2441} {"train_loss": -24.489276885986328, "global_step": 202631, "epoch": 2441} {"train_loss": -24.04167938232422, "global_step": 202632, "epoch": 2441} {"train_loss": -24.490070343017578, "global_step": 202633, "epoch": 2441} {"train_loss": -24.043737411499023, "global_step": 202634, "epoch": 2441} {"train_loss": -24.461732864379883, "global_step": 202635, "epoch": 2441} {"train_loss": -23.993467330932617, "global_step": 202636, "epoch": 2441} {"train_loss": -24.282007217407227, "global_step": 202637, "epoch": 2441} {"train_loss": -24.109933853149414, "global_step": 202638, "epoch": 2441} {"train_loss": -24.165328979492188, "global_step": 202639, "epoch": 2441} {"train_loss": -24.26703453063965, "global_step": 202640, "epoch": 2441} {"train_loss": -24.422943115234375, "global_step": 202641, "epoch": 2441} {"train_loss": -24.245569229125977, "global_step": 202642, "epoch": 2441} {"train_loss": -24.4383487701416, "global_step": 202643, "epoch": 2441} {"train_loss": -24.514780044555664, "global_step": 202644, "epoch": 2441} {"train_loss": -24.38634490966797, "global_step": 202645, "epoch": 2441} {"train_loss": -24.12959098815918, "global_step": 202646, "epoch": 2441} {"train_loss": -24.138656616210938, "global_step": 202647, "epoch": 2441} {"train_loss": -24.581424713134766, "global_step": 202648, "epoch": 2441} {"train_loss": -24.726293563842773, "global_step": 202649, "epoch": 2441} {"train_loss": -24.241058349609375, "global_step": 202650, "epoch": 2441} {"train_loss": -24.77858543395996, "global_step": 202651, "epoch": 2441} {"train_loss": -24.675832748413086, "global_step": 202652, "epoch": 2441} {"train_loss": -24.263925552368164, "global_step": 202653, "epoch": 2441} {"train_loss": -24.13518714904785, "global_step": 202654, "epoch": 2441} {"train_loss": -23.834623336791992, "global_step": 202655, "epoch": 2441} {"train_loss": -23.836597442626953, "global_step": 202656, "epoch": 2441} {"train_loss": -24.141971588134766, "global_step": 202657, "epoch": 2441} {"train_loss": -24.063207626342773, "global_step": 202658, "epoch": 2441} {"train_loss": -24.395095825195312, "global_step": 202659, "epoch": 2441} {"train_loss": -24.31874656677246, "global_step": 202660, "epoch": 2441} {"train_loss": -24.011789321899414, "global_step": 202661, "epoch": 2441} {"train_loss": -24.271047592163086, "global_step": 202662, "epoch": 2441} {"train_loss": -24.378448486328125, "global_step": 202663, "epoch": 2441} {"train_loss": -23.948389053344727, "global_step": 202664, "epoch": 2441} {"train_loss": -23.909048080444336, "global_step": 202665, "epoch": 2441} {"train_loss": -24.324066162109375, "global_step": 202666, "epoch": 2441} {"train_loss": -24.39656639099121, "global_step": 202667, "epoch": 2441} {"train_loss": -24.482372283935547, "global_step": 202668, "epoch": 2441} {"train_loss": -24.455915451049805, "global_step": 202669, "epoch": 2441} {"train_loss": -24.238048553466797, "global_step": 202670, "epoch": 2441} {"train_loss": -24.531354904174805, "global_step": 202671, "epoch": 2441} {"train_loss": -24.13105010986328, "global_step": 202672, "epoch": 2441} {"train_loss": -24.15387725830078, "global_step": 202673, "epoch": 2441} {"train_loss": -24.523845672607422, "global_step": 202674, "epoch": 2441} {"train_loss": -24.14143180847168, "global_step": 202675, "epoch": 2441} {"train_loss": -24.420835494995117, "global_step": 202676, "epoch": 2441} {"train_loss": -24.236042022705078, "global_step": 202677, "epoch": 2441} {"train_loss": -23.950254440307617, "global_step": 202678, "epoch": 2441} {"train_loss": -24.322118759155273, "global_step": 202679, "epoch": 2441} {"train_loss": -24.431257247924805, "global_step": 202680, "epoch": 2441} {"train_loss": -24.132299423217773, "global_step": 202681, "epoch": 2441} {"train_loss": -24.46837043762207, "global_step": 202682, "epoch": 2441} {"train_loss": -23.944276809692383, "global_step": 202683, "epoch": 2441} {"train_loss": -24.030054092407227, "global_step": 202684, "epoch": 2441} {"train_loss": -24.143379579107446, "global_step": 202685, "epoch": 2441, "val_loss": 6654336.0} {"train_loss": -23.24709129333496, "global_step": 202686, "epoch": 2442} {"train_loss": -23.49024772644043, "global_step": 202687, "epoch": 2442} {"train_loss": -24.282196044921875, "global_step": 202688, "epoch": 2442} {"train_loss": -22.986106872558594, "global_step": 202689, "epoch": 2442} {"train_loss": -24.046728134155273, "global_step": 202690, "epoch": 2442} {"train_loss": -23.795629501342773, "global_step": 202691, "epoch": 2442} {"train_loss": -23.715938568115234, "global_step": 202692, "epoch": 2442} {"train_loss": -24.28038215637207, "global_step": 202693, "epoch": 2442} {"train_loss": -24.041940689086914, "global_step": 202694, "epoch": 2442} {"train_loss": -23.84504508972168, "global_step": 202695, "epoch": 2442} {"train_loss": -24.064590454101562, "global_step": 202696, "epoch": 2442} {"train_loss": -24.2553768157959, "global_step": 202697, "epoch": 2442} {"train_loss": -23.909765243530273, "global_step": 202698, "epoch": 2442} {"train_loss": -24.022424697875977, "global_step": 202699, "epoch": 2442} {"train_loss": -23.937528610229492, "global_step": 202700, "epoch": 2442} {"train_loss": -24.126142501831055, "global_step": 202701, "epoch": 2442} {"train_loss": -24.033044815063477, "global_step": 202702, "epoch": 2442} {"train_loss": -24.103139877319336, "global_step": 202703, "epoch": 2442} {"train_loss": -24.266834259033203, "global_step": 202704, "epoch": 2442} {"train_loss": -24.121152877807617, "global_step": 202705, "epoch": 2442} {"train_loss": -24.430551528930664, "global_step": 202706, "epoch": 2442} {"train_loss": -24.136783599853516, "global_step": 202707, "epoch": 2442} {"train_loss": -24.45525550842285, "global_step": 202708, "epoch": 2442} {"train_loss": -24.000732421875, "global_step": 202709, "epoch": 2442} {"train_loss": -23.887672424316406, "global_step": 202710, "epoch": 2442} {"train_loss": -24.4404239654541, "global_step": 202711, "epoch": 2442} {"train_loss": -24.436262130737305, "global_step": 202712, "epoch": 2442} {"train_loss": -24.424530029296875, "global_step": 202713, "epoch": 2442} {"train_loss": -24.334518432617188, "global_step": 202714, "epoch": 2442} {"train_loss": -24.875455856323242, "global_step": 202715, "epoch": 2442} {"train_loss": -24.390140533447266, "global_step": 202716, "epoch": 2442} {"train_loss": -24.369735717773438, "global_step": 202717, "epoch": 2442} {"train_loss": -24.51507568359375, "global_step": 202718, "epoch": 2442} {"train_loss": -24.362796783447266, "global_step": 202719, "epoch": 2442} {"train_loss": -24.52616310119629, "global_step": 202720, "epoch": 2442} {"train_loss": -24.36220932006836, "global_step": 202721, "epoch": 2442} {"train_loss": -24.60444450378418, "global_step": 202722, "epoch": 2442} {"train_loss": -24.250627517700195, "global_step": 202723, "epoch": 2442} {"train_loss": -24.185771942138672, "global_step": 202724, "epoch": 2442} {"train_loss": -24.43545913696289, "global_step": 202725, "epoch": 2442} {"train_loss": -24.152509689331055, "global_step": 202726, "epoch": 2442} {"train_loss": -24.38564109802246, "global_step": 202727, "epoch": 2442} {"train_loss": -23.940431594848633, "global_step": 202728, "epoch": 2442} {"train_loss": -23.71296501159668, "global_step": 202729, "epoch": 2442} {"train_loss": -24.056957244873047, "global_step": 202730, "epoch": 2442} {"train_loss": -24.325468063354492, "global_step": 202731, "epoch": 2442} {"train_loss": -23.56764030456543, "global_step": 202732, "epoch": 2442} {"train_loss": -24.61762809753418, "global_step": 202733, "epoch": 2442} {"train_loss": -23.537633895874023, "global_step": 202734, "epoch": 2442} {"train_loss": -24.299726486206055, "global_step": 202735, "epoch": 2442} {"train_loss": -24.051311492919922, "global_step": 202736, "epoch": 2442} {"train_loss": -24.23469352722168, "global_step": 202737, "epoch": 2442} {"train_loss": -24.324207305908203, "global_step": 202738, "epoch": 2442} {"train_loss": -24.265562057495117, "global_step": 202739, "epoch": 2442} {"train_loss": -24.41793441772461, "global_step": 202740, "epoch": 2442} {"train_loss": -24.095367431640625, "global_step": 202741, "epoch": 2442} {"train_loss": -24.61495018005371, "global_step": 202742, "epoch": 2442} {"train_loss": -23.941781997680664, "global_step": 202743, "epoch": 2442} {"train_loss": -24.441991806030273, "global_step": 202744, "epoch": 2442} {"train_loss": -24.225553512573242, "global_step": 202745, "epoch": 2442} {"train_loss": -24.464147567749023, "global_step": 202746, "epoch": 2442} {"train_loss": -24.26043701171875, "global_step": 202747, "epoch": 2442} {"train_loss": -24.316974639892578, "global_step": 202748, "epoch": 2442} {"train_loss": -24.4309139251709, "global_step": 202749, "epoch": 2442} {"train_loss": -24.398237228393555, "global_step": 202750, "epoch": 2442} {"train_loss": -24.534339904785156, "global_step": 202751, "epoch": 2442} {"train_loss": -24.280893325805664, "global_step": 202752, "epoch": 2442} {"train_loss": -24.485321044921875, "global_step": 202753, "epoch": 2442} {"train_loss": -24.136484146118164, "global_step": 202754, "epoch": 2442} {"train_loss": -24.49554443359375, "global_step": 202755, "epoch": 2442} {"train_loss": -24.293426513671875, "global_step": 202756, "epoch": 2442} {"train_loss": -24.16757583618164, "global_step": 202757, "epoch": 2442} {"train_loss": -24.641244888305664, "global_step": 202758, "epoch": 2442} {"train_loss": -24.471088409423828, "global_step": 202759, "epoch": 2442} {"train_loss": -24.543848037719727, "global_step": 202760, "epoch": 2442} {"train_loss": -24.211544036865234, "global_step": 202761, "epoch": 2442} {"train_loss": -24.125049591064453, "global_step": 202762, "epoch": 2442} {"train_loss": -24.354421615600586, "global_step": 202763, "epoch": 2442} {"train_loss": -24.51429557800293, "global_step": 202764, "epoch": 2442} {"train_loss": -24.167516708374023, "global_step": 202765, "epoch": 2442} {"train_loss": -24.345077514648438, "global_step": 202766, "epoch": 2442} {"train_loss": -24.712209701538086, "global_step": 202767, "epoch": 2442} {"train_loss": -24.215466947440643, "global_step": 202768, "epoch": 2442, "val_loss": 6814904.0} {"train_loss": -23.98115348815918, "global_step": 202769, "epoch": 2443} {"train_loss": -23.52899742126465, "global_step": 202770, "epoch": 2443} {"train_loss": -23.837202072143555, "global_step": 202771, "epoch": 2443} {"train_loss": -23.690174102783203, "global_step": 202772, "epoch": 2443} {"train_loss": -23.503585815429688, "global_step": 202773, "epoch": 2443} {"train_loss": -23.834054946899414, "global_step": 202774, "epoch": 2443} {"train_loss": -23.786039352416992, "global_step": 202775, "epoch": 2443} {"train_loss": -24.002046585083008, "global_step": 202776, "epoch": 2443} {"train_loss": -23.831480026245117, "global_step": 202777, "epoch": 2443} {"train_loss": -24.07429313659668, "global_step": 202778, "epoch": 2443} {"train_loss": -24.239551544189453, "global_step": 202779, "epoch": 2443} {"train_loss": -23.80564308166504, "global_step": 202780, "epoch": 2443} {"train_loss": -23.842206954956055, "global_step": 202781, "epoch": 2443} {"train_loss": -24.475383758544922, "global_step": 202782, "epoch": 2443} {"train_loss": -24.037979125976562, "global_step": 202783, "epoch": 2443} {"train_loss": -24.307483673095703, "global_step": 202784, "epoch": 2443} {"train_loss": -23.660690307617188, "global_step": 202785, "epoch": 2443} {"train_loss": -23.95033836364746, "global_step": 202786, "epoch": 2443} {"train_loss": -24.24759864807129, "global_step": 202787, "epoch": 2443} {"train_loss": -23.695524215698242, "global_step": 202788, "epoch": 2443} {"train_loss": -24.17378807067871, "global_step": 202789, "epoch": 2443} {"train_loss": -23.883325576782227, "global_step": 202790, "epoch": 2443} {"train_loss": -24.023183822631836, "global_step": 202791, "epoch": 2443} {"train_loss": -24.173458099365234, "global_step": 202792, "epoch": 2443} {"train_loss": -23.86274528503418, "global_step": 202793, "epoch": 2443} {"train_loss": -24.0272216796875, "global_step": 202794, "epoch": 2443} {"train_loss": -24.00409698486328, "global_step": 202795, "epoch": 2443} {"train_loss": -24.151884078979492, "global_step": 202796, "epoch": 2443} {"train_loss": -24.099740982055664, "global_step": 202797, "epoch": 2443} {"train_loss": -24.355390548706055, "global_step": 202798, "epoch": 2443} {"train_loss": -24.15847396850586, "global_step": 202799, "epoch": 2443} {"train_loss": -24.010303497314453, "global_step": 202800, "epoch": 2443} {"train_loss": -23.9942626953125, "global_step": 202801, "epoch": 2443} {"train_loss": -24.583005905151367, "global_step": 202802, "epoch": 2443} {"train_loss": -24.39955711364746, "global_step": 202803, "epoch": 2443} {"train_loss": -24.524707794189453, "global_step": 202804, "epoch": 2443} {"train_loss": -24.226652145385742, "global_step": 202805, "epoch": 2443} {"train_loss": -24.455724716186523, "global_step": 202806, "epoch": 2443} {"train_loss": -24.6506404876709, "global_step": 202807, "epoch": 2443} {"train_loss": -24.361682891845703, "global_step": 202808, "epoch": 2443} {"train_loss": -24.429365158081055, "global_step": 202809, "epoch": 2443} {"train_loss": -24.248138427734375, "global_step": 202810, "epoch": 2443} {"train_loss": -24.34250259399414, "global_step": 202811, "epoch": 2443} {"train_loss": -24.325092315673828, "global_step": 202812, "epoch": 2443} {"train_loss": -24.204912185668945, "global_step": 202813, "epoch": 2443} {"train_loss": -24.538087844848633, "global_step": 202814, "epoch": 2443} {"train_loss": -24.791889190673828, "global_step": 202815, "epoch": 2443} {"train_loss": -24.661663055419922, "global_step": 202816, "epoch": 2443} {"train_loss": -24.38068962097168, "global_step": 202817, "epoch": 2443} {"train_loss": -24.3250789642334, "global_step": 202818, "epoch": 2443} {"train_loss": -24.2316951751709, "global_step": 202819, "epoch": 2443} {"train_loss": -24.47709083557129, "global_step": 202820, "epoch": 2443} {"train_loss": -24.1953125, "global_step": 202821, "epoch": 2443} {"train_loss": -24.372495651245117, "global_step": 202822, "epoch": 2443} {"train_loss": -24.79190444946289, "global_step": 202823, "epoch": 2443} {"train_loss": -24.331480026245117, "global_step": 202824, "epoch": 2443} {"train_loss": -24.384456634521484, "global_step": 202825, "epoch": 2443} {"train_loss": -24.47256088256836, "global_step": 202826, "epoch": 2443} {"train_loss": -24.519590377807617, "global_step": 202827, "epoch": 2443} {"train_loss": -24.51593589782715, "global_step": 202828, "epoch": 2443} {"train_loss": -24.297916412353516, "global_step": 202829, "epoch": 2443} {"train_loss": -24.517011642456055, "global_step": 202830, "epoch": 2443} {"train_loss": -24.174915313720703, "global_step": 202831, "epoch": 2443} {"train_loss": -24.222679138183594, "global_step": 202832, "epoch": 2443} {"train_loss": -24.476760864257812, "global_step": 202833, "epoch": 2443} {"train_loss": -24.422622680664062, "global_step": 202834, "epoch": 2443} {"train_loss": -24.45365333557129, "global_step": 202835, "epoch": 2443} {"train_loss": -24.698753356933594, "global_step": 202836, "epoch": 2443} {"train_loss": -24.46124839782715, "global_step": 202837, "epoch": 2443} {"train_loss": -24.299795150756836, "global_step": 202838, "epoch": 2443} {"train_loss": -24.372251510620117, "global_step": 202839, "epoch": 2443} {"train_loss": -24.39434814453125, "global_step": 202840, "epoch": 2443} {"train_loss": -24.56785011291504, "global_step": 202841, "epoch": 2443} {"train_loss": -24.18491554260254, "global_step": 202842, "epoch": 2443} {"train_loss": -24.72681999206543, "global_step": 202843, "epoch": 2443} {"train_loss": -24.48697280883789, "global_step": 202844, "epoch": 2443} {"train_loss": -24.18086051940918, "global_step": 202845, "epoch": 2443} {"train_loss": -24.7623348236084, "global_step": 202846, "epoch": 2443} {"train_loss": -24.39468765258789, "global_step": 202847, "epoch": 2443} {"train_loss": -24.631187438964844, "global_step": 202848, "epoch": 2443} {"train_loss": -23.883132934570312, "global_step": 202849, "epoch": 2443} {"train_loss": -24.140378952026367, "global_step": 202850, "epoch": 2443} {"train_loss": -24.246791012315864, "global_step": 202851, "epoch": 2443, "val_loss": 6574697.0} {"train_loss": -23.46677589416504, "global_step": 202852, "epoch": 2444} {"train_loss": -23.2957706451416, "global_step": 202853, "epoch": 2444} {"train_loss": -23.91730499267578, "global_step": 202854, "epoch": 2444} {"train_loss": -23.469039916992188, "global_step": 202855, "epoch": 2444} {"train_loss": -23.917261123657227, "global_step": 202856, "epoch": 2444} {"train_loss": -23.683391571044922, "global_step": 202857, "epoch": 2444} {"train_loss": -23.89874267578125, "global_step": 202858, "epoch": 2444} {"train_loss": -23.629051208496094, "global_step": 202859, "epoch": 2444} {"train_loss": -23.939533233642578, "global_step": 202860, "epoch": 2444} {"train_loss": -23.694589614868164, "global_step": 202861, "epoch": 2444} {"train_loss": -23.725069046020508, "global_step": 202862, "epoch": 2444} {"train_loss": -24.05167579650879, "global_step": 202863, "epoch": 2444} {"train_loss": -23.721906661987305, "global_step": 202864, "epoch": 2444} {"train_loss": -24.247621536254883, "global_step": 202865, "epoch": 2444} {"train_loss": -24.08601951599121, "global_step": 202866, "epoch": 2444} {"train_loss": -24.24554443359375, "global_step": 202867, "epoch": 2444} {"train_loss": -23.835893630981445, "global_step": 202868, "epoch": 2444} {"train_loss": -24.140653610229492, "global_step": 202869, "epoch": 2444} {"train_loss": -24.248647689819336, "global_step": 202870, "epoch": 2444} {"train_loss": -24.07101821899414, "global_step": 202871, "epoch": 2444} {"train_loss": -23.834644317626953, "global_step": 202872, "epoch": 2444} {"train_loss": -23.712238311767578, "global_step": 202873, "epoch": 2444} {"train_loss": -23.850505828857422, "global_step": 202874, "epoch": 2444} {"train_loss": -24.459623336791992, "global_step": 202875, "epoch": 2444} {"train_loss": -24.31534194946289, "global_step": 202876, "epoch": 2444} {"train_loss": -24.057830810546875, "global_step": 202877, "epoch": 2444} {"train_loss": -24.015766143798828, "global_step": 202878, "epoch": 2444} {"train_loss": -24.134754180908203, "global_step": 202879, "epoch": 2444} {"train_loss": -24.124736785888672, "global_step": 202880, "epoch": 2444} {"train_loss": -24.223159790039062, "global_step": 202881, "epoch": 2444} {"train_loss": -24.670639038085938, "global_step": 202882, "epoch": 2444} {"train_loss": -24.168548583984375, "global_step": 202883, "epoch": 2444} {"train_loss": -24.456012725830078, "global_step": 202884, "epoch": 2444} {"train_loss": -24.363304138183594, "global_step": 202885, "epoch": 2444} {"train_loss": -24.150205612182617, "global_step": 202886, "epoch": 2444} {"train_loss": -24.168912887573242, "global_step": 202887, "epoch": 2444} {"train_loss": -24.451370239257812, "global_step": 202888, "epoch": 2444} {"train_loss": -24.653411865234375, "global_step": 202889, "epoch": 2444} {"train_loss": -24.45006561279297, "global_step": 202890, "epoch": 2444} {"train_loss": -24.574817657470703, "global_step": 202891, "epoch": 2444} {"train_loss": -24.652326583862305, "global_step": 202892, "epoch": 2444} {"train_loss": -24.35890769958496, "global_step": 202893, "epoch": 2444} {"train_loss": -24.540157318115234, "global_step": 202894, "epoch": 2444} {"train_loss": -24.404434204101562, "global_step": 202895, "epoch": 2444} {"train_loss": -24.311941146850586, "global_step": 202896, "epoch": 2444} {"train_loss": -24.73737907409668, "global_step": 202897, "epoch": 2444} {"train_loss": -24.249618530273438, "global_step": 202898, "epoch": 2444} {"train_loss": -23.985158920288086, "global_step": 202899, "epoch": 2444} {"train_loss": -24.305627822875977, "global_step": 202900, "epoch": 2444} {"train_loss": -24.20966148376465, "global_step": 202901, "epoch": 2444} {"train_loss": -23.912687301635742, "global_step": 202902, "epoch": 2444} {"train_loss": -24.260501861572266, "global_step": 202903, "epoch": 2444} {"train_loss": -24.218217849731445, "global_step": 202904, "epoch": 2444} {"train_loss": -24.3723201751709, "global_step": 202905, "epoch": 2444} {"train_loss": -23.905540466308594, "global_step": 202906, "epoch": 2444} {"train_loss": -24.311681747436523, "global_step": 202907, "epoch": 2444} {"train_loss": -24.110464096069336, "global_step": 202908, "epoch": 2444} {"train_loss": -24.341455459594727, "global_step": 202909, "epoch": 2444} {"train_loss": -24.290668487548828, "global_step": 202910, "epoch": 2444} {"train_loss": -24.023481369018555, "global_step": 202911, "epoch": 2444} {"train_loss": -24.140043258666992, "global_step": 202912, "epoch": 2444} {"train_loss": -24.010488510131836, "global_step": 202913, "epoch": 2444} {"train_loss": -24.529571533203125, "global_step": 202914, "epoch": 2444} {"train_loss": -24.36244010925293, "global_step": 202915, "epoch": 2444} {"train_loss": -24.220258712768555, "global_step": 202916, "epoch": 2444} {"train_loss": -24.20469093322754, "global_step": 202917, "epoch": 2444} {"train_loss": -24.23941421508789, "global_step": 202918, "epoch": 2444} {"train_loss": -24.488842010498047, "global_step": 202919, "epoch": 2444} {"train_loss": -24.244070053100586, "global_step": 202920, "epoch": 2444} {"train_loss": -24.30952262878418, "global_step": 202921, "epoch": 2444} {"train_loss": -23.518957138061523, "global_step": 202922, "epoch": 2444} {"train_loss": -24.305612564086914, "global_step": 202923, "epoch": 2444} {"train_loss": -24.183958053588867, "global_step": 202924, "epoch": 2444} {"train_loss": -24.172283172607422, "global_step": 202925, "epoch": 2444} {"train_loss": -24.381071090698242, "global_step": 202926, "epoch": 2444} {"train_loss": -24.371206283569336, "global_step": 202927, "epoch": 2444} {"train_loss": -24.19965362548828, "global_step": 202928, "epoch": 2444} {"train_loss": -24.360877990722656, "global_step": 202929, "epoch": 2444} {"train_loss": -24.495532989501953, "global_step": 202930, "epoch": 2444} {"train_loss": -24.54783058166504, "global_step": 202931, "epoch": 2444} {"train_loss": -24.228452682495117, "global_step": 202932, "epoch": 2444} {"train_loss": -24.561126708984375, "global_step": 202933, "epoch": 2444} {"train_loss": -24.16488054574254, "global_step": 202934, "epoch": 2444, "val_loss": 6517433.0} {"train_loss": -24.52630615234375, "global_step": 202935, "epoch": 2445} {"train_loss": -24.129947662353516, "global_step": 202936, "epoch": 2445} {"train_loss": -24.129396438598633, "global_step": 202937, "epoch": 2445} {"train_loss": -24.402437210083008, "global_step": 202938, "epoch": 2445} {"train_loss": -24.446308135986328, "global_step": 202939, "epoch": 2445} {"train_loss": -23.9022216796875, "global_step": 202940, "epoch": 2445} {"train_loss": -24.20611000061035, "global_step": 202941, "epoch": 2445} {"train_loss": -24.088464736938477, "global_step": 202942, "epoch": 2445} {"train_loss": -24.432392120361328, "global_step": 202943, "epoch": 2445} {"train_loss": -24.15511703491211, "global_step": 202944, "epoch": 2445} {"train_loss": -24.300050735473633, "global_step": 202945, "epoch": 2445} {"train_loss": -24.547592163085938, "global_step": 202946, "epoch": 2445} {"train_loss": -24.45635986328125, "global_step": 202947, "epoch": 2445} {"train_loss": -24.170856475830078, "global_step": 202948, "epoch": 2445} {"train_loss": -24.608572006225586, "global_step": 202949, "epoch": 2445} {"train_loss": -24.152151107788086, "global_step": 202950, "epoch": 2445} {"train_loss": -24.579092025756836, "global_step": 202951, "epoch": 2445} {"train_loss": -24.173452377319336, "global_step": 202952, "epoch": 2445} {"train_loss": -24.2247314453125, "global_step": 202953, "epoch": 2445} {"train_loss": -24.397687911987305, "global_step": 202954, "epoch": 2445} {"train_loss": -24.71718406677246, "global_step": 202955, "epoch": 2445} {"train_loss": -24.201261520385742, "global_step": 202956, "epoch": 2445} {"train_loss": -24.039691925048828, "global_step": 202957, "epoch": 2445} {"train_loss": -24.212459564208984, "global_step": 202958, "epoch": 2445} {"train_loss": -24.1203670501709, "global_step": 202959, "epoch": 2445} {"train_loss": -24.105592727661133, "global_step": 202960, "epoch": 2445} {"train_loss": -24.675451278686523, "global_step": 202961, "epoch": 2445} {"train_loss": -24.093067169189453, "global_step": 202962, "epoch": 2445} {"train_loss": -24.209890365600586, "global_step": 202963, "epoch": 2445} {"train_loss": -24.343427658081055, "global_step": 202964, "epoch": 2445} {"train_loss": -24.98733901977539, "global_step": 202965, "epoch": 2445} {"train_loss": -24.215133666992188, "global_step": 202966, "epoch": 2445} {"train_loss": -24.155241012573242, "global_step": 202967, "epoch": 2445} {"train_loss": -24.530811309814453, "global_step": 202968, "epoch": 2445} {"train_loss": -24.281139373779297, "global_step": 202969, "epoch": 2445} {"train_loss": -24.387720108032227, "global_step": 202970, "epoch": 2445} {"train_loss": -24.2100830078125, "global_step": 202971, "epoch": 2445} {"train_loss": -24.201385498046875, "global_step": 202972, "epoch": 2445} {"train_loss": -24.42951774597168, "global_step": 202973, "epoch": 2445} {"train_loss": -24.1428279876709, "global_step": 202974, "epoch": 2445} {"train_loss": -24.53550148010254, "global_step": 202975, "epoch": 2445} {"train_loss": -24.210594177246094, "global_step": 202976, "epoch": 2445} {"train_loss": -24.337461471557617, "global_step": 202977, "epoch": 2445} {"train_loss": -24.310461044311523, "global_step": 202978, "epoch": 2445} {"train_loss": -24.512737274169922, "global_step": 202979, "epoch": 2445} {"train_loss": -24.18416404724121, "global_step": 202980, "epoch": 2445} {"train_loss": -24.049917221069336, "global_step": 202981, "epoch": 2445} {"train_loss": -24.301979064941406, "global_step": 202982, "epoch": 2445} {"train_loss": -24.518781661987305, "global_step": 202983, "epoch": 2445} {"train_loss": -24.181049346923828, "global_step": 202984, "epoch": 2445} {"train_loss": -24.097749710083008, "global_step": 202985, "epoch": 2445} {"train_loss": -24.0709228515625, "global_step": 202986, "epoch": 2445} {"train_loss": -24.37908363342285, "global_step": 202987, "epoch": 2445} {"train_loss": -24.71646499633789, "global_step": 202988, "epoch": 2445} {"train_loss": -24.35999870300293, "global_step": 202989, "epoch": 2445} {"train_loss": -24.268644332885742, "global_step": 202990, "epoch": 2445} {"train_loss": -24.326536178588867, "global_step": 202991, "epoch": 2445} {"train_loss": -24.424951553344727, "global_step": 202992, "epoch": 2445} {"train_loss": -24.204059600830078, "global_step": 202993, "epoch": 2445} {"train_loss": -24.582372665405273, "global_step": 202994, "epoch": 2445} {"train_loss": -24.517454147338867, "global_step": 202995, "epoch": 2445} {"train_loss": -24.52889633178711, "global_step": 202996, "epoch": 2445} {"train_loss": -24.43705940246582, "global_step": 202997, "epoch": 2445} {"train_loss": -24.52943229675293, "global_step": 202998, "epoch": 2445} {"train_loss": -24.522958755493164, "global_step": 202999, "epoch": 2445} {"train_loss": -24.240238189697266, "global_step": 203000, "epoch": 2445} {"train_loss": -24.344079971313477, "global_step": 203001, "epoch": 2445} {"train_loss": -24.138965606689453, "global_step": 203002, "epoch": 2445} {"train_loss": -24.173038482666016, "global_step": 203003, "epoch": 2445} {"train_loss": -24.459314346313477, "global_step": 203004, "epoch": 2445} {"train_loss": -24.34221839904785, "global_step": 203005, "epoch": 2445} {"train_loss": -24.488262176513672, "global_step": 203006, "epoch": 2445} {"train_loss": -24.588043212890625, "global_step": 203007, "epoch": 2445} {"train_loss": -24.729244232177734, "global_step": 203008, "epoch": 2445} {"train_loss": -23.953908920288086, "global_step": 203009, "epoch": 2445} {"train_loss": -24.001462936401367, "global_step": 203010, "epoch": 2445} {"train_loss": -24.323986053466797, "global_step": 203011, "epoch": 2445} {"train_loss": -24.1838436126709, "global_step": 203012, "epoch": 2445} {"train_loss": -24.058441162109375, "global_step": 203013, "epoch": 2445} {"train_loss": -23.985830307006836, "global_step": 203014, "epoch": 2445} {"train_loss": -24.372303009033203, "global_step": 203015, "epoch": 2445} {"train_loss": -24.308263778686523, "global_step": 203016, "epoch": 2445} {"train_loss": -24.311915684895343, "global_step": 203017, "epoch": 2445, "val_loss": 6659009.0} {"train_loss": -23.742284774780273, "global_step": 203018, "epoch": 2446} {"train_loss": -23.73392105102539, "global_step": 203019, "epoch": 2446} {"train_loss": -24.09103775024414, "global_step": 203020, "epoch": 2446} {"train_loss": -23.650314331054688, "global_step": 203021, "epoch": 2446} {"train_loss": -24.00579833984375, "global_step": 203022, "epoch": 2446} {"train_loss": -23.835111618041992, "global_step": 203023, "epoch": 2446} {"train_loss": -23.789831161499023, "global_step": 203024, "epoch": 2446} {"train_loss": -23.574050903320312, "global_step": 203025, "epoch": 2446} {"train_loss": -23.981082916259766, "global_step": 203026, "epoch": 2446} {"train_loss": -23.919666290283203, "global_step": 203027, "epoch": 2446} {"train_loss": -23.434097290039062, "global_step": 203028, "epoch": 2446} {"train_loss": -24.443281173706055, "global_step": 203029, "epoch": 2446} {"train_loss": -24.111040115356445, "global_step": 203030, "epoch": 2446} {"train_loss": -24.206012725830078, "global_step": 203031, "epoch": 2446} {"train_loss": -24.284570693969727, "global_step": 203032, "epoch": 2446} {"train_loss": -23.855815887451172, "global_step": 203033, "epoch": 2446} {"train_loss": -24.17160987854004, "global_step": 203034, "epoch": 2446} {"train_loss": -24.661367416381836, "global_step": 203035, "epoch": 2446} {"train_loss": -24.53389549255371, "global_step": 203036, "epoch": 2446} {"train_loss": -24.299043655395508, "global_step": 203037, "epoch": 2446} {"train_loss": -24.27901840209961, "global_step": 203038, "epoch": 2446} {"train_loss": -24.316099166870117, "global_step": 203039, "epoch": 2446} {"train_loss": -24.500640869140625, "global_step": 203040, "epoch": 2446} {"train_loss": -24.57671546936035, "global_step": 203041, "epoch": 2446} {"train_loss": -24.782920837402344, "global_step": 203042, "epoch": 2446} {"train_loss": -24.218719482421875, "global_step": 203043, "epoch": 2446} {"train_loss": -24.239648818969727, "global_step": 203044, "epoch": 2446} {"train_loss": -24.224822998046875, "global_step": 203045, "epoch": 2446} {"train_loss": -24.459732055664062, "global_step": 203046, "epoch": 2446} {"train_loss": -24.349655151367188, "global_step": 203047, "epoch": 2446} {"train_loss": -24.62734031677246, "global_step": 203048, "epoch": 2446} {"train_loss": -23.96101951599121, "global_step": 203049, "epoch": 2446} {"train_loss": -24.301319122314453, "global_step": 203050, "epoch": 2446} {"train_loss": -24.575763702392578, "global_step": 203051, "epoch": 2446} {"train_loss": -24.077939987182617, "global_step": 203052, "epoch": 2446} {"train_loss": -24.186941146850586, "global_step": 203053, "epoch": 2446} {"train_loss": -24.352659225463867, "global_step": 203054, "epoch": 2446} {"train_loss": -24.11452293395996, "global_step": 203055, "epoch": 2446} {"train_loss": -24.202878952026367, "global_step": 203056, "epoch": 2446} {"train_loss": -24.309356689453125, "global_step": 203057, "epoch": 2446} {"train_loss": -24.371196746826172, "global_step": 203058, "epoch": 2446} {"train_loss": -24.289339065551758, "global_step": 203059, "epoch": 2446} {"train_loss": -24.36211585998535, "global_step": 203060, "epoch": 2446} {"train_loss": -24.514577865600586, "global_step": 203061, "epoch": 2446} {"train_loss": -24.06930923461914, "global_step": 203062, "epoch": 2446} {"train_loss": -24.187917709350586, "global_step": 203063, "epoch": 2446} {"train_loss": -24.236600875854492, "global_step": 203064, "epoch": 2446} {"train_loss": -24.785551071166992, "global_step": 203065, "epoch": 2446} {"train_loss": -24.3886775970459, "global_step": 203066, "epoch": 2446} {"train_loss": -24.354543685913086, "global_step": 203067, "epoch": 2446} {"train_loss": -24.362014770507812, "global_step": 203068, "epoch": 2446} {"train_loss": -23.858062744140625, "global_step": 203069, "epoch": 2446} {"train_loss": -23.72035789489746, "global_step": 203070, "epoch": 2446} {"train_loss": -23.826738357543945, "global_step": 203071, "epoch": 2446} {"train_loss": -23.59895133972168, "global_step": 203072, "epoch": 2446} {"train_loss": -23.770095825195312, "global_step": 203073, "epoch": 2446} {"train_loss": -24.33071517944336, "global_step": 203074, "epoch": 2446} {"train_loss": -24.353042602539062, "global_step": 203075, "epoch": 2446} {"train_loss": -23.980854034423828, "global_step": 203076, "epoch": 2446} {"train_loss": -24.488788604736328, "global_step": 203077, "epoch": 2446} {"train_loss": -24.408418655395508, "global_step": 203078, "epoch": 2446} {"train_loss": -24.24713134765625, "global_step": 203079, "epoch": 2446} {"train_loss": -24.481428146362305, "global_step": 203080, "epoch": 2446} {"train_loss": -24.155364990234375, "global_step": 203081, "epoch": 2446} {"train_loss": -24.421043395996094, "global_step": 203082, "epoch": 2446} {"train_loss": -24.299869537353516, "global_step": 203083, "epoch": 2446} {"train_loss": -24.442033767700195, "global_step": 203084, "epoch": 2446} {"train_loss": -24.12828826904297, "global_step": 203085, "epoch": 2446} {"train_loss": -24.212324142456055, "global_step": 203086, "epoch": 2446} {"train_loss": -24.308134078979492, "global_step": 203087, "epoch": 2446} {"train_loss": -24.453195571899414, "global_step": 203088, "epoch": 2446} {"train_loss": -24.37176513671875, "global_step": 203089, "epoch": 2446} {"train_loss": -24.34797477722168, "global_step": 203090, "epoch": 2446} {"train_loss": -24.621463775634766, "global_step": 203091, "epoch": 2446} {"train_loss": -24.37738609313965, "global_step": 203092, "epoch": 2446} {"train_loss": -24.539939880371094, "global_step": 203093, "epoch": 2446} {"train_loss": -24.37554931640625, "global_step": 203094, "epoch": 2446} {"train_loss": -24.463912963867188, "global_step": 203095, "epoch": 2446} {"train_loss": -24.417097091674805, "global_step": 203096, "epoch": 2446} {"train_loss": -24.247121810913086, "global_step": 203097, "epoch": 2446} {"train_loss": -24.607824325561523, "global_step": 203098, "epoch": 2446} {"train_loss": -24.524328231811523, "global_step": 203099, "epoch": 2446} {"train_loss": -24.254431965839434, "global_step": 203100, "epoch": 2446, "val_loss": 6595969.0} {"train_loss": -24.305253982543945, "global_step": 203101, "epoch": 2447} {"train_loss": -23.914222717285156, "global_step": 203102, "epoch": 2447} {"train_loss": -24.00569725036621, "global_step": 203103, "epoch": 2447} {"train_loss": -23.82416343688965, "global_step": 203104, "epoch": 2447} {"train_loss": -24.02499771118164, "global_step": 203105, "epoch": 2447} {"train_loss": -23.901220321655273, "global_step": 203106, "epoch": 2447} {"train_loss": -23.963098526000977, "global_step": 203107, "epoch": 2447} {"train_loss": -23.772642135620117, "global_step": 203108, "epoch": 2447} {"train_loss": -24.03293800354004, "global_step": 203109, "epoch": 2447} {"train_loss": -24.26399803161621, "global_step": 203110, "epoch": 2447} {"train_loss": -23.857009887695312, "global_step": 203111, "epoch": 2447} {"train_loss": -23.878034591674805, "global_step": 203112, "epoch": 2447} {"train_loss": -24.148666381835938, "global_step": 203113, "epoch": 2447} {"train_loss": -23.89076805114746, "global_step": 203114, "epoch": 2447} {"train_loss": -24.069395065307617, "global_step": 203115, "epoch": 2447} {"train_loss": -23.97202491760254, "global_step": 203116, "epoch": 2447} {"train_loss": -24.168363571166992, "global_step": 203117, "epoch": 2447} {"train_loss": -24.129058837890625, "global_step": 203118, "epoch": 2447} {"train_loss": -24.019596099853516, "global_step": 203119, "epoch": 2447} {"train_loss": -24.18037223815918, "global_step": 203120, "epoch": 2447} {"train_loss": -24.252944946289062, "global_step": 203121, "epoch": 2447} {"train_loss": -24.28242301940918, "global_step": 203122, "epoch": 2447} {"train_loss": -23.802932739257812, "global_step": 203123, "epoch": 2447} {"train_loss": -24.177976608276367, "global_step": 203124, "epoch": 2447} {"train_loss": -24.262985229492188, "global_step": 203125, "epoch": 2447} {"train_loss": -24.495588302612305, "global_step": 203126, "epoch": 2447} {"train_loss": -24.319259643554688, "global_step": 203127, "epoch": 2447} {"train_loss": -24.36563491821289, "global_step": 203128, "epoch": 2447} {"train_loss": -24.062822341918945, "global_step": 203129, "epoch": 2447} {"train_loss": -24.378273010253906, "global_step": 203130, "epoch": 2447} {"train_loss": -24.283361434936523, "global_step": 203131, "epoch": 2447} {"train_loss": -24.327743530273438, "global_step": 203132, "epoch": 2447} {"train_loss": -24.41573143005371, "global_step": 203133, "epoch": 2447} {"train_loss": -24.149871826171875, "global_step": 203134, "epoch": 2447} {"train_loss": -24.203323364257812, "global_step": 203135, "epoch": 2447} {"train_loss": -24.448209762573242, "global_step": 203136, "epoch": 2447} {"train_loss": -24.24494743347168, "global_step": 203137, "epoch": 2447} {"train_loss": -24.29429054260254, "global_step": 203138, "epoch": 2447} {"train_loss": -24.502384185791016, "global_step": 203139, "epoch": 2447} {"train_loss": -24.545862197875977, "global_step": 203140, "epoch": 2447} {"train_loss": -24.449216842651367, "global_step": 203141, "epoch": 2447} {"train_loss": -24.715051651000977, "global_step": 203142, "epoch": 2447} {"train_loss": -24.425769805908203, "global_step": 203143, "epoch": 2447} {"train_loss": -24.71875, "global_step": 203144, "epoch": 2447} {"train_loss": -24.160680770874023, "global_step": 203145, "epoch": 2447} {"train_loss": -24.846921920776367, "global_step": 203146, "epoch": 2447} {"train_loss": -24.409748077392578, "global_step": 203147, "epoch": 2447} {"train_loss": -23.893510818481445, "global_step": 203148, "epoch": 2447} {"train_loss": -24.19932746887207, "global_step": 203149, "epoch": 2447} {"train_loss": -24.037761688232422, "global_step": 203150, "epoch": 2447} {"train_loss": -24.028074264526367, "global_step": 203151, "epoch": 2447} {"train_loss": -24.37196159362793, "global_step": 203152, "epoch": 2447} {"train_loss": -24.00279998779297, "global_step": 203153, "epoch": 2447} {"train_loss": -24.502180099487305, "global_step": 203154, "epoch": 2447} {"train_loss": -24.102590560913086, "global_step": 203155, "epoch": 2447} {"train_loss": -24.41053581237793, "global_step": 203156, "epoch": 2447} {"train_loss": -24.400053024291992, "global_step": 203157, "epoch": 2447} {"train_loss": -24.166732788085938, "global_step": 203158, "epoch": 2447} {"train_loss": -24.114856719970703, "global_step": 203159, "epoch": 2447} {"train_loss": -24.234392166137695, "global_step": 203160, "epoch": 2447} {"train_loss": -24.440826416015625, "global_step": 203161, "epoch": 2447} {"train_loss": -24.332794189453125, "global_step": 203162, "epoch": 2447} {"train_loss": -24.066640853881836, "global_step": 203163, "epoch": 2447} {"train_loss": -24.096006393432617, "global_step": 203164, "epoch": 2447} {"train_loss": -24.415149688720703, "global_step": 203165, "epoch": 2447} {"train_loss": -24.214658737182617, "global_step": 203166, "epoch": 2447} {"train_loss": -24.24677848815918, "global_step": 203167, "epoch": 2447} {"train_loss": -23.703039169311523, "global_step": 203168, "epoch": 2447} {"train_loss": -24.013120651245117, "global_step": 203169, "epoch": 2447} {"train_loss": -24.43372917175293, "global_step": 203170, "epoch": 2447} {"train_loss": -24.187166213989258, "global_step": 203171, "epoch": 2447} {"train_loss": -24.179105758666992, "global_step": 203172, "epoch": 2447} {"train_loss": -24.51650619506836, "global_step": 203173, "epoch": 2447} {"train_loss": -24.263076782226562, "global_step": 203174, "epoch": 2447} {"train_loss": -24.50079345703125, "global_step": 203175, "epoch": 2447} {"train_loss": -24.19244384765625, "global_step": 203176, "epoch": 2447} {"train_loss": -24.346662521362305, "global_step": 203177, "epoch": 2447} {"train_loss": -24.328556060791016, "global_step": 203178, "epoch": 2447} {"train_loss": -24.349889755249023, "global_step": 203179, "epoch": 2447} {"train_loss": -24.486316680908203, "global_step": 203180, "epoch": 2447} {"train_loss": -24.318639755249023, "global_step": 203181, "epoch": 2447} {"train_loss": -24.236841201782227, "global_step": 203182, "epoch": 2447} {"train_loss": -24.24200880671122, "global_step": 203183, "epoch": 2447, "val_loss": 6607308.5} {"train_loss": -23.87325096130371, "global_step": 203184, "epoch": 2448} {"train_loss": -23.947742462158203, "global_step": 203185, "epoch": 2448} {"train_loss": -23.804893493652344, "global_step": 203186, "epoch": 2448} {"train_loss": -24.19391441345215, "global_step": 203187, "epoch": 2448} {"train_loss": -24.386701583862305, "global_step": 203188, "epoch": 2448} {"train_loss": -23.93478775024414, "global_step": 203189, "epoch": 2448} {"train_loss": -24.613004684448242, "global_step": 203190, "epoch": 2448} {"train_loss": -23.87982177734375, "global_step": 203191, "epoch": 2448} {"train_loss": -24.035062789916992, "global_step": 203192, "epoch": 2448} {"train_loss": -23.924667358398438, "global_step": 203193, "epoch": 2448} {"train_loss": -24.134193420410156, "global_step": 203194, "epoch": 2448} {"train_loss": -24.3500919342041, "global_step": 203195, "epoch": 2448} {"train_loss": -24.398664474487305, "global_step": 203196, "epoch": 2448} {"train_loss": -24.084989547729492, "global_step": 203197, "epoch": 2448} {"train_loss": -24.03476333618164, "global_step": 203198, "epoch": 2448} {"train_loss": -24.003019332885742, "global_step": 203199, "epoch": 2448} {"train_loss": -24.22792625427246, "global_step": 203200, "epoch": 2448} {"train_loss": -24.7486629486084, "global_step": 203201, "epoch": 2448} {"train_loss": -24.40012550354004, "global_step": 203202, "epoch": 2448} {"train_loss": -24.425384521484375, "global_step": 203203, "epoch": 2448} {"train_loss": -24.339303970336914, "global_step": 203204, "epoch": 2448} {"train_loss": -24.189334869384766, "global_step": 203205, "epoch": 2448} {"train_loss": -24.217456817626953, "global_step": 203206, "epoch": 2448} {"train_loss": -24.57366371154785, "global_step": 203207, "epoch": 2448} {"train_loss": -24.643234252929688, "global_step": 203208, "epoch": 2448} {"train_loss": -24.269773483276367, "global_step": 203209, "epoch": 2448} {"train_loss": -24.177413940429688, "global_step": 203210, "epoch": 2448} {"train_loss": -24.025983810424805, "global_step": 203211, "epoch": 2448} {"train_loss": -24.515024185180664, "global_step": 203212, "epoch": 2448} {"train_loss": -23.934131622314453, "global_step": 203213, "epoch": 2448} {"train_loss": -24.540828704833984, "global_step": 203214, "epoch": 2448} {"train_loss": -24.453853607177734, "global_step": 203215, "epoch": 2448} {"train_loss": -24.408926010131836, "global_step": 203216, "epoch": 2448} {"train_loss": -24.429075241088867, "global_step": 203217, "epoch": 2448} {"train_loss": -24.355804443359375, "global_step": 203218, "epoch": 2448} {"train_loss": -24.292760848999023, "global_step": 203219, "epoch": 2448} {"train_loss": -24.250303268432617, "global_step": 203220, "epoch": 2448} {"train_loss": -24.136119842529297, "global_step": 203221, "epoch": 2448} {"train_loss": -24.061481475830078, "global_step": 203222, "epoch": 2448} {"train_loss": -24.603750228881836, "global_step": 203223, "epoch": 2448} {"train_loss": -24.03449821472168, "global_step": 203224, "epoch": 2448} {"train_loss": -24.12403678894043, "global_step": 203225, "epoch": 2448} {"train_loss": -24.404874801635742, "global_step": 203226, "epoch": 2448} {"train_loss": -24.12346839904785, "global_step": 203227, "epoch": 2448} {"train_loss": -24.14727783203125, "global_step": 203228, "epoch": 2448} {"train_loss": -24.245576858520508, "global_step": 203229, "epoch": 2448} {"train_loss": -24.475088119506836, "global_step": 203230, "epoch": 2448} {"train_loss": -24.39078712463379, "global_step": 203231, "epoch": 2448} {"train_loss": -24.481475830078125, "global_step": 203232, "epoch": 2448} {"train_loss": -24.49315643310547, "global_step": 203233, "epoch": 2448} {"train_loss": -24.47372817993164, "global_step": 203234, "epoch": 2448} {"train_loss": -23.84554100036621, "global_step": 203235, "epoch": 2448} {"train_loss": -24.12950897216797, "global_step": 203236, "epoch": 2448} {"train_loss": -24.9728946685791, "global_step": 203237, "epoch": 2448} {"train_loss": -24.356069564819336, "global_step": 203238, "epoch": 2448} {"train_loss": -24.407150268554688, "global_step": 203239, "epoch": 2448} {"train_loss": -24.304807662963867, "global_step": 203240, "epoch": 2448} {"train_loss": -24.44000244140625, "global_step": 203241, "epoch": 2448} {"train_loss": -24.54130744934082, "global_step": 203242, "epoch": 2448} {"train_loss": -24.612417221069336, "global_step": 203243, "epoch": 2448} {"train_loss": -24.314617156982422, "global_step": 203244, "epoch": 2448} {"train_loss": -24.049423217773438, "global_step": 203245, "epoch": 2448} {"train_loss": -24.49500274658203, "global_step": 203246, "epoch": 2448} {"train_loss": -24.486743927001953, "global_step": 203247, "epoch": 2448} {"train_loss": -24.220041275024414, "global_step": 203248, "epoch": 2448} {"train_loss": -24.363210678100586, "global_step": 203249, "epoch": 2448} {"train_loss": -24.278837203979492, "global_step": 203250, "epoch": 2448} {"train_loss": -24.47164535522461, "global_step": 203251, "epoch": 2448} {"train_loss": -23.902164459228516, "global_step": 203252, "epoch": 2448} {"train_loss": -24.440418243408203, "global_step": 203253, "epoch": 2448} {"train_loss": -24.345767974853516, "global_step": 203254, "epoch": 2448} {"train_loss": -24.215803146362305, "global_step": 203255, "epoch": 2448} {"train_loss": -24.35089111328125, "global_step": 203256, "epoch": 2448} {"train_loss": -24.230224609375, "global_step": 203257, "epoch": 2448} {"train_loss": -24.41994285583496, "global_step": 203258, "epoch": 2448} {"train_loss": -24.132904052734375, "global_step": 203259, "epoch": 2448} {"train_loss": -24.156024932861328, "global_step": 203260, "epoch": 2448} {"train_loss": -24.250913619995117, "global_step": 203261, "epoch": 2448} {"train_loss": -24.271493911743164, "global_step": 203262, "epoch": 2448} {"train_loss": -24.418739318847656, "global_step": 203263, "epoch": 2448} {"train_loss": -24.406721115112305, "global_step": 203264, "epoch": 2448} {"train_loss": -24.610986709594727, "global_step": 203265, "epoch": 2448} {"train_loss": -24.29080740227757, "global_step": 203266, "epoch": 2448, "val_loss": 6707514.0} {"train_loss": -24.281953811645508, "global_step": 203267, "epoch": 2449} {"train_loss": -24.259313583374023, "global_step": 203268, "epoch": 2449} {"train_loss": -24.25811004638672, "global_step": 203269, "epoch": 2449} {"train_loss": -24.275861740112305, "global_step": 203270, "epoch": 2449} {"train_loss": -24.264902114868164, "global_step": 203271, "epoch": 2449} {"train_loss": -24.288423538208008, "global_step": 203272, "epoch": 2449} {"train_loss": -24.491764068603516, "global_step": 203273, "epoch": 2449} {"train_loss": -24.12631607055664, "global_step": 203274, "epoch": 2449} {"train_loss": -24.31412696838379, "global_step": 203275, "epoch": 2449} {"train_loss": -24.06253433227539, "global_step": 203276, "epoch": 2449} {"train_loss": -24.40097427368164, "global_step": 203277, "epoch": 2449} {"train_loss": -24.443214416503906, "global_step": 203278, "epoch": 2449} {"train_loss": -24.46489715576172, "global_step": 203279, "epoch": 2449} {"train_loss": -24.333053588867188, "global_step": 203280, "epoch": 2449} {"train_loss": -24.16222381591797, "global_step": 203281, "epoch": 2449} {"train_loss": -23.721647262573242, "global_step": 203282, "epoch": 2449} {"train_loss": -24.199573516845703, "global_step": 203283, "epoch": 2449} {"train_loss": -24.5029354095459, "global_step": 203284, "epoch": 2449} {"train_loss": -23.997438430786133, "global_step": 203285, "epoch": 2449} {"train_loss": -24.530237197875977, "global_step": 203286, "epoch": 2449} {"train_loss": -24.3640079498291, "global_step": 203287, "epoch": 2449} {"train_loss": -24.28597640991211, "global_step": 203288, "epoch": 2449} {"train_loss": -24.31068229675293, "global_step": 203289, "epoch": 2449} {"train_loss": -24.445106506347656, "global_step": 203290, "epoch": 2449} {"train_loss": -24.242387771606445, "global_step": 203291, "epoch": 2449} {"train_loss": -24.715749740600586, "global_step": 203292, "epoch": 2449} {"train_loss": -24.47382926940918, "global_step": 203293, "epoch": 2449} {"train_loss": -24.299192428588867, "global_step": 203294, "epoch": 2449} {"train_loss": -24.367441177368164, "global_step": 203295, "epoch": 2449} {"train_loss": -24.34247398376465, "global_step": 203296, "epoch": 2449} {"train_loss": -24.3841495513916, "global_step": 203297, "epoch": 2449} {"train_loss": -24.294076919555664, "global_step": 203298, "epoch": 2449} {"train_loss": -24.320920944213867, "global_step": 203299, "epoch": 2449} {"train_loss": -23.89594841003418, "global_step": 203300, "epoch": 2449} {"train_loss": -24.583311080932617, "global_step": 203301, "epoch": 2449} {"train_loss": -24.74275779724121, "global_step": 203302, "epoch": 2449} {"train_loss": -24.52829933166504, "global_step": 203303, "epoch": 2449} {"train_loss": -24.557729721069336, "global_step": 203304, "epoch": 2449} {"train_loss": -24.588560104370117, "global_step": 203305, "epoch": 2449} {"train_loss": -24.80478858947754, "global_step": 203306, "epoch": 2449} {"train_loss": -24.369659423828125, "global_step": 203307, "epoch": 2449} {"train_loss": -24.42369270324707, "global_step": 203308, "epoch": 2449} {"train_loss": -24.513166427612305, "global_step": 203309, "epoch": 2449} {"train_loss": -24.54546546936035, "global_step": 203310, "epoch": 2449} {"train_loss": -24.353055953979492, "global_step": 203311, "epoch": 2449} {"train_loss": -24.58302879333496, "global_step": 203312, "epoch": 2449} {"train_loss": -24.53223991394043, "global_step": 203313, "epoch": 2449} {"train_loss": -24.54050636291504, "global_step": 203314, "epoch": 2449} {"train_loss": -24.337751388549805, "global_step": 203315, "epoch": 2449} {"train_loss": -24.441823959350586, "global_step": 203316, "epoch": 2449} {"train_loss": -24.149269104003906, "global_step": 203317, "epoch": 2449} {"train_loss": -24.37502670288086, "global_step": 203318, "epoch": 2449} {"train_loss": -24.474905014038086, "global_step": 203319, "epoch": 2449} {"train_loss": -24.471054077148438, "global_step": 203320, "epoch": 2449} {"train_loss": -24.388004302978516, "global_step": 203321, "epoch": 2449} {"train_loss": -24.12034034729004, "global_step": 203322, "epoch": 2449} {"train_loss": -24.090360641479492, "global_step": 203323, "epoch": 2449} {"train_loss": -24.200851440429688, "global_step": 203324, "epoch": 2449} {"train_loss": -24.383014678955078, "global_step": 203325, "epoch": 2449} {"train_loss": -24.09405517578125, "global_step": 203326, "epoch": 2449} {"train_loss": -23.238683700561523, "global_step": 203327, "epoch": 2449} {"train_loss": -23.749759674072266, "global_step": 203328, "epoch": 2449} {"train_loss": -24.122793197631836, "global_step": 203329, "epoch": 2449} {"train_loss": -23.763530731201172, "global_step": 203330, "epoch": 2449} {"train_loss": -24.00123405456543, "global_step": 203331, "epoch": 2449} {"train_loss": -23.954294204711914, "global_step": 203332, "epoch": 2449} {"train_loss": -24.480358123779297, "global_step": 203333, "epoch": 2449} {"train_loss": -24.347774505615234, "global_step": 203334, "epoch": 2449} {"train_loss": -24.268856048583984, "global_step": 203335, "epoch": 2449} {"train_loss": -24.014713287353516, "global_step": 203336, "epoch": 2449} {"train_loss": -24.399377822875977, "global_step": 203337, "epoch": 2449} {"train_loss": -24.148168563842773, "global_step": 203338, "epoch": 2449} {"train_loss": -24.2757568359375, "global_step": 203339, "epoch": 2449} {"train_loss": -24.276254653930664, "global_step": 203340, "epoch": 2449} {"train_loss": -24.39072608947754, "global_step": 203341, "epoch": 2449} {"train_loss": -24.26457405090332, "global_step": 203342, "epoch": 2449} {"train_loss": -24.12379264831543, "global_step": 203343, "epoch": 2449} {"train_loss": -24.10346794128418, "global_step": 203344, "epoch": 2449} {"train_loss": -24.292407989501953, "global_step": 203345, "epoch": 2449} {"train_loss": -24.328046798706055, "global_step": 203346, "epoch": 2449} {"train_loss": -24.508615493774414, "global_step": 203347, "epoch": 2449} {"train_loss": -24.515649795532227, "global_step": 203348, "epoch": 2449} {"train_loss": -24.293474634009673, "global_step": 203349, "epoch": 2449, "val_loss": 6719960.0} {"train_loss": -23.567249298095703, "global_step": 203350, "epoch": 2450} {"train_loss": -23.849401473999023, "global_step": 203351, "epoch": 2450} {"train_loss": -23.433887481689453, "global_step": 203352, "epoch": 2450} {"train_loss": -23.602588653564453, "global_step": 203353, "epoch": 2450} {"train_loss": -23.837491989135742, "global_step": 203354, "epoch": 2450} {"train_loss": -23.9371395111084, "global_step": 203355, "epoch": 2450} {"train_loss": -23.81987190246582, "global_step": 203356, "epoch": 2450} {"train_loss": -24.18324089050293, "global_step": 203357, "epoch": 2450} {"train_loss": -23.53527069091797, "global_step": 203358, "epoch": 2450} {"train_loss": -24.044803619384766, "global_step": 203359, "epoch": 2450} {"train_loss": -24.022306442260742, "global_step": 203360, "epoch": 2450} {"train_loss": -24.295995712280273, "global_step": 203361, "epoch": 2450} {"train_loss": -23.932722091674805, "global_step": 203362, "epoch": 2450} {"train_loss": -24.087099075317383, "global_step": 203363, "epoch": 2450} {"train_loss": -24.427871704101562, "global_step": 203364, "epoch": 2450} {"train_loss": -24.506559371948242, "global_step": 203365, "epoch": 2450} {"train_loss": -24.11396598815918, "global_step": 203366, "epoch": 2450} {"train_loss": -24.258535385131836, "global_step": 203367, "epoch": 2450} {"train_loss": -24.31662940979004, "global_step": 203368, "epoch": 2450} {"train_loss": -24.30743980407715, "global_step": 203369, "epoch": 2450} {"train_loss": -24.126813888549805, "global_step": 203370, "epoch": 2450} {"train_loss": -24.126073837280273, "global_step": 203371, "epoch": 2450} {"train_loss": -24.23223876953125, "global_step": 203372, "epoch": 2450} {"train_loss": -24.13642692565918, "global_step": 203373, "epoch": 2450} {"train_loss": -24.037343978881836, "global_step": 203374, "epoch": 2450} {"train_loss": -24.336698532104492, "global_step": 203375, "epoch": 2450} {"train_loss": -23.77251625061035, "global_step": 203376, "epoch": 2450} {"train_loss": -24.226455688476562, "global_step": 203377, "epoch": 2450} {"train_loss": -24.321809768676758, "global_step": 203378, "epoch": 2450} {"train_loss": -24.154020309448242, "global_step": 203379, "epoch": 2450} {"train_loss": -23.920795440673828, "global_step": 203380, "epoch": 2450} {"train_loss": -23.889543533325195, "global_step": 203381, "epoch": 2450} {"train_loss": -24.34462547302246, "global_step": 203382, "epoch": 2450} {"train_loss": -24.523834228515625, "global_step": 203383, "epoch": 2450} {"train_loss": -24.286184310913086, "global_step": 203384, "epoch": 2450} {"train_loss": -24.23722267150879, "global_step": 203385, "epoch": 2450} {"train_loss": -24.381332397460938, "global_step": 203386, "epoch": 2450} {"train_loss": -24.34474754333496, "global_step": 203387, "epoch": 2450} {"train_loss": -24.15894889831543, "global_step": 203388, "epoch": 2450} {"train_loss": -24.146169662475586, "global_step": 203389, "epoch": 2450} {"train_loss": -24.488962173461914, "global_step": 203390, "epoch": 2450} {"train_loss": -24.516233444213867, "global_step": 203391, "epoch": 2450} {"train_loss": -24.695112228393555, "global_step": 203392, "epoch": 2450} {"train_loss": -24.526147842407227, "global_step": 203393, "epoch": 2450} {"train_loss": -24.51897621154785, "global_step": 203394, "epoch": 2450} {"train_loss": -24.964628219604492, "global_step": 203395, "epoch": 2450} {"train_loss": -24.704381942749023, "global_step": 203396, "epoch": 2450} {"train_loss": -24.75906753540039, "global_step": 203397, "epoch": 2450} {"train_loss": -24.78766441345215, "global_step": 203398, "epoch": 2450} {"train_loss": -24.329174041748047, "global_step": 203399, "epoch": 2450} {"train_loss": -23.94208335876465, "global_step": 203400, "epoch": 2450} {"train_loss": -24.24024772644043, "global_step": 203401, "epoch": 2450} {"train_loss": -24.54598045349121, "global_step": 203402, "epoch": 2450} {"train_loss": -24.335037231445312, "global_step": 203403, "epoch": 2450} {"train_loss": -24.234394073486328, "global_step": 203404, "epoch": 2450} {"train_loss": -24.5579833984375, "global_step": 203405, "epoch": 2450} {"train_loss": -24.494171142578125, "global_step": 203406, "epoch": 2450} {"train_loss": -24.330801010131836, "global_step": 203407, "epoch": 2450} {"train_loss": -24.120141983032227, "global_step": 203408, "epoch": 2450} {"train_loss": -24.29680633544922, "global_step": 203409, "epoch": 2450} {"train_loss": -24.280012130737305, "global_step": 203410, "epoch": 2450} {"train_loss": -24.8554630279541, "global_step": 203411, "epoch": 2450} {"train_loss": -24.243955612182617, "global_step": 203412, "epoch": 2450} {"train_loss": -23.929061889648438, "global_step": 203413, "epoch": 2450} {"train_loss": -24.011220932006836, "global_step": 203414, "epoch": 2450} {"train_loss": -24.244043350219727, "global_step": 203415, "epoch": 2450} {"train_loss": -24.453393936157227, "global_step": 203416, "epoch": 2450} {"train_loss": -23.698183059692383, "global_step": 203417, "epoch": 2450} {"train_loss": -24.331520080566406, "global_step": 203418, "epoch": 2450} {"train_loss": -24.38763427734375, "global_step": 203419, "epoch": 2450} {"train_loss": -24.342069625854492, "global_step": 203420, "epoch": 2450} {"train_loss": -23.896642684936523, "global_step": 203421, "epoch": 2450} {"train_loss": -24.324892044067383, "global_step": 203422, "epoch": 2450} {"train_loss": -24.202550888061523, "global_step": 203423, "epoch": 2450} {"train_loss": -24.142013549804688, "global_step": 203424, "epoch": 2450} {"train_loss": -24.28580665588379, "global_step": 203425, "epoch": 2450} {"train_loss": -24.24903678894043, "global_step": 203426, "epoch": 2450} {"train_loss": -24.380878448486328, "global_step": 203427, "epoch": 2450} {"train_loss": -24.395706176757812, "global_step": 203428, "epoch": 2450} {"train_loss": -23.915416717529297, "global_step": 203429, "epoch": 2450} {"train_loss": -24.43480110168457, "global_step": 203430, "epoch": 2450} {"train_loss": -23.712575912475586, "global_step": 203431, "epoch": 2450} {"train_loss": -24.233378123088055, "global_step": 203432, "epoch": 2450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6543805.5} {"train_loss": -23.915342330932617, "global_step": 203433, "epoch": 2451} {"train_loss": -23.888181686401367, "global_step": 203434, "epoch": 2451} {"train_loss": -23.621244430541992, "global_step": 203435, "epoch": 2451} {"train_loss": -23.531089782714844, "global_step": 203436, "epoch": 2451} {"train_loss": -23.679826736450195, "global_step": 203437, "epoch": 2451} {"train_loss": -23.6323184967041, "global_step": 203438, "epoch": 2451} {"train_loss": -23.722469329833984, "global_step": 203439, "epoch": 2451} {"train_loss": -23.8554630279541, "global_step": 203440, "epoch": 2451} {"train_loss": -24.276479721069336, "global_step": 203441, "epoch": 2451} {"train_loss": -24.15950584411621, "global_step": 203442, "epoch": 2451} {"train_loss": -24.212890625, "global_step": 203443, "epoch": 2451} {"train_loss": -23.7935791015625, "global_step": 203444, "epoch": 2451} {"train_loss": -24.072113037109375, "global_step": 203445, "epoch": 2451} {"train_loss": -24.096805572509766, "global_step": 203446, "epoch": 2451} {"train_loss": -24.2136287689209, "global_step": 203447, "epoch": 2451} {"train_loss": -24.144794464111328, "global_step": 203448, "epoch": 2451} {"train_loss": -24.34851837158203, "global_step": 203449, "epoch": 2451} {"train_loss": -24.035186767578125, "global_step": 203450, "epoch": 2451} {"train_loss": -23.998706817626953, "global_step": 203451, "epoch": 2451} {"train_loss": -24.28975486755371, "global_step": 203452, "epoch": 2451} {"train_loss": -24.499013900756836, "global_step": 203453, "epoch": 2451} {"train_loss": -24.004547119140625, "global_step": 203454, "epoch": 2451} {"train_loss": -24.754526138305664, "global_step": 203455, "epoch": 2451} {"train_loss": -23.944807052612305, "global_step": 203456, "epoch": 2451} {"train_loss": -24.207149505615234, "global_step": 203457, "epoch": 2451} {"train_loss": -24.483572006225586, "global_step": 203458, "epoch": 2451} {"train_loss": -24.53108024597168, "global_step": 203459, "epoch": 2451} {"train_loss": -24.301025390625, "global_step": 203460, "epoch": 2451} {"train_loss": -24.032733917236328, "global_step": 203461, "epoch": 2451} {"train_loss": -24.2384090423584, "global_step": 203462, "epoch": 2451} {"train_loss": -24.374130249023438, "global_step": 203463, "epoch": 2451} {"train_loss": -24.09272575378418, "global_step": 203464, "epoch": 2451} {"train_loss": -24.59095001220703, "global_step": 203465, "epoch": 2451} {"train_loss": -24.493162155151367, "global_step": 203466, "epoch": 2451} {"train_loss": -24.499343872070312, "global_step": 203467, "epoch": 2451} {"train_loss": -24.355287551879883, "global_step": 203468, "epoch": 2451} {"train_loss": -24.487611770629883, "global_step": 203469, "epoch": 2451} {"train_loss": -24.50655174255371, "global_step": 203470, "epoch": 2451} {"train_loss": -24.33282470703125, "global_step": 203471, "epoch": 2451} {"train_loss": -24.270793914794922, "global_step": 203472, "epoch": 2451} {"train_loss": -24.145103454589844, "global_step": 203473, "epoch": 2451} {"train_loss": -24.32273292541504, "global_step": 203474, "epoch": 2451} {"train_loss": -24.362987518310547, "global_step": 203475, "epoch": 2451} {"train_loss": -24.95130157470703, "global_step": 203476, "epoch": 2451} {"train_loss": -24.277240753173828, "global_step": 203477, "epoch": 2451} {"train_loss": -24.2270565032959, "global_step": 203478, "epoch": 2451} {"train_loss": -24.26719856262207, "global_step": 203479, "epoch": 2451} {"train_loss": -24.410749435424805, "global_step": 203480, "epoch": 2451} {"train_loss": -23.96834373474121, "global_step": 203481, "epoch": 2451} {"train_loss": -24.527917861938477, "global_step": 203482, "epoch": 2451} {"train_loss": -24.4720516204834, "global_step": 203483, "epoch": 2451} {"train_loss": -23.920412063598633, "global_step": 203484, "epoch": 2451} {"train_loss": -24.302717208862305, "global_step": 203485, "epoch": 2451} {"train_loss": -24.161619186401367, "global_step": 203486, "epoch": 2451} {"train_loss": -24.11371421813965, "global_step": 203487, "epoch": 2451} {"train_loss": -24.015796661376953, "global_step": 203488, "epoch": 2451} {"train_loss": -23.70722770690918, "global_step": 203489, "epoch": 2451} {"train_loss": -24.161970138549805, "global_step": 203490, "epoch": 2451} {"train_loss": -24.2199764251709, "global_step": 203491, "epoch": 2451} {"train_loss": -24.114070892333984, "global_step": 203492, "epoch": 2451} {"train_loss": -24.639968872070312, "global_step": 203493, "epoch": 2451} {"train_loss": -24.304880142211914, "global_step": 203494, "epoch": 2451} {"train_loss": -24.350482940673828, "global_step": 203495, "epoch": 2451} {"train_loss": -24.12238121032715, "global_step": 203496, "epoch": 2451} {"train_loss": -24.250179290771484, "global_step": 203497, "epoch": 2451} {"train_loss": -24.56386947631836, "global_step": 203498, "epoch": 2451} {"train_loss": -24.08345603942871, "global_step": 203499, "epoch": 2451} {"train_loss": -24.448219299316406, "global_step": 203500, "epoch": 2451} {"train_loss": -24.31861114501953, "global_step": 203501, "epoch": 2451} {"train_loss": -24.312843322753906, "global_step": 203502, "epoch": 2451} {"train_loss": -23.83662986755371, "global_step": 203503, "epoch": 2451} {"train_loss": -24.286479949951172, "global_step": 203504, "epoch": 2451} {"train_loss": -24.225379943847656, "global_step": 203505, "epoch": 2451} {"train_loss": -24.257768630981445, "global_step": 203506, "epoch": 2451} {"train_loss": -24.120418548583984, "global_step": 203507, "epoch": 2451} {"train_loss": -24.016813278198242, "global_step": 203508, "epoch": 2451} {"train_loss": -24.48834228515625, "global_step": 203509, "epoch": 2451} {"train_loss": -24.665630340576172, "global_step": 203510, "epoch": 2451} {"train_loss": -24.155834197998047, "global_step": 203511, "epoch": 2451} {"train_loss": -24.230243682861328, "global_step": 203512, "epoch": 2451} {"train_loss": -24.204303741455078, "global_step": 203513, "epoch": 2451} {"train_loss": -23.954792022705078, "global_step": 203514, "epoch": 2451} {"train_loss": -24.193667790975915, "global_step": 203515, "epoch": 2451, "val_loss": 6622226.0} {"train_loss": -24.144927978515625, "global_step": 203516, "epoch": 2452} {"train_loss": -24.26582908630371, "global_step": 203517, "epoch": 2452} {"train_loss": -24.435134887695312, "global_step": 203518, "epoch": 2452} {"train_loss": -24.5841007232666, "global_step": 203519, "epoch": 2452} {"train_loss": -24.47800064086914, "global_step": 203520, "epoch": 2452} {"train_loss": -24.25806999206543, "global_step": 203521, "epoch": 2452} {"train_loss": -24.35418701171875, "global_step": 203522, "epoch": 2452} {"train_loss": -23.793973922729492, "global_step": 203523, "epoch": 2452} {"train_loss": -24.22149658203125, "global_step": 203524, "epoch": 2452} {"train_loss": -24.505496978759766, "global_step": 203525, "epoch": 2452} {"train_loss": -24.27565574645996, "global_step": 203526, "epoch": 2452} {"train_loss": -24.64716339111328, "global_step": 203527, "epoch": 2452} {"train_loss": -24.44904136657715, "global_step": 203528, "epoch": 2452} {"train_loss": -24.18621826171875, "global_step": 203529, "epoch": 2452} {"train_loss": -24.166147232055664, "global_step": 203530, "epoch": 2452} {"train_loss": -24.136295318603516, "global_step": 203531, "epoch": 2452} {"train_loss": -24.625247955322266, "global_step": 203532, "epoch": 2452} {"train_loss": -24.054136276245117, "global_step": 203533, "epoch": 2452} {"train_loss": -24.447385787963867, "global_step": 203534, "epoch": 2452} {"train_loss": -24.006750106811523, "global_step": 203535, "epoch": 2452} {"train_loss": -24.252038955688477, "global_step": 203536, "epoch": 2452} {"train_loss": -24.087392807006836, "global_step": 203537, "epoch": 2452} {"train_loss": -24.250776290893555, "global_step": 203538, "epoch": 2452} {"train_loss": -24.528038024902344, "global_step": 203539, "epoch": 2452} {"train_loss": -24.51080894470215, "global_step": 203540, "epoch": 2452} {"train_loss": -24.305578231811523, "global_step": 203541, "epoch": 2452} {"train_loss": -24.176746368408203, "global_step": 203542, "epoch": 2452} {"train_loss": -24.62857437133789, "global_step": 203543, "epoch": 2452} {"train_loss": -24.0939884185791, "global_step": 203544, "epoch": 2452} {"train_loss": -24.785337448120117, "global_step": 203545, "epoch": 2452} {"train_loss": -24.137332916259766, "global_step": 203546, "epoch": 2452} {"train_loss": -24.291824340820312, "global_step": 203547, "epoch": 2452} {"train_loss": -23.8719482421875, "global_step": 203548, "epoch": 2452} {"train_loss": -24.296051025390625, "global_step": 203549, "epoch": 2452} {"train_loss": -24.054513931274414, "global_step": 203550, "epoch": 2452} {"train_loss": -24.21424674987793, "global_step": 203551, "epoch": 2452} {"train_loss": -24.23451805114746, "global_step": 203552, "epoch": 2452} {"train_loss": -24.77747917175293, "global_step": 203553, "epoch": 2452} {"train_loss": -24.39613914489746, "global_step": 203554, "epoch": 2452} {"train_loss": -24.1852970123291, "global_step": 203555, "epoch": 2452} {"train_loss": -23.991230010986328, "global_step": 203556, "epoch": 2452} {"train_loss": -23.874826431274414, "global_step": 203557, "epoch": 2452} {"train_loss": -24.294052124023438, "global_step": 203558, "epoch": 2452} {"train_loss": -24.18946075439453, "global_step": 203559, "epoch": 2452} {"train_loss": -23.596342086791992, "global_step": 203560, "epoch": 2452} {"train_loss": -24.23175048828125, "global_step": 203561, "epoch": 2452} {"train_loss": -23.8505916595459, "global_step": 203562, "epoch": 2452} {"train_loss": -24.002155303955078, "global_step": 203563, "epoch": 2452} {"train_loss": -23.91511344909668, "global_step": 203564, "epoch": 2452} {"train_loss": -24.217769622802734, "global_step": 203565, "epoch": 2452} {"train_loss": -24.270381927490234, "global_step": 203566, "epoch": 2452} {"train_loss": -24.300785064697266, "global_step": 203567, "epoch": 2452} {"train_loss": -24.1104793548584, "global_step": 203568, "epoch": 2452} {"train_loss": -24.244089126586914, "global_step": 203569, "epoch": 2452} {"train_loss": -23.982751846313477, "global_step": 203570, "epoch": 2452} {"train_loss": -24.319684982299805, "global_step": 203571, "epoch": 2452} {"train_loss": -24.22747802734375, "global_step": 203572, "epoch": 2452} {"train_loss": -24.206069946289062, "global_step": 203573, "epoch": 2452} {"train_loss": -24.238393783569336, "global_step": 203574, "epoch": 2452} {"train_loss": -24.33709144592285, "global_step": 203575, "epoch": 2452} {"train_loss": -24.350290298461914, "global_step": 203576, "epoch": 2452} {"train_loss": -24.296255111694336, "global_step": 203577, "epoch": 2452} {"train_loss": -24.264148712158203, "global_step": 203578, "epoch": 2452} {"train_loss": -24.188623428344727, "global_step": 203579, "epoch": 2452} {"train_loss": -24.274677276611328, "global_step": 203580, "epoch": 2452} {"train_loss": -24.420045852661133, "global_step": 203581, "epoch": 2452} {"train_loss": -23.935178756713867, "global_step": 203582, "epoch": 2452} {"train_loss": -24.55286979675293, "global_step": 203583, "epoch": 2452} {"train_loss": -24.328855514526367, "global_step": 203584, "epoch": 2452} {"train_loss": -24.36144256591797, "global_step": 203585, "epoch": 2452} {"train_loss": -24.441259384155273, "global_step": 203586, "epoch": 2452} {"train_loss": -24.177047729492188, "global_step": 203587, "epoch": 2452} {"train_loss": -24.505035400390625, "global_step": 203588, "epoch": 2452} {"train_loss": -24.27910041809082, "global_step": 203589, "epoch": 2452} {"train_loss": -24.101301193237305, "global_step": 203590, "epoch": 2452} {"train_loss": -24.284099578857422, "global_step": 203591, "epoch": 2452} {"train_loss": -24.22799301147461, "global_step": 203592, "epoch": 2452} {"train_loss": -24.47979164123535, "global_step": 203593, "epoch": 2452} {"train_loss": -24.511539459228516, "global_step": 203594, "epoch": 2452} {"train_loss": -24.193952560424805, "global_step": 203595, "epoch": 2452} {"train_loss": -24.24311637878418, "global_step": 203596, "epoch": 2452} {"train_loss": -24.359891891479492, "global_step": 203597, "epoch": 2452} {"train_loss": -24.25754756238087, "global_step": 203598, "epoch": 2452, "val_loss": 6491292.0} {"train_loss": -24.016748428344727, "global_step": 203599, "epoch": 2453} {"train_loss": -24.224483489990234, "global_step": 203600, "epoch": 2453} {"train_loss": -23.767847061157227, "global_step": 203601, "epoch": 2453} {"train_loss": -23.39235496520996, "global_step": 203602, "epoch": 2453} {"train_loss": -23.72117805480957, "global_step": 203603, "epoch": 2453} {"train_loss": -23.625747680664062, "global_step": 203604, "epoch": 2453} {"train_loss": -23.844207763671875, "global_step": 203605, "epoch": 2453} {"train_loss": -23.823745727539062, "global_step": 203606, "epoch": 2453} {"train_loss": -23.826221466064453, "global_step": 203607, "epoch": 2453} {"train_loss": -23.849807739257812, "global_step": 203608, "epoch": 2453} {"train_loss": -24.04977798461914, "global_step": 203609, "epoch": 2453} {"train_loss": -24.25153160095215, "global_step": 203610, "epoch": 2453} {"train_loss": -23.87043571472168, "global_step": 203611, "epoch": 2453} {"train_loss": -24.139402389526367, "global_step": 203612, "epoch": 2453} {"train_loss": -23.784292221069336, "global_step": 203613, "epoch": 2453} {"train_loss": -24.06992530822754, "global_step": 203614, "epoch": 2453} {"train_loss": -24.094820022583008, "global_step": 203615, "epoch": 2453} {"train_loss": -23.918720245361328, "global_step": 203616, "epoch": 2453} {"train_loss": -24.205961227416992, "global_step": 203617, "epoch": 2453} {"train_loss": -24.01462745666504, "global_step": 203618, "epoch": 2453} {"train_loss": -23.816068649291992, "global_step": 203619, "epoch": 2453} {"train_loss": -23.52197265625, "global_step": 203620, "epoch": 2453} {"train_loss": -23.90072250366211, "global_step": 203621, "epoch": 2453} {"train_loss": -23.999710083007812, "global_step": 203622, "epoch": 2453} {"train_loss": -23.755735397338867, "global_step": 203623, "epoch": 2453} {"train_loss": -24.187421798706055, "global_step": 203624, "epoch": 2453} {"train_loss": -24.39306640625, "global_step": 203625, "epoch": 2453} {"train_loss": -24.13447380065918, "global_step": 203626, "epoch": 2453} {"train_loss": -24.506887435913086, "global_step": 203627, "epoch": 2453} {"train_loss": -24.028894424438477, "global_step": 203628, "epoch": 2453} {"train_loss": -24.4096622467041, "global_step": 203629, "epoch": 2453} {"train_loss": -24.078134536743164, "global_step": 203630, "epoch": 2453} {"train_loss": -24.121124267578125, "global_step": 203631, "epoch": 2453} {"train_loss": -24.366771697998047, "global_step": 203632, "epoch": 2453} {"train_loss": -24.108930587768555, "global_step": 203633, "epoch": 2453} {"train_loss": -24.374929428100586, "global_step": 203634, "epoch": 2453} {"train_loss": -24.386899948120117, "global_step": 203635, "epoch": 2453} {"train_loss": -24.61225128173828, "global_step": 203636, "epoch": 2453} {"train_loss": -23.871337890625, "global_step": 203637, "epoch": 2453} {"train_loss": -24.353429794311523, "global_step": 203638, "epoch": 2453} {"train_loss": -24.492511749267578, "global_step": 203639, "epoch": 2453} {"train_loss": -24.084518432617188, "global_step": 203640, "epoch": 2453} {"train_loss": -24.234376907348633, "global_step": 203641, "epoch": 2453} {"train_loss": -24.306236267089844, "global_step": 203642, "epoch": 2453} {"train_loss": -24.491119384765625, "global_step": 203643, "epoch": 2453} {"train_loss": -24.481088638305664, "global_step": 203644, "epoch": 2453} {"train_loss": -24.419509887695312, "global_step": 203645, "epoch": 2453} {"train_loss": -24.297489166259766, "global_step": 203646, "epoch": 2453} {"train_loss": -24.65555191040039, "global_step": 203647, "epoch": 2453} {"train_loss": -24.738040924072266, "global_step": 203648, "epoch": 2453} {"train_loss": -24.439144134521484, "global_step": 203649, "epoch": 2453} {"train_loss": -24.50092887878418, "global_step": 203650, "epoch": 2453} {"train_loss": -24.116487503051758, "global_step": 203651, "epoch": 2453} {"train_loss": -24.359439849853516, "global_step": 203652, "epoch": 2453} {"train_loss": -24.719449996948242, "global_step": 203653, "epoch": 2453} {"train_loss": -24.20317840576172, "global_step": 203654, "epoch": 2453} {"train_loss": -24.3232421875, "global_step": 203655, "epoch": 2453} {"train_loss": -23.699542999267578, "global_step": 203656, "epoch": 2453} {"train_loss": -24.009634017944336, "global_step": 203657, "epoch": 2453} {"train_loss": -24.14893913269043, "global_step": 203658, "epoch": 2453} {"train_loss": -24.466867446899414, "global_step": 203659, "epoch": 2453} {"train_loss": -24.06155776977539, "global_step": 203660, "epoch": 2453} {"train_loss": -24.21433448791504, "global_step": 203661, "epoch": 2453} {"train_loss": -24.27801513671875, "global_step": 203662, "epoch": 2453} {"train_loss": -24.460155487060547, "global_step": 203663, "epoch": 2453} {"train_loss": -24.344533920288086, "global_step": 203664, "epoch": 2453} {"train_loss": -24.3812198638916, "global_step": 203665, "epoch": 2453} {"train_loss": -23.866613388061523, "global_step": 203666, "epoch": 2453} {"train_loss": -24.151620864868164, "global_step": 203667, "epoch": 2453} {"train_loss": -24.202106475830078, "global_step": 203668, "epoch": 2453} {"train_loss": -24.222959518432617, "global_step": 203669, "epoch": 2453} {"train_loss": -24.391386032104492, "global_step": 203670, "epoch": 2453} {"train_loss": -23.913808822631836, "global_step": 203671, "epoch": 2453} {"train_loss": -24.816085815429688, "global_step": 203672, "epoch": 2453} {"train_loss": -24.494131088256836, "global_step": 203673, "epoch": 2453} {"train_loss": -24.42336082458496, "global_step": 203674, "epoch": 2453} {"train_loss": -24.104572296142578, "global_step": 203675, "epoch": 2453} {"train_loss": -24.23018455505371, "global_step": 203676, "epoch": 2453} {"train_loss": -24.44191551208496, "global_step": 203677, "epoch": 2453} {"train_loss": -24.4455509185791, "global_step": 203678, "epoch": 2453} {"train_loss": -24.26409339904785, "global_step": 203679, "epoch": 2453} {"train_loss": -24.522098541259766, "global_step": 203680, "epoch": 2453} {"train_loss": -24.198083234120563, "global_step": 203681, "epoch": 2453, "val_loss": 6567470.0} {"train_loss": -23.83805274963379, "global_step": 203682, "epoch": 2454} {"train_loss": -24.05129051208496, "global_step": 203683, "epoch": 2454} {"train_loss": -24.272565841674805, "global_step": 203684, "epoch": 2454} {"train_loss": -24.322853088378906, "global_step": 203685, "epoch": 2454} {"train_loss": -24.239017486572266, "global_step": 203686, "epoch": 2454} {"train_loss": -24.14013671875, "global_step": 203687, "epoch": 2454} {"train_loss": -24.55569839477539, "global_step": 203688, "epoch": 2454} {"train_loss": -24.151268005371094, "global_step": 203689, "epoch": 2454} {"train_loss": -24.247257232666016, "global_step": 203690, "epoch": 2454} {"train_loss": -24.12447166442871, "global_step": 203691, "epoch": 2454} {"train_loss": -24.177183151245117, "global_step": 203692, "epoch": 2454} {"train_loss": -24.15592384338379, "global_step": 203693, "epoch": 2454} {"train_loss": -24.225950241088867, "global_step": 203694, "epoch": 2454} {"train_loss": -24.36814308166504, "global_step": 203695, "epoch": 2454} {"train_loss": -24.08844566345215, "global_step": 203696, "epoch": 2454} {"train_loss": -24.57729721069336, "global_step": 203697, "epoch": 2454} {"train_loss": -24.257518768310547, "global_step": 203698, "epoch": 2454} {"train_loss": -24.42762565612793, "global_step": 203699, "epoch": 2454} {"train_loss": -23.77107048034668, "global_step": 203700, "epoch": 2454} {"train_loss": -24.208873748779297, "global_step": 203701, "epoch": 2454} {"train_loss": -24.256040573120117, "global_step": 203702, "epoch": 2454} {"train_loss": -24.34029197692871, "global_step": 203703, "epoch": 2454} {"train_loss": -24.15353775024414, "global_step": 203704, "epoch": 2454} {"train_loss": -24.40565299987793, "global_step": 203705, "epoch": 2454} {"train_loss": -24.288818359375, "global_step": 203706, "epoch": 2454} {"train_loss": -24.314481735229492, "global_step": 203707, "epoch": 2454} {"train_loss": -24.129865646362305, "global_step": 203708, "epoch": 2454} {"train_loss": -24.34698486328125, "global_step": 203709, "epoch": 2454} {"train_loss": -23.972593307495117, "global_step": 203710, "epoch": 2454} {"train_loss": -24.012968063354492, "global_step": 203711, "epoch": 2454} {"train_loss": -24.558425903320312, "global_step": 203712, "epoch": 2454} {"train_loss": -24.407590866088867, "global_step": 203713, "epoch": 2454} {"train_loss": -23.985254287719727, "global_step": 203714, "epoch": 2454} {"train_loss": -24.343311309814453, "global_step": 203715, "epoch": 2454} {"train_loss": -24.18818473815918, "global_step": 203716, "epoch": 2454} {"train_loss": -24.464574813842773, "global_step": 203717, "epoch": 2454} {"train_loss": -24.41945457458496, "global_step": 203718, "epoch": 2454} {"train_loss": -24.26089859008789, "global_step": 203719, "epoch": 2454} {"train_loss": -24.48139762878418, "global_step": 203720, "epoch": 2454} {"train_loss": -24.26295280456543, "global_step": 203721, "epoch": 2454} {"train_loss": -24.53095817565918, "global_step": 203722, "epoch": 2454} {"train_loss": -24.366750717163086, "global_step": 203723, "epoch": 2454} {"train_loss": -24.486486434936523, "global_step": 203724, "epoch": 2454} {"train_loss": -24.272985458374023, "global_step": 203725, "epoch": 2454} {"train_loss": -24.243976593017578, "global_step": 203726, "epoch": 2454} {"train_loss": -24.283689498901367, "global_step": 203727, "epoch": 2454} {"train_loss": -24.46183967590332, "global_step": 203728, "epoch": 2454} {"train_loss": -24.47805404663086, "global_step": 203729, "epoch": 2454} {"train_loss": -24.411550521850586, "global_step": 203730, "epoch": 2454} {"train_loss": -24.33180046081543, "global_step": 203731, "epoch": 2454} {"train_loss": -24.180877685546875, "global_step": 203732, "epoch": 2454} {"train_loss": -24.55008316040039, "global_step": 203733, "epoch": 2454} {"train_loss": -24.237043380737305, "global_step": 203734, "epoch": 2454} {"train_loss": -24.40074348449707, "global_step": 203735, "epoch": 2454} {"train_loss": -24.752866744995117, "global_step": 203736, "epoch": 2454} {"train_loss": -23.96022605895996, "global_step": 203737, "epoch": 2454} {"train_loss": -24.29278564453125, "global_step": 203738, "epoch": 2454} {"train_loss": -24.0634765625, "global_step": 203739, "epoch": 2454} {"train_loss": -24.393638610839844, "global_step": 203740, "epoch": 2454} {"train_loss": -24.84796714782715, "global_step": 203741, "epoch": 2454} {"train_loss": -24.78727149963379, "global_step": 203742, "epoch": 2454} {"train_loss": -24.802112579345703, "global_step": 203743, "epoch": 2454} {"train_loss": -24.61741065979004, "global_step": 203744, "epoch": 2454} {"train_loss": -24.864185333251953, "global_step": 203745, "epoch": 2454} {"train_loss": -24.324237823486328, "global_step": 203746, "epoch": 2454} {"train_loss": -24.69596290588379, "global_step": 203747, "epoch": 2454} {"train_loss": -24.894840240478516, "global_step": 203748, "epoch": 2454} {"train_loss": -24.004499435424805, "global_step": 203749, "epoch": 2454} {"train_loss": -24.354156494140625, "global_step": 203750, "epoch": 2454} {"train_loss": -24.307920455932617, "global_step": 203751, "epoch": 2454} {"train_loss": -24.339513778686523, "global_step": 203752, "epoch": 2454} {"train_loss": -24.43684196472168, "global_step": 203753, "epoch": 2454} {"train_loss": -24.439062118530273, "global_step": 203754, "epoch": 2454} {"train_loss": -24.548480987548828, "global_step": 203755, "epoch": 2454} {"train_loss": -24.65839958190918, "global_step": 203756, "epoch": 2454} {"train_loss": -24.02276611328125, "global_step": 203757, "epoch": 2454} {"train_loss": -24.104679107666016, "global_step": 203758, "epoch": 2454} {"train_loss": -23.739521026611328, "global_step": 203759, "epoch": 2454} {"train_loss": -23.905874252319336, "global_step": 203760, "epoch": 2454} {"train_loss": -24.094141006469727, "global_step": 203761, "epoch": 2454} {"train_loss": -24.14044761657715, "global_step": 203762, "epoch": 2454} {"train_loss": -24.43885612487793, "global_step": 203763, "epoch": 2454} {"train_loss": -24.32761401440724, "global_step": 203764, "epoch": 2454, "val_loss": 6651337.0} {"train_loss": -24.24934959411621, "global_step": 203765, "epoch": 2455} {"train_loss": -24.16525650024414, "global_step": 203766, "epoch": 2455} {"train_loss": -24.021955490112305, "global_step": 203767, "epoch": 2455} {"train_loss": -24.583877563476562, "global_step": 203768, "epoch": 2455} {"train_loss": -23.730329513549805, "global_step": 203769, "epoch": 2455} {"train_loss": -23.911239624023438, "global_step": 203770, "epoch": 2455} {"train_loss": -23.98081398010254, "global_step": 203771, "epoch": 2455} {"train_loss": -23.786083221435547, "global_step": 203772, "epoch": 2455} {"train_loss": -24.193391799926758, "global_step": 203773, "epoch": 2455} {"train_loss": -23.862293243408203, "global_step": 203774, "epoch": 2455} {"train_loss": -24.143789291381836, "global_step": 203775, "epoch": 2455} {"train_loss": -24.112852096557617, "global_step": 203776, "epoch": 2455} {"train_loss": -23.940441131591797, "global_step": 203777, "epoch": 2455} {"train_loss": -24.080968856811523, "global_step": 203778, "epoch": 2455} {"train_loss": -24.093524932861328, "global_step": 203779, "epoch": 2455} {"train_loss": -24.325286865234375, "global_step": 203780, "epoch": 2455} {"train_loss": -23.9445858001709, "global_step": 203781, "epoch": 2455} {"train_loss": -24.173986434936523, "global_step": 203782, "epoch": 2455} {"train_loss": -24.365921020507812, "global_step": 203783, "epoch": 2455} {"train_loss": -24.301254272460938, "global_step": 203784, "epoch": 2455} {"train_loss": -24.414743423461914, "global_step": 203785, "epoch": 2455} {"train_loss": -24.456634521484375, "global_step": 203786, "epoch": 2455} {"train_loss": -24.249141693115234, "global_step": 203787, "epoch": 2455} {"train_loss": -24.26590347290039, "global_step": 203788, "epoch": 2455} {"train_loss": -24.52410125732422, "global_step": 203789, "epoch": 2455} {"train_loss": -24.38494300842285, "global_step": 203790, "epoch": 2455} {"train_loss": -24.305273056030273, "global_step": 203791, "epoch": 2455} {"train_loss": -24.172073364257812, "global_step": 203792, "epoch": 2455} {"train_loss": -24.500816345214844, "global_step": 203793, "epoch": 2455} {"train_loss": -24.426130294799805, "global_step": 203794, "epoch": 2455} {"train_loss": -24.45421600341797, "global_step": 203795, "epoch": 2455} {"train_loss": -24.24941062927246, "global_step": 203796, "epoch": 2455} {"train_loss": -24.582197189331055, "global_step": 203797, "epoch": 2455} {"train_loss": -24.35917091369629, "global_step": 203798, "epoch": 2455} {"train_loss": -24.22972297668457, "global_step": 203799, "epoch": 2455} {"train_loss": -24.74275016784668, "global_step": 203800, "epoch": 2455} {"train_loss": -24.50981903076172, "global_step": 203801, "epoch": 2455} {"train_loss": -24.158266067504883, "global_step": 203802, "epoch": 2455} {"train_loss": -24.25111198425293, "global_step": 203803, "epoch": 2455} {"train_loss": -24.274545669555664, "global_step": 203804, "epoch": 2455} {"train_loss": -24.45370101928711, "global_step": 203805, "epoch": 2455} {"train_loss": -23.82979393005371, "global_step": 203806, "epoch": 2455} {"train_loss": -24.28367042541504, "global_step": 203807, "epoch": 2455} {"train_loss": -23.5213565826416, "global_step": 203808, "epoch": 2455} {"train_loss": -23.66585350036621, "global_step": 203809, "epoch": 2455} {"train_loss": -23.630929946899414, "global_step": 203810, "epoch": 2455} {"train_loss": -23.965818405151367, "global_step": 203811, "epoch": 2455} {"train_loss": -23.85236930847168, "global_step": 203812, "epoch": 2455} {"train_loss": -23.47076416015625, "global_step": 203813, "epoch": 2455} {"train_loss": -23.531126022338867, "global_step": 203814, "epoch": 2455} {"train_loss": -23.67637062072754, "global_step": 203815, "epoch": 2455} {"train_loss": -23.646730422973633, "global_step": 203816, "epoch": 2455} {"train_loss": -23.739337921142578, "global_step": 203817, "epoch": 2455} {"train_loss": -23.5510196685791, "global_step": 203818, "epoch": 2455} {"train_loss": -23.661352157592773, "global_step": 203819, "epoch": 2455} {"train_loss": -24.310285568237305, "global_step": 203820, "epoch": 2455} {"train_loss": -23.732593536376953, "global_step": 203821, "epoch": 2455} {"train_loss": -24.16533851623535, "global_step": 203822, "epoch": 2455} {"train_loss": -23.846147537231445, "global_step": 203823, "epoch": 2455} {"train_loss": -23.98343276977539, "global_step": 203824, "epoch": 2455} {"train_loss": -23.697433471679688, "global_step": 203825, "epoch": 2455} {"train_loss": -24.156814575195312, "global_step": 203826, "epoch": 2455} {"train_loss": -24.308544158935547, "global_step": 203827, "epoch": 2455} {"train_loss": -24.250991821289062, "global_step": 203828, "epoch": 2455} {"train_loss": -24.178659439086914, "global_step": 203829, "epoch": 2455} {"train_loss": -24.003482818603516, "global_step": 203830, "epoch": 2455} {"train_loss": -24.02318572998047, "global_step": 203831, "epoch": 2455} {"train_loss": -23.560758590698242, "global_step": 203832, "epoch": 2455} {"train_loss": -24.260080337524414, "global_step": 203833, "epoch": 2455} {"train_loss": -24.340604782104492, "global_step": 203834, "epoch": 2455} {"train_loss": -24.224491119384766, "global_step": 203835, "epoch": 2455} {"train_loss": -24.03034210205078, "global_step": 203836, "epoch": 2455} {"train_loss": -24.18330955505371, "global_step": 203837, "epoch": 2455} {"train_loss": -24.383058547973633, "global_step": 203838, "epoch": 2455} {"train_loss": -24.203603744506836, "global_step": 203839, "epoch": 2455} {"train_loss": -24.07748794555664, "global_step": 203840, "epoch": 2455} {"train_loss": -24.4055233001709, "global_step": 203841, "epoch": 2455} {"train_loss": -24.248510360717773, "global_step": 203842, "epoch": 2455} {"train_loss": -23.849334716796875, "global_step": 203843, "epoch": 2455} {"train_loss": -24.474924087524414, "global_step": 203844, "epoch": 2455} {"train_loss": -24.403379440307617, "global_step": 203845, "epoch": 2455} {"train_loss": -24.22062873840332, "global_step": 203846, "epoch": 2455} {"train_loss": -24.10877673597221, "global_step": 203847, "epoch": 2455, "val_loss": 6810908.0} {"train_loss": -23.328481674194336, "global_step": 203848, "epoch": 2456} {"train_loss": -22.35370445251465, "global_step": 203849, "epoch": 2456} {"train_loss": -23.213180541992188, "global_step": 203850, "epoch": 2456} {"train_loss": -23.937122344970703, "global_step": 203851, "epoch": 2456} {"train_loss": -23.679731369018555, "global_step": 203852, "epoch": 2456} {"train_loss": -23.313730239868164, "global_step": 203853, "epoch": 2456} {"train_loss": -24.17505645751953, "global_step": 203854, "epoch": 2456} {"train_loss": -24.495874404907227, "global_step": 203855, "epoch": 2456} {"train_loss": -23.912588119506836, "global_step": 203856, "epoch": 2456} {"train_loss": -24.293323516845703, "global_step": 203857, "epoch": 2456} {"train_loss": -23.999361038208008, "global_step": 203858, "epoch": 2456} {"train_loss": -24.113672256469727, "global_step": 203859, "epoch": 2456} {"train_loss": -23.772262573242188, "global_step": 203860, "epoch": 2456} {"train_loss": -23.90362548828125, "global_step": 203861, "epoch": 2456} {"train_loss": -24.39723777770996, "global_step": 203862, "epoch": 2456} {"train_loss": -23.862472534179688, "global_step": 203863, "epoch": 2456} {"train_loss": -24.02933692932129, "global_step": 203864, "epoch": 2456} {"train_loss": -24.035507202148438, "global_step": 203865, "epoch": 2456} {"train_loss": -23.945209503173828, "global_step": 203866, "epoch": 2456} {"train_loss": -24.454381942749023, "global_step": 203867, "epoch": 2456} {"train_loss": -24.210737228393555, "global_step": 203868, "epoch": 2456} {"train_loss": -23.87067413330078, "global_step": 203869, "epoch": 2456} {"train_loss": -24.19451141357422, "global_step": 203870, "epoch": 2456} {"train_loss": -24.374576568603516, "global_step": 203871, "epoch": 2456} {"train_loss": -24.139745712280273, "global_step": 203872, "epoch": 2456} {"train_loss": -24.18397331237793, "global_step": 203873, "epoch": 2456} {"train_loss": -24.188217163085938, "global_step": 203874, "epoch": 2456} {"train_loss": -23.780813217163086, "global_step": 203875, "epoch": 2456} {"train_loss": -24.49763298034668, "global_step": 203876, "epoch": 2456} {"train_loss": -24.392295837402344, "global_step": 203877, "epoch": 2456} {"train_loss": -24.1804141998291, "global_step": 203878, "epoch": 2456} {"train_loss": -24.58223533630371, "global_step": 203879, "epoch": 2456} {"train_loss": -24.35045051574707, "global_step": 203880, "epoch": 2456} {"train_loss": -24.393712997436523, "global_step": 203881, "epoch": 2456} {"train_loss": -24.679962158203125, "global_step": 203882, "epoch": 2456} {"train_loss": -24.14446449279785, "global_step": 203883, "epoch": 2456} {"train_loss": -24.452362060546875, "global_step": 203884, "epoch": 2456} {"train_loss": -24.42831802368164, "global_step": 203885, "epoch": 2456} {"train_loss": -24.24542808532715, "global_step": 203886, "epoch": 2456} {"train_loss": -24.256412506103516, "global_step": 203887, "epoch": 2456} {"train_loss": -24.344581604003906, "global_step": 203888, "epoch": 2456} {"train_loss": -24.26857566833496, "global_step": 203889, "epoch": 2456} {"train_loss": -24.676116943359375, "global_step": 203890, "epoch": 2456} {"train_loss": -24.529638290405273, "global_step": 203891, "epoch": 2456} {"train_loss": -24.47266960144043, "global_step": 203892, "epoch": 2456} {"train_loss": -24.374454498291016, "global_step": 203893, "epoch": 2456} {"train_loss": -24.87649917602539, "global_step": 203894, "epoch": 2456} {"train_loss": -24.466947555541992, "global_step": 203895, "epoch": 2456} {"train_loss": -24.404617309570312, "global_step": 203896, "epoch": 2456} {"train_loss": -24.089527130126953, "global_step": 203897, "epoch": 2456} {"train_loss": -24.027698516845703, "global_step": 203898, "epoch": 2456} {"train_loss": -24.601343154907227, "global_step": 203899, "epoch": 2456} {"train_loss": -24.23018455505371, "global_step": 203900, "epoch": 2456} {"train_loss": -24.186914443969727, "global_step": 203901, "epoch": 2456} {"train_loss": -24.658740997314453, "global_step": 203902, "epoch": 2456} {"train_loss": -24.30866050720215, "global_step": 203903, "epoch": 2456} {"train_loss": -24.03545570373535, "global_step": 203904, "epoch": 2456} {"train_loss": -24.29522132873535, "global_step": 203905, "epoch": 2456} {"train_loss": -24.397686004638672, "global_step": 203906, "epoch": 2456} {"train_loss": -24.41721534729004, "global_step": 203907, "epoch": 2456} {"train_loss": -24.890188217163086, "global_step": 203908, "epoch": 2456} {"train_loss": -24.65716552734375, "global_step": 203909, "epoch": 2456} {"train_loss": -24.417699813842773, "global_step": 203910, "epoch": 2456} {"train_loss": -24.490856170654297, "global_step": 203911, "epoch": 2456} {"train_loss": -24.54163932800293, "global_step": 203912, "epoch": 2456} {"train_loss": -24.44019317626953, "global_step": 203913, "epoch": 2456} {"train_loss": -24.63935661315918, "global_step": 203914, "epoch": 2456} {"train_loss": -24.329492568969727, "global_step": 203915, "epoch": 2456} {"train_loss": -24.120750427246094, "global_step": 203916, "epoch": 2456} {"train_loss": -24.230701446533203, "global_step": 203917, "epoch": 2456} {"train_loss": -23.950063705444336, "global_step": 203918, "epoch": 2456} {"train_loss": -24.300230026245117, "global_step": 203919, "epoch": 2456} {"train_loss": -24.887935638427734, "global_step": 203920, "epoch": 2456} {"train_loss": -24.108354568481445, "global_step": 203921, "epoch": 2456} {"train_loss": -24.31510353088379, "global_step": 203922, "epoch": 2456} {"train_loss": -24.535873413085938, "global_step": 203923, "epoch": 2456} {"train_loss": -23.828895568847656, "global_step": 203924, "epoch": 2456} {"train_loss": -24.074750900268555, "global_step": 203925, "epoch": 2456} {"train_loss": -24.01932144165039, "global_step": 203926, "epoch": 2456} {"train_loss": -24.461233139038086, "global_step": 203927, "epoch": 2456} {"train_loss": -24.495468139648438, "global_step": 203928, "epoch": 2456} {"train_loss": -24.447681427001953, "global_step": 203929, "epoch": 2456} {"train_loss": -24.22634793476886, "global_step": 203930, "epoch": 2456, "val_loss": 6802164.0} {"train_loss": -24.049785614013672, "global_step": 203931, "epoch": 2457} {"train_loss": -23.91804313659668, "global_step": 203932, "epoch": 2457} {"train_loss": -23.728551864624023, "global_step": 203933, "epoch": 2457} {"train_loss": -23.872533798217773, "global_step": 203934, "epoch": 2457} {"train_loss": -24.47218132019043, "global_step": 203935, "epoch": 2457} {"train_loss": -23.8331356048584, "global_step": 203936, "epoch": 2457} {"train_loss": -23.81790542602539, "global_step": 203937, "epoch": 2457} {"train_loss": -24.19526481628418, "global_step": 203938, "epoch": 2457} {"train_loss": -24.076196670532227, "global_step": 203939, "epoch": 2457} {"train_loss": -24.050851821899414, "global_step": 203940, "epoch": 2457} {"train_loss": -23.70168113708496, "global_step": 203941, "epoch": 2457} {"train_loss": -23.710691452026367, "global_step": 203942, "epoch": 2457} {"train_loss": -24.033897399902344, "global_step": 203943, "epoch": 2457} {"train_loss": -23.959707260131836, "global_step": 203944, "epoch": 2457} {"train_loss": -24.17679214477539, "global_step": 203945, "epoch": 2457} {"train_loss": -24.067060470581055, "global_step": 203946, "epoch": 2457} {"train_loss": -23.911558151245117, "global_step": 203947, "epoch": 2457} {"train_loss": -24.064558029174805, "global_step": 203948, "epoch": 2457} {"train_loss": -23.806974411010742, "global_step": 203949, "epoch": 2457} {"train_loss": -24.078001022338867, "global_step": 203950, "epoch": 2457} {"train_loss": -23.974695205688477, "global_step": 203951, "epoch": 2457} {"train_loss": -24.417558670043945, "global_step": 203952, "epoch": 2457} {"train_loss": -24.292875289916992, "global_step": 203953, "epoch": 2457} {"train_loss": -23.977462768554688, "global_step": 203954, "epoch": 2457} {"train_loss": -23.546045303344727, "global_step": 203955, "epoch": 2457} {"train_loss": -23.997211456298828, "global_step": 203956, "epoch": 2457} {"train_loss": -24.112905502319336, "global_step": 203957, "epoch": 2457} {"train_loss": -24.091814041137695, "global_step": 203958, "epoch": 2457} {"train_loss": -23.85193634033203, "global_step": 203959, "epoch": 2457} {"train_loss": -24.138517379760742, "global_step": 203960, "epoch": 2457} {"train_loss": -24.006351470947266, "global_step": 203961, "epoch": 2457} {"train_loss": -24.2589168548584, "global_step": 203962, "epoch": 2457} {"train_loss": -24.347763061523438, "global_step": 203963, "epoch": 2457} {"train_loss": -24.40765953063965, "global_step": 203964, "epoch": 2457} {"train_loss": -24.67805290222168, "global_step": 203965, "epoch": 2457} {"train_loss": -24.2139892578125, "global_step": 203966, "epoch": 2457} {"train_loss": -24.463205337524414, "global_step": 203967, "epoch": 2457} {"train_loss": -24.34904670715332, "global_step": 203968, "epoch": 2457} {"train_loss": -24.00178337097168, "global_step": 203969, "epoch": 2457} {"train_loss": -24.554677963256836, "global_step": 203970, "epoch": 2457} {"train_loss": -24.14851951599121, "global_step": 203971, "epoch": 2457} {"train_loss": -24.588529586791992, "global_step": 203972, "epoch": 2457} {"train_loss": -24.185239791870117, "global_step": 203973, "epoch": 2457} {"train_loss": -24.276996612548828, "global_step": 203974, "epoch": 2457} {"train_loss": -24.173664093017578, "global_step": 203975, "epoch": 2457} {"train_loss": -24.321487426757812, "global_step": 203976, "epoch": 2457} {"train_loss": -24.42827796936035, "global_step": 203977, "epoch": 2457} {"train_loss": -24.385229110717773, "global_step": 203978, "epoch": 2457} {"train_loss": -24.17616081237793, "global_step": 203979, "epoch": 2457} {"train_loss": -24.407480239868164, "global_step": 203980, "epoch": 2457} {"train_loss": -24.06629180908203, "global_step": 203981, "epoch": 2457} {"train_loss": -24.63251304626465, "global_step": 203982, "epoch": 2457} {"train_loss": -24.17946434020996, "global_step": 203983, "epoch": 2457} {"train_loss": -24.428226470947266, "global_step": 203984, "epoch": 2457} {"train_loss": -24.85320472717285, "global_step": 203985, "epoch": 2457} {"train_loss": -24.1776180267334, "global_step": 203986, "epoch": 2457} {"train_loss": -24.393159866333008, "global_step": 203987, "epoch": 2457} {"train_loss": -24.287824630737305, "global_step": 203988, "epoch": 2457} {"train_loss": -24.507497787475586, "global_step": 203989, "epoch": 2457} {"train_loss": -24.493223190307617, "global_step": 203990, "epoch": 2457} {"train_loss": -24.082693099975586, "global_step": 203991, "epoch": 2457} {"train_loss": -24.39687156677246, "global_step": 203992, "epoch": 2457} {"train_loss": -24.519704818725586, "global_step": 203993, "epoch": 2457} {"train_loss": -24.521177291870117, "global_step": 203994, "epoch": 2457} {"train_loss": -24.12871742248535, "global_step": 203995, "epoch": 2457} {"train_loss": -24.250078201293945, "global_step": 203996, "epoch": 2457} {"train_loss": -24.356433868408203, "global_step": 203997, "epoch": 2457} {"train_loss": -24.413156509399414, "global_step": 203998, "epoch": 2457} {"train_loss": -24.211566925048828, "global_step": 203999, "epoch": 2457} {"train_loss": -24.213165283203125, "global_step": 204000, "epoch": 2457} {"train_loss": -24.372800827026367, "global_step": 204001, "epoch": 2457} {"train_loss": -23.777801513671875, "global_step": 204002, "epoch": 2457} {"train_loss": -24.463136672973633, "global_step": 204003, "epoch": 2457} {"train_loss": -24.2455997467041, "global_step": 204004, "epoch": 2457} {"train_loss": -23.957778930664062, "global_step": 204005, "epoch": 2457} {"train_loss": -24.340648651123047, "global_step": 204006, "epoch": 2457} {"train_loss": -24.150617599487305, "global_step": 204007, "epoch": 2457} {"train_loss": -24.10597038269043, "global_step": 204008, "epoch": 2457} {"train_loss": -24.441730499267578, "global_step": 204009, "epoch": 2457} {"train_loss": -23.876352310180664, "global_step": 204010, "epoch": 2457} {"train_loss": -23.8883056640625, "global_step": 204011, "epoch": 2457} {"train_loss": -24.05890464782715, "global_step": 204012, "epoch": 2457} {"train_loss": -24.20024733945548, "global_step": 204013, "epoch": 2457, "val_loss": 6662054.0} {"train_loss": -22.45081901550293, "global_step": 204014, "epoch": 2458} {"train_loss": -22.42131996154785, "global_step": 204015, "epoch": 2458} {"train_loss": -23.649015426635742, "global_step": 204016, "epoch": 2458} {"train_loss": -22.377849578857422, "global_step": 204017, "epoch": 2458} {"train_loss": -22.9533634185791, "global_step": 204018, "epoch": 2458} {"train_loss": -23.02443504333496, "global_step": 204019, "epoch": 2458} {"train_loss": -22.225540161132812, "global_step": 204020, "epoch": 2458} {"train_loss": -23.34390640258789, "global_step": 204021, "epoch": 2458} {"train_loss": -23.276811599731445, "global_step": 204022, "epoch": 2458} {"train_loss": -23.353124618530273, "global_step": 204023, "epoch": 2458} {"train_loss": -23.214536666870117, "global_step": 204024, "epoch": 2458} {"train_loss": -23.5676326751709, "global_step": 204025, "epoch": 2458} {"train_loss": -22.91266441345215, "global_step": 204026, "epoch": 2458} {"train_loss": -23.72733497619629, "global_step": 204027, "epoch": 2458} {"train_loss": -23.136383056640625, "global_step": 204028, "epoch": 2458} {"train_loss": -23.528308868408203, "global_step": 204029, "epoch": 2458} {"train_loss": -23.766035079956055, "global_step": 204030, "epoch": 2458} {"train_loss": -23.714111328125, "global_step": 204031, "epoch": 2458} {"train_loss": -23.7095947265625, "global_step": 204032, "epoch": 2458} {"train_loss": -23.812665939331055, "global_step": 204033, "epoch": 2458} {"train_loss": -23.909231185913086, "global_step": 204034, "epoch": 2458} {"train_loss": -23.74617576599121, "global_step": 204035, "epoch": 2458} {"train_loss": -23.736488342285156, "global_step": 204036, "epoch": 2458} {"train_loss": -24.217802047729492, "global_step": 204037, "epoch": 2458} {"train_loss": -24.228424072265625, "global_step": 204038, "epoch": 2458} {"train_loss": -23.900848388671875, "global_step": 204039, "epoch": 2458} {"train_loss": -23.774457931518555, "global_step": 204040, "epoch": 2458} {"train_loss": -24.30422019958496, "global_step": 204041, "epoch": 2458} {"train_loss": -24.20046615600586, "global_step": 204042, "epoch": 2458} {"train_loss": -24.287765502929688, "global_step": 204043, "epoch": 2458} {"train_loss": -24.017850875854492, "global_step": 204044, "epoch": 2458} {"train_loss": -24.067777633666992, "global_step": 204045, "epoch": 2458} {"train_loss": -24.208059310913086, "global_step": 204046, "epoch": 2458} {"train_loss": -23.926761627197266, "global_step": 204047, "epoch": 2458} {"train_loss": -24.46392822265625, "global_step": 204048, "epoch": 2458} {"train_loss": -24.268508911132812, "global_step": 204049, "epoch": 2458} {"train_loss": -24.45221519470215, "global_step": 204050, "epoch": 2458} {"train_loss": -24.438858032226562, "global_step": 204051, "epoch": 2458} {"train_loss": -24.316375732421875, "global_step": 204052, "epoch": 2458} {"train_loss": -24.666765213012695, "global_step": 204053, "epoch": 2458} {"train_loss": -24.2949161529541, "global_step": 204054, "epoch": 2458} {"train_loss": -24.134374618530273, "global_step": 204055, "epoch": 2458} {"train_loss": -24.243213653564453, "global_step": 204056, "epoch": 2458} {"train_loss": -24.65509033203125, "global_step": 204057, "epoch": 2458} {"train_loss": -24.62518882751465, "global_step": 204058, "epoch": 2458} {"train_loss": -24.102842330932617, "global_step": 204059, "epoch": 2458} {"train_loss": -24.43216323852539, "global_step": 204060, "epoch": 2458} {"train_loss": -24.25164222717285, "global_step": 204061, "epoch": 2458} {"train_loss": -24.45831298828125, "global_step": 204062, "epoch": 2458} {"train_loss": -24.04998779296875, "global_step": 204063, "epoch": 2458} {"train_loss": -24.631595611572266, "global_step": 204064, "epoch": 2458} {"train_loss": -24.554706573486328, "global_step": 204065, "epoch": 2458} {"train_loss": -24.317737579345703, "global_step": 204066, "epoch": 2458} {"train_loss": -24.517431259155273, "global_step": 204067, "epoch": 2458} {"train_loss": -24.57558250427246, "global_step": 204068, "epoch": 2458} {"train_loss": -24.403440475463867, "global_step": 204069, "epoch": 2458} {"train_loss": -24.1143741607666, "global_step": 204070, "epoch": 2458} {"train_loss": -24.52013397216797, "global_step": 204071, "epoch": 2458} {"train_loss": -24.174177169799805, "global_step": 204072, "epoch": 2458} {"train_loss": -24.634963989257812, "global_step": 204073, "epoch": 2458} {"train_loss": -24.699453353881836, "global_step": 204074, "epoch": 2458} {"train_loss": -24.622236251831055, "global_step": 204075, "epoch": 2458} {"train_loss": -24.690837860107422, "global_step": 204076, "epoch": 2458} {"train_loss": -24.602731704711914, "global_step": 204077, "epoch": 2458} {"train_loss": -24.084177017211914, "global_step": 204078, "epoch": 2458} {"train_loss": -24.58446502685547, "global_step": 204079, "epoch": 2458} {"train_loss": -24.44514274597168, "global_step": 204080, "epoch": 2458} {"train_loss": -24.291606903076172, "global_step": 204081, "epoch": 2458} {"train_loss": -24.268238067626953, "global_step": 204082, "epoch": 2458} {"train_loss": -24.353351593017578, "global_step": 204083, "epoch": 2458} {"train_loss": -24.375885009765625, "global_step": 204084, "epoch": 2458} {"train_loss": -24.450162887573242, "global_step": 204085, "epoch": 2458} {"train_loss": -24.276609420776367, "global_step": 204086, "epoch": 2458} {"train_loss": -24.17572593688965, "global_step": 204087, "epoch": 2458} {"train_loss": -24.500503540039062, "global_step": 204088, "epoch": 2458} {"train_loss": -24.328327178955078, "global_step": 204089, "epoch": 2458} {"train_loss": -23.982807159423828, "global_step": 204090, "epoch": 2458} {"train_loss": -24.23590660095215, "global_step": 204091, "epoch": 2458} {"train_loss": -24.40216064453125, "global_step": 204092, "epoch": 2458} {"train_loss": -24.189510345458984, "global_step": 204093, "epoch": 2458} {"train_loss": -24.39693832397461, "global_step": 204094, "epoch": 2458} {"train_loss": -24.27365493774414, "global_step": 204095, "epoch": 2458} {"train_loss": -24.033616881772698, "global_step": 204096, "epoch": 2458, "val_loss": 6470329.5} {"train_loss": -22.085142135620117, "global_step": 204097, "epoch": 2459} {"train_loss": -21.072967529296875, "global_step": 204098, "epoch": 2459} {"train_loss": -23.431623458862305, "global_step": 204099, "epoch": 2459} {"train_loss": -22.51608657836914, "global_step": 204100, "epoch": 2459} {"train_loss": -23.32581329345703, "global_step": 204101, "epoch": 2459} {"train_loss": -22.84463882446289, "global_step": 204102, "epoch": 2459} {"train_loss": -23.414493560791016, "global_step": 204103, "epoch": 2459} {"train_loss": -22.659780502319336, "global_step": 204104, "epoch": 2459} {"train_loss": -23.782073974609375, "global_step": 204105, "epoch": 2459} {"train_loss": -23.47237777709961, "global_step": 204106, "epoch": 2459} {"train_loss": -22.794818878173828, "global_step": 204107, "epoch": 2459} {"train_loss": -23.631439208984375, "global_step": 204108, "epoch": 2459} {"train_loss": -23.636674880981445, "global_step": 204109, "epoch": 2459} {"train_loss": -23.59797477722168, "global_step": 204110, "epoch": 2459} {"train_loss": -23.594879150390625, "global_step": 204111, "epoch": 2459} {"train_loss": -23.503150939941406, "global_step": 204112, "epoch": 2459} {"train_loss": -23.66966438293457, "global_step": 204113, "epoch": 2459} {"train_loss": -23.771656036376953, "global_step": 204114, "epoch": 2459} {"train_loss": -23.639190673828125, "global_step": 204115, "epoch": 2459} {"train_loss": -23.81235694885254, "global_step": 204116, "epoch": 2459} {"train_loss": -23.417804718017578, "global_step": 204117, "epoch": 2459} {"train_loss": -23.60910987854004, "global_step": 204118, "epoch": 2459} {"train_loss": -23.773000717163086, "global_step": 204119, "epoch": 2459} {"train_loss": -23.43201446533203, "global_step": 204120, "epoch": 2459} {"train_loss": -23.548473358154297, "global_step": 204121, "epoch": 2459} {"train_loss": -23.864669799804688, "global_step": 204122, "epoch": 2459} {"train_loss": -23.933326721191406, "global_step": 204123, "epoch": 2459} {"train_loss": -23.91402244567871, "global_step": 204124, "epoch": 2459} {"train_loss": -24.05491828918457, "global_step": 204125, "epoch": 2459} {"train_loss": -23.95195198059082, "global_step": 204126, "epoch": 2459} {"train_loss": -24.09429359436035, "global_step": 204127, "epoch": 2459} {"train_loss": -24.031442642211914, "global_step": 204128, "epoch": 2459} {"train_loss": -24.204267501831055, "global_step": 204129, "epoch": 2459} {"train_loss": -23.926740646362305, "global_step": 204130, "epoch": 2459} {"train_loss": -23.939207077026367, "global_step": 204131, "epoch": 2459} {"train_loss": -24.64725112915039, "global_step": 204132, "epoch": 2459} {"train_loss": -24.150609970092773, "global_step": 204133, "epoch": 2459} {"train_loss": -24.431669235229492, "global_step": 204134, "epoch": 2459} {"train_loss": -24.108137130737305, "global_step": 204135, "epoch": 2459} {"train_loss": -24.537418365478516, "global_step": 204136, "epoch": 2459} {"train_loss": -24.09307289123535, "global_step": 204137, "epoch": 2459} {"train_loss": -24.30304527282715, "global_step": 204138, "epoch": 2459} {"train_loss": -24.38954734802246, "global_step": 204139, "epoch": 2459} {"train_loss": -24.29286766052246, "global_step": 204140, "epoch": 2459} {"train_loss": -24.464534759521484, "global_step": 204141, "epoch": 2459} {"train_loss": -24.228763580322266, "global_step": 204142, "epoch": 2459} {"train_loss": -24.29130744934082, "global_step": 204143, "epoch": 2459} {"train_loss": -24.679855346679688, "global_step": 204144, "epoch": 2459} {"train_loss": -24.531890869140625, "global_step": 204145, "epoch": 2459} {"train_loss": -24.38395118713379, "global_step": 204146, "epoch": 2459} {"train_loss": -24.62420654296875, "global_step": 204147, "epoch": 2459} {"train_loss": -24.340219497680664, "global_step": 204148, "epoch": 2459} {"train_loss": -24.48748779296875, "global_step": 204149, "epoch": 2459} {"train_loss": -24.38396453857422, "global_step": 204150, "epoch": 2459} {"train_loss": -24.623647689819336, "global_step": 204151, "epoch": 2459} {"train_loss": -24.406267166137695, "global_step": 204152, "epoch": 2459} {"train_loss": -24.52248191833496, "global_step": 204153, "epoch": 2459} {"train_loss": -24.688905715942383, "global_step": 204154, "epoch": 2459} {"train_loss": -24.34759521484375, "global_step": 204155, "epoch": 2459} {"train_loss": -24.25799560546875, "global_step": 204156, "epoch": 2459} {"train_loss": -24.1756591796875, "global_step": 204157, "epoch": 2459} {"train_loss": -24.103361129760742, "global_step": 204158, "epoch": 2459} {"train_loss": -24.53628921508789, "global_step": 204159, "epoch": 2459} {"train_loss": -24.358415603637695, "global_step": 204160, "epoch": 2459} {"train_loss": -24.29886817932129, "global_step": 204161, "epoch": 2459} {"train_loss": -24.468767166137695, "global_step": 204162, "epoch": 2459} {"train_loss": -24.286535263061523, "global_step": 204163, "epoch": 2459} {"train_loss": -24.7813663482666, "global_step": 204164, "epoch": 2459} {"train_loss": -24.594343185424805, "global_step": 204165, "epoch": 2459} {"train_loss": -24.560108184814453, "global_step": 204166, "epoch": 2459} {"train_loss": -24.737409591674805, "global_step": 204167, "epoch": 2459} {"train_loss": -24.254667282104492, "global_step": 204168, "epoch": 2459} {"train_loss": -24.261016845703125, "global_step": 204169, "epoch": 2459} {"train_loss": -24.12337303161621, "global_step": 204170, "epoch": 2459} {"train_loss": -24.415206909179688, "global_step": 204171, "epoch": 2459} {"train_loss": -24.45819854736328, "global_step": 204172, "epoch": 2459} {"train_loss": -23.80621910095215, "global_step": 204173, "epoch": 2459} {"train_loss": -24.551122665405273, "global_step": 204174, "epoch": 2459} {"train_loss": -24.156410217285156, "global_step": 204175, "epoch": 2459} {"train_loss": -24.39759635925293, "global_step": 204176, "epoch": 2459} {"train_loss": -24.63730812072754, "global_step": 204177, "epoch": 2459} {"train_loss": -24.6660213470459, "global_step": 204178, "epoch": 2459} {"train_loss": -24.009119884077325, "global_step": 204179, "epoch": 2459, "val_loss": 6390690.0} {"train_loss": -24.40571403503418, "global_step": 204180, "epoch": 2460} {"train_loss": -23.701852798461914, "global_step": 204181, "epoch": 2460} {"train_loss": -24.067276000976562, "global_step": 204182, "epoch": 2460} {"train_loss": -23.36226463317871, "global_step": 204183, "epoch": 2460} {"train_loss": -23.99114990234375, "global_step": 204184, "epoch": 2460} {"train_loss": -23.555356979370117, "global_step": 204185, "epoch": 2460} {"train_loss": -23.61117935180664, "global_step": 204186, "epoch": 2460} {"train_loss": -23.580188751220703, "global_step": 204187, "epoch": 2460} {"train_loss": -23.827468872070312, "global_step": 204188, "epoch": 2460} {"train_loss": -23.58998680114746, "global_step": 204189, "epoch": 2460} {"train_loss": -24.035032272338867, "global_step": 204190, "epoch": 2460} {"train_loss": -23.66335678100586, "global_step": 204191, "epoch": 2460} {"train_loss": -24.29837417602539, "global_step": 204192, "epoch": 2460} {"train_loss": -24.108245849609375, "global_step": 204193, "epoch": 2460} {"train_loss": -24.427207946777344, "global_step": 204194, "epoch": 2460} {"train_loss": -23.96551513671875, "global_step": 204195, "epoch": 2460} {"train_loss": -24.312271118164062, "global_step": 204196, "epoch": 2460} {"train_loss": -24.061986923217773, "global_step": 204197, "epoch": 2460} {"train_loss": -24.233625411987305, "global_step": 204198, "epoch": 2460} {"train_loss": -24.153818130493164, "global_step": 204199, "epoch": 2460} {"train_loss": -24.3147029876709, "global_step": 204200, "epoch": 2460} {"train_loss": -24.11661720275879, "global_step": 204201, "epoch": 2460} {"train_loss": -24.36763572692871, "global_step": 204202, "epoch": 2460} {"train_loss": -24.459692001342773, "global_step": 204203, "epoch": 2460} {"train_loss": -24.4960994720459, "global_step": 204204, "epoch": 2460} {"train_loss": -24.105878829956055, "global_step": 204205, "epoch": 2460} {"train_loss": -24.31686019897461, "global_step": 204206, "epoch": 2460} {"train_loss": -24.38134765625, "global_step": 204207, "epoch": 2460} {"train_loss": -24.104738235473633, "global_step": 204208, "epoch": 2460} {"train_loss": -24.39743995666504, "global_step": 204209, "epoch": 2460} {"train_loss": -24.001819610595703, "global_step": 204210, "epoch": 2460} {"train_loss": -24.499067306518555, "global_step": 204211, "epoch": 2460} {"train_loss": -24.174436569213867, "global_step": 204212, "epoch": 2460} {"train_loss": -24.32088279724121, "global_step": 204213, "epoch": 2460} {"train_loss": -24.54261589050293, "global_step": 204214, "epoch": 2460} {"train_loss": -24.661819458007812, "global_step": 204215, "epoch": 2460} {"train_loss": -24.269994735717773, "global_step": 204216, "epoch": 2460} {"train_loss": -24.63071060180664, "global_step": 204217, "epoch": 2460} {"train_loss": -24.712438583374023, "global_step": 204218, "epoch": 2460} {"train_loss": -24.5263729095459, "global_step": 204219, "epoch": 2460} {"train_loss": -24.135395050048828, "global_step": 204220, "epoch": 2460} {"train_loss": -24.517786026000977, "global_step": 204221, "epoch": 2460} {"train_loss": -24.446063995361328, "global_step": 204222, "epoch": 2460} {"train_loss": -24.36594009399414, "global_step": 204223, "epoch": 2460} {"train_loss": -24.40130615234375, "global_step": 204224, "epoch": 2460} {"train_loss": -24.539350509643555, "global_step": 204225, "epoch": 2460} {"train_loss": -23.99214744567871, "global_step": 204226, "epoch": 2460} {"train_loss": -24.40754508972168, "global_step": 204227, "epoch": 2460} {"train_loss": -24.531118392944336, "global_step": 204228, "epoch": 2460} {"train_loss": -23.972923278808594, "global_step": 204229, "epoch": 2460} {"train_loss": -23.569869995117188, "global_step": 204230, "epoch": 2460} {"train_loss": -23.866552352905273, "global_step": 204231, "epoch": 2460} {"train_loss": -24.153244018554688, "global_step": 204232, "epoch": 2460} {"train_loss": -24.062705993652344, "global_step": 204233, "epoch": 2460} {"train_loss": -24.220327377319336, "global_step": 204234, "epoch": 2460} {"train_loss": -23.841447830200195, "global_step": 204235, "epoch": 2460} {"train_loss": -23.70147132873535, "global_step": 204236, "epoch": 2460} {"train_loss": -23.99237632751465, "global_step": 204237, "epoch": 2460} {"train_loss": -23.563217163085938, "global_step": 204238, "epoch": 2460} {"train_loss": -24.04914093017578, "global_step": 204239, "epoch": 2460} {"train_loss": -23.964481353759766, "global_step": 204240, "epoch": 2460} {"train_loss": -23.443565368652344, "global_step": 204241, "epoch": 2460} {"train_loss": -23.90555191040039, "global_step": 204242, "epoch": 2460} {"train_loss": -23.788599014282227, "global_step": 204243, "epoch": 2460} {"train_loss": -23.623462677001953, "global_step": 204244, "epoch": 2460} {"train_loss": -24.429365158081055, "global_step": 204245, "epoch": 2460} {"train_loss": -23.658964157104492, "global_step": 204246, "epoch": 2460} {"train_loss": -23.958553314208984, "global_step": 204247, "epoch": 2460} {"train_loss": -23.79136085510254, "global_step": 204248, "epoch": 2460} {"train_loss": -24.454544067382812, "global_step": 204249, "epoch": 2460} {"train_loss": -24.446630477905273, "global_step": 204250, "epoch": 2460} {"train_loss": -23.827558517456055, "global_step": 204251, "epoch": 2460} {"train_loss": -23.951913833618164, "global_step": 204252, "epoch": 2460} {"train_loss": -24.109729766845703, "global_step": 204253, "epoch": 2460} {"train_loss": -24.326688766479492, "global_step": 204254, "epoch": 2460} {"train_loss": -23.91829490661621, "global_step": 204255, "epoch": 2460} {"train_loss": -24.21340560913086, "global_step": 204256, "epoch": 2460} {"train_loss": -24.012556076049805, "global_step": 204257, "epoch": 2460} {"train_loss": -24.234214782714844, "global_step": 204258, "epoch": 2460} {"train_loss": -24.19866943359375, "global_step": 204259, "epoch": 2460} {"train_loss": -24.4665584564209, "global_step": 204260, "epoch": 2460} {"train_loss": -24.352725982666016, "global_step": 204261, "epoch": 2460} {"train_loss": -24.122305881546204, "global_step": 204262, "epoch": 2460, "val_loss": 6615475.0} {"train_loss": -24.014591217041016, "global_step": 204263, "epoch": 2461} {"train_loss": -24.51650047302246, "global_step": 204264, "epoch": 2461} {"train_loss": -24.021242141723633, "global_step": 204265, "epoch": 2461} {"train_loss": -23.935895919799805, "global_step": 204266, "epoch": 2461} {"train_loss": -24.209827423095703, "global_step": 204267, "epoch": 2461} {"train_loss": -23.739999771118164, "global_step": 204268, "epoch": 2461} {"train_loss": -23.769699096679688, "global_step": 204269, "epoch": 2461} {"train_loss": -24.09532356262207, "global_step": 204270, "epoch": 2461} {"train_loss": -24.22702407836914, "global_step": 204271, "epoch": 2461} {"train_loss": -23.842166900634766, "global_step": 204272, "epoch": 2461} {"train_loss": -24.100358963012695, "global_step": 204273, "epoch": 2461} {"train_loss": -23.82179832458496, "global_step": 204274, "epoch": 2461} {"train_loss": -23.798221588134766, "global_step": 204275, "epoch": 2461} {"train_loss": -24.04974365234375, "global_step": 204276, "epoch": 2461} {"train_loss": -24.29182243347168, "global_step": 204277, "epoch": 2461} {"train_loss": -24.213638305664062, "global_step": 204278, "epoch": 2461} {"train_loss": -24.02703857421875, "global_step": 204279, "epoch": 2461} {"train_loss": -24.236326217651367, "global_step": 204280, "epoch": 2461} {"train_loss": -24.03221893310547, "global_step": 204281, "epoch": 2461} {"train_loss": -24.365402221679688, "global_step": 204282, "epoch": 2461} {"train_loss": -24.550357818603516, "global_step": 204283, "epoch": 2461} {"train_loss": -23.9969539642334, "global_step": 204284, "epoch": 2461} {"train_loss": -24.335540771484375, "global_step": 204285, "epoch": 2461} {"train_loss": -23.942914962768555, "global_step": 204286, "epoch": 2461} {"train_loss": -24.161645889282227, "global_step": 204287, "epoch": 2461} {"train_loss": -24.06943130493164, "global_step": 204288, "epoch": 2461} {"train_loss": -24.271240234375, "global_step": 204289, "epoch": 2461} {"train_loss": -24.417871475219727, "global_step": 204290, "epoch": 2461} {"train_loss": -24.13860511779785, "global_step": 204291, "epoch": 2461} {"train_loss": -24.13286781311035, "global_step": 204292, "epoch": 2461} {"train_loss": -24.471097946166992, "global_step": 204293, "epoch": 2461} {"train_loss": -24.11899757385254, "global_step": 204294, "epoch": 2461} {"train_loss": -24.42043685913086, "global_step": 204295, "epoch": 2461} {"train_loss": -24.205015182495117, "global_step": 204296, "epoch": 2461} {"train_loss": -24.31807518005371, "global_step": 204297, "epoch": 2461} {"train_loss": -24.1743221282959, "global_step": 204298, "epoch": 2461} {"train_loss": -24.068265914916992, "global_step": 204299, "epoch": 2461} {"train_loss": -24.490360260009766, "global_step": 204300, "epoch": 2461} {"train_loss": -24.099302291870117, "global_step": 204301, "epoch": 2461} {"train_loss": -24.19722557067871, "global_step": 204302, "epoch": 2461} {"train_loss": -24.441408157348633, "global_step": 204303, "epoch": 2461} {"train_loss": -24.20454216003418, "global_step": 204304, "epoch": 2461} {"train_loss": -24.316858291625977, "global_step": 204305, "epoch": 2461} {"train_loss": -24.461734771728516, "global_step": 204306, "epoch": 2461} {"train_loss": -24.34367561340332, "global_step": 204307, "epoch": 2461} {"train_loss": -24.428829193115234, "global_step": 204308, "epoch": 2461} {"train_loss": -24.430025100708008, "global_step": 204309, "epoch": 2461} {"train_loss": -24.1646728515625, "global_step": 204310, "epoch": 2461} {"train_loss": -24.55220603942871, "global_step": 204311, "epoch": 2461} {"train_loss": -24.1342716217041, "global_step": 204312, "epoch": 2461} {"train_loss": -24.58819580078125, "global_step": 204313, "epoch": 2461} {"train_loss": -24.09705924987793, "global_step": 204314, "epoch": 2461} {"train_loss": -24.479522705078125, "global_step": 204315, "epoch": 2461} {"train_loss": -24.249008178710938, "global_step": 204316, "epoch": 2461} {"train_loss": -24.3599853515625, "global_step": 204317, "epoch": 2461} {"train_loss": -24.774442672729492, "global_step": 204318, "epoch": 2461} {"train_loss": -24.26566505432129, "global_step": 204319, "epoch": 2461} {"train_loss": -24.123645782470703, "global_step": 204320, "epoch": 2461} {"train_loss": -24.261459350585938, "global_step": 204321, "epoch": 2461} {"train_loss": -24.11512565612793, "global_step": 204322, "epoch": 2461} {"train_loss": -24.44631576538086, "global_step": 204323, "epoch": 2461} {"train_loss": -24.507484436035156, "global_step": 204324, "epoch": 2461} {"train_loss": -24.323705673217773, "global_step": 204325, "epoch": 2461} {"train_loss": -24.370588302612305, "global_step": 204326, "epoch": 2461} {"train_loss": -24.39841079711914, "global_step": 204327, "epoch": 2461} {"train_loss": -24.14768409729004, "global_step": 204328, "epoch": 2461} {"train_loss": -24.168472290039062, "global_step": 204329, "epoch": 2461} {"train_loss": -24.799152374267578, "global_step": 204330, "epoch": 2461} {"train_loss": -24.60022735595703, "global_step": 204331, "epoch": 2461} {"train_loss": -24.362144470214844, "global_step": 204332, "epoch": 2461} {"train_loss": -24.796592712402344, "global_step": 204333, "epoch": 2461} {"train_loss": -24.541051864624023, "global_step": 204334, "epoch": 2461} {"train_loss": -24.199995040893555, "global_step": 204335, "epoch": 2461} {"train_loss": -24.337522506713867, "global_step": 204336, "epoch": 2461} {"train_loss": -24.191495895385742, "global_step": 204337, "epoch": 2461} {"train_loss": -24.537694931030273, "global_step": 204338, "epoch": 2461} {"train_loss": -24.00568199157715, "global_step": 204339, "epoch": 2461} {"train_loss": -24.6143798828125, "global_step": 204340, "epoch": 2461} {"train_loss": -24.57781219482422, "global_step": 204341, "epoch": 2461} {"train_loss": -24.773334503173828, "global_step": 204342, "epoch": 2461} {"train_loss": -24.629892349243164, "global_step": 204343, "epoch": 2461} {"train_loss": -24.816125869750977, "global_step": 204344, "epoch": 2461} {"train_loss": -24.277019914374293, "global_step": 204345, "epoch": 2461, "val_loss": 6495806.0} {"train_loss": -23.849138259887695, "global_step": 204346, "epoch": 2462} {"train_loss": -24.412309646606445, "global_step": 204347, "epoch": 2462} {"train_loss": -23.98511505126953, "global_step": 204348, "epoch": 2462} {"train_loss": -24.211015701293945, "global_step": 204349, "epoch": 2462} {"train_loss": -23.8172607421875, "global_step": 204350, "epoch": 2462} {"train_loss": -23.877098083496094, "global_step": 204351, "epoch": 2462} {"train_loss": -24.02164077758789, "global_step": 204352, "epoch": 2462} {"train_loss": -24.009122848510742, "global_step": 204353, "epoch": 2462} {"train_loss": -23.862884521484375, "global_step": 204354, "epoch": 2462} {"train_loss": -24.433698654174805, "global_step": 204355, "epoch": 2462} {"train_loss": -24.153478622436523, "global_step": 204356, "epoch": 2462} {"train_loss": -23.75801658630371, "global_step": 204357, "epoch": 2462} {"train_loss": -24.497608184814453, "global_step": 204358, "epoch": 2462} {"train_loss": -24.317380905151367, "global_step": 204359, "epoch": 2462} {"train_loss": -23.87921714782715, "global_step": 204360, "epoch": 2462} {"train_loss": -24.602930068969727, "global_step": 204361, "epoch": 2462} {"train_loss": -24.276363372802734, "global_step": 204362, "epoch": 2462} {"train_loss": -23.896085739135742, "global_step": 204363, "epoch": 2462} {"train_loss": -23.829296112060547, "global_step": 204364, "epoch": 2462} {"train_loss": -24.02345085144043, "global_step": 204365, "epoch": 2462} {"train_loss": -24.114423751831055, "global_step": 204366, "epoch": 2462} {"train_loss": -24.372913360595703, "global_step": 204367, "epoch": 2462} {"train_loss": -24.188369750976562, "global_step": 204368, "epoch": 2462} {"train_loss": -24.731191635131836, "global_step": 204369, "epoch": 2462} {"train_loss": -23.664648056030273, "global_step": 204370, "epoch": 2462} {"train_loss": -24.296329498291016, "global_step": 204371, "epoch": 2462} {"train_loss": -24.25327491760254, "global_step": 204372, "epoch": 2462} {"train_loss": -24.20735740661621, "global_step": 204373, "epoch": 2462} {"train_loss": -24.38706398010254, "global_step": 204374, "epoch": 2462} {"train_loss": -24.070812225341797, "global_step": 204375, "epoch": 2462} {"train_loss": -24.3555850982666, "global_step": 204376, "epoch": 2462} {"train_loss": -24.448301315307617, "global_step": 204377, "epoch": 2462} {"train_loss": -24.696147918701172, "global_step": 204378, "epoch": 2462} {"train_loss": -24.397293090820312, "global_step": 204379, "epoch": 2462} {"train_loss": -24.331039428710938, "global_step": 204380, "epoch": 2462} {"train_loss": -24.570453643798828, "global_step": 204381, "epoch": 2462} {"train_loss": -24.529691696166992, "global_step": 204382, "epoch": 2462} {"train_loss": -24.285165786743164, "global_step": 204383, "epoch": 2462} {"train_loss": -24.26960563659668, "global_step": 204384, "epoch": 2462} {"train_loss": -24.194461822509766, "global_step": 204385, "epoch": 2462} {"train_loss": -24.262582778930664, "global_step": 204386, "epoch": 2462} {"train_loss": -24.311298370361328, "global_step": 204387, "epoch": 2462} {"train_loss": -24.51143455505371, "global_step": 204388, "epoch": 2462} {"train_loss": -24.228382110595703, "global_step": 204389, "epoch": 2462} {"train_loss": -24.251953125, "global_step": 204390, "epoch": 2462} {"train_loss": -24.63655662536621, "global_step": 204391, "epoch": 2462} {"train_loss": -24.228839874267578, "global_step": 204392, "epoch": 2462} {"train_loss": -24.441774368286133, "global_step": 204393, "epoch": 2462} {"train_loss": -24.0983943939209, "global_step": 204394, "epoch": 2462} {"train_loss": -24.54227066040039, "global_step": 204395, "epoch": 2462} {"train_loss": -24.622760772705078, "global_step": 204396, "epoch": 2462} {"train_loss": -24.385135650634766, "global_step": 204397, "epoch": 2462} {"train_loss": -24.33994483947754, "global_step": 204398, "epoch": 2462} {"train_loss": -24.55942726135254, "global_step": 204399, "epoch": 2462} {"train_loss": -24.476741790771484, "global_step": 204400, "epoch": 2462} {"train_loss": -24.496238708496094, "global_step": 204401, "epoch": 2462} {"train_loss": -24.40667724609375, "global_step": 204402, "epoch": 2462} {"train_loss": -24.416900634765625, "global_step": 204403, "epoch": 2462} {"train_loss": -24.715478897094727, "global_step": 204404, "epoch": 2462} {"train_loss": -24.410612106323242, "global_step": 204405, "epoch": 2462} {"train_loss": -24.28822898864746, "global_step": 204406, "epoch": 2462} {"train_loss": -24.499975204467773, "global_step": 204407, "epoch": 2462} {"train_loss": -24.19512939453125, "global_step": 204408, "epoch": 2462} {"train_loss": -24.547948837280273, "global_step": 204409, "epoch": 2462} {"train_loss": -24.246383666992188, "global_step": 204410, "epoch": 2462} {"train_loss": -24.055219650268555, "global_step": 204411, "epoch": 2462} {"train_loss": -24.434499740600586, "global_step": 204412, "epoch": 2462} {"train_loss": -24.535600662231445, "global_step": 204413, "epoch": 2462} {"train_loss": -24.728788375854492, "global_step": 204414, "epoch": 2462} {"train_loss": -24.17340087890625, "global_step": 204415, "epoch": 2462} {"train_loss": -24.22295570373535, "global_step": 204416, "epoch": 2462} {"train_loss": -24.338071823120117, "global_step": 204417, "epoch": 2462} {"train_loss": -24.4044132232666, "global_step": 204418, "epoch": 2462} {"train_loss": -24.26267433166504, "global_step": 204419, "epoch": 2462} {"train_loss": -24.463930130004883, "global_step": 204420, "epoch": 2462} {"train_loss": -24.343427658081055, "global_step": 204421, "epoch": 2462} {"train_loss": -24.89857292175293, "global_step": 204422, "epoch": 2462} {"train_loss": -24.680803298950195, "global_step": 204423, "epoch": 2462} {"train_loss": -24.485376358032227, "global_step": 204424, "epoch": 2462} {"train_loss": -24.834989547729492, "global_step": 204425, "epoch": 2462} {"train_loss": -24.1573429107666, "global_step": 204426, "epoch": 2462} {"train_loss": -24.31341552734375, "global_step": 204427, "epoch": 2462} {"train_loss": -24.313424052962336, "global_step": 204428, "epoch": 2462, "val_loss": 6691478.5} {"train_loss": -23.992294311523438, "global_step": 204429, "epoch": 2463} {"train_loss": -23.863914489746094, "global_step": 204430, "epoch": 2463} {"train_loss": -24.290517807006836, "global_step": 204431, "epoch": 2463} {"train_loss": -24.244937896728516, "global_step": 204432, "epoch": 2463} {"train_loss": -24.106298446655273, "global_step": 204433, "epoch": 2463} {"train_loss": -23.9814395904541, "global_step": 204434, "epoch": 2463} {"train_loss": -24.361902236938477, "global_step": 204435, "epoch": 2463} {"train_loss": -24.194351196289062, "global_step": 204436, "epoch": 2463} {"train_loss": -23.94349479675293, "global_step": 204437, "epoch": 2463} {"train_loss": -24.387136459350586, "global_step": 204438, "epoch": 2463} {"train_loss": -23.912662506103516, "global_step": 204439, "epoch": 2463} {"train_loss": -24.415868759155273, "global_step": 204440, "epoch": 2463} {"train_loss": -24.19080924987793, "global_step": 204441, "epoch": 2463} {"train_loss": -24.52437400817871, "global_step": 204442, "epoch": 2463} {"train_loss": -24.465478897094727, "global_step": 204443, "epoch": 2463} {"train_loss": -24.345645904541016, "global_step": 204444, "epoch": 2463} {"train_loss": -24.380064010620117, "global_step": 204445, "epoch": 2463} {"train_loss": -24.198598861694336, "global_step": 204446, "epoch": 2463} {"train_loss": -24.26808738708496, "global_step": 204447, "epoch": 2463} {"train_loss": -24.462072372436523, "global_step": 204448, "epoch": 2463} {"train_loss": -24.23409080505371, "global_step": 204449, "epoch": 2463} {"train_loss": -24.00759506225586, "global_step": 204450, "epoch": 2463} {"train_loss": -24.17689323425293, "global_step": 204451, "epoch": 2463} {"train_loss": -24.04061508178711, "global_step": 204452, "epoch": 2463} {"train_loss": -23.916440963745117, "global_step": 204453, "epoch": 2463} {"train_loss": -24.419492721557617, "global_step": 204454, "epoch": 2463} {"train_loss": -24.025386810302734, "global_step": 204455, "epoch": 2463} {"train_loss": -24.109750747680664, "global_step": 204456, "epoch": 2463} {"train_loss": -24.076351165771484, "global_step": 204457, "epoch": 2463} {"train_loss": -24.155630111694336, "global_step": 204458, "epoch": 2463} {"train_loss": -24.34040069580078, "global_step": 204459, "epoch": 2463} {"train_loss": -24.724044799804688, "global_step": 204460, "epoch": 2463} {"train_loss": -24.34684944152832, "global_step": 204461, "epoch": 2463} {"train_loss": -24.28997230529785, "global_step": 204462, "epoch": 2463} {"train_loss": -24.600875854492188, "global_step": 204463, "epoch": 2463} {"train_loss": -24.12839126586914, "global_step": 204464, "epoch": 2463} {"train_loss": -24.336191177368164, "global_step": 204465, "epoch": 2463} {"train_loss": -24.664562225341797, "global_step": 204466, "epoch": 2463} {"train_loss": -24.278366088867188, "global_step": 204467, "epoch": 2463} {"train_loss": -24.08704948425293, "global_step": 204468, "epoch": 2463} {"train_loss": -24.801753997802734, "global_step": 204469, "epoch": 2463} {"train_loss": -24.374666213989258, "global_step": 204470, "epoch": 2463} {"train_loss": -24.431838989257812, "global_step": 204471, "epoch": 2463} {"train_loss": -24.53175926208496, "global_step": 204472, "epoch": 2463} {"train_loss": -24.514877319335938, "global_step": 204473, "epoch": 2463} {"train_loss": -24.40509605407715, "global_step": 204474, "epoch": 2463} {"train_loss": -24.46870994567871, "global_step": 204475, "epoch": 2463} {"train_loss": -24.274490356445312, "global_step": 204476, "epoch": 2463} {"train_loss": -24.534183502197266, "global_step": 204477, "epoch": 2463} {"train_loss": -24.4255428314209, "global_step": 204478, "epoch": 2463} {"train_loss": -24.319805145263672, "global_step": 204479, "epoch": 2463} {"train_loss": -24.431730270385742, "global_step": 204480, "epoch": 2463} {"train_loss": -24.643936157226562, "global_step": 204481, "epoch": 2463} {"train_loss": -24.109176635742188, "global_step": 204482, "epoch": 2463} {"train_loss": -24.16375732421875, "global_step": 204483, "epoch": 2463} {"train_loss": -24.25524139404297, "global_step": 204484, "epoch": 2463} {"train_loss": -24.260290145874023, "global_step": 204485, "epoch": 2463} {"train_loss": -24.199663162231445, "global_step": 204486, "epoch": 2463} {"train_loss": -24.30303955078125, "global_step": 204487, "epoch": 2463} {"train_loss": -24.327783584594727, "global_step": 204488, "epoch": 2463} {"train_loss": -24.419708251953125, "global_step": 204489, "epoch": 2463} {"train_loss": -23.890291213989258, "global_step": 204490, "epoch": 2463} {"train_loss": -24.48985481262207, "global_step": 204491, "epoch": 2463} {"train_loss": -24.27153778076172, "global_step": 204492, "epoch": 2463} {"train_loss": -24.43568992614746, "global_step": 204493, "epoch": 2463} {"train_loss": -24.770971298217773, "global_step": 204494, "epoch": 2463} {"train_loss": -24.522565841674805, "global_step": 204495, "epoch": 2463} {"train_loss": -24.012798309326172, "global_step": 204496, "epoch": 2463} {"train_loss": -24.395090103149414, "global_step": 204497, "epoch": 2463} {"train_loss": -24.31049346923828, "global_step": 204498, "epoch": 2463} {"train_loss": -24.37860107421875, "global_step": 204499, "epoch": 2463} {"train_loss": -24.343862533569336, "global_step": 204500, "epoch": 2463} {"train_loss": -24.38578987121582, "global_step": 204501, "epoch": 2463} {"train_loss": -24.454526901245117, "global_step": 204502, "epoch": 2463} {"train_loss": -23.722463607788086, "global_step": 204503, "epoch": 2463} {"train_loss": -24.198078155517578, "global_step": 204504, "epoch": 2463} {"train_loss": -24.84136962890625, "global_step": 204505, "epoch": 2463} {"train_loss": -24.327239990234375, "global_step": 204506, "epoch": 2463} {"train_loss": -24.3646240234375, "global_step": 204507, "epoch": 2463} {"train_loss": -24.482080459594727, "global_step": 204508, "epoch": 2463} {"train_loss": -24.043750762939453, "global_step": 204509, "epoch": 2463} {"train_loss": -24.66704750061035, "global_step": 204510, "epoch": 2463} {"train_loss": -24.30009021529232, "global_step": 204511, "epoch": 2463, "val_loss": 6588726.5} {"train_loss": -24.38353157043457, "global_step": 204512, "epoch": 2464} {"train_loss": -24.16265106201172, "global_step": 204513, "epoch": 2464} {"train_loss": -24.45464515686035, "global_step": 204514, "epoch": 2464} {"train_loss": -24.019073486328125, "global_step": 204515, "epoch": 2464} {"train_loss": -24.198047637939453, "global_step": 204516, "epoch": 2464} {"train_loss": -24.15183448791504, "global_step": 204517, "epoch": 2464} {"train_loss": -24.340436935424805, "global_step": 204518, "epoch": 2464} {"train_loss": -23.516706466674805, "global_step": 204519, "epoch": 2464} {"train_loss": -24.432920455932617, "global_step": 204520, "epoch": 2464} {"train_loss": -23.990692138671875, "global_step": 204521, "epoch": 2464} {"train_loss": -24.378070831298828, "global_step": 204522, "epoch": 2464} {"train_loss": -23.899656295776367, "global_step": 204523, "epoch": 2464} {"train_loss": -23.95477294921875, "global_step": 204524, "epoch": 2464} {"train_loss": -23.86067771911621, "global_step": 204525, "epoch": 2464} {"train_loss": -24.254919052124023, "global_step": 204526, "epoch": 2464} {"train_loss": -24.34264373779297, "global_step": 204527, "epoch": 2464} {"train_loss": -24.148235321044922, "global_step": 204528, "epoch": 2464} {"train_loss": -24.284055709838867, "global_step": 204529, "epoch": 2464} {"train_loss": -24.266447067260742, "global_step": 204530, "epoch": 2464} {"train_loss": -24.094511032104492, "global_step": 204531, "epoch": 2464} {"train_loss": -24.222013473510742, "global_step": 204532, "epoch": 2464} {"train_loss": -24.184846878051758, "global_step": 204533, "epoch": 2464} {"train_loss": -24.65647315979004, "global_step": 204534, "epoch": 2464} {"train_loss": -24.428382873535156, "global_step": 204535, "epoch": 2464} {"train_loss": -24.362117767333984, "global_step": 204536, "epoch": 2464} {"train_loss": -24.620359420776367, "global_step": 204537, "epoch": 2464} {"train_loss": -24.466405868530273, "global_step": 204538, "epoch": 2464} {"train_loss": -24.359201431274414, "global_step": 204539, "epoch": 2464} {"train_loss": -24.390052795410156, "global_step": 204540, "epoch": 2464} {"train_loss": -24.33677101135254, "global_step": 204541, "epoch": 2464} {"train_loss": -24.347875595092773, "global_step": 204542, "epoch": 2464} {"train_loss": -24.173521041870117, "global_step": 204543, "epoch": 2464} {"train_loss": -24.22795295715332, "global_step": 204544, "epoch": 2464} {"train_loss": -24.010141372680664, "global_step": 204545, "epoch": 2464} {"train_loss": -24.288314819335938, "global_step": 204546, "epoch": 2464} {"train_loss": -24.445377349853516, "global_step": 204547, "epoch": 2464} {"train_loss": -24.362852096557617, "global_step": 204548, "epoch": 2464} {"train_loss": -24.356117248535156, "global_step": 204549, "epoch": 2464} {"train_loss": -24.303983688354492, "global_step": 204550, "epoch": 2464} {"train_loss": -24.212873458862305, "global_step": 204551, "epoch": 2464} {"train_loss": -24.45684242248535, "global_step": 204552, "epoch": 2464} {"train_loss": -24.748291015625, "global_step": 204553, "epoch": 2464} {"train_loss": -24.25254249572754, "global_step": 204554, "epoch": 2464} {"train_loss": -24.10367202758789, "global_step": 204555, "epoch": 2464} {"train_loss": -24.325267791748047, "global_step": 204556, "epoch": 2464} {"train_loss": -24.14405632019043, "global_step": 204557, "epoch": 2464} {"train_loss": -24.010807037353516, "global_step": 204558, "epoch": 2464} {"train_loss": -24.583303451538086, "global_step": 204559, "epoch": 2464} {"train_loss": -24.398202896118164, "global_step": 204560, "epoch": 2464} {"train_loss": -24.517093658447266, "global_step": 204561, "epoch": 2464} {"train_loss": -24.579116821289062, "global_step": 204562, "epoch": 2464} {"train_loss": -24.25428009033203, "global_step": 204563, "epoch": 2464} {"train_loss": -24.195541381835938, "global_step": 204564, "epoch": 2464} {"train_loss": -24.481901168823242, "global_step": 204565, "epoch": 2464} {"train_loss": -24.51215171813965, "global_step": 204566, "epoch": 2464} {"train_loss": -24.6433048248291, "global_step": 204567, "epoch": 2464} {"train_loss": -24.25494384765625, "global_step": 204568, "epoch": 2464} {"train_loss": -24.27642250061035, "global_step": 204569, "epoch": 2464} {"train_loss": -24.427719116210938, "global_step": 204570, "epoch": 2464} {"train_loss": -24.428382873535156, "global_step": 204571, "epoch": 2464} {"train_loss": -24.56658935546875, "global_step": 204572, "epoch": 2464} {"train_loss": -24.227554321289062, "global_step": 204573, "epoch": 2464} {"train_loss": -24.783700942993164, "global_step": 204574, "epoch": 2464} {"train_loss": -24.208139419555664, "global_step": 204575, "epoch": 2464} {"train_loss": -24.30059051513672, "global_step": 204576, "epoch": 2464} {"train_loss": -24.182769775390625, "global_step": 204577, "epoch": 2464} {"train_loss": -24.215787887573242, "global_step": 204578, "epoch": 2464} {"train_loss": -24.515043258666992, "global_step": 204579, "epoch": 2464} {"train_loss": -23.652868270874023, "global_step": 204580, "epoch": 2464} {"train_loss": -24.529563903808594, "global_step": 204581, "epoch": 2464} {"train_loss": -24.5948486328125, "global_step": 204582, "epoch": 2464} {"train_loss": -24.487573623657227, "global_step": 204583, "epoch": 2464} {"train_loss": -24.798574447631836, "global_step": 204584, "epoch": 2464} {"train_loss": -24.574844360351562, "global_step": 204585, "epoch": 2464} {"train_loss": -24.234554290771484, "global_step": 204586, "epoch": 2464} {"train_loss": -24.295812606811523, "global_step": 204587, "epoch": 2464} {"train_loss": -24.72579002380371, "global_step": 204588, "epoch": 2464} {"train_loss": -24.372066497802734, "global_step": 204589, "epoch": 2464} {"train_loss": -24.331926345825195, "global_step": 204590, "epoch": 2464} {"train_loss": -24.47527503967285, "global_step": 204591, "epoch": 2464} {"train_loss": -24.25824546813965, "global_step": 204592, "epoch": 2464} {"train_loss": -24.417264938354492, "global_step": 204593, "epoch": 2464} {"train_loss": -24.31260081371629, "global_step": 204594, "epoch": 2464, "val_loss": 6572689.0} {"train_loss": -23.663240432739258, "global_step": 204595, "epoch": 2465} {"train_loss": -23.140888214111328, "global_step": 204596, "epoch": 2465} {"train_loss": -23.96687889099121, "global_step": 204597, "epoch": 2465} {"train_loss": -23.68184471130371, "global_step": 204598, "epoch": 2465} {"train_loss": -23.741384506225586, "global_step": 204599, "epoch": 2465} {"train_loss": -23.690732955932617, "global_step": 204600, "epoch": 2465} {"train_loss": -24.006216049194336, "global_step": 204601, "epoch": 2465} {"train_loss": -23.690671920776367, "global_step": 204602, "epoch": 2465} {"train_loss": -24.046762466430664, "global_step": 204603, "epoch": 2465} {"train_loss": -24.110477447509766, "global_step": 204604, "epoch": 2465} {"train_loss": -24.260276794433594, "global_step": 204605, "epoch": 2465} {"train_loss": -24.245098114013672, "global_step": 204606, "epoch": 2465} {"train_loss": -23.86396598815918, "global_step": 204607, "epoch": 2465} {"train_loss": -24.4761962890625, "global_step": 204608, "epoch": 2465} {"train_loss": -23.948965072631836, "global_step": 204609, "epoch": 2465} {"train_loss": -24.043867111206055, "global_step": 204610, "epoch": 2465} {"train_loss": -24.110355377197266, "global_step": 204611, "epoch": 2465} {"train_loss": -23.882984161376953, "global_step": 204612, "epoch": 2465} {"train_loss": -24.463544845581055, "global_step": 204613, "epoch": 2465} {"train_loss": -24.366777420043945, "global_step": 204614, "epoch": 2465} {"train_loss": -24.30820083618164, "global_step": 204615, "epoch": 2465} {"train_loss": -24.399890899658203, "global_step": 204616, "epoch": 2465} {"train_loss": -24.252294540405273, "global_step": 204617, "epoch": 2465} {"train_loss": -24.268836975097656, "global_step": 204618, "epoch": 2465} {"train_loss": -24.291412353515625, "global_step": 204619, "epoch": 2465} {"train_loss": -24.07597541809082, "global_step": 204620, "epoch": 2465} {"train_loss": -24.313247680664062, "global_step": 204621, "epoch": 2465} {"train_loss": -24.373815536499023, "global_step": 204622, "epoch": 2465} {"train_loss": -24.296072006225586, "global_step": 204623, "epoch": 2465} {"train_loss": -24.57832908630371, "global_step": 204624, "epoch": 2465} {"train_loss": -24.523405075073242, "global_step": 204625, "epoch": 2465} {"train_loss": -24.2568416595459, "global_step": 204626, "epoch": 2465} {"train_loss": -24.456880569458008, "global_step": 204627, "epoch": 2465} {"train_loss": -24.378324508666992, "global_step": 204628, "epoch": 2465} {"train_loss": -24.216367721557617, "global_step": 204629, "epoch": 2465} {"train_loss": -24.341445922851562, "global_step": 204630, "epoch": 2465} {"train_loss": -24.001672744750977, "global_step": 204631, "epoch": 2465} {"train_loss": -24.276857376098633, "global_step": 204632, "epoch": 2465} {"train_loss": -24.094623565673828, "global_step": 204633, "epoch": 2465} {"train_loss": -24.239917755126953, "global_step": 204634, "epoch": 2465} {"train_loss": -24.374963760375977, "global_step": 204635, "epoch": 2465} {"train_loss": -24.1448974609375, "global_step": 204636, "epoch": 2465} {"train_loss": -24.367300033569336, "global_step": 204637, "epoch": 2465} {"train_loss": -24.615997314453125, "global_step": 204638, "epoch": 2465} {"train_loss": -24.411630630493164, "global_step": 204639, "epoch": 2465} {"train_loss": -24.635610580444336, "global_step": 204640, "epoch": 2465} {"train_loss": -24.185075759887695, "global_step": 204641, "epoch": 2465} {"train_loss": -24.674840927124023, "global_step": 204642, "epoch": 2465} {"train_loss": -24.51698112487793, "global_step": 204643, "epoch": 2465} {"train_loss": -24.345415115356445, "global_step": 204644, "epoch": 2465} {"train_loss": -24.476642608642578, "global_step": 204645, "epoch": 2465} {"train_loss": -24.460906982421875, "global_step": 204646, "epoch": 2465} {"train_loss": -24.433353424072266, "global_step": 204647, "epoch": 2465} {"train_loss": -24.65825843811035, "global_step": 204648, "epoch": 2465} {"train_loss": -24.499454498291016, "global_step": 204649, "epoch": 2465} {"train_loss": -24.51358985900879, "global_step": 204650, "epoch": 2465} {"train_loss": -24.387523651123047, "global_step": 204651, "epoch": 2465} {"train_loss": -24.449386596679688, "global_step": 204652, "epoch": 2465} {"train_loss": -24.444232940673828, "global_step": 204653, "epoch": 2465} {"train_loss": -24.67133140563965, "global_step": 204654, "epoch": 2465} {"train_loss": -24.199501037597656, "global_step": 204655, "epoch": 2465} {"train_loss": -24.218135833740234, "global_step": 204656, "epoch": 2465} {"train_loss": -24.279874801635742, "global_step": 204657, "epoch": 2465} {"train_loss": -24.303499221801758, "global_step": 204658, "epoch": 2465} {"train_loss": -24.427865982055664, "global_step": 204659, "epoch": 2465} {"train_loss": -24.343229293823242, "global_step": 204660, "epoch": 2465} {"train_loss": -23.64301109313965, "global_step": 204661, "epoch": 2465} {"train_loss": -24.081113815307617, "global_step": 204662, "epoch": 2465} {"train_loss": -23.993858337402344, "global_step": 204663, "epoch": 2465} {"train_loss": -24.05915069580078, "global_step": 204664, "epoch": 2465} {"train_loss": -23.984935760498047, "global_step": 204665, "epoch": 2465} {"train_loss": -24.202621459960938, "global_step": 204666, "epoch": 2465} {"train_loss": -24.516359329223633, "global_step": 204667, "epoch": 2465} {"train_loss": -24.67214012145996, "global_step": 204668, "epoch": 2465} {"train_loss": -24.43243980407715, "global_step": 204669, "epoch": 2465} {"train_loss": -24.333463668823242, "global_step": 204670, "epoch": 2465} {"train_loss": -24.083784103393555, "global_step": 204671, "epoch": 2465} {"train_loss": -24.609601974487305, "global_step": 204672, "epoch": 2465} {"train_loss": -24.500612258911133, "global_step": 204673, "epoch": 2465} {"train_loss": -24.10548210144043, "global_step": 204674, "epoch": 2465} {"train_loss": -24.437515258789062, "global_step": 204675, "epoch": 2465} {"train_loss": -24.538984298706055, "global_step": 204676, "epoch": 2465} {"train_loss": -24.244378377156085, "global_step": 204677, "epoch": 2465, "val_loss": 6635031.0} {"train_loss": -23.661592483520508, "global_step": 204678, "epoch": 2466} {"train_loss": -23.954648971557617, "global_step": 204679, "epoch": 2466} {"train_loss": -23.92030143737793, "global_step": 204680, "epoch": 2466} {"train_loss": -23.71697998046875, "global_step": 204681, "epoch": 2466} {"train_loss": -24.295454025268555, "global_step": 204682, "epoch": 2466} {"train_loss": -23.89927864074707, "global_step": 204683, "epoch": 2466} {"train_loss": -23.8045597076416, "global_step": 204684, "epoch": 2466} {"train_loss": -24.016273498535156, "global_step": 204685, "epoch": 2466} {"train_loss": -24.26889419555664, "global_step": 204686, "epoch": 2466} {"train_loss": -24.096975326538086, "global_step": 204687, "epoch": 2466} {"train_loss": -24.071170806884766, "global_step": 204688, "epoch": 2466} {"train_loss": -24.233144760131836, "global_step": 204689, "epoch": 2466} {"train_loss": -23.684814453125, "global_step": 204690, "epoch": 2466} {"train_loss": -24.331727981567383, "global_step": 204691, "epoch": 2466} {"train_loss": -24.106979370117188, "global_step": 204692, "epoch": 2466} {"train_loss": -24.358627319335938, "global_step": 204693, "epoch": 2466} {"train_loss": -24.236099243164062, "global_step": 204694, "epoch": 2466} {"train_loss": -24.370595932006836, "global_step": 204695, "epoch": 2466} {"train_loss": -23.912281036376953, "global_step": 204696, "epoch": 2466} {"train_loss": -24.32931900024414, "global_step": 204697, "epoch": 2466} {"train_loss": -24.455829620361328, "global_step": 204698, "epoch": 2466} {"train_loss": -24.246089935302734, "global_step": 204699, "epoch": 2466} {"train_loss": -24.095218658447266, "global_step": 204700, "epoch": 2466} {"train_loss": -24.311124801635742, "global_step": 204701, "epoch": 2466} {"train_loss": -24.391677856445312, "global_step": 204702, "epoch": 2466} {"train_loss": -24.282224655151367, "global_step": 204703, "epoch": 2466} {"train_loss": -24.031583786010742, "global_step": 204704, "epoch": 2466} {"train_loss": -24.32288932800293, "global_step": 204705, "epoch": 2466} {"train_loss": -24.324132919311523, "global_step": 204706, "epoch": 2466} {"train_loss": -24.162174224853516, "global_step": 204707, "epoch": 2466} {"train_loss": -24.318979263305664, "global_step": 204708, "epoch": 2466} {"train_loss": -24.25432014465332, "global_step": 204709, "epoch": 2466} {"train_loss": -24.41582489013672, "global_step": 204710, "epoch": 2466} {"train_loss": -24.504318237304688, "global_step": 204711, "epoch": 2466} {"train_loss": -24.65924072265625, "global_step": 204712, "epoch": 2466} {"train_loss": -24.469905853271484, "global_step": 204713, "epoch": 2466} {"train_loss": -24.151798248291016, "global_step": 204714, "epoch": 2466} {"train_loss": -24.479446411132812, "global_step": 204715, "epoch": 2466} {"train_loss": -24.53873062133789, "global_step": 204716, "epoch": 2466} {"train_loss": -24.578256607055664, "global_step": 204717, "epoch": 2466} {"train_loss": -24.174713134765625, "global_step": 204718, "epoch": 2466} {"train_loss": -24.532155990600586, "global_step": 204719, "epoch": 2466} {"train_loss": -24.2894229888916, "global_step": 204720, "epoch": 2466} {"train_loss": -24.639190673828125, "global_step": 204721, "epoch": 2466} {"train_loss": -24.578901290893555, "global_step": 204722, "epoch": 2466} {"train_loss": -24.441131591796875, "global_step": 204723, "epoch": 2466} {"train_loss": -24.367258071899414, "global_step": 204724, "epoch": 2466} {"train_loss": -24.62510871887207, "global_step": 204725, "epoch": 2466} {"train_loss": -24.604204177856445, "global_step": 204726, "epoch": 2466} {"train_loss": -24.09415626525879, "global_step": 204727, "epoch": 2466} {"train_loss": -24.422325134277344, "global_step": 204728, "epoch": 2466} {"train_loss": -24.08294105529785, "global_step": 204729, "epoch": 2466} {"train_loss": -24.579715728759766, "global_step": 204730, "epoch": 2466} {"train_loss": -24.189016342163086, "global_step": 204731, "epoch": 2466} {"train_loss": -24.32069969177246, "global_step": 204732, "epoch": 2466} {"train_loss": -24.61301612854004, "global_step": 204733, "epoch": 2466} {"train_loss": -24.029144287109375, "global_step": 204734, "epoch": 2466} {"train_loss": -24.596006393432617, "global_step": 204735, "epoch": 2466} {"train_loss": -24.545074462890625, "global_step": 204736, "epoch": 2466} {"train_loss": -24.333669662475586, "global_step": 204737, "epoch": 2466} {"train_loss": -24.54107666015625, "global_step": 204738, "epoch": 2466} {"train_loss": -24.443103790283203, "global_step": 204739, "epoch": 2466} {"train_loss": -24.325658798217773, "global_step": 204740, "epoch": 2466} {"train_loss": -24.1401424407959, "global_step": 204741, "epoch": 2466} {"train_loss": -24.369232177734375, "global_step": 204742, "epoch": 2466} {"train_loss": -24.116403579711914, "global_step": 204743, "epoch": 2466} {"train_loss": -24.40894317626953, "global_step": 204744, "epoch": 2466} {"train_loss": -24.722166061401367, "global_step": 204745, "epoch": 2466} {"train_loss": -24.263120651245117, "global_step": 204746, "epoch": 2466} {"train_loss": -24.536346435546875, "global_step": 204747, "epoch": 2466} {"train_loss": -24.22592544555664, "global_step": 204748, "epoch": 2466} {"train_loss": -24.645368576049805, "global_step": 204749, "epoch": 2466} {"train_loss": -24.26447105407715, "global_step": 204750, "epoch": 2466} {"train_loss": -24.38202476501465, "global_step": 204751, "epoch": 2466} {"train_loss": -24.484477996826172, "global_step": 204752, "epoch": 2466} {"train_loss": -24.255895614624023, "global_step": 204753, "epoch": 2466} {"train_loss": -24.674793243408203, "global_step": 204754, "epoch": 2466} {"train_loss": -24.865293502807617, "global_step": 204755, "epoch": 2466} {"train_loss": -24.54593276977539, "global_step": 204756, "epoch": 2466} {"train_loss": -24.612146377563477, "global_step": 204757, "epoch": 2466} {"train_loss": -24.289472579956055, "global_step": 204758, "epoch": 2466} {"train_loss": -24.51355743408203, "global_step": 204759, "epoch": 2466} {"train_loss": -24.315057019153272, "global_step": 204760, "epoch": 2466, "val_loss": 6532906.5} {"train_loss": -24.14809226989746, "global_step": 204761, "epoch": 2467} {"train_loss": -23.4180908203125, "global_step": 204762, "epoch": 2467} {"train_loss": -23.49945640563965, "global_step": 204763, "epoch": 2467} {"train_loss": -23.529436111450195, "global_step": 204764, "epoch": 2467} {"train_loss": -24.119266510009766, "global_step": 204765, "epoch": 2467} {"train_loss": -23.858373641967773, "global_step": 204766, "epoch": 2467} {"train_loss": -23.64458465576172, "global_step": 204767, "epoch": 2467} {"train_loss": -24.27247428894043, "global_step": 204768, "epoch": 2467} {"train_loss": -24.090045928955078, "global_step": 204769, "epoch": 2467} {"train_loss": -24.017789840698242, "global_step": 204770, "epoch": 2467} {"train_loss": -23.97715187072754, "global_step": 204771, "epoch": 2467} {"train_loss": -24.037540435791016, "global_step": 204772, "epoch": 2467} {"train_loss": -24.14992332458496, "global_step": 204773, "epoch": 2467} {"train_loss": -23.934221267700195, "global_step": 204774, "epoch": 2467} {"train_loss": -24.270078659057617, "global_step": 204775, "epoch": 2467} {"train_loss": -23.995908737182617, "global_step": 204776, "epoch": 2467} {"train_loss": -24.007944107055664, "global_step": 204777, "epoch": 2467} {"train_loss": -24.268972396850586, "global_step": 204778, "epoch": 2467} {"train_loss": -23.840137481689453, "global_step": 204779, "epoch": 2467} {"train_loss": -23.983192443847656, "global_step": 204780, "epoch": 2467} {"train_loss": -24.252796173095703, "global_step": 204781, "epoch": 2467} {"train_loss": -24.589828491210938, "global_step": 204782, "epoch": 2467} {"train_loss": -24.26229476928711, "global_step": 204783, "epoch": 2467} {"train_loss": -24.318706512451172, "global_step": 204784, "epoch": 2467} {"train_loss": -24.113489151000977, "global_step": 204785, "epoch": 2467} {"train_loss": -24.23450469970703, "global_step": 204786, "epoch": 2467} {"train_loss": -24.334487915039062, "global_step": 204787, "epoch": 2467} {"train_loss": -24.396989822387695, "global_step": 204788, "epoch": 2467} {"train_loss": -24.589801788330078, "global_step": 204789, "epoch": 2467} {"train_loss": -24.57358741760254, "global_step": 204790, "epoch": 2467} {"train_loss": -24.042539596557617, "global_step": 204791, "epoch": 2467} {"train_loss": -24.40177345275879, "global_step": 204792, "epoch": 2467} {"train_loss": -24.206226348876953, "global_step": 204793, "epoch": 2467} {"train_loss": -24.308584213256836, "global_step": 204794, "epoch": 2467} {"train_loss": -24.696134567260742, "global_step": 204795, "epoch": 2467} {"train_loss": -24.496618270874023, "global_step": 204796, "epoch": 2467} {"train_loss": -24.64786148071289, "global_step": 204797, "epoch": 2467} {"train_loss": -24.585477828979492, "global_step": 204798, "epoch": 2467} {"train_loss": -24.113176345825195, "global_step": 204799, "epoch": 2467} {"train_loss": -24.63636589050293, "global_step": 204800, "epoch": 2467} {"train_loss": -24.577327728271484, "global_step": 204801, "epoch": 2467} {"train_loss": -24.45675277709961, "global_step": 204802, "epoch": 2467} {"train_loss": -23.79531478881836, "global_step": 204803, "epoch": 2467} {"train_loss": -23.893264770507812, "global_step": 204804, "epoch": 2467} {"train_loss": -24.666011810302734, "global_step": 204805, "epoch": 2467} {"train_loss": -24.397146224975586, "global_step": 204806, "epoch": 2467} {"train_loss": -24.449018478393555, "global_step": 204807, "epoch": 2467} {"train_loss": -24.356002807617188, "global_step": 204808, "epoch": 2467} {"train_loss": -24.351484298706055, "global_step": 204809, "epoch": 2467} {"train_loss": -24.309476852416992, "global_step": 204810, "epoch": 2467} {"train_loss": -24.233442306518555, "global_step": 204811, "epoch": 2467} {"train_loss": -24.44965934753418, "global_step": 204812, "epoch": 2467} {"train_loss": -23.98061180114746, "global_step": 204813, "epoch": 2467} {"train_loss": -23.8864803314209, "global_step": 204814, "epoch": 2467} {"train_loss": -23.3876953125, "global_step": 204815, "epoch": 2467} {"train_loss": -22.884632110595703, "global_step": 204816, "epoch": 2467} {"train_loss": -24.113187789916992, "global_step": 204817, "epoch": 2467} {"train_loss": -24.2458553314209, "global_step": 204818, "epoch": 2467} {"train_loss": -23.973508834838867, "global_step": 204819, "epoch": 2467} {"train_loss": -23.6785945892334, "global_step": 204820, "epoch": 2467} {"train_loss": -24.44318199157715, "global_step": 204821, "epoch": 2467} {"train_loss": -24.072383880615234, "global_step": 204822, "epoch": 2467} {"train_loss": -24.349292755126953, "global_step": 204823, "epoch": 2467} {"train_loss": -24.12210464477539, "global_step": 204824, "epoch": 2467} {"train_loss": -24.04138946533203, "global_step": 204825, "epoch": 2467} {"train_loss": -24.253202438354492, "global_step": 204826, "epoch": 2467} {"train_loss": -23.99444007873535, "global_step": 204827, "epoch": 2467} {"train_loss": -23.974063873291016, "global_step": 204828, "epoch": 2467} {"train_loss": -24.45379638671875, "global_step": 204829, "epoch": 2467} {"train_loss": -24.1130428314209, "global_step": 204830, "epoch": 2467} {"train_loss": -24.453350067138672, "global_step": 204831, "epoch": 2467} {"train_loss": -24.226839065551758, "global_step": 204832, "epoch": 2467} {"train_loss": -24.256216049194336, "global_step": 204833, "epoch": 2467} {"train_loss": -23.9542293548584, "global_step": 204834, "epoch": 2467} {"train_loss": -24.33321189880371, "global_step": 204835, "epoch": 2467} {"train_loss": -24.09400749206543, "global_step": 204836, "epoch": 2467} {"train_loss": -24.31488037109375, "global_step": 204837, "epoch": 2467} {"train_loss": -24.214969635009766, "global_step": 204838, "epoch": 2467} {"train_loss": -24.35590171813965, "global_step": 204839, "epoch": 2467} {"train_loss": -24.411542892456055, "global_step": 204840, "epoch": 2467} {"train_loss": -24.458240509033203, "global_step": 204841, "epoch": 2467} {"train_loss": -24.412622451782227, "global_step": 204842, "epoch": 2467} {"train_loss": -24.168445426297474, "global_step": 204843, "epoch": 2467, "val_loss": 6575501.0} {"train_loss": -24.059720993041992, "global_step": 204844, "epoch": 2468} {"train_loss": -24.344823837280273, "global_step": 204845, "epoch": 2468} {"train_loss": -24.288888931274414, "global_step": 204846, "epoch": 2468} {"train_loss": -24.56890296936035, "global_step": 204847, "epoch": 2468} {"train_loss": -24.00710678100586, "global_step": 204848, "epoch": 2468} {"train_loss": -24.3166561126709, "global_step": 204849, "epoch": 2468} {"train_loss": -24.15915298461914, "global_step": 204850, "epoch": 2468} {"train_loss": -24.188762664794922, "global_step": 204851, "epoch": 2468} {"train_loss": -24.060081481933594, "global_step": 204852, "epoch": 2468} {"train_loss": -24.210769653320312, "global_step": 204853, "epoch": 2468} {"train_loss": -24.03687858581543, "global_step": 204854, "epoch": 2468} {"train_loss": -24.67106819152832, "global_step": 204855, "epoch": 2468} {"train_loss": -24.422687530517578, "global_step": 204856, "epoch": 2468} {"train_loss": -24.351247787475586, "global_step": 204857, "epoch": 2468} {"train_loss": -24.431467056274414, "global_step": 204858, "epoch": 2468} {"train_loss": -24.48082733154297, "global_step": 204859, "epoch": 2468} {"train_loss": -24.378564834594727, "global_step": 204860, "epoch": 2468} {"train_loss": -24.40606117248535, "global_step": 204861, "epoch": 2468} {"train_loss": -24.34306526184082, "global_step": 204862, "epoch": 2468} {"train_loss": -24.523113250732422, "global_step": 204863, "epoch": 2468} {"train_loss": -24.871309280395508, "global_step": 204864, "epoch": 2468} {"train_loss": -23.937620162963867, "global_step": 204865, "epoch": 2468} {"train_loss": -24.47980308532715, "global_step": 204866, "epoch": 2468} {"train_loss": -24.66559410095215, "global_step": 204867, "epoch": 2468} {"train_loss": -24.10689353942871, "global_step": 204868, "epoch": 2468} {"train_loss": -24.7325439453125, "global_step": 204869, "epoch": 2468} {"train_loss": -24.29052734375, "global_step": 204870, "epoch": 2468} {"train_loss": -24.705978393554688, "global_step": 204871, "epoch": 2468} {"train_loss": -24.068790435791016, "global_step": 204872, "epoch": 2468} {"train_loss": -24.302892684936523, "global_step": 204873, "epoch": 2468} {"train_loss": -24.25276756286621, "global_step": 204874, "epoch": 2468} {"train_loss": -24.726011276245117, "global_step": 204875, "epoch": 2468} {"train_loss": -24.26865577697754, "global_step": 204876, "epoch": 2468} {"train_loss": -24.46880531311035, "global_step": 204877, "epoch": 2468} {"train_loss": -24.334617614746094, "global_step": 204878, "epoch": 2468} {"train_loss": -24.264734268188477, "global_step": 204879, "epoch": 2468} {"train_loss": -24.926956176757812, "global_step": 204880, "epoch": 2468} {"train_loss": -24.665903091430664, "global_step": 204881, "epoch": 2468} {"train_loss": -24.388723373413086, "global_step": 204882, "epoch": 2468} {"train_loss": -24.592384338378906, "global_step": 204883, "epoch": 2468} {"train_loss": -24.194793701171875, "global_step": 204884, "epoch": 2468} {"train_loss": -24.005020141601562, "global_step": 204885, "epoch": 2468} {"train_loss": -24.336515426635742, "global_step": 204886, "epoch": 2468} {"train_loss": -24.62681007385254, "global_step": 204887, "epoch": 2468} {"train_loss": -24.3576717376709, "global_step": 204888, "epoch": 2468} {"train_loss": -24.284469604492188, "global_step": 204889, "epoch": 2468} {"train_loss": -24.465158462524414, "global_step": 204890, "epoch": 2468} {"train_loss": -24.38384246826172, "global_step": 204891, "epoch": 2468} {"train_loss": -24.449262619018555, "global_step": 204892, "epoch": 2468} {"train_loss": -24.611616134643555, "global_step": 204893, "epoch": 2468} {"train_loss": -24.235807418823242, "global_step": 204894, "epoch": 2468} {"train_loss": -24.262800216674805, "global_step": 204895, "epoch": 2468} {"train_loss": -24.34674835205078, "global_step": 204896, "epoch": 2468} {"train_loss": -24.34212303161621, "global_step": 204897, "epoch": 2468} {"train_loss": -24.419462203979492, "global_step": 204898, "epoch": 2468} {"train_loss": -23.773094177246094, "global_step": 204899, "epoch": 2468} {"train_loss": -24.382471084594727, "global_step": 204900, "epoch": 2468} {"train_loss": -24.2392578125, "global_step": 204901, "epoch": 2468} {"train_loss": -23.946247100830078, "global_step": 204902, "epoch": 2468} {"train_loss": -24.212549209594727, "global_step": 204903, "epoch": 2468} {"train_loss": -24.299299240112305, "global_step": 204904, "epoch": 2468} {"train_loss": -24.29192543029785, "global_step": 204905, "epoch": 2468} {"train_loss": -24.373762130737305, "global_step": 204906, "epoch": 2468} {"train_loss": -24.500259399414062, "global_step": 204907, "epoch": 2468} {"train_loss": -24.41019630432129, "global_step": 204908, "epoch": 2468} {"train_loss": -24.48593521118164, "global_step": 204909, "epoch": 2468} {"train_loss": -24.336477279663086, "global_step": 204910, "epoch": 2468} {"train_loss": -24.317609786987305, "global_step": 204911, "epoch": 2468} {"train_loss": -24.569089889526367, "global_step": 204912, "epoch": 2468} {"train_loss": -24.67099380493164, "global_step": 204913, "epoch": 2468} {"train_loss": -24.24028968811035, "global_step": 204914, "epoch": 2468} {"train_loss": -24.384592056274414, "global_step": 204915, "epoch": 2468} {"train_loss": -24.137250900268555, "global_step": 204916, "epoch": 2468} {"train_loss": -24.291059494018555, "global_step": 204917, "epoch": 2468} {"train_loss": -24.69240379333496, "global_step": 204918, "epoch": 2468} {"train_loss": -24.475688934326172, "global_step": 204919, "epoch": 2468} {"train_loss": -24.516849517822266, "global_step": 204920, "epoch": 2468} {"train_loss": -24.095191955566406, "global_step": 204921, "epoch": 2468} {"train_loss": -24.37189292907715, "global_step": 204922, "epoch": 2468} {"train_loss": -24.59514617919922, "global_step": 204923, "epoch": 2468} {"train_loss": -24.323965072631836, "global_step": 204924, "epoch": 2468} {"train_loss": -24.330625534057617, "global_step": 204925, "epoch": 2468} {"train_loss": -24.373753076576325, "global_step": 204926, "epoch": 2468, "val_loss": 6699012.0} {"train_loss": -23.925973892211914, "global_step": 204927, "epoch": 2469} {"train_loss": -22.836620330810547, "global_step": 204928, "epoch": 2469} {"train_loss": -22.2082462310791, "global_step": 204929, "epoch": 2469} {"train_loss": -23.62735366821289, "global_step": 204930, "epoch": 2469} {"train_loss": -23.314434051513672, "global_step": 204931, "epoch": 2469} {"train_loss": -22.85284996032715, "global_step": 204932, "epoch": 2469} {"train_loss": -23.4209041595459, "global_step": 204933, "epoch": 2469} {"train_loss": -23.440961837768555, "global_step": 204934, "epoch": 2469} {"train_loss": -23.793798446655273, "global_step": 204935, "epoch": 2469} {"train_loss": -23.80647087097168, "global_step": 204936, "epoch": 2469} {"train_loss": -23.429414749145508, "global_step": 204937, "epoch": 2469} {"train_loss": -23.63987159729004, "global_step": 204938, "epoch": 2469} {"train_loss": -23.722946166992188, "global_step": 204939, "epoch": 2469} {"train_loss": -23.93963623046875, "global_step": 204940, "epoch": 2469} {"train_loss": -23.311450958251953, "global_step": 204941, "epoch": 2469} {"train_loss": -23.94178581237793, "global_step": 204942, "epoch": 2469} {"train_loss": -23.95662498474121, "global_step": 204943, "epoch": 2469} {"train_loss": -23.772092819213867, "global_step": 204944, "epoch": 2469} {"train_loss": -23.658199310302734, "global_step": 204945, "epoch": 2469} {"train_loss": -23.656675338745117, "global_step": 204946, "epoch": 2469} {"train_loss": -23.7122802734375, "global_step": 204947, "epoch": 2469} {"train_loss": -24.1838436126709, "global_step": 204948, "epoch": 2469} {"train_loss": -23.836088180541992, "global_step": 204949, "epoch": 2469} {"train_loss": -23.710620880126953, "global_step": 204950, "epoch": 2469} {"train_loss": -23.87150001525879, "global_step": 204951, "epoch": 2469} {"train_loss": -24.06743621826172, "global_step": 204952, "epoch": 2469} {"train_loss": -23.849409103393555, "global_step": 204953, "epoch": 2469} {"train_loss": -24.140478134155273, "global_step": 204954, "epoch": 2469} {"train_loss": -24.19479751586914, "global_step": 204955, "epoch": 2469} {"train_loss": -24.328248977661133, "global_step": 204956, "epoch": 2469} {"train_loss": -24.564172744750977, "global_step": 204957, "epoch": 2469} {"train_loss": -24.169593811035156, "global_step": 204958, "epoch": 2469} {"train_loss": -24.250516891479492, "global_step": 204959, "epoch": 2469} {"train_loss": -23.951642990112305, "global_step": 204960, "epoch": 2469} {"train_loss": -23.86984634399414, "global_step": 204961, "epoch": 2469} {"train_loss": -24.425430297851562, "global_step": 204962, "epoch": 2469} {"train_loss": -24.256006240844727, "global_step": 204963, "epoch": 2469} {"train_loss": -24.24048614501953, "global_step": 204964, "epoch": 2469} {"train_loss": -24.485830307006836, "global_step": 204965, "epoch": 2469} {"train_loss": -24.198026657104492, "global_step": 204966, "epoch": 2469} {"train_loss": -24.006874084472656, "global_step": 204967, "epoch": 2469} {"train_loss": -23.948596954345703, "global_step": 204968, "epoch": 2469} {"train_loss": -24.37323570251465, "global_step": 204969, "epoch": 2469} {"train_loss": -24.071056365966797, "global_step": 204970, "epoch": 2469} {"train_loss": -24.260326385498047, "global_step": 204971, "epoch": 2469} {"train_loss": -24.497411727905273, "global_step": 204972, "epoch": 2469} {"train_loss": -23.967979431152344, "global_step": 204973, "epoch": 2469} {"train_loss": -24.230018615722656, "global_step": 204974, "epoch": 2469} {"train_loss": -24.946950912475586, "global_step": 204975, "epoch": 2469} {"train_loss": -24.610509872436523, "global_step": 204976, "epoch": 2469} {"train_loss": -24.35092544555664, "global_step": 204977, "epoch": 2469} {"train_loss": -24.492965698242188, "global_step": 204978, "epoch": 2469} {"train_loss": -24.578954696655273, "global_step": 204979, "epoch": 2469} {"train_loss": -24.45139503479004, "global_step": 204980, "epoch": 2469} {"train_loss": -24.40900230407715, "global_step": 204981, "epoch": 2469} {"train_loss": -24.75955581665039, "global_step": 204982, "epoch": 2469} {"train_loss": -24.377683639526367, "global_step": 204983, "epoch": 2469} {"train_loss": -24.567590713500977, "global_step": 204984, "epoch": 2469} {"train_loss": -24.67690086364746, "global_step": 204985, "epoch": 2469} {"train_loss": -24.436704635620117, "global_step": 204986, "epoch": 2469} {"train_loss": -24.298978805541992, "global_step": 204987, "epoch": 2469} {"train_loss": -24.352407455444336, "global_step": 204988, "epoch": 2469} {"train_loss": -24.253124237060547, "global_step": 204989, "epoch": 2469} {"train_loss": -24.609472274780273, "global_step": 204990, "epoch": 2469} {"train_loss": -24.347143173217773, "global_step": 204991, "epoch": 2469} {"train_loss": -24.301071166992188, "global_step": 204992, "epoch": 2469} {"train_loss": -23.723342895507812, "global_step": 204993, "epoch": 2469} {"train_loss": -24.109235763549805, "global_step": 204994, "epoch": 2469} {"train_loss": -24.332706451416016, "global_step": 204995, "epoch": 2469} {"train_loss": -24.113197326660156, "global_step": 204996, "epoch": 2469} {"train_loss": -24.185791015625, "global_step": 204997, "epoch": 2469} {"train_loss": -24.490880966186523, "global_step": 204998, "epoch": 2469} {"train_loss": -24.487396240234375, "global_step": 204999, "epoch": 2469} {"train_loss": -24.31324577331543, "global_step": 205000, "epoch": 2469} {"train_loss": -23.967206954956055, "global_step": 205001, "epoch": 2469} {"train_loss": -24.20392417907715, "global_step": 205002, "epoch": 2469} {"train_loss": -24.496366500854492, "global_step": 205003, "epoch": 2469} {"train_loss": -24.176755905151367, "global_step": 205004, "epoch": 2469} {"train_loss": -24.53985595703125, "global_step": 205005, "epoch": 2469} {"train_loss": -24.12717628479004, "global_step": 205006, "epoch": 2469} {"train_loss": -24.39204216003418, "global_step": 205007, "epoch": 2469} {"train_loss": -24.299123764038086, "global_step": 205008, "epoch": 2469} {"train_loss": -24.082413041448017, "global_step": 205009, "epoch": 2469, "val_loss": 6638237.0} {"train_loss": -23.78559684753418, "global_step": 205010, "epoch": 2470} {"train_loss": -23.106679916381836, "global_step": 205011, "epoch": 2470} {"train_loss": -23.654333114624023, "global_step": 205012, "epoch": 2470} {"train_loss": -23.64814567565918, "global_step": 205013, "epoch": 2470} {"train_loss": -23.743261337280273, "global_step": 205014, "epoch": 2470} {"train_loss": -23.70396614074707, "global_step": 205015, "epoch": 2470} {"train_loss": -23.568681716918945, "global_step": 205016, "epoch": 2470} {"train_loss": -24.253173828125, "global_step": 205017, "epoch": 2470} {"train_loss": -24.368824005126953, "global_step": 205018, "epoch": 2470} {"train_loss": -23.859830856323242, "global_step": 205019, "epoch": 2470} {"train_loss": -23.80852508544922, "global_step": 205020, "epoch": 2470} {"train_loss": -23.93898582458496, "global_step": 205021, "epoch": 2470} {"train_loss": -24.125900268554688, "global_step": 205022, "epoch": 2470} {"train_loss": -24.267230987548828, "global_step": 205023, "epoch": 2470} {"train_loss": -23.98025894165039, "global_step": 205024, "epoch": 2470} {"train_loss": -24.27973175048828, "global_step": 205025, "epoch": 2470} {"train_loss": -24.476709365844727, "global_step": 205026, "epoch": 2470} {"train_loss": -24.096874237060547, "global_step": 205027, "epoch": 2470} {"train_loss": -24.198104858398438, "global_step": 205028, "epoch": 2470} {"train_loss": -24.322988510131836, "global_step": 205029, "epoch": 2470} {"train_loss": -24.167098999023438, "global_step": 205030, "epoch": 2470} {"train_loss": -24.22609519958496, "global_step": 205031, "epoch": 2470} {"train_loss": -24.541250228881836, "global_step": 205032, "epoch": 2470} {"train_loss": -24.5417537689209, "global_step": 205033, "epoch": 2470} {"train_loss": -24.30112648010254, "global_step": 205034, "epoch": 2470} {"train_loss": -24.458412170410156, "global_step": 205035, "epoch": 2470} {"train_loss": -24.53962516784668, "global_step": 205036, "epoch": 2470} {"train_loss": -24.353206634521484, "global_step": 205037, "epoch": 2470} {"train_loss": -24.40138816833496, "global_step": 205038, "epoch": 2470} {"train_loss": -24.037067413330078, "global_step": 205039, "epoch": 2470} {"train_loss": -24.612274169921875, "global_step": 205040, "epoch": 2470} {"train_loss": -24.051198959350586, "global_step": 205041, "epoch": 2470} {"train_loss": -24.411666870117188, "global_step": 205042, "epoch": 2470} {"train_loss": -24.23798942565918, "global_step": 205043, "epoch": 2470} {"train_loss": -24.340030670166016, "global_step": 205044, "epoch": 2470} {"train_loss": -24.2280216217041, "global_step": 205045, "epoch": 2470} {"train_loss": -24.197538375854492, "global_step": 205046, "epoch": 2470} {"train_loss": -24.19771385192871, "global_step": 205047, "epoch": 2470} {"train_loss": -24.37461280822754, "global_step": 205048, "epoch": 2470} {"train_loss": -24.017784118652344, "global_step": 205049, "epoch": 2470} {"train_loss": -24.926471710205078, "global_step": 205050, "epoch": 2470} {"train_loss": -24.388822555541992, "global_step": 205051, "epoch": 2470} {"train_loss": -24.255008697509766, "global_step": 205052, "epoch": 2470} {"train_loss": -24.124113082885742, "global_step": 205053, "epoch": 2470} {"train_loss": -24.54811668395996, "global_step": 205054, "epoch": 2470} {"train_loss": -24.40240478515625, "global_step": 205055, "epoch": 2470} {"train_loss": -24.066564559936523, "global_step": 205056, "epoch": 2470} {"train_loss": -24.437084197998047, "global_step": 205057, "epoch": 2470} {"train_loss": -24.218347549438477, "global_step": 205058, "epoch": 2470} {"train_loss": -24.753734588623047, "global_step": 205059, "epoch": 2470} {"train_loss": -24.094707489013672, "global_step": 205060, "epoch": 2470} {"train_loss": -23.73427391052246, "global_step": 205061, "epoch": 2470} {"train_loss": -24.09114646911621, "global_step": 205062, "epoch": 2470} {"train_loss": -24.314672470092773, "global_step": 205063, "epoch": 2470} {"train_loss": -24.440929412841797, "global_step": 205064, "epoch": 2470} {"train_loss": -24.05804443359375, "global_step": 205065, "epoch": 2470} {"train_loss": -23.763124465942383, "global_step": 205066, "epoch": 2470} {"train_loss": -24.192920684814453, "global_step": 205067, "epoch": 2470} {"train_loss": -24.417545318603516, "global_step": 205068, "epoch": 2470} {"train_loss": -24.177703857421875, "global_step": 205069, "epoch": 2470} {"train_loss": -24.54148292541504, "global_step": 205070, "epoch": 2470} {"train_loss": -24.674100875854492, "global_step": 205071, "epoch": 2470} {"train_loss": -23.952762603759766, "global_step": 205072, "epoch": 2470} {"train_loss": -24.266849517822266, "global_step": 205073, "epoch": 2470} {"train_loss": -24.681110382080078, "global_step": 205074, "epoch": 2470} {"train_loss": -24.619672775268555, "global_step": 205075, "epoch": 2470} {"train_loss": -24.478673934936523, "global_step": 205076, "epoch": 2470} {"train_loss": -24.582067489624023, "global_step": 205077, "epoch": 2470} {"train_loss": -24.09967613220215, "global_step": 205078, "epoch": 2470} {"train_loss": -24.58431053161621, "global_step": 205079, "epoch": 2470} {"train_loss": -24.039264678955078, "global_step": 205080, "epoch": 2470} {"train_loss": -24.33699607849121, "global_step": 205081, "epoch": 2470} {"train_loss": -24.20973014831543, "global_step": 205082, "epoch": 2470} {"train_loss": -24.481199264526367, "global_step": 205083, "epoch": 2470} {"train_loss": -24.55459976196289, "global_step": 205084, "epoch": 2470} {"train_loss": -24.531362533569336, "global_step": 205085, "epoch": 2470} {"train_loss": -24.656097412109375, "global_step": 205086, "epoch": 2470} {"train_loss": -24.323827743530273, "global_step": 205087, "epoch": 2470} {"train_loss": -24.016855239868164, "global_step": 205088, "epoch": 2470} {"train_loss": -24.725406646728516, "global_step": 205089, "epoch": 2470} {"train_loss": -24.114118576049805, "global_step": 205090, "epoch": 2470} {"train_loss": -24.396883010864258, "global_step": 205091, "epoch": 2470} {"train_loss": -24.23737530535962, "global_step": 205092, "epoch": 2470, "val_loss": 6600461.0} {"train_loss": -23.484006881713867, "global_step": 205093, "epoch": 2471} {"train_loss": -23.625526428222656, "global_step": 205094, "epoch": 2471} {"train_loss": -24.064407348632812, "global_step": 205095, "epoch": 2471} {"train_loss": -23.769695281982422, "global_step": 205096, "epoch": 2471} {"train_loss": -24.289024353027344, "global_step": 205097, "epoch": 2471} {"train_loss": -24.1308650970459, "global_step": 205098, "epoch": 2471} {"train_loss": -24.666746139526367, "global_step": 205099, "epoch": 2471} {"train_loss": -23.90376853942871, "global_step": 205100, "epoch": 2471} {"train_loss": -23.991472244262695, "global_step": 205101, "epoch": 2471} {"train_loss": -24.402448654174805, "global_step": 205102, "epoch": 2471} {"train_loss": -23.97493553161621, "global_step": 205103, "epoch": 2471} {"train_loss": -24.204620361328125, "global_step": 205104, "epoch": 2471} {"train_loss": -24.352447509765625, "global_step": 205105, "epoch": 2471} {"train_loss": -24.26186752319336, "global_step": 205106, "epoch": 2471} {"train_loss": -23.83111572265625, "global_step": 205107, "epoch": 2471} {"train_loss": -24.557249069213867, "global_step": 205108, "epoch": 2471} {"train_loss": -24.323848724365234, "global_step": 205109, "epoch": 2471} {"train_loss": -24.268247604370117, "global_step": 205110, "epoch": 2471} {"train_loss": -24.243885040283203, "global_step": 205111, "epoch": 2471} {"train_loss": -24.467336654663086, "global_step": 205112, "epoch": 2471} {"train_loss": -24.013357162475586, "global_step": 205113, "epoch": 2471} {"train_loss": -24.37369155883789, "global_step": 205114, "epoch": 2471} {"train_loss": -24.2001895904541, "global_step": 205115, "epoch": 2471} {"train_loss": -24.274938583374023, "global_step": 205116, "epoch": 2471} {"train_loss": -24.02351951599121, "global_step": 205117, "epoch": 2471} {"train_loss": -24.142677307128906, "global_step": 205118, "epoch": 2471} {"train_loss": -24.49458122253418, "global_step": 205119, "epoch": 2471} {"train_loss": -24.300363540649414, "global_step": 205120, "epoch": 2471} {"train_loss": -24.18509864807129, "global_step": 205121, "epoch": 2471} {"train_loss": -24.687368392944336, "global_step": 205122, "epoch": 2471} {"train_loss": -24.52714729309082, "global_step": 205123, "epoch": 2471} {"train_loss": -24.588666915893555, "global_step": 205124, "epoch": 2471} {"train_loss": -24.38347816467285, "global_step": 205125, "epoch": 2471} {"train_loss": -24.489805221557617, "global_step": 205126, "epoch": 2471} {"train_loss": -24.33698081970215, "global_step": 205127, "epoch": 2471} {"train_loss": -24.602834701538086, "global_step": 205128, "epoch": 2471} {"train_loss": -24.50594711303711, "global_step": 205129, "epoch": 2471} {"train_loss": -24.301374435424805, "global_step": 205130, "epoch": 2471} {"train_loss": -24.40639305114746, "global_step": 205131, "epoch": 2471} {"train_loss": -24.493139266967773, "global_step": 205132, "epoch": 2471} {"train_loss": -24.27495574951172, "global_step": 205133, "epoch": 2471} {"train_loss": -23.987224578857422, "global_step": 205134, "epoch": 2471} {"train_loss": -24.054813385009766, "global_step": 205135, "epoch": 2471} {"train_loss": -24.114315032958984, "global_step": 205136, "epoch": 2471} {"train_loss": -24.250864028930664, "global_step": 205137, "epoch": 2471} {"train_loss": -24.564102172851562, "global_step": 205138, "epoch": 2471} {"train_loss": -24.302534103393555, "global_step": 205139, "epoch": 2471} {"train_loss": -24.324058532714844, "global_step": 205140, "epoch": 2471} {"train_loss": -24.244604110717773, "global_step": 205141, "epoch": 2471} {"train_loss": -24.411203384399414, "global_step": 205142, "epoch": 2471} {"train_loss": -24.05926513671875, "global_step": 205143, "epoch": 2471} {"train_loss": -24.798765182495117, "global_step": 205144, "epoch": 2471} {"train_loss": -23.89084243774414, "global_step": 205145, "epoch": 2471} {"train_loss": -24.451557159423828, "global_step": 205146, "epoch": 2471} {"train_loss": -23.970428466796875, "global_step": 205147, "epoch": 2471} {"train_loss": -23.992080688476562, "global_step": 205148, "epoch": 2471} {"train_loss": -24.181657791137695, "global_step": 205149, "epoch": 2471} {"train_loss": -24.203550338745117, "global_step": 205150, "epoch": 2471} {"train_loss": -24.278718948364258, "global_step": 205151, "epoch": 2471} {"train_loss": -24.070941925048828, "global_step": 205152, "epoch": 2471} {"train_loss": -24.223737716674805, "global_step": 205153, "epoch": 2471} {"train_loss": -24.22567367553711, "global_step": 205154, "epoch": 2471} {"train_loss": -24.10480308532715, "global_step": 205155, "epoch": 2471} {"train_loss": -24.407482147216797, "global_step": 205156, "epoch": 2471} {"train_loss": -24.17462730407715, "global_step": 205157, "epoch": 2471} {"train_loss": -23.999801635742188, "global_step": 205158, "epoch": 2471} {"train_loss": -24.19878387451172, "global_step": 205159, "epoch": 2471} {"train_loss": -24.549903869628906, "global_step": 205160, "epoch": 2471} {"train_loss": -24.42630958557129, "global_step": 205161, "epoch": 2471} {"train_loss": -24.065641403198242, "global_step": 205162, "epoch": 2471} {"train_loss": -24.174421310424805, "global_step": 205163, "epoch": 2471} {"train_loss": -23.945880889892578, "global_step": 205164, "epoch": 2471} {"train_loss": -24.010190963745117, "global_step": 205165, "epoch": 2471} {"train_loss": -24.14165687561035, "global_step": 205166, "epoch": 2471} {"train_loss": -24.1005916595459, "global_step": 205167, "epoch": 2471} {"train_loss": -24.727115631103516, "global_step": 205168, "epoch": 2471} {"train_loss": -24.191783905029297, "global_step": 205169, "epoch": 2471} {"train_loss": -24.292203903198242, "global_step": 205170, "epoch": 2471} {"train_loss": -24.435989379882812, "global_step": 205171, "epoch": 2471} {"train_loss": -24.242372512817383, "global_step": 205172, "epoch": 2471} {"train_loss": -24.36081886291504, "global_step": 205173, "epoch": 2471} {"train_loss": -24.434904098510742, "global_step": 205174, "epoch": 2471} {"train_loss": -24.26105492373547, "global_step": 205175, "epoch": 2471, "val_loss": 6594146.5} {"train_loss": -23.739410400390625, "global_step": 205176, "epoch": 2472} {"train_loss": -23.96942138671875, "global_step": 205177, "epoch": 2472} {"train_loss": -24.24794578552246, "global_step": 205178, "epoch": 2472} {"train_loss": -23.6671142578125, "global_step": 205179, "epoch": 2472} {"train_loss": -23.81207275390625, "global_step": 205180, "epoch": 2472} {"train_loss": -23.851455688476562, "global_step": 205181, "epoch": 2472} {"train_loss": -24.14302635192871, "global_step": 205182, "epoch": 2472} {"train_loss": -24.009109497070312, "global_step": 205183, "epoch": 2472} {"train_loss": -24.2800350189209, "global_step": 205184, "epoch": 2472} {"train_loss": -24.191940307617188, "global_step": 205185, "epoch": 2472} {"train_loss": -24.220510482788086, "global_step": 205186, "epoch": 2472} {"train_loss": -24.205102920532227, "global_step": 205187, "epoch": 2472} {"train_loss": -23.977272033691406, "global_step": 205188, "epoch": 2472} {"train_loss": -24.24043846130371, "global_step": 205189, "epoch": 2472} {"train_loss": -23.98067283630371, "global_step": 205190, "epoch": 2472} {"train_loss": -23.862350463867188, "global_step": 205191, "epoch": 2472} {"train_loss": -24.047988891601562, "global_step": 205192, "epoch": 2472} {"train_loss": -24.060413360595703, "global_step": 205193, "epoch": 2472} {"train_loss": -24.507553100585938, "global_step": 205194, "epoch": 2472} {"train_loss": -24.53097915649414, "global_step": 205195, "epoch": 2472} {"train_loss": -24.07135581970215, "global_step": 205196, "epoch": 2472} {"train_loss": -24.149784088134766, "global_step": 205197, "epoch": 2472} {"train_loss": -24.49201774597168, "global_step": 205198, "epoch": 2472} {"train_loss": -24.554960250854492, "global_step": 205199, "epoch": 2472} {"train_loss": -24.52054214477539, "global_step": 205200, "epoch": 2472} {"train_loss": -24.269577026367188, "global_step": 205201, "epoch": 2472} {"train_loss": -24.559284210205078, "global_step": 205202, "epoch": 2472} {"train_loss": -24.2703914642334, "global_step": 205203, "epoch": 2472} {"train_loss": -24.530128479003906, "global_step": 205204, "epoch": 2472} {"train_loss": -24.328922271728516, "global_step": 205205, "epoch": 2472} {"train_loss": -24.694000244140625, "global_step": 205206, "epoch": 2472} {"train_loss": -24.320951461791992, "global_step": 205207, "epoch": 2472} {"train_loss": -24.43929100036621, "global_step": 205208, "epoch": 2472} {"train_loss": -24.366281509399414, "global_step": 205209, "epoch": 2472} {"train_loss": -23.9917049407959, "global_step": 205210, "epoch": 2472} {"train_loss": -24.194141387939453, "global_step": 205211, "epoch": 2472} {"train_loss": -24.44969940185547, "global_step": 205212, "epoch": 2472} {"train_loss": -24.386180877685547, "global_step": 205213, "epoch": 2472} {"train_loss": -24.293155670166016, "global_step": 205214, "epoch": 2472} {"train_loss": -24.299442291259766, "global_step": 205215, "epoch": 2472} {"train_loss": -24.284284591674805, "global_step": 205216, "epoch": 2472} {"train_loss": -24.25895118713379, "global_step": 205217, "epoch": 2472} {"train_loss": -24.353641510009766, "global_step": 205218, "epoch": 2472} {"train_loss": -24.589580535888672, "global_step": 205219, "epoch": 2472} {"train_loss": -24.421457290649414, "global_step": 205220, "epoch": 2472} {"train_loss": -24.514728546142578, "global_step": 205221, "epoch": 2472} {"train_loss": -23.936643600463867, "global_step": 205222, "epoch": 2472} {"train_loss": -24.705808639526367, "global_step": 205223, "epoch": 2472} {"train_loss": -24.148096084594727, "global_step": 205224, "epoch": 2472} {"train_loss": -24.120824813842773, "global_step": 205225, "epoch": 2472} {"train_loss": -24.28549575805664, "global_step": 205226, "epoch": 2472} {"train_loss": -23.92724609375, "global_step": 205227, "epoch": 2472} {"train_loss": -24.305660247802734, "global_step": 205228, "epoch": 2472} {"train_loss": -24.23736000061035, "global_step": 205229, "epoch": 2472} {"train_loss": -24.61043930053711, "global_step": 205230, "epoch": 2472} {"train_loss": -24.457653045654297, "global_step": 205231, "epoch": 2472} {"train_loss": -24.320425033569336, "global_step": 205232, "epoch": 2472} {"train_loss": -24.333663940429688, "global_step": 205233, "epoch": 2472} {"train_loss": -24.69593620300293, "global_step": 205234, "epoch": 2472} {"train_loss": -23.856637954711914, "global_step": 205235, "epoch": 2472} {"train_loss": -24.35163688659668, "global_step": 205236, "epoch": 2472} {"train_loss": -24.128942489624023, "global_step": 205237, "epoch": 2472} {"train_loss": -24.259735107421875, "global_step": 205238, "epoch": 2472} {"train_loss": -24.374561309814453, "global_step": 205239, "epoch": 2472} {"train_loss": -24.49679946899414, "global_step": 205240, "epoch": 2472} {"train_loss": -24.523969650268555, "global_step": 205241, "epoch": 2472} {"train_loss": -24.375635147094727, "global_step": 205242, "epoch": 2472} {"train_loss": -24.252483367919922, "global_step": 205243, "epoch": 2472} {"train_loss": -24.2797908782959, "global_step": 205244, "epoch": 2472} {"train_loss": -24.414710998535156, "global_step": 205245, "epoch": 2472} {"train_loss": -24.315826416015625, "global_step": 205246, "epoch": 2472} {"train_loss": -24.418943405151367, "global_step": 205247, "epoch": 2472} {"train_loss": -24.509109497070312, "global_step": 205248, "epoch": 2472} {"train_loss": -24.438077926635742, "global_step": 205249, "epoch": 2472} {"train_loss": -24.760568618774414, "global_step": 205250, "epoch": 2472} {"train_loss": -24.403688430786133, "global_step": 205251, "epoch": 2472} {"train_loss": -24.63912010192871, "global_step": 205252, "epoch": 2472} {"train_loss": -24.550678253173828, "global_step": 205253, "epoch": 2472} {"train_loss": -24.408796310424805, "global_step": 205254, "epoch": 2472} {"train_loss": -24.368871688842773, "global_step": 205255, "epoch": 2472} {"train_loss": -24.337787628173828, "global_step": 205256, "epoch": 2472} {"train_loss": -24.486597061157227, "global_step": 205257, "epoch": 2472} {"train_loss": -24.2887014366058, "global_step": 205258, "epoch": 2472, "val_loss": 6545349.0} {"train_loss": -24.275375366210938, "global_step": 205259, "epoch": 2473} {"train_loss": -24.025144577026367, "global_step": 205260, "epoch": 2473} {"train_loss": -24.205596923828125, "global_step": 205261, "epoch": 2473} {"train_loss": -24.244810104370117, "global_step": 205262, "epoch": 2473} {"train_loss": -24.220638275146484, "global_step": 205263, "epoch": 2473} {"train_loss": -24.111337661743164, "global_step": 205264, "epoch": 2473} {"train_loss": -24.250782012939453, "global_step": 205265, "epoch": 2473} {"train_loss": -24.36215591430664, "global_step": 205266, "epoch": 2473} {"train_loss": -23.96782875061035, "global_step": 205267, "epoch": 2473} {"train_loss": -24.06159782409668, "global_step": 205268, "epoch": 2473} {"train_loss": -24.227651596069336, "global_step": 205269, "epoch": 2473} {"train_loss": -24.260618209838867, "global_step": 205270, "epoch": 2473} {"train_loss": -23.834714889526367, "global_step": 205271, "epoch": 2473} {"train_loss": -24.403804779052734, "global_step": 205272, "epoch": 2473} {"train_loss": -24.02440071105957, "global_step": 205273, "epoch": 2473} {"train_loss": -24.312429428100586, "global_step": 205274, "epoch": 2473} {"train_loss": -24.17511558532715, "global_step": 205275, "epoch": 2473} {"train_loss": -24.025671005249023, "global_step": 205276, "epoch": 2473} {"train_loss": -23.736248016357422, "global_step": 205277, "epoch": 2473} {"train_loss": -24.64716148376465, "global_step": 205278, "epoch": 2473} {"train_loss": -24.371444702148438, "global_step": 205279, "epoch": 2473} {"train_loss": -24.53509521484375, "global_step": 205280, "epoch": 2473} {"train_loss": -24.364944458007812, "global_step": 205281, "epoch": 2473} {"train_loss": -24.501150131225586, "global_step": 205282, "epoch": 2473} {"train_loss": -24.529260635375977, "global_step": 205283, "epoch": 2473} {"train_loss": -24.185861587524414, "global_step": 205284, "epoch": 2473} {"train_loss": -23.989749908447266, "global_step": 205285, "epoch": 2473} {"train_loss": -24.47153091430664, "global_step": 205286, "epoch": 2473} {"train_loss": -24.3492488861084, "global_step": 205287, "epoch": 2473} {"train_loss": -24.254011154174805, "global_step": 205288, "epoch": 2473} {"train_loss": -24.23225975036621, "global_step": 205289, "epoch": 2473} {"train_loss": -24.573932647705078, "global_step": 205290, "epoch": 2473} {"train_loss": -24.518789291381836, "global_step": 205291, "epoch": 2473} {"train_loss": -24.905609130859375, "global_step": 205292, "epoch": 2473} {"train_loss": -24.20907974243164, "global_step": 205293, "epoch": 2473} {"train_loss": -24.368303298950195, "global_step": 205294, "epoch": 2473} {"train_loss": -24.88150978088379, "global_step": 205295, "epoch": 2473} {"train_loss": -24.424604415893555, "global_step": 205296, "epoch": 2473} {"train_loss": -24.169286727905273, "global_step": 205297, "epoch": 2473} {"train_loss": -24.3306884765625, "global_step": 205298, "epoch": 2473} {"train_loss": -24.284696578979492, "global_step": 205299, "epoch": 2473} {"train_loss": -24.63570213317871, "global_step": 205300, "epoch": 2473} {"train_loss": -24.572874069213867, "global_step": 205301, "epoch": 2473} {"train_loss": -24.47403907775879, "global_step": 205302, "epoch": 2473} {"train_loss": -24.119976043701172, "global_step": 205303, "epoch": 2473} {"train_loss": -24.480133056640625, "global_step": 205304, "epoch": 2473} {"train_loss": -25.051834106445312, "global_step": 205305, "epoch": 2473} {"train_loss": -24.481412887573242, "global_step": 205306, "epoch": 2473} {"train_loss": -24.34010887145996, "global_step": 205307, "epoch": 2473} {"train_loss": -24.462839126586914, "global_step": 205308, "epoch": 2473} {"train_loss": -24.43329620361328, "global_step": 205309, "epoch": 2473} {"train_loss": -24.4151554107666, "global_step": 205310, "epoch": 2473} {"train_loss": -24.680831909179688, "global_step": 205311, "epoch": 2473} {"train_loss": -24.207477569580078, "global_step": 205312, "epoch": 2473} {"train_loss": -24.21564483642578, "global_step": 205313, "epoch": 2473} {"train_loss": -24.45692253112793, "global_step": 205314, "epoch": 2473} {"train_loss": -23.61550521850586, "global_step": 205315, "epoch": 2473} {"train_loss": -23.2258243560791, "global_step": 205316, "epoch": 2473} {"train_loss": -24.240686416625977, "global_step": 205317, "epoch": 2473} {"train_loss": -24.37685203552246, "global_step": 205318, "epoch": 2473} {"train_loss": -24.184484481811523, "global_step": 205319, "epoch": 2473} {"train_loss": -24.348087310791016, "global_step": 205320, "epoch": 2473} {"train_loss": -23.91619873046875, "global_step": 205321, "epoch": 2473} {"train_loss": -23.849000930786133, "global_step": 205322, "epoch": 2473} {"train_loss": -24.052194595336914, "global_step": 205323, "epoch": 2473} {"train_loss": -24.219717025756836, "global_step": 205324, "epoch": 2473} {"train_loss": -24.077016830444336, "global_step": 205325, "epoch": 2473} {"train_loss": -23.92844581604004, "global_step": 205326, "epoch": 2473} {"train_loss": -24.658735275268555, "global_step": 205327, "epoch": 2473} {"train_loss": -23.842609405517578, "global_step": 205328, "epoch": 2473} {"train_loss": -24.6699161529541, "global_step": 205329, "epoch": 2473} {"train_loss": -24.003602981567383, "global_step": 205330, "epoch": 2473} {"train_loss": -24.184938430786133, "global_step": 205331, "epoch": 2473} {"train_loss": -23.964710235595703, "global_step": 205332, "epoch": 2473} {"train_loss": -24.75840187072754, "global_step": 205333, "epoch": 2473} {"train_loss": -23.939163208007812, "global_step": 205334, "epoch": 2473} {"train_loss": -23.838918685913086, "global_step": 205335, "epoch": 2473} {"train_loss": -24.092031478881836, "global_step": 205336, "epoch": 2473} {"train_loss": -24.223724365234375, "global_step": 205337, "epoch": 2473} {"train_loss": -24.32622528076172, "global_step": 205338, "epoch": 2473} {"train_loss": -24.31569480895996, "global_step": 205339, "epoch": 2473} {"train_loss": -24.78679847717285, "global_step": 205340, "epoch": 2473} {"train_loss": -24.2776366084455, "global_step": 205341, "epoch": 2473, "val_loss": 6633448.0} {"train_loss": -23.6776180267334, "global_step": 205342, "epoch": 2474} {"train_loss": -23.929597854614258, "global_step": 205343, "epoch": 2474} {"train_loss": -23.63411521911621, "global_step": 205344, "epoch": 2474} {"train_loss": -23.78321647644043, "global_step": 205345, "epoch": 2474} {"train_loss": -23.943603515625, "global_step": 205346, "epoch": 2474} {"train_loss": -23.643081665039062, "global_step": 205347, "epoch": 2474} {"train_loss": -23.693952560424805, "global_step": 205348, "epoch": 2474} {"train_loss": -23.54677391052246, "global_step": 205349, "epoch": 2474} {"train_loss": -23.93324089050293, "global_step": 205350, "epoch": 2474} {"train_loss": -23.645139694213867, "global_step": 205351, "epoch": 2474} {"train_loss": -24.003807067871094, "global_step": 205352, "epoch": 2474} {"train_loss": -24.429580688476562, "global_step": 205353, "epoch": 2474} {"train_loss": -24.1411190032959, "global_step": 205354, "epoch": 2474} {"train_loss": -23.95014762878418, "global_step": 205355, "epoch": 2474} {"train_loss": -24.073078155517578, "global_step": 205356, "epoch": 2474} {"train_loss": -23.95949363708496, "global_step": 205357, "epoch": 2474} {"train_loss": -23.951929092407227, "global_step": 205358, "epoch": 2474} {"train_loss": -24.193201065063477, "global_step": 205359, "epoch": 2474} {"train_loss": -23.629560470581055, "global_step": 205360, "epoch": 2474} {"train_loss": -24.052885055541992, "global_step": 205361, "epoch": 2474} {"train_loss": -24.270864486694336, "global_step": 205362, "epoch": 2474} {"train_loss": -24.216821670532227, "global_step": 205363, "epoch": 2474} {"train_loss": -24.169967651367188, "global_step": 205364, "epoch": 2474} {"train_loss": -23.92587661743164, "global_step": 205365, "epoch": 2474} {"train_loss": -24.268110275268555, "global_step": 205366, "epoch": 2474} {"train_loss": -23.930435180664062, "global_step": 205367, "epoch": 2474} {"train_loss": -24.352279663085938, "global_step": 205368, "epoch": 2474} {"train_loss": -24.117431640625, "global_step": 205369, "epoch": 2474} {"train_loss": -24.224597930908203, "global_step": 205370, "epoch": 2474} {"train_loss": -24.214956283569336, "global_step": 205371, "epoch": 2474} {"train_loss": -24.422208786010742, "global_step": 205372, "epoch": 2474} {"train_loss": -24.568845748901367, "global_step": 205373, "epoch": 2474} {"train_loss": -24.091577529907227, "global_step": 205374, "epoch": 2474} {"train_loss": -24.7259464263916, "global_step": 205375, "epoch": 2474} {"train_loss": -24.28957176208496, "global_step": 205376, "epoch": 2474} {"train_loss": -24.54031753540039, "global_step": 205377, "epoch": 2474} {"train_loss": -24.32085609436035, "global_step": 205378, "epoch": 2474} {"train_loss": -24.486114501953125, "global_step": 205379, "epoch": 2474} {"train_loss": -24.36872100830078, "global_step": 205380, "epoch": 2474} {"train_loss": -24.56790542602539, "global_step": 205381, "epoch": 2474} {"train_loss": -24.648941040039062, "global_step": 205382, "epoch": 2474} {"train_loss": -24.504886627197266, "global_step": 205383, "epoch": 2474} {"train_loss": -24.458343505859375, "global_step": 205384, "epoch": 2474} {"train_loss": -24.176776885986328, "global_step": 205385, "epoch": 2474} {"train_loss": -24.58481216430664, "global_step": 205386, "epoch": 2474} {"train_loss": -24.399639129638672, "global_step": 205387, "epoch": 2474} {"train_loss": -24.49643325805664, "global_step": 205388, "epoch": 2474} {"train_loss": -24.311338424682617, "global_step": 205389, "epoch": 2474} {"train_loss": -24.486183166503906, "global_step": 205390, "epoch": 2474} {"train_loss": -24.356576919555664, "global_step": 205391, "epoch": 2474} {"train_loss": -24.57551383972168, "global_step": 205392, "epoch": 2474} {"train_loss": -24.564695358276367, "global_step": 205393, "epoch": 2474} {"train_loss": -24.320449829101562, "global_step": 205394, "epoch": 2474} {"train_loss": -24.290205001831055, "global_step": 205395, "epoch": 2474} {"train_loss": -24.282108306884766, "global_step": 205396, "epoch": 2474} {"train_loss": -24.574466705322266, "global_step": 205397, "epoch": 2474} {"train_loss": -24.27215576171875, "global_step": 205398, "epoch": 2474} {"train_loss": -24.32415771484375, "global_step": 205399, "epoch": 2474} {"train_loss": -24.56157875061035, "global_step": 205400, "epoch": 2474} {"train_loss": -24.11713981628418, "global_step": 205401, "epoch": 2474} {"train_loss": -23.97138023376465, "global_step": 205402, "epoch": 2474} {"train_loss": -24.452640533447266, "global_step": 205403, "epoch": 2474} {"train_loss": -24.36208724975586, "global_step": 205404, "epoch": 2474} {"train_loss": -24.66263198852539, "global_step": 205405, "epoch": 2474} {"train_loss": -23.981386184692383, "global_step": 205406, "epoch": 2474} {"train_loss": -24.250701904296875, "global_step": 205407, "epoch": 2474} {"train_loss": -24.167144775390625, "global_step": 205408, "epoch": 2474} {"train_loss": -24.52589988708496, "global_step": 205409, "epoch": 2474} {"train_loss": -24.424711227416992, "global_step": 205410, "epoch": 2474} {"train_loss": -24.506723403930664, "global_step": 205411, "epoch": 2474} {"train_loss": -24.264968872070312, "global_step": 205412, "epoch": 2474} {"train_loss": -24.54060935974121, "global_step": 205413, "epoch": 2474} {"train_loss": -24.449710845947266, "global_step": 205414, "epoch": 2474} {"train_loss": -24.295700073242188, "global_step": 205415, "epoch": 2474} {"train_loss": -24.282752990722656, "global_step": 205416, "epoch": 2474} {"train_loss": -24.644636154174805, "global_step": 205417, "epoch": 2474} {"train_loss": -24.445234298706055, "global_step": 205418, "epoch": 2474} {"train_loss": -24.404998779296875, "global_step": 205419, "epoch": 2474} {"train_loss": -24.394399642944336, "global_step": 205420, "epoch": 2474} {"train_loss": -24.324142456054688, "global_step": 205421, "epoch": 2474} {"train_loss": -24.299514770507812, "global_step": 205422, "epoch": 2474} {"train_loss": -24.217252731323242, "global_step": 205423, "epoch": 2474} {"train_loss": -24.250967899000788, "global_step": 205424, "epoch": 2474, "val_loss": 6645307.0} {"train_loss": -23.832412719726562, "global_step": 205425, "epoch": 2475} {"train_loss": -23.697355270385742, "global_step": 205426, "epoch": 2475} {"train_loss": -23.72098731994629, "global_step": 205427, "epoch": 2475} {"train_loss": -24.40921401977539, "global_step": 205428, "epoch": 2475} {"train_loss": -23.890920639038086, "global_step": 205429, "epoch": 2475} {"train_loss": -24.271596908569336, "global_step": 205430, "epoch": 2475} {"train_loss": -24.111982345581055, "global_step": 205431, "epoch": 2475} {"train_loss": -24.060871124267578, "global_step": 205432, "epoch": 2475} {"train_loss": -23.957670211791992, "global_step": 205433, "epoch": 2475} {"train_loss": -24.141122817993164, "global_step": 205434, "epoch": 2475} {"train_loss": -23.96993064880371, "global_step": 205435, "epoch": 2475} {"train_loss": -24.25111198425293, "global_step": 205436, "epoch": 2475} {"train_loss": -23.856220245361328, "global_step": 205437, "epoch": 2475} {"train_loss": -24.42574119567871, "global_step": 205438, "epoch": 2475} {"train_loss": -23.8267822265625, "global_step": 205439, "epoch": 2475} {"train_loss": -24.066831588745117, "global_step": 205440, "epoch": 2475} {"train_loss": -24.073631286621094, "global_step": 205441, "epoch": 2475} {"train_loss": -24.054731369018555, "global_step": 205442, "epoch": 2475} {"train_loss": -24.326847076416016, "global_step": 205443, "epoch": 2475} {"train_loss": -23.90500831604004, "global_step": 205444, "epoch": 2475} {"train_loss": -24.11313247680664, "global_step": 205445, "epoch": 2475} {"train_loss": -24.01780128479004, "global_step": 205446, "epoch": 2475} {"train_loss": -24.363637924194336, "global_step": 205447, "epoch": 2475} {"train_loss": -24.034082412719727, "global_step": 205448, "epoch": 2475} {"train_loss": -24.24309730529785, "global_step": 205449, "epoch": 2475} {"train_loss": -24.090463638305664, "global_step": 205450, "epoch": 2475} {"train_loss": -24.37738037109375, "global_step": 205451, "epoch": 2475} {"train_loss": -24.1767520904541, "global_step": 205452, "epoch": 2475} {"train_loss": -23.993375778198242, "global_step": 205453, "epoch": 2475} {"train_loss": -24.331504821777344, "global_step": 205454, "epoch": 2475} {"train_loss": -24.10710334777832, "global_step": 205455, "epoch": 2475} {"train_loss": -24.47743797302246, "global_step": 205456, "epoch": 2475} {"train_loss": -24.46428871154785, "global_step": 205457, "epoch": 2475} {"train_loss": -24.32939338684082, "global_step": 205458, "epoch": 2475} {"train_loss": -24.421710968017578, "global_step": 205459, "epoch": 2475} {"train_loss": -24.394193649291992, "global_step": 205460, "epoch": 2475} {"train_loss": -24.224578857421875, "global_step": 205461, "epoch": 2475} {"train_loss": -24.27609634399414, "global_step": 205462, "epoch": 2475} {"train_loss": -24.465682983398438, "global_step": 205463, "epoch": 2475} {"train_loss": -23.979812622070312, "global_step": 205464, "epoch": 2475} {"train_loss": -24.072507858276367, "global_step": 205465, "epoch": 2475} {"train_loss": -24.668987274169922, "global_step": 205466, "epoch": 2475} {"train_loss": -23.961332321166992, "global_step": 205467, "epoch": 2475} {"train_loss": -24.245874404907227, "global_step": 205468, "epoch": 2475} {"train_loss": -24.538000106811523, "global_step": 205469, "epoch": 2475} {"train_loss": -24.17635154724121, "global_step": 205470, "epoch": 2475} {"train_loss": -24.514333724975586, "global_step": 205471, "epoch": 2475} {"train_loss": -24.014591217041016, "global_step": 205472, "epoch": 2475} {"train_loss": -24.8259220123291, "global_step": 205473, "epoch": 2475} {"train_loss": -24.725561141967773, "global_step": 205474, "epoch": 2475} {"train_loss": -24.277921676635742, "global_step": 205475, "epoch": 2475} {"train_loss": -24.08540916442871, "global_step": 205476, "epoch": 2475} {"train_loss": -24.586469650268555, "global_step": 205477, "epoch": 2475} {"train_loss": -24.29339599609375, "global_step": 205478, "epoch": 2475} {"train_loss": -24.64656639099121, "global_step": 205479, "epoch": 2475} {"train_loss": -24.59403419494629, "global_step": 205480, "epoch": 2475} {"train_loss": -24.41375732421875, "global_step": 205481, "epoch": 2475} {"train_loss": -24.901601791381836, "global_step": 205482, "epoch": 2475} {"train_loss": -24.235450744628906, "global_step": 205483, "epoch": 2475} {"train_loss": -24.534761428833008, "global_step": 205484, "epoch": 2475} {"train_loss": -24.503154754638672, "global_step": 205485, "epoch": 2475} {"train_loss": -24.37592887878418, "global_step": 205486, "epoch": 2475} {"train_loss": -24.44736099243164, "global_step": 205487, "epoch": 2475} {"train_loss": -24.386539459228516, "global_step": 205488, "epoch": 2475} {"train_loss": -24.149444580078125, "global_step": 205489, "epoch": 2475} {"train_loss": -24.059274673461914, "global_step": 205490, "epoch": 2475} {"train_loss": -24.130146026611328, "global_step": 205491, "epoch": 2475} {"train_loss": -24.504566192626953, "global_step": 205492, "epoch": 2475} {"train_loss": -24.201589584350586, "global_step": 205493, "epoch": 2475} {"train_loss": -24.061140060424805, "global_step": 205494, "epoch": 2475} {"train_loss": -24.473087310791016, "global_step": 205495, "epoch": 2475} {"train_loss": -24.04459571838379, "global_step": 205496, "epoch": 2475} {"train_loss": -24.362709045410156, "global_step": 205497, "epoch": 2475} {"train_loss": -24.46170997619629, "global_step": 205498, "epoch": 2475} {"train_loss": -24.09228515625, "global_step": 205499, "epoch": 2475} {"train_loss": -24.28537940979004, "global_step": 205500, "epoch": 2475} {"train_loss": -24.21027183532715, "global_step": 205501, "epoch": 2475} {"train_loss": -24.090612411499023, "global_step": 205502, "epoch": 2475} {"train_loss": -24.916614532470703, "global_step": 205503, "epoch": 2475} {"train_loss": -24.368070602416992, "global_step": 205504, "epoch": 2475} {"train_loss": -24.206424713134766, "global_step": 205505, "epoch": 2475} {"train_loss": -24.201297760009766, "global_step": 205506, "epoch": 2475} {"train_loss": -24.266114499195513, "global_step": 205507, "epoch": 2475, "val_loss": 6537288.0} {"train_loss": -23.542490005493164, "global_step": 205508, "epoch": 2476} {"train_loss": -24.086347579956055, "global_step": 205509, "epoch": 2476} {"train_loss": -24.09406852722168, "global_step": 205510, "epoch": 2476} {"train_loss": -23.84419822692871, "global_step": 205511, "epoch": 2476} {"train_loss": -23.915739059448242, "global_step": 205512, "epoch": 2476} {"train_loss": -23.76219367980957, "global_step": 205513, "epoch": 2476} {"train_loss": -23.921457290649414, "global_step": 205514, "epoch": 2476} {"train_loss": -23.804794311523438, "global_step": 205515, "epoch": 2476} {"train_loss": -24.032270431518555, "global_step": 205516, "epoch": 2476} {"train_loss": -24.093076705932617, "global_step": 205517, "epoch": 2476} {"train_loss": -24.17313575744629, "global_step": 205518, "epoch": 2476} {"train_loss": -24.020959854125977, "global_step": 205519, "epoch": 2476} {"train_loss": -24.111501693725586, "global_step": 205520, "epoch": 2476} {"train_loss": -24.299179077148438, "global_step": 205521, "epoch": 2476} {"train_loss": -24.327289581298828, "global_step": 205522, "epoch": 2476} {"train_loss": -24.365488052368164, "global_step": 205523, "epoch": 2476} {"train_loss": -24.466703414916992, "global_step": 205524, "epoch": 2476} {"train_loss": -24.04864501953125, "global_step": 205525, "epoch": 2476} {"train_loss": -24.189029693603516, "global_step": 205526, "epoch": 2476} {"train_loss": -24.22430419921875, "global_step": 205527, "epoch": 2476} {"train_loss": -24.249435424804688, "global_step": 205528, "epoch": 2476} {"train_loss": -24.3746280670166, "global_step": 205529, "epoch": 2476} {"train_loss": -23.940649032592773, "global_step": 205530, "epoch": 2476} {"train_loss": -24.493967056274414, "global_step": 205531, "epoch": 2476} {"train_loss": -24.514507293701172, "global_step": 205532, "epoch": 2476} {"train_loss": -24.2347354888916, "global_step": 205533, "epoch": 2476} {"train_loss": -24.501325607299805, "global_step": 205534, "epoch": 2476} {"train_loss": -24.45306968688965, "global_step": 205535, "epoch": 2476} {"train_loss": -24.18696403503418, "global_step": 205536, "epoch": 2476} {"train_loss": -24.651077270507812, "global_step": 205537, "epoch": 2476} {"train_loss": -24.695783615112305, "global_step": 205538, "epoch": 2476} {"train_loss": -24.643529891967773, "global_step": 205539, "epoch": 2476} {"train_loss": -24.376951217651367, "global_step": 205540, "epoch": 2476} {"train_loss": -24.72711181640625, "global_step": 205541, "epoch": 2476} {"train_loss": -24.255949020385742, "global_step": 205542, "epoch": 2476} {"train_loss": -24.580503463745117, "global_step": 205543, "epoch": 2476} {"train_loss": -24.290512084960938, "global_step": 205544, "epoch": 2476} {"train_loss": -24.296560287475586, "global_step": 205545, "epoch": 2476} {"train_loss": -24.1939754486084, "global_step": 205546, "epoch": 2476} {"train_loss": -24.48143768310547, "global_step": 205547, "epoch": 2476} {"train_loss": -24.16269302368164, "global_step": 205548, "epoch": 2476} {"train_loss": -24.336816787719727, "global_step": 205549, "epoch": 2476} {"train_loss": -24.216588973999023, "global_step": 205550, "epoch": 2476} {"train_loss": -24.557174682617188, "global_step": 205551, "epoch": 2476} {"train_loss": -24.484411239624023, "global_step": 205552, "epoch": 2476} {"train_loss": -24.28718376159668, "global_step": 205553, "epoch": 2476} {"train_loss": -24.433502197265625, "global_step": 205554, "epoch": 2476} {"train_loss": -24.35542106628418, "global_step": 205555, "epoch": 2476} {"train_loss": -23.949853897094727, "global_step": 205556, "epoch": 2476} {"train_loss": -24.37137222290039, "global_step": 205557, "epoch": 2476} {"train_loss": -24.128767013549805, "global_step": 205558, "epoch": 2476} {"train_loss": -24.613283157348633, "global_step": 205559, "epoch": 2476} {"train_loss": -24.60198974609375, "global_step": 205560, "epoch": 2476} {"train_loss": -24.36213493347168, "global_step": 205561, "epoch": 2476} {"train_loss": -25.00827980041504, "global_step": 205562, "epoch": 2476} {"train_loss": -24.382665634155273, "global_step": 205563, "epoch": 2476} {"train_loss": -24.43088150024414, "global_step": 205564, "epoch": 2476} {"train_loss": -24.82649803161621, "global_step": 205565, "epoch": 2476} {"train_loss": -24.354455947875977, "global_step": 205566, "epoch": 2476} {"train_loss": -24.403514862060547, "global_step": 205567, "epoch": 2476} {"train_loss": -24.04425048828125, "global_step": 205568, "epoch": 2476} {"train_loss": -24.357877731323242, "global_step": 205569, "epoch": 2476} {"train_loss": -24.186290740966797, "global_step": 205570, "epoch": 2476} {"train_loss": -24.746950149536133, "global_step": 205571, "epoch": 2476} {"train_loss": -24.517080307006836, "global_step": 205572, "epoch": 2476} {"train_loss": -24.428565979003906, "global_step": 205573, "epoch": 2476} {"train_loss": -24.4188289642334, "global_step": 205574, "epoch": 2476} {"train_loss": -24.25312614440918, "global_step": 205575, "epoch": 2476} {"train_loss": -24.217390060424805, "global_step": 205576, "epoch": 2476} {"train_loss": -24.848913192749023, "global_step": 205577, "epoch": 2476} {"train_loss": -23.94692039489746, "global_step": 205578, "epoch": 2476} {"train_loss": -24.49323081970215, "global_step": 205579, "epoch": 2476} {"train_loss": -24.39200210571289, "global_step": 205580, "epoch": 2476} {"train_loss": -24.17070198059082, "global_step": 205581, "epoch": 2476} {"train_loss": -24.598600387573242, "global_step": 205582, "epoch": 2476} {"train_loss": -24.110273361206055, "global_step": 205583, "epoch": 2476} {"train_loss": -24.709125518798828, "global_step": 205584, "epoch": 2476} {"train_loss": -24.16172218322754, "global_step": 205585, "epoch": 2476} {"train_loss": -24.497455596923828, "global_step": 205586, "epoch": 2476} {"train_loss": -24.308897018432617, "global_step": 205587, "epoch": 2476} {"train_loss": -24.34052085876465, "global_step": 205588, "epoch": 2476} {"train_loss": -24.36862564086914, "global_step": 205589, "epoch": 2476} {"train_loss": -24.31160526965038, "global_step": 205590, "epoch": 2476, "val_loss": 6627683.5} {"train_loss": -23.788312911987305, "global_step": 205591, "epoch": 2477} {"train_loss": -23.883346557617188, "global_step": 205592, "epoch": 2477} {"train_loss": -23.786983489990234, "global_step": 205593, "epoch": 2477} {"train_loss": -23.718229293823242, "global_step": 205594, "epoch": 2477} {"train_loss": -23.70176124572754, "global_step": 205595, "epoch": 2477} {"train_loss": -24.32061195373535, "global_step": 205596, "epoch": 2477} {"train_loss": -23.726282119750977, "global_step": 205597, "epoch": 2477} {"train_loss": -24.160905838012695, "global_step": 205598, "epoch": 2477} {"train_loss": -23.71142578125, "global_step": 205599, "epoch": 2477} {"train_loss": -24.009008407592773, "global_step": 205600, "epoch": 2477} {"train_loss": -23.671350479125977, "global_step": 205601, "epoch": 2477} {"train_loss": -23.885278701782227, "global_step": 205602, "epoch": 2477} {"train_loss": -23.897817611694336, "global_step": 205603, "epoch": 2477} {"train_loss": -23.952314376831055, "global_step": 205604, "epoch": 2477} {"train_loss": -24.52414321899414, "global_step": 205605, "epoch": 2477} {"train_loss": -24.29167366027832, "global_step": 205606, "epoch": 2477} {"train_loss": -24.49547004699707, "global_step": 205607, "epoch": 2477} {"train_loss": -24.37993812561035, "global_step": 205608, "epoch": 2477} {"train_loss": -24.065271377563477, "global_step": 205609, "epoch": 2477} {"train_loss": -24.191877365112305, "global_step": 205610, "epoch": 2477} {"train_loss": -24.383756637573242, "global_step": 205611, "epoch": 2477} {"train_loss": -23.675445556640625, "global_step": 205612, "epoch": 2477} {"train_loss": -24.475873947143555, "global_step": 205613, "epoch": 2477} {"train_loss": -24.132415771484375, "global_step": 205614, "epoch": 2477} {"train_loss": -23.582056045532227, "global_step": 205615, "epoch": 2477} {"train_loss": -24.419843673706055, "global_step": 205616, "epoch": 2477} {"train_loss": -24.259817123413086, "global_step": 205617, "epoch": 2477} {"train_loss": -24.06098175048828, "global_step": 205618, "epoch": 2477} {"train_loss": -24.14400291442871, "global_step": 205619, "epoch": 2477} {"train_loss": -24.165678024291992, "global_step": 205620, "epoch": 2477} {"train_loss": -24.014972686767578, "global_step": 205621, "epoch": 2477} {"train_loss": -23.9383602142334, "global_step": 205622, "epoch": 2477} {"train_loss": -23.846923828125, "global_step": 205623, "epoch": 2477} {"train_loss": -24.345136642456055, "global_step": 205624, "epoch": 2477} {"train_loss": -24.04341697692871, "global_step": 205625, "epoch": 2477} {"train_loss": -24.330047607421875, "global_step": 205626, "epoch": 2477} {"train_loss": -24.29644775390625, "global_step": 205627, "epoch": 2477} {"train_loss": -24.30670166015625, "global_step": 205628, "epoch": 2477} {"train_loss": -24.4788875579834, "global_step": 205629, "epoch": 2477} {"train_loss": -24.4300479888916, "global_step": 205630, "epoch": 2477} {"train_loss": -24.282438278198242, "global_step": 205631, "epoch": 2477} {"train_loss": -24.40924644470215, "global_step": 205632, "epoch": 2477} {"train_loss": -24.813016891479492, "global_step": 205633, "epoch": 2477} {"train_loss": -24.363576889038086, "global_step": 205634, "epoch": 2477} {"train_loss": -24.62312889099121, "global_step": 205635, "epoch": 2477} {"train_loss": -24.18282127380371, "global_step": 205636, "epoch": 2477} {"train_loss": -24.385086059570312, "global_step": 205637, "epoch": 2477} {"train_loss": -24.707324981689453, "global_step": 205638, "epoch": 2477} {"train_loss": -24.46648597717285, "global_step": 205639, "epoch": 2477} {"train_loss": -24.645071029663086, "global_step": 205640, "epoch": 2477} {"train_loss": -24.01063346862793, "global_step": 205641, "epoch": 2477} {"train_loss": -24.034290313720703, "global_step": 205642, "epoch": 2477} {"train_loss": -24.583202362060547, "global_step": 205643, "epoch": 2477} {"train_loss": -24.0784912109375, "global_step": 205644, "epoch": 2477} {"train_loss": -24.63192367553711, "global_step": 205645, "epoch": 2477} {"train_loss": -24.475194931030273, "global_step": 205646, "epoch": 2477} {"train_loss": -24.482852935791016, "global_step": 205647, "epoch": 2477} {"train_loss": -24.077787399291992, "global_step": 205648, "epoch": 2477} {"train_loss": -24.130285263061523, "global_step": 205649, "epoch": 2477} {"train_loss": -24.497617721557617, "global_step": 205650, "epoch": 2477} {"train_loss": -24.13568115234375, "global_step": 205651, "epoch": 2477} {"train_loss": -24.20794105529785, "global_step": 205652, "epoch": 2477} {"train_loss": -24.093658447265625, "global_step": 205653, "epoch": 2477} {"train_loss": -24.09381675720215, "global_step": 205654, "epoch": 2477} {"train_loss": -23.882482528686523, "global_step": 205655, "epoch": 2477} {"train_loss": -24.32673454284668, "global_step": 205656, "epoch": 2477} {"train_loss": -24.562164306640625, "global_step": 205657, "epoch": 2477} {"train_loss": -23.898168563842773, "global_step": 205658, "epoch": 2477} {"train_loss": -24.05743980407715, "global_step": 205659, "epoch": 2477} {"train_loss": -24.128925323486328, "global_step": 205660, "epoch": 2477} {"train_loss": -24.200824737548828, "global_step": 205661, "epoch": 2477} {"train_loss": -24.41263771057129, "global_step": 205662, "epoch": 2477} {"train_loss": -24.253488540649414, "global_step": 205663, "epoch": 2477} {"train_loss": -24.304494857788086, "global_step": 205664, "epoch": 2477} {"train_loss": -24.541547775268555, "global_step": 205665, "epoch": 2477} {"train_loss": -24.077329635620117, "global_step": 205666, "epoch": 2477} {"train_loss": -24.416784286499023, "global_step": 205667, "epoch": 2477} {"train_loss": -24.429311752319336, "global_step": 205668, "epoch": 2477} {"train_loss": -24.591388702392578, "global_step": 205669, "epoch": 2477} {"train_loss": -24.380401611328125, "global_step": 205670, "epoch": 2477} {"train_loss": -24.399890899658203, "global_step": 205671, "epoch": 2477} {"train_loss": -24.08266830444336, "global_step": 205672, "epoch": 2477} {"train_loss": -24.21030731660774, "global_step": 205673, "epoch": 2477, "val_loss": 6598870.0} {"train_loss": -23.919782638549805, "global_step": 205674, "epoch": 2478} {"train_loss": -24.268497467041016, "global_step": 205675, "epoch": 2478} {"train_loss": -23.725425720214844, "global_step": 205676, "epoch": 2478} {"train_loss": -23.82815170288086, "global_step": 205677, "epoch": 2478} {"train_loss": -23.64504051208496, "global_step": 205678, "epoch": 2478} {"train_loss": -24.32161521911621, "global_step": 205679, "epoch": 2478} {"train_loss": -23.802160263061523, "global_step": 205680, "epoch": 2478} {"train_loss": -24.534276962280273, "global_step": 205681, "epoch": 2478} {"train_loss": -23.65216827392578, "global_step": 205682, "epoch": 2478} {"train_loss": -23.983861923217773, "global_step": 205683, "epoch": 2478} {"train_loss": -23.770227432250977, "global_step": 205684, "epoch": 2478} {"train_loss": -24.11676025390625, "global_step": 205685, "epoch": 2478} {"train_loss": -24.204547882080078, "global_step": 205686, "epoch": 2478} {"train_loss": -24.373483657836914, "global_step": 205687, "epoch": 2478} {"train_loss": -24.108800888061523, "global_step": 205688, "epoch": 2478} {"train_loss": -23.990081787109375, "global_step": 205689, "epoch": 2478} {"train_loss": -24.22037124633789, "global_step": 205690, "epoch": 2478} {"train_loss": -24.31631088256836, "global_step": 205691, "epoch": 2478} {"train_loss": -23.743492126464844, "global_step": 205692, "epoch": 2478} {"train_loss": -24.24568748474121, "global_step": 205693, "epoch": 2478} {"train_loss": -24.290138244628906, "global_step": 205694, "epoch": 2478} {"train_loss": -23.89652442932129, "global_step": 205695, "epoch": 2478} {"train_loss": -24.14742660522461, "global_step": 205696, "epoch": 2478} {"train_loss": -23.934955596923828, "global_step": 205697, "epoch": 2478} {"train_loss": -24.423891067504883, "global_step": 205698, "epoch": 2478} {"train_loss": -24.473312377929688, "global_step": 205699, "epoch": 2478} {"train_loss": -24.19370460510254, "global_step": 205700, "epoch": 2478} {"train_loss": -24.376535415649414, "global_step": 205701, "epoch": 2478} {"train_loss": -24.29560661315918, "global_step": 205702, "epoch": 2478} {"train_loss": -24.071664810180664, "global_step": 205703, "epoch": 2478} {"train_loss": -24.508825302124023, "global_step": 205704, "epoch": 2478} {"train_loss": -24.73359489440918, "global_step": 205705, "epoch": 2478} {"train_loss": -24.44955825805664, "global_step": 205706, "epoch": 2478} {"train_loss": -23.853818893432617, "global_step": 205707, "epoch": 2478} {"train_loss": -24.186763763427734, "global_step": 205708, "epoch": 2478} {"train_loss": -24.344541549682617, "global_step": 205709, "epoch": 2478} {"train_loss": -24.65201759338379, "global_step": 205710, "epoch": 2478} {"train_loss": -24.71217155456543, "global_step": 205711, "epoch": 2478} {"train_loss": -24.55457878112793, "global_step": 205712, "epoch": 2478} {"train_loss": -24.43818473815918, "global_step": 205713, "epoch": 2478} {"train_loss": -24.067516326904297, "global_step": 205714, "epoch": 2478} {"train_loss": -24.340314865112305, "global_step": 205715, "epoch": 2478} {"train_loss": -24.016660690307617, "global_step": 205716, "epoch": 2478} {"train_loss": -24.58760643005371, "global_step": 205717, "epoch": 2478} {"train_loss": -24.589920043945312, "global_step": 205718, "epoch": 2478} {"train_loss": -24.576984405517578, "global_step": 205719, "epoch": 2478} {"train_loss": -24.593448638916016, "global_step": 205720, "epoch": 2478} {"train_loss": -23.938722610473633, "global_step": 205721, "epoch": 2478} {"train_loss": -24.62648582458496, "global_step": 205722, "epoch": 2478} {"train_loss": -24.631153106689453, "global_step": 205723, "epoch": 2478} {"train_loss": -24.45326042175293, "global_step": 205724, "epoch": 2478} {"train_loss": -24.536762237548828, "global_step": 205725, "epoch": 2478} {"train_loss": -24.07124900817871, "global_step": 205726, "epoch": 2478} {"train_loss": -24.468534469604492, "global_step": 205727, "epoch": 2478} {"train_loss": -24.487808227539062, "global_step": 205728, "epoch": 2478} {"train_loss": -24.276161193847656, "global_step": 205729, "epoch": 2478} {"train_loss": -24.137527465820312, "global_step": 205730, "epoch": 2478} {"train_loss": -24.553794860839844, "global_step": 205731, "epoch": 2478} {"train_loss": -24.555418014526367, "global_step": 205732, "epoch": 2478} {"train_loss": -24.447385787963867, "global_step": 205733, "epoch": 2478} {"train_loss": -24.368955612182617, "global_step": 205734, "epoch": 2478} {"train_loss": -24.111501693725586, "global_step": 205735, "epoch": 2478} {"train_loss": -24.162233352661133, "global_step": 205736, "epoch": 2478} {"train_loss": -24.476953506469727, "global_step": 205737, "epoch": 2478} {"train_loss": -24.458438873291016, "global_step": 205738, "epoch": 2478} {"train_loss": -24.620656967163086, "global_step": 205739, "epoch": 2478} {"train_loss": -24.190288543701172, "global_step": 205740, "epoch": 2478} {"train_loss": -24.319974899291992, "global_step": 205741, "epoch": 2478} {"train_loss": -24.609670639038086, "global_step": 205742, "epoch": 2478} {"train_loss": -24.293363571166992, "global_step": 205743, "epoch": 2478} {"train_loss": -24.181943893432617, "global_step": 205744, "epoch": 2478} {"train_loss": -24.444473266601562, "global_step": 205745, "epoch": 2478} {"train_loss": -24.075946807861328, "global_step": 205746, "epoch": 2478} {"train_loss": -24.461565017700195, "global_step": 205747, "epoch": 2478} {"train_loss": -24.389036178588867, "global_step": 205748, "epoch": 2478} {"train_loss": -24.232791900634766, "global_step": 205749, "epoch": 2478} {"train_loss": -24.03790855407715, "global_step": 205750, "epoch": 2478} {"train_loss": -23.896482467651367, "global_step": 205751, "epoch": 2478} {"train_loss": -24.13651466369629, "global_step": 205752, "epoch": 2478} {"train_loss": -24.386571884155273, "global_step": 205753, "epoch": 2478} {"train_loss": -24.569921493530273, "global_step": 205754, "epoch": 2478} {"train_loss": -24.258132934570312, "global_step": 205755, "epoch": 2478} {"train_loss": -24.25430722983487, "global_step": 205756, "epoch": 2478, "val_loss": 6491733.0} {"train_loss": -23.312231063842773, "global_step": 205757, "epoch": 2479} {"train_loss": -23.695316314697266, "global_step": 205758, "epoch": 2479} {"train_loss": -23.488903045654297, "global_step": 205759, "epoch": 2479} {"train_loss": -23.873886108398438, "global_step": 205760, "epoch": 2479} {"train_loss": -23.5577449798584, "global_step": 205761, "epoch": 2479} {"train_loss": -23.76521110534668, "global_step": 205762, "epoch": 2479} {"train_loss": -23.36406898498535, "global_step": 205763, "epoch": 2479} {"train_loss": -23.638534545898438, "global_step": 205764, "epoch": 2479} {"train_loss": -23.69867515563965, "global_step": 205765, "epoch": 2479} {"train_loss": -23.616130828857422, "global_step": 205766, "epoch": 2479} {"train_loss": -23.728605270385742, "global_step": 205767, "epoch": 2479} {"train_loss": -24.021316528320312, "global_step": 205768, "epoch": 2479} {"train_loss": -23.688871383666992, "global_step": 205769, "epoch": 2479} {"train_loss": -24.162967681884766, "global_step": 205770, "epoch": 2479} {"train_loss": -24.22821617126465, "global_step": 205771, "epoch": 2479} {"train_loss": -23.721038818359375, "global_step": 205772, "epoch": 2479} {"train_loss": -24.068042755126953, "global_step": 205773, "epoch": 2479} {"train_loss": -23.906517028808594, "global_step": 205774, "epoch": 2479} {"train_loss": -23.7504940032959, "global_step": 205775, "epoch": 2479} {"train_loss": -24.256431579589844, "global_step": 205776, "epoch": 2479} {"train_loss": -23.99500846862793, "global_step": 205777, "epoch": 2479} {"train_loss": -24.305700302124023, "global_step": 205778, "epoch": 2479} {"train_loss": -24.009811401367188, "global_step": 205779, "epoch": 2479} {"train_loss": -23.878097534179688, "global_step": 205780, "epoch": 2479} {"train_loss": -24.349061965942383, "global_step": 205781, "epoch": 2479} {"train_loss": -24.134815216064453, "global_step": 205782, "epoch": 2479} {"train_loss": -24.03904151916504, "global_step": 205783, "epoch": 2479} {"train_loss": -24.03773307800293, "global_step": 205784, "epoch": 2479} {"train_loss": -24.3297176361084, "global_step": 205785, "epoch": 2479} {"train_loss": -24.01592445373535, "global_step": 205786, "epoch": 2479} {"train_loss": -24.143844604492188, "global_step": 205787, "epoch": 2479} {"train_loss": -24.356582641601562, "global_step": 205788, "epoch": 2479} {"train_loss": -24.385801315307617, "global_step": 205789, "epoch": 2479} {"train_loss": -24.545307159423828, "global_step": 205790, "epoch": 2479} {"train_loss": -24.560962677001953, "global_step": 205791, "epoch": 2479} {"train_loss": -24.47772979736328, "global_step": 205792, "epoch": 2479} {"train_loss": -24.017318725585938, "global_step": 205793, "epoch": 2479} {"train_loss": -24.488515853881836, "global_step": 205794, "epoch": 2479} {"train_loss": -24.786731719970703, "global_step": 205795, "epoch": 2479} {"train_loss": -24.213754653930664, "global_step": 205796, "epoch": 2479} {"train_loss": -24.43577003479004, "global_step": 205797, "epoch": 2479} {"train_loss": -24.35566520690918, "global_step": 205798, "epoch": 2479} {"train_loss": -24.667339324951172, "global_step": 205799, "epoch": 2479} {"train_loss": -24.24358558654785, "global_step": 205800, "epoch": 2479} {"train_loss": -24.266916275024414, "global_step": 205801, "epoch": 2479} {"train_loss": -24.511472702026367, "global_step": 205802, "epoch": 2479} {"train_loss": -24.1937255859375, "global_step": 205803, "epoch": 2479} {"train_loss": -24.369539260864258, "global_step": 205804, "epoch": 2479} {"train_loss": -24.183704376220703, "global_step": 205805, "epoch": 2479} {"train_loss": -24.590713500976562, "global_step": 205806, "epoch": 2479} {"train_loss": -24.401472091674805, "global_step": 205807, "epoch": 2479} {"train_loss": -24.482898712158203, "global_step": 205808, "epoch": 2479} {"train_loss": -24.40845489501953, "global_step": 205809, "epoch": 2479} {"train_loss": -24.7005615234375, "global_step": 205810, "epoch": 2479} {"train_loss": -24.452360153198242, "global_step": 205811, "epoch": 2479} {"train_loss": -24.02278709411621, "global_step": 205812, "epoch": 2479} {"train_loss": -24.30999755859375, "global_step": 205813, "epoch": 2479} {"train_loss": -24.316329956054688, "global_step": 205814, "epoch": 2479} {"train_loss": -24.401966094970703, "global_step": 205815, "epoch": 2479} {"train_loss": -24.515953063964844, "global_step": 205816, "epoch": 2479} {"train_loss": -24.168607711791992, "global_step": 205817, "epoch": 2479} {"train_loss": -24.344772338867188, "global_step": 205818, "epoch": 2479} {"train_loss": -24.589492797851562, "global_step": 205819, "epoch": 2479} {"train_loss": -24.65119743347168, "global_step": 205820, "epoch": 2479} {"train_loss": -24.739187240600586, "global_step": 205821, "epoch": 2479} {"train_loss": -24.58730125427246, "global_step": 205822, "epoch": 2479} {"train_loss": -24.66127586364746, "global_step": 205823, "epoch": 2479} {"train_loss": -24.588048934936523, "global_step": 205824, "epoch": 2479} {"train_loss": -24.522802352905273, "global_step": 205825, "epoch": 2479} {"train_loss": -24.106945037841797, "global_step": 205826, "epoch": 2479} {"train_loss": -24.258970260620117, "global_step": 205827, "epoch": 2479} {"train_loss": -24.367477416992188, "global_step": 205828, "epoch": 2479} {"train_loss": -23.79336929321289, "global_step": 205829, "epoch": 2479} {"train_loss": -24.19454002380371, "global_step": 205830, "epoch": 2479} {"train_loss": -24.1151065826416, "global_step": 205831, "epoch": 2479} {"train_loss": -23.493261337280273, "global_step": 205832, "epoch": 2479} {"train_loss": -24.4267578125, "global_step": 205833, "epoch": 2479} {"train_loss": -24.071569442749023, "global_step": 205834, "epoch": 2479} {"train_loss": -23.869977951049805, "global_step": 205835, "epoch": 2479} {"train_loss": -24.246816635131836, "global_step": 205836, "epoch": 2479} {"train_loss": -24.79134178161621, "global_step": 205837, "epoch": 2479} {"train_loss": -23.94666862487793, "global_step": 205838, "epoch": 2479} {"train_loss": -24.187887237732667, "global_step": 205839, "epoch": 2479, "val_loss": 6631473.0} {"train_loss": -23.76350212097168, "global_step": 205840, "epoch": 2480} {"train_loss": -24.118980407714844, "global_step": 205841, "epoch": 2480} {"train_loss": -23.891674041748047, "global_step": 205842, "epoch": 2480} {"train_loss": -23.825641632080078, "global_step": 205843, "epoch": 2480} {"train_loss": -23.771883010864258, "global_step": 205844, "epoch": 2480} {"train_loss": -23.849668502807617, "global_step": 205845, "epoch": 2480} {"train_loss": -24.20489501953125, "global_step": 205846, "epoch": 2480} {"train_loss": -23.946857452392578, "global_step": 205847, "epoch": 2480} {"train_loss": -24.10471534729004, "global_step": 205848, "epoch": 2480} {"train_loss": -24.124189376831055, "global_step": 205849, "epoch": 2480} {"train_loss": -24.275251388549805, "global_step": 205850, "epoch": 2480} {"train_loss": -24.21714973449707, "global_step": 205851, "epoch": 2480} {"train_loss": -24.384536743164062, "global_step": 205852, "epoch": 2480} {"train_loss": -24.10573387145996, "global_step": 205853, "epoch": 2480} {"train_loss": -24.028955459594727, "global_step": 205854, "epoch": 2480} {"train_loss": -24.429807662963867, "global_step": 205855, "epoch": 2480} {"train_loss": -24.095720291137695, "global_step": 205856, "epoch": 2480} {"train_loss": -24.17879295349121, "global_step": 205857, "epoch": 2480} {"train_loss": -24.337663650512695, "global_step": 205858, "epoch": 2480} {"train_loss": -24.227270126342773, "global_step": 205859, "epoch": 2480} {"train_loss": -24.30915641784668, "global_step": 205860, "epoch": 2480} {"train_loss": -24.526517868041992, "global_step": 205861, "epoch": 2480} {"train_loss": -24.567731857299805, "global_step": 205862, "epoch": 2480} {"train_loss": -24.589635848999023, "global_step": 205863, "epoch": 2480} {"train_loss": -24.38314437866211, "global_step": 205864, "epoch": 2480} {"train_loss": -24.1132755279541, "global_step": 205865, "epoch": 2480} {"train_loss": -24.50887107849121, "global_step": 205866, "epoch": 2480} {"train_loss": -24.30307960510254, "global_step": 205867, "epoch": 2480} {"train_loss": -24.495317459106445, "global_step": 205868, "epoch": 2480} {"train_loss": -24.159637451171875, "global_step": 205869, "epoch": 2480} {"train_loss": -24.50571632385254, "global_step": 205870, "epoch": 2480} {"train_loss": -24.36073875427246, "global_step": 205871, "epoch": 2480} {"train_loss": -24.36245346069336, "global_step": 205872, "epoch": 2480} {"train_loss": -24.232864379882812, "global_step": 205873, "epoch": 2480} {"train_loss": -24.705913543701172, "global_step": 205874, "epoch": 2480} {"train_loss": -24.55686378479004, "global_step": 205875, "epoch": 2480} {"train_loss": -24.470197677612305, "global_step": 205876, "epoch": 2480} {"train_loss": -24.94129753112793, "global_step": 205877, "epoch": 2480} {"train_loss": -24.44699478149414, "global_step": 205878, "epoch": 2480} {"train_loss": -24.565685272216797, "global_step": 205879, "epoch": 2480} {"train_loss": -24.48748779296875, "global_step": 205880, "epoch": 2480} {"train_loss": -24.258892059326172, "global_step": 205881, "epoch": 2480} {"train_loss": -24.25162124633789, "global_step": 205882, "epoch": 2480} {"train_loss": -24.383703231811523, "global_step": 205883, "epoch": 2480} {"train_loss": -24.250303268432617, "global_step": 205884, "epoch": 2480} {"train_loss": -24.063085556030273, "global_step": 205885, "epoch": 2480} {"train_loss": -24.05060386657715, "global_step": 205886, "epoch": 2480} {"train_loss": -24.28946876525879, "global_step": 205887, "epoch": 2480} {"train_loss": -24.5633602142334, "global_step": 205888, "epoch": 2480} {"train_loss": -24.159408569335938, "global_step": 205889, "epoch": 2480} {"train_loss": -24.03365135192871, "global_step": 205890, "epoch": 2480} {"train_loss": -24.526111602783203, "global_step": 205891, "epoch": 2480} {"train_loss": -24.251127243041992, "global_step": 205892, "epoch": 2480} {"train_loss": -24.340673446655273, "global_step": 205893, "epoch": 2480} {"train_loss": -24.523906707763672, "global_step": 205894, "epoch": 2480} {"train_loss": -24.195697784423828, "global_step": 205895, "epoch": 2480} {"train_loss": -24.544790267944336, "global_step": 205896, "epoch": 2480} {"train_loss": -24.350465774536133, "global_step": 205897, "epoch": 2480} {"train_loss": -24.8260498046875, "global_step": 205898, "epoch": 2480} {"train_loss": -24.11684226989746, "global_step": 205899, "epoch": 2480} {"train_loss": -24.00083351135254, "global_step": 205900, "epoch": 2480} {"train_loss": -24.33217430114746, "global_step": 205901, "epoch": 2480} {"train_loss": -24.6872615814209, "global_step": 205902, "epoch": 2480} {"train_loss": -24.62265396118164, "global_step": 205903, "epoch": 2480} {"train_loss": -24.28258514404297, "global_step": 205904, "epoch": 2480} {"train_loss": -24.41023826599121, "global_step": 205905, "epoch": 2480} {"train_loss": -24.137426376342773, "global_step": 205906, "epoch": 2480} {"train_loss": -24.587976455688477, "global_step": 205907, "epoch": 2480} {"train_loss": -24.696271896362305, "global_step": 205908, "epoch": 2480} {"train_loss": -24.902877807617188, "global_step": 205909, "epoch": 2480} {"train_loss": -24.430105209350586, "global_step": 205910, "epoch": 2480} {"train_loss": -24.03304100036621, "global_step": 205911, "epoch": 2480} {"train_loss": -24.110092163085938, "global_step": 205912, "epoch": 2480} {"train_loss": -24.340869903564453, "global_step": 205913, "epoch": 2480} {"train_loss": -24.396100997924805, "global_step": 205914, "epoch": 2480} {"train_loss": -24.024717330932617, "global_step": 205915, "epoch": 2480} {"train_loss": -24.345001220703125, "global_step": 205916, "epoch": 2480} {"train_loss": -24.397628784179688, "global_step": 205917, "epoch": 2480} {"train_loss": -24.877119064331055, "global_step": 205918, "epoch": 2480} {"train_loss": -24.419490814208984, "global_step": 205919, "epoch": 2480} {"train_loss": -24.443580627441406, "global_step": 205920, "epoch": 2480} {"train_loss": -24.21889305114746, "global_step": 205921, "epoch": 2480} {"train_loss": -24.31919867733875, "global_step": 205922, "epoch": 2480, "val_loss": 6551538.0} {"train_loss": -23.932050704956055, "global_step": 205923, "epoch": 2481} {"train_loss": -24.102630615234375, "global_step": 205924, "epoch": 2481} {"train_loss": -23.916217803955078, "global_step": 205925, "epoch": 2481} {"train_loss": -24.070220947265625, "global_step": 205926, "epoch": 2481} {"train_loss": -24.40608024597168, "global_step": 205927, "epoch": 2481} {"train_loss": -23.983957290649414, "global_step": 205928, "epoch": 2481} {"train_loss": -24.013425827026367, "global_step": 205929, "epoch": 2481} {"train_loss": -24.150150299072266, "global_step": 205930, "epoch": 2481} {"train_loss": -24.358356475830078, "global_step": 205931, "epoch": 2481} {"train_loss": -24.214706420898438, "global_step": 205932, "epoch": 2481} {"train_loss": -24.577640533447266, "global_step": 205933, "epoch": 2481} {"train_loss": -24.294479370117188, "global_step": 205934, "epoch": 2481} {"train_loss": -24.459501266479492, "global_step": 205935, "epoch": 2481} {"train_loss": -24.252365112304688, "global_step": 205936, "epoch": 2481} {"train_loss": -24.34613609313965, "global_step": 205937, "epoch": 2481} {"train_loss": -24.399412155151367, "global_step": 205938, "epoch": 2481} {"train_loss": -24.265703201293945, "global_step": 205939, "epoch": 2481} {"train_loss": -24.329456329345703, "global_step": 205940, "epoch": 2481} {"train_loss": -23.984792709350586, "global_step": 205941, "epoch": 2481} {"train_loss": -24.16438102722168, "global_step": 205942, "epoch": 2481} {"train_loss": -24.302570343017578, "global_step": 205943, "epoch": 2481} {"train_loss": -24.561508178710938, "global_step": 205944, "epoch": 2481} {"train_loss": -24.540990829467773, "global_step": 205945, "epoch": 2481} {"train_loss": -24.497915267944336, "global_step": 205946, "epoch": 2481} {"train_loss": -24.53377342224121, "global_step": 205947, "epoch": 2481} {"train_loss": -24.54426383972168, "global_step": 205948, "epoch": 2481} {"train_loss": -24.215028762817383, "global_step": 205949, "epoch": 2481} {"train_loss": -24.305461883544922, "global_step": 205950, "epoch": 2481} {"train_loss": -24.60371208190918, "global_step": 205951, "epoch": 2481} {"train_loss": -24.42037582397461, "global_step": 205952, "epoch": 2481} {"train_loss": -24.521535873413086, "global_step": 205953, "epoch": 2481} {"train_loss": -24.24393653869629, "global_step": 205954, "epoch": 2481} {"train_loss": -24.345333099365234, "global_step": 205955, "epoch": 2481} {"train_loss": -24.24793243408203, "global_step": 205956, "epoch": 2481} {"train_loss": -24.16475486755371, "global_step": 205957, "epoch": 2481} {"train_loss": -24.297401428222656, "global_step": 205958, "epoch": 2481} {"train_loss": -24.667282104492188, "global_step": 205959, "epoch": 2481} {"train_loss": -24.424833297729492, "global_step": 205960, "epoch": 2481} {"train_loss": -24.539968490600586, "global_step": 205961, "epoch": 2481} {"train_loss": -24.921674728393555, "global_step": 205962, "epoch": 2481} {"train_loss": -24.38191795349121, "global_step": 205963, "epoch": 2481} {"train_loss": -24.434280395507812, "global_step": 205964, "epoch": 2481} {"train_loss": -24.47352409362793, "global_step": 205965, "epoch": 2481} {"train_loss": -24.410512924194336, "global_step": 205966, "epoch": 2481} {"train_loss": -24.3145694732666, "global_step": 205967, "epoch": 2481} {"train_loss": -24.61786651611328, "global_step": 205968, "epoch": 2481} {"train_loss": -24.61107063293457, "global_step": 205969, "epoch": 2481} {"train_loss": -24.56207275390625, "global_step": 205970, "epoch": 2481} {"train_loss": -24.611923217773438, "global_step": 205971, "epoch": 2481} {"train_loss": -24.727537155151367, "global_step": 205972, "epoch": 2481} {"train_loss": -24.274459838867188, "global_step": 205973, "epoch": 2481} {"train_loss": -24.423513412475586, "global_step": 205974, "epoch": 2481} {"train_loss": -24.723236083984375, "global_step": 205975, "epoch": 2481} {"train_loss": -24.252685546875, "global_step": 205976, "epoch": 2481} {"train_loss": -24.542476654052734, "global_step": 205977, "epoch": 2481} {"train_loss": -24.74271011352539, "global_step": 205978, "epoch": 2481} {"train_loss": -24.56281280517578, "global_step": 205979, "epoch": 2481} {"train_loss": -24.582063674926758, "global_step": 205980, "epoch": 2481} {"train_loss": -24.47752571105957, "global_step": 205981, "epoch": 2481} {"train_loss": -24.892595291137695, "global_step": 205982, "epoch": 2481} {"train_loss": -24.602680206298828, "global_step": 205983, "epoch": 2481} {"train_loss": -24.585111618041992, "global_step": 205984, "epoch": 2481} {"train_loss": -24.0693359375, "global_step": 205985, "epoch": 2481} {"train_loss": -24.49616813659668, "global_step": 205986, "epoch": 2481} {"train_loss": -24.439878463745117, "global_step": 205987, "epoch": 2481} {"train_loss": -24.32942008972168, "global_step": 205988, "epoch": 2481} {"train_loss": -24.13771629333496, "global_step": 205989, "epoch": 2481} {"train_loss": -24.347143173217773, "global_step": 205990, "epoch": 2481} {"train_loss": -23.469423294067383, "global_step": 205991, "epoch": 2481} {"train_loss": -23.902746200561523, "global_step": 205992, "epoch": 2481} {"train_loss": -24.160526275634766, "global_step": 205993, "epoch": 2481} {"train_loss": -23.742422103881836, "global_step": 205994, "epoch": 2481} {"train_loss": -22.679716110229492, "global_step": 205995, "epoch": 2481} {"train_loss": -23.818952560424805, "global_step": 205996, "epoch": 2481} {"train_loss": -24.35671615600586, "global_step": 205997, "epoch": 2481} {"train_loss": -23.09519386291504, "global_step": 205998, "epoch": 2481} {"train_loss": -23.397111892700195, "global_step": 205999, "epoch": 2481} {"train_loss": -22.854106903076172, "global_step": 206000, "epoch": 2481} {"train_loss": -23.974706649780273, "global_step": 206001, "epoch": 2481} {"train_loss": -23.219724655151367, "global_step": 206002, "epoch": 2481} {"train_loss": -23.93584632873535, "global_step": 206003, "epoch": 2481} {"train_loss": -23.759628295898438, "global_step": 206004, "epoch": 2481} {"train_loss": -24.2527313921825, "global_step": 206005, "epoch": 2481, "val_loss": 6612938.0} {"train_loss": -23.999448776245117, "global_step": 206006, "epoch": 2482} {"train_loss": -23.900997161865234, "global_step": 206007, "epoch": 2482} {"train_loss": -23.94244384765625, "global_step": 206008, "epoch": 2482} {"train_loss": -23.686973571777344, "global_step": 206009, "epoch": 2482} {"train_loss": -23.617883682250977, "global_step": 206010, "epoch": 2482} {"train_loss": -23.601009368896484, "global_step": 206011, "epoch": 2482} {"train_loss": -23.73561668395996, "global_step": 206012, "epoch": 2482} {"train_loss": -23.591888427734375, "global_step": 206013, "epoch": 2482} {"train_loss": -23.893125534057617, "global_step": 206014, "epoch": 2482} {"train_loss": -23.817495346069336, "global_step": 206015, "epoch": 2482} {"train_loss": -24.120412826538086, "global_step": 206016, "epoch": 2482} {"train_loss": -24.020397186279297, "global_step": 206017, "epoch": 2482} {"train_loss": -23.9029598236084, "global_step": 206018, "epoch": 2482} {"train_loss": -24.53120231628418, "global_step": 206019, "epoch": 2482} {"train_loss": -24.143613815307617, "global_step": 206020, "epoch": 2482} {"train_loss": -24.084749221801758, "global_step": 206021, "epoch": 2482} {"train_loss": -24.41152572631836, "global_step": 206022, "epoch": 2482} {"train_loss": -24.26308250427246, "global_step": 206023, "epoch": 2482} {"train_loss": -23.871112823486328, "global_step": 206024, "epoch": 2482} {"train_loss": -24.452693939208984, "global_step": 206025, "epoch": 2482} {"train_loss": -24.012001037597656, "global_step": 206026, "epoch": 2482} {"train_loss": -24.099302291870117, "global_step": 206027, "epoch": 2482} {"train_loss": -24.300748825073242, "global_step": 206028, "epoch": 2482} {"train_loss": -24.29181480407715, "global_step": 206029, "epoch": 2482} {"train_loss": -24.15652847290039, "global_step": 206030, "epoch": 2482} {"train_loss": -24.4033260345459, "global_step": 206031, "epoch": 2482} {"train_loss": -24.061267852783203, "global_step": 206032, "epoch": 2482} {"train_loss": -23.91276741027832, "global_step": 206033, "epoch": 2482} {"train_loss": -24.41364860534668, "global_step": 206034, "epoch": 2482} {"train_loss": -24.132497787475586, "global_step": 206035, "epoch": 2482} {"train_loss": -23.852813720703125, "global_step": 206036, "epoch": 2482} {"train_loss": -24.359901428222656, "global_step": 206037, "epoch": 2482} {"train_loss": -24.39865493774414, "global_step": 206038, "epoch": 2482} {"train_loss": -24.09601402282715, "global_step": 206039, "epoch": 2482} {"train_loss": -24.54475975036621, "global_step": 206040, "epoch": 2482} {"train_loss": -24.465341567993164, "global_step": 206041, "epoch": 2482} {"train_loss": -24.42851448059082, "global_step": 206042, "epoch": 2482} {"train_loss": -24.13515281677246, "global_step": 206043, "epoch": 2482} {"train_loss": -24.398563385009766, "global_step": 206044, "epoch": 2482} {"train_loss": -24.54745864868164, "global_step": 206045, "epoch": 2482} {"train_loss": -24.55805015563965, "global_step": 206046, "epoch": 2482} {"train_loss": -24.359045028686523, "global_step": 206047, "epoch": 2482} {"train_loss": -24.659496307373047, "global_step": 206048, "epoch": 2482} {"train_loss": -24.52729034423828, "global_step": 206049, "epoch": 2482} {"train_loss": -24.717416763305664, "global_step": 206050, "epoch": 2482} {"train_loss": -24.12875747680664, "global_step": 206051, "epoch": 2482} {"train_loss": -24.546396255493164, "global_step": 206052, "epoch": 2482} {"train_loss": -24.599502563476562, "global_step": 206053, "epoch": 2482} {"train_loss": -24.204004287719727, "global_step": 206054, "epoch": 2482} {"train_loss": -24.749479293823242, "global_step": 206055, "epoch": 2482} {"train_loss": -24.70413589477539, "global_step": 206056, "epoch": 2482} {"train_loss": -24.57027244567871, "global_step": 206057, "epoch": 2482} {"train_loss": -24.35689353942871, "global_step": 206058, "epoch": 2482} {"train_loss": -24.327207565307617, "global_step": 206059, "epoch": 2482} {"train_loss": -24.388015747070312, "global_step": 206060, "epoch": 2482} {"train_loss": -24.422529220581055, "global_step": 206061, "epoch": 2482} {"train_loss": -24.375112533569336, "global_step": 206062, "epoch": 2482} {"train_loss": -24.176252365112305, "global_step": 206063, "epoch": 2482} {"train_loss": -24.174795150756836, "global_step": 206064, "epoch": 2482} {"train_loss": -24.32723045349121, "global_step": 206065, "epoch": 2482} {"train_loss": -24.22479248046875, "global_step": 206066, "epoch": 2482} {"train_loss": -24.17356300354004, "global_step": 206067, "epoch": 2482} {"train_loss": -24.304922103881836, "global_step": 206068, "epoch": 2482} {"train_loss": -24.327829360961914, "global_step": 206069, "epoch": 2482} {"train_loss": -24.084226608276367, "global_step": 206070, "epoch": 2482} {"train_loss": -24.217470169067383, "global_step": 206071, "epoch": 2482} {"train_loss": -24.03640365600586, "global_step": 206072, "epoch": 2482} {"train_loss": -24.068803787231445, "global_step": 206073, "epoch": 2482} {"train_loss": -23.735488891601562, "global_step": 206074, "epoch": 2482} {"train_loss": -24.464385986328125, "global_step": 206075, "epoch": 2482} {"train_loss": -24.193143844604492, "global_step": 206076, "epoch": 2482} {"train_loss": -23.986587524414062, "global_step": 206077, "epoch": 2482} {"train_loss": -24.18697166442871, "global_step": 206078, "epoch": 2482} {"train_loss": -24.379375457763672, "global_step": 206079, "epoch": 2482} {"train_loss": -24.436927795410156, "global_step": 206080, "epoch": 2482} {"train_loss": -24.331064224243164, "global_step": 206081, "epoch": 2482} {"train_loss": -24.253250122070312, "global_step": 206082, "epoch": 2482} {"train_loss": -24.400009155273438, "global_step": 206083, "epoch": 2482} {"train_loss": -24.26785659790039, "global_step": 206084, "epoch": 2482} {"train_loss": -24.416141510009766, "global_step": 206085, "epoch": 2482} {"train_loss": -24.169178009033203, "global_step": 206086, "epoch": 2482} {"train_loss": -24.561262130737305, "global_step": 206087, "epoch": 2482} {"train_loss": -24.22041102489793, "global_step": 206088, "epoch": 2482, "val_loss": 6600583.0} {"train_loss": -24.050739288330078, "global_step": 206089, "epoch": 2483} {"train_loss": -24.298816680908203, "global_step": 206090, "epoch": 2483} {"train_loss": -23.392902374267578, "global_step": 206091, "epoch": 2483} {"train_loss": -23.541362762451172, "global_step": 206092, "epoch": 2483} {"train_loss": -23.233327865600586, "global_step": 206093, "epoch": 2483} {"train_loss": -24.09859848022461, "global_step": 206094, "epoch": 2483} {"train_loss": -24.096118927001953, "global_step": 206095, "epoch": 2483} {"train_loss": -23.832050323486328, "global_step": 206096, "epoch": 2483} {"train_loss": -23.896867752075195, "global_step": 206097, "epoch": 2483} {"train_loss": -24.182491302490234, "global_step": 206098, "epoch": 2483} {"train_loss": -23.60031509399414, "global_step": 206099, "epoch": 2483} {"train_loss": -23.993568420410156, "global_step": 206100, "epoch": 2483} {"train_loss": -24.304039001464844, "global_step": 206101, "epoch": 2483} {"train_loss": -24.033178329467773, "global_step": 206102, "epoch": 2483} {"train_loss": -24.608673095703125, "global_step": 206103, "epoch": 2483} {"train_loss": -24.180437088012695, "global_step": 206104, "epoch": 2483} {"train_loss": -24.26251220703125, "global_step": 206105, "epoch": 2483} {"train_loss": -24.117633819580078, "global_step": 206106, "epoch": 2483} {"train_loss": -24.20310401916504, "global_step": 206107, "epoch": 2483} {"train_loss": -24.437131881713867, "global_step": 206108, "epoch": 2483} {"train_loss": -24.026498794555664, "global_step": 206109, "epoch": 2483} {"train_loss": -24.076440811157227, "global_step": 206110, "epoch": 2483} {"train_loss": -24.136571884155273, "global_step": 206111, "epoch": 2483} {"train_loss": -23.875314712524414, "global_step": 206112, "epoch": 2483} {"train_loss": -24.159509658813477, "global_step": 206113, "epoch": 2483} {"train_loss": -24.225513458251953, "global_step": 206114, "epoch": 2483} {"train_loss": -24.44098472595215, "global_step": 206115, "epoch": 2483} {"train_loss": -24.309736251831055, "global_step": 206116, "epoch": 2483} {"train_loss": -24.119766235351562, "global_step": 206117, "epoch": 2483} {"train_loss": -24.252500534057617, "global_step": 206118, "epoch": 2483} {"train_loss": -24.607603073120117, "global_step": 206119, "epoch": 2483} {"train_loss": -24.02358055114746, "global_step": 206120, "epoch": 2483} {"train_loss": -24.292325973510742, "global_step": 206121, "epoch": 2483} {"train_loss": -24.38154411315918, "global_step": 206122, "epoch": 2483} {"train_loss": -24.4455623626709, "global_step": 206123, "epoch": 2483} {"train_loss": -24.30862045288086, "global_step": 206124, "epoch": 2483} {"train_loss": -24.280912399291992, "global_step": 206125, "epoch": 2483} {"train_loss": -24.02774429321289, "global_step": 206126, "epoch": 2483} {"train_loss": -24.22495460510254, "global_step": 206127, "epoch": 2483} {"train_loss": -23.989049911499023, "global_step": 206128, "epoch": 2483} {"train_loss": -24.43528175354004, "global_step": 206129, "epoch": 2483} {"train_loss": -24.145742416381836, "global_step": 206130, "epoch": 2483} {"train_loss": -24.47947883605957, "global_step": 206131, "epoch": 2483} {"train_loss": -24.142568588256836, "global_step": 206132, "epoch": 2483} {"train_loss": -23.906177520751953, "global_step": 206133, "epoch": 2483} {"train_loss": -24.04994773864746, "global_step": 206134, "epoch": 2483} {"train_loss": -24.460615158081055, "global_step": 206135, "epoch": 2483} {"train_loss": -24.334577560424805, "global_step": 206136, "epoch": 2483} {"train_loss": -24.47150230407715, "global_step": 206137, "epoch": 2483} {"train_loss": -24.320219039916992, "global_step": 206138, "epoch": 2483} {"train_loss": -24.278852462768555, "global_step": 206139, "epoch": 2483} {"train_loss": -24.157169342041016, "global_step": 206140, "epoch": 2483} {"train_loss": -24.13072967529297, "global_step": 206141, "epoch": 2483} {"train_loss": -24.365680694580078, "global_step": 206142, "epoch": 2483} {"train_loss": -24.369855880737305, "global_step": 206143, "epoch": 2483} {"train_loss": -24.27655601501465, "global_step": 206144, "epoch": 2483} {"train_loss": -24.287240982055664, "global_step": 206145, "epoch": 2483} {"train_loss": -24.4536075592041, "global_step": 206146, "epoch": 2483} {"train_loss": -24.554636001586914, "global_step": 206147, "epoch": 2483} {"train_loss": -24.42355728149414, "global_step": 206148, "epoch": 2483} {"train_loss": -24.769189834594727, "global_step": 206149, "epoch": 2483} {"train_loss": -24.368431091308594, "global_step": 206150, "epoch": 2483} {"train_loss": -24.445283889770508, "global_step": 206151, "epoch": 2483} {"train_loss": -24.73297691345215, "global_step": 206152, "epoch": 2483} {"train_loss": -24.498966217041016, "global_step": 206153, "epoch": 2483} {"train_loss": -24.494382858276367, "global_step": 206154, "epoch": 2483} {"train_loss": -24.70992088317871, "global_step": 206155, "epoch": 2483} {"train_loss": -25.00027084350586, "global_step": 206156, "epoch": 2483} {"train_loss": -24.43446922302246, "global_step": 206157, "epoch": 2483} {"train_loss": -24.367040634155273, "global_step": 206158, "epoch": 2483} {"train_loss": -24.3087215423584, "global_step": 206159, "epoch": 2483} {"train_loss": -24.087575912475586, "global_step": 206160, "epoch": 2483} {"train_loss": -24.546934127807617, "global_step": 206161, "epoch": 2483} {"train_loss": -24.164356231689453, "global_step": 206162, "epoch": 2483} {"train_loss": -24.421451568603516, "global_step": 206163, "epoch": 2483} {"train_loss": -24.177854537963867, "global_step": 206164, "epoch": 2483} {"train_loss": -24.343616485595703, "global_step": 206165, "epoch": 2483} {"train_loss": -24.594528198242188, "global_step": 206166, "epoch": 2483} {"train_loss": -24.444194793701172, "global_step": 206167, "epoch": 2483} {"train_loss": -24.384450912475586, "global_step": 206168, "epoch": 2483} {"train_loss": -24.32080078125, "global_step": 206169, "epoch": 2483} {"train_loss": -24.398786544799805, "global_step": 206170, "epoch": 2483} {"train_loss": -24.26585034289992, "global_step": 206171, "epoch": 2483, "val_loss": 6610624.5} {"train_loss": -24.049713134765625, "global_step": 206172, "epoch": 2484} {"train_loss": -24.067852020263672, "global_step": 206173, "epoch": 2484} {"train_loss": -24.156892776489258, "global_step": 206174, "epoch": 2484} {"train_loss": -23.79203224182129, "global_step": 206175, "epoch": 2484} {"train_loss": -24.147464752197266, "global_step": 206176, "epoch": 2484} {"train_loss": -24.336942672729492, "global_step": 206177, "epoch": 2484} {"train_loss": -24.532522201538086, "global_step": 206178, "epoch": 2484} {"train_loss": -24.390878677368164, "global_step": 206179, "epoch": 2484} {"train_loss": -24.246353149414062, "global_step": 206180, "epoch": 2484} {"train_loss": -23.930768966674805, "global_step": 206181, "epoch": 2484} {"train_loss": -24.048280715942383, "global_step": 206182, "epoch": 2484} {"train_loss": -24.117433547973633, "global_step": 206183, "epoch": 2484} {"train_loss": -24.459516525268555, "global_step": 206184, "epoch": 2484} {"train_loss": -24.228748321533203, "global_step": 206185, "epoch": 2484} {"train_loss": -24.228900909423828, "global_step": 206186, "epoch": 2484} {"train_loss": -24.645389556884766, "global_step": 206187, "epoch": 2484} {"train_loss": -23.992263793945312, "global_step": 206188, "epoch": 2484} {"train_loss": -24.299457550048828, "global_step": 206189, "epoch": 2484} {"train_loss": -24.30498695373535, "global_step": 206190, "epoch": 2484} {"train_loss": -24.01617431640625, "global_step": 206191, "epoch": 2484} {"train_loss": -24.472074508666992, "global_step": 206192, "epoch": 2484} {"train_loss": -24.293415069580078, "global_step": 206193, "epoch": 2484} {"train_loss": -24.45525550842285, "global_step": 206194, "epoch": 2484} {"train_loss": -23.609888076782227, "global_step": 206195, "epoch": 2484} {"train_loss": -24.307342529296875, "global_step": 206196, "epoch": 2484} {"train_loss": -24.168596267700195, "global_step": 206197, "epoch": 2484} {"train_loss": -23.961750030517578, "global_step": 206198, "epoch": 2484} {"train_loss": -24.346948623657227, "global_step": 206199, "epoch": 2484} {"train_loss": -24.47202491760254, "global_step": 206200, "epoch": 2484} {"train_loss": -24.470932006835938, "global_step": 206201, "epoch": 2484} {"train_loss": -24.678495407104492, "global_step": 206202, "epoch": 2484} {"train_loss": -24.353103637695312, "global_step": 206203, "epoch": 2484} {"train_loss": -24.36057472229004, "global_step": 206204, "epoch": 2484} {"train_loss": -24.531484603881836, "global_step": 206205, "epoch": 2484} {"train_loss": -24.32008934020996, "global_step": 206206, "epoch": 2484} {"train_loss": -24.314462661743164, "global_step": 206207, "epoch": 2484} {"train_loss": -24.150646209716797, "global_step": 206208, "epoch": 2484} {"train_loss": -24.73065757751465, "global_step": 206209, "epoch": 2484} {"train_loss": -24.615039825439453, "global_step": 206210, "epoch": 2484} {"train_loss": -24.454669952392578, "global_step": 206211, "epoch": 2484} {"train_loss": -24.386693954467773, "global_step": 206212, "epoch": 2484} {"train_loss": -24.490386962890625, "global_step": 206213, "epoch": 2484} {"train_loss": -24.362329483032227, "global_step": 206214, "epoch": 2484} {"train_loss": -24.28334617614746, "global_step": 206215, "epoch": 2484} {"train_loss": -24.62691879272461, "global_step": 206216, "epoch": 2484} {"train_loss": -24.746498107910156, "global_step": 206217, "epoch": 2484} {"train_loss": -24.429073333740234, "global_step": 206218, "epoch": 2484} {"train_loss": -24.48257827758789, "global_step": 206219, "epoch": 2484} {"train_loss": -24.202537536621094, "global_step": 206220, "epoch": 2484} {"train_loss": -24.300092697143555, "global_step": 206221, "epoch": 2484} {"train_loss": -24.20442008972168, "global_step": 206222, "epoch": 2484} {"train_loss": -24.42414665222168, "global_step": 206223, "epoch": 2484} {"train_loss": -24.430410385131836, "global_step": 206224, "epoch": 2484} {"train_loss": -24.263660430908203, "global_step": 206225, "epoch": 2484} {"train_loss": -24.552762985229492, "global_step": 206226, "epoch": 2484} {"train_loss": -24.18655776977539, "global_step": 206227, "epoch": 2484} {"train_loss": -23.95676612854004, "global_step": 206228, "epoch": 2484} {"train_loss": -23.91538429260254, "global_step": 206229, "epoch": 2484} {"train_loss": -24.17249870300293, "global_step": 206230, "epoch": 2484} {"train_loss": -24.41644859313965, "global_step": 206231, "epoch": 2484} {"train_loss": -24.58079719543457, "global_step": 206232, "epoch": 2484} {"train_loss": -24.231422424316406, "global_step": 206233, "epoch": 2484} {"train_loss": -24.307077407836914, "global_step": 206234, "epoch": 2484} {"train_loss": -24.225570678710938, "global_step": 206235, "epoch": 2484} {"train_loss": -24.30647087097168, "global_step": 206236, "epoch": 2484} {"train_loss": -24.007936477661133, "global_step": 206237, "epoch": 2484} {"train_loss": -24.33168601989746, "global_step": 206238, "epoch": 2484} {"train_loss": -24.159584045410156, "global_step": 206239, "epoch": 2484} {"train_loss": -23.89133071899414, "global_step": 206240, "epoch": 2484} {"train_loss": -23.947940826416016, "global_step": 206241, "epoch": 2484} {"train_loss": -24.17151641845703, "global_step": 206242, "epoch": 2484} {"train_loss": -24.28437042236328, "global_step": 206243, "epoch": 2484} {"train_loss": -24.251617431640625, "global_step": 206244, "epoch": 2484} {"train_loss": -23.982206344604492, "global_step": 206245, "epoch": 2484} {"train_loss": -24.45806312561035, "global_step": 206246, "epoch": 2484} {"train_loss": -24.31416130065918, "global_step": 206247, "epoch": 2484} {"train_loss": -24.37109375, "global_step": 206248, "epoch": 2484} {"train_loss": -24.088857650756836, "global_step": 206249, "epoch": 2484} {"train_loss": -24.48171043395996, "global_step": 206250, "epoch": 2484} {"train_loss": -24.351530075073242, "global_step": 206251, "epoch": 2484} {"train_loss": -24.4168758392334, "global_step": 206252, "epoch": 2484} {"train_loss": -24.364599227905273, "global_step": 206253, "epoch": 2484} {"train_loss": -24.292469553200597, "global_step": 206254, "epoch": 2484, "val_loss": 6720922.5} {"train_loss": -24.07350730895996, "global_step": 206255, "epoch": 2485} {"train_loss": -24.49475860595703, "global_step": 206256, "epoch": 2485} {"train_loss": -24.35609245300293, "global_step": 206257, "epoch": 2485} {"train_loss": -24.18113136291504, "global_step": 206258, "epoch": 2485} {"train_loss": -24.141387939453125, "global_step": 206259, "epoch": 2485} {"train_loss": -24.206785202026367, "global_step": 206260, "epoch": 2485} {"train_loss": -24.06201171875, "global_step": 206261, "epoch": 2485} {"train_loss": -24.27973747253418, "global_step": 206262, "epoch": 2485} {"train_loss": -24.51504898071289, "global_step": 206263, "epoch": 2485} {"train_loss": -24.224485397338867, "global_step": 206264, "epoch": 2485} {"train_loss": -24.027494430541992, "global_step": 206265, "epoch": 2485} {"train_loss": -24.129426956176758, "global_step": 206266, "epoch": 2485} {"train_loss": -24.303512573242188, "global_step": 206267, "epoch": 2485} {"train_loss": -24.457448959350586, "global_step": 206268, "epoch": 2485} {"train_loss": -24.36931800842285, "global_step": 206269, "epoch": 2485} {"train_loss": -24.148324966430664, "global_step": 206270, "epoch": 2485} {"train_loss": -24.317951202392578, "global_step": 206271, "epoch": 2485} {"train_loss": -24.276792526245117, "global_step": 206272, "epoch": 2485} {"train_loss": -24.448741912841797, "global_step": 206273, "epoch": 2485} {"train_loss": -24.672279357910156, "global_step": 206274, "epoch": 2485} {"train_loss": -24.136526107788086, "global_step": 206275, "epoch": 2485} {"train_loss": -24.129520416259766, "global_step": 206276, "epoch": 2485} {"train_loss": -24.34912872314453, "global_step": 206277, "epoch": 2485} {"train_loss": -24.456449508666992, "global_step": 206278, "epoch": 2485} {"train_loss": -24.32209587097168, "global_step": 206279, "epoch": 2485} {"train_loss": -23.855667114257812, "global_step": 206280, "epoch": 2485} {"train_loss": -24.322668075561523, "global_step": 206281, "epoch": 2485} {"train_loss": -24.558446884155273, "global_step": 206282, "epoch": 2485} {"train_loss": -24.263111114501953, "global_step": 206283, "epoch": 2485} {"train_loss": -24.3093204498291, "global_step": 206284, "epoch": 2485} {"train_loss": -24.470746994018555, "global_step": 206285, "epoch": 2485} {"train_loss": -24.747116088867188, "global_step": 206286, "epoch": 2485} {"train_loss": -24.263757705688477, "global_step": 206287, "epoch": 2485} {"train_loss": -24.642471313476562, "global_step": 206288, "epoch": 2485} {"train_loss": -24.061925888061523, "global_step": 206289, "epoch": 2485} {"train_loss": -24.489456176757812, "global_step": 206290, "epoch": 2485} {"train_loss": -24.447803497314453, "global_step": 206291, "epoch": 2485} {"train_loss": -24.329418182373047, "global_step": 206292, "epoch": 2485} {"train_loss": -24.58021354675293, "global_step": 206293, "epoch": 2485} {"train_loss": -24.180561065673828, "global_step": 206294, "epoch": 2485} {"train_loss": -23.966779708862305, "global_step": 206295, "epoch": 2485} {"train_loss": -24.695417404174805, "global_step": 206296, "epoch": 2485} {"train_loss": -24.487695693969727, "global_step": 206297, "epoch": 2485} {"train_loss": -24.596723556518555, "global_step": 206298, "epoch": 2485} {"train_loss": -24.20369529724121, "global_step": 206299, "epoch": 2485} {"train_loss": -24.543643951416016, "global_step": 206300, "epoch": 2485} {"train_loss": -24.69253921508789, "global_step": 206301, "epoch": 2485} {"train_loss": -24.42486000061035, "global_step": 206302, "epoch": 2485} {"train_loss": -23.951425552368164, "global_step": 206303, "epoch": 2485} {"train_loss": -24.296945571899414, "global_step": 206304, "epoch": 2485} {"train_loss": -24.41489601135254, "global_step": 206305, "epoch": 2485} {"train_loss": -23.958194732666016, "global_step": 206306, "epoch": 2485} {"train_loss": -24.501468658447266, "global_step": 206307, "epoch": 2485} {"train_loss": -24.084402084350586, "global_step": 206308, "epoch": 2485} {"train_loss": -24.369064331054688, "global_step": 206309, "epoch": 2485} {"train_loss": -24.305694580078125, "global_step": 206310, "epoch": 2485} {"train_loss": -24.74371337890625, "global_step": 206311, "epoch": 2485} {"train_loss": -24.11604118347168, "global_step": 206312, "epoch": 2485} {"train_loss": -24.26297950744629, "global_step": 206313, "epoch": 2485} {"train_loss": -24.351850509643555, "global_step": 206314, "epoch": 2485} {"train_loss": -24.223852157592773, "global_step": 206315, "epoch": 2485} {"train_loss": -24.500476837158203, "global_step": 206316, "epoch": 2485} {"train_loss": -24.386606216430664, "global_step": 206317, "epoch": 2485} {"train_loss": -24.47074317932129, "global_step": 206318, "epoch": 2485} {"train_loss": -24.77085304260254, "global_step": 206319, "epoch": 2485} {"train_loss": -24.182077407836914, "global_step": 206320, "epoch": 2485} {"train_loss": -24.354236602783203, "global_step": 206321, "epoch": 2485} {"train_loss": -24.193191528320312, "global_step": 206322, "epoch": 2485} {"train_loss": -24.550846099853516, "global_step": 206323, "epoch": 2485} {"train_loss": -24.597692489624023, "global_step": 206324, "epoch": 2485} {"train_loss": -24.38191795349121, "global_step": 206325, "epoch": 2485} {"train_loss": -24.436588287353516, "global_step": 206326, "epoch": 2485} {"train_loss": -24.450172424316406, "global_step": 206327, "epoch": 2485} {"train_loss": -24.536483764648438, "global_step": 206328, "epoch": 2485} {"train_loss": -24.27669334411621, "global_step": 206329, "epoch": 2485} {"train_loss": -24.33066749572754, "global_step": 206330, "epoch": 2485} {"train_loss": -24.094921112060547, "global_step": 206331, "epoch": 2485} {"train_loss": -24.480911254882812, "global_step": 206332, "epoch": 2485} {"train_loss": -24.00284767150879, "global_step": 206333, "epoch": 2485} {"train_loss": -24.24717140197754, "global_step": 206334, "epoch": 2485} {"train_loss": -24.67526626586914, "global_step": 206335, "epoch": 2485} {"train_loss": -24.345462799072266, "global_step": 206336, "epoch": 2485} {"train_loss": -24.32675563858216, "global_step": 206337, "epoch": 2485, "val_loss": 6630605.0} {"train_loss": -23.691659927368164, "global_step": 206338, "epoch": 2486} {"train_loss": -23.31201171875, "global_step": 206339, "epoch": 2486} {"train_loss": -23.73585319519043, "global_step": 206340, "epoch": 2486} {"train_loss": -23.563024520874023, "global_step": 206341, "epoch": 2486} {"train_loss": -23.679471969604492, "global_step": 206342, "epoch": 2486} {"train_loss": -23.434106826782227, "global_step": 206343, "epoch": 2486} {"train_loss": -23.85454559326172, "global_step": 206344, "epoch": 2486} {"train_loss": -24.07562828063965, "global_step": 206345, "epoch": 2486} {"train_loss": -23.89578628540039, "global_step": 206346, "epoch": 2486} {"train_loss": -23.63561248779297, "global_step": 206347, "epoch": 2486} {"train_loss": -24.072738647460938, "global_step": 206348, "epoch": 2486} {"train_loss": -23.918060302734375, "global_step": 206349, "epoch": 2486} {"train_loss": -24.106611251831055, "global_step": 206350, "epoch": 2486} {"train_loss": -24.001367568969727, "global_step": 206351, "epoch": 2486} {"train_loss": -24.17241859436035, "global_step": 206352, "epoch": 2486} {"train_loss": -24.41463279724121, "global_step": 206353, "epoch": 2486} {"train_loss": -23.88478660583496, "global_step": 206354, "epoch": 2486} {"train_loss": -23.98811912536621, "global_step": 206355, "epoch": 2486} {"train_loss": -24.03285026550293, "global_step": 206356, "epoch": 2486} {"train_loss": -23.828739166259766, "global_step": 206357, "epoch": 2486} {"train_loss": -24.21488380432129, "global_step": 206358, "epoch": 2486} {"train_loss": -24.234493255615234, "global_step": 206359, "epoch": 2486} {"train_loss": -24.177581787109375, "global_step": 206360, "epoch": 2486} {"train_loss": -24.31993293762207, "global_step": 206361, "epoch": 2486} {"train_loss": -24.001541137695312, "global_step": 206362, "epoch": 2486} {"train_loss": -24.39810562133789, "global_step": 206363, "epoch": 2486} {"train_loss": -24.47427749633789, "global_step": 206364, "epoch": 2486} {"train_loss": -24.68752098083496, "global_step": 206365, "epoch": 2486} {"train_loss": -24.39457130432129, "global_step": 206366, "epoch": 2486} {"train_loss": -24.239709854125977, "global_step": 206367, "epoch": 2486} {"train_loss": -24.08015251159668, "global_step": 206368, "epoch": 2486} {"train_loss": -24.492277145385742, "global_step": 206369, "epoch": 2486} {"train_loss": -24.41358757019043, "global_step": 206370, "epoch": 2486} {"train_loss": -24.252288818359375, "global_step": 206371, "epoch": 2486} {"train_loss": -24.29953956604004, "global_step": 206372, "epoch": 2486} {"train_loss": -24.26250648498535, "global_step": 206373, "epoch": 2486} {"train_loss": -24.455495834350586, "global_step": 206374, "epoch": 2486} {"train_loss": -24.79762840270996, "global_step": 206375, "epoch": 2486} {"train_loss": -24.218090057373047, "global_step": 206376, "epoch": 2486} {"train_loss": -24.44740104675293, "global_step": 206377, "epoch": 2486} {"train_loss": -24.26221466064453, "global_step": 206378, "epoch": 2486} {"train_loss": -24.042829513549805, "global_step": 206379, "epoch": 2486} {"train_loss": -24.36529541015625, "global_step": 206380, "epoch": 2486} {"train_loss": -24.248497009277344, "global_step": 206381, "epoch": 2486} {"train_loss": -24.52334976196289, "global_step": 206382, "epoch": 2486} {"train_loss": -24.468158721923828, "global_step": 206383, "epoch": 2486} {"train_loss": -24.341039657592773, "global_step": 206384, "epoch": 2486} {"train_loss": -24.1480770111084, "global_step": 206385, "epoch": 2486} {"train_loss": -24.307836532592773, "global_step": 206386, "epoch": 2486} {"train_loss": -24.21962547302246, "global_step": 206387, "epoch": 2486} {"train_loss": -24.743000030517578, "global_step": 206388, "epoch": 2486} {"train_loss": -24.352209091186523, "global_step": 206389, "epoch": 2486} {"train_loss": -24.25832176208496, "global_step": 206390, "epoch": 2486} {"train_loss": -24.675006866455078, "global_step": 206391, "epoch": 2486} {"train_loss": -24.55086326599121, "global_step": 206392, "epoch": 2486} {"train_loss": -24.4768009185791, "global_step": 206393, "epoch": 2486} {"train_loss": -24.327163696289062, "global_step": 206394, "epoch": 2486} {"train_loss": -24.498140335083008, "global_step": 206395, "epoch": 2486} {"train_loss": -24.31634521484375, "global_step": 206396, "epoch": 2486} {"train_loss": -24.3808536529541, "global_step": 206397, "epoch": 2486} {"train_loss": -24.524892807006836, "global_step": 206398, "epoch": 2486} {"train_loss": -24.272079467773438, "global_step": 206399, "epoch": 2486} {"train_loss": -24.417007446289062, "global_step": 206400, "epoch": 2486} {"train_loss": -24.462833404541016, "global_step": 206401, "epoch": 2486} {"train_loss": -24.5380916595459, "global_step": 206402, "epoch": 2486} {"train_loss": -24.457048416137695, "global_step": 206403, "epoch": 2486} {"train_loss": -24.28916358947754, "global_step": 206404, "epoch": 2486} {"train_loss": -24.234006881713867, "global_step": 206405, "epoch": 2486} {"train_loss": -24.14994239807129, "global_step": 206406, "epoch": 2486} {"train_loss": -24.005475997924805, "global_step": 206407, "epoch": 2486} {"train_loss": -24.403629302978516, "global_step": 206408, "epoch": 2486} {"train_loss": -24.413249969482422, "global_step": 206409, "epoch": 2486} {"train_loss": -24.592893600463867, "global_step": 206410, "epoch": 2486} {"train_loss": -24.512508392333984, "global_step": 206411, "epoch": 2486} {"train_loss": -24.697803497314453, "global_step": 206412, "epoch": 2486} {"train_loss": -24.619787216186523, "global_step": 206413, "epoch": 2486} {"train_loss": -24.627527236938477, "global_step": 206414, "epoch": 2486} {"train_loss": -24.446224212646484, "global_step": 206415, "epoch": 2486} {"train_loss": -24.27532958984375, "global_step": 206416, "epoch": 2486} {"train_loss": -24.526853561401367, "global_step": 206417, "epoch": 2486} {"train_loss": -24.453336715698242, "global_step": 206418, "epoch": 2486} {"train_loss": -24.46756362915039, "global_step": 206419, "epoch": 2486} {"train_loss": -24.239324523741942, "global_step": 206420, "epoch": 2486, "val_loss": 6676732.0} {"train_loss": -21.58820152282715, "global_step": 206421, "epoch": 2487} {"train_loss": -22.30960464477539, "global_step": 206422, "epoch": 2487} {"train_loss": -22.945884704589844, "global_step": 206423, "epoch": 2487} {"train_loss": -23.045164108276367, "global_step": 206424, "epoch": 2487} {"train_loss": -22.778728485107422, "global_step": 206425, "epoch": 2487} {"train_loss": -23.37013053894043, "global_step": 206426, "epoch": 2487} {"train_loss": -22.912015914916992, "global_step": 206427, "epoch": 2487} {"train_loss": -23.366451263427734, "global_step": 206428, "epoch": 2487} {"train_loss": -23.29256248474121, "global_step": 206429, "epoch": 2487} {"train_loss": -23.344717025756836, "global_step": 206430, "epoch": 2487} {"train_loss": -23.737585067749023, "global_step": 206431, "epoch": 2487} {"train_loss": -23.833297729492188, "global_step": 206432, "epoch": 2487} {"train_loss": -23.50723648071289, "global_step": 206433, "epoch": 2487} {"train_loss": -23.692428588867188, "global_step": 206434, "epoch": 2487} {"train_loss": -23.466459274291992, "global_step": 206435, "epoch": 2487} {"train_loss": -23.43195915222168, "global_step": 206436, "epoch": 2487} {"train_loss": -23.868425369262695, "global_step": 206437, "epoch": 2487} {"train_loss": -23.737241744995117, "global_step": 206438, "epoch": 2487} {"train_loss": -23.525177001953125, "global_step": 206439, "epoch": 2487} {"train_loss": -24.04085350036621, "global_step": 206440, "epoch": 2487} {"train_loss": -23.82619857788086, "global_step": 206441, "epoch": 2487} {"train_loss": -24.052778244018555, "global_step": 206442, "epoch": 2487} {"train_loss": -24.010696411132812, "global_step": 206443, "epoch": 2487} {"train_loss": -23.630586624145508, "global_step": 206444, "epoch": 2487} {"train_loss": -23.86094093322754, "global_step": 206445, "epoch": 2487} {"train_loss": -23.919675827026367, "global_step": 206446, "epoch": 2487} {"train_loss": -23.81233787536621, "global_step": 206447, "epoch": 2487} {"train_loss": -24.290205001831055, "global_step": 206448, "epoch": 2487} {"train_loss": -23.778335571289062, "global_step": 206449, "epoch": 2487} {"train_loss": -24.21257972717285, "global_step": 206450, "epoch": 2487} {"train_loss": -24.23662757873535, "global_step": 206451, "epoch": 2487} {"train_loss": -24.464664459228516, "global_step": 206452, "epoch": 2487} {"train_loss": -24.092100143432617, "global_step": 206453, "epoch": 2487} {"train_loss": -24.021686553955078, "global_step": 206454, "epoch": 2487} {"train_loss": -24.123685836791992, "global_step": 206455, "epoch": 2487} {"train_loss": -24.387788772583008, "global_step": 206456, "epoch": 2487} {"train_loss": -24.352981567382812, "global_step": 206457, "epoch": 2487} {"train_loss": -24.460176467895508, "global_step": 206458, "epoch": 2487} {"train_loss": -24.59881591796875, "global_step": 206459, "epoch": 2487} {"train_loss": -24.28451919555664, "global_step": 206460, "epoch": 2487} {"train_loss": -24.31570816040039, "global_step": 206461, "epoch": 2487} {"train_loss": -24.339828491210938, "global_step": 206462, "epoch": 2487} {"train_loss": -24.30415153503418, "global_step": 206463, "epoch": 2487} {"train_loss": -24.402557373046875, "global_step": 206464, "epoch": 2487} {"train_loss": -24.18695831298828, "global_step": 206465, "epoch": 2487} {"train_loss": -24.158201217651367, "global_step": 206466, "epoch": 2487} {"train_loss": -24.537139892578125, "global_step": 206467, "epoch": 2487} {"train_loss": -24.732288360595703, "global_step": 206468, "epoch": 2487} {"train_loss": -24.25927734375, "global_step": 206469, "epoch": 2487} {"train_loss": -24.579683303833008, "global_step": 206470, "epoch": 2487} {"train_loss": -24.647239685058594, "global_step": 206471, "epoch": 2487} {"train_loss": -24.2431640625, "global_step": 206472, "epoch": 2487} {"train_loss": -24.653690338134766, "global_step": 206473, "epoch": 2487} {"train_loss": -24.641672134399414, "global_step": 206474, "epoch": 2487} {"train_loss": -24.12881851196289, "global_step": 206475, "epoch": 2487} {"train_loss": -24.342273712158203, "global_step": 206476, "epoch": 2487} {"train_loss": -24.535526275634766, "global_step": 206477, "epoch": 2487} {"train_loss": -24.028409957885742, "global_step": 206478, "epoch": 2487} {"train_loss": -24.337482452392578, "global_step": 206479, "epoch": 2487} {"train_loss": -24.574813842773438, "global_step": 206480, "epoch": 2487} {"train_loss": -24.506540298461914, "global_step": 206481, "epoch": 2487} {"train_loss": -24.153844833374023, "global_step": 206482, "epoch": 2487} {"train_loss": -24.58103370666504, "global_step": 206483, "epoch": 2487} {"train_loss": -24.491220474243164, "global_step": 206484, "epoch": 2487} {"train_loss": -24.165695190429688, "global_step": 206485, "epoch": 2487} {"train_loss": -24.17943572998047, "global_step": 206486, "epoch": 2487} {"train_loss": -24.354612350463867, "global_step": 206487, "epoch": 2487} {"train_loss": -24.24226951599121, "global_step": 206488, "epoch": 2487} {"train_loss": -24.3988094329834, "global_step": 206489, "epoch": 2487} {"train_loss": -24.43022918701172, "global_step": 206490, "epoch": 2487} {"train_loss": -24.3432559967041, "global_step": 206491, "epoch": 2487} {"train_loss": -24.6109676361084, "global_step": 206492, "epoch": 2487} {"train_loss": -24.460811614990234, "global_step": 206493, "epoch": 2487} {"train_loss": -24.169099807739258, "global_step": 206494, "epoch": 2487} {"train_loss": -24.261869430541992, "global_step": 206495, "epoch": 2487} {"train_loss": -23.862396240234375, "global_step": 206496, "epoch": 2487} {"train_loss": -23.891315460205078, "global_step": 206497, "epoch": 2487} {"train_loss": -24.20472526550293, "global_step": 206498, "epoch": 2487} {"train_loss": -24.362348556518555, "global_step": 206499, "epoch": 2487} {"train_loss": -24.355270385742188, "global_step": 206500, "epoch": 2487} {"train_loss": -24.132495880126953, "global_step": 206501, "epoch": 2487} {"train_loss": -24.36183738708496, "global_step": 206502, "epoch": 2487} {"train_loss": -24.035860544227692, "global_step": 206503, "epoch": 2487, "val_loss": 6666985.0} {"train_loss": -24.02712059020996, "global_step": 206504, "epoch": 2488} {"train_loss": -24.124509811401367, "global_step": 206505, "epoch": 2488} {"train_loss": -23.960002899169922, "global_step": 206506, "epoch": 2488} {"train_loss": -24.221920013427734, "global_step": 206507, "epoch": 2488} {"train_loss": -24.41607093811035, "global_step": 206508, "epoch": 2488} {"train_loss": -24.220190048217773, "global_step": 206509, "epoch": 2488} {"train_loss": -24.004901885986328, "global_step": 206510, "epoch": 2488} {"train_loss": -24.201751708984375, "global_step": 206511, "epoch": 2488} {"train_loss": -24.370885848999023, "global_step": 206512, "epoch": 2488} {"train_loss": -23.934213638305664, "global_step": 206513, "epoch": 2488} {"train_loss": -24.29779815673828, "global_step": 206514, "epoch": 2488} {"train_loss": -23.928110122680664, "global_step": 206515, "epoch": 2488} {"train_loss": -23.857746124267578, "global_step": 206516, "epoch": 2488} {"train_loss": -23.926156997680664, "global_step": 206517, "epoch": 2488} {"train_loss": -24.236146926879883, "global_step": 206518, "epoch": 2488} {"train_loss": -24.223325729370117, "global_step": 206519, "epoch": 2488} {"train_loss": -24.412565231323242, "global_step": 206520, "epoch": 2488} {"train_loss": -23.88916015625, "global_step": 206521, "epoch": 2488} {"train_loss": -24.392080307006836, "global_step": 206522, "epoch": 2488} {"train_loss": -24.317535400390625, "global_step": 206523, "epoch": 2488} {"train_loss": -24.391143798828125, "global_step": 206524, "epoch": 2488} {"train_loss": -24.45329475402832, "global_step": 206525, "epoch": 2488} {"train_loss": -24.479875564575195, "global_step": 206526, "epoch": 2488} {"train_loss": -24.334882736206055, "global_step": 206527, "epoch": 2488} {"train_loss": -24.661773681640625, "global_step": 206528, "epoch": 2488} {"train_loss": -24.18458366394043, "global_step": 206529, "epoch": 2488} {"train_loss": -24.476707458496094, "global_step": 206530, "epoch": 2488} {"train_loss": -24.277450561523438, "global_step": 206531, "epoch": 2488} {"train_loss": -24.20209312438965, "global_step": 206532, "epoch": 2488} {"train_loss": -24.423599243164062, "global_step": 206533, "epoch": 2488} {"train_loss": -24.5518856048584, "global_step": 206534, "epoch": 2488} {"train_loss": -24.538978576660156, "global_step": 206535, "epoch": 2488} {"train_loss": -24.79029655456543, "global_step": 206536, "epoch": 2488} {"train_loss": -24.809194564819336, "global_step": 206537, "epoch": 2488} {"train_loss": -24.569599151611328, "global_step": 206538, "epoch": 2488} {"train_loss": -24.79009246826172, "global_step": 206539, "epoch": 2488} {"train_loss": -24.055652618408203, "global_step": 206540, "epoch": 2488} {"train_loss": -24.608556747436523, "global_step": 206541, "epoch": 2488} {"train_loss": -24.45302391052246, "global_step": 206542, "epoch": 2488} {"train_loss": -24.58595085144043, "global_step": 206543, "epoch": 2488} {"train_loss": -24.283798217773438, "global_step": 206544, "epoch": 2488} {"train_loss": -24.406574249267578, "global_step": 206545, "epoch": 2488} {"train_loss": -24.658924102783203, "global_step": 206546, "epoch": 2488} {"train_loss": -24.26633071899414, "global_step": 206547, "epoch": 2488} {"train_loss": -24.557607650756836, "global_step": 206548, "epoch": 2488} {"train_loss": -24.149572372436523, "global_step": 206549, "epoch": 2488} {"train_loss": -24.480236053466797, "global_step": 206550, "epoch": 2488} {"train_loss": -24.43768310546875, "global_step": 206551, "epoch": 2488} {"train_loss": -24.473922729492188, "global_step": 206552, "epoch": 2488} {"train_loss": -24.650182723999023, "global_step": 206553, "epoch": 2488} {"train_loss": -24.619136810302734, "global_step": 206554, "epoch": 2488} {"train_loss": -24.434301376342773, "global_step": 206555, "epoch": 2488} {"train_loss": -24.39992904663086, "global_step": 206556, "epoch": 2488} {"train_loss": -24.110855102539062, "global_step": 206557, "epoch": 2488} {"train_loss": -24.072975158691406, "global_step": 206558, "epoch": 2488} {"train_loss": -24.0274658203125, "global_step": 206559, "epoch": 2488} {"train_loss": -23.77809715270996, "global_step": 206560, "epoch": 2488} {"train_loss": -24.270273208618164, "global_step": 206561, "epoch": 2488} {"train_loss": -24.426406860351562, "global_step": 206562, "epoch": 2488} {"train_loss": -23.999929428100586, "global_step": 206563, "epoch": 2488} {"train_loss": -23.69049644470215, "global_step": 206564, "epoch": 2488} {"train_loss": -24.300695419311523, "global_step": 206565, "epoch": 2488} {"train_loss": -24.239070892333984, "global_step": 206566, "epoch": 2488} {"train_loss": -24.197452545166016, "global_step": 206567, "epoch": 2488} {"train_loss": -24.560880661010742, "global_step": 206568, "epoch": 2488} {"train_loss": -24.242948532104492, "global_step": 206569, "epoch": 2488} {"train_loss": -24.428274154663086, "global_step": 206570, "epoch": 2488} {"train_loss": -24.418914794921875, "global_step": 206571, "epoch": 2488} {"train_loss": -24.521530151367188, "global_step": 206572, "epoch": 2488} {"train_loss": -24.33656883239746, "global_step": 206573, "epoch": 2488} {"train_loss": -24.483943939208984, "global_step": 206574, "epoch": 2488} {"train_loss": -24.440465927124023, "global_step": 206575, "epoch": 2488} {"train_loss": -24.676191329956055, "global_step": 206576, "epoch": 2488} {"train_loss": -24.377920150756836, "global_step": 206577, "epoch": 2488} {"train_loss": -24.21961784362793, "global_step": 206578, "epoch": 2488} {"train_loss": -24.56938934326172, "global_step": 206579, "epoch": 2488} {"train_loss": -24.710391998291016, "global_step": 206580, "epoch": 2488} {"train_loss": -24.2460880279541, "global_step": 206581, "epoch": 2488} {"train_loss": -24.296947479248047, "global_step": 206582, "epoch": 2488} {"train_loss": -24.3615779876709, "global_step": 206583, "epoch": 2488} {"train_loss": -24.120174407958984, "global_step": 206584, "epoch": 2488} {"train_loss": -24.379657745361328, "global_step": 206585, "epoch": 2488} {"train_loss": -24.33553077513913, "global_step": 206586, "epoch": 2488, "val_loss": 6693819.0} {"train_loss": -24.52247428894043, "global_step": 206587, "epoch": 2489} {"train_loss": -23.988269805908203, "global_step": 206588, "epoch": 2489} {"train_loss": -24.424087524414062, "global_step": 206589, "epoch": 2489} {"train_loss": -24.29609489440918, "global_step": 206590, "epoch": 2489} {"train_loss": -24.008359909057617, "global_step": 206591, "epoch": 2489} {"train_loss": -24.01209259033203, "global_step": 206592, "epoch": 2489} {"train_loss": -24.052358627319336, "global_step": 206593, "epoch": 2489} {"train_loss": -24.13069725036621, "global_step": 206594, "epoch": 2489} {"train_loss": -24.075170516967773, "global_step": 206595, "epoch": 2489} {"train_loss": -24.69475746154785, "global_step": 206596, "epoch": 2489} {"train_loss": -24.145551681518555, "global_step": 206597, "epoch": 2489} {"train_loss": -24.687597274780273, "global_step": 206598, "epoch": 2489} {"train_loss": -24.315345764160156, "global_step": 206599, "epoch": 2489} {"train_loss": -23.958276748657227, "global_step": 206600, "epoch": 2489} {"train_loss": -24.26539421081543, "global_step": 206601, "epoch": 2489} {"train_loss": -24.605236053466797, "global_step": 206602, "epoch": 2489} {"train_loss": -24.15273094177246, "global_step": 206603, "epoch": 2489} {"train_loss": -24.125869750976562, "global_step": 206604, "epoch": 2489} {"train_loss": -24.657217025756836, "global_step": 206605, "epoch": 2489} {"train_loss": -24.32643699645996, "global_step": 206606, "epoch": 2489} {"train_loss": -24.258466720581055, "global_step": 206607, "epoch": 2489} {"train_loss": -23.50185203552246, "global_step": 206608, "epoch": 2489} {"train_loss": -23.872867584228516, "global_step": 206609, "epoch": 2489} {"train_loss": -23.917495727539062, "global_step": 206610, "epoch": 2489} {"train_loss": -23.678186416625977, "global_step": 206611, "epoch": 2489} {"train_loss": -24.21510124206543, "global_step": 206612, "epoch": 2489} {"train_loss": -24.207765579223633, "global_step": 206613, "epoch": 2489} {"train_loss": -24.12843132019043, "global_step": 206614, "epoch": 2489} {"train_loss": -24.21118927001953, "global_step": 206615, "epoch": 2489} {"train_loss": -24.625446319580078, "global_step": 206616, "epoch": 2489} {"train_loss": -24.234628677368164, "global_step": 206617, "epoch": 2489} {"train_loss": -24.464460372924805, "global_step": 206618, "epoch": 2489} {"train_loss": -24.28132438659668, "global_step": 206619, "epoch": 2489} {"train_loss": -23.813358306884766, "global_step": 206620, "epoch": 2489} {"train_loss": -24.150516510009766, "global_step": 206621, "epoch": 2489} {"train_loss": -24.733991622924805, "global_step": 206622, "epoch": 2489} {"train_loss": -24.493576049804688, "global_step": 206623, "epoch": 2489} {"train_loss": -24.43890953063965, "global_step": 206624, "epoch": 2489} {"train_loss": -24.281696319580078, "global_step": 206625, "epoch": 2489} {"train_loss": -24.01349449157715, "global_step": 206626, "epoch": 2489} {"train_loss": -24.13758659362793, "global_step": 206627, "epoch": 2489} {"train_loss": -24.548675537109375, "global_step": 206628, "epoch": 2489} {"train_loss": -24.13840103149414, "global_step": 206629, "epoch": 2489} {"train_loss": -24.325437545776367, "global_step": 206630, "epoch": 2489} {"train_loss": -24.097457885742188, "global_step": 206631, "epoch": 2489} {"train_loss": -24.463382720947266, "global_step": 206632, "epoch": 2489} {"train_loss": -24.275537490844727, "global_step": 206633, "epoch": 2489} {"train_loss": -24.260488510131836, "global_step": 206634, "epoch": 2489} {"train_loss": -24.183792114257812, "global_step": 206635, "epoch": 2489} {"train_loss": -24.241422653198242, "global_step": 206636, "epoch": 2489} {"train_loss": -24.132869720458984, "global_step": 206637, "epoch": 2489} {"train_loss": -24.096338272094727, "global_step": 206638, "epoch": 2489} {"train_loss": -24.223114013671875, "global_step": 206639, "epoch": 2489} {"train_loss": -24.65236473083496, "global_step": 206640, "epoch": 2489} {"train_loss": -24.68356704711914, "global_step": 206641, "epoch": 2489} {"train_loss": -24.55571174621582, "global_step": 206642, "epoch": 2489} {"train_loss": -24.630056381225586, "global_step": 206643, "epoch": 2489} {"train_loss": -24.653793334960938, "global_step": 206644, "epoch": 2489} {"train_loss": -24.31646156311035, "global_step": 206645, "epoch": 2489} {"train_loss": -24.279773712158203, "global_step": 206646, "epoch": 2489} {"train_loss": -24.361774444580078, "global_step": 206647, "epoch": 2489} {"train_loss": -24.22464370727539, "global_step": 206648, "epoch": 2489} {"train_loss": -24.184602737426758, "global_step": 206649, "epoch": 2489} {"train_loss": -24.240318298339844, "global_step": 206650, "epoch": 2489} {"train_loss": -24.75291633605957, "global_step": 206651, "epoch": 2489} {"train_loss": -24.420440673828125, "global_step": 206652, "epoch": 2489} {"train_loss": -24.350683212280273, "global_step": 206653, "epoch": 2489} {"train_loss": -24.493989944458008, "global_step": 206654, "epoch": 2489} {"train_loss": -24.443246841430664, "global_step": 206655, "epoch": 2489} {"train_loss": -24.385141372680664, "global_step": 206656, "epoch": 2489} {"train_loss": -24.36622428894043, "global_step": 206657, "epoch": 2489} {"train_loss": -24.362268447875977, "global_step": 206658, "epoch": 2489} {"train_loss": -24.18947410583496, "global_step": 206659, "epoch": 2489} {"train_loss": -24.395523071289062, "global_step": 206660, "epoch": 2489} {"train_loss": -24.369781494140625, "global_step": 206661, "epoch": 2489} {"train_loss": -24.139616012573242, "global_step": 206662, "epoch": 2489} {"train_loss": -24.121061325073242, "global_step": 206663, "epoch": 2489} {"train_loss": -23.606605529785156, "global_step": 206664, "epoch": 2489} {"train_loss": -24.013639450073242, "global_step": 206665, "epoch": 2489} {"train_loss": -24.375459671020508, "global_step": 206666, "epoch": 2489} {"train_loss": -23.83772087097168, "global_step": 206667, "epoch": 2489} {"train_loss": -23.74151611328125, "global_step": 206668, "epoch": 2489} {"train_loss": -24.259971802493176, "global_step": 206669, "epoch": 2489, "val_loss": 6535893.5} {"train_loss": -23.51839256286621, "global_step": 206670, "epoch": 2490} {"train_loss": -23.337841033935547, "global_step": 206671, "epoch": 2490} {"train_loss": -23.841947555541992, "global_step": 206672, "epoch": 2490} {"train_loss": -23.373184204101562, "global_step": 206673, "epoch": 2490} {"train_loss": -23.661603927612305, "global_step": 206674, "epoch": 2490} {"train_loss": -23.513620376586914, "global_step": 206675, "epoch": 2490} {"train_loss": -23.911169052124023, "global_step": 206676, "epoch": 2490} {"train_loss": -23.89154052734375, "global_step": 206677, "epoch": 2490} {"train_loss": -23.55378532409668, "global_step": 206678, "epoch": 2490} {"train_loss": -23.695459365844727, "global_step": 206679, "epoch": 2490} {"train_loss": -23.86210823059082, "global_step": 206680, "epoch": 2490} {"train_loss": -24.217695236206055, "global_step": 206681, "epoch": 2490} {"train_loss": -23.999361038208008, "global_step": 206682, "epoch": 2490} {"train_loss": -23.86797332763672, "global_step": 206683, "epoch": 2490} {"train_loss": -23.9888916015625, "global_step": 206684, "epoch": 2490} {"train_loss": -24.32321548461914, "global_step": 206685, "epoch": 2490} {"train_loss": -24.30246353149414, "global_step": 206686, "epoch": 2490} {"train_loss": -24.319862365722656, "global_step": 206687, "epoch": 2490} {"train_loss": -24.171737670898438, "global_step": 206688, "epoch": 2490} {"train_loss": -24.06331443786621, "global_step": 206689, "epoch": 2490} {"train_loss": -24.08807373046875, "global_step": 206690, "epoch": 2490} {"train_loss": -23.992050170898438, "global_step": 206691, "epoch": 2490} {"train_loss": -24.222082138061523, "global_step": 206692, "epoch": 2490} {"train_loss": -24.515945434570312, "global_step": 206693, "epoch": 2490} {"train_loss": -24.340295791625977, "global_step": 206694, "epoch": 2490} {"train_loss": -24.26148796081543, "global_step": 206695, "epoch": 2490} {"train_loss": -24.09473991394043, "global_step": 206696, "epoch": 2490} {"train_loss": -24.462360382080078, "global_step": 206697, "epoch": 2490} {"train_loss": -24.49122428894043, "global_step": 206698, "epoch": 2490} {"train_loss": -24.632471084594727, "global_step": 206699, "epoch": 2490} {"train_loss": -24.273962020874023, "global_step": 206700, "epoch": 2490} {"train_loss": -24.441421508789062, "global_step": 206701, "epoch": 2490} {"train_loss": -24.285425186157227, "global_step": 206702, "epoch": 2490} {"train_loss": -24.213369369506836, "global_step": 206703, "epoch": 2490} {"train_loss": -24.625, "global_step": 206704, "epoch": 2490} {"train_loss": -24.301101684570312, "global_step": 206705, "epoch": 2490} {"train_loss": -24.62525749206543, "global_step": 206706, "epoch": 2490} {"train_loss": -24.418075561523438, "global_step": 206707, "epoch": 2490} {"train_loss": -24.651708602905273, "global_step": 206708, "epoch": 2490} {"train_loss": -24.410852432250977, "global_step": 206709, "epoch": 2490} {"train_loss": -24.801246643066406, "global_step": 206710, "epoch": 2490} {"train_loss": -24.492170333862305, "global_step": 206711, "epoch": 2490} {"train_loss": -24.180891036987305, "global_step": 206712, "epoch": 2490} {"train_loss": -24.452566146850586, "global_step": 206713, "epoch": 2490} {"train_loss": -25.019805908203125, "global_step": 206714, "epoch": 2490} {"train_loss": -24.006698608398438, "global_step": 206715, "epoch": 2490} {"train_loss": -24.313343048095703, "global_step": 206716, "epoch": 2490} {"train_loss": -24.267658233642578, "global_step": 206717, "epoch": 2490} {"train_loss": -23.98148536682129, "global_step": 206718, "epoch": 2490} {"train_loss": -24.179887771606445, "global_step": 206719, "epoch": 2490} {"train_loss": -24.45564842224121, "global_step": 206720, "epoch": 2490} {"train_loss": -24.161813735961914, "global_step": 206721, "epoch": 2490} {"train_loss": -23.979856491088867, "global_step": 206722, "epoch": 2490} {"train_loss": -24.435850143432617, "global_step": 206723, "epoch": 2490} {"train_loss": -23.940183639526367, "global_step": 206724, "epoch": 2490} {"train_loss": -24.411436080932617, "global_step": 206725, "epoch": 2490} {"train_loss": -24.20721435546875, "global_step": 206726, "epoch": 2490} {"train_loss": -24.255367279052734, "global_step": 206727, "epoch": 2490} {"train_loss": -23.94202995300293, "global_step": 206728, "epoch": 2490} {"train_loss": -24.145675659179688, "global_step": 206729, "epoch": 2490} {"train_loss": -24.553457260131836, "global_step": 206730, "epoch": 2490} {"train_loss": -24.282445907592773, "global_step": 206731, "epoch": 2490} {"train_loss": -24.233671188354492, "global_step": 206732, "epoch": 2490} {"train_loss": -23.98213768005371, "global_step": 206733, "epoch": 2490} {"train_loss": -24.617895126342773, "global_step": 206734, "epoch": 2490} {"train_loss": -24.35796546936035, "global_step": 206735, "epoch": 2490} {"train_loss": -24.48443031311035, "global_step": 206736, "epoch": 2490} {"train_loss": -24.65831756591797, "global_step": 206737, "epoch": 2490} {"train_loss": -24.116912841796875, "global_step": 206738, "epoch": 2490} {"train_loss": -24.83499526977539, "global_step": 206739, "epoch": 2490} {"train_loss": -24.2696533203125, "global_step": 206740, "epoch": 2490} {"train_loss": -24.30449867248535, "global_step": 206741, "epoch": 2490} {"train_loss": -24.564786911010742, "global_step": 206742, "epoch": 2490} {"train_loss": -24.28447151184082, "global_step": 206743, "epoch": 2490} {"train_loss": -24.284589767456055, "global_step": 206744, "epoch": 2490} {"train_loss": -24.41623878479004, "global_step": 206745, "epoch": 2490} {"train_loss": -24.61669921875, "global_step": 206746, "epoch": 2490} {"train_loss": -24.592519760131836, "global_step": 206747, "epoch": 2490} {"train_loss": -24.51042366027832, "global_step": 206748, "epoch": 2490} {"train_loss": -24.22898292541504, "global_step": 206749, "epoch": 2490} {"train_loss": -24.710744857788086, "global_step": 206750, "epoch": 2490} {"train_loss": -24.85550308227539, "global_step": 206751, "epoch": 2490} {"train_loss": -24.24615025807576, "global_step": 206752, "epoch": 2490, "val_loss": 6739108.5} {"train_loss": -23.218645095825195, "global_step": 206753, "epoch": 2491} {"train_loss": -24.328594207763672, "global_step": 206754, "epoch": 2491} {"train_loss": -23.924463272094727, "global_step": 206755, "epoch": 2491} {"train_loss": -24.011865615844727, "global_step": 206756, "epoch": 2491} {"train_loss": -24.216169357299805, "global_step": 206757, "epoch": 2491} {"train_loss": -24.003217697143555, "global_step": 206758, "epoch": 2491} {"train_loss": -23.796300888061523, "global_step": 206759, "epoch": 2491} {"train_loss": -24.03273582458496, "global_step": 206760, "epoch": 2491} {"train_loss": -24.48126792907715, "global_step": 206761, "epoch": 2491} {"train_loss": -24.0874080657959, "global_step": 206762, "epoch": 2491} {"train_loss": -23.96562385559082, "global_step": 206763, "epoch": 2491} {"train_loss": -24.075162887573242, "global_step": 206764, "epoch": 2491} {"train_loss": -23.953542709350586, "global_step": 206765, "epoch": 2491} {"train_loss": -24.017744064331055, "global_step": 206766, "epoch": 2491} {"train_loss": -24.109689712524414, "global_step": 206767, "epoch": 2491} {"train_loss": -24.0849609375, "global_step": 206768, "epoch": 2491} {"train_loss": -24.146398544311523, "global_step": 206769, "epoch": 2491} {"train_loss": -24.09153175354004, "global_step": 206770, "epoch": 2491} {"train_loss": -24.366779327392578, "global_step": 206771, "epoch": 2491} {"train_loss": -24.2735652923584, "global_step": 206772, "epoch": 2491} {"train_loss": -24.496877670288086, "global_step": 206773, "epoch": 2491} {"train_loss": -24.475072860717773, "global_step": 206774, "epoch": 2491} {"train_loss": -24.39594841003418, "global_step": 206775, "epoch": 2491} {"train_loss": -24.0562801361084, "global_step": 206776, "epoch": 2491} {"train_loss": -24.685758590698242, "global_step": 206777, "epoch": 2491} {"train_loss": -24.32105255126953, "global_step": 206778, "epoch": 2491} {"train_loss": -24.146793365478516, "global_step": 206779, "epoch": 2491} {"train_loss": -24.4812068939209, "global_step": 206780, "epoch": 2491} {"train_loss": -24.66560173034668, "global_step": 206781, "epoch": 2491} {"train_loss": -24.45186424255371, "global_step": 206782, "epoch": 2491} {"train_loss": -24.28790283203125, "global_step": 206783, "epoch": 2491} {"train_loss": -24.71187400817871, "global_step": 206784, "epoch": 2491} {"train_loss": -24.709505081176758, "global_step": 206785, "epoch": 2491} {"train_loss": -24.30105209350586, "global_step": 206786, "epoch": 2491} {"train_loss": -24.31943130493164, "global_step": 206787, "epoch": 2491} {"train_loss": -24.42662239074707, "global_step": 206788, "epoch": 2491} {"train_loss": -24.498151779174805, "global_step": 206789, "epoch": 2491} {"train_loss": -24.861202239990234, "global_step": 206790, "epoch": 2491} {"train_loss": -24.52235984802246, "global_step": 206791, "epoch": 2491} {"train_loss": -24.369794845581055, "global_step": 206792, "epoch": 2491} {"train_loss": -24.35158348083496, "global_step": 206793, "epoch": 2491} {"train_loss": -24.2014102935791, "global_step": 206794, "epoch": 2491} {"train_loss": -24.74070167541504, "global_step": 206795, "epoch": 2491} {"train_loss": -24.328214645385742, "global_step": 206796, "epoch": 2491} {"train_loss": -24.409040451049805, "global_step": 206797, "epoch": 2491} {"train_loss": -24.350692749023438, "global_step": 206798, "epoch": 2491} {"train_loss": -24.364547729492188, "global_step": 206799, "epoch": 2491} {"train_loss": -24.536169052124023, "global_step": 206800, "epoch": 2491} {"train_loss": -24.50507164001465, "global_step": 206801, "epoch": 2491} {"train_loss": -24.411352157592773, "global_step": 206802, "epoch": 2491} {"train_loss": -24.269685745239258, "global_step": 206803, "epoch": 2491} {"train_loss": -24.53355598449707, "global_step": 206804, "epoch": 2491} {"train_loss": -24.57950210571289, "global_step": 206805, "epoch": 2491} {"train_loss": -24.70358657836914, "global_step": 206806, "epoch": 2491} {"train_loss": -24.246992111206055, "global_step": 206807, "epoch": 2491} {"train_loss": -24.50690269470215, "global_step": 206808, "epoch": 2491} {"train_loss": -24.258859634399414, "global_step": 206809, "epoch": 2491} {"train_loss": -24.377756118774414, "global_step": 206810, "epoch": 2491} {"train_loss": -24.239389419555664, "global_step": 206811, "epoch": 2491} {"train_loss": -24.187978744506836, "global_step": 206812, "epoch": 2491} {"train_loss": -24.29034996032715, "global_step": 206813, "epoch": 2491} {"train_loss": -24.442773818969727, "global_step": 206814, "epoch": 2491} {"train_loss": -24.36564826965332, "global_step": 206815, "epoch": 2491} {"train_loss": -24.73744010925293, "global_step": 206816, "epoch": 2491} {"train_loss": -24.48579978942871, "global_step": 206817, "epoch": 2491} {"train_loss": -25.158292770385742, "global_step": 206818, "epoch": 2491} {"train_loss": -24.282957077026367, "global_step": 206819, "epoch": 2491} {"train_loss": -24.396564483642578, "global_step": 206820, "epoch": 2491} {"train_loss": -24.467025756835938, "global_step": 206821, "epoch": 2491} {"train_loss": -24.270158767700195, "global_step": 206822, "epoch": 2491} {"train_loss": -23.82501792907715, "global_step": 206823, "epoch": 2491} {"train_loss": -24.499385833740234, "global_step": 206824, "epoch": 2491} {"train_loss": -24.405887603759766, "global_step": 206825, "epoch": 2491} {"train_loss": -24.542980194091797, "global_step": 206826, "epoch": 2491} {"train_loss": -24.665250778198242, "global_step": 206827, "epoch": 2491} {"train_loss": -24.550039291381836, "global_step": 206828, "epoch": 2491} {"train_loss": -24.578054428100586, "global_step": 206829, "epoch": 2491} {"train_loss": -24.306934356689453, "global_step": 206830, "epoch": 2491} {"train_loss": -24.344905853271484, "global_step": 206831, "epoch": 2491} {"train_loss": -24.133365631103516, "global_step": 206832, "epoch": 2491} {"train_loss": -24.658470153808594, "global_step": 206833, "epoch": 2491} {"train_loss": -24.55727195739746, "global_step": 206834, "epoch": 2491} {"train_loss": -24.36615987570889, "global_step": 206835, "epoch": 2491, "val_loss": 6611392.0} {"train_loss": -24.2112979888916, "global_step": 206836, "epoch": 2492} {"train_loss": -23.99416732788086, "global_step": 206837, "epoch": 2492} {"train_loss": -23.8857364654541, "global_step": 206838, "epoch": 2492} {"train_loss": -24.10529899597168, "global_step": 206839, "epoch": 2492} {"train_loss": -23.9171085357666, "global_step": 206840, "epoch": 2492} {"train_loss": -24.068923950195312, "global_step": 206841, "epoch": 2492} {"train_loss": -24.30744743347168, "global_step": 206842, "epoch": 2492} {"train_loss": -24.536317825317383, "global_step": 206843, "epoch": 2492} {"train_loss": -24.121139526367188, "global_step": 206844, "epoch": 2492} {"train_loss": -24.083816528320312, "global_step": 206845, "epoch": 2492} {"train_loss": -24.13022232055664, "global_step": 206846, "epoch": 2492} {"train_loss": -24.544876098632812, "global_step": 206847, "epoch": 2492} {"train_loss": -24.274890899658203, "global_step": 206848, "epoch": 2492} {"train_loss": -24.283742904663086, "global_step": 206849, "epoch": 2492} {"train_loss": -24.247081756591797, "global_step": 206850, "epoch": 2492} {"train_loss": -24.28026580810547, "global_step": 206851, "epoch": 2492} {"train_loss": -24.426319122314453, "global_step": 206852, "epoch": 2492} {"train_loss": -23.90386199951172, "global_step": 206853, "epoch": 2492} {"train_loss": -24.311317443847656, "global_step": 206854, "epoch": 2492} {"train_loss": -24.517423629760742, "global_step": 206855, "epoch": 2492} {"train_loss": -24.371519088745117, "global_step": 206856, "epoch": 2492} {"train_loss": -24.395498275756836, "global_step": 206857, "epoch": 2492} {"train_loss": -24.535064697265625, "global_step": 206858, "epoch": 2492} {"train_loss": -24.461166381835938, "global_step": 206859, "epoch": 2492} {"train_loss": -24.584095001220703, "global_step": 206860, "epoch": 2492} {"train_loss": -24.8111572265625, "global_step": 206861, "epoch": 2492} {"train_loss": -24.423269271850586, "global_step": 206862, "epoch": 2492} {"train_loss": -24.04719352722168, "global_step": 206863, "epoch": 2492} {"train_loss": -24.66444969177246, "global_step": 206864, "epoch": 2492} {"train_loss": -24.707778930664062, "global_step": 206865, "epoch": 2492} {"train_loss": -24.63257598876953, "global_step": 206866, "epoch": 2492} {"train_loss": -24.354358673095703, "global_step": 206867, "epoch": 2492} {"train_loss": -24.47855567932129, "global_step": 206868, "epoch": 2492} {"train_loss": -24.461368560791016, "global_step": 206869, "epoch": 2492} {"train_loss": -24.38339614868164, "global_step": 206870, "epoch": 2492} {"train_loss": -24.10222053527832, "global_step": 206871, "epoch": 2492} {"train_loss": -24.601106643676758, "global_step": 206872, "epoch": 2492} {"train_loss": -24.5665340423584, "global_step": 206873, "epoch": 2492} {"train_loss": -24.21017074584961, "global_step": 206874, "epoch": 2492} {"train_loss": -24.167133331298828, "global_step": 206875, "epoch": 2492} {"train_loss": -24.5335750579834, "global_step": 206876, "epoch": 2492} {"train_loss": -24.705350875854492, "global_step": 206877, "epoch": 2492} {"train_loss": -23.897497177124023, "global_step": 206878, "epoch": 2492} {"train_loss": -24.42795181274414, "global_step": 206879, "epoch": 2492} {"train_loss": -24.661556243896484, "global_step": 206880, "epoch": 2492} {"train_loss": -24.176071166992188, "global_step": 206881, "epoch": 2492} {"train_loss": -24.424062728881836, "global_step": 206882, "epoch": 2492} {"train_loss": -23.863574981689453, "global_step": 206883, "epoch": 2492} {"train_loss": -24.50870132446289, "global_step": 206884, "epoch": 2492} {"train_loss": -23.959692001342773, "global_step": 206885, "epoch": 2492} {"train_loss": -24.201501846313477, "global_step": 206886, "epoch": 2492} {"train_loss": -23.867551803588867, "global_step": 206887, "epoch": 2492} {"train_loss": -24.434768676757812, "global_step": 206888, "epoch": 2492} {"train_loss": -24.770605087280273, "global_step": 206889, "epoch": 2492} {"train_loss": -24.140756607055664, "global_step": 206890, "epoch": 2492} {"train_loss": -23.999542236328125, "global_step": 206891, "epoch": 2492} {"train_loss": -24.52213478088379, "global_step": 206892, "epoch": 2492} {"train_loss": -24.008472442626953, "global_step": 206893, "epoch": 2492} {"train_loss": -23.964879989624023, "global_step": 206894, "epoch": 2492} {"train_loss": -24.3538875579834, "global_step": 206895, "epoch": 2492} {"train_loss": -24.2430477142334, "global_step": 206896, "epoch": 2492} {"train_loss": -23.983760833740234, "global_step": 206897, "epoch": 2492} {"train_loss": -24.141338348388672, "global_step": 206898, "epoch": 2492} {"train_loss": -24.482070922851562, "global_step": 206899, "epoch": 2492} {"train_loss": -24.37111473083496, "global_step": 206900, "epoch": 2492} {"train_loss": -24.10246467590332, "global_step": 206901, "epoch": 2492} {"train_loss": -24.250225067138672, "global_step": 206902, "epoch": 2492} {"train_loss": -24.232852935791016, "global_step": 206903, "epoch": 2492} {"train_loss": -24.202951431274414, "global_step": 206904, "epoch": 2492} {"train_loss": -24.3077392578125, "global_step": 206905, "epoch": 2492} {"train_loss": -24.18977165222168, "global_step": 206906, "epoch": 2492} {"train_loss": -24.415916442871094, "global_step": 206907, "epoch": 2492} {"train_loss": -24.546010971069336, "global_step": 206908, "epoch": 2492} {"train_loss": -24.4161434173584, "global_step": 206909, "epoch": 2492} {"train_loss": -24.847522735595703, "global_step": 206910, "epoch": 2492} {"train_loss": -24.408666610717773, "global_step": 206911, "epoch": 2492} {"train_loss": -24.342849731445312, "global_step": 206912, "epoch": 2492} {"train_loss": -24.655494689941406, "global_step": 206913, "epoch": 2492} {"train_loss": -24.48944664001465, "global_step": 206914, "epoch": 2492} {"train_loss": -24.635648727416992, "global_step": 206915, "epoch": 2492} {"train_loss": -24.452621459960938, "global_step": 206916, "epoch": 2492} {"train_loss": -24.46211051940918, "global_step": 206917, "epoch": 2492} {"train_loss": -24.318367349096093, "global_step": 206918, "epoch": 2492, "val_loss": 6710538.5} {"train_loss": -24.285802841186523, "global_step": 206919, "epoch": 2493} {"train_loss": -24.363813400268555, "global_step": 206920, "epoch": 2493} {"train_loss": -24.3731689453125, "global_step": 206921, "epoch": 2493} {"train_loss": -24.42209815979004, "global_step": 206922, "epoch": 2493} {"train_loss": -24.410551071166992, "global_step": 206923, "epoch": 2493} {"train_loss": -24.336618423461914, "global_step": 206924, "epoch": 2493} {"train_loss": -24.453231811523438, "global_step": 206925, "epoch": 2493} {"train_loss": -24.243417739868164, "global_step": 206926, "epoch": 2493} {"train_loss": -24.190393447875977, "global_step": 206927, "epoch": 2493} {"train_loss": -24.410429000854492, "global_step": 206928, "epoch": 2493} {"train_loss": -24.00343132019043, "global_step": 206929, "epoch": 2493} {"train_loss": -24.112239837646484, "global_step": 206930, "epoch": 2493} {"train_loss": -24.428442001342773, "global_step": 206931, "epoch": 2493} {"train_loss": -24.091712951660156, "global_step": 206932, "epoch": 2493} {"train_loss": -24.24051856994629, "global_step": 206933, "epoch": 2493} {"train_loss": -24.87220573425293, "global_step": 206934, "epoch": 2493} {"train_loss": -24.23024559020996, "global_step": 206935, "epoch": 2493} {"train_loss": -23.917741775512695, "global_step": 206936, "epoch": 2493} {"train_loss": -24.200443267822266, "global_step": 206937, "epoch": 2493} {"train_loss": -24.069324493408203, "global_step": 206938, "epoch": 2493} {"train_loss": -24.470748901367188, "global_step": 206939, "epoch": 2493} {"train_loss": -24.104867935180664, "global_step": 206940, "epoch": 2493} {"train_loss": -24.229684829711914, "global_step": 206941, "epoch": 2493} {"train_loss": -24.248275756835938, "global_step": 206942, "epoch": 2493} {"train_loss": -23.994728088378906, "global_step": 206943, "epoch": 2493} {"train_loss": -24.29497528076172, "global_step": 206944, "epoch": 2493} {"train_loss": -23.693572998046875, "global_step": 206945, "epoch": 2493} {"train_loss": -24.48274040222168, "global_step": 206946, "epoch": 2493} {"train_loss": -24.101381301879883, "global_step": 206947, "epoch": 2493} {"train_loss": -24.4373836517334, "global_step": 206948, "epoch": 2493} {"train_loss": -23.663419723510742, "global_step": 206949, "epoch": 2493} {"train_loss": -24.010679244995117, "global_step": 206950, "epoch": 2493} {"train_loss": -24.317808151245117, "global_step": 206951, "epoch": 2493} {"train_loss": -24.323850631713867, "global_step": 206952, "epoch": 2493} {"train_loss": -24.16900062561035, "global_step": 206953, "epoch": 2493} {"train_loss": -24.170948028564453, "global_step": 206954, "epoch": 2493} {"train_loss": -24.192584991455078, "global_step": 206955, "epoch": 2493} {"train_loss": -24.250045776367188, "global_step": 206956, "epoch": 2493} {"train_loss": -24.217809677124023, "global_step": 206957, "epoch": 2493} {"train_loss": -24.55945587158203, "global_step": 206958, "epoch": 2493} {"train_loss": -24.252729415893555, "global_step": 206959, "epoch": 2493} {"train_loss": -23.749353408813477, "global_step": 206960, "epoch": 2493} {"train_loss": -24.335195541381836, "global_step": 206961, "epoch": 2493} {"train_loss": -24.291662216186523, "global_step": 206962, "epoch": 2493} {"train_loss": -24.423309326171875, "global_step": 206963, "epoch": 2493} {"train_loss": -24.655319213867188, "global_step": 206964, "epoch": 2493} {"train_loss": -24.401216506958008, "global_step": 206965, "epoch": 2493} {"train_loss": -24.191843032836914, "global_step": 206966, "epoch": 2493} {"train_loss": -24.57317543029785, "global_step": 206967, "epoch": 2493} {"train_loss": -24.019927978515625, "global_step": 206968, "epoch": 2493} {"train_loss": -24.27071762084961, "global_step": 206969, "epoch": 2493} {"train_loss": -24.270811080932617, "global_step": 206970, "epoch": 2493} {"train_loss": -24.441265106201172, "global_step": 206971, "epoch": 2493} {"train_loss": -24.283376693725586, "global_step": 206972, "epoch": 2493} {"train_loss": -24.371435165405273, "global_step": 206973, "epoch": 2493} {"train_loss": -24.50868797302246, "global_step": 206974, "epoch": 2493} {"train_loss": -24.669279098510742, "global_step": 206975, "epoch": 2493} {"train_loss": -24.351627349853516, "global_step": 206976, "epoch": 2493} {"train_loss": -24.552566528320312, "global_step": 206977, "epoch": 2493} {"train_loss": -24.226682662963867, "global_step": 206978, "epoch": 2493} {"train_loss": -24.34812355041504, "global_step": 206979, "epoch": 2493} {"train_loss": -24.598421096801758, "global_step": 206980, "epoch": 2493} {"train_loss": -24.649295806884766, "global_step": 206981, "epoch": 2493} {"train_loss": -24.403234481811523, "global_step": 206982, "epoch": 2493} {"train_loss": -24.622251510620117, "global_step": 206983, "epoch": 2493} {"train_loss": -24.369125366210938, "global_step": 206984, "epoch": 2493} {"train_loss": -24.3780574798584, "global_step": 206985, "epoch": 2493} {"train_loss": -24.515836715698242, "global_step": 206986, "epoch": 2493} {"train_loss": -24.67805290222168, "global_step": 206987, "epoch": 2493} {"train_loss": -24.376604080200195, "global_step": 206988, "epoch": 2493} {"train_loss": -24.451784133911133, "global_step": 206989, "epoch": 2493} {"train_loss": -24.409446716308594, "global_step": 206990, "epoch": 2493} {"train_loss": -24.516586303710938, "global_step": 206991, "epoch": 2493} {"train_loss": -24.841588973999023, "global_step": 206992, "epoch": 2493} {"train_loss": -24.356822967529297, "global_step": 206993, "epoch": 2493} {"train_loss": -25.033926010131836, "global_step": 206994, "epoch": 2493} {"train_loss": -24.30601692199707, "global_step": 206995, "epoch": 2493} {"train_loss": -24.611101150512695, "global_step": 206996, "epoch": 2493} {"train_loss": -24.391551971435547, "global_step": 206997, "epoch": 2493} {"train_loss": -24.47297477722168, "global_step": 206998, "epoch": 2493} {"train_loss": -24.28995704650879, "global_step": 206999, "epoch": 2493} {"train_loss": -24.30398941040039, "global_step": 207000, "epoch": 2493} {"train_loss": -24.32776349998382, "global_step": 207001, "epoch": 2493, "val_loss": 6657443.0} {"train_loss": -23.5385684967041, "global_step": 207002, "epoch": 2494} {"train_loss": -23.618741989135742, "global_step": 207003, "epoch": 2494} {"train_loss": -23.880970001220703, "global_step": 207004, "epoch": 2494} {"train_loss": -23.830463409423828, "global_step": 207005, "epoch": 2494} {"train_loss": -23.85025978088379, "global_step": 207006, "epoch": 2494} {"train_loss": -24.048812866210938, "global_step": 207007, "epoch": 2494} {"train_loss": -23.760360717773438, "global_step": 207008, "epoch": 2494} {"train_loss": -24.21435546875, "global_step": 207009, "epoch": 2494} {"train_loss": -24.0584659576416, "global_step": 207010, "epoch": 2494} {"train_loss": -23.8763484954834, "global_step": 207011, "epoch": 2494} {"train_loss": -24.72187614440918, "global_step": 207012, "epoch": 2494} {"train_loss": -24.104291915893555, "global_step": 207013, "epoch": 2494} {"train_loss": -24.388986587524414, "global_step": 207014, "epoch": 2494} {"train_loss": -23.958742141723633, "global_step": 207015, "epoch": 2494} {"train_loss": -24.1040096282959, "global_step": 207016, "epoch": 2494} {"train_loss": -24.13163185119629, "global_step": 207017, "epoch": 2494} {"train_loss": -23.909404754638672, "global_step": 207018, "epoch": 2494} {"train_loss": -23.967649459838867, "global_step": 207019, "epoch": 2494} {"train_loss": -23.839170455932617, "global_step": 207020, "epoch": 2494} {"train_loss": -23.707468032836914, "global_step": 207021, "epoch": 2494} {"train_loss": -24.25620460510254, "global_step": 207022, "epoch": 2494} {"train_loss": -24.367847442626953, "global_step": 207023, "epoch": 2494} {"train_loss": -24.291318893432617, "global_step": 207024, "epoch": 2494} {"train_loss": -24.01106834411621, "global_step": 207025, "epoch": 2494} {"train_loss": -24.68891716003418, "global_step": 207026, "epoch": 2494} {"train_loss": -24.2474308013916, "global_step": 207027, "epoch": 2494} {"train_loss": -23.937267303466797, "global_step": 207028, "epoch": 2494} {"train_loss": -24.4987850189209, "global_step": 207029, "epoch": 2494} {"train_loss": -24.214338302612305, "global_step": 207030, "epoch": 2494} {"train_loss": -24.252716064453125, "global_step": 207031, "epoch": 2494} {"train_loss": -24.58930778503418, "global_step": 207032, "epoch": 2494} {"train_loss": -24.678377151489258, "global_step": 207033, "epoch": 2494} {"train_loss": -24.34646987915039, "global_step": 207034, "epoch": 2494} {"train_loss": -24.573963165283203, "global_step": 207035, "epoch": 2494} {"train_loss": -24.1840877532959, "global_step": 207036, "epoch": 2494} {"train_loss": -24.361835479736328, "global_step": 207037, "epoch": 2494} {"train_loss": -24.40504264831543, "global_step": 207038, "epoch": 2494} {"train_loss": -24.416656494140625, "global_step": 207039, "epoch": 2494} {"train_loss": -24.37640953063965, "global_step": 207040, "epoch": 2494} {"train_loss": -24.39888572692871, "global_step": 207041, "epoch": 2494} {"train_loss": -24.41533088684082, "global_step": 207042, "epoch": 2494} {"train_loss": -24.534822463989258, "global_step": 207043, "epoch": 2494} {"train_loss": -24.408079147338867, "global_step": 207044, "epoch": 2494} {"train_loss": -24.628644943237305, "global_step": 207045, "epoch": 2494} {"train_loss": -24.46918296813965, "global_step": 207046, "epoch": 2494} {"train_loss": -24.40693473815918, "global_step": 207047, "epoch": 2494} {"train_loss": -23.973148345947266, "global_step": 207048, "epoch": 2494} {"train_loss": -24.156017303466797, "global_step": 207049, "epoch": 2494} {"train_loss": -24.422504425048828, "global_step": 207050, "epoch": 2494} {"train_loss": -24.317121505737305, "global_step": 207051, "epoch": 2494} {"train_loss": -24.512584686279297, "global_step": 207052, "epoch": 2494} {"train_loss": -24.425817489624023, "global_step": 207053, "epoch": 2494} {"train_loss": -24.686750411987305, "global_step": 207054, "epoch": 2494} {"train_loss": -24.508451461791992, "global_step": 207055, "epoch": 2494} {"train_loss": -24.33779525756836, "global_step": 207056, "epoch": 2494} {"train_loss": -24.48044776916504, "global_step": 207057, "epoch": 2494} {"train_loss": -24.493301391601562, "global_step": 207058, "epoch": 2494} {"train_loss": -23.850576400756836, "global_step": 207059, "epoch": 2494} {"train_loss": -24.906278610229492, "global_step": 207060, "epoch": 2494} {"train_loss": -24.296052932739258, "global_step": 207061, "epoch": 2494} {"train_loss": -24.09834861755371, "global_step": 207062, "epoch": 2494} {"train_loss": -24.245166778564453, "global_step": 207063, "epoch": 2494} {"train_loss": -24.42976188659668, "global_step": 207064, "epoch": 2494} {"train_loss": -24.216720581054688, "global_step": 207065, "epoch": 2494} {"train_loss": -24.1929874420166, "global_step": 207066, "epoch": 2494} {"train_loss": -24.180709838867188, "global_step": 207067, "epoch": 2494} {"train_loss": -24.48456382751465, "global_step": 207068, "epoch": 2494} {"train_loss": -24.33327293395996, "global_step": 207069, "epoch": 2494} {"train_loss": -24.561843872070312, "global_step": 207070, "epoch": 2494} {"train_loss": -24.546541213989258, "global_step": 207071, "epoch": 2494} {"train_loss": -24.375783920288086, "global_step": 207072, "epoch": 2494} {"train_loss": -24.382831573486328, "global_step": 207073, "epoch": 2494} {"train_loss": -24.32277488708496, "global_step": 207074, "epoch": 2494} {"train_loss": -24.458084106445312, "global_step": 207075, "epoch": 2494} {"train_loss": -24.63545799255371, "global_step": 207076, "epoch": 2494} {"train_loss": -24.47993278503418, "global_step": 207077, "epoch": 2494} {"train_loss": -24.217872619628906, "global_step": 207078, "epoch": 2494} {"train_loss": -24.41282081604004, "global_step": 207079, "epoch": 2494} {"train_loss": -24.624744415283203, "global_step": 207080, "epoch": 2494} {"train_loss": -24.414878845214844, "global_step": 207081, "epoch": 2494} {"train_loss": -24.58692741394043, "global_step": 207082, "epoch": 2494} {"train_loss": -24.55573081970215, "global_step": 207083, "epoch": 2494} {"train_loss": -24.29549996249647, "global_step": 207084, "epoch": 2494, "val_loss": 6633544.5} {"train_loss": -23.58257293701172, "global_step": 207085, "epoch": 2495} {"train_loss": -24.02983856201172, "global_step": 207086, "epoch": 2495} {"train_loss": -23.735898971557617, "global_step": 207087, "epoch": 2495} {"train_loss": -24.182764053344727, "global_step": 207088, "epoch": 2495} {"train_loss": -24.26228141784668, "global_step": 207089, "epoch": 2495} {"train_loss": -24.10002899169922, "global_step": 207090, "epoch": 2495} {"train_loss": -23.806547164916992, "global_step": 207091, "epoch": 2495} {"train_loss": -24.13138198852539, "global_step": 207092, "epoch": 2495} {"train_loss": -24.13384246826172, "global_step": 207093, "epoch": 2495} {"train_loss": -24.23729705810547, "global_step": 207094, "epoch": 2495} {"train_loss": -24.14855194091797, "global_step": 207095, "epoch": 2495} {"train_loss": -24.16286277770996, "global_step": 207096, "epoch": 2495} {"train_loss": -23.97499656677246, "global_step": 207097, "epoch": 2495} {"train_loss": -24.04625701904297, "global_step": 207098, "epoch": 2495} {"train_loss": -24.207626342773438, "global_step": 207099, "epoch": 2495} {"train_loss": -24.155593872070312, "global_step": 207100, "epoch": 2495} {"train_loss": -24.409786224365234, "global_step": 207101, "epoch": 2495} {"train_loss": -23.83966636657715, "global_step": 207102, "epoch": 2495} {"train_loss": -24.23512077331543, "global_step": 207103, "epoch": 2495} {"train_loss": -24.42595672607422, "global_step": 207104, "epoch": 2495} {"train_loss": -24.32487678527832, "global_step": 207105, "epoch": 2495} {"train_loss": -24.429784774780273, "global_step": 207106, "epoch": 2495} {"train_loss": -24.185436248779297, "global_step": 207107, "epoch": 2495} {"train_loss": -24.073400497436523, "global_step": 207108, "epoch": 2495} {"train_loss": -23.976224899291992, "global_step": 207109, "epoch": 2495} {"train_loss": -24.557952880859375, "global_step": 207110, "epoch": 2495} {"train_loss": -24.465116500854492, "global_step": 207111, "epoch": 2495} {"train_loss": -24.14339256286621, "global_step": 207112, "epoch": 2495} {"train_loss": -24.006013870239258, "global_step": 207113, "epoch": 2495} {"train_loss": -24.23206901550293, "global_step": 207114, "epoch": 2495} {"train_loss": -24.11130142211914, "global_step": 207115, "epoch": 2495} {"train_loss": -24.16331672668457, "global_step": 207116, "epoch": 2495} {"train_loss": -24.284975051879883, "global_step": 207117, "epoch": 2495} {"train_loss": -24.300214767456055, "global_step": 207118, "epoch": 2495} {"train_loss": -24.70884132385254, "global_step": 207119, "epoch": 2495} {"train_loss": -24.118457794189453, "global_step": 207120, "epoch": 2495} {"train_loss": -24.45295524597168, "global_step": 207121, "epoch": 2495} {"train_loss": -24.441598892211914, "global_step": 207122, "epoch": 2495} {"train_loss": -24.42287254333496, "global_step": 207123, "epoch": 2495} {"train_loss": -24.128604888916016, "global_step": 207124, "epoch": 2495} {"train_loss": -24.147550582885742, "global_step": 207125, "epoch": 2495} {"train_loss": -24.5212459564209, "global_step": 207126, "epoch": 2495} {"train_loss": -24.78093147277832, "global_step": 207127, "epoch": 2495} {"train_loss": -24.090429306030273, "global_step": 207128, "epoch": 2495} {"train_loss": -24.469327926635742, "global_step": 207129, "epoch": 2495} {"train_loss": -24.460784912109375, "global_step": 207130, "epoch": 2495} {"train_loss": -24.52784538269043, "global_step": 207131, "epoch": 2495} {"train_loss": -24.371641159057617, "global_step": 207132, "epoch": 2495} {"train_loss": -24.219655990600586, "global_step": 207133, "epoch": 2495} {"train_loss": -24.159093856811523, "global_step": 207134, "epoch": 2495} {"train_loss": -24.56289291381836, "global_step": 207135, "epoch": 2495} {"train_loss": -24.6856632232666, "global_step": 207136, "epoch": 2495} {"train_loss": -24.311378479003906, "global_step": 207137, "epoch": 2495} {"train_loss": -24.565832138061523, "global_step": 207138, "epoch": 2495} {"train_loss": -24.477067947387695, "global_step": 207139, "epoch": 2495} {"train_loss": -24.47443199157715, "global_step": 207140, "epoch": 2495} {"train_loss": -23.909719467163086, "global_step": 207141, "epoch": 2495} {"train_loss": -24.534317016601562, "global_step": 207142, "epoch": 2495} {"train_loss": -24.339895248413086, "global_step": 207143, "epoch": 2495} {"train_loss": -24.579721450805664, "global_step": 207144, "epoch": 2495} {"train_loss": -24.51569175720215, "global_step": 207145, "epoch": 2495} {"train_loss": -24.170263290405273, "global_step": 207146, "epoch": 2495} {"train_loss": -24.189220428466797, "global_step": 207147, "epoch": 2495} {"train_loss": -24.184728622436523, "global_step": 207148, "epoch": 2495} {"train_loss": -24.18330192565918, "global_step": 207149, "epoch": 2495} {"train_loss": -24.62164878845215, "global_step": 207150, "epoch": 2495} {"train_loss": -24.594928741455078, "global_step": 207151, "epoch": 2495} {"train_loss": -24.072660446166992, "global_step": 207152, "epoch": 2495} {"train_loss": -24.380462646484375, "global_step": 207153, "epoch": 2495} {"train_loss": -24.660667419433594, "global_step": 207154, "epoch": 2495} {"train_loss": -24.468685150146484, "global_step": 207155, "epoch": 2495} {"train_loss": -24.511966705322266, "global_step": 207156, "epoch": 2495} {"train_loss": -24.43912696838379, "global_step": 207157, "epoch": 2495} {"train_loss": -24.356201171875, "global_step": 207158, "epoch": 2495} {"train_loss": -24.17047691345215, "global_step": 207159, "epoch": 2495} {"train_loss": -24.479223251342773, "global_step": 207160, "epoch": 2495} {"train_loss": -24.459272384643555, "global_step": 207161, "epoch": 2495} {"train_loss": -24.773136138916016, "global_step": 207162, "epoch": 2495} {"train_loss": -24.551965713500977, "global_step": 207163, "epoch": 2495} {"train_loss": -24.568395614624023, "global_step": 207164, "epoch": 2495} {"train_loss": -24.474393844604492, "global_step": 207165, "epoch": 2495} {"train_loss": -24.138317108154297, "global_step": 207166, "epoch": 2495} {"train_loss": -24.306394944708032, "global_step": 207167, "epoch": 2495, "val_loss": 6599486.5} {"train_loss": -23.935157775878906, "global_step": 207168, "epoch": 2496} {"train_loss": -23.49259376525879, "global_step": 207169, "epoch": 2496} {"train_loss": -23.65277099609375, "global_step": 207170, "epoch": 2496} {"train_loss": -23.8107852935791, "global_step": 207171, "epoch": 2496} {"train_loss": -23.99127197265625, "global_step": 207172, "epoch": 2496} {"train_loss": -23.675710678100586, "global_step": 207173, "epoch": 2496} {"train_loss": -24.67948341369629, "global_step": 207174, "epoch": 2496} {"train_loss": -23.85091209411621, "global_step": 207175, "epoch": 2496} {"train_loss": -24.138355255126953, "global_step": 207176, "epoch": 2496} {"train_loss": -24.085323333740234, "global_step": 207177, "epoch": 2496} {"train_loss": -24.087934494018555, "global_step": 207178, "epoch": 2496} {"train_loss": -23.701614379882812, "global_step": 207179, "epoch": 2496} {"train_loss": -24.351781845092773, "global_step": 207180, "epoch": 2496} {"train_loss": -23.970609664916992, "global_step": 207181, "epoch": 2496} {"train_loss": -24.205097198486328, "global_step": 207182, "epoch": 2496} {"train_loss": -24.092397689819336, "global_step": 207183, "epoch": 2496} {"train_loss": -24.306119918823242, "global_step": 207184, "epoch": 2496} {"train_loss": -24.243650436401367, "global_step": 207185, "epoch": 2496} {"train_loss": -24.21126937866211, "global_step": 207186, "epoch": 2496} {"train_loss": -24.471263885498047, "global_step": 207187, "epoch": 2496} {"train_loss": -24.1601619720459, "global_step": 207188, "epoch": 2496} {"train_loss": -24.07894515991211, "global_step": 207189, "epoch": 2496} {"train_loss": -24.203514099121094, "global_step": 207190, "epoch": 2496} {"train_loss": -24.337533950805664, "global_step": 207191, "epoch": 2496} {"train_loss": -24.09049415588379, "global_step": 207192, "epoch": 2496} {"train_loss": -24.187427520751953, "global_step": 207193, "epoch": 2496} {"train_loss": -24.591712951660156, "global_step": 207194, "epoch": 2496} {"train_loss": -24.555875778198242, "global_step": 207195, "epoch": 2496} {"train_loss": -24.269174575805664, "global_step": 207196, "epoch": 2496} {"train_loss": -23.89453125, "global_step": 207197, "epoch": 2496} {"train_loss": -24.543384552001953, "global_step": 207198, "epoch": 2496} {"train_loss": -23.85865592956543, "global_step": 207199, "epoch": 2496} {"train_loss": -24.179122924804688, "global_step": 207200, "epoch": 2496} {"train_loss": -24.2614688873291, "global_step": 207201, "epoch": 2496} {"train_loss": -24.429643630981445, "global_step": 207202, "epoch": 2496} {"train_loss": -24.195415496826172, "global_step": 207203, "epoch": 2496} {"train_loss": -24.21070671081543, "global_step": 207204, "epoch": 2496} {"train_loss": -24.18221664428711, "global_step": 207205, "epoch": 2496} {"train_loss": -24.321821212768555, "global_step": 207206, "epoch": 2496} {"train_loss": -24.653043746948242, "global_step": 207207, "epoch": 2496} {"train_loss": -24.316808700561523, "global_step": 207208, "epoch": 2496} {"train_loss": -24.15894889831543, "global_step": 207209, "epoch": 2496} {"train_loss": -24.29408073425293, "global_step": 207210, "epoch": 2496} {"train_loss": -24.463050842285156, "global_step": 207211, "epoch": 2496} {"train_loss": -24.46236228942871, "global_step": 207212, "epoch": 2496} {"train_loss": -24.19182777404785, "global_step": 207213, "epoch": 2496} {"train_loss": -24.077451705932617, "global_step": 207214, "epoch": 2496} {"train_loss": -24.4124698638916, "global_step": 207215, "epoch": 2496} {"train_loss": -24.954885482788086, "global_step": 207216, "epoch": 2496} {"train_loss": -24.381397247314453, "global_step": 207217, "epoch": 2496} {"train_loss": -24.557260513305664, "global_step": 207218, "epoch": 2496} {"train_loss": -24.281986236572266, "global_step": 207219, "epoch": 2496} {"train_loss": -24.38435173034668, "global_step": 207220, "epoch": 2496} {"train_loss": -24.594417572021484, "global_step": 207221, "epoch": 2496} {"train_loss": -24.157773971557617, "global_step": 207222, "epoch": 2496} {"train_loss": -24.064542770385742, "global_step": 207223, "epoch": 2496} {"train_loss": -24.21847152709961, "global_step": 207224, "epoch": 2496} {"train_loss": -24.49014663696289, "global_step": 207225, "epoch": 2496} {"train_loss": -24.048574447631836, "global_step": 207226, "epoch": 2496} {"train_loss": -24.390470504760742, "global_step": 207227, "epoch": 2496} {"train_loss": -24.248987197875977, "global_step": 207228, "epoch": 2496} {"train_loss": -24.47450065612793, "global_step": 207229, "epoch": 2496} {"train_loss": -24.32997703552246, "global_step": 207230, "epoch": 2496} {"train_loss": -24.625524520874023, "global_step": 207231, "epoch": 2496} {"train_loss": -24.662046432495117, "global_step": 207232, "epoch": 2496} {"train_loss": -24.490312576293945, "global_step": 207233, "epoch": 2496} {"train_loss": -24.761938095092773, "global_step": 207234, "epoch": 2496} {"train_loss": -24.411056518554688, "global_step": 207235, "epoch": 2496} {"train_loss": -24.26270866394043, "global_step": 207236, "epoch": 2496} {"train_loss": -24.30409049987793, "global_step": 207237, "epoch": 2496} {"train_loss": -24.615039825439453, "global_step": 207238, "epoch": 2496} {"train_loss": -24.4409122467041, "global_step": 207239, "epoch": 2496} {"train_loss": -24.357879638671875, "global_step": 207240, "epoch": 2496} {"train_loss": -24.340131759643555, "global_step": 207241, "epoch": 2496} {"train_loss": -24.910932540893555, "global_step": 207242, "epoch": 2496} {"train_loss": -24.440128326416016, "global_step": 207243, "epoch": 2496} {"train_loss": -24.803945541381836, "global_step": 207244, "epoch": 2496} {"train_loss": -24.209564208984375, "global_step": 207245, "epoch": 2496} {"train_loss": -24.23542594909668, "global_step": 207246, "epoch": 2496} {"train_loss": -24.351743698120117, "global_step": 207247, "epoch": 2496} {"train_loss": -24.70246696472168, "global_step": 207248, "epoch": 2496} {"train_loss": -24.662860870361328, "global_step": 207249, "epoch": 2496} {"train_loss": -24.278655936919062, "global_step": 207250, "epoch": 2496, "val_loss": 6701977.5} {"train_loss": -23.698183059692383, "global_step": 207251, "epoch": 2497} {"train_loss": -23.89190101623535, "global_step": 207252, "epoch": 2497} {"train_loss": -22.9543399810791, "global_step": 207253, "epoch": 2497} {"train_loss": -23.7808780670166, "global_step": 207254, "epoch": 2497} {"train_loss": -23.656360626220703, "global_step": 207255, "epoch": 2497} {"train_loss": -23.640844345092773, "global_step": 207256, "epoch": 2497} {"train_loss": -23.961233139038086, "global_step": 207257, "epoch": 2497} {"train_loss": -24.00130844116211, "global_step": 207258, "epoch": 2497} {"train_loss": -23.95098304748535, "global_step": 207259, "epoch": 2497} {"train_loss": -23.967926025390625, "global_step": 207260, "epoch": 2497} {"train_loss": -23.736425399780273, "global_step": 207261, "epoch": 2497} {"train_loss": -24.099334716796875, "global_step": 207262, "epoch": 2497} {"train_loss": -24.43155860900879, "global_step": 207263, "epoch": 2497} {"train_loss": -24.101285934448242, "global_step": 207264, "epoch": 2497} {"train_loss": -24.19504737854004, "global_step": 207265, "epoch": 2497} {"train_loss": -23.97772789001465, "global_step": 207266, "epoch": 2497} {"train_loss": -24.15581512451172, "global_step": 207267, "epoch": 2497} {"train_loss": -23.924718856811523, "global_step": 207268, "epoch": 2497} {"train_loss": -24.239151000976562, "global_step": 207269, "epoch": 2497} {"train_loss": -23.925687789916992, "global_step": 207270, "epoch": 2497} {"train_loss": -24.6892147064209, "global_step": 207271, "epoch": 2497} {"train_loss": -24.304899215698242, "global_step": 207272, "epoch": 2497} {"train_loss": -23.92799186706543, "global_step": 207273, "epoch": 2497} {"train_loss": -24.217300415039062, "global_step": 207274, "epoch": 2497} {"train_loss": -24.391376495361328, "global_step": 207275, "epoch": 2497} {"train_loss": -23.925506591796875, "global_step": 207276, "epoch": 2497} {"train_loss": -24.690860748291016, "global_step": 207277, "epoch": 2497} {"train_loss": -24.05046272277832, "global_step": 207278, "epoch": 2497} {"train_loss": -24.258132934570312, "global_step": 207279, "epoch": 2497} {"train_loss": -24.314489364624023, "global_step": 207280, "epoch": 2497} {"train_loss": -24.576093673706055, "global_step": 207281, "epoch": 2497} {"train_loss": -24.375864028930664, "global_step": 207282, "epoch": 2497} {"train_loss": -24.25434684753418, "global_step": 207283, "epoch": 2497} {"train_loss": -24.199499130249023, "global_step": 207284, "epoch": 2497} {"train_loss": -24.31195640563965, "global_step": 207285, "epoch": 2497} {"train_loss": -24.407819747924805, "global_step": 207286, "epoch": 2497} {"train_loss": -24.24458122253418, "global_step": 207287, "epoch": 2497} {"train_loss": -24.087228775024414, "global_step": 207288, "epoch": 2497} {"train_loss": -24.13467788696289, "global_step": 207289, "epoch": 2497} {"train_loss": -24.223649978637695, "global_step": 207290, "epoch": 2497} {"train_loss": -24.15326499938965, "global_step": 207291, "epoch": 2497} {"train_loss": -24.439762115478516, "global_step": 207292, "epoch": 2497} {"train_loss": -24.162019729614258, "global_step": 207293, "epoch": 2497} {"train_loss": -24.049753189086914, "global_step": 207294, "epoch": 2497} {"train_loss": -24.4002742767334, "global_step": 207295, "epoch": 2497} {"train_loss": -24.41240692138672, "global_step": 207296, "epoch": 2497} {"train_loss": -24.504653930664062, "global_step": 207297, "epoch": 2497} {"train_loss": -24.325002670288086, "global_step": 207298, "epoch": 2497} {"train_loss": -24.664621353149414, "global_step": 207299, "epoch": 2497} {"train_loss": -24.404205322265625, "global_step": 207300, "epoch": 2497} {"train_loss": -23.97890853881836, "global_step": 207301, "epoch": 2497} {"train_loss": -24.99720001220703, "global_step": 207302, "epoch": 2497} {"train_loss": -24.705053329467773, "global_step": 207303, "epoch": 2497} {"train_loss": -24.64981460571289, "global_step": 207304, "epoch": 2497} {"train_loss": -24.599271774291992, "global_step": 207305, "epoch": 2497} {"train_loss": -24.50111961364746, "global_step": 207306, "epoch": 2497} {"train_loss": -24.855642318725586, "global_step": 207307, "epoch": 2497} {"train_loss": -24.955780029296875, "global_step": 207308, "epoch": 2497} {"train_loss": -24.492666244506836, "global_step": 207309, "epoch": 2497} {"train_loss": -24.38951301574707, "global_step": 207310, "epoch": 2497} {"train_loss": -24.254348754882812, "global_step": 207311, "epoch": 2497} {"train_loss": -24.84737205505371, "global_step": 207312, "epoch": 2497} {"train_loss": -24.277379989624023, "global_step": 207313, "epoch": 2497} {"train_loss": -24.331226348876953, "global_step": 207314, "epoch": 2497} {"train_loss": -24.2462215423584, "global_step": 207315, "epoch": 2497} {"train_loss": -24.309688568115234, "global_step": 207316, "epoch": 2497} {"train_loss": -24.51642417907715, "global_step": 207317, "epoch": 2497} {"train_loss": -24.38750457763672, "global_step": 207318, "epoch": 2497} {"train_loss": -24.369155883789062, "global_step": 207319, "epoch": 2497} {"train_loss": -24.22484588623047, "global_step": 207320, "epoch": 2497} {"train_loss": -24.40396499633789, "global_step": 207321, "epoch": 2497} {"train_loss": -24.208786010742188, "global_step": 207322, "epoch": 2497} {"train_loss": -24.215192794799805, "global_step": 207323, "epoch": 2497} {"train_loss": -24.596799850463867, "global_step": 207324, "epoch": 2497} {"train_loss": -24.485076904296875, "global_step": 207325, "epoch": 2497} {"train_loss": -24.26848030090332, "global_step": 207326, "epoch": 2497} {"train_loss": -24.216398239135742, "global_step": 207327, "epoch": 2497} {"train_loss": -24.451669692993164, "global_step": 207328, "epoch": 2497} {"train_loss": -24.3681640625, "global_step": 207329, "epoch": 2497} {"train_loss": -24.284774780273438, "global_step": 207330, "epoch": 2497} {"train_loss": -24.241674423217773, "global_step": 207331, "epoch": 2497} {"train_loss": -24.06241226196289, "global_step": 207332, "epoch": 2497} {"train_loss": -24.236710490950617, "global_step": 207333, "epoch": 2497, "val_loss": 6679148.0} {"train_loss": -21.217864990234375, "global_step": 207334, "epoch": 2498} {"train_loss": -22.03644561767578, "global_step": 207335, "epoch": 2498} {"train_loss": -22.955581665039062, "global_step": 207336, "epoch": 2498} {"train_loss": -22.431774139404297, "global_step": 207337, "epoch": 2498} {"train_loss": -22.731504440307617, "global_step": 207338, "epoch": 2498} {"train_loss": -23.701452255249023, "global_step": 207339, "epoch": 2498} {"train_loss": -23.03571128845215, "global_step": 207340, "epoch": 2498} {"train_loss": -23.450510025024414, "global_step": 207341, "epoch": 2498} {"train_loss": -23.00431251525879, "global_step": 207342, "epoch": 2498} {"train_loss": -23.548110961914062, "global_step": 207343, "epoch": 2498} {"train_loss": -23.197052001953125, "global_step": 207344, "epoch": 2498} {"train_loss": -23.393413543701172, "global_step": 207345, "epoch": 2498} {"train_loss": -23.70747947692871, "global_step": 207346, "epoch": 2498} {"train_loss": -23.387622833251953, "global_step": 207347, "epoch": 2498} {"train_loss": -23.69941520690918, "global_step": 207348, "epoch": 2498} {"train_loss": -23.748279571533203, "global_step": 207349, "epoch": 2498} {"train_loss": -23.41412925720215, "global_step": 207350, "epoch": 2498} {"train_loss": -23.31048011779785, "global_step": 207351, "epoch": 2498} {"train_loss": -23.871051788330078, "global_step": 207352, "epoch": 2498} {"train_loss": -23.750181198120117, "global_step": 207353, "epoch": 2498} {"train_loss": -23.358417510986328, "global_step": 207354, "epoch": 2498} {"train_loss": -23.661380767822266, "global_step": 207355, "epoch": 2498} {"train_loss": -23.689191818237305, "global_step": 207356, "epoch": 2498} {"train_loss": -23.633264541625977, "global_step": 207357, "epoch": 2498} {"train_loss": -23.788410186767578, "global_step": 207358, "epoch": 2498} {"train_loss": -23.97310447692871, "global_step": 207359, "epoch": 2498} {"train_loss": -23.83531951904297, "global_step": 207360, "epoch": 2498} {"train_loss": -24.192066192626953, "global_step": 207361, "epoch": 2498} {"train_loss": -23.70525360107422, "global_step": 207362, "epoch": 2498} {"train_loss": -23.442602157592773, "global_step": 207363, "epoch": 2498} {"train_loss": -24.231117248535156, "global_step": 207364, "epoch": 2498} {"train_loss": -23.815824508666992, "global_step": 207365, "epoch": 2498} {"train_loss": -24.073104858398438, "global_step": 207366, "epoch": 2498} {"train_loss": -24.12754249572754, "global_step": 207367, "epoch": 2498} {"train_loss": -24.08782958984375, "global_step": 207368, "epoch": 2498} {"train_loss": -24.471776962280273, "global_step": 207369, "epoch": 2498} {"train_loss": -24.35981559753418, "global_step": 207370, "epoch": 2498} {"train_loss": -24.219608306884766, "global_step": 207371, "epoch": 2498} {"train_loss": -24.50369644165039, "global_step": 207372, "epoch": 2498} {"train_loss": -24.344745635986328, "global_step": 207373, "epoch": 2498} {"train_loss": -24.59693717956543, "global_step": 207374, "epoch": 2498} {"train_loss": -24.363828659057617, "global_step": 207375, "epoch": 2498} {"train_loss": -24.071210861206055, "global_step": 207376, "epoch": 2498} {"train_loss": -24.44074058532715, "global_step": 207377, "epoch": 2498} {"train_loss": -24.263296127319336, "global_step": 207378, "epoch": 2498} {"train_loss": -24.0775089263916, "global_step": 207379, "epoch": 2498} {"train_loss": -24.263532638549805, "global_step": 207380, "epoch": 2498} {"train_loss": -24.479665756225586, "global_step": 207381, "epoch": 2498} {"train_loss": -24.060903549194336, "global_step": 207382, "epoch": 2498} {"train_loss": -24.217992782592773, "global_step": 207383, "epoch": 2498} {"train_loss": -24.300565719604492, "global_step": 207384, "epoch": 2498} {"train_loss": -24.022476196289062, "global_step": 207385, "epoch": 2498} {"train_loss": -24.08369255065918, "global_step": 207386, "epoch": 2498} {"train_loss": -24.29019546508789, "global_step": 207387, "epoch": 2498} {"train_loss": -24.233121871948242, "global_step": 207388, "epoch": 2498} {"train_loss": -24.643295288085938, "global_step": 207389, "epoch": 2498} {"train_loss": -24.166820526123047, "global_step": 207390, "epoch": 2498} {"train_loss": -24.34575653076172, "global_step": 207391, "epoch": 2498} {"train_loss": -24.409032821655273, "global_step": 207392, "epoch": 2498} {"train_loss": -24.211334228515625, "global_step": 207393, "epoch": 2498} {"train_loss": -24.695165634155273, "global_step": 207394, "epoch": 2498} {"train_loss": -24.29083824157715, "global_step": 207395, "epoch": 2498} {"train_loss": -24.294218063354492, "global_step": 207396, "epoch": 2498} {"train_loss": -24.123828887939453, "global_step": 207397, "epoch": 2498} {"train_loss": -23.774276733398438, "global_step": 207398, "epoch": 2498} {"train_loss": -24.360815048217773, "global_step": 207399, "epoch": 2498} {"train_loss": -24.582561492919922, "global_step": 207400, "epoch": 2498} {"train_loss": -24.412702560424805, "global_step": 207401, "epoch": 2498} {"train_loss": -23.90464973449707, "global_step": 207402, "epoch": 2498} {"train_loss": -24.445310592651367, "global_step": 207403, "epoch": 2498} {"train_loss": -24.058408737182617, "global_step": 207404, "epoch": 2498} {"train_loss": -24.173648834228516, "global_step": 207405, "epoch": 2498} {"train_loss": -24.374237060546875, "global_step": 207406, "epoch": 2498} {"train_loss": -24.711999893188477, "global_step": 207407, "epoch": 2498} {"train_loss": -24.405475616455078, "global_step": 207408, "epoch": 2498} {"train_loss": -25.141103744506836, "global_step": 207409, "epoch": 2498} {"train_loss": -24.235126495361328, "global_step": 207410, "epoch": 2498} {"train_loss": -24.471742630004883, "global_step": 207411, "epoch": 2498} {"train_loss": -24.580387115478516, "global_step": 207412, "epoch": 2498} {"train_loss": -24.269926071166992, "global_step": 207413, "epoch": 2498} {"train_loss": -24.592870712280273, "global_step": 207414, "epoch": 2498} {"train_loss": -24.216869354248047, "global_step": 207415, "epoch": 2498} {"train_loss": -23.948476791381836, "global_step": 207416, "epoch": 2498, "val_loss": 6582616.0} {"train_loss": -23.988737106323242, "global_step": 207417, "epoch": 2499} {"train_loss": -23.911130905151367, "global_step": 207418, "epoch": 2499} {"train_loss": -23.521947860717773, "global_step": 207419, "epoch": 2499} {"train_loss": -24.061445236206055, "global_step": 207420, "epoch": 2499} {"train_loss": -23.772022247314453, "global_step": 207421, "epoch": 2499} {"train_loss": -23.662153244018555, "global_step": 207422, "epoch": 2499} {"train_loss": -24.03745460510254, "global_step": 207423, "epoch": 2499} {"train_loss": -23.811756134033203, "global_step": 207424, "epoch": 2499} {"train_loss": -23.91016960144043, "global_step": 207425, "epoch": 2499} {"train_loss": -23.79835319519043, "global_step": 207426, "epoch": 2499} {"train_loss": -24.061607360839844, "global_step": 207427, "epoch": 2499} {"train_loss": -23.786596298217773, "global_step": 207428, "epoch": 2499} {"train_loss": -23.93036460876465, "global_step": 207429, "epoch": 2499} {"train_loss": -23.582155227661133, "global_step": 207430, "epoch": 2499} {"train_loss": -23.712377548217773, "global_step": 207431, "epoch": 2499} {"train_loss": -24.2965087890625, "global_step": 207432, "epoch": 2499} {"train_loss": -24.1289119720459, "global_step": 207433, "epoch": 2499} {"train_loss": -23.800878524780273, "global_step": 207434, "epoch": 2499} {"train_loss": -24.087690353393555, "global_step": 207435, "epoch": 2499} {"train_loss": -24.272817611694336, "global_step": 207436, "epoch": 2499} {"train_loss": -24.328861236572266, "global_step": 207437, "epoch": 2499} {"train_loss": -24.308210372924805, "global_step": 207438, "epoch": 2499} {"train_loss": -24.33457374572754, "global_step": 207439, "epoch": 2499} {"train_loss": -24.061429977416992, "global_step": 207440, "epoch": 2499} {"train_loss": -24.201467514038086, "global_step": 207441, "epoch": 2499} {"train_loss": -24.32901382446289, "global_step": 207442, "epoch": 2499} {"train_loss": -24.522735595703125, "global_step": 207443, "epoch": 2499} {"train_loss": -24.012067794799805, "global_step": 207444, "epoch": 2499} {"train_loss": -24.079105377197266, "global_step": 207445, "epoch": 2499} {"train_loss": -24.12449073791504, "global_step": 207446, "epoch": 2499} {"train_loss": -24.367528915405273, "global_step": 207447, "epoch": 2499} {"train_loss": -24.45570945739746, "global_step": 207448, "epoch": 2499} {"train_loss": -24.024768829345703, "global_step": 207449, "epoch": 2499} {"train_loss": -24.228696823120117, "global_step": 207450, "epoch": 2499} {"train_loss": -24.31772804260254, "global_step": 207451, "epoch": 2499} {"train_loss": -24.297012329101562, "global_step": 207452, "epoch": 2499} {"train_loss": -24.535627365112305, "global_step": 207453, "epoch": 2499} {"train_loss": -24.275999069213867, "global_step": 207454, "epoch": 2499} {"train_loss": -24.341278076171875, "global_step": 207455, "epoch": 2499} {"train_loss": -24.16792106628418, "global_step": 207456, "epoch": 2499} {"train_loss": -24.60257911682129, "global_step": 207457, "epoch": 2499} {"train_loss": -24.363962173461914, "global_step": 207458, "epoch": 2499} {"train_loss": -24.28537940979004, "global_step": 207459, "epoch": 2499} {"train_loss": -24.22372817993164, "global_step": 207460, "epoch": 2499} {"train_loss": -24.496084213256836, "global_step": 207461, "epoch": 2499} {"train_loss": -24.693769454956055, "global_step": 207462, "epoch": 2499} {"train_loss": -24.20364761352539, "global_step": 207463, "epoch": 2499} {"train_loss": -24.69074821472168, "global_step": 207464, "epoch": 2499} {"train_loss": -24.439010620117188, "global_step": 207465, "epoch": 2499} {"train_loss": -24.637399673461914, "global_step": 207466, "epoch": 2499} {"train_loss": -24.5054874420166, "global_step": 207467, "epoch": 2499} {"train_loss": -24.52916717529297, "global_step": 207468, "epoch": 2499} {"train_loss": -24.53595733642578, "global_step": 207469, "epoch": 2499} {"train_loss": -24.547285079956055, "global_step": 207470, "epoch": 2499} {"train_loss": -24.508460998535156, "global_step": 207471, "epoch": 2499} {"train_loss": -24.079648971557617, "global_step": 207472, "epoch": 2499} {"train_loss": -24.101886749267578, "global_step": 207473, "epoch": 2499} {"train_loss": -23.957277297973633, "global_step": 207474, "epoch": 2499} {"train_loss": -24.065946578979492, "global_step": 207475, "epoch": 2499} {"train_loss": -24.561315536499023, "global_step": 207476, "epoch": 2499} {"train_loss": -23.985952377319336, "global_step": 207477, "epoch": 2499} {"train_loss": -24.419456481933594, "global_step": 207478, "epoch": 2499} {"train_loss": -24.572294235229492, "global_step": 207479, "epoch": 2499} {"train_loss": -24.717090606689453, "global_step": 207480, "epoch": 2499} {"train_loss": -24.112791061401367, "global_step": 207481, "epoch": 2499} {"train_loss": -24.203113555908203, "global_step": 207482, "epoch": 2499} {"train_loss": -24.496938705444336, "global_step": 207483, "epoch": 2499} {"train_loss": -24.407148361206055, "global_step": 207484, "epoch": 2499} {"train_loss": -24.349422454833984, "global_step": 207485, "epoch": 2499} {"train_loss": -24.183988571166992, "global_step": 207486, "epoch": 2499} {"train_loss": -24.72732162475586, "global_step": 207487, "epoch": 2499} {"train_loss": -24.475162506103516, "global_step": 207488, "epoch": 2499} {"train_loss": -24.36093521118164, "global_step": 207489, "epoch": 2499} {"train_loss": -24.28229331970215, "global_step": 207490, "epoch": 2499} {"train_loss": -24.1965274810791, "global_step": 207491, "epoch": 2499} {"train_loss": -24.31827735900879, "global_step": 207492, "epoch": 2499} {"train_loss": -24.134496688842773, "global_step": 207493, "epoch": 2499} {"train_loss": -24.239606857299805, "global_step": 207494, "epoch": 2499} {"train_loss": -24.592010498046875, "global_step": 207495, "epoch": 2499} {"train_loss": -24.39467430114746, "global_step": 207496, "epoch": 2499} {"train_loss": -24.5633602142334, "global_step": 207497, "epoch": 2499} {"train_loss": -24.284448623657227, "global_step": 207498, "epoch": 2499} {"train_loss": -24.24516183784209, "global_step": 207499, "epoch": 2499, "val_loss": 6680147.0} {"train_loss": -24.13302993774414, "global_step": 207500, "epoch": 2500} {"train_loss": -23.737903594970703, "global_step": 207501, "epoch": 2500} {"train_loss": -24.28364372253418, "global_step": 207502, "epoch": 2500} {"train_loss": -24.17084312438965, "global_step": 207503, "epoch": 2500} {"train_loss": -24.148168563842773, "global_step": 207504, "epoch": 2500} {"train_loss": -23.901243209838867, "global_step": 207505, "epoch": 2500} {"train_loss": -24.079158782958984, "global_step": 207506, "epoch": 2500} {"train_loss": -24.23599624633789, "global_step": 207507, "epoch": 2500} {"train_loss": -23.5821590423584, "global_step": 207508, "epoch": 2500} {"train_loss": -23.56040382385254, "global_step": 207509, "epoch": 2500} {"train_loss": -24.300296783447266, "global_step": 207510, "epoch": 2500} {"train_loss": -24.124725341796875, "global_step": 207511, "epoch": 2500} {"train_loss": -23.708194732666016, "global_step": 207512, "epoch": 2500} {"train_loss": -23.998945236206055, "global_step": 207513, "epoch": 2500} {"train_loss": -24.479013442993164, "global_step": 207514, "epoch": 2500} {"train_loss": -24.08968162536621, "global_step": 207515, "epoch": 2500} {"train_loss": -24.321386337280273, "global_step": 207516, "epoch": 2500} {"train_loss": -24.74359703063965, "global_step": 207517, "epoch": 2500} {"train_loss": -23.900436401367188, "global_step": 207518, "epoch": 2500} {"train_loss": -24.286514282226562, "global_step": 207519, "epoch": 2500} {"train_loss": -24.372465133666992, "global_step": 207520, "epoch": 2500} {"train_loss": -24.10550880432129, "global_step": 207521, "epoch": 2500} {"train_loss": -24.344196319580078, "global_step": 207522, "epoch": 2500} {"train_loss": -23.93659210205078, "global_step": 207523, "epoch": 2500} {"train_loss": -24.17026710510254, "global_step": 207524, "epoch": 2500} {"train_loss": -24.33109474182129, "global_step": 207525, "epoch": 2500} {"train_loss": -23.925247192382812, "global_step": 207526, "epoch": 2500} {"train_loss": -24.519357681274414, "global_step": 207527, "epoch": 2500} {"train_loss": -24.354833602905273, "global_step": 207528, "epoch": 2500} {"train_loss": -24.34377670288086, "global_step": 207529, "epoch": 2500} {"train_loss": -24.285322189331055, "global_step": 207530, "epoch": 2500} {"train_loss": -24.337509155273438, "global_step": 207531, "epoch": 2500} {"train_loss": -24.0743350982666, "global_step": 207532, "epoch": 2500} {"train_loss": -24.32924461364746, "global_step": 207533, "epoch": 2500} {"train_loss": -24.509191513061523, "global_step": 207534, "epoch": 2500} {"train_loss": -24.458759307861328, "global_step": 207535, "epoch": 2500} {"train_loss": -24.434415817260742, "global_step": 207536, "epoch": 2500} {"train_loss": -24.081357955932617, "global_step": 207537, "epoch": 2500} {"train_loss": -24.530942916870117, "global_step": 207538, "epoch": 2500} {"train_loss": -24.586389541625977, "global_step": 207539, "epoch": 2500} {"train_loss": -24.2510929107666, "global_step": 207540, "epoch": 2500} {"train_loss": -24.603979110717773, "global_step": 207541, "epoch": 2500} {"train_loss": -24.65285301208496, "global_step": 207542, "epoch": 2500} {"train_loss": -24.7008056640625, "global_step": 207543, "epoch": 2500} {"train_loss": -24.51541519165039, "global_step": 207544, "epoch": 2500} {"train_loss": -24.5907039642334, "global_step": 207545, "epoch": 2500} {"train_loss": -24.505741119384766, "global_step": 207546, "epoch": 2500} {"train_loss": -24.517059326171875, "global_step": 207547, "epoch": 2500} {"train_loss": -24.69308853149414, "global_step": 207548, "epoch": 2500} {"train_loss": -24.298789978027344, "global_step": 207549, "epoch": 2500} {"train_loss": -24.542251586914062, "global_step": 207550, "epoch": 2500} {"train_loss": -24.264089584350586, "global_step": 207551, "epoch": 2500} {"train_loss": -24.82501792907715, "global_step": 207552, "epoch": 2500} {"train_loss": -24.656888961791992, "global_step": 207553, "epoch": 2500} {"train_loss": -24.78192710876465, "global_step": 207554, "epoch": 2500} {"train_loss": -24.17500877380371, "global_step": 207555, "epoch": 2500} {"train_loss": -24.464597702026367, "global_step": 207556, "epoch": 2500} {"train_loss": -24.142744064331055, "global_step": 207557, "epoch": 2500} {"train_loss": -24.323209762573242, "global_step": 207558, "epoch": 2500} {"train_loss": -24.417062759399414, "global_step": 207559, "epoch": 2500} {"train_loss": -24.397071838378906, "global_step": 207560, "epoch": 2500} {"train_loss": -23.528642654418945, "global_step": 207561, "epoch": 2500} {"train_loss": -24.135086059570312, "global_step": 207562, "epoch": 2500} {"train_loss": -24.31159019470215, "global_step": 207563, "epoch": 2500} {"train_loss": -24.037689208984375, "global_step": 207564, "epoch": 2500} {"train_loss": -24.1124267578125, "global_step": 207565, "epoch": 2500} {"train_loss": -24.38100242614746, "global_step": 207566, "epoch": 2500} {"train_loss": -24.08715057373047, "global_step": 207567, "epoch": 2500} {"train_loss": -24.354501724243164, "global_step": 207568, "epoch": 2500} {"train_loss": -24.177518844604492, "global_step": 207569, "epoch": 2500} {"train_loss": -24.3746395111084, "global_step": 207570, "epoch": 2500} {"train_loss": -24.395505905151367, "global_step": 207571, "epoch": 2500} {"train_loss": -24.17960548400879, "global_step": 207572, "epoch": 2500} {"train_loss": -24.447858810424805, "global_step": 207573, "epoch": 2500} {"train_loss": -24.22959327697754, "global_step": 207574, "epoch": 2500} {"train_loss": -24.13422203063965, "global_step": 207575, "epoch": 2500} {"train_loss": -24.531957626342773, "global_step": 207576, "epoch": 2500} {"train_loss": -24.628210067749023, "global_step": 207577, "epoch": 2500} {"train_loss": -24.350488662719727, "global_step": 207578, "epoch": 2500} {"train_loss": -24.592483520507812, "global_step": 207579, "epoch": 2500} {"train_loss": -24.62505531311035, "global_step": 207580, "epoch": 2500} {"train_loss": -24.628026962280273, "global_step": 207581, "epoch": 2500} {"train_loss": -24.307326075542402, "global_step": 207582, "epoch": 2500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6413189.0} {"train_loss": -24.046018600463867, "global_step": 207583, "epoch": 2501} {"train_loss": -23.666868209838867, "global_step": 207584, "epoch": 2501} {"train_loss": -24.267370223999023, "global_step": 207585, "epoch": 2501} {"train_loss": -24.25970458984375, "global_step": 207586, "epoch": 2501} {"train_loss": -23.90260887145996, "global_step": 207587, "epoch": 2501} {"train_loss": -24.048192977905273, "global_step": 207588, "epoch": 2501} {"train_loss": -24.380970001220703, "global_step": 207589, "epoch": 2501} {"train_loss": -24.11379051208496, "global_step": 207590, "epoch": 2501} {"train_loss": -24.56546401977539, "global_step": 207591, "epoch": 2501} {"train_loss": -24.18111801147461, "global_step": 207592, "epoch": 2501} {"train_loss": -24.065670013427734, "global_step": 207593, "epoch": 2501} {"train_loss": -24.188453674316406, "global_step": 207594, "epoch": 2501} {"train_loss": -24.212650299072266, "global_step": 207595, "epoch": 2501} {"train_loss": -24.077590942382812, "global_step": 207596, "epoch": 2501} {"train_loss": -24.363693237304688, "global_step": 207597, "epoch": 2501} {"train_loss": -24.04387092590332, "global_step": 207598, "epoch": 2501} {"train_loss": -24.030319213867188, "global_step": 207599, "epoch": 2501} {"train_loss": -24.038293838500977, "global_step": 207600, "epoch": 2501} {"train_loss": -24.500722885131836, "global_step": 207601, "epoch": 2501} {"train_loss": -24.513172149658203, "global_step": 207602, "epoch": 2501} {"train_loss": -24.181594848632812, "global_step": 207603, "epoch": 2501} {"train_loss": -24.075483322143555, "global_step": 207604, "epoch": 2501} {"train_loss": -24.503026962280273, "global_step": 207605, "epoch": 2501} {"train_loss": -24.47163963317871, "global_step": 207606, "epoch": 2501} {"train_loss": -24.388086318969727, "global_step": 207607, "epoch": 2501} {"train_loss": -24.533184051513672, "global_step": 207608, "epoch": 2501} {"train_loss": -24.383792877197266, "global_step": 207609, "epoch": 2501} {"train_loss": -24.368616104125977, "global_step": 207610, "epoch": 2501} {"train_loss": -24.267688751220703, "global_step": 207611, "epoch": 2501} {"train_loss": -24.194480895996094, "global_step": 207612, "epoch": 2501} {"train_loss": -24.42868995666504, "global_step": 207613, "epoch": 2501} {"train_loss": -24.12932777404785, "global_step": 207614, "epoch": 2501} {"train_loss": -23.921241760253906, "global_step": 207615, "epoch": 2501} {"train_loss": -24.42384147644043, "global_step": 207616, "epoch": 2501} {"train_loss": -24.658954620361328, "global_step": 207617, "epoch": 2501} {"train_loss": -24.253860473632812, "global_step": 207618, "epoch": 2501} {"train_loss": -24.93811798095703, "global_step": 207619, "epoch": 2501} {"train_loss": -24.518516540527344, "global_step": 207620, "epoch": 2501} {"train_loss": -24.522687911987305, "global_step": 207621, "epoch": 2501} {"train_loss": -24.228458404541016, "global_step": 207622, "epoch": 2501} {"train_loss": -24.441831588745117, "global_step": 207623, "epoch": 2501} {"train_loss": -24.242721557617188, "global_step": 207624, "epoch": 2501} {"train_loss": -24.376359939575195, "global_step": 207625, "epoch": 2501} {"train_loss": -24.248592376708984, "global_step": 207626, "epoch": 2501} {"train_loss": -24.22757911682129, "global_step": 207627, "epoch": 2501} {"train_loss": -24.467927932739258, "global_step": 207628, "epoch": 2501} {"train_loss": -24.59178924560547, "global_step": 207629, "epoch": 2501} {"train_loss": -24.53472900390625, "global_step": 207630, "epoch": 2501} {"train_loss": -24.62233543395996, "global_step": 207631, "epoch": 2501} {"train_loss": -24.605247497558594, "global_step": 207632, "epoch": 2501} {"train_loss": -24.564014434814453, "global_step": 207633, "epoch": 2501} {"train_loss": -24.669416427612305, "global_step": 207634, "epoch": 2501} {"train_loss": -24.547216415405273, "global_step": 207635, "epoch": 2501} {"train_loss": -24.271347045898438, "global_step": 207636, "epoch": 2501} {"train_loss": -24.234907150268555, "global_step": 207637, "epoch": 2501} {"train_loss": -24.584726333618164, "global_step": 207638, "epoch": 2501} {"train_loss": -24.39813232421875, "global_step": 207639, "epoch": 2501} {"train_loss": -24.481962203979492, "global_step": 207640, "epoch": 2501} {"train_loss": -24.547517776489258, "global_step": 207641, "epoch": 2501} {"train_loss": -24.0401668548584, "global_step": 207642, "epoch": 2501} {"train_loss": -24.138395309448242, "global_step": 207643, "epoch": 2501} {"train_loss": -24.35748863220215, "global_step": 207644, "epoch": 2501} {"train_loss": -24.03266716003418, "global_step": 207645, "epoch": 2501} {"train_loss": -24.580251693725586, "global_step": 207646, "epoch": 2501} {"train_loss": -24.35892677307129, "global_step": 207647, "epoch": 2501} {"train_loss": -24.36849021911621, "global_step": 207648, "epoch": 2501} {"train_loss": -24.3139705657959, "global_step": 207649, "epoch": 2501} {"train_loss": -24.37493324279785, "global_step": 207650, "epoch": 2501} {"train_loss": -24.67779541015625, "global_step": 207651, "epoch": 2501} {"train_loss": -24.265453338623047, "global_step": 207652, "epoch": 2501} {"train_loss": -24.37155532836914, "global_step": 207653, "epoch": 2501} {"train_loss": -24.26641845703125, "global_step": 207654, "epoch": 2501} {"train_loss": -24.655424118041992, "global_step": 207655, "epoch": 2501} {"train_loss": -24.51133918762207, "global_step": 207656, "epoch": 2501} {"train_loss": -24.170019149780273, "global_step": 207657, "epoch": 2501} {"train_loss": -24.481901168823242, "global_step": 207658, "epoch": 2501} {"train_loss": -24.30531120300293, "global_step": 207659, "epoch": 2501} {"train_loss": -24.18385124206543, "global_step": 207660, "epoch": 2501} {"train_loss": -24.309053421020508, "global_step": 207661, "epoch": 2501} {"train_loss": -24.206661224365234, "global_step": 207662, "epoch": 2501} {"train_loss": -24.561382293701172, "global_step": 207663, "epoch": 2501} {"train_loss": -24.379241943359375, "global_step": 207664, "epoch": 2501} {"train_loss": -24.330558363213598, "global_step": 207665, "epoch": 2501, "val_loss": 6643704.0} {"train_loss": -23.726560592651367, "global_step": 207666, "epoch": 2502} {"train_loss": -24.044315338134766, "global_step": 207667, "epoch": 2502} {"train_loss": -23.77263832092285, "global_step": 207668, "epoch": 2502} {"train_loss": -23.947019577026367, "global_step": 207669, "epoch": 2502} {"train_loss": -23.63380241394043, "global_step": 207670, "epoch": 2502} {"train_loss": -24.0058650970459, "global_step": 207671, "epoch": 2502} {"train_loss": -24.07291030883789, "global_step": 207672, "epoch": 2502} {"train_loss": -23.96161460876465, "global_step": 207673, "epoch": 2502} {"train_loss": -24.313079833984375, "global_step": 207674, "epoch": 2502} {"train_loss": -24.025562286376953, "global_step": 207675, "epoch": 2502} {"train_loss": -24.11347007751465, "global_step": 207676, "epoch": 2502} {"train_loss": -24.298242568969727, "global_step": 207677, "epoch": 2502} {"train_loss": -24.288681030273438, "global_step": 207678, "epoch": 2502} {"train_loss": -24.6995849609375, "global_step": 207679, "epoch": 2502} {"train_loss": -24.475666046142578, "global_step": 207680, "epoch": 2502} {"train_loss": -24.569053649902344, "global_step": 207681, "epoch": 2502} {"train_loss": -24.146390914916992, "global_step": 207682, "epoch": 2502} {"train_loss": -24.184919357299805, "global_step": 207683, "epoch": 2502} {"train_loss": -24.21382713317871, "global_step": 207684, "epoch": 2502} {"train_loss": -24.420089721679688, "global_step": 207685, "epoch": 2502} {"train_loss": -24.78325843811035, "global_step": 207686, "epoch": 2502} {"train_loss": -24.728607177734375, "global_step": 207687, "epoch": 2502} {"train_loss": -24.591598510742188, "global_step": 207688, "epoch": 2502} {"train_loss": -24.248014450073242, "global_step": 207689, "epoch": 2502} {"train_loss": -24.33283805847168, "global_step": 207690, "epoch": 2502} {"train_loss": -24.50594139099121, "global_step": 207691, "epoch": 2502} {"train_loss": -24.51203727722168, "global_step": 207692, "epoch": 2502} {"train_loss": -24.51974105834961, "global_step": 207693, "epoch": 2502} {"train_loss": -24.78348159790039, "global_step": 207694, "epoch": 2502} {"train_loss": -24.49229621887207, "global_step": 207695, "epoch": 2502} {"train_loss": -24.5771541595459, "global_step": 207696, "epoch": 2502} {"train_loss": -24.061838150024414, "global_step": 207697, "epoch": 2502} {"train_loss": -24.845260620117188, "global_step": 207698, "epoch": 2502} {"train_loss": -24.75081443786621, "global_step": 207699, "epoch": 2502} {"train_loss": -24.501842498779297, "global_step": 207700, "epoch": 2502} {"train_loss": -24.444156646728516, "global_step": 207701, "epoch": 2502} {"train_loss": -24.467592239379883, "global_step": 207702, "epoch": 2502} {"train_loss": -24.453927993774414, "global_step": 207703, "epoch": 2502} {"train_loss": -24.45124626159668, "global_step": 207704, "epoch": 2502} {"train_loss": -24.726776123046875, "global_step": 207705, "epoch": 2502} {"train_loss": -24.937702178955078, "global_step": 207706, "epoch": 2502} {"train_loss": -24.378530502319336, "global_step": 207707, "epoch": 2502} {"train_loss": -24.564157485961914, "global_step": 207708, "epoch": 2502} {"train_loss": -24.161136627197266, "global_step": 207709, "epoch": 2502} {"train_loss": -24.232595443725586, "global_step": 207710, "epoch": 2502} {"train_loss": -24.77320098876953, "global_step": 207711, "epoch": 2502} {"train_loss": -24.61884880065918, "global_step": 207712, "epoch": 2502} {"train_loss": -24.42030143737793, "global_step": 207713, "epoch": 2502} {"train_loss": -24.337646484375, "global_step": 207714, "epoch": 2502} {"train_loss": -24.304458618164062, "global_step": 207715, "epoch": 2502} {"train_loss": -24.02011489868164, "global_step": 207716, "epoch": 2502} {"train_loss": -23.727190017700195, "global_step": 207717, "epoch": 2502} {"train_loss": -23.400386810302734, "global_step": 207718, "epoch": 2502} {"train_loss": -23.9449405670166, "global_step": 207719, "epoch": 2502} {"train_loss": -24.46856689453125, "global_step": 207720, "epoch": 2502} {"train_loss": -24.018497467041016, "global_step": 207721, "epoch": 2502} {"train_loss": -24.23369789123535, "global_step": 207722, "epoch": 2502} {"train_loss": -24.099435806274414, "global_step": 207723, "epoch": 2502} {"train_loss": -24.50242042541504, "global_step": 207724, "epoch": 2502} {"train_loss": -24.015295028686523, "global_step": 207725, "epoch": 2502} {"train_loss": -24.361919403076172, "global_step": 207726, "epoch": 2502} {"train_loss": -24.40140151977539, "global_step": 207727, "epoch": 2502} {"train_loss": -24.413278579711914, "global_step": 207728, "epoch": 2502} {"train_loss": -24.623300552368164, "global_step": 207729, "epoch": 2502} {"train_loss": -24.364892959594727, "global_step": 207730, "epoch": 2502} {"train_loss": -24.380449295043945, "global_step": 207731, "epoch": 2502} {"train_loss": -24.642166137695312, "global_step": 207732, "epoch": 2502} {"train_loss": -24.324718475341797, "global_step": 207733, "epoch": 2502} {"train_loss": -24.511930465698242, "global_step": 207734, "epoch": 2502} {"train_loss": -24.599502563476562, "global_step": 207735, "epoch": 2502} {"train_loss": -24.664989471435547, "global_step": 207736, "epoch": 2502} {"train_loss": -24.4398193359375, "global_step": 207737, "epoch": 2502} {"train_loss": -24.56007957458496, "global_step": 207738, "epoch": 2502} {"train_loss": -24.13111686706543, "global_step": 207739, "epoch": 2502} {"train_loss": -24.533367156982422, "global_step": 207740, "epoch": 2502} {"train_loss": -24.201292037963867, "global_step": 207741, "epoch": 2502} {"train_loss": -24.335224151611328, "global_step": 207742, "epoch": 2502} {"train_loss": -24.307239532470703, "global_step": 207743, "epoch": 2502} {"train_loss": -24.50508689880371, "global_step": 207744, "epoch": 2502} {"train_loss": -24.2897891998291, "global_step": 207745, "epoch": 2502} {"train_loss": -24.162755966186523, "global_step": 207746, "epoch": 2502} {"train_loss": -24.38921546936035, "global_step": 207747, "epoch": 2502} {"train_loss": -24.345899489988764, "global_step": 207748, "epoch": 2502, "val_loss": 6585962.0} {"train_loss": -23.0922908782959, "global_step": 207749, "epoch": 2503} {"train_loss": -23.85874366760254, "global_step": 207750, "epoch": 2503} {"train_loss": -23.670190811157227, "global_step": 207751, "epoch": 2503} {"train_loss": -23.801471710205078, "global_step": 207752, "epoch": 2503} {"train_loss": -23.7004451751709, "global_step": 207753, "epoch": 2503} {"train_loss": -23.760692596435547, "global_step": 207754, "epoch": 2503} {"train_loss": -24.002525329589844, "global_step": 207755, "epoch": 2503} {"train_loss": -23.9177188873291, "global_step": 207756, "epoch": 2503} {"train_loss": -23.972463607788086, "global_step": 207757, "epoch": 2503} {"train_loss": -24.310611724853516, "global_step": 207758, "epoch": 2503} {"train_loss": -23.81766128540039, "global_step": 207759, "epoch": 2503} {"train_loss": -23.785053253173828, "global_step": 207760, "epoch": 2503} {"train_loss": -24.10198974609375, "global_step": 207761, "epoch": 2503} {"train_loss": -24.12692642211914, "global_step": 207762, "epoch": 2503} {"train_loss": -24.142057418823242, "global_step": 207763, "epoch": 2503} {"train_loss": -23.78128433227539, "global_step": 207764, "epoch": 2503} {"train_loss": -24.19138526916504, "global_step": 207765, "epoch": 2503} {"train_loss": -24.16768455505371, "global_step": 207766, "epoch": 2503} {"train_loss": -23.821531295776367, "global_step": 207767, "epoch": 2503} {"train_loss": -24.095869064331055, "global_step": 207768, "epoch": 2503} {"train_loss": -24.04266357421875, "global_step": 207769, "epoch": 2503} {"train_loss": -24.01123046875, "global_step": 207770, "epoch": 2503} {"train_loss": -24.122737884521484, "global_step": 207771, "epoch": 2503} {"train_loss": -24.483030319213867, "global_step": 207772, "epoch": 2503} {"train_loss": -24.140588760375977, "global_step": 207773, "epoch": 2503} {"train_loss": -24.32309913635254, "global_step": 207774, "epoch": 2503} {"train_loss": -24.457868576049805, "global_step": 207775, "epoch": 2503} {"train_loss": -24.36531639099121, "global_step": 207776, "epoch": 2503} {"train_loss": -24.722248077392578, "global_step": 207777, "epoch": 2503} {"train_loss": -24.5501651763916, "global_step": 207778, "epoch": 2503} {"train_loss": -24.707416534423828, "global_step": 207779, "epoch": 2503} {"train_loss": -24.468610763549805, "global_step": 207780, "epoch": 2503} {"train_loss": -24.68140411376953, "global_step": 207781, "epoch": 2503} {"train_loss": -24.19003677368164, "global_step": 207782, "epoch": 2503} {"train_loss": -24.634489059448242, "global_step": 207783, "epoch": 2503} {"train_loss": -24.705322265625, "global_step": 207784, "epoch": 2503} {"train_loss": -24.308883666992188, "global_step": 207785, "epoch": 2503} {"train_loss": -24.273645401000977, "global_step": 207786, "epoch": 2503} {"train_loss": -24.382953643798828, "global_step": 207787, "epoch": 2503} {"train_loss": -24.21773338317871, "global_step": 207788, "epoch": 2503} {"train_loss": -24.234649658203125, "global_step": 207789, "epoch": 2503} {"train_loss": -24.30398178100586, "global_step": 207790, "epoch": 2503} {"train_loss": -24.59609603881836, "global_step": 207791, "epoch": 2503} {"train_loss": -24.261938095092773, "global_step": 207792, "epoch": 2503} {"train_loss": -24.584278106689453, "global_step": 207793, "epoch": 2503} {"train_loss": -24.389116287231445, "global_step": 207794, "epoch": 2503} {"train_loss": -24.673139572143555, "global_step": 207795, "epoch": 2503} {"train_loss": -24.137399673461914, "global_step": 207796, "epoch": 2503} {"train_loss": -24.269399642944336, "global_step": 207797, "epoch": 2503} {"train_loss": -24.39273452758789, "global_step": 207798, "epoch": 2503} {"train_loss": -24.303442001342773, "global_step": 207799, "epoch": 2503} {"train_loss": -24.6509952545166, "global_step": 207800, "epoch": 2503} {"train_loss": -24.027679443359375, "global_step": 207801, "epoch": 2503} {"train_loss": -24.411169052124023, "global_step": 207802, "epoch": 2503} {"train_loss": -24.27972412109375, "global_step": 207803, "epoch": 2503} {"train_loss": -24.1505069732666, "global_step": 207804, "epoch": 2503} {"train_loss": -24.758092880249023, "global_step": 207805, "epoch": 2503} {"train_loss": -24.445180892944336, "global_step": 207806, "epoch": 2503} {"train_loss": -24.180532455444336, "global_step": 207807, "epoch": 2503} {"train_loss": -24.696317672729492, "global_step": 207808, "epoch": 2503} {"train_loss": -24.20699119567871, "global_step": 207809, "epoch": 2503} {"train_loss": -24.280906677246094, "global_step": 207810, "epoch": 2503} {"train_loss": -24.08900260925293, "global_step": 207811, "epoch": 2503} {"train_loss": -24.433757781982422, "global_step": 207812, "epoch": 2503} {"train_loss": -24.663330078125, "global_step": 207813, "epoch": 2503} {"train_loss": -24.391271591186523, "global_step": 207814, "epoch": 2503} {"train_loss": -24.365955352783203, "global_step": 207815, "epoch": 2503} {"train_loss": -24.624906539916992, "global_step": 207816, "epoch": 2503} {"train_loss": -24.41529083251953, "global_step": 207817, "epoch": 2503} {"train_loss": -24.196269989013672, "global_step": 207818, "epoch": 2503} {"train_loss": -23.98542594909668, "global_step": 207819, "epoch": 2503} {"train_loss": -24.257583618164062, "global_step": 207820, "epoch": 2503} {"train_loss": -24.45176887512207, "global_step": 207821, "epoch": 2503} {"train_loss": -24.148380279541016, "global_step": 207822, "epoch": 2503} {"train_loss": -24.3709716796875, "global_step": 207823, "epoch": 2503} {"train_loss": -24.184629440307617, "global_step": 207824, "epoch": 2503} {"train_loss": -24.275436401367188, "global_step": 207825, "epoch": 2503} {"train_loss": -24.477264404296875, "global_step": 207826, "epoch": 2503} {"train_loss": -24.475505828857422, "global_step": 207827, "epoch": 2503} {"train_loss": -24.5384464263916, "global_step": 207828, "epoch": 2503} {"train_loss": -24.466123580932617, "global_step": 207829, "epoch": 2503} {"train_loss": -24.237897872924805, "global_step": 207830, "epoch": 2503} {"train_loss": -24.253969100584467, "global_step": 207831, "epoch": 2503, "val_loss": 6555362.0} {"train_loss": -21.44767189025879, "global_step": 207832, "epoch": 2504} {"train_loss": -23.850570678710938, "global_step": 207833, "epoch": 2504} {"train_loss": -22.602079391479492, "global_step": 207834, "epoch": 2504} {"train_loss": -23.40137481689453, "global_step": 207835, "epoch": 2504} {"train_loss": -23.399585723876953, "global_step": 207836, "epoch": 2504} {"train_loss": -23.38874626159668, "global_step": 207837, "epoch": 2504} {"train_loss": -23.628366470336914, "global_step": 207838, "epoch": 2504} {"train_loss": -23.63963508605957, "global_step": 207839, "epoch": 2504} {"train_loss": -24.295373916625977, "global_step": 207840, "epoch": 2504} {"train_loss": -24.129653930664062, "global_step": 207841, "epoch": 2504} {"train_loss": -23.680612564086914, "global_step": 207842, "epoch": 2504} {"train_loss": -24.030981063842773, "global_step": 207843, "epoch": 2504} {"train_loss": -23.724977493286133, "global_step": 207844, "epoch": 2504} {"train_loss": -23.928043365478516, "global_step": 207845, "epoch": 2504} {"train_loss": -24.024145126342773, "global_step": 207846, "epoch": 2504} {"train_loss": -23.7847900390625, "global_step": 207847, "epoch": 2504} {"train_loss": -23.850875854492188, "global_step": 207848, "epoch": 2504} {"train_loss": -24.300174713134766, "global_step": 207849, "epoch": 2504} {"train_loss": -23.81929588317871, "global_step": 207850, "epoch": 2504} {"train_loss": -24.154077529907227, "global_step": 207851, "epoch": 2504} {"train_loss": -24.51422119140625, "global_step": 207852, "epoch": 2504} {"train_loss": -24.258832931518555, "global_step": 207853, "epoch": 2504} {"train_loss": -23.973974227905273, "global_step": 207854, "epoch": 2504} {"train_loss": -24.323896408081055, "global_step": 207855, "epoch": 2504} {"train_loss": -24.427291870117188, "global_step": 207856, "epoch": 2504} {"train_loss": -24.466999053955078, "global_step": 207857, "epoch": 2504} {"train_loss": -24.366201400756836, "global_step": 207858, "epoch": 2504} {"train_loss": -23.79298973083496, "global_step": 207859, "epoch": 2504} {"train_loss": -24.160757064819336, "global_step": 207860, "epoch": 2504} {"train_loss": -24.190654754638672, "global_step": 207861, "epoch": 2504} {"train_loss": -24.4105281829834, "global_step": 207862, "epoch": 2504} {"train_loss": -24.527097702026367, "global_step": 207863, "epoch": 2504} {"train_loss": -24.147123336791992, "global_step": 207864, "epoch": 2504} {"train_loss": -24.245161056518555, "global_step": 207865, "epoch": 2504} {"train_loss": -24.355789184570312, "global_step": 207866, "epoch": 2504} {"train_loss": -24.174880981445312, "global_step": 207867, "epoch": 2504} {"train_loss": -23.911361694335938, "global_step": 207868, "epoch": 2504} {"train_loss": -24.221487045288086, "global_step": 207869, "epoch": 2504} {"train_loss": -24.450824737548828, "global_step": 207870, "epoch": 2504} {"train_loss": -24.108341217041016, "global_step": 207871, "epoch": 2504} {"train_loss": -24.34157371520996, "global_step": 207872, "epoch": 2504} {"train_loss": -24.404178619384766, "global_step": 207873, "epoch": 2504} {"train_loss": -24.462697982788086, "global_step": 207874, "epoch": 2504} {"train_loss": -24.405309677124023, "global_step": 207875, "epoch": 2504} {"train_loss": -24.396970748901367, "global_step": 207876, "epoch": 2504} {"train_loss": -24.856870651245117, "global_step": 207877, "epoch": 2504} {"train_loss": -24.620290756225586, "global_step": 207878, "epoch": 2504} {"train_loss": -24.661584854125977, "global_step": 207879, "epoch": 2504} {"train_loss": -24.462736129760742, "global_step": 207880, "epoch": 2504} {"train_loss": -24.531057357788086, "global_step": 207881, "epoch": 2504} {"train_loss": -24.594335556030273, "global_step": 207882, "epoch": 2504} {"train_loss": -24.672605514526367, "global_step": 207883, "epoch": 2504} {"train_loss": -23.982166290283203, "global_step": 207884, "epoch": 2504} {"train_loss": -24.3984375, "global_step": 207885, "epoch": 2504} {"train_loss": -24.565160751342773, "global_step": 207886, "epoch": 2504} {"train_loss": -24.400938034057617, "global_step": 207887, "epoch": 2504} {"train_loss": -24.36298942565918, "global_step": 207888, "epoch": 2504} {"train_loss": -24.735036849975586, "global_step": 207889, "epoch": 2504} {"train_loss": -24.37484359741211, "global_step": 207890, "epoch": 2504} {"train_loss": -24.344253540039062, "global_step": 207891, "epoch": 2504} {"train_loss": -24.117206573486328, "global_step": 207892, "epoch": 2504} {"train_loss": -24.860883712768555, "global_step": 207893, "epoch": 2504} {"train_loss": -24.127765655517578, "global_step": 207894, "epoch": 2504} {"train_loss": -24.254186630249023, "global_step": 207895, "epoch": 2504} {"train_loss": -24.54594612121582, "global_step": 207896, "epoch": 2504} {"train_loss": -24.1497745513916, "global_step": 207897, "epoch": 2504} {"train_loss": -24.507444381713867, "global_step": 207898, "epoch": 2504} {"train_loss": -24.667442321777344, "global_step": 207899, "epoch": 2504} {"train_loss": -24.181074142456055, "global_step": 207900, "epoch": 2504} {"train_loss": -24.045717239379883, "global_step": 207901, "epoch": 2504} {"train_loss": -24.122892379760742, "global_step": 207902, "epoch": 2504} {"train_loss": -24.25168800354004, "global_step": 207903, "epoch": 2504} {"train_loss": -24.53754997253418, "global_step": 207904, "epoch": 2504} {"train_loss": -24.23405647277832, "global_step": 207905, "epoch": 2504} {"train_loss": -24.518264770507812, "global_step": 207906, "epoch": 2504} {"train_loss": -24.60890007019043, "global_step": 207907, "epoch": 2504} {"train_loss": -24.20962142944336, "global_step": 207908, "epoch": 2504} {"train_loss": -24.05443572998047, "global_step": 207909, "epoch": 2504} {"train_loss": -24.19892692565918, "global_step": 207910, "epoch": 2504} {"train_loss": -24.454490661621094, "global_step": 207911, "epoch": 2504} {"train_loss": -24.766006469726562, "global_step": 207912, "epoch": 2504} {"train_loss": -24.5865535736084, "global_step": 207913, "epoch": 2504} {"train_loss": -24.218848377825267, "global_step": 207914, "epoch": 2504, "val_loss": 6456979.0} {"train_loss": -24.038257598876953, "global_step": 207915, "epoch": 2505} {"train_loss": -24.103330612182617, "global_step": 207916, "epoch": 2505} {"train_loss": -24.15901756286621, "global_step": 207917, "epoch": 2505} {"train_loss": -24.420303344726562, "global_step": 207918, "epoch": 2505} {"train_loss": -23.980289459228516, "global_step": 207919, "epoch": 2505} {"train_loss": -24.21634292602539, "global_step": 207920, "epoch": 2505} {"train_loss": -24.697223663330078, "global_step": 207921, "epoch": 2505} {"train_loss": -24.16706657409668, "global_step": 207922, "epoch": 2505} {"train_loss": -23.964582443237305, "global_step": 207923, "epoch": 2505} {"train_loss": -24.411985397338867, "global_step": 207924, "epoch": 2505} {"train_loss": -24.136714935302734, "global_step": 207925, "epoch": 2505} {"train_loss": -24.014562606811523, "global_step": 207926, "epoch": 2505} {"train_loss": -24.36778450012207, "global_step": 207927, "epoch": 2505} {"train_loss": -24.369478225708008, "global_step": 207928, "epoch": 2505} {"train_loss": -24.10695457458496, "global_step": 207929, "epoch": 2505} {"train_loss": -24.80376625061035, "global_step": 207930, "epoch": 2505} {"train_loss": -24.710508346557617, "global_step": 207931, "epoch": 2505} {"train_loss": -24.62074851989746, "global_step": 207932, "epoch": 2505} {"train_loss": -24.50531005859375, "global_step": 207933, "epoch": 2505} {"train_loss": -24.49799346923828, "global_step": 207934, "epoch": 2505} {"train_loss": -24.38348960876465, "global_step": 207935, "epoch": 2505} {"train_loss": -24.87521743774414, "global_step": 207936, "epoch": 2505} {"train_loss": -24.340736389160156, "global_step": 207937, "epoch": 2505} {"train_loss": -24.21988296508789, "global_step": 207938, "epoch": 2505} {"train_loss": -24.486083984375, "global_step": 207939, "epoch": 2505} {"train_loss": -24.693071365356445, "global_step": 207940, "epoch": 2505} {"train_loss": -24.43015480041504, "global_step": 207941, "epoch": 2505} {"train_loss": -24.456594467163086, "global_step": 207942, "epoch": 2505} {"train_loss": -24.593950271606445, "global_step": 207943, "epoch": 2505} {"train_loss": -24.578725814819336, "global_step": 207944, "epoch": 2505} {"train_loss": -24.160985946655273, "global_step": 207945, "epoch": 2505} {"train_loss": -24.019479751586914, "global_step": 207946, "epoch": 2505} {"train_loss": -24.193496704101562, "global_step": 207947, "epoch": 2505} {"train_loss": -24.164325714111328, "global_step": 207948, "epoch": 2505} {"train_loss": -24.65498924255371, "global_step": 207949, "epoch": 2505} {"train_loss": -24.599233627319336, "global_step": 207950, "epoch": 2505} {"train_loss": -24.557958602905273, "global_step": 207951, "epoch": 2505} {"train_loss": -24.479536056518555, "global_step": 207952, "epoch": 2505} {"train_loss": -24.11471176147461, "global_step": 207953, "epoch": 2505} {"train_loss": -24.118284225463867, "global_step": 207954, "epoch": 2505} {"train_loss": -24.815717697143555, "global_step": 207955, "epoch": 2505} {"train_loss": -24.423091888427734, "global_step": 207956, "epoch": 2505} {"train_loss": -24.29237937927246, "global_step": 207957, "epoch": 2505} {"train_loss": -24.677892684936523, "global_step": 207958, "epoch": 2505} {"train_loss": -24.7803955078125, "global_step": 207959, "epoch": 2505} {"train_loss": -24.242904663085938, "global_step": 207960, "epoch": 2505} {"train_loss": -24.855926513671875, "global_step": 207961, "epoch": 2505} {"train_loss": -24.543556213378906, "global_step": 207962, "epoch": 2505} {"train_loss": -24.65091896057129, "global_step": 207963, "epoch": 2505} {"train_loss": -24.31776237487793, "global_step": 207964, "epoch": 2505} {"train_loss": -24.870264053344727, "global_step": 207965, "epoch": 2505} {"train_loss": -24.75809097290039, "global_step": 207966, "epoch": 2505} {"train_loss": -24.65760612487793, "global_step": 207967, "epoch": 2505} {"train_loss": -24.212289810180664, "global_step": 207968, "epoch": 2505} {"train_loss": -24.468551635742188, "global_step": 207969, "epoch": 2505} {"train_loss": -24.670196533203125, "global_step": 207970, "epoch": 2505} {"train_loss": -24.4624080657959, "global_step": 207971, "epoch": 2505} {"train_loss": -24.47278594970703, "global_step": 207972, "epoch": 2505} {"train_loss": -24.20221710205078, "global_step": 207973, "epoch": 2505} {"train_loss": -24.49053955078125, "global_step": 207974, "epoch": 2505} {"train_loss": -24.6242733001709, "global_step": 207975, "epoch": 2505} {"train_loss": -24.46223258972168, "global_step": 207976, "epoch": 2505} {"train_loss": -24.562732696533203, "global_step": 207977, "epoch": 2505} {"train_loss": -24.55482292175293, "global_step": 207978, "epoch": 2505} {"train_loss": -24.252561569213867, "global_step": 207979, "epoch": 2505} {"train_loss": -24.65165901184082, "global_step": 207980, "epoch": 2505} {"train_loss": -24.633317947387695, "global_step": 207981, "epoch": 2505} {"train_loss": -24.55596351623535, "global_step": 207982, "epoch": 2505} {"train_loss": -24.77095603942871, "global_step": 207983, "epoch": 2505} {"train_loss": -24.495534896850586, "global_step": 207984, "epoch": 2505} {"train_loss": -24.641721725463867, "global_step": 207985, "epoch": 2505} {"train_loss": -24.353628158569336, "global_step": 207986, "epoch": 2505} {"train_loss": -24.350788116455078, "global_step": 207987, "epoch": 2505} {"train_loss": -24.4851016998291, "global_step": 207988, "epoch": 2505} {"train_loss": -24.6508846282959, "global_step": 207989, "epoch": 2505} {"train_loss": -25.133039474487305, "global_step": 207990, "epoch": 2505} {"train_loss": -24.163501739501953, "global_step": 207991, "epoch": 2505} {"train_loss": -24.539419174194336, "global_step": 207992, "epoch": 2505} {"train_loss": -24.431640625, "global_step": 207993, "epoch": 2505} {"train_loss": -24.582117080688477, "global_step": 207994, "epoch": 2505} {"train_loss": -24.414844512939453, "global_step": 207995, "epoch": 2505} {"train_loss": -24.357534408569336, "global_step": 207996, "epoch": 2505} {"train_loss": -24.43354257330837, "global_step": 207997, "epoch": 2505, "val_loss": 6662052.5} {"train_loss": -22.001445770263672, "global_step": 207998, "epoch": 2506} {"train_loss": -22.4776668548584, "global_step": 207999, "epoch": 2506} {"train_loss": -24.088333129882812, "global_step": 208000, "epoch": 2506} {"train_loss": -22.972148895263672, "global_step": 208001, "epoch": 2506} {"train_loss": -23.428937911987305, "global_step": 208002, "epoch": 2506} {"train_loss": -23.62769317626953, "global_step": 208003, "epoch": 2506} {"train_loss": -23.8934326171875, "global_step": 208004, "epoch": 2506} {"train_loss": -23.84810447692871, "global_step": 208005, "epoch": 2506} {"train_loss": -23.3260498046875, "global_step": 208006, "epoch": 2506} {"train_loss": -23.511404037475586, "global_step": 208007, "epoch": 2506} {"train_loss": -23.789987564086914, "global_step": 208008, "epoch": 2506} {"train_loss": -23.927139282226562, "global_step": 208009, "epoch": 2506} {"train_loss": -23.25148582458496, "global_step": 208010, "epoch": 2506} {"train_loss": -23.775861740112305, "global_step": 208011, "epoch": 2506} {"train_loss": -24.116180419921875, "global_step": 208012, "epoch": 2506} {"train_loss": -23.978391647338867, "global_step": 208013, "epoch": 2506} {"train_loss": -23.52730369567871, "global_step": 208014, "epoch": 2506} {"train_loss": -23.84689712524414, "global_step": 208015, "epoch": 2506} {"train_loss": -24.048826217651367, "global_step": 208016, "epoch": 2506} {"train_loss": -23.881458282470703, "global_step": 208017, "epoch": 2506} {"train_loss": -24.04134178161621, "global_step": 208018, "epoch": 2506} {"train_loss": -24.051227569580078, "global_step": 208019, "epoch": 2506} {"train_loss": -24.057336807250977, "global_step": 208020, "epoch": 2506} {"train_loss": -23.896072387695312, "global_step": 208021, "epoch": 2506} {"train_loss": -24.0351505279541, "global_step": 208022, "epoch": 2506} {"train_loss": -24.250593185424805, "global_step": 208023, "epoch": 2506} {"train_loss": -24.359067916870117, "global_step": 208024, "epoch": 2506} {"train_loss": -24.483726501464844, "global_step": 208025, "epoch": 2506} {"train_loss": -24.026546478271484, "global_step": 208026, "epoch": 2506} {"train_loss": -24.207809448242188, "global_step": 208027, "epoch": 2506} {"train_loss": -24.088708877563477, "global_step": 208028, "epoch": 2506} {"train_loss": -24.266815185546875, "global_step": 208029, "epoch": 2506} {"train_loss": -23.87099266052246, "global_step": 208030, "epoch": 2506} {"train_loss": -24.444150924682617, "global_step": 208031, "epoch": 2506} {"train_loss": -24.307851791381836, "global_step": 208032, "epoch": 2506} {"train_loss": -24.111576080322266, "global_step": 208033, "epoch": 2506} {"train_loss": -24.462581634521484, "global_step": 208034, "epoch": 2506} {"train_loss": -24.4360294342041, "global_step": 208035, "epoch": 2506} {"train_loss": -24.154897689819336, "global_step": 208036, "epoch": 2506} {"train_loss": -24.030622482299805, "global_step": 208037, "epoch": 2506} {"train_loss": -24.265241622924805, "global_step": 208038, "epoch": 2506} {"train_loss": -24.04347801208496, "global_step": 208039, "epoch": 2506} {"train_loss": -24.21750831604004, "global_step": 208040, "epoch": 2506} {"train_loss": -24.285266876220703, "global_step": 208041, "epoch": 2506} {"train_loss": -24.74061393737793, "global_step": 208042, "epoch": 2506} {"train_loss": -24.05324363708496, "global_step": 208043, "epoch": 2506} {"train_loss": -24.370410919189453, "global_step": 208044, "epoch": 2506} {"train_loss": -24.353118896484375, "global_step": 208045, "epoch": 2506} {"train_loss": -24.515851974487305, "global_step": 208046, "epoch": 2506} {"train_loss": -24.17915916442871, "global_step": 208047, "epoch": 2506} {"train_loss": -24.625829696655273, "global_step": 208048, "epoch": 2506} {"train_loss": -24.0236759185791, "global_step": 208049, "epoch": 2506} {"train_loss": -24.24409294128418, "global_step": 208050, "epoch": 2506} {"train_loss": -24.373388290405273, "global_step": 208051, "epoch": 2506} {"train_loss": -24.72774314880371, "global_step": 208052, "epoch": 2506} {"train_loss": -24.229352951049805, "global_step": 208053, "epoch": 2506} {"train_loss": -24.132068634033203, "global_step": 208054, "epoch": 2506} {"train_loss": -24.30364418029785, "global_step": 208055, "epoch": 2506} {"train_loss": -24.1307315826416, "global_step": 208056, "epoch": 2506} {"train_loss": -24.317201614379883, "global_step": 208057, "epoch": 2506} {"train_loss": -24.160429000854492, "global_step": 208058, "epoch": 2506} {"train_loss": -24.464508056640625, "global_step": 208059, "epoch": 2506} {"train_loss": -24.096403121948242, "global_step": 208060, "epoch": 2506} {"train_loss": -24.415246963500977, "global_step": 208061, "epoch": 2506} {"train_loss": -24.30384063720703, "global_step": 208062, "epoch": 2506} {"train_loss": -24.479345321655273, "global_step": 208063, "epoch": 2506} {"train_loss": -24.16327667236328, "global_step": 208064, "epoch": 2506} {"train_loss": -24.233762741088867, "global_step": 208065, "epoch": 2506} {"train_loss": -24.51300048828125, "global_step": 208066, "epoch": 2506} {"train_loss": -24.576757431030273, "global_step": 208067, "epoch": 2506} {"train_loss": -24.413991928100586, "global_step": 208068, "epoch": 2506} {"train_loss": -24.298917770385742, "global_step": 208069, "epoch": 2506} {"train_loss": -24.17439842224121, "global_step": 208070, "epoch": 2506} {"train_loss": -24.1040096282959, "global_step": 208071, "epoch": 2506} {"train_loss": -23.423635482788086, "global_step": 208072, "epoch": 2506} {"train_loss": -23.797801971435547, "global_step": 208073, "epoch": 2506} {"train_loss": -24.315353393554688, "global_step": 208074, "epoch": 2506} {"train_loss": -24.051660537719727, "global_step": 208075, "epoch": 2506} {"train_loss": -23.942508697509766, "global_step": 208076, "epoch": 2506} {"train_loss": -23.9926815032959, "global_step": 208077, "epoch": 2506} {"train_loss": -24.65394401550293, "global_step": 208078, "epoch": 2506} {"train_loss": -24.076980590820312, "global_step": 208079, "epoch": 2506} {"train_loss": -24.061390819319758, "global_step": 208080, "epoch": 2506, "val_loss": 6541181.5} {"train_loss": -23.901884078979492, "global_step": 208081, "epoch": 2507} {"train_loss": -23.031766891479492, "global_step": 208082, "epoch": 2507} {"train_loss": -24.028339385986328, "global_step": 208083, "epoch": 2507} {"train_loss": -23.810596466064453, "global_step": 208084, "epoch": 2507} {"train_loss": -23.117721557617188, "global_step": 208085, "epoch": 2507} {"train_loss": -24.02423667907715, "global_step": 208086, "epoch": 2507} {"train_loss": -23.17036247253418, "global_step": 208087, "epoch": 2507} {"train_loss": -23.70098304748535, "global_step": 208088, "epoch": 2507} {"train_loss": -23.835798263549805, "global_step": 208089, "epoch": 2507} {"train_loss": -23.822385787963867, "global_step": 208090, "epoch": 2507} {"train_loss": -23.94959831237793, "global_step": 208091, "epoch": 2507} {"train_loss": -23.760896682739258, "global_step": 208092, "epoch": 2507} {"train_loss": -23.98577117919922, "global_step": 208093, "epoch": 2507} {"train_loss": -24.26251983642578, "global_step": 208094, "epoch": 2507} {"train_loss": -24.098703384399414, "global_step": 208095, "epoch": 2507} {"train_loss": -24.00935173034668, "global_step": 208096, "epoch": 2507} {"train_loss": -23.862436294555664, "global_step": 208097, "epoch": 2507} {"train_loss": -24.204763412475586, "global_step": 208098, "epoch": 2507} {"train_loss": -24.566587448120117, "global_step": 208099, "epoch": 2507} {"train_loss": -23.902612686157227, "global_step": 208100, "epoch": 2507} {"train_loss": -24.337064743041992, "global_step": 208101, "epoch": 2507} {"train_loss": -24.03104591369629, "global_step": 208102, "epoch": 2507} {"train_loss": -24.4602108001709, "global_step": 208103, "epoch": 2507} {"train_loss": -24.064281463623047, "global_step": 208104, "epoch": 2507} {"train_loss": -24.257587432861328, "global_step": 208105, "epoch": 2507} {"train_loss": -24.450313568115234, "global_step": 208106, "epoch": 2507} {"train_loss": -23.990646362304688, "global_step": 208107, "epoch": 2507} {"train_loss": -24.503583908081055, "global_step": 208108, "epoch": 2507} {"train_loss": -24.401464462280273, "global_step": 208109, "epoch": 2507} {"train_loss": -24.5225887298584, "global_step": 208110, "epoch": 2507} {"train_loss": -24.457887649536133, "global_step": 208111, "epoch": 2507} {"train_loss": -24.16779899597168, "global_step": 208112, "epoch": 2507} {"train_loss": -24.429590225219727, "global_step": 208113, "epoch": 2507} {"train_loss": -24.423358917236328, "global_step": 208114, "epoch": 2507} {"train_loss": -24.375320434570312, "global_step": 208115, "epoch": 2507} {"train_loss": -24.577377319335938, "global_step": 208116, "epoch": 2507} {"train_loss": -24.23685646057129, "global_step": 208117, "epoch": 2507} {"train_loss": -24.4504451751709, "global_step": 208118, "epoch": 2507} {"train_loss": -24.422956466674805, "global_step": 208119, "epoch": 2507} {"train_loss": -24.161706924438477, "global_step": 208120, "epoch": 2507} {"train_loss": -24.70088768005371, "global_step": 208121, "epoch": 2507} {"train_loss": -24.03544044494629, "global_step": 208122, "epoch": 2507} {"train_loss": -24.299100875854492, "global_step": 208123, "epoch": 2507} {"train_loss": -24.442495346069336, "global_step": 208124, "epoch": 2507} {"train_loss": -24.397815704345703, "global_step": 208125, "epoch": 2507} {"train_loss": -24.18537712097168, "global_step": 208126, "epoch": 2507} {"train_loss": -24.495840072631836, "global_step": 208127, "epoch": 2507} {"train_loss": -24.310749053955078, "global_step": 208128, "epoch": 2507} {"train_loss": -24.1592960357666, "global_step": 208129, "epoch": 2507} {"train_loss": -24.18287467956543, "global_step": 208130, "epoch": 2507} {"train_loss": -23.985395431518555, "global_step": 208131, "epoch": 2507} {"train_loss": -24.298629760742188, "global_step": 208132, "epoch": 2507} {"train_loss": -24.472150802612305, "global_step": 208133, "epoch": 2507} {"train_loss": -23.971527099609375, "global_step": 208134, "epoch": 2507} {"train_loss": -24.00178337097168, "global_step": 208135, "epoch": 2507} {"train_loss": -24.632461547851562, "global_step": 208136, "epoch": 2507} {"train_loss": -24.267562866210938, "global_step": 208137, "epoch": 2507} {"train_loss": -23.66121482849121, "global_step": 208138, "epoch": 2507} {"train_loss": -23.612428665161133, "global_step": 208139, "epoch": 2507} {"train_loss": -24.489614486694336, "global_step": 208140, "epoch": 2507} {"train_loss": -24.07029151916504, "global_step": 208141, "epoch": 2507} {"train_loss": -24.014394760131836, "global_step": 208142, "epoch": 2507} {"train_loss": -24.51171112060547, "global_step": 208143, "epoch": 2507} {"train_loss": -24.23722267150879, "global_step": 208144, "epoch": 2507} {"train_loss": -24.355844497680664, "global_step": 208145, "epoch": 2507} {"train_loss": -24.198387145996094, "global_step": 208146, "epoch": 2507} {"train_loss": -24.413597106933594, "global_step": 208147, "epoch": 2507} {"train_loss": -24.459213256835938, "global_step": 208148, "epoch": 2507} {"train_loss": -24.067630767822266, "global_step": 208149, "epoch": 2507} {"train_loss": -24.308462142944336, "global_step": 208150, "epoch": 2507} {"train_loss": -23.990758895874023, "global_step": 208151, "epoch": 2507} {"train_loss": -24.154621124267578, "global_step": 208152, "epoch": 2507} {"train_loss": -24.454864501953125, "global_step": 208153, "epoch": 2507} {"train_loss": -24.246017456054688, "global_step": 208154, "epoch": 2507} {"train_loss": -24.184812545776367, "global_step": 208155, "epoch": 2507} {"train_loss": -24.212343215942383, "global_step": 208156, "epoch": 2507} {"train_loss": -24.541410446166992, "global_step": 208157, "epoch": 2507} {"train_loss": -24.296812057495117, "global_step": 208158, "epoch": 2507} {"train_loss": -24.595869064331055, "global_step": 208159, "epoch": 2507} {"train_loss": -24.42477798461914, "global_step": 208160, "epoch": 2507} {"train_loss": -24.26591682434082, "global_step": 208161, "epoch": 2507} {"train_loss": -24.65537452697754, "global_step": 208162, "epoch": 2507} {"train_loss": -24.19312686230763, "global_step": 208163, "epoch": 2507, "val_loss": 6702084.0} {"train_loss": -24.074522018432617, "global_step": 208164, "epoch": 2508} {"train_loss": -24.242843627929688, "global_step": 208165, "epoch": 2508} {"train_loss": -24.366039276123047, "global_step": 208166, "epoch": 2508} {"train_loss": -24.527524948120117, "global_step": 208167, "epoch": 2508} {"train_loss": -24.378005981445312, "global_step": 208168, "epoch": 2508} {"train_loss": -24.202871322631836, "global_step": 208169, "epoch": 2508} {"train_loss": -24.35713768005371, "global_step": 208170, "epoch": 2508} {"train_loss": -24.31287956237793, "global_step": 208171, "epoch": 2508} {"train_loss": -24.40677833557129, "global_step": 208172, "epoch": 2508} {"train_loss": -24.494386672973633, "global_step": 208173, "epoch": 2508} {"train_loss": -23.861358642578125, "global_step": 208174, "epoch": 2508} {"train_loss": -24.550758361816406, "global_step": 208175, "epoch": 2508} {"train_loss": -24.090911865234375, "global_step": 208176, "epoch": 2508} {"train_loss": -24.068065643310547, "global_step": 208177, "epoch": 2508} {"train_loss": -23.883573532104492, "global_step": 208178, "epoch": 2508} {"train_loss": -24.63663101196289, "global_step": 208179, "epoch": 2508} {"train_loss": -24.021886825561523, "global_step": 208180, "epoch": 2508} {"train_loss": -24.570541381835938, "global_step": 208181, "epoch": 2508} {"train_loss": -24.33929443359375, "global_step": 208182, "epoch": 2508} {"train_loss": -24.338176727294922, "global_step": 208183, "epoch": 2508} {"train_loss": -24.198896408081055, "global_step": 208184, "epoch": 2508} {"train_loss": -23.999361038208008, "global_step": 208185, "epoch": 2508} {"train_loss": -24.435394287109375, "global_step": 208186, "epoch": 2508} {"train_loss": -24.01974868774414, "global_step": 208187, "epoch": 2508} {"train_loss": -24.292034149169922, "global_step": 208188, "epoch": 2508} {"train_loss": -24.450544357299805, "global_step": 208189, "epoch": 2508} {"train_loss": -24.811532974243164, "global_step": 208190, "epoch": 2508} {"train_loss": -24.302888870239258, "global_step": 208191, "epoch": 2508} {"train_loss": -24.281057357788086, "global_step": 208192, "epoch": 2508} {"train_loss": -24.132003784179688, "global_step": 208193, "epoch": 2508} {"train_loss": -24.22828483581543, "global_step": 208194, "epoch": 2508} {"train_loss": -24.521514892578125, "global_step": 208195, "epoch": 2508} {"train_loss": -24.53513526916504, "global_step": 208196, "epoch": 2508} {"train_loss": -24.041990280151367, "global_step": 208197, "epoch": 2508} {"train_loss": -24.232515335083008, "global_step": 208198, "epoch": 2508} {"train_loss": -24.525606155395508, "global_step": 208199, "epoch": 2508} {"train_loss": -24.16613006591797, "global_step": 208200, "epoch": 2508} {"train_loss": -24.120187759399414, "global_step": 208201, "epoch": 2508} {"train_loss": -24.6683406829834, "global_step": 208202, "epoch": 2508} {"train_loss": -24.205097198486328, "global_step": 208203, "epoch": 2508} {"train_loss": -24.405731201171875, "global_step": 208204, "epoch": 2508} {"train_loss": -24.454618453979492, "global_step": 208205, "epoch": 2508} {"train_loss": -24.22603416442871, "global_step": 208206, "epoch": 2508} {"train_loss": -24.295461654663086, "global_step": 208207, "epoch": 2508} {"train_loss": -23.846975326538086, "global_step": 208208, "epoch": 2508} {"train_loss": -24.395545959472656, "global_step": 208209, "epoch": 2508} {"train_loss": -24.53207778930664, "global_step": 208210, "epoch": 2508} {"train_loss": -24.390886306762695, "global_step": 208211, "epoch": 2508} {"train_loss": -24.473051071166992, "global_step": 208212, "epoch": 2508} {"train_loss": -24.323904037475586, "global_step": 208213, "epoch": 2508} {"train_loss": -24.273603439331055, "global_step": 208214, "epoch": 2508} {"train_loss": -24.697973251342773, "global_step": 208215, "epoch": 2508} {"train_loss": -24.500110626220703, "global_step": 208216, "epoch": 2508} {"train_loss": -24.602407455444336, "global_step": 208217, "epoch": 2508} {"train_loss": -24.182836532592773, "global_step": 208218, "epoch": 2508} {"train_loss": -24.451101303100586, "global_step": 208219, "epoch": 2508} {"train_loss": -24.523048400878906, "global_step": 208220, "epoch": 2508} {"train_loss": -24.253305435180664, "global_step": 208221, "epoch": 2508} {"train_loss": -24.392333984375, "global_step": 208222, "epoch": 2508} {"train_loss": -24.457242965698242, "global_step": 208223, "epoch": 2508} {"train_loss": -24.46871566772461, "global_step": 208224, "epoch": 2508} {"train_loss": -24.586566925048828, "global_step": 208225, "epoch": 2508} {"train_loss": -24.373390197753906, "global_step": 208226, "epoch": 2508} {"train_loss": -24.21228790283203, "global_step": 208227, "epoch": 2508} {"train_loss": -24.364776611328125, "global_step": 208228, "epoch": 2508} {"train_loss": -24.562946319580078, "global_step": 208229, "epoch": 2508} {"train_loss": -24.560043334960938, "global_step": 208230, "epoch": 2508} {"train_loss": -24.411909103393555, "global_step": 208231, "epoch": 2508} {"train_loss": -24.650999069213867, "global_step": 208232, "epoch": 2508} {"train_loss": -24.58070945739746, "global_step": 208233, "epoch": 2508} {"train_loss": -24.538724899291992, "global_step": 208234, "epoch": 2508} {"train_loss": -24.007328033447266, "global_step": 208235, "epoch": 2508} {"train_loss": -24.314056396484375, "global_step": 208236, "epoch": 2508} {"train_loss": -24.157934188842773, "global_step": 208237, "epoch": 2508} {"train_loss": -24.40185546875, "global_step": 208238, "epoch": 2508} {"train_loss": -24.9652042388916, "global_step": 208239, "epoch": 2508} {"train_loss": -24.228782653808594, "global_step": 208240, "epoch": 2508} {"train_loss": -24.185632705688477, "global_step": 208241, "epoch": 2508} {"train_loss": -24.127700805664062, "global_step": 208242, "epoch": 2508} {"train_loss": -24.401662826538086, "global_step": 208243, "epoch": 2508} {"train_loss": -23.797805786132812, "global_step": 208244, "epoch": 2508} {"train_loss": -24.31352996826172, "global_step": 208245, "epoch": 2508} {"train_loss": -24.33970713328166, "global_step": 208246, "epoch": 2508, "val_loss": 6680641.0} {"train_loss": -23.16245460510254, "global_step": 208247, "epoch": 2509} {"train_loss": -23.276260375976562, "global_step": 208248, "epoch": 2509} {"train_loss": -23.67409324645996, "global_step": 208249, "epoch": 2509} {"train_loss": -23.709890365600586, "global_step": 208250, "epoch": 2509} {"train_loss": -23.291282653808594, "global_step": 208251, "epoch": 2509} {"train_loss": -23.621484756469727, "global_step": 208252, "epoch": 2509} {"train_loss": -23.774442672729492, "global_step": 208253, "epoch": 2509} {"train_loss": -23.671674728393555, "global_step": 208254, "epoch": 2509} {"train_loss": -23.701196670532227, "global_step": 208255, "epoch": 2509} {"train_loss": -24.109235763549805, "global_step": 208256, "epoch": 2509} {"train_loss": -23.929656982421875, "global_step": 208257, "epoch": 2509} {"train_loss": -23.611440658569336, "global_step": 208258, "epoch": 2509} {"train_loss": -23.776641845703125, "global_step": 208259, "epoch": 2509} {"train_loss": -24.155332565307617, "global_step": 208260, "epoch": 2509} {"train_loss": -24.055356979370117, "global_step": 208261, "epoch": 2509} {"train_loss": -24.10857582092285, "global_step": 208262, "epoch": 2509} {"train_loss": -23.863525390625, "global_step": 208263, "epoch": 2509} {"train_loss": -23.980449676513672, "global_step": 208264, "epoch": 2509} {"train_loss": -24.310903549194336, "global_step": 208265, "epoch": 2509} {"train_loss": -24.235092163085938, "global_step": 208266, "epoch": 2509} {"train_loss": -24.257837295532227, "global_step": 208267, "epoch": 2509} {"train_loss": -23.87122917175293, "global_step": 208268, "epoch": 2509} {"train_loss": -24.445560455322266, "global_step": 208269, "epoch": 2509} {"train_loss": -24.328367233276367, "global_step": 208270, "epoch": 2509} {"train_loss": -24.33646011352539, "global_step": 208271, "epoch": 2509} {"train_loss": -24.23250389099121, "global_step": 208272, "epoch": 2509} {"train_loss": -24.306737899780273, "global_step": 208273, "epoch": 2509} {"train_loss": -24.617088317871094, "global_step": 208274, "epoch": 2509} {"train_loss": -24.509796142578125, "global_step": 208275, "epoch": 2509} {"train_loss": -24.476713180541992, "global_step": 208276, "epoch": 2509} {"train_loss": -24.371658325195312, "global_step": 208277, "epoch": 2509} {"train_loss": -24.184293746948242, "global_step": 208278, "epoch": 2509} {"train_loss": -24.19490623474121, "global_step": 208279, "epoch": 2509} {"train_loss": -24.425601959228516, "global_step": 208280, "epoch": 2509} {"train_loss": -24.473875045776367, "global_step": 208281, "epoch": 2509} {"train_loss": -24.174726486206055, "global_step": 208282, "epoch": 2509} {"train_loss": -24.579021453857422, "global_step": 208283, "epoch": 2509} {"train_loss": -24.62453269958496, "global_step": 208284, "epoch": 2509} {"train_loss": -24.774499893188477, "global_step": 208285, "epoch": 2509} {"train_loss": -24.385129928588867, "global_step": 208286, "epoch": 2509} {"train_loss": -23.944522857666016, "global_step": 208287, "epoch": 2509} {"train_loss": -24.166975021362305, "global_step": 208288, "epoch": 2509} {"train_loss": -24.377166748046875, "global_step": 208289, "epoch": 2509} {"train_loss": -24.385101318359375, "global_step": 208290, "epoch": 2509} {"train_loss": -24.004657745361328, "global_step": 208291, "epoch": 2509} {"train_loss": -24.4410400390625, "global_step": 208292, "epoch": 2509} {"train_loss": -24.35986328125, "global_step": 208293, "epoch": 2509} {"train_loss": -24.919986724853516, "global_step": 208294, "epoch": 2509} {"train_loss": -24.551349639892578, "global_step": 208295, "epoch": 2509} {"train_loss": -24.495817184448242, "global_step": 208296, "epoch": 2509} {"train_loss": -24.194364547729492, "global_step": 208297, "epoch": 2509} {"train_loss": -24.554168701171875, "global_step": 208298, "epoch": 2509} {"train_loss": -24.441255569458008, "global_step": 208299, "epoch": 2509} {"train_loss": -24.368408203125, "global_step": 208300, "epoch": 2509} {"train_loss": -24.01007652282715, "global_step": 208301, "epoch": 2509} {"train_loss": -24.56315040588379, "global_step": 208302, "epoch": 2509} {"train_loss": -23.97125816345215, "global_step": 208303, "epoch": 2509} {"train_loss": -24.179914474487305, "global_step": 208304, "epoch": 2509} {"train_loss": -24.33547019958496, "global_step": 208305, "epoch": 2509} {"train_loss": -23.961978912353516, "global_step": 208306, "epoch": 2509} {"train_loss": -24.385215759277344, "global_step": 208307, "epoch": 2509} {"train_loss": -24.575197219848633, "global_step": 208308, "epoch": 2509} {"train_loss": -24.35439109802246, "global_step": 208309, "epoch": 2509} {"train_loss": -24.221487045288086, "global_step": 208310, "epoch": 2509} {"train_loss": -24.64691162109375, "global_step": 208311, "epoch": 2509} {"train_loss": -24.470306396484375, "global_step": 208312, "epoch": 2509} {"train_loss": -24.445215225219727, "global_step": 208313, "epoch": 2509} {"train_loss": -24.735260009765625, "global_step": 208314, "epoch": 2509} {"train_loss": -24.185312271118164, "global_step": 208315, "epoch": 2509} {"train_loss": -24.651412963867188, "global_step": 208316, "epoch": 2509} {"train_loss": -24.225141525268555, "global_step": 208317, "epoch": 2509} {"train_loss": -24.258987426757812, "global_step": 208318, "epoch": 2509} {"train_loss": -24.527259826660156, "global_step": 208319, "epoch": 2509} {"train_loss": -24.267597198486328, "global_step": 208320, "epoch": 2509} {"train_loss": -24.605314254760742, "global_step": 208321, "epoch": 2509} {"train_loss": -24.165565490722656, "global_step": 208322, "epoch": 2509} {"train_loss": -24.448280334472656, "global_step": 208323, "epoch": 2509} {"train_loss": -24.37555503845215, "global_step": 208324, "epoch": 2509} {"train_loss": -24.754867553710938, "global_step": 208325, "epoch": 2509} {"train_loss": -24.418806076049805, "global_step": 208326, "epoch": 2509} {"train_loss": -24.5968017578125, "global_step": 208327, "epoch": 2509} {"train_loss": -24.484865188598633, "global_step": 208328, "epoch": 2509} {"train_loss": -24.215914599866753, "global_step": 208329, "epoch": 2509, "val_loss": 6657365.0} {"train_loss": -24.139738082885742, "global_step": 208330, "epoch": 2510} {"train_loss": -23.66066551208496, "global_step": 208331, "epoch": 2510} {"train_loss": -23.901586532592773, "global_step": 208332, "epoch": 2510} {"train_loss": -24.61312484741211, "global_step": 208333, "epoch": 2510} {"train_loss": -23.68195152282715, "global_step": 208334, "epoch": 2510} {"train_loss": -23.84903335571289, "global_step": 208335, "epoch": 2510} {"train_loss": -24.339242935180664, "global_step": 208336, "epoch": 2510} {"train_loss": -23.867691040039062, "global_step": 208337, "epoch": 2510} {"train_loss": -24.270954132080078, "global_step": 208338, "epoch": 2510} {"train_loss": -24.508573532104492, "global_step": 208339, "epoch": 2510} {"train_loss": -23.793323516845703, "global_step": 208340, "epoch": 2510} {"train_loss": -24.069141387939453, "global_step": 208341, "epoch": 2510} {"train_loss": -24.18586540222168, "global_step": 208342, "epoch": 2510} {"train_loss": -23.837358474731445, "global_step": 208343, "epoch": 2510} {"train_loss": -24.116037368774414, "global_step": 208344, "epoch": 2510} {"train_loss": -24.56757926940918, "global_step": 208345, "epoch": 2510} {"train_loss": -24.144201278686523, "global_step": 208346, "epoch": 2510} {"train_loss": -24.781293869018555, "global_step": 208347, "epoch": 2510} {"train_loss": -24.2965030670166, "global_step": 208348, "epoch": 2510} {"train_loss": -24.105091094970703, "global_step": 208349, "epoch": 2510} {"train_loss": -24.235492706298828, "global_step": 208350, "epoch": 2510} {"train_loss": -24.256820678710938, "global_step": 208351, "epoch": 2510} {"train_loss": -24.802854537963867, "global_step": 208352, "epoch": 2510} {"train_loss": -24.295101165771484, "global_step": 208353, "epoch": 2510} {"train_loss": -24.44398307800293, "global_step": 208354, "epoch": 2510} {"train_loss": -24.261777877807617, "global_step": 208355, "epoch": 2510} {"train_loss": -24.42364501953125, "global_step": 208356, "epoch": 2510} {"train_loss": -24.407886505126953, "global_step": 208357, "epoch": 2510} {"train_loss": -24.471389770507812, "global_step": 208358, "epoch": 2510} {"train_loss": -24.294662475585938, "global_step": 208359, "epoch": 2510} {"train_loss": -24.743803024291992, "global_step": 208360, "epoch": 2510} {"train_loss": -24.267837524414062, "global_step": 208361, "epoch": 2510} {"train_loss": -24.72417449951172, "global_step": 208362, "epoch": 2510} {"train_loss": -24.495840072631836, "global_step": 208363, "epoch": 2510} {"train_loss": -24.6993465423584, "global_step": 208364, "epoch": 2510} {"train_loss": -24.57980728149414, "global_step": 208365, "epoch": 2510} {"train_loss": -24.620798110961914, "global_step": 208366, "epoch": 2510} {"train_loss": -24.333484649658203, "global_step": 208367, "epoch": 2510} {"train_loss": -24.470203399658203, "global_step": 208368, "epoch": 2510} {"train_loss": -24.47014617919922, "global_step": 208369, "epoch": 2510} {"train_loss": -24.798784255981445, "global_step": 208370, "epoch": 2510} {"train_loss": -24.55868911743164, "global_step": 208371, "epoch": 2510} {"train_loss": -24.259939193725586, "global_step": 208372, "epoch": 2510} {"train_loss": -24.828773498535156, "global_step": 208373, "epoch": 2510} {"train_loss": -24.209959030151367, "global_step": 208374, "epoch": 2510} {"train_loss": -24.379932403564453, "global_step": 208375, "epoch": 2510} {"train_loss": -24.357097625732422, "global_step": 208376, "epoch": 2510} {"train_loss": -24.295339584350586, "global_step": 208377, "epoch": 2510} {"train_loss": -24.65535545349121, "global_step": 208378, "epoch": 2510} {"train_loss": -24.324033737182617, "global_step": 208379, "epoch": 2510} {"train_loss": -24.521577835083008, "global_step": 208380, "epoch": 2510} {"train_loss": -24.756561279296875, "global_step": 208381, "epoch": 2510} {"train_loss": -24.390287399291992, "global_step": 208382, "epoch": 2510} {"train_loss": -24.526264190673828, "global_step": 208383, "epoch": 2510} {"train_loss": -24.31959342956543, "global_step": 208384, "epoch": 2510} {"train_loss": -24.390954971313477, "global_step": 208385, "epoch": 2510} {"train_loss": -24.495067596435547, "global_step": 208386, "epoch": 2510} {"train_loss": -24.493270874023438, "global_step": 208387, "epoch": 2510} {"train_loss": -24.64445686340332, "global_step": 208388, "epoch": 2510} {"train_loss": -24.447509765625, "global_step": 208389, "epoch": 2510} {"train_loss": -24.196622848510742, "global_step": 208390, "epoch": 2510} {"train_loss": -24.444021224975586, "global_step": 208391, "epoch": 2510} {"train_loss": -24.362533569335938, "global_step": 208392, "epoch": 2510} {"train_loss": -24.75217628479004, "global_step": 208393, "epoch": 2510} {"train_loss": -24.562808990478516, "global_step": 208394, "epoch": 2510} {"train_loss": -24.10463523864746, "global_step": 208395, "epoch": 2510} {"train_loss": -23.74667739868164, "global_step": 208396, "epoch": 2510} {"train_loss": -23.808841705322266, "global_step": 208397, "epoch": 2510} {"train_loss": -24.42266845703125, "global_step": 208398, "epoch": 2510} {"train_loss": -24.288171768188477, "global_step": 208399, "epoch": 2510} {"train_loss": -24.048442840576172, "global_step": 208400, "epoch": 2510} {"train_loss": -24.045530319213867, "global_step": 208401, "epoch": 2510} {"train_loss": -24.170751571655273, "global_step": 208402, "epoch": 2510} {"train_loss": -24.16046714782715, "global_step": 208403, "epoch": 2510} {"train_loss": -23.98692512512207, "global_step": 208404, "epoch": 2510} {"train_loss": -23.59126091003418, "global_step": 208405, "epoch": 2510} {"train_loss": -24.335954666137695, "global_step": 208406, "epoch": 2510} {"train_loss": -24.471837997436523, "global_step": 208407, "epoch": 2510} {"train_loss": -24.23356056213379, "global_step": 208408, "epoch": 2510} {"train_loss": -24.583200454711914, "global_step": 208409, "epoch": 2510} {"train_loss": -23.97150993347168, "global_step": 208410, "epoch": 2510} {"train_loss": -24.3347225189209, "global_step": 208411, "epoch": 2510} {"train_loss": -24.328746198171594, "global_step": 208412, "epoch": 2510, "val_loss": 6615030.0} {"train_loss": -23.74616241455078, "global_step": 208413, "epoch": 2511} {"train_loss": -23.923057556152344, "global_step": 208414, "epoch": 2511} {"train_loss": -24.057636260986328, "global_step": 208415, "epoch": 2511} {"train_loss": -24.038482666015625, "global_step": 208416, "epoch": 2511} {"train_loss": -23.837026596069336, "global_step": 208417, "epoch": 2511} {"train_loss": -23.907621383666992, "global_step": 208418, "epoch": 2511} {"train_loss": -23.750423431396484, "global_step": 208419, "epoch": 2511} {"train_loss": -24.166810989379883, "global_step": 208420, "epoch": 2511} {"train_loss": -24.485700607299805, "global_step": 208421, "epoch": 2511} {"train_loss": -23.85060691833496, "global_step": 208422, "epoch": 2511} {"train_loss": -24.055164337158203, "global_step": 208423, "epoch": 2511} {"train_loss": -24.445056915283203, "global_step": 208424, "epoch": 2511} {"train_loss": -24.067068099975586, "global_step": 208425, "epoch": 2511} {"train_loss": -24.615049362182617, "global_step": 208426, "epoch": 2511} {"train_loss": -24.214759826660156, "global_step": 208427, "epoch": 2511} {"train_loss": -23.96868324279785, "global_step": 208428, "epoch": 2511} {"train_loss": -24.66364860534668, "global_step": 208429, "epoch": 2511} {"train_loss": -24.40695571899414, "global_step": 208430, "epoch": 2511} {"train_loss": -24.36203384399414, "global_step": 208431, "epoch": 2511} {"train_loss": -24.440872192382812, "global_step": 208432, "epoch": 2511} {"train_loss": -24.68218421936035, "global_step": 208433, "epoch": 2511} {"train_loss": -24.068246841430664, "global_step": 208434, "epoch": 2511} {"train_loss": -24.919034957885742, "global_step": 208435, "epoch": 2511} {"train_loss": -24.4768009185791, "global_step": 208436, "epoch": 2511} {"train_loss": -24.464624404907227, "global_step": 208437, "epoch": 2511} {"train_loss": -24.150259017944336, "global_step": 208438, "epoch": 2511} {"train_loss": -24.392446517944336, "global_step": 208439, "epoch": 2511} {"train_loss": -24.486572265625, "global_step": 208440, "epoch": 2511} {"train_loss": -24.337491989135742, "global_step": 208441, "epoch": 2511} {"train_loss": -24.642621994018555, "global_step": 208442, "epoch": 2511} {"train_loss": -24.31515884399414, "global_step": 208443, "epoch": 2511} {"train_loss": -24.57790756225586, "global_step": 208444, "epoch": 2511} {"train_loss": -24.065340042114258, "global_step": 208445, "epoch": 2511} {"train_loss": -24.47715187072754, "global_step": 208446, "epoch": 2511} {"train_loss": -24.2794246673584, "global_step": 208447, "epoch": 2511} {"train_loss": -24.223690032958984, "global_step": 208448, "epoch": 2511} {"train_loss": -24.0312557220459, "global_step": 208449, "epoch": 2511} {"train_loss": -23.991785049438477, "global_step": 208450, "epoch": 2511} {"train_loss": -24.312034606933594, "global_step": 208451, "epoch": 2511} {"train_loss": -24.495563507080078, "global_step": 208452, "epoch": 2511} {"train_loss": -24.675689697265625, "global_step": 208453, "epoch": 2511} {"train_loss": -24.39717674255371, "global_step": 208454, "epoch": 2511} {"train_loss": -24.184547424316406, "global_step": 208455, "epoch": 2511} {"train_loss": -24.34571647644043, "global_step": 208456, "epoch": 2511} {"train_loss": -24.372989654541016, "global_step": 208457, "epoch": 2511} {"train_loss": -24.206212997436523, "global_step": 208458, "epoch": 2511} {"train_loss": -24.321380615234375, "global_step": 208459, "epoch": 2511} {"train_loss": -24.47100830078125, "global_step": 208460, "epoch": 2511} {"train_loss": -24.3455867767334, "global_step": 208461, "epoch": 2511} {"train_loss": -24.161794662475586, "global_step": 208462, "epoch": 2511} {"train_loss": -24.35100746154785, "global_step": 208463, "epoch": 2511} {"train_loss": -24.20758819580078, "global_step": 208464, "epoch": 2511} {"train_loss": -24.168142318725586, "global_step": 208465, "epoch": 2511} {"train_loss": -24.36307716369629, "global_step": 208466, "epoch": 2511} {"train_loss": -24.673847198486328, "global_step": 208467, "epoch": 2511} {"train_loss": -24.293432235717773, "global_step": 208468, "epoch": 2511} {"train_loss": -24.455841064453125, "global_step": 208469, "epoch": 2511} {"train_loss": -24.592975616455078, "global_step": 208470, "epoch": 2511} {"train_loss": -24.41511344909668, "global_step": 208471, "epoch": 2511} {"train_loss": -24.47043228149414, "global_step": 208472, "epoch": 2511} {"train_loss": -24.522239685058594, "global_step": 208473, "epoch": 2511} {"train_loss": -24.618915557861328, "global_step": 208474, "epoch": 2511} {"train_loss": -24.454118728637695, "global_step": 208475, "epoch": 2511} {"train_loss": -24.46608543395996, "global_step": 208476, "epoch": 2511} {"train_loss": -24.558385848999023, "global_step": 208477, "epoch": 2511} {"train_loss": -24.480422973632812, "global_step": 208478, "epoch": 2511} {"train_loss": -24.12484359741211, "global_step": 208479, "epoch": 2511} {"train_loss": -24.439071655273438, "global_step": 208480, "epoch": 2511} {"train_loss": -24.066028594970703, "global_step": 208481, "epoch": 2511} {"train_loss": -24.491039276123047, "global_step": 208482, "epoch": 2511} {"train_loss": -24.751829147338867, "global_step": 208483, "epoch": 2511} {"train_loss": -24.14271354675293, "global_step": 208484, "epoch": 2511} {"train_loss": -24.55630874633789, "global_step": 208485, "epoch": 2511} {"train_loss": -24.678268432617188, "global_step": 208486, "epoch": 2511} {"train_loss": -24.398893356323242, "global_step": 208487, "epoch": 2511} {"train_loss": -24.34811019897461, "global_step": 208488, "epoch": 2511} {"train_loss": -24.035402297973633, "global_step": 208489, "epoch": 2511} {"train_loss": -24.19556427001953, "global_step": 208490, "epoch": 2511} {"train_loss": -24.218290328979492, "global_step": 208491, "epoch": 2511} {"train_loss": -23.869403839111328, "global_step": 208492, "epoch": 2511} {"train_loss": -23.632291793823242, "global_step": 208493, "epoch": 2511} {"train_loss": -24.385618209838867, "global_step": 208494, "epoch": 2511} {"train_loss": -24.31900808035609, "global_step": 208495, "epoch": 2511, "val_loss": 6513341.0} {"train_loss": -23.891355514526367, "global_step": 208496, "epoch": 2512} {"train_loss": -23.780719757080078, "global_step": 208497, "epoch": 2512} {"train_loss": -24.20136070251465, "global_step": 208498, "epoch": 2512} {"train_loss": -23.717029571533203, "global_step": 208499, "epoch": 2512} {"train_loss": -23.931005477905273, "global_step": 208500, "epoch": 2512} {"train_loss": -24.08062171936035, "global_step": 208501, "epoch": 2512} {"train_loss": -23.651992797851562, "global_step": 208502, "epoch": 2512} {"train_loss": -23.769559860229492, "global_step": 208503, "epoch": 2512} {"train_loss": -23.676050186157227, "global_step": 208504, "epoch": 2512} {"train_loss": -23.869749069213867, "global_step": 208505, "epoch": 2512} {"train_loss": -23.50916862487793, "global_step": 208506, "epoch": 2512} {"train_loss": -24.252742767333984, "global_step": 208507, "epoch": 2512} {"train_loss": -23.961618423461914, "global_step": 208508, "epoch": 2512} {"train_loss": -23.799924850463867, "global_step": 208509, "epoch": 2512} {"train_loss": -24.348464965820312, "global_step": 208510, "epoch": 2512} {"train_loss": -23.850427627563477, "global_step": 208511, "epoch": 2512} {"train_loss": -24.14704132080078, "global_step": 208512, "epoch": 2512} {"train_loss": -23.683700561523438, "global_step": 208513, "epoch": 2512} {"train_loss": -24.23863983154297, "global_step": 208514, "epoch": 2512} {"train_loss": -24.218427658081055, "global_step": 208515, "epoch": 2512} {"train_loss": -24.324474334716797, "global_step": 208516, "epoch": 2512} {"train_loss": -24.214101791381836, "global_step": 208517, "epoch": 2512} {"train_loss": -24.164447784423828, "global_step": 208518, "epoch": 2512} {"train_loss": -24.299795150756836, "global_step": 208519, "epoch": 2512} {"train_loss": -24.2574462890625, "global_step": 208520, "epoch": 2512} {"train_loss": -24.159204483032227, "global_step": 208521, "epoch": 2512} {"train_loss": -24.380239486694336, "global_step": 208522, "epoch": 2512} {"train_loss": -24.2583065032959, "global_step": 208523, "epoch": 2512} {"train_loss": -24.539640426635742, "global_step": 208524, "epoch": 2512} {"train_loss": -24.465744018554688, "global_step": 208525, "epoch": 2512} {"train_loss": -24.426660537719727, "global_step": 208526, "epoch": 2512} {"train_loss": -24.024274826049805, "global_step": 208527, "epoch": 2512} {"train_loss": -24.24151039123535, "global_step": 208528, "epoch": 2512} {"train_loss": -24.690404891967773, "global_step": 208529, "epoch": 2512} {"train_loss": -24.451704025268555, "global_step": 208530, "epoch": 2512} {"train_loss": -24.281320571899414, "global_step": 208531, "epoch": 2512} {"train_loss": -24.61100196838379, "global_step": 208532, "epoch": 2512} {"train_loss": -24.152856826782227, "global_step": 208533, "epoch": 2512} {"train_loss": -24.642202377319336, "global_step": 208534, "epoch": 2512} {"train_loss": -24.40958595275879, "global_step": 208535, "epoch": 2512} {"train_loss": -24.571670532226562, "global_step": 208536, "epoch": 2512} {"train_loss": -24.391799926757812, "global_step": 208537, "epoch": 2512} {"train_loss": -24.54705047607422, "global_step": 208538, "epoch": 2512} {"train_loss": -24.470783233642578, "global_step": 208539, "epoch": 2512} {"train_loss": -24.535186767578125, "global_step": 208540, "epoch": 2512} {"train_loss": -24.50630760192871, "global_step": 208541, "epoch": 2512} {"train_loss": -24.594989776611328, "global_step": 208542, "epoch": 2512} {"train_loss": -24.246091842651367, "global_step": 208543, "epoch": 2512} {"train_loss": -24.727087020874023, "global_step": 208544, "epoch": 2512} {"train_loss": -24.437685012817383, "global_step": 208545, "epoch": 2512} {"train_loss": -24.280941009521484, "global_step": 208546, "epoch": 2512} {"train_loss": -24.70020866394043, "global_step": 208547, "epoch": 2512} {"train_loss": -24.21744155883789, "global_step": 208548, "epoch": 2512} {"train_loss": -24.500839233398438, "global_step": 208549, "epoch": 2512} {"train_loss": -24.557363510131836, "global_step": 208550, "epoch": 2512} {"train_loss": -24.623416900634766, "global_step": 208551, "epoch": 2512} {"train_loss": -24.50735855102539, "global_step": 208552, "epoch": 2512} {"train_loss": -24.19135093688965, "global_step": 208553, "epoch": 2512} {"train_loss": -24.42960548400879, "global_step": 208554, "epoch": 2512} {"train_loss": -24.2283878326416, "global_step": 208555, "epoch": 2512} {"train_loss": -24.526885986328125, "global_step": 208556, "epoch": 2512} {"train_loss": -24.76017951965332, "global_step": 208557, "epoch": 2512} {"train_loss": -24.417125701904297, "global_step": 208558, "epoch": 2512} {"train_loss": -24.446317672729492, "global_step": 208559, "epoch": 2512} {"train_loss": -24.525766372680664, "global_step": 208560, "epoch": 2512} {"train_loss": -24.035261154174805, "global_step": 208561, "epoch": 2512} {"train_loss": -24.391218185424805, "global_step": 208562, "epoch": 2512} {"train_loss": -24.10245704650879, "global_step": 208563, "epoch": 2512} {"train_loss": -24.39478302001953, "global_step": 208564, "epoch": 2512} {"train_loss": -24.301427841186523, "global_step": 208565, "epoch": 2512} {"train_loss": -24.432851791381836, "global_step": 208566, "epoch": 2512} {"train_loss": -24.36126136779785, "global_step": 208567, "epoch": 2512} {"train_loss": -24.64461326599121, "global_step": 208568, "epoch": 2512} {"train_loss": -24.48443603515625, "global_step": 208569, "epoch": 2512} {"train_loss": -24.40928077697754, "global_step": 208570, "epoch": 2512} {"train_loss": -24.5849552154541, "global_step": 208571, "epoch": 2512} {"train_loss": -24.2443904876709, "global_step": 208572, "epoch": 2512} {"train_loss": -24.53687858581543, "global_step": 208573, "epoch": 2512} {"train_loss": -24.884014129638672, "global_step": 208574, "epoch": 2512} {"train_loss": -24.421171188354492, "global_step": 208575, "epoch": 2512} {"train_loss": -24.63221549987793, "global_step": 208576, "epoch": 2512} {"train_loss": -24.178525924682617, "global_step": 208577, "epoch": 2512} {"train_loss": -24.31444721911327, "global_step": 208578, "epoch": 2512, "val_loss": 6676649.0} {"train_loss": -24.318544387817383, "global_step": 208579, "epoch": 2513} {"train_loss": -24.315519332885742, "global_step": 208580, "epoch": 2513} {"train_loss": -24.1971378326416, "global_step": 208581, "epoch": 2513} {"train_loss": -24.817392349243164, "global_step": 208582, "epoch": 2513} {"train_loss": -24.226465225219727, "global_step": 208583, "epoch": 2513} {"train_loss": -24.602542877197266, "global_step": 208584, "epoch": 2513} {"train_loss": -24.319074630737305, "global_step": 208585, "epoch": 2513} {"train_loss": -24.311864852905273, "global_step": 208586, "epoch": 2513} {"train_loss": -24.326566696166992, "global_step": 208587, "epoch": 2513} {"train_loss": -24.42252540588379, "global_step": 208588, "epoch": 2513} {"train_loss": -24.335922241210938, "global_step": 208589, "epoch": 2513} {"train_loss": -24.449121475219727, "global_step": 208590, "epoch": 2513} {"train_loss": -24.19524574279785, "global_step": 208591, "epoch": 2513} {"train_loss": -25.00485610961914, "global_step": 208592, "epoch": 2513} {"train_loss": -25.001798629760742, "global_step": 208593, "epoch": 2513} {"train_loss": -24.498332977294922, "global_step": 208594, "epoch": 2513} {"train_loss": -24.860794067382812, "global_step": 208595, "epoch": 2513} {"train_loss": -24.144277572631836, "global_step": 208596, "epoch": 2513} {"train_loss": -24.142929077148438, "global_step": 208597, "epoch": 2513} {"train_loss": -24.08905601501465, "global_step": 208598, "epoch": 2513} {"train_loss": -24.42316246032715, "global_step": 208599, "epoch": 2513} {"train_loss": -24.32861328125, "global_step": 208600, "epoch": 2513} {"train_loss": -24.57893180847168, "global_step": 208601, "epoch": 2513} {"train_loss": -24.110044479370117, "global_step": 208602, "epoch": 2513} {"train_loss": -24.66937828063965, "global_step": 208603, "epoch": 2513} {"train_loss": -24.647724151611328, "global_step": 208604, "epoch": 2513} {"train_loss": -23.601184844970703, "global_step": 208605, "epoch": 2513} {"train_loss": -24.414236068725586, "global_step": 208606, "epoch": 2513} {"train_loss": -24.1564884185791, "global_step": 208607, "epoch": 2513} {"train_loss": -24.120168685913086, "global_step": 208608, "epoch": 2513} {"train_loss": -24.06073760986328, "global_step": 208609, "epoch": 2513} {"train_loss": -23.918197631835938, "global_step": 208610, "epoch": 2513} {"train_loss": -24.28570556640625, "global_step": 208611, "epoch": 2513} {"train_loss": -24.539295196533203, "global_step": 208612, "epoch": 2513} {"train_loss": -24.345693588256836, "global_step": 208613, "epoch": 2513} {"train_loss": -23.800573348999023, "global_step": 208614, "epoch": 2513} {"train_loss": -24.516775131225586, "global_step": 208615, "epoch": 2513} {"train_loss": -24.088272094726562, "global_step": 208616, "epoch": 2513} {"train_loss": -24.627002716064453, "global_step": 208617, "epoch": 2513} {"train_loss": -24.53885841369629, "global_step": 208618, "epoch": 2513} {"train_loss": -24.55672264099121, "global_step": 208619, "epoch": 2513} {"train_loss": -24.5095157623291, "global_step": 208620, "epoch": 2513} {"train_loss": -24.264984130859375, "global_step": 208621, "epoch": 2513} {"train_loss": -24.2994384765625, "global_step": 208622, "epoch": 2513} {"train_loss": -24.259435653686523, "global_step": 208623, "epoch": 2513} {"train_loss": -24.55967140197754, "global_step": 208624, "epoch": 2513} {"train_loss": -24.239267349243164, "global_step": 208625, "epoch": 2513} {"train_loss": -24.57680320739746, "global_step": 208626, "epoch": 2513} {"train_loss": -24.684934616088867, "global_step": 208627, "epoch": 2513} {"train_loss": -24.174169540405273, "global_step": 208628, "epoch": 2513} {"train_loss": -24.627723693847656, "global_step": 208629, "epoch": 2513} {"train_loss": -24.612916946411133, "global_step": 208630, "epoch": 2513} {"train_loss": -24.427757263183594, "global_step": 208631, "epoch": 2513} {"train_loss": -24.4211368560791, "global_step": 208632, "epoch": 2513} {"train_loss": -24.847501754760742, "global_step": 208633, "epoch": 2513} {"train_loss": -24.213485717773438, "global_step": 208634, "epoch": 2513} {"train_loss": -24.584033966064453, "global_step": 208635, "epoch": 2513} {"train_loss": -24.50410270690918, "global_step": 208636, "epoch": 2513} {"train_loss": -24.611061096191406, "global_step": 208637, "epoch": 2513} {"train_loss": -24.72788429260254, "global_step": 208638, "epoch": 2513} {"train_loss": -24.302209854125977, "global_step": 208639, "epoch": 2513} {"train_loss": -24.9061336517334, "global_step": 208640, "epoch": 2513} {"train_loss": -24.454740524291992, "global_step": 208641, "epoch": 2513} {"train_loss": -24.325241088867188, "global_step": 208642, "epoch": 2513} {"train_loss": -24.772424697875977, "global_step": 208643, "epoch": 2513} {"train_loss": -24.40241813659668, "global_step": 208644, "epoch": 2513} {"train_loss": -24.202302932739258, "global_step": 208645, "epoch": 2513} {"train_loss": -23.490022659301758, "global_step": 208646, "epoch": 2513} {"train_loss": -23.225494384765625, "global_step": 208647, "epoch": 2513} {"train_loss": -23.718515396118164, "global_step": 208648, "epoch": 2513} {"train_loss": -24.092004776000977, "global_step": 208649, "epoch": 2513} {"train_loss": -24.076858520507812, "global_step": 208650, "epoch": 2513} {"train_loss": -24.15589141845703, "global_step": 208651, "epoch": 2513} {"train_loss": -24.224672317504883, "global_step": 208652, "epoch": 2513} {"train_loss": -23.996061325073242, "global_step": 208653, "epoch": 2513} {"train_loss": -24.24315071105957, "global_step": 208654, "epoch": 2513} {"train_loss": -24.33344841003418, "global_step": 208655, "epoch": 2513} {"train_loss": -24.373233795166016, "global_step": 208656, "epoch": 2513} {"train_loss": -24.688840866088867, "global_step": 208657, "epoch": 2513} {"train_loss": -24.103178024291992, "global_step": 208658, "epoch": 2513} {"train_loss": -24.09575843811035, "global_step": 208659, "epoch": 2513} {"train_loss": -24.014089584350586, "global_step": 208660, "epoch": 2513} {"train_loss": -24.352246181074396, "global_step": 208661, "epoch": 2513, "val_loss": 6650227.5} {"train_loss": -23.365488052368164, "global_step": 208662, "epoch": 2514} {"train_loss": -24.592044830322266, "global_step": 208663, "epoch": 2514} {"train_loss": -23.988746643066406, "global_step": 208664, "epoch": 2514} {"train_loss": -24.313274383544922, "global_step": 208665, "epoch": 2514} {"train_loss": -24.173696517944336, "global_step": 208666, "epoch": 2514} {"train_loss": -23.895973205566406, "global_step": 208667, "epoch": 2514} {"train_loss": -24.31661033630371, "global_step": 208668, "epoch": 2514} {"train_loss": -23.72938346862793, "global_step": 208669, "epoch": 2514} {"train_loss": -24.09907341003418, "global_step": 208670, "epoch": 2514} {"train_loss": -24.639272689819336, "global_step": 208671, "epoch": 2514} {"train_loss": -24.241323471069336, "global_step": 208672, "epoch": 2514} {"train_loss": -24.407028198242188, "global_step": 208673, "epoch": 2514} {"train_loss": -23.927392959594727, "global_step": 208674, "epoch": 2514} {"train_loss": -24.505369186401367, "global_step": 208675, "epoch": 2514} {"train_loss": -23.871578216552734, "global_step": 208676, "epoch": 2514} {"train_loss": -24.151601791381836, "global_step": 208677, "epoch": 2514} {"train_loss": -24.719804763793945, "global_step": 208678, "epoch": 2514} {"train_loss": -24.06945037841797, "global_step": 208679, "epoch": 2514} {"train_loss": -24.545352935791016, "global_step": 208680, "epoch": 2514} {"train_loss": -24.13447380065918, "global_step": 208681, "epoch": 2514} {"train_loss": -24.435070037841797, "global_step": 208682, "epoch": 2514} {"train_loss": -24.286396026611328, "global_step": 208683, "epoch": 2514} {"train_loss": -24.49928092956543, "global_step": 208684, "epoch": 2514} {"train_loss": -24.2208194732666, "global_step": 208685, "epoch": 2514} {"train_loss": -24.53167724609375, "global_step": 208686, "epoch": 2514} {"train_loss": -24.281234741210938, "global_step": 208687, "epoch": 2514} {"train_loss": -24.28350830078125, "global_step": 208688, "epoch": 2514} {"train_loss": -24.366819381713867, "global_step": 208689, "epoch": 2514} {"train_loss": -24.355276107788086, "global_step": 208690, "epoch": 2514} {"train_loss": -23.887845993041992, "global_step": 208691, "epoch": 2514} {"train_loss": -24.44879722595215, "global_step": 208692, "epoch": 2514} {"train_loss": -24.268157958984375, "global_step": 208693, "epoch": 2514} {"train_loss": -24.25836753845215, "global_step": 208694, "epoch": 2514} {"train_loss": -24.682748794555664, "global_step": 208695, "epoch": 2514} {"train_loss": -24.45722198486328, "global_step": 208696, "epoch": 2514} {"train_loss": -24.64360809326172, "global_step": 208697, "epoch": 2514} {"train_loss": -24.593509674072266, "global_step": 208698, "epoch": 2514} {"train_loss": -24.613611221313477, "global_step": 208699, "epoch": 2514} {"train_loss": -24.762338638305664, "global_step": 208700, "epoch": 2514} {"train_loss": -24.284265518188477, "global_step": 208701, "epoch": 2514} {"train_loss": -24.355112075805664, "global_step": 208702, "epoch": 2514} {"train_loss": -24.55220603942871, "global_step": 208703, "epoch": 2514} {"train_loss": -24.557828903198242, "global_step": 208704, "epoch": 2514} {"train_loss": -24.490835189819336, "global_step": 208705, "epoch": 2514} {"train_loss": -24.70210838317871, "global_step": 208706, "epoch": 2514} {"train_loss": -24.45418357849121, "global_step": 208707, "epoch": 2514} {"train_loss": -24.437850952148438, "global_step": 208708, "epoch": 2514} {"train_loss": -24.120975494384766, "global_step": 208709, "epoch": 2514} {"train_loss": -24.533658981323242, "global_step": 208710, "epoch": 2514} {"train_loss": -24.464153289794922, "global_step": 208711, "epoch": 2514} {"train_loss": -24.373188018798828, "global_step": 208712, "epoch": 2514} {"train_loss": -23.95008659362793, "global_step": 208713, "epoch": 2514} {"train_loss": -24.43855857849121, "global_step": 208714, "epoch": 2514} {"train_loss": -24.580148696899414, "global_step": 208715, "epoch": 2514} {"train_loss": -24.6605224609375, "global_step": 208716, "epoch": 2514} {"train_loss": -24.694059371948242, "global_step": 208717, "epoch": 2514} {"train_loss": -24.44463539123535, "global_step": 208718, "epoch": 2514} {"train_loss": -24.27560806274414, "global_step": 208719, "epoch": 2514} {"train_loss": -24.23044204711914, "global_step": 208720, "epoch": 2514} {"train_loss": -24.594329833984375, "global_step": 208721, "epoch": 2514} {"train_loss": -24.549636840820312, "global_step": 208722, "epoch": 2514} {"train_loss": -24.181711196899414, "global_step": 208723, "epoch": 2514} {"train_loss": -24.130155563354492, "global_step": 208724, "epoch": 2514} {"train_loss": -24.363554000854492, "global_step": 208725, "epoch": 2514} {"train_loss": -24.460479736328125, "global_step": 208726, "epoch": 2514} {"train_loss": -24.698192596435547, "global_step": 208727, "epoch": 2514} {"train_loss": -24.59905433654785, "global_step": 208728, "epoch": 2514} {"train_loss": -24.549898147583008, "global_step": 208729, "epoch": 2514} {"train_loss": -24.413604736328125, "global_step": 208730, "epoch": 2514} {"train_loss": -24.543521881103516, "global_step": 208731, "epoch": 2514} {"train_loss": -24.781505584716797, "global_step": 208732, "epoch": 2514} {"train_loss": -24.413238525390625, "global_step": 208733, "epoch": 2514} {"train_loss": -24.350828170776367, "global_step": 208734, "epoch": 2514} {"train_loss": -24.680784225463867, "global_step": 208735, "epoch": 2514} {"train_loss": -24.678186416625977, "global_step": 208736, "epoch": 2514} {"train_loss": -24.58534812927246, "global_step": 208737, "epoch": 2514} {"train_loss": -24.562538146972656, "global_step": 208738, "epoch": 2514} {"train_loss": -24.456268310546875, "global_step": 208739, "epoch": 2514} {"train_loss": -24.27029800415039, "global_step": 208740, "epoch": 2514} {"train_loss": -24.625158309936523, "global_step": 208741, "epoch": 2514} {"train_loss": -24.52088165283203, "global_step": 208742, "epoch": 2514} {"train_loss": -24.340106964111328, "global_step": 208743, "epoch": 2514} {"train_loss": -24.381976437855915, "global_step": 208744, "epoch": 2514, "val_loss": 6707447.0} {"train_loss": -24.646026611328125, "global_step": 208745, "epoch": 2515} {"train_loss": -24.35744857788086, "global_step": 208746, "epoch": 2515} {"train_loss": -23.816390991210938, "global_step": 208747, "epoch": 2515} {"train_loss": -24.38374137878418, "global_step": 208748, "epoch": 2515} {"train_loss": -24.495656967163086, "global_step": 208749, "epoch": 2515} {"train_loss": -24.105112075805664, "global_step": 208750, "epoch": 2515} {"train_loss": -24.26943016052246, "global_step": 208751, "epoch": 2515} {"train_loss": -23.7988338470459, "global_step": 208752, "epoch": 2515} {"train_loss": -24.578405380249023, "global_step": 208753, "epoch": 2515} {"train_loss": -24.138294219970703, "global_step": 208754, "epoch": 2515} {"train_loss": -24.17085075378418, "global_step": 208755, "epoch": 2515} {"train_loss": -24.00614356994629, "global_step": 208756, "epoch": 2515} {"train_loss": -23.890134811401367, "global_step": 208757, "epoch": 2515} {"train_loss": -23.936498641967773, "global_step": 208758, "epoch": 2515} {"train_loss": -24.139005661010742, "global_step": 208759, "epoch": 2515} {"train_loss": -24.598264694213867, "global_step": 208760, "epoch": 2515} {"train_loss": -24.23470115661621, "global_step": 208761, "epoch": 2515} {"train_loss": -24.439926147460938, "global_step": 208762, "epoch": 2515} {"train_loss": -24.106626510620117, "global_step": 208763, "epoch": 2515} {"train_loss": -24.3500919342041, "global_step": 208764, "epoch": 2515} {"train_loss": -24.171646118164062, "global_step": 208765, "epoch": 2515} {"train_loss": -24.408180236816406, "global_step": 208766, "epoch": 2515} {"train_loss": -24.163389205932617, "global_step": 208767, "epoch": 2515} {"train_loss": -24.26279640197754, "global_step": 208768, "epoch": 2515} {"train_loss": -24.06375503540039, "global_step": 208769, "epoch": 2515} {"train_loss": -23.860319137573242, "global_step": 208770, "epoch": 2515} {"train_loss": -24.560514450073242, "global_step": 208771, "epoch": 2515} {"train_loss": -24.34514808654785, "global_step": 208772, "epoch": 2515} {"train_loss": -24.33270835876465, "global_step": 208773, "epoch": 2515} {"train_loss": -24.272907257080078, "global_step": 208774, "epoch": 2515} {"train_loss": -24.520017623901367, "global_step": 208775, "epoch": 2515} {"train_loss": -24.500747680664062, "global_step": 208776, "epoch": 2515} {"train_loss": -24.160396575927734, "global_step": 208777, "epoch": 2515} {"train_loss": -23.987518310546875, "global_step": 208778, "epoch": 2515} {"train_loss": -24.332996368408203, "global_step": 208779, "epoch": 2515} {"train_loss": -24.31891632080078, "global_step": 208780, "epoch": 2515} {"train_loss": -24.301267623901367, "global_step": 208781, "epoch": 2515} {"train_loss": -24.18165397644043, "global_step": 208782, "epoch": 2515} {"train_loss": -24.140573501586914, "global_step": 208783, "epoch": 2515} {"train_loss": -24.174945831298828, "global_step": 208784, "epoch": 2515} {"train_loss": -24.414011001586914, "global_step": 208785, "epoch": 2515} {"train_loss": -24.231555938720703, "global_step": 208786, "epoch": 2515} {"train_loss": -24.160104751586914, "global_step": 208787, "epoch": 2515} {"train_loss": -24.520797729492188, "global_step": 208788, "epoch": 2515} {"train_loss": -24.21879005432129, "global_step": 208789, "epoch": 2515} {"train_loss": -24.426530838012695, "global_step": 208790, "epoch": 2515} {"train_loss": -24.29137420654297, "global_step": 208791, "epoch": 2515} {"train_loss": -24.1810245513916, "global_step": 208792, "epoch": 2515} {"train_loss": -24.639617919921875, "global_step": 208793, "epoch": 2515} {"train_loss": -24.11343765258789, "global_step": 208794, "epoch": 2515} {"train_loss": -24.732559204101562, "global_step": 208795, "epoch": 2515} {"train_loss": -24.702375411987305, "global_step": 208796, "epoch": 2515} {"train_loss": -24.310068130493164, "global_step": 208797, "epoch": 2515} {"train_loss": -24.733606338500977, "global_step": 208798, "epoch": 2515} {"train_loss": -24.67302894592285, "global_step": 208799, "epoch": 2515} {"train_loss": -24.618183135986328, "global_step": 208800, "epoch": 2515} {"train_loss": -24.79273223876953, "global_step": 208801, "epoch": 2515} {"train_loss": -24.549802780151367, "global_step": 208802, "epoch": 2515} {"train_loss": -24.466201782226562, "global_step": 208803, "epoch": 2515} {"train_loss": -24.676910400390625, "global_step": 208804, "epoch": 2515} {"train_loss": -24.380859375, "global_step": 208805, "epoch": 2515} {"train_loss": -24.367666244506836, "global_step": 208806, "epoch": 2515} {"train_loss": -24.635223388671875, "global_step": 208807, "epoch": 2515} {"train_loss": -24.59429359436035, "global_step": 208808, "epoch": 2515} {"train_loss": -24.46113395690918, "global_step": 208809, "epoch": 2515} {"train_loss": -24.192358016967773, "global_step": 208810, "epoch": 2515} {"train_loss": -24.73968505859375, "global_step": 208811, "epoch": 2515} {"train_loss": -24.106468200683594, "global_step": 208812, "epoch": 2515} {"train_loss": -24.667850494384766, "global_step": 208813, "epoch": 2515} {"train_loss": -24.937665939331055, "global_step": 208814, "epoch": 2515} {"train_loss": -24.423770904541016, "global_step": 208815, "epoch": 2515} {"train_loss": -24.34480857849121, "global_step": 208816, "epoch": 2515} {"train_loss": -24.331830978393555, "global_step": 208817, "epoch": 2515} {"train_loss": -24.87312889099121, "global_step": 208818, "epoch": 2515} {"train_loss": -24.08332633972168, "global_step": 208819, "epoch": 2515} {"train_loss": -24.221094131469727, "global_step": 208820, "epoch": 2515} {"train_loss": -24.34297752380371, "global_step": 208821, "epoch": 2515} {"train_loss": -24.41391944885254, "global_step": 208822, "epoch": 2515} {"train_loss": -24.344106674194336, "global_step": 208823, "epoch": 2515} {"train_loss": -24.327877044677734, "global_step": 208824, "epoch": 2515} {"train_loss": -24.568235397338867, "global_step": 208825, "epoch": 2515} {"train_loss": -24.142236709594727, "global_step": 208826, "epoch": 2515} {"train_loss": -24.350979517741376, "global_step": 208827, "epoch": 2515, "val_loss": 6570224.5} {"train_loss": -24.519498825073242, "global_step": 208828, "epoch": 2516} {"train_loss": -24.463584899902344, "global_step": 208829, "epoch": 2516} {"train_loss": -24.012792587280273, "global_step": 208830, "epoch": 2516} {"train_loss": -23.875112533569336, "global_step": 208831, "epoch": 2516} {"train_loss": -24.082311630249023, "global_step": 208832, "epoch": 2516} {"train_loss": -24.35108757019043, "global_step": 208833, "epoch": 2516} {"train_loss": -23.548742294311523, "global_step": 208834, "epoch": 2516} {"train_loss": -24.621496200561523, "global_step": 208835, "epoch": 2516} {"train_loss": -24.747642517089844, "global_step": 208836, "epoch": 2516} {"train_loss": -24.37535858154297, "global_step": 208837, "epoch": 2516} {"train_loss": -23.951904296875, "global_step": 208838, "epoch": 2516} {"train_loss": -24.520553588867188, "global_step": 208839, "epoch": 2516} {"train_loss": -24.154111862182617, "global_step": 208840, "epoch": 2516} {"train_loss": -24.157567977905273, "global_step": 208841, "epoch": 2516} {"train_loss": -24.52117919921875, "global_step": 208842, "epoch": 2516} {"train_loss": -24.3953800201416, "global_step": 208843, "epoch": 2516} {"train_loss": -24.501617431640625, "global_step": 208844, "epoch": 2516} {"train_loss": -24.243255615234375, "global_step": 208845, "epoch": 2516} {"train_loss": -24.242828369140625, "global_step": 208846, "epoch": 2516} {"train_loss": -24.46761131286621, "global_step": 208847, "epoch": 2516} {"train_loss": -24.052026748657227, "global_step": 208848, "epoch": 2516} {"train_loss": -24.068632125854492, "global_step": 208849, "epoch": 2516} {"train_loss": -24.587650299072266, "global_step": 208850, "epoch": 2516} {"train_loss": -24.658222198486328, "global_step": 208851, "epoch": 2516} {"train_loss": -24.305959701538086, "global_step": 208852, "epoch": 2516} {"train_loss": -24.65346336364746, "global_step": 208853, "epoch": 2516} {"train_loss": -24.311187744140625, "global_step": 208854, "epoch": 2516} {"train_loss": -24.512718200683594, "global_step": 208855, "epoch": 2516} {"train_loss": -24.082265853881836, "global_step": 208856, "epoch": 2516} {"train_loss": -24.267133712768555, "global_step": 208857, "epoch": 2516} {"train_loss": -24.361051559448242, "global_step": 208858, "epoch": 2516} {"train_loss": -24.4183292388916, "global_step": 208859, "epoch": 2516} {"train_loss": -24.39861297607422, "global_step": 208860, "epoch": 2516} {"train_loss": -24.573850631713867, "global_step": 208861, "epoch": 2516} {"train_loss": -24.481359481811523, "global_step": 208862, "epoch": 2516} {"train_loss": -24.520666122436523, "global_step": 208863, "epoch": 2516} {"train_loss": -24.744165420532227, "global_step": 208864, "epoch": 2516} {"train_loss": -24.495193481445312, "global_step": 208865, "epoch": 2516} {"train_loss": -24.578832626342773, "global_step": 208866, "epoch": 2516} {"train_loss": -24.81458282470703, "global_step": 208867, "epoch": 2516} {"train_loss": -24.617921829223633, "global_step": 208868, "epoch": 2516} {"train_loss": -24.473899841308594, "global_step": 208869, "epoch": 2516} {"train_loss": -24.60331916809082, "global_step": 208870, "epoch": 2516} {"train_loss": -24.347990036010742, "global_step": 208871, "epoch": 2516} {"train_loss": -24.601831436157227, "global_step": 208872, "epoch": 2516} {"train_loss": -24.6475887298584, "global_step": 208873, "epoch": 2516} {"train_loss": -24.23697853088379, "global_step": 208874, "epoch": 2516} {"train_loss": -24.824005126953125, "global_step": 208875, "epoch": 2516} {"train_loss": -24.36107635498047, "global_step": 208876, "epoch": 2516} {"train_loss": -24.14009666442871, "global_step": 208877, "epoch": 2516} {"train_loss": -24.05665397644043, "global_step": 208878, "epoch": 2516} {"train_loss": -24.112524032592773, "global_step": 208879, "epoch": 2516} {"train_loss": -24.319595336914062, "global_step": 208880, "epoch": 2516} {"train_loss": -24.38838768005371, "global_step": 208881, "epoch": 2516} {"train_loss": -24.383127212524414, "global_step": 208882, "epoch": 2516} {"train_loss": -24.073938369750977, "global_step": 208883, "epoch": 2516} {"train_loss": -24.4165096282959, "global_step": 208884, "epoch": 2516} {"train_loss": -24.324127197265625, "global_step": 208885, "epoch": 2516} {"train_loss": -24.297500610351562, "global_step": 208886, "epoch": 2516} {"train_loss": -24.28468132019043, "global_step": 208887, "epoch": 2516} {"train_loss": -24.11191749572754, "global_step": 208888, "epoch": 2516} {"train_loss": -24.1283016204834, "global_step": 208889, "epoch": 2516} {"train_loss": -24.645278930664062, "global_step": 208890, "epoch": 2516} {"train_loss": -24.164764404296875, "global_step": 208891, "epoch": 2516} {"train_loss": -24.60956382751465, "global_step": 208892, "epoch": 2516} {"train_loss": -24.6513729095459, "global_step": 208893, "epoch": 2516} {"train_loss": -24.49772071838379, "global_step": 208894, "epoch": 2516} {"train_loss": -24.5228271484375, "global_step": 208895, "epoch": 2516} {"train_loss": -24.85422134399414, "global_step": 208896, "epoch": 2516} {"train_loss": -24.869054794311523, "global_step": 208897, "epoch": 2516} {"train_loss": -24.597265243530273, "global_step": 208898, "epoch": 2516} {"train_loss": -24.349210739135742, "global_step": 208899, "epoch": 2516} {"train_loss": -24.533170700073242, "global_step": 208900, "epoch": 2516} {"train_loss": -24.4586238861084, "global_step": 208901, "epoch": 2516} {"train_loss": -24.590940475463867, "global_step": 208902, "epoch": 2516} {"train_loss": -24.326330184936523, "global_step": 208903, "epoch": 2516} {"train_loss": -24.5101318359375, "global_step": 208904, "epoch": 2516} {"train_loss": -24.250608444213867, "global_step": 208905, "epoch": 2516} {"train_loss": -24.478612899780273, "global_step": 208906, "epoch": 2516} {"train_loss": -24.34834098815918, "global_step": 208907, "epoch": 2516} {"train_loss": -24.33295440673828, "global_step": 208908, "epoch": 2516} {"train_loss": -24.62697982788086, "global_step": 208909, "epoch": 2516} {"train_loss": -24.39062254112887, "global_step": 208910, "epoch": 2516, "val_loss": 6563557.0} {"train_loss": -23.689443588256836, "global_step": 208911, "epoch": 2517} {"train_loss": -23.165376663208008, "global_step": 208912, "epoch": 2517} {"train_loss": -23.437259674072266, "global_step": 208913, "epoch": 2517} {"train_loss": -23.591352462768555, "global_step": 208914, "epoch": 2517} {"train_loss": -23.76506996154785, "global_step": 208915, "epoch": 2517} {"train_loss": -23.722169876098633, "global_step": 208916, "epoch": 2517} {"train_loss": -24.577651977539062, "global_step": 208917, "epoch": 2517} {"train_loss": -23.497915267944336, "global_step": 208918, "epoch": 2517} {"train_loss": -23.838552474975586, "global_step": 208919, "epoch": 2517} {"train_loss": -23.77086067199707, "global_step": 208920, "epoch": 2517} {"train_loss": -23.584320068359375, "global_step": 208921, "epoch": 2517} {"train_loss": -24.0010986328125, "global_step": 208922, "epoch": 2517} {"train_loss": -24.363540649414062, "global_step": 208923, "epoch": 2517} {"train_loss": -23.827117919921875, "global_step": 208924, "epoch": 2517} {"train_loss": -24.07869529724121, "global_step": 208925, "epoch": 2517} {"train_loss": -23.857669830322266, "global_step": 208926, "epoch": 2517} {"train_loss": -23.547704696655273, "global_step": 208927, "epoch": 2517} {"train_loss": -23.912771224975586, "global_step": 208928, "epoch": 2517} {"train_loss": -24.190567016601562, "global_step": 208929, "epoch": 2517} {"train_loss": -24.2440242767334, "global_step": 208930, "epoch": 2517} {"train_loss": -23.836166381835938, "global_step": 208931, "epoch": 2517} {"train_loss": -24.513097763061523, "global_step": 208932, "epoch": 2517} {"train_loss": -24.020578384399414, "global_step": 208933, "epoch": 2517} {"train_loss": -24.410165786743164, "global_step": 208934, "epoch": 2517} {"train_loss": -24.42598533630371, "global_step": 208935, "epoch": 2517} {"train_loss": -24.031259536743164, "global_step": 208936, "epoch": 2517} {"train_loss": -24.3659725189209, "global_step": 208937, "epoch": 2517} {"train_loss": -24.439701080322266, "global_step": 208938, "epoch": 2517} {"train_loss": -24.35616683959961, "global_step": 208939, "epoch": 2517} {"train_loss": -24.18377113342285, "global_step": 208940, "epoch": 2517} {"train_loss": -24.46361541748047, "global_step": 208941, "epoch": 2517} {"train_loss": -24.944860458374023, "global_step": 208942, "epoch": 2517} {"train_loss": -24.36576271057129, "global_step": 208943, "epoch": 2517} {"train_loss": -24.428050994873047, "global_step": 208944, "epoch": 2517} {"train_loss": -24.32985496520996, "global_step": 208945, "epoch": 2517} {"train_loss": -24.282148361206055, "global_step": 208946, "epoch": 2517} {"train_loss": -24.473224639892578, "global_step": 208947, "epoch": 2517} {"train_loss": -24.68177604675293, "global_step": 208948, "epoch": 2517} {"train_loss": -24.620532989501953, "global_step": 208949, "epoch": 2517} {"train_loss": -24.52689552307129, "global_step": 208950, "epoch": 2517} {"train_loss": -24.68635368347168, "global_step": 208951, "epoch": 2517} {"train_loss": -24.298871994018555, "global_step": 208952, "epoch": 2517} {"train_loss": -24.491846084594727, "global_step": 208953, "epoch": 2517} {"train_loss": -24.457334518432617, "global_step": 208954, "epoch": 2517} {"train_loss": -24.302234649658203, "global_step": 208955, "epoch": 2517} {"train_loss": -24.42718505859375, "global_step": 208956, "epoch": 2517} {"train_loss": -24.4736385345459, "global_step": 208957, "epoch": 2517} {"train_loss": -24.418058395385742, "global_step": 208958, "epoch": 2517} {"train_loss": -24.507904052734375, "global_step": 208959, "epoch": 2517} {"train_loss": -24.256689071655273, "global_step": 208960, "epoch": 2517} {"train_loss": -24.176654815673828, "global_step": 208961, "epoch": 2517} {"train_loss": -24.707914352416992, "global_step": 208962, "epoch": 2517} {"train_loss": -24.242326736450195, "global_step": 208963, "epoch": 2517} {"train_loss": -24.632177352905273, "global_step": 208964, "epoch": 2517} {"train_loss": -24.38270378112793, "global_step": 208965, "epoch": 2517} {"train_loss": -24.507658004760742, "global_step": 208966, "epoch": 2517} {"train_loss": -24.26776123046875, "global_step": 208967, "epoch": 2517} {"train_loss": -24.139938354492188, "global_step": 208968, "epoch": 2517} {"train_loss": -24.082399368286133, "global_step": 208969, "epoch": 2517} {"train_loss": -24.62734031677246, "global_step": 208970, "epoch": 2517} {"train_loss": -24.637170791625977, "global_step": 208971, "epoch": 2517} {"train_loss": -24.207468032836914, "global_step": 208972, "epoch": 2517} {"train_loss": -24.215179443359375, "global_step": 208973, "epoch": 2517} {"train_loss": -24.39316177368164, "global_step": 208974, "epoch": 2517} {"train_loss": -24.300378799438477, "global_step": 208975, "epoch": 2517} {"train_loss": -24.321269989013672, "global_step": 208976, "epoch": 2517} {"train_loss": -24.2277889251709, "global_step": 208977, "epoch": 2517} {"train_loss": -24.370147705078125, "global_step": 208978, "epoch": 2517} {"train_loss": -23.835384368896484, "global_step": 208979, "epoch": 2517} {"train_loss": -24.577030181884766, "global_step": 208980, "epoch": 2517} {"train_loss": -24.271453857421875, "global_step": 208981, "epoch": 2517} {"train_loss": -24.469791412353516, "global_step": 208982, "epoch": 2517} {"train_loss": -24.38364601135254, "global_step": 208983, "epoch": 2517} {"train_loss": -24.227144241333008, "global_step": 208984, "epoch": 2517} {"train_loss": -24.463788986206055, "global_step": 208985, "epoch": 2517} {"train_loss": -24.567659378051758, "global_step": 208986, "epoch": 2517} {"train_loss": -24.52939796447754, "global_step": 208987, "epoch": 2517} {"train_loss": -24.408262252807617, "global_step": 208988, "epoch": 2517} {"train_loss": -24.53205680847168, "global_step": 208989, "epoch": 2517} {"train_loss": -24.333656311035156, "global_step": 208990, "epoch": 2517} {"train_loss": -24.547042846679688, "global_step": 208991, "epoch": 2517} {"train_loss": -24.717056274414062, "global_step": 208992, "epoch": 2517} {"train_loss": -24.26273221854704, "global_step": 208993, "epoch": 2517, "val_loss": 6560145.0} {"train_loss": -24.07236099243164, "global_step": 208994, "epoch": 2518} {"train_loss": -24.13376235961914, "global_step": 208995, "epoch": 2518} {"train_loss": -24.054744720458984, "global_step": 208996, "epoch": 2518} {"train_loss": -24.022310256958008, "global_step": 208997, "epoch": 2518} {"train_loss": -23.964229583740234, "global_step": 208998, "epoch": 2518} {"train_loss": -24.16802406311035, "global_step": 208999, "epoch": 2518} {"train_loss": -23.919092178344727, "global_step": 209000, "epoch": 2518} {"train_loss": -23.98152732849121, "global_step": 209001, "epoch": 2518} {"train_loss": -23.87269401550293, "global_step": 209002, "epoch": 2518} {"train_loss": -23.97850799560547, "global_step": 209003, "epoch": 2518} {"train_loss": -23.716482162475586, "global_step": 209004, "epoch": 2518} {"train_loss": -24.544572830200195, "global_step": 209005, "epoch": 2518} {"train_loss": -24.114519119262695, "global_step": 209006, "epoch": 2518} {"train_loss": -24.695106506347656, "global_step": 209007, "epoch": 2518} {"train_loss": -24.45945167541504, "global_step": 209008, "epoch": 2518} {"train_loss": -23.846553802490234, "global_step": 209009, "epoch": 2518} {"train_loss": -24.303451538085938, "global_step": 209010, "epoch": 2518} {"train_loss": -24.449405670166016, "global_step": 209011, "epoch": 2518} {"train_loss": -24.05971336364746, "global_step": 209012, "epoch": 2518} {"train_loss": -24.2691593170166, "global_step": 209013, "epoch": 2518} {"train_loss": -24.224796295166016, "global_step": 209014, "epoch": 2518} {"train_loss": -24.39418601989746, "global_step": 209015, "epoch": 2518} {"train_loss": -24.18768882751465, "global_step": 209016, "epoch": 2518} {"train_loss": -24.542509078979492, "global_step": 209017, "epoch": 2518} {"train_loss": -24.35860824584961, "global_step": 209018, "epoch": 2518} {"train_loss": -24.235305786132812, "global_step": 209019, "epoch": 2518} {"train_loss": -24.166324615478516, "global_step": 209020, "epoch": 2518} {"train_loss": -24.409461975097656, "global_step": 209021, "epoch": 2518} {"train_loss": -24.44917106628418, "global_step": 209022, "epoch": 2518} {"train_loss": -24.54581069946289, "global_step": 209023, "epoch": 2518} {"train_loss": -24.682249069213867, "global_step": 209024, "epoch": 2518} {"train_loss": -24.53036880493164, "global_step": 209025, "epoch": 2518} {"train_loss": -24.44707679748535, "global_step": 209026, "epoch": 2518} {"train_loss": -24.632049560546875, "global_step": 209027, "epoch": 2518} {"train_loss": -24.5943660736084, "global_step": 209028, "epoch": 2518} {"train_loss": -24.223894119262695, "global_step": 209029, "epoch": 2518} {"train_loss": -24.466711044311523, "global_step": 209030, "epoch": 2518} {"train_loss": -24.062774658203125, "global_step": 209031, "epoch": 2518} {"train_loss": -24.477157592773438, "global_step": 209032, "epoch": 2518} {"train_loss": -24.26898193359375, "global_step": 209033, "epoch": 2518} {"train_loss": -24.148452758789062, "global_step": 209034, "epoch": 2518} {"train_loss": -24.36078453063965, "global_step": 209035, "epoch": 2518} {"train_loss": -24.544038772583008, "global_step": 209036, "epoch": 2518} {"train_loss": -24.10581398010254, "global_step": 209037, "epoch": 2518} {"train_loss": -24.320056915283203, "global_step": 209038, "epoch": 2518} {"train_loss": -24.012895584106445, "global_step": 209039, "epoch": 2518} {"train_loss": -23.993406295776367, "global_step": 209040, "epoch": 2518} {"train_loss": -24.471223831176758, "global_step": 209041, "epoch": 2518} {"train_loss": -24.520851135253906, "global_step": 209042, "epoch": 2518} {"train_loss": -24.450368881225586, "global_step": 209043, "epoch": 2518} {"train_loss": -24.115032196044922, "global_step": 209044, "epoch": 2518} {"train_loss": -24.734018325805664, "global_step": 209045, "epoch": 2518} {"train_loss": -24.424211502075195, "global_step": 209046, "epoch": 2518} {"train_loss": -24.383621215820312, "global_step": 209047, "epoch": 2518} {"train_loss": -24.571109771728516, "global_step": 209048, "epoch": 2518} {"train_loss": -24.64726448059082, "global_step": 209049, "epoch": 2518} {"train_loss": -24.609233856201172, "global_step": 209050, "epoch": 2518} {"train_loss": -24.579782485961914, "global_step": 209051, "epoch": 2518} {"train_loss": -24.5919189453125, "global_step": 209052, "epoch": 2518} {"train_loss": -24.200063705444336, "global_step": 209053, "epoch": 2518} {"train_loss": -24.12757110595703, "global_step": 209054, "epoch": 2518} {"train_loss": -24.65886688232422, "global_step": 209055, "epoch": 2518} {"train_loss": -24.43033218383789, "global_step": 209056, "epoch": 2518} {"train_loss": -24.68885612487793, "global_step": 209057, "epoch": 2518} {"train_loss": -24.811071395874023, "global_step": 209058, "epoch": 2518} {"train_loss": -24.746721267700195, "global_step": 209059, "epoch": 2518} {"train_loss": -24.10009765625, "global_step": 209060, "epoch": 2518} {"train_loss": -24.184545516967773, "global_step": 209061, "epoch": 2518} {"train_loss": -24.728178024291992, "global_step": 209062, "epoch": 2518} {"train_loss": -24.509702682495117, "global_step": 209063, "epoch": 2518} {"train_loss": -24.405546188354492, "global_step": 209064, "epoch": 2518} {"train_loss": -24.473865509033203, "global_step": 209065, "epoch": 2518} {"train_loss": -24.27189064025879, "global_step": 209066, "epoch": 2518} {"train_loss": -24.44350242614746, "global_step": 209067, "epoch": 2518} {"train_loss": -24.605154037475586, "global_step": 209068, "epoch": 2518} {"train_loss": -24.34342384338379, "global_step": 209069, "epoch": 2518} {"train_loss": -24.611555099487305, "global_step": 209070, "epoch": 2518} {"train_loss": -24.113954544067383, "global_step": 209071, "epoch": 2518} {"train_loss": -24.687101364135742, "global_step": 209072, "epoch": 2518} {"train_loss": -24.642688751220703, "global_step": 209073, "epoch": 2518} {"train_loss": -24.63388442993164, "global_step": 209074, "epoch": 2518} {"train_loss": -24.642847061157227, "global_step": 209075, "epoch": 2518} {"train_loss": -24.358771197767144, "global_step": 209076, "epoch": 2518, "val_loss": 6553350.0} {"train_loss": -23.994064331054688, "global_step": 209077, "epoch": 2519} {"train_loss": -23.935327529907227, "global_step": 209078, "epoch": 2519} {"train_loss": -23.75779151916504, "global_step": 209079, "epoch": 2519} {"train_loss": -23.597076416015625, "global_step": 209080, "epoch": 2519} {"train_loss": -23.660497665405273, "global_step": 209081, "epoch": 2519} {"train_loss": -24.42664909362793, "global_step": 209082, "epoch": 2519} {"train_loss": -23.81344985961914, "global_step": 209083, "epoch": 2519} {"train_loss": -24.31212615966797, "global_step": 209084, "epoch": 2519} {"train_loss": -24.08761215209961, "global_step": 209085, "epoch": 2519} {"train_loss": -24.18414306640625, "global_step": 209086, "epoch": 2519} {"train_loss": -24.327726364135742, "global_step": 209087, "epoch": 2519} {"train_loss": -23.938461303710938, "global_step": 209088, "epoch": 2519} {"train_loss": -24.02036476135254, "global_step": 209089, "epoch": 2519} {"train_loss": -24.70098304748535, "global_step": 209090, "epoch": 2519} {"train_loss": -24.39293670654297, "global_step": 209091, "epoch": 2519} {"train_loss": -23.870405197143555, "global_step": 209092, "epoch": 2519} {"train_loss": -24.17414665222168, "global_step": 209093, "epoch": 2519} {"train_loss": -23.970489501953125, "global_step": 209094, "epoch": 2519} {"train_loss": -24.277801513671875, "global_step": 209095, "epoch": 2519} {"train_loss": -24.52705192565918, "global_step": 209096, "epoch": 2519} {"train_loss": -24.093048095703125, "global_step": 209097, "epoch": 2519} {"train_loss": -24.516801834106445, "global_step": 209098, "epoch": 2519} {"train_loss": -23.98194694519043, "global_step": 209099, "epoch": 2519} {"train_loss": -24.23760414123535, "global_step": 209100, "epoch": 2519} {"train_loss": -24.097232818603516, "global_step": 209101, "epoch": 2519} {"train_loss": -24.405471801757812, "global_step": 209102, "epoch": 2519} {"train_loss": -24.446401596069336, "global_step": 209103, "epoch": 2519} {"train_loss": -24.22836685180664, "global_step": 209104, "epoch": 2519} {"train_loss": -24.44229507446289, "global_step": 209105, "epoch": 2519} {"train_loss": -24.2347354888916, "global_step": 209106, "epoch": 2519} {"train_loss": -24.428146362304688, "global_step": 209107, "epoch": 2519} {"train_loss": -24.556060791015625, "global_step": 209108, "epoch": 2519} {"train_loss": -24.051000595092773, "global_step": 209109, "epoch": 2519} {"train_loss": -24.474397659301758, "global_step": 209110, "epoch": 2519} {"train_loss": -24.613887786865234, "global_step": 209111, "epoch": 2519} {"train_loss": -24.535696029663086, "global_step": 209112, "epoch": 2519} {"train_loss": -24.388540267944336, "global_step": 209113, "epoch": 2519} {"train_loss": -24.119365692138672, "global_step": 209114, "epoch": 2519} {"train_loss": -24.173364639282227, "global_step": 209115, "epoch": 2519} {"train_loss": -24.62679672241211, "global_step": 209116, "epoch": 2519} {"train_loss": -24.270166397094727, "global_step": 209117, "epoch": 2519} {"train_loss": -24.093454360961914, "global_step": 209118, "epoch": 2519} {"train_loss": -24.282941818237305, "global_step": 209119, "epoch": 2519} {"train_loss": -24.43849754333496, "global_step": 209120, "epoch": 2519} {"train_loss": -24.395055770874023, "global_step": 209121, "epoch": 2519} {"train_loss": -24.162452697753906, "global_step": 209122, "epoch": 2519} {"train_loss": -24.77798843383789, "global_step": 209123, "epoch": 2519} {"train_loss": -24.623910903930664, "global_step": 209124, "epoch": 2519} {"train_loss": -24.58416748046875, "global_step": 209125, "epoch": 2519} {"train_loss": -24.460020065307617, "global_step": 209126, "epoch": 2519} {"train_loss": -24.544462203979492, "global_step": 209127, "epoch": 2519} {"train_loss": -24.361766815185547, "global_step": 209128, "epoch": 2519} {"train_loss": -24.36154556274414, "global_step": 209129, "epoch": 2519} {"train_loss": -24.564311981201172, "global_step": 209130, "epoch": 2519} {"train_loss": -24.60101890563965, "global_step": 209131, "epoch": 2519} {"train_loss": -24.170028686523438, "global_step": 209132, "epoch": 2519} {"train_loss": -24.4854679107666, "global_step": 209133, "epoch": 2519} {"train_loss": -24.517860412597656, "global_step": 209134, "epoch": 2519} {"train_loss": -24.419809341430664, "global_step": 209135, "epoch": 2519} {"train_loss": -24.22987174987793, "global_step": 209136, "epoch": 2519} {"train_loss": -24.4813232421875, "global_step": 209137, "epoch": 2519} {"train_loss": -24.327226638793945, "global_step": 209138, "epoch": 2519} {"train_loss": -24.04169273376465, "global_step": 209139, "epoch": 2519} {"train_loss": -24.599206924438477, "global_step": 209140, "epoch": 2519} {"train_loss": -24.46102523803711, "global_step": 209141, "epoch": 2519} {"train_loss": -24.484159469604492, "global_step": 209142, "epoch": 2519} {"train_loss": -24.728069305419922, "global_step": 209143, "epoch": 2519} {"train_loss": -24.015380859375, "global_step": 209144, "epoch": 2519} {"train_loss": -24.08213233947754, "global_step": 209145, "epoch": 2519} {"train_loss": -24.2041072845459, "global_step": 209146, "epoch": 2519} {"train_loss": -24.768239974975586, "global_step": 209147, "epoch": 2519} {"train_loss": -24.15302848815918, "global_step": 209148, "epoch": 2519} {"train_loss": -24.596410751342773, "global_step": 209149, "epoch": 2519} {"train_loss": -24.290616989135742, "global_step": 209150, "epoch": 2519} {"train_loss": -24.241926193237305, "global_step": 209151, "epoch": 2519} {"train_loss": -24.15104103088379, "global_step": 209152, "epoch": 2519} {"train_loss": -24.69014549255371, "global_step": 209153, "epoch": 2519} {"train_loss": -24.13739585876465, "global_step": 209154, "epoch": 2519} {"train_loss": -24.448549270629883, "global_step": 209155, "epoch": 2519} {"train_loss": -24.516254425048828, "global_step": 209156, "epoch": 2519} {"train_loss": -24.43459129333496, "global_step": 209157, "epoch": 2519} {"train_loss": -24.235000610351562, "global_step": 209158, "epoch": 2519} {"train_loss": -24.297413975359447, "global_step": 209159, "epoch": 2519, "val_loss": 6575074.0} {"train_loss": -24.25162124633789, "global_step": 209160, "epoch": 2520} {"train_loss": -24.03228187561035, "global_step": 209161, "epoch": 2520} {"train_loss": -24.256872177124023, "global_step": 209162, "epoch": 2520} {"train_loss": -23.7744140625, "global_step": 209163, "epoch": 2520} {"train_loss": -24.280670166015625, "global_step": 209164, "epoch": 2520} {"train_loss": -24.03900718688965, "global_step": 209165, "epoch": 2520} {"train_loss": -23.940208435058594, "global_step": 209166, "epoch": 2520} {"train_loss": -24.297605514526367, "global_step": 209167, "epoch": 2520} {"train_loss": -24.39341163635254, "global_step": 209168, "epoch": 2520} {"train_loss": -24.289230346679688, "global_step": 209169, "epoch": 2520} {"train_loss": -24.212051391601562, "global_step": 209170, "epoch": 2520} {"train_loss": -24.191368103027344, "global_step": 209171, "epoch": 2520} {"train_loss": -24.334184646606445, "global_step": 209172, "epoch": 2520} {"train_loss": -24.639591217041016, "global_step": 209173, "epoch": 2520} {"train_loss": -24.479536056518555, "global_step": 209174, "epoch": 2520} {"train_loss": -24.113574981689453, "global_step": 209175, "epoch": 2520} {"train_loss": -24.09685707092285, "global_step": 209176, "epoch": 2520} {"train_loss": -24.715835571289062, "global_step": 209177, "epoch": 2520} {"train_loss": -24.461715698242188, "global_step": 209178, "epoch": 2520} {"train_loss": -24.23526954650879, "global_step": 209179, "epoch": 2520} {"train_loss": -24.68335723876953, "global_step": 209180, "epoch": 2520} {"train_loss": -24.70124626159668, "global_step": 209181, "epoch": 2520} {"train_loss": -24.410200119018555, "global_step": 209182, "epoch": 2520} {"train_loss": -24.58805274963379, "global_step": 209183, "epoch": 2520} {"train_loss": -24.420963287353516, "global_step": 209184, "epoch": 2520} {"train_loss": -24.41977310180664, "global_step": 209185, "epoch": 2520} {"train_loss": -24.523353576660156, "global_step": 209186, "epoch": 2520} {"train_loss": -24.657968521118164, "global_step": 209187, "epoch": 2520} {"train_loss": -24.42769432067871, "global_step": 209188, "epoch": 2520} {"train_loss": -24.290668487548828, "global_step": 209189, "epoch": 2520} {"train_loss": -24.45575523376465, "global_step": 209190, "epoch": 2520} {"train_loss": -24.619382858276367, "global_step": 209191, "epoch": 2520} {"train_loss": -24.378767013549805, "global_step": 209192, "epoch": 2520} {"train_loss": -24.747812271118164, "global_step": 209193, "epoch": 2520} {"train_loss": -24.501829147338867, "global_step": 209194, "epoch": 2520} {"train_loss": -24.809799194335938, "global_step": 209195, "epoch": 2520} {"train_loss": -24.691553115844727, "global_step": 209196, "epoch": 2520} {"train_loss": -24.565675735473633, "global_step": 209197, "epoch": 2520} {"train_loss": -24.668445587158203, "global_step": 209198, "epoch": 2520} {"train_loss": -24.456045150756836, "global_step": 209199, "epoch": 2520} {"train_loss": -24.30744743347168, "global_step": 209200, "epoch": 2520} {"train_loss": -24.25452423095703, "global_step": 209201, "epoch": 2520} {"train_loss": -24.62318229675293, "global_step": 209202, "epoch": 2520} {"train_loss": -24.666898727416992, "global_step": 209203, "epoch": 2520} {"train_loss": -24.507028579711914, "global_step": 209204, "epoch": 2520} {"train_loss": -24.142683029174805, "global_step": 209205, "epoch": 2520} {"train_loss": -24.69778060913086, "global_step": 209206, "epoch": 2520} {"train_loss": -24.36612319946289, "global_step": 209207, "epoch": 2520} {"train_loss": -24.508045196533203, "global_step": 209208, "epoch": 2520} {"train_loss": -23.823808670043945, "global_step": 209209, "epoch": 2520} {"train_loss": -23.692331314086914, "global_step": 209210, "epoch": 2520} {"train_loss": -23.873241424560547, "global_step": 209211, "epoch": 2520} {"train_loss": -24.1568603515625, "global_step": 209212, "epoch": 2520} {"train_loss": -24.34899139404297, "global_step": 209213, "epoch": 2520} {"train_loss": -24.208593368530273, "global_step": 209214, "epoch": 2520} {"train_loss": -24.28299903869629, "global_step": 209215, "epoch": 2520} {"train_loss": -24.346923828125, "global_step": 209216, "epoch": 2520} {"train_loss": -24.328397750854492, "global_step": 209217, "epoch": 2520} {"train_loss": -24.15329360961914, "global_step": 209218, "epoch": 2520} {"train_loss": -24.20625114440918, "global_step": 209219, "epoch": 2520} {"train_loss": -24.30954933166504, "global_step": 209220, "epoch": 2520} {"train_loss": -24.0540828704834, "global_step": 209221, "epoch": 2520} {"train_loss": -24.05885887145996, "global_step": 209222, "epoch": 2520} {"train_loss": -24.341358184814453, "global_step": 209223, "epoch": 2520} {"train_loss": -24.475475311279297, "global_step": 209224, "epoch": 2520} {"train_loss": -24.352188110351562, "global_step": 209225, "epoch": 2520} {"train_loss": -24.158395767211914, "global_step": 209226, "epoch": 2520} {"train_loss": -24.326995849609375, "global_step": 209227, "epoch": 2520} {"train_loss": -24.226961135864258, "global_step": 209228, "epoch": 2520} {"train_loss": -24.46380615234375, "global_step": 209229, "epoch": 2520} {"train_loss": -24.386247634887695, "global_step": 209230, "epoch": 2520} {"train_loss": -24.257919311523438, "global_step": 209231, "epoch": 2520} {"train_loss": -24.32716178894043, "global_step": 209232, "epoch": 2520} {"train_loss": -24.490863800048828, "global_step": 209233, "epoch": 2520} {"train_loss": -24.41241455078125, "global_step": 209234, "epoch": 2520} {"train_loss": -24.23201560974121, "global_step": 209235, "epoch": 2520} {"train_loss": -24.678497314453125, "global_step": 209236, "epoch": 2520} {"train_loss": -24.83876609802246, "global_step": 209237, "epoch": 2520} {"train_loss": -24.830965042114258, "global_step": 209238, "epoch": 2520} {"train_loss": -24.620532989501953, "global_step": 209239, "epoch": 2520} {"train_loss": -24.413827896118164, "global_step": 209240, "epoch": 2520} {"train_loss": -23.934438705444336, "global_step": 209241, "epoch": 2520} {"train_loss": -24.348883479474537, "global_step": 209242, "epoch": 2520, "val_loss": 6640404.0} {"train_loss": -24.038034439086914, "global_step": 209243, "epoch": 2521} {"train_loss": -23.904502868652344, "global_step": 209244, "epoch": 2521} {"train_loss": -23.856243133544922, "global_step": 209245, "epoch": 2521} {"train_loss": -23.639928817749023, "global_step": 209246, "epoch": 2521} {"train_loss": -23.695871353149414, "global_step": 209247, "epoch": 2521} {"train_loss": -24.22792625427246, "global_step": 209248, "epoch": 2521} {"train_loss": -24.149585723876953, "global_step": 209249, "epoch": 2521} {"train_loss": -23.977989196777344, "global_step": 209250, "epoch": 2521} {"train_loss": -23.929325103759766, "global_step": 209251, "epoch": 2521} {"train_loss": -24.150846481323242, "global_step": 209252, "epoch": 2521} {"train_loss": -24.085113525390625, "global_step": 209253, "epoch": 2521} {"train_loss": -24.370840072631836, "global_step": 209254, "epoch": 2521} {"train_loss": -23.84598731994629, "global_step": 209255, "epoch": 2521} {"train_loss": -24.400314331054688, "global_step": 209256, "epoch": 2521} {"train_loss": -24.45572280883789, "global_step": 209257, "epoch": 2521} {"train_loss": -24.3237247467041, "global_step": 209258, "epoch": 2521} {"train_loss": -24.147260665893555, "global_step": 209259, "epoch": 2521} {"train_loss": -24.40365219116211, "global_step": 209260, "epoch": 2521} {"train_loss": -24.352441787719727, "global_step": 209261, "epoch": 2521} {"train_loss": -24.590354919433594, "global_step": 209262, "epoch": 2521} {"train_loss": -24.504629135131836, "global_step": 209263, "epoch": 2521} {"train_loss": -24.794675827026367, "global_step": 209264, "epoch": 2521} {"train_loss": -24.595319747924805, "global_step": 209265, "epoch": 2521} {"train_loss": -24.489765167236328, "global_step": 209266, "epoch": 2521} {"train_loss": -24.35813331604004, "global_step": 209267, "epoch": 2521} {"train_loss": -24.132848739624023, "global_step": 209268, "epoch": 2521} {"train_loss": -24.585187911987305, "global_step": 209269, "epoch": 2521} {"train_loss": -24.752582550048828, "global_step": 209270, "epoch": 2521} {"train_loss": -24.27482032775879, "global_step": 209271, "epoch": 2521} {"train_loss": -24.715682983398438, "global_step": 209272, "epoch": 2521} {"train_loss": -24.171354293823242, "global_step": 209273, "epoch": 2521} {"train_loss": -24.20914649963379, "global_step": 209274, "epoch": 2521} {"train_loss": -24.692312240600586, "global_step": 209275, "epoch": 2521} {"train_loss": -24.407344818115234, "global_step": 209276, "epoch": 2521} {"train_loss": -24.357297897338867, "global_step": 209277, "epoch": 2521} {"train_loss": -24.166818618774414, "global_step": 209278, "epoch": 2521} {"train_loss": -23.89228630065918, "global_step": 209279, "epoch": 2521} {"train_loss": -24.945425033569336, "global_step": 209280, "epoch": 2521} {"train_loss": -24.1263484954834, "global_step": 209281, "epoch": 2521} {"train_loss": -24.517499923706055, "global_step": 209282, "epoch": 2521} {"train_loss": -24.40903663635254, "global_step": 209283, "epoch": 2521} {"train_loss": -24.39397621154785, "global_step": 209284, "epoch": 2521} {"train_loss": -24.387418746948242, "global_step": 209285, "epoch": 2521} {"train_loss": -24.1033878326416, "global_step": 209286, "epoch": 2521} {"train_loss": -24.8245906829834, "global_step": 209287, "epoch": 2521} {"train_loss": -24.4514102935791, "global_step": 209288, "epoch": 2521} {"train_loss": -24.583494186401367, "global_step": 209289, "epoch": 2521} {"train_loss": -24.170509338378906, "global_step": 209290, "epoch": 2521} {"train_loss": -24.51853370666504, "global_step": 209291, "epoch": 2521} {"train_loss": -24.151037216186523, "global_step": 209292, "epoch": 2521} {"train_loss": -23.886289596557617, "global_step": 209293, "epoch": 2521} {"train_loss": -24.327966690063477, "global_step": 209294, "epoch": 2521} {"train_loss": -24.556331634521484, "global_step": 209295, "epoch": 2521} {"train_loss": -24.247060775756836, "global_step": 209296, "epoch": 2521} {"train_loss": -24.24045181274414, "global_step": 209297, "epoch": 2521} {"train_loss": -24.367496490478516, "global_step": 209298, "epoch": 2521} {"train_loss": -24.2810115814209, "global_step": 209299, "epoch": 2521} {"train_loss": -24.25867462158203, "global_step": 209300, "epoch": 2521} {"train_loss": -24.90691566467285, "global_step": 209301, "epoch": 2521} {"train_loss": -24.31386375427246, "global_step": 209302, "epoch": 2521} {"train_loss": -24.6878604888916, "global_step": 209303, "epoch": 2521} {"train_loss": -24.37092399597168, "global_step": 209304, "epoch": 2521} {"train_loss": -24.47205924987793, "global_step": 209305, "epoch": 2521} {"train_loss": -24.469223022460938, "global_step": 209306, "epoch": 2521} {"train_loss": -24.62333106994629, "global_step": 209307, "epoch": 2521} {"train_loss": -24.416349411010742, "global_step": 209308, "epoch": 2521} {"train_loss": -24.424072265625, "global_step": 209309, "epoch": 2521} {"train_loss": -24.534992218017578, "global_step": 209310, "epoch": 2521} {"train_loss": -24.37395668029785, "global_step": 209311, "epoch": 2521} {"train_loss": -24.488513946533203, "global_step": 209312, "epoch": 2521} {"train_loss": -24.48693084716797, "global_step": 209313, "epoch": 2521} {"train_loss": -24.71236228942871, "global_step": 209314, "epoch": 2521} {"train_loss": -24.67439842224121, "global_step": 209315, "epoch": 2521} {"train_loss": -24.1117000579834, "global_step": 209316, "epoch": 2521} {"train_loss": -24.287464141845703, "global_step": 209317, "epoch": 2521} {"train_loss": -24.42738914489746, "global_step": 209318, "epoch": 2521} {"train_loss": -24.437353134155273, "global_step": 209319, "epoch": 2521} {"train_loss": -24.69349479675293, "global_step": 209320, "epoch": 2521} {"train_loss": -24.693754196166992, "global_step": 209321, "epoch": 2521} {"train_loss": -24.417715072631836, "global_step": 209322, "epoch": 2521} {"train_loss": -24.287866592407227, "global_step": 209323, "epoch": 2521} {"train_loss": -24.491168975830078, "global_step": 209324, "epoch": 2521} {"train_loss": -24.360674662762378, "global_step": 209325, "epoch": 2521, "val_loss": 6655801.0} {"train_loss": -23.86879539489746, "global_step": 209326, "epoch": 2522} {"train_loss": -23.995519638061523, "global_step": 209327, "epoch": 2522} {"train_loss": -24.168790817260742, "global_step": 209328, "epoch": 2522} {"train_loss": -23.792266845703125, "global_step": 209329, "epoch": 2522} {"train_loss": -24.414106369018555, "global_step": 209330, "epoch": 2522} {"train_loss": -23.99985694885254, "global_step": 209331, "epoch": 2522} {"train_loss": -24.073129653930664, "global_step": 209332, "epoch": 2522} {"train_loss": -23.903562545776367, "global_step": 209333, "epoch": 2522} {"train_loss": -24.04296875, "global_step": 209334, "epoch": 2522} {"train_loss": -24.16990089416504, "global_step": 209335, "epoch": 2522} {"train_loss": -24.089250564575195, "global_step": 209336, "epoch": 2522} {"train_loss": -23.916152954101562, "global_step": 209337, "epoch": 2522} {"train_loss": -24.580913543701172, "global_step": 209338, "epoch": 2522} {"train_loss": -24.16152572631836, "global_step": 209339, "epoch": 2522} {"train_loss": -24.348915100097656, "global_step": 209340, "epoch": 2522} {"train_loss": -24.5689697265625, "global_step": 209341, "epoch": 2522} {"train_loss": -24.50429344177246, "global_step": 209342, "epoch": 2522} {"train_loss": -24.19178581237793, "global_step": 209343, "epoch": 2522} {"train_loss": -24.312759399414062, "global_step": 209344, "epoch": 2522} {"train_loss": -24.426807403564453, "global_step": 209345, "epoch": 2522} {"train_loss": -24.259138107299805, "global_step": 209346, "epoch": 2522} {"train_loss": -24.259366989135742, "global_step": 209347, "epoch": 2522} {"train_loss": -24.300765991210938, "global_step": 209348, "epoch": 2522} {"train_loss": -24.070707321166992, "global_step": 209349, "epoch": 2522} {"train_loss": -24.47635269165039, "global_step": 209350, "epoch": 2522} {"train_loss": -24.276798248291016, "global_step": 209351, "epoch": 2522} {"train_loss": -24.29660415649414, "global_step": 209352, "epoch": 2522} {"train_loss": -24.35441017150879, "global_step": 209353, "epoch": 2522} {"train_loss": -24.544950485229492, "global_step": 209354, "epoch": 2522} {"train_loss": -24.23478126525879, "global_step": 209355, "epoch": 2522} {"train_loss": -24.68770980834961, "global_step": 209356, "epoch": 2522} {"train_loss": -24.436838150024414, "global_step": 209357, "epoch": 2522} {"train_loss": -24.733205795288086, "global_step": 209358, "epoch": 2522} {"train_loss": -24.75783348083496, "global_step": 209359, "epoch": 2522} {"train_loss": -24.314971923828125, "global_step": 209360, "epoch": 2522} {"train_loss": -24.562564849853516, "global_step": 209361, "epoch": 2522} {"train_loss": -24.395633697509766, "global_step": 209362, "epoch": 2522} {"train_loss": -24.44170379638672, "global_step": 209363, "epoch": 2522} {"train_loss": -24.617103576660156, "global_step": 209364, "epoch": 2522} {"train_loss": -24.125925064086914, "global_step": 209365, "epoch": 2522} {"train_loss": -24.592626571655273, "global_step": 209366, "epoch": 2522} {"train_loss": -24.266157150268555, "global_step": 209367, "epoch": 2522} {"train_loss": -24.47998809814453, "global_step": 209368, "epoch": 2522} {"train_loss": -24.66245460510254, "global_step": 209369, "epoch": 2522} {"train_loss": -24.473743438720703, "global_step": 209370, "epoch": 2522} {"train_loss": -24.800687789916992, "global_step": 209371, "epoch": 2522} {"train_loss": -24.529081344604492, "global_step": 209372, "epoch": 2522} {"train_loss": -24.65977668762207, "global_step": 209373, "epoch": 2522} {"train_loss": -24.727201461791992, "global_step": 209374, "epoch": 2522} {"train_loss": -24.507450103759766, "global_step": 209375, "epoch": 2522} {"train_loss": -24.116561889648438, "global_step": 209376, "epoch": 2522} {"train_loss": -23.6932430267334, "global_step": 209377, "epoch": 2522} {"train_loss": -23.650182723999023, "global_step": 209378, "epoch": 2522} {"train_loss": -23.91517448425293, "global_step": 209379, "epoch": 2522} {"train_loss": -24.370222091674805, "global_step": 209380, "epoch": 2522} {"train_loss": -24.164274215698242, "global_step": 209381, "epoch": 2522} {"train_loss": -24.170333862304688, "global_step": 209382, "epoch": 2522} {"train_loss": -24.536439895629883, "global_step": 209383, "epoch": 2522} {"train_loss": -24.801042556762695, "global_step": 209384, "epoch": 2522} {"train_loss": -24.351486206054688, "global_step": 209385, "epoch": 2522} {"train_loss": -24.231552124023438, "global_step": 209386, "epoch": 2522} {"train_loss": -24.3728084564209, "global_step": 209387, "epoch": 2522} {"train_loss": -24.4589900970459, "global_step": 209388, "epoch": 2522} {"train_loss": -24.325742721557617, "global_step": 209389, "epoch": 2522} {"train_loss": -24.326705932617188, "global_step": 209390, "epoch": 2522} {"train_loss": -24.816055297851562, "global_step": 209391, "epoch": 2522} {"train_loss": -24.634538650512695, "global_step": 209392, "epoch": 2522} {"train_loss": -24.829050064086914, "global_step": 209393, "epoch": 2522} {"train_loss": -24.347387313842773, "global_step": 209394, "epoch": 2522} {"train_loss": -24.25782585144043, "global_step": 209395, "epoch": 2522} {"train_loss": -24.24144744873047, "global_step": 209396, "epoch": 2522} {"train_loss": -24.27833366394043, "global_step": 209397, "epoch": 2522} {"train_loss": -24.467870712280273, "global_step": 209398, "epoch": 2522} {"train_loss": -24.387893676757812, "global_step": 209399, "epoch": 2522} {"train_loss": -24.4124813079834, "global_step": 209400, "epoch": 2522} {"train_loss": -24.386560440063477, "global_step": 209401, "epoch": 2522} {"train_loss": -24.295698165893555, "global_step": 209402, "epoch": 2522} {"train_loss": -24.400480270385742, "global_step": 209403, "epoch": 2522} {"train_loss": -24.724639892578125, "global_step": 209404, "epoch": 2522} {"train_loss": -24.6354923248291, "global_step": 209405, "epoch": 2522} {"train_loss": -24.58510398864746, "global_step": 209406, "epoch": 2522} {"train_loss": -23.85309410095215, "global_step": 209407, "epoch": 2522} {"train_loss": -24.35138134784009, "global_step": 209408, "epoch": 2522, "val_loss": 6664543.0} {"train_loss": -24.20745849609375, "global_step": 209409, "epoch": 2523} {"train_loss": -24.0072021484375, "global_step": 209410, "epoch": 2523} {"train_loss": -24.168785095214844, "global_step": 209411, "epoch": 2523} {"train_loss": -23.781631469726562, "global_step": 209412, "epoch": 2523} {"train_loss": -24.405887603759766, "global_step": 209413, "epoch": 2523} {"train_loss": -23.54259490966797, "global_step": 209414, "epoch": 2523} {"train_loss": -24.1202449798584, "global_step": 209415, "epoch": 2523} {"train_loss": -24.254505157470703, "global_step": 209416, "epoch": 2523} {"train_loss": -23.81111717224121, "global_step": 209417, "epoch": 2523} {"train_loss": -24.075254440307617, "global_step": 209418, "epoch": 2523} {"train_loss": -24.046356201171875, "global_step": 209419, "epoch": 2523} {"train_loss": -24.12946128845215, "global_step": 209420, "epoch": 2523} {"train_loss": -24.030887603759766, "global_step": 209421, "epoch": 2523} {"train_loss": -24.14945411682129, "global_step": 209422, "epoch": 2523} {"train_loss": -24.283798217773438, "global_step": 209423, "epoch": 2523} {"train_loss": -24.221792221069336, "global_step": 209424, "epoch": 2523} {"train_loss": -24.351367950439453, "global_step": 209425, "epoch": 2523} {"train_loss": -24.36343765258789, "global_step": 209426, "epoch": 2523} {"train_loss": -24.154138565063477, "global_step": 209427, "epoch": 2523} {"train_loss": -24.581886291503906, "global_step": 209428, "epoch": 2523} {"train_loss": -24.308862686157227, "global_step": 209429, "epoch": 2523} {"train_loss": -24.535139083862305, "global_step": 209430, "epoch": 2523} {"train_loss": -24.47773551940918, "global_step": 209431, "epoch": 2523} {"train_loss": -24.345117568969727, "global_step": 209432, "epoch": 2523} {"train_loss": -24.524600982666016, "global_step": 209433, "epoch": 2523} {"train_loss": -24.04736328125, "global_step": 209434, "epoch": 2523} {"train_loss": -24.35778045654297, "global_step": 209435, "epoch": 2523} {"train_loss": -24.389062881469727, "global_step": 209436, "epoch": 2523} {"train_loss": -24.075170516967773, "global_step": 209437, "epoch": 2523} {"train_loss": -24.41990089416504, "global_step": 209438, "epoch": 2523} {"train_loss": -24.718839645385742, "global_step": 209439, "epoch": 2523} {"train_loss": -24.43343162536621, "global_step": 209440, "epoch": 2523} {"train_loss": -24.291534423828125, "global_step": 209441, "epoch": 2523} {"train_loss": -24.409814834594727, "global_step": 209442, "epoch": 2523} {"train_loss": -24.218748092651367, "global_step": 209443, "epoch": 2523} {"train_loss": -24.479969024658203, "global_step": 209444, "epoch": 2523} {"train_loss": -24.4368896484375, "global_step": 209445, "epoch": 2523} {"train_loss": -24.613554000854492, "global_step": 209446, "epoch": 2523} {"train_loss": -24.795883178710938, "global_step": 209447, "epoch": 2523} {"train_loss": -24.583341598510742, "global_step": 209448, "epoch": 2523} {"train_loss": -24.552942276000977, "global_step": 209449, "epoch": 2523} {"train_loss": -24.372602462768555, "global_step": 209450, "epoch": 2523} {"train_loss": -24.005964279174805, "global_step": 209451, "epoch": 2523} {"train_loss": -24.41802215576172, "global_step": 209452, "epoch": 2523} {"train_loss": -24.345767974853516, "global_step": 209453, "epoch": 2523} {"train_loss": -23.547574996948242, "global_step": 209454, "epoch": 2523} {"train_loss": -23.56817054748535, "global_step": 209455, "epoch": 2523} {"train_loss": -23.9931640625, "global_step": 209456, "epoch": 2523} {"train_loss": -24.006940841674805, "global_step": 209457, "epoch": 2523} {"train_loss": -24.799846649169922, "global_step": 209458, "epoch": 2523} {"train_loss": -24.22631072998047, "global_step": 209459, "epoch": 2523} {"train_loss": -23.970930099487305, "global_step": 209460, "epoch": 2523} {"train_loss": -24.36266326904297, "global_step": 209461, "epoch": 2523} {"train_loss": -24.630054473876953, "global_step": 209462, "epoch": 2523} {"train_loss": -24.3643856048584, "global_step": 209463, "epoch": 2523} {"train_loss": -24.366718292236328, "global_step": 209464, "epoch": 2523} {"train_loss": -24.540830612182617, "global_step": 209465, "epoch": 2523} {"train_loss": -24.704174041748047, "global_step": 209466, "epoch": 2523} {"train_loss": -24.39463996887207, "global_step": 209467, "epoch": 2523} {"train_loss": -24.283491134643555, "global_step": 209468, "epoch": 2523} {"train_loss": -24.540781021118164, "global_step": 209469, "epoch": 2523} {"train_loss": -24.19870948791504, "global_step": 209470, "epoch": 2523} {"train_loss": -24.3234920501709, "global_step": 209471, "epoch": 2523} {"train_loss": -24.80612564086914, "global_step": 209472, "epoch": 2523} {"train_loss": -24.322772979736328, "global_step": 209473, "epoch": 2523} {"train_loss": -24.62564468383789, "global_step": 209474, "epoch": 2523} {"train_loss": -24.70575523376465, "global_step": 209475, "epoch": 2523} {"train_loss": -24.738021850585938, "global_step": 209476, "epoch": 2523} {"train_loss": -24.436567306518555, "global_step": 209477, "epoch": 2523} {"train_loss": -24.619888305664062, "global_step": 209478, "epoch": 2523} {"train_loss": -24.806488037109375, "global_step": 209479, "epoch": 2523} {"train_loss": -24.151681900024414, "global_step": 209480, "epoch": 2523} {"train_loss": -24.73162841796875, "global_step": 209481, "epoch": 2523} {"train_loss": -24.353792190551758, "global_step": 209482, "epoch": 2523} {"train_loss": -24.63665771484375, "global_step": 209483, "epoch": 2523} {"train_loss": -24.49272346496582, "global_step": 209484, "epoch": 2523} {"train_loss": -24.710668563842773, "global_step": 209485, "epoch": 2523} {"train_loss": -24.321063995361328, "global_step": 209486, "epoch": 2523} {"train_loss": -24.534109115600586, "global_step": 209487, "epoch": 2523} {"train_loss": -24.713850021362305, "global_step": 209488, "epoch": 2523} {"train_loss": -24.300687789916992, "global_step": 209489, "epoch": 2523} {"train_loss": -24.68754768371582, "global_step": 209490, "epoch": 2523} {"train_loss": -24.352462837495, "global_step": 209491, "epoch": 2523, "val_loss": 6601402.0} {"train_loss": -23.13643455505371, "global_step": 209492, "epoch": 2524} {"train_loss": -23.260629653930664, "global_step": 209493, "epoch": 2524} {"train_loss": -24.043527603149414, "global_step": 209494, "epoch": 2524} {"train_loss": -22.968549728393555, "global_step": 209495, "epoch": 2524} {"train_loss": -23.9390811920166, "global_step": 209496, "epoch": 2524} {"train_loss": -23.306446075439453, "global_step": 209497, "epoch": 2524} {"train_loss": -23.52682876586914, "global_step": 209498, "epoch": 2524} {"train_loss": -23.100006103515625, "global_step": 209499, "epoch": 2524} {"train_loss": -23.910688400268555, "global_step": 209500, "epoch": 2524} {"train_loss": -23.836408615112305, "global_step": 209501, "epoch": 2524} {"train_loss": -23.6754093170166, "global_step": 209502, "epoch": 2524} {"train_loss": -23.47953224182129, "global_step": 209503, "epoch": 2524} {"train_loss": -23.568639755249023, "global_step": 209504, "epoch": 2524} {"train_loss": -23.288034439086914, "global_step": 209505, "epoch": 2524} {"train_loss": -23.359113693237305, "global_step": 209506, "epoch": 2524} {"train_loss": -23.6597957611084, "global_step": 209507, "epoch": 2524} {"train_loss": -23.62888526916504, "global_step": 209508, "epoch": 2524} {"train_loss": -23.4541072845459, "global_step": 209509, "epoch": 2524} {"train_loss": -23.600025177001953, "global_step": 209510, "epoch": 2524} {"train_loss": -23.61104965209961, "global_step": 209511, "epoch": 2524} {"train_loss": -24.5007266998291, "global_step": 209512, "epoch": 2524} {"train_loss": -23.82075309753418, "global_step": 209513, "epoch": 2524} {"train_loss": -24.173643112182617, "global_step": 209514, "epoch": 2524} {"train_loss": -23.766164779663086, "global_step": 209515, "epoch": 2524} {"train_loss": -24.264087677001953, "global_step": 209516, "epoch": 2524} {"train_loss": -23.803451538085938, "global_step": 209517, "epoch": 2524} {"train_loss": -24.259796142578125, "global_step": 209518, "epoch": 2524} {"train_loss": -24.069883346557617, "global_step": 209519, "epoch": 2524} {"train_loss": -24.033849716186523, "global_step": 209520, "epoch": 2524} {"train_loss": -24.086912155151367, "global_step": 209521, "epoch": 2524} {"train_loss": -24.186357498168945, "global_step": 209522, "epoch": 2524} {"train_loss": -24.42847442626953, "global_step": 209523, "epoch": 2524} {"train_loss": -24.090129852294922, "global_step": 209524, "epoch": 2524} {"train_loss": -24.263063430786133, "global_step": 209525, "epoch": 2524} {"train_loss": -24.11448860168457, "global_step": 209526, "epoch": 2524} {"train_loss": -24.372474670410156, "global_step": 209527, "epoch": 2524} {"train_loss": -24.312305450439453, "global_step": 209528, "epoch": 2524} {"train_loss": -24.244449615478516, "global_step": 209529, "epoch": 2524} {"train_loss": -24.47140884399414, "global_step": 209530, "epoch": 2524} {"train_loss": -24.35138511657715, "global_step": 209531, "epoch": 2524} {"train_loss": -24.503713607788086, "global_step": 209532, "epoch": 2524} {"train_loss": -24.151731491088867, "global_step": 209533, "epoch": 2524} {"train_loss": -24.325237274169922, "global_step": 209534, "epoch": 2524} {"train_loss": -24.36625099182129, "global_step": 209535, "epoch": 2524} {"train_loss": -24.34504508972168, "global_step": 209536, "epoch": 2524} {"train_loss": -24.29995346069336, "global_step": 209537, "epoch": 2524} {"train_loss": -24.65764808654785, "global_step": 209538, "epoch": 2524} {"train_loss": -24.595033645629883, "global_step": 209539, "epoch": 2524} {"train_loss": -24.717519760131836, "global_step": 209540, "epoch": 2524} {"train_loss": -24.51719093322754, "global_step": 209541, "epoch": 2524} {"train_loss": -24.75692367553711, "global_step": 209542, "epoch": 2524} {"train_loss": -24.678253173828125, "global_step": 209543, "epoch": 2524} {"train_loss": -24.465890884399414, "global_step": 209544, "epoch": 2524} {"train_loss": -24.810409545898438, "global_step": 209545, "epoch": 2524} {"train_loss": -24.47517967224121, "global_step": 209546, "epoch": 2524} {"train_loss": -24.679428100585938, "global_step": 209547, "epoch": 2524} {"train_loss": -24.755859375, "global_step": 209548, "epoch": 2524} {"train_loss": -24.27292823791504, "global_step": 209549, "epoch": 2524} {"train_loss": -23.856740951538086, "global_step": 209550, "epoch": 2524} {"train_loss": -24.211530685424805, "global_step": 209551, "epoch": 2524} {"train_loss": -24.296018600463867, "global_step": 209552, "epoch": 2524} {"train_loss": -24.568449020385742, "global_step": 209553, "epoch": 2524} {"train_loss": -24.08736228942871, "global_step": 209554, "epoch": 2524} {"train_loss": -24.85236167907715, "global_step": 209555, "epoch": 2524} {"train_loss": -24.468534469604492, "global_step": 209556, "epoch": 2524} {"train_loss": -24.602460861206055, "global_step": 209557, "epoch": 2524} {"train_loss": -24.330829620361328, "global_step": 209558, "epoch": 2524} {"train_loss": -24.730987548828125, "global_step": 209559, "epoch": 2524} {"train_loss": -24.018844604492188, "global_step": 209560, "epoch": 2524} {"train_loss": -24.405534744262695, "global_step": 209561, "epoch": 2524} {"train_loss": -24.50444221496582, "global_step": 209562, "epoch": 2524} {"train_loss": -24.338882446289062, "global_step": 209563, "epoch": 2524} {"train_loss": -24.310150146484375, "global_step": 209564, "epoch": 2524} {"train_loss": -24.689733505249023, "global_step": 209565, "epoch": 2524} {"train_loss": -24.40345573425293, "global_step": 209566, "epoch": 2524} {"train_loss": -24.270584106445312, "global_step": 209567, "epoch": 2524} {"train_loss": -24.3194522857666, "global_step": 209568, "epoch": 2524} {"train_loss": -24.280569076538086, "global_step": 209569, "epoch": 2524} {"train_loss": -23.93212890625, "global_step": 209570, "epoch": 2524} {"train_loss": -24.20204734802246, "global_step": 209571, "epoch": 2524} {"train_loss": -24.6353816986084, "global_step": 209572, "epoch": 2524} {"train_loss": -24.56764030456543, "global_step": 209573, "epoch": 2524} {"train_loss": -24.14438562508089, "global_step": 209574, "epoch": 2524, "val_loss": 6514480.0} {"train_loss": -23.989580154418945, "global_step": 209575, "epoch": 2525} {"train_loss": -23.788284301757812, "global_step": 209576, "epoch": 2525} {"train_loss": -23.719982147216797, "global_step": 209577, "epoch": 2525} {"train_loss": -23.940067291259766, "global_step": 209578, "epoch": 2525} {"train_loss": -23.874643325805664, "global_step": 209579, "epoch": 2525} {"train_loss": -24.21657371520996, "global_step": 209580, "epoch": 2525} {"train_loss": -23.93293571472168, "global_step": 209581, "epoch": 2525} {"train_loss": -24.2888240814209, "global_step": 209582, "epoch": 2525} {"train_loss": -24.068134307861328, "global_step": 209583, "epoch": 2525} {"train_loss": -24.296981811523438, "global_step": 209584, "epoch": 2525} {"train_loss": -24.1373233795166, "global_step": 209585, "epoch": 2525} {"train_loss": -24.196548461914062, "global_step": 209586, "epoch": 2525} {"train_loss": -24.07758140563965, "global_step": 209587, "epoch": 2525} {"train_loss": -24.316328048706055, "global_step": 209588, "epoch": 2525} {"train_loss": -24.278993606567383, "global_step": 209589, "epoch": 2525} {"train_loss": -24.558767318725586, "global_step": 209590, "epoch": 2525} {"train_loss": -24.62360954284668, "global_step": 209591, "epoch": 2525} {"train_loss": -24.36545181274414, "global_step": 209592, "epoch": 2525} {"train_loss": -24.098777770996094, "global_step": 209593, "epoch": 2525} {"train_loss": -24.579496383666992, "global_step": 209594, "epoch": 2525} {"train_loss": -24.325986862182617, "global_step": 209595, "epoch": 2525} {"train_loss": -24.57699966430664, "global_step": 209596, "epoch": 2525} {"train_loss": -24.646963119506836, "global_step": 209597, "epoch": 2525} {"train_loss": -24.5261173248291, "global_step": 209598, "epoch": 2525} {"train_loss": -24.46683120727539, "global_step": 209599, "epoch": 2525} {"train_loss": -24.027652740478516, "global_step": 209600, "epoch": 2525} {"train_loss": -23.950439453125, "global_step": 209601, "epoch": 2525} {"train_loss": -24.464004516601562, "global_step": 209602, "epoch": 2525} {"train_loss": -24.228609085083008, "global_step": 209603, "epoch": 2525} {"train_loss": -24.156911849975586, "global_step": 209604, "epoch": 2525} {"train_loss": -24.652984619140625, "global_step": 209605, "epoch": 2525} {"train_loss": -24.610660552978516, "global_step": 209606, "epoch": 2525} {"train_loss": -24.558347702026367, "global_step": 209607, "epoch": 2525} {"train_loss": -24.704893112182617, "global_step": 209608, "epoch": 2525} {"train_loss": -24.640405654907227, "global_step": 209609, "epoch": 2525} {"train_loss": -24.40182113647461, "global_step": 209610, "epoch": 2525} {"train_loss": -24.6835994720459, "global_step": 209611, "epoch": 2525} {"train_loss": -24.4960994720459, "global_step": 209612, "epoch": 2525} {"train_loss": -24.61456871032715, "global_step": 209613, "epoch": 2525} {"train_loss": -24.490951538085938, "global_step": 209614, "epoch": 2525} {"train_loss": -24.93315315246582, "global_step": 209615, "epoch": 2525} {"train_loss": -24.2557373046875, "global_step": 209616, "epoch": 2525} {"train_loss": -24.5637149810791, "global_step": 209617, "epoch": 2525} {"train_loss": -24.401283264160156, "global_step": 209618, "epoch": 2525} {"train_loss": -24.545761108398438, "global_step": 209619, "epoch": 2525} {"train_loss": -23.98451042175293, "global_step": 209620, "epoch": 2525} {"train_loss": -24.33893394470215, "global_step": 209621, "epoch": 2525} {"train_loss": -24.084665298461914, "global_step": 209622, "epoch": 2525} {"train_loss": -24.27980613708496, "global_step": 209623, "epoch": 2525} {"train_loss": -24.79448890686035, "global_step": 209624, "epoch": 2525} {"train_loss": -24.72922706604004, "global_step": 209625, "epoch": 2525} {"train_loss": -24.444232940673828, "global_step": 209626, "epoch": 2525} {"train_loss": -24.70383071899414, "global_step": 209627, "epoch": 2525} {"train_loss": -24.566749572753906, "global_step": 209628, "epoch": 2525} {"train_loss": -24.650144577026367, "global_step": 209629, "epoch": 2525} {"train_loss": -24.184003829956055, "global_step": 209630, "epoch": 2525} {"train_loss": -24.583166122436523, "global_step": 209631, "epoch": 2525} {"train_loss": -24.599334716796875, "global_step": 209632, "epoch": 2525} {"train_loss": -24.208908081054688, "global_step": 209633, "epoch": 2525} {"train_loss": -24.314712524414062, "global_step": 209634, "epoch": 2525} {"train_loss": -24.15038299560547, "global_step": 209635, "epoch": 2525} {"train_loss": -23.878196716308594, "global_step": 209636, "epoch": 2525} {"train_loss": -24.297086715698242, "global_step": 209637, "epoch": 2525} {"train_loss": -24.333040237426758, "global_step": 209638, "epoch": 2525} {"train_loss": -24.40374755859375, "global_step": 209639, "epoch": 2525} {"train_loss": -24.559770584106445, "global_step": 209640, "epoch": 2525} {"train_loss": -23.991540908813477, "global_step": 209641, "epoch": 2525} {"train_loss": -24.37630271911621, "global_step": 209642, "epoch": 2525} {"train_loss": -24.411224365234375, "global_step": 209643, "epoch": 2525} {"train_loss": -24.29298210144043, "global_step": 209644, "epoch": 2525} {"train_loss": -24.430034637451172, "global_step": 209645, "epoch": 2525} {"train_loss": -24.43204689025879, "global_step": 209646, "epoch": 2525} {"train_loss": -24.476200103759766, "global_step": 209647, "epoch": 2525} {"train_loss": -24.54946517944336, "global_step": 209648, "epoch": 2525} {"train_loss": -24.4257869720459, "global_step": 209649, "epoch": 2525} {"train_loss": -24.341297149658203, "global_step": 209650, "epoch": 2525} {"train_loss": -24.62861442565918, "global_step": 209651, "epoch": 2525} {"train_loss": -24.203357696533203, "global_step": 209652, "epoch": 2525} {"train_loss": -24.619970321655273, "global_step": 209653, "epoch": 2525} {"train_loss": -24.156288146972656, "global_step": 209654, "epoch": 2525} {"train_loss": -24.540136337280273, "global_step": 209655, "epoch": 2525} {"train_loss": -24.491140365600586, "global_step": 209656, "epoch": 2525} {"train_loss": -24.36038931881089, "global_step": 209657, "epoch": 2525, "val_loss": 6610849.0} {"train_loss": -24.559972763061523, "global_step": 209658, "epoch": 2526} {"train_loss": -24.373008728027344, "global_step": 209659, "epoch": 2526} {"train_loss": -24.38335609436035, "global_step": 209660, "epoch": 2526} {"train_loss": -24.301677703857422, "global_step": 209661, "epoch": 2526} {"train_loss": -24.44614601135254, "global_step": 209662, "epoch": 2526} {"train_loss": -23.92353630065918, "global_step": 209663, "epoch": 2526} {"train_loss": -24.513280868530273, "global_step": 209664, "epoch": 2526} {"train_loss": -24.587982177734375, "global_step": 209665, "epoch": 2526} {"train_loss": -24.289548873901367, "global_step": 209666, "epoch": 2526} {"train_loss": -24.394580841064453, "global_step": 209667, "epoch": 2526} {"train_loss": -24.476682662963867, "global_step": 209668, "epoch": 2526} {"train_loss": -24.094999313354492, "global_step": 209669, "epoch": 2526} {"train_loss": -24.508329391479492, "global_step": 209670, "epoch": 2526} {"train_loss": -24.498464584350586, "global_step": 209671, "epoch": 2526} {"train_loss": -24.90882682800293, "global_step": 209672, "epoch": 2526} {"train_loss": -24.51715850830078, "global_step": 209673, "epoch": 2526} {"train_loss": -24.460880279541016, "global_step": 209674, "epoch": 2526} {"train_loss": -24.787906646728516, "global_step": 209675, "epoch": 2526} {"train_loss": -24.956226348876953, "global_step": 209676, "epoch": 2526} {"train_loss": -24.464542388916016, "global_step": 209677, "epoch": 2526} {"train_loss": -24.65113639831543, "global_step": 209678, "epoch": 2526} {"train_loss": -24.743337631225586, "global_step": 209679, "epoch": 2526} {"train_loss": -24.450529098510742, "global_step": 209680, "epoch": 2526} {"train_loss": -24.792173385620117, "global_step": 209681, "epoch": 2526} {"train_loss": -25.189794540405273, "global_step": 209682, "epoch": 2526} {"train_loss": -24.670902252197266, "global_step": 209683, "epoch": 2526} {"train_loss": -24.220457077026367, "global_step": 209684, "epoch": 2526} {"train_loss": -24.705331802368164, "global_step": 209685, "epoch": 2526} {"train_loss": -24.15216064453125, "global_step": 209686, "epoch": 2526} {"train_loss": -23.92336654663086, "global_step": 209687, "epoch": 2526} {"train_loss": -24.323026657104492, "global_step": 209688, "epoch": 2526} {"train_loss": -24.6060733795166, "global_step": 209689, "epoch": 2526} {"train_loss": -23.827163696289062, "global_step": 209690, "epoch": 2526} {"train_loss": -24.105627059936523, "global_step": 209691, "epoch": 2526} {"train_loss": -24.669301986694336, "global_step": 209692, "epoch": 2526} {"train_loss": -24.243640899658203, "global_step": 209693, "epoch": 2526} {"train_loss": -24.57676124572754, "global_step": 209694, "epoch": 2526} {"train_loss": -24.744470596313477, "global_step": 209695, "epoch": 2526} {"train_loss": -24.48143768310547, "global_step": 209696, "epoch": 2526} {"train_loss": -24.652793884277344, "global_step": 209697, "epoch": 2526} {"train_loss": -24.022096633911133, "global_step": 209698, "epoch": 2526} {"train_loss": -24.16399383544922, "global_step": 209699, "epoch": 2526} {"train_loss": -24.941919326782227, "global_step": 209700, "epoch": 2526} {"train_loss": -24.16263771057129, "global_step": 209701, "epoch": 2526} {"train_loss": -24.459508895874023, "global_step": 209702, "epoch": 2526} {"train_loss": -24.3975887298584, "global_step": 209703, "epoch": 2526} {"train_loss": -24.721960067749023, "global_step": 209704, "epoch": 2526} {"train_loss": -24.650907516479492, "global_step": 209705, "epoch": 2526} {"train_loss": -24.185791015625, "global_step": 209706, "epoch": 2526} {"train_loss": -23.895078659057617, "global_step": 209707, "epoch": 2526} {"train_loss": -23.781816482543945, "global_step": 209708, "epoch": 2526} {"train_loss": -24.085006713867188, "global_step": 209709, "epoch": 2526} {"train_loss": -24.11764907836914, "global_step": 209710, "epoch": 2526} {"train_loss": -24.107158660888672, "global_step": 209711, "epoch": 2526} {"train_loss": -24.21699333190918, "global_step": 209712, "epoch": 2526} {"train_loss": -24.373497009277344, "global_step": 209713, "epoch": 2526} {"train_loss": -24.363386154174805, "global_step": 209714, "epoch": 2526} {"train_loss": -24.41815185546875, "global_step": 209715, "epoch": 2526} {"train_loss": -24.280948638916016, "global_step": 209716, "epoch": 2526} {"train_loss": -24.134885787963867, "global_step": 209717, "epoch": 2526} {"train_loss": -24.3377742767334, "global_step": 209718, "epoch": 2526} {"train_loss": -24.557199478149414, "global_step": 209719, "epoch": 2526} {"train_loss": -24.27469825744629, "global_step": 209720, "epoch": 2526} {"train_loss": -24.42059898376465, "global_step": 209721, "epoch": 2526} {"train_loss": -24.275617599487305, "global_step": 209722, "epoch": 2526} {"train_loss": -24.34419059753418, "global_step": 209723, "epoch": 2526} {"train_loss": -24.228836059570312, "global_step": 209724, "epoch": 2526} {"train_loss": -24.3132266998291, "global_step": 209725, "epoch": 2526} {"train_loss": -24.209623336791992, "global_step": 209726, "epoch": 2526} {"train_loss": -24.32594871520996, "global_step": 209727, "epoch": 2526} {"train_loss": -24.631332397460938, "global_step": 209728, "epoch": 2526} {"train_loss": -24.243183135986328, "global_step": 209729, "epoch": 2526} {"train_loss": -24.688945770263672, "global_step": 209730, "epoch": 2526} {"train_loss": -24.703115463256836, "global_step": 209731, "epoch": 2526} {"train_loss": -24.611169815063477, "global_step": 209732, "epoch": 2526} {"train_loss": -24.631391525268555, "global_step": 209733, "epoch": 2526} {"train_loss": -24.7908935546875, "global_step": 209734, "epoch": 2526} {"train_loss": -24.533065795898438, "global_step": 209735, "epoch": 2526} {"train_loss": -24.921613693237305, "global_step": 209736, "epoch": 2526} {"train_loss": -24.757909774780273, "global_step": 209737, "epoch": 2526} {"train_loss": -23.854345321655273, "global_step": 209738, "epoch": 2526} {"train_loss": -24.232154846191406, "global_step": 209739, "epoch": 2526} {"train_loss": -24.423962535628352, "global_step": 209740, "epoch": 2526, "val_loss": 6694775.0} {"train_loss": -23.540390014648438, "global_step": 209741, "epoch": 2527} {"train_loss": -23.82860565185547, "global_step": 209742, "epoch": 2527} {"train_loss": -24.12525749206543, "global_step": 209743, "epoch": 2527} {"train_loss": -24.26067352294922, "global_step": 209744, "epoch": 2527} {"train_loss": -24.348615646362305, "global_step": 209745, "epoch": 2527} {"train_loss": -24.0474910736084, "global_step": 209746, "epoch": 2527} {"train_loss": -24.50663185119629, "global_step": 209747, "epoch": 2527} {"train_loss": -24.32234001159668, "global_step": 209748, "epoch": 2527} {"train_loss": -24.334714889526367, "global_step": 209749, "epoch": 2527} {"train_loss": -24.00712013244629, "global_step": 209750, "epoch": 2527} {"train_loss": -24.032508850097656, "global_step": 209751, "epoch": 2527} {"train_loss": -24.458515167236328, "global_step": 209752, "epoch": 2527} {"train_loss": -24.086740493774414, "global_step": 209753, "epoch": 2527} {"train_loss": -24.142255783081055, "global_step": 209754, "epoch": 2527} {"train_loss": -24.28649139404297, "global_step": 209755, "epoch": 2527} {"train_loss": -24.2602481842041, "global_step": 209756, "epoch": 2527} {"train_loss": -24.223310470581055, "global_step": 209757, "epoch": 2527} {"train_loss": -24.331918716430664, "global_step": 209758, "epoch": 2527} {"train_loss": -24.350332260131836, "global_step": 209759, "epoch": 2527} {"train_loss": -24.577863693237305, "global_step": 209760, "epoch": 2527} {"train_loss": -24.30570411682129, "global_step": 209761, "epoch": 2527} {"train_loss": -24.0758113861084, "global_step": 209762, "epoch": 2527} {"train_loss": -24.00166893005371, "global_step": 209763, "epoch": 2527} {"train_loss": -24.38896942138672, "global_step": 209764, "epoch": 2527} {"train_loss": -24.25260353088379, "global_step": 209765, "epoch": 2527} {"train_loss": -24.14765167236328, "global_step": 209766, "epoch": 2527} {"train_loss": -24.392568588256836, "global_step": 209767, "epoch": 2527} {"train_loss": -24.294458389282227, "global_step": 209768, "epoch": 2527} {"train_loss": -24.235157012939453, "global_step": 209769, "epoch": 2527} {"train_loss": -24.154579162597656, "global_step": 209770, "epoch": 2527} {"train_loss": -24.28354835510254, "global_step": 209771, "epoch": 2527} {"train_loss": -24.64510726928711, "global_step": 209772, "epoch": 2527} {"train_loss": -24.106794357299805, "global_step": 209773, "epoch": 2527} {"train_loss": -24.392932891845703, "global_step": 209774, "epoch": 2527} {"train_loss": -24.35659408569336, "global_step": 209775, "epoch": 2527} {"train_loss": -24.49651527404785, "global_step": 209776, "epoch": 2527} {"train_loss": -24.742216110229492, "global_step": 209777, "epoch": 2527} {"train_loss": -24.327608108520508, "global_step": 209778, "epoch": 2527} {"train_loss": -24.170120239257812, "global_step": 209779, "epoch": 2527} {"train_loss": -24.22616958618164, "global_step": 209780, "epoch": 2527} {"train_loss": -24.533899307250977, "global_step": 209781, "epoch": 2527} {"train_loss": -24.128910064697266, "global_step": 209782, "epoch": 2527} {"train_loss": -24.417043685913086, "global_step": 209783, "epoch": 2527} {"train_loss": -24.201955795288086, "global_step": 209784, "epoch": 2527} {"train_loss": -24.531274795532227, "global_step": 209785, "epoch": 2527} {"train_loss": -24.22085952758789, "global_step": 209786, "epoch": 2527} {"train_loss": -24.17359733581543, "global_step": 209787, "epoch": 2527} {"train_loss": -24.42505645751953, "global_step": 209788, "epoch": 2527} {"train_loss": -24.527822494506836, "global_step": 209789, "epoch": 2527} {"train_loss": -24.065547943115234, "global_step": 209790, "epoch": 2527} {"train_loss": -24.127214431762695, "global_step": 209791, "epoch": 2527} {"train_loss": -24.27054214477539, "global_step": 209792, "epoch": 2527} {"train_loss": -24.78421974182129, "global_step": 209793, "epoch": 2527} {"train_loss": -24.6597957611084, "global_step": 209794, "epoch": 2527} {"train_loss": -24.436384201049805, "global_step": 209795, "epoch": 2527} {"train_loss": -24.443655014038086, "global_step": 209796, "epoch": 2527} {"train_loss": -24.281042098999023, "global_step": 209797, "epoch": 2527} {"train_loss": -24.4638614654541, "global_step": 209798, "epoch": 2527} {"train_loss": -24.596426010131836, "global_step": 209799, "epoch": 2527} {"train_loss": -24.404783248901367, "global_step": 209800, "epoch": 2527} {"train_loss": -24.844186782836914, "global_step": 209801, "epoch": 2527} {"train_loss": -24.379985809326172, "global_step": 209802, "epoch": 2527} {"train_loss": -24.57299041748047, "global_step": 209803, "epoch": 2527} {"train_loss": -24.389663696289062, "global_step": 209804, "epoch": 2527} {"train_loss": -24.61868667602539, "global_step": 209805, "epoch": 2527} {"train_loss": -24.429908752441406, "global_step": 209806, "epoch": 2527} {"train_loss": -24.710168838500977, "global_step": 209807, "epoch": 2527} {"train_loss": -24.350244522094727, "global_step": 209808, "epoch": 2527} {"train_loss": -24.831806182861328, "global_step": 209809, "epoch": 2527} {"train_loss": -24.33333396911621, "global_step": 209810, "epoch": 2527} {"train_loss": -24.474498748779297, "global_step": 209811, "epoch": 2527} {"train_loss": -24.24067497253418, "global_step": 209812, "epoch": 2527} {"train_loss": -24.815677642822266, "global_step": 209813, "epoch": 2527} {"train_loss": -23.752416610717773, "global_step": 209814, "epoch": 2527} {"train_loss": -24.05886459350586, "global_step": 209815, "epoch": 2527} {"train_loss": -24.164236068725586, "global_step": 209816, "epoch": 2527} {"train_loss": -24.481252670288086, "global_step": 209817, "epoch": 2527} {"train_loss": -24.587299346923828, "global_step": 209818, "epoch": 2527} {"train_loss": -24.29921531677246, "global_step": 209819, "epoch": 2527} {"train_loss": -24.778493881225586, "global_step": 209820, "epoch": 2527} {"train_loss": -24.457698822021484, "global_step": 209821, "epoch": 2527} {"train_loss": -24.70587158203125, "global_step": 209822, "epoch": 2527} {"train_loss": -24.334939887724726, "global_step": 209823, "epoch": 2527, "val_loss": 6649639.0} {"train_loss": -23.48486328125, "global_step": 209824, "epoch": 2528} {"train_loss": -23.760263442993164, "global_step": 209825, "epoch": 2528} {"train_loss": -24.250043869018555, "global_step": 209826, "epoch": 2528} {"train_loss": -23.79218101501465, "global_step": 209827, "epoch": 2528} {"train_loss": -23.515844345092773, "global_step": 209828, "epoch": 2528} {"train_loss": -24.23682975769043, "global_step": 209829, "epoch": 2528} {"train_loss": -24.00550651550293, "global_step": 209830, "epoch": 2528} {"train_loss": -24.234411239624023, "global_step": 209831, "epoch": 2528} {"train_loss": -24.184154510498047, "global_step": 209832, "epoch": 2528} {"train_loss": -23.756391525268555, "global_step": 209833, "epoch": 2528} {"train_loss": -23.958974838256836, "global_step": 209834, "epoch": 2528} {"train_loss": -23.91810417175293, "global_step": 209835, "epoch": 2528} {"train_loss": -24.348569869995117, "global_step": 209836, "epoch": 2528} {"train_loss": -24.22224998474121, "global_step": 209837, "epoch": 2528} {"train_loss": -24.20761489868164, "global_step": 209838, "epoch": 2528} {"train_loss": -24.19172477722168, "global_step": 209839, "epoch": 2528} {"train_loss": -24.526294708251953, "global_step": 209840, "epoch": 2528} {"train_loss": -24.26219940185547, "global_step": 209841, "epoch": 2528} {"train_loss": -24.128902435302734, "global_step": 209842, "epoch": 2528} {"train_loss": -24.447071075439453, "global_step": 209843, "epoch": 2528} {"train_loss": -24.38226890563965, "global_step": 209844, "epoch": 2528} {"train_loss": -24.4852294921875, "global_step": 209845, "epoch": 2528} {"train_loss": -24.296157836914062, "global_step": 209846, "epoch": 2528} {"train_loss": -24.54341697692871, "global_step": 209847, "epoch": 2528} {"train_loss": -24.219417572021484, "global_step": 209848, "epoch": 2528} {"train_loss": -24.52886390686035, "global_step": 209849, "epoch": 2528} {"train_loss": -24.536487579345703, "global_step": 209850, "epoch": 2528} {"train_loss": -24.66932487487793, "global_step": 209851, "epoch": 2528} {"train_loss": -24.79807472229004, "global_step": 209852, "epoch": 2528} {"train_loss": -24.546964645385742, "global_step": 209853, "epoch": 2528} {"train_loss": -24.832792282104492, "global_step": 209854, "epoch": 2528} {"train_loss": -24.55560874938965, "global_step": 209855, "epoch": 2528} {"train_loss": -24.405099868774414, "global_step": 209856, "epoch": 2528} {"train_loss": -24.681354522705078, "global_step": 209857, "epoch": 2528} {"train_loss": -24.812484741210938, "global_step": 209858, "epoch": 2528} {"train_loss": -24.12492561340332, "global_step": 209859, "epoch": 2528} {"train_loss": -24.58668327331543, "global_step": 209860, "epoch": 2528} {"train_loss": -24.304065704345703, "global_step": 209861, "epoch": 2528} {"train_loss": -24.27882957458496, "global_step": 209862, "epoch": 2528} {"train_loss": -24.266687393188477, "global_step": 209863, "epoch": 2528} {"train_loss": -24.71187400817871, "global_step": 209864, "epoch": 2528} {"train_loss": -24.3143253326416, "global_step": 209865, "epoch": 2528} {"train_loss": -24.184919357299805, "global_step": 209866, "epoch": 2528} {"train_loss": -24.228424072265625, "global_step": 209867, "epoch": 2528} {"train_loss": -24.599781036376953, "global_step": 209868, "epoch": 2528} {"train_loss": -24.131845474243164, "global_step": 209869, "epoch": 2528} {"train_loss": -24.325925827026367, "global_step": 209870, "epoch": 2528} {"train_loss": -24.477638244628906, "global_step": 209871, "epoch": 2528} {"train_loss": -24.3143367767334, "global_step": 209872, "epoch": 2528} {"train_loss": -24.050546646118164, "global_step": 209873, "epoch": 2528} {"train_loss": -24.532772064208984, "global_step": 209874, "epoch": 2528} {"train_loss": -24.47821044921875, "global_step": 209875, "epoch": 2528} {"train_loss": -24.567459106445312, "global_step": 209876, "epoch": 2528} {"train_loss": -24.25110626220703, "global_step": 209877, "epoch": 2528} {"train_loss": -24.559534072875977, "global_step": 209878, "epoch": 2528} {"train_loss": -24.472536087036133, "global_step": 209879, "epoch": 2528} {"train_loss": -24.259244918823242, "global_step": 209880, "epoch": 2528} {"train_loss": -24.17324447631836, "global_step": 209881, "epoch": 2528} {"train_loss": -24.301015853881836, "global_step": 209882, "epoch": 2528} {"train_loss": -24.443532943725586, "global_step": 209883, "epoch": 2528} {"train_loss": -24.46034812927246, "global_step": 209884, "epoch": 2528} {"train_loss": -24.7926082611084, "global_step": 209885, "epoch": 2528} {"train_loss": -24.550222396850586, "global_step": 209886, "epoch": 2528} {"train_loss": -24.71516990661621, "global_step": 209887, "epoch": 2528} {"train_loss": -24.561935424804688, "global_step": 209888, "epoch": 2528} {"train_loss": -24.844785690307617, "global_step": 209889, "epoch": 2528} {"train_loss": -24.809772491455078, "global_step": 209890, "epoch": 2528} {"train_loss": -24.5153751373291, "global_step": 209891, "epoch": 2528} {"train_loss": -24.422182083129883, "global_step": 209892, "epoch": 2528} {"train_loss": -24.25771141052246, "global_step": 209893, "epoch": 2528} {"train_loss": -24.447965621948242, "global_step": 209894, "epoch": 2528} {"train_loss": -24.459060668945312, "global_step": 209895, "epoch": 2528} {"train_loss": -24.360807418823242, "global_step": 209896, "epoch": 2528} {"train_loss": -24.6248779296875, "global_step": 209897, "epoch": 2528} {"train_loss": -24.86704444885254, "global_step": 209898, "epoch": 2528} {"train_loss": -24.226428985595703, "global_step": 209899, "epoch": 2528} {"train_loss": -24.604061126708984, "global_step": 209900, "epoch": 2528} {"train_loss": -24.436321258544922, "global_step": 209901, "epoch": 2528} {"train_loss": -24.621017456054688, "global_step": 209902, "epoch": 2528} {"train_loss": -24.472537994384766, "global_step": 209903, "epoch": 2528} {"train_loss": -24.49675941467285, "global_step": 209904, "epoch": 2528} {"train_loss": -24.320880889892578, "global_step": 209905, "epoch": 2528} {"train_loss": -24.389534134462654, "global_step": 209906, "epoch": 2528, "val_loss": 6602749.5} {"train_loss": -23.572614669799805, "global_step": 209907, "epoch": 2529} {"train_loss": -23.109678268432617, "global_step": 209908, "epoch": 2529} {"train_loss": -22.89568519592285, "global_step": 209909, "epoch": 2529} {"train_loss": -24.064178466796875, "global_step": 209910, "epoch": 2529} {"train_loss": -23.4893856048584, "global_step": 209911, "epoch": 2529} {"train_loss": -23.54443359375, "global_step": 209912, "epoch": 2529} {"train_loss": -23.99012565612793, "global_step": 209913, "epoch": 2529} {"train_loss": -23.496339797973633, "global_step": 209914, "epoch": 2529} {"train_loss": -24.039670944213867, "global_step": 209915, "epoch": 2529} {"train_loss": -23.82254409790039, "global_step": 209916, "epoch": 2529} {"train_loss": -23.882648468017578, "global_step": 209917, "epoch": 2529} {"train_loss": -23.74815559387207, "global_step": 209918, "epoch": 2529} {"train_loss": -24.286306381225586, "global_step": 209919, "epoch": 2529} {"train_loss": -23.82827377319336, "global_step": 209920, "epoch": 2529} {"train_loss": -24.17274284362793, "global_step": 209921, "epoch": 2529} {"train_loss": -23.635717391967773, "global_step": 209922, "epoch": 2529} {"train_loss": -23.9937744140625, "global_step": 209923, "epoch": 2529} {"train_loss": -23.882450103759766, "global_step": 209924, "epoch": 2529} {"train_loss": -23.870573043823242, "global_step": 209925, "epoch": 2529} {"train_loss": -24.014665603637695, "global_step": 209926, "epoch": 2529} {"train_loss": -24.231958389282227, "global_step": 209927, "epoch": 2529} {"train_loss": -24.061986923217773, "global_step": 209928, "epoch": 2529} {"train_loss": -24.499792098999023, "global_step": 209929, "epoch": 2529} {"train_loss": -24.057687759399414, "global_step": 209930, "epoch": 2529} {"train_loss": -24.128625869750977, "global_step": 209931, "epoch": 2529} {"train_loss": -24.068267822265625, "global_step": 209932, "epoch": 2529} {"train_loss": -24.24806022644043, "global_step": 209933, "epoch": 2529} {"train_loss": -24.893251419067383, "global_step": 209934, "epoch": 2529} {"train_loss": -24.34510612487793, "global_step": 209935, "epoch": 2529} {"train_loss": -24.4725341796875, "global_step": 209936, "epoch": 2529} {"train_loss": -24.178329467773438, "global_step": 209937, "epoch": 2529} {"train_loss": -24.727407455444336, "global_step": 209938, "epoch": 2529} {"train_loss": -24.251699447631836, "global_step": 209939, "epoch": 2529} {"train_loss": -24.679218292236328, "global_step": 209940, "epoch": 2529} {"train_loss": -24.30728530883789, "global_step": 209941, "epoch": 2529} {"train_loss": -24.838924407958984, "global_step": 209942, "epoch": 2529} {"train_loss": -24.430723190307617, "global_step": 209943, "epoch": 2529} {"train_loss": -24.38504981994629, "global_step": 209944, "epoch": 2529} {"train_loss": -24.8704776763916, "global_step": 209945, "epoch": 2529} {"train_loss": -24.599164962768555, "global_step": 209946, "epoch": 2529} {"train_loss": -24.459381103515625, "global_step": 209947, "epoch": 2529} {"train_loss": -24.819379806518555, "global_step": 209948, "epoch": 2529} {"train_loss": -24.413999557495117, "global_step": 209949, "epoch": 2529} {"train_loss": -24.79839515686035, "global_step": 209950, "epoch": 2529} {"train_loss": -24.663267135620117, "global_step": 209951, "epoch": 2529} {"train_loss": -24.71405029296875, "global_step": 209952, "epoch": 2529} {"train_loss": -24.234182357788086, "global_step": 209953, "epoch": 2529} {"train_loss": -24.820384979248047, "global_step": 209954, "epoch": 2529} {"train_loss": -24.74488639831543, "global_step": 209955, "epoch": 2529} {"train_loss": -24.60892105102539, "global_step": 209956, "epoch": 2529} {"train_loss": -24.405231475830078, "global_step": 209957, "epoch": 2529} {"train_loss": -24.513425827026367, "global_step": 209958, "epoch": 2529} {"train_loss": -23.910526275634766, "global_step": 209959, "epoch": 2529} {"train_loss": -24.560754776000977, "global_step": 209960, "epoch": 2529} {"train_loss": -24.112545013427734, "global_step": 209961, "epoch": 2529} {"train_loss": -24.4031982421875, "global_step": 209962, "epoch": 2529} {"train_loss": -24.504316329956055, "global_step": 209963, "epoch": 2529} {"train_loss": -24.292827606201172, "global_step": 209964, "epoch": 2529} {"train_loss": -24.450973510742188, "global_step": 209965, "epoch": 2529} {"train_loss": -24.41337013244629, "global_step": 209966, "epoch": 2529} {"train_loss": -24.598806381225586, "global_step": 209967, "epoch": 2529} {"train_loss": -24.24920654296875, "global_step": 209968, "epoch": 2529} {"train_loss": -24.215999603271484, "global_step": 209969, "epoch": 2529} {"train_loss": -24.044748306274414, "global_step": 209970, "epoch": 2529} {"train_loss": -24.41646385192871, "global_step": 209971, "epoch": 2529} {"train_loss": -24.514272689819336, "global_step": 209972, "epoch": 2529} {"train_loss": -24.03937339782715, "global_step": 209973, "epoch": 2529} {"train_loss": -24.2125186920166, "global_step": 209974, "epoch": 2529} {"train_loss": -24.57073211669922, "global_step": 209975, "epoch": 2529} {"train_loss": -24.564966201782227, "global_step": 209976, "epoch": 2529} {"train_loss": -24.38772201538086, "global_step": 209977, "epoch": 2529} {"train_loss": -24.380720138549805, "global_step": 209978, "epoch": 2529} {"train_loss": -24.156253814697266, "global_step": 209979, "epoch": 2529} {"train_loss": -24.08962059020996, "global_step": 209980, "epoch": 2529} {"train_loss": -24.436269760131836, "global_step": 209981, "epoch": 2529} {"train_loss": -23.938220977783203, "global_step": 209982, "epoch": 2529} {"train_loss": -24.557621002197266, "global_step": 209983, "epoch": 2529} {"train_loss": -24.438173294067383, "global_step": 209984, "epoch": 2529} {"train_loss": -24.6136531829834, "global_step": 209985, "epoch": 2529} {"train_loss": -24.4857120513916, "global_step": 209986, "epoch": 2529} {"train_loss": -24.357786178588867, "global_step": 209987, "epoch": 2529} {"train_loss": -24.405176162719727, "global_step": 209988, "epoch": 2529} {"train_loss": -24.256896788815418, "global_step": 209989, "epoch": 2529, "val_loss": 6802454.5} {"train_loss": -23.8542537689209, "global_step": 209990, "epoch": 2530} {"train_loss": -23.864530563354492, "global_step": 209991, "epoch": 2530} {"train_loss": -23.8011531829834, "global_step": 209992, "epoch": 2530} {"train_loss": -24.148038864135742, "global_step": 209993, "epoch": 2530} {"train_loss": -24.171865463256836, "global_step": 209994, "epoch": 2530} {"train_loss": -24.243146896362305, "global_step": 209995, "epoch": 2530} {"train_loss": -24.222150802612305, "global_step": 209996, "epoch": 2530} {"train_loss": -23.972675323486328, "global_step": 209997, "epoch": 2530} {"train_loss": -24.105545043945312, "global_step": 209998, "epoch": 2530} {"train_loss": -24.27787208557129, "global_step": 209999, "epoch": 2530} {"train_loss": -23.77516746520996, "global_step": 210000, "epoch": 2530} {"train_loss": -24.25571632385254, "global_step": 210001, "epoch": 2530} {"train_loss": -23.969825744628906, "global_step": 210002, "epoch": 2530} {"train_loss": -24.105030059814453, "global_step": 210003, "epoch": 2530} {"train_loss": -24.307687759399414, "global_step": 210004, "epoch": 2530} {"train_loss": -24.135095596313477, "global_step": 210005, "epoch": 2530} {"train_loss": -24.6776123046875, "global_step": 210006, "epoch": 2530} {"train_loss": -24.520517349243164, "global_step": 210007, "epoch": 2530} {"train_loss": -24.558162689208984, "global_step": 210008, "epoch": 2530} {"train_loss": -24.649322509765625, "global_step": 210009, "epoch": 2530} {"train_loss": -24.6802978515625, "global_step": 210010, "epoch": 2530} {"train_loss": -24.398042678833008, "global_step": 210011, "epoch": 2530} {"train_loss": -24.726577758789062, "global_step": 210012, "epoch": 2530} {"train_loss": -24.547903060913086, "global_step": 210013, "epoch": 2530} {"train_loss": -24.230039596557617, "global_step": 210014, "epoch": 2530} {"train_loss": -24.494842529296875, "global_step": 210015, "epoch": 2530} {"train_loss": -24.48739242553711, "global_step": 210016, "epoch": 2530} {"train_loss": -24.089677810668945, "global_step": 210017, "epoch": 2530} {"train_loss": -24.248653411865234, "global_step": 210018, "epoch": 2530} {"train_loss": -24.34232521057129, "global_step": 210019, "epoch": 2530} {"train_loss": -24.431604385375977, "global_step": 210020, "epoch": 2530} {"train_loss": -24.82944107055664, "global_step": 210021, "epoch": 2530} {"train_loss": -24.21742057800293, "global_step": 210022, "epoch": 2530} {"train_loss": -24.755037307739258, "global_step": 210023, "epoch": 2530} {"train_loss": -24.667673110961914, "global_step": 210024, "epoch": 2530} {"train_loss": -24.885358810424805, "global_step": 210025, "epoch": 2530} {"train_loss": -24.61185073852539, "global_step": 210026, "epoch": 2530} {"train_loss": -24.62465476989746, "global_step": 210027, "epoch": 2530} {"train_loss": -24.683120727539062, "global_step": 210028, "epoch": 2530} {"train_loss": -24.44504165649414, "global_step": 210029, "epoch": 2530} {"train_loss": -24.412090301513672, "global_step": 210030, "epoch": 2530} {"train_loss": -24.32114028930664, "global_step": 210031, "epoch": 2530} {"train_loss": -24.60079002380371, "global_step": 210032, "epoch": 2530} {"train_loss": -24.497861862182617, "global_step": 210033, "epoch": 2530} {"train_loss": -24.536941528320312, "global_step": 210034, "epoch": 2530} {"train_loss": -24.561323165893555, "global_step": 210035, "epoch": 2530} {"train_loss": -24.793424606323242, "global_step": 210036, "epoch": 2530} {"train_loss": -24.27220916748047, "global_step": 210037, "epoch": 2530} {"train_loss": -24.432680130004883, "global_step": 210038, "epoch": 2530} {"train_loss": -24.232563018798828, "global_step": 210039, "epoch": 2530} {"train_loss": -24.60206413269043, "global_step": 210040, "epoch": 2530} {"train_loss": -24.424030303955078, "global_step": 210041, "epoch": 2530} {"train_loss": -24.32105827331543, "global_step": 210042, "epoch": 2530} {"train_loss": -24.532289505004883, "global_step": 210043, "epoch": 2530} {"train_loss": -24.56565284729004, "global_step": 210044, "epoch": 2530} {"train_loss": -24.42460060119629, "global_step": 210045, "epoch": 2530} {"train_loss": -24.612627029418945, "global_step": 210046, "epoch": 2530} {"train_loss": -24.913320541381836, "global_step": 210047, "epoch": 2530} {"train_loss": -24.252151489257812, "global_step": 210048, "epoch": 2530} {"train_loss": -24.428327560424805, "global_step": 210049, "epoch": 2530} {"train_loss": -24.35523223876953, "global_step": 210050, "epoch": 2530} {"train_loss": -24.510828018188477, "global_step": 210051, "epoch": 2530} {"train_loss": -24.219526290893555, "global_step": 210052, "epoch": 2530} {"train_loss": -24.601083755493164, "global_step": 210053, "epoch": 2530} {"train_loss": -24.372568130493164, "global_step": 210054, "epoch": 2530} {"train_loss": -24.680295944213867, "global_step": 210055, "epoch": 2530} {"train_loss": -24.546688079833984, "global_step": 210056, "epoch": 2530} {"train_loss": -24.46675682067871, "global_step": 210057, "epoch": 2530} {"train_loss": -24.558353424072266, "global_step": 210058, "epoch": 2530} {"train_loss": -24.27627182006836, "global_step": 210059, "epoch": 2530} {"train_loss": -24.540151596069336, "global_step": 210060, "epoch": 2530} {"train_loss": -24.256439208984375, "global_step": 210061, "epoch": 2530} {"train_loss": -24.55512809753418, "global_step": 210062, "epoch": 2530} {"train_loss": -24.589298248291016, "global_step": 210063, "epoch": 2530} {"train_loss": -24.484323501586914, "global_step": 210064, "epoch": 2530} {"train_loss": -23.9339542388916, "global_step": 210065, "epoch": 2530} {"train_loss": -24.515199661254883, "global_step": 210066, "epoch": 2530} {"train_loss": -24.366376876831055, "global_step": 210067, "epoch": 2530} {"train_loss": -24.23537254333496, "global_step": 210068, "epoch": 2530} {"train_loss": -24.326358795166016, "global_step": 210069, "epoch": 2530} {"train_loss": -24.309423446655273, "global_step": 210070, "epoch": 2530} {"train_loss": -24.7043514251709, "global_step": 210071, "epoch": 2530} {"train_loss": -24.403507393526745, "global_step": 210072, "epoch": 2530, "val_loss": 6709104.0} {"train_loss": -23.702816009521484, "global_step": 210073, "epoch": 2531} {"train_loss": -24.350492477416992, "global_step": 210074, "epoch": 2531} {"train_loss": -23.66636848449707, "global_step": 210075, "epoch": 2531} {"train_loss": -24.26139259338379, "global_step": 210076, "epoch": 2531} {"train_loss": -24.409025192260742, "global_step": 210077, "epoch": 2531} {"train_loss": -24.281827926635742, "global_step": 210078, "epoch": 2531} {"train_loss": -24.18674087524414, "global_step": 210079, "epoch": 2531} {"train_loss": -24.457590103149414, "global_step": 210080, "epoch": 2531} {"train_loss": -24.491727828979492, "global_step": 210081, "epoch": 2531} {"train_loss": -24.62763786315918, "global_step": 210082, "epoch": 2531} {"train_loss": -24.047679901123047, "global_step": 210083, "epoch": 2531} {"train_loss": -24.325855255126953, "global_step": 210084, "epoch": 2531} {"train_loss": -24.581974029541016, "global_step": 210085, "epoch": 2531} {"train_loss": -24.322284698486328, "global_step": 210086, "epoch": 2531} {"train_loss": -24.82046890258789, "global_step": 210087, "epoch": 2531} {"train_loss": -24.26799774169922, "global_step": 210088, "epoch": 2531} {"train_loss": -24.935461044311523, "global_step": 210089, "epoch": 2531} {"train_loss": -24.454605102539062, "global_step": 210090, "epoch": 2531} {"train_loss": -24.83497428894043, "global_step": 210091, "epoch": 2531} {"train_loss": -25.040205001831055, "global_step": 210092, "epoch": 2531} {"train_loss": -24.7520809173584, "global_step": 210093, "epoch": 2531} {"train_loss": -24.411361694335938, "global_step": 210094, "epoch": 2531} {"train_loss": -24.292346954345703, "global_step": 210095, "epoch": 2531} {"train_loss": -24.177993774414062, "global_step": 210096, "epoch": 2531} {"train_loss": -24.523380279541016, "global_step": 210097, "epoch": 2531} {"train_loss": -24.04471206665039, "global_step": 210098, "epoch": 2531} {"train_loss": -24.166505813598633, "global_step": 210099, "epoch": 2531} {"train_loss": -24.748620986938477, "global_step": 210100, "epoch": 2531} {"train_loss": -24.459470748901367, "global_step": 210101, "epoch": 2531} {"train_loss": -23.992164611816406, "global_step": 210102, "epoch": 2531} {"train_loss": -24.081912994384766, "global_step": 210103, "epoch": 2531} {"train_loss": -24.145681381225586, "global_step": 210104, "epoch": 2531} {"train_loss": -24.289772033691406, "global_step": 210105, "epoch": 2531} {"train_loss": -24.883438110351562, "global_step": 210106, "epoch": 2531} {"train_loss": -24.212331771850586, "global_step": 210107, "epoch": 2531} {"train_loss": -24.343826293945312, "global_step": 210108, "epoch": 2531} {"train_loss": -24.3653621673584, "global_step": 210109, "epoch": 2531} {"train_loss": -24.19687843322754, "global_step": 210110, "epoch": 2531} {"train_loss": -24.26914405822754, "global_step": 210111, "epoch": 2531} {"train_loss": -24.464834213256836, "global_step": 210112, "epoch": 2531} {"train_loss": -24.5609130859375, "global_step": 210113, "epoch": 2531} {"train_loss": -24.084470748901367, "global_step": 210114, "epoch": 2531} {"train_loss": -24.430681228637695, "global_step": 210115, "epoch": 2531} {"train_loss": -24.572547912597656, "global_step": 210116, "epoch": 2531} {"train_loss": -24.106565475463867, "global_step": 210117, "epoch": 2531} {"train_loss": -24.234338760375977, "global_step": 210118, "epoch": 2531} {"train_loss": -24.148962020874023, "global_step": 210119, "epoch": 2531} {"train_loss": -24.88937759399414, "global_step": 210120, "epoch": 2531} {"train_loss": -24.49853515625, "global_step": 210121, "epoch": 2531} {"train_loss": -24.623218536376953, "global_step": 210122, "epoch": 2531} {"train_loss": -24.3140869140625, "global_step": 210123, "epoch": 2531} {"train_loss": -24.512052536010742, "global_step": 210124, "epoch": 2531} {"train_loss": -24.257343292236328, "global_step": 210125, "epoch": 2531} {"train_loss": -24.526472091674805, "global_step": 210126, "epoch": 2531} {"train_loss": -24.608991622924805, "global_step": 210127, "epoch": 2531} {"train_loss": -24.452646255493164, "global_step": 210128, "epoch": 2531} {"train_loss": -24.595678329467773, "global_step": 210129, "epoch": 2531} {"train_loss": -24.66270637512207, "global_step": 210130, "epoch": 2531} {"train_loss": -24.36021614074707, "global_step": 210131, "epoch": 2531} {"train_loss": -24.823028564453125, "global_step": 210132, "epoch": 2531} {"train_loss": -24.616029739379883, "global_step": 210133, "epoch": 2531} {"train_loss": -24.41416358947754, "global_step": 210134, "epoch": 2531} {"train_loss": -24.74376106262207, "global_step": 210135, "epoch": 2531} {"train_loss": -24.716747283935547, "global_step": 210136, "epoch": 2531} {"train_loss": -24.587661743164062, "global_step": 210137, "epoch": 2531} {"train_loss": -24.581613540649414, "global_step": 210138, "epoch": 2531} {"train_loss": -24.532512664794922, "global_step": 210139, "epoch": 2531} {"train_loss": -24.54838752746582, "global_step": 210140, "epoch": 2531} {"train_loss": -24.374168395996094, "global_step": 210141, "epoch": 2531} {"train_loss": -24.603195190429688, "global_step": 210142, "epoch": 2531} {"train_loss": -24.665307998657227, "global_step": 210143, "epoch": 2531} {"train_loss": -24.4758243560791, "global_step": 210144, "epoch": 2531} {"train_loss": -24.56423568725586, "global_step": 210145, "epoch": 2531} {"train_loss": -24.67104148864746, "global_step": 210146, "epoch": 2531} {"train_loss": -24.454832077026367, "global_step": 210147, "epoch": 2531} {"train_loss": -24.792219161987305, "global_step": 210148, "epoch": 2531} {"train_loss": -24.299163818359375, "global_step": 210149, "epoch": 2531} {"train_loss": -24.75352668762207, "global_step": 210150, "epoch": 2531} {"train_loss": -24.274200439453125, "global_step": 210151, "epoch": 2531} {"train_loss": -24.39944839477539, "global_step": 210152, "epoch": 2531} {"train_loss": -24.567136764526367, "global_step": 210153, "epoch": 2531} {"train_loss": -24.529020309448242, "global_step": 210154, "epoch": 2531} {"train_loss": -24.44922435714538, "global_step": 210155, "epoch": 2531, "val_loss": 6619229.0} {"train_loss": -24.208688735961914, "global_step": 210156, "epoch": 2532} {"train_loss": -23.67828941345215, "global_step": 210157, "epoch": 2532} {"train_loss": -23.64776611328125, "global_step": 210158, "epoch": 2532} {"train_loss": -23.857046127319336, "global_step": 210159, "epoch": 2532} {"train_loss": -24.327556610107422, "global_step": 210160, "epoch": 2532} {"train_loss": -23.807567596435547, "global_step": 210161, "epoch": 2532} {"train_loss": -24.306114196777344, "global_step": 210162, "epoch": 2532} {"train_loss": -24.345571517944336, "global_step": 210163, "epoch": 2532} {"train_loss": -24.1324405670166, "global_step": 210164, "epoch": 2532} {"train_loss": -23.98225975036621, "global_step": 210165, "epoch": 2532} {"train_loss": -24.141530990600586, "global_step": 210166, "epoch": 2532} {"train_loss": -23.997343063354492, "global_step": 210167, "epoch": 2532} {"train_loss": -24.0336971282959, "global_step": 210168, "epoch": 2532} {"train_loss": -24.31796646118164, "global_step": 210169, "epoch": 2532} {"train_loss": -24.223087310791016, "global_step": 210170, "epoch": 2532} {"train_loss": -23.95937156677246, "global_step": 210171, "epoch": 2532} {"train_loss": -24.155424118041992, "global_step": 210172, "epoch": 2532} {"train_loss": -24.497411727905273, "global_step": 210173, "epoch": 2532} {"train_loss": -24.273456573486328, "global_step": 210174, "epoch": 2532} {"train_loss": -24.15167808532715, "global_step": 210175, "epoch": 2532} {"train_loss": -24.551321029663086, "global_step": 210176, "epoch": 2532} {"train_loss": -24.487356185913086, "global_step": 210177, "epoch": 2532} {"train_loss": -24.504837036132812, "global_step": 210178, "epoch": 2532} {"train_loss": -24.32985496520996, "global_step": 210179, "epoch": 2532} {"train_loss": -24.28314971923828, "global_step": 210180, "epoch": 2532} {"train_loss": -24.66196060180664, "global_step": 210181, "epoch": 2532} {"train_loss": -24.384580612182617, "global_step": 210182, "epoch": 2532} {"train_loss": -24.34669303894043, "global_step": 210183, "epoch": 2532} {"train_loss": -24.312458038330078, "global_step": 210184, "epoch": 2532} {"train_loss": -24.586942672729492, "global_step": 210185, "epoch": 2532} {"train_loss": -24.540681838989258, "global_step": 210186, "epoch": 2532} {"train_loss": -24.49580192565918, "global_step": 210187, "epoch": 2532} {"train_loss": -24.549951553344727, "global_step": 210188, "epoch": 2532} {"train_loss": -24.759851455688477, "global_step": 210189, "epoch": 2532} {"train_loss": -24.447826385498047, "global_step": 210190, "epoch": 2532} {"train_loss": -24.83623504638672, "global_step": 210191, "epoch": 2532} {"train_loss": -24.294986724853516, "global_step": 210192, "epoch": 2532} {"train_loss": -24.584121704101562, "global_step": 210193, "epoch": 2532} {"train_loss": -24.5131893157959, "global_step": 210194, "epoch": 2532} {"train_loss": -24.5625, "global_step": 210195, "epoch": 2532} {"train_loss": -24.664081573486328, "global_step": 210196, "epoch": 2532} {"train_loss": -24.465408325195312, "global_step": 210197, "epoch": 2532} {"train_loss": -24.61886215209961, "global_step": 210198, "epoch": 2532} {"train_loss": -24.86517333984375, "global_step": 210199, "epoch": 2532} {"train_loss": -24.399362564086914, "global_step": 210200, "epoch": 2532} {"train_loss": -24.25710105895996, "global_step": 210201, "epoch": 2532} {"train_loss": -24.5384578704834, "global_step": 210202, "epoch": 2532} {"train_loss": -24.456573486328125, "global_step": 210203, "epoch": 2532} {"train_loss": -24.53458595275879, "global_step": 210204, "epoch": 2532} {"train_loss": -24.59295654296875, "global_step": 210205, "epoch": 2532} {"train_loss": -24.212615966796875, "global_step": 210206, "epoch": 2532} {"train_loss": -24.504413604736328, "global_step": 210207, "epoch": 2532} {"train_loss": -24.483604431152344, "global_step": 210208, "epoch": 2532} {"train_loss": -24.25954818725586, "global_step": 210209, "epoch": 2532} {"train_loss": -23.94746208190918, "global_step": 210210, "epoch": 2532} {"train_loss": -24.01732635498047, "global_step": 210211, "epoch": 2532} {"train_loss": -23.962736129760742, "global_step": 210212, "epoch": 2532} {"train_loss": -23.994813919067383, "global_step": 210213, "epoch": 2532} {"train_loss": -23.702789306640625, "global_step": 210214, "epoch": 2532} {"train_loss": -24.354459762573242, "global_step": 210215, "epoch": 2532} {"train_loss": -24.29561424255371, "global_step": 210216, "epoch": 2532} {"train_loss": -23.990198135375977, "global_step": 210217, "epoch": 2532} {"train_loss": -23.96310806274414, "global_step": 210218, "epoch": 2532} {"train_loss": -23.90191078186035, "global_step": 210219, "epoch": 2532} {"train_loss": -24.4129638671875, "global_step": 210220, "epoch": 2532} {"train_loss": -24.483097076416016, "global_step": 210221, "epoch": 2532} {"train_loss": -24.40450668334961, "global_step": 210222, "epoch": 2532} {"train_loss": -24.37045669555664, "global_step": 210223, "epoch": 2532} {"train_loss": -24.190271377563477, "global_step": 210224, "epoch": 2532} {"train_loss": -24.9090518951416, "global_step": 210225, "epoch": 2532} {"train_loss": -24.74900245666504, "global_step": 210226, "epoch": 2532} {"train_loss": -24.477401733398438, "global_step": 210227, "epoch": 2532} {"train_loss": -24.408422470092773, "global_step": 210228, "epoch": 2532} {"train_loss": -24.958372116088867, "global_step": 210229, "epoch": 2532} {"train_loss": -24.73261833190918, "global_step": 210230, "epoch": 2532} {"train_loss": -24.671812057495117, "global_step": 210231, "epoch": 2532} {"train_loss": -24.530324935913086, "global_step": 210232, "epoch": 2532} {"train_loss": -24.60519790649414, "global_step": 210233, "epoch": 2532} {"train_loss": -24.481107711791992, "global_step": 210234, "epoch": 2532} {"train_loss": -24.125349044799805, "global_step": 210235, "epoch": 2532} {"train_loss": -24.620710372924805, "global_step": 210236, "epoch": 2532} {"train_loss": -24.594160079956055, "global_step": 210237, "epoch": 2532} {"train_loss": -24.356701563639813, "global_step": 210238, "epoch": 2532, "val_loss": 6576301.0} {"train_loss": -24.086278915405273, "global_step": 210239, "epoch": 2533} {"train_loss": -24.630685806274414, "global_step": 210240, "epoch": 2533} {"train_loss": -24.364967346191406, "global_step": 210241, "epoch": 2533} {"train_loss": -24.011075973510742, "global_step": 210242, "epoch": 2533} {"train_loss": -24.39724349975586, "global_step": 210243, "epoch": 2533} {"train_loss": -23.765289306640625, "global_step": 210244, "epoch": 2533} {"train_loss": -24.21799659729004, "global_step": 210245, "epoch": 2533} {"train_loss": -24.371137619018555, "global_step": 210246, "epoch": 2533} {"train_loss": -24.2445011138916, "global_step": 210247, "epoch": 2533} {"train_loss": -23.955461502075195, "global_step": 210248, "epoch": 2533} {"train_loss": -24.400676727294922, "global_step": 210249, "epoch": 2533} {"train_loss": -24.682453155517578, "global_step": 210250, "epoch": 2533} {"train_loss": -24.61184310913086, "global_step": 210251, "epoch": 2533} {"train_loss": -24.11720085144043, "global_step": 210252, "epoch": 2533} {"train_loss": -23.72037124633789, "global_step": 210253, "epoch": 2533} {"train_loss": -24.5465087890625, "global_step": 210254, "epoch": 2533} {"train_loss": -24.516250610351562, "global_step": 210255, "epoch": 2533} {"train_loss": -24.41340446472168, "global_step": 210256, "epoch": 2533} {"train_loss": -24.437591552734375, "global_step": 210257, "epoch": 2533} {"train_loss": -24.387638092041016, "global_step": 210258, "epoch": 2533} {"train_loss": -24.208646774291992, "global_step": 210259, "epoch": 2533} {"train_loss": -24.1854305267334, "global_step": 210260, "epoch": 2533} {"train_loss": -24.42488670349121, "global_step": 210261, "epoch": 2533} {"train_loss": -24.070295333862305, "global_step": 210262, "epoch": 2533} {"train_loss": -24.409082412719727, "global_step": 210263, "epoch": 2533} {"train_loss": -24.113473892211914, "global_step": 210264, "epoch": 2533} {"train_loss": -24.588239669799805, "global_step": 210265, "epoch": 2533} {"train_loss": -24.49102020263672, "global_step": 210266, "epoch": 2533} {"train_loss": -24.41741180419922, "global_step": 210267, "epoch": 2533} {"train_loss": -24.42026138305664, "global_step": 210268, "epoch": 2533} {"train_loss": -24.145795822143555, "global_step": 210269, "epoch": 2533} {"train_loss": -24.30314064025879, "global_step": 210270, "epoch": 2533} {"train_loss": -23.93330955505371, "global_step": 210271, "epoch": 2533} {"train_loss": -24.12257194519043, "global_step": 210272, "epoch": 2533} {"train_loss": -24.535375595092773, "global_step": 210273, "epoch": 2533} {"train_loss": -24.143651962280273, "global_step": 210274, "epoch": 2533} {"train_loss": -24.156951904296875, "global_step": 210275, "epoch": 2533} {"train_loss": -24.674802780151367, "global_step": 210276, "epoch": 2533} {"train_loss": -24.334415435791016, "global_step": 210277, "epoch": 2533} {"train_loss": -23.759531021118164, "global_step": 210278, "epoch": 2533} {"train_loss": -24.13887596130371, "global_step": 210279, "epoch": 2533} {"train_loss": -24.270732879638672, "global_step": 210280, "epoch": 2533} {"train_loss": -24.72947120666504, "global_step": 210281, "epoch": 2533} {"train_loss": -24.232723236083984, "global_step": 210282, "epoch": 2533} {"train_loss": -24.257471084594727, "global_step": 210283, "epoch": 2533} {"train_loss": -24.310888290405273, "global_step": 210284, "epoch": 2533} {"train_loss": -24.19172477722168, "global_step": 210285, "epoch": 2533} {"train_loss": -24.606863021850586, "global_step": 210286, "epoch": 2533} {"train_loss": -24.48646354675293, "global_step": 210287, "epoch": 2533} {"train_loss": -24.259214401245117, "global_step": 210288, "epoch": 2533} {"train_loss": -24.407358169555664, "global_step": 210289, "epoch": 2533} {"train_loss": -24.680055618286133, "global_step": 210290, "epoch": 2533} {"train_loss": -24.427858352661133, "global_step": 210291, "epoch": 2533} {"train_loss": -24.35072898864746, "global_step": 210292, "epoch": 2533} {"train_loss": -24.206018447875977, "global_step": 210293, "epoch": 2533} {"train_loss": -24.05678367614746, "global_step": 210294, "epoch": 2533} {"train_loss": -24.209266662597656, "global_step": 210295, "epoch": 2533} {"train_loss": -24.182308197021484, "global_step": 210296, "epoch": 2533} {"train_loss": -24.56733512878418, "global_step": 210297, "epoch": 2533} {"train_loss": -24.35738182067871, "global_step": 210298, "epoch": 2533} {"train_loss": -24.52931785583496, "global_step": 210299, "epoch": 2533} {"train_loss": -24.109577178955078, "global_step": 210300, "epoch": 2533} {"train_loss": -24.4388484954834, "global_step": 210301, "epoch": 2533} {"train_loss": -23.91420555114746, "global_step": 210302, "epoch": 2533} {"train_loss": -24.522443771362305, "global_step": 210303, "epoch": 2533} {"train_loss": -24.079824447631836, "global_step": 210304, "epoch": 2533} {"train_loss": -24.47469711303711, "global_step": 210305, "epoch": 2533} {"train_loss": -24.283597946166992, "global_step": 210306, "epoch": 2533} {"train_loss": -24.269453048706055, "global_step": 210307, "epoch": 2533} {"train_loss": -24.725845336914062, "global_step": 210308, "epoch": 2533} {"train_loss": -24.558937072753906, "global_step": 210309, "epoch": 2533} {"train_loss": -24.08986473083496, "global_step": 210310, "epoch": 2533} {"train_loss": -24.485544204711914, "global_step": 210311, "epoch": 2533} {"train_loss": -24.37914276123047, "global_step": 210312, "epoch": 2533} {"train_loss": -24.20987892150879, "global_step": 210313, "epoch": 2533} {"train_loss": -24.49690055847168, "global_step": 210314, "epoch": 2533} {"train_loss": -24.329376220703125, "global_step": 210315, "epoch": 2533} {"train_loss": -24.060211181640625, "global_step": 210316, "epoch": 2533} {"train_loss": -24.177886962890625, "global_step": 210317, "epoch": 2533} {"train_loss": -24.46510887145996, "global_step": 210318, "epoch": 2533} {"train_loss": -24.517927169799805, "global_step": 210319, "epoch": 2533} {"train_loss": -24.452260971069336, "global_step": 210320, "epoch": 2533} {"train_loss": -24.312297338462738, "global_step": 210321, "epoch": 2533, "val_loss": 6652707.0} {"train_loss": -23.54400634765625, "global_step": 210322, "epoch": 2534} {"train_loss": -22.85684585571289, "global_step": 210323, "epoch": 2534} {"train_loss": -21.80570411682129, "global_step": 210324, "epoch": 2534} {"train_loss": -23.543712615966797, "global_step": 210325, "epoch": 2534} {"train_loss": -22.743824005126953, "global_step": 210326, "epoch": 2534} {"train_loss": -23.735851287841797, "global_step": 210327, "epoch": 2534} {"train_loss": -23.77254295349121, "global_step": 210328, "epoch": 2534} {"train_loss": -23.514699935913086, "global_step": 210329, "epoch": 2534} {"train_loss": -23.69819450378418, "global_step": 210330, "epoch": 2534} {"train_loss": -23.58820343017578, "global_step": 210331, "epoch": 2534} {"train_loss": -23.226179122924805, "global_step": 210332, "epoch": 2534} {"train_loss": -23.80048179626465, "global_step": 210333, "epoch": 2534} {"train_loss": -23.323423385620117, "global_step": 210334, "epoch": 2534} {"train_loss": -23.91938591003418, "global_step": 210335, "epoch": 2534} {"train_loss": -23.66886329650879, "global_step": 210336, "epoch": 2534} {"train_loss": -24.0320987701416, "global_step": 210337, "epoch": 2534} {"train_loss": -23.557050704956055, "global_step": 210338, "epoch": 2534} {"train_loss": -23.545743942260742, "global_step": 210339, "epoch": 2534} {"train_loss": -23.988534927368164, "global_step": 210340, "epoch": 2534} {"train_loss": -24.0290470123291, "global_step": 210341, "epoch": 2534} {"train_loss": -24.035131454467773, "global_step": 210342, "epoch": 2534} {"train_loss": -23.7954044342041, "global_step": 210343, "epoch": 2534} {"train_loss": -23.995807647705078, "global_step": 210344, "epoch": 2534} {"train_loss": -23.767547607421875, "global_step": 210345, "epoch": 2534} {"train_loss": -24.287277221679688, "global_step": 210346, "epoch": 2534} {"train_loss": -23.844755172729492, "global_step": 210347, "epoch": 2534} {"train_loss": -23.838937759399414, "global_step": 210348, "epoch": 2534} {"train_loss": -23.951974868774414, "global_step": 210349, "epoch": 2534} {"train_loss": -24.107868194580078, "global_step": 210350, "epoch": 2534} {"train_loss": -24.31549072265625, "global_step": 210351, "epoch": 2534} {"train_loss": -24.033954620361328, "global_step": 210352, "epoch": 2534} {"train_loss": -24.46954917907715, "global_step": 210353, "epoch": 2534} {"train_loss": -24.041231155395508, "global_step": 210354, "epoch": 2534} {"train_loss": -23.996065139770508, "global_step": 210355, "epoch": 2534} {"train_loss": -24.340436935424805, "global_step": 210356, "epoch": 2534} {"train_loss": -24.088132858276367, "global_step": 210357, "epoch": 2534} {"train_loss": -24.393573760986328, "global_step": 210358, "epoch": 2534} {"train_loss": -24.31403160095215, "global_step": 210359, "epoch": 2534} {"train_loss": -24.185516357421875, "global_step": 210360, "epoch": 2534} {"train_loss": -24.575809478759766, "global_step": 210361, "epoch": 2534} {"train_loss": -24.433433532714844, "global_step": 210362, "epoch": 2534} {"train_loss": -24.26193618774414, "global_step": 210363, "epoch": 2534} {"train_loss": -24.372217178344727, "global_step": 210364, "epoch": 2534} {"train_loss": -24.344600677490234, "global_step": 210365, "epoch": 2534} {"train_loss": -24.40169334411621, "global_step": 210366, "epoch": 2534} {"train_loss": -24.414276123046875, "global_step": 210367, "epoch": 2534} {"train_loss": -24.3530330657959, "global_step": 210368, "epoch": 2534} {"train_loss": -24.45066261291504, "global_step": 210369, "epoch": 2534} {"train_loss": -24.925769805908203, "global_step": 210370, "epoch": 2534} {"train_loss": -24.37550163269043, "global_step": 210371, "epoch": 2534} {"train_loss": -24.36049461364746, "global_step": 210372, "epoch": 2534} {"train_loss": -24.996761322021484, "global_step": 210373, "epoch": 2534} {"train_loss": -24.59429359436035, "global_step": 210374, "epoch": 2534} {"train_loss": -24.301294326782227, "global_step": 210375, "epoch": 2534} {"train_loss": -24.227863311767578, "global_step": 210376, "epoch": 2534} {"train_loss": -24.479595184326172, "global_step": 210377, "epoch": 2534} {"train_loss": -24.27734375, "global_step": 210378, "epoch": 2534} {"train_loss": -24.516984939575195, "global_step": 210379, "epoch": 2534} {"train_loss": -24.696460723876953, "global_step": 210380, "epoch": 2534} {"train_loss": -24.643951416015625, "global_step": 210381, "epoch": 2534} {"train_loss": -24.46088981628418, "global_step": 210382, "epoch": 2534} {"train_loss": -24.28822898864746, "global_step": 210383, "epoch": 2534} {"train_loss": -24.52243423461914, "global_step": 210384, "epoch": 2534} {"train_loss": -24.945743560791016, "global_step": 210385, "epoch": 2534} {"train_loss": -24.643163681030273, "global_step": 210386, "epoch": 2534} {"train_loss": -24.609533309936523, "global_step": 210387, "epoch": 2534} {"train_loss": -24.71742057800293, "global_step": 210388, "epoch": 2534} {"train_loss": -24.597341537475586, "global_step": 210389, "epoch": 2534} {"train_loss": -24.62408447265625, "global_step": 210390, "epoch": 2534} {"train_loss": -24.49672508239746, "global_step": 210391, "epoch": 2534} {"train_loss": -24.668682098388672, "global_step": 210392, "epoch": 2534} {"train_loss": -24.320077896118164, "global_step": 210393, "epoch": 2534} {"train_loss": -24.709793090820312, "global_step": 210394, "epoch": 2534} {"train_loss": -24.60575294494629, "global_step": 210395, "epoch": 2534} {"train_loss": -24.470659255981445, "global_step": 210396, "epoch": 2534} {"train_loss": -24.445764541625977, "global_step": 210397, "epoch": 2534} {"train_loss": -24.580923080444336, "global_step": 210398, "epoch": 2534} {"train_loss": -24.661375045776367, "global_step": 210399, "epoch": 2534} {"train_loss": -24.54401969909668, "global_step": 210400, "epoch": 2534} {"train_loss": -24.27005958557129, "global_step": 210401, "epoch": 2534} {"train_loss": -24.890544891357422, "global_step": 210402, "epoch": 2534} {"train_loss": -24.297428131103516, "global_step": 210403, "epoch": 2534} {"train_loss": -24.169450070484576, "global_step": 210404, "epoch": 2534, "val_loss": 6730844.0} {"train_loss": -23.724891662597656, "global_step": 210405, "epoch": 2535} {"train_loss": -23.888002395629883, "global_step": 210406, "epoch": 2535} {"train_loss": -23.80925941467285, "global_step": 210407, "epoch": 2535} {"train_loss": -23.879552841186523, "global_step": 210408, "epoch": 2535} {"train_loss": -23.96533203125, "global_step": 210409, "epoch": 2535} {"train_loss": -24.007017135620117, "global_step": 210410, "epoch": 2535} {"train_loss": -24.23919677734375, "global_step": 210411, "epoch": 2535} {"train_loss": -24.3585147857666, "global_step": 210412, "epoch": 2535} {"train_loss": -23.838911056518555, "global_step": 210413, "epoch": 2535} {"train_loss": -24.22466468811035, "global_step": 210414, "epoch": 2535} {"train_loss": -24.1446590423584, "global_step": 210415, "epoch": 2535} {"train_loss": -23.91168975830078, "global_step": 210416, "epoch": 2535} {"train_loss": -24.33405113220215, "global_step": 210417, "epoch": 2535} {"train_loss": -24.179473876953125, "global_step": 210418, "epoch": 2535} {"train_loss": -23.840381622314453, "global_step": 210419, "epoch": 2535} {"train_loss": -24.297025680541992, "global_step": 210420, "epoch": 2535} {"train_loss": -24.236652374267578, "global_step": 210421, "epoch": 2535} {"train_loss": -24.32647132873535, "global_step": 210422, "epoch": 2535} {"train_loss": -24.053247451782227, "global_step": 210423, "epoch": 2535} {"train_loss": -24.43534278869629, "global_step": 210424, "epoch": 2535} {"train_loss": -24.024639129638672, "global_step": 210425, "epoch": 2535} {"train_loss": -24.187667846679688, "global_step": 210426, "epoch": 2535} {"train_loss": -24.192901611328125, "global_step": 210427, "epoch": 2535} {"train_loss": -24.223533630371094, "global_step": 210428, "epoch": 2535} {"train_loss": -24.41634178161621, "global_step": 210429, "epoch": 2535} {"train_loss": -24.369897842407227, "global_step": 210430, "epoch": 2535} {"train_loss": -24.52248191833496, "global_step": 210431, "epoch": 2535} {"train_loss": -24.457462310791016, "global_step": 210432, "epoch": 2535} {"train_loss": -24.314401626586914, "global_step": 210433, "epoch": 2535} {"train_loss": -24.501983642578125, "global_step": 210434, "epoch": 2535} {"train_loss": -24.434938430786133, "global_step": 210435, "epoch": 2535} {"train_loss": -24.26088523864746, "global_step": 210436, "epoch": 2535} {"train_loss": -24.559789657592773, "global_step": 210437, "epoch": 2535} {"train_loss": -24.647235870361328, "global_step": 210438, "epoch": 2535} {"train_loss": -24.142038345336914, "global_step": 210439, "epoch": 2535} {"train_loss": -24.692739486694336, "global_step": 210440, "epoch": 2535} {"train_loss": -24.831327438354492, "global_step": 210441, "epoch": 2535} {"train_loss": -24.307279586791992, "global_step": 210442, "epoch": 2535} {"train_loss": -24.267562866210938, "global_step": 210443, "epoch": 2535} {"train_loss": -24.120357513427734, "global_step": 210444, "epoch": 2535} {"train_loss": -24.504138946533203, "global_step": 210445, "epoch": 2535} {"train_loss": -24.7058162689209, "global_step": 210446, "epoch": 2535} {"train_loss": -24.61213493347168, "global_step": 210447, "epoch": 2535} {"train_loss": -24.408891677856445, "global_step": 210448, "epoch": 2535} {"train_loss": -24.657821655273438, "global_step": 210449, "epoch": 2535} {"train_loss": -24.403377532958984, "global_step": 210450, "epoch": 2535} {"train_loss": -24.351587295532227, "global_step": 210451, "epoch": 2535} {"train_loss": -23.756776809692383, "global_step": 210452, "epoch": 2535} {"train_loss": -24.143953323364258, "global_step": 210453, "epoch": 2535} {"train_loss": -24.621780395507812, "global_step": 210454, "epoch": 2535} {"train_loss": -24.417959213256836, "global_step": 210455, "epoch": 2535} {"train_loss": -24.107894897460938, "global_step": 210456, "epoch": 2535} {"train_loss": -24.433807373046875, "global_step": 210457, "epoch": 2535} {"train_loss": -24.43573570251465, "global_step": 210458, "epoch": 2535} {"train_loss": -24.800134658813477, "global_step": 210459, "epoch": 2535} {"train_loss": -24.24709129333496, "global_step": 210460, "epoch": 2535} {"train_loss": -24.622663497924805, "global_step": 210461, "epoch": 2535} {"train_loss": -24.053592681884766, "global_step": 210462, "epoch": 2535} {"train_loss": -24.34440040588379, "global_step": 210463, "epoch": 2535} {"train_loss": -24.55984878540039, "global_step": 210464, "epoch": 2535} {"train_loss": -24.485742568969727, "global_step": 210465, "epoch": 2535} {"train_loss": -24.310035705566406, "global_step": 210466, "epoch": 2535} {"train_loss": -24.411733627319336, "global_step": 210467, "epoch": 2535} {"train_loss": -24.087081909179688, "global_step": 210468, "epoch": 2535} {"train_loss": -24.131484985351562, "global_step": 210469, "epoch": 2535} {"train_loss": -24.56912612915039, "global_step": 210470, "epoch": 2535} {"train_loss": -24.470611572265625, "global_step": 210471, "epoch": 2535} {"train_loss": -24.869749069213867, "global_step": 210472, "epoch": 2535} {"train_loss": -24.479700088500977, "global_step": 210473, "epoch": 2535} {"train_loss": -24.2861328125, "global_step": 210474, "epoch": 2535} {"train_loss": -24.678319931030273, "global_step": 210475, "epoch": 2535} {"train_loss": -24.653600692749023, "global_step": 210476, "epoch": 2535} {"train_loss": -24.229442596435547, "global_step": 210477, "epoch": 2535} {"train_loss": -24.38728141784668, "global_step": 210478, "epoch": 2535} {"train_loss": -24.420923233032227, "global_step": 210479, "epoch": 2535} {"train_loss": -24.36707878112793, "global_step": 210480, "epoch": 2535} {"train_loss": -24.037643432617188, "global_step": 210481, "epoch": 2535} {"train_loss": -24.408926010131836, "global_step": 210482, "epoch": 2535} {"train_loss": -24.108474731445312, "global_step": 210483, "epoch": 2535} {"train_loss": -24.257532119750977, "global_step": 210484, "epoch": 2535} {"train_loss": -24.55167579650879, "global_step": 210485, "epoch": 2535} {"train_loss": -24.1757869720459, "global_step": 210486, "epoch": 2535} {"train_loss": -24.31018967226327, "global_step": 210487, "epoch": 2535, "val_loss": 6675269.5} {"train_loss": -24.034975051879883, "global_step": 210488, "epoch": 2536} {"train_loss": -24.310638427734375, "global_step": 210489, "epoch": 2536} {"train_loss": -24.579978942871094, "global_step": 210490, "epoch": 2536} {"train_loss": -24.35296058654785, "global_step": 210491, "epoch": 2536} {"train_loss": -24.384775161743164, "global_step": 210492, "epoch": 2536} {"train_loss": -24.190509796142578, "global_step": 210493, "epoch": 2536} {"train_loss": -24.5257625579834, "global_step": 210494, "epoch": 2536} {"train_loss": -23.95775032043457, "global_step": 210495, "epoch": 2536} {"train_loss": -24.357990264892578, "global_step": 210496, "epoch": 2536} {"train_loss": -24.190174102783203, "global_step": 210497, "epoch": 2536} {"train_loss": -24.029483795166016, "global_step": 210498, "epoch": 2536} {"train_loss": -24.140457153320312, "global_step": 210499, "epoch": 2536} {"train_loss": -24.47233009338379, "global_step": 210500, "epoch": 2536} {"train_loss": -24.12830924987793, "global_step": 210501, "epoch": 2536} {"train_loss": -24.233373641967773, "global_step": 210502, "epoch": 2536} {"train_loss": -24.238359451293945, "global_step": 210503, "epoch": 2536} {"train_loss": -24.30335235595703, "global_step": 210504, "epoch": 2536} {"train_loss": -24.12330436706543, "global_step": 210505, "epoch": 2536} {"train_loss": -24.09469985961914, "global_step": 210506, "epoch": 2536} {"train_loss": -24.21938133239746, "global_step": 210507, "epoch": 2536} {"train_loss": -23.81439781188965, "global_step": 210508, "epoch": 2536} {"train_loss": -24.083961486816406, "global_step": 210509, "epoch": 2536} {"train_loss": -24.391315460205078, "global_step": 210510, "epoch": 2536} {"train_loss": -23.903039932250977, "global_step": 210511, "epoch": 2536} {"train_loss": -24.489267349243164, "global_step": 210512, "epoch": 2536} {"train_loss": -24.53654670715332, "global_step": 210513, "epoch": 2536} {"train_loss": -24.520780563354492, "global_step": 210514, "epoch": 2536} {"train_loss": -24.240055084228516, "global_step": 210515, "epoch": 2536} {"train_loss": -24.411060333251953, "global_step": 210516, "epoch": 2536} {"train_loss": -24.50015640258789, "global_step": 210517, "epoch": 2536} {"train_loss": -24.35544204711914, "global_step": 210518, "epoch": 2536} {"train_loss": -24.47554588317871, "global_step": 210519, "epoch": 2536} {"train_loss": -24.665725708007812, "global_step": 210520, "epoch": 2536} {"train_loss": -24.157459259033203, "global_step": 210521, "epoch": 2536} {"train_loss": -24.62747573852539, "global_step": 210522, "epoch": 2536} {"train_loss": -24.29800033569336, "global_step": 210523, "epoch": 2536} {"train_loss": -24.060842514038086, "global_step": 210524, "epoch": 2536} {"train_loss": -24.674461364746094, "global_step": 210525, "epoch": 2536} {"train_loss": -24.002601623535156, "global_step": 210526, "epoch": 2536} {"train_loss": -24.253643035888672, "global_step": 210527, "epoch": 2536} {"train_loss": -24.183063507080078, "global_step": 210528, "epoch": 2536} {"train_loss": -24.732316970825195, "global_step": 210529, "epoch": 2536} {"train_loss": -24.60733985900879, "global_step": 210530, "epoch": 2536} {"train_loss": -24.364017486572266, "global_step": 210531, "epoch": 2536} {"train_loss": -24.557357788085938, "global_step": 210532, "epoch": 2536} {"train_loss": -24.33909797668457, "global_step": 210533, "epoch": 2536} {"train_loss": -24.485599517822266, "global_step": 210534, "epoch": 2536} {"train_loss": -24.43547248840332, "global_step": 210535, "epoch": 2536} {"train_loss": -24.32440757751465, "global_step": 210536, "epoch": 2536} {"train_loss": -24.15460777282715, "global_step": 210537, "epoch": 2536} {"train_loss": -24.146804809570312, "global_step": 210538, "epoch": 2536} {"train_loss": -24.40220832824707, "global_step": 210539, "epoch": 2536} {"train_loss": -24.276100158691406, "global_step": 210540, "epoch": 2536} {"train_loss": -24.244022369384766, "global_step": 210541, "epoch": 2536} {"train_loss": -24.431577682495117, "global_step": 210542, "epoch": 2536} {"train_loss": -24.47200584411621, "global_step": 210543, "epoch": 2536} {"train_loss": -24.17262840270996, "global_step": 210544, "epoch": 2536} {"train_loss": -24.096424102783203, "global_step": 210545, "epoch": 2536} {"train_loss": -24.422040939331055, "global_step": 210546, "epoch": 2536} {"train_loss": -24.307748794555664, "global_step": 210547, "epoch": 2536} {"train_loss": -24.500093460083008, "global_step": 210548, "epoch": 2536} {"train_loss": -24.478979110717773, "global_step": 210549, "epoch": 2536} {"train_loss": -24.647706985473633, "global_step": 210550, "epoch": 2536} {"train_loss": -24.3227481842041, "global_step": 210551, "epoch": 2536} {"train_loss": -24.326040267944336, "global_step": 210552, "epoch": 2536} {"train_loss": -24.243886947631836, "global_step": 210553, "epoch": 2536} {"train_loss": -24.511167526245117, "global_step": 210554, "epoch": 2536} {"train_loss": -24.753910064697266, "global_step": 210555, "epoch": 2536} {"train_loss": -24.397262573242188, "global_step": 210556, "epoch": 2536} {"train_loss": -24.389083862304688, "global_step": 210557, "epoch": 2536} {"train_loss": -24.584375381469727, "global_step": 210558, "epoch": 2536} {"train_loss": -24.591684341430664, "global_step": 210559, "epoch": 2536} {"train_loss": -24.429758071899414, "global_step": 210560, "epoch": 2536} {"train_loss": -24.459943771362305, "global_step": 210561, "epoch": 2536} {"train_loss": -24.601518630981445, "global_step": 210562, "epoch": 2536} {"train_loss": -24.41413688659668, "global_step": 210563, "epoch": 2536} {"train_loss": -24.287717819213867, "global_step": 210564, "epoch": 2536} {"train_loss": -24.34228515625, "global_step": 210565, "epoch": 2536} {"train_loss": -24.306272506713867, "global_step": 210566, "epoch": 2536} {"train_loss": -24.876493453979492, "global_step": 210567, "epoch": 2536} {"train_loss": -24.441354751586914, "global_step": 210568, "epoch": 2536} {"train_loss": -24.384592056274414, "global_step": 210569, "epoch": 2536} {"train_loss": -24.351969707443054, "global_step": 210570, "epoch": 2536, "val_loss": 6715139.0} {"train_loss": -24.155353546142578, "global_step": 210571, "epoch": 2537} {"train_loss": -24.04837417602539, "global_step": 210572, "epoch": 2537} {"train_loss": -24.200525283813477, "global_step": 210573, "epoch": 2537} {"train_loss": -24.10184669494629, "global_step": 210574, "epoch": 2537} {"train_loss": -23.77882194519043, "global_step": 210575, "epoch": 2537} {"train_loss": -24.48981285095215, "global_step": 210576, "epoch": 2537} {"train_loss": -23.897199630737305, "global_step": 210577, "epoch": 2537} {"train_loss": -24.332792282104492, "global_step": 210578, "epoch": 2537} {"train_loss": -24.49689292907715, "global_step": 210579, "epoch": 2537} {"train_loss": -24.284242630004883, "global_step": 210580, "epoch": 2537} {"train_loss": -24.182912826538086, "global_step": 210581, "epoch": 2537} {"train_loss": -24.595478057861328, "global_step": 210582, "epoch": 2537} {"train_loss": -24.431020736694336, "global_step": 210583, "epoch": 2537} {"train_loss": -24.32135009765625, "global_step": 210584, "epoch": 2537} {"train_loss": -24.30514144897461, "global_step": 210585, "epoch": 2537} {"train_loss": -24.824554443359375, "global_step": 210586, "epoch": 2537} {"train_loss": -24.665504455566406, "global_step": 210587, "epoch": 2537} {"train_loss": -24.434467315673828, "global_step": 210588, "epoch": 2537} {"train_loss": -24.17753028869629, "global_step": 210589, "epoch": 2537} {"train_loss": -24.775623321533203, "global_step": 210590, "epoch": 2537} {"train_loss": -24.444564819335938, "global_step": 210591, "epoch": 2537} {"train_loss": -24.194910049438477, "global_step": 210592, "epoch": 2537} {"train_loss": -24.404388427734375, "global_step": 210593, "epoch": 2537} {"train_loss": -24.5217342376709, "global_step": 210594, "epoch": 2537} {"train_loss": -24.673946380615234, "global_step": 210595, "epoch": 2537} {"train_loss": -24.597305297851562, "global_step": 210596, "epoch": 2537} {"train_loss": -24.507131576538086, "global_step": 210597, "epoch": 2537} {"train_loss": -24.319021224975586, "global_step": 210598, "epoch": 2537} {"train_loss": -24.45279884338379, "global_step": 210599, "epoch": 2537} {"train_loss": -24.44351577758789, "global_step": 210600, "epoch": 2537} {"train_loss": -24.593097686767578, "global_step": 210601, "epoch": 2537} {"train_loss": -24.36370086669922, "global_step": 210602, "epoch": 2537} {"train_loss": -24.558130264282227, "global_step": 210603, "epoch": 2537} {"train_loss": -24.66929054260254, "global_step": 210604, "epoch": 2537} {"train_loss": -24.882600784301758, "global_step": 210605, "epoch": 2537} {"train_loss": -24.395715713500977, "global_step": 210606, "epoch": 2537} {"train_loss": -24.295541763305664, "global_step": 210607, "epoch": 2537} {"train_loss": -24.5263729095459, "global_step": 210608, "epoch": 2537} {"train_loss": -24.085647583007812, "global_step": 210609, "epoch": 2537} {"train_loss": -23.68802833557129, "global_step": 210610, "epoch": 2537} {"train_loss": -23.947805404663086, "global_step": 210611, "epoch": 2537} {"train_loss": -24.06486701965332, "global_step": 210612, "epoch": 2537} {"train_loss": -24.287315368652344, "global_step": 210613, "epoch": 2537} {"train_loss": -24.162338256835938, "global_step": 210614, "epoch": 2537} {"train_loss": -24.163660049438477, "global_step": 210615, "epoch": 2537} {"train_loss": -24.559314727783203, "global_step": 210616, "epoch": 2537} {"train_loss": -24.200342178344727, "global_step": 210617, "epoch": 2537} {"train_loss": -24.187395095825195, "global_step": 210618, "epoch": 2537} {"train_loss": -24.3155517578125, "global_step": 210619, "epoch": 2537} {"train_loss": -23.865577697753906, "global_step": 210620, "epoch": 2537} {"train_loss": -24.15627098083496, "global_step": 210621, "epoch": 2537} {"train_loss": -24.17374038696289, "global_step": 210622, "epoch": 2537} {"train_loss": -24.313955307006836, "global_step": 210623, "epoch": 2537} {"train_loss": -24.28124237060547, "global_step": 210624, "epoch": 2537} {"train_loss": -24.849729537963867, "global_step": 210625, "epoch": 2537} {"train_loss": -24.334264755249023, "global_step": 210626, "epoch": 2537} {"train_loss": -24.483442306518555, "global_step": 210627, "epoch": 2537} {"train_loss": -24.70940399169922, "global_step": 210628, "epoch": 2537} {"train_loss": -24.67889976501465, "global_step": 210629, "epoch": 2537} {"train_loss": -24.223081588745117, "global_step": 210630, "epoch": 2537} {"train_loss": -24.492244720458984, "global_step": 210631, "epoch": 2537} {"train_loss": -24.683931350708008, "global_step": 210632, "epoch": 2537} {"train_loss": -24.332250595092773, "global_step": 210633, "epoch": 2537} {"train_loss": -24.47893714904785, "global_step": 210634, "epoch": 2537} {"train_loss": -24.093015670776367, "global_step": 210635, "epoch": 2537} {"train_loss": -24.58700180053711, "global_step": 210636, "epoch": 2537} {"train_loss": -24.601242065429688, "global_step": 210637, "epoch": 2537} {"train_loss": -24.6519775390625, "global_step": 210638, "epoch": 2537} {"train_loss": -24.776639938354492, "global_step": 210639, "epoch": 2537} {"train_loss": -24.716550827026367, "global_step": 210640, "epoch": 2537} {"train_loss": -24.592456817626953, "global_step": 210641, "epoch": 2537} {"train_loss": -24.23291015625, "global_step": 210642, "epoch": 2537} {"train_loss": -24.24503517150879, "global_step": 210643, "epoch": 2537} {"train_loss": -24.783926010131836, "global_step": 210644, "epoch": 2537} {"train_loss": -24.64995002746582, "global_step": 210645, "epoch": 2537} {"train_loss": -24.3973445892334, "global_step": 210646, "epoch": 2537} {"train_loss": -24.624906539916992, "global_step": 210647, "epoch": 2537} {"train_loss": -24.717397689819336, "global_step": 210648, "epoch": 2537} {"train_loss": -24.784006118774414, "global_step": 210649, "epoch": 2537} {"train_loss": -24.627182006835938, "global_step": 210650, "epoch": 2537} {"train_loss": -24.803842544555664, "global_step": 210651, "epoch": 2537} {"train_loss": -24.410764694213867, "global_step": 210652, "epoch": 2537} {"train_loss": -24.427319974784393, "global_step": 210653, "epoch": 2537, "val_loss": 6693089.0} {"train_loss": -22.791990280151367, "global_step": 210654, "epoch": 2538} {"train_loss": -20.875333786010742, "global_step": 210655, "epoch": 2538} {"train_loss": -20.634912490844727, "global_step": 210656, "epoch": 2538} {"train_loss": -23.537343978881836, "global_step": 210657, "epoch": 2538} {"train_loss": -23.53635025024414, "global_step": 210658, "epoch": 2538} {"train_loss": -23.49974250793457, "global_step": 210659, "epoch": 2538} {"train_loss": -23.271169662475586, "global_step": 210660, "epoch": 2538} {"train_loss": -23.82925796508789, "global_step": 210661, "epoch": 2538} {"train_loss": -23.84471893310547, "global_step": 210662, "epoch": 2538} {"train_loss": -23.97285270690918, "global_step": 210663, "epoch": 2538} {"train_loss": -23.8297176361084, "global_step": 210664, "epoch": 2538} {"train_loss": -23.751005172729492, "global_step": 210665, "epoch": 2538} {"train_loss": -23.915258407592773, "global_step": 210666, "epoch": 2538} {"train_loss": -23.89571189880371, "global_step": 210667, "epoch": 2538} {"train_loss": -23.84377098083496, "global_step": 210668, "epoch": 2538} {"train_loss": -23.81583023071289, "global_step": 210669, "epoch": 2538} {"train_loss": -23.807058334350586, "global_step": 210670, "epoch": 2538} {"train_loss": -23.836429595947266, "global_step": 210671, "epoch": 2538} {"train_loss": -24.0544490814209, "global_step": 210672, "epoch": 2538} {"train_loss": -24.060592651367188, "global_step": 210673, "epoch": 2538} {"train_loss": -23.88427734375, "global_step": 210674, "epoch": 2538} {"train_loss": -23.980831146240234, "global_step": 210675, "epoch": 2538} {"train_loss": -23.963634490966797, "global_step": 210676, "epoch": 2538} {"train_loss": -24.033422470092773, "global_step": 210677, "epoch": 2538} {"train_loss": -24.303653717041016, "global_step": 210678, "epoch": 2538} {"train_loss": -24.02227783203125, "global_step": 210679, "epoch": 2538} {"train_loss": -24.348854064941406, "global_step": 210680, "epoch": 2538} {"train_loss": -24.383424758911133, "global_step": 210681, "epoch": 2538} {"train_loss": -24.226232528686523, "global_step": 210682, "epoch": 2538} {"train_loss": -24.203266143798828, "global_step": 210683, "epoch": 2538} {"train_loss": -24.46982765197754, "global_step": 210684, "epoch": 2538} {"train_loss": -24.26714324951172, "global_step": 210685, "epoch": 2538} {"train_loss": -24.224199295043945, "global_step": 210686, "epoch": 2538} {"train_loss": -24.377355575561523, "global_step": 210687, "epoch": 2538} {"train_loss": -24.0113468170166, "global_step": 210688, "epoch": 2538} {"train_loss": -24.402454376220703, "global_step": 210689, "epoch": 2538} {"train_loss": -24.698883056640625, "global_step": 210690, "epoch": 2538} {"train_loss": -24.5507869720459, "global_step": 210691, "epoch": 2538} {"train_loss": -24.44187355041504, "global_step": 210692, "epoch": 2538} {"train_loss": -24.344430923461914, "global_step": 210693, "epoch": 2538} {"train_loss": -24.63227653503418, "global_step": 210694, "epoch": 2538} {"train_loss": -24.348876953125, "global_step": 210695, "epoch": 2538} {"train_loss": -24.075817108154297, "global_step": 210696, "epoch": 2538} {"train_loss": -24.491832733154297, "global_step": 210697, "epoch": 2538} {"train_loss": -24.84703254699707, "global_step": 210698, "epoch": 2538} {"train_loss": -24.37694549560547, "global_step": 210699, "epoch": 2538} {"train_loss": -24.31916618347168, "global_step": 210700, "epoch": 2538} {"train_loss": -24.880521774291992, "global_step": 210701, "epoch": 2538} {"train_loss": -24.32778549194336, "global_step": 210702, "epoch": 2538} {"train_loss": -24.63178062438965, "global_step": 210703, "epoch": 2538} {"train_loss": -24.123241424560547, "global_step": 210704, "epoch": 2538} {"train_loss": -24.305477142333984, "global_step": 210705, "epoch": 2538} {"train_loss": -24.583621978759766, "global_step": 210706, "epoch": 2538} {"train_loss": -24.29986572265625, "global_step": 210707, "epoch": 2538} {"train_loss": -24.45197868347168, "global_step": 210708, "epoch": 2538} {"train_loss": -24.452892303466797, "global_step": 210709, "epoch": 2538} {"train_loss": -24.422962188720703, "global_step": 210710, "epoch": 2538} {"train_loss": -24.140899658203125, "global_step": 210711, "epoch": 2538} {"train_loss": -24.3195858001709, "global_step": 210712, "epoch": 2538} {"train_loss": -24.53920555114746, "global_step": 210713, "epoch": 2538} {"train_loss": -24.608861923217773, "global_step": 210714, "epoch": 2538} {"train_loss": -24.468358993530273, "global_step": 210715, "epoch": 2538} {"train_loss": -24.605684280395508, "global_step": 210716, "epoch": 2538} {"train_loss": -24.378204345703125, "global_step": 210717, "epoch": 2538} {"train_loss": -24.042997360229492, "global_step": 210718, "epoch": 2538} {"train_loss": -24.239002227783203, "global_step": 210719, "epoch": 2538} {"train_loss": -24.553091049194336, "global_step": 210720, "epoch": 2538} {"train_loss": -24.49357032775879, "global_step": 210721, "epoch": 2538} {"train_loss": -24.615312576293945, "global_step": 210722, "epoch": 2538} {"train_loss": -24.534772872924805, "global_step": 210723, "epoch": 2538} {"train_loss": -24.617631912231445, "global_step": 210724, "epoch": 2538} {"train_loss": -24.725202560424805, "global_step": 210725, "epoch": 2538} {"train_loss": -24.618305206298828, "global_step": 210726, "epoch": 2538} {"train_loss": -24.852985382080078, "global_step": 210727, "epoch": 2538} {"train_loss": -24.452213287353516, "global_step": 210728, "epoch": 2538} {"train_loss": -24.74907684326172, "global_step": 210729, "epoch": 2538} {"train_loss": -24.41077995300293, "global_step": 210730, "epoch": 2538} {"train_loss": -24.241682052612305, "global_step": 210731, "epoch": 2538} {"train_loss": -24.37043571472168, "global_step": 210732, "epoch": 2538} {"train_loss": -24.532047271728516, "global_step": 210733, "epoch": 2538} {"train_loss": -24.586084365844727, "global_step": 210734, "epoch": 2538} {"train_loss": -24.526798248291016, "global_step": 210735, "epoch": 2538} {"train_loss": -24.15549333411527, "global_step": 210736, "epoch": 2538, "val_loss": 6593432.0} {"train_loss": -22.651927947998047, "global_step": 210737, "epoch": 2539} {"train_loss": -21.49308204650879, "global_step": 210738, "epoch": 2539} {"train_loss": -23.75168228149414, "global_step": 210739, "epoch": 2539} {"train_loss": -23.050058364868164, "global_step": 210740, "epoch": 2539} {"train_loss": -23.507583618164062, "global_step": 210741, "epoch": 2539} {"train_loss": -23.363920211791992, "global_step": 210742, "epoch": 2539} {"train_loss": -23.5599422454834, "global_step": 210743, "epoch": 2539} {"train_loss": -23.448993682861328, "global_step": 210744, "epoch": 2539} {"train_loss": -23.74676513671875, "global_step": 210745, "epoch": 2539} {"train_loss": -23.952835083007812, "global_step": 210746, "epoch": 2539} {"train_loss": -23.924928665161133, "global_step": 210747, "epoch": 2539} {"train_loss": -23.96595573425293, "global_step": 210748, "epoch": 2539} {"train_loss": -23.79224395751953, "global_step": 210749, "epoch": 2539} {"train_loss": -24.153806686401367, "global_step": 210750, "epoch": 2539} {"train_loss": -24.300989151000977, "global_step": 210751, "epoch": 2539} {"train_loss": -23.95000648498535, "global_step": 210752, "epoch": 2539} {"train_loss": -24.15834617614746, "global_step": 210753, "epoch": 2539} {"train_loss": -23.904895782470703, "global_step": 210754, "epoch": 2539} {"train_loss": -24.0242862701416, "global_step": 210755, "epoch": 2539} {"train_loss": -24.08547019958496, "global_step": 210756, "epoch": 2539} {"train_loss": -24.15517234802246, "global_step": 210757, "epoch": 2539} {"train_loss": -24.206228256225586, "global_step": 210758, "epoch": 2539} {"train_loss": -24.25406837463379, "global_step": 210759, "epoch": 2539} {"train_loss": -24.562963485717773, "global_step": 210760, "epoch": 2539} {"train_loss": -24.757410049438477, "global_step": 210761, "epoch": 2539} {"train_loss": -24.461820602416992, "global_step": 210762, "epoch": 2539} {"train_loss": -24.496875762939453, "global_step": 210763, "epoch": 2539} {"train_loss": -24.21868133544922, "global_step": 210764, "epoch": 2539} {"train_loss": -24.608165740966797, "global_step": 210765, "epoch": 2539} {"train_loss": -24.286880493164062, "global_step": 210766, "epoch": 2539} {"train_loss": -24.517486572265625, "global_step": 210767, "epoch": 2539} {"train_loss": -24.774765014648438, "global_step": 210768, "epoch": 2539} {"train_loss": -24.401426315307617, "global_step": 210769, "epoch": 2539} {"train_loss": -24.409465789794922, "global_step": 210770, "epoch": 2539} {"train_loss": -24.509632110595703, "global_step": 210771, "epoch": 2539} {"train_loss": -24.563322067260742, "global_step": 210772, "epoch": 2539} {"train_loss": -24.11574363708496, "global_step": 210773, "epoch": 2539} {"train_loss": -24.221654891967773, "global_step": 210774, "epoch": 2539} {"train_loss": -24.387954711914062, "global_step": 210775, "epoch": 2539} {"train_loss": -24.52813720703125, "global_step": 210776, "epoch": 2539} {"train_loss": -24.4287052154541, "global_step": 210777, "epoch": 2539} {"train_loss": -24.304838180541992, "global_step": 210778, "epoch": 2539} {"train_loss": -24.330480575561523, "global_step": 210779, "epoch": 2539} {"train_loss": -24.347646713256836, "global_step": 210780, "epoch": 2539} {"train_loss": -24.878398895263672, "global_step": 210781, "epoch": 2539} {"train_loss": -24.15460777282715, "global_step": 210782, "epoch": 2539} {"train_loss": -24.164657592773438, "global_step": 210783, "epoch": 2539} {"train_loss": -24.262283325195312, "global_step": 210784, "epoch": 2539} {"train_loss": -24.06631088256836, "global_step": 210785, "epoch": 2539} {"train_loss": -24.20657730102539, "global_step": 210786, "epoch": 2539} {"train_loss": -24.42456817626953, "global_step": 210787, "epoch": 2539} {"train_loss": -24.350332260131836, "global_step": 210788, "epoch": 2539} {"train_loss": -24.23292350769043, "global_step": 210789, "epoch": 2539} {"train_loss": -24.535852432250977, "global_step": 210790, "epoch": 2539} {"train_loss": -24.533254623413086, "global_step": 210791, "epoch": 2539} {"train_loss": -24.658254623413086, "global_step": 210792, "epoch": 2539} {"train_loss": -24.371566772460938, "global_step": 210793, "epoch": 2539} {"train_loss": -24.384815216064453, "global_step": 210794, "epoch": 2539} {"train_loss": -24.432743072509766, "global_step": 210795, "epoch": 2539} {"train_loss": -24.657041549682617, "global_step": 210796, "epoch": 2539} {"train_loss": -24.153480529785156, "global_step": 210797, "epoch": 2539} {"train_loss": -24.53008270263672, "global_step": 210798, "epoch": 2539} {"train_loss": -24.435840606689453, "global_step": 210799, "epoch": 2539} {"train_loss": -24.439603805541992, "global_step": 210800, "epoch": 2539} {"train_loss": -24.724180221557617, "global_step": 210801, "epoch": 2539} {"train_loss": -24.457901000976562, "global_step": 210802, "epoch": 2539} {"train_loss": -24.477445602416992, "global_step": 210803, "epoch": 2539} {"train_loss": -24.70743751525879, "global_step": 210804, "epoch": 2539} {"train_loss": -24.378934860229492, "global_step": 210805, "epoch": 2539} {"train_loss": -24.679594039916992, "global_step": 210806, "epoch": 2539} {"train_loss": -24.320322036743164, "global_step": 210807, "epoch": 2539} {"train_loss": -24.497098922729492, "global_step": 210808, "epoch": 2539} {"train_loss": -24.758642196655273, "global_step": 210809, "epoch": 2539} {"train_loss": -24.681320190429688, "global_step": 210810, "epoch": 2539} {"train_loss": -24.625244140625, "global_step": 210811, "epoch": 2539} {"train_loss": -24.562538146972656, "global_step": 210812, "epoch": 2539} {"train_loss": -24.350866317749023, "global_step": 210813, "epoch": 2539} {"train_loss": -24.541948318481445, "global_step": 210814, "epoch": 2539} {"train_loss": -24.427812576293945, "global_step": 210815, "epoch": 2539} {"train_loss": -24.533863067626953, "global_step": 210816, "epoch": 2539} {"train_loss": -24.200265884399414, "global_step": 210817, "epoch": 2539} {"train_loss": -24.516218185424805, "global_step": 210818, "epoch": 2539} {"train_loss": -24.241169136690807, "global_step": 210819, "epoch": 2539, "val_loss": 6587015.0} {"train_loss": -23.719694137573242, "global_step": 210820, "epoch": 2540} {"train_loss": -23.955734252929688, "global_step": 210821, "epoch": 2540} {"train_loss": -23.976858139038086, "global_step": 210822, "epoch": 2540} {"train_loss": -24.058982849121094, "global_step": 210823, "epoch": 2540} {"train_loss": -24.059890747070312, "global_step": 210824, "epoch": 2540} {"train_loss": -23.87331199645996, "global_step": 210825, "epoch": 2540} {"train_loss": -24.079626083374023, "global_step": 210826, "epoch": 2540} {"train_loss": -24.32152557373047, "global_step": 210827, "epoch": 2540} {"train_loss": -24.33511734008789, "global_step": 210828, "epoch": 2540} {"train_loss": -24.473134994506836, "global_step": 210829, "epoch": 2540} {"train_loss": -24.175508499145508, "global_step": 210830, "epoch": 2540} {"train_loss": -24.36842918395996, "global_step": 210831, "epoch": 2540} {"train_loss": -24.13303565979004, "global_step": 210832, "epoch": 2540} {"train_loss": -24.158994674682617, "global_step": 210833, "epoch": 2540} {"train_loss": -24.524871826171875, "global_step": 210834, "epoch": 2540} {"train_loss": -24.298763275146484, "global_step": 210835, "epoch": 2540} {"train_loss": -24.37063980102539, "global_step": 210836, "epoch": 2540} {"train_loss": -24.482803344726562, "global_step": 210837, "epoch": 2540} {"train_loss": -24.50237274169922, "global_step": 210838, "epoch": 2540} {"train_loss": -24.079538345336914, "global_step": 210839, "epoch": 2540} {"train_loss": -24.3153133392334, "global_step": 210840, "epoch": 2540} {"train_loss": -24.43436622619629, "global_step": 210841, "epoch": 2540} {"train_loss": -24.304187774658203, "global_step": 210842, "epoch": 2540} {"train_loss": -24.279071807861328, "global_step": 210843, "epoch": 2540} {"train_loss": -24.312267303466797, "global_step": 210844, "epoch": 2540} {"train_loss": -24.5366268157959, "global_step": 210845, "epoch": 2540} {"train_loss": -24.365158081054688, "global_step": 210846, "epoch": 2540} {"train_loss": -24.642635345458984, "global_step": 210847, "epoch": 2540} {"train_loss": -24.73402214050293, "global_step": 210848, "epoch": 2540} {"train_loss": -24.374441146850586, "global_step": 210849, "epoch": 2540} {"train_loss": -24.73788833618164, "global_step": 210850, "epoch": 2540} {"train_loss": -24.47701644897461, "global_step": 210851, "epoch": 2540} {"train_loss": -24.135610580444336, "global_step": 210852, "epoch": 2540} {"train_loss": -24.554853439331055, "global_step": 210853, "epoch": 2540} {"train_loss": -24.32011604309082, "global_step": 210854, "epoch": 2540} {"train_loss": -24.631492614746094, "global_step": 210855, "epoch": 2540} {"train_loss": -24.6295166015625, "global_step": 210856, "epoch": 2540} {"train_loss": -24.708829879760742, "global_step": 210857, "epoch": 2540} {"train_loss": -24.53128433227539, "global_step": 210858, "epoch": 2540} {"train_loss": -24.846097946166992, "global_step": 210859, "epoch": 2540} {"train_loss": -24.52644157409668, "global_step": 210860, "epoch": 2540} {"train_loss": -24.66367530822754, "global_step": 210861, "epoch": 2540} {"train_loss": -24.43843650817871, "global_step": 210862, "epoch": 2540} {"train_loss": -24.929012298583984, "global_step": 210863, "epoch": 2540} {"train_loss": -24.366512298583984, "global_step": 210864, "epoch": 2540} {"train_loss": -24.384519577026367, "global_step": 210865, "epoch": 2540} {"train_loss": -24.35670280456543, "global_step": 210866, "epoch": 2540} {"train_loss": -24.737974166870117, "global_step": 210867, "epoch": 2540} {"train_loss": -24.607229232788086, "global_step": 210868, "epoch": 2540} {"train_loss": -24.42685890197754, "global_step": 210869, "epoch": 2540} {"train_loss": -24.638551712036133, "global_step": 210870, "epoch": 2540} {"train_loss": -24.606809616088867, "global_step": 210871, "epoch": 2540} {"train_loss": -24.84112548828125, "global_step": 210872, "epoch": 2540} {"train_loss": -24.802152633666992, "global_step": 210873, "epoch": 2540} {"train_loss": -24.78671646118164, "global_step": 210874, "epoch": 2540} {"train_loss": -24.337793350219727, "global_step": 210875, "epoch": 2540} {"train_loss": -24.626197814941406, "global_step": 210876, "epoch": 2540} {"train_loss": -24.48463249206543, "global_step": 210877, "epoch": 2540} {"train_loss": -24.711517333984375, "global_step": 210878, "epoch": 2540} {"train_loss": -24.649229049682617, "global_step": 210879, "epoch": 2540} {"train_loss": -24.474966049194336, "global_step": 210880, "epoch": 2540} {"train_loss": -24.133943557739258, "global_step": 210881, "epoch": 2540} {"train_loss": -24.6027774810791, "global_step": 210882, "epoch": 2540} {"train_loss": -24.461633682250977, "global_step": 210883, "epoch": 2540} {"train_loss": -24.65552520751953, "global_step": 210884, "epoch": 2540} {"train_loss": -24.368473052978516, "global_step": 210885, "epoch": 2540} {"train_loss": -24.43820571899414, "global_step": 210886, "epoch": 2540} {"train_loss": -24.102588653564453, "global_step": 210887, "epoch": 2540} {"train_loss": -24.607328414916992, "global_step": 210888, "epoch": 2540} {"train_loss": -24.25629997253418, "global_step": 210889, "epoch": 2540} {"train_loss": -24.421350479125977, "global_step": 210890, "epoch": 2540} {"train_loss": -24.2923641204834, "global_step": 210891, "epoch": 2540} {"train_loss": -24.355985641479492, "global_step": 210892, "epoch": 2540} {"train_loss": -24.626514434814453, "global_step": 210893, "epoch": 2540} {"train_loss": -24.389698028564453, "global_step": 210894, "epoch": 2540} {"train_loss": -24.449504852294922, "global_step": 210895, "epoch": 2540} {"train_loss": -24.444538116455078, "global_step": 210896, "epoch": 2540} {"train_loss": -24.45912742614746, "global_step": 210897, "epoch": 2540} {"train_loss": -24.590778350830078, "global_step": 210898, "epoch": 2540} {"train_loss": -24.534067153930664, "global_step": 210899, "epoch": 2540} {"train_loss": -24.73423194885254, "global_step": 210900, "epoch": 2540} {"train_loss": -24.510196685791016, "global_step": 210901, "epoch": 2540} {"train_loss": -24.4352511670216, "global_step": 210902, "epoch": 2540, "val_loss": 6631722.0} {"train_loss": -23.94211769104004, "global_step": 210903, "epoch": 2541} {"train_loss": -23.326501846313477, "global_step": 210904, "epoch": 2541} {"train_loss": -24.455228805541992, "global_step": 210905, "epoch": 2541} {"train_loss": -23.493518829345703, "global_step": 210906, "epoch": 2541} {"train_loss": -24.27001953125, "global_step": 210907, "epoch": 2541} {"train_loss": -24.147863388061523, "global_step": 210908, "epoch": 2541} {"train_loss": -24.072616577148438, "global_step": 210909, "epoch": 2541} {"train_loss": -24.13633918762207, "global_step": 210910, "epoch": 2541} {"train_loss": -24.063140869140625, "global_step": 210911, "epoch": 2541} {"train_loss": -23.866256713867188, "global_step": 210912, "epoch": 2541} {"train_loss": -23.50205421447754, "global_step": 210913, "epoch": 2541} {"train_loss": -24.32703971862793, "global_step": 210914, "epoch": 2541} {"train_loss": -24.0676212310791, "global_step": 210915, "epoch": 2541} {"train_loss": -23.859989166259766, "global_step": 210916, "epoch": 2541} {"train_loss": -24.341663360595703, "global_step": 210917, "epoch": 2541} {"train_loss": -24.170982360839844, "global_step": 210918, "epoch": 2541} {"train_loss": -24.302772521972656, "global_step": 210919, "epoch": 2541} {"train_loss": -24.2451171875, "global_step": 210920, "epoch": 2541} {"train_loss": -23.866315841674805, "global_step": 210921, "epoch": 2541} {"train_loss": -23.776199340820312, "global_step": 210922, "epoch": 2541} {"train_loss": -23.838315963745117, "global_step": 210923, "epoch": 2541} {"train_loss": -24.257802963256836, "global_step": 210924, "epoch": 2541} {"train_loss": -24.30535316467285, "global_step": 210925, "epoch": 2541} {"train_loss": -24.39557456970215, "global_step": 210926, "epoch": 2541} {"train_loss": -24.5, "global_step": 210927, "epoch": 2541} {"train_loss": -24.44158935546875, "global_step": 210928, "epoch": 2541} {"train_loss": -24.326108932495117, "global_step": 210929, "epoch": 2541} {"train_loss": -24.229026794433594, "global_step": 210930, "epoch": 2541} {"train_loss": -24.549028396606445, "global_step": 210931, "epoch": 2541} {"train_loss": -23.969898223876953, "global_step": 210932, "epoch": 2541} {"train_loss": -24.46271324157715, "global_step": 210933, "epoch": 2541} {"train_loss": -24.49905014038086, "global_step": 210934, "epoch": 2541} {"train_loss": -23.967248916625977, "global_step": 210935, "epoch": 2541} {"train_loss": -24.51987075805664, "global_step": 210936, "epoch": 2541} {"train_loss": -24.267105102539062, "global_step": 210937, "epoch": 2541} {"train_loss": -24.58089828491211, "global_step": 210938, "epoch": 2541} {"train_loss": -24.271337509155273, "global_step": 210939, "epoch": 2541} {"train_loss": -24.329164505004883, "global_step": 210940, "epoch": 2541} {"train_loss": -24.638391494750977, "global_step": 210941, "epoch": 2541} {"train_loss": -24.702234268188477, "global_step": 210942, "epoch": 2541} {"train_loss": -24.563304901123047, "global_step": 210943, "epoch": 2541} {"train_loss": -24.682851791381836, "global_step": 210944, "epoch": 2541} {"train_loss": -24.4467830657959, "global_step": 210945, "epoch": 2541} {"train_loss": -24.6749324798584, "global_step": 210946, "epoch": 2541} {"train_loss": -24.383703231811523, "global_step": 210947, "epoch": 2541} {"train_loss": -24.43706703186035, "global_step": 210948, "epoch": 2541} {"train_loss": -24.870603561401367, "global_step": 210949, "epoch": 2541} {"train_loss": -24.556028366088867, "global_step": 210950, "epoch": 2541} {"train_loss": -24.68169593811035, "global_step": 210951, "epoch": 2541} {"train_loss": -24.471797943115234, "global_step": 210952, "epoch": 2541} {"train_loss": -24.390592575073242, "global_step": 210953, "epoch": 2541} {"train_loss": -24.572683334350586, "global_step": 210954, "epoch": 2541} {"train_loss": -24.70014762878418, "global_step": 210955, "epoch": 2541} {"train_loss": -24.782052993774414, "global_step": 210956, "epoch": 2541} {"train_loss": -24.245710372924805, "global_step": 210957, "epoch": 2541} {"train_loss": -24.748043060302734, "global_step": 210958, "epoch": 2541} {"train_loss": -24.378692626953125, "global_step": 210959, "epoch": 2541} {"train_loss": -24.41265296936035, "global_step": 210960, "epoch": 2541} {"train_loss": -24.849699020385742, "global_step": 210961, "epoch": 2541} {"train_loss": -24.20526123046875, "global_step": 210962, "epoch": 2541} {"train_loss": -24.406749725341797, "global_step": 210963, "epoch": 2541} {"train_loss": -24.430130004882812, "global_step": 210964, "epoch": 2541} {"train_loss": -24.499757766723633, "global_step": 210965, "epoch": 2541} {"train_loss": -24.357290267944336, "global_step": 210966, "epoch": 2541} {"train_loss": -24.670236587524414, "global_step": 210967, "epoch": 2541} {"train_loss": -24.4315128326416, "global_step": 210968, "epoch": 2541} {"train_loss": -24.069271087646484, "global_step": 210969, "epoch": 2541} {"train_loss": -24.516111373901367, "global_step": 210970, "epoch": 2541} {"train_loss": -24.499330520629883, "global_step": 210971, "epoch": 2541} {"train_loss": -24.660383224487305, "global_step": 210972, "epoch": 2541} {"train_loss": -24.550567626953125, "global_step": 210973, "epoch": 2541} {"train_loss": -24.429122924804688, "global_step": 210974, "epoch": 2541} {"train_loss": -24.40227508544922, "global_step": 210975, "epoch": 2541} {"train_loss": -24.73316192626953, "global_step": 210976, "epoch": 2541} {"train_loss": -24.653905868530273, "global_step": 210977, "epoch": 2541} {"train_loss": -24.695762634277344, "global_step": 210978, "epoch": 2541} {"train_loss": -24.469167709350586, "global_step": 210979, "epoch": 2541} {"train_loss": -24.284183502197266, "global_step": 210980, "epoch": 2541} {"train_loss": -24.589096069335938, "global_step": 210981, "epoch": 2541} {"train_loss": -24.804637908935547, "global_step": 210982, "epoch": 2541} {"train_loss": -24.751312255859375, "global_step": 210983, "epoch": 2541} {"train_loss": -24.183164596557617, "global_step": 210984, "epoch": 2541} {"train_loss": -24.35937123126294, "global_step": 210985, "epoch": 2541, "val_loss": 6609743.5} {"train_loss": -24.273962020874023, "global_step": 210986, "epoch": 2542} {"train_loss": -24.102375030517578, "global_step": 210987, "epoch": 2542} {"train_loss": -24.125900268554688, "global_step": 210988, "epoch": 2542} {"train_loss": -24.41388511657715, "global_step": 210989, "epoch": 2542} {"train_loss": -24.324106216430664, "global_step": 210990, "epoch": 2542} {"train_loss": -24.119586944580078, "global_step": 210991, "epoch": 2542} {"train_loss": -24.30409812927246, "global_step": 210992, "epoch": 2542} {"train_loss": -23.775671005249023, "global_step": 210993, "epoch": 2542} {"train_loss": -24.18643569946289, "global_step": 210994, "epoch": 2542} {"train_loss": -24.19312286376953, "global_step": 210995, "epoch": 2542} {"train_loss": -24.3790340423584, "global_step": 210996, "epoch": 2542} {"train_loss": -24.66596031188965, "global_step": 210997, "epoch": 2542} {"train_loss": -24.36260986328125, "global_step": 210998, "epoch": 2542} {"train_loss": -24.499670028686523, "global_step": 210999, "epoch": 2542} {"train_loss": -24.387149810791016, "global_step": 211000, "epoch": 2542} {"train_loss": -24.541500091552734, "global_step": 211001, "epoch": 2542} {"train_loss": -24.46902847290039, "global_step": 211002, "epoch": 2542} {"train_loss": -24.474477767944336, "global_step": 211003, "epoch": 2542} {"train_loss": -24.400676727294922, "global_step": 211004, "epoch": 2542} {"train_loss": -24.229724884033203, "global_step": 211005, "epoch": 2542} {"train_loss": -24.23931121826172, "global_step": 211006, "epoch": 2542} {"train_loss": -24.464630126953125, "global_step": 211007, "epoch": 2542} {"train_loss": -24.600351333618164, "global_step": 211008, "epoch": 2542} {"train_loss": -24.58795166015625, "global_step": 211009, "epoch": 2542} {"train_loss": -23.965408325195312, "global_step": 211010, "epoch": 2542} {"train_loss": -24.585355758666992, "global_step": 211011, "epoch": 2542} {"train_loss": -24.740346908569336, "global_step": 211012, "epoch": 2542} {"train_loss": -24.637693405151367, "global_step": 211013, "epoch": 2542} {"train_loss": -24.035282135009766, "global_step": 211014, "epoch": 2542} {"train_loss": -24.46338653564453, "global_step": 211015, "epoch": 2542} {"train_loss": -24.30877685546875, "global_step": 211016, "epoch": 2542} {"train_loss": -24.478696823120117, "global_step": 211017, "epoch": 2542} {"train_loss": -24.456708908081055, "global_step": 211018, "epoch": 2542} {"train_loss": -24.37436866760254, "global_step": 211019, "epoch": 2542} {"train_loss": -24.458642959594727, "global_step": 211020, "epoch": 2542} {"train_loss": -24.328826904296875, "global_step": 211021, "epoch": 2542} {"train_loss": -24.56341552734375, "global_step": 211022, "epoch": 2542} {"train_loss": -24.800207138061523, "global_step": 211023, "epoch": 2542} {"train_loss": -24.177900314331055, "global_step": 211024, "epoch": 2542} {"train_loss": -24.294055938720703, "global_step": 211025, "epoch": 2542} {"train_loss": -24.385717391967773, "global_step": 211026, "epoch": 2542} {"train_loss": -24.134138107299805, "global_step": 211027, "epoch": 2542} {"train_loss": -23.727323532104492, "global_step": 211028, "epoch": 2542} {"train_loss": -24.476293563842773, "global_step": 211029, "epoch": 2542} {"train_loss": -24.712751388549805, "global_step": 211030, "epoch": 2542} {"train_loss": -24.202756881713867, "global_step": 211031, "epoch": 2542} {"train_loss": -23.65386390686035, "global_step": 211032, "epoch": 2542} {"train_loss": -24.18239402770996, "global_step": 211033, "epoch": 2542} {"train_loss": -24.629226684570312, "global_step": 211034, "epoch": 2542} {"train_loss": -24.462141036987305, "global_step": 211035, "epoch": 2542} {"train_loss": -24.303678512573242, "global_step": 211036, "epoch": 2542} {"train_loss": -24.34885025024414, "global_step": 211037, "epoch": 2542} {"train_loss": -24.179405212402344, "global_step": 211038, "epoch": 2542} {"train_loss": -24.52935218811035, "global_step": 211039, "epoch": 2542} {"train_loss": -24.71443748474121, "global_step": 211040, "epoch": 2542} {"train_loss": -24.482507705688477, "global_step": 211041, "epoch": 2542} {"train_loss": -24.554094314575195, "global_step": 211042, "epoch": 2542} {"train_loss": -24.317081451416016, "global_step": 211043, "epoch": 2542} {"train_loss": -24.418325424194336, "global_step": 211044, "epoch": 2542} {"train_loss": -24.710695266723633, "global_step": 211045, "epoch": 2542} {"train_loss": -24.41083526611328, "global_step": 211046, "epoch": 2542} {"train_loss": -24.451740264892578, "global_step": 211047, "epoch": 2542} {"train_loss": -24.52631187438965, "global_step": 211048, "epoch": 2542} {"train_loss": -24.59443473815918, "global_step": 211049, "epoch": 2542} {"train_loss": -24.35148048400879, "global_step": 211050, "epoch": 2542} {"train_loss": -24.923208236694336, "global_step": 211051, "epoch": 2542} {"train_loss": -24.32417106628418, "global_step": 211052, "epoch": 2542} {"train_loss": -24.119327545166016, "global_step": 211053, "epoch": 2542} {"train_loss": -24.740089416503906, "global_step": 211054, "epoch": 2542} {"train_loss": -24.546329498291016, "global_step": 211055, "epoch": 2542} {"train_loss": -24.479917526245117, "global_step": 211056, "epoch": 2542} {"train_loss": -24.606786727905273, "global_step": 211057, "epoch": 2542} {"train_loss": -24.799480438232422, "global_step": 211058, "epoch": 2542} {"train_loss": -24.40779685974121, "global_step": 211059, "epoch": 2542} {"train_loss": -24.45015525817871, "global_step": 211060, "epoch": 2542} {"train_loss": -24.379196166992188, "global_step": 211061, "epoch": 2542} {"train_loss": -24.64459228515625, "global_step": 211062, "epoch": 2542} {"train_loss": -24.834518432617188, "global_step": 211063, "epoch": 2542} {"train_loss": -24.473661422729492, "global_step": 211064, "epoch": 2542} {"train_loss": -24.715717315673828, "global_step": 211065, "epoch": 2542} {"train_loss": -24.560354232788086, "global_step": 211066, "epoch": 2542} {"train_loss": -24.641239166259766, "global_step": 211067, "epoch": 2542} {"train_loss": -24.41113400746541, "global_step": 211068, "epoch": 2542, "val_loss": 6677345.0} {"train_loss": -24.159725189208984, "global_step": 211069, "epoch": 2543} {"train_loss": -24.07442283630371, "global_step": 211070, "epoch": 2543} {"train_loss": -24.30280113220215, "global_step": 211071, "epoch": 2543} {"train_loss": -23.927167892456055, "global_step": 211072, "epoch": 2543} {"train_loss": -23.97357177734375, "global_step": 211073, "epoch": 2543} {"train_loss": -24.333847045898438, "global_step": 211074, "epoch": 2543} {"train_loss": -24.476774215698242, "global_step": 211075, "epoch": 2543} {"train_loss": -24.277481079101562, "global_step": 211076, "epoch": 2543} {"train_loss": -24.281665802001953, "global_step": 211077, "epoch": 2543} {"train_loss": -24.47498893737793, "global_step": 211078, "epoch": 2543} {"train_loss": -24.280263900756836, "global_step": 211079, "epoch": 2543} {"train_loss": -24.346033096313477, "global_step": 211080, "epoch": 2543} {"train_loss": -23.977062225341797, "global_step": 211081, "epoch": 2543} {"train_loss": -24.621057510375977, "global_step": 211082, "epoch": 2543} {"train_loss": -24.31756591796875, "global_step": 211083, "epoch": 2543} {"train_loss": -24.561717987060547, "global_step": 211084, "epoch": 2543} {"train_loss": -24.024747848510742, "global_step": 211085, "epoch": 2543} {"train_loss": -24.41092872619629, "global_step": 211086, "epoch": 2543} {"train_loss": -24.451614379882812, "global_step": 211087, "epoch": 2543} {"train_loss": -24.62200355529785, "global_step": 211088, "epoch": 2543} {"train_loss": -24.416748046875, "global_step": 211089, "epoch": 2543} {"train_loss": -24.214492797851562, "global_step": 211090, "epoch": 2543} {"train_loss": -24.260953903198242, "global_step": 211091, "epoch": 2543} {"train_loss": -24.845680236816406, "global_step": 211092, "epoch": 2543} {"train_loss": -24.387754440307617, "global_step": 211093, "epoch": 2543} {"train_loss": -24.06140899658203, "global_step": 211094, "epoch": 2543} {"train_loss": -24.08170509338379, "global_step": 211095, "epoch": 2543} {"train_loss": -24.34907341003418, "global_step": 211096, "epoch": 2543} {"train_loss": -24.196908950805664, "global_step": 211097, "epoch": 2543} {"train_loss": -24.595449447631836, "global_step": 211098, "epoch": 2543} {"train_loss": -24.216266632080078, "global_step": 211099, "epoch": 2543} {"train_loss": -24.4046573638916, "global_step": 211100, "epoch": 2543} {"train_loss": -24.40578269958496, "global_step": 211101, "epoch": 2543} {"train_loss": -24.38063621520996, "global_step": 211102, "epoch": 2543} {"train_loss": -24.55878257751465, "global_step": 211103, "epoch": 2543} {"train_loss": -24.787519454956055, "global_step": 211104, "epoch": 2543} {"train_loss": -24.449926376342773, "global_step": 211105, "epoch": 2543} {"train_loss": -24.24593162536621, "global_step": 211106, "epoch": 2543} {"train_loss": -24.528839111328125, "global_step": 211107, "epoch": 2543} {"train_loss": -24.189950942993164, "global_step": 211108, "epoch": 2543} {"train_loss": -24.670852661132812, "global_step": 211109, "epoch": 2543} {"train_loss": -24.65167236328125, "global_step": 211110, "epoch": 2543} {"train_loss": -24.528364181518555, "global_step": 211111, "epoch": 2543} {"train_loss": -24.648513793945312, "global_step": 211112, "epoch": 2543} {"train_loss": -25.034297943115234, "global_step": 211113, "epoch": 2543} {"train_loss": -24.359647750854492, "global_step": 211114, "epoch": 2543} {"train_loss": -24.684598922729492, "global_step": 211115, "epoch": 2543} {"train_loss": -24.484100341796875, "global_step": 211116, "epoch": 2543} {"train_loss": -24.581411361694336, "global_step": 211117, "epoch": 2543} {"train_loss": -24.48106575012207, "global_step": 211118, "epoch": 2543} {"train_loss": -24.38787269592285, "global_step": 211119, "epoch": 2543} {"train_loss": -24.510976791381836, "global_step": 211120, "epoch": 2543} {"train_loss": -24.56305503845215, "global_step": 211121, "epoch": 2543} {"train_loss": -24.223892211914062, "global_step": 211122, "epoch": 2543} {"train_loss": -23.915504455566406, "global_step": 211123, "epoch": 2543} {"train_loss": -23.936954498291016, "global_step": 211124, "epoch": 2543} {"train_loss": -23.825519561767578, "global_step": 211125, "epoch": 2543} {"train_loss": -24.488454818725586, "global_step": 211126, "epoch": 2543} {"train_loss": -24.73457145690918, "global_step": 211127, "epoch": 2543} {"train_loss": -24.00911521911621, "global_step": 211128, "epoch": 2543} {"train_loss": -24.10912322998047, "global_step": 211129, "epoch": 2543} {"train_loss": -24.49925994873047, "global_step": 211130, "epoch": 2543} {"train_loss": -23.994680404663086, "global_step": 211131, "epoch": 2543} {"train_loss": -23.909109115600586, "global_step": 211132, "epoch": 2543} {"train_loss": -24.603113174438477, "global_step": 211133, "epoch": 2543} {"train_loss": -24.330045700073242, "global_step": 211134, "epoch": 2543} {"train_loss": -24.69978141784668, "global_step": 211135, "epoch": 2543} {"train_loss": -24.11664390563965, "global_step": 211136, "epoch": 2543} {"train_loss": -24.551889419555664, "global_step": 211137, "epoch": 2543} {"train_loss": -24.159955978393555, "global_step": 211138, "epoch": 2543} {"train_loss": -24.216108322143555, "global_step": 211139, "epoch": 2543} {"train_loss": -24.322940826416016, "global_step": 211140, "epoch": 2543} {"train_loss": -24.230350494384766, "global_step": 211141, "epoch": 2543} {"train_loss": -24.092260360717773, "global_step": 211142, "epoch": 2543} {"train_loss": -24.15009880065918, "global_step": 211143, "epoch": 2543} {"train_loss": -24.24234962463379, "global_step": 211144, "epoch": 2543} {"train_loss": -24.497831344604492, "global_step": 211145, "epoch": 2543} {"train_loss": -24.571365356445312, "global_step": 211146, "epoch": 2543} {"train_loss": -24.162687301635742, "global_step": 211147, "epoch": 2543} {"train_loss": -24.420522689819336, "global_step": 211148, "epoch": 2543} {"train_loss": -24.176265716552734, "global_step": 211149, "epoch": 2543} {"train_loss": -24.108001708984375, "global_step": 211150, "epoch": 2543} {"train_loss": -24.350477241608033, "global_step": 211151, "epoch": 2543, "val_loss": 6556506.0} {"train_loss": -23.871294021606445, "global_step": 211152, "epoch": 2544} {"train_loss": -24.03689956665039, "global_step": 211153, "epoch": 2544} {"train_loss": -24.32935905456543, "global_step": 211154, "epoch": 2544} {"train_loss": -23.958242416381836, "global_step": 211155, "epoch": 2544} {"train_loss": -24.266199111938477, "global_step": 211156, "epoch": 2544} {"train_loss": -24.290430068969727, "global_step": 211157, "epoch": 2544} {"train_loss": -24.265121459960938, "global_step": 211158, "epoch": 2544} {"train_loss": -24.356828689575195, "global_step": 211159, "epoch": 2544} {"train_loss": -24.280317306518555, "global_step": 211160, "epoch": 2544} {"train_loss": -24.204404830932617, "global_step": 211161, "epoch": 2544} {"train_loss": -24.380979537963867, "global_step": 211162, "epoch": 2544} {"train_loss": -24.058210372924805, "global_step": 211163, "epoch": 2544} {"train_loss": -24.262475967407227, "global_step": 211164, "epoch": 2544} {"train_loss": -24.243986129760742, "global_step": 211165, "epoch": 2544} {"train_loss": -24.23418617248535, "global_step": 211166, "epoch": 2544} {"train_loss": -24.26152992248535, "global_step": 211167, "epoch": 2544} {"train_loss": -24.295278549194336, "global_step": 211168, "epoch": 2544} {"train_loss": -24.47519302368164, "global_step": 211169, "epoch": 2544} {"train_loss": -24.45822525024414, "global_step": 211170, "epoch": 2544} {"train_loss": -24.263595581054688, "global_step": 211171, "epoch": 2544} {"train_loss": -24.612384796142578, "global_step": 211172, "epoch": 2544} {"train_loss": -24.458192825317383, "global_step": 211173, "epoch": 2544} {"train_loss": -24.33241844177246, "global_step": 211174, "epoch": 2544} {"train_loss": -24.819683074951172, "global_step": 211175, "epoch": 2544} {"train_loss": -24.525787353515625, "global_step": 211176, "epoch": 2544} {"train_loss": -24.770479202270508, "global_step": 211177, "epoch": 2544} {"train_loss": -24.520185470581055, "global_step": 211178, "epoch": 2544} {"train_loss": -24.373218536376953, "global_step": 211179, "epoch": 2544} {"train_loss": -24.638015747070312, "global_step": 211180, "epoch": 2544} {"train_loss": -24.50860595703125, "global_step": 211181, "epoch": 2544} {"train_loss": -24.38524627685547, "global_step": 211182, "epoch": 2544} {"train_loss": -25.140722274780273, "global_step": 211183, "epoch": 2544} {"train_loss": -24.71820640563965, "global_step": 211184, "epoch": 2544} {"train_loss": -24.71516227722168, "global_step": 211185, "epoch": 2544} {"train_loss": -24.74012565612793, "global_step": 211186, "epoch": 2544} {"train_loss": -24.61863899230957, "global_step": 211187, "epoch": 2544} {"train_loss": -24.809711456298828, "global_step": 211188, "epoch": 2544} {"train_loss": -24.336416244506836, "global_step": 211189, "epoch": 2544} {"train_loss": -24.18218231201172, "global_step": 211190, "epoch": 2544} {"train_loss": -24.290300369262695, "global_step": 211191, "epoch": 2544} {"train_loss": -24.49244499206543, "global_step": 211192, "epoch": 2544} {"train_loss": -24.333410263061523, "global_step": 211193, "epoch": 2544} {"train_loss": -24.66914176940918, "global_step": 211194, "epoch": 2544} {"train_loss": -24.22373390197754, "global_step": 211195, "epoch": 2544} {"train_loss": -24.326282501220703, "global_step": 211196, "epoch": 2544} {"train_loss": -24.414142608642578, "global_step": 211197, "epoch": 2544} {"train_loss": -24.697101593017578, "global_step": 211198, "epoch": 2544} {"train_loss": -24.64374351501465, "global_step": 211199, "epoch": 2544} {"train_loss": -24.71906280517578, "global_step": 211200, "epoch": 2544} {"train_loss": -24.415332794189453, "global_step": 211201, "epoch": 2544} {"train_loss": -24.317983627319336, "global_step": 211202, "epoch": 2544} {"train_loss": -24.30042839050293, "global_step": 211203, "epoch": 2544} {"train_loss": -24.45247459411621, "global_step": 211204, "epoch": 2544} {"train_loss": -24.409387588500977, "global_step": 211205, "epoch": 2544} {"train_loss": -24.16455078125, "global_step": 211206, "epoch": 2544} {"train_loss": -24.52704429626465, "global_step": 211207, "epoch": 2544} {"train_loss": -24.667465209960938, "global_step": 211208, "epoch": 2544} {"train_loss": -24.150182723999023, "global_step": 211209, "epoch": 2544} {"train_loss": -24.191572189331055, "global_step": 211210, "epoch": 2544} {"train_loss": -24.502294540405273, "global_step": 211211, "epoch": 2544} {"train_loss": -24.454771041870117, "global_step": 211212, "epoch": 2544} {"train_loss": -24.276044845581055, "global_step": 211213, "epoch": 2544} {"train_loss": -24.52973175048828, "global_step": 211214, "epoch": 2544} {"train_loss": -24.26207733154297, "global_step": 211215, "epoch": 2544} {"train_loss": -24.545917510986328, "global_step": 211216, "epoch": 2544} {"train_loss": -24.556848526000977, "global_step": 211217, "epoch": 2544} {"train_loss": -24.330657958984375, "global_step": 211218, "epoch": 2544} {"train_loss": -24.230283737182617, "global_step": 211219, "epoch": 2544} {"train_loss": -24.320453643798828, "global_step": 211220, "epoch": 2544} {"train_loss": -24.445083618164062, "global_step": 211221, "epoch": 2544} {"train_loss": -24.557004928588867, "global_step": 211222, "epoch": 2544} {"train_loss": -24.587047576904297, "global_step": 211223, "epoch": 2544} {"train_loss": -24.435720443725586, "global_step": 211224, "epoch": 2544} {"train_loss": -24.69869041442871, "global_step": 211225, "epoch": 2544} {"train_loss": -24.395587921142578, "global_step": 211226, "epoch": 2544} {"train_loss": -24.331287384033203, "global_step": 211227, "epoch": 2544} {"train_loss": -24.593822479248047, "global_step": 211228, "epoch": 2544} {"train_loss": -24.574705123901367, "global_step": 211229, "epoch": 2544} {"train_loss": -24.799009323120117, "global_step": 211230, "epoch": 2544} {"train_loss": -24.5578670501709, "global_step": 211231, "epoch": 2544} {"train_loss": -24.348529815673828, "global_step": 211232, "epoch": 2544} {"train_loss": -24.458389282226562, "global_step": 211233, "epoch": 2544} {"train_loss": -24.452583404908697, "global_step": 211234, "epoch": 2544, "val_loss": 6482927.0} {"train_loss": -23.256332397460938, "global_step": 211235, "epoch": 2545} {"train_loss": -22.77815055847168, "global_step": 211236, "epoch": 2545} {"train_loss": -23.778156280517578, "global_step": 211237, "epoch": 2545} {"train_loss": -22.975858688354492, "global_step": 211238, "epoch": 2545} {"train_loss": -23.496606826782227, "global_step": 211239, "epoch": 2545} {"train_loss": -23.29598045349121, "global_step": 211240, "epoch": 2545} {"train_loss": -23.57777976989746, "global_step": 211241, "epoch": 2545} {"train_loss": -23.891799926757812, "global_step": 211242, "epoch": 2545} {"train_loss": -23.830793380737305, "global_step": 211243, "epoch": 2545} {"train_loss": -23.69656753540039, "global_step": 211244, "epoch": 2545} {"train_loss": -23.646820068359375, "global_step": 211245, "epoch": 2545} {"train_loss": -23.610963821411133, "global_step": 211246, "epoch": 2545} {"train_loss": -24.03371238708496, "global_step": 211247, "epoch": 2545} {"train_loss": -23.978683471679688, "global_step": 211248, "epoch": 2545} {"train_loss": -24.02273178100586, "global_step": 211249, "epoch": 2545} {"train_loss": -24.030948638916016, "global_step": 211250, "epoch": 2545} {"train_loss": -23.791183471679688, "global_step": 211251, "epoch": 2545} {"train_loss": -24.37906837463379, "global_step": 211252, "epoch": 2545} {"train_loss": -24.14467430114746, "global_step": 211253, "epoch": 2545} {"train_loss": -24.04315757751465, "global_step": 211254, "epoch": 2545} {"train_loss": -23.96730613708496, "global_step": 211255, "epoch": 2545} {"train_loss": -24.04231834411621, "global_step": 211256, "epoch": 2545} {"train_loss": -24.24612045288086, "global_step": 211257, "epoch": 2545} {"train_loss": -24.181371688842773, "global_step": 211258, "epoch": 2545} {"train_loss": -23.81973648071289, "global_step": 211259, "epoch": 2545} {"train_loss": -24.008665084838867, "global_step": 211260, "epoch": 2545} {"train_loss": -24.776527404785156, "global_step": 211261, "epoch": 2545} {"train_loss": -24.312715530395508, "global_step": 211262, "epoch": 2545} {"train_loss": -24.667539596557617, "global_step": 211263, "epoch": 2545} {"train_loss": -24.370399475097656, "global_step": 211264, "epoch": 2545} {"train_loss": -24.389413833618164, "global_step": 211265, "epoch": 2545} {"train_loss": -24.063058853149414, "global_step": 211266, "epoch": 2545} {"train_loss": -24.320707321166992, "global_step": 211267, "epoch": 2545} {"train_loss": -24.4415225982666, "global_step": 211268, "epoch": 2545} {"train_loss": -24.07414436340332, "global_step": 211269, "epoch": 2545} {"train_loss": -24.41621208190918, "global_step": 211270, "epoch": 2545} {"train_loss": -24.710926055908203, "global_step": 211271, "epoch": 2545} {"train_loss": -24.281490325927734, "global_step": 211272, "epoch": 2545} {"train_loss": -24.66448974609375, "global_step": 211273, "epoch": 2545} {"train_loss": -24.392927169799805, "global_step": 211274, "epoch": 2545} {"train_loss": -24.5461368560791, "global_step": 211275, "epoch": 2545} {"train_loss": -24.526874542236328, "global_step": 211276, "epoch": 2545} {"train_loss": -24.684616088867188, "global_step": 211277, "epoch": 2545} {"train_loss": -24.50203514099121, "global_step": 211278, "epoch": 2545} {"train_loss": -24.065067291259766, "global_step": 211279, "epoch": 2545} {"train_loss": -24.437889099121094, "global_step": 211280, "epoch": 2545} {"train_loss": -24.396284103393555, "global_step": 211281, "epoch": 2545} {"train_loss": -24.629154205322266, "global_step": 211282, "epoch": 2545} {"train_loss": -24.314096450805664, "global_step": 211283, "epoch": 2545} {"train_loss": -24.67624855041504, "global_step": 211284, "epoch": 2545} {"train_loss": -24.58155632019043, "global_step": 211285, "epoch": 2545} {"train_loss": -24.927974700927734, "global_step": 211286, "epoch": 2545} {"train_loss": -24.28291893005371, "global_step": 211287, "epoch": 2545} {"train_loss": -24.10566520690918, "global_step": 211288, "epoch": 2545} {"train_loss": -24.508752822875977, "global_step": 211289, "epoch": 2545} {"train_loss": -24.73005485534668, "global_step": 211290, "epoch": 2545} {"train_loss": -24.51064109802246, "global_step": 211291, "epoch": 2545} {"train_loss": -24.181638717651367, "global_step": 211292, "epoch": 2545} {"train_loss": -24.275104522705078, "global_step": 211293, "epoch": 2545} {"train_loss": -24.48691177368164, "global_step": 211294, "epoch": 2545} {"train_loss": -24.496885299682617, "global_step": 211295, "epoch": 2545} {"train_loss": -24.36046600341797, "global_step": 211296, "epoch": 2545} {"train_loss": -24.675682067871094, "global_step": 211297, "epoch": 2545} {"train_loss": -24.455453872680664, "global_step": 211298, "epoch": 2545} {"train_loss": -24.42073631286621, "global_step": 211299, "epoch": 2545} {"train_loss": -24.387922286987305, "global_step": 211300, "epoch": 2545} {"train_loss": -24.429475784301758, "global_step": 211301, "epoch": 2545} {"train_loss": -24.6538143157959, "global_step": 211302, "epoch": 2545} {"train_loss": -24.466350555419922, "global_step": 211303, "epoch": 2545} {"train_loss": -24.239885330200195, "global_step": 211304, "epoch": 2545} {"train_loss": -24.347305297851562, "global_step": 211305, "epoch": 2545} {"train_loss": -24.6030216217041, "global_step": 211306, "epoch": 2545} {"train_loss": -24.351415634155273, "global_step": 211307, "epoch": 2545} {"train_loss": -24.17453956604004, "global_step": 211308, "epoch": 2545} {"train_loss": -24.11562728881836, "global_step": 211309, "epoch": 2545} {"train_loss": -24.482013702392578, "global_step": 211310, "epoch": 2545} {"train_loss": -24.38701629638672, "global_step": 211311, "epoch": 2545} {"train_loss": -24.30475425720215, "global_step": 211312, "epoch": 2545} {"train_loss": -24.64250373840332, "global_step": 211313, "epoch": 2545} {"train_loss": -24.169466018676758, "global_step": 211314, "epoch": 2545} {"train_loss": -24.266489028930664, "global_step": 211315, "epoch": 2545} {"train_loss": -23.87470054626465, "global_step": 211316, "epoch": 2545} {"train_loss": -24.228814021650567, "global_step": 211317, "epoch": 2545, "val_loss": 6581683.5} {"train_loss": -23.904024124145508, "global_step": 211318, "epoch": 2546} {"train_loss": -23.854223251342773, "global_step": 211319, "epoch": 2546} {"train_loss": -23.52875518798828, "global_step": 211320, "epoch": 2546} {"train_loss": -23.571836471557617, "global_step": 211321, "epoch": 2546} {"train_loss": -23.777158737182617, "global_step": 211322, "epoch": 2546} {"train_loss": -23.53862953186035, "global_step": 211323, "epoch": 2546} {"train_loss": -24.155290603637695, "global_step": 211324, "epoch": 2546} {"train_loss": -23.61223030090332, "global_step": 211325, "epoch": 2546} {"train_loss": -24.155183792114258, "global_step": 211326, "epoch": 2546} {"train_loss": -23.841413497924805, "global_step": 211327, "epoch": 2546} {"train_loss": -23.941923141479492, "global_step": 211328, "epoch": 2546} {"train_loss": -24.16595458984375, "global_step": 211329, "epoch": 2546} {"train_loss": -24.00135612487793, "global_step": 211330, "epoch": 2546} {"train_loss": -24.218791961669922, "global_step": 211331, "epoch": 2546} {"train_loss": -23.93679428100586, "global_step": 211332, "epoch": 2546} {"train_loss": -24.089391708374023, "global_step": 211333, "epoch": 2546} {"train_loss": -24.021194458007812, "global_step": 211334, "epoch": 2546} {"train_loss": -24.072675704956055, "global_step": 211335, "epoch": 2546} {"train_loss": -24.1816349029541, "global_step": 211336, "epoch": 2546} {"train_loss": -23.981525421142578, "global_step": 211337, "epoch": 2546} {"train_loss": -24.04313087463379, "global_step": 211338, "epoch": 2546} {"train_loss": -23.708173751831055, "global_step": 211339, "epoch": 2546} {"train_loss": -24.272537231445312, "global_step": 211340, "epoch": 2546} {"train_loss": -24.5186824798584, "global_step": 211341, "epoch": 2546} {"train_loss": -24.22426414489746, "global_step": 211342, "epoch": 2546} {"train_loss": -24.424274444580078, "global_step": 211343, "epoch": 2546} {"train_loss": -24.140207290649414, "global_step": 211344, "epoch": 2546} {"train_loss": -24.26560401916504, "global_step": 211345, "epoch": 2546} {"train_loss": -24.342252731323242, "global_step": 211346, "epoch": 2546} {"train_loss": -24.178447723388672, "global_step": 211347, "epoch": 2546} {"train_loss": -24.408432006835938, "global_step": 211348, "epoch": 2546} {"train_loss": -24.116981506347656, "global_step": 211349, "epoch": 2546} {"train_loss": -24.200788497924805, "global_step": 211350, "epoch": 2546} {"train_loss": -24.55536460876465, "global_step": 211351, "epoch": 2546} {"train_loss": -24.274242401123047, "global_step": 211352, "epoch": 2546} {"train_loss": -24.54060173034668, "global_step": 211353, "epoch": 2546} {"train_loss": -24.64411163330078, "global_step": 211354, "epoch": 2546} {"train_loss": -24.32745933532715, "global_step": 211355, "epoch": 2546} {"train_loss": -24.525423049926758, "global_step": 211356, "epoch": 2546} {"train_loss": -24.603513717651367, "global_step": 211357, "epoch": 2546} {"train_loss": -24.420576095581055, "global_step": 211358, "epoch": 2546} {"train_loss": -24.302326202392578, "global_step": 211359, "epoch": 2546} {"train_loss": -24.396196365356445, "global_step": 211360, "epoch": 2546} {"train_loss": -24.68393325805664, "global_step": 211361, "epoch": 2546} {"train_loss": -24.65505027770996, "global_step": 211362, "epoch": 2546} {"train_loss": -24.168354034423828, "global_step": 211363, "epoch": 2546} {"train_loss": -24.48756217956543, "global_step": 211364, "epoch": 2546} {"train_loss": -24.788408279418945, "global_step": 211365, "epoch": 2546} {"train_loss": -24.31804656982422, "global_step": 211366, "epoch": 2546} {"train_loss": -24.799158096313477, "global_step": 211367, "epoch": 2546} {"train_loss": -24.564008712768555, "global_step": 211368, "epoch": 2546} {"train_loss": -24.563003540039062, "global_step": 211369, "epoch": 2546} {"train_loss": -24.74196434020996, "global_step": 211370, "epoch": 2546} {"train_loss": -24.62823486328125, "global_step": 211371, "epoch": 2546} {"train_loss": -24.649438858032227, "global_step": 211372, "epoch": 2546} {"train_loss": -24.36408042907715, "global_step": 211373, "epoch": 2546} {"train_loss": -24.324026107788086, "global_step": 211374, "epoch": 2546} {"train_loss": -24.057226181030273, "global_step": 211375, "epoch": 2546} {"train_loss": -24.198253631591797, "global_step": 211376, "epoch": 2546} {"train_loss": -24.237497329711914, "global_step": 211377, "epoch": 2546} {"train_loss": -23.945098876953125, "global_step": 211378, "epoch": 2546} {"train_loss": -24.24142837524414, "global_step": 211379, "epoch": 2546} {"train_loss": -24.324819564819336, "global_step": 211380, "epoch": 2546} {"train_loss": -24.929960250854492, "global_step": 211381, "epoch": 2546} {"train_loss": -24.433908462524414, "global_step": 211382, "epoch": 2546} {"train_loss": -24.647415161132812, "global_step": 211383, "epoch": 2546} {"train_loss": -24.436338424682617, "global_step": 211384, "epoch": 2546} {"train_loss": -24.460596084594727, "global_step": 211385, "epoch": 2546} {"train_loss": -24.268529891967773, "global_step": 211386, "epoch": 2546} {"train_loss": -24.401458740234375, "global_step": 211387, "epoch": 2546} {"train_loss": -24.219547271728516, "global_step": 211388, "epoch": 2546} {"train_loss": -24.311220169067383, "global_step": 211389, "epoch": 2546} {"train_loss": -24.58477783203125, "global_step": 211390, "epoch": 2546} {"train_loss": -24.410297393798828, "global_step": 211391, "epoch": 2546} {"train_loss": -24.531938552856445, "global_step": 211392, "epoch": 2546} {"train_loss": -24.414920806884766, "global_step": 211393, "epoch": 2546} {"train_loss": -24.099164962768555, "global_step": 211394, "epoch": 2546} {"train_loss": -24.14600944519043, "global_step": 211395, "epoch": 2546} {"train_loss": -24.60238265991211, "global_step": 211396, "epoch": 2546} {"train_loss": -24.25567054748535, "global_step": 211397, "epoch": 2546} {"train_loss": -24.75335693359375, "global_step": 211398, "epoch": 2546} {"train_loss": -24.46720314025879, "global_step": 211399, "epoch": 2546} {"train_loss": -24.29369331267943, "global_step": 211400, "epoch": 2546, "val_loss": 6669272.0} {"train_loss": -23.880929946899414, "global_step": 211401, "epoch": 2547} {"train_loss": -24.210294723510742, "global_step": 211402, "epoch": 2547} {"train_loss": -24.2298526763916, "global_step": 211403, "epoch": 2547} {"train_loss": -24.280643463134766, "global_step": 211404, "epoch": 2547} {"train_loss": -24.060041427612305, "global_step": 211405, "epoch": 2547} {"train_loss": -24.240924835205078, "global_step": 211406, "epoch": 2547} {"train_loss": -24.119613647460938, "global_step": 211407, "epoch": 2547} {"train_loss": -24.420291900634766, "global_step": 211408, "epoch": 2547} {"train_loss": -24.342731475830078, "global_step": 211409, "epoch": 2547} {"train_loss": -24.395803451538086, "global_step": 211410, "epoch": 2547} {"train_loss": -24.0582332611084, "global_step": 211411, "epoch": 2547} {"train_loss": -24.11227035522461, "global_step": 211412, "epoch": 2547} {"train_loss": -24.32765007019043, "global_step": 211413, "epoch": 2547} {"train_loss": -24.13340187072754, "global_step": 211414, "epoch": 2547} {"train_loss": -24.436264038085938, "global_step": 211415, "epoch": 2547} {"train_loss": -24.590307235717773, "global_step": 211416, "epoch": 2547} {"train_loss": -24.294458389282227, "global_step": 211417, "epoch": 2547} {"train_loss": -24.53549575805664, "global_step": 211418, "epoch": 2547} {"train_loss": -23.898523330688477, "global_step": 211419, "epoch": 2547} {"train_loss": -24.3496150970459, "global_step": 211420, "epoch": 2547} {"train_loss": -23.852062225341797, "global_step": 211421, "epoch": 2547} {"train_loss": -24.45857810974121, "global_step": 211422, "epoch": 2547} {"train_loss": -24.439558029174805, "global_step": 211423, "epoch": 2547} {"train_loss": -24.440587997436523, "global_step": 211424, "epoch": 2547} {"train_loss": -24.469364166259766, "global_step": 211425, "epoch": 2547} {"train_loss": -24.5073299407959, "global_step": 211426, "epoch": 2547} {"train_loss": -24.404565811157227, "global_step": 211427, "epoch": 2547} {"train_loss": -24.4116153717041, "global_step": 211428, "epoch": 2547} {"train_loss": -24.423839569091797, "global_step": 211429, "epoch": 2547} {"train_loss": -24.60879898071289, "global_step": 211430, "epoch": 2547} {"train_loss": -24.099637985229492, "global_step": 211431, "epoch": 2547} {"train_loss": -24.1389102935791, "global_step": 211432, "epoch": 2547} {"train_loss": -24.627195358276367, "global_step": 211433, "epoch": 2547} {"train_loss": -24.122577667236328, "global_step": 211434, "epoch": 2547} {"train_loss": -24.20237159729004, "global_step": 211435, "epoch": 2547} {"train_loss": -24.11833381652832, "global_step": 211436, "epoch": 2547} {"train_loss": -24.639652252197266, "global_step": 211437, "epoch": 2547} {"train_loss": -24.2833309173584, "global_step": 211438, "epoch": 2547} {"train_loss": -24.180225372314453, "global_step": 211439, "epoch": 2547} {"train_loss": -24.435100555419922, "global_step": 211440, "epoch": 2547} {"train_loss": -24.377290725708008, "global_step": 211441, "epoch": 2547} {"train_loss": -24.422460556030273, "global_step": 211442, "epoch": 2547} {"train_loss": -23.991758346557617, "global_step": 211443, "epoch": 2547} {"train_loss": -24.6568546295166, "global_step": 211444, "epoch": 2547} {"train_loss": -24.248197555541992, "global_step": 211445, "epoch": 2547} {"train_loss": -24.74907875061035, "global_step": 211446, "epoch": 2547} {"train_loss": -24.800128936767578, "global_step": 211447, "epoch": 2547} {"train_loss": -24.138086318969727, "global_step": 211448, "epoch": 2547} {"train_loss": -24.2244815826416, "global_step": 211449, "epoch": 2547} {"train_loss": -24.81474494934082, "global_step": 211450, "epoch": 2547} {"train_loss": -24.575529098510742, "global_step": 211451, "epoch": 2547} {"train_loss": -24.61945343017578, "global_step": 211452, "epoch": 2547} {"train_loss": -24.56925392150879, "global_step": 211453, "epoch": 2547} {"train_loss": -24.594724655151367, "global_step": 211454, "epoch": 2547} {"train_loss": -24.409770965576172, "global_step": 211455, "epoch": 2547} {"train_loss": -24.193082809448242, "global_step": 211456, "epoch": 2547} {"train_loss": -24.455171585083008, "global_step": 211457, "epoch": 2547} {"train_loss": -24.58993148803711, "global_step": 211458, "epoch": 2547} {"train_loss": -24.716529846191406, "global_step": 211459, "epoch": 2547} {"train_loss": -24.53191375732422, "global_step": 211460, "epoch": 2547} {"train_loss": -24.424488067626953, "global_step": 211461, "epoch": 2547} {"train_loss": -24.401269912719727, "global_step": 211462, "epoch": 2547} {"train_loss": -24.785825729370117, "global_step": 211463, "epoch": 2547} {"train_loss": -24.616474151611328, "global_step": 211464, "epoch": 2547} {"train_loss": -24.48204803466797, "global_step": 211465, "epoch": 2547} {"train_loss": -24.655248641967773, "global_step": 211466, "epoch": 2547} {"train_loss": -24.22028160095215, "global_step": 211467, "epoch": 2547} {"train_loss": -24.592605590820312, "global_step": 211468, "epoch": 2547} {"train_loss": -24.61603546142578, "global_step": 211469, "epoch": 2547} {"train_loss": -24.65262794494629, "global_step": 211470, "epoch": 2547} {"train_loss": -24.652978897094727, "global_step": 211471, "epoch": 2547} {"train_loss": -24.57051658630371, "global_step": 211472, "epoch": 2547} {"train_loss": -24.504247665405273, "global_step": 211473, "epoch": 2547} {"train_loss": -24.42555809020996, "global_step": 211474, "epoch": 2547} {"train_loss": -24.68989372253418, "global_step": 211475, "epoch": 2547} {"train_loss": -24.37574577331543, "global_step": 211476, "epoch": 2547} {"train_loss": -24.490459442138672, "global_step": 211477, "epoch": 2547} {"train_loss": -24.797733306884766, "global_step": 211478, "epoch": 2547} {"train_loss": -24.801830291748047, "global_step": 211479, "epoch": 2547} {"train_loss": -24.865497589111328, "global_step": 211480, "epoch": 2547} {"train_loss": -24.56418228149414, "global_step": 211481, "epoch": 2547} {"train_loss": -24.53568458557129, "global_step": 211482, "epoch": 2547} {"train_loss": -24.427294949451124, "global_step": 211483, "epoch": 2547, "val_loss": 6661018.0} {"train_loss": -24.262956619262695, "global_step": 211484, "epoch": 2548} {"train_loss": -23.620847702026367, "global_step": 211485, "epoch": 2548} {"train_loss": -24.500425338745117, "global_step": 211486, "epoch": 2548} {"train_loss": -23.881223678588867, "global_step": 211487, "epoch": 2548} {"train_loss": -23.852874755859375, "global_step": 211488, "epoch": 2548} {"train_loss": -23.618227005004883, "global_step": 211489, "epoch": 2548} {"train_loss": -23.519546508789062, "global_step": 211490, "epoch": 2548} {"train_loss": -24.039487838745117, "global_step": 211491, "epoch": 2548} {"train_loss": -24.039854049682617, "global_step": 211492, "epoch": 2548} {"train_loss": -24.432514190673828, "global_step": 211493, "epoch": 2548} {"train_loss": -24.050460815429688, "global_step": 211494, "epoch": 2548} {"train_loss": -24.140098571777344, "global_step": 211495, "epoch": 2548} {"train_loss": -24.133602142333984, "global_step": 211496, "epoch": 2548} {"train_loss": -24.26032066345215, "global_step": 211497, "epoch": 2548} {"train_loss": -24.492116928100586, "global_step": 211498, "epoch": 2548} {"train_loss": -24.263696670532227, "global_step": 211499, "epoch": 2548} {"train_loss": -24.46488380432129, "global_step": 211500, "epoch": 2548} {"train_loss": -24.123411178588867, "global_step": 211501, "epoch": 2548} {"train_loss": -24.602283477783203, "global_step": 211502, "epoch": 2548} {"train_loss": -24.034414291381836, "global_step": 211503, "epoch": 2548} {"train_loss": -24.21049690246582, "global_step": 211504, "epoch": 2548} {"train_loss": -24.231595993041992, "global_step": 211505, "epoch": 2548} {"train_loss": -24.614337921142578, "global_step": 211506, "epoch": 2548} {"train_loss": -24.580419540405273, "global_step": 211507, "epoch": 2548} {"train_loss": -24.08705711364746, "global_step": 211508, "epoch": 2548} {"train_loss": -24.4243106842041, "global_step": 211509, "epoch": 2548} {"train_loss": -24.372907638549805, "global_step": 211510, "epoch": 2548} {"train_loss": -24.6188907623291, "global_step": 211511, "epoch": 2548} {"train_loss": -24.285722732543945, "global_step": 211512, "epoch": 2548} {"train_loss": -24.280569076538086, "global_step": 211513, "epoch": 2548} {"train_loss": -24.262882232666016, "global_step": 211514, "epoch": 2548} {"train_loss": -24.698339462280273, "global_step": 211515, "epoch": 2548} {"train_loss": -24.683847427368164, "global_step": 211516, "epoch": 2548} {"train_loss": -24.55583381652832, "global_step": 211517, "epoch": 2548} {"train_loss": -24.595434188842773, "global_step": 211518, "epoch": 2548} {"train_loss": -24.341428756713867, "global_step": 211519, "epoch": 2548} {"train_loss": -24.733936309814453, "global_step": 211520, "epoch": 2548} {"train_loss": -24.6026668548584, "global_step": 211521, "epoch": 2548} {"train_loss": -24.42835807800293, "global_step": 211522, "epoch": 2548} {"train_loss": -24.485740661621094, "global_step": 211523, "epoch": 2548} {"train_loss": -24.37433433532715, "global_step": 211524, "epoch": 2548} {"train_loss": -24.69656753540039, "global_step": 211525, "epoch": 2548} {"train_loss": -24.797910690307617, "global_step": 211526, "epoch": 2548} {"train_loss": -24.310707092285156, "global_step": 211527, "epoch": 2548} {"train_loss": -24.985889434814453, "global_step": 211528, "epoch": 2548} {"train_loss": -24.988433837890625, "global_step": 211529, "epoch": 2548} {"train_loss": -24.562162399291992, "global_step": 211530, "epoch": 2548} {"train_loss": -24.42296600341797, "global_step": 211531, "epoch": 2548} {"train_loss": -24.65622329711914, "global_step": 211532, "epoch": 2548} {"train_loss": -24.45221519470215, "global_step": 211533, "epoch": 2548} {"train_loss": -24.27265739440918, "global_step": 211534, "epoch": 2548} {"train_loss": -24.73099708557129, "global_step": 211535, "epoch": 2548} {"train_loss": -24.745269775390625, "global_step": 211536, "epoch": 2548} {"train_loss": -24.579519271850586, "global_step": 211537, "epoch": 2548} {"train_loss": -25.197654724121094, "global_step": 211538, "epoch": 2548} {"train_loss": -24.969839096069336, "global_step": 211539, "epoch": 2548} {"train_loss": -24.191558837890625, "global_step": 211540, "epoch": 2548} {"train_loss": -24.585466384887695, "global_step": 211541, "epoch": 2548} {"train_loss": -24.2473087310791, "global_step": 211542, "epoch": 2548} {"train_loss": -23.966405868530273, "global_step": 211543, "epoch": 2548} {"train_loss": -24.78857421875, "global_step": 211544, "epoch": 2548} {"train_loss": -24.688745498657227, "global_step": 211545, "epoch": 2548} {"train_loss": -24.755706787109375, "global_step": 211546, "epoch": 2548} {"train_loss": -23.9549503326416, "global_step": 211547, "epoch": 2548} {"train_loss": -24.342926025390625, "global_step": 211548, "epoch": 2548} {"train_loss": -24.189970016479492, "global_step": 211549, "epoch": 2548} {"train_loss": -24.11604118347168, "global_step": 211550, "epoch": 2548} {"train_loss": -24.28741455078125, "global_step": 211551, "epoch": 2548} {"train_loss": -24.023733139038086, "global_step": 211552, "epoch": 2548} {"train_loss": -24.661279678344727, "global_step": 211553, "epoch": 2548} {"train_loss": -24.349855422973633, "global_step": 211554, "epoch": 2548} {"train_loss": -24.3435001373291, "global_step": 211555, "epoch": 2548} {"train_loss": -24.386348724365234, "global_step": 211556, "epoch": 2548} {"train_loss": -24.41850471496582, "global_step": 211557, "epoch": 2548} {"train_loss": -24.4372615814209, "global_step": 211558, "epoch": 2548} {"train_loss": -24.76263427734375, "global_step": 211559, "epoch": 2548} {"train_loss": -24.59441566467285, "global_step": 211560, "epoch": 2548} {"train_loss": -24.474040985107422, "global_step": 211561, "epoch": 2548} {"train_loss": -24.565441131591797, "global_step": 211562, "epoch": 2548} {"train_loss": -24.48049545288086, "global_step": 211563, "epoch": 2548} {"train_loss": -24.43306541442871, "global_step": 211564, "epoch": 2548} {"train_loss": -24.196880340576172, "global_step": 211565, "epoch": 2548} {"train_loss": -24.392795608704347, "global_step": 211566, "epoch": 2548, "val_loss": 6783054.0} {"train_loss": -24.364665985107422, "global_step": 211567, "epoch": 2549} {"train_loss": -24.090682983398438, "global_step": 211568, "epoch": 2549} {"train_loss": -24.013586044311523, "global_step": 211569, "epoch": 2549} {"train_loss": -23.87028694152832, "global_step": 211570, "epoch": 2549} {"train_loss": -24.13959503173828, "global_step": 211571, "epoch": 2549} {"train_loss": -24.19951820373535, "global_step": 211572, "epoch": 2549} {"train_loss": -24.51236343383789, "global_step": 211573, "epoch": 2549} {"train_loss": -24.214862823486328, "global_step": 211574, "epoch": 2549} {"train_loss": -24.086883544921875, "global_step": 211575, "epoch": 2549} {"train_loss": -23.959976196289062, "global_step": 211576, "epoch": 2549} {"train_loss": -24.62506103515625, "global_step": 211577, "epoch": 2549} {"train_loss": -24.302581787109375, "global_step": 211578, "epoch": 2549} {"train_loss": -24.17552947998047, "global_step": 211579, "epoch": 2549} {"train_loss": -24.030515670776367, "global_step": 211580, "epoch": 2549} {"train_loss": -24.424070358276367, "global_step": 211581, "epoch": 2549} {"train_loss": -24.358434677124023, "global_step": 211582, "epoch": 2549} {"train_loss": -24.27360725402832, "global_step": 211583, "epoch": 2549} {"train_loss": -24.583213806152344, "global_step": 211584, "epoch": 2549} {"train_loss": -24.652019500732422, "global_step": 211585, "epoch": 2549} {"train_loss": -24.183609008789062, "global_step": 211586, "epoch": 2549} {"train_loss": -24.25, "global_step": 211587, "epoch": 2549} {"train_loss": -24.33327865600586, "global_step": 211588, "epoch": 2549} {"train_loss": -24.626209259033203, "global_step": 211589, "epoch": 2549} {"train_loss": -24.555217742919922, "global_step": 211590, "epoch": 2549} {"train_loss": -24.030492782592773, "global_step": 211591, "epoch": 2549} {"train_loss": -24.64494514465332, "global_step": 211592, "epoch": 2549} {"train_loss": -24.368820190429688, "global_step": 211593, "epoch": 2549} {"train_loss": -24.355976104736328, "global_step": 211594, "epoch": 2549} {"train_loss": -24.799278259277344, "global_step": 211595, "epoch": 2549} {"train_loss": -23.91864585876465, "global_step": 211596, "epoch": 2549} {"train_loss": -24.34641456604004, "global_step": 211597, "epoch": 2549} {"train_loss": -24.37464714050293, "global_step": 211598, "epoch": 2549} {"train_loss": -24.350261688232422, "global_step": 211599, "epoch": 2549} {"train_loss": -24.72991943359375, "global_step": 211600, "epoch": 2549} {"train_loss": -24.798215866088867, "global_step": 211601, "epoch": 2549} {"train_loss": -24.204519271850586, "global_step": 211602, "epoch": 2549} {"train_loss": -24.419645309448242, "global_step": 211603, "epoch": 2549} {"train_loss": -24.444753646850586, "global_step": 211604, "epoch": 2549} {"train_loss": -24.607877731323242, "global_step": 211605, "epoch": 2549} {"train_loss": -24.713834762573242, "global_step": 211606, "epoch": 2549} {"train_loss": -24.73124122619629, "global_step": 211607, "epoch": 2549} {"train_loss": -24.596118927001953, "global_step": 211608, "epoch": 2549} {"train_loss": -24.74883460998535, "global_step": 211609, "epoch": 2549} {"train_loss": -24.318851470947266, "global_step": 211610, "epoch": 2549} {"train_loss": -24.58608055114746, "global_step": 211611, "epoch": 2549} {"train_loss": -24.381467819213867, "global_step": 211612, "epoch": 2549} {"train_loss": -24.263517379760742, "global_step": 211613, "epoch": 2549} {"train_loss": -24.712488174438477, "global_step": 211614, "epoch": 2549} {"train_loss": -24.35914421081543, "global_step": 211615, "epoch": 2549} {"train_loss": -24.713308334350586, "global_step": 211616, "epoch": 2549} {"train_loss": -24.78217887878418, "global_step": 211617, "epoch": 2549} {"train_loss": -24.545141220092773, "global_step": 211618, "epoch": 2549} {"train_loss": -24.754003524780273, "global_step": 211619, "epoch": 2549} {"train_loss": -24.335712432861328, "global_step": 211620, "epoch": 2549} {"train_loss": -24.43332290649414, "global_step": 211621, "epoch": 2549} {"train_loss": -24.748273849487305, "global_step": 211622, "epoch": 2549} {"train_loss": -24.352048873901367, "global_step": 211623, "epoch": 2549} {"train_loss": -24.52728843688965, "global_step": 211624, "epoch": 2549} {"train_loss": -24.262205123901367, "global_step": 211625, "epoch": 2549} {"train_loss": -24.93634605407715, "global_step": 211626, "epoch": 2549} {"train_loss": -24.568592071533203, "global_step": 211627, "epoch": 2549} {"train_loss": -24.55301856994629, "global_step": 211628, "epoch": 2549} {"train_loss": -24.431060791015625, "global_step": 211629, "epoch": 2549} {"train_loss": -24.364734649658203, "global_step": 211630, "epoch": 2549} {"train_loss": -24.32847023010254, "global_step": 211631, "epoch": 2549} {"train_loss": -24.60808753967285, "global_step": 211632, "epoch": 2549} {"train_loss": -24.58768653869629, "global_step": 211633, "epoch": 2549} {"train_loss": -24.580524444580078, "global_step": 211634, "epoch": 2549} {"train_loss": -24.453283309936523, "global_step": 211635, "epoch": 2549} {"train_loss": -24.525524139404297, "global_step": 211636, "epoch": 2549} {"train_loss": -24.61910057067871, "global_step": 211637, "epoch": 2549} {"train_loss": -24.070453643798828, "global_step": 211638, "epoch": 2549} {"train_loss": -24.606077194213867, "global_step": 211639, "epoch": 2549} {"train_loss": -24.504451751708984, "global_step": 211640, "epoch": 2549} {"train_loss": -24.174264907836914, "global_step": 211641, "epoch": 2549} {"train_loss": -24.03696060180664, "global_step": 211642, "epoch": 2549} {"train_loss": -24.426755905151367, "global_step": 211643, "epoch": 2549} {"train_loss": -24.220457077026367, "global_step": 211644, "epoch": 2549} {"train_loss": -24.545480728149414, "global_step": 211645, "epoch": 2549} {"train_loss": -24.69489860534668, "global_step": 211646, "epoch": 2549} {"train_loss": -24.48262596130371, "global_step": 211647, "epoch": 2549} {"train_loss": -24.179441452026367, "global_step": 211648, "epoch": 2549} {"train_loss": -24.43602679149214, "global_step": 211649, "epoch": 2549, "val_loss": 6541565.0} {"train_loss": -23.81549835205078, "global_step": 211650, "epoch": 2550} {"train_loss": -23.609867095947266, "global_step": 211651, "epoch": 2550} {"train_loss": -23.826147079467773, "global_step": 211652, "epoch": 2550} {"train_loss": -23.65268898010254, "global_step": 211653, "epoch": 2550} {"train_loss": -23.575275421142578, "global_step": 211654, "epoch": 2550} {"train_loss": -23.93316650390625, "global_step": 211655, "epoch": 2550} {"train_loss": -23.45248794555664, "global_step": 211656, "epoch": 2550} {"train_loss": -24.03230094909668, "global_step": 211657, "epoch": 2550} {"train_loss": -23.72914695739746, "global_step": 211658, "epoch": 2550} {"train_loss": -24.213985443115234, "global_step": 211659, "epoch": 2550} {"train_loss": -24.353164672851562, "global_step": 211660, "epoch": 2550} {"train_loss": -24.114948272705078, "global_step": 211661, "epoch": 2550} {"train_loss": -24.38223648071289, "global_step": 211662, "epoch": 2550} {"train_loss": -24.02705955505371, "global_step": 211663, "epoch": 2550} {"train_loss": -24.012903213500977, "global_step": 211664, "epoch": 2550} {"train_loss": -24.019119262695312, "global_step": 211665, "epoch": 2550} {"train_loss": -24.279943466186523, "global_step": 211666, "epoch": 2550} {"train_loss": -24.006072998046875, "global_step": 211667, "epoch": 2550} {"train_loss": -23.791776657104492, "global_step": 211668, "epoch": 2550} {"train_loss": -24.218910217285156, "global_step": 211669, "epoch": 2550} {"train_loss": -24.258731842041016, "global_step": 211670, "epoch": 2550} {"train_loss": -24.15049171447754, "global_step": 211671, "epoch": 2550} {"train_loss": -24.1889705657959, "global_step": 211672, "epoch": 2550} {"train_loss": -23.95711326599121, "global_step": 211673, "epoch": 2550} {"train_loss": -23.95237159729004, "global_step": 211674, "epoch": 2550} {"train_loss": -24.30289649963379, "global_step": 211675, "epoch": 2550} {"train_loss": -23.999845504760742, "global_step": 211676, "epoch": 2550} {"train_loss": -24.483827590942383, "global_step": 211677, "epoch": 2550} {"train_loss": -24.354412078857422, "global_step": 211678, "epoch": 2550} {"train_loss": -24.353866577148438, "global_step": 211679, "epoch": 2550} {"train_loss": -24.369070053100586, "global_step": 211680, "epoch": 2550} {"train_loss": -24.269250869750977, "global_step": 211681, "epoch": 2550} {"train_loss": -24.546554565429688, "global_step": 211682, "epoch": 2550} {"train_loss": -24.14691734313965, "global_step": 211683, "epoch": 2550} {"train_loss": -24.584300994873047, "global_step": 211684, "epoch": 2550} {"train_loss": -24.48982810974121, "global_step": 211685, "epoch": 2550} {"train_loss": -24.57562828063965, "global_step": 211686, "epoch": 2550} {"train_loss": -24.717187881469727, "global_step": 211687, "epoch": 2550} {"train_loss": -24.835159301757812, "global_step": 211688, "epoch": 2550} {"train_loss": -24.33365821838379, "global_step": 211689, "epoch": 2550} {"train_loss": -24.659399032592773, "global_step": 211690, "epoch": 2550} {"train_loss": -24.50893211364746, "global_step": 211691, "epoch": 2550} {"train_loss": -24.60114860534668, "global_step": 211692, "epoch": 2550} {"train_loss": -24.16100311279297, "global_step": 211693, "epoch": 2550} {"train_loss": -24.529661178588867, "global_step": 211694, "epoch": 2550} {"train_loss": -24.550825119018555, "global_step": 211695, "epoch": 2550} {"train_loss": -24.672504425048828, "global_step": 211696, "epoch": 2550} {"train_loss": -24.80377960205078, "global_step": 211697, "epoch": 2550} {"train_loss": -24.689697265625, "global_step": 211698, "epoch": 2550} {"train_loss": -24.337671279907227, "global_step": 211699, "epoch": 2550} {"train_loss": -24.436845779418945, "global_step": 211700, "epoch": 2550} {"train_loss": -24.327472686767578, "global_step": 211701, "epoch": 2550} {"train_loss": -24.114152908325195, "global_step": 211702, "epoch": 2550} {"train_loss": -24.591718673706055, "global_step": 211703, "epoch": 2550} {"train_loss": -24.234832763671875, "global_step": 211704, "epoch": 2550} {"train_loss": -24.300830841064453, "global_step": 211705, "epoch": 2550} {"train_loss": -24.64100456237793, "global_step": 211706, "epoch": 2550} {"train_loss": -24.724008560180664, "global_step": 211707, "epoch": 2550} {"train_loss": -24.1133975982666, "global_step": 211708, "epoch": 2550} {"train_loss": -24.823034286499023, "global_step": 211709, "epoch": 2550} {"train_loss": -24.11794090270996, "global_step": 211710, "epoch": 2550} {"train_loss": -24.344125747680664, "global_step": 211711, "epoch": 2550} {"train_loss": -24.33632469177246, "global_step": 211712, "epoch": 2550} {"train_loss": -24.471500396728516, "global_step": 211713, "epoch": 2550} {"train_loss": -24.014869689941406, "global_step": 211714, "epoch": 2550} {"train_loss": -24.507217407226562, "global_step": 211715, "epoch": 2550} {"train_loss": -24.120487213134766, "global_step": 211716, "epoch": 2550} {"train_loss": -24.506324768066406, "global_step": 211717, "epoch": 2550} {"train_loss": -24.600492477416992, "global_step": 211718, "epoch": 2550} {"train_loss": -24.012619018554688, "global_step": 211719, "epoch": 2550} {"train_loss": -24.604839324951172, "global_step": 211720, "epoch": 2550} {"train_loss": -24.209779739379883, "global_step": 211721, "epoch": 2550} {"train_loss": -24.175106048583984, "global_step": 211722, "epoch": 2550} {"train_loss": -24.426904678344727, "global_step": 211723, "epoch": 2550} {"train_loss": -24.638246536254883, "global_step": 211724, "epoch": 2550} {"train_loss": -24.77809715270996, "global_step": 211725, "epoch": 2550} {"train_loss": -24.194067001342773, "global_step": 211726, "epoch": 2550} {"train_loss": -24.248809814453125, "global_step": 211727, "epoch": 2550} {"train_loss": -24.480201721191406, "global_step": 211728, "epoch": 2550} {"train_loss": -24.32720375061035, "global_step": 211729, "epoch": 2550} {"train_loss": -24.275114059448242, "global_step": 211730, "epoch": 2550} {"train_loss": -24.265165328979492, "global_step": 211731, "epoch": 2550} {"train_loss": -24.3056216642081, "global_step": 211732, "epoch": 2550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6697371.0} {"train_loss": -24.00187110900879, "global_step": 211733, "epoch": 2551} {"train_loss": -23.74469566345215, "global_step": 211734, "epoch": 2551} {"train_loss": -23.825767517089844, "global_step": 211735, "epoch": 2551} {"train_loss": -24.18476676940918, "global_step": 211736, "epoch": 2551} {"train_loss": -23.689319610595703, "global_step": 211737, "epoch": 2551} {"train_loss": -23.969919204711914, "global_step": 211738, "epoch": 2551} {"train_loss": -24.242385864257812, "global_step": 211739, "epoch": 2551} {"train_loss": -24.173538208007812, "global_step": 211740, "epoch": 2551} {"train_loss": -24.219482421875, "global_step": 211741, "epoch": 2551} {"train_loss": -24.380273818969727, "global_step": 211742, "epoch": 2551} {"train_loss": -24.221837997436523, "global_step": 211743, "epoch": 2551} {"train_loss": -24.128646850585938, "global_step": 211744, "epoch": 2551} {"train_loss": -24.32279396057129, "global_step": 211745, "epoch": 2551} {"train_loss": -24.218700408935547, "global_step": 211746, "epoch": 2551} {"train_loss": -24.190364837646484, "global_step": 211747, "epoch": 2551} {"train_loss": -24.39176368713379, "global_step": 211748, "epoch": 2551} {"train_loss": -24.609943389892578, "global_step": 211749, "epoch": 2551} {"train_loss": -24.597675323486328, "global_step": 211750, "epoch": 2551} {"train_loss": -24.302753448486328, "global_step": 211751, "epoch": 2551} {"train_loss": -24.31884765625, "global_step": 211752, "epoch": 2551} {"train_loss": -24.332012176513672, "global_step": 211753, "epoch": 2551} {"train_loss": -24.965349197387695, "global_step": 211754, "epoch": 2551} {"train_loss": -24.336456298828125, "global_step": 211755, "epoch": 2551} {"train_loss": -24.62757682800293, "global_step": 211756, "epoch": 2551} {"train_loss": -24.526212692260742, "global_step": 211757, "epoch": 2551} {"train_loss": -24.518341064453125, "global_step": 211758, "epoch": 2551} {"train_loss": -24.19742774963379, "global_step": 211759, "epoch": 2551} {"train_loss": -24.17409324645996, "global_step": 211760, "epoch": 2551} {"train_loss": -24.216510772705078, "global_step": 211761, "epoch": 2551} {"train_loss": -24.354114532470703, "global_step": 211762, "epoch": 2551} {"train_loss": -24.50773048400879, "global_step": 211763, "epoch": 2551} {"train_loss": -24.282638549804688, "global_step": 211764, "epoch": 2551} {"train_loss": -24.61769676208496, "global_step": 211765, "epoch": 2551} {"train_loss": -24.331098556518555, "global_step": 211766, "epoch": 2551} {"train_loss": -24.430294036865234, "global_step": 211767, "epoch": 2551} {"train_loss": -24.48052978515625, "global_step": 211768, "epoch": 2551} {"train_loss": -24.426401138305664, "global_step": 211769, "epoch": 2551} {"train_loss": -24.49980926513672, "global_step": 211770, "epoch": 2551} {"train_loss": -24.538101196289062, "global_step": 211771, "epoch": 2551} {"train_loss": -24.53090476989746, "global_step": 211772, "epoch": 2551} {"train_loss": -24.572134017944336, "global_step": 211773, "epoch": 2551} {"train_loss": -24.395092010498047, "global_step": 211774, "epoch": 2551} {"train_loss": -24.361783981323242, "global_step": 211775, "epoch": 2551} {"train_loss": -24.531278610229492, "global_step": 211776, "epoch": 2551} {"train_loss": -24.58685874938965, "global_step": 211777, "epoch": 2551} {"train_loss": -24.392772674560547, "global_step": 211778, "epoch": 2551} {"train_loss": -24.639495849609375, "global_step": 211779, "epoch": 2551} {"train_loss": -24.130199432373047, "global_step": 211780, "epoch": 2551} {"train_loss": -24.414875030517578, "global_step": 211781, "epoch": 2551} {"train_loss": -24.474462509155273, "global_step": 211782, "epoch": 2551} {"train_loss": -24.510801315307617, "global_step": 211783, "epoch": 2551} {"train_loss": -24.25118064880371, "global_step": 211784, "epoch": 2551} {"train_loss": -24.9658145904541, "global_step": 211785, "epoch": 2551} {"train_loss": -24.735990524291992, "global_step": 211786, "epoch": 2551} {"train_loss": -24.421560287475586, "global_step": 211787, "epoch": 2551} {"train_loss": -24.465118408203125, "global_step": 211788, "epoch": 2551} {"train_loss": -24.824548721313477, "global_step": 211789, "epoch": 2551} {"train_loss": -24.325820922851562, "global_step": 211790, "epoch": 2551} {"train_loss": -24.38633155822754, "global_step": 211791, "epoch": 2551} {"train_loss": -24.442413330078125, "global_step": 211792, "epoch": 2551} {"train_loss": -24.191680908203125, "global_step": 211793, "epoch": 2551} {"train_loss": -24.37918472290039, "global_step": 211794, "epoch": 2551} {"train_loss": -24.530193328857422, "global_step": 211795, "epoch": 2551} {"train_loss": -24.842182159423828, "global_step": 211796, "epoch": 2551} {"train_loss": -24.41832160949707, "global_step": 211797, "epoch": 2551} {"train_loss": -24.44228172302246, "global_step": 211798, "epoch": 2551} {"train_loss": -24.3543701171875, "global_step": 211799, "epoch": 2551} {"train_loss": -24.03481101989746, "global_step": 211800, "epoch": 2551} {"train_loss": -24.690332412719727, "global_step": 211801, "epoch": 2551} {"train_loss": -24.410993576049805, "global_step": 211802, "epoch": 2551} {"train_loss": -24.207571029663086, "global_step": 211803, "epoch": 2551} {"train_loss": -24.1600284576416, "global_step": 211804, "epoch": 2551} {"train_loss": -24.587995529174805, "global_step": 211805, "epoch": 2551} {"train_loss": -24.83108139038086, "global_step": 211806, "epoch": 2551} {"train_loss": -24.24761962890625, "global_step": 211807, "epoch": 2551} {"train_loss": -24.416519165039062, "global_step": 211808, "epoch": 2551} {"train_loss": -24.16851043701172, "global_step": 211809, "epoch": 2551} {"train_loss": -24.362125396728516, "global_step": 211810, "epoch": 2551} {"train_loss": -24.390087127685547, "global_step": 211811, "epoch": 2551} {"train_loss": -24.013416290283203, "global_step": 211812, "epoch": 2551} {"train_loss": -24.115413665771484, "global_step": 211813, "epoch": 2551} {"train_loss": -24.145353317260742, "global_step": 211814, "epoch": 2551} {"train_loss": -24.365955237882684, "global_step": 211815, "epoch": 2551, "val_loss": 6763019.5} {"train_loss": -24.32366943359375, "global_step": 211816, "epoch": 2552} {"train_loss": -24.103153228759766, "global_step": 211817, "epoch": 2552} {"train_loss": -24.03514862060547, "global_step": 211818, "epoch": 2552} {"train_loss": -24.34113883972168, "global_step": 211819, "epoch": 2552} {"train_loss": -23.774761199951172, "global_step": 211820, "epoch": 2552} {"train_loss": -24.223587036132812, "global_step": 211821, "epoch": 2552} {"train_loss": -24.126739501953125, "global_step": 211822, "epoch": 2552} {"train_loss": -24.297645568847656, "global_step": 211823, "epoch": 2552} {"train_loss": -24.306989669799805, "global_step": 211824, "epoch": 2552} {"train_loss": -24.609119415283203, "global_step": 211825, "epoch": 2552} {"train_loss": -24.57679557800293, "global_step": 211826, "epoch": 2552} {"train_loss": -24.28835105895996, "global_step": 211827, "epoch": 2552} {"train_loss": -24.330224990844727, "global_step": 211828, "epoch": 2552} {"train_loss": -24.567960739135742, "global_step": 211829, "epoch": 2552} {"train_loss": -24.746152877807617, "global_step": 211830, "epoch": 2552} {"train_loss": -24.646467208862305, "global_step": 211831, "epoch": 2552} {"train_loss": -24.131025314331055, "global_step": 211832, "epoch": 2552} {"train_loss": -24.4482479095459, "global_step": 211833, "epoch": 2552} {"train_loss": -24.49403190612793, "global_step": 211834, "epoch": 2552} {"train_loss": -24.287094116210938, "global_step": 211835, "epoch": 2552} {"train_loss": -24.248422622680664, "global_step": 211836, "epoch": 2552} {"train_loss": -24.236230850219727, "global_step": 211837, "epoch": 2552} {"train_loss": -24.462858200073242, "global_step": 211838, "epoch": 2552} {"train_loss": -24.400049209594727, "global_step": 211839, "epoch": 2552} {"train_loss": -24.150978088378906, "global_step": 211840, "epoch": 2552} {"train_loss": -24.69756317138672, "global_step": 211841, "epoch": 2552} {"train_loss": -24.517078399658203, "global_step": 211842, "epoch": 2552} {"train_loss": -24.6799259185791, "global_step": 211843, "epoch": 2552} {"train_loss": -24.227102279663086, "global_step": 211844, "epoch": 2552} {"train_loss": -24.8075008392334, "global_step": 211845, "epoch": 2552} {"train_loss": -24.555618286132812, "global_step": 211846, "epoch": 2552} {"train_loss": -24.496519088745117, "global_step": 211847, "epoch": 2552} {"train_loss": -24.21746253967285, "global_step": 211848, "epoch": 2552} {"train_loss": -24.012887954711914, "global_step": 211849, "epoch": 2552} {"train_loss": -24.44161033630371, "global_step": 211850, "epoch": 2552} {"train_loss": -24.45536231994629, "global_step": 211851, "epoch": 2552} {"train_loss": -24.35480308532715, "global_step": 211852, "epoch": 2552} {"train_loss": -24.415632247924805, "global_step": 211853, "epoch": 2552} {"train_loss": -24.598526000976562, "global_step": 211854, "epoch": 2552} {"train_loss": -24.501455307006836, "global_step": 211855, "epoch": 2552} {"train_loss": -24.641326904296875, "global_step": 211856, "epoch": 2552} {"train_loss": -24.390872955322266, "global_step": 211857, "epoch": 2552} {"train_loss": -24.480350494384766, "global_step": 211858, "epoch": 2552} {"train_loss": -24.39558982849121, "global_step": 211859, "epoch": 2552} {"train_loss": -24.337970733642578, "global_step": 211860, "epoch": 2552} {"train_loss": -24.554080963134766, "global_step": 211861, "epoch": 2552} {"train_loss": -24.357572555541992, "global_step": 211862, "epoch": 2552} {"train_loss": -24.618276596069336, "global_step": 211863, "epoch": 2552} {"train_loss": -24.605037689208984, "global_step": 211864, "epoch": 2552} {"train_loss": -24.207700729370117, "global_step": 211865, "epoch": 2552} {"train_loss": -24.592321395874023, "global_step": 211866, "epoch": 2552} {"train_loss": -24.374940872192383, "global_step": 211867, "epoch": 2552} {"train_loss": -23.95934295654297, "global_step": 211868, "epoch": 2552} {"train_loss": -24.315710067749023, "global_step": 211869, "epoch": 2552} {"train_loss": -24.278223037719727, "global_step": 211870, "epoch": 2552} {"train_loss": -24.014739990234375, "global_step": 211871, "epoch": 2552} {"train_loss": -24.75679588317871, "global_step": 211872, "epoch": 2552} {"train_loss": -24.434186935424805, "global_step": 211873, "epoch": 2552} {"train_loss": -24.13730239868164, "global_step": 211874, "epoch": 2552} {"train_loss": -24.559417724609375, "global_step": 211875, "epoch": 2552} {"train_loss": -25.010732650756836, "global_step": 211876, "epoch": 2552} {"train_loss": -24.300485610961914, "global_step": 211877, "epoch": 2552} {"train_loss": -24.047754287719727, "global_step": 211878, "epoch": 2552} {"train_loss": -24.759023666381836, "global_step": 211879, "epoch": 2552} {"train_loss": -24.53580093383789, "global_step": 211880, "epoch": 2552} {"train_loss": -23.895341873168945, "global_step": 211881, "epoch": 2552} {"train_loss": -24.305208206176758, "global_step": 211882, "epoch": 2552} {"train_loss": -24.757932662963867, "global_step": 211883, "epoch": 2552} {"train_loss": -24.879209518432617, "global_step": 211884, "epoch": 2552} {"train_loss": -24.36033058166504, "global_step": 211885, "epoch": 2552} {"train_loss": -24.29469871520996, "global_step": 211886, "epoch": 2552} {"train_loss": -24.553159713745117, "global_step": 211887, "epoch": 2552} {"train_loss": -23.971378326416016, "global_step": 211888, "epoch": 2552} {"train_loss": -24.161048889160156, "global_step": 211889, "epoch": 2552} {"train_loss": -24.487930297851562, "global_step": 211890, "epoch": 2552} {"train_loss": -24.926183700561523, "global_step": 211891, "epoch": 2552} {"train_loss": -24.263898849487305, "global_step": 211892, "epoch": 2552} {"train_loss": -24.301546096801758, "global_step": 211893, "epoch": 2552} {"train_loss": -24.720300674438477, "global_step": 211894, "epoch": 2552} {"train_loss": -24.452653884887695, "global_step": 211895, "epoch": 2552} {"train_loss": -24.750125885009766, "global_step": 211896, "epoch": 2552} {"train_loss": -24.219594955444336, "global_step": 211897, "epoch": 2552} {"train_loss": -24.41357856198966, "global_step": 211898, "epoch": 2552, "val_loss": 6623227.0} {"train_loss": -23.762664794921875, "global_step": 211899, "epoch": 2553} {"train_loss": -24.024648666381836, "global_step": 211900, "epoch": 2553} {"train_loss": -23.555904388427734, "global_step": 211901, "epoch": 2553} {"train_loss": -24.154773712158203, "global_step": 211902, "epoch": 2553} {"train_loss": -23.88691520690918, "global_step": 211903, "epoch": 2553} {"train_loss": -23.79237174987793, "global_step": 211904, "epoch": 2553} {"train_loss": -23.724414825439453, "global_step": 211905, "epoch": 2553} {"train_loss": -24.154356002807617, "global_step": 211906, "epoch": 2553} {"train_loss": -23.467004776000977, "global_step": 211907, "epoch": 2553} {"train_loss": -24.41263771057129, "global_step": 211908, "epoch": 2553} {"train_loss": -24.215068817138672, "global_step": 211909, "epoch": 2553} {"train_loss": -23.979354858398438, "global_step": 211910, "epoch": 2553} {"train_loss": -24.22890281677246, "global_step": 211911, "epoch": 2553} {"train_loss": -23.968669891357422, "global_step": 211912, "epoch": 2553} {"train_loss": -24.202123641967773, "global_step": 211913, "epoch": 2553} {"train_loss": -23.922239303588867, "global_step": 211914, "epoch": 2553} {"train_loss": -24.019367218017578, "global_step": 211915, "epoch": 2553} {"train_loss": -24.130090713500977, "global_step": 211916, "epoch": 2553} {"train_loss": -24.194774627685547, "global_step": 211917, "epoch": 2553} {"train_loss": -24.367399215698242, "global_step": 211918, "epoch": 2553} {"train_loss": -24.498769760131836, "global_step": 211919, "epoch": 2553} {"train_loss": -24.913122177124023, "global_step": 211920, "epoch": 2553} {"train_loss": -24.214628219604492, "global_step": 211921, "epoch": 2553} {"train_loss": -24.271207809448242, "global_step": 211922, "epoch": 2553} {"train_loss": -24.40007781982422, "global_step": 211923, "epoch": 2553} {"train_loss": -24.15683364868164, "global_step": 211924, "epoch": 2553} {"train_loss": -24.296998977661133, "global_step": 211925, "epoch": 2553} {"train_loss": -24.510311126708984, "global_step": 211926, "epoch": 2553} {"train_loss": -24.520795822143555, "global_step": 211927, "epoch": 2553} {"train_loss": -24.429685592651367, "global_step": 211928, "epoch": 2553} {"train_loss": -24.656728744506836, "global_step": 211929, "epoch": 2553} {"train_loss": -24.54486846923828, "global_step": 211930, "epoch": 2553} {"train_loss": -24.417224884033203, "global_step": 211931, "epoch": 2553} {"train_loss": -24.172849655151367, "global_step": 211932, "epoch": 2553} {"train_loss": -24.416751861572266, "global_step": 211933, "epoch": 2553} {"train_loss": -24.66779136657715, "global_step": 211934, "epoch": 2553} {"train_loss": -24.43726921081543, "global_step": 211935, "epoch": 2553} {"train_loss": -24.377342224121094, "global_step": 211936, "epoch": 2553} {"train_loss": -24.7080135345459, "global_step": 211937, "epoch": 2553} {"train_loss": -24.465787887573242, "global_step": 211938, "epoch": 2553} {"train_loss": -24.484079360961914, "global_step": 211939, "epoch": 2553} {"train_loss": -24.289108276367188, "global_step": 211940, "epoch": 2553} {"train_loss": -24.718490600585938, "global_step": 211941, "epoch": 2553} {"train_loss": -24.56982421875, "global_step": 211942, "epoch": 2553} {"train_loss": -24.342504501342773, "global_step": 211943, "epoch": 2553} {"train_loss": -23.962543487548828, "global_step": 211944, "epoch": 2553} {"train_loss": -24.458011627197266, "global_step": 211945, "epoch": 2553} {"train_loss": -24.483896255493164, "global_step": 211946, "epoch": 2553} {"train_loss": -24.51236915588379, "global_step": 211947, "epoch": 2553} {"train_loss": -24.870664596557617, "global_step": 211948, "epoch": 2553} {"train_loss": -24.3962459564209, "global_step": 211949, "epoch": 2553} {"train_loss": -24.482934951782227, "global_step": 211950, "epoch": 2553} {"train_loss": -24.665708541870117, "global_step": 211951, "epoch": 2553} {"train_loss": -24.887619018554688, "global_step": 211952, "epoch": 2553} {"train_loss": -24.391454696655273, "global_step": 211953, "epoch": 2553} {"train_loss": -24.63422966003418, "global_step": 211954, "epoch": 2553} {"train_loss": -24.5620174407959, "global_step": 211955, "epoch": 2553} {"train_loss": -24.324186325073242, "global_step": 211956, "epoch": 2553} {"train_loss": -24.117353439331055, "global_step": 211957, "epoch": 2553} {"train_loss": -24.538305282592773, "global_step": 211958, "epoch": 2553} {"train_loss": -24.47205352783203, "global_step": 211959, "epoch": 2553} {"train_loss": -24.518360137939453, "global_step": 211960, "epoch": 2553} {"train_loss": -24.321897506713867, "global_step": 211961, "epoch": 2553} {"train_loss": -24.058502197265625, "global_step": 211962, "epoch": 2553} {"train_loss": -24.597681045532227, "global_step": 211963, "epoch": 2553} {"train_loss": -24.394426345825195, "global_step": 211964, "epoch": 2553} {"train_loss": -24.60696792602539, "global_step": 211965, "epoch": 2553} {"train_loss": -24.390872955322266, "global_step": 211966, "epoch": 2553} {"train_loss": -24.29087257385254, "global_step": 211967, "epoch": 2553} {"train_loss": -24.59779167175293, "global_step": 211968, "epoch": 2553} {"train_loss": -24.326770782470703, "global_step": 211969, "epoch": 2553} {"train_loss": -24.613636016845703, "global_step": 211970, "epoch": 2553} {"train_loss": -24.43602180480957, "global_step": 211971, "epoch": 2553} {"train_loss": -24.59832763671875, "global_step": 211972, "epoch": 2553} {"train_loss": -24.246585845947266, "global_step": 211973, "epoch": 2553} {"train_loss": -24.631412506103516, "global_step": 211974, "epoch": 2553} {"train_loss": -24.619327545166016, "global_step": 211975, "epoch": 2553} {"train_loss": -24.57088279724121, "global_step": 211976, "epoch": 2553} {"train_loss": -24.38519859313965, "global_step": 211977, "epoch": 2553} {"train_loss": -24.293624877929688, "global_step": 211978, "epoch": 2553} {"train_loss": -24.543935775756836, "global_step": 211979, "epoch": 2553} {"train_loss": -24.48622703552246, "global_step": 211980, "epoch": 2553} {"train_loss": -24.38227124961026, "global_step": 211981, "epoch": 2553, "val_loss": 6676699.0} {"train_loss": -22.958114624023438, "global_step": 211982, "epoch": 2554} {"train_loss": -23.302316665649414, "global_step": 211983, "epoch": 2554} {"train_loss": -22.735748291015625, "global_step": 211984, "epoch": 2554} {"train_loss": -23.562597274780273, "global_step": 211985, "epoch": 2554} {"train_loss": -23.171018600463867, "global_step": 211986, "epoch": 2554} {"train_loss": -23.448469161987305, "global_step": 211987, "epoch": 2554} {"train_loss": -23.057483673095703, "global_step": 211988, "epoch": 2554} {"train_loss": -23.60520362854004, "global_step": 211989, "epoch": 2554} {"train_loss": -23.291227340698242, "global_step": 211990, "epoch": 2554} {"train_loss": -23.796772003173828, "global_step": 211991, "epoch": 2554} {"train_loss": -23.592695236206055, "global_step": 211992, "epoch": 2554} {"train_loss": -23.604450225830078, "global_step": 211993, "epoch": 2554} {"train_loss": -23.72437286376953, "global_step": 211994, "epoch": 2554} {"train_loss": -24.00650978088379, "global_step": 211995, "epoch": 2554} {"train_loss": -24.17583656311035, "global_step": 211996, "epoch": 2554} {"train_loss": -23.895263671875, "global_step": 211997, "epoch": 2554} {"train_loss": -23.698867797851562, "global_step": 211998, "epoch": 2554} {"train_loss": -24.04374122619629, "global_step": 211999, "epoch": 2554} {"train_loss": -23.837736129760742, "global_step": 212000, "epoch": 2554} {"train_loss": -23.930538177490234, "global_step": 212001, "epoch": 2554} {"train_loss": -24.0664119720459, "global_step": 212002, "epoch": 2554} {"train_loss": -24.065176010131836, "global_step": 212003, "epoch": 2554} {"train_loss": -24.304136276245117, "global_step": 212004, "epoch": 2554} {"train_loss": -23.82792091369629, "global_step": 212005, "epoch": 2554} {"train_loss": -24.25201988220215, "global_step": 212006, "epoch": 2554} {"train_loss": -24.12641716003418, "global_step": 212007, "epoch": 2554} {"train_loss": -24.021928787231445, "global_step": 212008, "epoch": 2554} {"train_loss": -24.20962905883789, "global_step": 212009, "epoch": 2554} {"train_loss": -24.271142959594727, "global_step": 212010, "epoch": 2554} {"train_loss": -24.41922378540039, "global_step": 212011, "epoch": 2554} {"train_loss": -24.524959564208984, "global_step": 212012, "epoch": 2554} {"train_loss": -24.375272750854492, "global_step": 212013, "epoch": 2554} {"train_loss": -24.378644943237305, "global_step": 212014, "epoch": 2554} {"train_loss": -24.592208862304688, "global_step": 212015, "epoch": 2554} {"train_loss": -24.216094970703125, "global_step": 212016, "epoch": 2554} {"train_loss": -24.275480270385742, "global_step": 212017, "epoch": 2554} {"train_loss": -24.5900821685791, "global_step": 212018, "epoch": 2554} {"train_loss": -24.50325584411621, "global_step": 212019, "epoch": 2554} {"train_loss": -24.609540939331055, "global_step": 212020, "epoch": 2554} {"train_loss": -24.199542999267578, "global_step": 212021, "epoch": 2554} {"train_loss": -24.513397216796875, "global_step": 212022, "epoch": 2554} {"train_loss": -24.548418045043945, "global_step": 212023, "epoch": 2554} {"train_loss": -24.58963966369629, "global_step": 212024, "epoch": 2554} {"train_loss": -24.507152557373047, "global_step": 212025, "epoch": 2554} {"train_loss": -24.303804397583008, "global_step": 212026, "epoch": 2554} {"train_loss": -24.19436264038086, "global_step": 212027, "epoch": 2554} {"train_loss": -24.77437400817871, "global_step": 212028, "epoch": 2554} {"train_loss": -24.82828712463379, "global_step": 212029, "epoch": 2554} {"train_loss": -24.50043296813965, "global_step": 212030, "epoch": 2554} {"train_loss": -24.38648796081543, "global_step": 212031, "epoch": 2554} {"train_loss": -24.606653213500977, "global_step": 212032, "epoch": 2554} {"train_loss": -24.5626277923584, "global_step": 212033, "epoch": 2554} {"train_loss": -24.60316276550293, "global_step": 212034, "epoch": 2554} {"train_loss": -24.551773071289062, "global_step": 212035, "epoch": 2554} {"train_loss": -24.766489028930664, "global_step": 212036, "epoch": 2554} {"train_loss": -24.57590675354004, "global_step": 212037, "epoch": 2554} {"train_loss": -24.49738121032715, "global_step": 212038, "epoch": 2554} {"train_loss": -24.346057891845703, "global_step": 212039, "epoch": 2554} {"train_loss": -24.272825241088867, "global_step": 212040, "epoch": 2554} {"train_loss": -23.948713302612305, "global_step": 212041, "epoch": 2554} {"train_loss": -24.704023361206055, "global_step": 212042, "epoch": 2554} {"train_loss": -24.3887996673584, "global_step": 212043, "epoch": 2554} {"train_loss": -24.476715087890625, "global_step": 212044, "epoch": 2554} {"train_loss": -24.07716178894043, "global_step": 212045, "epoch": 2554} {"train_loss": -24.170093536376953, "global_step": 212046, "epoch": 2554} {"train_loss": -24.15683364868164, "global_step": 212047, "epoch": 2554} {"train_loss": -24.627782821655273, "global_step": 212048, "epoch": 2554} {"train_loss": -24.012624740600586, "global_step": 212049, "epoch": 2554} {"train_loss": -24.767990112304688, "global_step": 212050, "epoch": 2554} {"train_loss": -24.52472496032715, "global_step": 212051, "epoch": 2554} {"train_loss": -24.361799240112305, "global_step": 212052, "epoch": 2554} {"train_loss": -24.441959381103516, "global_step": 212053, "epoch": 2554} {"train_loss": -24.654937744140625, "global_step": 212054, "epoch": 2554} {"train_loss": -24.697982788085938, "global_step": 212055, "epoch": 2554} {"train_loss": -24.487625122070312, "global_step": 212056, "epoch": 2554} {"train_loss": -24.445287704467773, "global_step": 212057, "epoch": 2554} {"train_loss": -24.22169303894043, "global_step": 212058, "epoch": 2554} {"train_loss": -24.84415626525879, "global_step": 212059, "epoch": 2554} {"train_loss": -24.53786849975586, "global_step": 212060, "epoch": 2554} {"train_loss": -24.29575538635254, "global_step": 212061, "epoch": 2554} {"train_loss": -24.636301040649414, "global_step": 212062, "epoch": 2554} {"train_loss": -24.599679946899414, "global_step": 212063, "epoch": 2554} {"train_loss": -24.20758555308882, "global_step": 212064, "epoch": 2554, "val_loss": 6522714.0} {"train_loss": -24.08639144897461, "global_step": 212065, "epoch": 2555} {"train_loss": -24.318828582763672, "global_step": 212066, "epoch": 2555} {"train_loss": -23.97589683532715, "global_step": 212067, "epoch": 2555} {"train_loss": -24.81278419494629, "global_step": 212068, "epoch": 2555} {"train_loss": -24.192625045776367, "global_step": 212069, "epoch": 2555} {"train_loss": -23.948558807373047, "global_step": 212070, "epoch": 2555} {"train_loss": -24.616300582885742, "global_step": 212071, "epoch": 2555} {"train_loss": -24.474348068237305, "global_step": 212072, "epoch": 2555} {"train_loss": -24.404775619506836, "global_step": 212073, "epoch": 2555} {"train_loss": -24.541105270385742, "global_step": 212074, "epoch": 2555} {"train_loss": -24.371505737304688, "global_step": 212075, "epoch": 2555} {"train_loss": -23.9180965423584, "global_step": 212076, "epoch": 2555} {"train_loss": -24.505868911743164, "global_step": 212077, "epoch": 2555} {"train_loss": -24.22123146057129, "global_step": 212078, "epoch": 2555} {"train_loss": -24.07259178161621, "global_step": 212079, "epoch": 2555} {"train_loss": -24.196760177612305, "global_step": 212080, "epoch": 2555} {"train_loss": -24.68404197692871, "global_step": 212081, "epoch": 2555} {"train_loss": -24.340988159179688, "global_step": 212082, "epoch": 2555} {"train_loss": -24.574920654296875, "global_step": 212083, "epoch": 2555} {"train_loss": -24.566843032836914, "global_step": 212084, "epoch": 2555} {"train_loss": -24.017919540405273, "global_step": 212085, "epoch": 2555} {"train_loss": -24.430522918701172, "global_step": 212086, "epoch": 2555} {"train_loss": -24.016071319580078, "global_step": 212087, "epoch": 2555} {"train_loss": -24.340482711791992, "global_step": 212088, "epoch": 2555} {"train_loss": -23.923547744750977, "global_step": 212089, "epoch": 2555} {"train_loss": -23.947189331054688, "global_step": 212090, "epoch": 2555} {"train_loss": -24.2242488861084, "global_step": 212091, "epoch": 2555} {"train_loss": -24.577638626098633, "global_step": 212092, "epoch": 2555} {"train_loss": -24.381061553955078, "global_step": 212093, "epoch": 2555} {"train_loss": -24.272184371948242, "global_step": 212094, "epoch": 2555} {"train_loss": -24.20865249633789, "global_step": 212095, "epoch": 2555} {"train_loss": -24.47169303894043, "global_step": 212096, "epoch": 2555} {"train_loss": -24.457111358642578, "global_step": 212097, "epoch": 2555} {"train_loss": -24.38420867919922, "global_step": 212098, "epoch": 2555} {"train_loss": -24.070608139038086, "global_step": 212099, "epoch": 2555} {"train_loss": -24.291780471801758, "global_step": 212100, "epoch": 2555} {"train_loss": -24.526432037353516, "global_step": 212101, "epoch": 2555} {"train_loss": -24.39238929748535, "global_step": 212102, "epoch": 2555} {"train_loss": -24.27081298828125, "global_step": 212103, "epoch": 2555} {"train_loss": -24.22906494140625, "global_step": 212104, "epoch": 2555} {"train_loss": -24.543745040893555, "global_step": 212105, "epoch": 2555} {"train_loss": -24.520353317260742, "global_step": 212106, "epoch": 2555} {"train_loss": -24.281423568725586, "global_step": 212107, "epoch": 2555} {"train_loss": -24.658212661743164, "global_step": 212108, "epoch": 2555} {"train_loss": -24.430219650268555, "global_step": 212109, "epoch": 2555} {"train_loss": -24.251310348510742, "global_step": 212110, "epoch": 2555} {"train_loss": -23.969125747680664, "global_step": 212111, "epoch": 2555} {"train_loss": -24.50837516784668, "global_step": 212112, "epoch": 2555} {"train_loss": -24.64803123474121, "global_step": 212113, "epoch": 2555} {"train_loss": -24.22344970703125, "global_step": 212114, "epoch": 2555} {"train_loss": -24.687946319580078, "global_step": 212115, "epoch": 2555} {"train_loss": -24.56381607055664, "global_step": 212116, "epoch": 2555} {"train_loss": -24.71917724609375, "global_step": 212117, "epoch": 2555} {"train_loss": -24.435155868530273, "global_step": 212118, "epoch": 2555} {"train_loss": -25.007062911987305, "global_step": 212119, "epoch": 2555} {"train_loss": -24.387632369995117, "global_step": 212120, "epoch": 2555} {"train_loss": -24.961523056030273, "global_step": 212121, "epoch": 2555} {"train_loss": -24.788240432739258, "global_step": 212122, "epoch": 2555} {"train_loss": -24.468494415283203, "global_step": 212123, "epoch": 2555} {"train_loss": -24.34969139099121, "global_step": 212124, "epoch": 2555} {"train_loss": -24.49246597290039, "global_step": 212125, "epoch": 2555} {"train_loss": -24.761425018310547, "global_step": 212126, "epoch": 2555} {"train_loss": -24.713926315307617, "global_step": 212127, "epoch": 2555} {"train_loss": -24.634754180908203, "global_step": 212128, "epoch": 2555} {"train_loss": -24.708898544311523, "global_step": 212129, "epoch": 2555} {"train_loss": -24.617820739746094, "global_step": 212130, "epoch": 2555} {"train_loss": -24.643484115600586, "global_step": 212131, "epoch": 2555} {"train_loss": -24.540952682495117, "global_step": 212132, "epoch": 2555} {"train_loss": -24.724445343017578, "global_step": 212133, "epoch": 2555} {"train_loss": -24.068655014038086, "global_step": 212134, "epoch": 2555} {"train_loss": -24.46396827697754, "global_step": 212135, "epoch": 2555} {"train_loss": -24.698366165161133, "global_step": 212136, "epoch": 2555} {"train_loss": -24.554580688476562, "global_step": 212137, "epoch": 2555} {"train_loss": -24.309467315673828, "global_step": 212138, "epoch": 2555} {"train_loss": -24.275461196899414, "global_step": 212139, "epoch": 2555} {"train_loss": -24.453195571899414, "global_step": 212140, "epoch": 2555} {"train_loss": -24.40340805053711, "global_step": 212141, "epoch": 2555} {"train_loss": -24.63072967529297, "global_step": 212142, "epoch": 2555} {"train_loss": -24.129173278808594, "global_step": 212143, "epoch": 2555} {"train_loss": -24.233346939086914, "global_step": 212144, "epoch": 2555} {"train_loss": -24.13113784790039, "global_step": 212145, "epoch": 2555} {"train_loss": -24.52970314025879, "global_step": 212146, "epoch": 2555} {"train_loss": -24.400899795164545, "global_step": 212147, "epoch": 2555, "val_loss": 6587955.0} {"train_loss": -23.8936767578125, "global_step": 212148, "epoch": 2556} {"train_loss": -23.886756896972656, "global_step": 212149, "epoch": 2556} {"train_loss": -24.326154708862305, "global_step": 212150, "epoch": 2556} {"train_loss": -23.890594482421875, "global_step": 212151, "epoch": 2556} {"train_loss": -24.115650177001953, "global_step": 212152, "epoch": 2556} {"train_loss": -24.1641902923584, "global_step": 212153, "epoch": 2556} {"train_loss": -23.952407836914062, "global_step": 212154, "epoch": 2556} {"train_loss": -23.404809951782227, "global_step": 212155, "epoch": 2556} {"train_loss": -23.796934127807617, "global_step": 212156, "epoch": 2556} {"train_loss": -24.364255905151367, "global_step": 212157, "epoch": 2556} {"train_loss": -24.243091583251953, "global_step": 212158, "epoch": 2556} {"train_loss": -24.43918228149414, "global_step": 212159, "epoch": 2556} {"train_loss": -24.193090438842773, "global_step": 212160, "epoch": 2556} {"train_loss": -24.482746124267578, "global_step": 212161, "epoch": 2556} {"train_loss": -24.049570083618164, "global_step": 212162, "epoch": 2556} {"train_loss": -24.168975830078125, "global_step": 212163, "epoch": 2556} {"train_loss": -24.26584243774414, "global_step": 212164, "epoch": 2556} {"train_loss": -24.19729995727539, "global_step": 212165, "epoch": 2556} {"train_loss": -24.035104751586914, "global_step": 212166, "epoch": 2556} {"train_loss": -24.45552635192871, "global_step": 212167, "epoch": 2556} {"train_loss": -24.49002456665039, "global_step": 212168, "epoch": 2556} {"train_loss": -24.647329330444336, "global_step": 212169, "epoch": 2556} {"train_loss": -24.332128524780273, "global_step": 212170, "epoch": 2556} {"train_loss": -24.304285049438477, "global_step": 212171, "epoch": 2556} {"train_loss": -25.005659103393555, "global_step": 212172, "epoch": 2556} {"train_loss": -24.561948776245117, "global_step": 212173, "epoch": 2556} {"train_loss": -24.21048927307129, "global_step": 212174, "epoch": 2556} {"train_loss": -24.409391403198242, "global_step": 212175, "epoch": 2556} {"train_loss": -24.62742042541504, "global_step": 212176, "epoch": 2556} {"train_loss": -24.731760025024414, "global_step": 212177, "epoch": 2556} {"train_loss": -24.629674911499023, "global_step": 212178, "epoch": 2556} {"train_loss": -24.66375160217285, "global_step": 212179, "epoch": 2556} {"train_loss": -24.714046478271484, "global_step": 212180, "epoch": 2556} {"train_loss": -24.693992614746094, "global_step": 212181, "epoch": 2556} {"train_loss": -24.484472274780273, "global_step": 212182, "epoch": 2556} {"train_loss": -24.48563575744629, "global_step": 212183, "epoch": 2556} {"train_loss": -24.515226364135742, "global_step": 212184, "epoch": 2556} {"train_loss": -24.749313354492188, "global_step": 212185, "epoch": 2556} {"train_loss": -24.356266021728516, "global_step": 212186, "epoch": 2556} {"train_loss": -24.721677780151367, "global_step": 212187, "epoch": 2556} {"train_loss": -24.6862850189209, "global_step": 212188, "epoch": 2556} {"train_loss": -24.40667724609375, "global_step": 212189, "epoch": 2556} {"train_loss": -24.74232292175293, "global_step": 212190, "epoch": 2556} {"train_loss": -24.797658920288086, "global_step": 212191, "epoch": 2556} {"train_loss": -24.710397720336914, "global_step": 212192, "epoch": 2556} {"train_loss": -24.195165634155273, "global_step": 212193, "epoch": 2556} {"train_loss": -24.32771873474121, "global_step": 212194, "epoch": 2556} {"train_loss": -24.53781509399414, "global_step": 212195, "epoch": 2556} {"train_loss": -24.767793655395508, "global_step": 212196, "epoch": 2556} {"train_loss": -24.425100326538086, "global_step": 212197, "epoch": 2556} {"train_loss": -24.477384567260742, "global_step": 212198, "epoch": 2556} {"train_loss": -24.097597122192383, "global_step": 212199, "epoch": 2556} {"train_loss": -24.345462799072266, "global_step": 212200, "epoch": 2556} {"train_loss": -24.44791030883789, "global_step": 212201, "epoch": 2556} {"train_loss": -24.173830032348633, "global_step": 212202, "epoch": 2556} {"train_loss": -24.209415435791016, "global_step": 212203, "epoch": 2556} {"train_loss": -23.970937728881836, "global_step": 212204, "epoch": 2556} {"train_loss": -24.193622589111328, "global_step": 212205, "epoch": 2556} {"train_loss": -24.2811222076416, "global_step": 212206, "epoch": 2556} {"train_loss": -24.22835350036621, "global_step": 212207, "epoch": 2556} {"train_loss": -24.36456871032715, "global_step": 212208, "epoch": 2556} {"train_loss": -24.23929214477539, "global_step": 212209, "epoch": 2556} {"train_loss": -24.081762313842773, "global_step": 212210, "epoch": 2556} {"train_loss": -24.224822998046875, "global_step": 212211, "epoch": 2556} {"train_loss": -24.338285446166992, "global_step": 212212, "epoch": 2556} {"train_loss": -24.57400894165039, "global_step": 212213, "epoch": 2556} {"train_loss": -24.315366744995117, "global_step": 212214, "epoch": 2556} {"train_loss": -24.507171630859375, "global_step": 212215, "epoch": 2556} {"train_loss": -24.298683166503906, "global_step": 212216, "epoch": 2556} {"train_loss": -24.21084976196289, "global_step": 212217, "epoch": 2556} {"train_loss": -24.401334762573242, "global_step": 212218, "epoch": 2556} {"train_loss": -23.985088348388672, "global_step": 212219, "epoch": 2556} {"train_loss": -24.3420467376709, "global_step": 212220, "epoch": 2556} {"train_loss": -24.53879165649414, "global_step": 212221, "epoch": 2556} {"train_loss": -24.24064064025879, "global_step": 212222, "epoch": 2556} {"train_loss": -24.580137252807617, "global_step": 212223, "epoch": 2556} {"train_loss": -24.371967315673828, "global_step": 212224, "epoch": 2556} {"train_loss": -24.294157028198242, "global_step": 212225, "epoch": 2556} {"train_loss": -24.328123092651367, "global_step": 212226, "epoch": 2556} {"train_loss": -24.304431915283203, "global_step": 212227, "epoch": 2556} {"train_loss": -24.4915714263916, "global_step": 212228, "epoch": 2556} {"train_loss": -24.147817611694336, "global_step": 212229, "epoch": 2556} {"train_loss": -24.36934068978551, "global_step": 212230, "epoch": 2556, "val_loss": 6520960.0} {"train_loss": -23.056350708007812, "global_step": 212231, "epoch": 2557} {"train_loss": -23.935400009155273, "global_step": 212232, "epoch": 2557} {"train_loss": -23.923856735229492, "global_step": 212233, "epoch": 2557} {"train_loss": -23.441999435424805, "global_step": 212234, "epoch": 2557} {"train_loss": -23.683774948120117, "global_step": 212235, "epoch": 2557} {"train_loss": -23.79730987548828, "global_step": 212236, "epoch": 2557} {"train_loss": -24.1069278717041, "global_step": 212237, "epoch": 2557} {"train_loss": -23.857709884643555, "global_step": 212238, "epoch": 2557} {"train_loss": -24.05647850036621, "global_step": 212239, "epoch": 2557} {"train_loss": -23.938852310180664, "global_step": 212240, "epoch": 2557} {"train_loss": -24.051456451416016, "global_step": 212241, "epoch": 2557} {"train_loss": -23.853864669799805, "global_step": 212242, "epoch": 2557} {"train_loss": -23.944477081298828, "global_step": 212243, "epoch": 2557} {"train_loss": -24.238574981689453, "global_step": 212244, "epoch": 2557} {"train_loss": -24.25941276550293, "global_step": 212245, "epoch": 2557} {"train_loss": -23.871673583984375, "global_step": 212246, "epoch": 2557} {"train_loss": -24.397695541381836, "global_step": 212247, "epoch": 2557} {"train_loss": -24.323131561279297, "global_step": 212248, "epoch": 2557} {"train_loss": -24.218860626220703, "global_step": 212249, "epoch": 2557} {"train_loss": -24.121557235717773, "global_step": 212250, "epoch": 2557} {"train_loss": -24.241165161132812, "global_step": 212251, "epoch": 2557} {"train_loss": -24.555124282836914, "global_step": 212252, "epoch": 2557} {"train_loss": -24.379465103149414, "global_step": 212253, "epoch": 2557} {"train_loss": -24.538331985473633, "global_step": 212254, "epoch": 2557} {"train_loss": -24.41257095336914, "global_step": 212255, "epoch": 2557} {"train_loss": -24.45725440979004, "global_step": 212256, "epoch": 2557} {"train_loss": -24.387271881103516, "global_step": 212257, "epoch": 2557} {"train_loss": -24.211288452148438, "global_step": 212258, "epoch": 2557} {"train_loss": -24.35968589782715, "global_step": 212259, "epoch": 2557} {"train_loss": -24.52671241760254, "global_step": 212260, "epoch": 2557} {"train_loss": -24.096708297729492, "global_step": 212261, "epoch": 2557} {"train_loss": -24.65013313293457, "global_step": 212262, "epoch": 2557} {"train_loss": -24.907596588134766, "global_step": 212263, "epoch": 2557} {"train_loss": -24.46237564086914, "global_step": 212264, "epoch": 2557} {"train_loss": -24.423786163330078, "global_step": 212265, "epoch": 2557} {"train_loss": -24.353206634521484, "global_step": 212266, "epoch": 2557} {"train_loss": -24.68477439880371, "global_step": 212267, "epoch": 2557} {"train_loss": -24.696949005126953, "global_step": 212268, "epoch": 2557} {"train_loss": -24.29533576965332, "global_step": 212269, "epoch": 2557} {"train_loss": -24.28843116760254, "global_step": 212270, "epoch": 2557} {"train_loss": -24.89711570739746, "global_step": 212271, "epoch": 2557} {"train_loss": -24.638891220092773, "global_step": 212272, "epoch": 2557} {"train_loss": -24.369659423828125, "global_step": 212273, "epoch": 2557} {"train_loss": -24.704435348510742, "global_step": 212274, "epoch": 2557} {"train_loss": -24.47452735900879, "global_step": 212275, "epoch": 2557} {"train_loss": -24.64042091369629, "global_step": 212276, "epoch": 2557} {"train_loss": -24.6751708984375, "global_step": 212277, "epoch": 2557} {"train_loss": -24.67055320739746, "global_step": 212278, "epoch": 2557} {"train_loss": -24.99837303161621, "global_step": 212279, "epoch": 2557} {"train_loss": -24.17329216003418, "global_step": 212280, "epoch": 2557} {"train_loss": -24.92353630065918, "global_step": 212281, "epoch": 2557} {"train_loss": -24.440305709838867, "global_step": 212282, "epoch": 2557} {"train_loss": -24.278833389282227, "global_step": 212283, "epoch": 2557} {"train_loss": -24.0594425201416, "global_step": 212284, "epoch": 2557} {"train_loss": -24.01052474975586, "global_step": 212285, "epoch": 2557} {"train_loss": -24.292356491088867, "global_step": 212286, "epoch": 2557} {"train_loss": -24.012155532836914, "global_step": 212287, "epoch": 2557} {"train_loss": -23.849517822265625, "global_step": 212288, "epoch": 2557} {"train_loss": -24.2020320892334, "global_step": 212289, "epoch": 2557} {"train_loss": -24.459562301635742, "global_step": 212290, "epoch": 2557} {"train_loss": -24.087421417236328, "global_step": 212291, "epoch": 2557} {"train_loss": -24.638029098510742, "global_step": 212292, "epoch": 2557} {"train_loss": -24.547779083251953, "global_step": 212293, "epoch": 2557} {"train_loss": -24.364294052124023, "global_step": 212294, "epoch": 2557} {"train_loss": -24.417325973510742, "global_step": 212295, "epoch": 2557} {"train_loss": -24.507230758666992, "global_step": 212296, "epoch": 2557} {"train_loss": -24.837316513061523, "global_step": 212297, "epoch": 2557} {"train_loss": -24.317228317260742, "global_step": 212298, "epoch": 2557} {"train_loss": -24.139005661010742, "global_step": 212299, "epoch": 2557} {"train_loss": -24.305204391479492, "global_step": 212300, "epoch": 2557} {"train_loss": -24.767858505249023, "global_step": 212301, "epoch": 2557} {"train_loss": -24.48188591003418, "global_step": 212302, "epoch": 2557} {"train_loss": -24.719751358032227, "global_step": 212303, "epoch": 2557} {"train_loss": -24.524267196655273, "global_step": 212304, "epoch": 2557} {"train_loss": -24.508655548095703, "global_step": 212305, "epoch": 2557} {"train_loss": -24.401063919067383, "global_step": 212306, "epoch": 2557} {"train_loss": -24.517349243164062, "global_step": 212307, "epoch": 2557} {"train_loss": -24.534154891967773, "global_step": 212308, "epoch": 2557} {"train_loss": -25.185165405273438, "global_step": 212309, "epoch": 2557} {"train_loss": -24.276487350463867, "global_step": 212310, "epoch": 2557} {"train_loss": -24.68208122253418, "global_step": 212311, "epoch": 2557} {"train_loss": -24.487709045410156, "global_step": 212312, "epoch": 2557} {"train_loss": -24.34191145379859, "global_step": 212313, "epoch": 2557, "val_loss": 6602601.0} {"train_loss": -24.18864631652832, "global_step": 212314, "epoch": 2558} {"train_loss": -24.261322021484375, "global_step": 212315, "epoch": 2558} {"train_loss": -24.561893463134766, "global_step": 212316, "epoch": 2558} {"train_loss": -24.314329147338867, "global_step": 212317, "epoch": 2558} {"train_loss": -23.997167587280273, "global_step": 212318, "epoch": 2558} {"train_loss": -24.392248153686523, "global_step": 212319, "epoch": 2558} {"train_loss": -24.32990074157715, "global_step": 212320, "epoch": 2558} {"train_loss": -24.247495651245117, "global_step": 212321, "epoch": 2558} {"train_loss": -24.671131134033203, "global_step": 212322, "epoch": 2558} {"train_loss": -24.01657485961914, "global_step": 212323, "epoch": 2558} {"train_loss": -24.144323348999023, "global_step": 212324, "epoch": 2558} {"train_loss": -24.55602264404297, "global_step": 212325, "epoch": 2558} {"train_loss": -24.526039123535156, "global_step": 212326, "epoch": 2558} {"train_loss": -24.15498161315918, "global_step": 212327, "epoch": 2558} {"train_loss": -24.51044273376465, "global_step": 212328, "epoch": 2558} {"train_loss": -24.630083084106445, "global_step": 212329, "epoch": 2558} {"train_loss": -24.529619216918945, "global_step": 212330, "epoch": 2558} {"train_loss": -24.676044464111328, "global_step": 212331, "epoch": 2558} {"train_loss": -24.430885314941406, "global_step": 212332, "epoch": 2558} {"train_loss": -24.497642517089844, "global_step": 212333, "epoch": 2558} {"train_loss": -24.582921981811523, "global_step": 212334, "epoch": 2558} {"train_loss": -24.252775192260742, "global_step": 212335, "epoch": 2558} {"train_loss": -24.622251510620117, "global_step": 212336, "epoch": 2558} {"train_loss": -24.142263412475586, "global_step": 212337, "epoch": 2558} {"train_loss": -24.50877571105957, "global_step": 212338, "epoch": 2558} {"train_loss": -24.24302864074707, "global_step": 212339, "epoch": 2558} {"train_loss": -24.757217407226562, "global_step": 212340, "epoch": 2558} {"train_loss": -24.566787719726562, "global_step": 212341, "epoch": 2558} {"train_loss": -24.394084930419922, "global_step": 212342, "epoch": 2558} {"train_loss": -24.624788284301758, "global_step": 212343, "epoch": 2558} {"train_loss": -24.14985466003418, "global_step": 212344, "epoch": 2558} {"train_loss": -23.9126033782959, "global_step": 212345, "epoch": 2558} {"train_loss": -24.642866134643555, "global_step": 212346, "epoch": 2558} {"train_loss": -24.347509384155273, "global_step": 212347, "epoch": 2558} {"train_loss": -24.100481033325195, "global_step": 212348, "epoch": 2558} {"train_loss": -24.620283126831055, "global_step": 212349, "epoch": 2558} {"train_loss": -24.354263305664062, "global_step": 212350, "epoch": 2558} {"train_loss": -24.79476547241211, "global_step": 212351, "epoch": 2558} {"train_loss": -24.47181510925293, "global_step": 212352, "epoch": 2558} {"train_loss": -24.291242599487305, "global_step": 212353, "epoch": 2558} {"train_loss": -24.188243865966797, "global_step": 212354, "epoch": 2558} {"train_loss": -24.49307632446289, "global_step": 212355, "epoch": 2558} {"train_loss": -24.422182083129883, "global_step": 212356, "epoch": 2558} {"train_loss": -24.3671932220459, "global_step": 212357, "epoch": 2558} {"train_loss": -24.349225997924805, "global_step": 212358, "epoch": 2558} {"train_loss": -24.459749221801758, "global_step": 212359, "epoch": 2558} {"train_loss": -24.450063705444336, "global_step": 212360, "epoch": 2558} {"train_loss": -24.545438766479492, "global_step": 212361, "epoch": 2558} {"train_loss": -24.19673728942871, "global_step": 212362, "epoch": 2558} {"train_loss": -23.998701095581055, "global_step": 212363, "epoch": 2558} {"train_loss": -24.399431228637695, "global_step": 212364, "epoch": 2558} {"train_loss": -24.349349975585938, "global_step": 212365, "epoch": 2558} {"train_loss": -24.462003707885742, "global_step": 212366, "epoch": 2558} {"train_loss": -24.349706649780273, "global_step": 212367, "epoch": 2558} {"train_loss": -24.62055778503418, "global_step": 212368, "epoch": 2558} {"train_loss": -24.399965286254883, "global_step": 212369, "epoch": 2558} {"train_loss": -24.485145568847656, "global_step": 212370, "epoch": 2558} {"train_loss": -24.909690856933594, "global_step": 212371, "epoch": 2558} {"train_loss": -24.126312255859375, "global_step": 212372, "epoch": 2558} {"train_loss": -24.830625534057617, "global_step": 212373, "epoch": 2558} {"train_loss": -24.440549850463867, "global_step": 212374, "epoch": 2558} {"train_loss": -24.496976852416992, "global_step": 212375, "epoch": 2558} {"train_loss": -24.63313865661621, "global_step": 212376, "epoch": 2558} {"train_loss": -24.631757736206055, "global_step": 212377, "epoch": 2558} {"train_loss": -25.056180953979492, "global_step": 212378, "epoch": 2558} {"train_loss": -24.552520751953125, "global_step": 212379, "epoch": 2558} {"train_loss": -24.404052734375, "global_step": 212380, "epoch": 2558} {"train_loss": -24.170751571655273, "global_step": 212381, "epoch": 2558} {"train_loss": -24.46832847595215, "global_step": 212382, "epoch": 2558} {"train_loss": -24.305349349975586, "global_step": 212383, "epoch": 2558} {"train_loss": -24.511674880981445, "global_step": 212384, "epoch": 2558} {"train_loss": -24.328397750854492, "global_step": 212385, "epoch": 2558} {"train_loss": -24.304767608642578, "global_step": 212386, "epoch": 2558} {"train_loss": -24.132312774658203, "global_step": 212387, "epoch": 2558} {"train_loss": -24.188688278198242, "global_step": 212388, "epoch": 2558} {"train_loss": -24.4833984375, "global_step": 212389, "epoch": 2558} {"train_loss": -24.683246612548828, "global_step": 212390, "epoch": 2558} {"train_loss": -24.017887115478516, "global_step": 212391, "epoch": 2558} {"train_loss": -24.65984535217285, "global_step": 212392, "epoch": 2558} {"train_loss": -24.594266891479492, "global_step": 212393, "epoch": 2558} {"train_loss": -24.837547302246094, "global_step": 212394, "epoch": 2558} {"train_loss": -24.977264404296875, "global_step": 212395, "epoch": 2558} {"train_loss": -24.431915467043957, "global_step": 212396, "epoch": 2558, "val_loss": 6517922.0} {"train_loss": -23.62400245666504, "global_step": 212397, "epoch": 2559} {"train_loss": -23.289764404296875, "global_step": 212398, "epoch": 2559} {"train_loss": -24.18686866760254, "global_step": 212399, "epoch": 2559} {"train_loss": -24.165237426757812, "global_step": 212400, "epoch": 2559} {"train_loss": -23.7381649017334, "global_step": 212401, "epoch": 2559} {"train_loss": -23.94991111755371, "global_step": 212402, "epoch": 2559} {"train_loss": -24.169965744018555, "global_step": 212403, "epoch": 2559} {"train_loss": -24.016740798950195, "global_step": 212404, "epoch": 2559} {"train_loss": -24.091474533081055, "global_step": 212405, "epoch": 2559} {"train_loss": -24.02736473083496, "global_step": 212406, "epoch": 2559} {"train_loss": -24.22722053527832, "global_step": 212407, "epoch": 2559} {"train_loss": -24.124744415283203, "global_step": 212408, "epoch": 2559} {"train_loss": -23.690439224243164, "global_step": 212409, "epoch": 2559} {"train_loss": -24.35093116760254, "global_step": 212410, "epoch": 2559} {"train_loss": -24.284812927246094, "global_step": 212411, "epoch": 2559} {"train_loss": -23.654508590698242, "global_step": 212412, "epoch": 2559} {"train_loss": -24.31520652770996, "global_step": 212413, "epoch": 2559} {"train_loss": -23.94312858581543, "global_step": 212414, "epoch": 2559} {"train_loss": -24.121557235717773, "global_step": 212415, "epoch": 2559} {"train_loss": -24.220260620117188, "global_step": 212416, "epoch": 2559} {"train_loss": -24.08101463317871, "global_step": 212417, "epoch": 2559} {"train_loss": -24.390249252319336, "global_step": 212418, "epoch": 2559} {"train_loss": -24.050582885742188, "global_step": 212419, "epoch": 2559} {"train_loss": -24.359073638916016, "global_step": 212420, "epoch": 2559} {"train_loss": -24.48647117614746, "global_step": 212421, "epoch": 2559} {"train_loss": -24.251541137695312, "global_step": 212422, "epoch": 2559} {"train_loss": -24.24503517150879, "global_step": 212423, "epoch": 2559} {"train_loss": -24.46849250793457, "global_step": 212424, "epoch": 2559} {"train_loss": -24.525375366210938, "global_step": 212425, "epoch": 2559} {"train_loss": -24.559375762939453, "global_step": 212426, "epoch": 2559} {"train_loss": -24.429710388183594, "global_step": 212427, "epoch": 2559} {"train_loss": -24.32912254333496, "global_step": 212428, "epoch": 2559} {"train_loss": -24.452505111694336, "global_step": 212429, "epoch": 2559} {"train_loss": -24.442394256591797, "global_step": 212430, "epoch": 2559} {"train_loss": -24.60280990600586, "global_step": 212431, "epoch": 2559} {"train_loss": -24.65639305114746, "global_step": 212432, "epoch": 2559} {"train_loss": -24.553695678710938, "global_step": 212433, "epoch": 2559} {"train_loss": -24.474645614624023, "global_step": 212434, "epoch": 2559} {"train_loss": -24.39882469177246, "global_step": 212435, "epoch": 2559} {"train_loss": -24.634933471679688, "global_step": 212436, "epoch": 2559} {"train_loss": -24.343713760375977, "global_step": 212437, "epoch": 2559} {"train_loss": -24.50600242614746, "global_step": 212438, "epoch": 2559} {"train_loss": -24.60226821899414, "global_step": 212439, "epoch": 2559} {"train_loss": -24.508962631225586, "global_step": 212440, "epoch": 2559} {"train_loss": -24.24896240234375, "global_step": 212441, "epoch": 2559} {"train_loss": -24.25656509399414, "global_step": 212442, "epoch": 2559} {"train_loss": -24.324928283691406, "global_step": 212443, "epoch": 2559} {"train_loss": -24.10616111755371, "global_step": 212444, "epoch": 2559} {"train_loss": -23.49094009399414, "global_step": 212445, "epoch": 2559} {"train_loss": -23.99893569946289, "global_step": 212446, "epoch": 2559} {"train_loss": -24.587491989135742, "global_step": 212447, "epoch": 2559} {"train_loss": -24.096593856811523, "global_step": 212448, "epoch": 2559} {"train_loss": -24.370363235473633, "global_step": 212449, "epoch": 2559} {"train_loss": -23.918886184692383, "global_step": 212450, "epoch": 2559} {"train_loss": -24.401548385620117, "global_step": 212451, "epoch": 2559} {"train_loss": -23.8790340423584, "global_step": 212452, "epoch": 2559} {"train_loss": -24.216882705688477, "global_step": 212453, "epoch": 2559} {"train_loss": -24.14670753479004, "global_step": 212454, "epoch": 2559} {"train_loss": -24.332347869873047, "global_step": 212455, "epoch": 2559} {"train_loss": -24.39520835876465, "global_step": 212456, "epoch": 2559} {"train_loss": -24.533689498901367, "global_step": 212457, "epoch": 2559} {"train_loss": -24.665679931640625, "global_step": 212458, "epoch": 2559} {"train_loss": -24.53711700439453, "global_step": 212459, "epoch": 2559} {"train_loss": -24.258588790893555, "global_step": 212460, "epoch": 2559} {"train_loss": -24.40776252746582, "global_step": 212461, "epoch": 2559} {"train_loss": -24.5968074798584, "global_step": 212462, "epoch": 2559} {"train_loss": -24.239057540893555, "global_step": 212463, "epoch": 2559} {"train_loss": -24.845983505249023, "global_step": 212464, "epoch": 2559} {"train_loss": -24.620893478393555, "global_step": 212465, "epoch": 2559} {"train_loss": -24.644760131835938, "global_step": 212466, "epoch": 2559} {"train_loss": -24.405988693237305, "global_step": 212467, "epoch": 2559} {"train_loss": -24.368576049804688, "global_step": 212468, "epoch": 2559} {"train_loss": -24.593067169189453, "global_step": 212469, "epoch": 2559} {"train_loss": -24.60243034362793, "global_step": 212470, "epoch": 2559} {"train_loss": -24.952838897705078, "global_step": 212471, "epoch": 2559} {"train_loss": -24.941604614257812, "global_step": 212472, "epoch": 2559} {"train_loss": -24.705045700073242, "global_step": 212473, "epoch": 2559} {"train_loss": -24.389606475830078, "global_step": 212474, "epoch": 2559} {"train_loss": -24.879125595092773, "global_step": 212475, "epoch": 2559} {"train_loss": -24.43903923034668, "global_step": 212476, "epoch": 2559} {"train_loss": -24.421676635742188, "global_step": 212477, "epoch": 2559} {"train_loss": -24.232566833496094, "global_step": 212478, "epoch": 2559} {"train_loss": -24.320644286741693, "global_step": 212479, "epoch": 2559, "val_loss": 6482852.5} {"train_loss": -22.317642211914062, "global_step": 212480, "epoch": 2560} {"train_loss": -22.757644653320312, "global_step": 212481, "epoch": 2560} {"train_loss": -23.9909610748291, "global_step": 212482, "epoch": 2560} {"train_loss": -23.64999008178711, "global_step": 212483, "epoch": 2560} {"train_loss": -23.548398971557617, "global_step": 212484, "epoch": 2560} {"train_loss": -23.539043426513672, "global_step": 212485, "epoch": 2560} {"train_loss": -24.54426383972168, "global_step": 212486, "epoch": 2560} {"train_loss": -23.808420181274414, "global_step": 212487, "epoch": 2560} {"train_loss": -24.224708557128906, "global_step": 212488, "epoch": 2560} {"train_loss": -23.829565048217773, "global_step": 212489, "epoch": 2560} {"train_loss": -24.053491592407227, "global_step": 212490, "epoch": 2560} {"train_loss": -23.921541213989258, "global_step": 212491, "epoch": 2560} {"train_loss": -24.0689697265625, "global_step": 212492, "epoch": 2560} {"train_loss": -24.194746017456055, "global_step": 212493, "epoch": 2560} {"train_loss": -24.054502487182617, "global_step": 212494, "epoch": 2560} {"train_loss": -24.138280868530273, "global_step": 212495, "epoch": 2560} {"train_loss": -24.462759017944336, "global_step": 212496, "epoch": 2560} {"train_loss": -24.01615333557129, "global_step": 212497, "epoch": 2560} {"train_loss": -24.163938522338867, "global_step": 212498, "epoch": 2560} {"train_loss": -24.422927856445312, "global_step": 212499, "epoch": 2560} {"train_loss": -24.251394271850586, "global_step": 212500, "epoch": 2560} {"train_loss": -23.771808624267578, "global_step": 212501, "epoch": 2560} {"train_loss": -24.014663696289062, "global_step": 212502, "epoch": 2560} {"train_loss": -23.96152687072754, "global_step": 212503, "epoch": 2560} {"train_loss": -24.0661563873291, "global_step": 212504, "epoch": 2560} {"train_loss": -24.528776168823242, "global_step": 212505, "epoch": 2560} {"train_loss": -24.283811569213867, "global_step": 212506, "epoch": 2560} {"train_loss": -24.702537536621094, "global_step": 212507, "epoch": 2560} {"train_loss": -24.246780395507812, "global_step": 212508, "epoch": 2560} {"train_loss": -24.100683212280273, "global_step": 212509, "epoch": 2560} {"train_loss": -24.548263549804688, "global_step": 212510, "epoch": 2560} {"train_loss": -24.566999435424805, "global_step": 212511, "epoch": 2560} {"train_loss": -23.920040130615234, "global_step": 212512, "epoch": 2560} {"train_loss": -24.47027587890625, "global_step": 212513, "epoch": 2560} {"train_loss": -24.599308013916016, "global_step": 212514, "epoch": 2560} {"train_loss": -24.48202896118164, "global_step": 212515, "epoch": 2560} {"train_loss": -24.35763931274414, "global_step": 212516, "epoch": 2560} {"train_loss": -24.22443389892578, "global_step": 212517, "epoch": 2560} {"train_loss": -24.312482833862305, "global_step": 212518, "epoch": 2560} {"train_loss": -24.09084129333496, "global_step": 212519, "epoch": 2560} {"train_loss": -24.261533737182617, "global_step": 212520, "epoch": 2560} {"train_loss": -24.751497268676758, "global_step": 212521, "epoch": 2560} {"train_loss": -24.606548309326172, "global_step": 212522, "epoch": 2560} {"train_loss": -24.5305118560791, "global_step": 212523, "epoch": 2560} {"train_loss": -24.476787567138672, "global_step": 212524, "epoch": 2560} {"train_loss": -24.130273818969727, "global_step": 212525, "epoch": 2560} {"train_loss": -24.8094482421875, "global_step": 212526, "epoch": 2560} {"train_loss": -24.47701644897461, "global_step": 212527, "epoch": 2560} {"train_loss": -25.035852432250977, "global_step": 212528, "epoch": 2560} {"train_loss": -24.293500900268555, "global_step": 212529, "epoch": 2560} {"train_loss": -24.689556121826172, "global_step": 212530, "epoch": 2560} {"train_loss": -24.36511993408203, "global_step": 212531, "epoch": 2560} {"train_loss": -24.462324142456055, "global_step": 212532, "epoch": 2560} {"train_loss": -24.452173233032227, "global_step": 212533, "epoch": 2560} {"train_loss": -24.616744995117188, "global_step": 212534, "epoch": 2560} {"train_loss": -24.280744552612305, "global_step": 212535, "epoch": 2560} {"train_loss": -24.87290382385254, "global_step": 212536, "epoch": 2560} {"train_loss": -24.377145767211914, "global_step": 212537, "epoch": 2560} {"train_loss": -24.33335304260254, "global_step": 212538, "epoch": 2560} {"train_loss": -24.575437545776367, "global_step": 212539, "epoch": 2560} {"train_loss": -24.52235984802246, "global_step": 212540, "epoch": 2560} {"train_loss": -24.45939064025879, "global_step": 212541, "epoch": 2560} {"train_loss": -24.41786766052246, "global_step": 212542, "epoch": 2560} {"train_loss": -24.777189254760742, "global_step": 212543, "epoch": 2560} {"train_loss": -24.728530883789062, "global_step": 212544, "epoch": 2560} {"train_loss": -24.574068069458008, "global_step": 212545, "epoch": 2560} {"train_loss": -24.2242488861084, "global_step": 212546, "epoch": 2560} {"train_loss": -24.43137550354004, "global_step": 212547, "epoch": 2560} {"train_loss": -24.537927627563477, "global_step": 212548, "epoch": 2560} {"train_loss": -24.472637176513672, "global_step": 212549, "epoch": 2560} {"train_loss": -24.977294921875, "global_step": 212550, "epoch": 2560} {"train_loss": -24.79060173034668, "global_step": 212551, "epoch": 2560} {"train_loss": -24.536710739135742, "global_step": 212552, "epoch": 2560} {"train_loss": -24.363571166992188, "global_step": 212553, "epoch": 2560} {"train_loss": -24.485383987426758, "global_step": 212554, "epoch": 2560} {"train_loss": -24.533262252807617, "global_step": 212555, "epoch": 2560} {"train_loss": -24.569543838500977, "global_step": 212556, "epoch": 2560} {"train_loss": -24.59062385559082, "global_step": 212557, "epoch": 2560} {"train_loss": -24.552968978881836, "global_step": 212558, "epoch": 2560} {"train_loss": -24.24782371520996, "global_step": 212559, "epoch": 2560} {"train_loss": -24.140045166015625, "global_step": 212560, "epoch": 2560} {"train_loss": -24.61445426940918, "global_step": 212561, "epoch": 2560} {"train_loss": -24.3275828533862, "global_step": 212562, "epoch": 2560, "val_loss": 6618301.0} {"train_loss": -24.19869041442871, "global_step": 212563, "epoch": 2561} {"train_loss": -23.704885482788086, "global_step": 212564, "epoch": 2561} {"train_loss": -24.252859115600586, "global_step": 212565, "epoch": 2561} {"train_loss": -24.003726959228516, "global_step": 212566, "epoch": 2561} {"train_loss": -24.058210372924805, "global_step": 212567, "epoch": 2561} {"train_loss": -24.310176849365234, "global_step": 212568, "epoch": 2561} {"train_loss": -23.967565536499023, "global_step": 212569, "epoch": 2561} {"train_loss": -24.082334518432617, "global_step": 212570, "epoch": 2561} {"train_loss": -24.240163803100586, "global_step": 212571, "epoch": 2561} {"train_loss": -24.210189819335938, "global_step": 212572, "epoch": 2561} {"train_loss": -24.639493942260742, "global_step": 212573, "epoch": 2561} {"train_loss": -23.902671813964844, "global_step": 212574, "epoch": 2561} {"train_loss": -24.181541442871094, "global_step": 212575, "epoch": 2561} {"train_loss": -24.09885025024414, "global_step": 212576, "epoch": 2561} {"train_loss": -24.381824493408203, "global_step": 212577, "epoch": 2561} {"train_loss": -24.0955810546875, "global_step": 212578, "epoch": 2561} {"train_loss": -24.505887985229492, "global_step": 212579, "epoch": 2561} {"train_loss": -24.53590202331543, "global_step": 212580, "epoch": 2561} {"train_loss": -24.509201049804688, "global_step": 212581, "epoch": 2561} {"train_loss": -24.20343589782715, "global_step": 212582, "epoch": 2561} {"train_loss": -24.728544235229492, "global_step": 212583, "epoch": 2561} {"train_loss": -24.562854766845703, "global_step": 212584, "epoch": 2561} {"train_loss": -24.583843231201172, "global_step": 212585, "epoch": 2561} {"train_loss": -24.437345504760742, "global_step": 212586, "epoch": 2561} {"train_loss": -24.376428604125977, "global_step": 212587, "epoch": 2561} {"train_loss": -24.71119499206543, "global_step": 212588, "epoch": 2561} {"train_loss": -24.378902435302734, "global_step": 212589, "epoch": 2561} {"train_loss": -24.51473045349121, "global_step": 212590, "epoch": 2561} {"train_loss": -24.407896041870117, "global_step": 212591, "epoch": 2561} {"train_loss": -24.884464263916016, "global_step": 212592, "epoch": 2561} {"train_loss": -24.459064483642578, "global_step": 212593, "epoch": 2561} {"train_loss": -24.10480308532715, "global_step": 212594, "epoch": 2561} {"train_loss": -24.028942108154297, "global_step": 212595, "epoch": 2561} {"train_loss": -24.519826889038086, "global_step": 212596, "epoch": 2561} {"train_loss": -24.70145034790039, "global_step": 212597, "epoch": 2561} {"train_loss": -24.172382354736328, "global_step": 212598, "epoch": 2561} {"train_loss": -24.555225372314453, "global_step": 212599, "epoch": 2561} {"train_loss": -24.476926803588867, "global_step": 212600, "epoch": 2561} {"train_loss": -24.782947540283203, "global_step": 212601, "epoch": 2561} {"train_loss": -24.383237838745117, "global_step": 212602, "epoch": 2561} {"train_loss": -24.56532859802246, "global_step": 212603, "epoch": 2561} {"train_loss": -24.15254783630371, "global_step": 212604, "epoch": 2561} {"train_loss": -24.42913818359375, "global_step": 212605, "epoch": 2561} {"train_loss": -24.58234214782715, "global_step": 212606, "epoch": 2561} {"train_loss": -24.276479721069336, "global_step": 212607, "epoch": 2561} {"train_loss": -24.606142044067383, "global_step": 212608, "epoch": 2561} {"train_loss": -24.6898250579834, "global_step": 212609, "epoch": 2561} {"train_loss": -24.571260452270508, "global_step": 212610, "epoch": 2561} {"train_loss": -24.48160171508789, "global_step": 212611, "epoch": 2561} {"train_loss": -24.679624557495117, "global_step": 212612, "epoch": 2561} {"train_loss": -24.244749069213867, "global_step": 212613, "epoch": 2561} {"train_loss": -24.498065948486328, "global_step": 212614, "epoch": 2561} {"train_loss": -24.670684814453125, "global_step": 212615, "epoch": 2561} {"train_loss": -24.209745407104492, "global_step": 212616, "epoch": 2561} {"train_loss": -24.371252059936523, "global_step": 212617, "epoch": 2561} {"train_loss": -24.58945655822754, "global_step": 212618, "epoch": 2561} {"train_loss": -24.340646743774414, "global_step": 212619, "epoch": 2561} {"train_loss": -24.496519088745117, "global_step": 212620, "epoch": 2561} {"train_loss": -24.460195541381836, "global_step": 212621, "epoch": 2561} {"train_loss": -24.68739128112793, "global_step": 212622, "epoch": 2561} {"train_loss": -24.806407928466797, "global_step": 212623, "epoch": 2561} {"train_loss": -24.699981689453125, "global_step": 212624, "epoch": 2561} {"train_loss": -24.6072940826416, "global_step": 212625, "epoch": 2561} {"train_loss": -24.6601505279541, "global_step": 212626, "epoch": 2561} {"train_loss": -24.870437622070312, "global_step": 212627, "epoch": 2561} {"train_loss": -24.52674674987793, "global_step": 212628, "epoch": 2561} {"train_loss": -24.57281494140625, "global_step": 212629, "epoch": 2561} {"train_loss": -24.700023651123047, "global_step": 212630, "epoch": 2561} {"train_loss": -24.675996780395508, "global_step": 212631, "epoch": 2561} {"train_loss": -24.870838165283203, "global_step": 212632, "epoch": 2561} {"train_loss": -24.365427017211914, "global_step": 212633, "epoch": 2561} {"train_loss": -24.591135025024414, "global_step": 212634, "epoch": 2561} {"train_loss": -24.565868377685547, "global_step": 212635, "epoch": 2561} {"train_loss": -24.88649559020996, "global_step": 212636, "epoch": 2561} {"train_loss": -24.82891082763672, "global_step": 212637, "epoch": 2561} {"train_loss": -24.74332046508789, "global_step": 212638, "epoch": 2561} {"train_loss": -24.856008529663086, "global_step": 212639, "epoch": 2561} {"train_loss": -24.637170791625977, "global_step": 212640, "epoch": 2561} {"train_loss": -24.81696891784668, "global_step": 212641, "epoch": 2561} {"train_loss": -24.178848266601562, "global_step": 212642, "epoch": 2561} {"train_loss": -24.769790649414062, "global_step": 212643, "epoch": 2561} {"train_loss": -24.601259231567383, "global_step": 212644, "epoch": 2561} {"train_loss": -24.470889654504248, "global_step": 212645, "epoch": 2561, "val_loss": 6673736.0} {"train_loss": -24.456008911132812, "global_step": 212646, "epoch": 2562} {"train_loss": -24.449689865112305, "global_step": 212647, "epoch": 2562} {"train_loss": -24.095199584960938, "global_step": 212648, "epoch": 2562} {"train_loss": -23.77927589416504, "global_step": 212649, "epoch": 2562} {"train_loss": -24.533374786376953, "global_step": 212650, "epoch": 2562} {"train_loss": -24.325164794921875, "global_step": 212651, "epoch": 2562} {"train_loss": -24.56075096130371, "global_step": 212652, "epoch": 2562} {"train_loss": -24.039419174194336, "global_step": 212653, "epoch": 2562} {"train_loss": -24.49056053161621, "global_step": 212654, "epoch": 2562} {"train_loss": -24.484914779663086, "global_step": 212655, "epoch": 2562} {"train_loss": -24.586347579956055, "global_step": 212656, "epoch": 2562} {"train_loss": -24.525741577148438, "global_step": 212657, "epoch": 2562} {"train_loss": -24.283815383911133, "global_step": 212658, "epoch": 2562} {"train_loss": -24.1757755279541, "global_step": 212659, "epoch": 2562} {"train_loss": -24.549280166625977, "global_step": 212660, "epoch": 2562} {"train_loss": -24.145233154296875, "global_step": 212661, "epoch": 2562} {"train_loss": -24.47422981262207, "global_step": 212662, "epoch": 2562} {"train_loss": -24.127025604248047, "global_step": 212663, "epoch": 2562} {"train_loss": -24.292211532592773, "global_step": 212664, "epoch": 2562} {"train_loss": -23.977783203125, "global_step": 212665, "epoch": 2562} {"train_loss": -24.102262496948242, "global_step": 212666, "epoch": 2562} {"train_loss": -24.353683471679688, "global_step": 212667, "epoch": 2562} {"train_loss": -24.13198471069336, "global_step": 212668, "epoch": 2562} {"train_loss": -24.224613189697266, "global_step": 212669, "epoch": 2562} {"train_loss": -24.46710777282715, "global_step": 212670, "epoch": 2562} {"train_loss": -24.41938591003418, "global_step": 212671, "epoch": 2562} {"train_loss": -24.152502059936523, "global_step": 212672, "epoch": 2562} {"train_loss": -24.471906661987305, "global_step": 212673, "epoch": 2562} {"train_loss": -24.54193115234375, "global_step": 212674, "epoch": 2562} {"train_loss": -24.27642250061035, "global_step": 212675, "epoch": 2562} {"train_loss": -23.834867477416992, "global_step": 212676, "epoch": 2562} {"train_loss": -24.31220054626465, "global_step": 212677, "epoch": 2562} {"train_loss": -24.172515869140625, "global_step": 212678, "epoch": 2562} {"train_loss": -24.202102661132812, "global_step": 212679, "epoch": 2562} {"train_loss": -24.09844970703125, "global_step": 212680, "epoch": 2562} {"train_loss": -24.11358642578125, "global_step": 212681, "epoch": 2562} {"train_loss": -24.276647567749023, "global_step": 212682, "epoch": 2562} {"train_loss": -24.459997177124023, "global_step": 212683, "epoch": 2562} {"train_loss": -24.21840476989746, "global_step": 212684, "epoch": 2562} {"train_loss": -24.411373138427734, "global_step": 212685, "epoch": 2562} {"train_loss": -24.723926544189453, "global_step": 212686, "epoch": 2562} {"train_loss": -24.170886993408203, "global_step": 212687, "epoch": 2562} {"train_loss": -24.43393898010254, "global_step": 212688, "epoch": 2562} {"train_loss": -24.447744369506836, "global_step": 212689, "epoch": 2562} {"train_loss": -24.798629760742188, "global_step": 212690, "epoch": 2562} {"train_loss": -24.690824508666992, "global_step": 212691, "epoch": 2562} {"train_loss": -24.539548873901367, "global_step": 212692, "epoch": 2562} {"train_loss": -24.677648544311523, "global_step": 212693, "epoch": 2562} {"train_loss": -24.546419143676758, "global_step": 212694, "epoch": 2562} {"train_loss": -24.836599349975586, "global_step": 212695, "epoch": 2562} {"train_loss": -24.397056579589844, "global_step": 212696, "epoch": 2562} {"train_loss": -24.785736083984375, "global_step": 212697, "epoch": 2562} {"train_loss": -24.484359741210938, "global_step": 212698, "epoch": 2562} {"train_loss": -24.663419723510742, "global_step": 212699, "epoch": 2562} {"train_loss": -24.854291915893555, "global_step": 212700, "epoch": 2562} {"train_loss": -24.5408878326416, "global_step": 212701, "epoch": 2562} {"train_loss": -24.58599853515625, "global_step": 212702, "epoch": 2562} {"train_loss": -24.67555046081543, "global_step": 212703, "epoch": 2562} {"train_loss": -24.450265884399414, "global_step": 212704, "epoch": 2562} {"train_loss": -24.178607940673828, "global_step": 212705, "epoch": 2562} {"train_loss": -24.570711135864258, "global_step": 212706, "epoch": 2562} {"train_loss": -24.29806137084961, "global_step": 212707, "epoch": 2562} {"train_loss": -24.077260971069336, "global_step": 212708, "epoch": 2562} {"train_loss": -24.224592208862305, "global_step": 212709, "epoch": 2562} {"train_loss": -24.5307559967041, "global_step": 212710, "epoch": 2562} {"train_loss": -24.372159957885742, "global_step": 212711, "epoch": 2562} {"train_loss": -24.248205184936523, "global_step": 212712, "epoch": 2562} {"train_loss": -24.151723861694336, "global_step": 212713, "epoch": 2562} {"train_loss": -24.43879508972168, "global_step": 212714, "epoch": 2562} {"train_loss": -24.390600204467773, "global_step": 212715, "epoch": 2562} {"train_loss": -24.219133377075195, "global_step": 212716, "epoch": 2562} {"train_loss": -24.086963653564453, "global_step": 212717, "epoch": 2562} {"train_loss": -24.20210838317871, "global_step": 212718, "epoch": 2562} {"train_loss": -24.735036849975586, "global_step": 212719, "epoch": 2562} {"train_loss": -24.2717342376709, "global_step": 212720, "epoch": 2562} {"train_loss": -24.620019912719727, "global_step": 212721, "epoch": 2562} {"train_loss": -24.624900817871094, "global_step": 212722, "epoch": 2562} {"train_loss": -24.262699127197266, "global_step": 212723, "epoch": 2562} {"train_loss": -24.880949020385742, "global_step": 212724, "epoch": 2562} {"train_loss": -24.6005916595459, "global_step": 212725, "epoch": 2562} {"train_loss": -24.265195846557617, "global_step": 212726, "epoch": 2562} {"train_loss": -24.44317054748535, "global_step": 212727, "epoch": 2562} {"train_loss": -24.389550358416088, "global_step": 212728, "epoch": 2562, "val_loss": 6747484.5} {"train_loss": -23.52620506286621, "global_step": 212729, "epoch": 2563} {"train_loss": -24.054279327392578, "global_step": 212730, "epoch": 2563} {"train_loss": -24.11568260192871, "global_step": 212731, "epoch": 2563} {"train_loss": -24.386093139648438, "global_step": 212732, "epoch": 2563} {"train_loss": -24.24658203125, "global_step": 212733, "epoch": 2563} {"train_loss": -24.07965087890625, "global_step": 212734, "epoch": 2563} {"train_loss": -24.092844009399414, "global_step": 212735, "epoch": 2563} {"train_loss": -24.16054344177246, "global_step": 212736, "epoch": 2563} {"train_loss": -24.11517906188965, "global_step": 212737, "epoch": 2563} {"train_loss": -24.33985710144043, "global_step": 212738, "epoch": 2563} {"train_loss": -23.849990844726562, "global_step": 212739, "epoch": 2563} {"train_loss": -24.386411666870117, "global_step": 212740, "epoch": 2563} {"train_loss": -24.61566734313965, "global_step": 212741, "epoch": 2563} {"train_loss": -24.42069435119629, "global_step": 212742, "epoch": 2563} {"train_loss": -24.303728103637695, "global_step": 212743, "epoch": 2563} {"train_loss": -24.224836349487305, "global_step": 212744, "epoch": 2563} {"train_loss": -24.1318359375, "global_step": 212745, "epoch": 2563} {"train_loss": -24.25364875793457, "global_step": 212746, "epoch": 2563} {"train_loss": -24.269973754882812, "global_step": 212747, "epoch": 2563} {"train_loss": -24.706193923950195, "global_step": 212748, "epoch": 2563} {"train_loss": -24.60443687438965, "global_step": 212749, "epoch": 2563} {"train_loss": -24.423648834228516, "global_step": 212750, "epoch": 2563} {"train_loss": -24.37416648864746, "global_step": 212751, "epoch": 2563} {"train_loss": -24.490211486816406, "global_step": 212752, "epoch": 2563} {"train_loss": -24.166257858276367, "global_step": 212753, "epoch": 2563} {"train_loss": -24.16535758972168, "global_step": 212754, "epoch": 2563} {"train_loss": -24.49332618713379, "global_step": 212755, "epoch": 2563} {"train_loss": -24.26905632019043, "global_step": 212756, "epoch": 2563} {"train_loss": -24.529882431030273, "global_step": 212757, "epoch": 2563} {"train_loss": -23.995241165161133, "global_step": 212758, "epoch": 2563} {"train_loss": -24.550710678100586, "global_step": 212759, "epoch": 2563} {"train_loss": -24.297056198120117, "global_step": 212760, "epoch": 2563} {"train_loss": -24.056318283081055, "global_step": 212761, "epoch": 2563} {"train_loss": -24.595129013061523, "global_step": 212762, "epoch": 2563} {"train_loss": -24.579099655151367, "global_step": 212763, "epoch": 2563} {"train_loss": -24.18516731262207, "global_step": 212764, "epoch": 2563} {"train_loss": -24.540266036987305, "global_step": 212765, "epoch": 2563} {"train_loss": -24.652362823486328, "global_step": 212766, "epoch": 2563} {"train_loss": -24.39039421081543, "global_step": 212767, "epoch": 2563} {"train_loss": -24.259872436523438, "global_step": 212768, "epoch": 2563} {"train_loss": -24.290605545043945, "global_step": 212769, "epoch": 2563} {"train_loss": -24.06300926208496, "global_step": 212770, "epoch": 2563} {"train_loss": -24.58253288269043, "global_step": 212771, "epoch": 2563} {"train_loss": -24.44080924987793, "global_step": 212772, "epoch": 2563} {"train_loss": -24.582597732543945, "global_step": 212773, "epoch": 2563} {"train_loss": -24.455219268798828, "global_step": 212774, "epoch": 2563} {"train_loss": -24.574506759643555, "global_step": 212775, "epoch": 2563} {"train_loss": -24.424924850463867, "global_step": 212776, "epoch": 2563} {"train_loss": -24.07459259033203, "global_step": 212777, "epoch": 2563} {"train_loss": -24.12531089782715, "global_step": 212778, "epoch": 2563} {"train_loss": -25.016620635986328, "global_step": 212779, "epoch": 2563} {"train_loss": -24.60422706604004, "global_step": 212780, "epoch": 2563} {"train_loss": -24.119626998901367, "global_step": 212781, "epoch": 2563} {"train_loss": -24.2626895904541, "global_step": 212782, "epoch": 2563} {"train_loss": -24.646207809448242, "global_step": 212783, "epoch": 2563} {"train_loss": -24.7149715423584, "global_step": 212784, "epoch": 2563} {"train_loss": -24.584257125854492, "global_step": 212785, "epoch": 2563} {"train_loss": -24.456518173217773, "global_step": 212786, "epoch": 2563} {"train_loss": -24.68707847595215, "global_step": 212787, "epoch": 2563} {"train_loss": -24.57839012145996, "global_step": 212788, "epoch": 2563} {"train_loss": -24.17242431640625, "global_step": 212789, "epoch": 2563} {"train_loss": -24.40510368347168, "global_step": 212790, "epoch": 2563} {"train_loss": -24.624378204345703, "global_step": 212791, "epoch": 2563} {"train_loss": -24.615924835205078, "global_step": 212792, "epoch": 2563} {"train_loss": -24.47276496887207, "global_step": 212793, "epoch": 2563} {"train_loss": -24.48195457458496, "global_step": 212794, "epoch": 2563} {"train_loss": -24.04815673828125, "global_step": 212795, "epoch": 2563} {"train_loss": -24.399770736694336, "global_step": 212796, "epoch": 2563} {"train_loss": -24.599491119384766, "global_step": 212797, "epoch": 2563} {"train_loss": -24.599910736083984, "global_step": 212798, "epoch": 2563} {"train_loss": -24.708045959472656, "global_step": 212799, "epoch": 2563} {"train_loss": -24.507230758666992, "global_step": 212800, "epoch": 2563} {"train_loss": -24.70758628845215, "global_step": 212801, "epoch": 2563} {"train_loss": -24.526248931884766, "global_step": 212802, "epoch": 2563} {"train_loss": -24.352048873901367, "global_step": 212803, "epoch": 2563} {"train_loss": -24.74675178527832, "global_step": 212804, "epoch": 2563} {"train_loss": -24.880056381225586, "global_step": 212805, "epoch": 2563} {"train_loss": -24.818933486938477, "global_step": 212806, "epoch": 2563} {"train_loss": -24.594146728515625, "global_step": 212807, "epoch": 2563} {"train_loss": -24.217105865478516, "global_step": 212808, "epoch": 2563} {"train_loss": -24.840831756591797, "global_step": 212809, "epoch": 2563} {"train_loss": -24.31598472595215, "global_step": 212810, "epoch": 2563} {"train_loss": -24.419315567935804, "global_step": 212811, "epoch": 2563, "val_loss": 6891479.0} {"train_loss": -24.096290588378906, "global_step": 212812, "epoch": 2564} {"train_loss": -24.279104232788086, "global_step": 212813, "epoch": 2564} {"train_loss": -24.49971580505371, "global_step": 212814, "epoch": 2564} {"train_loss": -23.9307918548584, "global_step": 212815, "epoch": 2564} {"train_loss": -24.097959518432617, "global_step": 212816, "epoch": 2564} {"train_loss": -24.135446548461914, "global_step": 212817, "epoch": 2564} {"train_loss": -24.47221565246582, "global_step": 212818, "epoch": 2564} {"train_loss": -24.372426986694336, "global_step": 212819, "epoch": 2564} {"train_loss": -24.034971237182617, "global_step": 212820, "epoch": 2564} {"train_loss": -24.135208129882812, "global_step": 212821, "epoch": 2564} {"train_loss": -24.10972023010254, "global_step": 212822, "epoch": 2564} {"train_loss": -24.468290328979492, "global_step": 212823, "epoch": 2564} {"train_loss": -24.56838035583496, "global_step": 212824, "epoch": 2564} {"train_loss": -24.13909339904785, "global_step": 212825, "epoch": 2564} {"train_loss": -24.309890747070312, "global_step": 212826, "epoch": 2564} {"train_loss": -24.207151412963867, "global_step": 212827, "epoch": 2564} {"train_loss": -24.661699295043945, "global_step": 212828, "epoch": 2564} {"train_loss": -24.28084373474121, "global_step": 212829, "epoch": 2564} {"train_loss": -24.343244552612305, "global_step": 212830, "epoch": 2564} {"train_loss": -24.314865112304688, "global_step": 212831, "epoch": 2564} {"train_loss": -24.42045021057129, "global_step": 212832, "epoch": 2564} {"train_loss": -24.457727432250977, "global_step": 212833, "epoch": 2564} {"train_loss": -24.543344497680664, "global_step": 212834, "epoch": 2564} {"train_loss": -24.450523376464844, "global_step": 212835, "epoch": 2564} {"train_loss": -24.41493797302246, "global_step": 212836, "epoch": 2564} {"train_loss": -24.667129516601562, "global_step": 212837, "epoch": 2564} {"train_loss": -24.277021408081055, "global_step": 212838, "epoch": 2564} {"train_loss": -24.357725143432617, "global_step": 212839, "epoch": 2564} {"train_loss": -24.627471923828125, "global_step": 212840, "epoch": 2564} {"train_loss": -24.54935646057129, "global_step": 212841, "epoch": 2564} {"train_loss": -24.418455123901367, "global_step": 212842, "epoch": 2564} {"train_loss": -24.394704818725586, "global_step": 212843, "epoch": 2564} {"train_loss": -24.751157760620117, "global_step": 212844, "epoch": 2564} {"train_loss": -24.47992706298828, "global_step": 212845, "epoch": 2564} {"train_loss": -24.47725486755371, "global_step": 212846, "epoch": 2564} {"train_loss": -24.598129272460938, "global_step": 212847, "epoch": 2564} {"train_loss": -24.65555763244629, "global_step": 212848, "epoch": 2564} {"train_loss": -24.581806182861328, "global_step": 212849, "epoch": 2564} {"train_loss": -24.22381019592285, "global_step": 212850, "epoch": 2564} {"train_loss": -24.851032257080078, "global_step": 212851, "epoch": 2564} {"train_loss": -24.439382553100586, "global_step": 212852, "epoch": 2564} {"train_loss": -24.24032974243164, "global_step": 212853, "epoch": 2564} {"train_loss": -24.37106704711914, "global_step": 212854, "epoch": 2564} {"train_loss": -24.60723304748535, "global_step": 212855, "epoch": 2564} {"train_loss": -24.638418197631836, "global_step": 212856, "epoch": 2564} {"train_loss": -24.177169799804688, "global_step": 212857, "epoch": 2564} {"train_loss": -24.443660736083984, "global_step": 212858, "epoch": 2564} {"train_loss": -24.02852439880371, "global_step": 212859, "epoch": 2564} {"train_loss": -24.56069564819336, "global_step": 212860, "epoch": 2564} {"train_loss": -24.367563247680664, "global_step": 212861, "epoch": 2564} {"train_loss": -24.283170700073242, "global_step": 212862, "epoch": 2564} {"train_loss": -24.436620712280273, "global_step": 212863, "epoch": 2564} {"train_loss": -24.470373153686523, "global_step": 212864, "epoch": 2564} {"train_loss": -24.618253707885742, "global_step": 212865, "epoch": 2564} {"train_loss": -24.719379425048828, "global_step": 212866, "epoch": 2564} {"train_loss": -24.371007919311523, "global_step": 212867, "epoch": 2564} {"train_loss": -24.493301391601562, "global_step": 212868, "epoch": 2564} {"train_loss": -24.641218185424805, "global_step": 212869, "epoch": 2564} {"train_loss": -24.124204635620117, "global_step": 212870, "epoch": 2564} {"train_loss": -24.374835968017578, "global_step": 212871, "epoch": 2564} {"train_loss": -24.799863815307617, "global_step": 212872, "epoch": 2564} {"train_loss": -24.538251876831055, "global_step": 212873, "epoch": 2564} {"train_loss": -24.357694625854492, "global_step": 212874, "epoch": 2564} {"train_loss": -24.815061569213867, "global_step": 212875, "epoch": 2564} {"train_loss": -24.486345291137695, "global_step": 212876, "epoch": 2564} {"train_loss": -24.484922409057617, "global_step": 212877, "epoch": 2564} {"train_loss": -25.08989906311035, "global_step": 212878, "epoch": 2564} {"train_loss": -24.332761764526367, "global_step": 212879, "epoch": 2564} {"train_loss": -24.6245059967041, "global_step": 212880, "epoch": 2564} {"train_loss": -24.507131576538086, "global_step": 212881, "epoch": 2564} {"train_loss": -24.0517520904541, "global_step": 212882, "epoch": 2564} {"train_loss": -24.32440185546875, "global_step": 212883, "epoch": 2564} {"train_loss": -24.445453643798828, "global_step": 212884, "epoch": 2564} {"train_loss": -24.477975845336914, "global_step": 212885, "epoch": 2564} {"train_loss": -24.31096839904785, "global_step": 212886, "epoch": 2564} {"train_loss": -24.404361724853516, "global_step": 212887, "epoch": 2564} {"train_loss": -24.29483985900879, "global_step": 212888, "epoch": 2564} {"train_loss": -24.4003963470459, "global_step": 212889, "epoch": 2564} {"train_loss": -24.448705673217773, "global_step": 212890, "epoch": 2564} {"train_loss": -24.428491592407227, "global_step": 212891, "epoch": 2564} {"train_loss": -24.243085861206055, "global_step": 212892, "epoch": 2564} {"train_loss": -24.92828941345215, "global_step": 212893, "epoch": 2564} {"train_loss": -24.426854282976635, "global_step": 212894, "epoch": 2564, "val_loss": 6472670.0} {"train_loss": -23.734548568725586, "global_step": 212895, "epoch": 2565} {"train_loss": -23.80183219909668, "global_step": 212896, "epoch": 2565} {"train_loss": -23.3868465423584, "global_step": 212897, "epoch": 2565} {"train_loss": -23.463397979736328, "global_step": 212898, "epoch": 2565} {"train_loss": -24.06178855895996, "global_step": 212899, "epoch": 2565} {"train_loss": -23.41320037841797, "global_step": 212900, "epoch": 2565} {"train_loss": -23.45196533203125, "global_step": 212901, "epoch": 2565} {"train_loss": -23.875934600830078, "global_step": 212902, "epoch": 2565} {"train_loss": -23.516626358032227, "global_step": 212903, "epoch": 2565} {"train_loss": -23.924283981323242, "global_step": 212904, "epoch": 2565} {"train_loss": -23.668182373046875, "global_step": 212905, "epoch": 2565} {"train_loss": -23.83280372619629, "global_step": 212906, "epoch": 2565} {"train_loss": -24.0914363861084, "global_step": 212907, "epoch": 2565} {"train_loss": -23.537250518798828, "global_step": 212908, "epoch": 2565} {"train_loss": -23.963464736938477, "global_step": 212909, "epoch": 2565} {"train_loss": -23.76816177368164, "global_step": 212910, "epoch": 2565} {"train_loss": -24.364418029785156, "global_step": 212911, "epoch": 2565} {"train_loss": -24.0621395111084, "global_step": 212912, "epoch": 2565} {"train_loss": -23.98548698425293, "global_step": 212913, "epoch": 2565} {"train_loss": -24.011972427368164, "global_step": 212914, "epoch": 2565} {"train_loss": -24.103153228759766, "global_step": 212915, "epoch": 2565} {"train_loss": -24.430631637573242, "global_step": 212916, "epoch": 2565} {"train_loss": -24.228078842163086, "global_step": 212917, "epoch": 2565} {"train_loss": -24.476959228515625, "global_step": 212918, "epoch": 2565} {"train_loss": -24.554296493530273, "global_step": 212919, "epoch": 2565} {"train_loss": -24.311073303222656, "global_step": 212920, "epoch": 2565} {"train_loss": -24.058927536010742, "global_step": 212921, "epoch": 2565} {"train_loss": -24.49540138244629, "global_step": 212922, "epoch": 2565} {"train_loss": -24.231924057006836, "global_step": 212923, "epoch": 2565} {"train_loss": -24.532421112060547, "global_step": 212924, "epoch": 2565} {"train_loss": -24.420194625854492, "global_step": 212925, "epoch": 2565} {"train_loss": -24.502012252807617, "global_step": 212926, "epoch": 2565} {"train_loss": -24.355985641479492, "global_step": 212927, "epoch": 2565} {"train_loss": -24.338077545166016, "global_step": 212928, "epoch": 2565} {"train_loss": -24.435449600219727, "global_step": 212929, "epoch": 2565} {"train_loss": -24.445707321166992, "global_step": 212930, "epoch": 2565} {"train_loss": -24.638181686401367, "global_step": 212931, "epoch": 2565} {"train_loss": -24.19069480895996, "global_step": 212932, "epoch": 2565} {"train_loss": -24.414358139038086, "global_step": 212933, "epoch": 2565} {"train_loss": -24.660614013671875, "global_step": 212934, "epoch": 2565} {"train_loss": -24.43245506286621, "global_step": 212935, "epoch": 2565} {"train_loss": -24.821237564086914, "global_step": 212936, "epoch": 2565} {"train_loss": -24.419065475463867, "global_step": 212937, "epoch": 2565} {"train_loss": -24.4686279296875, "global_step": 212938, "epoch": 2565} {"train_loss": -24.20997428894043, "global_step": 212939, "epoch": 2565} {"train_loss": -24.432781219482422, "global_step": 212940, "epoch": 2565} {"train_loss": -23.97051429748535, "global_step": 212941, "epoch": 2565} {"train_loss": -24.654285430908203, "global_step": 212942, "epoch": 2565} {"train_loss": -24.67225456237793, "global_step": 212943, "epoch": 2565} {"train_loss": -24.165348052978516, "global_step": 212944, "epoch": 2565} {"train_loss": -24.666349411010742, "global_step": 212945, "epoch": 2565} {"train_loss": -24.50663185119629, "global_step": 212946, "epoch": 2565} {"train_loss": -24.69827651977539, "global_step": 212947, "epoch": 2565} {"train_loss": -24.437414169311523, "global_step": 212948, "epoch": 2565} {"train_loss": -24.58030128479004, "global_step": 212949, "epoch": 2565} {"train_loss": -24.82862663269043, "global_step": 212950, "epoch": 2565} {"train_loss": -24.548381805419922, "global_step": 212951, "epoch": 2565} {"train_loss": -24.71917152404785, "global_step": 212952, "epoch": 2565} {"train_loss": -24.754785537719727, "global_step": 212953, "epoch": 2565} {"train_loss": -24.18805503845215, "global_step": 212954, "epoch": 2565} {"train_loss": -24.538837432861328, "global_step": 212955, "epoch": 2565} {"train_loss": -24.381250381469727, "global_step": 212956, "epoch": 2565} {"train_loss": -24.726097106933594, "global_step": 212957, "epoch": 2565} {"train_loss": -24.369977951049805, "global_step": 212958, "epoch": 2565} {"train_loss": -24.55308723449707, "global_step": 212959, "epoch": 2565} {"train_loss": -24.652965545654297, "global_step": 212960, "epoch": 2565} {"train_loss": -24.608901977539062, "global_step": 212961, "epoch": 2565} {"train_loss": -24.062917709350586, "global_step": 212962, "epoch": 2565} {"train_loss": -24.56080436706543, "global_step": 212963, "epoch": 2565} {"train_loss": -24.606975555419922, "global_step": 212964, "epoch": 2565} {"train_loss": -24.130868911743164, "global_step": 212965, "epoch": 2565} {"train_loss": -24.435415267944336, "global_step": 212966, "epoch": 2565} {"train_loss": -24.519981384277344, "global_step": 212967, "epoch": 2565} {"train_loss": -24.721393585205078, "global_step": 212968, "epoch": 2565} {"train_loss": -24.312835693359375, "global_step": 212969, "epoch": 2565} {"train_loss": -24.49281883239746, "global_step": 212970, "epoch": 2565} {"train_loss": -24.21491050720215, "global_step": 212971, "epoch": 2565} {"train_loss": -24.617769241333008, "global_step": 212972, "epoch": 2565} {"train_loss": -24.66481590270996, "global_step": 212973, "epoch": 2565} {"train_loss": -24.782482147216797, "global_step": 212974, "epoch": 2565} {"train_loss": -24.695995330810547, "global_step": 212975, "epoch": 2565} {"train_loss": -24.609926223754883, "global_step": 212976, "epoch": 2565} {"train_loss": -24.304273214684912, "global_step": 212977, "epoch": 2565, "val_loss": 6640514.0} {"train_loss": -24.12458038330078, "global_step": 212978, "epoch": 2566} {"train_loss": -24.34649658203125, "global_step": 212979, "epoch": 2566} {"train_loss": -23.848989486694336, "global_step": 212980, "epoch": 2566} {"train_loss": -24.418832778930664, "global_step": 212981, "epoch": 2566} {"train_loss": -24.117197036743164, "global_step": 212982, "epoch": 2566} {"train_loss": -24.377431869506836, "global_step": 212983, "epoch": 2566} {"train_loss": -24.216297149658203, "global_step": 212984, "epoch": 2566} {"train_loss": -24.138900756835938, "global_step": 212985, "epoch": 2566} {"train_loss": -24.240415573120117, "global_step": 212986, "epoch": 2566} {"train_loss": -24.1883602142334, "global_step": 212987, "epoch": 2566} {"train_loss": -24.061105728149414, "global_step": 212988, "epoch": 2566} {"train_loss": -24.27420425415039, "global_step": 212989, "epoch": 2566} {"train_loss": -24.531442642211914, "global_step": 212990, "epoch": 2566} {"train_loss": -24.663053512573242, "global_step": 212991, "epoch": 2566} {"train_loss": -24.35722541809082, "global_step": 212992, "epoch": 2566} {"train_loss": -24.68499183654785, "global_step": 212993, "epoch": 2566} {"train_loss": -24.42176628112793, "global_step": 212994, "epoch": 2566} {"train_loss": -24.500699996948242, "global_step": 212995, "epoch": 2566} {"train_loss": -24.581308364868164, "global_step": 212996, "epoch": 2566} {"train_loss": -24.439809799194336, "global_step": 212997, "epoch": 2566} {"train_loss": -24.530960083007812, "global_step": 212998, "epoch": 2566} {"train_loss": -24.54719352722168, "global_step": 212999, "epoch": 2566} {"train_loss": -24.5527400970459, "global_step": 213000, "epoch": 2566} {"train_loss": -24.525596618652344, "global_step": 213001, "epoch": 2566} {"train_loss": -24.604433059692383, "global_step": 213002, "epoch": 2566} {"train_loss": -24.5621395111084, "global_step": 213003, "epoch": 2566} {"train_loss": -24.744775772094727, "global_step": 213004, "epoch": 2566} {"train_loss": -24.69405174255371, "global_step": 213005, "epoch": 2566} {"train_loss": -24.728883743286133, "global_step": 213006, "epoch": 2566} {"train_loss": -24.080387115478516, "global_step": 213007, "epoch": 2566} {"train_loss": -24.728195190429688, "global_step": 213008, "epoch": 2566} {"train_loss": -24.5538330078125, "global_step": 213009, "epoch": 2566} {"train_loss": -24.61517906188965, "global_step": 213010, "epoch": 2566} {"train_loss": -24.7294979095459, "global_step": 213011, "epoch": 2566} {"train_loss": -24.60393714904785, "global_step": 213012, "epoch": 2566} {"train_loss": -24.59950828552246, "global_step": 213013, "epoch": 2566} {"train_loss": -24.838773727416992, "global_step": 213014, "epoch": 2566} {"train_loss": -24.85578727722168, "global_step": 213015, "epoch": 2566} {"train_loss": -24.904403686523438, "global_step": 213016, "epoch": 2566} {"train_loss": -25.011268615722656, "global_step": 213017, "epoch": 2566} {"train_loss": -24.28940773010254, "global_step": 213018, "epoch": 2566} {"train_loss": -24.326160430908203, "global_step": 213019, "epoch": 2566} {"train_loss": -24.142353057861328, "global_step": 213020, "epoch": 2566} {"train_loss": -24.070165634155273, "global_step": 213021, "epoch": 2566} {"train_loss": -23.8923397064209, "global_step": 213022, "epoch": 2566} {"train_loss": -24.680185317993164, "global_step": 213023, "epoch": 2566} {"train_loss": -24.506040573120117, "global_step": 213024, "epoch": 2566} {"train_loss": -23.915355682373047, "global_step": 213025, "epoch": 2566} {"train_loss": -24.054555892944336, "global_step": 213026, "epoch": 2566} {"train_loss": -24.144193649291992, "global_step": 213027, "epoch": 2566} {"train_loss": -24.613788604736328, "global_step": 213028, "epoch": 2566} {"train_loss": -24.024770736694336, "global_step": 213029, "epoch": 2566} {"train_loss": -24.06937026977539, "global_step": 213030, "epoch": 2566} {"train_loss": -24.439851760864258, "global_step": 213031, "epoch": 2566} {"train_loss": -24.081693649291992, "global_step": 213032, "epoch": 2566} {"train_loss": -24.20734977722168, "global_step": 213033, "epoch": 2566} {"train_loss": -24.548702239990234, "global_step": 213034, "epoch": 2566} {"train_loss": -24.718067169189453, "global_step": 213035, "epoch": 2566} {"train_loss": -24.632347106933594, "global_step": 213036, "epoch": 2566} {"train_loss": -24.511104583740234, "global_step": 213037, "epoch": 2566} {"train_loss": -24.36191749572754, "global_step": 213038, "epoch": 2566} {"train_loss": -24.34002113342285, "global_step": 213039, "epoch": 2566} {"train_loss": -24.73248863220215, "global_step": 213040, "epoch": 2566} {"train_loss": -24.374679565429688, "global_step": 213041, "epoch": 2566} {"train_loss": -24.233566284179688, "global_step": 213042, "epoch": 2566} {"train_loss": -24.877216339111328, "global_step": 213043, "epoch": 2566} {"train_loss": -24.723913192749023, "global_step": 213044, "epoch": 2566} {"train_loss": -24.46246337890625, "global_step": 213045, "epoch": 2566} {"train_loss": -24.34169578552246, "global_step": 213046, "epoch": 2566} {"train_loss": -24.496417999267578, "global_step": 213047, "epoch": 2566} {"train_loss": -24.540037155151367, "global_step": 213048, "epoch": 2566} {"train_loss": -24.650192260742188, "global_step": 213049, "epoch": 2566} {"train_loss": -24.33055877685547, "global_step": 213050, "epoch": 2566} {"train_loss": -24.194677352905273, "global_step": 213051, "epoch": 2566} {"train_loss": -24.25398063659668, "global_step": 213052, "epoch": 2566} {"train_loss": -24.404598236083984, "global_step": 213053, "epoch": 2566} {"train_loss": -24.346620559692383, "global_step": 213054, "epoch": 2566} {"train_loss": -24.640472412109375, "global_step": 213055, "epoch": 2566} {"train_loss": -24.84495735168457, "global_step": 213056, "epoch": 2566} {"train_loss": -24.341434478759766, "global_step": 213057, "epoch": 2566} {"train_loss": -23.974552154541016, "global_step": 213058, "epoch": 2566} {"train_loss": -24.665746688842773, "global_step": 213059, "epoch": 2566} {"train_loss": -24.443608594227985, "global_step": 213060, "epoch": 2566, "val_loss": 6642717.0} {"train_loss": -24.334569931030273, "global_step": 213061, "epoch": 2567} {"train_loss": -24.17713737487793, "global_step": 213062, "epoch": 2567} {"train_loss": -23.987546920776367, "global_step": 213063, "epoch": 2567} {"train_loss": -24.712392807006836, "global_step": 213064, "epoch": 2567} {"train_loss": -24.12657356262207, "global_step": 213065, "epoch": 2567} {"train_loss": -24.255573272705078, "global_step": 213066, "epoch": 2567} {"train_loss": -24.599227905273438, "global_step": 213067, "epoch": 2567} {"train_loss": -24.026575088500977, "global_step": 213068, "epoch": 2567} {"train_loss": -24.084447860717773, "global_step": 213069, "epoch": 2567} {"train_loss": -24.570423126220703, "global_step": 213070, "epoch": 2567} {"train_loss": -24.188478469848633, "global_step": 213071, "epoch": 2567} {"train_loss": -24.41948127746582, "global_step": 213072, "epoch": 2567} {"train_loss": -24.82927894592285, "global_step": 213073, "epoch": 2567} {"train_loss": -24.38948631286621, "global_step": 213074, "epoch": 2567} {"train_loss": -24.647878646850586, "global_step": 213075, "epoch": 2567} {"train_loss": -24.421772003173828, "global_step": 213076, "epoch": 2567} {"train_loss": -24.393798828125, "global_step": 213077, "epoch": 2567} {"train_loss": -24.888137817382812, "global_step": 213078, "epoch": 2567} {"train_loss": -24.459035873413086, "global_step": 213079, "epoch": 2567} {"train_loss": -24.64207649230957, "global_step": 213080, "epoch": 2567} {"train_loss": -24.260791778564453, "global_step": 213081, "epoch": 2567} {"train_loss": -24.464731216430664, "global_step": 213082, "epoch": 2567} {"train_loss": -24.703824996948242, "global_step": 213083, "epoch": 2567} {"train_loss": -24.230724334716797, "global_step": 213084, "epoch": 2567} {"train_loss": -24.600101470947266, "global_step": 213085, "epoch": 2567} {"train_loss": -24.404504776000977, "global_step": 213086, "epoch": 2567} {"train_loss": -24.276670455932617, "global_step": 213087, "epoch": 2567} {"train_loss": -24.31747055053711, "global_step": 213088, "epoch": 2567} {"train_loss": -24.45026969909668, "global_step": 213089, "epoch": 2567} {"train_loss": -24.66106414794922, "global_step": 213090, "epoch": 2567} {"train_loss": -24.31599235534668, "global_step": 213091, "epoch": 2567} {"train_loss": -24.36714744567871, "global_step": 213092, "epoch": 2567} {"train_loss": -24.672101974487305, "global_step": 213093, "epoch": 2567} {"train_loss": -24.464059829711914, "global_step": 213094, "epoch": 2567} {"train_loss": -24.68471336364746, "global_step": 213095, "epoch": 2567} {"train_loss": -24.299699783325195, "global_step": 213096, "epoch": 2567} {"train_loss": -23.76092529296875, "global_step": 213097, "epoch": 2567} {"train_loss": -24.43548583984375, "global_step": 213098, "epoch": 2567} {"train_loss": -24.041156768798828, "global_step": 213099, "epoch": 2567} {"train_loss": -24.499332427978516, "global_step": 213100, "epoch": 2567} {"train_loss": -24.215564727783203, "global_step": 213101, "epoch": 2567} {"train_loss": -24.56634521484375, "global_step": 213102, "epoch": 2567} {"train_loss": -24.221027374267578, "global_step": 213103, "epoch": 2567} {"train_loss": -24.33966064453125, "global_step": 213104, "epoch": 2567} {"train_loss": -24.04087257385254, "global_step": 213105, "epoch": 2567} {"train_loss": -24.239028930664062, "global_step": 213106, "epoch": 2567} {"train_loss": -24.69053840637207, "global_step": 213107, "epoch": 2567} {"train_loss": -24.413837432861328, "global_step": 213108, "epoch": 2567} {"train_loss": -24.421186447143555, "global_step": 213109, "epoch": 2567} {"train_loss": -24.423202514648438, "global_step": 213110, "epoch": 2567} {"train_loss": -24.602710723876953, "global_step": 213111, "epoch": 2567} {"train_loss": -24.425458908081055, "global_step": 213112, "epoch": 2567} {"train_loss": -25.048341751098633, "global_step": 213113, "epoch": 2567} {"train_loss": -24.29227638244629, "global_step": 213114, "epoch": 2567} {"train_loss": -24.188617706298828, "global_step": 213115, "epoch": 2567} {"train_loss": -24.335119247436523, "global_step": 213116, "epoch": 2567} {"train_loss": -24.414608001708984, "global_step": 213117, "epoch": 2567} {"train_loss": -24.37087059020996, "global_step": 213118, "epoch": 2567} {"train_loss": -24.483976364135742, "global_step": 213119, "epoch": 2567} {"train_loss": -24.25760269165039, "global_step": 213120, "epoch": 2567} {"train_loss": -24.74726676940918, "global_step": 213121, "epoch": 2567} {"train_loss": -24.437665939331055, "global_step": 213122, "epoch": 2567} {"train_loss": -24.476858139038086, "global_step": 213123, "epoch": 2567} {"train_loss": -24.255334854125977, "global_step": 213124, "epoch": 2567} {"train_loss": -24.23292350769043, "global_step": 213125, "epoch": 2567} {"train_loss": -24.66217041015625, "global_step": 213126, "epoch": 2567} {"train_loss": -24.249357223510742, "global_step": 213127, "epoch": 2567} {"train_loss": -24.398395538330078, "global_step": 213128, "epoch": 2567} {"train_loss": -24.515792846679688, "global_step": 213129, "epoch": 2567} {"train_loss": -24.655488967895508, "global_step": 213130, "epoch": 2567} {"train_loss": -24.379337310791016, "global_step": 213131, "epoch": 2567} {"train_loss": -24.69428825378418, "global_step": 213132, "epoch": 2567} {"train_loss": -24.515064239501953, "global_step": 213133, "epoch": 2567} {"train_loss": -24.4879207611084, "global_step": 213134, "epoch": 2567} {"train_loss": -24.779279708862305, "global_step": 213135, "epoch": 2567} {"train_loss": -24.32568359375, "global_step": 213136, "epoch": 2567} {"train_loss": -25.048885345458984, "global_step": 213137, "epoch": 2567} {"train_loss": -24.59092140197754, "global_step": 213138, "epoch": 2567} {"train_loss": -24.358366012573242, "global_step": 213139, "epoch": 2567} {"train_loss": -24.36256217956543, "global_step": 213140, "epoch": 2567} {"train_loss": -24.222370147705078, "global_step": 213141, "epoch": 2567} {"train_loss": -24.658523559570312, "global_step": 213142, "epoch": 2567} {"train_loss": -24.425805126328065, "global_step": 213143, "epoch": 2567, "val_loss": 6560997.0} {"train_loss": -23.962953567504883, "global_step": 213144, "epoch": 2568} {"train_loss": -23.657896041870117, "global_step": 213145, "epoch": 2568} {"train_loss": -23.774616241455078, "global_step": 213146, "epoch": 2568} {"train_loss": -24.504018783569336, "global_step": 213147, "epoch": 2568} {"train_loss": -24.311248779296875, "global_step": 213148, "epoch": 2568} {"train_loss": -24.208974838256836, "global_step": 213149, "epoch": 2568} {"train_loss": -24.5513973236084, "global_step": 213150, "epoch": 2568} {"train_loss": -24.60070037841797, "global_step": 213151, "epoch": 2568} {"train_loss": -24.126188278198242, "global_step": 213152, "epoch": 2568} {"train_loss": -24.05255889892578, "global_step": 213153, "epoch": 2568} {"train_loss": -24.381942749023438, "global_step": 213154, "epoch": 2568} {"train_loss": -24.501150131225586, "global_step": 213155, "epoch": 2568} {"train_loss": -24.291717529296875, "global_step": 213156, "epoch": 2568} {"train_loss": -24.193256378173828, "global_step": 213157, "epoch": 2568} {"train_loss": -24.2762508392334, "global_step": 213158, "epoch": 2568} {"train_loss": -24.444589614868164, "global_step": 213159, "epoch": 2568} {"train_loss": -24.231077194213867, "global_step": 213160, "epoch": 2568} {"train_loss": -24.337574005126953, "global_step": 213161, "epoch": 2568} {"train_loss": -24.740108489990234, "global_step": 213162, "epoch": 2568} {"train_loss": -24.445295333862305, "global_step": 213163, "epoch": 2568} {"train_loss": -24.227066040039062, "global_step": 213164, "epoch": 2568} {"train_loss": -24.483882904052734, "global_step": 213165, "epoch": 2568} {"train_loss": -23.909046173095703, "global_step": 213166, "epoch": 2568} {"train_loss": -24.329660415649414, "global_step": 213167, "epoch": 2568} {"train_loss": -24.287160873413086, "global_step": 213168, "epoch": 2568} {"train_loss": -23.94826316833496, "global_step": 213169, "epoch": 2568} {"train_loss": -24.36173439025879, "global_step": 213170, "epoch": 2568} {"train_loss": -24.387136459350586, "global_step": 213171, "epoch": 2568} {"train_loss": -24.598623275756836, "global_step": 213172, "epoch": 2568} {"train_loss": -24.425199508666992, "global_step": 213173, "epoch": 2568} {"train_loss": -24.273021697998047, "global_step": 213174, "epoch": 2568} {"train_loss": -24.322647094726562, "global_step": 213175, "epoch": 2568} {"train_loss": -24.32893180847168, "global_step": 213176, "epoch": 2568} {"train_loss": -24.738544464111328, "global_step": 213177, "epoch": 2568} {"train_loss": -24.205284118652344, "global_step": 213178, "epoch": 2568} {"train_loss": -24.278512954711914, "global_step": 213179, "epoch": 2568} {"train_loss": -24.604177474975586, "global_step": 213180, "epoch": 2568} {"train_loss": -24.5664119720459, "global_step": 213181, "epoch": 2568} {"train_loss": -24.47739028930664, "global_step": 213182, "epoch": 2568} {"train_loss": -24.996784210205078, "global_step": 213183, "epoch": 2568} {"train_loss": -24.479511260986328, "global_step": 213184, "epoch": 2568} {"train_loss": -24.517919540405273, "global_step": 213185, "epoch": 2568} {"train_loss": -24.553855895996094, "global_step": 213186, "epoch": 2568} {"train_loss": -24.587366104125977, "global_step": 213187, "epoch": 2568} {"train_loss": -24.513296127319336, "global_step": 213188, "epoch": 2568} {"train_loss": -24.407550811767578, "global_step": 213189, "epoch": 2568} {"train_loss": -24.51154899597168, "global_step": 213190, "epoch": 2568} {"train_loss": -24.5428524017334, "global_step": 213191, "epoch": 2568} {"train_loss": -24.38469696044922, "global_step": 213192, "epoch": 2568} {"train_loss": -24.438100814819336, "global_step": 213193, "epoch": 2568} {"train_loss": -24.322107315063477, "global_step": 213194, "epoch": 2568} {"train_loss": -24.586339950561523, "global_step": 213195, "epoch": 2568} {"train_loss": -24.91383171081543, "global_step": 213196, "epoch": 2568} {"train_loss": -24.665252685546875, "global_step": 213197, "epoch": 2568} {"train_loss": -24.6264591217041, "global_step": 213198, "epoch": 2568} {"train_loss": -24.215784072875977, "global_step": 213199, "epoch": 2568} {"train_loss": -24.63176155090332, "global_step": 213200, "epoch": 2568} {"train_loss": -24.59535789489746, "global_step": 213201, "epoch": 2568} {"train_loss": -24.407764434814453, "global_step": 213202, "epoch": 2568} {"train_loss": -24.404865264892578, "global_step": 213203, "epoch": 2568} {"train_loss": -24.33702278137207, "global_step": 213204, "epoch": 2568} {"train_loss": -24.371259689331055, "global_step": 213205, "epoch": 2568} {"train_loss": -24.675067901611328, "global_step": 213206, "epoch": 2568} {"train_loss": -23.8783016204834, "global_step": 213207, "epoch": 2568} {"train_loss": -24.618282318115234, "global_step": 213208, "epoch": 2568} {"train_loss": -24.603132247924805, "global_step": 213209, "epoch": 2568} {"train_loss": -24.759113311767578, "global_step": 213210, "epoch": 2568} {"train_loss": -24.409107208251953, "global_step": 213211, "epoch": 2568} {"train_loss": -24.399503707885742, "global_step": 213212, "epoch": 2568} {"train_loss": -24.774307250976562, "global_step": 213213, "epoch": 2568} {"train_loss": -24.328048706054688, "global_step": 213214, "epoch": 2568} {"train_loss": -24.67421531677246, "global_step": 213215, "epoch": 2568} {"train_loss": -24.575057983398438, "global_step": 213216, "epoch": 2568} {"train_loss": -24.28879165649414, "global_step": 213217, "epoch": 2568} {"train_loss": -24.497770309448242, "global_step": 213218, "epoch": 2568} {"train_loss": -24.427953720092773, "global_step": 213219, "epoch": 2568} {"train_loss": -24.40973472595215, "global_step": 213220, "epoch": 2568} {"train_loss": -24.788930892944336, "global_step": 213221, "epoch": 2568} {"train_loss": -24.994653701782227, "global_step": 213222, "epoch": 2568} {"train_loss": -24.51593017578125, "global_step": 213223, "epoch": 2568} {"train_loss": -24.720569610595703, "global_step": 213224, "epoch": 2568} {"train_loss": -24.326658248901367, "global_step": 213225, "epoch": 2568} {"train_loss": -24.42478742944189, "global_step": 213226, "epoch": 2568, "val_loss": 6621066.5} {"train_loss": -23.982250213623047, "global_step": 213227, "epoch": 2569} {"train_loss": -23.936237335205078, "global_step": 213228, "epoch": 2569} {"train_loss": -24.647924423217773, "global_step": 213229, "epoch": 2569} {"train_loss": -24.339500427246094, "global_step": 213230, "epoch": 2569} {"train_loss": -24.478107452392578, "global_step": 213231, "epoch": 2569} {"train_loss": -23.859149932861328, "global_step": 213232, "epoch": 2569} {"train_loss": -23.929058074951172, "global_step": 213233, "epoch": 2569} {"train_loss": -24.12404441833496, "global_step": 213234, "epoch": 2569} {"train_loss": -23.845230102539062, "global_step": 213235, "epoch": 2569} {"train_loss": -24.33927345275879, "global_step": 213236, "epoch": 2569} {"train_loss": -24.1544132232666, "global_step": 213237, "epoch": 2569} {"train_loss": -24.029699325561523, "global_step": 213238, "epoch": 2569} {"train_loss": -24.066442489624023, "global_step": 213239, "epoch": 2569} {"train_loss": -24.3734188079834, "global_step": 213240, "epoch": 2569} {"train_loss": -24.331323623657227, "global_step": 213241, "epoch": 2569} {"train_loss": -24.381528854370117, "global_step": 213242, "epoch": 2569} {"train_loss": -24.714187622070312, "global_step": 213243, "epoch": 2569} {"train_loss": -24.406415939331055, "global_step": 213244, "epoch": 2569} {"train_loss": -24.408937454223633, "global_step": 213245, "epoch": 2569} {"train_loss": -24.546154022216797, "global_step": 213246, "epoch": 2569} {"train_loss": -24.52587127685547, "global_step": 213247, "epoch": 2569} {"train_loss": -24.523574829101562, "global_step": 213248, "epoch": 2569} {"train_loss": -24.597684860229492, "global_step": 213249, "epoch": 2569} {"train_loss": -24.27836036682129, "global_step": 213250, "epoch": 2569} {"train_loss": -24.481046676635742, "global_step": 213251, "epoch": 2569} {"train_loss": -24.24765968322754, "global_step": 213252, "epoch": 2569} {"train_loss": -24.633167266845703, "global_step": 213253, "epoch": 2569} {"train_loss": -24.137758255004883, "global_step": 213254, "epoch": 2569} {"train_loss": -24.527755737304688, "global_step": 213255, "epoch": 2569} {"train_loss": -24.54277229309082, "global_step": 213256, "epoch": 2569} {"train_loss": -24.4453067779541, "global_step": 213257, "epoch": 2569} {"train_loss": -24.431324005126953, "global_step": 213258, "epoch": 2569} {"train_loss": -24.570728302001953, "global_step": 213259, "epoch": 2569} {"train_loss": -24.85931968688965, "global_step": 213260, "epoch": 2569} {"train_loss": -24.49151039123535, "global_step": 213261, "epoch": 2569} {"train_loss": -24.353422164916992, "global_step": 213262, "epoch": 2569} {"train_loss": -24.6237735748291, "global_step": 213263, "epoch": 2569} {"train_loss": -24.795392990112305, "global_step": 213264, "epoch": 2569} {"train_loss": -24.676847457885742, "global_step": 213265, "epoch": 2569} {"train_loss": -24.467586517333984, "global_step": 213266, "epoch": 2569} {"train_loss": -24.620990753173828, "global_step": 213267, "epoch": 2569} {"train_loss": -24.159597396850586, "global_step": 213268, "epoch": 2569} {"train_loss": -24.726945877075195, "global_step": 213269, "epoch": 2569} {"train_loss": -24.403289794921875, "global_step": 213270, "epoch": 2569} {"train_loss": -24.425485610961914, "global_step": 213271, "epoch": 2569} {"train_loss": -24.525012969970703, "global_step": 213272, "epoch": 2569} {"train_loss": -24.477415084838867, "global_step": 213273, "epoch": 2569} {"train_loss": -24.408178329467773, "global_step": 213274, "epoch": 2569} {"train_loss": -24.218276977539062, "global_step": 213275, "epoch": 2569} {"train_loss": -24.102252960205078, "global_step": 213276, "epoch": 2569} {"train_loss": -23.97517967224121, "global_step": 213277, "epoch": 2569} {"train_loss": -24.369136810302734, "global_step": 213278, "epoch": 2569} {"train_loss": -24.787351608276367, "global_step": 213279, "epoch": 2569} {"train_loss": -24.136320114135742, "global_step": 213280, "epoch": 2569} {"train_loss": -24.017030715942383, "global_step": 213281, "epoch": 2569} {"train_loss": -24.62495994567871, "global_step": 213282, "epoch": 2569} {"train_loss": -24.251941680908203, "global_step": 213283, "epoch": 2569} {"train_loss": -24.086240768432617, "global_step": 213284, "epoch": 2569} {"train_loss": -24.350675582885742, "global_step": 213285, "epoch": 2569} {"train_loss": -24.28089141845703, "global_step": 213286, "epoch": 2569} {"train_loss": -24.285785675048828, "global_step": 213287, "epoch": 2569} {"train_loss": -24.30940055847168, "global_step": 213288, "epoch": 2569} {"train_loss": -24.20782470703125, "global_step": 213289, "epoch": 2569} {"train_loss": -24.237966537475586, "global_step": 213290, "epoch": 2569} {"train_loss": -23.74626922607422, "global_step": 213291, "epoch": 2569} {"train_loss": -24.62650489807129, "global_step": 213292, "epoch": 2569} {"train_loss": -24.339813232421875, "global_step": 213293, "epoch": 2569} {"train_loss": -24.51026725769043, "global_step": 213294, "epoch": 2569} {"train_loss": -24.4317626953125, "global_step": 213295, "epoch": 2569} {"train_loss": -24.9140682220459, "global_step": 213296, "epoch": 2569} {"train_loss": -24.478118896484375, "global_step": 213297, "epoch": 2569} {"train_loss": -24.455488204956055, "global_step": 213298, "epoch": 2569} {"train_loss": -24.481760025024414, "global_step": 213299, "epoch": 2569} {"train_loss": -24.484228134155273, "global_step": 213300, "epoch": 2569} {"train_loss": -24.70857048034668, "global_step": 213301, "epoch": 2569} {"train_loss": -24.436126708984375, "global_step": 213302, "epoch": 2569} {"train_loss": -24.577838897705078, "global_step": 213303, "epoch": 2569} {"train_loss": -24.313980102539062, "global_step": 213304, "epoch": 2569} {"train_loss": -24.97580909729004, "global_step": 213305, "epoch": 2569} {"train_loss": -24.375518798828125, "global_step": 213306, "epoch": 2569} {"train_loss": -24.587173461914062, "global_step": 213307, "epoch": 2569} {"train_loss": -24.82318687438965, "global_step": 213308, "epoch": 2569} {"train_loss": -24.40464785012854, "global_step": 213309, "epoch": 2569, "val_loss": 6746287.0} {"train_loss": -23.713781356811523, "global_step": 213310, "epoch": 2570} {"train_loss": -24.43094825744629, "global_step": 213311, "epoch": 2570} {"train_loss": -24.66218376159668, "global_step": 213312, "epoch": 2570} {"train_loss": -23.93048667907715, "global_step": 213313, "epoch": 2570} {"train_loss": -24.431013107299805, "global_step": 213314, "epoch": 2570} {"train_loss": -24.555097579956055, "global_step": 213315, "epoch": 2570} {"train_loss": -24.605680465698242, "global_step": 213316, "epoch": 2570} {"train_loss": -24.22678565979004, "global_step": 213317, "epoch": 2570} {"train_loss": -24.35120964050293, "global_step": 213318, "epoch": 2570} {"train_loss": -24.32918357849121, "global_step": 213319, "epoch": 2570} {"train_loss": -24.37504768371582, "global_step": 213320, "epoch": 2570} {"train_loss": -23.974218368530273, "global_step": 213321, "epoch": 2570} {"train_loss": -24.30377769470215, "global_step": 213322, "epoch": 2570} {"train_loss": -24.521453857421875, "global_step": 213323, "epoch": 2570} {"train_loss": -24.481409072875977, "global_step": 213324, "epoch": 2570} {"train_loss": -24.302125930786133, "global_step": 213325, "epoch": 2570} {"train_loss": -24.253379821777344, "global_step": 213326, "epoch": 2570} {"train_loss": -24.280832290649414, "global_step": 213327, "epoch": 2570} {"train_loss": -24.2210750579834, "global_step": 213328, "epoch": 2570} {"train_loss": -24.643390655517578, "global_step": 213329, "epoch": 2570} {"train_loss": -24.3714656829834, "global_step": 213330, "epoch": 2570} {"train_loss": -24.496417999267578, "global_step": 213331, "epoch": 2570} {"train_loss": -24.492582321166992, "global_step": 213332, "epoch": 2570} {"train_loss": -24.533370971679688, "global_step": 213333, "epoch": 2570} {"train_loss": -24.491565704345703, "global_step": 213334, "epoch": 2570} {"train_loss": -24.53546142578125, "global_step": 213335, "epoch": 2570} {"train_loss": -24.838132858276367, "global_step": 213336, "epoch": 2570} {"train_loss": -24.6329402923584, "global_step": 213337, "epoch": 2570} {"train_loss": -24.60221290588379, "global_step": 213338, "epoch": 2570} {"train_loss": -24.340152740478516, "global_step": 213339, "epoch": 2570} {"train_loss": -24.108749389648438, "global_step": 213340, "epoch": 2570} {"train_loss": -24.42378807067871, "global_step": 213341, "epoch": 2570} {"train_loss": -24.854001998901367, "global_step": 213342, "epoch": 2570} {"train_loss": -24.546466827392578, "global_step": 213343, "epoch": 2570} {"train_loss": -24.530118942260742, "global_step": 213344, "epoch": 2570} {"train_loss": -24.264606475830078, "global_step": 213345, "epoch": 2570} {"train_loss": -24.240631103515625, "global_step": 213346, "epoch": 2570} {"train_loss": -24.46109390258789, "global_step": 213347, "epoch": 2570} {"train_loss": -24.79269027709961, "global_step": 213348, "epoch": 2570} {"train_loss": -24.30194091796875, "global_step": 213349, "epoch": 2570} {"train_loss": -24.378496170043945, "global_step": 213350, "epoch": 2570} {"train_loss": -24.94776725769043, "global_step": 213351, "epoch": 2570} {"train_loss": -24.7249698638916, "global_step": 213352, "epoch": 2570} {"train_loss": -24.516326904296875, "global_step": 213353, "epoch": 2570} {"train_loss": -24.221317291259766, "global_step": 213354, "epoch": 2570} {"train_loss": -24.279733657836914, "global_step": 213355, "epoch": 2570} {"train_loss": -24.40683364868164, "global_step": 213356, "epoch": 2570} {"train_loss": -24.648588180541992, "global_step": 213357, "epoch": 2570} {"train_loss": -24.738922119140625, "global_step": 213358, "epoch": 2570} {"train_loss": -24.10304069519043, "global_step": 213359, "epoch": 2570} {"train_loss": -24.171422958374023, "global_step": 213360, "epoch": 2570} {"train_loss": -24.548871994018555, "global_step": 213361, "epoch": 2570} {"train_loss": -24.626867294311523, "global_step": 213362, "epoch": 2570} {"train_loss": -24.42991828918457, "global_step": 213363, "epoch": 2570} {"train_loss": -24.261648178100586, "global_step": 213364, "epoch": 2570} {"train_loss": -24.36891746520996, "global_step": 213365, "epoch": 2570} {"train_loss": -24.630823135375977, "global_step": 213366, "epoch": 2570} {"train_loss": -24.49623680114746, "global_step": 213367, "epoch": 2570} {"train_loss": -24.510663986206055, "global_step": 213368, "epoch": 2570} {"train_loss": -24.616376876831055, "global_step": 213369, "epoch": 2570} {"train_loss": -24.30149269104004, "global_step": 213370, "epoch": 2570} {"train_loss": -24.24138641357422, "global_step": 213371, "epoch": 2570} {"train_loss": -24.084213256835938, "global_step": 213372, "epoch": 2570} {"train_loss": -24.515396118164062, "global_step": 213373, "epoch": 2570} {"train_loss": -24.66359519958496, "global_step": 213374, "epoch": 2570} {"train_loss": -24.763561248779297, "global_step": 213375, "epoch": 2570} {"train_loss": -24.343013763427734, "global_step": 213376, "epoch": 2570} {"train_loss": -24.602767944335938, "global_step": 213377, "epoch": 2570} {"train_loss": -24.45018196105957, "global_step": 213378, "epoch": 2570} {"train_loss": -24.517629623413086, "global_step": 213379, "epoch": 2570} {"train_loss": -24.44599723815918, "global_step": 213380, "epoch": 2570} {"train_loss": -24.312849044799805, "global_step": 213381, "epoch": 2570} {"train_loss": -24.655216217041016, "global_step": 213382, "epoch": 2570} {"train_loss": -24.59027671813965, "global_step": 213383, "epoch": 2570} {"train_loss": -24.362789154052734, "global_step": 213384, "epoch": 2570} {"train_loss": -24.52338981628418, "global_step": 213385, "epoch": 2570} {"train_loss": -24.447856903076172, "global_step": 213386, "epoch": 2570} {"train_loss": -24.639856338500977, "global_step": 213387, "epoch": 2570} {"train_loss": -24.652301788330078, "global_step": 213388, "epoch": 2570} {"train_loss": -24.518705368041992, "global_step": 213389, "epoch": 2570} {"train_loss": -24.302566528320312, "global_step": 213390, "epoch": 2570} {"train_loss": -24.80426025390625, "global_step": 213391, "epoch": 2570} {"train_loss": -24.449557361832586, "global_step": 213392, "epoch": 2570, "val_loss": 6613267.0} {"train_loss": -24.25506019592285, "global_step": 213393, "epoch": 2571} {"train_loss": -24.062118530273438, "global_step": 213394, "epoch": 2571} {"train_loss": -23.8231258392334, "global_step": 213395, "epoch": 2571} {"train_loss": -24.06618881225586, "global_step": 213396, "epoch": 2571} {"train_loss": -23.5648250579834, "global_step": 213397, "epoch": 2571} {"train_loss": -24.035306930541992, "global_step": 213398, "epoch": 2571} {"train_loss": -23.7631893157959, "global_step": 213399, "epoch": 2571} {"train_loss": -24.362863540649414, "global_step": 213400, "epoch": 2571} {"train_loss": -24.080474853515625, "global_step": 213401, "epoch": 2571} {"train_loss": -24.14338493347168, "global_step": 213402, "epoch": 2571} {"train_loss": -24.06104278564453, "global_step": 213403, "epoch": 2571} {"train_loss": -23.988113403320312, "global_step": 213404, "epoch": 2571} {"train_loss": -24.166763305664062, "global_step": 213405, "epoch": 2571} {"train_loss": -24.15938377380371, "global_step": 213406, "epoch": 2571} {"train_loss": -24.088014602661133, "global_step": 213407, "epoch": 2571} {"train_loss": -24.295106887817383, "global_step": 213408, "epoch": 2571} {"train_loss": -24.411020278930664, "global_step": 213409, "epoch": 2571} {"train_loss": -24.298242568969727, "global_step": 213410, "epoch": 2571} {"train_loss": -24.12856101989746, "global_step": 213411, "epoch": 2571} {"train_loss": -24.330617904663086, "global_step": 213412, "epoch": 2571} {"train_loss": -24.570005416870117, "global_step": 213413, "epoch": 2571} {"train_loss": -24.34506607055664, "global_step": 213414, "epoch": 2571} {"train_loss": -24.973709106445312, "global_step": 213415, "epoch": 2571} {"train_loss": -24.61003875732422, "global_step": 213416, "epoch": 2571} {"train_loss": -24.23878288269043, "global_step": 213417, "epoch": 2571} {"train_loss": -24.565998077392578, "global_step": 213418, "epoch": 2571} {"train_loss": -24.340559005737305, "global_step": 213419, "epoch": 2571} {"train_loss": -24.739152908325195, "global_step": 213420, "epoch": 2571} {"train_loss": -24.639387130737305, "global_step": 213421, "epoch": 2571} {"train_loss": -24.514883041381836, "global_step": 213422, "epoch": 2571} {"train_loss": -24.7020206451416, "global_step": 213423, "epoch": 2571} {"train_loss": -24.692808151245117, "global_step": 213424, "epoch": 2571} {"train_loss": -24.00227928161621, "global_step": 213425, "epoch": 2571} {"train_loss": -24.302473068237305, "global_step": 213426, "epoch": 2571} {"train_loss": -24.47261619567871, "global_step": 213427, "epoch": 2571} {"train_loss": -24.593015670776367, "global_step": 213428, "epoch": 2571} {"train_loss": -24.35906410217285, "global_step": 213429, "epoch": 2571} {"train_loss": -24.353057861328125, "global_step": 213430, "epoch": 2571} {"train_loss": -23.811025619506836, "global_step": 213431, "epoch": 2571} {"train_loss": -23.546655654907227, "global_step": 213432, "epoch": 2571} {"train_loss": -23.864839553833008, "global_step": 213433, "epoch": 2571} {"train_loss": -24.612293243408203, "global_step": 213434, "epoch": 2571} {"train_loss": -24.613374710083008, "global_step": 213435, "epoch": 2571} {"train_loss": -24.401748657226562, "global_step": 213436, "epoch": 2571} {"train_loss": -24.606077194213867, "global_step": 213437, "epoch": 2571} {"train_loss": -24.508886337280273, "global_step": 213438, "epoch": 2571} {"train_loss": -24.060199737548828, "global_step": 213439, "epoch": 2571} {"train_loss": -24.435338973999023, "global_step": 213440, "epoch": 2571} {"train_loss": -24.40408706665039, "global_step": 213441, "epoch": 2571} {"train_loss": -24.487478256225586, "global_step": 213442, "epoch": 2571} {"train_loss": -24.190284729003906, "global_step": 213443, "epoch": 2571} {"train_loss": -24.748476028442383, "global_step": 213444, "epoch": 2571} {"train_loss": -24.658342361450195, "global_step": 213445, "epoch": 2571} {"train_loss": -24.365211486816406, "global_step": 213446, "epoch": 2571} {"train_loss": -24.595121383666992, "global_step": 213447, "epoch": 2571} {"train_loss": -24.9603214263916, "global_step": 213448, "epoch": 2571} {"train_loss": -24.49102210998535, "global_step": 213449, "epoch": 2571} {"train_loss": -24.33216667175293, "global_step": 213450, "epoch": 2571} {"train_loss": -24.95014762878418, "global_step": 213451, "epoch": 2571} {"train_loss": -24.574249267578125, "global_step": 213452, "epoch": 2571} {"train_loss": -24.773902893066406, "global_step": 213453, "epoch": 2571} {"train_loss": -24.510496139526367, "global_step": 213454, "epoch": 2571} {"train_loss": -24.468154907226562, "global_step": 213455, "epoch": 2571} {"train_loss": -24.42180633544922, "global_step": 213456, "epoch": 2571} {"train_loss": -24.247150421142578, "global_step": 213457, "epoch": 2571} {"train_loss": -24.625259399414062, "global_step": 213458, "epoch": 2571} {"train_loss": -24.282438278198242, "global_step": 213459, "epoch": 2571} {"train_loss": -24.565216064453125, "global_step": 213460, "epoch": 2571} {"train_loss": -24.884944915771484, "global_step": 213461, "epoch": 2571} {"train_loss": -24.640090942382812, "global_step": 213462, "epoch": 2571} {"train_loss": -24.48829460144043, "global_step": 213463, "epoch": 2571} {"train_loss": -24.754005432128906, "global_step": 213464, "epoch": 2571} {"train_loss": -24.628385543823242, "global_step": 213465, "epoch": 2571} {"train_loss": -24.673757553100586, "global_step": 213466, "epoch": 2571} {"train_loss": -24.823333740234375, "global_step": 213467, "epoch": 2571} {"train_loss": -24.47867202758789, "global_step": 213468, "epoch": 2571} {"train_loss": -25.037927627563477, "global_step": 213469, "epoch": 2571} {"train_loss": -24.735387802124023, "global_step": 213470, "epoch": 2571} {"train_loss": -24.638031005859375, "global_step": 213471, "epoch": 2571} {"train_loss": -24.358600616455078, "global_step": 213472, "epoch": 2571} {"train_loss": -24.33599281311035, "global_step": 213473, "epoch": 2571} {"train_loss": -24.327756881713867, "global_step": 213474, "epoch": 2571} {"train_loss": -24.37964062518384, "global_step": 213475, "epoch": 2571, "val_loss": 6780777.0} {"train_loss": -24.030027389526367, "global_step": 213476, "epoch": 2572} {"train_loss": -24.007495880126953, "global_step": 213477, "epoch": 2572} {"train_loss": -24.124574661254883, "global_step": 213478, "epoch": 2572} {"train_loss": -23.674039840698242, "global_step": 213479, "epoch": 2572} {"train_loss": -23.695716857910156, "global_step": 213480, "epoch": 2572} {"train_loss": -23.466360092163086, "global_step": 213481, "epoch": 2572} {"train_loss": -23.91470718383789, "global_step": 213482, "epoch": 2572} {"train_loss": -23.9570255279541, "global_step": 213483, "epoch": 2572} {"train_loss": -24.13042640686035, "global_step": 213484, "epoch": 2572} {"train_loss": -24.32296371459961, "global_step": 213485, "epoch": 2572} {"train_loss": -23.776962280273438, "global_step": 213486, "epoch": 2572} {"train_loss": -24.204734802246094, "global_step": 213487, "epoch": 2572} {"train_loss": -24.319162368774414, "global_step": 213488, "epoch": 2572} {"train_loss": -24.157855987548828, "global_step": 213489, "epoch": 2572} {"train_loss": -24.015493392944336, "global_step": 213490, "epoch": 2572} {"train_loss": -24.31785774230957, "global_step": 213491, "epoch": 2572} {"train_loss": -24.178930282592773, "global_step": 213492, "epoch": 2572} {"train_loss": -24.355939865112305, "global_step": 213493, "epoch": 2572} {"train_loss": -24.212448120117188, "global_step": 213494, "epoch": 2572} {"train_loss": -24.292343139648438, "global_step": 213495, "epoch": 2572} {"train_loss": -24.44482421875, "global_step": 213496, "epoch": 2572} {"train_loss": -24.56232261657715, "global_step": 213497, "epoch": 2572} {"train_loss": -24.204442977905273, "global_step": 213498, "epoch": 2572} {"train_loss": -24.225797653198242, "global_step": 213499, "epoch": 2572} {"train_loss": -24.42877197265625, "global_step": 213500, "epoch": 2572} {"train_loss": -24.490163803100586, "global_step": 213501, "epoch": 2572} {"train_loss": -24.13031578063965, "global_step": 213502, "epoch": 2572} {"train_loss": -24.56584930419922, "global_step": 213503, "epoch": 2572} {"train_loss": -24.156400680541992, "global_step": 213504, "epoch": 2572} {"train_loss": -24.606863021850586, "global_step": 213505, "epoch": 2572} {"train_loss": -24.481613159179688, "global_step": 213506, "epoch": 2572} {"train_loss": -24.24982452392578, "global_step": 213507, "epoch": 2572} {"train_loss": -24.31390380859375, "global_step": 213508, "epoch": 2572} {"train_loss": -24.76766014099121, "global_step": 213509, "epoch": 2572} {"train_loss": -24.351102828979492, "global_step": 213510, "epoch": 2572} {"train_loss": -24.611072540283203, "global_step": 213511, "epoch": 2572} {"train_loss": -24.576223373413086, "global_step": 213512, "epoch": 2572} {"train_loss": -24.257862091064453, "global_step": 213513, "epoch": 2572} {"train_loss": -23.972259521484375, "global_step": 213514, "epoch": 2572} {"train_loss": -24.339582443237305, "global_step": 213515, "epoch": 2572} {"train_loss": -24.469318389892578, "global_step": 213516, "epoch": 2572} {"train_loss": -23.88205909729004, "global_step": 213517, "epoch": 2572} {"train_loss": -24.29860496520996, "global_step": 213518, "epoch": 2572} {"train_loss": -24.45163345336914, "global_step": 213519, "epoch": 2572} {"train_loss": -24.20667839050293, "global_step": 213520, "epoch": 2572} {"train_loss": -24.2071533203125, "global_step": 213521, "epoch": 2572} {"train_loss": -24.671947479248047, "global_step": 213522, "epoch": 2572} {"train_loss": -24.400169372558594, "global_step": 213523, "epoch": 2572} {"train_loss": -24.316818237304688, "global_step": 213524, "epoch": 2572} {"train_loss": -24.240257263183594, "global_step": 213525, "epoch": 2572} {"train_loss": -24.750158309936523, "global_step": 213526, "epoch": 2572} {"train_loss": -23.962308883666992, "global_step": 213527, "epoch": 2572} {"train_loss": -24.424558639526367, "global_step": 213528, "epoch": 2572} {"train_loss": -24.359073638916016, "global_step": 213529, "epoch": 2572} {"train_loss": -24.622352600097656, "global_step": 213530, "epoch": 2572} {"train_loss": -24.598106384277344, "global_step": 213531, "epoch": 2572} {"train_loss": -24.754058837890625, "global_step": 213532, "epoch": 2572} {"train_loss": -24.693628311157227, "global_step": 213533, "epoch": 2572} {"train_loss": -24.4788818359375, "global_step": 213534, "epoch": 2572} {"train_loss": -24.732267379760742, "global_step": 213535, "epoch": 2572} {"train_loss": -24.2358455657959, "global_step": 213536, "epoch": 2572} {"train_loss": -24.777029037475586, "global_step": 213537, "epoch": 2572} {"train_loss": -25.084028244018555, "global_step": 213538, "epoch": 2572} {"train_loss": -24.494476318359375, "global_step": 213539, "epoch": 2572} {"train_loss": -24.478673934936523, "global_step": 213540, "epoch": 2572} {"train_loss": -24.654922485351562, "global_step": 213541, "epoch": 2572} {"train_loss": -24.401185989379883, "global_step": 213542, "epoch": 2572} {"train_loss": -24.347856521606445, "global_step": 213543, "epoch": 2572} {"train_loss": -24.680509567260742, "global_step": 213544, "epoch": 2572} {"train_loss": -24.545825958251953, "global_step": 213545, "epoch": 2572} {"train_loss": -24.51968002319336, "global_step": 213546, "epoch": 2572} {"train_loss": -24.801807403564453, "global_step": 213547, "epoch": 2572} {"train_loss": -24.556167602539062, "global_step": 213548, "epoch": 2572} {"train_loss": -24.485286712646484, "global_step": 213549, "epoch": 2572} {"train_loss": -24.72420883178711, "global_step": 213550, "epoch": 2572} {"train_loss": -24.660633087158203, "global_step": 213551, "epoch": 2572} {"train_loss": -24.509248733520508, "global_step": 213552, "epoch": 2572} {"train_loss": -24.703195571899414, "global_step": 213553, "epoch": 2572} {"train_loss": -24.518442153930664, "global_step": 213554, "epoch": 2572} {"train_loss": -24.69441795349121, "global_step": 213555, "epoch": 2572} {"train_loss": -24.574979782104492, "global_step": 213556, "epoch": 2572} {"train_loss": -24.134641647338867, "global_step": 213557, "epoch": 2572} {"train_loss": -24.361472279192455, "global_step": 213558, "epoch": 2572, "val_loss": 6920316.0} {"train_loss": -23.76512908935547, "global_step": 213559, "epoch": 2573} {"train_loss": -23.73280906677246, "global_step": 213560, "epoch": 2573} {"train_loss": -23.9422550201416, "global_step": 213561, "epoch": 2573} {"train_loss": -23.837047576904297, "global_step": 213562, "epoch": 2573} {"train_loss": -23.853769302368164, "global_step": 213563, "epoch": 2573} {"train_loss": -24.403554916381836, "global_step": 213564, "epoch": 2573} {"train_loss": -23.936445236206055, "global_step": 213565, "epoch": 2573} {"train_loss": -24.194257736206055, "global_step": 213566, "epoch": 2573} {"train_loss": -23.955183029174805, "global_step": 213567, "epoch": 2573} {"train_loss": -23.82940673828125, "global_step": 213568, "epoch": 2573} {"train_loss": -23.865325927734375, "global_step": 213569, "epoch": 2573} {"train_loss": -24.44655418395996, "global_step": 213570, "epoch": 2573} {"train_loss": -24.1998348236084, "global_step": 213571, "epoch": 2573} {"train_loss": -24.237720489501953, "global_step": 213572, "epoch": 2573} {"train_loss": -24.264623641967773, "global_step": 213573, "epoch": 2573} {"train_loss": -24.28670310974121, "global_step": 213574, "epoch": 2573} {"train_loss": -23.853107452392578, "global_step": 213575, "epoch": 2573} {"train_loss": -24.030244827270508, "global_step": 213576, "epoch": 2573} {"train_loss": -24.33241844177246, "global_step": 213577, "epoch": 2573} {"train_loss": -24.17742919921875, "global_step": 213578, "epoch": 2573} {"train_loss": -23.973127365112305, "global_step": 213579, "epoch": 2573} {"train_loss": -24.427316665649414, "global_step": 213580, "epoch": 2573} {"train_loss": -24.22718048095703, "global_step": 213581, "epoch": 2573} {"train_loss": -24.504316329956055, "global_step": 213582, "epoch": 2573} {"train_loss": -24.529253005981445, "global_step": 213583, "epoch": 2573} {"train_loss": -24.550344467163086, "global_step": 213584, "epoch": 2573} {"train_loss": -24.755544662475586, "global_step": 213585, "epoch": 2573} {"train_loss": -23.95228385925293, "global_step": 213586, "epoch": 2573} {"train_loss": -24.347082138061523, "global_step": 213587, "epoch": 2573} {"train_loss": -24.45441246032715, "global_step": 213588, "epoch": 2573} {"train_loss": -24.630359649658203, "global_step": 213589, "epoch": 2573} {"train_loss": -24.76896095275879, "global_step": 213590, "epoch": 2573} {"train_loss": -24.758848190307617, "global_step": 213591, "epoch": 2573} {"train_loss": -24.346921920776367, "global_step": 213592, "epoch": 2573} {"train_loss": -24.495121002197266, "global_step": 213593, "epoch": 2573} {"train_loss": -24.78644371032715, "global_step": 213594, "epoch": 2573} {"train_loss": -24.54636573791504, "global_step": 213595, "epoch": 2573} {"train_loss": -24.556791305541992, "global_step": 213596, "epoch": 2573} {"train_loss": -24.49246597290039, "global_step": 213597, "epoch": 2573} {"train_loss": -24.460783004760742, "global_step": 213598, "epoch": 2573} {"train_loss": -24.604774475097656, "global_step": 213599, "epoch": 2573} {"train_loss": -24.61029052734375, "global_step": 213600, "epoch": 2573} {"train_loss": -24.546640396118164, "global_step": 213601, "epoch": 2573} {"train_loss": -24.499692916870117, "global_step": 213602, "epoch": 2573} {"train_loss": -24.3813533782959, "global_step": 213603, "epoch": 2573} {"train_loss": -24.145578384399414, "global_step": 213604, "epoch": 2573} {"train_loss": -24.110441207885742, "global_step": 213605, "epoch": 2573} {"train_loss": -24.26827049255371, "global_step": 213606, "epoch": 2573} {"train_loss": -24.19117546081543, "global_step": 213607, "epoch": 2573} {"train_loss": -24.489599227905273, "global_step": 213608, "epoch": 2573} {"train_loss": -24.05476951599121, "global_step": 213609, "epoch": 2573} {"train_loss": -24.543901443481445, "global_step": 213610, "epoch": 2573} {"train_loss": -24.397554397583008, "global_step": 213611, "epoch": 2573} {"train_loss": -24.568031311035156, "global_step": 213612, "epoch": 2573} {"train_loss": -24.244592666625977, "global_step": 213613, "epoch": 2573} {"train_loss": -24.740610122680664, "global_step": 213614, "epoch": 2573} {"train_loss": -24.34404754638672, "global_step": 213615, "epoch": 2573} {"train_loss": -24.595956802368164, "global_step": 213616, "epoch": 2573} {"train_loss": -24.207700729370117, "global_step": 213617, "epoch": 2573} {"train_loss": -24.573503494262695, "global_step": 213618, "epoch": 2573} {"train_loss": -24.215530395507812, "global_step": 213619, "epoch": 2573} {"train_loss": -24.513113021850586, "global_step": 213620, "epoch": 2573} {"train_loss": -24.65224266052246, "global_step": 213621, "epoch": 2573} {"train_loss": -24.473501205444336, "global_step": 213622, "epoch": 2573} {"train_loss": -24.518465042114258, "global_step": 213623, "epoch": 2573} {"train_loss": -24.422632217407227, "global_step": 213624, "epoch": 2573} {"train_loss": -24.337629318237305, "global_step": 213625, "epoch": 2573} {"train_loss": -24.318883895874023, "global_step": 213626, "epoch": 2573} {"train_loss": -24.302101135253906, "global_step": 213627, "epoch": 2573} {"train_loss": -24.378511428833008, "global_step": 213628, "epoch": 2573} {"train_loss": -24.69736099243164, "global_step": 213629, "epoch": 2573} {"train_loss": -24.440610885620117, "global_step": 213630, "epoch": 2573} {"train_loss": -24.449514389038086, "global_step": 213631, "epoch": 2573} {"train_loss": -24.313858032226562, "global_step": 213632, "epoch": 2573} {"train_loss": -24.481359481811523, "global_step": 213633, "epoch": 2573} {"train_loss": -24.677244186401367, "global_step": 213634, "epoch": 2573} {"train_loss": -24.438682556152344, "global_step": 213635, "epoch": 2573} {"train_loss": -24.77646827697754, "global_step": 213636, "epoch": 2573} {"train_loss": -24.28221321105957, "global_step": 213637, "epoch": 2573} {"train_loss": -25.03610610961914, "global_step": 213638, "epoch": 2573} {"train_loss": -24.8174991607666, "global_step": 213639, "epoch": 2573} {"train_loss": -24.672027587890625, "global_step": 213640, "epoch": 2573} {"train_loss": -24.37800218972815, "global_step": 213641, "epoch": 2573, "val_loss": 6635019.0} {"train_loss": -24.212112426757812, "global_step": 213642, "epoch": 2574} {"train_loss": -24.267181396484375, "global_step": 213643, "epoch": 2574} {"train_loss": -24.332494735717773, "global_step": 213644, "epoch": 2574} {"train_loss": -24.397321701049805, "global_step": 213645, "epoch": 2574} {"train_loss": -24.335844039916992, "global_step": 213646, "epoch": 2574} {"train_loss": -24.236291885375977, "global_step": 213647, "epoch": 2574} {"train_loss": -24.063852310180664, "global_step": 213648, "epoch": 2574} {"train_loss": -24.227994918823242, "global_step": 213649, "epoch": 2574} {"train_loss": -24.247228622436523, "global_step": 213650, "epoch": 2574} {"train_loss": -24.36720848083496, "global_step": 213651, "epoch": 2574} {"train_loss": -24.3133602142334, "global_step": 213652, "epoch": 2574} {"train_loss": -24.51692008972168, "global_step": 213653, "epoch": 2574} {"train_loss": -24.22309684753418, "global_step": 213654, "epoch": 2574} {"train_loss": -24.205245971679688, "global_step": 213655, "epoch": 2574} {"train_loss": -24.42693328857422, "global_step": 213656, "epoch": 2574} {"train_loss": -24.856496810913086, "global_step": 213657, "epoch": 2574} {"train_loss": -24.27082633972168, "global_step": 213658, "epoch": 2574} {"train_loss": -24.177465438842773, "global_step": 213659, "epoch": 2574} {"train_loss": -24.891672134399414, "global_step": 213660, "epoch": 2574} {"train_loss": -24.366003036499023, "global_step": 213661, "epoch": 2574} {"train_loss": -24.244775772094727, "global_step": 213662, "epoch": 2574} {"train_loss": -24.733617782592773, "global_step": 213663, "epoch": 2574} {"train_loss": -24.75714111328125, "global_step": 213664, "epoch": 2574} {"train_loss": -24.277576446533203, "global_step": 213665, "epoch": 2574} {"train_loss": -24.62801170349121, "global_step": 213666, "epoch": 2574} {"train_loss": -23.95659828186035, "global_step": 213667, "epoch": 2574} {"train_loss": -24.153549194335938, "global_step": 213668, "epoch": 2574} {"train_loss": -24.826250076293945, "global_step": 213669, "epoch": 2574} {"train_loss": -24.892606735229492, "global_step": 213670, "epoch": 2574} {"train_loss": -24.350357055664062, "global_step": 213671, "epoch": 2574} {"train_loss": -24.16633415222168, "global_step": 213672, "epoch": 2574} {"train_loss": -24.36827850341797, "global_step": 213673, "epoch": 2574} {"train_loss": -24.419153213500977, "global_step": 213674, "epoch": 2574} {"train_loss": -24.54007339477539, "global_step": 213675, "epoch": 2574} {"train_loss": -24.523929595947266, "global_step": 213676, "epoch": 2574} {"train_loss": -24.500036239624023, "global_step": 213677, "epoch": 2574} {"train_loss": -24.545318603515625, "global_step": 213678, "epoch": 2574} {"train_loss": -24.6798152923584, "global_step": 213679, "epoch": 2574} {"train_loss": -24.270591735839844, "global_step": 213680, "epoch": 2574} {"train_loss": -24.427722930908203, "global_step": 213681, "epoch": 2574} {"train_loss": -24.624006271362305, "global_step": 213682, "epoch": 2574} {"train_loss": -24.434158325195312, "global_step": 213683, "epoch": 2574} {"train_loss": -24.61839485168457, "global_step": 213684, "epoch": 2574} {"train_loss": -24.42833709716797, "global_step": 213685, "epoch": 2574} {"train_loss": -24.521738052368164, "global_step": 213686, "epoch": 2574} {"train_loss": -24.109731674194336, "global_step": 213687, "epoch": 2574} {"train_loss": -24.176176071166992, "global_step": 213688, "epoch": 2574} {"train_loss": -24.45285415649414, "global_step": 213689, "epoch": 2574} {"train_loss": -24.526611328125, "global_step": 213690, "epoch": 2574} {"train_loss": -24.594995498657227, "global_step": 213691, "epoch": 2574} {"train_loss": -24.661766052246094, "global_step": 213692, "epoch": 2574} {"train_loss": -24.44028091430664, "global_step": 213693, "epoch": 2574} {"train_loss": -24.732084274291992, "global_step": 213694, "epoch": 2574} {"train_loss": -24.695907592773438, "global_step": 213695, "epoch": 2574} {"train_loss": -24.182174682617188, "global_step": 213696, "epoch": 2574} {"train_loss": -24.189855575561523, "global_step": 213697, "epoch": 2574} {"train_loss": -24.446748733520508, "global_step": 213698, "epoch": 2574} {"train_loss": -24.753559112548828, "global_step": 213699, "epoch": 2574} {"train_loss": -24.5075626373291, "global_step": 213700, "epoch": 2574} {"train_loss": -24.687047958374023, "global_step": 213701, "epoch": 2574} {"train_loss": -24.712894439697266, "global_step": 213702, "epoch": 2574} {"train_loss": -24.157140731811523, "global_step": 213703, "epoch": 2574} {"train_loss": -23.95197868347168, "global_step": 213704, "epoch": 2574} {"train_loss": -23.85281753540039, "global_step": 213705, "epoch": 2574} {"train_loss": -24.16004753112793, "global_step": 213706, "epoch": 2574} {"train_loss": -24.107868194580078, "global_step": 213707, "epoch": 2574} {"train_loss": -24.066577911376953, "global_step": 213708, "epoch": 2574} {"train_loss": -24.196819305419922, "global_step": 213709, "epoch": 2574} {"train_loss": -24.15351676940918, "global_step": 213710, "epoch": 2574} {"train_loss": -24.116458892822266, "global_step": 213711, "epoch": 2574} {"train_loss": -24.28492546081543, "global_step": 213712, "epoch": 2574} {"train_loss": -24.168909072875977, "global_step": 213713, "epoch": 2574} {"train_loss": -24.1645450592041, "global_step": 213714, "epoch": 2574} {"train_loss": -24.308441162109375, "global_step": 213715, "epoch": 2574} {"train_loss": -24.23676109313965, "global_step": 213716, "epoch": 2574} {"train_loss": -24.362333297729492, "global_step": 213717, "epoch": 2574} {"train_loss": -24.608789443969727, "global_step": 213718, "epoch": 2574} {"train_loss": -24.20379638671875, "global_step": 213719, "epoch": 2574} {"train_loss": -24.59113121032715, "global_step": 213720, "epoch": 2574} {"train_loss": -24.4564151763916, "global_step": 213721, "epoch": 2574} {"train_loss": -24.275869369506836, "global_step": 213722, "epoch": 2574} {"train_loss": -24.427595138549805, "global_step": 213723, "epoch": 2574} {"train_loss": -24.399514784295874, "global_step": 213724, "epoch": 2574, "val_loss": 6706343.0} {"train_loss": -23.94586753845215, "global_step": 213725, "epoch": 2575} {"train_loss": -24.481098175048828, "global_step": 213726, "epoch": 2575} {"train_loss": -24.276296615600586, "global_step": 213727, "epoch": 2575} {"train_loss": -24.04216766357422, "global_step": 213728, "epoch": 2575} {"train_loss": -24.208707809448242, "global_step": 213729, "epoch": 2575} {"train_loss": -24.085206985473633, "global_step": 213730, "epoch": 2575} {"train_loss": -24.250675201416016, "global_step": 213731, "epoch": 2575} {"train_loss": -24.204795837402344, "global_step": 213732, "epoch": 2575} {"train_loss": -24.0073299407959, "global_step": 213733, "epoch": 2575} {"train_loss": -24.347192764282227, "global_step": 213734, "epoch": 2575} {"train_loss": -24.09833335876465, "global_step": 213735, "epoch": 2575} {"train_loss": -24.328418731689453, "global_step": 213736, "epoch": 2575} {"train_loss": -24.213010787963867, "global_step": 213737, "epoch": 2575} {"train_loss": -24.62924575805664, "global_step": 213738, "epoch": 2575} {"train_loss": -24.511945724487305, "global_step": 213739, "epoch": 2575} {"train_loss": -24.403636932373047, "global_step": 213740, "epoch": 2575} {"train_loss": -24.4946346282959, "global_step": 213741, "epoch": 2575} {"train_loss": -24.656530380249023, "global_step": 213742, "epoch": 2575} {"train_loss": -24.982858657836914, "global_step": 213743, "epoch": 2575} {"train_loss": -24.917495727539062, "global_step": 213744, "epoch": 2575} {"train_loss": -24.333118438720703, "global_step": 213745, "epoch": 2575} {"train_loss": -24.761899948120117, "global_step": 213746, "epoch": 2575} {"train_loss": -24.42384910583496, "global_step": 213747, "epoch": 2575} {"train_loss": -24.629365921020508, "global_step": 213748, "epoch": 2575} {"train_loss": -24.781774520874023, "global_step": 213749, "epoch": 2575} {"train_loss": -24.563329696655273, "global_step": 213750, "epoch": 2575} {"train_loss": -24.36696434020996, "global_step": 213751, "epoch": 2575} {"train_loss": -24.680160522460938, "global_step": 213752, "epoch": 2575} {"train_loss": -24.665456771850586, "global_step": 213753, "epoch": 2575} {"train_loss": -24.645360946655273, "global_step": 213754, "epoch": 2575} {"train_loss": -24.40848731994629, "global_step": 213755, "epoch": 2575} {"train_loss": -24.535125732421875, "global_step": 213756, "epoch": 2575} {"train_loss": -24.603389739990234, "global_step": 213757, "epoch": 2575} {"train_loss": -24.571409225463867, "global_step": 213758, "epoch": 2575} {"train_loss": -24.709491729736328, "global_step": 213759, "epoch": 2575} {"train_loss": -24.624902725219727, "global_step": 213760, "epoch": 2575} {"train_loss": -24.623937606811523, "global_step": 213761, "epoch": 2575} {"train_loss": -24.51381492614746, "global_step": 213762, "epoch": 2575} {"train_loss": -24.663677215576172, "global_step": 213763, "epoch": 2575} {"train_loss": -24.44281768798828, "global_step": 213764, "epoch": 2575} {"train_loss": -24.624835968017578, "global_step": 213765, "epoch": 2575} {"train_loss": -24.884902954101562, "global_step": 213766, "epoch": 2575} {"train_loss": -24.561199188232422, "global_step": 213767, "epoch": 2575} {"train_loss": -24.38943862915039, "global_step": 213768, "epoch": 2575} {"train_loss": -24.009281158447266, "global_step": 213769, "epoch": 2575} {"train_loss": -24.01959800720215, "global_step": 213770, "epoch": 2575} {"train_loss": -24.3848934173584, "global_step": 213771, "epoch": 2575} {"train_loss": -24.59079360961914, "global_step": 213772, "epoch": 2575} {"train_loss": -24.558944702148438, "global_step": 213773, "epoch": 2575} {"train_loss": -25.020496368408203, "global_step": 213774, "epoch": 2575} {"train_loss": -24.689329147338867, "global_step": 213775, "epoch": 2575} {"train_loss": -24.5247802734375, "global_step": 213776, "epoch": 2575} {"train_loss": -24.42538070678711, "global_step": 213777, "epoch": 2575} {"train_loss": -24.521865844726562, "global_step": 213778, "epoch": 2575} {"train_loss": -24.28946876525879, "global_step": 213779, "epoch": 2575} {"train_loss": -24.38984489440918, "global_step": 213780, "epoch": 2575} {"train_loss": -24.12071990966797, "global_step": 213781, "epoch": 2575} {"train_loss": -24.15411376953125, "global_step": 213782, "epoch": 2575} {"train_loss": -24.932632446289062, "global_step": 213783, "epoch": 2575} {"train_loss": -24.355243682861328, "global_step": 213784, "epoch": 2575} {"train_loss": -24.581754684448242, "global_step": 213785, "epoch": 2575} {"train_loss": -23.939842224121094, "global_step": 213786, "epoch": 2575} {"train_loss": -23.903221130371094, "global_step": 213787, "epoch": 2575} {"train_loss": -24.517953872680664, "global_step": 213788, "epoch": 2575} {"train_loss": -24.21783447265625, "global_step": 213789, "epoch": 2575} {"train_loss": -23.871715545654297, "global_step": 213790, "epoch": 2575} {"train_loss": -23.801467895507812, "global_step": 213791, "epoch": 2575} {"train_loss": -24.442541122436523, "global_step": 213792, "epoch": 2575} {"train_loss": -24.205902099609375, "global_step": 213793, "epoch": 2575} {"train_loss": -24.280424118041992, "global_step": 213794, "epoch": 2575} {"train_loss": -24.256683349609375, "global_step": 213795, "epoch": 2575} {"train_loss": -24.62013053894043, "global_step": 213796, "epoch": 2575} {"train_loss": -24.778223037719727, "global_step": 213797, "epoch": 2575} {"train_loss": -24.308347702026367, "global_step": 213798, "epoch": 2575} {"train_loss": -24.812314987182617, "global_step": 213799, "epoch": 2575} {"train_loss": -24.235637664794922, "global_step": 213800, "epoch": 2575} {"train_loss": -24.214780807495117, "global_step": 213801, "epoch": 2575} {"train_loss": -24.182592391967773, "global_step": 213802, "epoch": 2575} {"train_loss": -24.48309898376465, "global_step": 213803, "epoch": 2575} {"train_loss": -24.389907836914062, "global_step": 213804, "epoch": 2575} {"train_loss": -24.070810317993164, "global_step": 213805, "epoch": 2575} {"train_loss": -24.478275299072266, "global_step": 213806, "epoch": 2575} {"train_loss": -24.392060888818946, "global_step": 213807, "epoch": 2575, "val_loss": 6459500.0} {"train_loss": -23.90780258178711, "global_step": 213808, "epoch": 2576} {"train_loss": -23.57496452331543, "global_step": 213809, "epoch": 2576} {"train_loss": -23.913957595825195, "global_step": 213810, "epoch": 2576} {"train_loss": -24.181257247924805, "global_step": 213811, "epoch": 2576} {"train_loss": -24.162952423095703, "global_step": 213812, "epoch": 2576} {"train_loss": -23.828079223632812, "global_step": 213813, "epoch": 2576} {"train_loss": -23.81612205505371, "global_step": 213814, "epoch": 2576} {"train_loss": -23.951169967651367, "global_step": 213815, "epoch": 2576} {"train_loss": -24.181058883666992, "global_step": 213816, "epoch": 2576} {"train_loss": -24.062414169311523, "global_step": 213817, "epoch": 2576} {"train_loss": -23.980695724487305, "global_step": 213818, "epoch": 2576} {"train_loss": -24.316102981567383, "global_step": 213819, "epoch": 2576} {"train_loss": -23.999780654907227, "global_step": 213820, "epoch": 2576} {"train_loss": -23.999685287475586, "global_step": 213821, "epoch": 2576} {"train_loss": -23.96687889099121, "global_step": 213822, "epoch": 2576} {"train_loss": -24.29463768005371, "global_step": 213823, "epoch": 2576} {"train_loss": -24.126306533813477, "global_step": 213824, "epoch": 2576} {"train_loss": -24.340177536010742, "global_step": 213825, "epoch": 2576} {"train_loss": -23.956357955932617, "global_step": 213826, "epoch": 2576} {"train_loss": -24.51319122314453, "global_step": 213827, "epoch": 2576} {"train_loss": -23.86793327331543, "global_step": 213828, "epoch": 2576} {"train_loss": -24.392093658447266, "global_step": 213829, "epoch": 2576} {"train_loss": -24.60023307800293, "global_step": 213830, "epoch": 2576} {"train_loss": -24.602689743041992, "global_step": 213831, "epoch": 2576} {"train_loss": -24.455917358398438, "global_step": 213832, "epoch": 2576} {"train_loss": -24.36041831970215, "global_step": 213833, "epoch": 2576} {"train_loss": -24.116424560546875, "global_step": 213834, "epoch": 2576} {"train_loss": -24.962635040283203, "global_step": 213835, "epoch": 2576} {"train_loss": -24.40593910217285, "global_step": 213836, "epoch": 2576} {"train_loss": -24.530498504638672, "global_step": 213837, "epoch": 2576} {"train_loss": -24.608388900756836, "global_step": 213838, "epoch": 2576} {"train_loss": -24.56658935546875, "global_step": 213839, "epoch": 2576} {"train_loss": -24.217294692993164, "global_step": 213840, "epoch": 2576} {"train_loss": -24.4688720703125, "global_step": 213841, "epoch": 2576} {"train_loss": -24.437868118286133, "global_step": 213842, "epoch": 2576} {"train_loss": -24.616512298583984, "global_step": 213843, "epoch": 2576} {"train_loss": -24.64276123046875, "global_step": 213844, "epoch": 2576} {"train_loss": -24.25474739074707, "global_step": 213845, "epoch": 2576} {"train_loss": -24.17510986328125, "global_step": 213846, "epoch": 2576} {"train_loss": -24.256834030151367, "global_step": 213847, "epoch": 2576} {"train_loss": -23.901830673217773, "global_step": 213848, "epoch": 2576} {"train_loss": -24.087631225585938, "global_step": 213849, "epoch": 2576} {"train_loss": -24.53303337097168, "global_step": 213850, "epoch": 2576} {"train_loss": -24.334714889526367, "global_step": 213851, "epoch": 2576} {"train_loss": -24.220687866210938, "global_step": 213852, "epoch": 2576} {"train_loss": -24.485441207885742, "global_step": 213853, "epoch": 2576} {"train_loss": -24.491514205932617, "global_step": 213854, "epoch": 2576} {"train_loss": -24.375957489013672, "global_step": 213855, "epoch": 2576} {"train_loss": -24.354122161865234, "global_step": 213856, "epoch": 2576} {"train_loss": -24.012760162353516, "global_step": 213857, "epoch": 2576} {"train_loss": -24.617666244506836, "global_step": 213858, "epoch": 2576} {"train_loss": -24.148244857788086, "global_step": 213859, "epoch": 2576} {"train_loss": -24.590734481811523, "global_step": 213860, "epoch": 2576} {"train_loss": -24.238039016723633, "global_step": 213861, "epoch": 2576} {"train_loss": -24.1746826171875, "global_step": 213862, "epoch": 2576} {"train_loss": -24.886058807373047, "global_step": 213863, "epoch": 2576} {"train_loss": -24.816328048706055, "global_step": 213864, "epoch": 2576} {"train_loss": -24.436967849731445, "global_step": 213865, "epoch": 2576} {"train_loss": -24.337238311767578, "global_step": 213866, "epoch": 2576} {"train_loss": -24.466123580932617, "global_step": 213867, "epoch": 2576} {"train_loss": -24.747129440307617, "global_step": 213868, "epoch": 2576} {"train_loss": -24.619871139526367, "global_step": 213869, "epoch": 2576} {"train_loss": -24.56358528137207, "global_step": 213870, "epoch": 2576} {"train_loss": -24.436017990112305, "global_step": 213871, "epoch": 2576} {"train_loss": -24.801267623901367, "global_step": 213872, "epoch": 2576} {"train_loss": -24.367422103881836, "global_step": 213873, "epoch": 2576} {"train_loss": -24.262704849243164, "global_step": 213874, "epoch": 2576} {"train_loss": -24.80150604248047, "global_step": 213875, "epoch": 2576} {"train_loss": -24.70490074157715, "global_step": 213876, "epoch": 2576} {"train_loss": -24.34368896484375, "global_step": 213877, "epoch": 2576} {"train_loss": -24.268075942993164, "global_step": 213878, "epoch": 2576} {"train_loss": -24.33612060546875, "global_step": 213879, "epoch": 2576} {"train_loss": -24.462017059326172, "global_step": 213880, "epoch": 2576} {"train_loss": -24.299152374267578, "global_step": 213881, "epoch": 2576} {"train_loss": -24.69005012512207, "global_step": 213882, "epoch": 2576} {"train_loss": -24.6439208984375, "global_step": 213883, "epoch": 2576} {"train_loss": -24.614973068237305, "global_step": 213884, "epoch": 2576} {"train_loss": -24.761117935180664, "global_step": 213885, "epoch": 2576} {"train_loss": -24.784666061401367, "global_step": 213886, "epoch": 2576} {"train_loss": -24.395185470581055, "global_step": 213887, "epoch": 2576} {"train_loss": -24.627487182617188, "global_step": 213888, "epoch": 2576} {"train_loss": -24.578824996948242, "global_step": 213889, "epoch": 2576} {"train_loss": -24.349577271794697, "global_step": 213890, "epoch": 2576, "val_loss": 6752965.0} {"train_loss": -24.51336097717285, "global_step": 213891, "epoch": 2577} {"train_loss": -24.058958053588867, "global_step": 213892, "epoch": 2577} {"train_loss": -24.289688110351562, "global_step": 213893, "epoch": 2577} {"train_loss": -24.40283966064453, "global_step": 213894, "epoch": 2577} {"train_loss": -24.176904678344727, "global_step": 213895, "epoch": 2577} {"train_loss": -24.049747467041016, "global_step": 213896, "epoch": 2577} {"train_loss": -24.610136032104492, "global_step": 213897, "epoch": 2577} {"train_loss": -24.468151092529297, "global_step": 213898, "epoch": 2577} {"train_loss": -24.471242904663086, "global_step": 213899, "epoch": 2577} {"train_loss": -24.401594161987305, "global_step": 213900, "epoch": 2577} {"train_loss": -24.72749137878418, "global_step": 213901, "epoch": 2577} {"train_loss": -24.319000244140625, "global_step": 213902, "epoch": 2577} {"train_loss": -24.376771926879883, "global_step": 213903, "epoch": 2577} {"train_loss": -24.155914306640625, "global_step": 213904, "epoch": 2577} {"train_loss": -24.3786678314209, "global_step": 213905, "epoch": 2577} {"train_loss": -24.410627365112305, "global_step": 213906, "epoch": 2577} {"train_loss": -24.160383224487305, "global_step": 213907, "epoch": 2577} {"train_loss": -24.62660026550293, "global_step": 213908, "epoch": 2577} {"train_loss": -24.235544204711914, "global_step": 213909, "epoch": 2577} {"train_loss": -24.38070297241211, "global_step": 213910, "epoch": 2577} {"train_loss": -24.320600509643555, "global_step": 213911, "epoch": 2577} {"train_loss": -24.23847007751465, "global_step": 213912, "epoch": 2577} {"train_loss": -24.51812171936035, "global_step": 213913, "epoch": 2577} {"train_loss": -24.54328727722168, "global_step": 213914, "epoch": 2577} {"train_loss": -24.521879196166992, "global_step": 213915, "epoch": 2577} {"train_loss": -24.760177612304688, "global_step": 213916, "epoch": 2577} {"train_loss": -24.329059600830078, "global_step": 213917, "epoch": 2577} {"train_loss": -24.745567321777344, "global_step": 213918, "epoch": 2577} {"train_loss": -24.616750717163086, "global_step": 213919, "epoch": 2577} {"train_loss": -24.54080581665039, "global_step": 213920, "epoch": 2577} {"train_loss": -24.67469596862793, "global_step": 213921, "epoch": 2577} {"train_loss": -24.413740158081055, "global_step": 213922, "epoch": 2577} {"train_loss": -24.368349075317383, "global_step": 213923, "epoch": 2577} {"train_loss": -24.3144474029541, "global_step": 213924, "epoch": 2577} {"train_loss": -24.572885513305664, "global_step": 213925, "epoch": 2577} {"train_loss": -24.36581802368164, "global_step": 213926, "epoch": 2577} {"train_loss": -24.46282958984375, "global_step": 213927, "epoch": 2577} {"train_loss": -24.531967163085938, "global_step": 213928, "epoch": 2577} {"train_loss": -24.5842342376709, "global_step": 213929, "epoch": 2577} {"train_loss": -24.409862518310547, "global_step": 213930, "epoch": 2577} {"train_loss": -24.24020767211914, "global_step": 213931, "epoch": 2577} {"train_loss": -24.864831924438477, "global_step": 213932, "epoch": 2577} {"train_loss": -24.419967651367188, "global_step": 213933, "epoch": 2577} {"train_loss": -24.2865047454834, "global_step": 213934, "epoch": 2577} {"train_loss": -25.053730010986328, "global_step": 213935, "epoch": 2577} {"train_loss": -24.22967529296875, "global_step": 213936, "epoch": 2577} {"train_loss": -24.001039505004883, "global_step": 213937, "epoch": 2577} {"train_loss": -24.329587936401367, "global_step": 213938, "epoch": 2577} {"train_loss": -24.454660415649414, "global_step": 213939, "epoch": 2577} {"train_loss": -24.443012237548828, "global_step": 213940, "epoch": 2577} {"train_loss": -25.09326171875, "global_step": 213941, "epoch": 2577} {"train_loss": -24.47649574279785, "global_step": 213942, "epoch": 2577} {"train_loss": -24.2070255279541, "global_step": 213943, "epoch": 2577} {"train_loss": -24.244977951049805, "global_step": 213944, "epoch": 2577} {"train_loss": -24.272916793823242, "global_step": 213945, "epoch": 2577} {"train_loss": -24.51694679260254, "global_step": 213946, "epoch": 2577} {"train_loss": -24.750843048095703, "global_step": 213947, "epoch": 2577} {"train_loss": -24.22089195251465, "global_step": 213948, "epoch": 2577} {"train_loss": -23.861276626586914, "global_step": 213949, "epoch": 2577} {"train_loss": -24.302963256835938, "global_step": 213950, "epoch": 2577} {"train_loss": -24.441152572631836, "global_step": 213951, "epoch": 2577} {"train_loss": -24.12789535522461, "global_step": 213952, "epoch": 2577} {"train_loss": -24.42974281311035, "global_step": 213953, "epoch": 2577} {"train_loss": -24.541471481323242, "global_step": 213954, "epoch": 2577} {"train_loss": -24.726594924926758, "global_step": 213955, "epoch": 2577} {"train_loss": -24.11981201171875, "global_step": 213956, "epoch": 2577} {"train_loss": -24.523590087890625, "global_step": 213957, "epoch": 2577} {"train_loss": -24.50312042236328, "global_step": 213958, "epoch": 2577} {"train_loss": -24.439472198486328, "global_step": 213959, "epoch": 2577} {"train_loss": -24.17937469482422, "global_step": 213960, "epoch": 2577} {"train_loss": -24.555265426635742, "global_step": 213961, "epoch": 2577} {"train_loss": -24.514745712280273, "global_step": 213962, "epoch": 2577} {"train_loss": -24.20187759399414, "global_step": 213963, "epoch": 2577} {"train_loss": -24.431119918823242, "global_step": 213964, "epoch": 2577} {"train_loss": -24.3924617767334, "global_step": 213965, "epoch": 2577} {"train_loss": -24.829450607299805, "global_step": 213966, "epoch": 2577} {"train_loss": -24.517133712768555, "global_step": 213967, "epoch": 2577} {"train_loss": -24.462234497070312, "global_step": 213968, "epoch": 2577} {"train_loss": -24.635587692260742, "global_step": 213969, "epoch": 2577} {"train_loss": -24.908777236938477, "global_step": 213970, "epoch": 2577} {"train_loss": -24.3958797454834, "global_step": 213971, "epoch": 2577} {"train_loss": -24.473365783691406, "global_step": 213972, "epoch": 2577} {"train_loss": -24.437785941434193, "global_step": 213973, "epoch": 2577, "val_loss": 6730045.0} {"train_loss": -24.60344123840332, "global_step": 213974, "epoch": 2578} {"train_loss": -24.482868194580078, "global_step": 213975, "epoch": 2578} {"train_loss": -24.300262451171875, "global_step": 213976, "epoch": 2578} {"train_loss": -24.270360946655273, "global_step": 213977, "epoch": 2578} {"train_loss": -24.033985137939453, "global_step": 213978, "epoch": 2578} {"train_loss": -24.29714584350586, "global_step": 213979, "epoch": 2578} {"train_loss": -24.623580932617188, "global_step": 213980, "epoch": 2578} {"train_loss": -24.37183380126953, "global_step": 213981, "epoch": 2578} {"train_loss": -24.06258201599121, "global_step": 213982, "epoch": 2578} {"train_loss": -24.587398529052734, "global_step": 213983, "epoch": 2578} {"train_loss": -24.6649227142334, "global_step": 213984, "epoch": 2578} {"train_loss": -24.28803062438965, "global_step": 213985, "epoch": 2578} {"train_loss": -24.26319694519043, "global_step": 213986, "epoch": 2578} {"train_loss": -24.303579330444336, "global_step": 213987, "epoch": 2578} {"train_loss": -24.462278366088867, "global_step": 213988, "epoch": 2578} {"train_loss": -23.926572799682617, "global_step": 213989, "epoch": 2578} {"train_loss": -24.17984962463379, "global_step": 213990, "epoch": 2578} {"train_loss": -24.73904037475586, "global_step": 213991, "epoch": 2578} {"train_loss": -24.590856552124023, "global_step": 213992, "epoch": 2578} {"train_loss": -24.745588302612305, "global_step": 213993, "epoch": 2578} {"train_loss": -24.506128311157227, "global_step": 213994, "epoch": 2578} {"train_loss": -24.561784744262695, "global_step": 213995, "epoch": 2578} {"train_loss": -24.450504302978516, "global_step": 213996, "epoch": 2578} {"train_loss": -24.413549423217773, "global_step": 213997, "epoch": 2578} {"train_loss": -24.459753036499023, "global_step": 213998, "epoch": 2578} {"train_loss": -24.921585083007812, "global_step": 213999, "epoch": 2578} {"train_loss": -24.4525146484375, "global_step": 214000, "epoch": 2578} {"train_loss": -24.5222110748291, "global_step": 214001, "epoch": 2578} {"train_loss": -24.37101173400879, "global_step": 214002, "epoch": 2578} {"train_loss": -24.503238677978516, "global_step": 214003, "epoch": 2578} {"train_loss": -24.522003173828125, "global_step": 214004, "epoch": 2578} {"train_loss": -25.18812370300293, "global_step": 214005, "epoch": 2578} {"train_loss": -24.397165298461914, "global_step": 214006, "epoch": 2578} {"train_loss": -24.44001007080078, "global_step": 214007, "epoch": 2578} {"train_loss": -24.080442428588867, "global_step": 214008, "epoch": 2578} {"train_loss": -24.603567123413086, "global_step": 214009, "epoch": 2578} {"train_loss": -24.385643005371094, "global_step": 214010, "epoch": 2578} {"train_loss": -24.584247589111328, "global_step": 214011, "epoch": 2578} {"train_loss": -24.2762393951416, "global_step": 214012, "epoch": 2578} {"train_loss": -24.804079055786133, "global_step": 214013, "epoch": 2578} {"train_loss": -24.61972427368164, "global_step": 214014, "epoch": 2578} {"train_loss": -24.76063346862793, "global_step": 214015, "epoch": 2578} {"train_loss": -24.689184188842773, "global_step": 214016, "epoch": 2578} {"train_loss": -24.718610763549805, "global_step": 214017, "epoch": 2578} {"train_loss": -24.78669548034668, "global_step": 214018, "epoch": 2578} {"train_loss": -24.653013229370117, "global_step": 214019, "epoch": 2578} {"train_loss": -24.65338706970215, "global_step": 214020, "epoch": 2578} {"train_loss": -24.601320266723633, "global_step": 214021, "epoch": 2578} {"train_loss": -24.578453063964844, "global_step": 214022, "epoch": 2578} {"train_loss": -24.682655334472656, "global_step": 214023, "epoch": 2578} {"train_loss": -24.791105270385742, "global_step": 214024, "epoch": 2578} {"train_loss": -24.647083282470703, "global_step": 214025, "epoch": 2578} {"train_loss": -24.053953170776367, "global_step": 214026, "epoch": 2578} {"train_loss": -23.222837448120117, "global_step": 214027, "epoch": 2578} {"train_loss": -22.68003273010254, "global_step": 214028, "epoch": 2578} {"train_loss": -23.432723999023438, "global_step": 214029, "epoch": 2578} {"train_loss": -24.406280517578125, "global_step": 214030, "epoch": 2578} {"train_loss": -23.6053524017334, "global_step": 214031, "epoch": 2578} {"train_loss": -24.328720092773438, "global_step": 214032, "epoch": 2578} {"train_loss": -23.922874450683594, "global_step": 214033, "epoch": 2578} {"train_loss": -24.15997886657715, "global_step": 214034, "epoch": 2578} {"train_loss": -24.024717330932617, "global_step": 214035, "epoch": 2578} {"train_loss": -23.90177345275879, "global_step": 214036, "epoch": 2578} {"train_loss": -23.944448471069336, "global_step": 214037, "epoch": 2578} {"train_loss": -24.03866958618164, "global_step": 214038, "epoch": 2578} {"train_loss": -24.2695369720459, "global_step": 214039, "epoch": 2578} {"train_loss": -23.934690475463867, "global_step": 214040, "epoch": 2578} {"train_loss": -24.03476905822754, "global_step": 214041, "epoch": 2578} {"train_loss": -24.238622665405273, "global_step": 214042, "epoch": 2578} {"train_loss": -24.403667449951172, "global_step": 214043, "epoch": 2578} {"train_loss": -24.448974609375, "global_step": 214044, "epoch": 2578} {"train_loss": -24.196779251098633, "global_step": 214045, "epoch": 2578} {"train_loss": -24.194355010986328, "global_step": 214046, "epoch": 2578} {"train_loss": -24.209447860717773, "global_step": 214047, "epoch": 2578} {"train_loss": -24.11980628967285, "global_step": 214048, "epoch": 2578} {"train_loss": -24.43451499938965, "global_step": 214049, "epoch": 2578} {"train_loss": -24.529333114624023, "global_step": 214050, "epoch": 2578} {"train_loss": -24.580341339111328, "global_step": 214051, "epoch": 2578} {"train_loss": -24.501310348510742, "global_step": 214052, "epoch": 2578} {"train_loss": -24.556591033935547, "global_step": 214053, "epoch": 2578} {"train_loss": -24.274795532226562, "global_step": 214054, "epoch": 2578} {"train_loss": -24.678028106689453, "global_step": 214055, "epoch": 2578} {"train_loss": -24.345278498638105, "global_step": 214056, "epoch": 2578, "val_loss": 6777046.0} {"train_loss": -24.16742515563965, "global_step": 214057, "epoch": 2579} {"train_loss": -24.38346290588379, "global_step": 214058, "epoch": 2579} {"train_loss": -24.13323974609375, "global_step": 214059, "epoch": 2579} {"train_loss": -24.36899185180664, "global_step": 214060, "epoch": 2579} {"train_loss": -24.535688400268555, "global_step": 214061, "epoch": 2579} {"train_loss": -24.561803817749023, "global_step": 214062, "epoch": 2579} {"train_loss": -24.287439346313477, "global_step": 214063, "epoch": 2579} {"train_loss": -24.574047088623047, "global_step": 214064, "epoch": 2579} {"train_loss": -24.852258682250977, "global_step": 214065, "epoch": 2579} {"train_loss": -24.90620231628418, "global_step": 214066, "epoch": 2579} {"train_loss": -24.81487274169922, "global_step": 214067, "epoch": 2579} {"train_loss": -24.364652633666992, "global_step": 214068, "epoch": 2579} {"train_loss": -24.52057456970215, "global_step": 214069, "epoch": 2579} {"train_loss": -24.503400802612305, "global_step": 214070, "epoch": 2579} {"train_loss": -24.64554214477539, "global_step": 214071, "epoch": 2579} {"train_loss": -24.734724044799805, "global_step": 214072, "epoch": 2579} {"train_loss": -24.303159713745117, "global_step": 214073, "epoch": 2579} {"train_loss": -24.60213279724121, "global_step": 214074, "epoch": 2579} {"train_loss": -24.56351089477539, "global_step": 214075, "epoch": 2579} {"train_loss": -24.4840030670166, "global_step": 214076, "epoch": 2579} {"train_loss": -24.410839080810547, "global_step": 214077, "epoch": 2579} {"train_loss": -24.523839950561523, "global_step": 214078, "epoch": 2579} {"train_loss": -24.63441276550293, "global_step": 214079, "epoch": 2579} {"train_loss": -24.8294620513916, "global_step": 214080, "epoch": 2579} {"train_loss": -24.598539352416992, "global_step": 214081, "epoch": 2579} {"train_loss": -24.63429832458496, "global_step": 214082, "epoch": 2579} {"train_loss": -24.37665557861328, "global_step": 214083, "epoch": 2579} {"train_loss": -24.587268829345703, "global_step": 214084, "epoch": 2579} {"train_loss": -24.51865577697754, "global_step": 214085, "epoch": 2579} {"train_loss": -23.786399841308594, "global_step": 214086, "epoch": 2579} {"train_loss": -24.371246337890625, "global_step": 214087, "epoch": 2579} {"train_loss": -24.274429321289062, "global_step": 214088, "epoch": 2579} {"train_loss": -24.405393600463867, "global_step": 214089, "epoch": 2579} {"train_loss": -24.662464141845703, "global_step": 214090, "epoch": 2579} {"train_loss": -24.7466983795166, "global_step": 214091, "epoch": 2579} {"train_loss": -24.520320892333984, "global_step": 214092, "epoch": 2579} {"train_loss": -24.48587989807129, "global_step": 214093, "epoch": 2579} {"train_loss": -24.620080947875977, "global_step": 214094, "epoch": 2579} {"train_loss": -24.49509620666504, "global_step": 214095, "epoch": 2579} {"train_loss": -24.586505889892578, "global_step": 214096, "epoch": 2579} {"train_loss": -24.190677642822266, "global_step": 214097, "epoch": 2579} {"train_loss": -24.24190330505371, "global_step": 214098, "epoch": 2579} {"train_loss": -24.500288009643555, "global_step": 214099, "epoch": 2579} {"train_loss": -24.6171875, "global_step": 214100, "epoch": 2579} {"train_loss": -24.49185562133789, "global_step": 214101, "epoch": 2579} {"train_loss": -24.37559700012207, "global_step": 214102, "epoch": 2579} {"train_loss": -24.770395278930664, "global_step": 214103, "epoch": 2579} {"train_loss": -24.45730209350586, "global_step": 214104, "epoch": 2579} {"train_loss": -24.559696197509766, "global_step": 214105, "epoch": 2579} {"train_loss": -24.347476959228516, "global_step": 214106, "epoch": 2579} {"train_loss": -24.773588180541992, "global_step": 214107, "epoch": 2579} {"train_loss": -24.721426010131836, "global_step": 214108, "epoch": 2579} {"train_loss": -24.45948600769043, "global_step": 214109, "epoch": 2579} {"train_loss": -24.69715118408203, "global_step": 214110, "epoch": 2579} {"train_loss": -24.9719181060791, "global_step": 214111, "epoch": 2579} {"train_loss": -24.83112907409668, "global_step": 214112, "epoch": 2579} {"train_loss": -24.51058006286621, "global_step": 214113, "epoch": 2579} {"train_loss": -24.63495635986328, "global_step": 214114, "epoch": 2579} {"train_loss": -24.4182186126709, "global_step": 214115, "epoch": 2579} {"train_loss": -24.11054801940918, "global_step": 214116, "epoch": 2579} {"train_loss": -24.280611038208008, "global_step": 214117, "epoch": 2579} {"train_loss": -24.689388275146484, "global_step": 214118, "epoch": 2579} {"train_loss": -24.287004470825195, "global_step": 214119, "epoch": 2579} {"train_loss": -24.65147590637207, "global_step": 214120, "epoch": 2579} {"train_loss": -24.39959144592285, "global_step": 214121, "epoch": 2579} {"train_loss": -24.20659637451172, "global_step": 214122, "epoch": 2579} {"train_loss": -24.328350067138672, "global_step": 214123, "epoch": 2579} {"train_loss": -24.38228416442871, "global_step": 214124, "epoch": 2579} {"train_loss": -24.60457420349121, "global_step": 214125, "epoch": 2579} {"train_loss": -24.422334671020508, "global_step": 214126, "epoch": 2579} {"train_loss": -24.884845733642578, "global_step": 214127, "epoch": 2579} {"train_loss": -24.05451011657715, "global_step": 214128, "epoch": 2579} {"train_loss": -24.420732498168945, "global_step": 214129, "epoch": 2579} {"train_loss": -24.269742965698242, "global_step": 214130, "epoch": 2579} {"train_loss": -24.381364822387695, "global_step": 214131, "epoch": 2579} {"train_loss": -24.700620651245117, "global_step": 214132, "epoch": 2579} {"train_loss": -24.532133102416992, "global_step": 214133, "epoch": 2579} {"train_loss": -24.428190231323242, "global_step": 214134, "epoch": 2579} {"train_loss": -24.584793090820312, "global_step": 214135, "epoch": 2579} {"train_loss": -24.832988739013672, "global_step": 214136, "epoch": 2579} {"train_loss": -24.613588333129883, "global_step": 214137, "epoch": 2579} {"train_loss": -24.580825805664062, "global_step": 214138, "epoch": 2579} {"train_loss": -24.499931381409425, "global_step": 214139, "epoch": 2579, "val_loss": 6678216.5} {"train_loss": -24.08660888671875, "global_step": 214140, "epoch": 2580} {"train_loss": -23.844802856445312, "global_step": 214141, "epoch": 2580} {"train_loss": -23.88680648803711, "global_step": 214142, "epoch": 2580} {"train_loss": -24.0845947265625, "global_step": 214143, "epoch": 2580} {"train_loss": -24.8030948638916, "global_step": 214144, "epoch": 2580} {"train_loss": -24.282657623291016, "global_step": 214145, "epoch": 2580} {"train_loss": -24.082019805908203, "global_step": 214146, "epoch": 2580} {"train_loss": -24.531164169311523, "global_step": 214147, "epoch": 2580} {"train_loss": -24.195709228515625, "global_step": 214148, "epoch": 2580} {"train_loss": -24.447324752807617, "global_step": 214149, "epoch": 2580} {"train_loss": -24.206483840942383, "global_step": 214150, "epoch": 2580} {"train_loss": -24.299205780029297, "global_step": 214151, "epoch": 2580} {"train_loss": -24.498510360717773, "global_step": 214152, "epoch": 2580} {"train_loss": -23.979642868041992, "global_step": 214153, "epoch": 2580} {"train_loss": -24.066818237304688, "global_step": 214154, "epoch": 2580} {"train_loss": -24.283451080322266, "global_step": 214155, "epoch": 2580} {"train_loss": -23.926485061645508, "global_step": 214156, "epoch": 2580} {"train_loss": -24.41765785217285, "global_step": 214157, "epoch": 2580} {"train_loss": -24.261310577392578, "global_step": 214158, "epoch": 2580} {"train_loss": -24.47157859802246, "global_step": 214159, "epoch": 2580} {"train_loss": -24.162067413330078, "global_step": 214160, "epoch": 2580} {"train_loss": -24.387351989746094, "global_step": 214161, "epoch": 2580} {"train_loss": -24.328290939331055, "global_step": 214162, "epoch": 2580} {"train_loss": -24.300819396972656, "global_step": 214163, "epoch": 2580} {"train_loss": -24.622732162475586, "global_step": 214164, "epoch": 2580} {"train_loss": -24.41936683654785, "global_step": 214165, "epoch": 2580} {"train_loss": -24.555675506591797, "global_step": 214166, "epoch": 2580} {"train_loss": -24.466796875, "global_step": 214167, "epoch": 2580} {"train_loss": -24.35161590576172, "global_step": 214168, "epoch": 2580} {"train_loss": -24.476911544799805, "global_step": 214169, "epoch": 2580} {"train_loss": -24.450149536132812, "global_step": 214170, "epoch": 2580} {"train_loss": -24.786954879760742, "global_step": 214171, "epoch": 2580} {"train_loss": -24.45554542541504, "global_step": 214172, "epoch": 2580} {"train_loss": -24.574682235717773, "global_step": 214173, "epoch": 2580} {"train_loss": -24.439298629760742, "global_step": 214174, "epoch": 2580} {"train_loss": -24.853172302246094, "global_step": 214175, "epoch": 2580} {"train_loss": -24.501806259155273, "global_step": 214176, "epoch": 2580} {"train_loss": -24.734811782836914, "global_step": 214177, "epoch": 2580} {"train_loss": -24.444482803344727, "global_step": 214178, "epoch": 2580} {"train_loss": -24.96766471862793, "global_step": 214179, "epoch": 2580} {"train_loss": -24.235158920288086, "global_step": 214180, "epoch": 2580} {"train_loss": -24.105087280273438, "global_step": 214181, "epoch": 2580} {"train_loss": -23.795093536376953, "global_step": 214182, "epoch": 2580} {"train_loss": -24.687501907348633, "global_step": 214183, "epoch": 2580} {"train_loss": -24.296918869018555, "global_step": 214184, "epoch": 2580} {"train_loss": -24.396520614624023, "global_step": 214185, "epoch": 2580} {"train_loss": -24.325925827026367, "global_step": 214186, "epoch": 2580} {"train_loss": -24.543500900268555, "global_step": 214187, "epoch": 2580} {"train_loss": -24.39796257019043, "global_step": 214188, "epoch": 2580} {"train_loss": -24.4379940032959, "global_step": 214189, "epoch": 2580} {"train_loss": -24.2254638671875, "global_step": 214190, "epoch": 2580} {"train_loss": -24.397003173828125, "global_step": 214191, "epoch": 2580} {"train_loss": -24.13675308227539, "global_step": 214192, "epoch": 2580} {"train_loss": -24.308629989624023, "global_step": 214193, "epoch": 2580} {"train_loss": -24.63764762878418, "global_step": 214194, "epoch": 2580} {"train_loss": -24.84577751159668, "global_step": 214195, "epoch": 2580} {"train_loss": -24.505090713500977, "global_step": 214196, "epoch": 2580} {"train_loss": -24.48624610900879, "global_step": 214197, "epoch": 2580} {"train_loss": -24.53839683532715, "global_step": 214198, "epoch": 2580} {"train_loss": -24.40598487854004, "global_step": 214199, "epoch": 2580} {"train_loss": -24.950857162475586, "global_step": 214200, "epoch": 2580} {"train_loss": -24.643766403198242, "global_step": 214201, "epoch": 2580} {"train_loss": -24.640317916870117, "global_step": 214202, "epoch": 2580} {"train_loss": -24.439767837524414, "global_step": 214203, "epoch": 2580} {"train_loss": -24.42599868774414, "global_step": 214204, "epoch": 2580} {"train_loss": -24.198579788208008, "global_step": 214205, "epoch": 2580} {"train_loss": -24.507919311523438, "global_step": 214206, "epoch": 2580} {"train_loss": -24.609312057495117, "global_step": 214207, "epoch": 2580} {"train_loss": -24.41337013244629, "global_step": 214208, "epoch": 2580} {"train_loss": -24.434831619262695, "global_step": 214209, "epoch": 2580} {"train_loss": -24.699216842651367, "global_step": 214210, "epoch": 2580} {"train_loss": -24.597057342529297, "global_step": 214211, "epoch": 2580} {"train_loss": -24.909753799438477, "global_step": 214212, "epoch": 2580} {"train_loss": -24.44576072692871, "global_step": 214213, "epoch": 2580} {"train_loss": -24.566652297973633, "global_step": 214214, "epoch": 2580} {"train_loss": -24.11079978942871, "global_step": 214215, "epoch": 2580} {"train_loss": -24.67124366760254, "global_step": 214216, "epoch": 2580} {"train_loss": -24.737524032592773, "global_step": 214217, "epoch": 2580} {"train_loss": -24.70849609375, "global_step": 214218, "epoch": 2580} {"train_loss": -24.67801856994629, "global_step": 214219, "epoch": 2580} {"train_loss": -24.673234939575195, "global_step": 214220, "epoch": 2580} {"train_loss": -24.78840446472168, "global_step": 214221, "epoch": 2580} {"train_loss": -24.457980466176227, "global_step": 214222, "epoch": 2580, "val_loss": 6555974.5} {"train_loss": -24.57835578918457, "global_step": 214223, "epoch": 2581} {"train_loss": -24.010793685913086, "global_step": 214224, "epoch": 2581} {"train_loss": -24.49282455444336, "global_step": 214225, "epoch": 2581} {"train_loss": -24.293485641479492, "global_step": 214226, "epoch": 2581} {"train_loss": -24.335189819335938, "global_step": 214227, "epoch": 2581} {"train_loss": -24.43710708618164, "global_step": 214228, "epoch": 2581} {"train_loss": -23.990598678588867, "global_step": 214229, "epoch": 2581} {"train_loss": -24.424028396606445, "global_step": 214230, "epoch": 2581} {"train_loss": -24.15141487121582, "global_step": 214231, "epoch": 2581} {"train_loss": -24.25046157836914, "global_step": 214232, "epoch": 2581} {"train_loss": -24.196332931518555, "global_step": 214233, "epoch": 2581} {"train_loss": -24.21675682067871, "global_step": 214234, "epoch": 2581} {"train_loss": -24.255027770996094, "global_step": 214235, "epoch": 2581} {"train_loss": -23.894590377807617, "global_step": 214236, "epoch": 2581} {"train_loss": -24.810823440551758, "global_step": 214237, "epoch": 2581} {"train_loss": -23.999248504638672, "global_step": 214238, "epoch": 2581} {"train_loss": -24.20867347717285, "global_step": 214239, "epoch": 2581} {"train_loss": -24.238046646118164, "global_step": 214240, "epoch": 2581} {"train_loss": -24.390287399291992, "global_step": 214241, "epoch": 2581} {"train_loss": -24.687997817993164, "global_step": 214242, "epoch": 2581} {"train_loss": -24.63587760925293, "global_step": 214243, "epoch": 2581} {"train_loss": -24.273298263549805, "global_step": 214244, "epoch": 2581} {"train_loss": -24.539274215698242, "global_step": 214245, "epoch": 2581} {"train_loss": -24.235109329223633, "global_step": 214246, "epoch": 2581} {"train_loss": -24.412145614624023, "global_step": 214247, "epoch": 2581} {"train_loss": -24.501840591430664, "global_step": 214248, "epoch": 2581} {"train_loss": -24.420360565185547, "global_step": 214249, "epoch": 2581} {"train_loss": -24.258588790893555, "global_step": 214250, "epoch": 2581} {"train_loss": -24.488454818725586, "global_step": 214251, "epoch": 2581} {"train_loss": -24.610754013061523, "global_step": 214252, "epoch": 2581} {"train_loss": -24.42816925048828, "global_step": 214253, "epoch": 2581} {"train_loss": -24.633657455444336, "global_step": 214254, "epoch": 2581} {"train_loss": -24.137100219726562, "global_step": 214255, "epoch": 2581} {"train_loss": -24.658517837524414, "global_step": 214256, "epoch": 2581} {"train_loss": -24.621091842651367, "global_step": 214257, "epoch": 2581} {"train_loss": -24.65669822692871, "global_step": 214258, "epoch": 2581} {"train_loss": -24.562463760375977, "global_step": 214259, "epoch": 2581} {"train_loss": -24.75292205810547, "global_step": 214260, "epoch": 2581} {"train_loss": -24.647565841674805, "global_step": 214261, "epoch": 2581} {"train_loss": -24.43410301208496, "global_step": 214262, "epoch": 2581} {"train_loss": -24.351844787597656, "global_step": 214263, "epoch": 2581} {"train_loss": -24.675291061401367, "global_step": 214264, "epoch": 2581} {"train_loss": -24.653974533081055, "global_step": 214265, "epoch": 2581} {"train_loss": -24.276681900024414, "global_step": 214266, "epoch": 2581} {"train_loss": -24.679983139038086, "global_step": 214267, "epoch": 2581} {"train_loss": -24.145963668823242, "global_step": 214268, "epoch": 2581} {"train_loss": -24.09272575378418, "global_step": 214269, "epoch": 2581} {"train_loss": -24.635610580444336, "global_step": 214270, "epoch": 2581} {"train_loss": -24.841920852661133, "global_step": 214271, "epoch": 2581} {"train_loss": -24.423864364624023, "global_step": 214272, "epoch": 2581} {"train_loss": -24.504487991333008, "global_step": 214273, "epoch": 2581} {"train_loss": -24.564069747924805, "global_step": 214274, "epoch": 2581} {"train_loss": -24.813220977783203, "global_step": 214275, "epoch": 2581} {"train_loss": -24.605146408081055, "global_step": 214276, "epoch": 2581} {"train_loss": -24.34029197692871, "global_step": 214277, "epoch": 2581} {"train_loss": -24.50982666015625, "global_step": 214278, "epoch": 2581} {"train_loss": -24.804237365722656, "global_step": 214279, "epoch": 2581} {"train_loss": -24.682586669921875, "global_step": 214280, "epoch": 2581} {"train_loss": -24.49838638305664, "global_step": 214281, "epoch": 2581} {"train_loss": -24.972415924072266, "global_step": 214282, "epoch": 2581} {"train_loss": -24.498228073120117, "global_step": 214283, "epoch": 2581} {"train_loss": -24.706632614135742, "global_step": 214284, "epoch": 2581} {"train_loss": -24.672704696655273, "global_step": 214285, "epoch": 2581} {"train_loss": -24.273012161254883, "global_step": 214286, "epoch": 2581} {"train_loss": -24.544998168945312, "global_step": 214287, "epoch": 2581} {"train_loss": -24.863561630249023, "global_step": 214288, "epoch": 2581} {"train_loss": -24.652708053588867, "global_step": 214289, "epoch": 2581} {"train_loss": -24.219135284423828, "global_step": 214290, "epoch": 2581} {"train_loss": -23.934310913085938, "global_step": 214291, "epoch": 2581} {"train_loss": -23.86261558532715, "global_step": 214292, "epoch": 2581} {"train_loss": -24.181974411010742, "global_step": 214293, "epoch": 2581} {"train_loss": -24.29351234436035, "global_step": 214294, "epoch": 2581} {"train_loss": -23.890188217163086, "global_step": 214295, "epoch": 2581} {"train_loss": -23.98642921447754, "global_step": 214296, "epoch": 2581} {"train_loss": -24.538904190063477, "global_step": 214297, "epoch": 2581} {"train_loss": -24.34820556640625, "global_step": 214298, "epoch": 2581} {"train_loss": -24.418350219726562, "global_step": 214299, "epoch": 2581} {"train_loss": -24.50325584411621, "global_step": 214300, "epoch": 2581} {"train_loss": -24.418716430664062, "global_step": 214301, "epoch": 2581} {"train_loss": -24.7763614654541, "global_step": 214302, "epoch": 2581} {"train_loss": -24.24519920349121, "global_step": 214303, "epoch": 2581} {"train_loss": -24.14474868774414, "global_step": 214304, "epoch": 2581} {"train_loss": -24.421455061579326, "global_step": 214305, "epoch": 2581, "val_loss": 6729072.0} {"train_loss": -23.963369369506836, "global_step": 214306, "epoch": 2582} {"train_loss": -24.37425422668457, "global_step": 214307, "epoch": 2582} {"train_loss": -24.252927780151367, "global_step": 214308, "epoch": 2582} {"train_loss": -24.28675079345703, "global_step": 214309, "epoch": 2582} {"train_loss": -23.943008422851562, "global_step": 214310, "epoch": 2582} {"train_loss": -24.36992645263672, "global_step": 214311, "epoch": 2582} {"train_loss": -24.203678131103516, "global_step": 214312, "epoch": 2582} {"train_loss": -24.472047805786133, "global_step": 214313, "epoch": 2582} {"train_loss": -23.849777221679688, "global_step": 214314, "epoch": 2582} {"train_loss": -24.390329360961914, "global_step": 214315, "epoch": 2582} {"train_loss": -24.236125946044922, "global_step": 214316, "epoch": 2582} {"train_loss": -24.490867614746094, "global_step": 214317, "epoch": 2582} {"train_loss": -24.781415939331055, "global_step": 214318, "epoch": 2582} {"train_loss": -24.463117599487305, "global_step": 214319, "epoch": 2582} {"train_loss": -24.36726951599121, "global_step": 214320, "epoch": 2582} {"train_loss": -24.56972312927246, "global_step": 214321, "epoch": 2582} {"train_loss": -24.59042739868164, "global_step": 214322, "epoch": 2582} {"train_loss": -24.56734275817871, "global_step": 214323, "epoch": 2582} {"train_loss": -24.333171844482422, "global_step": 214324, "epoch": 2582} {"train_loss": -24.26988983154297, "global_step": 214325, "epoch": 2582} {"train_loss": -24.7155818939209, "global_step": 214326, "epoch": 2582} {"train_loss": -24.37613296508789, "global_step": 214327, "epoch": 2582} {"train_loss": -24.803762435913086, "global_step": 214328, "epoch": 2582} {"train_loss": -24.59684181213379, "global_step": 214329, "epoch": 2582} {"train_loss": -24.832962036132812, "global_step": 214330, "epoch": 2582} {"train_loss": -24.42950439453125, "global_step": 214331, "epoch": 2582} {"train_loss": -24.664077758789062, "global_step": 214332, "epoch": 2582} {"train_loss": -24.197423934936523, "global_step": 214333, "epoch": 2582} {"train_loss": -24.81678581237793, "global_step": 214334, "epoch": 2582} {"train_loss": -24.740224838256836, "global_step": 214335, "epoch": 2582} {"train_loss": -24.534452438354492, "global_step": 214336, "epoch": 2582} {"train_loss": -24.20029640197754, "global_step": 214337, "epoch": 2582} {"train_loss": -24.343534469604492, "global_step": 214338, "epoch": 2582} {"train_loss": -23.921924591064453, "global_step": 214339, "epoch": 2582} {"train_loss": -24.544219970703125, "global_step": 214340, "epoch": 2582} {"train_loss": -24.176008224487305, "global_step": 214341, "epoch": 2582} {"train_loss": -24.13876724243164, "global_step": 214342, "epoch": 2582} {"train_loss": -24.36651039123535, "global_step": 214343, "epoch": 2582} {"train_loss": -24.335355758666992, "global_step": 214344, "epoch": 2582} {"train_loss": -24.57418441772461, "global_step": 214345, "epoch": 2582} {"train_loss": -24.177501678466797, "global_step": 214346, "epoch": 2582} {"train_loss": -24.423059463500977, "global_step": 214347, "epoch": 2582} {"train_loss": -24.432132720947266, "global_step": 214348, "epoch": 2582} {"train_loss": -24.642913818359375, "global_step": 214349, "epoch": 2582} {"train_loss": -24.48065185546875, "global_step": 214350, "epoch": 2582} {"train_loss": -24.531951904296875, "global_step": 214351, "epoch": 2582} {"train_loss": -24.496076583862305, "global_step": 214352, "epoch": 2582} {"train_loss": -24.487695693969727, "global_step": 214353, "epoch": 2582} {"train_loss": -24.757614135742188, "global_step": 214354, "epoch": 2582} {"train_loss": -24.664037704467773, "global_step": 214355, "epoch": 2582} {"train_loss": -24.47504997253418, "global_step": 214356, "epoch": 2582} {"train_loss": -24.537031173706055, "global_step": 214357, "epoch": 2582} {"train_loss": -24.24275016784668, "global_step": 214358, "epoch": 2582} {"train_loss": -24.41339683532715, "global_step": 214359, "epoch": 2582} {"train_loss": -24.724119186401367, "global_step": 214360, "epoch": 2582} {"train_loss": -24.206708908081055, "global_step": 214361, "epoch": 2582} {"train_loss": -24.600664138793945, "global_step": 214362, "epoch": 2582} {"train_loss": -24.746601104736328, "global_step": 214363, "epoch": 2582} {"train_loss": -24.803651809692383, "global_step": 214364, "epoch": 2582} {"train_loss": -24.73175621032715, "global_step": 214365, "epoch": 2582} {"train_loss": -24.72242546081543, "global_step": 214366, "epoch": 2582} {"train_loss": -24.287118911743164, "global_step": 214367, "epoch": 2582} {"train_loss": -24.557287216186523, "global_step": 214368, "epoch": 2582} {"train_loss": -24.39405632019043, "global_step": 214369, "epoch": 2582} {"train_loss": -24.58340835571289, "global_step": 214370, "epoch": 2582} {"train_loss": -24.25482749938965, "global_step": 214371, "epoch": 2582} {"train_loss": -24.55259132385254, "global_step": 214372, "epoch": 2582} {"train_loss": -24.437149047851562, "global_step": 214373, "epoch": 2582} {"train_loss": -24.876802444458008, "global_step": 214374, "epoch": 2582} {"train_loss": -24.685697555541992, "global_step": 214375, "epoch": 2582} {"train_loss": -24.151004791259766, "global_step": 214376, "epoch": 2582} {"train_loss": -24.2949275970459, "global_step": 214377, "epoch": 2582} {"train_loss": -24.45279884338379, "global_step": 214378, "epoch": 2582} {"train_loss": -24.399316787719727, "global_step": 214379, "epoch": 2582} {"train_loss": -24.63640785217285, "global_step": 214380, "epoch": 2582} {"train_loss": -24.187223434448242, "global_step": 214381, "epoch": 2582} {"train_loss": -24.603918075561523, "global_step": 214382, "epoch": 2582} {"train_loss": -24.685453414916992, "global_step": 214383, "epoch": 2582} {"train_loss": -24.5083065032959, "global_step": 214384, "epoch": 2582} {"train_loss": -24.173828125, "global_step": 214385, "epoch": 2582} {"train_loss": -24.421472549438477, "global_step": 214386, "epoch": 2582} {"train_loss": -24.782062530517578, "global_step": 214387, "epoch": 2582} {"train_loss": -24.4554225507989, "global_step": 214388, "epoch": 2582, "val_loss": 6672278.0} {"train_loss": -23.744970321655273, "global_step": 214389, "epoch": 2583} {"train_loss": -24.330549240112305, "global_step": 214390, "epoch": 2583} {"train_loss": -24.369449615478516, "global_step": 214391, "epoch": 2583} {"train_loss": -24.158140182495117, "global_step": 214392, "epoch": 2583} {"train_loss": -24.21518898010254, "global_step": 214393, "epoch": 2583} {"train_loss": -24.088563919067383, "global_step": 214394, "epoch": 2583} {"train_loss": -24.417972564697266, "global_step": 214395, "epoch": 2583} {"train_loss": -24.168685913085938, "global_step": 214396, "epoch": 2583} {"train_loss": -23.901123046875, "global_step": 214397, "epoch": 2583} {"train_loss": -24.09552001953125, "global_step": 214398, "epoch": 2583} {"train_loss": -24.4661922454834, "global_step": 214399, "epoch": 2583} {"train_loss": -24.12550163269043, "global_step": 214400, "epoch": 2583} {"train_loss": -24.478893280029297, "global_step": 214401, "epoch": 2583} {"train_loss": -24.057336807250977, "global_step": 214402, "epoch": 2583} {"train_loss": -24.289762496948242, "global_step": 214403, "epoch": 2583} {"train_loss": -24.772642135620117, "global_step": 214404, "epoch": 2583} {"train_loss": -24.345928192138672, "global_step": 214405, "epoch": 2583} {"train_loss": -24.617923736572266, "global_step": 214406, "epoch": 2583} {"train_loss": -24.438030242919922, "global_step": 214407, "epoch": 2583} {"train_loss": -24.556264877319336, "global_step": 214408, "epoch": 2583} {"train_loss": -24.547147750854492, "global_step": 214409, "epoch": 2583} {"train_loss": -24.43375015258789, "global_step": 214410, "epoch": 2583} {"train_loss": -24.468408584594727, "global_step": 214411, "epoch": 2583} {"train_loss": -24.910017013549805, "global_step": 214412, "epoch": 2583} {"train_loss": -24.327116012573242, "global_step": 214413, "epoch": 2583} {"train_loss": -24.229475021362305, "global_step": 214414, "epoch": 2583} {"train_loss": -24.18246841430664, "global_step": 214415, "epoch": 2583} {"train_loss": -24.09637451171875, "global_step": 214416, "epoch": 2583} {"train_loss": -24.30855369567871, "global_step": 214417, "epoch": 2583} {"train_loss": -24.487817764282227, "global_step": 214418, "epoch": 2583} {"train_loss": -24.446767807006836, "global_step": 214419, "epoch": 2583} {"train_loss": -24.32187843322754, "global_step": 214420, "epoch": 2583} {"train_loss": -24.618967056274414, "global_step": 214421, "epoch": 2583} {"train_loss": -24.502351760864258, "global_step": 214422, "epoch": 2583} {"train_loss": -24.464506149291992, "global_step": 214423, "epoch": 2583} {"train_loss": -24.38910484313965, "global_step": 214424, "epoch": 2583} {"train_loss": -24.54326820373535, "global_step": 214425, "epoch": 2583} {"train_loss": -24.175098419189453, "global_step": 214426, "epoch": 2583} {"train_loss": -24.290109634399414, "global_step": 214427, "epoch": 2583} {"train_loss": -24.28988265991211, "global_step": 214428, "epoch": 2583} {"train_loss": -24.876754760742188, "global_step": 214429, "epoch": 2583} {"train_loss": -24.374990463256836, "global_step": 214430, "epoch": 2583} {"train_loss": -24.910160064697266, "global_step": 214431, "epoch": 2583} {"train_loss": -24.527128219604492, "global_step": 214432, "epoch": 2583} {"train_loss": -24.55525016784668, "global_step": 214433, "epoch": 2583} {"train_loss": -24.76935386657715, "global_step": 214434, "epoch": 2583} {"train_loss": -24.248680114746094, "global_step": 214435, "epoch": 2583} {"train_loss": -24.42014503479004, "global_step": 214436, "epoch": 2583} {"train_loss": -24.578609466552734, "global_step": 214437, "epoch": 2583} {"train_loss": -24.546463012695312, "global_step": 214438, "epoch": 2583} {"train_loss": -24.604883193969727, "global_step": 214439, "epoch": 2583} {"train_loss": -24.36810874938965, "global_step": 214440, "epoch": 2583} {"train_loss": -24.218826293945312, "global_step": 214441, "epoch": 2583} {"train_loss": -24.38158416748047, "global_step": 214442, "epoch": 2583} {"train_loss": -24.323389053344727, "global_step": 214443, "epoch": 2583} {"train_loss": -24.470985412597656, "global_step": 214444, "epoch": 2583} {"train_loss": -24.88251304626465, "global_step": 214445, "epoch": 2583} {"train_loss": -24.4213809967041, "global_step": 214446, "epoch": 2583} {"train_loss": -24.452871322631836, "global_step": 214447, "epoch": 2583} {"train_loss": -24.458646774291992, "global_step": 214448, "epoch": 2583} {"train_loss": -24.70723533630371, "global_step": 214449, "epoch": 2583} {"train_loss": -24.492467880249023, "global_step": 214450, "epoch": 2583} {"train_loss": -24.404022216796875, "global_step": 214451, "epoch": 2583} {"train_loss": -24.17119598388672, "global_step": 214452, "epoch": 2583} {"train_loss": -24.266813278198242, "global_step": 214453, "epoch": 2583} {"train_loss": -24.2111873626709, "global_step": 214454, "epoch": 2583} {"train_loss": -24.3436279296875, "global_step": 214455, "epoch": 2583} {"train_loss": -24.316490173339844, "global_step": 214456, "epoch": 2583} {"train_loss": -24.06245231628418, "global_step": 214457, "epoch": 2583} {"train_loss": -24.248571395874023, "global_step": 214458, "epoch": 2583} {"train_loss": -24.375289916992188, "global_step": 214459, "epoch": 2583} {"train_loss": -24.533506393432617, "global_step": 214460, "epoch": 2583} {"train_loss": -24.086410522460938, "global_step": 214461, "epoch": 2583} {"train_loss": -24.21059226989746, "global_step": 214462, "epoch": 2583} {"train_loss": -24.71394157409668, "global_step": 214463, "epoch": 2583} {"train_loss": -24.152280807495117, "global_step": 214464, "epoch": 2583} {"train_loss": -24.311664581298828, "global_step": 214465, "epoch": 2583} {"train_loss": -24.28999900817871, "global_step": 214466, "epoch": 2583} {"train_loss": -24.518400192260742, "global_step": 214467, "epoch": 2583} {"train_loss": -24.177804946899414, "global_step": 214468, "epoch": 2583} {"train_loss": -24.294818878173828, "global_step": 214469, "epoch": 2583} {"train_loss": -24.80624008178711, "global_step": 214470, "epoch": 2583} {"train_loss": -24.374978076980774, "global_step": 214471, "epoch": 2583, "val_loss": 6735642.0} {"train_loss": -24.537765502929688, "global_step": 214472, "epoch": 2584} {"train_loss": -24.201934814453125, "global_step": 214473, "epoch": 2584} {"train_loss": -23.77068519592285, "global_step": 214474, "epoch": 2584} {"train_loss": -24.05862808227539, "global_step": 214475, "epoch": 2584} {"train_loss": -23.773778915405273, "global_step": 214476, "epoch": 2584} {"train_loss": -24.177770614624023, "global_step": 214477, "epoch": 2584} {"train_loss": -24.2153263092041, "global_step": 214478, "epoch": 2584} {"train_loss": -24.27405548095703, "global_step": 214479, "epoch": 2584} {"train_loss": -24.28530502319336, "global_step": 214480, "epoch": 2584} {"train_loss": -24.0858211517334, "global_step": 214481, "epoch": 2584} {"train_loss": -24.1307430267334, "global_step": 214482, "epoch": 2584} {"train_loss": -24.38711929321289, "global_step": 214483, "epoch": 2584} {"train_loss": -24.034284591674805, "global_step": 214484, "epoch": 2584} {"train_loss": -24.320829391479492, "global_step": 214485, "epoch": 2584} {"train_loss": -24.358972549438477, "global_step": 214486, "epoch": 2584} {"train_loss": -24.57474708557129, "global_step": 214487, "epoch": 2584} {"train_loss": -24.250829696655273, "global_step": 214488, "epoch": 2584} {"train_loss": -24.645505905151367, "global_step": 214489, "epoch": 2584} {"train_loss": -24.511817932128906, "global_step": 214490, "epoch": 2584} {"train_loss": -24.406169891357422, "global_step": 214491, "epoch": 2584} {"train_loss": -24.247156143188477, "global_step": 214492, "epoch": 2584} {"train_loss": -24.38527488708496, "global_step": 214493, "epoch": 2584} {"train_loss": -24.13144874572754, "global_step": 214494, "epoch": 2584} {"train_loss": -24.483585357666016, "global_step": 214495, "epoch": 2584} {"train_loss": -24.641199111938477, "global_step": 214496, "epoch": 2584} {"train_loss": -24.564502716064453, "global_step": 214497, "epoch": 2584} {"train_loss": -24.39609146118164, "global_step": 214498, "epoch": 2584} {"train_loss": -24.829853057861328, "global_step": 214499, "epoch": 2584} {"train_loss": -24.498188018798828, "global_step": 214500, "epoch": 2584} {"train_loss": -24.585865020751953, "global_step": 214501, "epoch": 2584} {"train_loss": -24.386198043823242, "global_step": 214502, "epoch": 2584} {"train_loss": -24.404626846313477, "global_step": 214503, "epoch": 2584} {"train_loss": -24.733604431152344, "global_step": 214504, "epoch": 2584} {"train_loss": -24.410520553588867, "global_step": 214505, "epoch": 2584} {"train_loss": -24.652082443237305, "global_step": 214506, "epoch": 2584} {"train_loss": -24.738882064819336, "global_step": 214507, "epoch": 2584} {"train_loss": -24.530075073242188, "global_step": 214508, "epoch": 2584} {"train_loss": -24.177085876464844, "global_step": 214509, "epoch": 2584} {"train_loss": -24.315204620361328, "global_step": 214510, "epoch": 2584} {"train_loss": -24.378150939941406, "global_step": 214511, "epoch": 2584} {"train_loss": -24.31369400024414, "global_step": 214512, "epoch": 2584} {"train_loss": -23.760541915893555, "global_step": 214513, "epoch": 2584} {"train_loss": -24.079538345336914, "global_step": 214514, "epoch": 2584} {"train_loss": -24.402374267578125, "global_step": 214515, "epoch": 2584} {"train_loss": -24.350082397460938, "global_step": 214516, "epoch": 2584} {"train_loss": -24.588062286376953, "global_step": 214517, "epoch": 2584} {"train_loss": -24.54781150817871, "global_step": 214518, "epoch": 2584} {"train_loss": -24.162586212158203, "global_step": 214519, "epoch": 2584} {"train_loss": -23.9803466796875, "global_step": 214520, "epoch": 2584} {"train_loss": -23.761144638061523, "global_step": 214521, "epoch": 2584} {"train_loss": -24.335227966308594, "global_step": 214522, "epoch": 2584} {"train_loss": -24.206008911132812, "global_step": 214523, "epoch": 2584} {"train_loss": -23.178340911865234, "global_step": 214524, "epoch": 2584} {"train_loss": -24.427614212036133, "global_step": 214525, "epoch": 2584} {"train_loss": -24.55454444885254, "global_step": 214526, "epoch": 2584} {"train_loss": -24.299959182739258, "global_step": 214527, "epoch": 2584} {"train_loss": -24.303442001342773, "global_step": 214528, "epoch": 2584} {"train_loss": -24.174564361572266, "global_step": 214529, "epoch": 2584} {"train_loss": -24.424867630004883, "global_step": 214530, "epoch": 2584} {"train_loss": -24.270978927612305, "global_step": 214531, "epoch": 2584} {"train_loss": -24.022611618041992, "global_step": 214532, "epoch": 2584} {"train_loss": -24.302762985229492, "global_step": 214533, "epoch": 2584} {"train_loss": -24.337650299072266, "global_step": 214534, "epoch": 2584} {"train_loss": -24.33526611328125, "global_step": 214535, "epoch": 2584} {"train_loss": -24.23500633239746, "global_step": 214536, "epoch": 2584} {"train_loss": -24.83710289001465, "global_step": 214537, "epoch": 2584} {"train_loss": -24.42400550842285, "global_step": 214538, "epoch": 2584} {"train_loss": -24.401750564575195, "global_step": 214539, "epoch": 2584} {"train_loss": -24.497299194335938, "global_step": 214540, "epoch": 2584} {"train_loss": -24.73122787475586, "global_step": 214541, "epoch": 2584} {"train_loss": -24.595251083374023, "global_step": 214542, "epoch": 2584} {"train_loss": -24.532411575317383, "global_step": 214543, "epoch": 2584} {"train_loss": -24.58891487121582, "global_step": 214544, "epoch": 2584} {"train_loss": -24.48186492919922, "global_step": 214545, "epoch": 2584} {"train_loss": -24.623788833618164, "global_step": 214546, "epoch": 2584} {"train_loss": -24.483728408813477, "global_step": 214547, "epoch": 2584} {"train_loss": -24.28824234008789, "global_step": 214548, "epoch": 2584} {"train_loss": -24.50977325439453, "global_step": 214549, "epoch": 2584} {"train_loss": -24.703062057495117, "global_step": 214550, "epoch": 2584} {"train_loss": -24.535194396972656, "global_step": 214551, "epoch": 2584} {"train_loss": -24.4100284576416, "global_step": 214552, "epoch": 2584} {"train_loss": -24.49884033203125, "global_step": 214553, "epoch": 2584} {"train_loss": -24.342408559408533, "global_step": 214554, "epoch": 2584, "val_loss": 6610541.0} {"train_loss": -24.218372344970703, "global_step": 214555, "epoch": 2585} {"train_loss": -23.590778350830078, "global_step": 214556, "epoch": 2585} {"train_loss": -24.1091251373291, "global_step": 214557, "epoch": 2585} {"train_loss": -24.03351593017578, "global_step": 214558, "epoch": 2585} {"train_loss": -24.136194229125977, "global_step": 214559, "epoch": 2585} {"train_loss": -24.391685485839844, "global_step": 214560, "epoch": 2585} {"train_loss": -24.079442977905273, "global_step": 214561, "epoch": 2585} {"train_loss": -24.355100631713867, "global_step": 214562, "epoch": 2585} {"train_loss": -24.4146785736084, "global_step": 214563, "epoch": 2585} {"train_loss": -24.294174194335938, "global_step": 214564, "epoch": 2585} {"train_loss": -24.32660484313965, "global_step": 214565, "epoch": 2585} {"train_loss": -24.314701080322266, "global_step": 214566, "epoch": 2585} {"train_loss": -24.258197784423828, "global_step": 214567, "epoch": 2585} {"train_loss": -24.320520401000977, "global_step": 214568, "epoch": 2585} {"train_loss": -24.1400203704834, "global_step": 214569, "epoch": 2585} {"train_loss": -24.550390243530273, "global_step": 214570, "epoch": 2585} {"train_loss": -24.282554626464844, "global_step": 214571, "epoch": 2585} {"train_loss": -24.714399337768555, "global_step": 214572, "epoch": 2585} {"train_loss": -24.22905921936035, "global_step": 214573, "epoch": 2585} {"train_loss": -24.182157516479492, "global_step": 214574, "epoch": 2585} {"train_loss": -24.271224975585938, "global_step": 214575, "epoch": 2585} {"train_loss": -24.252262115478516, "global_step": 214576, "epoch": 2585} {"train_loss": -24.628171920776367, "global_step": 214577, "epoch": 2585} {"train_loss": -24.473129272460938, "global_step": 214578, "epoch": 2585} {"train_loss": -24.70295524597168, "global_step": 214579, "epoch": 2585} {"train_loss": -24.72881507873535, "global_step": 214580, "epoch": 2585} {"train_loss": -24.557941436767578, "global_step": 214581, "epoch": 2585} {"train_loss": -24.27779197692871, "global_step": 214582, "epoch": 2585} {"train_loss": -24.49934196472168, "global_step": 214583, "epoch": 2585} {"train_loss": -24.715030670166016, "global_step": 214584, "epoch": 2585} {"train_loss": -24.13301658630371, "global_step": 214585, "epoch": 2585} {"train_loss": -24.501617431640625, "global_step": 214586, "epoch": 2585} {"train_loss": -24.450109481811523, "global_step": 214587, "epoch": 2585} {"train_loss": -24.74070930480957, "global_step": 214588, "epoch": 2585} {"train_loss": -24.484844207763672, "global_step": 214589, "epoch": 2585} {"train_loss": -24.637889862060547, "global_step": 214590, "epoch": 2585} {"train_loss": -24.885425567626953, "global_step": 214591, "epoch": 2585} {"train_loss": -24.468652725219727, "global_step": 214592, "epoch": 2585} {"train_loss": -25.01117706298828, "global_step": 214593, "epoch": 2585} {"train_loss": -24.600704193115234, "global_step": 214594, "epoch": 2585} {"train_loss": -24.5543155670166, "global_step": 214595, "epoch": 2585} {"train_loss": -24.309045791625977, "global_step": 214596, "epoch": 2585} {"train_loss": -24.2525634765625, "global_step": 214597, "epoch": 2585} {"train_loss": -24.55048370361328, "global_step": 214598, "epoch": 2585} {"train_loss": -24.495996475219727, "global_step": 214599, "epoch": 2585} {"train_loss": -24.873302459716797, "global_step": 214600, "epoch": 2585} {"train_loss": -24.388202667236328, "global_step": 214601, "epoch": 2585} {"train_loss": -25.0861759185791, "global_step": 214602, "epoch": 2585} {"train_loss": -24.793588638305664, "global_step": 214603, "epoch": 2585} {"train_loss": -24.77864646911621, "global_step": 214604, "epoch": 2585} {"train_loss": -24.791772842407227, "global_step": 214605, "epoch": 2585} {"train_loss": -24.64504051208496, "global_step": 214606, "epoch": 2585} {"train_loss": -24.462377548217773, "global_step": 214607, "epoch": 2585} {"train_loss": -24.591943740844727, "global_step": 214608, "epoch": 2585} {"train_loss": -24.549270629882812, "global_step": 214609, "epoch": 2585} {"train_loss": -24.550434112548828, "global_step": 214610, "epoch": 2585} {"train_loss": -24.135927200317383, "global_step": 214611, "epoch": 2585} {"train_loss": -24.56086540222168, "global_step": 214612, "epoch": 2585} {"train_loss": -25.149404525756836, "global_step": 214613, "epoch": 2585} {"train_loss": -24.24690055847168, "global_step": 214614, "epoch": 2585} {"train_loss": -24.60069465637207, "global_step": 214615, "epoch": 2585} {"train_loss": -24.09417724609375, "global_step": 214616, "epoch": 2585} {"train_loss": -24.223377227783203, "global_step": 214617, "epoch": 2585} {"train_loss": -24.37202262878418, "global_step": 214618, "epoch": 2585} {"train_loss": -23.82474136352539, "global_step": 214619, "epoch": 2585} {"train_loss": -23.90018653869629, "global_step": 214620, "epoch": 2585} {"train_loss": -24.835569381713867, "global_step": 214621, "epoch": 2585} {"train_loss": -23.875822067260742, "global_step": 214622, "epoch": 2585} {"train_loss": -23.91888999938965, "global_step": 214623, "epoch": 2585} {"train_loss": -23.88356590270996, "global_step": 214624, "epoch": 2585} {"train_loss": -24.18794822692871, "global_step": 214625, "epoch": 2585} {"train_loss": -24.434551239013672, "global_step": 214626, "epoch": 2585} {"train_loss": -24.193693161010742, "global_step": 214627, "epoch": 2585} {"train_loss": -24.169334411621094, "global_step": 214628, "epoch": 2585} {"train_loss": -24.320411682128906, "global_step": 214629, "epoch": 2585} {"train_loss": -24.25843048095703, "global_step": 214630, "epoch": 2585} {"train_loss": -24.327533721923828, "global_step": 214631, "epoch": 2585} {"train_loss": -24.597213745117188, "global_step": 214632, "epoch": 2585} {"train_loss": -24.16608238220215, "global_step": 214633, "epoch": 2585} {"train_loss": -24.58356285095215, "global_step": 214634, "epoch": 2585} {"train_loss": -24.362030029296875, "global_step": 214635, "epoch": 2585} {"train_loss": -24.08582878112793, "global_step": 214636, "epoch": 2585} {"train_loss": -24.419091190200255, "global_step": 214637, "epoch": 2585, "val_loss": 6461518.0} {"train_loss": -24.36396598815918, "global_step": 214638, "epoch": 2586} {"train_loss": -24.37392234802246, "global_step": 214639, "epoch": 2586} {"train_loss": -24.179033279418945, "global_step": 214640, "epoch": 2586} {"train_loss": -24.137067794799805, "global_step": 214641, "epoch": 2586} {"train_loss": -24.478628158569336, "global_step": 214642, "epoch": 2586} {"train_loss": -24.578275680541992, "global_step": 214643, "epoch": 2586} {"train_loss": -24.261327743530273, "global_step": 214644, "epoch": 2586} {"train_loss": -24.4500789642334, "global_step": 214645, "epoch": 2586} {"train_loss": -24.65997886657715, "global_step": 214646, "epoch": 2586} {"train_loss": -23.892499923706055, "global_step": 214647, "epoch": 2586} {"train_loss": -24.48322105407715, "global_step": 214648, "epoch": 2586} {"train_loss": -24.37635612487793, "global_step": 214649, "epoch": 2586} {"train_loss": -24.04343605041504, "global_step": 214650, "epoch": 2586} {"train_loss": -24.40411376953125, "global_step": 214651, "epoch": 2586} {"train_loss": -24.59685516357422, "global_step": 214652, "epoch": 2586} {"train_loss": -24.428373336791992, "global_step": 214653, "epoch": 2586} {"train_loss": -24.70999526977539, "global_step": 214654, "epoch": 2586} {"train_loss": -24.232807159423828, "global_step": 214655, "epoch": 2586} {"train_loss": -24.762121200561523, "global_step": 214656, "epoch": 2586} {"train_loss": -24.369304656982422, "global_step": 214657, "epoch": 2586} {"train_loss": -24.788503646850586, "global_step": 214658, "epoch": 2586} {"train_loss": -24.35987091064453, "global_step": 214659, "epoch": 2586} {"train_loss": -24.50214958190918, "global_step": 214660, "epoch": 2586} {"train_loss": -24.36423110961914, "global_step": 214661, "epoch": 2586} {"train_loss": -24.600324630737305, "global_step": 214662, "epoch": 2586} {"train_loss": -24.85238265991211, "global_step": 214663, "epoch": 2586} {"train_loss": -24.37764549255371, "global_step": 214664, "epoch": 2586} {"train_loss": -24.773473739624023, "global_step": 214665, "epoch": 2586} {"train_loss": -24.700706481933594, "global_step": 214666, "epoch": 2586} {"train_loss": -24.423255920410156, "global_step": 214667, "epoch": 2586} {"train_loss": -24.844284057617188, "global_step": 214668, "epoch": 2586} {"train_loss": -24.413793563842773, "global_step": 214669, "epoch": 2586} {"train_loss": -24.12871742248535, "global_step": 214670, "epoch": 2586} {"train_loss": -23.942344665527344, "global_step": 214671, "epoch": 2586} {"train_loss": -24.19352149963379, "global_step": 214672, "epoch": 2586} {"train_loss": -24.01712989807129, "global_step": 214673, "epoch": 2586} {"train_loss": -24.35284423828125, "global_step": 214674, "epoch": 2586} {"train_loss": -24.045825958251953, "global_step": 214675, "epoch": 2586} {"train_loss": -24.342187881469727, "global_step": 214676, "epoch": 2586} {"train_loss": -24.355594635009766, "global_step": 214677, "epoch": 2586} {"train_loss": -24.556249618530273, "global_step": 214678, "epoch": 2586} {"train_loss": -23.92302131652832, "global_step": 214679, "epoch": 2586} {"train_loss": -24.707019805908203, "global_step": 214680, "epoch": 2586} {"train_loss": -24.182064056396484, "global_step": 214681, "epoch": 2586} {"train_loss": -23.988988876342773, "global_step": 214682, "epoch": 2586} {"train_loss": -24.321332931518555, "global_step": 214683, "epoch": 2586} {"train_loss": -24.233335494995117, "global_step": 214684, "epoch": 2586} {"train_loss": -24.125513076782227, "global_step": 214685, "epoch": 2586} {"train_loss": -24.242475509643555, "global_step": 214686, "epoch": 2586} {"train_loss": -24.301279067993164, "global_step": 214687, "epoch": 2586} {"train_loss": -24.089006423950195, "global_step": 214688, "epoch": 2586} {"train_loss": -24.355966567993164, "global_step": 214689, "epoch": 2586} {"train_loss": -24.37199592590332, "global_step": 214690, "epoch": 2586} {"train_loss": -24.103200912475586, "global_step": 214691, "epoch": 2586} {"train_loss": -24.158653259277344, "global_step": 214692, "epoch": 2586} {"train_loss": -24.143476486206055, "global_step": 214693, "epoch": 2586} {"train_loss": -24.88222312927246, "global_step": 214694, "epoch": 2586} {"train_loss": -24.271717071533203, "global_step": 214695, "epoch": 2586} {"train_loss": -24.850309371948242, "global_step": 214696, "epoch": 2586} {"train_loss": -24.923635482788086, "global_step": 214697, "epoch": 2586} {"train_loss": -24.648527145385742, "global_step": 214698, "epoch": 2586} {"train_loss": -24.365392684936523, "global_step": 214699, "epoch": 2586} {"train_loss": -24.541858673095703, "global_step": 214700, "epoch": 2586} {"train_loss": -24.837263107299805, "global_step": 214701, "epoch": 2586} {"train_loss": -24.83160972595215, "global_step": 214702, "epoch": 2586} {"train_loss": -24.496835708618164, "global_step": 214703, "epoch": 2586} {"train_loss": -24.545074462890625, "global_step": 214704, "epoch": 2586} {"train_loss": -24.36757469177246, "global_step": 214705, "epoch": 2586} {"train_loss": -24.73206901550293, "global_step": 214706, "epoch": 2586} {"train_loss": -24.317325592041016, "global_step": 214707, "epoch": 2586} {"train_loss": -24.22216796875, "global_step": 214708, "epoch": 2586} {"train_loss": -24.764265060424805, "global_step": 214709, "epoch": 2586} {"train_loss": -24.865278244018555, "global_step": 214710, "epoch": 2586} {"train_loss": -24.59771728515625, "global_step": 214711, "epoch": 2586} {"train_loss": -24.6585636138916, "global_step": 214712, "epoch": 2586} {"train_loss": -24.613956451416016, "global_step": 214713, "epoch": 2586} {"train_loss": -24.8564395904541, "global_step": 214714, "epoch": 2586} {"train_loss": -24.6158504486084, "global_step": 214715, "epoch": 2586} {"train_loss": -24.461833953857422, "global_step": 214716, "epoch": 2586} {"train_loss": -24.566843032836914, "global_step": 214717, "epoch": 2586} {"train_loss": -24.122608184814453, "global_step": 214718, "epoch": 2586} {"train_loss": -24.186813354492188, "global_step": 214719, "epoch": 2586} {"train_loss": -24.421818744705384, "global_step": 214720, "epoch": 2586, "val_loss": 6811285.5} {"train_loss": -22.866992950439453, "global_step": 214721, "epoch": 2587} {"train_loss": -21.303285598754883, "global_step": 214722, "epoch": 2587} {"train_loss": -23.381866455078125, "global_step": 214723, "epoch": 2587} {"train_loss": -23.473974227905273, "global_step": 214724, "epoch": 2587} {"train_loss": -23.193532943725586, "global_step": 214725, "epoch": 2587} {"train_loss": -23.848712921142578, "global_step": 214726, "epoch": 2587} {"train_loss": -23.824352264404297, "global_step": 214727, "epoch": 2587} {"train_loss": -23.877050399780273, "global_step": 214728, "epoch": 2587} {"train_loss": -23.87000274658203, "global_step": 214729, "epoch": 2587} {"train_loss": -23.957489013671875, "global_step": 214730, "epoch": 2587} {"train_loss": -23.7890625, "global_step": 214731, "epoch": 2587} {"train_loss": -23.98453712463379, "global_step": 214732, "epoch": 2587} {"train_loss": -24.057279586791992, "global_step": 214733, "epoch": 2587} {"train_loss": -23.880821228027344, "global_step": 214734, "epoch": 2587} {"train_loss": -23.828001022338867, "global_step": 214735, "epoch": 2587} {"train_loss": -24.195947647094727, "global_step": 214736, "epoch": 2587} {"train_loss": -23.914403915405273, "global_step": 214737, "epoch": 2587} {"train_loss": -24.4300537109375, "global_step": 214738, "epoch": 2587} {"train_loss": -24.006458282470703, "global_step": 214739, "epoch": 2587} {"train_loss": -23.70380401611328, "global_step": 214740, "epoch": 2587} {"train_loss": -24.26714515686035, "global_step": 214741, "epoch": 2587} {"train_loss": -24.152950286865234, "global_step": 214742, "epoch": 2587} {"train_loss": -24.27668571472168, "global_step": 214743, "epoch": 2587} {"train_loss": -24.145856857299805, "global_step": 214744, "epoch": 2587} {"train_loss": -24.59173011779785, "global_step": 214745, "epoch": 2587} {"train_loss": -23.987384796142578, "global_step": 214746, "epoch": 2587} {"train_loss": -24.0670166015625, "global_step": 214747, "epoch": 2587} {"train_loss": -24.65553092956543, "global_step": 214748, "epoch": 2587} {"train_loss": -23.976755142211914, "global_step": 214749, "epoch": 2587} {"train_loss": -24.23643684387207, "global_step": 214750, "epoch": 2587} {"train_loss": -24.438522338867188, "global_step": 214751, "epoch": 2587} {"train_loss": -24.276168823242188, "global_step": 214752, "epoch": 2587} {"train_loss": -24.477928161621094, "global_step": 214753, "epoch": 2587} {"train_loss": -24.054052352905273, "global_step": 214754, "epoch": 2587} {"train_loss": -24.20320701599121, "global_step": 214755, "epoch": 2587} {"train_loss": -24.649580001831055, "global_step": 214756, "epoch": 2587} {"train_loss": -24.68803596496582, "global_step": 214757, "epoch": 2587} {"train_loss": -24.42295265197754, "global_step": 214758, "epoch": 2587} {"train_loss": -24.66586685180664, "global_step": 214759, "epoch": 2587} {"train_loss": -24.477506637573242, "global_step": 214760, "epoch": 2587} {"train_loss": -24.722736358642578, "global_step": 214761, "epoch": 2587} {"train_loss": -24.191913604736328, "global_step": 214762, "epoch": 2587} {"train_loss": -24.84759521484375, "global_step": 214763, "epoch": 2587} {"train_loss": -24.33709716796875, "global_step": 214764, "epoch": 2587} {"train_loss": -24.531295776367188, "global_step": 214765, "epoch": 2587} {"train_loss": -24.23111343383789, "global_step": 214766, "epoch": 2587} {"train_loss": -24.640335083007812, "global_step": 214767, "epoch": 2587} {"train_loss": -24.790849685668945, "global_step": 214768, "epoch": 2587} {"train_loss": -24.4119815826416, "global_step": 214769, "epoch": 2587} {"train_loss": -24.409706115722656, "global_step": 214770, "epoch": 2587} {"train_loss": -24.3118839263916, "global_step": 214771, "epoch": 2587} {"train_loss": -24.52801513671875, "global_step": 214772, "epoch": 2587} {"train_loss": -24.57330894470215, "global_step": 214773, "epoch": 2587} {"train_loss": -24.8595027923584, "global_step": 214774, "epoch": 2587} {"train_loss": -24.796630859375, "global_step": 214775, "epoch": 2587} {"train_loss": -24.230897903442383, "global_step": 214776, "epoch": 2587} {"train_loss": -24.48346519470215, "global_step": 214777, "epoch": 2587} {"train_loss": -24.15961265563965, "global_step": 214778, "epoch": 2587} {"train_loss": -24.0922794342041, "global_step": 214779, "epoch": 2587} {"train_loss": -24.43494987487793, "global_step": 214780, "epoch": 2587} {"train_loss": -24.637725830078125, "global_step": 214781, "epoch": 2587} {"train_loss": -24.37788200378418, "global_step": 214782, "epoch": 2587} {"train_loss": -24.616243362426758, "global_step": 214783, "epoch": 2587} {"train_loss": -24.62489891052246, "global_step": 214784, "epoch": 2587} {"train_loss": -24.7666072845459, "global_step": 214785, "epoch": 2587} {"train_loss": -24.630666732788086, "global_step": 214786, "epoch": 2587} {"train_loss": -24.545366287231445, "global_step": 214787, "epoch": 2587} {"train_loss": -24.861867904663086, "global_step": 214788, "epoch": 2587} {"train_loss": -24.514995574951172, "global_step": 214789, "epoch": 2587} {"train_loss": -24.218372344970703, "global_step": 214790, "epoch": 2587} {"train_loss": -23.971420288085938, "global_step": 214791, "epoch": 2587} {"train_loss": -24.013580322265625, "global_step": 214792, "epoch": 2587} {"train_loss": -24.5810604095459, "global_step": 214793, "epoch": 2587} {"train_loss": -24.245939254760742, "global_step": 214794, "epoch": 2587} {"train_loss": -24.149017333984375, "global_step": 214795, "epoch": 2587} {"train_loss": -24.144742965698242, "global_step": 214796, "epoch": 2587} {"train_loss": -24.379528045654297, "global_step": 214797, "epoch": 2587} {"train_loss": -24.28569984436035, "global_step": 214798, "epoch": 2587} {"train_loss": -24.32008934020996, "global_step": 214799, "epoch": 2587} {"train_loss": -24.56903076171875, "global_step": 214800, "epoch": 2587} {"train_loss": -24.4542236328125, "global_step": 214801, "epoch": 2587} {"train_loss": -24.42433738708496, "global_step": 214802, "epoch": 2587} {"train_loss": -24.235464371830584, "global_step": 214803, "epoch": 2587, "val_loss": 6578536.0} {"train_loss": -23.502073287963867, "global_step": 214804, "epoch": 2588} {"train_loss": -23.28329086303711, "global_step": 214805, "epoch": 2588} {"train_loss": -23.593948364257812, "global_step": 214806, "epoch": 2588} {"train_loss": -23.573942184448242, "global_step": 214807, "epoch": 2588} {"train_loss": -23.737302780151367, "global_step": 214808, "epoch": 2588} {"train_loss": -23.91374969482422, "global_step": 214809, "epoch": 2588} {"train_loss": -23.705350875854492, "global_step": 214810, "epoch": 2588} {"train_loss": -23.85286521911621, "global_step": 214811, "epoch": 2588} {"train_loss": -23.962596893310547, "global_step": 214812, "epoch": 2588} {"train_loss": -23.638702392578125, "global_step": 214813, "epoch": 2588} {"train_loss": -24.289457321166992, "global_step": 214814, "epoch": 2588} {"train_loss": -24.036413192749023, "global_step": 214815, "epoch": 2588} {"train_loss": -24.211322784423828, "global_step": 214816, "epoch": 2588} {"train_loss": -24.388593673706055, "global_step": 214817, "epoch": 2588} {"train_loss": -24.009706497192383, "global_step": 214818, "epoch": 2588} {"train_loss": -24.575000762939453, "global_step": 214819, "epoch": 2588} {"train_loss": -24.745092391967773, "global_step": 214820, "epoch": 2588} {"train_loss": -24.018131256103516, "global_step": 214821, "epoch": 2588} {"train_loss": -24.10921287536621, "global_step": 214822, "epoch": 2588} {"train_loss": -24.450531005859375, "global_step": 214823, "epoch": 2588} {"train_loss": -24.29155731201172, "global_step": 214824, "epoch": 2588} {"train_loss": -24.673521041870117, "global_step": 214825, "epoch": 2588} {"train_loss": -24.34455680847168, "global_step": 214826, "epoch": 2588} {"train_loss": -24.513797760009766, "global_step": 214827, "epoch": 2588} {"train_loss": -24.613550186157227, "global_step": 214828, "epoch": 2588} {"train_loss": -24.39727020263672, "global_step": 214829, "epoch": 2588} {"train_loss": -24.11713218688965, "global_step": 214830, "epoch": 2588} {"train_loss": -24.65872573852539, "global_step": 214831, "epoch": 2588} {"train_loss": -24.20185661315918, "global_step": 214832, "epoch": 2588} {"train_loss": -24.953596115112305, "global_step": 214833, "epoch": 2588} {"train_loss": -24.09056854248047, "global_step": 214834, "epoch": 2588} {"train_loss": -24.86359405517578, "global_step": 214835, "epoch": 2588} {"train_loss": -24.75028419494629, "global_step": 214836, "epoch": 2588} {"train_loss": -24.264808654785156, "global_step": 214837, "epoch": 2588} {"train_loss": -24.41757583618164, "global_step": 214838, "epoch": 2588} {"train_loss": -24.98563003540039, "global_step": 214839, "epoch": 2588} {"train_loss": -24.64127540588379, "global_step": 214840, "epoch": 2588} {"train_loss": -24.864200592041016, "global_step": 214841, "epoch": 2588} {"train_loss": -25.020526885986328, "global_step": 214842, "epoch": 2588} {"train_loss": -24.688879013061523, "global_step": 214843, "epoch": 2588} {"train_loss": -24.50493049621582, "global_step": 214844, "epoch": 2588} {"train_loss": -24.719636917114258, "global_step": 214845, "epoch": 2588} {"train_loss": -24.478395462036133, "global_step": 214846, "epoch": 2588} {"train_loss": -24.332082748413086, "global_step": 214847, "epoch": 2588} {"train_loss": -24.435161590576172, "global_step": 214848, "epoch": 2588} {"train_loss": -24.591785430908203, "global_step": 214849, "epoch": 2588} {"train_loss": -24.80867576599121, "global_step": 214850, "epoch": 2588} {"train_loss": -24.273948669433594, "global_step": 214851, "epoch": 2588} {"train_loss": -24.265613555908203, "global_step": 214852, "epoch": 2588} {"train_loss": -24.310400009155273, "global_step": 214853, "epoch": 2588} {"train_loss": -24.693090438842773, "global_step": 214854, "epoch": 2588} {"train_loss": -24.33444595336914, "global_step": 214855, "epoch": 2588} {"train_loss": -24.493879318237305, "global_step": 214856, "epoch": 2588} {"train_loss": -24.678882598876953, "global_step": 214857, "epoch": 2588} {"train_loss": -24.35860252380371, "global_step": 214858, "epoch": 2588} {"train_loss": -24.095924377441406, "global_step": 214859, "epoch": 2588} {"train_loss": -24.3494930267334, "global_step": 214860, "epoch": 2588} {"train_loss": -24.302471160888672, "global_step": 214861, "epoch": 2588} {"train_loss": -24.397184371948242, "global_step": 214862, "epoch": 2588} {"train_loss": -24.700546264648438, "global_step": 214863, "epoch": 2588} {"train_loss": -24.020116806030273, "global_step": 214864, "epoch": 2588} {"train_loss": -24.521177291870117, "global_step": 214865, "epoch": 2588} {"train_loss": -24.251556396484375, "global_step": 214866, "epoch": 2588} {"train_loss": -24.31148910522461, "global_step": 214867, "epoch": 2588} {"train_loss": -24.5, "global_step": 214868, "epoch": 2588} {"train_loss": -24.819061279296875, "global_step": 214869, "epoch": 2588} {"train_loss": -24.548311233520508, "global_step": 214870, "epoch": 2588} {"train_loss": -24.54663848876953, "global_step": 214871, "epoch": 2588} {"train_loss": -24.409563064575195, "global_step": 214872, "epoch": 2588} {"train_loss": -24.67766761779785, "global_step": 214873, "epoch": 2588} {"train_loss": -24.574304580688477, "global_step": 214874, "epoch": 2588} {"train_loss": -24.59212875366211, "global_step": 214875, "epoch": 2588} {"train_loss": -24.72840690612793, "global_step": 214876, "epoch": 2588} {"train_loss": -24.853384017944336, "global_step": 214877, "epoch": 2588} {"train_loss": -24.63508415222168, "global_step": 214878, "epoch": 2588} {"train_loss": -24.718542098999023, "global_step": 214879, "epoch": 2588} {"train_loss": -24.8535213470459, "global_step": 214880, "epoch": 2588} {"train_loss": -24.45443344116211, "global_step": 214881, "epoch": 2588} {"train_loss": -24.723642349243164, "global_step": 214882, "epoch": 2588} {"train_loss": -24.555845260620117, "global_step": 214883, "epoch": 2588} {"train_loss": -24.51129150390625, "global_step": 214884, "epoch": 2588} {"train_loss": -24.710084915161133, "global_step": 214885, "epoch": 2588} {"train_loss": -24.388148503131177, "global_step": 214886, "epoch": 2588, "val_loss": 6579211.0} {"train_loss": -23.969444274902344, "global_step": 214887, "epoch": 2589} {"train_loss": -24.35882568359375, "global_step": 214888, "epoch": 2589} {"train_loss": -24.643789291381836, "global_step": 214889, "epoch": 2589} {"train_loss": -23.887861251831055, "global_step": 214890, "epoch": 2589} {"train_loss": -24.4061222076416, "global_step": 214891, "epoch": 2589} {"train_loss": -23.61253547668457, "global_step": 214892, "epoch": 2589} {"train_loss": -23.97572135925293, "global_step": 214893, "epoch": 2589} {"train_loss": -23.96949577331543, "global_step": 214894, "epoch": 2589} {"train_loss": -24.768362045288086, "global_step": 214895, "epoch": 2589} {"train_loss": -24.5152587890625, "global_step": 214896, "epoch": 2589} {"train_loss": -23.778860092163086, "global_step": 214897, "epoch": 2589} {"train_loss": -24.613861083984375, "global_step": 214898, "epoch": 2589} {"train_loss": -24.281463623046875, "global_step": 214899, "epoch": 2589} {"train_loss": -24.147565841674805, "global_step": 214900, "epoch": 2589} {"train_loss": -24.44711685180664, "global_step": 214901, "epoch": 2589} {"train_loss": -24.38125991821289, "global_step": 214902, "epoch": 2589} {"train_loss": -24.143266677856445, "global_step": 214903, "epoch": 2589} {"train_loss": -24.603662490844727, "global_step": 214904, "epoch": 2589} {"train_loss": -24.23905372619629, "global_step": 214905, "epoch": 2589} {"train_loss": -24.533681869506836, "global_step": 214906, "epoch": 2589} {"train_loss": -23.886005401611328, "global_step": 214907, "epoch": 2589} {"train_loss": -23.970388412475586, "global_step": 214908, "epoch": 2589} {"train_loss": -24.35885238647461, "global_step": 214909, "epoch": 2589} {"train_loss": -24.365753173828125, "global_step": 214910, "epoch": 2589} {"train_loss": -24.483617782592773, "global_step": 214911, "epoch": 2589} {"train_loss": -24.417631149291992, "global_step": 214912, "epoch": 2589} {"train_loss": -24.495391845703125, "global_step": 214913, "epoch": 2589} {"train_loss": -25.09095573425293, "global_step": 214914, "epoch": 2589} {"train_loss": -24.225936889648438, "global_step": 214915, "epoch": 2589} {"train_loss": -24.037519454956055, "global_step": 214916, "epoch": 2589} {"train_loss": -24.544607162475586, "global_step": 214917, "epoch": 2589} {"train_loss": -24.595903396606445, "global_step": 214918, "epoch": 2589} {"train_loss": -24.429555892944336, "global_step": 214919, "epoch": 2589} {"train_loss": -24.324949264526367, "global_step": 214920, "epoch": 2589} {"train_loss": -24.17885398864746, "global_step": 214921, "epoch": 2589} {"train_loss": -24.525259017944336, "global_step": 214922, "epoch": 2589} {"train_loss": -24.533130645751953, "global_step": 214923, "epoch": 2589} {"train_loss": -24.53900909423828, "global_step": 214924, "epoch": 2589} {"train_loss": -24.305320739746094, "global_step": 214925, "epoch": 2589} {"train_loss": -24.559885025024414, "global_step": 214926, "epoch": 2589} {"train_loss": -24.190092086791992, "global_step": 214927, "epoch": 2589} {"train_loss": -24.6800594329834, "global_step": 214928, "epoch": 2589} {"train_loss": -24.81753921508789, "global_step": 214929, "epoch": 2589} {"train_loss": -24.641864776611328, "global_step": 214930, "epoch": 2589} {"train_loss": -24.54229164123535, "global_step": 214931, "epoch": 2589} {"train_loss": -24.4954833984375, "global_step": 214932, "epoch": 2589} {"train_loss": -24.66357421875, "global_step": 214933, "epoch": 2589} {"train_loss": -24.562469482421875, "global_step": 214934, "epoch": 2589} {"train_loss": -24.411331176757812, "global_step": 214935, "epoch": 2589} {"train_loss": -24.53298568725586, "global_step": 214936, "epoch": 2589} {"train_loss": -24.611520767211914, "global_step": 214937, "epoch": 2589} {"train_loss": -24.3206787109375, "global_step": 214938, "epoch": 2589} {"train_loss": -24.713943481445312, "global_step": 214939, "epoch": 2589} {"train_loss": -24.904369354248047, "global_step": 214940, "epoch": 2589} {"train_loss": -24.763153076171875, "global_step": 214941, "epoch": 2589} {"train_loss": -24.527036666870117, "global_step": 214942, "epoch": 2589} {"train_loss": -24.608062744140625, "global_step": 214943, "epoch": 2589} {"train_loss": -24.31123161315918, "global_step": 214944, "epoch": 2589} {"train_loss": -24.56397819519043, "global_step": 214945, "epoch": 2589} {"train_loss": -24.78602409362793, "global_step": 214946, "epoch": 2589} {"train_loss": -24.408933639526367, "global_step": 214947, "epoch": 2589} {"train_loss": -24.776630401611328, "global_step": 214948, "epoch": 2589} {"train_loss": -24.386022567749023, "global_step": 214949, "epoch": 2589} {"train_loss": -24.267242431640625, "global_step": 214950, "epoch": 2589} {"train_loss": -24.317398071289062, "global_step": 214951, "epoch": 2589} {"train_loss": -23.41537857055664, "global_step": 214952, "epoch": 2589} {"train_loss": -24.3356876373291, "global_step": 214953, "epoch": 2589} {"train_loss": -24.398035049438477, "global_step": 214954, "epoch": 2589} {"train_loss": -24.515546798706055, "global_step": 214955, "epoch": 2589} {"train_loss": -24.058874130249023, "global_step": 214956, "epoch": 2589} {"train_loss": -24.511863708496094, "global_step": 214957, "epoch": 2589} {"train_loss": -24.496484756469727, "global_step": 214958, "epoch": 2589} {"train_loss": -24.145212173461914, "global_step": 214959, "epoch": 2589} {"train_loss": -24.452396392822266, "global_step": 214960, "epoch": 2589} {"train_loss": -24.23360252380371, "global_step": 214961, "epoch": 2589} {"train_loss": -24.464052200317383, "global_step": 214962, "epoch": 2589} {"train_loss": -24.33915138244629, "global_step": 214963, "epoch": 2589} {"train_loss": -24.12615394592285, "global_step": 214964, "epoch": 2589} {"train_loss": -24.702035903930664, "global_step": 214965, "epoch": 2589} {"train_loss": -24.709495544433594, "global_step": 214966, "epoch": 2589} {"train_loss": -24.44256019592285, "global_step": 214967, "epoch": 2589} {"train_loss": -24.45291519165039, "global_step": 214968, "epoch": 2589} {"train_loss": -24.39754421739693, "global_step": 214969, "epoch": 2589, "val_loss": 6618956.0} {"train_loss": -24.184804916381836, "global_step": 214970, "epoch": 2590} {"train_loss": -24.199222564697266, "global_step": 214971, "epoch": 2590} {"train_loss": -24.345680236816406, "global_step": 214972, "epoch": 2590} {"train_loss": -24.103918075561523, "global_step": 214973, "epoch": 2590} {"train_loss": -24.14840316772461, "global_step": 214974, "epoch": 2590} {"train_loss": -24.200790405273438, "global_step": 214975, "epoch": 2590} {"train_loss": -24.578372955322266, "global_step": 214976, "epoch": 2590} {"train_loss": -24.16202163696289, "global_step": 214977, "epoch": 2590} {"train_loss": -24.340396881103516, "global_step": 214978, "epoch": 2590} {"train_loss": -24.269254684448242, "global_step": 214979, "epoch": 2590} {"train_loss": -24.321210861206055, "global_step": 214980, "epoch": 2590} {"train_loss": -24.187957763671875, "global_step": 214981, "epoch": 2590} {"train_loss": -24.473365783691406, "global_step": 214982, "epoch": 2590} {"train_loss": -24.046255111694336, "global_step": 214983, "epoch": 2590} {"train_loss": -24.0642147064209, "global_step": 214984, "epoch": 2590} {"train_loss": -24.494274139404297, "global_step": 214985, "epoch": 2590} {"train_loss": -24.16126823425293, "global_step": 214986, "epoch": 2590} {"train_loss": -24.24649429321289, "global_step": 214987, "epoch": 2590} {"train_loss": -24.199655532836914, "global_step": 214988, "epoch": 2590} {"train_loss": -24.04500961303711, "global_step": 214989, "epoch": 2590} {"train_loss": -24.423898696899414, "global_step": 214990, "epoch": 2590} {"train_loss": -24.653776168823242, "global_step": 214991, "epoch": 2590} {"train_loss": -24.733383178710938, "global_step": 214992, "epoch": 2590} {"train_loss": -24.21458625793457, "global_step": 214993, "epoch": 2590} {"train_loss": -24.144699096679688, "global_step": 214994, "epoch": 2590} {"train_loss": -23.968826293945312, "global_step": 214995, "epoch": 2590} {"train_loss": -24.235149383544922, "global_step": 214996, "epoch": 2590} {"train_loss": -24.614194869995117, "global_step": 214997, "epoch": 2590} {"train_loss": -24.335784912109375, "global_step": 214998, "epoch": 2590} {"train_loss": -24.391326904296875, "global_step": 214999, "epoch": 2590} {"train_loss": -24.14936637878418, "global_step": 215000, "epoch": 2590} {"train_loss": -24.5885066986084, "global_step": 215001, "epoch": 2590} {"train_loss": -24.418350219726562, "global_step": 215002, "epoch": 2590} {"train_loss": -24.769657135009766, "global_step": 215003, "epoch": 2590} {"train_loss": -24.382080078125, "global_step": 215004, "epoch": 2590} {"train_loss": -24.751413345336914, "global_step": 215005, "epoch": 2590} {"train_loss": -24.274295806884766, "global_step": 215006, "epoch": 2590} {"train_loss": -25.009254455566406, "global_step": 215007, "epoch": 2590} {"train_loss": -24.458024978637695, "global_step": 215008, "epoch": 2590} {"train_loss": -24.87998390197754, "global_step": 215009, "epoch": 2590} {"train_loss": -24.4981632232666, "global_step": 215010, "epoch": 2590} {"train_loss": -25.010984420776367, "global_step": 215011, "epoch": 2590} {"train_loss": -24.658109664916992, "global_step": 215012, "epoch": 2590} {"train_loss": -24.5902156829834, "global_step": 215013, "epoch": 2590} {"train_loss": -24.55843734741211, "global_step": 215014, "epoch": 2590} {"train_loss": -24.049827575683594, "global_step": 215015, "epoch": 2590} {"train_loss": -24.818557739257812, "global_step": 215016, "epoch": 2590} {"train_loss": -24.291555404663086, "global_step": 215017, "epoch": 2590} {"train_loss": -24.487363815307617, "global_step": 215018, "epoch": 2590} {"train_loss": -24.57131576538086, "global_step": 215019, "epoch": 2590} {"train_loss": -24.8048095703125, "global_step": 215020, "epoch": 2590} {"train_loss": -24.962186813354492, "global_step": 215021, "epoch": 2590} {"train_loss": -24.383726119995117, "global_step": 215022, "epoch": 2590} {"train_loss": -24.583023071289062, "global_step": 215023, "epoch": 2590} {"train_loss": -24.4644718170166, "global_step": 215024, "epoch": 2590} {"train_loss": -25.030012130737305, "global_step": 215025, "epoch": 2590} {"train_loss": -24.61342430114746, "global_step": 215026, "epoch": 2590} {"train_loss": -24.522687911987305, "global_step": 215027, "epoch": 2590} {"train_loss": -24.53662109375, "global_step": 215028, "epoch": 2590} {"train_loss": -24.87956428527832, "global_step": 215029, "epoch": 2590} {"train_loss": -24.309553146362305, "global_step": 215030, "epoch": 2590} {"train_loss": -24.43984031677246, "global_step": 215031, "epoch": 2590} {"train_loss": -24.378005981445312, "global_step": 215032, "epoch": 2590} {"train_loss": -24.714027404785156, "global_step": 215033, "epoch": 2590} {"train_loss": -24.330902099609375, "global_step": 215034, "epoch": 2590} {"train_loss": -24.35269546508789, "global_step": 215035, "epoch": 2590} {"train_loss": -24.147403717041016, "global_step": 215036, "epoch": 2590} {"train_loss": -24.36028480529785, "global_step": 215037, "epoch": 2590} {"train_loss": -24.40085792541504, "global_step": 215038, "epoch": 2590} {"train_loss": -24.346698760986328, "global_step": 215039, "epoch": 2590} {"train_loss": -24.532821655273438, "global_step": 215040, "epoch": 2590} {"train_loss": -24.575220108032227, "global_step": 215041, "epoch": 2590} {"train_loss": -24.252607345581055, "global_step": 215042, "epoch": 2590} {"train_loss": -24.250150680541992, "global_step": 215043, "epoch": 2590} {"train_loss": -24.572385787963867, "global_step": 215044, "epoch": 2590} {"train_loss": -24.37544822692871, "global_step": 215045, "epoch": 2590} {"train_loss": -24.273666381835938, "global_step": 215046, "epoch": 2590} {"train_loss": -24.576675415039062, "global_step": 215047, "epoch": 2590} {"train_loss": -24.202041625976562, "global_step": 215048, "epoch": 2590} {"train_loss": -24.61922264099121, "global_step": 215049, "epoch": 2590} {"train_loss": -24.4461727142334, "global_step": 215050, "epoch": 2590} {"train_loss": -24.57679557800293, "global_step": 215051, "epoch": 2590} {"train_loss": -24.429892689348705, "global_step": 215052, "epoch": 2590, "val_loss": 6818319.0} {"train_loss": -24.02571678161621, "global_step": 215053, "epoch": 2591} {"train_loss": -24.2171573638916, "global_step": 215054, "epoch": 2591} {"train_loss": -23.5294246673584, "global_step": 215055, "epoch": 2591} {"train_loss": -23.63834571838379, "global_step": 215056, "epoch": 2591} {"train_loss": -23.685436248779297, "global_step": 215057, "epoch": 2591} {"train_loss": -23.981063842773438, "global_step": 215058, "epoch": 2591} {"train_loss": -23.7156982421875, "global_step": 215059, "epoch": 2591} {"train_loss": -24.185651779174805, "global_step": 215060, "epoch": 2591} {"train_loss": -23.667438507080078, "global_step": 215061, "epoch": 2591} {"train_loss": -23.963857650756836, "global_step": 215062, "epoch": 2591} {"train_loss": -24.042015075683594, "global_step": 215063, "epoch": 2591} {"train_loss": -24.453174591064453, "global_step": 215064, "epoch": 2591} {"train_loss": -24.264612197875977, "global_step": 215065, "epoch": 2591} {"train_loss": -24.12420654296875, "global_step": 215066, "epoch": 2591} {"train_loss": -24.329673767089844, "global_step": 215067, "epoch": 2591} {"train_loss": -23.914907455444336, "global_step": 215068, "epoch": 2591} {"train_loss": -24.3759822845459, "global_step": 215069, "epoch": 2591} {"train_loss": -24.312347412109375, "global_step": 215070, "epoch": 2591} {"train_loss": -24.58970069885254, "global_step": 215071, "epoch": 2591} {"train_loss": -24.66786766052246, "global_step": 215072, "epoch": 2591} {"train_loss": -24.1755313873291, "global_step": 215073, "epoch": 2591} {"train_loss": -24.233280181884766, "global_step": 215074, "epoch": 2591} {"train_loss": -24.569297790527344, "global_step": 215075, "epoch": 2591} {"train_loss": -24.246109008789062, "global_step": 215076, "epoch": 2591} {"train_loss": -23.836166381835938, "global_step": 215077, "epoch": 2591} {"train_loss": -24.709341049194336, "global_step": 215078, "epoch": 2591} {"train_loss": -24.5871639251709, "global_step": 215079, "epoch": 2591} {"train_loss": -24.40972328186035, "global_step": 215080, "epoch": 2591} {"train_loss": -24.658140182495117, "global_step": 215081, "epoch": 2591} {"train_loss": -24.345794677734375, "global_step": 215082, "epoch": 2591} {"train_loss": -24.645742416381836, "global_step": 215083, "epoch": 2591} {"train_loss": -24.606943130493164, "global_step": 215084, "epoch": 2591} {"train_loss": -24.173133850097656, "global_step": 215085, "epoch": 2591} {"train_loss": -24.8709774017334, "global_step": 215086, "epoch": 2591} {"train_loss": -24.38489532470703, "global_step": 215087, "epoch": 2591} {"train_loss": -24.870676040649414, "global_step": 215088, "epoch": 2591} {"train_loss": -24.572595596313477, "global_step": 215089, "epoch": 2591} {"train_loss": -24.571447372436523, "global_step": 215090, "epoch": 2591} {"train_loss": -24.470273971557617, "global_step": 215091, "epoch": 2591} {"train_loss": -24.653656005859375, "global_step": 215092, "epoch": 2591} {"train_loss": -24.493131637573242, "global_step": 215093, "epoch": 2591} {"train_loss": -24.643014907836914, "global_step": 215094, "epoch": 2591} {"train_loss": -24.94798469543457, "global_step": 215095, "epoch": 2591} {"train_loss": -24.5871524810791, "global_step": 215096, "epoch": 2591} {"train_loss": -24.286243438720703, "global_step": 215097, "epoch": 2591} {"train_loss": -24.58148193359375, "global_step": 215098, "epoch": 2591} {"train_loss": -24.854816436767578, "global_step": 215099, "epoch": 2591} {"train_loss": -24.31507682800293, "global_step": 215100, "epoch": 2591} {"train_loss": -24.84154510498047, "global_step": 215101, "epoch": 2591} {"train_loss": -24.032285690307617, "global_step": 215102, "epoch": 2591} {"train_loss": -24.197208404541016, "global_step": 215103, "epoch": 2591} {"train_loss": -24.315515518188477, "global_step": 215104, "epoch": 2591} {"train_loss": -24.56850242614746, "global_step": 215105, "epoch": 2591} {"train_loss": -24.157527923583984, "global_step": 215106, "epoch": 2591} {"train_loss": -24.432920455932617, "global_step": 215107, "epoch": 2591} {"train_loss": -24.299436569213867, "global_step": 215108, "epoch": 2591} {"train_loss": -24.196983337402344, "global_step": 215109, "epoch": 2591} {"train_loss": -24.014179229736328, "global_step": 215110, "epoch": 2591} {"train_loss": -24.383329391479492, "global_step": 215111, "epoch": 2591} {"train_loss": -24.500391006469727, "global_step": 215112, "epoch": 2591} {"train_loss": -24.135345458984375, "global_step": 215113, "epoch": 2591} {"train_loss": -24.460834503173828, "global_step": 215114, "epoch": 2591} {"train_loss": -24.67304039001465, "global_step": 215115, "epoch": 2591} {"train_loss": -24.595746994018555, "global_step": 215116, "epoch": 2591} {"train_loss": -24.408153533935547, "global_step": 215117, "epoch": 2591} {"train_loss": -24.29463768005371, "global_step": 215118, "epoch": 2591} {"train_loss": -24.10923957824707, "global_step": 215119, "epoch": 2591} {"train_loss": -24.289325714111328, "global_step": 215120, "epoch": 2591} {"train_loss": -24.504684448242188, "global_step": 215121, "epoch": 2591} {"train_loss": -24.84868812561035, "global_step": 215122, "epoch": 2591} {"train_loss": -24.450185775756836, "global_step": 215123, "epoch": 2591} {"train_loss": -24.732654571533203, "global_step": 215124, "epoch": 2591} {"train_loss": -24.436857223510742, "global_step": 215125, "epoch": 2591} {"train_loss": -24.634000778198242, "global_step": 215126, "epoch": 2591} {"train_loss": -24.56606101989746, "global_step": 215127, "epoch": 2591} {"train_loss": -24.735021591186523, "global_step": 215128, "epoch": 2591} {"train_loss": -24.27747917175293, "global_step": 215129, "epoch": 2591} {"train_loss": -24.389816284179688, "global_step": 215130, "epoch": 2591} {"train_loss": -24.63055992126465, "global_step": 215131, "epoch": 2591} {"train_loss": -24.527210235595703, "global_step": 215132, "epoch": 2591} {"train_loss": -24.743154525756836, "global_step": 215133, "epoch": 2591} {"train_loss": -24.699697494506836, "global_step": 215134, "epoch": 2591} {"train_loss": -24.396755172545653, "global_step": 215135, "epoch": 2591, "val_loss": 6516043.0} {"train_loss": -23.86880111694336, "global_step": 215136, "epoch": 2592} {"train_loss": -24.110519409179688, "global_step": 215137, "epoch": 2592} {"train_loss": -23.9013671875, "global_step": 215138, "epoch": 2592} {"train_loss": -24.327741622924805, "global_step": 215139, "epoch": 2592} {"train_loss": -23.96522331237793, "global_step": 215140, "epoch": 2592} {"train_loss": -24.105390548706055, "global_step": 215141, "epoch": 2592} {"train_loss": -24.06807518005371, "global_step": 215142, "epoch": 2592} {"train_loss": -24.044843673706055, "global_step": 215143, "epoch": 2592} {"train_loss": -23.981393814086914, "global_step": 215144, "epoch": 2592} {"train_loss": -24.020963668823242, "global_step": 215145, "epoch": 2592} {"train_loss": -24.218997955322266, "global_step": 215146, "epoch": 2592} {"train_loss": -24.15949821472168, "global_step": 215147, "epoch": 2592} {"train_loss": -23.860246658325195, "global_step": 215148, "epoch": 2592} {"train_loss": -24.327194213867188, "global_step": 215149, "epoch": 2592} {"train_loss": -24.728853225708008, "global_step": 215150, "epoch": 2592} {"train_loss": -24.334814071655273, "global_step": 215151, "epoch": 2592} {"train_loss": -24.264135360717773, "global_step": 215152, "epoch": 2592} {"train_loss": -24.556257247924805, "global_step": 215153, "epoch": 2592} {"train_loss": -24.757749557495117, "global_step": 215154, "epoch": 2592} {"train_loss": -24.462448120117188, "global_step": 215155, "epoch": 2592} {"train_loss": -24.35065269470215, "global_step": 215156, "epoch": 2592} {"train_loss": -24.627378463745117, "global_step": 215157, "epoch": 2592} {"train_loss": -24.466684341430664, "global_step": 215158, "epoch": 2592} {"train_loss": -24.393217086791992, "global_step": 215159, "epoch": 2592} {"train_loss": -24.49715232849121, "global_step": 215160, "epoch": 2592} {"train_loss": -24.309009552001953, "global_step": 215161, "epoch": 2592} {"train_loss": -24.42951774597168, "global_step": 215162, "epoch": 2592} {"train_loss": -24.590560913085938, "global_step": 215163, "epoch": 2592} {"train_loss": -24.53859519958496, "global_step": 215164, "epoch": 2592} {"train_loss": -24.750577926635742, "global_step": 215165, "epoch": 2592} {"train_loss": -24.852510452270508, "global_step": 215166, "epoch": 2592} {"train_loss": -24.512815475463867, "global_step": 215167, "epoch": 2592} {"train_loss": -24.62000846862793, "global_step": 215168, "epoch": 2592} {"train_loss": -24.618812561035156, "global_step": 215169, "epoch": 2592} {"train_loss": -24.56220054626465, "global_step": 215170, "epoch": 2592} {"train_loss": -24.175046920776367, "global_step": 215171, "epoch": 2592} {"train_loss": -24.686880111694336, "global_step": 215172, "epoch": 2592} {"train_loss": -24.820514678955078, "global_step": 215173, "epoch": 2592} {"train_loss": -24.837717056274414, "global_step": 215174, "epoch": 2592} {"train_loss": -24.0969295501709, "global_step": 215175, "epoch": 2592} {"train_loss": -24.579069137573242, "global_step": 215176, "epoch": 2592} {"train_loss": -24.64987564086914, "global_step": 215177, "epoch": 2592} {"train_loss": -23.74186134338379, "global_step": 215178, "epoch": 2592} {"train_loss": -24.177762985229492, "global_step": 215179, "epoch": 2592} {"train_loss": -24.481473922729492, "global_step": 215180, "epoch": 2592} {"train_loss": -23.86414909362793, "global_step": 215181, "epoch": 2592} {"train_loss": -24.507516860961914, "global_step": 215182, "epoch": 2592} {"train_loss": -24.32322120666504, "global_step": 215183, "epoch": 2592} {"train_loss": -24.246984481811523, "global_step": 215184, "epoch": 2592} {"train_loss": -23.88042640686035, "global_step": 215185, "epoch": 2592} {"train_loss": -24.514467239379883, "global_step": 215186, "epoch": 2592} {"train_loss": -24.560434341430664, "global_step": 215187, "epoch": 2592} {"train_loss": -23.973865509033203, "global_step": 215188, "epoch": 2592} {"train_loss": -24.336994171142578, "global_step": 215189, "epoch": 2592} {"train_loss": -24.323957443237305, "global_step": 215190, "epoch": 2592} {"train_loss": -24.4309139251709, "global_step": 215191, "epoch": 2592} {"train_loss": -24.565881729125977, "global_step": 215192, "epoch": 2592} {"train_loss": -24.599475860595703, "global_step": 215193, "epoch": 2592} {"train_loss": -24.254810333251953, "global_step": 215194, "epoch": 2592} {"train_loss": -24.177335739135742, "global_step": 215195, "epoch": 2592} {"train_loss": -24.4085750579834, "global_step": 215196, "epoch": 2592} {"train_loss": -24.261213302612305, "global_step": 215197, "epoch": 2592} {"train_loss": -24.832012176513672, "global_step": 215198, "epoch": 2592} {"train_loss": -24.23160171508789, "global_step": 215199, "epoch": 2592} {"train_loss": -24.334585189819336, "global_step": 215200, "epoch": 2592} {"train_loss": -24.75211524963379, "global_step": 215201, "epoch": 2592} {"train_loss": -24.658823013305664, "global_step": 215202, "epoch": 2592} {"train_loss": -24.08525848388672, "global_step": 215203, "epoch": 2592} {"train_loss": -24.734619140625, "global_step": 215204, "epoch": 2592} {"train_loss": -24.569528579711914, "global_step": 215205, "epoch": 2592} {"train_loss": -24.389816284179688, "global_step": 215206, "epoch": 2592} {"train_loss": -24.53803062438965, "global_step": 215207, "epoch": 2592} {"train_loss": -24.367422103881836, "global_step": 215208, "epoch": 2592} {"train_loss": -24.49916648864746, "global_step": 215209, "epoch": 2592} {"train_loss": -24.321765899658203, "global_step": 215210, "epoch": 2592} {"train_loss": -24.473684310913086, "global_step": 215211, "epoch": 2592} {"train_loss": -24.853254318237305, "global_step": 215212, "epoch": 2592} {"train_loss": -24.5599422454834, "global_step": 215213, "epoch": 2592} {"train_loss": -24.503334045410156, "global_step": 215214, "epoch": 2592} {"train_loss": -24.512548446655273, "global_step": 215215, "epoch": 2592} {"train_loss": -24.272876739501953, "global_step": 215216, "epoch": 2592} {"train_loss": -24.541311264038086, "global_step": 215217, "epoch": 2592} {"train_loss": -24.380689575011473, "global_step": 215218, "epoch": 2592, "val_loss": 6844677.0} {"train_loss": -24.333105087280273, "global_step": 215219, "epoch": 2593} {"train_loss": -23.750991821289062, "global_step": 215220, "epoch": 2593} {"train_loss": -24.299545288085938, "global_step": 215221, "epoch": 2593} {"train_loss": -24.185827255249023, "global_step": 215222, "epoch": 2593} {"train_loss": -24.66893768310547, "global_step": 215223, "epoch": 2593} {"train_loss": -24.158811569213867, "global_step": 215224, "epoch": 2593} {"train_loss": -24.627286911010742, "global_step": 215225, "epoch": 2593} {"train_loss": -24.254413604736328, "global_step": 215226, "epoch": 2593} {"train_loss": -24.713119506835938, "global_step": 215227, "epoch": 2593} {"train_loss": -24.460309982299805, "global_step": 215228, "epoch": 2593} {"train_loss": -24.291715621948242, "global_step": 215229, "epoch": 2593} {"train_loss": -24.51066780090332, "global_step": 215230, "epoch": 2593} {"train_loss": -24.25993537902832, "global_step": 215231, "epoch": 2593} {"train_loss": -24.5429630279541, "global_step": 215232, "epoch": 2593} {"train_loss": -24.63420867919922, "global_step": 215233, "epoch": 2593} {"train_loss": -24.34527587890625, "global_step": 215234, "epoch": 2593} {"train_loss": -24.51607322692871, "global_step": 215235, "epoch": 2593} {"train_loss": -23.964126586914062, "global_step": 215236, "epoch": 2593} {"train_loss": -24.570755004882812, "global_step": 215237, "epoch": 2593} {"train_loss": -24.49671745300293, "global_step": 215238, "epoch": 2593} {"train_loss": -24.74765968322754, "global_step": 215239, "epoch": 2593} {"train_loss": -24.398828506469727, "global_step": 215240, "epoch": 2593} {"train_loss": -24.66673469543457, "global_step": 215241, "epoch": 2593} {"train_loss": -24.08466148376465, "global_step": 215242, "epoch": 2593} {"train_loss": -24.610929489135742, "global_step": 215243, "epoch": 2593} {"train_loss": -24.4876766204834, "global_step": 215244, "epoch": 2593} {"train_loss": -24.26862907409668, "global_step": 215245, "epoch": 2593} {"train_loss": -24.551054000854492, "global_step": 215246, "epoch": 2593} {"train_loss": -24.316938400268555, "global_step": 215247, "epoch": 2593} {"train_loss": -24.839181900024414, "global_step": 215248, "epoch": 2593} {"train_loss": -24.449676513671875, "global_step": 215249, "epoch": 2593} {"train_loss": -24.8697452545166, "global_step": 215250, "epoch": 2593} {"train_loss": -24.683683395385742, "global_step": 215251, "epoch": 2593} {"train_loss": -24.385135650634766, "global_step": 215252, "epoch": 2593} {"train_loss": -24.474411010742188, "global_step": 215253, "epoch": 2593} {"train_loss": -24.255260467529297, "global_step": 215254, "epoch": 2593} {"train_loss": -24.709089279174805, "global_step": 215255, "epoch": 2593} {"train_loss": -24.118696212768555, "global_step": 215256, "epoch": 2593} {"train_loss": -24.816787719726562, "global_step": 215257, "epoch": 2593} {"train_loss": -24.684345245361328, "global_step": 215258, "epoch": 2593} {"train_loss": -24.578433990478516, "global_step": 215259, "epoch": 2593} {"train_loss": -24.768178939819336, "global_step": 215260, "epoch": 2593} {"train_loss": -24.172048568725586, "global_step": 215261, "epoch": 2593} {"train_loss": -24.792333602905273, "global_step": 215262, "epoch": 2593} {"train_loss": -24.46109962463379, "global_step": 215263, "epoch": 2593} {"train_loss": -24.843250274658203, "global_step": 215264, "epoch": 2593} {"train_loss": -24.775259017944336, "global_step": 215265, "epoch": 2593} {"train_loss": -24.452070236206055, "global_step": 215266, "epoch": 2593} {"train_loss": -24.215316772460938, "global_step": 215267, "epoch": 2593} {"train_loss": -24.528982162475586, "global_step": 215268, "epoch": 2593} {"train_loss": -23.971805572509766, "global_step": 215269, "epoch": 2593} {"train_loss": -24.49224853515625, "global_step": 215270, "epoch": 2593} {"train_loss": -24.781888961791992, "global_step": 215271, "epoch": 2593} {"train_loss": -24.6624813079834, "global_step": 215272, "epoch": 2593} {"train_loss": -24.42085838317871, "global_step": 215273, "epoch": 2593} {"train_loss": -24.506498336791992, "global_step": 215274, "epoch": 2593} {"train_loss": -23.818618774414062, "global_step": 215275, "epoch": 2593} {"train_loss": -24.701078414916992, "global_step": 215276, "epoch": 2593} {"train_loss": -24.226877212524414, "global_step": 215277, "epoch": 2593} {"train_loss": -24.40364646911621, "global_step": 215278, "epoch": 2593} {"train_loss": -24.70576286315918, "global_step": 215279, "epoch": 2593} {"train_loss": -24.77728271484375, "global_step": 215280, "epoch": 2593} {"train_loss": -24.56015396118164, "global_step": 215281, "epoch": 2593} {"train_loss": -25.054401397705078, "global_step": 215282, "epoch": 2593} {"train_loss": -24.430805206298828, "global_step": 215283, "epoch": 2593} {"train_loss": -24.76761245727539, "global_step": 215284, "epoch": 2593} {"train_loss": -24.670276641845703, "global_step": 215285, "epoch": 2593} {"train_loss": -24.654861450195312, "global_step": 215286, "epoch": 2593} {"train_loss": -24.3348445892334, "global_step": 215287, "epoch": 2593} {"train_loss": -24.397859573364258, "global_step": 215288, "epoch": 2593} {"train_loss": -24.451486587524414, "global_step": 215289, "epoch": 2593} {"train_loss": -24.889644622802734, "global_step": 215290, "epoch": 2593} {"train_loss": -24.56160545349121, "global_step": 215291, "epoch": 2593} {"train_loss": -24.660215377807617, "global_step": 215292, "epoch": 2593} {"train_loss": -24.726608276367188, "global_step": 215293, "epoch": 2593} {"train_loss": -24.802595138549805, "global_step": 215294, "epoch": 2593} {"train_loss": -24.5100154876709, "global_step": 215295, "epoch": 2593} {"train_loss": -24.619272232055664, "global_step": 215296, "epoch": 2593} {"train_loss": -24.5505313873291, "global_step": 215297, "epoch": 2593} {"train_loss": -24.478925704956055, "global_step": 215298, "epoch": 2593} {"train_loss": -24.3636474609375, "global_step": 215299, "epoch": 2593} {"train_loss": -24.66619110107422, "global_step": 215300, "epoch": 2593} {"train_loss": -24.515583888593927, "global_step": 215301, "epoch": 2593, "val_loss": 6645164.0} {"train_loss": -24.125164031982422, "global_step": 215302, "epoch": 2594} {"train_loss": -24.150604248046875, "global_step": 215303, "epoch": 2594} {"train_loss": -24.352405548095703, "global_step": 215304, "epoch": 2594} {"train_loss": -24.003997802734375, "global_step": 215305, "epoch": 2594} {"train_loss": -24.161603927612305, "global_step": 215306, "epoch": 2594} {"train_loss": -23.87706184387207, "global_step": 215307, "epoch": 2594} {"train_loss": -24.247854232788086, "global_step": 215308, "epoch": 2594} {"train_loss": -23.823902130126953, "global_step": 215309, "epoch": 2594} {"train_loss": -24.537395477294922, "global_step": 215310, "epoch": 2594} {"train_loss": -24.17111587524414, "global_step": 215311, "epoch": 2594} {"train_loss": -24.38338279724121, "global_step": 215312, "epoch": 2594} {"train_loss": -24.36130714416504, "global_step": 215313, "epoch": 2594} {"train_loss": -24.05592918395996, "global_step": 215314, "epoch": 2594} {"train_loss": -24.11322021484375, "global_step": 215315, "epoch": 2594} {"train_loss": -24.449445724487305, "global_step": 215316, "epoch": 2594} {"train_loss": -24.1162166595459, "global_step": 215317, "epoch": 2594} {"train_loss": -24.329133987426758, "global_step": 215318, "epoch": 2594} {"train_loss": -24.31646156311035, "global_step": 215319, "epoch": 2594} {"train_loss": -24.182580947875977, "global_step": 215320, "epoch": 2594} {"train_loss": -24.223609924316406, "global_step": 215321, "epoch": 2594} {"train_loss": -24.268583297729492, "global_step": 215322, "epoch": 2594} {"train_loss": -24.545984268188477, "global_step": 215323, "epoch": 2594} {"train_loss": -24.407957077026367, "global_step": 215324, "epoch": 2594} {"train_loss": -24.094284057617188, "global_step": 215325, "epoch": 2594} {"train_loss": -24.19952392578125, "global_step": 215326, "epoch": 2594} {"train_loss": -24.184873580932617, "global_step": 215327, "epoch": 2594} {"train_loss": -24.545604705810547, "global_step": 215328, "epoch": 2594} {"train_loss": -24.354164123535156, "global_step": 215329, "epoch": 2594} {"train_loss": -24.613842010498047, "global_step": 215330, "epoch": 2594} {"train_loss": -24.382970809936523, "global_step": 215331, "epoch": 2594} {"train_loss": -24.838016510009766, "global_step": 215332, "epoch": 2594} {"train_loss": -24.524688720703125, "global_step": 215333, "epoch": 2594} {"train_loss": -24.368070602416992, "global_step": 215334, "epoch": 2594} {"train_loss": -24.42426872253418, "global_step": 215335, "epoch": 2594} {"train_loss": -24.445194244384766, "global_step": 215336, "epoch": 2594} {"train_loss": -24.446279525756836, "global_step": 215337, "epoch": 2594} {"train_loss": -24.575132369995117, "global_step": 215338, "epoch": 2594} {"train_loss": -24.656005859375, "global_step": 215339, "epoch": 2594} {"train_loss": -24.27894401550293, "global_step": 215340, "epoch": 2594} {"train_loss": -24.42757225036621, "global_step": 215341, "epoch": 2594} {"train_loss": -24.321420669555664, "global_step": 215342, "epoch": 2594} {"train_loss": -24.78688621520996, "global_step": 215343, "epoch": 2594} {"train_loss": -24.319507598876953, "global_step": 215344, "epoch": 2594} {"train_loss": -24.277685165405273, "global_step": 215345, "epoch": 2594} {"train_loss": -24.469343185424805, "global_step": 215346, "epoch": 2594} {"train_loss": -24.621442794799805, "global_step": 215347, "epoch": 2594} {"train_loss": -24.2326602935791, "global_step": 215348, "epoch": 2594} {"train_loss": -24.542003631591797, "global_step": 215349, "epoch": 2594} {"train_loss": -24.699926376342773, "global_step": 215350, "epoch": 2594} {"train_loss": -24.574125289916992, "global_step": 215351, "epoch": 2594} {"train_loss": -24.888092041015625, "global_step": 215352, "epoch": 2594} {"train_loss": -24.66487693786621, "global_step": 215353, "epoch": 2594} {"train_loss": -24.524099349975586, "global_step": 215354, "epoch": 2594} {"train_loss": -24.38447380065918, "global_step": 215355, "epoch": 2594} {"train_loss": -24.658720016479492, "global_step": 215356, "epoch": 2594} {"train_loss": -24.851797103881836, "global_step": 215357, "epoch": 2594} {"train_loss": -24.43730354309082, "global_step": 215358, "epoch": 2594} {"train_loss": -24.524646759033203, "global_step": 215359, "epoch": 2594} {"train_loss": -24.823625564575195, "global_step": 215360, "epoch": 2594} {"train_loss": -24.606609344482422, "global_step": 215361, "epoch": 2594} {"train_loss": -24.792070388793945, "global_step": 215362, "epoch": 2594} {"train_loss": -25.01436996459961, "global_step": 215363, "epoch": 2594} {"train_loss": -24.562719345092773, "global_step": 215364, "epoch": 2594} {"train_loss": -24.65931510925293, "global_step": 215365, "epoch": 2594} {"train_loss": -24.85055923461914, "global_step": 215366, "epoch": 2594} {"train_loss": -24.61772346496582, "global_step": 215367, "epoch": 2594} {"train_loss": -24.46586799621582, "global_step": 215368, "epoch": 2594} {"train_loss": -24.77662467956543, "global_step": 215369, "epoch": 2594} {"train_loss": -24.5909366607666, "global_step": 215370, "epoch": 2594} {"train_loss": -24.616186141967773, "global_step": 215371, "epoch": 2594} {"train_loss": -24.592697143554688, "global_step": 215372, "epoch": 2594} {"train_loss": -24.34490394592285, "global_step": 215373, "epoch": 2594} {"train_loss": -24.51759910583496, "global_step": 215374, "epoch": 2594} {"train_loss": -24.883642196655273, "global_step": 215375, "epoch": 2594} {"train_loss": -24.5351505279541, "global_step": 215376, "epoch": 2594} {"train_loss": -24.52069664001465, "global_step": 215377, "epoch": 2594} {"train_loss": -24.51948356628418, "global_step": 215378, "epoch": 2594} {"train_loss": -24.678709030151367, "global_step": 215379, "epoch": 2594} {"train_loss": -24.600875854492188, "global_step": 215380, "epoch": 2594} {"train_loss": -24.48949432373047, "global_step": 215381, "epoch": 2594} {"train_loss": -24.72349739074707, "global_step": 215382, "epoch": 2594} {"train_loss": -24.562145233154297, "global_step": 215383, "epoch": 2594} {"train_loss": -24.44485179487481, "global_step": 215384, "epoch": 2594, "val_loss": 6668962.5} {"train_loss": -23.53168296813965, "global_step": 215385, "epoch": 2595} {"train_loss": -23.787168502807617, "global_step": 215386, "epoch": 2595} {"train_loss": -24.16245460510254, "global_step": 215387, "epoch": 2595} {"train_loss": -23.92345428466797, "global_step": 215388, "epoch": 2595} {"train_loss": -24.227598190307617, "global_step": 215389, "epoch": 2595} {"train_loss": -24.092885971069336, "global_step": 215390, "epoch": 2595} {"train_loss": -24.337759017944336, "global_step": 215391, "epoch": 2595} {"train_loss": -24.070781707763672, "global_step": 215392, "epoch": 2595} {"train_loss": -24.2884521484375, "global_step": 215393, "epoch": 2595} {"train_loss": -24.15167808532715, "global_step": 215394, "epoch": 2595} {"train_loss": -24.114809036254883, "global_step": 215395, "epoch": 2595} {"train_loss": -24.11425018310547, "global_step": 215396, "epoch": 2595} {"train_loss": -23.926462173461914, "global_step": 215397, "epoch": 2595} {"train_loss": -24.487516403198242, "global_step": 215398, "epoch": 2595} {"train_loss": -24.567617416381836, "global_step": 215399, "epoch": 2595} {"train_loss": -24.174880981445312, "global_step": 215400, "epoch": 2595} {"train_loss": -24.75196647644043, "global_step": 215401, "epoch": 2595} {"train_loss": -24.540311813354492, "global_step": 215402, "epoch": 2595} {"train_loss": -24.206960678100586, "global_step": 215403, "epoch": 2595} {"train_loss": -24.701696395874023, "global_step": 215404, "epoch": 2595} {"train_loss": -24.45908546447754, "global_step": 215405, "epoch": 2595} {"train_loss": -24.483243942260742, "global_step": 215406, "epoch": 2595} {"train_loss": -24.42932891845703, "global_step": 215407, "epoch": 2595} {"train_loss": -24.436138153076172, "global_step": 215408, "epoch": 2595} {"train_loss": -24.739612579345703, "global_step": 215409, "epoch": 2595} {"train_loss": -24.60219383239746, "global_step": 215410, "epoch": 2595} {"train_loss": -24.32588005065918, "global_step": 215411, "epoch": 2595} {"train_loss": -24.816923141479492, "global_step": 215412, "epoch": 2595} {"train_loss": -24.612668991088867, "global_step": 215413, "epoch": 2595} {"train_loss": -24.131338119506836, "global_step": 215414, "epoch": 2595} {"train_loss": -24.81369400024414, "global_step": 215415, "epoch": 2595} {"train_loss": -24.47075843811035, "global_step": 215416, "epoch": 2595} {"train_loss": -24.761377334594727, "global_step": 215417, "epoch": 2595} {"train_loss": -24.567312240600586, "global_step": 215418, "epoch": 2595} {"train_loss": -24.45319175720215, "global_step": 215419, "epoch": 2595} {"train_loss": -24.81048011779785, "global_step": 215420, "epoch": 2595} {"train_loss": -24.513288497924805, "global_step": 215421, "epoch": 2595} {"train_loss": -24.851194381713867, "global_step": 215422, "epoch": 2595} {"train_loss": -24.74071502685547, "global_step": 215423, "epoch": 2595} {"train_loss": -24.7834529876709, "global_step": 215424, "epoch": 2595} {"train_loss": -24.818817138671875, "global_step": 215425, "epoch": 2595} {"train_loss": -24.77204132080078, "global_step": 215426, "epoch": 2595} {"train_loss": -24.534873962402344, "global_step": 215427, "epoch": 2595} {"train_loss": -24.2597599029541, "global_step": 215428, "epoch": 2595} {"train_loss": -23.9086856842041, "global_step": 215429, "epoch": 2595} {"train_loss": -23.99790382385254, "global_step": 215430, "epoch": 2595} {"train_loss": -24.323078155517578, "global_step": 215431, "epoch": 2595} {"train_loss": -24.352933883666992, "global_step": 215432, "epoch": 2595} {"train_loss": -24.494510650634766, "global_step": 215433, "epoch": 2595} {"train_loss": -24.43675422668457, "global_step": 215434, "epoch": 2595} {"train_loss": -24.381479263305664, "global_step": 215435, "epoch": 2595} {"train_loss": -24.311038970947266, "global_step": 215436, "epoch": 2595} {"train_loss": -24.255617141723633, "global_step": 215437, "epoch": 2595} {"train_loss": -24.71187400817871, "global_step": 215438, "epoch": 2595} {"train_loss": -24.45760154724121, "global_step": 215439, "epoch": 2595} {"train_loss": -24.181798934936523, "global_step": 215440, "epoch": 2595} {"train_loss": -24.556833267211914, "global_step": 215441, "epoch": 2595} {"train_loss": -24.52863121032715, "global_step": 215442, "epoch": 2595} {"train_loss": -24.742292404174805, "global_step": 215443, "epoch": 2595} {"train_loss": -24.355390548706055, "global_step": 215444, "epoch": 2595} {"train_loss": -24.360666275024414, "global_step": 215445, "epoch": 2595} {"train_loss": -24.5272159576416, "global_step": 215446, "epoch": 2595} {"train_loss": -24.54901123046875, "global_step": 215447, "epoch": 2595} {"train_loss": -24.89095687866211, "global_step": 215448, "epoch": 2595} {"train_loss": -24.910581588745117, "global_step": 215449, "epoch": 2595} {"train_loss": -24.222200393676758, "global_step": 215450, "epoch": 2595} {"train_loss": -24.417007446289062, "global_step": 215451, "epoch": 2595} {"train_loss": -24.17742919921875, "global_step": 215452, "epoch": 2595} {"train_loss": -24.461410522460938, "global_step": 215453, "epoch": 2595} {"train_loss": -24.64143180847168, "global_step": 215454, "epoch": 2595} {"train_loss": -24.794645309448242, "global_step": 215455, "epoch": 2595} {"train_loss": -24.474912643432617, "global_step": 215456, "epoch": 2595} {"train_loss": -24.753559112548828, "global_step": 215457, "epoch": 2595} {"train_loss": -24.776031494140625, "global_step": 215458, "epoch": 2595} {"train_loss": -24.763065338134766, "global_step": 215459, "epoch": 2595} {"train_loss": -24.578786849975586, "global_step": 215460, "epoch": 2595} {"train_loss": -24.888914108276367, "global_step": 215461, "epoch": 2595} {"train_loss": -24.546707153320312, "global_step": 215462, "epoch": 2595} {"train_loss": -24.349227905273438, "global_step": 215463, "epoch": 2595} {"train_loss": -24.76600456237793, "global_step": 215464, "epoch": 2595} {"train_loss": -24.702356338500977, "global_step": 215465, "epoch": 2595} {"train_loss": -24.468048095703125, "global_step": 215466, "epoch": 2595} {"train_loss": -24.452522461672864, "global_step": 215467, "epoch": 2595, "val_loss": 6701053.0} {"train_loss": -23.387069702148438, "global_step": 215468, "epoch": 2596} {"train_loss": -23.481815338134766, "global_step": 215469, "epoch": 2596} {"train_loss": -24.351110458374023, "global_step": 215470, "epoch": 2596} {"train_loss": -23.7613468170166, "global_step": 215471, "epoch": 2596} {"train_loss": -24.116092681884766, "global_step": 215472, "epoch": 2596} {"train_loss": -24.395721435546875, "global_step": 215473, "epoch": 2596} {"train_loss": -24.0120792388916, "global_step": 215474, "epoch": 2596} {"train_loss": -24.238134384155273, "global_step": 215475, "epoch": 2596} {"train_loss": -24.312793731689453, "global_step": 215476, "epoch": 2596} {"train_loss": -24.223081588745117, "global_step": 215477, "epoch": 2596} {"train_loss": -23.937387466430664, "global_step": 215478, "epoch": 2596} {"train_loss": -23.91433334350586, "global_step": 215479, "epoch": 2596} {"train_loss": -24.175704956054688, "global_step": 215480, "epoch": 2596} {"train_loss": -24.21535301208496, "global_step": 215481, "epoch": 2596} {"train_loss": -24.59296226501465, "global_step": 215482, "epoch": 2596} {"train_loss": -24.17661476135254, "global_step": 215483, "epoch": 2596} {"train_loss": -24.126394271850586, "global_step": 215484, "epoch": 2596} {"train_loss": -24.192441940307617, "global_step": 215485, "epoch": 2596} {"train_loss": -24.434627532958984, "global_step": 215486, "epoch": 2596} {"train_loss": -24.15226936340332, "global_step": 215487, "epoch": 2596} {"train_loss": -24.372114181518555, "global_step": 215488, "epoch": 2596} {"train_loss": -24.481922149658203, "global_step": 215489, "epoch": 2596} {"train_loss": -24.512983322143555, "global_step": 215490, "epoch": 2596} {"train_loss": -24.52314567565918, "global_step": 215491, "epoch": 2596} {"train_loss": -24.497745513916016, "global_step": 215492, "epoch": 2596} {"train_loss": -24.433414459228516, "global_step": 215493, "epoch": 2596} {"train_loss": -24.549713134765625, "global_step": 215494, "epoch": 2596} {"train_loss": -24.091135025024414, "global_step": 215495, "epoch": 2596} {"train_loss": -24.73794937133789, "global_step": 215496, "epoch": 2596} {"train_loss": -24.234594345092773, "global_step": 215497, "epoch": 2596} {"train_loss": -24.767541885375977, "global_step": 215498, "epoch": 2596} {"train_loss": -24.669116973876953, "global_step": 215499, "epoch": 2596} {"train_loss": -24.407562255859375, "global_step": 215500, "epoch": 2596} {"train_loss": -24.90463638305664, "global_step": 215501, "epoch": 2596} {"train_loss": -24.221582412719727, "global_step": 215502, "epoch": 2596} {"train_loss": -24.317041397094727, "global_step": 215503, "epoch": 2596} {"train_loss": -24.441932678222656, "global_step": 215504, "epoch": 2596} {"train_loss": -24.80586051940918, "global_step": 215505, "epoch": 2596} {"train_loss": -24.416955947875977, "global_step": 215506, "epoch": 2596} {"train_loss": -24.424707412719727, "global_step": 215507, "epoch": 2596} {"train_loss": -24.71813201904297, "global_step": 215508, "epoch": 2596} {"train_loss": -24.758319854736328, "global_step": 215509, "epoch": 2596} {"train_loss": -24.327762603759766, "global_step": 215510, "epoch": 2596} {"train_loss": -24.460792541503906, "global_step": 215511, "epoch": 2596} {"train_loss": -24.47195816040039, "global_step": 215512, "epoch": 2596} {"train_loss": -24.61031723022461, "global_step": 215513, "epoch": 2596} {"train_loss": -24.597702026367188, "global_step": 215514, "epoch": 2596} {"train_loss": -24.45188331604004, "global_step": 215515, "epoch": 2596} {"train_loss": -24.616437911987305, "global_step": 215516, "epoch": 2596} {"train_loss": -24.14112663269043, "global_step": 215517, "epoch": 2596} {"train_loss": -23.610626220703125, "global_step": 215518, "epoch": 2596} {"train_loss": -23.974143981933594, "global_step": 215519, "epoch": 2596} {"train_loss": -24.31808853149414, "global_step": 215520, "epoch": 2596} {"train_loss": -24.18106460571289, "global_step": 215521, "epoch": 2596} {"train_loss": -24.436664581298828, "global_step": 215522, "epoch": 2596} {"train_loss": -24.1657772064209, "global_step": 215523, "epoch": 2596} {"train_loss": -24.319095611572266, "global_step": 215524, "epoch": 2596} {"train_loss": -24.599620819091797, "global_step": 215525, "epoch": 2596} {"train_loss": -24.359731674194336, "global_step": 215526, "epoch": 2596} {"train_loss": -24.59372329711914, "global_step": 215527, "epoch": 2596} {"train_loss": -24.3846378326416, "global_step": 215528, "epoch": 2596} {"train_loss": -24.170339584350586, "global_step": 215529, "epoch": 2596} {"train_loss": -24.244741439819336, "global_step": 215530, "epoch": 2596} {"train_loss": -24.38355827331543, "global_step": 215531, "epoch": 2596} {"train_loss": -24.239038467407227, "global_step": 215532, "epoch": 2596} {"train_loss": -24.86836051940918, "global_step": 215533, "epoch": 2596} {"train_loss": -24.285144805908203, "global_step": 215534, "epoch": 2596} {"train_loss": -24.572343826293945, "global_step": 215535, "epoch": 2596} {"train_loss": -24.30198097229004, "global_step": 215536, "epoch": 2596} {"train_loss": -24.448062896728516, "global_step": 215537, "epoch": 2596} {"train_loss": -24.493223190307617, "global_step": 215538, "epoch": 2596} {"train_loss": -24.86836814880371, "global_step": 215539, "epoch": 2596} {"train_loss": -24.155879974365234, "global_step": 215540, "epoch": 2596} {"train_loss": -24.693317413330078, "global_step": 215541, "epoch": 2596} {"train_loss": -24.597192764282227, "global_step": 215542, "epoch": 2596} {"train_loss": -24.582870483398438, "global_step": 215543, "epoch": 2596} {"train_loss": -24.719593048095703, "global_step": 215544, "epoch": 2596} {"train_loss": -24.609952926635742, "global_step": 215545, "epoch": 2596} {"train_loss": -24.65185546875, "global_step": 215546, "epoch": 2596} {"train_loss": -24.491636276245117, "global_step": 215547, "epoch": 2596} {"train_loss": -24.745895385742188, "global_step": 215548, "epoch": 2596} {"train_loss": -24.62451171875, "global_step": 215549, "epoch": 2596} {"train_loss": -24.374921959566784, "global_step": 215550, "epoch": 2596, "val_loss": 6737779.0} {"train_loss": -23.4445858001709, "global_step": 215551, "epoch": 2597} {"train_loss": -24.18006706237793, "global_step": 215552, "epoch": 2597} {"train_loss": -23.644315719604492, "global_step": 215553, "epoch": 2597} {"train_loss": -23.6367244720459, "global_step": 215554, "epoch": 2597} {"train_loss": -23.20713996887207, "global_step": 215555, "epoch": 2597} {"train_loss": -24.314029693603516, "global_step": 215556, "epoch": 2597} {"train_loss": -23.541522979736328, "global_step": 215557, "epoch": 2597} {"train_loss": -24.03243637084961, "global_step": 215558, "epoch": 2597} {"train_loss": -24.07862663269043, "global_step": 215559, "epoch": 2597} {"train_loss": -24.11469841003418, "global_step": 215560, "epoch": 2597} {"train_loss": -24.104263305664062, "global_step": 215561, "epoch": 2597} {"train_loss": -23.952590942382812, "global_step": 215562, "epoch": 2597} {"train_loss": -23.89198112487793, "global_step": 215563, "epoch": 2597} {"train_loss": -23.99553871154785, "global_step": 215564, "epoch": 2597} {"train_loss": -24.11073112487793, "global_step": 215565, "epoch": 2597} {"train_loss": -23.740564346313477, "global_step": 215566, "epoch": 2597} {"train_loss": -24.474214553833008, "global_step": 215567, "epoch": 2597} {"train_loss": -24.337127685546875, "global_step": 215568, "epoch": 2597} {"train_loss": -23.948911666870117, "global_step": 215569, "epoch": 2597} {"train_loss": -24.301359176635742, "global_step": 215570, "epoch": 2597} {"train_loss": -24.126955032348633, "global_step": 215571, "epoch": 2597} {"train_loss": -24.47474479675293, "global_step": 215572, "epoch": 2597} {"train_loss": -24.327919006347656, "global_step": 215573, "epoch": 2597} {"train_loss": -23.966625213623047, "global_step": 215574, "epoch": 2597} {"train_loss": -24.67438316345215, "global_step": 215575, "epoch": 2597} {"train_loss": -24.46619987487793, "global_step": 215576, "epoch": 2597} {"train_loss": -24.38522720336914, "global_step": 215577, "epoch": 2597} {"train_loss": -24.527996063232422, "global_step": 215578, "epoch": 2597} {"train_loss": -24.34364891052246, "global_step": 215579, "epoch": 2597} {"train_loss": -23.92225456237793, "global_step": 215580, "epoch": 2597} {"train_loss": -24.61936378479004, "global_step": 215581, "epoch": 2597} {"train_loss": -24.4666805267334, "global_step": 215582, "epoch": 2597} {"train_loss": -24.60869026184082, "global_step": 215583, "epoch": 2597} {"train_loss": -24.565784454345703, "global_step": 215584, "epoch": 2597} {"train_loss": -24.481184005737305, "global_step": 215585, "epoch": 2597} {"train_loss": -24.14325523376465, "global_step": 215586, "epoch": 2597} {"train_loss": -24.3105411529541, "global_step": 215587, "epoch": 2597} {"train_loss": -24.09868812561035, "global_step": 215588, "epoch": 2597} {"train_loss": -24.562917709350586, "global_step": 215589, "epoch": 2597} {"train_loss": -24.465116500854492, "global_step": 215590, "epoch": 2597} {"train_loss": -24.254276275634766, "global_step": 215591, "epoch": 2597} {"train_loss": -24.582237243652344, "global_step": 215592, "epoch": 2597} {"train_loss": -24.51321792602539, "global_step": 215593, "epoch": 2597} {"train_loss": -24.466588973999023, "global_step": 215594, "epoch": 2597} {"train_loss": -24.353790283203125, "global_step": 215595, "epoch": 2597} {"train_loss": -24.367755889892578, "global_step": 215596, "epoch": 2597} {"train_loss": -24.66774559020996, "global_step": 215597, "epoch": 2597} {"train_loss": -24.18085289001465, "global_step": 215598, "epoch": 2597} {"train_loss": -24.56416893005371, "global_step": 215599, "epoch": 2597} {"train_loss": -24.443920135498047, "global_step": 215600, "epoch": 2597} {"train_loss": -24.39315414428711, "global_step": 215601, "epoch": 2597} {"train_loss": -24.449010848999023, "global_step": 215602, "epoch": 2597} {"train_loss": -24.331283569335938, "global_step": 215603, "epoch": 2597} {"train_loss": -24.674875259399414, "global_step": 215604, "epoch": 2597} {"train_loss": -24.44464683532715, "global_step": 215605, "epoch": 2597} {"train_loss": -24.503700256347656, "global_step": 215606, "epoch": 2597} {"train_loss": -25.01493263244629, "global_step": 215607, "epoch": 2597} {"train_loss": -24.85090446472168, "global_step": 215608, "epoch": 2597} {"train_loss": -24.68428611755371, "global_step": 215609, "epoch": 2597} {"train_loss": -24.682910919189453, "global_step": 215610, "epoch": 2597} {"train_loss": -24.66138458251953, "global_step": 215611, "epoch": 2597} {"train_loss": -24.446664810180664, "global_step": 215612, "epoch": 2597} {"train_loss": -24.445913314819336, "global_step": 215613, "epoch": 2597} {"train_loss": -24.65496253967285, "global_step": 215614, "epoch": 2597} {"train_loss": -24.238996505737305, "global_step": 215615, "epoch": 2597} {"train_loss": -24.41211700439453, "global_step": 215616, "epoch": 2597} {"train_loss": -24.40325164794922, "global_step": 215617, "epoch": 2597} {"train_loss": -25.168575286865234, "global_step": 215618, "epoch": 2597} {"train_loss": -24.478290557861328, "global_step": 215619, "epoch": 2597} {"train_loss": -24.51161766052246, "global_step": 215620, "epoch": 2597} {"train_loss": -24.743473052978516, "global_step": 215621, "epoch": 2597} {"train_loss": -24.643573760986328, "global_step": 215622, "epoch": 2597} {"train_loss": -24.784799575805664, "global_step": 215623, "epoch": 2597} {"train_loss": -24.859067916870117, "global_step": 215624, "epoch": 2597} {"train_loss": -24.668119430541992, "global_step": 215625, "epoch": 2597} {"train_loss": -24.4954776763916, "global_step": 215626, "epoch": 2597} {"train_loss": -24.279897689819336, "global_step": 215627, "epoch": 2597} {"train_loss": -24.260211944580078, "global_step": 215628, "epoch": 2597} {"train_loss": -24.631986618041992, "global_step": 215629, "epoch": 2597} {"train_loss": -24.36732292175293, "global_step": 215630, "epoch": 2597} {"train_loss": -24.26460075378418, "global_step": 215631, "epoch": 2597} {"train_loss": -24.1169376373291, "global_step": 215632, "epoch": 2597} {"train_loss": -24.337465906717693, "global_step": 215633, "epoch": 2597, "val_loss": 6673322.0} {"train_loss": -23.941303253173828, "global_step": 215634, "epoch": 2598} {"train_loss": -24.00147819519043, "global_step": 215635, "epoch": 2598} {"train_loss": -24.33521842956543, "global_step": 215636, "epoch": 2598} {"train_loss": -24.48287010192871, "global_step": 215637, "epoch": 2598} {"train_loss": -24.362802505493164, "global_step": 215638, "epoch": 2598} {"train_loss": -24.07992172241211, "global_step": 215639, "epoch": 2598} {"train_loss": -24.280431747436523, "global_step": 215640, "epoch": 2598} {"train_loss": -24.51643180847168, "global_step": 215641, "epoch": 2598} {"train_loss": -23.998991012573242, "global_step": 215642, "epoch": 2598} {"train_loss": -23.660690307617188, "global_step": 215643, "epoch": 2598} {"train_loss": -24.4326229095459, "global_step": 215644, "epoch": 2598} {"train_loss": -23.63495445251465, "global_step": 215645, "epoch": 2598} {"train_loss": -24.107826232910156, "global_step": 215646, "epoch": 2598} {"train_loss": -24.4748477935791, "global_step": 215647, "epoch": 2598} {"train_loss": -23.6689395904541, "global_step": 215648, "epoch": 2598} {"train_loss": -24.221288681030273, "global_step": 215649, "epoch": 2598} {"train_loss": -24.49346160888672, "global_step": 215650, "epoch": 2598} {"train_loss": -23.78885269165039, "global_step": 215651, "epoch": 2598} {"train_loss": -24.441579818725586, "global_step": 215652, "epoch": 2598} {"train_loss": -24.05320930480957, "global_step": 215653, "epoch": 2598} {"train_loss": -24.542678833007812, "global_step": 215654, "epoch": 2598} {"train_loss": -24.22428321838379, "global_step": 215655, "epoch": 2598} {"train_loss": -24.051406860351562, "global_step": 215656, "epoch": 2598} {"train_loss": -24.012048721313477, "global_step": 215657, "epoch": 2598} {"train_loss": -24.483823776245117, "global_step": 215658, "epoch": 2598} {"train_loss": -24.055389404296875, "global_step": 215659, "epoch": 2598} {"train_loss": -24.816078186035156, "global_step": 215660, "epoch": 2598} {"train_loss": -24.68975257873535, "global_step": 215661, "epoch": 2598} {"train_loss": -24.483816146850586, "global_step": 215662, "epoch": 2598} {"train_loss": -24.360937118530273, "global_step": 215663, "epoch": 2598} {"train_loss": -24.339859008789062, "global_step": 215664, "epoch": 2598} {"train_loss": -24.72833824157715, "global_step": 215665, "epoch": 2598} {"train_loss": -24.508100509643555, "global_step": 215666, "epoch": 2598} {"train_loss": -24.477590560913086, "global_step": 215667, "epoch": 2598} {"train_loss": -24.808218002319336, "global_step": 215668, "epoch": 2598} {"train_loss": -24.48859214782715, "global_step": 215669, "epoch": 2598} {"train_loss": -24.10123634338379, "global_step": 215670, "epoch": 2598} {"train_loss": -24.825693130493164, "global_step": 215671, "epoch": 2598} {"train_loss": -24.71889305114746, "global_step": 215672, "epoch": 2598} {"train_loss": -24.44534683227539, "global_step": 215673, "epoch": 2598} {"train_loss": -24.335224151611328, "global_step": 215674, "epoch": 2598} {"train_loss": -24.69453239440918, "global_step": 215675, "epoch": 2598} {"train_loss": -24.60186195373535, "global_step": 215676, "epoch": 2598} {"train_loss": -24.802322387695312, "global_step": 215677, "epoch": 2598} {"train_loss": -24.471967697143555, "global_step": 215678, "epoch": 2598} {"train_loss": -24.62860679626465, "global_step": 215679, "epoch": 2598} {"train_loss": -24.53122329711914, "global_step": 215680, "epoch": 2598} {"train_loss": -24.69386100769043, "global_step": 215681, "epoch": 2598} {"train_loss": -24.498594284057617, "global_step": 215682, "epoch": 2598} {"train_loss": -24.472929000854492, "global_step": 215683, "epoch": 2598} {"train_loss": -24.940933227539062, "global_step": 215684, "epoch": 2598} {"train_loss": -24.725126266479492, "global_step": 215685, "epoch": 2598} {"train_loss": -24.60860824584961, "global_step": 215686, "epoch": 2598} {"train_loss": -24.584697723388672, "global_step": 215687, "epoch": 2598} {"train_loss": -24.75887107849121, "global_step": 215688, "epoch": 2598} {"train_loss": -24.495071411132812, "global_step": 215689, "epoch": 2598} {"train_loss": -24.534006118774414, "global_step": 215690, "epoch": 2598} {"train_loss": -24.630264282226562, "global_step": 215691, "epoch": 2598} {"train_loss": -24.28042984008789, "global_step": 215692, "epoch": 2598} {"train_loss": -24.766979217529297, "global_step": 215693, "epoch": 2598} {"train_loss": -24.293487548828125, "global_step": 215694, "epoch": 2598} {"train_loss": -24.532033920288086, "global_step": 215695, "epoch": 2598} {"train_loss": -24.52191734313965, "global_step": 215696, "epoch": 2598} {"train_loss": -23.979843139648438, "global_step": 215697, "epoch": 2598} {"train_loss": -23.67095184326172, "global_step": 215698, "epoch": 2598} {"train_loss": -23.100479125976562, "global_step": 215699, "epoch": 2598} {"train_loss": -24.24317169189453, "global_step": 215700, "epoch": 2598} {"train_loss": -23.845434188842773, "global_step": 215701, "epoch": 2598} {"train_loss": -23.823257446289062, "global_step": 215702, "epoch": 2598} {"train_loss": -23.588903427124023, "global_step": 215703, "epoch": 2598} {"train_loss": -24.231687545776367, "global_step": 215704, "epoch": 2598} {"train_loss": -23.572683334350586, "global_step": 215705, "epoch": 2598} {"train_loss": -24.284940719604492, "global_step": 215706, "epoch": 2598} {"train_loss": -23.92287254333496, "global_step": 215707, "epoch": 2598} {"train_loss": -24.192039489746094, "global_step": 215708, "epoch": 2598} {"train_loss": -23.803800582885742, "global_step": 215709, "epoch": 2598} {"train_loss": -23.995933532714844, "global_step": 215710, "epoch": 2598} {"train_loss": -23.871360778808594, "global_step": 215711, "epoch": 2598} {"train_loss": -24.324607849121094, "global_step": 215712, "epoch": 2598} {"train_loss": -23.868131637573242, "global_step": 215713, "epoch": 2598} {"train_loss": -24.257959365844727, "global_step": 215714, "epoch": 2598} {"train_loss": -24.268095016479492, "global_step": 215715, "epoch": 2598} {"train_loss": -24.287213589771685, "global_step": 215716, "epoch": 2598, "val_loss": 6717032.5} {"train_loss": -23.783559799194336, "global_step": 215717, "epoch": 2599} {"train_loss": -24.012876510620117, "global_step": 215718, "epoch": 2599} {"train_loss": -24.293367385864258, "global_step": 215719, "epoch": 2599} {"train_loss": -23.90628433227539, "global_step": 215720, "epoch": 2599} {"train_loss": -23.95822525024414, "global_step": 215721, "epoch": 2599} {"train_loss": -24.28915786743164, "global_step": 215722, "epoch": 2599} {"train_loss": -24.2086181640625, "global_step": 215723, "epoch": 2599} {"train_loss": -24.558765411376953, "global_step": 215724, "epoch": 2599} {"train_loss": -23.757848739624023, "global_step": 215725, "epoch": 2599} {"train_loss": -24.387805938720703, "global_step": 215726, "epoch": 2599} {"train_loss": -24.4677677154541, "global_step": 215727, "epoch": 2599} {"train_loss": -24.036184310913086, "global_step": 215728, "epoch": 2599} {"train_loss": -24.273326873779297, "global_step": 215729, "epoch": 2599} {"train_loss": -24.531248092651367, "global_step": 215730, "epoch": 2599} {"train_loss": -24.535724639892578, "global_step": 215731, "epoch": 2599} {"train_loss": -24.03339958190918, "global_step": 215732, "epoch": 2599} {"train_loss": -24.412307739257812, "global_step": 215733, "epoch": 2599} {"train_loss": -24.32936668395996, "global_step": 215734, "epoch": 2599} {"train_loss": -24.33292007446289, "global_step": 215735, "epoch": 2599} {"train_loss": -24.23702049255371, "global_step": 215736, "epoch": 2599} {"train_loss": -24.36789321899414, "global_step": 215737, "epoch": 2599} {"train_loss": -24.48367691040039, "global_step": 215738, "epoch": 2599} {"train_loss": -24.424705505371094, "global_step": 215739, "epoch": 2599} {"train_loss": -24.58746910095215, "global_step": 215740, "epoch": 2599} {"train_loss": -24.53057289123535, "global_step": 215741, "epoch": 2599} {"train_loss": -24.70589828491211, "global_step": 215742, "epoch": 2599} {"train_loss": -24.264755249023438, "global_step": 215743, "epoch": 2599} {"train_loss": -24.6020565032959, "global_step": 215744, "epoch": 2599} {"train_loss": -24.0651798248291, "global_step": 215745, "epoch": 2599} {"train_loss": -24.34870719909668, "global_step": 215746, "epoch": 2599} {"train_loss": -24.844045639038086, "global_step": 215747, "epoch": 2599} {"train_loss": -24.324331283569336, "global_step": 215748, "epoch": 2599} {"train_loss": -24.14603042602539, "global_step": 215749, "epoch": 2599} {"train_loss": -24.70682144165039, "global_step": 215750, "epoch": 2599} {"train_loss": -24.442562103271484, "global_step": 215751, "epoch": 2599} {"train_loss": -24.93888282775879, "global_step": 215752, "epoch": 2599} {"train_loss": -24.692779541015625, "global_step": 215753, "epoch": 2599} {"train_loss": -24.502592086791992, "global_step": 215754, "epoch": 2599} {"train_loss": -24.72542381286621, "global_step": 215755, "epoch": 2599} {"train_loss": -24.803653717041016, "global_step": 215756, "epoch": 2599} {"train_loss": -24.153507232666016, "global_step": 215757, "epoch": 2599} {"train_loss": -24.63063621520996, "global_step": 215758, "epoch": 2599} {"train_loss": -24.541982650756836, "global_step": 215759, "epoch": 2599} {"train_loss": -24.50007438659668, "global_step": 215760, "epoch": 2599} {"train_loss": -24.554813385009766, "global_step": 215761, "epoch": 2599} {"train_loss": -24.516681671142578, "global_step": 215762, "epoch": 2599} {"train_loss": -24.601484298706055, "global_step": 215763, "epoch": 2599} {"train_loss": -24.353900909423828, "global_step": 215764, "epoch": 2599} {"train_loss": -24.60843849182129, "global_step": 215765, "epoch": 2599} {"train_loss": -24.78246307373047, "global_step": 215766, "epoch": 2599} {"train_loss": -24.502256393432617, "global_step": 215767, "epoch": 2599} {"train_loss": -24.811769485473633, "global_step": 215768, "epoch": 2599} {"train_loss": -24.471904754638672, "global_step": 215769, "epoch": 2599} {"train_loss": -24.675193786621094, "global_step": 215770, "epoch": 2599} {"train_loss": -24.124908447265625, "global_step": 215771, "epoch": 2599} {"train_loss": -24.422590255737305, "global_step": 215772, "epoch": 2599} {"train_loss": -24.761049270629883, "global_step": 215773, "epoch": 2599} {"train_loss": -24.210824966430664, "global_step": 215774, "epoch": 2599} {"train_loss": -24.24176025390625, "global_step": 215775, "epoch": 2599} {"train_loss": -24.67767333984375, "global_step": 215776, "epoch": 2599} {"train_loss": -24.341079711914062, "global_step": 215777, "epoch": 2599} {"train_loss": -24.42209243774414, "global_step": 215778, "epoch": 2599} {"train_loss": -24.052356719970703, "global_step": 215779, "epoch": 2599} {"train_loss": -24.54020118713379, "global_step": 215780, "epoch": 2599} {"train_loss": -24.703886032104492, "global_step": 215781, "epoch": 2599} {"train_loss": -24.300886154174805, "global_step": 215782, "epoch": 2599} {"train_loss": -24.7645320892334, "global_step": 215783, "epoch": 2599} {"train_loss": -24.790977478027344, "global_step": 215784, "epoch": 2599} {"train_loss": -24.68956756591797, "global_step": 215785, "epoch": 2599} {"train_loss": -24.49274253845215, "global_step": 215786, "epoch": 2599} {"train_loss": -24.59016227722168, "global_step": 215787, "epoch": 2599} {"train_loss": -24.473831176757812, "global_step": 215788, "epoch": 2599} {"train_loss": -24.388795852661133, "global_step": 215789, "epoch": 2599} {"train_loss": -24.768930435180664, "global_step": 215790, "epoch": 2599} {"train_loss": -24.539743423461914, "global_step": 215791, "epoch": 2599} {"train_loss": -24.123838424682617, "global_step": 215792, "epoch": 2599} {"train_loss": -24.543222427368164, "global_step": 215793, "epoch": 2599} {"train_loss": -24.990760803222656, "global_step": 215794, "epoch": 2599} {"train_loss": -24.497421264648438, "global_step": 215795, "epoch": 2599} {"train_loss": -24.46510124206543, "global_step": 215796, "epoch": 2599} {"train_loss": -24.74639320373535, "global_step": 215797, "epoch": 2599} {"train_loss": -24.674707412719727, "global_step": 215798, "epoch": 2599} {"train_loss": -24.469454064426653, "global_step": 215799, "epoch": 2599, "val_loss": 6626057.0} {"train_loss": -24.119552612304688, "global_step": 215800, "epoch": 2600} {"train_loss": -24.341299057006836, "global_step": 215801, "epoch": 2600} {"train_loss": -24.723695755004883, "global_step": 215802, "epoch": 2600} {"train_loss": -23.916778564453125, "global_step": 215803, "epoch": 2600} {"train_loss": -23.87553596496582, "global_step": 215804, "epoch": 2600} {"train_loss": -24.22430419921875, "global_step": 215805, "epoch": 2600} {"train_loss": -23.75971031188965, "global_step": 215806, "epoch": 2600} {"train_loss": -23.57587432861328, "global_step": 215807, "epoch": 2600} {"train_loss": -24.14572525024414, "global_step": 215808, "epoch": 2600} {"train_loss": -23.886980056762695, "global_step": 215809, "epoch": 2600} {"train_loss": -24.26460838317871, "global_step": 215810, "epoch": 2600} {"train_loss": -24.013263702392578, "global_step": 215811, "epoch": 2600} {"train_loss": -23.866090774536133, "global_step": 215812, "epoch": 2600} {"train_loss": -24.165647506713867, "global_step": 215813, "epoch": 2600} {"train_loss": -24.62016487121582, "global_step": 215814, "epoch": 2600} {"train_loss": -24.175785064697266, "global_step": 215815, "epoch": 2600} {"train_loss": -24.323339462280273, "global_step": 215816, "epoch": 2600} {"train_loss": -24.414337158203125, "global_step": 215817, "epoch": 2600} {"train_loss": -24.44439125061035, "global_step": 215818, "epoch": 2600} {"train_loss": -24.57781219482422, "global_step": 215819, "epoch": 2600} {"train_loss": -23.848426818847656, "global_step": 215820, "epoch": 2600} {"train_loss": -24.49651527404785, "global_step": 215821, "epoch": 2600} {"train_loss": -24.662534713745117, "global_step": 215822, "epoch": 2600} {"train_loss": -24.64739990234375, "global_step": 215823, "epoch": 2600} {"train_loss": -24.55177879333496, "global_step": 215824, "epoch": 2600} {"train_loss": -24.22373390197754, "global_step": 215825, "epoch": 2600} {"train_loss": -24.810302734375, "global_step": 215826, "epoch": 2600} {"train_loss": -24.83595848083496, "global_step": 215827, "epoch": 2600} {"train_loss": -24.27216148376465, "global_step": 215828, "epoch": 2600} {"train_loss": -24.56194305419922, "global_step": 215829, "epoch": 2600} {"train_loss": -24.692310333251953, "global_step": 215830, "epoch": 2600} {"train_loss": -24.388879776000977, "global_step": 215831, "epoch": 2600} {"train_loss": -24.496122360229492, "global_step": 215832, "epoch": 2600} {"train_loss": -24.446332931518555, "global_step": 215833, "epoch": 2600} {"train_loss": -24.42510986328125, "global_step": 215834, "epoch": 2600} {"train_loss": -24.51124382019043, "global_step": 215835, "epoch": 2600} {"train_loss": -24.446237564086914, "global_step": 215836, "epoch": 2600} {"train_loss": -24.574771881103516, "global_step": 215837, "epoch": 2600} {"train_loss": -24.43326187133789, "global_step": 215838, "epoch": 2600} {"train_loss": -24.372146606445312, "global_step": 215839, "epoch": 2600} {"train_loss": -24.065162658691406, "global_step": 215840, "epoch": 2600} {"train_loss": -24.888113021850586, "global_step": 215841, "epoch": 2600} {"train_loss": -24.51750373840332, "global_step": 215842, "epoch": 2600} {"train_loss": -24.671363830566406, "global_step": 215843, "epoch": 2600} {"train_loss": -24.726835250854492, "global_step": 215844, "epoch": 2600} {"train_loss": -24.673768997192383, "global_step": 215845, "epoch": 2600} {"train_loss": -24.593610763549805, "global_step": 215846, "epoch": 2600} {"train_loss": -24.94251251220703, "global_step": 215847, "epoch": 2600} {"train_loss": -24.635578155517578, "global_step": 215848, "epoch": 2600} {"train_loss": -24.648874282836914, "global_step": 215849, "epoch": 2600} {"train_loss": -24.989652633666992, "global_step": 215850, "epoch": 2600} {"train_loss": -24.442108154296875, "global_step": 215851, "epoch": 2600} {"train_loss": -24.66765594482422, "global_step": 215852, "epoch": 2600} {"train_loss": -24.751113891601562, "global_step": 215853, "epoch": 2600} {"train_loss": -24.509220123291016, "global_step": 215854, "epoch": 2600} {"train_loss": -24.360280990600586, "global_step": 215855, "epoch": 2600} {"train_loss": -24.75876808166504, "global_step": 215856, "epoch": 2600} {"train_loss": -24.608488082885742, "global_step": 215857, "epoch": 2600} {"train_loss": -24.691198348999023, "global_step": 215858, "epoch": 2600} {"train_loss": -24.45856285095215, "global_step": 215859, "epoch": 2600} {"train_loss": -24.512113571166992, "global_step": 215860, "epoch": 2600} {"train_loss": -24.614665985107422, "global_step": 215861, "epoch": 2600} {"train_loss": -24.781585693359375, "global_step": 215862, "epoch": 2600} {"train_loss": -24.78993034362793, "global_step": 215863, "epoch": 2600} {"train_loss": -24.742231369018555, "global_step": 215864, "epoch": 2600} {"train_loss": -24.92547607421875, "global_step": 215865, "epoch": 2600} {"train_loss": -24.843942642211914, "global_step": 215866, "epoch": 2600} {"train_loss": -24.961063385009766, "global_step": 215867, "epoch": 2600} {"train_loss": -24.423776626586914, "global_step": 215868, "epoch": 2600} {"train_loss": -24.43787956237793, "global_step": 215869, "epoch": 2600} {"train_loss": -24.42575454711914, "global_step": 215870, "epoch": 2600} {"train_loss": -24.040395736694336, "global_step": 215871, "epoch": 2600} {"train_loss": -24.320575714111328, "global_step": 215872, "epoch": 2600} {"train_loss": -24.574308395385742, "global_step": 215873, "epoch": 2600} {"train_loss": -24.802953720092773, "global_step": 215874, "epoch": 2600} {"train_loss": -23.92247772216797, "global_step": 215875, "epoch": 2600} {"train_loss": -24.131534576416016, "global_step": 215876, "epoch": 2600} {"train_loss": -24.235000610351562, "global_step": 215877, "epoch": 2600} {"train_loss": -24.693601608276367, "global_step": 215878, "epoch": 2600} {"train_loss": -24.070873260498047, "global_step": 215879, "epoch": 2600} {"train_loss": -24.49863624572754, "global_step": 215880, "epoch": 2600} {"train_loss": -24.347875595092773, "global_step": 215881, "epoch": 2600} {"train_loss": -24.45254771680717, "global_step": 215882, "epoch": 2600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6649553.0} {"train_loss": -23.903606414794922, "global_step": 215883, "epoch": 2601} {"train_loss": -24.062612533569336, "global_step": 215884, "epoch": 2601} {"train_loss": -24.034177780151367, "global_step": 215885, "epoch": 2601} {"train_loss": -23.93023109436035, "global_step": 215886, "epoch": 2601} {"train_loss": -23.876298904418945, "global_step": 215887, "epoch": 2601} {"train_loss": -24.028453826904297, "global_step": 215888, "epoch": 2601} {"train_loss": -24.375492095947266, "global_step": 215889, "epoch": 2601} {"train_loss": -23.656919479370117, "global_step": 215890, "epoch": 2601} {"train_loss": -23.831302642822266, "global_step": 215891, "epoch": 2601} {"train_loss": -24.26172637939453, "global_step": 215892, "epoch": 2601} {"train_loss": -24.201274871826172, "global_step": 215893, "epoch": 2601} {"train_loss": -23.713134765625, "global_step": 215894, "epoch": 2601} {"train_loss": -23.987327575683594, "global_step": 215895, "epoch": 2601} {"train_loss": -24.346872329711914, "global_step": 215896, "epoch": 2601} {"train_loss": -24.328052520751953, "global_step": 215897, "epoch": 2601} {"train_loss": -24.010055541992188, "global_step": 215898, "epoch": 2601} {"train_loss": -24.51972007751465, "global_step": 215899, "epoch": 2601} {"train_loss": -24.09840202331543, "global_step": 215900, "epoch": 2601} {"train_loss": -23.931533813476562, "global_step": 215901, "epoch": 2601} {"train_loss": -24.52442741394043, "global_step": 215902, "epoch": 2601} {"train_loss": -24.35486602783203, "global_step": 215903, "epoch": 2601} {"train_loss": -24.08041000366211, "global_step": 215904, "epoch": 2601} {"train_loss": -23.753061294555664, "global_step": 215905, "epoch": 2601} {"train_loss": -24.319992065429688, "global_step": 215906, "epoch": 2601} {"train_loss": -24.28734016418457, "global_step": 215907, "epoch": 2601} {"train_loss": -24.2609806060791, "global_step": 215908, "epoch": 2601} {"train_loss": -24.370779037475586, "global_step": 215909, "epoch": 2601} {"train_loss": -24.53208351135254, "global_step": 215910, "epoch": 2601} {"train_loss": -24.431602478027344, "global_step": 215911, "epoch": 2601} {"train_loss": -24.476043701171875, "global_step": 215912, "epoch": 2601} {"train_loss": -24.713537216186523, "global_step": 215913, "epoch": 2601} {"train_loss": -24.734769821166992, "global_step": 215914, "epoch": 2601} {"train_loss": -24.825576782226562, "global_step": 215915, "epoch": 2601} {"train_loss": -24.318761825561523, "global_step": 215916, "epoch": 2601} {"train_loss": -24.39693260192871, "global_step": 215917, "epoch": 2601} {"train_loss": -24.451175689697266, "global_step": 215918, "epoch": 2601} {"train_loss": -24.432117462158203, "global_step": 215919, "epoch": 2601} {"train_loss": -24.255020141601562, "global_step": 215920, "epoch": 2601} {"train_loss": -24.402685165405273, "global_step": 215921, "epoch": 2601} {"train_loss": -24.38922119140625, "global_step": 215922, "epoch": 2601} {"train_loss": -24.57280921936035, "global_step": 215923, "epoch": 2601} {"train_loss": -24.851713180541992, "global_step": 215924, "epoch": 2601} {"train_loss": -24.303802490234375, "global_step": 215925, "epoch": 2601} {"train_loss": -24.3974552154541, "global_step": 215926, "epoch": 2601} {"train_loss": -24.41633415222168, "global_step": 215927, "epoch": 2601} {"train_loss": -24.20216941833496, "global_step": 215928, "epoch": 2601} {"train_loss": -24.349607467651367, "global_step": 215929, "epoch": 2601} {"train_loss": -24.647567749023438, "global_step": 215930, "epoch": 2601} {"train_loss": -24.674640655517578, "global_step": 215931, "epoch": 2601} {"train_loss": -24.538366317749023, "global_step": 215932, "epoch": 2601} {"train_loss": -24.339323043823242, "global_step": 215933, "epoch": 2601} {"train_loss": -24.47944450378418, "global_step": 215934, "epoch": 2601} {"train_loss": -24.85431480407715, "global_step": 215935, "epoch": 2601} {"train_loss": -24.747989654541016, "global_step": 215936, "epoch": 2601} {"train_loss": -24.319866180419922, "global_step": 215937, "epoch": 2601} {"train_loss": -24.708345413208008, "global_step": 215938, "epoch": 2601} {"train_loss": -24.4710693359375, "global_step": 215939, "epoch": 2601} {"train_loss": -24.442060470581055, "global_step": 215940, "epoch": 2601} {"train_loss": -24.20215606689453, "global_step": 215941, "epoch": 2601} {"train_loss": -24.4464168548584, "global_step": 215942, "epoch": 2601} {"train_loss": -24.816110610961914, "global_step": 215943, "epoch": 2601} {"train_loss": -24.589691162109375, "global_step": 215944, "epoch": 2601} {"train_loss": -24.38948631286621, "global_step": 215945, "epoch": 2601} {"train_loss": -24.874956130981445, "global_step": 215946, "epoch": 2601} {"train_loss": -24.150619506835938, "global_step": 215947, "epoch": 2601} {"train_loss": -24.495361328125, "global_step": 215948, "epoch": 2601} {"train_loss": -24.499155044555664, "global_step": 215949, "epoch": 2601} {"train_loss": -24.791654586791992, "global_step": 215950, "epoch": 2601} {"train_loss": -24.514873504638672, "global_step": 215951, "epoch": 2601} {"train_loss": -24.317340850830078, "global_step": 215952, "epoch": 2601} {"train_loss": -24.55173110961914, "global_step": 215953, "epoch": 2601} {"train_loss": -24.902374267578125, "global_step": 215954, "epoch": 2601} {"train_loss": -24.26287841796875, "global_step": 215955, "epoch": 2601} {"train_loss": -24.704320907592773, "global_step": 215956, "epoch": 2601} {"train_loss": -24.872045516967773, "global_step": 215957, "epoch": 2601} {"train_loss": -24.737932205200195, "global_step": 215958, "epoch": 2601} {"train_loss": -24.747716903686523, "global_step": 215959, "epoch": 2601} {"train_loss": -24.85548973083496, "global_step": 215960, "epoch": 2601} {"train_loss": -24.759769439697266, "global_step": 215961, "epoch": 2601} {"train_loss": -24.056005477905273, "global_step": 215962, "epoch": 2601} {"train_loss": -24.267742156982422, "global_step": 215963, "epoch": 2601} {"train_loss": -24.628843307495117, "global_step": 215964, "epoch": 2601} {"train_loss": -24.39781763467444, "global_step": 215965, "epoch": 2601, "val_loss": 6625675.0} {"train_loss": -24.400659561157227, "global_step": 215966, "epoch": 2602} {"train_loss": -24.15815544128418, "global_step": 215967, "epoch": 2602} {"train_loss": -24.1455135345459, "global_step": 215968, "epoch": 2602} {"train_loss": -24.344688415527344, "global_step": 215969, "epoch": 2602} {"train_loss": -24.49781608581543, "global_step": 215970, "epoch": 2602} {"train_loss": -24.383760452270508, "global_step": 215971, "epoch": 2602} {"train_loss": -24.31988525390625, "global_step": 215972, "epoch": 2602} {"train_loss": -24.44148826599121, "global_step": 215973, "epoch": 2602} {"train_loss": -24.207983016967773, "global_step": 215974, "epoch": 2602} {"train_loss": -24.36163330078125, "global_step": 215975, "epoch": 2602} {"train_loss": -24.379776000976562, "global_step": 215976, "epoch": 2602} {"train_loss": -24.635587692260742, "global_step": 215977, "epoch": 2602} {"train_loss": -24.593713760375977, "global_step": 215978, "epoch": 2602} {"train_loss": -24.796207427978516, "global_step": 215979, "epoch": 2602} {"train_loss": -24.53993797302246, "global_step": 215980, "epoch": 2602} {"train_loss": -24.4980525970459, "global_step": 215981, "epoch": 2602} {"train_loss": -24.530624389648438, "global_step": 215982, "epoch": 2602} {"train_loss": -24.810697555541992, "global_step": 215983, "epoch": 2602} {"train_loss": -24.81268882751465, "global_step": 215984, "epoch": 2602} {"train_loss": -24.34608268737793, "global_step": 215985, "epoch": 2602} {"train_loss": -24.653106689453125, "global_step": 215986, "epoch": 2602} {"train_loss": -24.80573844909668, "global_step": 215987, "epoch": 2602} {"train_loss": -24.485855102539062, "global_step": 215988, "epoch": 2602} {"train_loss": -24.450576782226562, "global_step": 215989, "epoch": 2602} {"train_loss": -24.636850357055664, "global_step": 215990, "epoch": 2602} {"train_loss": -24.59865379333496, "global_step": 215991, "epoch": 2602} {"train_loss": -24.14543342590332, "global_step": 215992, "epoch": 2602} {"train_loss": -24.748106002807617, "global_step": 215993, "epoch": 2602} {"train_loss": -24.40555763244629, "global_step": 215994, "epoch": 2602} {"train_loss": -23.96890640258789, "global_step": 215995, "epoch": 2602} {"train_loss": -23.94162368774414, "global_step": 215996, "epoch": 2602} {"train_loss": -24.401620864868164, "global_step": 215997, "epoch": 2602} {"train_loss": -24.170520782470703, "global_step": 215998, "epoch": 2602} {"train_loss": -24.88623046875, "global_step": 215999, "epoch": 2602} {"train_loss": -24.632003784179688, "global_step": 216000, "epoch": 2602} {"train_loss": -24.364269256591797, "global_step": 216001, "epoch": 2602} {"train_loss": -24.505786895751953, "global_step": 216002, "epoch": 2602} {"train_loss": -24.39002799987793, "global_step": 216003, "epoch": 2602} {"train_loss": -24.159915924072266, "global_step": 216004, "epoch": 2602} {"train_loss": -24.579914093017578, "global_step": 216005, "epoch": 2602} {"train_loss": -24.427968978881836, "global_step": 216006, "epoch": 2602} {"train_loss": -24.62439727783203, "global_step": 216007, "epoch": 2602} {"train_loss": -24.823328018188477, "global_step": 216008, "epoch": 2602} {"train_loss": -24.474950790405273, "global_step": 216009, "epoch": 2602} {"train_loss": -24.50101089477539, "global_step": 216010, "epoch": 2602} {"train_loss": -24.513450622558594, "global_step": 216011, "epoch": 2602} {"train_loss": -24.952585220336914, "global_step": 216012, "epoch": 2602} {"train_loss": -24.863256454467773, "global_step": 216013, "epoch": 2602} {"train_loss": -24.513456344604492, "global_step": 216014, "epoch": 2602} {"train_loss": -24.505212783813477, "global_step": 216015, "epoch": 2602} {"train_loss": -24.22968864440918, "global_step": 216016, "epoch": 2602} {"train_loss": -24.64681053161621, "global_step": 216017, "epoch": 2602} {"train_loss": -24.54306983947754, "global_step": 216018, "epoch": 2602} {"train_loss": -24.432050704956055, "global_step": 216019, "epoch": 2602} {"train_loss": -25.040250778198242, "global_step": 216020, "epoch": 2602} {"train_loss": -24.56943130493164, "global_step": 216021, "epoch": 2602} {"train_loss": -24.441787719726562, "global_step": 216022, "epoch": 2602} {"train_loss": -24.65472412109375, "global_step": 216023, "epoch": 2602} {"train_loss": -24.2467041015625, "global_step": 216024, "epoch": 2602} {"train_loss": -24.560331344604492, "global_step": 216025, "epoch": 2602} {"train_loss": -24.358041763305664, "global_step": 216026, "epoch": 2602} {"train_loss": -24.273099899291992, "global_step": 216027, "epoch": 2602} {"train_loss": -24.100080490112305, "global_step": 216028, "epoch": 2602} {"train_loss": -24.754133224487305, "global_step": 216029, "epoch": 2602} {"train_loss": -24.4311466217041, "global_step": 216030, "epoch": 2602} {"train_loss": -24.400171279907227, "global_step": 216031, "epoch": 2602} {"train_loss": -24.59732437133789, "global_step": 216032, "epoch": 2602} {"train_loss": -24.39362144470215, "global_step": 216033, "epoch": 2602} {"train_loss": -24.849355697631836, "global_step": 216034, "epoch": 2602} {"train_loss": -24.64546775817871, "global_step": 216035, "epoch": 2602} {"train_loss": -24.508575439453125, "global_step": 216036, "epoch": 2602} {"train_loss": -24.296741485595703, "global_step": 216037, "epoch": 2602} {"train_loss": -24.53482437133789, "global_step": 216038, "epoch": 2602} {"train_loss": -24.40932273864746, "global_step": 216039, "epoch": 2602} {"train_loss": -24.333765029907227, "global_step": 216040, "epoch": 2602} {"train_loss": -24.669048309326172, "global_step": 216041, "epoch": 2602} {"train_loss": -24.923648834228516, "global_step": 216042, "epoch": 2602} {"train_loss": -24.579540252685547, "global_step": 216043, "epoch": 2602} {"train_loss": -24.575401306152344, "global_step": 216044, "epoch": 2602} {"train_loss": -24.68524169921875, "global_step": 216045, "epoch": 2602} {"train_loss": -24.187841415405273, "global_step": 216046, "epoch": 2602} {"train_loss": -24.589651107788086, "global_step": 216047, "epoch": 2602} {"train_loss": -24.493618861738458, "global_step": 216048, "epoch": 2602, "val_loss": 6649101.0} {"train_loss": -24.349830627441406, "global_step": 216049, "epoch": 2603} {"train_loss": -23.936735153198242, "global_step": 216050, "epoch": 2603} {"train_loss": -24.242599487304688, "global_step": 216051, "epoch": 2603} {"train_loss": -24.0474910736084, "global_step": 216052, "epoch": 2603} {"train_loss": -24.01486587524414, "global_step": 216053, "epoch": 2603} {"train_loss": -23.95574188232422, "global_step": 216054, "epoch": 2603} {"train_loss": -24.18238639831543, "global_step": 216055, "epoch": 2603} {"train_loss": -24.351478576660156, "global_step": 216056, "epoch": 2603} {"train_loss": -23.6685848236084, "global_step": 216057, "epoch": 2603} {"train_loss": -24.194793701171875, "global_step": 216058, "epoch": 2603} {"train_loss": -24.003055572509766, "global_step": 216059, "epoch": 2603} {"train_loss": -23.801313400268555, "global_step": 216060, "epoch": 2603} {"train_loss": -24.4000301361084, "global_step": 216061, "epoch": 2603} {"train_loss": -24.585485458374023, "global_step": 216062, "epoch": 2603} {"train_loss": -24.396520614624023, "global_step": 216063, "epoch": 2603} {"train_loss": -24.296064376831055, "global_step": 216064, "epoch": 2603} {"train_loss": -24.16229248046875, "global_step": 216065, "epoch": 2603} {"train_loss": -24.513551712036133, "global_step": 216066, "epoch": 2603} {"train_loss": -24.4636287689209, "global_step": 216067, "epoch": 2603} {"train_loss": -24.720075607299805, "global_step": 216068, "epoch": 2603} {"train_loss": -24.390155792236328, "global_step": 216069, "epoch": 2603} {"train_loss": -24.84559440612793, "global_step": 216070, "epoch": 2603} {"train_loss": -24.00558853149414, "global_step": 216071, "epoch": 2603} {"train_loss": -24.39661407470703, "global_step": 216072, "epoch": 2603} {"train_loss": -24.186697006225586, "global_step": 216073, "epoch": 2603} {"train_loss": -24.54266357421875, "global_step": 216074, "epoch": 2603} {"train_loss": -24.36687660217285, "global_step": 216075, "epoch": 2603} {"train_loss": -24.612279891967773, "global_step": 216076, "epoch": 2603} {"train_loss": -24.780750274658203, "global_step": 216077, "epoch": 2603} {"train_loss": -24.75876235961914, "global_step": 216078, "epoch": 2603} {"train_loss": -24.532075881958008, "global_step": 216079, "epoch": 2603} {"train_loss": -24.31121253967285, "global_step": 216080, "epoch": 2603} {"train_loss": -24.812374114990234, "global_step": 216081, "epoch": 2603} {"train_loss": -24.684459686279297, "global_step": 216082, "epoch": 2603} {"train_loss": -24.765274047851562, "global_step": 216083, "epoch": 2603} {"train_loss": -24.528255462646484, "global_step": 216084, "epoch": 2603} {"train_loss": -25.171293258666992, "global_step": 216085, "epoch": 2603} {"train_loss": -24.34370231628418, "global_step": 216086, "epoch": 2603} {"train_loss": -24.13152503967285, "global_step": 216087, "epoch": 2603} {"train_loss": -24.44998550415039, "global_step": 216088, "epoch": 2603} {"train_loss": -24.448596954345703, "global_step": 216089, "epoch": 2603} {"train_loss": -24.35578155517578, "global_step": 216090, "epoch": 2603} {"train_loss": -24.499685287475586, "global_step": 216091, "epoch": 2603} {"train_loss": -24.213333129882812, "global_step": 216092, "epoch": 2603} {"train_loss": -24.77594566345215, "global_step": 216093, "epoch": 2603} {"train_loss": -24.613300323486328, "global_step": 216094, "epoch": 2603} {"train_loss": -24.178823471069336, "global_step": 216095, "epoch": 2603} {"train_loss": -24.462411880493164, "global_step": 216096, "epoch": 2603} {"train_loss": -24.97960662841797, "global_step": 216097, "epoch": 2603} {"train_loss": -24.457275390625, "global_step": 216098, "epoch": 2603} {"train_loss": -24.486181259155273, "global_step": 216099, "epoch": 2603} {"train_loss": -24.57950210571289, "global_step": 216100, "epoch": 2603} {"train_loss": -24.67635154724121, "global_step": 216101, "epoch": 2603} {"train_loss": -24.63825225830078, "global_step": 216102, "epoch": 2603} {"train_loss": -24.626901626586914, "global_step": 216103, "epoch": 2603} {"train_loss": -24.434606552124023, "global_step": 216104, "epoch": 2603} {"train_loss": -24.691755294799805, "global_step": 216105, "epoch": 2603} {"train_loss": -24.52332878112793, "global_step": 216106, "epoch": 2603} {"train_loss": -24.61175537109375, "global_step": 216107, "epoch": 2603} {"train_loss": -24.593759536743164, "global_step": 216108, "epoch": 2603} {"train_loss": -24.40824317932129, "global_step": 216109, "epoch": 2603} {"train_loss": -24.279754638671875, "global_step": 216110, "epoch": 2603} {"train_loss": -24.12563705444336, "global_step": 216111, "epoch": 2603} {"train_loss": -23.99160385131836, "global_step": 216112, "epoch": 2603} {"train_loss": -24.270999908447266, "global_step": 216113, "epoch": 2603} {"train_loss": -24.57398796081543, "global_step": 216114, "epoch": 2603} {"train_loss": -24.78835105895996, "global_step": 216115, "epoch": 2603} {"train_loss": -24.490211486816406, "global_step": 216116, "epoch": 2603} {"train_loss": -24.52998161315918, "global_step": 216117, "epoch": 2603} {"train_loss": -24.669309616088867, "global_step": 216118, "epoch": 2603} {"train_loss": -24.69856071472168, "global_step": 216119, "epoch": 2603} {"train_loss": -24.66908073425293, "global_step": 216120, "epoch": 2603} {"train_loss": -24.757476806640625, "global_step": 216121, "epoch": 2603} {"train_loss": -24.928390502929688, "global_step": 216122, "epoch": 2603} {"train_loss": -24.487041473388672, "global_step": 216123, "epoch": 2603} {"train_loss": -24.373031616210938, "global_step": 216124, "epoch": 2603} {"train_loss": -24.341703414916992, "global_step": 216125, "epoch": 2603} {"train_loss": -24.499723434448242, "global_step": 216126, "epoch": 2603} {"train_loss": -24.996986389160156, "global_step": 216127, "epoch": 2603} {"train_loss": -24.72381019592285, "global_step": 216128, "epoch": 2603} {"train_loss": -24.34478759765625, "global_step": 216129, "epoch": 2603} {"train_loss": -24.41913414001465, "global_step": 216130, "epoch": 2603} {"train_loss": -24.447675406214703, "global_step": 216131, "epoch": 2603, "val_loss": 6710904.0} {"train_loss": -24.280576705932617, "global_step": 216132, "epoch": 2604} {"train_loss": -24.0736141204834, "global_step": 216133, "epoch": 2604} {"train_loss": -24.29086685180664, "global_step": 216134, "epoch": 2604} {"train_loss": -24.203266143798828, "global_step": 216135, "epoch": 2604} {"train_loss": -24.534399032592773, "global_step": 216136, "epoch": 2604} {"train_loss": -24.784591674804688, "global_step": 216137, "epoch": 2604} {"train_loss": -24.591238021850586, "global_step": 216138, "epoch": 2604} {"train_loss": -24.585752487182617, "global_step": 216139, "epoch": 2604} {"train_loss": -24.53737449645996, "global_step": 216140, "epoch": 2604} {"train_loss": -24.40034294128418, "global_step": 216141, "epoch": 2604} {"train_loss": -24.645538330078125, "global_step": 216142, "epoch": 2604} {"train_loss": -24.44099235534668, "global_step": 216143, "epoch": 2604} {"train_loss": -24.24833869934082, "global_step": 216144, "epoch": 2604} {"train_loss": -24.9998722076416, "global_step": 216145, "epoch": 2604} {"train_loss": -24.748937606811523, "global_step": 216146, "epoch": 2604} {"train_loss": -24.406845092773438, "global_step": 216147, "epoch": 2604} {"train_loss": -24.288068771362305, "global_step": 216148, "epoch": 2604} {"train_loss": -24.610830307006836, "global_step": 216149, "epoch": 2604} {"train_loss": -23.926525115966797, "global_step": 216150, "epoch": 2604} {"train_loss": -24.00132942199707, "global_step": 216151, "epoch": 2604} {"train_loss": -23.692873001098633, "global_step": 216152, "epoch": 2604} {"train_loss": -24.227066040039062, "global_step": 216153, "epoch": 2604} {"train_loss": -23.857084274291992, "global_step": 216154, "epoch": 2604} {"train_loss": -23.840011596679688, "global_step": 216155, "epoch": 2604} {"train_loss": -23.87180519104004, "global_step": 216156, "epoch": 2604} {"train_loss": -23.811508178710938, "global_step": 216157, "epoch": 2604} {"train_loss": -24.051319122314453, "global_step": 216158, "epoch": 2604} {"train_loss": -24.062185287475586, "global_step": 216159, "epoch": 2604} {"train_loss": -24.121747970581055, "global_step": 216160, "epoch": 2604} {"train_loss": -23.923402786254883, "global_step": 216161, "epoch": 2604} {"train_loss": -24.31026268005371, "global_step": 216162, "epoch": 2604} {"train_loss": -24.353771209716797, "global_step": 216163, "epoch": 2604} {"train_loss": -24.34018898010254, "global_step": 216164, "epoch": 2604} {"train_loss": -24.408042907714844, "global_step": 216165, "epoch": 2604} {"train_loss": -24.63254165649414, "global_step": 216166, "epoch": 2604} {"train_loss": -24.785205841064453, "global_step": 216167, "epoch": 2604} {"train_loss": -24.336212158203125, "global_step": 216168, "epoch": 2604} {"train_loss": -24.581769943237305, "global_step": 216169, "epoch": 2604} {"train_loss": -24.767065048217773, "global_step": 216170, "epoch": 2604} {"train_loss": -24.73208999633789, "global_step": 216171, "epoch": 2604} {"train_loss": -24.21578598022461, "global_step": 216172, "epoch": 2604} {"train_loss": -24.86899185180664, "global_step": 216173, "epoch": 2604} {"train_loss": -24.534650802612305, "global_step": 216174, "epoch": 2604} {"train_loss": -24.656461715698242, "global_step": 216175, "epoch": 2604} {"train_loss": -24.724761962890625, "global_step": 216176, "epoch": 2604} {"train_loss": -24.5784969329834, "global_step": 216177, "epoch": 2604} {"train_loss": -25.040287017822266, "global_step": 216178, "epoch": 2604} {"train_loss": -24.52393341064453, "global_step": 216179, "epoch": 2604} {"train_loss": -24.25433921813965, "global_step": 216180, "epoch": 2604} {"train_loss": -24.564695358276367, "global_step": 216181, "epoch": 2604} {"train_loss": -24.892696380615234, "global_step": 216182, "epoch": 2604} {"train_loss": -24.92848014831543, "global_step": 216183, "epoch": 2604} {"train_loss": -24.378416061401367, "global_step": 216184, "epoch": 2604} {"train_loss": -24.6229190826416, "global_step": 216185, "epoch": 2604} {"train_loss": -24.378576278686523, "global_step": 216186, "epoch": 2604} {"train_loss": -24.832721710205078, "global_step": 216187, "epoch": 2604} {"train_loss": -24.769521713256836, "global_step": 216188, "epoch": 2604} {"train_loss": -24.806394577026367, "global_step": 216189, "epoch": 2604} {"train_loss": -24.372222900390625, "global_step": 216190, "epoch": 2604} {"train_loss": -24.63221549987793, "global_step": 216191, "epoch": 2604} {"train_loss": -24.648731231689453, "global_step": 216192, "epoch": 2604} {"train_loss": -24.561647415161133, "global_step": 216193, "epoch": 2604} {"train_loss": -24.41827392578125, "global_step": 216194, "epoch": 2604} {"train_loss": -24.558713912963867, "global_step": 216195, "epoch": 2604} {"train_loss": -24.102033615112305, "global_step": 216196, "epoch": 2604} {"train_loss": -23.5921688079834, "global_step": 216197, "epoch": 2604} {"train_loss": -23.766822814941406, "global_step": 216198, "epoch": 2604} {"train_loss": -24.76900291442871, "global_step": 216199, "epoch": 2604} {"train_loss": -24.36970329284668, "global_step": 216200, "epoch": 2604} {"train_loss": -24.1264705657959, "global_step": 216201, "epoch": 2604} {"train_loss": -24.3491268157959, "global_step": 216202, "epoch": 2604} {"train_loss": -24.491867065429688, "global_step": 216203, "epoch": 2604} {"train_loss": -24.925039291381836, "global_step": 216204, "epoch": 2604} {"train_loss": -24.124311447143555, "global_step": 216205, "epoch": 2604} {"train_loss": -24.77277374267578, "global_step": 216206, "epoch": 2604} {"train_loss": -24.569068908691406, "global_step": 216207, "epoch": 2604} {"train_loss": -24.259817123413086, "global_step": 216208, "epoch": 2604} {"train_loss": -24.335918426513672, "global_step": 216209, "epoch": 2604} {"train_loss": -24.729040145874023, "global_step": 216210, "epoch": 2604} {"train_loss": -24.674848556518555, "global_step": 216211, "epoch": 2604} {"train_loss": -24.755666732788086, "global_step": 216212, "epoch": 2604} {"train_loss": -24.426950454711914, "global_step": 216213, "epoch": 2604} {"train_loss": -24.430921462645014, "global_step": 216214, "epoch": 2604, "val_loss": 6554457.0} {"train_loss": -24.381223678588867, "global_step": 216215, "epoch": 2605} {"train_loss": -24.105541229248047, "global_step": 216216, "epoch": 2605} {"train_loss": -24.331953048706055, "global_step": 216217, "epoch": 2605} {"train_loss": -24.117919921875, "global_step": 216218, "epoch": 2605} {"train_loss": -24.368999481201172, "global_step": 216219, "epoch": 2605} {"train_loss": -24.618484497070312, "global_step": 216220, "epoch": 2605} {"train_loss": -24.64700698852539, "global_step": 216221, "epoch": 2605} {"train_loss": -24.627187728881836, "global_step": 216222, "epoch": 2605} {"train_loss": -24.497678756713867, "global_step": 216223, "epoch": 2605} {"train_loss": -24.45432472229004, "global_step": 216224, "epoch": 2605} {"train_loss": -24.65089988708496, "global_step": 216225, "epoch": 2605} {"train_loss": -24.870222091674805, "global_step": 216226, "epoch": 2605} {"train_loss": -24.47734832763672, "global_step": 216227, "epoch": 2605} {"train_loss": -24.49456214904785, "global_step": 216228, "epoch": 2605} {"train_loss": -24.54053497314453, "global_step": 216229, "epoch": 2605} {"train_loss": -24.588909149169922, "global_step": 216230, "epoch": 2605} {"train_loss": -24.625593185424805, "global_step": 216231, "epoch": 2605} {"train_loss": -24.54029655456543, "global_step": 216232, "epoch": 2605} {"train_loss": -24.450468063354492, "global_step": 216233, "epoch": 2605} {"train_loss": -24.606794357299805, "global_step": 216234, "epoch": 2605} {"train_loss": -24.59317970275879, "global_step": 216235, "epoch": 2605} {"train_loss": -24.613601684570312, "global_step": 216236, "epoch": 2605} {"train_loss": -24.472991943359375, "global_step": 216237, "epoch": 2605} {"train_loss": -24.615707397460938, "global_step": 216238, "epoch": 2605} {"train_loss": -24.691730499267578, "global_step": 216239, "epoch": 2605} {"train_loss": -24.7822322845459, "global_step": 216240, "epoch": 2605} {"train_loss": -24.68414306640625, "global_step": 216241, "epoch": 2605} {"train_loss": -24.509151458740234, "global_step": 216242, "epoch": 2605} {"train_loss": -24.461713790893555, "global_step": 216243, "epoch": 2605} {"train_loss": -24.892581939697266, "global_step": 216244, "epoch": 2605} {"train_loss": -24.6691837310791, "global_step": 216245, "epoch": 2605} {"train_loss": -24.73101806640625, "global_step": 216246, "epoch": 2605} {"train_loss": -24.66596031188965, "global_step": 216247, "epoch": 2605} {"train_loss": -24.790273666381836, "global_step": 216248, "epoch": 2605} {"train_loss": -24.752412796020508, "global_step": 216249, "epoch": 2605} {"train_loss": -24.525375366210938, "global_step": 216250, "epoch": 2605} {"train_loss": -24.569385528564453, "global_step": 216251, "epoch": 2605} {"train_loss": -24.16655921936035, "global_step": 216252, "epoch": 2605} {"train_loss": -24.384010314941406, "global_step": 216253, "epoch": 2605} {"train_loss": -24.32366371154785, "global_step": 216254, "epoch": 2605} {"train_loss": -24.906312942504883, "global_step": 216255, "epoch": 2605} {"train_loss": -24.09099769592285, "global_step": 216256, "epoch": 2605} {"train_loss": -24.709739685058594, "global_step": 216257, "epoch": 2605} {"train_loss": -24.767850875854492, "global_step": 216258, "epoch": 2605} {"train_loss": -24.959291458129883, "global_step": 216259, "epoch": 2605} {"train_loss": -24.813451766967773, "global_step": 216260, "epoch": 2605} {"train_loss": -25.20804214477539, "global_step": 216261, "epoch": 2605} {"train_loss": -24.79658317565918, "global_step": 216262, "epoch": 2605} {"train_loss": -24.766576766967773, "global_step": 216263, "epoch": 2605} {"train_loss": -24.65791130065918, "global_step": 216264, "epoch": 2605} {"train_loss": -24.2287654876709, "global_step": 216265, "epoch": 2605} {"train_loss": -24.543296813964844, "global_step": 216266, "epoch": 2605} {"train_loss": -24.58974266052246, "global_step": 216267, "epoch": 2605} {"train_loss": -24.690412521362305, "global_step": 216268, "epoch": 2605} {"train_loss": -24.516931533813477, "global_step": 216269, "epoch": 2605} {"train_loss": -24.589893341064453, "global_step": 216270, "epoch": 2605} {"train_loss": -24.791339874267578, "global_step": 216271, "epoch": 2605} {"train_loss": -24.59381103515625, "global_step": 216272, "epoch": 2605} {"train_loss": -24.807443618774414, "global_step": 216273, "epoch": 2605} {"train_loss": -24.545053482055664, "global_step": 216274, "epoch": 2605} {"train_loss": -24.589344024658203, "global_step": 216275, "epoch": 2605} {"train_loss": -24.746959686279297, "global_step": 216276, "epoch": 2605} {"train_loss": -25.1439266204834, "global_step": 216277, "epoch": 2605} {"train_loss": -24.117679595947266, "global_step": 216278, "epoch": 2605} {"train_loss": -24.740856170654297, "global_step": 216279, "epoch": 2605} {"train_loss": -24.604764938354492, "global_step": 216280, "epoch": 2605} {"train_loss": -24.47919273376465, "global_step": 216281, "epoch": 2605} {"train_loss": -24.788976669311523, "global_step": 216282, "epoch": 2605} {"train_loss": -24.670093536376953, "global_step": 216283, "epoch": 2605} {"train_loss": -24.513608932495117, "global_step": 216284, "epoch": 2605} {"train_loss": -24.696857452392578, "global_step": 216285, "epoch": 2605} {"train_loss": -24.484973907470703, "global_step": 216286, "epoch": 2605} {"train_loss": -24.396825790405273, "global_step": 216287, "epoch": 2605} {"train_loss": -24.296995162963867, "global_step": 216288, "epoch": 2605} {"train_loss": -24.64723777770996, "global_step": 216289, "epoch": 2605} {"train_loss": -24.62276268005371, "global_step": 216290, "epoch": 2605} {"train_loss": -24.674697875976562, "global_step": 216291, "epoch": 2605} {"train_loss": -24.289794921875, "global_step": 216292, "epoch": 2605} {"train_loss": -24.49959373474121, "global_step": 216293, "epoch": 2605} {"train_loss": -24.591419219970703, "global_step": 216294, "epoch": 2605} {"train_loss": -24.590234756469727, "global_step": 216295, "epoch": 2605} {"train_loss": -24.30780601501465, "global_step": 216296, "epoch": 2605} {"train_loss": -24.574656842702844, "global_step": 216297, "epoch": 2605, "val_loss": 6662638.5} {"train_loss": -23.55861473083496, "global_step": 216298, "epoch": 2606} {"train_loss": -22.39198875427246, "global_step": 216299, "epoch": 2606} {"train_loss": -23.236963272094727, "global_step": 216300, "epoch": 2606} {"train_loss": -23.602781295776367, "global_step": 216301, "epoch": 2606} {"train_loss": -23.3209285736084, "global_step": 216302, "epoch": 2606} {"train_loss": -23.836374282836914, "global_step": 216303, "epoch": 2606} {"train_loss": -23.594350814819336, "global_step": 216304, "epoch": 2606} {"train_loss": -23.4886474609375, "global_step": 216305, "epoch": 2606} {"train_loss": -23.906349182128906, "global_step": 216306, "epoch": 2606} {"train_loss": -23.70404052734375, "global_step": 216307, "epoch": 2606} {"train_loss": -24.195650100708008, "global_step": 216308, "epoch": 2606} {"train_loss": -24.0493221282959, "global_step": 216309, "epoch": 2606} {"train_loss": -23.957548141479492, "global_step": 216310, "epoch": 2606} {"train_loss": -23.767980575561523, "global_step": 216311, "epoch": 2606} {"train_loss": -23.68619155883789, "global_step": 216312, "epoch": 2606} {"train_loss": -24.373910903930664, "global_step": 216313, "epoch": 2606} {"train_loss": -24.12064552307129, "global_step": 216314, "epoch": 2606} {"train_loss": -24.2386531829834, "global_step": 216315, "epoch": 2606} {"train_loss": -24.42951774597168, "global_step": 216316, "epoch": 2606} {"train_loss": -23.719995498657227, "global_step": 216317, "epoch": 2606} {"train_loss": -24.234792709350586, "global_step": 216318, "epoch": 2606} {"train_loss": -24.268741607666016, "global_step": 216319, "epoch": 2606} {"train_loss": -24.231142044067383, "global_step": 216320, "epoch": 2606} {"train_loss": -24.03485679626465, "global_step": 216321, "epoch": 2606} {"train_loss": -24.387617111206055, "global_step": 216322, "epoch": 2606} {"train_loss": -24.10336685180664, "global_step": 216323, "epoch": 2606} {"train_loss": -24.02644157409668, "global_step": 216324, "epoch": 2606} {"train_loss": -24.413848876953125, "global_step": 216325, "epoch": 2606} {"train_loss": -24.52092170715332, "global_step": 216326, "epoch": 2606} {"train_loss": -24.526071548461914, "global_step": 216327, "epoch": 2606} {"train_loss": -24.161569595336914, "global_step": 216328, "epoch": 2606} {"train_loss": -24.6002254486084, "global_step": 216329, "epoch": 2606} {"train_loss": -24.66164207458496, "global_step": 216330, "epoch": 2606} {"train_loss": -24.44659996032715, "global_step": 216331, "epoch": 2606} {"train_loss": -25.00838279724121, "global_step": 216332, "epoch": 2606} {"train_loss": -24.45000648498535, "global_step": 216333, "epoch": 2606} {"train_loss": -24.460895538330078, "global_step": 216334, "epoch": 2606} {"train_loss": -24.463815689086914, "global_step": 216335, "epoch": 2606} {"train_loss": -24.50630760192871, "global_step": 216336, "epoch": 2606} {"train_loss": -24.673254013061523, "global_step": 216337, "epoch": 2606} {"train_loss": -24.2236328125, "global_step": 216338, "epoch": 2606} {"train_loss": -24.601648330688477, "global_step": 216339, "epoch": 2606} {"train_loss": -24.806917190551758, "global_step": 216340, "epoch": 2606} {"train_loss": -24.44464683532715, "global_step": 216341, "epoch": 2606} {"train_loss": -24.275110244750977, "global_step": 216342, "epoch": 2606} {"train_loss": -24.229501724243164, "global_step": 216343, "epoch": 2606} {"train_loss": -24.963895797729492, "global_step": 216344, "epoch": 2606} {"train_loss": -24.4670467376709, "global_step": 216345, "epoch": 2606} {"train_loss": -24.5062313079834, "global_step": 216346, "epoch": 2606} {"train_loss": -24.611186981201172, "global_step": 216347, "epoch": 2606} {"train_loss": -23.990951538085938, "global_step": 216348, "epoch": 2606} {"train_loss": -24.599855422973633, "global_step": 216349, "epoch": 2606} {"train_loss": -24.216428756713867, "global_step": 216350, "epoch": 2606} {"train_loss": -24.54296875, "global_step": 216351, "epoch": 2606} {"train_loss": -24.435129165649414, "global_step": 216352, "epoch": 2606} {"train_loss": -24.549930572509766, "global_step": 216353, "epoch": 2606} {"train_loss": -24.03896141052246, "global_step": 216354, "epoch": 2606} {"train_loss": -24.19009780883789, "global_step": 216355, "epoch": 2606} {"train_loss": -24.35173988342285, "global_step": 216356, "epoch": 2606} {"train_loss": -24.38348960876465, "global_step": 216357, "epoch": 2606} {"train_loss": -24.50670623779297, "global_step": 216358, "epoch": 2606} {"train_loss": -24.145200729370117, "global_step": 216359, "epoch": 2606} {"train_loss": -24.124500274658203, "global_step": 216360, "epoch": 2606} {"train_loss": -24.728235244750977, "global_step": 216361, "epoch": 2606} {"train_loss": -24.03176498413086, "global_step": 216362, "epoch": 2606} {"train_loss": -24.437971115112305, "global_step": 216363, "epoch": 2606} {"train_loss": -24.346105575561523, "global_step": 216364, "epoch": 2606} {"train_loss": -24.51503562927246, "global_step": 216365, "epoch": 2606} {"train_loss": -24.264272689819336, "global_step": 216366, "epoch": 2606} {"train_loss": -24.812150955200195, "global_step": 216367, "epoch": 2606} {"train_loss": -24.23609161376953, "global_step": 216368, "epoch": 2606} {"train_loss": -24.215024948120117, "global_step": 216369, "epoch": 2606} {"train_loss": -24.479660034179688, "global_step": 216370, "epoch": 2606} {"train_loss": -24.58806800842285, "global_step": 216371, "epoch": 2606} {"train_loss": -24.272869110107422, "global_step": 216372, "epoch": 2606} {"train_loss": -24.367218017578125, "global_step": 216373, "epoch": 2606} {"train_loss": -24.50079345703125, "global_step": 216374, "epoch": 2606} {"train_loss": -24.112586975097656, "global_step": 216375, "epoch": 2606} {"train_loss": -24.821521759033203, "global_step": 216376, "epoch": 2606} {"train_loss": -24.598012924194336, "global_step": 216377, "epoch": 2606} {"train_loss": -24.059551239013672, "global_step": 216378, "epoch": 2606} {"train_loss": -25.038471221923828, "global_step": 216379, "epoch": 2606} {"train_loss": -24.247240434209985, "global_step": 216380, "epoch": 2606, "val_loss": 6655842.0} {"train_loss": -23.328779220581055, "global_step": 216381, "epoch": 2607} {"train_loss": -23.62546157836914, "global_step": 216382, "epoch": 2607} {"train_loss": -23.838972091674805, "global_step": 216383, "epoch": 2607} {"train_loss": -23.480314254760742, "global_step": 216384, "epoch": 2607} {"train_loss": -24.19435691833496, "global_step": 216385, "epoch": 2607} {"train_loss": -23.640426635742188, "global_step": 216386, "epoch": 2607} {"train_loss": -23.587013244628906, "global_step": 216387, "epoch": 2607} {"train_loss": -24.23971939086914, "global_step": 216388, "epoch": 2607} {"train_loss": -24.615140914916992, "global_step": 216389, "epoch": 2607} {"train_loss": -24.082597732543945, "global_step": 216390, "epoch": 2607} {"train_loss": -24.554122924804688, "global_step": 216391, "epoch": 2607} {"train_loss": -24.366058349609375, "global_step": 216392, "epoch": 2607} {"train_loss": -24.364593505859375, "global_step": 216393, "epoch": 2607} {"train_loss": -24.247140884399414, "global_step": 216394, "epoch": 2607} {"train_loss": -24.20749855041504, "global_step": 216395, "epoch": 2607} {"train_loss": -24.251548767089844, "global_step": 216396, "epoch": 2607} {"train_loss": -24.404743194580078, "global_step": 216397, "epoch": 2607} {"train_loss": -24.188720703125, "global_step": 216398, "epoch": 2607} {"train_loss": -24.452573776245117, "global_step": 216399, "epoch": 2607} {"train_loss": -24.365365982055664, "global_step": 216400, "epoch": 2607} {"train_loss": -24.432554244995117, "global_step": 216401, "epoch": 2607} {"train_loss": -24.240692138671875, "global_step": 216402, "epoch": 2607} {"train_loss": -24.30992317199707, "global_step": 216403, "epoch": 2607} {"train_loss": -24.175161361694336, "global_step": 216404, "epoch": 2607} {"train_loss": -24.429262161254883, "global_step": 216405, "epoch": 2607} {"train_loss": -24.625974655151367, "global_step": 216406, "epoch": 2607} {"train_loss": -24.749460220336914, "global_step": 216407, "epoch": 2607} {"train_loss": -24.38399314880371, "global_step": 216408, "epoch": 2607} {"train_loss": -24.69269371032715, "global_step": 216409, "epoch": 2607} {"train_loss": -24.388362884521484, "global_step": 216410, "epoch": 2607} {"train_loss": -24.707298278808594, "global_step": 216411, "epoch": 2607} {"train_loss": -24.33389663696289, "global_step": 216412, "epoch": 2607} {"train_loss": -24.387126922607422, "global_step": 216413, "epoch": 2607} {"train_loss": -24.694522857666016, "global_step": 216414, "epoch": 2607} {"train_loss": -24.61013412475586, "global_step": 216415, "epoch": 2607} {"train_loss": -24.67523765563965, "global_step": 216416, "epoch": 2607} {"train_loss": -24.5155086517334, "global_step": 216417, "epoch": 2607} {"train_loss": -24.573551177978516, "global_step": 216418, "epoch": 2607} {"train_loss": -24.742361068725586, "global_step": 216419, "epoch": 2607} {"train_loss": -24.38663101196289, "global_step": 216420, "epoch": 2607} {"train_loss": -24.471853256225586, "global_step": 216421, "epoch": 2607} {"train_loss": -24.241840362548828, "global_step": 216422, "epoch": 2607} {"train_loss": -24.947452545166016, "global_step": 216423, "epoch": 2607} {"train_loss": -24.609909057617188, "global_step": 216424, "epoch": 2607} {"train_loss": -24.474271774291992, "global_step": 216425, "epoch": 2607} {"train_loss": -24.24822235107422, "global_step": 216426, "epoch": 2607} {"train_loss": -24.59987449645996, "global_step": 216427, "epoch": 2607} {"train_loss": -24.9797306060791, "global_step": 216428, "epoch": 2607} {"train_loss": -24.65846824645996, "global_step": 216429, "epoch": 2607} {"train_loss": -24.842914581298828, "global_step": 216430, "epoch": 2607} {"train_loss": -24.52498435974121, "global_step": 216431, "epoch": 2607} {"train_loss": -24.42621421813965, "global_step": 216432, "epoch": 2607} {"train_loss": -24.509506225585938, "global_step": 216433, "epoch": 2607} {"train_loss": -24.94940185546875, "global_step": 216434, "epoch": 2607} {"train_loss": -24.64847183227539, "global_step": 216435, "epoch": 2607} {"train_loss": -24.28830337524414, "global_step": 216436, "epoch": 2607} {"train_loss": -24.079133987426758, "global_step": 216437, "epoch": 2607} {"train_loss": -24.724843978881836, "global_step": 216438, "epoch": 2607} {"train_loss": -24.45891761779785, "global_step": 216439, "epoch": 2607} {"train_loss": -24.742158889770508, "global_step": 216440, "epoch": 2607} {"train_loss": -24.41640281677246, "global_step": 216441, "epoch": 2607} {"train_loss": -24.551374435424805, "global_step": 216442, "epoch": 2607} {"train_loss": -24.750268936157227, "global_step": 216443, "epoch": 2607} {"train_loss": -24.81475830078125, "global_step": 216444, "epoch": 2607} {"train_loss": -24.561084747314453, "global_step": 216445, "epoch": 2607} {"train_loss": -24.898365020751953, "global_step": 216446, "epoch": 2607} {"train_loss": -24.913198471069336, "global_step": 216447, "epoch": 2607} {"train_loss": -24.78608512878418, "global_step": 216448, "epoch": 2607} {"train_loss": -24.8100643157959, "global_step": 216449, "epoch": 2607} {"train_loss": -24.598712921142578, "global_step": 216450, "epoch": 2607} {"train_loss": -24.55729103088379, "global_step": 216451, "epoch": 2607} {"train_loss": -24.578710556030273, "global_step": 216452, "epoch": 2607} {"train_loss": -24.816375732421875, "global_step": 216453, "epoch": 2607} {"train_loss": -24.901243209838867, "global_step": 216454, "epoch": 2607} {"train_loss": -24.78377914428711, "global_step": 216455, "epoch": 2607} {"train_loss": -24.697162628173828, "global_step": 216456, "epoch": 2607} {"train_loss": -24.569814682006836, "global_step": 216457, "epoch": 2607} {"train_loss": -24.395212173461914, "global_step": 216458, "epoch": 2607} {"train_loss": -24.78114128112793, "global_step": 216459, "epoch": 2607} {"train_loss": -24.705123901367188, "global_step": 216460, "epoch": 2607} {"train_loss": -24.533315658569336, "global_step": 216461, "epoch": 2607} {"train_loss": -24.33143424987793, "global_step": 216462, "epoch": 2607} {"train_loss": -24.466237286487257, "global_step": 216463, "epoch": 2607, "val_loss": 6603020.0} {"train_loss": -23.839736938476562, "global_step": 216464, "epoch": 2608} {"train_loss": -23.9442081451416, "global_step": 216465, "epoch": 2608} {"train_loss": -24.173368453979492, "global_step": 216466, "epoch": 2608} {"train_loss": -24.087265014648438, "global_step": 216467, "epoch": 2608} {"train_loss": -24.540111541748047, "global_step": 216468, "epoch": 2608} {"train_loss": -23.987342834472656, "global_step": 216469, "epoch": 2608} {"train_loss": -24.433490753173828, "global_step": 216470, "epoch": 2608} {"train_loss": -24.276199340820312, "global_step": 216471, "epoch": 2608} {"train_loss": -24.0494384765625, "global_step": 216472, "epoch": 2608} {"train_loss": -24.20413589477539, "global_step": 216473, "epoch": 2608} {"train_loss": -24.23847770690918, "global_step": 216474, "epoch": 2608} {"train_loss": -24.418298721313477, "global_step": 216475, "epoch": 2608} {"train_loss": -24.33357048034668, "global_step": 216476, "epoch": 2608} {"train_loss": -24.553176879882812, "global_step": 216477, "epoch": 2608} {"train_loss": -24.548389434814453, "global_step": 216478, "epoch": 2608} {"train_loss": -23.920703887939453, "global_step": 216479, "epoch": 2608} {"train_loss": -24.89875602722168, "global_step": 216480, "epoch": 2608} {"train_loss": -24.414560317993164, "global_step": 216481, "epoch": 2608} {"train_loss": -24.580671310424805, "global_step": 216482, "epoch": 2608} {"train_loss": -23.75310516357422, "global_step": 216483, "epoch": 2608} {"train_loss": -24.67509651184082, "global_step": 216484, "epoch": 2608} {"train_loss": -24.5113582611084, "global_step": 216485, "epoch": 2608} {"train_loss": -24.563478469848633, "global_step": 216486, "epoch": 2608} {"train_loss": -24.239843368530273, "global_step": 216487, "epoch": 2608} {"train_loss": -24.57431983947754, "global_step": 216488, "epoch": 2608} {"train_loss": -24.462278366088867, "global_step": 216489, "epoch": 2608} {"train_loss": -24.6833553314209, "global_step": 216490, "epoch": 2608} {"train_loss": -24.450342178344727, "global_step": 216491, "epoch": 2608} {"train_loss": -24.581077575683594, "global_step": 216492, "epoch": 2608} {"train_loss": -24.615325927734375, "global_step": 216493, "epoch": 2608} {"train_loss": -24.626564025878906, "global_step": 216494, "epoch": 2608} {"train_loss": -24.702669143676758, "global_step": 216495, "epoch": 2608} {"train_loss": -24.45292091369629, "global_step": 216496, "epoch": 2608} {"train_loss": -24.55753517150879, "global_step": 216497, "epoch": 2608} {"train_loss": -24.668476104736328, "global_step": 216498, "epoch": 2608} {"train_loss": -24.6364688873291, "global_step": 216499, "epoch": 2608} {"train_loss": -24.7674617767334, "global_step": 216500, "epoch": 2608} {"train_loss": -24.62825584411621, "global_step": 216501, "epoch": 2608} {"train_loss": -24.550004959106445, "global_step": 216502, "epoch": 2608} {"train_loss": -24.916963577270508, "global_step": 216503, "epoch": 2608} {"train_loss": -24.62766456604004, "global_step": 216504, "epoch": 2608} {"train_loss": -24.623008728027344, "global_step": 216505, "epoch": 2608} {"train_loss": -24.864337921142578, "global_step": 216506, "epoch": 2608} {"train_loss": -24.862653732299805, "global_step": 216507, "epoch": 2608} {"train_loss": -24.450544357299805, "global_step": 216508, "epoch": 2608} {"train_loss": -24.303054809570312, "global_step": 216509, "epoch": 2608} {"train_loss": -24.351606369018555, "global_step": 216510, "epoch": 2608} {"train_loss": -24.182565689086914, "global_step": 216511, "epoch": 2608} {"train_loss": -24.58833122253418, "global_step": 216512, "epoch": 2608} {"train_loss": -24.5322208404541, "global_step": 216513, "epoch": 2608} {"train_loss": -24.183706283569336, "global_step": 216514, "epoch": 2608} {"train_loss": -24.6470947265625, "global_step": 216515, "epoch": 2608} {"train_loss": -24.499279022216797, "global_step": 216516, "epoch": 2608} {"train_loss": -24.688949584960938, "global_step": 216517, "epoch": 2608} {"train_loss": -24.32614517211914, "global_step": 216518, "epoch": 2608} {"train_loss": -24.405017852783203, "global_step": 216519, "epoch": 2608} {"train_loss": -24.661054611206055, "global_step": 216520, "epoch": 2608} {"train_loss": -24.551244735717773, "global_step": 216521, "epoch": 2608} {"train_loss": -24.59920310974121, "global_step": 216522, "epoch": 2608} {"train_loss": -24.736276626586914, "global_step": 216523, "epoch": 2608} {"train_loss": -24.28685760498047, "global_step": 216524, "epoch": 2608} {"train_loss": -24.692106246948242, "global_step": 216525, "epoch": 2608} {"train_loss": -24.58992576599121, "global_step": 216526, "epoch": 2608} {"train_loss": -24.913406372070312, "global_step": 216527, "epoch": 2608} {"train_loss": -24.47541618347168, "global_step": 216528, "epoch": 2608} {"train_loss": -24.52777671813965, "global_step": 216529, "epoch": 2608} {"train_loss": -24.52519989013672, "global_step": 216530, "epoch": 2608} {"train_loss": -24.761083602905273, "global_step": 216531, "epoch": 2608} {"train_loss": -24.475378036499023, "global_step": 216532, "epoch": 2608} {"train_loss": -24.81020164489746, "global_step": 216533, "epoch": 2608} {"train_loss": -24.748634338378906, "global_step": 216534, "epoch": 2608} {"train_loss": -24.66020965576172, "global_step": 216535, "epoch": 2608} {"train_loss": -25.031661987304688, "global_step": 216536, "epoch": 2608} {"train_loss": -24.694337844848633, "global_step": 216537, "epoch": 2608} {"train_loss": -24.576128005981445, "global_step": 216538, "epoch": 2608} {"train_loss": -25.068565368652344, "global_step": 216539, "epoch": 2608} {"train_loss": -24.603363037109375, "global_step": 216540, "epoch": 2608} {"train_loss": -24.387985229492188, "global_step": 216541, "epoch": 2608} {"train_loss": -24.774381637573242, "global_step": 216542, "epoch": 2608} {"train_loss": -24.588682174682617, "global_step": 216543, "epoch": 2608} {"train_loss": -24.735767364501953, "global_step": 216544, "epoch": 2608} {"train_loss": -24.72944450378418, "global_step": 216545, "epoch": 2608} {"train_loss": -24.51516319182982, "global_step": 216546, "epoch": 2608, "val_loss": 6692189.0} {"train_loss": -24.059438705444336, "global_step": 216547, "epoch": 2609} {"train_loss": -24.129535675048828, "global_step": 216548, "epoch": 2609} {"train_loss": -23.943628311157227, "global_step": 216549, "epoch": 2609} {"train_loss": -24.029130935668945, "global_step": 216550, "epoch": 2609} {"train_loss": -23.7653865814209, "global_step": 216551, "epoch": 2609} {"train_loss": -24.138376235961914, "global_step": 216552, "epoch": 2609} {"train_loss": -23.602991104125977, "global_step": 216553, "epoch": 2609} {"train_loss": -24.627336502075195, "global_step": 216554, "epoch": 2609} {"train_loss": -24.54697608947754, "global_step": 216555, "epoch": 2609} {"train_loss": -23.784475326538086, "global_step": 216556, "epoch": 2609} {"train_loss": -23.782520294189453, "global_step": 216557, "epoch": 2609} {"train_loss": -24.067514419555664, "global_step": 216558, "epoch": 2609} {"train_loss": -23.849445343017578, "global_step": 216559, "epoch": 2609} {"train_loss": -24.633493423461914, "global_step": 216560, "epoch": 2609} {"train_loss": -24.139326095581055, "global_step": 216561, "epoch": 2609} {"train_loss": -24.10633659362793, "global_step": 216562, "epoch": 2609} {"train_loss": -24.19756507873535, "global_step": 216563, "epoch": 2609} {"train_loss": -24.263166427612305, "global_step": 216564, "epoch": 2609} {"train_loss": -24.363712310791016, "global_step": 216565, "epoch": 2609} {"train_loss": -24.0300350189209, "global_step": 216566, "epoch": 2609} {"train_loss": -24.51344108581543, "global_step": 216567, "epoch": 2609} {"train_loss": -24.82869529724121, "global_step": 216568, "epoch": 2609} {"train_loss": -24.51319694519043, "global_step": 216569, "epoch": 2609} {"train_loss": -24.333219528198242, "global_step": 216570, "epoch": 2609} {"train_loss": -24.540624618530273, "global_step": 216571, "epoch": 2609} {"train_loss": -24.427762985229492, "global_step": 216572, "epoch": 2609} {"train_loss": -23.94301414489746, "global_step": 216573, "epoch": 2609} {"train_loss": -24.246015548706055, "global_step": 216574, "epoch": 2609} {"train_loss": -24.4627742767334, "global_step": 216575, "epoch": 2609} {"train_loss": -24.2236385345459, "global_step": 216576, "epoch": 2609} {"train_loss": -24.400909423828125, "global_step": 216577, "epoch": 2609} {"train_loss": -24.519643783569336, "global_step": 216578, "epoch": 2609} {"train_loss": -24.000661849975586, "global_step": 216579, "epoch": 2609} {"train_loss": -24.485929489135742, "global_step": 216580, "epoch": 2609} {"train_loss": -24.457561492919922, "global_step": 216581, "epoch": 2609} {"train_loss": -24.53230094909668, "global_step": 216582, "epoch": 2609} {"train_loss": -24.76816749572754, "global_step": 216583, "epoch": 2609} {"train_loss": -24.729150772094727, "global_step": 216584, "epoch": 2609} {"train_loss": -24.764646530151367, "global_step": 216585, "epoch": 2609} {"train_loss": -24.520856857299805, "global_step": 216586, "epoch": 2609} {"train_loss": -24.8472900390625, "global_step": 216587, "epoch": 2609} {"train_loss": -24.917173385620117, "global_step": 216588, "epoch": 2609} {"train_loss": -24.497095108032227, "global_step": 216589, "epoch": 2609} {"train_loss": -24.88301658630371, "global_step": 216590, "epoch": 2609} {"train_loss": -25.05600357055664, "global_step": 216591, "epoch": 2609} {"train_loss": -24.643112182617188, "global_step": 216592, "epoch": 2609} {"train_loss": -24.677536010742188, "global_step": 216593, "epoch": 2609} {"train_loss": -24.698156356811523, "global_step": 216594, "epoch": 2609} {"train_loss": -24.33986473083496, "global_step": 216595, "epoch": 2609} {"train_loss": -24.658437728881836, "global_step": 216596, "epoch": 2609} {"train_loss": -24.381053924560547, "global_step": 216597, "epoch": 2609} {"train_loss": -24.35536766052246, "global_step": 216598, "epoch": 2609} {"train_loss": -24.627016067504883, "global_step": 216599, "epoch": 2609} {"train_loss": -24.415193557739258, "global_step": 216600, "epoch": 2609} {"train_loss": -24.548288345336914, "global_step": 216601, "epoch": 2609} {"train_loss": -24.60785675048828, "global_step": 216602, "epoch": 2609} {"train_loss": -24.550168991088867, "global_step": 216603, "epoch": 2609} {"train_loss": -24.527204513549805, "global_step": 216604, "epoch": 2609} {"train_loss": -24.402589797973633, "global_step": 216605, "epoch": 2609} {"train_loss": -24.7579288482666, "global_step": 216606, "epoch": 2609} {"train_loss": -24.59663963317871, "global_step": 216607, "epoch": 2609} {"train_loss": -24.628761291503906, "global_step": 216608, "epoch": 2609} {"train_loss": -24.75847625732422, "global_step": 216609, "epoch": 2609} {"train_loss": -24.448766708374023, "global_step": 216610, "epoch": 2609} {"train_loss": -24.47504997253418, "global_step": 216611, "epoch": 2609} {"train_loss": -24.482290267944336, "global_step": 216612, "epoch": 2609} {"train_loss": -24.45536231994629, "global_step": 216613, "epoch": 2609} {"train_loss": -24.628509521484375, "global_step": 216614, "epoch": 2609} {"train_loss": -24.611177444458008, "global_step": 216615, "epoch": 2609} {"train_loss": -24.480024337768555, "global_step": 216616, "epoch": 2609} {"train_loss": -24.350515365600586, "global_step": 216617, "epoch": 2609} {"train_loss": -24.32143211364746, "global_step": 216618, "epoch": 2609} {"train_loss": -24.50563621520996, "global_step": 216619, "epoch": 2609} {"train_loss": -24.585453033447266, "global_step": 216620, "epoch": 2609} {"train_loss": -24.743268966674805, "global_step": 216621, "epoch": 2609} {"train_loss": -24.58760643005371, "global_step": 216622, "epoch": 2609} {"train_loss": -24.559703826904297, "global_step": 216623, "epoch": 2609} {"train_loss": -24.448062896728516, "global_step": 216624, "epoch": 2609} {"train_loss": -24.595529556274414, "global_step": 216625, "epoch": 2609} {"train_loss": -24.299184799194336, "global_step": 216626, "epoch": 2609} {"train_loss": -24.4730281829834, "global_step": 216627, "epoch": 2609} {"train_loss": -24.4281063079834, "global_step": 216628, "epoch": 2609} {"train_loss": -24.4627674056823, "global_step": 216629, "epoch": 2609, "val_loss": 6629203.0} {"train_loss": -22.784955978393555, "global_step": 216630, "epoch": 2610} {"train_loss": -22.456331253051758, "global_step": 216631, "epoch": 2610} {"train_loss": -22.408605575561523, "global_step": 216632, "epoch": 2610} {"train_loss": -23.07490348815918, "global_step": 216633, "epoch": 2610} {"train_loss": -23.096792221069336, "global_step": 216634, "epoch": 2610} {"train_loss": -23.205244064331055, "global_step": 216635, "epoch": 2610} {"train_loss": -23.963397979736328, "global_step": 216636, "epoch": 2610} {"train_loss": -23.83486557006836, "global_step": 216637, "epoch": 2610} {"train_loss": -23.908361434936523, "global_step": 216638, "epoch": 2610} {"train_loss": -24.170515060424805, "global_step": 216639, "epoch": 2610} {"train_loss": -23.59705352783203, "global_step": 216640, "epoch": 2610} {"train_loss": -24.001155853271484, "global_step": 216641, "epoch": 2610} {"train_loss": -24.14752769470215, "global_step": 216642, "epoch": 2610} {"train_loss": -23.96503257751465, "global_step": 216643, "epoch": 2610} {"train_loss": -23.906278610229492, "global_step": 216644, "epoch": 2610} {"train_loss": -24.476486206054688, "global_step": 216645, "epoch": 2610} {"train_loss": -24.33161735534668, "global_step": 216646, "epoch": 2610} {"train_loss": -23.979331970214844, "global_step": 216647, "epoch": 2610} {"train_loss": -23.69512939453125, "global_step": 216648, "epoch": 2610} {"train_loss": -23.844614028930664, "global_step": 216649, "epoch": 2610} {"train_loss": -24.38942527770996, "global_step": 216650, "epoch": 2610} {"train_loss": -24.177701950073242, "global_step": 216651, "epoch": 2610} {"train_loss": -23.788143157958984, "global_step": 216652, "epoch": 2610} {"train_loss": -24.39520835876465, "global_step": 216653, "epoch": 2610} {"train_loss": -24.140790939331055, "global_step": 216654, "epoch": 2610} {"train_loss": -24.074033737182617, "global_step": 216655, "epoch": 2610} {"train_loss": -24.067434310913086, "global_step": 216656, "epoch": 2610} {"train_loss": -24.552663803100586, "global_step": 216657, "epoch": 2610} {"train_loss": -24.559127807617188, "global_step": 216658, "epoch": 2610} {"train_loss": -24.295291900634766, "global_step": 216659, "epoch": 2610} {"train_loss": -24.439992904663086, "global_step": 216660, "epoch": 2610} {"train_loss": -24.272645950317383, "global_step": 216661, "epoch": 2610} {"train_loss": -24.4544620513916, "global_step": 216662, "epoch": 2610} {"train_loss": -24.213560104370117, "global_step": 216663, "epoch": 2610} {"train_loss": -24.36138153076172, "global_step": 216664, "epoch": 2610} {"train_loss": -24.8070068359375, "global_step": 216665, "epoch": 2610} {"train_loss": -24.571636199951172, "global_step": 216666, "epoch": 2610} {"train_loss": -24.40443992614746, "global_step": 216667, "epoch": 2610} {"train_loss": -24.30842399597168, "global_step": 216668, "epoch": 2610} {"train_loss": -24.584569931030273, "global_step": 216669, "epoch": 2610} {"train_loss": -24.681964874267578, "global_step": 216670, "epoch": 2610} {"train_loss": -24.684711456298828, "global_step": 216671, "epoch": 2610} {"train_loss": -24.758241653442383, "global_step": 216672, "epoch": 2610} {"train_loss": -24.11612892150879, "global_step": 216673, "epoch": 2610} {"train_loss": -24.856178283691406, "global_step": 216674, "epoch": 2610} {"train_loss": -24.814905166625977, "global_step": 216675, "epoch": 2610} {"train_loss": -24.019855499267578, "global_step": 216676, "epoch": 2610} {"train_loss": -24.498991012573242, "global_step": 216677, "epoch": 2610} {"train_loss": -24.488950729370117, "global_step": 216678, "epoch": 2610} {"train_loss": -24.53497886657715, "global_step": 216679, "epoch": 2610} {"train_loss": -24.61590576171875, "global_step": 216680, "epoch": 2610} {"train_loss": -24.372514724731445, "global_step": 216681, "epoch": 2610} {"train_loss": -24.322484970092773, "global_step": 216682, "epoch": 2610} {"train_loss": -24.786542892456055, "global_step": 216683, "epoch": 2610} {"train_loss": -24.627716064453125, "global_step": 216684, "epoch": 2610} {"train_loss": -24.65338134765625, "global_step": 216685, "epoch": 2610} {"train_loss": -24.545856475830078, "global_step": 216686, "epoch": 2610} {"train_loss": -24.420597076416016, "global_step": 216687, "epoch": 2610} {"train_loss": -24.357208251953125, "global_step": 216688, "epoch": 2610} {"train_loss": -23.86454200744629, "global_step": 216689, "epoch": 2610} {"train_loss": -24.105764389038086, "global_step": 216690, "epoch": 2610} {"train_loss": -24.726613998413086, "global_step": 216691, "epoch": 2610} {"train_loss": -24.452930450439453, "global_step": 216692, "epoch": 2610} {"train_loss": -24.25347137451172, "global_step": 216693, "epoch": 2610} {"train_loss": -24.303247451782227, "global_step": 216694, "epoch": 2610} {"train_loss": -24.447336196899414, "global_step": 216695, "epoch": 2610} {"train_loss": -24.42996597290039, "global_step": 216696, "epoch": 2610} {"train_loss": -24.38107681274414, "global_step": 216697, "epoch": 2610} {"train_loss": -24.37930679321289, "global_step": 216698, "epoch": 2610} {"train_loss": -24.64204978942871, "global_step": 216699, "epoch": 2610} {"train_loss": -24.227985382080078, "global_step": 216700, "epoch": 2610} {"train_loss": -24.530466079711914, "global_step": 216701, "epoch": 2610} {"train_loss": -24.375473022460938, "global_step": 216702, "epoch": 2610} {"train_loss": -24.29694938659668, "global_step": 216703, "epoch": 2610} {"train_loss": -24.884647369384766, "global_step": 216704, "epoch": 2610} {"train_loss": -24.273962020874023, "global_step": 216705, "epoch": 2610} {"train_loss": -24.265085220336914, "global_step": 216706, "epoch": 2610} {"train_loss": -24.43320655822754, "global_step": 216707, "epoch": 2610} {"train_loss": -24.639986038208008, "global_step": 216708, "epoch": 2610} {"train_loss": -24.562963485717773, "global_step": 216709, "epoch": 2610} {"train_loss": -24.77066993713379, "global_step": 216710, "epoch": 2610} {"train_loss": -24.470720291137695, "global_step": 216711, "epoch": 2610} {"train_loss": -24.244231051709278, "global_step": 216712, "epoch": 2610, "val_loss": 6630660.0} {"train_loss": -24.605514526367188, "global_step": 216713, "epoch": 2611} {"train_loss": -24.51373291015625, "global_step": 216714, "epoch": 2611} {"train_loss": -24.673978805541992, "global_step": 216715, "epoch": 2611} {"train_loss": -24.24024772644043, "global_step": 216716, "epoch": 2611} {"train_loss": -24.149280548095703, "global_step": 216717, "epoch": 2611} {"train_loss": -24.286640167236328, "global_step": 216718, "epoch": 2611} {"train_loss": -24.276594161987305, "global_step": 216719, "epoch": 2611} {"train_loss": -24.155874252319336, "global_step": 216720, "epoch": 2611} {"train_loss": -24.54615592956543, "global_step": 216721, "epoch": 2611} {"train_loss": -24.64551544189453, "global_step": 216722, "epoch": 2611} {"train_loss": -24.60630226135254, "global_step": 216723, "epoch": 2611} {"train_loss": -24.28891372680664, "global_step": 216724, "epoch": 2611} {"train_loss": -24.506996154785156, "global_step": 216725, "epoch": 2611} {"train_loss": -24.582223892211914, "global_step": 216726, "epoch": 2611} {"train_loss": -24.795948028564453, "global_step": 216727, "epoch": 2611} {"train_loss": -24.46492576599121, "global_step": 216728, "epoch": 2611} {"train_loss": -24.301387786865234, "global_step": 216729, "epoch": 2611} {"train_loss": -24.46601676940918, "global_step": 216730, "epoch": 2611} {"train_loss": -24.74094581604004, "global_step": 216731, "epoch": 2611} {"train_loss": -24.411678314208984, "global_step": 216732, "epoch": 2611} {"train_loss": -24.67238426208496, "global_step": 216733, "epoch": 2611} {"train_loss": -25.056854248046875, "global_step": 216734, "epoch": 2611} {"train_loss": -24.582273483276367, "global_step": 216735, "epoch": 2611} {"train_loss": -24.316438674926758, "global_step": 216736, "epoch": 2611} {"train_loss": -24.692991256713867, "global_step": 216737, "epoch": 2611} {"train_loss": -24.558237075805664, "global_step": 216738, "epoch": 2611} {"train_loss": -24.30337142944336, "global_step": 216739, "epoch": 2611} {"train_loss": -24.271732330322266, "global_step": 216740, "epoch": 2611} {"train_loss": -24.53255271911621, "global_step": 216741, "epoch": 2611} {"train_loss": -24.603378295898438, "global_step": 216742, "epoch": 2611} {"train_loss": -24.563188552856445, "global_step": 216743, "epoch": 2611} {"train_loss": -24.469017028808594, "global_step": 216744, "epoch": 2611} {"train_loss": -24.570072174072266, "global_step": 216745, "epoch": 2611} {"train_loss": -24.6181583404541, "global_step": 216746, "epoch": 2611} {"train_loss": -24.46249008178711, "global_step": 216747, "epoch": 2611} {"train_loss": -24.566898345947266, "global_step": 216748, "epoch": 2611} {"train_loss": -24.45304298400879, "global_step": 216749, "epoch": 2611} {"train_loss": -24.675411224365234, "global_step": 216750, "epoch": 2611} {"train_loss": -24.383464813232422, "global_step": 216751, "epoch": 2611} {"train_loss": -24.861845016479492, "global_step": 216752, "epoch": 2611} {"train_loss": -24.503662109375, "global_step": 216753, "epoch": 2611} {"train_loss": -25.00079345703125, "global_step": 216754, "epoch": 2611} {"train_loss": -24.75322914123535, "global_step": 216755, "epoch": 2611} {"train_loss": -24.808908462524414, "global_step": 216756, "epoch": 2611} {"train_loss": -24.717456817626953, "global_step": 216757, "epoch": 2611} {"train_loss": -24.907604217529297, "global_step": 216758, "epoch": 2611} {"train_loss": -24.81988525390625, "global_step": 216759, "epoch": 2611} {"train_loss": -24.36053466796875, "global_step": 216760, "epoch": 2611} {"train_loss": -24.697221755981445, "global_step": 216761, "epoch": 2611} {"train_loss": -24.235883712768555, "global_step": 216762, "epoch": 2611} {"train_loss": -24.686073303222656, "global_step": 216763, "epoch": 2611} {"train_loss": -24.35910987854004, "global_step": 216764, "epoch": 2611} {"train_loss": -24.284915924072266, "global_step": 216765, "epoch": 2611} {"train_loss": -24.266836166381836, "global_step": 216766, "epoch": 2611} {"train_loss": -24.43427848815918, "global_step": 216767, "epoch": 2611} {"train_loss": -24.393203735351562, "global_step": 216768, "epoch": 2611} {"train_loss": -24.411163330078125, "global_step": 216769, "epoch": 2611} {"train_loss": -24.439783096313477, "global_step": 216770, "epoch": 2611} {"train_loss": -24.712522506713867, "global_step": 216771, "epoch": 2611} {"train_loss": -24.739240646362305, "global_step": 216772, "epoch": 2611} {"train_loss": -24.704771041870117, "global_step": 216773, "epoch": 2611} {"train_loss": -24.722448348999023, "global_step": 216774, "epoch": 2611} {"train_loss": -24.897024154663086, "global_step": 216775, "epoch": 2611} {"train_loss": -24.402999877929688, "global_step": 216776, "epoch": 2611} {"train_loss": -24.75647735595703, "global_step": 216777, "epoch": 2611} {"train_loss": -24.521574020385742, "global_step": 216778, "epoch": 2611} {"train_loss": -24.448240280151367, "global_step": 216779, "epoch": 2611} {"train_loss": -24.555015563964844, "global_step": 216780, "epoch": 2611} {"train_loss": -25.081274032592773, "global_step": 216781, "epoch": 2611} {"train_loss": -24.42348289489746, "global_step": 216782, "epoch": 2611} {"train_loss": -24.644784927368164, "global_step": 216783, "epoch": 2611} {"train_loss": -24.549646377563477, "global_step": 216784, "epoch": 2611} {"train_loss": -24.773672103881836, "global_step": 216785, "epoch": 2611} {"train_loss": -24.20411491394043, "global_step": 216786, "epoch": 2611} {"train_loss": -24.410293579101562, "global_step": 216787, "epoch": 2611} {"train_loss": -24.565467834472656, "global_step": 216788, "epoch": 2611} {"train_loss": -24.3900203704834, "global_step": 216789, "epoch": 2611} {"train_loss": -25.034101486206055, "global_step": 216790, "epoch": 2611} {"train_loss": -24.208906173706055, "global_step": 216791, "epoch": 2611} {"train_loss": -24.67325782775879, "global_step": 216792, "epoch": 2611} {"train_loss": -24.755170822143555, "global_step": 216793, "epoch": 2611} {"train_loss": -24.78440284729004, "global_step": 216794, "epoch": 2611} {"train_loss": -24.55538850807282, "global_step": 216795, "epoch": 2611, "val_loss": 6641755.0} {"train_loss": -24.267169952392578, "global_step": 216796, "epoch": 2612} {"train_loss": -23.68406105041504, "global_step": 216797, "epoch": 2612} {"train_loss": -23.55716896057129, "global_step": 216798, "epoch": 2612} {"train_loss": -23.873779296875, "global_step": 216799, "epoch": 2612} {"train_loss": -23.501331329345703, "global_step": 216800, "epoch": 2612} {"train_loss": -23.371511459350586, "global_step": 216801, "epoch": 2612} {"train_loss": -24.264463424682617, "global_step": 216802, "epoch": 2612} {"train_loss": -23.492542266845703, "global_step": 216803, "epoch": 2612} {"train_loss": -24.124725341796875, "global_step": 216804, "epoch": 2612} {"train_loss": -23.72287940979004, "global_step": 216805, "epoch": 2612} {"train_loss": -24.32189178466797, "global_step": 216806, "epoch": 2612} {"train_loss": -24.23798179626465, "global_step": 216807, "epoch": 2612} {"train_loss": -24.395767211914062, "global_step": 216808, "epoch": 2612} {"train_loss": -24.445280075073242, "global_step": 216809, "epoch": 2612} {"train_loss": -23.915407180786133, "global_step": 216810, "epoch": 2612} {"train_loss": -24.231542587280273, "global_step": 216811, "epoch": 2612} {"train_loss": -24.378305435180664, "global_step": 216812, "epoch": 2612} {"train_loss": -24.394804000854492, "global_step": 216813, "epoch": 2612} {"train_loss": -24.159622192382812, "global_step": 216814, "epoch": 2612} {"train_loss": -24.4658203125, "global_step": 216815, "epoch": 2612} {"train_loss": -24.608200073242188, "global_step": 216816, "epoch": 2612} {"train_loss": -24.365528106689453, "global_step": 216817, "epoch": 2612} {"train_loss": -24.1087646484375, "global_step": 216818, "epoch": 2612} {"train_loss": -24.104455947875977, "global_step": 216819, "epoch": 2612} {"train_loss": -24.17582130432129, "global_step": 216820, "epoch": 2612} {"train_loss": -24.31812858581543, "global_step": 216821, "epoch": 2612} {"train_loss": -24.993215560913086, "global_step": 216822, "epoch": 2612} {"train_loss": -24.539194107055664, "global_step": 216823, "epoch": 2612} {"train_loss": -24.733060836791992, "global_step": 216824, "epoch": 2612} {"train_loss": -24.475330352783203, "global_step": 216825, "epoch": 2612} {"train_loss": -24.501148223876953, "global_step": 216826, "epoch": 2612} {"train_loss": -24.36575698852539, "global_step": 216827, "epoch": 2612} {"train_loss": -24.772655487060547, "global_step": 216828, "epoch": 2612} {"train_loss": -24.48759651184082, "global_step": 216829, "epoch": 2612} {"train_loss": -24.588077545166016, "global_step": 216830, "epoch": 2612} {"train_loss": -24.721012115478516, "global_step": 216831, "epoch": 2612} {"train_loss": -24.773046493530273, "global_step": 216832, "epoch": 2612} {"train_loss": -24.73506736755371, "global_step": 216833, "epoch": 2612} {"train_loss": -24.61773109436035, "global_step": 216834, "epoch": 2612} {"train_loss": -24.67559242248535, "global_step": 216835, "epoch": 2612} {"train_loss": -24.826644897460938, "global_step": 216836, "epoch": 2612} {"train_loss": -24.571796417236328, "global_step": 216837, "epoch": 2612} {"train_loss": -24.64937400817871, "global_step": 216838, "epoch": 2612} {"train_loss": -24.5140438079834, "global_step": 216839, "epoch": 2612} {"train_loss": -24.921438217163086, "global_step": 216840, "epoch": 2612} {"train_loss": -24.634265899658203, "global_step": 216841, "epoch": 2612} {"train_loss": -24.91177749633789, "global_step": 216842, "epoch": 2612} {"train_loss": -24.672006607055664, "global_step": 216843, "epoch": 2612} {"train_loss": -24.423429489135742, "global_step": 216844, "epoch": 2612} {"train_loss": -24.114500045776367, "global_step": 216845, "epoch": 2612} {"train_loss": -24.03066062927246, "global_step": 216846, "epoch": 2612} {"train_loss": -24.570709228515625, "global_step": 216847, "epoch": 2612} {"train_loss": -24.611408233642578, "global_step": 216848, "epoch": 2612} {"train_loss": -24.456140518188477, "global_step": 216849, "epoch": 2612} {"train_loss": -24.91659927368164, "global_step": 216850, "epoch": 2612} {"train_loss": -24.598526000976562, "global_step": 216851, "epoch": 2612} {"train_loss": -24.232669830322266, "global_step": 216852, "epoch": 2612} {"train_loss": -24.67493438720703, "global_step": 216853, "epoch": 2612} {"train_loss": -24.624601364135742, "global_step": 216854, "epoch": 2612} {"train_loss": -24.741281509399414, "global_step": 216855, "epoch": 2612} {"train_loss": -24.264921188354492, "global_step": 216856, "epoch": 2612} {"train_loss": -24.493045806884766, "global_step": 216857, "epoch": 2612} {"train_loss": -24.516393661499023, "global_step": 216858, "epoch": 2612} {"train_loss": -24.541446685791016, "global_step": 216859, "epoch": 2612} {"train_loss": -24.546628952026367, "global_step": 216860, "epoch": 2612} {"train_loss": -24.492355346679688, "global_step": 216861, "epoch": 2612} {"train_loss": -24.68963623046875, "global_step": 216862, "epoch": 2612} {"train_loss": -24.515348434448242, "global_step": 216863, "epoch": 2612} {"train_loss": -24.34107780456543, "global_step": 216864, "epoch": 2612} {"train_loss": -24.39854621887207, "global_step": 216865, "epoch": 2612} {"train_loss": -24.518404006958008, "global_step": 216866, "epoch": 2612} {"train_loss": -24.7552490234375, "global_step": 216867, "epoch": 2612} {"train_loss": -24.596830368041992, "global_step": 216868, "epoch": 2612} {"train_loss": -24.534626007080078, "global_step": 216869, "epoch": 2612} {"train_loss": -24.49142837524414, "global_step": 216870, "epoch": 2612} {"train_loss": -24.420833587646484, "global_step": 216871, "epoch": 2612} {"train_loss": -24.422534942626953, "global_step": 216872, "epoch": 2612} {"train_loss": -24.716493606567383, "global_step": 216873, "epoch": 2612} {"train_loss": -24.35392189025879, "global_step": 216874, "epoch": 2612} {"train_loss": -23.908554077148438, "global_step": 216875, "epoch": 2612} {"train_loss": -24.70496940612793, "global_step": 216876, "epoch": 2612} {"train_loss": -24.42910385131836, "global_step": 216877, "epoch": 2612} {"train_loss": -24.414761187082313, "global_step": 216878, "epoch": 2612, "val_loss": 6642569.0} {"train_loss": -23.483932495117188, "global_step": 216879, "epoch": 2613} {"train_loss": -24.51605796813965, "global_step": 216880, "epoch": 2613} {"train_loss": -23.99965476989746, "global_step": 216881, "epoch": 2613} {"train_loss": -24.663251876831055, "global_step": 216882, "epoch": 2613} {"train_loss": -23.837491989135742, "global_step": 216883, "epoch": 2613} {"train_loss": -24.114904403686523, "global_step": 216884, "epoch": 2613} {"train_loss": -24.24369239807129, "global_step": 216885, "epoch": 2613} {"train_loss": -24.737140655517578, "global_step": 216886, "epoch": 2613} {"train_loss": -24.72528076171875, "global_step": 216887, "epoch": 2613} {"train_loss": -24.47907829284668, "global_step": 216888, "epoch": 2613} {"train_loss": -24.486270904541016, "global_step": 216889, "epoch": 2613} {"train_loss": -24.27076530456543, "global_step": 216890, "epoch": 2613} {"train_loss": -24.71710777282715, "global_step": 216891, "epoch": 2613} {"train_loss": -24.488828659057617, "global_step": 216892, "epoch": 2613} {"train_loss": -24.414175033569336, "global_step": 216893, "epoch": 2613} {"train_loss": -24.570600509643555, "global_step": 216894, "epoch": 2613} {"train_loss": -24.249242782592773, "global_step": 216895, "epoch": 2613} {"train_loss": -24.44045066833496, "global_step": 216896, "epoch": 2613} {"train_loss": -24.62630844116211, "global_step": 216897, "epoch": 2613} {"train_loss": -24.22127342224121, "global_step": 216898, "epoch": 2613} {"train_loss": -24.46670913696289, "global_step": 216899, "epoch": 2613} {"train_loss": -24.644195556640625, "global_step": 216900, "epoch": 2613} {"train_loss": -24.623971939086914, "global_step": 216901, "epoch": 2613} {"train_loss": -24.715665817260742, "global_step": 216902, "epoch": 2613} {"train_loss": -24.514440536499023, "global_step": 216903, "epoch": 2613} {"train_loss": -24.352649688720703, "global_step": 216904, "epoch": 2613} {"train_loss": -24.637277603149414, "global_step": 216905, "epoch": 2613} {"train_loss": -24.711057662963867, "global_step": 216906, "epoch": 2613} {"train_loss": -24.418642044067383, "global_step": 216907, "epoch": 2613} {"train_loss": -24.697885513305664, "global_step": 216908, "epoch": 2613} {"train_loss": -24.3443546295166, "global_step": 216909, "epoch": 2613} {"train_loss": -24.66774559020996, "global_step": 216910, "epoch": 2613} {"train_loss": -24.536563873291016, "global_step": 216911, "epoch": 2613} {"train_loss": -24.418607711791992, "global_step": 216912, "epoch": 2613} {"train_loss": -24.619094848632812, "global_step": 216913, "epoch": 2613} {"train_loss": -24.69820213317871, "global_step": 216914, "epoch": 2613} {"train_loss": -24.51387596130371, "global_step": 216915, "epoch": 2613} {"train_loss": -24.4660587310791, "global_step": 216916, "epoch": 2613} {"train_loss": -24.361923217773438, "global_step": 216917, "epoch": 2613} {"train_loss": -24.344179153442383, "global_step": 216918, "epoch": 2613} {"train_loss": -24.730960845947266, "global_step": 216919, "epoch": 2613} {"train_loss": -24.548437118530273, "global_step": 216920, "epoch": 2613} {"train_loss": -24.747150421142578, "global_step": 216921, "epoch": 2613} {"train_loss": -24.865436553955078, "global_step": 216922, "epoch": 2613} {"train_loss": -24.679445266723633, "global_step": 216923, "epoch": 2613} {"train_loss": -23.927043914794922, "global_step": 216924, "epoch": 2613} {"train_loss": -24.777204513549805, "global_step": 216925, "epoch": 2613} {"train_loss": -24.4039249420166, "global_step": 216926, "epoch": 2613} {"train_loss": -24.626373291015625, "global_step": 216927, "epoch": 2613} {"train_loss": -24.71339225769043, "global_step": 216928, "epoch": 2613} {"train_loss": -24.418128967285156, "global_step": 216929, "epoch": 2613} {"train_loss": -24.639829635620117, "global_step": 216930, "epoch": 2613} {"train_loss": -24.861282348632812, "global_step": 216931, "epoch": 2613} {"train_loss": -24.517526626586914, "global_step": 216932, "epoch": 2613} {"train_loss": -24.759565353393555, "global_step": 216933, "epoch": 2613} {"train_loss": -24.24782371520996, "global_step": 216934, "epoch": 2613} {"train_loss": -24.521032333374023, "global_step": 216935, "epoch": 2613} {"train_loss": -24.797245025634766, "global_step": 216936, "epoch": 2613} {"train_loss": -24.756641387939453, "global_step": 216937, "epoch": 2613} {"train_loss": -24.72562599182129, "global_step": 216938, "epoch": 2613} {"train_loss": -24.475433349609375, "global_step": 216939, "epoch": 2613} {"train_loss": -24.21898651123047, "global_step": 216940, "epoch": 2613} {"train_loss": -24.421493530273438, "global_step": 216941, "epoch": 2613} {"train_loss": -24.239242553710938, "global_step": 216942, "epoch": 2613} {"train_loss": -24.43777847290039, "global_step": 216943, "epoch": 2613} {"train_loss": -24.214279174804688, "global_step": 216944, "epoch": 2613} {"train_loss": -24.532468795776367, "global_step": 216945, "epoch": 2613} {"train_loss": -24.56533432006836, "global_step": 216946, "epoch": 2613} {"train_loss": -24.515945434570312, "global_step": 216947, "epoch": 2613} {"train_loss": -24.56183433532715, "global_step": 216948, "epoch": 2613} {"train_loss": -24.739492416381836, "global_step": 216949, "epoch": 2613} {"train_loss": -24.43979835510254, "global_step": 216950, "epoch": 2613} {"train_loss": -24.653249740600586, "global_step": 216951, "epoch": 2613} {"train_loss": -24.88472557067871, "global_step": 216952, "epoch": 2613} {"train_loss": -24.741445541381836, "global_step": 216953, "epoch": 2613} {"train_loss": -24.317649841308594, "global_step": 216954, "epoch": 2613} {"train_loss": -24.597482681274414, "global_step": 216955, "epoch": 2613} {"train_loss": -24.63924217224121, "global_step": 216956, "epoch": 2613} {"train_loss": -24.81807518005371, "global_step": 216957, "epoch": 2613} {"train_loss": -24.402311325073242, "global_step": 216958, "epoch": 2613} {"train_loss": -24.7774715423584, "global_step": 216959, "epoch": 2613} {"train_loss": -24.77235984802246, "global_step": 216960, "epoch": 2613} {"train_loss": -24.515919053410908, "global_step": 216961, "epoch": 2613, "val_loss": 6624914.0} {"train_loss": -23.97809410095215, "global_step": 216962, "epoch": 2614} {"train_loss": -24.20570945739746, "global_step": 216963, "epoch": 2614} {"train_loss": -23.834306716918945, "global_step": 216964, "epoch": 2614} {"train_loss": -23.04386329650879, "global_step": 216965, "epoch": 2614} {"train_loss": -23.49418830871582, "global_step": 216966, "epoch": 2614} {"train_loss": -24.436941146850586, "global_step": 216967, "epoch": 2614} {"train_loss": -24.219091415405273, "global_step": 216968, "epoch": 2614} {"train_loss": -23.54439353942871, "global_step": 216969, "epoch": 2614} {"train_loss": -23.943668365478516, "global_step": 216970, "epoch": 2614} {"train_loss": -24.249052047729492, "global_step": 216971, "epoch": 2614} {"train_loss": -24.298540115356445, "global_step": 216972, "epoch": 2614} {"train_loss": -23.885984420776367, "global_step": 216973, "epoch": 2614} {"train_loss": -24.109699249267578, "global_step": 216974, "epoch": 2614} {"train_loss": -24.392196655273438, "global_step": 216975, "epoch": 2614} {"train_loss": -24.001142501831055, "global_step": 216976, "epoch": 2614} {"train_loss": -24.027612686157227, "global_step": 216977, "epoch": 2614} {"train_loss": -24.057964324951172, "global_step": 216978, "epoch": 2614} {"train_loss": -24.063894271850586, "global_step": 216979, "epoch": 2614} {"train_loss": -24.45587730407715, "global_step": 216980, "epoch": 2614} {"train_loss": -24.39039421081543, "global_step": 216981, "epoch": 2614} {"train_loss": -24.25875473022461, "global_step": 216982, "epoch": 2614} {"train_loss": -24.313716888427734, "global_step": 216983, "epoch": 2614} {"train_loss": -24.390539169311523, "global_step": 216984, "epoch": 2614} {"train_loss": -24.155513763427734, "global_step": 216985, "epoch": 2614} {"train_loss": -24.50082778930664, "global_step": 216986, "epoch": 2614} {"train_loss": -24.445690155029297, "global_step": 216987, "epoch": 2614} {"train_loss": -24.300827026367188, "global_step": 216988, "epoch": 2614} {"train_loss": -24.74144172668457, "global_step": 216989, "epoch": 2614} {"train_loss": -24.108592987060547, "global_step": 216990, "epoch": 2614} {"train_loss": -24.407772064208984, "global_step": 216991, "epoch": 2614} {"train_loss": -24.63019371032715, "global_step": 216992, "epoch": 2614} {"train_loss": -24.487960815429688, "global_step": 216993, "epoch": 2614} {"train_loss": -24.42734718322754, "global_step": 216994, "epoch": 2614} {"train_loss": -24.66998863220215, "global_step": 216995, "epoch": 2614} {"train_loss": -24.695016860961914, "global_step": 216996, "epoch": 2614} {"train_loss": -24.633731842041016, "global_step": 216997, "epoch": 2614} {"train_loss": -24.39522933959961, "global_step": 216998, "epoch": 2614} {"train_loss": -24.853628158569336, "global_step": 216999, "epoch": 2614} {"train_loss": -24.717153549194336, "global_step": 217000, "epoch": 2614} {"train_loss": -24.7104434967041, "global_step": 217001, "epoch": 2614} {"train_loss": -24.689075469970703, "global_step": 217002, "epoch": 2614} {"train_loss": -24.260656356811523, "global_step": 217003, "epoch": 2614} {"train_loss": -24.663227081298828, "global_step": 217004, "epoch": 2614} {"train_loss": -24.70697593688965, "global_step": 217005, "epoch": 2614} {"train_loss": -24.8625545501709, "global_step": 217006, "epoch": 2614} {"train_loss": -24.30853843688965, "global_step": 217007, "epoch": 2614} {"train_loss": -24.40926170349121, "global_step": 217008, "epoch": 2614} {"train_loss": -24.56148910522461, "global_step": 217009, "epoch": 2614} {"train_loss": -24.585474014282227, "global_step": 217010, "epoch": 2614} {"train_loss": -24.63715362548828, "global_step": 217011, "epoch": 2614} {"train_loss": -24.71091079711914, "global_step": 217012, "epoch": 2614} {"train_loss": -23.838441848754883, "global_step": 217013, "epoch": 2614} {"train_loss": -24.565298080444336, "global_step": 217014, "epoch": 2614} {"train_loss": -24.670978546142578, "global_step": 217015, "epoch": 2614} {"train_loss": -24.470699310302734, "global_step": 217016, "epoch": 2614} {"train_loss": -24.225086212158203, "global_step": 217017, "epoch": 2614} {"train_loss": -24.674142837524414, "global_step": 217018, "epoch": 2614} {"train_loss": -24.20895767211914, "global_step": 217019, "epoch": 2614} {"train_loss": -24.346839904785156, "global_step": 217020, "epoch": 2614} {"train_loss": -24.548757553100586, "global_step": 217021, "epoch": 2614} {"train_loss": -24.411169052124023, "global_step": 217022, "epoch": 2614} {"train_loss": -24.27669334411621, "global_step": 217023, "epoch": 2614} {"train_loss": -24.34910011291504, "global_step": 217024, "epoch": 2614} {"train_loss": -24.0446834564209, "global_step": 217025, "epoch": 2614} {"train_loss": -24.926082611083984, "global_step": 217026, "epoch": 2614} {"train_loss": -23.730499267578125, "global_step": 217027, "epoch": 2614} {"train_loss": -24.54446792602539, "global_step": 217028, "epoch": 2614} {"train_loss": -24.231460571289062, "global_step": 217029, "epoch": 2614} {"train_loss": -24.487363815307617, "global_step": 217030, "epoch": 2614} {"train_loss": -24.2710018157959, "global_step": 217031, "epoch": 2614} {"train_loss": -24.288877487182617, "global_step": 217032, "epoch": 2614} {"train_loss": -24.394132614135742, "global_step": 217033, "epoch": 2614} {"train_loss": -24.699811935424805, "global_step": 217034, "epoch": 2614} {"train_loss": -24.574094772338867, "global_step": 217035, "epoch": 2614} {"train_loss": -24.9046688079834, "global_step": 217036, "epoch": 2614} {"train_loss": -24.599027633666992, "global_step": 217037, "epoch": 2614} {"train_loss": -24.55503273010254, "global_step": 217038, "epoch": 2614} {"train_loss": -24.594579696655273, "global_step": 217039, "epoch": 2614} {"train_loss": -24.84918785095215, "global_step": 217040, "epoch": 2614} {"train_loss": -24.528091430664062, "global_step": 217041, "epoch": 2614} {"train_loss": -24.527456283569336, "global_step": 217042, "epoch": 2614} {"train_loss": -24.56308937072754, "global_step": 217043, "epoch": 2614} {"train_loss": -24.378854981387953, "global_step": 217044, "epoch": 2614, "val_loss": 6509316.0} {"train_loss": -23.9666805267334, "global_step": 217045, "epoch": 2615} {"train_loss": -24.042434692382812, "global_step": 217046, "epoch": 2615} {"train_loss": -23.69793128967285, "global_step": 217047, "epoch": 2615} {"train_loss": -23.90946388244629, "global_step": 217048, "epoch": 2615} {"train_loss": -24.1464786529541, "global_step": 217049, "epoch": 2615} {"train_loss": -24.022552490234375, "global_step": 217050, "epoch": 2615} {"train_loss": -24.28632926940918, "global_step": 217051, "epoch": 2615} {"train_loss": -24.495939254760742, "global_step": 217052, "epoch": 2615} {"train_loss": -24.221271514892578, "global_step": 217053, "epoch": 2615} {"train_loss": -24.324913024902344, "global_step": 217054, "epoch": 2615} {"train_loss": -24.197500228881836, "global_step": 217055, "epoch": 2615} {"train_loss": -24.306625366210938, "global_step": 217056, "epoch": 2615} {"train_loss": -24.309417724609375, "global_step": 217057, "epoch": 2615} {"train_loss": -24.562219619750977, "global_step": 217058, "epoch": 2615} {"train_loss": -24.415653228759766, "global_step": 217059, "epoch": 2615} {"train_loss": -23.97205924987793, "global_step": 217060, "epoch": 2615} {"train_loss": -24.577550888061523, "global_step": 217061, "epoch": 2615} {"train_loss": -24.450109481811523, "global_step": 217062, "epoch": 2615} {"train_loss": -24.586708068847656, "global_step": 217063, "epoch": 2615} {"train_loss": -24.227981567382812, "global_step": 217064, "epoch": 2615} {"train_loss": -24.42487907409668, "global_step": 217065, "epoch": 2615} {"train_loss": -24.407976150512695, "global_step": 217066, "epoch": 2615} {"train_loss": -24.212568283081055, "global_step": 217067, "epoch": 2615} {"train_loss": -24.213895797729492, "global_step": 217068, "epoch": 2615} {"train_loss": -24.7745418548584, "global_step": 217069, "epoch": 2615} {"train_loss": -24.457517623901367, "global_step": 217070, "epoch": 2615} {"train_loss": -24.79861831665039, "global_step": 217071, "epoch": 2615} {"train_loss": -24.40098762512207, "global_step": 217072, "epoch": 2615} {"train_loss": -24.51556968688965, "global_step": 217073, "epoch": 2615} {"train_loss": -24.533721923828125, "global_step": 217074, "epoch": 2615} {"train_loss": -24.53537368774414, "global_step": 217075, "epoch": 2615} {"train_loss": -24.63563346862793, "global_step": 217076, "epoch": 2615} {"train_loss": -24.48834800720215, "global_step": 217077, "epoch": 2615} {"train_loss": -24.40460777282715, "global_step": 217078, "epoch": 2615} {"train_loss": -24.815143585205078, "global_step": 217079, "epoch": 2615} {"train_loss": -24.76798439025879, "global_step": 217080, "epoch": 2615} {"train_loss": -24.601221084594727, "global_step": 217081, "epoch": 2615} {"train_loss": -24.332767486572266, "global_step": 217082, "epoch": 2615} {"train_loss": -24.369701385498047, "global_step": 217083, "epoch": 2615} {"train_loss": -24.758800506591797, "global_step": 217084, "epoch": 2615} {"train_loss": -24.597036361694336, "global_step": 217085, "epoch": 2615} {"train_loss": -24.442514419555664, "global_step": 217086, "epoch": 2615} {"train_loss": -24.639738082885742, "global_step": 217087, "epoch": 2615} {"train_loss": -24.05765151977539, "global_step": 217088, "epoch": 2615} {"train_loss": -24.633777618408203, "global_step": 217089, "epoch": 2615} {"train_loss": -24.444759368896484, "global_step": 217090, "epoch": 2615} {"train_loss": -24.53371238708496, "global_step": 217091, "epoch": 2615} {"train_loss": -24.13104248046875, "global_step": 217092, "epoch": 2615} {"train_loss": -24.626407623291016, "global_step": 217093, "epoch": 2615} {"train_loss": -24.434476852416992, "global_step": 217094, "epoch": 2615} {"train_loss": -24.505565643310547, "global_step": 217095, "epoch": 2615} {"train_loss": -24.649267196655273, "global_step": 217096, "epoch": 2615} {"train_loss": -24.126113891601562, "global_step": 217097, "epoch": 2615} {"train_loss": -24.612457275390625, "global_step": 217098, "epoch": 2615} {"train_loss": -24.5085391998291, "global_step": 217099, "epoch": 2615} {"train_loss": -24.44199562072754, "global_step": 217100, "epoch": 2615} {"train_loss": -24.6097469329834, "global_step": 217101, "epoch": 2615} {"train_loss": -24.641027450561523, "global_step": 217102, "epoch": 2615} {"train_loss": -24.596675872802734, "global_step": 217103, "epoch": 2615} {"train_loss": -24.244216918945312, "global_step": 217104, "epoch": 2615} {"train_loss": -24.569507598876953, "global_step": 217105, "epoch": 2615} {"train_loss": -24.403547286987305, "global_step": 217106, "epoch": 2615} {"train_loss": -24.580801010131836, "global_step": 217107, "epoch": 2615} {"train_loss": -24.49601173400879, "global_step": 217108, "epoch": 2615} {"train_loss": -24.70053482055664, "global_step": 217109, "epoch": 2615} {"train_loss": -24.85254669189453, "global_step": 217110, "epoch": 2615} {"train_loss": -24.628662109375, "global_step": 217111, "epoch": 2615} {"train_loss": -24.38960075378418, "global_step": 217112, "epoch": 2615} {"train_loss": -24.79901123046875, "global_step": 217113, "epoch": 2615} {"train_loss": -24.533039093017578, "global_step": 217114, "epoch": 2615} {"train_loss": -24.466398239135742, "global_step": 217115, "epoch": 2615} {"train_loss": -24.589569091796875, "global_step": 217116, "epoch": 2615} {"train_loss": -24.565980911254883, "global_step": 217117, "epoch": 2615} {"train_loss": -24.4813289642334, "global_step": 217118, "epoch": 2615} {"train_loss": -24.59787940979004, "global_step": 217119, "epoch": 2615} {"train_loss": -24.635587692260742, "global_step": 217120, "epoch": 2615} {"train_loss": -24.55620765686035, "global_step": 217121, "epoch": 2615} {"train_loss": -24.490751266479492, "global_step": 217122, "epoch": 2615} {"train_loss": -24.84522247314453, "global_step": 217123, "epoch": 2615} {"train_loss": -24.744380950927734, "global_step": 217124, "epoch": 2615} {"train_loss": -25.019336700439453, "global_step": 217125, "epoch": 2615} {"train_loss": -24.413528442382812, "global_step": 217126, "epoch": 2615} {"train_loss": -24.459772431706806, "global_step": 217127, "epoch": 2615, "val_loss": 6630141.0} {"train_loss": -24.147563934326172, "global_step": 217128, "epoch": 2616} {"train_loss": -24.760557174682617, "global_step": 217129, "epoch": 2616} {"train_loss": -24.49313735961914, "global_step": 217130, "epoch": 2616} {"train_loss": -23.90762710571289, "global_step": 217131, "epoch": 2616} {"train_loss": -24.024921417236328, "global_step": 217132, "epoch": 2616} {"train_loss": -24.28608512878418, "global_step": 217133, "epoch": 2616} {"train_loss": -23.97412872314453, "global_step": 217134, "epoch": 2616} {"train_loss": -24.329023361206055, "global_step": 217135, "epoch": 2616} {"train_loss": -24.242454528808594, "global_step": 217136, "epoch": 2616} {"train_loss": -24.048383712768555, "global_step": 217137, "epoch": 2616} {"train_loss": -24.468765258789062, "global_step": 217138, "epoch": 2616} {"train_loss": -24.54461669921875, "global_step": 217139, "epoch": 2616} {"train_loss": -24.57672119140625, "global_step": 217140, "epoch": 2616} {"train_loss": -24.433454513549805, "global_step": 217141, "epoch": 2616} {"train_loss": -24.405668258666992, "global_step": 217142, "epoch": 2616} {"train_loss": -24.705209732055664, "global_step": 217143, "epoch": 2616} {"train_loss": -24.1240177154541, "global_step": 217144, "epoch": 2616} {"train_loss": -24.619352340698242, "global_step": 217145, "epoch": 2616} {"train_loss": -24.183446884155273, "global_step": 217146, "epoch": 2616} {"train_loss": -24.476566314697266, "global_step": 217147, "epoch": 2616} {"train_loss": -24.21224594116211, "global_step": 217148, "epoch": 2616} {"train_loss": -24.36775016784668, "global_step": 217149, "epoch": 2616} {"train_loss": -24.39605712890625, "global_step": 217150, "epoch": 2616} {"train_loss": -24.56296157836914, "global_step": 217151, "epoch": 2616} {"train_loss": -24.191068649291992, "global_step": 217152, "epoch": 2616} {"train_loss": -24.52107810974121, "global_step": 217153, "epoch": 2616} {"train_loss": -24.60584831237793, "global_step": 217154, "epoch": 2616} {"train_loss": -24.491802215576172, "global_step": 217155, "epoch": 2616} {"train_loss": -24.76313591003418, "global_step": 217156, "epoch": 2616} {"train_loss": -24.358341217041016, "global_step": 217157, "epoch": 2616} {"train_loss": -24.546875, "global_step": 217158, "epoch": 2616} {"train_loss": -24.162221908569336, "global_step": 217159, "epoch": 2616} {"train_loss": -24.275909423828125, "global_step": 217160, "epoch": 2616} {"train_loss": -24.29731559753418, "global_step": 217161, "epoch": 2616} {"train_loss": -24.380155563354492, "global_step": 217162, "epoch": 2616} {"train_loss": -24.571569442749023, "global_step": 217163, "epoch": 2616} {"train_loss": -24.268545150756836, "global_step": 217164, "epoch": 2616} {"train_loss": -24.672286987304688, "global_step": 217165, "epoch": 2616} {"train_loss": -24.179122924804688, "global_step": 217166, "epoch": 2616} {"train_loss": -24.466976165771484, "global_step": 217167, "epoch": 2616} {"train_loss": -24.83428382873535, "global_step": 217168, "epoch": 2616} {"train_loss": -24.791229248046875, "global_step": 217169, "epoch": 2616} {"train_loss": -24.645288467407227, "global_step": 217170, "epoch": 2616} {"train_loss": -24.47812843322754, "global_step": 217171, "epoch": 2616} {"train_loss": -24.990955352783203, "global_step": 217172, "epoch": 2616} {"train_loss": -24.613561630249023, "global_step": 217173, "epoch": 2616} {"train_loss": -24.49777603149414, "global_step": 217174, "epoch": 2616} {"train_loss": -24.710514068603516, "global_step": 217175, "epoch": 2616} {"train_loss": -24.604455947875977, "global_step": 217176, "epoch": 2616} {"train_loss": -24.69835090637207, "global_step": 217177, "epoch": 2616} {"train_loss": -24.504959106445312, "global_step": 217178, "epoch": 2616} {"train_loss": -24.61256217956543, "global_step": 217179, "epoch": 2616} {"train_loss": -24.93207359313965, "global_step": 217180, "epoch": 2616} {"train_loss": -24.555728912353516, "global_step": 217181, "epoch": 2616} {"train_loss": -24.56207847595215, "global_step": 217182, "epoch": 2616} {"train_loss": -24.8402156829834, "global_step": 217183, "epoch": 2616} {"train_loss": -24.465595245361328, "global_step": 217184, "epoch": 2616} {"train_loss": -24.340726852416992, "global_step": 217185, "epoch": 2616} {"train_loss": -23.475112915039062, "global_step": 217186, "epoch": 2616} {"train_loss": -23.36957359313965, "global_step": 217187, "epoch": 2616} {"train_loss": -23.665128707885742, "global_step": 217188, "epoch": 2616} {"train_loss": -23.48774528503418, "global_step": 217189, "epoch": 2616} {"train_loss": -24.532804489135742, "global_step": 217190, "epoch": 2616} {"train_loss": -23.959609985351562, "global_step": 217191, "epoch": 2616} {"train_loss": -24.20869255065918, "global_step": 217192, "epoch": 2616} {"train_loss": -24.072818756103516, "global_step": 217193, "epoch": 2616} {"train_loss": -24.28383445739746, "global_step": 217194, "epoch": 2616} {"train_loss": -24.84922218322754, "global_step": 217195, "epoch": 2616} {"train_loss": -24.125436782836914, "global_step": 217196, "epoch": 2616} {"train_loss": -24.273778915405273, "global_step": 217197, "epoch": 2616} {"train_loss": -24.12680435180664, "global_step": 217198, "epoch": 2616} {"train_loss": -23.920944213867188, "global_step": 217199, "epoch": 2616} {"train_loss": -24.28140640258789, "global_step": 217200, "epoch": 2616} {"train_loss": -24.48610496520996, "global_step": 217201, "epoch": 2616} {"train_loss": -24.327919006347656, "global_step": 217202, "epoch": 2616} {"train_loss": -24.539342880249023, "global_step": 217203, "epoch": 2616} {"train_loss": -24.78510856628418, "global_step": 217204, "epoch": 2616} {"train_loss": -24.478818893432617, "global_step": 217205, "epoch": 2616} {"train_loss": -24.66664695739746, "global_step": 217206, "epoch": 2616} {"train_loss": -24.299488067626953, "global_step": 217207, "epoch": 2616} {"train_loss": -24.575946807861328, "global_step": 217208, "epoch": 2616} {"train_loss": -24.83806800842285, "global_step": 217209, "epoch": 2616} {"train_loss": -24.382321139416064, "global_step": 217210, "epoch": 2616, "val_loss": 6613566.0} {"train_loss": -24.235055923461914, "global_step": 217211, "epoch": 2617} {"train_loss": -24.186798095703125, "global_step": 217212, "epoch": 2617} {"train_loss": -24.42023277282715, "global_step": 217213, "epoch": 2617} {"train_loss": -24.236328125, "global_step": 217214, "epoch": 2617} {"train_loss": -24.22338104248047, "global_step": 217215, "epoch": 2617} {"train_loss": -24.690847396850586, "global_step": 217216, "epoch": 2617} {"train_loss": -24.438220977783203, "global_step": 217217, "epoch": 2617} {"train_loss": -24.42188262939453, "global_step": 217218, "epoch": 2617} {"train_loss": -24.551773071289062, "global_step": 217219, "epoch": 2617} {"train_loss": -24.474899291992188, "global_step": 217220, "epoch": 2617} {"train_loss": -24.168869018554688, "global_step": 217221, "epoch": 2617} {"train_loss": -24.34201431274414, "global_step": 217222, "epoch": 2617} {"train_loss": -24.489839553833008, "global_step": 217223, "epoch": 2617} {"train_loss": -24.331647872924805, "global_step": 217224, "epoch": 2617} {"train_loss": -24.104873657226562, "global_step": 217225, "epoch": 2617} {"train_loss": -24.680973052978516, "global_step": 217226, "epoch": 2617} {"train_loss": -24.778608322143555, "global_step": 217227, "epoch": 2617} {"train_loss": -24.467132568359375, "global_step": 217228, "epoch": 2617} {"train_loss": -24.999765396118164, "global_step": 217229, "epoch": 2617} {"train_loss": -24.490447998046875, "global_step": 217230, "epoch": 2617} {"train_loss": -24.3165225982666, "global_step": 217231, "epoch": 2617} {"train_loss": -24.779760360717773, "global_step": 217232, "epoch": 2617} {"train_loss": -23.94091796875, "global_step": 217233, "epoch": 2617} {"train_loss": -24.48663330078125, "global_step": 217234, "epoch": 2617} {"train_loss": -24.409887313842773, "global_step": 217235, "epoch": 2617} {"train_loss": -24.63338279724121, "global_step": 217236, "epoch": 2617} {"train_loss": -24.701683044433594, "global_step": 217237, "epoch": 2617} {"train_loss": -24.564701080322266, "global_step": 217238, "epoch": 2617} {"train_loss": -24.978120803833008, "global_step": 217239, "epoch": 2617} {"train_loss": -24.337125778198242, "global_step": 217240, "epoch": 2617} {"train_loss": -24.882644653320312, "global_step": 217241, "epoch": 2617} {"train_loss": -24.715768814086914, "global_step": 217242, "epoch": 2617} {"train_loss": -24.73931312561035, "global_step": 217243, "epoch": 2617} {"train_loss": -24.564884185791016, "global_step": 217244, "epoch": 2617} {"train_loss": -24.249345779418945, "global_step": 217245, "epoch": 2617} {"train_loss": -24.765535354614258, "global_step": 217246, "epoch": 2617} {"train_loss": -24.43520736694336, "global_step": 217247, "epoch": 2617} {"train_loss": -24.475317001342773, "global_step": 217248, "epoch": 2617} {"train_loss": -24.3839168548584, "global_step": 217249, "epoch": 2617} {"train_loss": -24.527774810791016, "global_step": 217250, "epoch": 2617} {"train_loss": -24.77290153503418, "global_step": 217251, "epoch": 2617} {"train_loss": -24.606571197509766, "global_step": 217252, "epoch": 2617} {"train_loss": -24.699234008789062, "global_step": 217253, "epoch": 2617} {"train_loss": -24.52185821533203, "global_step": 217254, "epoch": 2617} {"train_loss": -24.339765548706055, "global_step": 217255, "epoch": 2617} {"train_loss": -24.527822494506836, "global_step": 217256, "epoch": 2617} {"train_loss": -24.08756446838379, "global_step": 217257, "epoch": 2617} {"train_loss": -24.291757583618164, "global_step": 217258, "epoch": 2617} {"train_loss": -24.463178634643555, "global_step": 217259, "epoch": 2617} {"train_loss": -24.522857666015625, "global_step": 217260, "epoch": 2617} {"train_loss": -24.411460876464844, "global_step": 217261, "epoch": 2617} {"train_loss": -24.52150535583496, "global_step": 217262, "epoch": 2617} {"train_loss": -24.691129684448242, "global_step": 217263, "epoch": 2617} {"train_loss": -24.75678062438965, "global_step": 217264, "epoch": 2617} {"train_loss": -24.916885375976562, "global_step": 217265, "epoch": 2617} {"train_loss": -24.4049129486084, "global_step": 217266, "epoch": 2617} {"train_loss": -24.70661735534668, "global_step": 217267, "epoch": 2617} {"train_loss": -24.51127052307129, "global_step": 217268, "epoch": 2617} {"train_loss": -24.764617919921875, "global_step": 217269, "epoch": 2617} {"train_loss": -24.687307357788086, "global_step": 217270, "epoch": 2617} {"train_loss": -24.547931671142578, "global_step": 217271, "epoch": 2617} {"train_loss": -24.58917808532715, "global_step": 217272, "epoch": 2617} {"train_loss": -24.67061996459961, "global_step": 217273, "epoch": 2617} {"train_loss": -24.598358154296875, "global_step": 217274, "epoch": 2617} {"train_loss": -24.991178512573242, "global_step": 217275, "epoch": 2617} {"train_loss": -24.853487014770508, "global_step": 217276, "epoch": 2617} {"train_loss": -24.53035545349121, "global_step": 217277, "epoch": 2617} {"train_loss": -24.74973487854004, "global_step": 217278, "epoch": 2617} {"train_loss": -24.770431518554688, "global_step": 217279, "epoch": 2617} {"train_loss": -24.78633689880371, "global_step": 217280, "epoch": 2617} {"train_loss": -24.725080490112305, "global_step": 217281, "epoch": 2617} {"train_loss": -24.291513442993164, "global_step": 217282, "epoch": 2617} {"train_loss": -24.6866397857666, "global_step": 217283, "epoch": 2617} {"train_loss": -24.06959342956543, "global_step": 217284, "epoch": 2617} {"train_loss": -24.63396453857422, "global_step": 217285, "epoch": 2617} {"train_loss": -24.655569076538086, "global_step": 217286, "epoch": 2617} {"train_loss": -24.746158599853516, "global_step": 217287, "epoch": 2617} {"train_loss": -25.026052474975586, "global_step": 217288, "epoch": 2617} {"train_loss": -24.766910552978516, "global_step": 217289, "epoch": 2617} {"train_loss": -25.024633407592773, "global_step": 217290, "epoch": 2617} {"train_loss": -24.69367790222168, "global_step": 217291, "epoch": 2617} {"train_loss": -24.987258911132812, "global_step": 217292, "epoch": 2617} {"train_loss": -24.558636424053145, "global_step": 217293, "epoch": 2617, "val_loss": 6547518.0} {"train_loss": -24.105239868164062, "global_step": 217294, "epoch": 2618} {"train_loss": -23.949661254882812, "global_step": 217295, "epoch": 2618} {"train_loss": -24.16783332824707, "global_step": 217296, "epoch": 2618} {"train_loss": -24.442371368408203, "global_step": 217297, "epoch": 2618} {"train_loss": -24.115415573120117, "global_step": 217298, "epoch": 2618} {"train_loss": -24.172443389892578, "global_step": 217299, "epoch": 2618} {"train_loss": -24.329450607299805, "global_step": 217300, "epoch": 2618} {"train_loss": -24.0349063873291, "global_step": 217301, "epoch": 2618} {"train_loss": -24.527189254760742, "global_step": 217302, "epoch": 2618} {"train_loss": -24.921682357788086, "global_step": 217303, "epoch": 2618} {"train_loss": -24.29265022277832, "global_step": 217304, "epoch": 2618} {"train_loss": -24.264110565185547, "global_step": 217305, "epoch": 2618} {"train_loss": -24.25994873046875, "global_step": 217306, "epoch": 2618} {"train_loss": -24.081790924072266, "global_step": 217307, "epoch": 2618} {"train_loss": -24.352598190307617, "global_step": 217308, "epoch": 2618} {"train_loss": -24.331417083740234, "global_step": 217309, "epoch": 2618} {"train_loss": -24.438852310180664, "global_step": 217310, "epoch": 2618} {"train_loss": -24.513341903686523, "global_step": 217311, "epoch": 2618} {"train_loss": -24.606969833374023, "global_step": 217312, "epoch": 2618} {"train_loss": -24.51220703125, "global_step": 217313, "epoch": 2618} {"train_loss": -24.347305297851562, "global_step": 217314, "epoch": 2618} {"train_loss": -24.557523727416992, "global_step": 217315, "epoch": 2618} {"train_loss": -24.299163818359375, "global_step": 217316, "epoch": 2618} {"train_loss": -24.209436416625977, "global_step": 217317, "epoch": 2618} {"train_loss": -24.58195686340332, "global_step": 217318, "epoch": 2618} {"train_loss": -24.48129653930664, "global_step": 217319, "epoch": 2618} {"train_loss": -24.831026077270508, "global_step": 217320, "epoch": 2618} {"train_loss": -24.695798873901367, "global_step": 217321, "epoch": 2618} {"train_loss": -24.431900024414062, "global_step": 217322, "epoch": 2618} {"train_loss": -24.16901206970215, "global_step": 217323, "epoch": 2618} {"train_loss": -24.533720016479492, "global_step": 217324, "epoch": 2618} {"train_loss": -24.697614669799805, "global_step": 217325, "epoch": 2618} {"train_loss": -24.655179977416992, "global_step": 217326, "epoch": 2618} {"train_loss": -24.8200626373291, "global_step": 217327, "epoch": 2618} {"train_loss": -24.79726219177246, "global_step": 217328, "epoch": 2618} {"train_loss": -24.96613311767578, "global_step": 217329, "epoch": 2618} {"train_loss": -24.742328643798828, "global_step": 217330, "epoch": 2618} {"train_loss": -24.41901969909668, "global_step": 217331, "epoch": 2618} {"train_loss": -24.57822608947754, "global_step": 217332, "epoch": 2618} {"train_loss": -24.646039962768555, "global_step": 217333, "epoch": 2618} {"train_loss": -24.464567184448242, "global_step": 217334, "epoch": 2618} {"train_loss": -24.8197078704834, "global_step": 217335, "epoch": 2618} {"train_loss": -24.770715713500977, "global_step": 217336, "epoch": 2618} {"train_loss": -24.518312454223633, "global_step": 217337, "epoch": 2618} {"train_loss": -24.760671615600586, "global_step": 217338, "epoch": 2618} {"train_loss": -24.622163772583008, "global_step": 217339, "epoch": 2618} {"train_loss": -24.751028060913086, "global_step": 217340, "epoch": 2618} {"train_loss": -24.239151000976562, "global_step": 217341, "epoch": 2618} {"train_loss": -24.916522979736328, "global_step": 217342, "epoch": 2618} {"train_loss": -24.45796012878418, "global_step": 217343, "epoch": 2618} {"train_loss": -24.906286239624023, "global_step": 217344, "epoch": 2618} {"train_loss": -24.896163940429688, "global_step": 217345, "epoch": 2618} {"train_loss": -24.55765724182129, "global_step": 217346, "epoch": 2618} {"train_loss": -24.52582359313965, "global_step": 217347, "epoch": 2618} {"train_loss": -24.748037338256836, "global_step": 217348, "epoch": 2618} {"train_loss": -24.65607261657715, "global_step": 217349, "epoch": 2618} {"train_loss": -24.789831161499023, "global_step": 217350, "epoch": 2618} {"train_loss": -24.757497787475586, "global_step": 217351, "epoch": 2618} {"train_loss": -24.407684326171875, "global_step": 217352, "epoch": 2618} {"train_loss": -24.840330123901367, "global_step": 217353, "epoch": 2618} {"train_loss": -24.684690475463867, "global_step": 217354, "epoch": 2618} {"train_loss": -24.730735778808594, "global_step": 217355, "epoch": 2618} {"train_loss": -24.574033737182617, "global_step": 217356, "epoch": 2618} {"train_loss": -25.03098487854004, "global_step": 217357, "epoch": 2618} {"train_loss": -24.582040786743164, "global_step": 217358, "epoch": 2618} {"train_loss": -24.66205406188965, "global_step": 217359, "epoch": 2618} {"train_loss": -25.063142776489258, "global_step": 217360, "epoch": 2618} {"train_loss": -24.876436233520508, "global_step": 217361, "epoch": 2618} {"train_loss": -24.584264755249023, "global_step": 217362, "epoch": 2618} {"train_loss": -24.693838119506836, "global_step": 217363, "epoch": 2618} {"train_loss": -24.35797119140625, "global_step": 217364, "epoch": 2618} {"train_loss": -24.568723678588867, "global_step": 217365, "epoch": 2618} {"train_loss": -24.16547966003418, "global_step": 217366, "epoch": 2618} {"train_loss": -24.627073287963867, "global_step": 217367, "epoch": 2618} {"train_loss": -25.194726943969727, "global_step": 217368, "epoch": 2618} {"train_loss": -24.81468391418457, "global_step": 217369, "epoch": 2618} {"train_loss": -24.662015914916992, "global_step": 217370, "epoch": 2618} {"train_loss": -24.398168563842773, "global_step": 217371, "epoch": 2618} {"train_loss": -24.53618812561035, "global_step": 217372, "epoch": 2618} {"train_loss": -24.654569625854492, "global_step": 217373, "epoch": 2618} {"train_loss": -24.58320426940918, "global_step": 217374, "epoch": 2618} {"train_loss": -24.815954208374023, "global_step": 217375, "epoch": 2618} {"train_loss": -24.560216214283404, "global_step": 217376, "epoch": 2618, "val_loss": 6701142.0} {"train_loss": -24.080493927001953, "global_step": 217377, "epoch": 2619} {"train_loss": -24.00135612487793, "global_step": 217378, "epoch": 2619} {"train_loss": -24.528573989868164, "global_step": 217379, "epoch": 2619} {"train_loss": -23.756088256835938, "global_step": 217380, "epoch": 2619} {"train_loss": -24.132638931274414, "global_step": 217381, "epoch": 2619} {"train_loss": -23.938823699951172, "global_step": 217382, "epoch": 2619} {"train_loss": -23.943187713623047, "global_step": 217383, "epoch": 2619} {"train_loss": -24.05751609802246, "global_step": 217384, "epoch": 2619} {"train_loss": -24.199800491333008, "global_step": 217385, "epoch": 2619} {"train_loss": -24.382041931152344, "global_step": 217386, "epoch": 2619} {"train_loss": -23.84385871887207, "global_step": 217387, "epoch": 2619} {"train_loss": -24.006807327270508, "global_step": 217388, "epoch": 2619} {"train_loss": -24.03719139099121, "global_step": 217389, "epoch": 2619} {"train_loss": -24.305580139160156, "global_step": 217390, "epoch": 2619} {"train_loss": -24.368762969970703, "global_step": 217391, "epoch": 2619} {"train_loss": -23.9207763671875, "global_step": 217392, "epoch": 2619} {"train_loss": -24.257524490356445, "global_step": 217393, "epoch": 2619} {"train_loss": -24.259828567504883, "global_step": 217394, "epoch": 2619} {"train_loss": -24.42563819885254, "global_step": 217395, "epoch": 2619} {"train_loss": -24.01755714416504, "global_step": 217396, "epoch": 2619} {"train_loss": -24.485897064208984, "global_step": 217397, "epoch": 2619} {"train_loss": -23.996929168701172, "global_step": 217398, "epoch": 2619} {"train_loss": -24.490198135375977, "global_step": 217399, "epoch": 2619} {"train_loss": -24.499248504638672, "global_step": 217400, "epoch": 2619} {"train_loss": -24.26019287109375, "global_step": 217401, "epoch": 2619} {"train_loss": -24.177465438842773, "global_step": 217402, "epoch": 2619} {"train_loss": -24.31211280822754, "global_step": 217403, "epoch": 2619} {"train_loss": -24.26422119140625, "global_step": 217404, "epoch": 2619} {"train_loss": -24.92826271057129, "global_step": 217405, "epoch": 2619} {"train_loss": -24.271930694580078, "global_step": 217406, "epoch": 2619} {"train_loss": -24.281005859375, "global_step": 217407, "epoch": 2619} {"train_loss": -24.4368896484375, "global_step": 217408, "epoch": 2619} {"train_loss": -24.525022506713867, "global_step": 217409, "epoch": 2619} {"train_loss": -24.630361557006836, "global_step": 217410, "epoch": 2619} {"train_loss": -24.396343231201172, "global_step": 217411, "epoch": 2619} {"train_loss": -24.51161766052246, "global_step": 217412, "epoch": 2619} {"train_loss": -24.442733764648438, "global_step": 217413, "epoch": 2619} {"train_loss": -24.591264724731445, "global_step": 217414, "epoch": 2619} {"train_loss": -24.417463302612305, "global_step": 217415, "epoch": 2619} {"train_loss": -24.366003036499023, "global_step": 217416, "epoch": 2619} {"train_loss": -24.743316650390625, "global_step": 217417, "epoch": 2619} {"train_loss": -24.423566818237305, "global_step": 217418, "epoch": 2619} {"train_loss": -24.32588768005371, "global_step": 217419, "epoch": 2619} {"train_loss": -24.61775016784668, "global_step": 217420, "epoch": 2619} {"train_loss": -24.6755428314209, "global_step": 217421, "epoch": 2619} {"train_loss": -24.360998153686523, "global_step": 217422, "epoch": 2619} {"train_loss": -24.416269302368164, "global_step": 217423, "epoch": 2619} {"train_loss": -24.744943618774414, "global_step": 217424, "epoch": 2619} {"train_loss": -24.518136978149414, "global_step": 217425, "epoch": 2619} {"train_loss": -24.32390594482422, "global_step": 217426, "epoch": 2619} {"train_loss": -24.74898338317871, "global_step": 217427, "epoch": 2619} {"train_loss": -24.577648162841797, "global_step": 217428, "epoch": 2619} {"train_loss": -24.412757873535156, "global_step": 217429, "epoch": 2619} {"train_loss": -24.713106155395508, "global_step": 217430, "epoch": 2619} {"train_loss": -24.732986450195312, "global_step": 217431, "epoch": 2619} {"train_loss": -24.85519790649414, "global_step": 217432, "epoch": 2619} {"train_loss": -24.696823120117188, "global_step": 217433, "epoch": 2619} {"train_loss": -24.69427490234375, "global_step": 217434, "epoch": 2619} {"train_loss": -24.8881893157959, "global_step": 217435, "epoch": 2619} {"train_loss": -24.986621856689453, "global_step": 217436, "epoch": 2619} {"train_loss": -24.629587173461914, "global_step": 217437, "epoch": 2619} {"train_loss": -24.556745529174805, "global_step": 217438, "epoch": 2619} {"train_loss": -24.433027267456055, "global_step": 217439, "epoch": 2619} {"train_loss": -24.412351608276367, "global_step": 217440, "epoch": 2619} {"train_loss": -24.13193702697754, "global_step": 217441, "epoch": 2619} {"train_loss": -24.686447143554688, "global_step": 217442, "epoch": 2619} {"train_loss": -23.96953582763672, "global_step": 217443, "epoch": 2619} {"train_loss": -24.403615951538086, "global_step": 217444, "epoch": 2619} {"train_loss": -24.63286781311035, "global_step": 217445, "epoch": 2619} {"train_loss": -24.222761154174805, "global_step": 217446, "epoch": 2619} {"train_loss": -24.157068252563477, "global_step": 217447, "epoch": 2619} {"train_loss": -24.641992568969727, "global_step": 217448, "epoch": 2619} {"train_loss": -24.931455612182617, "global_step": 217449, "epoch": 2619} {"train_loss": -24.603418350219727, "global_step": 217450, "epoch": 2619} {"train_loss": -24.56146240234375, "global_step": 217451, "epoch": 2619} {"train_loss": -24.655920028686523, "global_step": 217452, "epoch": 2619} {"train_loss": -24.5628604888916, "global_step": 217453, "epoch": 2619} {"train_loss": -24.484067916870117, "global_step": 217454, "epoch": 2619} {"train_loss": -24.597776412963867, "global_step": 217455, "epoch": 2619} {"train_loss": -24.393390655517578, "global_step": 217456, "epoch": 2619} {"train_loss": -24.4967041015625, "global_step": 217457, "epoch": 2619} {"train_loss": -24.71274757385254, "global_step": 217458, "epoch": 2619} {"train_loss": -24.41445989493864, "global_step": 217459, "epoch": 2619, "val_loss": 6628831.0} {"train_loss": -24.11921501159668, "global_step": 217460, "epoch": 2620} {"train_loss": -24.415483474731445, "global_step": 217461, "epoch": 2620} {"train_loss": -23.93116569519043, "global_step": 217462, "epoch": 2620} {"train_loss": -24.142230987548828, "global_step": 217463, "epoch": 2620} {"train_loss": -24.177518844604492, "global_step": 217464, "epoch": 2620} {"train_loss": -24.324560165405273, "global_step": 217465, "epoch": 2620} {"train_loss": -24.300146102905273, "global_step": 217466, "epoch": 2620} {"train_loss": -24.349401473999023, "global_step": 217467, "epoch": 2620} {"train_loss": -24.31297492980957, "global_step": 217468, "epoch": 2620} {"train_loss": -24.150197982788086, "global_step": 217469, "epoch": 2620} {"train_loss": -24.806936264038086, "global_step": 217470, "epoch": 2620} {"train_loss": -24.251562118530273, "global_step": 217471, "epoch": 2620} {"train_loss": -24.4290828704834, "global_step": 217472, "epoch": 2620} {"train_loss": -24.46829605102539, "global_step": 217473, "epoch": 2620} {"train_loss": -24.354339599609375, "global_step": 217474, "epoch": 2620} {"train_loss": -24.668394088745117, "global_step": 217475, "epoch": 2620} {"train_loss": -24.39893341064453, "global_step": 217476, "epoch": 2620} {"train_loss": -24.516071319580078, "global_step": 217477, "epoch": 2620} {"train_loss": -24.452835083007812, "global_step": 217478, "epoch": 2620} {"train_loss": -24.72430419921875, "global_step": 217479, "epoch": 2620} {"train_loss": -24.37452507019043, "global_step": 217480, "epoch": 2620} {"train_loss": -24.630983352661133, "global_step": 217481, "epoch": 2620} {"train_loss": -24.35169792175293, "global_step": 217482, "epoch": 2620} {"train_loss": -24.22145652770996, "global_step": 217483, "epoch": 2620} {"train_loss": -24.416526794433594, "global_step": 217484, "epoch": 2620} {"train_loss": -24.378555297851562, "global_step": 217485, "epoch": 2620} {"train_loss": -24.384719848632812, "global_step": 217486, "epoch": 2620} {"train_loss": -24.620283126831055, "global_step": 217487, "epoch": 2620} {"train_loss": -24.415836334228516, "global_step": 217488, "epoch": 2620} {"train_loss": -24.532691955566406, "global_step": 217489, "epoch": 2620} {"train_loss": -24.3312931060791, "global_step": 217490, "epoch": 2620} {"train_loss": -24.74790382385254, "global_step": 217491, "epoch": 2620} {"train_loss": -24.685558319091797, "global_step": 217492, "epoch": 2620} {"train_loss": -24.3083553314209, "global_step": 217493, "epoch": 2620} {"train_loss": -24.8560848236084, "global_step": 217494, "epoch": 2620} {"train_loss": -24.611225128173828, "global_step": 217495, "epoch": 2620} {"train_loss": -24.496824264526367, "global_step": 217496, "epoch": 2620} {"train_loss": -24.617298126220703, "global_step": 217497, "epoch": 2620} {"train_loss": -24.473602294921875, "global_step": 217498, "epoch": 2620} {"train_loss": -24.42755699157715, "global_step": 217499, "epoch": 2620} {"train_loss": -24.533191680908203, "global_step": 217500, "epoch": 2620} {"train_loss": -25.1275577545166, "global_step": 217501, "epoch": 2620} {"train_loss": -24.61787223815918, "global_step": 217502, "epoch": 2620} {"train_loss": -24.650192260742188, "global_step": 217503, "epoch": 2620} {"train_loss": -24.370145797729492, "global_step": 217504, "epoch": 2620} {"train_loss": -24.814321517944336, "global_step": 217505, "epoch": 2620} {"train_loss": -24.3103084564209, "global_step": 217506, "epoch": 2620} {"train_loss": -24.798568725585938, "global_step": 217507, "epoch": 2620} {"train_loss": -24.66204833984375, "global_step": 217508, "epoch": 2620} {"train_loss": -24.64020347595215, "global_step": 217509, "epoch": 2620} {"train_loss": -24.485980987548828, "global_step": 217510, "epoch": 2620} {"train_loss": -24.927698135375977, "global_step": 217511, "epoch": 2620} {"train_loss": -25.208465576171875, "global_step": 217512, "epoch": 2620} {"train_loss": -24.736473083496094, "global_step": 217513, "epoch": 2620} {"train_loss": -24.8233642578125, "global_step": 217514, "epoch": 2620} {"train_loss": -24.72493553161621, "global_step": 217515, "epoch": 2620} {"train_loss": -24.751070022583008, "global_step": 217516, "epoch": 2620} {"train_loss": -24.51802635192871, "global_step": 217517, "epoch": 2620} {"train_loss": -24.5389347076416, "global_step": 217518, "epoch": 2620} {"train_loss": -24.468772888183594, "global_step": 217519, "epoch": 2620} {"train_loss": -24.4429931640625, "global_step": 217520, "epoch": 2620} {"train_loss": -24.825170516967773, "global_step": 217521, "epoch": 2620} {"train_loss": -24.351850509643555, "global_step": 217522, "epoch": 2620} {"train_loss": -24.78948402404785, "global_step": 217523, "epoch": 2620} {"train_loss": -24.21590232849121, "global_step": 217524, "epoch": 2620} {"train_loss": -24.720312118530273, "global_step": 217525, "epoch": 2620} {"train_loss": -24.78858757019043, "global_step": 217526, "epoch": 2620} {"train_loss": -24.697980880737305, "global_step": 217527, "epoch": 2620} {"train_loss": -24.56728172302246, "global_step": 217528, "epoch": 2620} {"train_loss": -24.36014747619629, "global_step": 217529, "epoch": 2620} {"train_loss": -24.451629638671875, "global_step": 217530, "epoch": 2620} {"train_loss": -24.583181381225586, "global_step": 217531, "epoch": 2620} {"train_loss": -24.63230323791504, "global_step": 217532, "epoch": 2620} {"train_loss": -24.771942138671875, "global_step": 217533, "epoch": 2620} {"train_loss": -24.551387786865234, "global_step": 217534, "epoch": 2620} {"train_loss": -24.36152458190918, "global_step": 217535, "epoch": 2620} {"train_loss": -24.330230712890625, "global_step": 217536, "epoch": 2620} {"train_loss": -24.118650436401367, "global_step": 217537, "epoch": 2620} {"train_loss": -24.811382293701172, "global_step": 217538, "epoch": 2620} {"train_loss": -24.327884674072266, "global_step": 217539, "epoch": 2620} {"train_loss": -24.08487319946289, "global_step": 217540, "epoch": 2620} {"train_loss": -24.399147033691406, "global_step": 217541, "epoch": 2620} {"train_loss": -24.494162938680994, "global_step": 217542, "epoch": 2620, "val_loss": 6641829.0} {"train_loss": -24.269018173217773, "global_step": 217543, "epoch": 2621} {"train_loss": -23.903074264526367, "global_step": 217544, "epoch": 2621} {"train_loss": -23.666770935058594, "global_step": 217545, "epoch": 2621} {"train_loss": -23.631423950195312, "global_step": 217546, "epoch": 2621} {"train_loss": -24.455039978027344, "global_step": 217547, "epoch": 2621} {"train_loss": -23.7222957611084, "global_step": 217548, "epoch": 2621} {"train_loss": -23.478235244750977, "global_step": 217549, "epoch": 2621} {"train_loss": -23.907556533813477, "global_step": 217550, "epoch": 2621} {"train_loss": -24.03998565673828, "global_step": 217551, "epoch": 2621} {"train_loss": -24.046279907226562, "global_step": 217552, "epoch": 2621} {"train_loss": -24.24571418762207, "global_step": 217553, "epoch": 2621} {"train_loss": -23.732481002807617, "global_step": 217554, "epoch": 2621} {"train_loss": -24.024686813354492, "global_step": 217555, "epoch": 2621} {"train_loss": -23.52012062072754, "global_step": 217556, "epoch": 2621} {"train_loss": -24.453872680664062, "global_step": 217557, "epoch": 2621} {"train_loss": -24.141386032104492, "global_step": 217558, "epoch": 2621} {"train_loss": -23.98194694519043, "global_step": 217559, "epoch": 2621} {"train_loss": -24.1505126953125, "global_step": 217560, "epoch": 2621} {"train_loss": -24.373228073120117, "global_step": 217561, "epoch": 2621} {"train_loss": -24.158559799194336, "global_step": 217562, "epoch": 2621} {"train_loss": -24.411754608154297, "global_step": 217563, "epoch": 2621} {"train_loss": -23.896352767944336, "global_step": 217564, "epoch": 2621} {"train_loss": -24.377286911010742, "global_step": 217565, "epoch": 2621} {"train_loss": -24.224924087524414, "global_step": 217566, "epoch": 2621} {"train_loss": -24.531375885009766, "global_step": 217567, "epoch": 2621} {"train_loss": -23.988035202026367, "global_step": 217568, "epoch": 2621} {"train_loss": -24.173398971557617, "global_step": 217569, "epoch": 2621} {"train_loss": -24.366376876831055, "global_step": 217570, "epoch": 2621} {"train_loss": -24.653409957885742, "global_step": 217571, "epoch": 2621} {"train_loss": -24.387680053710938, "global_step": 217572, "epoch": 2621} {"train_loss": -24.600421905517578, "global_step": 217573, "epoch": 2621} {"train_loss": -24.395620346069336, "global_step": 217574, "epoch": 2621} {"train_loss": -24.548446655273438, "global_step": 217575, "epoch": 2621} {"train_loss": -24.0578670501709, "global_step": 217576, "epoch": 2621} {"train_loss": -24.50715446472168, "global_step": 217577, "epoch": 2621} {"train_loss": -24.578489303588867, "global_step": 217578, "epoch": 2621} {"train_loss": -24.489816665649414, "global_step": 217579, "epoch": 2621} {"train_loss": -24.32880210876465, "global_step": 217580, "epoch": 2621} {"train_loss": -24.23886489868164, "global_step": 217581, "epoch": 2621} {"train_loss": -24.45419692993164, "global_step": 217582, "epoch": 2621} {"train_loss": -24.287351608276367, "global_step": 217583, "epoch": 2621} {"train_loss": -24.203121185302734, "global_step": 217584, "epoch": 2621} {"train_loss": -24.263065338134766, "global_step": 217585, "epoch": 2621} {"train_loss": -24.653589248657227, "global_step": 217586, "epoch": 2621} {"train_loss": -24.327951431274414, "global_step": 217587, "epoch": 2621} {"train_loss": -25.017906188964844, "global_step": 217588, "epoch": 2621} {"train_loss": -24.188690185546875, "global_step": 217589, "epoch": 2621} {"train_loss": -24.60747718811035, "global_step": 217590, "epoch": 2621} {"train_loss": -24.613330841064453, "global_step": 217591, "epoch": 2621} {"train_loss": -24.50018882751465, "global_step": 217592, "epoch": 2621} {"train_loss": -24.406705856323242, "global_step": 217593, "epoch": 2621} {"train_loss": -24.825178146362305, "global_step": 217594, "epoch": 2621} {"train_loss": -24.700746536254883, "global_step": 217595, "epoch": 2621} {"train_loss": -24.18939781188965, "global_step": 217596, "epoch": 2621} {"train_loss": -24.86631965637207, "global_step": 217597, "epoch": 2621} {"train_loss": -24.53798484802246, "global_step": 217598, "epoch": 2621} {"train_loss": -24.676076889038086, "global_step": 217599, "epoch": 2621} {"train_loss": -24.638994216918945, "global_step": 217600, "epoch": 2621} {"train_loss": -24.981037139892578, "global_step": 217601, "epoch": 2621} {"train_loss": -24.53485679626465, "global_step": 217602, "epoch": 2621} {"train_loss": -24.610610961914062, "global_step": 217603, "epoch": 2621} {"train_loss": -24.356159210205078, "global_step": 217604, "epoch": 2621} {"train_loss": -24.647764205932617, "global_step": 217605, "epoch": 2621} {"train_loss": -24.50898551940918, "global_step": 217606, "epoch": 2621} {"train_loss": -24.260217666625977, "global_step": 217607, "epoch": 2621} {"train_loss": -24.76025390625, "global_step": 217608, "epoch": 2621} {"train_loss": -24.431650161743164, "global_step": 217609, "epoch": 2621} {"train_loss": -24.863195419311523, "global_step": 217610, "epoch": 2621} {"train_loss": -24.374513626098633, "global_step": 217611, "epoch": 2621} {"train_loss": -24.480077743530273, "global_step": 217612, "epoch": 2621} {"train_loss": -24.617862701416016, "global_step": 217613, "epoch": 2621} {"train_loss": -24.381093978881836, "global_step": 217614, "epoch": 2621} {"train_loss": -25.081247329711914, "global_step": 217615, "epoch": 2621} {"train_loss": -24.802200317382812, "global_step": 217616, "epoch": 2621} {"train_loss": -24.56449317932129, "global_step": 217617, "epoch": 2621} {"train_loss": -24.01089096069336, "global_step": 217618, "epoch": 2621} {"train_loss": -24.460399627685547, "global_step": 217619, "epoch": 2621} {"train_loss": -24.582950592041016, "global_step": 217620, "epoch": 2621} {"train_loss": -24.428638458251953, "global_step": 217621, "epoch": 2621} {"train_loss": -24.537744522094727, "global_step": 217622, "epoch": 2621} {"train_loss": -24.696271896362305, "global_step": 217623, "epoch": 2621} {"train_loss": -24.703367233276367, "global_step": 217624, "epoch": 2621} {"train_loss": -24.370171696306713, "global_step": 217625, "epoch": 2621, "val_loss": 6601703.0} {"train_loss": -24.23299217224121, "global_step": 217626, "epoch": 2622} {"train_loss": -23.99833106994629, "global_step": 217627, "epoch": 2622} {"train_loss": -24.0888671875, "global_step": 217628, "epoch": 2622} {"train_loss": -24.176637649536133, "global_step": 217629, "epoch": 2622} {"train_loss": -24.460336685180664, "global_step": 217630, "epoch": 2622} {"train_loss": -24.379302978515625, "global_step": 217631, "epoch": 2622} {"train_loss": -24.132200241088867, "global_step": 217632, "epoch": 2622} {"train_loss": -24.522357940673828, "global_step": 217633, "epoch": 2622} {"train_loss": -24.140457153320312, "global_step": 217634, "epoch": 2622} {"train_loss": -24.195158004760742, "global_step": 217635, "epoch": 2622} {"train_loss": -24.17457389831543, "global_step": 217636, "epoch": 2622} {"train_loss": -24.41131019592285, "global_step": 217637, "epoch": 2622} {"train_loss": -24.376728057861328, "global_step": 217638, "epoch": 2622} {"train_loss": -24.166854858398438, "global_step": 217639, "epoch": 2622} {"train_loss": -24.52183723449707, "global_step": 217640, "epoch": 2622} {"train_loss": -24.595067977905273, "global_step": 217641, "epoch": 2622} {"train_loss": -24.390335083007812, "global_step": 217642, "epoch": 2622} {"train_loss": -23.74358558654785, "global_step": 217643, "epoch": 2622} {"train_loss": -24.442276000976562, "global_step": 217644, "epoch": 2622} {"train_loss": -24.459623336791992, "global_step": 217645, "epoch": 2622} {"train_loss": -24.2771053314209, "global_step": 217646, "epoch": 2622} {"train_loss": -24.325929641723633, "global_step": 217647, "epoch": 2622} {"train_loss": -24.146472930908203, "global_step": 217648, "epoch": 2622} {"train_loss": -24.251697540283203, "global_step": 217649, "epoch": 2622} {"train_loss": -24.679346084594727, "global_step": 217650, "epoch": 2622} {"train_loss": -24.47310447692871, "global_step": 217651, "epoch": 2622} {"train_loss": -24.45637321472168, "global_step": 217652, "epoch": 2622} {"train_loss": -24.078800201416016, "global_step": 217653, "epoch": 2622} {"train_loss": -24.367450714111328, "global_step": 217654, "epoch": 2622} {"train_loss": -24.11636734008789, "global_step": 217655, "epoch": 2622} {"train_loss": -24.2508602142334, "global_step": 217656, "epoch": 2622} {"train_loss": -24.380735397338867, "global_step": 217657, "epoch": 2622} {"train_loss": -23.94126319885254, "global_step": 217658, "epoch": 2622} {"train_loss": -24.151283264160156, "global_step": 217659, "epoch": 2622} {"train_loss": -24.227602005004883, "global_step": 217660, "epoch": 2622} {"train_loss": -24.255380630493164, "global_step": 217661, "epoch": 2622} {"train_loss": -24.413442611694336, "global_step": 217662, "epoch": 2622} {"train_loss": -24.23417091369629, "global_step": 217663, "epoch": 2622} {"train_loss": -23.69209098815918, "global_step": 217664, "epoch": 2622} {"train_loss": -24.48365592956543, "global_step": 217665, "epoch": 2622} {"train_loss": -24.386545181274414, "global_step": 217666, "epoch": 2622} {"train_loss": -24.070520401000977, "global_step": 217667, "epoch": 2622} {"train_loss": -24.907567977905273, "global_step": 217668, "epoch": 2622} {"train_loss": -24.444931030273438, "global_step": 217669, "epoch": 2622} {"train_loss": -24.34132957458496, "global_step": 217670, "epoch": 2622} {"train_loss": -24.102603912353516, "global_step": 217671, "epoch": 2622} {"train_loss": -24.42954444885254, "global_step": 217672, "epoch": 2622} {"train_loss": -24.44602394104004, "global_step": 217673, "epoch": 2622} {"train_loss": -24.237491607666016, "global_step": 217674, "epoch": 2622} {"train_loss": -24.326826095581055, "global_step": 217675, "epoch": 2622} {"train_loss": -24.19326400756836, "global_step": 217676, "epoch": 2622} {"train_loss": -24.41318130493164, "global_step": 217677, "epoch": 2622} {"train_loss": -24.84981346130371, "global_step": 217678, "epoch": 2622} {"train_loss": -24.328723907470703, "global_step": 217679, "epoch": 2622} {"train_loss": -24.15251922607422, "global_step": 217680, "epoch": 2622} {"train_loss": -24.84751319885254, "global_step": 217681, "epoch": 2622} {"train_loss": -24.521024703979492, "global_step": 217682, "epoch": 2622} {"train_loss": -24.716331481933594, "global_step": 217683, "epoch": 2622} {"train_loss": -24.60103988647461, "global_step": 217684, "epoch": 2622} {"train_loss": -24.878286361694336, "global_step": 217685, "epoch": 2622} {"train_loss": -24.652809143066406, "global_step": 217686, "epoch": 2622} {"train_loss": -24.962553024291992, "global_step": 217687, "epoch": 2622} {"train_loss": -24.489822387695312, "global_step": 217688, "epoch": 2622} {"train_loss": -24.72541618347168, "global_step": 217689, "epoch": 2622} {"train_loss": -24.892417907714844, "global_step": 217690, "epoch": 2622} {"train_loss": -24.740873336791992, "global_step": 217691, "epoch": 2622} {"train_loss": -24.582304000854492, "global_step": 217692, "epoch": 2622} {"train_loss": -24.66025733947754, "global_step": 217693, "epoch": 2622} {"train_loss": -24.3963680267334, "global_step": 217694, "epoch": 2622} {"train_loss": -24.782638549804688, "global_step": 217695, "epoch": 2622} {"train_loss": -25.275075912475586, "global_step": 217696, "epoch": 2622} {"train_loss": -24.74651336669922, "global_step": 217697, "epoch": 2622} {"train_loss": -24.389541625976562, "global_step": 217698, "epoch": 2622} {"train_loss": -24.751298904418945, "global_step": 217699, "epoch": 2622} {"train_loss": -24.677623748779297, "global_step": 217700, "epoch": 2622} {"train_loss": -25.1354923248291, "global_step": 217701, "epoch": 2622} {"train_loss": -24.617969512939453, "global_step": 217702, "epoch": 2622} {"train_loss": -24.856779098510742, "global_step": 217703, "epoch": 2622} {"train_loss": -24.61895751953125, "global_step": 217704, "epoch": 2622} {"train_loss": -24.491491317749023, "global_step": 217705, "epoch": 2622} {"train_loss": -24.31385040283203, "global_step": 217706, "epoch": 2622} {"train_loss": -24.434680938720703, "global_step": 217707, "epoch": 2622} {"train_loss": -24.451620308749646, "global_step": 217708, "epoch": 2622, "val_loss": 6642241.0} {"train_loss": -22.94095802307129, "global_step": 217709, "epoch": 2623} {"train_loss": -21.236005783081055, "global_step": 217710, "epoch": 2623} {"train_loss": -22.468875885009766, "global_step": 217711, "epoch": 2623} {"train_loss": -23.740888595581055, "global_step": 217712, "epoch": 2623} {"train_loss": -23.48398208618164, "global_step": 217713, "epoch": 2623} {"train_loss": -23.995681762695312, "global_step": 217714, "epoch": 2623} {"train_loss": -23.638978958129883, "global_step": 217715, "epoch": 2623} {"train_loss": -23.74428367614746, "global_step": 217716, "epoch": 2623} {"train_loss": -24.367538452148438, "global_step": 217717, "epoch": 2623} {"train_loss": -24.050582885742188, "global_step": 217718, "epoch": 2623} {"train_loss": -24.121435165405273, "global_step": 217719, "epoch": 2623} {"train_loss": -23.62567138671875, "global_step": 217720, "epoch": 2623} {"train_loss": -23.813566207885742, "global_step": 217721, "epoch": 2623} {"train_loss": -23.92302131652832, "global_step": 217722, "epoch": 2623} {"train_loss": -23.608610153198242, "global_step": 217723, "epoch": 2623} {"train_loss": -24.106386184692383, "global_step": 217724, "epoch": 2623} {"train_loss": -24.266050338745117, "global_step": 217725, "epoch": 2623} {"train_loss": -23.775787353515625, "global_step": 217726, "epoch": 2623} {"train_loss": -24.214908599853516, "global_step": 217727, "epoch": 2623} {"train_loss": -24.302343368530273, "global_step": 217728, "epoch": 2623} {"train_loss": -24.211881637573242, "global_step": 217729, "epoch": 2623} {"train_loss": -24.24906349182129, "global_step": 217730, "epoch": 2623} {"train_loss": -24.047941207885742, "global_step": 217731, "epoch": 2623} {"train_loss": -24.314090728759766, "global_step": 217732, "epoch": 2623} {"train_loss": -24.27665138244629, "global_step": 217733, "epoch": 2623} {"train_loss": -24.341360092163086, "global_step": 217734, "epoch": 2623} {"train_loss": -24.30717658996582, "global_step": 217735, "epoch": 2623} {"train_loss": -24.46491813659668, "global_step": 217736, "epoch": 2623} {"train_loss": -24.14480972290039, "global_step": 217737, "epoch": 2623} {"train_loss": -24.455053329467773, "global_step": 217738, "epoch": 2623} {"train_loss": -24.582853317260742, "global_step": 217739, "epoch": 2623} {"train_loss": -24.044092178344727, "global_step": 217740, "epoch": 2623} {"train_loss": -24.600263595581055, "global_step": 217741, "epoch": 2623} {"train_loss": -24.441612243652344, "global_step": 217742, "epoch": 2623} {"train_loss": -24.3522891998291, "global_step": 217743, "epoch": 2623} {"train_loss": -24.285959243774414, "global_step": 217744, "epoch": 2623} {"train_loss": -24.521636962890625, "global_step": 217745, "epoch": 2623} {"train_loss": -24.566776275634766, "global_step": 217746, "epoch": 2623} {"train_loss": -24.4210147857666, "global_step": 217747, "epoch": 2623} {"train_loss": -24.389629364013672, "global_step": 217748, "epoch": 2623} {"train_loss": -24.58957862854004, "global_step": 217749, "epoch": 2623} {"train_loss": -24.62732696533203, "global_step": 217750, "epoch": 2623} {"train_loss": -24.28410530090332, "global_step": 217751, "epoch": 2623} {"train_loss": -24.631019592285156, "global_step": 217752, "epoch": 2623} {"train_loss": -24.57265281677246, "global_step": 217753, "epoch": 2623} {"train_loss": -24.642805099487305, "global_step": 217754, "epoch": 2623} {"train_loss": -24.328411102294922, "global_step": 217755, "epoch": 2623} {"train_loss": -24.282209396362305, "global_step": 217756, "epoch": 2623} {"train_loss": -24.574459075927734, "global_step": 217757, "epoch": 2623} {"train_loss": -24.220195770263672, "global_step": 217758, "epoch": 2623} {"train_loss": -24.480833053588867, "global_step": 217759, "epoch": 2623} {"train_loss": -24.461301803588867, "global_step": 217760, "epoch": 2623} {"train_loss": -24.607397079467773, "global_step": 217761, "epoch": 2623} {"train_loss": -24.587589263916016, "global_step": 217762, "epoch": 2623} {"train_loss": -24.581716537475586, "global_step": 217763, "epoch": 2623} {"train_loss": -24.56989860534668, "global_step": 217764, "epoch": 2623} {"train_loss": -24.540842056274414, "global_step": 217765, "epoch": 2623} {"train_loss": -24.33818817138672, "global_step": 217766, "epoch": 2623} {"train_loss": -24.528478622436523, "global_step": 217767, "epoch": 2623} {"train_loss": -24.624324798583984, "global_step": 217768, "epoch": 2623} {"train_loss": -24.575305938720703, "global_step": 217769, "epoch": 2623} {"train_loss": -24.391036987304688, "global_step": 217770, "epoch": 2623} {"train_loss": -24.67145347595215, "global_step": 217771, "epoch": 2623} {"train_loss": -24.608884811401367, "global_step": 217772, "epoch": 2623} {"train_loss": -24.62682342529297, "global_step": 217773, "epoch": 2623} {"train_loss": -24.90814781188965, "global_step": 217774, "epoch": 2623} {"train_loss": -24.988840103149414, "global_step": 217775, "epoch": 2623} {"train_loss": -24.274494171142578, "global_step": 217776, "epoch": 2623} {"train_loss": -24.35047721862793, "global_step": 217777, "epoch": 2623} {"train_loss": -24.249263763427734, "global_step": 217778, "epoch": 2623} {"train_loss": -24.468595504760742, "global_step": 217779, "epoch": 2623} {"train_loss": -24.443748474121094, "global_step": 217780, "epoch": 2623} {"train_loss": -24.531137466430664, "global_step": 217781, "epoch": 2623} {"train_loss": -24.434249877929688, "global_step": 217782, "epoch": 2623} {"train_loss": -24.39975357055664, "global_step": 217783, "epoch": 2623} {"train_loss": -24.65938949584961, "global_step": 217784, "epoch": 2623} {"train_loss": -24.092689514160156, "global_step": 217785, "epoch": 2623} {"train_loss": -24.930957794189453, "global_step": 217786, "epoch": 2623} {"train_loss": -24.69312286376953, "global_step": 217787, "epoch": 2623} {"train_loss": -24.205326080322266, "global_step": 217788, "epoch": 2623} {"train_loss": -24.390289306640625, "global_step": 217789, "epoch": 2623} {"train_loss": -24.630176544189453, "global_step": 217790, "epoch": 2623} {"train_loss": -24.25899395310735, "global_step": 217791, "epoch": 2623, "val_loss": 6690221.0} {"train_loss": -23.87584114074707, "global_step": 217792, "epoch": 2624} {"train_loss": -23.937549591064453, "global_step": 217793, "epoch": 2624} {"train_loss": -24.768207550048828, "global_step": 217794, "epoch": 2624} {"train_loss": -23.87603187561035, "global_step": 217795, "epoch": 2624} {"train_loss": -24.25908088684082, "global_step": 217796, "epoch": 2624} {"train_loss": -23.814462661743164, "global_step": 217797, "epoch": 2624} {"train_loss": -24.002599716186523, "global_step": 217798, "epoch": 2624} {"train_loss": -24.719762802124023, "global_step": 217799, "epoch": 2624} {"train_loss": -24.03078842163086, "global_step": 217800, "epoch": 2624} {"train_loss": -24.3089542388916, "global_step": 217801, "epoch": 2624} {"train_loss": -24.1239070892334, "global_step": 217802, "epoch": 2624} {"train_loss": -24.33812713623047, "global_step": 217803, "epoch": 2624} {"train_loss": -24.367130279541016, "global_step": 217804, "epoch": 2624} {"train_loss": -24.211523056030273, "global_step": 217805, "epoch": 2624} {"train_loss": -24.43722152709961, "global_step": 217806, "epoch": 2624} {"train_loss": -24.013458251953125, "global_step": 217807, "epoch": 2624} {"train_loss": -24.30806541442871, "global_step": 217808, "epoch": 2624} {"train_loss": -24.7605037689209, "global_step": 217809, "epoch": 2624} {"train_loss": -24.158599853515625, "global_step": 217810, "epoch": 2624} {"train_loss": -24.41786766052246, "global_step": 217811, "epoch": 2624} {"train_loss": -24.63776206970215, "global_step": 217812, "epoch": 2624} {"train_loss": -24.7111873626709, "global_step": 217813, "epoch": 2624} {"train_loss": -24.130903244018555, "global_step": 217814, "epoch": 2624} {"train_loss": -24.351816177368164, "global_step": 217815, "epoch": 2624} {"train_loss": -24.740097045898438, "global_step": 217816, "epoch": 2624} {"train_loss": -24.577367782592773, "global_step": 217817, "epoch": 2624} {"train_loss": -24.752317428588867, "global_step": 217818, "epoch": 2624} {"train_loss": -24.43084144592285, "global_step": 217819, "epoch": 2624} {"train_loss": -24.280733108520508, "global_step": 217820, "epoch": 2624} {"train_loss": -24.46243667602539, "global_step": 217821, "epoch": 2624} {"train_loss": -24.706430435180664, "global_step": 217822, "epoch": 2624} {"train_loss": -24.427671432495117, "global_step": 217823, "epoch": 2624} {"train_loss": -24.687763214111328, "global_step": 217824, "epoch": 2624} {"train_loss": -24.5105037689209, "global_step": 217825, "epoch": 2624} {"train_loss": -24.680105209350586, "global_step": 217826, "epoch": 2624} {"train_loss": -24.57697105407715, "global_step": 217827, "epoch": 2624} {"train_loss": -24.84205436706543, "global_step": 217828, "epoch": 2624} {"train_loss": -24.63113784790039, "global_step": 217829, "epoch": 2624} {"train_loss": -24.794076919555664, "global_step": 217830, "epoch": 2624} {"train_loss": -24.86055564880371, "global_step": 217831, "epoch": 2624} {"train_loss": -24.60841941833496, "global_step": 217832, "epoch": 2624} {"train_loss": -24.60482406616211, "global_step": 217833, "epoch": 2624} {"train_loss": -24.491897583007812, "global_step": 217834, "epoch": 2624} {"train_loss": -24.99176025390625, "global_step": 217835, "epoch": 2624} {"train_loss": -24.835968017578125, "global_step": 217836, "epoch": 2624} {"train_loss": -24.973220825195312, "global_step": 217837, "epoch": 2624} {"train_loss": -24.931474685668945, "global_step": 217838, "epoch": 2624} {"train_loss": -24.91064453125, "global_step": 217839, "epoch": 2624} {"train_loss": -24.47014808654785, "global_step": 217840, "epoch": 2624} {"train_loss": -24.7418270111084, "global_step": 217841, "epoch": 2624} {"train_loss": -24.81876564025879, "global_step": 217842, "epoch": 2624} {"train_loss": -24.339136123657227, "global_step": 217843, "epoch": 2624} {"train_loss": -24.363431930541992, "global_step": 217844, "epoch": 2624} {"train_loss": -24.27690315246582, "global_step": 217845, "epoch": 2624} {"train_loss": -24.183780670166016, "global_step": 217846, "epoch": 2624} {"train_loss": -24.043643951416016, "global_step": 217847, "epoch": 2624} {"train_loss": -24.55967140197754, "global_step": 217848, "epoch": 2624} {"train_loss": -24.258771896362305, "global_step": 217849, "epoch": 2624} {"train_loss": -24.734006881713867, "global_step": 217850, "epoch": 2624} {"train_loss": -24.641000747680664, "global_step": 217851, "epoch": 2624} {"train_loss": -24.60089111328125, "global_step": 217852, "epoch": 2624} {"train_loss": -24.54159164428711, "global_step": 217853, "epoch": 2624} {"train_loss": -23.84086799621582, "global_step": 217854, "epoch": 2624} {"train_loss": -24.46345329284668, "global_step": 217855, "epoch": 2624} {"train_loss": -24.4715633392334, "global_step": 217856, "epoch": 2624} {"train_loss": -24.492481231689453, "global_step": 217857, "epoch": 2624} {"train_loss": -24.427837371826172, "global_step": 217858, "epoch": 2624} {"train_loss": -24.2830867767334, "global_step": 217859, "epoch": 2624} {"train_loss": -24.30525779724121, "global_step": 217860, "epoch": 2624} {"train_loss": -24.591266632080078, "global_step": 217861, "epoch": 2624} {"train_loss": -24.688602447509766, "global_step": 217862, "epoch": 2624} {"train_loss": -24.815570831298828, "global_step": 217863, "epoch": 2624} {"train_loss": -24.59471321105957, "global_step": 217864, "epoch": 2624} {"train_loss": -24.92997169494629, "global_step": 217865, "epoch": 2624} {"train_loss": -24.79894256591797, "global_step": 217866, "epoch": 2624} {"train_loss": -24.541370391845703, "global_step": 217867, "epoch": 2624} {"train_loss": -24.608673095703125, "global_step": 217868, "epoch": 2624} {"train_loss": -24.64389419555664, "global_step": 217869, "epoch": 2624} {"train_loss": -24.571033477783203, "global_step": 217870, "epoch": 2624} {"train_loss": -24.773731231689453, "global_step": 217871, "epoch": 2624} {"train_loss": -24.112674713134766, "global_step": 217872, "epoch": 2624} {"train_loss": -24.800201416015625, "global_step": 217873, "epoch": 2624} {"train_loss": -24.479207555931733, "global_step": 217874, "epoch": 2624, "val_loss": 6673950.0} {"train_loss": -24.560903549194336, "global_step": 217875, "epoch": 2625} {"train_loss": -24.004499435424805, "global_step": 217876, "epoch": 2625} {"train_loss": -23.864442825317383, "global_step": 217877, "epoch": 2625} {"train_loss": -24.607084274291992, "global_step": 217878, "epoch": 2625} {"train_loss": -23.934593200683594, "global_step": 217879, "epoch": 2625} {"train_loss": -24.023313522338867, "global_step": 217880, "epoch": 2625} {"train_loss": -23.849143981933594, "global_step": 217881, "epoch": 2625} {"train_loss": -24.49078369140625, "global_step": 217882, "epoch": 2625} {"train_loss": -24.0446834564209, "global_step": 217883, "epoch": 2625} {"train_loss": -24.189085006713867, "global_step": 217884, "epoch": 2625} {"train_loss": -24.47486686706543, "global_step": 217885, "epoch": 2625} {"train_loss": -24.08683204650879, "global_step": 217886, "epoch": 2625} {"train_loss": -24.04341697692871, "global_step": 217887, "epoch": 2625} {"train_loss": -24.578964233398438, "global_step": 217888, "epoch": 2625} {"train_loss": -24.630517959594727, "global_step": 217889, "epoch": 2625} {"train_loss": -24.282712936401367, "global_step": 217890, "epoch": 2625} {"train_loss": -24.582263946533203, "global_step": 217891, "epoch": 2625} {"train_loss": -24.07035255432129, "global_step": 217892, "epoch": 2625} {"train_loss": -24.574777603149414, "global_step": 217893, "epoch": 2625} {"train_loss": -24.301666259765625, "global_step": 217894, "epoch": 2625} {"train_loss": -24.334684371948242, "global_step": 217895, "epoch": 2625} {"train_loss": -24.646883010864258, "global_step": 217896, "epoch": 2625} {"train_loss": -24.377777099609375, "global_step": 217897, "epoch": 2625} {"train_loss": -24.17489242553711, "global_step": 217898, "epoch": 2625} {"train_loss": -24.56460189819336, "global_step": 217899, "epoch": 2625} {"train_loss": -24.935256958007812, "global_step": 217900, "epoch": 2625} {"train_loss": -24.589258193969727, "global_step": 217901, "epoch": 2625} {"train_loss": -24.629703521728516, "global_step": 217902, "epoch": 2625} {"train_loss": -24.42768096923828, "global_step": 217903, "epoch": 2625} {"train_loss": -24.610868453979492, "global_step": 217904, "epoch": 2625} {"train_loss": -24.65192222595215, "global_step": 217905, "epoch": 2625} {"train_loss": -24.955076217651367, "global_step": 217906, "epoch": 2625} {"train_loss": -24.4173583984375, "global_step": 217907, "epoch": 2625} {"train_loss": -24.68306541442871, "global_step": 217908, "epoch": 2625} {"train_loss": -24.783689498901367, "global_step": 217909, "epoch": 2625} {"train_loss": -24.64765739440918, "global_step": 217910, "epoch": 2625} {"train_loss": -24.946027755737305, "global_step": 217911, "epoch": 2625} {"train_loss": -24.966583251953125, "global_step": 217912, "epoch": 2625} {"train_loss": -25.015708923339844, "global_step": 217913, "epoch": 2625} {"train_loss": -24.70172119140625, "global_step": 217914, "epoch": 2625} {"train_loss": -24.389446258544922, "global_step": 217915, "epoch": 2625} {"train_loss": -24.830093383789062, "global_step": 217916, "epoch": 2625} {"train_loss": -24.419336318969727, "global_step": 217917, "epoch": 2625} {"train_loss": -24.53614616394043, "global_step": 217918, "epoch": 2625} {"train_loss": -25.07925796508789, "global_step": 217919, "epoch": 2625} {"train_loss": -24.82740020751953, "global_step": 217920, "epoch": 2625} {"train_loss": -24.573902130126953, "global_step": 217921, "epoch": 2625} {"train_loss": -24.448795318603516, "global_step": 217922, "epoch": 2625} {"train_loss": -24.8724308013916, "global_step": 217923, "epoch": 2625} {"train_loss": -25.00223731994629, "global_step": 217924, "epoch": 2625} {"train_loss": -24.86127281188965, "global_step": 217925, "epoch": 2625} {"train_loss": -24.69484519958496, "global_step": 217926, "epoch": 2625} {"train_loss": -24.77332878112793, "global_step": 217927, "epoch": 2625} {"train_loss": -24.787351608276367, "global_step": 217928, "epoch": 2625} {"train_loss": -24.60907554626465, "global_step": 217929, "epoch": 2625} {"train_loss": -24.7388858795166, "global_step": 217930, "epoch": 2625} {"train_loss": -24.822126388549805, "global_step": 217931, "epoch": 2625} {"train_loss": -24.60225486755371, "global_step": 217932, "epoch": 2625} {"train_loss": -24.934322357177734, "global_step": 217933, "epoch": 2625} {"train_loss": -24.40371322631836, "global_step": 217934, "epoch": 2625} {"train_loss": -24.468992233276367, "global_step": 217935, "epoch": 2625} {"train_loss": -24.090290069580078, "global_step": 217936, "epoch": 2625} {"train_loss": -24.455341339111328, "global_step": 217937, "epoch": 2625} {"train_loss": -24.540225982666016, "global_step": 217938, "epoch": 2625} {"train_loss": -24.507883071899414, "global_step": 217939, "epoch": 2625} {"train_loss": -24.530494689941406, "global_step": 217940, "epoch": 2625} {"train_loss": -24.459447860717773, "global_step": 217941, "epoch": 2625} {"train_loss": -24.498212814331055, "global_step": 217942, "epoch": 2625} {"train_loss": -24.904306411743164, "global_step": 217943, "epoch": 2625} {"train_loss": -24.483646392822266, "global_step": 217944, "epoch": 2625} {"train_loss": -24.43788719177246, "global_step": 217945, "epoch": 2625} {"train_loss": -24.636442184448242, "global_step": 217946, "epoch": 2625} {"train_loss": -24.60757064819336, "global_step": 217947, "epoch": 2625} {"train_loss": -24.683963775634766, "global_step": 217948, "epoch": 2625} {"train_loss": -24.69426727294922, "global_step": 217949, "epoch": 2625} {"train_loss": -24.838031768798828, "global_step": 217950, "epoch": 2625} {"train_loss": -24.70143699645996, "global_step": 217951, "epoch": 2625} {"train_loss": -24.62095832824707, "global_step": 217952, "epoch": 2625} {"train_loss": -24.327375411987305, "global_step": 217953, "epoch": 2625} {"train_loss": -24.660226821899414, "global_step": 217954, "epoch": 2625} {"train_loss": -24.564260482788086, "global_step": 217955, "epoch": 2625} {"train_loss": -24.456491470336914, "global_step": 217956, "epoch": 2625} {"train_loss": -24.568554430122834, "global_step": 217957, "epoch": 2625, "val_loss": 6630608.0} {"train_loss": -23.161184310913086, "global_step": 217958, "epoch": 2626} {"train_loss": -23.83338165283203, "global_step": 217959, "epoch": 2626} {"train_loss": -23.486291885375977, "global_step": 217960, "epoch": 2626} {"train_loss": -23.818037033081055, "global_step": 217961, "epoch": 2626} {"train_loss": -23.459726333618164, "global_step": 217962, "epoch": 2626} {"train_loss": -24.041929244995117, "global_step": 217963, "epoch": 2626} {"train_loss": -23.81755256652832, "global_step": 217964, "epoch": 2626} {"train_loss": -23.96917724609375, "global_step": 217965, "epoch": 2626} {"train_loss": -24.275381088256836, "global_step": 217966, "epoch": 2626} {"train_loss": -23.801513671875, "global_step": 217967, "epoch": 2626} {"train_loss": -24.186391830444336, "global_step": 217968, "epoch": 2626} {"train_loss": -23.942276000976562, "global_step": 217969, "epoch": 2626} {"train_loss": -24.173755645751953, "global_step": 217970, "epoch": 2626} {"train_loss": -24.132442474365234, "global_step": 217971, "epoch": 2626} {"train_loss": -24.26349639892578, "global_step": 217972, "epoch": 2626} {"train_loss": -23.750123977661133, "global_step": 217973, "epoch": 2626} {"train_loss": -24.182668685913086, "global_step": 217974, "epoch": 2626} {"train_loss": -24.133731842041016, "global_step": 217975, "epoch": 2626} {"train_loss": -24.0803165435791, "global_step": 217976, "epoch": 2626} {"train_loss": -24.431917190551758, "global_step": 217977, "epoch": 2626} {"train_loss": -24.54744529724121, "global_step": 217978, "epoch": 2626} {"train_loss": -24.656982421875, "global_step": 217979, "epoch": 2626} {"train_loss": -24.66587257385254, "global_step": 217980, "epoch": 2626} {"train_loss": -24.611839294433594, "global_step": 217981, "epoch": 2626} {"train_loss": -24.536575317382812, "global_step": 217982, "epoch": 2626} {"train_loss": -24.74249839782715, "global_step": 217983, "epoch": 2626} {"train_loss": -24.834186553955078, "global_step": 217984, "epoch": 2626} {"train_loss": -24.76548194885254, "global_step": 217985, "epoch": 2626} {"train_loss": -24.546981811523438, "global_step": 217986, "epoch": 2626} {"train_loss": -24.248075485229492, "global_step": 217987, "epoch": 2626} {"train_loss": -24.631500244140625, "global_step": 217988, "epoch": 2626} {"train_loss": -24.455503463745117, "global_step": 217989, "epoch": 2626} {"train_loss": -24.31354522705078, "global_step": 217990, "epoch": 2626} {"train_loss": -24.39876365661621, "global_step": 217991, "epoch": 2626} {"train_loss": -24.561429977416992, "global_step": 217992, "epoch": 2626} {"train_loss": -24.63450050354004, "global_step": 217993, "epoch": 2626} {"train_loss": -24.29729652404785, "global_step": 217994, "epoch": 2626} {"train_loss": -24.522457122802734, "global_step": 217995, "epoch": 2626} {"train_loss": -24.50486183166504, "global_step": 217996, "epoch": 2626} {"train_loss": -24.580211639404297, "global_step": 217997, "epoch": 2626} {"train_loss": -24.78615951538086, "global_step": 217998, "epoch": 2626} {"train_loss": -24.221895217895508, "global_step": 217999, "epoch": 2626} {"train_loss": -25.06839942932129, "global_step": 218000, "epoch": 2626} {"train_loss": -24.47840690612793, "global_step": 218001, "epoch": 2626} {"train_loss": -24.9077091217041, "global_step": 218002, "epoch": 2626} {"train_loss": -24.550968170166016, "global_step": 218003, "epoch": 2626} {"train_loss": -24.824111938476562, "global_step": 218004, "epoch": 2626} {"train_loss": -24.602359771728516, "global_step": 218005, "epoch": 2626} {"train_loss": -24.768878936767578, "global_step": 218006, "epoch": 2626} {"train_loss": -24.85190773010254, "global_step": 218007, "epoch": 2626} {"train_loss": -24.8528995513916, "global_step": 218008, "epoch": 2626} {"train_loss": -24.903060913085938, "global_step": 218009, "epoch": 2626} {"train_loss": -24.918718338012695, "global_step": 218010, "epoch": 2626} {"train_loss": -24.47343635559082, "global_step": 218011, "epoch": 2626} {"train_loss": -24.788293838500977, "global_step": 218012, "epoch": 2626} {"train_loss": -24.24471092224121, "global_step": 218013, "epoch": 2626} {"train_loss": -24.461750030517578, "global_step": 218014, "epoch": 2626} {"train_loss": -24.496206283569336, "global_step": 218015, "epoch": 2626} {"train_loss": -24.716781616210938, "global_step": 218016, "epoch": 2626} {"train_loss": -24.814924240112305, "global_step": 218017, "epoch": 2626} {"train_loss": -24.715599060058594, "global_step": 218018, "epoch": 2626} {"train_loss": -24.632291793823242, "global_step": 218019, "epoch": 2626} {"train_loss": -24.231964111328125, "global_step": 218020, "epoch": 2626} {"train_loss": -24.59756851196289, "global_step": 218021, "epoch": 2626} {"train_loss": -24.530982971191406, "global_step": 218022, "epoch": 2626} {"train_loss": -24.523183822631836, "global_step": 218023, "epoch": 2626} {"train_loss": -24.149362564086914, "global_step": 218024, "epoch": 2626} {"train_loss": -24.003141403198242, "global_step": 218025, "epoch": 2626} {"train_loss": -24.0394344329834, "global_step": 218026, "epoch": 2626} {"train_loss": -24.141677856445312, "global_step": 218027, "epoch": 2626} {"train_loss": -24.02298927307129, "global_step": 218028, "epoch": 2626} {"train_loss": -24.059267044067383, "global_step": 218029, "epoch": 2626} {"train_loss": -24.265382766723633, "global_step": 218030, "epoch": 2626} {"train_loss": -24.346521377563477, "global_step": 218031, "epoch": 2626} {"train_loss": -24.596235275268555, "global_step": 218032, "epoch": 2626} {"train_loss": -24.50691032409668, "global_step": 218033, "epoch": 2626} {"train_loss": -24.532379150390625, "global_step": 218034, "epoch": 2626} {"train_loss": -24.09577751159668, "global_step": 218035, "epoch": 2626} {"train_loss": -24.33312225341797, "global_step": 218036, "epoch": 2626} {"train_loss": -24.44520378112793, "global_step": 218037, "epoch": 2626} {"train_loss": -24.364500045776367, "global_step": 218038, "epoch": 2626} {"train_loss": -24.593338012695312, "global_step": 218039, "epoch": 2626} {"train_loss": -24.38687830086214, "global_step": 218040, "epoch": 2626, "val_loss": 6689515.5} {"train_loss": -24.073644638061523, "global_step": 218041, "epoch": 2627} {"train_loss": -24.16126823425293, "global_step": 218042, "epoch": 2627} {"train_loss": -24.044843673706055, "global_step": 218043, "epoch": 2627} {"train_loss": -24.23322868347168, "global_step": 218044, "epoch": 2627} {"train_loss": -24.074848175048828, "global_step": 218045, "epoch": 2627} {"train_loss": -23.974552154541016, "global_step": 218046, "epoch": 2627} {"train_loss": -24.216846466064453, "global_step": 218047, "epoch": 2627} {"train_loss": -24.186233520507812, "global_step": 218048, "epoch": 2627} {"train_loss": -24.106334686279297, "global_step": 218049, "epoch": 2627} {"train_loss": -24.491575241088867, "global_step": 218050, "epoch": 2627} {"train_loss": -23.92765235900879, "global_step": 218051, "epoch": 2627} {"train_loss": -24.52008819580078, "global_step": 218052, "epoch": 2627} {"train_loss": -24.21982765197754, "global_step": 218053, "epoch": 2627} {"train_loss": -24.299762725830078, "global_step": 218054, "epoch": 2627} {"train_loss": -24.35774803161621, "global_step": 218055, "epoch": 2627} {"train_loss": -24.54573631286621, "global_step": 218056, "epoch": 2627} {"train_loss": -24.208906173706055, "global_step": 218057, "epoch": 2627} {"train_loss": -24.674711227416992, "global_step": 218058, "epoch": 2627} {"train_loss": -24.650144577026367, "global_step": 218059, "epoch": 2627} {"train_loss": -24.323556900024414, "global_step": 218060, "epoch": 2627} {"train_loss": -24.281564712524414, "global_step": 218061, "epoch": 2627} {"train_loss": -24.76495361328125, "global_step": 218062, "epoch": 2627} {"train_loss": -24.83502197265625, "global_step": 218063, "epoch": 2627} {"train_loss": -24.61610221862793, "global_step": 218064, "epoch": 2627} {"train_loss": -24.53773307800293, "global_step": 218065, "epoch": 2627} {"train_loss": -24.780868530273438, "global_step": 218066, "epoch": 2627} {"train_loss": -24.867992401123047, "global_step": 218067, "epoch": 2627} {"train_loss": -24.882883071899414, "global_step": 218068, "epoch": 2627} {"train_loss": -24.82213020324707, "global_step": 218069, "epoch": 2627} {"train_loss": -24.749052047729492, "global_step": 218070, "epoch": 2627} {"train_loss": -24.435293197631836, "global_step": 218071, "epoch": 2627} {"train_loss": -24.23872184753418, "global_step": 218072, "epoch": 2627} {"train_loss": -24.619592666625977, "global_step": 218073, "epoch": 2627} {"train_loss": -24.657373428344727, "global_step": 218074, "epoch": 2627} {"train_loss": -24.79108238220215, "global_step": 218075, "epoch": 2627} {"train_loss": -24.892837524414062, "global_step": 218076, "epoch": 2627} {"train_loss": -24.621580123901367, "global_step": 218077, "epoch": 2627} {"train_loss": -24.53327751159668, "global_step": 218078, "epoch": 2627} {"train_loss": -24.742542266845703, "global_step": 218079, "epoch": 2627} {"train_loss": -24.82316780090332, "global_step": 218080, "epoch": 2627} {"train_loss": -24.64506721496582, "global_step": 218081, "epoch": 2627} {"train_loss": -24.330799102783203, "global_step": 218082, "epoch": 2627} {"train_loss": -25.075498580932617, "global_step": 218083, "epoch": 2627} {"train_loss": -24.953540802001953, "global_step": 218084, "epoch": 2627} {"train_loss": -23.951749801635742, "global_step": 218085, "epoch": 2627} {"train_loss": -24.801435470581055, "global_step": 218086, "epoch": 2627} {"train_loss": -24.375036239624023, "global_step": 218087, "epoch": 2627} {"train_loss": -24.732213973999023, "global_step": 218088, "epoch": 2627} {"train_loss": -24.406723022460938, "global_step": 218089, "epoch": 2627} {"train_loss": -24.064783096313477, "global_step": 218090, "epoch": 2627} {"train_loss": -24.146467208862305, "global_step": 218091, "epoch": 2627} {"train_loss": -24.076765060424805, "global_step": 218092, "epoch": 2627} {"train_loss": -24.29052734375, "global_step": 218093, "epoch": 2627} {"train_loss": -24.467622756958008, "global_step": 218094, "epoch": 2627} {"train_loss": -24.42795181274414, "global_step": 218095, "epoch": 2627} {"train_loss": -24.546382904052734, "global_step": 218096, "epoch": 2627} {"train_loss": -24.444581985473633, "global_step": 218097, "epoch": 2627} {"train_loss": -24.675596237182617, "global_step": 218098, "epoch": 2627} {"train_loss": -24.335283279418945, "global_step": 218099, "epoch": 2627} {"train_loss": -24.338594436645508, "global_step": 218100, "epoch": 2627} {"train_loss": -24.297290802001953, "global_step": 218101, "epoch": 2627} {"train_loss": -24.71039390563965, "global_step": 218102, "epoch": 2627} {"train_loss": -24.464590072631836, "global_step": 218103, "epoch": 2627} {"train_loss": -24.61083984375, "global_step": 218104, "epoch": 2627} {"train_loss": -24.579538345336914, "global_step": 218105, "epoch": 2627} {"train_loss": -25.044189453125, "global_step": 218106, "epoch": 2627} {"train_loss": -24.895366668701172, "global_step": 218107, "epoch": 2627} {"train_loss": -24.442697525024414, "global_step": 218108, "epoch": 2627} {"train_loss": -24.754648208618164, "global_step": 218109, "epoch": 2627} {"train_loss": -24.403095245361328, "global_step": 218110, "epoch": 2627} {"train_loss": -24.545780181884766, "global_step": 218111, "epoch": 2627} {"train_loss": -24.975278854370117, "global_step": 218112, "epoch": 2627} {"train_loss": -24.17629051208496, "global_step": 218113, "epoch": 2627} {"train_loss": -24.84561538696289, "global_step": 218114, "epoch": 2627} {"train_loss": -24.474580764770508, "global_step": 218115, "epoch": 2627} {"train_loss": -24.31736183166504, "global_step": 218116, "epoch": 2627} {"train_loss": -24.328786849975586, "global_step": 218117, "epoch": 2627} {"train_loss": -23.955785751342773, "global_step": 218118, "epoch": 2627} {"train_loss": -24.653392791748047, "global_step": 218119, "epoch": 2627} {"train_loss": -24.461286544799805, "global_step": 218120, "epoch": 2627} {"train_loss": -24.479764938354492, "global_step": 218121, "epoch": 2627} {"train_loss": -24.30046844482422, "global_step": 218122, "epoch": 2627} {"train_loss": -24.47888820142631, "global_step": 218123, "epoch": 2627, "val_loss": 6700554.0} {"train_loss": -22.989870071411133, "global_step": 218124, "epoch": 2628} {"train_loss": -23.04902458190918, "global_step": 218125, "epoch": 2628} {"train_loss": -23.975690841674805, "global_step": 218126, "epoch": 2628} {"train_loss": -24.23848533630371, "global_step": 218127, "epoch": 2628} {"train_loss": -23.79713249206543, "global_step": 218128, "epoch": 2628} {"train_loss": -23.854177474975586, "global_step": 218129, "epoch": 2628} {"train_loss": -23.850387573242188, "global_step": 218130, "epoch": 2628} {"train_loss": -24.049875259399414, "global_step": 218131, "epoch": 2628} {"train_loss": -24.058475494384766, "global_step": 218132, "epoch": 2628} {"train_loss": -24.193883895874023, "global_step": 218133, "epoch": 2628} {"train_loss": -24.360889434814453, "global_step": 218134, "epoch": 2628} {"train_loss": -24.32439422607422, "global_step": 218135, "epoch": 2628} {"train_loss": -24.31924819946289, "global_step": 218136, "epoch": 2628} {"train_loss": -24.004159927368164, "global_step": 218137, "epoch": 2628} {"train_loss": -24.50752067565918, "global_step": 218138, "epoch": 2628} {"train_loss": -24.217350006103516, "global_step": 218139, "epoch": 2628} {"train_loss": -23.940332412719727, "global_step": 218140, "epoch": 2628} {"train_loss": -24.299591064453125, "global_step": 218141, "epoch": 2628} {"train_loss": -24.249486923217773, "global_step": 218142, "epoch": 2628} {"train_loss": -23.985830307006836, "global_step": 218143, "epoch": 2628} {"train_loss": -24.18641471862793, "global_step": 218144, "epoch": 2628} {"train_loss": -24.058853149414062, "global_step": 218145, "epoch": 2628} {"train_loss": -24.39993667602539, "global_step": 218146, "epoch": 2628} {"train_loss": -24.304716110229492, "global_step": 218147, "epoch": 2628} {"train_loss": -24.2947998046875, "global_step": 218148, "epoch": 2628} {"train_loss": -24.546499252319336, "global_step": 218149, "epoch": 2628} {"train_loss": -24.70491600036621, "global_step": 218150, "epoch": 2628} {"train_loss": -24.77766990661621, "global_step": 218151, "epoch": 2628} {"train_loss": -24.019418716430664, "global_step": 218152, "epoch": 2628} {"train_loss": -24.58982276916504, "global_step": 218153, "epoch": 2628} {"train_loss": -24.597055435180664, "global_step": 218154, "epoch": 2628} {"train_loss": -24.573577880859375, "global_step": 218155, "epoch": 2628} {"train_loss": -24.4923095703125, "global_step": 218156, "epoch": 2628} {"train_loss": -24.413537979125977, "global_step": 218157, "epoch": 2628} {"train_loss": -24.586620330810547, "global_step": 218158, "epoch": 2628} {"train_loss": -24.215497970581055, "global_step": 218159, "epoch": 2628} {"train_loss": -24.73013687133789, "global_step": 218160, "epoch": 2628} {"train_loss": -24.199460983276367, "global_step": 218161, "epoch": 2628} {"train_loss": -24.57289695739746, "global_step": 218162, "epoch": 2628} {"train_loss": -24.50435447692871, "global_step": 218163, "epoch": 2628} {"train_loss": -24.344085693359375, "global_step": 218164, "epoch": 2628} {"train_loss": -24.63618278503418, "global_step": 218165, "epoch": 2628} {"train_loss": -24.571592330932617, "global_step": 218166, "epoch": 2628} {"train_loss": -24.48760986328125, "global_step": 218167, "epoch": 2628} {"train_loss": -24.68656349182129, "global_step": 218168, "epoch": 2628} {"train_loss": -24.693342208862305, "global_step": 218169, "epoch": 2628} {"train_loss": -24.514680862426758, "global_step": 218170, "epoch": 2628} {"train_loss": -24.961301803588867, "global_step": 218171, "epoch": 2628} {"train_loss": -24.61280059814453, "global_step": 218172, "epoch": 2628} {"train_loss": -24.6561336517334, "global_step": 218173, "epoch": 2628} {"train_loss": -24.750120162963867, "global_step": 218174, "epoch": 2628} {"train_loss": -24.603290557861328, "global_step": 218175, "epoch": 2628} {"train_loss": -24.357412338256836, "global_step": 218176, "epoch": 2628} {"train_loss": -24.675466537475586, "global_step": 218177, "epoch": 2628} {"train_loss": -24.7423152923584, "global_step": 218178, "epoch": 2628} {"train_loss": -24.52410125732422, "global_step": 218179, "epoch": 2628} {"train_loss": -24.410236358642578, "global_step": 218180, "epoch": 2628} {"train_loss": -24.69146156311035, "global_step": 218181, "epoch": 2628} {"train_loss": -24.613317489624023, "global_step": 218182, "epoch": 2628} {"train_loss": -24.6462345123291, "global_step": 218183, "epoch": 2628} {"train_loss": -24.678186416625977, "global_step": 218184, "epoch": 2628} {"train_loss": -25.001066207885742, "global_step": 218185, "epoch": 2628} {"train_loss": -24.38730239868164, "global_step": 218186, "epoch": 2628} {"train_loss": -24.6279354095459, "global_step": 218187, "epoch": 2628} {"train_loss": -24.49277114868164, "global_step": 218188, "epoch": 2628} {"train_loss": -24.71293067932129, "global_step": 218189, "epoch": 2628} {"train_loss": -24.524093627929688, "global_step": 218190, "epoch": 2628} {"train_loss": -24.536897659301758, "global_step": 218191, "epoch": 2628} {"train_loss": -24.685579299926758, "global_step": 218192, "epoch": 2628} {"train_loss": -24.40741539001465, "global_step": 218193, "epoch": 2628} {"train_loss": -24.66458511352539, "global_step": 218194, "epoch": 2628} {"train_loss": -24.328100204467773, "global_step": 218195, "epoch": 2628} {"train_loss": -24.6146240234375, "global_step": 218196, "epoch": 2628} {"train_loss": -24.605051040649414, "global_step": 218197, "epoch": 2628} {"train_loss": -24.529748916625977, "global_step": 218198, "epoch": 2628} {"train_loss": -24.626617431640625, "global_step": 218199, "epoch": 2628} {"train_loss": -24.649198532104492, "global_step": 218200, "epoch": 2628} {"train_loss": -24.584245681762695, "global_step": 218201, "epoch": 2628} {"train_loss": -24.7254695892334, "global_step": 218202, "epoch": 2628} {"train_loss": -24.77081871032715, "global_step": 218203, "epoch": 2628} {"train_loss": -24.463010787963867, "global_step": 218204, "epoch": 2628} {"train_loss": -24.577184677124023, "global_step": 218205, "epoch": 2628} {"train_loss": -24.407174029982233, "global_step": 218206, "epoch": 2628, "val_loss": 6647570.0} {"train_loss": -23.551132202148438, "global_step": 218207, "epoch": 2629} {"train_loss": -21.92877769470215, "global_step": 218208, "epoch": 2629} {"train_loss": -22.49258804321289, "global_step": 218209, "epoch": 2629} {"train_loss": -23.863927841186523, "global_step": 218210, "epoch": 2629} {"train_loss": -22.797510147094727, "global_step": 218211, "epoch": 2629} {"train_loss": -22.866968154907227, "global_step": 218212, "epoch": 2629} {"train_loss": -23.770946502685547, "global_step": 218213, "epoch": 2629} {"train_loss": -22.87677001953125, "global_step": 218214, "epoch": 2629} {"train_loss": -24.14972496032715, "global_step": 218215, "epoch": 2629} {"train_loss": -23.493167877197266, "global_step": 218216, "epoch": 2629} {"train_loss": -23.8814754486084, "global_step": 218217, "epoch": 2629} {"train_loss": -23.737974166870117, "global_step": 218218, "epoch": 2629} {"train_loss": -23.825748443603516, "global_step": 218219, "epoch": 2629} {"train_loss": -23.64091682434082, "global_step": 218220, "epoch": 2629} {"train_loss": -24.316396713256836, "global_step": 218221, "epoch": 2629} {"train_loss": -23.633264541625977, "global_step": 218222, "epoch": 2629} {"train_loss": -23.968887329101562, "global_step": 218223, "epoch": 2629} {"train_loss": -23.666383743286133, "global_step": 218224, "epoch": 2629} {"train_loss": -23.741043090820312, "global_step": 218225, "epoch": 2629} {"train_loss": -23.93928337097168, "global_step": 218226, "epoch": 2629} {"train_loss": -24.290372848510742, "global_step": 218227, "epoch": 2629} {"train_loss": -23.86623191833496, "global_step": 218228, "epoch": 2629} {"train_loss": -24.20199203491211, "global_step": 218229, "epoch": 2629} {"train_loss": -24.001195907592773, "global_step": 218230, "epoch": 2629} {"train_loss": -24.485567092895508, "global_step": 218231, "epoch": 2629} {"train_loss": -23.791549682617188, "global_step": 218232, "epoch": 2629} {"train_loss": -23.73817253112793, "global_step": 218233, "epoch": 2629} {"train_loss": -24.20302391052246, "global_step": 218234, "epoch": 2629} {"train_loss": -24.379438400268555, "global_step": 218235, "epoch": 2629} {"train_loss": -24.56813621520996, "global_step": 218236, "epoch": 2629} {"train_loss": -24.054237365722656, "global_step": 218237, "epoch": 2629} {"train_loss": -24.3960018157959, "global_step": 218238, "epoch": 2629} {"train_loss": -24.03330421447754, "global_step": 218239, "epoch": 2629} {"train_loss": -24.221708297729492, "global_step": 218240, "epoch": 2629} {"train_loss": -24.232091903686523, "global_step": 218241, "epoch": 2629} {"train_loss": -24.4041690826416, "global_step": 218242, "epoch": 2629} {"train_loss": -24.38006019592285, "global_step": 218243, "epoch": 2629} {"train_loss": -24.594335556030273, "global_step": 218244, "epoch": 2629} {"train_loss": -24.39447021484375, "global_step": 218245, "epoch": 2629} {"train_loss": -24.696720123291016, "global_step": 218246, "epoch": 2629} {"train_loss": -24.915359497070312, "global_step": 218247, "epoch": 2629} {"train_loss": -24.38239860534668, "global_step": 218248, "epoch": 2629} {"train_loss": -24.61585807800293, "global_step": 218249, "epoch": 2629} {"train_loss": -24.336734771728516, "global_step": 218250, "epoch": 2629} {"train_loss": -24.88433265686035, "global_step": 218251, "epoch": 2629} {"train_loss": -24.24689292907715, "global_step": 218252, "epoch": 2629} {"train_loss": -24.17193603515625, "global_step": 218253, "epoch": 2629} {"train_loss": -24.566333770751953, "global_step": 218254, "epoch": 2629} {"train_loss": -24.649581909179688, "global_step": 218255, "epoch": 2629} {"train_loss": -24.503320693969727, "global_step": 218256, "epoch": 2629} {"train_loss": -24.066137313842773, "global_step": 218257, "epoch": 2629} {"train_loss": -24.115102767944336, "global_step": 218258, "epoch": 2629} {"train_loss": -24.2326717376709, "global_step": 218259, "epoch": 2629} {"train_loss": -24.689428329467773, "global_step": 218260, "epoch": 2629} {"train_loss": -24.66554069519043, "global_step": 218261, "epoch": 2629} {"train_loss": -24.57792854309082, "global_step": 218262, "epoch": 2629} {"train_loss": -24.801851272583008, "global_step": 218263, "epoch": 2629} {"train_loss": -24.9937744140625, "global_step": 218264, "epoch": 2629} {"train_loss": -24.787322998046875, "global_step": 218265, "epoch": 2629} {"train_loss": -24.512893676757812, "global_step": 218266, "epoch": 2629} {"train_loss": -24.65825080871582, "global_step": 218267, "epoch": 2629} {"train_loss": -24.520301818847656, "global_step": 218268, "epoch": 2629} {"train_loss": -24.38386344909668, "global_step": 218269, "epoch": 2629} {"train_loss": -24.30909538269043, "global_step": 218270, "epoch": 2629} {"train_loss": -24.386699676513672, "global_step": 218271, "epoch": 2629} {"train_loss": -24.17750358581543, "global_step": 218272, "epoch": 2629} {"train_loss": -24.6203670501709, "global_step": 218273, "epoch": 2629} {"train_loss": -24.604455947875977, "global_step": 218274, "epoch": 2629} {"train_loss": -24.200902938842773, "global_step": 218275, "epoch": 2629} {"train_loss": -24.42258644104004, "global_step": 218276, "epoch": 2629} {"train_loss": -24.542095184326172, "global_step": 218277, "epoch": 2629} {"train_loss": -24.731706619262695, "global_step": 218278, "epoch": 2629} {"train_loss": -24.600122451782227, "global_step": 218279, "epoch": 2629} {"train_loss": -24.620880126953125, "global_step": 218280, "epoch": 2629} {"train_loss": -24.498754501342773, "global_step": 218281, "epoch": 2629} {"train_loss": -24.440629959106445, "global_step": 218282, "epoch": 2629} {"train_loss": -25.04023551940918, "global_step": 218283, "epoch": 2629} {"train_loss": -24.834762573242188, "global_step": 218284, "epoch": 2629} {"train_loss": -24.54332160949707, "global_step": 218285, "epoch": 2629} {"train_loss": -25.033435821533203, "global_step": 218286, "epoch": 2629} {"train_loss": -24.681331634521484, "global_step": 218287, "epoch": 2629} {"train_loss": -24.12986183166504, "global_step": 218288, "epoch": 2629} {"train_loss": -24.225530854190687, "global_step": 218289, "epoch": 2629, "val_loss": 6575972.5} {"train_loss": -23.830646514892578, "global_step": 218290, "epoch": 2630} {"train_loss": -24.71278953552246, "global_step": 218291, "epoch": 2630} {"train_loss": -24.031579971313477, "global_step": 218292, "epoch": 2630} {"train_loss": -23.696504592895508, "global_step": 218293, "epoch": 2630} {"train_loss": -24.0053653717041, "global_step": 218294, "epoch": 2630} {"train_loss": -23.3985595703125, "global_step": 218295, "epoch": 2630} {"train_loss": -24.17127799987793, "global_step": 218296, "epoch": 2630} {"train_loss": -24.033227920532227, "global_step": 218297, "epoch": 2630} {"train_loss": -24.4144344329834, "global_step": 218298, "epoch": 2630} {"train_loss": -24.335729598999023, "global_step": 218299, "epoch": 2630} {"train_loss": -24.249557495117188, "global_step": 218300, "epoch": 2630} {"train_loss": -24.26132583618164, "global_step": 218301, "epoch": 2630} {"train_loss": -24.028076171875, "global_step": 218302, "epoch": 2630} {"train_loss": -24.542776107788086, "global_step": 218303, "epoch": 2630} {"train_loss": -24.163251876831055, "global_step": 218304, "epoch": 2630} {"train_loss": -24.233366012573242, "global_step": 218305, "epoch": 2630} {"train_loss": -24.206274032592773, "global_step": 218306, "epoch": 2630} {"train_loss": -24.042051315307617, "global_step": 218307, "epoch": 2630} {"train_loss": -24.318622589111328, "global_step": 218308, "epoch": 2630} {"train_loss": -24.280475616455078, "global_step": 218309, "epoch": 2630} {"train_loss": -24.54023551940918, "global_step": 218310, "epoch": 2630} {"train_loss": -24.397846221923828, "global_step": 218311, "epoch": 2630} {"train_loss": -24.470645904541016, "global_step": 218312, "epoch": 2630} {"train_loss": -24.304685592651367, "global_step": 218313, "epoch": 2630} {"train_loss": -24.403039932250977, "global_step": 218314, "epoch": 2630} {"train_loss": -24.560352325439453, "global_step": 218315, "epoch": 2630} {"train_loss": -24.609567642211914, "global_step": 218316, "epoch": 2630} {"train_loss": -24.58028221130371, "global_step": 218317, "epoch": 2630} {"train_loss": -24.196674346923828, "global_step": 218318, "epoch": 2630} {"train_loss": -25.031774520874023, "global_step": 218319, "epoch": 2630} {"train_loss": -24.76509666442871, "global_step": 218320, "epoch": 2630} {"train_loss": -24.17033576965332, "global_step": 218321, "epoch": 2630} {"train_loss": -24.141250610351562, "global_step": 218322, "epoch": 2630} {"train_loss": -24.418241500854492, "global_step": 218323, "epoch": 2630} {"train_loss": -24.648038864135742, "global_step": 218324, "epoch": 2630} {"train_loss": -23.869003295898438, "global_step": 218325, "epoch": 2630} {"train_loss": -23.957624435424805, "global_step": 218326, "epoch": 2630} {"train_loss": -24.28485870361328, "global_step": 218327, "epoch": 2630} {"train_loss": -24.366455078125, "global_step": 218328, "epoch": 2630} {"train_loss": -24.41756248474121, "global_step": 218329, "epoch": 2630} {"train_loss": -24.69484519958496, "global_step": 218330, "epoch": 2630} {"train_loss": -24.54183006286621, "global_step": 218331, "epoch": 2630} {"train_loss": -24.778181076049805, "global_step": 218332, "epoch": 2630} {"train_loss": -24.55805015563965, "global_step": 218333, "epoch": 2630} {"train_loss": -24.329004287719727, "global_step": 218334, "epoch": 2630} {"train_loss": -24.78949546813965, "global_step": 218335, "epoch": 2630} {"train_loss": -24.407100677490234, "global_step": 218336, "epoch": 2630} {"train_loss": -24.507741928100586, "global_step": 218337, "epoch": 2630} {"train_loss": -24.616622924804688, "global_step": 218338, "epoch": 2630} {"train_loss": -24.792285919189453, "global_step": 218339, "epoch": 2630} {"train_loss": -24.541776657104492, "global_step": 218340, "epoch": 2630} {"train_loss": -24.719255447387695, "global_step": 218341, "epoch": 2630} {"train_loss": -24.773271560668945, "global_step": 218342, "epoch": 2630} {"train_loss": -24.818349838256836, "global_step": 218343, "epoch": 2630} {"train_loss": -24.60768699645996, "global_step": 218344, "epoch": 2630} {"train_loss": -24.693506240844727, "global_step": 218345, "epoch": 2630} {"train_loss": -24.713409423828125, "global_step": 218346, "epoch": 2630} {"train_loss": -24.409685134887695, "global_step": 218347, "epoch": 2630} {"train_loss": -24.780933380126953, "global_step": 218348, "epoch": 2630} {"train_loss": -24.683395385742188, "global_step": 218349, "epoch": 2630} {"train_loss": -24.882158279418945, "global_step": 218350, "epoch": 2630} {"train_loss": -24.672773361206055, "global_step": 218351, "epoch": 2630} {"train_loss": -24.444034576416016, "global_step": 218352, "epoch": 2630} {"train_loss": -24.591703414916992, "global_step": 218353, "epoch": 2630} {"train_loss": -24.414995193481445, "global_step": 218354, "epoch": 2630} {"train_loss": -25.02089500427246, "global_step": 218355, "epoch": 2630} {"train_loss": -24.956939697265625, "global_step": 218356, "epoch": 2630} {"train_loss": -24.770353317260742, "global_step": 218357, "epoch": 2630} {"train_loss": -24.64093017578125, "global_step": 218358, "epoch": 2630} {"train_loss": -24.686933517456055, "global_step": 218359, "epoch": 2630} {"train_loss": -24.164077758789062, "global_step": 218360, "epoch": 2630} {"train_loss": -24.183347702026367, "global_step": 218361, "epoch": 2630} {"train_loss": -24.4970760345459, "global_step": 218362, "epoch": 2630} {"train_loss": -24.77471923828125, "global_step": 218363, "epoch": 2630} {"train_loss": -24.582304000854492, "global_step": 218364, "epoch": 2630} {"train_loss": -24.676319122314453, "global_step": 218365, "epoch": 2630} {"train_loss": -24.54400634765625, "global_step": 218366, "epoch": 2630} {"train_loss": -24.50264549255371, "global_step": 218367, "epoch": 2630} {"train_loss": -24.785654067993164, "global_step": 218368, "epoch": 2630} {"train_loss": -24.157886505126953, "global_step": 218369, "epoch": 2630} {"train_loss": -24.00001335144043, "global_step": 218370, "epoch": 2630} {"train_loss": -24.69951820373535, "global_step": 218371, "epoch": 2630} {"train_loss": -24.440262024661145, "global_step": 218372, "epoch": 2630, "val_loss": 6659298.0} {"train_loss": -22.916446685791016, "global_step": 218373, "epoch": 2631} {"train_loss": -22.586423873901367, "global_step": 218374, "epoch": 2631} {"train_loss": -23.5690860748291, "global_step": 218375, "epoch": 2631} {"train_loss": -23.555164337158203, "global_step": 218376, "epoch": 2631} {"train_loss": -23.716894149780273, "global_step": 218377, "epoch": 2631} {"train_loss": -23.968488693237305, "global_step": 218378, "epoch": 2631} {"train_loss": -23.973344802856445, "global_step": 218379, "epoch": 2631} {"train_loss": -23.856000900268555, "global_step": 218380, "epoch": 2631} {"train_loss": -24.018465042114258, "global_step": 218381, "epoch": 2631} {"train_loss": -24.093032836914062, "global_step": 218382, "epoch": 2631} {"train_loss": -24.178991317749023, "global_step": 218383, "epoch": 2631} {"train_loss": -23.999876022338867, "global_step": 218384, "epoch": 2631} {"train_loss": -24.0285701751709, "global_step": 218385, "epoch": 2631} {"train_loss": -23.968116760253906, "global_step": 218386, "epoch": 2631} {"train_loss": -24.162307739257812, "global_step": 218387, "epoch": 2631} {"train_loss": -24.18338394165039, "global_step": 218388, "epoch": 2631} {"train_loss": -24.179243087768555, "global_step": 218389, "epoch": 2631} {"train_loss": -24.194421768188477, "global_step": 218390, "epoch": 2631} {"train_loss": -24.385568618774414, "global_step": 218391, "epoch": 2631} {"train_loss": -24.31461524963379, "global_step": 218392, "epoch": 2631} {"train_loss": -24.392990112304688, "global_step": 218393, "epoch": 2631} {"train_loss": -24.345600128173828, "global_step": 218394, "epoch": 2631} {"train_loss": -24.27070426940918, "global_step": 218395, "epoch": 2631} {"train_loss": -24.291019439697266, "global_step": 218396, "epoch": 2631} {"train_loss": -24.726703643798828, "global_step": 218397, "epoch": 2631} {"train_loss": -24.37795639038086, "global_step": 218398, "epoch": 2631} {"train_loss": -24.509021759033203, "global_step": 218399, "epoch": 2631} {"train_loss": -24.51089859008789, "global_step": 218400, "epoch": 2631} {"train_loss": -24.262990951538086, "global_step": 218401, "epoch": 2631} {"train_loss": -24.216638565063477, "global_step": 218402, "epoch": 2631} {"train_loss": -24.60000991821289, "global_step": 218403, "epoch": 2631} {"train_loss": -24.380170822143555, "global_step": 218404, "epoch": 2631} {"train_loss": -24.538253784179688, "global_step": 218405, "epoch": 2631} {"train_loss": -24.5859432220459, "global_step": 218406, "epoch": 2631} {"train_loss": -24.28887367248535, "global_step": 218407, "epoch": 2631} {"train_loss": -24.364587783813477, "global_step": 218408, "epoch": 2631} {"train_loss": -24.92533302307129, "global_step": 218409, "epoch": 2631} {"train_loss": -24.57002067565918, "global_step": 218410, "epoch": 2631} {"train_loss": -24.529544830322266, "global_step": 218411, "epoch": 2631} {"train_loss": -24.72859001159668, "global_step": 218412, "epoch": 2631} {"train_loss": -24.5445499420166, "global_step": 218413, "epoch": 2631} {"train_loss": -24.390104293823242, "global_step": 218414, "epoch": 2631} {"train_loss": -24.665237426757812, "global_step": 218415, "epoch": 2631} {"train_loss": -24.65899658203125, "global_step": 218416, "epoch": 2631} {"train_loss": -24.688459396362305, "global_step": 218417, "epoch": 2631} {"train_loss": -24.491483688354492, "global_step": 218418, "epoch": 2631} {"train_loss": -24.555294036865234, "global_step": 218419, "epoch": 2631} {"train_loss": -24.468441009521484, "global_step": 218420, "epoch": 2631} {"train_loss": -24.247373580932617, "global_step": 218421, "epoch": 2631} {"train_loss": -24.606016159057617, "global_step": 218422, "epoch": 2631} {"train_loss": -25.098073959350586, "global_step": 218423, "epoch": 2631} {"train_loss": -25.00575828552246, "global_step": 218424, "epoch": 2631} {"train_loss": -24.568450927734375, "global_step": 218425, "epoch": 2631} {"train_loss": -24.86282730102539, "global_step": 218426, "epoch": 2631} {"train_loss": -24.60159683227539, "global_step": 218427, "epoch": 2631} {"train_loss": -24.738292694091797, "global_step": 218428, "epoch": 2631} {"train_loss": -24.462207794189453, "global_step": 218429, "epoch": 2631} {"train_loss": -24.453338623046875, "global_step": 218430, "epoch": 2631} {"train_loss": -24.48682975769043, "global_step": 218431, "epoch": 2631} {"train_loss": -24.302284240722656, "global_step": 218432, "epoch": 2631} {"train_loss": -24.409513473510742, "global_step": 218433, "epoch": 2631} {"train_loss": -24.23072624206543, "global_step": 218434, "epoch": 2631} {"train_loss": -24.483251571655273, "global_step": 218435, "epoch": 2631} {"train_loss": -24.689416885375977, "global_step": 218436, "epoch": 2631} {"train_loss": -24.683555603027344, "global_step": 218437, "epoch": 2631} {"train_loss": -24.681833267211914, "global_step": 218438, "epoch": 2631} {"train_loss": -24.74297523498535, "global_step": 218439, "epoch": 2631} {"train_loss": -24.4852352142334, "global_step": 218440, "epoch": 2631} {"train_loss": -24.614089965820312, "global_step": 218441, "epoch": 2631} {"train_loss": -24.827713012695312, "global_step": 218442, "epoch": 2631} {"train_loss": -24.617807388305664, "global_step": 218443, "epoch": 2631} {"train_loss": -24.705810546875, "global_step": 218444, "epoch": 2631} {"train_loss": -24.25286865234375, "global_step": 218445, "epoch": 2631} {"train_loss": -24.468414306640625, "global_step": 218446, "epoch": 2631} {"train_loss": -24.556299209594727, "global_step": 218447, "epoch": 2631} {"train_loss": -24.225854873657227, "global_step": 218448, "epoch": 2631} {"train_loss": -24.4205322265625, "global_step": 218449, "epoch": 2631} {"train_loss": -24.52009391784668, "global_step": 218450, "epoch": 2631} {"train_loss": -24.749753952026367, "global_step": 218451, "epoch": 2631} {"train_loss": -24.631258010864258, "global_step": 218452, "epoch": 2631} {"train_loss": -24.26104736328125, "global_step": 218453, "epoch": 2631} {"train_loss": -24.87259292602539, "global_step": 218454, "epoch": 2631} {"train_loss": -24.3812869198351, "global_step": 218455, "epoch": 2631, "val_loss": 6561118.5} {"train_loss": -24.41857147216797, "global_step": 218456, "epoch": 2632} {"train_loss": -24.631423950195312, "global_step": 218457, "epoch": 2632} {"train_loss": -24.693870544433594, "global_step": 218458, "epoch": 2632} {"train_loss": -24.562318801879883, "global_step": 218459, "epoch": 2632} {"train_loss": -24.377958297729492, "global_step": 218460, "epoch": 2632} {"train_loss": -24.621660232543945, "global_step": 218461, "epoch": 2632} {"train_loss": -24.722158432006836, "global_step": 218462, "epoch": 2632} {"train_loss": -24.04690933227539, "global_step": 218463, "epoch": 2632} {"train_loss": -24.656766891479492, "global_step": 218464, "epoch": 2632} {"train_loss": -24.69648551940918, "global_step": 218465, "epoch": 2632} {"train_loss": -24.692752838134766, "global_step": 218466, "epoch": 2632} {"train_loss": -24.602270126342773, "global_step": 218467, "epoch": 2632} {"train_loss": -24.685413360595703, "global_step": 218468, "epoch": 2632} {"train_loss": -24.79794692993164, "global_step": 218469, "epoch": 2632} {"train_loss": -24.65645408630371, "global_step": 218470, "epoch": 2632} {"train_loss": -24.746000289916992, "global_step": 218471, "epoch": 2632} {"train_loss": -24.668432235717773, "global_step": 218472, "epoch": 2632} {"train_loss": -24.705215454101562, "global_step": 218473, "epoch": 2632} {"train_loss": -24.553918838500977, "global_step": 218474, "epoch": 2632} {"train_loss": -24.35259437561035, "global_step": 218475, "epoch": 2632} {"train_loss": -24.543485641479492, "global_step": 218476, "epoch": 2632} {"train_loss": -24.176843643188477, "global_step": 218477, "epoch": 2632} {"train_loss": -24.91236686706543, "global_step": 218478, "epoch": 2632} {"train_loss": -24.45074462890625, "global_step": 218479, "epoch": 2632} {"train_loss": -24.395097732543945, "global_step": 218480, "epoch": 2632} {"train_loss": -24.457881927490234, "global_step": 218481, "epoch": 2632} {"train_loss": -24.271562576293945, "global_step": 218482, "epoch": 2632} {"train_loss": -24.5500431060791, "global_step": 218483, "epoch": 2632} {"train_loss": -24.32794761657715, "global_step": 218484, "epoch": 2632} {"train_loss": -24.11713981628418, "global_step": 218485, "epoch": 2632} {"train_loss": -24.2817325592041, "global_step": 218486, "epoch": 2632} {"train_loss": -24.835586547851562, "global_step": 218487, "epoch": 2632} {"train_loss": -24.367446899414062, "global_step": 218488, "epoch": 2632} {"train_loss": -24.74786949157715, "global_step": 218489, "epoch": 2632} {"train_loss": -24.59455680847168, "global_step": 218490, "epoch": 2632} {"train_loss": -24.245817184448242, "global_step": 218491, "epoch": 2632} {"train_loss": -24.910091400146484, "global_step": 218492, "epoch": 2632} {"train_loss": -24.9444637298584, "global_step": 218493, "epoch": 2632} {"train_loss": -24.636337280273438, "global_step": 218494, "epoch": 2632} {"train_loss": -24.72492027282715, "global_step": 218495, "epoch": 2632} {"train_loss": -24.57509422302246, "global_step": 218496, "epoch": 2632} {"train_loss": -24.843978881835938, "global_step": 218497, "epoch": 2632} {"train_loss": -24.307296752929688, "global_step": 218498, "epoch": 2632} {"train_loss": -24.582693099975586, "global_step": 218499, "epoch": 2632} {"train_loss": -24.408554077148438, "global_step": 218500, "epoch": 2632} {"train_loss": -24.551321029663086, "global_step": 218501, "epoch": 2632} {"train_loss": -24.428300857543945, "global_step": 218502, "epoch": 2632} {"train_loss": -24.3646297454834, "global_step": 218503, "epoch": 2632} {"train_loss": -24.284061431884766, "global_step": 218504, "epoch": 2632} {"train_loss": -24.45412254333496, "global_step": 218505, "epoch": 2632} {"train_loss": -24.560068130493164, "global_step": 218506, "epoch": 2632} {"train_loss": -24.51535987854004, "global_step": 218507, "epoch": 2632} {"train_loss": -24.720449447631836, "global_step": 218508, "epoch": 2632} {"train_loss": -24.765308380126953, "global_step": 218509, "epoch": 2632} {"train_loss": -24.229934692382812, "global_step": 218510, "epoch": 2632} {"train_loss": -24.758872985839844, "global_step": 218511, "epoch": 2632} {"train_loss": -24.314838409423828, "global_step": 218512, "epoch": 2632} {"train_loss": -24.558486938476562, "global_step": 218513, "epoch": 2632} {"train_loss": -24.975934982299805, "global_step": 218514, "epoch": 2632} {"train_loss": -24.678861618041992, "global_step": 218515, "epoch": 2632} {"train_loss": -24.533100128173828, "global_step": 218516, "epoch": 2632} {"train_loss": -24.668548583984375, "global_step": 218517, "epoch": 2632} {"train_loss": -24.75724983215332, "global_step": 218518, "epoch": 2632} {"train_loss": -24.334182739257812, "global_step": 218519, "epoch": 2632} {"train_loss": -24.630727767944336, "global_step": 218520, "epoch": 2632} {"train_loss": -24.844425201416016, "global_step": 218521, "epoch": 2632} {"train_loss": -24.377445220947266, "global_step": 218522, "epoch": 2632} {"train_loss": -24.788475036621094, "global_step": 218523, "epoch": 2632} {"train_loss": -24.524280548095703, "global_step": 218524, "epoch": 2632} {"train_loss": -24.52008628845215, "global_step": 218525, "epoch": 2632} {"train_loss": -24.80327033996582, "global_step": 218526, "epoch": 2632} {"train_loss": -24.7896785736084, "global_step": 218527, "epoch": 2632} {"train_loss": -24.698163986206055, "global_step": 218528, "epoch": 2632} {"train_loss": -24.549530029296875, "global_step": 218529, "epoch": 2632} {"train_loss": -24.59209632873535, "global_step": 218530, "epoch": 2632} {"train_loss": -24.648176193237305, "global_step": 218531, "epoch": 2632} {"train_loss": -24.685558319091797, "global_step": 218532, "epoch": 2632} {"train_loss": -24.34271812438965, "global_step": 218533, "epoch": 2632} {"train_loss": -25.170562744140625, "global_step": 218534, "epoch": 2632} {"train_loss": -24.74107551574707, "global_step": 218535, "epoch": 2632} {"train_loss": -24.91529083251953, "global_step": 218536, "epoch": 2632} {"train_loss": -24.73383903503418, "global_step": 218537, "epoch": 2632} {"train_loss": -24.574416378894483, "global_step": 218538, "epoch": 2632, "val_loss": 6565496.0} {"train_loss": -23.883852005004883, "global_step": 218539, "epoch": 2633} {"train_loss": -23.114240646362305, "global_step": 218540, "epoch": 2633} {"train_loss": -23.713565826416016, "global_step": 218541, "epoch": 2633} {"train_loss": -23.678714752197266, "global_step": 218542, "epoch": 2633} {"train_loss": -24.151418685913086, "global_step": 218543, "epoch": 2633} {"train_loss": -23.513139724731445, "global_step": 218544, "epoch": 2633} {"train_loss": -24.23610496520996, "global_step": 218545, "epoch": 2633} {"train_loss": -23.60333251953125, "global_step": 218546, "epoch": 2633} {"train_loss": -24.383602142333984, "global_step": 218547, "epoch": 2633} {"train_loss": -24.250761032104492, "global_step": 218548, "epoch": 2633} {"train_loss": -24.193613052368164, "global_step": 218549, "epoch": 2633} {"train_loss": -24.657026290893555, "global_step": 218550, "epoch": 2633} {"train_loss": -23.977741241455078, "global_step": 218551, "epoch": 2633} {"train_loss": -24.355785369873047, "global_step": 218552, "epoch": 2633} {"train_loss": -24.18808364868164, "global_step": 218553, "epoch": 2633} {"train_loss": -24.455066680908203, "global_step": 218554, "epoch": 2633} {"train_loss": -23.9958553314209, "global_step": 218555, "epoch": 2633} {"train_loss": -24.11333656311035, "global_step": 218556, "epoch": 2633} {"train_loss": -24.347448348999023, "global_step": 218557, "epoch": 2633} {"train_loss": -24.280078887939453, "global_step": 218558, "epoch": 2633} {"train_loss": -24.025293350219727, "global_step": 218559, "epoch": 2633} {"train_loss": -24.642850875854492, "global_step": 218560, "epoch": 2633} {"train_loss": -24.508996963500977, "global_step": 218561, "epoch": 2633} {"train_loss": -24.486902236938477, "global_step": 218562, "epoch": 2633} {"train_loss": -24.354328155517578, "global_step": 218563, "epoch": 2633} {"train_loss": -24.100675582885742, "global_step": 218564, "epoch": 2633} {"train_loss": -24.51318359375, "global_step": 218565, "epoch": 2633} {"train_loss": -23.99964714050293, "global_step": 218566, "epoch": 2633} {"train_loss": -24.313980102539062, "global_step": 218567, "epoch": 2633} {"train_loss": -24.578073501586914, "global_step": 218568, "epoch": 2633} {"train_loss": -24.68607521057129, "global_step": 218569, "epoch": 2633} {"train_loss": -24.700841903686523, "global_step": 218570, "epoch": 2633} {"train_loss": -24.690898895263672, "global_step": 218571, "epoch": 2633} {"train_loss": -24.430789947509766, "global_step": 218572, "epoch": 2633} {"train_loss": -24.773073196411133, "global_step": 218573, "epoch": 2633} {"train_loss": -24.756072998046875, "global_step": 218574, "epoch": 2633} {"train_loss": -24.726734161376953, "global_step": 218575, "epoch": 2633} {"train_loss": -24.67767333984375, "global_step": 218576, "epoch": 2633} {"train_loss": -24.807239532470703, "global_step": 218577, "epoch": 2633} {"train_loss": -24.372520446777344, "global_step": 218578, "epoch": 2633} {"train_loss": -24.521574020385742, "global_step": 218579, "epoch": 2633} {"train_loss": -24.74171257019043, "global_step": 218580, "epoch": 2633} {"train_loss": -24.38926124572754, "global_step": 218581, "epoch": 2633} {"train_loss": -24.62556266784668, "global_step": 218582, "epoch": 2633} {"train_loss": -24.902225494384766, "global_step": 218583, "epoch": 2633} {"train_loss": -24.79193687438965, "global_step": 218584, "epoch": 2633} {"train_loss": -24.919546127319336, "global_step": 218585, "epoch": 2633} {"train_loss": -24.77018165588379, "global_step": 218586, "epoch": 2633} {"train_loss": -24.595922470092773, "global_step": 218587, "epoch": 2633} {"train_loss": -24.681133270263672, "global_step": 218588, "epoch": 2633} {"train_loss": -24.801868438720703, "global_step": 218589, "epoch": 2633} {"train_loss": -24.67662239074707, "global_step": 218590, "epoch": 2633} {"train_loss": -24.373123168945312, "global_step": 218591, "epoch": 2633} {"train_loss": -24.11444091796875, "global_step": 218592, "epoch": 2633} {"train_loss": -23.944238662719727, "global_step": 218593, "epoch": 2633} {"train_loss": -23.878828048706055, "global_step": 218594, "epoch": 2633} {"train_loss": -24.597455978393555, "global_step": 218595, "epoch": 2633} {"train_loss": -24.84048080444336, "global_step": 218596, "epoch": 2633} {"train_loss": -24.35274887084961, "global_step": 218597, "epoch": 2633} {"train_loss": -24.8575439453125, "global_step": 218598, "epoch": 2633} {"train_loss": -24.616069793701172, "global_step": 218599, "epoch": 2633} {"train_loss": -24.456222534179688, "global_step": 218600, "epoch": 2633} {"train_loss": -24.63336753845215, "global_step": 218601, "epoch": 2633} {"train_loss": -24.782644271850586, "global_step": 218602, "epoch": 2633} {"train_loss": -24.525205612182617, "global_step": 218603, "epoch": 2633} {"train_loss": -23.965513229370117, "global_step": 218604, "epoch": 2633} {"train_loss": -24.81856346130371, "global_step": 218605, "epoch": 2633} {"train_loss": -24.18254280090332, "global_step": 218606, "epoch": 2633} {"train_loss": -24.534961700439453, "global_step": 218607, "epoch": 2633} {"train_loss": -24.63612937927246, "global_step": 218608, "epoch": 2633} {"train_loss": -24.7287654876709, "global_step": 218609, "epoch": 2633} {"train_loss": -24.765775680541992, "global_step": 218610, "epoch": 2633} {"train_loss": -24.346799850463867, "global_step": 218611, "epoch": 2633} {"train_loss": -25.09136199951172, "global_step": 218612, "epoch": 2633} {"train_loss": -24.4708309173584, "global_step": 218613, "epoch": 2633} {"train_loss": -24.45916748046875, "global_step": 218614, "epoch": 2633} {"train_loss": -24.677001953125, "global_step": 218615, "epoch": 2633} {"train_loss": -24.8947696685791, "global_step": 218616, "epoch": 2633} {"train_loss": -24.53082847595215, "global_step": 218617, "epoch": 2633} {"train_loss": -24.767255783081055, "global_step": 218618, "epoch": 2633} {"train_loss": -24.52247428894043, "global_step": 218619, "epoch": 2633} {"train_loss": -24.472232818603516, "global_step": 218620, "epoch": 2633} {"train_loss": -24.44078013408615, "global_step": 218621, "epoch": 2633, "val_loss": 6610296.0} {"train_loss": -24.71731948852539, "global_step": 218622, "epoch": 2634} {"train_loss": -24.005491256713867, "global_step": 218623, "epoch": 2634} {"train_loss": -23.994985580444336, "global_step": 218624, "epoch": 2634} {"train_loss": -24.426990509033203, "global_step": 218625, "epoch": 2634} {"train_loss": -24.39769172668457, "global_step": 218626, "epoch": 2634} {"train_loss": -24.576828002929688, "global_step": 218627, "epoch": 2634} {"train_loss": -24.739276885986328, "global_step": 218628, "epoch": 2634} {"train_loss": -24.255117416381836, "global_step": 218629, "epoch": 2634} {"train_loss": -24.227828979492188, "global_step": 218630, "epoch": 2634} {"train_loss": -24.193506240844727, "global_step": 218631, "epoch": 2634} {"train_loss": -24.23160171508789, "global_step": 218632, "epoch": 2634} {"train_loss": -23.994121551513672, "global_step": 218633, "epoch": 2634} {"train_loss": -24.8933048248291, "global_step": 218634, "epoch": 2634} {"train_loss": -24.493938446044922, "global_step": 218635, "epoch": 2634} {"train_loss": -24.418521881103516, "global_step": 218636, "epoch": 2634} {"train_loss": -24.45701026916504, "global_step": 218637, "epoch": 2634} {"train_loss": -24.59107780456543, "global_step": 218638, "epoch": 2634} {"train_loss": -24.60892105102539, "global_step": 218639, "epoch": 2634} {"train_loss": -24.838224411010742, "global_step": 218640, "epoch": 2634} {"train_loss": -24.812070846557617, "global_step": 218641, "epoch": 2634} {"train_loss": -24.336978912353516, "global_step": 218642, "epoch": 2634} {"train_loss": -24.530067443847656, "global_step": 218643, "epoch": 2634} {"train_loss": -24.117822647094727, "global_step": 218644, "epoch": 2634} {"train_loss": -24.4862003326416, "global_step": 218645, "epoch": 2634} {"train_loss": -24.351654052734375, "global_step": 218646, "epoch": 2634} {"train_loss": -24.84598159790039, "global_step": 218647, "epoch": 2634} {"train_loss": -24.580013275146484, "global_step": 218648, "epoch": 2634} {"train_loss": -24.427541732788086, "global_step": 218649, "epoch": 2634} {"train_loss": -24.953134536743164, "global_step": 218650, "epoch": 2634} {"train_loss": -24.540971755981445, "global_step": 218651, "epoch": 2634} {"train_loss": -24.454734802246094, "global_step": 218652, "epoch": 2634} {"train_loss": -24.714914321899414, "global_step": 218653, "epoch": 2634} {"train_loss": -24.737293243408203, "global_step": 218654, "epoch": 2634} {"train_loss": -24.843952178955078, "global_step": 218655, "epoch": 2634} {"train_loss": -24.623815536499023, "global_step": 218656, "epoch": 2634} {"train_loss": -24.99953269958496, "global_step": 218657, "epoch": 2634} {"train_loss": -24.645803451538086, "global_step": 218658, "epoch": 2634} {"train_loss": -24.880155563354492, "global_step": 218659, "epoch": 2634} {"train_loss": -24.49019432067871, "global_step": 218660, "epoch": 2634} {"train_loss": -24.486433029174805, "global_step": 218661, "epoch": 2634} {"train_loss": -24.752737045288086, "global_step": 218662, "epoch": 2634} {"train_loss": -24.529991149902344, "global_step": 218663, "epoch": 2634} {"train_loss": -24.9006290435791, "global_step": 218664, "epoch": 2634} {"train_loss": -24.653207778930664, "global_step": 218665, "epoch": 2634} {"train_loss": -25.030399322509766, "global_step": 218666, "epoch": 2634} {"train_loss": -24.768680572509766, "global_step": 218667, "epoch": 2634} {"train_loss": -24.6058406829834, "global_step": 218668, "epoch": 2634} {"train_loss": -24.313955307006836, "global_step": 218669, "epoch": 2634} {"train_loss": -24.615415573120117, "global_step": 218670, "epoch": 2634} {"train_loss": -24.256399154663086, "global_step": 218671, "epoch": 2634} {"train_loss": -25.101856231689453, "global_step": 218672, "epoch": 2634} {"train_loss": -24.477697372436523, "global_step": 218673, "epoch": 2634} {"train_loss": -24.36147117614746, "global_step": 218674, "epoch": 2634} {"train_loss": -24.24472999572754, "global_step": 218675, "epoch": 2634} {"train_loss": -24.338214874267578, "global_step": 218676, "epoch": 2634} {"train_loss": -24.409269332885742, "global_step": 218677, "epoch": 2634} {"train_loss": -24.261098861694336, "global_step": 218678, "epoch": 2634} {"train_loss": -24.556129455566406, "global_step": 218679, "epoch": 2634} {"train_loss": -24.251630783081055, "global_step": 218680, "epoch": 2634} {"train_loss": -24.49563217163086, "global_step": 218681, "epoch": 2634} {"train_loss": -24.415639877319336, "global_step": 218682, "epoch": 2634} {"train_loss": -24.548681259155273, "global_step": 218683, "epoch": 2634} {"train_loss": -24.46234703063965, "global_step": 218684, "epoch": 2634} {"train_loss": -24.587993621826172, "global_step": 218685, "epoch": 2634} {"train_loss": -24.655065536499023, "global_step": 218686, "epoch": 2634} {"train_loss": -24.621814727783203, "global_step": 218687, "epoch": 2634} {"train_loss": -24.714574813842773, "global_step": 218688, "epoch": 2634} {"train_loss": -24.77032470703125, "global_step": 218689, "epoch": 2634} {"train_loss": -24.91353416442871, "global_step": 218690, "epoch": 2634} {"train_loss": -24.638200759887695, "global_step": 218691, "epoch": 2634} {"train_loss": -24.724777221679688, "global_step": 218692, "epoch": 2634} {"train_loss": -24.689701080322266, "global_step": 218693, "epoch": 2634} {"train_loss": -24.64173698425293, "global_step": 218694, "epoch": 2634} {"train_loss": -24.575380325317383, "global_step": 218695, "epoch": 2634} {"train_loss": -24.236650466918945, "global_step": 218696, "epoch": 2634} {"train_loss": -24.979639053344727, "global_step": 218697, "epoch": 2634} {"train_loss": -24.486608505249023, "global_step": 218698, "epoch": 2634} {"train_loss": -24.610998153686523, "global_step": 218699, "epoch": 2634} {"train_loss": -24.947980880737305, "global_step": 218700, "epoch": 2634} {"train_loss": -24.423837661743164, "global_step": 218701, "epoch": 2634} {"train_loss": -24.451025009155273, "global_step": 218702, "epoch": 2634} {"train_loss": -24.599327087402344, "global_step": 218703, "epoch": 2634} {"train_loss": -24.569521869521544, "global_step": 218704, "epoch": 2634, "val_loss": 6586960.0} {"train_loss": -22.11531639099121, "global_step": 218705, "epoch": 2635} {"train_loss": -21.713180541992188, "global_step": 218706, "epoch": 2635} {"train_loss": -21.947816848754883, "global_step": 218707, "epoch": 2635} {"train_loss": -23.21791648864746, "global_step": 218708, "epoch": 2635} {"train_loss": -22.387182235717773, "global_step": 218709, "epoch": 2635} {"train_loss": -23.574575424194336, "global_step": 218710, "epoch": 2635} {"train_loss": -22.773059844970703, "global_step": 218711, "epoch": 2635} {"train_loss": -23.5465030670166, "global_step": 218712, "epoch": 2635} {"train_loss": -23.1794490814209, "global_step": 218713, "epoch": 2635} {"train_loss": -23.35703468322754, "global_step": 218714, "epoch": 2635} {"train_loss": -23.07135581970215, "global_step": 218715, "epoch": 2635} {"train_loss": -23.635848999023438, "global_step": 218716, "epoch": 2635} {"train_loss": -23.57834815979004, "global_step": 218717, "epoch": 2635} {"train_loss": -23.084646224975586, "global_step": 218718, "epoch": 2635} {"train_loss": -23.54977798461914, "global_step": 218719, "epoch": 2635} {"train_loss": -23.737939834594727, "global_step": 218720, "epoch": 2635} {"train_loss": -23.830862045288086, "global_step": 218721, "epoch": 2635} {"train_loss": -23.721128463745117, "global_step": 218722, "epoch": 2635} {"train_loss": -23.673105239868164, "global_step": 218723, "epoch": 2635} {"train_loss": -23.902511596679688, "global_step": 218724, "epoch": 2635} {"train_loss": -23.609243392944336, "global_step": 218725, "epoch": 2635} {"train_loss": -24.229848861694336, "global_step": 218726, "epoch": 2635} {"train_loss": -23.73834228515625, "global_step": 218727, "epoch": 2635} {"train_loss": -23.958967208862305, "global_step": 218728, "epoch": 2635} {"train_loss": -24.116445541381836, "global_step": 218729, "epoch": 2635} {"train_loss": -24.031938552856445, "global_step": 218730, "epoch": 2635} {"train_loss": -23.82659149169922, "global_step": 218731, "epoch": 2635} {"train_loss": -24.08111572265625, "global_step": 218732, "epoch": 2635} {"train_loss": -23.852949142456055, "global_step": 218733, "epoch": 2635} {"train_loss": -24.301252365112305, "global_step": 218734, "epoch": 2635} {"train_loss": -23.9926815032959, "global_step": 218735, "epoch": 2635} {"train_loss": -24.290435791015625, "global_step": 218736, "epoch": 2635} {"train_loss": -24.540403366088867, "global_step": 218737, "epoch": 2635} {"train_loss": -24.232465744018555, "global_step": 218738, "epoch": 2635} {"train_loss": -24.306623458862305, "global_step": 218739, "epoch": 2635} {"train_loss": -24.47731590270996, "global_step": 218740, "epoch": 2635} {"train_loss": -24.42156982421875, "global_step": 218741, "epoch": 2635} {"train_loss": -24.07980728149414, "global_step": 218742, "epoch": 2635} {"train_loss": -24.767099380493164, "global_step": 218743, "epoch": 2635} {"train_loss": -24.409423828125, "global_step": 218744, "epoch": 2635} {"train_loss": -24.495685577392578, "global_step": 218745, "epoch": 2635} {"train_loss": -24.70598793029785, "global_step": 218746, "epoch": 2635} {"train_loss": -24.401092529296875, "global_step": 218747, "epoch": 2635} {"train_loss": -24.754024505615234, "global_step": 218748, "epoch": 2635} {"train_loss": -24.514936447143555, "global_step": 218749, "epoch": 2635} {"train_loss": -24.485166549682617, "global_step": 218750, "epoch": 2635} {"train_loss": -24.564945220947266, "global_step": 218751, "epoch": 2635} {"train_loss": -24.897470474243164, "global_step": 218752, "epoch": 2635} {"train_loss": -24.440841674804688, "global_step": 218753, "epoch": 2635} {"train_loss": -24.78989028930664, "global_step": 218754, "epoch": 2635} {"train_loss": -24.63111686706543, "global_step": 218755, "epoch": 2635} {"train_loss": -24.548986434936523, "global_step": 218756, "epoch": 2635} {"train_loss": -24.773300170898438, "global_step": 218757, "epoch": 2635} {"train_loss": -24.86327362060547, "global_step": 218758, "epoch": 2635} {"train_loss": -24.85071563720703, "global_step": 218759, "epoch": 2635} {"train_loss": -25.012622833251953, "global_step": 218760, "epoch": 2635} {"train_loss": -24.518957138061523, "global_step": 218761, "epoch": 2635} {"train_loss": -24.39999771118164, "global_step": 218762, "epoch": 2635} {"train_loss": -24.89772605895996, "global_step": 218763, "epoch": 2635} {"train_loss": -24.792516708374023, "global_step": 218764, "epoch": 2635} {"train_loss": -24.5369873046875, "global_step": 218765, "epoch": 2635} {"train_loss": -24.651182174682617, "global_step": 218766, "epoch": 2635} {"train_loss": -24.440250396728516, "global_step": 218767, "epoch": 2635} {"train_loss": -24.568437576293945, "global_step": 218768, "epoch": 2635} {"train_loss": -24.54326820373535, "global_step": 218769, "epoch": 2635} {"train_loss": -24.090614318847656, "global_step": 218770, "epoch": 2635} {"train_loss": -24.939664840698242, "global_step": 218771, "epoch": 2635} {"train_loss": -25.014846801757812, "global_step": 218772, "epoch": 2635} {"train_loss": -24.724655151367188, "global_step": 218773, "epoch": 2635} {"train_loss": -24.5534610748291, "global_step": 218774, "epoch": 2635} {"train_loss": -24.73624610900879, "global_step": 218775, "epoch": 2635} {"train_loss": -24.69953727722168, "global_step": 218776, "epoch": 2635} {"train_loss": -24.5019588470459, "global_step": 218777, "epoch": 2635} {"train_loss": -24.2034912109375, "global_step": 218778, "epoch": 2635} {"train_loss": -24.560148239135742, "global_step": 218779, "epoch": 2635} {"train_loss": -24.8095703125, "global_step": 218780, "epoch": 2635} {"train_loss": -24.641490936279297, "global_step": 218781, "epoch": 2635} {"train_loss": -24.512243270874023, "global_step": 218782, "epoch": 2635} {"train_loss": -24.314619064331055, "global_step": 218783, "epoch": 2635} {"train_loss": -24.376083374023438, "global_step": 218784, "epoch": 2635} {"train_loss": -24.84078025817871, "global_step": 218785, "epoch": 2635} {"train_loss": -24.329269409179688, "global_step": 218786, "epoch": 2635} {"train_loss": -24.1473560792854, "global_step": 218787, "epoch": 2635, "val_loss": 6691796.0} {"train_loss": -23.976972579956055, "global_step": 218788, "epoch": 2636} {"train_loss": -24.215185165405273, "global_step": 218789, "epoch": 2636} {"train_loss": -24.158300399780273, "global_step": 218790, "epoch": 2636} {"train_loss": -24.105920791625977, "global_step": 218791, "epoch": 2636} {"train_loss": -24.255207061767578, "global_step": 218792, "epoch": 2636} {"train_loss": -24.36119270324707, "global_step": 218793, "epoch": 2636} {"train_loss": -23.988927841186523, "global_step": 218794, "epoch": 2636} {"train_loss": -24.54020881652832, "global_step": 218795, "epoch": 2636} {"train_loss": -24.454174041748047, "global_step": 218796, "epoch": 2636} {"train_loss": -24.18433380126953, "global_step": 218797, "epoch": 2636} {"train_loss": -24.411603927612305, "global_step": 218798, "epoch": 2636} {"train_loss": -24.310699462890625, "global_step": 218799, "epoch": 2636} {"train_loss": -24.40460777282715, "global_step": 218800, "epoch": 2636} {"train_loss": -24.71851921081543, "global_step": 218801, "epoch": 2636} {"train_loss": -24.555038452148438, "global_step": 218802, "epoch": 2636} {"train_loss": -24.4135684967041, "global_step": 218803, "epoch": 2636} {"train_loss": -24.596532821655273, "global_step": 218804, "epoch": 2636} {"train_loss": -24.37471580505371, "global_step": 218805, "epoch": 2636} {"train_loss": -24.17119598388672, "global_step": 218806, "epoch": 2636} {"train_loss": -24.3599796295166, "global_step": 218807, "epoch": 2636} {"train_loss": -24.612272262573242, "global_step": 218808, "epoch": 2636} {"train_loss": -24.422475814819336, "global_step": 218809, "epoch": 2636} {"train_loss": -24.2063045501709, "global_step": 218810, "epoch": 2636} {"train_loss": -24.442691802978516, "global_step": 218811, "epoch": 2636} {"train_loss": -24.77312660217285, "global_step": 218812, "epoch": 2636} {"train_loss": -24.278413772583008, "global_step": 218813, "epoch": 2636} {"train_loss": -25.065006256103516, "global_step": 218814, "epoch": 2636} {"train_loss": -24.513113021850586, "global_step": 218815, "epoch": 2636} {"train_loss": -24.054941177368164, "global_step": 218816, "epoch": 2636} {"train_loss": -24.427133560180664, "global_step": 218817, "epoch": 2636} {"train_loss": -25.03407096862793, "global_step": 218818, "epoch": 2636} {"train_loss": -24.932096481323242, "global_step": 218819, "epoch": 2636} {"train_loss": -24.758272171020508, "global_step": 218820, "epoch": 2636} {"train_loss": -24.7341365814209, "global_step": 218821, "epoch": 2636} {"train_loss": -24.731454849243164, "global_step": 218822, "epoch": 2636} {"train_loss": -25.154756546020508, "global_step": 218823, "epoch": 2636} {"train_loss": -24.687578201293945, "global_step": 218824, "epoch": 2636} {"train_loss": -24.529937744140625, "global_step": 218825, "epoch": 2636} {"train_loss": -24.64752769470215, "global_step": 218826, "epoch": 2636} {"train_loss": -24.459142684936523, "global_step": 218827, "epoch": 2636} {"train_loss": -24.247413635253906, "global_step": 218828, "epoch": 2636} {"train_loss": -24.650028228759766, "global_step": 218829, "epoch": 2636} {"train_loss": -24.72336769104004, "global_step": 218830, "epoch": 2636} {"train_loss": -24.5533447265625, "global_step": 218831, "epoch": 2636} {"train_loss": -24.826019287109375, "global_step": 218832, "epoch": 2636} {"train_loss": -24.524259567260742, "global_step": 218833, "epoch": 2636} {"train_loss": -24.51712417602539, "global_step": 218834, "epoch": 2636} {"train_loss": -24.538026809692383, "global_step": 218835, "epoch": 2636} {"train_loss": -24.251258850097656, "global_step": 218836, "epoch": 2636} {"train_loss": -24.606237411499023, "global_step": 218837, "epoch": 2636} {"train_loss": -24.92118263244629, "global_step": 218838, "epoch": 2636} {"train_loss": -24.736982345581055, "global_step": 218839, "epoch": 2636} {"train_loss": -24.315847396850586, "global_step": 218840, "epoch": 2636} {"train_loss": -24.26609230041504, "global_step": 218841, "epoch": 2636} {"train_loss": -24.4005126953125, "global_step": 218842, "epoch": 2636} {"train_loss": -24.34638786315918, "global_step": 218843, "epoch": 2636} {"train_loss": -24.609891891479492, "global_step": 218844, "epoch": 2636} {"train_loss": -24.376253128051758, "global_step": 218845, "epoch": 2636} {"train_loss": -24.762903213500977, "global_step": 218846, "epoch": 2636} {"train_loss": -24.520273208618164, "global_step": 218847, "epoch": 2636} {"train_loss": -24.34736442565918, "global_step": 218848, "epoch": 2636} {"train_loss": -24.207250595092773, "global_step": 218849, "epoch": 2636} {"train_loss": -24.264188766479492, "global_step": 218850, "epoch": 2636} {"train_loss": -24.41316032409668, "global_step": 218851, "epoch": 2636} {"train_loss": -24.844633102416992, "global_step": 218852, "epoch": 2636} {"train_loss": -24.413772583007812, "global_step": 218853, "epoch": 2636} {"train_loss": -24.19298553466797, "global_step": 218854, "epoch": 2636} {"train_loss": -24.407062530517578, "global_step": 218855, "epoch": 2636} {"train_loss": -24.312456130981445, "global_step": 218856, "epoch": 2636} {"train_loss": -24.926733016967773, "global_step": 218857, "epoch": 2636} {"train_loss": -24.351581573486328, "global_step": 218858, "epoch": 2636} {"train_loss": -24.63726806640625, "global_step": 218859, "epoch": 2636} {"train_loss": -24.596391677856445, "global_step": 218860, "epoch": 2636} {"train_loss": -24.663190841674805, "global_step": 218861, "epoch": 2636} {"train_loss": -24.877023696899414, "global_step": 218862, "epoch": 2636} {"train_loss": -24.660850524902344, "global_step": 218863, "epoch": 2636} {"train_loss": -24.6141414642334, "global_step": 218864, "epoch": 2636} {"train_loss": -24.677671432495117, "global_step": 218865, "epoch": 2636} {"train_loss": -24.52704429626465, "global_step": 218866, "epoch": 2636} {"train_loss": -24.628087997436523, "global_step": 218867, "epoch": 2636} {"train_loss": -24.60392951965332, "global_step": 218868, "epoch": 2636} {"train_loss": -24.880247116088867, "global_step": 218869, "epoch": 2636} {"train_loss": -24.51608731373247, "global_step": 218870, "epoch": 2636, "val_loss": 6585154.0} {"train_loss": -24.12607765197754, "global_step": 218871, "epoch": 2637} {"train_loss": -23.63886070251465, "global_step": 218872, "epoch": 2637} {"train_loss": -23.98542594909668, "global_step": 218873, "epoch": 2637} {"train_loss": -24.387500762939453, "global_step": 218874, "epoch": 2637} {"train_loss": -24.203460693359375, "global_step": 218875, "epoch": 2637} {"train_loss": -24.025644302368164, "global_step": 218876, "epoch": 2637} {"train_loss": -24.092008590698242, "global_step": 218877, "epoch": 2637} {"train_loss": -24.554462432861328, "global_step": 218878, "epoch": 2637} {"train_loss": -23.958683013916016, "global_step": 218879, "epoch": 2637} {"train_loss": -24.134357452392578, "global_step": 218880, "epoch": 2637} {"train_loss": -24.358806610107422, "global_step": 218881, "epoch": 2637} {"train_loss": -24.226667404174805, "global_step": 218882, "epoch": 2637} {"train_loss": -24.24030113220215, "global_step": 218883, "epoch": 2637} {"train_loss": -24.700525283813477, "global_step": 218884, "epoch": 2637} {"train_loss": -24.35279083251953, "global_step": 218885, "epoch": 2637} {"train_loss": -24.57539939880371, "global_step": 218886, "epoch": 2637} {"train_loss": -24.60274314880371, "global_step": 218887, "epoch": 2637} {"train_loss": -24.48084831237793, "global_step": 218888, "epoch": 2637} {"train_loss": -24.12827491760254, "global_step": 218889, "epoch": 2637} {"train_loss": -24.549396514892578, "global_step": 218890, "epoch": 2637} {"train_loss": -24.261009216308594, "global_step": 218891, "epoch": 2637} {"train_loss": -24.337305068969727, "global_step": 218892, "epoch": 2637} {"train_loss": -24.436155319213867, "global_step": 218893, "epoch": 2637} {"train_loss": -24.459915161132812, "global_step": 218894, "epoch": 2637} {"train_loss": -24.808059692382812, "global_step": 218895, "epoch": 2637} {"train_loss": -24.694740295410156, "global_step": 218896, "epoch": 2637} {"train_loss": -24.620941162109375, "global_step": 218897, "epoch": 2637} {"train_loss": -24.610946655273438, "global_step": 218898, "epoch": 2637} {"train_loss": -24.581872940063477, "global_step": 218899, "epoch": 2637} {"train_loss": -24.723005294799805, "global_step": 218900, "epoch": 2637} {"train_loss": -24.334482192993164, "global_step": 218901, "epoch": 2637} {"train_loss": -24.8558349609375, "global_step": 218902, "epoch": 2637} {"train_loss": -24.78011131286621, "global_step": 218903, "epoch": 2637} {"train_loss": -24.536909103393555, "global_step": 218904, "epoch": 2637} {"train_loss": -24.623403549194336, "global_step": 218905, "epoch": 2637} {"train_loss": -24.7213191986084, "global_step": 218906, "epoch": 2637} {"train_loss": -24.47052001953125, "global_step": 218907, "epoch": 2637} {"train_loss": -24.991073608398438, "global_step": 218908, "epoch": 2637} {"train_loss": -25.014184951782227, "global_step": 218909, "epoch": 2637} {"train_loss": -24.485904693603516, "global_step": 218910, "epoch": 2637} {"train_loss": -25.06294822692871, "global_step": 218911, "epoch": 2637} {"train_loss": -24.529916763305664, "global_step": 218912, "epoch": 2637} {"train_loss": -24.772274017333984, "global_step": 218913, "epoch": 2637} {"train_loss": -24.48933219909668, "global_step": 218914, "epoch": 2637} {"train_loss": -24.81551170349121, "global_step": 218915, "epoch": 2637} {"train_loss": -24.5792179107666, "global_step": 218916, "epoch": 2637} {"train_loss": -24.598962783813477, "global_step": 218917, "epoch": 2637} {"train_loss": -24.37648582458496, "global_step": 218918, "epoch": 2637} {"train_loss": -24.485280990600586, "global_step": 218919, "epoch": 2637} {"train_loss": -24.262435913085938, "global_step": 218920, "epoch": 2637} {"train_loss": -24.169187545776367, "global_step": 218921, "epoch": 2637} {"train_loss": -24.639799118041992, "global_step": 218922, "epoch": 2637} {"train_loss": -24.660390853881836, "global_step": 218923, "epoch": 2637} {"train_loss": -24.535371780395508, "global_step": 218924, "epoch": 2637} {"train_loss": -24.467329025268555, "global_step": 218925, "epoch": 2637} {"train_loss": -24.389005661010742, "global_step": 218926, "epoch": 2637} {"train_loss": -24.895483016967773, "global_step": 218927, "epoch": 2637} {"train_loss": -24.50079917907715, "global_step": 218928, "epoch": 2637} {"train_loss": -24.552736282348633, "global_step": 218929, "epoch": 2637} {"train_loss": -24.366485595703125, "global_step": 218930, "epoch": 2637} {"train_loss": -24.910829544067383, "global_step": 218931, "epoch": 2637} {"train_loss": -24.731290817260742, "global_step": 218932, "epoch": 2637} {"train_loss": -24.715349197387695, "global_step": 218933, "epoch": 2637} {"train_loss": -24.688833236694336, "global_step": 218934, "epoch": 2637} {"train_loss": -24.306127548217773, "global_step": 218935, "epoch": 2637} {"train_loss": -25.103839874267578, "global_step": 218936, "epoch": 2637} {"train_loss": -24.53824234008789, "global_step": 218937, "epoch": 2637} {"train_loss": -24.68898582458496, "global_step": 218938, "epoch": 2637} {"train_loss": -24.858373641967773, "global_step": 218939, "epoch": 2637} {"train_loss": -24.342565536499023, "global_step": 218940, "epoch": 2637} {"train_loss": -24.25752067565918, "global_step": 218941, "epoch": 2637} {"train_loss": -24.75897216796875, "global_step": 218942, "epoch": 2637} {"train_loss": -24.789508819580078, "global_step": 218943, "epoch": 2637} {"train_loss": -24.750350952148438, "global_step": 218944, "epoch": 2637} {"train_loss": -24.857770919799805, "global_step": 218945, "epoch": 2637} {"train_loss": -24.528701782226562, "global_step": 218946, "epoch": 2637} {"train_loss": -24.855945587158203, "global_step": 218947, "epoch": 2637} {"train_loss": -24.340559005737305, "global_step": 218948, "epoch": 2637} {"train_loss": -24.38738441467285, "global_step": 218949, "epoch": 2637} {"train_loss": -24.40142822265625, "global_step": 218950, "epoch": 2637} {"train_loss": -24.77988624572754, "global_step": 218951, "epoch": 2637} {"train_loss": -24.516427993774414, "global_step": 218952, "epoch": 2637} {"train_loss": -24.5508219247841, "global_step": 218953, "epoch": 2637, "val_loss": 6644821.0} {"train_loss": -23.057065963745117, "global_step": 218954, "epoch": 2638} {"train_loss": -23.1704158782959, "global_step": 218955, "epoch": 2638} {"train_loss": -23.848142623901367, "global_step": 218956, "epoch": 2638} {"train_loss": -23.996170043945312, "global_step": 218957, "epoch": 2638} {"train_loss": -23.67938995361328, "global_step": 218958, "epoch": 2638} {"train_loss": -23.601972579956055, "global_step": 218959, "epoch": 2638} {"train_loss": -23.86731719970703, "global_step": 218960, "epoch": 2638} {"train_loss": -24.034696578979492, "global_step": 218961, "epoch": 2638} {"train_loss": -24.139596939086914, "global_step": 218962, "epoch": 2638} {"train_loss": -24.09372901916504, "global_step": 218963, "epoch": 2638} {"train_loss": -24.350080490112305, "global_step": 218964, "epoch": 2638} {"train_loss": -24.401132583618164, "global_step": 218965, "epoch": 2638} {"train_loss": -24.320802688598633, "global_step": 218966, "epoch": 2638} {"train_loss": -24.361923217773438, "global_step": 218967, "epoch": 2638} {"train_loss": -24.212039947509766, "global_step": 218968, "epoch": 2638} {"train_loss": -24.213924407958984, "global_step": 218969, "epoch": 2638} {"train_loss": -24.154441833496094, "global_step": 218970, "epoch": 2638} {"train_loss": -24.52898597717285, "global_step": 218971, "epoch": 2638} {"train_loss": -24.503446578979492, "global_step": 218972, "epoch": 2638} {"train_loss": -24.207141876220703, "global_step": 218973, "epoch": 2638} {"train_loss": -24.195423126220703, "global_step": 218974, "epoch": 2638} {"train_loss": -24.236295700073242, "global_step": 218975, "epoch": 2638} {"train_loss": -24.165830612182617, "global_step": 218976, "epoch": 2638} {"train_loss": -24.469589233398438, "global_step": 218977, "epoch": 2638} {"train_loss": -24.494762420654297, "global_step": 218978, "epoch": 2638} {"train_loss": -24.4334774017334, "global_step": 218979, "epoch": 2638} {"train_loss": -24.64115333557129, "global_step": 218980, "epoch": 2638} {"train_loss": -24.40131378173828, "global_step": 218981, "epoch": 2638} {"train_loss": -24.54737663269043, "global_step": 218982, "epoch": 2638} {"train_loss": -24.733505249023438, "global_step": 218983, "epoch": 2638} {"train_loss": -24.542715072631836, "global_step": 218984, "epoch": 2638} {"train_loss": -24.52336311340332, "global_step": 218985, "epoch": 2638} {"train_loss": -24.57277488708496, "global_step": 218986, "epoch": 2638} {"train_loss": -24.334278106689453, "global_step": 218987, "epoch": 2638} {"train_loss": -24.82118797302246, "global_step": 218988, "epoch": 2638} {"train_loss": -24.55525016784668, "global_step": 218989, "epoch": 2638} {"train_loss": -24.721601486206055, "global_step": 218990, "epoch": 2638} {"train_loss": -24.745365142822266, "global_step": 218991, "epoch": 2638} {"train_loss": -24.62159538269043, "global_step": 218992, "epoch": 2638} {"train_loss": -24.589786529541016, "global_step": 218993, "epoch": 2638} {"train_loss": -24.681928634643555, "global_step": 218994, "epoch": 2638} {"train_loss": -24.73688507080078, "global_step": 218995, "epoch": 2638} {"train_loss": -24.38577651977539, "global_step": 218996, "epoch": 2638} {"train_loss": -24.68006706237793, "global_step": 218997, "epoch": 2638} {"train_loss": -24.51946449279785, "global_step": 218998, "epoch": 2638} {"train_loss": -24.69080924987793, "global_step": 218999, "epoch": 2638} {"train_loss": -24.54438591003418, "global_step": 219000, "epoch": 2638} {"train_loss": -24.662307739257812, "global_step": 219001, "epoch": 2638} {"train_loss": -24.628755569458008, "global_step": 219002, "epoch": 2638} {"train_loss": -25.051347732543945, "global_step": 219003, "epoch": 2638} {"train_loss": -24.828969955444336, "global_step": 219004, "epoch": 2638} {"train_loss": -24.65155601501465, "global_step": 219005, "epoch": 2638} {"train_loss": -24.458776473999023, "global_step": 219006, "epoch": 2638} {"train_loss": -24.62937355041504, "global_step": 219007, "epoch": 2638} {"train_loss": -24.4483585357666, "global_step": 219008, "epoch": 2638} {"train_loss": -24.51594352722168, "global_step": 219009, "epoch": 2638} {"train_loss": -24.610158920288086, "global_step": 219010, "epoch": 2638} {"train_loss": -24.638206481933594, "global_step": 219011, "epoch": 2638} {"train_loss": -24.650402069091797, "global_step": 219012, "epoch": 2638} {"train_loss": -24.89046287536621, "global_step": 219013, "epoch": 2638} {"train_loss": -24.79316520690918, "global_step": 219014, "epoch": 2638} {"train_loss": -24.4373836517334, "global_step": 219015, "epoch": 2638} {"train_loss": -24.169363021850586, "global_step": 219016, "epoch": 2638} {"train_loss": -23.969858169555664, "global_step": 219017, "epoch": 2638} {"train_loss": -24.500011444091797, "global_step": 219018, "epoch": 2638} {"train_loss": -24.60276985168457, "global_step": 219019, "epoch": 2638} {"train_loss": -24.023252487182617, "global_step": 219020, "epoch": 2638} {"train_loss": -23.784666061401367, "global_step": 219021, "epoch": 2638} {"train_loss": -24.28987693786621, "global_step": 219022, "epoch": 2638} {"train_loss": -24.56215476989746, "global_step": 219023, "epoch": 2638} {"train_loss": -24.008058547973633, "global_step": 219024, "epoch": 2638} {"train_loss": -24.292526245117188, "global_step": 219025, "epoch": 2638} {"train_loss": -24.678653717041016, "global_step": 219026, "epoch": 2638} {"train_loss": -23.983692169189453, "global_step": 219027, "epoch": 2638} {"train_loss": -24.266870498657227, "global_step": 219028, "epoch": 2638} {"train_loss": -24.306211471557617, "global_step": 219029, "epoch": 2638} {"train_loss": -24.27960777282715, "global_step": 219030, "epoch": 2638} {"train_loss": -24.954023361206055, "global_step": 219031, "epoch": 2638} {"train_loss": -24.50373649597168, "global_step": 219032, "epoch": 2638} {"train_loss": -24.417497634887695, "global_step": 219033, "epoch": 2638} {"train_loss": -24.439130783081055, "global_step": 219034, "epoch": 2638} {"train_loss": -24.513565063476562, "global_step": 219035, "epoch": 2638} {"train_loss": -24.37888166128871, "global_step": 219036, "epoch": 2638, "val_loss": 6763222.0} {"train_loss": -24.18321418762207, "global_step": 219037, "epoch": 2639} {"train_loss": -24.098011016845703, "global_step": 219038, "epoch": 2639} {"train_loss": -24.134172439575195, "global_step": 219039, "epoch": 2639} {"train_loss": -23.541440963745117, "global_step": 219040, "epoch": 2639} {"train_loss": -24.362293243408203, "global_step": 219041, "epoch": 2639} {"train_loss": -23.640140533447266, "global_step": 219042, "epoch": 2639} {"train_loss": -24.21306800842285, "global_step": 219043, "epoch": 2639} {"train_loss": -24.12281608581543, "global_step": 219044, "epoch": 2639} {"train_loss": -24.210403442382812, "global_step": 219045, "epoch": 2639} {"train_loss": -24.181079864501953, "global_step": 219046, "epoch": 2639} {"train_loss": -24.207731246948242, "global_step": 219047, "epoch": 2639} {"train_loss": -24.19057273864746, "global_step": 219048, "epoch": 2639} {"train_loss": -23.98354148864746, "global_step": 219049, "epoch": 2639} {"train_loss": -24.21681785583496, "global_step": 219050, "epoch": 2639} {"train_loss": -24.326810836791992, "global_step": 219051, "epoch": 2639} {"train_loss": -24.379331588745117, "global_step": 219052, "epoch": 2639} {"train_loss": -24.35173797607422, "global_step": 219053, "epoch": 2639} {"train_loss": -24.206647872924805, "global_step": 219054, "epoch": 2639} {"train_loss": -24.221288681030273, "global_step": 219055, "epoch": 2639} {"train_loss": -24.590347290039062, "global_step": 219056, "epoch": 2639} {"train_loss": -24.148794174194336, "global_step": 219057, "epoch": 2639} {"train_loss": -24.20027732849121, "global_step": 219058, "epoch": 2639} {"train_loss": -24.542835235595703, "global_step": 219059, "epoch": 2639} {"train_loss": -24.757780075073242, "global_step": 219060, "epoch": 2639} {"train_loss": -24.41702651977539, "global_step": 219061, "epoch": 2639} {"train_loss": -24.554285049438477, "global_step": 219062, "epoch": 2639} {"train_loss": -24.42133140563965, "global_step": 219063, "epoch": 2639} {"train_loss": -24.11471939086914, "global_step": 219064, "epoch": 2639} {"train_loss": -24.48087501525879, "global_step": 219065, "epoch": 2639} {"train_loss": -24.589582443237305, "global_step": 219066, "epoch": 2639} {"train_loss": -24.611736297607422, "global_step": 219067, "epoch": 2639} {"train_loss": -24.673410415649414, "global_step": 219068, "epoch": 2639} {"train_loss": -24.512006759643555, "global_step": 219069, "epoch": 2639} {"train_loss": -24.41341209411621, "global_step": 219070, "epoch": 2639} {"train_loss": -24.645841598510742, "global_step": 219071, "epoch": 2639} {"train_loss": -24.50929069519043, "global_step": 219072, "epoch": 2639} {"train_loss": -24.541858673095703, "global_step": 219073, "epoch": 2639} {"train_loss": -24.663700103759766, "global_step": 219074, "epoch": 2639} {"train_loss": -24.752687454223633, "global_step": 219075, "epoch": 2639} {"train_loss": -24.498613357543945, "global_step": 219076, "epoch": 2639} {"train_loss": -24.598819732666016, "global_step": 219077, "epoch": 2639} {"train_loss": -24.655920028686523, "global_step": 219078, "epoch": 2639} {"train_loss": -24.48503875732422, "global_step": 219079, "epoch": 2639} {"train_loss": -24.7653751373291, "global_step": 219080, "epoch": 2639} {"train_loss": -24.60186195373535, "global_step": 219081, "epoch": 2639} {"train_loss": -24.485668182373047, "global_step": 219082, "epoch": 2639} {"train_loss": -24.36929702758789, "global_step": 219083, "epoch": 2639} {"train_loss": -24.517160415649414, "global_step": 219084, "epoch": 2639} {"train_loss": -25.12155532836914, "global_step": 219085, "epoch": 2639} {"train_loss": -24.754505157470703, "global_step": 219086, "epoch": 2639} {"train_loss": -24.85849380493164, "global_step": 219087, "epoch": 2639} {"train_loss": -24.838058471679688, "global_step": 219088, "epoch": 2639} {"train_loss": -24.981693267822266, "global_step": 219089, "epoch": 2639} {"train_loss": -24.545730590820312, "global_step": 219090, "epoch": 2639} {"train_loss": -24.45535659790039, "global_step": 219091, "epoch": 2639} {"train_loss": -24.89566421508789, "global_step": 219092, "epoch": 2639} {"train_loss": -24.716129302978516, "global_step": 219093, "epoch": 2639} {"train_loss": -24.29340362548828, "global_step": 219094, "epoch": 2639} {"train_loss": -24.785947799682617, "global_step": 219095, "epoch": 2639} {"train_loss": -24.74629783630371, "global_step": 219096, "epoch": 2639} {"train_loss": -24.637800216674805, "global_step": 219097, "epoch": 2639} {"train_loss": -24.246362686157227, "global_step": 219098, "epoch": 2639} {"train_loss": -24.59946632385254, "global_step": 219099, "epoch": 2639} {"train_loss": -24.905609130859375, "global_step": 219100, "epoch": 2639} {"train_loss": -24.260061264038086, "global_step": 219101, "epoch": 2639} {"train_loss": -23.963544845581055, "global_step": 219102, "epoch": 2639} {"train_loss": -24.13382339477539, "global_step": 219103, "epoch": 2639} {"train_loss": -24.201135635375977, "global_step": 219104, "epoch": 2639} {"train_loss": -24.2908992767334, "global_step": 219105, "epoch": 2639} {"train_loss": -24.409391403198242, "global_step": 219106, "epoch": 2639} {"train_loss": -24.92595672607422, "global_step": 219107, "epoch": 2639} {"train_loss": -24.826229095458984, "global_step": 219108, "epoch": 2639} {"train_loss": -24.83724021911621, "global_step": 219109, "epoch": 2639} {"train_loss": -24.727313995361328, "global_step": 219110, "epoch": 2639} {"train_loss": -24.7722110748291, "global_step": 219111, "epoch": 2639} {"train_loss": -24.50661277770996, "global_step": 219112, "epoch": 2639} {"train_loss": -24.490314483642578, "global_step": 219113, "epoch": 2639} {"train_loss": -24.72751235961914, "global_step": 219114, "epoch": 2639} {"train_loss": -24.451810836791992, "global_step": 219115, "epoch": 2639} {"train_loss": -24.941211700439453, "global_step": 219116, "epoch": 2639} {"train_loss": -24.944738388061523, "global_step": 219117, "epoch": 2639} {"train_loss": -24.185148239135742, "global_step": 219118, "epoch": 2639} {"train_loss": -24.502551779689558, "global_step": 219119, "epoch": 2639, "val_loss": 6624339.0} {"train_loss": -23.996912002563477, "global_step": 219120, "epoch": 2640} {"train_loss": -24.244312286376953, "global_step": 219121, "epoch": 2640} {"train_loss": -24.136661529541016, "global_step": 219122, "epoch": 2640} {"train_loss": -24.43881607055664, "global_step": 219123, "epoch": 2640} {"train_loss": -24.069799423217773, "global_step": 219124, "epoch": 2640} {"train_loss": -23.986988067626953, "global_step": 219125, "epoch": 2640} {"train_loss": -24.291641235351562, "global_step": 219126, "epoch": 2640} {"train_loss": -24.525497436523438, "global_step": 219127, "epoch": 2640} {"train_loss": -24.00196647644043, "global_step": 219128, "epoch": 2640} {"train_loss": -24.02638816833496, "global_step": 219129, "epoch": 2640} {"train_loss": -24.378793716430664, "global_step": 219130, "epoch": 2640} {"train_loss": -24.060083389282227, "global_step": 219131, "epoch": 2640} {"train_loss": -24.6083984375, "global_step": 219132, "epoch": 2640} {"train_loss": -24.126420974731445, "global_step": 219133, "epoch": 2640} {"train_loss": -23.606765747070312, "global_step": 219134, "epoch": 2640} {"train_loss": -24.282806396484375, "global_step": 219135, "epoch": 2640} {"train_loss": -24.247648239135742, "global_step": 219136, "epoch": 2640} {"train_loss": -23.895919799804688, "global_step": 219137, "epoch": 2640} {"train_loss": -24.559436798095703, "global_step": 219138, "epoch": 2640} {"train_loss": -24.049346923828125, "global_step": 219139, "epoch": 2640} {"train_loss": -24.392995834350586, "global_step": 219140, "epoch": 2640} {"train_loss": -24.048492431640625, "global_step": 219141, "epoch": 2640} {"train_loss": -24.731430053710938, "global_step": 219142, "epoch": 2640} {"train_loss": -24.37472915649414, "global_step": 219143, "epoch": 2640} {"train_loss": -24.407655715942383, "global_step": 219144, "epoch": 2640} {"train_loss": -24.3074951171875, "global_step": 219145, "epoch": 2640} {"train_loss": -24.101842880249023, "global_step": 219146, "epoch": 2640} {"train_loss": -24.235090255737305, "global_step": 219147, "epoch": 2640} {"train_loss": -24.70296287536621, "global_step": 219148, "epoch": 2640} {"train_loss": -24.701488494873047, "global_step": 219149, "epoch": 2640} {"train_loss": -24.261978149414062, "global_step": 219150, "epoch": 2640} {"train_loss": -24.494043350219727, "global_step": 219151, "epoch": 2640} {"train_loss": -24.59160804748535, "global_step": 219152, "epoch": 2640} {"train_loss": -24.92728042602539, "global_step": 219153, "epoch": 2640} {"train_loss": -24.84744644165039, "global_step": 219154, "epoch": 2640} {"train_loss": -24.54153060913086, "global_step": 219155, "epoch": 2640} {"train_loss": -24.6358585357666, "global_step": 219156, "epoch": 2640} {"train_loss": -24.541187286376953, "global_step": 219157, "epoch": 2640} {"train_loss": -24.335973739624023, "global_step": 219158, "epoch": 2640} {"train_loss": -24.4787654876709, "global_step": 219159, "epoch": 2640} {"train_loss": -24.677734375, "global_step": 219160, "epoch": 2640} {"train_loss": -24.667463302612305, "global_step": 219161, "epoch": 2640} {"train_loss": -24.909391403198242, "global_step": 219162, "epoch": 2640} {"train_loss": -24.45712661743164, "global_step": 219163, "epoch": 2640} {"train_loss": -24.70932388305664, "global_step": 219164, "epoch": 2640} {"train_loss": -24.456134796142578, "global_step": 219165, "epoch": 2640} {"train_loss": -24.66261100769043, "global_step": 219166, "epoch": 2640} {"train_loss": -24.604238510131836, "global_step": 219167, "epoch": 2640} {"train_loss": -24.68855857849121, "global_step": 219168, "epoch": 2640} {"train_loss": -24.557065963745117, "global_step": 219169, "epoch": 2640} {"train_loss": -24.632688522338867, "global_step": 219170, "epoch": 2640} {"train_loss": -24.52540397644043, "global_step": 219171, "epoch": 2640} {"train_loss": -24.88029670715332, "global_step": 219172, "epoch": 2640} {"train_loss": -25.253116607666016, "global_step": 219173, "epoch": 2640} {"train_loss": -24.546125411987305, "global_step": 219174, "epoch": 2640} {"train_loss": -25.05075454711914, "global_step": 219175, "epoch": 2640} {"train_loss": -24.850753784179688, "global_step": 219176, "epoch": 2640} {"train_loss": -24.39509391784668, "global_step": 219177, "epoch": 2640} {"train_loss": -24.43016242980957, "global_step": 219178, "epoch": 2640} {"train_loss": -24.997039794921875, "global_step": 219179, "epoch": 2640} {"train_loss": -24.523975372314453, "global_step": 219180, "epoch": 2640} {"train_loss": -24.51576042175293, "global_step": 219181, "epoch": 2640} {"train_loss": -24.698802947998047, "global_step": 219182, "epoch": 2640} {"train_loss": -24.432641983032227, "global_step": 219183, "epoch": 2640} {"train_loss": -24.64194679260254, "global_step": 219184, "epoch": 2640} {"train_loss": -24.662235260009766, "global_step": 219185, "epoch": 2640} {"train_loss": -24.612960815429688, "global_step": 219186, "epoch": 2640} {"train_loss": -24.546676635742188, "global_step": 219187, "epoch": 2640} {"train_loss": -24.918710708618164, "global_step": 219188, "epoch": 2640} {"train_loss": -24.601398468017578, "global_step": 219189, "epoch": 2640} {"train_loss": -24.439136505126953, "global_step": 219190, "epoch": 2640} {"train_loss": -23.898136138916016, "global_step": 219191, "epoch": 2640} {"train_loss": -24.428592681884766, "global_step": 219192, "epoch": 2640} {"train_loss": -24.91818618774414, "global_step": 219193, "epoch": 2640} {"train_loss": -24.27248191833496, "global_step": 219194, "epoch": 2640} {"train_loss": -24.20229148864746, "global_step": 219195, "epoch": 2640} {"train_loss": -24.2849178314209, "global_step": 219196, "epoch": 2640} {"train_loss": -24.00924301147461, "global_step": 219197, "epoch": 2640} {"train_loss": -23.95535659790039, "global_step": 219198, "epoch": 2640} {"train_loss": -24.229511260986328, "global_step": 219199, "epoch": 2640} {"train_loss": -24.36191749572754, "global_step": 219200, "epoch": 2640} {"train_loss": -24.15319061279297, "global_step": 219201, "epoch": 2640} {"train_loss": -24.451353877423756, "global_step": 219202, "epoch": 2640, "val_loss": 6696193.5} {"train_loss": -23.523183822631836, "global_step": 219203, "epoch": 2641} {"train_loss": -24.371362686157227, "global_step": 219204, "epoch": 2641} {"train_loss": -23.616514205932617, "global_step": 219205, "epoch": 2641} {"train_loss": -23.871925354003906, "global_step": 219206, "epoch": 2641} {"train_loss": -24.079345703125, "global_step": 219207, "epoch": 2641} {"train_loss": -24.040571212768555, "global_step": 219208, "epoch": 2641} {"train_loss": -24.238998413085938, "global_step": 219209, "epoch": 2641} {"train_loss": -24.08352279663086, "global_step": 219210, "epoch": 2641} {"train_loss": -24.050432205200195, "global_step": 219211, "epoch": 2641} {"train_loss": -24.495023727416992, "global_step": 219212, "epoch": 2641} {"train_loss": -23.707019805908203, "global_step": 219213, "epoch": 2641} {"train_loss": -24.233625411987305, "global_step": 219214, "epoch": 2641} {"train_loss": -24.482376098632812, "global_step": 219215, "epoch": 2641} {"train_loss": -24.411426544189453, "global_step": 219216, "epoch": 2641} {"train_loss": -24.3310604095459, "global_step": 219217, "epoch": 2641} {"train_loss": -24.335256576538086, "global_step": 219218, "epoch": 2641} {"train_loss": -24.40799331665039, "global_step": 219219, "epoch": 2641} {"train_loss": -24.394001007080078, "global_step": 219220, "epoch": 2641} {"train_loss": -24.24140167236328, "global_step": 219221, "epoch": 2641} {"train_loss": -24.39794158935547, "global_step": 219222, "epoch": 2641} {"train_loss": -24.90399742126465, "global_step": 219223, "epoch": 2641} {"train_loss": -24.736825942993164, "global_step": 219224, "epoch": 2641} {"train_loss": -24.58695411682129, "global_step": 219225, "epoch": 2641} {"train_loss": -24.527952194213867, "global_step": 219226, "epoch": 2641} {"train_loss": -24.38105583190918, "global_step": 219227, "epoch": 2641} {"train_loss": -24.549116134643555, "global_step": 219228, "epoch": 2641} {"train_loss": -24.617658615112305, "global_step": 219229, "epoch": 2641} {"train_loss": -24.222265243530273, "global_step": 219230, "epoch": 2641} {"train_loss": -25.153705596923828, "global_step": 219231, "epoch": 2641} {"train_loss": -24.271230697631836, "global_step": 219232, "epoch": 2641} {"train_loss": -24.597402572631836, "global_step": 219233, "epoch": 2641} {"train_loss": -24.475370407104492, "global_step": 219234, "epoch": 2641} {"train_loss": -24.382904052734375, "global_step": 219235, "epoch": 2641} {"train_loss": -24.418806076049805, "global_step": 219236, "epoch": 2641} {"train_loss": -24.43915557861328, "global_step": 219237, "epoch": 2641} {"train_loss": -24.810224533081055, "global_step": 219238, "epoch": 2641} {"train_loss": -24.517311096191406, "global_step": 219239, "epoch": 2641} {"train_loss": -24.595956802368164, "global_step": 219240, "epoch": 2641} {"train_loss": -24.58854103088379, "global_step": 219241, "epoch": 2641} {"train_loss": -24.332578659057617, "global_step": 219242, "epoch": 2641} {"train_loss": -24.200361251831055, "global_step": 219243, "epoch": 2641} {"train_loss": -24.653390884399414, "global_step": 219244, "epoch": 2641} {"train_loss": -24.22981834411621, "global_step": 219245, "epoch": 2641} {"train_loss": -24.713285446166992, "global_step": 219246, "epoch": 2641} {"train_loss": -24.457412719726562, "global_step": 219247, "epoch": 2641} {"train_loss": -23.78546714782715, "global_step": 219248, "epoch": 2641} {"train_loss": -24.362165451049805, "global_step": 219249, "epoch": 2641} {"train_loss": -24.593900680541992, "global_step": 219250, "epoch": 2641} {"train_loss": -24.59981346130371, "global_step": 219251, "epoch": 2641} {"train_loss": -24.265399932861328, "global_step": 219252, "epoch": 2641} {"train_loss": -24.72907829284668, "global_step": 219253, "epoch": 2641} {"train_loss": -24.33926773071289, "global_step": 219254, "epoch": 2641} {"train_loss": -24.628070831298828, "global_step": 219255, "epoch": 2641} {"train_loss": -24.661245346069336, "global_step": 219256, "epoch": 2641} {"train_loss": -24.56366539001465, "global_step": 219257, "epoch": 2641} {"train_loss": -24.92877769470215, "global_step": 219258, "epoch": 2641} {"train_loss": -24.6807918548584, "global_step": 219259, "epoch": 2641} {"train_loss": -24.586633682250977, "global_step": 219260, "epoch": 2641} {"train_loss": -24.828763961791992, "global_step": 219261, "epoch": 2641} {"train_loss": -24.794857025146484, "global_step": 219262, "epoch": 2641} {"train_loss": -24.60469627380371, "global_step": 219263, "epoch": 2641} {"train_loss": -24.720413208007812, "global_step": 219264, "epoch": 2641} {"train_loss": -24.758625030517578, "global_step": 219265, "epoch": 2641} {"train_loss": -24.498645782470703, "global_step": 219266, "epoch": 2641} {"train_loss": -24.402769088745117, "global_step": 219267, "epoch": 2641} {"train_loss": -24.84718132019043, "global_step": 219268, "epoch": 2641} {"train_loss": -24.7186336517334, "global_step": 219269, "epoch": 2641} {"train_loss": -24.816293716430664, "global_step": 219270, "epoch": 2641} {"train_loss": -24.470243453979492, "global_step": 219271, "epoch": 2641} {"train_loss": -24.610212326049805, "global_step": 219272, "epoch": 2641} {"train_loss": -24.408679962158203, "global_step": 219273, "epoch": 2641} {"train_loss": -24.75185775756836, "global_step": 219274, "epoch": 2641} {"train_loss": -24.631547927856445, "global_step": 219275, "epoch": 2641} {"train_loss": -24.699098587036133, "global_step": 219276, "epoch": 2641} {"train_loss": -24.576398849487305, "global_step": 219277, "epoch": 2641} {"train_loss": -24.854562759399414, "global_step": 219278, "epoch": 2641} {"train_loss": -24.780460357666016, "global_step": 219279, "epoch": 2641} {"train_loss": -24.632455825805664, "global_step": 219280, "epoch": 2641} {"train_loss": -24.633182525634766, "global_step": 219281, "epoch": 2641} {"train_loss": -24.76323127746582, "global_step": 219282, "epoch": 2641} {"train_loss": -24.69331169128418, "global_step": 219283, "epoch": 2641} {"train_loss": -24.893796920776367, "global_step": 219284, "epoch": 2641} {"train_loss": -24.485001506575617, "global_step": 219285, "epoch": 2641, "val_loss": 6586348.5} {"train_loss": -24.30824851989746, "global_step": 219286, "epoch": 2642} {"train_loss": -24.50410270690918, "global_step": 219287, "epoch": 2642} {"train_loss": -24.58082389831543, "global_step": 219288, "epoch": 2642} {"train_loss": -24.70708656311035, "global_step": 219289, "epoch": 2642} {"train_loss": -24.50189971923828, "global_step": 219290, "epoch": 2642} {"train_loss": -24.64898109436035, "global_step": 219291, "epoch": 2642} {"train_loss": -24.358373641967773, "global_step": 219292, "epoch": 2642} {"train_loss": -24.633544921875, "global_step": 219293, "epoch": 2642} {"train_loss": -24.529096603393555, "global_step": 219294, "epoch": 2642} {"train_loss": -24.466367721557617, "global_step": 219295, "epoch": 2642} {"train_loss": -24.471363067626953, "global_step": 219296, "epoch": 2642} {"train_loss": -24.174571990966797, "global_step": 219297, "epoch": 2642} {"train_loss": -24.098058700561523, "global_step": 219298, "epoch": 2642} {"train_loss": -24.404338836669922, "global_step": 219299, "epoch": 2642} {"train_loss": -24.566434860229492, "global_step": 219300, "epoch": 2642} {"train_loss": -24.70627212524414, "global_step": 219301, "epoch": 2642} {"train_loss": -24.592687606811523, "global_step": 219302, "epoch": 2642} {"train_loss": -24.322525024414062, "global_step": 219303, "epoch": 2642} {"train_loss": -24.505910873413086, "global_step": 219304, "epoch": 2642} {"train_loss": -25.071674346923828, "global_step": 219305, "epoch": 2642} {"train_loss": -24.689010620117188, "global_step": 219306, "epoch": 2642} {"train_loss": -24.479543685913086, "global_step": 219307, "epoch": 2642} {"train_loss": -24.411691665649414, "global_step": 219308, "epoch": 2642} {"train_loss": -24.645910263061523, "global_step": 219309, "epoch": 2642} {"train_loss": -24.659915924072266, "global_step": 219310, "epoch": 2642} {"train_loss": -24.738924026489258, "global_step": 219311, "epoch": 2642} {"train_loss": -24.707683563232422, "global_step": 219312, "epoch": 2642} {"train_loss": -24.42051124572754, "global_step": 219313, "epoch": 2642} {"train_loss": -24.3964786529541, "global_step": 219314, "epoch": 2642} {"train_loss": -24.712064743041992, "global_step": 219315, "epoch": 2642} {"train_loss": -24.197479248046875, "global_step": 219316, "epoch": 2642} {"train_loss": -24.548826217651367, "global_step": 219317, "epoch": 2642} {"train_loss": -24.517148971557617, "global_step": 219318, "epoch": 2642} {"train_loss": -24.518739700317383, "global_step": 219319, "epoch": 2642} {"train_loss": -24.49921989440918, "global_step": 219320, "epoch": 2642} {"train_loss": -24.35546875, "global_step": 219321, "epoch": 2642} {"train_loss": -24.414081573486328, "global_step": 219322, "epoch": 2642} {"train_loss": -24.11484146118164, "global_step": 219323, "epoch": 2642} {"train_loss": -24.605924606323242, "global_step": 219324, "epoch": 2642} {"train_loss": -24.105878829956055, "global_step": 219325, "epoch": 2642} {"train_loss": -24.66741371154785, "global_step": 219326, "epoch": 2642} {"train_loss": -24.725112915039062, "global_step": 219327, "epoch": 2642} {"train_loss": -24.489988327026367, "global_step": 219328, "epoch": 2642} {"train_loss": -24.67986488342285, "global_step": 219329, "epoch": 2642} {"train_loss": -24.80029296875, "global_step": 219330, "epoch": 2642} {"train_loss": -24.712080001831055, "global_step": 219331, "epoch": 2642} {"train_loss": -24.804067611694336, "global_step": 219332, "epoch": 2642} {"train_loss": -24.46619987487793, "global_step": 219333, "epoch": 2642} {"train_loss": -24.85765266418457, "global_step": 219334, "epoch": 2642} {"train_loss": -24.66259765625, "global_step": 219335, "epoch": 2642} {"train_loss": -24.70171356201172, "global_step": 219336, "epoch": 2642} {"train_loss": -24.479917526245117, "global_step": 219337, "epoch": 2642} {"train_loss": -24.99675178527832, "global_step": 219338, "epoch": 2642} {"train_loss": -24.60099220275879, "global_step": 219339, "epoch": 2642} {"train_loss": -25.03148078918457, "global_step": 219340, "epoch": 2642} {"train_loss": -25.10013198852539, "global_step": 219341, "epoch": 2642} {"train_loss": -24.73785972595215, "global_step": 219342, "epoch": 2642} {"train_loss": -24.85955238342285, "global_step": 219343, "epoch": 2642} {"train_loss": -24.582515716552734, "global_step": 219344, "epoch": 2642} {"train_loss": -24.414608001708984, "global_step": 219345, "epoch": 2642} {"train_loss": -24.293874740600586, "global_step": 219346, "epoch": 2642} {"train_loss": -24.572782516479492, "global_step": 219347, "epoch": 2642} {"train_loss": -24.378976821899414, "global_step": 219348, "epoch": 2642} {"train_loss": -24.200353622436523, "global_step": 219349, "epoch": 2642} {"train_loss": -24.406808853149414, "global_step": 219350, "epoch": 2642} {"train_loss": -24.820261001586914, "global_step": 219351, "epoch": 2642} {"train_loss": -24.37801170349121, "global_step": 219352, "epoch": 2642} {"train_loss": -24.525808334350586, "global_step": 219353, "epoch": 2642} {"train_loss": -24.851654052734375, "global_step": 219354, "epoch": 2642} {"train_loss": -24.689870834350586, "global_step": 219355, "epoch": 2642} {"train_loss": -24.57421875, "global_step": 219356, "epoch": 2642} {"train_loss": -24.76256561279297, "global_step": 219357, "epoch": 2642} {"train_loss": -24.512773513793945, "global_step": 219358, "epoch": 2642} {"train_loss": -24.65260887145996, "global_step": 219359, "epoch": 2642} {"train_loss": -24.74888801574707, "global_step": 219360, "epoch": 2642} {"train_loss": -24.685422897338867, "global_step": 219361, "epoch": 2642} {"train_loss": -24.887659072875977, "global_step": 219362, "epoch": 2642} {"train_loss": -24.274438858032227, "global_step": 219363, "epoch": 2642} {"train_loss": -24.442895889282227, "global_step": 219364, "epoch": 2642} {"train_loss": -24.4925537109375, "global_step": 219365, "epoch": 2642} {"train_loss": -24.93892478942871, "global_step": 219366, "epoch": 2642} {"train_loss": -24.507963180541992, "global_step": 219367, "epoch": 2642} {"train_loss": -24.56135191400367, "global_step": 219368, "epoch": 2642, "val_loss": 6704804.5} {"train_loss": -24.78385353088379, "global_step": 219369, "epoch": 2643} {"train_loss": -24.405384063720703, "global_step": 219370, "epoch": 2643} {"train_loss": -24.2764949798584, "global_step": 219371, "epoch": 2643} {"train_loss": -24.51838493347168, "global_step": 219372, "epoch": 2643} {"train_loss": -24.28788185119629, "global_step": 219373, "epoch": 2643} {"train_loss": -24.6768856048584, "global_step": 219374, "epoch": 2643} {"train_loss": -24.13409996032715, "global_step": 219375, "epoch": 2643} {"train_loss": -24.565900802612305, "global_step": 219376, "epoch": 2643} {"train_loss": -24.0824031829834, "global_step": 219377, "epoch": 2643} {"train_loss": -24.487537384033203, "global_step": 219378, "epoch": 2643} {"train_loss": -24.359588623046875, "global_step": 219379, "epoch": 2643} {"train_loss": -24.30389404296875, "global_step": 219380, "epoch": 2643} {"train_loss": -24.39092445373535, "global_step": 219381, "epoch": 2643} {"train_loss": -24.182937622070312, "global_step": 219382, "epoch": 2643} {"train_loss": -24.46504020690918, "global_step": 219383, "epoch": 2643} {"train_loss": -24.29253578186035, "global_step": 219384, "epoch": 2643} {"train_loss": -24.40157127380371, "global_step": 219385, "epoch": 2643} {"train_loss": -24.431730270385742, "global_step": 219386, "epoch": 2643} {"train_loss": -24.724750518798828, "global_step": 219387, "epoch": 2643} {"train_loss": -24.19447898864746, "global_step": 219388, "epoch": 2643} {"train_loss": -24.74092674255371, "global_step": 219389, "epoch": 2643} {"train_loss": -24.298511505126953, "global_step": 219390, "epoch": 2643} {"train_loss": -24.46209144592285, "global_step": 219391, "epoch": 2643} {"train_loss": -24.404876708984375, "global_step": 219392, "epoch": 2643} {"train_loss": -24.2045955657959, "global_step": 219393, "epoch": 2643} {"train_loss": -24.373903274536133, "global_step": 219394, "epoch": 2643} {"train_loss": -24.09406852722168, "global_step": 219395, "epoch": 2643} {"train_loss": -24.639612197875977, "global_step": 219396, "epoch": 2643} {"train_loss": -24.590524673461914, "global_step": 219397, "epoch": 2643} {"train_loss": -24.492013931274414, "global_step": 219398, "epoch": 2643} {"train_loss": -24.258134841918945, "global_step": 219399, "epoch": 2643} {"train_loss": -24.32906150817871, "global_step": 219400, "epoch": 2643} {"train_loss": -24.552204132080078, "global_step": 219401, "epoch": 2643} {"train_loss": -24.223468780517578, "global_step": 219402, "epoch": 2643} {"train_loss": -24.36195182800293, "global_step": 219403, "epoch": 2643} {"train_loss": -24.389698028564453, "global_step": 219404, "epoch": 2643} {"train_loss": -24.62713623046875, "global_step": 219405, "epoch": 2643} {"train_loss": -24.22487449645996, "global_step": 219406, "epoch": 2643} {"train_loss": -24.66637420654297, "global_step": 219407, "epoch": 2643} {"train_loss": -24.425203323364258, "global_step": 219408, "epoch": 2643} {"train_loss": -24.55354881286621, "global_step": 219409, "epoch": 2643} {"train_loss": -24.42842674255371, "global_step": 219410, "epoch": 2643} {"train_loss": -24.793909072875977, "global_step": 219411, "epoch": 2643} {"train_loss": -24.503398895263672, "global_step": 219412, "epoch": 2643} {"train_loss": -24.789203643798828, "global_step": 219413, "epoch": 2643} {"train_loss": -24.478181838989258, "global_step": 219414, "epoch": 2643} {"train_loss": -24.377099990844727, "global_step": 219415, "epoch": 2643} {"train_loss": -24.798521041870117, "global_step": 219416, "epoch": 2643} {"train_loss": -24.585317611694336, "global_step": 219417, "epoch": 2643} {"train_loss": -24.79328727722168, "global_step": 219418, "epoch": 2643} {"train_loss": -24.646305084228516, "global_step": 219419, "epoch": 2643} {"train_loss": -24.631860733032227, "global_step": 219420, "epoch": 2643} {"train_loss": -24.52264976501465, "global_step": 219421, "epoch": 2643} {"train_loss": -24.517005920410156, "global_step": 219422, "epoch": 2643} {"train_loss": -24.763660430908203, "global_step": 219423, "epoch": 2643} {"train_loss": -24.993284225463867, "global_step": 219424, "epoch": 2643} {"train_loss": -24.595172882080078, "global_step": 219425, "epoch": 2643} {"train_loss": -24.64168357849121, "global_step": 219426, "epoch": 2643} {"train_loss": -24.3903751373291, "global_step": 219427, "epoch": 2643} {"train_loss": -24.27223014831543, "global_step": 219428, "epoch": 2643} {"train_loss": -24.781604766845703, "global_step": 219429, "epoch": 2643} {"train_loss": -24.148012161254883, "global_step": 219430, "epoch": 2643} {"train_loss": -24.645910263061523, "global_step": 219431, "epoch": 2643} {"train_loss": -24.18701934814453, "global_step": 219432, "epoch": 2643} {"train_loss": -24.80511474609375, "global_step": 219433, "epoch": 2643} {"train_loss": -23.903818130493164, "global_step": 219434, "epoch": 2643} {"train_loss": -24.33966636657715, "global_step": 219435, "epoch": 2643} {"train_loss": -24.191823959350586, "global_step": 219436, "epoch": 2643} {"train_loss": -25.009244918823242, "global_step": 219437, "epoch": 2643} {"train_loss": -24.32810401916504, "global_step": 219438, "epoch": 2643} {"train_loss": -24.366567611694336, "global_step": 219439, "epoch": 2643} {"train_loss": -24.81329917907715, "global_step": 219440, "epoch": 2643} {"train_loss": -24.600072860717773, "global_step": 219441, "epoch": 2643} {"train_loss": -24.11696434020996, "global_step": 219442, "epoch": 2643} {"train_loss": -23.958417892456055, "global_step": 219443, "epoch": 2643} {"train_loss": -24.510251998901367, "global_step": 219444, "epoch": 2643} {"train_loss": -24.457565307617188, "global_step": 219445, "epoch": 2643} {"train_loss": -24.29400634765625, "global_step": 219446, "epoch": 2643} {"train_loss": -24.776113510131836, "global_step": 219447, "epoch": 2643} {"train_loss": -24.62125587463379, "global_step": 219448, "epoch": 2643} {"train_loss": -24.499042510986328, "global_step": 219449, "epoch": 2643} {"train_loss": -24.448318481445312, "global_step": 219450, "epoch": 2643} {"train_loss": -24.442129410893084, "global_step": 219451, "epoch": 2643, "val_loss": 6799022.0} {"train_loss": -20.614885330200195, "global_step": 219452, "epoch": 2644} {"train_loss": -23.611291885375977, "global_step": 219453, "epoch": 2644} {"train_loss": -20.8151798248291, "global_step": 219454, "epoch": 2644} {"train_loss": -23.061460494995117, "global_step": 219455, "epoch": 2644} {"train_loss": -22.06620216369629, "global_step": 219456, "epoch": 2644} {"train_loss": -22.96621322631836, "global_step": 219457, "epoch": 2644} {"train_loss": -23.36237907409668, "global_step": 219458, "epoch": 2644} {"train_loss": -22.688119888305664, "global_step": 219459, "epoch": 2644} {"train_loss": -23.74300193786621, "global_step": 219460, "epoch": 2644} {"train_loss": -23.74729347229004, "global_step": 219461, "epoch": 2644} {"train_loss": -22.831680297851562, "global_step": 219462, "epoch": 2644} {"train_loss": -23.3282470703125, "global_step": 219463, "epoch": 2644} {"train_loss": -23.449325561523438, "global_step": 219464, "epoch": 2644} {"train_loss": -23.809476852416992, "global_step": 219465, "epoch": 2644} {"train_loss": -23.997190475463867, "global_step": 219466, "epoch": 2644} {"train_loss": -23.468856811523438, "global_step": 219467, "epoch": 2644} {"train_loss": -23.68622398376465, "global_step": 219468, "epoch": 2644} {"train_loss": -23.970117568969727, "global_step": 219469, "epoch": 2644} {"train_loss": -23.424076080322266, "global_step": 219470, "epoch": 2644} {"train_loss": -23.63602066040039, "global_step": 219471, "epoch": 2644} {"train_loss": -23.705541610717773, "global_step": 219472, "epoch": 2644} {"train_loss": -23.81575584411621, "global_step": 219473, "epoch": 2644} {"train_loss": -23.836681365966797, "global_step": 219474, "epoch": 2644} {"train_loss": -24.115625381469727, "global_step": 219475, "epoch": 2644} {"train_loss": -23.613798141479492, "global_step": 219476, "epoch": 2644} {"train_loss": -23.77898406982422, "global_step": 219477, "epoch": 2644} {"train_loss": -23.41580581665039, "global_step": 219478, "epoch": 2644} {"train_loss": -23.35748291015625, "global_step": 219479, "epoch": 2644} {"train_loss": -24.054777145385742, "global_step": 219480, "epoch": 2644} {"train_loss": -24.028640747070312, "global_step": 219481, "epoch": 2644} {"train_loss": -23.919904708862305, "global_step": 219482, "epoch": 2644} {"train_loss": -24.2764892578125, "global_step": 219483, "epoch": 2644} {"train_loss": -24.481372833251953, "global_step": 219484, "epoch": 2644} {"train_loss": -24.216516494750977, "global_step": 219485, "epoch": 2644} {"train_loss": -24.283620834350586, "global_step": 219486, "epoch": 2644} {"train_loss": -24.184776306152344, "global_step": 219487, "epoch": 2644} {"train_loss": -24.240854263305664, "global_step": 219488, "epoch": 2644} {"train_loss": -23.972091674804688, "global_step": 219489, "epoch": 2644} {"train_loss": -23.6998291015625, "global_step": 219490, "epoch": 2644} {"train_loss": -24.270017623901367, "global_step": 219491, "epoch": 2644} {"train_loss": -24.08500099182129, "global_step": 219492, "epoch": 2644} {"train_loss": -24.33075714111328, "global_step": 219493, "epoch": 2644} {"train_loss": -24.18646240234375, "global_step": 219494, "epoch": 2644} {"train_loss": -24.860261917114258, "global_step": 219495, "epoch": 2644} {"train_loss": -24.530309677124023, "global_step": 219496, "epoch": 2644} {"train_loss": -24.59376335144043, "global_step": 219497, "epoch": 2644} {"train_loss": -24.439525604248047, "global_step": 219498, "epoch": 2644} {"train_loss": -24.372474670410156, "global_step": 219499, "epoch": 2644} {"train_loss": -24.57107925415039, "global_step": 219500, "epoch": 2644} {"train_loss": -24.351652145385742, "global_step": 219501, "epoch": 2644} {"train_loss": -24.675806045532227, "global_step": 219502, "epoch": 2644} {"train_loss": -24.742948532104492, "global_step": 219503, "epoch": 2644} {"train_loss": -24.713125228881836, "global_step": 219504, "epoch": 2644} {"train_loss": -24.469879150390625, "global_step": 219505, "epoch": 2644} {"train_loss": -24.5465087890625, "global_step": 219506, "epoch": 2644} {"train_loss": -24.661666870117188, "global_step": 219507, "epoch": 2644} {"train_loss": -24.52174949645996, "global_step": 219508, "epoch": 2644} {"train_loss": -24.642087936401367, "global_step": 219509, "epoch": 2644} {"train_loss": -24.476491928100586, "global_step": 219510, "epoch": 2644} {"train_loss": -24.705982208251953, "global_step": 219511, "epoch": 2644} {"train_loss": -24.643966674804688, "global_step": 219512, "epoch": 2644} {"train_loss": -24.202194213867188, "global_step": 219513, "epoch": 2644} {"train_loss": -24.62839698791504, "global_step": 219514, "epoch": 2644} {"train_loss": -24.5233211517334, "global_step": 219515, "epoch": 2644} {"train_loss": -24.35599136352539, "global_step": 219516, "epoch": 2644} {"train_loss": -24.569272994995117, "global_step": 219517, "epoch": 2644} {"train_loss": -24.232542037963867, "global_step": 219518, "epoch": 2644} {"train_loss": -24.60722541809082, "global_step": 219519, "epoch": 2644} {"train_loss": -24.131742477416992, "global_step": 219520, "epoch": 2644} {"train_loss": -24.4951229095459, "global_step": 219521, "epoch": 2644} {"train_loss": -24.463363647460938, "global_step": 219522, "epoch": 2644} {"train_loss": -24.625524520874023, "global_step": 219523, "epoch": 2644} {"train_loss": -24.588964462280273, "global_step": 219524, "epoch": 2644} {"train_loss": -24.713581085205078, "global_step": 219525, "epoch": 2644} {"train_loss": -24.5075740814209, "global_step": 219526, "epoch": 2644} {"train_loss": -24.529865264892578, "global_step": 219527, "epoch": 2644} {"train_loss": -24.36152458190918, "global_step": 219528, "epoch": 2644} {"train_loss": -24.74403953552246, "global_step": 219529, "epoch": 2644} {"train_loss": -24.662235260009766, "global_step": 219530, "epoch": 2644} {"train_loss": -24.835651397705078, "global_step": 219531, "epoch": 2644} {"train_loss": -24.740262985229492, "global_step": 219532, "epoch": 2644} {"train_loss": -24.952051162719727, "global_step": 219533, "epoch": 2644} {"train_loss": -24.04982980475368, "global_step": 219534, "epoch": 2644, "val_loss": 6748771.0} {"train_loss": -24.243242263793945, "global_step": 219535, "epoch": 2645} {"train_loss": -23.72225570678711, "global_step": 219536, "epoch": 2645} {"train_loss": -23.485965728759766, "global_step": 219537, "epoch": 2645} {"train_loss": -23.943531036376953, "global_step": 219538, "epoch": 2645} {"train_loss": -24.0654239654541, "global_step": 219539, "epoch": 2645} {"train_loss": -23.112125396728516, "global_step": 219540, "epoch": 2645} {"train_loss": -24.16607666015625, "global_step": 219541, "epoch": 2645} {"train_loss": -23.92530632019043, "global_step": 219542, "epoch": 2645} {"train_loss": -24.156091690063477, "global_step": 219543, "epoch": 2645} {"train_loss": -24.338960647583008, "global_step": 219544, "epoch": 2645} {"train_loss": -24.054733276367188, "global_step": 219545, "epoch": 2645} {"train_loss": -23.88575553894043, "global_step": 219546, "epoch": 2645} {"train_loss": -23.861968994140625, "global_step": 219547, "epoch": 2645} {"train_loss": -24.441200256347656, "global_step": 219548, "epoch": 2645} {"train_loss": -24.307172775268555, "global_step": 219549, "epoch": 2645} {"train_loss": -24.178983688354492, "global_step": 219550, "epoch": 2645} {"train_loss": -24.287076950073242, "global_step": 219551, "epoch": 2645} {"train_loss": -24.705366134643555, "global_step": 219552, "epoch": 2645} {"train_loss": -24.577878952026367, "global_step": 219553, "epoch": 2645} {"train_loss": -24.42289161682129, "global_step": 219554, "epoch": 2645} {"train_loss": -24.481319427490234, "global_step": 219555, "epoch": 2645} {"train_loss": -24.360395431518555, "global_step": 219556, "epoch": 2645} {"train_loss": -24.458105087280273, "global_step": 219557, "epoch": 2645} {"train_loss": -24.616825103759766, "global_step": 219558, "epoch": 2645} {"train_loss": -24.51145362854004, "global_step": 219559, "epoch": 2645} {"train_loss": -24.45279312133789, "global_step": 219560, "epoch": 2645} {"train_loss": -24.413021087646484, "global_step": 219561, "epoch": 2645} {"train_loss": -24.613361358642578, "global_step": 219562, "epoch": 2645} {"train_loss": -24.718536376953125, "global_step": 219563, "epoch": 2645} {"train_loss": -24.736007690429688, "global_step": 219564, "epoch": 2645} {"train_loss": -24.989103317260742, "global_step": 219565, "epoch": 2645} {"train_loss": -24.620656967163086, "global_step": 219566, "epoch": 2645} {"train_loss": -24.75180435180664, "global_step": 219567, "epoch": 2645} {"train_loss": -24.55558967590332, "global_step": 219568, "epoch": 2645} {"train_loss": -24.684301376342773, "global_step": 219569, "epoch": 2645} {"train_loss": -24.64240837097168, "global_step": 219570, "epoch": 2645} {"train_loss": -24.895137786865234, "global_step": 219571, "epoch": 2645} {"train_loss": -24.122041702270508, "global_step": 219572, "epoch": 2645} {"train_loss": -24.9913387298584, "global_step": 219573, "epoch": 2645} {"train_loss": -24.5690975189209, "global_step": 219574, "epoch": 2645} {"train_loss": -24.385652542114258, "global_step": 219575, "epoch": 2645} {"train_loss": -24.512920379638672, "global_step": 219576, "epoch": 2645} {"train_loss": -24.897001266479492, "global_step": 219577, "epoch": 2645} {"train_loss": -24.221031188964844, "global_step": 219578, "epoch": 2645} {"train_loss": -24.342191696166992, "global_step": 219579, "epoch": 2645} {"train_loss": -24.7115535736084, "global_step": 219580, "epoch": 2645} {"train_loss": -24.770557403564453, "global_step": 219581, "epoch": 2645} {"train_loss": -24.622587203979492, "global_step": 219582, "epoch": 2645} {"train_loss": -24.418882369995117, "global_step": 219583, "epoch": 2645} {"train_loss": -24.93245506286621, "global_step": 219584, "epoch": 2645} {"train_loss": -24.83329963684082, "global_step": 219585, "epoch": 2645} {"train_loss": -24.7363224029541, "global_step": 219586, "epoch": 2645} {"train_loss": -24.434295654296875, "global_step": 219587, "epoch": 2645} {"train_loss": -24.586523056030273, "global_step": 219588, "epoch": 2645} {"train_loss": -24.64365005493164, "global_step": 219589, "epoch": 2645} {"train_loss": -24.809309005737305, "global_step": 219590, "epoch": 2645} {"train_loss": -24.375905990600586, "global_step": 219591, "epoch": 2645} {"train_loss": -24.887039184570312, "global_step": 219592, "epoch": 2645} {"train_loss": -24.7357234954834, "global_step": 219593, "epoch": 2645} {"train_loss": -24.455053329467773, "global_step": 219594, "epoch": 2645} {"train_loss": -24.384000778198242, "global_step": 219595, "epoch": 2645} {"train_loss": -24.8837890625, "global_step": 219596, "epoch": 2645} {"train_loss": -24.81583023071289, "global_step": 219597, "epoch": 2645} {"train_loss": -24.61915397644043, "global_step": 219598, "epoch": 2645} {"train_loss": -24.626712799072266, "global_step": 219599, "epoch": 2645} {"train_loss": -24.595876693725586, "global_step": 219600, "epoch": 2645} {"train_loss": -24.600791931152344, "global_step": 219601, "epoch": 2645} {"train_loss": -24.209341049194336, "global_step": 219602, "epoch": 2645} {"train_loss": -24.348342895507812, "global_step": 219603, "epoch": 2645} {"train_loss": -24.694263458251953, "global_step": 219604, "epoch": 2645} {"train_loss": -24.34791374206543, "global_step": 219605, "epoch": 2645} {"train_loss": -24.553054809570312, "global_step": 219606, "epoch": 2645} {"train_loss": -24.524572372436523, "global_step": 219607, "epoch": 2645} {"train_loss": -24.959087371826172, "global_step": 219608, "epoch": 2645} {"train_loss": -24.70275115966797, "global_step": 219609, "epoch": 2645} {"train_loss": -24.63037109375, "global_step": 219610, "epoch": 2645} {"train_loss": -24.976560592651367, "global_step": 219611, "epoch": 2645} {"train_loss": -24.491493225097656, "global_step": 219612, "epoch": 2645} {"train_loss": -24.5988826751709, "global_step": 219613, "epoch": 2645} {"train_loss": -24.53754997253418, "global_step": 219614, "epoch": 2645} {"train_loss": -24.442922592163086, "global_step": 219615, "epoch": 2645} {"train_loss": -24.4798641204834, "global_step": 219616, "epoch": 2645} {"train_loss": -24.472632143870893, "global_step": 219617, "epoch": 2645, "val_loss": 6734273.0} {"train_loss": -24.056838989257812, "global_step": 219618, "epoch": 2646} {"train_loss": -23.7717342376709, "global_step": 219619, "epoch": 2646} {"train_loss": -24.39932632446289, "global_step": 219620, "epoch": 2646} {"train_loss": -24.163801193237305, "global_step": 219621, "epoch": 2646} {"train_loss": -23.807193756103516, "global_step": 219622, "epoch": 2646} {"train_loss": -24.342283248901367, "global_step": 219623, "epoch": 2646} {"train_loss": -23.932443618774414, "global_step": 219624, "epoch": 2646} {"train_loss": -23.974462509155273, "global_step": 219625, "epoch": 2646} {"train_loss": -24.058557510375977, "global_step": 219626, "epoch": 2646} {"train_loss": -23.941144943237305, "global_step": 219627, "epoch": 2646} {"train_loss": -24.25244140625, "global_step": 219628, "epoch": 2646} {"train_loss": -24.448129653930664, "global_step": 219629, "epoch": 2646} {"train_loss": -24.114490509033203, "global_step": 219630, "epoch": 2646} {"train_loss": -24.839902877807617, "global_step": 219631, "epoch": 2646} {"train_loss": -24.319059371948242, "global_step": 219632, "epoch": 2646} {"train_loss": -24.323671340942383, "global_step": 219633, "epoch": 2646} {"train_loss": -24.136573791503906, "global_step": 219634, "epoch": 2646} {"train_loss": -24.41263771057129, "global_step": 219635, "epoch": 2646} {"train_loss": -23.840391159057617, "global_step": 219636, "epoch": 2646} {"train_loss": -24.079801559448242, "global_step": 219637, "epoch": 2646} {"train_loss": -23.999876022338867, "global_step": 219638, "epoch": 2646} {"train_loss": -24.364538192749023, "global_step": 219639, "epoch": 2646} {"train_loss": -24.3989200592041, "global_step": 219640, "epoch": 2646} {"train_loss": -24.183320999145508, "global_step": 219641, "epoch": 2646} {"train_loss": -24.0880069732666, "global_step": 219642, "epoch": 2646} {"train_loss": -24.468351364135742, "global_step": 219643, "epoch": 2646} {"train_loss": -24.35147476196289, "global_step": 219644, "epoch": 2646} {"train_loss": -24.37611198425293, "global_step": 219645, "epoch": 2646} {"train_loss": -24.55348777770996, "global_step": 219646, "epoch": 2646} {"train_loss": -24.474592208862305, "global_step": 219647, "epoch": 2646} {"train_loss": -24.406593322753906, "global_step": 219648, "epoch": 2646} {"train_loss": -24.602415084838867, "global_step": 219649, "epoch": 2646} {"train_loss": -24.16750144958496, "global_step": 219650, "epoch": 2646} {"train_loss": -24.694625854492188, "global_step": 219651, "epoch": 2646} {"train_loss": -24.441877365112305, "global_step": 219652, "epoch": 2646} {"train_loss": -24.563098907470703, "global_step": 219653, "epoch": 2646} {"train_loss": -24.30182647705078, "global_step": 219654, "epoch": 2646} {"train_loss": -24.446069717407227, "global_step": 219655, "epoch": 2646} {"train_loss": -24.78009605407715, "global_step": 219656, "epoch": 2646} {"train_loss": -24.734195709228516, "global_step": 219657, "epoch": 2646} {"train_loss": -24.55388832092285, "global_step": 219658, "epoch": 2646} {"train_loss": -24.6745548248291, "global_step": 219659, "epoch": 2646} {"train_loss": -24.625349044799805, "global_step": 219660, "epoch": 2646} {"train_loss": -24.842748641967773, "global_step": 219661, "epoch": 2646} {"train_loss": -24.34739112854004, "global_step": 219662, "epoch": 2646} {"train_loss": -24.342313766479492, "global_step": 219663, "epoch": 2646} {"train_loss": -24.822961807250977, "global_step": 219664, "epoch": 2646} {"train_loss": -24.622669219970703, "global_step": 219665, "epoch": 2646} {"train_loss": -24.83755874633789, "global_step": 219666, "epoch": 2646} {"train_loss": -24.20199966430664, "global_step": 219667, "epoch": 2646} {"train_loss": -24.57867431640625, "global_step": 219668, "epoch": 2646} {"train_loss": -24.827411651611328, "global_step": 219669, "epoch": 2646} {"train_loss": -24.95778465270996, "global_step": 219670, "epoch": 2646} {"train_loss": -24.47023582458496, "global_step": 219671, "epoch": 2646} {"train_loss": -24.901573181152344, "global_step": 219672, "epoch": 2646} {"train_loss": -24.242097854614258, "global_step": 219673, "epoch": 2646} {"train_loss": -24.49970054626465, "global_step": 219674, "epoch": 2646} {"train_loss": -24.375070571899414, "global_step": 219675, "epoch": 2646} {"train_loss": -24.69782829284668, "global_step": 219676, "epoch": 2646} {"train_loss": -24.705434799194336, "global_step": 219677, "epoch": 2646} {"train_loss": -24.69065284729004, "global_step": 219678, "epoch": 2646} {"train_loss": -24.5656681060791, "global_step": 219679, "epoch": 2646} {"train_loss": -24.576602935791016, "global_step": 219680, "epoch": 2646} {"train_loss": -24.661455154418945, "global_step": 219681, "epoch": 2646} {"train_loss": -24.586183547973633, "global_step": 219682, "epoch": 2646} {"train_loss": -24.724592208862305, "global_step": 219683, "epoch": 2646} {"train_loss": -25.06499481201172, "global_step": 219684, "epoch": 2646} {"train_loss": -24.579090118408203, "global_step": 219685, "epoch": 2646} {"train_loss": -24.587848663330078, "global_step": 219686, "epoch": 2646} {"train_loss": -24.704111099243164, "global_step": 219687, "epoch": 2646} {"train_loss": -24.23847770690918, "global_step": 219688, "epoch": 2646} {"train_loss": -24.377685546875, "global_step": 219689, "epoch": 2646} {"train_loss": -24.341962814331055, "global_step": 219690, "epoch": 2646} {"train_loss": -24.516063690185547, "global_step": 219691, "epoch": 2646} {"train_loss": -24.676647186279297, "global_step": 219692, "epoch": 2646} {"train_loss": -24.80775260925293, "global_step": 219693, "epoch": 2646} {"train_loss": -24.738056182861328, "global_step": 219694, "epoch": 2646} {"train_loss": -24.70278549194336, "global_step": 219695, "epoch": 2646} {"train_loss": -24.747926712036133, "global_step": 219696, "epoch": 2646} {"train_loss": -24.618085861206055, "global_step": 219697, "epoch": 2646} {"train_loss": -24.710315704345703, "global_step": 219698, "epoch": 2646} {"train_loss": -24.450815200805664, "global_step": 219699, "epoch": 2646} {"train_loss": -24.447820479611316, "global_step": 219700, "epoch": 2646, "val_loss": 6569810.0} {"train_loss": -24.542898178100586, "global_step": 219701, "epoch": 2647} {"train_loss": -24.431102752685547, "global_step": 219702, "epoch": 2647} {"train_loss": -23.991281509399414, "global_step": 219703, "epoch": 2647} {"train_loss": -24.397550582885742, "global_step": 219704, "epoch": 2647} {"train_loss": -24.638526916503906, "global_step": 219705, "epoch": 2647} {"train_loss": -24.08090591430664, "global_step": 219706, "epoch": 2647} {"train_loss": -24.261234283447266, "global_step": 219707, "epoch": 2647} {"train_loss": -23.866025924682617, "global_step": 219708, "epoch": 2647} {"train_loss": -24.803091049194336, "global_step": 219709, "epoch": 2647} {"train_loss": -24.372907638549805, "global_step": 219710, "epoch": 2647} {"train_loss": -24.115909576416016, "global_step": 219711, "epoch": 2647} {"train_loss": -24.19732666015625, "global_step": 219712, "epoch": 2647} {"train_loss": -24.060205459594727, "global_step": 219713, "epoch": 2647} {"train_loss": -24.38222312927246, "global_step": 219714, "epoch": 2647} {"train_loss": -24.49444007873535, "global_step": 219715, "epoch": 2647} {"train_loss": -24.343236923217773, "global_step": 219716, "epoch": 2647} {"train_loss": -24.267480850219727, "global_step": 219717, "epoch": 2647} {"train_loss": -24.609939575195312, "global_step": 219718, "epoch": 2647} {"train_loss": -24.45710563659668, "global_step": 219719, "epoch": 2647} {"train_loss": -24.532304763793945, "global_step": 219720, "epoch": 2647} {"train_loss": -24.578561782836914, "global_step": 219721, "epoch": 2647} {"train_loss": -24.85856056213379, "global_step": 219722, "epoch": 2647} {"train_loss": -24.753284454345703, "global_step": 219723, "epoch": 2647} {"train_loss": -24.456714630126953, "global_step": 219724, "epoch": 2647} {"train_loss": -24.810482025146484, "global_step": 219725, "epoch": 2647} {"train_loss": -24.22879409790039, "global_step": 219726, "epoch": 2647} {"train_loss": -24.43718910217285, "global_step": 219727, "epoch": 2647} {"train_loss": -24.72562599182129, "global_step": 219728, "epoch": 2647} {"train_loss": -24.36298370361328, "global_step": 219729, "epoch": 2647} {"train_loss": -24.422147750854492, "global_step": 219730, "epoch": 2647} {"train_loss": -25.047710418701172, "global_step": 219731, "epoch": 2647} {"train_loss": -24.903703689575195, "global_step": 219732, "epoch": 2647} {"train_loss": -24.61097526550293, "global_step": 219733, "epoch": 2647} {"train_loss": -24.44281578063965, "global_step": 219734, "epoch": 2647} {"train_loss": -24.65108299255371, "global_step": 219735, "epoch": 2647} {"train_loss": -24.712034225463867, "global_step": 219736, "epoch": 2647} {"train_loss": -24.753461837768555, "global_step": 219737, "epoch": 2647} {"train_loss": -24.885929107666016, "global_step": 219738, "epoch": 2647} {"train_loss": -24.57574462890625, "global_step": 219739, "epoch": 2647} {"train_loss": -24.758207321166992, "global_step": 219740, "epoch": 2647} {"train_loss": -25.015878677368164, "global_step": 219741, "epoch": 2647} {"train_loss": -24.707996368408203, "global_step": 219742, "epoch": 2647} {"train_loss": -24.935657501220703, "global_step": 219743, "epoch": 2647} {"train_loss": -24.733793258666992, "global_step": 219744, "epoch": 2647} {"train_loss": -24.404176712036133, "global_step": 219745, "epoch": 2647} {"train_loss": -24.266550064086914, "global_step": 219746, "epoch": 2647} {"train_loss": -24.628753662109375, "global_step": 219747, "epoch": 2647} {"train_loss": -24.787527084350586, "global_step": 219748, "epoch": 2647} {"train_loss": -24.827234268188477, "global_step": 219749, "epoch": 2647} {"train_loss": -24.346582412719727, "global_step": 219750, "epoch": 2647} {"train_loss": -24.709980010986328, "global_step": 219751, "epoch": 2647} {"train_loss": -24.651350021362305, "global_step": 219752, "epoch": 2647} {"train_loss": -24.78120994567871, "global_step": 219753, "epoch": 2647} {"train_loss": -24.532333374023438, "global_step": 219754, "epoch": 2647} {"train_loss": -24.485572814941406, "global_step": 219755, "epoch": 2647} {"train_loss": -25.182416915893555, "global_step": 219756, "epoch": 2647} {"train_loss": -24.494033813476562, "global_step": 219757, "epoch": 2647} {"train_loss": -24.209354400634766, "global_step": 219758, "epoch": 2647} {"train_loss": -24.983686447143555, "global_step": 219759, "epoch": 2647} {"train_loss": -24.419538497924805, "global_step": 219760, "epoch": 2647} {"train_loss": -24.813024520874023, "global_step": 219761, "epoch": 2647} {"train_loss": -24.674884796142578, "global_step": 219762, "epoch": 2647} {"train_loss": -24.25033950805664, "global_step": 219763, "epoch": 2647} {"train_loss": -24.29437828063965, "global_step": 219764, "epoch": 2647} {"train_loss": -24.45258903503418, "global_step": 219765, "epoch": 2647} {"train_loss": -24.134977340698242, "global_step": 219766, "epoch": 2647} {"train_loss": -23.7225341796875, "global_step": 219767, "epoch": 2647} {"train_loss": -24.090574264526367, "global_step": 219768, "epoch": 2647} {"train_loss": -24.267169952392578, "global_step": 219769, "epoch": 2647} {"train_loss": -24.30580711364746, "global_step": 219770, "epoch": 2647} {"train_loss": -23.953744888305664, "global_step": 219771, "epoch": 2647} {"train_loss": -24.128747940063477, "global_step": 219772, "epoch": 2647} {"train_loss": -24.280685424804688, "global_step": 219773, "epoch": 2647} {"train_loss": -24.6510066986084, "global_step": 219774, "epoch": 2647} {"train_loss": -24.225454330444336, "global_step": 219775, "epoch": 2647} {"train_loss": -24.59568214416504, "global_step": 219776, "epoch": 2647} {"train_loss": -24.392406463623047, "global_step": 219777, "epoch": 2647} {"train_loss": -24.346113204956055, "global_step": 219778, "epoch": 2647} {"train_loss": -24.185562133789062, "global_step": 219779, "epoch": 2647} {"train_loss": -24.45777702331543, "global_step": 219780, "epoch": 2647} {"train_loss": -24.265966415405273, "global_step": 219781, "epoch": 2647} {"train_loss": -24.131988525390625, "global_step": 219782, "epoch": 2647} {"train_loss": -24.48502575058535, "global_step": 219783, "epoch": 2647, "val_loss": 6614492.5} {"train_loss": -23.511093139648438, "global_step": 219784, "epoch": 2648} {"train_loss": -24.3866024017334, "global_step": 219785, "epoch": 2648} {"train_loss": -24.090839385986328, "global_step": 219786, "epoch": 2648} {"train_loss": -24.267332077026367, "global_step": 219787, "epoch": 2648} {"train_loss": -24.571022033691406, "global_step": 219788, "epoch": 2648} {"train_loss": -24.4423828125, "global_step": 219789, "epoch": 2648} {"train_loss": -24.342538833618164, "global_step": 219790, "epoch": 2648} {"train_loss": -24.628707885742188, "global_step": 219791, "epoch": 2648} {"train_loss": -24.094818115234375, "global_step": 219792, "epoch": 2648} {"train_loss": -24.767614364624023, "global_step": 219793, "epoch": 2648} {"train_loss": -24.45721435546875, "global_step": 219794, "epoch": 2648} {"train_loss": -24.679588317871094, "global_step": 219795, "epoch": 2648} {"train_loss": -23.806352615356445, "global_step": 219796, "epoch": 2648} {"train_loss": -24.172727584838867, "global_step": 219797, "epoch": 2648} {"train_loss": -24.338781356811523, "global_step": 219798, "epoch": 2648} {"train_loss": -24.186386108398438, "global_step": 219799, "epoch": 2648} {"train_loss": -24.897811889648438, "global_step": 219800, "epoch": 2648} {"train_loss": -24.467077255249023, "global_step": 219801, "epoch": 2648} {"train_loss": -24.351482391357422, "global_step": 219802, "epoch": 2648} {"train_loss": -24.565187454223633, "global_step": 219803, "epoch": 2648} {"train_loss": -24.375534057617188, "global_step": 219804, "epoch": 2648} {"train_loss": -24.62111473083496, "global_step": 219805, "epoch": 2648} {"train_loss": -24.50648307800293, "global_step": 219806, "epoch": 2648} {"train_loss": -24.403202056884766, "global_step": 219807, "epoch": 2648} {"train_loss": -24.421817779541016, "global_step": 219808, "epoch": 2648} {"train_loss": -24.438512802124023, "global_step": 219809, "epoch": 2648} {"train_loss": -24.52025032043457, "global_step": 219810, "epoch": 2648} {"train_loss": -24.537002563476562, "global_step": 219811, "epoch": 2648} {"train_loss": -24.377784729003906, "global_step": 219812, "epoch": 2648} {"train_loss": -24.432300567626953, "global_step": 219813, "epoch": 2648} {"train_loss": -24.487720489501953, "global_step": 219814, "epoch": 2648} {"train_loss": -24.198699951171875, "global_step": 219815, "epoch": 2648} {"train_loss": -24.537599563598633, "global_step": 219816, "epoch": 2648} {"train_loss": -24.31301498413086, "global_step": 219817, "epoch": 2648} {"train_loss": -24.395841598510742, "global_step": 219818, "epoch": 2648} {"train_loss": -24.356231689453125, "global_step": 219819, "epoch": 2648} {"train_loss": -24.180612564086914, "global_step": 219820, "epoch": 2648} {"train_loss": -24.18836784362793, "global_step": 219821, "epoch": 2648} {"train_loss": -24.62731170654297, "global_step": 219822, "epoch": 2648} {"train_loss": -24.556005477905273, "global_step": 219823, "epoch": 2648} {"train_loss": -24.13779067993164, "global_step": 219824, "epoch": 2648} {"train_loss": -24.793277740478516, "global_step": 219825, "epoch": 2648} {"train_loss": -24.885862350463867, "global_step": 219826, "epoch": 2648} {"train_loss": -24.448287963867188, "global_step": 219827, "epoch": 2648} {"train_loss": -24.60500144958496, "global_step": 219828, "epoch": 2648} {"train_loss": -24.73963737487793, "global_step": 219829, "epoch": 2648} {"train_loss": -24.564960479736328, "global_step": 219830, "epoch": 2648} {"train_loss": -24.61123275756836, "global_step": 219831, "epoch": 2648} {"train_loss": -24.41559410095215, "global_step": 219832, "epoch": 2648} {"train_loss": -24.565595626831055, "global_step": 219833, "epoch": 2648} {"train_loss": -24.41008186340332, "global_step": 219834, "epoch": 2648} {"train_loss": -24.52547836303711, "global_step": 219835, "epoch": 2648} {"train_loss": -24.560636520385742, "global_step": 219836, "epoch": 2648} {"train_loss": -24.695737838745117, "global_step": 219837, "epoch": 2648} {"train_loss": -24.59706687927246, "global_step": 219838, "epoch": 2648} {"train_loss": -24.409284591674805, "global_step": 219839, "epoch": 2648} {"train_loss": -24.390966415405273, "global_step": 219840, "epoch": 2648} {"train_loss": -24.86530113220215, "global_step": 219841, "epoch": 2648} {"train_loss": -24.71474266052246, "global_step": 219842, "epoch": 2648} {"train_loss": -24.899198532104492, "global_step": 219843, "epoch": 2648} {"train_loss": -24.523527145385742, "global_step": 219844, "epoch": 2648} {"train_loss": -24.37887954711914, "global_step": 219845, "epoch": 2648} {"train_loss": -24.608678817749023, "global_step": 219846, "epoch": 2648} {"train_loss": -24.39214515686035, "global_step": 219847, "epoch": 2648} {"train_loss": -24.562063217163086, "global_step": 219848, "epoch": 2648} {"train_loss": -24.813291549682617, "global_step": 219849, "epoch": 2648} {"train_loss": -24.578304290771484, "global_step": 219850, "epoch": 2648} {"train_loss": -24.955459594726562, "global_step": 219851, "epoch": 2648} {"train_loss": -24.45417594909668, "global_step": 219852, "epoch": 2648} {"train_loss": -24.84511375427246, "global_step": 219853, "epoch": 2648} {"train_loss": -24.748153686523438, "global_step": 219854, "epoch": 2648} {"train_loss": -24.803882598876953, "global_step": 219855, "epoch": 2648} {"train_loss": -24.652189254760742, "global_step": 219856, "epoch": 2648} {"train_loss": -24.569734573364258, "global_step": 219857, "epoch": 2648} {"train_loss": -24.664453506469727, "global_step": 219858, "epoch": 2648} {"train_loss": -24.78028678894043, "global_step": 219859, "epoch": 2648} {"train_loss": -24.49247169494629, "global_step": 219860, "epoch": 2648} {"train_loss": -24.6505069732666, "global_step": 219861, "epoch": 2648} {"train_loss": -24.549251556396484, "global_step": 219862, "epoch": 2648} {"train_loss": -23.974395751953125, "global_step": 219863, "epoch": 2648} {"train_loss": -24.230756759643555, "global_step": 219864, "epoch": 2648} {"train_loss": -24.571813583374023, "global_step": 219865, "epoch": 2648} {"train_loss": -24.486216878316487, "global_step": 219866, "epoch": 2648, "val_loss": 6798496.0} {"train_loss": -24.29670524597168, "global_step": 219867, "epoch": 2649} {"train_loss": -24.639745712280273, "global_step": 219868, "epoch": 2649} {"train_loss": -24.550800323486328, "global_step": 219869, "epoch": 2649} {"train_loss": -24.001005172729492, "global_step": 219870, "epoch": 2649} {"train_loss": -24.154443740844727, "global_step": 219871, "epoch": 2649} {"train_loss": -24.392194747924805, "global_step": 219872, "epoch": 2649} {"train_loss": -24.32761573791504, "global_step": 219873, "epoch": 2649} {"train_loss": -24.304855346679688, "global_step": 219874, "epoch": 2649} {"train_loss": -24.57670783996582, "global_step": 219875, "epoch": 2649} {"train_loss": -24.141836166381836, "global_step": 219876, "epoch": 2649} {"train_loss": -24.096757888793945, "global_step": 219877, "epoch": 2649} {"train_loss": -24.641279220581055, "global_step": 219878, "epoch": 2649} {"train_loss": -24.35202407836914, "global_step": 219879, "epoch": 2649} {"train_loss": -24.420413970947266, "global_step": 219880, "epoch": 2649} {"train_loss": -24.54483985900879, "global_step": 219881, "epoch": 2649} {"train_loss": -24.068655014038086, "global_step": 219882, "epoch": 2649} {"train_loss": -24.408340454101562, "global_step": 219883, "epoch": 2649} {"train_loss": -24.563745498657227, "global_step": 219884, "epoch": 2649} {"train_loss": -24.737913131713867, "global_step": 219885, "epoch": 2649} {"train_loss": -24.41023063659668, "global_step": 219886, "epoch": 2649} {"train_loss": -24.466848373413086, "global_step": 219887, "epoch": 2649} {"train_loss": -24.640146255493164, "global_step": 219888, "epoch": 2649} {"train_loss": -24.692445755004883, "global_step": 219889, "epoch": 2649} {"train_loss": -24.750520706176758, "global_step": 219890, "epoch": 2649} {"train_loss": -24.77825164794922, "global_step": 219891, "epoch": 2649} {"train_loss": -24.461734771728516, "global_step": 219892, "epoch": 2649} {"train_loss": -24.353729248046875, "global_step": 219893, "epoch": 2649} {"train_loss": -24.532346725463867, "global_step": 219894, "epoch": 2649} {"train_loss": -24.751758575439453, "global_step": 219895, "epoch": 2649} {"train_loss": -24.143644332885742, "global_step": 219896, "epoch": 2649} {"train_loss": -24.38144302368164, "global_step": 219897, "epoch": 2649} {"train_loss": -25.13655662536621, "global_step": 219898, "epoch": 2649} {"train_loss": -24.5830078125, "global_step": 219899, "epoch": 2649} {"train_loss": -24.560453414916992, "global_step": 219900, "epoch": 2649} {"train_loss": -24.69445037841797, "global_step": 219901, "epoch": 2649} {"train_loss": -24.891965866088867, "global_step": 219902, "epoch": 2649} {"train_loss": -24.725433349609375, "global_step": 219903, "epoch": 2649} {"train_loss": -24.748533248901367, "global_step": 219904, "epoch": 2649} {"train_loss": -24.6601619720459, "global_step": 219905, "epoch": 2649} {"train_loss": -24.37126350402832, "global_step": 219906, "epoch": 2649} {"train_loss": -24.915895462036133, "global_step": 219907, "epoch": 2649} {"train_loss": -24.757226943969727, "global_step": 219908, "epoch": 2649} {"train_loss": -24.473291397094727, "global_step": 219909, "epoch": 2649} {"train_loss": -24.676973342895508, "global_step": 219910, "epoch": 2649} {"train_loss": -24.37698745727539, "global_step": 219911, "epoch": 2649} {"train_loss": -24.738950729370117, "global_step": 219912, "epoch": 2649} {"train_loss": -24.60431480407715, "global_step": 219913, "epoch": 2649} {"train_loss": -24.510297775268555, "global_step": 219914, "epoch": 2649} {"train_loss": -24.61060905456543, "global_step": 219915, "epoch": 2649} {"train_loss": -24.2818660736084, "global_step": 219916, "epoch": 2649} {"train_loss": -24.544103622436523, "global_step": 219917, "epoch": 2649} {"train_loss": -24.595308303833008, "global_step": 219918, "epoch": 2649} {"train_loss": -24.602584838867188, "global_step": 219919, "epoch": 2649} {"train_loss": -24.643131256103516, "global_step": 219920, "epoch": 2649} {"train_loss": -24.453704833984375, "global_step": 219921, "epoch": 2649} {"train_loss": -24.388153076171875, "global_step": 219922, "epoch": 2649} {"train_loss": -24.572132110595703, "global_step": 219923, "epoch": 2649} {"train_loss": -24.927396774291992, "global_step": 219924, "epoch": 2649} {"train_loss": -24.323274612426758, "global_step": 219925, "epoch": 2649} {"train_loss": -24.60515594482422, "global_step": 219926, "epoch": 2649} {"train_loss": -24.50276756286621, "global_step": 219927, "epoch": 2649} {"train_loss": -24.903276443481445, "global_step": 219928, "epoch": 2649} {"train_loss": -24.419370651245117, "global_step": 219929, "epoch": 2649} {"train_loss": -24.97771453857422, "global_step": 219930, "epoch": 2649} {"train_loss": -24.427471160888672, "global_step": 219931, "epoch": 2649} {"train_loss": -24.246557235717773, "global_step": 219932, "epoch": 2649} {"train_loss": -24.435394287109375, "global_step": 219933, "epoch": 2649} {"train_loss": -24.716217041015625, "global_step": 219934, "epoch": 2649} {"train_loss": -24.532852172851562, "global_step": 219935, "epoch": 2649} {"train_loss": -24.592945098876953, "global_step": 219936, "epoch": 2649} {"train_loss": -24.377626419067383, "global_step": 219937, "epoch": 2649} {"train_loss": -24.584579467773438, "global_step": 219938, "epoch": 2649} {"train_loss": -24.78264617919922, "global_step": 219939, "epoch": 2649} {"train_loss": -24.337894439697266, "global_step": 219940, "epoch": 2649} {"train_loss": -24.8756103515625, "global_step": 219941, "epoch": 2649} {"train_loss": -24.610370635986328, "global_step": 219942, "epoch": 2649} {"train_loss": -24.48727035522461, "global_step": 219943, "epoch": 2649} {"train_loss": -24.804641723632812, "global_step": 219944, "epoch": 2649} {"train_loss": -24.449939727783203, "global_step": 219945, "epoch": 2649} {"train_loss": -24.605215072631836, "global_step": 219946, "epoch": 2649} {"train_loss": -24.70015525817871, "global_step": 219947, "epoch": 2649} {"train_loss": -24.605222702026367, "global_step": 219948, "epoch": 2649} {"train_loss": -24.557264236082514, "global_step": 219949, "epoch": 2649, "val_loss": 6661906.0} {"train_loss": -24.058759689331055, "global_step": 219950, "epoch": 2650} {"train_loss": -24.113801956176758, "global_step": 219951, "epoch": 2650} {"train_loss": -23.9440975189209, "global_step": 219952, "epoch": 2650} {"train_loss": -24.3321590423584, "global_step": 219953, "epoch": 2650} {"train_loss": -24.095245361328125, "global_step": 219954, "epoch": 2650} {"train_loss": -23.864913940429688, "global_step": 219955, "epoch": 2650} {"train_loss": -24.378005981445312, "global_step": 219956, "epoch": 2650} {"train_loss": -24.45741844177246, "global_step": 219957, "epoch": 2650} {"train_loss": -24.38728141784668, "global_step": 219958, "epoch": 2650} {"train_loss": -24.23885154724121, "global_step": 219959, "epoch": 2650} {"train_loss": -24.43695068359375, "global_step": 219960, "epoch": 2650} {"train_loss": -24.217172622680664, "global_step": 219961, "epoch": 2650} {"train_loss": -24.291738510131836, "global_step": 219962, "epoch": 2650} {"train_loss": -24.131486892700195, "global_step": 219963, "epoch": 2650} {"train_loss": -24.8128662109375, "global_step": 219964, "epoch": 2650} {"train_loss": -24.755325317382812, "global_step": 219965, "epoch": 2650} {"train_loss": -24.190229415893555, "global_step": 219966, "epoch": 2650} {"train_loss": -24.42795181274414, "global_step": 219967, "epoch": 2650} {"train_loss": -24.46785545349121, "global_step": 219968, "epoch": 2650} {"train_loss": -24.556615829467773, "global_step": 219969, "epoch": 2650} {"train_loss": -24.402950286865234, "global_step": 219970, "epoch": 2650} {"train_loss": -24.686790466308594, "global_step": 219971, "epoch": 2650} {"train_loss": -24.358627319335938, "global_step": 219972, "epoch": 2650} {"train_loss": -24.246545791625977, "global_step": 219973, "epoch": 2650} {"train_loss": -24.479068756103516, "global_step": 219974, "epoch": 2650} {"train_loss": -24.613183975219727, "global_step": 219975, "epoch": 2650} {"train_loss": -24.613555908203125, "global_step": 219976, "epoch": 2650} {"train_loss": -24.445505142211914, "global_step": 219977, "epoch": 2650} {"train_loss": -24.84500503540039, "global_step": 219978, "epoch": 2650} {"train_loss": -24.72457504272461, "global_step": 219979, "epoch": 2650} {"train_loss": -24.540069580078125, "global_step": 219980, "epoch": 2650} {"train_loss": -24.88176918029785, "global_step": 219981, "epoch": 2650} {"train_loss": -24.626636505126953, "global_step": 219982, "epoch": 2650} {"train_loss": -24.952852249145508, "global_step": 219983, "epoch": 2650} {"train_loss": -24.80204200744629, "global_step": 219984, "epoch": 2650} {"train_loss": -24.496097564697266, "global_step": 219985, "epoch": 2650} {"train_loss": -24.496051788330078, "global_step": 219986, "epoch": 2650} {"train_loss": -24.736968994140625, "global_step": 219987, "epoch": 2650} {"train_loss": -24.488845825195312, "global_step": 219988, "epoch": 2650} {"train_loss": -24.970996856689453, "global_step": 219989, "epoch": 2650} {"train_loss": -25.015968322753906, "global_step": 219990, "epoch": 2650} {"train_loss": -24.749744415283203, "global_step": 219991, "epoch": 2650} {"train_loss": -24.801786422729492, "global_step": 219992, "epoch": 2650} {"train_loss": -24.956396102905273, "global_step": 219993, "epoch": 2650} {"train_loss": -24.384048461914062, "global_step": 219994, "epoch": 2650} {"train_loss": -23.97477149963379, "global_step": 219995, "epoch": 2650} {"train_loss": -23.702070236206055, "global_step": 219996, "epoch": 2650} {"train_loss": -23.25906753540039, "global_step": 219997, "epoch": 2650} {"train_loss": -23.55780601501465, "global_step": 219998, "epoch": 2650} {"train_loss": -24.327917098999023, "global_step": 219999, "epoch": 2650} {"train_loss": -23.662656784057617, "global_step": 220000, "epoch": 2650} {"train_loss": -24.546663284301758, "global_step": 220001, "epoch": 2650} {"train_loss": -24.330350875854492, "global_step": 220002, "epoch": 2650} {"train_loss": -24.029767990112305, "global_step": 220003, "epoch": 2650} {"train_loss": -24.310016632080078, "global_step": 220004, "epoch": 2650} {"train_loss": -24.046913146972656, "global_step": 220005, "epoch": 2650} {"train_loss": -24.56062126159668, "global_step": 220006, "epoch": 2650} {"train_loss": -24.123046875, "global_step": 220007, "epoch": 2650} {"train_loss": -24.49015998840332, "global_step": 220008, "epoch": 2650} {"train_loss": -24.245080947875977, "global_step": 220009, "epoch": 2650} {"train_loss": -24.031034469604492, "global_step": 220010, "epoch": 2650} {"train_loss": -24.489622116088867, "global_step": 220011, "epoch": 2650} {"train_loss": -24.483840942382812, "global_step": 220012, "epoch": 2650} {"train_loss": -24.4215030670166, "global_step": 220013, "epoch": 2650} {"train_loss": -24.220691680908203, "global_step": 220014, "epoch": 2650} {"train_loss": -24.474292755126953, "global_step": 220015, "epoch": 2650} {"train_loss": -24.3315486907959, "global_step": 220016, "epoch": 2650} {"train_loss": -24.508567810058594, "global_step": 220017, "epoch": 2650} {"train_loss": -24.347517013549805, "global_step": 220018, "epoch": 2650} {"train_loss": -24.56842041015625, "global_step": 220019, "epoch": 2650} {"train_loss": -24.198591232299805, "global_step": 220020, "epoch": 2650} {"train_loss": -24.2395076751709, "global_step": 220021, "epoch": 2650} {"train_loss": -24.6512508392334, "global_step": 220022, "epoch": 2650} {"train_loss": -24.598745346069336, "global_step": 220023, "epoch": 2650} {"train_loss": -24.527463912963867, "global_step": 220024, "epoch": 2650} {"train_loss": -24.698415756225586, "global_step": 220025, "epoch": 2650} {"train_loss": -24.53413963317871, "global_step": 220026, "epoch": 2650} {"train_loss": -24.678701400756836, "global_step": 220027, "epoch": 2650} {"train_loss": -24.684301376342773, "global_step": 220028, "epoch": 2650} {"train_loss": -24.79800796508789, "global_step": 220029, "epoch": 2650} {"train_loss": -24.767414093017578, "global_step": 220030, "epoch": 2650} {"train_loss": -24.77338981628418, "global_step": 220031, "epoch": 2650} {"train_loss": -24.413689762712963, "global_step": 220032, "epoch": 2650, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6496211.0} {"train_loss": -24.751455307006836, "global_step": 220033, "epoch": 2651} {"train_loss": -23.92393684387207, "global_step": 220034, "epoch": 2651} {"train_loss": -24.34000587463379, "global_step": 220035, "epoch": 2651} {"train_loss": -24.354022979736328, "global_step": 220036, "epoch": 2651} {"train_loss": -24.408044815063477, "global_step": 220037, "epoch": 2651} {"train_loss": -24.459569931030273, "global_step": 220038, "epoch": 2651} {"train_loss": -24.417078018188477, "global_step": 220039, "epoch": 2651} {"train_loss": -24.68240737915039, "global_step": 220040, "epoch": 2651} {"train_loss": -24.391096115112305, "global_step": 220041, "epoch": 2651} {"train_loss": -24.426639556884766, "global_step": 220042, "epoch": 2651} {"train_loss": -24.33260726928711, "global_step": 220043, "epoch": 2651} {"train_loss": -24.55267333984375, "global_step": 220044, "epoch": 2651} {"train_loss": -24.654483795166016, "global_step": 220045, "epoch": 2651} {"train_loss": -24.49540138244629, "global_step": 220046, "epoch": 2651} {"train_loss": -24.32901382446289, "global_step": 220047, "epoch": 2651} {"train_loss": -24.827062606811523, "global_step": 220048, "epoch": 2651} {"train_loss": -24.66482925415039, "global_step": 220049, "epoch": 2651} {"train_loss": -24.693769454956055, "global_step": 220050, "epoch": 2651} {"train_loss": -24.89474105834961, "global_step": 220051, "epoch": 2651} {"train_loss": -24.613893508911133, "global_step": 220052, "epoch": 2651} {"train_loss": -24.44921112060547, "global_step": 220053, "epoch": 2651} {"train_loss": -24.54191780090332, "global_step": 220054, "epoch": 2651} {"train_loss": -24.50977897644043, "global_step": 220055, "epoch": 2651} {"train_loss": -24.80782127380371, "global_step": 220056, "epoch": 2651} {"train_loss": -24.526700973510742, "global_step": 220057, "epoch": 2651} {"train_loss": -24.20017433166504, "global_step": 220058, "epoch": 2651} {"train_loss": -24.05536651611328, "global_step": 220059, "epoch": 2651} {"train_loss": -24.37750816345215, "global_step": 220060, "epoch": 2651} {"train_loss": -24.318254470825195, "global_step": 220061, "epoch": 2651} {"train_loss": -24.1840763092041, "global_step": 220062, "epoch": 2651} {"train_loss": -24.28520393371582, "global_step": 220063, "epoch": 2651} {"train_loss": -24.314048767089844, "global_step": 220064, "epoch": 2651} {"train_loss": -24.66617202758789, "global_step": 220065, "epoch": 2651} {"train_loss": -24.524208068847656, "global_step": 220066, "epoch": 2651} {"train_loss": -24.63839340209961, "global_step": 220067, "epoch": 2651} {"train_loss": -24.742862701416016, "global_step": 220068, "epoch": 2651} {"train_loss": -24.33966636657715, "global_step": 220069, "epoch": 2651} {"train_loss": -24.86528968811035, "global_step": 220070, "epoch": 2651} {"train_loss": -24.667966842651367, "global_step": 220071, "epoch": 2651} {"train_loss": -24.611526489257812, "global_step": 220072, "epoch": 2651} {"train_loss": -24.997329711914062, "global_step": 220073, "epoch": 2651} {"train_loss": -24.12080955505371, "global_step": 220074, "epoch": 2651} {"train_loss": -24.2000732421875, "global_step": 220075, "epoch": 2651} {"train_loss": -24.63905143737793, "global_step": 220076, "epoch": 2651} {"train_loss": -24.3671817779541, "global_step": 220077, "epoch": 2651} {"train_loss": -24.0768985748291, "global_step": 220078, "epoch": 2651} {"train_loss": -24.51007652282715, "global_step": 220079, "epoch": 2651} {"train_loss": -24.43735122680664, "global_step": 220080, "epoch": 2651} {"train_loss": -24.704336166381836, "global_step": 220081, "epoch": 2651} {"train_loss": -24.289884567260742, "global_step": 220082, "epoch": 2651} {"train_loss": -24.287939071655273, "global_step": 220083, "epoch": 2651} {"train_loss": -24.47882652282715, "global_step": 220084, "epoch": 2651} {"train_loss": -25.065153121948242, "global_step": 220085, "epoch": 2651} {"train_loss": -24.43450355529785, "global_step": 220086, "epoch": 2651} {"train_loss": -24.931503295898438, "global_step": 220087, "epoch": 2651} {"train_loss": -24.985454559326172, "global_step": 220088, "epoch": 2651} {"train_loss": -24.897031784057617, "global_step": 220089, "epoch": 2651} {"train_loss": -24.538198471069336, "global_step": 220090, "epoch": 2651} {"train_loss": -24.471269607543945, "global_step": 220091, "epoch": 2651} {"train_loss": -24.740354537963867, "global_step": 220092, "epoch": 2651} {"train_loss": -24.471097946166992, "global_step": 220093, "epoch": 2651} {"train_loss": -24.96225357055664, "global_step": 220094, "epoch": 2651} {"train_loss": -24.97456169128418, "global_step": 220095, "epoch": 2651} {"train_loss": -25.06312370300293, "global_step": 220096, "epoch": 2651} {"train_loss": -24.811019897460938, "global_step": 220097, "epoch": 2651} {"train_loss": -24.826068878173828, "global_step": 220098, "epoch": 2651} {"train_loss": -25.08391571044922, "global_step": 220099, "epoch": 2651} {"train_loss": -24.653440475463867, "global_step": 220100, "epoch": 2651} {"train_loss": -24.96344566345215, "global_step": 220101, "epoch": 2651} {"train_loss": -24.914093017578125, "global_step": 220102, "epoch": 2651} {"train_loss": -24.973880767822266, "global_step": 220103, "epoch": 2651} {"train_loss": -24.742069244384766, "global_step": 220104, "epoch": 2651} {"train_loss": -24.812780380249023, "global_step": 220105, "epoch": 2651} {"train_loss": -25.117507934570312, "global_step": 220106, "epoch": 2651} {"train_loss": -24.476354598999023, "global_step": 220107, "epoch": 2651} {"train_loss": -24.622821807861328, "global_step": 220108, "epoch": 2651} {"train_loss": -24.585485458374023, "global_step": 220109, "epoch": 2651} {"train_loss": -24.632482528686523, "global_step": 220110, "epoch": 2651} {"train_loss": -24.27646827697754, "global_step": 220111, "epoch": 2651} {"train_loss": -24.658653259277344, "global_step": 220112, "epoch": 2651} {"train_loss": -24.295368194580078, "global_step": 220113, "epoch": 2651} {"train_loss": -24.607759475708008, "global_step": 220114, "epoch": 2651} {"train_loss": -24.573579213705408, "global_step": 220115, "epoch": 2651, "val_loss": 6738420.0} {"train_loss": -22.55558204650879, "global_step": 220116, "epoch": 2652} {"train_loss": -22.482696533203125, "global_step": 220117, "epoch": 2652} {"train_loss": -23.02607536315918, "global_step": 220118, "epoch": 2652} {"train_loss": -22.485212326049805, "global_step": 220119, "epoch": 2652} {"train_loss": -23.55171775817871, "global_step": 220120, "epoch": 2652} {"train_loss": -23.07908058166504, "global_step": 220121, "epoch": 2652} {"train_loss": -23.96198844909668, "global_step": 220122, "epoch": 2652} {"train_loss": -23.46278953552246, "global_step": 220123, "epoch": 2652} {"train_loss": -24.145263671875, "global_step": 220124, "epoch": 2652} {"train_loss": -23.894033432006836, "global_step": 220125, "epoch": 2652} {"train_loss": -23.9328670501709, "global_step": 220126, "epoch": 2652} {"train_loss": -23.600202560424805, "global_step": 220127, "epoch": 2652} {"train_loss": -24.15494728088379, "global_step": 220128, "epoch": 2652} {"train_loss": -24.01156997680664, "global_step": 220129, "epoch": 2652} {"train_loss": -24.033214569091797, "global_step": 220130, "epoch": 2652} {"train_loss": -23.791889190673828, "global_step": 220131, "epoch": 2652} {"train_loss": -23.93134880065918, "global_step": 220132, "epoch": 2652} {"train_loss": -24.306440353393555, "global_step": 220133, "epoch": 2652} {"train_loss": -24.161054611206055, "global_step": 220134, "epoch": 2652} {"train_loss": -23.80684471130371, "global_step": 220135, "epoch": 2652} {"train_loss": -24.152128219604492, "global_step": 220136, "epoch": 2652} {"train_loss": -24.4339656829834, "global_step": 220137, "epoch": 2652} {"train_loss": -24.167800903320312, "global_step": 220138, "epoch": 2652} {"train_loss": -24.507095336914062, "global_step": 220139, "epoch": 2652} {"train_loss": -24.129240036010742, "global_step": 220140, "epoch": 2652} {"train_loss": -24.33656883239746, "global_step": 220141, "epoch": 2652} {"train_loss": -24.419408798217773, "global_step": 220142, "epoch": 2652} {"train_loss": -24.346511840820312, "global_step": 220143, "epoch": 2652} {"train_loss": -24.266925811767578, "global_step": 220144, "epoch": 2652} {"train_loss": -24.600055694580078, "global_step": 220145, "epoch": 2652} {"train_loss": -24.85652732849121, "global_step": 220146, "epoch": 2652} {"train_loss": -24.4691104888916, "global_step": 220147, "epoch": 2652} {"train_loss": -24.47073745727539, "global_step": 220148, "epoch": 2652} {"train_loss": -24.407358169555664, "global_step": 220149, "epoch": 2652} {"train_loss": -24.518709182739258, "global_step": 220150, "epoch": 2652} {"train_loss": -24.273786544799805, "global_step": 220151, "epoch": 2652} {"train_loss": -24.226734161376953, "global_step": 220152, "epoch": 2652} {"train_loss": -24.478891372680664, "global_step": 220153, "epoch": 2652} {"train_loss": -24.93524742126465, "global_step": 220154, "epoch": 2652} {"train_loss": -24.621200561523438, "global_step": 220155, "epoch": 2652} {"train_loss": -24.732038497924805, "global_step": 220156, "epoch": 2652} {"train_loss": -24.937326431274414, "global_step": 220157, "epoch": 2652} {"train_loss": -24.613346099853516, "global_step": 220158, "epoch": 2652} {"train_loss": -24.715301513671875, "global_step": 220159, "epoch": 2652} {"train_loss": -24.52454948425293, "global_step": 220160, "epoch": 2652} {"train_loss": -24.62228775024414, "global_step": 220161, "epoch": 2652} {"train_loss": -24.610248565673828, "global_step": 220162, "epoch": 2652} {"train_loss": -24.569595336914062, "global_step": 220163, "epoch": 2652} {"train_loss": -24.346691131591797, "global_step": 220164, "epoch": 2652} {"train_loss": -24.760005950927734, "global_step": 220165, "epoch": 2652} {"train_loss": -24.629545211791992, "global_step": 220166, "epoch": 2652} {"train_loss": -25.106460571289062, "global_step": 220167, "epoch": 2652} {"train_loss": -24.306440353393555, "global_step": 220168, "epoch": 2652} {"train_loss": -24.58163833618164, "global_step": 220169, "epoch": 2652} {"train_loss": -24.618473052978516, "global_step": 220170, "epoch": 2652} {"train_loss": -24.679031372070312, "global_step": 220171, "epoch": 2652} {"train_loss": -24.836904525756836, "global_step": 220172, "epoch": 2652} {"train_loss": -24.928890228271484, "global_step": 220173, "epoch": 2652} {"train_loss": -24.620798110961914, "global_step": 220174, "epoch": 2652} {"train_loss": -24.702138900756836, "global_step": 220175, "epoch": 2652} {"train_loss": -24.74016571044922, "global_step": 220176, "epoch": 2652} {"train_loss": -24.738765716552734, "global_step": 220177, "epoch": 2652} {"train_loss": -24.52048683166504, "global_step": 220178, "epoch": 2652} {"train_loss": -24.72627067565918, "global_step": 220179, "epoch": 2652} {"train_loss": -24.779279708862305, "global_step": 220180, "epoch": 2652} {"train_loss": -24.704187393188477, "global_step": 220181, "epoch": 2652} {"train_loss": -24.794458389282227, "global_step": 220182, "epoch": 2652} {"train_loss": -24.578472137451172, "global_step": 220183, "epoch": 2652} {"train_loss": -24.533126831054688, "global_step": 220184, "epoch": 2652} {"train_loss": -24.589818954467773, "global_step": 220185, "epoch": 2652} {"train_loss": -24.70235824584961, "global_step": 220186, "epoch": 2652} {"train_loss": -24.896533966064453, "global_step": 220187, "epoch": 2652} {"train_loss": -24.70623207092285, "global_step": 220188, "epoch": 2652} {"train_loss": -24.962003707885742, "global_step": 220189, "epoch": 2652} {"train_loss": -25.07497215270996, "global_step": 220190, "epoch": 2652} {"train_loss": -24.882856369018555, "global_step": 220191, "epoch": 2652} {"train_loss": -25.030546188354492, "global_step": 220192, "epoch": 2652} {"train_loss": -24.961389541625977, "global_step": 220193, "epoch": 2652} {"train_loss": -24.894681930541992, "global_step": 220194, "epoch": 2652} {"train_loss": -24.686491012573242, "global_step": 220195, "epoch": 2652} {"train_loss": -24.359132766723633, "global_step": 220196, "epoch": 2652} {"train_loss": -24.11318016052246, "global_step": 220197, "epoch": 2652} {"train_loss": -24.377130186701397, "global_step": 220198, "epoch": 2652, "val_loss": 6603781.5} {"train_loss": -22.436819076538086, "global_step": 220199, "epoch": 2653} {"train_loss": -19.914310455322266, "global_step": 220200, "epoch": 2653} {"train_loss": -21.799619674682617, "global_step": 220201, "epoch": 2653} {"train_loss": -22.777524948120117, "global_step": 220202, "epoch": 2653} {"train_loss": -22.24510955810547, "global_step": 220203, "epoch": 2653} {"train_loss": -22.96138572692871, "global_step": 220204, "epoch": 2653} {"train_loss": -22.527603149414062, "global_step": 220205, "epoch": 2653} {"train_loss": -22.70075798034668, "global_step": 220206, "epoch": 2653} {"train_loss": -23.39932632446289, "global_step": 220207, "epoch": 2653} {"train_loss": -23.085878372192383, "global_step": 220208, "epoch": 2653} {"train_loss": -23.174367904663086, "global_step": 220209, "epoch": 2653} {"train_loss": -23.206815719604492, "global_step": 220210, "epoch": 2653} {"train_loss": -23.255939483642578, "global_step": 220211, "epoch": 2653} {"train_loss": -23.0542049407959, "global_step": 220212, "epoch": 2653} {"train_loss": -23.342126846313477, "global_step": 220213, "epoch": 2653} {"train_loss": -23.39176368713379, "global_step": 220214, "epoch": 2653} {"train_loss": -23.379730224609375, "global_step": 220215, "epoch": 2653} {"train_loss": -23.356786727905273, "global_step": 220216, "epoch": 2653} {"train_loss": -23.79420280456543, "global_step": 220217, "epoch": 2653} {"train_loss": -23.42083168029785, "global_step": 220218, "epoch": 2653} {"train_loss": -23.479263305664062, "global_step": 220219, "epoch": 2653} {"train_loss": -23.5783634185791, "global_step": 220220, "epoch": 2653} {"train_loss": -23.339584350585938, "global_step": 220221, "epoch": 2653} {"train_loss": -23.904272079467773, "global_step": 220222, "epoch": 2653} {"train_loss": -23.814443588256836, "global_step": 220223, "epoch": 2653} {"train_loss": -23.83906364440918, "global_step": 220224, "epoch": 2653} {"train_loss": -24.166385650634766, "global_step": 220225, "epoch": 2653} {"train_loss": -23.787796020507812, "global_step": 220226, "epoch": 2653} {"train_loss": -24.09490203857422, "global_step": 220227, "epoch": 2653} {"train_loss": -23.863866806030273, "global_step": 220228, "epoch": 2653} {"train_loss": -24.087560653686523, "global_step": 220229, "epoch": 2653} {"train_loss": -24.302282333374023, "global_step": 220230, "epoch": 2653} {"train_loss": -24.349943161010742, "global_step": 220231, "epoch": 2653} {"train_loss": -24.09785270690918, "global_step": 220232, "epoch": 2653} {"train_loss": -24.29193687438965, "global_step": 220233, "epoch": 2653} {"train_loss": -24.574899673461914, "global_step": 220234, "epoch": 2653} {"train_loss": -24.33674430847168, "global_step": 220235, "epoch": 2653} {"train_loss": -24.434457778930664, "global_step": 220236, "epoch": 2653} {"train_loss": -24.30759620666504, "global_step": 220237, "epoch": 2653} {"train_loss": -24.657426834106445, "global_step": 220238, "epoch": 2653} {"train_loss": -24.437833786010742, "global_step": 220239, "epoch": 2653} {"train_loss": -24.53788185119629, "global_step": 220240, "epoch": 2653} {"train_loss": -24.671234130859375, "global_step": 220241, "epoch": 2653} {"train_loss": -24.354753494262695, "global_step": 220242, "epoch": 2653} {"train_loss": -24.31846046447754, "global_step": 220243, "epoch": 2653} {"train_loss": -24.619354248046875, "global_step": 220244, "epoch": 2653} {"train_loss": -24.714916229248047, "global_step": 220245, "epoch": 2653} {"train_loss": -25.03677749633789, "global_step": 220246, "epoch": 2653} {"train_loss": -24.394010543823242, "global_step": 220247, "epoch": 2653} {"train_loss": -24.534765243530273, "global_step": 220248, "epoch": 2653} {"train_loss": -24.52577781677246, "global_step": 220249, "epoch": 2653} {"train_loss": -24.843891143798828, "global_step": 220250, "epoch": 2653} {"train_loss": -24.50331687927246, "global_step": 220251, "epoch": 2653} {"train_loss": -24.51403045654297, "global_step": 220252, "epoch": 2653} {"train_loss": -24.40846824645996, "global_step": 220253, "epoch": 2653} {"train_loss": -24.83335304260254, "global_step": 220254, "epoch": 2653} {"train_loss": -24.56515884399414, "global_step": 220255, "epoch": 2653} {"train_loss": -24.50518798828125, "global_step": 220256, "epoch": 2653} {"train_loss": -24.80864715576172, "global_step": 220257, "epoch": 2653} {"train_loss": -24.769140243530273, "global_step": 220258, "epoch": 2653} {"train_loss": -24.78085708618164, "global_step": 220259, "epoch": 2653} {"train_loss": -25.500913619995117, "global_step": 220260, "epoch": 2653} {"train_loss": -24.710376739501953, "global_step": 220261, "epoch": 2653} {"train_loss": -24.60529136657715, "global_step": 220262, "epoch": 2653} {"train_loss": -24.574087142944336, "global_step": 220263, "epoch": 2653} {"train_loss": -24.7369327545166, "global_step": 220264, "epoch": 2653} {"train_loss": -24.5952091217041, "global_step": 220265, "epoch": 2653} {"train_loss": -24.30782127380371, "global_step": 220266, "epoch": 2653} {"train_loss": -24.514822006225586, "global_step": 220267, "epoch": 2653} {"train_loss": -24.5339298248291, "global_step": 220268, "epoch": 2653} {"train_loss": -24.940628051757812, "global_step": 220269, "epoch": 2653} {"train_loss": -24.645689010620117, "global_step": 220270, "epoch": 2653} {"train_loss": -24.64131736755371, "global_step": 220271, "epoch": 2653} {"train_loss": -24.899290084838867, "global_step": 220272, "epoch": 2653} {"train_loss": -24.447158813476562, "global_step": 220273, "epoch": 2653} {"train_loss": -24.6351318359375, "global_step": 220274, "epoch": 2653} {"train_loss": -24.715301513671875, "global_step": 220275, "epoch": 2653} {"train_loss": -24.851871490478516, "global_step": 220276, "epoch": 2653} {"train_loss": -24.528732299804688, "global_step": 220277, "epoch": 2653} {"train_loss": -24.969594955444336, "global_step": 220278, "epoch": 2653} {"train_loss": -24.660329818725586, "global_step": 220279, "epoch": 2653} {"train_loss": -24.808502197265625, "global_step": 220280, "epoch": 2653} {"train_loss": -24.09014566260648, "global_step": 220281, "epoch": 2653, "val_loss": 6611645.0} {"train_loss": -22.753019332885742, "global_step": 220282, "epoch": 2654} {"train_loss": -23.189882278442383, "global_step": 220283, "epoch": 2654} {"train_loss": -24.111751556396484, "global_step": 220284, "epoch": 2654} {"train_loss": -23.4028377532959, "global_step": 220285, "epoch": 2654} {"train_loss": -23.588523864746094, "global_step": 220286, "epoch": 2654} {"train_loss": -23.95178985595703, "global_step": 220287, "epoch": 2654} {"train_loss": -23.473876953125, "global_step": 220288, "epoch": 2654} {"train_loss": -24.132705688476562, "global_step": 220289, "epoch": 2654} {"train_loss": -24.23988914489746, "global_step": 220290, "epoch": 2654} {"train_loss": -23.841642379760742, "global_step": 220291, "epoch": 2654} {"train_loss": -24.62607192993164, "global_step": 220292, "epoch": 2654} {"train_loss": -24.245941162109375, "global_step": 220293, "epoch": 2654} {"train_loss": -24.24995231628418, "global_step": 220294, "epoch": 2654} {"train_loss": -24.068283081054688, "global_step": 220295, "epoch": 2654} {"train_loss": -24.26210594177246, "global_step": 220296, "epoch": 2654} {"train_loss": -24.12213134765625, "global_step": 220297, "epoch": 2654} {"train_loss": -24.243818283081055, "global_step": 220298, "epoch": 2654} {"train_loss": -24.25137710571289, "global_step": 220299, "epoch": 2654} {"train_loss": -24.162208557128906, "global_step": 220300, "epoch": 2654} {"train_loss": -24.0205135345459, "global_step": 220301, "epoch": 2654} {"train_loss": -24.369550704956055, "global_step": 220302, "epoch": 2654} {"train_loss": -24.188968658447266, "global_step": 220303, "epoch": 2654} {"train_loss": -24.46303367614746, "global_step": 220304, "epoch": 2654} {"train_loss": -24.275800704956055, "global_step": 220305, "epoch": 2654} {"train_loss": -24.378511428833008, "global_step": 220306, "epoch": 2654} {"train_loss": -24.4940128326416, "global_step": 220307, "epoch": 2654} {"train_loss": -24.59775733947754, "global_step": 220308, "epoch": 2654} {"train_loss": -24.702177047729492, "global_step": 220309, "epoch": 2654} {"train_loss": -24.482990264892578, "global_step": 220310, "epoch": 2654} {"train_loss": -24.725000381469727, "global_step": 220311, "epoch": 2654} {"train_loss": -24.574575424194336, "global_step": 220312, "epoch": 2654} {"train_loss": -24.536624908447266, "global_step": 220313, "epoch": 2654} {"train_loss": -24.02128028869629, "global_step": 220314, "epoch": 2654} {"train_loss": -24.764266967773438, "global_step": 220315, "epoch": 2654} {"train_loss": -24.54768943786621, "global_step": 220316, "epoch": 2654} {"train_loss": -24.50417709350586, "global_step": 220317, "epoch": 2654} {"train_loss": -24.484399795532227, "global_step": 220318, "epoch": 2654} {"train_loss": -24.50185775756836, "global_step": 220319, "epoch": 2654} {"train_loss": -24.470869064331055, "global_step": 220320, "epoch": 2654} {"train_loss": -24.506118774414062, "global_step": 220321, "epoch": 2654} {"train_loss": -24.52919578552246, "global_step": 220322, "epoch": 2654} {"train_loss": -24.369047164916992, "global_step": 220323, "epoch": 2654} {"train_loss": -24.09440040588379, "global_step": 220324, "epoch": 2654} {"train_loss": -24.76796531677246, "global_step": 220325, "epoch": 2654} {"train_loss": -24.750682830810547, "global_step": 220326, "epoch": 2654} {"train_loss": -24.754436492919922, "global_step": 220327, "epoch": 2654} {"train_loss": -25.018924713134766, "global_step": 220328, "epoch": 2654} {"train_loss": -24.5199031829834, "global_step": 220329, "epoch": 2654} {"train_loss": -24.883861541748047, "global_step": 220330, "epoch": 2654} {"train_loss": -24.5336856842041, "global_step": 220331, "epoch": 2654} {"train_loss": -24.629039764404297, "global_step": 220332, "epoch": 2654} {"train_loss": -24.949596405029297, "global_step": 220333, "epoch": 2654} {"train_loss": -24.382558822631836, "global_step": 220334, "epoch": 2654} {"train_loss": -24.768260955810547, "global_step": 220335, "epoch": 2654} {"train_loss": -24.889341354370117, "global_step": 220336, "epoch": 2654} {"train_loss": -24.64072608947754, "global_step": 220337, "epoch": 2654} {"train_loss": -24.816267013549805, "global_step": 220338, "epoch": 2654} {"train_loss": -24.456899642944336, "global_step": 220339, "epoch": 2654} {"train_loss": -24.508214950561523, "global_step": 220340, "epoch": 2654} {"train_loss": -24.384225845336914, "global_step": 220341, "epoch": 2654} {"train_loss": -24.394760131835938, "global_step": 220342, "epoch": 2654} {"train_loss": -24.622344970703125, "global_step": 220343, "epoch": 2654} {"train_loss": -24.317895889282227, "global_step": 220344, "epoch": 2654} {"train_loss": -24.575016021728516, "global_step": 220345, "epoch": 2654} {"train_loss": -24.27716636657715, "global_step": 220346, "epoch": 2654} {"train_loss": -24.2285099029541, "global_step": 220347, "epoch": 2654} {"train_loss": -24.488311767578125, "global_step": 220348, "epoch": 2654} {"train_loss": -24.536535263061523, "global_step": 220349, "epoch": 2654} {"train_loss": -24.245094299316406, "global_step": 220350, "epoch": 2654} {"train_loss": -24.11407470703125, "global_step": 220351, "epoch": 2654} {"train_loss": -24.647634506225586, "global_step": 220352, "epoch": 2654} {"train_loss": -24.323307037353516, "global_step": 220353, "epoch": 2654} {"train_loss": -24.345916748046875, "global_step": 220354, "epoch": 2654} {"train_loss": -24.920154571533203, "global_step": 220355, "epoch": 2654} {"train_loss": -25.15764045715332, "global_step": 220356, "epoch": 2654} {"train_loss": -24.70612335205078, "global_step": 220357, "epoch": 2654} {"train_loss": -24.39439582824707, "global_step": 220358, "epoch": 2654} {"train_loss": -24.426572799682617, "global_step": 220359, "epoch": 2654} {"train_loss": -24.57590675354004, "global_step": 220360, "epoch": 2654} {"train_loss": -24.33294677734375, "global_step": 220361, "epoch": 2654} {"train_loss": -24.58155632019043, "global_step": 220362, "epoch": 2654} {"train_loss": -24.33487319946289, "global_step": 220363, "epoch": 2654} {"train_loss": -24.38764792752553, "global_step": 220364, "epoch": 2654, "val_loss": 6802163.0} {"train_loss": -24.384397506713867, "global_step": 220365, "epoch": 2655} {"train_loss": -23.96993637084961, "global_step": 220366, "epoch": 2655} {"train_loss": -24.40081787109375, "global_step": 220367, "epoch": 2655} {"train_loss": -24.247272491455078, "global_step": 220368, "epoch": 2655} {"train_loss": -24.09273338317871, "global_step": 220369, "epoch": 2655} {"train_loss": -24.417346954345703, "global_step": 220370, "epoch": 2655} {"train_loss": -24.3544979095459, "global_step": 220371, "epoch": 2655} {"train_loss": -24.02481460571289, "global_step": 220372, "epoch": 2655} {"train_loss": -24.229618072509766, "global_step": 220373, "epoch": 2655} {"train_loss": -24.51589012145996, "global_step": 220374, "epoch": 2655} {"train_loss": -24.376998901367188, "global_step": 220375, "epoch": 2655} {"train_loss": -24.4310245513916, "global_step": 220376, "epoch": 2655} {"train_loss": -24.493459701538086, "global_step": 220377, "epoch": 2655} {"train_loss": -24.143705368041992, "global_step": 220378, "epoch": 2655} {"train_loss": -24.5566463470459, "global_step": 220379, "epoch": 2655} {"train_loss": -24.62562370300293, "global_step": 220380, "epoch": 2655} {"train_loss": -24.718521118164062, "global_step": 220381, "epoch": 2655} {"train_loss": -24.280385971069336, "global_step": 220382, "epoch": 2655} {"train_loss": -24.5577392578125, "global_step": 220383, "epoch": 2655} {"train_loss": -24.565265655517578, "global_step": 220384, "epoch": 2655} {"train_loss": -24.268217086791992, "global_step": 220385, "epoch": 2655} {"train_loss": -24.412601470947266, "global_step": 220386, "epoch": 2655} {"train_loss": -24.6724910736084, "global_step": 220387, "epoch": 2655} {"train_loss": -24.2597713470459, "global_step": 220388, "epoch": 2655} {"train_loss": -24.84312629699707, "global_step": 220389, "epoch": 2655} {"train_loss": -24.59427261352539, "global_step": 220390, "epoch": 2655} {"train_loss": -24.721282958984375, "global_step": 220391, "epoch": 2655} {"train_loss": -24.946147918701172, "global_step": 220392, "epoch": 2655} {"train_loss": -25.232126235961914, "global_step": 220393, "epoch": 2655} {"train_loss": -24.520198822021484, "global_step": 220394, "epoch": 2655} {"train_loss": -24.830968856811523, "global_step": 220395, "epoch": 2655} {"train_loss": -24.79730796813965, "global_step": 220396, "epoch": 2655} {"train_loss": -24.544513702392578, "global_step": 220397, "epoch": 2655} {"train_loss": -24.555034637451172, "global_step": 220398, "epoch": 2655} {"train_loss": -24.686185836791992, "global_step": 220399, "epoch": 2655} {"train_loss": -24.844114303588867, "global_step": 220400, "epoch": 2655} {"train_loss": -24.3765869140625, "global_step": 220401, "epoch": 2655} {"train_loss": -24.645292282104492, "global_step": 220402, "epoch": 2655} {"train_loss": -24.295001983642578, "global_step": 220403, "epoch": 2655} {"train_loss": -24.721540451049805, "global_step": 220404, "epoch": 2655} {"train_loss": -24.526016235351562, "global_step": 220405, "epoch": 2655} {"train_loss": -24.579315185546875, "global_step": 220406, "epoch": 2655} {"train_loss": -24.692155838012695, "global_step": 220407, "epoch": 2655} {"train_loss": -25.132888793945312, "global_step": 220408, "epoch": 2655} {"train_loss": -24.407855987548828, "global_step": 220409, "epoch": 2655} {"train_loss": -24.538434982299805, "global_step": 220410, "epoch": 2655} {"train_loss": -24.582067489624023, "global_step": 220411, "epoch": 2655} {"train_loss": -24.887401580810547, "global_step": 220412, "epoch": 2655} {"train_loss": -24.85433006286621, "global_step": 220413, "epoch": 2655} {"train_loss": -24.849618911743164, "global_step": 220414, "epoch": 2655} {"train_loss": -24.329696655273438, "global_step": 220415, "epoch": 2655} {"train_loss": -24.63418197631836, "global_step": 220416, "epoch": 2655} {"train_loss": -24.517719268798828, "global_step": 220417, "epoch": 2655} {"train_loss": -24.54720115661621, "global_step": 220418, "epoch": 2655} {"train_loss": -24.14252281188965, "global_step": 220419, "epoch": 2655} {"train_loss": -24.547061920166016, "global_step": 220420, "epoch": 2655} {"train_loss": -24.910531997680664, "global_step": 220421, "epoch": 2655} {"train_loss": -24.67629051208496, "global_step": 220422, "epoch": 2655} {"train_loss": -24.82160186767578, "global_step": 220423, "epoch": 2655} {"train_loss": -24.484088897705078, "global_step": 220424, "epoch": 2655} {"train_loss": -24.3339786529541, "global_step": 220425, "epoch": 2655} {"train_loss": -24.487064361572266, "global_step": 220426, "epoch": 2655} {"train_loss": -24.473188400268555, "global_step": 220427, "epoch": 2655} {"train_loss": -24.406494140625, "global_step": 220428, "epoch": 2655} {"train_loss": -24.200170516967773, "global_step": 220429, "epoch": 2655} {"train_loss": -24.67441749572754, "global_step": 220430, "epoch": 2655} {"train_loss": -25.09315299987793, "global_step": 220431, "epoch": 2655} {"train_loss": -24.549339294433594, "global_step": 220432, "epoch": 2655} {"train_loss": -24.71727752685547, "global_step": 220433, "epoch": 2655} {"train_loss": -25.06049156188965, "global_step": 220434, "epoch": 2655} {"train_loss": -24.413745880126953, "global_step": 220435, "epoch": 2655} {"train_loss": -24.844770431518555, "global_step": 220436, "epoch": 2655} {"train_loss": -24.71320915222168, "global_step": 220437, "epoch": 2655} {"train_loss": -24.946475982666016, "global_step": 220438, "epoch": 2655} {"train_loss": -24.635950088500977, "global_step": 220439, "epoch": 2655} {"train_loss": -24.824628829956055, "global_step": 220440, "epoch": 2655} {"train_loss": -24.688783645629883, "global_step": 220441, "epoch": 2655} {"train_loss": -24.697860717773438, "global_step": 220442, "epoch": 2655} {"train_loss": -24.58966636657715, "global_step": 220443, "epoch": 2655} {"train_loss": -24.410993576049805, "global_step": 220444, "epoch": 2655} {"train_loss": -24.774478912353516, "global_step": 220445, "epoch": 2655} {"train_loss": -24.605621337890625, "global_step": 220446, "epoch": 2655} {"train_loss": -24.552421225122657, "global_step": 220447, "epoch": 2655, "val_loss": 6719060.0} {"train_loss": -21.993696212768555, "global_step": 220448, "epoch": 2656} {"train_loss": -21.2780704498291, "global_step": 220449, "epoch": 2656} {"train_loss": -23.201303482055664, "global_step": 220450, "epoch": 2656} {"train_loss": -23.316085815429688, "global_step": 220451, "epoch": 2656} {"train_loss": -23.891469955444336, "global_step": 220452, "epoch": 2656} {"train_loss": -23.823278427124023, "global_step": 220453, "epoch": 2656} {"train_loss": -23.560876846313477, "global_step": 220454, "epoch": 2656} {"train_loss": -23.763025283813477, "global_step": 220455, "epoch": 2656} {"train_loss": -24.130346298217773, "global_step": 220456, "epoch": 2656} {"train_loss": -24.254018783569336, "global_step": 220457, "epoch": 2656} {"train_loss": -23.79404640197754, "global_step": 220458, "epoch": 2656} {"train_loss": -23.998014450073242, "global_step": 220459, "epoch": 2656} {"train_loss": -23.760623931884766, "global_step": 220460, "epoch": 2656} {"train_loss": -24.330707550048828, "global_step": 220461, "epoch": 2656} {"train_loss": -24.001585006713867, "global_step": 220462, "epoch": 2656} {"train_loss": -24.197507858276367, "global_step": 220463, "epoch": 2656} {"train_loss": -24.1262264251709, "global_step": 220464, "epoch": 2656} {"train_loss": -23.84492301940918, "global_step": 220465, "epoch": 2656} {"train_loss": -23.97981071472168, "global_step": 220466, "epoch": 2656} {"train_loss": -23.981008529663086, "global_step": 220467, "epoch": 2656} {"train_loss": -24.076135635375977, "global_step": 220468, "epoch": 2656} {"train_loss": -24.25844383239746, "global_step": 220469, "epoch": 2656} {"train_loss": -24.624418258666992, "global_step": 220470, "epoch": 2656} {"train_loss": -24.271194458007812, "global_step": 220471, "epoch": 2656} {"train_loss": -24.408681869506836, "global_step": 220472, "epoch": 2656} {"train_loss": -24.55782127380371, "global_step": 220473, "epoch": 2656} {"train_loss": -24.13554573059082, "global_step": 220474, "epoch": 2656} {"train_loss": -24.66585350036621, "global_step": 220475, "epoch": 2656} {"train_loss": -24.613529205322266, "global_step": 220476, "epoch": 2656} {"train_loss": -24.219099044799805, "global_step": 220477, "epoch": 2656} {"train_loss": -24.45355987548828, "global_step": 220478, "epoch": 2656} {"train_loss": -24.52434730529785, "global_step": 220479, "epoch": 2656} {"train_loss": -24.85329818725586, "global_step": 220480, "epoch": 2656} {"train_loss": -24.51796531677246, "global_step": 220481, "epoch": 2656} {"train_loss": -24.600812911987305, "global_step": 220482, "epoch": 2656} {"train_loss": -24.50613784790039, "global_step": 220483, "epoch": 2656} {"train_loss": -24.458694458007812, "global_step": 220484, "epoch": 2656} {"train_loss": -24.45456886291504, "global_step": 220485, "epoch": 2656} {"train_loss": -24.813140869140625, "global_step": 220486, "epoch": 2656} {"train_loss": -24.463916778564453, "global_step": 220487, "epoch": 2656} {"train_loss": -24.591508865356445, "global_step": 220488, "epoch": 2656} {"train_loss": -24.659271240234375, "global_step": 220489, "epoch": 2656} {"train_loss": -24.478429794311523, "global_step": 220490, "epoch": 2656} {"train_loss": -24.936635971069336, "global_step": 220491, "epoch": 2656} {"train_loss": -24.748092651367188, "global_step": 220492, "epoch": 2656} {"train_loss": -25.115449905395508, "global_step": 220493, "epoch": 2656} {"train_loss": -24.620241165161133, "global_step": 220494, "epoch": 2656} {"train_loss": -24.5418643951416, "global_step": 220495, "epoch": 2656} {"train_loss": -24.919118881225586, "global_step": 220496, "epoch": 2656} {"train_loss": -24.77614402770996, "global_step": 220497, "epoch": 2656} {"train_loss": -25.094724655151367, "global_step": 220498, "epoch": 2656} {"train_loss": -25.022539138793945, "global_step": 220499, "epoch": 2656} {"train_loss": -24.875051498413086, "global_step": 220500, "epoch": 2656} {"train_loss": -24.971858978271484, "global_step": 220501, "epoch": 2656} {"train_loss": -24.440961837768555, "global_step": 220502, "epoch": 2656} {"train_loss": -24.792673110961914, "global_step": 220503, "epoch": 2656} {"train_loss": -24.69767189025879, "global_step": 220504, "epoch": 2656} {"train_loss": -24.359270095825195, "global_step": 220505, "epoch": 2656} {"train_loss": -25.037580490112305, "global_step": 220506, "epoch": 2656} {"train_loss": -24.549734115600586, "global_step": 220507, "epoch": 2656} {"train_loss": -24.47951889038086, "global_step": 220508, "epoch": 2656} {"train_loss": -24.221675872802734, "global_step": 220509, "epoch": 2656} {"train_loss": -24.635623931884766, "global_step": 220510, "epoch": 2656} {"train_loss": -24.741830825805664, "global_step": 220511, "epoch": 2656} {"train_loss": -24.48812484741211, "global_step": 220512, "epoch": 2656} {"train_loss": -24.621007919311523, "global_step": 220513, "epoch": 2656} {"train_loss": -24.952146530151367, "global_step": 220514, "epoch": 2656} {"train_loss": -24.2106876373291, "global_step": 220515, "epoch": 2656} {"train_loss": -24.67441177368164, "global_step": 220516, "epoch": 2656} {"train_loss": -24.531169891357422, "global_step": 220517, "epoch": 2656} {"train_loss": -24.422836303710938, "global_step": 220518, "epoch": 2656} {"train_loss": -24.556669235229492, "global_step": 220519, "epoch": 2656} {"train_loss": -24.005285263061523, "global_step": 220520, "epoch": 2656} {"train_loss": -24.746877670288086, "global_step": 220521, "epoch": 2656} {"train_loss": -24.507177352905273, "global_step": 220522, "epoch": 2656} {"train_loss": -24.30210304260254, "global_step": 220523, "epoch": 2656} {"train_loss": -24.410511016845703, "global_step": 220524, "epoch": 2656} {"train_loss": -25.015899658203125, "global_step": 220525, "epoch": 2656} {"train_loss": -24.68579864501953, "global_step": 220526, "epoch": 2656} {"train_loss": -24.85221290588379, "global_step": 220527, "epoch": 2656} {"train_loss": -24.488605499267578, "global_step": 220528, "epoch": 2656} {"train_loss": -24.332857131958008, "global_step": 220529, "epoch": 2656} {"train_loss": -24.357012599347584, "global_step": 220530, "epoch": 2656, "val_loss": 6706572.0} {"train_loss": -24.343231201171875, "global_step": 220531, "epoch": 2657} {"train_loss": -23.91267204284668, "global_step": 220532, "epoch": 2657} {"train_loss": -24.444595336914062, "global_step": 220533, "epoch": 2657} {"train_loss": -24.15362548828125, "global_step": 220534, "epoch": 2657} {"train_loss": -23.83562660217285, "global_step": 220535, "epoch": 2657} {"train_loss": -23.766040802001953, "global_step": 220536, "epoch": 2657} {"train_loss": -24.265003204345703, "global_step": 220537, "epoch": 2657} {"train_loss": -23.90996551513672, "global_step": 220538, "epoch": 2657} {"train_loss": -24.19451904296875, "global_step": 220539, "epoch": 2657} {"train_loss": -24.17829704284668, "global_step": 220540, "epoch": 2657} {"train_loss": -24.433303833007812, "global_step": 220541, "epoch": 2657} {"train_loss": -24.356374740600586, "global_step": 220542, "epoch": 2657} {"train_loss": -24.61952018737793, "global_step": 220543, "epoch": 2657} {"train_loss": -24.455068588256836, "global_step": 220544, "epoch": 2657} {"train_loss": -24.367345809936523, "global_step": 220545, "epoch": 2657} {"train_loss": -24.500869750976562, "global_step": 220546, "epoch": 2657} {"train_loss": -24.83650779724121, "global_step": 220547, "epoch": 2657} {"train_loss": -24.58058738708496, "global_step": 220548, "epoch": 2657} {"train_loss": -24.24224853515625, "global_step": 220549, "epoch": 2657} {"train_loss": -24.391952514648438, "global_step": 220550, "epoch": 2657} {"train_loss": -24.557397842407227, "global_step": 220551, "epoch": 2657} {"train_loss": -24.340740203857422, "global_step": 220552, "epoch": 2657} {"train_loss": -24.631071090698242, "global_step": 220553, "epoch": 2657} {"train_loss": -24.880395889282227, "global_step": 220554, "epoch": 2657} {"train_loss": -24.73943519592285, "global_step": 220555, "epoch": 2657} {"train_loss": -24.357589721679688, "global_step": 220556, "epoch": 2657} {"train_loss": -24.916305541992188, "global_step": 220557, "epoch": 2657} {"train_loss": -24.52516746520996, "global_step": 220558, "epoch": 2657} {"train_loss": -24.764080047607422, "global_step": 220559, "epoch": 2657} {"train_loss": -24.763031005859375, "global_step": 220560, "epoch": 2657} {"train_loss": -24.799673080444336, "global_step": 220561, "epoch": 2657} {"train_loss": -24.734277725219727, "global_step": 220562, "epoch": 2657} {"train_loss": -24.541168212890625, "global_step": 220563, "epoch": 2657} {"train_loss": -24.73048973083496, "global_step": 220564, "epoch": 2657} {"train_loss": -24.563236236572266, "global_step": 220565, "epoch": 2657} {"train_loss": -24.42572021484375, "global_step": 220566, "epoch": 2657} {"train_loss": -24.55370330810547, "global_step": 220567, "epoch": 2657} {"train_loss": -24.85115623474121, "global_step": 220568, "epoch": 2657} {"train_loss": -24.76604652404785, "global_step": 220569, "epoch": 2657} {"train_loss": -24.787673950195312, "global_step": 220570, "epoch": 2657} {"train_loss": -24.55592918395996, "global_step": 220571, "epoch": 2657} {"train_loss": -24.617733001708984, "global_step": 220572, "epoch": 2657} {"train_loss": -24.742116928100586, "global_step": 220573, "epoch": 2657} {"train_loss": -24.41352653503418, "global_step": 220574, "epoch": 2657} {"train_loss": -24.554182052612305, "global_step": 220575, "epoch": 2657} {"train_loss": -24.4163875579834, "global_step": 220576, "epoch": 2657} {"train_loss": -25.162975311279297, "global_step": 220577, "epoch": 2657} {"train_loss": -24.640310287475586, "global_step": 220578, "epoch": 2657} {"train_loss": -24.358631134033203, "global_step": 220579, "epoch": 2657} {"train_loss": -24.2426700592041, "global_step": 220580, "epoch": 2657} {"train_loss": -24.81454849243164, "global_step": 220581, "epoch": 2657} {"train_loss": -24.733861923217773, "global_step": 220582, "epoch": 2657} {"train_loss": -24.574111938476562, "global_step": 220583, "epoch": 2657} {"train_loss": -24.830659866333008, "global_step": 220584, "epoch": 2657} {"train_loss": -24.68528938293457, "global_step": 220585, "epoch": 2657} {"train_loss": -24.877355575561523, "global_step": 220586, "epoch": 2657} {"train_loss": -24.61869239807129, "global_step": 220587, "epoch": 2657} {"train_loss": -24.401123046875, "global_step": 220588, "epoch": 2657} {"train_loss": -24.89072608947754, "global_step": 220589, "epoch": 2657} {"train_loss": -24.821752548217773, "global_step": 220590, "epoch": 2657} {"train_loss": -24.91941261291504, "global_step": 220591, "epoch": 2657} {"train_loss": -24.57184410095215, "global_step": 220592, "epoch": 2657} {"train_loss": -24.352684020996094, "global_step": 220593, "epoch": 2657} {"train_loss": -24.481863021850586, "global_step": 220594, "epoch": 2657} {"train_loss": -24.706384658813477, "global_step": 220595, "epoch": 2657} {"train_loss": -24.68128204345703, "global_step": 220596, "epoch": 2657} {"train_loss": -24.380659103393555, "global_step": 220597, "epoch": 2657} {"train_loss": -24.786415100097656, "global_step": 220598, "epoch": 2657} {"train_loss": -24.911230087280273, "global_step": 220599, "epoch": 2657} {"train_loss": -24.724882125854492, "global_step": 220600, "epoch": 2657} {"train_loss": -24.588014602661133, "global_step": 220601, "epoch": 2657} {"train_loss": -24.522876739501953, "global_step": 220602, "epoch": 2657} {"train_loss": -24.65096092224121, "global_step": 220603, "epoch": 2657} {"train_loss": -24.8885440826416, "global_step": 220604, "epoch": 2657} {"train_loss": -24.9852294921875, "global_step": 220605, "epoch": 2657} {"train_loss": -24.57840919494629, "global_step": 220606, "epoch": 2657} {"train_loss": -24.26786231994629, "global_step": 220607, "epoch": 2657} {"train_loss": -24.36348533630371, "global_step": 220608, "epoch": 2657} {"train_loss": -24.407690048217773, "global_step": 220609, "epoch": 2657} {"train_loss": -25.054170608520508, "global_step": 220610, "epoch": 2657} {"train_loss": -24.616613388061523, "global_step": 220611, "epoch": 2657} {"train_loss": -24.788558959960938, "global_step": 220612, "epoch": 2657} {"train_loss": -24.577396208981433, "global_step": 220613, "epoch": 2657, "val_loss": 6543920.0} {"train_loss": -23.846668243408203, "global_step": 220614, "epoch": 2658} {"train_loss": -23.582592010498047, "global_step": 220615, "epoch": 2658} {"train_loss": -24.304956436157227, "global_step": 220616, "epoch": 2658} {"train_loss": -23.994871139526367, "global_step": 220617, "epoch": 2658} {"train_loss": -23.750391006469727, "global_step": 220618, "epoch": 2658} {"train_loss": -24.137510299682617, "global_step": 220619, "epoch": 2658} {"train_loss": -24.390838623046875, "global_step": 220620, "epoch": 2658} {"train_loss": -23.989965438842773, "global_step": 220621, "epoch": 2658} {"train_loss": -24.004352569580078, "global_step": 220622, "epoch": 2658} {"train_loss": -24.639511108398438, "global_step": 220623, "epoch": 2658} {"train_loss": -24.43912124633789, "global_step": 220624, "epoch": 2658} {"train_loss": -24.499860763549805, "global_step": 220625, "epoch": 2658} {"train_loss": -24.13751792907715, "global_step": 220626, "epoch": 2658} {"train_loss": -24.37930679321289, "global_step": 220627, "epoch": 2658} {"train_loss": -24.200387954711914, "global_step": 220628, "epoch": 2658} {"train_loss": -24.32429313659668, "global_step": 220629, "epoch": 2658} {"train_loss": -24.526630401611328, "global_step": 220630, "epoch": 2658} {"train_loss": -24.418310165405273, "global_step": 220631, "epoch": 2658} {"train_loss": -24.415760040283203, "global_step": 220632, "epoch": 2658} {"train_loss": -24.43836784362793, "global_step": 220633, "epoch": 2658} {"train_loss": -24.391815185546875, "global_step": 220634, "epoch": 2658} {"train_loss": -24.50337791442871, "global_step": 220635, "epoch": 2658} {"train_loss": -24.887054443359375, "global_step": 220636, "epoch": 2658} {"train_loss": -24.098875045776367, "global_step": 220637, "epoch": 2658} {"train_loss": -24.333227157592773, "global_step": 220638, "epoch": 2658} {"train_loss": -24.56186294555664, "global_step": 220639, "epoch": 2658} {"train_loss": -24.53279685974121, "global_step": 220640, "epoch": 2658} {"train_loss": -24.314077377319336, "global_step": 220641, "epoch": 2658} {"train_loss": -25.02752113342285, "global_step": 220642, "epoch": 2658} {"train_loss": -24.568660736083984, "global_step": 220643, "epoch": 2658} {"train_loss": -24.803810119628906, "global_step": 220644, "epoch": 2658} {"train_loss": -25.101757049560547, "global_step": 220645, "epoch": 2658} {"train_loss": -24.49000358581543, "global_step": 220646, "epoch": 2658} {"train_loss": -24.869810104370117, "global_step": 220647, "epoch": 2658} {"train_loss": -24.955219268798828, "global_step": 220648, "epoch": 2658} {"train_loss": -24.488615036010742, "global_step": 220649, "epoch": 2658} {"train_loss": -24.63960838317871, "global_step": 220650, "epoch": 2658} {"train_loss": -24.72488784790039, "global_step": 220651, "epoch": 2658} {"train_loss": -24.7753849029541, "global_step": 220652, "epoch": 2658} {"train_loss": -24.79380989074707, "global_step": 220653, "epoch": 2658} {"train_loss": -24.929819107055664, "global_step": 220654, "epoch": 2658} {"train_loss": -24.836103439331055, "global_step": 220655, "epoch": 2658} {"train_loss": -24.540325164794922, "global_step": 220656, "epoch": 2658} {"train_loss": -24.711902618408203, "global_step": 220657, "epoch": 2658} {"train_loss": -24.62906837463379, "global_step": 220658, "epoch": 2658} {"train_loss": -24.46588897705078, "global_step": 220659, "epoch": 2658} {"train_loss": -23.908416748046875, "global_step": 220660, "epoch": 2658} {"train_loss": -24.430822372436523, "global_step": 220661, "epoch": 2658} {"train_loss": -24.471073150634766, "global_step": 220662, "epoch": 2658} {"train_loss": -24.76874351501465, "global_step": 220663, "epoch": 2658} {"train_loss": -24.607284545898438, "global_step": 220664, "epoch": 2658} {"train_loss": -24.871601104736328, "global_step": 220665, "epoch": 2658} {"train_loss": -24.432950973510742, "global_step": 220666, "epoch": 2658} {"train_loss": -24.712488174438477, "global_step": 220667, "epoch": 2658} {"train_loss": -24.57278823852539, "global_step": 220668, "epoch": 2658} {"train_loss": -24.494380950927734, "global_step": 220669, "epoch": 2658} {"train_loss": -24.917238235473633, "global_step": 220670, "epoch": 2658} {"train_loss": -24.70869255065918, "global_step": 220671, "epoch": 2658} {"train_loss": -24.473230361938477, "global_step": 220672, "epoch": 2658} {"train_loss": -24.60878562927246, "global_step": 220673, "epoch": 2658} {"train_loss": -24.65406608581543, "global_step": 220674, "epoch": 2658} {"train_loss": -24.218795776367188, "global_step": 220675, "epoch": 2658} {"train_loss": -24.586448669433594, "global_step": 220676, "epoch": 2658} {"train_loss": -24.76541519165039, "global_step": 220677, "epoch": 2658} {"train_loss": -24.923364639282227, "global_step": 220678, "epoch": 2658} {"train_loss": -24.51123046875, "global_step": 220679, "epoch": 2658} {"train_loss": -24.914243698120117, "global_step": 220680, "epoch": 2658} {"train_loss": -24.324583053588867, "global_step": 220681, "epoch": 2658} {"train_loss": -24.38630485534668, "global_step": 220682, "epoch": 2658} {"train_loss": -24.81633186340332, "global_step": 220683, "epoch": 2658} {"train_loss": -24.541091918945312, "global_step": 220684, "epoch": 2658} {"train_loss": -24.302749633789062, "global_step": 220685, "epoch": 2658} {"train_loss": -24.604665756225586, "global_step": 220686, "epoch": 2658} {"train_loss": -24.362735748291016, "global_step": 220687, "epoch": 2658} {"train_loss": -24.6809024810791, "global_step": 220688, "epoch": 2658} {"train_loss": -24.409006118774414, "global_step": 220689, "epoch": 2658} {"train_loss": -24.539325714111328, "global_step": 220690, "epoch": 2658} {"train_loss": -24.919174194335938, "global_step": 220691, "epoch": 2658} {"train_loss": -24.369155883789062, "global_step": 220692, "epoch": 2658} {"train_loss": -24.74840545654297, "global_step": 220693, "epoch": 2658} {"train_loss": -24.585773468017578, "global_step": 220694, "epoch": 2658} {"train_loss": -24.34120750427246, "global_step": 220695, "epoch": 2658} {"train_loss": -24.5133612529341, "global_step": 220696, "epoch": 2658, "val_loss": 6678995.0} {"train_loss": -24.237232208251953, "global_step": 220697, "epoch": 2659} {"train_loss": -24.574050903320312, "global_step": 220698, "epoch": 2659} {"train_loss": -24.264923095703125, "global_step": 220699, "epoch": 2659} {"train_loss": -24.704805374145508, "global_step": 220700, "epoch": 2659} {"train_loss": -24.443571090698242, "global_step": 220701, "epoch": 2659} {"train_loss": -24.466638565063477, "global_step": 220702, "epoch": 2659} {"train_loss": -24.633230209350586, "global_step": 220703, "epoch": 2659} {"train_loss": -24.449377059936523, "global_step": 220704, "epoch": 2659} {"train_loss": -24.505685806274414, "global_step": 220705, "epoch": 2659} {"train_loss": -24.343671798706055, "global_step": 220706, "epoch": 2659} {"train_loss": -24.377216339111328, "global_step": 220707, "epoch": 2659} {"train_loss": -24.316328048706055, "global_step": 220708, "epoch": 2659} {"train_loss": -24.850048065185547, "global_step": 220709, "epoch": 2659} {"train_loss": -24.690811157226562, "global_step": 220710, "epoch": 2659} {"train_loss": -24.570085525512695, "global_step": 220711, "epoch": 2659} {"train_loss": -24.455415725708008, "global_step": 220712, "epoch": 2659} {"train_loss": -24.33359718322754, "global_step": 220713, "epoch": 2659} {"train_loss": -24.953893661499023, "global_step": 220714, "epoch": 2659} {"train_loss": -24.412269592285156, "global_step": 220715, "epoch": 2659} {"train_loss": -24.378171920776367, "global_step": 220716, "epoch": 2659} {"train_loss": -24.457420349121094, "global_step": 220717, "epoch": 2659} {"train_loss": -24.67591667175293, "global_step": 220718, "epoch": 2659} {"train_loss": -24.849084854125977, "global_step": 220719, "epoch": 2659} {"train_loss": -24.57295799255371, "global_step": 220720, "epoch": 2659} {"train_loss": -24.32663917541504, "global_step": 220721, "epoch": 2659} {"train_loss": -24.806325912475586, "global_step": 220722, "epoch": 2659} {"train_loss": -24.88395118713379, "global_step": 220723, "epoch": 2659} {"train_loss": -24.528013229370117, "global_step": 220724, "epoch": 2659} {"train_loss": -24.49264144897461, "global_step": 220725, "epoch": 2659} {"train_loss": -24.610319137573242, "global_step": 220726, "epoch": 2659} {"train_loss": -24.99226951599121, "global_step": 220727, "epoch": 2659} {"train_loss": -25.01991081237793, "global_step": 220728, "epoch": 2659} {"train_loss": -24.525175094604492, "global_step": 220729, "epoch": 2659} {"train_loss": -24.89226722717285, "global_step": 220730, "epoch": 2659} {"train_loss": -24.742267608642578, "global_step": 220731, "epoch": 2659} {"train_loss": -24.690963745117188, "global_step": 220732, "epoch": 2659} {"train_loss": -24.67363929748535, "global_step": 220733, "epoch": 2659} {"train_loss": -24.850385665893555, "global_step": 220734, "epoch": 2659} {"train_loss": -24.73450469970703, "global_step": 220735, "epoch": 2659} {"train_loss": -24.79444122314453, "global_step": 220736, "epoch": 2659} {"train_loss": -24.98750877380371, "global_step": 220737, "epoch": 2659} {"train_loss": -24.37630271911621, "global_step": 220738, "epoch": 2659} {"train_loss": -24.218961715698242, "global_step": 220739, "epoch": 2659} {"train_loss": -24.211044311523438, "global_step": 220740, "epoch": 2659} {"train_loss": -24.22316551208496, "global_step": 220741, "epoch": 2659} {"train_loss": -24.399089813232422, "global_step": 220742, "epoch": 2659} {"train_loss": -24.650516510009766, "global_step": 220743, "epoch": 2659} {"train_loss": -24.920316696166992, "global_step": 220744, "epoch": 2659} {"train_loss": -24.694578170776367, "global_step": 220745, "epoch": 2659} {"train_loss": -24.350543975830078, "global_step": 220746, "epoch": 2659} {"train_loss": -24.667577743530273, "global_step": 220747, "epoch": 2659} {"train_loss": -24.680404663085938, "global_step": 220748, "epoch": 2659} {"train_loss": -24.650890350341797, "global_step": 220749, "epoch": 2659} {"train_loss": -24.728796005249023, "global_step": 220750, "epoch": 2659} {"train_loss": -24.626211166381836, "global_step": 220751, "epoch": 2659} {"train_loss": -24.716861724853516, "global_step": 220752, "epoch": 2659} {"train_loss": -24.94984245300293, "global_step": 220753, "epoch": 2659} {"train_loss": -25.04409408569336, "global_step": 220754, "epoch": 2659} {"train_loss": -24.463979721069336, "global_step": 220755, "epoch": 2659} {"train_loss": -24.810958862304688, "global_step": 220756, "epoch": 2659} {"train_loss": -24.52680778503418, "global_step": 220757, "epoch": 2659} {"train_loss": -24.724184036254883, "global_step": 220758, "epoch": 2659} {"train_loss": -24.40642738342285, "global_step": 220759, "epoch": 2659} {"train_loss": -25.01157569885254, "global_step": 220760, "epoch": 2659} {"train_loss": -24.78206443786621, "global_step": 220761, "epoch": 2659} {"train_loss": -24.399280548095703, "global_step": 220762, "epoch": 2659} {"train_loss": -24.301929473876953, "global_step": 220763, "epoch": 2659} {"train_loss": -24.6051082611084, "global_step": 220764, "epoch": 2659} {"train_loss": -24.172147750854492, "global_step": 220765, "epoch": 2659} {"train_loss": -24.970460891723633, "global_step": 220766, "epoch": 2659} {"train_loss": -24.451828002929688, "global_step": 220767, "epoch": 2659} {"train_loss": -24.500791549682617, "global_step": 220768, "epoch": 2659} {"train_loss": -24.460681915283203, "global_step": 220769, "epoch": 2659} {"train_loss": -24.526350021362305, "global_step": 220770, "epoch": 2659} {"train_loss": -24.379165649414062, "global_step": 220771, "epoch": 2659} {"train_loss": -24.804962158203125, "global_step": 220772, "epoch": 2659} {"train_loss": -24.444168090820312, "global_step": 220773, "epoch": 2659} {"train_loss": -24.546430587768555, "global_step": 220774, "epoch": 2659} {"train_loss": -24.344884872436523, "global_step": 220775, "epoch": 2659} {"train_loss": -24.80141258239746, "global_step": 220776, "epoch": 2659} {"train_loss": -24.419727325439453, "global_step": 220777, "epoch": 2659} {"train_loss": -24.460893630981445, "global_step": 220778, "epoch": 2659} {"train_loss": -24.59377114169569, "global_step": 220779, "epoch": 2659, "val_loss": 6580122.0} {"train_loss": -23.2521915435791, "global_step": 220780, "epoch": 2660} {"train_loss": -23.5513858795166, "global_step": 220781, "epoch": 2660} {"train_loss": -23.872488021850586, "global_step": 220782, "epoch": 2660} {"train_loss": -23.38385009765625, "global_step": 220783, "epoch": 2660} {"train_loss": -23.793102264404297, "global_step": 220784, "epoch": 2660} {"train_loss": -24.222116470336914, "global_step": 220785, "epoch": 2660} {"train_loss": -24.200490951538086, "global_step": 220786, "epoch": 2660} {"train_loss": -24.218454360961914, "global_step": 220787, "epoch": 2660} {"train_loss": -24.083332061767578, "global_step": 220788, "epoch": 2660} {"train_loss": -24.049497604370117, "global_step": 220789, "epoch": 2660} {"train_loss": -24.076025009155273, "global_step": 220790, "epoch": 2660} {"train_loss": -23.90590476989746, "global_step": 220791, "epoch": 2660} {"train_loss": -24.229839324951172, "global_step": 220792, "epoch": 2660} {"train_loss": -24.336894989013672, "global_step": 220793, "epoch": 2660} {"train_loss": -24.12796974182129, "global_step": 220794, "epoch": 2660} {"train_loss": -24.080591201782227, "global_step": 220795, "epoch": 2660} {"train_loss": -24.14420509338379, "global_step": 220796, "epoch": 2660} {"train_loss": -24.086318969726562, "global_step": 220797, "epoch": 2660} {"train_loss": -24.545429229736328, "global_step": 220798, "epoch": 2660} {"train_loss": -24.06361198425293, "global_step": 220799, "epoch": 2660} {"train_loss": -24.306631088256836, "global_step": 220800, "epoch": 2660} {"train_loss": -24.173643112182617, "global_step": 220801, "epoch": 2660} {"train_loss": -24.41823959350586, "global_step": 220802, "epoch": 2660} {"train_loss": -24.410598754882812, "global_step": 220803, "epoch": 2660} {"train_loss": -24.62066650390625, "global_step": 220804, "epoch": 2660} {"train_loss": -24.09639549255371, "global_step": 220805, "epoch": 2660} {"train_loss": -24.473922729492188, "global_step": 220806, "epoch": 2660} {"train_loss": -24.366846084594727, "global_step": 220807, "epoch": 2660} {"train_loss": -24.257028579711914, "global_step": 220808, "epoch": 2660} {"train_loss": -24.58697509765625, "global_step": 220809, "epoch": 2660} {"train_loss": -24.45926284790039, "global_step": 220810, "epoch": 2660} {"train_loss": -24.585384368896484, "global_step": 220811, "epoch": 2660} {"train_loss": -24.222501754760742, "global_step": 220812, "epoch": 2660} {"train_loss": -24.348237991333008, "global_step": 220813, "epoch": 2660} {"train_loss": -24.671443939208984, "global_step": 220814, "epoch": 2660} {"train_loss": -24.42028045654297, "global_step": 220815, "epoch": 2660} {"train_loss": -24.669321060180664, "global_step": 220816, "epoch": 2660} {"train_loss": -24.65932273864746, "global_step": 220817, "epoch": 2660} {"train_loss": -24.394128799438477, "global_step": 220818, "epoch": 2660} {"train_loss": -24.36622428894043, "global_step": 220819, "epoch": 2660} {"train_loss": -24.675336837768555, "global_step": 220820, "epoch": 2660} {"train_loss": -24.72054100036621, "global_step": 220821, "epoch": 2660} {"train_loss": -24.32197380065918, "global_step": 220822, "epoch": 2660} {"train_loss": -24.477258682250977, "global_step": 220823, "epoch": 2660} {"train_loss": -24.565902709960938, "global_step": 220824, "epoch": 2660} {"train_loss": -24.667184829711914, "global_step": 220825, "epoch": 2660} {"train_loss": -25.09809112548828, "global_step": 220826, "epoch": 2660} {"train_loss": -24.38361930847168, "global_step": 220827, "epoch": 2660} {"train_loss": -24.923297882080078, "global_step": 220828, "epoch": 2660} {"train_loss": -24.538497924804688, "global_step": 220829, "epoch": 2660} {"train_loss": -24.66129493713379, "global_step": 220830, "epoch": 2660} {"train_loss": -24.581924438476562, "global_step": 220831, "epoch": 2660} {"train_loss": -24.438268661499023, "global_step": 220832, "epoch": 2660} {"train_loss": -24.342832565307617, "global_step": 220833, "epoch": 2660} {"train_loss": -24.723459243774414, "global_step": 220834, "epoch": 2660} {"train_loss": -24.38654899597168, "global_step": 220835, "epoch": 2660} {"train_loss": -24.730985641479492, "global_step": 220836, "epoch": 2660} {"train_loss": -24.60556983947754, "global_step": 220837, "epoch": 2660} {"train_loss": -24.55517578125, "global_step": 220838, "epoch": 2660} {"train_loss": -24.88530158996582, "global_step": 220839, "epoch": 2660} {"train_loss": -24.662412643432617, "global_step": 220840, "epoch": 2660} {"train_loss": -24.55635643005371, "global_step": 220841, "epoch": 2660} {"train_loss": -24.552995681762695, "global_step": 220842, "epoch": 2660} {"train_loss": -24.26865577697754, "global_step": 220843, "epoch": 2660} {"train_loss": -24.865528106689453, "global_step": 220844, "epoch": 2660} {"train_loss": -24.796342849731445, "global_step": 220845, "epoch": 2660} {"train_loss": -24.6456241607666, "global_step": 220846, "epoch": 2660} {"train_loss": -24.43928337097168, "global_step": 220847, "epoch": 2660} {"train_loss": -24.528934478759766, "global_step": 220848, "epoch": 2660} {"train_loss": -24.67897605895996, "global_step": 220849, "epoch": 2660} {"train_loss": -24.718107223510742, "global_step": 220850, "epoch": 2660} {"train_loss": -24.6344051361084, "global_step": 220851, "epoch": 2660} {"train_loss": -24.51813316345215, "global_step": 220852, "epoch": 2660} {"train_loss": -24.569318771362305, "global_step": 220853, "epoch": 2660} {"train_loss": -24.485422134399414, "global_step": 220854, "epoch": 2660} {"train_loss": -24.780317306518555, "global_step": 220855, "epoch": 2660} {"train_loss": -24.204824447631836, "global_step": 220856, "epoch": 2660} {"train_loss": -24.372800827026367, "global_step": 220857, "epoch": 2660} {"train_loss": -24.677093505859375, "global_step": 220858, "epoch": 2660} {"train_loss": -24.83083152770996, "global_step": 220859, "epoch": 2660} {"train_loss": -24.746614456176758, "global_step": 220860, "epoch": 2660} {"train_loss": -24.96351432800293, "global_step": 220861, "epoch": 2660} {"train_loss": -24.417281966611565, "global_step": 220862, "epoch": 2660, "val_loss": 6792719.0} {"train_loss": -24.639265060424805, "global_step": 220863, "epoch": 2661} {"train_loss": -24.204965591430664, "global_step": 220864, "epoch": 2661} {"train_loss": -23.590763092041016, "global_step": 220865, "epoch": 2661} {"train_loss": -23.383563995361328, "global_step": 220866, "epoch": 2661} {"train_loss": -24.074668884277344, "global_step": 220867, "epoch": 2661} {"train_loss": -24.538415908813477, "global_step": 220868, "epoch": 2661} {"train_loss": -24.362173080444336, "global_step": 220869, "epoch": 2661} {"train_loss": -24.365697860717773, "global_step": 220870, "epoch": 2661} {"train_loss": -24.320531845092773, "global_step": 220871, "epoch": 2661} {"train_loss": -24.413543701171875, "global_step": 220872, "epoch": 2661} {"train_loss": -24.372045516967773, "global_step": 220873, "epoch": 2661} {"train_loss": -24.390968322753906, "global_step": 220874, "epoch": 2661} {"train_loss": -24.728519439697266, "global_step": 220875, "epoch": 2661} {"train_loss": -24.828327178955078, "global_step": 220876, "epoch": 2661} {"train_loss": -24.526437759399414, "global_step": 220877, "epoch": 2661} {"train_loss": -24.48198699951172, "global_step": 220878, "epoch": 2661} {"train_loss": -24.655981063842773, "global_step": 220879, "epoch": 2661} {"train_loss": -24.616575241088867, "global_step": 220880, "epoch": 2661} {"train_loss": -24.861364364624023, "global_step": 220881, "epoch": 2661} {"train_loss": -24.328475952148438, "global_step": 220882, "epoch": 2661} {"train_loss": -24.514768600463867, "global_step": 220883, "epoch": 2661} {"train_loss": -24.531307220458984, "global_step": 220884, "epoch": 2661} {"train_loss": -24.51799964904785, "global_step": 220885, "epoch": 2661} {"train_loss": -24.431638717651367, "global_step": 220886, "epoch": 2661} {"train_loss": -24.816612243652344, "global_step": 220887, "epoch": 2661} {"train_loss": -24.65296173095703, "global_step": 220888, "epoch": 2661} {"train_loss": -24.4976749420166, "global_step": 220889, "epoch": 2661} {"train_loss": -24.39175796508789, "global_step": 220890, "epoch": 2661} {"train_loss": -24.527217864990234, "global_step": 220891, "epoch": 2661} {"train_loss": -24.819257736206055, "global_step": 220892, "epoch": 2661} {"train_loss": -24.350845336914062, "global_step": 220893, "epoch": 2661} {"train_loss": -24.69044303894043, "global_step": 220894, "epoch": 2661} {"train_loss": -24.781692504882812, "global_step": 220895, "epoch": 2661} {"train_loss": -25.01715660095215, "global_step": 220896, "epoch": 2661} {"train_loss": -24.883298873901367, "global_step": 220897, "epoch": 2661} {"train_loss": -24.446636199951172, "global_step": 220898, "epoch": 2661} {"train_loss": -25.010604858398438, "global_step": 220899, "epoch": 2661} {"train_loss": -25.034391403198242, "global_step": 220900, "epoch": 2661} {"train_loss": -24.67352294921875, "global_step": 220901, "epoch": 2661} {"train_loss": -24.73345184326172, "global_step": 220902, "epoch": 2661} {"train_loss": -24.62238883972168, "global_step": 220903, "epoch": 2661} {"train_loss": -24.802419662475586, "global_step": 220904, "epoch": 2661} {"train_loss": -25.064071655273438, "global_step": 220905, "epoch": 2661} {"train_loss": -24.8276424407959, "global_step": 220906, "epoch": 2661} {"train_loss": -24.830629348754883, "global_step": 220907, "epoch": 2661} {"train_loss": -24.80560874938965, "global_step": 220908, "epoch": 2661} {"train_loss": -24.741992950439453, "global_step": 220909, "epoch": 2661} {"train_loss": -24.509817123413086, "global_step": 220910, "epoch": 2661} {"train_loss": -24.728063583374023, "global_step": 220911, "epoch": 2661} {"train_loss": -24.465478897094727, "global_step": 220912, "epoch": 2661} {"train_loss": -23.996845245361328, "global_step": 220913, "epoch": 2661} {"train_loss": -24.570680618286133, "global_step": 220914, "epoch": 2661} {"train_loss": -24.47491455078125, "global_step": 220915, "epoch": 2661} {"train_loss": -24.802228927612305, "global_step": 220916, "epoch": 2661} {"train_loss": -24.453907012939453, "global_step": 220917, "epoch": 2661} {"train_loss": -24.361337661743164, "global_step": 220918, "epoch": 2661} {"train_loss": -24.531423568725586, "global_step": 220919, "epoch": 2661} {"train_loss": -24.33784294128418, "global_step": 220920, "epoch": 2661} {"train_loss": -24.72196388244629, "global_step": 220921, "epoch": 2661} {"train_loss": -24.583707809448242, "global_step": 220922, "epoch": 2661} {"train_loss": -24.792997360229492, "global_step": 220923, "epoch": 2661} {"train_loss": -24.25752830505371, "global_step": 220924, "epoch": 2661} {"train_loss": -24.60085105895996, "global_step": 220925, "epoch": 2661} {"train_loss": -24.45229721069336, "global_step": 220926, "epoch": 2661} {"train_loss": -24.331716537475586, "global_step": 220927, "epoch": 2661} {"train_loss": -24.248212814331055, "global_step": 220928, "epoch": 2661} {"train_loss": -24.522109985351562, "global_step": 220929, "epoch": 2661} {"train_loss": -24.557458877563477, "global_step": 220930, "epoch": 2661} {"train_loss": -24.760177612304688, "global_step": 220931, "epoch": 2661} {"train_loss": -24.868833541870117, "global_step": 220932, "epoch": 2661} {"train_loss": -24.044986724853516, "global_step": 220933, "epoch": 2661} {"train_loss": -24.67812156677246, "global_step": 220934, "epoch": 2661} {"train_loss": -24.924543380737305, "global_step": 220935, "epoch": 2661} {"train_loss": -24.527311325073242, "global_step": 220936, "epoch": 2661} {"train_loss": -24.147550582885742, "global_step": 220937, "epoch": 2661} {"train_loss": -25.007986068725586, "global_step": 220938, "epoch": 2661} {"train_loss": -24.30100440979004, "global_step": 220939, "epoch": 2661} {"train_loss": -24.560453414916992, "global_step": 220940, "epoch": 2661} {"train_loss": -24.290592193603516, "global_step": 220941, "epoch": 2661} {"train_loss": -24.8248348236084, "global_step": 220942, "epoch": 2661} {"train_loss": -24.65787696838379, "global_step": 220943, "epoch": 2661} {"train_loss": -24.5799617767334, "global_step": 220944, "epoch": 2661} {"train_loss": -24.529010634824456, "global_step": 220945, "epoch": 2661, "val_loss": 6819573.0} {"train_loss": -24.173521041870117, "global_step": 220946, "epoch": 2662} {"train_loss": -24.112668991088867, "global_step": 220947, "epoch": 2662} {"train_loss": -23.99640655517578, "global_step": 220948, "epoch": 2662} {"train_loss": -24.244516372680664, "global_step": 220949, "epoch": 2662} {"train_loss": -24.335172653198242, "global_step": 220950, "epoch": 2662} {"train_loss": -24.10552978515625, "global_step": 220951, "epoch": 2662} {"train_loss": -24.43929100036621, "global_step": 220952, "epoch": 2662} {"train_loss": -23.934293746948242, "global_step": 220953, "epoch": 2662} {"train_loss": -24.043119430541992, "global_step": 220954, "epoch": 2662} {"train_loss": -24.30763053894043, "global_step": 220955, "epoch": 2662} {"train_loss": -24.563520431518555, "global_step": 220956, "epoch": 2662} {"train_loss": -24.237903594970703, "global_step": 220957, "epoch": 2662} {"train_loss": -24.098133087158203, "global_step": 220958, "epoch": 2662} {"train_loss": -24.601303100585938, "global_step": 220959, "epoch": 2662} {"train_loss": -24.571340560913086, "global_step": 220960, "epoch": 2662} {"train_loss": -24.588356018066406, "global_step": 220961, "epoch": 2662} {"train_loss": -24.532590866088867, "global_step": 220962, "epoch": 2662} {"train_loss": -24.279876708984375, "global_step": 220963, "epoch": 2662} {"train_loss": -24.46578025817871, "global_step": 220964, "epoch": 2662} {"train_loss": -24.497644424438477, "global_step": 220965, "epoch": 2662} {"train_loss": -24.67195701599121, "global_step": 220966, "epoch": 2662} {"train_loss": -24.717329025268555, "global_step": 220967, "epoch": 2662} {"train_loss": -24.40718650817871, "global_step": 220968, "epoch": 2662} {"train_loss": -24.704626083374023, "global_step": 220969, "epoch": 2662} {"train_loss": -24.575536727905273, "global_step": 220970, "epoch": 2662} {"train_loss": -24.377792358398438, "global_step": 220971, "epoch": 2662} {"train_loss": -24.65284538269043, "global_step": 220972, "epoch": 2662} {"train_loss": -24.824766159057617, "global_step": 220973, "epoch": 2662} {"train_loss": -24.26612663269043, "global_step": 220974, "epoch": 2662} {"train_loss": -24.3580265045166, "global_step": 220975, "epoch": 2662} {"train_loss": -24.61598014831543, "global_step": 220976, "epoch": 2662} {"train_loss": -24.5063533782959, "global_step": 220977, "epoch": 2662} {"train_loss": -24.822031021118164, "global_step": 220978, "epoch": 2662} {"train_loss": -24.638051986694336, "global_step": 220979, "epoch": 2662} {"train_loss": -24.506744384765625, "global_step": 220980, "epoch": 2662} {"train_loss": -24.390186309814453, "global_step": 220981, "epoch": 2662} {"train_loss": -24.8748779296875, "global_step": 220982, "epoch": 2662} {"train_loss": -24.398723602294922, "global_step": 220983, "epoch": 2662} {"train_loss": -24.94464111328125, "global_step": 220984, "epoch": 2662} {"train_loss": -24.454519271850586, "global_step": 220985, "epoch": 2662} {"train_loss": -24.869535446166992, "global_step": 220986, "epoch": 2662} {"train_loss": -24.838598251342773, "global_step": 220987, "epoch": 2662} {"train_loss": -24.869216918945312, "global_step": 220988, "epoch": 2662} {"train_loss": -24.608427047729492, "global_step": 220989, "epoch": 2662} {"train_loss": -25.036020278930664, "global_step": 220990, "epoch": 2662} {"train_loss": -24.66216468811035, "global_step": 220991, "epoch": 2662} {"train_loss": -24.649717330932617, "global_step": 220992, "epoch": 2662} {"train_loss": -24.331584930419922, "global_step": 220993, "epoch": 2662} {"train_loss": -24.837610244750977, "global_step": 220994, "epoch": 2662} {"train_loss": -24.771686553955078, "global_step": 220995, "epoch": 2662} {"train_loss": -24.66793441772461, "global_step": 220996, "epoch": 2662} {"train_loss": -24.697982788085938, "global_step": 220997, "epoch": 2662} {"train_loss": -24.9528751373291, "global_step": 220998, "epoch": 2662} {"train_loss": -24.707691192626953, "global_step": 220999, "epoch": 2662} {"train_loss": -24.589635848999023, "global_step": 221000, "epoch": 2662} {"train_loss": -25.1187744140625, "global_step": 221001, "epoch": 2662} {"train_loss": -24.934236526489258, "global_step": 221002, "epoch": 2662} {"train_loss": -24.718915939331055, "global_step": 221003, "epoch": 2662} {"train_loss": -24.68924331665039, "global_step": 221004, "epoch": 2662} {"train_loss": -24.556058883666992, "global_step": 221005, "epoch": 2662} {"train_loss": -24.67037010192871, "global_step": 221006, "epoch": 2662} {"train_loss": -24.874866485595703, "global_step": 221007, "epoch": 2662} {"train_loss": -24.241500854492188, "global_step": 221008, "epoch": 2662} {"train_loss": -24.75119400024414, "global_step": 221009, "epoch": 2662} {"train_loss": -24.391359329223633, "global_step": 221010, "epoch": 2662} {"train_loss": -24.56694221496582, "global_step": 221011, "epoch": 2662} {"train_loss": -24.656274795532227, "global_step": 221012, "epoch": 2662} {"train_loss": -24.622079849243164, "global_step": 221013, "epoch": 2662} {"train_loss": -24.84710121154785, "global_step": 221014, "epoch": 2662} {"train_loss": -24.31209373474121, "global_step": 221015, "epoch": 2662} {"train_loss": -24.8284854888916, "global_step": 221016, "epoch": 2662} {"train_loss": -24.679338455200195, "global_step": 221017, "epoch": 2662} {"train_loss": -24.648900985717773, "global_step": 221018, "epoch": 2662} {"train_loss": -24.748912811279297, "global_step": 221019, "epoch": 2662} {"train_loss": -24.735593795776367, "global_step": 221020, "epoch": 2662} {"train_loss": -24.42706298828125, "global_step": 221021, "epoch": 2662} {"train_loss": -24.649349212646484, "global_step": 221022, "epoch": 2662} {"train_loss": -24.532880783081055, "global_step": 221023, "epoch": 2662} {"train_loss": -24.625722885131836, "global_step": 221024, "epoch": 2662} {"train_loss": -24.424686431884766, "global_step": 221025, "epoch": 2662} {"train_loss": -24.460012435913086, "global_step": 221026, "epoch": 2662} {"train_loss": -24.65537452697754, "global_step": 221027, "epoch": 2662} {"train_loss": -24.57801524702325, "global_step": 221028, "epoch": 2662, "val_loss": 6609774.0} {"train_loss": -23.22933006286621, "global_step": 221029, "epoch": 2663} {"train_loss": -23.666284561157227, "global_step": 221030, "epoch": 2663} {"train_loss": -24.102182388305664, "global_step": 221031, "epoch": 2663} {"train_loss": -24.046857833862305, "global_step": 221032, "epoch": 2663} {"train_loss": -23.66108512878418, "global_step": 221033, "epoch": 2663} {"train_loss": -24.215801239013672, "global_step": 221034, "epoch": 2663} {"train_loss": -23.57193374633789, "global_step": 221035, "epoch": 2663} {"train_loss": -23.06803321838379, "global_step": 221036, "epoch": 2663} {"train_loss": -24.334415435791016, "global_step": 221037, "epoch": 2663} {"train_loss": -23.780668258666992, "global_step": 221038, "epoch": 2663} {"train_loss": -23.948776245117188, "global_step": 221039, "epoch": 2663} {"train_loss": -24.175622940063477, "global_step": 221040, "epoch": 2663} {"train_loss": -24.253738403320312, "global_step": 221041, "epoch": 2663} {"train_loss": -23.6385440826416, "global_step": 221042, "epoch": 2663} {"train_loss": -24.550039291381836, "global_step": 221043, "epoch": 2663} {"train_loss": -24.065061569213867, "global_step": 221044, "epoch": 2663} {"train_loss": -24.137104034423828, "global_step": 221045, "epoch": 2663} {"train_loss": -24.586950302124023, "global_step": 221046, "epoch": 2663} {"train_loss": -24.392004013061523, "global_step": 221047, "epoch": 2663} {"train_loss": -24.49907684326172, "global_step": 221048, "epoch": 2663} {"train_loss": -24.395832061767578, "global_step": 221049, "epoch": 2663} {"train_loss": -24.526840209960938, "global_step": 221050, "epoch": 2663} {"train_loss": -24.396366119384766, "global_step": 221051, "epoch": 2663} {"train_loss": -24.230825424194336, "global_step": 221052, "epoch": 2663} {"train_loss": -24.431533813476562, "global_step": 221053, "epoch": 2663} {"train_loss": -24.362531661987305, "global_step": 221054, "epoch": 2663} {"train_loss": -24.775623321533203, "global_step": 221055, "epoch": 2663} {"train_loss": -24.561845779418945, "global_step": 221056, "epoch": 2663} {"train_loss": -24.401277542114258, "global_step": 221057, "epoch": 2663} {"train_loss": -24.632417678833008, "global_step": 221058, "epoch": 2663} {"train_loss": -24.15024757385254, "global_step": 221059, "epoch": 2663} {"train_loss": -24.678325653076172, "global_step": 221060, "epoch": 2663} {"train_loss": -24.686580657958984, "global_step": 221061, "epoch": 2663} {"train_loss": -24.722660064697266, "global_step": 221062, "epoch": 2663} {"train_loss": -24.64874839782715, "global_step": 221063, "epoch": 2663} {"train_loss": -24.524641036987305, "global_step": 221064, "epoch": 2663} {"train_loss": -24.816146850585938, "global_step": 221065, "epoch": 2663} {"train_loss": -24.455060958862305, "global_step": 221066, "epoch": 2663} {"train_loss": -24.58047866821289, "global_step": 221067, "epoch": 2663} {"train_loss": -24.879940032958984, "global_step": 221068, "epoch": 2663} {"train_loss": -25.041990280151367, "global_step": 221069, "epoch": 2663} {"train_loss": -24.582889556884766, "global_step": 221070, "epoch": 2663} {"train_loss": -24.581298828125, "global_step": 221071, "epoch": 2663} {"train_loss": -24.819690704345703, "global_step": 221072, "epoch": 2663} {"train_loss": -24.48456382751465, "global_step": 221073, "epoch": 2663} {"train_loss": -24.556777954101562, "global_step": 221074, "epoch": 2663} {"train_loss": -24.736846923828125, "global_step": 221075, "epoch": 2663} {"train_loss": -25.070737838745117, "global_step": 221076, "epoch": 2663} {"train_loss": -24.681537628173828, "global_step": 221077, "epoch": 2663} {"train_loss": -24.68672752380371, "global_step": 221078, "epoch": 2663} {"train_loss": -24.804899215698242, "global_step": 221079, "epoch": 2663} {"train_loss": -25.236358642578125, "global_step": 221080, "epoch": 2663} {"train_loss": -24.43855857849121, "global_step": 221081, "epoch": 2663} {"train_loss": -24.656009674072266, "global_step": 221082, "epoch": 2663} {"train_loss": -24.62506866455078, "global_step": 221083, "epoch": 2663} {"train_loss": -24.70880699157715, "global_step": 221084, "epoch": 2663} {"train_loss": -24.645322799682617, "global_step": 221085, "epoch": 2663} {"train_loss": -24.6414852142334, "global_step": 221086, "epoch": 2663} {"train_loss": -24.78305435180664, "global_step": 221087, "epoch": 2663} {"train_loss": -24.311222076416016, "global_step": 221088, "epoch": 2663} {"train_loss": -24.477636337280273, "global_step": 221089, "epoch": 2663} {"train_loss": -24.905481338500977, "global_step": 221090, "epoch": 2663} {"train_loss": -24.491729736328125, "global_step": 221091, "epoch": 2663} {"train_loss": -24.530105590820312, "global_step": 221092, "epoch": 2663} {"train_loss": -24.329328536987305, "global_step": 221093, "epoch": 2663} {"train_loss": -24.869428634643555, "global_step": 221094, "epoch": 2663} {"train_loss": -24.73415184020996, "global_step": 221095, "epoch": 2663} {"train_loss": -24.754926681518555, "global_step": 221096, "epoch": 2663} {"train_loss": -24.952335357666016, "global_step": 221097, "epoch": 2663} {"train_loss": -24.473962783813477, "global_step": 221098, "epoch": 2663} {"train_loss": -24.536252975463867, "global_step": 221099, "epoch": 2663} {"train_loss": -24.76477813720703, "global_step": 221100, "epoch": 2663} {"train_loss": -24.587766647338867, "global_step": 221101, "epoch": 2663} {"train_loss": -24.503576278686523, "global_step": 221102, "epoch": 2663} {"train_loss": -24.620994567871094, "global_step": 221103, "epoch": 2663} {"train_loss": -24.53961181640625, "global_step": 221104, "epoch": 2663} {"train_loss": -24.502315521240234, "global_step": 221105, "epoch": 2663} {"train_loss": -24.03384780883789, "global_step": 221106, "epoch": 2663} {"train_loss": -24.19598960876465, "global_step": 221107, "epoch": 2663} {"train_loss": -24.34096336364746, "global_step": 221108, "epoch": 2663} {"train_loss": -24.270076751708984, "global_step": 221109, "epoch": 2663} {"train_loss": -24.37239646911621, "global_step": 221110, "epoch": 2663} {"train_loss": -24.451114999242577, "global_step": 221111, "epoch": 2663, "val_loss": 6831232.0} {"train_loss": -24.046247482299805, "global_step": 221112, "epoch": 2664} {"train_loss": -23.15207290649414, "global_step": 221113, "epoch": 2664} {"train_loss": -23.353113174438477, "global_step": 221114, "epoch": 2664} {"train_loss": -24.465208053588867, "global_step": 221115, "epoch": 2664} {"train_loss": -23.26412010192871, "global_step": 221116, "epoch": 2664} {"train_loss": -24.183732986450195, "global_step": 221117, "epoch": 2664} {"train_loss": -23.908300399780273, "global_step": 221118, "epoch": 2664} {"train_loss": -23.74877166748047, "global_step": 221119, "epoch": 2664} {"train_loss": -24.242843627929688, "global_step": 221120, "epoch": 2664} {"train_loss": -23.885929107666016, "global_step": 221121, "epoch": 2664} {"train_loss": -23.929218292236328, "global_step": 221122, "epoch": 2664} {"train_loss": -23.885183334350586, "global_step": 221123, "epoch": 2664} {"train_loss": -23.857715606689453, "global_step": 221124, "epoch": 2664} {"train_loss": -24.073740005493164, "global_step": 221125, "epoch": 2664} {"train_loss": -24.326091766357422, "global_step": 221126, "epoch": 2664} {"train_loss": -23.772790908813477, "global_step": 221127, "epoch": 2664} {"train_loss": -24.08347511291504, "global_step": 221128, "epoch": 2664} {"train_loss": -24.222002029418945, "global_step": 221129, "epoch": 2664} {"train_loss": -24.36968994140625, "global_step": 221130, "epoch": 2664} {"train_loss": -24.16290855407715, "global_step": 221131, "epoch": 2664} {"train_loss": -24.17011833190918, "global_step": 221132, "epoch": 2664} {"train_loss": -24.28038787841797, "global_step": 221133, "epoch": 2664} {"train_loss": -24.587308883666992, "global_step": 221134, "epoch": 2664} {"train_loss": -24.26750373840332, "global_step": 221135, "epoch": 2664} {"train_loss": -24.527538299560547, "global_step": 221136, "epoch": 2664} {"train_loss": -24.397050857543945, "global_step": 221137, "epoch": 2664} {"train_loss": -24.477148056030273, "global_step": 221138, "epoch": 2664} {"train_loss": -24.419950485229492, "global_step": 221139, "epoch": 2664} {"train_loss": -24.277196884155273, "global_step": 221140, "epoch": 2664} {"train_loss": -24.28507423400879, "global_step": 221141, "epoch": 2664} {"train_loss": -24.6531925201416, "global_step": 221142, "epoch": 2664} {"train_loss": -24.77277946472168, "global_step": 221143, "epoch": 2664} {"train_loss": -24.734207153320312, "global_step": 221144, "epoch": 2664} {"train_loss": -24.441823959350586, "global_step": 221145, "epoch": 2664} {"train_loss": -24.6109561920166, "global_step": 221146, "epoch": 2664} {"train_loss": -24.84014320373535, "global_step": 221147, "epoch": 2664} {"train_loss": -24.855371475219727, "global_step": 221148, "epoch": 2664} {"train_loss": -24.516895294189453, "global_step": 221149, "epoch": 2664} {"train_loss": -24.46918296813965, "global_step": 221150, "epoch": 2664} {"train_loss": -24.641939163208008, "global_step": 221151, "epoch": 2664} {"train_loss": -24.741708755493164, "global_step": 221152, "epoch": 2664} {"train_loss": -24.90829849243164, "global_step": 221153, "epoch": 2664} {"train_loss": -24.477476119995117, "global_step": 221154, "epoch": 2664} {"train_loss": -24.359146118164062, "global_step": 221155, "epoch": 2664} {"train_loss": -24.999116897583008, "global_step": 221156, "epoch": 2664} {"train_loss": -24.497364044189453, "global_step": 221157, "epoch": 2664} {"train_loss": -24.78706169128418, "global_step": 221158, "epoch": 2664} {"train_loss": -24.38129997253418, "global_step": 221159, "epoch": 2664} {"train_loss": -23.988508224487305, "global_step": 221160, "epoch": 2664} {"train_loss": -25.088804244995117, "global_step": 221161, "epoch": 2664} {"train_loss": -24.558183670043945, "global_step": 221162, "epoch": 2664} {"train_loss": -24.126352310180664, "global_step": 221163, "epoch": 2664} {"train_loss": -23.936521530151367, "global_step": 221164, "epoch": 2664} {"train_loss": -24.25792121887207, "global_step": 221165, "epoch": 2664} {"train_loss": -24.249101638793945, "global_step": 221166, "epoch": 2664} {"train_loss": -24.250450134277344, "global_step": 221167, "epoch": 2664} {"train_loss": -24.304492950439453, "global_step": 221168, "epoch": 2664} {"train_loss": -24.03870964050293, "global_step": 221169, "epoch": 2664} {"train_loss": -24.31441879272461, "global_step": 221170, "epoch": 2664} {"train_loss": -24.575546264648438, "global_step": 221171, "epoch": 2664} {"train_loss": -24.763628005981445, "global_step": 221172, "epoch": 2664} {"train_loss": -24.48321533203125, "global_step": 221173, "epoch": 2664} {"train_loss": -24.91472625732422, "global_step": 221174, "epoch": 2664} {"train_loss": -24.53238296508789, "global_step": 221175, "epoch": 2664} {"train_loss": -24.467819213867188, "global_step": 221176, "epoch": 2664} {"train_loss": -24.45928955078125, "global_step": 221177, "epoch": 2664} {"train_loss": -24.64356231689453, "global_step": 221178, "epoch": 2664} {"train_loss": -24.81538200378418, "global_step": 221179, "epoch": 2664} {"train_loss": -24.738691329956055, "global_step": 221180, "epoch": 2664} {"train_loss": -24.220727920532227, "global_step": 221181, "epoch": 2664} {"train_loss": -24.64769744873047, "global_step": 221182, "epoch": 2664} {"train_loss": -24.76128578186035, "global_step": 221183, "epoch": 2664} {"train_loss": -24.731443405151367, "global_step": 221184, "epoch": 2664} {"train_loss": -24.710987091064453, "global_step": 221185, "epoch": 2664} {"train_loss": -24.400981903076172, "global_step": 221186, "epoch": 2664} {"train_loss": -24.49639129638672, "global_step": 221187, "epoch": 2664} {"train_loss": -24.736906051635742, "global_step": 221188, "epoch": 2664} {"train_loss": -24.733638763427734, "global_step": 221189, "epoch": 2664} {"train_loss": -24.89214324951172, "global_step": 221190, "epoch": 2664} {"train_loss": -24.916412353515625, "global_step": 221191, "epoch": 2664} {"train_loss": -24.653064727783203, "global_step": 221192, "epoch": 2664} {"train_loss": -24.482803344726562, "global_step": 221193, "epoch": 2664} {"train_loss": -24.396645856190876, "global_step": 221194, "epoch": 2664, "val_loss": 6619802.0} {"train_loss": -24.195627212524414, "global_step": 221195, "epoch": 2665} {"train_loss": -24.60593605041504, "global_step": 221196, "epoch": 2665} {"train_loss": -24.436582565307617, "global_step": 221197, "epoch": 2665} {"train_loss": -24.2595157623291, "global_step": 221198, "epoch": 2665} {"train_loss": -24.17390251159668, "global_step": 221199, "epoch": 2665} {"train_loss": -24.017526626586914, "global_step": 221200, "epoch": 2665} {"train_loss": -24.128522872924805, "global_step": 221201, "epoch": 2665} {"train_loss": -24.246906280517578, "global_step": 221202, "epoch": 2665} {"train_loss": -24.383075714111328, "global_step": 221203, "epoch": 2665} {"train_loss": -24.645849227905273, "global_step": 221204, "epoch": 2665} {"train_loss": -24.237401962280273, "global_step": 221205, "epoch": 2665} {"train_loss": -24.31963539123535, "global_step": 221206, "epoch": 2665} {"train_loss": -24.654706954956055, "global_step": 221207, "epoch": 2665} {"train_loss": -24.64051628112793, "global_step": 221208, "epoch": 2665} {"train_loss": -24.579919815063477, "global_step": 221209, "epoch": 2665} {"train_loss": -24.658924102783203, "global_step": 221210, "epoch": 2665} {"train_loss": -24.305835723876953, "global_step": 221211, "epoch": 2665} {"train_loss": -24.2105770111084, "global_step": 221212, "epoch": 2665} {"train_loss": -24.47490882873535, "global_step": 221213, "epoch": 2665} {"train_loss": -24.32429313659668, "global_step": 221214, "epoch": 2665} {"train_loss": -24.456907272338867, "global_step": 221215, "epoch": 2665} {"train_loss": -24.365177154541016, "global_step": 221216, "epoch": 2665} {"train_loss": -24.49993324279785, "global_step": 221217, "epoch": 2665} {"train_loss": -24.578161239624023, "global_step": 221218, "epoch": 2665} {"train_loss": -24.485504150390625, "global_step": 221219, "epoch": 2665} {"train_loss": -24.45479393005371, "global_step": 221220, "epoch": 2665} {"train_loss": -24.13583755493164, "global_step": 221221, "epoch": 2665} {"train_loss": -24.221176147460938, "global_step": 221222, "epoch": 2665} {"train_loss": -24.646223068237305, "global_step": 221223, "epoch": 2665} {"train_loss": -24.654367446899414, "global_step": 221224, "epoch": 2665} {"train_loss": -24.603670120239258, "global_step": 221225, "epoch": 2665} {"train_loss": -24.407676696777344, "global_step": 221226, "epoch": 2665} {"train_loss": -24.625329971313477, "global_step": 221227, "epoch": 2665} {"train_loss": -24.432077407836914, "global_step": 221228, "epoch": 2665} {"train_loss": -24.503999710083008, "global_step": 221229, "epoch": 2665} {"train_loss": -24.70035171508789, "global_step": 221230, "epoch": 2665} {"train_loss": -24.49822998046875, "global_step": 221231, "epoch": 2665} {"train_loss": -24.342660903930664, "global_step": 221232, "epoch": 2665} {"train_loss": -24.532312393188477, "global_step": 221233, "epoch": 2665} {"train_loss": -24.475027084350586, "global_step": 221234, "epoch": 2665} {"train_loss": -24.6895809173584, "global_step": 221235, "epoch": 2665} {"train_loss": -24.236291885375977, "global_step": 221236, "epoch": 2665} {"train_loss": -24.679136276245117, "global_step": 221237, "epoch": 2665} {"train_loss": -24.808584213256836, "global_step": 221238, "epoch": 2665} {"train_loss": -24.645893096923828, "global_step": 221239, "epoch": 2665} {"train_loss": -24.868087768554688, "global_step": 221240, "epoch": 2665} {"train_loss": -24.489410400390625, "global_step": 221241, "epoch": 2665} {"train_loss": -24.8812313079834, "global_step": 221242, "epoch": 2665} {"train_loss": -24.538488388061523, "global_step": 221243, "epoch": 2665} {"train_loss": -24.700366973876953, "global_step": 221244, "epoch": 2665} {"train_loss": -24.59265899658203, "global_step": 221245, "epoch": 2665} {"train_loss": -25.11941909790039, "global_step": 221246, "epoch": 2665} {"train_loss": -24.5306396484375, "global_step": 221247, "epoch": 2665} {"train_loss": -24.4354305267334, "global_step": 221248, "epoch": 2665} {"train_loss": -24.533905029296875, "global_step": 221249, "epoch": 2665} {"train_loss": -24.518949508666992, "global_step": 221250, "epoch": 2665} {"train_loss": -24.516611099243164, "global_step": 221251, "epoch": 2665} {"train_loss": -24.58670997619629, "global_step": 221252, "epoch": 2665} {"train_loss": -24.725980758666992, "global_step": 221253, "epoch": 2665} {"train_loss": -24.6463680267334, "global_step": 221254, "epoch": 2665} {"train_loss": -24.75380516052246, "global_step": 221255, "epoch": 2665} {"train_loss": -24.59905433654785, "global_step": 221256, "epoch": 2665} {"train_loss": -24.779666900634766, "global_step": 221257, "epoch": 2665} {"train_loss": -24.69721794128418, "global_step": 221258, "epoch": 2665} {"train_loss": -24.50270652770996, "global_step": 221259, "epoch": 2665} {"train_loss": -24.754173278808594, "global_step": 221260, "epoch": 2665} {"train_loss": -24.53264808654785, "global_step": 221261, "epoch": 2665} {"train_loss": -24.6774959564209, "global_step": 221262, "epoch": 2665} {"train_loss": -24.75043296813965, "global_step": 221263, "epoch": 2665} {"train_loss": -24.505062103271484, "global_step": 221264, "epoch": 2665} {"train_loss": -24.458723068237305, "global_step": 221265, "epoch": 2665} {"train_loss": -24.83510971069336, "global_step": 221266, "epoch": 2665} {"train_loss": -24.607736587524414, "global_step": 221267, "epoch": 2665} {"train_loss": -24.169721603393555, "global_step": 221268, "epoch": 2665} {"train_loss": -24.282543182373047, "global_step": 221269, "epoch": 2665} {"train_loss": -24.06167221069336, "global_step": 221270, "epoch": 2665} {"train_loss": -24.132984161376953, "global_step": 221271, "epoch": 2665} {"train_loss": -24.824565887451172, "global_step": 221272, "epoch": 2665} {"train_loss": -24.636423110961914, "global_step": 221273, "epoch": 2665} {"train_loss": -24.413898468017578, "global_step": 221274, "epoch": 2665} {"train_loss": -24.52661895751953, "global_step": 221275, "epoch": 2665} {"train_loss": -24.450159072875977, "global_step": 221276, "epoch": 2665} {"train_loss": -24.490787115441748, "global_step": 221277, "epoch": 2665, "val_loss": 6742800.0} {"train_loss": -24.81525993347168, "global_step": 221278, "epoch": 2666} {"train_loss": -24.279647827148438, "global_step": 221279, "epoch": 2666} {"train_loss": -24.735746383666992, "global_step": 221280, "epoch": 2666} {"train_loss": -24.12837028503418, "global_step": 221281, "epoch": 2666} {"train_loss": -24.32978630065918, "global_step": 221282, "epoch": 2666} {"train_loss": -24.604084014892578, "global_step": 221283, "epoch": 2666} {"train_loss": -24.591079711914062, "global_step": 221284, "epoch": 2666} {"train_loss": -24.17432975769043, "global_step": 221285, "epoch": 2666} {"train_loss": -24.630212783813477, "global_step": 221286, "epoch": 2666} {"train_loss": -24.756122589111328, "global_step": 221287, "epoch": 2666} {"train_loss": -24.45501708984375, "global_step": 221288, "epoch": 2666} {"train_loss": -24.4580135345459, "global_step": 221289, "epoch": 2666} {"train_loss": -24.531883239746094, "global_step": 221290, "epoch": 2666} {"train_loss": -24.634912490844727, "global_step": 221291, "epoch": 2666} {"train_loss": -24.21160316467285, "global_step": 221292, "epoch": 2666} {"train_loss": -24.574384689331055, "global_step": 221293, "epoch": 2666} {"train_loss": -24.45575523376465, "global_step": 221294, "epoch": 2666} {"train_loss": -24.375417709350586, "global_step": 221295, "epoch": 2666} {"train_loss": -24.589813232421875, "global_step": 221296, "epoch": 2666} {"train_loss": -24.886188507080078, "global_step": 221297, "epoch": 2666} {"train_loss": -24.79228973388672, "global_step": 221298, "epoch": 2666} {"train_loss": -24.595748901367188, "global_step": 221299, "epoch": 2666} {"train_loss": -24.47870445251465, "global_step": 221300, "epoch": 2666} {"train_loss": -24.679847717285156, "global_step": 221301, "epoch": 2666} {"train_loss": -24.725902557373047, "global_step": 221302, "epoch": 2666} {"train_loss": -24.613000869750977, "global_step": 221303, "epoch": 2666} {"train_loss": -24.849721908569336, "global_step": 221304, "epoch": 2666} {"train_loss": -24.937952041625977, "global_step": 221305, "epoch": 2666} {"train_loss": -24.567218780517578, "global_step": 221306, "epoch": 2666} {"train_loss": -25.00959587097168, "global_step": 221307, "epoch": 2666} {"train_loss": -24.532867431640625, "global_step": 221308, "epoch": 2666} {"train_loss": -24.43900489807129, "global_step": 221309, "epoch": 2666} {"train_loss": -24.747129440307617, "global_step": 221310, "epoch": 2666} {"train_loss": -24.839599609375, "global_step": 221311, "epoch": 2666} {"train_loss": -24.70318031311035, "global_step": 221312, "epoch": 2666} {"train_loss": -24.463735580444336, "global_step": 221313, "epoch": 2666} {"train_loss": -24.692150115966797, "global_step": 221314, "epoch": 2666} {"train_loss": -25.077322006225586, "global_step": 221315, "epoch": 2666} {"train_loss": -24.800390243530273, "global_step": 221316, "epoch": 2666} {"train_loss": -24.588348388671875, "global_step": 221317, "epoch": 2666} {"train_loss": -24.86614227294922, "global_step": 221318, "epoch": 2666} {"train_loss": -24.726730346679688, "global_step": 221319, "epoch": 2666} {"train_loss": -24.860342025756836, "global_step": 221320, "epoch": 2666} {"train_loss": -24.436569213867188, "global_step": 221321, "epoch": 2666} {"train_loss": -25.220788955688477, "global_step": 221322, "epoch": 2666} {"train_loss": -24.895435333251953, "global_step": 221323, "epoch": 2666} {"train_loss": -24.67132568359375, "global_step": 221324, "epoch": 2666} {"train_loss": -24.788436889648438, "global_step": 221325, "epoch": 2666} {"train_loss": -24.473119735717773, "global_step": 221326, "epoch": 2666} {"train_loss": -24.468807220458984, "global_step": 221327, "epoch": 2666} {"train_loss": -24.372400283813477, "global_step": 221328, "epoch": 2666} {"train_loss": -24.738882064819336, "global_step": 221329, "epoch": 2666} {"train_loss": -24.9243106842041, "global_step": 221330, "epoch": 2666} {"train_loss": -24.170637130737305, "global_step": 221331, "epoch": 2666} {"train_loss": -24.39817237854004, "global_step": 221332, "epoch": 2666} {"train_loss": -23.514657974243164, "global_step": 221333, "epoch": 2666} {"train_loss": -23.721487045288086, "global_step": 221334, "epoch": 2666} {"train_loss": -23.891586303710938, "global_step": 221335, "epoch": 2666} {"train_loss": -24.167356491088867, "global_step": 221336, "epoch": 2666} {"train_loss": -24.06180763244629, "global_step": 221337, "epoch": 2666} {"train_loss": -23.331388473510742, "global_step": 221338, "epoch": 2666} {"train_loss": -24.172378540039062, "global_step": 221339, "epoch": 2666} {"train_loss": -23.87678337097168, "global_step": 221340, "epoch": 2666} {"train_loss": -23.991174697875977, "global_step": 221341, "epoch": 2666} {"train_loss": -23.86368179321289, "global_step": 221342, "epoch": 2666} {"train_loss": -24.23383140563965, "global_step": 221343, "epoch": 2666} {"train_loss": -24.163991928100586, "global_step": 221344, "epoch": 2666} {"train_loss": -23.866853713989258, "global_step": 221345, "epoch": 2666} {"train_loss": -24.4707088470459, "global_step": 221346, "epoch": 2666} {"train_loss": -24.246503829956055, "global_step": 221347, "epoch": 2666} {"train_loss": -24.328460693359375, "global_step": 221348, "epoch": 2666} {"train_loss": -24.33885383605957, "global_step": 221349, "epoch": 2666} {"train_loss": -24.278656005859375, "global_step": 221350, "epoch": 2666} {"train_loss": -24.31790542602539, "global_step": 221351, "epoch": 2666} {"train_loss": -24.410655975341797, "global_step": 221352, "epoch": 2666} {"train_loss": -24.047117233276367, "global_step": 221353, "epoch": 2666} {"train_loss": -24.274206161499023, "global_step": 221354, "epoch": 2666} {"train_loss": -24.39173698425293, "global_step": 221355, "epoch": 2666} {"train_loss": -24.459217071533203, "global_step": 221356, "epoch": 2666} {"train_loss": -24.963048934936523, "global_step": 221357, "epoch": 2666} {"train_loss": -24.09209632873535, "global_step": 221358, "epoch": 2666} {"train_loss": -24.535303115844727, "global_step": 221359, "epoch": 2666} {"train_loss": -24.46739973504859, "global_step": 221360, "epoch": 2666, "val_loss": 6671934.0} {"train_loss": -23.894962310791016, "global_step": 221361, "epoch": 2667} {"train_loss": -24.389198303222656, "global_step": 221362, "epoch": 2667} {"train_loss": -23.980619430541992, "global_step": 221363, "epoch": 2667} {"train_loss": -24.47205924987793, "global_step": 221364, "epoch": 2667} {"train_loss": -24.541677474975586, "global_step": 221365, "epoch": 2667} {"train_loss": -24.45680809020996, "global_step": 221366, "epoch": 2667} {"train_loss": -24.210742950439453, "global_step": 221367, "epoch": 2667} {"train_loss": -24.336156845092773, "global_step": 221368, "epoch": 2667} {"train_loss": -24.099531173706055, "global_step": 221369, "epoch": 2667} {"train_loss": -23.995458602905273, "global_step": 221370, "epoch": 2667} {"train_loss": -24.666776657104492, "global_step": 221371, "epoch": 2667} {"train_loss": -23.915260314941406, "global_step": 221372, "epoch": 2667} {"train_loss": -24.597049713134766, "global_step": 221373, "epoch": 2667} {"train_loss": -24.374425888061523, "global_step": 221374, "epoch": 2667} {"train_loss": -24.185832977294922, "global_step": 221375, "epoch": 2667} {"train_loss": -24.727994918823242, "global_step": 221376, "epoch": 2667} {"train_loss": -23.89190673828125, "global_step": 221377, "epoch": 2667} {"train_loss": -24.470500946044922, "global_step": 221378, "epoch": 2667} {"train_loss": -23.97995948791504, "global_step": 221379, "epoch": 2667} {"train_loss": -24.38275718688965, "global_step": 221380, "epoch": 2667} {"train_loss": -24.39991569519043, "global_step": 221381, "epoch": 2667} {"train_loss": -24.357681274414062, "global_step": 221382, "epoch": 2667} {"train_loss": -24.671524047851562, "global_step": 221383, "epoch": 2667} {"train_loss": -24.53765296936035, "global_step": 221384, "epoch": 2667} {"train_loss": -24.79477882385254, "global_step": 221385, "epoch": 2667} {"train_loss": -24.7806396484375, "global_step": 221386, "epoch": 2667} {"train_loss": -24.835309982299805, "global_step": 221387, "epoch": 2667} {"train_loss": -24.878984451293945, "global_step": 221388, "epoch": 2667} {"train_loss": -24.72212791442871, "global_step": 221389, "epoch": 2667} {"train_loss": -24.78499412536621, "global_step": 221390, "epoch": 2667} {"train_loss": -24.483501434326172, "global_step": 221391, "epoch": 2667} {"train_loss": -24.767980575561523, "global_step": 221392, "epoch": 2667} {"train_loss": -24.658477783203125, "global_step": 221393, "epoch": 2667} {"train_loss": -24.774248123168945, "global_step": 221394, "epoch": 2667} {"train_loss": -24.861242294311523, "global_step": 221395, "epoch": 2667} {"train_loss": -24.23700523376465, "global_step": 221396, "epoch": 2667} {"train_loss": -24.49882698059082, "global_step": 221397, "epoch": 2667} {"train_loss": -24.602191925048828, "global_step": 221398, "epoch": 2667} {"train_loss": -24.68703842163086, "global_step": 221399, "epoch": 2667} {"train_loss": -24.406129837036133, "global_step": 221400, "epoch": 2667} {"train_loss": -24.56318473815918, "global_step": 221401, "epoch": 2667} {"train_loss": -24.555601119995117, "global_step": 221402, "epoch": 2667} {"train_loss": -24.4867000579834, "global_step": 221403, "epoch": 2667} {"train_loss": -24.619686126708984, "global_step": 221404, "epoch": 2667} {"train_loss": -24.882455825805664, "global_step": 221405, "epoch": 2667} {"train_loss": -24.68060874938965, "global_step": 221406, "epoch": 2667} {"train_loss": -24.732715606689453, "global_step": 221407, "epoch": 2667} {"train_loss": -24.889936447143555, "global_step": 221408, "epoch": 2667} {"train_loss": -24.552988052368164, "global_step": 221409, "epoch": 2667} {"train_loss": -24.83661460876465, "global_step": 221410, "epoch": 2667} {"train_loss": -24.352941513061523, "global_step": 221411, "epoch": 2667} {"train_loss": -24.13990592956543, "global_step": 221412, "epoch": 2667} {"train_loss": -24.476613998413086, "global_step": 221413, "epoch": 2667} {"train_loss": -24.758665084838867, "global_step": 221414, "epoch": 2667} {"train_loss": -24.879785537719727, "global_step": 221415, "epoch": 2667} {"train_loss": -24.43476676940918, "global_step": 221416, "epoch": 2667} {"train_loss": -24.726728439331055, "global_step": 221417, "epoch": 2667} {"train_loss": -24.679752349853516, "global_step": 221418, "epoch": 2667} {"train_loss": -24.838726043701172, "global_step": 221419, "epoch": 2667} {"train_loss": -24.67432975769043, "global_step": 221420, "epoch": 2667} {"train_loss": -24.45532989501953, "global_step": 221421, "epoch": 2667} {"train_loss": -24.53035545349121, "global_step": 221422, "epoch": 2667} {"train_loss": -24.59421157836914, "global_step": 221423, "epoch": 2667} {"train_loss": -24.68157958984375, "global_step": 221424, "epoch": 2667} {"train_loss": -24.423871994018555, "global_step": 221425, "epoch": 2667} {"train_loss": -24.344125747680664, "global_step": 221426, "epoch": 2667} {"train_loss": -24.18118667602539, "global_step": 221427, "epoch": 2667} {"train_loss": -24.445011138916016, "global_step": 221428, "epoch": 2667} {"train_loss": -24.72393035888672, "global_step": 221429, "epoch": 2667} {"train_loss": -24.78485107421875, "global_step": 221430, "epoch": 2667} {"train_loss": -24.31617546081543, "global_step": 221431, "epoch": 2667} {"train_loss": -24.7572021484375, "global_step": 221432, "epoch": 2667} {"train_loss": -24.38498878479004, "global_step": 221433, "epoch": 2667} {"train_loss": -24.44373893737793, "global_step": 221434, "epoch": 2667} {"train_loss": -24.733556747436523, "global_step": 221435, "epoch": 2667} {"train_loss": -24.843137741088867, "global_step": 221436, "epoch": 2667} {"train_loss": -24.549062728881836, "global_step": 221437, "epoch": 2667} {"train_loss": -24.29252052307129, "global_step": 221438, "epoch": 2667} {"train_loss": -24.704492568969727, "global_step": 221439, "epoch": 2667} {"train_loss": -24.641254425048828, "global_step": 221440, "epoch": 2667} {"train_loss": -24.24367332458496, "global_step": 221441, "epoch": 2667} {"train_loss": -24.664220809936523, "global_step": 221442, "epoch": 2667} {"train_loss": -24.521952112037017, "global_step": 221443, "epoch": 2667, "val_loss": 6717554.0} {"train_loss": -23.721405029296875, "global_step": 221444, "epoch": 2668} {"train_loss": -24.308549880981445, "global_step": 221445, "epoch": 2668} {"train_loss": -24.453969955444336, "global_step": 221446, "epoch": 2668} {"train_loss": -23.592710494995117, "global_step": 221447, "epoch": 2668} {"train_loss": -23.7266902923584, "global_step": 221448, "epoch": 2668} {"train_loss": -24.312057495117188, "global_step": 221449, "epoch": 2668} {"train_loss": -24.447784423828125, "global_step": 221450, "epoch": 2668} {"train_loss": -24.178258895874023, "global_step": 221451, "epoch": 2668} {"train_loss": -24.63185691833496, "global_step": 221452, "epoch": 2668} {"train_loss": -24.504865646362305, "global_step": 221453, "epoch": 2668} {"train_loss": -24.51059341430664, "global_step": 221454, "epoch": 2668} {"train_loss": -24.701398849487305, "global_step": 221455, "epoch": 2668} {"train_loss": -24.1343936920166, "global_step": 221456, "epoch": 2668} {"train_loss": -24.312564849853516, "global_step": 221457, "epoch": 2668} {"train_loss": -24.139991760253906, "global_step": 221458, "epoch": 2668} {"train_loss": -24.482580184936523, "global_step": 221459, "epoch": 2668} {"train_loss": -24.801198959350586, "global_step": 221460, "epoch": 2668} {"train_loss": -24.87503433227539, "global_step": 221461, "epoch": 2668} {"train_loss": -24.293188095092773, "global_step": 221462, "epoch": 2668} {"train_loss": -24.606943130493164, "global_step": 221463, "epoch": 2668} {"train_loss": -24.70305824279785, "global_step": 221464, "epoch": 2668} {"train_loss": -24.976675033569336, "global_step": 221465, "epoch": 2668} {"train_loss": -24.641111373901367, "global_step": 221466, "epoch": 2668} {"train_loss": -24.495712280273438, "global_step": 221467, "epoch": 2668} {"train_loss": -24.388635635375977, "global_step": 221468, "epoch": 2668} {"train_loss": -24.922117233276367, "global_step": 221469, "epoch": 2668} {"train_loss": -25.01430320739746, "global_step": 221470, "epoch": 2668} {"train_loss": -24.763914108276367, "global_step": 221471, "epoch": 2668} {"train_loss": -24.930988311767578, "global_step": 221472, "epoch": 2668} {"train_loss": -24.845022201538086, "global_step": 221473, "epoch": 2668} {"train_loss": -24.840545654296875, "global_step": 221474, "epoch": 2668} {"train_loss": -24.40505027770996, "global_step": 221475, "epoch": 2668} {"train_loss": -24.69074821472168, "global_step": 221476, "epoch": 2668} {"train_loss": -24.728729248046875, "global_step": 221477, "epoch": 2668} {"train_loss": -24.73941421508789, "global_step": 221478, "epoch": 2668} {"train_loss": -24.7005615234375, "global_step": 221479, "epoch": 2668} {"train_loss": -24.952417373657227, "global_step": 221480, "epoch": 2668} {"train_loss": -24.89824867248535, "global_step": 221481, "epoch": 2668} {"train_loss": -24.8625431060791, "global_step": 221482, "epoch": 2668} {"train_loss": -24.719308853149414, "global_step": 221483, "epoch": 2668} {"train_loss": -24.917966842651367, "global_step": 221484, "epoch": 2668} {"train_loss": -24.782957077026367, "global_step": 221485, "epoch": 2668} {"train_loss": -24.400741577148438, "global_step": 221486, "epoch": 2668} {"train_loss": -24.546512603759766, "global_step": 221487, "epoch": 2668} {"train_loss": -25.00737190246582, "global_step": 221488, "epoch": 2668} {"train_loss": -24.761829376220703, "global_step": 221489, "epoch": 2668} {"train_loss": -24.539213180541992, "global_step": 221490, "epoch": 2668} {"train_loss": -24.4979305267334, "global_step": 221491, "epoch": 2668} {"train_loss": -24.50027847290039, "global_step": 221492, "epoch": 2668} {"train_loss": -24.601743698120117, "global_step": 221493, "epoch": 2668} {"train_loss": -24.399850845336914, "global_step": 221494, "epoch": 2668} {"train_loss": -24.4598331451416, "global_step": 221495, "epoch": 2668} {"train_loss": -24.397830963134766, "global_step": 221496, "epoch": 2668} {"train_loss": -24.886701583862305, "global_step": 221497, "epoch": 2668} {"train_loss": -24.34185028076172, "global_step": 221498, "epoch": 2668} {"train_loss": -24.55671501159668, "global_step": 221499, "epoch": 2668} {"train_loss": -24.570158004760742, "global_step": 221500, "epoch": 2668} {"train_loss": -24.900127410888672, "global_step": 221501, "epoch": 2668} {"train_loss": -24.12581443786621, "global_step": 221502, "epoch": 2668} {"train_loss": -24.69344139099121, "global_step": 221503, "epoch": 2668} {"train_loss": -24.400531768798828, "global_step": 221504, "epoch": 2668} {"train_loss": -24.65213966369629, "global_step": 221505, "epoch": 2668} {"train_loss": -24.483264923095703, "global_step": 221506, "epoch": 2668} {"train_loss": -24.661436080932617, "global_step": 221507, "epoch": 2668} {"train_loss": -24.482582092285156, "global_step": 221508, "epoch": 2668} {"train_loss": -24.689977645874023, "global_step": 221509, "epoch": 2668} {"train_loss": -24.61949920654297, "global_step": 221510, "epoch": 2668} {"train_loss": -24.769123077392578, "global_step": 221511, "epoch": 2668} {"train_loss": -24.5600643157959, "global_step": 221512, "epoch": 2668} {"train_loss": -24.52577018737793, "global_step": 221513, "epoch": 2668} {"train_loss": -24.896894454956055, "global_step": 221514, "epoch": 2668} {"train_loss": -24.458999633789062, "global_step": 221515, "epoch": 2668} {"train_loss": -24.39987564086914, "global_step": 221516, "epoch": 2668} {"train_loss": -24.540563583374023, "global_step": 221517, "epoch": 2668} {"train_loss": -24.48213768005371, "global_step": 221518, "epoch": 2668} {"train_loss": -24.534896850585938, "global_step": 221519, "epoch": 2668} {"train_loss": -24.64211082458496, "global_step": 221520, "epoch": 2668} {"train_loss": -24.430116653442383, "global_step": 221521, "epoch": 2668} {"train_loss": -24.62894630432129, "global_step": 221522, "epoch": 2668} {"train_loss": -24.58807945251465, "global_step": 221523, "epoch": 2668} {"train_loss": -24.380136489868164, "global_step": 221524, "epoch": 2668} {"train_loss": -24.46685218811035, "global_step": 221525, "epoch": 2668} {"train_loss": -24.578055347304748, "global_step": 221526, "epoch": 2668, "val_loss": 6824813.0} {"train_loss": -24.105823516845703, "global_step": 221527, "epoch": 2669} {"train_loss": -24.050518035888672, "global_step": 221528, "epoch": 2669} {"train_loss": -24.103717803955078, "global_step": 221529, "epoch": 2669} {"train_loss": -23.766881942749023, "global_step": 221530, "epoch": 2669} {"train_loss": -24.40707778930664, "global_step": 221531, "epoch": 2669} {"train_loss": -24.484464645385742, "global_step": 221532, "epoch": 2669} {"train_loss": -24.42917823791504, "global_step": 221533, "epoch": 2669} {"train_loss": -24.549802780151367, "global_step": 221534, "epoch": 2669} {"train_loss": -24.450824737548828, "global_step": 221535, "epoch": 2669} {"train_loss": -24.49630355834961, "global_step": 221536, "epoch": 2669} {"train_loss": -24.064260482788086, "global_step": 221537, "epoch": 2669} {"train_loss": -24.200149536132812, "global_step": 221538, "epoch": 2669} {"train_loss": -24.138652801513672, "global_step": 221539, "epoch": 2669} {"train_loss": -24.536855697631836, "global_step": 221540, "epoch": 2669} {"train_loss": -24.29524803161621, "global_step": 221541, "epoch": 2669} {"train_loss": -24.626522064208984, "global_step": 221542, "epoch": 2669} {"train_loss": -24.292158126831055, "global_step": 221543, "epoch": 2669} {"train_loss": -24.564334869384766, "global_step": 221544, "epoch": 2669} {"train_loss": -24.47629737854004, "global_step": 221545, "epoch": 2669} {"train_loss": -24.397550582885742, "global_step": 221546, "epoch": 2669} {"train_loss": -24.757694244384766, "global_step": 221547, "epoch": 2669} {"train_loss": -24.67049217224121, "global_step": 221548, "epoch": 2669} {"train_loss": -24.461633682250977, "global_step": 221549, "epoch": 2669} {"train_loss": -24.44218635559082, "global_step": 221550, "epoch": 2669} {"train_loss": -24.652406692504883, "global_step": 221551, "epoch": 2669} {"train_loss": -24.6588134765625, "global_step": 221552, "epoch": 2669} {"train_loss": -24.577730178833008, "global_step": 221553, "epoch": 2669} {"train_loss": -24.6810302734375, "global_step": 221554, "epoch": 2669} {"train_loss": -24.44529151916504, "global_step": 221555, "epoch": 2669} {"train_loss": -24.63749885559082, "global_step": 221556, "epoch": 2669} {"train_loss": -24.584970474243164, "global_step": 221557, "epoch": 2669} {"train_loss": -24.911334991455078, "global_step": 221558, "epoch": 2669} {"train_loss": -24.654645919799805, "global_step": 221559, "epoch": 2669} {"train_loss": -24.889867782592773, "global_step": 221560, "epoch": 2669} {"train_loss": -24.521345138549805, "global_step": 221561, "epoch": 2669} {"train_loss": -24.6485652923584, "global_step": 221562, "epoch": 2669} {"train_loss": -24.318532943725586, "global_step": 221563, "epoch": 2669} {"train_loss": -24.773609161376953, "global_step": 221564, "epoch": 2669} {"train_loss": -24.922882080078125, "global_step": 221565, "epoch": 2669} {"train_loss": -24.607969284057617, "global_step": 221566, "epoch": 2669} {"train_loss": -24.302949905395508, "global_step": 221567, "epoch": 2669} {"train_loss": -24.381853103637695, "global_step": 221568, "epoch": 2669} {"train_loss": -24.775970458984375, "global_step": 221569, "epoch": 2669} {"train_loss": -24.098796844482422, "global_step": 221570, "epoch": 2669} {"train_loss": -24.49455451965332, "global_step": 221571, "epoch": 2669} {"train_loss": -24.47684097290039, "global_step": 221572, "epoch": 2669} {"train_loss": -24.44556999206543, "global_step": 221573, "epoch": 2669} {"train_loss": -24.426218032836914, "global_step": 221574, "epoch": 2669} {"train_loss": -24.79336929321289, "global_step": 221575, "epoch": 2669} {"train_loss": -25.004009246826172, "global_step": 221576, "epoch": 2669} {"train_loss": -24.727354049682617, "global_step": 221577, "epoch": 2669} {"train_loss": -25.03839683532715, "global_step": 221578, "epoch": 2669} {"train_loss": -24.891050338745117, "global_step": 221579, "epoch": 2669} {"train_loss": -24.4796085357666, "global_step": 221580, "epoch": 2669} {"train_loss": -24.50348472595215, "global_step": 221581, "epoch": 2669} {"train_loss": -24.749469757080078, "global_step": 221582, "epoch": 2669} {"train_loss": -24.921154022216797, "global_step": 221583, "epoch": 2669} {"train_loss": -24.460081100463867, "global_step": 221584, "epoch": 2669} {"train_loss": -24.6875, "global_step": 221585, "epoch": 2669} {"train_loss": -24.475439071655273, "global_step": 221586, "epoch": 2669} {"train_loss": -24.555707931518555, "global_step": 221587, "epoch": 2669} {"train_loss": -24.950836181640625, "global_step": 221588, "epoch": 2669} {"train_loss": -24.74527931213379, "global_step": 221589, "epoch": 2669} {"train_loss": -24.5119571685791, "global_step": 221590, "epoch": 2669} {"train_loss": -24.744962692260742, "global_step": 221591, "epoch": 2669} {"train_loss": -24.893972396850586, "global_step": 221592, "epoch": 2669} {"train_loss": -24.668384552001953, "global_step": 221593, "epoch": 2669} {"train_loss": -24.953712463378906, "global_step": 221594, "epoch": 2669} {"train_loss": -24.50309181213379, "global_step": 221595, "epoch": 2669} {"train_loss": -24.666528701782227, "global_step": 221596, "epoch": 2669} {"train_loss": -24.486669540405273, "global_step": 221597, "epoch": 2669} {"train_loss": -24.955785751342773, "global_step": 221598, "epoch": 2669} {"train_loss": -24.53922462463379, "global_step": 221599, "epoch": 2669} {"train_loss": -24.670190811157227, "global_step": 221600, "epoch": 2669} {"train_loss": -24.40042495727539, "global_step": 221601, "epoch": 2669} {"train_loss": -24.6241512298584, "global_step": 221602, "epoch": 2669} {"train_loss": -24.34914207458496, "global_step": 221603, "epoch": 2669} {"train_loss": -24.951635360717773, "global_step": 221604, "epoch": 2669} {"train_loss": -24.715229034423828, "global_step": 221605, "epoch": 2669} {"train_loss": -24.60905647277832, "global_step": 221606, "epoch": 2669} {"train_loss": -24.489877700805664, "global_step": 221607, "epoch": 2669} {"train_loss": -24.779495239257812, "global_step": 221608, "epoch": 2669} {"train_loss": -24.553843417799616, "global_step": 221609, "epoch": 2669, "val_loss": 6736006.0} {"train_loss": -24.50526237487793, "global_step": 221610, "epoch": 2670} {"train_loss": -24.060598373413086, "global_step": 221611, "epoch": 2670} {"train_loss": -24.111536026000977, "global_step": 221612, "epoch": 2670} {"train_loss": -24.8209285736084, "global_step": 221613, "epoch": 2670} {"train_loss": -24.6649169921875, "global_step": 221614, "epoch": 2670} {"train_loss": -24.482154846191406, "global_step": 221615, "epoch": 2670} {"train_loss": -24.705486297607422, "global_step": 221616, "epoch": 2670} {"train_loss": -24.529346466064453, "global_step": 221617, "epoch": 2670} {"train_loss": -24.518774032592773, "global_step": 221618, "epoch": 2670} {"train_loss": -24.102989196777344, "global_step": 221619, "epoch": 2670} {"train_loss": -24.67626953125, "global_step": 221620, "epoch": 2670} {"train_loss": -24.499082565307617, "global_step": 221621, "epoch": 2670} {"train_loss": -24.69398307800293, "global_step": 221622, "epoch": 2670} {"train_loss": -24.606515884399414, "global_step": 221623, "epoch": 2670} {"train_loss": -24.876474380493164, "global_step": 221624, "epoch": 2670} {"train_loss": -24.691944122314453, "global_step": 221625, "epoch": 2670} {"train_loss": -24.62516975402832, "global_step": 221626, "epoch": 2670} {"train_loss": -24.585790634155273, "global_step": 221627, "epoch": 2670} {"train_loss": -24.49985122680664, "global_step": 221628, "epoch": 2670} {"train_loss": -24.79082679748535, "global_step": 221629, "epoch": 2670} {"train_loss": -24.52389907836914, "global_step": 221630, "epoch": 2670} {"train_loss": -24.85593032836914, "global_step": 221631, "epoch": 2670} {"train_loss": -24.8504581451416, "global_step": 221632, "epoch": 2670} {"train_loss": -24.404630661010742, "global_step": 221633, "epoch": 2670} {"train_loss": -24.485013961791992, "global_step": 221634, "epoch": 2670} {"train_loss": -24.57684898376465, "global_step": 221635, "epoch": 2670} {"train_loss": -24.928918838500977, "global_step": 221636, "epoch": 2670} {"train_loss": -24.399091720581055, "global_step": 221637, "epoch": 2670} {"train_loss": -24.880901336669922, "global_step": 221638, "epoch": 2670} {"train_loss": -24.752702713012695, "global_step": 221639, "epoch": 2670} {"train_loss": -24.12126350402832, "global_step": 221640, "epoch": 2670} {"train_loss": -24.660587310791016, "global_step": 221641, "epoch": 2670} {"train_loss": -24.611724853515625, "global_step": 221642, "epoch": 2670} {"train_loss": -24.70435333251953, "global_step": 221643, "epoch": 2670} {"train_loss": -24.51632308959961, "global_step": 221644, "epoch": 2670} {"train_loss": -24.530670166015625, "global_step": 221645, "epoch": 2670} {"train_loss": -24.5208683013916, "global_step": 221646, "epoch": 2670} {"train_loss": -24.7288875579834, "global_step": 221647, "epoch": 2670} {"train_loss": -24.970184326171875, "global_step": 221648, "epoch": 2670} {"train_loss": -24.799516677856445, "global_step": 221649, "epoch": 2670} {"train_loss": -24.55112075805664, "global_step": 221650, "epoch": 2670} {"train_loss": -24.943483352661133, "global_step": 221651, "epoch": 2670} {"train_loss": -24.45548439025879, "global_step": 221652, "epoch": 2670} {"train_loss": -24.52846908569336, "global_step": 221653, "epoch": 2670} {"train_loss": -24.599430084228516, "global_step": 221654, "epoch": 2670} {"train_loss": -24.802371978759766, "global_step": 221655, "epoch": 2670} {"train_loss": -24.95914649963379, "global_step": 221656, "epoch": 2670} {"train_loss": -24.646833419799805, "global_step": 221657, "epoch": 2670} {"train_loss": -24.97256088256836, "global_step": 221658, "epoch": 2670} {"train_loss": -24.68086051940918, "global_step": 221659, "epoch": 2670} {"train_loss": -24.716772079467773, "global_step": 221660, "epoch": 2670} {"train_loss": -24.49800682067871, "global_step": 221661, "epoch": 2670} {"train_loss": -24.017318725585938, "global_step": 221662, "epoch": 2670} {"train_loss": -23.967239379882812, "global_step": 221663, "epoch": 2670} {"train_loss": -24.138402938842773, "global_step": 221664, "epoch": 2670} {"train_loss": -24.819517135620117, "global_step": 221665, "epoch": 2670} {"train_loss": -24.185264587402344, "global_step": 221666, "epoch": 2670} {"train_loss": -24.473453521728516, "global_step": 221667, "epoch": 2670} {"train_loss": -24.686311721801758, "global_step": 221668, "epoch": 2670} {"train_loss": -24.80023193359375, "global_step": 221669, "epoch": 2670} {"train_loss": -24.41053581237793, "global_step": 221670, "epoch": 2670} {"train_loss": -25.06174659729004, "global_step": 221671, "epoch": 2670} {"train_loss": -24.393604278564453, "global_step": 221672, "epoch": 2670} {"train_loss": -24.696319580078125, "global_step": 221673, "epoch": 2670} {"train_loss": -24.52174186706543, "global_step": 221674, "epoch": 2670} {"train_loss": -24.79097557067871, "global_step": 221675, "epoch": 2670} {"train_loss": -24.657011032104492, "global_step": 221676, "epoch": 2670} {"train_loss": -24.443225860595703, "global_step": 221677, "epoch": 2670} {"train_loss": -24.803571701049805, "global_step": 221678, "epoch": 2670} {"train_loss": -24.610986709594727, "global_step": 221679, "epoch": 2670} {"train_loss": -24.9184513092041, "global_step": 221680, "epoch": 2670} {"train_loss": -24.5240535736084, "global_step": 221681, "epoch": 2670} {"train_loss": -24.386844635009766, "global_step": 221682, "epoch": 2670} {"train_loss": -24.394134521484375, "global_step": 221683, "epoch": 2670} {"train_loss": -24.80051612854004, "global_step": 221684, "epoch": 2670} {"train_loss": -24.876291275024414, "global_step": 221685, "epoch": 2670} {"train_loss": -24.406076431274414, "global_step": 221686, "epoch": 2670} {"train_loss": -24.920053482055664, "global_step": 221687, "epoch": 2670} {"train_loss": -24.885793685913086, "global_step": 221688, "epoch": 2670} {"train_loss": -24.198091506958008, "global_step": 221689, "epoch": 2670} {"train_loss": -24.507539749145508, "global_step": 221690, "epoch": 2670} {"train_loss": -25.059972763061523, "global_step": 221691, "epoch": 2670} {"train_loss": -24.617115939956115, "global_step": 221692, "epoch": 2670, "val_loss": 6701475.0} {"train_loss": -23.867441177368164, "global_step": 221693, "epoch": 2671} {"train_loss": -23.972564697265625, "global_step": 221694, "epoch": 2671} {"train_loss": -24.34906768798828, "global_step": 221695, "epoch": 2671} {"train_loss": -24.128934860229492, "global_step": 221696, "epoch": 2671} {"train_loss": -23.958820343017578, "global_step": 221697, "epoch": 2671} {"train_loss": -24.19268226623535, "global_step": 221698, "epoch": 2671} {"train_loss": -24.20633888244629, "global_step": 221699, "epoch": 2671} {"train_loss": -24.203792572021484, "global_step": 221700, "epoch": 2671} {"train_loss": -24.185134887695312, "global_step": 221701, "epoch": 2671} {"train_loss": -24.149185180664062, "global_step": 221702, "epoch": 2671} {"train_loss": -24.43149185180664, "global_step": 221703, "epoch": 2671} {"train_loss": -23.91775894165039, "global_step": 221704, "epoch": 2671} {"train_loss": -24.321470260620117, "global_step": 221705, "epoch": 2671} {"train_loss": -24.183422088623047, "global_step": 221706, "epoch": 2671} {"train_loss": -24.360584259033203, "global_step": 221707, "epoch": 2671} {"train_loss": -24.210922241210938, "global_step": 221708, "epoch": 2671} {"train_loss": -24.185461044311523, "global_step": 221709, "epoch": 2671} {"train_loss": -24.406965255737305, "global_step": 221710, "epoch": 2671} {"train_loss": -24.14579200744629, "global_step": 221711, "epoch": 2671} {"train_loss": -24.59429931640625, "global_step": 221712, "epoch": 2671} {"train_loss": -23.956298828125, "global_step": 221713, "epoch": 2671} {"train_loss": -24.399429321289062, "global_step": 221714, "epoch": 2671} {"train_loss": -24.68776512145996, "global_step": 221715, "epoch": 2671} {"train_loss": -24.580150604248047, "global_step": 221716, "epoch": 2671} {"train_loss": -24.50416374206543, "global_step": 221717, "epoch": 2671} {"train_loss": -24.098955154418945, "global_step": 221718, "epoch": 2671} {"train_loss": -24.19057273864746, "global_step": 221719, "epoch": 2671} {"train_loss": -24.189319610595703, "global_step": 221720, "epoch": 2671} {"train_loss": -24.821653366088867, "global_step": 221721, "epoch": 2671} {"train_loss": -24.49561882019043, "global_step": 221722, "epoch": 2671} {"train_loss": -24.56473159790039, "global_step": 221723, "epoch": 2671} {"train_loss": -24.27794647216797, "global_step": 221724, "epoch": 2671} {"train_loss": -24.697736740112305, "global_step": 221725, "epoch": 2671} {"train_loss": -24.811338424682617, "global_step": 221726, "epoch": 2671} {"train_loss": -24.590503692626953, "global_step": 221727, "epoch": 2671} {"train_loss": -24.465354919433594, "global_step": 221728, "epoch": 2671} {"train_loss": -24.736793518066406, "global_step": 221729, "epoch": 2671} {"train_loss": -24.880550384521484, "global_step": 221730, "epoch": 2671} {"train_loss": -24.248336791992188, "global_step": 221731, "epoch": 2671} {"train_loss": -24.75379753112793, "global_step": 221732, "epoch": 2671} {"train_loss": -24.562726974487305, "global_step": 221733, "epoch": 2671} {"train_loss": -25.01165771484375, "global_step": 221734, "epoch": 2671} {"train_loss": -24.60658836364746, "global_step": 221735, "epoch": 2671} {"train_loss": -24.390317916870117, "global_step": 221736, "epoch": 2671} {"train_loss": -24.6348876953125, "global_step": 221737, "epoch": 2671} {"train_loss": -24.5384464263916, "global_step": 221738, "epoch": 2671} {"train_loss": -24.608552932739258, "global_step": 221739, "epoch": 2671} {"train_loss": -24.800884246826172, "global_step": 221740, "epoch": 2671} {"train_loss": -24.68337059020996, "global_step": 221741, "epoch": 2671} {"train_loss": -24.80510902404785, "global_step": 221742, "epoch": 2671} {"train_loss": -24.59730339050293, "global_step": 221743, "epoch": 2671} {"train_loss": -24.530208587646484, "global_step": 221744, "epoch": 2671} {"train_loss": -24.709257125854492, "global_step": 221745, "epoch": 2671} {"train_loss": -25.038192749023438, "global_step": 221746, "epoch": 2671} {"train_loss": -24.81849479675293, "global_step": 221747, "epoch": 2671} {"train_loss": -24.651281356811523, "global_step": 221748, "epoch": 2671} {"train_loss": -24.40411376953125, "global_step": 221749, "epoch": 2671} {"train_loss": -24.874832153320312, "global_step": 221750, "epoch": 2671} {"train_loss": -24.665294647216797, "global_step": 221751, "epoch": 2671} {"train_loss": -24.538604736328125, "global_step": 221752, "epoch": 2671} {"train_loss": -24.824995040893555, "global_step": 221753, "epoch": 2671} {"train_loss": -24.23526954650879, "global_step": 221754, "epoch": 2671} {"train_loss": -24.247617721557617, "global_step": 221755, "epoch": 2671} {"train_loss": -24.27548599243164, "global_step": 221756, "epoch": 2671} {"train_loss": -24.362712860107422, "global_step": 221757, "epoch": 2671} {"train_loss": -24.890663146972656, "global_step": 221758, "epoch": 2671} {"train_loss": -24.476184844970703, "global_step": 221759, "epoch": 2671} {"train_loss": -24.205810546875, "global_step": 221760, "epoch": 2671} {"train_loss": -24.735456466674805, "global_step": 221761, "epoch": 2671} {"train_loss": -24.624801635742188, "global_step": 221762, "epoch": 2671} {"train_loss": -23.971309661865234, "global_step": 221763, "epoch": 2671} {"train_loss": -23.940536499023438, "global_step": 221764, "epoch": 2671} {"train_loss": -24.374984741210938, "global_step": 221765, "epoch": 2671} {"train_loss": -24.365589141845703, "global_step": 221766, "epoch": 2671} {"train_loss": -24.347681045532227, "global_step": 221767, "epoch": 2671} {"train_loss": -24.782148361206055, "global_step": 221768, "epoch": 2671} {"train_loss": -24.2048397064209, "global_step": 221769, "epoch": 2671} {"train_loss": -24.660675048828125, "global_step": 221770, "epoch": 2671} {"train_loss": -24.69550132751465, "global_step": 221771, "epoch": 2671} {"train_loss": -24.294139862060547, "global_step": 221772, "epoch": 2671} {"train_loss": -24.86079978942871, "global_step": 221773, "epoch": 2671} {"train_loss": -24.320804595947266, "global_step": 221774, "epoch": 2671} {"train_loss": -24.468158147421228, "global_step": 221775, "epoch": 2671, "val_loss": 6716250.5} {"train_loss": -23.6610164642334, "global_step": 221776, "epoch": 2672} {"train_loss": -24.343292236328125, "global_step": 221777, "epoch": 2672} {"train_loss": -23.823591232299805, "global_step": 221778, "epoch": 2672} {"train_loss": -24.460697174072266, "global_step": 221779, "epoch": 2672} {"train_loss": -23.645160675048828, "global_step": 221780, "epoch": 2672} {"train_loss": -24.179983139038086, "global_step": 221781, "epoch": 2672} {"train_loss": -23.940298080444336, "global_step": 221782, "epoch": 2672} {"train_loss": -24.21310806274414, "global_step": 221783, "epoch": 2672} {"train_loss": -24.377300262451172, "global_step": 221784, "epoch": 2672} {"train_loss": -24.330476760864258, "global_step": 221785, "epoch": 2672} {"train_loss": -24.335721969604492, "global_step": 221786, "epoch": 2672} {"train_loss": -24.352506637573242, "global_step": 221787, "epoch": 2672} {"train_loss": -24.394744873046875, "global_step": 221788, "epoch": 2672} {"train_loss": -24.283084869384766, "global_step": 221789, "epoch": 2672} {"train_loss": -24.313318252563477, "global_step": 221790, "epoch": 2672} {"train_loss": -24.386404037475586, "global_step": 221791, "epoch": 2672} {"train_loss": -24.43111228942871, "global_step": 221792, "epoch": 2672} {"train_loss": -24.073060989379883, "global_step": 221793, "epoch": 2672} {"train_loss": -24.821455001831055, "global_step": 221794, "epoch": 2672} {"train_loss": -24.60044288635254, "global_step": 221795, "epoch": 2672} {"train_loss": -24.551504135131836, "global_step": 221796, "epoch": 2672} {"train_loss": -24.771656036376953, "global_step": 221797, "epoch": 2672} {"train_loss": -24.204181671142578, "global_step": 221798, "epoch": 2672} {"train_loss": -24.5799560546875, "global_step": 221799, "epoch": 2672} {"train_loss": -24.603473663330078, "global_step": 221800, "epoch": 2672} {"train_loss": -24.314542770385742, "global_step": 221801, "epoch": 2672} {"train_loss": -24.6845703125, "global_step": 221802, "epoch": 2672} {"train_loss": -24.830026626586914, "global_step": 221803, "epoch": 2672} {"train_loss": -24.864545822143555, "global_step": 221804, "epoch": 2672} {"train_loss": -24.62891960144043, "global_step": 221805, "epoch": 2672} {"train_loss": -24.750625610351562, "global_step": 221806, "epoch": 2672} {"train_loss": -24.483673095703125, "global_step": 221807, "epoch": 2672} {"train_loss": -24.643972396850586, "global_step": 221808, "epoch": 2672} {"train_loss": -24.722604751586914, "global_step": 221809, "epoch": 2672} {"train_loss": -24.924283981323242, "global_step": 221810, "epoch": 2672} {"train_loss": -24.738407135009766, "global_step": 221811, "epoch": 2672} {"train_loss": -24.63313102722168, "global_step": 221812, "epoch": 2672} {"train_loss": -24.686052322387695, "global_step": 221813, "epoch": 2672} {"train_loss": -24.86233901977539, "global_step": 221814, "epoch": 2672} {"train_loss": -24.456907272338867, "global_step": 221815, "epoch": 2672} {"train_loss": -24.59881019592285, "global_step": 221816, "epoch": 2672} {"train_loss": -24.860124588012695, "global_step": 221817, "epoch": 2672} {"train_loss": -24.56416130065918, "global_step": 221818, "epoch": 2672} {"train_loss": -24.236251831054688, "global_step": 221819, "epoch": 2672} {"train_loss": -24.089448928833008, "global_step": 221820, "epoch": 2672} {"train_loss": -24.35540771484375, "global_step": 221821, "epoch": 2672} {"train_loss": -24.7139835357666, "global_step": 221822, "epoch": 2672} {"train_loss": -24.27617835998535, "global_step": 221823, "epoch": 2672} {"train_loss": -24.21234130859375, "global_step": 221824, "epoch": 2672} {"train_loss": -24.510112762451172, "global_step": 221825, "epoch": 2672} {"train_loss": -24.753381729125977, "global_step": 221826, "epoch": 2672} {"train_loss": -24.535615921020508, "global_step": 221827, "epoch": 2672} {"train_loss": -24.529603958129883, "global_step": 221828, "epoch": 2672} {"train_loss": -24.349157333374023, "global_step": 221829, "epoch": 2672} {"train_loss": -24.676273345947266, "global_step": 221830, "epoch": 2672} {"train_loss": -24.85717010498047, "global_step": 221831, "epoch": 2672} {"train_loss": -24.671281814575195, "global_step": 221832, "epoch": 2672} {"train_loss": -24.825525283813477, "global_step": 221833, "epoch": 2672} {"train_loss": -24.871984481811523, "global_step": 221834, "epoch": 2672} {"train_loss": -24.716323852539062, "global_step": 221835, "epoch": 2672} {"train_loss": -24.464693069458008, "global_step": 221836, "epoch": 2672} {"train_loss": -24.6724910736084, "global_step": 221837, "epoch": 2672} {"train_loss": -24.533918380737305, "global_step": 221838, "epoch": 2672} {"train_loss": -24.51838493347168, "global_step": 221839, "epoch": 2672} {"train_loss": -24.819616317749023, "global_step": 221840, "epoch": 2672} {"train_loss": -24.433238983154297, "global_step": 221841, "epoch": 2672} {"train_loss": -24.52552604675293, "global_step": 221842, "epoch": 2672} {"train_loss": -24.79616355895996, "global_step": 221843, "epoch": 2672} {"train_loss": -24.67089080810547, "global_step": 221844, "epoch": 2672} {"train_loss": -24.553796768188477, "global_step": 221845, "epoch": 2672} {"train_loss": -24.503890991210938, "global_step": 221846, "epoch": 2672} {"train_loss": -24.507774353027344, "global_step": 221847, "epoch": 2672} {"train_loss": -24.99344825744629, "global_step": 221848, "epoch": 2672} {"train_loss": -24.39470863342285, "global_step": 221849, "epoch": 2672} {"train_loss": -25.116743087768555, "global_step": 221850, "epoch": 2672} {"train_loss": -24.594009399414062, "global_step": 221851, "epoch": 2672} {"train_loss": -24.580957412719727, "global_step": 221852, "epoch": 2672} {"train_loss": -24.766218185424805, "global_step": 221853, "epoch": 2672} {"train_loss": -24.738271713256836, "global_step": 221854, "epoch": 2672} {"train_loss": -24.73413848876953, "global_step": 221855, "epoch": 2672} {"train_loss": -24.98233985900879, "global_step": 221856, "epoch": 2672} {"train_loss": -24.340744018554688, "global_step": 221857, "epoch": 2672} {"train_loss": -24.543377405189606, "global_step": 221858, "epoch": 2672, "val_loss": 6693584.5} {"train_loss": -24.106807708740234, "global_step": 221859, "epoch": 2673} {"train_loss": -23.647945404052734, "global_step": 221860, "epoch": 2673} {"train_loss": -23.613561630249023, "global_step": 221861, "epoch": 2673} {"train_loss": -24.31659507751465, "global_step": 221862, "epoch": 2673} {"train_loss": -24.488603591918945, "global_step": 221863, "epoch": 2673} {"train_loss": -24.1415958404541, "global_step": 221864, "epoch": 2673} {"train_loss": -24.12677574157715, "global_step": 221865, "epoch": 2673} {"train_loss": -24.027212142944336, "global_step": 221866, "epoch": 2673} {"train_loss": -24.149330139160156, "global_step": 221867, "epoch": 2673} {"train_loss": -24.266258239746094, "global_step": 221868, "epoch": 2673} {"train_loss": -24.2681884765625, "global_step": 221869, "epoch": 2673} {"train_loss": -24.2153377532959, "global_step": 221870, "epoch": 2673} {"train_loss": -24.25847053527832, "global_step": 221871, "epoch": 2673} {"train_loss": -24.32245445251465, "global_step": 221872, "epoch": 2673} {"train_loss": -24.560049057006836, "global_step": 221873, "epoch": 2673} {"train_loss": -24.730886459350586, "global_step": 221874, "epoch": 2673} {"train_loss": -24.459272384643555, "global_step": 221875, "epoch": 2673} {"train_loss": -24.567541122436523, "global_step": 221876, "epoch": 2673} {"train_loss": -24.603300094604492, "global_step": 221877, "epoch": 2673} {"train_loss": -24.421289443969727, "global_step": 221878, "epoch": 2673} {"train_loss": -24.7282772064209, "global_step": 221879, "epoch": 2673} {"train_loss": -24.628009796142578, "global_step": 221880, "epoch": 2673} {"train_loss": -24.32852554321289, "global_step": 221881, "epoch": 2673} {"train_loss": -24.602828979492188, "global_step": 221882, "epoch": 2673} {"train_loss": -24.566923141479492, "global_step": 221883, "epoch": 2673} {"train_loss": -24.936542510986328, "global_step": 221884, "epoch": 2673} {"train_loss": -24.9754638671875, "global_step": 221885, "epoch": 2673} {"train_loss": -24.96782684326172, "global_step": 221886, "epoch": 2673} {"train_loss": -24.339319229125977, "global_step": 221887, "epoch": 2673} {"train_loss": -25.14366340637207, "global_step": 221888, "epoch": 2673} {"train_loss": -24.67922019958496, "global_step": 221889, "epoch": 2673} {"train_loss": -24.790868759155273, "global_step": 221890, "epoch": 2673} {"train_loss": -24.44272232055664, "global_step": 221891, "epoch": 2673} {"train_loss": -24.294822692871094, "global_step": 221892, "epoch": 2673} {"train_loss": -24.546672821044922, "global_step": 221893, "epoch": 2673} {"train_loss": -24.25979995727539, "global_step": 221894, "epoch": 2673} {"train_loss": -24.917837142944336, "global_step": 221895, "epoch": 2673} {"train_loss": -24.767181396484375, "global_step": 221896, "epoch": 2673} {"train_loss": -24.80481719970703, "global_step": 221897, "epoch": 2673} {"train_loss": -24.68535614013672, "global_step": 221898, "epoch": 2673} {"train_loss": -25.09984588623047, "global_step": 221899, "epoch": 2673} {"train_loss": -24.758710861206055, "global_step": 221900, "epoch": 2673} {"train_loss": -25.146350860595703, "global_step": 221901, "epoch": 2673} {"train_loss": -24.913389205932617, "global_step": 221902, "epoch": 2673} {"train_loss": -24.63272476196289, "global_step": 221903, "epoch": 2673} {"train_loss": -24.64716148376465, "global_step": 221904, "epoch": 2673} {"train_loss": -24.57735252380371, "global_step": 221905, "epoch": 2673} {"train_loss": -24.469079971313477, "global_step": 221906, "epoch": 2673} {"train_loss": -24.782651901245117, "global_step": 221907, "epoch": 2673} {"train_loss": -24.420318603515625, "global_step": 221908, "epoch": 2673} {"train_loss": -24.888763427734375, "global_step": 221909, "epoch": 2673} {"train_loss": -24.17179298400879, "global_step": 221910, "epoch": 2673} {"train_loss": -24.456974029541016, "global_step": 221911, "epoch": 2673} {"train_loss": -24.802762985229492, "global_step": 221912, "epoch": 2673} {"train_loss": -24.601898193359375, "global_step": 221913, "epoch": 2673} {"train_loss": -24.85141944885254, "global_step": 221914, "epoch": 2673} {"train_loss": -23.72098731994629, "global_step": 221915, "epoch": 2673} {"train_loss": -23.939626693725586, "global_step": 221916, "epoch": 2673} {"train_loss": -24.7624568939209, "global_step": 221917, "epoch": 2673} {"train_loss": -24.48594093322754, "global_step": 221918, "epoch": 2673} {"train_loss": -24.236989974975586, "global_step": 221919, "epoch": 2673} {"train_loss": -24.35797691345215, "global_step": 221920, "epoch": 2673} {"train_loss": -24.671300888061523, "global_step": 221921, "epoch": 2673} {"train_loss": -24.122209548950195, "global_step": 221922, "epoch": 2673} {"train_loss": -24.60199546813965, "global_step": 221923, "epoch": 2673} {"train_loss": -24.51742172241211, "global_step": 221924, "epoch": 2673} {"train_loss": -24.68963050842285, "global_step": 221925, "epoch": 2673} {"train_loss": -24.34549331665039, "global_step": 221926, "epoch": 2673} {"train_loss": -24.488554000854492, "global_step": 221927, "epoch": 2673} {"train_loss": -24.345149993896484, "global_step": 221928, "epoch": 2673} {"train_loss": -24.640003204345703, "global_step": 221929, "epoch": 2673} {"train_loss": -24.85443878173828, "global_step": 221930, "epoch": 2673} {"train_loss": -24.5765323638916, "global_step": 221931, "epoch": 2673} {"train_loss": -24.54996109008789, "global_step": 221932, "epoch": 2673} {"train_loss": -24.633695602416992, "global_step": 221933, "epoch": 2673} {"train_loss": -24.76690673828125, "global_step": 221934, "epoch": 2673} {"train_loss": -24.610607147216797, "global_step": 221935, "epoch": 2673} {"train_loss": -24.620040893554688, "global_step": 221936, "epoch": 2673} {"train_loss": -24.635845184326172, "global_step": 221937, "epoch": 2673} {"train_loss": -24.75290298461914, "global_step": 221938, "epoch": 2673} {"train_loss": -24.64078712463379, "global_step": 221939, "epoch": 2673} {"train_loss": -24.910858154296875, "global_step": 221940, "epoch": 2673} {"train_loss": -24.53372704839132, "global_step": 221941, "epoch": 2673, "val_loss": 6652455.0} {"train_loss": -24.47767448425293, "global_step": 221942, "epoch": 2674} {"train_loss": -24.06561279296875, "global_step": 221943, "epoch": 2674} {"train_loss": -24.446744918823242, "global_step": 221944, "epoch": 2674} {"train_loss": -24.092153549194336, "global_step": 221945, "epoch": 2674} {"train_loss": -24.007427215576172, "global_step": 221946, "epoch": 2674} {"train_loss": -24.064128875732422, "global_step": 221947, "epoch": 2674} {"train_loss": -24.081052780151367, "global_step": 221948, "epoch": 2674} {"train_loss": -24.051435470581055, "global_step": 221949, "epoch": 2674} {"train_loss": -24.08788299560547, "global_step": 221950, "epoch": 2674} {"train_loss": -24.33486557006836, "global_step": 221951, "epoch": 2674} {"train_loss": -24.528676986694336, "global_step": 221952, "epoch": 2674} {"train_loss": -23.948774337768555, "global_step": 221953, "epoch": 2674} {"train_loss": -24.606088638305664, "global_step": 221954, "epoch": 2674} {"train_loss": -24.37802505493164, "global_step": 221955, "epoch": 2674} {"train_loss": -24.111209869384766, "global_step": 221956, "epoch": 2674} {"train_loss": -25.009307861328125, "global_step": 221957, "epoch": 2674} {"train_loss": -24.78774070739746, "global_step": 221958, "epoch": 2674} {"train_loss": -24.180545806884766, "global_step": 221959, "epoch": 2674} {"train_loss": -24.631607055664062, "global_step": 221960, "epoch": 2674} {"train_loss": -24.77412986755371, "global_step": 221961, "epoch": 2674} {"train_loss": -24.2313232421875, "global_step": 221962, "epoch": 2674} {"train_loss": -24.87335777282715, "global_step": 221963, "epoch": 2674} {"train_loss": -24.731813430786133, "global_step": 221964, "epoch": 2674} {"train_loss": -24.4459228515625, "global_step": 221965, "epoch": 2674} {"train_loss": -24.62948226928711, "global_step": 221966, "epoch": 2674} {"train_loss": -24.255239486694336, "global_step": 221967, "epoch": 2674} {"train_loss": -24.7403621673584, "global_step": 221968, "epoch": 2674} {"train_loss": -24.70677375793457, "global_step": 221969, "epoch": 2674} {"train_loss": -24.62270164489746, "global_step": 221970, "epoch": 2674} {"train_loss": -24.789648056030273, "global_step": 221971, "epoch": 2674} {"train_loss": -24.818044662475586, "global_step": 221972, "epoch": 2674} {"train_loss": -24.714540481567383, "global_step": 221973, "epoch": 2674} {"train_loss": -24.857267379760742, "global_step": 221974, "epoch": 2674} {"train_loss": -24.72199249267578, "global_step": 221975, "epoch": 2674} {"train_loss": -24.79277992248535, "global_step": 221976, "epoch": 2674} {"train_loss": -24.58845329284668, "global_step": 221977, "epoch": 2674} {"train_loss": -24.449613571166992, "global_step": 221978, "epoch": 2674} {"train_loss": -24.727170944213867, "global_step": 221979, "epoch": 2674} {"train_loss": -24.911428451538086, "global_step": 221980, "epoch": 2674} {"train_loss": -24.57831573486328, "global_step": 221981, "epoch": 2674} {"train_loss": -24.526172637939453, "global_step": 221982, "epoch": 2674} {"train_loss": -24.573957443237305, "global_step": 221983, "epoch": 2674} {"train_loss": -24.40350914001465, "global_step": 221984, "epoch": 2674} {"train_loss": -24.51486587524414, "global_step": 221985, "epoch": 2674} {"train_loss": -24.52864646911621, "global_step": 221986, "epoch": 2674} {"train_loss": -24.082386016845703, "global_step": 221987, "epoch": 2674} {"train_loss": -24.215831756591797, "global_step": 221988, "epoch": 2674} {"train_loss": -24.442787170410156, "global_step": 221989, "epoch": 2674} {"train_loss": -24.08466148376465, "global_step": 221990, "epoch": 2674} {"train_loss": -24.7562313079834, "global_step": 221991, "epoch": 2674} {"train_loss": -24.765409469604492, "global_step": 221992, "epoch": 2674} {"train_loss": -24.616003036499023, "global_step": 221993, "epoch": 2674} {"train_loss": -24.66107940673828, "global_step": 221994, "epoch": 2674} {"train_loss": -24.92046546936035, "global_step": 221995, "epoch": 2674} {"train_loss": -24.548049926757812, "global_step": 221996, "epoch": 2674} {"train_loss": -24.345834732055664, "global_step": 221997, "epoch": 2674} {"train_loss": -24.397443771362305, "global_step": 221998, "epoch": 2674} {"train_loss": -24.591062545776367, "global_step": 221999, "epoch": 2674} {"train_loss": -24.53066062927246, "global_step": 222000, "epoch": 2674} {"train_loss": -24.872318267822266, "global_step": 222001, "epoch": 2674} {"train_loss": -24.702877044677734, "global_step": 222002, "epoch": 2674} {"train_loss": -24.692001342773438, "global_step": 222003, "epoch": 2674} {"train_loss": -24.280553817749023, "global_step": 222004, "epoch": 2674} {"train_loss": -24.63180160522461, "global_step": 222005, "epoch": 2674} {"train_loss": -24.484176635742188, "global_step": 222006, "epoch": 2674} {"train_loss": -24.413196563720703, "global_step": 222007, "epoch": 2674} {"train_loss": -24.566007614135742, "global_step": 222008, "epoch": 2674} {"train_loss": -23.91496467590332, "global_step": 222009, "epoch": 2674} {"train_loss": -24.513818740844727, "global_step": 222010, "epoch": 2674} {"train_loss": -24.864383697509766, "global_step": 222011, "epoch": 2674} {"train_loss": -24.58478355407715, "global_step": 222012, "epoch": 2674} {"train_loss": -24.247486114501953, "global_step": 222013, "epoch": 2674} {"train_loss": -24.66706657409668, "global_step": 222014, "epoch": 2674} {"train_loss": -24.25381851196289, "global_step": 222015, "epoch": 2674} {"train_loss": -24.43351173400879, "global_step": 222016, "epoch": 2674} {"train_loss": -24.72218132019043, "global_step": 222017, "epoch": 2674} {"train_loss": -24.872907638549805, "global_step": 222018, "epoch": 2674} {"train_loss": -24.839622497558594, "global_step": 222019, "epoch": 2674} {"train_loss": -24.785470962524414, "global_step": 222020, "epoch": 2674} {"train_loss": -24.5062255859375, "global_step": 222021, "epoch": 2674} {"train_loss": -24.526830673217773, "global_step": 222022, "epoch": 2674} {"train_loss": -25.01755714416504, "global_step": 222023, "epoch": 2674} {"train_loss": -24.514628467789617, "global_step": 222024, "epoch": 2674, "val_loss": 6632123.0} {"train_loss": -23.383989334106445, "global_step": 222025, "epoch": 2675} {"train_loss": -23.117704391479492, "global_step": 222026, "epoch": 2675} {"train_loss": -23.868127822875977, "global_step": 222027, "epoch": 2675} {"train_loss": -24.18876838684082, "global_step": 222028, "epoch": 2675} {"train_loss": -24.172212600708008, "global_step": 222029, "epoch": 2675} {"train_loss": -24.279430389404297, "global_step": 222030, "epoch": 2675} {"train_loss": -24.614622116088867, "global_step": 222031, "epoch": 2675} {"train_loss": -24.134328842163086, "global_step": 222032, "epoch": 2675} {"train_loss": -24.13848876953125, "global_step": 222033, "epoch": 2675} {"train_loss": -24.526752471923828, "global_step": 222034, "epoch": 2675} {"train_loss": -24.390079498291016, "global_step": 222035, "epoch": 2675} {"train_loss": -24.15375328063965, "global_step": 222036, "epoch": 2675} {"train_loss": -24.228662490844727, "global_step": 222037, "epoch": 2675} {"train_loss": -24.184778213500977, "global_step": 222038, "epoch": 2675} {"train_loss": -24.55612564086914, "global_step": 222039, "epoch": 2675} {"train_loss": -24.528608322143555, "global_step": 222040, "epoch": 2675} {"train_loss": -24.42146110534668, "global_step": 222041, "epoch": 2675} {"train_loss": -24.310068130493164, "global_step": 222042, "epoch": 2675} {"train_loss": -24.39011001586914, "global_step": 222043, "epoch": 2675} {"train_loss": -24.677518844604492, "global_step": 222044, "epoch": 2675} {"train_loss": -24.539566040039062, "global_step": 222045, "epoch": 2675} {"train_loss": -24.73945426940918, "global_step": 222046, "epoch": 2675} {"train_loss": -24.6077880859375, "global_step": 222047, "epoch": 2675} {"train_loss": -24.811851501464844, "global_step": 222048, "epoch": 2675} {"train_loss": -24.58233070373535, "global_step": 222049, "epoch": 2675} {"train_loss": -24.332178115844727, "global_step": 222050, "epoch": 2675} {"train_loss": -24.716405868530273, "global_step": 222051, "epoch": 2675} {"train_loss": -24.5293025970459, "global_step": 222052, "epoch": 2675} {"train_loss": -24.50784683227539, "global_step": 222053, "epoch": 2675} {"train_loss": -24.36944580078125, "global_step": 222054, "epoch": 2675} {"train_loss": -24.4990291595459, "global_step": 222055, "epoch": 2675} {"train_loss": -24.570920944213867, "global_step": 222056, "epoch": 2675} {"train_loss": -25.07859992980957, "global_step": 222057, "epoch": 2675} {"train_loss": -24.503061294555664, "global_step": 222058, "epoch": 2675} {"train_loss": -24.55836296081543, "global_step": 222059, "epoch": 2675} {"train_loss": -25.0511417388916, "global_step": 222060, "epoch": 2675} {"train_loss": -25.0927734375, "global_step": 222061, "epoch": 2675} {"train_loss": -24.395263671875, "global_step": 222062, "epoch": 2675} {"train_loss": -24.842275619506836, "global_step": 222063, "epoch": 2675} {"train_loss": -24.37750244140625, "global_step": 222064, "epoch": 2675} {"train_loss": -24.55634880065918, "global_step": 222065, "epoch": 2675} {"train_loss": -24.24469566345215, "global_step": 222066, "epoch": 2675} {"train_loss": -24.497343063354492, "global_step": 222067, "epoch": 2675} {"train_loss": -24.60089683532715, "global_step": 222068, "epoch": 2675} {"train_loss": -24.32801628112793, "global_step": 222069, "epoch": 2675} {"train_loss": -24.545400619506836, "global_step": 222070, "epoch": 2675} {"train_loss": -24.673553466796875, "global_step": 222071, "epoch": 2675} {"train_loss": -24.905622482299805, "global_step": 222072, "epoch": 2675} {"train_loss": -24.446374893188477, "global_step": 222073, "epoch": 2675} {"train_loss": -24.7178897857666, "global_step": 222074, "epoch": 2675} {"train_loss": -24.526447296142578, "global_step": 222075, "epoch": 2675} {"train_loss": -24.366992950439453, "global_step": 222076, "epoch": 2675} {"train_loss": -24.67276954650879, "global_step": 222077, "epoch": 2675} {"train_loss": -24.438522338867188, "global_step": 222078, "epoch": 2675} {"train_loss": -24.54816246032715, "global_step": 222079, "epoch": 2675} {"train_loss": -24.76209831237793, "global_step": 222080, "epoch": 2675} {"train_loss": -24.395946502685547, "global_step": 222081, "epoch": 2675} {"train_loss": -24.760208129882812, "global_step": 222082, "epoch": 2675} {"train_loss": -24.64061737060547, "global_step": 222083, "epoch": 2675} {"train_loss": -24.696136474609375, "global_step": 222084, "epoch": 2675} {"train_loss": -24.948537826538086, "global_step": 222085, "epoch": 2675} {"train_loss": -24.624494552612305, "global_step": 222086, "epoch": 2675} {"train_loss": -24.783079147338867, "global_step": 222087, "epoch": 2675} {"train_loss": -24.80429458618164, "global_step": 222088, "epoch": 2675} {"train_loss": -24.653730392456055, "global_step": 222089, "epoch": 2675} {"train_loss": -24.120697021484375, "global_step": 222090, "epoch": 2675} {"train_loss": -24.79267120361328, "global_step": 222091, "epoch": 2675} {"train_loss": -24.41881561279297, "global_step": 222092, "epoch": 2675} {"train_loss": -24.746137619018555, "global_step": 222093, "epoch": 2675} {"train_loss": -24.450437545776367, "global_step": 222094, "epoch": 2675} {"train_loss": -24.842676162719727, "global_step": 222095, "epoch": 2675} {"train_loss": -24.82782745361328, "global_step": 222096, "epoch": 2675} {"train_loss": -24.663217544555664, "global_step": 222097, "epoch": 2675} {"train_loss": -25.03249168395996, "global_step": 222098, "epoch": 2675} {"train_loss": -24.61012077331543, "global_step": 222099, "epoch": 2675} {"train_loss": -24.572145462036133, "global_step": 222100, "epoch": 2675} {"train_loss": -24.969364166259766, "global_step": 222101, "epoch": 2675} {"train_loss": -24.704788208007812, "global_step": 222102, "epoch": 2675} {"train_loss": -24.82371711730957, "global_step": 222103, "epoch": 2675} {"train_loss": -24.53407859802246, "global_step": 222104, "epoch": 2675} {"train_loss": -24.867843627929688, "global_step": 222105, "epoch": 2675} {"train_loss": -24.457677841186523, "global_step": 222106, "epoch": 2675} {"train_loss": -24.54112893989287, "global_step": 222107, "epoch": 2675, "val_loss": 6652815.0} {"train_loss": -24.225772857666016, "global_step": 222108, "epoch": 2676} {"train_loss": -24.31032371520996, "global_step": 222109, "epoch": 2676} {"train_loss": -24.4132080078125, "global_step": 222110, "epoch": 2676} {"train_loss": -24.67477798461914, "global_step": 222111, "epoch": 2676} {"train_loss": -24.394983291625977, "global_step": 222112, "epoch": 2676} {"train_loss": -24.36285400390625, "global_step": 222113, "epoch": 2676} {"train_loss": -24.235692977905273, "global_step": 222114, "epoch": 2676} {"train_loss": -24.56867790222168, "global_step": 222115, "epoch": 2676} {"train_loss": -24.776031494140625, "global_step": 222116, "epoch": 2676} {"train_loss": -24.803335189819336, "global_step": 222117, "epoch": 2676} {"train_loss": -24.48720359802246, "global_step": 222118, "epoch": 2676} {"train_loss": -24.28031349182129, "global_step": 222119, "epoch": 2676} {"train_loss": -24.52779197692871, "global_step": 222120, "epoch": 2676} {"train_loss": -24.141862869262695, "global_step": 222121, "epoch": 2676} {"train_loss": -24.551420211791992, "global_step": 222122, "epoch": 2676} {"train_loss": -24.210725784301758, "global_step": 222123, "epoch": 2676} {"train_loss": -24.481632232666016, "global_step": 222124, "epoch": 2676} {"train_loss": -24.23017692565918, "global_step": 222125, "epoch": 2676} {"train_loss": -24.383834838867188, "global_step": 222126, "epoch": 2676} {"train_loss": -24.370969772338867, "global_step": 222127, "epoch": 2676} {"train_loss": -24.73036766052246, "global_step": 222128, "epoch": 2676} {"train_loss": -24.942096710205078, "global_step": 222129, "epoch": 2676} {"train_loss": -24.583377838134766, "global_step": 222130, "epoch": 2676} {"train_loss": -24.88718032836914, "global_step": 222131, "epoch": 2676} {"train_loss": -24.546043395996094, "global_step": 222132, "epoch": 2676} {"train_loss": -24.753765106201172, "global_step": 222133, "epoch": 2676} {"train_loss": -24.809326171875, "global_step": 222134, "epoch": 2676} {"train_loss": -24.207626342773438, "global_step": 222135, "epoch": 2676} {"train_loss": -24.959243774414062, "global_step": 222136, "epoch": 2676} {"train_loss": -24.78964614868164, "global_step": 222137, "epoch": 2676} {"train_loss": -24.30719566345215, "global_step": 222138, "epoch": 2676} {"train_loss": -24.736988067626953, "global_step": 222139, "epoch": 2676} {"train_loss": -24.77503776550293, "global_step": 222140, "epoch": 2676} {"train_loss": -24.558975219726562, "global_step": 222141, "epoch": 2676} {"train_loss": -24.947431564331055, "global_step": 222142, "epoch": 2676} {"train_loss": -24.83601951599121, "global_step": 222143, "epoch": 2676} {"train_loss": -24.79543113708496, "global_step": 222144, "epoch": 2676} {"train_loss": -24.739416122436523, "global_step": 222145, "epoch": 2676} {"train_loss": -24.438344955444336, "global_step": 222146, "epoch": 2676} {"train_loss": -25.082054138183594, "global_step": 222147, "epoch": 2676} {"train_loss": -24.50263214111328, "global_step": 222148, "epoch": 2676} {"train_loss": -24.54868507385254, "global_step": 222149, "epoch": 2676} {"train_loss": -24.99527931213379, "global_step": 222150, "epoch": 2676} {"train_loss": -24.733823776245117, "global_step": 222151, "epoch": 2676} {"train_loss": -24.742965698242188, "global_step": 222152, "epoch": 2676} {"train_loss": -24.81205940246582, "global_step": 222153, "epoch": 2676} {"train_loss": -24.732257843017578, "global_step": 222154, "epoch": 2676} {"train_loss": -24.123069763183594, "global_step": 222155, "epoch": 2676} {"train_loss": -24.447477340698242, "global_step": 222156, "epoch": 2676} {"train_loss": -24.504562377929688, "global_step": 222157, "epoch": 2676} {"train_loss": -24.728652954101562, "global_step": 222158, "epoch": 2676} {"train_loss": -24.593379974365234, "global_step": 222159, "epoch": 2676} {"train_loss": -24.49420166015625, "global_step": 222160, "epoch": 2676} {"train_loss": -24.677030563354492, "global_step": 222161, "epoch": 2676} {"train_loss": -24.737855911254883, "global_step": 222162, "epoch": 2676} {"train_loss": -24.202917098999023, "global_step": 222163, "epoch": 2676} {"train_loss": -24.66683578491211, "global_step": 222164, "epoch": 2676} {"train_loss": -24.631406784057617, "global_step": 222165, "epoch": 2676} {"train_loss": -24.569238662719727, "global_step": 222166, "epoch": 2676} {"train_loss": -24.569995880126953, "global_step": 222167, "epoch": 2676} {"train_loss": -24.580768585205078, "global_step": 222168, "epoch": 2676} {"train_loss": -24.347604751586914, "global_step": 222169, "epoch": 2676} {"train_loss": -24.659252166748047, "global_step": 222170, "epoch": 2676} {"train_loss": -24.772729873657227, "global_step": 222171, "epoch": 2676} {"train_loss": -24.5935115814209, "global_step": 222172, "epoch": 2676} {"train_loss": -24.935556411743164, "global_step": 222173, "epoch": 2676} {"train_loss": -24.663253784179688, "global_step": 222174, "epoch": 2676} {"train_loss": -24.47541618347168, "global_step": 222175, "epoch": 2676} {"train_loss": -24.753456115722656, "global_step": 222176, "epoch": 2676} {"train_loss": -24.426246643066406, "global_step": 222177, "epoch": 2676} {"train_loss": -24.647626876831055, "global_step": 222178, "epoch": 2676} {"train_loss": -24.385732650756836, "global_step": 222179, "epoch": 2676} {"train_loss": -24.51791763305664, "global_step": 222180, "epoch": 2676} {"train_loss": -24.844953536987305, "global_step": 222181, "epoch": 2676} {"train_loss": -24.59295082092285, "global_step": 222182, "epoch": 2676} {"train_loss": -24.958444595336914, "global_step": 222183, "epoch": 2676} {"train_loss": -24.605703353881836, "global_step": 222184, "epoch": 2676} {"train_loss": -24.623571395874023, "global_step": 222185, "epoch": 2676} {"train_loss": -24.674192428588867, "global_step": 222186, "epoch": 2676} {"train_loss": -24.660093307495117, "global_step": 222187, "epoch": 2676} {"train_loss": -24.424606323242188, "global_step": 222188, "epoch": 2676} {"train_loss": -24.595134735107422, "global_step": 222189, "epoch": 2676} {"train_loss": -24.593995266650097, "global_step": 222190, "epoch": 2676, "val_loss": 6847739.0} {"train_loss": -23.715335845947266, "global_step": 222191, "epoch": 2677} {"train_loss": -24.072805404663086, "global_step": 222192, "epoch": 2677} {"train_loss": -24.102115631103516, "global_step": 222193, "epoch": 2677} {"train_loss": -24.12887954711914, "global_step": 222194, "epoch": 2677} {"train_loss": -23.788536071777344, "global_step": 222195, "epoch": 2677} {"train_loss": -24.022680282592773, "global_step": 222196, "epoch": 2677} {"train_loss": -24.2823429107666, "global_step": 222197, "epoch": 2677} {"train_loss": -23.79791831970215, "global_step": 222198, "epoch": 2677} {"train_loss": -23.753520965576172, "global_step": 222199, "epoch": 2677} {"train_loss": -24.219850540161133, "global_step": 222200, "epoch": 2677} {"train_loss": -23.761764526367188, "global_step": 222201, "epoch": 2677} {"train_loss": -23.812875747680664, "global_step": 222202, "epoch": 2677} {"train_loss": -24.299184799194336, "global_step": 222203, "epoch": 2677} {"train_loss": -23.8584041595459, "global_step": 222204, "epoch": 2677} {"train_loss": -24.206436157226562, "global_step": 222205, "epoch": 2677} {"train_loss": -24.361173629760742, "global_step": 222206, "epoch": 2677} {"train_loss": -23.99040412902832, "global_step": 222207, "epoch": 2677} {"train_loss": -24.058786392211914, "global_step": 222208, "epoch": 2677} {"train_loss": -24.335474014282227, "global_step": 222209, "epoch": 2677} {"train_loss": -24.224441528320312, "global_step": 222210, "epoch": 2677} {"train_loss": -24.37746238708496, "global_step": 222211, "epoch": 2677} {"train_loss": -24.36734962463379, "global_step": 222212, "epoch": 2677} {"train_loss": -24.42609214782715, "global_step": 222213, "epoch": 2677} {"train_loss": -24.515485763549805, "global_step": 222214, "epoch": 2677} {"train_loss": -24.278440475463867, "global_step": 222215, "epoch": 2677} {"train_loss": -24.476829528808594, "global_step": 222216, "epoch": 2677} {"train_loss": -24.697406768798828, "global_step": 222217, "epoch": 2677} {"train_loss": -25.02718734741211, "global_step": 222218, "epoch": 2677} {"train_loss": -24.52033233642578, "global_step": 222219, "epoch": 2677} {"train_loss": -24.692874908447266, "global_step": 222220, "epoch": 2677} {"train_loss": -24.51404571533203, "global_step": 222221, "epoch": 2677} {"train_loss": -24.47517967224121, "global_step": 222222, "epoch": 2677} {"train_loss": -24.867063522338867, "global_step": 222223, "epoch": 2677} {"train_loss": -24.507190704345703, "global_step": 222224, "epoch": 2677} {"train_loss": -24.258630752563477, "global_step": 222225, "epoch": 2677} {"train_loss": -24.610624313354492, "global_step": 222226, "epoch": 2677} {"train_loss": -24.729597091674805, "global_step": 222227, "epoch": 2677} {"train_loss": -24.544086456298828, "global_step": 222228, "epoch": 2677} {"train_loss": -25.090076446533203, "global_step": 222229, "epoch": 2677} {"train_loss": -24.674150466918945, "global_step": 222230, "epoch": 2677} {"train_loss": -24.791969299316406, "global_step": 222231, "epoch": 2677} {"train_loss": -24.83768081665039, "global_step": 222232, "epoch": 2677} {"train_loss": -24.514448165893555, "global_step": 222233, "epoch": 2677} {"train_loss": -24.72864532470703, "global_step": 222234, "epoch": 2677} {"train_loss": -24.66132164001465, "global_step": 222235, "epoch": 2677} {"train_loss": -24.968341827392578, "global_step": 222236, "epoch": 2677} {"train_loss": -24.833213806152344, "global_step": 222237, "epoch": 2677} {"train_loss": -24.70327377319336, "global_step": 222238, "epoch": 2677} {"train_loss": -24.56981086730957, "global_step": 222239, "epoch": 2677} {"train_loss": -24.712331771850586, "global_step": 222240, "epoch": 2677} {"train_loss": -24.73735809326172, "global_step": 222241, "epoch": 2677} {"train_loss": -24.73213768005371, "global_step": 222242, "epoch": 2677} {"train_loss": -24.562671661376953, "global_step": 222243, "epoch": 2677} {"train_loss": -24.934995651245117, "global_step": 222244, "epoch": 2677} {"train_loss": -24.61824607849121, "global_step": 222245, "epoch": 2677} {"train_loss": -24.191999435424805, "global_step": 222246, "epoch": 2677} {"train_loss": -24.386945724487305, "global_step": 222247, "epoch": 2677} {"train_loss": -24.794464111328125, "global_step": 222248, "epoch": 2677} {"train_loss": -25.060773849487305, "global_step": 222249, "epoch": 2677} {"train_loss": -24.85127067565918, "global_step": 222250, "epoch": 2677} {"train_loss": -24.8646183013916, "global_step": 222251, "epoch": 2677} {"train_loss": -24.239774703979492, "global_step": 222252, "epoch": 2677} {"train_loss": -24.432764053344727, "global_step": 222253, "epoch": 2677} {"train_loss": -24.789939880371094, "global_step": 222254, "epoch": 2677} {"train_loss": -24.557432174682617, "global_step": 222255, "epoch": 2677} {"train_loss": -24.945886611938477, "global_step": 222256, "epoch": 2677} {"train_loss": -24.426044464111328, "global_step": 222257, "epoch": 2677} {"train_loss": -24.23895835876465, "global_step": 222258, "epoch": 2677} {"train_loss": -24.678564071655273, "global_step": 222259, "epoch": 2677} {"train_loss": -25.0654239654541, "global_step": 222260, "epoch": 2677} {"train_loss": -24.647924423217773, "global_step": 222261, "epoch": 2677} {"train_loss": -24.812711715698242, "global_step": 222262, "epoch": 2677} {"train_loss": -24.62046241760254, "global_step": 222263, "epoch": 2677} {"train_loss": -24.559003829956055, "global_step": 222264, "epoch": 2677} {"train_loss": -24.546308517456055, "global_step": 222265, "epoch": 2677} {"train_loss": -24.802183151245117, "global_step": 222266, "epoch": 2677} {"train_loss": -24.715559005737305, "global_step": 222267, "epoch": 2677} {"train_loss": -25.064538955688477, "global_step": 222268, "epoch": 2677} {"train_loss": -24.916248321533203, "global_step": 222269, "epoch": 2677} {"train_loss": -24.842655181884766, "global_step": 222270, "epoch": 2677} {"train_loss": -24.671350479125977, "global_step": 222271, "epoch": 2677} {"train_loss": -24.78571319580078, "global_step": 222272, "epoch": 2677} {"train_loss": -24.518923541149462, "global_step": 222273, "epoch": 2677, "val_loss": 6710863.0} {"train_loss": -23.57013511657715, "global_step": 222274, "epoch": 2678} {"train_loss": -22.06125259399414, "global_step": 222275, "epoch": 2678} {"train_loss": -21.646541595458984, "global_step": 222276, "epoch": 2678} {"train_loss": -24.066864013671875, "global_step": 222277, "epoch": 2678} {"train_loss": -22.634944915771484, "global_step": 222278, "epoch": 2678} {"train_loss": -23.081464767456055, "global_step": 222279, "epoch": 2678} {"train_loss": -23.64476203918457, "global_step": 222280, "epoch": 2678} {"train_loss": -23.406232833862305, "global_step": 222281, "epoch": 2678} {"train_loss": -24.01662826538086, "global_step": 222282, "epoch": 2678} {"train_loss": -23.550779342651367, "global_step": 222283, "epoch": 2678} {"train_loss": -23.980100631713867, "global_step": 222284, "epoch": 2678} {"train_loss": -23.715499877929688, "global_step": 222285, "epoch": 2678} {"train_loss": -24.178537368774414, "global_step": 222286, "epoch": 2678} {"train_loss": -23.9556941986084, "global_step": 222287, "epoch": 2678} {"train_loss": -24.1080379486084, "global_step": 222288, "epoch": 2678} {"train_loss": -23.993688583374023, "global_step": 222289, "epoch": 2678} {"train_loss": -24.22054672241211, "global_step": 222290, "epoch": 2678} {"train_loss": -24.277420043945312, "global_step": 222291, "epoch": 2678} {"train_loss": -24.328420639038086, "global_step": 222292, "epoch": 2678} {"train_loss": -24.10906410217285, "global_step": 222293, "epoch": 2678} {"train_loss": -23.843399047851562, "global_step": 222294, "epoch": 2678} {"train_loss": -23.94782829284668, "global_step": 222295, "epoch": 2678} {"train_loss": -23.93073844909668, "global_step": 222296, "epoch": 2678} {"train_loss": -24.0905818939209, "global_step": 222297, "epoch": 2678} {"train_loss": -24.46771240234375, "global_step": 222298, "epoch": 2678} {"train_loss": -24.337942123413086, "global_step": 222299, "epoch": 2678} {"train_loss": -24.299589157104492, "global_step": 222300, "epoch": 2678} {"train_loss": -24.22113037109375, "global_step": 222301, "epoch": 2678} {"train_loss": -24.539201736450195, "global_step": 222302, "epoch": 2678} {"train_loss": -24.019866943359375, "global_step": 222303, "epoch": 2678} {"train_loss": -24.478689193725586, "global_step": 222304, "epoch": 2678} {"train_loss": -24.38477897644043, "global_step": 222305, "epoch": 2678} {"train_loss": -24.600605010986328, "global_step": 222306, "epoch": 2678} {"train_loss": -24.72383689880371, "global_step": 222307, "epoch": 2678} {"train_loss": -24.413105010986328, "global_step": 222308, "epoch": 2678} {"train_loss": -24.771793365478516, "global_step": 222309, "epoch": 2678} {"train_loss": -24.763460159301758, "global_step": 222310, "epoch": 2678} {"train_loss": -24.373445510864258, "global_step": 222311, "epoch": 2678} {"train_loss": -24.478689193725586, "global_step": 222312, "epoch": 2678} {"train_loss": -24.52081871032715, "global_step": 222313, "epoch": 2678} {"train_loss": -24.54303741455078, "global_step": 222314, "epoch": 2678} {"train_loss": -24.679655075073242, "global_step": 222315, "epoch": 2678} {"train_loss": -24.785717010498047, "global_step": 222316, "epoch": 2678} {"train_loss": -24.40077018737793, "global_step": 222317, "epoch": 2678} {"train_loss": -24.570545196533203, "global_step": 222318, "epoch": 2678} {"train_loss": -24.691320419311523, "global_step": 222319, "epoch": 2678} {"train_loss": -24.694765090942383, "global_step": 222320, "epoch": 2678} {"train_loss": -24.490957260131836, "global_step": 222321, "epoch": 2678} {"train_loss": -24.590023040771484, "global_step": 222322, "epoch": 2678} {"train_loss": -24.700885772705078, "global_step": 222323, "epoch": 2678} {"train_loss": -24.98457908630371, "global_step": 222324, "epoch": 2678} {"train_loss": -24.883543014526367, "global_step": 222325, "epoch": 2678} {"train_loss": -24.81721305847168, "global_step": 222326, "epoch": 2678} {"train_loss": -24.658153533935547, "global_step": 222327, "epoch": 2678} {"train_loss": -24.519363403320312, "global_step": 222328, "epoch": 2678} {"train_loss": -24.88728141784668, "global_step": 222329, "epoch": 2678} {"train_loss": -24.85162925720215, "global_step": 222330, "epoch": 2678} {"train_loss": -24.88153076171875, "global_step": 222331, "epoch": 2678} {"train_loss": -24.748367309570312, "global_step": 222332, "epoch": 2678} {"train_loss": -24.663089752197266, "global_step": 222333, "epoch": 2678} {"train_loss": -24.813291549682617, "global_step": 222334, "epoch": 2678} {"train_loss": -24.783065795898438, "global_step": 222335, "epoch": 2678} {"train_loss": -24.94887351989746, "global_step": 222336, "epoch": 2678} {"train_loss": -24.376052856445312, "global_step": 222337, "epoch": 2678} {"train_loss": -24.709564208984375, "global_step": 222338, "epoch": 2678} {"train_loss": -25.369531631469727, "global_step": 222339, "epoch": 2678} {"train_loss": -24.573410034179688, "global_step": 222340, "epoch": 2678} {"train_loss": -24.807430267333984, "global_step": 222341, "epoch": 2678} {"train_loss": -24.388324737548828, "global_step": 222342, "epoch": 2678} {"train_loss": -24.992599487304688, "global_step": 222343, "epoch": 2678} {"train_loss": -24.718280792236328, "global_step": 222344, "epoch": 2678} {"train_loss": -24.47756004333496, "global_step": 222345, "epoch": 2678} {"train_loss": -24.711729049682617, "global_step": 222346, "epoch": 2678} {"train_loss": -24.697322845458984, "global_step": 222347, "epoch": 2678} {"train_loss": -24.63250732421875, "global_step": 222348, "epoch": 2678} {"train_loss": -24.413372039794922, "global_step": 222349, "epoch": 2678} {"train_loss": -24.622900009155273, "global_step": 222350, "epoch": 2678} {"train_loss": -24.604537963867188, "global_step": 222351, "epoch": 2678} {"train_loss": -24.713623046875, "global_step": 222352, "epoch": 2678} {"train_loss": -24.669822692871094, "global_step": 222353, "epoch": 2678} {"train_loss": -24.186120986938477, "global_step": 222354, "epoch": 2678} {"train_loss": -24.14558219909668, "global_step": 222355, "epoch": 2678} {"train_loss": -24.34224050590791, "global_step": 222356, "epoch": 2678, "val_loss": 6584274.0} {"train_loss": -23.94354820251465, "global_step": 222357, "epoch": 2679} {"train_loss": -23.542057037353516, "global_step": 222358, "epoch": 2679} {"train_loss": -24.163084030151367, "global_step": 222359, "epoch": 2679} {"train_loss": -23.959110260009766, "global_step": 222360, "epoch": 2679} {"train_loss": -24.213394165039062, "global_step": 222361, "epoch": 2679} {"train_loss": -24.261198043823242, "global_step": 222362, "epoch": 2679} {"train_loss": -24.237720489501953, "global_step": 222363, "epoch": 2679} {"train_loss": -23.847000122070312, "global_step": 222364, "epoch": 2679} {"train_loss": -24.418359756469727, "global_step": 222365, "epoch": 2679} {"train_loss": -23.995004653930664, "global_step": 222366, "epoch": 2679} {"train_loss": -24.261533737182617, "global_step": 222367, "epoch": 2679} {"train_loss": -24.13106346130371, "global_step": 222368, "epoch": 2679} {"train_loss": -24.212726593017578, "global_step": 222369, "epoch": 2679} {"train_loss": -24.59814453125, "global_step": 222370, "epoch": 2679} {"train_loss": -24.35080337524414, "global_step": 222371, "epoch": 2679} {"train_loss": -24.244985580444336, "global_step": 222372, "epoch": 2679} {"train_loss": -24.111774444580078, "global_step": 222373, "epoch": 2679} {"train_loss": -24.364965438842773, "global_step": 222374, "epoch": 2679} {"train_loss": -24.34247398376465, "global_step": 222375, "epoch": 2679} {"train_loss": -24.353239059448242, "global_step": 222376, "epoch": 2679} {"train_loss": -24.30029296875, "global_step": 222377, "epoch": 2679} {"train_loss": -24.668670654296875, "global_step": 222378, "epoch": 2679} {"train_loss": -24.12470054626465, "global_step": 222379, "epoch": 2679} {"train_loss": -24.561046600341797, "global_step": 222380, "epoch": 2679} {"train_loss": -24.47139549255371, "global_step": 222381, "epoch": 2679} {"train_loss": -24.719552993774414, "global_step": 222382, "epoch": 2679} {"train_loss": -24.724374771118164, "global_step": 222383, "epoch": 2679} {"train_loss": -24.09901237487793, "global_step": 222384, "epoch": 2679} {"train_loss": -24.489898681640625, "global_step": 222385, "epoch": 2679} {"train_loss": -24.67510414123535, "global_step": 222386, "epoch": 2679} {"train_loss": -24.620027542114258, "global_step": 222387, "epoch": 2679} {"train_loss": -24.379520416259766, "global_step": 222388, "epoch": 2679} {"train_loss": -24.14158058166504, "global_step": 222389, "epoch": 2679} {"train_loss": -24.711048126220703, "global_step": 222390, "epoch": 2679} {"train_loss": -24.677412033081055, "global_step": 222391, "epoch": 2679} {"train_loss": -25.013996124267578, "global_step": 222392, "epoch": 2679} {"train_loss": -24.67067527770996, "global_step": 222393, "epoch": 2679} {"train_loss": -24.566129684448242, "global_step": 222394, "epoch": 2679} {"train_loss": -24.42634391784668, "global_step": 222395, "epoch": 2679} {"train_loss": -25.026979446411133, "global_step": 222396, "epoch": 2679} {"train_loss": -24.62208366394043, "global_step": 222397, "epoch": 2679} {"train_loss": -24.727087020874023, "global_step": 222398, "epoch": 2679} {"train_loss": -24.712003707885742, "global_step": 222399, "epoch": 2679} {"train_loss": -25.123559951782227, "global_step": 222400, "epoch": 2679} {"train_loss": -24.937734603881836, "global_step": 222401, "epoch": 2679} {"train_loss": -24.742937088012695, "global_step": 222402, "epoch": 2679} {"train_loss": -24.632469177246094, "global_step": 222403, "epoch": 2679} {"train_loss": -25.086811065673828, "global_step": 222404, "epoch": 2679} {"train_loss": -24.869577407836914, "global_step": 222405, "epoch": 2679} {"train_loss": -24.861209869384766, "global_step": 222406, "epoch": 2679} {"train_loss": -24.448753356933594, "global_step": 222407, "epoch": 2679} {"train_loss": -24.689167022705078, "global_step": 222408, "epoch": 2679} {"train_loss": -24.72420310974121, "global_step": 222409, "epoch": 2679} {"train_loss": -24.909757614135742, "global_step": 222410, "epoch": 2679} {"train_loss": -24.751968383789062, "global_step": 222411, "epoch": 2679} {"train_loss": -24.70279312133789, "global_step": 222412, "epoch": 2679} {"train_loss": -24.57508087158203, "global_step": 222413, "epoch": 2679} {"train_loss": -24.888418197631836, "global_step": 222414, "epoch": 2679} {"train_loss": -24.334794998168945, "global_step": 222415, "epoch": 2679} {"train_loss": -24.79402732849121, "global_step": 222416, "epoch": 2679} {"train_loss": -24.698650360107422, "global_step": 222417, "epoch": 2679} {"train_loss": -24.61501121520996, "global_step": 222418, "epoch": 2679} {"train_loss": -24.3907470703125, "global_step": 222419, "epoch": 2679} {"train_loss": -24.618005752563477, "global_step": 222420, "epoch": 2679} {"train_loss": -24.793964385986328, "global_step": 222421, "epoch": 2679} {"train_loss": -24.747478485107422, "global_step": 222422, "epoch": 2679} {"train_loss": -24.864927291870117, "global_step": 222423, "epoch": 2679} {"train_loss": -24.592866897583008, "global_step": 222424, "epoch": 2679} {"train_loss": -24.98582649230957, "global_step": 222425, "epoch": 2679} {"train_loss": -24.52130699157715, "global_step": 222426, "epoch": 2679} {"train_loss": -24.701101303100586, "global_step": 222427, "epoch": 2679} {"train_loss": -24.587430953979492, "global_step": 222428, "epoch": 2679} {"train_loss": -24.572391510009766, "global_step": 222429, "epoch": 2679} {"train_loss": -24.512826919555664, "global_step": 222430, "epoch": 2679} {"train_loss": -24.63465690612793, "global_step": 222431, "epoch": 2679} {"train_loss": -24.72027015686035, "global_step": 222432, "epoch": 2679} {"train_loss": -24.41311264038086, "global_step": 222433, "epoch": 2679} {"train_loss": -24.60074806213379, "global_step": 222434, "epoch": 2679} {"train_loss": -24.70977210998535, "global_step": 222435, "epoch": 2679} {"train_loss": -24.712570190429688, "global_step": 222436, "epoch": 2679} {"train_loss": -24.737333297729492, "global_step": 222437, "epoch": 2679} {"train_loss": -24.46728515625, "global_step": 222438, "epoch": 2679} {"train_loss": -24.550753306193524, "global_step": 222439, "epoch": 2679, "val_loss": 6667349.5} {"train_loss": -24.31429100036621, "global_step": 222440, "epoch": 2680} {"train_loss": -24.123258590698242, "global_step": 222441, "epoch": 2680} {"train_loss": -24.50433349609375, "global_step": 222442, "epoch": 2680} {"train_loss": -24.201313018798828, "global_step": 222443, "epoch": 2680} {"train_loss": -24.252140045166016, "global_step": 222444, "epoch": 2680} {"train_loss": -24.059221267700195, "global_step": 222445, "epoch": 2680} {"train_loss": -24.345552444458008, "global_step": 222446, "epoch": 2680} {"train_loss": -24.54364776611328, "global_step": 222447, "epoch": 2680} {"train_loss": -24.34157371520996, "global_step": 222448, "epoch": 2680} {"train_loss": -24.424243927001953, "global_step": 222449, "epoch": 2680} {"train_loss": -24.72574234008789, "global_step": 222450, "epoch": 2680} {"train_loss": -24.425704956054688, "global_step": 222451, "epoch": 2680} {"train_loss": -23.917394638061523, "global_step": 222452, "epoch": 2680} {"train_loss": -24.598371505737305, "global_step": 222453, "epoch": 2680} {"train_loss": -24.039752960205078, "global_step": 222454, "epoch": 2680} {"train_loss": -24.40459442138672, "global_step": 222455, "epoch": 2680} {"train_loss": -24.211570739746094, "global_step": 222456, "epoch": 2680} {"train_loss": -23.96122169494629, "global_step": 222457, "epoch": 2680} {"train_loss": -24.472410202026367, "global_step": 222458, "epoch": 2680} {"train_loss": -24.03191566467285, "global_step": 222459, "epoch": 2680} {"train_loss": -24.61564064025879, "global_step": 222460, "epoch": 2680} {"train_loss": -24.709157943725586, "global_step": 222461, "epoch": 2680} {"train_loss": -24.519254684448242, "global_step": 222462, "epoch": 2680} {"train_loss": -24.537044525146484, "global_step": 222463, "epoch": 2680} {"train_loss": -24.547460556030273, "global_step": 222464, "epoch": 2680} {"train_loss": -24.245254516601562, "global_step": 222465, "epoch": 2680} {"train_loss": -24.396718978881836, "global_step": 222466, "epoch": 2680} {"train_loss": -24.012235641479492, "global_step": 222467, "epoch": 2680} {"train_loss": -24.6467342376709, "global_step": 222468, "epoch": 2680} {"train_loss": -24.451047897338867, "global_step": 222469, "epoch": 2680} {"train_loss": -24.285110473632812, "global_step": 222470, "epoch": 2680} {"train_loss": -24.665491104125977, "global_step": 222471, "epoch": 2680} {"train_loss": -24.912891387939453, "global_step": 222472, "epoch": 2680} {"train_loss": -24.73665428161621, "global_step": 222473, "epoch": 2680} {"train_loss": -24.82161521911621, "global_step": 222474, "epoch": 2680} {"train_loss": -24.69838523864746, "global_step": 222475, "epoch": 2680} {"train_loss": -24.700260162353516, "global_step": 222476, "epoch": 2680} {"train_loss": -24.66409683227539, "global_step": 222477, "epoch": 2680} {"train_loss": -24.823461532592773, "global_step": 222478, "epoch": 2680} {"train_loss": -24.83977699279785, "global_step": 222479, "epoch": 2680} {"train_loss": -24.719335556030273, "global_step": 222480, "epoch": 2680} {"train_loss": -24.543506622314453, "global_step": 222481, "epoch": 2680} {"train_loss": -24.7340087890625, "global_step": 222482, "epoch": 2680} {"train_loss": -24.66037368774414, "global_step": 222483, "epoch": 2680} {"train_loss": -24.5237979888916, "global_step": 222484, "epoch": 2680} {"train_loss": -24.47905921936035, "global_step": 222485, "epoch": 2680} {"train_loss": -24.597030639648438, "global_step": 222486, "epoch": 2680} {"train_loss": -24.57610511779785, "global_step": 222487, "epoch": 2680} {"train_loss": -24.94529151916504, "global_step": 222488, "epoch": 2680} {"train_loss": -24.657405853271484, "global_step": 222489, "epoch": 2680} {"train_loss": -24.59005355834961, "global_step": 222490, "epoch": 2680} {"train_loss": -24.74788475036621, "global_step": 222491, "epoch": 2680} {"train_loss": -24.61960220336914, "global_step": 222492, "epoch": 2680} {"train_loss": -24.418537139892578, "global_step": 222493, "epoch": 2680} {"train_loss": -24.944534301757812, "global_step": 222494, "epoch": 2680} {"train_loss": -24.84651756286621, "global_step": 222495, "epoch": 2680} {"train_loss": -24.59461784362793, "global_step": 222496, "epoch": 2680} {"train_loss": -24.88535499572754, "global_step": 222497, "epoch": 2680} {"train_loss": -24.669090270996094, "global_step": 222498, "epoch": 2680} {"train_loss": -24.644620895385742, "global_step": 222499, "epoch": 2680} {"train_loss": -24.275400161743164, "global_step": 222500, "epoch": 2680} {"train_loss": -24.26837730407715, "global_step": 222501, "epoch": 2680} {"train_loss": -24.503662109375, "global_step": 222502, "epoch": 2680} {"train_loss": -24.878690719604492, "global_step": 222503, "epoch": 2680} {"train_loss": -24.664396286010742, "global_step": 222504, "epoch": 2680} {"train_loss": -24.80573081970215, "global_step": 222505, "epoch": 2680} {"train_loss": -24.325687408447266, "global_step": 222506, "epoch": 2680} {"train_loss": -24.466760635375977, "global_step": 222507, "epoch": 2680} {"train_loss": -24.348180770874023, "global_step": 222508, "epoch": 2680} {"train_loss": -24.612333297729492, "global_step": 222509, "epoch": 2680} {"train_loss": -24.648374557495117, "global_step": 222510, "epoch": 2680} {"train_loss": -24.749343872070312, "global_step": 222511, "epoch": 2680} {"train_loss": -24.369937896728516, "global_step": 222512, "epoch": 2680} {"train_loss": -24.784072875976562, "global_step": 222513, "epoch": 2680} {"train_loss": -24.67963218688965, "global_step": 222514, "epoch": 2680} {"train_loss": -24.932668685913086, "global_step": 222515, "epoch": 2680} {"train_loss": -24.601072311401367, "global_step": 222516, "epoch": 2680} {"train_loss": -24.897031784057617, "global_step": 222517, "epoch": 2680} {"train_loss": -24.681791305541992, "global_step": 222518, "epoch": 2680} {"train_loss": -24.29878044128418, "global_step": 222519, "epoch": 2680} {"train_loss": -24.861684799194336, "global_step": 222520, "epoch": 2680} {"train_loss": -24.637983322143555, "global_step": 222521, "epoch": 2680} {"train_loss": -24.542674489768153, "global_step": 222522, "epoch": 2680, "val_loss": 6680741.0} {"train_loss": -24.057159423828125, "global_step": 222523, "epoch": 2681} {"train_loss": -24.43242835998535, "global_step": 222524, "epoch": 2681} {"train_loss": -23.9971866607666, "global_step": 222525, "epoch": 2681} {"train_loss": -24.42867088317871, "global_step": 222526, "epoch": 2681} {"train_loss": -24.244993209838867, "global_step": 222527, "epoch": 2681} {"train_loss": -24.491107940673828, "global_step": 222528, "epoch": 2681} {"train_loss": -24.45230484008789, "global_step": 222529, "epoch": 2681} {"train_loss": -24.74062156677246, "global_step": 222530, "epoch": 2681} {"train_loss": -24.44466209411621, "global_step": 222531, "epoch": 2681} {"train_loss": -24.51688575744629, "global_step": 222532, "epoch": 2681} {"train_loss": -24.3955078125, "global_step": 222533, "epoch": 2681} {"train_loss": -23.99924087524414, "global_step": 222534, "epoch": 2681} {"train_loss": -24.488691329956055, "global_step": 222535, "epoch": 2681} {"train_loss": -24.80903434753418, "global_step": 222536, "epoch": 2681} {"train_loss": -24.767410278320312, "global_step": 222537, "epoch": 2681} {"train_loss": -24.62847328186035, "global_step": 222538, "epoch": 2681} {"train_loss": -24.332799911499023, "global_step": 222539, "epoch": 2681} {"train_loss": -24.61972999572754, "global_step": 222540, "epoch": 2681} {"train_loss": -24.623838424682617, "global_step": 222541, "epoch": 2681} {"train_loss": -24.83941650390625, "global_step": 222542, "epoch": 2681} {"train_loss": -24.573301315307617, "global_step": 222543, "epoch": 2681} {"train_loss": -24.743488311767578, "global_step": 222544, "epoch": 2681} {"train_loss": -24.541444778442383, "global_step": 222545, "epoch": 2681} {"train_loss": -24.87139892578125, "global_step": 222546, "epoch": 2681} {"train_loss": -24.553695678710938, "global_step": 222547, "epoch": 2681} {"train_loss": -24.706174850463867, "global_step": 222548, "epoch": 2681} {"train_loss": -24.84242820739746, "global_step": 222549, "epoch": 2681} {"train_loss": -24.561262130737305, "global_step": 222550, "epoch": 2681} {"train_loss": -25.123191833496094, "global_step": 222551, "epoch": 2681} {"train_loss": -24.834186553955078, "global_step": 222552, "epoch": 2681} {"train_loss": -24.76169776916504, "global_step": 222553, "epoch": 2681} {"train_loss": -25.064531326293945, "global_step": 222554, "epoch": 2681} {"train_loss": -24.95969581604004, "global_step": 222555, "epoch": 2681} {"train_loss": -24.564481735229492, "global_step": 222556, "epoch": 2681} {"train_loss": -24.813522338867188, "global_step": 222557, "epoch": 2681} {"train_loss": -24.905611038208008, "global_step": 222558, "epoch": 2681} {"train_loss": -24.54998207092285, "global_step": 222559, "epoch": 2681} {"train_loss": -24.712942123413086, "global_step": 222560, "epoch": 2681} {"train_loss": -24.719650268554688, "global_step": 222561, "epoch": 2681} {"train_loss": -24.365020751953125, "global_step": 222562, "epoch": 2681} {"train_loss": -24.537553787231445, "global_step": 222563, "epoch": 2681} {"train_loss": -24.7259578704834, "global_step": 222564, "epoch": 2681} {"train_loss": -24.739715576171875, "global_step": 222565, "epoch": 2681} {"train_loss": -24.901927947998047, "global_step": 222566, "epoch": 2681} {"train_loss": -24.890140533447266, "global_step": 222567, "epoch": 2681} {"train_loss": -24.661317825317383, "global_step": 222568, "epoch": 2681} {"train_loss": -24.84907341003418, "global_step": 222569, "epoch": 2681} {"train_loss": -24.76951789855957, "global_step": 222570, "epoch": 2681} {"train_loss": -24.78689956665039, "global_step": 222571, "epoch": 2681} {"train_loss": -24.802717208862305, "global_step": 222572, "epoch": 2681} {"train_loss": -24.617748260498047, "global_step": 222573, "epoch": 2681} {"train_loss": -24.450498580932617, "global_step": 222574, "epoch": 2681} {"train_loss": -24.51820182800293, "global_step": 222575, "epoch": 2681} {"train_loss": -24.73711585998535, "global_step": 222576, "epoch": 2681} {"train_loss": -24.493545532226562, "global_step": 222577, "epoch": 2681} {"train_loss": -24.8038330078125, "global_step": 222578, "epoch": 2681} {"train_loss": -24.609601974487305, "global_step": 222579, "epoch": 2681} {"train_loss": -24.874393463134766, "global_step": 222580, "epoch": 2681} {"train_loss": -24.85795783996582, "global_step": 222581, "epoch": 2681} {"train_loss": -24.85222816467285, "global_step": 222582, "epoch": 2681} {"train_loss": -24.387012481689453, "global_step": 222583, "epoch": 2681} {"train_loss": -24.897537231445312, "global_step": 222584, "epoch": 2681} {"train_loss": -24.227554321289062, "global_step": 222585, "epoch": 2681} {"train_loss": -24.857315063476562, "global_step": 222586, "epoch": 2681} {"train_loss": -24.698347091674805, "global_step": 222587, "epoch": 2681} {"train_loss": -24.64237403869629, "global_step": 222588, "epoch": 2681} {"train_loss": -24.61920928955078, "global_step": 222589, "epoch": 2681} {"train_loss": -24.39385414123535, "global_step": 222590, "epoch": 2681} {"train_loss": -24.741455078125, "global_step": 222591, "epoch": 2681} {"train_loss": -24.712366104125977, "global_step": 222592, "epoch": 2681} {"train_loss": -24.776365280151367, "global_step": 222593, "epoch": 2681} {"train_loss": -24.787668228149414, "global_step": 222594, "epoch": 2681} {"train_loss": -24.706905364990234, "global_step": 222595, "epoch": 2681} {"train_loss": -24.81931495666504, "global_step": 222596, "epoch": 2681} {"train_loss": -24.60448455810547, "global_step": 222597, "epoch": 2681} {"train_loss": -24.7051944732666, "global_step": 222598, "epoch": 2681} {"train_loss": -24.923131942749023, "global_step": 222599, "epoch": 2681} {"train_loss": -24.68712043762207, "global_step": 222600, "epoch": 2681} {"train_loss": -24.996641159057617, "global_step": 222601, "epoch": 2681} {"train_loss": -24.379165649414062, "global_step": 222602, "epoch": 2681} {"train_loss": -24.489377975463867, "global_step": 222603, "epoch": 2681} {"train_loss": -24.46369743347168, "global_step": 222604, "epoch": 2681} {"train_loss": -24.65486698840038, "global_step": 222605, "epoch": 2681, "val_loss": 6686896.0} {"train_loss": -23.99567413330078, "global_step": 222606, "epoch": 2682} {"train_loss": -24.329439163208008, "global_step": 222607, "epoch": 2682} {"train_loss": -24.52228546142578, "global_step": 222608, "epoch": 2682} {"train_loss": -23.4973201751709, "global_step": 222609, "epoch": 2682} {"train_loss": -24.122896194458008, "global_step": 222610, "epoch": 2682} {"train_loss": -24.033451080322266, "global_step": 222611, "epoch": 2682} {"train_loss": -23.822830200195312, "global_step": 222612, "epoch": 2682} {"train_loss": -24.00692367553711, "global_step": 222613, "epoch": 2682} {"train_loss": -23.72098731994629, "global_step": 222614, "epoch": 2682} {"train_loss": -23.913419723510742, "global_step": 222615, "epoch": 2682} {"train_loss": -23.87148094177246, "global_step": 222616, "epoch": 2682} {"train_loss": -23.767961502075195, "global_step": 222617, "epoch": 2682} {"train_loss": -24.510818481445312, "global_step": 222618, "epoch": 2682} {"train_loss": -23.97763442993164, "global_step": 222619, "epoch": 2682} {"train_loss": -24.265295028686523, "global_step": 222620, "epoch": 2682} {"train_loss": -24.051864624023438, "global_step": 222621, "epoch": 2682} {"train_loss": -24.40865135192871, "global_step": 222622, "epoch": 2682} {"train_loss": -24.194364547729492, "global_step": 222623, "epoch": 2682} {"train_loss": -24.03716468811035, "global_step": 222624, "epoch": 2682} {"train_loss": -24.508991241455078, "global_step": 222625, "epoch": 2682} {"train_loss": -24.34082794189453, "global_step": 222626, "epoch": 2682} {"train_loss": -24.550186157226562, "global_step": 222627, "epoch": 2682} {"train_loss": -24.54035186767578, "global_step": 222628, "epoch": 2682} {"train_loss": -25.022136688232422, "global_step": 222629, "epoch": 2682} {"train_loss": -24.50136375427246, "global_step": 222630, "epoch": 2682} {"train_loss": -24.63411521911621, "global_step": 222631, "epoch": 2682} {"train_loss": -24.186016082763672, "global_step": 222632, "epoch": 2682} {"train_loss": -24.643962860107422, "global_step": 222633, "epoch": 2682} {"train_loss": -24.54435920715332, "global_step": 222634, "epoch": 2682} {"train_loss": -24.54730224609375, "global_step": 222635, "epoch": 2682} {"train_loss": -24.295745849609375, "global_step": 222636, "epoch": 2682} {"train_loss": -24.459806442260742, "global_step": 222637, "epoch": 2682} {"train_loss": -24.457170486450195, "global_step": 222638, "epoch": 2682} {"train_loss": -24.7673282623291, "global_step": 222639, "epoch": 2682} {"train_loss": -24.355405807495117, "global_step": 222640, "epoch": 2682} {"train_loss": -24.549474716186523, "global_step": 222641, "epoch": 2682} {"train_loss": -24.19308853149414, "global_step": 222642, "epoch": 2682} {"train_loss": -24.531579971313477, "global_step": 222643, "epoch": 2682} {"train_loss": -24.627750396728516, "global_step": 222644, "epoch": 2682} {"train_loss": -24.443012237548828, "global_step": 222645, "epoch": 2682} {"train_loss": -24.420669555664062, "global_step": 222646, "epoch": 2682} {"train_loss": -24.496679306030273, "global_step": 222647, "epoch": 2682} {"train_loss": -24.606225967407227, "global_step": 222648, "epoch": 2682} {"train_loss": -24.8099422454834, "global_step": 222649, "epoch": 2682} {"train_loss": -24.795019149780273, "global_step": 222650, "epoch": 2682} {"train_loss": -24.82469367980957, "global_step": 222651, "epoch": 2682} {"train_loss": -24.680761337280273, "global_step": 222652, "epoch": 2682} {"train_loss": -24.724924087524414, "global_step": 222653, "epoch": 2682} {"train_loss": -24.55647850036621, "global_step": 222654, "epoch": 2682} {"train_loss": -24.383275985717773, "global_step": 222655, "epoch": 2682} {"train_loss": -24.565855026245117, "global_step": 222656, "epoch": 2682} {"train_loss": -24.628639221191406, "global_step": 222657, "epoch": 2682} {"train_loss": -24.525192260742188, "global_step": 222658, "epoch": 2682} {"train_loss": -24.7252197265625, "global_step": 222659, "epoch": 2682} {"train_loss": -24.666921615600586, "global_step": 222660, "epoch": 2682} {"train_loss": -24.329151153564453, "global_step": 222661, "epoch": 2682} {"train_loss": -24.837005615234375, "global_step": 222662, "epoch": 2682} {"train_loss": -24.5599422454834, "global_step": 222663, "epoch": 2682} {"train_loss": -24.899839401245117, "global_step": 222664, "epoch": 2682} {"train_loss": -24.406064987182617, "global_step": 222665, "epoch": 2682} {"train_loss": -24.762475967407227, "global_step": 222666, "epoch": 2682} {"train_loss": -24.884885787963867, "global_step": 222667, "epoch": 2682} {"train_loss": -24.734546661376953, "global_step": 222668, "epoch": 2682} {"train_loss": -24.467639923095703, "global_step": 222669, "epoch": 2682} {"train_loss": -24.78311538696289, "global_step": 222670, "epoch": 2682} {"train_loss": -24.644506454467773, "global_step": 222671, "epoch": 2682} {"train_loss": -24.628307342529297, "global_step": 222672, "epoch": 2682} {"train_loss": -24.730093002319336, "global_step": 222673, "epoch": 2682} {"train_loss": -24.88431167602539, "global_step": 222674, "epoch": 2682} {"train_loss": -24.286108016967773, "global_step": 222675, "epoch": 2682} {"train_loss": -24.68782615661621, "global_step": 222676, "epoch": 2682} {"train_loss": -24.701648712158203, "global_step": 222677, "epoch": 2682} {"train_loss": -24.904010772705078, "global_step": 222678, "epoch": 2682} {"train_loss": -25.01667594909668, "global_step": 222679, "epoch": 2682} {"train_loss": -25.01283836364746, "global_step": 222680, "epoch": 2682} {"train_loss": -24.821447372436523, "global_step": 222681, "epoch": 2682} {"train_loss": -24.455825805664062, "global_step": 222682, "epoch": 2682} {"train_loss": -24.62229347229004, "global_step": 222683, "epoch": 2682} {"train_loss": -24.636938095092773, "global_step": 222684, "epoch": 2682} {"train_loss": -24.652292251586914, "global_step": 222685, "epoch": 2682} {"train_loss": -24.325876235961914, "global_step": 222686, "epoch": 2682} {"train_loss": -24.17377281188965, "global_step": 222687, "epoch": 2682} {"train_loss": -24.46505413285221, "global_step": 222688, "epoch": 2682, "val_loss": 6726714.5} {"train_loss": -24.21196937561035, "global_step": 222689, "epoch": 2683} {"train_loss": -23.28548240661621, "global_step": 222690, "epoch": 2683} {"train_loss": -22.812225341796875, "global_step": 222691, "epoch": 2683} {"train_loss": -23.400407791137695, "global_step": 222692, "epoch": 2683} {"train_loss": -23.579891204833984, "global_step": 222693, "epoch": 2683} {"train_loss": -23.702768325805664, "global_step": 222694, "epoch": 2683} {"train_loss": -23.763273239135742, "global_step": 222695, "epoch": 2683} {"train_loss": -23.602216720581055, "global_step": 222696, "epoch": 2683} {"train_loss": -23.887094497680664, "global_step": 222697, "epoch": 2683} {"train_loss": -23.59847068786621, "global_step": 222698, "epoch": 2683} {"train_loss": -24.19110679626465, "global_step": 222699, "epoch": 2683} {"train_loss": -24.30276870727539, "global_step": 222700, "epoch": 2683} {"train_loss": -23.948148727416992, "global_step": 222701, "epoch": 2683} {"train_loss": -24.132320404052734, "global_step": 222702, "epoch": 2683} {"train_loss": -24.343795776367188, "global_step": 222703, "epoch": 2683} {"train_loss": -24.117813110351562, "global_step": 222704, "epoch": 2683} {"train_loss": -24.511838912963867, "global_step": 222705, "epoch": 2683} {"train_loss": -24.38276481628418, "global_step": 222706, "epoch": 2683} {"train_loss": -23.930044174194336, "global_step": 222707, "epoch": 2683} {"train_loss": -24.206485748291016, "global_step": 222708, "epoch": 2683} {"train_loss": -24.454862594604492, "global_step": 222709, "epoch": 2683} {"train_loss": -24.22163963317871, "global_step": 222710, "epoch": 2683} {"train_loss": -24.446226119995117, "global_step": 222711, "epoch": 2683} {"train_loss": -24.385053634643555, "global_step": 222712, "epoch": 2683} {"train_loss": -24.31643295288086, "global_step": 222713, "epoch": 2683} {"train_loss": -24.082239151000977, "global_step": 222714, "epoch": 2683} {"train_loss": -24.689119338989258, "global_step": 222715, "epoch": 2683} {"train_loss": -24.221799850463867, "global_step": 222716, "epoch": 2683} {"train_loss": -24.483163833618164, "global_step": 222717, "epoch": 2683} {"train_loss": -24.150188446044922, "global_step": 222718, "epoch": 2683} {"train_loss": -24.4204158782959, "global_step": 222719, "epoch": 2683} {"train_loss": -24.66798973083496, "global_step": 222720, "epoch": 2683} {"train_loss": -24.610788345336914, "global_step": 222721, "epoch": 2683} {"train_loss": -24.65907859802246, "global_step": 222722, "epoch": 2683} {"train_loss": -24.622785568237305, "global_step": 222723, "epoch": 2683} {"train_loss": -24.5159969329834, "global_step": 222724, "epoch": 2683} {"train_loss": -24.555341720581055, "global_step": 222725, "epoch": 2683} {"train_loss": -24.66387367248535, "global_step": 222726, "epoch": 2683} {"train_loss": -24.43052101135254, "global_step": 222727, "epoch": 2683} {"train_loss": -24.48749351501465, "global_step": 222728, "epoch": 2683} {"train_loss": -24.467498779296875, "global_step": 222729, "epoch": 2683} {"train_loss": -24.500137329101562, "global_step": 222730, "epoch": 2683} {"train_loss": -24.65630531311035, "global_step": 222731, "epoch": 2683} {"train_loss": -24.305707931518555, "global_step": 222732, "epoch": 2683} {"train_loss": -24.38313102722168, "global_step": 222733, "epoch": 2683} {"train_loss": -24.85297393798828, "global_step": 222734, "epoch": 2683} {"train_loss": -24.483951568603516, "global_step": 222735, "epoch": 2683} {"train_loss": -24.563488006591797, "global_step": 222736, "epoch": 2683} {"train_loss": -24.702529907226562, "global_step": 222737, "epoch": 2683} {"train_loss": -24.521591186523438, "global_step": 222738, "epoch": 2683} {"train_loss": -24.56741714477539, "global_step": 222739, "epoch": 2683} {"train_loss": -24.909517288208008, "global_step": 222740, "epoch": 2683} {"train_loss": -24.839200973510742, "global_step": 222741, "epoch": 2683} {"train_loss": -25.038532257080078, "global_step": 222742, "epoch": 2683} {"train_loss": -24.82161521911621, "global_step": 222743, "epoch": 2683} {"train_loss": -24.861448287963867, "global_step": 222744, "epoch": 2683} {"train_loss": -24.40298843383789, "global_step": 222745, "epoch": 2683} {"train_loss": -24.89069366455078, "global_step": 222746, "epoch": 2683} {"train_loss": -24.72344398498535, "global_step": 222747, "epoch": 2683} {"train_loss": -24.50922203063965, "global_step": 222748, "epoch": 2683} {"train_loss": -24.060667037963867, "global_step": 222749, "epoch": 2683} {"train_loss": -24.70845603942871, "global_step": 222750, "epoch": 2683} {"train_loss": -24.52289581298828, "global_step": 222751, "epoch": 2683} {"train_loss": -24.7382869720459, "global_step": 222752, "epoch": 2683} {"train_loss": -24.279367446899414, "global_step": 222753, "epoch": 2683} {"train_loss": -24.289369583129883, "global_step": 222754, "epoch": 2683} {"train_loss": -24.664886474609375, "global_step": 222755, "epoch": 2683} {"train_loss": -24.64877700805664, "global_step": 222756, "epoch": 2683} {"train_loss": -24.592679977416992, "global_step": 222757, "epoch": 2683} {"train_loss": -24.627471923828125, "global_step": 222758, "epoch": 2683} {"train_loss": -24.621929168701172, "global_step": 222759, "epoch": 2683} {"train_loss": -24.85694694519043, "global_step": 222760, "epoch": 2683} {"train_loss": -24.900970458984375, "global_step": 222761, "epoch": 2683} {"train_loss": -24.681787490844727, "global_step": 222762, "epoch": 2683} {"train_loss": -24.992704391479492, "global_step": 222763, "epoch": 2683} {"train_loss": -24.631513595581055, "global_step": 222764, "epoch": 2683} {"train_loss": -24.444583892822266, "global_step": 222765, "epoch": 2683} {"train_loss": -24.60952377319336, "global_step": 222766, "epoch": 2683} {"train_loss": -24.918426513671875, "global_step": 222767, "epoch": 2683} {"train_loss": -24.72669792175293, "global_step": 222768, "epoch": 2683} {"train_loss": -24.780771255493164, "global_step": 222769, "epoch": 2683} {"train_loss": -24.74060821533203, "global_step": 222770, "epoch": 2683} {"train_loss": -24.409800104348058, "global_step": 222771, "epoch": 2683, "val_loss": 6632324.5} {"train_loss": -24.325828552246094, "global_step": 222772, "epoch": 2684} {"train_loss": -24.266416549682617, "global_step": 222773, "epoch": 2684} {"train_loss": -24.062955856323242, "global_step": 222774, "epoch": 2684} {"train_loss": -24.40021324157715, "global_step": 222775, "epoch": 2684} {"train_loss": -24.226736068725586, "global_step": 222776, "epoch": 2684} {"train_loss": -24.614215850830078, "global_step": 222777, "epoch": 2684} {"train_loss": -24.478137969970703, "global_step": 222778, "epoch": 2684} {"train_loss": -24.39670753479004, "global_step": 222779, "epoch": 2684} {"train_loss": -24.38152503967285, "global_step": 222780, "epoch": 2684} {"train_loss": -24.41648292541504, "global_step": 222781, "epoch": 2684} {"train_loss": -24.484506607055664, "global_step": 222782, "epoch": 2684} {"train_loss": -24.079952239990234, "global_step": 222783, "epoch": 2684} {"train_loss": -24.040212631225586, "global_step": 222784, "epoch": 2684} {"train_loss": -24.49896812438965, "global_step": 222785, "epoch": 2684} {"train_loss": -24.683244705200195, "global_step": 222786, "epoch": 2684} {"train_loss": -24.37868881225586, "global_step": 222787, "epoch": 2684} {"train_loss": -24.806381225585938, "global_step": 222788, "epoch": 2684} {"train_loss": -24.30939292907715, "global_step": 222789, "epoch": 2684} {"train_loss": -24.4221248626709, "global_step": 222790, "epoch": 2684} {"train_loss": -24.580551147460938, "global_step": 222791, "epoch": 2684} {"train_loss": -24.032644271850586, "global_step": 222792, "epoch": 2684} {"train_loss": -24.572311401367188, "global_step": 222793, "epoch": 2684} {"train_loss": -24.56146812438965, "global_step": 222794, "epoch": 2684} {"train_loss": -24.393888473510742, "global_step": 222795, "epoch": 2684} {"train_loss": -24.5683536529541, "global_step": 222796, "epoch": 2684} {"train_loss": -24.703567504882812, "global_step": 222797, "epoch": 2684} {"train_loss": -24.438438415527344, "global_step": 222798, "epoch": 2684} {"train_loss": -24.58669090270996, "global_step": 222799, "epoch": 2684} {"train_loss": -24.703969955444336, "global_step": 222800, "epoch": 2684} {"train_loss": -24.78169059753418, "global_step": 222801, "epoch": 2684} {"train_loss": -24.72063636779785, "global_step": 222802, "epoch": 2684} {"train_loss": -24.98253059387207, "global_step": 222803, "epoch": 2684} {"train_loss": -24.787708282470703, "global_step": 222804, "epoch": 2684} {"train_loss": -24.6656551361084, "global_step": 222805, "epoch": 2684} {"train_loss": -25.109825134277344, "global_step": 222806, "epoch": 2684} {"train_loss": -24.2348575592041, "global_step": 222807, "epoch": 2684} {"train_loss": -24.985204696655273, "global_step": 222808, "epoch": 2684} {"train_loss": -24.562408447265625, "global_step": 222809, "epoch": 2684} {"train_loss": -24.526050567626953, "global_step": 222810, "epoch": 2684} {"train_loss": -24.52094078063965, "global_step": 222811, "epoch": 2684} {"train_loss": -24.752517700195312, "global_step": 222812, "epoch": 2684} {"train_loss": -24.691679000854492, "global_step": 222813, "epoch": 2684} {"train_loss": -24.770601272583008, "global_step": 222814, "epoch": 2684} {"train_loss": -24.36152458190918, "global_step": 222815, "epoch": 2684} {"train_loss": -24.58913230895996, "global_step": 222816, "epoch": 2684} {"train_loss": -24.542858123779297, "global_step": 222817, "epoch": 2684} {"train_loss": -24.8062744140625, "global_step": 222818, "epoch": 2684} {"train_loss": -24.754671096801758, "global_step": 222819, "epoch": 2684} {"train_loss": -24.421110153198242, "global_step": 222820, "epoch": 2684} {"train_loss": -24.489187240600586, "global_step": 222821, "epoch": 2684} {"train_loss": -24.543668746948242, "global_step": 222822, "epoch": 2684} {"train_loss": -24.696134567260742, "global_step": 222823, "epoch": 2684} {"train_loss": -24.59481430053711, "global_step": 222824, "epoch": 2684} {"train_loss": -24.60822105407715, "global_step": 222825, "epoch": 2684} {"train_loss": -24.9350643157959, "global_step": 222826, "epoch": 2684} {"train_loss": -24.597562789916992, "global_step": 222827, "epoch": 2684} {"train_loss": -24.467069625854492, "global_step": 222828, "epoch": 2684} {"train_loss": -24.66444969177246, "global_step": 222829, "epoch": 2684} {"train_loss": -24.414613723754883, "global_step": 222830, "epoch": 2684} {"train_loss": -24.49908447265625, "global_step": 222831, "epoch": 2684} {"train_loss": -24.620437622070312, "global_step": 222832, "epoch": 2684} {"train_loss": -24.479938507080078, "global_step": 222833, "epoch": 2684} {"train_loss": -24.873432159423828, "global_step": 222834, "epoch": 2684} {"train_loss": -24.958690643310547, "global_step": 222835, "epoch": 2684} {"train_loss": -24.99833106994629, "global_step": 222836, "epoch": 2684} {"train_loss": -24.84866714477539, "global_step": 222837, "epoch": 2684} {"train_loss": -24.740802764892578, "global_step": 222838, "epoch": 2684} {"train_loss": -24.602720260620117, "global_step": 222839, "epoch": 2684} {"train_loss": -24.735624313354492, "global_step": 222840, "epoch": 2684} {"train_loss": -24.679357528686523, "global_step": 222841, "epoch": 2684} {"train_loss": -24.616811752319336, "global_step": 222842, "epoch": 2684} {"train_loss": -24.767324447631836, "global_step": 222843, "epoch": 2684} {"train_loss": -25.177337646484375, "global_step": 222844, "epoch": 2684} {"train_loss": -24.368736267089844, "global_step": 222845, "epoch": 2684} {"train_loss": -24.72170066833496, "global_step": 222846, "epoch": 2684} {"train_loss": -24.86366844177246, "global_step": 222847, "epoch": 2684} {"train_loss": -24.644546508789062, "global_step": 222848, "epoch": 2684} {"train_loss": -24.6809139251709, "global_step": 222849, "epoch": 2684} {"train_loss": -23.77593994140625, "global_step": 222850, "epoch": 2684} {"train_loss": -23.176198959350586, "global_step": 222851, "epoch": 2684} {"train_loss": -23.88826560974121, "global_step": 222852, "epoch": 2684} {"train_loss": -23.95680809020996, "global_step": 222853, "epoch": 2684} {"train_loss": -24.533157026911358, "global_step": 222854, "epoch": 2684, "val_loss": 6731764.5} {"train_loss": -21.244943618774414, "global_step": 222855, "epoch": 2685} {"train_loss": -23.268102645874023, "global_step": 222856, "epoch": 2685} {"train_loss": -22.31838035583496, "global_step": 222857, "epoch": 2685} {"train_loss": -23.4250545501709, "global_step": 222858, "epoch": 2685} {"train_loss": -22.329015731811523, "global_step": 222859, "epoch": 2685} {"train_loss": -23.044897079467773, "global_step": 222860, "epoch": 2685} {"train_loss": -23.378625869750977, "global_step": 222861, "epoch": 2685} {"train_loss": -23.279022216796875, "global_step": 222862, "epoch": 2685} {"train_loss": -23.43358612060547, "global_step": 222863, "epoch": 2685} {"train_loss": -23.466720581054688, "global_step": 222864, "epoch": 2685} {"train_loss": -23.797880172729492, "global_step": 222865, "epoch": 2685} {"train_loss": -23.397186279296875, "global_step": 222866, "epoch": 2685} {"train_loss": -23.862728118896484, "global_step": 222867, "epoch": 2685} {"train_loss": -24.014055252075195, "global_step": 222868, "epoch": 2685} {"train_loss": -23.38443946838379, "global_step": 222869, "epoch": 2685} {"train_loss": -23.364118576049805, "global_step": 222870, "epoch": 2685} {"train_loss": -23.947643280029297, "global_step": 222871, "epoch": 2685} {"train_loss": -23.936767578125, "global_step": 222872, "epoch": 2685} {"train_loss": -23.81154441833496, "global_step": 222873, "epoch": 2685} {"train_loss": -23.83272361755371, "global_step": 222874, "epoch": 2685} {"train_loss": -23.87245750427246, "global_step": 222875, "epoch": 2685} {"train_loss": -24.1021785736084, "global_step": 222876, "epoch": 2685} {"train_loss": -23.914274215698242, "global_step": 222877, "epoch": 2685} {"train_loss": -24.274770736694336, "global_step": 222878, "epoch": 2685} {"train_loss": -23.832603454589844, "global_step": 222879, "epoch": 2685} {"train_loss": -24.136564254760742, "global_step": 222880, "epoch": 2685} {"train_loss": -24.220951080322266, "global_step": 222881, "epoch": 2685} {"train_loss": -23.982738494873047, "global_step": 222882, "epoch": 2685} {"train_loss": -24.315387725830078, "global_step": 222883, "epoch": 2685} {"train_loss": -24.258167266845703, "global_step": 222884, "epoch": 2685} {"train_loss": -24.43088722229004, "global_step": 222885, "epoch": 2685} {"train_loss": -24.434900283813477, "global_step": 222886, "epoch": 2685} {"train_loss": -24.6942195892334, "global_step": 222887, "epoch": 2685} {"train_loss": -24.34330177307129, "global_step": 222888, "epoch": 2685} {"train_loss": -24.295459747314453, "global_step": 222889, "epoch": 2685} {"train_loss": -24.405258178710938, "global_step": 222890, "epoch": 2685} {"train_loss": -24.69615936279297, "global_step": 222891, "epoch": 2685} {"train_loss": -24.57126808166504, "global_step": 222892, "epoch": 2685} {"train_loss": -24.80695343017578, "global_step": 222893, "epoch": 2685} {"train_loss": -24.821508407592773, "global_step": 222894, "epoch": 2685} {"train_loss": -24.310413360595703, "global_step": 222895, "epoch": 2685} {"train_loss": -24.68709945678711, "global_step": 222896, "epoch": 2685} {"train_loss": -24.472747802734375, "global_step": 222897, "epoch": 2685} {"train_loss": -24.628583908081055, "global_step": 222898, "epoch": 2685} {"train_loss": -24.555078506469727, "global_step": 222899, "epoch": 2685} {"train_loss": -24.82520866394043, "global_step": 222900, "epoch": 2685} {"train_loss": -24.65981101989746, "global_step": 222901, "epoch": 2685} {"train_loss": -24.1904239654541, "global_step": 222902, "epoch": 2685} {"train_loss": -24.66860580444336, "global_step": 222903, "epoch": 2685} {"train_loss": -24.71244239807129, "global_step": 222904, "epoch": 2685} {"train_loss": -24.666553497314453, "global_step": 222905, "epoch": 2685} {"train_loss": -24.610960006713867, "global_step": 222906, "epoch": 2685} {"train_loss": -24.680744171142578, "global_step": 222907, "epoch": 2685} {"train_loss": -24.926515579223633, "global_step": 222908, "epoch": 2685} {"train_loss": -24.863698959350586, "global_step": 222909, "epoch": 2685} {"train_loss": -24.58668327331543, "global_step": 222910, "epoch": 2685} {"train_loss": -24.522964477539062, "global_step": 222911, "epoch": 2685} {"train_loss": -24.92621421813965, "global_step": 222912, "epoch": 2685} {"train_loss": -25.000957489013672, "global_step": 222913, "epoch": 2685} {"train_loss": -24.710281372070312, "global_step": 222914, "epoch": 2685} {"train_loss": -24.61594581604004, "global_step": 222915, "epoch": 2685} {"train_loss": -24.577932357788086, "global_step": 222916, "epoch": 2685} {"train_loss": -24.829631805419922, "global_step": 222917, "epoch": 2685} {"train_loss": -24.59572410583496, "global_step": 222918, "epoch": 2685} {"train_loss": -24.743492126464844, "global_step": 222919, "epoch": 2685} {"train_loss": -24.645170211791992, "global_step": 222920, "epoch": 2685} {"train_loss": -24.613981246948242, "global_step": 222921, "epoch": 2685} {"train_loss": -24.443771362304688, "global_step": 222922, "epoch": 2685} {"train_loss": -24.719032287597656, "global_step": 222923, "epoch": 2685} {"train_loss": -24.758596420288086, "global_step": 222924, "epoch": 2685} {"train_loss": -24.483179092407227, "global_step": 222925, "epoch": 2685} {"train_loss": -24.67823600769043, "global_step": 222926, "epoch": 2685} {"train_loss": -24.203554153442383, "global_step": 222927, "epoch": 2685} {"train_loss": -25.306737899780273, "global_step": 222928, "epoch": 2685} {"train_loss": -24.720474243164062, "global_step": 222929, "epoch": 2685} {"train_loss": -24.697372436523438, "global_step": 222930, "epoch": 2685} {"train_loss": -24.74825096130371, "global_step": 222931, "epoch": 2685} {"train_loss": -24.360326766967773, "global_step": 222932, "epoch": 2685} {"train_loss": -24.929683685302734, "global_step": 222933, "epoch": 2685} {"train_loss": -24.708417892456055, "global_step": 222934, "epoch": 2685} {"train_loss": -24.558622360229492, "global_step": 222935, "epoch": 2685} {"train_loss": -24.525869369506836, "global_step": 222936, "epoch": 2685} {"train_loss": -24.249391969428004, "global_step": 222937, "epoch": 2685, "val_loss": 6649351.5} {"train_loss": -24.791336059570312, "global_step": 222938, "epoch": 2686} {"train_loss": -24.968820571899414, "global_step": 222939, "epoch": 2686} {"train_loss": -24.807830810546875, "global_step": 222940, "epoch": 2686} {"train_loss": -24.74384117126465, "global_step": 222941, "epoch": 2686} {"train_loss": -24.523012161254883, "global_step": 222942, "epoch": 2686} {"train_loss": -24.64032554626465, "global_step": 222943, "epoch": 2686} {"train_loss": -24.66066551208496, "global_step": 222944, "epoch": 2686} {"train_loss": -24.674135208129883, "global_step": 222945, "epoch": 2686} {"train_loss": -24.500455856323242, "global_step": 222946, "epoch": 2686} {"train_loss": -24.299123764038086, "global_step": 222947, "epoch": 2686} {"train_loss": -24.5397891998291, "global_step": 222948, "epoch": 2686} {"train_loss": -24.324323654174805, "global_step": 222949, "epoch": 2686} {"train_loss": -24.435422897338867, "global_step": 222950, "epoch": 2686} {"train_loss": -24.392837524414062, "global_step": 222951, "epoch": 2686} {"train_loss": -24.60432243347168, "global_step": 222952, "epoch": 2686} {"train_loss": -24.7083683013916, "global_step": 222953, "epoch": 2686} {"train_loss": -24.566858291625977, "global_step": 222954, "epoch": 2686} {"train_loss": -24.747995376586914, "global_step": 222955, "epoch": 2686} {"train_loss": -24.738975524902344, "global_step": 222956, "epoch": 2686} {"train_loss": -24.665178298950195, "global_step": 222957, "epoch": 2686} {"train_loss": -24.42600440979004, "global_step": 222958, "epoch": 2686} {"train_loss": -25.115631103515625, "global_step": 222959, "epoch": 2686} {"train_loss": -24.75880241394043, "global_step": 222960, "epoch": 2686} {"train_loss": -24.415102005004883, "global_step": 222961, "epoch": 2686} {"train_loss": -24.73121452331543, "global_step": 222962, "epoch": 2686} {"train_loss": -24.664270401000977, "global_step": 222963, "epoch": 2686} {"train_loss": -24.670251846313477, "global_step": 222964, "epoch": 2686} {"train_loss": -24.615333557128906, "global_step": 222965, "epoch": 2686} {"train_loss": -24.528594970703125, "global_step": 222966, "epoch": 2686} {"train_loss": -24.655834197998047, "global_step": 222967, "epoch": 2686} {"train_loss": -24.635557174682617, "global_step": 222968, "epoch": 2686} {"train_loss": -24.578580856323242, "global_step": 222969, "epoch": 2686} {"train_loss": -24.796772003173828, "global_step": 222970, "epoch": 2686} {"train_loss": -24.563512802124023, "global_step": 222971, "epoch": 2686} {"train_loss": -24.944360733032227, "global_step": 222972, "epoch": 2686} {"train_loss": -24.476613998413086, "global_step": 222973, "epoch": 2686} {"train_loss": -24.683685302734375, "global_step": 222974, "epoch": 2686} {"train_loss": -24.475418090820312, "global_step": 222975, "epoch": 2686} {"train_loss": -24.360937118530273, "global_step": 222976, "epoch": 2686} {"train_loss": -24.73968505859375, "global_step": 222977, "epoch": 2686} {"train_loss": -24.328521728515625, "global_step": 222978, "epoch": 2686} {"train_loss": -24.41701316833496, "global_step": 222979, "epoch": 2686} {"train_loss": -24.448719024658203, "global_step": 222980, "epoch": 2686} {"train_loss": -24.699155807495117, "global_step": 222981, "epoch": 2686} {"train_loss": -24.436208724975586, "global_step": 222982, "epoch": 2686} {"train_loss": -24.63972282409668, "global_step": 222983, "epoch": 2686} {"train_loss": -24.583065032958984, "global_step": 222984, "epoch": 2686} {"train_loss": -24.333215713500977, "global_step": 222985, "epoch": 2686} {"train_loss": -24.54261589050293, "global_step": 222986, "epoch": 2686} {"train_loss": -24.8443546295166, "global_step": 222987, "epoch": 2686} {"train_loss": -24.682037353515625, "global_step": 222988, "epoch": 2686} {"train_loss": -24.9527587890625, "global_step": 222989, "epoch": 2686} {"train_loss": -24.69636344909668, "global_step": 222990, "epoch": 2686} {"train_loss": -24.774518966674805, "global_step": 222991, "epoch": 2686} {"train_loss": -24.575803756713867, "global_step": 222992, "epoch": 2686} {"train_loss": -24.87355613708496, "global_step": 222993, "epoch": 2686} {"train_loss": -24.546653747558594, "global_step": 222994, "epoch": 2686} {"train_loss": -24.56082534790039, "global_step": 222995, "epoch": 2686} {"train_loss": -24.284372329711914, "global_step": 222996, "epoch": 2686} {"train_loss": -24.782718658447266, "global_step": 222997, "epoch": 2686} {"train_loss": -24.641603469848633, "global_step": 222998, "epoch": 2686} {"train_loss": -24.82904052734375, "global_step": 222999, "epoch": 2686} {"train_loss": -24.783864974975586, "global_step": 223000, "epoch": 2686} {"train_loss": -24.409805297851562, "global_step": 223001, "epoch": 2686} {"train_loss": -24.772550582885742, "global_step": 223002, "epoch": 2686} {"train_loss": -24.748197555541992, "global_step": 223003, "epoch": 2686} {"train_loss": -24.9056453704834, "global_step": 223004, "epoch": 2686} {"train_loss": -24.708105087280273, "global_step": 223005, "epoch": 2686} {"train_loss": -24.5274600982666, "global_step": 223006, "epoch": 2686} {"train_loss": -24.648008346557617, "global_step": 223007, "epoch": 2686} {"train_loss": -24.860614776611328, "global_step": 223008, "epoch": 2686} {"train_loss": -24.24571418762207, "global_step": 223009, "epoch": 2686} {"train_loss": -24.25027084350586, "global_step": 223010, "epoch": 2686} {"train_loss": -24.629440307617188, "global_step": 223011, "epoch": 2686} {"train_loss": -24.501914978027344, "global_step": 223012, "epoch": 2686} {"train_loss": -24.67063331604004, "global_step": 223013, "epoch": 2686} {"train_loss": -24.12399673461914, "global_step": 223014, "epoch": 2686} {"train_loss": -24.995702743530273, "global_step": 223015, "epoch": 2686} {"train_loss": -24.656381607055664, "global_step": 223016, "epoch": 2686} {"train_loss": -24.695920944213867, "global_step": 223017, "epoch": 2686} {"train_loss": -24.65378761291504, "global_step": 223018, "epoch": 2686} {"train_loss": -24.826099395751953, "global_step": 223019, "epoch": 2686} {"train_loss": -24.6295171760651, "global_step": 223020, "epoch": 2686, "val_loss": 6778676.0} {"train_loss": -24.589601516723633, "global_step": 223021, "epoch": 2687} {"train_loss": -24.38423728942871, "global_step": 223022, "epoch": 2687} {"train_loss": -24.696035385131836, "global_step": 223023, "epoch": 2687} {"train_loss": -24.318450927734375, "global_step": 223024, "epoch": 2687} {"train_loss": -24.415502548217773, "global_step": 223025, "epoch": 2687} {"train_loss": -24.317224502563477, "global_step": 223026, "epoch": 2687} {"train_loss": -24.7473201751709, "global_step": 223027, "epoch": 2687} {"train_loss": -24.487295150756836, "global_step": 223028, "epoch": 2687} {"train_loss": -24.763824462890625, "global_step": 223029, "epoch": 2687} {"train_loss": -24.507732391357422, "global_step": 223030, "epoch": 2687} {"train_loss": -24.29369354248047, "global_step": 223031, "epoch": 2687} {"train_loss": -24.55116844177246, "global_step": 223032, "epoch": 2687} {"train_loss": -24.611745834350586, "global_step": 223033, "epoch": 2687} {"train_loss": -24.585561752319336, "global_step": 223034, "epoch": 2687} {"train_loss": -24.573287963867188, "global_step": 223035, "epoch": 2687} {"train_loss": -24.427906036376953, "global_step": 223036, "epoch": 2687} {"train_loss": -24.35392189025879, "global_step": 223037, "epoch": 2687} {"train_loss": -24.306034088134766, "global_step": 223038, "epoch": 2687} {"train_loss": -24.729978561401367, "global_step": 223039, "epoch": 2687} {"train_loss": -24.7357234954834, "global_step": 223040, "epoch": 2687} {"train_loss": -23.987287521362305, "global_step": 223041, "epoch": 2687} {"train_loss": -23.638471603393555, "global_step": 223042, "epoch": 2687} {"train_loss": -23.39448356628418, "global_step": 223043, "epoch": 2687} {"train_loss": -24.375303268432617, "global_step": 223044, "epoch": 2687} {"train_loss": -24.300128936767578, "global_step": 223045, "epoch": 2687} {"train_loss": -23.957719802856445, "global_step": 223046, "epoch": 2687} {"train_loss": -24.67470932006836, "global_step": 223047, "epoch": 2687} {"train_loss": -24.311866760253906, "global_step": 223048, "epoch": 2687} {"train_loss": -24.44625473022461, "global_step": 223049, "epoch": 2687} {"train_loss": -24.0125789642334, "global_step": 223050, "epoch": 2687} {"train_loss": -24.075660705566406, "global_step": 223051, "epoch": 2687} {"train_loss": -24.4326171875, "global_step": 223052, "epoch": 2687} {"train_loss": -24.243824005126953, "global_step": 223053, "epoch": 2687} {"train_loss": -24.312793731689453, "global_step": 223054, "epoch": 2687} {"train_loss": -24.287891387939453, "global_step": 223055, "epoch": 2687} {"train_loss": -24.844797134399414, "global_step": 223056, "epoch": 2687} {"train_loss": -24.762067794799805, "global_step": 223057, "epoch": 2687} {"train_loss": -24.37998390197754, "global_step": 223058, "epoch": 2687} {"train_loss": -24.726974487304688, "global_step": 223059, "epoch": 2687} {"train_loss": -24.840818405151367, "global_step": 223060, "epoch": 2687} {"train_loss": -24.30824089050293, "global_step": 223061, "epoch": 2687} {"train_loss": -24.661958694458008, "global_step": 223062, "epoch": 2687} {"train_loss": -24.6257381439209, "global_step": 223063, "epoch": 2687} {"train_loss": -24.917333602905273, "global_step": 223064, "epoch": 2687} {"train_loss": -24.610889434814453, "global_step": 223065, "epoch": 2687} {"train_loss": -24.373388290405273, "global_step": 223066, "epoch": 2687} {"train_loss": -24.920400619506836, "global_step": 223067, "epoch": 2687} {"train_loss": -24.61395263671875, "global_step": 223068, "epoch": 2687} {"train_loss": -24.649328231811523, "global_step": 223069, "epoch": 2687} {"train_loss": -24.642507553100586, "global_step": 223070, "epoch": 2687} {"train_loss": -24.3956241607666, "global_step": 223071, "epoch": 2687} {"train_loss": -24.62937355041504, "global_step": 223072, "epoch": 2687} {"train_loss": -24.692142486572266, "global_step": 223073, "epoch": 2687} {"train_loss": -24.74176025390625, "global_step": 223074, "epoch": 2687} {"train_loss": -24.915220260620117, "global_step": 223075, "epoch": 2687} {"train_loss": -24.786523818969727, "global_step": 223076, "epoch": 2687} {"train_loss": -24.767255783081055, "global_step": 223077, "epoch": 2687} {"train_loss": -24.785747528076172, "global_step": 223078, "epoch": 2687} {"train_loss": -25.108304977416992, "global_step": 223079, "epoch": 2687} {"train_loss": -24.394052505493164, "global_step": 223080, "epoch": 2687} {"train_loss": -24.642534255981445, "global_step": 223081, "epoch": 2687} {"train_loss": -24.724332809448242, "global_step": 223082, "epoch": 2687} {"train_loss": -24.709033966064453, "global_step": 223083, "epoch": 2687} {"train_loss": -24.446529388427734, "global_step": 223084, "epoch": 2687} {"train_loss": -25.068700790405273, "global_step": 223085, "epoch": 2687} {"train_loss": -24.764297485351562, "global_step": 223086, "epoch": 2687} {"train_loss": -24.816150665283203, "global_step": 223087, "epoch": 2687} {"train_loss": -24.387893676757812, "global_step": 223088, "epoch": 2687} {"train_loss": -24.359540939331055, "global_step": 223089, "epoch": 2687} {"train_loss": -25.000024795532227, "global_step": 223090, "epoch": 2687} {"train_loss": -24.414331436157227, "global_step": 223091, "epoch": 2687} {"train_loss": -24.7165470123291, "global_step": 223092, "epoch": 2687} {"train_loss": -24.68375587463379, "global_step": 223093, "epoch": 2687} {"train_loss": -24.443239212036133, "global_step": 223094, "epoch": 2687} {"train_loss": -24.4025936126709, "global_step": 223095, "epoch": 2687} {"train_loss": -24.80035972595215, "global_step": 223096, "epoch": 2687} {"train_loss": -24.923198699951172, "global_step": 223097, "epoch": 2687} {"train_loss": -24.756885528564453, "global_step": 223098, "epoch": 2687} {"train_loss": -25.013931274414062, "global_step": 223099, "epoch": 2687} {"train_loss": -24.79207420349121, "global_step": 223100, "epoch": 2687} {"train_loss": -24.51422119140625, "global_step": 223101, "epoch": 2687} {"train_loss": -24.436635971069336, "global_step": 223102, "epoch": 2687} {"train_loss": -24.54510560093156, "global_step": 223103, "epoch": 2687, "val_loss": 6794254.0} {"train_loss": -23.312850952148438, "global_step": 223104, "epoch": 2688} {"train_loss": -23.299131393432617, "global_step": 223105, "epoch": 2688} {"train_loss": -24.597745895385742, "global_step": 223106, "epoch": 2688} {"train_loss": -23.875314712524414, "global_step": 223107, "epoch": 2688} {"train_loss": -24.152984619140625, "global_step": 223108, "epoch": 2688} {"train_loss": -24.220706939697266, "global_step": 223109, "epoch": 2688} {"train_loss": -23.960859298706055, "global_step": 223110, "epoch": 2688} {"train_loss": -24.015928268432617, "global_step": 223111, "epoch": 2688} {"train_loss": -24.265087127685547, "global_step": 223112, "epoch": 2688} {"train_loss": -24.468738555908203, "global_step": 223113, "epoch": 2688} {"train_loss": -24.389205932617188, "global_step": 223114, "epoch": 2688} {"train_loss": -24.10312843322754, "global_step": 223115, "epoch": 2688} {"train_loss": -24.538488388061523, "global_step": 223116, "epoch": 2688} {"train_loss": -24.91904640197754, "global_step": 223117, "epoch": 2688} {"train_loss": -24.346166610717773, "global_step": 223118, "epoch": 2688} {"train_loss": -24.141647338867188, "global_step": 223119, "epoch": 2688} {"train_loss": -24.819049835205078, "global_step": 223120, "epoch": 2688} {"train_loss": -24.486745834350586, "global_step": 223121, "epoch": 2688} {"train_loss": -24.205402374267578, "global_step": 223122, "epoch": 2688} {"train_loss": -24.754453659057617, "global_step": 223123, "epoch": 2688} {"train_loss": -24.54573631286621, "global_step": 223124, "epoch": 2688} {"train_loss": -24.563413619995117, "global_step": 223125, "epoch": 2688} {"train_loss": -24.37858009338379, "global_step": 223126, "epoch": 2688} {"train_loss": -24.829866409301758, "global_step": 223127, "epoch": 2688} {"train_loss": -24.823169708251953, "global_step": 223128, "epoch": 2688} {"train_loss": -24.952402114868164, "global_step": 223129, "epoch": 2688} {"train_loss": -24.250417709350586, "global_step": 223130, "epoch": 2688} {"train_loss": -24.67349624633789, "global_step": 223131, "epoch": 2688} {"train_loss": -24.601112365722656, "global_step": 223132, "epoch": 2688} {"train_loss": -24.669538497924805, "global_step": 223133, "epoch": 2688} {"train_loss": -24.64011573791504, "global_step": 223134, "epoch": 2688} {"train_loss": -24.882211685180664, "global_step": 223135, "epoch": 2688} {"train_loss": -24.505319595336914, "global_step": 223136, "epoch": 2688} {"train_loss": -24.36532974243164, "global_step": 223137, "epoch": 2688} {"train_loss": -24.687782287597656, "global_step": 223138, "epoch": 2688} {"train_loss": -24.614675521850586, "global_step": 223139, "epoch": 2688} {"train_loss": -24.447351455688477, "global_step": 223140, "epoch": 2688} {"train_loss": -24.662057876586914, "global_step": 223141, "epoch": 2688} {"train_loss": -24.99236297607422, "global_step": 223142, "epoch": 2688} {"train_loss": -24.558340072631836, "global_step": 223143, "epoch": 2688} {"train_loss": -24.41279411315918, "global_step": 223144, "epoch": 2688} {"train_loss": -24.916479110717773, "global_step": 223145, "epoch": 2688} {"train_loss": -25.026514053344727, "global_step": 223146, "epoch": 2688} {"train_loss": -24.946638107299805, "global_step": 223147, "epoch": 2688} {"train_loss": -24.510120391845703, "global_step": 223148, "epoch": 2688} {"train_loss": -24.59130096435547, "global_step": 223149, "epoch": 2688} {"train_loss": -24.493711471557617, "global_step": 223150, "epoch": 2688} {"train_loss": -24.549640655517578, "global_step": 223151, "epoch": 2688} {"train_loss": -24.867246627807617, "global_step": 223152, "epoch": 2688} {"train_loss": -24.618541717529297, "global_step": 223153, "epoch": 2688} {"train_loss": -24.679189682006836, "global_step": 223154, "epoch": 2688} {"train_loss": -24.529767990112305, "global_step": 223155, "epoch": 2688} {"train_loss": -24.81827163696289, "global_step": 223156, "epoch": 2688} {"train_loss": -24.976165771484375, "global_step": 223157, "epoch": 2688} {"train_loss": -24.680816650390625, "global_step": 223158, "epoch": 2688} {"train_loss": -24.982385635375977, "global_step": 223159, "epoch": 2688} {"train_loss": -24.730222702026367, "global_step": 223160, "epoch": 2688} {"train_loss": -24.847793579101562, "global_step": 223161, "epoch": 2688} {"train_loss": -24.477005004882812, "global_step": 223162, "epoch": 2688} {"train_loss": -24.935800552368164, "global_step": 223163, "epoch": 2688} {"train_loss": -24.57002830505371, "global_step": 223164, "epoch": 2688} {"train_loss": -24.269346237182617, "global_step": 223165, "epoch": 2688} {"train_loss": -24.914644241333008, "global_step": 223166, "epoch": 2688} {"train_loss": -24.604827880859375, "global_step": 223167, "epoch": 2688} {"train_loss": -24.81915283203125, "global_step": 223168, "epoch": 2688} {"train_loss": -24.51059341430664, "global_step": 223169, "epoch": 2688} {"train_loss": -24.720233917236328, "global_step": 223170, "epoch": 2688} {"train_loss": -25.21194839477539, "global_step": 223171, "epoch": 2688} {"train_loss": -24.862462997436523, "global_step": 223172, "epoch": 2688} {"train_loss": -25.00701904296875, "global_step": 223173, "epoch": 2688} {"train_loss": -24.760221481323242, "global_step": 223174, "epoch": 2688} {"train_loss": -24.856550216674805, "global_step": 223175, "epoch": 2688} {"train_loss": -24.579620361328125, "global_step": 223176, "epoch": 2688} {"train_loss": -24.961139678955078, "global_step": 223177, "epoch": 2688} {"train_loss": -24.92558479309082, "global_step": 223178, "epoch": 2688} {"train_loss": -24.942861557006836, "global_step": 223179, "epoch": 2688} {"train_loss": -25.012191772460938, "global_step": 223180, "epoch": 2688} {"train_loss": -24.44440460205078, "global_step": 223181, "epoch": 2688} {"train_loss": -24.576627731323242, "global_step": 223182, "epoch": 2688} {"train_loss": -24.221609115600586, "global_step": 223183, "epoch": 2688} {"train_loss": -24.707294464111328, "global_step": 223184, "epoch": 2688} {"train_loss": -24.504831314086914, "global_step": 223185, "epoch": 2688} {"train_loss": -24.60601303376347, "global_step": 223186, "epoch": 2688, "val_loss": 6711286.0} {"train_loss": -24.38789176940918, "global_step": 223187, "epoch": 2689} {"train_loss": -23.391067504882812, "global_step": 223188, "epoch": 2689} {"train_loss": -24.112598419189453, "global_step": 223189, "epoch": 2689} {"train_loss": -23.732236862182617, "global_step": 223190, "epoch": 2689} {"train_loss": -23.101938247680664, "global_step": 223191, "epoch": 2689} {"train_loss": -23.860416412353516, "global_step": 223192, "epoch": 2689} {"train_loss": -24.232635498046875, "global_step": 223193, "epoch": 2689} {"train_loss": -23.91371726989746, "global_step": 223194, "epoch": 2689} {"train_loss": -23.238941192626953, "global_step": 223195, "epoch": 2689} {"train_loss": -23.93342399597168, "global_step": 223196, "epoch": 2689} {"train_loss": -23.660673141479492, "global_step": 223197, "epoch": 2689} {"train_loss": -24.41029167175293, "global_step": 223198, "epoch": 2689} {"train_loss": -24.404680252075195, "global_step": 223199, "epoch": 2689} {"train_loss": -24.0511531829834, "global_step": 223200, "epoch": 2689} {"train_loss": -23.9528751373291, "global_step": 223201, "epoch": 2689} {"train_loss": -24.040830612182617, "global_step": 223202, "epoch": 2689} {"train_loss": -24.34659767150879, "global_step": 223203, "epoch": 2689} {"train_loss": -24.174036026000977, "global_step": 223204, "epoch": 2689} {"train_loss": -24.599050521850586, "global_step": 223205, "epoch": 2689} {"train_loss": -24.19704246520996, "global_step": 223206, "epoch": 2689} {"train_loss": -24.415950775146484, "global_step": 223207, "epoch": 2689} {"train_loss": -24.529165267944336, "global_step": 223208, "epoch": 2689} {"train_loss": -24.43697166442871, "global_step": 223209, "epoch": 2689} {"train_loss": -24.365392684936523, "global_step": 223210, "epoch": 2689} {"train_loss": -24.681934356689453, "global_step": 223211, "epoch": 2689} {"train_loss": -24.430578231811523, "global_step": 223212, "epoch": 2689} {"train_loss": -24.15909767150879, "global_step": 223213, "epoch": 2689} {"train_loss": -24.424091339111328, "global_step": 223214, "epoch": 2689} {"train_loss": -24.363582611083984, "global_step": 223215, "epoch": 2689} {"train_loss": -24.62959098815918, "global_step": 223216, "epoch": 2689} {"train_loss": -24.94878578186035, "global_step": 223217, "epoch": 2689} {"train_loss": -24.851728439331055, "global_step": 223218, "epoch": 2689} {"train_loss": -24.90378761291504, "global_step": 223219, "epoch": 2689} {"train_loss": -24.538671493530273, "global_step": 223220, "epoch": 2689} {"train_loss": -24.558340072631836, "global_step": 223221, "epoch": 2689} {"train_loss": -24.602392196655273, "global_step": 223222, "epoch": 2689} {"train_loss": -24.65934181213379, "global_step": 223223, "epoch": 2689} {"train_loss": -24.55006980895996, "global_step": 223224, "epoch": 2689} {"train_loss": -24.794775009155273, "global_step": 223225, "epoch": 2689} {"train_loss": -24.906095504760742, "global_step": 223226, "epoch": 2689} {"train_loss": -24.917898178100586, "global_step": 223227, "epoch": 2689} {"train_loss": -25.104276657104492, "global_step": 223228, "epoch": 2689} {"train_loss": -24.990978240966797, "global_step": 223229, "epoch": 2689} {"train_loss": -24.700525283813477, "global_step": 223230, "epoch": 2689} {"train_loss": -24.24197769165039, "global_step": 223231, "epoch": 2689} {"train_loss": -24.710092544555664, "global_step": 223232, "epoch": 2689} {"train_loss": -24.4428768157959, "global_step": 223233, "epoch": 2689} {"train_loss": -25.0072021484375, "global_step": 223234, "epoch": 2689} {"train_loss": -24.625213623046875, "global_step": 223235, "epoch": 2689} {"train_loss": -24.93896484375, "global_step": 223236, "epoch": 2689} {"train_loss": -24.624601364135742, "global_step": 223237, "epoch": 2689} {"train_loss": -24.180557250976562, "global_step": 223238, "epoch": 2689} {"train_loss": -24.718948364257812, "global_step": 223239, "epoch": 2689} {"train_loss": -24.967206954956055, "global_step": 223240, "epoch": 2689} {"train_loss": -24.966840744018555, "global_step": 223241, "epoch": 2689} {"train_loss": -24.52129554748535, "global_step": 223242, "epoch": 2689} {"train_loss": -24.407861709594727, "global_step": 223243, "epoch": 2689} {"train_loss": -24.63218116760254, "global_step": 223244, "epoch": 2689} {"train_loss": -24.57176399230957, "global_step": 223245, "epoch": 2689} {"train_loss": -24.426847457885742, "global_step": 223246, "epoch": 2689} {"train_loss": -24.664947509765625, "global_step": 223247, "epoch": 2689} {"train_loss": -24.36263656616211, "global_step": 223248, "epoch": 2689} {"train_loss": -24.479846954345703, "global_step": 223249, "epoch": 2689} {"train_loss": -24.808246612548828, "global_step": 223250, "epoch": 2689} {"train_loss": -24.44060707092285, "global_step": 223251, "epoch": 2689} {"train_loss": -24.25800132751465, "global_step": 223252, "epoch": 2689} {"train_loss": -25.015592575073242, "global_step": 223253, "epoch": 2689} {"train_loss": -24.46377944946289, "global_step": 223254, "epoch": 2689} {"train_loss": -24.553272247314453, "global_step": 223255, "epoch": 2689} {"train_loss": -24.936567306518555, "global_step": 223256, "epoch": 2689} {"train_loss": -24.542922973632812, "global_step": 223257, "epoch": 2689} {"train_loss": -24.803054809570312, "global_step": 223258, "epoch": 2689} {"train_loss": -24.692466735839844, "global_step": 223259, "epoch": 2689} {"train_loss": -24.64052963256836, "global_step": 223260, "epoch": 2689} {"train_loss": -24.54926872253418, "global_step": 223261, "epoch": 2689} {"train_loss": -24.622547149658203, "global_step": 223262, "epoch": 2689} {"train_loss": -24.898000717163086, "global_step": 223263, "epoch": 2689} {"train_loss": -24.56797218322754, "global_step": 223264, "epoch": 2689} {"train_loss": -24.409452438354492, "global_step": 223265, "epoch": 2689} {"train_loss": -24.832334518432617, "global_step": 223266, "epoch": 2689} {"train_loss": -24.763452529907227, "global_step": 223267, "epoch": 2689} {"train_loss": -25.0703067779541, "global_step": 223268, "epoch": 2689} {"train_loss": -24.476183121462903, "global_step": 223269, "epoch": 2689, "val_loss": 6689117.5} {"train_loss": -24.41702651977539, "global_step": 223270, "epoch": 2690} {"train_loss": -24.20997428894043, "global_step": 223271, "epoch": 2690} {"train_loss": -24.337446212768555, "global_step": 223272, "epoch": 2690} {"train_loss": -24.535871505737305, "global_step": 223273, "epoch": 2690} {"train_loss": -24.232696533203125, "global_step": 223274, "epoch": 2690} {"train_loss": -24.478788375854492, "global_step": 223275, "epoch": 2690} {"train_loss": -24.44415283203125, "global_step": 223276, "epoch": 2690} {"train_loss": -23.940410614013672, "global_step": 223277, "epoch": 2690} {"train_loss": -24.393835067749023, "global_step": 223278, "epoch": 2690} {"train_loss": -23.881183624267578, "global_step": 223279, "epoch": 2690} {"train_loss": -24.699356079101562, "global_step": 223280, "epoch": 2690} {"train_loss": -24.202539443969727, "global_step": 223281, "epoch": 2690} {"train_loss": -24.59174156188965, "global_step": 223282, "epoch": 2690} {"train_loss": -24.4267578125, "global_step": 223283, "epoch": 2690} {"train_loss": -24.229944229125977, "global_step": 223284, "epoch": 2690} {"train_loss": -24.33310890197754, "global_step": 223285, "epoch": 2690} {"train_loss": -24.395038604736328, "global_step": 223286, "epoch": 2690} {"train_loss": -24.76704978942871, "global_step": 223287, "epoch": 2690} {"train_loss": -24.265737533569336, "global_step": 223288, "epoch": 2690} {"train_loss": -24.46860694885254, "global_step": 223289, "epoch": 2690} {"train_loss": -24.59287452697754, "global_step": 223290, "epoch": 2690} {"train_loss": -24.319738388061523, "global_step": 223291, "epoch": 2690} {"train_loss": -24.646638870239258, "global_step": 223292, "epoch": 2690} {"train_loss": -24.42502784729004, "global_step": 223293, "epoch": 2690} {"train_loss": -24.489837646484375, "global_step": 223294, "epoch": 2690} {"train_loss": -24.644092559814453, "global_step": 223295, "epoch": 2690} {"train_loss": -24.354047775268555, "global_step": 223296, "epoch": 2690} {"train_loss": -24.59243392944336, "global_step": 223297, "epoch": 2690} {"train_loss": -24.73073387145996, "global_step": 223298, "epoch": 2690} {"train_loss": -24.4721736907959, "global_step": 223299, "epoch": 2690} {"train_loss": -24.782560348510742, "global_step": 223300, "epoch": 2690} {"train_loss": -24.653087615966797, "global_step": 223301, "epoch": 2690} {"train_loss": -24.551389694213867, "global_step": 223302, "epoch": 2690} {"train_loss": -24.831640243530273, "global_step": 223303, "epoch": 2690} {"train_loss": -24.81525230407715, "global_step": 223304, "epoch": 2690} {"train_loss": -24.212427139282227, "global_step": 223305, "epoch": 2690} {"train_loss": -24.748477935791016, "global_step": 223306, "epoch": 2690} {"train_loss": -24.85466766357422, "global_step": 223307, "epoch": 2690} {"train_loss": -24.5579891204834, "global_step": 223308, "epoch": 2690} {"train_loss": -24.850515365600586, "global_step": 223309, "epoch": 2690} {"train_loss": -24.66357421875, "global_step": 223310, "epoch": 2690} {"train_loss": -24.68246841430664, "global_step": 223311, "epoch": 2690} {"train_loss": -24.289289474487305, "global_step": 223312, "epoch": 2690} {"train_loss": -24.575931549072266, "global_step": 223313, "epoch": 2690} {"train_loss": -24.970380783081055, "global_step": 223314, "epoch": 2690} {"train_loss": -24.8389892578125, "global_step": 223315, "epoch": 2690} {"train_loss": -24.673521041870117, "global_step": 223316, "epoch": 2690} {"train_loss": -24.936574935913086, "global_step": 223317, "epoch": 2690} {"train_loss": -24.53239631652832, "global_step": 223318, "epoch": 2690} {"train_loss": -24.776819229125977, "global_step": 223319, "epoch": 2690} {"train_loss": -24.31521987915039, "global_step": 223320, "epoch": 2690} {"train_loss": -24.96925926208496, "global_step": 223321, "epoch": 2690} {"train_loss": -24.919958114624023, "global_step": 223322, "epoch": 2690} {"train_loss": -24.468521118164062, "global_step": 223323, "epoch": 2690} {"train_loss": -24.648649215698242, "global_step": 223324, "epoch": 2690} {"train_loss": -24.702600479125977, "global_step": 223325, "epoch": 2690} {"train_loss": -24.62994384765625, "global_step": 223326, "epoch": 2690} {"train_loss": -24.434919357299805, "global_step": 223327, "epoch": 2690} {"train_loss": -24.663633346557617, "global_step": 223328, "epoch": 2690} {"train_loss": -24.552793502807617, "global_step": 223329, "epoch": 2690} {"train_loss": -24.685413360595703, "global_step": 223330, "epoch": 2690} {"train_loss": -24.540857315063477, "global_step": 223331, "epoch": 2690} {"train_loss": -24.33251190185547, "global_step": 223332, "epoch": 2690} {"train_loss": -24.331262588500977, "global_step": 223333, "epoch": 2690} {"train_loss": -24.68120765686035, "global_step": 223334, "epoch": 2690} {"train_loss": -24.31268882751465, "global_step": 223335, "epoch": 2690} {"train_loss": -24.83180046081543, "global_step": 223336, "epoch": 2690} {"train_loss": -24.682605743408203, "global_step": 223337, "epoch": 2690} {"train_loss": -24.4945125579834, "global_step": 223338, "epoch": 2690} {"train_loss": -24.786081314086914, "global_step": 223339, "epoch": 2690} {"train_loss": -24.766786575317383, "global_step": 223340, "epoch": 2690} {"train_loss": -24.831180572509766, "global_step": 223341, "epoch": 2690} {"train_loss": -24.689054489135742, "global_step": 223342, "epoch": 2690} {"train_loss": -25.048681259155273, "global_step": 223343, "epoch": 2690} {"train_loss": -24.921194076538086, "global_step": 223344, "epoch": 2690} {"train_loss": -24.515005111694336, "global_step": 223345, "epoch": 2690} {"train_loss": -24.796770095825195, "global_step": 223346, "epoch": 2690} {"train_loss": -24.689111709594727, "global_step": 223347, "epoch": 2690} {"train_loss": -24.394697189331055, "global_step": 223348, "epoch": 2690} {"train_loss": -23.94073486328125, "global_step": 223349, "epoch": 2690} {"train_loss": -24.693098068237305, "global_step": 223350, "epoch": 2690} {"train_loss": -24.391204833984375, "global_step": 223351, "epoch": 2690} {"train_loss": -24.570854232971925, "global_step": 223352, "epoch": 2690, "val_loss": 6662528.0} {"train_loss": -23.807470321655273, "global_step": 223353, "epoch": 2691} {"train_loss": -23.61248207092285, "global_step": 223354, "epoch": 2691} {"train_loss": -23.931650161743164, "global_step": 223355, "epoch": 2691} {"train_loss": -23.866342544555664, "global_step": 223356, "epoch": 2691} {"train_loss": -24.037006378173828, "global_step": 223357, "epoch": 2691} {"train_loss": -24.069278717041016, "global_step": 223358, "epoch": 2691} {"train_loss": -24.16510581970215, "global_step": 223359, "epoch": 2691} {"train_loss": -24.255765914916992, "global_step": 223360, "epoch": 2691} {"train_loss": -24.055908203125, "global_step": 223361, "epoch": 2691} {"train_loss": -24.735488891601562, "global_step": 223362, "epoch": 2691} {"train_loss": -24.314435958862305, "global_step": 223363, "epoch": 2691} {"train_loss": -24.03805923461914, "global_step": 223364, "epoch": 2691} {"train_loss": -24.354034423828125, "global_step": 223365, "epoch": 2691} {"train_loss": -24.628435134887695, "global_step": 223366, "epoch": 2691} {"train_loss": -24.25948143005371, "global_step": 223367, "epoch": 2691} {"train_loss": -24.24643325805664, "global_step": 223368, "epoch": 2691} {"train_loss": -24.643110275268555, "global_step": 223369, "epoch": 2691} {"train_loss": -24.536775588989258, "global_step": 223370, "epoch": 2691} {"train_loss": -24.34616470336914, "global_step": 223371, "epoch": 2691} {"train_loss": -25.014026641845703, "global_step": 223372, "epoch": 2691} {"train_loss": -24.681827545166016, "global_step": 223373, "epoch": 2691} {"train_loss": -24.446924209594727, "global_step": 223374, "epoch": 2691} {"train_loss": -24.659025192260742, "global_step": 223375, "epoch": 2691} {"train_loss": -24.603424072265625, "global_step": 223376, "epoch": 2691} {"train_loss": -24.733165740966797, "global_step": 223377, "epoch": 2691} {"train_loss": -24.779924392700195, "global_step": 223378, "epoch": 2691} {"train_loss": -24.5863037109375, "global_step": 223379, "epoch": 2691} {"train_loss": -24.567480087280273, "global_step": 223380, "epoch": 2691} {"train_loss": -24.566553115844727, "global_step": 223381, "epoch": 2691} {"train_loss": -24.326980590820312, "global_step": 223382, "epoch": 2691} {"train_loss": -24.63629913330078, "global_step": 223383, "epoch": 2691} {"train_loss": -24.741849899291992, "global_step": 223384, "epoch": 2691} {"train_loss": -24.4609317779541, "global_step": 223385, "epoch": 2691} {"train_loss": -24.723302841186523, "global_step": 223386, "epoch": 2691} {"train_loss": -24.803024291992188, "global_step": 223387, "epoch": 2691} {"train_loss": -24.984174728393555, "global_step": 223388, "epoch": 2691} {"train_loss": -24.592435836791992, "global_step": 223389, "epoch": 2691} {"train_loss": -24.43281364440918, "global_step": 223390, "epoch": 2691} {"train_loss": -24.984098434448242, "global_step": 223391, "epoch": 2691} {"train_loss": -25.129169464111328, "global_step": 223392, "epoch": 2691} {"train_loss": -24.603971481323242, "global_step": 223393, "epoch": 2691} {"train_loss": -24.489795684814453, "global_step": 223394, "epoch": 2691} {"train_loss": -24.502965927124023, "global_step": 223395, "epoch": 2691} {"train_loss": -24.492101669311523, "global_step": 223396, "epoch": 2691} {"train_loss": -24.67630958557129, "global_step": 223397, "epoch": 2691} {"train_loss": -24.749494552612305, "global_step": 223398, "epoch": 2691} {"train_loss": -24.81070327758789, "global_step": 223399, "epoch": 2691} {"train_loss": -24.659643173217773, "global_step": 223400, "epoch": 2691} {"train_loss": -24.672901153564453, "global_step": 223401, "epoch": 2691} {"train_loss": -24.96535301208496, "global_step": 223402, "epoch": 2691} {"train_loss": -25.16591453552246, "global_step": 223403, "epoch": 2691} {"train_loss": -24.917896270751953, "global_step": 223404, "epoch": 2691} {"train_loss": -24.827560424804688, "global_step": 223405, "epoch": 2691} {"train_loss": -24.7576847076416, "global_step": 223406, "epoch": 2691} {"train_loss": -24.496427536010742, "global_step": 223407, "epoch": 2691} {"train_loss": -24.407155990600586, "global_step": 223408, "epoch": 2691} {"train_loss": -24.44651985168457, "global_step": 223409, "epoch": 2691} {"train_loss": -24.674091339111328, "global_step": 223410, "epoch": 2691} {"train_loss": -24.05768585205078, "global_step": 223411, "epoch": 2691} {"train_loss": -24.614749908447266, "global_step": 223412, "epoch": 2691} {"train_loss": -24.50711441040039, "global_step": 223413, "epoch": 2691} {"train_loss": -24.4569091796875, "global_step": 223414, "epoch": 2691} {"train_loss": -24.338979721069336, "global_step": 223415, "epoch": 2691} {"train_loss": -24.55115509033203, "global_step": 223416, "epoch": 2691} {"train_loss": -24.681991577148438, "global_step": 223417, "epoch": 2691} {"train_loss": -24.751981735229492, "global_step": 223418, "epoch": 2691} {"train_loss": -24.34383773803711, "global_step": 223419, "epoch": 2691} {"train_loss": -25.125246047973633, "global_step": 223420, "epoch": 2691} {"train_loss": -24.379480361938477, "global_step": 223421, "epoch": 2691} {"train_loss": -24.679325103759766, "global_step": 223422, "epoch": 2691} {"train_loss": -24.380441665649414, "global_step": 223423, "epoch": 2691} {"train_loss": -24.856124877929688, "global_step": 223424, "epoch": 2691} {"train_loss": -24.207822799682617, "global_step": 223425, "epoch": 2691} {"train_loss": -24.433019638061523, "global_step": 223426, "epoch": 2691} {"train_loss": -24.886709213256836, "global_step": 223427, "epoch": 2691} {"train_loss": -24.802175521850586, "global_step": 223428, "epoch": 2691} {"train_loss": -24.825889587402344, "global_step": 223429, "epoch": 2691} {"train_loss": -24.762821197509766, "global_step": 223430, "epoch": 2691} {"train_loss": -24.68035888671875, "global_step": 223431, "epoch": 2691} {"train_loss": -24.32173728942871, "global_step": 223432, "epoch": 2691} {"train_loss": -24.69965171813965, "global_step": 223433, "epoch": 2691} {"train_loss": -24.704059600830078, "global_step": 223434, "epoch": 2691} {"train_loss": -24.545551254088622, "global_step": 223435, "epoch": 2691, "val_loss": 6595433.5} {"train_loss": -23.340652465820312, "global_step": 223436, "epoch": 2692} {"train_loss": -23.88361930847168, "global_step": 223437, "epoch": 2692} {"train_loss": -24.338382720947266, "global_step": 223438, "epoch": 2692} {"train_loss": -24.119733810424805, "global_step": 223439, "epoch": 2692} {"train_loss": -24.366933822631836, "global_step": 223440, "epoch": 2692} {"train_loss": -23.829833984375, "global_step": 223441, "epoch": 2692} {"train_loss": -24.335874557495117, "global_step": 223442, "epoch": 2692} {"train_loss": -24.558460235595703, "global_step": 223443, "epoch": 2692} {"train_loss": -24.484895706176758, "global_step": 223444, "epoch": 2692} {"train_loss": -24.371435165405273, "global_step": 223445, "epoch": 2692} {"train_loss": -24.609344482421875, "global_step": 223446, "epoch": 2692} {"train_loss": -24.540252685546875, "global_step": 223447, "epoch": 2692} {"train_loss": -24.50357437133789, "global_step": 223448, "epoch": 2692} {"train_loss": -24.45760154724121, "global_step": 223449, "epoch": 2692} {"train_loss": -24.143299102783203, "global_step": 223450, "epoch": 2692} {"train_loss": -24.164758682250977, "global_step": 223451, "epoch": 2692} {"train_loss": -24.20273208618164, "global_step": 223452, "epoch": 2692} {"train_loss": -24.355314254760742, "global_step": 223453, "epoch": 2692} {"train_loss": -24.625837326049805, "global_step": 223454, "epoch": 2692} {"train_loss": -24.368310928344727, "global_step": 223455, "epoch": 2692} {"train_loss": -24.379453659057617, "global_step": 223456, "epoch": 2692} {"train_loss": -24.492538452148438, "global_step": 223457, "epoch": 2692} {"train_loss": -23.986530303955078, "global_step": 223458, "epoch": 2692} {"train_loss": -24.568632125854492, "global_step": 223459, "epoch": 2692} {"train_loss": -24.939456939697266, "global_step": 223460, "epoch": 2692} {"train_loss": -24.592763900756836, "global_step": 223461, "epoch": 2692} {"train_loss": -25.013837814331055, "global_step": 223462, "epoch": 2692} {"train_loss": -24.454322814941406, "global_step": 223463, "epoch": 2692} {"train_loss": -24.37894058227539, "global_step": 223464, "epoch": 2692} {"train_loss": -24.540515899658203, "global_step": 223465, "epoch": 2692} {"train_loss": -24.577299118041992, "global_step": 223466, "epoch": 2692} {"train_loss": -24.66597557067871, "global_step": 223467, "epoch": 2692} {"train_loss": -24.55657958984375, "global_step": 223468, "epoch": 2692} {"train_loss": -24.222877502441406, "global_step": 223469, "epoch": 2692} {"train_loss": -24.65461540222168, "global_step": 223470, "epoch": 2692} {"train_loss": -24.319721221923828, "global_step": 223471, "epoch": 2692} {"train_loss": -24.51460838317871, "global_step": 223472, "epoch": 2692} {"train_loss": -24.716808319091797, "global_step": 223473, "epoch": 2692} {"train_loss": -24.61966323852539, "global_step": 223474, "epoch": 2692} {"train_loss": -25.111806869506836, "global_step": 223475, "epoch": 2692} {"train_loss": -24.765182495117188, "global_step": 223476, "epoch": 2692} {"train_loss": -24.78956413269043, "global_step": 223477, "epoch": 2692} {"train_loss": -24.48763084411621, "global_step": 223478, "epoch": 2692} {"train_loss": -24.651226043701172, "global_step": 223479, "epoch": 2692} {"train_loss": -24.65205192565918, "global_step": 223480, "epoch": 2692} {"train_loss": -24.94586944580078, "global_step": 223481, "epoch": 2692} {"train_loss": -24.761707305908203, "global_step": 223482, "epoch": 2692} {"train_loss": -25.00191307067871, "global_step": 223483, "epoch": 2692} {"train_loss": -24.48925018310547, "global_step": 223484, "epoch": 2692} {"train_loss": -25.026931762695312, "global_step": 223485, "epoch": 2692} {"train_loss": -24.977537155151367, "global_step": 223486, "epoch": 2692} {"train_loss": -24.812021255493164, "global_step": 223487, "epoch": 2692} {"train_loss": -24.36724090576172, "global_step": 223488, "epoch": 2692} {"train_loss": -24.771394729614258, "global_step": 223489, "epoch": 2692} {"train_loss": -24.536828994750977, "global_step": 223490, "epoch": 2692} {"train_loss": -24.583498001098633, "global_step": 223491, "epoch": 2692} {"train_loss": -24.567636489868164, "global_step": 223492, "epoch": 2692} {"train_loss": -24.53720474243164, "global_step": 223493, "epoch": 2692} {"train_loss": -24.391897201538086, "global_step": 223494, "epoch": 2692} {"train_loss": -24.846628189086914, "global_step": 223495, "epoch": 2692} {"train_loss": -24.668066024780273, "global_step": 223496, "epoch": 2692} {"train_loss": -24.81210708618164, "global_step": 223497, "epoch": 2692} {"train_loss": -24.732343673706055, "global_step": 223498, "epoch": 2692} {"train_loss": -24.554746627807617, "global_step": 223499, "epoch": 2692} {"train_loss": -24.535188674926758, "global_step": 223500, "epoch": 2692} {"train_loss": -24.825777053833008, "global_step": 223501, "epoch": 2692} {"train_loss": -24.807310104370117, "global_step": 223502, "epoch": 2692} {"train_loss": -24.616823196411133, "global_step": 223503, "epoch": 2692} {"train_loss": -24.58429527282715, "global_step": 223504, "epoch": 2692} {"train_loss": -24.86452293395996, "global_step": 223505, "epoch": 2692} {"train_loss": -24.627687454223633, "global_step": 223506, "epoch": 2692} {"train_loss": -24.435039520263672, "global_step": 223507, "epoch": 2692} {"train_loss": -24.68549919128418, "global_step": 223508, "epoch": 2692} {"train_loss": -24.39056968688965, "global_step": 223509, "epoch": 2692} {"train_loss": -23.972049713134766, "global_step": 223510, "epoch": 2692} {"train_loss": -23.741762161254883, "global_step": 223511, "epoch": 2692} {"train_loss": -24.691495895385742, "global_step": 223512, "epoch": 2692} {"train_loss": -24.535079956054688, "global_step": 223513, "epoch": 2692} {"train_loss": -24.2172908782959, "global_step": 223514, "epoch": 2692} {"train_loss": -24.623889923095703, "global_step": 223515, "epoch": 2692} {"train_loss": -24.327312469482422, "global_step": 223516, "epoch": 2692} {"train_loss": -24.655054092407227, "global_step": 223517, "epoch": 2692} {"train_loss": -24.528271387858563, "global_step": 223518, "epoch": 2692, "val_loss": 6706414.0} {"train_loss": -24.128211975097656, "global_step": 223519, "epoch": 2693} {"train_loss": -24.00135612487793, "global_step": 223520, "epoch": 2693} {"train_loss": -24.082609176635742, "global_step": 223521, "epoch": 2693} {"train_loss": -23.88787841796875, "global_step": 223522, "epoch": 2693} {"train_loss": -23.86232566833496, "global_step": 223523, "epoch": 2693} {"train_loss": -24.152902603149414, "global_step": 223524, "epoch": 2693} {"train_loss": -24.1929988861084, "global_step": 223525, "epoch": 2693} {"train_loss": -24.035049438476562, "global_step": 223526, "epoch": 2693} {"train_loss": -23.919132232666016, "global_step": 223527, "epoch": 2693} {"train_loss": -24.452505111694336, "global_step": 223528, "epoch": 2693} {"train_loss": -24.238475799560547, "global_step": 223529, "epoch": 2693} {"train_loss": -24.36292839050293, "global_step": 223530, "epoch": 2693} {"train_loss": -24.800458908081055, "global_step": 223531, "epoch": 2693} {"train_loss": -24.24090003967285, "global_step": 223532, "epoch": 2693} {"train_loss": -24.631080627441406, "global_step": 223533, "epoch": 2693} {"train_loss": -24.01307487487793, "global_step": 223534, "epoch": 2693} {"train_loss": -24.312772750854492, "global_step": 223535, "epoch": 2693} {"train_loss": -24.60731315612793, "global_step": 223536, "epoch": 2693} {"train_loss": -24.826541900634766, "global_step": 223537, "epoch": 2693} {"train_loss": -24.497785568237305, "global_step": 223538, "epoch": 2693} {"train_loss": -24.260074615478516, "global_step": 223539, "epoch": 2693} {"train_loss": -24.68749237060547, "global_step": 223540, "epoch": 2693} {"train_loss": -24.429744720458984, "global_step": 223541, "epoch": 2693} {"train_loss": -24.90488052368164, "global_step": 223542, "epoch": 2693} {"train_loss": -24.572038650512695, "global_step": 223543, "epoch": 2693} {"train_loss": -24.810977935791016, "global_step": 223544, "epoch": 2693} {"train_loss": -24.72132682800293, "global_step": 223545, "epoch": 2693} {"train_loss": -24.49827766418457, "global_step": 223546, "epoch": 2693} {"train_loss": -24.85833168029785, "global_step": 223547, "epoch": 2693} {"train_loss": -24.372634887695312, "global_step": 223548, "epoch": 2693} {"train_loss": -24.95562171936035, "global_step": 223549, "epoch": 2693} {"train_loss": -24.68558692932129, "global_step": 223550, "epoch": 2693} {"train_loss": -24.724645614624023, "global_step": 223551, "epoch": 2693} {"train_loss": -24.973388671875, "global_step": 223552, "epoch": 2693} {"train_loss": -24.45979881286621, "global_step": 223553, "epoch": 2693} {"train_loss": -24.802648544311523, "global_step": 223554, "epoch": 2693} {"train_loss": -24.547334671020508, "global_step": 223555, "epoch": 2693} {"train_loss": -24.656904220581055, "global_step": 223556, "epoch": 2693} {"train_loss": -24.648387908935547, "global_step": 223557, "epoch": 2693} {"train_loss": -24.54572105407715, "global_step": 223558, "epoch": 2693} {"train_loss": -24.588533401489258, "global_step": 223559, "epoch": 2693} {"train_loss": -24.383848190307617, "global_step": 223560, "epoch": 2693} {"train_loss": -24.872434616088867, "global_step": 223561, "epoch": 2693} {"train_loss": -24.38408660888672, "global_step": 223562, "epoch": 2693} {"train_loss": -24.583236694335938, "global_step": 223563, "epoch": 2693} {"train_loss": -24.642658233642578, "global_step": 223564, "epoch": 2693} {"train_loss": -24.760887145996094, "global_step": 223565, "epoch": 2693} {"train_loss": -24.657676696777344, "global_step": 223566, "epoch": 2693} {"train_loss": -24.668684005737305, "global_step": 223567, "epoch": 2693} {"train_loss": -24.756757736206055, "global_step": 223568, "epoch": 2693} {"train_loss": -24.429777145385742, "global_step": 223569, "epoch": 2693} {"train_loss": -24.792692184448242, "global_step": 223570, "epoch": 2693} {"train_loss": -24.611215591430664, "global_step": 223571, "epoch": 2693} {"train_loss": -25.020212173461914, "global_step": 223572, "epoch": 2693} {"train_loss": -24.31320571899414, "global_step": 223573, "epoch": 2693} {"train_loss": -24.589378356933594, "global_step": 223574, "epoch": 2693} {"train_loss": -24.66475486755371, "global_step": 223575, "epoch": 2693} {"train_loss": -24.848857879638672, "global_step": 223576, "epoch": 2693} {"train_loss": -24.560640335083008, "global_step": 223577, "epoch": 2693} {"train_loss": -24.664030075073242, "global_step": 223578, "epoch": 2693} {"train_loss": -24.489377975463867, "global_step": 223579, "epoch": 2693} {"train_loss": -25.045392990112305, "global_step": 223580, "epoch": 2693} {"train_loss": -24.512039184570312, "global_step": 223581, "epoch": 2693} {"train_loss": -24.40030288696289, "global_step": 223582, "epoch": 2693} {"train_loss": -24.684621810913086, "global_step": 223583, "epoch": 2693} {"train_loss": -24.79326057434082, "global_step": 223584, "epoch": 2693} {"train_loss": -24.763051986694336, "global_step": 223585, "epoch": 2693} {"train_loss": -24.763208389282227, "global_step": 223586, "epoch": 2693} {"train_loss": -24.693235397338867, "global_step": 223587, "epoch": 2693} {"train_loss": -24.800373077392578, "global_step": 223588, "epoch": 2693} {"train_loss": -24.544153213500977, "global_step": 223589, "epoch": 2693} {"train_loss": -24.623273849487305, "global_step": 223590, "epoch": 2693} {"train_loss": -24.59962272644043, "global_step": 223591, "epoch": 2693} {"train_loss": -24.785690307617188, "global_step": 223592, "epoch": 2693} {"train_loss": -24.833431243896484, "global_step": 223593, "epoch": 2693} {"train_loss": -24.676151275634766, "global_step": 223594, "epoch": 2693} {"train_loss": -24.676076889038086, "global_step": 223595, "epoch": 2693} {"train_loss": -24.73031234741211, "global_step": 223596, "epoch": 2693} {"train_loss": -25.022235870361328, "global_step": 223597, "epoch": 2693} {"train_loss": -24.40134620666504, "global_step": 223598, "epoch": 2693} {"train_loss": -25.02776527404785, "global_step": 223599, "epoch": 2693} {"train_loss": -24.337238311767578, "global_step": 223600, "epoch": 2693} {"train_loss": -24.5664102715182, "global_step": 223601, "epoch": 2693, "val_loss": 6729451.0} {"train_loss": -24.279539108276367, "global_step": 223602, "epoch": 2694} {"train_loss": -24.360881805419922, "global_step": 223603, "epoch": 2694} {"train_loss": -24.637216567993164, "global_step": 223604, "epoch": 2694} {"train_loss": -24.473691940307617, "global_step": 223605, "epoch": 2694} {"train_loss": -24.313499450683594, "global_step": 223606, "epoch": 2694} {"train_loss": -24.44529151916504, "global_step": 223607, "epoch": 2694} {"train_loss": -24.602258682250977, "global_step": 223608, "epoch": 2694} {"train_loss": -24.66193962097168, "global_step": 223609, "epoch": 2694} {"train_loss": -24.777769088745117, "global_step": 223610, "epoch": 2694} {"train_loss": -24.38959312438965, "global_step": 223611, "epoch": 2694} {"train_loss": -24.553709030151367, "global_step": 223612, "epoch": 2694} {"train_loss": -25.043474197387695, "global_step": 223613, "epoch": 2694} {"train_loss": -24.213708877563477, "global_step": 223614, "epoch": 2694} {"train_loss": -24.433208465576172, "global_step": 223615, "epoch": 2694} {"train_loss": -24.79164695739746, "global_step": 223616, "epoch": 2694} {"train_loss": -24.883926391601562, "global_step": 223617, "epoch": 2694} {"train_loss": -24.760147094726562, "global_step": 223618, "epoch": 2694} {"train_loss": -24.418533325195312, "global_step": 223619, "epoch": 2694} {"train_loss": -24.633230209350586, "global_step": 223620, "epoch": 2694} {"train_loss": -24.4627685546875, "global_step": 223621, "epoch": 2694} {"train_loss": -24.728097915649414, "global_step": 223622, "epoch": 2694} {"train_loss": -24.61539077758789, "global_step": 223623, "epoch": 2694} {"train_loss": -24.64256477355957, "global_step": 223624, "epoch": 2694} {"train_loss": -24.26022720336914, "global_step": 223625, "epoch": 2694} {"train_loss": -24.801979064941406, "global_step": 223626, "epoch": 2694} {"train_loss": -24.494186401367188, "global_step": 223627, "epoch": 2694} {"train_loss": -24.589069366455078, "global_step": 223628, "epoch": 2694} {"train_loss": -24.3493709564209, "global_step": 223629, "epoch": 2694} {"train_loss": -24.63606834411621, "global_step": 223630, "epoch": 2694} {"train_loss": -24.872329711914062, "global_step": 223631, "epoch": 2694} {"train_loss": -24.61861801147461, "global_step": 223632, "epoch": 2694} {"train_loss": -24.726207733154297, "global_step": 223633, "epoch": 2694} {"train_loss": -24.5610294342041, "global_step": 223634, "epoch": 2694} {"train_loss": -25.11207389831543, "global_step": 223635, "epoch": 2694} {"train_loss": -24.414583206176758, "global_step": 223636, "epoch": 2694} {"train_loss": -24.453460693359375, "global_step": 223637, "epoch": 2694} {"train_loss": -24.329065322875977, "global_step": 223638, "epoch": 2694} {"train_loss": -24.64381980895996, "global_step": 223639, "epoch": 2694} {"train_loss": -24.85894775390625, "global_step": 223640, "epoch": 2694} {"train_loss": -24.598785400390625, "global_step": 223641, "epoch": 2694} {"train_loss": -24.637954711914062, "global_step": 223642, "epoch": 2694} {"train_loss": -24.828317642211914, "global_step": 223643, "epoch": 2694} {"train_loss": -24.81464958190918, "global_step": 223644, "epoch": 2694} {"train_loss": -24.96398162841797, "global_step": 223645, "epoch": 2694} {"train_loss": -24.940536499023438, "global_step": 223646, "epoch": 2694} {"train_loss": -24.44175148010254, "global_step": 223647, "epoch": 2694} {"train_loss": -25.015533447265625, "global_step": 223648, "epoch": 2694} {"train_loss": -24.904804229736328, "global_step": 223649, "epoch": 2694} {"train_loss": -24.746641159057617, "global_step": 223650, "epoch": 2694} {"train_loss": -24.623441696166992, "global_step": 223651, "epoch": 2694} {"train_loss": -24.340255737304688, "global_step": 223652, "epoch": 2694} {"train_loss": -24.447998046875, "global_step": 223653, "epoch": 2694} {"train_loss": -24.43719482421875, "global_step": 223654, "epoch": 2694} {"train_loss": -24.42237091064453, "global_step": 223655, "epoch": 2694} {"train_loss": -24.574155807495117, "global_step": 223656, "epoch": 2694} {"train_loss": -24.46121597290039, "global_step": 223657, "epoch": 2694} {"train_loss": -25.09309196472168, "global_step": 223658, "epoch": 2694} {"train_loss": -24.34551429748535, "global_step": 223659, "epoch": 2694} {"train_loss": -24.009227752685547, "global_step": 223660, "epoch": 2694} {"train_loss": -24.81032371520996, "global_step": 223661, "epoch": 2694} {"train_loss": -24.2903995513916, "global_step": 223662, "epoch": 2694} {"train_loss": -24.985876083374023, "global_step": 223663, "epoch": 2694} {"train_loss": -24.434558868408203, "global_step": 223664, "epoch": 2694} {"train_loss": -24.781461715698242, "global_step": 223665, "epoch": 2694} {"train_loss": -24.572084426879883, "global_step": 223666, "epoch": 2694} {"train_loss": -24.525054931640625, "global_step": 223667, "epoch": 2694} {"train_loss": -24.641881942749023, "global_step": 223668, "epoch": 2694} {"train_loss": -24.608135223388672, "global_step": 223669, "epoch": 2694} {"train_loss": -24.75895118713379, "global_step": 223670, "epoch": 2694} {"train_loss": -24.85487937927246, "global_step": 223671, "epoch": 2694} {"train_loss": -24.527952194213867, "global_step": 223672, "epoch": 2694} {"train_loss": -24.535776138305664, "global_step": 223673, "epoch": 2694} {"train_loss": -24.48321533203125, "global_step": 223674, "epoch": 2694} {"train_loss": -24.531538009643555, "global_step": 223675, "epoch": 2694} {"train_loss": -24.252721786499023, "global_step": 223676, "epoch": 2694} {"train_loss": -24.796167373657227, "global_step": 223677, "epoch": 2694} {"train_loss": -24.597139358520508, "global_step": 223678, "epoch": 2694} {"train_loss": -24.552539825439453, "global_step": 223679, "epoch": 2694} {"train_loss": -24.52713966369629, "global_step": 223680, "epoch": 2694} {"train_loss": -24.508005142211914, "global_step": 223681, "epoch": 2694} {"train_loss": -24.73407554626465, "global_step": 223682, "epoch": 2694} {"train_loss": -24.914798736572266, "global_step": 223683, "epoch": 2694} {"train_loss": -24.592337688767767, "global_step": 223684, "epoch": 2694, "val_loss": 6674868.0} {"train_loss": -24.588245391845703, "global_step": 223685, "epoch": 2695} {"train_loss": -24.248197555541992, "global_step": 223686, "epoch": 2695} {"train_loss": -24.247671127319336, "global_step": 223687, "epoch": 2695} {"train_loss": -24.28021812438965, "global_step": 223688, "epoch": 2695} {"train_loss": -24.342660903930664, "global_step": 223689, "epoch": 2695} {"train_loss": -24.152257919311523, "global_step": 223690, "epoch": 2695} {"train_loss": -24.13595199584961, "global_step": 223691, "epoch": 2695} {"train_loss": -24.370502471923828, "global_step": 223692, "epoch": 2695} {"train_loss": -24.547672271728516, "global_step": 223693, "epoch": 2695} {"train_loss": -24.02042579650879, "global_step": 223694, "epoch": 2695} {"train_loss": -24.364301681518555, "global_step": 223695, "epoch": 2695} {"train_loss": -24.59012794494629, "global_step": 223696, "epoch": 2695} {"train_loss": -24.593994140625, "global_step": 223697, "epoch": 2695} {"train_loss": -24.658044815063477, "global_step": 223698, "epoch": 2695} {"train_loss": -24.57733726501465, "global_step": 223699, "epoch": 2695} {"train_loss": -24.270885467529297, "global_step": 223700, "epoch": 2695} {"train_loss": -24.3183536529541, "global_step": 223701, "epoch": 2695} {"train_loss": -24.631317138671875, "global_step": 223702, "epoch": 2695} {"train_loss": -24.449092864990234, "global_step": 223703, "epoch": 2695} {"train_loss": -24.238412857055664, "global_step": 223704, "epoch": 2695} {"train_loss": -24.448293685913086, "global_step": 223705, "epoch": 2695} {"train_loss": -24.4995059967041, "global_step": 223706, "epoch": 2695} {"train_loss": -24.574533462524414, "global_step": 223707, "epoch": 2695} {"train_loss": -24.232267379760742, "global_step": 223708, "epoch": 2695} {"train_loss": -24.988691329956055, "global_step": 223709, "epoch": 2695} {"train_loss": -24.627771377563477, "global_step": 223710, "epoch": 2695} {"train_loss": -24.760377883911133, "global_step": 223711, "epoch": 2695} {"train_loss": -24.683469772338867, "global_step": 223712, "epoch": 2695} {"train_loss": -24.334590911865234, "global_step": 223713, "epoch": 2695} {"train_loss": -24.570837020874023, "global_step": 223714, "epoch": 2695} {"train_loss": -24.973552703857422, "global_step": 223715, "epoch": 2695} {"train_loss": -24.61959457397461, "global_step": 223716, "epoch": 2695} {"train_loss": -24.561397552490234, "global_step": 223717, "epoch": 2695} {"train_loss": -24.946460723876953, "global_step": 223718, "epoch": 2695} {"train_loss": -24.67276382446289, "global_step": 223719, "epoch": 2695} {"train_loss": -24.91314697265625, "global_step": 223720, "epoch": 2695} {"train_loss": -24.865509033203125, "global_step": 223721, "epoch": 2695} {"train_loss": -24.6062068939209, "global_step": 223722, "epoch": 2695} {"train_loss": -24.315448760986328, "global_step": 223723, "epoch": 2695} {"train_loss": -24.567108154296875, "global_step": 223724, "epoch": 2695} {"train_loss": -24.994260787963867, "global_step": 223725, "epoch": 2695} {"train_loss": -24.597854614257812, "global_step": 223726, "epoch": 2695} {"train_loss": -24.6357421875, "global_step": 223727, "epoch": 2695} {"train_loss": -24.993444442749023, "global_step": 223728, "epoch": 2695} {"train_loss": -24.191320419311523, "global_step": 223729, "epoch": 2695} {"train_loss": -24.330976486206055, "global_step": 223730, "epoch": 2695} {"train_loss": -24.7614803314209, "global_step": 223731, "epoch": 2695} {"train_loss": -24.285703659057617, "global_step": 223732, "epoch": 2695} {"train_loss": -24.6949462890625, "global_step": 223733, "epoch": 2695} {"train_loss": -24.556589126586914, "global_step": 223734, "epoch": 2695} {"train_loss": -24.479589462280273, "global_step": 223735, "epoch": 2695} {"train_loss": -25.166772842407227, "global_step": 223736, "epoch": 2695} {"train_loss": -24.619176864624023, "global_step": 223737, "epoch": 2695} {"train_loss": -24.717565536499023, "global_step": 223738, "epoch": 2695} {"train_loss": -24.452802658081055, "global_step": 223739, "epoch": 2695} {"train_loss": -24.716938018798828, "global_step": 223740, "epoch": 2695} {"train_loss": -24.76997184753418, "global_step": 223741, "epoch": 2695} {"train_loss": -24.543405532836914, "global_step": 223742, "epoch": 2695} {"train_loss": -24.482772827148438, "global_step": 223743, "epoch": 2695} {"train_loss": -24.856050491333008, "global_step": 223744, "epoch": 2695} {"train_loss": -24.6362247467041, "global_step": 223745, "epoch": 2695} {"train_loss": -24.84069061279297, "global_step": 223746, "epoch": 2695} {"train_loss": -24.594369888305664, "global_step": 223747, "epoch": 2695} {"train_loss": -25.014427185058594, "global_step": 223748, "epoch": 2695} {"train_loss": -24.952320098876953, "global_step": 223749, "epoch": 2695} {"train_loss": -24.990833282470703, "global_step": 223750, "epoch": 2695} {"train_loss": -24.734716415405273, "global_step": 223751, "epoch": 2695} {"train_loss": -24.69150161743164, "global_step": 223752, "epoch": 2695} {"train_loss": -24.895389556884766, "global_step": 223753, "epoch": 2695} {"train_loss": -24.417280197143555, "global_step": 223754, "epoch": 2695} {"train_loss": -24.523910522460938, "global_step": 223755, "epoch": 2695} {"train_loss": -24.745317459106445, "global_step": 223756, "epoch": 2695} {"train_loss": -24.666889190673828, "global_step": 223757, "epoch": 2695} {"train_loss": -24.7767391204834, "global_step": 223758, "epoch": 2695} {"train_loss": -24.869918823242188, "global_step": 223759, "epoch": 2695} {"train_loss": -24.88844871520996, "global_step": 223760, "epoch": 2695} {"train_loss": -24.579761505126953, "global_step": 223761, "epoch": 2695} {"train_loss": -24.50282859802246, "global_step": 223762, "epoch": 2695} {"train_loss": -24.58848762512207, "global_step": 223763, "epoch": 2695} {"train_loss": -24.819135665893555, "global_step": 223764, "epoch": 2695} {"train_loss": -25.179227828979492, "global_step": 223765, "epoch": 2695} {"train_loss": -24.660837173461914, "global_step": 223766, "epoch": 2695} {"train_loss": -24.611888173114824, "global_step": 223767, "epoch": 2695, "val_loss": 6687808.5} {"train_loss": -23.98605728149414, "global_step": 223768, "epoch": 2696} {"train_loss": -23.695621490478516, "global_step": 223769, "epoch": 2696} {"train_loss": -23.766538619995117, "global_step": 223770, "epoch": 2696} {"train_loss": -22.341876983642578, "global_step": 223771, "epoch": 2696} {"train_loss": -22.19607925415039, "global_step": 223772, "epoch": 2696} {"train_loss": -23.65597915649414, "global_step": 223773, "epoch": 2696} {"train_loss": -23.795074462890625, "global_step": 223774, "epoch": 2696} {"train_loss": -22.83778190612793, "global_step": 223775, "epoch": 2696} {"train_loss": -23.960895538330078, "global_step": 223776, "epoch": 2696} {"train_loss": -23.566850662231445, "global_step": 223777, "epoch": 2696} {"train_loss": -23.585493087768555, "global_step": 223778, "epoch": 2696} {"train_loss": -23.77726173400879, "global_step": 223779, "epoch": 2696} {"train_loss": -23.75185203552246, "global_step": 223780, "epoch": 2696} {"train_loss": -23.681808471679688, "global_step": 223781, "epoch": 2696} {"train_loss": -24.38004493713379, "global_step": 223782, "epoch": 2696} {"train_loss": -24.112720489501953, "global_step": 223783, "epoch": 2696} {"train_loss": -23.874237060546875, "global_step": 223784, "epoch": 2696} {"train_loss": -23.9294376373291, "global_step": 223785, "epoch": 2696} {"train_loss": -23.795949935913086, "global_step": 223786, "epoch": 2696} {"train_loss": -24.260757446289062, "global_step": 223787, "epoch": 2696} {"train_loss": -24.240400314331055, "global_step": 223788, "epoch": 2696} {"train_loss": -24.39068603515625, "global_step": 223789, "epoch": 2696} {"train_loss": -24.001596450805664, "global_step": 223790, "epoch": 2696} {"train_loss": -24.23084831237793, "global_step": 223791, "epoch": 2696} {"train_loss": -24.302309036254883, "global_step": 223792, "epoch": 2696} {"train_loss": -24.0109920501709, "global_step": 223793, "epoch": 2696} {"train_loss": -24.5026912689209, "global_step": 223794, "epoch": 2696} {"train_loss": -24.499631881713867, "global_step": 223795, "epoch": 2696} {"train_loss": -24.556730270385742, "global_step": 223796, "epoch": 2696} {"train_loss": -24.516714096069336, "global_step": 223797, "epoch": 2696} {"train_loss": -24.420108795166016, "global_step": 223798, "epoch": 2696} {"train_loss": -24.402204513549805, "global_step": 223799, "epoch": 2696} {"train_loss": -24.216510772705078, "global_step": 223800, "epoch": 2696} {"train_loss": -24.454143524169922, "global_step": 223801, "epoch": 2696} {"train_loss": -24.17597007751465, "global_step": 223802, "epoch": 2696} {"train_loss": -24.488365173339844, "global_step": 223803, "epoch": 2696} {"train_loss": -24.545801162719727, "global_step": 223804, "epoch": 2696} {"train_loss": -24.603797912597656, "global_step": 223805, "epoch": 2696} {"train_loss": -24.604074478149414, "global_step": 223806, "epoch": 2696} {"train_loss": -24.40073013305664, "global_step": 223807, "epoch": 2696} {"train_loss": -24.465946197509766, "global_step": 223808, "epoch": 2696} {"train_loss": -24.464323043823242, "global_step": 223809, "epoch": 2696} {"train_loss": -24.736827850341797, "global_step": 223810, "epoch": 2696} {"train_loss": -24.830835342407227, "global_step": 223811, "epoch": 2696} {"train_loss": -24.589603424072266, "global_step": 223812, "epoch": 2696} {"train_loss": -24.791608810424805, "global_step": 223813, "epoch": 2696} {"train_loss": -24.385211944580078, "global_step": 223814, "epoch": 2696} {"train_loss": -24.869565963745117, "global_step": 223815, "epoch": 2696} {"train_loss": -24.71703338623047, "global_step": 223816, "epoch": 2696} {"train_loss": -24.680240631103516, "global_step": 223817, "epoch": 2696} {"train_loss": -24.783432006835938, "global_step": 223818, "epoch": 2696} {"train_loss": -24.864765167236328, "global_step": 223819, "epoch": 2696} {"train_loss": -24.57282066345215, "global_step": 223820, "epoch": 2696} {"train_loss": -24.704843521118164, "global_step": 223821, "epoch": 2696} {"train_loss": -24.498472213745117, "global_step": 223822, "epoch": 2696} {"train_loss": -25.245914459228516, "global_step": 223823, "epoch": 2696} {"train_loss": -24.4981746673584, "global_step": 223824, "epoch": 2696} {"train_loss": -24.627073287963867, "global_step": 223825, "epoch": 2696} {"train_loss": -24.540430068969727, "global_step": 223826, "epoch": 2696} {"train_loss": -24.64954948425293, "global_step": 223827, "epoch": 2696} {"train_loss": -24.50896644592285, "global_step": 223828, "epoch": 2696} {"train_loss": -24.67629051208496, "global_step": 223829, "epoch": 2696} {"train_loss": -24.5849552154541, "global_step": 223830, "epoch": 2696} {"train_loss": -24.3931884765625, "global_step": 223831, "epoch": 2696} {"train_loss": -24.57135772705078, "global_step": 223832, "epoch": 2696} {"train_loss": -24.5551815032959, "global_step": 223833, "epoch": 2696} {"train_loss": -24.97157859802246, "global_step": 223834, "epoch": 2696} {"train_loss": -24.619245529174805, "global_step": 223835, "epoch": 2696} {"train_loss": -24.53740692138672, "global_step": 223836, "epoch": 2696} {"train_loss": -24.76885414123535, "global_step": 223837, "epoch": 2696} {"train_loss": -24.4066219329834, "global_step": 223838, "epoch": 2696} {"train_loss": -24.34333610534668, "global_step": 223839, "epoch": 2696} {"train_loss": -24.64266014099121, "global_step": 223840, "epoch": 2696} {"train_loss": -24.6643009185791, "global_step": 223841, "epoch": 2696} {"train_loss": -24.735916137695312, "global_step": 223842, "epoch": 2696} {"train_loss": -24.547895431518555, "global_step": 223843, "epoch": 2696} {"train_loss": -24.540802001953125, "global_step": 223844, "epoch": 2696} {"train_loss": -24.400360107421875, "global_step": 223845, "epoch": 2696} {"train_loss": -24.435054779052734, "global_step": 223846, "epoch": 2696} {"train_loss": -24.60401153564453, "global_step": 223847, "epoch": 2696} {"train_loss": -24.96637535095215, "global_step": 223848, "epoch": 2696} {"train_loss": -24.53488540649414, "global_step": 223849, "epoch": 2696} {"train_loss": -24.341703989419592, "global_step": 223850, "epoch": 2696, "val_loss": 6734746.0} {"train_loss": -24.2060604095459, "global_step": 223851, "epoch": 2697} {"train_loss": -23.857637405395508, "global_step": 223852, "epoch": 2697} {"train_loss": -24.4464111328125, "global_step": 223853, "epoch": 2697} {"train_loss": -24.1297664642334, "global_step": 223854, "epoch": 2697} {"train_loss": -24.166479110717773, "global_step": 223855, "epoch": 2697} {"train_loss": -24.298704147338867, "global_step": 223856, "epoch": 2697} {"train_loss": -24.364194869995117, "global_step": 223857, "epoch": 2697} {"train_loss": -24.618576049804688, "global_step": 223858, "epoch": 2697} {"train_loss": -24.304407119750977, "global_step": 223859, "epoch": 2697} {"train_loss": -24.151901245117188, "global_step": 223860, "epoch": 2697} {"train_loss": -24.423025131225586, "global_step": 223861, "epoch": 2697} {"train_loss": -24.069143295288086, "global_step": 223862, "epoch": 2697} {"train_loss": -24.556156158447266, "global_step": 223863, "epoch": 2697} {"train_loss": -24.40787124633789, "global_step": 223864, "epoch": 2697} {"train_loss": -24.368127822875977, "global_step": 223865, "epoch": 2697} {"train_loss": -24.91139793395996, "global_step": 223866, "epoch": 2697} {"train_loss": -24.5376033782959, "global_step": 223867, "epoch": 2697} {"train_loss": -24.535053253173828, "global_step": 223868, "epoch": 2697} {"train_loss": -24.637792587280273, "global_step": 223869, "epoch": 2697} {"train_loss": -24.249603271484375, "global_step": 223870, "epoch": 2697} {"train_loss": -24.21002769470215, "global_step": 223871, "epoch": 2697} {"train_loss": -24.268238067626953, "global_step": 223872, "epoch": 2697} {"train_loss": -24.657838821411133, "global_step": 223873, "epoch": 2697} {"train_loss": -24.708139419555664, "global_step": 223874, "epoch": 2697} {"train_loss": -24.725549697875977, "global_step": 223875, "epoch": 2697} {"train_loss": -24.78480339050293, "global_step": 223876, "epoch": 2697} {"train_loss": -24.635217666625977, "global_step": 223877, "epoch": 2697} {"train_loss": -24.513288497924805, "global_step": 223878, "epoch": 2697} {"train_loss": -24.513072967529297, "global_step": 223879, "epoch": 2697} {"train_loss": -24.445293426513672, "global_step": 223880, "epoch": 2697} {"train_loss": -24.490312576293945, "global_step": 223881, "epoch": 2697} {"train_loss": -24.6824951171875, "global_step": 223882, "epoch": 2697} {"train_loss": -24.77473258972168, "global_step": 223883, "epoch": 2697} {"train_loss": -24.85616111755371, "global_step": 223884, "epoch": 2697} {"train_loss": -24.49336814880371, "global_step": 223885, "epoch": 2697} {"train_loss": -25.100263595581055, "global_step": 223886, "epoch": 2697} {"train_loss": -24.724781036376953, "global_step": 223887, "epoch": 2697} {"train_loss": -24.919464111328125, "global_step": 223888, "epoch": 2697} {"train_loss": -24.92951774597168, "global_step": 223889, "epoch": 2697} {"train_loss": -24.742115020751953, "global_step": 223890, "epoch": 2697} {"train_loss": -24.863157272338867, "global_step": 223891, "epoch": 2697} {"train_loss": -24.70683479309082, "global_step": 223892, "epoch": 2697} {"train_loss": -24.7003173828125, "global_step": 223893, "epoch": 2697} {"train_loss": -24.89838981628418, "global_step": 223894, "epoch": 2697} {"train_loss": -24.91802215576172, "global_step": 223895, "epoch": 2697} {"train_loss": -24.80265235900879, "global_step": 223896, "epoch": 2697} {"train_loss": -24.928674697875977, "global_step": 223897, "epoch": 2697} {"train_loss": -24.95334243774414, "global_step": 223898, "epoch": 2697} {"train_loss": -24.869014739990234, "global_step": 223899, "epoch": 2697} {"train_loss": -25.12992286682129, "global_step": 223900, "epoch": 2697} {"train_loss": -24.703298568725586, "global_step": 223901, "epoch": 2697} {"train_loss": -25.021514892578125, "global_step": 223902, "epoch": 2697} {"train_loss": -24.795495986938477, "global_step": 223903, "epoch": 2697} {"train_loss": -24.621479034423828, "global_step": 223904, "epoch": 2697} {"train_loss": -24.66425132751465, "global_step": 223905, "epoch": 2697} {"train_loss": -24.93022346496582, "global_step": 223906, "epoch": 2697} {"train_loss": -24.513877868652344, "global_step": 223907, "epoch": 2697} {"train_loss": -24.941335678100586, "global_step": 223908, "epoch": 2697} {"train_loss": -24.810293197631836, "global_step": 223909, "epoch": 2697} {"train_loss": -24.931171417236328, "global_step": 223910, "epoch": 2697} {"train_loss": -24.549285888671875, "global_step": 223911, "epoch": 2697} {"train_loss": -24.728954315185547, "global_step": 223912, "epoch": 2697} {"train_loss": -24.703632354736328, "global_step": 223913, "epoch": 2697} {"train_loss": -24.9575252532959, "global_step": 223914, "epoch": 2697} {"train_loss": -24.40083885192871, "global_step": 223915, "epoch": 2697} {"train_loss": -24.531484603881836, "global_step": 223916, "epoch": 2697} {"train_loss": -24.58278465270996, "global_step": 223917, "epoch": 2697} {"train_loss": -24.477434158325195, "global_step": 223918, "epoch": 2697} {"train_loss": -25.05682945251465, "global_step": 223919, "epoch": 2697} {"train_loss": -24.842641830444336, "global_step": 223920, "epoch": 2697} {"train_loss": -24.52662467956543, "global_step": 223921, "epoch": 2697} {"train_loss": -24.38683319091797, "global_step": 223922, "epoch": 2697} {"train_loss": -24.591291427612305, "global_step": 223923, "epoch": 2697} {"train_loss": -24.635419845581055, "global_step": 223924, "epoch": 2697} {"train_loss": -24.356189727783203, "global_step": 223925, "epoch": 2697} {"train_loss": -24.97977066040039, "global_step": 223926, "epoch": 2697} {"train_loss": -24.824316024780273, "global_step": 223927, "epoch": 2697} {"train_loss": -24.193878173828125, "global_step": 223928, "epoch": 2697} {"train_loss": -25.054033279418945, "global_step": 223929, "epoch": 2697} {"train_loss": -24.491437911987305, "global_step": 223930, "epoch": 2697} {"train_loss": -24.617965698242188, "global_step": 223931, "epoch": 2697} {"train_loss": -24.85485076904297, "global_step": 223932, "epoch": 2697} {"train_loss": -24.643074679087444, "global_step": 223933, "epoch": 2697, "val_loss": 6716828.0} {"train_loss": -24.7053279876709, "global_step": 223934, "epoch": 2698} {"train_loss": -24.39796257019043, "global_step": 223935, "epoch": 2698} {"train_loss": -24.376794815063477, "global_step": 223936, "epoch": 2698} {"train_loss": -24.183940887451172, "global_step": 223937, "epoch": 2698} {"train_loss": -24.601484298706055, "global_step": 223938, "epoch": 2698} {"train_loss": -24.52471923828125, "global_step": 223939, "epoch": 2698} {"train_loss": -24.315473556518555, "global_step": 223940, "epoch": 2698} {"train_loss": -24.450374603271484, "global_step": 223941, "epoch": 2698} {"train_loss": -23.953916549682617, "global_step": 223942, "epoch": 2698} {"train_loss": -24.596115112304688, "global_step": 223943, "epoch": 2698} {"train_loss": -24.42203140258789, "global_step": 223944, "epoch": 2698} {"train_loss": -24.603775024414062, "global_step": 223945, "epoch": 2698} {"train_loss": -24.716983795166016, "global_step": 223946, "epoch": 2698} {"train_loss": -24.194738388061523, "global_step": 223947, "epoch": 2698} {"train_loss": -24.230243682861328, "global_step": 223948, "epoch": 2698} {"train_loss": -24.300085067749023, "global_step": 223949, "epoch": 2698} {"train_loss": -24.397743225097656, "global_step": 223950, "epoch": 2698} {"train_loss": -23.931259155273438, "global_step": 223951, "epoch": 2698} {"train_loss": -24.874547958374023, "global_step": 223952, "epoch": 2698} {"train_loss": -24.68959617614746, "global_step": 223953, "epoch": 2698} {"train_loss": -24.66552734375, "global_step": 223954, "epoch": 2698} {"train_loss": -24.512100219726562, "global_step": 223955, "epoch": 2698} {"train_loss": -24.27518653869629, "global_step": 223956, "epoch": 2698} {"train_loss": -24.258161544799805, "global_step": 223957, "epoch": 2698} {"train_loss": -24.263784408569336, "global_step": 223958, "epoch": 2698} {"train_loss": -24.6328182220459, "global_step": 223959, "epoch": 2698} {"train_loss": -24.676109313964844, "global_step": 223960, "epoch": 2698} {"train_loss": -24.505788803100586, "global_step": 223961, "epoch": 2698} {"train_loss": -24.877639770507812, "global_step": 223962, "epoch": 2698} {"train_loss": -24.572996139526367, "global_step": 223963, "epoch": 2698} {"train_loss": -24.852449417114258, "global_step": 223964, "epoch": 2698} {"train_loss": -24.495771408081055, "global_step": 223965, "epoch": 2698} {"train_loss": -24.459165573120117, "global_step": 223966, "epoch": 2698} {"train_loss": -24.66683006286621, "global_step": 223967, "epoch": 2698} {"train_loss": -24.328876495361328, "global_step": 223968, "epoch": 2698} {"train_loss": -24.526975631713867, "global_step": 223969, "epoch": 2698} {"train_loss": -24.55931854248047, "global_step": 223970, "epoch": 2698} {"train_loss": -24.761655807495117, "global_step": 223971, "epoch": 2698} {"train_loss": -24.544919967651367, "global_step": 223972, "epoch": 2698} {"train_loss": -24.445287704467773, "global_step": 223973, "epoch": 2698} {"train_loss": -24.838438034057617, "global_step": 223974, "epoch": 2698} {"train_loss": -24.46160888671875, "global_step": 223975, "epoch": 2698} {"train_loss": -24.42596435546875, "global_step": 223976, "epoch": 2698} {"train_loss": -24.70592498779297, "global_step": 223977, "epoch": 2698} {"train_loss": -25.07931137084961, "global_step": 223978, "epoch": 2698} {"train_loss": -24.627065658569336, "global_step": 223979, "epoch": 2698} {"train_loss": -25.015472412109375, "global_step": 223980, "epoch": 2698} {"train_loss": -24.65113639831543, "global_step": 223981, "epoch": 2698} {"train_loss": -24.857707977294922, "global_step": 223982, "epoch": 2698} {"train_loss": -24.74765396118164, "global_step": 223983, "epoch": 2698} {"train_loss": -24.843326568603516, "global_step": 223984, "epoch": 2698} {"train_loss": -24.92731285095215, "global_step": 223985, "epoch": 2698} {"train_loss": -24.855417251586914, "global_step": 223986, "epoch": 2698} {"train_loss": -25.00349998474121, "global_step": 223987, "epoch": 2698} {"train_loss": -24.801742553710938, "global_step": 223988, "epoch": 2698} {"train_loss": -24.810422897338867, "global_step": 223989, "epoch": 2698} {"train_loss": -24.78550148010254, "global_step": 223990, "epoch": 2698} {"train_loss": -24.66133689880371, "global_step": 223991, "epoch": 2698} {"train_loss": -24.50094985961914, "global_step": 223992, "epoch": 2698} {"train_loss": -24.07716178894043, "global_step": 223993, "epoch": 2698} {"train_loss": -23.133920669555664, "global_step": 223994, "epoch": 2698} {"train_loss": -24.13888168334961, "global_step": 223995, "epoch": 2698} {"train_loss": -23.991540908813477, "global_step": 223996, "epoch": 2698} {"train_loss": -24.34918212890625, "global_step": 223997, "epoch": 2698} {"train_loss": -24.33331871032715, "global_step": 223998, "epoch": 2698} {"train_loss": -24.112262725830078, "global_step": 223999, "epoch": 2698} {"train_loss": -23.565841674804688, "global_step": 224000, "epoch": 2698} {"train_loss": -24.124664306640625, "global_step": 224001, "epoch": 2698} {"train_loss": -23.912221908569336, "global_step": 224002, "epoch": 2698} {"train_loss": -24.87709617614746, "global_step": 224003, "epoch": 2698} {"train_loss": -24.34463882446289, "global_step": 224004, "epoch": 2698} {"train_loss": -24.13690757751465, "global_step": 224005, "epoch": 2698} {"train_loss": -24.61086654663086, "global_step": 224006, "epoch": 2698} {"train_loss": -24.371082305908203, "global_step": 224007, "epoch": 2698} {"train_loss": -24.367321014404297, "global_step": 224008, "epoch": 2698} {"train_loss": -24.430959701538086, "global_step": 224009, "epoch": 2698} {"train_loss": -24.699575424194336, "global_step": 224010, "epoch": 2698} {"train_loss": -24.751489639282227, "global_step": 224011, "epoch": 2698} {"train_loss": -24.87958526611328, "global_step": 224012, "epoch": 2698} {"train_loss": -24.331253051757812, "global_step": 224013, "epoch": 2698} {"train_loss": -24.459299087524414, "global_step": 224014, "epoch": 2698} {"train_loss": -24.59857749938965, "global_step": 224015, "epoch": 2698} {"train_loss": -24.494455751166285, "global_step": 224016, "epoch": 2698, "val_loss": 6621745.0} {"train_loss": -24.06205177307129, "global_step": 224017, "epoch": 2699} {"train_loss": -24.296430587768555, "global_step": 224018, "epoch": 2699} {"train_loss": -24.34827423095703, "global_step": 224019, "epoch": 2699} {"train_loss": -24.049583435058594, "global_step": 224020, "epoch": 2699} {"train_loss": -23.94781494140625, "global_step": 224021, "epoch": 2699} {"train_loss": -24.4974308013916, "global_step": 224022, "epoch": 2699} {"train_loss": -24.431325912475586, "global_step": 224023, "epoch": 2699} {"train_loss": -24.4010009765625, "global_step": 224024, "epoch": 2699} {"train_loss": -24.254642486572266, "global_step": 224025, "epoch": 2699} {"train_loss": -24.41806983947754, "global_step": 224026, "epoch": 2699} {"train_loss": -24.492887496948242, "global_step": 224027, "epoch": 2699} {"train_loss": -24.44333839416504, "global_step": 224028, "epoch": 2699} {"train_loss": -24.38340187072754, "global_step": 224029, "epoch": 2699} {"train_loss": -24.412128448486328, "global_step": 224030, "epoch": 2699} {"train_loss": -24.437673568725586, "global_step": 224031, "epoch": 2699} {"train_loss": -24.436508178710938, "global_step": 224032, "epoch": 2699} {"train_loss": -24.315637588500977, "global_step": 224033, "epoch": 2699} {"train_loss": -24.373106002807617, "global_step": 224034, "epoch": 2699} {"train_loss": -24.83047866821289, "global_step": 224035, "epoch": 2699} {"train_loss": -24.635746002197266, "global_step": 224036, "epoch": 2699} {"train_loss": -24.421777725219727, "global_step": 224037, "epoch": 2699} {"train_loss": -24.819826126098633, "global_step": 224038, "epoch": 2699} {"train_loss": -24.829837799072266, "global_step": 224039, "epoch": 2699} {"train_loss": -24.491924285888672, "global_step": 224040, "epoch": 2699} {"train_loss": -24.660276412963867, "global_step": 224041, "epoch": 2699} {"train_loss": -24.656583786010742, "global_step": 224042, "epoch": 2699} {"train_loss": -24.922544479370117, "global_step": 224043, "epoch": 2699} {"train_loss": -24.271413803100586, "global_step": 224044, "epoch": 2699} {"train_loss": -24.407506942749023, "global_step": 224045, "epoch": 2699} {"train_loss": -24.249242782592773, "global_step": 224046, "epoch": 2699} {"train_loss": -24.713973999023438, "global_step": 224047, "epoch": 2699} {"train_loss": -24.449697494506836, "global_step": 224048, "epoch": 2699} {"train_loss": -24.76670265197754, "global_step": 224049, "epoch": 2699} {"train_loss": -24.679006576538086, "global_step": 224050, "epoch": 2699} {"train_loss": -24.457172393798828, "global_step": 224051, "epoch": 2699} {"train_loss": -24.38755226135254, "global_step": 224052, "epoch": 2699} {"train_loss": -24.943647384643555, "global_step": 224053, "epoch": 2699} {"train_loss": -24.77227210998535, "global_step": 224054, "epoch": 2699} {"train_loss": -24.920774459838867, "global_step": 224055, "epoch": 2699} {"train_loss": -24.678646087646484, "global_step": 224056, "epoch": 2699} {"train_loss": -24.377696990966797, "global_step": 224057, "epoch": 2699} {"train_loss": -24.68438148498535, "global_step": 224058, "epoch": 2699} {"train_loss": -25.022974014282227, "global_step": 224059, "epoch": 2699} {"train_loss": -24.480356216430664, "global_step": 224060, "epoch": 2699} {"train_loss": -24.74164390563965, "global_step": 224061, "epoch": 2699} {"train_loss": -24.49164390563965, "global_step": 224062, "epoch": 2699} {"train_loss": -24.82680320739746, "global_step": 224063, "epoch": 2699} {"train_loss": -24.389127731323242, "global_step": 224064, "epoch": 2699} {"train_loss": -24.7426815032959, "global_step": 224065, "epoch": 2699} {"train_loss": -24.817813873291016, "global_step": 224066, "epoch": 2699} {"train_loss": -24.831073760986328, "global_step": 224067, "epoch": 2699} {"train_loss": -24.824684143066406, "global_step": 224068, "epoch": 2699} {"train_loss": -24.472990036010742, "global_step": 224069, "epoch": 2699} {"train_loss": -24.167177200317383, "global_step": 224070, "epoch": 2699} {"train_loss": -23.681236267089844, "global_step": 224071, "epoch": 2699} {"train_loss": -24.255277633666992, "global_step": 224072, "epoch": 2699} {"train_loss": -24.485544204711914, "global_step": 224073, "epoch": 2699} {"train_loss": -24.495716094970703, "global_step": 224074, "epoch": 2699} {"train_loss": -24.272628784179688, "global_step": 224075, "epoch": 2699} {"train_loss": -24.464141845703125, "global_step": 224076, "epoch": 2699} {"train_loss": -24.7298526763916, "global_step": 224077, "epoch": 2699} {"train_loss": -24.851160049438477, "global_step": 224078, "epoch": 2699} {"train_loss": -24.20017433166504, "global_step": 224079, "epoch": 2699} {"train_loss": -24.27821159362793, "global_step": 224080, "epoch": 2699} {"train_loss": -24.36778450012207, "global_step": 224081, "epoch": 2699} {"train_loss": -24.49176788330078, "global_step": 224082, "epoch": 2699} {"train_loss": -24.554712295532227, "global_step": 224083, "epoch": 2699} {"train_loss": -24.64321517944336, "global_step": 224084, "epoch": 2699} {"train_loss": -24.82126808166504, "global_step": 224085, "epoch": 2699} {"train_loss": -24.76511573791504, "global_step": 224086, "epoch": 2699} {"train_loss": -24.771984100341797, "global_step": 224087, "epoch": 2699} {"train_loss": -24.731388092041016, "global_step": 224088, "epoch": 2699} {"train_loss": -24.799070358276367, "global_step": 224089, "epoch": 2699} {"train_loss": -25.00004005432129, "global_step": 224090, "epoch": 2699} {"train_loss": -25.015913009643555, "global_step": 224091, "epoch": 2699} {"train_loss": -24.608083724975586, "global_step": 224092, "epoch": 2699} {"train_loss": -24.608978271484375, "global_step": 224093, "epoch": 2699} {"train_loss": -24.461891174316406, "global_step": 224094, "epoch": 2699} {"train_loss": -24.212099075317383, "global_step": 224095, "epoch": 2699} {"train_loss": -24.956262588500977, "global_step": 224096, "epoch": 2699} {"train_loss": -24.710500717163086, "global_step": 224097, "epoch": 2699} {"train_loss": -24.936521530151367, "global_step": 224098, "epoch": 2699} {"train_loss": -24.523196231888, "global_step": 224099, "epoch": 2699, "val_loss": 6727267.0} {"train_loss": -23.305723190307617, "global_step": 224100, "epoch": 2700} {"train_loss": -23.4849796295166, "global_step": 224101, "epoch": 2700} {"train_loss": -24.530197143554688, "global_step": 224102, "epoch": 2700} {"train_loss": -23.4564151763916, "global_step": 224103, "epoch": 2700} {"train_loss": -24.157451629638672, "global_step": 224104, "epoch": 2700} {"train_loss": -23.861610412597656, "global_step": 224105, "epoch": 2700} {"train_loss": -24.301305770874023, "global_step": 224106, "epoch": 2700} {"train_loss": -24.050939559936523, "global_step": 224107, "epoch": 2700} {"train_loss": -24.19571876525879, "global_step": 224108, "epoch": 2700} {"train_loss": -24.098068237304688, "global_step": 224109, "epoch": 2700} {"train_loss": -24.17157554626465, "global_step": 224110, "epoch": 2700} {"train_loss": -24.182592391967773, "global_step": 224111, "epoch": 2700} {"train_loss": -24.306543350219727, "global_step": 224112, "epoch": 2700} {"train_loss": -24.105810165405273, "global_step": 224113, "epoch": 2700} {"train_loss": -23.918556213378906, "global_step": 224114, "epoch": 2700} {"train_loss": -24.371870040893555, "global_step": 224115, "epoch": 2700} {"train_loss": -24.407386779785156, "global_step": 224116, "epoch": 2700} {"train_loss": -24.581594467163086, "global_step": 224117, "epoch": 2700} {"train_loss": -24.595016479492188, "global_step": 224118, "epoch": 2700} {"train_loss": -24.53755760192871, "global_step": 224119, "epoch": 2700} {"train_loss": -24.339824676513672, "global_step": 224120, "epoch": 2700} {"train_loss": -24.43122100830078, "global_step": 224121, "epoch": 2700} {"train_loss": -24.5247859954834, "global_step": 224122, "epoch": 2700} {"train_loss": -24.434856414794922, "global_step": 224123, "epoch": 2700} {"train_loss": -24.482545852661133, "global_step": 224124, "epoch": 2700} {"train_loss": -24.497650146484375, "global_step": 224125, "epoch": 2700} {"train_loss": -24.373035430908203, "global_step": 224126, "epoch": 2700} {"train_loss": -24.50144386291504, "global_step": 224127, "epoch": 2700} {"train_loss": -24.51032257080078, "global_step": 224128, "epoch": 2700} {"train_loss": -24.328737258911133, "global_step": 224129, "epoch": 2700} {"train_loss": -24.512798309326172, "global_step": 224130, "epoch": 2700} {"train_loss": -24.979984283447266, "global_step": 224131, "epoch": 2700} {"train_loss": -24.62456703186035, "global_step": 224132, "epoch": 2700} {"train_loss": -24.425914764404297, "global_step": 224133, "epoch": 2700} {"train_loss": -24.572587966918945, "global_step": 224134, "epoch": 2700} {"train_loss": -24.208072662353516, "global_step": 224135, "epoch": 2700} {"train_loss": -24.409320831298828, "global_step": 224136, "epoch": 2700} {"train_loss": -24.677814483642578, "global_step": 224137, "epoch": 2700} {"train_loss": -24.980270385742188, "global_step": 224138, "epoch": 2700} {"train_loss": -24.604082107543945, "global_step": 224139, "epoch": 2700} {"train_loss": -24.67902183532715, "global_step": 224140, "epoch": 2700} {"train_loss": -24.601591110229492, "global_step": 224141, "epoch": 2700} {"train_loss": -24.38032341003418, "global_step": 224142, "epoch": 2700} {"train_loss": -24.76418113708496, "global_step": 224143, "epoch": 2700} {"train_loss": -24.78504753112793, "global_step": 224144, "epoch": 2700} {"train_loss": -24.473724365234375, "global_step": 224145, "epoch": 2700} {"train_loss": -24.714689254760742, "global_step": 224146, "epoch": 2700} {"train_loss": -24.764249801635742, "global_step": 224147, "epoch": 2700} {"train_loss": -24.869123458862305, "global_step": 224148, "epoch": 2700} {"train_loss": -24.853700637817383, "global_step": 224149, "epoch": 2700} {"train_loss": -24.767704010009766, "global_step": 224150, "epoch": 2700} {"train_loss": -24.806909561157227, "global_step": 224151, "epoch": 2700} {"train_loss": -24.7343692779541, "global_step": 224152, "epoch": 2700} {"train_loss": -24.286914825439453, "global_step": 224153, "epoch": 2700} {"train_loss": -24.01508140563965, "global_step": 224154, "epoch": 2700} {"train_loss": -24.32734489440918, "global_step": 224155, "epoch": 2700} {"train_loss": -24.763675689697266, "global_step": 224156, "epoch": 2700} {"train_loss": -24.7692928314209, "global_step": 224157, "epoch": 2700} {"train_loss": -24.3016300201416, "global_step": 224158, "epoch": 2700} {"train_loss": -24.994373321533203, "global_step": 224159, "epoch": 2700} {"train_loss": -24.713258743286133, "global_step": 224160, "epoch": 2700} {"train_loss": -24.890592575073242, "global_step": 224161, "epoch": 2700} {"train_loss": -24.900867462158203, "global_step": 224162, "epoch": 2700} {"train_loss": -24.647043228149414, "global_step": 224163, "epoch": 2700} {"train_loss": -24.753952026367188, "global_step": 224164, "epoch": 2700} {"train_loss": -24.86991310119629, "global_step": 224165, "epoch": 2700} {"train_loss": -24.589599609375, "global_step": 224166, "epoch": 2700} {"train_loss": -24.653072357177734, "global_step": 224167, "epoch": 2700} {"train_loss": -24.623533248901367, "global_step": 224168, "epoch": 2700} {"train_loss": -24.62948989868164, "global_step": 224169, "epoch": 2700} {"train_loss": -24.494068145751953, "global_step": 224170, "epoch": 2700} {"train_loss": -24.613454818725586, "global_step": 224171, "epoch": 2700} {"train_loss": -24.321807861328125, "global_step": 224172, "epoch": 2700} {"train_loss": -24.68449592590332, "global_step": 224173, "epoch": 2700} {"train_loss": -24.737707138061523, "global_step": 224174, "epoch": 2700} {"train_loss": -25.130186080932617, "global_step": 224175, "epoch": 2700} {"train_loss": -24.10265350341797, "global_step": 224176, "epoch": 2700} {"train_loss": -24.652860641479492, "global_step": 224177, "epoch": 2700} {"train_loss": -24.286108016967773, "global_step": 224178, "epoch": 2700} {"train_loss": -24.68729019165039, "global_step": 224179, "epoch": 2700} {"train_loss": -24.844772338867188, "global_step": 224180, "epoch": 2700} {"train_loss": -24.67778968811035, "global_step": 224181, "epoch": 2700} {"train_loss": -24.49247210858816, "global_step": 224182, "epoch": 2700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6823041.5} {"train_loss": -24.442285537719727, "global_step": 224183, "epoch": 2701} {"train_loss": -24.287460327148438, "global_step": 224184, "epoch": 2701} {"train_loss": -23.5649471282959, "global_step": 224185, "epoch": 2701} {"train_loss": -23.834951400756836, "global_step": 224186, "epoch": 2701} {"train_loss": -24.46274757385254, "global_step": 224187, "epoch": 2701} {"train_loss": -24.276107788085938, "global_step": 224188, "epoch": 2701} {"train_loss": -24.0433406829834, "global_step": 224189, "epoch": 2701} {"train_loss": -24.086219787597656, "global_step": 224190, "epoch": 2701} {"train_loss": -24.516468048095703, "global_step": 224191, "epoch": 2701} {"train_loss": -24.328662872314453, "global_step": 224192, "epoch": 2701} {"train_loss": -24.176618576049805, "global_step": 224193, "epoch": 2701} {"train_loss": -24.499755859375, "global_step": 224194, "epoch": 2701} {"train_loss": -24.200347900390625, "global_step": 224195, "epoch": 2701} {"train_loss": -24.3925724029541, "global_step": 224196, "epoch": 2701} {"train_loss": -24.617002487182617, "global_step": 224197, "epoch": 2701} {"train_loss": -24.40009880065918, "global_step": 224198, "epoch": 2701} {"train_loss": -24.472509384155273, "global_step": 224199, "epoch": 2701} {"train_loss": -24.3140811920166, "global_step": 224200, "epoch": 2701} {"train_loss": -24.526264190673828, "global_step": 224201, "epoch": 2701} {"train_loss": -24.816083908081055, "global_step": 224202, "epoch": 2701} {"train_loss": -24.914215087890625, "global_step": 224203, "epoch": 2701} {"train_loss": -24.987682342529297, "global_step": 224204, "epoch": 2701} {"train_loss": -24.639551162719727, "global_step": 224205, "epoch": 2701} {"train_loss": -24.29049301147461, "global_step": 224206, "epoch": 2701} {"train_loss": -24.840030670166016, "global_step": 224207, "epoch": 2701} {"train_loss": -24.968698501586914, "global_step": 224208, "epoch": 2701} {"train_loss": -24.708038330078125, "global_step": 224209, "epoch": 2701} {"train_loss": -24.546642303466797, "global_step": 224210, "epoch": 2701} {"train_loss": -24.6085262298584, "global_step": 224211, "epoch": 2701} {"train_loss": -24.848758697509766, "global_step": 224212, "epoch": 2701} {"train_loss": -24.628454208374023, "global_step": 224213, "epoch": 2701} {"train_loss": -24.517616271972656, "global_step": 224214, "epoch": 2701} {"train_loss": -24.920162200927734, "global_step": 224215, "epoch": 2701} {"train_loss": -24.787851333618164, "global_step": 224216, "epoch": 2701} {"train_loss": -24.883760452270508, "global_step": 224217, "epoch": 2701} {"train_loss": -24.9852237701416, "global_step": 224218, "epoch": 2701} {"train_loss": -25.01547622680664, "global_step": 224219, "epoch": 2701} {"train_loss": -24.866485595703125, "global_step": 224220, "epoch": 2701} {"train_loss": -24.841291427612305, "global_step": 224221, "epoch": 2701} {"train_loss": -25.1499080657959, "global_step": 224222, "epoch": 2701} {"train_loss": -24.78969383239746, "global_step": 224223, "epoch": 2701} {"train_loss": -24.550132751464844, "global_step": 224224, "epoch": 2701} {"train_loss": -24.923542022705078, "global_step": 224225, "epoch": 2701} {"train_loss": -24.852331161499023, "global_step": 224226, "epoch": 2701} {"train_loss": -24.68918800354004, "global_step": 224227, "epoch": 2701} {"train_loss": -24.601408004760742, "global_step": 224228, "epoch": 2701} {"train_loss": -24.979202270507812, "global_step": 224229, "epoch": 2701} {"train_loss": -24.833419799804688, "global_step": 224230, "epoch": 2701} {"train_loss": -24.383310317993164, "global_step": 224231, "epoch": 2701} {"train_loss": -24.745182037353516, "global_step": 224232, "epoch": 2701} {"train_loss": -24.289960861206055, "global_step": 224233, "epoch": 2701} {"train_loss": -24.796422958374023, "global_step": 224234, "epoch": 2701} {"train_loss": -24.279953002929688, "global_step": 224235, "epoch": 2701} {"train_loss": -24.687936782836914, "global_step": 224236, "epoch": 2701} {"train_loss": -24.403568267822266, "global_step": 224237, "epoch": 2701} {"train_loss": -24.6015567779541, "global_step": 224238, "epoch": 2701} {"train_loss": -24.052507400512695, "global_step": 224239, "epoch": 2701} {"train_loss": -24.62477684020996, "global_step": 224240, "epoch": 2701} {"train_loss": -24.57345962524414, "global_step": 224241, "epoch": 2701} {"train_loss": -24.548974990844727, "global_step": 224242, "epoch": 2701} {"train_loss": -24.452836990356445, "global_step": 224243, "epoch": 2701} {"train_loss": -24.117069244384766, "global_step": 224244, "epoch": 2701} {"train_loss": -24.374032974243164, "global_step": 224245, "epoch": 2701} {"train_loss": -24.614490509033203, "global_step": 224246, "epoch": 2701} {"train_loss": -24.261402130126953, "global_step": 224247, "epoch": 2701} {"train_loss": -24.521154403686523, "global_step": 224248, "epoch": 2701} {"train_loss": -24.829547882080078, "global_step": 224249, "epoch": 2701} {"train_loss": -24.83341407775879, "global_step": 224250, "epoch": 2701} {"train_loss": -24.557937622070312, "global_step": 224251, "epoch": 2701} {"train_loss": -24.486602783203125, "global_step": 224252, "epoch": 2701} {"train_loss": -24.512920379638672, "global_step": 224253, "epoch": 2701} {"train_loss": -25.06842041015625, "global_step": 224254, "epoch": 2701} {"train_loss": -24.69596290588379, "global_step": 224255, "epoch": 2701} {"train_loss": -24.560033798217773, "global_step": 224256, "epoch": 2701} {"train_loss": -24.856313705444336, "global_step": 224257, "epoch": 2701} {"train_loss": -24.740530014038086, "global_step": 224258, "epoch": 2701} {"train_loss": -24.55219078063965, "global_step": 224259, "epoch": 2701} {"train_loss": -24.76270294189453, "global_step": 224260, "epoch": 2701} {"train_loss": -24.207712173461914, "global_step": 224261, "epoch": 2701} {"train_loss": -24.966571807861328, "global_step": 224262, "epoch": 2701} {"train_loss": -24.515522003173828, "global_step": 224263, "epoch": 2701} {"train_loss": -24.430877685546875, "global_step": 224264, "epoch": 2701} {"train_loss": -24.564378945224256, "global_step": 224265, "epoch": 2701, "val_loss": 6582579.0} {"train_loss": -24.43207359313965, "global_step": 224266, "epoch": 2702} {"train_loss": -24.631534576416016, "global_step": 224267, "epoch": 2702} {"train_loss": -24.626924514770508, "global_step": 224268, "epoch": 2702} {"train_loss": -24.05049705505371, "global_step": 224269, "epoch": 2702} {"train_loss": -24.66069984436035, "global_step": 224270, "epoch": 2702} {"train_loss": -24.230802536010742, "global_step": 224271, "epoch": 2702} {"train_loss": -24.3599796295166, "global_step": 224272, "epoch": 2702} {"train_loss": -25.059778213500977, "global_step": 224273, "epoch": 2702} {"train_loss": -24.331872940063477, "global_step": 224274, "epoch": 2702} {"train_loss": -24.631919860839844, "global_step": 224275, "epoch": 2702} {"train_loss": -24.49798583984375, "global_step": 224276, "epoch": 2702} {"train_loss": -24.4616756439209, "global_step": 224277, "epoch": 2702} {"train_loss": -24.463300704956055, "global_step": 224278, "epoch": 2702} {"train_loss": -24.551599502563477, "global_step": 224279, "epoch": 2702} {"train_loss": -24.653982162475586, "global_step": 224280, "epoch": 2702} {"train_loss": -24.808019638061523, "global_step": 224281, "epoch": 2702} {"train_loss": -24.829164505004883, "global_step": 224282, "epoch": 2702} {"train_loss": -24.690528869628906, "global_step": 224283, "epoch": 2702} {"train_loss": -24.757787704467773, "global_step": 224284, "epoch": 2702} {"train_loss": -24.59713363647461, "global_step": 224285, "epoch": 2702} {"train_loss": -25.06989860534668, "global_step": 224286, "epoch": 2702} {"train_loss": -24.713943481445312, "global_step": 224287, "epoch": 2702} {"train_loss": -24.719053268432617, "global_step": 224288, "epoch": 2702} {"train_loss": -24.47262954711914, "global_step": 224289, "epoch": 2702} {"train_loss": -24.13298988342285, "global_step": 224290, "epoch": 2702} {"train_loss": -24.299116134643555, "global_step": 224291, "epoch": 2702} {"train_loss": -23.99079704284668, "global_step": 224292, "epoch": 2702} {"train_loss": -24.536813735961914, "global_step": 224293, "epoch": 2702} {"train_loss": -24.422273635864258, "global_step": 224294, "epoch": 2702} {"train_loss": -24.699304580688477, "global_step": 224295, "epoch": 2702} {"train_loss": -24.712080001831055, "global_step": 224296, "epoch": 2702} {"train_loss": -24.28672218322754, "global_step": 224297, "epoch": 2702} {"train_loss": -24.506303787231445, "global_step": 224298, "epoch": 2702} {"train_loss": -24.689807891845703, "global_step": 224299, "epoch": 2702} {"train_loss": -24.414783477783203, "global_step": 224300, "epoch": 2702} {"train_loss": -24.4811954498291, "global_step": 224301, "epoch": 2702} {"train_loss": -24.633756637573242, "global_step": 224302, "epoch": 2702} {"train_loss": -24.578876495361328, "global_step": 224303, "epoch": 2702} {"train_loss": -24.805395126342773, "global_step": 224304, "epoch": 2702} {"train_loss": -24.633651733398438, "global_step": 224305, "epoch": 2702} {"train_loss": -24.57895278930664, "global_step": 224306, "epoch": 2702} {"train_loss": -25.09288787841797, "global_step": 224307, "epoch": 2702} {"train_loss": -24.575496673583984, "global_step": 224308, "epoch": 2702} {"train_loss": -24.146406173706055, "global_step": 224309, "epoch": 2702} {"train_loss": -24.893268585205078, "global_step": 224310, "epoch": 2702} {"train_loss": -24.463754653930664, "global_step": 224311, "epoch": 2702} {"train_loss": -24.404699325561523, "global_step": 224312, "epoch": 2702} {"train_loss": -24.567626953125, "global_step": 224313, "epoch": 2702} {"train_loss": -25.100404739379883, "global_step": 224314, "epoch": 2702} {"train_loss": -24.568098068237305, "global_step": 224315, "epoch": 2702} {"train_loss": -24.88284683227539, "global_step": 224316, "epoch": 2702} {"train_loss": -24.9080867767334, "global_step": 224317, "epoch": 2702} {"train_loss": -24.704282760620117, "global_step": 224318, "epoch": 2702} {"train_loss": -25.324052810668945, "global_step": 224319, "epoch": 2702} {"train_loss": -24.440021514892578, "global_step": 224320, "epoch": 2702} {"train_loss": -24.644174575805664, "global_step": 224321, "epoch": 2702} {"train_loss": -24.776508331298828, "global_step": 224322, "epoch": 2702} {"train_loss": -24.459741592407227, "global_step": 224323, "epoch": 2702} {"train_loss": -24.752595901489258, "global_step": 224324, "epoch": 2702} {"train_loss": -24.615833282470703, "global_step": 224325, "epoch": 2702} {"train_loss": -24.76727867126465, "global_step": 224326, "epoch": 2702} {"train_loss": -24.94512367248535, "global_step": 224327, "epoch": 2702} {"train_loss": -24.710233688354492, "global_step": 224328, "epoch": 2702} {"train_loss": -24.908796310424805, "global_step": 224329, "epoch": 2702} {"train_loss": -24.864856719970703, "global_step": 224330, "epoch": 2702} {"train_loss": -24.642820358276367, "global_step": 224331, "epoch": 2702} {"train_loss": -24.554990768432617, "global_step": 224332, "epoch": 2702} {"train_loss": -25.04220962524414, "global_step": 224333, "epoch": 2702} {"train_loss": -24.664575576782227, "global_step": 224334, "epoch": 2702} {"train_loss": -24.46675682067871, "global_step": 224335, "epoch": 2702} {"train_loss": -24.792781829833984, "global_step": 224336, "epoch": 2702} {"train_loss": -24.925870895385742, "global_step": 224337, "epoch": 2702} {"train_loss": -24.55915641784668, "global_step": 224338, "epoch": 2702} {"train_loss": -24.472599029541016, "global_step": 224339, "epoch": 2702} {"train_loss": -24.4835262298584, "global_step": 224340, "epoch": 2702} {"train_loss": -24.30671501159668, "global_step": 224341, "epoch": 2702} {"train_loss": -24.133573532104492, "global_step": 224342, "epoch": 2702} {"train_loss": -24.07997703552246, "global_step": 224343, "epoch": 2702} {"train_loss": -24.101322174072266, "global_step": 224344, "epoch": 2702} {"train_loss": -24.577646255493164, "global_step": 224345, "epoch": 2702} {"train_loss": -24.68024253845215, "global_step": 224346, "epoch": 2702} {"train_loss": -24.775257110595703, "global_step": 224347, "epoch": 2702} {"train_loss": -24.589563599552015, "global_step": 224348, "epoch": 2702, "val_loss": 6651527.0} {"train_loss": -23.614534378051758, "global_step": 224349, "epoch": 2703} {"train_loss": -24.062314987182617, "global_step": 224350, "epoch": 2703} {"train_loss": -23.534870147705078, "global_step": 224351, "epoch": 2703} {"train_loss": -23.664152145385742, "global_step": 224352, "epoch": 2703} {"train_loss": -24.091938018798828, "global_step": 224353, "epoch": 2703} {"train_loss": -23.736391067504883, "global_step": 224354, "epoch": 2703} {"train_loss": -23.62054443359375, "global_step": 224355, "epoch": 2703} {"train_loss": -23.755075454711914, "global_step": 224356, "epoch": 2703} {"train_loss": -23.966148376464844, "global_step": 224357, "epoch": 2703} {"train_loss": -23.90294075012207, "global_step": 224358, "epoch": 2703} {"train_loss": -24.277799606323242, "global_step": 224359, "epoch": 2703} {"train_loss": -24.247112274169922, "global_step": 224360, "epoch": 2703} {"train_loss": -24.156370162963867, "global_step": 224361, "epoch": 2703} {"train_loss": -24.46455955505371, "global_step": 224362, "epoch": 2703} {"train_loss": -23.853361129760742, "global_step": 224363, "epoch": 2703} {"train_loss": -24.0101261138916, "global_step": 224364, "epoch": 2703} {"train_loss": -24.608173370361328, "global_step": 224365, "epoch": 2703} {"train_loss": -24.37973976135254, "global_step": 224366, "epoch": 2703} {"train_loss": -24.764719009399414, "global_step": 224367, "epoch": 2703} {"train_loss": -24.508529663085938, "global_step": 224368, "epoch": 2703} {"train_loss": -24.668352127075195, "global_step": 224369, "epoch": 2703} {"train_loss": -24.459325790405273, "global_step": 224370, "epoch": 2703} {"train_loss": -24.3203182220459, "global_step": 224371, "epoch": 2703} {"train_loss": -24.523345947265625, "global_step": 224372, "epoch": 2703} {"train_loss": -24.723798751831055, "global_step": 224373, "epoch": 2703} {"train_loss": -24.68967628479004, "global_step": 224374, "epoch": 2703} {"train_loss": -24.320566177368164, "global_step": 224375, "epoch": 2703} {"train_loss": -24.383268356323242, "global_step": 224376, "epoch": 2703} {"train_loss": -24.649707794189453, "global_step": 224377, "epoch": 2703} {"train_loss": -24.71457290649414, "global_step": 224378, "epoch": 2703} {"train_loss": -24.892122268676758, "global_step": 224379, "epoch": 2703} {"train_loss": -24.675302505493164, "global_step": 224380, "epoch": 2703} {"train_loss": -24.544696807861328, "global_step": 224381, "epoch": 2703} {"train_loss": -24.679346084594727, "global_step": 224382, "epoch": 2703} {"train_loss": -24.66988754272461, "global_step": 224383, "epoch": 2703} {"train_loss": -24.813703536987305, "global_step": 224384, "epoch": 2703} {"train_loss": -24.91518211364746, "global_step": 224385, "epoch": 2703} {"train_loss": -24.762975692749023, "global_step": 224386, "epoch": 2703} {"train_loss": -24.85028839111328, "global_step": 224387, "epoch": 2703} {"train_loss": -25.123977661132812, "global_step": 224388, "epoch": 2703} {"train_loss": -25.20318603515625, "global_step": 224389, "epoch": 2703} {"train_loss": -24.584775924682617, "global_step": 224390, "epoch": 2703} {"train_loss": -24.4881534576416, "global_step": 224391, "epoch": 2703} {"train_loss": -24.37587547302246, "global_step": 224392, "epoch": 2703} {"train_loss": -24.778310775756836, "global_step": 224393, "epoch": 2703} {"train_loss": -24.834516525268555, "global_step": 224394, "epoch": 2703} {"train_loss": -24.78592872619629, "global_step": 224395, "epoch": 2703} {"train_loss": -24.78337860107422, "global_step": 224396, "epoch": 2703} {"train_loss": -24.794809341430664, "global_step": 224397, "epoch": 2703} {"train_loss": -24.663572311401367, "global_step": 224398, "epoch": 2703} {"train_loss": -24.758371353149414, "global_step": 224399, "epoch": 2703} {"train_loss": -24.547306060791016, "global_step": 224400, "epoch": 2703} {"train_loss": -24.88901710510254, "global_step": 224401, "epoch": 2703} {"train_loss": -24.477888107299805, "global_step": 224402, "epoch": 2703} {"train_loss": -24.330142974853516, "global_step": 224403, "epoch": 2703} {"train_loss": -25.114591598510742, "global_step": 224404, "epoch": 2703} {"train_loss": -24.20151710510254, "global_step": 224405, "epoch": 2703} {"train_loss": -24.60361099243164, "global_step": 224406, "epoch": 2703} {"train_loss": -24.437437057495117, "global_step": 224407, "epoch": 2703} {"train_loss": -24.50434684753418, "global_step": 224408, "epoch": 2703} {"train_loss": -24.31862449645996, "global_step": 224409, "epoch": 2703} {"train_loss": -23.951467514038086, "global_step": 224410, "epoch": 2703} {"train_loss": -23.428298950195312, "global_step": 224411, "epoch": 2703} {"train_loss": -23.816404342651367, "global_step": 224412, "epoch": 2703} {"train_loss": -24.14049530029297, "global_step": 224413, "epoch": 2703} {"train_loss": -24.70480728149414, "global_step": 224414, "epoch": 2703} {"train_loss": -24.45594596862793, "global_step": 224415, "epoch": 2703} {"train_loss": -24.6529598236084, "global_step": 224416, "epoch": 2703} {"train_loss": -24.515399932861328, "global_step": 224417, "epoch": 2703} {"train_loss": -24.378164291381836, "global_step": 224418, "epoch": 2703} {"train_loss": -24.60365104675293, "global_step": 224419, "epoch": 2703} {"train_loss": -24.294553756713867, "global_step": 224420, "epoch": 2703} {"train_loss": -24.463825225830078, "global_step": 224421, "epoch": 2703} {"train_loss": -24.214153289794922, "global_step": 224422, "epoch": 2703} {"train_loss": -24.742584228515625, "global_step": 224423, "epoch": 2703} {"train_loss": -24.580045700073242, "global_step": 224424, "epoch": 2703} {"train_loss": -24.69385528564453, "global_step": 224425, "epoch": 2703} {"train_loss": -24.633024215698242, "global_step": 224426, "epoch": 2703} {"train_loss": -24.472524642944336, "global_step": 224427, "epoch": 2703} {"train_loss": -24.39113426208496, "global_step": 224428, "epoch": 2703} {"train_loss": -24.394529342651367, "global_step": 224429, "epoch": 2703} {"train_loss": -24.600006103515625, "global_step": 224430, "epoch": 2703} {"train_loss": -24.444874981799757, "global_step": 224431, "epoch": 2703, "val_loss": 6811215.0} {"train_loss": -24.009750366210938, "global_step": 224432, "epoch": 2704} {"train_loss": -24.021484375, "global_step": 224433, "epoch": 2704} {"train_loss": -24.095184326171875, "global_step": 224434, "epoch": 2704} {"train_loss": -24.087553024291992, "global_step": 224435, "epoch": 2704} {"train_loss": -24.109905242919922, "global_step": 224436, "epoch": 2704} {"train_loss": -24.274744033813477, "global_step": 224437, "epoch": 2704} {"train_loss": -24.08349609375, "global_step": 224438, "epoch": 2704} {"train_loss": -24.30775260925293, "global_step": 224439, "epoch": 2704} {"train_loss": -24.403146743774414, "global_step": 224440, "epoch": 2704} {"train_loss": -24.11557388305664, "global_step": 224441, "epoch": 2704} {"train_loss": -24.600875854492188, "global_step": 224442, "epoch": 2704} {"train_loss": -24.151763916015625, "global_step": 224443, "epoch": 2704} {"train_loss": -24.607139587402344, "global_step": 224444, "epoch": 2704} {"train_loss": -24.436668395996094, "global_step": 224445, "epoch": 2704} {"train_loss": -24.59805679321289, "global_step": 224446, "epoch": 2704} {"train_loss": -24.667491912841797, "global_step": 224447, "epoch": 2704} {"train_loss": -24.526559829711914, "global_step": 224448, "epoch": 2704} {"train_loss": -24.565900802612305, "global_step": 224449, "epoch": 2704} {"train_loss": -24.643280029296875, "global_step": 224450, "epoch": 2704} {"train_loss": -24.606374740600586, "global_step": 224451, "epoch": 2704} {"train_loss": -24.38899040222168, "global_step": 224452, "epoch": 2704} {"train_loss": -24.80453872680664, "global_step": 224453, "epoch": 2704} {"train_loss": -24.312978744506836, "global_step": 224454, "epoch": 2704} {"train_loss": -24.705106735229492, "global_step": 224455, "epoch": 2704} {"train_loss": -24.454940795898438, "global_step": 224456, "epoch": 2704} {"train_loss": -24.496662139892578, "global_step": 224457, "epoch": 2704} {"train_loss": -24.521451950073242, "global_step": 224458, "epoch": 2704} {"train_loss": -24.694196701049805, "global_step": 224459, "epoch": 2704} {"train_loss": -24.44489860534668, "global_step": 224460, "epoch": 2704} {"train_loss": -24.55360221862793, "global_step": 224461, "epoch": 2704} {"train_loss": -24.481550216674805, "global_step": 224462, "epoch": 2704} {"train_loss": -24.6417236328125, "global_step": 224463, "epoch": 2704} {"train_loss": -24.418230056762695, "global_step": 224464, "epoch": 2704} {"train_loss": -24.401365280151367, "global_step": 224465, "epoch": 2704} {"train_loss": -24.62879753112793, "global_step": 224466, "epoch": 2704} {"train_loss": -24.49714469909668, "global_step": 224467, "epoch": 2704} {"train_loss": -24.858125686645508, "global_step": 224468, "epoch": 2704} {"train_loss": -24.51710319519043, "global_step": 224469, "epoch": 2704} {"train_loss": -24.726747512817383, "global_step": 224470, "epoch": 2704} {"train_loss": -24.744293212890625, "global_step": 224471, "epoch": 2704} {"train_loss": -24.475290298461914, "global_step": 224472, "epoch": 2704} {"train_loss": -24.432849884033203, "global_step": 224473, "epoch": 2704} {"train_loss": -24.97788429260254, "global_step": 224474, "epoch": 2704} {"train_loss": -24.659130096435547, "global_step": 224475, "epoch": 2704} {"train_loss": -24.708398818969727, "global_step": 224476, "epoch": 2704} {"train_loss": -24.826627731323242, "global_step": 224477, "epoch": 2704} {"train_loss": -24.72382926940918, "global_step": 224478, "epoch": 2704} {"train_loss": -24.338308334350586, "global_step": 224479, "epoch": 2704} {"train_loss": -24.823230743408203, "global_step": 224480, "epoch": 2704} {"train_loss": -24.93037223815918, "global_step": 224481, "epoch": 2704} {"train_loss": -25.456724166870117, "global_step": 224482, "epoch": 2704} {"train_loss": -24.6733455657959, "global_step": 224483, "epoch": 2704} {"train_loss": -24.85245132446289, "global_step": 224484, "epoch": 2704} {"train_loss": -24.654783248901367, "global_step": 224485, "epoch": 2704} {"train_loss": -24.716968536376953, "global_step": 224486, "epoch": 2704} {"train_loss": -24.533706665039062, "global_step": 224487, "epoch": 2704} {"train_loss": -24.714454650878906, "global_step": 224488, "epoch": 2704} {"train_loss": -25.090534210205078, "global_step": 224489, "epoch": 2704} {"train_loss": -24.954843521118164, "global_step": 224490, "epoch": 2704} {"train_loss": -24.576581954956055, "global_step": 224491, "epoch": 2704} {"train_loss": -24.219274520874023, "global_step": 224492, "epoch": 2704} {"train_loss": -24.643985748291016, "global_step": 224493, "epoch": 2704} {"train_loss": -24.89763641357422, "global_step": 224494, "epoch": 2704} {"train_loss": -24.26568603515625, "global_step": 224495, "epoch": 2704} {"train_loss": -24.237529754638672, "global_step": 224496, "epoch": 2704} {"train_loss": -24.313026428222656, "global_step": 224497, "epoch": 2704} {"train_loss": -24.5756893157959, "global_step": 224498, "epoch": 2704} {"train_loss": -24.81771469116211, "global_step": 224499, "epoch": 2704} {"train_loss": -24.240188598632812, "global_step": 224500, "epoch": 2704} {"train_loss": -24.54296875, "global_step": 224501, "epoch": 2704} {"train_loss": -24.49074363708496, "global_step": 224502, "epoch": 2704} {"train_loss": -24.429349899291992, "global_step": 224503, "epoch": 2704} {"train_loss": -24.59344482421875, "global_step": 224504, "epoch": 2704} {"train_loss": -24.337852478027344, "global_step": 224505, "epoch": 2704} {"train_loss": -24.470834732055664, "global_step": 224506, "epoch": 2704} {"train_loss": -23.975080490112305, "global_step": 224507, "epoch": 2704} {"train_loss": -24.356321334838867, "global_step": 224508, "epoch": 2704} {"train_loss": -24.7830867767334, "global_step": 224509, "epoch": 2704} {"train_loss": -24.496593475341797, "global_step": 224510, "epoch": 2704} {"train_loss": -24.407577514648438, "global_step": 224511, "epoch": 2704} {"train_loss": -24.300437927246094, "global_step": 224512, "epoch": 2704} {"train_loss": -24.604541778564453, "global_step": 224513, "epoch": 2704} {"train_loss": -24.540374480098126, "global_step": 224514, "epoch": 2704, "val_loss": 6799391.0} {"train_loss": -23.823598861694336, "global_step": 224515, "epoch": 2705} {"train_loss": -24.197622299194336, "global_step": 224516, "epoch": 2705} {"train_loss": -23.921598434448242, "global_step": 224517, "epoch": 2705} {"train_loss": -23.829992294311523, "global_step": 224518, "epoch": 2705} {"train_loss": -24.342370986938477, "global_step": 224519, "epoch": 2705} {"train_loss": -23.651952743530273, "global_step": 224520, "epoch": 2705} {"train_loss": -24.418384552001953, "global_step": 224521, "epoch": 2705} {"train_loss": -24.072967529296875, "global_step": 224522, "epoch": 2705} {"train_loss": -24.42289161682129, "global_step": 224523, "epoch": 2705} {"train_loss": -23.97925567626953, "global_step": 224524, "epoch": 2705} {"train_loss": -24.165983200073242, "global_step": 224525, "epoch": 2705} {"train_loss": -23.530115127563477, "global_step": 224526, "epoch": 2705} {"train_loss": -24.105607986450195, "global_step": 224527, "epoch": 2705} {"train_loss": -24.47565269470215, "global_step": 224528, "epoch": 2705} {"train_loss": -24.446195602416992, "global_step": 224529, "epoch": 2705} {"train_loss": -24.288606643676758, "global_step": 224530, "epoch": 2705} {"train_loss": -24.61884117126465, "global_step": 224531, "epoch": 2705} {"train_loss": -24.511566162109375, "global_step": 224532, "epoch": 2705} {"train_loss": -24.1583194732666, "global_step": 224533, "epoch": 2705} {"train_loss": -24.47199821472168, "global_step": 224534, "epoch": 2705} {"train_loss": -25.038944244384766, "global_step": 224535, "epoch": 2705} {"train_loss": -24.43722915649414, "global_step": 224536, "epoch": 2705} {"train_loss": -24.634557723999023, "global_step": 224537, "epoch": 2705} {"train_loss": -24.96329689025879, "global_step": 224538, "epoch": 2705} {"train_loss": -24.839475631713867, "global_step": 224539, "epoch": 2705} {"train_loss": -24.73191261291504, "global_step": 224540, "epoch": 2705} {"train_loss": -24.398313522338867, "global_step": 224541, "epoch": 2705} {"train_loss": -24.711288452148438, "global_step": 224542, "epoch": 2705} {"train_loss": -24.432077407836914, "global_step": 224543, "epoch": 2705} {"train_loss": -24.399280548095703, "global_step": 224544, "epoch": 2705} {"train_loss": -24.68691062927246, "global_step": 224545, "epoch": 2705} {"train_loss": -24.450729370117188, "global_step": 224546, "epoch": 2705} {"train_loss": -24.542400360107422, "global_step": 224547, "epoch": 2705} {"train_loss": -24.825048446655273, "global_step": 224548, "epoch": 2705} {"train_loss": -24.66965103149414, "global_step": 224549, "epoch": 2705} {"train_loss": -24.32160758972168, "global_step": 224550, "epoch": 2705} {"train_loss": -24.460269927978516, "global_step": 224551, "epoch": 2705} {"train_loss": -24.791105270385742, "global_step": 224552, "epoch": 2705} {"train_loss": -24.799379348754883, "global_step": 224553, "epoch": 2705} {"train_loss": -24.719247817993164, "global_step": 224554, "epoch": 2705} {"train_loss": -24.491350173950195, "global_step": 224555, "epoch": 2705} {"train_loss": -24.684730529785156, "global_step": 224556, "epoch": 2705} {"train_loss": -24.72066879272461, "global_step": 224557, "epoch": 2705} {"train_loss": -24.415023803710938, "global_step": 224558, "epoch": 2705} {"train_loss": -24.88348388671875, "global_step": 224559, "epoch": 2705} {"train_loss": -24.52547264099121, "global_step": 224560, "epoch": 2705} {"train_loss": -24.93269920349121, "global_step": 224561, "epoch": 2705} {"train_loss": -25.26911735534668, "global_step": 224562, "epoch": 2705} {"train_loss": -24.87002944946289, "global_step": 224563, "epoch": 2705} {"train_loss": -24.994169235229492, "global_step": 224564, "epoch": 2705} {"train_loss": -24.73972511291504, "global_step": 224565, "epoch": 2705} {"train_loss": -24.855409622192383, "global_step": 224566, "epoch": 2705} {"train_loss": -24.693256378173828, "global_step": 224567, "epoch": 2705} {"train_loss": -25.028135299682617, "global_step": 224568, "epoch": 2705} {"train_loss": -24.782459259033203, "global_step": 224569, "epoch": 2705} {"train_loss": -24.890573501586914, "global_step": 224570, "epoch": 2705} {"train_loss": -24.7110538482666, "global_step": 224571, "epoch": 2705} {"train_loss": -24.4796199798584, "global_step": 224572, "epoch": 2705} {"train_loss": -24.790136337280273, "global_step": 224573, "epoch": 2705} {"train_loss": -24.90431022644043, "global_step": 224574, "epoch": 2705} {"train_loss": -24.592483520507812, "global_step": 224575, "epoch": 2705} {"train_loss": -24.50251007080078, "global_step": 224576, "epoch": 2705} {"train_loss": -24.097280502319336, "global_step": 224577, "epoch": 2705} {"train_loss": -22.89670181274414, "global_step": 224578, "epoch": 2705} {"train_loss": -23.475914001464844, "global_step": 224579, "epoch": 2705} {"train_loss": -24.34373664855957, "global_step": 224580, "epoch": 2705} {"train_loss": -24.156757354736328, "global_step": 224581, "epoch": 2705} {"train_loss": -24.033613204956055, "global_step": 224582, "epoch": 2705} {"train_loss": -24.607961654663086, "global_step": 224583, "epoch": 2705} {"train_loss": -23.946367263793945, "global_step": 224584, "epoch": 2705} {"train_loss": -24.297306060791016, "global_step": 224585, "epoch": 2705} {"train_loss": -23.861711502075195, "global_step": 224586, "epoch": 2705} {"train_loss": -24.265443801879883, "global_step": 224587, "epoch": 2705} {"train_loss": -24.575223922729492, "global_step": 224588, "epoch": 2705} {"train_loss": -24.2271785736084, "global_step": 224589, "epoch": 2705} {"train_loss": -24.671968460083008, "global_step": 224590, "epoch": 2705} {"train_loss": -24.527761459350586, "global_step": 224591, "epoch": 2705} {"train_loss": -24.788150787353516, "global_step": 224592, "epoch": 2705} {"train_loss": -24.4047908782959, "global_step": 224593, "epoch": 2705} {"train_loss": -24.368820190429688, "global_step": 224594, "epoch": 2705} {"train_loss": -24.71436882019043, "global_step": 224595, "epoch": 2705} {"train_loss": -24.47876739501953, "global_step": 224596, "epoch": 2705} {"train_loss": -24.439071862094373, "global_step": 224597, "epoch": 2705, "val_loss": 6616922.0} {"train_loss": -23.956235885620117, "global_step": 224598, "epoch": 2706} {"train_loss": -23.87598419189453, "global_step": 224599, "epoch": 2706} {"train_loss": -23.979454040527344, "global_step": 224600, "epoch": 2706} {"train_loss": -24.061100006103516, "global_step": 224601, "epoch": 2706} {"train_loss": -24.200658798217773, "global_step": 224602, "epoch": 2706} {"train_loss": -24.5356388092041, "global_step": 224603, "epoch": 2706} {"train_loss": -24.068622589111328, "global_step": 224604, "epoch": 2706} {"train_loss": -23.981168746948242, "global_step": 224605, "epoch": 2706} {"train_loss": -24.269699096679688, "global_step": 224606, "epoch": 2706} {"train_loss": -24.115741729736328, "global_step": 224607, "epoch": 2706} {"train_loss": -24.235015869140625, "global_step": 224608, "epoch": 2706} {"train_loss": -24.611902236938477, "global_step": 224609, "epoch": 2706} {"train_loss": -24.415863037109375, "global_step": 224610, "epoch": 2706} {"train_loss": -24.385948181152344, "global_step": 224611, "epoch": 2706} {"train_loss": -24.514602661132812, "global_step": 224612, "epoch": 2706} {"train_loss": -24.975610733032227, "global_step": 224613, "epoch": 2706} {"train_loss": -24.533477783203125, "global_step": 224614, "epoch": 2706} {"train_loss": -24.689489364624023, "global_step": 224615, "epoch": 2706} {"train_loss": -24.578027725219727, "global_step": 224616, "epoch": 2706} {"train_loss": -24.50293731689453, "global_step": 224617, "epoch": 2706} {"train_loss": -24.558637619018555, "global_step": 224618, "epoch": 2706} {"train_loss": -24.562700271606445, "global_step": 224619, "epoch": 2706} {"train_loss": -24.454038619995117, "global_step": 224620, "epoch": 2706} {"train_loss": -24.585458755493164, "global_step": 224621, "epoch": 2706} {"train_loss": -24.581323623657227, "global_step": 224622, "epoch": 2706} {"train_loss": -24.53390884399414, "global_step": 224623, "epoch": 2706} {"train_loss": -24.845556259155273, "global_step": 224624, "epoch": 2706} {"train_loss": -24.619916915893555, "global_step": 224625, "epoch": 2706} {"train_loss": -24.64960289001465, "global_step": 224626, "epoch": 2706} {"train_loss": -24.7359676361084, "global_step": 224627, "epoch": 2706} {"train_loss": -24.51776695251465, "global_step": 224628, "epoch": 2706} {"train_loss": -24.614545822143555, "global_step": 224629, "epoch": 2706} {"train_loss": -24.685678482055664, "global_step": 224630, "epoch": 2706} {"train_loss": -24.483108520507812, "global_step": 224631, "epoch": 2706} {"train_loss": -24.849164962768555, "global_step": 224632, "epoch": 2706} {"train_loss": -24.575672149658203, "global_step": 224633, "epoch": 2706} {"train_loss": -25.01340103149414, "global_step": 224634, "epoch": 2706} {"train_loss": -24.519014358520508, "global_step": 224635, "epoch": 2706} {"train_loss": -24.883140563964844, "global_step": 224636, "epoch": 2706} {"train_loss": -24.61617088317871, "global_step": 224637, "epoch": 2706} {"train_loss": -24.900415420532227, "global_step": 224638, "epoch": 2706} {"train_loss": -24.46335792541504, "global_step": 224639, "epoch": 2706} {"train_loss": -24.58111000061035, "global_step": 224640, "epoch": 2706} {"train_loss": -24.852863311767578, "global_step": 224641, "epoch": 2706} {"train_loss": -24.845088958740234, "global_step": 224642, "epoch": 2706} {"train_loss": -24.607696533203125, "global_step": 224643, "epoch": 2706} {"train_loss": -24.21756362915039, "global_step": 224644, "epoch": 2706} {"train_loss": -24.172107696533203, "global_step": 224645, "epoch": 2706} {"train_loss": -24.076642990112305, "global_step": 224646, "epoch": 2706} {"train_loss": -24.71630096435547, "global_step": 224647, "epoch": 2706} {"train_loss": -24.758024215698242, "global_step": 224648, "epoch": 2706} {"train_loss": -24.179174423217773, "global_step": 224649, "epoch": 2706} {"train_loss": -24.695730209350586, "global_step": 224650, "epoch": 2706} {"train_loss": -24.27777099609375, "global_step": 224651, "epoch": 2706} {"train_loss": -24.4084529876709, "global_step": 224652, "epoch": 2706} {"train_loss": -24.72138023376465, "global_step": 224653, "epoch": 2706} {"train_loss": -24.23467254638672, "global_step": 224654, "epoch": 2706} {"train_loss": -24.59238624572754, "global_step": 224655, "epoch": 2706} {"train_loss": -23.86970329284668, "global_step": 224656, "epoch": 2706} {"train_loss": -24.52240562438965, "global_step": 224657, "epoch": 2706} {"train_loss": -24.285442352294922, "global_step": 224658, "epoch": 2706} {"train_loss": -24.72715950012207, "global_step": 224659, "epoch": 2706} {"train_loss": -24.49762535095215, "global_step": 224660, "epoch": 2706} {"train_loss": -24.352231979370117, "global_step": 224661, "epoch": 2706} {"train_loss": -24.958066940307617, "global_step": 224662, "epoch": 2706} {"train_loss": -24.444644927978516, "global_step": 224663, "epoch": 2706} {"train_loss": -24.33124351501465, "global_step": 224664, "epoch": 2706} {"train_loss": -24.41554069519043, "global_step": 224665, "epoch": 2706} {"train_loss": -24.64712905883789, "global_step": 224666, "epoch": 2706} {"train_loss": -24.719541549682617, "global_step": 224667, "epoch": 2706} {"train_loss": -24.62654685974121, "global_step": 224668, "epoch": 2706} {"train_loss": -24.55904197692871, "global_step": 224669, "epoch": 2706} {"train_loss": -24.673852920532227, "global_step": 224670, "epoch": 2706} {"train_loss": -25.00848960876465, "global_step": 224671, "epoch": 2706} {"train_loss": -24.429534912109375, "global_step": 224672, "epoch": 2706} {"train_loss": -24.93067169189453, "global_step": 224673, "epoch": 2706} {"train_loss": -24.921588897705078, "global_step": 224674, "epoch": 2706} {"train_loss": -24.893102645874023, "global_step": 224675, "epoch": 2706} {"train_loss": -24.182889938354492, "global_step": 224676, "epoch": 2706} {"train_loss": -24.644804000854492, "global_step": 224677, "epoch": 2706} {"train_loss": -24.892240524291992, "global_step": 224678, "epoch": 2706} {"train_loss": -25.115827560424805, "global_step": 224679, "epoch": 2706} {"train_loss": -24.535919878856244, "global_step": 224680, "epoch": 2706, "val_loss": 6681042.0} {"train_loss": -24.04953384399414, "global_step": 224681, "epoch": 2707} {"train_loss": -24.27410316467285, "global_step": 224682, "epoch": 2707} {"train_loss": -24.494474411010742, "global_step": 224683, "epoch": 2707} {"train_loss": -24.25154685974121, "global_step": 224684, "epoch": 2707} {"train_loss": -24.619428634643555, "global_step": 224685, "epoch": 2707} {"train_loss": -24.4177188873291, "global_step": 224686, "epoch": 2707} {"train_loss": -24.27845001220703, "global_step": 224687, "epoch": 2707} {"train_loss": -24.46052360534668, "global_step": 224688, "epoch": 2707} {"train_loss": -24.427154541015625, "global_step": 224689, "epoch": 2707} {"train_loss": -24.43058967590332, "global_step": 224690, "epoch": 2707} {"train_loss": -24.158567428588867, "global_step": 224691, "epoch": 2707} {"train_loss": -24.81490135192871, "global_step": 224692, "epoch": 2707} {"train_loss": -24.529094696044922, "global_step": 224693, "epoch": 2707} {"train_loss": -24.528547286987305, "global_step": 224694, "epoch": 2707} {"train_loss": -24.718978881835938, "global_step": 224695, "epoch": 2707} {"train_loss": -24.549352645874023, "global_step": 224696, "epoch": 2707} {"train_loss": -24.548818588256836, "global_step": 224697, "epoch": 2707} {"train_loss": -24.93177604675293, "global_step": 224698, "epoch": 2707} {"train_loss": -24.603994369506836, "global_step": 224699, "epoch": 2707} {"train_loss": -24.45828628540039, "global_step": 224700, "epoch": 2707} {"train_loss": -24.830406188964844, "global_step": 224701, "epoch": 2707} {"train_loss": -24.298877716064453, "global_step": 224702, "epoch": 2707} {"train_loss": -24.4912109375, "global_step": 224703, "epoch": 2707} {"train_loss": -24.64227294921875, "global_step": 224704, "epoch": 2707} {"train_loss": -24.717647552490234, "global_step": 224705, "epoch": 2707} {"train_loss": -24.593551635742188, "global_step": 224706, "epoch": 2707} {"train_loss": -24.892080307006836, "global_step": 224707, "epoch": 2707} {"train_loss": -25.083267211914062, "global_step": 224708, "epoch": 2707} {"train_loss": -24.313566207885742, "global_step": 224709, "epoch": 2707} {"train_loss": -24.726200103759766, "global_step": 224710, "epoch": 2707} {"train_loss": -24.728281021118164, "global_step": 224711, "epoch": 2707} {"train_loss": -24.62495231628418, "global_step": 224712, "epoch": 2707} {"train_loss": -24.82343864440918, "global_step": 224713, "epoch": 2707} {"train_loss": -24.86276626586914, "global_step": 224714, "epoch": 2707} {"train_loss": -24.77907371520996, "global_step": 224715, "epoch": 2707} {"train_loss": -24.926040649414062, "global_step": 224716, "epoch": 2707} {"train_loss": -24.65790367126465, "global_step": 224717, "epoch": 2707} {"train_loss": -24.720016479492188, "global_step": 224718, "epoch": 2707} {"train_loss": -24.646326065063477, "global_step": 224719, "epoch": 2707} {"train_loss": -24.523221969604492, "global_step": 224720, "epoch": 2707} {"train_loss": -24.685684204101562, "global_step": 224721, "epoch": 2707} {"train_loss": -24.95294761657715, "global_step": 224722, "epoch": 2707} {"train_loss": -24.662460327148438, "global_step": 224723, "epoch": 2707} {"train_loss": -24.55632972717285, "global_step": 224724, "epoch": 2707} {"train_loss": -24.70884895324707, "global_step": 224725, "epoch": 2707} {"train_loss": -24.923845291137695, "global_step": 224726, "epoch": 2707} {"train_loss": -24.384035110473633, "global_step": 224727, "epoch": 2707} {"train_loss": -24.951831817626953, "global_step": 224728, "epoch": 2707} {"train_loss": -24.377775192260742, "global_step": 224729, "epoch": 2707} {"train_loss": -24.724584579467773, "global_step": 224730, "epoch": 2707} {"train_loss": -24.567720413208008, "global_step": 224731, "epoch": 2707} {"train_loss": -24.760683059692383, "global_step": 224732, "epoch": 2707} {"train_loss": -24.810352325439453, "global_step": 224733, "epoch": 2707} {"train_loss": -25.135120391845703, "global_step": 224734, "epoch": 2707} {"train_loss": -24.968555450439453, "global_step": 224735, "epoch": 2707} {"train_loss": -24.64996910095215, "global_step": 224736, "epoch": 2707} {"train_loss": -24.87299919128418, "global_step": 224737, "epoch": 2707} {"train_loss": -24.722183227539062, "global_step": 224738, "epoch": 2707} {"train_loss": -24.926233291625977, "global_step": 224739, "epoch": 2707} {"train_loss": -24.802221298217773, "global_step": 224740, "epoch": 2707} {"train_loss": -24.804105758666992, "global_step": 224741, "epoch": 2707} {"train_loss": -24.66049575805664, "global_step": 224742, "epoch": 2707} {"train_loss": -24.746442794799805, "global_step": 224743, "epoch": 2707} {"train_loss": -24.644161224365234, "global_step": 224744, "epoch": 2707} {"train_loss": -24.993377685546875, "global_step": 224745, "epoch": 2707} {"train_loss": -25.083444595336914, "global_step": 224746, "epoch": 2707} {"train_loss": -24.783601760864258, "global_step": 224747, "epoch": 2707} {"train_loss": -24.9831600189209, "global_step": 224748, "epoch": 2707} {"train_loss": -24.842554092407227, "global_step": 224749, "epoch": 2707} {"train_loss": -24.774946212768555, "global_step": 224750, "epoch": 2707} {"train_loss": -24.47650146484375, "global_step": 224751, "epoch": 2707} {"train_loss": -24.383634567260742, "global_step": 224752, "epoch": 2707} {"train_loss": -24.774267196655273, "global_step": 224753, "epoch": 2707} {"train_loss": -24.801694869995117, "global_step": 224754, "epoch": 2707} {"train_loss": -24.498323440551758, "global_step": 224755, "epoch": 2707} {"train_loss": -24.655120849609375, "global_step": 224756, "epoch": 2707} {"train_loss": -24.33416175842285, "global_step": 224757, "epoch": 2707} {"train_loss": -24.656757354736328, "global_step": 224758, "epoch": 2707} {"train_loss": -24.59902000427246, "global_step": 224759, "epoch": 2707} {"train_loss": -24.602798461914062, "global_step": 224760, "epoch": 2707} {"train_loss": -24.449430465698242, "global_step": 224761, "epoch": 2707} {"train_loss": -24.520483016967773, "global_step": 224762, "epoch": 2707} {"train_loss": -24.65568103560482, "global_step": 224763, "epoch": 2707, "val_loss": 6641747.0} {"train_loss": -24.24558448791504, "global_step": 224764, "epoch": 2708} {"train_loss": -24.341764450073242, "global_step": 224765, "epoch": 2708} {"train_loss": -24.335447311401367, "global_step": 224766, "epoch": 2708} {"train_loss": -24.264312744140625, "global_step": 224767, "epoch": 2708} {"train_loss": -24.066570281982422, "global_step": 224768, "epoch": 2708} {"train_loss": -24.207124710083008, "global_step": 224769, "epoch": 2708} {"train_loss": -23.9941463470459, "global_step": 224770, "epoch": 2708} {"train_loss": -24.404714584350586, "global_step": 224771, "epoch": 2708} {"train_loss": -24.34581756591797, "global_step": 224772, "epoch": 2708} {"train_loss": -24.46687126159668, "global_step": 224773, "epoch": 2708} {"train_loss": -24.73976707458496, "global_step": 224774, "epoch": 2708} {"train_loss": -24.424131393432617, "global_step": 224775, "epoch": 2708} {"train_loss": -24.39450454711914, "global_step": 224776, "epoch": 2708} {"train_loss": -24.50806999206543, "global_step": 224777, "epoch": 2708} {"train_loss": -24.532926559448242, "global_step": 224778, "epoch": 2708} {"train_loss": -24.619997024536133, "global_step": 224779, "epoch": 2708} {"train_loss": -24.959209442138672, "global_step": 224780, "epoch": 2708} {"train_loss": -24.68205451965332, "global_step": 224781, "epoch": 2708} {"train_loss": -24.50613784790039, "global_step": 224782, "epoch": 2708} {"train_loss": -24.33335304260254, "global_step": 224783, "epoch": 2708} {"train_loss": -24.60626220703125, "global_step": 224784, "epoch": 2708} {"train_loss": -24.62299919128418, "global_step": 224785, "epoch": 2708} {"train_loss": -24.570419311523438, "global_step": 224786, "epoch": 2708} {"train_loss": -24.644384384155273, "global_step": 224787, "epoch": 2708} {"train_loss": -24.561830520629883, "global_step": 224788, "epoch": 2708} {"train_loss": -24.76532554626465, "global_step": 224789, "epoch": 2708} {"train_loss": -24.62863540649414, "global_step": 224790, "epoch": 2708} {"train_loss": -24.43979263305664, "global_step": 224791, "epoch": 2708} {"train_loss": -24.891103744506836, "global_step": 224792, "epoch": 2708} {"train_loss": -24.558923721313477, "global_step": 224793, "epoch": 2708} {"train_loss": -24.736196517944336, "global_step": 224794, "epoch": 2708} {"train_loss": -24.657377243041992, "global_step": 224795, "epoch": 2708} {"train_loss": -24.13202476501465, "global_step": 224796, "epoch": 2708} {"train_loss": -24.729963302612305, "global_step": 224797, "epoch": 2708} {"train_loss": -24.495101928710938, "global_step": 224798, "epoch": 2708} {"train_loss": -24.94409942626953, "global_step": 224799, "epoch": 2708} {"train_loss": -24.85858726501465, "global_step": 224800, "epoch": 2708} {"train_loss": -24.768903732299805, "global_step": 224801, "epoch": 2708} {"train_loss": -24.812894821166992, "global_step": 224802, "epoch": 2708} {"train_loss": -24.991361618041992, "global_step": 224803, "epoch": 2708} {"train_loss": -25.034696578979492, "global_step": 224804, "epoch": 2708} {"train_loss": -24.50494384765625, "global_step": 224805, "epoch": 2708} {"train_loss": -24.954818725585938, "global_step": 224806, "epoch": 2708} {"train_loss": -24.695392608642578, "global_step": 224807, "epoch": 2708} {"train_loss": -24.53792381286621, "global_step": 224808, "epoch": 2708} {"train_loss": -24.813413619995117, "global_step": 224809, "epoch": 2708} {"train_loss": -24.770334243774414, "global_step": 224810, "epoch": 2708} {"train_loss": -24.591297149658203, "global_step": 224811, "epoch": 2708} {"train_loss": -24.781217575073242, "global_step": 224812, "epoch": 2708} {"train_loss": -24.825607299804688, "global_step": 224813, "epoch": 2708} {"train_loss": -24.84227752685547, "global_step": 224814, "epoch": 2708} {"train_loss": -24.818878173828125, "global_step": 224815, "epoch": 2708} {"train_loss": -24.66476821899414, "global_step": 224816, "epoch": 2708} {"train_loss": -24.806346893310547, "global_step": 224817, "epoch": 2708} {"train_loss": -24.44010353088379, "global_step": 224818, "epoch": 2708} {"train_loss": -24.630615234375, "global_step": 224819, "epoch": 2708} {"train_loss": -24.386886596679688, "global_step": 224820, "epoch": 2708} {"train_loss": -24.858312606811523, "global_step": 224821, "epoch": 2708} {"train_loss": -24.944700241088867, "global_step": 224822, "epoch": 2708} {"train_loss": -24.667110443115234, "global_step": 224823, "epoch": 2708} {"train_loss": -24.648832321166992, "global_step": 224824, "epoch": 2708} {"train_loss": -24.452030181884766, "global_step": 224825, "epoch": 2708} {"train_loss": -24.77782440185547, "global_step": 224826, "epoch": 2708} {"train_loss": -24.6927547454834, "global_step": 224827, "epoch": 2708} {"train_loss": -24.752912521362305, "global_step": 224828, "epoch": 2708} {"train_loss": -24.576215744018555, "global_step": 224829, "epoch": 2708} {"train_loss": -24.374731063842773, "global_step": 224830, "epoch": 2708} {"train_loss": -24.716581344604492, "global_step": 224831, "epoch": 2708} {"train_loss": -24.584827423095703, "global_step": 224832, "epoch": 2708} {"train_loss": -24.235105514526367, "global_step": 224833, "epoch": 2708} {"train_loss": -24.458881378173828, "global_step": 224834, "epoch": 2708} {"train_loss": -24.761022567749023, "global_step": 224835, "epoch": 2708} {"train_loss": -24.640979766845703, "global_step": 224836, "epoch": 2708} {"train_loss": -24.54793357849121, "global_step": 224837, "epoch": 2708} {"train_loss": -24.452329635620117, "global_step": 224838, "epoch": 2708} {"train_loss": -24.48238182067871, "global_step": 224839, "epoch": 2708} {"train_loss": -24.952505111694336, "global_step": 224840, "epoch": 2708} {"train_loss": -24.80366325378418, "global_step": 224841, "epoch": 2708} {"train_loss": -24.590774536132812, "global_step": 224842, "epoch": 2708} {"train_loss": -24.83586311340332, "global_step": 224843, "epoch": 2708} {"train_loss": -24.735944747924805, "global_step": 224844, "epoch": 2708} {"train_loss": -24.495901107788086, "global_step": 224845, "epoch": 2708} {"train_loss": -24.61950134369264, "global_step": 224846, "epoch": 2708, "val_loss": 6687732.0} {"train_loss": -24.53322410583496, "global_step": 224847, "epoch": 2709} {"train_loss": -24.576387405395508, "global_step": 224848, "epoch": 2709} {"train_loss": -24.478343963623047, "global_step": 224849, "epoch": 2709} {"train_loss": -24.355350494384766, "global_step": 224850, "epoch": 2709} {"train_loss": -24.15127944946289, "global_step": 224851, "epoch": 2709} {"train_loss": -24.3724308013916, "global_step": 224852, "epoch": 2709} {"train_loss": -24.35410499572754, "global_step": 224853, "epoch": 2709} {"train_loss": -24.116989135742188, "global_step": 224854, "epoch": 2709} {"train_loss": -24.16249656677246, "global_step": 224855, "epoch": 2709} {"train_loss": -23.933746337890625, "global_step": 224856, "epoch": 2709} {"train_loss": -24.77326774597168, "global_step": 224857, "epoch": 2709} {"train_loss": -24.507474899291992, "global_step": 224858, "epoch": 2709} {"train_loss": -24.66020393371582, "global_step": 224859, "epoch": 2709} {"train_loss": -24.749290466308594, "global_step": 224860, "epoch": 2709} {"train_loss": -24.133249282836914, "global_step": 224861, "epoch": 2709} {"train_loss": -24.845901489257812, "global_step": 224862, "epoch": 2709} {"train_loss": -24.45249366760254, "global_step": 224863, "epoch": 2709} {"train_loss": -24.69667625427246, "global_step": 224864, "epoch": 2709} {"train_loss": -24.391996383666992, "global_step": 224865, "epoch": 2709} {"train_loss": -24.376928329467773, "global_step": 224866, "epoch": 2709} {"train_loss": -24.632905960083008, "global_step": 224867, "epoch": 2709} {"train_loss": -24.54050064086914, "global_step": 224868, "epoch": 2709} {"train_loss": -24.761316299438477, "global_step": 224869, "epoch": 2709} {"train_loss": -24.525907516479492, "global_step": 224870, "epoch": 2709} {"train_loss": -24.476411819458008, "global_step": 224871, "epoch": 2709} {"train_loss": -24.583568572998047, "global_step": 224872, "epoch": 2709} {"train_loss": -24.904787063598633, "global_step": 224873, "epoch": 2709} {"train_loss": -24.14618492126465, "global_step": 224874, "epoch": 2709} {"train_loss": -24.828296661376953, "global_step": 224875, "epoch": 2709} {"train_loss": -24.634260177612305, "global_step": 224876, "epoch": 2709} {"train_loss": -24.60015296936035, "global_step": 224877, "epoch": 2709} {"train_loss": -24.49294662475586, "global_step": 224878, "epoch": 2709} {"train_loss": -25.236295700073242, "global_step": 224879, "epoch": 2709} {"train_loss": -24.953405380249023, "global_step": 224880, "epoch": 2709} {"train_loss": -24.839263916015625, "global_step": 224881, "epoch": 2709} {"train_loss": -24.504194259643555, "global_step": 224882, "epoch": 2709} {"train_loss": -24.19038963317871, "global_step": 224883, "epoch": 2709} {"train_loss": -24.781457901000977, "global_step": 224884, "epoch": 2709} {"train_loss": -24.23415756225586, "global_step": 224885, "epoch": 2709} {"train_loss": -24.174514770507812, "global_step": 224886, "epoch": 2709} {"train_loss": -24.821462631225586, "global_step": 224887, "epoch": 2709} {"train_loss": -24.671369552612305, "global_step": 224888, "epoch": 2709} {"train_loss": -23.99614906311035, "global_step": 224889, "epoch": 2709} {"train_loss": -24.328693389892578, "global_step": 224890, "epoch": 2709} {"train_loss": -24.263160705566406, "global_step": 224891, "epoch": 2709} {"train_loss": -24.533246994018555, "global_step": 224892, "epoch": 2709} {"train_loss": -24.495603561401367, "global_step": 224893, "epoch": 2709} {"train_loss": -24.68936538696289, "global_step": 224894, "epoch": 2709} {"train_loss": -24.587661743164062, "global_step": 224895, "epoch": 2709} {"train_loss": -24.11033058166504, "global_step": 224896, "epoch": 2709} {"train_loss": -24.812625885009766, "global_step": 224897, "epoch": 2709} {"train_loss": -24.475183486938477, "global_step": 224898, "epoch": 2709} {"train_loss": -24.615869522094727, "global_step": 224899, "epoch": 2709} {"train_loss": -24.50565528869629, "global_step": 224900, "epoch": 2709} {"train_loss": -24.429853439331055, "global_step": 224901, "epoch": 2709} {"train_loss": -24.557470321655273, "global_step": 224902, "epoch": 2709} {"train_loss": -24.265541076660156, "global_step": 224903, "epoch": 2709} {"train_loss": -24.48445701599121, "global_step": 224904, "epoch": 2709} {"train_loss": -24.625080108642578, "global_step": 224905, "epoch": 2709} {"train_loss": -24.542003631591797, "global_step": 224906, "epoch": 2709} {"train_loss": -24.5830135345459, "global_step": 224907, "epoch": 2709} {"train_loss": -24.59846305847168, "global_step": 224908, "epoch": 2709} {"train_loss": -24.516870498657227, "global_step": 224909, "epoch": 2709} {"train_loss": -24.519878387451172, "global_step": 224910, "epoch": 2709} {"train_loss": -24.595230102539062, "global_step": 224911, "epoch": 2709} {"train_loss": -24.536968231201172, "global_step": 224912, "epoch": 2709} {"train_loss": -24.71627426147461, "global_step": 224913, "epoch": 2709} {"train_loss": -24.7641658782959, "global_step": 224914, "epoch": 2709} {"train_loss": -24.8437557220459, "global_step": 224915, "epoch": 2709} {"train_loss": -24.951663970947266, "global_step": 224916, "epoch": 2709} {"train_loss": -24.539274215698242, "global_step": 224917, "epoch": 2709} {"train_loss": -24.983383178710938, "global_step": 224918, "epoch": 2709} {"train_loss": -24.865745544433594, "global_step": 224919, "epoch": 2709} {"train_loss": -24.286239624023438, "global_step": 224920, "epoch": 2709} {"train_loss": -24.53340721130371, "global_step": 224921, "epoch": 2709} {"train_loss": -24.769319534301758, "global_step": 224922, "epoch": 2709} {"train_loss": -24.734037399291992, "global_step": 224923, "epoch": 2709} {"train_loss": -24.89277458190918, "global_step": 224924, "epoch": 2709} {"train_loss": -24.480451583862305, "global_step": 224925, "epoch": 2709} {"train_loss": -24.69074821472168, "global_step": 224926, "epoch": 2709} {"train_loss": -24.761737823486328, "global_step": 224927, "epoch": 2709} {"train_loss": -24.410980224609375, "global_step": 224928, "epoch": 2709} {"train_loss": -24.572207646197583, "global_step": 224929, "epoch": 2709, "val_loss": 6752798.0} {"train_loss": -23.874662399291992, "global_step": 224930, "epoch": 2710} {"train_loss": -23.63016128540039, "global_step": 224931, "epoch": 2710} {"train_loss": -23.97260093688965, "global_step": 224932, "epoch": 2710} {"train_loss": -24.174030303955078, "global_step": 224933, "epoch": 2710} {"train_loss": -23.99037742614746, "global_step": 224934, "epoch": 2710} {"train_loss": -24.01556396484375, "global_step": 224935, "epoch": 2710} {"train_loss": -24.41275978088379, "global_step": 224936, "epoch": 2710} {"train_loss": -23.989944458007812, "global_step": 224937, "epoch": 2710} {"train_loss": -24.286283493041992, "global_step": 224938, "epoch": 2710} {"train_loss": -24.341995239257812, "global_step": 224939, "epoch": 2710} {"train_loss": -24.360244750976562, "global_step": 224940, "epoch": 2710} {"train_loss": -24.607961654663086, "global_step": 224941, "epoch": 2710} {"train_loss": -24.353952407836914, "global_step": 224942, "epoch": 2710} {"train_loss": -24.411962509155273, "global_step": 224943, "epoch": 2710} {"train_loss": -24.52825927734375, "global_step": 224944, "epoch": 2710} {"train_loss": -24.205360412597656, "global_step": 224945, "epoch": 2710} {"train_loss": -24.637332916259766, "global_step": 224946, "epoch": 2710} {"train_loss": -24.64896011352539, "global_step": 224947, "epoch": 2710} {"train_loss": -24.297758102416992, "global_step": 224948, "epoch": 2710} {"train_loss": -24.417871475219727, "global_step": 224949, "epoch": 2710} {"train_loss": -24.367826461791992, "global_step": 224950, "epoch": 2710} {"train_loss": -24.46364402770996, "global_step": 224951, "epoch": 2710} {"train_loss": -24.830480575561523, "global_step": 224952, "epoch": 2710} {"train_loss": -24.40720558166504, "global_step": 224953, "epoch": 2710} {"train_loss": -24.554771423339844, "global_step": 224954, "epoch": 2710} {"train_loss": -24.710941314697266, "global_step": 224955, "epoch": 2710} {"train_loss": -24.8210506439209, "global_step": 224956, "epoch": 2710} {"train_loss": -24.943151473999023, "global_step": 224957, "epoch": 2710} {"train_loss": -24.77225685119629, "global_step": 224958, "epoch": 2710} {"train_loss": -24.81829071044922, "global_step": 224959, "epoch": 2710} {"train_loss": -24.349414825439453, "global_step": 224960, "epoch": 2710} {"train_loss": -24.433950424194336, "global_step": 224961, "epoch": 2710} {"train_loss": -24.55750846862793, "global_step": 224962, "epoch": 2710} {"train_loss": -24.581256866455078, "global_step": 224963, "epoch": 2710} {"train_loss": -24.88871192932129, "global_step": 224964, "epoch": 2710} {"train_loss": -24.534988403320312, "global_step": 224965, "epoch": 2710} {"train_loss": -24.802207946777344, "global_step": 224966, "epoch": 2710} {"train_loss": -24.597766876220703, "global_step": 224967, "epoch": 2710} {"train_loss": -24.517728805541992, "global_step": 224968, "epoch": 2710} {"train_loss": -24.50489616394043, "global_step": 224969, "epoch": 2710} {"train_loss": -24.515111923217773, "global_step": 224970, "epoch": 2710} {"train_loss": -24.61375617980957, "global_step": 224971, "epoch": 2710} {"train_loss": -24.51327896118164, "global_step": 224972, "epoch": 2710} {"train_loss": -24.6453914642334, "global_step": 224973, "epoch": 2710} {"train_loss": -24.606592178344727, "global_step": 224974, "epoch": 2710} {"train_loss": -24.443363189697266, "global_step": 224975, "epoch": 2710} {"train_loss": -24.691007614135742, "global_step": 224976, "epoch": 2710} {"train_loss": -25.065561294555664, "global_step": 224977, "epoch": 2710} {"train_loss": -24.68971824645996, "global_step": 224978, "epoch": 2710} {"train_loss": -24.670501708984375, "global_step": 224979, "epoch": 2710} {"train_loss": -24.535432815551758, "global_step": 224980, "epoch": 2710} {"train_loss": -24.73444175720215, "global_step": 224981, "epoch": 2710} {"train_loss": -24.78826141357422, "global_step": 224982, "epoch": 2710} {"train_loss": -24.597869873046875, "global_step": 224983, "epoch": 2710} {"train_loss": -24.61701774597168, "global_step": 224984, "epoch": 2710} {"train_loss": -24.775094985961914, "global_step": 224985, "epoch": 2710} {"train_loss": -24.79735565185547, "global_step": 224986, "epoch": 2710} {"train_loss": -24.48963165283203, "global_step": 224987, "epoch": 2710} {"train_loss": -24.649036407470703, "global_step": 224988, "epoch": 2710} {"train_loss": -24.844024658203125, "global_step": 224989, "epoch": 2710} {"train_loss": -24.673355102539062, "global_step": 224990, "epoch": 2710} {"train_loss": -24.901348114013672, "global_step": 224991, "epoch": 2710} {"train_loss": -24.627714157104492, "global_step": 224992, "epoch": 2710} {"train_loss": -24.850095748901367, "global_step": 224993, "epoch": 2710} {"train_loss": -24.60902214050293, "global_step": 224994, "epoch": 2710} {"train_loss": -24.1326961517334, "global_step": 224995, "epoch": 2710} {"train_loss": -24.546329498291016, "global_step": 224996, "epoch": 2710} {"train_loss": -24.925771713256836, "global_step": 224997, "epoch": 2710} {"train_loss": -24.52803611755371, "global_step": 224998, "epoch": 2710} {"train_loss": -24.925153732299805, "global_step": 224999, "epoch": 2710} {"train_loss": -24.55789566040039, "global_step": 225000, "epoch": 2710} {"train_loss": -24.79045295715332, "global_step": 225001, "epoch": 2710} {"train_loss": -24.384546279907227, "global_step": 225002, "epoch": 2710} {"train_loss": -24.474681854248047, "global_step": 225003, "epoch": 2710} {"train_loss": -24.41329002380371, "global_step": 225004, "epoch": 2710} {"train_loss": -24.5732421875, "global_step": 225005, "epoch": 2710} {"train_loss": -24.440092086791992, "global_step": 225006, "epoch": 2710} {"train_loss": -24.676908493041992, "global_step": 225007, "epoch": 2710} {"train_loss": -24.61875343322754, "global_step": 225008, "epoch": 2710} {"train_loss": -24.725360870361328, "global_step": 225009, "epoch": 2710} {"train_loss": -24.778013229370117, "global_step": 225010, "epoch": 2710} {"train_loss": -24.291234970092773, "global_step": 225011, "epoch": 2710} {"train_loss": -24.555566511958478, "global_step": 225012, "epoch": 2710, "val_loss": 6609272.0} {"train_loss": -24.191375732421875, "global_step": 225013, "epoch": 2711} {"train_loss": -24.323486328125, "global_step": 225014, "epoch": 2711} {"train_loss": -24.42652702331543, "global_step": 225015, "epoch": 2711} {"train_loss": -24.036277770996094, "global_step": 225016, "epoch": 2711} {"train_loss": -24.502683639526367, "global_step": 225017, "epoch": 2711} {"train_loss": -24.206153869628906, "global_step": 225018, "epoch": 2711} {"train_loss": -24.543405532836914, "global_step": 225019, "epoch": 2711} {"train_loss": -24.748031616210938, "global_step": 225020, "epoch": 2711} {"train_loss": -24.367542266845703, "global_step": 225021, "epoch": 2711} {"train_loss": -24.758970260620117, "global_step": 225022, "epoch": 2711} {"train_loss": -24.577260971069336, "global_step": 225023, "epoch": 2711} {"train_loss": -24.654773712158203, "global_step": 225024, "epoch": 2711} {"train_loss": -24.459238052368164, "global_step": 225025, "epoch": 2711} {"train_loss": -24.76727867126465, "global_step": 225026, "epoch": 2711} {"train_loss": -24.763320922851562, "global_step": 225027, "epoch": 2711} {"train_loss": -24.452953338623047, "global_step": 225028, "epoch": 2711} {"train_loss": -24.361154556274414, "global_step": 225029, "epoch": 2711} {"train_loss": -24.61134147644043, "global_step": 225030, "epoch": 2711} {"train_loss": -24.226316452026367, "global_step": 225031, "epoch": 2711} {"train_loss": -24.181922912597656, "global_step": 225032, "epoch": 2711} {"train_loss": -24.404203414916992, "global_step": 225033, "epoch": 2711} {"train_loss": -24.610443115234375, "global_step": 225034, "epoch": 2711} {"train_loss": -24.444381713867188, "global_step": 225035, "epoch": 2711} {"train_loss": -24.314138412475586, "global_step": 225036, "epoch": 2711} {"train_loss": -24.559755325317383, "global_step": 225037, "epoch": 2711} {"train_loss": -24.629531860351562, "global_step": 225038, "epoch": 2711} {"train_loss": -24.477054595947266, "global_step": 225039, "epoch": 2711} {"train_loss": -24.576589584350586, "global_step": 225040, "epoch": 2711} {"train_loss": -24.52686309814453, "global_step": 225041, "epoch": 2711} {"train_loss": -24.4897403717041, "global_step": 225042, "epoch": 2711} {"train_loss": -24.955781936645508, "global_step": 225043, "epoch": 2711} {"train_loss": -24.983190536499023, "global_step": 225044, "epoch": 2711} {"train_loss": -24.76486587524414, "global_step": 225045, "epoch": 2711} {"train_loss": -24.4776554107666, "global_step": 225046, "epoch": 2711} {"train_loss": -24.657474517822266, "global_step": 225047, "epoch": 2711} {"train_loss": -24.84816551208496, "global_step": 225048, "epoch": 2711} {"train_loss": -24.60822868347168, "global_step": 225049, "epoch": 2711} {"train_loss": -25.0194091796875, "global_step": 225050, "epoch": 2711} {"train_loss": -24.822586059570312, "global_step": 225051, "epoch": 2711} {"train_loss": -24.74933433532715, "global_step": 225052, "epoch": 2711} {"train_loss": -24.73355484008789, "global_step": 225053, "epoch": 2711} {"train_loss": -24.318134307861328, "global_step": 225054, "epoch": 2711} {"train_loss": -24.79060173034668, "global_step": 225055, "epoch": 2711} {"train_loss": -24.862995147705078, "global_step": 225056, "epoch": 2711} {"train_loss": -24.98530387878418, "global_step": 225057, "epoch": 2711} {"train_loss": -24.856969833374023, "global_step": 225058, "epoch": 2711} {"train_loss": -24.830564498901367, "global_step": 225059, "epoch": 2711} {"train_loss": -24.56355094909668, "global_step": 225060, "epoch": 2711} {"train_loss": -24.84364891052246, "global_step": 225061, "epoch": 2711} {"train_loss": -24.831180572509766, "global_step": 225062, "epoch": 2711} {"train_loss": -24.729957580566406, "global_step": 225063, "epoch": 2711} {"train_loss": -24.80963706970215, "global_step": 225064, "epoch": 2711} {"train_loss": -24.64803123474121, "global_step": 225065, "epoch": 2711} {"train_loss": -24.717615127563477, "global_step": 225066, "epoch": 2711} {"train_loss": -24.53966522216797, "global_step": 225067, "epoch": 2711} {"train_loss": -25.05111312866211, "global_step": 225068, "epoch": 2711} {"train_loss": -24.441848754882812, "global_step": 225069, "epoch": 2711} {"train_loss": -24.682310104370117, "global_step": 225070, "epoch": 2711} {"train_loss": -24.64996910095215, "global_step": 225071, "epoch": 2711} {"train_loss": -24.487457275390625, "global_step": 225072, "epoch": 2711} {"train_loss": -24.837203979492188, "global_step": 225073, "epoch": 2711} {"train_loss": -24.622093200683594, "global_step": 225074, "epoch": 2711} {"train_loss": -24.505521774291992, "global_step": 225075, "epoch": 2711} {"train_loss": -24.84893226623535, "global_step": 225076, "epoch": 2711} {"train_loss": -24.951522827148438, "global_step": 225077, "epoch": 2711} {"train_loss": -24.86858558654785, "global_step": 225078, "epoch": 2711} {"train_loss": -24.298786163330078, "global_step": 225079, "epoch": 2711} {"train_loss": -24.344892501831055, "global_step": 225080, "epoch": 2711} {"train_loss": -24.29787254333496, "global_step": 225081, "epoch": 2711} {"train_loss": -24.50063133239746, "global_step": 225082, "epoch": 2711} {"train_loss": -24.778701782226562, "global_step": 225083, "epoch": 2711} {"train_loss": -24.464757919311523, "global_step": 225084, "epoch": 2711} {"train_loss": -24.133634567260742, "global_step": 225085, "epoch": 2711} {"train_loss": -24.641796112060547, "global_step": 225086, "epoch": 2711} {"train_loss": -24.74312400817871, "global_step": 225087, "epoch": 2711} {"train_loss": -24.40161895751953, "global_step": 225088, "epoch": 2711} {"train_loss": -24.371816635131836, "global_step": 225089, "epoch": 2711} {"train_loss": -24.575735092163086, "global_step": 225090, "epoch": 2711} {"train_loss": -24.58306121826172, "global_step": 225091, "epoch": 2711} {"train_loss": -24.31157875061035, "global_step": 225092, "epoch": 2711} {"train_loss": -24.354040145874023, "global_step": 225093, "epoch": 2711} {"train_loss": -24.660053253173828, "global_step": 225094, "epoch": 2711} {"train_loss": -24.587942789836102, "global_step": 225095, "epoch": 2711, "val_loss": 6783226.5} {"train_loss": -23.782852172851562, "global_step": 225096, "epoch": 2712} {"train_loss": -24.091045379638672, "global_step": 225097, "epoch": 2712} {"train_loss": -24.085773468017578, "global_step": 225098, "epoch": 2712} {"train_loss": -24.174671173095703, "global_step": 225099, "epoch": 2712} {"train_loss": -24.16884994506836, "global_step": 225100, "epoch": 2712} {"train_loss": -24.262102127075195, "global_step": 225101, "epoch": 2712} {"train_loss": -24.321699142456055, "global_step": 225102, "epoch": 2712} {"train_loss": -23.913755416870117, "global_step": 225103, "epoch": 2712} {"train_loss": -24.18279457092285, "global_step": 225104, "epoch": 2712} {"train_loss": -24.36684226989746, "global_step": 225105, "epoch": 2712} {"train_loss": -24.8261661529541, "global_step": 225106, "epoch": 2712} {"train_loss": -24.607908248901367, "global_step": 225107, "epoch": 2712} {"train_loss": -24.30512809753418, "global_step": 225108, "epoch": 2712} {"train_loss": -24.370771408081055, "global_step": 225109, "epoch": 2712} {"train_loss": -24.397626876831055, "global_step": 225110, "epoch": 2712} {"train_loss": -24.512067794799805, "global_step": 225111, "epoch": 2712} {"train_loss": -24.63496208190918, "global_step": 225112, "epoch": 2712} {"train_loss": -24.512258529663086, "global_step": 225113, "epoch": 2712} {"train_loss": -24.542203903198242, "global_step": 225114, "epoch": 2712} {"train_loss": -24.117456436157227, "global_step": 225115, "epoch": 2712} {"train_loss": -24.7768497467041, "global_step": 225116, "epoch": 2712} {"train_loss": -24.72977638244629, "global_step": 225117, "epoch": 2712} {"train_loss": -24.89668083190918, "global_step": 225118, "epoch": 2712} {"train_loss": -24.20645523071289, "global_step": 225119, "epoch": 2712} {"train_loss": -24.618698120117188, "global_step": 225120, "epoch": 2712} {"train_loss": -24.792299270629883, "global_step": 225121, "epoch": 2712} {"train_loss": -24.950002670288086, "global_step": 225122, "epoch": 2712} {"train_loss": -24.58599090576172, "global_step": 225123, "epoch": 2712} {"train_loss": -24.653432846069336, "global_step": 225124, "epoch": 2712} {"train_loss": -24.95753288269043, "global_step": 225125, "epoch": 2712} {"train_loss": -24.7205753326416, "global_step": 225126, "epoch": 2712} {"train_loss": -25.0417537689209, "global_step": 225127, "epoch": 2712} {"train_loss": -25.024484634399414, "global_step": 225128, "epoch": 2712} {"train_loss": -24.974767684936523, "global_step": 225129, "epoch": 2712} {"train_loss": -24.55031394958496, "global_step": 225130, "epoch": 2712} {"train_loss": -24.328327178955078, "global_step": 225131, "epoch": 2712} {"train_loss": -24.74152183532715, "global_step": 225132, "epoch": 2712} {"train_loss": -24.860116958618164, "global_step": 225133, "epoch": 2712} {"train_loss": -24.821659088134766, "global_step": 225134, "epoch": 2712} {"train_loss": -24.661720275878906, "global_step": 225135, "epoch": 2712} {"train_loss": -24.48719024658203, "global_step": 225136, "epoch": 2712} {"train_loss": -24.649038314819336, "global_step": 225137, "epoch": 2712} {"train_loss": -24.68303871154785, "global_step": 225138, "epoch": 2712} {"train_loss": -24.692581176757812, "global_step": 225139, "epoch": 2712} {"train_loss": -24.731672286987305, "global_step": 225140, "epoch": 2712} {"train_loss": -24.698379516601562, "global_step": 225141, "epoch": 2712} {"train_loss": -25.015668869018555, "global_step": 225142, "epoch": 2712} {"train_loss": -24.88750648498535, "global_step": 225143, "epoch": 2712} {"train_loss": -24.628263473510742, "global_step": 225144, "epoch": 2712} {"train_loss": -24.69172477722168, "global_step": 225145, "epoch": 2712} {"train_loss": -24.73216438293457, "global_step": 225146, "epoch": 2712} {"train_loss": -24.82439422607422, "global_step": 225147, "epoch": 2712} {"train_loss": -24.756803512573242, "global_step": 225148, "epoch": 2712} {"train_loss": -24.66431999206543, "global_step": 225149, "epoch": 2712} {"train_loss": -25.111759185791016, "global_step": 225150, "epoch": 2712} {"train_loss": -24.71559715270996, "global_step": 225151, "epoch": 2712} {"train_loss": -24.770112991333008, "global_step": 225152, "epoch": 2712} {"train_loss": -24.661880493164062, "global_step": 225153, "epoch": 2712} {"train_loss": -24.83684730529785, "global_step": 225154, "epoch": 2712} {"train_loss": -24.75044822692871, "global_step": 225155, "epoch": 2712} {"train_loss": -24.72869873046875, "global_step": 225156, "epoch": 2712} {"train_loss": -24.672565460205078, "global_step": 225157, "epoch": 2712} {"train_loss": -24.794315338134766, "global_step": 225158, "epoch": 2712} {"train_loss": -24.714815139770508, "global_step": 225159, "epoch": 2712} {"train_loss": -24.469100952148438, "global_step": 225160, "epoch": 2712} {"train_loss": -24.24460792541504, "global_step": 225161, "epoch": 2712} {"train_loss": -24.160823822021484, "global_step": 225162, "epoch": 2712} {"train_loss": -24.1754207611084, "global_step": 225163, "epoch": 2712} {"train_loss": -24.36297607421875, "global_step": 225164, "epoch": 2712} {"train_loss": -24.297134399414062, "global_step": 225165, "epoch": 2712} {"train_loss": -24.259685516357422, "global_step": 225166, "epoch": 2712} {"train_loss": -24.019821166992188, "global_step": 225167, "epoch": 2712} {"train_loss": -24.46425437927246, "global_step": 225168, "epoch": 2712} {"train_loss": -24.186328887939453, "global_step": 225169, "epoch": 2712} {"train_loss": -24.37843132019043, "global_step": 225170, "epoch": 2712} {"train_loss": -24.5180606842041, "global_step": 225171, "epoch": 2712} {"train_loss": -24.293506622314453, "global_step": 225172, "epoch": 2712} {"train_loss": -23.425188064575195, "global_step": 225173, "epoch": 2712} {"train_loss": -24.168424606323242, "global_step": 225174, "epoch": 2712} {"train_loss": -24.195363998413086, "global_step": 225175, "epoch": 2712} {"train_loss": -24.423847198486328, "global_step": 225176, "epoch": 2712} {"train_loss": -24.38833999633789, "global_step": 225177, "epoch": 2712} {"train_loss": -24.528206583965254, "global_step": 225178, "epoch": 2712, "val_loss": 6802982.0} {"train_loss": -24.004484176635742, "global_step": 225179, "epoch": 2713} {"train_loss": -24.043041229248047, "global_step": 225180, "epoch": 2713} {"train_loss": -24.009782791137695, "global_step": 225181, "epoch": 2713} {"train_loss": -24.19240951538086, "global_step": 225182, "epoch": 2713} {"train_loss": -23.961057662963867, "global_step": 225183, "epoch": 2713} {"train_loss": -24.670188903808594, "global_step": 225184, "epoch": 2713} {"train_loss": -24.469501495361328, "global_step": 225185, "epoch": 2713} {"train_loss": -23.93914222717285, "global_step": 225186, "epoch": 2713} {"train_loss": -24.17961883544922, "global_step": 225187, "epoch": 2713} {"train_loss": -24.462158203125, "global_step": 225188, "epoch": 2713} {"train_loss": -24.395572662353516, "global_step": 225189, "epoch": 2713} {"train_loss": -24.237165451049805, "global_step": 225190, "epoch": 2713} {"train_loss": -24.537809371948242, "global_step": 225191, "epoch": 2713} {"train_loss": -24.199905395507812, "global_step": 225192, "epoch": 2713} {"train_loss": -24.390989303588867, "global_step": 225193, "epoch": 2713} {"train_loss": -24.44547462463379, "global_step": 225194, "epoch": 2713} {"train_loss": -24.470232009887695, "global_step": 225195, "epoch": 2713} {"train_loss": -24.417367935180664, "global_step": 225196, "epoch": 2713} {"train_loss": -24.761911392211914, "global_step": 225197, "epoch": 2713} {"train_loss": -24.743011474609375, "global_step": 225198, "epoch": 2713} {"train_loss": -24.787044525146484, "global_step": 225199, "epoch": 2713} {"train_loss": -24.682729721069336, "global_step": 225200, "epoch": 2713} {"train_loss": -24.54555320739746, "global_step": 225201, "epoch": 2713} {"train_loss": -24.295217514038086, "global_step": 225202, "epoch": 2713} {"train_loss": -24.895841598510742, "global_step": 225203, "epoch": 2713} {"train_loss": -24.49712562561035, "global_step": 225204, "epoch": 2713} {"train_loss": -24.478275299072266, "global_step": 225205, "epoch": 2713} {"train_loss": -24.688146591186523, "global_step": 225206, "epoch": 2713} {"train_loss": -24.942914962768555, "global_step": 225207, "epoch": 2713} {"train_loss": -24.741641998291016, "global_step": 225208, "epoch": 2713} {"train_loss": -24.791706085205078, "global_step": 225209, "epoch": 2713} {"train_loss": -24.64401626586914, "global_step": 225210, "epoch": 2713} {"train_loss": -24.537519454956055, "global_step": 225211, "epoch": 2713} {"train_loss": -24.726118087768555, "global_step": 225212, "epoch": 2713} {"train_loss": -24.738046646118164, "global_step": 225213, "epoch": 2713} {"train_loss": -24.559717178344727, "global_step": 225214, "epoch": 2713} {"train_loss": -24.825254440307617, "global_step": 225215, "epoch": 2713} {"train_loss": -24.844928741455078, "global_step": 225216, "epoch": 2713} {"train_loss": -24.534366607666016, "global_step": 225217, "epoch": 2713} {"train_loss": -24.60731315612793, "global_step": 225218, "epoch": 2713} {"train_loss": -24.744808197021484, "global_step": 225219, "epoch": 2713} {"train_loss": -24.981409072875977, "global_step": 225220, "epoch": 2713} {"train_loss": -24.769515991210938, "global_step": 225221, "epoch": 2713} {"train_loss": -24.781553268432617, "global_step": 225222, "epoch": 2713} {"train_loss": -24.695194244384766, "global_step": 225223, "epoch": 2713} {"train_loss": -24.452335357666016, "global_step": 225224, "epoch": 2713} {"train_loss": -24.580705642700195, "global_step": 225225, "epoch": 2713} {"train_loss": -24.4152774810791, "global_step": 225226, "epoch": 2713} {"train_loss": -24.568662643432617, "global_step": 225227, "epoch": 2713} {"train_loss": -24.3918514251709, "global_step": 225228, "epoch": 2713} {"train_loss": -24.965604782104492, "global_step": 225229, "epoch": 2713} {"train_loss": -24.43601417541504, "global_step": 225230, "epoch": 2713} {"train_loss": -24.383323669433594, "global_step": 225231, "epoch": 2713} {"train_loss": -24.10822868347168, "global_step": 225232, "epoch": 2713} {"train_loss": -24.06800079345703, "global_step": 225233, "epoch": 2713} {"train_loss": -24.595352172851562, "global_step": 225234, "epoch": 2713} {"train_loss": -24.192676544189453, "global_step": 225235, "epoch": 2713} {"train_loss": -24.243343353271484, "global_step": 225236, "epoch": 2713} {"train_loss": -25.181339263916016, "global_step": 225237, "epoch": 2713} {"train_loss": -24.599523544311523, "global_step": 225238, "epoch": 2713} {"train_loss": -24.632614135742188, "global_step": 225239, "epoch": 2713} {"train_loss": -24.286548614501953, "global_step": 225240, "epoch": 2713} {"train_loss": -24.4935302734375, "global_step": 225241, "epoch": 2713} {"train_loss": -24.596847534179688, "global_step": 225242, "epoch": 2713} {"train_loss": -24.425256729125977, "global_step": 225243, "epoch": 2713} {"train_loss": -24.462589263916016, "global_step": 225244, "epoch": 2713} {"train_loss": -24.600845336914062, "global_step": 225245, "epoch": 2713} {"train_loss": -24.615625381469727, "global_step": 225246, "epoch": 2713} {"train_loss": -24.686140060424805, "global_step": 225247, "epoch": 2713} {"train_loss": -24.647878646850586, "global_step": 225248, "epoch": 2713} {"train_loss": -24.842470169067383, "global_step": 225249, "epoch": 2713} {"train_loss": -24.88870620727539, "global_step": 225250, "epoch": 2713} {"train_loss": -24.52130126953125, "global_step": 225251, "epoch": 2713} {"train_loss": -24.602338790893555, "global_step": 225252, "epoch": 2713} {"train_loss": -24.33717155456543, "global_step": 225253, "epoch": 2713} {"train_loss": -24.708097457885742, "global_step": 225254, "epoch": 2713} {"train_loss": -24.18585968017578, "global_step": 225255, "epoch": 2713} {"train_loss": -24.414304733276367, "global_step": 225256, "epoch": 2713} {"train_loss": -24.226194381713867, "global_step": 225257, "epoch": 2713} {"train_loss": -24.729963302612305, "global_step": 225258, "epoch": 2713} {"train_loss": -24.840351104736328, "global_step": 225259, "epoch": 2713} {"train_loss": -24.461454391479492, "global_step": 225260, "epoch": 2713} {"train_loss": -24.53121601242617, "global_step": 225261, "epoch": 2713, "val_loss": 6698059.0} {"train_loss": -24.043420791625977, "global_step": 225262, "epoch": 2714} {"train_loss": -23.893095016479492, "global_step": 225263, "epoch": 2714} {"train_loss": -24.05364418029785, "global_step": 225264, "epoch": 2714} {"train_loss": -23.985166549682617, "global_step": 225265, "epoch": 2714} {"train_loss": -24.2945613861084, "global_step": 225266, "epoch": 2714} {"train_loss": -24.2486515045166, "global_step": 225267, "epoch": 2714} {"train_loss": -24.410337448120117, "global_step": 225268, "epoch": 2714} {"train_loss": -24.34943962097168, "global_step": 225269, "epoch": 2714} {"train_loss": -24.213857650756836, "global_step": 225270, "epoch": 2714} {"train_loss": -24.27342987060547, "global_step": 225271, "epoch": 2714} {"train_loss": -24.115554809570312, "global_step": 225272, "epoch": 2714} {"train_loss": -24.305072784423828, "global_step": 225273, "epoch": 2714} {"train_loss": -24.965225219726562, "global_step": 225274, "epoch": 2714} {"train_loss": -24.392690658569336, "global_step": 225275, "epoch": 2714} {"train_loss": -24.38095474243164, "global_step": 225276, "epoch": 2714} {"train_loss": -24.271289825439453, "global_step": 225277, "epoch": 2714} {"train_loss": -24.54346466064453, "global_step": 225278, "epoch": 2714} {"train_loss": -24.250219345092773, "global_step": 225279, "epoch": 2714} {"train_loss": -24.71280288696289, "global_step": 225280, "epoch": 2714} {"train_loss": -24.685659408569336, "global_step": 225281, "epoch": 2714} {"train_loss": -24.754207611083984, "global_step": 225282, "epoch": 2714} {"train_loss": -24.453271865844727, "global_step": 225283, "epoch": 2714} {"train_loss": -24.637313842773438, "global_step": 225284, "epoch": 2714} {"train_loss": -24.218292236328125, "global_step": 225285, "epoch": 2714} {"train_loss": -24.526262283325195, "global_step": 225286, "epoch": 2714} {"train_loss": -24.6817684173584, "global_step": 225287, "epoch": 2714} {"train_loss": -24.400667190551758, "global_step": 225288, "epoch": 2714} {"train_loss": -24.800046920776367, "global_step": 225289, "epoch": 2714} {"train_loss": -24.759838104248047, "global_step": 225290, "epoch": 2714} {"train_loss": -24.585826873779297, "global_step": 225291, "epoch": 2714} {"train_loss": -24.53994369506836, "global_step": 225292, "epoch": 2714} {"train_loss": -24.465185165405273, "global_step": 225293, "epoch": 2714} {"train_loss": -24.637847900390625, "global_step": 225294, "epoch": 2714} {"train_loss": -24.090219497680664, "global_step": 225295, "epoch": 2714} {"train_loss": -25.0262508392334, "global_step": 225296, "epoch": 2714} {"train_loss": -24.74207305908203, "global_step": 225297, "epoch": 2714} {"train_loss": -24.63046646118164, "global_step": 225298, "epoch": 2714} {"train_loss": -25.112449645996094, "global_step": 225299, "epoch": 2714} {"train_loss": -24.509220123291016, "global_step": 225300, "epoch": 2714} {"train_loss": -24.853572845458984, "global_step": 225301, "epoch": 2714} {"train_loss": -25.000137329101562, "global_step": 225302, "epoch": 2714} {"train_loss": -25.048452377319336, "global_step": 225303, "epoch": 2714} {"train_loss": -24.756196975708008, "global_step": 225304, "epoch": 2714} {"train_loss": -24.90007972717285, "global_step": 225305, "epoch": 2714} {"train_loss": -24.59360694885254, "global_step": 225306, "epoch": 2714} {"train_loss": -24.826351165771484, "global_step": 225307, "epoch": 2714} {"train_loss": -24.809982299804688, "global_step": 225308, "epoch": 2714} {"train_loss": -24.910011291503906, "global_step": 225309, "epoch": 2714} {"train_loss": -24.655580520629883, "global_step": 225310, "epoch": 2714} {"train_loss": -24.901525497436523, "global_step": 225311, "epoch": 2714} {"train_loss": -25.05817222595215, "global_step": 225312, "epoch": 2714} {"train_loss": -25.186229705810547, "global_step": 225313, "epoch": 2714} {"train_loss": -24.652692794799805, "global_step": 225314, "epoch": 2714} {"train_loss": -24.9851016998291, "global_step": 225315, "epoch": 2714} {"train_loss": -24.73642921447754, "global_step": 225316, "epoch": 2714} {"train_loss": -24.75965690612793, "global_step": 225317, "epoch": 2714} {"train_loss": -24.889326095581055, "global_step": 225318, "epoch": 2714} {"train_loss": -24.76299285888672, "global_step": 225319, "epoch": 2714} {"train_loss": -24.695011138916016, "global_step": 225320, "epoch": 2714} {"train_loss": -24.68006134033203, "global_step": 225321, "epoch": 2714} {"train_loss": -24.97197914123535, "global_step": 225322, "epoch": 2714} {"train_loss": -24.789342880249023, "global_step": 225323, "epoch": 2714} {"train_loss": -24.8580265045166, "global_step": 225324, "epoch": 2714} {"train_loss": -24.46268081665039, "global_step": 225325, "epoch": 2714} {"train_loss": -24.8508358001709, "global_step": 225326, "epoch": 2714} {"train_loss": -25.213672637939453, "global_step": 225327, "epoch": 2714} {"train_loss": -25.16688346862793, "global_step": 225328, "epoch": 2714} {"train_loss": -24.59881591796875, "global_step": 225329, "epoch": 2714} {"train_loss": -24.241317749023438, "global_step": 225330, "epoch": 2714} {"train_loss": -24.314279556274414, "global_step": 225331, "epoch": 2714} {"train_loss": -24.32363510131836, "global_step": 225332, "epoch": 2714} {"train_loss": -24.39511489868164, "global_step": 225333, "epoch": 2714} {"train_loss": -24.827289581298828, "global_step": 225334, "epoch": 2714} {"train_loss": -24.242752075195312, "global_step": 225335, "epoch": 2714} {"train_loss": -24.79886817932129, "global_step": 225336, "epoch": 2714} {"train_loss": -24.756296157836914, "global_step": 225337, "epoch": 2714} {"train_loss": -24.732397079467773, "global_step": 225338, "epoch": 2714} {"train_loss": -24.931167602539062, "global_step": 225339, "epoch": 2714} {"train_loss": -25.03631591796875, "global_step": 225340, "epoch": 2714} {"train_loss": -24.818021774291992, "global_step": 225341, "epoch": 2714} {"train_loss": -24.80173110961914, "global_step": 225342, "epoch": 2714} {"train_loss": -24.93634605407715, "global_step": 225343, "epoch": 2714} {"train_loss": -24.635971850659473, "global_step": 225344, "epoch": 2714, "val_loss": 6751167.0} {"train_loss": -23.986955642700195, "global_step": 225345, "epoch": 2715} {"train_loss": -24.057531356811523, "global_step": 225346, "epoch": 2715} {"train_loss": -24.21453094482422, "global_step": 225347, "epoch": 2715} {"train_loss": -24.074481964111328, "global_step": 225348, "epoch": 2715} {"train_loss": -23.745304107666016, "global_step": 225349, "epoch": 2715} {"train_loss": -24.388690948486328, "global_step": 225350, "epoch": 2715} {"train_loss": -24.13484764099121, "global_step": 225351, "epoch": 2715} {"train_loss": -24.136716842651367, "global_step": 225352, "epoch": 2715} {"train_loss": -24.0332088470459, "global_step": 225353, "epoch": 2715} {"train_loss": -23.974897384643555, "global_step": 225354, "epoch": 2715} {"train_loss": -24.530872344970703, "global_step": 225355, "epoch": 2715} {"train_loss": -24.24772834777832, "global_step": 225356, "epoch": 2715} {"train_loss": -24.317033767700195, "global_step": 225357, "epoch": 2715} {"train_loss": -24.439483642578125, "global_step": 225358, "epoch": 2715} {"train_loss": -24.59021759033203, "global_step": 225359, "epoch": 2715} {"train_loss": -24.38151741027832, "global_step": 225360, "epoch": 2715} {"train_loss": -24.54205322265625, "global_step": 225361, "epoch": 2715} {"train_loss": -24.459579467773438, "global_step": 225362, "epoch": 2715} {"train_loss": -24.631561279296875, "global_step": 225363, "epoch": 2715} {"train_loss": -24.392009735107422, "global_step": 225364, "epoch": 2715} {"train_loss": -24.765806198120117, "global_step": 225365, "epoch": 2715} {"train_loss": -24.49018096923828, "global_step": 225366, "epoch": 2715} {"train_loss": -24.341787338256836, "global_step": 225367, "epoch": 2715} {"train_loss": -24.51974868774414, "global_step": 225368, "epoch": 2715} {"train_loss": -24.61136245727539, "global_step": 225369, "epoch": 2715} {"train_loss": -24.672286987304688, "global_step": 225370, "epoch": 2715} {"train_loss": -24.391225814819336, "global_step": 225371, "epoch": 2715} {"train_loss": -24.644136428833008, "global_step": 225372, "epoch": 2715} {"train_loss": -24.42349624633789, "global_step": 225373, "epoch": 2715} {"train_loss": -24.342782974243164, "global_step": 225374, "epoch": 2715} {"train_loss": -24.402450561523438, "global_step": 225375, "epoch": 2715} {"train_loss": -24.982343673706055, "global_step": 225376, "epoch": 2715} {"train_loss": -24.645421981811523, "global_step": 225377, "epoch": 2715} {"train_loss": -24.644805908203125, "global_step": 225378, "epoch": 2715} {"train_loss": -24.429540634155273, "global_step": 225379, "epoch": 2715} {"train_loss": -24.749635696411133, "global_step": 225380, "epoch": 2715} {"train_loss": -24.674015045166016, "global_step": 225381, "epoch": 2715} {"train_loss": -24.735143661499023, "global_step": 225382, "epoch": 2715} {"train_loss": -24.5576229095459, "global_step": 225383, "epoch": 2715} {"train_loss": -24.85329818725586, "global_step": 225384, "epoch": 2715} {"train_loss": -25.093950271606445, "global_step": 225385, "epoch": 2715} {"train_loss": -25.14900779724121, "global_step": 225386, "epoch": 2715} {"train_loss": -24.699214935302734, "global_step": 225387, "epoch": 2715} {"train_loss": -24.945453643798828, "global_step": 225388, "epoch": 2715} {"train_loss": -24.853256225585938, "global_step": 225389, "epoch": 2715} {"train_loss": -24.93628692626953, "global_step": 225390, "epoch": 2715} {"train_loss": -24.70697593688965, "global_step": 225391, "epoch": 2715} {"train_loss": -24.993101119995117, "global_step": 225392, "epoch": 2715} {"train_loss": -24.709243774414062, "global_step": 225393, "epoch": 2715} {"train_loss": -24.550561904907227, "global_step": 225394, "epoch": 2715} {"train_loss": -24.724538803100586, "global_step": 225395, "epoch": 2715} {"train_loss": -24.693410873413086, "global_step": 225396, "epoch": 2715} {"train_loss": -24.8360652923584, "global_step": 225397, "epoch": 2715} {"train_loss": -24.766035079956055, "global_step": 225398, "epoch": 2715} {"train_loss": -24.961673736572266, "global_step": 225399, "epoch": 2715} {"train_loss": -24.686813354492188, "global_step": 225400, "epoch": 2715} {"train_loss": -24.905122756958008, "global_step": 225401, "epoch": 2715} {"train_loss": -24.70576286315918, "global_step": 225402, "epoch": 2715} {"train_loss": -24.979114532470703, "global_step": 225403, "epoch": 2715} {"train_loss": -24.51382064819336, "global_step": 225404, "epoch": 2715} {"train_loss": -24.38021469116211, "global_step": 225405, "epoch": 2715} {"train_loss": -24.701932907104492, "global_step": 225406, "epoch": 2715} {"train_loss": -24.513673782348633, "global_step": 225407, "epoch": 2715} {"train_loss": -24.9269962310791, "global_step": 225408, "epoch": 2715} {"train_loss": -24.822086334228516, "global_step": 225409, "epoch": 2715} {"train_loss": -24.61751365661621, "global_step": 225410, "epoch": 2715} {"train_loss": -24.659229278564453, "global_step": 225411, "epoch": 2715} {"train_loss": -24.832733154296875, "global_step": 225412, "epoch": 2715} {"train_loss": -24.893173217773438, "global_step": 225413, "epoch": 2715} {"train_loss": -24.800222396850586, "global_step": 225414, "epoch": 2715} {"train_loss": -24.740690231323242, "global_step": 225415, "epoch": 2715} {"train_loss": -25.094533920288086, "global_step": 225416, "epoch": 2715} {"train_loss": -24.528295516967773, "global_step": 225417, "epoch": 2715} {"train_loss": -24.565046310424805, "global_step": 225418, "epoch": 2715} {"train_loss": -24.988422393798828, "global_step": 225419, "epoch": 2715} {"train_loss": -24.642620086669922, "global_step": 225420, "epoch": 2715} {"train_loss": -24.590776443481445, "global_step": 225421, "epoch": 2715} {"train_loss": -25.084135055541992, "global_step": 225422, "epoch": 2715} {"train_loss": -24.600351333618164, "global_step": 225423, "epoch": 2715} {"train_loss": -24.72430419921875, "global_step": 225424, "epoch": 2715} {"train_loss": -24.560428619384766, "global_step": 225425, "epoch": 2715} {"train_loss": -24.66615104675293, "global_step": 225426, "epoch": 2715} {"train_loss": -24.596357966043865, "global_step": 225427, "epoch": 2715, "val_loss": 6796081.5} {"train_loss": -24.37501335144043, "global_step": 225428, "epoch": 2716} {"train_loss": -23.52593421936035, "global_step": 225429, "epoch": 2716} {"train_loss": -24.226890563964844, "global_step": 225430, "epoch": 2716} {"train_loss": -23.748319625854492, "global_step": 225431, "epoch": 2716} {"train_loss": -24.282283782958984, "global_step": 225432, "epoch": 2716} {"train_loss": -23.616052627563477, "global_step": 225433, "epoch": 2716} {"train_loss": -24.19284439086914, "global_step": 225434, "epoch": 2716} {"train_loss": -23.981693267822266, "global_step": 225435, "epoch": 2716} {"train_loss": -24.049787521362305, "global_step": 225436, "epoch": 2716} {"train_loss": -24.571277618408203, "global_step": 225437, "epoch": 2716} {"train_loss": -23.874067306518555, "global_step": 225438, "epoch": 2716} {"train_loss": -24.527830123901367, "global_step": 225439, "epoch": 2716} {"train_loss": -24.16364288330078, "global_step": 225440, "epoch": 2716} {"train_loss": -24.398418426513672, "global_step": 225441, "epoch": 2716} {"train_loss": -24.28537940979004, "global_step": 225442, "epoch": 2716} {"train_loss": -24.56722068786621, "global_step": 225443, "epoch": 2716} {"train_loss": -23.948413848876953, "global_step": 225444, "epoch": 2716} {"train_loss": -24.097339630126953, "global_step": 225445, "epoch": 2716} {"train_loss": -24.281232833862305, "global_step": 225446, "epoch": 2716} {"train_loss": -24.508056640625, "global_step": 225447, "epoch": 2716} {"train_loss": -24.067245483398438, "global_step": 225448, "epoch": 2716} {"train_loss": -24.389986038208008, "global_step": 225449, "epoch": 2716} {"train_loss": -24.16377067565918, "global_step": 225450, "epoch": 2716} {"train_loss": -24.5491886138916, "global_step": 225451, "epoch": 2716} {"train_loss": -24.51934242248535, "global_step": 225452, "epoch": 2716} {"train_loss": -24.112165451049805, "global_step": 225453, "epoch": 2716} {"train_loss": -24.391996383666992, "global_step": 225454, "epoch": 2716} {"train_loss": -24.37525749206543, "global_step": 225455, "epoch": 2716} {"train_loss": -24.043004989624023, "global_step": 225456, "epoch": 2716} {"train_loss": -24.42653465270996, "global_step": 225457, "epoch": 2716} {"train_loss": -24.35933494567871, "global_step": 225458, "epoch": 2716} {"train_loss": -24.821882247924805, "global_step": 225459, "epoch": 2716} {"train_loss": -24.45411491394043, "global_step": 225460, "epoch": 2716} {"train_loss": -24.365779876708984, "global_step": 225461, "epoch": 2716} {"train_loss": -24.73528480529785, "global_step": 225462, "epoch": 2716} {"train_loss": -24.530858993530273, "global_step": 225463, "epoch": 2716} {"train_loss": -24.49228286743164, "global_step": 225464, "epoch": 2716} {"train_loss": -24.59832191467285, "global_step": 225465, "epoch": 2716} {"train_loss": -24.514677047729492, "global_step": 225466, "epoch": 2716} {"train_loss": -24.474327087402344, "global_step": 225467, "epoch": 2716} {"train_loss": -24.36590576171875, "global_step": 225468, "epoch": 2716} {"train_loss": -24.506521224975586, "global_step": 225469, "epoch": 2716} {"train_loss": -24.480546951293945, "global_step": 225470, "epoch": 2716} {"train_loss": -24.47279930114746, "global_step": 225471, "epoch": 2716} {"train_loss": -24.51300621032715, "global_step": 225472, "epoch": 2716} {"train_loss": -25.023334503173828, "global_step": 225473, "epoch": 2716} {"train_loss": -24.810108184814453, "global_step": 225474, "epoch": 2716} {"train_loss": -24.414228439331055, "global_step": 225475, "epoch": 2716} {"train_loss": -24.76045799255371, "global_step": 225476, "epoch": 2716} {"train_loss": -24.58057403564453, "global_step": 225477, "epoch": 2716} {"train_loss": -24.953702926635742, "global_step": 225478, "epoch": 2716} {"train_loss": -24.53290367126465, "global_step": 225479, "epoch": 2716} {"train_loss": -24.511167526245117, "global_step": 225480, "epoch": 2716} {"train_loss": -24.98719596862793, "global_step": 225481, "epoch": 2716} {"train_loss": -24.834522247314453, "global_step": 225482, "epoch": 2716} {"train_loss": -24.914352416992188, "global_step": 225483, "epoch": 2716} {"train_loss": -24.113245010375977, "global_step": 225484, "epoch": 2716} {"train_loss": -24.49366569519043, "global_step": 225485, "epoch": 2716} {"train_loss": -25.082616806030273, "global_step": 225486, "epoch": 2716} {"train_loss": -24.426969528198242, "global_step": 225487, "epoch": 2716} {"train_loss": -24.84395408630371, "global_step": 225488, "epoch": 2716} {"train_loss": -25.03907585144043, "global_step": 225489, "epoch": 2716} {"train_loss": -24.876235961914062, "global_step": 225490, "epoch": 2716} {"train_loss": -24.676929473876953, "global_step": 225491, "epoch": 2716} {"train_loss": -24.310407638549805, "global_step": 225492, "epoch": 2716} {"train_loss": -24.519357681274414, "global_step": 225493, "epoch": 2716} {"train_loss": -24.794349670410156, "global_step": 225494, "epoch": 2716} {"train_loss": -25.034015655517578, "global_step": 225495, "epoch": 2716} {"train_loss": -24.890850067138672, "global_step": 225496, "epoch": 2716} {"train_loss": -24.704450607299805, "global_step": 225497, "epoch": 2716} {"train_loss": -24.72529411315918, "global_step": 225498, "epoch": 2716} {"train_loss": -24.346364974975586, "global_step": 225499, "epoch": 2716} {"train_loss": -24.885406494140625, "global_step": 225500, "epoch": 2716} {"train_loss": -24.505748748779297, "global_step": 225501, "epoch": 2716} {"train_loss": -24.662839889526367, "global_step": 225502, "epoch": 2716} {"train_loss": -24.251867294311523, "global_step": 225503, "epoch": 2716} {"train_loss": -25.009119033813477, "global_step": 225504, "epoch": 2716} {"train_loss": -24.949321746826172, "global_step": 225505, "epoch": 2716} {"train_loss": -24.60743522644043, "global_step": 225506, "epoch": 2716} {"train_loss": -24.19666862487793, "global_step": 225507, "epoch": 2716} {"train_loss": -24.73719596862793, "global_step": 225508, "epoch": 2716} {"train_loss": -24.30670738220215, "global_step": 225509, "epoch": 2716} {"train_loss": -24.465253370353974, "global_step": 225510, "epoch": 2716, "val_loss": 6861761.0} {"train_loss": -22.308841705322266, "global_step": 225511, "epoch": 2717} {"train_loss": -24.27425193786621, "global_step": 225512, "epoch": 2717} {"train_loss": -22.538782119750977, "global_step": 225513, "epoch": 2717} {"train_loss": -23.363889694213867, "global_step": 225514, "epoch": 2717} {"train_loss": -23.184459686279297, "global_step": 225515, "epoch": 2717} {"train_loss": -23.633817672729492, "global_step": 225516, "epoch": 2717} {"train_loss": -23.436771392822266, "global_step": 225517, "epoch": 2717} {"train_loss": -23.464191436767578, "global_step": 225518, "epoch": 2717} {"train_loss": -23.917837142944336, "global_step": 225519, "epoch": 2717} {"train_loss": -23.80735206604004, "global_step": 225520, "epoch": 2717} {"train_loss": -24.016376495361328, "global_step": 225521, "epoch": 2717} {"train_loss": -23.439739227294922, "global_step": 225522, "epoch": 2717} {"train_loss": -23.797216415405273, "global_step": 225523, "epoch": 2717} {"train_loss": -23.59986686706543, "global_step": 225524, "epoch": 2717} {"train_loss": -24.140914916992188, "global_step": 225525, "epoch": 2717} {"train_loss": -24.111759185791016, "global_step": 225526, "epoch": 2717} {"train_loss": -24.162065505981445, "global_step": 225527, "epoch": 2717} {"train_loss": -24.081899642944336, "global_step": 225528, "epoch": 2717} {"train_loss": -23.909116744995117, "global_step": 225529, "epoch": 2717} {"train_loss": -24.428571701049805, "global_step": 225530, "epoch": 2717} {"train_loss": -24.114194869995117, "global_step": 225531, "epoch": 2717} {"train_loss": -24.309553146362305, "global_step": 225532, "epoch": 2717} {"train_loss": -24.439800262451172, "global_step": 225533, "epoch": 2717} {"train_loss": -24.240156173706055, "global_step": 225534, "epoch": 2717} {"train_loss": -24.35808563232422, "global_step": 225535, "epoch": 2717} {"train_loss": -24.434396743774414, "global_step": 225536, "epoch": 2717} {"train_loss": -24.376880645751953, "global_step": 225537, "epoch": 2717} {"train_loss": -24.305835723876953, "global_step": 225538, "epoch": 2717} {"train_loss": -24.2264461517334, "global_step": 225539, "epoch": 2717} {"train_loss": -24.640827178955078, "global_step": 225540, "epoch": 2717} {"train_loss": -24.14348793029785, "global_step": 225541, "epoch": 2717} {"train_loss": -24.14693260192871, "global_step": 225542, "epoch": 2717} {"train_loss": -24.443195343017578, "global_step": 225543, "epoch": 2717} {"train_loss": -24.12241554260254, "global_step": 225544, "epoch": 2717} {"train_loss": -24.38225746154785, "global_step": 225545, "epoch": 2717} {"train_loss": -24.343942642211914, "global_step": 225546, "epoch": 2717} {"train_loss": -24.590625762939453, "global_step": 225547, "epoch": 2717} {"train_loss": -24.574514389038086, "global_step": 225548, "epoch": 2717} {"train_loss": -24.313194274902344, "global_step": 225549, "epoch": 2717} {"train_loss": -24.536924362182617, "global_step": 225550, "epoch": 2717} {"train_loss": -24.7166748046875, "global_step": 225551, "epoch": 2717} {"train_loss": -24.662240982055664, "global_step": 225552, "epoch": 2717} {"train_loss": -24.0306453704834, "global_step": 225553, "epoch": 2717} {"train_loss": -24.812984466552734, "global_step": 225554, "epoch": 2717} {"train_loss": -24.63150978088379, "global_step": 225555, "epoch": 2717} {"train_loss": -24.456012725830078, "global_step": 225556, "epoch": 2717} {"train_loss": -24.4525146484375, "global_step": 225557, "epoch": 2717} {"train_loss": -24.574369430541992, "global_step": 225558, "epoch": 2717} {"train_loss": -24.430572509765625, "global_step": 225559, "epoch": 2717} {"train_loss": -24.85879898071289, "global_step": 225560, "epoch": 2717} {"train_loss": -24.882164001464844, "global_step": 225561, "epoch": 2717} {"train_loss": -24.545339584350586, "global_step": 225562, "epoch": 2717} {"train_loss": -24.848310470581055, "global_step": 225563, "epoch": 2717} {"train_loss": -24.70418930053711, "global_step": 225564, "epoch": 2717} {"train_loss": -24.697967529296875, "global_step": 225565, "epoch": 2717} {"train_loss": -24.710594177246094, "global_step": 225566, "epoch": 2717} {"train_loss": -24.966909408569336, "global_step": 225567, "epoch": 2717} {"train_loss": -24.854345321655273, "global_step": 225568, "epoch": 2717} {"train_loss": -24.84358787536621, "global_step": 225569, "epoch": 2717} {"train_loss": -24.400775909423828, "global_step": 225570, "epoch": 2717} {"train_loss": -25.12285804748535, "global_step": 225571, "epoch": 2717} {"train_loss": -24.7744140625, "global_step": 225572, "epoch": 2717} {"train_loss": -24.654590606689453, "global_step": 225573, "epoch": 2717} {"train_loss": -24.483795166015625, "global_step": 225574, "epoch": 2717} {"train_loss": -24.848546981811523, "global_step": 225575, "epoch": 2717} {"train_loss": -24.340909957885742, "global_step": 225576, "epoch": 2717} {"train_loss": -24.460432052612305, "global_step": 225577, "epoch": 2717} {"train_loss": -24.91937828063965, "global_step": 225578, "epoch": 2717} {"train_loss": -24.41895866394043, "global_step": 225579, "epoch": 2717} {"train_loss": -24.71854019165039, "global_step": 225580, "epoch": 2717} {"train_loss": -25.10713005065918, "global_step": 225581, "epoch": 2717} {"train_loss": -24.93585777282715, "global_step": 225582, "epoch": 2717} {"train_loss": -24.6541805267334, "global_step": 225583, "epoch": 2717} {"train_loss": -24.878625869750977, "global_step": 225584, "epoch": 2717} {"train_loss": -24.79262351989746, "global_step": 225585, "epoch": 2717} {"train_loss": -24.787137985229492, "global_step": 225586, "epoch": 2717} {"train_loss": -25.084789276123047, "global_step": 225587, "epoch": 2717} {"train_loss": -24.79401206970215, "global_step": 225588, "epoch": 2717} {"train_loss": -24.716007232666016, "global_step": 225589, "epoch": 2717} {"train_loss": -24.333465576171875, "global_step": 225590, "epoch": 2717} {"train_loss": -24.787023544311523, "global_step": 225591, "epoch": 2717} {"train_loss": -24.958175659179688, "global_step": 225592, "epoch": 2717} {"train_loss": -24.39421058562865, "global_step": 225593, "epoch": 2717, "val_loss": 6776637.0} {"train_loss": -23.45408821105957, "global_step": 225594, "epoch": 2718} {"train_loss": -23.920623779296875, "global_step": 225595, "epoch": 2718} {"train_loss": -24.19996452331543, "global_step": 225596, "epoch": 2718} {"train_loss": -23.941308975219727, "global_step": 225597, "epoch": 2718} {"train_loss": -24.41839599609375, "global_step": 225598, "epoch": 2718} {"train_loss": -24.3170166015625, "global_step": 225599, "epoch": 2718} {"train_loss": -24.180471420288086, "global_step": 225600, "epoch": 2718} {"train_loss": -23.879140853881836, "global_step": 225601, "epoch": 2718} {"train_loss": -24.066789627075195, "global_step": 225602, "epoch": 2718} {"train_loss": -24.442033767700195, "global_step": 225603, "epoch": 2718} {"train_loss": -24.074007034301758, "global_step": 225604, "epoch": 2718} {"train_loss": -24.131956100463867, "global_step": 225605, "epoch": 2718} {"train_loss": -24.757192611694336, "global_step": 225606, "epoch": 2718} {"train_loss": -24.135269165039062, "global_step": 225607, "epoch": 2718} {"train_loss": -23.93001937866211, "global_step": 225608, "epoch": 2718} {"train_loss": -24.186840057373047, "global_step": 225609, "epoch": 2718} {"train_loss": -24.466876983642578, "global_step": 225610, "epoch": 2718} {"train_loss": -24.088836669921875, "global_step": 225611, "epoch": 2718} {"train_loss": -24.764707565307617, "global_step": 225612, "epoch": 2718} {"train_loss": -24.573932647705078, "global_step": 225613, "epoch": 2718} {"train_loss": -24.64581298828125, "global_step": 225614, "epoch": 2718} {"train_loss": -24.54193687438965, "global_step": 225615, "epoch": 2718} {"train_loss": -24.740558624267578, "global_step": 225616, "epoch": 2718} {"train_loss": -24.674365997314453, "global_step": 225617, "epoch": 2718} {"train_loss": -24.461156845092773, "global_step": 225618, "epoch": 2718} {"train_loss": -24.7547664642334, "global_step": 225619, "epoch": 2718} {"train_loss": -24.50020408630371, "global_step": 225620, "epoch": 2718} {"train_loss": -24.33475112915039, "global_step": 225621, "epoch": 2718} {"train_loss": -24.55339241027832, "global_step": 225622, "epoch": 2718} {"train_loss": -24.53291893005371, "global_step": 225623, "epoch": 2718} {"train_loss": -24.621091842651367, "global_step": 225624, "epoch": 2718} {"train_loss": -24.704837799072266, "global_step": 225625, "epoch": 2718} {"train_loss": -24.799062728881836, "global_step": 225626, "epoch": 2718} {"train_loss": -25.014476776123047, "global_step": 225627, "epoch": 2718} {"train_loss": -24.592544555664062, "global_step": 225628, "epoch": 2718} {"train_loss": -24.944955825805664, "global_step": 225629, "epoch": 2718} {"train_loss": -25.040483474731445, "global_step": 225630, "epoch": 2718} {"train_loss": -25.004243850708008, "global_step": 225631, "epoch": 2718} {"train_loss": -24.704172134399414, "global_step": 225632, "epoch": 2718} {"train_loss": -24.737199783325195, "global_step": 225633, "epoch": 2718} {"train_loss": -24.658567428588867, "global_step": 225634, "epoch": 2718} {"train_loss": -24.818986892700195, "global_step": 225635, "epoch": 2718} {"train_loss": -25.186256408691406, "global_step": 225636, "epoch": 2718} {"train_loss": -24.681215286254883, "global_step": 225637, "epoch": 2718} {"train_loss": -25.08688735961914, "global_step": 225638, "epoch": 2718} {"train_loss": -25.020538330078125, "global_step": 225639, "epoch": 2718} {"train_loss": -25.007827758789062, "global_step": 225640, "epoch": 2718} {"train_loss": -24.650495529174805, "global_step": 225641, "epoch": 2718} {"train_loss": -24.488027572631836, "global_step": 225642, "epoch": 2718} {"train_loss": -24.685348510742188, "global_step": 225643, "epoch": 2718} {"train_loss": -24.812204360961914, "global_step": 225644, "epoch": 2718} {"train_loss": -24.231977462768555, "global_step": 225645, "epoch": 2718} {"train_loss": -24.164541244506836, "global_step": 225646, "epoch": 2718} {"train_loss": -24.142398834228516, "global_step": 225647, "epoch": 2718} {"train_loss": -24.534366607666016, "global_step": 225648, "epoch": 2718} {"train_loss": -24.61260986328125, "global_step": 225649, "epoch": 2718} {"train_loss": -24.31342887878418, "global_step": 225650, "epoch": 2718} {"train_loss": -24.518396377563477, "global_step": 225651, "epoch": 2718} {"train_loss": -24.482376098632812, "global_step": 225652, "epoch": 2718} {"train_loss": -24.547382354736328, "global_step": 225653, "epoch": 2718} {"train_loss": -24.336280822753906, "global_step": 225654, "epoch": 2718} {"train_loss": -24.515121459960938, "global_step": 225655, "epoch": 2718} {"train_loss": -24.27581787109375, "global_step": 225656, "epoch": 2718} {"train_loss": -24.565977096557617, "global_step": 225657, "epoch": 2718} {"train_loss": -24.438629150390625, "global_step": 225658, "epoch": 2718} {"train_loss": -24.523197174072266, "global_step": 225659, "epoch": 2718} {"train_loss": -24.847684860229492, "global_step": 225660, "epoch": 2718} {"train_loss": -24.584314346313477, "global_step": 225661, "epoch": 2718} {"train_loss": -24.664546966552734, "global_step": 225662, "epoch": 2718} {"train_loss": -24.372817993164062, "global_step": 225663, "epoch": 2718} {"train_loss": -24.362720489501953, "global_step": 225664, "epoch": 2718} {"train_loss": -24.532630920410156, "global_step": 225665, "epoch": 2718} {"train_loss": -24.830524444580078, "global_step": 225666, "epoch": 2718} {"train_loss": -24.5482234954834, "global_step": 225667, "epoch": 2718} {"train_loss": -24.888463973999023, "global_step": 225668, "epoch": 2718} {"train_loss": -24.500104904174805, "global_step": 225669, "epoch": 2718} {"train_loss": -24.751577377319336, "global_step": 225670, "epoch": 2718} {"train_loss": -24.776975631713867, "global_step": 225671, "epoch": 2718} {"train_loss": -24.432653427124023, "global_step": 225672, "epoch": 2718} {"train_loss": -24.624242782592773, "global_step": 225673, "epoch": 2718} {"train_loss": -24.484373092651367, "global_step": 225674, "epoch": 2718} {"train_loss": -24.81254005432129, "global_step": 225675, "epoch": 2718} {"train_loss": -24.517894331231176, "global_step": 225676, "epoch": 2718, "val_loss": 6529214.0} {"train_loss": -23.67993927001953, "global_step": 225677, "epoch": 2719} {"train_loss": -24.049680709838867, "global_step": 225678, "epoch": 2719} {"train_loss": -23.984506607055664, "global_step": 225679, "epoch": 2719} {"train_loss": -24.01105308532715, "global_step": 225680, "epoch": 2719} {"train_loss": -24.35382080078125, "global_step": 225681, "epoch": 2719} {"train_loss": -23.93815040588379, "global_step": 225682, "epoch": 2719} {"train_loss": -23.800857543945312, "global_step": 225683, "epoch": 2719} {"train_loss": -24.502161026000977, "global_step": 225684, "epoch": 2719} {"train_loss": -24.111236572265625, "global_step": 225685, "epoch": 2719} {"train_loss": -24.315954208374023, "global_step": 225686, "epoch": 2719} {"train_loss": -24.20444107055664, "global_step": 225687, "epoch": 2719} {"train_loss": -24.680578231811523, "global_step": 225688, "epoch": 2719} {"train_loss": -24.66534423828125, "global_step": 225689, "epoch": 2719} {"train_loss": -24.065505981445312, "global_step": 225690, "epoch": 2719} {"train_loss": -24.447690963745117, "global_step": 225691, "epoch": 2719} {"train_loss": -24.118070602416992, "global_step": 225692, "epoch": 2719} {"train_loss": -24.57931137084961, "global_step": 225693, "epoch": 2719} {"train_loss": -24.461137771606445, "global_step": 225694, "epoch": 2719} {"train_loss": -24.36348533630371, "global_step": 225695, "epoch": 2719} {"train_loss": -24.61807632446289, "global_step": 225696, "epoch": 2719} {"train_loss": -24.564828872680664, "global_step": 225697, "epoch": 2719} {"train_loss": -24.756683349609375, "global_step": 225698, "epoch": 2719} {"train_loss": -24.539714813232422, "global_step": 225699, "epoch": 2719} {"train_loss": -24.655057907104492, "global_step": 225700, "epoch": 2719} {"train_loss": -24.63953971862793, "global_step": 225701, "epoch": 2719} {"train_loss": -24.559982299804688, "global_step": 225702, "epoch": 2719} {"train_loss": -24.734683990478516, "global_step": 225703, "epoch": 2719} {"train_loss": -24.355024337768555, "global_step": 225704, "epoch": 2719} {"train_loss": -24.61128044128418, "global_step": 225705, "epoch": 2719} {"train_loss": -24.663145065307617, "global_step": 225706, "epoch": 2719} {"train_loss": -24.40471076965332, "global_step": 225707, "epoch": 2719} {"train_loss": -25.24676513671875, "global_step": 225708, "epoch": 2719} {"train_loss": -24.58563804626465, "global_step": 225709, "epoch": 2719} {"train_loss": -24.611967086791992, "global_step": 225710, "epoch": 2719} {"train_loss": -24.67818260192871, "global_step": 225711, "epoch": 2719} {"train_loss": -24.409147262573242, "global_step": 225712, "epoch": 2719} {"train_loss": -24.392160415649414, "global_step": 225713, "epoch": 2719} {"train_loss": -24.673980712890625, "global_step": 225714, "epoch": 2719} {"train_loss": -24.69390296936035, "global_step": 225715, "epoch": 2719} {"train_loss": -25.112991333007812, "global_step": 225716, "epoch": 2719} {"train_loss": -24.562402725219727, "global_step": 225717, "epoch": 2719} {"train_loss": -24.64198875427246, "global_step": 225718, "epoch": 2719} {"train_loss": -24.528305053710938, "global_step": 225719, "epoch": 2719} {"train_loss": -24.751266479492188, "global_step": 225720, "epoch": 2719} {"train_loss": -24.293354034423828, "global_step": 225721, "epoch": 2719} {"train_loss": -24.52121925354004, "global_step": 225722, "epoch": 2719} {"train_loss": -24.48655128479004, "global_step": 225723, "epoch": 2719} {"train_loss": -24.745521545410156, "global_step": 225724, "epoch": 2719} {"train_loss": -24.564733505249023, "global_step": 225725, "epoch": 2719} {"train_loss": -24.375215530395508, "global_step": 225726, "epoch": 2719} {"train_loss": -25.141937255859375, "global_step": 225727, "epoch": 2719} {"train_loss": -24.639541625976562, "global_step": 225728, "epoch": 2719} {"train_loss": -24.30709457397461, "global_step": 225729, "epoch": 2719} {"train_loss": -24.25177001953125, "global_step": 225730, "epoch": 2719} {"train_loss": -24.39058494567871, "global_step": 225731, "epoch": 2719} {"train_loss": -24.5226993560791, "global_step": 225732, "epoch": 2719} {"train_loss": -24.464496612548828, "global_step": 225733, "epoch": 2719} {"train_loss": -24.479154586791992, "global_step": 225734, "epoch": 2719} {"train_loss": -24.51741600036621, "global_step": 225735, "epoch": 2719} {"train_loss": -24.690149307250977, "global_step": 225736, "epoch": 2719} {"train_loss": -25.052202224731445, "global_step": 225737, "epoch": 2719} {"train_loss": -24.455801010131836, "global_step": 225738, "epoch": 2719} {"train_loss": -24.608064651489258, "global_step": 225739, "epoch": 2719} {"train_loss": -24.423240661621094, "global_step": 225740, "epoch": 2719} {"train_loss": -25.02045249938965, "global_step": 225741, "epoch": 2719} {"train_loss": -24.73512840270996, "global_step": 225742, "epoch": 2719} {"train_loss": -24.621479034423828, "global_step": 225743, "epoch": 2719} {"train_loss": -24.51634407043457, "global_step": 225744, "epoch": 2719} {"train_loss": -24.805028915405273, "global_step": 225745, "epoch": 2719} {"train_loss": -24.406387329101562, "global_step": 225746, "epoch": 2719} {"train_loss": -24.759382247924805, "global_step": 225747, "epoch": 2719} {"train_loss": -24.831281661987305, "global_step": 225748, "epoch": 2719} {"train_loss": -24.941665649414062, "global_step": 225749, "epoch": 2719} {"train_loss": -24.49700355529785, "global_step": 225750, "epoch": 2719} {"train_loss": -24.65497589111328, "global_step": 225751, "epoch": 2719} {"train_loss": -24.870237350463867, "global_step": 225752, "epoch": 2719} {"train_loss": -24.374242782592773, "global_step": 225753, "epoch": 2719} {"train_loss": -24.32441520690918, "global_step": 225754, "epoch": 2719} {"train_loss": -24.4711856842041, "global_step": 225755, "epoch": 2719} {"train_loss": -25.027389526367188, "global_step": 225756, "epoch": 2719} {"train_loss": -24.427528381347656, "global_step": 225757, "epoch": 2719} {"train_loss": -24.522680282592773, "global_step": 225758, "epoch": 2719} {"train_loss": -24.523452965609998, "global_step": 225759, "epoch": 2719, "val_loss": 6657589.0} {"train_loss": -24.70477294921875, "global_step": 225760, "epoch": 2720} {"train_loss": -24.425323486328125, "global_step": 225761, "epoch": 2720} {"train_loss": -24.574565887451172, "global_step": 225762, "epoch": 2720} {"train_loss": -24.82782745361328, "global_step": 225763, "epoch": 2720} {"train_loss": -24.36149787902832, "global_step": 225764, "epoch": 2720} {"train_loss": -24.29036521911621, "global_step": 225765, "epoch": 2720} {"train_loss": -24.2808780670166, "global_step": 225766, "epoch": 2720} {"train_loss": -24.494003295898438, "global_step": 225767, "epoch": 2720} {"train_loss": -24.304637908935547, "global_step": 225768, "epoch": 2720} {"train_loss": -24.21919059753418, "global_step": 225769, "epoch": 2720} {"train_loss": -24.42051124572754, "global_step": 225770, "epoch": 2720} {"train_loss": -24.43834114074707, "global_step": 225771, "epoch": 2720} {"train_loss": -24.425537109375, "global_step": 225772, "epoch": 2720} {"train_loss": -24.55242347717285, "global_step": 225773, "epoch": 2720} {"train_loss": -24.358449935913086, "global_step": 225774, "epoch": 2720} {"train_loss": -24.62787437438965, "global_step": 225775, "epoch": 2720} {"train_loss": -24.658222198486328, "global_step": 225776, "epoch": 2720} {"train_loss": -24.865339279174805, "global_step": 225777, "epoch": 2720} {"train_loss": -24.6866512298584, "global_step": 225778, "epoch": 2720} {"train_loss": -24.76215934753418, "global_step": 225779, "epoch": 2720} {"train_loss": -24.42911148071289, "global_step": 225780, "epoch": 2720} {"train_loss": -24.261459350585938, "global_step": 225781, "epoch": 2720} {"train_loss": -24.7030086517334, "global_step": 225782, "epoch": 2720} {"train_loss": -24.92464256286621, "global_step": 225783, "epoch": 2720} {"train_loss": -24.906591415405273, "global_step": 225784, "epoch": 2720} {"train_loss": -24.703821182250977, "global_step": 225785, "epoch": 2720} {"train_loss": -24.682462692260742, "global_step": 225786, "epoch": 2720} {"train_loss": -25.00160026550293, "global_step": 225787, "epoch": 2720} {"train_loss": -25.001110076904297, "global_step": 225788, "epoch": 2720} {"train_loss": -24.71823501586914, "global_step": 225789, "epoch": 2720} {"train_loss": -24.756412506103516, "global_step": 225790, "epoch": 2720} {"train_loss": -24.566293716430664, "global_step": 225791, "epoch": 2720} {"train_loss": -24.82640838623047, "global_step": 225792, "epoch": 2720} {"train_loss": -24.689916610717773, "global_step": 225793, "epoch": 2720} {"train_loss": -25.144433975219727, "global_step": 225794, "epoch": 2720} {"train_loss": -24.828716278076172, "global_step": 225795, "epoch": 2720} {"train_loss": -24.913297653198242, "global_step": 225796, "epoch": 2720} {"train_loss": -24.85084342956543, "global_step": 225797, "epoch": 2720} {"train_loss": -24.839767456054688, "global_step": 225798, "epoch": 2720} {"train_loss": -24.665260314941406, "global_step": 225799, "epoch": 2720} {"train_loss": -24.78407096862793, "global_step": 225800, "epoch": 2720} {"train_loss": -24.623746871948242, "global_step": 225801, "epoch": 2720} {"train_loss": -24.77457618713379, "global_step": 225802, "epoch": 2720} {"train_loss": -24.817779541015625, "global_step": 225803, "epoch": 2720} {"train_loss": -24.931398391723633, "global_step": 225804, "epoch": 2720} {"train_loss": -24.655942916870117, "global_step": 225805, "epoch": 2720} {"train_loss": -24.987857818603516, "global_step": 225806, "epoch": 2720} {"train_loss": -24.7586727142334, "global_step": 225807, "epoch": 2720} {"train_loss": -24.809682846069336, "global_step": 225808, "epoch": 2720} {"train_loss": -24.81355094909668, "global_step": 225809, "epoch": 2720} {"train_loss": -24.672088623046875, "global_step": 225810, "epoch": 2720} {"train_loss": -24.72491455078125, "global_step": 225811, "epoch": 2720} {"train_loss": -24.34406852722168, "global_step": 225812, "epoch": 2720} {"train_loss": -24.600875854492188, "global_step": 225813, "epoch": 2720} {"train_loss": -24.960861206054688, "global_step": 225814, "epoch": 2720} {"train_loss": -24.484176635742188, "global_step": 225815, "epoch": 2720} {"train_loss": -24.740985870361328, "global_step": 225816, "epoch": 2720} {"train_loss": -24.758146286010742, "global_step": 225817, "epoch": 2720} {"train_loss": -24.50223159790039, "global_step": 225818, "epoch": 2720} {"train_loss": -24.686939239501953, "global_step": 225819, "epoch": 2720} {"train_loss": -24.83194923400879, "global_step": 225820, "epoch": 2720} {"train_loss": -24.513818740844727, "global_step": 225821, "epoch": 2720} {"train_loss": -23.977590560913086, "global_step": 225822, "epoch": 2720} {"train_loss": -23.22629165649414, "global_step": 225823, "epoch": 2720} {"train_loss": -23.361082077026367, "global_step": 225824, "epoch": 2720} {"train_loss": -24.785566329956055, "global_step": 225825, "epoch": 2720} {"train_loss": -23.6096134185791, "global_step": 225826, "epoch": 2720} {"train_loss": -24.07941436767578, "global_step": 225827, "epoch": 2720} {"train_loss": -24.164337158203125, "global_step": 225828, "epoch": 2720} {"train_loss": -24.732486724853516, "global_step": 225829, "epoch": 2720} {"train_loss": -24.435026168823242, "global_step": 225830, "epoch": 2720} {"train_loss": -24.606443405151367, "global_step": 225831, "epoch": 2720} {"train_loss": -24.22711181640625, "global_step": 225832, "epoch": 2720} {"train_loss": -24.34920883178711, "global_step": 225833, "epoch": 2720} {"train_loss": -24.31953239440918, "global_step": 225834, "epoch": 2720} {"train_loss": -24.316368103027344, "global_step": 225835, "epoch": 2720} {"train_loss": -24.33884048461914, "global_step": 225836, "epoch": 2720} {"train_loss": -24.407695770263672, "global_step": 225837, "epoch": 2720} {"train_loss": -24.551834106445312, "global_step": 225838, "epoch": 2720} {"train_loss": -24.73505973815918, "global_step": 225839, "epoch": 2720} {"train_loss": -24.428068161010742, "global_step": 225840, "epoch": 2720} {"train_loss": -24.428709030151367, "global_step": 225841, "epoch": 2720} {"train_loss": -24.560653043080524, "global_step": 225842, "epoch": 2720, "val_loss": 6625659.0} {"train_loss": -24.052093505859375, "global_step": 225843, "epoch": 2721} {"train_loss": -24.288360595703125, "global_step": 225844, "epoch": 2721} {"train_loss": -24.425552368164062, "global_step": 225845, "epoch": 2721} {"train_loss": -24.070608139038086, "global_step": 225846, "epoch": 2721} {"train_loss": -24.5581111907959, "global_step": 225847, "epoch": 2721} {"train_loss": -24.360044479370117, "global_step": 225848, "epoch": 2721} {"train_loss": -24.290769577026367, "global_step": 225849, "epoch": 2721} {"train_loss": -24.38873863220215, "global_step": 225850, "epoch": 2721} {"train_loss": -23.95293617248535, "global_step": 225851, "epoch": 2721} {"train_loss": -24.559120178222656, "global_step": 225852, "epoch": 2721} {"train_loss": -24.54759979248047, "global_step": 225853, "epoch": 2721} {"train_loss": -24.271926879882812, "global_step": 225854, "epoch": 2721} {"train_loss": -24.62306022644043, "global_step": 225855, "epoch": 2721} {"train_loss": -24.560462951660156, "global_step": 225856, "epoch": 2721} {"train_loss": -24.51389503479004, "global_step": 225857, "epoch": 2721} {"train_loss": -24.828214645385742, "global_step": 225858, "epoch": 2721} {"train_loss": -24.780500411987305, "global_step": 225859, "epoch": 2721} {"train_loss": -24.117219924926758, "global_step": 225860, "epoch": 2721} {"train_loss": -24.577848434448242, "global_step": 225861, "epoch": 2721} {"train_loss": -24.615310668945312, "global_step": 225862, "epoch": 2721} {"train_loss": -24.251493453979492, "global_step": 225863, "epoch": 2721} {"train_loss": -24.463699340820312, "global_step": 225864, "epoch": 2721} {"train_loss": -24.73740005493164, "global_step": 225865, "epoch": 2721} {"train_loss": -24.201414108276367, "global_step": 225866, "epoch": 2721} {"train_loss": -25.105207443237305, "global_step": 225867, "epoch": 2721} {"train_loss": -24.240806579589844, "global_step": 225868, "epoch": 2721} {"train_loss": -24.765613555908203, "global_step": 225869, "epoch": 2721} {"train_loss": -24.6528263092041, "global_step": 225870, "epoch": 2721} {"train_loss": -24.349027633666992, "global_step": 225871, "epoch": 2721} {"train_loss": -24.5915470123291, "global_step": 225872, "epoch": 2721} {"train_loss": -24.5341854095459, "global_step": 225873, "epoch": 2721} {"train_loss": -24.796634674072266, "global_step": 225874, "epoch": 2721} {"train_loss": -24.661039352416992, "global_step": 225875, "epoch": 2721} {"train_loss": -24.70582389831543, "global_step": 225876, "epoch": 2721} {"train_loss": -24.896432876586914, "global_step": 225877, "epoch": 2721} {"train_loss": -24.619037628173828, "global_step": 225878, "epoch": 2721} {"train_loss": -24.930248260498047, "global_step": 225879, "epoch": 2721} {"train_loss": -25.04017448425293, "global_step": 225880, "epoch": 2721} {"train_loss": -24.71731948852539, "global_step": 225881, "epoch": 2721} {"train_loss": -24.810047149658203, "global_step": 225882, "epoch": 2721} {"train_loss": -24.82013702392578, "global_step": 225883, "epoch": 2721} {"train_loss": -24.72813606262207, "global_step": 225884, "epoch": 2721} {"train_loss": -24.415082931518555, "global_step": 225885, "epoch": 2721} {"train_loss": -24.653417587280273, "global_step": 225886, "epoch": 2721} {"train_loss": -24.588186264038086, "global_step": 225887, "epoch": 2721} {"train_loss": -24.673988342285156, "global_step": 225888, "epoch": 2721} {"train_loss": -24.23256492614746, "global_step": 225889, "epoch": 2721} {"train_loss": -24.702817916870117, "global_step": 225890, "epoch": 2721} {"train_loss": -25.03969383239746, "global_step": 225891, "epoch": 2721} {"train_loss": -24.395322799682617, "global_step": 225892, "epoch": 2721} {"train_loss": -24.40524673461914, "global_step": 225893, "epoch": 2721} {"train_loss": -24.535892486572266, "global_step": 225894, "epoch": 2721} {"train_loss": -24.49513816833496, "global_step": 225895, "epoch": 2721} {"train_loss": -24.70309829711914, "global_step": 225896, "epoch": 2721} {"train_loss": -24.30714225769043, "global_step": 225897, "epoch": 2721} {"train_loss": -24.642234802246094, "global_step": 225898, "epoch": 2721} {"train_loss": -24.74060821533203, "global_step": 225899, "epoch": 2721} {"train_loss": -24.841032028198242, "global_step": 225900, "epoch": 2721} {"train_loss": -24.43232536315918, "global_step": 225901, "epoch": 2721} {"train_loss": -24.51333236694336, "global_step": 225902, "epoch": 2721} {"train_loss": -24.72232437133789, "global_step": 225903, "epoch": 2721} {"train_loss": -24.409862518310547, "global_step": 225904, "epoch": 2721} {"train_loss": -24.815458297729492, "global_step": 225905, "epoch": 2721} {"train_loss": -25.175052642822266, "global_step": 225906, "epoch": 2721} {"train_loss": -24.540979385375977, "global_step": 225907, "epoch": 2721} {"train_loss": -24.659061431884766, "global_step": 225908, "epoch": 2721} {"train_loss": -24.576078414916992, "global_step": 225909, "epoch": 2721} {"train_loss": -24.7092342376709, "global_step": 225910, "epoch": 2721} {"train_loss": -25.13907241821289, "global_step": 225911, "epoch": 2721} {"train_loss": -24.47629737854004, "global_step": 225912, "epoch": 2721} {"train_loss": -24.797874450683594, "global_step": 225913, "epoch": 2721} {"train_loss": -24.981643676757812, "global_step": 225914, "epoch": 2721} {"train_loss": -24.761280059814453, "global_step": 225915, "epoch": 2721} {"train_loss": -24.77332878112793, "global_step": 225916, "epoch": 2721} {"train_loss": -25.070945739746094, "global_step": 225917, "epoch": 2721} {"train_loss": -24.87690544128418, "global_step": 225918, "epoch": 2721} {"train_loss": -24.887216567993164, "global_step": 225919, "epoch": 2721} {"train_loss": -24.852933883666992, "global_step": 225920, "epoch": 2721} {"train_loss": -24.482255935668945, "global_step": 225921, "epoch": 2721} {"train_loss": -24.566442489624023, "global_step": 225922, "epoch": 2721} {"train_loss": -24.733642578125, "global_step": 225923, "epoch": 2721} {"train_loss": -24.385883331298828, "global_step": 225924, "epoch": 2721} {"train_loss": -24.594407483755823, "global_step": 225925, "epoch": 2721, "val_loss": 6719539.0} {"train_loss": -23.669403076171875, "global_step": 225926, "epoch": 2722} {"train_loss": -23.58863639831543, "global_step": 225927, "epoch": 2722} {"train_loss": -24.35302734375, "global_step": 225928, "epoch": 2722} {"train_loss": -23.93052864074707, "global_step": 225929, "epoch": 2722} {"train_loss": -24.734556198120117, "global_step": 225930, "epoch": 2722} {"train_loss": -24.416027069091797, "global_step": 225931, "epoch": 2722} {"train_loss": -24.048664093017578, "global_step": 225932, "epoch": 2722} {"train_loss": -24.227354049682617, "global_step": 225933, "epoch": 2722} {"train_loss": -24.369861602783203, "global_step": 225934, "epoch": 2722} {"train_loss": -23.885562896728516, "global_step": 225935, "epoch": 2722} {"train_loss": -24.137516021728516, "global_step": 225936, "epoch": 2722} {"train_loss": -24.562284469604492, "global_step": 225937, "epoch": 2722} {"train_loss": -24.165590286254883, "global_step": 225938, "epoch": 2722} {"train_loss": -24.440465927124023, "global_step": 225939, "epoch": 2722} {"train_loss": -24.7426815032959, "global_step": 225940, "epoch": 2722} {"train_loss": -24.6903018951416, "global_step": 225941, "epoch": 2722} {"train_loss": -24.70491600036621, "global_step": 225942, "epoch": 2722} {"train_loss": -24.524351119995117, "global_step": 225943, "epoch": 2722} {"train_loss": -24.79934310913086, "global_step": 225944, "epoch": 2722} {"train_loss": -24.620939254760742, "global_step": 225945, "epoch": 2722} {"train_loss": -24.619876861572266, "global_step": 225946, "epoch": 2722} {"train_loss": -24.81965446472168, "global_step": 225947, "epoch": 2722} {"train_loss": -24.6734619140625, "global_step": 225948, "epoch": 2722} {"train_loss": -24.738706588745117, "global_step": 225949, "epoch": 2722} {"train_loss": -24.40667152404785, "global_step": 225950, "epoch": 2722} {"train_loss": -24.629863739013672, "global_step": 225951, "epoch": 2722} {"train_loss": -24.952484130859375, "global_step": 225952, "epoch": 2722} {"train_loss": -24.726911544799805, "global_step": 225953, "epoch": 2722} {"train_loss": -24.610090255737305, "global_step": 225954, "epoch": 2722} {"train_loss": -24.81673240661621, "global_step": 225955, "epoch": 2722} {"train_loss": -24.653732299804688, "global_step": 225956, "epoch": 2722} {"train_loss": -24.908353805541992, "global_step": 225957, "epoch": 2722} {"train_loss": -24.453041076660156, "global_step": 225958, "epoch": 2722} {"train_loss": -24.722713470458984, "global_step": 225959, "epoch": 2722} {"train_loss": -25.155200958251953, "global_step": 225960, "epoch": 2722} {"train_loss": -24.86614418029785, "global_step": 225961, "epoch": 2722} {"train_loss": -24.746475219726562, "global_step": 225962, "epoch": 2722} {"train_loss": -24.5445499420166, "global_step": 225963, "epoch": 2722} {"train_loss": -24.7651424407959, "global_step": 225964, "epoch": 2722} {"train_loss": -24.879547119140625, "global_step": 225965, "epoch": 2722} {"train_loss": -24.715747833251953, "global_step": 225966, "epoch": 2722} {"train_loss": -25.069223403930664, "global_step": 225967, "epoch": 2722} {"train_loss": -24.768142700195312, "global_step": 225968, "epoch": 2722} {"train_loss": -24.53345489501953, "global_step": 225969, "epoch": 2722} {"train_loss": -24.391691207885742, "global_step": 225970, "epoch": 2722} {"train_loss": -24.88276481628418, "global_step": 225971, "epoch": 2722} {"train_loss": -24.76265525817871, "global_step": 225972, "epoch": 2722} {"train_loss": -24.496679306030273, "global_step": 225973, "epoch": 2722} {"train_loss": -24.374303817749023, "global_step": 225974, "epoch": 2722} {"train_loss": -24.207839965820312, "global_step": 225975, "epoch": 2722} {"train_loss": -24.511075973510742, "global_step": 225976, "epoch": 2722} {"train_loss": -24.747243881225586, "global_step": 225977, "epoch": 2722} {"train_loss": -24.357664108276367, "global_step": 225978, "epoch": 2722} {"train_loss": -24.733871459960938, "global_step": 225979, "epoch": 2722} {"train_loss": -24.317665100097656, "global_step": 225980, "epoch": 2722} {"train_loss": -24.89193344116211, "global_step": 225981, "epoch": 2722} {"train_loss": -24.97222900390625, "global_step": 225982, "epoch": 2722} {"train_loss": -24.300048828125, "global_step": 225983, "epoch": 2722} {"train_loss": -24.91318130493164, "global_step": 225984, "epoch": 2722} {"train_loss": -24.424087524414062, "global_step": 225985, "epoch": 2722} {"train_loss": -24.50507354736328, "global_step": 225986, "epoch": 2722} {"train_loss": -24.722692489624023, "global_step": 225987, "epoch": 2722} {"train_loss": -24.85040283203125, "global_step": 225988, "epoch": 2722} {"train_loss": -24.661563873291016, "global_step": 225989, "epoch": 2722} {"train_loss": -24.92220687866211, "global_step": 225990, "epoch": 2722} {"train_loss": -24.562665939331055, "global_step": 225991, "epoch": 2722} {"train_loss": -24.8621768951416, "global_step": 225992, "epoch": 2722} {"train_loss": -24.74818229675293, "global_step": 225993, "epoch": 2722} {"train_loss": -24.676481246948242, "global_step": 225994, "epoch": 2722} {"train_loss": -24.94363784790039, "global_step": 225995, "epoch": 2722} {"train_loss": -24.87628936767578, "global_step": 225996, "epoch": 2722} {"train_loss": -24.12858009338379, "global_step": 225997, "epoch": 2722} {"train_loss": -24.43270492553711, "global_step": 225998, "epoch": 2722} {"train_loss": -24.62232780456543, "global_step": 225999, "epoch": 2722} {"train_loss": -24.533649444580078, "global_step": 226000, "epoch": 2722} {"train_loss": -24.868457794189453, "global_step": 226001, "epoch": 2722} {"train_loss": -24.91442108154297, "global_step": 226002, "epoch": 2722} {"train_loss": -24.85304069519043, "global_step": 226003, "epoch": 2722} {"train_loss": -24.6437931060791, "global_step": 226004, "epoch": 2722} {"train_loss": -24.918161392211914, "global_step": 226005, "epoch": 2722} {"train_loss": -24.727706909179688, "global_step": 226006, "epoch": 2722} {"train_loss": -24.774417877197266, "global_step": 226007, "epoch": 2722} {"train_loss": -24.621178707444525, "global_step": 226008, "epoch": 2722, "val_loss": 6696108.0} {"train_loss": -24.43134880065918, "global_step": 226009, "epoch": 2723} {"train_loss": -24.242557525634766, "global_step": 226010, "epoch": 2723} {"train_loss": -24.065759658813477, "global_step": 226011, "epoch": 2723} {"train_loss": -24.71624183654785, "global_step": 226012, "epoch": 2723} {"train_loss": -24.822500228881836, "global_step": 226013, "epoch": 2723} {"train_loss": -24.197507858276367, "global_step": 226014, "epoch": 2723} {"train_loss": -23.93691062927246, "global_step": 226015, "epoch": 2723} {"train_loss": -24.415882110595703, "global_step": 226016, "epoch": 2723} {"train_loss": -24.2117977142334, "global_step": 226017, "epoch": 2723} {"train_loss": -24.37335205078125, "global_step": 226018, "epoch": 2723} {"train_loss": -24.379941940307617, "global_step": 226019, "epoch": 2723} {"train_loss": -24.114187240600586, "global_step": 226020, "epoch": 2723} {"train_loss": -24.17119789123535, "global_step": 226021, "epoch": 2723} {"train_loss": -24.296445846557617, "global_step": 226022, "epoch": 2723} {"train_loss": -24.1676025390625, "global_step": 226023, "epoch": 2723} {"train_loss": -24.26573944091797, "global_step": 226024, "epoch": 2723} {"train_loss": -24.321794509887695, "global_step": 226025, "epoch": 2723} {"train_loss": -24.269805908203125, "global_step": 226026, "epoch": 2723} {"train_loss": -24.82330894470215, "global_step": 226027, "epoch": 2723} {"train_loss": -24.2691593170166, "global_step": 226028, "epoch": 2723} {"train_loss": -24.70684814453125, "global_step": 226029, "epoch": 2723} {"train_loss": -24.469959259033203, "global_step": 226030, "epoch": 2723} {"train_loss": -24.175016403198242, "global_step": 226031, "epoch": 2723} {"train_loss": -24.99295997619629, "global_step": 226032, "epoch": 2723} {"train_loss": -24.714305877685547, "global_step": 226033, "epoch": 2723} {"train_loss": -24.47869873046875, "global_step": 226034, "epoch": 2723} {"train_loss": -24.426294326782227, "global_step": 226035, "epoch": 2723} {"train_loss": -24.713350296020508, "global_step": 226036, "epoch": 2723} {"train_loss": -24.482513427734375, "global_step": 226037, "epoch": 2723} {"train_loss": -24.570411682128906, "global_step": 226038, "epoch": 2723} {"train_loss": -24.89954948425293, "global_step": 226039, "epoch": 2723} {"train_loss": -24.60988426208496, "global_step": 226040, "epoch": 2723} {"train_loss": -24.556705474853516, "global_step": 226041, "epoch": 2723} {"train_loss": -24.718420028686523, "global_step": 226042, "epoch": 2723} {"train_loss": -24.666828155517578, "global_step": 226043, "epoch": 2723} {"train_loss": -24.803077697753906, "global_step": 226044, "epoch": 2723} {"train_loss": -25.21099853515625, "global_step": 226045, "epoch": 2723} {"train_loss": -24.665067672729492, "global_step": 226046, "epoch": 2723} {"train_loss": -24.502370834350586, "global_step": 226047, "epoch": 2723} {"train_loss": -24.78999900817871, "global_step": 226048, "epoch": 2723} {"train_loss": -24.57525634765625, "global_step": 226049, "epoch": 2723} {"train_loss": -24.910741806030273, "global_step": 226050, "epoch": 2723} {"train_loss": -24.824796676635742, "global_step": 226051, "epoch": 2723} {"train_loss": -25.073787689208984, "global_step": 226052, "epoch": 2723} {"train_loss": -24.6595458984375, "global_step": 226053, "epoch": 2723} {"train_loss": -24.388540267944336, "global_step": 226054, "epoch": 2723} {"train_loss": -24.837743759155273, "global_step": 226055, "epoch": 2723} {"train_loss": -24.76051902770996, "global_step": 226056, "epoch": 2723} {"train_loss": -24.94931411743164, "global_step": 226057, "epoch": 2723} {"train_loss": -24.693111419677734, "global_step": 226058, "epoch": 2723} {"train_loss": -24.7958984375, "global_step": 226059, "epoch": 2723} {"train_loss": -24.390857696533203, "global_step": 226060, "epoch": 2723} {"train_loss": -24.333181381225586, "global_step": 226061, "epoch": 2723} {"train_loss": -24.866262435913086, "global_step": 226062, "epoch": 2723} {"train_loss": -24.741567611694336, "global_step": 226063, "epoch": 2723} {"train_loss": -24.336631774902344, "global_step": 226064, "epoch": 2723} {"train_loss": -24.801422119140625, "global_step": 226065, "epoch": 2723} {"train_loss": -24.411941528320312, "global_step": 226066, "epoch": 2723} {"train_loss": -24.810562133789062, "global_step": 226067, "epoch": 2723} {"train_loss": -24.298248291015625, "global_step": 226068, "epoch": 2723} {"train_loss": -24.90467643737793, "global_step": 226069, "epoch": 2723} {"train_loss": -24.232446670532227, "global_step": 226070, "epoch": 2723} {"train_loss": -24.81129264831543, "global_step": 226071, "epoch": 2723} {"train_loss": -24.707782745361328, "global_step": 226072, "epoch": 2723} {"train_loss": -24.335147857666016, "global_step": 226073, "epoch": 2723} {"train_loss": -24.78278160095215, "global_step": 226074, "epoch": 2723} {"train_loss": -24.61893081665039, "global_step": 226075, "epoch": 2723} {"train_loss": -24.650962829589844, "global_step": 226076, "epoch": 2723} {"train_loss": -24.587345123291016, "global_step": 226077, "epoch": 2723} {"train_loss": -24.43043327331543, "global_step": 226078, "epoch": 2723} {"train_loss": -24.460800170898438, "global_step": 226079, "epoch": 2723} {"train_loss": -24.873754501342773, "global_step": 226080, "epoch": 2723} {"train_loss": -24.807409286499023, "global_step": 226081, "epoch": 2723} {"train_loss": -24.76262855529785, "global_step": 226082, "epoch": 2723} {"train_loss": -24.722930908203125, "global_step": 226083, "epoch": 2723} {"train_loss": -24.960432052612305, "global_step": 226084, "epoch": 2723} {"train_loss": -24.771757125854492, "global_step": 226085, "epoch": 2723} {"train_loss": -24.618364334106445, "global_step": 226086, "epoch": 2723} {"train_loss": -24.61564064025879, "global_step": 226087, "epoch": 2723} {"train_loss": -24.87557029724121, "global_step": 226088, "epoch": 2723} {"train_loss": -24.687646865844727, "global_step": 226089, "epoch": 2723} {"train_loss": -24.806676864624023, "global_step": 226090, "epoch": 2723} {"train_loss": -24.58438765284527, "global_step": 226091, "epoch": 2723, "val_loss": 6666933.0} {"train_loss": -24.64160919189453, "global_step": 226092, "epoch": 2724} {"train_loss": -24.277257919311523, "global_step": 226093, "epoch": 2724} {"train_loss": -24.612672805786133, "global_step": 226094, "epoch": 2724} {"train_loss": -24.46695899963379, "global_step": 226095, "epoch": 2724} {"train_loss": -24.567785263061523, "global_step": 226096, "epoch": 2724} {"train_loss": -24.894943237304688, "global_step": 226097, "epoch": 2724} {"train_loss": -24.493925094604492, "global_step": 226098, "epoch": 2724} {"train_loss": -24.54547119140625, "global_step": 226099, "epoch": 2724} {"train_loss": -24.2487850189209, "global_step": 226100, "epoch": 2724} {"train_loss": -24.523162841796875, "global_step": 226101, "epoch": 2724} {"train_loss": -24.656904220581055, "global_step": 226102, "epoch": 2724} {"train_loss": -24.33616065979004, "global_step": 226103, "epoch": 2724} {"train_loss": -25.232088088989258, "global_step": 226104, "epoch": 2724} {"train_loss": -24.083234786987305, "global_step": 226105, "epoch": 2724} {"train_loss": -24.24545669555664, "global_step": 226106, "epoch": 2724} {"train_loss": -24.960636138916016, "global_step": 226107, "epoch": 2724} {"train_loss": -24.7121524810791, "global_step": 226108, "epoch": 2724} {"train_loss": -24.95306968688965, "global_step": 226109, "epoch": 2724} {"train_loss": -24.62042236328125, "global_step": 226110, "epoch": 2724} {"train_loss": -24.8067569732666, "global_step": 226111, "epoch": 2724} {"train_loss": -24.46785545349121, "global_step": 226112, "epoch": 2724} {"train_loss": -24.643613815307617, "global_step": 226113, "epoch": 2724} {"train_loss": -25.108318328857422, "global_step": 226114, "epoch": 2724} {"train_loss": -24.444154739379883, "global_step": 226115, "epoch": 2724} {"train_loss": -24.570880889892578, "global_step": 226116, "epoch": 2724} {"train_loss": -24.7435245513916, "global_step": 226117, "epoch": 2724} {"train_loss": -25.235570907592773, "global_step": 226118, "epoch": 2724} {"train_loss": -24.924551010131836, "global_step": 226119, "epoch": 2724} {"train_loss": -24.82490348815918, "global_step": 226120, "epoch": 2724} {"train_loss": -24.895721435546875, "global_step": 226121, "epoch": 2724} {"train_loss": -24.971485137939453, "global_step": 226122, "epoch": 2724} {"train_loss": -24.97499656677246, "global_step": 226123, "epoch": 2724} {"train_loss": -24.76220703125, "global_step": 226124, "epoch": 2724} {"train_loss": -25.152645111083984, "global_step": 226125, "epoch": 2724} {"train_loss": -24.694318771362305, "global_step": 226126, "epoch": 2724} {"train_loss": -24.695877075195312, "global_step": 226127, "epoch": 2724} {"train_loss": -24.622573852539062, "global_step": 226128, "epoch": 2724} {"train_loss": -24.758811950683594, "global_step": 226129, "epoch": 2724} {"train_loss": -24.656919479370117, "global_step": 226130, "epoch": 2724} {"train_loss": -24.66090965270996, "global_step": 226131, "epoch": 2724} {"train_loss": -25.194805145263672, "global_step": 226132, "epoch": 2724} {"train_loss": -24.698230743408203, "global_step": 226133, "epoch": 2724} {"train_loss": -24.51959228515625, "global_step": 226134, "epoch": 2724} {"train_loss": -24.754825592041016, "global_step": 226135, "epoch": 2724} {"train_loss": -24.552820205688477, "global_step": 226136, "epoch": 2724} {"train_loss": -24.624183654785156, "global_step": 226137, "epoch": 2724} {"train_loss": -24.52520179748535, "global_step": 226138, "epoch": 2724} {"train_loss": -24.624624252319336, "global_step": 226139, "epoch": 2724} {"train_loss": -24.872854232788086, "global_step": 226140, "epoch": 2724} {"train_loss": -24.629697799682617, "global_step": 226141, "epoch": 2724} {"train_loss": -24.94540023803711, "global_step": 226142, "epoch": 2724} {"train_loss": -24.54554557800293, "global_step": 226143, "epoch": 2724} {"train_loss": -24.779874801635742, "global_step": 226144, "epoch": 2724} {"train_loss": -24.68158531188965, "global_step": 226145, "epoch": 2724} {"train_loss": -24.647891998291016, "global_step": 226146, "epoch": 2724} {"train_loss": -24.59207534790039, "global_step": 226147, "epoch": 2724} {"train_loss": -24.535818099975586, "global_step": 226148, "epoch": 2724} {"train_loss": -24.79030418395996, "global_step": 226149, "epoch": 2724} {"train_loss": -24.5727481842041, "global_step": 226150, "epoch": 2724} {"train_loss": -24.80604362487793, "global_step": 226151, "epoch": 2724} {"train_loss": -24.929929733276367, "global_step": 226152, "epoch": 2724} {"train_loss": -24.309452056884766, "global_step": 226153, "epoch": 2724} {"train_loss": -24.511343002319336, "global_step": 226154, "epoch": 2724} {"train_loss": -24.463411331176758, "global_step": 226155, "epoch": 2724} {"train_loss": -24.86224365234375, "global_step": 226156, "epoch": 2724} {"train_loss": -24.458892822265625, "global_step": 226157, "epoch": 2724} {"train_loss": -24.754100799560547, "global_step": 226158, "epoch": 2724} {"train_loss": -24.42902946472168, "global_step": 226159, "epoch": 2724} {"train_loss": -24.476648330688477, "global_step": 226160, "epoch": 2724} {"train_loss": -24.368671417236328, "global_step": 226161, "epoch": 2724} {"train_loss": -24.754913330078125, "global_step": 226162, "epoch": 2724} {"train_loss": -24.256118774414062, "global_step": 226163, "epoch": 2724} {"train_loss": -24.567373275756836, "global_step": 226164, "epoch": 2724} {"train_loss": -24.350250244140625, "global_step": 226165, "epoch": 2724} {"train_loss": -24.335893630981445, "global_step": 226166, "epoch": 2724} {"train_loss": -24.80341148376465, "global_step": 226167, "epoch": 2724} {"train_loss": -24.58669090270996, "global_step": 226168, "epoch": 2724} {"train_loss": -24.74946403503418, "global_step": 226169, "epoch": 2724} {"train_loss": -24.14884376525879, "global_step": 226170, "epoch": 2724} {"train_loss": -24.959087371826172, "global_step": 226171, "epoch": 2724} {"train_loss": -24.37651252746582, "global_step": 226172, "epoch": 2724} {"train_loss": -24.50693130493164, "global_step": 226173, "epoch": 2724} {"train_loss": -24.64853796901473, "global_step": 226174, "epoch": 2724, "val_loss": 6753269.0} {"train_loss": -24.468847274780273, "global_step": 226175, "epoch": 2725} {"train_loss": -24.052392959594727, "global_step": 226176, "epoch": 2725} {"train_loss": -23.580726623535156, "global_step": 226177, "epoch": 2725} {"train_loss": -24.598371505737305, "global_step": 226178, "epoch": 2725} {"train_loss": -24.20830726623535, "global_step": 226179, "epoch": 2725} {"train_loss": -24.529117584228516, "global_step": 226180, "epoch": 2725} {"train_loss": -24.30511474609375, "global_step": 226181, "epoch": 2725} {"train_loss": -23.96780776977539, "global_step": 226182, "epoch": 2725} {"train_loss": -24.60390281677246, "global_step": 226183, "epoch": 2725} {"train_loss": -24.105716705322266, "global_step": 226184, "epoch": 2725} {"train_loss": -24.007699966430664, "global_step": 226185, "epoch": 2725} {"train_loss": -24.99178123474121, "global_step": 226186, "epoch": 2725} {"train_loss": -24.51556968688965, "global_step": 226187, "epoch": 2725} {"train_loss": -24.37168312072754, "global_step": 226188, "epoch": 2725} {"train_loss": -24.711624145507812, "global_step": 226189, "epoch": 2725} {"train_loss": -24.579313278198242, "global_step": 226190, "epoch": 2725} {"train_loss": -24.872669219970703, "global_step": 226191, "epoch": 2725} {"train_loss": -24.875532150268555, "global_step": 226192, "epoch": 2725} {"train_loss": -24.541425704956055, "global_step": 226193, "epoch": 2725} {"train_loss": -25.05024528503418, "global_step": 226194, "epoch": 2725} {"train_loss": -24.839679718017578, "global_step": 226195, "epoch": 2725} {"train_loss": -24.425559997558594, "global_step": 226196, "epoch": 2725} {"train_loss": -24.697404861450195, "global_step": 226197, "epoch": 2725} {"train_loss": -24.615894317626953, "global_step": 226198, "epoch": 2725} {"train_loss": -24.503318786621094, "global_step": 226199, "epoch": 2725} {"train_loss": -24.57970428466797, "global_step": 226200, "epoch": 2725} {"train_loss": -24.54948616027832, "global_step": 226201, "epoch": 2725} {"train_loss": -24.441251754760742, "global_step": 226202, "epoch": 2725} {"train_loss": -24.454914093017578, "global_step": 226203, "epoch": 2725} {"train_loss": -24.6253719329834, "global_step": 226204, "epoch": 2725} {"train_loss": -24.732471466064453, "global_step": 226205, "epoch": 2725} {"train_loss": -24.47980308532715, "global_step": 226206, "epoch": 2725} {"train_loss": -24.601333618164062, "global_step": 226207, "epoch": 2725} {"train_loss": -24.72416114807129, "global_step": 226208, "epoch": 2725} {"train_loss": -24.79654312133789, "global_step": 226209, "epoch": 2725} {"train_loss": -24.7371883392334, "global_step": 226210, "epoch": 2725} {"train_loss": -24.8756103515625, "global_step": 226211, "epoch": 2725} {"train_loss": -24.651660919189453, "global_step": 226212, "epoch": 2725} {"train_loss": -24.52302360534668, "global_step": 226213, "epoch": 2725} {"train_loss": -24.55222511291504, "global_step": 226214, "epoch": 2725} {"train_loss": -24.332136154174805, "global_step": 226215, "epoch": 2725} {"train_loss": -25.16219139099121, "global_step": 226216, "epoch": 2725} {"train_loss": -24.557891845703125, "global_step": 226217, "epoch": 2725} {"train_loss": -24.442657470703125, "global_step": 226218, "epoch": 2725} {"train_loss": -24.33135986328125, "global_step": 226219, "epoch": 2725} {"train_loss": -24.313100814819336, "global_step": 226220, "epoch": 2725} {"train_loss": -24.915250778198242, "global_step": 226221, "epoch": 2725} {"train_loss": -24.36992835998535, "global_step": 226222, "epoch": 2725} {"train_loss": -24.699995040893555, "global_step": 226223, "epoch": 2725} {"train_loss": -24.841001510620117, "global_step": 226224, "epoch": 2725} {"train_loss": -24.356714248657227, "global_step": 226225, "epoch": 2725} {"train_loss": -24.4188289642334, "global_step": 226226, "epoch": 2725} {"train_loss": -24.875255584716797, "global_step": 226227, "epoch": 2725} {"train_loss": -24.495595932006836, "global_step": 226228, "epoch": 2725} {"train_loss": -24.806110382080078, "global_step": 226229, "epoch": 2725} {"train_loss": -24.44463348388672, "global_step": 226230, "epoch": 2725} {"train_loss": -24.93320655822754, "global_step": 226231, "epoch": 2725} {"train_loss": -24.589292526245117, "global_step": 226232, "epoch": 2725} {"train_loss": -24.346708297729492, "global_step": 226233, "epoch": 2725} {"train_loss": -24.512928009033203, "global_step": 226234, "epoch": 2725} {"train_loss": -25.084882736206055, "global_step": 226235, "epoch": 2725} {"train_loss": -24.610036849975586, "global_step": 226236, "epoch": 2725} {"train_loss": -24.897802352905273, "global_step": 226237, "epoch": 2725} {"train_loss": -24.83652687072754, "global_step": 226238, "epoch": 2725} {"train_loss": -24.769651412963867, "global_step": 226239, "epoch": 2725} {"train_loss": -24.800277709960938, "global_step": 226240, "epoch": 2725} {"train_loss": -25.139930725097656, "global_step": 226241, "epoch": 2725} {"train_loss": -24.47369956970215, "global_step": 226242, "epoch": 2725} {"train_loss": -24.749984741210938, "global_step": 226243, "epoch": 2725} {"train_loss": -24.63532066345215, "global_step": 226244, "epoch": 2725} {"train_loss": -24.75832176208496, "global_step": 226245, "epoch": 2725} {"train_loss": -24.749561309814453, "global_step": 226246, "epoch": 2725} {"train_loss": -24.949386596679688, "global_step": 226247, "epoch": 2725} {"train_loss": -24.838275909423828, "global_step": 226248, "epoch": 2725} {"train_loss": -25.057415008544922, "global_step": 226249, "epoch": 2725} {"train_loss": -24.8951416015625, "global_step": 226250, "epoch": 2725} {"train_loss": -24.543867111206055, "global_step": 226251, "epoch": 2725} {"train_loss": -25.130905151367188, "global_step": 226252, "epoch": 2725} {"train_loss": -24.77197265625, "global_step": 226253, "epoch": 2725} {"train_loss": -24.645715713500977, "global_step": 226254, "epoch": 2725} {"train_loss": -24.475738525390625, "global_step": 226255, "epoch": 2725} {"train_loss": -24.227230072021484, "global_step": 226256, "epoch": 2725} {"train_loss": -24.59312756090279, "global_step": 226257, "epoch": 2725, "val_loss": 6683158.0} {"train_loss": -21.036792755126953, "global_step": 226258, "epoch": 2726} {"train_loss": -21.922748565673828, "global_step": 226259, "epoch": 2726} {"train_loss": -23.014022827148438, "global_step": 226260, "epoch": 2726} {"train_loss": -22.677392959594727, "global_step": 226261, "epoch": 2726} {"train_loss": -23.203699111938477, "global_step": 226262, "epoch": 2726} {"train_loss": -23.7547550201416, "global_step": 226263, "epoch": 2726} {"train_loss": -22.558908462524414, "global_step": 226264, "epoch": 2726} {"train_loss": -23.98563575744629, "global_step": 226265, "epoch": 2726} {"train_loss": -23.594717025756836, "global_step": 226266, "epoch": 2726} {"train_loss": -23.289487838745117, "global_step": 226267, "epoch": 2726} {"train_loss": -23.546091079711914, "global_step": 226268, "epoch": 2726} {"train_loss": -23.832687377929688, "global_step": 226269, "epoch": 2726} {"train_loss": -23.680097579956055, "global_step": 226270, "epoch": 2726} {"train_loss": -23.819095611572266, "global_step": 226271, "epoch": 2726} {"train_loss": -23.840185165405273, "global_step": 226272, "epoch": 2726} {"train_loss": -23.739131927490234, "global_step": 226273, "epoch": 2726} {"train_loss": -24.166603088378906, "global_step": 226274, "epoch": 2726} {"train_loss": -23.839420318603516, "global_step": 226275, "epoch": 2726} {"train_loss": -23.923542022705078, "global_step": 226276, "epoch": 2726} {"train_loss": -23.976505279541016, "global_step": 226277, "epoch": 2726} {"train_loss": -23.914453506469727, "global_step": 226278, "epoch": 2726} {"train_loss": -23.934925079345703, "global_step": 226279, "epoch": 2726} {"train_loss": -23.804630279541016, "global_step": 226280, "epoch": 2726} {"train_loss": -23.902740478515625, "global_step": 226281, "epoch": 2726} {"train_loss": -24.118844985961914, "global_step": 226282, "epoch": 2726} {"train_loss": -24.189329147338867, "global_step": 226283, "epoch": 2726} {"train_loss": -24.356311798095703, "global_step": 226284, "epoch": 2726} {"train_loss": -24.3763370513916, "global_step": 226285, "epoch": 2726} {"train_loss": -24.373266220092773, "global_step": 226286, "epoch": 2726} {"train_loss": -24.419597625732422, "global_step": 226287, "epoch": 2726} {"train_loss": -24.11958885192871, "global_step": 226288, "epoch": 2726} {"train_loss": -24.257341384887695, "global_step": 226289, "epoch": 2726} {"train_loss": -24.43990707397461, "global_step": 226290, "epoch": 2726} {"train_loss": -24.049758911132812, "global_step": 226291, "epoch": 2726} {"train_loss": -24.618606567382812, "global_step": 226292, "epoch": 2726} {"train_loss": -24.330875396728516, "global_step": 226293, "epoch": 2726} {"train_loss": -24.558698654174805, "global_step": 226294, "epoch": 2726} {"train_loss": -24.499975204467773, "global_step": 226295, "epoch": 2726} {"train_loss": -24.303598403930664, "global_step": 226296, "epoch": 2726} {"train_loss": -24.567977905273438, "global_step": 226297, "epoch": 2726} {"train_loss": -24.340682983398438, "global_step": 226298, "epoch": 2726} {"train_loss": -24.850448608398438, "global_step": 226299, "epoch": 2726} {"train_loss": -24.587522506713867, "global_step": 226300, "epoch": 2726} {"train_loss": -24.436792373657227, "global_step": 226301, "epoch": 2726} {"train_loss": -24.45919418334961, "global_step": 226302, "epoch": 2726} {"train_loss": -24.611011505126953, "global_step": 226303, "epoch": 2726} {"train_loss": -24.514841079711914, "global_step": 226304, "epoch": 2726} {"train_loss": -24.625417709350586, "global_step": 226305, "epoch": 2726} {"train_loss": -24.778133392333984, "global_step": 226306, "epoch": 2726} {"train_loss": -24.698774337768555, "global_step": 226307, "epoch": 2726} {"train_loss": -24.57233428955078, "global_step": 226308, "epoch": 2726} {"train_loss": -25.253494262695312, "global_step": 226309, "epoch": 2726} {"train_loss": -24.324871063232422, "global_step": 226310, "epoch": 2726} {"train_loss": -24.282207489013672, "global_step": 226311, "epoch": 2726} {"train_loss": -24.4112491607666, "global_step": 226312, "epoch": 2726} {"train_loss": -24.647865295410156, "global_step": 226313, "epoch": 2726} {"train_loss": -24.4709415435791, "global_step": 226314, "epoch": 2726} {"train_loss": -24.77571678161621, "global_step": 226315, "epoch": 2726} {"train_loss": -24.511762619018555, "global_step": 226316, "epoch": 2726} {"train_loss": -24.745075225830078, "global_step": 226317, "epoch": 2726} {"train_loss": -24.651899337768555, "global_step": 226318, "epoch": 2726} {"train_loss": -24.72434425354004, "global_step": 226319, "epoch": 2726} {"train_loss": -24.53766441345215, "global_step": 226320, "epoch": 2726} {"train_loss": -24.810537338256836, "global_step": 226321, "epoch": 2726} {"train_loss": -25.004135131835938, "global_step": 226322, "epoch": 2726} {"train_loss": -24.416990280151367, "global_step": 226323, "epoch": 2726} {"train_loss": -24.63540267944336, "global_step": 226324, "epoch": 2726} {"train_loss": -25.094070434570312, "global_step": 226325, "epoch": 2726} {"train_loss": -24.96758460998535, "global_step": 226326, "epoch": 2726} {"train_loss": -24.56275177001953, "global_step": 226327, "epoch": 2726} {"train_loss": -24.913124084472656, "global_step": 226328, "epoch": 2726} {"train_loss": -25.167818069458008, "global_step": 226329, "epoch": 2726} {"train_loss": -25.00320816040039, "global_step": 226330, "epoch": 2726} {"train_loss": -24.736631393432617, "global_step": 226331, "epoch": 2726} {"train_loss": -24.364368438720703, "global_step": 226332, "epoch": 2726} {"train_loss": -24.96746826171875, "global_step": 226333, "epoch": 2726} {"train_loss": -24.853803634643555, "global_step": 226334, "epoch": 2726} {"train_loss": -24.797800064086914, "global_step": 226335, "epoch": 2726} {"train_loss": -24.83635711669922, "global_step": 226336, "epoch": 2726} {"train_loss": -25.031471252441406, "global_step": 226337, "epoch": 2726} {"train_loss": -24.500974655151367, "global_step": 226338, "epoch": 2726} {"train_loss": -25.099140167236328, "global_step": 226339, "epoch": 2726} {"train_loss": -24.279312846172285, "global_step": 226340, "epoch": 2726, "val_loss": 6718227.0} {"train_loss": -24.5493221282959, "global_step": 226341, "epoch": 2727} {"train_loss": -24.22188949584961, "global_step": 226342, "epoch": 2727} {"train_loss": -24.4311466217041, "global_step": 226343, "epoch": 2727} {"train_loss": -24.37866973876953, "global_step": 226344, "epoch": 2727} {"train_loss": -24.455942153930664, "global_step": 226345, "epoch": 2727} {"train_loss": -24.310348510742188, "global_step": 226346, "epoch": 2727} {"train_loss": -24.173625946044922, "global_step": 226347, "epoch": 2727} {"train_loss": -24.576763153076172, "global_step": 226348, "epoch": 2727} {"train_loss": -24.022268295288086, "global_step": 226349, "epoch": 2727} {"train_loss": -24.451866149902344, "global_step": 226350, "epoch": 2727} {"train_loss": -24.76626968383789, "global_step": 226351, "epoch": 2727} {"train_loss": -25.001625061035156, "global_step": 226352, "epoch": 2727} {"train_loss": -24.66714859008789, "global_step": 226353, "epoch": 2727} {"train_loss": -24.775686264038086, "global_step": 226354, "epoch": 2727} {"train_loss": -25.05031394958496, "global_step": 226355, "epoch": 2727} {"train_loss": -24.60707664489746, "global_step": 226356, "epoch": 2727} {"train_loss": -24.757816314697266, "global_step": 226357, "epoch": 2727} {"train_loss": -24.577688217163086, "global_step": 226358, "epoch": 2727} {"train_loss": -24.886377334594727, "global_step": 226359, "epoch": 2727} {"train_loss": -24.544225692749023, "global_step": 226360, "epoch": 2727} {"train_loss": -24.39026641845703, "global_step": 226361, "epoch": 2727} {"train_loss": -24.549097061157227, "global_step": 226362, "epoch": 2727} {"train_loss": -24.62632942199707, "global_step": 226363, "epoch": 2727} {"train_loss": -24.506925582885742, "global_step": 226364, "epoch": 2727} {"train_loss": -24.68861198425293, "global_step": 226365, "epoch": 2727} {"train_loss": -24.842302322387695, "global_step": 226366, "epoch": 2727} {"train_loss": -24.89231300354004, "global_step": 226367, "epoch": 2727} {"train_loss": -24.373558044433594, "global_step": 226368, "epoch": 2727} {"train_loss": -24.321971893310547, "global_step": 226369, "epoch": 2727} {"train_loss": -24.788768768310547, "global_step": 226370, "epoch": 2727} {"train_loss": -24.668540954589844, "global_step": 226371, "epoch": 2727} {"train_loss": -24.874799728393555, "global_step": 226372, "epoch": 2727} {"train_loss": -25.071521759033203, "global_step": 226373, "epoch": 2727} {"train_loss": -24.76207733154297, "global_step": 226374, "epoch": 2727} {"train_loss": -24.85085105895996, "global_step": 226375, "epoch": 2727} {"train_loss": -24.600309371948242, "global_step": 226376, "epoch": 2727} {"train_loss": -24.677186965942383, "global_step": 226377, "epoch": 2727} {"train_loss": -24.777420043945312, "global_step": 226378, "epoch": 2727} {"train_loss": -24.98148536682129, "global_step": 226379, "epoch": 2727} {"train_loss": -24.694730758666992, "global_step": 226380, "epoch": 2727} {"train_loss": -24.75161361694336, "global_step": 226381, "epoch": 2727} {"train_loss": -24.66316032409668, "global_step": 226382, "epoch": 2727} {"train_loss": -24.819704055786133, "global_step": 226383, "epoch": 2727} {"train_loss": -24.482458114624023, "global_step": 226384, "epoch": 2727} {"train_loss": -24.783126831054688, "global_step": 226385, "epoch": 2727} {"train_loss": -25.084125518798828, "global_step": 226386, "epoch": 2727} {"train_loss": -24.755414962768555, "global_step": 226387, "epoch": 2727} {"train_loss": -25.101110458374023, "global_step": 226388, "epoch": 2727} {"train_loss": -25.051599502563477, "global_step": 226389, "epoch": 2727} {"train_loss": -24.650360107421875, "global_step": 226390, "epoch": 2727} {"train_loss": -24.767988204956055, "global_step": 226391, "epoch": 2727} {"train_loss": -24.591697692871094, "global_step": 226392, "epoch": 2727} {"train_loss": -25.068227767944336, "global_step": 226393, "epoch": 2727} {"train_loss": -24.7891788482666, "global_step": 226394, "epoch": 2727} {"train_loss": -24.849210739135742, "global_step": 226395, "epoch": 2727} {"train_loss": -25.014266967773438, "global_step": 226396, "epoch": 2727} {"train_loss": -25.02225685119629, "global_step": 226397, "epoch": 2727} {"train_loss": -24.63389015197754, "global_step": 226398, "epoch": 2727} {"train_loss": -25.00020980834961, "global_step": 226399, "epoch": 2727} {"train_loss": -24.565519332885742, "global_step": 226400, "epoch": 2727} {"train_loss": -24.648468017578125, "global_step": 226401, "epoch": 2727} {"train_loss": -24.955387115478516, "global_step": 226402, "epoch": 2727} {"train_loss": -24.73488426208496, "global_step": 226403, "epoch": 2727} {"train_loss": -24.5484619140625, "global_step": 226404, "epoch": 2727} {"train_loss": -24.56110191345215, "global_step": 226405, "epoch": 2727} {"train_loss": -24.823915481567383, "global_step": 226406, "epoch": 2727} {"train_loss": -24.86219596862793, "global_step": 226407, "epoch": 2727} {"train_loss": -24.45689582824707, "global_step": 226408, "epoch": 2727} {"train_loss": -24.80885887145996, "global_step": 226409, "epoch": 2727} {"train_loss": -24.993276596069336, "global_step": 226410, "epoch": 2727} {"train_loss": -24.809253692626953, "global_step": 226411, "epoch": 2727} {"train_loss": -25.115476608276367, "global_step": 226412, "epoch": 2727} {"train_loss": -25.1414852142334, "global_step": 226413, "epoch": 2727} {"train_loss": -24.9332218170166, "global_step": 226414, "epoch": 2727} {"train_loss": -24.34758949279785, "global_step": 226415, "epoch": 2727} {"train_loss": -24.53343963623047, "global_step": 226416, "epoch": 2727} {"train_loss": -24.90048599243164, "global_step": 226417, "epoch": 2727} {"train_loss": -24.510038375854492, "global_step": 226418, "epoch": 2727} {"train_loss": -25.033432006835938, "global_step": 226419, "epoch": 2727} {"train_loss": -24.576696395874023, "global_step": 226420, "epoch": 2727} {"train_loss": -24.580921173095703, "global_step": 226421, "epoch": 2727} {"train_loss": -24.592870712280273, "global_step": 226422, "epoch": 2727} {"train_loss": -24.714442839105445, "global_step": 226423, "epoch": 2727, "val_loss": 6635436.0} {"train_loss": -23.590030670166016, "global_step": 226424, "epoch": 2728} {"train_loss": -23.554258346557617, "global_step": 226425, "epoch": 2728} {"train_loss": -24.350627899169922, "global_step": 226426, "epoch": 2728} {"train_loss": -24.272977828979492, "global_step": 226427, "epoch": 2728} {"train_loss": -24.1031551361084, "global_step": 226428, "epoch": 2728} {"train_loss": -23.95783805847168, "global_step": 226429, "epoch": 2728} {"train_loss": -24.159793853759766, "global_step": 226430, "epoch": 2728} {"train_loss": -24.462812423706055, "global_step": 226431, "epoch": 2728} {"train_loss": -24.352317810058594, "global_step": 226432, "epoch": 2728} {"train_loss": -24.514493942260742, "global_step": 226433, "epoch": 2728} {"train_loss": -24.26533317565918, "global_step": 226434, "epoch": 2728} {"train_loss": -24.365779876708984, "global_step": 226435, "epoch": 2728} {"train_loss": -24.344011306762695, "global_step": 226436, "epoch": 2728} {"train_loss": -24.413328170776367, "global_step": 226437, "epoch": 2728} {"train_loss": -24.54097557067871, "global_step": 226438, "epoch": 2728} {"train_loss": -24.49970817565918, "global_step": 226439, "epoch": 2728} {"train_loss": -24.374448776245117, "global_step": 226440, "epoch": 2728} {"train_loss": -24.446758270263672, "global_step": 226441, "epoch": 2728} {"train_loss": -24.614349365234375, "global_step": 226442, "epoch": 2728} {"train_loss": -24.61189079284668, "global_step": 226443, "epoch": 2728} {"train_loss": -24.675466537475586, "global_step": 226444, "epoch": 2728} {"train_loss": -24.689054489135742, "global_step": 226445, "epoch": 2728} {"train_loss": -24.39449119567871, "global_step": 226446, "epoch": 2728} {"train_loss": -24.545034408569336, "global_step": 226447, "epoch": 2728} {"train_loss": -24.2277774810791, "global_step": 226448, "epoch": 2728} {"train_loss": -24.836101531982422, "global_step": 226449, "epoch": 2728} {"train_loss": -24.28948402404785, "global_step": 226450, "epoch": 2728} {"train_loss": -24.555225372314453, "global_step": 226451, "epoch": 2728} {"train_loss": -24.781370162963867, "global_step": 226452, "epoch": 2728} {"train_loss": -24.626636505126953, "global_step": 226453, "epoch": 2728} {"train_loss": -24.879436492919922, "global_step": 226454, "epoch": 2728} {"train_loss": -24.68245506286621, "global_step": 226455, "epoch": 2728} {"train_loss": -24.946653366088867, "global_step": 226456, "epoch": 2728} {"train_loss": -24.395177841186523, "global_step": 226457, "epoch": 2728} {"train_loss": -24.785959243774414, "global_step": 226458, "epoch": 2728} {"train_loss": -24.616113662719727, "global_step": 226459, "epoch": 2728} {"train_loss": -24.6787109375, "global_step": 226460, "epoch": 2728} {"train_loss": -24.68230628967285, "global_step": 226461, "epoch": 2728} {"train_loss": -24.79400062561035, "global_step": 226462, "epoch": 2728} {"train_loss": -24.593124389648438, "global_step": 226463, "epoch": 2728} {"train_loss": -24.61528205871582, "global_step": 226464, "epoch": 2728} {"train_loss": -24.391796112060547, "global_step": 226465, "epoch": 2728} {"train_loss": -24.409788131713867, "global_step": 226466, "epoch": 2728} {"train_loss": -25.01157569885254, "global_step": 226467, "epoch": 2728} {"train_loss": -24.59634780883789, "global_step": 226468, "epoch": 2728} {"train_loss": -24.87909507751465, "global_step": 226469, "epoch": 2728} {"train_loss": -25.04170799255371, "global_step": 226470, "epoch": 2728} {"train_loss": -25.137699127197266, "global_step": 226471, "epoch": 2728} {"train_loss": -24.595619201660156, "global_step": 226472, "epoch": 2728} {"train_loss": -24.84245491027832, "global_step": 226473, "epoch": 2728} {"train_loss": -24.66338539123535, "global_step": 226474, "epoch": 2728} {"train_loss": -24.441238403320312, "global_step": 226475, "epoch": 2728} {"train_loss": -24.389286041259766, "global_step": 226476, "epoch": 2728} {"train_loss": -24.486637115478516, "global_step": 226477, "epoch": 2728} {"train_loss": -24.375507354736328, "global_step": 226478, "epoch": 2728} {"train_loss": -24.700422286987305, "global_step": 226479, "epoch": 2728} {"train_loss": -24.65097427368164, "global_step": 226480, "epoch": 2728} {"train_loss": -24.504392623901367, "global_step": 226481, "epoch": 2728} {"train_loss": -24.934720993041992, "global_step": 226482, "epoch": 2728} {"train_loss": -24.686023712158203, "global_step": 226483, "epoch": 2728} {"train_loss": -24.780912399291992, "global_step": 226484, "epoch": 2728} {"train_loss": -24.642169952392578, "global_step": 226485, "epoch": 2728} {"train_loss": -24.96683692932129, "global_step": 226486, "epoch": 2728} {"train_loss": -24.586811065673828, "global_step": 226487, "epoch": 2728} {"train_loss": -24.348535537719727, "global_step": 226488, "epoch": 2728} {"train_loss": -24.768030166625977, "global_step": 226489, "epoch": 2728} {"train_loss": -24.97926139831543, "global_step": 226490, "epoch": 2728} {"train_loss": -24.708425521850586, "global_step": 226491, "epoch": 2728} {"train_loss": -24.71151351928711, "global_step": 226492, "epoch": 2728} {"train_loss": -24.80841636657715, "global_step": 226493, "epoch": 2728} {"train_loss": -24.2479305267334, "global_step": 226494, "epoch": 2728} {"train_loss": -24.771026611328125, "global_step": 226495, "epoch": 2728} {"train_loss": -24.931079864501953, "global_step": 226496, "epoch": 2728} {"train_loss": -24.905893325805664, "global_step": 226497, "epoch": 2728} {"train_loss": -25.074085235595703, "global_step": 226498, "epoch": 2728} {"train_loss": -24.62972640991211, "global_step": 226499, "epoch": 2728} {"train_loss": -24.999094009399414, "global_step": 226500, "epoch": 2728} {"train_loss": -24.946317672729492, "global_step": 226501, "epoch": 2728} {"train_loss": -24.73451805114746, "global_step": 226502, "epoch": 2728} {"train_loss": -24.68737030029297, "global_step": 226503, "epoch": 2728} {"train_loss": -24.915515899658203, "global_step": 226504, "epoch": 2728} {"train_loss": -24.846643447875977, "global_step": 226505, "epoch": 2728} {"train_loss": -24.60408362423081, "global_step": 226506, "epoch": 2728, "val_loss": 6654574.5} {"train_loss": -24.104948043823242, "global_step": 226507, "epoch": 2729} {"train_loss": -24.391691207885742, "global_step": 226508, "epoch": 2729} {"train_loss": -24.431318283081055, "global_step": 226509, "epoch": 2729} {"train_loss": -24.127803802490234, "global_step": 226510, "epoch": 2729} {"train_loss": -24.32977867126465, "global_step": 226511, "epoch": 2729} {"train_loss": -24.408933639526367, "global_step": 226512, "epoch": 2729} {"train_loss": -24.195032119750977, "global_step": 226513, "epoch": 2729} {"train_loss": -24.171232223510742, "global_step": 226514, "epoch": 2729} {"train_loss": -24.433231353759766, "global_step": 226515, "epoch": 2729} {"train_loss": -24.52398681640625, "global_step": 226516, "epoch": 2729} {"train_loss": -24.570682525634766, "global_step": 226517, "epoch": 2729} {"train_loss": -24.14717674255371, "global_step": 226518, "epoch": 2729} {"train_loss": -24.56816291809082, "global_step": 226519, "epoch": 2729} {"train_loss": -24.660858154296875, "global_step": 226520, "epoch": 2729} {"train_loss": -24.621084213256836, "global_step": 226521, "epoch": 2729} {"train_loss": -24.411497116088867, "global_step": 226522, "epoch": 2729} {"train_loss": -24.809097290039062, "global_step": 226523, "epoch": 2729} {"train_loss": -24.295654296875, "global_step": 226524, "epoch": 2729} {"train_loss": -25.094797134399414, "global_step": 226525, "epoch": 2729} {"train_loss": -24.392742156982422, "global_step": 226526, "epoch": 2729} {"train_loss": -24.666860580444336, "global_step": 226527, "epoch": 2729} {"train_loss": -24.743432998657227, "global_step": 226528, "epoch": 2729} {"train_loss": -24.775110244750977, "global_step": 226529, "epoch": 2729} {"train_loss": -25.22753143310547, "global_step": 226530, "epoch": 2729} {"train_loss": -24.67620277404785, "global_step": 226531, "epoch": 2729} {"train_loss": -24.743438720703125, "global_step": 226532, "epoch": 2729} {"train_loss": -24.289306640625, "global_step": 226533, "epoch": 2729} {"train_loss": -24.8818416595459, "global_step": 226534, "epoch": 2729} {"train_loss": -24.68181610107422, "global_step": 226535, "epoch": 2729} {"train_loss": -24.411954879760742, "global_step": 226536, "epoch": 2729} {"train_loss": -24.536022186279297, "global_step": 226537, "epoch": 2729} {"train_loss": -24.830617904663086, "global_step": 226538, "epoch": 2729} {"train_loss": -24.577356338500977, "global_step": 226539, "epoch": 2729} {"train_loss": -24.372600555419922, "global_step": 226540, "epoch": 2729} {"train_loss": -24.86393165588379, "global_step": 226541, "epoch": 2729} {"train_loss": -24.73665428161621, "global_step": 226542, "epoch": 2729} {"train_loss": -24.843076705932617, "global_step": 226543, "epoch": 2729} {"train_loss": -24.818649291992188, "global_step": 226544, "epoch": 2729} {"train_loss": -24.586652755737305, "global_step": 226545, "epoch": 2729} {"train_loss": -25.076431274414062, "global_step": 226546, "epoch": 2729} {"train_loss": -24.583646774291992, "global_step": 226547, "epoch": 2729} {"train_loss": -25.05112648010254, "global_step": 226548, "epoch": 2729} {"train_loss": -25.20989418029785, "global_step": 226549, "epoch": 2729} {"train_loss": -24.570402145385742, "global_step": 226550, "epoch": 2729} {"train_loss": -24.74163246154785, "global_step": 226551, "epoch": 2729} {"train_loss": -25.019346237182617, "global_step": 226552, "epoch": 2729} {"train_loss": -24.552776336669922, "global_step": 226553, "epoch": 2729} {"train_loss": -24.560321807861328, "global_step": 226554, "epoch": 2729} {"train_loss": -24.541852951049805, "global_step": 226555, "epoch": 2729} {"train_loss": -24.742660522460938, "global_step": 226556, "epoch": 2729} {"train_loss": -24.750574111938477, "global_step": 226557, "epoch": 2729} {"train_loss": -25.117868423461914, "global_step": 226558, "epoch": 2729} {"train_loss": -24.584726333618164, "global_step": 226559, "epoch": 2729} {"train_loss": -24.654699325561523, "global_step": 226560, "epoch": 2729} {"train_loss": -25.0047664642334, "global_step": 226561, "epoch": 2729} {"train_loss": -24.60647964477539, "global_step": 226562, "epoch": 2729} {"train_loss": -25.0839900970459, "global_step": 226563, "epoch": 2729} {"train_loss": -24.403383255004883, "global_step": 226564, "epoch": 2729} {"train_loss": -24.342283248901367, "global_step": 226565, "epoch": 2729} {"train_loss": -24.449609756469727, "global_step": 226566, "epoch": 2729} {"train_loss": -24.29344940185547, "global_step": 226567, "epoch": 2729} {"train_loss": -24.968128204345703, "global_step": 226568, "epoch": 2729} {"train_loss": -24.536001205444336, "global_step": 226569, "epoch": 2729} {"train_loss": -24.54959487915039, "global_step": 226570, "epoch": 2729} {"train_loss": -24.828847885131836, "global_step": 226571, "epoch": 2729} {"train_loss": -24.4094181060791, "global_step": 226572, "epoch": 2729} {"train_loss": -24.3165283203125, "global_step": 226573, "epoch": 2729} {"train_loss": -24.697961807250977, "global_step": 226574, "epoch": 2729} {"train_loss": -24.877254486083984, "global_step": 226575, "epoch": 2729} {"train_loss": -24.926227569580078, "global_step": 226576, "epoch": 2729} {"train_loss": -24.662992477416992, "global_step": 226577, "epoch": 2729} {"train_loss": -24.850069046020508, "global_step": 226578, "epoch": 2729} {"train_loss": -24.879179000854492, "global_step": 226579, "epoch": 2729} {"train_loss": -24.564350128173828, "global_step": 226580, "epoch": 2729} {"train_loss": -24.57471466064453, "global_step": 226581, "epoch": 2729} {"train_loss": -24.66508674621582, "global_step": 226582, "epoch": 2729} {"train_loss": -24.668222427368164, "global_step": 226583, "epoch": 2729} {"train_loss": -24.74952507019043, "global_step": 226584, "epoch": 2729} {"train_loss": -24.629180908203125, "global_step": 226585, "epoch": 2729} {"train_loss": -24.557920455932617, "global_step": 226586, "epoch": 2729} {"train_loss": -24.67317008972168, "global_step": 226587, "epoch": 2729} {"train_loss": -24.854421615600586, "global_step": 226588, "epoch": 2729} {"train_loss": -24.63569926066571, "global_step": 226589, "epoch": 2729, "val_loss": 6854022.0} {"train_loss": -23.06927490234375, "global_step": 226590, "epoch": 2730} {"train_loss": -23.677377700805664, "global_step": 226591, "epoch": 2730} {"train_loss": -24.032028198242188, "global_step": 226592, "epoch": 2730} {"train_loss": -23.89290428161621, "global_step": 226593, "epoch": 2730} {"train_loss": -24.10835838317871, "global_step": 226594, "epoch": 2730} {"train_loss": -23.677717208862305, "global_step": 226595, "epoch": 2730} {"train_loss": -23.79804801940918, "global_step": 226596, "epoch": 2730} {"train_loss": -24.00680160522461, "global_step": 226597, "epoch": 2730} {"train_loss": -24.13028907775879, "global_step": 226598, "epoch": 2730} {"train_loss": -23.97623634338379, "global_step": 226599, "epoch": 2730} {"train_loss": -24.413503646850586, "global_step": 226600, "epoch": 2730} {"train_loss": -23.268962860107422, "global_step": 226601, "epoch": 2730} {"train_loss": -24.03911781311035, "global_step": 226602, "epoch": 2730} {"train_loss": -24.086416244506836, "global_step": 226603, "epoch": 2730} {"train_loss": -24.116605758666992, "global_step": 226604, "epoch": 2730} {"train_loss": -24.22491455078125, "global_step": 226605, "epoch": 2730} {"train_loss": -24.133209228515625, "global_step": 226606, "epoch": 2730} {"train_loss": -23.876867294311523, "global_step": 226607, "epoch": 2730} {"train_loss": -24.385568618774414, "global_step": 226608, "epoch": 2730} {"train_loss": -24.292200088500977, "global_step": 226609, "epoch": 2730} {"train_loss": -24.353302001953125, "global_step": 226610, "epoch": 2730} {"train_loss": -24.303146362304688, "global_step": 226611, "epoch": 2730} {"train_loss": -24.562559127807617, "global_step": 226612, "epoch": 2730} {"train_loss": -24.313182830810547, "global_step": 226613, "epoch": 2730} {"train_loss": -24.5839900970459, "global_step": 226614, "epoch": 2730} {"train_loss": -24.461584091186523, "global_step": 226615, "epoch": 2730} {"train_loss": -24.57233238220215, "global_step": 226616, "epoch": 2730} {"train_loss": -24.82332992553711, "global_step": 226617, "epoch": 2730} {"train_loss": -24.497724533081055, "global_step": 226618, "epoch": 2730} {"train_loss": -24.581892013549805, "global_step": 226619, "epoch": 2730} {"train_loss": -24.57179832458496, "global_step": 226620, "epoch": 2730} {"train_loss": -24.57291603088379, "global_step": 226621, "epoch": 2730} {"train_loss": -24.4522762298584, "global_step": 226622, "epoch": 2730} {"train_loss": -23.11781883239746, "global_step": 226623, "epoch": 2730} {"train_loss": -24.52910804748535, "global_step": 226624, "epoch": 2730} {"train_loss": -24.957483291625977, "global_step": 226625, "epoch": 2730} {"train_loss": -24.330076217651367, "global_step": 226626, "epoch": 2730} {"train_loss": -24.62531852722168, "global_step": 226627, "epoch": 2730} {"train_loss": -24.767715454101562, "global_step": 226628, "epoch": 2730} {"train_loss": -24.657739639282227, "global_step": 226629, "epoch": 2730} {"train_loss": -24.26634407043457, "global_step": 226630, "epoch": 2730} {"train_loss": -24.636327743530273, "global_step": 226631, "epoch": 2730} {"train_loss": -24.732681274414062, "global_step": 226632, "epoch": 2730} {"train_loss": -24.915979385375977, "global_step": 226633, "epoch": 2730} {"train_loss": -24.693893432617188, "global_step": 226634, "epoch": 2730} {"train_loss": -24.621877670288086, "global_step": 226635, "epoch": 2730} {"train_loss": -24.78524398803711, "global_step": 226636, "epoch": 2730} {"train_loss": -24.938581466674805, "global_step": 226637, "epoch": 2730} {"train_loss": -24.437753677368164, "global_step": 226638, "epoch": 2730} {"train_loss": -24.658735275268555, "global_step": 226639, "epoch": 2730} {"train_loss": -24.71394920349121, "global_step": 226640, "epoch": 2730} {"train_loss": -24.519262313842773, "global_step": 226641, "epoch": 2730} {"train_loss": -24.867502212524414, "global_step": 226642, "epoch": 2730} {"train_loss": -24.664199829101562, "global_step": 226643, "epoch": 2730} {"train_loss": -24.79977035522461, "global_step": 226644, "epoch": 2730} {"train_loss": -24.936067581176758, "global_step": 226645, "epoch": 2730} {"train_loss": -24.315561294555664, "global_step": 226646, "epoch": 2730} {"train_loss": -24.75605583190918, "global_step": 226647, "epoch": 2730} {"train_loss": -24.34627914428711, "global_step": 226648, "epoch": 2730} {"train_loss": -24.841171264648438, "global_step": 226649, "epoch": 2730} {"train_loss": -25.11360740661621, "global_step": 226650, "epoch": 2730} {"train_loss": -24.77792739868164, "global_step": 226651, "epoch": 2730} {"train_loss": -24.734174728393555, "global_step": 226652, "epoch": 2730} {"train_loss": -24.729949951171875, "global_step": 226653, "epoch": 2730} {"train_loss": -24.582813262939453, "global_step": 226654, "epoch": 2730} {"train_loss": -24.967924118041992, "global_step": 226655, "epoch": 2730} {"train_loss": -24.343034744262695, "global_step": 226656, "epoch": 2730} {"train_loss": -24.776018142700195, "global_step": 226657, "epoch": 2730} {"train_loss": -24.984525680541992, "global_step": 226658, "epoch": 2730} {"train_loss": -24.561880111694336, "global_step": 226659, "epoch": 2730} {"train_loss": -24.624650955200195, "global_step": 226660, "epoch": 2730} {"train_loss": -24.84488296508789, "global_step": 226661, "epoch": 2730} {"train_loss": -25.07802391052246, "global_step": 226662, "epoch": 2730} {"train_loss": -24.62774085998535, "global_step": 226663, "epoch": 2730} {"train_loss": -24.258289337158203, "global_step": 226664, "epoch": 2730} {"train_loss": -24.320667266845703, "global_step": 226665, "epoch": 2730} {"train_loss": -24.504491806030273, "global_step": 226666, "epoch": 2730} {"train_loss": -24.828943252563477, "global_step": 226667, "epoch": 2730} {"train_loss": -24.729389190673828, "global_step": 226668, "epoch": 2730} {"train_loss": -24.66823959350586, "global_step": 226669, "epoch": 2730} {"train_loss": -24.5518798828125, "global_step": 226670, "epoch": 2730} {"train_loss": -24.572355270385742, "global_step": 226671, "epoch": 2730} {"train_loss": -24.47686595227345, "global_step": 226672, "epoch": 2730, "val_loss": 6705908.0} {"train_loss": -23.097253799438477, "global_step": 226673, "epoch": 2731} {"train_loss": -23.79400634765625, "global_step": 226674, "epoch": 2731} {"train_loss": -23.48464012145996, "global_step": 226675, "epoch": 2731} {"train_loss": -23.653409957885742, "global_step": 226676, "epoch": 2731} {"train_loss": -24.109661102294922, "global_step": 226677, "epoch": 2731} {"train_loss": -23.424606323242188, "global_step": 226678, "epoch": 2731} {"train_loss": -24.28311538696289, "global_step": 226679, "epoch": 2731} {"train_loss": -23.972715377807617, "global_step": 226680, "epoch": 2731} {"train_loss": -24.189319610595703, "global_step": 226681, "epoch": 2731} {"train_loss": -23.51774787902832, "global_step": 226682, "epoch": 2731} {"train_loss": -23.656055450439453, "global_step": 226683, "epoch": 2731} {"train_loss": -24.388147354125977, "global_step": 226684, "epoch": 2731} {"train_loss": -24.147567749023438, "global_step": 226685, "epoch": 2731} {"train_loss": -23.640684127807617, "global_step": 226686, "epoch": 2731} {"train_loss": -24.170856475830078, "global_step": 226687, "epoch": 2731} {"train_loss": -24.10390281677246, "global_step": 226688, "epoch": 2731} {"train_loss": -24.191680908203125, "global_step": 226689, "epoch": 2731} {"train_loss": -24.398725509643555, "global_step": 226690, "epoch": 2731} {"train_loss": -24.195463180541992, "global_step": 226691, "epoch": 2731} {"train_loss": -24.288631439208984, "global_step": 226692, "epoch": 2731} {"train_loss": -24.296606063842773, "global_step": 226693, "epoch": 2731} {"train_loss": -24.174591064453125, "global_step": 226694, "epoch": 2731} {"train_loss": -24.393888473510742, "global_step": 226695, "epoch": 2731} {"train_loss": -24.352848052978516, "global_step": 226696, "epoch": 2731} {"train_loss": -24.237577438354492, "global_step": 226697, "epoch": 2731} {"train_loss": -24.690288543701172, "global_step": 226698, "epoch": 2731} {"train_loss": -24.511262893676758, "global_step": 226699, "epoch": 2731} {"train_loss": -24.337751388549805, "global_step": 226700, "epoch": 2731} {"train_loss": -24.53480339050293, "global_step": 226701, "epoch": 2731} {"train_loss": -24.472259521484375, "global_step": 226702, "epoch": 2731} {"train_loss": -24.716306686401367, "global_step": 226703, "epoch": 2731} {"train_loss": -24.357236862182617, "global_step": 226704, "epoch": 2731} {"train_loss": -24.592981338500977, "global_step": 226705, "epoch": 2731} {"train_loss": -24.90420913696289, "global_step": 226706, "epoch": 2731} {"train_loss": -24.969676971435547, "global_step": 226707, "epoch": 2731} {"train_loss": -24.89078140258789, "global_step": 226708, "epoch": 2731} {"train_loss": -24.77396583557129, "global_step": 226709, "epoch": 2731} {"train_loss": -24.85146713256836, "global_step": 226710, "epoch": 2731} {"train_loss": -24.778648376464844, "global_step": 226711, "epoch": 2731} {"train_loss": -24.645549774169922, "global_step": 226712, "epoch": 2731} {"train_loss": -24.81087303161621, "global_step": 226713, "epoch": 2731} {"train_loss": -24.527429580688477, "global_step": 226714, "epoch": 2731} {"train_loss": -24.920560836791992, "global_step": 226715, "epoch": 2731} {"train_loss": -24.652732849121094, "global_step": 226716, "epoch": 2731} {"train_loss": -24.602783203125, "global_step": 226717, "epoch": 2731} {"train_loss": -25.33930015563965, "global_step": 226718, "epoch": 2731} {"train_loss": -24.872312545776367, "global_step": 226719, "epoch": 2731} {"train_loss": -24.94292640686035, "global_step": 226720, "epoch": 2731} {"train_loss": -24.98115348815918, "global_step": 226721, "epoch": 2731} {"train_loss": -24.556058883666992, "global_step": 226722, "epoch": 2731} {"train_loss": -25.057090759277344, "global_step": 226723, "epoch": 2731} {"train_loss": -24.941104888916016, "global_step": 226724, "epoch": 2731} {"train_loss": -24.89911460876465, "global_step": 226725, "epoch": 2731} {"train_loss": -25.03240966796875, "global_step": 226726, "epoch": 2731} {"train_loss": -24.63836669921875, "global_step": 226727, "epoch": 2731} {"train_loss": -24.8330135345459, "global_step": 226728, "epoch": 2731} {"train_loss": -24.728984832763672, "global_step": 226729, "epoch": 2731} {"train_loss": -24.473243713378906, "global_step": 226730, "epoch": 2731} {"train_loss": -24.7607421875, "global_step": 226731, "epoch": 2731} {"train_loss": -24.575666427612305, "global_step": 226732, "epoch": 2731} {"train_loss": -24.331531524658203, "global_step": 226733, "epoch": 2731} {"train_loss": -24.93844223022461, "global_step": 226734, "epoch": 2731} {"train_loss": -24.659467697143555, "global_step": 226735, "epoch": 2731} {"train_loss": -24.55611228942871, "global_step": 226736, "epoch": 2731} {"train_loss": -24.94325065612793, "global_step": 226737, "epoch": 2731} {"train_loss": -24.78815269470215, "global_step": 226738, "epoch": 2731} {"train_loss": -25.098468780517578, "global_step": 226739, "epoch": 2731} {"train_loss": -24.8452205657959, "global_step": 226740, "epoch": 2731} {"train_loss": -24.501205444335938, "global_step": 226741, "epoch": 2731} {"train_loss": -24.541057586669922, "global_step": 226742, "epoch": 2731} {"train_loss": -24.658111572265625, "global_step": 226743, "epoch": 2731} {"train_loss": -24.477584838867188, "global_step": 226744, "epoch": 2731} {"train_loss": -25.08057975769043, "global_step": 226745, "epoch": 2731} {"train_loss": -24.843061447143555, "global_step": 226746, "epoch": 2731} {"train_loss": -24.845569610595703, "global_step": 226747, "epoch": 2731} {"train_loss": -24.538808822631836, "global_step": 226748, "epoch": 2731} {"train_loss": -25.017902374267578, "global_step": 226749, "epoch": 2731} {"train_loss": -24.487768173217773, "global_step": 226750, "epoch": 2731} {"train_loss": -24.490137100219727, "global_step": 226751, "epoch": 2731} {"train_loss": -24.567663192749023, "global_step": 226752, "epoch": 2731} {"train_loss": -24.900556564331055, "global_step": 226753, "epoch": 2731} {"train_loss": -24.501813888549805, "global_step": 226754, "epoch": 2731} {"train_loss": -24.510926051312182, "global_step": 226755, "epoch": 2731, "val_loss": 6753822.5} {"train_loss": -24.45505142211914, "global_step": 226756, "epoch": 2732} {"train_loss": -24.834531784057617, "global_step": 226757, "epoch": 2732} {"train_loss": -24.596418380737305, "global_step": 226758, "epoch": 2732} {"train_loss": -24.24094581604004, "global_step": 226759, "epoch": 2732} {"train_loss": -24.673208236694336, "global_step": 226760, "epoch": 2732} {"train_loss": -24.310089111328125, "global_step": 226761, "epoch": 2732} {"train_loss": -24.356943130493164, "global_step": 226762, "epoch": 2732} {"train_loss": -24.484500885009766, "global_step": 226763, "epoch": 2732} {"train_loss": -24.633930206298828, "global_step": 226764, "epoch": 2732} {"train_loss": -24.033334732055664, "global_step": 226765, "epoch": 2732} {"train_loss": -24.30958366394043, "global_step": 226766, "epoch": 2732} {"train_loss": -24.9637451171875, "global_step": 226767, "epoch": 2732} {"train_loss": -24.178752899169922, "global_step": 226768, "epoch": 2732} {"train_loss": -24.6805477142334, "global_step": 226769, "epoch": 2732} {"train_loss": -24.76288414001465, "global_step": 226770, "epoch": 2732} {"train_loss": -24.56694984436035, "global_step": 226771, "epoch": 2732} {"train_loss": -24.58748435974121, "global_step": 226772, "epoch": 2732} {"train_loss": -24.465503692626953, "global_step": 226773, "epoch": 2732} {"train_loss": -24.92120361328125, "global_step": 226774, "epoch": 2732} {"train_loss": -24.975177764892578, "global_step": 226775, "epoch": 2732} {"train_loss": -24.85700035095215, "global_step": 226776, "epoch": 2732} {"train_loss": -24.436994552612305, "global_step": 226777, "epoch": 2732} {"train_loss": -24.707265853881836, "global_step": 226778, "epoch": 2732} {"train_loss": -24.70160675048828, "global_step": 226779, "epoch": 2732} {"train_loss": -24.5273380279541, "global_step": 226780, "epoch": 2732} {"train_loss": -24.96971321105957, "global_step": 226781, "epoch": 2732} {"train_loss": -24.81028938293457, "global_step": 226782, "epoch": 2732} {"train_loss": -25.194869995117188, "global_step": 226783, "epoch": 2732} {"train_loss": -24.832937240600586, "global_step": 226784, "epoch": 2732} {"train_loss": -24.80436134338379, "global_step": 226785, "epoch": 2732} {"train_loss": -24.887027740478516, "global_step": 226786, "epoch": 2732} {"train_loss": -25.01405906677246, "global_step": 226787, "epoch": 2732} {"train_loss": -24.847959518432617, "global_step": 226788, "epoch": 2732} {"train_loss": -24.846704483032227, "global_step": 226789, "epoch": 2732} {"train_loss": -24.734468460083008, "global_step": 226790, "epoch": 2732} {"train_loss": -24.265104293823242, "global_step": 226791, "epoch": 2732} {"train_loss": -24.49651527404785, "global_step": 226792, "epoch": 2732} {"train_loss": -24.89723777770996, "global_step": 226793, "epoch": 2732} {"train_loss": -24.739912033081055, "global_step": 226794, "epoch": 2732} {"train_loss": -24.60181999206543, "global_step": 226795, "epoch": 2732} {"train_loss": -24.476871490478516, "global_step": 226796, "epoch": 2732} {"train_loss": -23.575246810913086, "global_step": 226797, "epoch": 2732} {"train_loss": -23.991811752319336, "global_step": 226798, "epoch": 2732} {"train_loss": -24.429283142089844, "global_step": 226799, "epoch": 2732} {"train_loss": -24.386295318603516, "global_step": 226800, "epoch": 2732} {"train_loss": -24.361040115356445, "global_step": 226801, "epoch": 2732} {"train_loss": -24.158777236938477, "global_step": 226802, "epoch": 2732} {"train_loss": -24.44631004333496, "global_step": 226803, "epoch": 2732} {"train_loss": -24.36748504638672, "global_step": 226804, "epoch": 2732} {"train_loss": -23.899715423583984, "global_step": 226805, "epoch": 2732} {"train_loss": -24.42891502380371, "global_step": 226806, "epoch": 2732} {"train_loss": -24.31639862060547, "global_step": 226807, "epoch": 2732} {"train_loss": -24.4486083984375, "global_step": 226808, "epoch": 2732} {"train_loss": -24.65821075439453, "global_step": 226809, "epoch": 2732} {"train_loss": -24.53560447692871, "global_step": 226810, "epoch": 2732} {"train_loss": -24.757658004760742, "global_step": 226811, "epoch": 2732} {"train_loss": -24.69215965270996, "global_step": 226812, "epoch": 2732} {"train_loss": -24.662734985351562, "global_step": 226813, "epoch": 2732} {"train_loss": -24.887744903564453, "global_step": 226814, "epoch": 2732} {"train_loss": -24.5759334564209, "global_step": 226815, "epoch": 2732} {"train_loss": -24.771665573120117, "global_step": 226816, "epoch": 2732} {"train_loss": -24.838695526123047, "global_step": 226817, "epoch": 2732} {"train_loss": -25.1491756439209, "global_step": 226818, "epoch": 2732} {"train_loss": -24.563718795776367, "global_step": 226819, "epoch": 2732} {"train_loss": -24.7574462890625, "global_step": 226820, "epoch": 2732} {"train_loss": -24.55466079711914, "global_step": 226821, "epoch": 2732} {"train_loss": -24.901580810546875, "global_step": 226822, "epoch": 2732} {"train_loss": -24.342939376831055, "global_step": 226823, "epoch": 2732} {"train_loss": -24.439918518066406, "global_step": 226824, "epoch": 2732} {"train_loss": -24.604097366333008, "global_step": 226825, "epoch": 2732} {"train_loss": -24.373937606811523, "global_step": 226826, "epoch": 2732} {"train_loss": -24.829071044921875, "global_step": 226827, "epoch": 2732} {"train_loss": -24.595216751098633, "global_step": 226828, "epoch": 2732} {"train_loss": -24.530593872070312, "global_step": 226829, "epoch": 2732} {"train_loss": -24.943613052368164, "global_step": 226830, "epoch": 2732} {"train_loss": -25.16886329650879, "global_step": 226831, "epoch": 2732} {"train_loss": -24.670507431030273, "global_step": 226832, "epoch": 2732} {"train_loss": -24.773000717163086, "global_step": 226833, "epoch": 2732} {"train_loss": -24.145597457885742, "global_step": 226834, "epoch": 2732} {"train_loss": -24.6718807220459, "global_step": 226835, "epoch": 2732} {"train_loss": -24.627363204956055, "global_step": 226836, "epoch": 2732} {"train_loss": -24.731435775756836, "global_step": 226837, "epoch": 2732} {"train_loss": -24.608109508652284, "global_step": 226838, "epoch": 2732, "val_loss": 6750634.0} {"train_loss": -24.04547119140625, "global_step": 226839, "epoch": 2733} {"train_loss": -24.23477554321289, "global_step": 226840, "epoch": 2733} {"train_loss": -24.716506958007812, "global_step": 226841, "epoch": 2733} {"train_loss": -24.3301944732666, "global_step": 226842, "epoch": 2733} {"train_loss": -24.347755432128906, "global_step": 226843, "epoch": 2733} {"train_loss": -24.200092315673828, "global_step": 226844, "epoch": 2733} {"train_loss": -24.151409149169922, "global_step": 226845, "epoch": 2733} {"train_loss": -23.969369888305664, "global_step": 226846, "epoch": 2733} {"train_loss": -24.5433406829834, "global_step": 226847, "epoch": 2733} {"train_loss": -23.738962173461914, "global_step": 226848, "epoch": 2733} {"train_loss": -24.352075576782227, "global_step": 226849, "epoch": 2733} {"train_loss": -24.169591903686523, "global_step": 226850, "epoch": 2733} {"train_loss": -24.618330001831055, "global_step": 226851, "epoch": 2733} {"train_loss": -24.031076431274414, "global_step": 226852, "epoch": 2733} {"train_loss": -24.142866134643555, "global_step": 226853, "epoch": 2733} {"train_loss": -24.36488914489746, "global_step": 226854, "epoch": 2733} {"train_loss": -24.298908233642578, "global_step": 226855, "epoch": 2733} {"train_loss": -24.648849487304688, "global_step": 226856, "epoch": 2733} {"train_loss": -24.68378448486328, "global_step": 226857, "epoch": 2733} {"train_loss": -24.587787628173828, "global_step": 226858, "epoch": 2733} {"train_loss": -24.515016555786133, "global_step": 226859, "epoch": 2733} {"train_loss": -24.171979904174805, "global_step": 226860, "epoch": 2733} {"train_loss": -24.822811126708984, "global_step": 226861, "epoch": 2733} {"train_loss": -24.415746688842773, "global_step": 226862, "epoch": 2733} {"train_loss": -24.21845054626465, "global_step": 226863, "epoch": 2733} {"train_loss": -24.774612426757812, "global_step": 226864, "epoch": 2733} {"train_loss": -24.495100021362305, "global_step": 226865, "epoch": 2733} {"train_loss": -24.35645866394043, "global_step": 226866, "epoch": 2733} {"train_loss": -24.631723403930664, "global_step": 226867, "epoch": 2733} {"train_loss": -24.5147647857666, "global_step": 226868, "epoch": 2733} {"train_loss": -24.55690574645996, "global_step": 226869, "epoch": 2733} {"train_loss": -24.184814453125, "global_step": 226870, "epoch": 2733} {"train_loss": -24.526885986328125, "global_step": 226871, "epoch": 2733} {"train_loss": -24.746755599975586, "global_step": 226872, "epoch": 2733} {"train_loss": -24.287023544311523, "global_step": 226873, "epoch": 2733} {"train_loss": -24.698637008666992, "global_step": 226874, "epoch": 2733} {"train_loss": -24.67205047607422, "global_step": 226875, "epoch": 2733} {"train_loss": -24.319278717041016, "global_step": 226876, "epoch": 2733} {"train_loss": -24.97361183166504, "global_step": 226877, "epoch": 2733} {"train_loss": -24.498943328857422, "global_step": 226878, "epoch": 2733} {"train_loss": -24.77862548828125, "global_step": 226879, "epoch": 2733} {"train_loss": -24.900590896606445, "global_step": 226880, "epoch": 2733} {"train_loss": -24.830961227416992, "global_step": 226881, "epoch": 2733} {"train_loss": -24.31561279296875, "global_step": 226882, "epoch": 2733} {"train_loss": -24.669713973999023, "global_step": 226883, "epoch": 2733} {"train_loss": -24.789203643798828, "global_step": 226884, "epoch": 2733} {"train_loss": -24.788732528686523, "global_step": 226885, "epoch": 2733} {"train_loss": -24.68555450439453, "global_step": 226886, "epoch": 2733} {"train_loss": -24.60696792602539, "global_step": 226887, "epoch": 2733} {"train_loss": -24.683303833007812, "global_step": 226888, "epoch": 2733} {"train_loss": -24.359277725219727, "global_step": 226889, "epoch": 2733} {"train_loss": -24.825210571289062, "global_step": 226890, "epoch": 2733} {"train_loss": -24.85041618347168, "global_step": 226891, "epoch": 2733} {"train_loss": -24.7830810546875, "global_step": 226892, "epoch": 2733} {"train_loss": -24.683242797851562, "global_step": 226893, "epoch": 2733} {"train_loss": -24.5689754486084, "global_step": 226894, "epoch": 2733} {"train_loss": -24.835004806518555, "global_step": 226895, "epoch": 2733} {"train_loss": -24.838703155517578, "global_step": 226896, "epoch": 2733} {"train_loss": -24.71430206298828, "global_step": 226897, "epoch": 2733} {"train_loss": -24.67964744567871, "global_step": 226898, "epoch": 2733} {"train_loss": -24.644268035888672, "global_step": 226899, "epoch": 2733} {"train_loss": -24.529220581054688, "global_step": 226900, "epoch": 2733} {"train_loss": -24.458200454711914, "global_step": 226901, "epoch": 2733} {"train_loss": -24.715124130249023, "global_step": 226902, "epoch": 2733} {"train_loss": -24.599876403808594, "global_step": 226903, "epoch": 2733} {"train_loss": -24.800046920776367, "global_step": 226904, "epoch": 2733} {"train_loss": -24.782785415649414, "global_step": 226905, "epoch": 2733} {"train_loss": -24.719820022583008, "global_step": 226906, "epoch": 2733} {"train_loss": -24.705848693847656, "global_step": 226907, "epoch": 2733} {"train_loss": -24.876373291015625, "global_step": 226908, "epoch": 2733} {"train_loss": -24.78132438659668, "global_step": 226909, "epoch": 2733} {"train_loss": -24.626821517944336, "global_step": 226910, "epoch": 2733} {"train_loss": -24.63324546813965, "global_step": 226911, "epoch": 2733} {"train_loss": -24.78749656677246, "global_step": 226912, "epoch": 2733} {"train_loss": -24.537919998168945, "global_step": 226913, "epoch": 2733} {"train_loss": -25.07696533203125, "global_step": 226914, "epoch": 2733} {"train_loss": -25.03546905517578, "global_step": 226915, "epoch": 2733} {"train_loss": -24.535776138305664, "global_step": 226916, "epoch": 2733} {"train_loss": -24.984548568725586, "global_step": 226917, "epoch": 2733} {"train_loss": -24.876562118530273, "global_step": 226918, "epoch": 2733} {"train_loss": -24.8366756439209, "global_step": 226919, "epoch": 2733} {"train_loss": -24.895328521728516, "global_step": 226920, "epoch": 2733} {"train_loss": -24.590366662266742, "global_step": 226921, "epoch": 2733, "val_loss": 6747761.5} {"train_loss": -23.2117862701416, "global_step": 226922, "epoch": 2734} {"train_loss": -24.149682998657227, "global_step": 226923, "epoch": 2734} {"train_loss": -23.47132682800293, "global_step": 226924, "epoch": 2734} {"train_loss": -23.657222747802734, "global_step": 226925, "epoch": 2734} {"train_loss": -23.471399307250977, "global_step": 226926, "epoch": 2734} {"train_loss": -23.565214157104492, "global_step": 226927, "epoch": 2734} {"train_loss": -23.94589614868164, "global_step": 226928, "epoch": 2734} {"train_loss": -23.436826705932617, "global_step": 226929, "epoch": 2734} {"train_loss": -24.003454208374023, "global_step": 226930, "epoch": 2734} {"train_loss": -23.69346046447754, "global_step": 226931, "epoch": 2734} {"train_loss": -23.57891845703125, "global_step": 226932, "epoch": 2734} {"train_loss": -23.89544105529785, "global_step": 226933, "epoch": 2734} {"train_loss": -23.77179527282715, "global_step": 226934, "epoch": 2734} {"train_loss": -24.0914363861084, "global_step": 226935, "epoch": 2734} {"train_loss": -24.165996551513672, "global_step": 226936, "epoch": 2734} {"train_loss": -24.3095645904541, "global_step": 226937, "epoch": 2734} {"train_loss": -24.510175704956055, "global_step": 226938, "epoch": 2734} {"train_loss": -24.219369888305664, "global_step": 226939, "epoch": 2734} {"train_loss": -24.329769134521484, "global_step": 226940, "epoch": 2734} {"train_loss": -24.279783248901367, "global_step": 226941, "epoch": 2734} {"train_loss": -24.15023422241211, "global_step": 226942, "epoch": 2734} {"train_loss": -24.483800888061523, "global_step": 226943, "epoch": 2734} {"train_loss": -24.427824020385742, "global_step": 226944, "epoch": 2734} {"train_loss": -24.44394874572754, "global_step": 226945, "epoch": 2734} {"train_loss": -24.11353874206543, "global_step": 226946, "epoch": 2734} {"train_loss": -24.26291847229004, "global_step": 226947, "epoch": 2734} {"train_loss": -24.47842025756836, "global_step": 226948, "epoch": 2734} {"train_loss": -24.584274291992188, "global_step": 226949, "epoch": 2734} {"train_loss": -24.801008224487305, "global_step": 226950, "epoch": 2734} {"train_loss": -24.73117446899414, "global_step": 226951, "epoch": 2734} {"train_loss": -24.453222274780273, "global_step": 226952, "epoch": 2734} {"train_loss": -24.430164337158203, "global_step": 226953, "epoch": 2734} {"train_loss": -24.637332916259766, "global_step": 226954, "epoch": 2734} {"train_loss": -24.918039321899414, "global_step": 226955, "epoch": 2734} {"train_loss": -24.402408599853516, "global_step": 226956, "epoch": 2734} {"train_loss": -24.641101837158203, "global_step": 226957, "epoch": 2734} {"train_loss": -24.847949981689453, "global_step": 226958, "epoch": 2734} {"train_loss": -24.6718692779541, "global_step": 226959, "epoch": 2734} {"train_loss": -24.698034286499023, "global_step": 226960, "epoch": 2734} {"train_loss": -24.423629760742188, "global_step": 226961, "epoch": 2734} {"train_loss": -24.595884323120117, "global_step": 226962, "epoch": 2734} {"train_loss": -24.522140502929688, "global_step": 226963, "epoch": 2734} {"train_loss": -24.635793685913086, "global_step": 226964, "epoch": 2734} {"train_loss": -24.523761749267578, "global_step": 226965, "epoch": 2734} {"train_loss": -24.71912956237793, "global_step": 226966, "epoch": 2734} {"train_loss": -24.520666122436523, "global_step": 226967, "epoch": 2734} {"train_loss": -24.558317184448242, "global_step": 226968, "epoch": 2734} {"train_loss": -24.73018455505371, "global_step": 226969, "epoch": 2734} {"train_loss": -24.537769317626953, "global_step": 226970, "epoch": 2734} {"train_loss": -24.602760314941406, "global_step": 226971, "epoch": 2734} {"train_loss": -24.71103858947754, "global_step": 226972, "epoch": 2734} {"train_loss": -24.612211227416992, "global_step": 226973, "epoch": 2734} {"train_loss": -24.365732192993164, "global_step": 226974, "epoch": 2734} {"train_loss": -24.664844512939453, "global_step": 226975, "epoch": 2734} {"train_loss": -24.707014083862305, "global_step": 226976, "epoch": 2734} {"train_loss": -24.424604415893555, "global_step": 226977, "epoch": 2734} {"train_loss": -24.832815170288086, "global_step": 226978, "epoch": 2734} {"train_loss": -24.307186126708984, "global_step": 226979, "epoch": 2734} {"train_loss": -24.72320556640625, "global_step": 226980, "epoch": 2734} {"train_loss": -24.900876998901367, "global_step": 226981, "epoch": 2734} {"train_loss": -24.37813377380371, "global_step": 226982, "epoch": 2734} {"train_loss": -24.797948837280273, "global_step": 226983, "epoch": 2734} {"train_loss": -24.725250244140625, "global_step": 226984, "epoch": 2734} {"train_loss": -24.653051376342773, "global_step": 226985, "epoch": 2734} {"train_loss": -24.277639389038086, "global_step": 226986, "epoch": 2734} {"train_loss": -24.718381881713867, "global_step": 226987, "epoch": 2734} {"train_loss": -24.67319107055664, "global_step": 226988, "epoch": 2734} {"train_loss": -24.794891357421875, "global_step": 226989, "epoch": 2734} {"train_loss": -25.014150619506836, "global_step": 226990, "epoch": 2734} {"train_loss": -24.669340133666992, "global_step": 226991, "epoch": 2734} {"train_loss": -24.618738174438477, "global_step": 226992, "epoch": 2734} {"train_loss": -24.800491333007812, "global_step": 226993, "epoch": 2734} {"train_loss": -24.784238815307617, "global_step": 226994, "epoch": 2734} {"train_loss": -24.898527145385742, "global_step": 226995, "epoch": 2734} {"train_loss": -24.750171661376953, "global_step": 226996, "epoch": 2734} {"train_loss": -24.25935935974121, "global_step": 226997, "epoch": 2734} {"train_loss": -24.846906661987305, "global_step": 226998, "epoch": 2734} {"train_loss": -24.826614379882812, "global_step": 226999, "epoch": 2734} {"train_loss": -25.165481567382812, "global_step": 227000, "epoch": 2734} {"train_loss": -24.75323486328125, "global_step": 227001, "epoch": 2734} {"train_loss": -24.439483642578125, "global_step": 227002, "epoch": 2734} {"train_loss": -24.737150192260742, "global_step": 227003, "epoch": 2734} {"train_loss": -24.444693002356104, "global_step": 227004, "epoch": 2734, "val_loss": 6651200.5} {"train_loss": -24.34394645690918, "global_step": 227005, "epoch": 2735} {"train_loss": -24.43088722229004, "global_step": 227006, "epoch": 2735} {"train_loss": -24.233652114868164, "global_step": 227007, "epoch": 2735} {"train_loss": -24.59110450744629, "global_step": 227008, "epoch": 2735} {"train_loss": -24.68069076538086, "global_step": 227009, "epoch": 2735} {"train_loss": -24.536588668823242, "global_step": 227010, "epoch": 2735} {"train_loss": -24.500885009765625, "global_step": 227011, "epoch": 2735} {"train_loss": -24.693767547607422, "global_step": 227012, "epoch": 2735} {"train_loss": -24.824594497680664, "global_step": 227013, "epoch": 2735} {"train_loss": -24.38298988342285, "global_step": 227014, "epoch": 2735} {"train_loss": -24.732770919799805, "global_step": 227015, "epoch": 2735} {"train_loss": -24.46982765197754, "global_step": 227016, "epoch": 2735} {"train_loss": -24.77802085876465, "global_step": 227017, "epoch": 2735} {"train_loss": -24.731367111206055, "global_step": 227018, "epoch": 2735} {"train_loss": -24.812997817993164, "global_step": 227019, "epoch": 2735} {"train_loss": -25.005521774291992, "global_step": 227020, "epoch": 2735} {"train_loss": -24.688302993774414, "global_step": 227021, "epoch": 2735} {"train_loss": -24.835119247436523, "global_step": 227022, "epoch": 2735} {"train_loss": -24.25077247619629, "global_step": 227023, "epoch": 2735} {"train_loss": -24.41132926940918, "global_step": 227024, "epoch": 2735} {"train_loss": -24.424589157104492, "global_step": 227025, "epoch": 2735} {"train_loss": -24.551618576049805, "global_step": 227026, "epoch": 2735} {"train_loss": -24.681432723999023, "global_step": 227027, "epoch": 2735} {"train_loss": -24.77424430847168, "global_step": 227028, "epoch": 2735} {"train_loss": -24.807025909423828, "global_step": 227029, "epoch": 2735} {"train_loss": -24.5050106048584, "global_step": 227030, "epoch": 2735} {"train_loss": -24.713720321655273, "global_step": 227031, "epoch": 2735} {"train_loss": -24.646581649780273, "global_step": 227032, "epoch": 2735} {"train_loss": -24.91560173034668, "global_step": 227033, "epoch": 2735} {"train_loss": -24.668758392333984, "global_step": 227034, "epoch": 2735} {"train_loss": -24.762298583984375, "global_step": 227035, "epoch": 2735} {"train_loss": -24.757150650024414, "global_step": 227036, "epoch": 2735} {"train_loss": -24.965356826782227, "global_step": 227037, "epoch": 2735} {"train_loss": -24.82093620300293, "global_step": 227038, "epoch": 2735} {"train_loss": -24.633258819580078, "global_step": 227039, "epoch": 2735} {"train_loss": -24.714189529418945, "global_step": 227040, "epoch": 2735} {"train_loss": -24.67741584777832, "global_step": 227041, "epoch": 2735} {"train_loss": -25.000593185424805, "global_step": 227042, "epoch": 2735} {"train_loss": -24.82131004333496, "global_step": 227043, "epoch": 2735} {"train_loss": -24.8553524017334, "global_step": 227044, "epoch": 2735} {"train_loss": -24.387521743774414, "global_step": 227045, "epoch": 2735} {"train_loss": -24.744197845458984, "global_step": 227046, "epoch": 2735} {"train_loss": -24.282917022705078, "global_step": 227047, "epoch": 2735} {"train_loss": -24.230100631713867, "global_step": 227048, "epoch": 2735} {"train_loss": -24.697927474975586, "global_step": 227049, "epoch": 2735} {"train_loss": -24.75929069519043, "global_step": 227050, "epoch": 2735} {"train_loss": -24.453977584838867, "global_step": 227051, "epoch": 2735} {"train_loss": -24.369647979736328, "global_step": 227052, "epoch": 2735} {"train_loss": -23.854877471923828, "global_step": 227053, "epoch": 2735} {"train_loss": -24.366071701049805, "global_step": 227054, "epoch": 2735} {"train_loss": -25.13981056213379, "global_step": 227055, "epoch": 2735} {"train_loss": -24.57977294921875, "global_step": 227056, "epoch": 2735} {"train_loss": -24.697275161743164, "global_step": 227057, "epoch": 2735} {"train_loss": -24.408672332763672, "global_step": 227058, "epoch": 2735} {"train_loss": -24.087299346923828, "global_step": 227059, "epoch": 2735} {"train_loss": -24.806535720825195, "global_step": 227060, "epoch": 2735} {"train_loss": -24.30003547668457, "global_step": 227061, "epoch": 2735} {"train_loss": -24.84309196472168, "global_step": 227062, "epoch": 2735} {"train_loss": -24.762067794799805, "global_step": 227063, "epoch": 2735} {"train_loss": -24.813833236694336, "global_step": 227064, "epoch": 2735} {"train_loss": -25.111242294311523, "global_step": 227065, "epoch": 2735} {"train_loss": -24.556364059448242, "global_step": 227066, "epoch": 2735} {"train_loss": -24.634769439697266, "global_step": 227067, "epoch": 2735} {"train_loss": -24.718347549438477, "global_step": 227068, "epoch": 2735} {"train_loss": -24.821273803710938, "global_step": 227069, "epoch": 2735} {"train_loss": -24.678455352783203, "global_step": 227070, "epoch": 2735} {"train_loss": -24.765811920166016, "global_step": 227071, "epoch": 2735} {"train_loss": -24.710874557495117, "global_step": 227072, "epoch": 2735} {"train_loss": -24.632261276245117, "global_step": 227073, "epoch": 2735} {"train_loss": -25.170019149780273, "global_step": 227074, "epoch": 2735} {"train_loss": -24.46474266052246, "global_step": 227075, "epoch": 2735} {"train_loss": -24.510839462280273, "global_step": 227076, "epoch": 2735} {"train_loss": -24.742992401123047, "global_step": 227077, "epoch": 2735} {"train_loss": -24.940898895263672, "global_step": 227078, "epoch": 2735} {"train_loss": -24.420270919799805, "global_step": 227079, "epoch": 2735} {"train_loss": -24.705760955810547, "global_step": 227080, "epoch": 2735} {"train_loss": -24.58183479309082, "global_step": 227081, "epoch": 2735} {"train_loss": -24.89874267578125, "global_step": 227082, "epoch": 2735} {"train_loss": -24.48750114440918, "global_step": 227083, "epoch": 2735} {"train_loss": -24.828073501586914, "global_step": 227084, "epoch": 2735} {"train_loss": -24.674856185913086, "global_step": 227085, "epoch": 2735} {"train_loss": -24.924985885620117, "global_step": 227086, "epoch": 2735} {"train_loss": -24.65677603756089, "global_step": 227087, "epoch": 2735, "val_loss": 6792449.0} {"train_loss": -23.973093032836914, "global_step": 227088, "epoch": 2736} {"train_loss": -23.4389705657959, "global_step": 227089, "epoch": 2736} {"train_loss": -24.347532272338867, "global_step": 227090, "epoch": 2736} {"train_loss": -23.691425323486328, "global_step": 227091, "epoch": 2736} {"train_loss": -24.404325485229492, "global_step": 227092, "epoch": 2736} {"train_loss": -24.632312774658203, "global_step": 227093, "epoch": 2736} {"train_loss": -24.126983642578125, "global_step": 227094, "epoch": 2736} {"train_loss": -24.781543731689453, "global_step": 227095, "epoch": 2736} {"train_loss": -24.279232025146484, "global_step": 227096, "epoch": 2736} {"train_loss": -24.01009178161621, "global_step": 227097, "epoch": 2736} {"train_loss": -24.46259117126465, "global_step": 227098, "epoch": 2736} {"train_loss": -24.426000595092773, "global_step": 227099, "epoch": 2736} {"train_loss": -24.430208206176758, "global_step": 227100, "epoch": 2736} {"train_loss": -24.15003776550293, "global_step": 227101, "epoch": 2736} {"train_loss": -24.568479537963867, "global_step": 227102, "epoch": 2736} {"train_loss": -24.601587295532227, "global_step": 227103, "epoch": 2736} {"train_loss": -24.648542404174805, "global_step": 227104, "epoch": 2736} {"train_loss": -24.213621139526367, "global_step": 227105, "epoch": 2736} {"train_loss": -24.568103790283203, "global_step": 227106, "epoch": 2736} {"train_loss": -24.56093406677246, "global_step": 227107, "epoch": 2736} {"train_loss": -24.513792037963867, "global_step": 227108, "epoch": 2736} {"train_loss": -24.664213180541992, "global_step": 227109, "epoch": 2736} {"train_loss": -24.560699462890625, "global_step": 227110, "epoch": 2736} {"train_loss": -24.5264949798584, "global_step": 227111, "epoch": 2736} {"train_loss": -24.834928512573242, "global_step": 227112, "epoch": 2736} {"train_loss": -24.91144371032715, "global_step": 227113, "epoch": 2736} {"train_loss": -25.00860023498535, "global_step": 227114, "epoch": 2736} {"train_loss": -24.627077102661133, "global_step": 227115, "epoch": 2736} {"train_loss": -24.438236236572266, "global_step": 227116, "epoch": 2736} {"train_loss": -24.979135513305664, "global_step": 227117, "epoch": 2736} {"train_loss": -24.733230590820312, "global_step": 227118, "epoch": 2736} {"train_loss": -24.715864181518555, "global_step": 227119, "epoch": 2736} {"train_loss": -24.421524047851562, "global_step": 227120, "epoch": 2736} {"train_loss": -24.425703048706055, "global_step": 227121, "epoch": 2736} {"train_loss": -24.439313888549805, "global_step": 227122, "epoch": 2736} {"train_loss": -24.437162399291992, "global_step": 227123, "epoch": 2736} {"train_loss": -24.538747787475586, "global_step": 227124, "epoch": 2736} {"train_loss": -23.655981063842773, "global_step": 227125, "epoch": 2736} {"train_loss": -24.519760131835938, "global_step": 227126, "epoch": 2736} {"train_loss": -24.823257446289062, "global_step": 227127, "epoch": 2736} {"train_loss": -24.555755615234375, "global_step": 227128, "epoch": 2736} {"train_loss": -24.581266403198242, "global_step": 227129, "epoch": 2736} {"train_loss": -24.535253524780273, "global_step": 227130, "epoch": 2736} {"train_loss": -24.686424255371094, "global_step": 227131, "epoch": 2736} {"train_loss": -24.768278121948242, "global_step": 227132, "epoch": 2736} {"train_loss": -24.85028076171875, "global_step": 227133, "epoch": 2736} {"train_loss": -24.950668334960938, "global_step": 227134, "epoch": 2736} {"train_loss": -24.757823944091797, "global_step": 227135, "epoch": 2736} {"train_loss": -24.5576171875, "global_step": 227136, "epoch": 2736} {"train_loss": -24.763477325439453, "global_step": 227137, "epoch": 2736} {"train_loss": -24.745107650756836, "global_step": 227138, "epoch": 2736} {"train_loss": -24.83388900756836, "global_step": 227139, "epoch": 2736} {"train_loss": -25.077926635742188, "global_step": 227140, "epoch": 2736} {"train_loss": -24.682723999023438, "global_step": 227141, "epoch": 2736} {"train_loss": -24.809171676635742, "global_step": 227142, "epoch": 2736} {"train_loss": -24.491836547851562, "global_step": 227143, "epoch": 2736} {"train_loss": -24.27129554748535, "global_step": 227144, "epoch": 2736} {"train_loss": -24.69722557067871, "global_step": 227145, "epoch": 2736} {"train_loss": -24.455013275146484, "global_step": 227146, "epoch": 2736} {"train_loss": -24.45241355895996, "global_step": 227147, "epoch": 2736} {"train_loss": -24.532209396362305, "global_step": 227148, "epoch": 2736} {"train_loss": -25.031126022338867, "global_step": 227149, "epoch": 2736} {"train_loss": -24.70497703552246, "global_step": 227150, "epoch": 2736} {"train_loss": -24.845182418823242, "global_step": 227151, "epoch": 2736} {"train_loss": -24.750139236450195, "global_step": 227152, "epoch": 2736} {"train_loss": -24.98219871520996, "global_step": 227153, "epoch": 2736} {"train_loss": -24.653650283813477, "global_step": 227154, "epoch": 2736} {"train_loss": -24.65203285217285, "global_step": 227155, "epoch": 2736} {"train_loss": -24.825361251831055, "global_step": 227156, "epoch": 2736} {"train_loss": -24.765024185180664, "global_step": 227157, "epoch": 2736} {"train_loss": -24.964645385742188, "global_step": 227158, "epoch": 2736} {"train_loss": -24.16045570373535, "global_step": 227159, "epoch": 2736} {"train_loss": -24.66348648071289, "global_step": 227160, "epoch": 2736} {"train_loss": -24.784238815307617, "global_step": 227161, "epoch": 2736} {"train_loss": -24.52870750427246, "global_step": 227162, "epoch": 2736} {"train_loss": -25.3721923828125, "global_step": 227163, "epoch": 2736} {"train_loss": -24.762256622314453, "global_step": 227164, "epoch": 2736} {"train_loss": -24.480188369750977, "global_step": 227165, "epoch": 2736} {"train_loss": -24.77564811706543, "global_step": 227166, "epoch": 2736} {"train_loss": -24.470197677612305, "global_step": 227167, "epoch": 2736} {"train_loss": -24.56828498840332, "global_step": 227168, "epoch": 2736} {"train_loss": -25.091672897338867, "global_step": 227169, "epoch": 2736} {"train_loss": -24.582209989248987, "global_step": 227170, "epoch": 2736, "val_loss": 6788371.5} {"train_loss": -24.301380157470703, "global_step": 227171, "epoch": 2737} {"train_loss": -24.203380584716797, "global_step": 227172, "epoch": 2737} {"train_loss": -24.39935302734375, "global_step": 227173, "epoch": 2737} {"train_loss": -24.319345474243164, "global_step": 227174, "epoch": 2737} {"train_loss": -24.04511833190918, "global_step": 227175, "epoch": 2737} {"train_loss": -24.525304794311523, "global_step": 227176, "epoch": 2737} {"train_loss": -24.088909149169922, "global_step": 227177, "epoch": 2737} {"train_loss": -24.520404815673828, "global_step": 227178, "epoch": 2737} {"train_loss": -24.269834518432617, "global_step": 227179, "epoch": 2737} {"train_loss": -24.425708770751953, "global_step": 227180, "epoch": 2737} {"train_loss": -24.602928161621094, "global_step": 227181, "epoch": 2737} {"train_loss": -24.367374420166016, "global_step": 227182, "epoch": 2737} {"train_loss": -24.486143112182617, "global_step": 227183, "epoch": 2737} {"train_loss": -24.550365447998047, "global_step": 227184, "epoch": 2737} {"train_loss": -24.23053550720215, "global_step": 227185, "epoch": 2737} {"train_loss": -24.314241409301758, "global_step": 227186, "epoch": 2737} {"train_loss": -24.511646270751953, "global_step": 227187, "epoch": 2737} {"train_loss": -24.759260177612305, "global_step": 227188, "epoch": 2737} {"train_loss": -24.359210968017578, "global_step": 227189, "epoch": 2737} {"train_loss": -24.773611068725586, "global_step": 227190, "epoch": 2737} {"train_loss": -24.719762802124023, "global_step": 227191, "epoch": 2737} {"train_loss": -24.05229949951172, "global_step": 227192, "epoch": 2737} {"train_loss": -24.715364456176758, "global_step": 227193, "epoch": 2737} {"train_loss": -24.513504028320312, "global_step": 227194, "epoch": 2737} {"train_loss": -24.659748077392578, "global_step": 227195, "epoch": 2737} {"train_loss": -24.788537979125977, "global_step": 227196, "epoch": 2737} {"train_loss": -24.5345516204834, "global_step": 227197, "epoch": 2737} {"train_loss": -24.74570655822754, "global_step": 227198, "epoch": 2737} {"train_loss": -24.68759536743164, "global_step": 227199, "epoch": 2737} {"train_loss": -24.879175186157227, "global_step": 227200, "epoch": 2737} {"train_loss": -24.612401962280273, "global_step": 227201, "epoch": 2737} {"train_loss": -24.718828201293945, "global_step": 227202, "epoch": 2737} {"train_loss": -24.680007934570312, "global_step": 227203, "epoch": 2737} {"train_loss": -24.808380126953125, "global_step": 227204, "epoch": 2737} {"train_loss": -24.64065933227539, "global_step": 227205, "epoch": 2737} {"train_loss": -25.005205154418945, "global_step": 227206, "epoch": 2737} {"train_loss": -24.7509708404541, "global_step": 227207, "epoch": 2737} {"train_loss": -24.666000366210938, "global_step": 227208, "epoch": 2737} {"train_loss": -24.89102554321289, "global_step": 227209, "epoch": 2737} {"train_loss": -25.171842575073242, "global_step": 227210, "epoch": 2737} {"train_loss": -24.751482009887695, "global_step": 227211, "epoch": 2737} {"train_loss": -25.09754180908203, "global_step": 227212, "epoch": 2737} {"train_loss": -24.888635635375977, "global_step": 227213, "epoch": 2737} {"train_loss": -24.98999786376953, "global_step": 227214, "epoch": 2737} {"train_loss": -24.931745529174805, "global_step": 227215, "epoch": 2737} {"train_loss": -24.38286781311035, "global_step": 227216, "epoch": 2737} {"train_loss": -24.530515670776367, "global_step": 227217, "epoch": 2737} {"train_loss": -24.711111068725586, "global_step": 227218, "epoch": 2737} {"train_loss": -25.1353702545166, "global_step": 227219, "epoch": 2737} {"train_loss": -24.771202087402344, "global_step": 227220, "epoch": 2737} {"train_loss": -24.979562759399414, "global_step": 227221, "epoch": 2737} {"train_loss": -25.014326095581055, "global_step": 227222, "epoch": 2737} {"train_loss": -24.634536743164062, "global_step": 227223, "epoch": 2737} {"train_loss": -24.43613052368164, "global_step": 227224, "epoch": 2737} {"train_loss": -24.820194244384766, "global_step": 227225, "epoch": 2737} {"train_loss": -24.638145446777344, "global_step": 227226, "epoch": 2737} {"train_loss": -25.129886627197266, "global_step": 227227, "epoch": 2737} {"train_loss": -25.134811401367188, "global_step": 227228, "epoch": 2737} {"train_loss": -24.96958351135254, "global_step": 227229, "epoch": 2737} {"train_loss": -24.855222702026367, "global_step": 227230, "epoch": 2737} {"train_loss": -24.513425827026367, "global_step": 227231, "epoch": 2737} {"train_loss": -24.814617156982422, "global_step": 227232, "epoch": 2737} {"train_loss": -24.241079330444336, "global_step": 227233, "epoch": 2737} {"train_loss": -24.705596923828125, "global_step": 227234, "epoch": 2737} {"train_loss": -24.895055770874023, "global_step": 227235, "epoch": 2737} {"train_loss": -24.699140548706055, "global_step": 227236, "epoch": 2737} {"train_loss": -24.411500930786133, "global_step": 227237, "epoch": 2737} {"train_loss": -24.624650955200195, "global_step": 227238, "epoch": 2737} {"train_loss": -24.76457977294922, "global_step": 227239, "epoch": 2737} {"train_loss": -24.791837692260742, "global_step": 227240, "epoch": 2737} {"train_loss": -24.512094497680664, "global_step": 227241, "epoch": 2737} {"train_loss": -25.09340476989746, "global_step": 227242, "epoch": 2737} {"train_loss": -24.706331253051758, "global_step": 227243, "epoch": 2737} {"train_loss": -24.771869659423828, "global_step": 227244, "epoch": 2737} {"train_loss": -24.895315170288086, "global_step": 227245, "epoch": 2737} {"train_loss": -25.03382682800293, "global_step": 227246, "epoch": 2737} {"train_loss": -24.905210494995117, "global_step": 227247, "epoch": 2737} {"train_loss": -24.842321395874023, "global_step": 227248, "epoch": 2737} {"train_loss": -24.60599708557129, "global_step": 227249, "epoch": 2737} {"train_loss": -24.89982032775879, "global_step": 227250, "epoch": 2737} {"train_loss": -24.78826904296875, "global_step": 227251, "epoch": 2737} {"train_loss": -24.581031799316406, "global_step": 227252, "epoch": 2737} {"train_loss": -24.649309296205818, "global_step": 227253, "epoch": 2737, "val_loss": 6725812.0} {"train_loss": -24.577978134155273, "global_step": 227254, "epoch": 2738} {"train_loss": -24.082895278930664, "global_step": 227255, "epoch": 2738} {"train_loss": -24.54529571533203, "global_step": 227256, "epoch": 2738} {"train_loss": -24.352039337158203, "global_step": 227257, "epoch": 2738} {"train_loss": -24.809606552124023, "global_step": 227258, "epoch": 2738} {"train_loss": -24.359161376953125, "global_step": 227259, "epoch": 2738} {"train_loss": -24.381681442260742, "global_step": 227260, "epoch": 2738} {"train_loss": -24.49347496032715, "global_step": 227261, "epoch": 2738} {"train_loss": -24.67440414428711, "global_step": 227262, "epoch": 2738} {"train_loss": -24.52327537536621, "global_step": 227263, "epoch": 2738} {"train_loss": -24.08681297302246, "global_step": 227264, "epoch": 2738} {"train_loss": -24.4345703125, "global_step": 227265, "epoch": 2738} {"train_loss": -24.43438720703125, "global_step": 227266, "epoch": 2738} {"train_loss": -24.016300201416016, "global_step": 227267, "epoch": 2738} {"train_loss": -24.72762107849121, "global_step": 227268, "epoch": 2738} {"train_loss": -24.7292537689209, "global_step": 227269, "epoch": 2738} {"train_loss": -24.348310470581055, "global_step": 227270, "epoch": 2738} {"train_loss": -24.67653465270996, "global_step": 227271, "epoch": 2738} {"train_loss": -24.36787986755371, "global_step": 227272, "epoch": 2738} {"train_loss": -24.450918197631836, "global_step": 227273, "epoch": 2738} {"train_loss": -24.578800201416016, "global_step": 227274, "epoch": 2738} {"train_loss": -25.007328033447266, "global_step": 227275, "epoch": 2738} {"train_loss": -24.730375289916992, "global_step": 227276, "epoch": 2738} {"train_loss": -24.84049415588379, "global_step": 227277, "epoch": 2738} {"train_loss": -24.701810836791992, "global_step": 227278, "epoch": 2738} {"train_loss": -24.824771881103516, "global_step": 227279, "epoch": 2738} {"train_loss": -24.85652732849121, "global_step": 227280, "epoch": 2738} {"train_loss": -24.522960662841797, "global_step": 227281, "epoch": 2738} {"train_loss": -24.734821319580078, "global_step": 227282, "epoch": 2738} {"train_loss": -24.902524948120117, "global_step": 227283, "epoch": 2738} {"train_loss": -24.536497116088867, "global_step": 227284, "epoch": 2738} {"train_loss": -24.345252990722656, "global_step": 227285, "epoch": 2738} {"train_loss": -24.2611083984375, "global_step": 227286, "epoch": 2738} {"train_loss": -24.33838653564453, "global_step": 227287, "epoch": 2738} {"train_loss": -25.06325340270996, "global_step": 227288, "epoch": 2738} {"train_loss": -25.035221099853516, "global_step": 227289, "epoch": 2738} {"train_loss": -24.35102653503418, "global_step": 227290, "epoch": 2738} {"train_loss": -24.535154342651367, "global_step": 227291, "epoch": 2738} {"train_loss": -24.808073043823242, "global_step": 227292, "epoch": 2738} {"train_loss": -25.034944534301758, "global_step": 227293, "epoch": 2738} {"train_loss": -24.705209732055664, "global_step": 227294, "epoch": 2738} {"train_loss": -24.67462730407715, "global_step": 227295, "epoch": 2738} {"train_loss": -24.74393653869629, "global_step": 227296, "epoch": 2738} {"train_loss": -24.901351928710938, "global_step": 227297, "epoch": 2738} {"train_loss": -24.711889266967773, "global_step": 227298, "epoch": 2738} {"train_loss": -24.793275833129883, "global_step": 227299, "epoch": 2738} {"train_loss": -24.78899574279785, "global_step": 227300, "epoch": 2738} {"train_loss": -24.72218132019043, "global_step": 227301, "epoch": 2738} {"train_loss": -24.8507137298584, "global_step": 227302, "epoch": 2738} {"train_loss": -24.5252742767334, "global_step": 227303, "epoch": 2738} {"train_loss": -24.73763656616211, "global_step": 227304, "epoch": 2738} {"train_loss": -24.54878807067871, "global_step": 227305, "epoch": 2738} {"train_loss": -24.745229721069336, "global_step": 227306, "epoch": 2738} {"train_loss": -24.65152931213379, "global_step": 227307, "epoch": 2738} {"train_loss": -24.46254539489746, "global_step": 227308, "epoch": 2738} {"train_loss": -24.514623641967773, "global_step": 227309, "epoch": 2738} {"train_loss": -24.708818435668945, "global_step": 227310, "epoch": 2738} {"train_loss": -25.099395751953125, "global_step": 227311, "epoch": 2738} {"train_loss": -25.001230239868164, "global_step": 227312, "epoch": 2738} {"train_loss": -24.64522361755371, "global_step": 227313, "epoch": 2738} {"train_loss": -24.130435943603516, "global_step": 227314, "epoch": 2738} {"train_loss": -24.67711067199707, "global_step": 227315, "epoch": 2738} {"train_loss": -24.562824249267578, "global_step": 227316, "epoch": 2738} {"train_loss": -24.517892837524414, "global_step": 227317, "epoch": 2738} {"train_loss": -24.97576904296875, "global_step": 227318, "epoch": 2738} {"train_loss": -24.762008666992188, "global_step": 227319, "epoch": 2738} {"train_loss": -24.41847801208496, "global_step": 227320, "epoch": 2738} {"train_loss": -24.378768920898438, "global_step": 227321, "epoch": 2738} {"train_loss": -24.72226905822754, "global_step": 227322, "epoch": 2738} {"train_loss": -24.22231101989746, "global_step": 227323, "epoch": 2738} {"train_loss": -24.31290626525879, "global_step": 227324, "epoch": 2738} {"train_loss": -24.473148345947266, "global_step": 227325, "epoch": 2738} {"train_loss": -24.7890682220459, "global_step": 227326, "epoch": 2738} {"train_loss": -24.671937942504883, "global_step": 227327, "epoch": 2738} {"train_loss": -24.80643081665039, "global_step": 227328, "epoch": 2738} {"train_loss": -24.783721923828125, "global_step": 227329, "epoch": 2738} {"train_loss": -24.736623764038086, "global_step": 227330, "epoch": 2738} {"train_loss": -24.59132194519043, "global_step": 227331, "epoch": 2738} {"train_loss": -24.96536636352539, "global_step": 227332, "epoch": 2738} {"train_loss": -24.34382438659668, "global_step": 227333, "epoch": 2738} {"train_loss": -24.68857192993164, "global_step": 227334, "epoch": 2738} {"train_loss": -24.887914657592773, "global_step": 227335, "epoch": 2738} {"train_loss": -24.62348850663886, "global_step": 227336, "epoch": 2738, "val_loss": 6702062.0} {"train_loss": -24.175214767456055, "global_step": 227337, "epoch": 2739} {"train_loss": -23.815261840820312, "global_step": 227338, "epoch": 2739} {"train_loss": -24.66170883178711, "global_step": 227339, "epoch": 2739} {"train_loss": -23.964696884155273, "global_step": 227340, "epoch": 2739} {"train_loss": -24.434423446655273, "global_step": 227341, "epoch": 2739} {"train_loss": -24.224151611328125, "global_step": 227342, "epoch": 2739} {"train_loss": -24.13790512084961, "global_step": 227343, "epoch": 2739} {"train_loss": -24.08002281188965, "global_step": 227344, "epoch": 2739} {"train_loss": -23.545820236206055, "global_step": 227345, "epoch": 2739} {"train_loss": -24.176496505737305, "global_step": 227346, "epoch": 2739} {"train_loss": -24.416122436523438, "global_step": 227347, "epoch": 2739} {"train_loss": -24.0476016998291, "global_step": 227348, "epoch": 2739} {"train_loss": -24.628143310546875, "global_step": 227349, "epoch": 2739} {"train_loss": -24.364370346069336, "global_step": 227350, "epoch": 2739} {"train_loss": -24.47840690612793, "global_step": 227351, "epoch": 2739} {"train_loss": -24.77787208557129, "global_step": 227352, "epoch": 2739} {"train_loss": -24.493003845214844, "global_step": 227353, "epoch": 2739} {"train_loss": -24.962020874023438, "global_step": 227354, "epoch": 2739} {"train_loss": -24.463315963745117, "global_step": 227355, "epoch": 2739} {"train_loss": -24.434412002563477, "global_step": 227356, "epoch": 2739} {"train_loss": -24.60646629333496, "global_step": 227357, "epoch": 2739} {"train_loss": -24.60420799255371, "global_step": 227358, "epoch": 2739} {"train_loss": -24.671070098876953, "global_step": 227359, "epoch": 2739} {"train_loss": -24.72492027282715, "global_step": 227360, "epoch": 2739} {"train_loss": -24.378034591674805, "global_step": 227361, "epoch": 2739} {"train_loss": -24.603609085083008, "global_step": 227362, "epoch": 2739} {"train_loss": -24.427200317382812, "global_step": 227363, "epoch": 2739} {"train_loss": -24.743154525756836, "global_step": 227364, "epoch": 2739} {"train_loss": -24.60369873046875, "global_step": 227365, "epoch": 2739} {"train_loss": -24.470598220825195, "global_step": 227366, "epoch": 2739} {"train_loss": -24.646352767944336, "global_step": 227367, "epoch": 2739} {"train_loss": -24.404865264892578, "global_step": 227368, "epoch": 2739} {"train_loss": -24.642057418823242, "global_step": 227369, "epoch": 2739} {"train_loss": -24.618040084838867, "global_step": 227370, "epoch": 2739} {"train_loss": -25.051551818847656, "global_step": 227371, "epoch": 2739} {"train_loss": -24.694860458374023, "global_step": 227372, "epoch": 2739} {"train_loss": -24.781524658203125, "global_step": 227373, "epoch": 2739} {"train_loss": -24.853404998779297, "global_step": 227374, "epoch": 2739} {"train_loss": -24.812911987304688, "global_step": 227375, "epoch": 2739} {"train_loss": -24.97045135498047, "global_step": 227376, "epoch": 2739} {"train_loss": -25.129789352416992, "global_step": 227377, "epoch": 2739} {"train_loss": -24.645986557006836, "global_step": 227378, "epoch": 2739} {"train_loss": -24.639392852783203, "global_step": 227379, "epoch": 2739} {"train_loss": -24.641386032104492, "global_step": 227380, "epoch": 2739} {"train_loss": -25.256513595581055, "global_step": 227381, "epoch": 2739} {"train_loss": -24.85037612915039, "global_step": 227382, "epoch": 2739} {"train_loss": -24.85533905029297, "global_step": 227383, "epoch": 2739} {"train_loss": -24.908798217773438, "global_step": 227384, "epoch": 2739} {"train_loss": -24.957778930664062, "global_step": 227385, "epoch": 2739} {"train_loss": -24.44011878967285, "global_step": 227386, "epoch": 2739} {"train_loss": -24.163902282714844, "global_step": 227387, "epoch": 2739} {"train_loss": -24.65531349182129, "global_step": 227388, "epoch": 2739} {"train_loss": -24.845233917236328, "global_step": 227389, "epoch": 2739} {"train_loss": -24.720556259155273, "global_step": 227390, "epoch": 2739} {"train_loss": -24.759117126464844, "global_step": 227391, "epoch": 2739} {"train_loss": -24.58872413635254, "global_step": 227392, "epoch": 2739} {"train_loss": -24.890668869018555, "global_step": 227393, "epoch": 2739} {"train_loss": -24.571075439453125, "global_step": 227394, "epoch": 2739} {"train_loss": -24.031333923339844, "global_step": 227395, "epoch": 2739} {"train_loss": -24.61347770690918, "global_step": 227396, "epoch": 2739} {"train_loss": -24.86696434020996, "global_step": 227397, "epoch": 2739} {"train_loss": -24.791519165039062, "global_step": 227398, "epoch": 2739} {"train_loss": -24.715957641601562, "global_step": 227399, "epoch": 2739} {"train_loss": -24.864145278930664, "global_step": 227400, "epoch": 2739} {"train_loss": -24.164337158203125, "global_step": 227401, "epoch": 2739} {"train_loss": -23.973712921142578, "global_step": 227402, "epoch": 2739} {"train_loss": -24.082448959350586, "global_step": 227403, "epoch": 2739} {"train_loss": -23.986127853393555, "global_step": 227404, "epoch": 2739} {"train_loss": -24.411100387573242, "global_step": 227405, "epoch": 2739} {"train_loss": -24.35646629333496, "global_step": 227406, "epoch": 2739} {"train_loss": -24.257291793823242, "global_step": 227407, "epoch": 2739} {"train_loss": -24.524608612060547, "global_step": 227408, "epoch": 2739} {"train_loss": -24.400184631347656, "global_step": 227409, "epoch": 2739} {"train_loss": -24.870834350585938, "global_step": 227410, "epoch": 2739} {"train_loss": -24.519283294677734, "global_step": 227411, "epoch": 2739} {"train_loss": -24.502172470092773, "global_step": 227412, "epoch": 2739} {"train_loss": -24.7729549407959, "global_step": 227413, "epoch": 2739} {"train_loss": -24.660938262939453, "global_step": 227414, "epoch": 2739} {"train_loss": -24.462860107421875, "global_step": 227415, "epoch": 2739} {"train_loss": -24.865110397338867, "global_step": 227416, "epoch": 2739} {"train_loss": -24.217227935791016, "global_step": 227417, "epoch": 2739} {"train_loss": -24.707901000976562, "global_step": 227418, "epoch": 2739} {"train_loss": -24.5651368290545, "global_step": 227419, "epoch": 2739, "val_loss": 6751731.0} {"train_loss": -24.386249542236328, "global_step": 227420, "epoch": 2740} {"train_loss": -24.38996696472168, "global_step": 227421, "epoch": 2740} {"train_loss": -24.36351776123047, "global_step": 227422, "epoch": 2740} {"train_loss": -24.573881149291992, "global_step": 227423, "epoch": 2740} {"train_loss": -24.25450897216797, "global_step": 227424, "epoch": 2740} {"train_loss": -24.244735717773438, "global_step": 227425, "epoch": 2740} {"train_loss": -24.241804122924805, "global_step": 227426, "epoch": 2740} {"train_loss": -24.795522689819336, "global_step": 227427, "epoch": 2740} {"train_loss": -24.78421401977539, "global_step": 227428, "epoch": 2740} {"train_loss": -24.554983139038086, "global_step": 227429, "epoch": 2740} {"train_loss": -24.546463012695312, "global_step": 227430, "epoch": 2740} {"train_loss": -24.428895950317383, "global_step": 227431, "epoch": 2740} {"train_loss": -24.610599517822266, "global_step": 227432, "epoch": 2740} {"train_loss": -24.718732833862305, "global_step": 227433, "epoch": 2740} {"train_loss": -24.094608306884766, "global_step": 227434, "epoch": 2740} {"train_loss": -24.782800674438477, "global_step": 227435, "epoch": 2740} {"train_loss": -24.354076385498047, "global_step": 227436, "epoch": 2740} {"train_loss": -24.485593795776367, "global_step": 227437, "epoch": 2740} {"train_loss": -24.4812068939209, "global_step": 227438, "epoch": 2740} {"train_loss": -24.013851165771484, "global_step": 227439, "epoch": 2740} {"train_loss": -24.6301212310791, "global_step": 227440, "epoch": 2740} {"train_loss": -24.757143020629883, "global_step": 227441, "epoch": 2740} {"train_loss": -24.404314041137695, "global_step": 227442, "epoch": 2740} {"train_loss": -24.853132247924805, "global_step": 227443, "epoch": 2740} {"train_loss": -24.52720069885254, "global_step": 227444, "epoch": 2740} {"train_loss": -24.64912986755371, "global_step": 227445, "epoch": 2740} {"train_loss": -24.909587860107422, "global_step": 227446, "epoch": 2740} {"train_loss": -24.787946701049805, "global_step": 227447, "epoch": 2740} {"train_loss": -24.602188110351562, "global_step": 227448, "epoch": 2740} {"train_loss": -24.457294464111328, "global_step": 227449, "epoch": 2740} {"train_loss": -24.59430503845215, "global_step": 227450, "epoch": 2740} {"train_loss": -24.339069366455078, "global_step": 227451, "epoch": 2740} {"train_loss": -24.640277862548828, "global_step": 227452, "epoch": 2740} {"train_loss": -24.788721084594727, "global_step": 227453, "epoch": 2740} {"train_loss": -24.62758445739746, "global_step": 227454, "epoch": 2740} {"train_loss": -24.71147346496582, "global_step": 227455, "epoch": 2740} {"train_loss": -24.951818466186523, "global_step": 227456, "epoch": 2740} {"train_loss": -24.564359664916992, "global_step": 227457, "epoch": 2740} {"train_loss": -24.592382431030273, "global_step": 227458, "epoch": 2740} {"train_loss": -24.624330520629883, "global_step": 227459, "epoch": 2740} {"train_loss": -24.640644073486328, "global_step": 227460, "epoch": 2740} {"train_loss": -24.886709213256836, "global_step": 227461, "epoch": 2740} {"train_loss": -24.771947860717773, "global_step": 227462, "epoch": 2740} {"train_loss": -24.684106826782227, "global_step": 227463, "epoch": 2740} {"train_loss": -24.44365882873535, "global_step": 227464, "epoch": 2740} {"train_loss": -24.699506759643555, "global_step": 227465, "epoch": 2740} {"train_loss": -24.587024688720703, "global_step": 227466, "epoch": 2740} {"train_loss": -24.965606689453125, "global_step": 227467, "epoch": 2740} {"train_loss": -24.697599411010742, "global_step": 227468, "epoch": 2740} {"train_loss": -24.803470611572266, "global_step": 227469, "epoch": 2740} {"train_loss": -24.55142593383789, "global_step": 227470, "epoch": 2740} {"train_loss": -24.530622482299805, "global_step": 227471, "epoch": 2740} {"train_loss": -24.80878257751465, "global_step": 227472, "epoch": 2740} {"train_loss": -24.446561813354492, "global_step": 227473, "epoch": 2740} {"train_loss": -24.811492919921875, "global_step": 227474, "epoch": 2740} {"train_loss": -24.452756881713867, "global_step": 227475, "epoch": 2740} {"train_loss": -25.137659072875977, "global_step": 227476, "epoch": 2740} {"train_loss": -24.572484970092773, "global_step": 227477, "epoch": 2740} {"train_loss": -24.744428634643555, "global_step": 227478, "epoch": 2740} {"train_loss": -24.852758407592773, "global_step": 227479, "epoch": 2740} {"train_loss": -24.790761947631836, "global_step": 227480, "epoch": 2740} {"train_loss": -24.761457443237305, "global_step": 227481, "epoch": 2740} {"train_loss": -24.70306396484375, "global_step": 227482, "epoch": 2740} {"train_loss": -25.061206817626953, "global_step": 227483, "epoch": 2740} {"train_loss": -24.703369140625, "global_step": 227484, "epoch": 2740} {"train_loss": -24.550336837768555, "global_step": 227485, "epoch": 2740} {"train_loss": -24.580272674560547, "global_step": 227486, "epoch": 2740} {"train_loss": -24.925077438354492, "global_step": 227487, "epoch": 2740} {"train_loss": -24.44771385192871, "global_step": 227488, "epoch": 2740} {"train_loss": -24.749887466430664, "global_step": 227489, "epoch": 2740} {"train_loss": -24.524383544921875, "global_step": 227490, "epoch": 2740} {"train_loss": -24.938547134399414, "global_step": 227491, "epoch": 2740} {"train_loss": -24.66005516052246, "global_step": 227492, "epoch": 2740} {"train_loss": -24.509000778198242, "global_step": 227493, "epoch": 2740} {"train_loss": -25.02851676940918, "global_step": 227494, "epoch": 2740} {"train_loss": -24.696779251098633, "global_step": 227495, "epoch": 2740} {"train_loss": -24.389867782592773, "global_step": 227496, "epoch": 2740} {"train_loss": -24.475812911987305, "global_step": 227497, "epoch": 2740} {"train_loss": -24.54301643371582, "global_step": 227498, "epoch": 2740} {"train_loss": -25.039663314819336, "global_step": 227499, "epoch": 2740} {"train_loss": -24.796918869018555, "global_step": 227500, "epoch": 2740} {"train_loss": -24.960668563842773, "global_step": 227501, "epoch": 2740} {"train_loss": -24.63298581594444, "global_step": 227502, "epoch": 2740, "val_loss": 6785908.0} {"train_loss": -24.30487823486328, "global_step": 227503, "epoch": 2741} {"train_loss": -23.996227264404297, "global_step": 227504, "epoch": 2741} {"train_loss": -23.815906524658203, "global_step": 227505, "epoch": 2741} {"train_loss": -23.96742820739746, "global_step": 227506, "epoch": 2741} {"train_loss": -23.911331176757812, "global_step": 227507, "epoch": 2741} {"train_loss": -23.819549560546875, "global_step": 227508, "epoch": 2741} {"train_loss": -23.900712966918945, "global_step": 227509, "epoch": 2741} {"train_loss": -24.082548141479492, "global_step": 227510, "epoch": 2741} {"train_loss": -24.38107681274414, "global_step": 227511, "epoch": 2741} {"train_loss": -23.969083786010742, "global_step": 227512, "epoch": 2741} {"train_loss": -24.198501586914062, "global_step": 227513, "epoch": 2741} {"train_loss": -24.285184860229492, "global_step": 227514, "epoch": 2741} {"train_loss": -24.113754272460938, "global_step": 227515, "epoch": 2741} {"train_loss": -24.281295776367188, "global_step": 227516, "epoch": 2741} {"train_loss": -24.339859008789062, "global_step": 227517, "epoch": 2741} {"train_loss": -24.54098129272461, "global_step": 227518, "epoch": 2741} {"train_loss": -24.88730239868164, "global_step": 227519, "epoch": 2741} {"train_loss": -24.829715728759766, "global_step": 227520, "epoch": 2741} {"train_loss": -24.12801170349121, "global_step": 227521, "epoch": 2741} {"train_loss": -24.32858657836914, "global_step": 227522, "epoch": 2741} {"train_loss": -24.846511840820312, "global_step": 227523, "epoch": 2741} {"train_loss": -24.293556213378906, "global_step": 227524, "epoch": 2741} {"train_loss": -24.53821563720703, "global_step": 227525, "epoch": 2741} {"train_loss": -24.6842098236084, "global_step": 227526, "epoch": 2741} {"train_loss": -24.574039459228516, "global_step": 227527, "epoch": 2741} {"train_loss": -24.46723747253418, "global_step": 227528, "epoch": 2741} {"train_loss": -24.72432518005371, "global_step": 227529, "epoch": 2741} {"train_loss": -24.64859962463379, "global_step": 227530, "epoch": 2741} {"train_loss": -24.766695022583008, "global_step": 227531, "epoch": 2741} {"train_loss": -24.768539428710938, "global_step": 227532, "epoch": 2741} {"train_loss": -24.7608585357666, "global_step": 227533, "epoch": 2741} {"train_loss": -24.3840389251709, "global_step": 227534, "epoch": 2741} {"train_loss": -25.009872436523438, "global_step": 227535, "epoch": 2741} {"train_loss": -24.864078521728516, "global_step": 227536, "epoch": 2741} {"train_loss": -24.407712936401367, "global_step": 227537, "epoch": 2741} {"train_loss": -24.797178268432617, "global_step": 227538, "epoch": 2741} {"train_loss": -24.390708923339844, "global_step": 227539, "epoch": 2741} {"train_loss": -24.829301834106445, "global_step": 227540, "epoch": 2741} {"train_loss": -24.406089782714844, "global_step": 227541, "epoch": 2741} {"train_loss": -24.821081161499023, "global_step": 227542, "epoch": 2741} {"train_loss": -24.962421417236328, "global_step": 227543, "epoch": 2741} {"train_loss": -24.856306076049805, "global_step": 227544, "epoch": 2741} {"train_loss": -24.736623764038086, "global_step": 227545, "epoch": 2741} {"train_loss": -24.77765464782715, "global_step": 227546, "epoch": 2741} {"train_loss": -24.593305587768555, "global_step": 227547, "epoch": 2741} {"train_loss": -24.327756881713867, "global_step": 227548, "epoch": 2741} {"train_loss": -24.812437057495117, "global_step": 227549, "epoch": 2741} {"train_loss": -24.2269344329834, "global_step": 227550, "epoch": 2741} {"train_loss": -24.668710708618164, "global_step": 227551, "epoch": 2741} {"train_loss": -23.97737693786621, "global_step": 227552, "epoch": 2741} {"train_loss": -24.367483139038086, "global_step": 227553, "epoch": 2741} {"train_loss": -24.700618743896484, "global_step": 227554, "epoch": 2741} {"train_loss": -24.4528751373291, "global_step": 227555, "epoch": 2741} {"train_loss": -24.48844337463379, "global_step": 227556, "epoch": 2741} {"train_loss": -24.368314743041992, "global_step": 227557, "epoch": 2741} {"train_loss": -24.67782211303711, "global_step": 227558, "epoch": 2741} {"train_loss": -24.307819366455078, "global_step": 227559, "epoch": 2741} {"train_loss": -25.024499893188477, "global_step": 227560, "epoch": 2741} {"train_loss": -24.791614532470703, "global_step": 227561, "epoch": 2741} {"train_loss": -24.999897003173828, "global_step": 227562, "epoch": 2741} {"train_loss": -24.843677520751953, "global_step": 227563, "epoch": 2741} {"train_loss": -24.916873931884766, "global_step": 227564, "epoch": 2741} {"train_loss": -24.79482078552246, "global_step": 227565, "epoch": 2741} {"train_loss": -24.48244285583496, "global_step": 227566, "epoch": 2741} {"train_loss": -24.812009811401367, "global_step": 227567, "epoch": 2741} {"train_loss": -24.76985740661621, "global_step": 227568, "epoch": 2741} {"train_loss": -24.741323471069336, "global_step": 227569, "epoch": 2741} {"train_loss": -24.737279891967773, "global_step": 227570, "epoch": 2741} {"train_loss": -24.710742950439453, "global_step": 227571, "epoch": 2741} {"train_loss": -24.46187973022461, "global_step": 227572, "epoch": 2741} {"train_loss": -24.755483627319336, "global_step": 227573, "epoch": 2741} {"train_loss": -24.763702392578125, "global_step": 227574, "epoch": 2741} {"train_loss": -24.501115798950195, "global_step": 227575, "epoch": 2741} {"train_loss": -24.676990509033203, "global_step": 227576, "epoch": 2741} {"train_loss": -24.370304107666016, "global_step": 227577, "epoch": 2741} {"train_loss": -24.835546493530273, "global_step": 227578, "epoch": 2741} {"train_loss": -24.657363891601562, "global_step": 227579, "epoch": 2741} {"train_loss": -24.650680541992188, "global_step": 227580, "epoch": 2741} {"train_loss": -25.05342674255371, "global_step": 227581, "epoch": 2741} {"train_loss": -24.785390853881836, "global_step": 227582, "epoch": 2741} {"train_loss": -24.520681381225586, "global_step": 227583, "epoch": 2741} {"train_loss": -24.543703079223633, "global_step": 227584, "epoch": 2741} {"train_loss": -24.53961703288986, "global_step": 227585, "epoch": 2741, "val_loss": 6766121.0} {"train_loss": -24.67030906677246, "global_step": 227586, "epoch": 2742} {"train_loss": -24.227432250976562, "global_step": 227587, "epoch": 2742} {"train_loss": -24.323781967163086, "global_step": 227588, "epoch": 2742} {"train_loss": -24.408475875854492, "global_step": 227589, "epoch": 2742} {"train_loss": -24.522497177124023, "global_step": 227590, "epoch": 2742} {"train_loss": -24.339691162109375, "global_step": 227591, "epoch": 2742} {"train_loss": -24.043222427368164, "global_step": 227592, "epoch": 2742} {"train_loss": -24.378231048583984, "global_step": 227593, "epoch": 2742} {"train_loss": -24.491657257080078, "global_step": 227594, "epoch": 2742} {"train_loss": -23.83102798461914, "global_step": 227595, "epoch": 2742} {"train_loss": -24.51248550415039, "global_step": 227596, "epoch": 2742} {"train_loss": -24.530820846557617, "global_step": 227597, "epoch": 2742} {"train_loss": -24.449350357055664, "global_step": 227598, "epoch": 2742} {"train_loss": -24.9517822265625, "global_step": 227599, "epoch": 2742} {"train_loss": -24.237363815307617, "global_step": 227600, "epoch": 2742} {"train_loss": -24.731252670288086, "global_step": 227601, "epoch": 2742} {"train_loss": -24.397937774658203, "global_step": 227602, "epoch": 2742} {"train_loss": -24.59293556213379, "global_step": 227603, "epoch": 2742} {"train_loss": -24.303363800048828, "global_step": 227604, "epoch": 2742} {"train_loss": -24.764841079711914, "global_step": 227605, "epoch": 2742} {"train_loss": -24.284671783447266, "global_step": 227606, "epoch": 2742} {"train_loss": -24.59968376159668, "global_step": 227607, "epoch": 2742} {"train_loss": -24.379056930541992, "global_step": 227608, "epoch": 2742} {"train_loss": -24.176536560058594, "global_step": 227609, "epoch": 2742} {"train_loss": -24.720306396484375, "global_step": 227610, "epoch": 2742} {"train_loss": -24.768003463745117, "global_step": 227611, "epoch": 2742} {"train_loss": -24.81915283203125, "global_step": 227612, "epoch": 2742} {"train_loss": -25.02570152282715, "global_step": 227613, "epoch": 2742} {"train_loss": -25.012418746948242, "global_step": 227614, "epoch": 2742} {"train_loss": -24.876310348510742, "global_step": 227615, "epoch": 2742} {"train_loss": -24.579307556152344, "global_step": 227616, "epoch": 2742} {"train_loss": -24.805906295776367, "global_step": 227617, "epoch": 2742} {"train_loss": -24.460575103759766, "global_step": 227618, "epoch": 2742} {"train_loss": -24.66049575805664, "global_step": 227619, "epoch": 2742} {"train_loss": -24.227529525756836, "global_step": 227620, "epoch": 2742} {"train_loss": -24.59015464782715, "global_step": 227621, "epoch": 2742} {"train_loss": -24.845617294311523, "global_step": 227622, "epoch": 2742} {"train_loss": -24.73333740234375, "global_step": 227623, "epoch": 2742} {"train_loss": -24.65699577331543, "global_step": 227624, "epoch": 2742} {"train_loss": -24.896032333374023, "global_step": 227625, "epoch": 2742} {"train_loss": -24.678508758544922, "global_step": 227626, "epoch": 2742} {"train_loss": -24.39000129699707, "global_step": 227627, "epoch": 2742} {"train_loss": -25.033246994018555, "global_step": 227628, "epoch": 2742} {"train_loss": -24.77910041809082, "global_step": 227629, "epoch": 2742} {"train_loss": -24.829208374023438, "global_step": 227630, "epoch": 2742} {"train_loss": -24.746122360229492, "global_step": 227631, "epoch": 2742} {"train_loss": -24.702472686767578, "global_step": 227632, "epoch": 2742} {"train_loss": -24.712034225463867, "global_step": 227633, "epoch": 2742} {"train_loss": -24.779186248779297, "global_step": 227634, "epoch": 2742} {"train_loss": -24.31638526916504, "global_step": 227635, "epoch": 2742} {"train_loss": -24.667455673217773, "global_step": 227636, "epoch": 2742} {"train_loss": -24.313222885131836, "global_step": 227637, "epoch": 2742} {"train_loss": -24.587646484375, "global_step": 227638, "epoch": 2742} {"train_loss": -24.561880111694336, "global_step": 227639, "epoch": 2742} {"train_loss": -24.828580856323242, "global_step": 227640, "epoch": 2742} {"train_loss": -24.44442367553711, "global_step": 227641, "epoch": 2742} {"train_loss": -24.634418487548828, "global_step": 227642, "epoch": 2742} {"train_loss": -24.392135620117188, "global_step": 227643, "epoch": 2742} {"train_loss": -24.401294708251953, "global_step": 227644, "epoch": 2742} {"train_loss": -24.77137565612793, "global_step": 227645, "epoch": 2742} {"train_loss": -24.487167358398438, "global_step": 227646, "epoch": 2742} {"train_loss": -24.666227340698242, "global_step": 227647, "epoch": 2742} {"train_loss": -24.671140670776367, "global_step": 227648, "epoch": 2742} {"train_loss": -24.684049606323242, "global_step": 227649, "epoch": 2742} {"train_loss": -24.914928436279297, "global_step": 227650, "epoch": 2742} {"train_loss": -24.85970115661621, "global_step": 227651, "epoch": 2742} {"train_loss": -24.50687026977539, "global_step": 227652, "epoch": 2742} {"train_loss": -25.116714477539062, "global_step": 227653, "epoch": 2742} {"train_loss": -24.78750991821289, "global_step": 227654, "epoch": 2742} {"train_loss": -24.88797378540039, "global_step": 227655, "epoch": 2742} {"train_loss": -24.465627670288086, "global_step": 227656, "epoch": 2742} {"train_loss": -25.119783401489258, "global_step": 227657, "epoch": 2742} {"train_loss": -24.393823623657227, "global_step": 227658, "epoch": 2742} {"train_loss": -24.824119567871094, "global_step": 227659, "epoch": 2742} {"train_loss": -24.720233917236328, "global_step": 227660, "epoch": 2742} {"train_loss": -24.643369674682617, "global_step": 227661, "epoch": 2742} {"train_loss": -24.674131393432617, "global_step": 227662, "epoch": 2742} {"train_loss": -24.60161781311035, "global_step": 227663, "epoch": 2742} {"train_loss": -24.312349319458008, "global_step": 227664, "epoch": 2742} {"train_loss": -24.165328979492188, "global_step": 227665, "epoch": 2742} {"train_loss": -24.995441436767578, "global_step": 227666, "epoch": 2742} {"train_loss": -24.538604736328125, "global_step": 227667, "epoch": 2742} {"train_loss": -24.6037540435791, "global_step": 227668, "epoch": 2742, "val_loss": 6747661.0} {"train_loss": -22.962594985961914, "global_step": 227669, "epoch": 2743} {"train_loss": -23.142791748046875, "global_step": 227670, "epoch": 2743} {"train_loss": -24.300262451171875, "global_step": 227671, "epoch": 2743} {"train_loss": -23.24755859375, "global_step": 227672, "epoch": 2743} {"train_loss": -23.63397979736328, "global_step": 227673, "epoch": 2743} {"train_loss": -24.047727584838867, "global_step": 227674, "epoch": 2743} {"train_loss": -23.97526741027832, "global_step": 227675, "epoch": 2743} {"train_loss": -24.1783504486084, "global_step": 227676, "epoch": 2743} {"train_loss": -23.345455169677734, "global_step": 227677, "epoch": 2743} {"train_loss": -24.20936393737793, "global_step": 227678, "epoch": 2743} {"train_loss": -23.809316635131836, "global_step": 227679, "epoch": 2743} {"train_loss": -24.096174240112305, "global_step": 227680, "epoch": 2743} {"train_loss": -23.718799591064453, "global_step": 227681, "epoch": 2743} {"train_loss": -24.585147857666016, "global_step": 227682, "epoch": 2743} {"train_loss": -24.16483497619629, "global_step": 227683, "epoch": 2743} {"train_loss": -24.094623565673828, "global_step": 227684, "epoch": 2743} {"train_loss": -24.330907821655273, "global_step": 227685, "epoch": 2743} {"train_loss": -24.4621639251709, "global_step": 227686, "epoch": 2743} {"train_loss": -24.158283233642578, "global_step": 227687, "epoch": 2743} {"train_loss": -24.384933471679688, "global_step": 227688, "epoch": 2743} {"train_loss": -24.41468048095703, "global_step": 227689, "epoch": 2743} {"train_loss": -23.962743759155273, "global_step": 227690, "epoch": 2743} {"train_loss": -24.527379989624023, "global_step": 227691, "epoch": 2743} {"train_loss": -24.49081802368164, "global_step": 227692, "epoch": 2743} {"train_loss": -24.167179107666016, "global_step": 227693, "epoch": 2743} {"train_loss": -24.67561912536621, "global_step": 227694, "epoch": 2743} {"train_loss": -24.450170516967773, "global_step": 227695, "epoch": 2743} {"train_loss": -24.518768310546875, "global_step": 227696, "epoch": 2743} {"train_loss": -24.689050674438477, "global_step": 227697, "epoch": 2743} {"train_loss": -24.596303939819336, "global_step": 227698, "epoch": 2743} {"train_loss": -24.38389015197754, "global_step": 227699, "epoch": 2743} {"train_loss": -24.652069091796875, "global_step": 227700, "epoch": 2743} {"train_loss": -24.458770751953125, "global_step": 227701, "epoch": 2743} {"train_loss": -24.86418342590332, "global_step": 227702, "epoch": 2743} {"train_loss": -24.7685546875, "global_step": 227703, "epoch": 2743} {"train_loss": -24.346494674682617, "global_step": 227704, "epoch": 2743} {"train_loss": -24.81708526611328, "global_step": 227705, "epoch": 2743} {"train_loss": -24.906269073486328, "global_step": 227706, "epoch": 2743} {"train_loss": -24.76673698425293, "global_step": 227707, "epoch": 2743} {"train_loss": -24.725954055786133, "global_step": 227708, "epoch": 2743} {"train_loss": -24.668832778930664, "global_step": 227709, "epoch": 2743} {"train_loss": -24.705686569213867, "global_step": 227710, "epoch": 2743} {"train_loss": -24.719009399414062, "global_step": 227711, "epoch": 2743} {"train_loss": -24.597736358642578, "global_step": 227712, "epoch": 2743} {"train_loss": -24.794628143310547, "global_step": 227713, "epoch": 2743} {"train_loss": -24.922025680541992, "global_step": 227714, "epoch": 2743} {"train_loss": -25.04605484008789, "global_step": 227715, "epoch": 2743} {"train_loss": -24.66459846496582, "global_step": 227716, "epoch": 2743} {"train_loss": -25.190811157226562, "global_step": 227717, "epoch": 2743} {"train_loss": -24.984460830688477, "global_step": 227718, "epoch": 2743} {"train_loss": -24.670812606811523, "global_step": 227719, "epoch": 2743} {"train_loss": -24.467479705810547, "global_step": 227720, "epoch": 2743} {"train_loss": -24.79420280456543, "global_step": 227721, "epoch": 2743} {"train_loss": -24.802963256835938, "global_step": 227722, "epoch": 2743} {"train_loss": -24.797775268554688, "global_step": 227723, "epoch": 2743} {"train_loss": -24.88778305053711, "global_step": 227724, "epoch": 2743} {"train_loss": -24.723682403564453, "global_step": 227725, "epoch": 2743} {"train_loss": -24.516931533813477, "global_step": 227726, "epoch": 2743} {"train_loss": -24.39196014404297, "global_step": 227727, "epoch": 2743} {"train_loss": -23.748825073242188, "global_step": 227728, "epoch": 2743} {"train_loss": -24.321691513061523, "global_step": 227729, "epoch": 2743} {"train_loss": -24.900196075439453, "global_step": 227730, "epoch": 2743} {"train_loss": -24.958585739135742, "global_step": 227731, "epoch": 2743} {"train_loss": -24.17671775817871, "global_step": 227732, "epoch": 2743} {"train_loss": -25.212909698486328, "global_step": 227733, "epoch": 2743} {"train_loss": -24.86573600769043, "global_step": 227734, "epoch": 2743} {"train_loss": -24.65998649597168, "global_step": 227735, "epoch": 2743} {"train_loss": -24.77716636657715, "global_step": 227736, "epoch": 2743} {"train_loss": -24.810077667236328, "global_step": 227737, "epoch": 2743} {"train_loss": -24.708240509033203, "global_step": 227738, "epoch": 2743} {"train_loss": -24.937223434448242, "global_step": 227739, "epoch": 2743} {"train_loss": -24.517858505249023, "global_step": 227740, "epoch": 2743} {"train_loss": -24.13331413269043, "global_step": 227741, "epoch": 2743} {"train_loss": -24.24911117553711, "global_step": 227742, "epoch": 2743} {"train_loss": -24.66223907470703, "global_step": 227743, "epoch": 2743} {"train_loss": -24.501693725585938, "global_step": 227744, "epoch": 2743} {"train_loss": -24.23632049560547, "global_step": 227745, "epoch": 2743} {"train_loss": -24.990503311157227, "global_step": 227746, "epoch": 2743} {"train_loss": -24.640762329101562, "global_step": 227747, "epoch": 2743} {"train_loss": -24.859785079956055, "global_step": 227748, "epoch": 2743} {"train_loss": -24.82991600036621, "global_step": 227749, "epoch": 2743} {"train_loss": -24.475116729736328, "global_step": 227750, "epoch": 2743} {"train_loss": -24.488350121371717, "global_step": 227751, "epoch": 2743, "val_loss": 6887552.0} {"train_loss": -24.67557144165039, "global_step": 227752, "epoch": 2744} {"train_loss": -24.934432983398438, "global_step": 227753, "epoch": 2744} {"train_loss": -24.646207809448242, "global_step": 227754, "epoch": 2744} {"train_loss": -24.48702049255371, "global_step": 227755, "epoch": 2744} {"train_loss": -24.801156997680664, "global_step": 227756, "epoch": 2744} {"train_loss": -24.619726181030273, "global_step": 227757, "epoch": 2744} {"train_loss": -24.37153434753418, "global_step": 227758, "epoch": 2744} {"train_loss": -24.79743766784668, "global_step": 227759, "epoch": 2744} {"train_loss": -24.215002059936523, "global_step": 227760, "epoch": 2744} {"train_loss": -24.644594192504883, "global_step": 227761, "epoch": 2744} {"train_loss": -24.552845001220703, "global_step": 227762, "epoch": 2744} {"train_loss": -24.668476104736328, "global_step": 227763, "epoch": 2744} {"train_loss": -24.233972549438477, "global_step": 227764, "epoch": 2744} {"train_loss": -24.35631561279297, "global_step": 227765, "epoch": 2744} {"train_loss": -24.6025390625, "global_step": 227766, "epoch": 2744} {"train_loss": -24.8607120513916, "global_step": 227767, "epoch": 2744} {"train_loss": -24.34980583190918, "global_step": 227768, "epoch": 2744} {"train_loss": -24.279855728149414, "global_step": 227769, "epoch": 2744} {"train_loss": -24.550874710083008, "global_step": 227770, "epoch": 2744} {"train_loss": -24.723093032836914, "global_step": 227771, "epoch": 2744} {"train_loss": -24.833829879760742, "global_step": 227772, "epoch": 2744} {"train_loss": -24.92109489440918, "global_step": 227773, "epoch": 2744} {"train_loss": -24.711694717407227, "global_step": 227774, "epoch": 2744} {"train_loss": -24.8027286529541, "global_step": 227775, "epoch": 2744} {"train_loss": -24.669830322265625, "global_step": 227776, "epoch": 2744} {"train_loss": -24.611188888549805, "global_step": 227777, "epoch": 2744} {"train_loss": -24.634761810302734, "global_step": 227778, "epoch": 2744} {"train_loss": -24.349672317504883, "global_step": 227779, "epoch": 2744} {"train_loss": -24.56235122680664, "global_step": 227780, "epoch": 2744} {"train_loss": -24.738027572631836, "global_step": 227781, "epoch": 2744} {"train_loss": -24.63182830810547, "global_step": 227782, "epoch": 2744} {"train_loss": -24.740802764892578, "global_step": 227783, "epoch": 2744} {"train_loss": -24.800350189208984, "global_step": 227784, "epoch": 2744} {"train_loss": -24.73674964904785, "global_step": 227785, "epoch": 2744} {"train_loss": -24.684749603271484, "global_step": 227786, "epoch": 2744} {"train_loss": -24.973125457763672, "global_step": 227787, "epoch": 2744} {"train_loss": -24.750837326049805, "global_step": 227788, "epoch": 2744} {"train_loss": -24.853429794311523, "global_step": 227789, "epoch": 2744} {"train_loss": -24.8713436126709, "global_step": 227790, "epoch": 2744} {"train_loss": -24.73147964477539, "global_step": 227791, "epoch": 2744} {"train_loss": -24.665191650390625, "global_step": 227792, "epoch": 2744} {"train_loss": -25.0671443939209, "global_step": 227793, "epoch": 2744} {"train_loss": -24.818424224853516, "global_step": 227794, "epoch": 2744} {"train_loss": -24.87396812438965, "global_step": 227795, "epoch": 2744} {"train_loss": -24.904003143310547, "global_step": 227796, "epoch": 2744} {"train_loss": -24.357284545898438, "global_step": 227797, "epoch": 2744} {"train_loss": -24.473220825195312, "global_step": 227798, "epoch": 2744} {"train_loss": -24.3900089263916, "global_step": 227799, "epoch": 2744} {"train_loss": -24.396297454833984, "global_step": 227800, "epoch": 2744} {"train_loss": -25.210676193237305, "global_step": 227801, "epoch": 2744} {"train_loss": -24.665319442749023, "global_step": 227802, "epoch": 2744} {"train_loss": -24.92115592956543, "global_step": 227803, "epoch": 2744} {"train_loss": -24.6141300201416, "global_step": 227804, "epoch": 2744} {"train_loss": -24.944833755493164, "global_step": 227805, "epoch": 2744} {"train_loss": -24.25433921813965, "global_step": 227806, "epoch": 2744} {"train_loss": -24.663537979125977, "global_step": 227807, "epoch": 2744} {"train_loss": -24.727008819580078, "global_step": 227808, "epoch": 2744} {"train_loss": -24.659738540649414, "global_step": 227809, "epoch": 2744} {"train_loss": -24.50861167907715, "global_step": 227810, "epoch": 2744} {"train_loss": -24.161497116088867, "global_step": 227811, "epoch": 2744} {"train_loss": -24.946142196655273, "global_step": 227812, "epoch": 2744} {"train_loss": -24.63494873046875, "global_step": 227813, "epoch": 2744} {"train_loss": -25.354307174682617, "global_step": 227814, "epoch": 2744} {"train_loss": -24.7533016204834, "global_step": 227815, "epoch": 2744} {"train_loss": -25.128284454345703, "global_step": 227816, "epoch": 2744} {"train_loss": -24.52153205871582, "global_step": 227817, "epoch": 2744} {"train_loss": -24.835208892822266, "global_step": 227818, "epoch": 2744} {"train_loss": -24.401716232299805, "global_step": 227819, "epoch": 2744} {"train_loss": -24.96088218688965, "global_step": 227820, "epoch": 2744} {"train_loss": -25.108837127685547, "global_step": 227821, "epoch": 2744} {"train_loss": -24.772157669067383, "global_step": 227822, "epoch": 2744} {"train_loss": -24.956050872802734, "global_step": 227823, "epoch": 2744} {"train_loss": -24.63496971130371, "global_step": 227824, "epoch": 2744} {"train_loss": -24.664161682128906, "global_step": 227825, "epoch": 2744} {"train_loss": -24.8739013671875, "global_step": 227826, "epoch": 2744} {"train_loss": -24.96105194091797, "global_step": 227827, "epoch": 2744} {"train_loss": -24.756593704223633, "global_step": 227828, "epoch": 2744} {"train_loss": -24.93231964111328, "global_step": 227829, "epoch": 2744} {"train_loss": -24.684467315673828, "global_step": 227830, "epoch": 2744} {"train_loss": -24.69594955444336, "global_step": 227831, "epoch": 2744} {"train_loss": -24.74493408203125, "global_step": 227832, "epoch": 2744} {"train_loss": -24.505863189697266, "global_step": 227833, "epoch": 2744} {"train_loss": -24.717260774359644, "global_step": 227834, "epoch": 2744, "val_loss": 6741622.0} {"train_loss": -23.72264862060547, "global_step": 227835, "epoch": 2745} {"train_loss": -23.962751388549805, "global_step": 227836, "epoch": 2745} {"train_loss": -22.873193740844727, "global_step": 227837, "epoch": 2745} {"train_loss": -23.980905532836914, "global_step": 227838, "epoch": 2745} {"train_loss": -24.010501861572266, "global_step": 227839, "epoch": 2745} {"train_loss": -24.19964027404785, "global_step": 227840, "epoch": 2745} {"train_loss": -24.0559024810791, "global_step": 227841, "epoch": 2745} {"train_loss": -23.879871368408203, "global_step": 227842, "epoch": 2745} {"train_loss": -24.3790225982666, "global_step": 227843, "epoch": 2745} {"train_loss": -24.21753692626953, "global_step": 227844, "epoch": 2745} {"train_loss": -24.177579879760742, "global_step": 227845, "epoch": 2745} {"train_loss": -24.109699249267578, "global_step": 227846, "epoch": 2745} {"train_loss": -23.93543815612793, "global_step": 227847, "epoch": 2745} {"train_loss": -24.88079833984375, "global_step": 227848, "epoch": 2745} {"train_loss": -24.334203720092773, "global_step": 227849, "epoch": 2745} {"train_loss": -24.611968994140625, "global_step": 227850, "epoch": 2745} {"train_loss": -24.587472915649414, "global_step": 227851, "epoch": 2745} {"train_loss": -24.43564796447754, "global_step": 227852, "epoch": 2745} {"train_loss": -24.463611602783203, "global_step": 227853, "epoch": 2745} {"train_loss": -24.389965057373047, "global_step": 227854, "epoch": 2745} {"train_loss": -24.638498306274414, "global_step": 227855, "epoch": 2745} {"train_loss": -24.66617202758789, "global_step": 227856, "epoch": 2745} {"train_loss": -24.550642013549805, "global_step": 227857, "epoch": 2745} {"train_loss": -24.493215560913086, "global_step": 227858, "epoch": 2745} {"train_loss": -24.334196090698242, "global_step": 227859, "epoch": 2745} {"train_loss": -24.4091854095459, "global_step": 227860, "epoch": 2745} {"train_loss": -24.423078536987305, "global_step": 227861, "epoch": 2745} {"train_loss": -25.073152542114258, "global_step": 227862, "epoch": 2745} {"train_loss": -24.18310546875, "global_step": 227863, "epoch": 2745} {"train_loss": -24.262027740478516, "global_step": 227864, "epoch": 2745} {"train_loss": -24.753765106201172, "global_step": 227865, "epoch": 2745} {"train_loss": -24.766721725463867, "global_step": 227866, "epoch": 2745} {"train_loss": -24.587629318237305, "global_step": 227867, "epoch": 2745} {"train_loss": -24.775264739990234, "global_step": 227868, "epoch": 2745} {"train_loss": -24.249361038208008, "global_step": 227869, "epoch": 2745} {"train_loss": -24.7166805267334, "global_step": 227870, "epoch": 2745} {"train_loss": -24.75276756286621, "global_step": 227871, "epoch": 2745} {"train_loss": -24.477048873901367, "global_step": 227872, "epoch": 2745} {"train_loss": -25.036909103393555, "global_step": 227873, "epoch": 2745} {"train_loss": -24.896804809570312, "global_step": 227874, "epoch": 2745} {"train_loss": -24.87360954284668, "global_step": 227875, "epoch": 2745} {"train_loss": -24.788084030151367, "global_step": 227876, "epoch": 2745} {"train_loss": -25.151697158813477, "global_step": 227877, "epoch": 2745} {"train_loss": -24.897104263305664, "global_step": 227878, "epoch": 2745} {"train_loss": -24.89300537109375, "global_step": 227879, "epoch": 2745} {"train_loss": -25.061634063720703, "global_step": 227880, "epoch": 2745} {"train_loss": -25.228219985961914, "global_step": 227881, "epoch": 2745} {"train_loss": -24.708417892456055, "global_step": 227882, "epoch": 2745} {"train_loss": -24.986846923828125, "global_step": 227883, "epoch": 2745} {"train_loss": -24.883665084838867, "global_step": 227884, "epoch": 2745} {"train_loss": -24.78053855895996, "global_step": 227885, "epoch": 2745} {"train_loss": -24.952835083007812, "global_step": 227886, "epoch": 2745} {"train_loss": -24.775957107543945, "global_step": 227887, "epoch": 2745} {"train_loss": -24.68727684020996, "global_step": 227888, "epoch": 2745} {"train_loss": -24.678129196166992, "global_step": 227889, "epoch": 2745} {"train_loss": -24.852783203125, "global_step": 227890, "epoch": 2745} {"train_loss": -24.95619010925293, "global_step": 227891, "epoch": 2745} {"train_loss": -24.811376571655273, "global_step": 227892, "epoch": 2745} {"train_loss": -24.46047019958496, "global_step": 227893, "epoch": 2745} {"train_loss": -24.76473045349121, "global_step": 227894, "epoch": 2745} {"train_loss": -24.748632431030273, "global_step": 227895, "epoch": 2745} {"train_loss": -24.735944747924805, "global_step": 227896, "epoch": 2745} {"train_loss": -24.897964477539062, "global_step": 227897, "epoch": 2745} {"train_loss": -24.696203231811523, "global_step": 227898, "epoch": 2745} {"train_loss": -24.939987182617188, "global_step": 227899, "epoch": 2745} {"train_loss": -24.181995391845703, "global_step": 227900, "epoch": 2745} {"train_loss": -24.484094619750977, "global_step": 227901, "epoch": 2745} {"train_loss": -24.60364532470703, "global_step": 227902, "epoch": 2745} {"train_loss": -24.66281509399414, "global_step": 227903, "epoch": 2745} {"train_loss": -24.601064682006836, "global_step": 227904, "epoch": 2745} {"train_loss": -24.417909622192383, "global_step": 227905, "epoch": 2745} {"train_loss": -24.485107421875, "global_step": 227906, "epoch": 2745} {"train_loss": -24.70906639099121, "global_step": 227907, "epoch": 2745} {"train_loss": -24.936492919921875, "global_step": 227908, "epoch": 2745} {"train_loss": -24.56660270690918, "global_step": 227909, "epoch": 2745} {"train_loss": -24.631759643554688, "global_step": 227910, "epoch": 2745} {"train_loss": -24.65180015563965, "global_step": 227911, "epoch": 2745} {"train_loss": -24.40474510192871, "global_step": 227912, "epoch": 2745} {"train_loss": -25.265478134155273, "global_step": 227913, "epoch": 2745} {"train_loss": -24.57441520690918, "global_step": 227914, "epoch": 2745} {"train_loss": -24.51130485534668, "global_step": 227915, "epoch": 2745} {"train_loss": -24.76795768737793, "global_step": 227916, "epoch": 2745} {"train_loss": -24.57021874117564, "global_step": 227917, "epoch": 2745, "val_loss": 6660391.0} {"train_loss": -24.739049911499023, "global_step": 227918, "epoch": 2746} {"train_loss": -24.676517486572266, "global_step": 227919, "epoch": 2746} {"train_loss": -24.424482345581055, "global_step": 227920, "epoch": 2746} {"train_loss": -24.61884117126465, "global_step": 227921, "epoch": 2746} {"train_loss": -24.36126136779785, "global_step": 227922, "epoch": 2746} {"train_loss": -24.4317626953125, "global_step": 227923, "epoch": 2746} {"train_loss": -24.687284469604492, "global_step": 227924, "epoch": 2746} {"train_loss": -24.809005737304688, "global_step": 227925, "epoch": 2746} {"train_loss": -24.687484741210938, "global_step": 227926, "epoch": 2746} {"train_loss": -24.644529342651367, "global_step": 227927, "epoch": 2746} {"train_loss": -24.731178283691406, "global_step": 227928, "epoch": 2746} {"train_loss": -24.666147232055664, "global_step": 227929, "epoch": 2746} {"train_loss": -24.861644744873047, "global_step": 227930, "epoch": 2746} {"train_loss": -24.926349639892578, "global_step": 227931, "epoch": 2746} {"train_loss": -24.587453842163086, "global_step": 227932, "epoch": 2746} {"train_loss": -24.825830459594727, "global_step": 227933, "epoch": 2746} {"train_loss": -24.64791488647461, "global_step": 227934, "epoch": 2746} {"train_loss": -24.348682403564453, "global_step": 227935, "epoch": 2746} {"train_loss": -25.005525588989258, "global_step": 227936, "epoch": 2746} {"train_loss": -24.40981101989746, "global_step": 227937, "epoch": 2746} {"train_loss": -25.115921020507812, "global_step": 227938, "epoch": 2746} {"train_loss": -24.13763427734375, "global_step": 227939, "epoch": 2746} {"train_loss": -24.41818618774414, "global_step": 227940, "epoch": 2746} {"train_loss": -24.362070083618164, "global_step": 227941, "epoch": 2746} {"train_loss": -24.525047302246094, "global_step": 227942, "epoch": 2746} {"train_loss": -24.496124267578125, "global_step": 227943, "epoch": 2746} {"train_loss": -24.1954402923584, "global_step": 227944, "epoch": 2746} {"train_loss": -24.326099395751953, "global_step": 227945, "epoch": 2746} {"train_loss": -24.17527198791504, "global_step": 227946, "epoch": 2746} {"train_loss": -24.562105178833008, "global_step": 227947, "epoch": 2746} {"train_loss": -24.458600997924805, "global_step": 227948, "epoch": 2746} {"train_loss": -24.348621368408203, "global_step": 227949, "epoch": 2746} {"train_loss": -24.788333892822266, "global_step": 227950, "epoch": 2746} {"train_loss": -24.385913848876953, "global_step": 227951, "epoch": 2746} {"train_loss": -24.35501480102539, "global_step": 227952, "epoch": 2746} {"train_loss": -24.545169830322266, "global_step": 227953, "epoch": 2746} {"train_loss": -24.369298934936523, "global_step": 227954, "epoch": 2746} {"train_loss": -24.40597915649414, "global_step": 227955, "epoch": 2746} {"train_loss": -24.961217880249023, "global_step": 227956, "epoch": 2746} {"train_loss": -24.291336059570312, "global_step": 227957, "epoch": 2746} {"train_loss": -24.748985290527344, "global_step": 227958, "epoch": 2746} {"train_loss": -24.740009307861328, "global_step": 227959, "epoch": 2746} {"train_loss": -24.323225021362305, "global_step": 227960, "epoch": 2746} {"train_loss": -24.60509490966797, "global_step": 227961, "epoch": 2746} {"train_loss": -24.445560455322266, "global_step": 227962, "epoch": 2746} {"train_loss": -24.484567642211914, "global_step": 227963, "epoch": 2746} {"train_loss": -24.953659057617188, "global_step": 227964, "epoch": 2746} {"train_loss": -24.6553955078125, "global_step": 227965, "epoch": 2746} {"train_loss": -24.890554428100586, "global_step": 227966, "epoch": 2746} {"train_loss": -24.56695556640625, "global_step": 227967, "epoch": 2746} {"train_loss": -24.84577178955078, "global_step": 227968, "epoch": 2746} {"train_loss": -24.50209617614746, "global_step": 227969, "epoch": 2746} {"train_loss": -24.766782760620117, "global_step": 227970, "epoch": 2746} {"train_loss": -24.6036319732666, "global_step": 227971, "epoch": 2746} {"train_loss": -24.644926071166992, "global_step": 227972, "epoch": 2746} {"train_loss": -25.070236206054688, "global_step": 227973, "epoch": 2746} {"train_loss": -24.786893844604492, "global_step": 227974, "epoch": 2746} {"train_loss": -24.820663452148438, "global_step": 227975, "epoch": 2746} {"train_loss": -24.99273681640625, "global_step": 227976, "epoch": 2746} {"train_loss": -24.865468978881836, "global_step": 227977, "epoch": 2746} {"train_loss": -24.598230361938477, "global_step": 227978, "epoch": 2746} {"train_loss": -24.95745849609375, "global_step": 227979, "epoch": 2746} {"train_loss": -25.071683883666992, "global_step": 227980, "epoch": 2746} {"train_loss": -24.28243064880371, "global_step": 227981, "epoch": 2746} {"train_loss": -24.962125778198242, "global_step": 227982, "epoch": 2746} {"train_loss": -24.863489151000977, "global_step": 227983, "epoch": 2746} {"train_loss": -24.497045516967773, "global_step": 227984, "epoch": 2746} {"train_loss": -25.040119171142578, "global_step": 227985, "epoch": 2746} {"train_loss": -24.806747436523438, "global_step": 227986, "epoch": 2746} {"train_loss": -24.555007934570312, "global_step": 227987, "epoch": 2746} {"train_loss": -24.961383819580078, "global_step": 227988, "epoch": 2746} {"train_loss": -24.478302001953125, "global_step": 227989, "epoch": 2746} {"train_loss": -24.904438018798828, "global_step": 227990, "epoch": 2746} {"train_loss": -24.571239471435547, "global_step": 227991, "epoch": 2746} {"train_loss": -24.74688720703125, "global_step": 227992, "epoch": 2746} {"train_loss": -24.7257137298584, "global_step": 227993, "epoch": 2746} {"train_loss": -24.707632064819336, "global_step": 227994, "epoch": 2746} {"train_loss": -24.90993309020996, "global_step": 227995, "epoch": 2746} {"train_loss": -24.770069122314453, "global_step": 227996, "epoch": 2746} {"train_loss": -24.8388671875, "global_step": 227997, "epoch": 2746} {"train_loss": -25.091066360473633, "global_step": 227998, "epoch": 2746} {"train_loss": -24.500301361083984, "global_step": 227999, "epoch": 2746} {"train_loss": -24.655869311596973, "global_step": 228000, "epoch": 2746, "val_loss": 6775861.0} {"train_loss": -23.767621994018555, "global_step": 228001, "epoch": 2747} {"train_loss": -23.488996505737305, "global_step": 228002, "epoch": 2747} {"train_loss": -24.565046310424805, "global_step": 228003, "epoch": 2747} {"train_loss": -23.967031478881836, "global_step": 228004, "epoch": 2747} {"train_loss": -23.934743881225586, "global_step": 228005, "epoch": 2747} {"train_loss": -24.084192276000977, "global_step": 228006, "epoch": 2747} {"train_loss": -24.190523147583008, "global_step": 228007, "epoch": 2747} {"train_loss": -24.21748924255371, "global_step": 228008, "epoch": 2747} {"train_loss": -24.494976043701172, "global_step": 228009, "epoch": 2747} {"train_loss": -23.8619384765625, "global_step": 228010, "epoch": 2747} {"train_loss": -24.272174835205078, "global_step": 228011, "epoch": 2747} {"train_loss": -24.377023696899414, "global_step": 228012, "epoch": 2747} {"train_loss": -23.849470138549805, "global_step": 228013, "epoch": 2747} {"train_loss": -24.41996192932129, "global_step": 228014, "epoch": 2747} {"train_loss": -24.268075942993164, "global_step": 228015, "epoch": 2747} {"train_loss": -24.34937858581543, "global_step": 228016, "epoch": 2747} {"train_loss": -24.196369171142578, "global_step": 228017, "epoch": 2747} {"train_loss": -24.20498275756836, "global_step": 228018, "epoch": 2747} {"train_loss": -24.242862701416016, "global_step": 228019, "epoch": 2747} {"train_loss": -24.343448638916016, "global_step": 228020, "epoch": 2747} {"train_loss": -24.68790054321289, "global_step": 228021, "epoch": 2747} {"train_loss": -24.497331619262695, "global_step": 228022, "epoch": 2747} {"train_loss": -24.561798095703125, "global_step": 228023, "epoch": 2747} {"train_loss": -24.728534698486328, "global_step": 228024, "epoch": 2747} {"train_loss": -24.40418815612793, "global_step": 228025, "epoch": 2747} {"train_loss": -24.296239852905273, "global_step": 228026, "epoch": 2747} {"train_loss": -24.492048263549805, "global_step": 228027, "epoch": 2747} {"train_loss": -24.598230361938477, "global_step": 228028, "epoch": 2747} {"train_loss": -24.729236602783203, "global_step": 228029, "epoch": 2747} {"train_loss": -24.766075134277344, "global_step": 228030, "epoch": 2747} {"train_loss": -24.816593170166016, "global_step": 228031, "epoch": 2747} {"train_loss": -24.843730926513672, "global_step": 228032, "epoch": 2747} {"train_loss": -24.639434814453125, "global_step": 228033, "epoch": 2747} {"train_loss": -24.6917781829834, "global_step": 228034, "epoch": 2747} {"train_loss": -24.792341232299805, "global_step": 228035, "epoch": 2747} {"train_loss": -24.785221099853516, "global_step": 228036, "epoch": 2747} {"train_loss": -24.633529663085938, "global_step": 228037, "epoch": 2747} {"train_loss": -24.856582641601562, "global_step": 228038, "epoch": 2747} {"train_loss": -24.40960121154785, "global_step": 228039, "epoch": 2747} {"train_loss": -24.861358642578125, "global_step": 228040, "epoch": 2747} {"train_loss": -24.812210083007812, "global_step": 228041, "epoch": 2747} {"train_loss": -24.998750686645508, "global_step": 228042, "epoch": 2747} {"train_loss": -24.447795867919922, "global_step": 228043, "epoch": 2747} {"train_loss": -25.08057975769043, "global_step": 228044, "epoch": 2747} {"train_loss": -24.784425735473633, "global_step": 228045, "epoch": 2747} {"train_loss": -24.919347763061523, "global_step": 228046, "epoch": 2747} {"train_loss": -24.64410972595215, "global_step": 228047, "epoch": 2747} {"train_loss": -24.795164108276367, "global_step": 228048, "epoch": 2747} {"train_loss": -24.36338996887207, "global_step": 228049, "epoch": 2747} {"train_loss": -24.321378707885742, "global_step": 228050, "epoch": 2747} {"train_loss": -24.977096557617188, "global_step": 228051, "epoch": 2747} {"train_loss": -24.758352279663086, "global_step": 228052, "epoch": 2747} {"train_loss": -24.37864112854004, "global_step": 228053, "epoch": 2747} {"train_loss": -24.876371383666992, "global_step": 228054, "epoch": 2747} {"train_loss": -24.89755630493164, "global_step": 228055, "epoch": 2747} {"train_loss": -24.42502212524414, "global_step": 228056, "epoch": 2747} {"train_loss": -24.989423751831055, "global_step": 228057, "epoch": 2747} {"train_loss": -24.559268951416016, "global_step": 228058, "epoch": 2747} {"train_loss": -24.638059616088867, "global_step": 228059, "epoch": 2747} {"train_loss": -25.216257095336914, "global_step": 228060, "epoch": 2747} {"train_loss": -24.55859375, "global_step": 228061, "epoch": 2747} {"train_loss": -24.781156539916992, "global_step": 228062, "epoch": 2747} {"train_loss": -24.736560821533203, "global_step": 228063, "epoch": 2747} {"train_loss": -25.00079345703125, "global_step": 228064, "epoch": 2747} {"train_loss": -24.78521156311035, "global_step": 228065, "epoch": 2747} {"train_loss": -24.718460083007812, "global_step": 228066, "epoch": 2747} {"train_loss": -24.571367263793945, "global_step": 228067, "epoch": 2747} {"train_loss": -25.15045738220215, "global_step": 228068, "epoch": 2747} {"train_loss": -24.80861473083496, "global_step": 228069, "epoch": 2747} {"train_loss": -24.608816146850586, "global_step": 228070, "epoch": 2747} {"train_loss": -23.991247177124023, "global_step": 228071, "epoch": 2747} {"train_loss": -22.838096618652344, "global_step": 228072, "epoch": 2747} {"train_loss": -24.326391220092773, "global_step": 228073, "epoch": 2747} {"train_loss": -24.677326202392578, "global_step": 228074, "epoch": 2747} {"train_loss": -24.264867782592773, "global_step": 228075, "epoch": 2747} {"train_loss": -24.10112190246582, "global_step": 228076, "epoch": 2747} {"train_loss": -24.578161239624023, "global_step": 228077, "epoch": 2747} {"train_loss": -24.34027671813965, "global_step": 228078, "epoch": 2747} {"train_loss": -24.22475242614746, "global_step": 228079, "epoch": 2747} {"train_loss": -24.571731567382812, "global_step": 228080, "epoch": 2747} {"train_loss": -24.468286514282227, "global_step": 228081, "epoch": 2747} {"train_loss": -24.55503273010254, "global_step": 228082, "epoch": 2747} {"train_loss": -24.513233184814453, "global_step": 228083, "epoch": 2747, "val_loss": 6811326.0} {"train_loss": -22.65470314025879, "global_step": 228084, "epoch": 2748} {"train_loss": -23.296926498413086, "global_step": 228085, "epoch": 2748} {"train_loss": -23.54659080505371, "global_step": 228086, "epoch": 2748} {"train_loss": -24.121740341186523, "global_step": 228087, "epoch": 2748} {"train_loss": -23.950546264648438, "global_step": 228088, "epoch": 2748} {"train_loss": -23.56080436706543, "global_step": 228089, "epoch": 2748} {"train_loss": -24.04054832458496, "global_step": 228090, "epoch": 2748} {"train_loss": -24.141067504882812, "global_step": 228091, "epoch": 2748} {"train_loss": -24.3651123046875, "global_step": 228092, "epoch": 2748} {"train_loss": -24.24027442932129, "global_step": 228093, "epoch": 2748} {"train_loss": -23.618940353393555, "global_step": 228094, "epoch": 2748} {"train_loss": -24.16047477722168, "global_step": 228095, "epoch": 2748} {"train_loss": -24.10161781311035, "global_step": 228096, "epoch": 2748} {"train_loss": -24.51416015625, "global_step": 228097, "epoch": 2748} {"train_loss": -24.546207427978516, "global_step": 228098, "epoch": 2748} {"train_loss": -24.292970657348633, "global_step": 228099, "epoch": 2748} {"train_loss": -24.211400985717773, "global_step": 228100, "epoch": 2748} {"train_loss": -24.38406753540039, "global_step": 228101, "epoch": 2748} {"train_loss": -24.621591567993164, "global_step": 228102, "epoch": 2748} {"train_loss": -23.998531341552734, "global_step": 228103, "epoch": 2748} {"train_loss": -24.377843856811523, "global_step": 228104, "epoch": 2748} {"train_loss": -24.126291275024414, "global_step": 228105, "epoch": 2748} {"train_loss": -24.540197372436523, "global_step": 228106, "epoch": 2748} {"train_loss": -24.94454002380371, "global_step": 228107, "epoch": 2748} {"train_loss": -24.385547637939453, "global_step": 228108, "epoch": 2748} {"train_loss": -24.8717098236084, "global_step": 228109, "epoch": 2748} {"train_loss": -24.721464157104492, "global_step": 228110, "epoch": 2748} {"train_loss": -24.57025146484375, "global_step": 228111, "epoch": 2748} {"train_loss": -24.48699378967285, "global_step": 228112, "epoch": 2748} {"train_loss": -24.743635177612305, "global_step": 228113, "epoch": 2748} {"train_loss": -25.17458152770996, "global_step": 228114, "epoch": 2748} {"train_loss": -24.950321197509766, "global_step": 228115, "epoch": 2748} {"train_loss": -24.485504150390625, "global_step": 228116, "epoch": 2748} {"train_loss": -24.409181594848633, "global_step": 228117, "epoch": 2748} {"train_loss": -24.49543571472168, "global_step": 228118, "epoch": 2748} {"train_loss": -25.096227645874023, "global_step": 228119, "epoch": 2748} {"train_loss": -24.556013107299805, "global_step": 228120, "epoch": 2748} {"train_loss": -24.61882781982422, "global_step": 228121, "epoch": 2748} {"train_loss": -24.956710815429688, "global_step": 228122, "epoch": 2748} {"train_loss": -24.746946334838867, "global_step": 228123, "epoch": 2748} {"train_loss": -24.683927536010742, "global_step": 228124, "epoch": 2748} {"train_loss": -24.721281051635742, "global_step": 228125, "epoch": 2748} {"train_loss": -24.856979370117188, "global_step": 228126, "epoch": 2748} {"train_loss": -24.47873306274414, "global_step": 228127, "epoch": 2748} {"train_loss": -24.81312370300293, "global_step": 228128, "epoch": 2748} {"train_loss": -24.894838333129883, "global_step": 228129, "epoch": 2748} {"train_loss": -24.805683135986328, "global_step": 228130, "epoch": 2748} {"train_loss": -24.91216468811035, "global_step": 228131, "epoch": 2748} {"train_loss": -24.96845054626465, "global_step": 228132, "epoch": 2748} {"train_loss": -25.041934967041016, "global_step": 228133, "epoch": 2748} {"train_loss": -24.676748275756836, "global_step": 228134, "epoch": 2748} {"train_loss": -24.562088012695312, "global_step": 228135, "epoch": 2748} {"train_loss": -25.062021255493164, "global_step": 228136, "epoch": 2748} {"train_loss": -24.992895126342773, "global_step": 228137, "epoch": 2748} {"train_loss": -25.135061264038086, "global_step": 228138, "epoch": 2748} {"train_loss": -24.762678146362305, "global_step": 228139, "epoch": 2748} {"train_loss": -24.750669479370117, "global_step": 228140, "epoch": 2748} {"train_loss": -24.779447555541992, "global_step": 228141, "epoch": 2748} {"train_loss": -24.81330680847168, "global_step": 228142, "epoch": 2748} {"train_loss": -24.8632755279541, "global_step": 228143, "epoch": 2748} {"train_loss": -24.493114471435547, "global_step": 228144, "epoch": 2748} {"train_loss": -24.764049530029297, "global_step": 228145, "epoch": 2748} {"train_loss": -25.026107788085938, "global_step": 228146, "epoch": 2748} {"train_loss": -24.798486709594727, "global_step": 228147, "epoch": 2748} {"train_loss": -24.54720115661621, "global_step": 228148, "epoch": 2748} {"train_loss": -24.258310317993164, "global_step": 228149, "epoch": 2748} {"train_loss": -24.46512222290039, "global_step": 228150, "epoch": 2748} {"train_loss": -24.7514591217041, "global_step": 228151, "epoch": 2748} {"train_loss": -24.50275230407715, "global_step": 228152, "epoch": 2748} {"train_loss": -24.961450576782227, "global_step": 228153, "epoch": 2748} {"train_loss": -24.812084197998047, "global_step": 228154, "epoch": 2748} {"train_loss": -24.59541130065918, "global_step": 228155, "epoch": 2748} {"train_loss": -24.617799758911133, "global_step": 228156, "epoch": 2748} {"train_loss": -24.231210708618164, "global_step": 228157, "epoch": 2748} {"train_loss": -24.658205032348633, "global_step": 228158, "epoch": 2748} {"train_loss": -24.54548454284668, "global_step": 228159, "epoch": 2748} {"train_loss": -24.258142471313477, "global_step": 228160, "epoch": 2748} {"train_loss": -25.080734252929688, "global_step": 228161, "epoch": 2748} {"train_loss": -24.714324951171875, "global_step": 228162, "epoch": 2748} {"train_loss": -24.576398849487305, "global_step": 228163, "epoch": 2748} {"train_loss": -24.5032901763916, "global_step": 228164, "epoch": 2748} {"train_loss": -24.1466121673584, "global_step": 228165, "epoch": 2748} {"train_loss": -24.523260047636835, "global_step": 228166, "epoch": 2748, "val_loss": 6644664.0} {"train_loss": -24.229589462280273, "global_step": 228167, "epoch": 2749} {"train_loss": -24.10320472717285, "global_step": 228168, "epoch": 2749} {"train_loss": -24.081287384033203, "global_step": 228169, "epoch": 2749} {"train_loss": -24.178007125854492, "global_step": 228170, "epoch": 2749} {"train_loss": -24.4902400970459, "global_step": 228171, "epoch": 2749} {"train_loss": -24.051061630249023, "global_step": 228172, "epoch": 2749} {"train_loss": -24.195520401000977, "global_step": 228173, "epoch": 2749} {"train_loss": -24.79487419128418, "global_step": 228174, "epoch": 2749} {"train_loss": -24.418737411499023, "global_step": 228175, "epoch": 2749} {"train_loss": -24.303590774536133, "global_step": 228176, "epoch": 2749} {"train_loss": -24.24129295349121, "global_step": 228177, "epoch": 2749} {"train_loss": -24.619009017944336, "global_step": 228178, "epoch": 2749} {"train_loss": -24.54183006286621, "global_step": 228179, "epoch": 2749} {"train_loss": -24.450366973876953, "global_step": 228180, "epoch": 2749} {"train_loss": -24.431367874145508, "global_step": 228181, "epoch": 2749} {"train_loss": -24.610427856445312, "global_step": 228182, "epoch": 2749} {"train_loss": -24.571096420288086, "global_step": 228183, "epoch": 2749} {"train_loss": -25.030628204345703, "global_step": 228184, "epoch": 2749} {"train_loss": -24.92233657836914, "global_step": 228185, "epoch": 2749} {"train_loss": -25.198963165283203, "global_step": 228186, "epoch": 2749} {"train_loss": -24.60862159729004, "global_step": 228187, "epoch": 2749} {"train_loss": -24.800657272338867, "global_step": 228188, "epoch": 2749} {"train_loss": -24.37117576599121, "global_step": 228189, "epoch": 2749} {"train_loss": -24.76717758178711, "global_step": 228190, "epoch": 2749} {"train_loss": -24.869178771972656, "global_step": 228191, "epoch": 2749} {"train_loss": -24.745664596557617, "global_step": 228192, "epoch": 2749} {"train_loss": -24.485280990600586, "global_step": 228193, "epoch": 2749} {"train_loss": -24.719560623168945, "global_step": 228194, "epoch": 2749} {"train_loss": -24.71042251586914, "global_step": 228195, "epoch": 2749} {"train_loss": -24.602582931518555, "global_step": 228196, "epoch": 2749} {"train_loss": -24.841861724853516, "global_step": 228197, "epoch": 2749} {"train_loss": -24.937467575073242, "global_step": 228198, "epoch": 2749} {"train_loss": -24.255496978759766, "global_step": 228199, "epoch": 2749} {"train_loss": -25.227460861206055, "global_step": 228200, "epoch": 2749} {"train_loss": -24.57465171813965, "global_step": 228201, "epoch": 2749} {"train_loss": -24.539480209350586, "global_step": 228202, "epoch": 2749} {"train_loss": -24.77573585510254, "global_step": 228203, "epoch": 2749} {"train_loss": -24.817474365234375, "global_step": 228204, "epoch": 2749} {"train_loss": -24.689878463745117, "global_step": 228205, "epoch": 2749} {"train_loss": -24.757368087768555, "global_step": 228206, "epoch": 2749} {"train_loss": -24.878707885742188, "global_step": 228207, "epoch": 2749} {"train_loss": -24.765304565429688, "global_step": 228208, "epoch": 2749} {"train_loss": -24.9166316986084, "global_step": 228209, "epoch": 2749} {"train_loss": -24.727096557617188, "global_step": 228210, "epoch": 2749} {"train_loss": -24.727033615112305, "global_step": 228211, "epoch": 2749} {"train_loss": -24.870121002197266, "global_step": 228212, "epoch": 2749} {"train_loss": -24.694944381713867, "global_step": 228213, "epoch": 2749} {"train_loss": -24.3906307220459, "global_step": 228214, "epoch": 2749} {"train_loss": -24.0380916595459, "global_step": 228215, "epoch": 2749} {"train_loss": -24.316959381103516, "global_step": 228216, "epoch": 2749} {"train_loss": -24.970630645751953, "global_step": 228217, "epoch": 2749} {"train_loss": -24.492374420166016, "global_step": 228218, "epoch": 2749} {"train_loss": -25.094524383544922, "global_step": 228219, "epoch": 2749} {"train_loss": -24.2542781829834, "global_step": 228220, "epoch": 2749} {"train_loss": -24.5463809967041, "global_step": 228221, "epoch": 2749} {"train_loss": -24.64734649658203, "global_step": 228222, "epoch": 2749} {"train_loss": -24.588947296142578, "global_step": 228223, "epoch": 2749} {"train_loss": -24.293216705322266, "global_step": 228224, "epoch": 2749} {"train_loss": -24.96903419494629, "global_step": 228225, "epoch": 2749} {"train_loss": -24.548730850219727, "global_step": 228226, "epoch": 2749} {"train_loss": -24.44464874267578, "global_step": 228227, "epoch": 2749} {"train_loss": -24.672117233276367, "global_step": 228228, "epoch": 2749} {"train_loss": -24.390073776245117, "global_step": 228229, "epoch": 2749} {"train_loss": -24.208499908447266, "global_step": 228230, "epoch": 2749} {"train_loss": -24.72267723083496, "global_step": 228231, "epoch": 2749} {"train_loss": -24.687721252441406, "global_step": 228232, "epoch": 2749} {"train_loss": -24.800405502319336, "global_step": 228233, "epoch": 2749} {"train_loss": -25.0401554107666, "global_step": 228234, "epoch": 2749} {"train_loss": -24.691953659057617, "global_step": 228235, "epoch": 2749} {"train_loss": -24.89333152770996, "global_step": 228236, "epoch": 2749} {"train_loss": -24.706287384033203, "global_step": 228237, "epoch": 2749} {"train_loss": -24.767133712768555, "global_step": 228238, "epoch": 2749} {"train_loss": -25.08102035522461, "global_step": 228239, "epoch": 2749} {"train_loss": -24.9426326751709, "global_step": 228240, "epoch": 2749} {"train_loss": -24.978164672851562, "global_step": 228241, "epoch": 2749} {"train_loss": -24.643524169921875, "global_step": 228242, "epoch": 2749} {"train_loss": -24.99775505065918, "global_step": 228243, "epoch": 2749} {"train_loss": -24.824594497680664, "global_step": 228244, "epoch": 2749} {"train_loss": -24.734941482543945, "global_step": 228245, "epoch": 2749} {"train_loss": -24.728836059570312, "global_step": 228246, "epoch": 2749} {"train_loss": -24.654333114624023, "global_step": 228247, "epoch": 2749} {"train_loss": -24.95417594909668, "global_step": 228248, "epoch": 2749} {"train_loss": -24.645711623042462, "global_step": 228249, "epoch": 2749, "val_loss": 6818034.0} {"train_loss": -23.920392990112305, "global_step": 228250, "epoch": 2750} {"train_loss": -24.192304611206055, "global_step": 228251, "epoch": 2750} {"train_loss": -24.194704055786133, "global_step": 228252, "epoch": 2750} {"train_loss": -24.580175399780273, "global_step": 228253, "epoch": 2750} {"train_loss": -24.36640739440918, "global_step": 228254, "epoch": 2750} {"train_loss": -24.00018882751465, "global_step": 228255, "epoch": 2750} {"train_loss": -24.281240463256836, "global_step": 228256, "epoch": 2750} {"train_loss": -24.67479133605957, "global_step": 228257, "epoch": 2750} {"train_loss": -24.22165298461914, "global_step": 228258, "epoch": 2750} {"train_loss": -24.762939453125, "global_step": 228259, "epoch": 2750} {"train_loss": -24.242286682128906, "global_step": 228260, "epoch": 2750} {"train_loss": -24.807292938232422, "global_step": 228261, "epoch": 2750} {"train_loss": -24.67531394958496, "global_step": 228262, "epoch": 2750} {"train_loss": -24.288166046142578, "global_step": 228263, "epoch": 2750} {"train_loss": -24.61651611328125, "global_step": 228264, "epoch": 2750} {"train_loss": -24.572778701782227, "global_step": 228265, "epoch": 2750} {"train_loss": -24.7119140625, "global_step": 228266, "epoch": 2750} {"train_loss": -24.796850204467773, "global_step": 228267, "epoch": 2750} {"train_loss": -24.506872177124023, "global_step": 228268, "epoch": 2750} {"train_loss": -24.944997787475586, "global_step": 228269, "epoch": 2750} {"train_loss": -24.82234764099121, "global_step": 228270, "epoch": 2750} {"train_loss": -24.932579040527344, "global_step": 228271, "epoch": 2750} {"train_loss": -24.607593536376953, "global_step": 228272, "epoch": 2750} {"train_loss": -24.981796264648438, "global_step": 228273, "epoch": 2750} {"train_loss": -24.971708297729492, "global_step": 228274, "epoch": 2750} {"train_loss": -24.36865234375, "global_step": 228275, "epoch": 2750} {"train_loss": -24.802236557006836, "global_step": 228276, "epoch": 2750} {"train_loss": -24.550968170166016, "global_step": 228277, "epoch": 2750} {"train_loss": -24.719188690185547, "global_step": 228278, "epoch": 2750} {"train_loss": -24.910079956054688, "global_step": 228279, "epoch": 2750} {"train_loss": -24.962491989135742, "global_step": 228280, "epoch": 2750} {"train_loss": -24.773283004760742, "global_step": 228281, "epoch": 2750} {"train_loss": -24.76431655883789, "global_step": 228282, "epoch": 2750} {"train_loss": -24.6123046875, "global_step": 228283, "epoch": 2750} {"train_loss": -24.559616088867188, "global_step": 228284, "epoch": 2750} {"train_loss": -24.495620727539062, "global_step": 228285, "epoch": 2750} {"train_loss": -24.614486694335938, "global_step": 228286, "epoch": 2750} {"train_loss": -24.83119773864746, "global_step": 228287, "epoch": 2750} {"train_loss": -24.779813766479492, "global_step": 228288, "epoch": 2750} {"train_loss": -24.740156173706055, "global_step": 228289, "epoch": 2750} {"train_loss": -24.716176986694336, "global_step": 228290, "epoch": 2750} {"train_loss": -24.727617263793945, "global_step": 228291, "epoch": 2750} {"train_loss": -24.667417526245117, "global_step": 228292, "epoch": 2750} {"train_loss": -24.5372314453125, "global_step": 228293, "epoch": 2750} {"train_loss": -25.203706741333008, "global_step": 228294, "epoch": 2750} {"train_loss": -24.286216735839844, "global_step": 228295, "epoch": 2750} {"train_loss": -24.20220947265625, "global_step": 228296, "epoch": 2750} {"train_loss": -24.796070098876953, "global_step": 228297, "epoch": 2750} {"train_loss": -24.49294662475586, "global_step": 228298, "epoch": 2750} {"train_loss": -24.76338768005371, "global_step": 228299, "epoch": 2750} {"train_loss": -24.761228561401367, "global_step": 228300, "epoch": 2750} {"train_loss": -24.612300872802734, "global_step": 228301, "epoch": 2750} {"train_loss": -24.558368682861328, "global_step": 228302, "epoch": 2750} {"train_loss": -24.392309188842773, "global_step": 228303, "epoch": 2750} {"train_loss": -24.694278717041016, "global_step": 228304, "epoch": 2750} {"train_loss": -24.473995208740234, "global_step": 228305, "epoch": 2750} {"train_loss": -24.959461212158203, "global_step": 228306, "epoch": 2750} {"train_loss": -24.35908317565918, "global_step": 228307, "epoch": 2750} {"train_loss": -24.68697738647461, "global_step": 228308, "epoch": 2750} {"train_loss": -24.728641510009766, "global_step": 228309, "epoch": 2750} {"train_loss": -24.475521087646484, "global_step": 228310, "epoch": 2750} {"train_loss": -24.6311092376709, "global_step": 228311, "epoch": 2750} {"train_loss": -24.95966148376465, "global_step": 228312, "epoch": 2750} {"train_loss": -24.614660263061523, "global_step": 228313, "epoch": 2750} {"train_loss": -24.547231674194336, "global_step": 228314, "epoch": 2750} {"train_loss": -24.87334632873535, "global_step": 228315, "epoch": 2750} {"train_loss": -24.733991622924805, "global_step": 228316, "epoch": 2750} {"train_loss": -24.48915672302246, "global_step": 228317, "epoch": 2750} {"train_loss": -24.46441650390625, "global_step": 228318, "epoch": 2750} {"train_loss": -24.609012603759766, "global_step": 228319, "epoch": 2750} {"train_loss": -24.453968048095703, "global_step": 228320, "epoch": 2750} {"train_loss": -24.552223205566406, "global_step": 228321, "epoch": 2750} {"train_loss": -24.560577392578125, "global_step": 228322, "epoch": 2750} {"train_loss": -24.40864372253418, "global_step": 228323, "epoch": 2750} {"train_loss": -24.83534049987793, "global_step": 228324, "epoch": 2750} {"train_loss": -24.69873046875, "global_step": 228325, "epoch": 2750} {"train_loss": -24.453256607055664, "global_step": 228326, "epoch": 2750} {"train_loss": -24.720746994018555, "global_step": 228327, "epoch": 2750} {"train_loss": -24.5638484954834, "global_step": 228328, "epoch": 2750} {"train_loss": -24.687101364135742, "global_step": 228329, "epoch": 2750} {"train_loss": -24.93155860900879, "global_step": 228330, "epoch": 2750} {"train_loss": -24.52202606201172, "global_step": 228331, "epoch": 2750} {"train_loss": -24.630862454333936, "global_step": 228332, "epoch": 2750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6667839.5} {"train_loss": -24.39902114868164, "global_step": 228333, "epoch": 2751} {"train_loss": -24.278860092163086, "global_step": 228334, "epoch": 2751} {"train_loss": -24.719558715820312, "global_step": 228335, "epoch": 2751} {"train_loss": -24.401357650756836, "global_step": 228336, "epoch": 2751} {"train_loss": -24.459543228149414, "global_step": 228337, "epoch": 2751} {"train_loss": -24.612512588500977, "global_step": 228338, "epoch": 2751} {"train_loss": -24.618160247802734, "global_step": 228339, "epoch": 2751} {"train_loss": -24.684720993041992, "global_step": 228340, "epoch": 2751} {"train_loss": -24.445148468017578, "global_step": 228341, "epoch": 2751} {"train_loss": -24.333776473999023, "global_step": 228342, "epoch": 2751} {"train_loss": -24.89093589782715, "global_step": 228343, "epoch": 2751} {"train_loss": -24.848928451538086, "global_step": 228344, "epoch": 2751} {"train_loss": -24.717092514038086, "global_step": 228345, "epoch": 2751} {"train_loss": -24.939626693725586, "global_step": 228346, "epoch": 2751} {"train_loss": -24.580617904663086, "global_step": 228347, "epoch": 2751} {"train_loss": -24.67188835144043, "global_step": 228348, "epoch": 2751} {"train_loss": -24.80359649658203, "global_step": 228349, "epoch": 2751} {"train_loss": -25.016128540039062, "global_step": 228350, "epoch": 2751} {"train_loss": -24.506099700927734, "global_step": 228351, "epoch": 2751} {"train_loss": -24.549219131469727, "global_step": 228352, "epoch": 2751} {"train_loss": -24.66859245300293, "global_step": 228353, "epoch": 2751} {"train_loss": -24.87965965270996, "global_step": 228354, "epoch": 2751} {"train_loss": -24.47484588623047, "global_step": 228355, "epoch": 2751} {"train_loss": -25.16696548461914, "global_step": 228356, "epoch": 2751} {"train_loss": -24.762222290039062, "global_step": 228357, "epoch": 2751} {"train_loss": -24.63802146911621, "global_step": 228358, "epoch": 2751} {"train_loss": -25.061769485473633, "global_step": 228359, "epoch": 2751} {"train_loss": -24.751598358154297, "global_step": 228360, "epoch": 2751} {"train_loss": -24.94607925415039, "global_step": 228361, "epoch": 2751} {"train_loss": -24.699533462524414, "global_step": 228362, "epoch": 2751} {"train_loss": -25.351543426513672, "global_step": 228363, "epoch": 2751} {"train_loss": -24.929906845092773, "global_step": 228364, "epoch": 2751} {"train_loss": -25.21587562561035, "global_step": 228365, "epoch": 2751} {"train_loss": -24.852558135986328, "global_step": 228366, "epoch": 2751} {"train_loss": -24.68949317932129, "global_step": 228367, "epoch": 2751} {"train_loss": -24.701953887939453, "global_step": 228368, "epoch": 2751} {"train_loss": -24.50062370300293, "global_step": 228369, "epoch": 2751} {"train_loss": -24.547590255737305, "global_step": 228370, "epoch": 2751} {"train_loss": -24.88435173034668, "global_step": 228371, "epoch": 2751} {"train_loss": -24.859342575073242, "global_step": 228372, "epoch": 2751} {"train_loss": -24.89920997619629, "global_step": 228373, "epoch": 2751} {"train_loss": -24.912649154663086, "global_step": 228374, "epoch": 2751} {"train_loss": -24.724903106689453, "global_step": 228375, "epoch": 2751} {"train_loss": -24.67093849182129, "global_step": 228376, "epoch": 2751} {"train_loss": -24.75966453552246, "global_step": 228377, "epoch": 2751} {"train_loss": -24.67292022705078, "global_step": 228378, "epoch": 2751} {"train_loss": -24.8155517578125, "global_step": 228379, "epoch": 2751} {"train_loss": -24.525741577148438, "global_step": 228380, "epoch": 2751} {"train_loss": -24.64731788635254, "global_step": 228381, "epoch": 2751} {"train_loss": -24.67647361755371, "global_step": 228382, "epoch": 2751} {"train_loss": -23.922435760498047, "global_step": 228383, "epoch": 2751} {"train_loss": -22.455303192138672, "global_step": 228384, "epoch": 2751} {"train_loss": -22.8831844329834, "global_step": 228385, "epoch": 2751} {"train_loss": -24.15813636779785, "global_step": 228386, "epoch": 2751} {"train_loss": -24.073684692382812, "global_step": 228387, "epoch": 2751} {"train_loss": -23.9353084564209, "global_step": 228388, "epoch": 2751} {"train_loss": -24.486677169799805, "global_step": 228389, "epoch": 2751} {"train_loss": -24.56526756286621, "global_step": 228390, "epoch": 2751} {"train_loss": -24.1949462890625, "global_step": 228391, "epoch": 2751} {"train_loss": -24.08965301513672, "global_step": 228392, "epoch": 2751} {"train_loss": -24.880422592163086, "global_step": 228393, "epoch": 2751} {"train_loss": -24.5280704498291, "global_step": 228394, "epoch": 2751} {"train_loss": -24.589414596557617, "global_step": 228395, "epoch": 2751} {"train_loss": -24.549938201904297, "global_step": 228396, "epoch": 2751} {"train_loss": -24.56690788269043, "global_step": 228397, "epoch": 2751} {"train_loss": -24.34623146057129, "global_step": 228398, "epoch": 2751} {"train_loss": -24.189123153686523, "global_step": 228399, "epoch": 2751} {"train_loss": -24.613473892211914, "global_step": 228400, "epoch": 2751} {"train_loss": -24.49797248840332, "global_step": 228401, "epoch": 2751} {"train_loss": -24.5385799407959, "global_step": 228402, "epoch": 2751} {"train_loss": -24.419376373291016, "global_step": 228403, "epoch": 2751} {"train_loss": -24.15532875061035, "global_step": 228404, "epoch": 2751} {"train_loss": -24.789098739624023, "global_step": 228405, "epoch": 2751} {"train_loss": -24.75124168395996, "global_step": 228406, "epoch": 2751} {"train_loss": -24.388660430908203, "global_step": 228407, "epoch": 2751} {"train_loss": -25.108564376831055, "global_step": 228408, "epoch": 2751} {"train_loss": -24.429834365844727, "global_step": 228409, "epoch": 2751} {"train_loss": -24.21515655517578, "global_step": 228410, "epoch": 2751} {"train_loss": -24.688709259033203, "global_step": 228411, "epoch": 2751} {"train_loss": -24.947813034057617, "global_step": 228412, "epoch": 2751} {"train_loss": -24.743711471557617, "global_step": 228413, "epoch": 2751} {"train_loss": -24.276594161987305, "global_step": 228414, "epoch": 2751} {"train_loss": -24.55944410576878, "global_step": 228415, "epoch": 2751, "val_loss": 6930945.0} {"train_loss": -24.371185302734375, "global_step": 228416, "epoch": 2752} {"train_loss": -24.208301544189453, "global_step": 228417, "epoch": 2752} {"train_loss": -24.80974006652832, "global_step": 228418, "epoch": 2752} {"train_loss": -24.34450340270996, "global_step": 228419, "epoch": 2752} {"train_loss": -24.41119956970215, "global_step": 228420, "epoch": 2752} {"train_loss": -24.485807418823242, "global_step": 228421, "epoch": 2752} {"train_loss": -24.66206932067871, "global_step": 228422, "epoch": 2752} {"train_loss": -24.85011863708496, "global_step": 228423, "epoch": 2752} {"train_loss": -24.52219581604004, "global_step": 228424, "epoch": 2752} {"train_loss": -24.80458641052246, "global_step": 228425, "epoch": 2752} {"train_loss": -24.580442428588867, "global_step": 228426, "epoch": 2752} {"train_loss": -24.742704391479492, "global_step": 228427, "epoch": 2752} {"train_loss": -24.482467651367188, "global_step": 228428, "epoch": 2752} {"train_loss": -24.71626853942871, "global_step": 228429, "epoch": 2752} {"train_loss": -24.805631637573242, "global_step": 228430, "epoch": 2752} {"train_loss": -24.897464752197266, "global_step": 228431, "epoch": 2752} {"train_loss": -25.06496238708496, "global_step": 228432, "epoch": 2752} {"train_loss": -24.680850982666016, "global_step": 228433, "epoch": 2752} {"train_loss": -24.543737411499023, "global_step": 228434, "epoch": 2752} {"train_loss": -24.91773223876953, "global_step": 228435, "epoch": 2752} {"train_loss": -24.804243087768555, "global_step": 228436, "epoch": 2752} {"train_loss": -25.02659797668457, "global_step": 228437, "epoch": 2752} {"train_loss": -24.679096221923828, "global_step": 228438, "epoch": 2752} {"train_loss": -24.906585693359375, "global_step": 228439, "epoch": 2752} {"train_loss": -24.746414184570312, "global_step": 228440, "epoch": 2752} {"train_loss": -25.043256759643555, "global_step": 228441, "epoch": 2752} {"train_loss": -24.795164108276367, "global_step": 228442, "epoch": 2752} {"train_loss": -24.431615829467773, "global_step": 228443, "epoch": 2752} {"train_loss": -24.726301193237305, "global_step": 228444, "epoch": 2752} {"train_loss": -24.58296775817871, "global_step": 228445, "epoch": 2752} {"train_loss": -24.89141845703125, "global_step": 228446, "epoch": 2752} {"train_loss": -24.48957633972168, "global_step": 228447, "epoch": 2752} {"train_loss": -24.739765167236328, "global_step": 228448, "epoch": 2752} {"train_loss": -24.626047134399414, "global_step": 228449, "epoch": 2752} {"train_loss": -24.917598724365234, "global_step": 228450, "epoch": 2752} {"train_loss": -24.761144638061523, "global_step": 228451, "epoch": 2752} {"train_loss": -25.06564712524414, "global_step": 228452, "epoch": 2752} {"train_loss": -24.96549415588379, "global_step": 228453, "epoch": 2752} {"train_loss": -24.764982223510742, "global_step": 228454, "epoch": 2752} {"train_loss": -24.812429428100586, "global_step": 228455, "epoch": 2752} {"train_loss": -24.576400756835938, "global_step": 228456, "epoch": 2752} {"train_loss": -24.46358871459961, "global_step": 228457, "epoch": 2752} {"train_loss": -24.758209228515625, "global_step": 228458, "epoch": 2752} {"train_loss": -24.471925735473633, "global_step": 228459, "epoch": 2752} {"train_loss": -24.434598922729492, "global_step": 228460, "epoch": 2752} {"train_loss": -24.332965850830078, "global_step": 228461, "epoch": 2752} {"train_loss": -24.8062686920166, "global_step": 228462, "epoch": 2752} {"train_loss": -24.396347045898438, "global_step": 228463, "epoch": 2752} {"train_loss": -24.38675880432129, "global_step": 228464, "epoch": 2752} {"train_loss": -24.68738555908203, "global_step": 228465, "epoch": 2752} {"train_loss": -24.571989059448242, "global_step": 228466, "epoch": 2752} {"train_loss": -25.00778579711914, "global_step": 228467, "epoch": 2752} {"train_loss": -24.608367919921875, "global_step": 228468, "epoch": 2752} {"train_loss": -24.949417114257812, "global_step": 228469, "epoch": 2752} {"train_loss": -24.854703903198242, "global_step": 228470, "epoch": 2752} {"train_loss": -24.427173614501953, "global_step": 228471, "epoch": 2752} {"train_loss": -24.510343551635742, "global_step": 228472, "epoch": 2752} {"train_loss": -24.902326583862305, "global_step": 228473, "epoch": 2752} {"train_loss": -24.722501754760742, "global_step": 228474, "epoch": 2752} {"train_loss": -24.37523078918457, "global_step": 228475, "epoch": 2752} {"train_loss": -24.4802188873291, "global_step": 228476, "epoch": 2752} {"train_loss": -24.82063865661621, "global_step": 228477, "epoch": 2752} {"train_loss": -24.41689109802246, "global_step": 228478, "epoch": 2752} {"train_loss": -24.29521942138672, "global_step": 228479, "epoch": 2752} {"train_loss": -24.289199829101562, "global_step": 228480, "epoch": 2752} {"train_loss": -24.4947566986084, "global_step": 228481, "epoch": 2752} {"train_loss": -24.82593536376953, "global_step": 228482, "epoch": 2752} {"train_loss": -24.59882164001465, "global_step": 228483, "epoch": 2752} {"train_loss": -24.865447998046875, "global_step": 228484, "epoch": 2752} {"train_loss": -24.55263328552246, "global_step": 228485, "epoch": 2752} {"train_loss": -24.99502182006836, "global_step": 228486, "epoch": 2752} {"train_loss": -24.688568115234375, "global_step": 228487, "epoch": 2752} {"train_loss": -24.644254684448242, "global_step": 228488, "epoch": 2752} {"train_loss": -24.902563095092773, "global_step": 228489, "epoch": 2752} {"train_loss": -24.72572135925293, "global_step": 228490, "epoch": 2752} {"train_loss": -24.837749481201172, "global_step": 228491, "epoch": 2752} {"train_loss": -25.027090072631836, "global_step": 228492, "epoch": 2752} {"train_loss": -24.733993530273438, "global_step": 228493, "epoch": 2752} {"train_loss": -24.729440689086914, "global_step": 228494, "epoch": 2752} {"train_loss": -25.222280502319336, "global_step": 228495, "epoch": 2752} {"train_loss": -24.815792083740234, "global_step": 228496, "epoch": 2752} {"train_loss": -24.73512077331543, "global_step": 228497, "epoch": 2752} {"train_loss": -24.69973722710667, "global_step": 228498, "epoch": 2752, "val_loss": 6709597.0} {"train_loss": -23.872976303100586, "global_step": 228499, "epoch": 2753} {"train_loss": -24.19364356994629, "global_step": 228500, "epoch": 2753} {"train_loss": -24.836467742919922, "global_step": 228501, "epoch": 2753} {"train_loss": -24.10995864868164, "global_step": 228502, "epoch": 2753} {"train_loss": -24.009098052978516, "global_step": 228503, "epoch": 2753} {"train_loss": -24.26287078857422, "global_step": 228504, "epoch": 2753} {"train_loss": -24.38624382019043, "global_step": 228505, "epoch": 2753} {"train_loss": -24.338184356689453, "global_step": 228506, "epoch": 2753} {"train_loss": -23.711956024169922, "global_step": 228507, "epoch": 2753} {"train_loss": -23.89531707763672, "global_step": 228508, "epoch": 2753} {"train_loss": -24.85940933227539, "global_step": 228509, "epoch": 2753} {"train_loss": -24.260635375976562, "global_step": 228510, "epoch": 2753} {"train_loss": -24.475086212158203, "global_step": 228511, "epoch": 2753} {"train_loss": -24.099916458129883, "global_step": 228512, "epoch": 2753} {"train_loss": -24.432266235351562, "global_step": 228513, "epoch": 2753} {"train_loss": -24.257232666015625, "global_step": 228514, "epoch": 2753} {"train_loss": -24.254030227661133, "global_step": 228515, "epoch": 2753} {"train_loss": -24.305335998535156, "global_step": 228516, "epoch": 2753} {"train_loss": -24.81014060974121, "global_step": 228517, "epoch": 2753} {"train_loss": -24.532438278198242, "global_step": 228518, "epoch": 2753} {"train_loss": -24.721832275390625, "global_step": 228519, "epoch": 2753} {"train_loss": -24.9201602935791, "global_step": 228520, "epoch": 2753} {"train_loss": -24.303577423095703, "global_step": 228521, "epoch": 2753} {"train_loss": -24.557138442993164, "global_step": 228522, "epoch": 2753} {"train_loss": -24.615530014038086, "global_step": 228523, "epoch": 2753} {"train_loss": -24.696426391601562, "global_step": 228524, "epoch": 2753} {"train_loss": -24.64422607421875, "global_step": 228525, "epoch": 2753} {"train_loss": -24.801021575927734, "global_step": 228526, "epoch": 2753} {"train_loss": -24.613584518432617, "global_step": 228527, "epoch": 2753} {"train_loss": -24.976455688476562, "global_step": 228528, "epoch": 2753} {"train_loss": -24.670995712280273, "global_step": 228529, "epoch": 2753} {"train_loss": -24.672414779663086, "global_step": 228530, "epoch": 2753} {"train_loss": -24.93147850036621, "global_step": 228531, "epoch": 2753} {"train_loss": -24.9501953125, "global_step": 228532, "epoch": 2753} {"train_loss": -24.94485855102539, "global_step": 228533, "epoch": 2753} {"train_loss": -24.92522621154785, "global_step": 228534, "epoch": 2753} {"train_loss": -24.804296493530273, "global_step": 228535, "epoch": 2753} {"train_loss": -25.0042781829834, "global_step": 228536, "epoch": 2753} {"train_loss": -24.90396499633789, "global_step": 228537, "epoch": 2753} {"train_loss": -24.92646598815918, "global_step": 228538, "epoch": 2753} {"train_loss": -25.266040802001953, "global_step": 228539, "epoch": 2753} {"train_loss": -24.700946807861328, "global_step": 228540, "epoch": 2753} {"train_loss": -24.527162551879883, "global_step": 228541, "epoch": 2753} {"train_loss": -24.952068328857422, "global_step": 228542, "epoch": 2753} {"train_loss": -24.77350616455078, "global_step": 228543, "epoch": 2753} {"train_loss": -24.84202003479004, "global_step": 228544, "epoch": 2753} {"train_loss": -24.994779586791992, "global_step": 228545, "epoch": 2753} {"train_loss": -24.375335693359375, "global_step": 228546, "epoch": 2753} {"train_loss": -24.512836456298828, "global_step": 228547, "epoch": 2753} {"train_loss": -24.488821029663086, "global_step": 228548, "epoch": 2753} {"train_loss": -24.528573989868164, "global_step": 228549, "epoch": 2753} {"train_loss": -25.050344467163086, "global_step": 228550, "epoch": 2753} {"train_loss": -24.929536819458008, "global_step": 228551, "epoch": 2753} {"train_loss": -24.779630661010742, "global_step": 228552, "epoch": 2753} {"train_loss": -25.06122398376465, "global_step": 228553, "epoch": 2753} {"train_loss": -25.012954711914062, "global_step": 228554, "epoch": 2753} {"train_loss": -25.150821685791016, "global_step": 228555, "epoch": 2753} {"train_loss": -24.754560470581055, "global_step": 228556, "epoch": 2753} {"train_loss": -24.85273551940918, "global_step": 228557, "epoch": 2753} {"train_loss": -24.651859283447266, "global_step": 228558, "epoch": 2753} {"train_loss": -24.817211151123047, "global_step": 228559, "epoch": 2753} {"train_loss": -25.01468276977539, "global_step": 228560, "epoch": 2753} {"train_loss": -24.756460189819336, "global_step": 228561, "epoch": 2753} {"train_loss": -24.70930290222168, "global_step": 228562, "epoch": 2753} {"train_loss": -24.378311157226562, "global_step": 228563, "epoch": 2753} {"train_loss": -24.59699058532715, "global_step": 228564, "epoch": 2753} {"train_loss": -25.121557235717773, "global_step": 228565, "epoch": 2753} {"train_loss": -24.714353561401367, "global_step": 228566, "epoch": 2753} {"train_loss": -24.4548282623291, "global_step": 228567, "epoch": 2753} {"train_loss": -24.503110885620117, "global_step": 228568, "epoch": 2753} {"train_loss": -25.06023597717285, "global_step": 228569, "epoch": 2753} {"train_loss": -24.803014755249023, "global_step": 228570, "epoch": 2753} {"train_loss": -24.859636306762695, "global_step": 228571, "epoch": 2753} {"train_loss": -24.7287654876709, "global_step": 228572, "epoch": 2753} {"train_loss": -24.75685691833496, "global_step": 228573, "epoch": 2753} {"train_loss": -24.841716766357422, "global_step": 228574, "epoch": 2753} {"train_loss": -24.68537139892578, "global_step": 228575, "epoch": 2753} {"train_loss": -24.786596298217773, "global_step": 228576, "epoch": 2753} {"train_loss": -24.817228317260742, "global_step": 228577, "epoch": 2753} {"train_loss": -24.65766716003418, "global_step": 228578, "epoch": 2753} {"train_loss": -24.759939193725586, "global_step": 228579, "epoch": 2753} {"train_loss": -24.68219566345215, "global_step": 228580, "epoch": 2753} {"train_loss": -24.678958984742682, "global_step": 228581, "epoch": 2753, "val_loss": 6643675.0} {"train_loss": -24.36003875732422, "global_step": 228582, "epoch": 2754} {"train_loss": -24.366352081298828, "global_step": 228583, "epoch": 2754} {"train_loss": -24.698719024658203, "global_step": 228584, "epoch": 2754} {"train_loss": -24.11866569519043, "global_step": 228585, "epoch": 2754} {"train_loss": -24.615703582763672, "global_step": 228586, "epoch": 2754} {"train_loss": -24.572114944458008, "global_step": 228587, "epoch": 2754} {"train_loss": -24.840560913085938, "global_step": 228588, "epoch": 2754} {"train_loss": -24.417348861694336, "global_step": 228589, "epoch": 2754} {"train_loss": -24.360620498657227, "global_step": 228590, "epoch": 2754} {"train_loss": -24.685766220092773, "global_step": 228591, "epoch": 2754} {"train_loss": -24.45348358154297, "global_step": 228592, "epoch": 2754} {"train_loss": -24.46333122253418, "global_step": 228593, "epoch": 2754} {"train_loss": -24.665098190307617, "global_step": 228594, "epoch": 2754} {"train_loss": -24.722625732421875, "global_step": 228595, "epoch": 2754} {"train_loss": -24.35707664489746, "global_step": 228596, "epoch": 2754} {"train_loss": -24.550535202026367, "global_step": 228597, "epoch": 2754} {"train_loss": -24.694677352905273, "global_step": 228598, "epoch": 2754} {"train_loss": -25.02264976501465, "global_step": 228599, "epoch": 2754} {"train_loss": -24.49677085876465, "global_step": 228600, "epoch": 2754} {"train_loss": -25.00214958190918, "global_step": 228601, "epoch": 2754} {"train_loss": -24.694467544555664, "global_step": 228602, "epoch": 2754} {"train_loss": -24.687376022338867, "global_step": 228603, "epoch": 2754} {"train_loss": -24.304655075073242, "global_step": 228604, "epoch": 2754} {"train_loss": -24.756935119628906, "global_step": 228605, "epoch": 2754} {"train_loss": -24.64659309387207, "global_step": 228606, "epoch": 2754} {"train_loss": -24.963245391845703, "global_step": 228607, "epoch": 2754} {"train_loss": -24.888093948364258, "global_step": 228608, "epoch": 2754} {"train_loss": -24.663135528564453, "global_step": 228609, "epoch": 2754} {"train_loss": -24.758493423461914, "global_step": 228610, "epoch": 2754} {"train_loss": -24.690515518188477, "global_step": 228611, "epoch": 2754} {"train_loss": -24.692325592041016, "global_step": 228612, "epoch": 2754} {"train_loss": -24.776575088500977, "global_step": 228613, "epoch": 2754} {"train_loss": -24.778120040893555, "global_step": 228614, "epoch": 2754} {"train_loss": -24.611360549926758, "global_step": 228615, "epoch": 2754} {"train_loss": -24.622360229492188, "global_step": 228616, "epoch": 2754} {"train_loss": -24.281774520874023, "global_step": 228617, "epoch": 2754} {"train_loss": -25.138504028320312, "global_step": 228618, "epoch": 2754} {"train_loss": -25.096426010131836, "global_step": 228619, "epoch": 2754} {"train_loss": -25.247676849365234, "global_step": 228620, "epoch": 2754} {"train_loss": -24.991182327270508, "global_step": 228621, "epoch": 2754} {"train_loss": -24.378881454467773, "global_step": 228622, "epoch": 2754} {"train_loss": -24.897146224975586, "global_step": 228623, "epoch": 2754} {"train_loss": -24.835134506225586, "global_step": 228624, "epoch": 2754} {"train_loss": -24.486743927001953, "global_step": 228625, "epoch": 2754} {"train_loss": -25.034015655517578, "global_step": 228626, "epoch": 2754} {"train_loss": -24.66625213623047, "global_step": 228627, "epoch": 2754} {"train_loss": -24.583826065063477, "global_step": 228628, "epoch": 2754} {"train_loss": -24.410999298095703, "global_step": 228629, "epoch": 2754} {"train_loss": -24.450056076049805, "global_step": 228630, "epoch": 2754} {"train_loss": -24.604589462280273, "global_step": 228631, "epoch": 2754} {"train_loss": -24.87554359436035, "global_step": 228632, "epoch": 2754} {"train_loss": -24.57868766784668, "global_step": 228633, "epoch": 2754} {"train_loss": -24.911230087280273, "global_step": 228634, "epoch": 2754} {"train_loss": -24.15154457092285, "global_step": 228635, "epoch": 2754} {"train_loss": -24.659868240356445, "global_step": 228636, "epoch": 2754} {"train_loss": -24.915298461914062, "global_step": 228637, "epoch": 2754} {"train_loss": -24.68674659729004, "global_step": 228638, "epoch": 2754} {"train_loss": -24.53690528869629, "global_step": 228639, "epoch": 2754} {"train_loss": -24.516117095947266, "global_step": 228640, "epoch": 2754} {"train_loss": -25.03864860534668, "global_step": 228641, "epoch": 2754} {"train_loss": -24.690963745117188, "global_step": 228642, "epoch": 2754} {"train_loss": -24.484458923339844, "global_step": 228643, "epoch": 2754} {"train_loss": -24.557636260986328, "global_step": 228644, "epoch": 2754} {"train_loss": -24.850248336791992, "global_step": 228645, "epoch": 2754} {"train_loss": -24.268692016601562, "global_step": 228646, "epoch": 2754} {"train_loss": -25.10712242126465, "global_step": 228647, "epoch": 2754} {"train_loss": -24.561498641967773, "global_step": 228648, "epoch": 2754} {"train_loss": -24.718412399291992, "global_step": 228649, "epoch": 2754} {"train_loss": -24.73182487487793, "global_step": 228650, "epoch": 2754} {"train_loss": -24.662084579467773, "global_step": 228651, "epoch": 2754} {"train_loss": -24.842788696289062, "global_step": 228652, "epoch": 2754} {"train_loss": -24.758094787597656, "global_step": 228653, "epoch": 2754} {"train_loss": -25.0660457611084, "global_step": 228654, "epoch": 2754} {"train_loss": -24.42396354675293, "global_step": 228655, "epoch": 2754} {"train_loss": -24.774030685424805, "global_step": 228656, "epoch": 2754} {"train_loss": -24.894046783447266, "global_step": 228657, "epoch": 2754} {"train_loss": -24.671396255493164, "global_step": 228658, "epoch": 2754} {"train_loss": -24.898733139038086, "global_step": 228659, "epoch": 2754} {"train_loss": -25.241052627563477, "global_step": 228660, "epoch": 2754} {"train_loss": -24.743497848510742, "global_step": 228661, "epoch": 2754} {"train_loss": -24.7668514251709, "global_step": 228662, "epoch": 2754} {"train_loss": -25.020971298217773, "global_step": 228663, "epoch": 2754} {"train_loss": -24.697665088148003, "global_step": 228664, "epoch": 2754, "val_loss": 6712184.0} {"train_loss": -23.987133026123047, "global_step": 228665, "epoch": 2755} {"train_loss": -23.923913955688477, "global_step": 228666, "epoch": 2755} {"train_loss": -24.142309188842773, "global_step": 228667, "epoch": 2755} {"train_loss": -24.52842903137207, "global_step": 228668, "epoch": 2755} {"train_loss": -24.430421829223633, "global_step": 228669, "epoch": 2755} {"train_loss": -24.028701782226562, "global_step": 228670, "epoch": 2755} {"train_loss": -24.4381103515625, "global_step": 228671, "epoch": 2755} {"train_loss": -24.39420509338379, "global_step": 228672, "epoch": 2755} {"train_loss": -24.017778396606445, "global_step": 228673, "epoch": 2755} {"train_loss": -24.6406192779541, "global_step": 228674, "epoch": 2755} {"train_loss": -24.514556884765625, "global_step": 228675, "epoch": 2755} {"train_loss": -24.184207916259766, "global_step": 228676, "epoch": 2755} {"train_loss": -24.334989547729492, "global_step": 228677, "epoch": 2755} {"train_loss": -24.710315704345703, "global_step": 228678, "epoch": 2755} {"train_loss": -24.41876220703125, "global_step": 228679, "epoch": 2755} {"train_loss": -24.507972717285156, "global_step": 228680, "epoch": 2755} {"train_loss": -24.61566925048828, "global_step": 228681, "epoch": 2755} {"train_loss": -24.544666290283203, "global_step": 228682, "epoch": 2755} {"train_loss": -24.82368278503418, "global_step": 228683, "epoch": 2755} {"train_loss": -24.711355209350586, "global_step": 228684, "epoch": 2755} {"train_loss": -24.929595947265625, "global_step": 228685, "epoch": 2755} {"train_loss": -24.6039981842041, "global_step": 228686, "epoch": 2755} {"train_loss": -24.491159439086914, "global_step": 228687, "epoch": 2755} {"train_loss": -24.631324768066406, "global_step": 228688, "epoch": 2755} {"train_loss": -24.924015045166016, "global_step": 228689, "epoch": 2755} {"train_loss": -24.737255096435547, "global_step": 228690, "epoch": 2755} {"train_loss": -24.986425399780273, "global_step": 228691, "epoch": 2755} {"train_loss": -24.538114547729492, "global_step": 228692, "epoch": 2755} {"train_loss": -24.91288185119629, "global_step": 228693, "epoch": 2755} {"train_loss": -24.74854850769043, "global_step": 228694, "epoch": 2755} {"train_loss": -24.97994041442871, "global_step": 228695, "epoch": 2755} {"train_loss": -24.921283721923828, "global_step": 228696, "epoch": 2755} {"train_loss": -24.352733612060547, "global_step": 228697, "epoch": 2755} {"train_loss": -24.563491821289062, "global_step": 228698, "epoch": 2755} {"train_loss": -25.216663360595703, "global_step": 228699, "epoch": 2755} {"train_loss": -24.80828857421875, "global_step": 228700, "epoch": 2755} {"train_loss": -24.55934715270996, "global_step": 228701, "epoch": 2755} {"train_loss": -24.710773468017578, "global_step": 228702, "epoch": 2755} {"train_loss": -25.20088005065918, "global_step": 228703, "epoch": 2755} {"train_loss": -24.17889404296875, "global_step": 228704, "epoch": 2755} {"train_loss": -24.67032814025879, "global_step": 228705, "epoch": 2755} {"train_loss": -24.503232955932617, "global_step": 228706, "epoch": 2755} {"train_loss": -24.378677368164062, "global_step": 228707, "epoch": 2755} {"train_loss": -24.546382904052734, "global_step": 228708, "epoch": 2755} {"train_loss": -24.796194076538086, "global_step": 228709, "epoch": 2755} {"train_loss": -24.67056655883789, "global_step": 228710, "epoch": 2755} {"train_loss": -24.616485595703125, "global_step": 228711, "epoch": 2755} {"train_loss": -24.87761878967285, "global_step": 228712, "epoch": 2755} {"train_loss": -24.77952766418457, "global_step": 228713, "epoch": 2755} {"train_loss": -25.065492630004883, "global_step": 228714, "epoch": 2755} {"train_loss": -24.629730224609375, "global_step": 228715, "epoch": 2755} {"train_loss": -24.668161392211914, "global_step": 228716, "epoch": 2755} {"train_loss": -24.778079986572266, "global_step": 228717, "epoch": 2755} {"train_loss": -24.71754264831543, "global_step": 228718, "epoch": 2755} {"train_loss": -24.419931411743164, "global_step": 228719, "epoch": 2755} {"train_loss": -24.372617721557617, "global_step": 228720, "epoch": 2755} {"train_loss": -24.32271385192871, "global_step": 228721, "epoch": 2755} {"train_loss": -24.348403930664062, "global_step": 228722, "epoch": 2755} {"train_loss": -24.293720245361328, "global_step": 228723, "epoch": 2755} {"train_loss": -25.137189865112305, "global_step": 228724, "epoch": 2755} {"train_loss": -24.696226119995117, "global_step": 228725, "epoch": 2755} {"train_loss": -24.222375869750977, "global_step": 228726, "epoch": 2755} {"train_loss": -24.53931999206543, "global_step": 228727, "epoch": 2755} {"train_loss": -24.888425827026367, "global_step": 228728, "epoch": 2755} {"train_loss": -24.846220016479492, "global_step": 228729, "epoch": 2755} {"train_loss": -24.688297271728516, "global_step": 228730, "epoch": 2755} {"train_loss": -24.527097702026367, "global_step": 228731, "epoch": 2755} {"train_loss": -24.83617401123047, "global_step": 228732, "epoch": 2755} {"train_loss": -24.642690658569336, "global_step": 228733, "epoch": 2755} {"train_loss": -24.3987979888916, "global_step": 228734, "epoch": 2755} {"train_loss": -24.890283584594727, "global_step": 228735, "epoch": 2755} {"train_loss": -24.514806747436523, "global_step": 228736, "epoch": 2755} {"train_loss": -24.558073043823242, "global_step": 228737, "epoch": 2755} {"train_loss": -24.739593505859375, "global_step": 228738, "epoch": 2755} {"train_loss": -24.623403549194336, "global_step": 228739, "epoch": 2755} {"train_loss": -24.85037612915039, "global_step": 228740, "epoch": 2755} {"train_loss": -25.16928482055664, "global_step": 228741, "epoch": 2755} {"train_loss": -25.150901794433594, "global_step": 228742, "epoch": 2755} {"train_loss": -24.508499145507812, "global_step": 228743, "epoch": 2755} {"train_loss": -24.809036254882812, "global_step": 228744, "epoch": 2755} {"train_loss": -24.963882446289062, "global_step": 228745, "epoch": 2755} {"train_loss": -25.22292137145996, "global_step": 228746, "epoch": 2755} {"train_loss": -24.64195086008095, "global_step": 228747, "epoch": 2755, "val_loss": 6657377.0} {"train_loss": -24.275955200195312, "global_step": 228748, "epoch": 2756} {"train_loss": -23.93301773071289, "global_step": 228749, "epoch": 2756} {"train_loss": -23.99334716796875, "global_step": 228750, "epoch": 2756} {"train_loss": -24.336755752563477, "global_step": 228751, "epoch": 2756} {"train_loss": -23.692543029785156, "global_step": 228752, "epoch": 2756} {"train_loss": -24.193603515625, "global_step": 228753, "epoch": 2756} {"train_loss": -24.609285354614258, "global_step": 228754, "epoch": 2756} {"train_loss": -24.056657791137695, "global_step": 228755, "epoch": 2756} {"train_loss": -24.11100196838379, "global_step": 228756, "epoch": 2756} {"train_loss": -24.665990829467773, "global_step": 228757, "epoch": 2756} {"train_loss": -23.791921615600586, "global_step": 228758, "epoch": 2756} {"train_loss": -24.49704933166504, "global_step": 228759, "epoch": 2756} {"train_loss": -24.29890251159668, "global_step": 228760, "epoch": 2756} {"train_loss": -24.2739315032959, "global_step": 228761, "epoch": 2756} {"train_loss": -24.325742721557617, "global_step": 228762, "epoch": 2756} {"train_loss": -24.567899703979492, "global_step": 228763, "epoch": 2756} {"train_loss": -24.536306381225586, "global_step": 228764, "epoch": 2756} {"train_loss": -24.204145431518555, "global_step": 228765, "epoch": 2756} {"train_loss": -24.296178817749023, "global_step": 228766, "epoch": 2756} {"train_loss": -24.33821678161621, "global_step": 228767, "epoch": 2756} {"train_loss": -24.535768508911133, "global_step": 228768, "epoch": 2756} {"train_loss": -24.43673324584961, "global_step": 228769, "epoch": 2756} {"train_loss": -24.5003662109375, "global_step": 228770, "epoch": 2756} {"train_loss": -24.67746353149414, "global_step": 228771, "epoch": 2756} {"train_loss": -24.885805130004883, "global_step": 228772, "epoch": 2756} {"train_loss": -24.586021423339844, "global_step": 228773, "epoch": 2756} {"train_loss": -24.860219955444336, "global_step": 228774, "epoch": 2756} {"train_loss": -24.430469512939453, "global_step": 228775, "epoch": 2756} {"train_loss": -24.84564208984375, "global_step": 228776, "epoch": 2756} {"train_loss": -24.71833038330078, "global_step": 228777, "epoch": 2756} {"train_loss": -24.80705451965332, "global_step": 228778, "epoch": 2756} {"train_loss": -24.625593185424805, "global_step": 228779, "epoch": 2756} {"train_loss": -24.953632354736328, "global_step": 228780, "epoch": 2756} {"train_loss": -24.644872665405273, "global_step": 228781, "epoch": 2756} {"train_loss": -24.657285690307617, "global_step": 228782, "epoch": 2756} {"train_loss": -24.981504440307617, "global_step": 228783, "epoch": 2756} {"train_loss": -24.536523818969727, "global_step": 228784, "epoch": 2756} {"train_loss": -24.7899169921875, "global_step": 228785, "epoch": 2756} {"train_loss": -24.537464141845703, "global_step": 228786, "epoch": 2756} {"train_loss": -24.784826278686523, "global_step": 228787, "epoch": 2756} {"train_loss": -24.75294303894043, "global_step": 228788, "epoch": 2756} {"train_loss": -24.899948120117188, "global_step": 228789, "epoch": 2756} {"train_loss": -24.559053421020508, "global_step": 228790, "epoch": 2756} {"train_loss": -24.699556350708008, "global_step": 228791, "epoch": 2756} {"train_loss": -24.734418869018555, "global_step": 228792, "epoch": 2756} {"train_loss": -25.17073631286621, "global_step": 228793, "epoch": 2756} {"train_loss": -24.573490142822266, "global_step": 228794, "epoch": 2756} {"train_loss": -24.841550827026367, "global_step": 228795, "epoch": 2756} {"train_loss": -24.585437774658203, "global_step": 228796, "epoch": 2756} {"train_loss": -25.01576042175293, "global_step": 228797, "epoch": 2756} {"train_loss": -25.070621490478516, "global_step": 228798, "epoch": 2756} {"train_loss": -24.75255012512207, "global_step": 228799, "epoch": 2756} {"train_loss": -25.315237045288086, "global_step": 228800, "epoch": 2756} {"train_loss": -24.49468231201172, "global_step": 228801, "epoch": 2756} {"train_loss": -24.131332397460938, "global_step": 228802, "epoch": 2756} {"train_loss": -24.637189865112305, "global_step": 228803, "epoch": 2756} {"train_loss": -24.466630935668945, "global_step": 228804, "epoch": 2756} {"train_loss": -24.698909759521484, "global_step": 228805, "epoch": 2756} {"train_loss": -24.644989013671875, "global_step": 228806, "epoch": 2756} {"train_loss": -24.92555046081543, "global_step": 228807, "epoch": 2756} {"train_loss": -24.781330108642578, "global_step": 228808, "epoch": 2756} {"train_loss": -24.669967651367188, "global_step": 228809, "epoch": 2756} {"train_loss": -24.640594482421875, "global_step": 228810, "epoch": 2756} {"train_loss": -24.578100204467773, "global_step": 228811, "epoch": 2756} {"train_loss": -24.508237838745117, "global_step": 228812, "epoch": 2756} {"train_loss": -24.475624084472656, "global_step": 228813, "epoch": 2756} {"train_loss": -24.396718978881836, "global_step": 228814, "epoch": 2756} {"train_loss": -24.521718978881836, "global_step": 228815, "epoch": 2756} {"train_loss": -24.485197067260742, "global_step": 228816, "epoch": 2756} {"train_loss": -24.782854080200195, "global_step": 228817, "epoch": 2756} {"train_loss": -24.715185165405273, "global_step": 228818, "epoch": 2756} {"train_loss": -24.690183639526367, "global_step": 228819, "epoch": 2756} {"train_loss": -24.662912368774414, "global_step": 228820, "epoch": 2756} {"train_loss": -24.65652084350586, "global_step": 228821, "epoch": 2756} {"train_loss": -24.42780303955078, "global_step": 228822, "epoch": 2756} {"train_loss": -24.653535842895508, "global_step": 228823, "epoch": 2756} {"train_loss": -25.049741744995117, "global_step": 228824, "epoch": 2756} {"train_loss": -24.529098510742188, "global_step": 228825, "epoch": 2756} {"train_loss": -24.81869888305664, "global_step": 228826, "epoch": 2756} {"train_loss": -24.790708541870117, "global_step": 228827, "epoch": 2756} {"train_loss": -25.286815643310547, "global_step": 228828, "epoch": 2756} {"train_loss": -24.7930965423584, "global_step": 228829, "epoch": 2756} {"train_loss": -24.618015473147473, "global_step": 228830, "epoch": 2756, "val_loss": 6826505.0} {"train_loss": -24.06760597229004, "global_step": 228831, "epoch": 2757} {"train_loss": -23.76370620727539, "global_step": 228832, "epoch": 2757} {"train_loss": -24.15032386779785, "global_step": 228833, "epoch": 2757} {"train_loss": -23.960372924804688, "global_step": 228834, "epoch": 2757} {"train_loss": -24.63631248474121, "global_step": 228835, "epoch": 2757} {"train_loss": -23.576446533203125, "global_step": 228836, "epoch": 2757} {"train_loss": -24.426361083984375, "global_step": 228837, "epoch": 2757} {"train_loss": -24.033315658569336, "global_step": 228838, "epoch": 2757} {"train_loss": -24.31097412109375, "global_step": 228839, "epoch": 2757} {"train_loss": -24.063400268554688, "global_step": 228840, "epoch": 2757} {"train_loss": -24.471288681030273, "global_step": 228841, "epoch": 2757} {"train_loss": -23.73024559020996, "global_step": 228842, "epoch": 2757} {"train_loss": -24.453237533569336, "global_step": 228843, "epoch": 2757} {"train_loss": -24.234394073486328, "global_step": 228844, "epoch": 2757} {"train_loss": -24.48872947692871, "global_step": 228845, "epoch": 2757} {"train_loss": -24.3857479095459, "global_step": 228846, "epoch": 2757} {"train_loss": -24.487628936767578, "global_step": 228847, "epoch": 2757} {"train_loss": -24.403730392456055, "global_step": 228848, "epoch": 2757} {"train_loss": -24.373720169067383, "global_step": 228849, "epoch": 2757} {"train_loss": -24.17386245727539, "global_step": 228850, "epoch": 2757} {"train_loss": -24.1724910736084, "global_step": 228851, "epoch": 2757} {"train_loss": -24.3649845123291, "global_step": 228852, "epoch": 2757} {"train_loss": -24.69260597229004, "global_step": 228853, "epoch": 2757} {"train_loss": -24.558584213256836, "global_step": 228854, "epoch": 2757} {"train_loss": -24.811338424682617, "global_step": 228855, "epoch": 2757} {"train_loss": -24.587848663330078, "global_step": 228856, "epoch": 2757} {"train_loss": -24.736608505249023, "global_step": 228857, "epoch": 2757} {"train_loss": -24.495235443115234, "global_step": 228858, "epoch": 2757} {"train_loss": -24.63092041015625, "global_step": 228859, "epoch": 2757} {"train_loss": -24.57840347290039, "global_step": 228860, "epoch": 2757} {"train_loss": -24.872724533081055, "global_step": 228861, "epoch": 2757} {"train_loss": -24.9548397064209, "global_step": 228862, "epoch": 2757} {"train_loss": -24.761432647705078, "global_step": 228863, "epoch": 2757} {"train_loss": -24.79179573059082, "global_step": 228864, "epoch": 2757} {"train_loss": -24.886178970336914, "global_step": 228865, "epoch": 2757} {"train_loss": -24.666406631469727, "global_step": 228866, "epoch": 2757} {"train_loss": -24.653467178344727, "global_step": 228867, "epoch": 2757} {"train_loss": -24.833593368530273, "global_step": 228868, "epoch": 2757} {"train_loss": -24.944843292236328, "global_step": 228869, "epoch": 2757} {"train_loss": -25.079336166381836, "global_step": 228870, "epoch": 2757} {"train_loss": -24.80134391784668, "global_step": 228871, "epoch": 2757} {"train_loss": -24.979713439941406, "global_step": 228872, "epoch": 2757} {"train_loss": -24.77229118347168, "global_step": 228873, "epoch": 2757} {"train_loss": -24.830957412719727, "global_step": 228874, "epoch": 2757} {"train_loss": -24.987796783447266, "global_step": 228875, "epoch": 2757} {"train_loss": -24.591970443725586, "global_step": 228876, "epoch": 2757} {"train_loss": -24.97604751586914, "global_step": 228877, "epoch": 2757} {"train_loss": -24.722970962524414, "global_step": 228878, "epoch": 2757} {"train_loss": -25.075986862182617, "global_step": 228879, "epoch": 2757} {"train_loss": -24.78797149658203, "global_step": 228880, "epoch": 2757} {"train_loss": -24.888578414916992, "global_step": 228881, "epoch": 2757} {"train_loss": -24.71970558166504, "global_step": 228882, "epoch": 2757} {"train_loss": -24.745359420776367, "global_step": 228883, "epoch": 2757} {"train_loss": -24.489322662353516, "global_step": 228884, "epoch": 2757} {"train_loss": -24.458621978759766, "global_step": 228885, "epoch": 2757} {"train_loss": -24.87908935546875, "global_step": 228886, "epoch": 2757} {"train_loss": -24.5844783782959, "global_step": 228887, "epoch": 2757} {"train_loss": -25.164905548095703, "global_step": 228888, "epoch": 2757} {"train_loss": -24.091201782226562, "global_step": 228889, "epoch": 2757} {"train_loss": -24.359216690063477, "global_step": 228890, "epoch": 2757} {"train_loss": -24.529396057128906, "global_step": 228891, "epoch": 2757} {"train_loss": -24.621580123901367, "global_step": 228892, "epoch": 2757} {"train_loss": -24.33500099182129, "global_step": 228893, "epoch": 2757} {"train_loss": -24.82430076599121, "global_step": 228894, "epoch": 2757} {"train_loss": -24.448657989501953, "global_step": 228895, "epoch": 2757} {"train_loss": -25.0062255859375, "global_step": 228896, "epoch": 2757} {"train_loss": -24.189043045043945, "global_step": 228897, "epoch": 2757} {"train_loss": -24.707855224609375, "global_step": 228898, "epoch": 2757} {"train_loss": -24.204587936401367, "global_step": 228899, "epoch": 2757} {"train_loss": -24.452167510986328, "global_step": 228900, "epoch": 2757} {"train_loss": -24.47775650024414, "global_step": 228901, "epoch": 2757} {"train_loss": -24.607982635498047, "global_step": 228902, "epoch": 2757} {"train_loss": -24.70404815673828, "global_step": 228903, "epoch": 2757} {"train_loss": -24.685379028320312, "global_step": 228904, "epoch": 2757} {"train_loss": -24.719528198242188, "global_step": 228905, "epoch": 2757} {"train_loss": -24.767019271850586, "global_step": 228906, "epoch": 2757} {"train_loss": -24.56086540222168, "global_step": 228907, "epoch": 2757} {"train_loss": -24.173748016357422, "global_step": 228908, "epoch": 2757} {"train_loss": -24.641956329345703, "global_step": 228909, "epoch": 2757} {"train_loss": -24.949174880981445, "global_step": 228910, "epoch": 2757} {"train_loss": -24.93430519104004, "global_step": 228911, "epoch": 2757} {"train_loss": -24.953702926635742, "global_step": 228912, "epoch": 2757} {"train_loss": -24.56243988404791, "global_step": 228913, "epoch": 2757, "val_loss": 6744204.0} {"train_loss": -24.579448699951172, "global_step": 228914, "epoch": 2758} {"train_loss": -24.417673110961914, "global_step": 228915, "epoch": 2758} {"train_loss": -24.11023712158203, "global_step": 228916, "epoch": 2758} {"train_loss": -24.173614501953125, "global_step": 228917, "epoch": 2758} {"train_loss": -24.23487663269043, "global_step": 228918, "epoch": 2758} {"train_loss": -24.521240234375, "global_step": 228919, "epoch": 2758} {"train_loss": -24.55537986755371, "global_step": 228920, "epoch": 2758} {"train_loss": -24.892030715942383, "global_step": 228921, "epoch": 2758} {"train_loss": -24.178665161132812, "global_step": 228922, "epoch": 2758} {"train_loss": -24.503583908081055, "global_step": 228923, "epoch": 2758} {"train_loss": -24.902820587158203, "global_step": 228924, "epoch": 2758} {"train_loss": -24.398391723632812, "global_step": 228925, "epoch": 2758} {"train_loss": -24.705303192138672, "global_step": 228926, "epoch": 2758} {"train_loss": -25.071866989135742, "global_step": 228927, "epoch": 2758} {"train_loss": -24.653287887573242, "global_step": 228928, "epoch": 2758} {"train_loss": -24.48601722717285, "global_step": 228929, "epoch": 2758} {"train_loss": -24.904102325439453, "global_step": 228930, "epoch": 2758} {"train_loss": -24.73674964904785, "global_step": 228931, "epoch": 2758} {"train_loss": -24.891202926635742, "global_step": 228932, "epoch": 2758} {"train_loss": -24.525861740112305, "global_step": 228933, "epoch": 2758} {"train_loss": -24.72382926940918, "global_step": 228934, "epoch": 2758} {"train_loss": -24.62204360961914, "global_step": 228935, "epoch": 2758} {"train_loss": -24.760848999023438, "global_step": 228936, "epoch": 2758} {"train_loss": -24.883939743041992, "global_step": 228937, "epoch": 2758} {"train_loss": -24.760412216186523, "global_step": 228938, "epoch": 2758} {"train_loss": -24.627431869506836, "global_step": 228939, "epoch": 2758} {"train_loss": -25.257909774780273, "global_step": 228940, "epoch": 2758} {"train_loss": -24.765222549438477, "global_step": 228941, "epoch": 2758} {"train_loss": -24.90376091003418, "global_step": 228942, "epoch": 2758} {"train_loss": -25.19428253173828, "global_step": 228943, "epoch": 2758} {"train_loss": -24.840776443481445, "global_step": 228944, "epoch": 2758} {"train_loss": -24.793577194213867, "global_step": 228945, "epoch": 2758} {"train_loss": -24.98089027404785, "global_step": 228946, "epoch": 2758} {"train_loss": -24.692317962646484, "global_step": 228947, "epoch": 2758} {"train_loss": -24.971811294555664, "global_step": 228948, "epoch": 2758} {"train_loss": -24.61982536315918, "global_step": 228949, "epoch": 2758} {"train_loss": -24.61067771911621, "global_step": 228950, "epoch": 2758} {"train_loss": -24.90219497680664, "global_step": 228951, "epoch": 2758} {"train_loss": -24.76193618774414, "global_step": 228952, "epoch": 2758} {"train_loss": -24.54725456237793, "global_step": 228953, "epoch": 2758} {"train_loss": -24.591856002807617, "global_step": 228954, "epoch": 2758} {"train_loss": -25.057294845581055, "global_step": 228955, "epoch": 2758} {"train_loss": -25.044462203979492, "global_step": 228956, "epoch": 2758} {"train_loss": -24.823644638061523, "global_step": 228957, "epoch": 2758} {"train_loss": -24.527807235717773, "global_step": 228958, "epoch": 2758} {"train_loss": -24.81024742126465, "global_step": 228959, "epoch": 2758} {"train_loss": -25.055835723876953, "global_step": 228960, "epoch": 2758} {"train_loss": -24.678346633911133, "global_step": 228961, "epoch": 2758} {"train_loss": -24.510412216186523, "global_step": 228962, "epoch": 2758} {"train_loss": -24.832786560058594, "global_step": 228963, "epoch": 2758} {"train_loss": -24.89158058166504, "global_step": 228964, "epoch": 2758} {"train_loss": -24.839597702026367, "global_step": 228965, "epoch": 2758} {"train_loss": -24.990652084350586, "global_step": 228966, "epoch": 2758} {"train_loss": -24.99323081970215, "global_step": 228967, "epoch": 2758} {"train_loss": -24.874418258666992, "global_step": 228968, "epoch": 2758} {"train_loss": -24.716773986816406, "global_step": 228969, "epoch": 2758} {"train_loss": -24.644147872924805, "global_step": 228970, "epoch": 2758} {"train_loss": -24.77164077758789, "global_step": 228971, "epoch": 2758} {"train_loss": -24.36500358581543, "global_step": 228972, "epoch": 2758} {"train_loss": -24.698196411132812, "global_step": 228973, "epoch": 2758} {"train_loss": -25.004806518554688, "global_step": 228974, "epoch": 2758} {"train_loss": -24.581357955932617, "global_step": 228975, "epoch": 2758} {"train_loss": -24.72163200378418, "global_step": 228976, "epoch": 2758} {"train_loss": -24.819074630737305, "global_step": 228977, "epoch": 2758} {"train_loss": -24.736867904663086, "global_step": 228978, "epoch": 2758} {"train_loss": -24.69989585876465, "global_step": 228979, "epoch": 2758} {"train_loss": -24.372394561767578, "global_step": 228980, "epoch": 2758} {"train_loss": -24.46748161315918, "global_step": 228981, "epoch": 2758} {"train_loss": -24.781686782836914, "global_step": 228982, "epoch": 2758} {"train_loss": -24.6529598236084, "global_step": 228983, "epoch": 2758} {"train_loss": -24.697145462036133, "global_step": 228984, "epoch": 2758} {"train_loss": -24.600446701049805, "global_step": 228985, "epoch": 2758} {"train_loss": -24.61268424987793, "global_step": 228986, "epoch": 2758} {"train_loss": -24.72645378112793, "global_step": 228987, "epoch": 2758} {"train_loss": -24.521535873413086, "global_step": 228988, "epoch": 2758} {"train_loss": -24.487546920776367, "global_step": 228989, "epoch": 2758} {"train_loss": -24.7606258392334, "global_step": 228990, "epoch": 2758} {"train_loss": -24.66945457458496, "global_step": 228991, "epoch": 2758} {"train_loss": -24.533050537109375, "global_step": 228992, "epoch": 2758} {"train_loss": -24.955020904541016, "global_step": 228993, "epoch": 2758} {"train_loss": -24.64133071899414, "global_step": 228994, "epoch": 2758} {"train_loss": -24.88681983947754, "global_step": 228995, "epoch": 2758} {"train_loss": -24.724330948059816, "global_step": 228996, "epoch": 2758, "val_loss": 6628039.0} {"train_loss": -24.604963302612305, "global_step": 228997, "epoch": 2759} {"train_loss": -24.400577545166016, "global_step": 228998, "epoch": 2759} {"train_loss": -24.38397789001465, "global_step": 228999, "epoch": 2759} {"train_loss": -23.90760612487793, "global_step": 229000, "epoch": 2759} {"train_loss": -24.784130096435547, "global_step": 229001, "epoch": 2759} {"train_loss": -24.32400894165039, "global_step": 229002, "epoch": 2759} {"train_loss": -24.477575302124023, "global_step": 229003, "epoch": 2759} {"train_loss": -24.39639663696289, "global_step": 229004, "epoch": 2759} {"train_loss": -24.248882293701172, "global_step": 229005, "epoch": 2759} {"train_loss": -24.366085052490234, "global_step": 229006, "epoch": 2759} {"train_loss": -24.107933044433594, "global_step": 229007, "epoch": 2759} {"train_loss": -24.39556884765625, "global_step": 229008, "epoch": 2759} {"train_loss": -24.340293884277344, "global_step": 229009, "epoch": 2759} {"train_loss": -24.13332176208496, "global_step": 229010, "epoch": 2759} {"train_loss": -24.794235229492188, "global_step": 229011, "epoch": 2759} {"train_loss": -24.29847526550293, "global_step": 229012, "epoch": 2759} {"train_loss": -24.81168556213379, "global_step": 229013, "epoch": 2759} {"train_loss": -24.452932357788086, "global_step": 229014, "epoch": 2759} {"train_loss": -25.340620040893555, "global_step": 229015, "epoch": 2759} {"train_loss": -24.297428131103516, "global_step": 229016, "epoch": 2759} {"train_loss": -24.437427520751953, "global_step": 229017, "epoch": 2759} {"train_loss": -24.46221923828125, "global_step": 229018, "epoch": 2759} {"train_loss": -24.57398796081543, "global_step": 229019, "epoch": 2759} {"train_loss": -24.620107650756836, "global_step": 229020, "epoch": 2759} {"train_loss": -24.849964141845703, "global_step": 229021, "epoch": 2759} {"train_loss": -24.389188766479492, "global_step": 229022, "epoch": 2759} {"train_loss": -24.502059936523438, "global_step": 229023, "epoch": 2759} {"train_loss": -24.48201560974121, "global_step": 229024, "epoch": 2759} {"train_loss": -24.885116577148438, "global_step": 229025, "epoch": 2759} {"train_loss": -24.62867546081543, "global_step": 229026, "epoch": 2759} {"train_loss": -24.65099334716797, "global_step": 229027, "epoch": 2759} {"train_loss": -24.728931427001953, "global_step": 229028, "epoch": 2759} {"train_loss": -24.809711456298828, "global_step": 229029, "epoch": 2759} {"train_loss": -25.149890899658203, "global_step": 229030, "epoch": 2759} {"train_loss": -24.51819610595703, "global_step": 229031, "epoch": 2759} {"train_loss": -24.866117477416992, "global_step": 229032, "epoch": 2759} {"train_loss": -25.139602661132812, "global_step": 229033, "epoch": 2759} {"train_loss": -24.792272567749023, "global_step": 229034, "epoch": 2759} {"train_loss": -24.412817001342773, "global_step": 229035, "epoch": 2759} {"train_loss": -24.861608505249023, "global_step": 229036, "epoch": 2759} {"train_loss": -25.011808395385742, "global_step": 229037, "epoch": 2759} {"train_loss": -25.208984375, "global_step": 229038, "epoch": 2759} {"train_loss": -25.206329345703125, "global_step": 229039, "epoch": 2759} {"train_loss": -24.45486831665039, "global_step": 229040, "epoch": 2759} {"train_loss": -24.965436935424805, "global_step": 229041, "epoch": 2759} {"train_loss": -24.7083797454834, "global_step": 229042, "epoch": 2759} {"train_loss": -24.69487762451172, "global_step": 229043, "epoch": 2759} {"train_loss": -24.951200485229492, "global_step": 229044, "epoch": 2759} {"train_loss": -24.445125579833984, "global_step": 229045, "epoch": 2759} {"train_loss": -24.64946937561035, "global_step": 229046, "epoch": 2759} {"train_loss": -24.893117904663086, "global_step": 229047, "epoch": 2759} {"train_loss": -24.71492576599121, "global_step": 229048, "epoch": 2759} {"train_loss": -24.461273193359375, "global_step": 229049, "epoch": 2759} {"train_loss": -24.75924301147461, "global_step": 229050, "epoch": 2759} {"train_loss": -24.99505615234375, "global_step": 229051, "epoch": 2759} {"train_loss": -24.658447265625, "global_step": 229052, "epoch": 2759} {"train_loss": -24.523681640625, "global_step": 229053, "epoch": 2759} {"train_loss": -24.64066505432129, "global_step": 229054, "epoch": 2759} {"train_loss": -24.90635108947754, "global_step": 229055, "epoch": 2759} {"train_loss": -25.138212203979492, "global_step": 229056, "epoch": 2759} {"train_loss": -24.557966232299805, "global_step": 229057, "epoch": 2759} {"train_loss": -25.123943328857422, "global_step": 229058, "epoch": 2759} {"train_loss": -24.958200454711914, "global_step": 229059, "epoch": 2759} {"train_loss": -24.745763778686523, "global_step": 229060, "epoch": 2759} {"train_loss": -24.968706130981445, "global_step": 229061, "epoch": 2759} {"train_loss": -24.90406036376953, "global_step": 229062, "epoch": 2759} {"train_loss": -24.76041030883789, "global_step": 229063, "epoch": 2759} {"train_loss": -24.502973556518555, "global_step": 229064, "epoch": 2759} {"train_loss": -24.81480598449707, "global_step": 229065, "epoch": 2759} {"train_loss": -24.788188934326172, "global_step": 229066, "epoch": 2759} {"train_loss": -24.60711669921875, "global_step": 229067, "epoch": 2759} {"train_loss": -24.785409927368164, "global_step": 229068, "epoch": 2759} {"train_loss": -24.69563102722168, "global_step": 229069, "epoch": 2759} {"train_loss": -24.917682647705078, "global_step": 229070, "epoch": 2759} {"train_loss": -24.775358200073242, "global_step": 229071, "epoch": 2759} {"train_loss": -24.73628807067871, "global_step": 229072, "epoch": 2759} {"train_loss": -24.822834014892578, "global_step": 229073, "epoch": 2759} {"train_loss": -24.511640548706055, "global_step": 229074, "epoch": 2759} {"train_loss": -24.56999969482422, "global_step": 229075, "epoch": 2759} {"train_loss": -24.792333602905273, "global_step": 229076, "epoch": 2759} {"train_loss": -25.13051414489746, "global_step": 229077, "epoch": 2759} {"train_loss": -24.81705093383789, "global_step": 229078, "epoch": 2759} {"train_loss": -24.668722865093184, "global_step": 229079, "epoch": 2759, "val_loss": 6695745.0} {"train_loss": -23.946943283081055, "global_step": 229080, "epoch": 2760} {"train_loss": -24.020151138305664, "global_step": 229081, "epoch": 2760} {"train_loss": -24.193883895874023, "global_step": 229082, "epoch": 2760} {"train_loss": -23.850341796875, "global_step": 229083, "epoch": 2760} {"train_loss": -24.575815200805664, "global_step": 229084, "epoch": 2760} {"train_loss": -24.67999839782715, "global_step": 229085, "epoch": 2760} {"train_loss": -24.382434844970703, "global_step": 229086, "epoch": 2760} {"train_loss": -24.240707397460938, "global_step": 229087, "epoch": 2760} {"train_loss": -24.101242065429688, "global_step": 229088, "epoch": 2760} {"train_loss": -24.438785552978516, "global_step": 229089, "epoch": 2760} {"train_loss": -24.328311920166016, "global_step": 229090, "epoch": 2760} {"train_loss": -24.6634521484375, "global_step": 229091, "epoch": 2760} {"train_loss": -24.110977172851562, "global_step": 229092, "epoch": 2760} {"train_loss": -24.519071578979492, "global_step": 229093, "epoch": 2760} {"train_loss": -24.76653480529785, "global_step": 229094, "epoch": 2760} {"train_loss": -24.474416732788086, "global_step": 229095, "epoch": 2760} {"train_loss": -24.510961532592773, "global_step": 229096, "epoch": 2760} {"train_loss": -24.691991806030273, "global_step": 229097, "epoch": 2760} {"train_loss": -24.478973388671875, "global_step": 229098, "epoch": 2760} {"train_loss": -24.718143463134766, "global_step": 229099, "epoch": 2760} {"train_loss": -24.786069869995117, "global_step": 229100, "epoch": 2760} {"train_loss": -24.64644432067871, "global_step": 229101, "epoch": 2760} {"train_loss": -24.56333351135254, "global_step": 229102, "epoch": 2760} {"train_loss": -24.623380661010742, "global_step": 229103, "epoch": 2760} {"train_loss": -24.79868507385254, "global_step": 229104, "epoch": 2760} {"train_loss": -24.63270378112793, "global_step": 229105, "epoch": 2760} {"train_loss": -24.577518463134766, "global_step": 229106, "epoch": 2760} {"train_loss": -24.747089385986328, "global_step": 229107, "epoch": 2760} {"train_loss": -24.605148315429688, "global_step": 229108, "epoch": 2760} {"train_loss": -24.893497467041016, "global_step": 229109, "epoch": 2760} {"train_loss": -24.77186393737793, "global_step": 229110, "epoch": 2760} {"train_loss": -25.01714324951172, "global_step": 229111, "epoch": 2760} {"train_loss": -25.066190719604492, "global_step": 229112, "epoch": 2760} {"train_loss": -24.984161376953125, "global_step": 229113, "epoch": 2760} {"train_loss": -24.762449264526367, "global_step": 229114, "epoch": 2760} {"train_loss": -24.972814559936523, "global_step": 229115, "epoch": 2760} {"train_loss": -25.111249923706055, "global_step": 229116, "epoch": 2760} {"train_loss": -24.680770874023438, "global_step": 229117, "epoch": 2760} {"train_loss": -24.347705841064453, "global_step": 229118, "epoch": 2760} {"train_loss": -25.056819915771484, "global_step": 229119, "epoch": 2760} {"train_loss": -24.733407974243164, "global_step": 229120, "epoch": 2760} {"train_loss": -24.985183715820312, "global_step": 229121, "epoch": 2760} {"train_loss": -24.661304473876953, "global_step": 229122, "epoch": 2760} {"train_loss": -24.707292556762695, "global_step": 229123, "epoch": 2760} {"train_loss": -24.878896713256836, "global_step": 229124, "epoch": 2760} {"train_loss": -25.082704544067383, "global_step": 229125, "epoch": 2760} {"train_loss": -24.694517135620117, "global_step": 229126, "epoch": 2760} {"train_loss": -24.42034912109375, "global_step": 229127, "epoch": 2760} {"train_loss": -23.903371810913086, "global_step": 229128, "epoch": 2760} {"train_loss": -24.134714126586914, "global_step": 229129, "epoch": 2760} {"train_loss": -24.953746795654297, "global_step": 229130, "epoch": 2760} {"train_loss": -24.695547103881836, "global_step": 229131, "epoch": 2760} {"train_loss": -25.012537002563477, "global_step": 229132, "epoch": 2760} {"train_loss": -24.690404891967773, "global_step": 229133, "epoch": 2760} {"train_loss": -24.92463493347168, "global_step": 229134, "epoch": 2760} {"train_loss": -24.221477508544922, "global_step": 229135, "epoch": 2760} {"train_loss": -24.485538482666016, "global_step": 229136, "epoch": 2760} {"train_loss": -24.37931251525879, "global_step": 229137, "epoch": 2760} {"train_loss": -24.51625633239746, "global_step": 229138, "epoch": 2760} {"train_loss": -24.471939086914062, "global_step": 229139, "epoch": 2760} {"train_loss": -24.700347900390625, "global_step": 229140, "epoch": 2760} {"train_loss": -24.43287467956543, "global_step": 229141, "epoch": 2760} {"train_loss": -24.333759307861328, "global_step": 229142, "epoch": 2760} {"train_loss": -24.972028732299805, "global_step": 229143, "epoch": 2760} {"train_loss": -24.91655731201172, "global_step": 229144, "epoch": 2760} {"train_loss": -24.43696403503418, "global_step": 229145, "epoch": 2760} {"train_loss": -24.625858306884766, "global_step": 229146, "epoch": 2760} {"train_loss": -25.01315689086914, "global_step": 229147, "epoch": 2760} {"train_loss": -24.637981414794922, "global_step": 229148, "epoch": 2760} {"train_loss": -24.953458786010742, "global_step": 229149, "epoch": 2760} {"train_loss": -24.77625846862793, "global_step": 229150, "epoch": 2760} {"train_loss": -24.699010848999023, "global_step": 229151, "epoch": 2760} {"train_loss": -25.040897369384766, "global_step": 229152, "epoch": 2760} {"train_loss": -24.769296646118164, "global_step": 229153, "epoch": 2760} {"train_loss": -24.61846351623535, "global_step": 229154, "epoch": 2760} {"train_loss": -24.79920768737793, "global_step": 229155, "epoch": 2760} {"train_loss": -25.125335693359375, "global_step": 229156, "epoch": 2760} {"train_loss": -24.828271865844727, "global_step": 229157, "epoch": 2760} {"train_loss": -24.91671371459961, "global_step": 229158, "epoch": 2760} {"train_loss": -24.41280174255371, "global_step": 229159, "epoch": 2760} {"train_loss": -24.959163665771484, "global_step": 229160, "epoch": 2760} {"train_loss": -24.91377830505371, "global_step": 229161, "epoch": 2760} {"train_loss": -24.643649664269873, "global_step": 229162, "epoch": 2760, "val_loss": 6707182.0} {"train_loss": -24.429819107055664, "global_step": 229163, "epoch": 2761} {"train_loss": -24.29755210876465, "global_step": 229164, "epoch": 2761} {"train_loss": -23.604063034057617, "global_step": 229165, "epoch": 2761} {"train_loss": -24.017627716064453, "global_step": 229166, "epoch": 2761} {"train_loss": -24.030025482177734, "global_step": 229167, "epoch": 2761} {"train_loss": -24.27989959716797, "global_step": 229168, "epoch": 2761} {"train_loss": -24.211566925048828, "global_step": 229169, "epoch": 2761} {"train_loss": -24.057214736938477, "global_step": 229170, "epoch": 2761} {"train_loss": -24.255537033081055, "global_step": 229171, "epoch": 2761} {"train_loss": -24.270559310913086, "global_step": 229172, "epoch": 2761} {"train_loss": -24.24518394470215, "global_step": 229173, "epoch": 2761} {"train_loss": -24.30681800842285, "global_step": 229174, "epoch": 2761} {"train_loss": -24.378522872924805, "global_step": 229175, "epoch": 2761} {"train_loss": -24.294137954711914, "global_step": 229176, "epoch": 2761} {"train_loss": -24.326292037963867, "global_step": 229177, "epoch": 2761} {"train_loss": -24.40282440185547, "global_step": 229178, "epoch": 2761} {"train_loss": -24.47774314880371, "global_step": 229179, "epoch": 2761} {"train_loss": -24.31281852722168, "global_step": 229180, "epoch": 2761} {"train_loss": -24.77356719970703, "global_step": 229181, "epoch": 2761} {"train_loss": -24.463092803955078, "global_step": 229182, "epoch": 2761} {"train_loss": -24.40566635131836, "global_step": 229183, "epoch": 2761} {"train_loss": -24.690187454223633, "global_step": 229184, "epoch": 2761} {"train_loss": -24.82329750061035, "global_step": 229185, "epoch": 2761} {"train_loss": -24.72664451599121, "global_step": 229186, "epoch": 2761} {"train_loss": -24.382959365844727, "global_step": 229187, "epoch": 2761} {"train_loss": -24.52787208557129, "global_step": 229188, "epoch": 2761} {"train_loss": -24.672134399414062, "global_step": 229189, "epoch": 2761} {"train_loss": -24.85503578186035, "global_step": 229190, "epoch": 2761} {"train_loss": -24.473798751831055, "global_step": 229191, "epoch": 2761} {"train_loss": -24.72532081604004, "global_step": 229192, "epoch": 2761} {"train_loss": -24.519025802612305, "global_step": 229193, "epoch": 2761} {"train_loss": -24.62230682373047, "global_step": 229194, "epoch": 2761} {"train_loss": -24.465906143188477, "global_step": 229195, "epoch": 2761} {"train_loss": -24.867156982421875, "global_step": 229196, "epoch": 2761} {"train_loss": -24.874361038208008, "global_step": 229197, "epoch": 2761} {"train_loss": -24.77251625061035, "global_step": 229198, "epoch": 2761} {"train_loss": -24.547866821289062, "global_step": 229199, "epoch": 2761} {"train_loss": -24.942441940307617, "global_step": 229200, "epoch": 2761} {"train_loss": -24.812807083129883, "global_step": 229201, "epoch": 2761} {"train_loss": -24.65360450744629, "global_step": 229202, "epoch": 2761} {"train_loss": -25.013641357421875, "global_step": 229203, "epoch": 2761} {"train_loss": -24.8737850189209, "global_step": 229204, "epoch": 2761} {"train_loss": -24.97607421875, "global_step": 229205, "epoch": 2761} {"train_loss": -24.531930923461914, "global_step": 229206, "epoch": 2761} {"train_loss": -24.94086265563965, "global_step": 229207, "epoch": 2761} {"train_loss": -24.71065330505371, "global_step": 229208, "epoch": 2761} {"train_loss": -24.92643165588379, "global_step": 229209, "epoch": 2761} {"train_loss": -24.842737197875977, "global_step": 229210, "epoch": 2761} {"train_loss": -24.830907821655273, "global_step": 229211, "epoch": 2761} {"train_loss": -24.576082229614258, "global_step": 229212, "epoch": 2761} {"train_loss": -24.83430290222168, "global_step": 229213, "epoch": 2761} {"train_loss": -24.596393585205078, "global_step": 229214, "epoch": 2761} {"train_loss": -24.730276107788086, "global_step": 229215, "epoch": 2761} {"train_loss": -24.7276611328125, "global_step": 229216, "epoch": 2761} {"train_loss": -24.81045913696289, "global_step": 229217, "epoch": 2761} {"train_loss": -24.235492706298828, "global_step": 229218, "epoch": 2761} {"train_loss": -24.297292709350586, "global_step": 229219, "epoch": 2761} {"train_loss": -24.520748138427734, "global_step": 229220, "epoch": 2761} {"train_loss": -25.137649536132812, "global_step": 229221, "epoch": 2761} {"train_loss": -24.39154624938965, "global_step": 229222, "epoch": 2761} {"train_loss": -24.469968795776367, "global_step": 229223, "epoch": 2761} {"train_loss": -24.985563278198242, "global_step": 229224, "epoch": 2761} {"train_loss": -24.82374382019043, "global_step": 229225, "epoch": 2761} {"train_loss": -24.727462768554688, "global_step": 229226, "epoch": 2761} {"train_loss": -24.398569107055664, "global_step": 229227, "epoch": 2761} {"train_loss": -24.480451583862305, "global_step": 229228, "epoch": 2761} {"train_loss": -24.825231552124023, "global_step": 229229, "epoch": 2761} {"train_loss": -24.95046043395996, "global_step": 229230, "epoch": 2761} {"train_loss": -24.838605880737305, "global_step": 229231, "epoch": 2761} {"train_loss": -24.829858779907227, "global_step": 229232, "epoch": 2761} {"train_loss": -24.675067901611328, "global_step": 229233, "epoch": 2761} {"train_loss": -25.06178092956543, "global_step": 229234, "epoch": 2761} {"train_loss": -24.616689682006836, "global_step": 229235, "epoch": 2761} {"train_loss": -24.71294403076172, "global_step": 229236, "epoch": 2761} {"train_loss": -24.875864028930664, "global_step": 229237, "epoch": 2761} {"train_loss": -24.885589599609375, "global_step": 229238, "epoch": 2761} {"train_loss": -24.699872970581055, "global_step": 229239, "epoch": 2761} {"train_loss": -24.68964958190918, "global_step": 229240, "epoch": 2761} {"train_loss": -24.720792770385742, "global_step": 229241, "epoch": 2761} {"train_loss": -24.89447593688965, "global_step": 229242, "epoch": 2761} {"train_loss": -24.904836654663086, "global_step": 229243, "epoch": 2761} {"train_loss": -25.190603256225586, "global_step": 229244, "epoch": 2761} {"train_loss": -24.61627884370735, "global_step": 229245, "epoch": 2761, "val_loss": 6829707.0} {"train_loss": -24.367605209350586, "global_step": 229246, "epoch": 2762} {"train_loss": -24.279830932617188, "global_step": 229247, "epoch": 2762} {"train_loss": -24.662626266479492, "global_step": 229248, "epoch": 2762} {"train_loss": -24.30284881591797, "global_step": 229249, "epoch": 2762} {"train_loss": -24.218435287475586, "global_step": 229250, "epoch": 2762} {"train_loss": -24.51599884033203, "global_step": 229251, "epoch": 2762} {"train_loss": -24.484073638916016, "global_step": 229252, "epoch": 2762} {"train_loss": -24.31231689453125, "global_step": 229253, "epoch": 2762} {"train_loss": -24.86646270751953, "global_step": 229254, "epoch": 2762} {"train_loss": -24.518293380737305, "global_step": 229255, "epoch": 2762} {"train_loss": -24.28995704650879, "global_step": 229256, "epoch": 2762} {"train_loss": -24.509328842163086, "global_step": 229257, "epoch": 2762} {"train_loss": -24.257211685180664, "global_step": 229258, "epoch": 2762} {"train_loss": -24.667783737182617, "global_step": 229259, "epoch": 2762} {"train_loss": -24.39813804626465, "global_step": 229260, "epoch": 2762} {"train_loss": -24.512983322143555, "global_step": 229261, "epoch": 2762} {"train_loss": -24.667884826660156, "global_step": 229262, "epoch": 2762} {"train_loss": -24.862836837768555, "global_step": 229263, "epoch": 2762} {"train_loss": -24.210744857788086, "global_step": 229264, "epoch": 2762} {"train_loss": -24.4840030670166, "global_step": 229265, "epoch": 2762} {"train_loss": -24.62038803100586, "global_step": 229266, "epoch": 2762} {"train_loss": -24.716106414794922, "global_step": 229267, "epoch": 2762} {"train_loss": -24.700929641723633, "global_step": 229268, "epoch": 2762} {"train_loss": -24.446125030517578, "global_step": 229269, "epoch": 2762} {"train_loss": -24.60126304626465, "global_step": 229270, "epoch": 2762} {"train_loss": -24.5091552734375, "global_step": 229271, "epoch": 2762} {"train_loss": -25.065677642822266, "global_step": 229272, "epoch": 2762} {"train_loss": -24.4527645111084, "global_step": 229273, "epoch": 2762} {"train_loss": -24.723995208740234, "global_step": 229274, "epoch": 2762} {"train_loss": -24.64824867248535, "global_step": 229275, "epoch": 2762} {"train_loss": -24.80780601501465, "global_step": 229276, "epoch": 2762} {"train_loss": -25.044353485107422, "global_step": 229277, "epoch": 2762} {"train_loss": -24.988283157348633, "global_step": 229278, "epoch": 2762} {"train_loss": -24.704181671142578, "global_step": 229279, "epoch": 2762} {"train_loss": -24.74836540222168, "global_step": 229280, "epoch": 2762} {"train_loss": -24.50901222229004, "global_step": 229281, "epoch": 2762} {"train_loss": -24.672794342041016, "global_step": 229282, "epoch": 2762} {"train_loss": -24.751123428344727, "global_step": 229283, "epoch": 2762} {"train_loss": -24.617807388305664, "global_step": 229284, "epoch": 2762} {"train_loss": -24.771799087524414, "global_step": 229285, "epoch": 2762} {"train_loss": -24.838407516479492, "global_step": 229286, "epoch": 2762} {"train_loss": -24.703243255615234, "global_step": 229287, "epoch": 2762} {"train_loss": -24.930774688720703, "global_step": 229288, "epoch": 2762} {"train_loss": -24.836654663085938, "global_step": 229289, "epoch": 2762} {"train_loss": -24.949676513671875, "global_step": 229290, "epoch": 2762} {"train_loss": -24.416173934936523, "global_step": 229291, "epoch": 2762} {"train_loss": -24.989347457885742, "global_step": 229292, "epoch": 2762} {"train_loss": -24.746253967285156, "global_step": 229293, "epoch": 2762} {"train_loss": -24.5941104888916, "global_step": 229294, "epoch": 2762} {"train_loss": -24.83032989501953, "global_step": 229295, "epoch": 2762} {"train_loss": -24.600345611572266, "global_step": 229296, "epoch": 2762} {"train_loss": -24.98554801940918, "global_step": 229297, "epoch": 2762} {"train_loss": -24.79111671447754, "global_step": 229298, "epoch": 2762} {"train_loss": -24.469158172607422, "global_step": 229299, "epoch": 2762} {"train_loss": -24.454517364501953, "global_step": 229300, "epoch": 2762} {"train_loss": -24.64349937438965, "global_step": 229301, "epoch": 2762} {"train_loss": -25.318260192871094, "global_step": 229302, "epoch": 2762} {"train_loss": -24.267986297607422, "global_step": 229303, "epoch": 2762} {"train_loss": -24.99106216430664, "global_step": 229304, "epoch": 2762} {"train_loss": -24.582117080688477, "global_step": 229305, "epoch": 2762} {"train_loss": -24.795515060424805, "global_step": 229306, "epoch": 2762} {"train_loss": -24.652780532836914, "global_step": 229307, "epoch": 2762} {"train_loss": -24.6237850189209, "global_step": 229308, "epoch": 2762} {"train_loss": -24.756317138671875, "global_step": 229309, "epoch": 2762} {"train_loss": -24.87662696838379, "global_step": 229310, "epoch": 2762} {"train_loss": -24.627317428588867, "global_step": 229311, "epoch": 2762} {"train_loss": -24.776233673095703, "global_step": 229312, "epoch": 2762} {"train_loss": -24.442176818847656, "global_step": 229313, "epoch": 2762} {"train_loss": -24.41934585571289, "global_step": 229314, "epoch": 2762} {"train_loss": -25.029882431030273, "global_step": 229315, "epoch": 2762} {"train_loss": -24.380582809448242, "global_step": 229316, "epoch": 2762} {"train_loss": -24.62889289855957, "global_step": 229317, "epoch": 2762} {"train_loss": -24.8015079498291, "global_step": 229318, "epoch": 2762} {"train_loss": -24.521045684814453, "global_step": 229319, "epoch": 2762} {"train_loss": -24.90769386291504, "global_step": 229320, "epoch": 2762} {"train_loss": -24.887958526611328, "global_step": 229321, "epoch": 2762} {"train_loss": -24.816953659057617, "global_step": 229322, "epoch": 2762} {"train_loss": -24.90514373779297, "global_step": 229323, "epoch": 2762} {"train_loss": -24.86111831665039, "global_step": 229324, "epoch": 2762} {"train_loss": -24.57769775390625, "global_step": 229325, "epoch": 2762} {"train_loss": -24.51788902282715, "global_step": 229326, "epoch": 2762} {"train_loss": -24.5887393951416, "global_step": 229327, "epoch": 2762} {"train_loss": -24.672185139483716, "global_step": 229328, "epoch": 2762, "val_loss": 6678514.5} {"train_loss": -24.451248168945312, "global_step": 229329, "epoch": 2763} {"train_loss": -24.038991928100586, "global_step": 229330, "epoch": 2763} {"train_loss": -23.989538192749023, "global_step": 229331, "epoch": 2763} {"train_loss": -24.374582290649414, "global_step": 229332, "epoch": 2763} {"train_loss": -24.757976531982422, "global_step": 229333, "epoch": 2763} {"train_loss": -24.386920928955078, "global_step": 229334, "epoch": 2763} {"train_loss": -24.33197021484375, "global_step": 229335, "epoch": 2763} {"train_loss": -24.13927459716797, "global_step": 229336, "epoch": 2763} {"train_loss": -24.597475051879883, "global_step": 229337, "epoch": 2763} {"train_loss": -24.67327308654785, "global_step": 229338, "epoch": 2763} {"train_loss": -24.518436431884766, "global_step": 229339, "epoch": 2763} {"train_loss": -24.685062408447266, "global_step": 229340, "epoch": 2763} {"train_loss": -24.40061378479004, "global_step": 229341, "epoch": 2763} {"train_loss": -24.99812889099121, "global_step": 229342, "epoch": 2763} {"train_loss": -24.884204864501953, "global_step": 229343, "epoch": 2763} {"train_loss": -24.542966842651367, "global_step": 229344, "epoch": 2763} {"train_loss": -24.758197784423828, "global_step": 229345, "epoch": 2763} {"train_loss": -24.608631134033203, "global_step": 229346, "epoch": 2763} {"train_loss": -24.943822860717773, "global_step": 229347, "epoch": 2763} {"train_loss": -25.06682014465332, "global_step": 229348, "epoch": 2763} {"train_loss": -24.703439712524414, "global_step": 229349, "epoch": 2763} {"train_loss": -24.457914352416992, "global_step": 229350, "epoch": 2763} {"train_loss": -25.2471866607666, "global_step": 229351, "epoch": 2763} {"train_loss": -24.71306800842285, "global_step": 229352, "epoch": 2763} {"train_loss": -24.695430755615234, "global_step": 229353, "epoch": 2763} {"train_loss": -24.941280364990234, "global_step": 229354, "epoch": 2763} {"train_loss": -24.755748748779297, "global_step": 229355, "epoch": 2763} {"train_loss": -24.596149444580078, "global_step": 229356, "epoch": 2763} {"train_loss": -24.94098663330078, "global_step": 229357, "epoch": 2763} {"train_loss": -24.75127410888672, "global_step": 229358, "epoch": 2763} {"train_loss": -24.734750747680664, "global_step": 229359, "epoch": 2763} {"train_loss": -24.729589462280273, "global_step": 229360, "epoch": 2763} {"train_loss": -24.893035888671875, "global_step": 229361, "epoch": 2763} {"train_loss": -24.451696395874023, "global_step": 229362, "epoch": 2763} {"train_loss": -25.210046768188477, "global_step": 229363, "epoch": 2763} {"train_loss": -24.690351486206055, "global_step": 229364, "epoch": 2763} {"train_loss": -25.044132232666016, "global_step": 229365, "epoch": 2763} {"train_loss": -24.976043701171875, "global_step": 229366, "epoch": 2763} {"train_loss": -24.834716796875, "global_step": 229367, "epoch": 2763} {"train_loss": -24.936403274536133, "global_step": 229368, "epoch": 2763} {"train_loss": -24.87879753112793, "global_step": 229369, "epoch": 2763} {"train_loss": -24.40603256225586, "global_step": 229370, "epoch": 2763} {"train_loss": -24.964921951293945, "global_step": 229371, "epoch": 2763} {"train_loss": -24.32748031616211, "global_step": 229372, "epoch": 2763} {"train_loss": -24.582307815551758, "global_step": 229373, "epoch": 2763} {"train_loss": -24.5734806060791, "global_step": 229374, "epoch": 2763} {"train_loss": -24.682525634765625, "global_step": 229375, "epoch": 2763} {"train_loss": -24.50408363342285, "global_step": 229376, "epoch": 2763} {"train_loss": -24.7216854095459, "global_step": 229377, "epoch": 2763} {"train_loss": -24.714109420776367, "global_step": 229378, "epoch": 2763} {"train_loss": -24.54074478149414, "global_step": 229379, "epoch": 2763} {"train_loss": -24.595487594604492, "global_step": 229380, "epoch": 2763} {"train_loss": -24.15994644165039, "global_step": 229381, "epoch": 2763} {"train_loss": -24.0858097076416, "global_step": 229382, "epoch": 2763} {"train_loss": -24.442874908447266, "global_step": 229383, "epoch": 2763} {"train_loss": -24.93619728088379, "global_step": 229384, "epoch": 2763} {"train_loss": -24.426921844482422, "global_step": 229385, "epoch": 2763} {"train_loss": -24.56813621520996, "global_step": 229386, "epoch": 2763} {"train_loss": -24.680694580078125, "global_step": 229387, "epoch": 2763} {"train_loss": -24.346405029296875, "global_step": 229388, "epoch": 2763} {"train_loss": -24.48253631591797, "global_step": 229389, "epoch": 2763} {"train_loss": -24.540925979614258, "global_step": 229390, "epoch": 2763} {"train_loss": -24.36977195739746, "global_step": 229391, "epoch": 2763} {"train_loss": -24.450336456298828, "global_step": 229392, "epoch": 2763} {"train_loss": -24.668476104736328, "global_step": 229393, "epoch": 2763} {"train_loss": -24.612144470214844, "global_step": 229394, "epoch": 2763} {"train_loss": -24.722299575805664, "global_step": 229395, "epoch": 2763} {"train_loss": -24.55710792541504, "global_step": 229396, "epoch": 2763} {"train_loss": -24.728164672851562, "global_step": 229397, "epoch": 2763} {"train_loss": -24.69098472595215, "global_step": 229398, "epoch": 2763} {"train_loss": -24.30061912536621, "global_step": 229399, "epoch": 2763} {"train_loss": -24.503507614135742, "global_step": 229400, "epoch": 2763} {"train_loss": -24.887577056884766, "global_step": 229401, "epoch": 2763} {"train_loss": -24.979692459106445, "global_step": 229402, "epoch": 2763} {"train_loss": -24.619272232055664, "global_step": 229403, "epoch": 2763} {"train_loss": -24.659381866455078, "global_step": 229404, "epoch": 2763} {"train_loss": -24.774658203125, "global_step": 229405, "epoch": 2763} {"train_loss": -24.681522369384766, "global_step": 229406, "epoch": 2763} {"train_loss": -24.8465633392334, "global_step": 229407, "epoch": 2763} {"train_loss": -24.599573135375977, "global_step": 229408, "epoch": 2763} {"train_loss": -24.640939712524414, "global_step": 229409, "epoch": 2763} {"train_loss": -24.96409034729004, "global_step": 229410, "epoch": 2763} {"train_loss": -24.648750902658485, "global_step": 229411, "epoch": 2763, "val_loss": 6614038.0} {"train_loss": -23.938236236572266, "global_step": 229412, "epoch": 2764} {"train_loss": -24.243518829345703, "global_step": 229413, "epoch": 2764} {"train_loss": -24.232179641723633, "global_step": 229414, "epoch": 2764} {"train_loss": -24.11252212524414, "global_step": 229415, "epoch": 2764} {"train_loss": -24.467130661010742, "global_step": 229416, "epoch": 2764} {"train_loss": -23.979970932006836, "global_step": 229417, "epoch": 2764} {"train_loss": -24.230527877807617, "global_step": 229418, "epoch": 2764} {"train_loss": -24.113737106323242, "global_step": 229419, "epoch": 2764} {"train_loss": -24.4860897064209, "global_step": 229420, "epoch": 2764} {"train_loss": -24.203617095947266, "global_step": 229421, "epoch": 2764} {"train_loss": -24.4675235748291, "global_step": 229422, "epoch": 2764} {"train_loss": -24.45412254333496, "global_step": 229423, "epoch": 2764} {"train_loss": -24.187631607055664, "global_step": 229424, "epoch": 2764} {"train_loss": -24.65128517150879, "global_step": 229425, "epoch": 2764} {"train_loss": -24.28037452697754, "global_step": 229426, "epoch": 2764} {"train_loss": -24.462491989135742, "global_step": 229427, "epoch": 2764} {"train_loss": -24.236530303955078, "global_step": 229428, "epoch": 2764} {"train_loss": -24.572683334350586, "global_step": 229429, "epoch": 2764} {"train_loss": -24.691526412963867, "global_step": 229430, "epoch": 2764} {"train_loss": -24.502395629882812, "global_step": 229431, "epoch": 2764} {"train_loss": -24.712217330932617, "global_step": 229432, "epoch": 2764} {"train_loss": -24.527755737304688, "global_step": 229433, "epoch": 2764} {"train_loss": -24.67142677307129, "global_step": 229434, "epoch": 2764} {"train_loss": -24.560810089111328, "global_step": 229435, "epoch": 2764} {"train_loss": -24.770280838012695, "global_step": 229436, "epoch": 2764} {"train_loss": -24.729019165039062, "global_step": 229437, "epoch": 2764} {"train_loss": -24.72185707092285, "global_step": 229438, "epoch": 2764} {"train_loss": -25.07701301574707, "global_step": 229439, "epoch": 2764} {"train_loss": -24.466726303100586, "global_step": 229440, "epoch": 2764} {"train_loss": -24.45918846130371, "global_step": 229441, "epoch": 2764} {"train_loss": -24.681888580322266, "global_step": 229442, "epoch": 2764} {"train_loss": -24.82190704345703, "global_step": 229443, "epoch": 2764} {"train_loss": -24.75881004333496, "global_step": 229444, "epoch": 2764} {"train_loss": -24.701290130615234, "global_step": 229445, "epoch": 2764} {"train_loss": -24.659109115600586, "global_step": 229446, "epoch": 2764} {"train_loss": -24.43967628479004, "global_step": 229447, "epoch": 2764} {"train_loss": -25.244831085205078, "global_step": 229448, "epoch": 2764} {"train_loss": -24.65966033935547, "global_step": 229449, "epoch": 2764} {"train_loss": -24.415359497070312, "global_step": 229450, "epoch": 2764} {"train_loss": -24.63080406188965, "global_step": 229451, "epoch": 2764} {"train_loss": -24.70164680480957, "global_step": 229452, "epoch": 2764} {"train_loss": -25.235952377319336, "global_step": 229453, "epoch": 2764} {"train_loss": -24.737409591674805, "global_step": 229454, "epoch": 2764} {"train_loss": -24.774391174316406, "global_step": 229455, "epoch": 2764} {"train_loss": -24.494338989257812, "global_step": 229456, "epoch": 2764} {"train_loss": -25.13980484008789, "global_step": 229457, "epoch": 2764} {"train_loss": -25.086519241333008, "global_step": 229458, "epoch": 2764} {"train_loss": -24.707233428955078, "global_step": 229459, "epoch": 2764} {"train_loss": -24.895206451416016, "global_step": 229460, "epoch": 2764} {"train_loss": -24.79412269592285, "global_step": 229461, "epoch": 2764} {"train_loss": -24.690189361572266, "global_step": 229462, "epoch": 2764} {"train_loss": -24.768712997436523, "global_step": 229463, "epoch": 2764} {"train_loss": -24.600011825561523, "global_step": 229464, "epoch": 2764} {"train_loss": -24.67097282409668, "global_step": 229465, "epoch": 2764} {"train_loss": -24.708715438842773, "global_step": 229466, "epoch": 2764} {"train_loss": -24.65212059020996, "global_step": 229467, "epoch": 2764} {"train_loss": -25.070650100708008, "global_step": 229468, "epoch": 2764} {"train_loss": -24.668832778930664, "global_step": 229469, "epoch": 2764} {"train_loss": -24.802169799804688, "global_step": 229470, "epoch": 2764} {"train_loss": -24.732919692993164, "global_step": 229471, "epoch": 2764} {"train_loss": -24.71338653564453, "global_step": 229472, "epoch": 2764} {"train_loss": -24.829967498779297, "global_step": 229473, "epoch": 2764} {"train_loss": -24.672508239746094, "global_step": 229474, "epoch": 2764} {"train_loss": -24.948617935180664, "global_step": 229475, "epoch": 2764} {"train_loss": -24.91676139831543, "global_step": 229476, "epoch": 2764} {"train_loss": -24.81520652770996, "global_step": 229477, "epoch": 2764} {"train_loss": -24.864927291870117, "global_step": 229478, "epoch": 2764} {"train_loss": -24.447200775146484, "global_step": 229479, "epoch": 2764} {"train_loss": -24.428205490112305, "global_step": 229480, "epoch": 2764} {"train_loss": -24.9884033203125, "global_step": 229481, "epoch": 2764} {"train_loss": -23.92824363708496, "global_step": 229482, "epoch": 2764} {"train_loss": -24.43848991394043, "global_step": 229483, "epoch": 2764} {"train_loss": -24.435155868530273, "global_step": 229484, "epoch": 2764} {"train_loss": -24.42824363708496, "global_step": 229485, "epoch": 2764} {"train_loss": -24.5980281829834, "global_step": 229486, "epoch": 2764} {"train_loss": -24.31407928466797, "global_step": 229487, "epoch": 2764} {"train_loss": -24.582624435424805, "global_step": 229488, "epoch": 2764} {"train_loss": -24.539865493774414, "global_step": 229489, "epoch": 2764} {"train_loss": -24.36616325378418, "global_step": 229490, "epoch": 2764} {"train_loss": -24.956497192382812, "global_step": 229491, "epoch": 2764} {"train_loss": -24.9041748046875, "global_step": 229492, "epoch": 2764} {"train_loss": -24.462247848510742, "global_step": 229493, "epoch": 2764} {"train_loss": -24.612434180386096, "global_step": 229494, "epoch": 2764, "val_loss": 6758622.0} {"train_loss": -24.102994918823242, "global_step": 229495, "epoch": 2765} {"train_loss": -23.736806869506836, "global_step": 229496, "epoch": 2765} {"train_loss": -24.052427291870117, "global_step": 229497, "epoch": 2765} {"train_loss": -24.098480224609375, "global_step": 229498, "epoch": 2765} {"train_loss": -24.064008712768555, "global_step": 229499, "epoch": 2765} {"train_loss": -24.13599395751953, "global_step": 229500, "epoch": 2765} {"train_loss": -24.364084243774414, "global_step": 229501, "epoch": 2765} {"train_loss": -24.534671783447266, "global_step": 229502, "epoch": 2765} {"train_loss": -24.20033073425293, "global_step": 229503, "epoch": 2765} {"train_loss": -24.394132614135742, "global_step": 229504, "epoch": 2765} {"train_loss": -24.663883209228516, "global_step": 229505, "epoch": 2765} {"train_loss": -24.4385929107666, "global_step": 229506, "epoch": 2765} {"train_loss": -24.564929962158203, "global_step": 229507, "epoch": 2765} {"train_loss": -24.437931060791016, "global_step": 229508, "epoch": 2765} {"train_loss": -24.53127098083496, "global_step": 229509, "epoch": 2765} {"train_loss": -24.54880714416504, "global_step": 229510, "epoch": 2765} {"train_loss": -24.882160186767578, "global_step": 229511, "epoch": 2765} {"train_loss": -24.661483764648438, "global_step": 229512, "epoch": 2765} {"train_loss": -24.702665328979492, "global_step": 229513, "epoch": 2765} {"train_loss": -24.567148208618164, "global_step": 229514, "epoch": 2765} {"train_loss": -24.376815795898438, "global_step": 229515, "epoch": 2765} {"train_loss": -24.2312068939209, "global_step": 229516, "epoch": 2765} {"train_loss": -24.587865829467773, "global_step": 229517, "epoch": 2765} {"train_loss": -24.795318603515625, "global_step": 229518, "epoch": 2765} {"train_loss": -24.825284957885742, "global_step": 229519, "epoch": 2765} {"train_loss": -24.410125732421875, "global_step": 229520, "epoch": 2765} {"train_loss": -24.960006713867188, "global_step": 229521, "epoch": 2765} {"train_loss": -24.861982345581055, "global_step": 229522, "epoch": 2765} {"train_loss": -24.719533920288086, "global_step": 229523, "epoch": 2765} {"train_loss": -24.715747833251953, "global_step": 229524, "epoch": 2765} {"train_loss": -24.864877700805664, "global_step": 229525, "epoch": 2765} {"train_loss": -24.567955017089844, "global_step": 229526, "epoch": 2765} {"train_loss": -24.66599464416504, "global_step": 229527, "epoch": 2765} {"train_loss": -25.176528930664062, "global_step": 229528, "epoch": 2765} {"train_loss": -24.77686882019043, "global_step": 229529, "epoch": 2765} {"train_loss": -24.776641845703125, "global_step": 229530, "epoch": 2765} {"train_loss": -24.720705032348633, "global_step": 229531, "epoch": 2765} {"train_loss": -24.493576049804688, "global_step": 229532, "epoch": 2765} {"train_loss": -25.00655174255371, "global_step": 229533, "epoch": 2765} {"train_loss": -25.005340576171875, "global_step": 229534, "epoch": 2765} {"train_loss": -24.78786277770996, "global_step": 229535, "epoch": 2765} {"train_loss": -24.628793716430664, "global_step": 229536, "epoch": 2765} {"train_loss": -24.941612243652344, "global_step": 229537, "epoch": 2765} {"train_loss": -24.864795684814453, "global_step": 229538, "epoch": 2765} {"train_loss": -24.58310890197754, "global_step": 229539, "epoch": 2765} {"train_loss": -24.431488037109375, "global_step": 229540, "epoch": 2765} {"train_loss": -24.497404098510742, "global_step": 229541, "epoch": 2765} {"train_loss": -24.82492446899414, "global_step": 229542, "epoch": 2765} {"train_loss": -25.041595458984375, "global_step": 229543, "epoch": 2765} {"train_loss": -24.677053451538086, "global_step": 229544, "epoch": 2765} {"train_loss": -24.686918258666992, "global_step": 229545, "epoch": 2765} {"train_loss": -24.53566551208496, "global_step": 229546, "epoch": 2765} {"train_loss": -24.469268798828125, "global_step": 229547, "epoch": 2765} {"train_loss": -24.18204116821289, "global_step": 229548, "epoch": 2765} {"train_loss": -24.72238540649414, "global_step": 229549, "epoch": 2765} {"train_loss": -25.281387329101562, "global_step": 229550, "epoch": 2765} {"train_loss": -24.664567947387695, "global_step": 229551, "epoch": 2765} {"train_loss": -24.428070068359375, "global_step": 229552, "epoch": 2765} {"train_loss": -24.72119140625, "global_step": 229553, "epoch": 2765} {"train_loss": -24.498388290405273, "global_step": 229554, "epoch": 2765} {"train_loss": -24.871057510375977, "global_step": 229555, "epoch": 2765} {"train_loss": -24.431838989257812, "global_step": 229556, "epoch": 2765} {"train_loss": -24.931148529052734, "global_step": 229557, "epoch": 2765} {"train_loss": -24.599456787109375, "global_step": 229558, "epoch": 2765} {"train_loss": -25.053466796875, "global_step": 229559, "epoch": 2765} {"train_loss": -24.68873405456543, "global_step": 229560, "epoch": 2765} {"train_loss": -24.742883682250977, "global_step": 229561, "epoch": 2765} {"train_loss": -24.619976043701172, "global_step": 229562, "epoch": 2765} {"train_loss": -24.95184898376465, "global_step": 229563, "epoch": 2765} {"train_loss": -24.473316192626953, "global_step": 229564, "epoch": 2765} {"train_loss": -24.649778366088867, "global_step": 229565, "epoch": 2765} {"train_loss": -25.009401321411133, "global_step": 229566, "epoch": 2765} {"train_loss": -24.564895629882812, "global_step": 229567, "epoch": 2765} {"train_loss": -24.721878051757812, "global_step": 229568, "epoch": 2765} {"train_loss": -24.826810836791992, "global_step": 229569, "epoch": 2765} {"train_loss": -24.896602630615234, "global_step": 229570, "epoch": 2765} {"train_loss": -24.69379234313965, "global_step": 229571, "epoch": 2765} {"train_loss": -24.682096481323242, "global_step": 229572, "epoch": 2765} {"train_loss": -24.714574813842773, "global_step": 229573, "epoch": 2765} {"train_loss": -24.974912643432617, "global_step": 229574, "epoch": 2765} {"train_loss": -24.657363891601562, "global_step": 229575, "epoch": 2765} {"train_loss": -24.859352111816406, "global_step": 229576, "epoch": 2765} {"train_loss": -24.647860423628106, "global_step": 229577, "epoch": 2765, "val_loss": 6768546.0} {"train_loss": -24.86087417602539, "global_step": 229578, "epoch": 2766} {"train_loss": -24.15174674987793, "global_step": 229579, "epoch": 2766} {"train_loss": -24.471364974975586, "global_step": 229580, "epoch": 2766} {"train_loss": -24.387550354003906, "global_step": 229581, "epoch": 2766} {"train_loss": -24.60700035095215, "global_step": 229582, "epoch": 2766} {"train_loss": -24.75069236755371, "global_step": 229583, "epoch": 2766} {"train_loss": -24.225934982299805, "global_step": 229584, "epoch": 2766} {"train_loss": -24.300321578979492, "global_step": 229585, "epoch": 2766} {"train_loss": -23.3550968170166, "global_step": 229586, "epoch": 2766} {"train_loss": -23.910505294799805, "global_step": 229587, "epoch": 2766} {"train_loss": -23.62668800354004, "global_step": 229588, "epoch": 2766} {"train_loss": -24.502704620361328, "global_step": 229589, "epoch": 2766} {"train_loss": -24.072519302368164, "global_step": 229590, "epoch": 2766} {"train_loss": -24.631427764892578, "global_step": 229591, "epoch": 2766} {"train_loss": -24.433225631713867, "global_step": 229592, "epoch": 2766} {"train_loss": -24.466211318969727, "global_step": 229593, "epoch": 2766} {"train_loss": -24.634416580200195, "global_step": 229594, "epoch": 2766} {"train_loss": -24.42287254333496, "global_step": 229595, "epoch": 2766} {"train_loss": -24.63258934020996, "global_step": 229596, "epoch": 2766} {"train_loss": -24.39483642578125, "global_step": 229597, "epoch": 2766} {"train_loss": -24.429441452026367, "global_step": 229598, "epoch": 2766} {"train_loss": -24.848468780517578, "global_step": 229599, "epoch": 2766} {"train_loss": -25.016576766967773, "global_step": 229600, "epoch": 2766} {"train_loss": -24.522464752197266, "global_step": 229601, "epoch": 2766} {"train_loss": -24.858482360839844, "global_step": 229602, "epoch": 2766} {"train_loss": -24.980398178100586, "global_step": 229603, "epoch": 2766} {"train_loss": -24.679622650146484, "global_step": 229604, "epoch": 2766} {"train_loss": -24.9307804107666, "global_step": 229605, "epoch": 2766} {"train_loss": -24.761030197143555, "global_step": 229606, "epoch": 2766} {"train_loss": -24.834423065185547, "global_step": 229607, "epoch": 2766} {"train_loss": -24.52108383178711, "global_step": 229608, "epoch": 2766} {"train_loss": -24.64309310913086, "global_step": 229609, "epoch": 2766} {"train_loss": -24.834203720092773, "global_step": 229610, "epoch": 2766} {"train_loss": -24.687673568725586, "global_step": 229611, "epoch": 2766} {"train_loss": -25.015233993530273, "global_step": 229612, "epoch": 2766} {"train_loss": -24.724308013916016, "global_step": 229613, "epoch": 2766} {"train_loss": -24.55299186706543, "global_step": 229614, "epoch": 2766} {"train_loss": -24.449466705322266, "global_step": 229615, "epoch": 2766} {"train_loss": -25.039987564086914, "global_step": 229616, "epoch": 2766} {"train_loss": -24.986955642700195, "global_step": 229617, "epoch": 2766} {"train_loss": -24.830244064331055, "global_step": 229618, "epoch": 2766} {"train_loss": -25.023916244506836, "global_step": 229619, "epoch": 2766} {"train_loss": -24.983978271484375, "global_step": 229620, "epoch": 2766} {"train_loss": -24.790891647338867, "global_step": 229621, "epoch": 2766} {"train_loss": -25.087743759155273, "global_step": 229622, "epoch": 2766} {"train_loss": -25.003618240356445, "global_step": 229623, "epoch": 2766} {"train_loss": -24.672657012939453, "global_step": 229624, "epoch": 2766} {"train_loss": -24.928253173828125, "global_step": 229625, "epoch": 2766} {"train_loss": -25.24262046813965, "global_step": 229626, "epoch": 2766} {"train_loss": -24.966144561767578, "global_step": 229627, "epoch": 2766} {"train_loss": -24.677448272705078, "global_step": 229628, "epoch": 2766} {"train_loss": -24.913000106811523, "global_step": 229629, "epoch": 2766} {"train_loss": -24.672407150268555, "global_step": 229630, "epoch": 2766} {"train_loss": -25.165082931518555, "global_step": 229631, "epoch": 2766} {"train_loss": -25.003450393676758, "global_step": 229632, "epoch": 2766} {"train_loss": -25.206499099731445, "global_step": 229633, "epoch": 2766} {"train_loss": -24.929311752319336, "global_step": 229634, "epoch": 2766} {"train_loss": -24.792890548706055, "global_step": 229635, "epoch": 2766} {"train_loss": -24.67433738708496, "global_step": 229636, "epoch": 2766} {"train_loss": -24.85523796081543, "global_step": 229637, "epoch": 2766} {"train_loss": -25.101139068603516, "global_step": 229638, "epoch": 2766} {"train_loss": -24.64862060546875, "global_step": 229639, "epoch": 2766} {"train_loss": -24.49045753479004, "global_step": 229640, "epoch": 2766} {"train_loss": -24.285598754882812, "global_step": 229641, "epoch": 2766} {"train_loss": -24.38814926147461, "global_step": 229642, "epoch": 2766} {"train_loss": -24.178680419921875, "global_step": 229643, "epoch": 2766} {"train_loss": -24.257261276245117, "global_step": 229644, "epoch": 2766} {"train_loss": -23.98067283630371, "global_step": 229645, "epoch": 2766} {"train_loss": -24.554771423339844, "global_step": 229646, "epoch": 2766} {"train_loss": -24.699071884155273, "global_step": 229647, "epoch": 2766} {"train_loss": -24.238372802734375, "global_step": 229648, "epoch": 2766} {"train_loss": -24.648130416870117, "global_step": 229649, "epoch": 2766} {"train_loss": -24.593175888061523, "global_step": 229650, "epoch": 2766} {"train_loss": -24.68135643005371, "global_step": 229651, "epoch": 2766} {"train_loss": -24.310678482055664, "global_step": 229652, "epoch": 2766} {"train_loss": -24.657747268676758, "global_step": 229653, "epoch": 2766} {"train_loss": -24.582616806030273, "global_step": 229654, "epoch": 2766} {"train_loss": -24.77879524230957, "global_step": 229655, "epoch": 2766} {"train_loss": -24.71965980529785, "global_step": 229656, "epoch": 2766} {"train_loss": -24.476755142211914, "global_step": 229657, "epoch": 2766} {"train_loss": -24.76028060913086, "global_step": 229658, "epoch": 2766} {"train_loss": -24.756479263305664, "global_step": 229659, "epoch": 2766} {"train_loss": -24.651146003998907, "global_step": 229660, "epoch": 2766, "val_loss": 6830460.0} {"train_loss": -23.99137306213379, "global_step": 229661, "epoch": 2767} {"train_loss": -24.61213493347168, "global_step": 229662, "epoch": 2767} {"train_loss": -24.4630184173584, "global_step": 229663, "epoch": 2767} {"train_loss": -24.81308364868164, "global_step": 229664, "epoch": 2767} {"train_loss": -24.213886260986328, "global_step": 229665, "epoch": 2767} {"train_loss": -24.699460983276367, "global_step": 229666, "epoch": 2767} {"train_loss": -24.241270065307617, "global_step": 229667, "epoch": 2767} {"train_loss": -24.18934440612793, "global_step": 229668, "epoch": 2767} {"train_loss": -24.614145278930664, "global_step": 229669, "epoch": 2767} {"train_loss": -24.630245208740234, "global_step": 229670, "epoch": 2767} {"train_loss": -24.450119018554688, "global_step": 229671, "epoch": 2767} {"train_loss": -24.511442184448242, "global_step": 229672, "epoch": 2767} {"train_loss": -24.71099281311035, "global_step": 229673, "epoch": 2767} {"train_loss": -24.602249145507812, "global_step": 229674, "epoch": 2767} {"train_loss": -24.504703521728516, "global_step": 229675, "epoch": 2767} {"train_loss": -25.03736114501953, "global_step": 229676, "epoch": 2767} {"train_loss": -24.761098861694336, "global_step": 229677, "epoch": 2767} {"train_loss": -24.799602508544922, "global_step": 229678, "epoch": 2767} {"train_loss": -24.706844329833984, "global_step": 229679, "epoch": 2767} {"train_loss": -24.896364212036133, "global_step": 229680, "epoch": 2767} {"train_loss": -24.3538818359375, "global_step": 229681, "epoch": 2767} {"train_loss": -24.874967575073242, "global_step": 229682, "epoch": 2767} {"train_loss": -24.766685485839844, "global_step": 229683, "epoch": 2767} {"train_loss": -24.66792106628418, "global_step": 229684, "epoch": 2767} {"train_loss": -24.68170738220215, "global_step": 229685, "epoch": 2767} {"train_loss": -24.3362979888916, "global_step": 229686, "epoch": 2767} {"train_loss": -24.6801815032959, "global_step": 229687, "epoch": 2767} {"train_loss": -24.317970275878906, "global_step": 229688, "epoch": 2767} {"train_loss": -24.521358489990234, "global_step": 229689, "epoch": 2767} {"train_loss": -24.70033836364746, "global_step": 229690, "epoch": 2767} {"train_loss": -24.765108108520508, "global_step": 229691, "epoch": 2767} {"train_loss": -24.390216827392578, "global_step": 229692, "epoch": 2767} {"train_loss": -24.414587020874023, "global_step": 229693, "epoch": 2767} {"train_loss": -24.724729537963867, "global_step": 229694, "epoch": 2767} {"train_loss": -24.1517333984375, "global_step": 229695, "epoch": 2767} {"train_loss": -24.858596801757812, "global_step": 229696, "epoch": 2767} {"train_loss": -24.565814971923828, "global_step": 229697, "epoch": 2767} {"train_loss": -24.66499137878418, "global_step": 229698, "epoch": 2767} {"train_loss": -24.25878143310547, "global_step": 229699, "epoch": 2767} {"train_loss": -24.54766845703125, "global_step": 229700, "epoch": 2767} {"train_loss": -24.609392166137695, "global_step": 229701, "epoch": 2767} {"train_loss": -24.547597885131836, "global_step": 229702, "epoch": 2767} {"train_loss": -24.672107696533203, "global_step": 229703, "epoch": 2767} {"train_loss": -24.738325119018555, "global_step": 229704, "epoch": 2767} {"train_loss": -24.6441593170166, "global_step": 229705, "epoch": 2767} {"train_loss": -24.670852661132812, "global_step": 229706, "epoch": 2767} {"train_loss": -24.3907413482666, "global_step": 229707, "epoch": 2767} {"train_loss": -24.115985870361328, "global_step": 229708, "epoch": 2767} {"train_loss": -24.686443328857422, "global_step": 229709, "epoch": 2767} {"train_loss": -24.347410202026367, "global_step": 229710, "epoch": 2767} {"train_loss": -24.344236373901367, "global_step": 229711, "epoch": 2767} {"train_loss": -24.230045318603516, "global_step": 229712, "epoch": 2767} {"train_loss": -24.377840042114258, "global_step": 229713, "epoch": 2767} {"train_loss": -24.889562606811523, "global_step": 229714, "epoch": 2767} {"train_loss": -24.459857940673828, "global_step": 229715, "epoch": 2767} {"train_loss": -24.69063949584961, "global_step": 229716, "epoch": 2767} {"train_loss": -24.595333099365234, "global_step": 229717, "epoch": 2767} {"train_loss": -24.654586791992188, "global_step": 229718, "epoch": 2767} {"train_loss": -24.930265426635742, "global_step": 229719, "epoch": 2767} {"train_loss": -24.531780242919922, "global_step": 229720, "epoch": 2767} {"train_loss": -24.959524154663086, "global_step": 229721, "epoch": 2767} {"train_loss": -24.66192054748535, "global_step": 229722, "epoch": 2767} {"train_loss": -25.066059112548828, "global_step": 229723, "epoch": 2767} {"train_loss": -24.851076126098633, "global_step": 229724, "epoch": 2767} {"train_loss": -24.919126510620117, "global_step": 229725, "epoch": 2767} {"train_loss": -24.599393844604492, "global_step": 229726, "epoch": 2767} {"train_loss": -24.847379684448242, "global_step": 229727, "epoch": 2767} {"train_loss": -24.96966552734375, "global_step": 229728, "epoch": 2767} {"train_loss": -24.858667373657227, "global_step": 229729, "epoch": 2767} {"train_loss": -24.722644805908203, "global_step": 229730, "epoch": 2767} {"train_loss": -24.778308868408203, "global_step": 229731, "epoch": 2767} {"train_loss": -24.61282730102539, "global_step": 229732, "epoch": 2767} {"train_loss": -24.714208602905273, "global_step": 229733, "epoch": 2767} {"train_loss": -24.351470947265625, "global_step": 229734, "epoch": 2767} {"train_loss": -24.405723571777344, "global_step": 229735, "epoch": 2767} {"train_loss": -25.115686416625977, "global_step": 229736, "epoch": 2767} {"train_loss": -24.759931564331055, "global_step": 229737, "epoch": 2767} {"train_loss": -24.790205001831055, "global_step": 229738, "epoch": 2767} {"train_loss": -24.89942741394043, "global_step": 229739, "epoch": 2767} {"train_loss": -24.82539176940918, "global_step": 229740, "epoch": 2767} {"train_loss": -24.47852897644043, "global_step": 229741, "epoch": 2767} {"train_loss": -24.918577194213867, "global_step": 229742, "epoch": 2767} {"train_loss": -24.61310485472162, "global_step": 229743, "epoch": 2767, "val_loss": 6675945.0} {"train_loss": -24.320547103881836, "global_step": 229744, "epoch": 2768} {"train_loss": -24.319194793701172, "global_step": 229745, "epoch": 2768} {"train_loss": -24.505950927734375, "global_step": 229746, "epoch": 2768} {"train_loss": -24.071426391601562, "global_step": 229747, "epoch": 2768} {"train_loss": -24.470251083374023, "global_step": 229748, "epoch": 2768} {"train_loss": -24.150869369506836, "global_step": 229749, "epoch": 2768} {"train_loss": -24.289121627807617, "global_step": 229750, "epoch": 2768} {"train_loss": -24.37811851501465, "global_step": 229751, "epoch": 2768} {"train_loss": -24.312007904052734, "global_step": 229752, "epoch": 2768} {"train_loss": -24.409780502319336, "global_step": 229753, "epoch": 2768} {"train_loss": -24.34882164001465, "global_step": 229754, "epoch": 2768} {"train_loss": -24.35145378112793, "global_step": 229755, "epoch": 2768} {"train_loss": -24.78391456604004, "global_step": 229756, "epoch": 2768} {"train_loss": -23.899511337280273, "global_step": 229757, "epoch": 2768} {"train_loss": -24.388263702392578, "global_step": 229758, "epoch": 2768} {"train_loss": -24.813865661621094, "global_step": 229759, "epoch": 2768} {"train_loss": -24.59528923034668, "global_step": 229760, "epoch": 2768} {"train_loss": -24.73135757446289, "global_step": 229761, "epoch": 2768} {"train_loss": -24.54073143005371, "global_step": 229762, "epoch": 2768} {"train_loss": -24.693830490112305, "global_step": 229763, "epoch": 2768} {"train_loss": -24.571250915527344, "global_step": 229764, "epoch": 2768} {"train_loss": -24.702268600463867, "global_step": 229765, "epoch": 2768} {"train_loss": -24.618228912353516, "global_step": 229766, "epoch": 2768} {"train_loss": -24.65195655822754, "global_step": 229767, "epoch": 2768} {"train_loss": -24.58861541748047, "global_step": 229768, "epoch": 2768} {"train_loss": -24.748624801635742, "global_step": 229769, "epoch": 2768} {"train_loss": -25.050342559814453, "global_step": 229770, "epoch": 2768} {"train_loss": -25.01984214782715, "global_step": 229771, "epoch": 2768} {"train_loss": -24.656635284423828, "global_step": 229772, "epoch": 2768} {"train_loss": -24.712228775024414, "global_step": 229773, "epoch": 2768} {"train_loss": -24.65228843688965, "global_step": 229774, "epoch": 2768} {"train_loss": -24.423742294311523, "global_step": 229775, "epoch": 2768} {"train_loss": -25.104894638061523, "global_step": 229776, "epoch": 2768} {"train_loss": -24.35597038269043, "global_step": 229777, "epoch": 2768} {"train_loss": -24.675474166870117, "global_step": 229778, "epoch": 2768} {"train_loss": -25.178491592407227, "global_step": 229779, "epoch": 2768} {"train_loss": -25.024999618530273, "global_step": 229780, "epoch": 2768} {"train_loss": -24.58967399597168, "global_step": 229781, "epoch": 2768} {"train_loss": -24.97440528869629, "global_step": 229782, "epoch": 2768} {"train_loss": -25.1163387298584, "global_step": 229783, "epoch": 2768} {"train_loss": -25.20926284790039, "global_step": 229784, "epoch": 2768} {"train_loss": -24.833097457885742, "global_step": 229785, "epoch": 2768} {"train_loss": -24.843172073364258, "global_step": 229786, "epoch": 2768} {"train_loss": -24.901268005371094, "global_step": 229787, "epoch": 2768} {"train_loss": -25.062536239624023, "global_step": 229788, "epoch": 2768} {"train_loss": -24.36330795288086, "global_step": 229789, "epoch": 2768} {"train_loss": -24.556543350219727, "global_step": 229790, "epoch": 2768} {"train_loss": -24.223831176757812, "global_step": 229791, "epoch": 2768} {"train_loss": -23.581531524658203, "global_step": 229792, "epoch": 2768} {"train_loss": -22.84319496154785, "global_step": 229793, "epoch": 2768} {"train_loss": -23.691606521606445, "global_step": 229794, "epoch": 2768} {"train_loss": -24.57063102722168, "global_step": 229795, "epoch": 2768} {"train_loss": -24.133047103881836, "global_step": 229796, "epoch": 2768} {"train_loss": -23.95252799987793, "global_step": 229797, "epoch": 2768} {"train_loss": -24.669260025024414, "global_step": 229798, "epoch": 2768} {"train_loss": -24.070743560791016, "global_step": 229799, "epoch": 2768} {"train_loss": -24.33039665222168, "global_step": 229800, "epoch": 2768} {"train_loss": -24.078365325927734, "global_step": 229801, "epoch": 2768} {"train_loss": -24.151180267333984, "global_step": 229802, "epoch": 2768} {"train_loss": -24.130876541137695, "global_step": 229803, "epoch": 2768} {"train_loss": -24.863719940185547, "global_step": 229804, "epoch": 2768} {"train_loss": -24.546051025390625, "global_step": 229805, "epoch": 2768} {"train_loss": -24.598251342773438, "global_step": 229806, "epoch": 2768} {"train_loss": -24.788267135620117, "global_step": 229807, "epoch": 2768} {"train_loss": -24.140501022338867, "global_step": 229808, "epoch": 2768} {"train_loss": -24.482473373413086, "global_step": 229809, "epoch": 2768} {"train_loss": -24.532981872558594, "global_step": 229810, "epoch": 2768} {"train_loss": -24.95953369140625, "global_step": 229811, "epoch": 2768} {"train_loss": -24.588897705078125, "global_step": 229812, "epoch": 2768} {"train_loss": -24.538105010986328, "global_step": 229813, "epoch": 2768} {"train_loss": -24.565959930419922, "global_step": 229814, "epoch": 2768} {"train_loss": -24.483184814453125, "global_step": 229815, "epoch": 2768} {"train_loss": -24.982446670532227, "global_step": 229816, "epoch": 2768} {"train_loss": -24.533843994140625, "global_step": 229817, "epoch": 2768} {"train_loss": -24.790557861328125, "global_step": 229818, "epoch": 2768} {"train_loss": -24.67371940612793, "global_step": 229819, "epoch": 2768} {"train_loss": -24.896154403686523, "global_step": 229820, "epoch": 2768} {"train_loss": -24.4907283782959, "global_step": 229821, "epoch": 2768} {"train_loss": -24.969379425048828, "global_step": 229822, "epoch": 2768} {"train_loss": -24.621522903442383, "global_step": 229823, "epoch": 2768} {"train_loss": -24.731342315673828, "global_step": 229824, "epoch": 2768} {"train_loss": -24.471179962158203, "global_step": 229825, "epoch": 2768} {"train_loss": -24.53706513829978, "global_step": 229826, "epoch": 2768, "val_loss": 6860777.0} {"train_loss": -24.660053253173828, "global_step": 229827, "epoch": 2769} {"train_loss": -24.89224624633789, "global_step": 229828, "epoch": 2769} {"train_loss": -24.670289993286133, "global_step": 229829, "epoch": 2769} {"train_loss": -24.87428855895996, "global_step": 229830, "epoch": 2769} {"train_loss": -24.68582534790039, "global_step": 229831, "epoch": 2769} {"train_loss": -24.533681869506836, "global_step": 229832, "epoch": 2769} {"train_loss": -24.358081817626953, "global_step": 229833, "epoch": 2769} {"train_loss": -24.612274169921875, "global_step": 229834, "epoch": 2769} {"train_loss": -25.18203353881836, "global_step": 229835, "epoch": 2769} {"train_loss": -24.398300170898438, "global_step": 229836, "epoch": 2769} {"train_loss": -24.609806060791016, "global_step": 229837, "epoch": 2769} {"train_loss": -24.670398712158203, "global_step": 229838, "epoch": 2769} {"train_loss": -24.536787033081055, "global_step": 229839, "epoch": 2769} {"train_loss": -25.098037719726562, "global_step": 229840, "epoch": 2769} {"train_loss": -24.491483688354492, "global_step": 229841, "epoch": 2769} {"train_loss": -25.008533477783203, "global_step": 229842, "epoch": 2769} {"train_loss": -24.651639938354492, "global_step": 229843, "epoch": 2769} {"train_loss": -24.82987403869629, "global_step": 229844, "epoch": 2769} {"train_loss": -24.672765731811523, "global_step": 229845, "epoch": 2769} {"train_loss": -24.988656997680664, "global_step": 229846, "epoch": 2769} {"train_loss": -24.582504272460938, "global_step": 229847, "epoch": 2769} {"train_loss": -24.695295333862305, "global_step": 229848, "epoch": 2769} {"train_loss": -24.814050674438477, "global_step": 229849, "epoch": 2769} {"train_loss": -24.748241424560547, "global_step": 229850, "epoch": 2769} {"train_loss": -24.813629150390625, "global_step": 229851, "epoch": 2769} {"train_loss": -24.78728485107422, "global_step": 229852, "epoch": 2769} {"train_loss": -24.71989631652832, "global_step": 229853, "epoch": 2769} {"train_loss": -24.8250732421875, "global_step": 229854, "epoch": 2769} {"train_loss": -25.021589279174805, "global_step": 229855, "epoch": 2769} {"train_loss": -24.908584594726562, "global_step": 229856, "epoch": 2769} {"train_loss": -24.864185333251953, "global_step": 229857, "epoch": 2769} {"train_loss": -25.116596221923828, "global_step": 229858, "epoch": 2769} {"train_loss": -24.930418014526367, "global_step": 229859, "epoch": 2769} {"train_loss": -24.603384017944336, "global_step": 229860, "epoch": 2769} {"train_loss": -24.951276779174805, "global_step": 229861, "epoch": 2769} {"train_loss": -24.97385597229004, "global_step": 229862, "epoch": 2769} {"train_loss": -24.402164459228516, "global_step": 229863, "epoch": 2769} {"train_loss": -24.746143341064453, "global_step": 229864, "epoch": 2769} {"train_loss": -24.488834381103516, "global_step": 229865, "epoch": 2769} {"train_loss": -25.016393661499023, "global_step": 229866, "epoch": 2769} {"train_loss": -24.717002868652344, "global_step": 229867, "epoch": 2769} {"train_loss": -24.507064819335938, "global_step": 229868, "epoch": 2769} {"train_loss": -24.715457916259766, "global_step": 229869, "epoch": 2769} {"train_loss": -25.045412063598633, "global_step": 229870, "epoch": 2769} {"train_loss": -24.46453285217285, "global_step": 229871, "epoch": 2769} {"train_loss": -24.656843185424805, "global_step": 229872, "epoch": 2769} {"train_loss": -24.777185440063477, "global_step": 229873, "epoch": 2769} {"train_loss": -24.475330352783203, "global_step": 229874, "epoch": 2769} {"train_loss": -24.752038955688477, "global_step": 229875, "epoch": 2769} {"train_loss": -24.512483596801758, "global_step": 229876, "epoch": 2769} {"train_loss": -24.983911514282227, "global_step": 229877, "epoch": 2769} {"train_loss": -24.251026153564453, "global_step": 229878, "epoch": 2769} {"train_loss": -24.773508071899414, "global_step": 229879, "epoch": 2769} {"train_loss": -24.65797233581543, "global_step": 229880, "epoch": 2769} {"train_loss": -24.390363693237305, "global_step": 229881, "epoch": 2769} {"train_loss": -24.924959182739258, "global_step": 229882, "epoch": 2769} {"train_loss": -24.742246627807617, "global_step": 229883, "epoch": 2769} {"train_loss": -25.090225219726562, "global_step": 229884, "epoch": 2769} {"train_loss": -24.743366241455078, "global_step": 229885, "epoch": 2769} {"train_loss": -24.539594650268555, "global_step": 229886, "epoch": 2769} {"train_loss": -24.713987350463867, "global_step": 229887, "epoch": 2769} {"train_loss": -24.84956932067871, "global_step": 229888, "epoch": 2769} {"train_loss": -24.70215606689453, "global_step": 229889, "epoch": 2769} {"train_loss": -24.677356719970703, "global_step": 229890, "epoch": 2769} {"train_loss": -24.67728614807129, "global_step": 229891, "epoch": 2769} {"train_loss": -24.877304077148438, "global_step": 229892, "epoch": 2769} {"train_loss": -24.602598190307617, "global_step": 229893, "epoch": 2769} {"train_loss": -25.025205612182617, "global_step": 229894, "epoch": 2769} {"train_loss": -24.802392959594727, "global_step": 229895, "epoch": 2769} {"train_loss": -24.81226921081543, "global_step": 229896, "epoch": 2769} {"train_loss": -24.860946655273438, "global_step": 229897, "epoch": 2769} {"train_loss": -25.193403244018555, "global_step": 229898, "epoch": 2769} {"train_loss": -25.052881240844727, "global_step": 229899, "epoch": 2769} {"train_loss": -24.515522003173828, "global_step": 229900, "epoch": 2769} {"train_loss": -25.149551391601562, "global_step": 229901, "epoch": 2769} {"train_loss": -24.95814323425293, "global_step": 229902, "epoch": 2769} {"train_loss": -24.95073127746582, "global_step": 229903, "epoch": 2769} {"train_loss": -24.8115291595459, "global_step": 229904, "epoch": 2769} {"train_loss": -25.02829360961914, "global_step": 229905, "epoch": 2769} {"train_loss": -24.84380531311035, "global_step": 229906, "epoch": 2769} {"train_loss": -24.181137084960938, "global_step": 229907, "epoch": 2769} {"train_loss": -24.26192283630371, "global_step": 229908, "epoch": 2769} {"train_loss": -24.751414310501282, "global_step": 229909, "epoch": 2769, "val_loss": 6797205.0} {"train_loss": -24.38189125061035, "global_step": 229910, "epoch": 2770} {"train_loss": -23.44821548461914, "global_step": 229911, "epoch": 2770} {"train_loss": -24.615081787109375, "global_step": 229912, "epoch": 2770} {"train_loss": -24.21933364868164, "global_step": 229913, "epoch": 2770} {"train_loss": -24.3835391998291, "global_step": 229914, "epoch": 2770} {"train_loss": -24.329605102539062, "global_step": 229915, "epoch": 2770} {"train_loss": -23.897811889648438, "global_step": 229916, "epoch": 2770} {"train_loss": -24.888999938964844, "global_step": 229917, "epoch": 2770} {"train_loss": -24.035415649414062, "global_step": 229918, "epoch": 2770} {"train_loss": -24.43703269958496, "global_step": 229919, "epoch": 2770} {"train_loss": -24.408788681030273, "global_step": 229920, "epoch": 2770} {"train_loss": -24.253013610839844, "global_step": 229921, "epoch": 2770} {"train_loss": -24.47157859802246, "global_step": 229922, "epoch": 2770} {"train_loss": -24.690032958984375, "global_step": 229923, "epoch": 2770} {"train_loss": -24.709226608276367, "global_step": 229924, "epoch": 2770} {"train_loss": -24.692190170288086, "global_step": 229925, "epoch": 2770} {"train_loss": -24.845624923706055, "global_step": 229926, "epoch": 2770} {"train_loss": -24.822221755981445, "global_step": 229927, "epoch": 2770} {"train_loss": -24.605554580688477, "global_step": 229928, "epoch": 2770} {"train_loss": -24.777393341064453, "global_step": 229929, "epoch": 2770} {"train_loss": -24.812856674194336, "global_step": 229930, "epoch": 2770} {"train_loss": -24.787805557250977, "global_step": 229931, "epoch": 2770} {"train_loss": -24.430368423461914, "global_step": 229932, "epoch": 2770} {"train_loss": -24.56239891052246, "global_step": 229933, "epoch": 2770} {"train_loss": -25.071340560913086, "global_step": 229934, "epoch": 2770} {"train_loss": -25.09447479248047, "global_step": 229935, "epoch": 2770} {"train_loss": -25.054140090942383, "global_step": 229936, "epoch": 2770} {"train_loss": -24.501359939575195, "global_step": 229937, "epoch": 2770} {"train_loss": -24.977176666259766, "global_step": 229938, "epoch": 2770} {"train_loss": -24.768186569213867, "global_step": 229939, "epoch": 2770} {"train_loss": -24.5718936920166, "global_step": 229940, "epoch": 2770} {"train_loss": -24.64082908630371, "global_step": 229941, "epoch": 2770} {"train_loss": -24.994945526123047, "global_step": 229942, "epoch": 2770} {"train_loss": -24.7883243560791, "global_step": 229943, "epoch": 2770} {"train_loss": -24.937456130981445, "global_step": 229944, "epoch": 2770} {"train_loss": -24.8510684967041, "global_step": 229945, "epoch": 2770} {"train_loss": -24.90233039855957, "global_step": 229946, "epoch": 2770} {"train_loss": -24.607803344726562, "global_step": 229947, "epoch": 2770} {"train_loss": -24.690061569213867, "global_step": 229948, "epoch": 2770} {"train_loss": -24.9993953704834, "global_step": 229949, "epoch": 2770} {"train_loss": -24.957229614257812, "global_step": 229950, "epoch": 2770} {"train_loss": -24.767162322998047, "global_step": 229951, "epoch": 2770} {"train_loss": -24.86102867126465, "global_step": 229952, "epoch": 2770} {"train_loss": -24.83885383605957, "global_step": 229953, "epoch": 2770} {"train_loss": -24.38947868347168, "global_step": 229954, "epoch": 2770} {"train_loss": -24.78568458557129, "global_step": 229955, "epoch": 2770} {"train_loss": -24.718109130859375, "global_step": 229956, "epoch": 2770} {"train_loss": -24.65811538696289, "global_step": 229957, "epoch": 2770} {"train_loss": -24.71036720275879, "global_step": 229958, "epoch": 2770} {"train_loss": -24.68836212158203, "global_step": 229959, "epoch": 2770} {"train_loss": -24.708328247070312, "global_step": 229960, "epoch": 2770} {"train_loss": -24.663055419921875, "global_step": 229961, "epoch": 2770} {"train_loss": -24.533235549926758, "global_step": 229962, "epoch": 2770} {"train_loss": -24.771909713745117, "global_step": 229963, "epoch": 2770} {"train_loss": -24.979230880737305, "global_step": 229964, "epoch": 2770} {"train_loss": -25.24225425720215, "global_step": 229965, "epoch": 2770} {"train_loss": -24.650625228881836, "global_step": 229966, "epoch": 2770} {"train_loss": -24.23627281188965, "global_step": 229967, "epoch": 2770} {"train_loss": -24.524845123291016, "global_step": 229968, "epoch": 2770} {"train_loss": -24.87522315979004, "global_step": 229969, "epoch": 2770} {"train_loss": -24.469120025634766, "global_step": 229970, "epoch": 2770} {"train_loss": -24.500457763671875, "global_step": 229971, "epoch": 2770} {"train_loss": -25.060352325439453, "global_step": 229972, "epoch": 2770} {"train_loss": -24.74983024597168, "global_step": 229973, "epoch": 2770} {"train_loss": -24.553220748901367, "global_step": 229974, "epoch": 2770} {"train_loss": -24.574731826782227, "global_step": 229975, "epoch": 2770} {"train_loss": -24.58149528503418, "global_step": 229976, "epoch": 2770} {"train_loss": -24.63965606689453, "global_step": 229977, "epoch": 2770} {"train_loss": -24.771282196044922, "global_step": 229978, "epoch": 2770} {"train_loss": -24.501436233520508, "global_step": 229979, "epoch": 2770} {"train_loss": -24.69557762145996, "global_step": 229980, "epoch": 2770} {"train_loss": -24.919034957885742, "global_step": 229981, "epoch": 2770} {"train_loss": -24.51678466796875, "global_step": 229982, "epoch": 2770} {"train_loss": -24.557666778564453, "global_step": 229983, "epoch": 2770} {"train_loss": -24.634340286254883, "global_step": 229984, "epoch": 2770} {"train_loss": -24.933034896850586, "global_step": 229985, "epoch": 2770} {"train_loss": -24.582416534423828, "global_step": 229986, "epoch": 2770} {"train_loss": -24.73475456237793, "global_step": 229987, "epoch": 2770} {"train_loss": -24.916940689086914, "global_step": 229988, "epoch": 2770} {"train_loss": -24.97623634338379, "global_step": 229989, "epoch": 2770} {"train_loss": -24.592687606811523, "global_step": 229990, "epoch": 2770} {"train_loss": -24.75364112854004, "global_step": 229991, "epoch": 2770} {"train_loss": -24.686049587755317, "global_step": 229992, "epoch": 2770, "val_loss": 6651131.0} {"train_loss": -22.256134033203125, "global_step": 229993, "epoch": 2771} {"train_loss": -22.618066787719727, "global_step": 229994, "epoch": 2771} {"train_loss": -22.15590476989746, "global_step": 229995, "epoch": 2771} {"train_loss": -23.68842124938965, "global_step": 229996, "epoch": 2771} {"train_loss": -23.2431640625, "global_step": 229997, "epoch": 2771} {"train_loss": -23.180875778198242, "global_step": 229998, "epoch": 2771} {"train_loss": -23.743900299072266, "global_step": 229999, "epoch": 2771} {"train_loss": -23.3697452545166, "global_step": 230000, "epoch": 2771} {"train_loss": -23.781814575195312, "global_step": 230001, "epoch": 2771} {"train_loss": -23.376405715942383, "global_step": 230002, "epoch": 2771} {"train_loss": -23.436262130737305, "global_step": 230003, "epoch": 2771} {"train_loss": -24.073843002319336, "global_step": 230004, "epoch": 2771} {"train_loss": -23.943607330322266, "global_step": 230005, "epoch": 2771} {"train_loss": -24.22176170349121, "global_step": 230006, "epoch": 2771} {"train_loss": -24.09612464904785, "global_step": 230007, "epoch": 2771} {"train_loss": -24.107568740844727, "global_step": 230008, "epoch": 2771} {"train_loss": -24.214738845825195, "global_step": 230009, "epoch": 2771} {"train_loss": -24.04839515686035, "global_step": 230010, "epoch": 2771} {"train_loss": -24.188232421875, "global_step": 230011, "epoch": 2771} {"train_loss": -24.11602210998535, "global_step": 230012, "epoch": 2771} {"train_loss": -24.2490291595459, "global_step": 230013, "epoch": 2771} {"train_loss": -24.24818992614746, "global_step": 230014, "epoch": 2771} {"train_loss": -24.203954696655273, "global_step": 230015, "epoch": 2771} {"train_loss": -24.35346031188965, "global_step": 230016, "epoch": 2771} {"train_loss": -24.45223045349121, "global_step": 230017, "epoch": 2771} {"train_loss": -24.397075653076172, "global_step": 230018, "epoch": 2771} {"train_loss": -24.508909225463867, "global_step": 230019, "epoch": 2771} {"train_loss": -24.392553329467773, "global_step": 230020, "epoch": 2771} {"train_loss": -24.5396785736084, "global_step": 230021, "epoch": 2771} {"train_loss": -24.62553596496582, "global_step": 230022, "epoch": 2771} {"train_loss": -24.913137435913086, "global_step": 230023, "epoch": 2771} {"train_loss": -24.33634376525879, "global_step": 230024, "epoch": 2771} {"train_loss": -24.68598175048828, "global_step": 230025, "epoch": 2771} {"train_loss": -24.780399322509766, "global_step": 230026, "epoch": 2771} {"train_loss": -24.33234214782715, "global_step": 230027, "epoch": 2771} {"train_loss": -24.2091064453125, "global_step": 230028, "epoch": 2771} {"train_loss": -24.882429122924805, "global_step": 230029, "epoch": 2771} {"train_loss": -24.844329833984375, "global_step": 230030, "epoch": 2771} {"train_loss": -24.757137298583984, "global_step": 230031, "epoch": 2771} {"train_loss": -24.917203903198242, "global_step": 230032, "epoch": 2771} {"train_loss": -24.82244873046875, "global_step": 230033, "epoch": 2771} {"train_loss": -24.798261642456055, "global_step": 230034, "epoch": 2771} {"train_loss": -25.04715919494629, "global_step": 230035, "epoch": 2771} {"train_loss": -24.847515106201172, "global_step": 230036, "epoch": 2771} {"train_loss": -24.61812400817871, "global_step": 230037, "epoch": 2771} {"train_loss": -24.883451461791992, "global_step": 230038, "epoch": 2771} {"train_loss": -24.641908645629883, "global_step": 230039, "epoch": 2771} {"train_loss": -24.82267951965332, "global_step": 230040, "epoch": 2771} {"train_loss": -24.84412956237793, "global_step": 230041, "epoch": 2771} {"train_loss": -24.848482131958008, "global_step": 230042, "epoch": 2771} {"train_loss": -24.345460891723633, "global_step": 230043, "epoch": 2771} {"train_loss": -24.831987380981445, "global_step": 230044, "epoch": 2771} {"train_loss": -25.072660446166992, "global_step": 230045, "epoch": 2771} {"train_loss": -24.665857315063477, "global_step": 230046, "epoch": 2771} {"train_loss": -24.7216739654541, "global_step": 230047, "epoch": 2771} {"train_loss": -24.6219482421875, "global_step": 230048, "epoch": 2771} {"train_loss": -24.683530807495117, "global_step": 230049, "epoch": 2771} {"train_loss": -24.052892684936523, "global_step": 230050, "epoch": 2771} {"train_loss": -24.780536651611328, "global_step": 230051, "epoch": 2771} {"train_loss": -24.940082550048828, "global_step": 230052, "epoch": 2771} {"train_loss": -24.512170791625977, "global_step": 230053, "epoch": 2771} {"train_loss": -24.753904342651367, "global_step": 230054, "epoch": 2771} {"train_loss": -24.841278076171875, "global_step": 230055, "epoch": 2771} {"train_loss": -24.52860450744629, "global_step": 230056, "epoch": 2771} {"train_loss": -24.793704986572266, "global_step": 230057, "epoch": 2771} {"train_loss": -24.325387954711914, "global_step": 230058, "epoch": 2771} {"train_loss": -24.639205932617188, "global_step": 230059, "epoch": 2771} {"train_loss": -24.40334129333496, "global_step": 230060, "epoch": 2771} {"train_loss": -25.001861572265625, "global_step": 230061, "epoch": 2771} {"train_loss": -24.43512535095215, "global_step": 230062, "epoch": 2771} {"train_loss": -24.856481552124023, "global_step": 230063, "epoch": 2771} {"train_loss": -24.798025131225586, "global_step": 230064, "epoch": 2771} {"train_loss": -24.8582706451416, "global_step": 230065, "epoch": 2771} {"train_loss": -24.744586944580078, "global_step": 230066, "epoch": 2771} {"train_loss": -24.40706443786621, "global_step": 230067, "epoch": 2771} {"train_loss": -24.825998306274414, "global_step": 230068, "epoch": 2771} {"train_loss": -24.92058753967285, "global_step": 230069, "epoch": 2771} {"train_loss": -24.98493766784668, "global_step": 230070, "epoch": 2771} {"train_loss": -24.438203811645508, "global_step": 230071, "epoch": 2771} {"train_loss": -24.80380630493164, "global_step": 230072, "epoch": 2771} {"train_loss": -24.89961814880371, "global_step": 230073, "epoch": 2771} {"train_loss": -24.88020133972168, "global_step": 230074, "epoch": 2771} {"train_loss": -24.415563813175062, "global_step": 230075, "epoch": 2771, "val_loss": 6778118.0} {"train_loss": -24.4137020111084, "global_step": 230076, "epoch": 2772} {"train_loss": -24.454505920410156, "global_step": 230077, "epoch": 2772} {"train_loss": -24.80289077758789, "global_step": 230078, "epoch": 2772} {"train_loss": -24.891305923461914, "global_step": 230079, "epoch": 2772} {"train_loss": -24.388408660888672, "global_step": 230080, "epoch": 2772} {"train_loss": -24.173913955688477, "global_step": 230081, "epoch": 2772} {"train_loss": -24.316513061523438, "global_step": 230082, "epoch": 2772} {"train_loss": -24.448354721069336, "global_step": 230083, "epoch": 2772} {"train_loss": -24.85365104675293, "global_step": 230084, "epoch": 2772} {"train_loss": -24.37032127380371, "global_step": 230085, "epoch": 2772} {"train_loss": -24.774152755737305, "global_step": 230086, "epoch": 2772} {"train_loss": -24.47503662109375, "global_step": 230087, "epoch": 2772} {"train_loss": -24.65376853942871, "global_step": 230088, "epoch": 2772} {"train_loss": -24.872602462768555, "global_step": 230089, "epoch": 2772} {"train_loss": -24.432111740112305, "global_step": 230090, "epoch": 2772} {"train_loss": -24.561735153198242, "global_step": 230091, "epoch": 2772} {"train_loss": -24.832700729370117, "global_step": 230092, "epoch": 2772} {"train_loss": -25.188926696777344, "global_step": 230093, "epoch": 2772} {"train_loss": -24.735454559326172, "global_step": 230094, "epoch": 2772} {"train_loss": -24.580337524414062, "global_step": 230095, "epoch": 2772} {"train_loss": -24.53826332092285, "global_step": 230096, "epoch": 2772} {"train_loss": -24.635669708251953, "global_step": 230097, "epoch": 2772} {"train_loss": -24.65312385559082, "global_step": 230098, "epoch": 2772} {"train_loss": -24.81446075439453, "global_step": 230099, "epoch": 2772} {"train_loss": -24.589324951171875, "global_step": 230100, "epoch": 2772} {"train_loss": -25.00286293029785, "global_step": 230101, "epoch": 2772} {"train_loss": -24.828065872192383, "global_step": 230102, "epoch": 2772} {"train_loss": -24.668561935424805, "global_step": 230103, "epoch": 2772} {"train_loss": -25.059635162353516, "global_step": 230104, "epoch": 2772} {"train_loss": -25.179452896118164, "global_step": 230105, "epoch": 2772} {"train_loss": -24.56818389892578, "global_step": 230106, "epoch": 2772} {"train_loss": -24.329565048217773, "global_step": 230107, "epoch": 2772} {"train_loss": -25.24108123779297, "global_step": 230108, "epoch": 2772} {"train_loss": -24.767515182495117, "global_step": 230109, "epoch": 2772} {"train_loss": -24.82093620300293, "global_step": 230110, "epoch": 2772} {"train_loss": -24.951995849609375, "global_step": 230111, "epoch": 2772} {"train_loss": -24.843189239501953, "global_step": 230112, "epoch": 2772} {"train_loss": -24.832229614257812, "global_step": 230113, "epoch": 2772} {"train_loss": -24.808452606201172, "global_step": 230114, "epoch": 2772} {"train_loss": -24.777202606201172, "global_step": 230115, "epoch": 2772} {"train_loss": -24.80748748779297, "global_step": 230116, "epoch": 2772} {"train_loss": -24.61798095703125, "global_step": 230117, "epoch": 2772} {"train_loss": -24.880258560180664, "global_step": 230118, "epoch": 2772} {"train_loss": -24.80124282836914, "global_step": 230119, "epoch": 2772} {"train_loss": -24.61598777770996, "global_step": 230120, "epoch": 2772} {"train_loss": -24.970670700073242, "global_step": 230121, "epoch": 2772} {"train_loss": -24.83650016784668, "global_step": 230122, "epoch": 2772} {"train_loss": -24.57312774658203, "global_step": 230123, "epoch": 2772} {"train_loss": -24.605545043945312, "global_step": 230124, "epoch": 2772} {"train_loss": -24.468599319458008, "global_step": 230125, "epoch": 2772} {"train_loss": -24.843244552612305, "global_step": 230126, "epoch": 2772} {"train_loss": -24.513044357299805, "global_step": 230127, "epoch": 2772} {"train_loss": -24.60839080810547, "global_step": 230128, "epoch": 2772} {"train_loss": -24.772708892822266, "global_step": 230129, "epoch": 2772} {"train_loss": -24.37775230407715, "global_step": 230130, "epoch": 2772} {"train_loss": -25.170583724975586, "global_step": 230131, "epoch": 2772} {"train_loss": -24.595266342163086, "global_step": 230132, "epoch": 2772} {"train_loss": -24.903806686401367, "global_step": 230133, "epoch": 2772} {"train_loss": -24.617429733276367, "global_step": 230134, "epoch": 2772} {"train_loss": -24.64536476135254, "global_step": 230135, "epoch": 2772} {"train_loss": -24.6208553314209, "global_step": 230136, "epoch": 2772} {"train_loss": -25.024673461914062, "global_step": 230137, "epoch": 2772} {"train_loss": -24.966672897338867, "global_step": 230138, "epoch": 2772} {"train_loss": -24.963991165161133, "global_step": 230139, "epoch": 2772} {"train_loss": -24.716283798217773, "global_step": 230140, "epoch": 2772} {"train_loss": -24.758098602294922, "global_step": 230141, "epoch": 2772} {"train_loss": -24.611835479736328, "global_step": 230142, "epoch": 2772} {"train_loss": -24.996219635009766, "global_step": 230143, "epoch": 2772} {"train_loss": -24.99395751953125, "global_step": 230144, "epoch": 2772} {"train_loss": -24.964975357055664, "global_step": 230145, "epoch": 2772} {"train_loss": -24.66834831237793, "global_step": 230146, "epoch": 2772} {"train_loss": -24.8963565826416, "global_step": 230147, "epoch": 2772} {"train_loss": -24.8236141204834, "global_step": 230148, "epoch": 2772} {"train_loss": -24.865032196044922, "global_step": 230149, "epoch": 2772} {"train_loss": -24.642175674438477, "global_step": 230150, "epoch": 2772} {"train_loss": -24.931798934936523, "global_step": 230151, "epoch": 2772} {"train_loss": -24.818349838256836, "global_step": 230152, "epoch": 2772} {"train_loss": -24.7762451171875, "global_step": 230153, "epoch": 2772} {"train_loss": -24.90860366821289, "global_step": 230154, "epoch": 2772} {"train_loss": -24.904081344604492, "global_step": 230155, "epoch": 2772} {"train_loss": -25.08009147644043, "global_step": 230156, "epoch": 2772} {"train_loss": -24.85896110534668, "global_step": 230157, "epoch": 2772} {"train_loss": -24.719759263188006, "global_step": 230158, "epoch": 2772, "val_loss": 6684487.0} {"train_loss": -24.43695068359375, "global_step": 230159, "epoch": 2773} {"train_loss": -23.3824405670166, "global_step": 230160, "epoch": 2773} {"train_loss": -23.87598991394043, "global_step": 230161, "epoch": 2773} {"train_loss": -24.24698829650879, "global_step": 230162, "epoch": 2773} {"train_loss": -24.0878849029541, "global_step": 230163, "epoch": 2773} {"train_loss": -24.45222282409668, "global_step": 230164, "epoch": 2773} {"train_loss": -24.292678833007812, "global_step": 230165, "epoch": 2773} {"train_loss": -24.57327651977539, "global_step": 230166, "epoch": 2773} {"train_loss": -24.572874069213867, "global_step": 230167, "epoch": 2773} {"train_loss": -24.73386001586914, "global_step": 230168, "epoch": 2773} {"train_loss": -24.468297958374023, "global_step": 230169, "epoch": 2773} {"train_loss": -24.31720542907715, "global_step": 230170, "epoch": 2773} {"train_loss": -24.38589859008789, "global_step": 230171, "epoch": 2773} {"train_loss": -24.613174438476562, "global_step": 230172, "epoch": 2773} {"train_loss": -24.27886962890625, "global_step": 230173, "epoch": 2773} {"train_loss": -24.292724609375, "global_step": 230174, "epoch": 2773} {"train_loss": -24.09196662902832, "global_step": 230175, "epoch": 2773} {"train_loss": -24.66015625, "global_step": 230176, "epoch": 2773} {"train_loss": -24.66327476501465, "global_step": 230177, "epoch": 2773} {"train_loss": -24.758197784423828, "global_step": 230178, "epoch": 2773} {"train_loss": -24.766780853271484, "global_step": 230179, "epoch": 2773} {"train_loss": -24.6181697845459, "global_step": 230180, "epoch": 2773} {"train_loss": -24.558767318725586, "global_step": 230181, "epoch": 2773} {"train_loss": -24.40302848815918, "global_step": 230182, "epoch": 2773} {"train_loss": -24.995346069335938, "global_step": 230183, "epoch": 2773} {"train_loss": -24.67573356628418, "global_step": 230184, "epoch": 2773} {"train_loss": -24.717716217041016, "global_step": 230185, "epoch": 2773} {"train_loss": -24.803709030151367, "global_step": 230186, "epoch": 2773} {"train_loss": -24.511188507080078, "global_step": 230187, "epoch": 2773} {"train_loss": -25.15577507019043, "global_step": 230188, "epoch": 2773} {"train_loss": -24.667709350585938, "global_step": 230189, "epoch": 2773} {"train_loss": -24.875518798828125, "global_step": 230190, "epoch": 2773} {"train_loss": -24.242115020751953, "global_step": 230191, "epoch": 2773} {"train_loss": -24.592235565185547, "global_step": 230192, "epoch": 2773} {"train_loss": -24.946853637695312, "global_step": 230193, "epoch": 2773} {"train_loss": -24.90382194519043, "global_step": 230194, "epoch": 2773} {"train_loss": -24.74416732788086, "global_step": 230195, "epoch": 2773} {"train_loss": -25.0274658203125, "global_step": 230196, "epoch": 2773} {"train_loss": -24.753131866455078, "global_step": 230197, "epoch": 2773} {"train_loss": -25.155851364135742, "global_step": 230198, "epoch": 2773} {"train_loss": -24.46268081665039, "global_step": 230199, "epoch": 2773} {"train_loss": -24.986719131469727, "global_step": 230200, "epoch": 2773} {"train_loss": -25.33147430419922, "global_step": 230201, "epoch": 2773} {"train_loss": -24.632678985595703, "global_step": 230202, "epoch": 2773} {"train_loss": -24.443470001220703, "global_step": 230203, "epoch": 2773} {"train_loss": -25.06561851501465, "global_step": 230204, "epoch": 2773} {"train_loss": -24.71609115600586, "global_step": 230205, "epoch": 2773} {"train_loss": -24.445587158203125, "global_step": 230206, "epoch": 2773} {"train_loss": -24.72652244567871, "global_step": 230207, "epoch": 2773} {"train_loss": -24.897192001342773, "global_step": 230208, "epoch": 2773} {"train_loss": -24.405029296875, "global_step": 230209, "epoch": 2773} {"train_loss": -24.365568161010742, "global_step": 230210, "epoch": 2773} {"train_loss": -24.164968490600586, "global_step": 230211, "epoch": 2773} {"train_loss": -24.390172958374023, "global_step": 230212, "epoch": 2773} {"train_loss": -25.26667022705078, "global_step": 230213, "epoch": 2773} {"train_loss": -25.05469512939453, "global_step": 230214, "epoch": 2773} {"train_loss": -24.383222579956055, "global_step": 230215, "epoch": 2773} {"train_loss": -24.371871948242188, "global_step": 230216, "epoch": 2773} {"train_loss": -24.567224502563477, "global_step": 230217, "epoch": 2773} {"train_loss": -24.734167098999023, "global_step": 230218, "epoch": 2773} {"train_loss": -24.578428268432617, "global_step": 230219, "epoch": 2773} {"train_loss": -24.58940887451172, "global_step": 230220, "epoch": 2773} {"train_loss": -24.919382095336914, "global_step": 230221, "epoch": 2773} {"train_loss": -24.79385757446289, "global_step": 230222, "epoch": 2773} {"train_loss": -24.578125, "global_step": 230223, "epoch": 2773} {"train_loss": -24.499839782714844, "global_step": 230224, "epoch": 2773} {"train_loss": -24.420413970947266, "global_step": 230225, "epoch": 2773} {"train_loss": -24.691280364990234, "global_step": 230226, "epoch": 2773} {"train_loss": -25.082530975341797, "global_step": 230227, "epoch": 2773} {"train_loss": -24.86591148376465, "global_step": 230228, "epoch": 2773} {"train_loss": -24.954761505126953, "global_step": 230229, "epoch": 2773} {"train_loss": -24.70999526977539, "global_step": 230230, "epoch": 2773} {"train_loss": -25.18182373046875, "global_step": 230231, "epoch": 2773} {"train_loss": -24.756311416625977, "global_step": 230232, "epoch": 2773} {"train_loss": -24.689237594604492, "global_step": 230233, "epoch": 2773} {"train_loss": -24.87164878845215, "global_step": 230234, "epoch": 2773} {"train_loss": -24.735258102416992, "global_step": 230235, "epoch": 2773} {"train_loss": -24.77472496032715, "global_step": 230236, "epoch": 2773} {"train_loss": -24.56524658203125, "global_step": 230237, "epoch": 2773} {"train_loss": -24.79201316833496, "global_step": 230238, "epoch": 2773} {"train_loss": -24.819232940673828, "global_step": 230239, "epoch": 2773} {"train_loss": -24.994775772094727, "global_step": 230240, "epoch": 2773} {"train_loss": -24.647724381412367, "global_step": 230241, "epoch": 2773, "val_loss": 6684250.0} {"train_loss": -23.85251808166504, "global_step": 230242, "epoch": 2774} {"train_loss": -24.220190048217773, "global_step": 230243, "epoch": 2774} {"train_loss": -24.739439010620117, "global_step": 230244, "epoch": 2774} {"train_loss": -24.10603904724121, "global_step": 230245, "epoch": 2774} {"train_loss": -24.37051773071289, "global_step": 230246, "epoch": 2774} {"train_loss": -24.561140060424805, "global_step": 230247, "epoch": 2774} {"train_loss": -24.48734474182129, "global_step": 230248, "epoch": 2774} {"train_loss": -24.127578735351562, "global_step": 230249, "epoch": 2774} {"train_loss": -24.444442749023438, "global_step": 230250, "epoch": 2774} {"train_loss": -24.647628784179688, "global_step": 230251, "epoch": 2774} {"train_loss": -24.45001792907715, "global_step": 230252, "epoch": 2774} {"train_loss": -24.608539581298828, "global_step": 230253, "epoch": 2774} {"train_loss": -24.327491760253906, "global_step": 230254, "epoch": 2774} {"train_loss": -24.43202018737793, "global_step": 230255, "epoch": 2774} {"train_loss": -24.45262336730957, "global_step": 230256, "epoch": 2774} {"train_loss": -24.652088165283203, "global_step": 230257, "epoch": 2774} {"train_loss": -24.630258560180664, "global_step": 230258, "epoch": 2774} {"train_loss": -24.882970809936523, "global_step": 230259, "epoch": 2774} {"train_loss": -24.221921920776367, "global_step": 230260, "epoch": 2774} {"train_loss": -24.28116226196289, "global_step": 230261, "epoch": 2774} {"train_loss": -24.75327491760254, "global_step": 230262, "epoch": 2774} {"train_loss": -24.961843490600586, "global_step": 230263, "epoch": 2774} {"train_loss": -24.27132225036621, "global_step": 230264, "epoch": 2774} {"train_loss": -25.183576583862305, "global_step": 230265, "epoch": 2774} {"train_loss": -24.702239990234375, "global_step": 230266, "epoch": 2774} {"train_loss": -24.48175048828125, "global_step": 230267, "epoch": 2774} {"train_loss": -24.705657958984375, "global_step": 230268, "epoch": 2774} {"train_loss": -24.229995727539062, "global_step": 230269, "epoch": 2774} {"train_loss": -24.46854591369629, "global_step": 230270, "epoch": 2774} {"train_loss": -24.823867797851562, "global_step": 230271, "epoch": 2774} {"train_loss": -24.72952651977539, "global_step": 230272, "epoch": 2774} {"train_loss": -24.618099212646484, "global_step": 230273, "epoch": 2774} {"train_loss": -25.029376983642578, "global_step": 230274, "epoch": 2774} {"train_loss": -24.924097061157227, "global_step": 230275, "epoch": 2774} {"train_loss": -24.8447265625, "global_step": 230276, "epoch": 2774} {"train_loss": -25.171903610229492, "global_step": 230277, "epoch": 2774} {"train_loss": -24.468891143798828, "global_step": 230278, "epoch": 2774} {"train_loss": -24.855024337768555, "global_step": 230279, "epoch": 2774} {"train_loss": -24.462148666381836, "global_step": 230280, "epoch": 2774} {"train_loss": -24.79254913330078, "global_step": 230281, "epoch": 2774} {"train_loss": -24.6202449798584, "global_step": 230282, "epoch": 2774} {"train_loss": -24.306554794311523, "global_step": 230283, "epoch": 2774} {"train_loss": -24.84868621826172, "global_step": 230284, "epoch": 2774} {"train_loss": -24.801250457763672, "global_step": 230285, "epoch": 2774} {"train_loss": -25.065662384033203, "global_step": 230286, "epoch": 2774} {"train_loss": -24.859899520874023, "global_step": 230287, "epoch": 2774} {"train_loss": -25.07518768310547, "global_step": 230288, "epoch": 2774} {"train_loss": -24.84742546081543, "global_step": 230289, "epoch": 2774} {"train_loss": -24.75101089477539, "global_step": 230290, "epoch": 2774} {"train_loss": -24.789560317993164, "global_step": 230291, "epoch": 2774} {"train_loss": -24.836076736450195, "global_step": 230292, "epoch": 2774} {"train_loss": -24.981552124023438, "global_step": 230293, "epoch": 2774} {"train_loss": -24.872360229492188, "global_step": 230294, "epoch": 2774} {"train_loss": -24.719026565551758, "global_step": 230295, "epoch": 2774} {"train_loss": -24.461429595947266, "global_step": 230296, "epoch": 2774} {"train_loss": -25.562658309936523, "global_step": 230297, "epoch": 2774} {"train_loss": -24.871540069580078, "global_step": 230298, "epoch": 2774} {"train_loss": -24.74136734008789, "global_step": 230299, "epoch": 2774} {"train_loss": -24.83646583557129, "global_step": 230300, "epoch": 2774} {"train_loss": -24.73499298095703, "global_step": 230301, "epoch": 2774} {"train_loss": -24.646469116210938, "global_step": 230302, "epoch": 2774} {"train_loss": -24.604501724243164, "global_step": 230303, "epoch": 2774} {"train_loss": -24.59035301208496, "global_step": 230304, "epoch": 2774} {"train_loss": -24.75240707397461, "global_step": 230305, "epoch": 2774} {"train_loss": -24.979154586791992, "global_step": 230306, "epoch": 2774} {"train_loss": -24.547012329101562, "global_step": 230307, "epoch": 2774} {"train_loss": -24.905136108398438, "global_step": 230308, "epoch": 2774} {"train_loss": -24.614797592163086, "global_step": 230309, "epoch": 2774} {"train_loss": -24.453569412231445, "global_step": 230310, "epoch": 2774} {"train_loss": -24.5362606048584, "global_step": 230311, "epoch": 2774} {"train_loss": -24.6660213470459, "global_step": 230312, "epoch": 2774} {"train_loss": -24.91566276550293, "global_step": 230313, "epoch": 2774} {"train_loss": -24.960317611694336, "global_step": 230314, "epoch": 2774} {"train_loss": -24.823354721069336, "global_step": 230315, "epoch": 2774} {"train_loss": -24.533843994140625, "global_step": 230316, "epoch": 2774} {"train_loss": -24.450952529907227, "global_step": 230317, "epoch": 2774} {"train_loss": -24.726972579956055, "global_step": 230318, "epoch": 2774} {"train_loss": -24.63809585571289, "global_step": 230319, "epoch": 2774} {"train_loss": -24.878841400146484, "global_step": 230320, "epoch": 2774} {"train_loss": -24.65272331237793, "global_step": 230321, "epoch": 2774} {"train_loss": -24.934980392456055, "global_step": 230322, "epoch": 2774} {"train_loss": -24.857349395751953, "global_step": 230323, "epoch": 2774} {"train_loss": -24.685568843979432, "global_step": 230324, "epoch": 2774, "val_loss": 6830825.0} {"train_loss": -24.392873764038086, "global_step": 230325, "epoch": 2775} {"train_loss": -24.63031005859375, "global_step": 230326, "epoch": 2775} {"train_loss": -24.304136276245117, "global_step": 230327, "epoch": 2775} {"train_loss": -24.6195125579834, "global_step": 230328, "epoch": 2775} {"train_loss": -24.380903244018555, "global_step": 230329, "epoch": 2775} {"train_loss": -24.563732147216797, "global_step": 230330, "epoch": 2775} {"train_loss": -24.800582885742188, "global_step": 230331, "epoch": 2775} {"train_loss": -24.54920768737793, "global_step": 230332, "epoch": 2775} {"train_loss": -24.225482940673828, "global_step": 230333, "epoch": 2775} {"train_loss": -24.75909996032715, "global_step": 230334, "epoch": 2775} {"train_loss": -24.916736602783203, "global_step": 230335, "epoch": 2775} {"train_loss": -24.598953247070312, "global_step": 230336, "epoch": 2775} {"train_loss": -24.85938835144043, "global_step": 230337, "epoch": 2775} {"train_loss": -24.420373916625977, "global_step": 230338, "epoch": 2775} {"train_loss": -24.736642837524414, "global_step": 230339, "epoch": 2775} {"train_loss": -24.741758346557617, "global_step": 230340, "epoch": 2775} {"train_loss": -24.673181533813477, "global_step": 230341, "epoch": 2775} {"train_loss": -24.743005752563477, "global_step": 230342, "epoch": 2775} {"train_loss": -24.592151641845703, "global_step": 230343, "epoch": 2775} {"train_loss": -24.806081771850586, "global_step": 230344, "epoch": 2775} {"train_loss": -24.921886444091797, "global_step": 230345, "epoch": 2775} {"train_loss": -24.777801513671875, "global_step": 230346, "epoch": 2775} {"train_loss": -24.762678146362305, "global_step": 230347, "epoch": 2775} {"train_loss": -24.565542221069336, "global_step": 230348, "epoch": 2775} {"train_loss": -24.630319595336914, "global_step": 230349, "epoch": 2775} {"train_loss": -24.96207618713379, "global_step": 230350, "epoch": 2775} {"train_loss": -24.778648376464844, "global_step": 230351, "epoch": 2775} {"train_loss": -24.78961753845215, "global_step": 230352, "epoch": 2775} {"train_loss": -25.147520065307617, "global_step": 230353, "epoch": 2775} {"train_loss": -24.503782272338867, "global_step": 230354, "epoch": 2775} {"train_loss": -24.825063705444336, "global_step": 230355, "epoch": 2775} {"train_loss": -24.85698890686035, "global_step": 230356, "epoch": 2775} {"train_loss": -24.55860710144043, "global_step": 230357, "epoch": 2775} {"train_loss": -24.866819381713867, "global_step": 230358, "epoch": 2775} {"train_loss": -24.653467178344727, "global_step": 230359, "epoch": 2775} {"train_loss": -24.655086517333984, "global_step": 230360, "epoch": 2775} {"train_loss": -24.866498947143555, "global_step": 230361, "epoch": 2775} {"train_loss": -24.582340240478516, "global_step": 230362, "epoch": 2775} {"train_loss": -24.845335006713867, "global_step": 230363, "epoch": 2775} {"train_loss": -24.66104507446289, "global_step": 230364, "epoch": 2775} {"train_loss": -25.066965103149414, "global_step": 230365, "epoch": 2775} {"train_loss": -24.721616744995117, "global_step": 230366, "epoch": 2775} {"train_loss": -24.793392181396484, "global_step": 230367, "epoch": 2775} {"train_loss": -24.74163818359375, "global_step": 230368, "epoch": 2775} {"train_loss": -24.804880142211914, "global_step": 230369, "epoch": 2775} {"train_loss": -24.753864288330078, "global_step": 230370, "epoch": 2775} {"train_loss": -24.89531898498535, "global_step": 230371, "epoch": 2775} {"train_loss": -24.641820907592773, "global_step": 230372, "epoch": 2775} {"train_loss": -24.99818229675293, "global_step": 230373, "epoch": 2775} {"train_loss": -24.74408531188965, "global_step": 230374, "epoch": 2775} {"train_loss": -25.26605796813965, "global_step": 230375, "epoch": 2775} {"train_loss": -24.598421096801758, "global_step": 230376, "epoch": 2775} {"train_loss": -24.642501831054688, "global_step": 230377, "epoch": 2775} {"train_loss": -24.828062057495117, "global_step": 230378, "epoch": 2775} {"train_loss": -24.6344051361084, "global_step": 230379, "epoch": 2775} {"train_loss": -24.72841453552246, "global_step": 230380, "epoch": 2775} {"train_loss": -24.937728881835938, "global_step": 230381, "epoch": 2775} {"train_loss": -24.626880645751953, "global_step": 230382, "epoch": 2775} {"train_loss": -24.645891189575195, "global_step": 230383, "epoch": 2775} {"train_loss": -25.006052017211914, "global_step": 230384, "epoch": 2775} {"train_loss": -24.878889083862305, "global_step": 230385, "epoch": 2775} {"train_loss": -24.702533721923828, "global_step": 230386, "epoch": 2775} {"train_loss": -24.774099349975586, "global_step": 230387, "epoch": 2775} {"train_loss": -24.70569610595703, "global_step": 230388, "epoch": 2775} {"train_loss": -24.726606369018555, "global_step": 230389, "epoch": 2775} {"train_loss": -25.078702926635742, "global_step": 230390, "epoch": 2775} {"train_loss": -24.918298721313477, "global_step": 230391, "epoch": 2775} {"train_loss": -24.6761474609375, "global_step": 230392, "epoch": 2775} {"train_loss": -24.77638816833496, "global_step": 230393, "epoch": 2775} {"train_loss": -24.763172149658203, "global_step": 230394, "epoch": 2775} {"train_loss": -24.575275421142578, "global_step": 230395, "epoch": 2775} {"train_loss": -24.598657608032227, "global_step": 230396, "epoch": 2775} {"train_loss": -24.478452682495117, "global_step": 230397, "epoch": 2775} {"train_loss": -24.618696212768555, "global_step": 230398, "epoch": 2775} {"train_loss": -25.093652725219727, "global_step": 230399, "epoch": 2775} {"train_loss": -24.93934440612793, "global_step": 230400, "epoch": 2775} {"train_loss": -24.78804588317871, "global_step": 230401, "epoch": 2775} {"train_loss": -24.774871826171875, "global_step": 230402, "epoch": 2775} {"train_loss": -24.86956214904785, "global_step": 230403, "epoch": 2775} {"train_loss": -24.754535675048828, "global_step": 230404, "epoch": 2775} {"train_loss": -24.967239379882812, "global_step": 230405, "epoch": 2775} {"train_loss": -24.723590850830078, "global_step": 230406, "epoch": 2775} {"train_loss": -24.746536599584374, "global_step": 230407, "epoch": 2775, "val_loss": 6696168.0} {"train_loss": -23.987607955932617, "global_step": 230408, "epoch": 2776} {"train_loss": -23.682294845581055, "global_step": 230409, "epoch": 2776} {"train_loss": -24.09247398376465, "global_step": 230410, "epoch": 2776} {"train_loss": -24.128820419311523, "global_step": 230411, "epoch": 2776} {"train_loss": -23.872543334960938, "global_step": 230412, "epoch": 2776} {"train_loss": -24.33806610107422, "global_step": 230413, "epoch": 2776} {"train_loss": -24.28265953063965, "global_step": 230414, "epoch": 2776} {"train_loss": -24.570680618286133, "global_step": 230415, "epoch": 2776} {"train_loss": -24.432422637939453, "global_step": 230416, "epoch": 2776} {"train_loss": -24.374088287353516, "global_step": 230417, "epoch": 2776} {"train_loss": -24.647741317749023, "global_step": 230418, "epoch": 2776} {"train_loss": -24.678836822509766, "global_step": 230419, "epoch": 2776} {"train_loss": -24.70365333557129, "global_step": 230420, "epoch": 2776} {"train_loss": -24.434852600097656, "global_step": 230421, "epoch": 2776} {"train_loss": -24.823667526245117, "global_step": 230422, "epoch": 2776} {"train_loss": -24.784452438354492, "global_step": 230423, "epoch": 2776} {"train_loss": -24.476791381835938, "global_step": 230424, "epoch": 2776} {"train_loss": -24.7774715423584, "global_step": 230425, "epoch": 2776} {"train_loss": -24.759634017944336, "global_step": 230426, "epoch": 2776} {"train_loss": -24.5185489654541, "global_step": 230427, "epoch": 2776} {"train_loss": -24.458044052124023, "global_step": 230428, "epoch": 2776} {"train_loss": -24.774246215820312, "global_step": 230429, "epoch": 2776} {"train_loss": -24.704320907592773, "global_step": 230430, "epoch": 2776} {"train_loss": -24.64164161682129, "global_step": 230431, "epoch": 2776} {"train_loss": -24.58408546447754, "global_step": 230432, "epoch": 2776} {"train_loss": -24.709096908569336, "global_step": 230433, "epoch": 2776} {"train_loss": -24.925579071044922, "global_step": 230434, "epoch": 2776} {"train_loss": -24.26878547668457, "global_step": 230435, "epoch": 2776} {"train_loss": -24.75463104248047, "global_step": 230436, "epoch": 2776} {"train_loss": -24.948829650878906, "global_step": 230437, "epoch": 2776} {"train_loss": -24.47920036315918, "global_step": 230438, "epoch": 2776} {"train_loss": -24.324094772338867, "global_step": 230439, "epoch": 2776} {"train_loss": -24.444700241088867, "global_step": 230440, "epoch": 2776} {"train_loss": -25.17916488647461, "global_step": 230441, "epoch": 2776} {"train_loss": -24.853261947631836, "global_step": 230442, "epoch": 2776} {"train_loss": -24.7684326171875, "global_step": 230443, "epoch": 2776} {"train_loss": -24.717519760131836, "global_step": 230444, "epoch": 2776} {"train_loss": -24.65804100036621, "global_step": 230445, "epoch": 2776} {"train_loss": -24.644590377807617, "global_step": 230446, "epoch": 2776} {"train_loss": -24.703571319580078, "global_step": 230447, "epoch": 2776} {"train_loss": -24.81426429748535, "global_step": 230448, "epoch": 2776} {"train_loss": -24.496967315673828, "global_step": 230449, "epoch": 2776} {"train_loss": -25.232507705688477, "global_step": 230450, "epoch": 2776} {"train_loss": -25.039457321166992, "global_step": 230451, "epoch": 2776} {"train_loss": -24.7525691986084, "global_step": 230452, "epoch": 2776} {"train_loss": -24.920164108276367, "global_step": 230453, "epoch": 2776} {"train_loss": -24.686166763305664, "global_step": 230454, "epoch": 2776} {"train_loss": -25.08278465270996, "global_step": 230455, "epoch": 2776} {"train_loss": -25.10767936706543, "global_step": 230456, "epoch": 2776} {"train_loss": -24.624923706054688, "global_step": 230457, "epoch": 2776} {"train_loss": -24.416288375854492, "global_step": 230458, "epoch": 2776} {"train_loss": -24.233654022216797, "global_step": 230459, "epoch": 2776} {"train_loss": -24.305768966674805, "global_step": 230460, "epoch": 2776} {"train_loss": -24.068151473999023, "global_step": 230461, "epoch": 2776} {"train_loss": -24.33150291442871, "global_step": 230462, "epoch": 2776} {"train_loss": -24.3623104095459, "global_step": 230463, "epoch": 2776} {"train_loss": -24.615474700927734, "global_step": 230464, "epoch": 2776} {"train_loss": -24.764148712158203, "global_step": 230465, "epoch": 2776} {"train_loss": -24.75601577758789, "global_step": 230466, "epoch": 2776} {"train_loss": -24.407188415527344, "global_step": 230467, "epoch": 2776} {"train_loss": -24.13532066345215, "global_step": 230468, "epoch": 2776} {"train_loss": -24.552356719970703, "global_step": 230469, "epoch": 2776} {"train_loss": -24.49394416809082, "global_step": 230470, "epoch": 2776} {"train_loss": -25.06438636779785, "global_step": 230471, "epoch": 2776} {"train_loss": -24.72251319885254, "global_step": 230472, "epoch": 2776} {"train_loss": -24.55304527282715, "global_step": 230473, "epoch": 2776} {"train_loss": -24.27544593811035, "global_step": 230474, "epoch": 2776} {"train_loss": -24.8789005279541, "global_step": 230475, "epoch": 2776} {"train_loss": -25.31995964050293, "global_step": 230476, "epoch": 2776} {"train_loss": -24.479732513427734, "global_step": 230477, "epoch": 2776} {"train_loss": -24.730993270874023, "global_step": 230478, "epoch": 2776} {"train_loss": -25.09050178527832, "global_step": 230479, "epoch": 2776} {"train_loss": -24.768835067749023, "global_step": 230480, "epoch": 2776} {"train_loss": -24.594741821289062, "global_step": 230481, "epoch": 2776} {"train_loss": -24.720373153686523, "global_step": 230482, "epoch": 2776} {"train_loss": -24.801637649536133, "global_step": 230483, "epoch": 2776} {"train_loss": -24.6474552154541, "global_step": 230484, "epoch": 2776} {"train_loss": -25.100109100341797, "global_step": 230485, "epoch": 2776} {"train_loss": -24.76352310180664, "global_step": 230486, "epoch": 2776} {"train_loss": -25.148740768432617, "global_step": 230487, "epoch": 2776} {"train_loss": -24.399179458618164, "global_step": 230488, "epoch": 2776} {"train_loss": -24.92190933227539, "global_step": 230489, "epoch": 2776} {"train_loss": -24.621576286224, "global_step": 230490, "epoch": 2776, "val_loss": 6619474.0} {"train_loss": -24.475208282470703, "global_step": 230491, "epoch": 2777} {"train_loss": -24.376235961914062, "global_step": 230492, "epoch": 2777} {"train_loss": -24.185789108276367, "global_step": 230493, "epoch": 2777} {"train_loss": -24.273061752319336, "global_step": 230494, "epoch": 2777} {"train_loss": -24.480493545532227, "global_step": 230495, "epoch": 2777} {"train_loss": -24.332876205444336, "global_step": 230496, "epoch": 2777} {"train_loss": -24.400890350341797, "global_step": 230497, "epoch": 2777} {"train_loss": -24.544225692749023, "global_step": 230498, "epoch": 2777} {"train_loss": -24.462478637695312, "global_step": 230499, "epoch": 2777} {"train_loss": -25.03148651123047, "global_step": 230500, "epoch": 2777} {"train_loss": -24.944875717163086, "global_step": 230501, "epoch": 2777} {"train_loss": -24.67894744873047, "global_step": 230502, "epoch": 2777} {"train_loss": -24.51930046081543, "global_step": 230503, "epoch": 2777} {"train_loss": -24.85988426208496, "global_step": 230504, "epoch": 2777} {"train_loss": -24.54692840576172, "global_step": 230505, "epoch": 2777} {"train_loss": -24.794269561767578, "global_step": 230506, "epoch": 2777} {"train_loss": -24.81295394897461, "global_step": 230507, "epoch": 2777} {"train_loss": -24.656009674072266, "global_step": 230508, "epoch": 2777} {"train_loss": -25.033260345458984, "global_step": 230509, "epoch": 2777} {"train_loss": -24.7089786529541, "global_step": 230510, "epoch": 2777} {"train_loss": -24.759206771850586, "global_step": 230511, "epoch": 2777} {"train_loss": -24.594654083251953, "global_step": 230512, "epoch": 2777} {"train_loss": -24.68552589416504, "global_step": 230513, "epoch": 2777} {"train_loss": -25.086767196655273, "global_step": 230514, "epoch": 2777} {"train_loss": -24.665693283081055, "global_step": 230515, "epoch": 2777} {"train_loss": -24.73749542236328, "global_step": 230516, "epoch": 2777} {"train_loss": -24.82291030883789, "global_step": 230517, "epoch": 2777} {"train_loss": -24.923709869384766, "global_step": 230518, "epoch": 2777} {"train_loss": -24.669416427612305, "global_step": 230519, "epoch": 2777} {"train_loss": -24.676971435546875, "global_step": 230520, "epoch": 2777} {"train_loss": -24.884504318237305, "global_step": 230521, "epoch": 2777} {"train_loss": -24.940366744995117, "global_step": 230522, "epoch": 2777} {"train_loss": -24.95290756225586, "global_step": 230523, "epoch": 2777} {"train_loss": -25.192153930664062, "global_step": 230524, "epoch": 2777} {"train_loss": -24.614999771118164, "global_step": 230525, "epoch": 2777} {"train_loss": -24.290136337280273, "global_step": 230526, "epoch": 2777} {"train_loss": -24.80145263671875, "global_step": 230527, "epoch": 2777} {"train_loss": -24.5650691986084, "global_step": 230528, "epoch": 2777} {"train_loss": -24.941221237182617, "global_step": 230529, "epoch": 2777} {"train_loss": -24.279882431030273, "global_step": 230530, "epoch": 2777} {"train_loss": -24.192758560180664, "global_step": 230531, "epoch": 2777} {"train_loss": -24.66879653930664, "global_step": 230532, "epoch": 2777} {"train_loss": -24.746444702148438, "global_step": 230533, "epoch": 2777} {"train_loss": -24.559486389160156, "global_step": 230534, "epoch": 2777} {"train_loss": -24.4447078704834, "global_step": 230535, "epoch": 2777} {"train_loss": -24.836156845092773, "global_step": 230536, "epoch": 2777} {"train_loss": -24.578615188598633, "global_step": 230537, "epoch": 2777} {"train_loss": -24.805700302124023, "global_step": 230538, "epoch": 2777} {"train_loss": -24.672611236572266, "global_step": 230539, "epoch": 2777} {"train_loss": -24.726858139038086, "global_step": 230540, "epoch": 2777} {"train_loss": -25.265592575073242, "global_step": 230541, "epoch": 2777} {"train_loss": -24.804676055908203, "global_step": 230542, "epoch": 2777} {"train_loss": -24.807662963867188, "global_step": 230543, "epoch": 2777} {"train_loss": -24.82652473449707, "global_step": 230544, "epoch": 2777} {"train_loss": -24.469736099243164, "global_step": 230545, "epoch": 2777} {"train_loss": -24.316408157348633, "global_step": 230546, "epoch": 2777} {"train_loss": -24.34229850769043, "global_step": 230547, "epoch": 2777} {"train_loss": -24.310068130493164, "global_step": 230548, "epoch": 2777} {"train_loss": -24.83695411682129, "global_step": 230549, "epoch": 2777} {"train_loss": -24.397125244140625, "global_step": 230550, "epoch": 2777} {"train_loss": -24.79762840270996, "global_step": 230551, "epoch": 2777} {"train_loss": -24.515705108642578, "global_step": 230552, "epoch": 2777} {"train_loss": -25.003204345703125, "global_step": 230553, "epoch": 2777} {"train_loss": -24.861234664916992, "global_step": 230554, "epoch": 2777} {"train_loss": -25.024362564086914, "global_step": 230555, "epoch": 2777} {"train_loss": -24.653949737548828, "global_step": 230556, "epoch": 2777} {"train_loss": -24.73615074157715, "global_step": 230557, "epoch": 2777} {"train_loss": -25.01692008972168, "global_step": 230558, "epoch": 2777} {"train_loss": -24.461397171020508, "global_step": 230559, "epoch": 2777} {"train_loss": -24.73956871032715, "global_step": 230560, "epoch": 2777} {"train_loss": -24.61165428161621, "global_step": 230561, "epoch": 2777} {"train_loss": -24.644760131835938, "global_step": 230562, "epoch": 2777} {"train_loss": -24.842618942260742, "global_step": 230563, "epoch": 2777} {"train_loss": -24.361530303955078, "global_step": 230564, "epoch": 2777} {"train_loss": -25.25313949584961, "global_step": 230565, "epoch": 2777} {"train_loss": -24.41231346130371, "global_step": 230566, "epoch": 2777} {"train_loss": -24.775299072265625, "global_step": 230567, "epoch": 2777} {"train_loss": -24.78299331665039, "global_step": 230568, "epoch": 2777} {"train_loss": -24.86127471923828, "global_step": 230569, "epoch": 2777} {"train_loss": -24.78095054626465, "global_step": 230570, "epoch": 2777} {"train_loss": -24.68877410888672, "global_step": 230571, "epoch": 2777} {"train_loss": -24.74665641784668, "global_step": 230572, "epoch": 2777} {"train_loss": -24.688716658626696, "global_step": 230573, "epoch": 2777, "val_loss": 6817620.0} {"train_loss": -24.358556747436523, "global_step": 230574, "epoch": 2778} {"train_loss": -24.452184677124023, "global_step": 230575, "epoch": 2778} {"train_loss": -24.486661911010742, "global_step": 230576, "epoch": 2778} {"train_loss": -24.47963523864746, "global_step": 230577, "epoch": 2778} {"train_loss": -24.466861724853516, "global_step": 230578, "epoch": 2778} {"train_loss": -24.177976608276367, "global_step": 230579, "epoch": 2778} {"train_loss": -24.457868576049805, "global_step": 230580, "epoch": 2778} {"train_loss": -24.334951400756836, "global_step": 230581, "epoch": 2778} {"train_loss": -24.464405059814453, "global_step": 230582, "epoch": 2778} {"train_loss": -24.636688232421875, "global_step": 230583, "epoch": 2778} {"train_loss": -24.06875991821289, "global_step": 230584, "epoch": 2778} {"train_loss": -24.51373863220215, "global_step": 230585, "epoch": 2778} {"train_loss": -24.239994049072266, "global_step": 230586, "epoch": 2778} {"train_loss": -24.217130661010742, "global_step": 230587, "epoch": 2778} {"train_loss": -24.493574142456055, "global_step": 230588, "epoch": 2778} {"train_loss": -24.60536766052246, "global_step": 230589, "epoch": 2778} {"train_loss": -24.300527572631836, "global_step": 230590, "epoch": 2778} {"train_loss": -24.409563064575195, "global_step": 230591, "epoch": 2778} {"train_loss": -24.4417724609375, "global_step": 230592, "epoch": 2778} {"train_loss": -24.440385818481445, "global_step": 230593, "epoch": 2778} {"train_loss": -24.78694725036621, "global_step": 230594, "epoch": 2778} {"train_loss": -24.508075714111328, "global_step": 230595, "epoch": 2778} {"train_loss": -24.421417236328125, "global_step": 230596, "epoch": 2778} {"train_loss": -24.56361198425293, "global_step": 230597, "epoch": 2778} {"train_loss": -24.580617904663086, "global_step": 230598, "epoch": 2778} {"train_loss": -24.32107162475586, "global_step": 230599, "epoch": 2778} {"train_loss": -24.75812530517578, "global_step": 230600, "epoch": 2778} {"train_loss": -24.512561798095703, "global_step": 230601, "epoch": 2778} {"train_loss": -24.761350631713867, "global_step": 230602, "epoch": 2778} {"train_loss": -24.67329978942871, "global_step": 230603, "epoch": 2778} {"train_loss": -24.447301864624023, "global_step": 230604, "epoch": 2778} {"train_loss": -24.635862350463867, "global_step": 230605, "epoch": 2778} {"train_loss": -24.436565399169922, "global_step": 230606, "epoch": 2778} {"train_loss": -24.412817001342773, "global_step": 230607, "epoch": 2778} {"train_loss": -24.853376388549805, "global_step": 230608, "epoch": 2778} {"train_loss": -24.739994049072266, "global_step": 230609, "epoch": 2778} {"train_loss": -24.47479248046875, "global_step": 230610, "epoch": 2778} {"train_loss": -24.764556884765625, "global_step": 230611, "epoch": 2778} {"train_loss": -24.57198143005371, "global_step": 230612, "epoch": 2778} {"train_loss": -24.869604110717773, "global_step": 230613, "epoch": 2778} {"train_loss": -24.719724655151367, "global_step": 230614, "epoch": 2778} {"train_loss": -25.04031753540039, "global_step": 230615, "epoch": 2778} {"train_loss": -24.959548950195312, "global_step": 230616, "epoch": 2778} {"train_loss": -24.58970069885254, "global_step": 230617, "epoch": 2778} {"train_loss": -24.846860885620117, "global_step": 230618, "epoch": 2778} {"train_loss": -24.916799545288086, "global_step": 230619, "epoch": 2778} {"train_loss": -24.837793350219727, "global_step": 230620, "epoch": 2778} {"train_loss": -25.005558013916016, "global_step": 230621, "epoch": 2778} {"train_loss": -25.24750518798828, "global_step": 230622, "epoch": 2778} {"train_loss": -24.81673240661621, "global_step": 230623, "epoch": 2778} {"train_loss": -24.85414695739746, "global_step": 230624, "epoch": 2778} {"train_loss": -24.892728805541992, "global_step": 230625, "epoch": 2778} {"train_loss": -24.74458885192871, "global_step": 230626, "epoch": 2778} {"train_loss": -24.807172775268555, "global_step": 230627, "epoch": 2778} {"train_loss": -25.263761520385742, "global_step": 230628, "epoch": 2778} {"train_loss": -24.960033416748047, "global_step": 230629, "epoch": 2778} {"train_loss": -25.13240623474121, "global_step": 230630, "epoch": 2778} {"train_loss": -24.936771392822266, "global_step": 230631, "epoch": 2778} {"train_loss": -25.049880981445312, "global_step": 230632, "epoch": 2778} {"train_loss": -24.735074996948242, "global_step": 230633, "epoch": 2778} {"train_loss": -25.36277198791504, "global_step": 230634, "epoch": 2778} {"train_loss": -25.08578872680664, "global_step": 230635, "epoch": 2778} {"train_loss": -24.939115524291992, "global_step": 230636, "epoch": 2778} {"train_loss": -24.583776473999023, "global_step": 230637, "epoch": 2778} {"train_loss": -24.51198387145996, "global_step": 230638, "epoch": 2778} {"train_loss": -24.284543991088867, "global_step": 230639, "epoch": 2778} {"train_loss": -24.139972686767578, "global_step": 230640, "epoch": 2778} {"train_loss": -24.73785400390625, "global_step": 230641, "epoch": 2778} {"train_loss": -24.458023071289062, "global_step": 230642, "epoch": 2778} {"train_loss": -24.279794692993164, "global_step": 230643, "epoch": 2778} {"train_loss": -24.83465003967285, "global_step": 230644, "epoch": 2778} {"train_loss": -24.395816802978516, "global_step": 230645, "epoch": 2778} {"train_loss": -24.61397361755371, "global_step": 230646, "epoch": 2778} {"train_loss": -24.467504501342773, "global_step": 230647, "epoch": 2778} {"train_loss": -24.725631713867188, "global_step": 230648, "epoch": 2778} {"train_loss": -24.79743003845215, "global_step": 230649, "epoch": 2778} {"train_loss": -24.629209518432617, "global_step": 230650, "epoch": 2778} {"train_loss": -24.425024032592773, "global_step": 230651, "epoch": 2778} {"train_loss": -24.53870391845703, "global_step": 230652, "epoch": 2778} {"train_loss": -24.612600326538086, "global_step": 230653, "epoch": 2778} {"train_loss": -24.55739402770996, "global_step": 230654, "epoch": 2778} {"train_loss": -24.996362686157227, "global_step": 230655, "epoch": 2778} {"train_loss": -24.62336363275367, "global_step": 230656, "epoch": 2778, "val_loss": 6714765.0} {"train_loss": -24.540987014770508, "global_step": 230657, "epoch": 2779} {"train_loss": -23.89537239074707, "global_step": 230658, "epoch": 2779} {"train_loss": -24.250370025634766, "global_step": 230659, "epoch": 2779} {"train_loss": -24.435176849365234, "global_step": 230660, "epoch": 2779} {"train_loss": -24.216711044311523, "global_step": 230661, "epoch": 2779} {"train_loss": -24.379188537597656, "global_step": 230662, "epoch": 2779} {"train_loss": -24.660221099853516, "global_step": 230663, "epoch": 2779} {"train_loss": -24.21280860900879, "global_step": 230664, "epoch": 2779} {"train_loss": -24.673460006713867, "global_step": 230665, "epoch": 2779} {"train_loss": -24.480016708374023, "global_step": 230666, "epoch": 2779} {"train_loss": -24.427509307861328, "global_step": 230667, "epoch": 2779} {"train_loss": -24.753055572509766, "global_step": 230668, "epoch": 2779} {"train_loss": -24.587390899658203, "global_step": 230669, "epoch": 2779} {"train_loss": -24.18861198425293, "global_step": 230670, "epoch": 2779} {"train_loss": -24.40327262878418, "global_step": 230671, "epoch": 2779} {"train_loss": -24.675748825073242, "global_step": 230672, "epoch": 2779} {"train_loss": -24.907421112060547, "global_step": 230673, "epoch": 2779} {"train_loss": -24.635055541992188, "global_step": 230674, "epoch": 2779} {"train_loss": -24.59715461730957, "global_step": 230675, "epoch": 2779} {"train_loss": -24.47029685974121, "global_step": 230676, "epoch": 2779} {"train_loss": -24.903427124023438, "global_step": 230677, "epoch": 2779} {"train_loss": -24.89388084411621, "global_step": 230678, "epoch": 2779} {"train_loss": -24.3490047454834, "global_step": 230679, "epoch": 2779} {"train_loss": -24.609996795654297, "global_step": 230680, "epoch": 2779} {"train_loss": -25.121435165405273, "global_step": 230681, "epoch": 2779} {"train_loss": -24.673940658569336, "global_step": 230682, "epoch": 2779} {"train_loss": -24.78598976135254, "global_step": 230683, "epoch": 2779} {"train_loss": -24.29306411743164, "global_step": 230684, "epoch": 2779} {"train_loss": -25.01128578186035, "global_step": 230685, "epoch": 2779} {"train_loss": -24.722442626953125, "global_step": 230686, "epoch": 2779} {"train_loss": -25.01358985900879, "global_step": 230687, "epoch": 2779} {"train_loss": -24.6329345703125, "global_step": 230688, "epoch": 2779} {"train_loss": -24.928525924682617, "global_step": 230689, "epoch": 2779} {"train_loss": -24.3286075592041, "global_step": 230690, "epoch": 2779} {"train_loss": -24.66388511657715, "global_step": 230691, "epoch": 2779} {"train_loss": -24.82280921936035, "global_step": 230692, "epoch": 2779} {"train_loss": -23.973691940307617, "global_step": 230693, "epoch": 2779} {"train_loss": -24.18367576599121, "global_step": 230694, "epoch": 2779} {"train_loss": -24.653135299682617, "global_step": 230695, "epoch": 2779} {"train_loss": -24.625614166259766, "global_step": 230696, "epoch": 2779} {"train_loss": -24.720962524414062, "global_step": 230697, "epoch": 2779} {"train_loss": -24.89430046081543, "global_step": 230698, "epoch": 2779} {"train_loss": -24.71625328063965, "global_step": 230699, "epoch": 2779} {"train_loss": -25.056169509887695, "global_step": 230700, "epoch": 2779} {"train_loss": -24.720516204833984, "global_step": 230701, "epoch": 2779} {"train_loss": -24.504676818847656, "global_step": 230702, "epoch": 2779} {"train_loss": -24.5517520904541, "global_step": 230703, "epoch": 2779} {"train_loss": -24.696792602539062, "global_step": 230704, "epoch": 2779} {"train_loss": -24.645709991455078, "global_step": 230705, "epoch": 2779} {"train_loss": -25.184354782104492, "global_step": 230706, "epoch": 2779} {"train_loss": -24.608861923217773, "global_step": 230707, "epoch": 2779} {"train_loss": -24.85261344909668, "global_step": 230708, "epoch": 2779} {"train_loss": -24.511554718017578, "global_step": 230709, "epoch": 2779} {"train_loss": -25.05156898498535, "global_step": 230710, "epoch": 2779} {"train_loss": -24.362407684326172, "global_step": 230711, "epoch": 2779} {"train_loss": -25.017898559570312, "global_step": 230712, "epoch": 2779} {"train_loss": -24.695966720581055, "global_step": 230713, "epoch": 2779} {"train_loss": -24.724822998046875, "global_step": 230714, "epoch": 2779} {"train_loss": -24.704252243041992, "global_step": 230715, "epoch": 2779} {"train_loss": -24.529865264892578, "global_step": 230716, "epoch": 2779} {"train_loss": -24.625642776489258, "global_step": 230717, "epoch": 2779} {"train_loss": -24.723163604736328, "global_step": 230718, "epoch": 2779} {"train_loss": -24.999351501464844, "global_step": 230719, "epoch": 2779} {"train_loss": -24.483675003051758, "global_step": 230720, "epoch": 2779} {"train_loss": -24.791772842407227, "global_step": 230721, "epoch": 2779} {"train_loss": -24.593441009521484, "global_step": 230722, "epoch": 2779} {"train_loss": -25.23423194885254, "global_step": 230723, "epoch": 2779} {"train_loss": -24.98042106628418, "global_step": 230724, "epoch": 2779} {"train_loss": -24.789600372314453, "global_step": 230725, "epoch": 2779} {"train_loss": -24.832441329956055, "global_step": 230726, "epoch": 2779} {"train_loss": -24.53402328491211, "global_step": 230727, "epoch": 2779} {"train_loss": -25.015838623046875, "global_step": 230728, "epoch": 2779} {"train_loss": -24.892841339111328, "global_step": 230729, "epoch": 2779} {"train_loss": -24.807092666625977, "global_step": 230730, "epoch": 2779} {"train_loss": -24.747177124023438, "global_step": 230731, "epoch": 2779} {"train_loss": -24.968223571777344, "global_step": 230732, "epoch": 2779} {"train_loss": -24.37213706970215, "global_step": 230733, "epoch": 2779} {"train_loss": -24.709197998046875, "global_step": 230734, "epoch": 2779} {"train_loss": -25.14976692199707, "global_step": 230735, "epoch": 2779} {"train_loss": -24.939130783081055, "global_step": 230736, "epoch": 2779} {"train_loss": -25.027063369750977, "global_step": 230737, "epoch": 2779} {"train_loss": -24.6503963470459, "global_step": 230738, "epoch": 2779} {"train_loss": -24.686106118811182, "global_step": 230739, "epoch": 2779, "val_loss": 6625605.0} {"train_loss": -24.676054000854492, "global_step": 230740, "epoch": 2780} {"train_loss": -24.438892364501953, "global_step": 230741, "epoch": 2780} {"train_loss": -24.51154327392578, "global_step": 230742, "epoch": 2780} {"train_loss": -24.45067024230957, "global_step": 230743, "epoch": 2780} {"train_loss": -24.416929244995117, "global_step": 230744, "epoch": 2780} {"train_loss": -24.319765090942383, "global_step": 230745, "epoch": 2780} {"train_loss": -24.404638290405273, "global_step": 230746, "epoch": 2780} {"train_loss": -25.03053855895996, "global_step": 230747, "epoch": 2780} {"train_loss": -24.575489044189453, "global_step": 230748, "epoch": 2780} {"train_loss": -24.75240135192871, "global_step": 230749, "epoch": 2780} {"train_loss": -24.351160049438477, "global_step": 230750, "epoch": 2780} {"train_loss": -24.59250831604004, "global_step": 230751, "epoch": 2780} {"train_loss": -24.802770614624023, "global_step": 230752, "epoch": 2780} {"train_loss": -24.58629608154297, "global_step": 230753, "epoch": 2780} {"train_loss": -24.632083892822266, "global_step": 230754, "epoch": 2780} {"train_loss": -24.52351188659668, "global_step": 230755, "epoch": 2780} {"train_loss": -24.547195434570312, "global_step": 230756, "epoch": 2780} {"train_loss": -24.894298553466797, "global_step": 230757, "epoch": 2780} {"train_loss": -24.855104446411133, "global_step": 230758, "epoch": 2780} {"train_loss": -24.8636474609375, "global_step": 230759, "epoch": 2780} {"train_loss": -24.465002059936523, "global_step": 230760, "epoch": 2780} {"train_loss": -24.761884689331055, "global_step": 230761, "epoch": 2780} {"train_loss": -24.50828742980957, "global_step": 230762, "epoch": 2780} {"train_loss": -24.85040855407715, "global_step": 230763, "epoch": 2780} {"train_loss": -24.870258331298828, "global_step": 230764, "epoch": 2780} {"train_loss": -24.554969787597656, "global_step": 230765, "epoch": 2780} {"train_loss": -24.63743019104004, "global_step": 230766, "epoch": 2780} {"train_loss": -24.69856834411621, "global_step": 230767, "epoch": 2780} {"train_loss": -24.92168617248535, "global_step": 230768, "epoch": 2780} {"train_loss": -24.91659927368164, "global_step": 230769, "epoch": 2780} {"train_loss": -24.734277725219727, "global_step": 230770, "epoch": 2780} {"train_loss": -24.864212036132812, "global_step": 230771, "epoch": 2780} {"train_loss": -24.9757022857666, "global_step": 230772, "epoch": 2780} {"train_loss": -24.833372116088867, "global_step": 230773, "epoch": 2780} {"train_loss": -24.877431869506836, "global_step": 230774, "epoch": 2780} {"train_loss": -24.479690551757812, "global_step": 230775, "epoch": 2780} {"train_loss": -24.80238914489746, "global_step": 230776, "epoch": 2780} {"train_loss": -25.118650436401367, "global_step": 230777, "epoch": 2780} {"train_loss": -25.078100204467773, "global_step": 230778, "epoch": 2780} {"train_loss": -24.602819442749023, "global_step": 230779, "epoch": 2780} {"train_loss": -24.567813873291016, "global_step": 230780, "epoch": 2780} {"train_loss": -24.642494201660156, "global_step": 230781, "epoch": 2780} {"train_loss": -24.784387588500977, "global_step": 230782, "epoch": 2780} {"train_loss": -25.184171676635742, "global_step": 230783, "epoch": 2780} {"train_loss": -24.514307022094727, "global_step": 230784, "epoch": 2780} {"train_loss": -24.933815002441406, "global_step": 230785, "epoch": 2780} {"train_loss": -25.094736099243164, "global_step": 230786, "epoch": 2780} {"train_loss": -24.4846134185791, "global_step": 230787, "epoch": 2780} {"train_loss": -24.83357048034668, "global_step": 230788, "epoch": 2780} {"train_loss": -24.5332088470459, "global_step": 230789, "epoch": 2780} {"train_loss": -24.794111251831055, "global_step": 230790, "epoch": 2780} {"train_loss": -24.13510513305664, "global_step": 230791, "epoch": 2780} {"train_loss": -23.022802352905273, "global_step": 230792, "epoch": 2780} {"train_loss": -23.2338924407959, "global_step": 230793, "epoch": 2780} {"train_loss": -24.53391456604004, "global_step": 230794, "epoch": 2780} {"train_loss": -24.76479721069336, "global_step": 230795, "epoch": 2780} {"train_loss": -24.127979278564453, "global_step": 230796, "epoch": 2780} {"train_loss": -24.39350700378418, "global_step": 230797, "epoch": 2780} {"train_loss": -24.499332427978516, "global_step": 230798, "epoch": 2780} {"train_loss": -24.335098266601562, "global_step": 230799, "epoch": 2780} {"train_loss": -23.985273361206055, "global_step": 230800, "epoch": 2780} {"train_loss": -24.56269645690918, "global_step": 230801, "epoch": 2780} {"train_loss": -24.934070587158203, "global_step": 230802, "epoch": 2780} {"train_loss": -24.672618865966797, "global_step": 230803, "epoch": 2780} {"train_loss": -24.249677658081055, "global_step": 230804, "epoch": 2780} {"train_loss": -24.485977172851562, "global_step": 230805, "epoch": 2780} {"train_loss": -24.300251007080078, "global_step": 230806, "epoch": 2780} {"train_loss": -24.691499710083008, "global_step": 230807, "epoch": 2780} {"train_loss": -24.432205200195312, "global_step": 230808, "epoch": 2780} {"train_loss": -24.369375228881836, "global_step": 230809, "epoch": 2780} {"train_loss": -25.00473403930664, "global_step": 230810, "epoch": 2780} {"train_loss": -24.784982681274414, "global_step": 230811, "epoch": 2780} {"train_loss": -24.50428581237793, "global_step": 230812, "epoch": 2780} {"train_loss": -24.077512741088867, "global_step": 230813, "epoch": 2780} {"train_loss": -24.26380729675293, "global_step": 230814, "epoch": 2780} {"train_loss": -24.317731857299805, "global_step": 230815, "epoch": 2780} {"train_loss": -24.71748924255371, "global_step": 230816, "epoch": 2780} {"train_loss": -24.701147079467773, "global_step": 230817, "epoch": 2780} {"train_loss": -24.916635513305664, "global_step": 230818, "epoch": 2780} {"train_loss": -24.437204360961914, "global_step": 230819, "epoch": 2780} {"train_loss": -24.803407669067383, "global_step": 230820, "epoch": 2780} {"train_loss": -25.186630249023438, "global_step": 230821, "epoch": 2780} {"train_loss": -24.603067926613683, "global_step": 230822, "epoch": 2780, "val_loss": 6675271.0} {"train_loss": -24.352041244506836, "global_step": 230823, "epoch": 2781} {"train_loss": -24.22041130065918, "global_step": 230824, "epoch": 2781} {"train_loss": -24.68492317199707, "global_step": 230825, "epoch": 2781} {"train_loss": -24.145313262939453, "global_step": 230826, "epoch": 2781} {"train_loss": -24.32675552368164, "global_step": 230827, "epoch": 2781} {"train_loss": -24.696369171142578, "global_step": 230828, "epoch": 2781} {"train_loss": -24.244752883911133, "global_step": 230829, "epoch": 2781} {"train_loss": -24.290307998657227, "global_step": 230830, "epoch": 2781} {"train_loss": -24.393465042114258, "global_step": 230831, "epoch": 2781} {"train_loss": -24.976652145385742, "global_step": 230832, "epoch": 2781} {"train_loss": -24.81052589416504, "global_step": 230833, "epoch": 2781} {"train_loss": -24.642658233642578, "global_step": 230834, "epoch": 2781} {"train_loss": -24.65107536315918, "global_step": 230835, "epoch": 2781} {"train_loss": -24.476377487182617, "global_step": 230836, "epoch": 2781} {"train_loss": -24.994001388549805, "global_step": 230837, "epoch": 2781} {"train_loss": -24.310165405273438, "global_step": 230838, "epoch": 2781} {"train_loss": -24.562692642211914, "global_step": 230839, "epoch": 2781} {"train_loss": -24.686059951782227, "global_step": 230840, "epoch": 2781} {"train_loss": -24.853561401367188, "global_step": 230841, "epoch": 2781} {"train_loss": -24.993181228637695, "global_step": 230842, "epoch": 2781} {"train_loss": -24.7244815826416, "global_step": 230843, "epoch": 2781} {"train_loss": -24.663211822509766, "global_step": 230844, "epoch": 2781} {"train_loss": -24.699575424194336, "global_step": 230845, "epoch": 2781} {"train_loss": -24.55512809753418, "global_step": 230846, "epoch": 2781} {"train_loss": -24.484838485717773, "global_step": 230847, "epoch": 2781} {"train_loss": -24.538480758666992, "global_step": 230848, "epoch": 2781} {"train_loss": -24.741514205932617, "global_step": 230849, "epoch": 2781} {"train_loss": -24.775243759155273, "global_step": 230850, "epoch": 2781} {"train_loss": -24.760610580444336, "global_step": 230851, "epoch": 2781} {"train_loss": -24.35021209716797, "global_step": 230852, "epoch": 2781} {"train_loss": -24.833173751831055, "global_step": 230853, "epoch": 2781} {"train_loss": -24.30521583557129, "global_step": 230854, "epoch": 2781} {"train_loss": -24.302661895751953, "global_step": 230855, "epoch": 2781} {"train_loss": -24.84490966796875, "global_step": 230856, "epoch": 2781} {"train_loss": -24.9205379486084, "global_step": 230857, "epoch": 2781} {"train_loss": -24.653186798095703, "global_step": 230858, "epoch": 2781} {"train_loss": -24.689626693725586, "global_step": 230859, "epoch": 2781} {"train_loss": -24.778488159179688, "global_step": 230860, "epoch": 2781} {"train_loss": -24.727550506591797, "global_step": 230861, "epoch": 2781} {"train_loss": -24.725433349609375, "global_step": 230862, "epoch": 2781} {"train_loss": -24.828222274780273, "global_step": 230863, "epoch": 2781} {"train_loss": -24.76279067993164, "global_step": 230864, "epoch": 2781} {"train_loss": -25.139312744140625, "global_step": 230865, "epoch": 2781} {"train_loss": -24.976774215698242, "global_step": 230866, "epoch": 2781} {"train_loss": -24.768774032592773, "global_step": 230867, "epoch": 2781} {"train_loss": -25.055723190307617, "global_step": 230868, "epoch": 2781} {"train_loss": -24.94501495361328, "global_step": 230869, "epoch": 2781} {"train_loss": -24.71591567993164, "global_step": 230870, "epoch": 2781} {"train_loss": -24.7886905670166, "global_step": 230871, "epoch": 2781} {"train_loss": -24.924169540405273, "global_step": 230872, "epoch": 2781} {"train_loss": -25.120737075805664, "global_step": 230873, "epoch": 2781} {"train_loss": -24.859128952026367, "global_step": 230874, "epoch": 2781} {"train_loss": -24.854623794555664, "global_step": 230875, "epoch": 2781} {"train_loss": -24.957441329956055, "global_step": 230876, "epoch": 2781} {"train_loss": -25.1892147064209, "global_step": 230877, "epoch": 2781} {"train_loss": -24.729408264160156, "global_step": 230878, "epoch": 2781} {"train_loss": -24.660049438476562, "global_step": 230879, "epoch": 2781} {"train_loss": -24.960952758789062, "global_step": 230880, "epoch": 2781} {"train_loss": -24.865198135375977, "global_step": 230881, "epoch": 2781} {"train_loss": -24.62253189086914, "global_step": 230882, "epoch": 2781} {"train_loss": -24.478744506835938, "global_step": 230883, "epoch": 2781} {"train_loss": -24.533615112304688, "global_step": 230884, "epoch": 2781} {"train_loss": -24.58138084411621, "global_step": 230885, "epoch": 2781} {"train_loss": -25.0644474029541, "global_step": 230886, "epoch": 2781} {"train_loss": -24.6186580657959, "global_step": 230887, "epoch": 2781} {"train_loss": -24.84406089782715, "global_step": 230888, "epoch": 2781} {"train_loss": -24.569454193115234, "global_step": 230889, "epoch": 2781} {"train_loss": -24.49799919128418, "global_step": 230890, "epoch": 2781} {"train_loss": -25.140878677368164, "global_step": 230891, "epoch": 2781} {"train_loss": -24.488901138305664, "global_step": 230892, "epoch": 2781} {"train_loss": -24.9461727142334, "global_step": 230893, "epoch": 2781} {"train_loss": -25.033689498901367, "global_step": 230894, "epoch": 2781} {"train_loss": -24.784465789794922, "global_step": 230895, "epoch": 2781} {"train_loss": -24.83629608154297, "global_step": 230896, "epoch": 2781} {"train_loss": -24.57352066040039, "global_step": 230897, "epoch": 2781} {"train_loss": -24.740625381469727, "global_step": 230898, "epoch": 2781} {"train_loss": -24.462804794311523, "global_step": 230899, "epoch": 2781} {"train_loss": -24.816783905029297, "global_step": 230900, "epoch": 2781} {"train_loss": -24.491947174072266, "global_step": 230901, "epoch": 2781} {"train_loss": -24.56447410583496, "global_step": 230902, "epoch": 2781} {"train_loss": -24.749414443969727, "global_step": 230903, "epoch": 2781} {"train_loss": -24.87139892578125, "global_step": 230904, "epoch": 2781} {"train_loss": -24.707829969475068, "global_step": 230905, "epoch": 2781, "val_loss": 6800095.5} {"train_loss": -24.211042404174805, "global_step": 230906, "epoch": 2782} {"train_loss": -24.230209350585938, "global_step": 230907, "epoch": 2782} {"train_loss": -24.370651245117188, "global_step": 230908, "epoch": 2782} {"train_loss": -23.95195198059082, "global_step": 230909, "epoch": 2782} {"train_loss": -24.372737884521484, "global_step": 230910, "epoch": 2782} {"train_loss": -24.27179527282715, "global_step": 230911, "epoch": 2782} {"train_loss": -23.678342819213867, "global_step": 230912, "epoch": 2782} {"train_loss": -24.33466911315918, "global_step": 230913, "epoch": 2782} {"train_loss": -24.1711483001709, "global_step": 230914, "epoch": 2782} {"train_loss": -24.144495010375977, "global_step": 230915, "epoch": 2782} {"train_loss": -24.24196434020996, "global_step": 230916, "epoch": 2782} {"train_loss": -24.428773880004883, "global_step": 230917, "epoch": 2782} {"train_loss": -24.2254695892334, "global_step": 230918, "epoch": 2782} {"train_loss": -24.09834098815918, "global_step": 230919, "epoch": 2782} {"train_loss": -24.6182861328125, "global_step": 230920, "epoch": 2782} {"train_loss": -24.6984806060791, "global_step": 230921, "epoch": 2782} {"train_loss": -24.8944149017334, "global_step": 230922, "epoch": 2782} {"train_loss": -24.315553665161133, "global_step": 230923, "epoch": 2782} {"train_loss": -25.065841674804688, "global_step": 230924, "epoch": 2782} {"train_loss": -24.821264266967773, "global_step": 230925, "epoch": 2782} {"train_loss": -24.387985229492188, "global_step": 230926, "epoch": 2782} {"train_loss": -24.697519302368164, "global_step": 230927, "epoch": 2782} {"train_loss": -24.476484298706055, "global_step": 230928, "epoch": 2782} {"train_loss": -24.670124053955078, "global_step": 230929, "epoch": 2782} {"train_loss": -24.41790199279785, "global_step": 230930, "epoch": 2782} {"train_loss": -24.012720108032227, "global_step": 230931, "epoch": 2782} {"train_loss": -24.661788940429688, "global_step": 230932, "epoch": 2782} {"train_loss": -24.814876556396484, "global_step": 230933, "epoch": 2782} {"train_loss": -24.37969398498535, "global_step": 230934, "epoch": 2782} {"train_loss": -25.23555564880371, "global_step": 230935, "epoch": 2782} {"train_loss": -24.55669593811035, "global_step": 230936, "epoch": 2782} {"train_loss": -24.57120132446289, "global_step": 230937, "epoch": 2782} {"train_loss": -24.549694061279297, "global_step": 230938, "epoch": 2782} {"train_loss": -25.11703109741211, "global_step": 230939, "epoch": 2782} {"train_loss": -24.59122085571289, "global_step": 230940, "epoch": 2782} {"train_loss": -24.874542236328125, "global_step": 230941, "epoch": 2782} {"train_loss": -24.644332885742188, "global_step": 230942, "epoch": 2782} {"train_loss": -24.807865142822266, "global_step": 230943, "epoch": 2782} {"train_loss": -24.93423843383789, "global_step": 230944, "epoch": 2782} {"train_loss": -24.752944946289062, "global_step": 230945, "epoch": 2782} {"train_loss": -24.944976806640625, "global_step": 230946, "epoch": 2782} {"train_loss": -24.522106170654297, "global_step": 230947, "epoch": 2782} {"train_loss": -24.755935668945312, "global_step": 230948, "epoch": 2782} {"train_loss": -25.083181381225586, "global_step": 230949, "epoch": 2782} {"train_loss": -25.119367599487305, "global_step": 230950, "epoch": 2782} {"train_loss": -24.79670524597168, "global_step": 230951, "epoch": 2782} {"train_loss": -24.950223922729492, "global_step": 230952, "epoch": 2782} {"train_loss": -24.85462760925293, "global_step": 230953, "epoch": 2782} {"train_loss": -24.842329025268555, "global_step": 230954, "epoch": 2782} {"train_loss": -25.132003784179688, "global_step": 230955, "epoch": 2782} {"train_loss": -25.156505584716797, "global_step": 230956, "epoch": 2782} {"train_loss": -24.688053131103516, "global_step": 230957, "epoch": 2782} {"train_loss": -25.086254119873047, "global_step": 230958, "epoch": 2782} {"train_loss": -24.987905502319336, "global_step": 230959, "epoch": 2782} {"train_loss": -24.778043746948242, "global_step": 230960, "epoch": 2782} {"train_loss": -25.079004287719727, "global_step": 230961, "epoch": 2782} {"train_loss": -25.110349655151367, "global_step": 230962, "epoch": 2782} {"train_loss": -25.2387752532959, "global_step": 230963, "epoch": 2782} {"train_loss": -25.229780197143555, "global_step": 230964, "epoch": 2782} {"train_loss": -24.651609420776367, "global_step": 230965, "epoch": 2782} {"train_loss": -24.688095092773438, "global_step": 230966, "epoch": 2782} {"train_loss": -24.643264770507812, "global_step": 230967, "epoch": 2782} {"train_loss": -24.76924705505371, "global_step": 230968, "epoch": 2782} {"train_loss": -24.324682235717773, "global_step": 230969, "epoch": 2782} {"train_loss": -24.464553833007812, "global_step": 230970, "epoch": 2782} {"train_loss": -24.81130027770996, "global_step": 230971, "epoch": 2782} {"train_loss": -24.697595596313477, "global_step": 230972, "epoch": 2782} {"train_loss": -24.71610450744629, "global_step": 230973, "epoch": 2782} {"train_loss": -24.669431686401367, "global_step": 230974, "epoch": 2782} {"train_loss": -24.56298828125, "global_step": 230975, "epoch": 2782} {"train_loss": -24.939041137695312, "global_step": 230976, "epoch": 2782} {"train_loss": -24.536996841430664, "global_step": 230977, "epoch": 2782} {"train_loss": -24.378103256225586, "global_step": 230978, "epoch": 2782} {"train_loss": -24.572633743286133, "global_step": 230979, "epoch": 2782} {"train_loss": -24.87462615966797, "global_step": 230980, "epoch": 2782} {"train_loss": -24.564828872680664, "global_step": 230981, "epoch": 2782} {"train_loss": -25.050277709960938, "global_step": 230982, "epoch": 2782} {"train_loss": -24.703109741210938, "global_step": 230983, "epoch": 2782} {"train_loss": -24.89522361755371, "global_step": 230984, "epoch": 2782} {"train_loss": -24.703754425048828, "global_step": 230985, "epoch": 2782} {"train_loss": -24.87587547302246, "global_step": 230986, "epoch": 2782} {"train_loss": -24.976709365844727, "global_step": 230987, "epoch": 2782} {"train_loss": -24.673908785165075, "global_step": 230988, "epoch": 2782, "val_loss": 6672406.0} {"train_loss": -24.7744083404541, "global_step": 230989, "epoch": 2783} {"train_loss": -23.81414031982422, "global_step": 230990, "epoch": 2783} {"train_loss": -23.992630004882812, "global_step": 230991, "epoch": 2783} {"train_loss": -24.251440048217773, "global_step": 230992, "epoch": 2783} {"train_loss": -24.394359588623047, "global_step": 230993, "epoch": 2783} {"train_loss": -24.574941635131836, "global_step": 230994, "epoch": 2783} {"train_loss": -24.431020736694336, "global_step": 230995, "epoch": 2783} {"train_loss": -24.00271987915039, "global_step": 230996, "epoch": 2783} {"train_loss": -24.48710060119629, "global_step": 230997, "epoch": 2783} {"train_loss": -24.598026275634766, "global_step": 230998, "epoch": 2783} {"train_loss": -24.777732849121094, "global_step": 230999, "epoch": 2783} {"train_loss": -24.54502296447754, "global_step": 231000, "epoch": 2783} {"train_loss": -24.52887725830078, "global_step": 231001, "epoch": 2783} {"train_loss": -24.885595321655273, "global_step": 231002, "epoch": 2783} {"train_loss": -24.57771873474121, "global_step": 231003, "epoch": 2783} {"train_loss": -24.279550552368164, "global_step": 231004, "epoch": 2783} {"train_loss": -24.56854248046875, "global_step": 231005, "epoch": 2783} {"train_loss": -24.59820556640625, "global_step": 231006, "epoch": 2783} {"train_loss": -24.113752365112305, "global_step": 231007, "epoch": 2783} {"train_loss": -24.50263786315918, "global_step": 231008, "epoch": 2783} {"train_loss": -24.52573013305664, "global_step": 231009, "epoch": 2783} {"train_loss": -24.610158920288086, "global_step": 231010, "epoch": 2783} {"train_loss": -24.350393295288086, "global_step": 231011, "epoch": 2783} {"train_loss": -24.268903732299805, "global_step": 231012, "epoch": 2783} {"train_loss": -24.711679458618164, "global_step": 231013, "epoch": 2783} {"train_loss": -24.676517486572266, "global_step": 231014, "epoch": 2783} {"train_loss": -24.694581985473633, "global_step": 231015, "epoch": 2783} {"train_loss": -24.895572662353516, "global_step": 231016, "epoch": 2783} {"train_loss": -24.321359634399414, "global_step": 231017, "epoch": 2783} {"train_loss": -24.34246826171875, "global_step": 231018, "epoch": 2783} {"train_loss": -24.838781356811523, "global_step": 231019, "epoch": 2783} {"train_loss": -25.087289810180664, "global_step": 231020, "epoch": 2783} {"train_loss": -24.69183349609375, "global_step": 231021, "epoch": 2783} {"train_loss": -24.6901912689209, "global_step": 231022, "epoch": 2783} {"train_loss": -24.539731979370117, "global_step": 231023, "epoch": 2783} {"train_loss": -24.66908073425293, "global_step": 231024, "epoch": 2783} {"train_loss": -24.413799285888672, "global_step": 231025, "epoch": 2783} {"train_loss": -24.608509063720703, "global_step": 231026, "epoch": 2783} {"train_loss": -24.98356056213379, "global_step": 231027, "epoch": 2783} {"train_loss": -25.162534713745117, "global_step": 231028, "epoch": 2783} {"train_loss": -24.9776611328125, "global_step": 231029, "epoch": 2783} {"train_loss": -24.786117553710938, "global_step": 231030, "epoch": 2783} {"train_loss": -24.531665802001953, "global_step": 231031, "epoch": 2783} {"train_loss": -24.475727081298828, "global_step": 231032, "epoch": 2783} {"train_loss": -24.947284698486328, "global_step": 231033, "epoch": 2783} {"train_loss": -24.718008041381836, "global_step": 231034, "epoch": 2783} {"train_loss": -24.674673080444336, "global_step": 231035, "epoch": 2783} {"train_loss": -24.96906852722168, "global_step": 231036, "epoch": 2783} {"train_loss": -24.445287704467773, "global_step": 231037, "epoch": 2783} {"train_loss": -24.658973693847656, "global_step": 231038, "epoch": 2783} {"train_loss": -25.04063606262207, "global_step": 231039, "epoch": 2783} {"train_loss": -24.850618362426758, "global_step": 231040, "epoch": 2783} {"train_loss": -24.848289489746094, "global_step": 231041, "epoch": 2783} {"train_loss": -24.527761459350586, "global_step": 231042, "epoch": 2783} {"train_loss": -24.84640121459961, "global_step": 231043, "epoch": 2783} {"train_loss": -24.617292404174805, "global_step": 231044, "epoch": 2783} {"train_loss": -24.618209838867188, "global_step": 231045, "epoch": 2783} {"train_loss": -24.53302001953125, "global_step": 231046, "epoch": 2783} {"train_loss": -24.645206451416016, "global_step": 231047, "epoch": 2783} {"train_loss": -24.517580032348633, "global_step": 231048, "epoch": 2783} {"train_loss": -24.747175216674805, "global_step": 231049, "epoch": 2783} {"train_loss": -24.594192504882812, "global_step": 231050, "epoch": 2783} {"train_loss": -24.566850662231445, "global_step": 231051, "epoch": 2783} {"train_loss": -24.485973358154297, "global_step": 231052, "epoch": 2783} {"train_loss": -24.7575626373291, "global_step": 231053, "epoch": 2783} {"train_loss": -24.351451873779297, "global_step": 231054, "epoch": 2783} {"train_loss": -24.357091903686523, "global_step": 231055, "epoch": 2783} {"train_loss": -24.613449096679688, "global_step": 231056, "epoch": 2783} {"train_loss": -24.667444229125977, "global_step": 231057, "epoch": 2783} {"train_loss": -24.390668869018555, "global_step": 231058, "epoch": 2783} {"train_loss": -24.62958335876465, "global_step": 231059, "epoch": 2783} {"train_loss": -24.704816818237305, "global_step": 231060, "epoch": 2783} {"train_loss": -24.702526092529297, "global_step": 231061, "epoch": 2783} {"train_loss": -24.68610954284668, "global_step": 231062, "epoch": 2783} {"train_loss": -24.630735397338867, "global_step": 231063, "epoch": 2783} {"train_loss": -24.815149307250977, "global_step": 231064, "epoch": 2783} {"train_loss": -24.75181007385254, "global_step": 231065, "epoch": 2783} {"train_loss": -24.621990203857422, "global_step": 231066, "epoch": 2783} {"train_loss": -24.855478286743164, "global_step": 231067, "epoch": 2783} {"train_loss": -24.739957809448242, "global_step": 231068, "epoch": 2783} {"train_loss": -24.94666862487793, "global_step": 231069, "epoch": 2783} {"train_loss": -24.949995040893555, "global_step": 231070, "epoch": 2783} {"train_loss": -24.620862133531684, "global_step": 231071, "epoch": 2783, "val_loss": 6584366.0} {"train_loss": -24.68914794921875, "global_step": 231072, "epoch": 2784} {"train_loss": -24.661863327026367, "global_step": 231073, "epoch": 2784} {"train_loss": -24.90089225769043, "global_step": 231074, "epoch": 2784} {"train_loss": -24.63637924194336, "global_step": 231075, "epoch": 2784} {"train_loss": -24.74523162841797, "global_step": 231076, "epoch": 2784} {"train_loss": -24.48126983642578, "global_step": 231077, "epoch": 2784} {"train_loss": -24.920242309570312, "global_step": 231078, "epoch": 2784} {"train_loss": -24.934324264526367, "global_step": 231079, "epoch": 2784} {"train_loss": -24.842863082885742, "global_step": 231080, "epoch": 2784} {"train_loss": -24.62083625793457, "global_step": 231081, "epoch": 2784} {"train_loss": -24.790313720703125, "global_step": 231082, "epoch": 2784} {"train_loss": -24.572797775268555, "global_step": 231083, "epoch": 2784} {"train_loss": -24.743261337280273, "global_step": 231084, "epoch": 2784} {"train_loss": -24.679676055908203, "global_step": 231085, "epoch": 2784} {"train_loss": -25.17829704284668, "global_step": 231086, "epoch": 2784} {"train_loss": -24.65100860595703, "global_step": 231087, "epoch": 2784} {"train_loss": -24.54743003845215, "global_step": 231088, "epoch": 2784} {"train_loss": -24.507308959960938, "global_step": 231089, "epoch": 2784} {"train_loss": -25.102081298828125, "global_step": 231090, "epoch": 2784} {"train_loss": -24.546775817871094, "global_step": 231091, "epoch": 2784} {"train_loss": -24.80938720703125, "global_step": 231092, "epoch": 2784} {"train_loss": -24.60382843017578, "global_step": 231093, "epoch": 2784} {"train_loss": -24.786649703979492, "global_step": 231094, "epoch": 2784} {"train_loss": -24.908527374267578, "global_step": 231095, "epoch": 2784} {"train_loss": -24.876388549804688, "global_step": 231096, "epoch": 2784} {"train_loss": -24.678407669067383, "global_step": 231097, "epoch": 2784} {"train_loss": -24.6767635345459, "global_step": 231098, "epoch": 2784} {"train_loss": -24.818052291870117, "global_step": 231099, "epoch": 2784} {"train_loss": -24.67861557006836, "global_step": 231100, "epoch": 2784} {"train_loss": -24.4669132232666, "global_step": 231101, "epoch": 2784} {"train_loss": -24.451993942260742, "global_step": 231102, "epoch": 2784} {"train_loss": -24.459928512573242, "global_step": 231103, "epoch": 2784} {"train_loss": -24.846969604492188, "global_step": 231104, "epoch": 2784} {"train_loss": -25.51722526550293, "global_step": 231105, "epoch": 2784} {"train_loss": -24.726999282836914, "global_step": 231106, "epoch": 2784} {"train_loss": -24.7161922454834, "global_step": 231107, "epoch": 2784} {"train_loss": -24.761470794677734, "global_step": 231108, "epoch": 2784} {"train_loss": -24.673643112182617, "global_step": 231109, "epoch": 2784} {"train_loss": -25.45597267150879, "global_step": 231110, "epoch": 2784} {"train_loss": -24.6215877532959, "global_step": 231111, "epoch": 2784} {"train_loss": -24.75582504272461, "global_step": 231112, "epoch": 2784} {"train_loss": -24.94350242614746, "global_step": 231113, "epoch": 2784} {"train_loss": -24.71365737915039, "global_step": 231114, "epoch": 2784} {"train_loss": -24.69351577758789, "global_step": 231115, "epoch": 2784} {"train_loss": -24.71016502380371, "global_step": 231116, "epoch": 2784} {"train_loss": -24.724538803100586, "global_step": 231117, "epoch": 2784} {"train_loss": -24.653371810913086, "global_step": 231118, "epoch": 2784} {"train_loss": -25.00626564025879, "global_step": 231119, "epoch": 2784} {"train_loss": -24.764942169189453, "global_step": 231120, "epoch": 2784} {"train_loss": -24.740381240844727, "global_step": 231121, "epoch": 2784} {"train_loss": -24.719640731811523, "global_step": 231122, "epoch": 2784} {"train_loss": -24.72258186340332, "global_step": 231123, "epoch": 2784} {"train_loss": -25.065174102783203, "global_step": 231124, "epoch": 2784} {"train_loss": -24.878768920898438, "global_step": 231125, "epoch": 2784} {"train_loss": -24.764541625976562, "global_step": 231126, "epoch": 2784} {"train_loss": -24.626750946044922, "global_step": 231127, "epoch": 2784} {"train_loss": -24.922653198242188, "global_step": 231128, "epoch": 2784} {"train_loss": -24.87580680847168, "global_step": 231129, "epoch": 2784} {"train_loss": -24.748428344726562, "global_step": 231130, "epoch": 2784} {"train_loss": -24.70480728149414, "global_step": 231131, "epoch": 2784} {"train_loss": -24.963544845581055, "global_step": 231132, "epoch": 2784} {"train_loss": -25.08100700378418, "global_step": 231133, "epoch": 2784} {"train_loss": -24.390661239624023, "global_step": 231134, "epoch": 2784} {"train_loss": -25.09341812133789, "global_step": 231135, "epoch": 2784} {"train_loss": -24.798757553100586, "global_step": 231136, "epoch": 2784} {"train_loss": -24.941082000732422, "global_step": 231137, "epoch": 2784} {"train_loss": -24.724502563476562, "global_step": 231138, "epoch": 2784} {"train_loss": -24.846302032470703, "global_step": 231139, "epoch": 2784} {"train_loss": -24.894489288330078, "global_step": 231140, "epoch": 2784} {"train_loss": -24.60964584350586, "global_step": 231141, "epoch": 2784} {"train_loss": -24.546390533447266, "global_step": 231142, "epoch": 2784} {"train_loss": -24.418601989746094, "global_step": 231143, "epoch": 2784} {"train_loss": -24.618192672729492, "global_step": 231144, "epoch": 2784} {"train_loss": -25.139429092407227, "global_step": 231145, "epoch": 2784} {"train_loss": -24.767520904541016, "global_step": 231146, "epoch": 2784} {"train_loss": -24.588043212890625, "global_step": 231147, "epoch": 2784} {"train_loss": -24.707551956176758, "global_step": 231148, "epoch": 2784} {"train_loss": -24.35814094543457, "global_step": 231149, "epoch": 2784} {"train_loss": -24.7337703704834, "global_step": 231150, "epoch": 2784} {"train_loss": -24.931188583374023, "global_step": 231151, "epoch": 2784} {"train_loss": -24.856237411499023, "global_step": 231152, "epoch": 2784} {"train_loss": -24.7562313079834, "global_step": 231153, "epoch": 2784} {"train_loss": -24.777444081134107, "global_step": 231154, "epoch": 2784, "val_loss": 6666888.5} {"train_loss": -23.758014678955078, "global_step": 231155, "epoch": 2785} {"train_loss": -23.831531524658203, "global_step": 231156, "epoch": 2785} {"train_loss": -24.495283126831055, "global_step": 231157, "epoch": 2785} {"train_loss": -23.16883087158203, "global_step": 231158, "epoch": 2785} {"train_loss": -24.0898380279541, "global_step": 231159, "epoch": 2785} {"train_loss": -23.739580154418945, "global_step": 231160, "epoch": 2785} {"train_loss": -23.97079086303711, "global_step": 231161, "epoch": 2785} {"train_loss": -24.17302131652832, "global_step": 231162, "epoch": 2785} {"train_loss": -24.018417358398438, "global_step": 231163, "epoch": 2785} {"train_loss": -23.811660766601562, "global_step": 231164, "epoch": 2785} {"train_loss": -24.219289779663086, "global_step": 231165, "epoch": 2785} {"train_loss": -24.199525833129883, "global_step": 231166, "epoch": 2785} {"train_loss": -24.100868225097656, "global_step": 231167, "epoch": 2785} {"train_loss": -24.106908798217773, "global_step": 231168, "epoch": 2785} {"train_loss": -24.503833770751953, "global_step": 231169, "epoch": 2785} {"train_loss": -24.236713409423828, "global_step": 231170, "epoch": 2785} {"train_loss": -24.479616165161133, "global_step": 231171, "epoch": 2785} {"train_loss": -24.470367431640625, "global_step": 231172, "epoch": 2785} {"train_loss": -24.563085556030273, "global_step": 231173, "epoch": 2785} {"train_loss": -23.99976348876953, "global_step": 231174, "epoch": 2785} {"train_loss": -24.274768829345703, "global_step": 231175, "epoch": 2785} {"train_loss": -24.37303352355957, "global_step": 231176, "epoch": 2785} {"train_loss": -24.350576400756836, "global_step": 231177, "epoch": 2785} {"train_loss": -24.172903060913086, "global_step": 231178, "epoch": 2785} {"train_loss": -24.435718536376953, "global_step": 231179, "epoch": 2785} {"train_loss": -24.51573371887207, "global_step": 231180, "epoch": 2785} {"train_loss": -24.35349464416504, "global_step": 231181, "epoch": 2785} {"train_loss": -24.64405632019043, "global_step": 231182, "epoch": 2785} {"train_loss": -24.539066314697266, "global_step": 231183, "epoch": 2785} {"train_loss": -24.76821517944336, "global_step": 231184, "epoch": 2785} {"train_loss": -24.91029167175293, "global_step": 231185, "epoch": 2785} {"train_loss": -24.596782684326172, "global_step": 231186, "epoch": 2785} {"train_loss": -24.805524826049805, "global_step": 231187, "epoch": 2785} {"train_loss": -24.431732177734375, "global_step": 231188, "epoch": 2785} {"train_loss": -24.322622299194336, "global_step": 231189, "epoch": 2785} {"train_loss": -24.986513137817383, "global_step": 231190, "epoch": 2785} {"train_loss": -24.437042236328125, "global_step": 231191, "epoch": 2785} {"train_loss": -25.0096435546875, "global_step": 231192, "epoch": 2785} {"train_loss": -24.526803970336914, "global_step": 231193, "epoch": 2785} {"train_loss": -24.64788246154785, "global_step": 231194, "epoch": 2785} {"train_loss": -24.358549118041992, "global_step": 231195, "epoch": 2785} {"train_loss": -24.829425811767578, "global_step": 231196, "epoch": 2785} {"train_loss": -24.605680465698242, "global_step": 231197, "epoch": 2785} {"train_loss": -24.689254760742188, "global_step": 231198, "epoch": 2785} {"train_loss": -24.851879119873047, "global_step": 231199, "epoch": 2785} {"train_loss": -24.71946144104004, "global_step": 231200, "epoch": 2785} {"train_loss": -24.456012725830078, "global_step": 231201, "epoch": 2785} {"train_loss": -24.457813262939453, "global_step": 231202, "epoch": 2785} {"train_loss": -24.468896865844727, "global_step": 231203, "epoch": 2785} {"train_loss": -24.550668716430664, "global_step": 231204, "epoch": 2785} {"train_loss": -24.90792465209961, "global_step": 231205, "epoch": 2785} {"train_loss": -24.789722442626953, "global_step": 231206, "epoch": 2785} {"train_loss": -24.651941299438477, "global_step": 231207, "epoch": 2785} {"train_loss": -24.766977310180664, "global_step": 231208, "epoch": 2785} {"train_loss": -24.812585830688477, "global_step": 231209, "epoch": 2785} {"train_loss": -25.016355514526367, "global_step": 231210, "epoch": 2785} {"train_loss": -25.088829040527344, "global_step": 231211, "epoch": 2785} {"train_loss": -25.08519744873047, "global_step": 231212, "epoch": 2785} {"train_loss": -24.302509307861328, "global_step": 231213, "epoch": 2785} {"train_loss": -25.053085327148438, "global_step": 231214, "epoch": 2785} {"train_loss": -24.668132781982422, "global_step": 231215, "epoch": 2785} {"train_loss": -24.480777740478516, "global_step": 231216, "epoch": 2785} {"train_loss": -24.640466690063477, "global_step": 231217, "epoch": 2785} {"train_loss": -24.832321166992188, "global_step": 231218, "epoch": 2785} {"train_loss": -24.48322868347168, "global_step": 231219, "epoch": 2785} {"train_loss": -25.151823043823242, "global_step": 231220, "epoch": 2785} {"train_loss": -25.092872619628906, "global_step": 231221, "epoch": 2785} {"train_loss": -24.77291488647461, "global_step": 231222, "epoch": 2785} {"train_loss": -24.735177993774414, "global_step": 231223, "epoch": 2785} {"train_loss": -24.801660537719727, "global_step": 231224, "epoch": 2785} {"train_loss": -24.941328048706055, "global_step": 231225, "epoch": 2785} {"train_loss": -24.942102432250977, "global_step": 231226, "epoch": 2785} {"train_loss": -24.77286720275879, "global_step": 231227, "epoch": 2785} {"train_loss": -25.046100616455078, "global_step": 231228, "epoch": 2785} {"train_loss": -24.723684310913086, "global_step": 231229, "epoch": 2785} {"train_loss": -24.72435760498047, "global_step": 231230, "epoch": 2785} {"train_loss": -24.940006256103516, "global_step": 231231, "epoch": 2785} {"train_loss": -25.0152645111084, "global_step": 231232, "epoch": 2785} {"train_loss": -24.924776077270508, "global_step": 231233, "epoch": 2785} {"train_loss": -25.026050567626953, "global_step": 231234, "epoch": 2785} {"train_loss": -24.936878204345703, "global_step": 231235, "epoch": 2785} {"train_loss": -24.715818405151367, "global_step": 231236, "epoch": 2785} {"train_loss": -24.574808970991388, "global_step": 231237, "epoch": 2785, "val_loss": 6653097.0} {"train_loss": -23.445571899414062, "global_step": 231238, "epoch": 2786} {"train_loss": -22.943796157836914, "global_step": 231239, "epoch": 2786} {"train_loss": -24.28534698486328, "global_step": 231240, "epoch": 2786} {"train_loss": -23.30164337158203, "global_step": 231241, "epoch": 2786} {"train_loss": -24.291996002197266, "global_step": 231242, "epoch": 2786} {"train_loss": -23.766571044921875, "global_step": 231243, "epoch": 2786} {"train_loss": -23.48896598815918, "global_step": 231244, "epoch": 2786} {"train_loss": -23.93391227722168, "global_step": 231245, "epoch": 2786} {"train_loss": -24.03105926513672, "global_step": 231246, "epoch": 2786} {"train_loss": -22.88442039489746, "global_step": 231247, "epoch": 2786} {"train_loss": -24.285253524780273, "global_step": 231248, "epoch": 2786} {"train_loss": -23.76272964477539, "global_step": 231249, "epoch": 2786} {"train_loss": -23.64113998413086, "global_step": 231250, "epoch": 2786} {"train_loss": -24.17147445678711, "global_step": 231251, "epoch": 2786} {"train_loss": -23.69681739807129, "global_step": 231252, "epoch": 2786} {"train_loss": -24.198715209960938, "global_step": 231253, "epoch": 2786} {"train_loss": -24.162899017333984, "global_step": 231254, "epoch": 2786} {"train_loss": -24.184837341308594, "global_step": 231255, "epoch": 2786} {"train_loss": -24.247365951538086, "global_step": 231256, "epoch": 2786} {"train_loss": -24.038053512573242, "global_step": 231257, "epoch": 2786} {"train_loss": -23.86454200744629, "global_step": 231258, "epoch": 2786} {"train_loss": -24.31287384033203, "global_step": 231259, "epoch": 2786} {"train_loss": -24.247976303100586, "global_step": 231260, "epoch": 2786} {"train_loss": -24.349639892578125, "global_step": 231261, "epoch": 2786} {"train_loss": -24.222761154174805, "global_step": 231262, "epoch": 2786} {"train_loss": -24.37674331665039, "global_step": 231263, "epoch": 2786} {"train_loss": -24.256175994873047, "global_step": 231264, "epoch": 2786} {"train_loss": -24.146577835083008, "global_step": 231265, "epoch": 2786} {"train_loss": -24.26938247680664, "global_step": 231266, "epoch": 2786} {"train_loss": -24.596298217773438, "global_step": 231267, "epoch": 2786} {"train_loss": -24.504026412963867, "global_step": 231268, "epoch": 2786} {"train_loss": -24.706769943237305, "global_step": 231269, "epoch": 2786} {"train_loss": -24.66636848449707, "global_step": 231270, "epoch": 2786} {"train_loss": -24.694473266601562, "global_step": 231271, "epoch": 2786} {"train_loss": -24.729185104370117, "global_step": 231272, "epoch": 2786} {"train_loss": -24.416065216064453, "global_step": 231273, "epoch": 2786} {"train_loss": -24.74785041809082, "global_step": 231274, "epoch": 2786} {"train_loss": -24.847747802734375, "global_step": 231275, "epoch": 2786} {"train_loss": -24.589080810546875, "global_step": 231276, "epoch": 2786} {"train_loss": -24.8770809173584, "global_step": 231277, "epoch": 2786} {"train_loss": -24.8861026763916, "global_step": 231278, "epoch": 2786} {"train_loss": -25.018796920776367, "global_step": 231279, "epoch": 2786} {"train_loss": -25.213237762451172, "global_step": 231280, "epoch": 2786} {"train_loss": -24.931324005126953, "global_step": 231281, "epoch": 2786} {"train_loss": -24.802183151245117, "global_step": 231282, "epoch": 2786} {"train_loss": -24.79096031188965, "global_step": 231283, "epoch": 2786} {"train_loss": -24.5290584564209, "global_step": 231284, "epoch": 2786} {"train_loss": -24.77777862548828, "global_step": 231285, "epoch": 2786} {"train_loss": -24.927339553833008, "global_step": 231286, "epoch": 2786} {"train_loss": -25.01401710510254, "global_step": 231287, "epoch": 2786} {"train_loss": -25.01630210876465, "global_step": 231288, "epoch": 2786} {"train_loss": -24.704011917114258, "global_step": 231289, "epoch": 2786} {"train_loss": -25.018569946289062, "global_step": 231290, "epoch": 2786} {"train_loss": -24.872270584106445, "global_step": 231291, "epoch": 2786} {"train_loss": -25.114879608154297, "global_step": 231292, "epoch": 2786} {"train_loss": -24.70594024658203, "global_step": 231293, "epoch": 2786} {"train_loss": -24.51153564453125, "global_step": 231294, "epoch": 2786} {"train_loss": -24.541976928710938, "global_step": 231295, "epoch": 2786} {"train_loss": -24.792993545532227, "global_step": 231296, "epoch": 2786} {"train_loss": -25.51465606689453, "global_step": 231297, "epoch": 2786} {"train_loss": -24.60560417175293, "global_step": 231298, "epoch": 2786} {"train_loss": -24.785781860351562, "global_step": 231299, "epoch": 2786} {"train_loss": -24.852291107177734, "global_step": 231300, "epoch": 2786} {"train_loss": -24.79632568359375, "global_step": 231301, "epoch": 2786} {"train_loss": -24.53616714477539, "global_step": 231302, "epoch": 2786} {"train_loss": -24.67882537841797, "global_step": 231303, "epoch": 2786} {"train_loss": -24.773801803588867, "global_step": 231304, "epoch": 2786} {"train_loss": -24.54439353942871, "global_step": 231305, "epoch": 2786} {"train_loss": -24.65152359008789, "global_step": 231306, "epoch": 2786} {"train_loss": -25.19601821899414, "global_step": 231307, "epoch": 2786} {"train_loss": -24.720935821533203, "global_step": 231308, "epoch": 2786} {"train_loss": -24.654808044433594, "global_step": 231309, "epoch": 2786} {"train_loss": -24.550888061523438, "global_step": 231310, "epoch": 2786} {"train_loss": -24.789844512939453, "global_step": 231311, "epoch": 2786} {"train_loss": -24.577924728393555, "global_step": 231312, "epoch": 2786} {"train_loss": -24.793155670166016, "global_step": 231313, "epoch": 2786} {"train_loss": -24.587560653686523, "global_step": 231314, "epoch": 2786} {"train_loss": -24.806411743164062, "global_step": 231315, "epoch": 2786} {"train_loss": -24.826711654663086, "global_step": 231316, "epoch": 2786} {"train_loss": -24.590152740478516, "global_step": 231317, "epoch": 2786} {"train_loss": -24.58766746520996, "global_step": 231318, "epoch": 2786} {"train_loss": -24.916000366210938, "global_step": 231319, "epoch": 2786} {"train_loss": -24.494635570480163, "global_step": 231320, "epoch": 2786, "val_loss": 6725291.0} {"train_loss": -24.267189025878906, "global_step": 231321, "epoch": 2787} {"train_loss": -24.871885299682617, "global_step": 231322, "epoch": 2787} {"train_loss": -24.22395133972168, "global_step": 231323, "epoch": 2787} {"train_loss": -24.688688278198242, "global_step": 231324, "epoch": 2787} {"train_loss": -24.429689407348633, "global_step": 231325, "epoch": 2787} {"train_loss": -24.263513565063477, "global_step": 231326, "epoch": 2787} {"train_loss": -24.29020118713379, "global_step": 231327, "epoch": 2787} {"train_loss": -24.488235473632812, "global_step": 231328, "epoch": 2787} {"train_loss": -24.505962371826172, "global_step": 231329, "epoch": 2787} {"train_loss": -24.685041427612305, "global_step": 231330, "epoch": 2787} {"train_loss": -24.597497940063477, "global_step": 231331, "epoch": 2787} {"train_loss": -24.850400924682617, "global_step": 231332, "epoch": 2787} {"train_loss": -24.609535217285156, "global_step": 231333, "epoch": 2787} {"train_loss": -24.856266021728516, "global_step": 231334, "epoch": 2787} {"train_loss": -24.762083053588867, "global_step": 231335, "epoch": 2787} {"train_loss": -24.62172508239746, "global_step": 231336, "epoch": 2787} {"train_loss": -24.535993576049805, "global_step": 231337, "epoch": 2787} {"train_loss": -24.66800880432129, "global_step": 231338, "epoch": 2787} {"train_loss": -25.042936325073242, "global_step": 231339, "epoch": 2787} {"train_loss": -24.799274444580078, "global_step": 231340, "epoch": 2787} {"train_loss": -25.021717071533203, "global_step": 231341, "epoch": 2787} {"train_loss": -24.7575740814209, "global_step": 231342, "epoch": 2787} {"train_loss": -24.874238967895508, "global_step": 231343, "epoch": 2787} {"train_loss": -24.97212028503418, "global_step": 231344, "epoch": 2787} {"train_loss": -24.46647071838379, "global_step": 231345, "epoch": 2787} {"train_loss": -24.74921417236328, "global_step": 231346, "epoch": 2787} {"train_loss": -24.984567642211914, "global_step": 231347, "epoch": 2787} {"train_loss": -24.444242477416992, "global_step": 231348, "epoch": 2787} {"train_loss": -24.841325759887695, "global_step": 231349, "epoch": 2787} {"train_loss": -24.607215881347656, "global_step": 231350, "epoch": 2787} {"train_loss": -24.594491958618164, "global_step": 231351, "epoch": 2787} {"train_loss": -24.760684967041016, "global_step": 231352, "epoch": 2787} {"train_loss": -24.6769962310791, "global_step": 231353, "epoch": 2787} {"train_loss": -24.710176467895508, "global_step": 231354, "epoch": 2787} {"train_loss": -24.57350730895996, "global_step": 231355, "epoch": 2787} {"train_loss": -24.533288955688477, "global_step": 231356, "epoch": 2787} {"train_loss": -24.732677459716797, "global_step": 231357, "epoch": 2787} {"train_loss": -24.83504295349121, "global_step": 231358, "epoch": 2787} {"train_loss": -24.6612548828125, "global_step": 231359, "epoch": 2787} {"train_loss": -24.85508918762207, "global_step": 231360, "epoch": 2787} {"train_loss": -25.03955078125, "global_step": 231361, "epoch": 2787} {"train_loss": -24.742223739624023, "global_step": 231362, "epoch": 2787} {"train_loss": -25.011444091796875, "global_step": 231363, "epoch": 2787} {"train_loss": -24.769378662109375, "global_step": 231364, "epoch": 2787} {"train_loss": -24.794876098632812, "global_step": 231365, "epoch": 2787} {"train_loss": -24.90077018737793, "global_step": 231366, "epoch": 2787} {"train_loss": -24.678924560546875, "global_step": 231367, "epoch": 2787} {"train_loss": -24.883337020874023, "global_step": 231368, "epoch": 2787} {"train_loss": -24.917137145996094, "global_step": 231369, "epoch": 2787} {"train_loss": -25.14331817626953, "global_step": 231370, "epoch": 2787} {"train_loss": -24.92120361328125, "global_step": 231371, "epoch": 2787} {"train_loss": -25.39058494567871, "global_step": 231372, "epoch": 2787} {"train_loss": -24.93084144592285, "global_step": 231373, "epoch": 2787} {"train_loss": -24.74057960510254, "global_step": 231374, "epoch": 2787} {"train_loss": -24.61053466796875, "global_step": 231375, "epoch": 2787} {"train_loss": -25.11920928955078, "global_step": 231376, "epoch": 2787} {"train_loss": -24.828733444213867, "global_step": 231377, "epoch": 2787} {"train_loss": -24.848312377929688, "global_step": 231378, "epoch": 2787} {"train_loss": -24.76894760131836, "global_step": 231379, "epoch": 2787} {"train_loss": -24.5482234954834, "global_step": 231380, "epoch": 2787} {"train_loss": -24.608280181884766, "global_step": 231381, "epoch": 2787} {"train_loss": -24.925735473632812, "global_step": 231382, "epoch": 2787} {"train_loss": -24.76521873474121, "global_step": 231383, "epoch": 2787} {"train_loss": -24.988168716430664, "global_step": 231384, "epoch": 2787} {"train_loss": -25.2203311920166, "global_step": 231385, "epoch": 2787} {"train_loss": -24.796003341674805, "global_step": 231386, "epoch": 2787} {"train_loss": -24.844785690307617, "global_step": 231387, "epoch": 2787} {"train_loss": -24.884611129760742, "global_step": 231388, "epoch": 2787} {"train_loss": -24.966896057128906, "global_step": 231389, "epoch": 2787} {"train_loss": -24.674795150756836, "global_step": 231390, "epoch": 2787} {"train_loss": -24.758825302124023, "global_step": 231391, "epoch": 2787} {"train_loss": -24.903453826904297, "global_step": 231392, "epoch": 2787} {"train_loss": -25.040739059448242, "global_step": 231393, "epoch": 2787} {"train_loss": -25.11386489868164, "global_step": 231394, "epoch": 2787} {"train_loss": -24.922212600708008, "global_step": 231395, "epoch": 2787} {"train_loss": -25.084386825561523, "global_step": 231396, "epoch": 2787} {"train_loss": -24.686050415039062, "global_step": 231397, "epoch": 2787} {"train_loss": -24.891931533813477, "global_step": 231398, "epoch": 2787} {"train_loss": -24.927200317382812, "global_step": 231399, "epoch": 2787} {"train_loss": -24.704334259033203, "global_step": 231400, "epoch": 2787} {"train_loss": -24.39327621459961, "global_step": 231401, "epoch": 2787} {"train_loss": -24.30584716796875, "global_step": 231402, "epoch": 2787} {"train_loss": -24.766158115432923, "global_step": 231403, "epoch": 2787, "val_loss": 6739037.0} {"train_loss": -23.380826950073242, "global_step": 231404, "epoch": 2788} {"train_loss": -21.973779678344727, "global_step": 231405, "epoch": 2788} {"train_loss": -23.26649284362793, "global_step": 231406, "epoch": 2788} {"train_loss": -23.781150817871094, "global_step": 231407, "epoch": 2788} {"train_loss": -22.97828483581543, "global_step": 231408, "epoch": 2788} {"train_loss": -23.764333724975586, "global_step": 231409, "epoch": 2788} {"train_loss": -22.441675186157227, "global_step": 231410, "epoch": 2788} {"train_loss": -23.625680923461914, "global_step": 231411, "epoch": 2788} {"train_loss": -23.40907096862793, "global_step": 231412, "epoch": 2788} {"train_loss": -23.68605613708496, "global_step": 231413, "epoch": 2788} {"train_loss": -23.96188735961914, "global_step": 231414, "epoch": 2788} {"train_loss": -23.459016799926758, "global_step": 231415, "epoch": 2788} {"train_loss": -24.142126083374023, "global_step": 231416, "epoch": 2788} {"train_loss": -24.147275924682617, "global_step": 231417, "epoch": 2788} {"train_loss": -23.567468643188477, "global_step": 231418, "epoch": 2788} {"train_loss": -23.559675216674805, "global_step": 231419, "epoch": 2788} {"train_loss": -23.851293563842773, "global_step": 231420, "epoch": 2788} {"train_loss": -24.173091888427734, "global_step": 231421, "epoch": 2788} {"train_loss": -23.940763473510742, "global_step": 231422, "epoch": 2788} {"train_loss": -24.209745407104492, "global_step": 231423, "epoch": 2788} {"train_loss": -24.120037078857422, "global_step": 231424, "epoch": 2788} {"train_loss": -23.943025588989258, "global_step": 231425, "epoch": 2788} {"train_loss": -24.13392448425293, "global_step": 231426, "epoch": 2788} {"train_loss": -24.27480697631836, "global_step": 231427, "epoch": 2788} {"train_loss": -24.10706901550293, "global_step": 231428, "epoch": 2788} {"train_loss": -24.344186782836914, "global_step": 231429, "epoch": 2788} {"train_loss": -24.069293975830078, "global_step": 231430, "epoch": 2788} {"train_loss": -24.139833450317383, "global_step": 231431, "epoch": 2788} {"train_loss": -23.962249755859375, "global_step": 231432, "epoch": 2788} {"train_loss": -24.3049259185791, "global_step": 231433, "epoch": 2788} {"train_loss": -24.5335693359375, "global_step": 231434, "epoch": 2788} {"train_loss": -24.355175018310547, "global_step": 231435, "epoch": 2788} {"train_loss": -24.665002822875977, "global_step": 231436, "epoch": 2788} {"train_loss": -24.956876754760742, "global_step": 231437, "epoch": 2788} {"train_loss": -24.485666275024414, "global_step": 231438, "epoch": 2788} {"train_loss": -24.425291061401367, "global_step": 231439, "epoch": 2788} {"train_loss": -24.682567596435547, "global_step": 231440, "epoch": 2788} {"train_loss": -24.491397857666016, "global_step": 231441, "epoch": 2788} {"train_loss": -24.625707626342773, "global_step": 231442, "epoch": 2788} {"train_loss": -24.86847496032715, "global_step": 231443, "epoch": 2788} {"train_loss": -24.683523178100586, "global_step": 231444, "epoch": 2788} {"train_loss": -24.576215744018555, "global_step": 231445, "epoch": 2788} {"train_loss": -24.79194450378418, "global_step": 231446, "epoch": 2788} {"train_loss": -24.836990356445312, "global_step": 231447, "epoch": 2788} {"train_loss": -24.217082977294922, "global_step": 231448, "epoch": 2788} {"train_loss": -24.585172653198242, "global_step": 231449, "epoch": 2788} {"train_loss": -24.86956787109375, "global_step": 231450, "epoch": 2788} {"train_loss": -24.925390243530273, "global_step": 231451, "epoch": 2788} {"train_loss": -24.804685592651367, "global_step": 231452, "epoch": 2788} {"train_loss": -24.85352897644043, "global_step": 231453, "epoch": 2788} {"train_loss": -25.015356063842773, "global_step": 231454, "epoch": 2788} {"train_loss": -24.905210494995117, "global_step": 231455, "epoch": 2788} {"train_loss": -24.941120147705078, "global_step": 231456, "epoch": 2788} {"train_loss": -24.790985107421875, "global_step": 231457, "epoch": 2788} {"train_loss": -24.635358810424805, "global_step": 231458, "epoch": 2788} {"train_loss": -24.77552604675293, "global_step": 231459, "epoch": 2788} {"train_loss": -24.561988830566406, "global_step": 231460, "epoch": 2788} {"train_loss": -24.062124252319336, "global_step": 231461, "epoch": 2788} {"train_loss": -24.304195404052734, "global_step": 231462, "epoch": 2788} {"train_loss": -24.43231773376465, "global_step": 231463, "epoch": 2788} {"train_loss": -24.346181869506836, "global_step": 231464, "epoch": 2788} {"train_loss": -24.718717575073242, "global_step": 231465, "epoch": 2788} {"train_loss": -24.80929183959961, "global_step": 231466, "epoch": 2788} {"train_loss": -24.59992790222168, "global_step": 231467, "epoch": 2788} {"train_loss": -24.8691463470459, "global_step": 231468, "epoch": 2788} {"train_loss": -25.101530075073242, "global_step": 231469, "epoch": 2788} {"train_loss": -24.886123657226562, "global_step": 231470, "epoch": 2788} {"train_loss": -24.728445053100586, "global_step": 231471, "epoch": 2788} {"train_loss": -24.969995498657227, "global_step": 231472, "epoch": 2788} {"train_loss": -24.35655403137207, "global_step": 231473, "epoch": 2788} {"train_loss": -24.78931999206543, "global_step": 231474, "epoch": 2788} {"train_loss": -24.890460968017578, "global_step": 231475, "epoch": 2788} {"train_loss": -24.654111862182617, "global_step": 231476, "epoch": 2788} {"train_loss": -24.417112350463867, "global_step": 231477, "epoch": 2788} {"train_loss": -24.998981475830078, "global_step": 231478, "epoch": 2788} {"train_loss": -24.67481803894043, "global_step": 231479, "epoch": 2788} {"train_loss": -24.665674209594727, "global_step": 231480, "epoch": 2788} {"train_loss": -24.541250228881836, "global_step": 231481, "epoch": 2788} {"train_loss": -24.732358932495117, "global_step": 231482, "epoch": 2788} {"train_loss": -24.826608657836914, "global_step": 231483, "epoch": 2788} {"train_loss": -24.566720962524414, "global_step": 231484, "epoch": 2788} {"train_loss": -24.656076431274414, "global_step": 231485, "epoch": 2788} {"train_loss": -24.33349843772061, "global_step": 231486, "epoch": 2788, "val_loss": 6723001.0} {"train_loss": -23.79925537109375, "global_step": 231487, "epoch": 2789} {"train_loss": -23.971494674682617, "global_step": 231488, "epoch": 2789} {"train_loss": -24.095661163330078, "global_step": 231489, "epoch": 2789} {"train_loss": -24.06194305419922, "global_step": 231490, "epoch": 2789} {"train_loss": -23.812185287475586, "global_step": 231491, "epoch": 2789} {"train_loss": -24.1656551361084, "global_step": 231492, "epoch": 2789} {"train_loss": -23.761240005493164, "global_step": 231493, "epoch": 2789} {"train_loss": -24.138296127319336, "global_step": 231494, "epoch": 2789} {"train_loss": -24.370281219482422, "global_step": 231495, "epoch": 2789} {"train_loss": -24.016843795776367, "global_step": 231496, "epoch": 2789} {"train_loss": -24.448238372802734, "global_step": 231497, "epoch": 2789} {"train_loss": -24.406753540039062, "global_step": 231498, "epoch": 2789} {"train_loss": -24.258939743041992, "global_step": 231499, "epoch": 2789} {"train_loss": -24.629276275634766, "global_step": 231500, "epoch": 2789} {"train_loss": -24.390867233276367, "global_step": 231501, "epoch": 2789} {"train_loss": -24.426273345947266, "global_step": 231502, "epoch": 2789} {"train_loss": -24.149351119995117, "global_step": 231503, "epoch": 2789} {"train_loss": -24.192827224731445, "global_step": 231504, "epoch": 2789} {"train_loss": -24.385150909423828, "global_step": 231505, "epoch": 2789} {"train_loss": -24.354581832885742, "global_step": 231506, "epoch": 2789} {"train_loss": -24.555051803588867, "global_step": 231507, "epoch": 2789} {"train_loss": -24.339679718017578, "global_step": 231508, "epoch": 2789} {"train_loss": -24.927576065063477, "global_step": 231509, "epoch": 2789} {"train_loss": -24.525869369506836, "global_step": 231510, "epoch": 2789} {"train_loss": -24.46595573425293, "global_step": 231511, "epoch": 2789} {"train_loss": -25.086883544921875, "global_step": 231512, "epoch": 2789} {"train_loss": -24.781049728393555, "global_step": 231513, "epoch": 2789} {"train_loss": -24.809181213378906, "global_step": 231514, "epoch": 2789} {"train_loss": -25.166608810424805, "global_step": 231515, "epoch": 2789} {"train_loss": -24.8714542388916, "global_step": 231516, "epoch": 2789} {"train_loss": -24.072996139526367, "global_step": 231517, "epoch": 2789} {"train_loss": -24.51808738708496, "global_step": 231518, "epoch": 2789} {"train_loss": -24.697418212890625, "global_step": 231519, "epoch": 2789} {"train_loss": -24.616790771484375, "global_step": 231520, "epoch": 2789} {"train_loss": -25.050323486328125, "global_step": 231521, "epoch": 2789} {"train_loss": -24.857547760009766, "global_step": 231522, "epoch": 2789} {"train_loss": -24.87454605102539, "global_step": 231523, "epoch": 2789} {"train_loss": -24.607816696166992, "global_step": 231524, "epoch": 2789} {"train_loss": -24.98764419555664, "global_step": 231525, "epoch": 2789} {"train_loss": -24.79079246520996, "global_step": 231526, "epoch": 2789} {"train_loss": -24.8687801361084, "global_step": 231527, "epoch": 2789} {"train_loss": -24.903079986572266, "global_step": 231528, "epoch": 2789} {"train_loss": -24.523082733154297, "global_step": 231529, "epoch": 2789} {"train_loss": -24.6832218170166, "global_step": 231530, "epoch": 2789} {"train_loss": -24.95713996887207, "global_step": 231531, "epoch": 2789} {"train_loss": -24.944971084594727, "global_step": 231532, "epoch": 2789} {"train_loss": -24.681079864501953, "global_step": 231533, "epoch": 2789} {"train_loss": -24.94759750366211, "global_step": 231534, "epoch": 2789} {"train_loss": -24.70515251159668, "global_step": 231535, "epoch": 2789} {"train_loss": -24.842634201049805, "global_step": 231536, "epoch": 2789} {"train_loss": -24.868247985839844, "global_step": 231537, "epoch": 2789} {"train_loss": -24.632144927978516, "global_step": 231538, "epoch": 2789} {"train_loss": -24.83588981628418, "global_step": 231539, "epoch": 2789} {"train_loss": -25.059484481811523, "global_step": 231540, "epoch": 2789} {"train_loss": -25.144346237182617, "global_step": 231541, "epoch": 2789} {"train_loss": -24.663679122924805, "global_step": 231542, "epoch": 2789} {"train_loss": -24.74452018737793, "global_step": 231543, "epoch": 2789} {"train_loss": -24.67732048034668, "global_step": 231544, "epoch": 2789} {"train_loss": -24.55155372619629, "global_step": 231545, "epoch": 2789} {"train_loss": -24.888870239257812, "global_step": 231546, "epoch": 2789} {"train_loss": -24.86785125732422, "global_step": 231547, "epoch": 2789} {"train_loss": -24.809860229492188, "global_step": 231548, "epoch": 2789} {"train_loss": -24.948955535888672, "global_step": 231549, "epoch": 2789} {"train_loss": -24.792203903198242, "global_step": 231550, "epoch": 2789} {"train_loss": -25.26325225830078, "global_step": 231551, "epoch": 2789} {"train_loss": -24.876787185668945, "global_step": 231552, "epoch": 2789} {"train_loss": -24.763498306274414, "global_step": 231553, "epoch": 2789} {"train_loss": -24.774412155151367, "global_step": 231554, "epoch": 2789} {"train_loss": -24.583059310913086, "global_step": 231555, "epoch": 2789} {"train_loss": -24.84600830078125, "global_step": 231556, "epoch": 2789} {"train_loss": -25.275371551513672, "global_step": 231557, "epoch": 2789} {"train_loss": -25.099403381347656, "global_step": 231558, "epoch": 2789} {"train_loss": -24.547523498535156, "global_step": 231559, "epoch": 2789} {"train_loss": -24.55415916442871, "global_step": 231560, "epoch": 2789} {"train_loss": -24.8551025390625, "global_step": 231561, "epoch": 2789} {"train_loss": -24.82903480529785, "global_step": 231562, "epoch": 2789} {"train_loss": -25.302318572998047, "global_step": 231563, "epoch": 2789} {"train_loss": -25.089431762695312, "global_step": 231564, "epoch": 2789} {"train_loss": -24.682748794555664, "global_step": 231565, "epoch": 2789} {"train_loss": -24.629892349243164, "global_step": 231566, "epoch": 2789} {"train_loss": -24.676647186279297, "global_step": 231567, "epoch": 2789} {"train_loss": -24.889312744140625, "global_step": 231568, "epoch": 2789} {"train_loss": -24.672930637037897, "global_step": 231569, "epoch": 2789, "val_loss": 6645284.0} {"train_loss": -24.19693946838379, "global_step": 231570, "epoch": 2790} {"train_loss": -24.367313385009766, "global_step": 231571, "epoch": 2790} {"train_loss": -24.289596557617188, "global_step": 231572, "epoch": 2790} {"train_loss": -24.6204776763916, "global_step": 231573, "epoch": 2790} {"train_loss": -24.233448028564453, "global_step": 231574, "epoch": 2790} {"train_loss": -24.418264389038086, "global_step": 231575, "epoch": 2790} {"train_loss": -24.041095733642578, "global_step": 231576, "epoch": 2790} {"train_loss": -23.94990348815918, "global_step": 231577, "epoch": 2790} {"train_loss": -24.66534423828125, "global_step": 231578, "epoch": 2790} {"train_loss": -23.898056030273438, "global_step": 231579, "epoch": 2790} {"train_loss": -24.375783920288086, "global_step": 231580, "epoch": 2790} {"train_loss": -24.169971466064453, "global_step": 231581, "epoch": 2790} {"train_loss": -24.044483184814453, "global_step": 231582, "epoch": 2790} {"train_loss": -24.634746551513672, "global_step": 231583, "epoch": 2790} {"train_loss": -24.46802520751953, "global_step": 231584, "epoch": 2790} {"train_loss": -24.502798080444336, "global_step": 231585, "epoch": 2790} {"train_loss": -24.546661376953125, "global_step": 231586, "epoch": 2790} {"train_loss": -24.519559860229492, "global_step": 231587, "epoch": 2790} {"train_loss": -24.563732147216797, "global_step": 231588, "epoch": 2790} {"train_loss": -24.67768096923828, "global_step": 231589, "epoch": 2790} {"train_loss": -24.490468978881836, "global_step": 231590, "epoch": 2790} {"train_loss": -24.596372604370117, "global_step": 231591, "epoch": 2790} {"train_loss": -24.633136749267578, "global_step": 231592, "epoch": 2790} {"train_loss": -24.859434127807617, "global_step": 231593, "epoch": 2790} {"train_loss": -24.667705535888672, "global_step": 231594, "epoch": 2790} {"train_loss": -24.45754623413086, "global_step": 231595, "epoch": 2790} {"train_loss": -24.747386932373047, "global_step": 231596, "epoch": 2790} {"train_loss": -24.724531173706055, "global_step": 231597, "epoch": 2790} {"train_loss": -24.891096115112305, "global_step": 231598, "epoch": 2790} {"train_loss": -24.683156967163086, "global_step": 231599, "epoch": 2790} {"train_loss": -25.101917266845703, "global_step": 231600, "epoch": 2790} {"train_loss": -25.17235565185547, "global_step": 231601, "epoch": 2790} {"train_loss": -24.31391716003418, "global_step": 231602, "epoch": 2790} {"train_loss": -24.703062057495117, "global_step": 231603, "epoch": 2790} {"train_loss": -24.986547470092773, "global_step": 231604, "epoch": 2790} {"train_loss": -25.01093864440918, "global_step": 231605, "epoch": 2790} {"train_loss": -24.75649070739746, "global_step": 231606, "epoch": 2790} {"train_loss": -24.937559127807617, "global_step": 231607, "epoch": 2790} {"train_loss": -24.680097579956055, "global_step": 231608, "epoch": 2790} {"train_loss": -24.819486618041992, "global_step": 231609, "epoch": 2790} {"train_loss": -24.888280868530273, "global_step": 231610, "epoch": 2790} {"train_loss": -24.71573257446289, "global_step": 231611, "epoch": 2790} {"train_loss": -24.847078323364258, "global_step": 231612, "epoch": 2790} {"train_loss": -25.075008392333984, "global_step": 231613, "epoch": 2790} {"train_loss": -24.99204444885254, "global_step": 231614, "epoch": 2790} {"train_loss": -24.73605728149414, "global_step": 231615, "epoch": 2790} {"train_loss": -24.74953269958496, "global_step": 231616, "epoch": 2790} {"train_loss": -24.993810653686523, "global_step": 231617, "epoch": 2790} {"train_loss": -24.784963607788086, "global_step": 231618, "epoch": 2790} {"train_loss": -24.74362564086914, "global_step": 231619, "epoch": 2790} {"train_loss": -24.49053192138672, "global_step": 231620, "epoch": 2790} {"train_loss": -24.274906158447266, "global_step": 231621, "epoch": 2790} {"train_loss": -24.33941078186035, "global_step": 231622, "epoch": 2790} {"train_loss": -24.306777954101562, "global_step": 231623, "epoch": 2790} {"train_loss": -24.391786575317383, "global_step": 231624, "epoch": 2790} {"train_loss": -24.550344467163086, "global_step": 231625, "epoch": 2790} {"train_loss": -24.711013793945312, "global_step": 231626, "epoch": 2790} {"train_loss": -24.70210075378418, "global_step": 231627, "epoch": 2790} {"train_loss": -24.76552963256836, "global_step": 231628, "epoch": 2790} {"train_loss": -24.777297973632812, "global_step": 231629, "epoch": 2790} {"train_loss": -24.75669288635254, "global_step": 231630, "epoch": 2790} {"train_loss": -24.622512817382812, "global_step": 231631, "epoch": 2790} {"train_loss": -24.556320190429688, "global_step": 231632, "epoch": 2790} {"train_loss": -24.913541793823242, "global_step": 231633, "epoch": 2790} {"train_loss": -24.656482696533203, "global_step": 231634, "epoch": 2790} {"train_loss": -24.358304977416992, "global_step": 231635, "epoch": 2790} {"train_loss": -24.87127685546875, "global_step": 231636, "epoch": 2790} {"train_loss": -24.429279327392578, "global_step": 231637, "epoch": 2790} {"train_loss": -24.638784408569336, "global_step": 231638, "epoch": 2790} {"train_loss": -24.82309341430664, "global_step": 231639, "epoch": 2790} {"train_loss": -24.845731735229492, "global_step": 231640, "epoch": 2790} {"train_loss": -24.70549964904785, "global_step": 231641, "epoch": 2790} {"train_loss": -25.1508846282959, "global_step": 231642, "epoch": 2790} {"train_loss": -24.890737533569336, "global_step": 231643, "epoch": 2790} {"train_loss": -25.037805557250977, "global_step": 231644, "epoch": 2790} {"train_loss": -24.974905014038086, "global_step": 231645, "epoch": 2790} {"train_loss": -24.77202796936035, "global_step": 231646, "epoch": 2790} {"train_loss": -24.627643585205078, "global_step": 231647, "epoch": 2790} {"train_loss": -24.682315826416016, "global_step": 231648, "epoch": 2790} {"train_loss": -24.875364303588867, "global_step": 231649, "epoch": 2790} {"train_loss": -24.69977378845215, "global_step": 231650, "epoch": 2790} {"train_loss": -24.816024780273438, "global_step": 231651, "epoch": 2790} {"train_loss": -24.64341949554811, "global_step": 231652, "epoch": 2790, "val_loss": 6620900.0} {"train_loss": -24.596288681030273, "global_step": 231653, "epoch": 2791} {"train_loss": -24.103857040405273, "global_step": 231654, "epoch": 2791} {"train_loss": -24.624460220336914, "global_step": 231655, "epoch": 2791} {"train_loss": -24.485761642456055, "global_step": 231656, "epoch": 2791} {"train_loss": -24.420303344726562, "global_step": 231657, "epoch": 2791} {"train_loss": -24.50034523010254, "global_step": 231658, "epoch": 2791} {"train_loss": -24.213335037231445, "global_step": 231659, "epoch": 2791} {"train_loss": -25.30140495300293, "global_step": 231660, "epoch": 2791} {"train_loss": -24.53631591796875, "global_step": 231661, "epoch": 2791} {"train_loss": -24.724727630615234, "global_step": 231662, "epoch": 2791} {"train_loss": -24.26909828186035, "global_step": 231663, "epoch": 2791} {"train_loss": -24.852582931518555, "global_step": 231664, "epoch": 2791} {"train_loss": -24.682741165161133, "global_step": 231665, "epoch": 2791} {"train_loss": -24.687673568725586, "global_step": 231666, "epoch": 2791} {"train_loss": -24.408071517944336, "global_step": 231667, "epoch": 2791} {"train_loss": -24.799365997314453, "global_step": 231668, "epoch": 2791} {"train_loss": -24.702726364135742, "global_step": 231669, "epoch": 2791} {"train_loss": -24.82671356201172, "global_step": 231670, "epoch": 2791} {"train_loss": -24.70170021057129, "global_step": 231671, "epoch": 2791} {"train_loss": -24.47365379333496, "global_step": 231672, "epoch": 2791} {"train_loss": -24.625776290893555, "global_step": 231673, "epoch": 2791} {"train_loss": -24.684965133666992, "global_step": 231674, "epoch": 2791} {"train_loss": -24.80190086364746, "global_step": 231675, "epoch": 2791} {"train_loss": -24.96714210510254, "global_step": 231676, "epoch": 2791} {"train_loss": -24.585447311401367, "global_step": 231677, "epoch": 2791} {"train_loss": -24.89347267150879, "global_step": 231678, "epoch": 2791} {"train_loss": -25.01390838623047, "global_step": 231679, "epoch": 2791} {"train_loss": -24.8528995513916, "global_step": 231680, "epoch": 2791} {"train_loss": -24.534692764282227, "global_step": 231681, "epoch": 2791} {"train_loss": -24.91094398498535, "global_step": 231682, "epoch": 2791} {"train_loss": -24.96274185180664, "global_step": 231683, "epoch": 2791} {"train_loss": -24.614643096923828, "global_step": 231684, "epoch": 2791} {"train_loss": -25.142648696899414, "global_step": 231685, "epoch": 2791} {"train_loss": -24.961713790893555, "global_step": 231686, "epoch": 2791} {"train_loss": -25.057361602783203, "global_step": 231687, "epoch": 2791} {"train_loss": -24.76898193359375, "global_step": 231688, "epoch": 2791} {"train_loss": -24.706768035888672, "global_step": 231689, "epoch": 2791} {"train_loss": -25.042078018188477, "global_step": 231690, "epoch": 2791} {"train_loss": -25.07257652282715, "global_step": 231691, "epoch": 2791} {"train_loss": -24.540943145751953, "global_step": 231692, "epoch": 2791} {"train_loss": -24.602529525756836, "global_step": 231693, "epoch": 2791} {"train_loss": -24.82758903503418, "global_step": 231694, "epoch": 2791} {"train_loss": -24.69482421875, "global_step": 231695, "epoch": 2791} {"train_loss": -24.809139251708984, "global_step": 231696, "epoch": 2791} {"train_loss": -24.702442169189453, "global_step": 231697, "epoch": 2791} {"train_loss": -24.74428939819336, "global_step": 231698, "epoch": 2791} {"train_loss": -24.777563095092773, "global_step": 231699, "epoch": 2791} {"train_loss": -24.79998779296875, "global_step": 231700, "epoch": 2791} {"train_loss": -24.849254608154297, "global_step": 231701, "epoch": 2791} {"train_loss": -24.878149032592773, "global_step": 231702, "epoch": 2791} {"train_loss": -24.80390739440918, "global_step": 231703, "epoch": 2791} {"train_loss": -24.68452262878418, "global_step": 231704, "epoch": 2791} {"train_loss": -25.039443969726562, "global_step": 231705, "epoch": 2791} {"train_loss": -24.07403564453125, "global_step": 231706, "epoch": 2791} {"train_loss": -24.382169723510742, "global_step": 231707, "epoch": 2791} {"train_loss": -24.74951934814453, "global_step": 231708, "epoch": 2791} {"train_loss": -24.613332748413086, "global_step": 231709, "epoch": 2791} {"train_loss": -24.737380981445312, "global_step": 231710, "epoch": 2791} {"train_loss": -24.612119674682617, "global_step": 231711, "epoch": 2791} {"train_loss": -24.35480499267578, "global_step": 231712, "epoch": 2791} {"train_loss": -24.491193771362305, "global_step": 231713, "epoch": 2791} {"train_loss": -24.67325210571289, "global_step": 231714, "epoch": 2791} {"train_loss": -24.39594841003418, "global_step": 231715, "epoch": 2791} {"train_loss": -24.226682662963867, "global_step": 231716, "epoch": 2791} {"train_loss": -24.28400993347168, "global_step": 231717, "epoch": 2791} {"train_loss": -24.701547622680664, "global_step": 231718, "epoch": 2791} {"train_loss": -24.604352951049805, "global_step": 231719, "epoch": 2791} {"train_loss": -24.774709701538086, "global_step": 231720, "epoch": 2791} {"train_loss": -25.095802307128906, "global_step": 231721, "epoch": 2791} {"train_loss": -25.148103713989258, "global_step": 231722, "epoch": 2791} {"train_loss": -24.68134307861328, "global_step": 231723, "epoch": 2791} {"train_loss": -24.73284339904785, "global_step": 231724, "epoch": 2791} {"train_loss": -24.679433822631836, "global_step": 231725, "epoch": 2791} {"train_loss": -24.264404296875, "global_step": 231726, "epoch": 2791} {"train_loss": -25.107330322265625, "global_step": 231727, "epoch": 2791} {"train_loss": -24.610559463500977, "global_step": 231728, "epoch": 2791} {"train_loss": -24.7702693939209, "global_step": 231729, "epoch": 2791} {"train_loss": -25.173099517822266, "global_step": 231730, "epoch": 2791} {"train_loss": -25.109277725219727, "global_step": 231731, "epoch": 2791} {"train_loss": -24.966901779174805, "global_step": 231732, "epoch": 2791} {"train_loss": -24.555166244506836, "global_step": 231733, "epoch": 2791} {"train_loss": -24.596595764160156, "global_step": 231734, "epoch": 2791} {"train_loss": -24.707757857908685, "global_step": 231735, "epoch": 2791, "val_loss": 6747210.5} {"train_loss": -24.197795867919922, "global_step": 231736, "epoch": 2792} {"train_loss": -24.339441299438477, "global_step": 231737, "epoch": 2792} {"train_loss": -24.406095504760742, "global_step": 231738, "epoch": 2792} {"train_loss": -24.30080795288086, "global_step": 231739, "epoch": 2792} {"train_loss": -24.707509994506836, "global_step": 231740, "epoch": 2792} {"train_loss": -24.531253814697266, "global_step": 231741, "epoch": 2792} {"train_loss": -24.645166397094727, "global_step": 231742, "epoch": 2792} {"train_loss": -24.23836326599121, "global_step": 231743, "epoch": 2792} {"train_loss": -24.418081283569336, "global_step": 231744, "epoch": 2792} {"train_loss": -24.787832260131836, "global_step": 231745, "epoch": 2792} {"train_loss": -24.459814071655273, "global_step": 231746, "epoch": 2792} {"train_loss": -24.37632942199707, "global_step": 231747, "epoch": 2792} {"train_loss": -24.579809188842773, "global_step": 231748, "epoch": 2792} {"train_loss": -24.831439971923828, "global_step": 231749, "epoch": 2792} {"train_loss": -24.591596603393555, "global_step": 231750, "epoch": 2792} {"train_loss": -24.539291381835938, "global_step": 231751, "epoch": 2792} {"train_loss": -24.56121826171875, "global_step": 231752, "epoch": 2792} {"train_loss": -24.869550704956055, "global_step": 231753, "epoch": 2792} {"train_loss": -24.57172966003418, "global_step": 231754, "epoch": 2792} {"train_loss": -24.59273338317871, "global_step": 231755, "epoch": 2792} {"train_loss": -24.632854461669922, "global_step": 231756, "epoch": 2792} {"train_loss": -24.41859245300293, "global_step": 231757, "epoch": 2792} {"train_loss": -24.548816680908203, "global_step": 231758, "epoch": 2792} {"train_loss": -24.68708610534668, "global_step": 231759, "epoch": 2792} {"train_loss": -24.737943649291992, "global_step": 231760, "epoch": 2792} {"train_loss": -24.822298049926758, "global_step": 231761, "epoch": 2792} {"train_loss": -24.802942276000977, "global_step": 231762, "epoch": 2792} {"train_loss": -25.083284378051758, "global_step": 231763, "epoch": 2792} {"train_loss": -24.53952980041504, "global_step": 231764, "epoch": 2792} {"train_loss": -24.730594635009766, "global_step": 231765, "epoch": 2792} {"train_loss": -24.276752471923828, "global_step": 231766, "epoch": 2792} {"train_loss": -25.11297035217285, "global_step": 231767, "epoch": 2792} {"train_loss": -25.114429473876953, "global_step": 231768, "epoch": 2792} {"train_loss": -25.01357078552246, "global_step": 231769, "epoch": 2792} {"train_loss": -24.537595748901367, "global_step": 231770, "epoch": 2792} {"train_loss": -24.470836639404297, "global_step": 231771, "epoch": 2792} {"train_loss": -24.508398056030273, "global_step": 231772, "epoch": 2792} {"train_loss": -24.471094131469727, "global_step": 231773, "epoch": 2792} {"train_loss": -24.602134704589844, "global_step": 231774, "epoch": 2792} {"train_loss": -24.394563674926758, "global_step": 231775, "epoch": 2792} {"train_loss": -24.63376808166504, "global_step": 231776, "epoch": 2792} {"train_loss": -24.686017990112305, "global_step": 231777, "epoch": 2792} {"train_loss": -24.69523048400879, "global_step": 231778, "epoch": 2792} {"train_loss": -24.88789176940918, "global_step": 231779, "epoch": 2792} {"train_loss": -25.026697158813477, "global_step": 231780, "epoch": 2792} {"train_loss": -24.734046936035156, "global_step": 231781, "epoch": 2792} {"train_loss": -24.868127822875977, "global_step": 231782, "epoch": 2792} {"train_loss": -24.622760772705078, "global_step": 231783, "epoch": 2792} {"train_loss": -24.837169647216797, "global_step": 231784, "epoch": 2792} {"train_loss": -24.50516128540039, "global_step": 231785, "epoch": 2792} {"train_loss": -24.527206420898438, "global_step": 231786, "epoch": 2792} {"train_loss": -24.92253303527832, "global_step": 231787, "epoch": 2792} {"train_loss": -24.53127098083496, "global_step": 231788, "epoch": 2792} {"train_loss": -24.743844985961914, "global_step": 231789, "epoch": 2792} {"train_loss": -24.919546127319336, "global_step": 231790, "epoch": 2792} {"train_loss": -24.6876220703125, "global_step": 231791, "epoch": 2792} {"train_loss": -24.517393112182617, "global_step": 231792, "epoch": 2792} {"train_loss": -25.02016258239746, "global_step": 231793, "epoch": 2792} {"train_loss": -24.702627182006836, "global_step": 231794, "epoch": 2792} {"train_loss": -24.48807144165039, "global_step": 231795, "epoch": 2792} {"train_loss": -24.398475646972656, "global_step": 231796, "epoch": 2792} {"train_loss": -24.664331436157227, "global_step": 231797, "epoch": 2792} {"train_loss": -24.90854835510254, "global_step": 231798, "epoch": 2792} {"train_loss": -24.140493392944336, "global_step": 231799, "epoch": 2792} {"train_loss": -24.61445426940918, "global_step": 231800, "epoch": 2792} {"train_loss": -24.5347843170166, "global_step": 231801, "epoch": 2792} {"train_loss": -24.821964263916016, "global_step": 231802, "epoch": 2792} {"train_loss": -24.931903839111328, "global_step": 231803, "epoch": 2792} {"train_loss": -24.557491302490234, "global_step": 231804, "epoch": 2792} {"train_loss": -24.370746612548828, "global_step": 231805, "epoch": 2792} {"train_loss": -24.69685935974121, "global_step": 231806, "epoch": 2792} {"train_loss": -25.057939529418945, "global_step": 231807, "epoch": 2792} {"train_loss": -24.898813247680664, "global_step": 231808, "epoch": 2792} {"train_loss": -24.807819366455078, "global_step": 231809, "epoch": 2792} {"train_loss": -25.109678268432617, "global_step": 231810, "epoch": 2792} {"train_loss": -24.522186279296875, "global_step": 231811, "epoch": 2792} {"train_loss": -25.26421356201172, "global_step": 231812, "epoch": 2792} {"train_loss": -24.80377769470215, "global_step": 231813, "epoch": 2792} {"train_loss": -23.948936462402344, "global_step": 231814, "epoch": 2792} {"train_loss": -24.864906311035156, "global_step": 231815, "epoch": 2792} {"train_loss": -24.955625534057617, "global_step": 231816, "epoch": 2792} {"train_loss": -24.880599975585938, "global_step": 231817, "epoch": 2792} {"train_loss": -24.682930888899836, "global_step": 231818, "epoch": 2792, "val_loss": 6763012.0} {"train_loss": -23.985685348510742, "global_step": 231819, "epoch": 2793} {"train_loss": -22.858922958374023, "global_step": 231820, "epoch": 2793} {"train_loss": -24.28609275817871, "global_step": 231821, "epoch": 2793} {"train_loss": -24.027307510375977, "global_step": 231822, "epoch": 2793} {"train_loss": -23.739015579223633, "global_step": 231823, "epoch": 2793} {"train_loss": -24.387771606445312, "global_step": 231824, "epoch": 2793} {"train_loss": -24.114246368408203, "global_step": 231825, "epoch": 2793} {"train_loss": -24.190488815307617, "global_step": 231826, "epoch": 2793} {"train_loss": -24.273853302001953, "global_step": 231827, "epoch": 2793} {"train_loss": -24.56049156188965, "global_step": 231828, "epoch": 2793} {"train_loss": -24.548181533813477, "global_step": 231829, "epoch": 2793} {"train_loss": -24.6342830657959, "global_step": 231830, "epoch": 2793} {"train_loss": -24.468219757080078, "global_step": 231831, "epoch": 2793} {"train_loss": -24.1937198638916, "global_step": 231832, "epoch": 2793} {"train_loss": -24.42799949645996, "global_step": 231833, "epoch": 2793} {"train_loss": -24.624258041381836, "global_step": 231834, "epoch": 2793} {"train_loss": -24.594030380249023, "global_step": 231835, "epoch": 2793} {"train_loss": -24.217235565185547, "global_step": 231836, "epoch": 2793} {"train_loss": -24.540870666503906, "global_step": 231837, "epoch": 2793} {"train_loss": -24.4906005859375, "global_step": 231838, "epoch": 2793} {"train_loss": -24.3305606842041, "global_step": 231839, "epoch": 2793} {"train_loss": -24.174304962158203, "global_step": 231840, "epoch": 2793} {"train_loss": -24.63556480407715, "global_step": 231841, "epoch": 2793} {"train_loss": -24.419334411621094, "global_step": 231842, "epoch": 2793} {"train_loss": -24.57367706298828, "global_step": 231843, "epoch": 2793} {"train_loss": -24.62135887145996, "global_step": 231844, "epoch": 2793} {"train_loss": -24.537405014038086, "global_step": 231845, "epoch": 2793} {"train_loss": -24.575321197509766, "global_step": 231846, "epoch": 2793} {"train_loss": -24.739206314086914, "global_step": 231847, "epoch": 2793} {"train_loss": -24.49349594116211, "global_step": 231848, "epoch": 2793} {"train_loss": -24.631834030151367, "global_step": 231849, "epoch": 2793} {"train_loss": -24.589523315429688, "global_step": 231850, "epoch": 2793} {"train_loss": -24.478971481323242, "global_step": 231851, "epoch": 2793} {"train_loss": -24.741344451904297, "global_step": 231852, "epoch": 2793} {"train_loss": -24.591737747192383, "global_step": 231853, "epoch": 2793} {"train_loss": -24.91016387939453, "global_step": 231854, "epoch": 2793} {"train_loss": -25.176801681518555, "global_step": 231855, "epoch": 2793} {"train_loss": -24.866544723510742, "global_step": 231856, "epoch": 2793} {"train_loss": -24.479101181030273, "global_step": 231857, "epoch": 2793} {"train_loss": -24.858108520507812, "global_step": 231858, "epoch": 2793} {"train_loss": -24.910377502441406, "global_step": 231859, "epoch": 2793} {"train_loss": -25.194793701171875, "global_step": 231860, "epoch": 2793} {"train_loss": -24.8343448638916, "global_step": 231861, "epoch": 2793} {"train_loss": -25.191967010498047, "global_step": 231862, "epoch": 2793} {"train_loss": -24.63022232055664, "global_step": 231863, "epoch": 2793} {"train_loss": -24.794496536254883, "global_step": 231864, "epoch": 2793} {"train_loss": -24.73834228515625, "global_step": 231865, "epoch": 2793} {"train_loss": -24.677154541015625, "global_step": 231866, "epoch": 2793} {"train_loss": -25.293825149536133, "global_step": 231867, "epoch": 2793} {"train_loss": -24.88994789123535, "global_step": 231868, "epoch": 2793} {"train_loss": -24.920103073120117, "global_step": 231869, "epoch": 2793} {"train_loss": -24.679616928100586, "global_step": 231870, "epoch": 2793} {"train_loss": -25.23353385925293, "global_step": 231871, "epoch": 2793} {"train_loss": -24.692523956298828, "global_step": 231872, "epoch": 2793} {"train_loss": -25.197620391845703, "global_step": 231873, "epoch": 2793} {"train_loss": -24.454771041870117, "global_step": 231874, "epoch": 2793} {"train_loss": -25.016769409179688, "global_step": 231875, "epoch": 2793} {"train_loss": -25.218141555786133, "global_step": 231876, "epoch": 2793} {"train_loss": -25.259260177612305, "global_step": 231877, "epoch": 2793} {"train_loss": -24.457456588745117, "global_step": 231878, "epoch": 2793} {"train_loss": -25.116430282592773, "global_step": 231879, "epoch": 2793} {"train_loss": -24.924585342407227, "global_step": 231880, "epoch": 2793} {"train_loss": -24.342885971069336, "global_step": 231881, "epoch": 2793} {"train_loss": -24.054702758789062, "global_step": 231882, "epoch": 2793} {"train_loss": -24.629507064819336, "global_step": 231883, "epoch": 2793} {"train_loss": -23.694154739379883, "global_step": 231884, "epoch": 2793} {"train_loss": -24.69209098815918, "global_step": 231885, "epoch": 2793} {"train_loss": -23.791784286499023, "global_step": 231886, "epoch": 2793} {"train_loss": -23.610580444335938, "global_step": 231887, "epoch": 2793} {"train_loss": -24.549802780151367, "global_step": 231888, "epoch": 2793} {"train_loss": -24.306737899780273, "global_step": 231889, "epoch": 2793} {"train_loss": -24.36652183532715, "global_step": 231890, "epoch": 2793} {"train_loss": -24.460851669311523, "global_step": 231891, "epoch": 2793} {"train_loss": -24.67417335510254, "global_step": 231892, "epoch": 2793} {"train_loss": -24.465709686279297, "global_step": 231893, "epoch": 2793} {"train_loss": -24.60302734375, "global_step": 231894, "epoch": 2793} {"train_loss": -24.855792999267578, "global_step": 231895, "epoch": 2793} {"train_loss": -24.68505859375, "global_step": 231896, "epoch": 2793} {"train_loss": -24.299545288085938, "global_step": 231897, "epoch": 2793} {"train_loss": -24.514245986938477, "global_step": 231898, "epoch": 2793} {"train_loss": -24.408937454223633, "global_step": 231899, "epoch": 2793} {"train_loss": -24.57020378112793, "global_step": 231900, "epoch": 2793} {"train_loss": -24.544547437185265, "global_step": 231901, "epoch": 2793, "val_loss": 6655682.0} {"train_loss": -24.492189407348633, "global_step": 231902, "epoch": 2794} {"train_loss": -24.48221778869629, "global_step": 231903, "epoch": 2794} {"train_loss": -24.147262573242188, "global_step": 231904, "epoch": 2794} {"train_loss": -24.683246612548828, "global_step": 231905, "epoch": 2794} {"train_loss": -24.493703842163086, "global_step": 231906, "epoch": 2794} {"train_loss": -24.341236114501953, "global_step": 231907, "epoch": 2794} {"train_loss": -24.455413818359375, "global_step": 231908, "epoch": 2794} {"train_loss": -24.807153701782227, "global_step": 231909, "epoch": 2794} {"train_loss": -24.386280059814453, "global_step": 231910, "epoch": 2794} {"train_loss": -24.78789710998535, "global_step": 231911, "epoch": 2794} {"train_loss": -24.614429473876953, "global_step": 231912, "epoch": 2794} {"train_loss": -24.659290313720703, "global_step": 231913, "epoch": 2794} {"train_loss": -25.10885238647461, "global_step": 231914, "epoch": 2794} {"train_loss": -24.615127563476562, "global_step": 231915, "epoch": 2794} {"train_loss": -24.64253807067871, "global_step": 231916, "epoch": 2794} {"train_loss": -25.051420211791992, "global_step": 231917, "epoch": 2794} {"train_loss": -24.613391876220703, "global_step": 231918, "epoch": 2794} {"train_loss": -24.37103271484375, "global_step": 231919, "epoch": 2794} {"train_loss": -24.730382919311523, "global_step": 231920, "epoch": 2794} {"train_loss": -24.59901237487793, "global_step": 231921, "epoch": 2794} {"train_loss": -24.729578018188477, "global_step": 231922, "epoch": 2794} {"train_loss": -24.990447998046875, "global_step": 231923, "epoch": 2794} {"train_loss": -24.717626571655273, "global_step": 231924, "epoch": 2794} {"train_loss": -24.6805419921875, "global_step": 231925, "epoch": 2794} {"train_loss": -25.041959762573242, "global_step": 231926, "epoch": 2794} {"train_loss": -24.574630737304688, "global_step": 231927, "epoch": 2794} {"train_loss": -24.69063377380371, "global_step": 231928, "epoch": 2794} {"train_loss": -24.97652244567871, "global_step": 231929, "epoch": 2794} {"train_loss": -24.563175201416016, "global_step": 231930, "epoch": 2794} {"train_loss": -24.6389217376709, "global_step": 231931, "epoch": 2794} {"train_loss": -24.58846664428711, "global_step": 231932, "epoch": 2794} {"train_loss": -24.52389907836914, "global_step": 231933, "epoch": 2794} {"train_loss": -25.006093978881836, "global_step": 231934, "epoch": 2794} {"train_loss": -24.2786922454834, "global_step": 231935, "epoch": 2794} {"train_loss": -24.651147842407227, "global_step": 231936, "epoch": 2794} {"train_loss": -24.785123825073242, "global_step": 231937, "epoch": 2794} {"train_loss": -24.71773338317871, "global_step": 231938, "epoch": 2794} {"train_loss": -24.933469772338867, "global_step": 231939, "epoch": 2794} {"train_loss": -24.875818252563477, "global_step": 231940, "epoch": 2794} {"train_loss": -25.120054244995117, "global_step": 231941, "epoch": 2794} {"train_loss": -24.614656448364258, "global_step": 231942, "epoch": 2794} {"train_loss": -24.939271926879883, "global_step": 231943, "epoch": 2794} {"train_loss": -25.05224609375, "global_step": 231944, "epoch": 2794} {"train_loss": -24.684375762939453, "global_step": 231945, "epoch": 2794} {"train_loss": -24.959871292114258, "global_step": 231946, "epoch": 2794} {"train_loss": -24.81591796875, "global_step": 231947, "epoch": 2794} {"train_loss": -24.261062622070312, "global_step": 231948, "epoch": 2794} {"train_loss": -24.698108673095703, "global_step": 231949, "epoch": 2794} {"train_loss": -24.698902130126953, "global_step": 231950, "epoch": 2794} {"train_loss": -24.85683822631836, "global_step": 231951, "epoch": 2794} {"train_loss": -24.382041931152344, "global_step": 231952, "epoch": 2794} {"train_loss": -24.772933959960938, "global_step": 231953, "epoch": 2794} {"train_loss": -24.625329971313477, "global_step": 231954, "epoch": 2794} {"train_loss": -24.931657791137695, "global_step": 231955, "epoch": 2794} {"train_loss": -24.835664749145508, "global_step": 231956, "epoch": 2794} {"train_loss": -24.600317001342773, "global_step": 231957, "epoch": 2794} {"train_loss": -24.5585994720459, "global_step": 231958, "epoch": 2794} {"train_loss": -24.45865821838379, "global_step": 231959, "epoch": 2794} {"train_loss": -24.62060546875, "global_step": 231960, "epoch": 2794} {"train_loss": -24.392797470092773, "global_step": 231961, "epoch": 2794} {"train_loss": -24.5673885345459, "global_step": 231962, "epoch": 2794} {"train_loss": -25.1414852142334, "global_step": 231963, "epoch": 2794} {"train_loss": -24.646568298339844, "global_step": 231964, "epoch": 2794} {"train_loss": -24.681644439697266, "global_step": 231965, "epoch": 2794} {"train_loss": -24.81810760498047, "global_step": 231966, "epoch": 2794} {"train_loss": -24.842924118041992, "global_step": 231967, "epoch": 2794} {"train_loss": -24.965002059936523, "global_step": 231968, "epoch": 2794} {"train_loss": -24.788671493530273, "global_step": 231969, "epoch": 2794} {"train_loss": -25.036191940307617, "global_step": 231970, "epoch": 2794} {"train_loss": -25.089981079101562, "global_step": 231971, "epoch": 2794} {"train_loss": -24.637897491455078, "global_step": 231972, "epoch": 2794} {"train_loss": -24.608631134033203, "global_step": 231973, "epoch": 2794} {"train_loss": -25.054067611694336, "global_step": 231974, "epoch": 2794} {"train_loss": -24.470748901367188, "global_step": 231975, "epoch": 2794} {"train_loss": -24.655805587768555, "global_step": 231976, "epoch": 2794} {"train_loss": -25.1624813079834, "global_step": 231977, "epoch": 2794} {"train_loss": -24.80242919921875, "global_step": 231978, "epoch": 2794} {"train_loss": -24.885459899902344, "global_step": 231979, "epoch": 2794} {"train_loss": -24.640640258789062, "global_step": 231980, "epoch": 2794} {"train_loss": -24.893903732299805, "global_step": 231981, "epoch": 2794} {"train_loss": -24.50957679748535, "global_step": 231982, "epoch": 2794} {"train_loss": -24.79360008239746, "global_step": 231983, "epoch": 2794} {"train_loss": -24.715323574571723, "global_step": 231984, "epoch": 2794, "val_loss": 6737967.0} {"train_loss": -24.082969665527344, "global_step": 231985, "epoch": 2795} {"train_loss": -23.593158721923828, "global_step": 231986, "epoch": 2795} {"train_loss": -23.794179916381836, "global_step": 231987, "epoch": 2795} {"train_loss": -23.981674194335938, "global_step": 231988, "epoch": 2795} {"train_loss": -24.048398971557617, "global_step": 231989, "epoch": 2795} {"train_loss": -23.29286766052246, "global_step": 231990, "epoch": 2795} {"train_loss": -24.45563316345215, "global_step": 231991, "epoch": 2795} {"train_loss": -23.762271881103516, "global_step": 231992, "epoch": 2795} {"train_loss": -23.722084045410156, "global_step": 231993, "epoch": 2795} {"train_loss": -23.738847732543945, "global_step": 231994, "epoch": 2795} {"train_loss": -24.2721004486084, "global_step": 231995, "epoch": 2795} {"train_loss": -23.799964904785156, "global_step": 231996, "epoch": 2795} {"train_loss": -24.315799713134766, "global_step": 231997, "epoch": 2795} {"train_loss": -24.596036911010742, "global_step": 231998, "epoch": 2795} {"train_loss": -24.58360481262207, "global_step": 231999, "epoch": 2795} {"train_loss": -24.505613327026367, "global_step": 232000, "epoch": 2795} {"train_loss": -23.78110694885254, "global_step": 232001, "epoch": 2795} {"train_loss": -24.23280906677246, "global_step": 232002, "epoch": 2795} {"train_loss": -24.206226348876953, "global_step": 232003, "epoch": 2795} {"train_loss": -24.24591636657715, "global_step": 232004, "epoch": 2795} {"train_loss": -24.265470504760742, "global_step": 232005, "epoch": 2795} {"train_loss": -24.47999382019043, "global_step": 232006, "epoch": 2795} {"train_loss": -24.357648849487305, "global_step": 232007, "epoch": 2795} {"train_loss": -24.690656661987305, "global_step": 232008, "epoch": 2795} {"train_loss": -24.354448318481445, "global_step": 232009, "epoch": 2795} {"train_loss": -24.950523376464844, "global_step": 232010, "epoch": 2795} {"train_loss": -24.5047607421875, "global_step": 232011, "epoch": 2795} {"train_loss": -24.986492156982422, "global_step": 232012, "epoch": 2795} {"train_loss": -24.47429847717285, "global_step": 232013, "epoch": 2795} {"train_loss": -24.689725875854492, "global_step": 232014, "epoch": 2795} {"train_loss": -24.483434677124023, "global_step": 232015, "epoch": 2795} {"train_loss": -24.688894271850586, "global_step": 232016, "epoch": 2795} {"train_loss": -24.63839340209961, "global_step": 232017, "epoch": 2795} {"train_loss": -24.836219787597656, "global_step": 232018, "epoch": 2795} {"train_loss": -24.747610092163086, "global_step": 232019, "epoch": 2795} {"train_loss": -25.037038803100586, "global_step": 232020, "epoch": 2795} {"train_loss": -24.851499557495117, "global_step": 232021, "epoch": 2795} {"train_loss": -24.60185432434082, "global_step": 232022, "epoch": 2795} {"train_loss": -24.50005531311035, "global_step": 232023, "epoch": 2795} {"train_loss": -24.776901245117188, "global_step": 232024, "epoch": 2795} {"train_loss": -24.804487228393555, "global_step": 232025, "epoch": 2795} {"train_loss": -24.679601669311523, "global_step": 232026, "epoch": 2795} {"train_loss": -24.55742835998535, "global_step": 232027, "epoch": 2795} {"train_loss": -24.914432525634766, "global_step": 232028, "epoch": 2795} {"train_loss": -24.862272262573242, "global_step": 232029, "epoch": 2795} {"train_loss": -24.80232810974121, "global_step": 232030, "epoch": 2795} {"train_loss": -24.937742233276367, "global_step": 232031, "epoch": 2795} {"train_loss": -24.95789909362793, "global_step": 232032, "epoch": 2795} {"train_loss": -24.24835777282715, "global_step": 232033, "epoch": 2795} {"train_loss": -25.2733154296875, "global_step": 232034, "epoch": 2795} {"train_loss": -24.942914962768555, "global_step": 232035, "epoch": 2795} {"train_loss": -25.16431999206543, "global_step": 232036, "epoch": 2795} {"train_loss": -24.834867477416992, "global_step": 232037, "epoch": 2795} {"train_loss": -24.821083068847656, "global_step": 232038, "epoch": 2795} {"train_loss": -24.997297286987305, "global_step": 232039, "epoch": 2795} {"train_loss": -24.78858184814453, "global_step": 232040, "epoch": 2795} {"train_loss": -24.797101974487305, "global_step": 232041, "epoch": 2795} {"train_loss": -25.07944107055664, "global_step": 232042, "epoch": 2795} {"train_loss": -24.657718658447266, "global_step": 232043, "epoch": 2795} {"train_loss": -24.483747482299805, "global_step": 232044, "epoch": 2795} {"train_loss": -24.627134323120117, "global_step": 232045, "epoch": 2795} {"train_loss": -24.758955001831055, "global_step": 232046, "epoch": 2795} {"train_loss": -24.61846351623535, "global_step": 232047, "epoch": 2795} {"train_loss": -24.639480590820312, "global_step": 232048, "epoch": 2795} {"train_loss": -25.193445205688477, "global_step": 232049, "epoch": 2795} {"train_loss": -24.506879806518555, "global_step": 232050, "epoch": 2795} {"train_loss": -24.82497787475586, "global_step": 232051, "epoch": 2795} {"train_loss": -25.047880172729492, "global_step": 232052, "epoch": 2795} {"train_loss": -24.592924118041992, "global_step": 232053, "epoch": 2795} {"train_loss": -25.203563690185547, "global_step": 232054, "epoch": 2795} {"train_loss": -24.965768814086914, "global_step": 232055, "epoch": 2795} {"train_loss": -24.83310890197754, "global_step": 232056, "epoch": 2795} {"train_loss": -24.861902236938477, "global_step": 232057, "epoch": 2795} {"train_loss": -24.86690330505371, "global_step": 232058, "epoch": 2795} {"train_loss": -25.127389907836914, "global_step": 232059, "epoch": 2795} {"train_loss": -24.978424072265625, "global_step": 232060, "epoch": 2795} {"train_loss": -24.816913604736328, "global_step": 232061, "epoch": 2795} {"train_loss": -25.06294822692871, "global_step": 232062, "epoch": 2795} {"train_loss": -25.220975875854492, "global_step": 232063, "epoch": 2795} {"train_loss": -25.337522506713867, "global_step": 232064, "epoch": 2795} {"train_loss": -25.009593963623047, "global_step": 232065, "epoch": 2795} {"train_loss": -24.957448959350586, "global_step": 232066, "epoch": 2795} {"train_loss": -24.630367554813983, "global_step": 232067, "epoch": 2795, "val_loss": 6747756.0} {"train_loss": -24.604537963867188, "global_step": 232068, "epoch": 2796} {"train_loss": -24.76926612854004, "global_step": 232069, "epoch": 2796} {"train_loss": -24.38871192932129, "global_step": 232070, "epoch": 2796} {"train_loss": -24.93465232849121, "global_step": 232071, "epoch": 2796} {"train_loss": -24.6287841796875, "global_step": 232072, "epoch": 2796} {"train_loss": -24.734506607055664, "global_step": 232073, "epoch": 2796} {"train_loss": -24.630603790283203, "global_step": 232074, "epoch": 2796} {"train_loss": -24.58281707763672, "global_step": 232075, "epoch": 2796} {"train_loss": -24.833953857421875, "global_step": 232076, "epoch": 2796} {"train_loss": -24.5643367767334, "global_step": 232077, "epoch": 2796} {"train_loss": -24.532426834106445, "global_step": 232078, "epoch": 2796} {"train_loss": -24.66570281982422, "global_step": 232079, "epoch": 2796} {"train_loss": -24.788772583007812, "global_step": 232080, "epoch": 2796} {"train_loss": -24.722122192382812, "global_step": 232081, "epoch": 2796} {"train_loss": -24.330114364624023, "global_step": 232082, "epoch": 2796} {"train_loss": -24.744489669799805, "global_step": 232083, "epoch": 2796} {"train_loss": -24.64433479309082, "global_step": 232084, "epoch": 2796} {"train_loss": -24.865114212036133, "global_step": 232085, "epoch": 2796} {"train_loss": -24.90217399597168, "global_step": 232086, "epoch": 2796} {"train_loss": -24.663564682006836, "global_step": 232087, "epoch": 2796} {"train_loss": -24.848623275756836, "global_step": 232088, "epoch": 2796} {"train_loss": -24.840715408325195, "global_step": 232089, "epoch": 2796} {"train_loss": -24.848920822143555, "global_step": 232090, "epoch": 2796} {"train_loss": -24.879722595214844, "global_step": 232091, "epoch": 2796} {"train_loss": -24.90976905822754, "global_step": 232092, "epoch": 2796} {"train_loss": -25.426145553588867, "global_step": 232093, "epoch": 2796} {"train_loss": -24.64510154724121, "global_step": 232094, "epoch": 2796} {"train_loss": -24.790491104125977, "global_step": 232095, "epoch": 2796} {"train_loss": -24.994001388549805, "global_step": 232096, "epoch": 2796} {"train_loss": -24.956464767456055, "global_step": 232097, "epoch": 2796} {"train_loss": -24.966201782226562, "global_step": 232098, "epoch": 2796} {"train_loss": -24.7589054107666, "global_step": 232099, "epoch": 2796} {"train_loss": -24.908222198486328, "global_step": 232100, "epoch": 2796} {"train_loss": -25.33379554748535, "global_step": 232101, "epoch": 2796} {"train_loss": -24.836883544921875, "global_step": 232102, "epoch": 2796} {"train_loss": -24.991811752319336, "global_step": 232103, "epoch": 2796} {"train_loss": -24.9434871673584, "global_step": 232104, "epoch": 2796} {"train_loss": -24.56353187561035, "global_step": 232105, "epoch": 2796} {"train_loss": -24.54903221130371, "global_step": 232106, "epoch": 2796} {"train_loss": -24.769521713256836, "global_step": 232107, "epoch": 2796} {"train_loss": -25.002025604248047, "global_step": 232108, "epoch": 2796} {"train_loss": -24.3325252532959, "global_step": 232109, "epoch": 2796} {"train_loss": -24.031200408935547, "global_step": 232110, "epoch": 2796} {"train_loss": -24.28724479675293, "global_step": 232111, "epoch": 2796} {"train_loss": -24.433839797973633, "global_step": 232112, "epoch": 2796} {"train_loss": -24.620452880859375, "global_step": 232113, "epoch": 2796} {"train_loss": -24.880048751831055, "global_step": 232114, "epoch": 2796} {"train_loss": -24.418201446533203, "global_step": 232115, "epoch": 2796} {"train_loss": -24.876951217651367, "global_step": 232116, "epoch": 2796} {"train_loss": -24.683332443237305, "global_step": 232117, "epoch": 2796} {"train_loss": -24.800687789916992, "global_step": 232118, "epoch": 2796} {"train_loss": -24.539220809936523, "global_step": 232119, "epoch": 2796} {"train_loss": -24.887426376342773, "global_step": 232120, "epoch": 2796} {"train_loss": -24.694143295288086, "global_step": 232121, "epoch": 2796} {"train_loss": -24.970434188842773, "global_step": 232122, "epoch": 2796} {"train_loss": -24.735416412353516, "global_step": 232123, "epoch": 2796} {"train_loss": -24.900354385375977, "global_step": 232124, "epoch": 2796} {"train_loss": -24.35594940185547, "global_step": 232125, "epoch": 2796} {"train_loss": -24.65716552734375, "global_step": 232126, "epoch": 2796} {"train_loss": -24.78179931640625, "global_step": 232127, "epoch": 2796} {"train_loss": -24.741230010986328, "global_step": 232128, "epoch": 2796} {"train_loss": -24.806976318359375, "global_step": 232129, "epoch": 2796} {"train_loss": -24.65652084350586, "global_step": 232130, "epoch": 2796} {"train_loss": -24.681821823120117, "global_step": 232131, "epoch": 2796} {"train_loss": -24.754724502563477, "global_step": 232132, "epoch": 2796} {"train_loss": -24.53607177734375, "global_step": 232133, "epoch": 2796} {"train_loss": -24.321279525756836, "global_step": 232134, "epoch": 2796} {"train_loss": -25.205175399780273, "global_step": 232135, "epoch": 2796} {"train_loss": -25.156936645507812, "global_step": 232136, "epoch": 2796} {"train_loss": -24.8001651763916, "global_step": 232137, "epoch": 2796} {"train_loss": -24.715328216552734, "global_step": 232138, "epoch": 2796} {"train_loss": -24.66013526916504, "global_step": 232139, "epoch": 2796} {"train_loss": -24.563034057617188, "global_step": 232140, "epoch": 2796} {"train_loss": -24.906570434570312, "global_step": 232141, "epoch": 2796} {"train_loss": -25.147855758666992, "global_step": 232142, "epoch": 2796} {"train_loss": -24.959243774414062, "global_step": 232143, "epoch": 2796} {"train_loss": -24.79292869567871, "global_step": 232144, "epoch": 2796} {"train_loss": -25.10883140563965, "global_step": 232145, "epoch": 2796} {"train_loss": -25.05033302307129, "global_step": 232146, "epoch": 2796} {"train_loss": -24.722209930419922, "global_step": 232147, "epoch": 2796} {"train_loss": -24.609180450439453, "global_step": 232148, "epoch": 2796} {"train_loss": -24.57672119140625, "global_step": 232149, "epoch": 2796} {"train_loss": -24.74559671333037, "global_step": 232150, "epoch": 2796, "val_loss": 6854084.5} {"train_loss": -23.48102569580078, "global_step": 232151, "epoch": 2797} {"train_loss": -22.5783748626709, "global_step": 232152, "epoch": 2797} {"train_loss": -23.5632381439209, "global_step": 232153, "epoch": 2797} {"train_loss": -23.949569702148438, "global_step": 232154, "epoch": 2797} {"train_loss": -22.733104705810547, "global_step": 232155, "epoch": 2797} {"train_loss": -24.100112915039062, "global_step": 232156, "epoch": 2797} {"train_loss": -23.458486557006836, "global_step": 232157, "epoch": 2797} {"train_loss": -24.384937286376953, "global_step": 232158, "epoch": 2797} {"train_loss": -23.533763885498047, "global_step": 232159, "epoch": 2797} {"train_loss": -23.979381561279297, "global_step": 232160, "epoch": 2797} {"train_loss": -23.67806053161621, "global_step": 232161, "epoch": 2797} {"train_loss": -23.997262954711914, "global_step": 232162, "epoch": 2797} {"train_loss": -23.825428009033203, "global_step": 232163, "epoch": 2797} {"train_loss": -24.130962371826172, "global_step": 232164, "epoch": 2797} {"train_loss": -24.2806453704834, "global_step": 232165, "epoch": 2797} {"train_loss": -23.761579513549805, "global_step": 232166, "epoch": 2797} {"train_loss": -23.880550384521484, "global_step": 232167, "epoch": 2797} {"train_loss": -24.06266975402832, "global_step": 232168, "epoch": 2797} {"train_loss": -24.316770553588867, "global_step": 232169, "epoch": 2797} {"train_loss": -23.990806579589844, "global_step": 232170, "epoch": 2797} {"train_loss": -24.442352294921875, "global_step": 232171, "epoch": 2797} {"train_loss": -24.399560928344727, "global_step": 232172, "epoch": 2797} {"train_loss": -24.2476806640625, "global_step": 232173, "epoch": 2797} {"train_loss": -24.23636245727539, "global_step": 232174, "epoch": 2797} {"train_loss": -24.327363967895508, "global_step": 232175, "epoch": 2797} {"train_loss": -24.45917320251465, "global_step": 232176, "epoch": 2797} {"train_loss": -24.580699920654297, "global_step": 232177, "epoch": 2797} {"train_loss": -24.29218101501465, "global_step": 232178, "epoch": 2797} {"train_loss": -24.397489547729492, "global_step": 232179, "epoch": 2797} {"train_loss": -24.560022354125977, "global_step": 232180, "epoch": 2797} {"train_loss": -24.877422332763672, "global_step": 232181, "epoch": 2797} {"train_loss": -24.643579483032227, "global_step": 232182, "epoch": 2797} {"train_loss": -24.507482528686523, "global_step": 232183, "epoch": 2797} {"train_loss": -24.712738037109375, "global_step": 232184, "epoch": 2797} {"train_loss": -24.28019142150879, "global_step": 232185, "epoch": 2797} {"train_loss": -24.402997970581055, "global_step": 232186, "epoch": 2797} {"train_loss": -24.80311393737793, "global_step": 232187, "epoch": 2797} {"train_loss": -24.623109817504883, "global_step": 232188, "epoch": 2797} {"train_loss": -24.71626091003418, "global_step": 232189, "epoch": 2797} {"train_loss": -24.758451461791992, "global_step": 232190, "epoch": 2797} {"train_loss": -24.586881637573242, "global_step": 232191, "epoch": 2797} {"train_loss": -24.478534698486328, "global_step": 232192, "epoch": 2797} {"train_loss": -24.890649795532227, "global_step": 232193, "epoch": 2797} {"train_loss": -24.880311965942383, "global_step": 232194, "epoch": 2797} {"train_loss": -24.630136489868164, "global_step": 232195, "epoch": 2797} {"train_loss": -24.609695434570312, "global_step": 232196, "epoch": 2797} {"train_loss": -24.863149642944336, "global_step": 232197, "epoch": 2797} {"train_loss": -25.05575942993164, "global_step": 232198, "epoch": 2797} {"train_loss": -24.811525344848633, "global_step": 232199, "epoch": 2797} {"train_loss": -24.92892837524414, "global_step": 232200, "epoch": 2797} {"train_loss": -25.00606346130371, "global_step": 232201, "epoch": 2797} {"train_loss": -25.184558868408203, "global_step": 232202, "epoch": 2797} {"train_loss": -25.15435791015625, "global_step": 232203, "epoch": 2797} {"train_loss": -24.728214263916016, "global_step": 232204, "epoch": 2797} {"train_loss": -25.133668899536133, "global_step": 232205, "epoch": 2797} {"train_loss": -24.594852447509766, "global_step": 232206, "epoch": 2797} {"train_loss": -24.840784072875977, "global_step": 232207, "epoch": 2797} {"train_loss": -24.885465621948242, "global_step": 232208, "epoch": 2797} {"train_loss": -25.103031158447266, "global_step": 232209, "epoch": 2797} {"train_loss": -24.903661727905273, "global_step": 232210, "epoch": 2797} {"train_loss": -24.641042709350586, "global_step": 232211, "epoch": 2797} {"train_loss": -24.58160972595215, "global_step": 232212, "epoch": 2797} {"train_loss": -24.397960662841797, "global_step": 232213, "epoch": 2797} {"train_loss": -24.71378517150879, "global_step": 232214, "epoch": 2797} {"train_loss": -24.859907150268555, "global_step": 232215, "epoch": 2797} {"train_loss": -24.963706970214844, "global_step": 232216, "epoch": 2797} {"train_loss": -24.914264678955078, "global_step": 232217, "epoch": 2797} {"train_loss": -24.858022689819336, "global_step": 232218, "epoch": 2797} {"train_loss": -24.71424102783203, "global_step": 232219, "epoch": 2797} {"train_loss": -24.57695770263672, "global_step": 232220, "epoch": 2797} {"train_loss": -24.962839126586914, "global_step": 232221, "epoch": 2797} {"train_loss": -24.884552001953125, "global_step": 232222, "epoch": 2797} {"train_loss": -24.618637084960938, "global_step": 232223, "epoch": 2797} {"train_loss": -24.756698608398438, "global_step": 232224, "epoch": 2797} {"train_loss": -24.953149795532227, "global_step": 232225, "epoch": 2797} {"train_loss": -24.71327018737793, "global_step": 232226, "epoch": 2797} {"train_loss": -24.747106552124023, "global_step": 232227, "epoch": 2797} {"train_loss": -24.942291259765625, "global_step": 232228, "epoch": 2797} {"train_loss": -25.009841918945312, "global_step": 232229, "epoch": 2797} {"train_loss": -24.631305694580078, "global_step": 232230, "epoch": 2797} {"train_loss": -24.71502113342285, "global_step": 232231, "epoch": 2797} {"train_loss": -24.574018478393555, "global_step": 232232, "epoch": 2797} {"train_loss": -24.507064175893024, "global_step": 232233, "epoch": 2797, "val_loss": 6770741.0} {"train_loss": -24.319990158081055, "global_step": 232234, "epoch": 2798} {"train_loss": -24.34311866760254, "global_step": 232235, "epoch": 2798} {"train_loss": -24.792831420898438, "global_step": 232236, "epoch": 2798} {"train_loss": -24.129919052124023, "global_step": 232237, "epoch": 2798} {"train_loss": -24.552167892456055, "global_step": 232238, "epoch": 2798} {"train_loss": -24.3033447265625, "global_step": 232239, "epoch": 2798} {"train_loss": -24.632156372070312, "global_step": 232240, "epoch": 2798} {"train_loss": -24.951658248901367, "global_step": 232241, "epoch": 2798} {"train_loss": -24.663759231567383, "global_step": 232242, "epoch": 2798} {"train_loss": -24.4140567779541, "global_step": 232243, "epoch": 2798} {"train_loss": -25.27065086364746, "global_step": 232244, "epoch": 2798} {"train_loss": -24.185184478759766, "global_step": 232245, "epoch": 2798} {"train_loss": -24.73986053466797, "global_step": 232246, "epoch": 2798} {"train_loss": -24.676664352416992, "global_step": 232247, "epoch": 2798} {"train_loss": -24.350149154663086, "global_step": 232248, "epoch": 2798} {"train_loss": -24.199817657470703, "global_step": 232249, "epoch": 2798} {"train_loss": -24.629501342773438, "global_step": 232250, "epoch": 2798} {"train_loss": -24.628992080688477, "global_step": 232251, "epoch": 2798} {"train_loss": -24.261741638183594, "global_step": 232252, "epoch": 2798} {"train_loss": -24.480375289916992, "global_step": 232253, "epoch": 2798} {"train_loss": -24.915884017944336, "global_step": 232254, "epoch": 2798} {"train_loss": -24.80997657775879, "global_step": 232255, "epoch": 2798} {"train_loss": -24.606855392456055, "global_step": 232256, "epoch": 2798} {"train_loss": -24.716297149658203, "global_step": 232257, "epoch": 2798} {"train_loss": -24.513242721557617, "global_step": 232258, "epoch": 2798} {"train_loss": -24.713178634643555, "global_step": 232259, "epoch": 2798} {"train_loss": -24.554723739624023, "global_step": 232260, "epoch": 2798} {"train_loss": -24.770221710205078, "global_step": 232261, "epoch": 2798} {"train_loss": -24.187509536743164, "global_step": 232262, "epoch": 2798} {"train_loss": -24.35759735107422, "global_step": 232263, "epoch": 2798} {"train_loss": -24.774887084960938, "global_step": 232264, "epoch": 2798} {"train_loss": -24.656850814819336, "global_step": 232265, "epoch": 2798} {"train_loss": -25.158945083618164, "global_step": 232266, "epoch": 2798} {"train_loss": -24.99968147277832, "global_step": 232267, "epoch": 2798} {"train_loss": -24.736000061035156, "global_step": 232268, "epoch": 2798} {"train_loss": -24.680883407592773, "global_step": 232269, "epoch": 2798} {"train_loss": -25.143083572387695, "global_step": 232270, "epoch": 2798} {"train_loss": -24.483078002929688, "global_step": 232271, "epoch": 2798} {"train_loss": -24.905508041381836, "global_step": 232272, "epoch": 2798} {"train_loss": -24.858097076416016, "global_step": 232273, "epoch": 2798} {"train_loss": -24.951448440551758, "global_step": 232274, "epoch": 2798} {"train_loss": -24.729110717773438, "global_step": 232275, "epoch": 2798} {"train_loss": -24.848543167114258, "global_step": 232276, "epoch": 2798} {"train_loss": -24.708372116088867, "global_step": 232277, "epoch": 2798} {"train_loss": -24.999597549438477, "global_step": 232278, "epoch": 2798} {"train_loss": -24.9581241607666, "global_step": 232279, "epoch": 2798} {"train_loss": -25.023160934448242, "global_step": 232280, "epoch": 2798} {"train_loss": -24.670211791992188, "global_step": 232281, "epoch": 2798} {"train_loss": -24.88445281982422, "global_step": 232282, "epoch": 2798} {"train_loss": -24.839874267578125, "global_step": 232283, "epoch": 2798} {"train_loss": -24.662260055541992, "global_step": 232284, "epoch": 2798} {"train_loss": -24.704635620117188, "global_step": 232285, "epoch": 2798} {"train_loss": -24.715951919555664, "global_step": 232286, "epoch": 2798} {"train_loss": -25.0257625579834, "global_step": 232287, "epoch": 2798} {"train_loss": -25.015655517578125, "global_step": 232288, "epoch": 2798} {"train_loss": -24.96359634399414, "global_step": 232289, "epoch": 2798} {"train_loss": -25.010330200195312, "global_step": 232290, "epoch": 2798} {"train_loss": -24.608051300048828, "global_step": 232291, "epoch": 2798} {"train_loss": -24.883975982666016, "global_step": 232292, "epoch": 2798} {"train_loss": -25.214088439941406, "global_step": 232293, "epoch": 2798} {"train_loss": -24.99906349182129, "global_step": 232294, "epoch": 2798} {"train_loss": -24.73432731628418, "global_step": 232295, "epoch": 2798} {"train_loss": -25.00499725341797, "global_step": 232296, "epoch": 2798} {"train_loss": -24.876829147338867, "global_step": 232297, "epoch": 2798} {"train_loss": -25.04988670349121, "global_step": 232298, "epoch": 2798} {"train_loss": -24.89554214477539, "global_step": 232299, "epoch": 2798} {"train_loss": -24.648351669311523, "global_step": 232300, "epoch": 2798} {"train_loss": -24.55633544921875, "global_step": 232301, "epoch": 2798} {"train_loss": -24.981800079345703, "global_step": 232302, "epoch": 2798} {"train_loss": -24.83562660217285, "global_step": 232303, "epoch": 2798} {"train_loss": -25.06245231628418, "global_step": 232304, "epoch": 2798} {"train_loss": -25.020261764526367, "global_step": 232305, "epoch": 2798} {"train_loss": -24.90552520751953, "global_step": 232306, "epoch": 2798} {"train_loss": -24.63681983947754, "global_step": 232307, "epoch": 2798} {"train_loss": -24.681203842163086, "global_step": 232308, "epoch": 2798} {"train_loss": -24.467329025268555, "global_step": 232309, "epoch": 2798} {"train_loss": -24.758996963500977, "global_step": 232310, "epoch": 2798} {"train_loss": -24.874008178710938, "global_step": 232311, "epoch": 2798} {"train_loss": -24.95880126953125, "global_step": 232312, "epoch": 2798} {"train_loss": -25.1195125579834, "global_step": 232313, "epoch": 2798} {"train_loss": -24.665422439575195, "global_step": 232314, "epoch": 2798} {"train_loss": -24.588016510009766, "global_step": 232315, "epoch": 2798} {"train_loss": -24.75360399269196, "global_step": 232316, "epoch": 2798, "val_loss": 6787926.0} {"train_loss": -22.70269203186035, "global_step": 232317, "epoch": 2799} {"train_loss": -23.215591430664062, "global_step": 232318, "epoch": 2799} {"train_loss": -23.47462272644043, "global_step": 232319, "epoch": 2799} {"train_loss": -23.978513717651367, "global_step": 232320, "epoch": 2799} {"train_loss": -24.00849723815918, "global_step": 232321, "epoch": 2799} {"train_loss": -24.09608268737793, "global_step": 232322, "epoch": 2799} {"train_loss": -24.102886199951172, "global_step": 232323, "epoch": 2799} {"train_loss": -23.87586784362793, "global_step": 232324, "epoch": 2799} {"train_loss": -24.19136619567871, "global_step": 232325, "epoch": 2799} {"train_loss": -24.326663970947266, "global_step": 232326, "epoch": 2799} {"train_loss": -24.2827205657959, "global_step": 232327, "epoch": 2799} {"train_loss": -24.332372665405273, "global_step": 232328, "epoch": 2799} {"train_loss": -24.491436004638672, "global_step": 232329, "epoch": 2799} {"train_loss": -24.403038024902344, "global_step": 232330, "epoch": 2799} {"train_loss": -24.285974502563477, "global_step": 232331, "epoch": 2799} {"train_loss": -24.356616973876953, "global_step": 232332, "epoch": 2799} {"train_loss": -24.714111328125, "global_step": 232333, "epoch": 2799} {"train_loss": -24.5778751373291, "global_step": 232334, "epoch": 2799} {"train_loss": -24.72601890563965, "global_step": 232335, "epoch": 2799} {"train_loss": -24.61026382446289, "global_step": 232336, "epoch": 2799} {"train_loss": -24.660825729370117, "global_step": 232337, "epoch": 2799} {"train_loss": -24.453968048095703, "global_step": 232338, "epoch": 2799} {"train_loss": -25.04973030090332, "global_step": 232339, "epoch": 2799} {"train_loss": -24.7243709564209, "global_step": 232340, "epoch": 2799} {"train_loss": -24.58344078063965, "global_step": 232341, "epoch": 2799} {"train_loss": -24.56498146057129, "global_step": 232342, "epoch": 2799} {"train_loss": -24.63985252380371, "global_step": 232343, "epoch": 2799} {"train_loss": -24.363569259643555, "global_step": 232344, "epoch": 2799} {"train_loss": -24.713876724243164, "global_step": 232345, "epoch": 2799} {"train_loss": -24.62078857421875, "global_step": 232346, "epoch": 2799} {"train_loss": -24.508472442626953, "global_step": 232347, "epoch": 2799} {"train_loss": -24.580265045166016, "global_step": 232348, "epoch": 2799} {"train_loss": -24.877765655517578, "global_step": 232349, "epoch": 2799} {"train_loss": -24.88715171813965, "global_step": 232350, "epoch": 2799} {"train_loss": -24.897855758666992, "global_step": 232351, "epoch": 2799} {"train_loss": -24.598114013671875, "global_step": 232352, "epoch": 2799} {"train_loss": -24.757661819458008, "global_step": 232353, "epoch": 2799} {"train_loss": -24.917654037475586, "global_step": 232354, "epoch": 2799} {"train_loss": -25.05027198791504, "global_step": 232355, "epoch": 2799} {"train_loss": -24.806787490844727, "global_step": 232356, "epoch": 2799} {"train_loss": -24.764318466186523, "global_step": 232357, "epoch": 2799} {"train_loss": -25.043203353881836, "global_step": 232358, "epoch": 2799} {"train_loss": -24.676105499267578, "global_step": 232359, "epoch": 2799} {"train_loss": -24.937448501586914, "global_step": 232360, "epoch": 2799} {"train_loss": -25.04006004333496, "global_step": 232361, "epoch": 2799} {"train_loss": -25.10658073425293, "global_step": 232362, "epoch": 2799} {"train_loss": -24.74861717224121, "global_step": 232363, "epoch": 2799} {"train_loss": -25.01099395751953, "global_step": 232364, "epoch": 2799} {"train_loss": -24.592729568481445, "global_step": 232365, "epoch": 2799} {"train_loss": -25.308298110961914, "global_step": 232366, "epoch": 2799} {"train_loss": -24.69382667541504, "global_step": 232367, "epoch": 2799} {"train_loss": -24.611942291259766, "global_step": 232368, "epoch": 2799} {"train_loss": -24.804508209228516, "global_step": 232369, "epoch": 2799} {"train_loss": -24.592147827148438, "global_step": 232370, "epoch": 2799} {"train_loss": -24.511075973510742, "global_step": 232371, "epoch": 2799} {"train_loss": -25.005084991455078, "global_step": 232372, "epoch": 2799} {"train_loss": -24.895828247070312, "global_step": 232373, "epoch": 2799} {"train_loss": -24.458669662475586, "global_step": 232374, "epoch": 2799} {"train_loss": -25.004499435424805, "global_step": 232375, "epoch": 2799} {"train_loss": -24.423282623291016, "global_step": 232376, "epoch": 2799} {"train_loss": -24.738901138305664, "global_step": 232377, "epoch": 2799} {"train_loss": -24.89832305908203, "global_step": 232378, "epoch": 2799} {"train_loss": -24.597333908081055, "global_step": 232379, "epoch": 2799} {"train_loss": -25.013811111450195, "global_step": 232380, "epoch": 2799} {"train_loss": -24.8479061126709, "global_step": 232381, "epoch": 2799} {"train_loss": -24.923994064331055, "global_step": 232382, "epoch": 2799} {"train_loss": -24.697662353515625, "global_step": 232383, "epoch": 2799} {"train_loss": -24.49175453186035, "global_step": 232384, "epoch": 2799} {"train_loss": -25.129867553710938, "global_step": 232385, "epoch": 2799} {"train_loss": -24.69270133972168, "global_step": 232386, "epoch": 2799} {"train_loss": -24.810213088989258, "global_step": 232387, "epoch": 2799} {"train_loss": -24.93617820739746, "global_step": 232388, "epoch": 2799} {"train_loss": -24.80675506591797, "global_step": 232389, "epoch": 2799} {"train_loss": -24.8511962890625, "global_step": 232390, "epoch": 2799} {"train_loss": -24.697525024414062, "global_step": 232391, "epoch": 2799} {"train_loss": -24.842269897460938, "global_step": 232392, "epoch": 2799} {"train_loss": -25.280813217163086, "global_step": 232393, "epoch": 2799} {"train_loss": -24.8974666595459, "global_step": 232394, "epoch": 2799} {"train_loss": -24.59614372253418, "global_step": 232395, "epoch": 2799} {"train_loss": -24.544815063476562, "global_step": 232396, "epoch": 2799} {"train_loss": -25.164413452148438, "global_step": 232397, "epoch": 2799} {"train_loss": -24.79775047302246, "global_step": 232398, "epoch": 2799} {"train_loss": -24.64314800859934, "global_step": 232399, "epoch": 2799, "val_loss": 6874666.0} {"train_loss": -24.631134033203125, "global_step": 232400, "epoch": 2800} {"train_loss": -24.045881271362305, "global_step": 232401, "epoch": 2800} {"train_loss": -24.812240600585938, "global_step": 232402, "epoch": 2800} {"train_loss": -24.508939743041992, "global_step": 232403, "epoch": 2800} {"train_loss": -24.693058013916016, "global_step": 232404, "epoch": 2800} {"train_loss": -24.376996994018555, "global_step": 232405, "epoch": 2800} {"train_loss": -24.32746124267578, "global_step": 232406, "epoch": 2800} {"train_loss": -25.017337799072266, "global_step": 232407, "epoch": 2800} {"train_loss": -24.559606552124023, "global_step": 232408, "epoch": 2800} {"train_loss": -24.53205680847168, "global_step": 232409, "epoch": 2800} {"train_loss": -24.221586227416992, "global_step": 232410, "epoch": 2800} {"train_loss": -25.01776695251465, "global_step": 232411, "epoch": 2800} {"train_loss": -24.5626163482666, "global_step": 232412, "epoch": 2800} {"train_loss": -24.596317291259766, "global_step": 232413, "epoch": 2800} {"train_loss": -24.6455135345459, "global_step": 232414, "epoch": 2800} {"train_loss": -24.741931915283203, "global_step": 232415, "epoch": 2800} {"train_loss": -24.80269432067871, "global_step": 232416, "epoch": 2800} {"train_loss": -24.94968032836914, "global_step": 232417, "epoch": 2800} {"train_loss": -24.713760375976562, "global_step": 232418, "epoch": 2800} {"train_loss": -24.9537410736084, "global_step": 232419, "epoch": 2800} {"train_loss": -24.771583557128906, "global_step": 232420, "epoch": 2800} {"train_loss": -24.863317489624023, "global_step": 232421, "epoch": 2800} {"train_loss": -24.762420654296875, "global_step": 232422, "epoch": 2800} {"train_loss": -25.203489303588867, "global_step": 232423, "epoch": 2800} {"train_loss": -25.12691307067871, "global_step": 232424, "epoch": 2800} {"train_loss": -24.818456649780273, "global_step": 232425, "epoch": 2800} {"train_loss": -24.975645065307617, "global_step": 232426, "epoch": 2800} {"train_loss": -24.800809860229492, "global_step": 232427, "epoch": 2800} {"train_loss": -24.47684669494629, "global_step": 232428, "epoch": 2800} {"train_loss": -24.673429489135742, "global_step": 232429, "epoch": 2800} {"train_loss": -24.699460983276367, "global_step": 232430, "epoch": 2800} {"train_loss": -24.836261749267578, "global_step": 232431, "epoch": 2800} {"train_loss": -24.458505630493164, "global_step": 232432, "epoch": 2800} {"train_loss": -25.142250061035156, "global_step": 232433, "epoch": 2800} {"train_loss": -24.717458724975586, "global_step": 232434, "epoch": 2800} {"train_loss": -25.112211227416992, "global_step": 232435, "epoch": 2800} {"train_loss": -24.688962936401367, "global_step": 232436, "epoch": 2800} {"train_loss": -24.76375389099121, "global_step": 232437, "epoch": 2800} {"train_loss": -24.813657760620117, "global_step": 232438, "epoch": 2800} {"train_loss": -24.99901008605957, "global_step": 232439, "epoch": 2800} {"train_loss": -24.958494186401367, "global_step": 232440, "epoch": 2800} {"train_loss": -24.905187606811523, "global_step": 232441, "epoch": 2800} {"train_loss": -24.759998321533203, "global_step": 232442, "epoch": 2800} {"train_loss": -24.766782760620117, "global_step": 232443, "epoch": 2800} {"train_loss": -24.767353057861328, "global_step": 232444, "epoch": 2800} {"train_loss": -24.03607177734375, "global_step": 232445, "epoch": 2800} {"train_loss": -24.495119094848633, "global_step": 232446, "epoch": 2800} {"train_loss": -25.160470962524414, "global_step": 232447, "epoch": 2800} {"train_loss": -24.417638778686523, "global_step": 232448, "epoch": 2800} {"train_loss": -25.054197311401367, "global_step": 232449, "epoch": 2800} {"train_loss": -24.3629150390625, "global_step": 232450, "epoch": 2800} {"train_loss": -24.721113204956055, "global_step": 232451, "epoch": 2800} {"train_loss": -24.607866287231445, "global_step": 232452, "epoch": 2800} {"train_loss": -24.621061325073242, "global_step": 232453, "epoch": 2800} {"train_loss": -24.59429359436035, "global_step": 232454, "epoch": 2800} {"train_loss": -24.762027740478516, "global_step": 232455, "epoch": 2800} {"train_loss": -24.444578170776367, "global_step": 232456, "epoch": 2800} {"train_loss": -24.55830955505371, "global_step": 232457, "epoch": 2800} {"train_loss": -24.685699462890625, "global_step": 232458, "epoch": 2800} {"train_loss": -24.873733520507812, "global_step": 232459, "epoch": 2800} {"train_loss": -24.55257225036621, "global_step": 232460, "epoch": 2800} {"train_loss": -24.898475646972656, "global_step": 232461, "epoch": 2800} {"train_loss": -24.96709632873535, "global_step": 232462, "epoch": 2800} {"train_loss": -24.79854393005371, "global_step": 232463, "epoch": 2800} {"train_loss": -24.5390625, "global_step": 232464, "epoch": 2800} {"train_loss": -24.674823760986328, "global_step": 232465, "epoch": 2800} {"train_loss": -24.684858322143555, "global_step": 232466, "epoch": 2800} {"train_loss": -25.014036178588867, "global_step": 232467, "epoch": 2800} {"train_loss": -25.1466007232666, "global_step": 232468, "epoch": 2800} {"train_loss": -24.834365844726562, "global_step": 232469, "epoch": 2800} {"train_loss": -24.739028930664062, "global_step": 232470, "epoch": 2800} {"train_loss": -24.52720069885254, "global_step": 232471, "epoch": 2800} {"train_loss": -24.969594955444336, "global_step": 232472, "epoch": 2800} {"train_loss": -24.876516342163086, "global_step": 232473, "epoch": 2800} {"train_loss": -24.973737716674805, "global_step": 232474, "epoch": 2800} {"train_loss": -24.846576690673828, "global_step": 232475, "epoch": 2800} {"train_loss": -25.268796920776367, "global_step": 232476, "epoch": 2800} {"train_loss": -24.933879852294922, "global_step": 232477, "epoch": 2800} {"train_loss": -25.23320770263672, "global_step": 232478, "epoch": 2800} {"train_loss": -25.057010650634766, "global_step": 232479, "epoch": 2800} {"train_loss": -25.00678062438965, "global_step": 232480, "epoch": 2800} {"train_loss": -25.12741470336914, "global_step": 232481, "epoch": 2800} {"train_loss": -24.75207657411874, "global_step": 232482, "epoch": 2800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6660541.0} {"train_loss": -24.537551879882812, "global_step": 232483, "epoch": 2801} {"train_loss": -24.79966163635254, "global_step": 232484, "epoch": 2801} {"train_loss": -24.245119094848633, "global_step": 232485, "epoch": 2801} {"train_loss": -23.73630714416504, "global_step": 232486, "epoch": 2801} {"train_loss": -22.916528701782227, "global_step": 232487, "epoch": 2801} {"train_loss": -23.09663200378418, "global_step": 232488, "epoch": 2801} {"train_loss": -24.246929168701172, "global_step": 232489, "epoch": 2801} {"train_loss": -23.752721786499023, "global_step": 232490, "epoch": 2801} {"train_loss": -24.23554039001465, "global_step": 232491, "epoch": 2801} {"train_loss": -24.06256103515625, "global_step": 232492, "epoch": 2801} {"train_loss": -24.083803176879883, "global_step": 232493, "epoch": 2801} {"train_loss": -24.509052276611328, "global_step": 232494, "epoch": 2801} {"train_loss": -24.39042854309082, "global_step": 232495, "epoch": 2801} {"train_loss": -24.543081283569336, "global_step": 232496, "epoch": 2801} {"train_loss": -24.60966682434082, "global_step": 232497, "epoch": 2801} {"train_loss": -24.37752914428711, "global_step": 232498, "epoch": 2801} {"train_loss": -24.38156509399414, "global_step": 232499, "epoch": 2801} {"train_loss": -24.14381217956543, "global_step": 232500, "epoch": 2801} {"train_loss": -24.6052188873291, "global_step": 232501, "epoch": 2801} {"train_loss": -24.423315048217773, "global_step": 232502, "epoch": 2801} {"train_loss": -24.42321014404297, "global_step": 232503, "epoch": 2801} {"train_loss": -24.6859073638916, "global_step": 232504, "epoch": 2801} {"train_loss": -24.40006446838379, "global_step": 232505, "epoch": 2801} {"train_loss": -24.574460983276367, "global_step": 232506, "epoch": 2801} {"train_loss": -24.750080108642578, "global_step": 232507, "epoch": 2801} {"train_loss": -24.510774612426758, "global_step": 232508, "epoch": 2801} {"train_loss": -24.589887619018555, "global_step": 232509, "epoch": 2801} {"train_loss": -24.681621551513672, "global_step": 232510, "epoch": 2801} {"train_loss": -24.718961715698242, "global_step": 232511, "epoch": 2801} {"train_loss": -24.75292205810547, "global_step": 232512, "epoch": 2801} {"train_loss": -24.677453994750977, "global_step": 232513, "epoch": 2801} {"train_loss": -24.487775802612305, "global_step": 232514, "epoch": 2801} {"train_loss": -24.6563720703125, "global_step": 232515, "epoch": 2801} {"train_loss": -24.791065216064453, "global_step": 232516, "epoch": 2801} {"train_loss": -24.948659896850586, "global_step": 232517, "epoch": 2801} {"train_loss": -24.44081687927246, "global_step": 232518, "epoch": 2801} {"train_loss": -25.025537490844727, "global_step": 232519, "epoch": 2801} {"train_loss": -24.78282928466797, "global_step": 232520, "epoch": 2801} {"train_loss": -24.872526168823242, "global_step": 232521, "epoch": 2801} {"train_loss": -24.748151779174805, "global_step": 232522, "epoch": 2801} {"train_loss": -24.69974136352539, "global_step": 232523, "epoch": 2801} {"train_loss": -24.812070846557617, "global_step": 232524, "epoch": 2801} {"train_loss": -24.82745933532715, "global_step": 232525, "epoch": 2801} {"train_loss": -24.63844108581543, "global_step": 232526, "epoch": 2801} {"train_loss": -24.7608699798584, "global_step": 232527, "epoch": 2801} {"train_loss": -24.899702072143555, "global_step": 232528, "epoch": 2801} {"train_loss": -24.63504409790039, "global_step": 232529, "epoch": 2801} {"train_loss": -24.82891845703125, "global_step": 232530, "epoch": 2801} {"train_loss": -24.801633834838867, "global_step": 232531, "epoch": 2801} {"train_loss": -24.229028701782227, "global_step": 232532, "epoch": 2801} {"train_loss": -24.631439208984375, "global_step": 232533, "epoch": 2801} {"train_loss": -24.834156036376953, "global_step": 232534, "epoch": 2801} {"train_loss": -24.3736629486084, "global_step": 232535, "epoch": 2801} {"train_loss": -24.392667770385742, "global_step": 232536, "epoch": 2801} {"train_loss": -24.75516128540039, "global_step": 232537, "epoch": 2801} {"train_loss": -24.566547393798828, "global_step": 232538, "epoch": 2801} {"train_loss": -24.810874938964844, "global_step": 232539, "epoch": 2801} {"train_loss": -24.45029067993164, "global_step": 232540, "epoch": 2801} {"train_loss": -24.655874252319336, "global_step": 232541, "epoch": 2801} {"train_loss": -24.864408493041992, "global_step": 232542, "epoch": 2801} {"train_loss": -24.51399803161621, "global_step": 232543, "epoch": 2801} {"train_loss": -24.749839782714844, "global_step": 232544, "epoch": 2801} {"train_loss": -24.6599178314209, "global_step": 232545, "epoch": 2801} {"train_loss": -24.45145034790039, "global_step": 232546, "epoch": 2801} {"train_loss": -24.66993522644043, "global_step": 232547, "epoch": 2801} {"train_loss": -24.772842407226562, "global_step": 232548, "epoch": 2801} {"train_loss": -24.44862174987793, "global_step": 232549, "epoch": 2801} {"train_loss": -24.835172653198242, "global_step": 232550, "epoch": 2801} {"train_loss": -24.93619155883789, "global_step": 232551, "epoch": 2801} {"train_loss": -24.436504364013672, "global_step": 232552, "epoch": 2801} {"train_loss": -24.803985595703125, "global_step": 232553, "epoch": 2801} {"train_loss": -24.797607421875, "global_step": 232554, "epoch": 2801} {"train_loss": -24.763967514038086, "global_step": 232555, "epoch": 2801} {"train_loss": -24.349470138549805, "global_step": 232556, "epoch": 2801} {"train_loss": -24.56148338317871, "global_step": 232557, "epoch": 2801} {"train_loss": -24.499155044555664, "global_step": 232558, "epoch": 2801} {"train_loss": -24.32419204711914, "global_step": 232559, "epoch": 2801} {"train_loss": -24.956205368041992, "global_step": 232560, "epoch": 2801} {"train_loss": -24.707773208618164, "global_step": 232561, "epoch": 2801} {"train_loss": -25.031808853149414, "global_step": 232562, "epoch": 2801} {"train_loss": -24.8120059967041, "global_step": 232563, "epoch": 2801} {"train_loss": -24.8094539642334, "global_step": 232564, "epoch": 2801} {"train_loss": -24.562378894851868, "global_step": 232565, "epoch": 2801, "val_loss": 6799369.0} {"train_loss": -24.260725021362305, "global_step": 232566, "epoch": 2802} {"train_loss": -24.327890396118164, "global_step": 232567, "epoch": 2802} {"train_loss": -24.3335018157959, "global_step": 232568, "epoch": 2802} {"train_loss": -24.1026668548584, "global_step": 232569, "epoch": 2802} {"train_loss": -24.660295486450195, "global_step": 232570, "epoch": 2802} {"train_loss": -24.679725646972656, "global_step": 232571, "epoch": 2802} {"train_loss": -24.403762817382812, "global_step": 232572, "epoch": 2802} {"train_loss": -24.401639938354492, "global_step": 232573, "epoch": 2802} {"train_loss": -24.40940284729004, "global_step": 232574, "epoch": 2802} {"train_loss": -24.856534957885742, "global_step": 232575, "epoch": 2802} {"train_loss": -24.748876571655273, "global_step": 232576, "epoch": 2802} {"train_loss": -24.56025505065918, "global_step": 232577, "epoch": 2802} {"train_loss": -24.531648635864258, "global_step": 232578, "epoch": 2802} {"train_loss": -24.680524826049805, "global_step": 232579, "epoch": 2802} {"train_loss": -24.820575714111328, "global_step": 232580, "epoch": 2802} {"train_loss": -24.435049057006836, "global_step": 232581, "epoch": 2802} {"train_loss": -24.183944702148438, "global_step": 232582, "epoch": 2802} {"train_loss": -24.63129997253418, "global_step": 232583, "epoch": 2802} {"train_loss": -24.80439567565918, "global_step": 232584, "epoch": 2802} {"train_loss": -24.714515686035156, "global_step": 232585, "epoch": 2802} {"train_loss": -24.809019088745117, "global_step": 232586, "epoch": 2802} {"train_loss": -24.479795455932617, "global_step": 232587, "epoch": 2802} {"train_loss": -24.469690322875977, "global_step": 232588, "epoch": 2802} {"train_loss": -24.58426284790039, "global_step": 232589, "epoch": 2802} {"train_loss": -25.05910301208496, "global_step": 232590, "epoch": 2802} {"train_loss": -24.50240135192871, "global_step": 232591, "epoch": 2802} {"train_loss": -24.87981605529785, "global_step": 232592, "epoch": 2802} {"train_loss": -24.436086654663086, "global_step": 232593, "epoch": 2802} {"train_loss": -24.374235153198242, "global_step": 232594, "epoch": 2802} {"train_loss": -24.576120376586914, "global_step": 232595, "epoch": 2802} {"train_loss": -24.867521286010742, "global_step": 232596, "epoch": 2802} {"train_loss": -24.52837562561035, "global_step": 232597, "epoch": 2802} {"train_loss": -24.664894104003906, "global_step": 232598, "epoch": 2802} {"train_loss": -24.691076278686523, "global_step": 232599, "epoch": 2802} {"train_loss": -24.886035919189453, "global_step": 232600, "epoch": 2802} {"train_loss": -24.326478958129883, "global_step": 232601, "epoch": 2802} {"train_loss": -24.91067886352539, "global_step": 232602, "epoch": 2802} {"train_loss": -23.909269332885742, "global_step": 232603, "epoch": 2802} {"train_loss": -24.50087547302246, "global_step": 232604, "epoch": 2802} {"train_loss": -24.652448654174805, "global_step": 232605, "epoch": 2802} {"train_loss": -24.674549102783203, "global_step": 232606, "epoch": 2802} {"train_loss": -24.551733016967773, "global_step": 232607, "epoch": 2802} {"train_loss": -24.377887725830078, "global_step": 232608, "epoch": 2802} {"train_loss": -24.52469253540039, "global_step": 232609, "epoch": 2802} {"train_loss": -24.699569702148438, "global_step": 232610, "epoch": 2802} {"train_loss": -24.844154357910156, "global_step": 232611, "epoch": 2802} {"train_loss": -24.824216842651367, "global_step": 232612, "epoch": 2802} {"train_loss": -24.85578727722168, "global_step": 232613, "epoch": 2802} {"train_loss": -24.94641876220703, "global_step": 232614, "epoch": 2802} {"train_loss": -24.66888999938965, "global_step": 232615, "epoch": 2802} {"train_loss": -25.14436149597168, "global_step": 232616, "epoch": 2802} {"train_loss": -24.602554321289062, "global_step": 232617, "epoch": 2802} {"train_loss": -24.741647720336914, "global_step": 232618, "epoch": 2802} {"train_loss": -24.290517807006836, "global_step": 232619, "epoch": 2802} {"train_loss": -24.327497482299805, "global_step": 232620, "epoch": 2802} {"train_loss": -24.779518127441406, "global_step": 232621, "epoch": 2802} {"train_loss": -24.8573055267334, "global_step": 232622, "epoch": 2802} {"train_loss": -24.588552474975586, "global_step": 232623, "epoch": 2802} {"train_loss": -24.375110626220703, "global_step": 232624, "epoch": 2802} {"train_loss": -24.517240524291992, "global_step": 232625, "epoch": 2802} {"train_loss": -24.746435165405273, "global_step": 232626, "epoch": 2802} {"train_loss": -24.613080978393555, "global_step": 232627, "epoch": 2802} {"train_loss": -24.9980525970459, "global_step": 232628, "epoch": 2802} {"train_loss": -25.013511657714844, "global_step": 232629, "epoch": 2802} {"train_loss": -24.809852600097656, "global_step": 232630, "epoch": 2802} {"train_loss": -25.03877067565918, "global_step": 232631, "epoch": 2802} {"train_loss": -25.017276763916016, "global_step": 232632, "epoch": 2802} {"train_loss": -24.893003463745117, "global_step": 232633, "epoch": 2802} {"train_loss": -24.669334411621094, "global_step": 232634, "epoch": 2802} {"train_loss": -25.091739654541016, "global_step": 232635, "epoch": 2802} {"train_loss": -24.83159065246582, "global_step": 232636, "epoch": 2802} {"train_loss": -24.985977172851562, "global_step": 232637, "epoch": 2802} {"train_loss": -25.435972213745117, "global_step": 232638, "epoch": 2802} {"train_loss": -24.926422119140625, "global_step": 232639, "epoch": 2802} {"train_loss": -25.232070922851562, "global_step": 232640, "epoch": 2802} {"train_loss": -25.001243591308594, "global_step": 232641, "epoch": 2802} {"train_loss": -25.087316513061523, "global_step": 232642, "epoch": 2802} {"train_loss": -25.273427963256836, "global_step": 232643, "epoch": 2802} {"train_loss": -24.73856544494629, "global_step": 232644, "epoch": 2802} {"train_loss": -24.791397094726562, "global_step": 232645, "epoch": 2802} {"train_loss": -24.849592208862305, "global_step": 232646, "epoch": 2802} {"train_loss": -24.292734146118164, "global_step": 232647, "epoch": 2802} {"train_loss": -24.693597012255566, "global_step": 232648, "epoch": 2802, "val_loss": 6710249.5} {"train_loss": -24.054218292236328, "global_step": 232649, "epoch": 2803} {"train_loss": -23.89440155029297, "global_step": 232650, "epoch": 2803} {"train_loss": -24.408605575561523, "global_step": 232651, "epoch": 2803} {"train_loss": -24.412084579467773, "global_step": 232652, "epoch": 2803} {"train_loss": -24.497962951660156, "global_step": 232653, "epoch": 2803} {"train_loss": -24.449691772460938, "global_step": 232654, "epoch": 2803} {"train_loss": -24.864465713500977, "global_step": 232655, "epoch": 2803} {"train_loss": -24.477758407592773, "global_step": 232656, "epoch": 2803} {"train_loss": -24.926578521728516, "global_step": 232657, "epoch": 2803} {"train_loss": -24.8110294342041, "global_step": 232658, "epoch": 2803} {"train_loss": -24.859804153442383, "global_step": 232659, "epoch": 2803} {"train_loss": -24.508230209350586, "global_step": 232660, "epoch": 2803} {"train_loss": -24.558691024780273, "global_step": 232661, "epoch": 2803} {"train_loss": -24.936805725097656, "global_step": 232662, "epoch": 2803} {"train_loss": -24.631053924560547, "global_step": 232663, "epoch": 2803} {"train_loss": -24.752994537353516, "global_step": 232664, "epoch": 2803} {"train_loss": -24.35515594482422, "global_step": 232665, "epoch": 2803} {"train_loss": -24.333078384399414, "global_step": 232666, "epoch": 2803} {"train_loss": -25.000207901000977, "global_step": 232667, "epoch": 2803} {"train_loss": -24.65555763244629, "global_step": 232668, "epoch": 2803} {"train_loss": -24.533048629760742, "global_step": 232669, "epoch": 2803} {"train_loss": -24.76384925842285, "global_step": 232670, "epoch": 2803} {"train_loss": -24.831510543823242, "global_step": 232671, "epoch": 2803} {"train_loss": -24.74401092529297, "global_step": 232672, "epoch": 2803} {"train_loss": -24.8983211517334, "global_step": 232673, "epoch": 2803} {"train_loss": -24.66077995300293, "global_step": 232674, "epoch": 2803} {"train_loss": -24.34517478942871, "global_step": 232675, "epoch": 2803} {"train_loss": -24.832881927490234, "global_step": 232676, "epoch": 2803} {"train_loss": -24.874841690063477, "global_step": 232677, "epoch": 2803} {"train_loss": -24.707876205444336, "global_step": 232678, "epoch": 2803} {"train_loss": -25.12872886657715, "global_step": 232679, "epoch": 2803} {"train_loss": -25.141876220703125, "global_step": 232680, "epoch": 2803} {"train_loss": -25.04157066345215, "global_step": 232681, "epoch": 2803} {"train_loss": -24.77650260925293, "global_step": 232682, "epoch": 2803} {"train_loss": -25.136268615722656, "global_step": 232683, "epoch": 2803} {"train_loss": -24.707401275634766, "global_step": 232684, "epoch": 2803} {"train_loss": -24.59345054626465, "global_step": 232685, "epoch": 2803} {"train_loss": -25.118066787719727, "global_step": 232686, "epoch": 2803} {"train_loss": -24.98150634765625, "global_step": 232687, "epoch": 2803} {"train_loss": -25.05319595336914, "global_step": 232688, "epoch": 2803} {"train_loss": -24.983657836914062, "global_step": 232689, "epoch": 2803} {"train_loss": -24.9487247467041, "global_step": 232690, "epoch": 2803} {"train_loss": -25.12705421447754, "global_step": 232691, "epoch": 2803} {"train_loss": -24.816808700561523, "global_step": 232692, "epoch": 2803} {"train_loss": -25.21231460571289, "global_step": 232693, "epoch": 2803} {"train_loss": -25.018325805664062, "global_step": 232694, "epoch": 2803} {"train_loss": -24.78841209411621, "global_step": 232695, "epoch": 2803} {"train_loss": -24.614179611206055, "global_step": 232696, "epoch": 2803} {"train_loss": -24.288705825805664, "global_step": 232697, "epoch": 2803} {"train_loss": -24.6800479888916, "global_step": 232698, "epoch": 2803} {"train_loss": -24.207731246948242, "global_step": 232699, "epoch": 2803} {"train_loss": -24.488828659057617, "global_step": 232700, "epoch": 2803} {"train_loss": -24.732025146484375, "global_step": 232701, "epoch": 2803} {"train_loss": -25.083986282348633, "global_step": 232702, "epoch": 2803} {"train_loss": -24.428701400756836, "global_step": 232703, "epoch": 2803} {"train_loss": -24.356904983520508, "global_step": 232704, "epoch": 2803} {"train_loss": -24.44087791442871, "global_step": 232705, "epoch": 2803} {"train_loss": -24.577478408813477, "global_step": 232706, "epoch": 2803} {"train_loss": -24.955432891845703, "global_step": 232707, "epoch": 2803} {"train_loss": -24.754114151000977, "global_step": 232708, "epoch": 2803} {"train_loss": -24.786056518554688, "global_step": 232709, "epoch": 2803} {"train_loss": -24.86478614807129, "global_step": 232710, "epoch": 2803} {"train_loss": -24.22864532470703, "global_step": 232711, "epoch": 2803} {"train_loss": -24.789112091064453, "global_step": 232712, "epoch": 2803} {"train_loss": -24.17920684814453, "global_step": 232713, "epoch": 2803} {"train_loss": -25.016443252563477, "global_step": 232714, "epoch": 2803} {"train_loss": -24.78635597229004, "global_step": 232715, "epoch": 2803} {"train_loss": -24.588220596313477, "global_step": 232716, "epoch": 2803} {"train_loss": -24.578907012939453, "global_step": 232717, "epoch": 2803} {"train_loss": -24.985944747924805, "global_step": 232718, "epoch": 2803} {"train_loss": -24.889549255371094, "global_step": 232719, "epoch": 2803} {"train_loss": -24.49349021911621, "global_step": 232720, "epoch": 2803} {"train_loss": -24.79645347595215, "global_step": 232721, "epoch": 2803} {"train_loss": -24.759397506713867, "global_step": 232722, "epoch": 2803} {"train_loss": -25.027332305908203, "global_step": 232723, "epoch": 2803} {"train_loss": -24.888031005859375, "global_step": 232724, "epoch": 2803} {"train_loss": -25.057884216308594, "global_step": 232725, "epoch": 2803} {"train_loss": -24.729480743408203, "global_step": 232726, "epoch": 2803} {"train_loss": -24.93977928161621, "global_step": 232727, "epoch": 2803} {"train_loss": -24.902462005615234, "global_step": 232728, "epoch": 2803} {"train_loss": -24.47365379333496, "global_step": 232729, "epoch": 2803} {"train_loss": -25.073026657104492, "global_step": 232730, "epoch": 2803} {"train_loss": -24.71648767770055, "global_step": 232731, "epoch": 2803, "val_loss": 6761034.5} {"train_loss": -24.444480895996094, "global_step": 232732, "epoch": 2804} {"train_loss": -24.91412925720215, "global_step": 232733, "epoch": 2804} {"train_loss": -24.861549377441406, "global_step": 232734, "epoch": 2804} {"train_loss": -24.49347686767578, "global_step": 232735, "epoch": 2804} {"train_loss": -24.49410057067871, "global_step": 232736, "epoch": 2804} {"train_loss": -24.498188018798828, "global_step": 232737, "epoch": 2804} {"train_loss": -24.80777931213379, "global_step": 232738, "epoch": 2804} {"train_loss": -24.556188583374023, "global_step": 232739, "epoch": 2804} {"train_loss": -24.683469772338867, "global_step": 232740, "epoch": 2804} {"train_loss": -24.736881256103516, "global_step": 232741, "epoch": 2804} {"train_loss": -24.447175979614258, "global_step": 232742, "epoch": 2804} {"train_loss": -24.8647403717041, "global_step": 232743, "epoch": 2804} {"train_loss": -24.719816207885742, "global_step": 232744, "epoch": 2804} {"train_loss": -25.041372299194336, "global_step": 232745, "epoch": 2804} {"train_loss": -24.417360305786133, "global_step": 232746, "epoch": 2804} {"train_loss": -24.710159301757812, "global_step": 232747, "epoch": 2804} {"train_loss": -24.650739669799805, "global_step": 232748, "epoch": 2804} {"train_loss": -24.555898666381836, "global_step": 232749, "epoch": 2804} {"train_loss": -24.721588134765625, "global_step": 232750, "epoch": 2804} {"train_loss": -25.1475830078125, "global_step": 232751, "epoch": 2804} {"train_loss": -25.04920768737793, "global_step": 232752, "epoch": 2804} {"train_loss": -24.69416618347168, "global_step": 232753, "epoch": 2804} {"train_loss": -24.975257873535156, "global_step": 232754, "epoch": 2804} {"train_loss": -24.982336044311523, "global_step": 232755, "epoch": 2804} {"train_loss": -24.76372718811035, "global_step": 232756, "epoch": 2804} {"train_loss": -25.116701126098633, "global_step": 232757, "epoch": 2804} {"train_loss": -25.06647491455078, "global_step": 232758, "epoch": 2804} {"train_loss": -25.10677146911621, "global_step": 232759, "epoch": 2804} {"train_loss": -24.781877517700195, "global_step": 232760, "epoch": 2804} {"train_loss": -24.98065757751465, "global_step": 232761, "epoch": 2804} {"train_loss": -25.041601181030273, "global_step": 232762, "epoch": 2804} {"train_loss": -24.977392196655273, "global_step": 232763, "epoch": 2804} {"train_loss": -24.567441940307617, "global_step": 232764, "epoch": 2804} {"train_loss": -24.891263961791992, "global_step": 232765, "epoch": 2804} {"train_loss": -24.90952491760254, "global_step": 232766, "epoch": 2804} {"train_loss": -24.70928192138672, "global_step": 232767, "epoch": 2804} {"train_loss": -24.69291114807129, "global_step": 232768, "epoch": 2804} {"train_loss": -24.828548431396484, "global_step": 232769, "epoch": 2804} {"train_loss": -25.07294464111328, "global_step": 232770, "epoch": 2804} {"train_loss": -24.735977172851562, "global_step": 232771, "epoch": 2804} {"train_loss": -24.9830379486084, "global_step": 232772, "epoch": 2804} {"train_loss": -24.86543083190918, "global_step": 232773, "epoch": 2804} {"train_loss": -25.308786392211914, "global_step": 232774, "epoch": 2804} {"train_loss": -25.02629280090332, "global_step": 232775, "epoch": 2804} {"train_loss": -24.7221736907959, "global_step": 232776, "epoch": 2804} {"train_loss": -24.744272232055664, "global_step": 232777, "epoch": 2804} {"train_loss": -24.091629028320312, "global_step": 232778, "epoch": 2804} {"train_loss": -23.910160064697266, "global_step": 232779, "epoch": 2804} {"train_loss": -23.886493682861328, "global_step": 232780, "epoch": 2804} {"train_loss": -24.494110107421875, "global_step": 232781, "epoch": 2804} {"train_loss": -24.445676803588867, "global_step": 232782, "epoch": 2804} {"train_loss": -24.95940589904785, "global_step": 232783, "epoch": 2804} {"train_loss": -24.318340301513672, "global_step": 232784, "epoch": 2804} {"train_loss": -24.777984619140625, "global_step": 232785, "epoch": 2804} {"train_loss": -24.919292449951172, "global_step": 232786, "epoch": 2804} {"train_loss": -24.296241760253906, "global_step": 232787, "epoch": 2804} {"train_loss": -24.828960418701172, "global_step": 232788, "epoch": 2804} {"train_loss": -24.944427490234375, "global_step": 232789, "epoch": 2804} {"train_loss": -24.99226188659668, "global_step": 232790, "epoch": 2804} {"train_loss": -24.96125602722168, "global_step": 232791, "epoch": 2804} {"train_loss": -24.755340576171875, "global_step": 232792, "epoch": 2804} {"train_loss": -25.03986930847168, "global_step": 232793, "epoch": 2804} {"train_loss": -24.746061325073242, "global_step": 232794, "epoch": 2804} {"train_loss": -24.68921661376953, "global_step": 232795, "epoch": 2804} {"train_loss": -24.745649337768555, "global_step": 232796, "epoch": 2804} {"train_loss": -24.54599952697754, "global_step": 232797, "epoch": 2804} {"train_loss": -24.678991317749023, "global_step": 232798, "epoch": 2804} {"train_loss": -24.648494720458984, "global_step": 232799, "epoch": 2804} {"train_loss": -24.992136001586914, "global_step": 232800, "epoch": 2804} {"train_loss": -24.621471405029297, "global_step": 232801, "epoch": 2804} {"train_loss": -24.687549591064453, "global_step": 232802, "epoch": 2804} {"train_loss": -24.850645065307617, "global_step": 232803, "epoch": 2804} {"train_loss": -24.498632431030273, "global_step": 232804, "epoch": 2804} {"train_loss": -25.08941650390625, "global_step": 232805, "epoch": 2804} {"train_loss": -24.75383949279785, "global_step": 232806, "epoch": 2804} {"train_loss": -24.730173110961914, "global_step": 232807, "epoch": 2804} {"train_loss": -24.649032592773438, "global_step": 232808, "epoch": 2804} {"train_loss": -24.919620513916016, "global_step": 232809, "epoch": 2804} {"train_loss": -24.7861328125, "global_step": 232810, "epoch": 2804} {"train_loss": -25.005090713500977, "global_step": 232811, "epoch": 2804} {"train_loss": -24.810136795043945, "global_step": 232812, "epoch": 2804} {"train_loss": -24.572845458984375, "global_step": 232813, "epoch": 2804} {"train_loss": -24.746884311538146, "global_step": 232814, "epoch": 2804, "val_loss": 6785412.0} {"train_loss": -23.252567291259766, "global_step": 232815, "epoch": 2805} {"train_loss": -22.782989501953125, "global_step": 232816, "epoch": 2805} {"train_loss": -24.096534729003906, "global_step": 232817, "epoch": 2805} {"train_loss": -24.054975509643555, "global_step": 232818, "epoch": 2805} {"train_loss": -23.897600173950195, "global_step": 232819, "epoch": 2805} {"train_loss": -23.838037490844727, "global_step": 232820, "epoch": 2805} {"train_loss": -24.191774368286133, "global_step": 232821, "epoch": 2805} {"train_loss": -23.939489364624023, "global_step": 232822, "epoch": 2805} {"train_loss": -24.32878875732422, "global_step": 232823, "epoch": 2805} {"train_loss": -24.002548217773438, "global_step": 232824, "epoch": 2805} {"train_loss": -24.173574447631836, "global_step": 232825, "epoch": 2805} {"train_loss": -23.967144012451172, "global_step": 232826, "epoch": 2805} {"train_loss": -24.14240074157715, "global_step": 232827, "epoch": 2805} {"train_loss": -24.09746742248535, "global_step": 232828, "epoch": 2805} {"train_loss": -24.06730079650879, "global_step": 232829, "epoch": 2805} {"train_loss": -24.447053909301758, "global_step": 232830, "epoch": 2805} {"train_loss": -24.346324920654297, "global_step": 232831, "epoch": 2805} {"train_loss": -24.129695892333984, "global_step": 232832, "epoch": 2805} {"train_loss": -24.332332611083984, "global_step": 232833, "epoch": 2805} {"train_loss": -24.45619773864746, "global_step": 232834, "epoch": 2805} {"train_loss": -24.406240463256836, "global_step": 232835, "epoch": 2805} {"train_loss": -24.55829429626465, "global_step": 232836, "epoch": 2805} {"train_loss": -24.61264991760254, "global_step": 232837, "epoch": 2805} {"train_loss": -24.70505142211914, "global_step": 232838, "epoch": 2805} {"train_loss": -24.616270065307617, "global_step": 232839, "epoch": 2805} {"train_loss": -24.53858757019043, "global_step": 232840, "epoch": 2805} {"train_loss": -24.676076889038086, "global_step": 232841, "epoch": 2805} {"train_loss": -24.558231353759766, "global_step": 232842, "epoch": 2805} {"train_loss": -24.253768920898438, "global_step": 232843, "epoch": 2805} {"train_loss": -24.61403465270996, "global_step": 232844, "epoch": 2805} {"train_loss": -24.224355697631836, "global_step": 232845, "epoch": 2805} {"train_loss": -24.646623611450195, "global_step": 232846, "epoch": 2805} {"train_loss": -25.07197380065918, "global_step": 232847, "epoch": 2805} {"train_loss": -24.780012130737305, "global_step": 232848, "epoch": 2805} {"train_loss": -24.76942253112793, "global_step": 232849, "epoch": 2805} {"train_loss": -24.65102195739746, "global_step": 232850, "epoch": 2805} {"train_loss": -24.85145378112793, "global_step": 232851, "epoch": 2805} {"train_loss": -24.79920768737793, "global_step": 232852, "epoch": 2805} {"train_loss": -25.123428344726562, "global_step": 232853, "epoch": 2805} {"train_loss": -24.662382125854492, "global_step": 232854, "epoch": 2805} {"train_loss": -24.593374252319336, "global_step": 232855, "epoch": 2805} {"train_loss": -25.0823974609375, "global_step": 232856, "epoch": 2805} {"train_loss": -24.85915756225586, "global_step": 232857, "epoch": 2805} {"train_loss": -24.811267852783203, "global_step": 232858, "epoch": 2805} {"train_loss": -25.220109939575195, "global_step": 232859, "epoch": 2805} {"train_loss": -24.84751319885254, "global_step": 232860, "epoch": 2805} {"train_loss": -24.794816970825195, "global_step": 232861, "epoch": 2805} {"train_loss": -24.604703903198242, "global_step": 232862, "epoch": 2805} {"train_loss": -24.79843521118164, "global_step": 232863, "epoch": 2805} {"train_loss": -24.96632957458496, "global_step": 232864, "epoch": 2805} {"train_loss": -24.943578720092773, "global_step": 232865, "epoch": 2805} {"train_loss": -25.117334365844727, "global_step": 232866, "epoch": 2805} {"train_loss": -25.13532829284668, "global_step": 232867, "epoch": 2805} {"train_loss": -24.888439178466797, "global_step": 232868, "epoch": 2805} {"train_loss": -24.911447525024414, "global_step": 232869, "epoch": 2805} {"train_loss": -24.78317642211914, "global_step": 232870, "epoch": 2805} {"train_loss": -24.803403854370117, "global_step": 232871, "epoch": 2805} {"train_loss": -24.526601791381836, "global_step": 232872, "epoch": 2805} {"train_loss": -25.225326538085938, "global_step": 232873, "epoch": 2805} {"train_loss": -24.500303268432617, "global_step": 232874, "epoch": 2805} {"train_loss": -24.874155044555664, "global_step": 232875, "epoch": 2805} {"train_loss": -24.447092056274414, "global_step": 232876, "epoch": 2805} {"train_loss": -24.547765731811523, "global_step": 232877, "epoch": 2805} {"train_loss": -24.694459915161133, "global_step": 232878, "epoch": 2805} {"train_loss": -24.714645385742188, "global_step": 232879, "epoch": 2805} {"train_loss": -24.96885108947754, "global_step": 232880, "epoch": 2805} {"train_loss": -24.779401779174805, "global_step": 232881, "epoch": 2805} {"train_loss": -24.68409538269043, "global_step": 232882, "epoch": 2805} {"train_loss": -24.51141357421875, "global_step": 232883, "epoch": 2805} {"train_loss": -24.837818145751953, "global_step": 232884, "epoch": 2805} {"train_loss": -24.833282470703125, "global_step": 232885, "epoch": 2805} {"train_loss": -24.46559715270996, "global_step": 232886, "epoch": 2805} {"train_loss": -24.98426628112793, "global_step": 232887, "epoch": 2805} {"train_loss": -24.97016143798828, "global_step": 232888, "epoch": 2805} {"train_loss": -24.902164459228516, "global_step": 232889, "epoch": 2805} {"train_loss": -24.7861328125, "global_step": 232890, "epoch": 2805} {"train_loss": -24.988059997558594, "global_step": 232891, "epoch": 2805} {"train_loss": -24.680273056030273, "global_step": 232892, "epoch": 2805} {"train_loss": -25.069507598876953, "global_step": 232893, "epoch": 2805} {"train_loss": -24.836339950561523, "global_step": 232894, "epoch": 2805} {"train_loss": -25.016260147094727, "global_step": 232895, "epoch": 2805} {"train_loss": -24.982946395874023, "global_step": 232896, "epoch": 2805} {"train_loss": -24.60093135144337, "global_step": 232897, "epoch": 2805, "val_loss": 6669307.0} {"train_loss": -24.751859664916992, "global_step": 232898, "epoch": 2806} {"train_loss": -24.6142578125, "global_step": 232899, "epoch": 2806} {"train_loss": -24.7354793548584, "global_step": 232900, "epoch": 2806} {"train_loss": -24.448022842407227, "global_step": 232901, "epoch": 2806} {"train_loss": -24.474782943725586, "global_step": 232902, "epoch": 2806} {"train_loss": -24.63213539123535, "global_step": 232903, "epoch": 2806} {"train_loss": -24.849390029907227, "global_step": 232904, "epoch": 2806} {"train_loss": -24.496004104614258, "global_step": 232905, "epoch": 2806} {"train_loss": -24.56349754333496, "global_step": 232906, "epoch": 2806} {"train_loss": -24.823551177978516, "global_step": 232907, "epoch": 2806} {"train_loss": -24.310688018798828, "global_step": 232908, "epoch": 2806} {"train_loss": -24.681554794311523, "global_step": 232909, "epoch": 2806} {"train_loss": -24.706613540649414, "global_step": 232910, "epoch": 2806} {"train_loss": -25.12943458557129, "global_step": 232911, "epoch": 2806} {"train_loss": -25.132713317871094, "global_step": 232912, "epoch": 2806} {"train_loss": -24.662445068359375, "global_step": 232913, "epoch": 2806} {"train_loss": -24.3232479095459, "global_step": 232914, "epoch": 2806} {"train_loss": -24.803686141967773, "global_step": 232915, "epoch": 2806} {"train_loss": -24.766407012939453, "global_step": 232916, "epoch": 2806} {"train_loss": -24.711456298828125, "global_step": 232917, "epoch": 2806} {"train_loss": -24.812414169311523, "global_step": 232918, "epoch": 2806} {"train_loss": -24.487112045288086, "global_step": 232919, "epoch": 2806} {"train_loss": -24.666454315185547, "global_step": 232920, "epoch": 2806} {"train_loss": -24.504087448120117, "global_step": 232921, "epoch": 2806} {"train_loss": -24.904150009155273, "global_step": 232922, "epoch": 2806} {"train_loss": -24.813671112060547, "global_step": 232923, "epoch": 2806} {"train_loss": -24.83388328552246, "global_step": 232924, "epoch": 2806} {"train_loss": -24.751569747924805, "global_step": 232925, "epoch": 2806} {"train_loss": -24.054656982421875, "global_step": 232926, "epoch": 2806} {"train_loss": -24.803115844726562, "global_step": 232927, "epoch": 2806} {"train_loss": -24.53879165649414, "global_step": 232928, "epoch": 2806} {"train_loss": -24.725162506103516, "global_step": 232929, "epoch": 2806} {"train_loss": -24.608198165893555, "global_step": 232930, "epoch": 2806} {"train_loss": -24.8535099029541, "global_step": 232931, "epoch": 2806} {"train_loss": -24.808237075805664, "global_step": 232932, "epoch": 2806} {"train_loss": -24.563329696655273, "global_step": 232933, "epoch": 2806} {"train_loss": -24.783170700073242, "global_step": 232934, "epoch": 2806} {"train_loss": -24.82967758178711, "global_step": 232935, "epoch": 2806} {"train_loss": -24.885644912719727, "global_step": 232936, "epoch": 2806} {"train_loss": -24.847898483276367, "global_step": 232937, "epoch": 2806} {"train_loss": -24.621824264526367, "global_step": 232938, "epoch": 2806} {"train_loss": -24.997495651245117, "global_step": 232939, "epoch": 2806} {"train_loss": -24.885787963867188, "global_step": 232940, "epoch": 2806} {"train_loss": -24.651304244995117, "global_step": 232941, "epoch": 2806} {"train_loss": -24.943206787109375, "global_step": 232942, "epoch": 2806} {"train_loss": -24.841703414916992, "global_step": 232943, "epoch": 2806} {"train_loss": -25.026798248291016, "global_step": 232944, "epoch": 2806} {"train_loss": -24.97223472595215, "global_step": 232945, "epoch": 2806} {"train_loss": -24.949750900268555, "global_step": 232946, "epoch": 2806} {"train_loss": -24.890928268432617, "global_step": 232947, "epoch": 2806} {"train_loss": -24.4318790435791, "global_step": 232948, "epoch": 2806} {"train_loss": -24.502382278442383, "global_step": 232949, "epoch": 2806} {"train_loss": -24.546878814697266, "global_step": 232950, "epoch": 2806} {"train_loss": -24.8740234375, "global_step": 232951, "epoch": 2806} {"train_loss": -24.727558135986328, "global_step": 232952, "epoch": 2806} {"train_loss": -24.49562644958496, "global_step": 232953, "epoch": 2806} {"train_loss": -24.87571907043457, "global_step": 232954, "epoch": 2806} {"train_loss": -24.66543197631836, "global_step": 232955, "epoch": 2806} {"train_loss": -24.66843605041504, "global_step": 232956, "epoch": 2806} {"train_loss": -25.275428771972656, "global_step": 232957, "epoch": 2806} {"train_loss": -25.14640235900879, "global_step": 232958, "epoch": 2806} {"train_loss": -25.004640579223633, "global_step": 232959, "epoch": 2806} {"train_loss": -24.81105613708496, "global_step": 232960, "epoch": 2806} {"train_loss": -24.836469650268555, "global_step": 232961, "epoch": 2806} {"train_loss": -25.229816436767578, "global_step": 232962, "epoch": 2806} {"train_loss": -25.0267276763916, "global_step": 232963, "epoch": 2806} {"train_loss": -24.861188888549805, "global_step": 232964, "epoch": 2806} {"train_loss": -24.500839233398438, "global_step": 232965, "epoch": 2806} {"train_loss": -24.7930850982666, "global_step": 232966, "epoch": 2806} {"train_loss": -24.739139556884766, "global_step": 232967, "epoch": 2806} {"train_loss": -24.74933433532715, "global_step": 232968, "epoch": 2806} {"train_loss": -24.819238662719727, "global_step": 232969, "epoch": 2806} {"train_loss": -25.189838409423828, "global_step": 232970, "epoch": 2806} {"train_loss": -24.694623947143555, "global_step": 232971, "epoch": 2806} {"train_loss": -24.99113655090332, "global_step": 232972, "epoch": 2806} {"train_loss": -24.616912841796875, "global_step": 232973, "epoch": 2806} {"train_loss": -24.8465576171875, "global_step": 232974, "epoch": 2806} {"train_loss": -24.92426109313965, "global_step": 232975, "epoch": 2806} {"train_loss": -24.911649703979492, "global_step": 232976, "epoch": 2806} {"train_loss": -24.717926025390625, "global_step": 232977, "epoch": 2806} {"train_loss": -24.744321823120117, "global_step": 232978, "epoch": 2806} {"train_loss": -24.706119537353516, "global_step": 232979, "epoch": 2806} {"train_loss": -24.758412050913616, "global_step": 232980, "epoch": 2806, "val_loss": 6654991.0} {"train_loss": -24.386760711669922, "global_step": 232981, "epoch": 2807} {"train_loss": -24.499927520751953, "global_step": 232982, "epoch": 2807} {"train_loss": -24.507627487182617, "global_step": 232983, "epoch": 2807} {"train_loss": -24.43153953552246, "global_step": 232984, "epoch": 2807} {"train_loss": -24.723758697509766, "global_step": 232985, "epoch": 2807} {"train_loss": -24.604522705078125, "global_step": 232986, "epoch": 2807} {"train_loss": -24.3482608795166, "global_step": 232987, "epoch": 2807} {"train_loss": -24.150571823120117, "global_step": 232988, "epoch": 2807} {"train_loss": -24.412094116210938, "global_step": 232989, "epoch": 2807} {"train_loss": -24.656227111816406, "global_step": 232990, "epoch": 2807} {"train_loss": -24.478504180908203, "global_step": 232991, "epoch": 2807} {"train_loss": -24.64312744140625, "global_step": 232992, "epoch": 2807} {"train_loss": -24.400619506835938, "global_step": 232993, "epoch": 2807} {"train_loss": -24.49856948852539, "global_step": 232994, "epoch": 2807} {"train_loss": -24.497114181518555, "global_step": 232995, "epoch": 2807} {"train_loss": -24.434070587158203, "global_step": 232996, "epoch": 2807} {"train_loss": -24.598146438598633, "global_step": 232997, "epoch": 2807} {"train_loss": -24.80914878845215, "global_step": 232998, "epoch": 2807} {"train_loss": -24.167097091674805, "global_step": 232999, "epoch": 2807} {"train_loss": -24.493623733520508, "global_step": 233000, "epoch": 2807} {"train_loss": -24.642375946044922, "global_step": 233001, "epoch": 2807} {"train_loss": -24.730775833129883, "global_step": 233002, "epoch": 2807} {"train_loss": -25.117998123168945, "global_step": 233003, "epoch": 2807} {"train_loss": -24.608963012695312, "global_step": 233004, "epoch": 2807} {"train_loss": -24.630184173583984, "global_step": 233005, "epoch": 2807} {"train_loss": -24.40208625793457, "global_step": 233006, "epoch": 2807} {"train_loss": -24.76942253112793, "global_step": 233007, "epoch": 2807} {"train_loss": -24.43107032775879, "global_step": 233008, "epoch": 2807} {"train_loss": -24.67911148071289, "global_step": 233009, "epoch": 2807} {"train_loss": -24.77117347717285, "global_step": 233010, "epoch": 2807} {"train_loss": -24.358869552612305, "global_step": 233011, "epoch": 2807} {"train_loss": -24.74860382080078, "global_step": 233012, "epoch": 2807} {"train_loss": -24.85548210144043, "global_step": 233013, "epoch": 2807} {"train_loss": -24.9406681060791, "global_step": 233014, "epoch": 2807} {"train_loss": -24.73714256286621, "global_step": 233015, "epoch": 2807} {"train_loss": -24.95843505859375, "global_step": 233016, "epoch": 2807} {"train_loss": -25.08038330078125, "global_step": 233017, "epoch": 2807} {"train_loss": -24.783201217651367, "global_step": 233018, "epoch": 2807} {"train_loss": -24.82303810119629, "global_step": 233019, "epoch": 2807} {"train_loss": -24.61594581604004, "global_step": 233020, "epoch": 2807} {"train_loss": -24.732458114624023, "global_step": 233021, "epoch": 2807} {"train_loss": -24.955854415893555, "global_step": 233022, "epoch": 2807} {"train_loss": -24.566539764404297, "global_step": 233023, "epoch": 2807} {"train_loss": -24.878108978271484, "global_step": 233024, "epoch": 2807} {"train_loss": -25.0249080657959, "global_step": 233025, "epoch": 2807} {"train_loss": -24.69609832763672, "global_step": 233026, "epoch": 2807} {"train_loss": -24.5943603515625, "global_step": 233027, "epoch": 2807} {"train_loss": -24.589603424072266, "global_step": 233028, "epoch": 2807} {"train_loss": -25.197040557861328, "global_step": 233029, "epoch": 2807} {"train_loss": -24.909395217895508, "global_step": 233030, "epoch": 2807} {"train_loss": -24.440122604370117, "global_step": 233031, "epoch": 2807} {"train_loss": -24.80805206298828, "global_step": 233032, "epoch": 2807} {"train_loss": -24.92353630065918, "global_step": 233033, "epoch": 2807} {"train_loss": -25.141328811645508, "global_step": 233034, "epoch": 2807} {"train_loss": -24.300037384033203, "global_step": 233035, "epoch": 2807} {"train_loss": -24.507802963256836, "global_step": 233036, "epoch": 2807} {"train_loss": -24.700166702270508, "global_step": 233037, "epoch": 2807} {"train_loss": -24.400028228759766, "global_step": 233038, "epoch": 2807} {"train_loss": -24.210514068603516, "global_step": 233039, "epoch": 2807} {"train_loss": -24.92310905456543, "global_step": 233040, "epoch": 2807} {"train_loss": -25.074087142944336, "global_step": 233041, "epoch": 2807} {"train_loss": -24.665857315063477, "global_step": 233042, "epoch": 2807} {"train_loss": -24.739599227905273, "global_step": 233043, "epoch": 2807} {"train_loss": -24.323318481445312, "global_step": 233044, "epoch": 2807} {"train_loss": -24.934173583984375, "global_step": 233045, "epoch": 2807} {"train_loss": -24.82382583618164, "global_step": 233046, "epoch": 2807} {"train_loss": -24.93767547607422, "global_step": 233047, "epoch": 2807} {"train_loss": -24.99808692932129, "global_step": 233048, "epoch": 2807} {"train_loss": -24.530851364135742, "global_step": 233049, "epoch": 2807} {"train_loss": -24.77152442932129, "global_step": 233050, "epoch": 2807} {"train_loss": -24.787866592407227, "global_step": 233051, "epoch": 2807} {"train_loss": -24.830533981323242, "global_step": 233052, "epoch": 2807} {"train_loss": -24.614744186401367, "global_step": 233053, "epoch": 2807} {"train_loss": -24.982513427734375, "global_step": 233054, "epoch": 2807} {"train_loss": -24.617063522338867, "global_step": 233055, "epoch": 2807} {"train_loss": -24.471071243286133, "global_step": 233056, "epoch": 2807} {"train_loss": -24.572921752929688, "global_step": 233057, "epoch": 2807} {"train_loss": -25.130395889282227, "global_step": 233058, "epoch": 2807} {"train_loss": -24.080896377563477, "global_step": 233059, "epoch": 2807} {"train_loss": -24.450517654418945, "global_step": 233060, "epoch": 2807} {"train_loss": -24.497098922729492, "global_step": 233061, "epoch": 2807} {"train_loss": -24.128366470336914, "global_step": 233062, "epoch": 2807} {"train_loss": -24.65483221950301, "global_step": 233063, "epoch": 2807, "val_loss": 6885777.0} {"train_loss": -22.92820930480957, "global_step": 233064, "epoch": 2808} {"train_loss": -23.981054306030273, "global_step": 233065, "epoch": 2808} {"train_loss": -23.393152236938477, "global_step": 233066, "epoch": 2808} {"train_loss": -24.250558853149414, "global_step": 233067, "epoch": 2808} {"train_loss": -24.238269805908203, "global_step": 233068, "epoch": 2808} {"train_loss": -23.75806999206543, "global_step": 233069, "epoch": 2808} {"train_loss": -23.886510848999023, "global_step": 233070, "epoch": 2808} {"train_loss": -24.001882553100586, "global_step": 233071, "epoch": 2808} {"train_loss": -24.479049682617188, "global_step": 233072, "epoch": 2808} {"train_loss": -23.76727294921875, "global_step": 233073, "epoch": 2808} {"train_loss": -24.112056732177734, "global_step": 233074, "epoch": 2808} {"train_loss": -24.01340103149414, "global_step": 233075, "epoch": 2808} {"train_loss": -24.477710723876953, "global_step": 233076, "epoch": 2808} {"train_loss": -24.25959587097168, "global_step": 233077, "epoch": 2808} {"train_loss": -24.266311645507812, "global_step": 233078, "epoch": 2808} {"train_loss": -24.08504295349121, "global_step": 233079, "epoch": 2808} {"train_loss": -23.98463249206543, "global_step": 233080, "epoch": 2808} {"train_loss": -24.188674926757812, "global_step": 233081, "epoch": 2808} {"train_loss": -24.74054527282715, "global_step": 233082, "epoch": 2808} {"train_loss": -24.446453094482422, "global_step": 233083, "epoch": 2808} {"train_loss": -24.422697067260742, "global_step": 233084, "epoch": 2808} {"train_loss": -24.13572120666504, "global_step": 233085, "epoch": 2808} {"train_loss": -24.24090003967285, "global_step": 233086, "epoch": 2808} {"train_loss": -24.16836929321289, "global_step": 233087, "epoch": 2808} {"train_loss": -24.076730728149414, "global_step": 233088, "epoch": 2808} {"train_loss": -24.6755428314209, "global_step": 233089, "epoch": 2808} {"train_loss": -24.64655876159668, "global_step": 233090, "epoch": 2808} {"train_loss": -24.42079734802246, "global_step": 233091, "epoch": 2808} {"train_loss": -24.77358055114746, "global_step": 233092, "epoch": 2808} {"train_loss": -24.64631462097168, "global_step": 233093, "epoch": 2808} {"train_loss": -25.28501319885254, "global_step": 233094, "epoch": 2808} {"train_loss": -24.82478904724121, "global_step": 233095, "epoch": 2808} {"train_loss": -24.445592880249023, "global_step": 233096, "epoch": 2808} {"train_loss": -25.06574821472168, "global_step": 233097, "epoch": 2808} {"train_loss": -25.102781295776367, "global_step": 233098, "epoch": 2808} {"train_loss": -24.726224899291992, "global_step": 233099, "epoch": 2808} {"train_loss": -24.892358779907227, "global_step": 233100, "epoch": 2808} {"train_loss": -24.563058853149414, "global_step": 233101, "epoch": 2808} {"train_loss": -24.869338989257812, "global_step": 233102, "epoch": 2808} {"train_loss": -24.922391891479492, "global_step": 233103, "epoch": 2808} {"train_loss": -24.84369468688965, "global_step": 233104, "epoch": 2808} {"train_loss": -24.773876190185547, "global_step": 233105, "epoch": 2808} {"train_loss": -24.990066528320312, "global_step": 233106, "epoch": 2808} {"train_loss": -24.62212562561035, "global_step": 233107, "epoch": 2808} {"train_loss": -25.031280517578125, "global_step": 233108, "epoch": 2808} {"train_loss": -24.700952529907227, "global_step": 233109, "epoch": 2808} {"train_loss": -25.1375732421875, "global_step": 233110, "epoch": 2808} {"train_loss": -25.019018173217773, "global_step": 233111, "epoch": 2808} {"train_loss": -25.017393112182617, "global_step": 233112, "epoch": 2808} {"train_loss": -24.729087829589844, "global_step": 233113, "epoch": 2808} {"train_loss": -25.118125915527344, "global_step": 233114, "epoch": 2808} {"train_loss": -24.68527603149414, "global_step": 233115, "epoch": 2808} {"train_loss": -24.423276901245117, "global_step": 233116, "epoch": 2808} {"train_loss": -24.867095947265625, "global_step": 233117, "epoch": 2808} {"train_loss": -24.924711227416992, "global_step": 233118, "epoch": 2808} {"train_loss": -24.53542137145996, "global_step": 233119, "epoch": 2808} {"train_loss": -24.514554977416992, "global_step": 233120, "epoch": 2808} {"train_loss": -24.729755401611328, "global_step": 233121, "epoch": 2808} {"train_loss": -24.5393123626709, "global_step": 233122, "epoch": 2808} {"train_loss": -24.661273956298828, "global_step": 233123, "epoch": 2808} {"train_loss": -24.5102596282959, "global_step": 233124, "epoch": 2808} {"train_loss": -24.40736961364746, "global_step": 233125, "epoch": 2808} {"train_loss": -24.33993148803711, "global_step": 233126, "epoch": 2808} {"train_loss": -24.94459342956543, "global_step": 233127, "epoch": 2808} {"train_loss": -24.313879013061523, "global_step": 233128, "epoch": 2808} {"train_loss": -24.37858009338379, "global_step": 233129, "epoch": 2808} {"train_loss": -24.586669921875, "global_step": 233130, "epoch": 2808} {"train_loss": -24.75618553161621, "global_step": 233131, "epoch": 2808} {"train_loss": -24.0872859954834, "global_step": 233132, "epoch": 2808} {"train_loss": -24.502492904663086, "global_step": 233133, "epoch": 2808} {"train_loss": -24.45958709716797, "global_step": 233134, "epoch": 2808} {"train_loss": -24.064212799072266, "global_step": 233135, "epoch": 2808} {"train_loss": -24.268329620361328, "global_step": 233136, "epoch": 2808} {"train_loss": -24.77924346923828, "global_step": 233137, "epoch": 2808} {"train_loss": -24.452369689941406, "global_step": 233138, "epoch": 2808} {"train_loss": -24.823040008544922, "global_step": 233139, "epoch": 2808} {"train_loss": -24.731918334960938, "global_step": 233140, "epoch": 2808} {"train_loss": -24.726755142211914, "global_step": 233141, "epoch": 2808} {"train_loss": -24.775156021118164, "global_step": 233142, "epoch": 2808} {"train_loss": -24.42289161682129, "global_step": 233143, "epoch": 2808} {"train_loss": -24.514930725097656, "global_step": 233144, "epoch": 2808} {"train_loss": -24.689176559448242, "global_step": 233145, "epoch": 2808} {"train_loss": -24.487939949495246, "global_step": 233146, "epoch": 2808, "val_loss": 6690531.0} {"train_loss": -23.215862274169922, "global_step": 233147, "epoch": 2809} {"train_loss": -23.76165199279785, "global_step": 233148, "epoch": 2809} {"train_loss": -24.14777183532715, "global_step": 233149, "epoch": 2809} {"train_loss": -24.063310623168945, "global_step": 233150, "epoch": 2809} {"train_loss": -24.4832820892334, "global_step": 233151, "epoch": 2809} {"train_loss": -23.94431495666504, "global_step": 233152, "epoch": 2809} {"train_loss": -24.36577033996582, "global_step": 233153, "epoch": 2809} {"train_loss": -24.035276412963867, "global_step": 233154, "epoch": 2809} {"train_loss": -24.624225616455078, "global_step": 233155, "epoch": 2809} {"train_loss": -24.120603561401367, "global_step": 233156, "epoch": 2809} {"train_loss": -24.541748046875, "global_step": 233157, "epoch": 2809} {"train_loss": -24.02374839782715, "global_step": 233158, "epoch": 2809} {"train_loss": -24.360586166381836, "global_step": 233159, "epoch": 2809} {"train_loss": -24.329986572265625, "global_step": 233160, "epoch": 2809} {"train_loss": -24.01853370666504, "global_step": 233161, "epoch": 2809} {"train_loss": -24.52151870727539, "global_step": 233162, "epoch": 2809} {"train_loss": -24.501434326171875, "global_step": 233163, "epoch": 2809} {"train_loss": -24.736927032470703, "global_step": 233164, "epoch": 2809} {"train_loss": -24.681625366210938, "global_step": 233165, "epoch": 2809} {"train_loss": -24.38582420349121, "global_step": 233166, "epoch": 2809} {"train_loss": -24.544296264648438, "global_step": 233167, "epoch": 2809} {"train_loss": -24.43739128112793, "global_step": 233168, "epoch": 2809} {"train_loss": -24.493927001953125, "global_step": 233169, "epoch": 2809} {"train_loss": -24.85383415222168, "global_step": 233170, "epoch": 2809} {"train_loss": -24.89152717590332, "global_step": 233171, "epoch": 2809} {"train_loss": -24.8127498626709, "global_step": 233172, "epoch": 2809} {"train_loss": -24.988916397094727, "global_step": 233173, "epoch": 2809} {"train_loss": -24.441104888916016, "global_step": 233174, "epoch": 2809} {"train_loss": -25.066129684448242, "global_step": 233175, "epoch": 2809} {"train_loss": -24.713703155517578, "global_step": 233176, "epoch": 2809} {"train_loss": -24.70339012145996, "global_step": 233177, "epoch": 2809} {"train_loss": -24.431766510009766, "global_step": 233178, "epoch": 2809} {"train_loss": -24.970252990722656, "global_step": 233179, "epoch": 2809} {"train_loss": -24.63715171813965, "global_step": 233180, "epoch": 2809} {"train_loss": -24.566862106323242, "global_step": 233181, "epoch": 2809} {"train_loss": -24.633642196655273, "global_step": 233182, "epoch": 2809} {"train_loss": -24.784042358398438, "global_step": 233183, "epoch": 2809} {"train_loss": -24.84018325805664, "global_step": 233184, "epoch": 2809} {"train_loss": -24.78171157836914, "global_step": 233185, "epoch": 2809} {"train_loss": -24.563690185546875, "global_step": 233186, "epoch": 2809} {"train_loss": -24.881032943725586, "global_step": 233187, "epoch": 2809} {"train_loss": -24.834312438964844, "global_step": 233188, "epoch": 2809} {"train_loss": -25.154006958007812, "global_step": 233189, "epoch": 2809} {"train_loss": -24.7406005859375, "global_step": 233190, "epoch": 2809} {"train_loss": -24.727014541625977, "global_step": 233191, "epoch": 2809} {"train_loss": -25.190216064453125, "global_step": 233192, "epoch": 2809} {"train_loss": -24.971853256225586, "global_step": 233193, "epoch": 2809} {"train_loss": -24.871572494506836, "global_step": 233194, "epoch": 2809} {"train_loss": -25.238615036010742, "global_step": 233195, "epoch": 2809} {"train_loss": -25.02012062072754, "global_step": 233196, "epoch": 2809} {"train_loss": -24.782682418823242, "global_step": 233197, "epoch": 2809} {"train_loss": -24.986400604248047, "global_step": 233198, "epoch": 2809} {"train_loss": -25.011343002319336, "global_step": 233199, "epoch": 2809} {"train_loss": -25.13700294494629, "global_step": 233200, "epoch": 2809} {"train_loss": -25.01145362854004, "global_step": 233201, "epoch": 2809} {"train_loss": -24.653873443603516, "global_step": 233202, "epoch": 2809} {"train_loss": -24.957273483276367, "global_step": 233203, "epoch": 2809} {"train_loss": -24.991748809814453, "global_step": 233204, "epoch": 2809} {"train_loss": -24.96563148498535, "global_step": 233205, "epoch": 2809} {"train_loss": -25.168312072753906, "global_step": 233206, "epoch": 2809} {"train_loss": -24.447675704956055, "global_step": 233207, "epoch": 2809} {"train_loss": -24.92971420288086, "global_step": 233208, "epoch": 2809} {"train_loss": -24.727828979492188, "global_step": 233209, "epoch": 2809} {"train_loss": -24.71393394470215, "global_step": 233210, "epoch": 2809} {"train_loss": -24.505207061767578, "global_step": 233211, "epoch": 2809} {"train_loss": -24.20249366760254, "global_step": 233212, "epoch": 2809} {"train_loss": -24.46259307861328, "global_step": 233213, "epoch": 2809} {"train_loss": -24.662466049194336, "global_step": 233214, "epoch": 2809} {"train_loss": -24.5073299407959, "global_step": 233215, "epoch": 2809} {"train_loss": -24.4577579498291, "global_step": 233216, "epoch": 2809} {"train_loss": -24.403078079223633, "global_step": 233217, "epoch": 2809} {"train_loss": -25.228378295898438, "global_step": 233218, "epoch": 2809} {"train_loss": -24.29427719116211, "global_step": 233219, "epoch": 2809} {"train_loss": -24.5874080657959, "global_step": 233220, "epoch": 2809} {"train_loss": -24.866744995117188, "global_step": 233221, "epoch": 2809} {"train_loss": -24.65169906616211, "global_step": 233222, "epoch": 2809} {"train_loss": -24.44391441345215, "global_step": 233223, "epoch": 2809} {"train_loss": -24.7850399017334, "global_step": 233224, "epoch": 2809} {"train_loss": -24.72002601623535, "global_step": 233225, "epoch": 2809} {"train_loss": -24.66853904724121, "global_step": 233226, "epoch": 2809} {"train_loss": -24.919906616210938, "global_step": 233227, "epoch": 2809} {"train_loss": -24.631221771240234, "global_step": 233228, "epoch": 2809} {"train_loss": -24.607637979898108, "global_step": 233229, "epoch": 2809, "val_loss": 6723441.0} {"train_loss": -23.033546447753906, "global_step": 233230, "epoch": 2810} {"train_loss": -23.703678131103516, "global_step": 233231, "epoch": 2810} {"train_loss": -23.31019401550293, "global_step": 233232, "epoch": 2810} {"train_loss": -24.092206954956055, "global_step": 233233, "epoch": 2810} {"train_loss": -23.81409454345703, "global_step": 233234, "epoch": 2810} {"train_loss": -24.6027774810791, "global_step": 233235, "epoch": 2810} {"train_loss": -23.98780059814453, "global_step": 233236, "epoch": 2810} {"train_loss": -24.395904541015625, "global_step": 233237, "epoch": 2810} {"train_loss": -24.105932235717773, "global_step": 233238, "epoch": 2810} {"train_loss": -24.523191452026367, "global_step": 233239, "epoch": 2810} {"train_loss": -24.255910873413086, "global_step": 233240, "epoch": 2810} {"train_loss": -24.211103439331055, "global_step": 233241, "epoch": 2810} {"train_loss": -24.493627548217773, "global_step": 233242, "epoch": 2810} {"train_loss": -24.20425796508789, "global_step": 233243, "epoch": 2810} {"train_loss": -24.472753524780273, "global_step": 233244, "epoch": 2810} {"train_loss": -24.879915237426758, "global_step": 233245, "epoch": 2810} {"train_loss": -24.603185653686523, "global_step": 233246, "epoch": 2810} {"train_loss": -24.17306900024414, "global_step": 233247, "epoch": 2810} {"train_loss": -24.23764419555664, "global_step": 233248, "epoch": 2810} {"train_loss": -24.575124740600586, "global_step": 233249, "epoch": 2810} {"train_loss": -24.515655517578125, "global_step": 233250, "epoch": 2810} {"train_loss": -24.715543746948242, "global_step": 233251, "epoch": 2810} {"train_loss": -24.50187110900879, "global_step": 233252, "epoch": 2810} {"train_loss": -24.70880699157715, "global_step": 233253, "epoch": 2810} {"train_loss": -24.512792587280273, "global_step": 233254, "epoch": 2810} {"train_loss": -24.911239624023438, "global_step": 233255, "epoch": 2810} {"train_loss": -24.765600204467773, "global_step": 233256, "epoch": 2810} {"train_loss": -24.825963973999023, "global_step": 233257, "epoch": 2810} {"train_loss": -24.861501693725586, "global_step": 233258, "epoch": 2810} {"train_loss": -24.409900665283203, "global_step": 233259, "epoch": 2810} {"train_loss": -24.575284957885742, "global_step": 233260, "epoch": 2810} {"train_loss": -25.095447540283203, "global_step": 233261, "epoch": 2810} {"train_loss": -24.71433448791504, "global_step": 233262, "epoch": 2810} {"train_loss": -24.837324142456055, "global_step": 233263, "epoch": 2810} {"train_loss": -24.705827713012695, "global_step": 233264, "epoch": 2810} {"train_loss": -24.429731369018555, "global_step": 233265, "epoch": 2810} {"train_loss": -24.925642013549805, "global_step": 233266, "epoch": 2810} {"train_loss": -25.28644371032715, "global_step": 233267, "epoch": 2810} {"train_loss": -25.033857345581055, "global_step": 233268, "epoch": 2810} {"train_loss": -24.843435287475586, "global_step": 233269, "epoch": 2810} {"train_loss": -25.14496421813965, "global_step": 233270, "epoch": 2810} {"train_loss": -25.03192138671875, "global_step": 233271, "epoch": 2810} {"train_loss": -24.59398651123047, "global_step": 233272, "epoch": 2810} {"train_loss": -25.23799705505371, "global_step": 233273, "epoch": 2810} {"train_loss": -24.68317985534668, "global_step": 233274, "epoch": 2810} {"train_loss": -25.06796646118164, "global_step": 233275, "epoch": 2810} {"train_loss": -25.066465377807617, "global_step": 233276, "epoch": 2810} {"train_loss": -25.083789825439453, "global_step": 233277, "epoch": 2810} {"train_loss": -24.924091339111328, "global_step": 233278, "epoch": 2810} {"train_loss": -25.14198875427246, "global_step": 233279, "epoch": 2810} {"train_loss": -24.630990982055664, "global_step": 233280, "epoch": 2810} {"train_loss": -25.07329750061035, "global_step": 233281, "epoch": 2810} {"train_loss": -24.979183197021484, "global_step": 233282, "epoch": 2810} {"train_loss": -25.039691925048828, "global_step": 233283, "epoch": 2810} {"train_loss": -24.689905166625977, "global_step": 233284, "epoch": 2810} {"train_loss": -24.81458854675293, "global_step": 233285, "epoch": 2810} {"train_loss": -25.018699645996094, "global_step": 233286, "epoch": 2810} {"train_loss": -24.683609008789062, "global_step": 233287, "epoch": 2810} {"train_loss": -24.718399047851562, "global_step": 233288, "epoch": 2810} {"train_loss": -24.94840431213379, "global_step": 233289, "epoch": 2810} {"train_loss": -24.869367599487305, "global_step": 233290, "epoch": 2810} {"train_loss": -24.647811889648438, "global_step": 233291, "epoch": 2810} {"train_loss": -24.994131088256836, "global_step": 233292, "epoch": 2810} {"train_loss": -25.048276901245117, "global_step": 233293, "epoch": 2810} {"train_loss": -25.095170974731445, "global_step": 233294, "epoch": 2810} {"train_loss": -24.734020233154297, "global_step": 233295, "epoch": 2810} {"train_loss": -24.528335571289062, "global_step": 233296, "epoch": 2810} {"train_loss": -24.64325523376465, "global_step": 233297, "epoch": 2810} {"train_loss": -24.672138214111328, "global_step": 233298, "epoch": 2810} {"train_loss": -24.45271110534668, "global_step": 233299, "epoch": 2810} {"train_loss": -24.76668357849121, "global_step": 233300, "epoch": 2810} {"train_loss": -24.94999122619629, "global_step": 233301, "epoch": 2810} {"train_loss": -24.38974952697754, "global_step": 233302, "epoch": 2810} {"train_loss": -24.63923454284668, "global_step": 233303, "epoch": 2810} {"train_loss": -24.503021240234375, "global_step": 233304, "epoch": 2810} {"train_loss": -24.452529907226562, "global_step": 233305, "epoch": 2810} {"train_loss": -24.684951782226562, "global_step": 233306, "epoch": 2810} {"train_loss": -24.946256637573242, "global_step": 233307, "epoch": 2810} {"train_loss": -24.69055938720703, "global_step": 233308, "epoch": 2810} {"train_loss": -24.83034324645996, "global_step": 233309, "epoch": 2810} {"train_loss": -24.767385482788086, "global_step": 233310, "epoch": 2810} {"train_loss": -24.355417251586914, "global_step": 233311, "epoch": 2810} {"train_loss": -24.65276171213173, "global_step": 233312, "epoch": 2810, "val_loss": 6730516.5} {"train_loss": -24.62665557861328, "global_step": 233313, "epoch": 2811} {"train_loss": -24.5726261138916, "global_step": 233314, "epoch": 2811} {"train_loss": -24.290430068969727, "global_step": 233315, "epoch": 2811} {"train_loss": -24.93343162536621, "global_step": 233316, "epoch": 2811} {"train_loss": -24.35725975036621, "global_step": 233317, "epoch": 2811} {"train_loss": -24.599241256713867, "global_step": 233318, "epoch": 2811} {"train_loss": -24.353036880493164, "global_step": 233319, "epoch": 2811} {"train_loss": -24.809955596923828, "global_step": 233320, "epoch": 2811} {"train_loss": -24.537343978881836, "global_step": 233321, "epoch": 2811} {"train_loss": -24.624801635742188, "global_step": 233322, "epoch": 2811} {"train_loss": -24.559906005859375, "global_step": 233323, "epoch": 2811} {"train_loss": -24.74322509765625, "global_step": 233324, "epoch": 2811} {"train_loss": -24.70607566833496, "global_step": 233325, "epoch": 2811} {"train_loss": -24.797164916992188, "global_step": 233326, "epoch": 2811} {"train_loss": -24.79237174987793, "global_step": 233327, "epoch": 2811} {"train_loss": -25.06093406677246, "global_step": 233328, "epoch": 2811} {"train_loss": -24.735427856445312, "global_step": 233329, "epoch": 2811} {"train_loss": -24.874731063842773, "global_step": 233330, "epoch": 2811} {"train_loss": -24.68922996520996, "global_step": 233331, "epoch": 2811} {"train_loss": -24.643407821655273, "global_step": 233332, "epoch": 2811} {"train_loss": -25.2613582611084, "global_step": 233333, "epoch": 2811} {"train_loss": -25.11219596862793, "global_step": 233334, "epoch": 2811} {"train_loss": -24.847023010253906, "global_step": 233335, "epoch": 2811} {"train_loss": -24.98094367980957, "global_step": 233336, "epoch": 2811} {"train_loss": -24.95575523376465, "global_step": 233337, "epoch": 2811} {"train_loss": -24.90502166748047, "global_step": 233338, "epoch": 2811} {"train_loss": -24.93070411682129, "global_step": 233339, "epoch": 2811} {"train_loss": -25.001258850097656, "global_step": 233340, "epoch": 2811} {"train_loss": -25.372114181518555, "global_step": 233341, "epoch": 2811} {"train_loss": -24.8549861907959, "global_step": 233342, "epoch": 2811} {"train_loss": -24.52140235900879, "global_step": 233343, "epoch": 2811} {"train_loss": -24.609542846679688, "global_step": 233344, "epoch": 2811} {"train_loss": -25.001951217651367, "global_step": 233345, "epoch": 2811} {"train_loss": -24.632352828979492, "global_step": 233346, "epoch": 2811} {"train_loss": -24.673839569091797, "global_step": 233347, "epoch": 2811} {"train_loss": -24.915027618408203, "global_step": 233348, "epoch": 2811} {"train_loss": -24.7551212310791, "global_step": 233349, "epoch": 2811} {"train_loss": -24.75147819519043, "global_step": 233350, "epoch": 2811} {"train_loss": -24.72218132019043, "global_step": 233351, "epoch": 2811} {"train_loss": -24.786767959594727, "global_step": 233352, "epoch": 2811} {"train_loss": -24.841577529907227, "global_step": 233353, "epoch": 2811} {"train_loss": -24.926050186157227, "global_step": 233354, "epoch": 2811} {"train_loss": -24.558691024780273, "global_step": 233355, "epoch": 2811} {"train_loss": -24.593976974487305, "global_step": 233356, "epoch": 2811} {"train_loss": -24.749753952026367, "global_step": 233357, "epoch": 2811} {"train_loss": -24.91676139831543, "global_step": 233358, "epoch": 2811} {"train_loss": -24.81871795654297, "global_step": 233359, "epoch": 2811} {"train_loss": -24.710241317749023, "global_step": 233360, "epoch": 2811} {"train_loss": -24.628591537475586, "global_step": 233361, "epoch": 2811} {"train_loss": -25.011486053466797, "global_step": 233362, "epoch": 2811} {"train_loss": -24.681005477905273, "global_step": 233363, "epoch": 2811} {"train_loss": -24.603031158447266, "global_step": 233364, "epoch": 2811} {"train_loss": -24.935155868530273, "global_step": 233365, "epoch": 2811} {"train_loss": -25.09307861328125, "global_step": 233366, "epoch": 2811} {"train_loss": -24.984880447387695, "global_step": 233367, "epoch": 2811} {"train_loss": -24.869474411010742, "global_step": 233368, "epoch": 2811} {"train_loss": -24.70657730102539, "global_step": 233369, "epoch": 2811} {"train_loss": -24.692180633544922, "global_step": 233370, "epoch": 2811} {"train_loss": -24.703540802001953, "global_step": 233371, "epoch": 2811} {"train_loss": -25.049699783325195, "global_step": 233372, "epoch": 2811} {"train_loss": -25.21161460876465, "global_step": 233373, "epoch": 2811} {"train_loss": -24.9990177154541, "global_step": 233374, "epoch": 2811} {"train_loss": -24.901845932006836, "global_step": 233375, "epoch": 2811} {"train_loss": -24.874757766723633, "global_step": 233376, "epoch": 2811} {"train_loss": -24.630796432495117, "global_step": 233377, "epoch": 2811} {"train_loss": -24.75105857849121, "global_step": 233378, "epoch": 2811} {"train_loss": -24.452064514160156, "global_step": 233379, "epoch": 2811} {"train_loss": -24.344758987426758, "global_step": 233380, "epoch": 2811} {"train_loss": -24.945032119750977, "global_step": 233381, "epoch": 2811} {"train_loss": -24.539443969726562, "global_step": 233382, "epoch": 2811} {"train_loss": -24.643310546875, "global_step": 233383, "epoch": 2811} {"train_loss": -23.937711715698242, "global_step": 233384, "epoch": 2811} {"train_loss": -24.4381160736084, "global_step": 233385, "epoch": 2811} {"train_loss": -24.662080764770508, "global_step": 233386, "epoch": 2811} {"train_loss": -24.70122718811035, "global_step": 233387, "epoch": 2811} {"train_loss": -24.63722801208496, "global_step": 233388, "epoch": 2811} {"train_loss": -25.176034927368164, "global_step": 233389, "epoch": 2811} {"train_loss": -24.931020736694336, "global_step": 233390, "epoch": 2811} {"train_loss": -24.76865577697754, "global_step": 233391, "epoch": 2811} {"train_loss": -25.138809204101562, "global_step": 233392, "epoch": 2811} {"train_loss": -24.669397354125977, "global_step": 233393, "epoch": 2811} {"train_loss": -24.414594650268555, "global_step": 233394, "epoch": 2811} {"train_loss": -24.757916990532934, "global_step": 233395, "epoch": 2811, "val_loss": 6697082.0} {"train_loss": -24.260757446289062, "global_step": 233396, "epoch": 2812} {"train_loss": -24.47665786743164, "global_step": 233397, "epoch": 2812} {"train_loss": -24.188247680664062, "global_step": 233398, "epoch": 2812} {"train_loss": -24.38043785095215, "global_step": 233399, "epoch": 2812} {"train_loss": -24.16022300720215, "global_step": 233400, "epoch": 2812} {"train_loss": -24.318403244018555, "global_step": 233401, "epoch": 2812} {"train_loss": -24.35497283935547, "global_step": 233402, "epoch": 2812} {"train_loss": -24.391210556030273, "global_step": 233403, "epoch": 2812} {"train_loss": -24.651979446411133, "global_step": 233404, "epoch": 2812} {"train_loss": -24.31159782409668, "global_step": 233405, "epoch": 2812} {"train_loss": -24.3482723236084, "global_step": 233406, "epoch": 2812} {"train_loss": -24.061901092529297, "global_step": 233407, "epoch": 2812} {"train_loss": -24.665124893188477, "global_step": 233408, "epoch": 2812} {"train_loss": -24.789958953857422, "global_step": 233409, "epoch": 2812} {"train_loss": -24.510835647583008, "global_step": 233410, "epoch": 2812} {"train_loss": -24.567546844482422, "global_step": 233411, "epoch": 2812} {"train_loss": -24.757511138916016, "global_step": 233412, "epoch": 2812} {"train_loss": -24.167158126831055, "global_step": 233413, "epoch": 2812} {"train_loss": -24.415283203125, "global_step": 233414, "epoch": 2812} {"train_loss": -24.372560501098633, "global_step": 233415, "epoch": 2812} {"train_loss": -24.18979835510254, "global_step": 233416, "epoch": 2812} {"train_loss": -24.337629318237305, "global_step": 233417, "epoch": 2812} {"train_loss": -24.522689819335938, "global_step": 233418, "epoch": 2812} {"train_loss": -24.62019920349121, "global_step": 233419, "epoch": 2812} {"train_loss": -24.22627830505371, "global_step": 233420, "epoch": 2812} {"train_loss": -24.89508819580078, "global_step": 233421, "epoch": 2812} {"train_loss": -24.64988899230957, "global_step": 233422, "epoch": 2812} {"train_loss": -24.85893440246582, "global_step": 233423, "epoch": 2812} {"train_loss": -24.91994285583496, "global_step": 233424, "epoch": 2812} {"train_loss": -24.6497802734375, "global_step": 233425, "epoch": 2812} {"train_loss": -24.58075523376465, "global_step": 233426, "epoch": 2812} {"train_loss": -24.69788932800293, "global_step": 233427, "epoch": 2812} {"train_loss": -25.141834259033203, "global_step": 233428, "epoch": 2812} {"train_loss": -24.687742233276367, "global_step": 233429, "epoch": 2812} {"train_loss": -24.77104949951172, "global_step": 233430, "epoch": 2812} {"train_loss": -24.685941696166992, "global_step": 233431, "epoch": 2812} {"train_loss": -24.690465927124023, "global_step": 233432, "epoch": 2812} {"train_loss": -24.958602905273438, "global_step": 233433, "epoch": 2812} {"train_loss": -24.70870590209961, "global_step": 233434, "epoch": 2812} {"train_loss": -24.700260162353516, "global_step": 233435, "epoch": 2812} {"train_loss": -24.996509552001953, "global_step": 233436, "epoch": 2812} {"train_loss": -25.0068302154541, "global_step": 233437, "epoch": 2812} {"train_loss": -24.746198654174805, "global_step": 233438, "epoch": 2812} {"train_loss": -25.058942794799805, "global_step": 233439, "epoch": 2812} {"train_loss": -24.5604190826416, "global_step": 233440, "epoch": 2812} {"train_loss": -24.58359718322754, "global_step": 233441, "epoch": 2812} {"train_loss": -25.32969093322754, "global_step": 233442, "epoch": 2812} {"train_loss": -24.67738914489746, "global_step": 233443, "epoch": 2812} {"train_loss": -24.179718017578125, "global_step": 233444, "epoch": 2812} {"train_loss": -24.194639205932617, "global_step": 233445, "epoch": 2812} {"train_loss": -24.880117416381836, "global_step": 233446, "epoch": 2812} {"train_loss": -24.478906631469727, "global_step": 233447, "epoch": 2812} {"train_loss": -24.406829833984375, "global_step": 233448, "epoch": 2812} {"train_loss": -24.21457862854004, "global_step": 233449, "epoch": 2812} {"train_loss": -24.641963958740234, "global_step": 233450, "epoch": 2812} {"train_loss": -24.910154342651367, "global_step": 233451, "epoch": 2812} {"train_loss": -24.284507751464844, "global_step": 233452, "epoch": 2812} {"train_loss": -24.990354537963867, "global_step": 233453, "epoch": 2812} {"train_loss": -24.14609146118164, "global_step": 233454, "epoch": 2812} {"train_loss": -24.543045043945312, "global_step": 233455, "epoch": 2812} {"train_loss": -24.412113189697266, "global_step": 233456, "epoch": 2812} {"train_loss": -24.805389404296875, "global_step": 233457, "epoch": 2812} {"train_loss": -24.816320419311523, "global_step": 233458, "epoch": 2812} {"train_loss": -24.878740310668945, "global_step": 233459, "epoch": 2812} {"train_loss": -24.584640502929688, "global_step": 233460, "epoch": 2812} {"train_loss": -24.49989891052246, "global_step": 233461, "epoch": 2812} {"train_loss": -24.9021053314209, "global_step": 233462, "epoch": 2812} {"train_loss": -24.613269805908203, "global_step": 233463, "epoch": 2812} {"train_loss": -24.550765991210938, "global_step": 233464, "epoch": 2812} {"train_loss": -24.897499084472656, "global_step": 233465, "epoch": 2812} {"train_loss": -24.425111770629883, "global_step": 233466, "epoch": 2812} {"train_loss": -24.551633834838867, "global_step": 233467, "epoch": 2812} {"train_loss": -25.09589958190918, "global_step": 233468, "epoch": 2812} {"train_loss": -24.471240997314453, "global_step": 233469, "epoch": 2812} {"train_loss": -24.911497116088867, "global_step": 233470, "epoch": 2812} {"train_loss": -24.913862228393555, "global_step": 233471, "epoch": 2812} {"train_loss": -24.848257064819336, "global_step": 233472, "epoch": 2812} {"train_loss": -25.127544403076172, "global_step": 233473, "epoch": 2812} {"train_loss": -24.918777465820312, "global_step": 233474, "epoch": 2812} {"train_loss": -24.729230880737305, "global_step": 233475, "epoch": 2812} {"train_loss": -24.844614028930664, "global_step": 233476, "epoch": 2812} {"train_loss": -25.141828536987305, "global_step": 233477, "epoch": 2812} {"train_loss": -24.63725832284215, "global_step": 233478, "epoch": 2812, "val_loss": 6679910.5} {"train_loss": -24.590646743774414, "global_step": 233479, "epoch": 2813} {"train_loss": -24.912466049194336, "global_step": 233480, "epoch": 2813} {"train_loss": -25.012529373168945, "global_step": 233481, "epoch": 2813} {"train_loss": -24.937713623046875, "global_step": 233482, "epoch": 2813} {"train_loss": -24.842708587646484, "global_step": 233483, "epoch": 2813} {"train_loss": -24.580961227416992, "global_step": 233484, "epoch": 2813} {"train_loss": -24.472923278808594, "global_step": 233485, "epoch": 2813} {"train_loss": -25.046463012695312, "global_step": 233486, "epoch": 2813} {"train_loss": -24.518064498901367, "global_step": 233487, "epoch": 2813} {"train_loss": -25.272764205932617, "global_step": 233488, "epoch": 2813} {"train_loss": -24.75395965576172, "global_step": 233489, "epoch": 2813} {"train_loss": -24.682558059692383, "global_step": 233490, "epoch": 2813} {"train_loss": -24.949132919311523, "global_step": 233491, "epoch": 2813} {"train_loss": -24.69512367248535, "global_step": 233492, "epoch": 2813} {"train_loss": -25.035188674926758, "global_step": 233493, "epoch": 2813} {"train_loss": -24.901819229125977, "global_step": 233494, "epoch": 2813} {"train_loss": -24.84766960144043, "global_step": 233495, "epoch": 2813} {"train_loss": -24.536617279052734, "global_step": 233496, "epoch": 2813} {"train_loss": -24.97039222717285, "global_step": 233497, "epoch": 2813} {"train_loss": -24.613510131835938, "global_step": 233498, "epoch": 2813} {"train_loss": -25.111276626586914, "global_step": 233499, "epoch": 2813} {"train_loss": -24.92903709411621, "global_step": 233500, "epoch": 2813} {"train_loss": -25.070575714111328, "global_step": 233501, "epoch": 2813} {"train_loss": -24.916303634643555, "global_step": 233502, "epoch": 2813} {"train_loss": -24.972375869750977, "global_step": 233503, "epoch": 2813} {"train_loss": -24.6293888092041, "global_step": 233504, "epoch": 2813} {"train_loss": -24.932584762573242, "global_step": 233505, "epoch": 2813} {"train_loss": -24.75486183166504, "global_step": 233506, "epoch": 2813} {"train_loss": -25.295114517211914, "global_step": 233507, "epoch": 2813} {"train_loss": -24.60099220275879, "global_step": 233508, "epoch": 2813} {"train_loss": -24.12457847595215, "global_step": 233509, "epoch": 2813} {"train_loss": -24.451021194458008, "global_step": 233510, "epoch": 2813} {"train_loss": -24.866918563842773, "global_step": 233511, "epoch": 2813} {"train_loss": -24.48859214782715, "global_step": 233512, "epoch": 2813} {"train_loss": -24.844133377075195, "global_step": 233513, "epoch": 2813} {"train_loss": -24.13448143005371, "global_step": 233514, "epoch": 2813} {"train_loss": -24.610692977905273, "global_step": 233515, "epoch": 2813} {"train_loss": -24.368457794189453, "global_step": 233516, "epoch": 2813} {"train_loss": -24.55500602722168, "global_step": 233517, "epoch": 2813} {"train_loss": -24.809452056884766, "global_step": 233518, "epoch": 2813} {"train_loss": -24.7401180267334, "global_step": 233519, "epoch": 2813} {"train_loss": -24.55653953552246, "global_step": 233520, "epoch": 2813} {"train_loss": -25.04929542541504, "global_step": 233521, "epoch": 2813} {"train_loss": -24.740365982055664, "global_step": 233522, "epoch": 2813} {"train_loss": -24.39299964904785, "global_step": 233523, "epoch": 2813} {"train_loss": -24.81339454650879, "global_step": 233524, "epoch": 2813} {"train_loss": -24.965564727783203, "global_step": 233525, "epoch": 2813} {"train_loss": -24.36985206604004, "global_step": 233526, "epoch": 2813} {"train_loss": -24.838546752929688, "global_step": 233527, "epoch": 2813} {"train_loss": -24.643083572387695, "global_step": 233528, "epoch": 2813} {"train_loss": -25.35491371154785, "global_step": 233529, "epoch": 2813} {"train_loss": -24.76337242126465, "global_step": 233530, "epoch": 2813} {"train_loss": -25.160552978515625, "global_step": 233531, "epoch": 2813} {"train_loss": -24.734994888305664, "global_step": 233532, "epoch": 2813} {"train_loss": -24.728837966918945, "global_step": 233533, "epoch": 2813} {"train_loss": -24.244897842407227, "global_step": 233534, "epoch": 2813} {"train_loss": -24.881351470947266, "global_step": 233535, "epoch": 2813} {"train_loss": -24.562026977539062, "global_step": 233536, "epoch": 2813} {"train_loss": -24.71402359008789, "global_step": 233537, "epoch": 2813} {"train_loss": -24.61273193359375, "global_step": 233538, "epoch": 2813} {"train_loss": -25.020893096923828, "global_step": 233539, "epoch": 2813} {"train_loss": -25.273178100585938, "global_step": 233540, "epoch": 2813} {"train_loss": -24.867456436157227, "global_step": 233541, "epoch": 2813} {"train_loss": -24.739974975585938, "global_step": 233542, "epoch": 2813} {"train_loss": -24.626142501831055, "global_step": 233543, "epoch": 2813} {"train_loss": -24.32062339782715, "global_step": 233544, "epoch": 2813} {"train_loss": -24.67513084411621, "global_step": 233545, "epoch": 2813} {"train_loss": -25.01667594909668, "global_step": 233546, "epoch": 2813} {"train_loss": -24.980314254760742, "global_step": 233547, "epoch": 2813} {"train_loss": -25.07462501525879, "global_step": 233548, "epoch": 2813} {"train_loss": -24.546106338500977, "global_step": 233549, "epoch": 2813} {"train_loss": -24.847354888916016, "global_step": 233550, "epoch": 2813} {"train_loss": -24.791479110717773, "global_step": 233551, "epoch": 2813} {"train_loss": -24.793563842773438, "global_step": 233552, "epoch": 2813} {"train_loss": -24.470426559448242, "global_step": 233553, "epoch": 2813} {"train_loss": -24.85013198852539, "global_step": 233554, "epoch": 2813} {"train_loss": -25.055517196655273, "global_step": 233555, "epoch": 2813} {"train_loss": -24.662199020385742, "global_step": 233556, "epoch": 2813} {"train_loss": -24.64662742614746, "global_step": 233557, "epoch": 2813} {"train_loss": -24.902494430541992, "global_step": 233558, "epoch": 2813} {"train_loss": -24.51873207092285, "global_step": 233559, "epoch": 2813} {"train_loss": -24.599273681640625, "global_step": 233560, "epoch": 2813} {"train_loss": -24.763249569628613, "global_step": 233561, "epoch": 2813, "val_loss": 6781231.0} {"train_loss": -22.334659576416016, "global_step": 233562, "epoch": 2814} {"train_loss": -22.448122024536133, "global_step": 233563, "epoch": 2814} {"train_loss": -23.763364791870117, "global_step": 233564, "epoch": 2814} {"train_loss": -23.812503814697266, "global_step": 233565, "epoch": 2814} {"train_loss": -24.017900466918945, "global_step": 233566, "epoch": 2814} {"train_loss": -23.530261993408203, "global_step": 233567, "epoch": 2814} {"train_loss": -23.925344467163086, "global_step": 233568, "epoch": 2814} {"train_loss": -23.941068649291992, "global_step": 233569, "epoch": 2814} {"train_loss": -24.0157413482666, "global_step": 233570, "epoch": 2814} {"train_loss": -24.177358627319336, "global_step": 233571, "epoch": 2814} {"train_loss": -24.329381942749023, "global_step": 233572, "epoch": 2814} {"train_loss": -24.54758071899414, "global_step": 233573, "epoch": 2814} {"train_loss": -24.44593620300293, "global_step": 233574, "epoch": 2814} {"train_loss": -24.740087509155273, "global_step": 233575, "epoch": 2814} {"train_loss": -24.500062942504883, "global_step": 233576, "epoch": 2814} {"train_loss": -24.506513595581055, "global_step": 233577, "epoch": 2814} {"train_loss": -24.466150283813477, "global_step": 233578, "epoch": 2814} {"train_loss": -24.131864547729492, "global_step": 233579, "epoch": 2814} {"train_loss": -24.262447357177734, "global_step": 233580, "epoch": 2814} {"train_loss": -24.74890899658203, "global_step": 233581, "epoch": 2814} {"train_loss": -24.377609252929688, "global_step": 233582, "epoch": 2814} {"train_loss": -24.303754806518555, "global_step": 233583, "epoch": 2814} {"train_loss": -24.552358627319336, "global_step": 233584, "epoch": 2814} {"train_loss": -24.395841598510742, "global_step": 233585, "epoch": 2814} {"train_loss": -24.925615310668945, "global_step": 233586, "epoch": 2814} {"train_loss": -24.723379135131836, "global_step": 233587, "epoch": 2814} {"train_loss": -24.2707576751709, "global_step": 233588, "epoch": 2814} {"train_loss": -24.57102394104004, "global_step": 233589, "epoch": 2814} {"train_loss": -24.62723159790039, "global_step": 233590, "epoch": 2814} {"train_loss": -24.961580276489258, "global_step": 233591, "epoch": 2814} {"train_loss": -24.75999641418457, "global_step": 233592, "epoch": 2814} {"train_loss": -24.52440071105957, "global_step": 233593, "epoch": 2814} {"train_loss": -24.711759567260742, "global_step": 233594, "epoch": 2814} {"train_loss": -24.691476821899414, "global_step": 233595, "epoch": 2814} {"train_loss": -24.736648559570312, "global_step": 233596, "epoch": 2814} {"train_loss": -24.500518798828125, "global_step": 233597, "epoch": 2814} {"train_loss": -24.288043975830078, "global_step": 233598, "epoch": 2814} {"train_loss": -24.51136589050293, "global_step": 233599, "epoch": 2814} {"train_loss": -24.8121280670166, "global_step": 233600, "epoch": 2814} {"train_loss": -24.65730857849121, "global_step": 233601, "epoch": 2814} {"train_loss": -24.68726348876953, "global_step": 233602, "epoch": 2814} {"train_loss": -25.123552322387695, "global_step": 233603, "epoch": 2814} {"train_loss": -25.001516342163086, "global_step": 233604, "epoch": 2814} {"train_loss": -25.01618766784668, "global_step": 233605, "epoch": 2814} {"train_loss": -24.873937606811523, "global_step": 233606, "epoch": 2814} {"train_loss": -24.860919952392578, "global_step": 233607, "epoch": 2814} {"train_loss": -24.9704532623291, "global_step": 233608, "epoch": 2814} {"train_loss": -24.89171028137207, "global_step": 233609, "epoch": 2814} {"train_loss": -25.02451515197754, "global_step": 233610, "epoch": 2814} {"train_loss": -25.036266326904297, "global_step": 233611, "epoch": 2814} {"train_loss": -24.88924789428711, "global_step": 233612, "epoch": 2814} {"train_loss": -24.957202911376953, "global_step": 233613, "epoch": 2814} {"train_loss": -25.115522384643555, "global_step": 233614, "epoch": 2814} {"train_loss": -24.663955688476562, "global_step": 233615, "epoch": 2814} {"train_loss": -24.48872184753418, "global_step": 233616, "epoch": 2814} {"train_loss": -24.702255249023438, "global_step": 233617, "epoch": 2814} {"train_loss": -24.89710807800293, "global_step": 233618, "epoch": 2814} {"train_loss": -25.16376304626465, "global_step": 233619, "epoch": 2814} {"train_loss": -24.903465270996094, "global_step": 233620, "epoch": 2814} {"train_loss": -24.854644775390625, "global_step": 233621, "epoch": 2814} {"train_loss": -25.105138778686523, "global_step": 233622, "epoch": 2814} {"train_loss": -24.693151473999023, "global_step": 233623, "epoch": 2814} {"train_loss": -24.90569496154785, "global_step": 233624, "epoch": 2814} {"train_loss": -25.127670288085938, "global_step": 233625, "epoch": 2814} {"train_loss": -24.9842472076416, "global_step": 233626, "epoch": 2814} {"train_loss": -24.88414764404297, "global_step": 233627, "epoch": 2814} {"train_loss": -24.985288619995117, "global_step": 233628, "epoch": 2814} {"train_loss": -24.437931060791016, "global_step": 233629, "epoch": 2814} {"train_loss": -24.90386390686035, "global_step": 233630, "epoch": 2814} {"train_loss": -24.836380004882812, "global_step": 233631, "epoch": 2814} {"train_loss": -24.706640243530273, "global_step": 233632, "epoch": 2814} {"train_loss": -24.81732749938965, "global_step": 233633, "epoch": 2814} {"train_loss": -24.80624771118164, "global_step": 233634, "epoch": 2814} {"train_loss": -24.72440528869629, "global_step": 233635, "epoch": 2814} {"train_loss": -25.278907775878906, "global_step": 233636, "epoch": 2814} {"train_loss": -24.86421012878418, "global_step": 233637, "epoch": 2814} {"train_loss": -24.640350341796875, "global_step": 233638, "epoch": 2814} {"train_loss": -24.87007713317871, "global_step": 233639, "epoch": 2814} {"train_loss": -24.622711181640625, "global_step": 233640, "epoch": 2814} {"train_loss": -24.74717140197754, "global_step": 233641, "epoch": 2814} {"train_loss": -24.816930770874023, "global_step": 233642, "epoch": 2814} {"train_loss": -24.66195297241211, "global_step": 233643, "epoch": 2814} {"train_loss": -24.583962727742023, "global_step": 233644, "epoch": 2814, "val_loss": 6777422.0} {"train_loss": -24.38823890686035, "global_step": 233645, "epoch": 2815} {"train_loss": -24.04465675354004, "global_step": 233646, "epoch": 2815} {"train_loss": -24.9514102935791, "global_step": 233647, "epoch": 2815} {"train_loss": -24.15656089782715, "global_step": 233648, "epoch": 2815} {"train_loss": -24.641006469726562, "global_step": 233649, "epoch": 2815} {"train_loss": -24.75978660583496, "global_step": 233650, "epoch": 2815} {"train_loss": -24.971914291381836, "global_step": 233651, "epoch": 2815} {"train_loss": -24.47747230529785, "global_step": 233652, "epoch": 2815} {"train_loss": -25.01041030883789, "global_step": 233653, "epoch": 2815} {"train_loss": -24.52378273010254, "global_step": 233654, "epoch": 2815} {"train_loss": -24.723569869995117, "global_step": 233655, "epoch": 2815} {"train_loss": -24.48341941833496, "global_step": 233656, "epoch": 2815} {"train_loss": -24.840679168701172, "global_step": 233657, "epoch": 2815} {"train_loss": -24.29544448852539, "global_step": 233658, "epoch": 2815} {"train_loss": -24.79848289489746, "global_step": 233659, "epoch": 2815} {"train_loss": -24.745174407958984, "global_step": 233660, "epoch": 2815} {"train_loss": -24.519683837890625, "global_step": 233661, "epoch": 2815} {"train_loss": -24.85127830505371, "global_step": 233662, "epoch": 2815} {"train_loss": -24.475934982299805, "global_step": 233663, "epoch": 2815} {"train_loss": -25.062850952148438, "global_step": 233664, "epoch": 2815} {"train_loss": -24.506765365600586, "global_step": 233665, "epoch": 2815} {"train_loss": -24.472314834594727, "global_step": 233666, "epoch": 2815} {"train_loss": -24.978544235229492, "global_step": 233667, "epoch": 2815} {"train_loss": -24.825223922729492, "global_step": 233668, "epoch": 2815} {"train_loss": -24.74173355102539, "global_step": 233669, "epoch": 2815} {"train_loss": -24.66908073425293, "global_step": 233670, "epoch": 2815} {"train_loss": -24.22659683227539, "global_step": 233671, "epoch": 2815} {"train_loss": -24.770475387573242, "global_step": 233672, "epoch": 2815} {"train_loss": -25.019773483276367, "global_step": 233673, "epoch": 2815} {"train_loss": -25.025243759155273, "global_step": 233674, "epoch": 2815} {"train_loss": -24.511686325073242, "global_step": 233675, "epoch": 2815} {"train_loss": -24.85128402709961, "global_step": 233676, "epoch": 2815} {"train_loss": -25.06520652770996, "global_step": 233677, "epoch": 2815} {"train_loss": -25.064443588256836, "global_step": 233678, "epoch": 2815} {"train_loss": -24.734310150146484, "global_step": 233679, "epoch": 2815} {"train_loss": -24.76820945739746, "global_step": 233680, "epoch": 2815} {"train_loss": -25.030920028686523, "global_step": 233681, "epoch": 2815} {"train_loss": -24.963253021240234, "global_step": 233682, "epoch": 2815} {"train_loss": -24.696523666381836, "global_step": 233683, "epoch": 2815} {"train_loss": -25.160179138183594, "global_step": 233684, "epoch": 2815} {"train_loss": -24.768035888671875, "global_step": 233685, "epoch": 2815} {"train_loss": -25.1489200592041, "global_step": 233686, "epoch": 2815} {"train_loss": -24.67897605895996, "global_step": 233687, "epoch": 2815} {"train_loss": -25.374183654785156, "global_step": 233688, "epoch": 2815} {"train_loss": -24.871774673461914, "global_step": 233689, "epoch": 2815} {"train_loss": -25.016836166381836, "global_step": 233690, "epoch": 2815} {"train_loss": -24.8702392578125, "global_step": 233691, "epoch": 2815} {"train_loss": -25.116540908813477, "global_step": 233692, "epoch": 2815} {"train_loss": -24.71595573425293, "global_step": 233693, "epoch": 2815} {"train_loss": -24.830766677856445, "global_step": 233694, "epoch": 2815} {"train_loss": -24.510961532592773, "global_step": 233695, "epoch": 2815} {"train_loss": -24.669158935546875, "global_step": 233696, "epoch": 2815} {"train_loss": -24.56368637084961, "global_step": 233697, "epoch": 2815} {"train_loss": -24.93422508239746, "global_step": 233698, "epoch": 2815} {"train_loss": -24.63722038269043, "global_step": 233699, "epoch": 2815} {"train_loss": -24.564512252807617, "global_step": 233700, "epoch": 2815} {"train_loss": -24.691556930541992, "global_step": 233701, "epoch": 2815} {"train_loss": -24.8762149810791, "global_step": 233702, "epoch": 2815} {"train_loss": -25.108768463134766, "global_step": 233703, "epoch": 2815} {"train_loss": -24.57906150817871, "global_step": 233704, "epoch": 2815} {"train_loss": -24.908395767211914, "global_step": 233705, "epoch": 2815} {"train_loss": -25.30573081970215, "global_step": 233706, "epoch": 2815} {"train_loss": -24.47128677368164, "global_step": 233707, "epoch": 2815} {"train_loss": -24.740089416503906, "global_step": 233708, "epoch": 2815} {"train_loss": -24.782087326049805, "global_step": 233709, "epoch": 2815} {"train_loss": -25.140722274780273, "global_step": 233710, "epoch": 2815} {"train_loss": -25.07748031616211, "global_step": 233711, "epoch": 2815} {"train_loss": -24.45509910583496, "global_step": 233712, "epoch": 2815} {"train_loss": -24.447561264038086, "global_step": 233713, "epoch": 2815} {"train_loss": -25.06114387512207, "global_step": 233714, "epoch": 2815} {"train_loss": -25.2650089263916, "global_step": 233715, "epoch": 2815} {"train_loss": -25.14298439025879, "global_step": 233716, "epoch": 2815} {"train_loss": -24.573352813720703, "global_step": 233717, "epoch": 2815} {"train_loss": -24.860313415527344, "global_step": 233718, "epoch": 2815} {"train_loss": -24.48917579650879, "global_step": 233719, "epoch": 2815} {"train_loss": -24.63801383972168, "global_step": 233720, "epoch": 2815} {"train_loss": -24.704214096069336, "global_step": 233721, "epoch": 2815} {"train_loss": -25.2404842376709, "global_step": 233722, "epoch": 2815} {"train_loss": -24.58685874938965, "global_step": 233723, "epoch": 2815} {"train_loss": -24.558862686157227, "global_step": 233724, "epoch": 2815} {"train_loss": -24.985620498657227, "global_step": 233725, "epoch": 2815} {"train_loss": -25.138486862182617, "global_step": 233726, "epoch": 2815} {"train_loss": -24.7796562148864, "global_step": 233727, "epoch": 2815, "val_loss": 6691446.0} {"train_loss": -24.203393936157227, "global_step": 233728, "epoch": 2816} {"train_loss": -24.391691207885742, "global_step": 233729, "epoch": 2816} {"train_loss": -24.112340927124023, "global_step": 233730, "epoch": 2816} {"train_loss": -24.455337524414062, "global_step": 233731, "epoch": 2816} {"train_loss": -24.516489028930664, "global_step": 233732, "epoch": 2816} {"train_loss": -24.538259506225586, "global_step": 233733, "epoch": 2816} {"train_loss": -24.809268951416016, "global_step": 233734, "epoch": 2816} {"train_loss": -24.541051864624023, "global_step": 233735, "epoch": 2816} {"train_loss": -24.70754051208496, "global_step": 233736, "epoch": 2816} {"train_loss": -24.54645347595215, "global_step": 233737, "epoch": 2816} {"train_loss": -24.8916015625, "global_step": 233738, "epoch": 2816} {"train_loss": -24.78314781188965, "global_step": 233739, "epoch": 2816} {"train_loss": -24.783071517944336, "global_step": 233740, "epoch": 2816} {"train_loss": -24.83937644958496, "global_step": 233741, "epoch": 2816} {"train_loss": -24.897748947143555, "global_step": 233742, "epoch": 2816} {"train_loss": -24.736602783203125, "global_step": 233743, "epoch": 2816} {"train_loss": -25.157306671142578, "global_step": 233744, "epoch": 2816} {"train_loss": -24.68885612487793, "global_step": 233745, "epoch": 2816} {"train_loss": -25.076784133911133, "global_step": 233746, "epoch": 2816} {"train_loss": -24.727256774902344, "global_step": 233747, "epoch": 2816} {"train_loss": -24.848779678344727, "global_step": 233748, "epoch": 2816} {"train_loss": -24.66292381286621, "global_step": 233749, "epoch": 2816} {"train_loss": -24.622880935668945, "global_step": 233750, "epoch": 2816} {"train_loss": -25.020246505737305, "global_step": 233751, "epoch": 2816} {"train_loss": -24.717838287353516, "global_step": 233752, "epoch": 2816} {"train_loss": -24.8750057220459, "global_step": 233753, "epoch": 2816} {"train_loss": -24.5252685546875, "global_step": 233754, "epoch": 2816} {"train_loss": -24.741226196289062, "global_step": 233755, "epoch": 2816} {"train_loss": -24.79520034790039, "global_step": 233756, "epoch": 2816} {"train_loss": -24.98521614074707, "global_step": 233757, "epoch": 2816} {"train_loss": -24.96998405456543, "global_step": 233758, "epoch": 2816} {"train_loss": -24.811079025268555, "global_step": 233759, "epoch": 2816} {"train_loss": -24.55032730102539, "global_step": 233760, "epoch": 2816} {"train_loss": -24.980009078979492, "global_step": 233761, "epoch": 2816} {"train_loss": -24.494932174682617, "global_step": 233762, "epoch": 2816} {"train_loss": -24.931764602661133, "global_step": 233763, "epoch": 2816} {"train_loss": -24.621889114379883, "global_step": 233764, "epoch": 2816} {"train_loss": -24.418445587158203, "global_step": 233765, "epoch": 2816} {"train_loss": -24.785680770874023, "global_step": 233766, "epoch": 2816} {"train_loss": -24.782194137573242, "global_step": 233767, "epoch": 2816} {"train_loss": -24.893156051635742, "global_step": 233768, "epoch": 2816} {"train_loss": -24.736574172973633, "global_step": 233769, "epoch": 2816} {"train_loss": -25.151105880737305, "global_step": 233770, "epoch": 2816} {"train_loss": -25.32215690612793, "global_step": 233771, "epoch": 2816} {"train_loss": -24.64186668395996, "global_step": 233772, "epoch": 2816} {"train_loss": -24.814542770385742, "global_step": 233773, "epoch": 2816} {"train_loss": -24.521299362182617, "global_step": 233774, "epoch": 2816} {"train_loss": -24.67095375061035, "global_step": 233775, "epoch": 2816} {"train_loss": -24.731504440307617, "global_step": 233776, "epoch": 2816} {"train_loss": -25.048093795776367, "global_step": 233777, "epoch": 2816} {"train_loss": -24.689435958862305, "global_step": 233778, "epoch": 2816} {"train_loss": -24.446792602539062, "global_step": 233779, "epoch": 2816} {"train_loss": -24.651071548461914, "global_step": 233780, "epoch": 2816} {"train_loss": -24.58819007873535, "global_step": 233781, "epoch": 2816} {"train_loss": -24.378393173217773, "global_step": 233782, "epoch": 2816} {"train_loss": -25.06307029724121, "global_step": 233783, "epoch": 2816} {"train_loss": -24.745838165283203, "global_step": 233784, "epoch": 2816} {"train_loss": -24.80870819091797, "global_step": 233785, "epoch": 2816} {"train_loss": -24.72321319580078, "global_step": 233786, "epoch": 2816} {"train_loss": -24.45430564880371, "global_step": 233787, "epoch": 2816} {"train_loss": -24.606454849243164, "global_step": 233788, "epoch": 2816} {"train_loss": -24.3822021484375, "global_step": 233789, "epoch": 2816} {"train_loss": -24.807188034057617, "global_step": 233790, "epoch": 2816} {"train_loss": -24.524587631225586, "global_step": 233791, "epoch": 2816} {"train_loss": -24.535253524780273, "global_step": 233792, "epoch": 2816} {"train_loss": -25.042339324951172, "global_step": 233793, "epoch": 2816} {"train_loss": -24.834415435791016, "global_step": 233794, "epoch": 2816} {"train_loss": -24.746313095092773, "global_step": 233795, "epoch": 2816} {"train_loss": -24.82712745666504, "global_step": 233796, "epoch": 2816} {"train_loss": -25.033384323120117, "global_step": 233797, "epoch": 2816} {"train_loss": -24.800750732421875, "global_step": 233798, "epoch": 2816} {"train_loss": -24.787073135375977, "global_step": 233799, "epoch": 2816} {"train_loss": -24.803016662597656, "global_step": 233800, "epoch": 2816} {"train_loss": -24.789030075073242, "global_step": 233801, "epoch": 2816} {"train_loss": -25.159257888793945, "global_step": 233802, "epoch": 2816} {"train_loss": -24.85738182067871, "global_step": 233803, "epoch": 2816} {"train_loss": -24.832761764526367, "global_step": 233804, "epoch": 2816} {"train_loss": -24.39169692993164, "global_step": 233805, "epoch": 2816} {"train_loss": -25.02771759033203, "global_step": 233806, "epoch": 2816} {"train_loss": -24.44744873046875, "global_step": 233807, "epoch": 2816} {"train_loss": -24.532197952270508, "global_step": 233808, "epoch": 2816} {"train_loss": -24.770410537719727, "global_step": 233809, "epoch": 2816} {"train_loss": -24.725207248366022, "global_step": 233810, "epoch": 2816, "val_loss": 6765451.0} {"train_loss": -24.77435874938965, "global_step": 233811, "epoch": 2817} {"train_loss": -24.41120719909668, "global_step": 233812, "epoch": 2817} {"train_loss": -24.84912109375, "global_step": 233813, "epoch": 2817} {"train_loss": -24.43390464782715, "global_step": 233814, "epoch": 2817} {"train_loss": -24.668989181518555, "global_step": 233815, "epoch": 2817} {"train_loss": -24.44388198852539, "global_step": 233816, "epoch": 2817} {"train_loss": -24.367412567138672, "global_step": 233817, "epoch": 2817} {"train_loss": -24.49618911743164, "global_step": 233818, "epoch": 2817} {"train_loss": -24.21765899658203, "global_step": 233819, "epoch": 2817} {"train_loss": -24.554391860961914, "global_step": 233820, "epoch": 2817} {"train_loss": -24.107465744018555, "global_step": 233821, "epoch": 2817} {"train_loss": -24.777374267578125, "global_step": 233822, "epoch": 2817} {"train_loss": -24.72865867614746, "global_step": 233823, "epoch": 2817} {"train_loss": -24.83879280090332, "global_step": 233824, "epoch": 2817} {"train_loss": -24.703351974487305, "global_step": 233825, "epoch": 2817} {"train_loss": -24.722911834716797, "global_step": 233826, "epoch": 2817} {"train_loss": -24.587446212768555, "global_step": 233827, "epoch": 2817} {"train_loss": -24.411893844604492, "global_step": 233828, "epoch": 2817} {"train_loss": -24.62390899658203, "global_step": 233829, "epoch": 2817} {"train_loss": -24.62360191345215, "global_step": 233830, "epoch": 2817} {"train_loss": -25.039846420288086, "global_step": 233831, "epoch": 2817} {"train_loss": -24.600875854492188, "global_step": 233832, "epoch": 2817} {"train_loss": -24.55008316040039, "global_step": 233833, "epoch": 2817} {"train_loss": -24.516178131103516, "global_step": 233834, "epoch": 2817} {"train_loss": -24.915063858032227, "global_step": 233835, "epoch": 2817} {"train_loss": -24.798954010009766, "global_step": 233836, "epoch": 2817} {"train_loss": -24.813745498657227, "global_step": 233837, "epoch": 2817} {"train_loss": -24.818374633789062, "global_step": 233838, "epoch": 2817} {"train_loss": -24.7379207611084, "global_step": 233839, "epoch": 2817} {"train_loss": -25.130826950073242, "global_step": 233840, "epoch": 2817} {"train_loss": -24.675992965698242, "global_step": 233841, "epoch": 2817} {"train_loss": -24.993160247802734, "global_step": 233842, "epoch": 2817} {"train_loss": -24.742612838745117, "global_step": 233843, "epoch": 2817} {"train_loss": -24.868026733398438, "global_step": 233844, "epoch": 2817} {"train_loss": -24.8900146484375, "global_step": 233845, "epoch": 2817} {"train_loss": -25.17561149597168, "global_step": 233846, "epoch": 2817} {"train_loss": -25.08250617980957, "global_step": 233847, "epoch": 2817} {"train_loss": -24.69891357421875, "global_step": 233848, "epoch": 2817} {"train_loss": -24.815383911132812, "global_step": 233849, "epoch": 2817} {"train_loss": -24.426057815551758, "global_step": 233850, "epoch": 2817} {"train_loss": -25.14344596862793, "global_step": 233851, "epoch": 2817} {"train_loss": -24.647241592407227, "global_step": 233852, "epoch": 2817} {"train_loss": -24.760900497436523, "global_step": 233853, "epoch": 2817} {"train_loss": -24.801715850830078, "global_step": 233854, "epoch": 2817} {"train_loss": -25.075191497802734, "global_step": 233855, "epoch": 2817} {"train_loss": -24.694032669067383, "global_step": 233856, "epoch": 2817} {"train_loss": -24.78705406188965, "global_step": 233857, "epoch": 2817} {"train_loss": -24.66433334350586, "global_step": 233858, "epoch": 2817} {"train_loss": -24.698911666870117, "global_step": 233859, "epoch": 2817} {"train_loss": -25.1682186126709, "global_step": 233860, "epoch": 2817} {"train_loss": -24.90264320373535, "global_step": 233861, "epoch": 2817} {"train_loss": -24.974706649780273, "global_step": 233862, "epoch": 2817} {"train_loss": -24.84174919128418, "global_step": 233863, "epoch": 2817} {"train_loss": -24.774490356445312, "global_step": 233864, "epoch": 2817} {"train_loss": -24.659067153930664, "global_step": 233865, "epoch": 2817} {"train_loss": -24.734628677368164, "global_step": 233866, "epoch": 2817} {"train_loss": -24.903196334838867, "global_step": 233867, "epoch": 2817} {"train_loss": -25.03644371032715, "global_step": 233868, "epoch": 2817} {"train_loss": -24.843141555786133, "global_step": 233869, "epoch": 2817} {"train_loss": -24.887231826782227, "global_step": 233870, "epoch": 2817} {"train_loss": -24.5664005279541, "global_step": 233871, "epoch": 2817} {"train_loss": -24.527164459228516, "global_step": 233872, "epoch": 2817} {"train_loss": -24.62906837463379, "global_step": 233873, "epoch": 2817} {"train_loss": -24.468427658081055, "global_step": 233874, "epoch": 2817} {"train_loss": -24.7056941986084, "global_step": 233875, "epoch": 2817} {"train_loss": -24.990758895874023, "global_step": 233876, "epoch": 2817} {"train_loss": -24.33382225036621, "global_step": 233877, "epoch": 2817} {"train_loss": -25.04937744140625, "global_step": 233878, "epoch": 2817} {"train_loss": -25.055891036987305, "global_step": 233879, "epoch": 2817} {"train_loss": -24.502737045288086, "global_step": 233880, "epoch": 2817} {"train_loss": -24.6252384185791, "global_step": 233881, "epoch": 2817} {"train_loss": -24.79816246032715, "global_step": 233882, "epoch": 2817} {"train_loss": -24.74798583984375, "global_step": 233883, "epoch": 2817} {"train_loss": -24.51264762878418, "global_step": 233884, "epoch": 2817} {"train_loss": -24.657045364379883, "global_step": 233885, "epoch": 2817} {"train_loss": -25.03684425354004, "global_step": 233886, "epoch": 2817} {"train_loss": -24.723501205444336, "global_step": 233887, "epoch": 2817} {"train_loss": -24.621976852416992, "global_step": 233888, "epoch": 2817} {"train_loss": -24.982526779174805, "global_step": 233889, "epoch": 2817} {"train_loss": -24.973834991455078, "global_step": 233890, "epoch": 2817} {"train_loss": -24.906574249267578, "global_step": 233891, "epoch": 2817} {"train_loss": -24.48624610900879, "global_step": 233892, "epoch": 2817} {"train_loss": -24.740214818931488, "global_step": 233893, "epoch": 2817, "val_loss": 6777251.0} {"train_loss": -24.483366012573242, "global_step": 233894, "epoch": 2818} {"train_loss": -24.199621200561523, "global_step": 233895, "epoch": 2818} {"train_loss": -24.51974868774414, "global_step": 233896, "epoch": 2818} {"train_loss": -24.48823356628418, "global_step": 233897, "epoch": 2818} {"train_loss": -24.599592208862305, "global_step": 233898, "epoch": 2818} {"train_loss": -24.459793090820312, "global_step": 233899, "epoch": 2818} {"train_loss": -24.588319778442383, "global_step": 233900, "epoch": 2818} {"train_loss": -24.346200942993164, "global_step": 233901, "epoch": 2818} {"train_loss": -24.610584259033203, "global_step": 233902, "epoch": 2818} {"train_loss": -24.33051872253418, "global_step": 233903, "epoch": 2818} {"train_loss": -24.602827072143555, "global_step": 233904, "epoch": 2818} {"train_loss": -24.302724838256836, "global_step": 233905, "epoch": 2818} {"train_loss": -24.468454360961914, "global_step": 233906, "epoch": 2818} {"train_loss": -24.505695343017578, "global_step": 233907, "epoch": 2818} {"train_loss": -24.400039672851562, "global_step": 233908, "epoch": 2818} {"train_loss": -24.90772247314453, "global_step": 233909, "epoch": 2818} {"train_loss": -24.461835861206055, "global_step": 233910, "epoch": 2818} {"train_loss": -24.715225219726562, "global_step": 233911, "epoch": 2818} {"train_loss": -24.774391174316406, "global_step": 233912, "epoch": 2818} {"train_loss": -24.8977108001709, "global_step": 233913, "epoch": 2818} {"train_loss": -24.84326934814453, "global_step": 233914, "epoch": 2818} {"train_loss": -24.848163604736328, "global_step": 233915, "epoch": 2818} {"train_loss": -24.8266658782959, "global_step": 233916, "epoch": 2818} {"train_loss": -24.552074432373047, "global_step": 233917, "epoch": 2818} {"train_loss": -24.563501358032227, "global_step": 233918, "epoch": 2818} {"train_loss": -24.564380645751953, "global_step": 233919, "epoch": 2818} {"train_loss": -24.76078224182129, "global_step": 233920, "epoch": 2818} {"train_loss": -24.6978816986084, "global_step": 233921, "epoch": 2818} {"train_loss": -24.706405639648438, "global_step": 233922, "epoch": 2818} {"train_loss": -24.746896743774414, "global_step": 233923, "epoch": 2818} {"train_loss": -24.89674186706543, "global_step": 233924, "epoch": 2818} {"train_loss": -24.984434127807617, "global_step": 233925, "epoch": 2818} {"train_loss": -24.903724670410156, "global_step": 233926, "epoch": 2818} {"train_loss": -24.976043701171875, "global_step": 233927, "epoch": 2818} {"train_loss": -24.824604034423828, "global_step": 233928, "epoch": 2818} {"train_loss": -24.890317916870117, "global_step": 233929, "epoch": 2818} {"train_loss": -24.9359188079834, "global_step": 233930, "epoch": 2818} {"train_loss": -24.828495025634766, "global_step": 233931, "epoch": 2818} {"train_loss": -24.809247970581055, "global_step": 233932, "epoch": 2818} {"train_loss": -25.141115188598633, "global_step": 233933, "epoch": 2818} {"train_loss": -24.82917594909668, "global_step": 233934, "epoch": 2818} {"train_loss": -24.8398494720459, "global_step": 233935, "epoch": 2818} {"train_loss": -24.56918716430664, "global_step": 233936, "epoch": 2818} {"train_loss": -24.83157730102539, "global_step": 233937, "epoch": 2818} {"train_loss": -24.746915817260742, "global_step": 233938, "epoch": 2818} {"train_loss": -24.684907913208008, "global_step": 233939, "epoch": 2818} {"train_loss": -25.13771629333496, "global_step": 233940, "epoch": 2818} {"train_loss": -24.848106384277344, "global_step": 233941, "epoch": 2818} {"train_loss": -24.839197158813477, "global_step": 233942, "epoch": 2818} {"train_loss": -24.63462257385254, "global_step": 233943, "epoch": 2818} {"train_loss": -24.896013259887695, "global_step": 233944, "epoch": 2818} {"train_loss": -24.980825424194336, "global_step": 233945, "epoch": 2818} {"train_loss": -24.601709365844727, "global_step": 233946, "epoch": 2818} {"train_loss": -24.340099334716797, "global_step": 233947, "epoch": 2818} {"train_loss": -24.361164093017578, "global_step": 233948, "epoch": 2818} {"train_loss": -24.934995651245117, "global_step": 233949, "epoch": 2818} {"train_loss": -24.806360244750977, "global_step": 233950, "epoch": 2818} {"train_loss": -24.911151885986328, "global_step": 233951, "epoch": 2818} {"train_loss": -24.795595169067383, "global_step": 233952, "epoch": 2818} {"train_loss": -25.161352157592773, "global_step": 233953, "epoch": 2818} {"train_loss": -24.914365768432617, "global_step": 233954, "epoch": 2818} {"train_loss": -24.702844619750977, "global_step": 233955, "epoch": 2818} {"train_loss": -25.105972290039062, "global_step": 233956, "epoch": 2818} {"train_loss": -24.790451049804688, "global_step": 233957, "epoch": 2818} {"train_loss": -24.89641571044922, "global_step": 233958, "epoch": 2818} {"train_loss": -24.98951530456543, "global_step": 233959, "epoch": 2818} {"train_loss": -24.983739852905273, "global_step": 233960, "epoch": 2818} {"train_loss": -25.15803337097168, "global_step": 233961, "epoch": 2818} {"train_loss": -25.116586685180664, "global_step": 233962, "epoch": 2818} {"train_loss": -25.238605499267578, "global_step": 233963, "epoch": 2818} {"train_loss": -24.34903907775879, "global_step": 233964, "epoch": 2818} {"train_loss": -25.17030906677246, "global_step": 233965, "epoch": 2818} {"train_loss": -24.86832046508789, "global_step": 233966, "epoch": 2818} {"train_loss": -24.977405548095703, "global_step": 233967, "epoch": 2818} {"train_loss": -25.156503677368164, "global_step": 233968, "epoch": 2818} {"train_loss": -25.069120407104492, "global_step": 233969, "epoch": 2818} {"train_loss": -24.81039810180664, "global_step": 233970, "epoch": 2818} {"train_loss": -25.156227111816406, "global_step": 233971, "epoch": 2818} {"train_loss": -24.680831909179688, "global_step": 233972, "epoch": 2818} {"train_loss": -24.82341957092285, "global_step": 233973, "epoch": 2818} {"train_loss": -24.58907127380371, "global_step": 233974, "epoch": 2818} {"train_loss": -24.736265182495117, "global_step": 233975, "epoch": 2818} {"train_loss": -24.778888702392578, "global_step": 233976, "epoch": 2818, "val_loss": 6660722.0} {"train_loss": -22.8525447845459, "global_step": 233977, "epoch": 2819} {"train_loss": -22.180456161499023, "global_step": 233978, "epoch": 2819} {"train_loss": -22.95989227294922, "global_step": 233979, "epoch": 2819} {"train_loss": -23.274660110473633, "global_step": 233980, "epoch": 2819} {"train_loss": -23.50270652770996, "global_step": 233981, "epoch": 2819} {"train_loss": -24.33997917175293, "global_step": 233982, "epoch": 2819} {"train_loss": -23.97120475769043, "global_step": 233983, "epoch": 2819} {"train_loss": -24.174436569213867, "global_step": 233984, "epoch": 2819} {"train_loss": -23.98160171508789, "global_step": 233985, "epoch": 2819} {"train_loss": -24.20551872253418, "global_step": 233986, "epoch": 2819} {"train_loss": -24.26795768737793, "global_step": 233987, "epoch": 2819} {"train_loss": -23.915180206298828, "global_step": 233988, "epoch": 2819} {"train_loss": -24.308813095092773, "global_step": 233989, "epoch": 2819} {"train_loss": -24.088226318359375, "global_step": 233990, "epoch": 2819} {"train_loss": -24.138471603393555, "global_step": 233991, "epoch": 2819} {"train_loss": -24.04979705810547, "global_step": 233992, "epoch": 2819} {"train_loss": -24.16425323486328, "global_step": 233993, "epoch": 2819} {"train_loss": -24.404558181762695, "global_step": 233994, "epoch": 2819} {"train_loss": -24.6087646484375, "global_step": 233995, "epoch": 2819} {"train_loss": -24.494321823120117, "global_step": 233996, "epoch": 2819} {"train_loss": -24.17560386657715, "global_step": 233997, "epoch": 2819} {"train_loss": -24.507307052612305, "global_step": 233998, "epoch": 2819} {"train_loss": -24.035655975341797, "global_step": 233999, "epoch": 2819} {"train_loss": -24.81894302368164, "global_step": 234000, "epoch": 2819} {"train_loss": -24.22262191772461, "global_step": 234001, "epoch": 2819} {"train_loss": -24.732097625732422, "global_step": 234002, "epoch": 2819} {"train_loss": -24.825870513916016, "global_step": 234003, "epoch": 2819} {"train_loss": -24.890993118286133, "global_step": 234004, "epoch": 2819} {"train_loss": -24.21063804626465, "global_step": 234005, "epoch": 2819} {"train_loss": -24.73781394958496, "global_step": 234006, "epoch": 2819} {"train_loss": -24.7313175201416, "global_step": 234007, "epoch": 2819} {"train_loss": -24.883651733398438, "global_step": 234008, "epoch": 2819} {"train_loss": -24.664228439331055, "global_step": 234009, "epoch": 2819} {"train_loss": -25.146997451782227, "global_step": 234010, "epoch": 2819} {"train_loss": -24.865461349487305, "global_step": 234011, "epoch": 2819} {"train_loss": -24.97921371459961, "global_step": 234012, "epoch": 2819} {"train_loss": -24.680097579956055, "global_step": 234013, "epoch": 2819} {"train_loss": -24.644426345825195, "global_step": 234014, "epoch": 2819} {"train_loss": -24.541364669799805, "global_step": 234015, "epoch": 2819} {"train_loss": -24.7369327545166, "global_step": 234016, "epoch": 2819} {"train_loss": -24.80044937133789, "global_step": 234017, "epoch": 2819} {"train_loss": -24.572919845581055, "global_step": 234018, "epoch": 2819} {"train_loss": -24.80047035217285, "global_step": 234019, "epoch": 2819} {"train_loss": -25.137495040893555, "global_step": 234020, "epoch": 2819} {"train_loss": -24.738195419311523, "global_step": 234021, "epoch": 2819} {"train_loss": -24.903039932250977, "global_step": 234022, "epoch": 2819} {"train_loss": -25.082387924194336, "global_step": 234023, "epoch": 2819} {"train_loss": -24.928709030151367, "global_step": 234024, "epoch": 2819} {"train_loss": -24.87229347229004, "global_step": 234025, "epoch": 2819} {"train_loss": -25.019824981689453, "global_step": 234026, "epoch": 2819} {"train_loss": -24.721466064453125, "global_step": 234027, "epoch": 2819} {"train_loss": -24.808979034423828, "global_step": 234028, "epoch": 2819} {"train_loss": -24.71143913269043, "global_step": 234029, "epoch": 2819} {"train_loss": -25.087818145751953, "global_step": 234030, "epoch": 2819} {"train_loss": -25.190214157104492, "global_step": 234031, "epoch": 2819} {"train_loss": -24.6180477142334, "global_step": 234032, "epoch": 2819} {"train_loss": -24.92527198791504, "global_step": 234033, "epoch": 2819} {"train_loss": -25.00486183166504, "global_step": 234034, "epoch": 2819} {"train_loss": -24.419668197631836, "global_step": 234035, "epoch": 2819} {"train_loss": -24.908878326416016, "global_step": 234036, "epoch": 2819} {"train_loss": -24.82347297668457, "global_step": 234037, "epoch": 2819} {"train_loss": -24.858474731445312, "global_step": 234038, "epoch": 2819} {"train_loss": -23.863845825195312, "global_step": 234039, "epoch": 2819} {"train_loss": -23.631935119628906, "global_step": 234040, "epoch": 2819} {"train_loss": -23.529836654663086, "global_step": 234041, "epoch": 2819} {"train_loss": -25.0289363861084, "global_step": 234042, "epoch": 2819} {"train_loss": -24.587360382080078, "global_step": 234043, "epoch": 2819} {"train_loss": -24.68811798095703, "global_step": 234044, "epoch": 2819} {"train_loss": -24.420259475708008, "global_step": 234045, "epoch": 2819} {"train_loss": -24.561660766601562, "global_step": 234046, "epoch": 2819} {"train_loss": -24.0224552154541, "global_step": 234047, "epoch": 2819} {"train_loss": -24.820598602294922, "global_step": 234048, "epoch": 2819} {"train_loss": -24.640779495239258, "global_step": 234049, "epoch": 2819} {"train_loss": -24.516395568847656, "global_step": 234050, "epoch": 2819} {"train_loss": -24.27107048034668, "global_step": 234051, "epoch": 2819} {"train_loss": -24.775259017944336, "global_step": 234052, "epoch": 2819} {"train_loss": -24.681148529052734, "global_step": 234053, "epoch": 2819} {"train_loss": -24.762380599975586, "global_step": 234054, "epoch": 2819} {"train_loss": -24.7442569732666, "global_step": 234055, "epoch": 2819} {"train_loss": -25.02668571472168, "global_step": 234056, "epoch": 2819} {"train_loss": -24.813674926757812, "global_step": 234057, "epoch": 2819} {"train_loss": -24.1568660736084, "global_step": 234058, "epoch": 2819} {"train_loss": -24.468989291823053, "global_step": 234059, "epoch": 2819, "val_loss": 6722737.0} {"train_loss": -24.609174728393555, "global_step": 234060, "epoch": 2820} {"train_loss": -24.723976135253906, "global_step": 234061, "epoch": 2820} {"train_loss": -24.539865493774414, "global_step": 234062, "epoch": 2820} {"train_loss": -24.811384201049805, "global_step": 234063, "epoch": 2820} {"train_loss": -24.45936393737793, "global_step": 234064, "epoch": 2820} {"train_loss": -24.6363468170166, "global_step": 234065, "epoch": 2820} {"train_loss": -24.741458892822266, "global_step": 234066, "epoch": 2820} {"train_loss": -24.89008903503418, "global_step": 234067, "epoch": 2820} {"train_loss": -24.80440902709961, "global_step": 234068, "epoch": 2820} {"train_loss": -24.774080276489258, "global_step": 234069, "epoch": 2820} {"train_loss": -24.81321144104004, "global_step": 234070, "epoch": 2820} {"train_loss": -24.986597061157227, "global_step": 234071, "epoch": 2820} {"train_loss": -25.078550338745117, "global_step": 234072, "epoch": 2820} {"train_loss": -24.842512130737305, "global_step": 234073, "epoch": 2820} {"train_loss": -24.797454833984375, "global_step": 234074, "epoch": 2820} {"train_loss": -25.064645767211914, "global_step": 234075, "epoch": 2820} {"train_loss": -24.900129318237305, "global_step": 234076, "epoch": 2820} {"train_loss": -24.874797821044922, "global_step": 234077, "epoch": 2820} {"train_loss": -25.02317237854004, "global_step": 234078, "epoch": 2820} {"train_loss": -24.791568756103516, "global_step": 234079, "epoch": 2820} {"train_loss": -25.317874908447266, "global_step": 234080, "epoch": 2820} {"train_loss": -24.81373405456543, "global_step": 234081, "epoch": 2820} {"train_loss": -24.946414947509766, "global_step": 234082, "epoch": 2820} {"train_loss": -24.87434196472168, "global_step": 234083, "epoch": 2820} {"train_loss": -24.80445671081543, "global_step": 234084, "epoch": 2820} {"train_loss": -24.836477279663086, "global_step": 234085, "epoch": 2820} {"train_loss": -24.9455623626709, "global_step": 234086, "epoch": 2820} {"train_loss": -24.914621353149414, "global_step": 234087, "epoch": 2820} {"train_loss": -24.762697219848633, "global_step": 234088, "epoch": 2820} {"train_loss": -24.788467407226562, "global_step": 234089, "epoch": 2820} {"train_loss": -24.85713768005371, "global_step": 234090, "epoch": 2820} {"train_loss": -24.753610610961914, "global_step": 234091, "epoch": 2820} {"train_loss": -25.020809173583984, "global_step": 234092, "epoch": 2820} {"train_loss": -24.438352584838867, "global_step": 234093, "epoch": 2820} {"train_loss": -24.58375358581543, "global_step": 234094, "epoch": 2820} {"train_loss": -24.719482421875, "global_step": 234095, "epoch": 2820} {"train_loss": -24.985570907592773, "global_step": 234096, "epoch": 2820} {"train_loss": -24.893497467041016, "global_step": 234097, "epoch": 2820} {"train_loss": -24.63404655456543, "global_step": 234098, "epoch": 2820} {"train_loss": -24.924367904663086, "global_step": 234099, "epoch": 2820} {"train_loss": -24.66008186340332, "global_step": 234100, "epoch": 2820} {"train_loss": -24.66615867614746, "global_step": 234101, "epoch": 2820} {"train_loss": -24.766080856323242, "global_step": 234102, "epoch": 2820} {"train_loss": -24.867712020874023, "global_step": 234103, "epoch": 2820} {"train_loss": -25.237878799438477, "global_step": 234104, "epoch": 2820} {"train_loss": -24.915063858032227, "global_step": 234105, "epoch": 2820} {"train_loss": -24.76751708984375, "global_step": 234106, "epoch": 2820} {"train_loss": -24.41631507873535, "global_step": 234107, "epoch": 2820} {"train_loss": -25.2342586517334, "global_step": 234108, "epoch": 2820} {"train_loss": -24.595102310180664, "global_step": 234109, "epoch": 2820} {"train_loss": -24.995311737060547, "global_step": 234110, "epoch": 2820} {"train_loss": -24.801555633544922, "global_step": 234111, "epoch": 2820} {"train_loss": -24.52068519592285, "global_step": 234112, "epoch": 2820} {"train_loss": -24.703218460083008, "global_step": 234113, "epoch": 2820} {"train_loss": -24.75632095336914, "global_step": 234114, "epoch": 2820} {"train_loss": -25.106952667236328, "global_step": 234115, "epoch": 2820} {"train_loss": -24.59934425354004, "global_step": 234116, "epoch": 2820} {"train_loss": -24.864282608032227, "global_step": 234117, "epoch": 2820} {"train_loss": -24.927946090698242, "global_step": 234118, "epoch": 2820} {"train_loss": -24.881269454956055, "global_step": 234119, "epoch": 2820} {"train_loss": -25.0296630859375, "global_step": 234120, "epoch": 2820} {"train_loss": -24.75003433227539, "global_step": 234121, "epoch": 2820} {"train_loss": -24.700897216796875, "global_step": 234122, "epoch": 2820} {"train_loss": -24.670597076416016, "global_step": 234123, "epoch": 2820} {"train_loss": -24.82366371154785, "global_step": 234124, "epoch": 2820} {"train_loss": -25.094970703125, "global_step": 234125, "epoch": 2820} {"train_loss": -25.265897750854492, "global_step": 234126, "epoch": 2820} {"train_loss": -24.77635955810547, "global_step": 234127, "epoch": 2820} {"train_loss": -24.912982940673828, "global_step": 234128, "epoch": 2820} {"train_loss": -24.928634643554688, "global_step": 234129, "epoch": 2820} {"train_loss": -24.83705711364746, "global_step": 234130, "epoch": 2820} {"train_loss": -24.91843605041504, "global_step": 234131, "epoch": 2820} {"train_loss": -25.309885025024414, "global_step": 234132, "epoch": 2820} {"train_loss": -25.09632682800293, "global_step": 234133, "epoch": 2820} {"train_loss": -24.815685272216797, "global_step": 234134, "epoch": 2820} {"train_loss": -25.080638885498047, "global_step": 234135, "epoch": 2820} {"train_loss": -25.131256103515625, "global_step": 234136, "epoch": 2820} {"train_loss": -24.870471954345703, "global_step": 234137, "epoch": 2820} {"train_loss": -24.775068283081055, "global_step": 234138, "epoch": 2820} {"train_loss": -24.806915283203125, "global_step": 234139, "epoch": 2820} {"train_loss": -24.915380477905273, "global_step": 234140, "epoch": 2820} {"train_loss": -24.978647232055664, "global_step": 234141, "epoch": 2820} {"train_loss": -24.847447039133094, "global_step": 234142, "epoch": 2820, "val_loss": 6719691.0} {"train_loss": -19.758825302124023, "global_step": 234143, "epoch": 2821} {"train_loss": -20.39788818359375, "global_step": 234144, "epoch": 2821} {"train_loss": -23.284255981445312, "global_step": 234145, "epoch": 2821} {"train_loss": -23.103534698486328, "global_step": 234146, "epoch": 2821} {"train_loss": -23.76253890991211, "global_step": 234147, "epoch": 2821} {"train_loss": -23.253173828125, "global_step": 234148, "epoch": 2821} {"train_loss": -23.857168197631836, "global_step": 234149, "epoch": 2821} {"train_loss": -23.6102294921875, "global_step": 234150, "epoch": 2821} {"train_loss": -23.90120506286621, "global_step": 234151, "epoch": 2821} {"train_loss": -23.624622344970703, "global_step": 234152, "epoch": 2821} {"train_loss": -23.980939865112305, "global_step": 234153, "epoch": 2821} {"train_loss": -23.557912826538086, "global_step": 234154, "epoch": 2821} {"train_loss": -24.012582778930664, "global_step": 234155, "epoch": 2821} {"train_loss": -23.82293128967285, "global_step": 234156, "epoch": 2821} {"train_loss": -23.833555221557617, "global_step": 234157, "epoch": 2821} {"train_loss": -24.043106079101562, "global_step": 234158, "epoch": 2821} {"train_loss": -23.827713012695312, "global_step": 234159, "epoch": 2821} {"train_loss": -24.14977264404297, "global_step": 234160, "epoch": 2821} {"train_loss": -23.81157875061035, "global_step": 234161, "epoch": 2821} {"train_loss": -24.350467681884766, "global_step": 234162, "epoch": 2821} {"train_loss": -24.220722198486328, "global_step": 234163, "epoch": 2821} {"train_loss": -24.010807037353516, "global_step": 234164, "epoch": 2821} {"train_loss": -24.26117515563965, "global_step": 234165, "epoch": 2821} {"train_loss": -24.293867111206055, "global_step": 234166, "epoch": 2821} {"train_loss": -24.580612182617188, "global_step": 234167, "epoch": 2821} {"train_loss": -24.26650619506836, "global_step": 234168, "epoch": 2821} {"train_loss": -24.40210723876953, "global_step": 234169, "epoch": 2821} {"train_loss": -24.13663101196289, "global_step": 234170, "epoch": 2821} {"train_loss": -24.315046310424805, "global_step": 234171, "epoch": 2821} {"train_loss": -24.909019470214844, "global_step": 234172, "epoch": 2821} {"train_loss": -23.98196792602539, "global_step": 234173, "epoch": 2821} {"train_loss": -24.629934310913086, "global_step": 234174, "epoch": 2821} {"train_loss": -24.630353927612305, "global_step": 234175, "epoch": 2821} {"train_loss": -24.672332763671875, "global_step": 234176, "epoch": 2821} {"train_loss": -24.638710021972656, "global_step": 234177, "epoch": 2821} {"train_loss": -24.40286636352539, "global_step": 234178, "epoch": 2821} {"train_loss": -24.54954719543457, "global_step": 234179, "epoch": 2821} {"train_loss": -25.37181854248047, "global_step": 234180, "epoch": 2821} {"train_loss": -24.418001174926758, "global_step": 234181, "epoch": 2821} {"train_loss": -24.482023239135742, "global_step": 234182, "epoch": 2821} {"train_loss": -24.524215698242188, "global_step": 234183, "epoch": 2821} {"train_loss": -24.77895164489746, "global_step": 234184, "epoch": 2821} {"train_loss": -24.896133422851562, "global_step": 234185, "epoch": 2821} {"train_loss": -24.374364852905273, "global_step": 234186, "epoch": 2821} {"train_loss": -24.90925407409668, "global_step": 234187, "epoch": 2821} {"train_loss": -25.042001724243164, "global_step": 234188, "epoch": 2821} {"train_loss": -24.83438491821289, "global_step": 234189, "epoch": 2821} {"train_loss": -24.910009384155273, "global_step": 234190, "epoch": 2821} {"train_loss": -25.15119171142578, "global_step": 234191, "epoch": 2821} {"train_loss": -24.81557273864746, "global_step": 234192, "epoch": 2821} {"train_loss": -24.665203094482422, "global_step": 234193, "epoch": 2821} {"train_loss": -24.9578914642334, "global_step": 234194, "epoch": 2821} {"train_loss": -24.742338180541992, "global_step": 234195, "epoch": 2821} {"train_loss": -24.871967315673828, "global_step": 234196, "epoch": 2821} {"train_loss": -24.613933563232422, "global_step": 234197, "epoch": 2821} {"train_loss": -24.818933486938477, "global_step": 234198, "epoch": 2821} {"train_loss": -25.042612075805664, "global_step": 234199, "epoch": 2821} {"train_loss": -24.930503845214844, "global_step": 234200, "epoch": 2821} {"train_loss": -24.82857894897461, "global_step": 234201, "epoch": 2821} {"train_loss": -24.718809127807617, "global_step": 234202, "epoch": 2821} {"train_loss": -24.88997459411621, "global_step": 234203, "epoch": 2821} {"train_loss": -25.10905647277832, "global_step": 234204, "epoch": 2821} {"train_loss": -25.027244567871094, "global_step": 234205, "epoch": 2821} {"train_loss": -24.47100067138672, "global_step": 234206, "epoch": 2821} {"train_loss": -25.022878646850586, "global_step": 234207, "epoch": 2821} {"train_loss": -24.684934616088867, "global_step": 234208, "epoch": 2821} {"train_loss": -24.898191452026367, "global_step": 234209, "epoch": 2821} {"train_loss": -24.782135009765625, "global_step": 234210, "epoch": 2821} {"train_loss": -25.074853897094727, "global_step": 234211, "epoch": 2821} {"train_loss": -25.05002784729004, "global_step": 234212, "epoch": 2821} {"train_loss": -24.400630950927734, "global_step": 234213, "epoch": 2821} {"train_loss": -24.494291305541992, "global_step": 234214, "epoch": 2821} {"train_loss": -25.18587875366211, "global_step": 234215, "epoch": 2821} {"train_loss": -24.710968017578125, "global_step": 234216, "epoch": 2821} {"train_loss": -24.848600387573242, "global_step": 234217, "epoch": 2821} {"train_loss": -25.27464485168457, "global_step": 234218, "epoch": 2821} {"train_loss": -24.897672653198242, "global_step": 234219, "epoch": 2821} {"train_loss": -24.98256492614746, "global_step": 234220, "epoch": 2821} {"train_loss": -24.74104881286621, "global_step": 234221, "epoch": 2821} {"train_loss": -24.68560218811035, "global_step": 234222, "epoch": 2821} {"train_loss": -24.810182571411133, "global_step": 234223, "epoch": 2821} {"train_loss": -24.745840072631836, "global_step": 234224, "epoch": 2821} {"train_loss": -24.395195604806922, "global_step": 234225, "epoch": 2821, "val_loss": 6619479.0} {"train_loss": -23.94881820678711, "global_step": 234226, "epoch": 2822} {"train_loss": -24.442581176757812, "global_step": 234227, "epoch": 2822} {"train_loss": -24.481338500976562, "global_step": 234228, "epoch": 2822} {"train_loss": -24.040523529052734, "global_step": 234229, "epoch": 2822} {"train_loss": -24.455148696899414, "global_step": 234230, "epoch": 2822} {"train_loss": -23.858999252319336, "global_step": 234231, "epoch": 2822} {"train_loss": -23.812847137451172, "global_step": 234232, "epoch": 2822} {"train_loss": -24.74258804321289, "global_step": 234233, "epoch": 2822} {"train_loss": -24.689743041992188, "global_step": 234234, "epoch": 2822} {"train_loss": -24.542272567749023, "global_step": 234235, "epoch": 2822} {"train_loss": -24.492786407470703, "global_step": 234236, "epoch": 2822} {"train_loss": -24.458189010620117, "global_step": 234237, "epoch": 2822} {"train_loss": -24.514083862304688, "global_step": 234238, "epoch": 2822} {"train_loss": -24.3972110748291, "global_step": 234239, "epoch": 2822} {"train_loss": -24.362293243408203, "global_step": 234240, "epoch": 2822} {"train_loss": -24.433856964111328, "global_step": 234241, "epoch": 2822} {"train_loss": -24.729475021362305, "global_step": 234242, "epoch": 2822} {"train_loss": -24.72456169128418, "global_step": 234243, "epoch": 2822} {"train_loss": -24.637868881225586, "global_step": 234244, "epoch": 2822} {"train_loss": -24.340381622314453, "global_step": 234245, "epoch": 2822} {"train_loss": -24.630172729492188, "global_step": 234246, "epoch": 2822} {"train_loss": -24.863019943237305, "global_step": 234247, "epoch": 2822} {"train_loss": -24.919462203979492, "global_step": 234248, "epoch": 2822} {"train_loss": -24.964645385742188, "global_step": 234249, "epoch": 2822} {"train_loss": -24.633989334106445, "global_step": 234250, "epoch": 2822} {"train_loss": -24.536569595336914, "global_step": 234251, "epoch": 2822} {"train_loss": -24.737730026245117, "global_step": 234252, "epoch": 2822} {"train_loss": -24.552274703979492, "global_step": 234253, "epoch": 2822} {"train_loss": -24.67193603515625, "global_step": 234254, "epoch": 2822} {"train_loss": -24.912092208862305, "global_step": 234255, "epoch": 2822} {"train_loss": -24.708057403564453, "global_step": 234256, "epoch": 2822} {"train_loss": -24.82862663269043, "global_step": 234257, "epoch": 2822} {"train_loss": -24.79787254333496, "global_step": 234258, "epoch": 2822} {"train_loss": -24.887075424194336, "global_step": 234259, "epoch": 2822} {"train_loss": -24.87977409362793, "global_step": 234260, "epoch": 2822} {"train_loss": -25.0660457611084, "global_step": 234261, "epoch": 2822} {"train_loss": -25.25370979309082, "global_step": 234262, "epoch": 2822} {"train_loss": -24.737329483032227, "global_step": 234263, "epoch": 2822} {"train_loss": -25.079587936401367, "global_step": 234264, "epoch": 2822} {"train_loss": -24.71474266052246, "global_step": 234265, "epoch": 2822} {"train_loss": -24.88053321838379, "global_step": 234266, "epoch": 2822} {"train_loss": -24.7152042388916, "global_step": 234267, "epoch": 2822} {"train_loss": -25.218303680419922, "global_step": 234268, "epoch": 2822} {"train_loss": -24.642892837524414, "global_step": 234269, "epoch": 2822} {"train_loss": -24.8369083404541, "global_step": 234270, "epoch": 2822} {"train_loss": -24.73659324645996, "global_step": 234271, "epoch": 2822} {"train_loss": -25.248838424682617, "global_step": 234272, "epoch": 2822} {"train_loss": -25.33843421936035, "global_step": 234273, "epoch": 2822} {"train_loss": -24.884632110595703, "global_step": 234274, "epoch": 2822} {"train_loss": -24.687503814697266, "global_step": 234275, "epoch": 2822} {"train_loss": -24.93002700805664, "global_step": 234276, "epoch": 2822} {"train_loss": -25.013471603393555, "global_step": 234277, "epoch": 2822} {"train_loss": -24.546361923217773, "global_step": 234278, "epoch": 2822} {"train_loss": -24.803659439086914, "global_step": 234279, "epoch": 2822} {"train_loss": -24.612688064575195, "global_step": 234280, "epoch": 2822} {"train_loss": -25.200437545776367, "global_step": 234281, "epoch": 2822} {"train_loss": -24.988073348999023, "global_step": 234282, "epoch": 2822} {"train_loss": -24.579212188720703, "global_step": 234283, "epoch": 2822} {"train_loss": -24.40413475036621, "global_step": 234284, "epoch": 2822} {"train_loss": -24.96866798400879, "global_step": 234285, "epoch": 2822} {"train_loss": -24.86945915222168, "global_step": 234286, "epoch": 2822} {"train_loss": -24.98585319519043, "global_step": 234287, "epoch": 2822} {"train_loss": -24.9350528717041, "global_step": 234288, "epoch": 2822} {"train_loss": -24.81646156311035, "global_step": 234289, "epoch": 2822} {"train_loss": -25.19029426574707, "global_step": 234290, "epoch": 2822} {"train_loss": -24.785551071166992, "global_step": 234291, "epoch": 2822} {"train_loss": -25.01028060913086, "global_step": 234292, "epoch": 2822} {"train_loss": -24.666107177734375, "global_step": 234293, "epoch": 2822} {"train_loss": -24.944150924682617, "global_step": 234294, "epoch": 2822} {"train_loss": -24.565847396850586, "global_step": 234295, "epoch": 2822} {"train_loss": -24.919591903686523, "global_step": 234296, "epoch": 2822} {"train_loss": -25.08616065979004, "global_step": 234297, "epoch": 2822} {"train_loss": -24.89630699157715, "global_step": 234298, "epoch": 2822} {"train_loss": -24.50133514404297, "global_step": 234299, "epoch": 2822} {"train_loss": -24.446449279785156, "global_step": 234300, "epoch": 2822} {"train_loss": -24.6553897857666, "global_step": 234301, "epoch": 2822} {"train_loss": -24.503402709960938, "global_step": 234302, "epoch": 2822} {"train_loss": -24.827713012695312, "global_step": 234303, "epoch": 2822} {"train_loss": -24.639957427978516, "global_step": 234304, "epoch": 2822} {"train_loss": -24.52581214904785, "global_step": 234305, "epoch": 2822} {"train_loss": -24.485305786132812, "global_step": 234306, "epoch": 2822} {"train_loss": -24.56279754638672, "global_step": 234307, "epoch": 2822} {"train_loss": -24.716983933046638, "global_step": 234308, "epoch": 2822, "val_loss": 6744534.5} {"train_loss": -24.1361026763916, "global_step": 234309, "epoch": 2823} {"train_loss": -24.19022560119629, "global_step": 234310, "epoch": 2823} {"train_loss": -24.378345489501953, "global_step": 234311, "epoch": 2823} {"train_loss": -24.371448516845703, "global_step": 234312, "epoch": 2823} {"train_loss": -24.414024353027344, "global_step": 234313, "epoch": 2823} {"train_loss": -24.576955795288086, "global_step": 234314, "epoch": 2823} {"train_loss": -24.365665435791016, "global_step": 234315, "epoch": 2823} {"train_loss": -24.57444953918457, "global_step": 234316, "epoch": 2823} {"train_loss": -24.372802734375, "global_step": 234317, "epoch": 2823} {"train_loss": -24.265323638916016, "global_step": 234318, "epoch": 2823} {"train_loss": -24.519495010375977, "global_step": 234319, "epoch": 2823} {"train_loss": -24.652061462402344, "global_step": 234320, "epoch": 2823} {"train_loss": -24.546432495117188, "global_step": 234321, "epoch": 2823} {"train_loss": -24.07492446899414, "global_step": 234322, "epoch": 2823} {"train_loss": -24.448108673095703, "global_step": 234323, "epoch": 2823} {"train_loss": -24.556629180908203, "global_step": 234324, "epoch": 2823} {"train_loss": -24.15082359313965, "global_step": 234325, "epoch": 2823} {"train_loss": -24.721668243408203, "global_step": 234326, "epoch": 2823} {"train_loss": -24.872936248779297, "global_step": 234327, "epoch": 2823} {"train_loss": -24.544124603271484, "global_step": 234328, "epoch": 2823} {"train_loss": -24.40750503540039, "global_step": 234329, "epoch": 2823} {"train_loss": -24.53138542175293, "global_step": 234330, "epoch": 2823} {"train_loss": -24.13153648376465, "global_step": 234331, "epoch": 2823} {"train_loss": -24.601104736328125, "global_step": 234332, "epoch": 2823} {"train_loss": -24.640594482421875, "global_step": 234333, "epoch": 2823} {"train_loss": -24.66607093811035, "global_step": 234334, "epoch": 2823} {"train_loss": -24.894773483276367, "global_step": 234335, "epoch": 2823} {"train_loss": -24.379701614379883, "global_step": 234336, "epoch": 2823} {"train_loss": -24.68927574157715, "global_step": 234337, "epoch": 2823} {"train_loss": -24.88719940185547, "global_step": 234338, "epoch": 2823} {"train_loss": -24.644495010375977, "global_step": 234339, "epoch": 2823} {"train_loss": -24.608097076416016, "global_step": 234340, "epoch": 2823} {"train_loss": -24.810049057006836, "global_step": 234341, "epoch": 2823} {"train_loss": -24.498632431030273, "global_step": 234342, "epoch": 2823} {"train_loss": -24.656829833984375, "global_step": 234343, "epoch": 2823} {"train_loss": -25.123611450195312, "global_step": 234344, "epoch": 2823} {"train_loss": -24.753253936767578, "global_step": 234345, "epoch": 2823} {"train_loss": -24.597900390625, "global_step": 234346, "epoch": 2823} {"train_loss": -25.21150016784668, "global_step": 234347, "epoch": 2823} {"train_loss": -24.532461166381836, "global_step": 234348, "epoch": 2823} {"train_loss": -24.862728118896484, "global_step": 234349, "epoch": 2823} {"train_loss": -24.924285888671875, "global_step": 234350, "epoch": 2823} {"train_loss": -24.951820373535156, "global_step": 234351, "epoch": 2823} {"train_loss": -24.625568389892578, "global_step": 234352, "epoch": 2823} {"train_loss": -24.683176040649414, "global_step": 234353, "epoch": 2823} {"train_loss": -24.772296905517578, "global_step": 234354, "epoch": 2823} {"train_loss": -24.467451095581055, "global_step": 234355, "epoch": 2823} {"train_loss": -24.50111198425293, "global_step": 234356, "epoch": 2823} {"train_loss": -25.095352172851562, "global_step": 234357, "epoch": 2823} {"train_loss": -24.682355880737305, "global_step": 234358, "epoch": 2823} {"train_loss": -24.875577926635742, "global_step": 234359, "epoch": 2823} {"train_loss": -24.744131088256836, "global_step": 234360, "epoch": 2823} {"train_loss": -25.11769676208496, "global_step": 234361, "epoch": 2823} {"train_loss": -24.573200225830078, "global_step": 234362, "epoch": 2823} {"train_loss": -24.515422821044922, "global_step": 234363, "epoch": 2823} {"train_loss": -24.57689094543457, "global_step": 234364, "epoch": 2823} {"train_loss": -24.84815788269043, "global_step": 234365, "epoch": 2823} {"train_loss": -24.624784469604492, "global_step": 234366, "epoch": 2823} {"train_loss": -24.9862060546875, "global_step": 234367, "epoch": 2823} {"train_loss": -24.791990280151367, "global_step": 234368, "epoch": 2823} {"train_loss": -24.80517578125, "global_step": 234369, "epoch": 2823} {"train_loss": -24.962350845336914, "global_step": 234370, "epoch": 2823} {"train_loss": -25.012481689453125, "global_step": 234371, "epoch": 2823} {"train_loss": -25.409099578857422, "global_step": 234372, "epoch": 2823} {"train_loss": -24.554471969604492, "global_step": 234373, "epoch": 2823} {"train_loss": -24.811948776245117, "global_step": 234374, "epoch": 2823} {"train_loss": -24.462499618530273, "global_step": 234375, "epoch": 2823} {"train_loss": -24.789045333862305, "global_step": 234376, "epoch": 2823} {"train_loss": -25.151716232299805, "global_step": 234377, "epoch": 2823} {"train_loss": -24.694793701171875, "global_step": 234378, "epoch": 2823} {"train_loss": -24.979999542236328, "global_step": 234379, "epoch": 2823} {"train_loss": -25.20892906188965, "global_step": 234380, "epoch": 2823} {"train_loss": -24.974658966064453, "global_step": 234381, "epoch": 2823} {"train_loss": -24.817630767822266, "global_step": 234382, "epoch": 2823} {"train_loss": -24.906558990478516, "global_step": 234383, "epoch": 2823} {"train_loss": -24.894195556640625, "global_step": 234384, "epoch": 2823} {"train_loss": -24.60774803161621, "global_step": 234385, "epoch": 2823} {"train_loss": -25.037384033203125, "global_step": 234386, "epoch": 2823} {"train_loss": -24.91650390625, "global_step": 234387, "epoch": 2823} {"train_loss": -24.722152709960938, "global_step": 234388, "epoch": 2823} {"train_loss": -24.95473861694336, "global_step": 234389, "epoch": 2823} {"train_loss": -25.163816452026367, "global_step": 234390, "epoch": 2823} {"train_loss": -24.70112625949354, "global_step": 234391, "epoch": 2823, "val_loss": 6751563.0} {"train_loss": -24.396678924560547, "global_step": 234392, "epoch": 2824} {"train_loss": -24.624799728393555, "global_step": 234393, "epoch": 2824} {"train_loss": -24.30372428894043, "global_step": 234394, "epoch": 2824} {"train_loss": -24.636964797973633, "global_step": 234395, "epoch": 2824} {"train_loss": -24.5986270904541, "global_step": 234396, "epoch": 2824} {"train_loss": -24.79660987854004, "global_step": 234397, "epoch": 2824} {"train_loss": -24.4112606048584, "global_step": 234398, "epoch": 2824} {"train_loss": -24.700653076171875, "global_step": 234399, "epoch": 2824} {"train_loss": -24.322872161865234, "global_step": 234400, "epoch": 2824} {"train_loss": -25.216577529907227, "global_step": 234401, "epoch": 2824} {"train_loss": -24.56141471862793, "global_step": 234402, "epoch": 2824} {"train_loss": -24.655988693237305, "global_step": 234403, "epoch": 2824} {"train_loss": -24.69082260131836, "global_step": 234404, "epoch": 2824} {"train_loss": -24.560115814208984, "global_step": 234405, "epoch": 2824} {"train_loss": -24.64035987854004, "global_step": 234406, "epoch": 2824} {"train_loss": -24.573686599731445, "global_step": 234407, "epoch": 2824} {"train_loss": -24.744991302490234, "global_step": 234408, "epoch": 2824} {"train_loss": -24.956907272338867, "global_step": 234409, "epoch": 2824} {"train_loss": -25.03675651550293, "global_step": 234410, "epoch": 2824} {"train_loss": -24.879911422729492, "global_step": 234411, "epoch": 2824} {"train_loss": -24.755741119384766, "global_step": 234412, "epoch": 2824} {"train_loss": -25.01090431213379, "global_step": 234413, "epoch": 2824} {"train_loss": -24.735097885131836, "global_step": 234414, "epoch": 2824} {"train_loss": -24.68246078491211, "global_step": 234415, "epoch": 2824} {"train_loss": -24.948822021484375, "global_step": 234416, "epoch": 2824} {"train_loss": -24.73372459411621, "global_step": 234417, "epoch": 2824} {"train_loss": -24.923505783081055, "global_step": 234418, "epoch": 2824} {"train_loss": -25.019519805908203, "global_step": 234419, "epoch": 2824} {"train_loss": -24.7792911529541, "global_step": 234420, "epoch": 2824} {"train_loss": -24.745420455932617, "global_step": 234421, "epoch": 2824} {"train_loss": -24.310272216796875, "global_step": 234422, "epoch": 2824} {"train_loss": -24.85332679748535, "global_step": 234423, "epoch": 2824} {"train_loss": -24.997173309326172, "global_step": 234424, "epoch": 2824} {"train_loss": -24.894989013671875, "global_step": 234425, "epoch": 2824} {"train_loss": -24.51698875427246, "global_step": 234426, "epoch": 2824} {"train_loss": -24.4504337310791, "global_step": 234427, "epoch": 2824} {"train_loss": -24.784835815429688, "global_step": 234428, "epoch": 2824} {"train_loss": -25.02943229675293, "global_step": 234429, "epoch": 2824} {"train_loss": -24.7901554107666, "global_step": 234430, "epoch": 2824} {"train_loss": -24.410154342651367, "global_step": 234431, "epoch": 2824} {"train_loss": -24.90087127685547, "global_step": 234432, "epoch": 2824} {"train_loss": -25.131473541259766, "global_step": 234433, "epoch": 2824} {"train_loss": -24.745594024658203, "global_step": 234434, "epoch": 2824} {"train_loss": -24.718765258789062, "global_step": 234435, "epoch": 2824} {"train_loss": -24.686765670776367, "global_step": 234436, "epoch": 2824} {"train_loss": -24.726720809936523, "global_step": 234437, "epoch": 2824} {"train_loss": -24.74247169494629, "global_step": 234438, "epoch": 2824} {"train_loss": -24.858522415161133, "global_step": 234439, "epoch": 2824} {"train_loss": -24.762731552124023, "global_step": 234440, "epoch": 2824} {"train_loss": -24.855642318725586, "global_step": 234441, "epoch": 2824} {"train_loss": -24.928754806518555, "global_step": 234442, "epoch": 2824} {"train_loss": -24.621816635131836, "global_step": 234443, "epoch": 2824} {"train_loss": -24.708566665649414, "global_step": 234444, "epoch": 2824} {"train_loss": -24.823593139648438, "global_step": 234445, "epoch": 2824} {"train_loss": -24.793743133544922, "global_step": 234446, "epoch": 2824} {"train_loss": -25.189281463623047, "global_step": 234447, "epoch": 2824} {"train_loss": -24.63136100769043, "global_step": 234448, "epoch": 2824} {"train_loss": -24.82826805114746, "global_step": 234449, "epoch": 2824} {"train_loss": -24.790435791015625, "global_step": 234450, "epoch": 2824} {"train_loss": -24.722707748413086, "global_step": 234451, "epoch": 2824} {"train_loss": -24.87845230102539, "global_step": 234452, "epoch": 2824} {"train_loss": -24.84291648864746, "global_step": 234453, "epoch": 2824} {"train_loss": -24.553115844726562, "global_step": 234454, "epoch": 2824} {"train_loss": -24.72031593322754, "global_step": 234455, "epoch": 2824} {"train_loss": -24.538278579711914, "global_step": 234456, "epoch": 2824} {"train_loss": -25.11829376220703, "global_step": 234457, "epoch": 2824} {"train_loss": -24.91200828552246, "global_step": 234458, "epoch": 2824} {"train_loss": -24.49613380432129, "global_step": 234459, "epoch": 2824} {"train_loss": -24.773893356323242, "global_step": 234460, "epoch": 2824} {"train_loss": -24.728445053100586, "global_step": 234461, "epoch": 2824} {"train_loss": -24.63079261779785, "global_step": 234462, "epoch": 2824} {"train_loss": -24.590688705444336, "global_step": 234463, "epoch": 2824} {"train_loss": -25.0736026763916, "global_step": 234464, "epoch": 2824} {"train_loss": -24.961759567260742, "global_step": 234465, "epoch": 2824} {"train_loss": -24.686765670776367, "global_step": 234466, "epoch": 2824} {"train_loss": -24.626062393188477, "global_step": 234467, "epoch": 2824} {"train_loss": -24.620243072509766, "global_step": 234468, "epoch": 2824} {"train_loss": -25.016645431518555, "global_step": 234469, "epoch": 2824} {"train_loss": -25.05690574645996, "global_step": 234470, "epoch": 2824} {"train_loss": -24.736663818359375, "global_step": 234471, "epoch": 2824} {"train_loss": -24.809158325195312, "global_step": 234472, "epoch": 2824} {"train_loss": -25.086353302001953, "global_step": 234473, "epoch": 2824} {"train_loss": -24.7516963682979, "global_step": 234474, "epoch": 2824, "val_loss": 6694758.0} {"train_loss": -23.517047882080078, "global_step": 234475, "epoch": 2825} {"train_loss": -22.011457443237305, "global_step": 234476, "epoch": 2825} {"train_loss": -24.48129653930664, "global_step": 234477, "epoch": 2825} {"train_loss": -23.85017204284668, "global_step": 234478, "epoch": 2825} {"train_loss": -23.803430557250977, "global_step": 234479, "epoch": 2825} {"train_loss": -24.19550895690918, "global_step": 234480, "epoch": 2825} {"train_loss": -23.903034210205078, "global_step": 234481, "epoch": 2825} {"train_loss": -24.674535751342773, "global_step": 234482, "epoch": 2825} {"train_loss": -23.924436569213867, "global_step": 234483, "epoch": 2825} {"train_loss": -24.59978675842285, "global_step": 234484, "epoch": 2825} {"train_loss": -24.01297378540039, "global_step": 234485, "epoch": 2825} {"train_loss": -24.25293731689453, "global_step": 234486, "epoch": 2825} {"train_loss": -24.15097427368164, "global_step": 234487, "epoch": 2825} {"train_loss": -24.197904586791992, "global_step": 234488, "epoch": 2825} {"train_loss": -24.48799705505371, "global_step": 234489, "epoch": 2825} {"train_loss": -24.49586296081543, "global_step": 234490, "epoch": 2825} {"train_loss": -24.623170852661133, "global_step": 234491, "epoch": 2825} {"train_loss": -24.565141677856445, "global_step": 234492, "epoch": 2825} {"train_loss": -24.384374618530273, "global_step": 234493, "epoch": 2825} {"train_loss": -24.33887481689453, "global_step": 234494, "epoch": 2825} {"train_loss": -24.2229061126709, "global_step": 234495, "epoch": 2825} {"train_loss": -24.498733520507812, "global_step": 234496, "epoch": 2825} {"train_loss": -24.156436920166016, "global_step": 234497, "epoch": 2825} {"train_loss": -24.632518768310547, "global_step": 234498, "epoch": 2825} {"train_loss": -24.394672393798828, "global_step": 234499, "epoch": 2825} {"train_loss": -24.507705688476562, "global_step": 234500, "epoch": 2825} {"train_loss": -24.765317916870117, "global_step": 234501, "epoch": 2825} {"train_loss": -24.524526596069336, "global_step": 234502, "epoch": 2825} {"train_loss": -24.900419235229492, "global_step": 234503, "epoch": 2825} {"train_loss": -25.00857925415039, "global_step": 234504, "epoch": 2825} {"train_loss": -24.913990020751953, "global_step": 234505, "epoch": 2825} {"train_loss": -24.903884887695312, "global_step": 234506, "epoch": 2825} {"train_loss": -24.980573654174805, "global_step": 234507, "epoch": 2825} {"train_loss": -24.878076553344727, "global_step": 234508, "epoch": 2825} {"train_loss": -24.824522018432617, "global_step": 234509, "epoch": 2825} {"train_loss": -24.8056697845459, "global_step": 234510, "epoch": 2825} {"train_loss": -25.149084091186523, "global_step": 234511, "epoch": 2825} {"train_loss": -24.964468002319336, "global_step": 234512, "epoch": 2825} {"train_loss": -25.10549545288086, "global_step": 234513, "epoch": 2825} {"train_loss": -25.05988121032715, "global_step": 234514, "epoch": 2825} {"train_loss": -24.865116119384766, "global_step": 234515, "epoch": 2825} {"train_loss": -24.668655395507812, "global_step": 234516, "epoch": 2825} {"train_loss": -24.945737838745117, "global_step": 234517, "epoch": 2825} {"train_loss": -25.23213768005371, "global_step": 234518, "epoch": 2825} {"train_loss": -24.632322311401367, "global_step": 234519, "epoch": 2825} {"train_loss": -24.940359115600586, "global_step": 234520, "epoch": 2825} {"train_loss": -24.9486141204834, "global_step": 234521, "epoch": 2825} {"train_loss": -25.176679611206055, "global_step": 234522, "epoch": 2825} {"train_loss": -24.824771881103516, "global_step": 234523, "epoch": 2825} {"train_loss": -24.614652633666992, "global_step": 234524, "epoch": 2825} {"train_loss": -24.941104888916016, "global_step": 234525, "epoch": 2825} {"train_loss": -24.950347900390625, "global_step": 234526, "epoch": 2825} {"train_loss": -25.046157836914062, "global_step": 234527, "epoch": 2825} {"train_loss": -24.848766326904297, "global_step": 234528, "epoch": 2825} {"train_loss": -24.9909725189209, "global_step": 234529, "epoch": 2825} {"train_loss": -24.992202758789062, "global_step": 234530, "epoch": 2825} {"train_loss": -24.720327377319336, "global_step": 234531, "epoch": 2825} {"train_loss": -25.02251434326172, "global_step": 234532, "epoch": 2825} {"train_loss": -24.821531295776367, "global_step": 234533, "epoch": 2825} {"train_loss": -25.071670532226562, "global_step": 234534, "epoch": 2825} {"train_loss": -24.816965103149414, "global_step": 234535, "epoch": 2825} {"train_loss": -24.86659812927246, "global_step": 234536, "epoch": 2825} {"train_loss": -24.787046432495117, "global_step": 234537, "epoch": 2825} {"train_loss": -24.8499813079834, "global_step": 234538, "epoch": 2825} {"train_loss": -25.20939826965332, "global_step": 234539, "epoch": 2825} {"train_loss": -25.159011840820312, "global_step": 234540, "epoch": 2825} {"train_loss": -24.683279037475586, "global_step": 234541, "epoch": 2825} {"train_loss": -25.049509048461914, "global_step": 234542, "epoch": 2825} {"train_loss": -24.631839752197266, "global_step": 234543, "epoch": 2825} {"train_loss": -24.918787002563477, "global_step": 234544, "epoch": 2825} {"train_loss": -25.02439308166504, "global_step": 234545, "epoch": 2825} {"train_loss": -25.210302352905273, "global_step": 234546, "epoch": 2825} {"train_loss": -24.747182846069336, "global_step": 234547, "epoch": 2825} {"train_loss": -24.652366638183594, "global_step": 234548, "epoch": 2825} {"train_loss": -25.029638290405273, "global_step": 234549, "epoch": 2825} {"train_loss": -24.66387939453125, "global_step": 234550, "epoch": 2825} {"train_loss": -25.00436782836914, "global_step": 234551, "epoch": 2825} {"train_loss": -24.534465789794922, "global_step": 234552, "epoch": 2825} {"train_loss": -24.691635131835938, "global_step": 234553, "epoch": 2825} {"train_loss": -24.75869369506836, "global_step": 234554, "epoch": 2825} {"train_loss": -24.74527931213379, "global_step": 234555, "epoch": 2825} {"train_loss": -24.260412216186523, "global_step": 234556, "epoch": 2825} {"train_loss": -24.658320231610034, "global_step": 234557, "epoch": 2825, "val_loss": 6698246.0} {"train_loss": -23.492481231689453, "global_step": 234558, "epoch": 2826} {"train_loss": -23.54573631286621, "global_step": 234559, "epoch": 2826} {"train_loss": -23.899494171142578, "global_step": 234560, "epoch": 2826} {"train_loss": -23.87631607055664, "global_step": 234561, "epoch": 2826} {"train_loss": -23.995466232299805, "global_step": 234562, "epoch": 2826} {"train_loss": -23.778593063354492, "global_step": 234563, "epoch": 2826} {"train_loss": -23.86676597595215, "global_step": 234564, "epoch": 2826} {"train_loss": -23.873868942260742, "global_step": 234565, "epoch": 2826} {"train_loss": -24.317792892456055, "global_step": 234566, "epoch": 2826} {"train_loss": -23.934131622314453, "global_step": 234567, "epoch": 2826} {"train_loss": -24.16719627380371, "global_step": 234568, "epoch": 2826} {"train_loss": -24.50394630432129, "global_step": 234569, "epoch": 2826} {"train_loss": -24.20821189880371, "global_step": 234570, "epoch": 2826} {"train_loss": -24.34612464904785, "global_step": 234571, "epoch": 2826} {"train_loss": -24.29935646057129, "global_step": 234572, "epoch": 2826} {"train_loss": -24.202533721923828, "global_step": 234573, "epoch": 2826} {"train_loss": -24.81817626953125, "global_step": 234574, "epoch": 2826} {"train_loss": -24.021289825439453, "global_step": 234575, "epoch": 2826} {"train_loss": -24.53232765197754, "global_step": 234576, "epoch": 2826} {"train_loss": -24.690174102783203, "global_step": 234577, "epoch": 2826} {"train_loss": -24.194204330444336, "global_step": 234578, "epoch": 2826} {"train_loss": -24.193265914916992, "global_step": 234579, "epoch": 2826} {"train_loss": -24.49751853942871, "global_step": 234580, "epoch": 2826} {"train_loss": -24.44329833984375, "global_step": 234581, "epoch": 2826} {"train_loss": -24.39371681213379, "global_step": 234582, "epoch": 2826} {"train_loss": -24.760038375854492, "global_step": 234583, "epoch": 2826} {"train_loss": -24.68572998046875, "global_step": 234584, "epoch": 2826} {"train_loss": -24.223241806030273, "global_step": 234585, "epoch": 2826} {"train_loss": -24.536680221557617, "global_step": 234586, "epoch": 2826} {"train_loss": -24.390735626220703, "global_step": 234587, "epoch": 2826} {"train_loss": -24.64594841003418, "global_step": 234588, "epoch": 2826} {"train_loss": -24.73805809020996, "global_step": 234589, "epoch": 2826} {"train_loss": -24.546878814697266, "global_step": 234590, "epoch": 2826} {"train_loss": -24.751026153564453, "global_step": 234591, "epoch": 2826} {"train_loss": -24.757373809814453, "global_step": 234592, "epoch": 2826} {"train_loss": -24.770160675048828, "global_step": 234593, "epoch": 2826} {"train_loss": -24.6643123626709, "global_step": 234594, "epoch": 2826} {"train_loss": -24.7468318939209, "global_step": 234595, "epoch": 2826} {"train_loss": -25.097932815551758, "global_step": 234596, "epoch": 2826} {"train_loss": -24.777847290039062, "global_step": 234597, "epoch": 2826} {"train_loss": -24.705408096313477, "global_step": 234598, "epoch": 2826} {"train_loss": -24.757253646850586, "global_step": 234599, "epoch": 2826} {"train_loss": -24.87041664123535, "global_step": 234600, "epoch": 2826} {"train_loss": -24.789844512939453, "global_step": 234601, "epoch": 2826} {"train_loss": -24.642292022705078, "global_step": 234602, "epoch": 2826} {"train_loss": -24.68326187133789, "global_step": 234603, "epoch": 2826} {"train_loss": -24.92791175842285, "global_step": 234604, "epoch": 2826} {"train_loss": -25.421987533569336, "global_step": 234605, "epoch": 2826} {"train_loss": -24.625242233276367, "global_step": 234606, "epoch": 2826} {"train_loss": -24.87014389038086, "global_step": 234607, "epoch": 2826} {"train_loss": -25.019147872924805, "global_step": 234608, "epoch": 2826} {"train_loss": -24.860692977905273, "global_step": 234609, "epoch": 2826} {"train_loss": -24.83979606628418, "global_step": 234610, "epoch": 2826} {"train_loss": -24.670095443725586, "global_step": 234611, "epoch": 2826} {"train_loss": -25.012235641479492, "global_step": 234612, "epoch": 2826} {"train_loss": -24.873048782348633, "global_step": 234613, "epoch": 2826} {"train_loss": -24.87518882751465, "global_step": 234614, "epoch": 2826} {"train_loss": -24.52997589111328, "global_step": 234615, "epoch": 2826} {"train_loss": -24.916549682617188, "global_step": 234616, "epoch": 2826} {"train_loss": -24.88636589050293, "global_step": 234617, "epoch": 2826} {"train_loss": -24.601119995117188, "global_step": 234618, "epoch": 2826} {"train_loss": -24.47267723083496, "global_step": 234619, "epoch": 2826} {"train_loss": -24.22479820251465, "global_step": 234620, "epoch": 2826} {"train_loss": -24.696409225463867, "global_step": 234621, "epoch": 2826} {"train_loss": -24.91267204284668, "global_step": 234622, "epoch": 2826} {"train_loss": -24.68889808654785, "global_step": 234623, "epoch": 2826} {"train_loss": -24.693517684936523, "global_step": 234624, "epoch": 2826} {"train_loss": -24.91609764099121, "global_step": 234625, "epoch": 2826} {"train_loss": -25.05340003967285, "global_step": 234626, "epoch": 2826} {"train_loss": -24.69342613220215, "global_step": 234627, "epoch": 2826} {"train_loss": -24.496261596679688, "global_step": 234628, "epoch": 2826} {"train_loss": -24.474262237548828, "global_step": 234629, "epoch": 2826} {"train_loss": -24.315031051635742, "global_step": 234630, "epoch": 2826} {"train_loss": -24.499874114990234, "global_step": 234631, "epoch": 2826} {"train_loss": -24.92828941345215, "global_step": 234632, "epoch": 2826} {"train_loss": -24.824003219604492, "global_step": 234633, "epoch": 2826} {"train_loss": -24.808691024780273, "global_step": 234634, "epoch": 2826} {"train_loss": -24.802709579467773, "global_step": 234635, "epoch": 2826} {"train_loss": -24.739572525024414, "global_step": 234636, "epoch": 2826} {"train_loss": -24.78009033203125, "global_step": 234637, "epoch": 2826} {"train_loss": -24.66868019104004, "global_step": 234638, "epoch": 2826} {"train_loss": -24.628326416015625, "global_step": 234639, "epoch": 2826} {"train_loss": -24.583795593445558, "global_step": 234640, "epoch": 2826, "val_loss": 6848529.0} {"train_loss": -22.238636016845703, "global_step": 234641, "epoch": 2827} {"train_loss": -23.719650268554688, "global_step": 234642, "epoch": 2827} {"train_loss": -23.75618553161621, "global_step": 234643, "epoch": 2827} {"train_loss": -23.613323211669922, "global_step": 234644, "epoch": 2827} {"train_loss": -23.579320907592773, "global_step": 234645, "epoch": 2827} {"train_loss": -23.959423065185547, "global_step": 234646, "epoch": 2827} {"train_loss": -23.547815322875977, "global_step": 234647, "epoch": 2827} {"train_loss": -23.86452293395996, "global_step": 234648, "epoch": 2827} {"train_loss": -24.256147384643555, "global_step": 234649, "epoch": 2827} {"train_loss": -23.91377067565918, "global_step": 234650, "epoch": 2827} {"train_loss": -24.27737045288086, "global_step": 234651, "epoch": 2827} {"train_loss": -24.18067741394043, "global_step": 234652, "epoch": 2827} {"train_loss": -24.389982223510742, "global_step": 234653, "epoch": 2827} {"train_loss": -23.913320541381836, "global_step": 234654, "epoch": 2827} {"train_loss": -24.47159767150879, "global_step": 234655, "epoch": 2827} {"train_loss": -24.51157569885254, "global_step": 234656, "epoch": 2827} {"train_loss": -24.408668518066406, "global_step": 234657, "epoch": 2827} {"train_loss": -24.56526756286621, "global_step": 234658, "epoch": 2827} {"train_loss": -24.66038703918457, "global_step": 234659, "epoch": 2827} {"train_loss": -24.6673583984375, "global_step": 234660, "epoch": 2827} {"train_loss": -24.329694747924805, "global_step": 234661, "epoch": 2827} {"train_loss": -24.115203857421875, "global_step": 234662, "epoch": 2827} {"train_loss": -24.60318374633789, "global_step": 234663, "epoch": 2827} {"train_loss": -24.678064346313477, "global_step": 234664, "epoch": 2827} {"train_loss": -24.43231773376465, "global_step": 234665, "epoch": 2827} {"train_loss": -24.79033851623535, "global_step": 234666, "epoch": 2827} {"train_loss": -24.60562515258789, "global_step": 234667, "epoch": 2827} {"train_loss": -24.576467514038086, "global_step": 234668, "epoch": 2827} {"train_loss": -24.767284393310547, "global_step": 234669, "epoch": 2827} {"train_loss": -24.782089233398438, "global_step": 234670, "epoch": 2827} {"train_loss": -25.024925231933594, "global_step": 234671, "epoch": 2827} {"train_loss": -24.763843536376953, "global_step": 234672, "epoch": 2827} {"train_loss": -24.474225997924805, "global_step": 234673, "epoch": 2827} {"train_loss": -25.16815185546875, "global_step": 234674, "epoch": 2827} {"train_loss": -24.868976593017578, "global_step": 234675, "epoch": 2827} {"train_loss": -24.793842315673828, "global_step": 234676, "epoch": 2827} {"train_loss": -24.975828170776367, "global_step": 234677, "epoch": 2827} {"train_loss": -24.89057731628418, "global_step": 234678, "epoch": 2827} {"train_loss": -24.57071876525879, "global_step": 234679, "epoch": 2827} {"train_loss": -24.99142837524414, "global_step": 234680, "epoch": 2827} {"train_loss": -24.7734317779541, "global_step": 234681, "epoch": 2827} {"train_loss": -24.351240158081055, "global_step": 234682, "epoch": 2827} {"train_loss": -24.457387924194336, "global_step": 234683, "epoch": 2827} {"train_loss": -25.200292587280273, "global_step": 234684, "epoch": 2827} {"train_loss": -24.530485153198242, "global_step": 234685, "epoch": 2827} {"train_loss": -24.4019832611084, "global_step": 234686, "epoch": 2827} {"train_loss": -24.256784439086914, "global_step": 234687, "epoch": 2827} {"train_loss": -24.545175552368164, "global_step": 234688, "epoch": 2827} {"train_loss": -24.748594284057617, "global_step": 234689, "epoch": 2827} {"train_loss": -24.4849796295166, "global_step": 234690, "epoch": 2827} {"train_loss": -25.09031105041504, "global_step": 234691, "epoch": 2827} {"train_loss": -24.618892669677734, "global_step": 234692, "epoch": 2827} {"train_loss": -24.783342361450195, "global_step": 234693, "epoch": 2827} {"train_loss": -25.20730972290039, "global_step": 234694, "epoch": 2827} {"train_loss": -24.65419578552246, "global_step": 234695, "epoch": 2827} {"train_loss": -24.849346160888672, "global_step": 234696, "epoch": 2827} {"train_loss": -24.729637145996094, "global_step": 234697, "epoch": 2827} {"train_loss": -24.869892120361328, "global_step": 234698, "epoch": 2827} {"train_loss": -24.526212692260742, "global_step": 234699, "epoch": 2827} {"train_loss": -24.96470832824707, "global_step": 234700, "epoch": 2827} {"train_loss": -24.67397689819336, "global_step": 234701, "epoch": 2827} {"train_loss": -24.815937042236328, "global_step": 234702, "epoch": 2827} {"train_loss": -24.76679039001465, "global_step": 234703, "epoch": 2827} {"train_loss": -24.89387321472168, "global_step": 234704, "epoch": 2827} {"train_loss": -24.885604858398438, "global_step": 234705, "epoch": 2827} {"train_loss": -24.637256622314453, "global_step": 234706, "epoch": 2827} {"train_loss": -24.808942794799805, "global_step": 234707, "epoch": 2827} {"train_loss": -24.60856056213379, "global_step": 234708, "epoch": 2827} {"train_loss": -25.343551635742188, "global_step": 234709, "epoch": 2827} {"train_loss": -24.5697078704834, "global_step": 234710, "epoch": 2827} {"train_loss": -24.96018409729004, "global_step": 234711, "epoch": 2827} {"train_loss": -24.723388671875, "global_step": 234712, "epoch": 2827} {"train_loss": -25.23384666442871, "global_step": 234713, "epoch": 2827} {"train_loss": -25.011167526245117, "global_step": 234714, "epoch": 2827} {"train_loss": -24.837495803833008, "global_step": 234715, "epoch": 2827} {"train_loss": -24.874013900756836, "global_step": 234716, "epoch": 2827} {"train_loss": -24.828983306884766, "global_step": 234717, "epoch": 2827} {"train_loss": -24.68854331970215, "global_step": 234718, "epoch": 2827} {"train_loss": -24.751585006713867, "global_step": 234719, "epoch": 2827} {"train_loss": -25.04526710510254, "global_step": 234720, "epoch": 2827} {"train_loss": -24.47824478149414, "global_step": 234721, "epoch": 2827} {"train_loss": -24.896968841552734, "global_step": 234722, "epoch": 2827} {"train_loss": -24.566639107393932, "global_step": 234723, "epoch": 2827, "val_loss": 6791360.0} {"train_loss": -24.754989624023438, "global_step": 234724, "epoch": 2828} {"train_loss": -24.002634048461914, "global_step": 234725, "epoch": 2828} {"train_loss": -24.646799087524414, "global_step": 234726, "epoch": 2828} {"train_loss": -24.4821834564209, "global_step": 234727, "epoch": 2828} {"train_loss": -24.425596237182617, "global_step": 234728, "epoch": 2828} {"train_loss": -24.598325729370117, "global_step": 234729, "epoch": 2828} {"train_loss": -24.947803497314453, "global_step": 234730, "epoch": 2828} {"train_loss": -24.825748443603516, "global_step": 234731, "epoch": 2828} {"train_loss": -24.880817413330078, "global_step": 234732, "epoch": 2828} {"train_loss": -24.900287628173828, "global_step": 234733, "epoch": 2828} {"train_loss": -24.597257614135742, "global_step": 234734, "epoch": 2828} {"train_loss": -24.480205535888672, "global_step": 234735, "epoch": 2828} {"train_loss": -24.720661163330078, "global_step": 234736, "epoch": 2828} {"train_loss": -24.46027183532715, "global_step": 234737, "epoch": 2828} {"train_loss": -24.181262969970703, "global_step": 234738, "epoch": 2828} {"train_loss": -24.601896286010742, "global_step": 234739, "epoch": 2828} {"train_loss": -24.28985023498535, "global_step": 234740, "epoch": 2828} {"train_loss": -24.517864227294922, "global_step": 234741, "epoch": 2828} {"train_loss": -24.487356185913086, "global_step": 234742, "epoch": 2828} {"train_loss": -24.514219284057617, "global_step": 234743, "epoch": 2828} {"train_loss": -25.146520614624023, "global_step": 234744, "epoch": 2828} {"train_loss": -24.402013778686523, "global_step": 234745, "epoch": 2828} {"train_loss": -24.51239585876465, "global_step": 234746, "epoch": 2828} {"train_loss": -24.77958106994629, "global_step": 234747, "epoch": 2828} {"train_loss": -24.969219207763672, "global_step": 234748, "epoch": 2828} {"train_loss": -24.434263229370117, "global_step": 234749, "epoch": 2828} {"train_loss": -24.62201499938965, "global_step": 234750, "epoch": 2828} {"train_loss": -24.65195083618164, "global_step": 234751, "epoch": 2828} {"train_loss": -24.794309616088867, "global_step": 234752, "epoch": 2828} {"train_loss": -24.47779655456543, "global_step": 234753, "epoch": 2828} {"train_loss": -24.691556930541992, "global_step": 234754, "epoch": 2828} {"train_loss": -24.6856746673584, "global_step": 234755, "epoch": 2828} {"train_loss": -24.89698600769043, "global_step": 234756, "epoch": 2828} {"train_loss": -24.716684341430664, "global_step": 234757, "epoch": 2828} {"train_loss": -24.759992599487305, "global_step": 234758, "epoch": 2828} {"train_loss": -24.683979034423828, "global_step": 234759, "epoch": 2828} {"train_loss": -24.45722007751465, "global_step": 234760, "epoch": 2828} {"train_loss": -25.020389556884766, "global_step": 234761, "epoch": 2828} {"train_loss": -24.891653060913086, "global_step": 234762, "epoch": 2828} {"train_loss": -24.871204376220703, "global_step": 234763, "epoch": 2828} {"train_loss": -24.713239669799805, "global_step": 234764, "epoch": 2828} {"train_loss": -24.58493423461914, "global_step": 234765, "epoch": 2828} {"train_loss": -25.003828048706055, "global_step": 234766, "epoch": 2828} {"train_loss": -25.06703758239746, "global_step": 234767, "epoch": 2828} {"train_loss": -25.090656280517578, "global_step": 234768, "epoch": 2828} {"train_loss": -24.975820541381836, "global_step": 234769, "epoch": 2828} {"train_loss": -24.856956481933594, "global_step": 234770, "epoch": 2828} {"train_loss": -25.003087997436523, "global_step": 234771, "epoch": 2828} {"train_loss": -24.738187789916992, "global_step": 234772, "epoch": 2828} {"train_loss": -25.0667667388916, "global_step": 234773, "epoch": 2828} {"train_loss": -24.89910125732422, "global_step": 234774, "epoch": 2828} {"train_loss": -25.116865158081055, "global_step": 234775, "epoch": 2828} {"train_loss": -24.566389083862305, "global_step": 234776, "epoch": 2828} {"train_loss": -24.849355697631836, "global_step": 234777, "epoch": 2828} {"train_loss": -24.76256561279297, "global_step": 234778, "epoch": 2828} {"train_loss": -24.701107025146484, "global_step": 234779, "epoch": 2828} {"train_loss": -24.813743591308594, "global_step": 234780, "epoch": 2828} {"train_loss": -25.019773483276367, "global_step": 234781, "epoch": 2828} {"train_loss": -24.9919376373291, "global_step": 234782, "epoch": 2828} {"train_loss": -24.426694869995117, "global_step": 234783, "epoch": 2828} {"train_loss": -24.95966911315918, "global_step": 234784, "epoch": 2828} {"train_loss": -24.913015365600586, "global_step": 234785, "epoch": 2828} {"train_loss": -24.931604385375977, "global_step": 234786, "epoch": 2828} {"train_loss": -24.45394515991211, "global_step": 234787, "epoch": 2828} {"train_loss": -24.86078643798828, "global_step": 234788, "epoch": 2828} {"train_loss": -24.76024055480957, "global_step": 234789, "epoch": 2828} {"train_loss": -24.877155303955078, "global_step": 234790, "epoch": 2828} {"train_loss": -24.756671905517578, "global_step": 234791, "epoch": 2828} {"train_loss": -25.124027252197266, "global_step": 234792, "epoch": 2828} {"train_loss": -24.591428756713867, "global_step": 234793, "epoch": 2828} {"train_loss": -24.843618392944336, "global_step": 234794, "epoch": 2828} {"train_loss": -24.320104598999023, "global_step": 234795, "epoch": 2828} {"train_loss": -24.2664794921875, "global_step": 234796, "epoch": 2828} {"train_loss": -24.458711624145508, "global_step": 234797, "epoch": 2828} {"train_loss": -24.63766860961914, "global_step": 234798, "epoch": 2828} {"train_loss": -24.738859176635742, "global_step": 234799, "epoch": 2828} {"train_loss": -24.389911651611328, "global_step": 234800, "epoch": 2828} {"train_loss": -24.72121238708496, "global_step": 234801, "epoch": 2828} {"train_loss": -24.70196533203125, "global_step": 234802, "epoch": 2828} {"train_loss": -24.695171356201172, "global_step": 234803, "epoch": 2828} {"train_loss": -24.591938018798828, "global_step": 234804, "epoch": 2828} {"train_loss": -25.029748916625977, "global_step": 234805, "epoch": 2828} {"train_loss": -24.690957931150873, "global_step": 234806, "epoch": 2828, "val_loss": 6721131.0} {"train_loss": -22.776382446289062, "global_step": 234807, "epoch": 2829} {"train_loss": -23.34181785583496, "global_step": 234808, "epoch": 2829} {"train_loss": -23.971332550048828, "global_step": 234809, "epoch": 2829} {"train_loss": -23.777780532836914, "global_step": 234810, "epoch": 2829} {"train_loss": -23.859333038330078, "global_step": 234811, "epoch": 2829} {"train_loss": -23.7679386138916, "global_step": 234812, "epoch": 2829} {"train_loss": -24.09865951538086, "global_step": 234813, "epoch": 2829} {"train_loss": -24.306196212768555, "global_step": 234814, "epoch": 2829} {"train_loss": -24.3409481048584, "global_step": 234815, "epoch": 2829} {"train_loss": -24.719280242919922, "global_step": 234816, "epoch": 2829} {"train_loss": -24.356481552124023, "global_step": 234817, "epoch": 2829} {"train_loss": -24.603391647338867, "global_step": 234818, "epoch": 2829} {"train_loss": -24.10317039489746, "global_step": 234819, "epoch": 2829} {"train_loss": -24.037893295288086, "global_step": 234820, "epoch": 2829} {"train_loss": -24.64695167541504, "global_step": 234821, "epoch": 2829} {"train_loss": -24.45107650756836, "global_step": 234822, "epoch": 2829} {"train_loss": -24.701845169067383, "global_step": 234823, "epoch": 2829} {"train_loss": -24.338869094848633, "global_step": 234824, "epoch": 2829} {"train_loss": -24.387968063354492, "global_step": 234825, "epoch": 2829} {"train_loss": -24.4301700592041, "global_step": 234826, "epoch": 2829} {"train_loss": -24.516090393066406, "global_step": 234827, "epoch": 2829} {"train_loss": -24.67732048034668, "global_step": 234828, "epoch": 2829} {"train_loss": -24.49129295349121, "global_step": 234829, "epoch": 2829} {"train_loss": -24.446857452392578, "global_step": 234830, "epoch": 2829} {"train_loss": -24.5267276763916, "global_step": 234831, "epoch": 2829} {"train_loss": -24.688444137573242, "global_step": 234832, "epoch": 2829} {"train_loss": -24.66643524169922, "global_step": 234833, "epoch": 2829} {"train_loss": -25.04570770263672, "global_step": 234834, "epoch": 2829} {"train_loss": -24.63396644592285, "global_step": 234835, "epoch": 2829} {"train_loss": -24.702850341796875, "global_step": 234836, "epoch": 2829} {"train_loss": -24.58328628540039, "global_step": 234837, "epoch": 2829} {"train_loss": -24.550840377807617, "global_step": 234838, "epoch": 2829} {"train_loss": -25.12690544128418, "global_step": 234839, "epoch": 2829} {"train_loss": -24.952951431274414, "global_step": 234840, "epoch": 2829} {"train_loss": -24.84073257446289, "global_step": 234841, "epoch": 2829} {"train_loss": -25.19938087463379, "global_step": 234842, "epoch": 2829} {"train_loss": -24.7943058013916, "global_step": 234843, "epoch": 2829} {"train_loss": -25.018075942993164, "global_step": 234844, "epoch": 2829} {"train_loss": -24.748783111572266, "global_step": 234845, "epoch": 2829} {"train_loss": -24.973554611206055, "global_step": 234846, "epoch": 2829} {"train_loss": -24.946428298950195, "global_step": 234847, "epoch": 2829} {"train_loss": -25.059585571289062, "global_step": 234848, "epoch": 2829} {"train_loss": -24.518095016479492, "global_step": 234849, "epoch": 2829} {"train_loss": -24.655502319335938, "global_step": 234850, "epoch": 2829} {"train_loss": -25.01222038269043, "global_step": 234851, "epoch": 2829} {"train_loss": -24.65909194946289, "global_step": 234852, "epoch": 2829} {"train_loss": -24.381772994995117, "global_step": 234853, "epoch": 2829} {"train_loss": -24.381412506103516, "global_step": 234854, "epoch": 2829} {"train_loss": -25.002197265625, "global_step": 234855, "epoch": 2829} {"train_loss": -24.72615623474121, "global_step": 234856, "epoch": 2829} {"train_loss": -24.853052139282227, "global_step": 234857, "epoch": 2829} {"train_loss": -24.88304901123047, "global_step": 234858, "epoch": 2829} {"train_loss": -24.829591751098633, "global_step": 234859, "epoch": 2829} {"train_loss": -24.877309799194336, "global_step": 234860, "epoch": 2829} {"train_loss": -25.044530868530273, "global_step": 234861, "epoch": 2829} {"train_loss": -24.98992919921875, "global_step": 234862, "epoch": 2829} {"train_loss": -24.625883102416992, "global_step": 234863, "epoch": 2829} {"train_loss": -24.8886661529541, "global_step": 234864, "epoch": 2829} {"train_loss": -24.757156372070312, "global_step": 234865, "epoch": 2829} {"train_loss": -24.694412231445312, "global_step": 234866, "epoch": 2829} {"train_loss": -24.78436279296875, "global_step": 234867, "epoch": 2829} {"train_loss": -24.666467666625977, "global_step": 234868, "epoch": 2829} {"train_loss": -24.712308883666992, "global_step": 234869, "epoch": 2829} {"train_loss": -25.215314865112305, "global_step": 234870, "epoch": 2829} {"train_loss": -24.85681915283203, "global_step": 234871, "epoch": 2829} {"train_loss": -25.032989501953125, "global_step": 234872, "epoch": 2829} {"train_loss": -24.726102828979492, "global_step": 234873, "epoch": 2829} {"train_loss": -25.116506576538086, "global_step": 234874, "epoch": 2829} {"train_loss": -24.771024703979492, "global_step": 234875, "epoch": 2829} {"train_loss": -24.916807174682617, "global_step": 234876, "epoch": 2829} {"train_loss": -25.052627563476562, "global_step": 234877, "epoch": 2829} {"train_loss": -25.04842185974121, "global_step": 234878, "epoch": 2829} {"train_loss": -24.921005249023438, "global_step": 234879, "epoch": 2829} {"train_loss": -24.96561050415039, "global_step": 234880, "epoch": 2829} {"train_loss": -24.88750648498535, "global_step": 234881, "epoch": 2829} {"train_loss": -24.882198333740234, "global_step": 234882, "epoch": 2829} {"train_loss": -24.719228744506836, "global_step": 234883, "epoch": 2829} {"train_loss": -25.113567352294922, "global_step": 234884, "epoch": 2829} {"train_loss": -25.037246704101562, "global_step": 234885, "epoch": 2829} {"train_loss": -24.726341247558594, "global_step": 234886, "epoch": 2829} {"train_loss": -24.590593338012695, "global_step": 234887, "epoch": 2829} {"train_loss": -24.500146865844727, "global_step": 234888, "epoch": 2829} {"train_loss": -24.681931690997388, "global_step": 234889, "epoch": 2829, "val_loss": 6829851.0} {"train_loss": -23.43314552307129, "global_step": 234890, "epoch": 2830} {"train_loss": -24.117355346679688, "global_step": 234891, "epoch": 2830} {"train_loss": -23.639257431030273, "global_step": 234892, "epoch": 2830} {"train_loss": -23.829740524291992, "global_step": 234893, "epoch": 2830} {"train_loss": -24.491411209106445, "global_step": 234894, "epoch": 2830} {"train_loss": -23.76120376586914, "global_step": 234895, "epoch": 2830} {"train_loss": -24.269025802612305, "global_step": 234896, "epoch": 2830} {"train_loss": -24.317394256591797, "global_step": 234897, "epoch": 2830} {"train_loss": -24.056415557861328, "global_step": 234898, "epoch": 2830} {"train_loss": -24.159643173217773, "global_step": 234899, "epoch": 2830} {"train_loss": -24.210477828979492, "global_step": 234900, "epoch": 2830} {"train_loss": -24.43329620361328, "global_step": 234901, "epoch": 2830} {"train_loss": -24.63136863708496, "global_step": 234902, "epoch": 2830} {"train_loss": -24.358749389648438, "global_step": 234903, "epoch": 2830} {"train_loss": -24.58587646484375, "global_step": 234904, "epoch": 2830} {"train_loss": -24.342405319213867, "global_step": 234905, "epoch": 2830} {"train_loss": -24.706361770629883, "global_step": 234906, "epoch": 2830} {"train_loss": -24.581693649291992, "global_step": 234907, "epoch": 2830} {"train_loss": -24.63018035888672, "global_step": 234908, "epoch": 2830} {"train_loss": -24.45524024963379, "global_step": 234909, "epoch": 2830} {"train_loss": -24.80574607849121, "global_step": 234910, "epoch": 2830} {"train_loss": -24.388858795166016, "global_step": 234911, "epoch": 2830} {"train_loss": -24.849918365478516, "global_step": 234912, "epoch": 2830} {"train_loss": -24.82090187072754, "global_step": 234913, "epoch": 2830} {"train_loss": -24.647436141967773, "global_step": 234914, "epoch": 2830} {"train_loss": -24.56601333618164, "global_step": 234915, "epoch": 2830} {"train_loss": -24.703872680664062, "global_step": 234916, "epoch": 2830} {"train_loss": -24.910398483276367, "global_step": 234917, "epoch": 2830} {"train_loss": -24.60976791381836, "global_step": 234918, "epoch": 2830} {"train_loss": -25.15350914001465, "global_step": 234919, "epoch": 2830} {"train_loss": -24.56219482421875, "global_step": 234920, "epoch": 2830} {"train_loss": -24.764835357666016, "global_step": 234921, "epoch": 2830} {"train_loss": -24.80733299255371, "global_step": 234922, "epoch": 2830} {"train_loss": -25.201330184936523, "global_step": 234923, "epoch": 2830} {"train_loss": -24.847986221313477, "global_step": 234924, "epoch": 2830} {"train_loss": -24.849302291870117, "global_step": 234925, "epoch": 2830} {"train_loss": -25.05470085144043, "global_step": 234926, "epoch": 2830} {"train_loss": -25.24212646484375, "global_step": 234927, "epoch": 2830} {"train_loss": -24.53632164001465, "global_step": 234928, "epoch": 2830} {"train_loss": -24.815290451049805, "global_step": 234929, "epoch": 2830} {"train_loss": -24.896718978881836, "global_step": 234930, "epoch": 2830} {"train_loss": -24.623493194580078, "global_step": 234931, "epoch": 2830} {"train_loss": -24.8343563079834, "global_step": 234932, "epoch": 2830} {"train_loss": -24.926374435424805, "global_step": 234933, "epoch": 2830} {"train_loss": -25.02458953857422, "global_step": 234934, "epoch": 2830} {"train_loss": -24.74339485168457, "global_step": 234935, "epoch": 2830} {"train_loss": -24.530031204223633, "global_step": 234936, "epoch": 2830} {"train_loss": -24.9654598236084, "global_step": 234937, "epoch": 2830} {"train_loss": -24.97675132751465, "global_step": 234938, "epoch": 2830} {"train_loss": -25.319660186767578, "global_step": 234939, "epoch": 2830} {"train_loss": -24.719789505004883, "global_step": 234940, "epoch": 2830} {"train_loss": -24.844348907470703, "global_step": 234941, "epoch": 2830} {"train_loss": -24.790311813354492, "global_step": 234942, "epoch": 2830} {"train_loss": -24.52265739440918, "global_step": 234943, "epoch": 2830} {"train_loss": -24.97226905822754, "global_step": 234944, "epoch": 2830} {"train_loss": -24.56757164001465, "global_step": 234945, "epoch": 2830} {"train_loss": -24.37872886657715, "global_step": 234946, "epoch": 2830} {"train_loss": -24.948698043823242, "global_step": 234947, "epoch": 2830} {"train_loss": -25.095624923706055, "global_step": 234948, "epoch": 2830} {"train_loss": -25.06544303894043, "global_step": 234949, "epoch": 2830} {"train_loss": -24.731752395629883, "global_step": 234950, "epoch": 2830} {"train_loss": -24.5731143951416, "global_step": 234951, "epoch": 2830} {"train_loss": -24.722871780395508, "global_step": 234952, "epoch": 2830} {"train_loss": -24.64972496032715, "global_step": 234953, "epoch": 2830} {"train_loss": -24.889150619506836, "global_step": 234954, "epoch": 2830} {"train_loss": -24.772563934326172, "global_step": 234955, "epoch": 2830} {"train_loss": -25.001296997070312, "global_step": 234956, "epoch": 2830} {"train_loss": -25.08711814880371, "global_step": 234957, "epoch": 2830} {"train_loss": -24.961889266967773, "global_step": 234958, "epoch": 2830} {"train_loss": -24.572086334228516, "global_step": 234959, "epoch": 2830} {"train_loss": -24.8140926361084, "global_step": 234960, "epoch": 2830} {"train_loss": -24.907176971435547, "global_step": 234961, "epoch": 2830} {"train_loss": -24.31118392944336, "global_step": 234962, "epoch": 2830} {"train_loss": -25.392297744750977, "global_step": 234963, "epoch": 2830} {"train_loss": -24.595504760742188, "global_step": 234964, "epoch": 2830} {"train_loss": -24.849058151245117, "global_step": 234965, "epoch": 2830} {"train_loss": -24.529573440551758, "global_step": 234966, "epoch": 2830} {"train_loss": -24.211118698120117, "global_step": 234967, "epoch": 2830} {"train_loss": -24.606794357299805, "global_step": 234968, "epoch": 2830} {"train_loss": -24.666549682617188, "global_step": 234969, "epoch": 2830} {"train_loss": -24.887441635131836, "global_step": 234970, "epoch": 2830} {"train_loss": -24.595993041992188, "global_step": 234971, "epoch": 2830} {"train_loss": -24.663671654391003, "global_step": 234972, "epoch": 2830, "val_loss": 6812888.0} {"train_loss": -24.20183753967285, "global_step": 234973, "epoch": 2831} {"train_loss": -23.940643310546875, "global_step": 234974, "epoch": 2831} {"train_loss": -24.0371150970459, "global_step": 234975, "epoch": 2831} {"train_loss": -24.17487144470215, "global_step": 234976, "epoch": 2831} {"train_loss": -24.573057174682617, "global_step": 234977, "epoch": 2831} {"train_loss": -24.274818420410156, "global_step": 234978, "epoch": 2831} {"train_loss": -24.363248825073242, "global_step": 234979, "epoch": 2831} {"train_loss": -24.580232620239258, "global_step": 234980, "epoch": 2831} {"train_loss": -24.690185546875, "global_step": 234981, "epoch": 2831} {"train_loss": -24.563159942626953, "global_step": 234982, "epoch": 2831} {"train_loss": -24.604799270629883, "global_step": 234983, "epoch": 2831} {"train_loss": -24.842327117919922, "global_step": 234984, "epoch": 2831} {"train_loss": -24.65610694885254, "global_step": 234985, "epoch": 2831} {"train_loss": -24.532190322875977, "global_step": 234986, "epoch": 2831} {"train_loss": -24.75129508972168, "global_step": 234987, "epoch": 2831} {"train_loss": -24.935827255249023, "global_step": 234988, "epoch": 2831} {"train_loss": -24.70978355407715, "global_step": 234989, "epoch": 2831} {"train_loss": -24.806669235229492, "global_step": 234990, "epoch": 2831} {"train_loss": -24.602588653564453, "global_step": 234991, "epoch": 2831} {"train_loss": -24.662107467651367, "global_step": 234992, "epoch": 2831} {"train_loss": -25.138532638549805, "global_step": 234993, "epoch": 2831} {"train_loss": -24.626422882080078, "global_step": 234994, "epoch": 2831} {"train_loss": -24.674549102783203, "global_step": 234995, "epoch": 2831} {"train_loss": -24.962575912475586, "global_step": 234996, "epoch": 2831} {"train_loss": -25.03620719909668, "global_step": 234997, "epoch": 2831} {"train_loss": -25.02411460876465, "global_step": 234998, "epoch": 2831} {"train_loss": -24.833765029907227, "global_step": 234999, "epoch": 2831} {"train_loss": -24.944311141967773, "global_step": 235000, "epoch": 2831} {"train_loss": -25.175031661987305, "global_step": 235001, "epoch": 2831} {"train_loss": -24.635278701782227, "global_step": 235002, "epoch": 2831} {"train_loss": -24.312976837158203, "global_step": 235003, "epoch": 2831} {"train_loss": -24.928075790405273, "global_step": 235004, "epoch": 2831} {"train_loss": -25.004703521728516, "global_step": 235005, "epoch": 2831} {"train_loss": -24.784025192260742, "global_step": 235006, "epoch": 2831} {"train_loss": -24.38930320739746, "global_step": 235007, "epoch": 2831} {"train_loss": -24.775680541992188, "global_step": 235008, "epoch": 2831} {"train_loss": -24.900590896606445, "global_step": 235009, "epoch": 2831} {"train_loss": -24.756528854370117, "global_step": 235010, "epoch": 2831} {"train_loss": -24.768169403076172, "global_step": 235011, "epoch": 2831} {"train_loss": -24.818119049072266, "global_step": 235012, "epoch": 2831} {"train_loss": -24.92283058166504, "global_step": 235013, "epoch": 2831} {"train_loss": -24.680789947509766, "global_step": 235014, "epoch": 2831} {"train_loss": -24.81667137145996, "global_step": 235015, "epoch": 2831} {"train_loss": -24.74945640563965, "global_step": 235016, "epoch": 2831} {"train_loss": -24.776227951049805, "global_step": 235017, "epoch": 2831} {"train_loss": -24.84429359436035, "global_step": 235018, "epoch": 2831} {"train_loss": -24.803266525268555, "global_step": 235019, "epoch": 2831} {"train_loss": -25.08814811706543, "global_step": 235020, "epoch": 2831} {"train_loss": -24.644287109375, "global_step": 235021, "epoch": 2831} {"train_loss": -25.063339233398438, "global_step": 235022, "epoch": 2831} {"train_loss": -25.072406768798828, "global_step": 235023, "epoch": 2831} {"train_loss": -24.844058990478516, "global_step": 235024, "epoch": 2831} {"train_loss": -24.640399932861328, "global_step": 235025, "epoch": 2831} {"train_loss": -24.917627334594727, "global_step": 235026, "epoch": 2831} {"train_loss": -24.71357536315918, "global_step": 235027, "epoch": 2831} {"train_loss": -24.972253799438477, "global_step": 235028, "epoch": 2831} {"train_loss": -24.784244537353516, "global_step": 235029, "epoch": 2831} {"train_loss": -25.14446449279785, "global_step": 235030, "epoch": 2831} {"train_loss": -25.18893051147461, "global_step": 235031, "epoch": 2831} {"train_loss": -24.892181396484375, "global_step": 235032, "epoch": 2831} {"train_loss": -24.96478843688965, "global_step": 235033, "epoch": 2831} {"train_loss": -24.89571762084961, "global_step": 235034, "epoch": 2831} {"train_loss": -24.596878051757812, "global_step": 235035, "epoch": 2831} {"train_loss": -24.651031494140625, "global_step": 235036, "epoch": 2831} {"train_loss": -24.678237915039062, "global_step": 235037, "epoch": 2831} {"train_loss": -24.519020080566406, "global_step": 235038, "epoch": 2831} {"train_loss": -24.630258560180664, "global_step": 235039, "epoch": 2831} {"train_loss": -24.940393447875977, "global_step": 235040, "epoch": 2831} {"train_loss": -24.567588806152344, "global_step": 235041, "epoch": 2831} {"train_loss": -24.55742645263672, "global_step": 235042, "epoch": 2831} {"train_loss": -24.725662231445312, "global_step": 235043, "epoch": 2831} {"train_loss": -24.722267150878906, "global_step": 235044, "epoch": 2831} {"train_loss": -24.840999603271484, "global_step": 235045, "epoch": 2831} {"train_loss": -24.942537307739258, "global_step": 235046, "epoch": 2831} {"train_loss": -25.00424575805664, "global_step": 235047, "epoch": 2831} {"train_loss": -24.70496368408203, "global_step": 235048, "epoch": 2831} {"train_loss": -24.604110717773438, "global_step": 235049, "epoch": 2831} {"train_loss": -24.64964485168457, "global_step": 235050, "epoch": 2831} {"train_loss": -24.640592575073242, "global_step": 235051, "epoch": 2831} {"train_loss": -24.748380661010742, "global_step": 235052, "epoch": 2831} {"train_loss": -24.887178421020508, "global_step": 235053, "epoch": 2831} {"train_loss": -24.34066390991211, "global_step": 235054, "epoch": 2831} {"train_loss": -24.736196563904542, "global_step": 235055, "epoch": 2831, "val_loss": 6611340.0} {"train_loss": -24.318342208862305, "global_step": 235056, "epoch": 2832} {"train_loss": -24.179922103881836, "global_step": 235057, "epoch": 2832} {"train_loss": -24.56093406677246, "global_step": 235058, "epoch": 2832} {"train_loss": -24.55824851989746, "global_step": 235059, "epoch": 2832} {"train_loss": -24.481929779052734, "global_step": 235060, "epoch": 2832} {"train_loss": -24.413227081298828, "global_step": 235061, "epoch": 2832} {"train_loss": -24.668170928955078, "global_step": 235062, "epoch": 2832} {"train_loss": -24.57620620727539, "global_step": 235063, "epoch": 2832} {"train_loss": -24.910858154296875, "global_step": 235064, "epoch": 2832} {"train_loss": -24.619749069213867, "global_step": 235065, "epoch": 2832} {"train_loss": -24.726770401000977, "global_step": 235066, "epoch": 2832} {"train_loss": -24.630460739135742, "global_step": 235067, "epoch": 2832} {"train_loss": -24.58980369567871, "global_step": 235068, "epoch": 2832} {"train_loss": -24.850906372070312, "global_step": 235069, "epoch": 2832} {"train_loss": -24.500131607055664, "global_step": 235070, "epoch": 2832} {"train_loss": -24.763120651245117, "global_step": 235071, "epoch": 2832} {"train_loss": -24.818603515625, "global_step": 235072, "epoch": 2832} {"train_loss": -24.83294677734375, "global_step": 235073, "epoch": 2832} {"train_loss": -24.73202896118164, "global_step": 235074, "epoch": 2832} {"train_loss": -24.822484970092773, "global_step": 235075, "epoch": 2832} {"train_loss": -24.986236572265625, "global_step": 235076, "epoch": 2832} {"train_loss": -24.781797409057617, "global_step": 235077, "epoch": 2832} {"train_loss": -24.68691062927246, "global_step": 235078, "epoch": 2832} {"train_loss": -24.68556785583496, "global_step": 235079, "epoch": 2832} {"train_loss": -24.574460983276367, "global_step": 235080, "epoch": 2832} {"train_loss": -24.701324462890625, "global_step": 235081, "epoch": 2832} {"train_loss": -24.88260841369629, "global_step": 235082, "epoch": 2832} {"train_loss": -24.938947677612305, "global_step": 235083, "epoch": 2832} {"train_loss": -24.45051383972168, "global_step": 235084, "epoch": 2832} {"train_loss": -24.831058502197266, "global_step": 235085, "epoch": 2832} {"train_loss": -24.883718490600586, "global_step": 235086, "epoch": 2832} {"train_loss": -24.553943634033203, "global_step": 235087, "epoch": 2832} {"train_loss": -24.820981979370117, "global_step": 235088, "epoch": 2832} {"train_loss": -24.67428970336914, "global_step": 235089, "epoch": 2832} {"train_loss": -24.727853775024414, "global_step": 235090, "epoch": 2832} {"train_loss": -25.137359619140625, "global_step": 235091, "epoch": 2832} {"train_loss": -24.777694702148438, "global_step": 235092, "epoch": 2832} {"train_loss": -24.6485652923584, "global_step": 235093, "epoch": 2832} {"train_loss": -24.89461326599121, "global_step": 235094, "epoch": 2832} {"train_loss": -24.501731872558594, "global_step": 235095, "epoch": 2832} {"train_loss": -24.84071922302246, "global_step": 235096, "epoch": 2832} {"train_loss": -24.810550689697266, "global_step": 235097, "epoch": 2832} {"train_loss": -24.869653701782227, "global_step": 235098, "epoch": 2832} {"train_loss": -24.578372955322266, "global_step": 235099, "epoch": 2832} {"train_loss": -25.34992218017578, "global_step": 235100, "epoch": 2832} {"train_loss": -24.999197006225586, "global_step": 235101, "epoch": 2832} {"train_loss": -24.844959259033203, "global_step": 235102, "epoch": 2832} {"train_loss": -24.76300811767578, "global_step": 235103, "epoch": 2832} {"train_loss": -24.530010223388672, "global_step": 235104, "epoch": 2832} {"train_loss": -25.03397560119629, "global_step": 235105, "epoch": 2832} {"train_loss": -25.056264877319336, "global_step": 235106, "epoch": 2832} {"train_loss": -25.076025009155273, "global_step": 235107, "epoch": 2832} {"train_loss": -24.815189361572266, "global_step": 235108, "epoch": 2832} {"train_loss": -25.032140731811523, "global_step": 235109, "epoch": 2832} {"train_loss": -24.879430770874023, "global_step": 235110, "epoch": 2832} {"train_loss": -25.290176391601562, "global_step": 235111, "epoch": 2832} {"train_loss": -24.67458152770996, "global_step": 235112, "epoch": 2832} {"train_loss": -24.812009811401367, "global_step": 235113, "epoch": 2832} {"train_loss": -25.05386734008789, "global_step": 235114, "epoch": 2832} {"train_loss": -24.748075485229492, "global_step": 235115, "epoch": 2832} {"train_loss": -24.677831649780273, "global_step": 235116, "epoch": 2832} {"train_loss": -24.84303092956543, "global_step": 235117, "epoch": 2832} {"train_loss": -24.420820236206055, "global_step": 235118, "epoch": 2832} {"train_loss": -24.4694881439209, "global_step": 235119, "epoch": 2832} {"train_loss": -23.92885398864746, "global_step": 235120, "epoch": 2832} {"train_loss": -24.577367782592773, "global_step": 235121, "epoch": 2832} {"train_loss": -25.058561325073242, "global_step": 235122, "epoch": 2832} {"train_loss": -24.725643157958984, "global_step": 235123, "epoch": 2832} {"train_loss": -24.55706787109375, "global_step": 235124, "epoch": 2832} {"train_loss": -24.41981315612793, "global_step": 235125, "epoch": 2832} {"train_loss": -24.999055862426758, "global_step": 235126, "epoch": 2832} {"train_loss": -24.605667114257812, "global_step": 235127, "epoch": 2832} {"train_loss": -24.75813102722168, "global_step": 235128, "epoch": 2832} {"train_loss": -24.5666561126709, "global_step": 235129, "epoch": 2832} {"train_loss": -24.70222282409668, "global_step": 235130, "epoch": 2832} {"train_loss": -25.106969833374023, "global_step": 235131, "epoch": 2832} {"train_loss": -24.788400650024414, "global_step": 235132, "epoch": 2832} {"train_loss": -24.532852172851562, "global_step": 235133, "epoch": 2832} {"train_loss": -25.00642204284668, "global_step": 235134, "epoch": 2832} {"train_loss": -25.09693145751953, "global_step": 235135, "epoch": 2832} {"train_loss": -24.74832534790039, "global_step": 235136, "epoch": 2832} {"train_loss": -24.592260360717773, "global_step": 235137, "epoch": 2832} {"train_loss": -24.74372815511313, "global_step": 235138, "epoch": 2832, "val_loss": 6680208.5} {"train_loss": -25.05307960510254, "global_step": 235139, "epoch": 2833} {"train_loss": -24.528867721557617, "global_step": 235140, "epoch": 2833} {"train_loss": -24.663883209228516, "global_step": 235141, "epoch": 2833} {"train_loss": -24.946186065673828, "global_step": 235142, "epoch": 2833} {"train_loss": -24.603443145751953, "global_step": 235143, "epoch": 2833} {"train_loss": -24.632278442382812, "global_step": 235144, "epoch": 2833} {"train_loss": -25.006681442260742, "global_step": 235145, "epoch": 2833} {"train_loss": -24.92100715637207, "global_step": 235146, "epoch": 2833} {"train_loss": -24.5187931060791, "global_step": 235147, "epoch": 2833} {"train_loss": -24.845556259155273, "global_step": 235148, "epoch": 2833} {"train_loss": -24.619800567626953, "global_step": 235149, "epoch": 2833} {"train_loss": -24.39217185974121, "global_step": 235150, "epoch": 2833} {"train_loss": -24.677818298339844, "global_step": 235151, "epoch": 2833} {"train_loss": -24.628803253173828, "global_step": 235152, "epoch": 2833} {"train_loss": -24.74599266052246, "global_step": 235153, "epoch": 2833} {"train_loss": -24.23714256286621, "global_step": 235154, "epoch": 2833} {"train_loss": -24.336576461791992, "global_step": 235155, "epoch": 2833} {"train_loss": -24.910837173461914, "global_step": 235156, "epoch": 2833} {"train_loss": -24.776214599609375, "global_step": 235157, "epoch": 2833} {"train_loss": -24.46308708190918, "global_step": 235158, "epoch": 2833} {"train_loss": -25.015472412109375, "global_step": 235159, "epoch": 2833} {"train_loss": -24.5595645904541, "global_step": 235160, "epoch": 2833} {"train_loss": -24.87531852722168, "global_step": 235161, "epoch": 2833} {"train_loss": -25.16708755493164, "global_step": 235162, "epoch": 2833} {"train_loss": -24.78075408935547, "global_step": 235163, "epoch": 2833} {"train_loss": -24.98832130432129, "global_step": 235164, "epoch": 2833} {"train_loss": -24.942962646484375, "global_step": 235165, "epoch": 2833} {"train_loss": -24.933542251586914, "global_step": 235166, "epoch": 2833} {"train_loss": -24.81243324279785, "global_step": 235167, "epoch": 2833} {"train_loss": -24.925504684448242, "global_step": 235168, "epoch": 2833} {"train_loss": -25.098596572875977, "global_step": 235169, "epoch": 2833} {"train_loss": -25.08839988708496, "global_step": 235170, "epoch": 2833} {"train_loss": -25.061452865600586, "global_step": 235171, "epoch": 2833} {"train_loss": -24.703134536743164, "global_step": 235172, "epoch": 2833} {"train_loss": -24.71548843383789, "global_step": 235173, "epoch": 2833} {"train_loss": -24.791791915893555, "global_step": 235174, "epoch": 2833} {"train_loss": -24.897815704345703, "global_step": 235175, "epoch": 2833} {"train_loss": -24.675840377807617, "global_step": 235176, "epoch": 2833} {"train_loss": -24.967134475708008, "global_step": 235177, "epoch": 2833} {"train_loss": -25.173919677734375, "global_step": 235178, "epoch": 2833} {"train_loss": -24.72093963623047, "global_step": 235179, "epoch": 2833} {"train_loss": -25.056140899658203, "global_step": 235180, "epoch": 2833} {"train_loss": -24.9174861907959, "global_step": 235181, "epoch": 2833} {"train_loss": -24.661630630493164, "global_step": 235182, "epoch": 2833} {"train_loss": -25.320234298706055, "global_step": 235183, "epoch": 2833} {"train_loss": -24.717639923095703, "global_step": 235184, "epoch": 2833} {"train_loss": -24.92591094970703, "global_step": 235185, "epoch": 2833} {"train_loss": -25.108407974243164, "global_step": 235186, "epoch": 2833} {"train_loss": -24.743146896362305, "global_step": 235187, "epoch": 2833} {"train_loss": -24.64984703063965, "global_step": 235188, "epoch": 2833} {"train_loss": -24.387685775756836, "global_step": 235189, "epoch": 2833} {"train_loss": -24.609893798828125, "global_step": 235190, "epoch": 2833} {"train_loss": -24.835790634155273, "global_step": 235191, "epoch": 2833} {"train_loss": -25.02509307861328, "global_step": 235192, "epoch": 2833} {"train_loss": -24.603975296020508, "global_step": 235193, "epoch": 2833} {"train_loss": -24.918855667114258, "global_step": 235194, "epoch": 2833} {"train_loss": -24.910310745239258, "global_step": 235195, "epoch": 2833} {"train_loss": -24.90730094909668, "global_step": 235196, "epoch": 2833} {"train_loss": -24.779829025268555, "global_step": 235197, "epoch": 2833} {"train_loss": -24.829618453979492, "global_step": 235198, "epoch": 2833} {"train_loss": -24.826257705688477, "global_step": 235199, "epoch": 2833} {"train_loss": -24.93951988220215, "global_step": 235200, "epoch": 2833} {"train_loss": -24.765790939331055, "global_step": 235201, "epoch": 2833} {"train_loss": -24.570127487182617, "global_step": 235202, "epoch": 2833} {"train_loss": -25.10530662536621, "global_step": 235203, "epoch": 2833} {"train_loss": -24.582351684570312, "global_step": 235204, "epoch": 2833} {"train_loss": -24.84027671813965, "global_step": 235205, "epoch": 2833} {"train_loss": -24.623010635375977, "global_step": 235206, "epoch": 2833} {"train_loss": -24.727218627929688, "global_step": 235207, "epoch": 2833} {"train_loss": -24.6910343170166, "global_step": 235208, "epoch": 2833} {"train_loss": -24.835315704345703, "global_step": 235209, "epoch": 2833} {"train_loss": -24.827966690063477, "global_step": 235210, "epoch": 2833} {"train_loss": -24.857187271118164, "global_step": 235211, "epoch": 2833} {"train_loss": -25.042821884155273, "global_step": 235212, "epoch": 2833} {"train_loss": -24.518024444580078, "global_step": 235213, "epoch": 2833} {"train_loss": -24.410667419433594, "global_step": 235214, "epoch": 2833} {"train_loss": -24.848604202270508, "global_step": 235215, "epoch": 2833} {"train_loss": -24.93305778503418, "global_step": 235216, "epoch": 2833} {"train_loss": -24.69097328186035, "global_step": 235217, "epoch": 2833} {"train_loss": -24.86762046813965, "global_step": 235218, "epoch": 2833} {"train_loss": -24.742319107055664, "global_step": 235219, "epoch": 2833} {"train_loss": -24.443872451782227, "global_step": 235220, "epoch": 2833} {"train_loss": -24.79084506666804, "global_step": 235221, "epoch": 2833, "val_loss": 6755060.0} {"train_loss": -23.978002548217773, "global_step": 235222, "epoch": 2834} {"train_loss": -24.966428756713867, "global_step": 235223, "epoch": 2834} {"train_loss": -24.748966217041016, "global_step": 235224, "epoch": 2834} {"train_loss": -23.790170669555664, "global_step": 235225, "epoch": 2834} {"train_loss": -24.7520809173584, "global_step": 235226, "epoch": 2834} {"train_loss": -24.2413387298584, "global_step": 235227, "epoch": 2834} {"train_loss": -24.26325035095215, "global_step": 235228, "epoch": 2834} {"train_loss": -24.6214599609375, "global_step": 235229, "epoch": 2834} {"train_loss": -24.549684524536133, "global_step": 235230, "epoch": 2834} {"train_loss": -24.715185165405273, "global_step": 235231, "epoch": 2834} {"train_loss": -24.51596450805664, "global_step": 235232, "epoch": 2834} {"train_loss": -24.652177810668945, "global_step": 235233, "epoch": 2834} {"train_loss": -24.805509567260742, "global_step": 235234, "epoch": 2834} {"train_loss": -24.5396785736084, "global_step": 235235, "epoch": 2834} {"train_loss": -24.319284439086914, "global_step": 235236, "epoch": 2834} {"train_loss": -24.70090675354004, "global_step": 235237, "epoch": 2834} {"train_loss": -24.860946655273438, "global_step": 235238, "epoch": 2834} {"train_loss": -24.87375259399414, "global_step": 235239, "epoch": 2834} {"train_loss": -24.903867721557617, "global_step": 235240, "epoch": 2834} {"train_loss": -24.879005432128906, "global_step": 235241, "epoch": 2834} {"train_loss": -24.502338409423828, "global_step": 235242, "epoch": 2834} {"train_loss": -24.871606826782227, "global_step": 235243, "epoch": 2834} {"train_loss": -24.88478660583496, "global_step": 235244, "epoch": 2834} {"train_loss": -24.45993423461914, "global_step": 235245, "epoch": 2834} {"train_loss": -24.6916446685791, "global_step": 235246, "epoch": 2834} {"train_loss": -24.91847801208496, "global_step": 235247, "epoch": 2834} {"train_loss": -24.88654899597168, "global_step": 235248, "epoch": 2834} {"train_loss": -24.672937393188477, "global_step": 235249, "epoch": 2834} {"train_loss": -25.000146865844727, "global_step": 235250, "epoch": 2834} {"train_loss": -24.798885345458984, "global_step": 235251, "epoch": 2834} {"train_loss": -24.703821182250977, "global_step": 235252, "epoch": 2834} {"train_loss": -24.926694869995117, "global_step": 235253, "epoch": 2834} {"train_loss": -25.1662540435791, "global_step": 235254, "epoch": 2834} {"train_loss": -24.966764450073242, "global_step": 235255, "epoch": 2834} {"train_loss": -24.933835983276367, "global_step": 235256, "epoch": 2834} {"train_loss": -24.712949752807617, "global_step": 235257, "epoch": 2834} {"train_loss": -24.67933464050293, "global_step": 235258, "epoch": 2834} {"train_loss": -24.73343276977539, "global_step": 235259, "epoch": 2834} {"train_loss": -24.721158981323242, "global_step": 235260, "epoch": 2834} {"train_loss": -24.875200271606445, "global_step": 235261, "epoch": 2834} {"train_loss": -24.72450065612793, "global_step": 235262, "epoch": 2834} {"train_loss": -24.61334228515625, "global_step": 235263, "epoch": 2834} {"train_loss": -24.5738525390625, "global_step": 235264, "epoch": 2834} {"train_loss": -24.968320846557617, "global_step": 235265, "epoch": 2834} {"train_loss": -24.845935821533203, "global_step": 235266, "epoch": 2834} {"train_loss": -24.677236557006836, "global_step": 235267, "epoch": 2834} {"train_loss": -24.42791175842285, "global_step": 235268, "epoch": 2834} {"train_loss": -24.58905029296875, "global_step": 235269, "epoch": 2834} {"train_loss": -24.90968894958496, "global_step": 235270, "epoch": 2834} {"train_loss": -25.053319931030273, "global_step": 235271, "epoch": 2834} {"train_loss": -24.462263107299805, "global_step": 235272, "epoch": 2834} {"train_loss": -24.679738998413086, "global_step": 235273, "epoch": 2834} {"train_loss": -24.722192764282227, "global_step": 235274, "epoch": 2834} {"train_loss": -24.935304641723633, "global_step": 235275, "epoch": 2834} {"train_loss": -25.007808685302734, "global_step": 235276, "epoch": 2834} {"train_loss": -24.533447265625, "global_step": 235277, "epoch": 2834} {"train_loss": -24.754478454589844, "global_step": 235278, "epoch": 2834} {"train_loss": -24.991559982299805, "global_step": 235279, "epoch": 2834} {"train_loss": -24.918149948120117, "global_step": 235280, "epoch": 2834} {"train_loss": -24.66828155517578, "global_step": 235281, "epoch": 2834} {"train_loss": -25.001277923583984, "global_step": 235282, "epoch": 2834} {"train_loss": -24.728866577148438, "global_step": 235283, "epoch": 2834} {"train_loss": -24.285551071166992, "global_step": 235284, "epoch": 2834} {"train_loss": -24.710281372070312, "global_step": 235285, "epoch": 2834} {"train_loss": -25.09053611755371, "global_step": 235286, "epoch": 2834} {"train_loss": -25.224756240844727, "global_step": 235287, "epoch": 2834} {"train_loss": -24.8621883392334, "global_step": 235288, "epoch": 2834} {"train_loss": -25.07547950744629, "global_step": 235289, "epoch": 2834} {"train_loss": -25.300207138061523, "global_step": 235290, "epoch": 2834} {"train_loss": -24.853254318237305, "global_step": 235291, "epoch": 2834} {"train_loss": -24.962900161743164, "global_step": 235292, "epoch": 2834} {"train_loss": -24.696561813354492, "global_step": 235293, "epoch": 2834} {"train_loss": -24.875463485717773, "global_step": 235294, "epoch": 2834} {"train_loss": -24.742420196533203, "global_step": 235295, "epoch": 2834} {"train_loss": -25.079940795898438, "global_step": 235296, "epoch": 2834} {"train_loss": -24.561857223510742, "global_step": 235297, "epoch": 2834} {"train_loss": -24.853750228881836, "global_step": 235298, "epoch": 2834} {"train_loss": -24.577913284301758, "global_step": 235299, "epoch": 2834} {"train_loss": -24.691974639892578, "global_step": 235300, "epoch": 2834} {"train_loss": -24.8467960357666, "global_step": 235301, "epoch": 2834} {"train_loss": -24.567480087280273, "global_step": 235302, "epoch": 2834} {"train_loss": -25.320453643798828, "global_step": 235303, "epoch": 2834} {"train_loss": -24.771913988044464, "global_step": 235304, "epoch": 2834, "val_loss": 6760960.0} {"train_loss": -24.092283248901367, "global_step": 235305, "epoch": 2835} {"train_loss": -24.381582260131836, "global_step": 235306, "epoch": 2835} {"train_loss": -24.47376251220703, "global_step": 235307, "epoch": 2835} {"train_loss": -24.43614387512207, "global_step": 235308, "epoch": 2835} {"train_loss": -24.16448974609375, "global_step": 235309, "epoch": 2835} {"train_loss": -24.44854164123535, "global_step": 235310, "epoch": 2835} {"train_loss": -24.452564239501953, "global_step": 235311, "epoch": 2835} {"train_loss": -24.376462936401367, "global_step": 235312, "epoch": 2835} {"train_loss": -24.807233810424805, "global_step": 235313, "epoch": 2835} {"train_loss": -24.535308837890625, "global_step": 235314, "epoch": 2835} {"train_loss": -24.580520629882812, "global_step": 235315, "epoch": 2835} {"train_loss": -24.39948272705078, "global_step": 235316, "epoch": 2835} {"train_loss": -24.719135284423828, "global_step": 235317, "epoch": 2835} {"train_loss": -24.495487213134766, "global_step": 235318, "epoch": 2835} {"train_loss": -24.559110641479492, "global_step": 235319, "epoch": 2835} {"train_loss": -24.47495460510254, "global_step": 235320, "epoch": 2835} {"train_loss": -24.64882469177246, "global_step": 235321, "epoch": 2835} {"train_loss": -24.795413970947266, "global_step": 235322, "epoch": 2835} {"train_loss": -24.7058162689209, "global_step": 235323, "epoch": 2835} {"train_loss": -24.659692764282227, "global_step": 235324, "epoch": 2835} {"train_loss": -24.859111785888672, "global_step": 235325, "epoch": 2835} {"train_loss": -25.0866756439209, "global_step": 235326, "epoch": 2835} {"train_loss": -24.78334617614746, "global_step": 235327, "epoch": 2835} {"train_loss": -24.86408042907715, "global_step": 235328, "epoch": 2835} {"train_loss": -25.084611892700195, "global_step": 235329, "epoch": 2835} {"train_loss": -24.841293334960938, "global_step": 235330, "epoch": 2835} {"train_loss": -24.485628128051758, "global_step": 235331, "epoch": 2835} {"train_loss": -24.646177291870117, "global_step": 235332, "epoch": 2835} {"train_loss": -24.69966697692871, "global_step": 235333, "epoch": 2835} {"train_loss": -25.223188400268555, "global_step": 235334, "epoch": 2835} {"train_loss": -25.33567237854004, "global_step": 235335, "epoch": 2835} {"train_loss": -25.171314239501953, "global_step": 235336, "epoch": 2835} {"train_loss": -24.545501708984375, "global_step": 235337, "epoch": 2835} {"train_loss": -24.718420028686523, "global_step": 235338, "epoch": 2835} {"train_loss": -24.68071937561035, "global_step": 235339, "epoch": 2835} {"train_loss": -24.750898361206055, "global_step": 235340, "epoch": 2835} {"train_loss": -24.53480339050293, "global_step": 235341, "epoch": 2835} {"train_loss": -24.170806884765625, "global_step": 235342, "epoch": 2835} {"train_loss": -25.247089385986328, "global_step": 235343, "epoch": 2835} {"train_loss": -24.7493953704834, "global_step": 235344, "epoch": 2835} {"train_loss": -24.14852523803711, "global_step": 235345, "epoch": 2835} {"train_loss": -24.517004013061523, "global_step": 235346, "epoch": 2835} {"train_loss": -24.638227462768555, "global_step": 235347, "epoch": 2835} {"train_loss": -24.582992553710938, "global_step": 235348, "epoch": 2835} {"train_loss": -24.3782958984375, "global_step": 235349, "epoch": 2835} {"train_loss": -24.690088272094727, "global_step": 235350, "epoch": 2835} {"train_loss": -24.53386688232422, "global_step": 235351, "epoch": 2835} {"train_loss": -24.86957359313965, "global_step": 235352, "epoch": 2835} {"train_loss": -23.810184478759766, "global_step": 235353, "epoch": 2835} {"train_loss": -24.300878524780273, "global_step": 235354, "epoch": 2835} {"train_loss": -24.315210342407227, "global_step": 235355, "epoch": 2835} {"train_loss": -24.23221206665039, "global_step": 235356, "epoch": 2835} {"train_loss": -24.828842163085938, "global_step": 235357, "epoch": 2835} {"train_loss": -24.33078956604004, "global_step": 235358, "epoch": 2835} {"train_loss": -24.879064559936523, "global_step": 235359, "epoch": 2835} {"train_loss": -24.388341903686523, "global_step": 235360, "epoch": 2835} {"train_loss": -24.63109016418457, "global_step": 235361, "epoch": 2835} {"train_loss": -24.585784912109375, "global_step": 235362, "epoch": 2835} {"train_loss": -24.177213668823242, "global_step": 235363, "epoch": 2835} {"train_loss": -24.58839988708496, "global_step": 235364, "epoch": 2835} {"train_loss": -24.688613891601562, "global_step": 235365, "epoch": 2835} {"train_loss": -24.387014389038086, "global_step": 235366, "epoch": 2835} {"train_loss": -24.64873695373535, "global_step": 235367, "epoch": 2835} {"train_loss": -24.249914169311523, "global_step": 235368, "epoch": 2835} {"train_loss": -24.492786407470703, "global_step": 235369, "epoch": 2835} {"train_loss": -24.6112003326416, "global_step": 235370, "epoch": 2835} {"train_loss": -24.67689323425293, "global_step": 235371, "epoch": 2835} {"train_loss": -24.87647819519043, "global_step": 235372, "epoch": 2835} {"train_loss": -24.568119049072266, "global_step": 235373, "epoch": 2835} {"train_loss": -24.712995529174805, "global_step": 235374, "epoch": 2835} {"train_loss": -24.656173706054688, "global_step": 235375, "epoch": 2835} {"train_loss": -24.578672409057617, "global_step": 235376, "epoch": 2835} {"train_loss": -24.837038040161133, "global_step": 235377, "epoch": 2835} {"train_loss": -24.756338119506836, "global_step": 235378, "epoch": 2835} {"train_loss": -24.285842895507812, "global_step": 235379, "epoch": 2835} {"train_loss": -24.771032333374023, "global_step": 235380, "epoch": 2835} {"train_loss": -24.83649253845215, "global_step": 235381, "epoch": 2835} {"train_loss": -25.199735641479492, "global_step": 235382, "epoch": 2835} {"train_loss": -24.669677734375, "global_step": 235383, "epoch": 2835} {"train_loss": -24.610279083251953, "global_step": 235384, "epoch": 2835} {"train_loss": -24.902271270751953, "global_step": 235385, "epoch": 2835} {"train_loss": -24.83930015563965, "global_step": 235386, "epoch": 2835} {"train_loss": -24.604170282203032, "global_step": 235387, "epoch": 2835, "val_loss": 6837671.0} {"train_loss": -24.2779483795166, "global_step": 235388, "epoch": 2836} {"train_loss": -24.406850814819336, "global_step": 235389, "epoch": 2836} {"train_loss": -24.278711318969727, "global_step": 235390, "epoch": 2836} {"train_loss": -24.365814208984375, "global_step": 235391, "epoch": 2836} {"train_loss": -24.717761993408203, "global_step": 235392, "epoch": 2836} {"train_loss": -24.578739166259766, "global_step": 235393, "epoch": 2836} {"train_loss": -24.1083927154541, "global_step": 235394, "epoch": 2836} {"train_loss": -24.523588180541992, "global_step": 235395, "epoch": 2836} {"train_loss": -24.450424194335938, "global_step": 235396, "epoch": 2836} {"train_loss": -24.60038185119629, "global_step": 235397, "epoch": 2836} {"train_loss": -24.59430694580078, "global_step": 235398, "epoch": 2836} {"train_loss": -24.91497802734375, "global_step": 235399, "epoch": 2836} {"train_loss": -24.893735885620117, "global_step": 235400, "epoch": 2836} {"train_loss": -24.808332443237305, "global_step": 235401, "epoch": 2836} {"train_loss": -24.808908462524414, "global_step": 235402, "epoch": 2836} {"train_loss": -24.72650718688965, "global_step": 235403, "epoch": 2836} {"train_loss": -24.509342193603516, "global_step": 235404, "epoch": 2836} {"train_loss": -24.731800079345703, "global_step": 235405, "epoch": 2836} {"train_loss": -25.279314041137695, "global_step": 235406, "epoch": 2836} {"train_loss": -24.920452117919922, "global_step": 235407, "epoch": 2836} {"train_loss": -24.717313766479492, "global_step": 235408, "epoch": 2836} {"train_loss": -25.205137252807617, "global_step": 235409, "epoch": 2836} {"train_loss": -24.78420639038086, "global_step": 235410, "epoch": 2836} {"train_loss": -24.99397850036621, "global_step": 235411, "epoch": 2836} {"train_loss": -24.771024703979492, "global_step": 235412, "epoch": 2836} {"train_loss": -24.867704391479492, "global_step": 235413, "epoch": 2836} {"train_loss": -24.67951202392578, "global_step": 235414, "epoch": 2836} {"train_loss": -24.969558715820312, "global_step": 235415, "epoch": 2836} {"train_loss": -24.867725372314453, "global_step": 235416, "epoch": 2836} {"train_loss": -25.02894401550293, "global_step": 235417, "epoch": 2836} {"train_loss": -25.0375919342041, "global_step": 235418, "epoch": 2836} {"train_loss": -24.90997314453125, "global_step": 235419, "epoch": 2836} {"train_loss": -24.73659324645996, "global_step": 235420, "epoch": 2836} {"train_loss": -24.72713279724121, "global_step": 235421, "epoch": 2836} {"train_loss": -24.93484878540039, "global_step": 235422, "epoch": 2836} {"train_loss": -24.941884994506836, "global_step": 235423, "epoch": 2836} {"train_loss": -24.42506217956543, "global_step": 235424, "epoch": 2836} {"train_loss": -24.611520767211914, "global_step": 235425, "epoch": 2836} {"train_loss": -24.652494430541992, "global_step": 235426, "epoch": 2836} {"train_loss": -24.3713321685791, "global_step": 235427, "epoch": 2836} {"train_loss": -24.720457077026367, "global_step": 235428, "epoch": 2836} {"train_loss": -24.90694808959961, "global_step": 235429, "epoch": 2836} {"train_loss": -24.748062133789062, "global_step": 235430, "epoch": 2836} {"train_loss": -24.60511589050293, "global_step": 235431, "epoch": 2836} {"train_loss": -24.729368209838867, "global_step": 235432, "epoch": 2836} {"train_loss": -25.0017147064209, "global_step": 235433, "epoch": 2836} {"train_loss": -24.75531578063965, "global_step": 235434, "epoch": 2836} {"train_loss": -24.322113037109375, "global_step": 235435, "epoch": 2836} {"train_loss": -25.161441802978516, "global_step": 235436, "epoch": 2836} {"train_loss": -24.461450576782227, "global_step": 235437, "epoch": 2836} {"train_loss": -24.723068237304688, "global_step": 235438, "epoch": 2836} {"train_loss": -24.732410430908203, "global_step": 235439, "epoch": 2836} {"train_loss": -24.64693260192871, "global_step": 235440, "epoch": 2836} {"train_loss": -24.515209197998047, "global_step": 235441, "epoch": 2836} {"train_loss": -24.49281883239746, "global_step": 235442, "epoch": 2836} {"train_loss": -24.767255783081055, "global_step": 235443, "epoch": 2836} {"train_loss": -24.95671272277832, "global_step": 235444, "epoch": 2836} {"train_loss": -24.784902572631836, "global_step": 235445, "epoch": 2836} {"train_loss": -24.826231002807617, "global_step": 235446, "epoch": 2836} {"train_loss": -24.602109909057617, "global_step": 235447, "epoch": 2836} {"train_loss": -24.904678344726562, "global_step": 235448, "epoch": 2836} {"train_loss": -24.897462844848633, "global_step": 235449, "epoch": 2836} {"train_loss": -24.7662353515625, "global_step": 235450, "epoch": 2836} {"train_loss": -24.93788719177246, "global_step": 235451, "epoch": 2836} {"train_loss": -24.948514938354492, "global_step": 235452, "epoch": 2836} {"train_loss": -24.876972198486328, "global_step": 235453, "epoch": 2836} {"train_loss": -24.9769344329834, "global_step": 235454, "epoch": 2836} {"train_loss": -24.846914291381836, "global_step": 235455, "epoch": 2836} {"train_loss": -24.870315551757812, "global_step": 235456, "epoch": 2836} {"train_loss": -24.82571792602539, "global_step": 235457, "epoch": 2836} {"train_loss": -24.952106475830078, "global_step": 235458, "epoch": 2836} {"train_loss": -24.985565185546875, "global_step": 235459, "epoch": 2836} {"train_loss": -25.099987030029297, "global_step": 235460, "epoch": 2836} {"train_loss": -24.67959976196289, "global_step": 235461, "epoch": 2836} {"train_loss": -24.969663619995117, "global_step": 235462, "epoch": 2836} {"train_loss": -24.96428871154785, "global_step": 235463, "epoch": 2836} {"train_loss": -24.71637535095215, "global_step": 235464, "epoch": 2836} {"train_loss": -25.083524703979492, "global_step": 235465, "epoch": 2836} {"train_loss": -24.603309631347656, "global_step": 235466, "epoch": 2836} {"train_loss": -25.506956100463867, "global_step": 235467, "epoch": 2836} {"train_loss": -24.857389450073242, "global_step": 235468, "epoch": 2836} {"train_loss": -25.262788772583008, "global_step": 235469, "epoch": 2836} {"train_loss": -24.770999265004352, "global_step": 235470, "epoch": 2836, "val_loss": 6695454.0} {"train_loss": -24.464487075805664, "global_step": 235471, "epoch": 2837} {"train_loss": -23.996980667114258, "global_step": 235472, "epoch": 2837} {"train_loss": -24.456235885620117, "global_step": 235473, "epoch": 2837} {"train_loss": -24.44012451171875, "global_step": 235474, "epoch": 2837} {"train_loss": -24.16542625427246, "global_step": 235475, "epoch": 2837} {"train_loss": -24.88360595703125, "global_step": 235476, "epoch": 2837} {"train_loss": -24.44608497619629, "global_step": 235477, "epoch": 2837} {"train_loss": -24.83555030822754, "global_step": 235478, "epoch": 2837} {"train_loss": -24.695032119750977, "global_step": 235479, "epoch": 2837} {"train_loss": -24.888463973999023, "global_step": 235480, "epoch": 2837} {"train_loss": -24.850345611572266, "global_step": 235481, "epoch": 2837} {"train_loss": -24.866653442382812, "global_step": 235482, "epoch": 2837} {"train_loss": -24.75650978088379, "global_step": 235483, "epoch": 2837} {"train_loss": -25.105737686157227, "global_step": 235484, "epoch": 2837} {"train_loss": -24.551380157470703, "global_step": 235485, "epoch": 2837} {"train_loss": -24.729711532592773, "global_step": 235486, "epoch": 2837} {"train_loss": -24.998737335205078, "global_step": 235487, "epoch": 2837} {"train_loss": -24.832626342773438, "global_step": 235488, "epoch": 2837} {"train_loss": -25.151321411132812, "global_step": 235489, "epoch": 2837} {"train_loss": -24.668846130371094, "global_step": 235490, "epoch": 2837} {"train_loss": -24.543237686157227, "global_step": 235491, "epoch": 2837} {"train_loss": -24.44642448425293, "global_step": 235492, "epoch": 2837} {"train_loss": -24.595203399658203, "global_step": 235493, "epoch": 2837} {"train_loss": -24.895244598388672, "global_step": 235494, "epoch": 2837} {"train_loss": -24.571348190307617, "global_step": 235495, "epoch": 2837} {"train_loss": -24.508211135864258, "global_step": 235496, "epoch": 2837} {"train_loss": -25.094085693359375, "global_step": 235497, "epoch": 2837} {"train_loss": -24.90925407409668, "global_step": 235498, "epoch": 2837} {"train_loss": -24.793272018432617, "global_step": 235499, "epoch": 2837} {"train_loss": -24.215970993041992, "global_step": 235500, "epoch": 2837} {"train_loss": -24.38966178894043, "global_step": 235501, "epoch": 2837} {"train_loss": -24.69485092163086, "global_step": 235502, "epoch": 2837} {"train_loss": -24.526065826416016, "global_step": 235503, "epoch": 2837} {"train_loss": -24.86305046081543, "global_step": 235504, "epoch": 2837} {"train_loss": -24.803266525268555, "global_step": 235505, "epoch": 2837} {"train_loss": -24.6947078704834, "global_step": 235506, "epoch": 2837} {"train_loss": -24.90000343322754, "global_step": 235507, "epoch": 2837} {"train_loss": -25.078481674194336, "global_step": 235508, "epoch": 2837} {"train_loss": -24.44202995300293, "global_step": 235509, "epoch": 2837} {"train_loss": -24.563751220703125, "global_step": 235510, "epoch": 2837} {"train_loss": -24.5788516998291, "global_step": 235511, "epoch": 2837} {"train_loss": -25.012033462524414, "global_step": 235512, "epoch": 2837} {"train_loss": -24.681747436523438, "global_step": 235513, "epoch": 2837} {"train_loss": -24.772907257080078, "global_step": 235514, "epoch": 2837} {"train_loss": -24.39497184753418, "global_step": 235515, "epoch": 2837} {"train_loss": -24.489866256713867, "global_step": 235516, "epoch": 2837} {"train_loss": -24.541475296020508, "global_step": 235517, "epoch": 2837} {"train_loss": -24.83449363708496, "global_step": 235518, "epoch": 2837} {"train_loss": -24.75844383239746, "global_step": 235519, "epoch": 2837} {"train_loss": -24.450071334838867, "global_step": 235520, "epoch": 2837} {"train_loss": -25.044309616088867, "global_step": 235521, "epoch": 2837} {"train_loss": -24.817035675048828, "global_step": 235522, "epoch": 2837} {"train_loss": -24.62835693359375, "global_step": 235523, "epoch": 2837} {"train_loss": -24.701343536376953, "global_step": 235524, "epoch": 2837} {"train_loss": -24.93611717224121, "global_step": 235525, "epoch": 2837} {"train_loss": -25.268884658813477, "global_step": 235526, "epoch": 2837} {"train_loss": -24.922985076904297, "global_step": 235527, "epoch": 2837} {"train_loss": -24.89151954650879, "global_step": 235528, "epoch": 2837} {"train_loss": -24.790298461914062, "global_step": 235529, "epoch": 2837} {"train_loss": -25.00298309326172, "global_step": 235530, "epoch": 2837} {"train_loss": -24.70738983154297, "global_step": 235531, "epoch": 2837} {"train_loss": -24.94101333618164, "global_step": 235532, "epoch": 2837} {"train_loss": -24.67734146118164, "global_step": 235533, "epoch": 2837} {"train_loss": -25.04648780822754, "global_step": 235534, "epoch": 2837} {"train_loss": -24.786386489868164, "global_step": 235535, "epoch": 2837} {"train_loss": -24.997522354125977, "global_step": 235536, "epoch": 2837} {"train_loss": -25.025129318237305, "global_step": 235537, "epoch": 2837} {"train_loss": -24.3007869720459, "global_step": 235538, "epoch": 2837} {"train_loss": -24.98902702331543, "global_step": 235539, "epoch": 2837} {"train_loss": -24.479665756225586, "global_step": 235540, "epoch": 2837} {"train_loss": -24.51081657409668, "global_step": 235541, "epoch": 2837} {"train_loss": -24.847700119018555, "global_step": 235542, "epoch": 2837} {"train_loss": -25.053176879882812, "global_step": 235543, "epoch": 2837} {"train_loss": -24.63446617126465, "global_step": 235544, "epoch": 2837} {"train_loss": -24.805532455444336, "global_step": 235545, "epoch": 2837} {"train_loss": -24.726703643798828, "global_step": 235546, "epoch": 2837} {"train_loss": -24.800344467163086, "global_step": 235547, "epoch": 2837} {"train_loss": -24.469125747680664, "global_step": 235548, "epoch": 2837} {"train_loss": -24.98701286315918, "global_step": 235549, "epoch": 2837} {"train_loss": -24.701887130737305, "global_step": 235550, "epoch": 2837} {"train_loss": -24.966413497924805, "global_step": 235551, "epoch": 2837} {"train_loss": -24.649595260620117, "global_step": 235552, "epoch": 2837} {"train_loss": -24.731231068990315, "global_step": 235553, "epoch": 2837, "val_loss": 6799585.0} {"train_loss": -24.62244987487793, "global_step": 235554, "epoch": 2838} {"train_loss": -24.784286499023438, "global_step": 235555, "epoch": 2838} {"train_loss": -24.81644630432129, "global_step": 235556, "epoch": 2838} {"train_loss": -24.36798667907715, "global_step": 235557, "epoch": 2838} {"train_loss": -24.45777702331543, "global_step": 235558, "epoch": 2838} {"train_loss": -24.370702743530273, "global_step": 235559, "epoch": 2838} {"train_loss": -24.653024673461914, "global_step": 235560, "epoch": 2838} {"train_loss": -24.413793563842773, "global_step": 235561, "epoch": 2838} {"train_loss": -24.4955997467041, "global_step": 235562, "epoch": 2838} {"train_loss": -24.81476402282715, "global_step": 235563, "epoch": 2838} {"train_loss": -24.955556869506836, "global_step": 235564, "epoch": 2838} {"train_loss": -24.45862579345703, "global_step": 235565, "epoch": 2838} {"train_loss": -24.66387367248535, "global_step": 235566, "epoch": 2838} {"train_loss": -24.93098258972168, "global_step": 235567, "epoch": 2838} {"train_loss": -24.673341751098633, "global_step": 235568, "epoch": 2838} {"train_loss": -23.994037628173828, "global_step": 235569, "epoch": 2838} {"train_loss": -24.410009384155273, "global_step": 235570, "epoch": 2838} {"train_loss": -24.545413970947266, "global_step": 235571, "epoch": 2838} {"train_loss": -24.49690055847168, "global_step": 235572, "epoch": 2838} {"train_loss": -24.30585289001465, "global_step": 235573, "epoch": 2838} {"train_loss": -24.56954002380371, "global_step": 235574, "epoch": 2838} {"train_loss": -24.174673080444336, "global_step": 235575, "epoch": 2838} {"train_loss": -24.46933364868164, "global_step": 235576, "epoch": 2838} {"train_loss": -24.48005485534668, "global_step": 235577, "epoch": 2838} {"train_loss": -24.538440704345703, "global_step": 235578, "epoch": 2838} {"train_loss": -24.692951202392578, "global_step": 235579, "epoch": 2838} {"train_loss": -24.967636108398438, "global_step": 235580, "epoch": 2838} {"train_loss": -24.6378173828125, "global_step": 235581, "epoch": 2838} {"train_loss": -24.581335067749023, "global_step": 235582, "epoch": 2838} {"train_loss": -24.8856143951416, "global_step": 235583, "epoch": 2838} {"train_loss": -24.830121994018555, "global_step": 235584, "epoch": 2838} {"train_loss": -25.319177627563477, "global_step": 235585, "epoch": 2838} {"train_loss": -24.75660514831543, "global_step": 235586, "epoch": 2838} {"train_loss": -25.074552536010742, "global_step": 235587, "epoch": 2838} {"train_loss": -25.4188175201416, "global_step": 235588, "epoch": 2838} {"train_loss": -24.804508209228516, "global_step": 235589, "epoch": 2838} {"train_loss": -24.84844970703125, "global_step": 235590, "epoch": 2838} {"train_loss": -25.234954833984375, "global_step": 235591, "epoch": 2838} {"train_loss": -24.884571075439453, "global_step": 235592, "epoch": 2838} {"train_loss": -25.478811264038086, "global_step": 235593, "epoch": 2838} {"train_loss": -25.34467124938965, "global_step": 235594, "epoch": 2838} {"train_loss": -25.103267669677734, "global_step": 235595, "epoch": 2838} {"train_loss": -24.88237953186035, "global_step": 235596, "epoch": 2838} {"train_loss": -24.784549713134766, "global_step": 235597, "epoch": 2838} {"train_loss": -25.432035446166992, "global_step": 235598, "epoch": 2838} {"train_loss": -25.22430419921875, "global_step": 235599, "epoch": 2838} {"train_loss": -24.790021896362305, "global_step": 235600, "epoch": 2838} {"train_loss": -24.6423397064209, "global_step": 235601, "epoch": 2838} {"train_loss": -24.866567611694336, "global_step": 235602, "epoch": 2838} {"train_loss": -24.862146377563477, "global_step": 235603, "epoch": 2838} {"train_loss": -24.542959213256836, "global_step": 235604, "epoch": 2838} {"train_loss": -24.983722686767578, "global_step": 235605, "epoch": 2838} {"train_loss": -24.819562911987305, "global_step": 235606, "epoch": 2838} {"train_loss": -24.933507919311523, "global_step": 235607, "epoch": 2838} {"train_loss": -24.70549774169922, "global_step": 235608, "epoch": 2838} {"train_loss": -24.8798770904541, "global_step": 235609, "epoch": 2838} {"train_loss": -24.675649642944336, "global_step": 235610, "epoch": 2838} {"train_loss": -24.928070068359375, "global_step": 235611, "epoch": 2838} {"train_loss": -25.01511001586914, "global_step": 235612, "epoch": 2838} {"train_loss": -24.592153549194336, "global_step": 235613, "epoch": 2838} {"train_loss": -24.850528717041016, "global_step": 235614, "epoch": 2838} {"train_loss": -24.485380172729492, "global_step": 235615, "epoch": 2838} {"train_loss": -24.695844650268555, "global_step": 235616, "epoch": 2838} {"train_loss": -24.863737106323242, "global_step": 235617, "epoch": 2838} {"train_loss": -24.60913848876953, "global_step": 235618, "epoch": 2838} {"train_loss": -24.609094619750977, "global_step": 235619, "epoch": 2838} {"train_loss": -24.84796905517578, "global_step": 235620, "epoch": 2838} {"train_loss": -24.942975997924805, "global_step": 235621, "epoch": 2838} {"train_loss": -24.850351333618164, "global_step": 235622, "epoch": 2838} {"train_loss": -24.97077751159668, "global_step": 235623, "epoch": 2838} {"train_loss": -25.013660430908203, "global_step": 235624, "epoch": 2838} {"train_loss": -24.679433822631836, "global_step": 235625, "epoch": 2838} {"train_loss": -24.69099998474121, "global_step": 235626, "epoch": 2838} {"train_loss": -24.897274017333984, "global_step": 235627, "epoch": 2838} {"train_loss": -24.892675399780273, "global_step": 235628, "epoch": 2838} {"train_loss": -25.0313663482666, "global_step": 235629, "epoch": 2838} {"train_loss": -24.88933563232422, "global_step": 235630, "epoch": 2838} {"train_loss": -25.394437789916992, "global_step": 235631, "epoch": 2838} {"train_loss": -24.89971923828125, "global_step": 235632, "epoch": 2838} {"train_loss": -24.777685165405273, "global_step": 235633, "epoch": 2838} {"train_loss": -25.20856285095215, "global_step": 235634, "epoch": 2838} {"train_loss": -24.822078704833984, "global_step": 235635, "epoch": 2838} {"train_loss": -24.79564253106175, "global_step": 235636, "epoch": 2838, "val_loss": 6775955.0} {"train_loss": -24.557723999023438, "global_step": 235637, "epoch": 2839} {"train_loss": -24.092029571533203, "global_step": 235638, "epoch": 2839} {"train_loss": -24.81256103515625, "global_step": 235639, "epoch": 2839} {"train_loss": -24.58542251586914, "global_step": 235640, "epoch": 2839} {"train_loss": -24.31754493713379, "global_step": 235641, "epoch": 2839} {"train_loss": -24.666675567626953, "global_step": 235642, "epoch": 2839} {"train_loss": -24.781347274780273, "global_step": 235643, "epoch": 2839} {"train_loss": -24.628196716308594, "global_step": 235644, "epoch": 2839} {"train_loss": -24.376264572143555, "global_step": 235645, "epoch": 2839} {"train_loss": -24.741500854492188, "global_step": 235646, "epoch": 2839} {"train_loss": -24.80428695678711, "global_step": 235647, "epoch": 2839} {"train_loss": -24.640182495117188, "global_step": 235648, "epoch": 2839} {"train_loss": -24.76312255859375, "global_step": 235649, "epoch": 2839} {"train_loss": -24.600820541381836, "global_step": 235650, "epoch": 2839} {"train_loss": -25.001434326171875, "global_step": 235651, "epoch": 2839} {"train_loss": -24.79620933532715, "global_step": 235652, "epoch": 2839} {"train_loss": -24.822751998901367, "global_step": 235653, "epoch": 2839} {"train_loss": -25.387649536132812, "global_step": 235654, "epoch": 2839} {"train_loss": -24.5983943939209, "global_step": 235655, "epoch": 2839} {"train_loss": -24.699914932250977, "global_step": 235656, "epoch": 2839} {"train_loss": -24.64156723022461, "global_step": 235657, "epoch": 2839} {"train_loss": -24.471670150756836, "global_step": 235658, "epoch": 2839} {"train_loss": -24.605621337890625, "global_step": 235659, "epoch": 2839} {"train_loss": -24.999807357788086, "global_step": 235660, "epoch": 2839} {"train_loss": -24.694982528686523, "global_step": 235661, "epoch": 2839} {"train_loss": -24.88214874267578, "global_step": 235662, "epoch": 2839} {"train_loss": -24.690677642822266, "global_step": 235663, "epoch": 2839} {"train_loss": -24.44719886779785, "global_step": 235664, "epoch": 2839} {"train_loss": -24.979421615600586, "global_step": 235665, "epoch": 2839} {"train_loss": -24.946670532226562, "global_step": 235666, "epoch": 2839} {"train_loss": -24.954923629760742, "global_step": 235667, "epoch": 2839} {"train_loss": -24.936025619506836, "global_step": 235668, "epoch": 2839} {"train_loss": -24.87154197692871, "global_step": 235669, "epoch": 2839} {"train_loss": -24.587116241455078, "global_step": 235670, "epoch": 2839} {"train_loss": -25.07911491394043, "global_step": 235671, "epoch": 2839} {"train_loss": -24.75410270690918, "global_step": 235672, "epoch": 2839} {"train_loss": -24.885549545288086, "global_step": 235673, "epoch": 2839} {"train_loss": -25.017871856689453, "global_step": 235674, "epoch": 2839} {"train_loss": -25.2305965423584, "global_step": 235675, "epoch": 2839} {"train_loss": -25.098112106323242, "global_step": 235676, "epoch": 2839} {"train_loss": -24.866634368896484, "global_step": 235677, "epoch": 2839} {"train_loss": -24.668188095092773, "global_step": 235678, "epoch": 2839} {"train_loss": -24.95923614501953, "global_step": 235679, "epoch": 2839} {"train_loss": -24.80084800720215, "global_step": 235680, "epoch": 2839} {"train_loss": -25.1964168548584, "global_step": 235681, "epoch": 2839} {"train_loss": -25.05519676208496, "global_step": 235682, "epoch": 2839} {"train_loss": -24.923227310180664, "global_step": 235683, "epoch": 2839} {"train_loss": -24.797048568725586, "global_step": 235684, "epoch": 2839} {"train_loss": -24.905309677124023, "global_step": 235685, "epoch": 2839} {"train_loss": -24.99839973449707, "global_step": 235686, "epoch": 2839} {"train_loss": -25.00667953491211, "global_step": 235687, "epoch": 2839} {"train_loss": -24.86685562133789, "global_step": 235688, "epoch": 2839} {"train_loss": -24.961383819580078, "global_step": 235689, "epoch": 2839} {"train_loss": -24.50070571899414, "global_step": 235690, "epoch": 2839} {"train_loss": -24.840787887573242, "global_step": 235691, "epoch": 2839} {"train_loss": -24.685529708862305, "global_step": 235692, "epoch": 2839} {"train_loss": -25.10324478149414, "global_step": 235693, "epoch": 2839} {"train_loss": -24.65443992614746, "global_step": 235694, "epoch": 2839} {"train_loss": -24.944562911987305, "global_step": 235695, "epoch": 2839} {"train_loss": -24.824270248413086, "global_step": 235696, "epoch": 2839} {"train_loss": -24.660001754760742, "global_step": 235697, "epoch": 2839} {"train_loss": -24.914541244506836, "global_step": 235698, "epoch": 2839} {"train_loss": -25.031553268432617, "global_step": 235699, "epoch": 2839} {"train_loss": -24.6075496673584, "global_step": 235700, "epoch": 2839} {"train_loss": -24.61663818359375, "global_step": 235701, "epoch": 2839} {"train_loss": -24.48719024658203, "global_step": 235702, "epoch": 2839} {"train_loss": -24.831926345825195, "global_step": 235703, "epoch": 2839} {"train_loss": -24.75446128845215, "global_step": 235704, "epoch": 2839} {"train_loss": -24.493139266967773, "global_step": 235705, "epoch": 2839} {"train_loss": -24.92877197265625, "global_step": 235706, "epoch": 2839} {"train_loss": -24.81627082824707, "global_step": 235707, "epoch": 2839} {"train_loss": -24.323627471923828, "global_step": 235708, "epoch": 2839} {"train_loss": -24.84342384338379, "global_step": 235709, "epoch": 2839} {"train_loss": -24.83431053161621, "global_step": 235710, "epoch": 2839} {"train_loss": -24.39426612854004, "global_step": 235711, "epoch": 2839} {"train_loss": -24.43910789489746, "global_step": 235712, "epoch": 2839} {"train_loss": -24.768646240234375, "global_step": 235713, "epoch": 2839} {"train_loss": -24.921628952026367, "global_step": 235714, "epoch": 2839} {"train_loss": -24.326095581054688, "global_step": 235715, "epoch": 2839} {"train_loss": -24.866052627563477, "global_step": 235716, "epoch": 2839} {"train_loss": -24.608930587768555, "global_step": 235717, "epoch": 2839} {"train_loss": -24.61966896057129, "global_step": 235718, "epoch": 2839} {"train_loss": -24.781294144779803, "global_step": 235719, "epoch": 2839, "val_loss": 6778295.0} {"train_loss": -23.501562118530273, "global_step": 235720, "epoch": 2840} {"train_loss": -23.782094955444336, "global_step": 235721, "epoch": 2840} {"train_loss": -23.906274795532227, "global_step": 235722, "epoch": 2840} {"train_loss": -23.85066795349121, "global_step": 235723, "epoch": 2840} {"train_loss": -23.934803009033203, "global_step": 235724, "epoch": 2840} {"train_loss": -23.940053939819336, "global_step": 235725, "epoch": 2840} {"train_loss": -24.068082809448242, "global_step": 235726, "epoch": 2840} {"train_loss": -24.37369155883789, "global_step": 235727, "epoch": 2840} {"train_loss": -24.40264320373535, "global_step": 235728, "epoch": 2840} {"train_loss": -24.201160430908203, "global_step": 235729, "epoch": 2840} {"train_loss": -24.125228881835938, "global_step": 235730, "epoch": 2840} {"train_loss": -24.220998764038086, "global_step": 235731, "epoch": 2840} {"train_loss": -24.17578125, "global_step": 235732, "epoch": 2840} {"train_loss": -24.52399444580078, "global_step": 235733, "epoch": 2840} {"train_loss": -24.33844566345215, "global_step": 235734, "epoch": 2840} {"train_loss": -24.020877838134766, "global_step": 235735, "epoch": 2840} {"train_loss": -24.195390701293945, "global_step": 235736, "epoch": 2840} {"train_loss": -24.572162628173828, "global_step": 235737, "epoch": 2840} {"train_loss": -24.538217544555664, "global_step": 235738, "epoch": 2840} {"train_loss": -24.663867950439453, "global_step": 235739, "epoch": 2840} {"train_loss": -24.367671966552734, "global_step": 235740, "epoch": 2840} {"train_loss": -24.787946701049805, "global_step": 235741, "epoch": 2840} {"train_loss": -24.624792098999023, "global_step": 235742, "epoch": 2840} {"train_loss": -24.50065040588379, "global_step": 235743, "epoch": 2840} {"train_loss": -24.14386558532715, "global_step": 235744, "epoch": 2840} {"train_loss": -24.675485610961914, "global_step": 235745, "epoch": 2840} {"train_loss": -24.560009002685547, "global_step": 235746, "epoch": 2840} {"train_loss": -24.841079711914062, "global_step": 235747, "epoch": 2840} {"train_loss": -24.6732234954834, "global_step": 235748, "epoch": 2840} {"train_loss": -24.99468994140625, "global_step": 235749, "epoch": 2840} {"train_loss": -25.017223358154297, "global_step": 235750, "epoch": 2840} {"train_loss": -24.84866714477539, "global_step": 235751, "epoch": 2840} {"train_loss": -24.841373443603516, "global_step": 235752, "epoch": 2840} {"train_loss": -24.539579391479492, "global_step": 235753, "epoch": 2840} {"train_loss": -25.086929321289062, "global_step": 235754, "epoch": 2840} {"train_loss": -25.087486267089844, "global_step": 235755, "epoch": 2840} {"train_loss": -24.857290267944336, "global_step": 235756, "epoch": 2840} {"train_loss": -24.82423973083496, "global_step": 235757, "epoch": 2840} {"train_loss": -24.44833755493164, "global_step": 235758, "epoch": 2840} {"train_loss": -24.72092628479004, "global_step": 235759, "epoch": 2840} {"train_loss": -24.9285888671875, "global_step": 235760, "epoch": 2840} {"train_loss": -24.808504104614258, "global_step": 235761, "epoch": 2840} {"train_loss": -24.51337242126465, "global_step": 235762, "epoch": 2840} {"train_loss": -24.819543838500977, "global_step": 235763, "epoch": 2840} {"train_loss": -24.894445419311523, "global_step": 235764, "epoch": 2840} {"train_loss": -25.224105834960938, "global_step": 235765, "epoch": 2840} {"train_loss": -25.055070877075195, "global_step": 235766, "epoch": 2840} {"train_loss": -24.58892822265625, "global_step": 235767, "epoch": 2840} {"train_loss": -24.47224235534668, "global_step": 235768, "epoch": 2840} {"train_loss": -25.155054092407227, "global_step": 235769, "epoch": 2840} {"train_loss": -25.035722732543945, "global_step": 235770, "epoch": 2840} {"train_loss": -24.701202392578125, "global_step": 235771, "epoch": 2840} {"train_loss": -24.620656967163086, "global_step": 235772, "epoch": 2840} {"train_loss": -24.813251495361328, "global_step": 235773, "epoch": 2840} {"train_loss": -24.687116622924805, "global_step": 235774, "epoch": 2840} {"train_loss": -24.869525909423828, "global_step": 235775, "epoch": 2840} {"train_loss": -25.274656295776367, "global_step": 235776, "epoch": 2840} {"train_loss": -24.995868682861328, "global_step": 235777, "epoch": 2840} {"train_loss": -24.920093536376953, "global_step": 235778, "epoch": 2840} {"train_loss": -24.881248474121094, "global_step": 235779, "epoch": 2840} {"train_loss": -25.096363067626953, "global_step": 235780, "epoch": 2840} {"train_loss": -25.221952438354492, "global_step": 235781, "epoch": 2840} {"train_loss": -24.657506942749023, "global_step": 235782, "epoch": 2840} {"train_loss": -24.986968994140625, "global_step": 235783, "epoch": 2840} {"train_loss": -24.959300994873047, "global_step": 235784, "epoch": 2840} {"train_loss": -24.8613224029541, "global_step": 235785, "epoch": 2840} {"train_loss": -24.755966186523438, "global_step": 235786, "epoch": 2840} {"train_loss": -25.10977554321289, "global_step": 235787, "epoch": 2840} {"train_loss": -25.12253189086914, "global_step": 235788, "epoch": 2840} {"train_loss": -25.043970108032227, "global_step": 235789, "epoch": 2840} {"train_loss": -24.919992446899414, "global_step": 235790, "epoch": 2840} {"train_loss": -24.889684677124023, "global_step": 235791, "epoch": 2840} {"train_loss": -25.240196228027344, "global_step": 235792, "epoch": 2840} {"train_loss": -25.03928565979004, "global_step": 235793, "epoch": 2840} {"train_loss": -25.049707412719727, "global_step": 235794, "epoch": 2840} {"train_loss": -24.8472957611084, "global_step": 235795, "epoch": 2840} {"train_loss": -24.88108253479004, "global_step": 235796, "epoch": 2840} {"train_loss": -24.721464157104492, "global_step": 235797, "epoch": 2840} {"train_loss": -24.99704360961914, "global_step": 235798, "epoch": 2840} {"train_loss": -25.072397232055664, "global_step": 235799, "epoch": 2840} {"train_loss": -24.783750534057617, "global_step": 235800, "epoch": 2840} {"train_loss": -25.017629623413086, "global_step": 235801, "epoch": 2840} {"train_loss": -24.687089230640826, "global_step": 235802, "epoch": 2840, "val_loss": 6789541.0} {"train_loss": -23.971637725830078, "global_step": 235803, "epoch": 2841} {"train_loss": -24.245771408081055, "global_step": 235804, "epoch": 2841} {"train_loss": -23.52362632751465, "global_step": 235805, "epoch": 2841} {"train_loss": -23.463808059692383, "global_step": 235806, "epoch": 2841} {"train_loss": -24.105602264404297, "global_step": 235807, "epoch": 2841} {"train_loss": -24.17635154724121, "global_step": 235808, "epoch": 2841} {"train_loss": -24.006877899169922, "global_step": 235809, "epoch": 2841} {"train_loss": -24.263383865356445, "global_step": 235810, "epoch": 2841} {"train_loss": -24.10936737060547, "global_step": 235811, "epoch": 2841} {"train_loss": -24.624614715576172, "global_step": 235812, "epoch": 2841} {"train_loss": -23.61187744140625, "global_step": 235813, "epoch": 2841} {"train_loss": -24.743335723876953, "global_step": 235814, "epoch": 2841} {"train_loss": -24.134366989135742, "global_step": 235815, "epoch": 2841} {"train_loss": -24.170082092285156, "global_step": 235816, "epoch": 2841} {"train_loss": -24.427474975585938, "global_step": 235817, "epoch": 2841} {"train_loss": -24.17945671081543, "global_step": 235818, "epoch": 2841} {"train_loss": -24.7678279876709, "global_step": 235819, "epoch": 2841} {"train_loss": -24.298553466796875, "global_step": 235820, "epoch": 2841} {"train_loss": -24.222522735595703, "global_step": 235821, "epoch": 2841} {"train_loss": -24.46624755859375, "global_step": 235822, "epoch": 2841} {"train_loss": -24.518136978149414, "global_step": 235823, "epoch": 2841} {"train_loss": -24.53153419494629, "global_step": 235824, "epoch": 2841} {"train_loss": -24.820070266723633, "global_step": 235825, "epoch": 2841} {"train_loss": -24.59992790222168, "global_step": 235826, "epoch": 2841} {"train_loss": -24.47844886779785, "global_step": 235827, "epoch": 2841} {"train_loss": -24.53875732421875, "global_step": 235828, "epoch": 2841} {"train_loss": -24.760828018188477, "global_step": 235829, "epoch": 2841} {"train_loss": -24.663251876831055, "global_step": 235830, "epoch": 2841} {"train_loss": -24.51995849609375, "global_step": 235831, "epoch": 2841} {"train_loss": -24.8447265625, "global_step": 235832, "epoch": 2841} {"train_loss": -24.72491455078125, "global_step": 235833, "epoch": 2841} {"train_loss": -24.710153579711914, "global_step": 235834, "epoch": 2841} {"train_loss": -24.86610221862793, "global_step": 235835, "epoch": 2841} {"train_loss": -24.906497955322266, "global_step": 235836, "epoch": 2841} {"train_loss": -24.88294792175293, "global_step": 235837, "epoch": 2841} {"train_loss": -25.023523330688477, "global_step": 235838, "epoch": 2841} {"train_loss": -24.948530197143555, "global_step": 235839, "epoch": 2841} {"train_loss": -25.219104766845703, "global_step": 235840, "epoch": 2841} {"train_loss": -24.693801879882812, "global_step": 235841, "epoch": 2841} {"train_loss": -24.70222282409668, "global_step": 235842, "epoch": 2841} {"train_loss": -24.776792526245117, "global_step": 235843, "epoch": 2841} {"train_loss": -24.913097381591797, "global_step": 235844, "epoch": 2841} {"train_loss": -24.494478225708008, "global_step": 235845, "epoch": 2841} {"train_loss": -24.75200843811035, "global_step": 235846, "epoch": 2841} {"train_loss": -24.795181274414062, "global_step": 235847, "epoch": 2841} {"train_loss": -24.866474151611328, "global_step": 235848, "epoch": 2841} {"train_loss": -24.652952194213867, "global_step": 235849, "epoch": 2841} {"train_loss": -24.767236709594727, "global_step": 235850, "epoch": 2841} {"train_loss": -25.18379020690918, "global_step": 235851, "epoch": 2841} {"train_loss": -24.922517776489258, "global_step": 235852, "epoch": 2841} {"train_loss": -24.722929000854492, "global_step": 235853, "epoch": 2841} {"train_loss": -24.727453231811523, "global_step": 235854, "epoch": 2841} {"train_loss": -24.97022819519043, "global_step": 235855, "epoch": 2841} {"train_loss": -24.990140914916992, "global_step": 235856, "epoch": 2841} {"train_loss": -24.777820587158203, "global_step": 235857, "epoch": 2841} {"train_loss": -25.03507423400879, "global_step": 235858, "epoch": 2841} {"train_loss": -24.66935157775879, "global_step": 235859, "epoch": 2841} {"train_loss": -24.8734130859375, "global_step": 235860, "epoch": 2841} {"train_loss": -24.83254051208496, "global_step": 235861, "epoch": 2841} {"train_loss": -24.942556381225586, "global_step": 235862, "epoch": 2841} {"train_loss": -24.65398406982422, "global_step": 235863, "epoch": 2841} {"train_loss": -24.763675689697266, "global_step": 235864, "epoch": 2841} {"train_loss": -24.712215423583984, "global_step": 235865, "epoch": 2841} {"train_loss": -24.789243698120117, "global_step": 235866, "epoch": 2841} {"train_loss": -24.92058563232422, "global_step": 235867, "epoch": 2841} {"train_loss": -25.024803161621094, "global_step": 235868, "epoch": 2841} {"train_loss": -25.10576820373535, "global_step": 235869, "epoch": 2841} {"train_loss": -24.554597854614258, "global_step": 235870, "epoch": 2841} {"train_loss": -24.395933151245117, "global_step": 235871, "epoch": 2841} {"train_loss": -24.761152267456055, "global_step": 235872, "epoch": 2841} {"train_loss": -24.865327835083008, "global_step": 235873, "epoch": 2841} {"train_loss": -24.785634994506836, "global_step": 235874, "epoch": 2841} {"train_loss": -24.809192657470703, "global_step": 235875, "epoch": 2841} {"train_loss": -24.1862735748291, "global_step": 235876, "epoch": 2841} {"train_loss": -24.916810989379883, "global_step": 235877, "epoch": 2841} {"train_loss": -24.40287208557129, "global_step": 235878, "epoch": 2841} {"train_loss": -25.00557518005371, "global_step": 235879, "epoch": 2841} {"train_loss": -24.623197555541992, "global_step": 235880, "epoch": 2841} {"train_loss": -25.082069396972656, "global_step": 235881, "epoch": 2841} {"train_loss": -24.951032638549805, "global_step": 235882, "epoch": 2841} {"train_loss": -24.523866653442383, "global_step": 235883, "epoch": 2841} {"train_loss": -24.95294761657715, "global_step": 235884, "epoch": 2841} {"train_loss": -24.63558263663786, "global_step": 235885, "epoch": 2841, "val_loss": 6722503.5} {"train_loss": -24.68414306640625, "global_step": 235886, "epoch": 2842} {"train_loss": -24.475296020507812, "global_step": 235887, "epoch": 2842} {"train_loss": -24.825883865356445, "global_step": 235888, "epoch": 2842} {"train_loss": -24.606124877929688, "global_step": 235889, "epoch": 2842} {"train_loss": -24.75804901123047, "global_step": 235890, "epoch": 2842} {"train_loss": -24.999662399291992, "global_step": 235891, "epoch": 2842} {"train_loss": -24.51522445678711, "global_step": 235892, "epoch": 2842} {"train_loss": -24.868682861328125, "global_step": 235893, "epoch": 2842} {"train_loss": -24.93680191040039, "global_step": 235894, "epoch": 2842} {"train_loss": -24.14133071899414, "global_step": 235895, "epoch": 2842} {"train_loss": -24.709318161010742, "global_step": 235896, "epoch": 2842} {"train_loss": -24.674345016479492, "global_step": 235897, "epoch": 2842} {"train_loss": -24.533300399780273, "global_step": 235898, "epoch": 2842} {"train_loss": -24.6777400970459, "global_step": 235899, "epoch": 2842} {"train_loss": -24.948307037353516, "global_step": 235900, "epoch": 2842} {"train_loss": -24.91788673400879, "global_step": 235901, "epoch": 2842} {"train_loss": -24.897459030151367, "global_step": 235902, "epoch": 2842} {"train_loss": -24.673221588134766, "global_step": 235903, "epoch": 2842} {"train_loss": -24.8159236907959, "global_step": 235904, "epoch": 2842} {"train_loss": -24.817930221557617, "global_step": 235905, "epoch": 2842} {"train_loss": -25.036863327026367, "global_step": 235906, "epoch": 2842} {"train_loss": -24.331758499145508, "global_step": 235907, "epoch": 2842} {"train_loss": -25.07980728149414, "global_step": 235908, "epoch": 2842} {"train_loss": -24.446653366088867, "global_step": 235909, "epoch": 2842} {"train_loss": -24.623779296875, "global_step": 235910, "epoch": 2842} {"train_loss": -24.80869483947754, "global_step": 235911, "epoch": 2842} {"train_loss": -24.553056716918945, "global_step": 235912, "epoch": 2842} {"train_loss": -24.69028091430664, "global_step": 235913, "epoch": 2842} {"train_loss": -24.393644332885742, "global_step": 235914, "epoch": 2842} {"train_loss": -24.6003475189209, "global_step": 235915, "epoch": 2842} {"train_loss": -24.666309356689453, "global_step": 235916, "epoch": 2842} {"train_loss": -24.521087646484375, "global_step": 235917, "epoch": 2842} {"train_loss": -24.86065101623535, "global_step": 235918, "epoch": 2842} {"train_loss": -24.799968719482422, "global_step": 235919, "epoch": 2842} {"train_loss": -24.301748275756836, "global_step": 235920, "epoch": 2842} {"train_loss": -24.962413787841797, "global_step": 235921, "epoch": 2842} {"train_loss": -24.8057861328125, "global_step": 235922, "epoch": 2842} {"train_loss": -24.34917640686035, "global_step": 235923, "epoch": 2842} {"train_loss": -24.986007690429688, "global_step": 235924, "epoch": 2842} {"train_loss": -24.730026245117188, "global_step": 235925, "epoch": 2842} {"train_loss": -25.0877742767334, "global_step": 235926, "epoch": 2842} {"train_loss": -24.655637741088867, "global_step": 235927, "epoch": 2842} {"train_loss": -24.6998291015625, "global_step": 235928, "epoch": 2842} {"train_loss": -24.91633415222168, "global_step": 235929, "epoch": 2842} {"train_loss": -24.795392990112305, "global_step": 235930, "epoch": 2842} {"train_loss": -24.733448028564453, "global_step": 235931, "epoch": 2842} {"train_loss": -24.769718170166016, "global_step": 235932, "epoch": 2842} {"train_loss": -24.82950782775879, "global_step": 235933, "epoch": 2842} {"train_loss": -25.076404571533203, "global_step": 235934, "epoch": 2842} {"train_loss": -24.818073272705078, "global_step": 235935, "epoch": 2842} {"train_loss": -25.331602096557617, "global_step": 235936, "epoch": 2842} {"train_loss": -24.69166374206543, "global_step": 235937, "epoch": 2842} {"train_loss": -24.67422866821289, "global_step": 235938, "epoch": 2842} {"train_loss": -24.904329299926758, "global_step": 235939, "epoch": 2842} {"train_loss": -24.900222778320312, "global_step": 235940, "epoch": 2842} {"train_loss": -25.215524673461914, "global_step": 235941, "epoch": 2842} {"train_loss": -24.745389938354492, "global_step": 235942, "epoch": 2842} {"train_loss": -24.545690536499023, "global_step": 235943, "epoch": 2842} {"train_loss": -24.796369552612305, "global_step": 235944, "epoch": 2842} {"train_loss": -24.942882537841797, "global_step": 235945, "epoch": 2842} {"train_loss": -24.776222229003906, "global_step": 235946, "epoch": 2842} {"train_loss": -24.842849731445312, "global_step": 235947, "epoch": 2842} {"train_loss": -25.019489288330078, "global_step": 235948, "epoch": 2842} {"train_loss": -24.560537338256836, "global_step": 235949, "epoch": 2842} {"train_loss": -25.10120964050293, "global_step": 235950, "epoch": 2842} {"train_loss": -24.903390884399414, "global_step": 235951, "epoch": 2842} {"train_loss": -25.032358169555664, "global_step": 235952, "epoch": 2842} {"train_loss": -25.026708602905273, "global_step": 235953, "epoch": 2842} {"train_loss": -24.60041618347168, "global_step": 235954, "epoch": 2842} {"train_loss": -25.151731491088867, "global_step": 235955, "epoch": 2842} {"train_loss": -24.85215187072754, "global_step": 235956, "epoch": 2842} {"train_loss": -24.7828311920166, "global_step": 235957, "epoch": 2842} {"train_loss": -24.594724655151367, "global_step": 235958, "epoch": 2842} {"train_loss": -25.16046142578125, "global_step": 235959, "epoch": 2842} {"train_loss": -24.734819412231445, "global_step": 235960, "epoch": 2842} {"train_loss": -24.68707847595215, "global_step": 235961, "epoch": 2842} {"train_loss": -24.914081573486328, "global_step": 235962, "epoch": 2842} {"train_loss": -25.05829429626465, "global_step": 235963, "epoch": 2842} {"train_loss": -24.88567543029785, "global_step": 235964, "epoch": 2842} {"train_loss": -24.830642700195312, "global_step": 235965, "epoch": 2842} {"train_loss": -24.751012802124023, "global_step": 235966, "epoch": 2842} {"train_loss": -24.924951553344727, "global_step": 235967, "epoch": 2842} {"train_loss": -24.7822735568127, "global_step": 235968, "epoch": 2842, "val_loss": 6752243.0} {"train_loss": -24.190189361572266, "global_step": 235969, "epoch": 2843} {"train_loss": -24.341018676757812, "global_step": 235970, "epoch": 2843} {"train_loss": -24.381912231445312, "global_step": 235971, "epoch": 2843} {"train_loss": -23.97410011291504, "global_step": 235972, "epoch": 2843} {"train_loss": -24.685731887817383, "global_step": 235973, "epoch": 2843} {"train_loss": -24.426666259765625, "global_step": 235974, "epoch": 2843} {"train_loss": -24.5003662109375, "global_step": 235975, "epoch": 2843} {"train_loss": -24.466632843017578, "global_step": 235976, "epoch": 2843} {"train_loss": -24.847970962524414, "global_step": 235977, "epoch": 2843} {"train_loss": -24.683130264282227, "global_step": 235978, "epoch": 2843} {"train_loss": -24.77471923828125, "global_step": 235979, "epoch": 2843} {"train_loss": -25.007678985595703, "global_step": 235980, "epoch": 2843} {"train_loss": -24.59775733947754, "global_step": 235981, "epoch": 2843} {"train_loss": -24.706876754760742, "global_step": 235982, "epoch": 2843} {"train_loss": -24.775365829467773, "global_step": 235983, "epoch": 2843} {"train_loss": -25.170013427734375, "global_step": 235984, "epoch": 2843} {"train_loss": -24.2551326751709, "global_step": 235985, "epoch": 2843} {"train_loss": -24.76511573791504, "global_step": 235986, "epoch": 2843} {"train_loss": -24.702899932861328, "global_step": 235987, "epoch": 2843} {"train_loss": -24.736183166503906, "global_step": 235988, "epoch": 2843} {"train_loss": -24.749311447143555, "global_step": 235989, "epoch": 2843} {"train_loss": -24.4532527923584, "global_step": 235990, "epoch": 2843} {"train_loss": -24.99059295654297, "global_step": 235991, "epoch": 2843} {"train_loss": -24.906280517578125, "global_step": 235992, "epoch": 2843} {"train_loss": -24.94422721862793, "global_step": 235993, "epoch": 2843} {"train_loss": -25.088468551635742, "global_step": 235994, "epoch": 2843} {"train_loss": -25.14223289489746, "global_step": 235995, "epoch": 2843} {"train_loss": -25.049293518066406, "global_step": 235996, "epoch": 2843} {"train_loss": -24.83028221130371, "global_step": 235997, "epoch": 2843} {"train_loss": -24.94295883178711, "global_step": 235998, "epoch": 2843} {"train_loss": -25.209653854370117, "global_step": 235999, "epoch": 2843} {"train_loss": -24.89454460144043, "global_step": 236000, "epoch": 2843} {"train_loss": -25.089466094970703, "global_step": 236001, "epoch": 2843} {"train_loss": -24.810598373413086, "global_step": 236002, "epoch": 2843} {"train_loss": -25.261215209960938, "global_step": 236003, "epoch": 2843} {"train_loss": -24.885345458984375, "global_step": 236004, "epoch": 2843} {"train_loss": -25.064407348632812, "global_step": 236005, "epoch": 2843} {"train_loss": -24.899341583251953, "global_step": 236006, "epoch": 2843} {"train_loss": -24.890657424926758, "global_step": 236007, "epoch": 2843} {"train_loss": -24.678123474121094, "global_step": 236008, "epoch": 2843} {"train_loss": -24.63739585876465, "global_step": 236009, "epoch": 2843} {"train_loss": -24.578577041625977, "global_step": 236010, "epoch": 2843} {"train_loss": -24.31697654724121, "global_step": 236011, "epoch": 2843} {"train_loss": -24.266935348510742, "global_step": 236012, "epoch": 2843} {"train_loss": -24.83381462097168, "global_step": 236013, "epoch": 2843} {"train_loss": -24.55985450744629, "global_step": 236014, "epoch": 2843} {"train_loss": -24.371522903442383, "global_step": 236015, "epoch": 2843} {"train_loss": -24.498144149780273, "global_step": 236016, "epoch": 2843} {"train_loss": -24.897136688232422, "global_step": 236017, "epoch": 2843} {"train_loss": -24.531524658203125, "global_step": 236018, "epoch": 2843} {"train_loss": -24.709768295288086, "global_step": 236019, "epoch": 2843} {"train_loss": -24.321706771850586, "global_step": 236020, "epoch": 2843} {"train_loss": -24.77589225769043, "global_step": 236021, "epoch": 2843} {"train_loss": -24.566999435424805, "global_step": 236022, "epoch": 2843} {"train_loss": -24.740217208862305, "global_step": 236023, "epoch": 2843} {"train_loss": -24.570768356323242, "global_step": 236024, "epoch": 2843} {"train_loss": -24.689592361450195, "global_step": 236025, "epoch": 2843} {"train_loss": -24.66754722595215, "global_step": 236026, "epoch": 2843} {"train_loss": -24.915584564208984, "global_step": 236027, "epoch": 2843} {"train_loss": -24.979887008666992, "global_step": 236028, "epoch": 2843} {"train_loss": -24.565256118774414, "global_step": 236029, "epoch": 2843} {"train_loss": -25.04584312438965, "global_step": 236030, "epoch": 2843} {"train_loss": -24.839136123657227, "global_step": 236031, "epoch": 2843} {"train_loss": -25.050825119018555, "global_step": 236032, "epoch": 2843} {"train_loss": -24.76786231994629, "global_step": 236033, "epoch": 2843} {"train_loss": -24.75079345703125, "global_step": 236034, "epoch": 2843} {"train_loss": -25.01152992248535, "global_step": 236035, "epoch": 2843} {"train_loss": -24.78530502319336, "global_step": 236036, "epoch": 2843} {"train_loss": -24.879636764526367, "global_step": 236037, "epoch": 2843} {"train_loss": -24.790937423706055, "global_step": 236038, "epoch": 2843} {"train_loss": -24.555622100830078, "global_step": 236039, "epoch": 2843} {"train_loss": -24.923521041870117, "global_step": 236040, "epoch": 2843} {"train_loss": -24.867643356323242, "global_step": 236041, "epoch": 2843} {"train_loss": -24.72211265563965, "global_step": 236042, "epoch": 2843} {"train_loss": -24.584583282470703, "global_step": 236043, "epoch": 2843} {"train_loss": -24.806901931762695, "global_step": 236044, "epoch": 2843} {"train_loss": -24.629480361938477, "global_step": 236045, "epoch": 2843} {"train_loss": -24.6278018951416, "global_step": 236046, "epoch": 2843} {"train_loss": -24.968103408813477, "global_step": 236047, "epoch": 2843} {"train_loss": -24.914169311523438, "global_step": 236048, "epoch": 2843} {"train_loss": -24.707082748413086, "global_step": 236049, "epoch": 2843} {"train_loss": -24.589025497436523, "global_step": 236050, "epoch": 2843} {"train_loss": -24.729284171598504, "global_step": 236051, "epoch": 2843, "val_loss": 6732963.0} {"train_loss": -21.537134170532227, "global_step": 236052, "epoch": 2844} {"train_loss": -24.149066925048828, "global_step": 236053, "epoch": 2844} {"train_loss": -23.336109161376953, "global_step": 236054, "epoch": 2844} {"train_loss": -23.79323387145996, "global_step": 236055, "epoch": 2844} {"train_loss": -22.882938385009766, "global_step": 236056, "epoch": 2844} {"train_loss": -24.042495727539062, "global_step": 236057, "epoch": 2844} {"train_loss": -23.821123123168945, "global_step": 236058, "epoch": 2844} {"train_loss": -24.179929733276367, "global_step": 236059, "epoch": 2844} {"train_loss": -24.121862411499023, "global_step": 236060, "epoch": 2844} {"train_loss": -23.761335372924805, "global_step": 236061, "epoch": 2844} {"train_loss": -23.649967193603516, "global_step": 236062, "epoch": 2844} {"train_loss": -23.732868194580078, "global_step": 236063, "epoch": 2844} {"train_loss": -24.231382369995117, "global_step": 236064, "epoch": 2844} {"train_loss": -24.162290573120117, "global_step": 236065, "epoch": 2844} {"train_loss": -24.3043212890625, "global_step": 236066, "epoch": 2844} {"train_loss": -24.187570571899414, "global_step": 236067, "epoch": 2844} {"train_loss": -24.118499755859375, "global_step": 236068, "epoch": 2844} {"train_loss": -24.089380264282227, "global_step": 236069, "epoch": 2844} {"train_loss": -24.54244041442871, "global_step": 236070, "epoch": 2844} {"train_loss": -24.431224822998047, "global_step": 236071, "epoch": 2844} {"train_loss": -24.91986846923828, "global_step": 236072, "epoch": 2844} {"train_loss": -24.25226402282715, "global_step": 236073, "epoch": 2844} {"train_loss": -24.285573959350586, "global_step": 236074, "epoch": 2844} {"train_loss": -24.51129722595215, "global_step": 236075, "epoch": 2844} {"train_loss": -24.51776885986328, "global_step": 236076, "epoch": 2844} {"train_loss": -24.42255210876465, "global_step": 236077, "epoch": 2844} {"train_loss": -24.468128204345703, "global_step": 236078, "epoch": 2844} {"train_loss": -24.679452896118164, "global_step": 236079, "epoch": 2844} {"train_loss": -24.69117546081543, "global_step": 236080, "epoch": 2844} {"train_loss": -24.516401290893555, "global_step": 236081, "epoch": 2844} {"train_loss": -24.654815673828125, "global_step": 236082, "epoch": 2844} {"train_loss": -24.73049545288086, "global_step": 236083, "epoch": 2844} {"train_loss": -24.748624801635742, "global_step": 236084, "epoch": 2844} {"train_loss": -24.827102661132812, "global_step": 236085, "epoch": 2844} {"train_loss": -24.643722534179688, "global_step": 236086, "epoch": 2844} {"train_loss": -24.87530517578125, "global_step": 236087, "epoch": 2844} {"train_loss": -25.093740463256836, "global_step": 236088, "epoch": 2844} {"train_loss": -24.838224411010742, "global_step": 236089, "epoch": 2844} {"train_loss": -24.8652400970459, "global_step": 236090, "epoch": 2844} {"train_loss": -24.52310562133789, "global_step": 236091, "epoch": 2844} {"train_loss": -24.573486328125, "global_step": 236092, "epoch": 2844} {"train_loss": -24.58542251586914, "global_step": 236093, "epoch": 2844} {"train_loss": -24.941686630249023, "global_step": 236094, "epoch": 2844} {"train_loss": -24.880197525024414, "global_step": 236095, "epoch": 2844} {"train_loss": -25.251157760620117, "global_step": 236096, "epoch": 2844} {"train_loss": -24.756540298461914, "global_step": 236097, "epoch": 2844} {"train_loss": -24.834115982055664, "global_step": 236098, "epoch": 2844} {"train_loss": -24.967113494873047, "global_step": 236099, "epoch": 2844} {"train_loss": -24.877052307128906, "global_step": 236100, "epoch": 2844} {"train_loss": -24.77687644958496, "global_step": 236101, "epoch": 2844} {"train_loss": -24.781702041625977, "global_step": 236102, "epoch": 2844} {"train_loss": -24.472084045410156, "global_step": 236103, "epoch": 2844} {"train_loss": -24.87049674987793, "global_step": 236104, "epoch": 2844} {"train_loss": -24.65410804748535, "global_step": 236105, "epoch": 2844} {"train_loss": -24.7460994720459, "global_step": 236106, "epoch": 2844} {"train_loss": -24.850217819213867, "global_step": 236107, "epoch": 2844} {"train_loss": -24.962446212768555, "global_step": 236108, "epoch": 2844} {"train_loss": -24.843210220336914, "global_step": 236109, "epoch": 2844} {"train_loss": -24.57367515563965, "global_step": 236110, "epoch": 2844} {"train_loss": -24.8431453704834, "global_step": 236111, "epoch": 2844} {"train_loss": -24.984167098999023, "global_step": 236112, "epoch": 2844} {"train_loss": -24.828664779663086, "global_step": 236113, "epoch": 2844} {"train_loss": -24.875741958618164, "global_step": 236114, "epoch": 2844} {"train_loss": -25.071521759033203, "global_step": 236115, "epoch": 2844} {"train_loss": -25.125959396362305, "global_step": 236116, "epoch": 2844} {"train_loss": -24.946203231811523, "global_step": 236117, "epoch": 2844} {"train_loss": -24.94535255432129, "global_step": 236118, "epoch": 2844} {"train_loss": -24.726797103881836, "global_step": 236119, "epoch": 2844} {"train_loss": -25.165971755981445, "global_step": 236120, "epoch": 2844} {"train_loss": -24.790822982788086, "global_step": 236121, "epoch": 2844} {"train_loss": -24.739328384399414, "global_step": 236122, "epoch": 2844} {"train_loss": -24.8461856842041, "global_step": 236123, "epoch": 2844} {"train_loss": -24.68494987487793, "global_step": 236124, "epoch": 2844} {"train_loss": -24.751907348632812, "global_step": 236125, "epoch": 2844} {"train_loss": -24.782949447631836, "global_step": 236126, "epoch": 2844} {"train_loss": -24.98298454284668, "global_step": 236127, "epoch": 2844} {"train_loss": -24.53740882873535, "global_step": 236128, "epoch": 2844} {"train_loss": -24.34946060180664, "global_step": 236129, "epoch": 2844} {"train_loss": -24.09889030456543, "global_step": 236130, "epoch": 2844} {"train_loss": -24.459510803222656, "global_step": 236131, "epoch": 2844} {"train_loss": -24.541616439819336, "global_step": 236132, "epoch": 2844} {"train_loss": -24.461061477661133, "global_step": 236133, "epoch": 2844} {"train_loss": -24.537981607827795, "global_step": 236134, "epoch": 2844, "val_loss": 6777310.5} {"train_loss": -23.970659255981445, "global_step": 236135, "epoch": 2845} {"train_loss": -24.074186325073242, "global_step": 236136, "epoch": 2845} {"train_loss": -24.296289443969727, "global_step": 236137, "epoch": 2845} {"train_loss": -24.096744537353516, "global_step": 236138, "epoch": 2845} {"train_loss": -24.144100189208984, "global_step": 236139, "epoch": 2845} {"train_loss": -24.61998176574707, "global_step": 236140, "epoch": 2845} {"train_loss": -24.58782958984375, "global_step": 236141, "epoch": 2845} {"train_loss": -24.153003692626953, "global_step": 236142, "epoch": 2845} {"train_loss": -24.293413162231445, "global_step": 236143, "epoch": 2845} {"train_loss": -24.165090560913086, "global_step": 236144, "epoch": 2845} {"train_loss": -24.43338394165039, "global_step": 236145, "epoch": 2845} {"train_loss": -24.2011661529541, "global_step": 236146, "epoch": 2845} {"train_loss": -24.204742431640625, "global_step": 236147, "epoch": 2845} {"train_loss": -24.495737075805664, "global_step": 236148, "epoch": 2845} {"train_loss": -24.58547019958496, "global_step": 236149, "epoch": 2845} {"train_loss": -24.258554458618164, "global_step": 236150, "epoch": 2845} {"train_loss": -24.614004135131836, "global_step": 236151, "epoch": 2845} {"train_loss": -24.628461837768555, "global_step": 236152, "epoch": 2845} {"train_loss": -24.78676414489746, "global_step": 236153, "epoch": 2845} {"train_loss": -24.92203140258789, "global_step": 236154, "epoch": 2845} {"train_loss": -24.488515853881836, "global_step": 236155, "epoch": 2845} {"train_loss": -24.75920295715332, "global_step": 236156, "epoch": 2845} {"train_loss": -24.67286491394043, "global_step": 236157, "epoch": 2845} {"train_loss": -24.56557273864746, "global_step": 236158, "epoch": 2845} {"train_loss": -24.69839096069336, "global_step": 236159, "epoch": 2845} {"train_loss": -24.911401748657227, "global_step": 236160, "epoch": 2845} {"train_loss": -24.867216110229492, "global_step": 236161, "epoch": 2845} {"train_loss": -24.809621810913086, "global_step": 236162, "epoch": 2845} {"train_loss": -24.33967399597168, "global_step": 236163, "epoch": 2845} {"train_loss": -24.739973068237305, "global_step": 236164, "epoch": 2845} {"train_loss": -25.016340255737305, "global_step": 236165, "epoch": 2845} {"train_loss": -24.80489158630371, "global_step": 236166, "epoch": 2845} {"train_loss": -24.875446319580078, "global_step": 236167, "epoch": 2845} {"train_loss": -24.99850845336914, "global_step": 236168, "epoch": 2845} {"train_loss": -24.582040786743164, "global_step": 236169, "epoch": 2845} {"train_loss": -24.717756271362305, "global_step": 236170, "epoch": 2845} {"train_loss": -25.182315826416016, "global_step": 236171, "epoch": 2845} {"train_loss": -24.592599868774414, "global_step": 236172, "epoch": 2845} {"train_loss": -24.627887725830078, "global_step": 236173, "epoch": 2845} {"train_loss": -24.926130294799805, "global_step": 236174, "epoch": 2845} {"train_loss": -24.86688804626465, "global_step": 236175, "epoch": 2845} {"train_loss": -24.689172744750977, "global_step": 236176, "epoch": 2845} {"train_loss": -24.786396026611328, "global_step": 236177, "epoch": 2845} {"train_loss": -24.664281845092773, "global_step": 236178, "epoch": 2845} {"train_loss": -24.692747116088867, "global_step": 236179, "epoch": 2845} {"train_loss": -25.076017379760742, "global_step": 236180, "epoch": 2845} {"train_loss": -24.9019832611084, "global_step": 236181, "epoch": 2845} {"train_loss": -25.181350708007812, "global_step": 236182, "epoch": 2845} {"train_loss": -24.794723510742188, "global_step": 236183, "epoch": 2845} {"train_loss": -25.0964298248291, "global_step": 236184, "epoch": 2845} {"train_loss": -24.907257080078125, "global_step": 236185, "epoch": 2845} {"train_loss": -24.82627296447754, "global_step": 236186, "epoch": 2845} {"train_loss": -24.742361068725586, "global_step": 236187, "epoch": 2845} {"train_loss": -24.92724609375, "global_step": 236188, "epoch": 2845} {"train_loss": -24.736976623535156, "global_step": 236189, "epoch": 2845} {"train_loss": -24.90874671936035, "global_step": 236190, "epoch": 2845} {"train_loss": -24.91752052307129, "global_step": 236191, "epoch": 2845} {"train_loss": -24.822837829589844, "global_step": 236192, "epoch": 2845} {"train_loss": -24.8879451751709, "global_step": 236193, "epoch": 2845} {"train_loss": -24.884084701538086, "global_step": 236194, "epoch": 2845} {"train_loss": -25.1546630859375, "global_step": 236195, "epoch": 2845} {"train_loss": -24.746307373046875, "global_step": 236196, "epoch": 2845} {"train_loss": -25.035703659057617, "global_step": 236197, "epoch": 2845} {"train_loss": -24.833559036254883, "global_step": 236198, "epoch": 2845} {"train_loss": -24.8563232421875, "global_step": 236199, "epoch": 2845} {"train_loss": -24.862314224243164, "global_step": 236200, "epoch": 2845} {"train_loss": -24.794157028198242, "global_step": 236201, "epoch": 2845} {"train_loss": -25.049631118774414, "global_step": 236202, "epoch": 2845} {"train_loss": -25.22548484802246, "global_step": 236203, "epoch": 2845} {"train_loss": -24.895986557006836, "global_step": 236204, "epoch": 2845} {"train_loss": -25.246488571166992, "global_step": 236205, "epoch": 2845} {"train_loss": -24.810544967651367, "global_step": 236206, "epoch": 2845} {"train_loss": -24.7876033782959, "global_step": 236207, "epoch": 2845} {"train_loss": -24.806745529174805, "global_step": 236208, "epoch": 2845} {"train_loss": -25.02438735961914, "global_step": 236209, "epoch": 2845} {"train_loss": -24.840370178222656, "global_step": 236210, "epoch": 2845} {"train_loss": -25.011524200439453, "global_step": 236211, "epoch": 2845} {"train_loss": -24.681753158569336, "global_step": 236212, "epoch": 2845} {"train_loss": -24.819995880126953, "global_step": 236213, "epoch": 2845} {"train_loss": -24.9135799407959, "global_step": 236214, "epoch": 2845} {"train_loss": -24.809568405151367, "global_step": 236215, "epoch": 2845} {"train_loss": -24.533361434936523, "global_step": 236216, "epoch": 2845} {"train_loss": -24.715569484664734, "global_step": 236217, "epoch": 2845, "val_loss": 6699243.0} {"train_loss": -24.672975540161133, "global_step": 236218, "epoch": 2846} {"train_loss": -24.052001953125, "global_step": 236219, "epoch": 2846} {"train_loss": -24.437509536743164, "global_step": 236220, "epoch": 2846} {"train_loss": -24.261587142944336, "global_step": 236221, "epoch": 2846} {"train_loss": -24.528066635131836, "global_step": 236222, "epoch": 2846} {"train_loss": -24.774349212646484, "global_step": 236223, "epoch": 2846} {"train_loss": -24.226669311523438, "global_step": 236224, "epoch": 2846} {"train_loss": -24.07288932800293, "global_step": 236225, "epoch": 2846} {"train_loss": -24.384931564331055, "global_step": 236226, "epoch": 2846} {"train_loss": -24.543447494506836, "global_step": 236227, "epoch": 2846} {"train_loss": -24.454519271850586, "global_step": 236228, "epoch": 2846} {"train_loss": -24.74500846862793, "global_step": 236229, "epoch": 2846} {"train_loss": -24.789159774780273, "global_step": 236230, "epoch": 2846} {"train_loss": -24.405166625976562, "global_step": 236231, "epoch": 2846} {"train_loss": -24.739898681640625, "global_step": 236232, "epoch": 2846} {"train_loss": -24.707563400268555, "global_step": 236233, "epoch": 2846} {"train_loss": -24.580419540405273, "global_step": 236234, "epoch": 2846} {"train_loss": -24.702451705932617, "global_step": 236235, "epoch": 2846} {"train_loss": -24.859722137451172, "global_step": 236236, "epoch": 2846} {"train_loss": -24.73523712158203, "global_step": 236237, "epoch": 2846} {"train_loss": -24.585718154907227, "global_step": 236238, "epoch": 2846} {"train_loss": -24.490028381347656, "global_step": 236239, "epoch": 2846} {"train_loss": -24.92909812927246, "global_step": 236240, "epoch": 2846} {"train_loss": -24.19768714904785, "global_step": 236241, "epoch": 2846} {"train_loss": -24.71487045288086, "global_step": 236242, "epoch": 2846} {"train_loss": -24.88458824157715, "global_step": 236243, "epoch": 2846} {"train_loss": -24.623830795288086, "global_step": 236244, "epoch": 2846} {"train_loss": -24.880802154541016, "global_step": 236245, "epoch": 2846} {"train_loss": -24.76968765258789, "global_step": 236246, "epoch": 2846} {"train_loss": -24.564279556274414, "global_step": 236247, "epoch": 2846} {"train_loss": -24.792068481445312, "global_step": 236248, "epoch": 2846} {"train_loss": -24.3735408782959, "global_step": 236249, "epoch": 2846} {"train_loss": -25.118160247802734, "global_step": 236250, "epoch": 2846} {"train_loss": -24.887222290039062, "global_step": 236251, "epoch": 2846} {"train_loss": -24.970258712768555, "global_step": 236252, "epoch": 2846} {"train_loss": -24.377288818359375, "global_step": 236253, "epoch": 2846} {"train_loss": -24.219404220581055, "global_step": 236254, "epoch": 2846} {"train_loss": -24.856637954711914, "global_step": 236255, "epoch": 2846} {"train_loss": -24.689516067504883, "global_step": 236256, "epoch": 2846} {"train_loss": -24.8544979095459, "global_step": 236257, "epoch": 2846} {"train_loss": -24.492897033691406, "global_step": 236258, "epoch": 2846} {"train_loss": -23.994556427001953, "global_step": 236259, "epoch": 2846} {"train_loss": -24.88335609436035, "global_step": 236260, "epoch": 2846} {"train_loss": -24.930557250976562, "global_step": 236261, "epoch": 2846} {"train_loss": -24.85712242126465, "global_step": 236262, "epoch": 2846} {"train_loss": -24.822898864746094, "global_step": 236263, "epoch": 2846} {"train_loss": -24.723045349121094, "global_step": 236264, "epoch": 2846} {"train_loss": -25.06968116760254, "global_step": 236265, "epoch": 2846} {"train_loss": -25.159391403198242, "global_step": 236266, "epoch": 2846} {"train_loss": -24.85713005065918, "global_step": 236267, "epoch": 2846} {"train_loss": -24.92140769958496, "global_step": 236268, "epoch": 2846} {"train_loss": -24.795242309570312, "global_step": 236269, "epoch": 2846} {"train_loss": -24.592302322387695, "global_step": 236270, "epoch": 2846} {"train_loss": -24.569217681884766, "global_step": 236271, "epoch": 2846} {"train_loss": -24.836698532104492, "global_step": 236272, "epoch": 2846} {"train_loss": -24.91675567626953, "global_step": 236273, "epoch": 2846} {"train_loss": -24.931550979614258, "global_step": 236274, "epoch": 2846} {"train_loss": -24.999284744262695, "global_step": 236275, "epoch": 2846} {"train_loss": -24.70722770690918, "global_step": 236276, "epoch": 2846} {"train_loss": -24.830270767211914, "global_step": 236277, "epoch": 2846} {"train_loss": -24.71565055847168, "global_step": 236278, "epoch": 2846} {"train_loss": -25.022897720336914, "global_step": 236279, "epoch": 2846} {"train_loss": -25.084571838378906, "global_step": 236280, "epoch": 2846} {"train_loss": -25.140111923217773, "global_step": 236281, "epoch": 2846} {"train_loss": -24.794189453125, "global_step": 236282, "epoch": 2846} {"train_loss": -24.918853759765625, "global_step": 236283, "epoch": 2846} {"train_loss": -24.970014572143555, "global_step": 236284, "epoch": 2846} {"train_loss": -24.73415184020996, "global_step": 236285, "epoch": 2846} {"train_loss": -24.870759963989258, "global_step": 236286, "epoch": 2846} {"train_loss": -25.00181007385254, "global_step": 236287, "epoch": 2846} {"train_loss": -24.841907501220703, "global_step": 236288, "epoch": 2846} {"train_loss": -24.26712989807129, "global_step": 236289, "epoch": 2846} {"train_loss": -24.56317138671875, "global_step": 236290, "epoch": 2846} {"train_loss": -24.645164489746094, "global_step": 236291, "epoch": 2846} {"train_loss": -24.642684936523438, "global_step": 236292, "epoch": 2846} {"train_loss": -24.373395919799805, "global_step": 236293, "epoch": 2846} {"train_loss": -24.789627075195312, "global_step": 236294, "epoch": 2846} {"train_loss": -24.331560134887695, "global_step": 236295, "epoch": 2846} {"train_loss": -24.70700454711914, "global_step": 236296, "epoch": 2846} {"train_loss": -24.519580841064453, "global_step": 236297, "epoch": 2846} {"train_loss": -24.89704704284668, "global_step": 236298, "epoch": 2846} {"train_loss": -24.83725357055664, "global_step": 236299, "epoch": 2846} {"train_loss": -24.705448771097576, "global_step": 236300, "epoch": 2846, "val_loss": 6893976.0} {"train_loss": -24.16497039794922, "global_step": 236301, "epoch": 2847} {"train_loss": -24.292875289916992, "global_step": 236302, "epoch": 2847} {"train_loss": -24.679737091064453, "global_step": 236303, "epoch": 2847} {"train_loss": -24.572904586791992, "global_step": 236304, "epoch": 2847} {"train_loss": -24.312088012695312, "global_step": 236305, "epoch": 2847} {"train_loss": -24.94220542907715, "global_step": 236306, "epoch": 2847} {"train_loss": -24.633146286010742, "global_step": 236307, "epoch": 2847} {"train_loss": -24.62782096862793, "global_step": 236308, "epoch": 2847} {"train_loss": -24.94000244140625, "global_step": 236309, "epoch": 2847} {"train_loss": -24.741575241088867, "global_step": 236310, "epoch": 2847} {"train_loss": -24.3286075592041, "global_step": 236311, "epoch": 2847} {"train_loss": -24.732980728149414, "global_step": 236312, "epoch": 2847} {"train_loss": -25.037214279174805, "global_step": 236313, "epoch": 2847} {"train_loss": -24.78778839111328, "global_step": 236314, "epoch": 2847} {"train_loss": -25.017541885375977, "global_step": 236315, "epoch": 2847} {"train_loss": -25.104175567626953, "global_step": 236316, "epoch": 2847} {"train_loss": -25.049991607666016, "global_step": 236317, "epoch": 2847} {"train_loss": -24.926401138305664, "global_step": 236318, "epoch": 2847} {"train_loss": -25.15541648864746, "global_step": 236319, "epoch": 2847} {"train_loss": -24.68124771118164, "global_step": 236320, "epoch": 2847} {"train_loss": -24.50239372253418, "global_step": 236321, "epoch": 2847} {"train_loss": -24.76835060119629, "global_step": 236322, "epoch": 2847} {"train_loss": -24.675153732299805, "global_step": 236323, "epoch": 2847} {"train_loss": -24.75227165222168, "global_step": 236324, "epoch": 2847} {"train_loss": -25.07343101501465, "global_step": 236325, "epoch": 2847} {"train_loss": -24.37911605834961, "global_step": 236326, "epoch": 2847} {"train_loss": -24.619638442993164, "global_step": 236327, "epoch": 2847} {"train_loss": -24.645172119140625, "global_step": 236328, "epoch": 2847} {"train_loss": -24.804967880249023, "global_step": 236329, "epoch": 2847} {"train_loss": -24.746051788330078, "global_step": 236330, "epoch": 2847} {"train_loss": -24.62590217590332, "global_step": 236331, "epoch": 2847} {"train_loss": -24.714277267456055, "global_step": 236332, "epoch": 2847} {"train_loss": -24.69603157043457, "global_step": 236333, "epoch": 2847} {"train_loss": -24.973974227905273, "global_step": 236334, "epoch": 2847} {"train_loss": -24.902769088745117, "global_step": 236335, "epoch": 2847} {"train_loss": -24.761138916015625, "global_step": 236336, "epoch": 2847} {"train_loss": -24.999874114990234, "global_step": 236337, "epoch": 2847} {"train_loss": -25.012863159179688, "global_step": 236338, "epoch": 2847} {"train_loss": -24.736722946166992, "global_step": 236339, "epoch": 2847} {"train_loss": -24.587430953979492, "global_step": 236340, "epoch": 2847} {"train_loss": -24.598608016967773, "global_step": 236341, "epoch": 2847} {"train_loss": -25.047977447509766, "global_step": 236342, "epoch": 2847} {"train_loss": -25.031558990478516, "global_step": 236343, "epoch": 2847} {"train_loss": -25.142683029174805, "global_step": 236344, "epoch": 2847} {"train_loss": -24.60047721862793, "global_step": 236345, "epoch": 2847} {"train_loss": -24.604597091674805, "global_step": 236346, "epoch": 2847} {"train_loss": -24.51624298095703, "global_step": 236347, "epoch": 2847} {"train_loss": -24.36463165283203, "global_step": 236348, "epoch": 2847} {"train_loss": -24.63685417175293, "global_step": 236349, "epoch": 2847} {"train_loss": -24.803693771362305, "global_step": 236350, "epoch": 2847} {"train_loss": -24.512962341308594, "global_step": 236351, "epoch": 2847} {"train_loss": -24.46174430847168, "global_step": 236352, "epoch": 2847} {"train_loss": -24.692747116088867, "global_step": 236353, "epoch": 2847} {"train_loss": -24.906814575195312, "global_step": 236354, "epoch": 2847} {"train_loss": -24.56768798828125, "global_step": 236355, "epoch": 2847} {"train_loss": -25.20713233947754, "global_step": 236356, "epoch": 2847} {"train_loss": -25.094406127929688, "global_step": 236357, "epoch": 2847} {"train_loss": -25.146738052368164, "global_step": 236358, "epoch": 2847} {"train_loss": -24.763437271118164, "global_step": 236359, "epoch": 2847} {"train_loss": -24.85367774963379, "global_step": 236360, "epoch": 2847} {"train_loss": -24.72842025756836, "global_step": 236361, "epoch": 2847} {"train_loss": -25.12629508972168, "global_step": 236362, "epoch": 2847} {"train_loss": -24.898569107055664, "global_step": 236363, "epoch": 2847} {"train_loss": -24.621381759643555, "global_step": 236364, "epoch": 2847} {"train_loss": -25.01368522644043, "global_step": 236365, "epoch": 2847} {"train_loss": -24.778911590576172, "global_step": 236366, "epoch": 2847} {"train_loss": -25.0992488861084, "global_step": 236367, "epoch": 2847} {"train_loss": -24.561697006225586, "global_step": 236368, "epoch": 2847} {"train_loss": -24.90211296081543, "global_step": 236369, "epoch": 2847} {"train_loss": -24.441110610961914, "global_step": 236370, "epoch": 2847} {"train_loss": -24.645889282226562, "global_step": 236371, "epoch": 2847} {"train_loss": -25.13221549987793, "global_step": 236372, "epoch": 2847} {"train_loss": -24.849475860595703, "global_step": 236373, "epoch": 2847} {"train_loss": -24.85039520263672, "global_step": 236374, "epoch": 2847} {"train_loss": -24.7180233001709, "global_step": 236375, "epoch": 2847} {"train_loss": -24.775615692138672, "global_step": 236376, "epoch": 2847} {"train_loss": -25.110193252563477, "global_step": 236377, "epoch": 2847} {"train_loss": -24.936307907104492, "global_step": 236378, "epoch": 2847} {"train_loss": -24.26666259765625, "global_step": 236379, "epoch": 2847} {"train_loss": -24.639911651611328, "global_step": 236380, "epoch": 2847} {"train_loss": -24.196664810180664, "global_step": 236381, "epoch": 2847} {"train_loss": -24.3118896484375, "global_step": 236382, "epoch": 2847} {"train_loss": -24.7428179131933, "global_step": 236383, "epoch": 2847, "val_loss": 6851561.0} {"train_loss": -24.156896591186523, "global_step": 236384, "epoch": 2848} {"train_loss": -24.20241928100586, "global_step": 236385, "epoch": 2848} {"train_loss": -24.10291862487793, "global_step": 236386, "epoch": 2848} {"train_loss": -24.158123016357422, "global_step": 236387, "epoch": 2848} {"train_loss": -23.666658401489258, "global_step": 236388, "epoch": 2848} {"train_loss": -23.79770278930664, "global_step": 236389, "epoch": 2848} {"train_loss": -24.196104049682617, "global_step": 236390, "epoch": 2848} {"train_loss": -23.9060001373291, "global_step": 236391, "epoch": 2848} {"train_loss": -24.373947143554688, "global_step": 236392, "epoch": 2848} {"train_loss": -24.116901397705078, "global_step": 236393, "epoch": 2848} {"train_loss": -24.055723190307617, "global_step": 236394, "epoch": 2848} {"train_loss": -24.217430114746094, "global_step": 236395, "epoch": 2848} {"train_loss": -24.066213607788086, "global_step": 236396, "epoch": 2848} {"train_loss": -24.59772300720215, "global_step": 236397, "epoch": 2848} {"train_loss": -24.434024810791016, "global_step": 236398, "epoch": 2848} {"train_loss": -24.080480575561523, "global_step": 236399, "epoch": 2848} {"train_loss": -24.72559928894043, "global_step": 236400, "epoch": 2848} {"train_loss": -24.20741844177246, "global_step": 236401, "epoch": 2848} {"train_loss": -24.423110961914062, "global_step": 236402, "epoch": 2848} {"train_loss": -24.467147827148438, "global_step": 236403, "epoch": 2848} {"train_loss": -24.259973526000977, "global_step": 236404, "epoch": 2848} {"train_loss": -24.44721794128418, "global_step": 236405, "epoch": 2848} {"train_loss": -24.45047378540039, "global_step": 236406, "epoch": 2848} {"train_loss": -24.53793716430664, "global_step": 236407, "epoch": 2848} {"train_loss": -24.631221771240234, "global_step": 236408, "epoch": 2848} {"train_loss": -24.653188705444336, "global_step": 236409, "epoch": 2848} {"train_loss": -24.638412475585938, "global_step": 236410, "epoch": 2848} {"train_loss": -24.395673751831055, "global_step": 236411, "epoch": 2848} {"train_loss": -24.746389389038086, "global_step": 236412, "epoch": 2848} {"train_loss": -24.653974533081055, "global_step": 236413, "epoch": 2848} {"train_loss": -24.536619186401367, "global_step": 236414, "epoch": 2848} {"train_loss": -24.613483428955078, "global_step": 236415, "epoch": 2848} {"train_loss": -24.919891357421875, "global_step": 236416, "epoch": 2848} {"train_loss": -24.66533851623535, "global_step": 236417, "epoch": 2848} {"train_loss": -24.589685440063477, "global_step": 236418, "epoch": 2848} {"train_loss": -24.799102783203125, "global_step": 236419, "epoch": 2848} {"train_loss": -24.581890106201172, "global_step": 236420, "epoch": 2848} {"train_loss": -24.40523910522461, "global_step": 236421, "epoch": 2848} {"train_loss": -24.828292846679688, "global_step": 236422, "epoch": 2848} {"train_loss": -24.877334594726562, "global_step": 236423, "epoch": 2848} {"train_loss": -24.696653366088867, "global_step": 236424, "epoch": 2848} {"train_loss": -25.279190063476562, "global_step": 236425, "epoch": 2848} {"train_loss": -24.9201602935791, "global_step": 236426, "epoch": 2848} {"train_loss": -24.854063034057617, "global_step": 236427, "epoch": 2848} {"train_loss": -24.59950828552246, "global_step": 236428, "epoch": 2848} {"train_loss": -24.765522003173828, "global_step": 236429, "epoch": 2848} {"train_loss": -24.617523193359375, "global_step": 236430, "epoch": 2848} {"train_loss": -24.8167667388916, "global_step": 236431, "epoch": 2848} {"train_loss": -24.83942985534668, "global_step": 236432, "epoch": 2848} {"train_loss": -24.72490119934082, "global_step": 236433, "epoch": 2848} {"train_loss": -24.399091720581055, "global_step": 236434, "epoch": 2848} {"train_loss": -24.672908782958984, "global_step": 236435, "epoch": 2848} {"train_loss": -24.869476318359375, "global_step": 236436, "epoch": 2848} {"train_loss": -24.664535522460938, "global_step": 236437, "epoch": 2848} {"train_loss": -24.962100982666016, "global_step": 236438, "epoch": 2848} {"train_loss": -24.65290069580078, "global_step": 236439, "epoch": 2848} {"train_loss": -24.754337310791016, "global_step": 236440, "epoch": 2848} {"train_loss": -24.785192489624023, "global_step": 236441, "epoch": 2848} {"train_loss": -24.762685775756836, "global_step": 236442, "epoch": 2848} {"train_loss": -24.92238426208496, "global_step": 236443, "epoch": 2848} {"train_loss": -24.813512802124023, "global_step": 236444, "epoch": 2848} {"train_loss": -24.68707275390625, "global_step": 236445, "epoch": 2848} {"train_loss": -24.822919845581055, "global_step": 236446, "epoch": 2848} {"train_loss": -25.051870346069336, "global_step": 236447, "epoch": 2848} {"train_loss": -25.05974006652832, "global_step": 236448, "epoch": 2848} {"train_loss": -24.97137451171875, "global_step": 236449, "epoch": 2848} {"train_loss": -24.6177978515625, "global_step": 236450, "epoch": 2848} {"train_loss": -25.043636322021484, "global_step": 236451, "epoch": 2848} {"train_loss": -25.08344841003418, "global_step": 236452, "epoch": 2848} {"train_loss": -24.848787307739258, "global_step": 236453, "epoch": 2848} {"train_loss": -25.004125595092773, "global_step": 236454, "epoch": 2848} {"train_loss": -24.499542236328125, "global_step": 236455, "epoch": 2848} {"train_loss": -24.41312599182129, "global_step": 236456, "epoch": 2848} {"train_loss": -24.59583854675293, "global_step": 236457, "epoch": 2848} {"train_loss": -24.559032440185547, "global_step": 236458, "epoch": 2848} {"train_loss": -24.827802658081055, "global_step": 236459, "epoch": 2848} {"train_loss": -24.631864547729492, "global_step": 236460, "epoch": 2848} {"train_loss": -24.44646644592285, "global_step": 236461, "epoch": 2848} {"train_loss": -24.92334747314453, "global_step": 236462, "epoch": 2848} {"train_loss": -25.02491569519043, "global_step": 236463, "epoch": 2848} {"train_loss": -24.76999282836914, "global_step": 236464, "epoch": 2848} {"train_loss": -25.03337860107422, "global_step": 236465, "epoch": 2848} {"train_loss": -24.62104376827378, "global_step": 236466, "epoch": 2848, "val_loss": 6708262.0} {"train_loss": -24.6149959564209, "global_step": 236467, "epoch": 2849} {"train_loss": -24.414514541625977, "global_step": 236468, "epoch": 2849} {"train_loss": -23.847043991088867, "global_step": 236469, "epoch": 2849} {"train_loss": -24.326297760009766, "global_step": 236470, "epoch": 2849} {"train_loss": -24.476642608642578, "global_step": 236471, "epoch": 2849} {"train_loss": -24.70516014099121, "global_step": 236472, "epoch": 2849} {"train_loss": -24.311328887939453, "global_step": 236473, "epoch": 2849} {"train_loss": -24.967205047607422, "global_step": 236474, "epoch": 2849} {"train_loss": -24.645078659057617, "global_step": 236475, "epoch": 2849} {"train_loss": -24.492971420288086, "global_step": 236476, "epoch": 2849} {"train_loss": -24.598661422729492, "global_step": 236477, "epoch": 2849} {"train_loss": -24.280492782592773, "global_step": 236478, "epoch": 2849} {"train_loss": -24.918264389038086, "global_step": 236479, "epoch": 2849} {"train_loss": -24.704797744750977, "global_step": 236480, "epoch": 2849} {"train_loss": -24.710020065307617, "global_step": 236481, "epoch": 2849} {"train_loss": -24.4443359375, "global_step": 236482, "epoch": 2849} {"train_loss": -24.73750877380371, "global_step": 236483, "epoch": 2849} {"train_loss": -24.24153709411621, "global_step": 236484, "epoch": 2849} {"train_loss": -24.683469772338867, "global_step": 236485, "epoch": 2849} {"train_loss": -24.816267013549805, "global_step": 236486, "epoch": 2849} {"train_loss": -24.578622817993164, "global_step": 236487, "epoch": 2849} {"train_loss": -24.555326461791992, "global_step": 236488, "epoch": 2849} {"train_loss": -24.742918014526367, "global_step": 236489, "epoch": 2849} {"train_loss": -24.622180938720703, "global_step": 236490, "epoch": 2849} {"train_loss": -24.706573486328125, "global_step": 236491, "epoch": 2849} {"train_loss": -24.689321517944336, "global_step": 236492, "epoch": 2849} {"train_loss": -24.510082244873047, "global_step": 236493, "epoch": 2849} {"train_loss": -24.831872940063477, "global_step": 236494, "epoch": 2849} {"train_loss": -24.87395668029785, "global_step": 236495, "epoch": 2849} {"train_loss": -24.45379638671875, "global_step": 236496, "epoch": 2849} {"train_loss": -24.982807159423828, "global_step": 236497, "epoch": 2849} {"train_loss": -25.087539672851562, "global_step": 236498, "epoch": 2849} {"train_loss": -24.658178329467773, "global_step": 236499, "epoch": 2849} {"train_loss": -24.79513931274414, "global_step": 236500, "epoch": 2849} {"train_loss": -24.849227905273438, "global_step": 236501, "epoch": 2849} {"train_loss": -24.859603881835938, "global_step": 236502, "epoch": 2849} {"train_loss": -24.802906036376953, "global_step": 236503, "epoch": 2849} {"train_loss": -24.996129989624023, "global_step": 236504, "epoch": 2849} {"train_loss": -25.168851852416992, "global_step": 236505, "epoch": 2849} {"train_loss": -24.819238662719727, "global_step": 236506, "epoch": 2849} {"train_loss": -24.941926956176758, "global_step": 236507, "epoch": 2849} {"train_loss": -24.8066463470459, "global_step": 236508, "epoch": 2849} {"train_loss": -25.20547103881836, "global_step": 236509, "epoch": 2849} {"train_loss": -24.999622344970703, "global_step": 236510, "epoch": 2849} {"train_loss": -25.129423141479492, "global_step": 236511, "epoch": 2849} {"train_loss": -24.717809677124023, "global_step": 236512, "epoch": 2849} {"train_loss": -24.799848556518555, "global_step": 236513, "epoch": 2849} {"train_loss": -24.742677688598633, "global_step": 236514, "epoch": 2849} {"train_loss": -25.206592559814453, "global_step": 236515, "epoch": 2849} {"train_loss": -24.972326278686523, "global_step": 236516, "epoch": 2849} {"train_loss": -24.974746704101562, "global_step": 236517, "epoch": 2849} {"train_loss": -25.217931747436523, "global_step": 236518, "epoch": 2849} {"train_loss": -25.059240341186523, "global_step": 236519, "epoch": 2849} {"train_loss": -24.92517852783203, "global_step": 236520, "epoch": 2849} {"train_loss": -24.84584617614746, "global_step": 236521, "epoch": 2849} {"train_loss": -25.181396484375, "global_step": 236522, "epoch": 2849} {"train_loss": -24.69159507751465, "global_step": 236523, "epoch": 2849} {"train_loss": -24.43406105041504, "global_step": 236524, "epoch": 2849} {"train_loss": -24.25775718688965, "global_step": 236525, "epoch": 2849} {"train_loss": -24.398855209350586, "global_step": 236526, "epoch": 2849} {"train_loss": -24.771209716796875, "global_step": 236527, "epoch": 2849} {"train_loss": -23.893884658813477, "global_step": 236528, "epoch": 2849} {"train_loss": -23.948766708374023, "global_step": 236529, "epoch": 2849} {"train_loss": -23.765758514404297, "global_step": 236530, "epoch": 2849} {"train_loss": -24.955976486206055, "global_step": 236531, "epoch": 2849} {"train_loss": -24.52747917175293, "global_step": 236532, "epoch": 2849} {"train_loss": -24.253198623657227, "global_step": 236533, "epoch": 2849} {"train_loss": -24.339330673217773, "global_step": 236534, "epoch": 2849} {"train_loss": -24.755849838256836, "global_step": 236535, "epoch": 2849} {"train_loss": -24.633275985717773, "global_step": 236536, "epoch": 2849} {"train_loss": -24.791532516479492, "global_step": 236537, "epoch": 2849} {"train_loss": -24.12575340270996, "global_step": 236538, "epoch": 2849} {"train_loss": -24.88368797302246, "global_step": 236539, "epoch": 2849} {"train_loss": -24.72920799255371, "global_step": 236540, "epoch": 2849} {"train_loss": -24.876314163208008, "global_step": 236541, "epoch": 2849} {"train_loss": -24.35474967956543, "global_step": 236542, "epoch": 2849} {"train_loss": -24.732990264892578, "global_step": 236543, "epoch": 2849} {"train_loss": -24.565786361694336, "global_step": 236544, "epoch": 2849} {"train_loss": -24.6148738861084, "global_step": 236545, "epoch": 2849} {"train_loss": -24.931135177612305, "global_step": 236546, "epoch": 2849} {"train_loss": -24.959409713745117, "global_step": 236547, "epoch": 2849} {"train_loss": -24.89137077331543, "global_step": 236548, "epoch": 2849} {"train_loss": -24.684414875076477, "global_step": 236549, "epoch": 2849, "val_loss": 6822431.0} {"train_loss": -24.87328338623047, "global_step": 236550, "epoch": 2850} {"train_loss": -24.86441993713379, "global_step": 236551, "epoch": 2850} {"train_loss": -24.7647705078125, "global_step": 236552, "epoch": 2850} {"train_loss": -24.78035545349121, "global_step": 236553, "epoch": 2850} {"train_loss": -24.820175170898438, "global_step": 236554, "epoch": 2850} {"train_loss": -24.974233627319336, "global_step": 236555, "epoch": 2850} {"train_loss": -24.5567684173584, "global_step": 236556, "epoch": 2850} {"train_loss": -24.494245529174805, "global_step": 236557, "epoch": 2850} {"train_loss": -24.71416664123535, "global_step": 236558, "epoch": 2850} {"train_loss": -24.625051498413086, "global_step": 236559, "epoch": 2850} {"train_loss": -24.58901023864746, "global_step": 236560, "epoch": 2850} {"train_loss": -25.088287353515625, "global_step": 236561, "epoch": 2850} {"train_loss": -24.919401168823242, "global_step": 236562, "epoch": 2850} {"train_loss": -24.759601593017578, "global_step": 236563, "epoch": 2850} {"train_loss": -24.58698081970215, "global_step": 236564, "epoch": 2850} {"train_loss": -24.99566078186035, "global_step": 236565, "epoch": 2850} {"train_loss": -24.604751586914062, "global_step": 236566, "epoch": 2850} {"train_loss": -24.994848251342773, "global_step": 236567, "epoch": 2850} {"train_loss": -24.95388412475586, "global_step": 236568, "epoch": 2850} {"train_loss": -24.9171199798584, "global_step": 236569, "epoch": 2850} {"train_loss": -24.980770111083984, "global_step": 236570, "epoch": 2850} {"train_loss": -24.946243286132812, "global_step": 236571, "epoch": 2850} {"train_loss": -25.49751091003418, "global_step": 236572, "epoch": 2850} {"train_loss": -24.452138900756836, "global_step": 236573, "epoch": 2850} {"train_loss": -24.868425369262695, "global_step": 236574, "epoch": 2850} {"train_loss": -25.106760025024414, "global_step": 236575, "epoch": 2850} {"train_loss": -24.7183837890625, "global_step": 236576, "epoch": 2850} {"train_loss": -25.065763473510742, "global_step": 236577, "epoch": 2850} {"train_loss": -25.142393112182617, "global_step": 236578, "epoch": 2850} {"train_loss": -25.108030319213867, "global_step": 236579, "epoch": 2850} {"train_loss": -24.812381744384766, "global_step": 236580, "epoch": 2850} {"train_loss": -24.930898666381836, "global_step": 236581, "epoch": 2850} {"train_loss": -25.28464698791504, "global_step": 236582, "epoch": 2850} {"train_loss": -25.050796508789062, "global_step": 236583, "epoch": 2850} {"train_loss": -25.11231803894043, "global_step": 236584, "epoch": 2850} {"train_loss": -25.019330978393555, "global_step": 236585, "epoch": 2850} {"train_loss": -24.833982467651367, "global_step": 236586, "epoch": 2850} {"train_loss": -24.90797996520996, "global_step": 236587, "epoch": 2850} {"train_loss": -24.9160213470459, "global_step": 236588, "epoch": 2850} {"train_loss": -24.52743911743164, "global_step": 236589, "epoch": 2850} {"train_loss": -24.8363094329834, "global_step": 236590, "epoch": 2850} {"train_loss": -24.583051681518555, "global_step": 236591, "epoch": 2850} {"train_loss": -25.06686782836914, "global_step": 236592, "epoch": 2850} {"train_loss": -24.846593856811523, "global_step": 236593, "epoch": 2850} {"train_loss": -24.513029098510742, "global_step": 236594, "epoch": 2850} {"train_loss": -24.802745819091797, "global_step": 236595, "epoch": 2850} {"train_loss": -25.092451095581055, "global_step": 236596, "epoch": 2850} {"train_loss": -25.04811668395996, "global_step": 236597, "epoch": 2850} {"train_loss": -24.95746421813965, "global_step": 236598, "epoch": 2850} {"train_loss": -24.4780216217041, "global_step": 236599, "epoch": 2850} {"train_loss": -24.601224899291992, "global_step": 236600, "epoch": 2850} {"train_loss": -24.159896850585938, "global_step": 236601, "epoch": 2850} {"train_loss": -24.483196258544922, "global_step": 236602, "epoch": 2850} {"train_loss": -24.703256607055664, "global_step": 236603, "epoch": 2850} {"train_loss": -25.0784854888916, "global_step": 236604, "epoch": 2850} {"train_loss": -24.99787712097168, "global_step": 236605, "epoch": 2850} {"train_loss": -24.93907928466797, "global_step": 236606, "epoch": 2850} {"train_loss": -24.83966636657715, "global_step": 236607, "epoch": 2850} {"train_loss": -25.06745147705078, "global_step": 236608, "epoch": 2850} {"train_loss": -24.878843307495117, "global_step": 236609, "epoch": 2850} {"train_loss": -25.057132720947266, "global_step": 236610, "epoch": 2850} {"train_loss": -24.54596519470215, "global_step": 236611, "epoch": 2850} {"train_loss": -24.91391372680664, "global_step": 236612, "epoch": 2850} {"train_loss": -24.826980590820312, "global_step": 236613, "epoch": 2850} {"train_loss": -25.1939754486084, "global_step": 236614, "epoch": 2850} {"train_loss": -24.675378799438477, "global_step": 236615, "epoch": 2850} {"train_loss": -24.67755126953125, "global_step": 236616, "epoch": 2850} {"train_loss": -24.841711044311523, "global_step": 236617, "epoch": 2850} {"train_loss": -24.45090103149414, "global_step": 236618, "epoch": 2850} {"train_loss": -25.170141220092773, "global_step": 236619, "epoch": 2850} {"train_loss": -24.795974731445312, "global_step": 236620, "epoch": 2850} {"train_loss": -24.602869033813477, "global_step": 236621, "epoch": 2850} {"train_loss": -25.48174476623535, "global_step": 236622, "epoch": 2850} {"train_loss": -24.79158592224121, "global_step": 236623, "epoch": 2850} {"train_loss": -24.86347007751465, "global_step": 236624, "epoch": 2850} {"train_loss": -24.785037994384766, "global_step": 236625, "epoch": 2850} {"train_loss": -24.833372116088867, "global_step": 236626, "epoch": 2850} {"train_loss": -25.089033126831055, "global_step": 236627, "epoch": 2850} {"train_loss": -24.6209716796875, "global_step": 236628, "epoch": 2850} {"train_loss": -25.088703155517578, "global_step": 236629, "epoch": 2850} {"train_loss": -24.783170700073242, "global_step": 236630, "epoch": 2850} {"train_loss": -25.108327865600586, "global_step": 236631, "epoch": 2850} {"train_loss": -24.847169370536346, "global_step": 236632, "epoch": 2850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6787551.0} {"train_loss": -23.337831497192383, "global_step": 236633, "epoch": 2851} {"train_loss": -22.921741485595703, "global_step": 236634, "epoch": 2851} {"train_loss": -23.734643936157227, "global_step": 236635, "epoch": 2851} {"train_loss": -24.714468002319336, "global_step": 236636, "epoch": 2851} {"train_loss": -23.79725456237793, "global_step": 236637, "epoch": 2851} {"train_loss": -24.129926681518555, "global_step": 236638, "epoch": 2851} {"train_loss": -24.550344467163086, "global_step": 236639, "epoch": 2851} {"train_loss": -24.24979591369629, "global_step": 236640, "epoch": 2851} {"train_loss": -24.08922576904297, "global_step": 236641, "epoch": 2851} {"train_loss": -24.35038948059082, "global_step": 236642, "epoch": 2851} {"train_loss": -24.112728118896484, "global_step": 236643, "epoch": 2851} {"train_loss": -24.258832931518555, "global_step": 236644, "epoch": 2851} {"train_loss": -24.075767517089844, "global_step": 236645, "epoch": 2851} {"train_loss": -24.124364852905273, "global_step": 236646, "epoch": 2851} {"train_loss": -24.557069778442383, "global_step": 236647, "epoch": 2851} {"train_loss": -23.862577438354492, "global_step": 236648, "epoch": 2851} {"train_loss": -24.2762508392334, "global_step": 236649, "epoch": 2851} {"train_loss": -24.542203903198242, "global_step": 236650, "epoch": 2851} {"train_loss": -24.59052085876465, "global_step": 236651, "epoch": 2851} {"train_loss": -24.768198013305664, "global_step": 236652, "epoch": 2851} {"train_loss": -24.49631118774414, "global_step": 236653, "epoch": 2851} {"train_loss": -24.58958625793457, "global_step": 236654, "epoch": 2851} {"train_loss": -24.737878799438477, "global_step": 236655, "epoch": 2851} {"train_loss": -24.95345115661621, "global_step": 236656, "epoch": 2851} {"train_loss": -24.377920150756836, "global_step": 236657, "epoch": 2851} {"train_loss": -24.247556686401367, "global_step": 236658, "epoch": 2851} {"train_loss": -24.952768325805664, "global_step": 236659, "epoch": 2851} {"train_loss": -24.56797218322754, "global_step": 236660, "epoch": 2851} {"train_loss": -24.501604080200195, "global_step": 236661, "epoch": 2851} {"train_loss": -24.63948631286621, "global_step": 236662, "epoch": 2851} {"train_loss": -24.55130958557129, "global_step": 236663, "epoch": 2851} {"train_loss": -24.75679588317871, "global_step": 236664, "epoch": 2851} {"train_loss": -24.71343994140625, "global_step": 236665, "epoch": 2851} {"train_loss": -24.409605026245117, "global_step": 236666, "epoch": 2851} {"train_loss": -24.840988159179688, "global_step": 236667, "epoch": 2851} {"train_loss": -24.694791793823242, "global_step": 236668, "epoch": 2851} {"train_loss": -24.894411087036133, "global_step": 236669, "epoch": 2851} {"train_loss": -24.76186752319336, "global_step": 236670, "epoch": 2851} {"train_loss": -25.073453903198242, "global_step": 236671, "epoch": 2851} {"train_loss": -25.26022720336914, "global_step": 236672, "epoch": 2851} {"train_loss": -24.936620712280273, "global_step": 236673, "epoch": 2851} {"train_loss": -24.99297523498535, "global_step": 236674, "epoch": 2851} {"train_loss": -24.700769424438477, "global_step": 236675, "epoch": 2851} {"train_loss": -25.026411056518555, "global_step": 236676, "epoch": 2851} {"train_loss": -24.652790069580078, "global_step": 236677, "epoch": 2851} {"train_loss": -24.526874542236328, "global_step": 236678, "epoch": 2851} {"train_loss": -25.017719268798828, "global_step": 236679, "epoch": 2851} {"train_loss": -24.72919273376465, "global_step": 236680, "epoch": 2851} {"train_loss": -24.90247917175293, "global_step": 236681, "epoch": 2851} {"train_loss": -24.84926986694336, "global_step": 236682, "epoch": 2851} {"train_loss": -25.02068519592285, "global_step": 236683, "epoch": 2851} {"train_loss": -24.74921989440918, "global_step": 236684, "epoch": 2851} {"train_loss": -24.846904754638672, "global_step": 236685, "epoch": 2851} {"train_loss": -25.139467239379883, "global_step": 236686, "epoch": 2851} {"train_loss": -24.553699493408203, "global_step": 236687, "epoch": 2851} {"train_loss": -24.911819458007812, "global_step": 236688, "epoch": 2851} {"train_loss": -24.660356521606445, "global_step": 236689, "epoch": 2851} {"train_loss": -24.8923282623291, "global_step": 236690, "epoch": 2851} {"train_loss": -25.0605525970459, "global_step": 236691, "epoch": 2851} {"train_loss": -24.38386344909668, "global_step": 236692, "epoch": 2851} {"train_loss": -25.188556671142578, "global_step": 236693, "epoch": 2851} {"train_loss": -24.676359176635742, "global_step": 236694, "epoch": 2851} {"train_loss": -24.934843063354492, "global_step": 236695, "epoch": 2851} {"train_loss": -25.0557918548584, "global_step": 236696, "epoch": 2851} {"train_loss": -24.62636375427246, "global_step": 236697, "epoch": 2851} {"train_loss": -24.76658058166504, "global_step": 236698, "epoch": 2851} {"train_loss": -24.827360153198242, "global_step": 236699, "epoch": 2851} {"train_loss": -24.977426528930664, "global_step": 236700, "epoch": 2851} {"train_loss": -24.773727416992188, "global_step": 236701, "epoch": 2851} {"train_loss": -25.018665313720703, "global_step": 236702, "epoch": 2851} {"train_loss": -24.68744468688965, "global_step": 236703, "epoch": 2851} {"train_loss": -24.55722999572754, "global_step": 236704, "epoch": 2851} {"train_loss": -24.746488571166992, "global_step": 236705, "epoch": 2851} {"train_loss": -24.806716918945312, "global_step": 236706, "epoch": 2851} {"train_loss": -24.760555267333984, "global_step": 236707, "epoch": 2851} {"train_loss": -25.07478141784668, "global_step": 236708, "epoch": 2851} {"train_loss": -24.8140869140625, "global_step": 236709, "epoch": 2851} {"train_loss": -25.328832626342773, "global_step": 236710, "epoch": 2851} {"train_loss": -24.67422103881836, "global_step": 236711, "epoch": 2851} {"train_loss": -25.027311325073242, "global_step": 236712, "epoch": 2851} {"train_loss": -25.15886116027832, "global_step": 236713, "epoch": 2851} {"train_loss": -24.868261337280273, "global_step": 236714, "epoch": 2851} {"train_loss": -24.655241219394178, "global_step": 236715, "epoch": 2851, "val_loss": 6753833.0} {"train_loss": -24.563955307006836, "global_step": 236716, "epoch": 2852} {"train_loss": -24.4211368560791, "global_step": 236717, "epoch": 2852} {"train_loss": -24.799381256103516, "global_step": 236718, "epoch": 2852} {"train_loss": -24.668012619018555, "global_step": 236719, "epoch": 2852} {"train_loss": -24.776342391967773, "global_step": 236720, "epoch": 2852} {"train_loss": -24.730972290039062, "global_step": 236721, "epoch": 2852} {"train_loss": -24.593217849731445, "global_step": 236722, "epoch": 2852} {"train_loss": -24.646108627319336, "global_step": 236723, "epoch": 2852} {"train_loss": -24.508188247680664, "global_step": 236724, "epoch": 2852} {"train_loss": -24.5364933013916, "global_step": 236725, "epoch": 2852} {"train_loss": -24.887075424194336, "global_step": 236726, "epoch": 2852} {"train_loss": -24.847043991088867, "global_step": 236727, "epoch": 2852} {"train_loss": -24.901758193969727, "global_step": 236728, "epoch": 2852} {"train_loss": -24.699542999267578, "global_step": 236729, "epoch": 2852} {"train_loss": -24.844905853271484, "global_step": 236730, "epoch": 2852} {"train_loss": -24.602521896362305, "global_step": 236731, "epoch": 2852} {"train_loss": -25.10018539428711, "global_step": 236732, "epoch": 2852} {"train_loss": -24.880056381225586, "global_step": 236733, "epoch": 2852} {"train_loss": -24.654592514038086, "global_step": 236734, "epoch": 2852} {"train_loss": -24.7714900970459, "global_step": 236735, "epoch": 2852} {"train_loss": -24.968181610107422, "global_step": 236736, "epoch": 2852} {"train_loss": -24.668737411499023, "global_step": 236737, "epoch": 2852} {"train_loss": -25.014978408813477, "global_step": 236738, "epoch": 2852} {"train_loss": -24.337711334228516, "global_step": 236739, "epoch": 2852} {"train_loss": -24.710676193237305, "global_step": 236740, "epoch": 2852} {"train_loss": -24.90106201171875, "global_step": 236741, "epoch": 2852} {"train_loss": -24.55575942993164, "global_step": 236742, "epoch": 2852} {"train_loss": -24.589439392089844, "global_step": 236743, "epoch": 2852} {"train_loss": -24.871540069580078, "global_step": 236744, "epoch": 2852} {"train_loss": -24.894201278686523, "global_step": 236745, "epoch": 2852} {"train_loss": -24.71021270751953, "global_step": 236746, "epoch": 2852} {"train_loss": -24.576833724975586, "global_step": 236747, "epoch": 2852} {"train_loss": -24.92975425720215, "global_step": 236748, "epoch": 2852} {"train_loss": -24.932538986206055, "global_step": 236749, "epoch": 2852} {"train_loss": -24.745023727416992, "global_step": 236750, "epoch": 2852} {"train_loss": -24.950414657592773, "global_step": 236751, "epoch": 2852} {"train_loss": -24.6595401763916, "global_step": 236752, "epoch": 2852} {"train_loss": -24.747404098510742, "global_step": 236753, "epoch": 2852} {"train_loss": -25.001541137695312, "global_step": 236754, "epoch": 2852} {"train_loss": -25.061904907226562, "global_step": 236755, "epoch": 2852} {"train_loss": -24.962688446044922, "global_step": 236756, "epoch": 2852} {"train_loss": -24.998188018798828, "global_step": 236757, "epoch": 2852} {"train_loss": -24.770313262939453, "global_step": 236758, "epoch": 2852} {"train_loss": -25.04047966003418, "global_step": 236759, "epoch": 2852} {"train_loss": -24.655942916870117, "global_step": 236760, "epoch": 2852} {"train_loss": -24.82331657409668, "global_step": 236761, "epoch": 2852} {"train_loss": -24.44887351989746, "global_step": 236762, "epoch": 2852} {"train_loss": -24.729068756103516, "global_step": 236763, "epoch": 2852} {"train_loss": -24.69832992553711, "global_step": 236764, "epoch": 2852} {"train_loss": -24.439756393432617, "global_step": 236765, "epoch": 2852} {"train_loss": -24.991806030273438, "global_step": 236766, "epoch": 2852} {"train_loss": -24.680784225463867, "global_step": 236767, "epoch": 2852} {"train_loss": -24.509754180908203, "global_step": 236768, "epoch": 2852} {"train_loss": -24.71442985534668, "global_step": 236769, "epoch": 2852} {"train_loss": -24.95996856689453, "global_step": 236770, "epoch": 2852} {"train_loss": -24.81315040588379, "global_step": 236771, "epoch": 2852} {"train_loss": -24.761014938354492, "global_step": 236772, "epoch": 2852} {"train_loss": -24.64186668395996, "global_step": 236773, "epoch": 2852} {"train_loss": -24.675430297851562, "global_step": 236774, "epoch": 2852} {"train_loss": -25.115196228027344, "global_step": 236775, "epoch": 2852} {"train_loss": -24.67714500427246, "global_step": 236776, "epoch": 2852} {"train_loss": -25.212379455566406, "global_step": 236777, "epoch": 2852} {"train_loss": -24.831693649291992, "global_step": 236778, "epoch": 2852} {"train_loss": -24.34305191040039, "global_step": 236779, "epoch": 2852} {"train_loss": -24.190107345581055, "global_step": 236780, "epoch": 2852} {"train_loss": -25.001798629760742, "global_step": 236781, "epoch": 2852} {"train_loss": -25.033039093017578, "global_step": 236782, "epoch": 2852} {"train_loss": -24.66463279724121, "global_step": 236783, "epoch": 2852} {"train_loss": -24.968734741210938, "global_step": 236784, "epoch": 2852} {"train_loss": -24.879581451416016, "global_step": 236785, "epoch": 2852} {"train_loss": -24.914236068725586, "global_step": 236786, "epoch": 2852} {"train_loss": -25.024581909179688, "global_step": 236787, "epoch": 2852} {"train_loss": -24.500282287597656, "global_step": 236788, "epoch": 2852} {"train_loss": -24.960660934448242, "global_step": 236789, "epoch": 2852} {"train_loss": -24.60636329650879, "global_step": 236790, "epoch": 2852} {"train_loss": -24.754825592041016, "global_step": 236791, "epoch": 2852} {"train_loss": -24.93731117248535, "global_step": 236792, "epoch": 2852} {"train_loss": -24.974628448486328, "global_step": 236793, "epoch": 2852} {"train_loss": -25.003253936767578, "global_step": 236794, "epoch": 2852} {"train_loss": -24.833677291870117, "global_step": 236795, "epoch": 2852} {"train_loss": -24.679616928100586, "global_step": 236796, "epoch": 2852} {"train_loss": -24.880624771118164, "global_step": 236797, "epoch": 2852} {"train_loss": -24.77111735975886, "global_step": 236798, "epoch": 2852, "val_loss": 6832956.0} {"train_loss": -24.545452117919922, "global_step": 236799, "epoch": 2853} {"train_loss": -24.319965362548828, "global_step": 236800, "epoch": 2853} {"train_loss": -24.69066047668457, "global_step": 236801, "epoch": 2853} {"train_loss": -24.60175132751465, "global_step": 236802, "epoch": 2853} {"train_loss": -24.57770347595215, "global_step": 236803, "epoch": 2853} {"train_loss": -24.811811447143555, "global_step": 236804, "epoch": 2853} {"train_loss": -24.90843963623047, "global_step": 236805, "epoch": 2853} {"train_loss": -24.912927627563477, "global_step": 236806, "epoch": 2853} {"train_loss": -25.08473777770996, "global_step": 236807, "epoch": 2853} {"train_loss": -24.86680793762207, "global_step": 236808, "epoch": 2853} {"train_loss": -24.7156925201416, "global_step": 236809, "epoch": 2853} {"train_loss": -24.730703353881836, "global_step": 236810, "epoch": 2853} {"train_loss": -24.618806838989258, "global_step": 236811, "epoch": 2853} {"train_loss": -24.735090255737305, "global_step": 236812, "epoch": 2853} {"train_loss": -24.616596221923828, "global_step": 236813, "epoch": 2853} {"train_loss": -25.096454620361328, "global_step": 236814, "epoch": 2853} {"train_loss": -24.84261131286621, "global_step": 236815, "epoch": 2853} {"train_loss": -24.937742233276367, "global_step": 236816, "epoch": 2853} {"train_loss": -24.77485466003418, "global_step": 236817, "epoch": 2853} {"train_loss": -24.839488983154297, "global_step": 236818, "epoch": 2853} {"train_loss": -24.753969192504883, "global_step": 236819, "epoch": 2853} {"train_loss": -24.673128128051758, "global_step": 236820, "epoch": 2853} {"train_loss": -24.730152130126953, "global_step": 236821, "epoch": 2853} {"train_loss": -25.06624984741211, "global_step": 236822, "epoch": 2853} {"train_loss": -24.908315658569336, "global_step": 236823, "epoch": 2853} {"train_loss": -25.088590621948242, "global_step": 236824, "epoch": 2853} {"train_loss": -24.433074951171875, "global_step": 236825, "epoch": 2853} {"train_loss": -25.12725830078125, "global_step": 236826, "epoch": 2853} {"train_loss": -24.955854415893555, "global_step": 236827, "epoch": 2853} {"train_loss": -24.89539909362793, "global_step": 236828, "epoch": 2853} {"train_loss": -24.8730525970459, "global_step": 236829, "epoch": 2853} {"train_loss": -24.91761589050293, "global_step": 236830, "epoch": 2853} {"train_loss": -24.98976707458496, "global_step": 236831, "epoch": 2853} {"train_loss": -24.978696823120117, "global_step": 236832, "epoch": 2853} {"train_loss": -25.110504150390625, "global_step": 236833, "epoch": 2853} {"train_loss": -24.89419937133789, "global_step": 236834, "epoch": 2853} {"train_loss": -24.987699508666992, "global_step": 236835, "epoch": 2853} {"train_loss": -25.10992431640625, "global_step": 236836, "epoch": 2853} {"train_loss": -25.144332885742188, "global_step": 236837, "epoch": 2853} {"train_loss": -24.66864776611328, "global_step": 236838, "epoch": 2853} {"train_loss": -24.717676162719727, "global_step": 236839, "epoch": 2853} {"train_loss": -25.020429611206055, "global_step": 236840, "epoch": 2853} {"train_loss": -24.85702896118164, "global_step": 236841, "epoch": 2853} {"train_loss": -25.104923248291016, "global_step": 236842, "epoch": 2853} {"train_loss": -24.821008682250977, "global_step": 236843, "epoch": 2853} {"train_loss": -24.664365768432617, "global_step": 236844, "epoch": 2853} {"train_loss": -24.807292938232422, "global_step": 236845, "epoch": 2853} {"train_loss": -24.9422550201416, "global_step": 236846, "epoch": 2853} {"train_loss": -24.8537654876709, "global_step": 236847, "epoch": 2853} {"train_loss": -24.478586196899414, "global_step": 236848, "epoch": 2853} {"train_loss": -24.6632080078125, "global_step": 236849, "epoch": 2853} {"train_loss": -25.260520935058594, "global_step": 236850, "epoch": 2853} {"train_loss": -24.681421279907227, "global_step": 236851, "epoch": 2853} {"train_loss": -24.727352142333984, "global_step": 236852, "epoch": 2853} {"train_loss": -25.214719772338867, "global_step": 236853, "epoch": 2853} {"train_loss": -24.76835060119629, "global_step": 236854, "epoch": 2853} {"train_loss": -25.159597396850586, "global_step": 236855, "epoch": 2853} {"train_loss": -24.805952072143555, "global_step": 236856, "epoch": 2853} {"train_loss": -25.15934181213379, "global_step": 236857, "epoch": 2853} {"train_loss": -25.039342880249023, "global_step": 236858, "epoch": 2853} {"train_loss": -24.695234298706055, "global_step": 236859, "epoch": 2853} {"train_loss": -24.20147705078125, "global_step": 236860, "epoch": 2853} {"train_loss": -24.877246856689453, "global_step": 236861, "epoch": 2853} {"train_loss": -24.75946617126465, "global_step": 236862, "epoch": 2853} {"train_loss": -24.687978744506836, "global_step": 236863, "epoch": 2853} {"train_loss": -24.454435348510742, "global_step": 236864, "epoch": 2853} {"train_loss": -24.609954833984375, "global_step": 236865, "epoch": 2853} {"train_loss": -25.0201473236084, "global_step": 236866, "epoch": 2853} {"train_loss": -25.059675216674805, "global_step": 236867, "epoch": 2853} {"train_loss": -24.560932159423828, "global_step": 236868, "epoch": 2853} {"train_loss": -25.097515106201172, "global_step": 236869, "epoch": 2853} {"train_loss": -24.987016677856445, "global_step": 236870, "epoch": 2853} {"train_loss": -24.801544189453125, "global_step": 236871, "epoch": 2853} {"train_loss": -24.9602108001709, "global_step": 236872, "epoch": 2853} {"train_loss": -24.90152359008789, "global_step": 236873, "epoch": 2853} {"train_loss": -25.0561466217041, "global_step": 236874, "epoch": 2853} {"train_loss": -24.955411911010742, "global_step": 236875, "epoch": 2853} {"train_loss": -24.56221580505371, "global_step": 236876, "epoch": 2853} {"train_loss": -24.87057876586914, "global_step": 236877, "epoch": 2853} {"train_loss": -25.036405563354492, "global_step": 236878, "epoch": 2853} {"train_loss": -25.03337287902832, "global_step": 236879, "epoch": 2853} {"train_loss": -24.696548461914062, "global_step": 236880, "epoch": 2853} {"train_loss": -24.837564100702124, "global_step": 236881, "epoch": 2853, "val_loss": 6688584.0} {"train_loss": -23.34961700439453, "global_step": 236882, "epoch": 2854} {"train_loss": -23.620569229125977, "global_step": 236883, "epoch": 2854} {"train_loss": -24.4890079498291, "global_step": 236884, "epoch": 2854} {"train_loss": -23.71677017211914, "global_step": 236885, "epoch": 2854} {"train_loss": -24.15828514099121, "global_step": 236886, "epoch": 2854} {"train_loss": -23.585779190063477, "global_step": 236887, "epoch": 2854} {"train_loss": -24.619131088256836, "global_step": 236888, "epoch": 2854} {"train_loss": -24.42241096496582, "global_step": 236889, "epoch": 2854} {"train_loss": -24.529865264892578, "global_step": 236890, "epoch": 2854} {"train_loss": -24.11612892150879, "global_step": 236891, "epoch": 2854} {"train_loss": -24.758100509643555, "global_step": 236892, "epoch": 2854} {"train_loss": -24.764286041259766, "global_step": 236893, "epoch": 2854} {"train_loss": -24.530012130737305, "global_step": 236894, "epoch": 2854} {"train_loss": -24.4832763671875, "global_step": 236895, "epoch": 2854} {"train_loss": -24.606897354125977, "global_step": 236896, "epoch": 2854} {"train_loss": -24.455984115600586, "global_step": 236897, "epoch": 2854} {"train_loss": -24.46837615966797, "global_step": 236898, "epoch": 2854} {"train_loss": -24.516782760620117, "global_step": 236899, "epoch": 2854} {"train_loss": -24.639841079711914, "global_step": 236900, "epoch": 2854} {"train_loss": -24.332630157470703, "global_step": 236901, "epoch": 2854} {"train_loss": -24.68442153930664, "global_step": 236902, "epoch": 2854} {"train_loss": -24.237442016601562, "global_step": 236903, "epoch": 2854} {"train_loss": -24.48042106628418, "global_step": 236904, "epoch": 2854} {"train_loss": -24.9194393157959, "global_step": 236905, "epoch": 2854} {"train_loss": -24.359460830688477, "global_step": 236906, "epoch": 2854} {"train_loss": -24.86726951599121, "global_step": 236907, "epoch": 2854} {"train_loss": -24.631200790405273, "global_step": 236908, "epoch": 2854} {"train_loss": -24.760107040405273, "global_step": 236909, "epoch": 2854} {"train_loss": -24.591373443603516, "global_step": 236910, "epoch": 2854} {"train_loss": -24.856130599975586, "global_step": 236911, "epoch": 2854} {"train_loss": -25.13147735595703, "global_step": 236912, "epoch": 2854} {"train_loss": -25.02694320678711, "global_step": 236913, "epoch": 2854} {"train_loss": -24.72760009765625, "global_step": 236914, "epoch": 2854} {"train_loss": -25.05694007873535, "global_step": 236915, "epoch": 2854} {"train_loss": -25.28360366821289, "global_step": 236916, "epoch": 2854} {"train_loss": -24.857206344604492, "global_step": 236917, "epoch": 2854} {"train_loss": -24.6231632232666, "global_step": 236918, "epoch": 2854} {"train_loss": -24.49812126159668, "global_step": 236919, "epoch": 2854} {"train_loss": -25.25421714782715, "global_step": 236920, "epoch": 2854} {"train_loss": -24.795700073242188, "global_step": 236921, "epoch": 2854} {"train_loss": -24.914766311645508, "global_step": 236922, "epoch": 2854} {"train_loss": -25.06648826599121, "global_step": 236923, "epoch": 2854} {"train_loss": -24.845552444458008, "global_step": 236924, "epoch": 2854} {"train_loss": -24.627899169921875, "global_step": 236925, "epoch": 2854} {"train_loss": -24.635669708251953, "global_step": 236926, "epoch": 2854} {"train_loss": -24.8095703125, "global_step": 236927, "epoch": 2854} {"train_loss": -24.387874603271484, "global_step": 236928, "epoch": 2854} {"train_loss": -25.045085906982422, "global_step": 236929, "epoch": 2854} {"train_loss": -24.892438888549805, "global_step": 236930, "epoch": 2854} {"train_loss": -25.17500877380371, "global_step": 236931, "epoch": 2854} {"train_loss": -24.906225204467773, "global_step": 236932, "epoch": 2854} {"train_loss": -24.808195114135742, "global_step": 236933, "epoch": 2854} {"train_loss": -24.921010971069336, "global_step": 236934, "epoch": 2854} {"train_loss": -24.9077205657959, "global_step": 236935, "epoch": 2854} {"train_loss": -24.4974422454834, "global_step": 236936, "epoch": 2854} {"train_loss": -24.950489044189453, "global_step": 236937, "epoch": 2854} {"train_loss": -24.754072189331055, "global_step": 236938, "epoch": 2854} {"train_loss": -24.92445182800293, "global_step": 236939, "epoch": 2854} {"train_loss": -24.526819229125977, "global_step": 236940, "epoch": 2854} {"train_loss": -24.55747413635254, "global_step": 236941, "epoch": 2854} {"train_loss": -24.15349006652832, "global_step": 236942, "epoch": 2854} {"train_loss": -23.985015869140625, "global_step": 236943, "epoch": 2854} {"train_loss": -24.80289649963379, "global_step": 236944, "epoch": 2854} {"train_loss": -24.813405990600586, "global_step": 236945, "epoch": 2854} {"train_loss": -24.679729461669922, "global_step": 236946, "epoch": 2854} {"train_loss": -24.802148818969727, "global_step": 236947, "epoch": 2854} {"train_loss": -24.779273986816406, "global_step": 236948, "epoch": 2854} {"train_loss": -24.947500228881836, "global_step": 236949, "epoch": 2854} {"train_loss": -24.785810470581055, "global_step": 236950, "epoch": 2854} {"train_loss": -25.096128463745117, "global_step": 236951, "epoch": 2854} {"train_loss": -24.92658805847168, "global_step": 236952, "epoch": 2854} {"train_loss": -25.016590118408203, "global_step": 236953, "epoch": 2854} {"train_loss": -24.81666374206543, "global_step": 236954, "epoch": 2854} {"train_loss": -24.776723861694336, "global_step": 236955, "epoch": 2854} {"train_loss": -24.697309494018555, "global_step": 236956, "epoch": 2854} {"train_loss": -24.92506980895996, "global_step": 236957, "epoch": 2854} {"train_loss": -25.028614044189453, "global_step": 236958, "epoch": 2854} {"train_loss": -24.710128784179688, "global_step": 236959, "epoch": 2854} {"train_loss": -24.504369735717773, "global_step": 236960, "epoch": 2854} {"train_loss": -24.77035903930664, "global_step": 236961, "epoch": 2854} {"train_loss": -25.08953857421875, "global_step": 236962, "epoch": 2854} {"train_loss": -24.46375846862793, "global_step": 236963, "epoch": 2854} {"train_loss": -24.665269644863635, "global_step": 236964, "epoch": 2854, "val_loss": 6684785.0} {"train_loss": -24.37390899658203, "global_step": 236965, "epoch": 2855} {"train_loss": -24.7615909576416, "global_step": 236966, "epoch": 2855} {"train_loss": -24.96481704711914, "global_step": 236967, "epoch": 2855} {"train_loss": -24.53338623046875, "global_step": 236968, "epoch": 2855} {"train_loss": -24.5344181060791, "global_step": 236969, "epoch": 2855} {"train_loss": -24.586362838745117, "global_step": 236970, "epoch": 2855} {"train_loss": -24.73805046081543, "global_step": 236971, "epoch": 2855} {"train_loss": -24.264280319213867, "global_step": 236972, "epoch": 2855} {"train_loss": -24.666845321655273, "global_step": 236973, "epoch": 2855} {"train_loss": -24.530202865600586, "global_step": 236974, "epoch": 2855} {"train_loss": -24.634248733520508, "global_step": 236975, "epoch": 2855} {"train_loss": -24.847749710083008, "global_step": 236976, "epoch": 2855} {"train_loss": -24.5169677734375, "global_step": 236977, "epoch": 2855} {"train_loss": -24.4892635345459, "global_step": 236978, "epoch": 2855} {"train_loss": -24.96953773498535, "global_step": 236979, "epoch": 2855} {"train_loss": -24.36859130859375, "global_step": 236980, "epoch": 2855} {"train_loss": -24.872522354125977, "global_step": 236981, "epoch": 2855} {"train_loss": -24.949731826782227, "global_step": 236982, "epoch": 2855} {"train_loss": -24.812162399291992, "global_step": 236983, "epoch": 2855} {"train_loss": -24.45612144470215, "global_step": 236984, "epoch": 2855} {"train_loss": -24.432348251342773, "global_step": 236985, "epoch": 2855} {"train_loss": -24.849445343017578, "global_step": 236986, "epoch": 2855} {"train_loss": -24.258447647094727, "global_step": 236987, "epoch": 2855} {"train_loss": -24.91727066040039, "global_step": 236988, "epoch": 2855} {"train_loss": -24.426067352294922, "global_step": 236989, "epoch": 2855} {"train_loss": -24.56642723083496, "global_step": 236990, "epoch": 2855} {"train_loss": -24.927120208740234, "global_step": 236991, "epoch": 2855} {"train_loss": -24.63857650756836, "global_step": 236992, "epoch": 2855} {"train_loss": -24.795581817626953, "global_step": 236993, "epoch": 2855} {"train_loss": -24.410919189453125, "global_step": 236994, "epoch": 2855} {"train_loss": -24.33121681213379, "global_step": 236995, "epoch": 2855} {"train_loss": -24.801244735717773, "global_step": 236996, "epoch": 2855} {"train_loss": -24.614444732666016, "global_step": 236997, "epoch": 2855} {"train_loss": -24.570453643798828, "global_step": 236998, "epoch": 2855} {"train_loss": -24.67616844177246, "global_step": 236999, "epoch": 2855} {"train_loss": -24.744720458984375, "global_step": 237000, "epoch": 2855} {"train_loss": -24.602733612060547, "global_step": 237001, "epoch": 2855} {"train_loss": -25.018850326538086, "global_step": 237002, "epoch": 2855} {"train_loss": -24.405471801757812, "global_step": 237003, "epoch": 2855} {"train_loss": -24.742034912109375, "global_step": 237004, "epoch": 2855} {"train_loss": -25.147050857543945, "global_step": 237005, "epoch": 2855} {"train_loss": -24.77805519104004, "global_step": 237006, "epoch": 2855} {"train_loss": -24.945959091186523, "global_step": 237007, "epoch": 2855} {"train_loss": -24.563322067260742, "global_step": 237008, "epoch": 2855} {"train_loss": -24.694721221923828, "global_step": 237009, "epoch": 2855} {"train_loss": -25.012256622314453, "global_step": 237010, "epoch": 2855} {"train_loss": -25.083547592163086, "global_step": 237011, "epoch": 2855} {"train_loss": -24.81963539123535, "global_step": 237012, "epoch": 2855} {"train_loss": -24.714338302612305, "global_step": 237013, "epoch": 2855} {"train_loss": -24.84186363220215, "global_step": 237014, "epoch": 2855} {"train_loss": -24.827356338500977, "global_step": 237015, "epoch": 2855} {"train_loss": -24.802621841430664, "global_step": 237016, "epoch": 2855} {"train_loss": -24.814361572265625, "global_step": 237017, "epoch": 2855} {"train_loss": -24.92561912536621, "global_step": 237018, "epoch": 2855} {"train_loss": -24.811620712280273, "global_step": 237019, "epoch": 2855} {"train_loss": -24.71676254272461, "global_step": 237020, "epoch": 2855} {"train_loss": -25.071088790893555, "global_step": 237021, "epoch": 2855} {"train_loss": -24.994504928588867, "global_step": 237022, "epoch": 2855} {"train_loss": -24.45528221130371, "global_step": 237023, "epoch": 2855} {"train_loss": -24.596174240112305, "global_step": 237024, "epoch": 2855} {"train_loss": -24.544151306152344, "global_step": 237025, "epoch": 2855} {"train_loss": -24.9185848236084, "global_step": 237026, "epoch": 2855} {"train_loss": -24.639896392822266, "global_step": 237027, "epoch": 2855} {"train_loss": -25.01007080078125, "global_step": 237028, "epoch": 2855} {"train_loss": -24.888071060180664, "global_step": 237029, "epoch": 2855} {"train_loss": -24.692777633666992, "global_step": 237030, "epoch": 2855} {"train_loss": -24.93560791015625, "global_step": 237031, "epoch": 2855} {"train_loss": -24.810245513916016, "global_step": 237032, "epoch": 2855} {"train_loss": -24.81412124633789, "global_step": 237033, "epoch": 2855} {"train_loss": -25.125394821166992, "global_step": 237034, "epoch": 2855} {"train_loss": -24.7115535736084, "global_step": 237035, "epoch": 2855} {"train_loss": -24.751806259155273, "global_step": 237036, "epoch": 2855} {"train_loss": -25.070234298706055, "global_step": 237037, "epoch": 2855} {"train_loss": -25.28046417236328, "global_step": 237038, "epoch": 2855} {"train_loss": -24.932703018188477, "global_step": 237039, "epoch": 2855} {"train_loss": -24.580718994140625, "global_step": 237040, "epoch": 2855} {"train_loss": -25.160892486572266, "global_step": 237041, "epoch": 2855} {"train_loss": -24.671615600585938, "global_step": 237042, "epoch": 2855} {"train_loss": -24.948274612426758, "global_step": 237043, "epoch": 2855} {"train_loss": -24.92580223083496, "global_step": 237044, "epoch": 2855} {"train_loss": -24.98992919921875, "global_step": 237045, "epoch": 2855} {"train_loss": -25.224258422851562, "global_step": 237046, "epoch": 2855} {"train_loss": -24.756983377847327, "global_step": 237047, "epoch": 2855, "val_loss": 6767470.0} {"train_loss": -24.42670249938965, "global_step": 237048, "epoch": 2856} {"train_loss": -24.24183464050293, "global_step": 237049, "epoch": 2856} {"train_loss": -24.83829689025879, "global_step": 237050, "epoch": 2856} {"train_loss": -24.595731735229492, "global_step": 237051, "epoch": 2856} {"train_loss": -24.942716598510742, "global_step": 237052, "epoch": 2856} {"train_loss": -24.592124938964844, "global_step": 237053, "epoch": 2856} {"train_loss": -25.146728515625, "global_step": 237054, "epoch": 2856} {"train_loss": -24.789766311645508, "global_step": 237055, "epoch": 2856} {"train_loss": -24.664291381835938, "global_step": 237056, "epoch": 2856} {"train_loss": -24.746112823486328, "global_step": 237057, "epoch": 2856} {"train_loss": -24.673913955688477, "global_step": 237058, "epoch": 2856} {"train_loss": -24.994977951049805, "global_step": 237059, "epoch": 2856} {"train_loss": -24.459529876708984, "global_step": 237060, "epoch": 2856} {"train_loss": -24.841327667236328, "global_step": 237061, "epoch": 2856} {"train_loss": -24.6728458404541, "global_step": 237062, "epoch": 2856} {"train_loss": -24.868520736694336, "global_step": 237063, "epoch": 2856} {"train_loss": -24.94496726989746, "global_step": 237064, "epoch": 2856} {"train_loss": -24.89118766784668, "global_step": 237065, "epoch": 2856} {"train_loss": -24.78273582458496, "global_step": 237066, "epoch": 2856} {"train_loss": -24.79966163635254, "global_step": 237067, "epoch": 2856} {"train_loss": -24.966665267944336, "global_step": 237068, "epoch": 2856} {"train_loss": -24.85017204284668, "global_step": 237069, "epoch": 2856} {"train_loss": -24.760900497436523, "global_step": 237070, "epoch": 2856} {"train_loss": -24.753681182861328, "global_step": 237071, "epoch": 2856} {"train_loss": -24.94742774963379, "global_step": 237072, "epoch": 2856} {"train_loss": -25.23507308959961, "global_step": 237073, "epoch": 2856} {"train_loss": -24.754356384277344, "global_step": 237074, "epoch": 2856} {"train_loss": -25.133991241455078, "global_step": 237075, "epoch": 2856} {"train_loss": -25.118627548217773, "global_step": 237076, "epoch": 2856} {"train_loss": -24.74018669128418, "global_step": 237077, "epoch": 2856} {"train_loss": -25.211713790893555, "global_step": 237078, "epoch": 2856} {"train_loss": -24.833393096923828, "global_step": 237079, "epoch": 2856} {"train_loss": -25.04146385192871, "global_step": 237080, "epoch": 2856} {"train_loss": -24.899309158325195, "global_step": 237081, "epoch": 2856} {"train_loss": -24.87947654724121, "global_step": 237082, "epoch": 2856} {"train_loss": -25.197555541992188, "global_step": 237083, "epoch": 2856} {"train_loss": -24.678495407104492, "global_step": 237084, "epoch": 2856} {"train_loss": -25.238937377929688, "global_step": 237085, "epoch": 2856} {"train_loss": -24.662240982055664, "global_step": 237086, "epoch": 2856} {"train_loss": -24.87193489074707, "global_step": 237087, "epoch": 2856} {"train_loss": -24.883438110351562, "global_step": 237088, "epoch": 2856} {"train_loss": -24.769540786743164, "global_step": 237089, "epoch": 2856} {"train_loss": -24.168724060058594, "global_step": 237090, "epoch": 2856} {"train_loss": -23.5379581451416, "global_step": 237091, "epoch": 2856} {"train_loss": -24.230106353759766, "global_step": 237092, "epoch": 2856} {"train_loss": -24.17641258239746, "global_step": 237093, "epoch": 2856} {"train_loss": -24.1231632232666, "global_step": 237094, "epoch": 2856} {"train_loss": -25.054304122924805, "global_step": 237095, "epoch": 2856} {"train_loss": -24.258390426635742, "global_step": 237096, "epoch": 2856} {"train_loss": -24.68609619140625, "global_step": 237097, "epoch": 2856} {"train_loss": -24.454214096069336, "global_step": 237098, "epoch": 2856} {"train_loss": -24.39546775817871, "global_step": 237099, "epoch": 2856} {"train_loss": -24.249082565307617, "global_step": 237100, "epoch": 2856} {"train_loss": -24.246124267578125, "global_step": 237101, "epoch": 2856} {"train_loss": -24.41034507751465, "global_step": 237102, "epoch": 2856} {"train_loss": -24.69858741760254, "global_step": 237103, "epoch": 2856} {"train_loss": -24.81599998474121, "global_step": 237104, "epoch": 2856} {"train_loss": -24.47525405883789, "global_step": 237105, "epoch": 2856} {"train_loss": -24.39946937561035, "global_step": 237106, "epoch": 2856} {"train_loss": -24.68845558166504, "global_step": 237107, "epoch": 2856} {"train_loss": -24.72633934020996, "global_step": 237108, "epoch": 2856} {"train_loss": -24.584516525268555, "global_step": 237109, "epoch": 2856} {"train_loss": -24.953567504882812, "global_step": 237110, "epoch": 2856} {"train_loss": -24.71791648864746, "global_step": 237111, "epoch": 2856} {"train_loss": -24.901737213134766, "global_step": 237112, "epoch": 2856} {"train_loss": -24.592679977416992, "global_step": 237113, "epoch": 2856} {"train_loss": -24.883451461791992, "global_step": 237114, "epoch": 2856} {"train_loss": -24.703779220581055, "global_step": 237115, "epoch": 2856} {"train_loss": -24.61366081237793, "global_step": 237116, "epoch": 2856} {"train_loss": -24.615095138549805, "global_step": 237117, "epoch": 2856} {"train_loss": -24.90113639831543, "global_step": 237118, "epoch": 2856} {"train_loss": -24.939359664916992, "global_step": 237119, "epoch": 2856} {"train_loss": -24.855056762695312, "global_step": 237120, "epoch": 2856} {"train_loss": -24.778181076049805, "global_step": 237121, "epoch": 2856} {"train_loss": -24.450363159179688, "global_step": 237122, "epoch": 2856} {"train_loss": -24.99240493774414, "global_step": 237123, "epoch": 2856} {"train_loss": -25.01153564453125, "global_step": 237124, "epoch": 2856} {"train_loss": -24.84229850769043, "global_step": 237125, "epoch": 2856} {"train_loss": -25.187549591064453, "global_step": 237126, "epoch": 2856} {"train_loss": -24.919864654541016, "global_step": 237127, "epoch": 2856} {"train_loss": -24.755084991455078, "global_step": 237128, "epoch": 2856} {"train_loss": -24.737836837768555, "global_step": 237129, "epoch": 2856} {"train_loss": -24.742642919701265, "global_step": 237130, "epoch": 2856, "val_loss": 6790071.0} {"train_loss": -24.01511573791504, "global_step": 237131, "epoch": 2857} {"train_loss": -23.60133171081543, "global_step": 237132, "epoch": 2857} {"train_loss": -24.203510284423828, "global_step": 237133, "epoch": 2857} {"train_loss": -24.68899917602539, "global_step": 237134, "epoch": 2857} {"train_loss": -24.327335357666016, "global_step": 237135, "epoch": 2857} {"train_loss": -24.203153610229492, "global_step": 237136, "epoch": 2857} {"train_loss": -24.39701271057129, "global_step": 237137, "epoch": 2857} {"train_loss": -24.438119888305664, "global_step": 237138, "epoch": 2857} {"train_loss": -24.23419952392578, "global_step": 237139, "epoch": 2857} {"train_loss": -24.24651527404785, "global_step": 237140, "epoch": 2857} {"train_loss": -24.580066680908203, "global_step": 237141, "epoch": 2857} {"train_loss": -24.4034423828125, "global_step": 237142, "epoch": 2857} {"train_loss": -24.012704849243164, "global_step": 237143, "epoch": 2857} {"train_loss": -24.37461280822754, "global_step": 237144, "epoch": 2857} {"train_loss": -24.472043991088867, "global_step": 237145, "epoch": 2857} {"train_loss": -24.43337631225586, "global_step": 237146, "epoch": 2857} {"train_loss": -24.888042449951172, "global_step": 237147, "epoch": 2857} {"train_loss": -24.776031494140625, "global_step": 237148, "epoch": 2857} {"train_loss": -24.76286506652832, "global_step": 237149, "epoch": 2857} {"train_loss": -24.757118225097656, "global_step": 237150, "epoch": 2857} {"train_loss": -24.506677627563477, "global_step": 237151, "epoch": 2857} {"train_loss": -24.821569442749023, "global_step": 237152, "epoch": 2857} {"train_loss": -24.509328842163086, "global_step": 237153, "epoch": 2857} {"train_loss": -24.898296356201172, "global_step": 237154, "epoch": 2857} {"train_loss": -24.555383682250977, "global_step": 237155, "epoch": 2857} {"train_loss": -24.88161277770996, "global_step": 237156, "epoch": 2857} {"train_loss": -25.15427017211914, "global_step": 237157, "epoch": 2857} {"train_loss": -24.846240997314453, "global_step": 237158, "epoch": 2857} {"train_loss": -24.4877986907959, "global_step": 237159, "epoch": 2857} {"train_loss": -24.834585189819336, "global_step": 237160, "epoch": 2857} {"train_loss": -24.864118576049805, "global_step": 237161, "epoch": 2857} {"train_loss": -24.7426700592041, "global_step": 237162, "epoch": 2857} {"train_loss": -24.692237854003906, "global_step": 237163, "epoch": 2857} {"train_loss": -24.83568000793457, "global_step": 237164, "epoch": 2857} {"train_loss": -25.069608688354492, "global_step": 237165, "epoch": 2857} {"train_loss": -24.723234176635742, "global_step": 237166, "epoch": 2857} {"train_loss": -25.0400333404541, "global_step": 237167, "epoch": 2857} {"train_loss": -24.94528579711914, "global_step": 237168, "epoch": 2857} {"train_loss": -24.8880615234375, "global_step": 237169, "epoch": 2857} {"train_loss": -24.89875602722168, "global_step": 237170, "epoch": 2857} {"train_loss": -25.12228775024414, "global_step": 237171, "epoch": 2857} {"train_loss": -25.086488723754883, "global_step": 237172, "epoch": 2857} {"train_loss": -24.874492645263672, "global_step": 237173, "epoch": 2857} {"train_loss": -25.016813278198242, "global_step": 237174, "epoch": 2857} {"train_loss": -24.624683380126953, "global_step": 237175, "epoch": 2857} {"train_loss": -24.558685302734375, "global_step": 237176, "epoch": 2857} {"train_loss": -24.669946670532227, "global_step": 237177, "epoch": 2857} {"train_loss": -24.92426300048828, "global_step": 237178, "epoch": 2857} {"train_loss": -25.136341094970703, "global_step": 237179, "epoch": 2857} {"train_loss": -24.288999557495117, "global_step": 237180, "epoch": 2857} {"train_loss": -24.450931549072266, "global_step": 237181, "epoch": 2857} {"train_loss": -24.444149017333984, "global_step": 237182, "epoch": 2857} {"train_loss": -24.66840934753418, "global_step": 237183, "epoch": 2857} {"train_loss": -24.75519371032715, "global_step": 237184, "epoch": 2857} {"train_loss": -24.592588424682617, "global_step": 237185, "epoch": 2857} {"train_loss": -24.851285934448242, "global_step": 237186, "epoch": 2857} {"train_loss": -25.107702255249023, "global_step": 237187, "epoch": 2857} {"train_loss": -24.863889694213867, "global_step": 237188, "epoch": 2857} {"train_loss": -24.526018142700195, "global_step": 237189, "epoch": 2857} {"train_loss": -24.514083862304688, "global_step": 237190, "epoch": 2857} {"train_loss": -24.832691192626953, "global_step": 237191, "epoch": 2857} {"train_loss": -24.842483520507812, "global_step": 237192, "epoch": 2857} {"train_loss": -25.059728622436523, "global_step": 237193, "epoch": 2857} {"train_loss": -24.5866756439209, "global_step": 237194, "epoch": 2857} {"train_loss": -24.81214714050293, "global_step": 237195, "epoch": 2857} {"train_loss": -24.703229904174805, "global_step": 237196, "epoch": 2857} {"train_loss": -24.644512176513672, "global_step": 237197, "epoch": 2857} {"train_loss": -25.015012741088867, "global_step": 237198, "epoch": 2857} {"train_loss": -24.705610275268555, "global_step": 237199, "epoch": 2857} {"train_loss": -24.87360382080078, "global_step": 237200, "epoch": 2857} {"train_loss": -24.476837158203125, "global_step": 237201, "epoch": 2857} {"train_loss": -25.090635299682617, "global_step": 237202, "epoch": 2857} {"train_loss": -25.06219482421875, "global_step": 237203, "epoch": 2857} {"train_loss": -24.692646026611328, "global_step": 237204, "epoch": 2857} {"train_loss": -25.063982009887695, "global_step": 237205, "epoch": 2857} {"train_loss": -25.213777542114258, "global_step": 237206, "epoch": 2857} {"train_loss": -24.7349853515625, "global_step": 237207, "epoch": 2857} {"train_loss": -24.80787467956543, "global_step": 237208, "epoch": 2857} {"train_loss": -24.672292709350586, "global_step": 237209, "epoch": 2857} {"train_loss": -24.9200496673584, "global_step": 237210, "epoch": 2857} {"train_loss": -24.56819725036621, "global_step": 237211, "epoch": 2857} {"train_loss": -24.647520065307617, "global_step": 237212, "epoch": 2857} {"train_loss": -24.70713934840926, "global_step": 237213, "epoch": 2857, "val_loss": 6701773.0} {"train_loss": -24.31954574584961, "global_step": 237214, "epoch": 2858} {"train_loss": -24.762046813964844, "global_step": 237215, "epoch": 2858} {"train_loss": -24.609373092651367, "global_step": 237216, "epoch": 2858} {"train_loss": -24.614164352416992, "global_step": 237217, "epoch": 2858} {"train_loss": -24.40774917602539, "global_step": 237218, "epoch": 2858} {"train_loss": -24.723285675048828, "global_step": 237219, "epoch": 2858} {"train_loss": -24.95564842224121, "global_step": 237220, "epoch": 2858} {"train_loss": -24.483983993530273, "global_step": 237221, "epoch": 2858} {"train_loss": -24.96649169921875, "global_step": 237222, "epoch": 2858} {"train_loss": -24.774673461914062, "global_step": 237223, "epoch": 2858} {"train_loss": -24.39478874206543, "global_step": 237224, "epoch": 2858} {"train_loss": -24.686643600463867, "global_step": 237225, "epoch": 2858} {"train_loss": -24.79706382751465, "global_step": 237226, "epoch": 2858} {"train_loss": -24.920522689819336, "global_step": 237227, "epoch": 2858} {"train_loss": -25.160932540893555, "global_step": 237228, "epoch": 2858} {"train_loss": -24.604211807250977, "global_step": 237229, "epoch": 2858} {"train_loss": -24.79865264892578, "global_step": 237230, "epoch": 2858} {"train_loss": -24.912317276000977, "global_step": 237231, "epoch": 2858} {"train_loss": -24.848661422729492, "global_step": 237232, "epoch": 2858} {"train_loss": -24.858991622924805, "global_step": 237233, "epoch": 2858} {"train_loss": -24.91370964050293, "global_step": 237234, "epoch": 2858} {"train_loss": -25.079254150390625, "global_step": 237235, "epoch": 2858} {"train_loss": -24.900236129760742, "global_step": 237236, "epoch": 2858} {"train_loss": -24.762649536132812, "global_step": 237237, "epoch": 2858} {"train_loss": -24.774290084838867, "global_step": 237238, "epoch": 2858} {"train_loss": -24.81167984008789, "global_step": 237239, "epoch": 2858} {"train_loss": -25.038572311401367, "global_step": 237240, "epoch": 2858} {"train_loss": -24.75834846496582, "global_step": 237241, "epoch": 2858} {"train_loss": -24.576396942138672, "global_step": 237242, "epoch": 2858} {"train_loss": -24.870014190673828, "global_step": 237243, "epoch": 2858} {"train_loss": -24.94277000427246, "global_step": 237244, "epoch": 2858} {"train_loss": -24.767770767211914, "global_step": 237245, "epoch": 2858} {"train_loss": -24.377965927124023, "global_step": 237246, "epoch": 2858} {"train_loss": -24.764657974243164, "global_step": 237247, "epoch": 2858} {"train_loss": -25.386863708496094, "global_step": 237248, "epoch": 2858} {"train_loss": -24.77192497253418, "global_step": 237249, "epoch": 2858} {"train_loss": -24.802581787109375, "global_step": 237250, "epoch": 2858} {"train_loss": -24.643756866455078, "global_step": 237251, "epoch": 2858} {"train_loss": -24.805377960205078, "global_step": 237252, "epoch": 2858} {"train_loss": -24.772794723510742, "global_step": 237253, "epoch": 2858} {"train_loss": -25.027708053588867, "global_step": 237254, "epoch": 2858} {"train_loss": -24.62833023071289, "global_step": 237255, "epoch": 2858} {"train_loss": -24.8402156829834, "global_step": 237256, "epoch": 2858} {"train_loss": -24.876691818237305, "global_step": 237257, "epoch": 2858} {"train_loss": -24.839834213256836, "global_step": 237258, "epoch": 2858} {"train_loss": -24.827083587646484, "global_step": 237259, "epoch": 2858} {"train_loss": -24.905019760131836, "global_step": 237260, "epoch": 2858} {"train_loss": -24.754907608032227, "global_step": 237261, "epoch": 2858} {"train_loss": -24.58625602722168, "global_step": 237262, "epoch": 2858} {"train_loss": -25.022390365600586, "global_step": 237263, "epoch": 2858} {"train_loss": -24.805513381958008, "global_step": 237264, "epoch": 2858} {"train_loss": -24.94295310974121, "global_step": 237265, "epoch": 2858} {"train_loss": -24.53388023376465, "global_step": 237266, "epoch": 2858} {"train_loss": -25.035917282104492, "global_step": 237267, "epoch": 2858} {"train_loss": -24.68362808227539, "global_step": 237268, "epoch": 2858} {"train_loss": -25.008275985717773, "global_step": 237269, "epoch": 2858} {"train_loss": -24.81134033203125, "global_step": 237270, "epoch": 2858} {"train_loss": -24.521711349487305, "global_step": 237271, "epoch": 2858} {"train_loss": -25.290950775146484, "global_step": 237272, "epoch": 2858} {"train_loss": -24.758071899414062, "global_step": 237273, "epoch": 2858} {"train_loss": -24.913543701171875, "global_step": 237274, "epoch": 2858} {"train_loss": -25.15407371520996, "global_step": 237275, "epoch": 2858} {"train_loss": -24.80614471435547, "global_step": 237276, "epoch": 2858} {"train_loss": -24.94005012512207, "global_step": 237277, "epoch": 2858} {"train_loss": -24.84402084350586, "global_step": 237278, "epoch": 2858} {"train_loss": -24.85430908203125, "global_step": 237279, "epoch": 2858} {"train_loss": -25.07661247253418, "global_step": 237280, "epoch": 2858} {"train_loss": -24.689910888671875, "global_step": 237281, "epoch": 2858} {"train_loss": -24.990108489990234, "global_step": 237282, "epoch": 2858} {"train_loss": -24.611684799194336, "global_step": 237283, "epoch": 2858} {"train_loss": -24.67596435546875, "global_step": 237284, "epoch": 2858} {"train_loss": -24.846830368041992, "global_step": 237285, "epoch": 2858} {"train_loss": -24.645065307617188, "global_step": 237286, "epoch": 2858} {"train_loss": -24.727481842041016, "global_step": 237287, "epoch": 2858} {"train_loss": -25.020790100097656, "global_step": 237288, "epoch": 2858} {"train_loss": -24.905176162719727, "global_step": 237289, "epoch": 2858} {"train_loss": -24.883878707885742, "global_step": 237290, "epoch": 2858} {"train_loss": -24.841949462890625, "global_step": 237291, "epoch": 2858} {"train_loss": -24.37227439880371, "global_step": 237292, "epoch": 2858} {"train_loss": -24.856157302856445, "global_step": 237293, "epoch": 2858} {"train_loss": -25.073266983032227, "global_step": 237294, "epoch": 2858} {"train_loss": -25.087299346923828, "global_step": 237295, "epoch": 2858} {"train_loss": -24.80178210246994, "global_step": 237296, "epoch": 2858, "val_loss": 6792566.0} {"train_loss": -24.6317195892334, "global_step": 237297, "epoch": 2859} {"train_loss": -24.242429733276367, "global_step": 237298, "epoch": 2859} {"train_loss": -24.5675048828125, "global_step": 237299, "epoch": 2859} {"train_loss": -24.128019332885742, "global_step": 237300, "epoch": 2859} {"train_loss": -24.51751708984375, "global_step": 237301, "epoch": 2859} {"train_loss": -24.29540252685547, "global_step": 237302, "epoch": 2859} {"train_loss": -23.962717056274414, "global_step": 237303, "epoch": 2859} {"train_loss": -24.28462028503418, "global_step": 237304, "epoch": 2859} {"train_loss": -24.418710708618164, "global_step": 237305, "epoch": 2859} {"train_loss": -24.291584014892578, "global_step": 237306, "epoch": 2859} {"train_loss": -24.655851364135742, "global_step": 237307, "epoch": 2859} {"train_loss": -24.712677001953125, "global_step": 237308, "epoch": 2859} {"train_loss": -24.89712142944336, "global_step": 237309, "epoch": 2859} {"train_loss": -24.4700870513916, "global_step": 237310, "epoch": 2859} {"train_loss": -24.851394653320312, "global_step": 237311, "epoch": 2859} {"train_loss": -24.930601119995117, "global_step": 237312, "epoch": 2859} {"train_loss": -24.48255729675293, "global_step": 237313, "epoch": 2859} {"train_loss": -24.387792587280273, "global_step": 237314, "epoch": 2859} {"train_loss": -25.11309814453125, "global_step": 237315, "epoch": 2859} {"train_loss": -24.851438522338867, "global_step": 237316, "epoch": 2859} {"train_loss": -24.720258712768555, "global_step": 237317, "epoch": 2859} {"train_loss": -24.553203582763672, "global_step": 237318, "epoch": 2859} {"train_loss": -24.721786499023438, "global_step": 237319, "epoch": 2859} {"train_loss": -24.8951473236084, "global_step": 237320, "epoch": 2859} {"train_loss": -24.760557174682617, "global_step": 237321, "epoch": 2859} {"train_loss": -24.595998764038086, "global_step": 237322, "epoch": 2859} {"train_loss": -24.32795524597168, "global_step": 237323, "epoch": 2859} {"train_loss": -25.3597354888916, "global_step": 237324, "epoch": 2859} {"train_loss": -24.774017333984375, "global_step": 237325, "epoch": 2859} {"train_loss": -24.76877212524414, "global_step": 237326, "epoch": 2859} {"train_loss": -24.959745407104492, "global_step": 237327, "epoch": 2859} {"train_loss": -24.715024948120117, "global_step": 237328, "epoch": 2859} {"train_loss": -24.918594360351562, "global_step": 237329, "epoch": 2859} {"train_loss": -24.839229583740234, "global_step": 237330, "epoch": 2859} {"train_loss": -24.947860717773438, "global_step": 237331, "epoch": 2859} {"train_loss": -24.967477798461914, "global_step": 237332, "epoch": 2859} {"train_loss": -24.856201171875, "global_step": 237333, "epoch": 2859} {"train_loss": -24.9097957611084, "global_step": 237334, "epoch": 2859} {"train_loss": -24.962974548339844, "global_step": 237335, "epoch": 2859} {"train_loss": -24.87961196899414, "global_step": 237336, "epoch": 2859} {"train_loss": -24.86495018005371, "global_step": 237337, "epoch": 2859} {"train_loss": -24.87468910217285, "global_step": 237338, "epoch": 2859} {"train_loss": -24.736242294311523, "global_step": 237339, "epoch": 2859} {"train_loss": -25.112314224243164, "global_step": 237340, "epoch": 2859} {"train_loss": -24.86789321899414, "global_step": 237341, "epoch": 2859} {"train_loss": -25.123708724975586, "global_step": 237342, "epoch": 2859} {"train_loss": -24.73978042602539, "global_step": 237343, "epoch": 2859} {"train_loss": -24.939111709594727, "global_step": 237344, "epoch": 2859} {"train_loss": -24.600543975830078, "global_step": 237345, "epoch": 2859} {"train_loss": -24.742509841918945, "global_step": 237346, "epoch": 2859} {"train_loss": -25.012283325195312, "global_step": 237347, "epoch": 2859} {"train_loss": -24.996423721313477, "global_step": 237348, "epoch": 2859} {"train_loss": -24.95722007751465, "global_step": 237349, "epoch": 2859} {"train_loss": -25.3004207611084, "global_step": 237350, "epoch": 2859} {"train_loss": -25.06165885925293, "global_step": 237351, "epoch": 2859} {"train_loss": -24.768667221069336, "global_step": 237352, "epoch": 2859} {"train_loss": -25.046056747436523, "global_step": 237353, "epoch": 2859} {"train_loss": -25.172658920288086, "global_step": 237354, "epoch": 2859} {"train_loss": -25.360605239868164, "global_step": 237355, "epoch": 2859} {"train_loss": -25.100521087646484, "global_step": 237356, "epoch": 2859} {"train_loss": -24.928979873657227, "global_step": 237357, "epoch": 2859} {"train_loss": -25.101333618164062, "global_step": 237358, "epoch": 2859} {"train_loss": -25.065336227416992, "global_step": 237359, "epoch": 2859} {"train_loss": -24.813980102539062, "global_step": 237360, "epoch": 2859} {"train_loss": -24.948360443115234, "global_step": 237361, "epoch": 2859} {"train_loss": -24.866682052612305, "global_step": 237362, "epoch": 2859} {"train_loss": -24.79622459411621, "global_step": 237363, "epoch": 2859} {"train_loss": -25.2281494140625, "global_step": 237364, "epoch": 2859} {"train_loss": -25.197561264038086, "global_step": 237365, "epoch": 2859} {"train_loss": -24.75213623046875, "global_step": 237366, "epoch": 2859} {"train_loss": -24.936073303222656, "global_step": 237367, "epoch": 2859} {"train_loss": -24.653654098510742, "global_step": 237368, "epoch": 2859} {"train_loss": -24.72560691833496, "global_step": 237369, "epoch": 2859} {"train_loss": -24.64893341064453, "global_step": 237370, "epoch": 2859} {"train_loss": -24.28156089782715, "global_step": 237371, "epoch": 2859} {"train_loss": -24.413190841674805, "global_step": 237372, "epoch": 2859} {"train_loss": -24.80988121032715, "global_step": 237373, "epoch": 2859} {"train_loss": -24.834524154663086, "global_step": 237374, "epoch": 2859} {"train_loss": -24.243385314941406, "global_step": 237375, "epoch": 2859} {"train_loss": -24.494516372680664, "global_step": 237376, "epoch": 2859} {"train_loss": -24.85152244567871, "global_step": 237377, "epoch": 2859} {"train_loss": -24.940208435058594, "global_step": 237378, "epoch": 2859} {"train_loss": -24.784958207463642, "global_step": 237379, "epoch": 2859, "val_loss": 6722317.0} {"train_loss": -24.432645797729492, "global_step": 237380, "epoch": 2860} {"train_loss": -24.46247673034668, "global_step": 237381, "epoch": 2860} {"train_loss": -23.972640991210938, "global_step": 237382, "epoch": 2860} {"train_loss": -24.19605827331543, "global_step": 237383, "epoch": 2860} {"train_loss": -23.83012580871582, "global_step": 237384, "epoch": 2860} {"train_loss": -24.167613983154297, "global_step": 237385, "epoch": 2860} {"train_loss": -24.4390926361084, "global_step": 237386, "epoch": 2860} {"train_loss": -24.329496383666992, "global_step": 237387, "epoch": 2860} {"train_loss": -24.468717575073242, "global_step": 237388, "epoch": 2860} {"train_loss": -24.569416046142578, "global_step": 237389, "epoch": 2860} {"train_loss": -24.196340560913086, "global_step": 237390, "epoch": 2860} {"train_loss": -24.57248306274414, "global_step": 237391, "epoch": 2860} {"train_loss": -24.452991485595703, "global_step": 237392, "epoch": 2860} {"train_loss": -24.49158477783203, "global_step": 237393, "epoch": 2860} {"train_loss": -24.32013511657715, "global_step": 237394, "epoch": 2860} {"train_loss": -24.397016525268555, "global_step": 237395, "epoch": 2860} {"train_loss": -24.39176368713379, "global_step": 237396, "epoch": 2860} {"train_loss": -24.40889549255371, "global_step": 237397, "epoch": 2860} {"train_loss": -24.725948333740234, "global_step": 237398, "epoch": 2860} {"train_loss": -24.311141967773438, "global_step": 237399, "epoch": 2860} {"train_loss": -24.775480270385742, "global_step": 237400, "epoch": 2860} {"train_loss": -24.256755828857422, "global_step": 237401, "epoch": 2860} {"train_loss": -24.799156188964844, "global_step": 237402, "epoch": 2860} {"train_loss": -24.664318084716797, "global_step": 237403, "epoch": 2860} {"train_loss": -24.615442276000977, "global_step": 237404, "epoch": 2860} {"train_loss": -24.731218338012695, "global_step": 237405, "epoch": 2860} {"train_loss": -24.675851821899414, "global_step": 237406, "epoch": 2860} {"train_loss": -24.880762100219727, "global_step": 237407, "epoch": 2860} {"train_loss": -24.664358139038086, "global_step": 237408, "epoch": 2860} {"train_loss": -24.79747200012207, "global_step": 237409, "epoch": 2860} {"train_loss": -24.710269927978516, "global_step": 237410, "epoch": 2860} {"train_loss": -24.378454208374023, "global_step": 237411, "epoch": 2860} {"train_loss": -25.001689910888672, "global_step": 237412, "epoch": 2860} {"train_loss": -25.23541831970215, "global_step": 237413, "epoch": 2860} {"train_loss": -24.8547420501709, "global_step": 237414, "epoch": 2860} {"train_loss": -24.919212341308594, "global_step": 237415, "epoch": 2860} {"train_loss": -24.64476776123047, "global_step": 237416, "epoch": 2860} {"train_loss": -25.100107192993164, "global_step": 237417, "epoch": 2860} {"train_loss": -25.03061294555664, "global_step": 237418, "epoch": 2860} {"train_loss": -24.923309326171875, "global_step": 237419, "epoch": 2860} {"train_loss": -25.08124351501465, "global_step": 237420, "epoch": 2860} {"train_loss": -25.05971336364746, "global_step": 237421, "epoch": 2860} {"train_loss": -24.577661514282227, "global_step": 237422, "epoch": 2860} {"train_loss": -24.67176628112793, "global_step": 237423, "epoch": 2860} {"train_loss": -25.054845809936523, "global_step": 237424, "epoch": 2860} {"train_loss": -24.804357528686523, "global_step": 237425, "epoch": 2860} {"train_loss": -24.972017288208008, "global_step": 237426, "epoch": 2860} {"train_loss": -24.835721969604492, "global_step": 237427, "epoch": 2860} {"train_loss": -24.861608505249023, "global_step": 237428, "epoch": 2860} {"train_loss": -24.96451187133789, "global_step": 237429, "epoch": 2860} {"train_loss": -24.998706817626953, "global_step": 237430, "epoch": 2860} {"train_loss": -24.352798461914062, "global_step": 237431, "epoch": 2860} {"train_loss": -24.617734909057617, "global_step": 237432, "epoch": 2860} {"train_loss": -24.80397605895996, "global_step": 237433, "epoch": 2860} {"train_loss": -24.554105758666992, "global_step": 237434, "epoch": 2860} {"train_loss": -24.74806785583496, "global_step": 237435, "epoch": 2860} {"train_loss": -24.74228858947754, "global_step": 237436, "epoch": 2860} {"train_loss": -25.081716537475586, "global_step": 237437, "epoch": 2860} {"train_loss": -24.699892044067383, "global_step": 237438, "epoch": 2860} {"train_loss": -24.963186264038086, "global_step": 237439, "epoch": 2860} {"train_loss": -24.84326171875, "global_step": 237440, "epoch": 2860} {"train_loss": -24.852170944213867, "global_step": 237441, "epoch": 2860} {"train_loss": -24.771535873413086, "global_step": 237442, "epoch": 2860} {"train_loss": -25.494306564331055, "global_step": 237443, "epoch": 2860} {"train_loss": -24.950864791870117, "global_step": 237444, "epoch": 2860} {"train_loss": -24.69936180114746, "global_step": 237445, "epoch": 2860} {"train_loss": -25.2419490814209, "global_step": 237446, "epoch": 2860} {"train_loss": -24.722875595092773, "global_step": 237447, "epoch": 2860} {"train_loss": -24.50589370727539, "global_step": 237448, "epoch": 2860} {"train_loss": -25.193008422851562, "global_step": 237449, "epoch": 2860} {"train_loss": -24.419513702392578, "global_step": 237450, "epoch": 2860} {"train_loss": -24.68141746520996, "global_step": 237451, "epoch": 2860} {"train_loss": -24.853809356689453, "global_step": 237452, "epoch": 2860} {"train_loss": -24.64750099182129, "global_step": 237453, "epoch": 2860} {"train_loss": -24.87148094177246, "global_step": 237454, "epoch": 2860} {"train_loss": -24.66799545288086, "global_step": 237455, "epoch": 2860} {"train_loss": -25.0880184173584, "global_step": 237456, "epoch": 2860} {"train_loss": -24.58055877685547, "global_step": 237457, "epoch": 2860} {"train_loss": -24.87079429626465, "global_step": 237458, "epoch": 2860} {"train_loss": -24.52303123474121, "global_step": 237459, "epoch": 2860} {"train_loss": -24.96497917175293, "global_step": 237460, "epoch": 2860} {"train_loss": -25.012378692626953, "global_step": 237461, "epoch": 2860} {"train_loss": -24.693934475082948, "global_step": 237462, "epoch": 2860, "val_loss": 6744811.0} {"train_loss": -23.47010040283203, "global_step": 237463, "epoch": 2861} {"train_loss": -24.466474533081055, "global_step": 237464, "epoch": 2861} {"train_loss": -24.03240394592285, "global_step": 237465, "epoch": 2861} {"train_loss": -23.48873519897461, "global_step": 237466, "epoch": 2861} {"train_loss": -24.550870895385742, "global_step": 237467, "epoch": 2861} {"train_loss": -24.24989128112793, "global_step": 237468, "epoch": 2861} {"train_loss": -24.097291946411133, "global_step": 237469, "epoch": 2861} {"train_loss": -24.64345932006836, "global_step": 237470, "epoch": 2861} {"train_loss": -24.299034118652344, "global_step": 237471, "epoch": 2861} {"train_loss": -24.386005401611328, "global_step": 237472, "epoch": 2861} {"train_loss": -24.17600440979004, "global_step": 237473, "epoch": 2861} {"train_loss": -24.437969207763672, "global_step": 237474, "epoch": 2861} {"train_loss": -24.55206298828125, "global_step": 237475, "epoch": 2861} {"train_loss": -24.71541404724121, "global_step": 237476, "epoch": 2861} {"train_loss": -24.624277114868164, "global_step": 237477, "epoch": 2861} {"train_loss": -24.754880905151367, "global_step": 237478, "epoch": 2861} {"train_loss": -24.737930297851562, "global_step": 237479, "epoch": 2861} {"train_loss": -24.462615966796875, "global_step": 237480, "epoch": 2861} {"train_loss": -25.009292602539062, "global_step": 237481, "epoch": 2861} {"train_loss": -24.56390953063965, "global_step": 237482, "epoch": 2861} {"train_loss": -24.68257713317871, "global_step": 237483, "epoch": 2861} {"train_loss": -24.494298934936523, "global_step": 237484, "epoch": 2861} {"train_loss": -24.91644859313965, "global_step": 237485, "epoch": 2861} {"train_loss": -24.655242919921875, "global_step": 237486, "epoch": 2861} {"train_loss": -24.828641891479492, "global_step": 237487, "epoch": 2861} {"train_loss": -24.728330612182617, "global_step": 237488, "epoch": 2861} {"train_loss": -24.88725471496582, "global_step": 237489, "epoch": 2861} {"train_loss": -24.808502197265625, "global_step": 237490, "epoch": 2861} {"train_loss": -24.93716812133789, "global_step": 237491, "epoch": 2861} {"train_loss": -25.140348434448242, "global_step": 237492, "epoch": 2861} {"train_loss": -24.664546966552734, "global_step": 237493, "epoch": 2861} {"train_loss": -25.0695743560791, "global_step": 237494, "epoch": 2861} {"train_loss": -24.551002502441406, "global_step": 237495, "epoch": 2861} {"train_loss": -24.919694900512695, "global_step": 237496, "epoch": 2861} {"train_loss": -25.14015007019043, "global_step": 237497, "epoch": 2861} {"train_loss": -25.108572006225586, "global_step": 237498, "epoch": 2861} {"train_loss": -24.73634910583496, "global_step": 237499, "epoch": 2861} {"train_loss": -24.95144271850586, "global_step": 237500, "epoch": 2861} {"train_loss": -25.195655822753906, "global_step": 237501, "epoch": 2861} {"train_loss": -25.084440231323242, "global_step": 237502, "epoch": 2861} {"train_loss": -24.98063850402832, "global_step": 237503, "epoch": 2861} {"train_loss": -25.146957397460938, "global_step": 237504, "epoch": 2861} {"train_loss": -24.63230323791504, "global_step": 237505, "epoch": 2861} {"train_loss": -24.805383682250977, "global_step": 237506, "epoch": 2861} {"train_loss": -24.570571899414062, "global_step": 237507, "epoch": 2861} {"train_loss": -24.784854888916016, "global_step": 237508, "epoch": 2861} {"train_loss": -24.785694122314453, "global_step": 237509, "epoch": 2861} {"train_loss": -24.837068557739258, "global_step": 237510, "epoch": 2861} {"train_loss": -24.597999572753906, "global_step": 237511, "epoch": 2861} {"train_loss": -25.418241500854492, "global_step": 237512, "epoch": 2861} {"train_loss": -24.56330680847168, "global_step": 237513, "epoch": 2861} {"train_loss": -24.631210327148438, "global_step": 237514, "epoch": 2861} {"train_loss": -24.836118698120117, "global_step": 237515, "epoch": 2861} {"train_loss": -24.482013702392578, "global_step": 237516, "epoch": 2861} {"train_loss": -24.28877067565918, "global_step": 237517, "epoch": 2861} {"train_loss": -24.75555992126465, "global_step": 237518, "epoch": 2861} {"train_loss": -24.86798095703125, "global_step": 237519, "epoch": 2861} {"train_loss": -25.19289207458496, "global_step": 237520, "epoch": 2861} {"train_loss": -25.091625213623047, "global_step": 237521, "epoch": 2861} {"train_loss": -25.304439544677734, "global_step": 237522, "epoch": 2861} {"train_loss": -25.103214263916016, "global_step": 237523, "epoch": 2861} {"train_loss": -25.046436309814453, "global_step": 237524, "epoch": 2861} {"train_loss": -24.82465171813965, "global_step": 237525, "epoch": 2861} {"train_loss": -24.845853805541992, "global_step": 237526, "epoch": 2861} {"train_loss": -25.05341148376465, "global_step": 237527, "epoch": 2861} {"train_loss": -25.140460968017578, "global_step": 237528, "epoch": 2861} {"train_loss": -25.04979133605957, "global_step": 237529, "epoch": 2861} {"train_loss": -24.691442489624023, "global_step": 237530, "epoch": 2861} {"train_loss": -25.265640258789062, "global_step": 237531, "epoch": 2861} {"train_loss": -24.967838287353516, "global_step": 237532, "epoch": 2861} {"train_loss": -24.600812911987305, "global_step": 237533, "epoch": 2861} {"train_loss": -25.099157333374023, "global_step": 237534, "epoch": 2861} {"train_loss": -25.208114624023438, "global_step": 237535, "epoch": 2861} {"train_loss": -24.89942741394043, "global_step": 237536, "epoch": 2861} {"train_loss": -24.678024291992188, "global_step": 237537, "epoch": 2861} {"train_loss": -25.00026512145996, "global_step": 237538, "epoch": 2861} {"train_loss": -25.02750015258789, "global_step": 237539, "epoch": 2861} {"train_loss": -24.962444305419922, "global_step": 237540, "epoch": 2861} {"train_loss": -24.898956298828125, "global_step": 237541, "epoch": 2861} {"train_loss": -24.852251052856445, "global_step": 237542, "epoch": 2861} {"train_loss": -24.667715072631836, "global_step": 237543, "epoch": 2861} {"train_loss": -24.505521774291992, "global_step": 237544, "epoch": 2861} {"train_loss": -24.760063102446406, "global_step": 237545, "epoch": 2861, "val_loss": 6784185.5} {"train_loss": -24.681976318359375, "global_step": 237546, "epoch": 2862} {"train_loss": -24.650043487548828, "global_step": 237547, "epoch": 2862} {"train_loss": -24.49141502380371, "global_step": 237548, "epoch": 2862} {"train_loss": -24.691625595092773, "global_step": 237549, "epoch": 2862} {"train_loss": -24.376060485839844, "global_step": 237550, "epoch": 2862} {"train_loss": -24.55974769592285, "global_step": 237551, "epoch": 2862} {"train_loss": -24.569690704345703, "global_step": 237552, "epoch": 2862} {"train_loss": -24.581527709960938, "global_step": 237553, "epoch": 2862} {"train_loss": -24.54001808166504, "global_step": 237554, "epoch": 2862} {"train_loss": -24.538585662841797, "global_step": 237555, "epoch": 2862} {"train_loss": -24.692007064819336, "global_step": 237556, "epoch": 2862} {"train_loss": -24.630008697509766, "global_step": 237557, "epoch": 2862} {"train_loss": -24.618499755859375, "global_step": 237558, "epoch": 2862} {"train_loss": -25.10328483581543, "global_step": 237559, "epoch": 2862} {"train_loss": -24.895029067993164, "global_step": 237560, "epoch": 2862} {"train_loss": -25.288944244384766, "global_step": 237561, "epoch": 2862} {"train_loss": -24.91267204284668, "global_step": 237562, "epoch": 2862} {"train_loss": -24.791244506835938, "global_step": 237563, "epoch": 2862} {"train_loss": -24.53795051574707, "global_step": 237564, "epoch": 2862} {"train_loss": -25.317079544067383, "global_step": 237565, "epoch": 2862} {"train_loss": -25.049814224243164, "global_step": 237566, "epoch": 2862} {"train_loss": -24.14450454711914, "global_step": 237567, "epoch": 2862} {"train_loss": -24.669946670532227, "global_step": 237568, "epoch": 2862} {"train_loss": -24.81906509399414, "global_step": 237569, "epoch": 2862} {"train_loss": -24.840709686279297, "global_step": 237570, "epoch": 2862} {"train_loss": -24.812612533569336, "global_step": 237571, "epoch": 2862} {"train_loss": -24.7000789642334, "global_step": 237572, "epoch": 2862} {"train_loss": -24.640127182006836, "global_step": 237573, "epoch": 2862} {"train_loss": -24.470035552978516, "global_step": 237574, "epoch": 2862} {"train_loss": -25.38662338256836, "global_step": 237575, "epoch": 2862} {"train_loss": -24.853656768798828, "global_step": 237576, "epoch": 2862} {"train_loss": -24.62403106689453, "global_step": 237577, "epoch": 2862} {"train_loss": -24.550127029418945, "global_step": 237578, "epoch": 2862} {"train_loss": -24.645233154296875, "global_step": 237579, "epoch": 2862} {"train_loss": -24.27492904663086, "global_step": 237580, "epoch": 2862} {"train_loss": -24.801008224487305, "global_step": 237581, "epoch": 2862} {"train_loss": -25.039888381958008, "global_step": 237582, "epoch": 2862} {"train_loss": -25.36467742919922, "global_step": 237583, "epoch": 2862} {"train_loss": -24.792516708374023, "global_step": 237584, "epoch": 2862} {"train_loss": -25.04288673400879, "global_step": 237585, "epoch": 2862} {"train_loss": -25.007741928100586, "global_step": 237586, "epoch": 2862} {"train_loss": -24.870664596557617, "global_step": 237587, "epoch": 2862} {"train_loss": -24.7076473236084, "global_step": 237588, "epoch": 2862} {"train_loss": -24.986408233642578, "global_step": 237589, "epoch": 2862} {"train_loss": -24.812604904174805, "global_step": 237590, "epoch": 2862} {"train_loss": -24.910703659057617, "global_step": 237591, "epoch": 2862} {"train_loss": -24.761077880859375, "global_step": 237592, "epoch": 2862} {"train_loss": -25.104602813720703, "global_step": 237593, "epoch": 2862} {"train_loss": -24.881868362426758, "global_step": 237594, "epoch": 2862} {"train_loss": -25.08023452758789, "global_step": 237595, "epoch": 2862} {"train_loss": -24.682706832885742, "global_step": 237596, "epoch": 2862} {"train_loss": -24.92007827758789, "global_step": 237597, "epoch": 2862} {"train_loss": -24.447118759155273, "global_step": 237598, "epoch": 2862} {"train_loss": -24.94974136352539, "global_step": 237599, "epoch": 2862} {"train_loss": -24.466856002807617, "global_step": 237600, "epoch": 2862} {"train_loss": -24.647863388061523, "global_step": 237601, "epoch": 2862} {"train_loss": -24.980405807495117, "global_step": 237602, "epoch": 2862} {"train_loss": -24.702892303466797, "global_step": 237603, "epoch": 2862} {"train_loss": -24.918071746826172, "global_step": 237604, "epoch": 2862} {"train_loss": -24.780292510986328, "global_step": 237605, "epoch": 2862} {"train_loss": -24.623403549194336, "global_step": 237606, "epoch": 2862} {"train_loss": -24.522323608398438, "global_step": 237607, "epoch": 2862} {"train_loss": -24.677038192749023, "global_step": 237608, "epoch": 2862} {"train_loss": -24.49690818786621, "global_step": 237609, "epoch": 2862} {"train_loss": -24.807323455810547, "global_step": 237610, "epoch": 2862} {"train_loss": -24.75843620300293, "global_step": 237611, "epoch": 2862} {"train_loss": -24.65034294128418, "global_step": 237612, "epoch": 2862} {"train_loss": -24.747655868530273, "global_step": 237613, "epoch": 2862} {"train_loss": -24.86223793029785, "global_step": 237614, "epoch": 2862} {"train_loss": -24.703577041625977, "global_step": 237615, "epoch": 2862} {"train_loss": -24.829166412353516, "global_step": 237616, "epoch": 2862} {"train_loss": -24.684646606445312, "global_step": 237617, "epoch": 2862} {"train_loss": -24.940397262573242, "global_step": 237618, "epoch": 2862} {"train_loss": -24.49800682067871, "global_step": 237619, "epoch": 2862} {"train_loss": -24.616291046142578, "global_step": 237620, "epoch": 2862} {"train_loss": -24.585865020751953, "global_step": 237621, "epoch": 2862} {"train_loss": -25.196460723876953, "global_step": 237622, "epoch": 2862} {"train_loss": -25.219411849975586, "global_step": 237623, "epoch": 2862} {"train_loss": -24.985971450805664, "global_step": 237624, "epoch": 2862} {"train_loss": -24.66353416442871, "global_step": 237625, "epoch": 2862} {"train_loss": -25.07686424255371, "global_step": 237626, "epoch": 2862} {"train_loss": -25.05268669128418, "global_step": 237627, "epoch": 2862} {"train_loss": -24.769566478499446, "global_step": 237628, "epoch": 2862, "val_loss": 6675050.0} {"train_loss": -24.770618438720703, "global_step": 237629, "epoch": 2863} {"train_loss": -24.024215698242188, "global_step": 237630, "epoch": 2863} {"train_loss": -24.68328285217285, "global_step": 237631, "epoch": 2863} {"train_loss": -24.47314453125, "global_step": 237632, "epoch": 2863} {"train_loss": -24.629714965820312, "global_step": 237633, "epoch": 2863} {"train_loss": -24.569669723510742, "global_step": 237634, "epoch": 2863} {"train_loss": -24.671451568603516, "global_step": 237635, "epoch": 2863} {"train_loss": -24.400970458984375, "global_step": 237636, "epoch": 2863} {"train_loss": -24.230398178100586, "global_step": 237637, "epoch": 2863} {"train_loss": -24.63149070739746, "global_step": 237638, "epoch": 2863} {"train_loss": -24.071008682250977, "global_step": 237639, "epoch": 2863} {"train_loss": -24.795717239379883, "global_step": 237640, "epoch": 2863} {"train_loss": -24.728897094726562, "global_step": 237641, "epoch": 2863} {"train_loss": -24.328601837158203, "global_step": 237642, "epoch": 2863} {"train_loss": -24.41224479675293, "global_step": 237643, "epoch": 2863} {"train_loss": -24.562955856323242, "global_step": 237644, "epoch": 2863} {"train_loss": -24.413211822509766, "global_step": 237645, "epoch": 2863} {"train_loss": -24.470518112182617, "global_step": 237646, "epoch": 2863} {"train_loss": -24.699628829956055, "global_step": 237647, "epoch": 2863} {"train_loss": -24.655691146850586, "global_step": 237648, "epoch": 2863} {"train_loss": -24.50439453125, "global_step": 237649, "epoch": 2863} {"train_loss": -24.958637237548828, "global_step": 237650, "epoch": 2863} {"train_loss": -24.882221221923828, "global_step": 237651, "epoch": 2863} {"train_loss": -24.90159034729004, "global_step": 237652, "epoch": 2863} {"train_loss": -24.84113121032715, "global_step": 237653, "epoch": 2863} {"train_loss": -25.020883560180664, "global_step": 237654, "epoch": 2863} {"train_loss": -24.8941707611084, "global_step": 237655, "epoch": 2863} {"train_loss": -25.120817184448242, "global_step": 237656, "epoch": 2863} {"train_loss": -25.044559478759766, "global_step": 237657, "epoch": 2863} {"train_loss": -25.09661102294922, "global_step": 237658, "epoch": 2863} {"train_loss": -24.5507755279541, "global_step": 237659, "epoch": 2863} {"train_loss": -24.758853912353516, "global_step": 237660, "epoch": 2863} {"train_loss": -25.043771743774414, "global_step": 237661, "epoch": 2863} {"train_loss": -25.10818862915039, "global_step": 237662, "epoch": 2863} {"train_loss": -24.691951751708984, "global_step": 237663, "epoch": 2863} {"train_loss": -25.21721839904785, "global_step": 237664, "epoch": 2863} {"train_loss": -24.980825424194336, "global_step": 237665, "epoch": 2863} {"train_loss": -24.843692779541016, "global_step": 237666, "epoch": 2863} {"train_loss": -24.663429260253906, "global_step": 237667, "epoch": 2863} {"train_loss": -25.459959030151367, "global_step": 237668, "epoch": 2863} {"train_loss": -24.665624618530273, "global_step": 237669, "epoch": 2863} {"train_loss": -24.593481063842773, "global_step": 237670, "epoch": 2863} {"train_loss": -25.114120483398438, "global_step": 237671, "epoch": 2863} {"train_loss": -24.823488235473633, "global_step": 237672, "epoch": 2863} {"train_loss": -24.9444637298584, "global_step": 237673, "epoch": 2863} {"train_loss": -25.054014205932617, "global_step": 237674, "epoch": 2863} {"train_loss": -24.92336082458496, "global_step": 237675, "epoch": 2863} {"train_loss": -24.555723190307617, "global_step": 237676, "epoch": 2863} {"train_loss": -24.705886840820312, "global_step": 237677, "epoch": 2863} {"train_loss": -24.636089324951172, "global_step": 237678, "epoch": 2863} {"train_loss": -24.895097732543945, "global_step": 237679, "epoch": 2863} {"train_loss": -25.128250122070312, "global_step": 237680, "epoch": 2863} {"train_loss": -24.796146392822266, "global_step": 237681, "epoch": 2863} {"train_loss": -24.924413681030273, "global_step": 237682, "epoch": 2863} {"train_loss": -24.726158142089844, "global_step": 237683, "epoch": 2863} {"train_loss": -24.97757339477539, "global_step": 237684, "epoch": 2863} {"train_loss": -24.719024658203125, "global_step": 237685, "epoch": 2863} {"train_loss": -24.92405128479004, "global_step": 237686, "epoch": 2863} {"train_loss": -25.072168350219727, "global_step": 237687, "epoch": 2863} {"train_loss": -24.924312591552734, "global_step": 237688, "epoch": 2863} {"train_loss": -24.88080406188965, "global_step": 237689, "epoch": 2863} {"train_loss": -24.821901321411133, "global_step": 237690, "epoch": 2863} {"train_loss": -25.004114151000977, "global_step": 237691, "epoch": 2863} {"train_loss": -25.29996109008789, "global_step": 237692, "epoch": 2863} {"train_loss": -24.932050704956055, "global_step": 237693, "epoch": 2863} {"train_loss": -25.034177780151367, "global_step": 237694, "epoch": 2863} {"train_loss": -25.160812377929688, "global_step": 237695, "epoch": 2863} {"train_loss": -24.724441528320312, "global_step": 237696, "epoch": 2863} {"train_loss": -24.714191436767578, "global_step": 237697, "epoch": 2863} {"train_loss": -24.75913429260254, "global_step": 237698, "epoch": 2863} {"train_loss": -24.572385787963867, "global_step": 237699, "epoch": 2863} {"train_loss": -24.864212036132812, "global_step": 237700, "epoch": 2863} {"train_loss": -24.943326950073242, "global_step": 237701, "epoch": 2863} {"train_loss": -24.883329391479492, "global_step": 237702, "epoch": 2863} {"train_loss": -24.816564559936523, "global_step": 237703, "epoch": 2863} {"train_loss": -25.322124481201172, "global_step": 237704, "epoch": 2863} {"train_loss": -24.743324279785156, "global_step": 237705, "epoch": 2863} {"train_loss": -25.093170166015625, "global_step": 237706, "epoch": 2863} {"train_loss": -24.941137313842773, "global_step": 237707, "epoch": 2863} {"train_loss": -24.9907283782959, "global_step": 237708, "epoch": 2863} {"train_loss": -25.043161392211914, "global_step": 237709, "epoch": 2863} {"train_loss": -24.851728439331055, "global_step": 237710, "epoch": 2863} {"train_loss": -24.812297085681593, "global_step": 237711, "epoch": 2863, "val_loss": 6974322.0} {"train_loss": -24.85489845275879, "global_step": 237712, "epoch": 2864} {"train_loss": -24.327293395996094, "global_step": 237713, "epoch": 2864} {"train_loss": -24.35460662841797, "global_step": 237714, "epoch": 2864} {"train_loss": -24.454360961914062, "global_step": 237715, "epoch": 2864} {"train_loss": -25.054609298706055, "global_step": 237716, "epoch": 2864} {"train_loss": -24.574615478515625, "global_step": 237717, "epoch": 2864} {"train_loss": -24.35773468017578, "global_step": 237718, "epoch": 2864} {"train_loss": -24.748388290405273, "global_step": 237719, "epoch": 2864} {"train_loss": -24.775339126586914, "global_step": 237720, "epoch": 2864} {"train_loss": -24.763412475585938, "global_step": 237721, "epoch": 2864} {"train_loss": -24.96119499206543, "global_step": 237722, "epoch": 2864} {"train_loss": -25.08490562438965, "global_step": 237723, "epoch": 2864} {"train_loss": -24.837308883666992, "global_step": 237724, "epoch": 2864} {"train_loss": -24.729820251464844, "global_step": 237725, "epoch": 2864} {"train_loss": -24.576210021972656, "global_step": 237726, "epoch": 2864} {"train_loss": -24.663305282592773, "global_step": 237727, "epoch": 2864} {"train_loss": -24.66648292541504, "global_step": 237728, "epoch": 2864} {"train_loss": -24.72353172302246, "global_step": 237729, "epoch": 2864} {"train_loss": -24.87088394165039, "global_step": 237730, "epoch": 2864} {"train_loss": -24.820894241333008, "global_step": 237731, "epoch": 2864} {"train_loss": -24.700742721557617, "global_step": 237732, "epoch": 2864} {"train_loss": -25.088560104370117, "global_step": 237733, "epoch": 2864} {"train_loss": -25.293453216552734, "global_step": 237734, "epoch": 2864} {"train_loss": -24.89796257019043, "global_step": 237735, "epoch": 2864} {"train_loss": -24.945898056030273, "global_step": 237736, "epoch": 2864} {"train_loss": -24.977880477905273, "global_step": 237737, "epoch": 2864} {"train_loss": -24.64191246032715, "global_step": 237738, "epoch": 2864} {"train_loss": -24.57355308532715, "global_step": 237739, "epoch": 2864} {"train_loss": -24.613033294677734, "global_step": 237740, "epoch": 2864} {"train_loss": -24.89813804626465, "global_step": 237741, "epoch": 2864} {"train_loss": -24.935869216918945, "global_step": 237742, "epoch": 2864} {"train_loss": -25.237735748291016, "global_step": 237743, "epoch": 2864} {"train_loss": -25.130125045776367, "global_step": 237744, "epoch": 2864} {"train_loss": -25.021997451782227, "global_step": 237745, "epoch": 2864} {"train_loss": -25.02372169494629, "global_step": 237746, "epoch": 2864} {"train_loss": -25.039762496948242, "global_step": 237747, "epoch": 2864} {"train_loss": -24.63936424255371, "global_step": 237748, "epoch": 2864} {"train_loss": -24.851099014282227, "global_step": 237749, "epoch": 2864} {"train_loss": -25.106098175048828, "global_step": 237750, "epoch": 2864} {"train_loss": -24.817081451416016, "global_step": 237751, "epoch": 2864} {"train_loss": -25.17059898376465, "global_step": 237752, "epoch": 2864} {"train_loss": -24.556669235229492, "global_step": 237753, "epoch": 2864} {"train_loss": -24.985620498657227, "global_step": 237754, "epoch": 2864} {"train_loss": -24.661203384399414, "global_step": 237755, "epoch": 2864} {"train_loss": -25.018192291259766, "global_step": 237756, "epoch": 2864} {"train_loss": -25.001184463500977, "global_step": 237757, "epoch": 2864} {"train_loss": -24.697465896606445, "global_step": 237758, "epoch": 2864} {"train_loss": -24.98605728149414, "global_step": 237759, "epoch": 2864} {"train_loss": -24.872949600219727, "global_step": 237760, "epoch": 2864} {"train_loss": -24.74689292907715, "global_step": 237761, "epoch": 2864} {"train_loss": -25.04871940612793, "global_step": 237762, "epoch": 2864} {"train_loss": -25.012685775756836, "global_step": 237763, "epoch": 2864} {"train_loss": -24.8287410736084, "global_step": 237764, "epoch": 2864} {"train_loss": -25.232284545898438, "global_step": 237765, "epoch": 2864} {"train_loss": -24.818729400634766, "global_step": 237766, "epoch": 2864} {"train_loss": -24.742691040039062, "global_step": 237767, "epoch": 2864} {"train_loss": -24.49022102355957, "global_step": 237768, "epoch": 2864} {"train_loss": -24.824857711791992, "global_step": 237769, "epoch": 2864} {"train_loss": -24.91108512878418, "global_step": 237770, "epoch": 2864} {"train_loss": -24.796886444091797, "global_step": 237771, "epoch": 2864} {"train_loss": -25.1854305267334, "global_step": 237772, "epoch": 2864} {"train_loss": -24.423643112182617, "global_step": 237773, "epoch": 2864} {"train_loss": -24.66980743408203, "global_step": 237774, "epoch": 2864} {"train_loss": -24.608505249023438, "global_step": 237775, "epoch": 2864} {"train_loss": -24.245243072509766, "global_step": 237776, "epoch": 2864} {"train_loss": -24.735666275024414, "global_step": 237777, "epoch": 2864} {"train_loss": -24.959009170532227, "global_step": 237778, "epoch": 2864} {"train_loss": -24.25532341003418, "global_step": 237779, "epoch": 2864} {"train_loss": -24.424697875976562, "global_step": 237780, "epoch": 2864} {"train_loss": -24.0046443939209, "global_step": 237781, "epoch": 2864} {"train_loss": -24.93067169189453, "global_step": 237782, "epoch": 2864} {"train_loss": -24.412012100219727, "global_step": 237783, "epoch": 2864} {"train_loss": -24.607168197631836, "global_step": 237784, "epoch": 2864} {"train_loss": -24.391122817993164, "global_step": 237785, "epoch": 2864} {"train_loss": -24.666309356689453, "global_step": 237786, "epoch": 2864} {"train_loss": -24.711347579956055, "global_step": 237787, "epoch": 2864} {"train_loss": -24.64154624938965, "global_step": 237788, "epoch": 2864} {"train_loss": -25.117963790893555, "global_step": 237789, "epoch": 2864} {"train_loss": -24.41482162475586, "global_step": 237790, "epoch": 2864} {"train_loss": -24.76715660095215, "global_step": 237791, "epoch": 2864} {"train_loss": -24.555063247680664, "global_step": 237792, "epoch": 2864} {"train_loss": -24.66912269592285, "global_step": 237793, "epoch": 2864} {"train_loss": -24.769161660987212, "global_step": 237794, "epoch": 2864, "val_loss": 6932002.5} {"train_loss": -23.904943466186523, "global_step": 237795, "epoch": 2865} {"train_loss": -23.90480613708496, "global_step": 237796, "epoch": 2865} {"train_loss": -24.11128807067871, "global_step": 237797, "epoch": 2865} {"train_loss": -23.888484954833984, "global_step": 237798, "epoch": 2865} {"train_loss": -24.275463104248047, "global_step": 237799, "epoch": 2865} {"train_loss": -24.472013473510742, "global_step": 237800, "epoch": 2865} {"train_loss": -24.33733367919922, "global_step": 237801, "epoch": 2865} {"train_loss": -24.845478057861328, "global_step": 237802, "epoch": 2865} {"train_loss": -24.779754638671875, "global_step": 237803, "epoch": 2865} {"train_loss": -24.296735763549805, "global_step": 237804, "epoch": 2865} {"train_loss": -24.33827781677246, "global_step": 237805, "epoch": 2865} {"train_loss": -24.640901565551758, "global_step": 237806, "epoch": 2865} {"train_loss": -24.59233856201172, "global_step": 237807, "epoch": 2865} {"train_loss": -24.75505256652832, "global_step": 237808, "epoch": 2865} {"train_loss": -24.500642776489258, "global_step": 237809, "epoch": 2865} {"train_loss": -25.025436401367188, "global_step": 237810, "epoch": 2865} {"train_loss": -24.371572494506836, "global_step": 237811, "epoch": 2865} {"train_loss": -24.810462951660156, "global_step": 237812, "epoch": 2865} {"train_loss": -24.691936492919922, "global_step": 237813, "epoch": 2865} {"train_loss": -24.845346450805664, "global_step": 237814, "epoch": 2865} {"train_loss": -24.570802688598633, "global_step": 237815, "epoch": 2865} {"train_loss": -24.759977340698242, "global_step": 237816, "epoch": 2865} {"train_loss": -24.933120727539062, "global_step": 237817, "epoch": 2865} {"train_loss": -24.953367233276367, "global_step": 237818, "epoch": 2865} {"train_loss": -25.175125122070312, "global_step": 237819, "epoch": 2865} {"train_loss": -24.573144912719727, "global_step": 237820, "epoch": 2865} {"train_loss": -24.972440719604492, "global_step": 237821, "epoch": 2865} {"train_loss": -24.85708999633789, "global_step": 237822, "epoch": 2865} {"train_loss": -25.236608505249023, "global_step": 237823, "epoch": 2865} {"train_loss": -24.97129249572754, "global_step": 237824, "epoch": 2865} {"train_loss": -24.733755111694336, "global_step": 237825, "epoch": 2865} {"train_loss": -25.01687240600586, "global_step": 237826, "epoch": 2865} {"train_loss": -25.213605880737305, "global_step": 237827, "epoch": 2865} {"train_loss": -25.09405517578125, "global_step": 237828, "epoch": 2865} {"train_loss": -24.835756301879883, "global_step": 237829, "epoch": 2865} {"train_loss": -25.07821273803711, "global_step": 237830, "epoch": 2865} {"train_loss": -24.948986053466797, "global_step": 237831, "epoch": 2865} {"train_loss": -24.928312301635742, "global_step": 237832, "epoch": 2865} {"train_loss": -24.675113677978516, "global_step": 237833, "epoch": 2865} {"train_loss": -25.402307510375977, "global_step": 237834, "epoch": 2865} {"train_loss": -24.68560791015625, "global_step": 237835, "epoch": 2865} {"train_loss": -25.1589412689209, "global_step": 237836, "epoch": 2865} {"train_loss": -24.97286033630371, "global_step": 237837, "epoch": 2865} {"train_loss": -24.91350555419922, "global_step": 237838, "epoch": 2865} {"train_loss": -25.021589279174805, "global_step": 237839, "epoch": 2865} {"train_loss": -24.9206600189209, "global_step": 237840, "epoch": 2865} {"train_loss": -24.582138061523438, "global_step": 237841, "epoch": 2865} {"train_loss": -24.907012939453125, "global_step": 237842, "epoch": 2865} {"train_loss": -24.64133644104004, "global_step": 237843, "epoch": 2865} {"train_loss": -24.74616241455078, "global_step": 237844, "epoch": 2865} {"train_loss": -24.44561195373535, "global_step": 237845, "epoch": 2865} {"train_loss": -24.335262298583984, "global_step": 237846, "epoch": 2865} {"train_loss": -24.468128204345703, "global_step": 237847, "epoch": 2865} {"train_loss": -24.72416877746582, "global_step": 237848, "epoch": 2865} {"train_loss": -24.806921005249023, "global_step": 237849, "epoch": 2865} {"train_loss": -24.558988571166992, "global_step": 237850, "epoch": 2865} {"train_loss": -24.120962142944336, "global_step": 237851, "epoch": 2865} {"train_loss": -24.600942611694336, "global_step": 237852, "epoch": 2865} {"train_loss": -24.971532821655273, "global_step": 237853, "epoch": 2865} {"train_loss": -24.975553512573242, "global_step": 237854, "epoch": 2865} {"train_loss": -24.638015747070312, "global_step": 237855, "epoch": 2865} {"train_loss": -24.941835403442383, "global_step": 237856, "epoch": 2865} {"train_loss": -24.656875610351562, "global_step": 237857, "epoch": 2865} {"train_loss": -24.559886932373047, "global_step": 237858, "epoch": 2865} {"train_loss": -24.594892501831055, "global_step": 237859, "epoch": 2865} {"train_loss": -24.89067840576172, "global_step": 237860, "epoch": 2865} {"train_loss": -25.110851287841797, "global_step": 237861, "epoch": 2865} {"train_loss": -25.02741813659668, "global_step": 237862, "epoch": 2865} {"train_loss": -24.712614059448242, "global_step": 237863, "epoch": 2865} {"train_loss": -24.545734405517578, "global_step": 237864, "epoch": 2865} {"train_loss": -25.061216354370117, "global_step": 237865, "epoch": 2865} {"train_loss": -24.458627700805664, "global_step": 237866, "epoch": 2865} {"train_loss": -24.589216232299805, "global_step": 237867, "epoch": 2865} {"train_loss": -24.947410583496094, "global_step": 237868, "epoch": 2865} {"train_loss": -25.127471923828125, "global_step": 237869, "epoch": 2865} {"train_loss": -25.08538246154785, "global_step": 237870, "epoch": 2865} {"train_loss": -25.156564712524414, "global_step": 237871, "epoch": 2865} {"train_loss": -24.83039665222168, "global_step": 237872, "epoch": 2865} {"train_loss": -24.97258186340332, "global_step": 237873, "epoch": 2865} {"train_loss": -25.19614601135254, "global_step": 237874, "epoch": 2865} {"train_loss": -25.056198120117188, "global_step": 237875, "epoch": 2865} {"train_loss": -24.843246459960938, "global_step": 237876, "epoch": 2865} {"train_loss": -24.744421143129646, "global_step": 237877, "epoch": 2865, "val_loss": 6776038.5} {"train_loss": -24.533437728881836, "global_step": 237878, "epoch": 2866} {"train_loss": -24.375843048095703, "global_step": 237879, "epoch": 2866} {"train_loss": -24.360593795776367, "global_step": 237880, "epoch": 2866} {"train_loss": -24.613162994384766, "global_step": 237881, "epoch": 2866} {"train_loss": -25.2237606048584, "global_step": 237882, "epoch": 2866} {"train_loss": -24.818992614746094, "global_step": 237883, "epoch": 2866} {"train_loss": -24.31814193725586, "global_step": 237884, "epoch": 2866} {"train_loss": -24.42828941345215, "global_step": 237885, "epoch": 2866} {"train_loss": -24.58101463317871, "global_step": 237886, "epoch": 2866} {"train_loss": -25.14196014404297, "global_step": 237887, "epoch": 2866} {"train_loss": -24.29392433166504, "global_step": 237888, "epoch": 2866} {"train_loss": -24.90167236328125, "global_step": 237889, "epoch": 2866} {"train_loss": -24.79304313659668, "global_step": 237890, "epoch": 2866} {"train_loss": -24.42770767211914, "global_step": 237891, "epoch": 2866} {"train_loss": -24.402481079101562, "global_step": 237892, "epoch": 2866} {"train_loss": -24.7578067779541, "global_step": 237893, "epoch": 2866} {"train_loss": -24.631752014160156, "global_step": 237894, "epoch": 2866} {"train_loss": -24.628767013549805, "global_step": 237895, "epoch": 2866} {"train_loss": -24.73370361328125, "global_step": 237896, "epoch": 2866} {"train_loss": -24.765750885009766, "global_step": 237897, "epoch": 2866} {"train_loss": -24.901809692382812, "global_step": 237898, "epoch": 2866} {"train_loss": -24.822477340698242, "global_step": 237899, "epoch": 2866} {"train_loss": -24.80629539489746, "global_step": 237900, "epoch": 2866} {"train_loss": -24.96584701538086, "global_step": 237901, "epoch": 2866} {"train_loss": -24.98291778564453, "global_step": 237902, "epoch": 2866} {"train_loss": -24.6597900390625, "global_step": 237903, "epoch": 2866} {"train_loss": -24.79444694519043, "global_step": 237904, "epoch": 2866} {"train_loss": -24.861831665039062, "global_step": 237905, "epoch": 2866} {"train_loss": -24.999359130859375, "global_step": 237906, "epoch": 2866} {"train_loss": -24.588132858276367, "global_step": 237907, "epoch": 2866} {"train_loss": -24.912927627563477, "global_step": 237908, "epoch": 2866} {"train_loss": -24.800445556640625, "global_step": 237909, "epoch": 2866} {"train_loss": -25.14301872253418, "global_step": 237910, "epoch": 2866} {"train_loss": -25.046070098876953, "global_step": 237911, "epoch": 2866} {"train_loss": -24.710357666015625, "global_step": 237912, "epoch": 2866} {"train_loss": -24.834577560424805, "global_step": 237913, "epoch": 2866} {"train_loss": -25.099882125854492, "global_step": 237914, "epoch": 2866} {"train_loss": -24.978342056274414, "global_step": 237915, "epoch": 2866} {"train_loss": -24.92543601989746, "global_step": 237916, "epoch": 2866} {"train_loss": -24.75361442565918, "global_step": 237917, "epoch": 2866} {"train_loss": -24.905902862548828, "global_step": 237918, "epoch": 2866} {"train_loss": -24.997426986694336, "global_step": 237919, "epoch": 2866} {"train_loss": -25.084762573242188, "global_step": 237920, "epoch": 2866} {"train_loss": -24.69025421142578, "global_step": 237921, "epoch": 2866} {"train_loss": -24.414077758789062, "global_step": 237922, "epoch": 2866} {"train_loss": -24.795307159423828, "global_step": 237923, "epoch": 2866} {"train_loss": -24.881864547729492, "global_step": 237924, "epoch": 2866} {"train_loss": -24.94999122619629, "global_step": 237925, "epoch": 2866} {"train_loss": -24.939517974853516, "global_step": 237926, "epoch": 2866} {"train_loss": -24.98551368713379, "global_step": 237927, "epoch": 2866} {"train_loss": -24.660741806030273, "global_step": 237928, "epoch": 2866} {"train_loss": -24.879718780517578, "global_step": 237929, "epoch": 2866} {"train_loss": -24.536083221435547, "global_step": 237930, "epoch": 2866} {"train_loss": -25.234575271606445, "global_step": 237931, "epoch": 2866} {"train_loss": -24.818817138671875, "global_step": 237932, "epoch": 2866} {"train_loss": -24.91010856628418, "global_step": 237933, "epoch": 2866} {"train_loss": -24.800128936767578, "global_step": 237934, "epoch": 2866} {"train_loss": -24.908706665039062, "global_step": 237935, "epoch": 2866} {"train_loss": -25.034690856933594, "global_step": 237936, "epoch": 2866} {"train_loss": -24.8637752532959, "global_step": 237937, "epoch": 2866} {"train_loss": -25.19683837890625, "global_step": 237938, "epoch": 2866} {"train_loss": -25.024789810180664, "global_step": 237939, "epoch": 2866} {"train_loss": -25.182056427001953, "global_step": 237940, "epoch": 2866} {"train_loss": -25.08693504333496, "global_step": 237941, "epoch": 2866} {"train_loss": -25.221847534179688, "global_step": 237942, "epoch": 2866} {"train_loss": -24.774415969848633, "global_step": 237943, "epoch": 2866} {"train_loss": -24.870466232299805, "global_step": 237944, "epoch": 2866} {"train_loss": -25.17538833618164, "global_step": 237945, "epoch": 2866} {"train_loss": -24.876089096069336, "global_step": 237946, "epoch": 2866} {"train_loss": -24.931371688842773, "global_step": 237947, "epoch": 2866} {"train_loss": -24.59794044494629, "global_step": 237948, "epoch": 2866} {"train_loss": -25.118621826171875, "global_step": 237949, "epoch": 2866} {"train_loss": -25.15165901184082, "global_step": 237950, "epoch": 2866} {"train_loss": -24.94332504272461, "global_step": 237951, "epoch": 2866} {"train_loss": -24.908710479736328, "global_step": 237952, "epoch": 2866} {"train_loss": -24.592390060424805, "global_step": 237953, "epoch": 2866} {"train_loss": -24.74942970275879, "global_step": 237954, "epoch": 2866} {"train_loss": -24.841001510620117, "global_step": 237955, "epoch": 2866} {"train_loss": -24.57623863220215, "global_step": 237956, "epoch": 2866} {"train_loss": -25.175045013427734, "global_step": 237957, "epoch": 2866} {"train_loss": -24.722429275512695, "global_step": 237958, "epoch": 2866} {"train_loss": -24.90923500061035, "global_step": 237959, "epoch": 2866} {"train_loss": -24.85061578865511, "global_step": 237960, "epoch": 2866, "val_loss": 6692022.5} {"train_loss": -23.331327438354492, "global_step": 237961, "epoch": 2867} {"train_loss": -23.683643341064453, "global_step": 237962, "epoch": 2867} {"train_loss": -23.687040328979492, "global_step": 237963, "epoch": 2867} {"train_loss": -24.419448852539062, "global_step": 237964, "epoch": 2867} {"train_loss": -24.057310104370117, "global_step": 237965, "epoch": 2867} {"train_loss": -24.27063751220703, "global_step": 237966, "epoch": 2867} {"train_loss": -24.428142547607422, "global_step": 237967, "epoch": 2867} {"train_loss": -24.577234268188477, "global_step": 237968, "epoch": 2867} {"train_loss": -24.480985641479492, "global_step": 237969, "epoch": 2867} {"train_loss": -24.199853897094727, "global_step": 237970, "epoch": 2867} {"train_loss": -24.28508186340332, "global_step": 237971, "epoch": 2867} {"train_loss": -24.532785415649414, "global_step": 237972, "epoch": 2867} {"train_loss": -24.32538414001465, "global_step": 237973, "epoch": 2867} {"train_loss": -24.522430419921875, "global_step": 237974, "epoch": 2867} {"train_loss": -24.25916862487793, "global_step": 237975, "epoch": 2867} {"train_loss": -24.779558181762695, "global_step": 237976, "epoch": 2867} {"train_loss": -24.545927047729492, "global_step": 237977, "epoch": 2867} {"train_loss": -24.770544052124023, "global_step": 237978, "epoch": 2867} {"train_loss": -24.59876823425293, "global_step": 237979, "epoch": 2867} {"train_loss": -24.599557876586914, "global_step": 237980, "epoch": 2867} {"train_loss": -24.603439331054688, "global_step": 237981, "epoch": 2867} {"train_loss": -24.725730895996094, "global_step": 237982, "epoch": 2867} {"train_loss": -24.77008819580078, "global_step": 237983, "epoch": 2867} {"train_loss": -24.763324737548828, "global_step": 237984, "epoch": 2867} {"train_loss": -24.395992279052734, "global_step": 237985, "epoch": 2867} {"train_loss": -24.642179489135742, "global_step": 237986, "epoch": 2867} {"train_loss": -24.28741455078125, "global_step": 237987, "epoch": 2867} {"train_loss": -24.890207290649414, "global_step": 237988, "epoch": 2867} {"train_loss": -24.86380386352539, "global_step": 237989, "epoch": 2867} {"train_loss": -24.72604751586914, "global_step": 237990, "epoch": 2867} {"train_loss": -24.859262466430664, "global_step": 237991, "epoch": 2867} {"train_loss": -24.76432228088379, "global_step": 237992, "epoch": 2867} {"train_loss": -24.776044845581055, "global_step": 237993, "epoch": 2867} {"train_loss": -24.82015037536621, "global_step": 237994, "epoch": 2867} {"train_loss": -24.90105628967285, "global_step": 237995, "epoch": 2867} {"train_loss": -25.056838989257812, "global_step": 237996, "epoch": 2867} {"train_loss": -24.60755729675293, "global_step": 237997, "epoch": 2867} {"train_loss": -24.9157657623291, "global_step": 237998, "epoch": 2867} {"train_loss": -25.081872940063477, "global_step": 237999, "epoch": 2867} {"train_loss": -24.664642333984375, "global_step": 238000, "epoch": 2867} {"train_loss": -24.94985580444336, "global_step": 238001, "epoch": 2867} {"train_loss": -25.376951217651367, "global_step": 238002, "epoch": 2867} {"train_loss": -24.564966201782227, "global_step": 238003, "epoch": 2867} {"train_loss": -24.994049072265625, "global_step": 238004, "epoch": 2867} {"train_loss": -25.07296371459961, "global_step": 238005, "epoch": 2867} {"train_loss": -24.797080993652344, "global_step": 238006, "epoch": 2867} {"train_loss": -25.143943786621094, "global_step": 238007, "epoch": 2867} {"train_loss": -25.04912567138672, "global_step": 238008, "epoch": 2867} {"train_loss": -24.940343856811523, "global_step": 238009, "epoch": 2867} {"train_loss": -24.90264320373535, "global_step": 238010, "epoch": 2867} {"train_loss": -24.516733169555664, "global_step": 238011, "epoch": 2867} {"train_loss": -24.930927276611328, "global_step": 238012, "epoch": 2867} {"train_loss": -24.655237197875977, "global_step": 238013, "epoch": 2867} {"train_loss": -25.065977096557617, "global_step": 238014, "epoch": 2867} {"train_loss": -24.569822311401367, "global_step": 238015, "epoch": 2867} {"train_loss": -25.045026779174805, "global_step": 238016, "epoch": 2867} {"train_loss": -24.827335357666016, "global_step": 238017, "epoch": 2867} {"train_loss": -24.722135543823242, "global_step": 238018, "epoch": 2867} {"train_loss": -24.79498291015625, "global_step": 238019, "epoch": 2867} {"train_loss": -24.882965087890625, "global_step": 238020, "epoch": 2867} {"train_loss": -24.612714767456055, "global_step": 238021, "epoch": 2867} {"train_loss": -24.735200881958008, "global_step": 238022, "epoch": 2867} {"train_loss": -25.40668296813965, "global_step": 238023, "epoch": 2867} {"train_loss": -25.063785552978516, "global_step": 238024, "epoch": 2867} {"train_loss": -24.7938289642334, "global_step": 238025, "epoch": 2867} {"train_loss": -24.857959747314453, "global_step": 238026, "epoch": 2867} {"train_loss": -24.935821533203125, "global_step": 238027, "epoch": 2867} {"train_loss": -25.220104217529297, "global_step": 238028, "epoch": 2867} {"train_loss": -25.038549423217773, "global_step": 238029, "epoch": 2867} {"train_loss": -24.98615074157715, "global_step": 238030, "epoch": 2867} {"train_loss": -25.186206817626953, "global_step": 238031, "epoch": 2867} {"train_loss": -24.725160598754883, "global_step": 238032, "epoch": 2867} {"train_loss": -25.0920352935791, "global_step": 238033, "epoch": 2867} {"train_loss": -25.19840431213379, "global_step": 238034, "epoch": 2867} {"train_loss": -24.857065200805664, "global_step": 238035, "epoch": 2867} {"train_loss": -25.659427642822266, "global_step": 238036, "epoch": 2867} {"train_loss": -24.62393569946289, "global_step": 238037, "epoch": 2867} {"train_loss": -24.718034744262695, "global_step": 238038, "epoch": 2867} {"train_loss": -24.637943267822266, "global_step": 238039, "epoch": 2867} {"train_loss": -24.99555015563965, "global_step": 238040, "epoch": 2867} {"train_loss": -25.32144546508789, "global_step": 238041, "epoch": 2867} {"train_loss": -25.111047744750977, "global_step": 238042, "epoch": 2867} {"train_loss": -24.747676550623883, "global_step": 238043, "epoch": 2867, "val_loss": 6772325.5} {"train_loss": -24.310941696166992, "global_step": 238044, "epoch": 2868} {"train_loss": -24.64139175415039, "global_step": 238045, "epoch": 2868} {"train_loss": -24.93783950805664, "global_step": 238046, "epoch": 2868} {"train_loss": -24.26729393005371, "global_step": 238047, "epoch": 2868} {"train_loss": -24.32393455505371, "global_step": 238048, "epoch": 2868} {"train_loss": -24.60551643371582, "global_step": 238049, "epoch": 2868} {"train_loss": -24.84535789489746, "global_step": 238050, "epoch": 2868} {"train_loss": -24.599023818969727, "global_step": 238051, "epoch": 2868} {"train_loss": -24.39164161682129, "global_step": 238052, "epoch": 2868} {"train_loss": -24.22898292541504, "global_step": 238053, "epoch": 2868} {"train_loss": -24.8614444732666, "global_step": 238054, "epoch": 2868} {"train_loss": -23.971351623535156, "global_step": 238055, "epoch": 2868} {"train_loss": -23.913549423217773, "global_step": 238056, "epoch": 2868} {"train_loss": -24.162683486938477, "global_step": 238057, "epoch": 2868} {"train_loss": -24.47918701171875, "global_step": 238058, "epoch": 2868} {"train_loss": -24.664518356323242, "global_step": 238059, "epoch": 2868} {"train_loss": -24.21210289001465, "global_step": 238060, "epoch": 2868} {"train_loss": -24.201215744018555, "global_step": 238061, "epoch": 2868} {"train_loss": -24.765039443969727, "global_step": 238062, "epoch": 2868} {"train_loss": -24.4034366607666, "global_step": 238063, "epoch": 2868} {"train_loss": -23.872161865234375, "global_step": 238064, "epoch": 2868} {"train_loss": -24.83832550048828, "global_step": 238065, "epoch": 2868} {"train_loss": -24.15494155883789, "global_step": 238066, "epoch": 2868} {"train_loss": -24.539932250976562, "global_step": 238067, "epoch": 2868} {"train_loss": -24.66267204284668, "global_step": 238068, "epoch": 2868} {"train_loss": -24.567232131958008, "global_step": 238069, "epoch": 2868} {"train_loss": -24.394102096557617, "global_step": 238070, "epoch": 2868} {"train_loss": -24.82441520690918, "global_step": 238071, "epoch": 2868} {"train_loss": -24.791231155395508, "global_step": 238072, "epoch": 2868} {"train_loss": -25.065067291259766, "global_step": 238073, "epoch": 2868} {"train_loss": -24.73552703857422, "global_step": 238074, "epoch": 2868} {"train_loss": -24.742778778076172, "global_step": 238075, "epoch": 2868} {"train_loss": -24.82879638671875, "global_step": 238076, "epoch": 2868} {"train_loss": -24.744840621948242, "global_step": 238077, "epoch": 2868} {"train_loss": -24.71551513671875, "global_step": 238078, "epoch": 2868} {"train_loss": -25.086023330688477, "global_step": 238079, "epoch": 2868} {"train_loss": -25.27947235107422, "global_step": 238080, "epoch": 2868} {"train_loss": -24.82601547241211, "global_step": 238081, "epoch": 2868} {"train_loss": -24.891239166259766, "global_step": 238082, "epoch": 2868} {"train_loss": -24.71550941467285, "global_step": 238083, "epoch": 2868} {"train_loss": -24.744312286376953, "global_step": 238084, "epoch": 2868} {"train_loss": -24.60986328125, "global_step": 238085, "epoch": 2868} {"train_loss": -25.310983657836914, "global_step": 238086, "epoch": 2868} {"train_loss": -25.043916702270508, "global_step": 238087, "epoch": 2868} {"train_loss": -25.186328887939453, "global_step": 238088, "epoch": 2868} {"train_loss": -24.817819595336914, "global_step": 238089, "epoch": 2868} {"train_loss": -24.89210319519043, "global_step": 238090, "epoch": 2868} {"train_loss": -24.740896224975586, "global_step": 238091, "epoch": 2868} {"train_loss": -25.163726806640625, "global_step": 238092, "epoch": 2868} {"train_loss": -24.508514404296875, "global_step": 238093, "epoch": 2868} {"train_loss": -25.020286560058594, "global_step": 238094, "epoch": 2868} {"train_loss": -25.213909149169922, "global_step": 238095, "epoch": 2868} {"train_loss": -24.54542350769043, "global_step": 238096, "epoch": 2868} {"train_loss": -25.18097496032715, "global_step": 238097, "epoch": 2868} {"train_loss": -24.844045639038086, "global_step": 238098, "epoch": 2868} {"train_loss": -24.375364303588867, "global_step": 238099, "epoch": 2868} {"train_loss": -24.141319274902344, "global_step": 238100, "epoch": 2868} {"train_loss": -24.205631256103516, "global_step": 238101, "epoch": 2868} {"train_loss": -24.789596557617188, "global_step": 238102, "epoch": 2868} {"train_loss": -24.593643188476562, "global_step": 238103, "epoch": 2868} {"train_loss": -24.727628707885742, "global_step": 238104, "epoch": 2868} {"train_loss": -24.021665573120117, "global_step": 238105, "epoch": 2868} {"train_loss": -24.632177352905273, "global_step": 238106, "epoch": 2868} {"train_loss": -24.52507209777832, "global_step": 238107, "epoch": 2868} {"train_loss": -24.253555297851562, "global_step": 238108, "epoch": 2868} {"train_loss": -24.55959129333496, "global_step": 238109, "epoch": 2868} {"train_loss": -24.892316818237305, "global_step": 238110, "epoch": 2868} {"train_loss": -24.543689727783203, "global_step": 238111, "epoch": 2868} {"train_loss": -24.793598175048828, "global_step": 238112, "epoch": 2868} {"train_loss": -24.928335189819336, "global_step": 238113, "epoch": 2868} {"train_loss": -24.583799362182617, "global_step": 238114, "epoch": 2868} {"train_loss": -24.718046188354492, "global_step": 238115, "epoch": 2868} {"train_loss": -24.761009216308594, "global_step": 238116, "epoch": 2868} {"train_loss": -24.823949813842773, "global_step": 238117, "epoch": 2868} {"train_loss": -24.642887115478516, "global_step": 238118, "epoch": 2868} {"train_loss": -24.79972267150879, "global_step": 238119, "epoch": 2868} {"train_loss": -24.43448257446289, "global_step": 238120, "epoch": 2868} {"train_loss": -25.051319122314453, "global_step": 238121, "epoch": 2868} {"train_loss": -25.28079605102539, "global_step": 238122, "epoch": 2868} {"train_loss": -24.85348129272461, "global_step": 238123, "epoch": 2868} {"train_loss": -25.305072784423828, "global_step": 238124, "epoch": 2868} {"train_loss": -24.991317749023438, "global_step": 238125, "epoch": 2868} {"train_loss": -24.68503235047122, "global_step": 238126, "epoch": 2868, "val_loss": 6732143.5} {"train_loss": -24.355527877807617, "global_step": 238127, "epoch": 2869} {"train_loss": -24.345117568969727, "global_step": 238128, "epoch": 2869} {"train_loss": -24.562963485717773, "global_step": 238129, "epoch": 2869} {"train_loss": -24.957088470458984, "global_step": 238130, "epoch": 2869} {"train_loss": -24.242773056030273, "global_step": 238131, "epoch": 2869} {"train_loss": -24.732376098632812, "global_step": 238132, "epoch": 2869} {"train_loss": -24.426435470581055, "global_step": 238133, "epoch": 2869} {"train_loss": -24.93701171875, "global_step": 238134, "epoch": 2869} {"train_loss": -24.541669845581055, "global_step": 238135, "epoch": 2869} {"train_loss": -24.636978149414062, "global_step": 238136, "epoch": 2869} {"train_loss": -24.509653091430664, "global_step": 238137, "epoch": 2869} {"train_loss": -25.0621337890625, "global_step": 238138, "epoch": 2869} {"train_loss": -24.570707321166992, "global_step": 238139, "epoch": 2869} {"train_loss": -24.91328239440918, "global_step": 238140, "epoch": 2869} {"train_loss": -24.831716537475586, "global_step": 238141, "epoch": 2869} {"train_loss": -24.3206787109375, "global_step": 238142, "epoch": 2869} {"train_loss": -24.557384490966797, "global_step": 238143, "epoch": 2869} {"train_loss": -24.77301025390625, "global_step": 238144, "epoch": 2869} {"train_loss": -24.832225799560547, "global_step": 238145, "epoch": 2869} {"train_loss": -24.977252960205078, "global_step": 238146, "epoch": 2869} {"train_loss": -24.691843032836914, "global_step": 238147, "epoch": 2869} {"train_loss": -24.835010528564453, "global_step": 238148, "epoch": 2869} {"train_loss": -25.019376754760742, "global_step": 238149, "epoch": 2869} {"train_loss": -24.761011123657227, "global_step": 238150, "epoch": 2869} {"train_loss": -24.774250030517578, "global_step": 238151, "epoch": 2869} {"train_loss": -24.814498901367188, "global_step": 238152, "epoch": 2869} {"train_loss": -25.006229400634766, "global_step": 238153, "epoch": 2869} {"train_loss": -24.913061141967773, "global_step": 238154, "epoch": 2869} {"train_loss": -25.172876358032227, "global_step": 238155, "epoch": 2869} {"train_loss": -25.250598907470703, "global_step": 238156, "epoch": 2869} {"train_loss": -25.12518310546875, "global_step": 238157, "epoch": 2869} {"train_loss": -24.538471221923828, "global_step": 238158, "epoch": 2869} {"train_loss": -24.78750228881836, "global_step": 238159, "epoch": 2869} {"train_loss": -24.7301025390625, "global_step": 238160, "epoch": 2869} {"train_loss": -25.055753707885742, "global_step": 238161, "epoch": 2869} {"train_loss": -25.111875534057617, "global_step": 238162, "epoch": 2869} {"train_loss": -24.454801559448242, "global_step": 238163, "epoch": 2869} {"train_loss": -24.537057876586914, "global_step": 238164, "epoch": 2869} {"train_loss": -24.74300193786621, "global_step": 238165, "epoch": 2869} {"train_loss": -24.661331176757812, "global_step": 238166, "epoch": 2869} {"train_loss": -24.539976119995117, "global_step": 238167, "epoch": 2869} {"train_loss": -24.959802627563477, "global_step": 238168, "epoch": 2869} {"train_loss": -24.634531021118164, "global_step": 238169, "epoch": 2869} {"train_loss": -24.72260856628418, "global_step": 238170, "epoch": 2869} {"train_loss": -24.849605560302734, "global_step": 238171, "epoch": 2869} {"train_loss": -25.060209274291992, "global_step": 238172, "epoch": 2869} {"train_loss": -24.635025024414062, "global_step": 238173, "epoch": 2869} {"train_loss": -24.867202758789062, "global_step": 238174, "epoch": 2869} {"train_loss": -24.692399978637695, "global_step": 238175, "epoch": 2869} {"train_loss": -24.843841552734375, "global_step": 238176, "epoch": 2869} {"train_loss": -24.5654296875, "global_step": 238177, "epoch": 2869} {"train_loss": -25.208112716674805, "global_step": 238178, "epoch": 2869} {"train_loss": -24.57440757751465, "global_step": 238179, "epoch": 2869} {"train_loss": -24.64210319519043, "global_step": 238180, "epoch": 2869} {"train_loss": -24.61934471130371, "global_step": 238181, "epoch": 2869} {"train_loss": -24.790447235107422, "global_step": 238182, "epoch": 2869} {"train_loss": -24.816333770751953, "global_step": 238183, "epoch": 2869} {"train_loss": -25.09943962097168, "global_step": 238184, "epoch": 2869} {"train_loss": -24.73580551147461, "global_step": 238185, "epoch": 2869} {"train_loss": -24.855371475219727, "global_step": 238186, "epoch": 2869} {"train_loss": -25.021501541137695, "global_step": 238187, "epoch": 2869} {"train_loss": -25.107358932495117, "global_step": 238188, "epoch": 2869} {"train_loss": -24.650999069213867, "global_step": 238189, "epoch": 2869} {"train_loss": -24.81259536743164, "global_step": 238190, "epoch": 2869} {"train_loss": -24.931133270263672, "global_step": 238191, "epoch": 2869} {"train_loss": -25.17855453491211, "global_step": 238192, "epoch": 2869} {"train_loss": -24.99641990661621, "global_step": 238193, "epoch": 2869} {"train_loss": -24.631986618041992, "global_step": 238194, "epoch": 2869} {"train_loss": -24.723047256469727, "global_step": 238195, "epoch": 2869} {"train_loss": -24.9671573638916, "global_step": 238196, "epoch": 2869} {"train_loss": -24.939899444580078, "global_step": 238197, "epoch": 2869} {"train_loss": -24.709659576416016, "global_step": 238198, "epoch": 2869} {"train_loss": -24.97140884399414, "global_step": 238199, "epoch": 2869} {"train_loss": -24.942081451416016, "global_step": 238200, "epoch": 2869} {"train_loss": -25.110437393188477, "global_step": 238201, "epoch": 2869} {"train_loss": -24.858264923095703, "global_step": 238202, "epoch": 2869} {"train_loss": -24.658308029174805, "global_step": 238203, "epoch": 2869} {"train_loss": -24.25613784790039, "global_step": 238204, "epoch": 2869} {"train_loss": -24.976329803466797, "global_step": 238205, "epoch": 2869} {"train_loss": -24.865629196166992, "global_step": 238206, "epoch": 2869} {"train_loss": -24.772418975830078, "global_step": 238207, "epoch": 2869} {"train_loss": -24.559951782226562, "global_step": 238208, "epoch": 2869} {"train_loss": -24.77911887111434, "global_step": 238209, "epoch": 2869, "val_loss": 6826833.0} {"train_loss": -24.57905387878418, "global_step": 238210, "epoch": 2870} {"train_loss": -24.259241104125977, "global_step": 238211, "epoch": 2870} {"train_loss": -24.384571075439453, "global_step": 238212, "epoch": 2870} {"train_loss": -24.631017684936523, "global_step": 238213, "epoch": 2870} {"train_loss": -24.405658721923828, "global_step": 238214, "epoch": 2870} {"train_loss": -24.290611267089844, "global_step": 238215, "epoch": 2870} {"train_loss": -24.799789428710938, "global_step": 238216, "epoch": 2870} {"train_loss": -24.39915657043457, "global_step": 238217, "epoch": 2870} {"train_loss": -24.42799949645996, "global_step": 238218, "epoch": 2870} {"train_loss": -24.536834716796875, "global_step": 238219, "epoch": 2870} {"train_loss": -24.731000900268555, "global_step": 238220, "epoch": 2870} {"train_loss": -23.66682243347168, "global_step": 238221, "epoch": 2870} {"train_loss": -24.837980270385742, "global_step": 238222, "epoch": 2870} {"train_loss": -24.319252014160156, "global_step": 238223, "epoch": 2870} {"train_loss": -24.68140411376953, "global_step": 238224, "epoch": 2870} {"train_loss": -24.49516487121582, "global_step": 238225, "epoch": 2870} {"train_loss": -24.80447769165039, "global_step": 238226, "epoch": 2870} {"train_loss": -24.67140007019043, "global_step": 238227, "epoch": 2870} {"train_loss": -24.826576232910156, "global_step": 238228, "epoch": 2870} {"train_loss": -24.49839210510254, "global_step": 238229, "epoch": 2870} {"train_loss": -24.737152099609375, "global_step": 238230, "epoch": 2870} {"train_loss": -24.7314453125, "global_step": 238231, "epoch": 2870} {"train_loss": -24.775894165039062, "global_step": 238232, "epoch": 2870} {"train_loss": -24.91179847717285, "global_step": 238233, "epoch": 2870} {"train_loss": -25.099597930908203, "global_step": 238234, "epoch": 2870} {"train_loss": -24.3593807220459, "global_step": 238235, "epoch": 2870} {"train_loss": -24.800878524780273, "global_step": 238236, "epoch": 2870} {"train_loss": -24.717960357666016, "global_step": 238237, "epoch": 2870} {"train_loss": -24.617063522338867, "global_step": 238238, "epoch": 2870} {"train_loss": -24.701671600341797, "global_step": 238239, "epoch": 2870} {"train_loss": -24.731571197509766, "global_step": 238240, "epoch": 2870} {"train_loss": -24.707122802734375, "global_step": 238241, "epoch": 2870} {"train_loss": -24.78797149658203, "global_step": 238242, "epoch": 2870} {"train_loss": -25.013341903686523, "global_step": 238243, "epoch": 2870} {"train_loss": -25.11090660095215, "global_step": 238244, "epoch": 2870} {"train_loss": -25.088937759399414, "global_step": 238245, "epoch": 2870} {"train_loss": -25.370014190673828, "global_step": 238246, "epoch": 2870} {"train_loss": -24.716047286987305, "global_step": 238247, "epoch": 2870} {"train_loss": -25.17374610900879, "global_step": 238248, "epoch": 2870} {"train_loss": -25.099130630493164, "global_step": 238249, "epoch": 2870} {"train_loss": -24.715320587158203, "global_step": 238250, "epoch": 2870} {"train_loss": -24.819507598876953, "global_step": 238251, "epoch": 2870} {"train_loss": -25.01028823852539, "global_step": 238252, "epoch": 2870} {"train_loss": -24.96882438659668, "global_step": 238253, "epoch": 2870} {"train_loss": -24.894681930541992, "global_step": 238254, "epoch": 2870} {"train_loss": -25.189313888549805, "global_step": 238255, "epoch": 2870} {"train_loss": -24.82110023498535, "global_step": 238256, "epoch": 2870} {"train_loss": -24.99251365661621, "global_step": 238257, "epoch": 2870} {"train_loss": -24.9172420501709, "global_step": 238258, "epoch": 2870} {"train_loss": -24.706329345703125, "global_step": 238259, "epoch": 2870} {"train_loss": -24.628950119018555, "global_step": 238260, "epoch": 2870} {"train_loss": -24.55866050720215, "global_step": 238261, "epoch": 2870} {"train_loss": -24.72199058532715, "global_step": 238262, "epoch": 2870} {"train_loss": -24.593961715698242, "global_step": 238263, "epoch": 2870} {"train_loss": -24.80653953552246, "global_step": 238264, "epoch": 2870} {"train_loss": -24.66835594177246, "global_step": 238265, "epoch": 2870} {"train_loss": -24.550872802734375, "global_step": 238266, "epoch": 2870} {"train_loss": -24.709619522094727, "global_step": 238267, "epoch": 2870} {"train_loss": -24.63966178894043, "global_step": 238268, "epoch": 2870} {"train_loss": -24.48917579650879, "global_step": 238269, "epoch": 2870} {"train_loss": -24.711456298828125, "global_step": 238270, "epoch": 2870} {"train_loss": -25.108989715576172, "global_step": 238271, "epoch": 2870} {"train_loss": -24.947954177856445, "global_step": 238272, "epoch": 2870} {"train_loss": -24.491498947143555, "global_step": 238273, "epoch": 2870} {"train_loss": -24.989290237426758, "global_step": 238274, "epoch": 2870} {"train_loss": -24.425506591796875, "global_step": 238275, "epoch": 2870} {"train_loss": -24.678199768066406, "global_step": 238276, "epoch": 2870} {"train_loss": -24.96343231201172, "global_step": 238277, "epoch": 2870} {"train_loss": -24.694110870361328, "global_step": 238278, "epoch": 2870} {"train_loss": -25.141836166381836, "global_step": 238279, "epoch": 2870} {"train_loss": -24.76734733581543, "global_step": 238280, "epoch": 2870} {"train_loss": -24.853071212768555, "global_step": 238281, "epoch": 2870} {"train_loss": -24.76498794555664, "global_step": 238282, "epoch": 2870} {"train_loss": -24.662839889526367, "global_step": 238283, "epoch": 2870} {"train_loss": -24.903268814086914, "global_step": 238284, "epoch": 2870} {"train_loss": -25.03898048400879, "global_step": 238285, "epoch": 2870} {"train_loss": -25.013925552368164, "global_step": 238286, "epoch": 2870} {"train_loss": -25.183446884155273, "global_step": 238287, "epoch": 2870} {"train_loss": -25.095951080322266, "global_step": 238288, "epoch": 2870} {"train_loss": -24.791654586791992, "global_step": 238289, "epoch": 2870} {"train_loss": -25.0599422454834, "global_step": 238290, "epoch": 2870} {"train_loss": -24.786386489868164, "global_step": 238291, "epoch": 2870} {"train_loss": -24.7655722836414, "global_step": 238292, "epoch": 2870, "val_loss": 6828246.5} {"train_loss": -24.60487937927246, "global_step": 238293, "epoch": 2871} {"train_loss": -24.184720993041992, "global_step": 238294, "epoch": 2871} {"train_loss": -24.63791275024414, "global_step": 238295, "epoch": 2871} {"train_loss": -24.418485641479492, "global_step": 238296, "epoch": 2871} {"train_loss": -24.439661026000977, "global_step": 238297, "epoch": 2871} {"train_loss": -24.451335906982422, "global_step": 238298, "epoch": 2871} {"train_loss": -24.617300033569336, "global_step": 238299, "epoch": 2871} {"train_loss": -24.683496475219727, "global_step": 238300, "epoch": 2871} {"train_loss": -24.534358978271484, "global_step": 238301, "epoch": 2871} {"train_loss": -24.668460845947266, "global_step": 238302, "epoch": 2871} {"train_loss": -24.483013153076172, "global_step": 238303, "epoch": 2871} {"train_loss": -24.464921951293945, "global_step": 238304, "epoch": 2871} {"train_loss": -25.046220779418945, "global_step": 238305, "epoch": 2871} {"train_loss": -24.488882064819336, "global_step": 238306, "epoch": 2871} {"train_loss": -24.7630672454834, "global_step": 238307, "epoch": 2871} {"train_loss": -24.946664810180664, "global_step": 238308, "epoch": 2871} {"train_loss": -24.650253295898438, "global_step": 238309, "epoch": 2871} {"train_loss": -24.686965942382812, "global_step": 238310, "epoch": 2871} {"train_loss": -24.555166244506836, "global_step": 238311, "epoch": 2871} {"train_loss": -24.546457290649414, "global_step": 238312, "epoch": 2871} {"train_loss": -24.714200973510742, "global_step": 238313, "epoch": 2871} {"train_loss": -24.259916305541992, "global_step": 238314, "epoch": 2871} {"train_loss": -24.81562614440918, "global_step": 238315, "epoch": 2871} {"train_loss": -24.87235450744629, "global_step": 238316, "epoch": 2871} {"train_loss": -25.121910095214844, "global_step": 238317, "epoch": 2871} {"train_loss": -24.500638961791992, "global_step": 238318, "epoch": 2871} {"train_loss": -24.520278930664062, "global_step": 238319, "epoch": 2871} {"train_loss": -24.569766998291016, "global_step": 238320, "epoch": 2871} {"train_loss": -24.99690055847168, "global_step": 238321, "epoch": 2871} {"train_loss": -25.091243743896484, "global_step": 238322, "epoch": 2871} {"train_loss": -24.752954483032227, "global_step": 238323, "epoch": 2871} {"train_loss": -24.76378059387207, "global_step": 238324, "epoch": 2871} {"train_loss": -24.70621681213379, "global_step": 238325, "epoch": 2871} {"train_loss": -24.802457809448242, "global_step": 238326, "epoch": 2871} {"train_loss": -24.618446350097656, "global_step": 238327, "epoch": 2871} {"train_loss": -24.515226364135742, "global_step": 238328, "epoch": 2871} {"train_loss": -24.64571189880371, "global_step": 238329, "epoch": 2871} {"train_loss": -25.087020874023438, "global_step": 238330, "epoch": 2871} {"train_loss": -24.639781951904297, "global_step": 238331, "epoch": 2871} {"train_loss": -25.14893913269043, "global_step": 238332, "epoch": 2871} {"train_loss": -24.74910545349121, "global_step": 238333, "epoch": 2871} {"train_loss": -24.515670776367188, "global_step": 238334, "epoch": 2871} {"train_loss": -24.610397338867188, "global_step": 238335, "epoch": 2871} {"train_loss": -24.792957305908203, "global_step": 238336, "epoch": 2871} {"train_loss": -24.84392547607422, "global_step": 238337, "epoch": 2871} {"train_loss": -24.843950271606445, "global_step": 238338, "epoch": 2871} {"train_loss": -25.10857582092285, "global_step": 238339, "epoch": 2871} {"train_loss": -24.89969825744629, "global_step": 238340, "epoch": 2871} {"train_loss": -25.045373916625977, "global_step": 238341, "epoch": 2871} {"train_loss": -24.6855525970459, "global_step": 238342, "epoch": 2871} {"train_loss": -24.96930503845215, "global_step": 238343, "epoch": 2871} {"train_loss": -24.876949310302734, "global_step": 238344, "epoch": 2871} {"train_loss": -25.053739547729492, "global_step": 238345, "epoch": 2871} {"train_loss": -24.741010665893555, "global_step": 238346, "epoch": 2871} {"train_loss": -25.115947723388672, "global_step": 238347, "epoch": 2871} {"train_loss": -24.777175903320312, "global_step": 238348, "epoch": 2871} {"train_loss": -25.022090911865234, "global_step": 238349, "epoch": 2871} {"train_loss": -24.975183486938477, "global_step": 238350, "epoch": 2871} {"train_loss": -24.825620651245117, "global_step": 238351, "epoch": 2871} {"train_loss": -25.08075523376465, "global_step": 238352, "epoch": 2871} {"train_loss": -24.580102920532227, "global_step": 238353, "epoch": 2871} {"train_loss": -25.193029403686523, "global_step": 238354, "epoch": 2871} {"train_loss": -24.896324157714844, "global_step": 238355, "epoch": 2871} {"train_loss": -24.881301879882812, "global_step": 238356, "epoch": 2871} {"train_loss": -24.964710235595703, "global_step": 238357, "epoch": 2871} {"train_loss": -24.96388053894043, "global_step": 238358, "epoch": 2871} {"train_loss": -25.09362030029297, "global_step": 238359, "epoch": 2871} {"train_loss": -25.192951202392578, "global_step": 238360, "epoch": 2871} {"train_loss": -25.01590919494629, "global_step": 238361, "epoch": 2871} {"train_loss": -25.46918296813965, "global_step": 238362, "epoch": 2871} {"train_loss": -24.919355392456055, "global_step": 238363, "epoch": 2871} {"train_loss": -25.112701416015625, "global_step": 238364, "epoch": 2871} {"train_loss": -25.175460815429688, "global_step": 238365, "epoch": 2871} {"train_loss": -24.889925003051758, "global_step": 238366, "epoch": 2871} {"train_loss": -25.06367301940918, "global_step": 238367, "epoch": 2871} {"train_loss": -24.732894897460938, "global_step": 238368, "epoch": 2871} {"train_loss": -24.42562484741211, "global_step": 238369, "epoch": 2871} {"train_loss": -24.82994270324707, "global_step": 238370, "epoch": 2871} {"train_loss": -24.91509437561035, "global_step": 238371, "epoch": 2871} {"train_loss": -25.07718276977539, "global_step": 238372, "epoch": 2871} {"train_loss": -24.957761764526367, "global_step": 238373, "epoch": 2871} {"train_loss": -25.051305770874023, "global_step": 238374, "epoch": 2871} {"train_loss": -24.804907994097974, "global_step": 238375, "epoch": 2871, "val_loss": 6767881.0} {"train_loss": -23.841888427734375, "global_step": 238376, "epoch": 2872} {"train_loss": -23.675094604492188, "global_step": 238377, "epoch": 2872} {"train_loss": -23.864212036132812, "global_step": 238378, "epoch": 2872} {"train_loss": -24.151473999023438, "global_step": 238379, "epoch": 2872} {"train_loss": -23.867158889770508, "global_step": 238380, "epoch": 2872} {"train_loss": -24.333606719970703, "global_step": 238381, "epoch": 2872} {"train_loss": -24.269338607788086, "global_step": 238382, "epoch": 2872} {"train_loss": -24.384124755859375, "global_step": 238383, "epoch": 2872} {"train_loss": -23.99082374572754, "global_step": 238384, "epoch": 2872} {"train_loss": -24.2593994140625, "global_step": 238385, "epoch": 2872} {"train_loss": -24.180997848510742, "global_step": 238386, "epoch": 2872} {"train_loss": -24.45111083984375, "global_step": 238387, "epoch": 2872} {"train_loss": -24.5053768157959, "global_step": 238388, "epoch": 2872} {"train_loss": -24.556440353393555, "global_step": 238389, "epoch": 2872} {"train_loss": -24.255861282348633, "global_step": 238390, "epoch": 2872} {"train_loss": -24.867813110351562, "global_step": 238391, "epoch": 2872} {"train_loss": -24.63875389099121, "global_step": 238392, "epoch": 2872} {"train_loss": -25.069440841674805, "global_step": 238393, "epoch": 2872} {"train_loss": -24.441579818725586, "global_step": 238394, "epoch": 2872} {"train_loss": -24.566650390625, "global_step": 238395, "epoch": 2872} {"train_loss": -24.573301315307617, "global_step": 238396, "epoch": 2872} {"train_loss": -24.509531021118164, "global_step": 238397, "epoch": 2872} {"train_loss": -24.66006851196289, "global_step": 238398, "epoch": 2872} {"train_loss": -24.610517501831055, "global_step": 238399, "epoch": 2872} {"train_loss": -24.646717071533203, "global_step": 238400, "epoch": 2872} {"train_loss": -24.850467681884766, "global_step": 238401, "epoch": 2872} {"train_loss": -24.83469009399414, "global_step": 238402, "epoch": 2872} {"train_loss": -24.53462028503418, "global_step": 238403, "epoch": 2872} {"train_loss": -25.035953521728516, "global_step": 238404, "epoch": 2872} {"train_loss": -24.796236038208008, "global_step": 238405, "epoch": 2872} {"train_loss": -24.825429916381836, "global_step": 238406, "epoch": 2872} {"train_loss": -24.812698364257812, "global_step": 238407, "epoch": 2872} {"train_loss": -25.203720092773438, "global_step": 238408, "epoch": 2872} {"train_loss": -24.8487548828125, "global_step": 238409, "epoch": 2872} {"train_loss": -25.006174087524414, "global_step": 238410, "epoch": 2872} {"train_loss": -24.731660842895508, "global_step": 238411, "epoch": 2872} {"train_loss": -24.954605102539062, "global_step": 238412, "epoch": 2872} {"train_loss": -25.14320945739746, "global_step": 238413, "epoch": 2872} {"train_loss": -24.723264694213867, "global_step": 238414, "epoch": 2872} {"train_loss": -25.111982345581055, "global_step": 238415, "epoch": 2872} {"train_loss": -25.32379722595215, "global_step": 238416, "epoch": 2872} {"train_loss": -25.211959838867188, "global_step": 238417, "epoch": 2872} {"train_loss": -24.89974021911621, "global_step": 238418, "epoch": 2872} {"train_loss": -25.0007381439209, "global_step": 238419, "epoch": 2872} {"train_loss": -24.882247924804688, "global_step": 238420, "epoch": 2872} {"train_loss": -25.016813278198242, "global_step": 238421, "epoch": 2872} {"train_loss": -25.062088012695312, "global_step": 238422, "epoch": 2872} {"train_loss": -24.70911407470703, "global_step": 238423, "epoch": 2872} {"train_loss": -25.083328247070312, "global_step": 238424, "epoch": 2872} {"train_loss": -25.284561157226562, "global_step": 238425, "epoch": 2872} {"train_loss": -25.071928024291992, "global_step": 238426, "epoch": 2872} {"train_loss": -24.886577606201172, "global_step": 238427, "epoch": 2872} {"train_loss": -24.74920082092285, "global_step": 238428, "epoch": 2872} {"train_loss": -24.701784133911133, "global_step": 238429, "epoch": 2872} {"train_loss": -25.12228775024414, "global_step": 238430, "epoch": 2872} {"train_loss": -25.165342330932617, "global_step": 238431, "epoch": 2872} {"train_loss": -24.538171768188477, "global_step": 238432, "epoch": 2872} {"train_loss": -24.678693771362305, "global_step": 238433, "epoch": 2872} {"train_loss": -24.40737533569336, "global_step": 238434, "epoch": 2872} {"train_loss": -24.980680465698242, "global_step": 238435, "epoch": 2872} {"train_loss": -24.709257125854492, "global_step": 238436, "epoch": 2872} {"train_loss": -24.544452667236328, "global_step": 238437, "epoch": 2872} {"train_loss": -24.578214645385742, "global_step": 238438, "epoch": 2872} {"train_loss": -25.242633819580078, "global_step": 238439, "epoch": 2872} {"train_loss": -24.57659912109375, "global_step": 238440, "epoch": 2872} {"train_loss": -24.943313598632812, "global_step": 238441, "epoch": 2872} {"train_loss": -24.856231689453125, "global_step": 238442, "epoch": 2872} {"train_loss": -24.64256477355957, "global_step": 238443, "epoch": 2872} {"train_loss": -24.807819366455078, "global_step": 238444, "epoch": 2872} {"train_loss": -24.858213424682617, "global_step": 238445, "epoch": 2872} {"train_loss": -24.845548629760742, "global_step": 238446, "epoch": 2872} {"train_loss": -25.234689712524414, "global_step": 238447, "epoch": 2872} {"train_loss": -25.170316696166992, "global_step": 238448, "epoch": 2872} {"train_loss": -24.68436050415039, "global_step": 238449, "epoch": 2872} {"train_loss": -25.016189575195312, "global_step": 238450, "epoch": 2872} {"train_loss": -25.041187286376953, "global_step": 238451, "epoch": 2872} {"train_loss": -24.791175842285156, "global_step": 238452, "epoch": 2872} {"train_loss": -24.69995880126953, "global_step": 238453, "epoch": 2872} {"train_loss": -24.964765548706055, "global_step": 238454, "epoch": 2872} {"train_loss": -25.115201950073242, "global_step": 238455, "epoch": 2872} {"train_loss": -25.257709503173828, "global_step": 238456, "epoch": 2872} {"train_loss": -25.23206901550293, "global_step": 238457, "epoch": 2872} {"train_loss": -24.75033406177199, "global_step": 238458, "epoch": 2872, "val_loss": 6754853.0} {"train_loss": -24.47200584411621, "global_step": 238459, "epoch": 2873} {"train_loss": -24.462581634521484, "global_step": 238460, "epoch": 2873} {"train_loss": -24.72878074645996, "global_step": 238461, "epoch": 2873} {"train_loss": -24.685373306274414, "global_step": 238462, "epoch": 2873} {"train_loss": -24.35761260986328, "global_step": 238463, "epoch": 2873} {"train_loss": -24.943490982055664, "global_step": 238464, "epoch": 2873} {"train_loss": -24.924640655517578, "global_step": 238465, "epoch": 2873} {"train_loss": -25.007837295532227, "global_step": 238466, "epoch": 2873} {"train_loss": -24.735021591186523, "global_step": 238467, "epoch": 2873} {"train_loss": -24.341455459594727, "global_step": 238468, "epoch": 2873} {"train_loss": -24.613983154296875, "global_step": 238469, "epoch": 2873} {"train_loss": -24.979652404785156, "global_step": 238470, "epoch": 2873} {"train_loss": -25.00418472290039, "global_step": 238471, "epoch": 2873} {"train_loss": -24.946455001831055, "global_step": 238472, "epoch": 2873} {"train_loss": -24.857046127319336, "global_step": 238473, "epoch": 2873} {"train_loss": -24.7862606048584, "global_step": 238474, "epoch": 2873} {"train_loss": -24.6058292388916, "global_step": 238475, "epoch": 2873} {"train_loss": -24.509244918823242, "global_step": 238476, "epoch": 2873} {"train_loss": -24.980979919433594, "global_step": 238477, "epoch": 2873} {"train_loss": -24.824691772460938, "global_step": 238478, "epoch": 2873} {"train_loss": -24.85164451599121, "global_step": 238479, "epoch": 2873} {"train_loss": -24.700780868530273, "global_step": 238480, "epoch": 2873} {"train_loss": -24.382226943969727, "global_step": 238481, "epoch": 2873} {"train_loss": -24.796897888183594, "global_step": 238482, "epoch": 2873} {"train_loss": -24.729745864868164, "global_step": 238483, "epoch": 2873} {"train_loss": -24.73980140686035, "global_step": 238484, "epoch": 2873} {"train_loss": -25.067726135253906, "global_step": 238485, "epoch": 2873} {"train_loss": -24.438886642456055, "global_step": 238486, "epoch": 2873} {"train_loss": -24.679676055908203, "global_step": 238487, "epoch": 2873} {"train_loss": -24.916608810424805, "global_step": 238488, "epoch": 2873} {"train_loss": -24.938875198364258, "global_step": 238489, "epoch": 2873} {"train_loss": -24.85227394104004, "global_step": 238490, "epoch": 2873} {"train_loss": -24.91621971130371, "global_step": 238491, "epoch": 2873} {"train_loss": -24.737735748291016, "global_step": 238492, "epoch": 2873} {"train_loss": -24.719741821289062, "global_step": 238493, "epoch": 2873} {"train_loss": -24.650928497314453, "global_step": 238494, "epoch": 2873} {"train_loss": -24.84206199645996, "global_step": 238495, "epoch": 2873} {"train_loss": -24.6456356048584, "global_step": 238496, "epoch": 2873} {"train_loss": -24.944412231445312, "global_step": 238497, "epoch": 2873} {"train_loss": -25.439960479736328, "global_step": 238498, "epoch": 2873} {"train_loss": -24.899616241455078, "global_step": 238499, "epoch": 2873} {"train_loss": -25.103290557861328, "global_step": 238500, "epoch": 2873} {"train_loss": -25.131711959838867, "global_step": 238501, "epoch": 2873} {"train_loss": -25.02372169494629, "global_step": 238502, "epoch": 2873} {"train_loss": -24.981895446777344, "global_step": 238503, "epoch": 2873} {"train_loss": -25.120450973510742, "global_step": 238504, "epoch": 2873} {"train_loss": -24.97150230407715, "global_step": 238505, "epoch": 2873} {"train_loss": -25.023834228515625, "global_step": 238506, "epoch": 2873} {"train_loss": -24.96115493774414, "global_step": 238507, "epoch": 2873} {"train_loss": -24.986318588256836, "global_step": 238508, "epoch": 2873} {"train_loss": -24.768165588378906, "global_step": 238509, "epoch": 2873} {"train_loss": -24.59137535095215, "global_step": 238510, "epoch": 2873} {"train_loss": -25.184125900268555, "global_step": 238511, "epoch": 2873} {"train_loss": -25.057302474975586, "global_step": 238512, "epoch": 2873} {"train_loss": -24.666074752807617, "global_step": 238513, "epoch": 2873} {"train_loss": -24.699329376220703, "global_step": 238514, "epoch": 2873} {"train_loss": -24.35025978088379, "global_step": 238515, "epoch": 2873} {"train_loss": -24.930517196655273, "global_step": 238516, "epoch": 2873} {"train_loss": -25.03419303894043, "global_step": 238517, "epoch": 2873} {"train_loss": -24.899301528930664, "global_step": 238518, "epoch": 2873} {"train_loss": -24.452465057373047, "global_step": 238519, "epoch": 2873} {"train_loss": -25.140579223632812, "global_step": 238520, "epoch": 2873} {"train_loss": -24.85713768005371, "global_step": 238521, "epoch": 2873} {"train_loss": -24.974506378173828, "global_step": 238522, "epoch": 2873} {"train_loss": -25.109006881713867, "global_step": 238523, "epoch": 2873} {"train_loss": -24.731464385986328, "global_step": 238524, "epoch": 2873} {"train_loss": -24.75052261352539, "global_step": 238525, "epoch": 2873} {"train_loss": -25.172138214111328, "global_step": 238526, "epoch": 2873} {"train_loss": -24.68323516845703, "global_step": 238527, "epoch": 2873} {"train_loss": -24.55022621154785, "global_step": 238528, "epoch": 2873} {"train_loss": -24.848161697387695, "global_step": 238529, "epoch": 2873} {"train_loss": -24.825042724609375, "global_step": 238530, "epoch": 2873} {"train_loss": -24.88738441467285, "global_step": 238531, "epoch": 2873} {"train_loss": -25.16397476196289, "global_step": 238532, "epoch": 2873} {"train_loss": -24.8140811920166, "global_step": 238533, "epoch": 2873} {"train_loss": -25.216522216796875, "global_step": 238534, "epoch": 2873} {"train_loss": -24.695608139038086, "global_step": 238535, "epoch": 2873} {"train_loss": -24.78235626220703, "global_step": 238536, "epoch": 2873} {"train_loss": -24.989227294921875, "global_step": 238537, "epoch": 2873} {"train_loss": -24.98859214782715, "global_step": 238538, "epoch": 2873} {"train_loss": -25.115629196166992, "global_step": 238539, "epoch": 2873} {"train_loss": -24.816055297851562, "global_step": 238540, "epoch": 2873} {"train_loss": -24.835048124014612, "global_step": 238541, "epoch": 2873, "val_loss": 6868466.5} {"train_loss": -23.893951416015625, "global_step": 238542, "epoch": 2874} {"train_loss": -24.43572425842285, "global_step": 238543, "epoch": 2874} {"train_loss": -24.65178871154785, "global_step": 238544, "epoch": 2874} {"train_loss": -23.936508178710938, "global_step": 238545, "epoch": 2874} {"train_loss": -24.615095138549805, "global_step": 238546, "epoch": 2874} {"train_loss": -24.717227935791016, "global_step": 238547, "epoch": 2874} {"train_loss": -24.647058486938477, "global_step": 238548, "epoch": 2874} {"train_loss": -24.475614547729492, "global_step": 238549, "epoch": 2874} {"train_loss": -24.554121017456055, "global_step": 238550, "epoch": 2874} {"train_loss": -24.907865524291992, "global_step": 238551, "epoch": 2874} {"train_loss": -24.691774368286133, "global_step": 238552, "epoch": 2874} {"train_loss": -24.49480628967285, "global_step": 238553, "epoch": 2874} {"train_loss": -24.90252113342285, "global_step": 238554, "epoch": 2874} {"train_loss": -24.64423179626465, "global_step": 238555, "epoch": 2874} {"train_loss": -24.545948028564453, "global_step": 238556, "epoch": 2874} {"train_loss": -25.087421417236328, "global_step": 238557, "epoch": 2874} {"train_loss": -24.88795280456543, "global_step": 238558, "epoch": 2874} {"train_loss": -24.379093170166016, "global_step": 238559, "epoch": 2874} {"train_loss": -24.436981201171875, "global_step": 238560, "epoch": 2874} {"train_loss": -24.637662887573242, "global_step": 238561, "epoch": 2874} {"train_loss": -24.91428565979004, "global_step": 238562, "epoch": 2874} {"train_loss": -25.07443618774414, "global_step": 238563, "epoch": 2874} {"train_loss": -24.792142868041992, "global_step": 238564, "epoch": 2874} {"train_loss": -24.590986251831055, "global_step": 238565, "epoch": 2874} {"train_loss": -24.71079444885254, "global_step": 238566, "epoch": 2874} {"train_loss": -24.869770050048828, "global_step": 238567, "epoch": 2874} {"train_loss": -24.911901473999023, "global_step": 238568, "epoch": 2874} {"train_loss": -24.80744743347168, "global_step": 238569, "epoch": 2874} {"train_loss": -24.799955368041992, "global_step": 238570, "epoch": 2874} {"train_loss": -24.78853988647461, "global_step": 238571, "epoch": 2874} {"train_loss": -24.737390518188477, "global_step": 238572, "epoch": 2874} {"train_loss": -24.571868896484375, "global_step": 238573, "epoch": 2874} {"train_loss": -24.857725143432617, "global_step": 238574, "epoch": 2874} {"train_loss": -24.517526626586914, "global_step": 238575, "epoch": 2874} {"train_loss": -24.644031524658203, "global_step": 238576, "epoch": 2874} {"train_loss": -24.75568389892578, "global_step": 238577, "epoch": 2874} {"train_loss": -24.512556076049805, "global_step": 238578, "epoch": 2874} {"train_loss": -24.615081787109375, "global_step": 238579, "epoch": 2874} {"train_loss": -24.95340919494629, "global_step": 238580, "epoch": 2874} {"train_loss": -24.806621551513672, "global_step": 238581, "epoch": 2874} {"train_loss": -24.664762496948242, "global_step": 238582, "epoch": 2874} {"train_loss": -24.867359161376953, "global_step": 238583, "epoch": 2874} {"train_loss": -24.648590087890625, "global_step": 238584, "epoch": 2874} {"train_loss": -24.695152282714844, "global_step": 238585, "epoch": 2874} {"train_loss": -24.895902633666992, "global_step": 238586, "epoch": 2874} {"train_loss": -24.717336654663086, "global_step": 238587, "epoch": 2874} {"train_loss": -24.944711685180664, "global_step": 238588, "epoch": 2874} {"train_loss": -25.251895904541016, "global_step": 238589, "epoch": 2874} {"train_loss": -24.741615295410156, "global_step": 238590, "epoch": 2874} {"train_loss": -24.641691207885742, "global_step": 238591, "epoch": 2874} {"train_loss": -25.25843620300293, "global_step": 238592, "epoch": 2874} {"train_loss": -24.638181686401367, "global_step": 238593, "epoch": 2874} {"train_loss": -24.76797866821289, "global_step": 238594, "epoch": 2874} {"train_loss": -25.08880043029785, "global_step": 238595, "epoch": 2874} {"train_loss": -25.3325138092041, "global_step": 238596, "epoch": 2874} {"train_loss": -24.67228126525879, "global_step": 238597, "epoch": 2874} {"train_loss": -24.698949813842773, "global_step": 238598, "epoch": 2874} {"train_loss": -24.857938766479492, "global_step": 238599, "epoch": 2874} {"train_loss": -24.73987579345703, "global_step": 238600, "epoch": 2874} {"train_loss": -24.939922332763672, "global_step": 238601, "epoch": 2874} {"train_loss": -25.301931381225586, "global_step": 238602, "epoch": 2874} {"train_loss": -25.01177406311035, "global_step": 238603, "epoch": 2874} {"train_loss": -25.097158432006836, "global_step": 238604, "epoch": 2874} {"train_loss": -24.882841110229492, "global_step": 238605, "epoch": 2874} {"train_loss": -24.798521041870117, "global_step": 238606, "epoch": 2874} {"train_loss": -24.57753562927246, "global_step": 238607, "epoch": 2874} {"train_loss": -25.11817741394043, "global_step": 238608, "epoch": 2874} {"train_loss": -24.68025016784668, "global_step": 238609, "epoch": 2874} {"train_loss": -24.963476181030273, "global_step": 238610, "epoch": 2874} {"train_loss": -25.1000919342041, "global_step": 238611, "epoch": 2874} {"train_loss": -24.6884765625, "global_step": 238612, "epoch": 2874} {"train_loss": -24.811054229736328, "global_step": 238613, "epoch": 2874} {"train_loss": -24.759450912475586, "global_step": 238614, "epoch": 2874} {"train_loss": -25.04649543762207, "global_step": 238615, "epoch": 2874} {"train_loss": -25.004247665405273, "global_step": 238616, "epoch": 2874} {"train_loss": -25.212875366210938, "global_step": 238617, "epoch": 2874} {"train_loss": -24.509952545166016, "global_step": 238618, "epoch": 2874} {"train_loss": -24.99370765686035, "global_step": 238619, "epoch": 2874} {"train_loss": -24.935251235961914, "global_step": 238620, "epoch": 2874} {"train_loss": -25.062402725219727, "global_step": 238621, "epoch": 2874} {"train_loss": -24.81146812438965, "global_step": 238622, "epoch": 2874} {"train_loss": -24.92963218688965, "global_step": 238623, "epoch": 2874} {"train_loss": -24.76761032012572, "global_step": 238624, "epoch": 2874, "val_loss": 6875260.0} {"train_loss": -22.639707565307617, "global_step": 238625, "epoch": 2875} {"train_loss": -22.613996505737305, "global_step": 238626, "epoch": 2875} {"train_loss": -22.87667465209961, "global_step": 238627, "epoch": 2875} {"train_loss": -21.657501220703125, "global_step": 238628, "epoch": 2875} {"train_loss": -23.89435386657715, "global_step": 238629, "epoch": 2875} {"train_loss": -22.870908737182617, "global_step": 238630, "epoch": 2875} {"train_loss": -23.797422409057617, "global_step": 238631, "epoch": 2875} {"train_loss": -23.61530876159668, "global_step": 238632, "epoch": 2875} {"train_loss": -23.830047607421875, "global_step": 238633, "epoch": 2875} {"train_loss": -23.645307540893555, "global_step": 238634, "epoch": 2875} {"train_loss": -23.8657283782959, "global_step": 238635, "epoch": 2875} {"train_loss": -23.817411422729492, "global_step": 238636, "epoch": 2875} {"train_loss": -23.376007080078125, "global_step": 238637, "epoch": 2875} {"train_loss": -23.501047134399414, "global_step": 238638, "epoch": 2875} {"train_loss": -23.846622467041016, "global_step": 238639, "epoch": 2875} {"train_loss": -23.679969787597656, "global_step": 238640, "epoch": 2875} {"train_loss": -23.947269439697266, "global_step": 238641, "epoch": 2875} {"train_loss": -24.169225692749023, "global_step": 238642, "epoch": 2875} {"train_loss": -23.7191219329834, "global_step": 238643, "epoch": 2875} {"train_loss": -24.035139083862305, "global_step": 238644, "epoch": 2875} {"train_loss": -24.216995239257812, "global_step": 238645, "epoch": 2875} {"train_loss": -23.994977951049805, "global_step": 238646, "epoch": 2875} {"train_loss": -24.343791961669922, "global_step": 238647, "epoch": 2875} {"train_loss": -24.058940887451172, "global_step": 238648, "epoch": 2875} {"train_loss": -24.410242080688477, "global_step": 238649, "epoch": 2875} {"train_loss": -24.2811279296875, "global_step": 238650, "epoch": 2875} {"train_loss": -24.513608932495117, "global_step": 238651, "epoch": 2875} {"train_loss": -24.115734100341797, "global_step": 238652, "epoch": 2875} {"train_loss": -24.24794578552246, "global_step": 238653, "epoch": 2875} {"train_loss": -24.1345272064209, "global_step": 238654, "epoch": 2875} {"train_loss": -24.570810317993164, "global_step": 238655, "epoch": 2875} {"train_loss": -24.24000358581543, "global_step": 238656, "epoch": 2875} {"train_loss": -24.375242233276367, "global_step": 238657, "epoch": 2875} {"train_loss": -24.00580596923828, "global_step": 238658, "epoch": 2875} {"train_loss": -24.354467391967773, "global_step": 238659, "epoch": 2875} {"train_loss": -24.455677032470703, "global_step": 238660, "epoch": 2875} {"train_loss": -24.877851486206055, "global_step": 238661, "epoch": 2875} {"train_loss": -24.5440616607666, "global_step": 238662, "epoch": 2875} {"train_loss": -24.522470474243164, "global_step": 238663, "epoch": 2875} {"train_loss": -24.825416564941406, "global_step": 238664, "epoch": 2875} {"train_loss": -24.6604061126709, "global_step": 238665, "epoch": 2875} {"train_loss": -24.79110336303711, "global_step": 238666, "epoch": 2875} {"train_loss": -24.903358459472656, "global_step": 238667, "epoch": 2875} {"train_loss": -24.76969337463379, "global_step": 238668, "epoch": 2875} {"train_loss": -24.83510398864746, "global_step": 238669, "epoch": 2875} {"train_loss": -24.816537857055664, "global_step": 238670, "epoch": 2875} {"train_loss": -24.832387924194336, "global_step": 238671, "epoch": 2875} {"train_loss": -24.93026351928711, "global_step": 238672, "epoch": 2875} {"train_loss": -24.879409790039062, "global_step": 238673, "epoch": 2875} {"train_loss": -25.15015983581543, "global_step": 238674, "epoch": 2875} {"train_loss": -24.935697555541992, "global_step": 238675, "epoch": 2875} {"train_loss": -24.41400909423828, "global_step": 238676, "epoch": 2875} {"train_loss": -24.94158172607422, "global_step": 238677, "epoch": 2875} {"train_loss": -24.78432273864746, "global_step": 238678, "epoch": 2875} {"train_loss": -25.05180549621582, "global_step": 238679, "epoch": 2875} {"train_loss": -24.80525779724121, "global_step": 238680, "epoch": 2875} {"train_loss": -25.134740829467773, "global_step": 238681, "epoch": 2875} {"train_loss": -24.94264030456543, "global_step": 238682, "epoch": 2875} {"train_loss": -24.98005485534668, "global_step": 238683, "epoch": 2875} {"train_loss": -24.716156005859375, "global_step": 238684, "epoch": 2875} {"train_loss": -24.681589126586914, "global_step": 238685, "epoch": 2875} {"train_loss": -25.40743064880371, "global_step": 238686, "epoch": 2875} {"train_loss": -24.813718795776367, "global_step": 238687, "epoch": 2875} {"train_loss": -25.004791259765625, "global_step": 238688, "epoch": 2875} {"train_loss": -24.618728637695312, "global_step": 238689, "epoch": 2875} {"train_loss": -25.126171112060547, "global_step": 238690, "epoch": 2875} {"train_loss": -24.82793617248535, "global_step": 238691, "epoch": 2875} {"train_loss": -24.915714263916016, "global_step": 238692, "epoch": 2875} {"train_loss": -24.617040634155273, "global_step": 238693, "epoch": 2875} {"train_loss": -24.900602340698242, "global_step": 238694, "epoch": 2875} {"train_loss": -24.818899154663086, "global_step": 238695, "epoch": 2875} {"train_loss": -25.086746215820312, "global_step": 238696, "epoch": 2875} {"train_loss": -24.534889221191406, "global_step": 238697, "epoch": 2875} {"train_loss": -24.909324645996094, "global_step": 238698, "epoch": 2875} {"train_loss": -24.861284255981445, "global_step": 238699, "epoch": 2875} {"train_loss": -24.826148986816406, "global_step": 238700, "epoch": 2875} {"train_loss": -24.986825942993164, "global_step": 238701, "epoch": 2875} {"train_loss": -24.999929428100586, "global_step": 238702, "epoch": 2875} {"train_loss": -25.11279296875, "global_step": 238703, "epoch": 2875} {"train_loss": -24.640045166015625, "global_step": 238704, "epoch": 2875} {"train_loss": -25.056514739990234, "global_step": 238705, "epoch": 2875} {"train_loss": -24.473636627197266, "global_step": 238706, "epoch": 2875} {"train_loss": -24.416378940444396, "global_step": 238707, "epoch": 2875, "val_loss": 6737694.0} {"train_loss": -24.350860595703125, "global_step": 238708, "epoch": 2876} {"train_loss": -23.543432235717773, "global_step": 238709, "epoch": 2876} {"train_loss": -23.146406173706055, "global_step": 238710, "epoch": 2876} {"train_loss": -23.899538040161133, "global_step": 238711, "epoch": 2876} {"train_loss": -23.765775680541992, "global_step": 238712, "epoch": 2876} {"train_loss": -23.446353912353516, "global_step": 238713, "epoch": 2876} {"train_loss": -24.02950096130371, "global_step": 238714, "epoch": 2876} {"train_loss": -24.30301856994629, "global_step": 238715, "epoch": 2876} {"train_loss": -23.824277877807617, "global_step": 238716, "epoch": 2876} {"train_loss": -24.458969116210938, "global_step": 238717, "epoch": 2876} {"train_loss": -23.83466339111328, "global_step": 238718, "epoch": 2876} {"train_loss": -24.092140197753906, "global_step": 238719, "epoch": 2876} {"train_loss": -24.24708366394043, "global_step": 238720, "epoch": 2876} {"train_loss": -24.373804092407227, "global_step": 238721, "epoch": 2876} {"train_loss": -24.526214599609375, "global_step": 238722, "epoch": 2876} {"train_loss": -23.955852508544922, "global_step": 238723, "epoch": 2876} {"train_loss": -24.629613876342773, "global_step": 238724, "epoch": 2876} {"train_loss": -24.476354598999023, "global_step": 238725, "epoch": 2876} {"train_loss": -24.63700294494629, "global_step": 238726, "epoch": 2876} {"train_loss": -24.737136840820312, "global_step": 238727, "epoch": 2876} {"train_loss": -24.368051528930664, "global_step": 238728, "epoch": 2876} {"train_loss": -24.586111068725586, "global_step": 238729, "epoch": 2876} {"train_loss": -24.319860458374023, "global_step": 238730, "epoch": 2876} {"train_loss": -24.396347045898438, "global_step": 238731, "epoch": 2876} {"train_loss": -24.06465721130371, "global_step": 238732, "epoch": 2876} {"train_loss": -24.847768783569336, "global_step": 238733, "epoch": 2876} {"train_loss": -24.703062057495117, "global_step": 238734, "epoch": 2876} {"train_loss": -24.397268295288086, "global_step": 238735, "epoch": 2876} {"train_loss": -24.923965454101562, "global_step": 238736, "epoch": 2876} {"train_loss": -24.909154891967773, "global_step": 238737, "epoch": 2876} {"train_loss": -24.574481964111328, "global_step": 238738, "epoch": 2876} {"train_loss": -24.88747215270996, "global_step": 238739, "epoch": 2876} {"train_loss": -24.619184494018555, "global_step": 238740, "epoch": 2876} {"train_loss": -25.175006866455078, "global_step": 238741, "epoch": 2876} {"train_loss": -25.076276779174805, "global_step": 238742, "epoch": 2876} {"train_loss": -25.094148635864258, "global_step": 238743, "epoch": 2876} {"train_loss": -24.87932777404785, "global_step": 238744, "epoch": 2876} {"train_loss": -25.320058822631836, "global_step": 238745, "epoch": 2876} {"train_loss": -25.038150787353516, "global_step": 238746, "epoch": 2876} {"train_loss": -24.944904327392578, "global_step": 238747, "epoch": 2876} {"train_loss": -24.7707462310791, "global_step": 238748, "epoch": 2876} {"train_loss": -25.147403717041016, "global_step": 238749, "epoch": 2876} {"train_loss": -24.815065383911133, "global_step": 238750, "epoch": 2876} {"train_loss": -25.243459701538086, "global_step": 238751, "epoch": 2876} {"train_loss": -24.7210750579834, "global_step": 238752, "epoch": 2876} {"train_loss": -24.935949325561523, "global_step": 238753, "epoch": 2876} {"train_loss": -25.101789474487305, "global_step": 238754, "epoch": 2876} {"train_loss": -24.926410675048828, "global_step": 238755, "epoch": 2876} {"train_loss": -24.45124626159668, "global_step": 238756, "epoch": 2876} {"train_loss": -25.247133255004883, "global_step": 238757, "epoch": 2876} {"train_loss": -24.869592666625977, "global_step": 238758, "epoch": 2876} {"train_loss": -24.3095760345459, "global_step": 238759, "epoch": 2876} {"train_loss": -23.801259994506836, "global_step": 238760, "epoch": 2876} {"train_loss": -23.79728126525879, "global_step": 238761, "epoch": 2876} {"train_loss": -24.618009567260742, "global_step": 238762, "epoch": 2876} {"train_loss": -24.620779037475586, "global_step": 238763, "epoch": 2876} {"train_loss": -24.641952514648438, "global_step": 238764, "epoch": 2876} {"train_loss": -24.458877563476562, "global_step": 238765, "epoch": 2876} {"train_loss": -24.42284393310547, "global_step": 238766, "epoch": 2876} {"train_loss": -24.470998764038086, "global_step": 238767, "epoch": 2876} {"train_loss": -24.70022964477539, "global_step": 238768, "epoch": 2876} {"train_loss": -24.696212768554688, "global_step": 238769, "epoch": 2876} {"train_loss": -24.563451766967773, "global_step": 238770, "epoch": 2876} {"train_loss": -24.643356323242188, "global_step": 238771, "epoch": 2876} {"train_loss": -24.78045082092285, "global_step": 238772, "epoch": 2876} {"train_loss": -24.910734176635742, "global_step": 238773, "epoch": 2876} {"train_loss": -24.484556198120117, "global_step": 238774, "epoch": 2876} {"train_loss": -24.677255630493164, "global_step": 238775, "epoch": 2876} {"train_loss": -25.154800415039062, "global_step": 238776, "epoch": 2876} {"train_loss": -25.0708065032959, "global_step": 238777, "epoch": 2876} {"train_loss": -24.669382095336914, "global_step": 238778, "epoch": 2876} {"train_loss": -24.804418563842773, "global_step": 238779, "epoch": 2876} {"train_loss": -25.077987670898438, "global_step": 238780, "epoch": 2876} {"train_loss": -24.882911682128906, "global_step": 238781, "epoch": 2876} {"train_loss": -24.811376571655273, "global_step": 238782, "epoch": 2876} {"train_loss": -24.77701759338379, "global_step": 238783, "epoch": 2876} {"train_loss": -25.05365562438965, "global_step": 238784, "epoch": 2876} {"train_loss": -24.529193878173828, "global_step": 238785, "epoch": 2876} {"train_loss": -24.90962791442871, "global_step": 238786, "epoch": 2876} {"train_loss": -24.759531021118164, "global_step": 238787, "epoch": 2876} {"train_loss": -24.906299591064453, "global_step": 238788, "epoch": 2876} {"train_loss": -25.179336547851562, "global_step": 238789, "epoch": 2876} {"train_loss": -24.611301674900286, "global_step": 238790, "epoch": 2876, "val_loss": 6711295.0} {"train_loss": -24.041656494140625, "global_step": 238791, "epoch": 2877} {"train_loss": -23.765501022338867, "global_step": 238792, "epoch": 2877} {"train_loss": -24.82533836364746, "global_step": 238793, "epoch": 2877} {"train_loss": -24.14207649230957, "global_step": 238794, "epoch": 2877} {"train_loss": -24.528539657592773, "global_step": 238795, "epoch": 2877} {"train_loss": -24.32234764099121, "global_step": 238796, "epoch": 2877} {"train_loss": -24.64158821105957, "global_step": 238797, "epoch": 2877} {"train_loss": -24.630659103393555, "global_step": 238798, "epoch": 2877} {"train_loss": -24.65163230895996, "global_step": 238799, "epoch": 2877} {"train_loss": -24.297216415405273, "global_step": 238800, "epoch": 2877} {"train_loss": -24.390960693359375, "global_step": 238801, "epoch": 2877} {"train_loss": -24.523365020751953, "global_step": 238802, "epoch": 2877} {"train_loss": -24.711261749267578, "global_step": 238803, "epoch": 2877} {"train_loss": -24.754329681396484, "global_step": 238804, "epoch": 2877} {"train_loss": -24.752546310424805, "global_step": 238805, "epoch": 2877} {"train_loss": -24.409940719604492, "global_step": 238806, "epoch": 2877} {"train_loss": -24.66675567626953, "global_step": 238807, "epoch": 2877} {"train_loss": -25.007963180541992, "global_step": 238808, "epoch": 2877} {"train_loss": -24.67123794555664, "global_step": 238809, "epoch": 2877} {"train_loss": -24.661916732788086, "global_step": 238810, "epoch": 2877} {"train_loss": -24.486982345581055, "global_step": 238811, "epoch": 2877} {"train_loss": -25.05908966064453, "global_step": 238812, "epoch": 2877} {"train_loss": -24.951337814331055, "global_step": 238813, "epoch": 2877} {"train_loss": -24.68491554260254, "global_step": 238814, "epoch": 2877} {"train_loss": -24.698843002319336, "global_step": 238815, "epoch": 2877} {"train_loss": -25.095109939575195, "global_step": 238816, "epoch": 2877} {"train_loss": -24.961088180541992, "global_step": 238817, "epoch": 2877} {"train_loss": -24.7772274017334, "global_step": 238818, "epoch": 2877} {"train_loss": -24.57577896118164, "global_step": 238819, "epoch": 2877} {"train_loss": -25.023046493530273, "global_step": 238820, "epoch": 2877} {"train_loss": -25.209659576416016, "global_step": 238821, "epoch": 2877} {"train_loss": -25.094480514526367, "global_step": 238822, "epoch": 2877} {"train_loss": -24.936594009399414, "global_step": 238823, "epoch": 2877} {"train_loss": -24.62164878845215, "global_step": 238824, "epoch": 2877} {"train_loss": -24.939157485961914, "global_step": 238825, "epoch": 2877} {"train_loss": -24.97872543334961, "global_step": 238826, "epoch": 2877} {"train_loss": -25.062225341796875, "global_step": 238827, "epoch": 2877} {"train_loss": -25.226041793823242, "global_step": 238828, "epoch": 2877} {"train_loss": -24.920259475708008, "global_step": 238829, "epoch": 2877} {"train_loss": -24.78569221496582, "global_step": 238830, "epoch": 2877} {"train_loss": -25.010618209838867, "global_step": 238831, "epoch": 2877} {"train_loss": -24.730424880981445, "global_step": 238832, "epoch": 2877} {"train_loss": -25.195343017578125, "global_step": 238833, "epoch": 2877} {"train_loss": -24.887083053588867, "global_step": 238834, "epoch": 2877} {"train_loss": -24.8132381439209, "global_step": 238835, "epoch": 2877} {"train_loss": -25.088830947875977, "global_step": 238836, "epoch": 2877} {"train_loss": -24.913272857666016, "global_step": 238837, "epoch": 2877} {"train_loss": -24.92764663696289, "global_step": 238838, "epoch": 2877} {"train_loss": -25.18442153930664, "global_step": 238839, "epoch": 2877} {"train_loss": -24.834980010986328, "global_step": 238840, "epoch": 2877} {"train_loss": -24.82402229309082, "global_step": 238841, "epoch": 2877} {"train_loss": -25.011585235595703, "global_step": 238842, "epoch": 2877} {"train_loss": -24.680498123168945, "global_step": 238843, "epoch": 2877} {"train_loss": -24.866687774658203, "global_step": 238844, "epoch": 2877} {"train_loss": -24.926685333251953, "global_step": 238845, "epoch": 2877} {"train_loss": -24.903858184814453, "global_step": 238846, "epoch": 2877} {"train_loss": -24.59391212463379, "global_step": 238847, "epoch": 2877} {"train_loss": -24.92205238342285, "global_step": 238848, "epoch": 2877} {"train_loss": -24.534326553344727, "global_step": 238849, "epoch": 2877} {"train_loss": -24.468292236328125, "global_step": 238850, "epoch": 2877} {"train_loss": -24.709383010864258, "global_step": 238851, "epoch": 2877} {"train_loss": -25.104782104492188, "global_step": 238852, "epoch": 2877} {"train_loss": -24.73050880432129, "global_step": 238853, "epoch": 2877} {"train_loss": -24.176898956298828, "global_step": 238854, "epoch": 2877} {"train_loss": -25.01057243347168, "global_step": 238855, "epoch": 2877} {"train_loss": -24.43839454650879, "global_step": 238856, "epoch": 2877} {"train_loss": -24.89211082458496, "global_step": 238857, "epoch": 2877} {"train_loss": -23.899211883544922, "global_step": 238858, "epoch": 2877} {"train_loss": -24.297443389892578, "global_step": 238859, "epoch": 2877} {"train_loss": -24.45747184753418, "global_step": 238860, "epoch": 2877} {"train_loss": -24.511199951171875, "global_step": 238861, "epoch": 2877} {"train_loss": -24.642236709594727, "global_step": 238862, "epoch": 2877} {"train_loss": -24.581296920776367, "global_step": 238863, "epoch": 2877} {"train_loss": -24.423044204711914, "global_step": 238864, "epoch": 2877} {"train_loss": -25.053543090820312, "global_step": 238865, "epoch": 2877} {"train_loss": -24.842378616333008, "global_step": 238866, "epoch": 2877} {"train_loss": -24.88882827758789, "global_step": 238867, "epoch": 2877} {"train_loss": -24.652029037475586, "global_step": 238868, "epoch": 2877} {"train_loss": -25.045997619628906, "global_step": 238869, "epoch": 2877} {"train_loss": -24.4251766204834, "global_step": 238870, "epoch": 2877} {"train_loss": -24.675613403320312, "global_step": 238871, "epoch": 2877} {"train_loss": -24.571475982666016, "global_step": 238872, "epoch": 2877} {"train_loss": -24.716508451714574, "global_step": 238873, "epoch": 2877, "val_loss": 6648152.5} {"train_loss": -24.42758560180664, "global_step": 238874, "epoch": 2878} {"train_loss": -24.710693359375, "global_step": 238875, "epoch": 2878} {"train_loss": -24.75876808166504, "global_step": 238876, "epoch": 2878} {"train_loss": -24.443544387817383, "global_step": 238877, "epoch": 2878} {"train_loss": -24.659683227539062, "global_step": 238878, "epoch": 2878} {"train_loss": -24.320419311523438, "global_step": 238879, "epoch": 2878} {"train_loss": -24.52850341796875, "global_step": 238880, "epoch": 2878} {"train_loss": -24.958547592163086, "global_step": 238881, "epoch": 2878} {"train_loss": -24.622724533081055, "global_step": 238882, "epoch": 2878} {"train_loss": -24.766775131225586, "global_step": 238883, "epoch": 2878} {"train_loss": -24.73732566833496, "global_step": 238884, "epoch": 2878} {"train_loss": -24.818904876708984, "global_step": 238885, "epoch": 2878} {"train_loss": -25.04829978942871, "global_step": 238886, "epoch": 2878} {"train_loss": -24.92660903930664, "global_step": 238887, "epoch": 2878} {"train_loss": -24.99347496032715, "global_step": 238888, "epoch": 2878} {"train_loss": -25.203927993774414, "global_step": 238889, "epoch": 2878} {"train_loss": -24.936872482299805, "global_step": 238890, "epoch": 2878} {"train_loss": -24.803647994995117, "global_step": 238891, "epoch": 2878} {"train_loss": -24.918048858642578, "global_step": 238892, "epoch": 2878} {"train_loss": -24.979644775390625, "global_step": 238893, "epoch": 2878} {"train_loss": -24.820310592651367, "global_step": 238894, "epoch": 2878} {"train_loss": -25.310836791992188, "global_step": 238895, "epoch": 2878} {"train_loss": -25.236974716186523, "global_step": 238896, "epoch": 2878} {"train_loss": -24.795490264892578, "global_step": 238897, "epoch": 2878} {"train_loss": -25.07040786743164, "global_step": 238898, "epoch": 2878} {"train_loss": -25.043031692504883, "global_step": 238899, "epoch": 2878} {"train_loss": -24.748350143432617, "global_step": 238900, "epoch": 2878} {"train_loss": -25.158876419067383, "global_step": 238901, "epoch": 2878} {"train_loss": -24.977479934692383, "global_step": 238902, "epoch": 2878} {"train_loss": -24.736309051513672, "global_step": 238903, "epoch": 2878} {"train_loss": -24.735219955444336, "global_step": 238904, "epoch": 2878} {"train_loss": -24.754179000854492, "global_step": 238905, "epoch": 2878} {"train_loss": -24.850549697875977, "global_step": 238906, "epoch": 2878} {"train_loss": -24.77019691467285, "global_step": 238907, "epoch": 2878} {"train_loss": -25.00405502319336, "global_step": 238908, "epoch": 2878} {"train_loss": -24.632492065429688, "global_step": 238909, "epoch": 2878} {"train_loss": -25.017244338989258, "global_step": 238910, "epoch": 2878} {"train_loss": -24.717660903930664, "global_step": 238911, "epoch": 2878} {"train_loss": -24.76462745666504, "global_step": 238912, "epoch": 2878} {"train_loss": -24.92850685119629, "global_step": 238913, "epoch": 2878} {"train_loss": -25.16297721862793, "global_step": 238914, "epoch": 2878} {"train_loss": -24.58643341064453, "global_step": 238915, "epoch": 2878} {"train_loss": -24.419666290283203, "global_step": 238916, "epoch": 2878} {"train_loss": -25.085617065429688, "global_step": 238917, "epoch": 2878} {"train_loss": -24.906801223754883, "global_step": 238918, "epoch": 2878} {"train_loss": -24.833148956298828, "global_step": 238919, "epoch": 2878} {"train_loss": -24.745494842529297, "global_step": 238920, "epoch": 2878} {"train_loss": -24.55575942993164, "global_step": 238921, "epoch": 2878} {"train_loss": -25.086740493774414, "global_step": 238922, "epoch": 2878} {"train_loss": -24.820907592773438, "global_step": 238923, "epoch": 2878} {"train_loss": -24.59987449645996, "global_step": 238924, "epoch": 2878} {"train_loss": -24.65785789489746, "global_step": 238925, "epoch": 2878} {"train_loss": -25.06273078918457, "global_step": 238926, "epoch": 2878} {"train_loss": -24.91437339782715, "global_step": 238927, "epoch": 2878} {"train_loss": -24.96341323852539, "global_step": 238928, "epoch": 2878} {"train_loss": -24.43703269958496, "global_step": 238929, "epoch": 2878} {"train_loss": -24.958707809448242, "global_step": 238930, "epoch": 2878} {"train_loss": -24.766759872436523, "global_step": 238931, "epoch": 2878} {"train_loss": -24.421157836914062, "global_step": 238932, "epoch": 2878} {"train_loss": -24.72291374206543, "global_step": 238933, "epoch": 2878} {"train_loss": -24.85091209411621, "global_step": 238934, "epoch": 2878} {"train_loss": -24.758512496948242, "global_step": 238935, "epoch": 2878} {"train_loss": -24.972084045410156, "global_step": 238936, "epoch": 2878} {"train_loss": -24.48992156982422, "global_step": 238937, "epoch": 2878} {"train_loss": -24.5775203704834, "global_step": 238938, "epoch": 2878} {"train_loss": -24.522634506225586, "global_step": 238939, "epoch": 2878} {"train_loss": -24.659494400024414, "global_step": 238940, "epoch": 2878} {"train_loss": -24.645421981811523, "global_step": 238941, "epoch": 2878} {"train_loss": -25.041954040527344, "global_step": 238942, "epoch": 2878} {"train_loss": -24.70271873474121, "global_step": 238943, "epoch": 2878} {"train_loss": -25.01285743713379, "global_step": 238944, "epoch": 2878} {"train_loss": -24.854778289794922, "global_step": 238945, "epoch": 2878} {"train_loss": -25.014135360717773, "global_step": 238946, "epoch": 2878} {"train_loss": -24.539962768554688, "global_step": 238947, "epoch": 2878} {"train_loss": -24.757068634033203, "global_step": 238948, "epoch": 2878} {"train_loss": -24.784576416015625, "global_step": 238949, "epoch": 2878} {"train_loss": -24.749208450317383, "global_step": 238950, "epoch": 2878} {"train_loss": -24.783933639526367, "global_step": 238951, "epoch": 2878} {"train_loss": -24.93577003479004, "global_step": 238952, "epoch": 2878} {"train_loss": -24.93642234802246, "global_step": 238953, "epoch": 2878} {"train_loss": -25.013330459594727, "global_step": 238954, "epoch": 2878} {"train_loss": -24.527938842773438, "global_step": 238955, "epoch": 2878} {"train_loss": -24.815791279436596, "global_step": 238956, "epoch": 2878, "val_loss": 6776035.0} {"train_loss": -24.490468978881836, "global_step": 238957, "epoch": 2879} {"train_loss": -24.253925323486328, "global_step": 238958, "epoch": 2879} {"train_loss": -24.058454513549805, "global_step": 238959, "epoch": 2879} {"train_loss": -24.414752960205078, "global_step": 238960, "epoch": 2879} {"train_loss": -24.453489303588867, "global_step": 238961, "epoch": 2879} {"train_loss": -24.243820190429688, "global_step": 238962, "epoch": 2879} {"train_loss": -24.64960289001465, "global_step": 238963, "epoch": 2879} {"train_loss": -24.723840713500977, "global_step": 238964, "epoch": 2879} {"train_loss": -24.36156463623047, "global_step": 238965, "epoch": 2879} {"train_loss": -24.330581665039062, "global_step": 238966, "epoch": 2879} {"train_loss": -24.598058700561523, "global_step": 238967, "epoch": 2879} {"train_loss": -24.290767669677734, "global_step": 238968, "epoch": 2879} {"train_loss": -25.111623764038086, "global_step": 238969, "epoch": 2879} {"train_loss": -24.664541244506836, "global_step": 238970, "epoch": 2879} {"train_loss": -24.777408599853516, "global_step": 238971, "epoch": 2879} {"train_loss": -24.858238220214844, "global_step": 238972, "epoch": 2879} {"train_loss": -24.707422256469727, "global_step": 238973, "epoch": 2879} {"train_loss": -24.83295249938965, "global_step": 238974, "epoch": 2879} {"train_loss": -24.475513458251953, "global_step": 238975, "epoch": 2879} {"train_loss": -25.041330337524414, "global_step": 238976, "epoch": 2879} {"train_loss": -24.84137535095215, "global_step": 238977, "epoch": 2879} {"train_loss": -24.85638999938965, "global_step": 238978, "epoch": 2879} {"train_loss": -24.96486473083496, "global_step": 238979, "epoch": 2879} {"train_loss": -24.951475143432617, "global_step": 238980, "epoch": 2879} {"train_loss": -25.044038772583008, "global_step": 238981, "epoch": 2879} {"train_loss": -24.60919189453125, "global_step": 238982, "epoch": 2879} {"train_loss": -24.79036521911621, "global_step": 238983, "epoch": 2879} {"train_loss": -24.965444564819336, "global_step": 238984, "epoch": 2879} {"train_loss": -25.107547760009766, "global_step": 238985, "epoch": 2879} {"train_loss": -24.90182876586914, "global_step": 238986, "epoch": 2879} {"train_loss": -24.74257469177246, "global_step": 238987, "epoch": 2879} {"train_loss": -24.681737899780273, "global_step": 238988, "epoch": 2879} {"train_loss": -25.020854949951172, "global_step": 238989, "epoch": 2879} {"train_loss": -25.54534339904785, "global_step": 238990, "epoch": 2879} {"train_loss": -24.970605850219727, "global_step": 238991, "epoch": 2879} {"train_loss": -24.341541290283203, "global_step": 238992, "epoch": 2879} {"train_loss": -24.752111434936523, "global_step": 238993, "epoch": 2879} {"train_loss": -25.08045196533203, "global_step": 238994, "epoch": 2879} {"train_loss": -24.96307945251465, "global_step": 238995, "epoch": 2879} {"train_loss": -25.056655883789062, "global_step": 238996, "epoch": 2879} {"train_loss": -24.995601654052734, "global_step": 238997, "epoch": 2879} {"train_loss": -24.751922607421875, "global_step": 238998, "epoch": 2879} {"train_loss": -24.840438842773438, "global_step": 238999, "epoch": 2879} {"train_loss": -25.177663803100586, "global_step": 239000, "epoch": 2879} {"train_loss": -24.386178970336914, "global_step": 239001, "epoch": 2879} {"train_loss": -25.008655548095703, "global_step": 239002, "epoch": 2879} {"train_loss": -25.10670280456543, "global_step": 239003, "epoch": 2879} {"train_loss": -25.37385368347168, "global_step": 239004, "epoch": 2879} {"train_loss": -24.342119216918945, "global_step": 239005, "epoch": 2879} {"train_loss": -24.90582847595215, "global_step": 239006, "epoch": 2879} {"train_loss": -25.21525001525879, "global_step": 239007, "epoch": 2879} {"train_loss": -24.933881759643555, "global_step": 239008, "epoch": 2879} {"train_loss": -24.82856559753418, "global_step": 239009, "epoch": 2879} {"train_loss": -24.928321838378906, "global_step": 239010, "epoch": 2879} {"train_loss": -24.903884887695312, "global_step": 239011, "epoch": 2879} {"train_loss": -25.05915641784668, "global_step": 239012, "epoch": 2879} {"train_loss": -25.09771156311035, "global_step": 239013, "epoch": 2879} {"train_loss": -24.784286499023438, "global_step": 239014, "epoch": 2879} {"train_loss": -24.8662109375, "global_step": 239015, "epoch": 2879} {"train_loss": -24.8903865814209, "global_step": 239016, "epoch": 2879} {"train_loss": -25.026578903198242, "global_step": 239017, "epoch": 2879} {"train_loss": -25.058063507080078, "global_step": 239018, "epoch": 2879} {"train_loss": -24.950063705444336, "global_step": 239019, "epoch": 2879} {"train_loss": -25.0275821685791, "global_step": 239020, "epoch": 2879} {"train_loss": -25.057373046875, "global_step": 239021, "epoch": 2879} {"train_loss": -24.765588760375977, "global_step": 239022, "epoch": 2879} {"train_loss": -24.699737548828125, "global_step": 239023, "epoch": 2879} {"train_loss": -24.922225952148438, "global_step": 239024, "epoch": 2879} {"train_loss": -25.0470027923584, "global_step": 239025, "epoch": 2879} {"train_loss": -25.302459716796875, "global_step": 239026, "epoch": 2879} {"train_loss": -25.111257553100586, "global_step": 239027, "epoch": 2879} {"train_loss": -24.935260772705078, "global_step": 239028, "epoch": 2879} {"train_loss": -24.913572311401367, "global_step": 239029, "epoch": 2879} {"train_loss": -25.191715240478516, "global_step": 239030, "epoch": 2879} {"train_loss": -24.99261474609375, "global_step": 239031, "epoch": 2879} {"train_loss": -25.599868774414062, "global_step": 239032, "epoch": 2879} {"train_loss": -24.904321670532227, "global_step": 239033, "epoch": 2879} {"train_loss": -24.91584587097168, "global_step": 239034, "epoch": 2879} {"train_loss": -24.678499221801758, "global_step": 239035, "epoch": 2879} {"train_loss": -24.46207618713379, "global_step": 239036, "epoch": 2879} {"train_loss": -24.57988166809082, "global_step": 239037, "epoch": 2879} {"train_loss": -25.084686279296875, "global_step": 239038, "epoch": 2879} {"train_loss": -24.822598055184606, "global_step": 239039, "epoch": 2879, "val_loss": 6787123.5} {"train_loss": -24.50544548034668, "global_step": 239040, "epoch": 2880} {"train_loss": -23.856184005737305, "global_step": 239041, "epoch": 2880} {"train_loss": -24.06717300415039, "global_step": 239042, "epoch": 2880} {"train_loss": -24.196414947509766, "global_step": 239043, "epoch": 2880} {"train_loss": -24.28825569152832, "global_step": 239044, "epoch": 2880} {"train_loss": -24.222673416137695, "global_step": 239045, "epoch": 2880} {"train_loss": -24.54599952697754, "global_step": 239046, "epoch": 2880} {"train_loss": -24.791013717651367, "global_step": 239047, "epoch": 2880} {"train_loss": -24.414188385009766, "global_step": 239048, "epoch": 2880} {"train_loss": -24.74456787109375, "global_step": 239049, "epoch": 2880} {"train_loss": -24.893980026245117, "global_step": 239050, "epoch": 2880} {"train_loss": -24.71949577331543, "global_step": 239051, "epoch": 2880} {"train_loss": -24.80027961730957, "global_step": 239052, "epoch": 2880} {"train_loss": -24.50775146484375, "global_step": 239053, "epoch": 2880} {"train_loss": -24.751876831054688, "global_step": 239054, "epoch": 2880} {"train_loss": -24.449609756469727, "global_step": 239055, "epoch": 2880} {"train_loss": -24.364355087280273, "global_step": 239056, "epoch": 2880} {"train_loss": -24.851003646850586, "global_step": 239057, "epoch": 2880} {"train_loss": -25.16438865661621, "global_step": 239058, "epoch": 2880} {"train_loss": -24.739187240600586, "global_step": 239059, "epoch": 2880} {"train_loss": -24.593143463134766, "global_step": 239060, "epoch": 2880} {"train_loss": -24.46659278869629, "global_step": 239061, "epoch": 2880} {"train_loss": -24.87717056274414, "global_step": 239062, "epoch": 2880} {"train_loss": -24.778757095336914, "global_step": 239063, "epoch": 2880} {"train_loss": -24.572444915771484, "global_step": 239064, "epoch": 2880} {"train_loss": -24.765642166137695, "global_step": 239065, "epoch": 2880} {"train_loss": -24.960607528686523, "global_step": 239066, "epoch": 2880} {"train_loss": -24.889360427856445, "global_step": 239067, "epoch": 2880} {"train_loss": -24.750961303710938, "global_step": 239068, "epoch": 2880} {"train_loss": -24.66117286682129, "global_step": 239069, "epoch": 2880} {"train_loss": -24.676603317260742, "global_step": 239070, "epoch": 2880} {"train_loss": -24.77833366394043, "global_step": 239071, "epoch": 2880} {"train_loss": -24.763225555419922, "global_step": 239072, "epoch": 2880} {"train_loss": -24.616119384765625, "global_step": 239073, "epoch": 2880} {"train_loss": -24.645328521728516, "global_step": 239074, "epoch": 2880} {"train_loss": -25.14071273803711, "global_step": 239075, "epoch": 2880} {"train_loss": -25.27263641357422, "global_step": 239076, "epoch": 2880} {"train_loss": -25.198904037475586, "global_step": 239077, "epoch": 2880} {"train_loss": -24.695451736450195, "global_step": 239078, "epoch": 2880} {"train_loss": -24.81717300415039, "global_step": 239079, "epoch": 2880} {"train_loss": -24.954195022583008, "global_step": 239080, "epoch": 2880} {"train_loss": -24.58917808532715, "global_step": 239081, "epoch": 2880} {"train_loss": -24.812326431274414, "global_step": 239082, "epoch": 2880} {"train_loss": -24.885116577148438, "global_step": 239083, "epoch": 2880} {"train_loss": -24.89473533630371, "global_step": 239084, "epoch": 2880} {"train_loss": -25.00043296813965, "global_step": 239085, "epoch": 2880} {"train_loss": -24.920644760131836, "global_step": 239086, "epoch": 2880} {"train_loss": -25.154306411743164, "global_step": 239087, "epoch": 2880} {"train_loss": -24.876081466674805, "global_step": 239088, "epoch": 2880} {"train_loss": -24.883743286132812, "global_step": 239089, "epoch": 2880} {"train_loss": -24.90926742553711, "global_step": 239090, "epoch": 2880} {"train_loss": -24.82207679748535, "global_step": 239091, "epoch": 2880} {"train_loss": -25.213953018188477, "global_step": 239092, "epoch": 2880} {"train_loss": -24.743906021118164, "global_step": 239093, "epoch": 2880} {"train_loss": -24.809051513671875, "global_step": 239094, "epoch": 2880} {"train_loss": -24.76643943786621, "global_step": 239095, "epoch": 2880} {"train_loss": -25.307571411132812, "global_step": 239096, "epoch": 2880} {"train_loss": -24.961074829101562, "global_step": 239097, "epoch": 2880} {"train_loss": -25.007421493530273, "global_step": 239098, "epoch": 2880} {"train_loss": -25.559728622436523, "global_step": 239099, "epoch": 2880} {"train_loss": -24.728824615478516, "global_step": 239100, "epoch": 2880} {"train_loss": -24.837377548217773, "global_step": 239101, "epoch": 2880} {"train_loss": -25.281396865844727, "global_step": 239102, "epoch": 2880} {"train_loss": -25.01045799255371, "global_step": 239103, "epoch": 2880} {"train_loss": -25.14821434020996, "global_step": 239104, "epoch": 2880} {"train_loss": -25.260299682617188, "global_step": 239105, "epoch": 2880} {"train_loss": -25.47183609008789, "global_step": 239106, "epoch": 2880} {"train_loss": -24.786924362182617, "global_step": 239107, "epoch": 2880} {"train_loss": -25.074481964111328, "global_step": 239108, "epoch": 2880} {"train_loss": -25.05137062072754, "global_step": 239109, "epoch": 2880} {"train_loss": -24.922386169433594, "global_step": 239110, "epoch": 2880} {"train_loss": -24.846723556518555, "global_step": 239111, "epoch": 2880} {"train_loss": -25.14055824279785, "global_step": 239112, "epoch": 2880} {"train_loss": -24.756406784057617, "global_step": 239113, "epoch": 2880} {"train_loss": -24.963232040405273, "global_step": 239114, "epoch": 2880} {"train_loss": -24.613906860351562, "global_step": 239115, "epoch": 2880} {"train_loss": -24.730913162231445, "global_step": 239116, "epoch": 2880} {"train_loss": -25.095422744750977, "global_step": 239117, "epoch": 2880} {"train_loss": -25.015867233276367, "global_step": 239118, "epoch": 2880} {"train_loss": -24.95998191833496, "global_step": 239119, "epoch": 2880} {"train_loss": -24.925901412963867, "global_step": 239120, "epoch": 2880} {"train_loss": -24.949100494384766, "global_step": 239121, "epoch": 2880} {"train_loss": -24.82089431027332, "global_step": 239122, "epoch": 2880, "val_loss": 6682674.0} {"train_loss": -24.303741455078125, "global_step": 239123, "epoch": 2881} {"train_loss": -24.494457244873047, "global_step": 239124, "epoch": 2881} {"train_loss": -24.249692916870117, "global_step": 239125, "epoch": 2881} {"train_loss": -24.037425994873047, "global_step": 239126, "epoch": 2881} {"train_loss": -24.26639175415039, "global_step": 239127, "epoch": 2881} {"train_loss": -24.158246994018555, "global_step": 239128, "epoch": 2881} {"train_loss": -24.153060913085938, "global_step": 239129, "epoch": 2881} {"train_loss": -24.65627098083496, "global_step": 239130, "epoch": 2881} {"train_loss": -24.253446578979492, "global_step": 239131, "epoch": 2881} {"train_loss": -24.357757568359375, "global_step": 239132, "epoch": 2881} {"train_loss": -24.674121856689453, "global_step": 239133, "epoch": 2881} {"train_loss": -24.3031005859375, "global_step": 239134, "epoch": 2881} {"train_loss": -24.44590950012207, "global_step": 239135, "epoch": 2881} {"train_loss": -24.703588485717773, "global_step": 239136, "epoch": 2881} {"train_loss": -24.564878463745117, "global_step": 239137, "epoch": 2881} {"train_loss": -24.78742027282715, "global_step": 239138, "epoch": 2881} {"train_loss": -24.90215492248535, "global_step": 239139, "epoch": 2881} {"train_loss": -24.786863327026367, "global_step": 239140, "epoch": 2881} {"train_loss": -24.61565399169922, "global_step": 239141, "epoch": 2881} {"train_loss": -24.417722702026367, "global_step": 239142, "epoch": 2881} {"train_loss": -24.570423126220703, "global_step": 239143, "epoch": 2881} {"train_loss": -24.38925552368164, "global_step": 239144, "epoch": 2881} {"train_loss": -24.746366500854492, "global_step": 239145, "epoch": 2881} {"train_loss": -24.82724952697754, "global_step": 239146, "epoch": 2881} {"train_loss": -25.049484252929688, "global_step": 239147, "epoch": 2881} {"train_loss": -24.846845626831055, "global_step": 239148, "epoch": 2881} {"train_loss": -24.649831771850586, "global_step": 239149, "epoch": 2881} {"train_loss": -24.439228057861328, "global_step": 239150, "epoch": 2881} {"train_loss": -24.74590301513672, "global_step": 239151, "epoch": 2881} {"train_loss": -24.67467498779297, "global_step": 239152, "epoch": 2881} {"train_loss": -24.835241317749023, "global_step": 239153, "epoch": 2881} {"train_loss": -24.9698543548584, "global_step": 239154, "epoch": 2881} {"train_loss": -24.69951820373535, "global_step": 239155, "epoch": 2881} {"train_loss": -24.959014892578125, "global_step": 239156, "epoch": 2881} {"train_loss": -24.86919593811035, "global_step": 239157, "epoch": 2881} {"train_loss": -25.191335678100586, "global_step": 239158, "epoch": 2881} {"train_loss": -24.693098068237305, "global_step": 239159, "epoch": 2881} {"train_loss": -25.30914878845215, "global_step": 239160, "epoch": 2881} {"train_loss": -24.93669319152832, "global_step": 239161, "epoch": 2881} {"train_loss": -25.264972686767578, "global_step": 239162, "epoch": 2881} {"train_loss": -24.904279708862305, "global_step": 239163, "epoch": 2881} {"train_loss": -24.832822799682617, "global_step": 239164, "epoch": 2881} {"train_loss": -25.241390228271484, "global_step": 239165, "epoch": 2881} {"train_loss": -25.033876419067383, "global_step": 239166, "epoch": 2881} {"train_loss": -25.092437744140625, "global_step": 239167, "epoch": 2881} {"train_loss": -24.956552505493164, "global_step": 239168, "epoch": 2881} {"train_loss": -24.972354888916016, "global_step": 239169, "epoch": 2881} {"train_loss": -24.917245864868164, "global_step": 239170, "epoch": 2881} {"train_loss": -25.007774353027344, "global_step": 239171, "epoch": 2881} {"train_loss": -25.27256965637207, "global_step": 239172, "epoch": 2881} {"train_loss": -24.938486099243164, "global_step": 239173, "epoch": 2881} {"train_loss": -24.86785888671875, "global_step": 239174, "epoch": 2881} {"train_loss": -24.53463363647461, "global_step": 239175, "epoch": 2881} {"train_loss": -24.707252502441406, "global_step": 239176, "epoch": 2881} {"train_loss": -24.85349464416504, "global_step": 239177, "epoch": 2881} {"train_loss": -24.766407012939453, "global_step": 239178, "epoch": 2881} {"train_loss": -24.806331634521484, "global_step": 239179, "epoch": 2881} {"train_loss": -25.121076583862305, "global_step": 239180, "epoch": 2881} {"train_loss": -25.089435577392578, "global_step": 239181, "epoch": 2881} {"train_loss": -24.470462799072266, "global_step": 239182, "epoch": 2881} {"train_loss": -25.060043334960938, "global_step": 239183, "epoch": 2881} {"train_loss": -24.64557647705078, "global_step": 239184, "epoch": 2881} {"train_loss": -24.487995147705078, "global_step": 239185, "epoch": 2881} {"train_loss": -24.88825035095215, "global_step": 239186, "epoch": 2881} {"train_loss": -24.833349227905273, "global_step": 239187, "epoch": 2881} {"train_loss": -24.739166259765625, "global_step": 239188, "epoch": 2881} {"train_loss": -24.652969360351562, "global_step": 239189, "epoch": 2881} {"train_loss": -24.97943687438965, "global_step": 239190, "epoch": 2881} {"train_loss": -24.863815307617188, "global_step": 239191, "epoch": 2881} {"train_loss": -24.767152786254883, "global_step": 239192, "epoch": 2881} {"train_loss": -24.8402042388916, "global_step": 239193, "epoch": 2881} {"train_loss": -24.636960983276367, "global_step": 239194, "epoch": 2881} {"train_loss": -25.152908325195312, "global_step": 239195, "epoch": 2881} {"train_loss": -24.890789031982422, "global_step": 239196, "epoch": 2881} {"train_loss": -24.706954956054688, "global_step": 239197, "epoch": 2881} {"train_loss": -25.386281967163086, "global_step": 239198, "epoch": 2881} {"train_loss": -24.938562393188477, "global_step": 239199, "epoch": 2881} {"train_loss": -24.846097946166992, "global_step": 239200, "epoch": 2881} {"train_loss": -25.117767333984375, "global_step": 239201, "epoch": 2881} {"train_loss": -25.074167251586914, "global_step": 239202, "epoch": 2881} {"train_loss": -25.004714965820312, "global_step": 239203, "epoch": 2881} {"train_loss": -24.587026596069336, "global_step": 239204, "epoch": 2881} {"train_loss": -24.78205239629171, "global_step": 239205, "epoch": 2881, "val_loss": 6804337.5} {"train_loss": -24.823429107666016, "global_step": 239206, "epoch": 2882} {"train_loss": -24.483890533447266, "global_step": 239207, "epoch": 2882} {"train_loss": -24.478296279907227, "global_step": 239208, "epoch": 2882} {"train_loss": -24.05560302734375, "global_step": 239209, "epoch": 2882} {"train_loss": -24.235454559326172, "global_step": 239210, "epoch": 2882} {"train_loss": -23.754770278930664, "global_step": 239211, "epoch": 2882} {"train_loss": -24.218639373779297, "global_step": 239212, "epoch": 2882} {"train_loss": -24.289281845092773, "global_step": 239213, "epoch": 2882} {"train_loss": -24.646312713623047, "global_step": 239214, "epoch": 2882} {"train_loss": -24.19290542602539, "global_step": 239215, "epoch": 2882} {"train_loss": -24.22117805480957, "global_step": 239216, "epoch": 2882} {"train_loss": -24.532304763793945, "global_step": 239217, "epoch": 2882} {"train_loss": -24.245492935180664, "global_step": 239218, "epoch": 2882} {"train_loss": -24.331228256225586, "global_step": 239219, "epoch": 2882} {"train_loss": -24.430768966674805, "global_step": 239220, "epoch": 2882} {"train_loss": -24.565641403198242, "global_step": 239221, "epoch": 2882} {"train_loss": -24.61252784729004, "global_step": 239222, "epoch": 2882} {"train_loss": -24.810914993286133, "global_step": 239223, "epoch": 2882} {"train_loss": -24.786649703979492, "global_step": 239224, "epoch": 2882} {"train_loss": -24.891754150390625, "global_step": 239225, "epoch": 2882} {"train_loss": -24.823158264160156, "global_step": 239226, "epoch": 2882} {"train_loss": -24.49055290222168, "global_step": 239227, "epoch": 2882} {"train_loss": -24.579185485839844, "global_step": 239228, "epoch": 2882} {"train_loss": -24.586740493774414, "global_step": 239229, "epoch": 2882} {"train_loss": -24.9014892578125, "global_step": 239230, "epoch": 2882} {"train_loss": -25.09518814086914, "global_step": 239231, "epoch": 2882} {"train_loss": -24.693422317504883, "global_step": 239232, "epoch": 2882} {"train_loss": -24.77520751953125, "global_step": 239233, "epoch": 2882} {"train_loss": -24.805227279663086, "global_step": 239234, "epoch": 2882} {"train_loss": -24.865659713745117, "global_step": 239235, "epoch": 2882} {"train_loss": -24.82732391357422, "global_step": 239236, "epoch": 2882} {"train_loss": -24.81332778930664, "global_step": 239237, "epoch": 2882} {"train_loss": -24.954313278198242, "global_step": 239238, "epoch": 2882} {"train_loss": -25.038806915283203, "global_step": 239239, "epoch": 2882} {"train_loss": -25.076858520507812, "global_step": 239240, "epoch": 2882} {"train_loss": -25.15226173400879, "global_step": 239241, "epoch": 2882} {"train_loss": -24.74127769470215, "global_step": 239242, "epoch": 2882} {"train_loss": -25.08978271484375, "global_step": 239243, "epoch": 2882} {"train_loss": -24.7797794342041, "global_step": 239244, "epoch": 2882} {"train_loss": -25.101619720458984, "global_step": 239245, "epoch": 2882} {"train_loss": -25.37238883972168, "global_step": 239246, "epoch": 2882} {"train_loss": -25.153831481933594, "global_step": 239247, "epoch": 2882} {"train_loss": -25.072582244873047, "global_step": 239248, "epoch": 2882} {"train_loss": -24.925485610961914, "global_step": 239249, "epoch": 2882} {"train_loss": -25.075321197509766, "global_step": 239250, "epoch": 2882} {"train_loss": -25.027481079101562, "global_step": 239251, "epoch": 2882} {"train_loss": -25.16560935974121, "global_step": 239252, "epoch": 2882} {"train_loss": -24.875783920288086, "global_step": 239253, "epoch": 2882} {"train_loss": -24.794919967651367, "global_step": 239254, "epoch": 2882} {"train_loss": -25.044034957885742, "global_step": 239255, "epoch": 2882} {"train_loss": -24.945524215698242, "global_step": 239256, "epoch": 2882} {"train_loss": -24.925434112548828, "global_step": 239257, "epoch": 2882} {"train_loss": -25.23801040649414, "global_step": 239258, "epoch": 2882} {"train_loss": -24.996793746948242, "global_step": 239259, "epoch": 2882} {"train_loss": -25.044389724731445, "global_step": 239260, "epoch": 2882} {"train_loss": -25.01945686340332, "global_step": 239261, "epoch": 2882} {"train_loss": -25.066556930541992, "global_step": 239262, "epoch": 2882} {"train_loss": -25.00736427307129, "global_step": 239263, "epoch": 2882} {"train_loss": -24.83689308166504, "global_step": 239264, "epoch": 2882} {"train_loss": -25.24912452697754, "global_step": 239265, "epoch": 2882} {"train_loss": -24.867538452148438, "global_step": 239266, "epoch": 2882} {"train_loss": -24.47254753112793, "global_step": 239267, "epoch": 2882} {"train_loss": -23.77324867248535, "global_step": 239268, "epoch": 2882} {"train_loss": -24.3230037689209, "global_step": 239269, "epoch": 2882} {"train_loss": -24.581615447998047, "global_step": 239270, "epoch": 2882} {"train_loss": -24.81337547302246, "global_step": 239271, "epoch": 2882} {"train_loss": -24.479602813720703, "global_step": 239272, "epoch": 2882} {"train_loss": -24.587915420532227, "global_step": 239273, "epoch": 2882} {"train_loss": -24.50919532775879, "global_step": 239274, "epoch": 2882} {"train_loss": -24.61397361755371, "global_step": 239275, "epoch": 2882} {"train_loss": -24.357412338256836, "global_step": 239276, "epoch": 2882} {"train_loss": -24.889150619506836, "global_step": 239277, "epoch": 2882} {"train_loss": -24.546981811523438, "global_step": 239278, "epoch": 2882} {"train_loss": -24.623750686645508, "global_step": 239279, "epoch": 2882} {"train_loss": -24.781354904174805, "global_step": 239280, "epoch": 2882} {"train_loss": -24.76333999633789, "global_step": 239281, "epoch": 2882} {"train_loss": -24.314517974853516, "global_step": 239282, "epoch": 2882} {"train_loss": -24.856496810913086, "global_step": 239283, "epoch": 2882} {"train_loss": -24.750394821166992, "global_step": 239284, "epoch": 2882} {"train_loss": -24.94257164001465, "global_step": 239285, "epoch": 2882} {"train_loss": -24.68949317932129, "global_step": 239286, "epoch": 2882} {"train_loss": -25.185007095336914, "global_step": 239287, "epoch": 2882} {"train_loss": -24.730288310223315, "global_step": 239288, "epoch": 2882, "val_loss": 6866861.0} {"train_loss": -24.51092529296875, "global_step": 239289, "epoch": 2883} {"train_loss": -24.59161949157715, "global_step": 239290, "epoch": 2883} {"train_loss": -24.85483741760254, "global_step": 239291, "epoch": 2883} {"train_loss": -24.82175064086914, "global_step": 239292, "epoch": 2883} {"train_loss": -24.677257537841797, "global_step": 239293, "epoch": 2883} {"train_loss": -24.78778076171875, "global_step": 239294, "epoch": 2883} {"train_loss": -24.5244083404541, "global_step": 239295, "epoch": 2883} {"train_loss": -24.91559410095215, "global_step": 239296, "epoch": 2883} {"train_loss": -24.121999740600586, "global_step": 239297, "epoch": 2883} {"train_loss": -25.116817474365234, "global_step": 239298, "epoch": 2883} {"train_loss": -24.589279174804688, "global_step": 239299, "epoch": 2883} {"train_loss": -24.603073120117188, "global_step": 239300, "epoch": 2883} {"train_loss": -24.77894401550293, "global_step": 239301, "epoch": 2883} {"train_loss": -24.822053909301758, "global_step": 239302, "epoch": 2883} {"train_loss": -24.73322105407715, "global_step": 239303, "epoch": 2883} {"train_loss": -24.54961585998535, "global_step": 239304, "epoch": 2883} {"train_loss": -24.969297409057617, "global_step": 239305, "epoch": 2883} {"train_loss": -24.980497360229492, "global_step": 239306, "epoch": 2883} {"train_loss": -24.9215145111084, "global_step": 239307, "epoch": 2883} {"train_loss": -25.1269588470459, "global_step": 239308, "epoch": 2883} {"train_loss": -24.930246353149414, "global_step": 239309, "epoch": 2883} {"train_loss": -24.68813705444336, "global_step": 239310, "epoch": 2883} {"train_loss": -24.944936752319336, "global_step": 239311, "epoch": 2883} {"train_loss": -25.07059097290039, "global_step": 239312, "epoch": 2883} {"train_loss": -24.761850357055664, "global_step": 239313, "epoch": 2883} {"train_loss": -24.909957885742188, "global_step": 239314, "epoch": 2883} {"train_loss": -24.989547729492188, "global_step": 239315, "epoch": 2883} {"train_loss": -25.091991424560547, "global_step": 239316, "epoch": 2883} {"train_loss": -25.15244483947754, "global_step": 239317, "epoch": 2883} {"train_loss": -24.7659912109375, "global_step": 239318, "epoch": 2883} {"train_loss": -24.826168060302734, "global_step": 239319, "epoch": 2883} {"train_loss": -24.392004013061523, "global_step": 239320, "epoch": 2883} {"train_loss": -25.19312858581543, "global_step": 239321, "epoch": 2883} {"train_loss": -25.210824966430664, "global_step": 239322, "epoch": 2883} {"train_loss": -24.62881088256836, "global_step": 239323, "epoch": 2883} {"train_loss": -24.955839157104492, "global_step": 239324, "epoch": 2883} {"train_loss": -25.238021850585938, "global_step": 239325, "epoch": 2883} {"train_loss": -25.152387619018555, "global_step": 239326, "epoch": 2883} {"train_loss": -25.282426834106445, "global_step": 239327, "epoch": 2883} {"train_loss": -24.770505905151367, "global_step": 239328, "epoch": 2883} {"train_loss": -25.060728073120117, "global_step": 239329, "epoch": 2883} {"train_loss": -24.560998916625977, "global_step": 239330, "epoch": 2883} {"train_loss": -24.546186447143555, "global_step": 239331, "epoch": 2883} {"train_loss": -24.30124282836914, "global_step": 239332, "epoch": 2883} {"train_loss": -25.167932510375977, "global_step": 239333, "epoch": 2883} {"train_loss": -24.921621322631836, "global_step": 239334, "epoch": 2883} {"train_loss": -24.81781578063965, "global_step": 239335, "epoch": 2883} {"train_loss": -24.425329208374023, "global_step": 239336, "epoch": 2883} {"train_loss": -25.031728744506836, "global_step": 239337, "epoch": 2883} {"train_loss": -24.281888961791992, "global_step": 239338, "epoch": 2883} {"train_loss": -24.73287582397461, "global_step": 239339, "epoch": 2883} {"train_loss": -24.585529327392578, "global_step": 239340, "epoch": 2883} {"train_loss": -24.547565460205078, "global_step": 239341, "epoch": 2883} {"train_loss": -24.53875732421875, "global_step": 239342, "epoch": 2883} {"train_loss": -24.994190216064453, "global_step": 239343, "epoch": 2883} {"train_loss": -24.763248443603516, "global_step": 239344, "epoch": 2883} {"train_loss": -24.763397216796875, "global_step": 239345, "epoch": 2883} {"train_loss": -24.39157485961914, "global_step": 239346, "epoch": 2883} {"train_loss": -24.719100952148438, "global_step": 239347, "epoch": 2883} {"train_loss": -24.81870460510254, "global_step": 239348, "epoch": 2883} {"train_loss": -24.793210983276367, "global_step": 239349, "epoch": 2883} {"train_loss": -25.016857147216797, "global_step": 239350, "epoch": 2883} {"train_loss": -25.072343826293945, "global_step": 239351, "epoch": 2883} {"train_loss": -24.727256774902344, "global_step": 239352, "epoch": 2883} {"train_loss": -24.535972595214844, "global_step": 239353, "epoch": 2883} {"train_loss": -25.03091812133789, "global_step": 239354, "epoch": 2883} {"train_loss": -25.18754005432129, "global_step": 239355, "epoch": 2883} {"train_loss": -24.856830596923828, "global_step": 239356, "epoch": 2883} {"train_loss": -24.95236587524414, "global_step": 239357, "epoch": 2883} {"train_loss": -25.17239761352539, "global_step": 239358, "epoch": 2883} {"train_loss": -24.988182067871094, "global_step": 239359, "epoch": 2883} {"train_loss": -25.187620162963867, "global_step": 239360, "epoch": 2883} {"train_loss": -25.300809860229492, "global_step": 239361, "epoch": 2883} {"train_loss": -25.14515495300293, "global_step": 239362, "epoch": 2883} {"train_loss": -25.240346908569336, "global_step": 239363, "epoch": 2883} {"train_loss": -25.237789154052734, "global_step": 239364, "epoch": 2883} {"train_loss": -24.55000877380371, "global_step": 239365, "epoch": 2883} {"train_loss": -25.161375045776367, "global_step": 239366, "epoch": 2883} {"train_loss": -24.78925132751465, "global_step": 239367, "epoch": 2883} {"train_loss": -24.873781204223633, "global_step": 239368, "epoch": 2883} {"train_loss": -25.113880157470703, "global_step": 239369, "epoch": 2883} {"train_loss": -25.139142990112305, "global_step": 239370, "epoch": 2883} {"train_loss": -24.855892135436278, "global_step": 239371, "epoch": 2883, "val_loss": 6784303.0} {"train_loss": -24.660001754760742, "global_step": 239372, "epoch": 2884} {"train_loss": -23.63181495666504, "global_step": 239373, "epoch": 2884} {"train_loss": -23.367795944213867, "global_step": 239374, "epoch": 2884} {"train_loss": -23.50624656677246, "global_step": 239375, "epoch": 2884} {"train_loss": -23.919925689697266, "global_step": 239376, "epoch": 2884} {"train_loss": -24.536331176757812, "global_step": 239377, "epoch": 2884} {"train_loss": -24.3212947845459, "global_step": 239378, "epoch": 2884} {"train_loss": -24.603275299072266, "global_step": 239379, "epoch": 2884} {"train_loss": -24.660564422607422, "global_step": 239380, "epoch": 2884} {"train_loss": -24.497268676757812, "global_step": 239381, "epoch": 2884} {"train_loss": -24.504941940307617, "global_step": 239382, "epoch": 2884} {"train_loss": -24.66297721862793, "global_step": 239383, "epoch": 2884} {"train_loss": -24.400405883789062, "global_step": 239384, "epoch": 2884} {"train_loss": -24.559919357299805, "global_step": 239385, "epoch": 2884} {"train_loss": -24.233402252197266, "global_step": 239386, "epoch": 2884} {"train_loss": -24.56365203857422, "global_step": 239387, "epoch": 2884} {"train_loss": -24.2998046875, "global_step": 239388, "epoch": 2884} {"train_loss": -24.63414764404297, "global_step": 239389, "epoch": 2884} {"train_loss": -24.43804931640625, "global_step": 239390, "epoch": 2884} {"train_loss": -25.176183700561523, "global_step": 239391, "epoch": 2884} {"train_loss": -24.3781681060791, "global_step": 239392, "epoch": 2884} {"train_loss": -24.614593505859375, "global_step": 239393, "epoch": 2884} {"train_loss": -24.691787719726562, "global_step": 239394, "epoch": 2884} {"train_loss": -24.781232833862305, "global_step": 239395, "epoch": 2884} {"train_loss": -24.824081420898438, "global_step": 239396, "epoch": 2884} {"train_loss": -24.733808517456055, "global_step": 239397, "epoch": 2884} {"train_loss": -24.89510726928711, "global_step": 239398, "epoch": 2884} {"train_loss": -24.58636474609375, "global_step": 239399, "epoch": 2884} {"train_loss": -24.68452262878418, "global_step": 239400, "epoch": 2884} {"train_loss": -24.7857666015625, "global_step": 239401, "epoch": 2884} {"train_loss": -24.799833297729492, "global_step": 239402, "epoch": 2884} {"train_loss": -24.922428131103516, "global_step": 239403, "epoch": 2884} {"train_loss": -25.291261672973633, "global_step": 239404, "epoch": 2884} {"train_loss": -24.8105525970459, "global_step": 239405, "epoch": 2884} {"train_loss": -24.801959991455078, "global_step": 239406, "epoch": 2884} {"train_loss": -25.010417938232422, "global_step": 239407, "epoch": 2884} {"train_loss": -25.025691986083984, "global_step": 239408, "epoch": 2884} {"train_loss": -24.936325073242188, "global_step": 239409, "epoch": 2884} {"train_loss": -25.061100006103516, "global_step": 239410, "epoch": 2884} {"train_loss": -24.951332092285156, "global_step": 239411, "epoch": 2884} {"train_loss": -25.53824234008789, "global_step": 239412, "epoch": 2884} {"train_loss": -25.43507957458496, "global_step": 239413, "epoch": 2884} {"train_loss": -24.754810333251953, "global_step": 239414, "epoch": 2884} {"train_loss": -24.851232528686523, "global_step": 239415, "epoch": 2884} {"train_loss": -25.007375717163086, "global_step": 239416, "epoch": 2884} {"train_loss": -25.21295738220215, "global_step": 239417, "epoch": 2884} {"train_loss": -25.253873825073242, "global_step": 239418, "epoch": 2884} {"train_loss": -24.938018798828125, "global_step": 239419, "epoch": 2884} {"train_loss": -25.012340545654297, "global_step": 239420, "epoch": 2884} {"train_loss": -24.684497833251953, "global_step": 239421, "epoch": 2884} {"train_loss": -24.412551879882812, "global_step": 239422, "epoch": 2884} {"train_loss": -24.215457916259766, "global_step": 239423, "epoch": 2884} {"train_loss": -24.5783634185791, "global_step": 239424, "epoch": 2884} {"train_loss": -24.66168212890625, "global_step": 239425, "epoch": 2884} {"train_loss": -24.575349807739258, "global_step": 239426, "epoch": 2884} {"train_loss": -24.400005340576172, "global_step": 239427, "epoch": 2884} {"train_loss": -24.075605392456055, "global_step": 239428, "epoch": 2884} {"train_loss": -24.622953414916992, "global_step": 239429, "epoch": 2884} {"train_loss": -24.6718692779541, "global_step": 239430, "epoch": 2884} {"train_loss": -24.899423599243164, "global_step": 239431, "epoch": 2884} {"train_loss": -24.300912857055664, "global_step": 239432, "epoch": 2884} {"train_loss": -24.409475326538086, "global_step": 239433, "epoch": 2884} {"train_loss": -24.498783111572266, "global_step": 239434, "epoch": 2884} {"train_loss": -24.60993766784668, "global_step": 239435, "epoch": 2884} {"train_loss": -24.629697799682617, "global_step": 239436, "epoch": 2884} {"train_loss": -24.737457275390625, "global_step": 239437, "epoch": 2884} {"train_loss": -24.827444076538086, "global_step": 239438, "epoch": 2884} {"train_loss": -24.477008819580078, "global_step": 239439, "epoch": 2884} {"train_loss": -24.8939266204834, "global_step": 239440, "epoch": 2884} {"train_loss": -24.489974975585938, "global_step": 239441, "epoch": 2884} {"train_loss": -24.316408157348633, "global_step": 239442, "epoch": 2884} {"train_loss": -24.4216365814209, "global_step": 239443, "epoch": 2884} {"train_loss": -24.829666137695312, "global_step": 239444, "epoch": 2884} {"train_loss": -24.626218795776367, "global_step": 239445, "epoch": 2884} {"train_loss": -24.593381881713867, "global_step": 239446, "epoch": 2884} {"train_loss": -24.92229652404785, "global_step": 239447, "epoch": 2884} {"train_loss": -25.263748168945312, "global_step": 239448, "epoch": 2884} {"train_loss": -24.662933349609375, "global_step": 239449, "epoch": 2884} {"train_loss": -24.773954391479492, "global_step": 239450, "epoch": 2884} {"train_loss": -24.88787841796875, "global_step": 239451, "epoch": 2884} {"train_loss": -24.85895538330078, "global_step": 239452, "epoch": 2884} {"train_loss": -25.168079376220703, "global_step": 239453, "epoch": 2884} {"train_loss": -24.670018598257776, "global_step": 239454, "epoch": 2884, "val_loss": 6741701.0} {"train_loss": -24.620527267456055, "global_step": 239455, "epoch": 2885} {"train_loss": -24.174875259399414, "global_step": 239456, "epoch": 2885} {"train_loss": -24.174715042114258, "global_step": 239457, "epoch": 2885} {"train_loss": -24.869213104248047, "global_step": 239458, "epoch": 2885} {"train_loss": -24.374441146850586, "global_step": 239459, "epoch": 2885} {"train_loss": -24.3625431060791, "global_step": 239460, "epoch": 2885} {"train_loss": -24.62336540222168, "global_step": 239461, "epoch": 2885} {"train_loss": -24.602407455444336, "global_step": 239462, "epoch": 2885} {"train_loss": -24.538227081298828, "global_step": 239463, "epoch": 2885} {"train_loss": -24.57789421081543, "global_step": 239464, "epoch": 2885} {"train_loss": -24.586706161499023, "global_step": 239465, "epoch": 2885} {"train_loss": -24.48639488220215, "global_step": 239466, "epoch": 2885} {"train_loss": -24.3857479095459, "global_step": 239467, "epoch": 2885} {"train_loss": -24.965234756469727, "global_step": 239468, "epoch": 2885} {"train_loss": -24.429176330566406, "global_step": 239469, "epoch": 2885} {"train_loss": -24.95591163635254, "global_step": 239470, "epoch": 2885} {"train_loss": -24.679046630859375, "global_step": 239471, "epoch": 2885} {"train_loss": -24.4976863861084, "global_step": 239472, "epoch": 2885} {"train_loss": -24.735044479370117, "global_step": 239473, "epoch": 2885} {"train_loss": -24.756032943725586, "global_step": 239474, "epoch": 2885} {"train_loss": -24.41411018371582, "global_step": 239475, "epoch": 2885} {"train_loss": -24.695709228515625, "global_step": 239476, "epoch": 2885} {"train_loss": -24.812992095947266, "global_step": 239477, "epoch": 2885} {"train_loss": -24.796756744384766, "global_step": 239478, "epoch": 2885} {"train_loss": -25.19049072265625, "global_step": 239479, "epoch": 2885} {"train_loss": -25.031335830688477, "global_step": 239480, "epoch": 2885} {"train_loss": -24.711288452148438, "global_step": 239481, "epoch": 2885} {"train_loss": -24.86199951171875, "global_step": 239482, "epoch": 2885} {"train_loss": -24.97857666015625, "global_step": 239483, "epoch": 2885} {"train_loss": -24.825376510620117, "global_step": 239484, "epoch": 2885} {"train_loss": -24.698322296142578, "global_step": 239485, "epoch": 2885} {"train_loss": -24.94404411315918, "global_step": 239486, "epoch": 2885} {"train_loss": -24.75679588317871, "global_step": 239487, "epoch": 2885} {"train_loss": -24.654260635375977, "global_step": 239488, "epoch": 2885} {"train_loss": -24.699298858642578, "global_step": 239489, "epoch": 2885} {"train_loss": -25.116413116455078, "global_step": 239490, "epoch": 2885} {"train_loss": -24.688993453979492, "global_step": 239491, "epoch": 2885} {"train_loss": -24.831623077392578, "global_step": 239492, "epoch": 2885} {"train_loss": -25.049606323242188, "global_step": 239493, "epoch": 2885} {"train_loss": -25.035526275634766, "global_step": 239494, "epoch": 2885} {"train_loss": -24.73956871032715, "global_step": 239495, "epoch": 2885} {"train_loss": -25.05257225036621, "global_step": 239496, "epoch": 2885} {"train_loss": -25.150964736938477, "global_step": 239497, "epoch": 2885} {"train_loss": -24.962255477905273, "global_step": 239498, "epoch": 2885} {"train_loss": -24.94160270690918, "global_step": 239499, "epoch": 2885} {"train_loss": -25.284534454345703, "global_step": 239500, "epoch": 2885} {"train_loss": -25.377939224243164, "global_step": 239501, "epoch": 2885} {"train_loss": -25.179746627807617, "global_step": 239502, "epoch": 2885} {"train_loss": -25.092695236206055, "global_step": 239503, "epoch": 2885} {"train_loss": -25.421558380126953, "global_step": 239504, "epoch": 2885} {"train_loss": -24.975364685058594, "global_step": 239505, "epoch": 2885} {"train_loss": -24.98977279663086, "global_step": 239506, "epoch": 2885} {"train_loss": -24.999225616455078, "global_step": 239507, "epoch": 2885} {"train_loss": -25.018627166748047, "global_step": 239508, "epoch": 2885} {"train_loss": -24.95525360107422, "global_step": 239509, "epoch": 2885} {"train_loss": -25.12753677368164, "global_step": 239510, "epoch": 2885} {"train_loss": -25.01595115661621, "global_step": 239511, "epoch": 2885} {"train_loss": -24.67868423461914, "global_step": 239512, "epoch": 2885} {"train_loss": -24.896894454956055, "global_step": 239513, "epoch": 2885} {"train_loss": -25.221540451049805, "global_step": 239514, "epoch": 2885} {"train_loss": -25.223630905151367, "global_step": 239515, "epoch": 2885} {"train_loss": -24.81122398376465, "global_step": 239516, "epoch": 2885} {"train_loss": -24.89611053466797, "global_step": 239517, "epoch": 2885} {"train_loss": -25.023822784423828, "global_step": 239518, "epoch": 2885} {"train_loss": -25.0164794921875, "global_step": 239519, "epoch": 2885} {"train_loss": -24.771747589111328, "global_step": 239520, "epoch": 2885} {"train_loss": -25.37253189086914, "global_step": 239521, "epoch": 2885} {"train_loss": -25.173559188842773, "global_step": 239522, "epoch": 2885} {"train_loss": -25.0938777923584, "global_step": 239523, "epoch": 2885} {"train_loss": -24.898578643798828, "global_step": 239524, "epoch": 2885} {"train_loss": -25.011056900024414, "global_step": 239525, "epoch": 2885} {"train_loss": -24.8929386138916, "global_step": 239526, "epoch": 2885} {"train_loss": -25.109750747680664, "global_step": 239527, "epoch": 2885} {"train_loss": -24.946706771850586, "global_step": 239528, "epoch": 2885} {"train_loss": -24.816265106201172, "global_step": 239529, "epoch": 2885} {"train_loss": -24.819936752319336, "global_step": 239530, "epoch": 2885} {"train_loss": -24.877090454101562, "global_step": 239531, "epoch": 2885} {"train_loss": -24.6803035736084, "global_step": 239532, "epoch": 2885} {"train_loss": -25.431299209594727, "global_step": 239533, "epoch": 2885} {"train_loss": -24.7285213470459, "global_step": 239534, "epoch": 2885} {"train_loss": -25.30531120300293, "global_step": 239535, "epoch": 2885} {"train_loss": -25.237836837768555, "global_step": 239536, "epoch": 2885} {"train_loss": -24.86353885696595, "global_step": 239537, "epoch": 2885, "val_loss": 6679110.0} {"train_loss": -23.574054718017578, "global_step": 239538, "epoch": 2886} {"train_loss": -23.3851261138916, "global_step": 239539, "epoch": 2886} {"train_loss": -24.181751251220703, "global_step": 239540, "epoch": 2886} {"train_loss": -24.22812843322754, "global_step": 239541, "epoch": 2886} {"train_loss": -24.301977157592773, "global_step": 239542, "epoch": 2886} {"train_loss": -24.584089279174805, "global_step": 239543, "epoch": 2886} {"train_loss": -24.08173942565918, "global_step": 239544, "epoch": 2886} {"train_loss": -24.16072654724121, "global_step": 239545, "epoch": 2886} {"train_loss": -24.264331817626953, "global_step": 239546, "epoch": 2886} {"train_loss": -23.9953670501709, "global_step": 239547, "epoch": 2886} {"train_loss": -24.337369918823242, "global_step": 239548, "epoch": 2886} {"train_loss": -24.538818359375, "global_step": 239549, "epoch": 2886} {"train_loss": -24.387231826782227, "global_step": 239550, "epoch": 2886} {"train_loss": -24.89906120300293, "global_step": 239551, "epoch": 2886} {"train_loss": -24.19541358947754, "global_step": 239552, "epoch": 2886} {"train_loss": -24.426347732543945, "global_step": 239553, "epoch": 2886} {"train_loss": -24.024463653564453, "global_step": 239554, "epoch": 2886} {"train_loss": -24.509740829467773, "global_step": 239555, "epoch": 2886} {"train_loss": -24.62734031677246, "global_step": 239556, "epoch": 2886} {"train_loss": -24.863433837890625, "global_step": 239557, "epoch": 2886} {"train_loss": -24.239248275756836, "global_step": 239558, "epoch": 2886} {"train_loss": -24.228269577026367, "global_step": 239559, "epoch": 2886} {"train_loss": -24.26161003112793, "global_step": 239560, "epoch": 2886} {"train_loss": -24.842985153198242, "global_step": 239561, "epoch": 2886} {"train_loss": -24.615930557250977, "global_step": 239562, "epoch": 2886} {"train_loss": -24.846214294433594, "global_step": 239563, "epoch": 2886} {"train_loss": -24.739011764526367, "global_step": 239564, "epoch": 2886} {"train_loss": -24.658403396606445, "global_step": 239565, "epoch": 2886} {"train_loss": -25.007797241210938, "global_step": 239566, "epoch": 2886} {"train_loss": -24.397098541259766, "global_step": 239567, "epoch": 2886} {"train_loss": -25.003503799438477, "global_step": 239568, "epoch": 2886} {"train_loss": -24.561506271362305, "global_step": 239569, "epoch": 2886} {"train_loss": -25.067514419555664, "global_step": 239570, "epoch": 2886} {"train_loss": -24.736480712890625, "global_step": 239571, "epoch": 2886} {"train_loss": -24.868906021118164, "global_step": 239572, "epoch": 2886} {"train_loss": -24.621519088745117, "global_step": 239573, "epoch": 2886} {"train_loss": -24.85966682434082, "global_step": 239574, "epoch": 2886} {"train_loss": -24.56574058532715, "global_step": 239575, "epoch": 2886} {"train_loss": -24.897851943969727, "global_step": 239576, "epoch": 2886} {"train_loss": -24.69623374938965, "global_step": 239577, "epoch": 2886} {"train_loss": -24.793216705322266, "global_step": 239578, "epoch": 2886} {"train_loss": -24.833160400390625, "global_step": 239579, "epoch": 2886} {"train_loss": -24.912559509277344, "global_step": 239580, "epoch": 2886} {"train_loss": -24.93941307067871, "global_step": 239581, "epoch": 2886} {"train_loss": -25.21351432800293, "global_step": 239582, "epoch": 2886} {"train_loss": -24.80360221862793, "global_step": 239583, "epoch": 2886} {"train_loss": -24.857831954956055, "global_step": 239584, "epoch": 2886} {"train_loss": -24.963245391845703, "global_step": 239585, "epoch": 2886} {"train_loss": -24.927597045898438, "global_step": 239586, "epoch": 2886} {"train_loss": -24.769445419311523, "global_step": 239587, "epoch": 2886} {"train_loss": -24.968881607055664, "global_step": 239588, "epoch": 2886} {"train_loss": -25.164043426513672, "global_step": 239589, "epoch": 2886} {"train_loss": -25.295360565185547, "global_step": 239590, "epoch": 2886} {"train_loss": -24.954626083374023, "global_step": 239591, "epoch": 2886} {"train_loss": -24.84267234802246, "global_step": 239592, "epoch": 2886} {"train_loss": -24.724308013916016, "global_step": 239593, "epoch": 2886} {"train_loss": -24.808469772338867, "global_step": 239594, "epoch": 2886} {"train_loss": -25.20638084411621, "global_step": 239595, "epoch": 2886} {"train_loss": -24.599414825439453, "global_step": 239596, "epoch": 2886} {"train_loss": -24.987590789794922, "global_step": 239597, "epoch": 2886} {"train_loss": -25.358163833618164, "global_step": 239598, "epoch": 2886} {"train_loss": -24.914661407470703, "global_step": 239599, "epoch": 2886} {"train_loss": -24.706092834472656, "global_step": 239600, "epoch": 2886} {"train_loss": -25.071414947509766, "global_step": 239601, "epoch": 2886} {"train_loss": -25.11838150024414, "global_step": 239602, "epoch": 2886} {"train_loss": -25.107269287109375, "global_step": 239603, "epoch": 2886} {"train_loss": -25.223541259765625, "global_step": 239604, "epoch": 2886} {"train_loss": -24.924726486206055, "global_step": 239605, "epoch": 2886} {"train_loss": -25.066417694091797, "global_step": 239606, "epoch": 2886} {"train_loss": -24.9251651763916, "global_step": 239607, "epoch": 2886} {"train_loss": -25.02126121520996, "global_step": 239608, "epoch": 2886} {"train_loss": -25.171276092529297, "global_step": 239609, "epoch": 2886} {"train_loss": -25.095937728881836, "global_step": 239610, "epoch": 2886} {"train_loss": -24.867298126220703, "global_step": 239611, "epoch": 2886} {"train_loss": -24.99800682067871, "global_step": 239612, "epoch": 2886} {"train_loss": -25.09580421447754, "global_step": 239613, "epoch": 2886} {"train_loss": -24.73775291442871, "global_step": 239614, "epoch": 2886} {"train_loss": -24.99134063720703, "global_step": 239615, "epoch": 2886} {"train_loss": -24.73517417907715, "global_step": 239616, "epoch": 2886} {"train_loss": -24.741138458251953, "global_step": 239617, "epoch": 2886} {"train_loss": -25.15315818786621, "global_step": 239618, "epoch": 2886} {"train_loss": -25.090534210205078, "global_step": 239619, "epoch": 2886} {"train_loss": -24.749945789934642, "global_step": 239620, "epoch": 2886, "val_loss": 6885104.5} {"train_loss": -23.658159255981445, "global_step": 239621, "epoch": 2887} {"train_loss": -24.554859161376953, "global_step": 239622, "epoch": 2887} {"train_loss": -24.257123947143555, "global_step": 239623, "epoch": 2887} {"train_loss": -24.112812042236328, "global_step": 239624, "epoch": 2887} {"train_loss": -24.593029022216797, "global_step": 239625, "epoch": 2887} {"train_loss": -23.956226348876953, "global_step": 239626, "epoch": 2887} {"train_loss": -24.304187774658203, "global_step": 239627, "epoch": 2887} {"train_loss": -24.259986877441406, "global_step": 239628, "epoch": 2887} {"train_loss": -23.886327743530273, "global_step": 239629, "epoch": 2887} {"train_loss": -24.537799835205078, "global_step": 239630, "epoch": 2887} {"train_loss": -24.286361694335938, "global_step": 239631, "epoch": 2887} {"train_loss": -24.25564956665039, "global_step": 239632, "epoch": 2887} {"train_loss": -24.399211883544922, "global_step": 239633, "epoch": 2887} {"train_loss": -24.515302658081055, "global_step": 239634, "epoch": 2887} {"train_loss": -24.44013786315918, "global_step": 239635, "epoch": 2887} {"train_loss": -24.633939743041992, "global_step": 239636, "epoch": 2887} {"train_loss": -24.57522964477539, "global_step": 239637, "epoch": 2887} {"train_loss": -24.61403465270996, "global_step": 239638, "epoch": 2887} {"train_loss": -24.543792724609375, "global_step": 239639, "epoch": 2887} {"train_loss": -24.2559871673584, "global_step": 239640, "epoch": 2887} {"train_loss": -24.5051326751709, "global_step": 239641, "epoch": 2887} {"train_loss": -24.774993896484375, "global_step": 239642, "epoch": 2887} {"train_loss": -24.73748207092285, "global_step": 239643, "epoch": 2887} {"train_loss": -24.696308135986328, "global_step": 239644, "epoch": 2887} {"train_loss": -24.933378219604492, "global_step": 239645, "epoch": 2887} {"train_loss": -24.590436935424805, "global_step": 239646, "epoch": 2887} {"train_loss": -24.533506393432617, "global_step": 239647, "epoch": 2887} {"train_loss": -25.118898391723633, "global_step": 239648, "epoch": 2887} {"train_loss": -25.027374267578125, "global_step": 239649, "epoch": 2887} {"train_loss": -24.87283706665039, "global_step": 239650, "epoch": 2887} {"train_loss": -24.99773597717285, "global_step": 239651, "epoch": 2887} {"train_loss": -24.710901260375977, "global_step": 239652, "epoch": 2887} {"train_loss": -24.932947158813477, "global_step": 239653, "epoch": 2887} {"train_loss": -24.805185317993164, "global_step": 239654, "epoch": 2887} {"train_loss": -25.054990768432617, "global_step": 239655, "epoch": 2887} {"train_loss": -24.78476905822754, "global_step": 239656, "epoch": 2887} {"train_loss": -25.22639274597168, "global_step": 239657, "epoch": 2887} {"train_loss": -24.84525489807129, "global_step": 239658, "epoch": 2887} {"train_loss": -24.898584365844727, "global_step": 239659, "epoch": 2887} {"train_loss": -24.890613555908203, "global_step": 239660, "epoch": 2887} {"train_loss": -25.071765899658203, "global_step": 239661, "epoch": 2887} {"train_loss": -24.799421310424805, "global_step": 239662, "epoch": 2887} {"train_loss": -24.815425872802734, "global_step": 239663, "epoch": 2887} {"train_loss": -25.304946899414062, "global_step": 239664, "epoch": 2887} {"train_loss": -24.463754653930664, "global_step": 239665, "epoch": 2887} {"train_loss": -24.642820358276367, "global_step": 239666, "epoch": 2887} {"train_loss": -25.216880798339844, "global_step": 239667, "epoch": 2887} {"train_loss": -25.05649757385254, "global_step": 239668, "epoch": 2887} {"train_loss": -24.74880027770996, "global_step": 239669, "epoch": 2887} {"train_loss": -24.77260398864746, "global_step": 239670, "epoch": 2887} {"train_loss": -25.154356002807617, "global_step": 239671, "epoch": 2887} {"train_loss": -24.8568172454834, "global_step": 239672, "epoch": 2887} {"train_loss": -24.708629608154297, "global_step": 239673, "epoch": 2887} {"train_loss": -24.973657608032227, "global_step": 239674, "epoch": 2887} {"train_loss": -24.849462509155273, "global_step": 239675, "epoch": 2887} {"train_loss": -25.22041893005371, "global_step": 239676, "epoch": 2887} {"train_loss": -24.813756942749023, "global_step": 239677, "epoch": 2887} {"train_loss": -24.806427001953125, "global_step": 239678, "epoch": 2887} {"train_loss": -25.040725708007812, "global_step": 239679, "epoch": 2887} {"train_loss": -25.16293716430664, "global_step": 239680, "epoch": 2887} {"train_loss": -24.804630279541016, "global_step": 239681, "epoch": 2887} {"train_loss": -24.843006134033203, "global_step": 239682, "epoch": 2887} {"train_loss": -24.982152938842773, "global_step": 239683, "epoch": 2887} {"train_loss": -24.762256622314453, "global_step": 239684, "epoch": 2887} {"train_loss": -24.729450225830078, "global_step": 239685, "epoch": 2887} {"train_loss": -25.18447494506836, "global_step": 239686, "epoch": 2887} {"train_loss": -24.6740779876709, "global_step": 239687, "epoch": 2887} {"train_loss": -24.409177780151367, "global_step": 239688, "epoch": 2887} {"train_loss": -24.6113338470459, "global_step": 239689, "epoch": 2887} {"train_loss": -24.772974014282227, "global_step": 239690, "epoch": 2887} {"train_loss": -24.68039894104004, "global_step": 239691, "epoch": 2887} {"train_loss": -24.817903518676758, "global_step": 239692, "epoch": 2887} {"train_loss": -24.865524291992188, "global_step": 239693, "epoch": 2887} {"train_loss": -25.054458618164062, "global_step": 239694, "epoch": 2887} {"train_loss": -24.704431533813477, "global_step": 239695, "epoch": 2887} {"train_loss": -25.169836044311523, "global_step": 239696, "epoch": 2887} {"train_loss": -24.83271598815918, "global_step": 239697, "epoch": 2887} {"train_loss": -25.10750389099121, "global_step": 239698, "epoch": 2887} {"train_loss": -24.93243980407715, "global_step": 239699, "epoch": 2887} {"train_loss": -24.71240234375, "global_step": 239700, "epoch": 2887} {"train_loss": -24.856101989746094, "global_step": 239701, "epoch": 2887} {"train_loss": -24.802093505859375, "global_step": 239702, "epoch": 2887} {"train_loss": -24.71428165665592, "global_step": 239703, "epoch": 2887, "val_loss": 6824865.5} {"train_loss": -24.441282272338867, "global_step": 239704, "epoch": 2888} {"train_loss": -24.31625747680664, "global_step": 239705, "epoch": 2888} {"train_loss": -24.424030303955078, "global_step": 239706, "epoch": 2888} {"train_loss": -24.438413619995117, "global_step": 239707, "epoch": 2888} {"train_loss": -24.37332534790039, "global_step": 239708, "epoch": 2888} {"train_loss": -24.83650779724121, "global_step": 239709, "epoch": 2888} {"train_loss": -24.406612396240234, "global_step": 239710, "epoch": 2888} {"train_loss": -24.510997772216797, "global_step": 239711, "epoch": 2888} {"train_loss": -24.549484252929688, "global_step": 239712, "epoch": 2888} {"train_loss": -24.252216339111328, "global_step": 239713, "epoch": 2888} {"train_loss": -24.575565338134766, "global_step": 239714, "epoch": 2888} {"train_loss": -24.837427139282227, "global_step": 239715, "epoch": 2888} {"train_loss": -24.625995635986328, "global_step": 239716, "epoch": 2888} {"train_loss": -24.813522338867188, "global_step": 239717, "epoch": 2888} {"train_loss": -24.41176414489746, "global_step": 239718, "epoch": 2888} {"train_loss": -24.64143180847168, "global_step": 239719, "epoch": 2888} {"train_loss": -24.477815628051758, "global_step": 239720, "epoch": 2888} {"train_loss": -24.471281051635742, "global_step": 239721, "epoch": 2888} {"train_loss": -24.839670181274414, "global_step": 239722, "epoch": 2888} {"train_loss": -24.866531372070312, "global_step": 239723, "epoch": 2888} {"train_loss": -24.876617431640625, "global_step": 239724, "epoch": 2888} {"train_loss": -24.851240158081055, "global_step": 239725, "epoch": 2888} {"train_loss": -24.902292251586914, "global_step": 239726, "epoch": 2888} {"train_loss": -24.857402801513672, "global_step": 239727, "epoch": 2888} {"train_loss": -25.017919540405273, "global_step": 239728, "epoch": 2888} {"train_loss": -24.55791664123535, "global_step": 239729, "epoch": 2888} {"train_loss": -24.880033493041992, "global_step": 239730, "epoch": 2888} {"train_loss": -25.080026626586914, "global_step": 239731, "epoch": 2888} {"train_loss": -24.94334602355957, "global_step": 239732, "epoch": 2888} {"train_loss": -24.905752182006836, "global_step": 239733, "epoch": 2888} {"train_loss": -24.825780868530273, "global_step": 239734, "epoch": 2888} {"train_loss": -24.783639907836914, "global_step": 239735, "epoch": 2888} {"train_loss": -25.01402473449707, "global_step": 239736, "epoch": 2888} {"train_loss": -25.509923934936523, "global_step": 239737, "epoch": 2888} {"train_loss": -24.592857360839844, "global_step": 239738, "epoch": 2888} {"train_loss": -24.981582641601562, "global_step": 239739, "epoch": 2888} {"train_loss": -24.545467376708984, "global_step": 239740, "epoch": 2888} {"train_loss": -25.15546989440918, "global_step": 239741, "epoch": 2888} {"train_loss": -24.468957901000977, "global_step": 239742, "epoch": 2888} {"train_loss": -24.8775691986084, "global_step": 239743, "epoch": 2888} {"train_loss": -24.713979721069336, "global_step": 239744, "epoch": 2888} {"train_loss": -25.24323844909668, "global_step": 239745, "epoch": 2888} {"train_loss": -24.7414493560791, "global_step": 239746, "epoch": 2888} {"train_loss": -24.924875259399414, "global_step": 239747, "epoch": 2888} {"train_loss": -25.072484970092773, "global_step": 239748, "epoch": 2888} {"train_loss": -25.064451217651367, "global_step": 239749, "epoch": 2888} {"train_loss": -25.042343139648438, "global_step": 239750, "epoch": 2888} {"train_loss": -24.886398315429688, "global_step": 239751, "epoch": 2888} {"train_loss": -24.753747940063477, "global_step": 239752, "epoch": 2888} {"train_loss": -25.18856430053711, "global_step": 239753, "epoch": 2888} {"train_loss": -25.171066284179688, "global_step": 239754, "epoch": 2888} {"train_loss": -24.953474044799805, "global_step": 239755, "epoch": 2888} {"train_loss": -24.968595504760742, "global_step": 239756, "epoch": 2888} {"train_loss": -24.72833824157715, "global_step": 239757, "epoch": 2888} {"train_loss": -24.51827621459961, "global_step": 239758, "epoch": 2888} {"train_loss": -24.55099868774414, "global_step": 239759, "epoch": 2888} {"train_loss": -24.37156105041504, "global_step": 239760, "epoch": 2888} {"train_loss": -25.174184799194336, "global_step": 239761, "epoch": 2888} {"train_loss": -24.665191650390625, "global_step": 239762, "epoch": 2888} {"train_loss": -24.893310546875, "global_step": 239763, "epoch": 2888} {"train_loss": -24.56627082824707, "global_step": 239764, "epoch": 2888} {"train_loss": -24.747472763061523, "global_step": 239765, "epoch": 2888} {"train_loss": -25.073719024658203, "global_step": 239766, "epoch": 2888} {"train_loss": -24.884408950805664, "global_step": 239767, "epoch": 2888} {"train_loss": -24.768836975097656, "global_step": 239768, "epoch": 2888} {"train_loss": -25.130460739135742, "global_step": 239769, "epoch": 2888} {"train_loss": -24.98687171936035, "global_step": 239770, "epoch": 2888} {"train_loss": -24.798965454101562, "global_step": 239771, "epoch": 2888} {"train_loss": -24.709766387939453, "global_step": 239772, "epoch": 2888} {"train_loss": -24.577043533325195, "global_step": 239773, "epoch": 2888} {"train_loss": -25.280492782592773, "global_step": 239774, "epoch": 2888} {"train_loss": -24.957639694213867, "global_step": 239775, "epoch": 2888} {"train_loss": -24.87725830078125, "global_step": 239776, "epoch": 2888} {"train_loss": -25.125974655151367, "global_step": 239777, "epoch": 2888} {"train_loss": -25.16725730895996, "global_step": 239778, "epoch": 2888} {"train_loss": -24.94498062133789, "global_step": 239779, "epoch": 2888} {"train_loss": -24.740053176879883, "global_step": 239780, "epoch": 2888} {"train_loss": -25.114768981933594, "global_step": 239781, "epoch": 2888} {"train_loss": -24.794879913330078, "global_step": 239782, "epoch": 2888} {"train_loss": -24.954511642456055, "global_step": 239783, "epoch": 2888} {"train_loss": -25.365724563598633, "global_step": 239784, "epoch": 2888} {"train_loss": -24.640899658203125, "global_step": 239785, "epoch": 2888} {"train_loss": -24.81371180982475, "global_step": 239786, "epoch": 2888, "val_loss": 6915866.0} {"train_loss": -23.671113967895508, "global_step": 239787, "epoch": 2889} {"train_loss": -24.468936920166016, "global_step": 239788, "epoch": 2889} {"train_loss": -23.904010772705078, "global_step": 239789, "epoch": 2889} {"train_loss": -23.529056549072266, "global_step": 239790, "epoch": 2889} {"train_loss": -24.180639266967773, "global_step": 239791, "epoch": 2889} {"train_loss": -24.33935546875, "global_step": 239792, "epoch": 2889} {"train_loss": -24.221139907836914, "global_step": 239793, "epoch": 2889} {"train_loss": -24.41983985900879, "global_step": 239794, "epoch": 2889} {"train_loss": -24.40895652770996, "global_step": 239795, "epoch": 2889} {"train_loss": -24.18893814086914, "global_step": 239796, "epoch": 2889} {"train_loss": -24.126379013061523, "global_step": 239797, "epoch": 2889} {"train_loss": -24.3426513671875, "global_step": 239798, "epoch": 2889} {"train_loss": -24.142637252807617, "global_step": 239799, "epoch": 2889} {"train_loss": -24.04400062561035, "global_step": 239800, "epoch": 2889} {"train_loss": -24.58680534362793, "global_step": 239801, "epoch": 2889} {"train_loss": -24.56485366821289, "global_step": 239802, "epoch": 2889} {"train_loss": -24.381900787353516, "global_step": 239803, "epoch": 2889} {"train_loss": -24.793155670166016, "global_step": 239804, "epoch": 2889} {"train_loss": -24.505197525024414, "global_step": 239805, "epoch": 2889} {"train_loss": -24.89609718322754, "global_step": 239806, "epoch": 2889} {"train_loss": -24.459949493408203, "global_step": 239807, "epoch": 2889} {"train_loss": -24.69178581237793, "global_step": 239808, "epoch": 2889} {"train_loss": -24.799955368041992, "global_step": 239809, "epoch": 2889} {"train_loss": -24.826351165771484, "global_step": 239810, "epoch": 2889} {"train_loss": -25.02708625793457, "global_step": 239811, "epoch": 2889} {"train_loss": -25.11032485961914, "global_step": 239812, "epoch": 2889} {"train_loss": -24.743783950805664, "global_step": 239813, "epoch": 2889} {"train_loss": -24.981632232666016, "global_step": 239814, "epoch": 2889} {"train_loss": -24.799230575561523, "global_step": 239815, "epoch": 2889} {"train_loss": -24.849454879760742, "global_step": 239816, "epoch": 2889} {"train_loss": -24.82962989807129, "global_step": 239817, "epoch": 2889} {"train_loss": -24.61656379699707, "global_step": 239818, "epoch": 2889} {"train_loss": -24.996646881103516, "global_step": 239819, "epoch": 2889} {"train_loss": -24.823749542236328, "global_step": 239820, "epoch": 2889} {"train_loss": -24.772018432617188, "global_step": 239821, "epoch": 2889} {"train_loss": -25.1337890625, "global_step": 239822, "epoch": 2889} {"train_loss": -24.856800079345703, "global_step": 239823, "epoch": 2889} {"train_loss": -24.787649154663086, "global_step": 239824, "epoch": 2889} {"train_loss": -25.074132919311523, "global_step": 239825, "epoch": 2889} {"train_loss": -24.626760482788086, "global_step": 239826, "epoch": 2889} {"train_loss": -24.805444717407227, "global_step": 239827, "epoch": 2889} {"train_loss": -24.778453826904297, "global_step": 239828, "epoch": 2889} {"train_loss": -25.0621280670166, "global_step": 239829, "epoch": 2889} {"train_loss": -24.661046981811523, "global_step": 239830, "epoch": 2889} {"train_loss": -24.884098052978516, "global_step": 239831, "epoch": 2889} {"train_loss": -24.85688591003418, "global_step": 239832, "epoch": 2889} {"train_loss": -25.060850143432617, "global_step": 239833, "epoch": 2889} {"train_loss": -25.438085556030273, "global_step": 239834, "epoch": 2889} {"train_loss": -24.96015167236328, "global_step": 239835, "epoch": 2889} {"train_loss": -24.750585556030273, "global_step": 239836, "epoch": 2889} {"train_loss": -24.831619262695312, "global_step": 239837, "epoch": 2889} {"train_loss": -25.045040130615234, "global_step": 239838, "epoch": 2889} {"train_loss": -24.740903854370117, "global_step": 239839, "epoch": 2889} {"train_loss": -24.989988327026367, "global_step": 239840, "epoch": 2889} {"train_loss": -25.033353805541992, "global_step": 239841, "epoch": 2889} {"train_loss": -25.218677520751953, "global_step": 239842, "epoch": 2889} {"train_loss": -24.77920913696289, "global_step": 239843, "epoch": 2889} {"train_loss": -24.991270065307617, "global_step": 239844, "epoch": 2889} {"train_loss": -24.881624221801758, "global_step": 239845, "epoch": 2889} {"train_loss": -24.7310791015625, "global_step": 239846, "epoch": 2889} {"train_loss": -24.877363204956055, "global_step": 239847, "epoch": 2889} {"train_loss": -25.051334381103516, "global_step": 239848, "epoch": 2889} {"train_loss": -24.832237243652344, "global_step": 239849, "epoch": 2889} {"train_loss": -24.976890563964844, "global_step": 239850, "epoch": 2889} {"train_loss": -24.624359130859375, "global_step": 239851, "epoch": 2889} {"train_loss": -24.707304000854492, "global_step": 239852, "epoch": 2889} {"train_loss": -24.40142822265625, "global_step": 239853, "epoch": 2889} {"train_loss": -24.927534103393555, "global_step": 239854, "epoch": 2889} {"train_loss": -24.642139434814453, "global_step": 239855, "epoch": 2889} {"train_loss": -25.074604034423828, "global_step": 239856, "epoch": 2889} {"train_loss": -24.987110137939453, "global_step": 239857, "epoch": 2889} {"train_loss": -24.389097213745117, "global_step": 239858, "epoch": 2889} {"train_loss": -24.975475311279297, "global_step": 239859, "epoch": 2889} {"train_loss": -25.080772399902344, "global_step": 239860, "epoch": 2889} {"train_loss": -24.879369735717773, "global_step": 239861, "epoch": 2889} {"train_loss": -24.6943416595459, "global_step": 239862, "epoch": 2889} {"train_loss": -24.772825241088867, "global_step": 239863, "epoch": 2889} {"train_loss": -25.092361450195312, "global_step": 239864, "epoch": 2889} {"train_loss": -24.980016708374023, "global_step": 239865, "epoch": 2889} {"train_loss": -24.955854415893555, "global_step": 239866, "epoch": 2889} {"train_loss": -24.985462188720703, "global_step": 239867, "epoch": 2889} {"train_loss": -24.946853637695312, "global_step": 239868, "epoch": 2889} {"train_loss": -24.722263244261224, "global_step": 239869, "epoch": 2889, "val_loss": 6824291.0} {"train_loss": -24.486501693725586, "global_step": 239870, "epoch": 2890} {"train_loss": -24.2618408203125, "global_step": 239871, "epoch": 2890} {"train_loss": -24.358449935913086, "global_step": 239872, "epoch": 2890} {"train_loss": -24.450237274169922, "global_step": 239873, "epoch": 2890} {"train_loss": -24.329771041870117, "global_step": 239874, "epoch": 2890} {"train_loss": -24.58487319946289, "global_step": 239875, "epoch": 2890} {"train_loss": -24.638410568237305, "global_step": 239876, "epoch": 2890} {"train_loss": -24.3505859375, "global_step": 239877, "epoch": 2890} {"train_loss": -24.807804107666016, "global_step": 239878, "epoch": 2890} {"train_loss": -24.4962100982666, "global_step": 239879, "epoch": 2890} {"train_loss": -24.76656150817871, "global_step": 239880, "epoch": 2890} {"train_loss": -24.44203758239746, "global_step": 239881, "epoch": 2890} {"train_loss": -24.766315460205078, "global_step": 239882, "epoch": 2890} {"train_loss": -24.598623275756836, "global_step": 239883, "epoch": 2890} {"train_loss": -24.40949058532715, "global_step": 239884, "epoch": 2890} {"train_loss": -24.993459701538086, "global_step": 239885, "epoch": 2890} {"train_loss": -24.95699691772461, "global_step": 239886, "epoch": 2890} {"train_loss": -24.8445987701416, "global_step": 239887, "epoch": 2890} {"train_loss": -24.618757247924805, "global_step": 239888, "epoch": 2890} {"train_loss": -24.773212432861328, "global_step": 239889, "epoch": 2890} {"train_loss": -24.721967697143555, "global_step": 239890, "epoch": 2890} {"train_loss": -24.805551528930664, "global_step": 239891, "epoch": 2890} {"train_loss": -24.873228073120117, "global_step": 239892, "epoch": 2890} {"train_loss": -24.743955612182617, "global_step": 239893, "epoch": 2890} {"train_loss": -24.81842613220215, "global_step": 239894, "epoch": 2890} {"train_loss": -24.670053482055664, "global_step": 239895, "epoch": 2890} {"train_loss": -24.76706886291504, "global_step": 239896, "epoch": 2890} {"train_loss": -24.64808464050293, "global_step": 239897, "epoch": 2890} {"train_loss": -24.771305084228516, "global_step": 239898, "epoch": 2890} {"train_loss": -25.233604431152344, "global_step": 239899, "epoch": 2890} {"train_loss": -24.957483291625977, "global_step": 239900, "epoch": 2890} {"train_loss": -24.762643814086914, "global_step": 239901, "epoch": 2890} {"train_loss": -25.171213150024414, "global_step": 239902, "epoch": 2890} {"train_loss": -24.68290901184082, "global_step": 239903, "epoch": 2890} {"train_loss": -24.78868293762207, "global_step": 239904, "epoch": 2890} {"train_loss": -24.79344940185547, "global_step": 239905, "epoch": 2890} {"train_loss": -24.884626388549805, "global_step": 239906, "epoch": 2890} {"train_loss": -24.875329971313477, "global_step": 239907, "epoch": 2890} {"train_loss": -24.664194107055664, "global_step": 239908, "epoch": 2890} {"train_loss": -25.11799430847168, "global_step": 239909, "epoch": 2890} {"train_loss": -25.031646728515625, "global_step": 239910, "epoch": 2890} {"train_loss": -24.789892196655273, "global_step": 239911, "epoch": 2890} {"train_loss": -24.65867805480957, "global_step": 239912, "epoch": 2890} {"train_loss": -24.94012451171875, "global_step": 239913, "epoch": 2890} {"train_loss": -24.301227569580078, "global_step": 239914, "epoch": 2890} {"train_loss": -25.03535270690918, "global_step": 239915, "epoch": 2890} {"train_loss": -24.863922119140625, "global_step": 239916, "epoch": 2890} {"train_loss": -24.446338653564453, "global_step": 239917, "epoch": 2890} {"train_loss": -24.724102020263672, "global_step": 239918, "epoch": 2890} {"train_loss": -24.87769317626953, "global_step": 239919, "epoch": 2890} {"train_loss": -24.908771514892578, "global_step": 239920, "epoch": 2890} {"train_loss": -25.03154754638672, "global_step": 239921, "epoch": 2890} {"train_loss": -24.846261978149414, "global_step": 239922, "epoch": 2890} {"train_loss": -24.828983306884766, "global_step": 239923, "epoch": 2890} {"train_loss": -24.67396354675293, "global_step": 239924, "epoch": 2890} {"train_loss": -24.85392951965332, "global_step": 239925, "epoch": 2890} {"train_loss": -24.47775650024414, "global_step": 239926, "epoch": 2890} {"train_loss": -24.61270523071289, "global_step": 239927, "epoch": 2890} {"train_loss": -24.48830795288086, "global_step": 239928, "epoch": 2890} {"train_loss": -24.78172492980957, "global_step": 239929, "epoch": 2890} {"train_loss": -24.823434829711914, "global_step": 239930, "epoch": 2890} {"train_loss": -24.653690338134766, "global_step": 239931, "epoch": 2890} {"train_loss": -24.9619083404541, "global_step": 239932, "epoch": 2890} {"train_loss": -24.892135620117188, "global_step": 239933, "epoch": 2890} {"train_loss": -24.788421630859375, "global_step": 239934, "epoch": 2890} {"train_loss": -25.13754653930664, "global_step": 239935, "epoch": 2890} {"train_loss": -24.741992950439453, "global_step": 239936, "epoch": 2890} {"train_loss": -24.96681022644043, "global_step": 239937, "epoch": 2890} {"train_loss": -24.77528953552246, "global_step": 239938, "epoch": 2890} {"train_loss": -24.990985870361328, "global_step": 239939, "epoch": 2890} {"train_loss": -25.150449752807617, "global_step": 239940, "epoch": 2890} {"train_loss": -24.717321395874023, "global_step": 239941, "epoch": 2890} {"train_loss": -25.05885124206543, "global_step": 239942, "epoch": 2890} {"train_loss": -24.8538761138916, "global_step": 239943, "epoch": 2890} {"train_loss": -25.200162887573242, "global_step": 239944, "epoch": 2890} {"train_loss": -25.193286895751953, "global_step": 239945, "epoch": 2890} {"train_loss": -24.82575798034668, "global_step": 239946, "epoch": 2890} {"train_loss": -25.10933494567871, "global_step": 239947, "epoch": 2890} {"train_loss": -24.767118453979492, "global_step": 239948, "epoch": 2890} {"train_loss": -24.75472068786621, "global_step": 239949, "epoch": 2890} {"train_loss": -25.370359420776367, "global_step": 239950, "epoch": 2890} {"train_loss": -25.053617477416992, "global_step": 239951, "epoch": 2890} {"train_loss": -24.795649402112847, "global_step": 239952, "epoch": 2890, "val_loss": 6849621.0} {"train_loss": -24.912616729736328, "global_step": 239953, "epoch": 2891} {"train_loss": -24.54680824279785, "global_step": 239954, "epoch": 2891} {"train_loss": -24.789209365844727, "global_step": 239955, "epoch": 2891} {"train_loss": -24.541044235229492, "global_step": 239956, "epoch": 2891} {"train_loss": -24.509614944458008, "global_step": 239957, "epoch": 2891} {"train_loss": -24.615131378173828, "global_step": 239958, "epoch": 2891} {"train_loss": -24.23895263671875, "global_step": 239959, "epoch": 2891} {"train_loss": -24.495059967041016, "global_step": 239960, "epoch": 2891} {"train_loss": -24.388275146484375, "global_step": 239961, "epoch": 2891} {"train_loss": -24.56098747253418, "global_step": 239962, "epoch": 2891} {"train_loss": -24.385540008544922, "global_step": 239963, "epoch": 2891} {"train_loss": -24.82696533203125, "global_step": 239964, "epoch": 2891} {"train_loss": -24.266510009765625, "global_step": 239965, "epoch": 2891} {"train_loss": -24.691625595092773, "global_step": 239966, "epoch": 2891} {"train_loss": -24.603654861450195, "global_step": 239967, "epoch": 2891} {"train_loss": -24.83693504333496, "global_step": 239968, "epoch": 2891} {"train_loss": -24.493244171142578, "global_step": 239969, "epoch": 2891} {"train_loss": -24.56995964050293, "global_step": 239970, "epoch": 2891} {"train_loss": -24.972110748291016, "global_step": 239971, "epoch": 2891} {"train_loss": -24.58957862854004, "global_step": 239972, "epoch": 2891} {"train_loss": -24.748361587524414, "global_step": 239973, "epoch": 2891} {"train_loss": -25.02035903930664, "global_step": 239974, "epoch": 2891} {"train_loss": -24.64762306213379, "global_step": 239975, "epoch": 2891} {"train_loss": -25.0428524017334, "global_step": 239976, "epoch": 2891} {"train_loss": -24.920063018798828, "global_step": 239977, "epoch": 2891} {"train_loss": -24.505075454711914, "global_step": 239978, "epoch": 2891} {"train_loss": -24.702009201049805, "global_step": 239979, "epoch": 2891} {"train_loss": -24.784072875976562, "global_step": 239980, "epoch": 2891} {"train_loss": -24.442846298217773, "global_step": 239981, "epoch": 2891} {"train_loss": -24.6613712310791, "global_step": 239982, "epoch": 2891} {"train_loss": -25.290206909179688, "global_step": 239983, "epoch": 2891} {"train_loss": -24.87769317626953, "global_step": 239984, "epoch": 2891} {"train_loss": -24.653230667114258, "global_step": 239985, "epoch": 2891} {"train_loss": -24.876941680908203, "global_step": 239986, "epoch": 2891} {"train_loss": -25.1267147064209, "global_step": 239987, "epoch": 2891} {"train_loss": -24.5328311920166, "global_step": 239988, "epoch": 2891} {"train_loss": -24.892717361450195, "global_step": 239989, "epoch": 2891} {"train_loss": -24.95870018005371, "global_step": 239990, "epoch": 2891} {"train_loss": -24.6616268157959, "global_step": 239991, "epoch": 2891} {"train_loss": -24.84510612487793, "global_step": 239992, "epoch": 2891} {"train_loss": -24.98103141784668, "global_step": 239993, "epoch": 2891} {"train_loss": -25.123437881469727, "global_step": 239994, "epoch": 2891} {"train_loss": -24.907936096191406, "global_step": 239995, "epoch": 2891} {"train_loss": -25.258420944213867, "global_step": 239996, "epoch": 2891} {"train_loss": -25.037221908569336, "global_step": 239997, "epoch": 2891} {"train_loss": -24.977033615112305, "global_step": 239998, "epoch": 2891} {"train_loss": -24.651447296142578, "global_step": 239999, "epoch": 2891} {"train_loss": -25.16761016845703, "global_step": 240000, "epoch": 2891} {"train_loss": -25.11868667602539, "global_step": 240001, "epoch": 2891} {"train_loss": -25.225311279296875, "global_step": 240002, "epoch": 2891} {"train_loss": -24.907278060913086, "global_step": 240003, "epoch": 2891} {"train_loss": -25.181791305541992, "global_step": 240004, "epoch": 2891} {"train_loss": -25.066694259643555, "global_step": 240005, "epoch": 2891} {"train_loss": -24.79854393005371, "global_step": 240006, "epoch": 2891} {"train_loss": -24.8186092376709, "global_step": 240007, "epoch": 2891} {"train_loss": -24.88498878479004, "global_step": 240008, "epoch": 2891} {"train_loss": -25.054489135742188, "global_step": 240009, "epoch": 2891} {"train_loss": -24.749258041381836, "global_step": 240010, "epoch": 2891} {"train_loss": -24.707447052001953, "global_step": 240011, "epoch": 2891} {"train_loss": -24.601505279541016, "global_step": 240012, "epoch": 2891} {"train_loss": -25.063007354736328, "global_step": 240013, "epoch": 2891} {"train_loss": -24.80673599243164, "global_step": 240014, "epoch": 2891} {"train_loss": -24.795087814331055, "global_step": 240015, "epoch": 2891} {"train_loss": -24.884109497070312, "global_step": 240016, "epoch": 2891} {"train_loss": -24.72612190246582, "global_step": 240017, "epoch": 2891} {"train_loss": -24.958005905151367, "global_step": 240018, "epoch": 2891} {"train_loss": -24.858596801757812, "global_step": 240019, "epoch": 2891} {"train_loss": -24.93865394592285, "global_step": 240020, "epoch": 2891} {"train_loss": -24.69101333618164, "global_step": 240021, "epoch": 2891} {"train_loss": -24.657745361328125, "global_step": 240022, "epoch": 2891} {"train_loss": -24.89525604248047, "global_step": 240023, "epoch": 2891} {"train_loss": -24.718820571899414, "global_step": 240024, "epoch": 2891} {"train_loss": -24.713956832885742, "global_step": 240025, "epoch": 2891} {"train_loss": -24.922853469848633, "global_step": 240026, "epoch": 2891} {"train_loss": -24.437040328979492, "global_step": 240027, "epoch": 2891} {"train_loss": -24.735517501831055, "global_step": 240028, "epoch": 2891} {"train_loss": -25.15296745300293, "global_step": 240029, "epoch": 2891} {"train_loss": -24.880996704101562, "global_step": 240030, "epoch": 2891} {"train_loss": -24.820819854736328, "global_step": 240031, "epoch": 2891} {"train_loss": -25.0283203125, "global_step": 240032, "epoch": 2891} {"train_loss": -25.121543884277344, "global_step": 240033, "epoch": 2891} {"train_loss": -24.723899841308594, "global_step": 240034, "epoch": 2891} {"train_loss": -24.803780015692652, "global_step": 240035, "epoch": 2891, "val_loss": 6731888.5} {"train_loss": -23.829288482666016, "global_step": 240036, "epoch": 2892} {"train_loss": -23.985246658325195, "global_step": 240037, "epoch": 2892} {"train_loss": -23.523395538330078, "global_step": 240038, "epoch": 2892} {"train_loss": -23.946613311767578, "global_step": 240039, "epoch": 2892} {"train_loss": -24.126005172729492, "global_step": 240040, "epoch": 2892} {"train_loss": -24.55710220336914, "global_step": 240041, "epoch": 2892} {"train_loss": -24.37677574157715, "global_step": 240042, "epoch": 2892} {"train_loss": -24.80877113342285, "global_step": 240043, "epoch": 2892} {"train_loss": -24.54883575439453, "global_step": 240044, "epoch": 2892} {"train_loss": -24.538877487182617, "global_step": 240045, "epoch": 2892} {"train_loss": -24.56996726989746, "global_step": 240046, "epoch": 2892} {"train_loss": -24.755849838256836, "global_step": 240047, "epoch": 2892} {"train_loss": -24.415897369384766, "global_step": 240048, "epoch": 2892} {"train_loss": -24.615854263305664, "global_step": 240049, "epoch": 2892} {"train_loss": -24.58491325378418, "global_step": 240050, "epoch": 2892} {"train_loss": -24.881635665893555, "global_step": 240051, "epoch": 2892} {"train_loss": -24.72064208984375, "global_step": 240052, "epoch": 2892} {"train_loss": -24.568029403686523, "global_step": 240053, "epoch": 2892} {"train_loss": -25.033641815185547, "global_step": 240054, "epoch": 2892} {"train_loss": -24.60993003845215, "global_step": 240055, "epoch": 2892} {"train_loss": -24.854812622070312, "global_step": 240056, "epoch": 2892} {"train_loss": -24.85127830505371, "global_step": 240057, "epoch": 2892} {"train_loss": -25.097753524780273, "global_step": 240058, "epoch": 2892} {"train_loss": -24.67877960205078, "global_step": 240059, "epoch": 2892} {"train_loss": -25.041616439819336, "global_step": 240060, "epoch": 2892} {"train_loss": -24.699636459350586, "global_step": 240061, "epoch": 2892} {"train_loss": -24.664709091186523, "global_step": 240062, "epoch": 2892} {"train_loss": -25.13490867614746, "global_step": 240063, "epoch": 2892} {"train_loss": -24.550235748291016, "global_step": 240064, "epoch": 2892} {"train_loss": -24.550647735595703, "global_step": 240065, "epoch": 2892} {"train_loss": -24.540937423706055, "global_step": 240066, "epoch": 2892} {"train_loss": -24.414152145385742, "global_step": 240067, "epoch": 2892} {"train_loss": -25.004995346069336, "global_step": 240068, "epoch": 2892} {"train_loss": -24.94709587097168, "global_step": 240069, "epoch": 2892} {"train_loss": -24.586566925048828, "global_step": 240070, "epoch": 2892} {"train_loss": -24.91263198852539, "global_step": 240071, "epoch": 2892} {"train_loss": -24.8984317779541, "global_step": 240072, "epoch": 2892} {"train_loss": -24.844892501831055, "global_step": 240073, "epoch": 2892} {"train_loss": -24.8983154296875, "global_step": 240074, "epoch": 2892} {"train_loss": -24.978404998779297, "global_step": 240075, "epoch": 2892} {"train_loss": -24.783721923828125, "global_step": 240076, "epoch": 2892} {"train_loss": -25.07852554321289, "global_step": 240077, "epoch": 2892} {"train_loss": -24.588525772094727, "global_step": 240078, "epoch": 2892} {"train_loss": -24.858036041259766, "global_step": 240079, "epoch": 2892} {"train_loss": -24.666791915893555, "global_step": 240080, "epoch": 2892} {"train_loss": -24.12249755859375, "global_step": 240081, "epoch": 2892} {"train_loss": -25.05403709411621, "global_step": 240082, "epoch": 2892} {"train_loss": -24.531972885131836, "global_step": 240083, "epoch": 2892} {"train_loss": -24.648880004882812, "global_step": 240084, "epoch": 2892} {"train_loss": -24.606630325317383, "global_step": 240085, "epoch": 2892} {"train_loss": -25.071077346801758, "global_step": 240086, "epoch": 2892} {"train_loss": -24.731735229492188, "global_step": 240087, "epoch": 2892} {"train_loss": -24.73361587524414, "global_step": 240088, "epoch": 2892} {"train_loss": -24.99236488342285, "global_step": 240089, "epoch": 2892} {"train_loss": -24.836685180664062, "global_step": 240090, "epoch": 2892} {"train_loss": -25.166168212890625, "global_step": 240091, "epoch": 2892} {"train_loss": -24.842374801635742, "global_step": 240092, "epoch": 2892} {"train_loss": -24.85790252685547, "global_step": 240093, "epoch": 2892} {"train_loss": -24.708749771118164, "global_step": 240094, "epoch": 2892} {"train_loss": -25.139135360717773, "global_step": 240095, "epoch": 2892} {"train_loss": -24.69179916381836, "global_step": 240096, "epoch": 2892} {"train_loss": -24.907800674438477, "global_step": 240097, "epoch": 2892} {"train_loss": -24.689741134643555, "global_step": 240098, "epoch": 2892} {"train_loss": -24.60849380493164, "global_step": 240099, "epoch": 2892} {"train_loss": -24.92510986328125, "global_step": 240100, "epoch": 2892} {"train_loss": -24.94264030456543, "global_step": 240101, "epoch": 2892} {"train_loss": -25.025867462158203, "global_step": 240102, "epoch": 2892} {"train_loss": -25.199871063232422, "global_step": 240103, "epoch": 2892} {"train_loss": -25.216930389404297, "global_step": 240104, "epoch": 2892} {"train_loss": -25.007001876831055, "global_step": 240105, "epoch": 2892} {"train_loss": -24.96578025817871, "global_step": 240106, "epoch": 2892} {"train_loss": -24.97144889831543, "global_step": 240107, "epoch": 2892} {"train_loss": -25.2445011138916, "global_step": 240108, "epoch": 2892} {"train_loss": -25.189937591552734, "global_step": 240109, "epoch": 2892} {"train_loss": -24.823949813842773, "global_step": 240110, "epoch": 2892} {"train_loss": -25.226316452026367, "global_step": 240111, "epoch": 2892} {"train_loss": -25.228050231933594, "global_step": 240112, "epoch": 2892} {"train_loss": -24.979734420776367, "global_step": 240113, "epoch": 2892} {"train_loss": -25.214567184448242, "global_step": 240114, "epoch": 2892} {"train_loss": -25.286285400390625, "global_step": 240115, "epoch": 2892} {"train_loss": -25.069263458251953, "global_step": 240116, "epoch": 2892} {"train_loss": -25.103422164916992, "global_step": 240117, "epoch": 2892} {"train_loss": -24.77864692871829, "global_step": 240118, "epoch": 2892, "val_loss": 6827082.0} {"train_loss": -24.160831451416016, "global_step": 240119, "epoch": 2893} {"train_loss": -24.548782348632812, "global_step": 240120, "epoch": 2893} {"train_loss": -24.213903427124023, "global_step": 240121, "epoch": 2893} {"train_loss": -25.000490188598633, "global_step": 240122, "epoch": 2893} {"train_loss": -24.563535690307617, "global_step": 240123, "epoch": 2893} {"train_loss": -24.78794288635254, "global_step": 240124, "epoch": 2893} {"train_loss": -24.33578872680664, "global_step": 240125, "epoch": 2893} {"train_loss": -24.572065353393555, "global_step": 240126, "epoch": 2893} {"train_loss": -24.4103946685791, "global_step": 240127, "epoch": 2893} {"train_loss": -24.911930084228516, "global_step": 240128, "epoch": 2893} {"train_loss": -24.698394775390625, "global_step": 240129, "epoch": 2893} {"train_loss": -24.612258911132812, "global_step": 240130, "epoch": 2893} {"train_loss": -24.754436492919922, "global_step": 240131, "epoch": 2893} {"train_loss": -24.85735511779785, "global_step": 240132, "epoch": 2893} {"train_loss": -24.74325942993164, "global_step": 240133, "epoch": 2893} {"train_loss": -24.83323860168457, "global_step": 240134, "epoch": 2893} {"train_loss": -24.91253089904785, "global_step": 240135, "epoch": 2893} {"train_loss": -24.73333168029785, "global_step": 240136, "epoch": 2893} {"train_loss": -24.678747177124023, "global_step": 240137, "epoch": 2893} {"train_loss": -24.833511352539062, "global_step": 240138, "epoch": 2893} {"train_loss": -24.966928482055664, "global_step": 240139, "epoch": 2893} {"train_loss": -24.710437774658203, "global_step": 240140, "epoch": 2893} {"train_loss": -24.96660804748535, "global_step": 240141, "epoch": 2893} {"train_loss": -24.62110710144043, "global_step": 240142, "epoch": 2893} {"train_loss": -24.915985107421875, "global_step": 240143, "epoch": 2893} {"train_loss": -25.318754196166992, "global_step": 240144, "epoch": 2893} {"train_loss": -24.892019271850586, "global_step": 240145, "epoch": 2893} {"train_loss": -24.940536499023438, "global_step": 240146, "epoch": 2893} {"train_loss": -25.16698455810547, "global_step": 240147, "epoch": 2893} {"train_loss": -25.106876373291016, "global_step": 240148, "epoch": 2893} {"train_loss": -25.029666900634766, "global_step": 240149, "epoch": 2893} {"train_loss": -24.86078453063965, "global_step": 240150, "epoch": 2893} {"train_loss": -24.875085830688477, "global_step": 240151, "epoch": 2893} {"train_loss": -25.132043838500977, "global_step": 240152, "epoch": 2893} {"train_loss": -24.801916122436523, "global_step": 240153, "epoch": 2893} {"train_loss": -24.612642288208008, "global_step": 240154, "epoch": 2893} {"train_loss": -25.262296676635742, "global_step": 240155, "epoch": 2893} {"train_loss": -25.085128784179688, "global_step": 240156, "epoch": 2893} {"train_loss": -24.97170066833496, "global_step": 240157, "epoch": 2893} {"train_loss": -25.259937286376953, "global_step": 240158, "epoch": 2893} {"train_loss": -25.198734283447266, "global_step": 240159, "epoch": 2893} {"train_loss": -24.986936569213867, "global_step": 240160, "epoch": 2893} {"train_loss": -25.120075225830078, "global_step": 240161, "epoch": 2893} {"train_loss": -24.998779296875, "global_step": 240162, "epoch": 2893} {"train_loss": -24.55634117126465, "global_step": 240163, "epoch": 2893} {"train_loss": -23.434507369995117, "global_step": 240164, "epoch": 2893} {"train_loss": -23.25246238708496, "global_step": 240165, "epoch": 2893} {"train_loss": -24.127790451049805, "global_step": 240166, "epoch": 2893} {"train_loss": -24.415395736694336, "global_step": 240167, "epoch": 2893} {"train_loss": -23.470117568969727, "global_step": 240168, "epoch": 2893} {"train_loss": -24.170886993408203, "global_step": 240169, "epoch": 2893} {"train_loss": -24.376832962036133, "global_step": 240170, "epoch": 2893} {"train_loss": -24.12743377685547, "global_step": 240171, "epoch": 2893} {"train_loss": -24.76650047302246, "global_step": 240172, "epoch": 2893} {"train_loss": -24.450057983398438, "global_step": 240173, "epoch": 2893} {"train_loss": -24.34111976623535, "global_step": 240174, "epoch": 2893} {"train_loss": -24.089536666870117, "global_step": 240175, "epoch": 2893} {"train_loss": -24.583349227905273, "global_step": 240176, "epoch": 2893} {"train_loss": -24.400487899780273, "global_step": 240177, "epoch": 2893} {"train_loss": -24.43121337890625, "global_step": 240178, "epoch": 2893} {"train_loss": -24.413284301757812, "global_step": 240179, "epoch": 2893} {"train_loss": -24.468324661254883, "global_step": 240180, "epoch": 2893} {"train_loss": -24.46616554260254, "global_step": 240181, "epoch": 2893} {"train_loss": -24.44443702697754, "global_step": 240182, "epoch": 2893} {"train_loss": -24.541202545166016, "global_step": 240183, "epoch": 2893} {"train_loss": -24.68730354309082, "global_step": 240184, "epoch": 2893} {"train_loss": -24.325559616088867, "global_step": 240185, "epoch": 2893} {"train_loss": -24.576860427856445, "global_step": 240186, "epoch": 2893} {"train_loss": -24.70656967163086, "global_step": 240187, "epoch": 2893} {"train_loss": -24.621549606323242, "global_step": 240188, "epoch": 2893} {"train_loss": -24.955787658691406, "global_step": 240189, "epoch": 2893} {"train_loss": -24.493728637695312, "global_step": 240190, "epoch": 2893} {"train_loss": -25.1240291595459, "global_step": 240191, "epoch": 2893} {"train_loss": -24.7207088470459, "global_step": 240192, "epoch": 2893} {"train_loss": -24.621204376220703, "global_step": 240193, "epoch": 2893} {"train_loss": -24.611133575439453, "global_step": 240194, "epoch": 2893} {"train_loss": -24.409582138061523, "global_step": 240195, "epoch": 2893} {"train_loss": -24.8916072845459, "global_step": 240196, "epoch": 2893} {"train_loss": -24.812389373779297, "global_step": 240197, "epoch": 2893} {"train_loss": -24.8583927154541, "global_step": 240198, "epoch": 2893} {"train_loss": -24.990720748901367, "global_step": 240199, "epoch": 2893} {"train_loss": -25.02216148376465, "global_step": 240200, "epoch": 2893} {"train_loss": -24.662311209253517, "global_step": 240201, "epoch": 2893, "val_loss": 6760837.0} {"train_loss": -24.2902774810791, "global_step": 240202, "epoch": 2894} {"train_loss": -24.786434173583984, "global_step": 240203, "epoch": 2894} {"train_loss": -24.803852081298828, "global_step": 240204, "epoch": 2894} {"train_loss": -24.531124114990234, "global_step": 240205, "epoch": 2894} {"train_loss": -24.55317497253418, "global_step": 240206, "epoch": 2894} {"train_loss": -24.524620056152344, "global_step": 240207, "epoch": 2894} {"train_loss": -24.87210464477539, "global_step": 240208, "epoch": 2894} {"train_loss": -24.8062744140625, "global_step": 240209, "epoch": 2894} {"train_loss": -24.7915096282959, "global_step": 240210, "epoch": 2894} {"train_loss": -24.44856071472168, "global_step": 240211, "epoch": 2894} {"train_loss": -24.69978904724121, "global_step": 240212, "epoch": 2894} {"train_loss": -24.541284561157227, "global_step": 240213, "epoch": 2894} {"train_loss": -24.791101455688477, "global_step": 240214, "epoch": 2894} {"train_loss": -24.880094528198242, "global_step": 240215, "epoch": 2894} {"train_loss": -25.33431053161621, "global_step": 240216, "epoch": 2894} {"train_loss": -24.91180992126465, "global_step": 240217, "epoch": 2894} {"train_loss": -24.920093536376953, "global_step": 240218, "epoch": 2894} {"train_loss": -24.904449462890625, "global_step": 240219, "epoch": 2894} {"train_loss": -25.263137817382812, "global_step": 240220, "epoch": 2894} {"train_loss": -24.684003829956055, "global_step": 240221, "epoch": 2894} {"train_loss": -25.28632164001465, "global_step": 240222, "epoch": 2894} {"train_loss": -24.929458618164062, "global_step": 240223, "epoch": 2894} {"train_loss": -24.848535537719727, "global_step": 240224, "epoch": 2894} {"train_loss": -24.99687385559082, "global_step": 240225, "epoch": 2894} {"train_loss": -25.00313377380371, "global_step": 240226, "epoch": 2894} {"train_loss": -25.071027755737305, "global_step": 240227, "epoch": 2894} {"train_loss": -24.893606185913086, "global_step": 240228, "epoch": 2894} {"train_loss": -24.941940307617188, "global_step": 240229, "epoch": 2894} {"train_loss": -24.63454246520996, "global_step": 240230, "epoch": 2894} {"train_loss": -24.8787784576416, "global_step": 240231, "epoch": 2894} {"train_loss": -24.9604434967041, "global_step": 240232, "epoch": 2894} {"train_loss": -24.98944854736328, "global_step": 240233, "epoch": 2894} {"train_loss": -24.907527923583984, "global_step": 240234, "epoch": 2894} {"train_loss": -25.054292678833008, "global_step": 240235, "epoch": 2894} {"train_loss": -24.654783248901367, "global_step": 240236, "epoch": 2894} {"train_loss": -25.223356246948242, "global_step": 240237, "epoch": 2894} {"train_loss": -25.12965202331543, "global_step": 240238, "epoch": 2894} {"train_loss": -25.44979476928711, "global_step": 240239, "epoch": 2894} {"train_loss": -24.61613655090332, "global_step": 240240, "epoch": 2894} {"train_loss": -24.532079696655273, "global_step": 240241, "epoch": 2894} {"train_loss": -24.913177490234375, "global_step": 240242, "epoch": 2894} {"train_loss": -24.739709854125977, "global_step": 240243, "epoch": 2894} {"train_loss": -24.840219497680664, "global_step": 240244, "epoch": 2894} {"train_loss": -25.00372314453125, "global_step": 240245, "epoch": 2894} {"train_loss": -24.986066818237305, "global_step": 240246, "epoch": 2894} {"train_loss": -24.773685455322266, "global_step": 240247, "epoch": 2894} {"train_loss": -24.927770614624023, "global_step": 240248, "epoch": 2894} {"train_loss": -24.95258331298828, "global_step": 240249, "epoch": 2894} {"train_loss": -24.781095504760742, "global_step": 240250, "epoch": 2894} {"train_loss": -24.939512252807617, "global_step": 240251, "epoch": 2894} {"train_loss": -25.155271530151367, "global_step": 240252, "epoch": 2894} {"train_loss": -25.191059112548828, "global_step": 240253, "epoch": 2894} {"train_loss": -24.998716354370117, "global_step": 240254, "epoch": 2894} {"train_loss": -25.099014282226562, "global_step": 240255, "epoch": 2894} {"train_loss": -24.866867065429688, "global_step": 240256, "epoch": 2894} {"train_loss": -24.917877197265625, "global_step": 240257, "epoch": 2894} {"train_loss": -25.063188552856445, "global_step": 240258, "epoch": 2894} {"train_loss": -24.99761199951172, "global_step": 240259, "epoch": 2894} {"train_loss": -24.963708877563477, "global_step": 240260, "epoch": 2894} {"train_loss": -25.01979637145996, "global_step": 240261, "epoch": 2894} {"train_loss": -24.910818099975586, "global_step": 240262, "epoch": 2894} {"train_loss": -24.976850509643555, "global_step": 240263, "epoch": 2894} {"train_loss": -24.547561645507812, "global_step": 240264, "epoch": 2894} {"train_loss": -24.736494064331055, "global_step": 240265, "epoch": 2894} {"train_loss": -25.05951499938965, "global_step": 240266, "epoch": 2894} {"train_loss": -25.27056312561035, "global_step": 240267, "epoch": 2894} {"train_loss": -24.84433364868164, "global_step": 240268, "epoch": 2894} {"train_loss": -25.051340103149414, "global_step": 240269, "epoch": 2894} {"train_loss": -24.616941452026367, "global_step": 240270, "epoch": 2894} {"train_loss": -24.956933975219727, "global_step": 240271, "epoch": 2894} {"train_loss": -24.63487434387207, "global_step": 240272, "epoch": 2894} {"train_loss": -24.85348892211914, "global_step": 240273, "epoch": 2894} {"train_loss": -24.69386100769043, "global_step": 240274, "epoch": 2894} {"train_loss": -25.080543518066406, "global_step": 240275, "epoch": 2894} {"train_loss": -24.691665649414062, "global_step": 240276, "epoch": 2894} {"train_loss": -24.795969009399414, "global_step": 240277, "epoch": 2894} {"train_loss": -24.20950698852539, "global_step": 240278, "epoch": 2894} {"train_loss": -24.606008529663086, "global_step": 240279, "epoch": 2894} {"train_loss": -24.77898406982422, "global_step": 240280, "epoch": 2894} {"train_loss": -24.307205200195312, "global_step": 240281, "epoch": 2894} {"train_loss": -24.592138290405273, "global_step": 240282, "epoch": 2894} {"train_loss": -24.605117797851562, "global_step": 240283, "epoch": 2894} {"train_loss": -24.857981072850976, "global_step": 240284, "epoch": 2894, "val_loss": 6996233.5} {"train_loss": -23.71909523010254, "global_step": 240285, "epoch": 2895} {"train_loss": -24.071481704711914, "global_step": 240286, "epoch": 2895} {"train_loss": -24.617225646972656, "global_step": 240287, "epoch": 2895} {"train_loss": -23.682632446289062, "global_step": 240288, "epoch": 2895} {"train_loss": -24.256731033325195, "global_step": 240289, "epoch": 2895} {"train_loss": -23.809843063354492, "global_step": 240290, "epoch": 2895} {"train_loss": -24.131412506103516, "global_step": 240291, "epoch": 2895} {"train_loss": -24.11661720275879, "global_step": 240292, "epoch": 2895} {"train_loss": -24.583959579467773, "global_step": 240293, "epoch": 2895} {"train_loss": -24.615741729736328, "global_step": 240294, "epoch": 2895} {"train_loss": -24.33131217956543, "global_step": 240295, "epoch": 2895} {"train_loss": -24.375646591186523, "global_step": 240296, "epoch": 2895} {"train_loss": -24.379531860351562, "global_step": 240297, "epoch": 2895} {"train_loss": -23.91703987121582, "global_step": 240298, "epoch": 2895} {"train_loss": -24.604991912841797, "global_step": 240299, "epoch": 2895} {"train_loss": -24.128116607666016, "global_step": 240300, "epoch": 2895} {"train_loss": -24.661352157592773, "global_step": 240301, "epoch": 2895} {"train_loss": -24.554529190063477, "global_step": 240302, "epoch": 2895} {"train_loss": -24.350910186767578, "global_step": 240303, "epoch": 2895} {"train_loss": -24.473005294799805, "global_step": 240304, "epoch": 2895} {"train_loss": -24.29119300842285, "global_step": 240305, "epoch": 2895} {"train_loss": -24.6945858001709, "global_step": 240306, "epoch": 2895} {"train_loss": -24.506195068359375, "global_step": 240307, "epoch": 2895} {"train_loss": -24.59271812438965, "global_step": 240308, "epoch": 2895} {"train_loss": -24.82097053527832, "global_step": 240309, "epoch": 2895} {"train_loss": -24.560583114624023, "global_step": 240310, "epoch": 2895} {"train_loss": -24.44610023498535, "global_step": 240311, "epoch": 2895} {"train_loss": -24.80879020690918, "global_step": 240312, "epoch": 2895} {"train_loss": -24.856830596923828, "global_step": 240313, "epoch": 2895} {"train_loss": -25.049070358276367, "global_step": 240314, "epoch": 2895} {"train_loss": -24.89878273010254, "global_step": 240315, "epoch": 2895} {"train_loss": -24.648534774780273, "global_step": 240316, "epoch": 2895} {"train_loss": -24.777891159057617, "global_step": 240317, "epoch": 2895} {"train_loss": -24.75653648376465, "global_step": 240318, "epoch": 2895} {"train_loss": -24.64823341369629, "global_step": 240319, "epoch": 2895} {"train_loss": -24.703454971313477, "global_step": 240320, "epoch": 2895} {"train_loss": -24.759206771850586, "global_step": 240321, "epoch": 2895} {"train_loss": -24.592388153076172, "global_step": 240322, "epoch": 2895} {"train_loss": -24.74549674987793, "global_step": 240323, "epoch": 2895} {"train_loss": -25.124998092651367, "global_step": 240324, "epoch": 2895} {"train_loss": -24.859371185302734, "global_step": 240325, "epoch": 2895} {"train_loss": -24.71222496032715, "global_step": 240326, "epoch": 2895} {"train_loss": -25.239198684692383, "global_step": 240327, "epoch": 2895} {"train_loss": -25.09346580505371, "global_step": 240328, "epoch": 2895} {"train_loss": -25.009031295776367, "global_step": 240329, "epoch": 2895} {"train_loss": -25.06693458557129, "global_step": 240330, "epoch": 2895} {"train_loss": -25.076948165893555, "global_step": 240331, "epoch": 2895} {"train_loss": -24.920658111572266, "global_step": 240332, "epoch": 2895} {"train_loss": -25.07826042175293, "global_step": 240333, "epoch": 2895} {"train_loss": -25.003223419189453, "global_step": 240334, "epoch": 2895} {"train_loss": -25.18623161315918, "global_step": 240335, "epoch": 2895} {"train_loss": -24.984182357788086, "global_step": 240336, "epoch": 2895} {"train_loss": -24.991104125976562, "global_step": 240337, "epoch": 2895} {"train_loss": -24.865432739257812, "global_step": 240338, "epoch": 2895} {"train_loss": -25.34405517578125, "global_step": 240339, "epoch": 2895} {"train_loss": -25.403303146362305, "global_step": 240340, "epoch": 2895} {"train_loss": -25.141145706176758, "global_step": 240341, "epoch": 2895} {"train_loss": -25.19965171813965, "global_step": 240342, "epoch": 2895} {"train_loss": -24.781919479370117, "global_step": 240343, "epoch": 2895} {"train_loss": -24.68703269958496, "global_step": 240344, "epoch": 2895} {"train_loss": -24.786176681518555, "global_step": 240345, "epoch": 2895} {"train_loss": -25.00840950012207, "global_step": 240346, "epoch": 2895} {"train_loss": -24.698766708374023, "global_step": 240347, "epoch": 2895} {"train_loss": -24.87624168395996, "global_step": 240348, "epoch": 2895} {"train_loss": -25.30311393737793, "global_step": 240349, "epoch": 2895} {"train_loss": -25.049421310424805, "global_step": 240350, "epoch": 2895} {"train_loss": -24.989519119262695, "global_step": 240351, "epoch": 2895} {"train_loss": -24.985280990600586, "global_step": 240352, "epoch": 2895} {"train_loss": -25.114004135131836, "global_step": 240353, "epoch": 2895} {"train_loss": -24.780807495117188, "global_step": 240354, "epoch": 2895} {"train_loss": -24.906457901000977, "global_step": 240355, "epoch": 2895} {"train_loss": -24.751169204711914, "global_step": 240356, "epoch": 2895} {"train_loss": -24.4134578704834, "global_step": 240357, "epoch": 2895} {"train_loss": -24.684465408325195, "global_step": 240358, "epoch": 2895} {"train_loss": -24.535491943359375, "global_step": 240359, "epoch": 2895} {"train_loss": -24.631885528564453, "global_step": 240360, "epoch": 2895} {"train_loss": -25.214004516601562, "global_step": 240361, "epoch": 2895} {"train_loss": -24.851978302001953, "global_step": 240362, "epoch": 2895} {"train_loss": -25.04827880859375, "global_step": 240363, "epoch": 2895} {"train_loss": -25.166610717773438, "global_step": 240364, "epoch": 2895} {"train_loss": -24.763534545898438, "global_step": 240365, "epoch": 2895} {"train_loss": -24.952470779418945, "global_step": 240366, "epoch": 2895} {"train_loss": -24.73774746814406, "global_step": 240367, "epoch": 2895, "val_loss": 6805742.5} {"train_loss": -24.739933013916016, "global_step": 240368, "epoch": 2896} {"train_loss": -24.649837493896484, "global_step": 240369, "epoch": 2896} {"train_loss": -24.679567337036133, "global_step": 240370, "epoch": 2896} {"train_loss": -24.50064468383789, "global_step": 240371, "epoch": 2896} {"train_loss": -24.9105281829834, "global_step": 240372, "epoch": 2896} {"train_loss": -24.35672378540039, "global_step": 240373, "epoch": 2896} {"train_loss": -24.858402252197266, "global_step": 240374, "epoch": 2896} {"train_loss": -24.475488662719727, "global_step": 240375, "epoch": 2896} {"train_loss": -24.480152130126953, "global_step": 240376, "epoch": 2896} {"train_loss": -24.989185333251953, "global_step": 240377, "epoch": 2896} {"train_loss": -24.530256271362305, "global_step": 240378, "epoch": 2896} {"train_loss": -24.86621856689453, "global_step": 240379, "epoch": 2896} {"train_loss": -24.490705490112305, "global_step": 240380, "epoch": 2896} {"train_loss": -24.19121742248535, "global_step": 240381, "epoch": 2896} {"train_loss": -24.93120765686035, "global_step": 240382, "epoch": 2896} {"train_loss": -24.37369728088379, "global_step": 240383, "epoch": 2896} {"train_loss": -25.08027458190918, "global_step": 240384, "epoch": 2896} {"train_loss": -24.4151611328125, "global_step": 240385, "epoch": 2896} {"train_loss": -24.753908157348633, "global_step": 240386, "epoch": 2896} {"train_loss": -25.05510711669922, "global_step": 240387, "epoch": 2896} {"train_loss": -24.626461029052734, "global_step": 240388, "epoch": 2896} {"train_loss": -25.072649002075195, "global_step": 240389, "epoch": 2896} {"train_loss": -24.627471923828125, "global_step": 240390, "epoch": 2896} {"train_loss": -24.850740432739258, "global_step": 240391, "epoch": 2896} {"train_loss": -24.55655860900879, "global_step": 240392, "epoch": 2896} {"train_loss": -24.708951950073242, "global_step": 240393, "epoch": 2896} {"train_loss": -24.750680923461914, "global_step": 240394, "epoch": 2896} {"train_loss": -25.11157989501953, "global_step": 240395, "epoch": 2896} {"train_loss": -24.90609359741211, "global_step": 240396, "epoch": 2896} {"train_loss": -24.778465270996094, "global_step": 240397, "epoch": 2896} {"train_loss": -24.913440704345703, "global_step": 240398, "epoch": 2896} {"train_loss": -24.64453887939453, "global_step": 240399, "epoch": 2896} {"train_loss": -24.818979263305664, "global_step": 240400, "epoch": 2896} {"train_loss": -24.744449615478516, "global_step": 240401, "epoch": 2896} {"train_loss": -24.928937911987305, "global_step": 240402, "epoch": 2896} {"train_loss": -25.016916275024414, "global_step": 240403, "epoch": 2896} {"train_loss": -24.74380111694336, "global_step": 240404, "epoch": 2896} {"train_loss": -25.06787109375, "global_step": 240405, "epoch": 2896} {"train_loss": -24.926809310913086, "global_step": 240406, "epoch": 2896} {"train_loss": -25.45322036743164, "global_step": 240407, "epoch": 2896} {"train_loss": -24.664220809936523, "global_step": 240408, "epoch": 2896} {"train_loss": -24.651092529296875, "global_step": 240409, "epoch": 2896} {"train_loss": -25.140134811401367, "global_step": 240410, "epoch": 2896} {"train_loss": -24.915498733520508, "global_step": 240411, "epoch": 2896} {"train_loss": -24.82480239868164, "global_step": 240412, "epoch": 2896} {"train_loss": -24.929529190063477, "global_step": 240413, "epoch": 2896} {"train_loss": -24.72067642211914, "global_step": 240414, "epoch": 2896} {"train_loss": -24.736417770385742, "global_step": 240415, "epoch": 2896} {"train_loss": -24.88873863220215, "global_step": 240416, "epoch": 2896} {"train_loss": -24.810056686401367, "global_step": 240417, "epoch": 2896} {"train_loss": -25.0371036529541, "global_step": 240418, "epoch": 2896} {"train_loss": -24.60970115661621, "global_step": 240419, "epoch": 2896} {"train_loss": -24.637052536010742, "global_step": 240420, "epoch": 2896} {"train_loss": -25.26667594909668, "global_step": 240421, "epoch": 2896} {"train_loss": -24.979562759399414, "global_step": 240422, "epoch": 2896} {"train_loss": -24.90114402770996, "global_step": 240423, "epoch": 2896} {"train_loss": -24.633459091186523, "global_step": 240424, "epoch": 2896} {"train_loss": -25.00027847290039, "global_step": 240425, "epoch": 2896} {"train_loss": -24.975637435913086, "global_step": 240426, "epoch": 2896} {"train_loss": -24.96761131286621, "global_step": 240427, "epoch": 2896} {"train_loss": -24.829092025756836, "global_step": 240428, "epoch": 2896} {"train_loss": -25.265531539916992, "global_step": 240429, "epoch": 2896} {"train_loss": -24.954702377319336, "global_step": 240430, "epoch": 2896} {"train_loss": -24.64955711364746, "global_step": 240431, "epoch": 2896} {"train_loss": -25.156774520874023, "global_step": 240432, "epoch": 2896} {"train_loss": -24.762863159179688, "global_step": 240433, "epoch": 2896} {"train_loss": -24.735939025878906, "global_step": 240434, "epoch": 2896} {"train_loss": -24.80100440979004, "global_step": 240435, "epoch": 2896} {"train_loss": -25.065799713134766, "global_step": 240436, "epoch": 2896} {"train_loss": -24.756990432739258, "global_step": 240437, "epoch": 2896} {"train_loss": -24.79096794128418, "global_step": 240438, "epoch": 2896} {"train_loss": -25.263484954833984, "global_step": 240439, "epoch": 2896} {"train_loss": -24.964101791381836, "global_step": 240440, "epoch": 2896} {"train_loss": -24.87006950378418, "global_step": 240441, "epoch": 2896} {"train_loss": -24.894458770751953, "global_step": 240442, "epoch": 2896} {"train_loss": -24.904861450195312, "global_step": 240443, "epoch": 2896} {"train_loss": -24.647321701049805, "global_step": 240444, "epoch": 2896} {"train_loss": -24.88214683532715, "global_step": 240445, "epoch": 2896} {"train_loss": -24.827062606811523, "global_step": 240446, "epoch": 2896} {"train_loss": -25.117538452148438, "global_step": 240447, "epoch": 2896} {"train_loss": -24.815202713012695, "global_step": 240448, "epoch": 2896} {"train_loss": -24.8134822845459, "global_step": 240449, "epoch": 2896} {"train_loss": -24.82623704657497, "global_step": 240450, "epoch": 2896, "val_loss": 6811483.0} {"train_loss": -24.51765251159668, "global_step": 240451, "epoch": 2897} {"train_loss": -24.257129669189453, "global_step": 240452, "epoch": 2897} {"train_loss": -24.576231002807617, "global_step": 240453, "epoch": 2897} {"train_loss": -24.803207397460938, "global_step": 240454, "epoch": 2897} {"train_loss": -24.71082305908203, "global_step": 240455, "epoch": 2897} {"train_loss": -24.902761459350586, "global_step": 240456, "epoch": 2897} {"train_loss": -24.872915267944336, "global_step": 240457, "epoch": 2897} {"train_loss": -24.63081932067871, "global_step": 240458, "epoch": 2897} {"train_loss": -24.720129013061523, "global_step": 240459, "epoch": 2897} {"train_loss": -24.52390480041504, "global_step": 240460, "epoch": 2897} {"train_loss": -25.153079986572266, "global_step": 240461, "epoch": 2897} {"train_loss": -24.622465133666992, "global_step": 240462, "epoch": 2897} {"train_loss": -24.8018798828125, "global_step": 240463, "epoch": 2897} {"train_loss": -24.903186798095703, "global_step": 240464, "epoch": 2897} {"train_loss": -24.760942459106445, "global_step": 240465, "epoch": 2897} {"train_loss": -24.955705642700195, "global_step": 240466, "epoch": 2897} {"train_loss": -24.802213668823242, "global_step": 240467, "epoch": 2897} {"train_loss": -25.271326065063477, "global_step": 240468, "epoch": 2897} {"train_loss": -24.54971694946289, "global_step": 240469, "epoch": 2897} {"train_loss": -25.005298614501953, "global_step": 240470, "epoch": 2897} {"train_loss": -24.826501846313477, "global_step": 240471, "epoch": 2897} {"train_loss": -25.141035079956055, "global_step": 240472, "epoch": 2897} {"train_loss": -25.01230812072754, "global_step": 240473, "epoch": 2897} {"train_loss": -24.832605361938477, "global_step": 240474, "epoch": 2897} {"train_loss": -25.099353790283203, "global_step": 240475, "epoch": 2897} {"train_loss": -24.829483032226562, "global_step": 240476, "epoch": 2897} {"train_loss": -24.19239616394043, "global_step": 240477, "epoch": 2897} {"train_loss": -24.813392639160156, "global_step": 240478, "epoch": 2897} {"train_loss": -24.103792190551758, "global_step": 240479, "epoch": 2897} {"train_loss": -24.152963638305664, "global_step": 240480, "epoch": 2897} {"train_loss": -24.51686668395996, "global_step": 240481, "epoch": 2897} {"train_loss": -25.037555694580078, "global_step": 240482, "epoch": 2897} {"train_loss": -24.14092445373535, "global_step": 240483, "epoch": 2897} {"train_loss": -24.7600040435791, "global_step": 240484, "epoch": 2897} {"train_loss": -24.518484115600586, "global_step": 240485, "epoch": 2897} {"train_loss": -24.721662521362305, "global_step": 240486, "epoch": 2897} {"train_loss": -24.68124771118164, "global_step": 240487, "epoch": 2897} {"train_loss": -24.882240295410156, "global_step": 240488, "epoch": 2897} {"train_loss": -24.77138328552246, "global_step": 240489, "epoch": 2897} {"train_loss": -24.92230796813965, "global_step": 240490, "epoch": 2897} {"train_loss": -24.580184936523438, "global_step": 240491, "epoch": 2897} {"train_loss": -24.999526977539062, "global_step": 240492, "epoch": 2897} {"train_loss": -24.690574645996094, "global_step": 240493, "epoch": 2897} {"train_loss": -24.988683700561523, "global_step": 240494, "epoch": 2897} {"train_loss": -24.76910972595215, "global_step": 240495, "epoch": 2897} {"train_loss": -24.573463439941406, "global_step": 240496, "epoch": 2897} {"train_loss": -24.52139663696289, "global_step": 240497, "epoch": 2897} {"train_loss": -24.968236923217773, "global_step": 240498, "epoch": 2897} {"train_loss": -24.63619613647461, "global_step": 240499, "epoch": 2897} {"train_loss": -24.801729202270508, "global_step": 240500, "epoch": 2897} {"train_loss": -24.836429595947266, "global_step": 240501, "epoch": 2897} {"train_loss": -24.662824630737305, "global_step": 240502, "epoch": 2897} {"train_loss": -24.902477264404297, "global_step": 240503, "epoch": 2897} {"train_loss": -24.98809242248535, "global_step": 240504, "epoch": 2897} {"train_loss": -24.802743911743164, "global_step": 240505, "epoch": 2897} {"train_loss": -24.56743812561035, "global_step": 240506, "epoch": 2897} {"train_loss": -24.804443359375, "global_step": 240507, "epoch": 2897} {"train_loss": -24.320560455322266, "global_step": 240508, "epoch": 2897} {"train_loss": -24.474010467529297, "global_step": 240509, "epoch": 2897} {"train_loss": -25.027347564697266, "global_step": 240510, "epoch": 2897} {"train_loss": -24.917123794555664, "global_step": 240511, "epoch": 2897} {"train_loss": -24.7061710357666, "global_step": 240512, "epoch": 2897} {"train_loss": -24.71485710144043, "global_step": 240513, "epoch": 2897} {"train_loss": -24.750274658203125, "global_step": 240514, "epoch": 2897} {"train_loss": -25.227537155151367, "global_step": 240515, "epoch": 2897} {"train_loss": -24.98628044128418, "global_step": 240516, "epoch": 2897} {"train_loss": -24.976362228393555, "global_step": 240517, "epoch": 2897} {"train_loss": -25.098962783813477, "global_step": 240518, "epoch": 2897} {"train_loss": -24.79171371459961, "global_step": 240519, "epoch": 2897} {"train_loss": -24.862722396850586, "global_step": 240520, "epoch": 2897} {"train_loss": -24.97492218017578, "global_step": 240521, "epoch": 2897} {"train_loss": -25.075210571289062, "global_step": 240522, "epoch": 2897} {"train_loss": -24.774707794189453, "global_step": 240523, "epoch": 2897} {"train_loss": -24.97299575805664, "global_step": 240524, "epoch": 2897} {"train_loss": -24.761396408081055, "global_step": 240525, "epoch": 2897} {"train_loss": -25.223596572875977, "global_step": 240526, "epoch": 2897} {"train_loss": -24.879602432250977, "global_step": 240527, "epoch": 2897} {"train_loss": -25.04098892211914, "global_step": 240528, "epoch": 2897} {"train_loss": -25.09656524658203, "global_step": 240529, "epoch": 2897} {"train_loss": -25.088172912597656, "global_step": 240530, "epoch": 2897} {"train_loss": -24.97150230407715, "global_step": 240531, "epoch": 2897} {"train_loss": -25.302457809448242, "global_step": 240532, "epoch": 2897} {"train_loss": -24.780522357986634, "global_step": 240533, "epoch": 2897, "val_loss": 6809577.0} {"train_loss": -24.310178756713867, "global_step": 240534, "epoch": 2898} {"train_loss": -23.493717193603516, "global_step": 240535, "epoch": 2898} {"train_loss": -23.336088180541992, "global_step": 240536, "epoch": 2898} {"train_loss": -23.527494430541992, "global_step": 240537, "epoch": 2898} {"train_loss": -24.29938316345215, "global_step": 240538, "epoch": 2898} {"train_loss": -22.954648971557617, "global_step": 240539, "epoch": 2898} {"train_loss": -23.949277877807617, "global_step": 240540, "epoch": 2898} {"train_loss": -23.616077423095703, "global_step": 240541, "epoch": 2898} {"train_loss": -23.917516708374023, "global_step": 240542, "epoch": 2898} {"train_loss": -23.214624404907227, "global_step": 240543, "epoch": 2898} {"train_loss": -23.9625301361084, "global_step": 240544, "epoch": 2898} {"train_loss": -23.857929229736328, "global_step": 240545, "epoch": 2898} {"train_loss": -23.95465850830078, "global_step": 240546, "epoch": 2898} {"train_loss": -23.67204475402832, "global_step": 240547, "epoch": 2898} {"train_loss": -24.304567337036133, "global_step": 240548, "epoch": 2898} {"train_loss": -24.295133590698242, "global_step": 240549, "epoch": 2898} {"train_loss": -24.234378814697266, "global_step": 240550, "epoch": 2898} {"train_loss": -24.24606704711914, "global_step": 240551, "epoch": 2898} {"train_loss": -24.270263671875, "global_step": 240552, "epoch": 2898} {"train_loss": -24.281675338745117, "global_step": 240553, "epoch": 2898} {"train_loss": -23.57003402709961, "global_step": 240554, "epoch": 2898} {"train_loss": -24.168609619140625, "global_step": 240555, "epoch": 2898} {"train_loss": -24.38295555114746, "global_step": 240556, "epoch": 2898} {"train_loss": -24.31300163269043, "global_step": 240557, "epoch": 2898} {"train_loss": -24.505971908569336, "global_step": 240558, "epoch": 2898} {"train_loss": -24.512012481689453, "global_step": 240559, "epoch": 2898} {"train_loss": -24.612279891967773, "global_step": 240560, "epoch": 2898} {"train_loss": -24.664138793945312, "global_step": 240561, "epoch": 2898} {"train_loss": -24.538070678710938, "global_step": 240562, "epoch": 2898} {"train_loss": -24.621761322021484, "global_step": 240563, "epoch": 2898} {"train_loss": -24.69322967529297, "global_step": 240564, "epoch": 2898} {"train_loss": -24.630901336669922, "global_step": 240565, "epoch": 2898} {"train_loss": -24.383459091186523, "global_step": 240566, "epoch": 2898} {"train_loss": -24.872037887573242, "global_step": 240567, "epoch": 2898} {"train_loss": -24.470014572143555, "global_step": 240568, "epoch": 2898} {"train_loss": -25.276107788085938, "global_step": 240569, "epoch": 2898} {"train_loss": -24.606094360351562, "global_step": 240570, "epoch": 2898} {"train_loss": -24.583728790283203, "global_step": 240571, "epoch": 2898} {"train_loss": -25.093048095703125, "global_step": 240572, "epoch": 2898} {"train_loss": -24.890432357788086, "global_step": 240573, "epoch": 2898} {"train_loss": -25.204193115234375, "global_step": 240574, "epoch": 2898} {"train_loss": -24.792943954467773, "global_step": 240575, "epoch": 2898} {"train_loss": -24.920316696166992, "global_step": 240576, "epoch": 2898} {"train_loss": -25.02716636657715, "global_step": 240577, "epoch": 2898} {"train_loss": -25.322866439819336, "global_step": 240578, "epoch": 2898} {"train_loss": -24.76018714904785, "global_step": 240579, "epoch": 2898} {"train_loss": -25.08953857421875, "global_step": 240580, "epoch": 2898} {"train_loss": -25.089935302734375, "global_step": 240581, "epoch": 2898} {"train_loss": -24.880901336669922, "global_step": 240582, "epoch": 2898} {"train_loss": -24.845449447631836, "global_step": 240583, "epoch": 2898} {"train_loss": -25.20053482055664, "global_step": 240584, "epoch": 2898} {"train_loss": -25.138134002685547, "global_step": 240585, "epoch": 2898} {"train_loss": -24.80900001525879, "global_step": 240586, "epoch": 2898} {"train_loss": -24.877059936523438, "global_step": 240587, "epoch": 2898} {"train_loss": -24.97657585144043, "global_step": 240588, "epoch": 2898} {"train_loss": -24.90792465209961, "global_step": 240589, "epoch": 2898} {"train_loss": -24.971485137939453, "global_step": 240590, "epoch": 2898} {"train_loss": -25.03846549987793, "global_step": 240591, "epoch": 2898} {"train_loss": -24.837255477905273, "global_step": 240592, "epoch": 2898} {"train_loss": -24.823095321655273, "global_step": 240593, "epoch": 2898} {"train_loss": -25.112789154052734, "global_step": 240594, "epoch": 2898} {"train_loss": -25.238637924194336, "global_step": 240595, "epoch": 2898} {"train_loss": -25.09596061706543, "global_step": 240596, "epoch": 2898} {"train_loss": -24.573562622070312, "global_step": 240597, "epoch": 2898} {"train_loss": -24.78706169128418, "global_step": 240598, "epoch": 2898} {"train_loss": -24.888269424438477, "global_step": 240599, "epoch": 2898} {"train_loss": -24.421146392822266, "global_step": 240600, "epoch": 2898} {"train_loss": -25.038808822631836, "global_step": 240601, "epoch": 2898} {"train_loss": -24.584468841552734, "global_step": 240602, "epoch": 2898} {"train_loss": -24.938596725463867, "global_step": 240603, "epoch": 2898} {"train_loss": -24.67751121520996, "global_step": 240604, "epoch": 2898} {"train_loss": -25.41102409362793, "global_step": 240605, "epoch": 2898} {"train_loss": -25.06907081604004, "global_step": 240606, "epoch": 2898} {"train_loss": -24.800031661987305, "global_step": 240607, "epoch": 2898} {"train_loss": -24.99872398376465, "global_step": 240608, "epoch": 2898} {"train_loss": -24.711669921875, "global_step": 240609, "epoch": 2898} {"train_loss": -24.806241989135742, "global_step": 240610, "epoch": 2898} {"train_loss": -24.865703582763672, "global_step": 240611, "epoch": 2898} {"train_loss": -24.957387924194336, "global_step": 240612, "epoch": 2898} {"train_loss": -24.822011947631836, "global_step": 240613, "epoch": 2898} {"train_loss": -25.000213623046875, "global_step": 240614, "epoch": 2898} {"train_loss": -24.69025993347168, "global_step": 240615, "epoch": 2898} {"train_loss": -24.57197828177946, "global_step": 240616, "epoch": 2898, "val_loss": 6704550.5} {"train_loss": -23.964765548706055, "global_step": 240617, "epoch": 2899} {"train_loss": -24.20513343811035, "global_step": 240618, "epoch": 2899} {"train_loss": -24.128793716430664, "global_step": 240619, "epoch": 2899} {"train_loss": -24.182859420776367, "global_step": 240620, "epoch": 2899} {"train_loss": -24.606794357299805, "global_step": 240621, "epoch": 2899} {"train_loss": -24.549421310424805, "global_step": 240622, "epoch": 2899} {"train_loss": -23.775074005126953, "global_step": 240623, "epoch": 2899} {"train_loss": -24.255674362182617, "global_step": 240624, "epoch": 2899} {"train_loss": -24.201602935791016, "global_step": 240625, "epoch": 2899} {"train_loss": -24.29764747619629, "global_step": 240626, "epoch": 2899} {"train_loss": -24.7891845703125, "global_step": 240627, "epoch": 2899} {"train_loss": -24.5468807220459, "global_step": 240628, "epoch": 2899} {"train_loss": -24.549795150756836, "global_step": 240629, "epoch": 2899} {"train_loss": -24.33062744140625, "global_step": 240630, "epoch": 2899} {"train_loss": -24.126544952392578, "global_step": 240631, "epoch": 2899} {"train_loss": -24.58892059326172, "global_step": 240632, "epoch": 2899} {"train_loss": -24.440948486328125, "global_step": 240633, "epoch": 2899} {"train_loss": -24.7420654296875, "global_step": 240634, "epoch": 2899} {"train_loss": -24.344017028808594, "global_step": 240635, "epoch": 2899} {"train_loss": -24.71400260925293, "global_step": 240636, "epoch": 2899} {"train_loss": -24.87886619567871, "global_step": 240637, "epoch": 2899} {"train_loss": -24.614364624023438, "global_step": 240638, "epoch": 2899} {"train_loss": -24.481595993041992, "global_step": 240639, "epoch": 2899} {"train_loss": -24.770782470703125, "global_step": 240640, "epoch": 2899} {"train_loss": -24.46964454650879, "global_step": 240641, "epoch": 2899} {"train_loss": -24.647348403930664, "global_step": 240642, "epoch": 2899} {"train_loss": -24.690921783447266, "global_step": 240643, "epoch": 2899} {"train_loss": -24.297056198120117, "global_step": 240644, "epoch": 2899} {"train_loss": -24.950193405151367, "global_step": 240645, "epoch": 2899} {"train_loss": -24.65867805480957, "global_step": 240646, "epoch": 2899} {"train_loss": -25.084827423095703, "global_step": 240647, "epoch": 2899} {"train_loss": -24.745555877685547, "global_step": 240648, "epoch": 2899} {"train_loss": -24.715837478637695, "global_step": 240649, "epoch": 2899} {"train_loss": -24.983213424682617, "global_step": 240650, "epoch": 2899} {"train_loss": -24.92841148376465, "global_step": 240651, "epoch": 2899} {"train_loss": -24.90921401977539, "global_step": 240652, "epoch": 2899} {"train_loss": -24.82325553894043, "global_step": 240653, "epoch": 2899} {"train_loss": -24.703922271728516, "global_step": 240654, "epoch": 2899} {"train_loss": -24.77634620666504, "global_step": 240655, "epoch": 2899} {"train_loss": -24.799772262573242, "global_step": 240656, "epoch": 2899} {"train_loss": -24.866268157958984, "global_step": 240657, "epoch": 2899} {"train_loss": -24.850906372070312, "global_step": 240658, "epoch": 2899} {"train_loss": -24.850341796875, "global_step": 240659, "epoch": 2899} {"train_loss": -25.049579620361328, "global_step": 240660, "epoch": 2899} {"train_loss": -25.039226531982422, "global_step": 240661, "epoch": 2899} {"train_loss": -24.754148483276367, "global_step": 240662, "epoch": 2899} {"train_loss": -24.704416275024414, "global_step": 240663, "epoch": 2899} {"train_loss": -24.67258071899414, "global_step": 240664, "epoch": 2899} {"train_loss": -24.962080001831055, "global_step": 240665, "epoch": 2899} {"train_loss": -24.717824935913086, "global_step": 240666, "epoch": 2899} {"train_loss": -24.54627799987793, "global_step": 240667, "epoch": 2899} {"train_loss": -25.233890533447266, "global_step": 240668, "epoch": 2899} {"train_loss": -25.097646713256836, "global_step": 240669, "epoch": 2899} {"train_loss": -25.282970428466797, "global_step": 240670, "epoch": 2899} {"train_loss": -24.52704429626465, "global_step": 240671, "epoch": 2899} {"train_loss": -24.815292358398438, "global_step": 240672, "epoch": 2899} {"train_loss": -25.03365135192871, "global_step": 240673, "epoch": 2899} {"train_loss": -25.306859970092773, "global_step": 240674, "epoch": 2899} {"train_loss": -25.088956832885742, "global_step": 240675, "epoch": 2899} {"train_loss": -24.616498947143555, "global_step": 240676, "epoch": 2899} {"train_loss": -24.807764053344727, "global_step": 240677, "epoch": 2899} {"train_loss": -24.855283737182617, "global_step": 240678, "epoch": 2899} {"train_loss": -24.825918197631836, "global_step": 240679, "epoch": 2899} {"train_loss": -24.813344955444336, "global_step": 240680, "epoch": 2899} {"train_loss": -24.98154067993164, "global_step": 240681, "epoch": 2899} {"train_loss": -25.19306182861328, "global_step": 240682, "epoch": 2899} {"train_loss": -25.263105392456055, "global_step": 240683, "epoch": 2899} {"train_loss": -25.10176658630371, "global_step": 240684, "epoch": 2899} {"train_loss": -24.642765045166016, "global_step": 240685, "epoch": 2899} {"train_loss": -25.22260856628418, "global_step": 240686, "epoch": 2899} {"train_loss": -24.88047981262207, "global_step": 240687, "epoch": 2899} {"train_loss": -25.0113525390625, "global_step": 240688, "epoch": 2899} {"train_loss": -25.065067291259766, "global_step": 240689, "epoch": 2899} {"train_loss": -24.85818862915039, "global_step": 240690, "epoch": 2899} {"train_loss": -24.31604766845703, "global_step": 240691, "epoch": 2899} {"train_loss": -24.94148063659668, "global_step": 240692, "epoch": 2899} {"train_loss": -25.034648895263672, "global_step": 240693, "epoch": 2899} {"train_loss": -24.669902801513672, "global_step": 240694, "epoch": 2899} {"train_loss": -25.111309051513672, "global_step": 240695, "epoch": 2899} {"train_loss": -24.873971939086914, "global_step": 240696, "epoch": 2899} {"train_loss": -25.078739166259766, "global_step": 240697, "epoch": 2899} {"train_loss": -24.699235916137695, "global_step": 240698, "epoch": 2899} {"train_loss": -24.740292514663146, "global_step": 240699, "epoch": 2899, "val_loss": 6849000.5} {"train_loss": -24.577322006225586, "global_step": 240700, "epoch": 2900} {"train_loss": -24.585355758666992, "global_step": 240701, "epoch": 2900} {"train_loss": -24.86481285095215, "global_step": 240702, "epoch": 2900} {"train_loss": -24.883289337158203, "global_step": 240703, "epoch": 2900} {"train_loss": -25.121545791625977, "global_step": 240704, "epoch": 2900} {"train_loss": -24.787179946899414, "global_step": 240705, "epoch": 2900} {"train_loss": -25.0347843170166, "global_step": 240706, "epoch": 2900} {"train_loss": -25.09197998046875, "global_step": 240707, "epoch": 2900} {"train_loss": -24.447330474853516, "global_step": 240708, "epoch": 2900} {"train_loss": -24.388837814331055, "global_step": 240709, "epoch": 2900} {"train_loss": -24.57387924194336, "global_step": 240710, "epoch": 2900} {"train_loss": -25.05165672302246, "global_step": 240711, "epoch": 2900} {"train_loss": -24.903715133666992, "global_step": 240712, "epoch": 2900} {"train_loss": -24.581531524658203, "global_step": 240713, "epoch": 2900} {"train_loss": -24.904659271240234, "global_step": 240714, "epoch": 2900} {"train_loss": -24.832687377929688, "global_step": 240715, "epoch": 2900} {"train_loss": -24.703596115112305, "global_step": 240716, "epoch": 2900} {"train_loss": -24.842388153076172, "global_step": 240717, "epoch": 2900} {"train_loss": -25.086917877197266, "global_step": 240718, "epoch": 2900} {"train_loss": -24.698827743530273, "global_step": 240719, "epoch": 2900} {"train_loss": -24.909826278686523, "global_step": 240720, "epoch": 2900} {"train_loss": -24.973176956176758, "global_step": 240721, "epoch": 2900} {"train_loss": -24.629405975341797, "global_step": 240722, "epoch": 2900} {"train_loss": -25.03278160095215, "global_step": 240723, "epoch": 2900} {"train_loss": -24.79930877685547, "global_step": 240724, "epoch": 2900} {"train_loss": -25.055105209350586, "global_step": 240725, "epoch": 2900} {"train_loss": -25.164173126220703, "global_step": 240726, "epoch": 2900} {"train_loss": -25.291975021362305, "global_step": 240727, "epoch": 2900} {"train_loss": -25.07396125793457, "global_step": 240728, "epoch": 2900} {"train_loss": -25.137968063354492, "global_step": 240729, "epoch": 2900} {"train_loss": -24.896203994750977, "global_step": 240730, "epoch": 2900} {"train_loss": -24.96078109741211, "global_step": 240731, "epoch": 2900} {"train_loss": -24.711572647094727, "global_step": 240732, "epoch": 2900} {"train_loss": -24.708539962768555, "global_step": 240733, "epoch": 2900} {"train_loss": -24.740615844726562, "global_step": 240734, "epoch": 2900} {"train_loss": -24.993799209594727, "global_step": 240735, "epoch": 2900} {"train_loss": -24.934823989868164, "global_step": 240736, "epoch": 2900} {"train_loss": -25.268747329711914, "global_step": 240737, "epoch": 2900} {"train_loss": -24.767614364624023, "global_step": 240738, "epoch": 2900} {"train_loss": -24.787622451782227, "global_step": 240739, "epoch": 2900} {"train_loss": -24.936128616333008, "global_step": 240740, "epoch": 2900} {"train_loss": -25.428159713745117, "global_step": 240741, "epoch": 2900} {"train_loss": -25.040491104125977, "global_step": 240742, "epoch": 2900} {"train_loss": -24.570022583007812, "global_step": 240743, "epoch": 2900} {"train_loss": -25.061182022094727, "global_step": 240744, "epoch": 2900} {"train_loss": -24.823026657104492, "global_step": 240745, "epoch": 2900} {"train_loss": -24.773813247680664, "global_step": 240746, "epoch": 2900} {"train_loss": -25.06332778930664, "global_step": 240747, "epoch": 2900} {"train_loss": -25.15842056274414, "global_step": 240748, "epoch": 2900} {"train_loss": -25.095556259155273, "global_step": 240749, "epoch": 2900} {"train_loss": -24.647336959838867, "global_step": 240750, "epoch": 2900} {"train_loss": -25.079368591308594, "global_step": 240751, "epoch": 2900} {"train_loss": -24.686843872070312, "global_step": 240752, "epoch": 2900} {"train_loss": -24.409631729125977, "global_step": 240753, "epoch": 2900} {"train_loss": -25.146121978759766, "global_step": 240754, "epoch": 2900} {"train_loss": -24.79440689086914, "global_step": 240755, "epoch": 2900} {"train_loss": -24.509510040283203, "global_step": 240756, "epoch": 2900} {"train_loss": -24.849075317382812, "global_step": 240757, "epoch": 2900} {"train_loss": -24.569900512695312, "global_step": 240758, "epoch": 2900} {"train_loss": -24.784780502319336, "global_step": 240759, "epoch": 2900} {"train_loss": -24.44942283630371, "global_step": 240760, "epoch": 2900} {"train_loss": -24.328678131103516, "global_step": 240761, "epoch": 2900} {"train_loss": -24.423246383666992, "global_step": 240762, "epoch": 2900} {"train_loss": -24.680301666259766, "global_step": 240763, "epoch": 2900} {"train_loss": -25.020231246948242, "global_step": 240764, "epoch": 2900} {"train_loss": -24.507518768310547, "global_step": 240765, "epoch": 2900} {"train_loss": -24.598630905151367, "global_step": 240766, "epoch": 2900} {"train_loss": -24.49849510192871, "global_step": 240767, "epoch": 2900} {"train_loss": -24.675268173217773, "global_step": 240768, "epoch": 2900} {"train_loss": -24.765399932861328, "global_step": 240769, "epoch": 2900} {"train_loss": -24.83562660217285, "global_step": 240770, "epoch": 2900} {"train_loss": -24.82476806640625, "global_step": 240771, "epoch": 2900} {"train_loss": -24.92880630493164, "global_step": 240772, "epoch": 2900} {"train_loss": -25.052440643310547, "global_step": 240773, "epoch": 2900} {"train_loss": -25.357213973999023, "global_step": 240774, "epoch": 2900} {"train_loss": -24.826133728027344, "global_step": 240775, "epoch": 2900} {"train_loss": -24.728185653686523, "global_step": 240776, "epoch": 2900} {"train_loss": -24.624832153320312, "global_step": 240777, "epoch": 2900} {"train_loss": -24.851272583007812, "global_step": 240778, "epoch": 2900} {"train_loss": -24.78968620300293, "global_step": 240779, "epoch": 2900} {"train_loss": -24.807010650634766, "global_step": 240780, "epoch": 2900} {"train_loss": -25.066030502319336, "global_step": 240781, "epoch": 2900} {"train_loss": -24.85260972631983, "global_step": 240782, "epoch": 2900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6797423.0} {"train_loss": -23.839183807373047, "global_step": 240783, "epoch": 2901} {"train_loss": -22.826696395874023, "global_step": 240784, "epoch": 2901} {"train_loss": -24.279102325439453, "global_step": 240785, "epoch": 2901} {"train_loss": -23.721059799194336, "global_step": 240786, "epoch": 2901} {"train_loss": -23.953886032104492, "global_step": 240787, "epoch": 2901} {"train_loss": -24.16896629333496, "global_step": 240788, "epoch": 2901} {"train_loss": -24.179182052612305, "global_step": 240789, "epoch": 2901} {"train_loss": -24.468955993652344, "global_step": 240790, "epoch": 2901} {"train_loss": -24.684091567993164, "global_step": 240791, "epoch": 2901} {"train_loss": -24.337434768676758, "global_step": 240792, "epoch": 2901} {"train_loss": -24.337316513061523, "global_step": 240793, "epoch": 2901} {"train_loss": -24.744720458984375, "global_step": 240794, "epoch": 2901} {"train_loss": -24.574193954467773, "global_step": 240795, "epoch": 2901} {"train_loss": -24.615737915039062, "global_step": 240796, "epoch": 2901} {"train_loss": -24.330184936523438, "global_step": 240797, "epoch": 2901} {"train_loss": -24.5792179107666, "global_step": 240798, "epoch": 2901} {"train_loss": -24.83806800842285, "global_step": 240799, "epoch": 2901} {"train_loss": -24.236276626586914, "global_step": 240800, "epoch": 2901} {"train_loss": -24.945194244384766, "global_step": 240801, "epoch": 2901} {"train_loss": -24.614826202392578, "global_step": 240802, "epoch": 2901} {"train_loss": -24.72443199157715, "global_step": 240803, "epoch": 2901} {"train_loss": -24.42821502685547, "global_step": 240804, "epoch": 2901} {"train_loss": -24.87944984436035, "global_step": 240805, "epoch": 2901} {"train_loss": -25.014503479003906, "global_step": 240806, "epoch": 2901} {"train_loss": -24.85187339782715, "global_step": 240807, "epoch": 2901} {"train_loss": -25.050106048583984, "global_step": 240808, "epoch": 2901} {"train_loss": -24.54024314880371, "global_step": 240809, "epoch": 2901} {"train_loss": -24.83235740661621, "global_step": 240810, "epoch": 2901} {"train_loss": -24.724206924438477, "global_step": 240811, "epoch": 2901} {"train_loss": -24.734716415405273, "global_step": 240812, "epoch": 2901} {"train_loss": -24.60401725769043, "global_step": 240813, "epoch": 2901} {"train_loss": -25.01740074157715, "global_step": 240814, "epoch": 2901} {"train_loss": -24.850065231323242, "global_step": 240815, "epoch": 2901} {"train_loss": -24.636280059814453, "global_step": 240816, "epoch": 2901} {"train_loss": -25.02903938293457, "global_step": 240817, "epoch": 2901} {"train_loss": -24.556974411010742, "global_step": 240818, "epoch": 2901} {"train_loss": -24.559743881225586, "global_step": 240819, "epoch": 2901} {"train_loss": -24.725868225097656, "global_step": 240820, "epoch": 2901} {"train_loss": -24.765422821044922, "global_step": 240821, "epoch": 2901} {"train_loss": -25.241167068481445, "global_step": 240822, "epoch": 2901} {"train_loss": -25.402708053588867, "global_step": 240823, "epoch": 2901} {"train_loss": -24.95316505432129, "global_step": 240824, "epoch": 2901} {"train_loss": -24.875009536743164, "global_step": 240825, "epoch": 2901} {"train_loss": -24.553091049194336, "global_step": 240826, "epoch": 2901} {"train_loss": -23.682775497436523, "global_step": 240827, "epoch": 2901} {"train_loss": -24.091550827026367, "global_step": 240828, "epoch": 2901} {"train_loss": -24.46561050415039, "global_step": 240829, "epoch": 2901} {"train_loss": -24.738222122192383, "global_step": 240830, "epoch": 2901} {"train_loss": -24.603515625, "global_step": 240831, "epoch": 2901} {"train_loss": -25.09512710571289, "global_step": 240832, "epoch": 2901} {"train_loss": -24.98492431640625, "global_step": 240833, "epoch": 2901} {"train_loss": -24.882661819458008, "global_step": 240834, "epoch": 2901} {"train_loss": -25.057601928710938, "global_step": 240835, "epoch": 2901} {"train_loss": -25.106374740600586, "global_step": 240836, "epoch": 2901} {"train_loss": -24.798099517822266, "global_step": 240837, "epoch": 2901} {"train_loss": -25.075490951538086, "global_step": 240838, "epoch": 2901} {"train_loss": -24.87234115600586, "global_step": 240839, "epoch": 2901} {"train_loss": -25.39924430847168, "global_step": 240840, "epoch": 2901} {"train_loss": -24.387731552124023, "global_step": 240841, "epoch": 2901} {"train_loss": -24.516218185424805, "global_step": 240842, "epoch": 2901} {"train_loss": -24.82655906677246, "global_step": 240843, "epoch": 2901} {"train_loss": -24.784128189086914, "global_step": 240844, "epoch": 2901} {"train_loss": -24.99853515625, "global_step": 240845, "epoch": 2901} {"train_loss": -24.55120849609375, "global_step": 240846, "epoch": 2901} {"train_loss": -25.03441047668457, "global_step": 240847, "epoch": 2901} {"train_loss": -24.999267578125, "global_step": 240848, "epoch": 2901} {"train_loss": -24.878820419311523, "global_step": 240849, "epoch": 2901} {"train_loss": -25.079687118530273, "global_step": 240850, "epoch": 2901} {"train_loss": -24.9487361907959, "global_step": 240851, "epoch": 2901} {"train_loss": -25.073667526245117, "global_step": 240852, "epoch": 2901} {"train_loss": -24.968740463256836, "global_step": 240853, "epoch": 2901} {"train_loss": -25.0615177154541, "global_step": 240854, "epoch": 2901} {"train_loss": -24.87428092956543, "global_step": 240855, "epoch": 2901} {"train_loss": -25.311094284057617, "global_step": 240856, "epoch": 2901} {"train_loss": -24.6812686920166, "global_step": 240857, "epoch": 2901} {"train_loss": -24.7243709564209, "global_step": 240858, "epoch": 2901} {"train_loss": -24.80575942993164, "global_step": 240859, "epoch": 2901} {"train_loss": -24.935226440429688, "global_step": 240860, "epoch": 2901} {"train_loss": -24.756162643432617, "global_step": 240861, "epoch": 2901} {"train_loss": -25.58966827392578, "global_step": 240862, "epoch": 2901} {"train_loss": -25.06538200378418, "global_step": 240863, "epoch": 2901} {"train_loss": -24.678298950195312, "global_step": 240864, "epoch": 2901} {"train_loss": -24.7064157279141, "global_step": 240865, "epoch": 2901, "val_loss": 6868736.0} {"train_loss": -24.414306640625, "global_step": 240866, "epoch": 2902} {"train_loss": -24.647056579589844, "global_step": 240867, "epoch": 2902} {"train_loss": -24.40241241455078, "global_step": 240868, "epoch": 2902} {"train_loss": -24.76460075378418, "global_step": 240869, "epoch": 2902} {"train_loss": -24.832366943359375, "global_step": 240870, "epoch": 2902} {"train_loss": -24.612314224243164, "global_step": 240871, "epoch": 2902} {"train_loss": -24.35531997680664, "global_step": 240872, "epoch": 2902} {"train_loss": -24.700254440307617, "global_step": 240873, "epoch": 2902} {"train_loss": -25.19495964050293, "global_step": 240874, "epoch": 2902} {"train_loss": -24.882436752319336, "global_step": 240875, "epoch": 2902} {"train_loss": -24.40896224975586, "global_step": 240876, "epoch": 2902} {"train_loss": -24.728063583374023, "global_step": 240877, "epoch": 2902} {"train_loss": -24.75459098815918, "global_step": 240878, "epoch": 2902} {"train_loss": -24.57850456237793, "global_step": 240879, "epoch": 2902} {"train_loss": -24.996335983276367, "global_step": 240880, "epoch": 2902} {"train_loss": -24.817842483520508, "global_step": 240881, "epoch": 2902} {"train_loss": -24.407690048217773, "global_step": 240882, "epoch": 2902} {"train_loss": -24.838354110717773, "global_step": 240883, "epoch": 2902} {"train_loss": -24.939727783203125, "global_step": 240884, "epoch": 2902} {"train_loss": -25.35149383544922, "global_step": 240885, "epoch": 2902} {"train_loss": -25.172460556030273, "global_step": 240886, "epoch": 2902} {"train_loss": -25.131803512573242, "global_step": 240887, "epoch": 2902} {"train_loss": -24.932302474975586, "global_step": 240888, "epoch": 2902} {"train_loss": -24.9757080078125, "global_step": 240889, "epoch": 2902} {"train_loss": -25.14191436767578, "global_step": 240890, "epoch": 2902} {"train_loss": -25.218542098999023, "global_step": 240891, "epoch": 2902} {"train_loss": -25.187265396118164, "global_step": 240892, "epoch": 2902} {"train_loss": -25.200584411621094, "global_step": 240893, "epoch": 2902} {"train_loss": -24.85691261291504, "global_step": 240894, "epoch": 2902} {"train_loss": -24.86103630065918, "global_step": 240895, "epoch": 2902} {"train_loss": -25.056772232055664, "global_step": 240896, "epoch": 2902} {"train_loss": -25.034109115600586, "global_step": 240897, "epoch": 2902} {"train_loss": -25.106250762939453, "global_step": 240898, "epoch": 2902} {"train_loss": -24.906295776367188, "global_step": 240899, "epoch": 2902} {"train_loss": -25.167612075805664, "global_step": 240900, "epoch": 2902} {"train_loss": -25.214588165283203, "global_step": 240901, "epoch": 2902} {"train_loss": -24.914886474609375, "global_step": 240902, "epoch": 2902} {"train_loss": -25.007164001464844, "global_step": 240903, "epoch": 2902} {"train_loss": -24.818513870239258, "global_step": 240904, "epoch": 2902} {"train_loss": -25.271203994750977, "global_step": 240905, "epoch": 2902} {"train_loss": -25.139020919799805, "global_step": 240906, "epoch": 2902} {"train_loss": -25.050418853759766, "global_step": 240907, "epoch": 2902} {"train_loss": -24.881643295288086, "global_step": 240908, "epoch": 2902} {"train_loss": -25.104764938354492, "global_step": 240909, "epoch": 2902} {"train_loss": -24.994028091430664, "global_step": 240910, "epoch": 2902} {"train_loss": -25.11551856994629, "global_step": 240911, "epoch": 2902} {"train_loss": -25.120975494384766, "global_step": 240912, "epoch": 2902} {"train_loss": -24.86041831970215, "global_step": 240913, "epoch": 2902} {"train_loss": -24.96783447265625, "global_step": 240914, "epoch": 2902} {"train_loss": -25.192148208618164, "global_step": 240915, "epoch": 2902} {"train_loss": -25.247325897216797, "global_step": 240916, "epoch": 2902} {"train_loss": -25.060657501220703, "global_step": 240917, "epoch": 2902} {"train_loss": -24.90458106994629, "global_step": 240918, "epoch": 2902} {"train_loss": -25.000228881835938, "global_step": 240919, "epoch": 2902} {"train_loss": -24.85302734375, "global_step": 240920, "epoch": 2902} {"train_loss": -25.01722526550293, "global_step": 240921, "epoch": 2902} {"train_loss": -24.418224334716797, "global_step": 240922, "epoch": 2902} {"train_loss": -24.09160804748535, "global_step": 240923, "epoch": 2902} {"train_loss": -24.31976890563965, "global_step": 240924, "epoch": 2902} {"train_loss": -24.712249755859375, "global_step": 240925, "epoch": 2902} {"train_loss": -24.62031364440918, "global_step": 240926, "epoch": 2902} {"train_loss": -24.488306045532227, "global_step": 240927, "epoch": 2902} {"train_loss": -24.080244064331055, "global_step": 240928, "epoch": 2902} {"train_loss": -24.545944213867188, "global_step": 240929, "epoch": 2902} {"train_loss": -24.5682373046875, "global_step": 240930, "epoch": 2902} {"train_loss": -24.92034912109375, "global_step": 240931, "epoch": 2902} {"train_loss": -24.487485885620117, "global_step": 240932, "epoch": 2902} {"train_loss": -24.744897842407227, "global_step": 240933, "epoch": 2902} {"train_loss": -24.967695236206055, "global_step": 240934, "epoch": 2902} {"train_loss": -24.407276153564453, "global_step": 240935, "epoch": 2902} {"train_loss": -24.72462272644043, "global_step": 240936, "epoch": 2902} {"train_loss": -24.758710861206055, "global_step": 240937, "epoch": 2902} {"train_loss": -24.708881378173828, "global_step": 240938, "epoch": 2902} {"train_loss": -24.923263549804688, "global_step": 240939, "epoch": 2902} {"train_loss": -24.745197296142578, "global_step": 240940, "epoch": 2902} {"train_loss": -24.806699752807617, "global_step": 240941, "epoch": 2902} {"train_loss": -24.689611434936523, "global_step": 240942, "epoch": 2902} {"train_loss": -24.698713302612305, "global_step": 240943, "epoch": 2902} {"train_loss": -25.0311279296875, "global_step": 240944, "epoch": 2902} {"train_loss": -24.800050735473633, "global_step": 240945, "epoch": 2902} {"train_loss": -25.028223037719727, "global_step": 240946, "epoch": 2902} {"train_loss": -24.915502548217773, "global_step": 240947, "epoch": 2902} {"train_loss": -24.835385701742517, "global_step": 240948, "epoch": 2902, "val_loss": 6787688.5} {"train_loss": -24.79437828063965, "global_step": 240949, "epoch": 2903} {"train_loss": -25.286903381347656, "global_step": 240950, "epoch": 2903} {"train_loss": -24.430173873901367, "global_step": 240951, "epoch": 2903} {"train_loss": -24.657629013061523, "global_step": 240952, "epoch": 2903} {"train_loss": -24.588998794555664, "global_step": 240953, "epoch": 2903} {"train_loss": -24.909406661987305, "global_step": 240954, "epoch": 2903} {"train_loss": -25.2602596282959, "global_step": 240955, "epoch": 2903} {"train_loss": -24.698057174682617, "global_step": 240956, "epoch": 2903} {"train_loss": -24.807361602783203, "global_step": 240957, "epoch": 2903} {"train_loss": -24.9890079498291, "global_step": 240958, "epoch": 2903} {"train_loss": -24.50160789489746, "global_step": 240959, "epoch": 2903} {"train_loss": -24.966394424438477, "global_step": 240960, "epoch": 2903} {"train_loss": -24.860525131225586, "global_step": 240961, "epoch": 2903} {"train_loss": -24.436447143554688, "global_step": 240962, "epoch": 2903} {"train_loss": -24.466171264648438, "global_step": 240963, "epoch": 2903} {"train_loss": -24.71021842956543, "global_step": 240964, "epoch": 2903} {"train_loss": -25.415115356445312, "global_step": 240965, "epoch": 2903} {"train_loss": -24.785154342651367, "global_step": 240966, "epoch": 2903} {"train_loss": -24.824052810668945, "global_step": 240967, "epoch": 2903} {"train_loss": -24.44123077392578, "global_step": 240968, "epoch": 2903} {"train_loss": -25.04825782775879, "global_step": 240969, "epoch": 2903} {"train_loss": -24.866296768188477, "global_step": 240970, "epoch": 2903} {"train_loss": -24.95643424987793, "global_step": 240971, "epoch": 2903} {"train_loss": -24.68149757385254, "global_step": 240972, "epoch": 2903} {"train_loss": -24.78995132446289, "global_step": 240973, "epoch": 2903} {"train_loss": -24.6727294921875, "global_step": 240974, "epoch": 2903} {"train_loss": -24.948627471923828, "global_step": 240975, "epoch": 2903} {"train_loss": -24.741806030273438, "global_step": 240976, "epoch": 2903} {"train_loss": -24.99660873413086, "global_step": 240977, "epoch": 2903} {"train_loss": -24.6932430267334, "global_step": 240978, "epoch": 2903} {"train_loss": -24.690000534057617, "global_step": 240979, "epoch": 2903} {"train_loss": -24.981609344482422, "global_step": 240980, "epoch": 2903} {"train_loss": -24.755895614624023, "global_step": 240981, "epoch": 2903} {"train_loss": -24.855262756347656, "global_step": 240982, "epoch": 2903} {"train_loss": -25.051971435546875, "global_step": 240983, "epoch": 2903} {"train_loss": -24.959726333618164, "global_step": 240984, "epoch": 2903} {"train_loss": -25.24298858642578, "global_step": 240985, "epoch": 2903} {"train_loss": -24.672182083129883, "global_step": 240986, "epoch": 2903} {"train_loss": -24.98016929626465, "global_step": 240987, "epoch": 2903} {"train_loss": -24.837387084960938, "global_step": 240988, "epoch": 2903} {"train_loss": -24.564672470092773, "global_step": 240989, "epoch": 2903} {"train_loss": -24.948949813842773, "global_step": 240990, "epoch": 2903} {"train_loss": -25.17934226989746, "global_step": 240991, "epoch": 2903} {"train_loss": -24.974349975585938, "global_step": 240992, "epoch": 2903} {"train_loss": -24.86728858947754, "global_step": 240993, "epoch": 2903} {"train_loss": -24.939666748046875, "global_step": 240994, "epoch": 2903} {"train_loss": -24.69596290588379, "global_step": 240995, "epoch": 2903} {"train_loss": -24.83748435974121, "global_step": 240996, "epoch": 2903} {"train_loss": -24.814878463745117, "global_step": 240997, "epoch": 2903} {"train_loss": -24.602588653564453, "global_step": 240998, "epoch": 2903} {"train_loss": -24.904037475585938, "global_step": 240999, "epoch": 2903} {"train_loss": -25.001096725463867, "global_step": 241000, "epoch": 2903} {"train_loss": -24.990924835205078, "global_step": 241001, "epoch": 2903} {"train_loss": -24.74700164794922, "global_step": 241002, "epoch": 2903} {"train_loss": -25.117429733276367, "global_step": 241003, "epoch": 2903} {"train_loss": -24.771469116210938, "global_step": 241004, "epoch": 2903} {"train_loss": -25.047468185424805, "global_step": 241005, "epoch": 2903} {"train_loss": -25.141767501831055, "global_step": 241006, "epoch": 2903} {"train_loss": -25.250259399414062, "global_step": 241007, "epoch": 2903} {"train_loss": -24.89103126525879, "global_step": 241008, "epoch": 2903} {"train_loss": -24.95106315612793, "global_step": 241009, "epoch": 2903} {"train_loss": -24.496185302734375, "global_step": 241010, "epoch": 2903} {"train_loss": -25.338397979736328, "global_step": 241011, "epoch": 2903} {"train_loss": -24.889455795288086, "global_step": 241012, "epoch": 2903} {"train_loss": -25.246557235717773, "global_step": 241013, "epoch": 2903} {"train_loss": -25.070526123046875, "global_step": 241014, "epoch": 2903} {"train_loss": -24.95503807067871, "global_step": 241015, "epoch": 2903} {"train_loss": -25.021480560302734, "global_step": 241016, "epoch": 2903} {"train_loss": -25.32022476196289, "global_step": 241017, "epoch": 2903} {"train_loss": -25.21892738342285, "global_step": 241018, "epoch": 2903} {"train_loss": -24.525693893432617, "global_step": 241019, "epoch": 2903} {"train_loss": -24.335773468017578, "global_step": 241020, "epoch": 2903} {"train_loss": -24.750490188598633, "global_step": 241021, "epoch": 2903} {"train_loss": -24.891420364379883, "global_step": 241022, "epoch": 2903} {"train_loss": -24.777833938598633, "global_step": 241023, "epoch": 2903} {"train_loss": -24.921674728393555, "global_step": 241024, "epoch": 2903} {"train_loss": -24.80473518371582, "global_step": 241025, "epoch": 2903} {"train_loss": -25.063322067260742, "global_step": 241026, "epoch": 2903} {"train_loss": -24.89691734313965, "global_step": 241027, "epoch": 2903} {"train_loss": -25.0629940032959, "global_step": 241028, "epoch": 2903} {"train_loss": -24.85172462463379, "global_step": 241029, "epoch": 2903} {"train_loss": -24.969497680664062, "global_step": 241030, "epoch": 2903} {"train_loss": -24.872412922870684, "global_step": 241031, "epoch": 2903, "val_loss": 6872323.0} {"train_loss": -25.048986434936523, "global_step": 241032, "epoch": 2904} {"train_loss": -24.54469871520996, "global_step": 241033, "epoch": 2904} {"train_loss": -24.340805053710938, "global_step": 241034, "epoch": 2904} {"train_loss": -24.404651641845703, "global_step": 241035, "epoch": 2904} {"train_loss": -24.682218551635742, "global_step": 241036, "epoch": 2904} {"train_loss": -24.308874130249023, "global_step": 241037, "epoch": 2904} {"train_loss": -24.542795181274414, "global_step": 241038, "epoch": 2904} {"train_loss": -24.43570327758789, "global_step": 241039, "epoch": 2904} {"train_loss": -24.760726928710938, "global_step": 241040, "epoch": 2904} {"train_loss": -24.539833068847656, "global_step": 241041, "epoch": 2904} {"train_loss": -24.542150497436523, "global_step": 241042, "epoch": 2904} {"train_loss": -24.906280517578125, "global_step": 241043, "epoch": 2904} {"train_loss": -24.560348510742188, "global_step": 241044, "epoch": 2904} {"train_loss": -25.156736373901367, "global_step": 241045, "epoch": 2904} {"train_loss": -24.327062606811523, "global_step": 241046, "epoch": 2904} {"train_loss": -24.558189392089844, "global_step": 241047, "epoch": 2904} {"train_loss": -25.122535705566406, "global_step": 241048, "epoch": 2904} {"train_loss": -24.83484649658203, "global_step": 241049, "epoch": 2904} {"train_loss": -24.573455810546875, "global_step": 241050, "epoch": 2904} {"train_loss": -24.630321502685547, "global_step": 241051, "epoch": 2904} {"train_loss": -24.638532638549805, "global_step": 241052, "epoch": 2904} {"train_loss": -24.87361717224121, "global_step": 241053, "epoch": 2904} {"train_loss": -24.686887741088867, "global_step": 241054, "epoch": 2904} {"train_loss": -24.661531448364258, "global_step": 241055, "epoch": 2904} {"train_loss": -24.88783073425293, "global_step": 241056, "epoch": 2904} {"train_loss": -24.610647201538086, "global_step": 241057, "epoch": 2904} {"train_loss": -24.932100296020508, "global_step": 241058, "epoch": 2904} {"train_loss": -25.09394645690918, "global_step": 241059, "epoch": 2904} {"train_loss": -25.356027603149414, "global_step": 241060, "epoch": 2904} {"train_loss": -25.105318069458008, "global_step": 241061, "epoch": 2904} {"train_loss": -25.078466415405273, "global_step": 241062, "epoch": 2904} {"train_loss": -24.542539596557617, "global_step": 241063, "epoch": 2904} {"train_loss": -24.659265518188477, "global_step": 241064, "epoch": 2904} {"train_loss": -25.189498901367188, "global_step": 241065, "epoch": 2904} {"train_loss": -24.913394927978516, "global_step": 241066, "epoch": 2904} {"train_loss": -24.762887954711914, "global_step": 241067, "epoch": 2904} {"train_loss": -25.16360855102539, "global_step": 241068, "epoch": 2904} {"train_loss": -25.00360870361328, "global_step": 241069, "epoch": 2904} {"train_loss": -24.6292667388916, "global_step": 241070, "epoch": 2904} {"train_loss": -25.097537994384766, "global_step": 241071, "epoch": 2904} {"train_loss": -25.195438385009766, "global_step": 241072, "epoch": 2904} {"train_loss": -25.126731872558594, "global_step": 241073, "epoch": 2904} {"train_loss": -24.993274688720703, "global_step": 241074, "epoch": 2904} {"train_loss": -25.372657775878906, "global_step": 241075, "epoch": 2904} {"train_loss": -24.707250595092773, "global_step": 241076, "epoch": 2904} {"train_loss": -24.69330406188965, "global_step": 241077, "epoch": 2904} {"train_loss": -25.261119842529297, "global_step": 241078, "epoch": 2904} {"train_loss": -25.500656127929688, "global_step": 241079, "epoch": 2904} {"train_loss": -24.738544464111328, "global_step": 241080, "epoch": 2904} {"train_loss": -24.56134605407715, "global_step": 241081, "epoch": 2904} {"train_loss": -24.975860595703125, "global_step": 241082, "epoch": 2904} {"train_loss": -25.037900924682617, "global_step": 241083, "epoch": 2904} {"train_loss": -24.569074630737305, "global_step": 241084, "epoch": 2904} {"train_loss": -24.12013053894043, "global_step": 241085, "epoch": 2904} {"train_loss": -24.790014266967773, "global_step": 241086, "epoch": 2904} {"train_loss": -24.198049545288086, "global_step": 241087, "epoch": 2904} {"train_loss": -25.13545036315918, "global_step": 241088, "epoch": 2904} {"train_loss": -24.71050453186035, "global_step": 241089, "epoch": 2904} {"train_loss": -25.04654884338379, "global_step": 241090, "epoch": 2904} {"train_loss": -24.907079696655273, "global_step": 241091, "epoch": 2904} {"train_loss": -24.744892120361328, "global_step": 241092, "epoch": 2904} {"train_loss": -24.999271392822266, "global_step": 241093, "epoch": 2904} {"train_loss": -25.027618408203125, "global_step": 241094, "epoch": 2904} {"train_loss": -24.956098556518555, "global_step": 241095, "epoch": 2904} {"train_loss": -24.690603256225586, "global_step": 241096, "epoch": 2904} {"train_loss": -24.243934631347656, "global_step": 241097, "epoch": 2904} {"train_loss": -24.654130935668945, "global_step": 241098, "epoch": 2904} {"train_loss": -24.826902389526367, "global_step": 241099, "epoch": 2904} {"train_loss": -25.134702682495117, "global_step": 241100, "epoch": 2904} {"train_loss": -25.047330856323242, "global_step": 241101, "epoch": 2904} {"train_loss": -24.64032554626465, "global_step": 241102, "epoch": 2904} {"train_loss": -25.138004302978516, "global_step": 241103, "epoch": 2904} {"train_loss": -24.916336059570312, "global_step": 241104, "epoch": 2904} {"train_loss": -25.10896873474121, "global_step": 241105, "epoch": 2904} {"train_loss": -24.83961296081543, "global_step": 241106, "epoch": 2904} {"train_loss": -24.96756935119629, "global_step": 241107, "epoch": 2904} {"train_loss": -24.9367618560791, "global_step": 241108, "epoch": 2904} {"train_loss": -24.83746910095215, "global_step": 241109, "epoch": 2904} {"train_loss": -24.93977165222168, "global_step": 241110, "epoch": 2904} {"train_loss": -25.05697250366211, "global_step": 241111, "epoch": 2904} {"train_loss": -24.83584976196289, "global_step": 241112, "epoch": 2904} {"train_loss": -24.983009338378906, "global_step": 241113, "epoch": 2904} {"train_loss": -24.83225126151579, "global_step": 241114, "epoch": 2904, "val_loss": 6821592.0} {"train_loss": -24.421812057495117, "global_step": 241115, "epoch": 2905} {"train_loss": -24.64839744567871, "global_step": 241116, "epoch": 2905} {"train_loss": -24.483861923217773, "global_step": 241117, "epoch": 2905} {"train_loss": -24.541868209838867, "global_step": 241118, "epoch": 2905} {"train_loss": -24.661823272705078, "global_step": 241119, "epoch": 2905} {"train_loss": -24.95404624938965, "global_step": 241120, "epoch": 2905} {"train_loss": -24.534255981445312, "global_step": 241121, "epoch": 2905} {"train_loss": -24.461835861206055, "global_step": 241122, "epoch": 2905} {"train_loss": -24.69305992126465, "global_step": 241123, "epoch": 2905} {"train_loss": -24.85060691833496, "global_step": 241124, "epoch": 2905} {"train_loss": -24.696226119995117, "global_step": 241125, "epoch": 2905} {"train_loss": -24.482389450073242, "global_step": 241126, "epoch": 2905} {"train_loss": -24.878679275512695, "global_step": 241127, "epoch": 2905} {"train_loss": -24.68644142150879, "global_step": 241128, "epoch": 2905} {"train_loss": -24.995725631713867, "global_step": 241129, "epoch": 2905} {"train_loss": -24.752164840698242, "global_step": 241130, "epoch": 2905} {"train_loss": -24.389265060424805, "global_step": 241131, "epoch": 2905} {"train_loss": -24.788522720336914, "global_step": 241132, "epoch": 2905} {"train_loss": -24.7325439453125, "global_step": 241133, "epoch": 2905} {"train_loss": -24.962730407714844, "global_step": 241134, "epoch": 2905} {"train_loss": -25.1381893157959, "global_step": 241135, "epoch": 2905} {"train_loss": -25.055130004882812, "global_step": 241136, "epoch": 2905} {"train_loss": -24.940366744995117, "global_step": 241137, "epoch": 2905} {"train_loss": -25.05982780456543, "global_step": 241138, "epoch": 2905} {"train_loss": -24.985618591308594, "global_step": 241139, "epoch": 2905} {"train_loss": -25.26266860961914, "global_step": 241140, "epoch": 2905} {"train_loss": -24.97968864440918, "global_step": 241141, "epoch": 2905} {"train_loss": -25.212797164916992, "global_step": 241142, "epoch": 2905} {"train_loss": -24.961669921875, "global_step": 241143, "epoch": 2905} {"train_loss": -25.128774642944336, "global_step": 241144, "epoch": 2905} {"train_loss": -25.002315521240234, "global_step": 241145, "epoch": 2905} {"train_loss": -24.93475341796875, "global_step": 241146, "epoch": 2905} {"train_loss": -24.82205581665039, "global_step": 241147, "epoch": 2905} {"train_loss": -24.807912826538086, "global_step": 241148, "epoch": 2905} {"train_loss": -24.9038143157959, "global_step": 241149, "epoch": 2905} {"train_loss": -24.898725509643555, "global_step": 241150, "epoch": 2905} {"train_loss": -24.7828311920166, "global_step": 241151, "epoch": 2905} {"train_loss": -24.717788696289062, "global_step": 241152, "epoch": 2905} {"train_loss": -25.063156127929688, "global_step": 241153, "epoch": 2905} {"train_loss": -24.690099716186523, "global_step": 241154, "epoch": 2905} {"train_loss": -25.107675552368164, "global_step": 241155, "epoch": 2905} {"train_loss": -25.104820251464844, "global_step": 241156, "epoch": 2905} {"train_loss": -25.00528335571289, "global_step": 241157, "epoch": 2905} {"train_loss": -24.872478485107422, "global_step": 241158, "epoch": 2905} {"train_loss": -24.96184730529785, "global_step": 241159, "epoch": 2905} {"train_loss": -24.917953491210938, "global_step": 241160, "epoch": 2905} {"train_loss": -24.872587203979492, "global_step": 241161, "epoch": 2905} {"train_loss": -25.07063102722168, "global_step": 241162, "epoch": 2905} {"train_loss": -24.814889907836914, "global_step": 241163, "epoch": 2905} {"train_loss": -24.804956436157227, "global_step": 241164, "epoch": 2905} {"train_loss": -24.93393898010254, "global_step": 241165, "epoch": 2905} {"train_loss": -24.96600914001465, "global_step": 241166, "epoch": 2905} {"train_loss": -24.955827713012695, "global_step": 241167, "epoch": 2905} {"train_loss": -24.77713966369629, "global_step": 241168, "epoch": 2905} {"train_loss": -25.052518844604492, "global_step": 241169, "epoch": 2905} {"train_loss": -24.91326332092285, "global_step": 241170, "epoch": 2905} {"train_loss": -25.218120574951172, "global_step": 241171, "epoch": 2905} {"train_loss": -24.912817001342773, "global_step": 241172, "epoch": 2905} {"train_loss": -25.116270065307617, "global_step": 241173, "epoch": 2905} {"train_loss": -24.56280517578125, "global_step": 241174, "epoch": 2905} {"train_loss": -25.133102416992188, "global_step": 241175, "epoch": 2905} {"train_loss": -24.973384857177734, "global_step": 241176, "epoch": 2905} {"train_loss": -24.870166778564453, "global_step": 241177, "epoch": 2905} {"train_loss": -24.49922752380371, "global_step": 241178, "epoch": 2905} {"train_loss": -25.15559959411621, "global_step": 241179, "epoch": 2905} {"train_loss": -24.85919952392578, "global_step": 241180, "epoch": 2905} {"train_loss": -25.056936264038086, "global_step": 241181, "epoch": 2905} {"train_loss": -25.177778244018555, "global_step": 241182, "epoch": 2905} {"train_loss": -24.899200439453125, "global_step": 241183, "epoch": 2905} {"train_loss": -24.779346466064453, "global_step": 241184, "epoch": 2905} {"train_loss": -24.842021942138672, "global_step": 241185, "epoch": 2905} {"train_loss": -24.957767486572266, "global_step": 241186, "epoch": 2905} {"train_loss": -24.830297470092773, "global_step": 241187, "epoch": 2905} {"train_loss": -24.87336540222168, "global_step": 241188, "epoch": 2905} {"train_loss": -25.18406867980957, "global_step": 241189, "epoch": 2905} {"train_loss": -24.719289779663086, "global_step": 241190, "epoch": 2905} {"train_loss": -25.087671279907227, "global_step": 241191, "epoch": 2905} {"train_loss": -25.00004005432129, "global_step": 241192, "epoch": 2905} {"train_loss": -24.733320236206055, "global_step": 241193, "epoch": 2905} {"train_loss": -24.920734405517578, "global_step": 241194, "epoch": 2905} {"train_loss": -25.15627098083496, "global_step": 241195, "epoch": 2905} {"train_loss": -24.624128341674805, "global_step": 241196, "epoch": 2905} {"train_loss": -24.87742663004312, "global_step": 241197, "epoch": 2905, "val_loss": 6839522.0} {"train_loss": -24.55484390258789, "global_step": 241198, "epoch": 2906} {"train_loss": -24.35700798034668, "global_step": 241199, "epoch": 2906} {"train_loss": -24.773757934570312, "global_step": 241200, "epoch": 2906} {"train_loss": -24.436996459960938, "global_step": 241201, "epoch": 2906} {"train_loss": -24.43818473815918, "global_step": 241202, "epoch": 2906} {"train_loss": -24.285037994384766, "global_step": 241203, "epoch": 2906} {"train_loss": -24.842927932739258, "global_step": 241204, "epoch": 2906} {"train_loss": -24.49286460876465, "global_step": 241205, "epoch": 2906} {"train_loss": -25.07493019104004, "global_step": 241206, "epoch": 2906} {"train_loss": -25.108749389648438, "global_step": 241207, "epoch": 2906} {"train_loss": -24.961286544799805, "global_step": 241208, "epoch": 2906} {"train_loss": -24.676897048950195, "global_step": 241209, "epoch": 2906} {"train_loss": -24.69338035583496, "global_step": 241210, "epoch": 2906} {"train_loss": -24.423070907592773, "global_step": 241211, "epoch": 2906} {"train_loss": -24.56060218811035, "global_step": 241212, "epoch": 2906} {"train_loss": -25.04631805419922, "global_step": 241213, "epoch": 2906} {"train_loss": -24.862091064453125, "global_step": 241214, "epoch": 2906} {"train_loss": -24.696287155151367, "global_step": 241215, "epoch": 2906} {"train_loss": -24.755903244018555, "global_step": 241216, "epoch": 2906} {"train_loss": -24.718503952026367, "global_step": 241217, "epoch": 2906} {"train_loss": -24.724262237548828, "global_step": 241218, "epoch": 2906} {"train_loss": -24.727888107299805, "global_step": 241219, "epoch": 2906} {"train_loss": -25.20332908630371, "global_step": 241220, "epoch": 2906} {"train_loss": -24.9793758392334, "global_step": 241221, "epoch": 2906} {"train_loss": -25.144681930541992, "global_step": 241222, "epoch": 2906} {"train_loss": -25.167224884033203, "global_step": 241223, "epoch": 2906} {"train_loss": -25.216047286987305, "global_step": 241224, "epoch": 2906} {"train_loss": -25.066116333007812, "global_step": 241225, "epoch": 2906} {"train_loss": -24.966800689697266, "global_step": 241226, "epoch": 2906} {"train_loss": -24.884891510009766, "global_step": 241227, "epoch": 2906} {"train_loss": -25.02341079711914, "global_step": 241228, "epoch": 2906} {"train_loss": -25.023712158203125, "global_step": 241229, "epoch": 2906} {"train_loss": -24.832685470581055, "global_step": 241230, "epoch": 2906} {"train_loss": -25.046085357666016, "global_step": 241231, "epoch": 2906} {"train_loss": -24.688369750976562, "global_step": 241232, "epoch": 2906} {"train_loss": -25.211938858032227, "global_step": 241233, "epoch": 2906} {"train_loss": -25.19472312927246, "global_step": 241234, "epoch": 2906} {"train_loss": -25.087732315063477, "global_step": 241235, "epoch": 2906} {"train_loss": -24.773317337036133, "global_step": 241236, "epoch": 2906} {"train_loss": -24.774240493774414, "global_step": 241237, "epoch": 2906} {"train_loss": -25.034011840820312, "global_step": 241238, "epoch": 2906} {"train_loss": -25.134000778198242, "global_step": 241239, "epoch": 2906} {"train_loss": -24.997182846069336, "global_step": 241240, "epoch": 2906} {"train_loss": -24.573944091796875, "global_step": 241241, "epoch": 2906} {"train_loss": -24.91814422607422, "global_step": 241242, "epoch": 2906} {"train_loss": -25.083402633666992, "global_step": 241243, "epoch": 2906} {"train_loss": -25.146015167236328, "global_step": 241244, "epoch": 2906} {"train_loss": -24.71766471862793, "global_step": 241245, "epoch": 2906} {"train_loss": -24.761585235595703, "global_step": 241246, "epoch": 2906} {"train_loss": -25.233753204345703, "global_step": 241247, "epoch": 2906} {"train_loss": -25.156667709350586, "global_step": 241248, "epoch": 2906} {"train_loss": -24.845277786254883, "global_step": 241249, "epoch": 2906} {"train_loss": -24.736774444580078, "global_step": 241250, "epoch": 2906} {"train_loss": -25.169281005859375, "global_step": 241251, "epoch": 2906} {"train_loss": -24.644123077392578, "global_step": 241252, "epoch": 2906} {"train_loss": -24.840641021728516, "global_step": 241253, "epoch": 2906} {"train_loss": -24.98593521118164, "global_step": 241254, "epoch": 2906} {"train_loss": -25.229625701904297, "global_step": 241255, "epoch": 2906} {"train_loss": -25.070096969604492, "global_step": 241256, "epoch": 2906} {"train_loss": -24.866804122924805, "global_step": 241257, "epoch": 2906} {"train_loss": -25.014129638671875, "global_step": 241258, "epoch": 2906} {"train_loss": -24.626134872436523, "global_step": 241259, "epoch": 2906} {"train_loss": -25.2195987701416, "global_step": 241260, "epoch": 2906} {"train_loss": -25.000425338745117, "global_step": 241261, "epoch": 2906} {"train_loss": -25.317142486572266, "global_step": 241262, "epoch": 2906} {"train_loss": -25.008939743041992, "global_step": 241263, "epoch": 2906} {"train_loss": -24.73036766052246, "global_step": 241264, "epoch": 2906} {"train_loss": -24.872400283813477, "global_step": 241265, "epoch": 2906} {"train_loss": -24.895708084106445, "global_step": 241266, "epoch": 2906} {"train_loss": -25.0461483001709, "global_step": 241267, "epoch": 2906} {"train_loss": -24.778270721435547, "global_step": 241268, "epoch": 2906} {"train_loss": -24.955291748046875, "global_step": 241269, "epoch": 2906} {"train_loss": -24.565221786499023, "global_step": 241270, "epoch": 2906} {"train_loss": -24.9527645111084, "global_step": 241271, "epoch": 2906} {"train_loss": -24.71483039855957, "global_step": 241272, "epoch": 2906} {"train_loss": -24.206907272338867, "global_step": 241273, "epoch": 2906} {"train_loss": -24.434484481811523, "global_step": 241274, "epoch": 2906} {"train_loss": -24.148548126220703, "global_step": 241275, "epoch": 2906} {"train_loss": -24.946569442749023, "global_step": 241276, "epoch": 2906} {"train_loss": -24.66655731201172, "global_step": 241277, "epoch": 2906} {"train_loss": -24.57610511779785, "global_step": 241278, "epoch": 2906} {"train_loss": -24.692777633666992, "global_step": 241279, "epoch": 2906} {"train_loss": -24.844198939311934, "global_step": 241280, "epoch": 2906, "val_loss": 6933672.0} {"train_loss": -23.844806671142578, "global_step": 241281, "epoch": 2907} {"train_loss": -24.473663330078125, "global_step": 241282, "epoch": 2907} {"train_loss": -24.047922134399414, "global_step": 241283, "epoch": 2907} {"train_loss": -24.624326705932617, "global_step": 241284, "epoch": 2907} {"train_loss": -24.10188865661621, "global_step": 241285, "epoch": 2907} {"train_loss": -23.951400756835938, "global_step": 241286, "epoch": 2907} {"train_loss": -24.524953842163086, "global_step": 241287, "epoch": 2907} {"train_loss": -24.368663787841797, "global_step": 241288, "epoch": 2907} {"train_loss": -24.95979881286621, "global_step": 241289, "epoch": 2907} {"train_loss": -24.21015167236328, "global_step": 241290, "epoch": 2907} {"train_loss": -24.514822006225586, "global_step": 241291, "epoch": 2907} {"train_loss": -24.28921890258789, "global_step": 241292, "epoch": 2907} {"train_loss": -24.513023376464844, "global_step": 241293, "epoch": 2907} {"train_loss": -24.451684951782227, "global_step": 241294, "epoch": 2907} {"train_loss": -24.789682388305664, "global_step": 241295, "epoch": 2907} {"train_loss": -24.489858627319336, "global_step": 241296, "epoch": 2907} {"train_loss": -24.975488662719727, "global_step": 241297, "epoch": 2907} {"train_loss": -24.677915573120117, "global_step": 241298, "epoch": 2907} {"train_loss": -24.810726165771484, "global_step": 241299, "epoch": 2907} {"train_loss": -24.55765151977539, "global_step": 241300, "epoch": 2907} {"train_loss": -24.78865623474121, "global_step": 241301, "epoch": 2907} {"train_loss": -24.59818458557129, "global_step": 241302, "epoch": 2907} {"train_loss": -24.793394088745117, "global_step": 241303, "epoch": 2907} {"train_loss": -24.857013702392578, "global_step": 241304, "epoch": 2907} {"train_loss": -24.655515670776367, "global_step": 241305, "epoch": 2907} {"train_loss": -25.01057243347168, "global_step": 241306, "epoch": 2907} {"train_loss": -25.044513702392578, "global_step": 241307, "epoch": 2907} {"train_loss": -24.738107681274414, "global_step": 241308, "epoch": 2907} {"train_loss": -25.068815231323242, "global_step": 241309, "epoch": 2907} {"train_loss": -24.9305419921875, "global_step": 241310, "epoch": 2907} {"train_loss": -24.748258590698242, "global_step": 241311, "epoch": 2907} {"train_loss": -25.075321197509766, "global_step": 241312, "epoch": 2907} {"train_loss": -24.8916015625, "global_step": 241313, "epoch": 2907} {"train_loss": -25.02290916442871, "global_step": 241314, "epoch": 2907} {"train_loss": -24.84276580810547, "global_step": 241315, "epoch": 2907} {"train_loss": -24.935808181762695, "global_step": 241316, "epoch": 2907} {"train_loss": -25.08523941040039, "global_step": 241317, "epoch": 2907} {"train_loss": -24.902406692504883, "global_step": 241318, "epoch": 2907} {"train_loss": -25.0388240814209, "global_step": 241319, "epoch": 2907} {"train_loss": -25.034378051757812, "global_step": 241320, "epoch": 2907} {"train_loss": -25.01401138305664, "global_step": 241321, "epoch": 2907} {"train_loss": -25.064245223999023, "global_step": 241322, "epoch": 2907} {"train_loss": -25.113245010375977, "global_step": 241323, "epoch": 2907} {"train_loss": -25.07574462890625, "global_step": 241324, "epoch": 2907} {"train_loss": -25.221923828125, "global_step": 241325, "epoch": 2907} {"train_loss": -25.074798583984375, "global_step": 241326, "epoch": 2907} {"train_loss": -24.761032104492188, "global_step": 241327, "epoch": 2907} {"train_loss": -25.235158920288086, "global_step": 241328, "epoch": 2907} {"train_loss": -25.142536163330078, "global_step": 241329, "epoch": 2907} {"train_loss": -24.81355094909668, "global_step": 241330, "epoch": 2907} {"train_loss": -24.9882755279541, "global_step": 241331, "epoch": 2907} {"train_loss": -24.80645179748535, "global_step": 241332, "epoch": 2907} {"train_loss": -25.3438720703125, "global_step": 241333, "epoch": 2907} {"train_loss": -24.734609603881836, "global_step": 241334, "epoch": 2907} {"train_loss": -24.745811462402344, "global_step": 241335, "epoch": 2907} {"train_loss": -25.065916061401367, "global_step": 241336, "epoch": 2907} {"train_loss": -25.364160537719727, "global_step": 241337, "epoch": 2907} {"train_loss": -24.775712966918945, "global_step": 241338, "epoch": 2907} {"train_loss": -24.741819381713867, "global_step": 241339, "epoch": 2907} {"train_loss": -24.914457321166992, "global_step": 241340, "epoch": 2907} {"train_loss": -24.762313842773438, "global_step": 241341, "epoch": 2907} {"train_loss": -24.554006576538086, "global_step": 241342, "epoch": 2907} {"train_loss": -24.4544734954834, "global_step": 241343, "epoch": 2907} {"train_loss": -24.969364166259766, "global_step": 241344, "epoch": 2907} {"train_loss": -24.727231979370117, "global_step": 241345, "epoch": 2907} {"train_loss": -25.10968589782715, "global_step": 241346, "epoch": 2907} {"train_loss": -25.043561935424805, "global_step": 241347, "epoch": 2907} {"train_loss": -24.5327205657959, "global_step": 241348, "epoch": 2907} {"train_loss": -24.59958839416504, "global_step": 241349, "epoch": 2907} {"train_loss": -25.010141372680664, "global_step": 241350, "epoch": 2907} {"train_loss": -24.709524154663086, "global_step": 241351, "epoch": 2907} {"train_loss": -24.729354858398438, "global_step": 241352, "epoch": 2907} {"train_loss": -24.934024810791016, "global_step": 241353, "epoch": 2907} {"train_loss": -24.728830337524414, "global_step": 241354, "epoch": 2907} {"train_loss": -25.064964294433594, "global_step": 241355, "epoch": 2907} {"train_loss": -24.965513229370117, "global_step": 241356, "epoch": 2907} {"train_loss": -25.207609176635742, "global_step": 241357, "epoch": 2907} {"train_loss": -24.73664665222168, "global_step": 241358, "epoch": 2907} {"train_loss": -25.197778701782227, "global_step": 241359, "epoch": 2907} {"train_loss": -24.843923568725586, "global_step": 241360, "epoch": 2907} {"train_loss": -25.185327529907227, "global_step": 241361, "epoch": 2907} {"train_loss": -25.10848045349121, "global_step": 241362, "epoch": 2907} {"train_loss": -24.808255643729705, "global_step": 241363, "epoch": 2907, "val_loss": 6717153.0} {"train_loss": -25.048730850219727, "global_step": 241364, "epoch": 2908} {"train_loss": -24.796274185180664, "global_step": 241365, "epoch": 2908} {"train_loss": -24.470165252685547, "global_step": 241366, "epoch": 2908} {"train_loss": -24.271339416503906, "global_step": 241367, "epoch": 2908} {"train_loss": -24.241727828979492, "global_step": 241368, "epoch": 2908} {"train_loss": -24.165111541748047, "global_step": 241369, "epoch": 2908} {"train_loss": -24.039386749267578, "global_step": 241370, "epoch": 2908} {"train_loss": -23.968473434448242, "global_step": 241371, "epoch": 2908} {"train_loss": -24.65416717529297, "global_step": 241372, "epoch": 2908} {"train_loss": -24.572351455688477, "global_step": 241373, "epoch": 2908} {"train_loss": -24.61389923095703, "global_step": 241374, "epoch": 2908} {"train_loss": -24.424474716186523, "global_step": 241375, "epoch": 2908} {"train_loss": -24.809152603149414, "global_step": 241376, "epoch": 2908} {"train_loss": -24.648799896240234, "global_step": 241377, "epoch": 2908} {"train_loss": -24.431135177612305, "global_step": 241378, "epoch": 2908} {"train_loss": -24.64656639099121, "global_step": 241379, "epoch": 2908} {"train_loss": -24.658178329467773, "global_step": 241380, "epoch": 2908} {"train_loss": -24.625516891479492, "global_step": 241381, "epoch": 2908} {"train_loss": -24.333404541015625, "global_step": 241382, "epoch": 2908} {"train_loss": -24.6129150390625, "global_step": 241383, "epoch": 2908} {"train_loss": -24.75153923034668, "global_step": 241384, "epoch": 2908} {"train_loss": -24.582534790039062, "global_step": 241385, "epoch": 2908} {"train_loss": -24.623491287231445, "global_step": 241386, "epoch": 2908} {"train_loss": -24.768945693969727, "global_step": 241387, "epoch": 2908} {"train_loss": -24.605321884155273, "global_step": 241388, "epoch": 2908} {"train_loss": -24.74086570739746, "global_step": 241389, "epoch": 2908} {"train_loss": -24.828018188476562, "global_step": 241390, "epoch": 2908} {"train_loss": -24.637943267822266, "global_step": 241391, "epoch": 2908} {"train_loss": -25.080514907836914, "global_step": 241392, "epoch": 2908} {"train_loss": -25.062427520751953, "global_step": 241393, "epoch": 2908} {"train_loss": -24.719642639160156, "global_step": 241394, "epoch": 2908} {"train_loss": -24.986522674560547, "global_step": 241395, "epoch": 2908} {"train_loss": -25.332698822021484, "global_step": 241396, "epoch": 2908} {"train_loss": -25.10811996459961, "global_step": 241397, "epoch": 2908} {"train_loss": -25.214094161987305, "global_step": 241398, "epoch": 2908} {"train_loss": -24.975011825561523, "global_step": 241399, "epoch": 2908} {"train_loss": -25.17774200439453, "global_step": 241400, "epoch": 2908} {"train_loss": -24.85933494567871, "global_step": 241401, "epoch": 2908} {"train_loss": -25.01429557800293, "global_step": 241402, "epoch": 2908} {"train_loss": -25.04062271118164, "global_step": 241403, "epoch": 2908} {"train_loss": -25.047321319580078, "global_step": 241404, "epoch": 2908} {"train_loss": -25.079477310180664, "global_step": 241405, "epoch": 2908} {"train_loss": -25.14614486694336, "global_step": 241406, "epoch": 2908} {"train_loss": -24.94875717163086, "global_step": 241407, "epoch": 2908} {"train_loss": -25.148481369018555, "global_step": 241408, "epoch": 2908} {"train_loss": -25.143808364868164, "global_step": 241409, "epoch": 2908} {"train_loss": -24.908153533935547, "global_step": 241410, "epoch": 2908} {"train_loss": -24.47694969177246, "global_step": 241411, "epoch": 2908} {"train_loss": -24.835262298583984, "global_step": 241412, "epoch": 2908} {"train_loss": -24.899646759033203, "global_step": 241413, "epoch": 2908} {"train_loss": -25.051538467407227, "global_step": 241414, "epoch": 2908} {"train_loss": -24.442556381225586, "global_step": 241415, "epoch": 2908} {"train_loss": -24.41350746154785, "global_step": 241416, "epoch": 2908} {"train_loss": -24.821685791015625, "global_step": 241417, "epoch": 2908} {"train_loss": -25.149377822875977, "global_step": 241418, "epoch": 2908} {"train_loss": -24.838623046875, "global_step": 241419, "epoch": 2908} {"train_loss": -24.76466178894043, "global_step": 241420, "epoch": 2908} {"train_loss": -24.7614803314209, "global_step": 241421, "epoch": 2908} {"train_loss": -24.929407119750977, "global_step": 241422, "epoch": 2908} {"train_loss": -25.1778621673584, "global_step": 241423, "epoch": 2908} {"train_loss": -24.84305763244629, "global_step": 241424, "epoch": 2908} {"train_loss": -24.986391067504883, "global_step": 241425, "epoch": 2908} {"train_loss": -25.01468276977539, "global_step": 241426, "epoch": 2908} {"train_loss": -24.80129051208496, "global_step": 241427, "epoch": 2908} {"train_loss": -24.69691276550293, "global_step": 241428, "epoch": 2908} {"train_loss": -25.048215866088867, "global_step": 241429, "epoch": 2908} {"train_loss": -24.377330780029297, "global_step": 241430, "epoch": 2908} {"train_loss": -24.63718032836914, "global_step": 241431, "epoch": 2908} {"train_loss": -24.869064331054688, "global_step": 241432, "epoch": 2908} {"train_loss": -25.120559692382812, "global_step": 241433, "epoch": 2908} {"train_loss": -25.117084503173828, "global_step": 241434, "epoch": 2908} {"train_loss": -25.158557891845703, "global_step": 241435, "epoch": 2908} {"train_loss": -24.637414932250977, "global_step": 241436, "epoch": 2908} {"train_loss": -24.709543228149414, "global_step": 241437, "epoch": 2908} {"train_loss": -24.68688201904297, "global_step": 241438, "epoch": 2908} {"train_loss": -24.628217697143555, "global_step": 241439, "epoch": 2908} {"train_loss": -24.868650436401367, "global_step": 241440, "epoch": 2908} {"train_loss": -24.51985740661621, "global_step": 241441, "epoch": 2908} {"train_loss": -25.166364669799805, "global_step": 241442, "epoch": 2908} {"train_loss": -24.496274948120117, "global_step": 241443, "epoch": 2908} {"train_loss": -25.104568481445312, "global_step": 241444, "epoch": 2908} {"train_loss": -25.048059463500977, "global_step": 241445, "epoch": 2908} {"train_loss": -24.798203916434783, "global_step": 241446, "epoch": 2908, "val_loss": 6920742.0} {"train_loss": -24.37531852722168, "global_step": 241447, "epoch": 2909} {"train_loss": -24.662824630737305, "global_step": 241448, "epoch": 2909} {"train_loss": -24.487396240234375, "global_step": 241449, "epoch": 2909} {"train_loss": -23.99521827697754, "global_step": 241450, "epoch": 2909} {"train_loss": -24.23650360107422, "global_step": 241451, "epoch": 2909} {"train_loss": -24.565061569213867, "global_step": 241452, "epoch": 2909} {"train_loss": -24.54050064086914, "global_step": 241453, "epoch": 2909} {"train_loss": -24.27191734313965, "global_step": 241454, "epoch": 2909} {"train_loss": -24.672744750976562, "global_step": 241455, "epoch": 2909} {"train_loss": -24.59549331665039, "global_step": 241456, "epoch": 2909} {"train_loss": -24.66034507751465, "global_step": 241457, "epoch": 2909} {"train_loss": -24.298450469970703, "global_step": 241458, "epoch": 2909} {"train_loss": -24.98183250427246, "global_step": 241459, "epoch": 2909} {"train_loss": -25.006256103515625, "global_step": 241460, "epoch": 2909} {"train_loss": -24.695816040039062, "global_step": 241461, "epoch": 2909} {"train_loss": -24.76727294921875, "global_step": 241462, "epoch": 2909} {"train_loss": -24.644155502319336, "global_step": 241463, "epoch": 2909} {"train_loss": -24.63335609436035, "global_step": 241464, "epoch": 2909} {"train_loss": -24.96845817565918, "global_step": 241465, "epoch": 2909} {"train_loss": -24.714767456054688, "global_step": 241466, "epoch": 2909} {"train_loss": -24.8582820892334, "global_step": 241467, "epoch": 2909} {"train_loss": -24.654754638671875, "global_step": 241468, "epoch": 2909} {"train_loss": -25.1373348236084, "global_step": 241469, "epoch": 2909} {"train_loss": -24.85167694091797, "global_step": 241470, "epoch": 2909} {"train_loss": -24.678401947021484, "global_step": 241471, "epoch": 2909} {"train_loss": -24.995412826538086, "global_step": 241472, "epoch": 2909} {"train_loss": -24.95090675354004, "global_step": 241473, "epoch": 2909} {"train_loss": -24.87024688720703, "global_step": 241474, "epoch": 2909} {"train_loss": -24.869667053222656, "global_step": 241475, "epoch": 2909} {"train_loss": -24.878971099853516, "global_step": 241476, "epoch": 2909} {"train_loss": -24.961395263671875, "global_step": 241477, "epoch": 2909} {"train_loss": -25.0821533203125, "global_step": 241478, "epoch": 2909} {"train_loss": -24.9801082611084, "global_step": 241479, "epoch": 2909} {"train_loss": -25.038606643676758, "global_step": 241480, "epoch": 2909} {"train_loss": -24.972063064575195, "global_step": 241481, "epoch": 2909} {"train_loss": -25.12017822265625, "global_step": 241482, "epoch": 2909} {"train_loss": -24.89272117614746, "global_step": 241483, "epoch": 2909} {"train_loss": -24.885501861572266, "global_step": 241484, "epoch": 2909} {"train_loss": -24.97517967224121, "global_step": 241485, "epoch": 2909} {"train_loss": -24.556501388549805, "global_step": 241486, "epoch": 2909} {"train_loss": -24.13521957397461, "global_step": 241487, "epoch": 2909} {"train_loss": -24.523372650146484, "global_step": 241488, "epoch": 2909} {"train_loss": -25.115583419799805, "global_step": 241489, "epoch": 2909} {"train_loss": -25.05739402770996, "global_step": 241490, "epoch": 2909} {"train_loss": -24.510929107666016, "global_step": 241491, "epoch": 2909} {"train_loss": -25.15707778930664, "global_step": 241492, "epoch": 2909} {"train_loss": -24.652469635009766, "global_step": 241493, "epoch": 2909} {"train_loss": -24.956533432006836, "global_step": 241494, "epoch": 2909} {"train_loss": -24.596702575683594, "global_step": 241495, "epoch": 2909} {"train_loss": -24.546255111694336, "global_step": 241496, "epoch": 2909} {"train_loss": -24.6920108795166, "global_step": 241497, "epoch": 2909} {"train_loss": -24.93226432800293, "global_step": 241498, "epoch": 2909} {"train_loss": -24.683032989501953, "global_step": 241499, "epoch": 2909} {"train_loss": -24.970149993896484, "global_step": 241500, "epoch": 2909} {"train_loss": -24.760679244995117, "global_step": 241501, "epoch": 2909} {"train_loss": -24.930282592773438, "global_step": 241502, "epoch": 2909} {"train_loss": -24.447612762451172, "global_step": 241503, "epoch": 2909} {"train_loss": -24.90130043029785, "global_step": 241504, "epoch": 2909} {"train_loss": -24.267370223999023, "global_step": 241505, "epoch": 2909} {"train_loss": -24.5585880279541, "global_step": 241506, "epoch": 2909} {"train_loss": -24.893024444580078, "global_step": 241507, "epoch": 2909} {"train_loss": -24.888370513916016, "global_step": 241508, "epoch": 2909} {"train_loss": -24.75539207458496, "global_step": 241509, "epoch": 2909} {"train_loss": -24.32900047302246, "global_step": 241510, "epoch": 2909} {"train_loss": -24.762065887451172, "global_step": 241511, "epoch": 2909} {"train_loss": -24.794919967651367, "global_step": 241512, "epoch": 2909} {"train_loss": -25.073652267456055, "global_step": 241513, "epoch": 2909} {"train_loss": -24.707761764526367, "global_step": 241514, "epoch": 2909} {"train_loss": -25.09540367126465, "global_step": 241515, "epoch": 2909} {"train_loss": -24.988935470581055, "global_step": 241516, "epoch": 2909} {"train_loss": -25.17540740966797, "global_step": 241517, "epoch": 2909} {"train_loss": -25.19942283630371, "global_step": 241518, "epoch": 2909} {"train_loss": -24.842466354370117, "global_step": 241519, "epoch": 2909} {"train_loss": -24.943037033081055, "global_step": 241520, "epoch": 2909} {"train_loss": -25.362218856811523, "global_step": 241521, "epoch": 2909} {"train_loss": -25.014368057250977, "global_step": 241522, "epoch": 2909} {"train_loss": -25.01026153564453, "global_step": 241523, "epoch": 2909} {"train_loss": -24.823043823242188, "global_step": 241524, "epoch": 2909} {"train_loss": -25.23151206970215, "global_step": 241525, "epoch": 2909} {"train_loss": -24.835277557373047, "global_step": 241526, "epoch": 2909} {"train_loss": -25.166772842407227, "global_step": 241527, "epoch": 2909} {"train_loss": -25.104909896850586, "global_step": 241528, "epoch": 2909} {"train_loss": -24.79164247627718, "global_step": 241529, "epoch": 2909, "val_loss": 6746781.0} {"train_loss": -24.820743560791016, "global_step": 241530, "epoch": 2910} {"train_loss": -23.269372940063477, "global_step": 241531, "epoch": 2910} {"train_loss": -22.89872169494629, "global_step": 241532, "epoch": 2910} {"train_loss": -23.934831619262695, "global_step": 241533, "epoch": 2910} {"train_loss": -24.5205020904541, "global_step": 241534, "epoch": 2910} {"train_loss": -24.575149536132812, "global_step": 241535, "epoch": 2910} {"train_loss": -24.89027976989746, "global_step": 241536, "epoch": 2910} {"train_loss": -24.19561004638672, "global_step": 241537, "epoch": 2910} {"train_loss": -24.73900604248047, "global_step": 241538, "epoch": 2910} {"train_loss": -24.71748924255371, "global_step": 241539, "epoch": 2910} {"train_loss": -24.428817749023438, "global_step": 241540, "epoch": 2910} {"train_loss": -24.824539184570312, "global_step": 241541, "epoch": 2910} {"train_loss": -24.977237701416016, "global_step": 241542, "epoch": 2910} {"train_loss": -24.578466415405273, "global_step": 241543, "epoch": 2910} {"train_loss": -24.547239303588867, "global_step": 241544, "epoch": 2910} {"train_loss": -24.634855270385742, "global_step": 241545, "epoch": 2910} {"train_loss": -24.51974868774414, "global_step": 241546, "epoch": 2910} {"train_loss": -25.20824432373047, "global_step": 241547, "epoch": 2910} {"train_loss": -24.52414321899414, "global_step": 241548, "epoch": 2910} {"train_loss": -24.485275268554688, "global_step": 241549, "epoch": 2910} {"train_loss": -24.91402244567871, "global_step": 241550, "epoch": 2910} {"train_loss": -25.05617904663086, "global_step": 241551, "epoch": 2910} {"train_loss": -24.478439331054688, "global_step": 241552, "epoch": 2910} {"train_loss": -24.64566993713379, "global_step": 241553, "epoch": 2910} {"train_loss": -25.044788360595703, "global_step": 241554, "epoch": 2910} {"train_loss": -24.94202995300293, "global_step": 241555, "epoch": 2910} {"train_loss": -24.752092361450195, "global_step": 241556, "epoch": 2910} {"train_loss": -24.952213287353516, "global_step": 241557, "epoch": 2910} {"train_loss": -24.891935348510742, "global_step": 241558, "epoch": 2910} {"train_loss": -25.04047966003418, "global_step": 241559, "epoch": 2910} {"train_loss": -25.09907341003418, "global_step": 241560, "epoch": 2910} {"train_loss": -25.22968864440918, "global_step": 241561, "epoch": 2910} {"train_loss": -25.003171920776367, "global_step": 241562, "epoch": 2910} {"train_loss": -24.85430908203125, "global_step": 241563, "epoch": 2910} {"train_loss": -25.003843307495117, "global_step": 241564, "epoch": 2910} {"train_loss": -24.574106216430664, "global_step": 241565, "epoch": 2910} {"train_loss": -25.444055557250977, "global_step": 241566, "epoch": 2910} {"train_loss": -25.02138328552246, "global_step": 241567, "epoch": 2910} {"train_loss": -25.012460708618164, "global_step": 241568, "epoch": 2910} {"train_loss": -24.64739418029785, "global_step": 241569, "epoch": 2910} {"train_loss": -24.774612426757812, "global_step": 241570, "epoch": 2910} {"train_loss": -24.772533416748047, "global_step": 241571, "epoch": 2910} {"train_loss": -24.934804916381836, "global_step": 241572, "epoch": 2910} {"train_loss": -24.8013916015625, "global_step": 241573, "epoch": 2910} {"train_loss": -24.73341178894043, "global_step": 241574, "epoch": 2910} {"train_loss": -25.14422607421875, "global_step": 241575, "epoch": 2910} {"train_loss": -25.138683319091797, "global_step": 241576, "epoch": 2910} {"train_loss": -25.02042579650879, "global_step": 241577, "epoch": 2910} {"train_loss": -25.3190860748291, "global_step": 241578, "epoch": 2910} {"train_loss": -24.386445999145508, "global_step": 241579, "epoch": 2910} {"train_loss": -24.6317138671875, "global_step": 241580, "epoch": 2910} {"train_loss": -24.435321807861328, "global_step": 241581, "epoch": 2910} {"train_loss": -24.07367515563965, "global_step": 241582, "epoch": 2910} {"train_loss": -24.651281356811523, "global_step": 241583, "epoch": 2910} {"train_loss": -24.798337936401367, "global_step": 241584, "epoch": 2910} {"train_loss": -24.520666122436523, "global_step": 241585, "epoch": 2910} {"train_loss": -24.90120506286621, "global_step": 241586, "epoch": 2910} {"train_loss": -24.457237243652344, "global_step": 241587, "epoch": 2910} {"train_loss": -24.63856315612793, "global_step": 241588, "epoch": 2910} {"train_loss": -24.617979049682617, "global_step": 241589, "epoch": 2910} {"train_loss": -24.831972122192383, "global_step": 241590, "epoch": 2910} {"train_loss": -24.517784118652344, "global_step": 241591, "epoch": 2910} {"train_loss": -24.396703720092773, "global_step": 241592, "epoch": 2910} {"train_loss": -24.805456161499023, "global_step": 241593, "epoch": 2910} {"train_loss": -24.469913482666016, "global_step": 241594, "epoch": 2910} {"train_loss": -24.45627784729004, "global_step": 241595, "epoch": 2910} {"train_loss": -24.246793746948242, "global_step": 241596, "epoch": 2910} {"train_loss": -24.784435272216797, "global_step": 241597, "epoch": 2910} {"train_loss": -24.782058715820312, "global_step": 241598, "epoch": 2910} {"train_loss": -23.9599609375, "global_step": 241599, "epoch": 2910} {"train_loss": -24.904367446899414, "global_step": 241600, "epoch": 2910} {"train_loss": -24.500171661376953, "global_step": 241601, "epoch": 2910} {"train_loss": -24.49473762512207, "global_step": 241602, "epoch": 2910} {"train_loss": -24.60352897644043, "global_step": 241603, "epoch": 2910} {"train_loss": -24.746076583862305, "global_step": 241604, "epoch": 2910} {"train_loss": -24.83089828491211, "global_step": 241605, "epoch": 2910} {"train_loss": -24.94621467590332, "global_step": 241606, "epoch": 2910} {"train_loss": -24.9460506439209, "global_step": 241607, "epoch": 2910} {"train_loss": -24.81733512878418, "global_step": 241608, "epoch": 2910} {"train_loss": -24.871967315673828, "global_step": 241609, "epoch": 2910} {"train_loss": -24.557775497436523, "global_step": 241610, "epoch": 2910} {"train_loss": -24.995460510253906, "global_step": 241611, "epoch": 2910} {"train_loss": -24.69880255733628, "global_step": 241612, "epoch": 2910, "val_loss": 6798650.0} {"train_loss": -23.804977416992188, "global_step": 241613, "epoch": 2911} {"train_loss": -23.828908920288086, "global_step": 241614, "epoch": 2911} {"train_loss": -24.4615478515625, "global_step": 241615, "epoch": 2911} {"train_loss": -24.31181526184082, "global_step": 241616, "epoch": 2911} {"train_loss": -24.44292449951172, "global_step": 241617, "epoch": 2911} {"train_loss": -24.604883193969727, "global_step": 241618, "epoch": 2911} {"train_loss": -24.636619567871094, "global_step": 241619, "epoch": 2911} {"train_loss": -24.233205795288086, "global_step": 241620, "epoch": 2911} {"train_loss": -24.932538986206055, "global_step": 241621, "epoch": 2911} {"train_loss": -24.39999008178711, "global_step": 241622, "epoch": 2911} {"train_loss": -24.642377853393555, "global_step": 241623, "epoch": 2911} {"train_loss": -24.546607971191406, "global_step": 241624, "epoch": 2911} {"train_loss": -24.49509048461914, "global_step": 241625, "epoch": 2911} {"train_loss": -24.745281219482422, "global_step": 241626, "epoch": 2911} {"train_loss": -24.686813354492188, "global_step": 241627, "epoch": 2911} {"train_loss": -24.97633171081543, "global_step": 241628, "epoch": 2911} {"train_loss": -24.49460792541504, "global_step": 241629, "epoch": 2911} {"train_loss": -24.697433471679688, "global_step": 241630, "epoch": 2911} {"train_loss": -24.825820922851562, "global_step": 241631, "epoch": 2911} {"train_loss": -24.703765869140625, "global_step": 241632, "epoch": 2911} {"train_loss": -24.727506637573242, "global_step": 241633, "epoch": 2911} {"train_loss": -24.852928161621094, "global_step": 241634, "epoch": 2911} {"train_loss": -24.911514282226562, "global_step": 241635, "epoch": 2911} {"train_loss": -25.06342887878418, "global_step": 241636, "epoch": 2911} {"train_loss": -24.963788986206055, "global_step": 241637, "epoch": 2911} {"train_loss": -25.155231475830078, "global_step": 241638, "epoch": 2911} {"train_loss": -24.475597381591797, "global_step": 241639, "epoch": 2911} {"train_loss": -24.49309730529785, "global_step": 241640, "epoch": 2911} {"train_loss": -25.247364044189453, "global_step": 241641, "epoch": 2911} {"train_loss": -25.155771255493164, "global_step": 241642, "epoch": 2911} {"train_loss": -25.153121948242188, "global_step": 241643, "epoch": 2911} {"train_loss": -24.808603286743164, "global_step": 241644, "epoch": 2911} {"train_loss": -24.74597930908203, "global_step": 241645, "epoch": 2911} {"train_loss": -24.996328353881836, "global_step": 241646, "epoch": 2911} {"train_loss": -25.009185791015625, "global_step": 241647, "epoch": 2911} {"train_loss": -24.89027976989746, "global_step": 241648, "epoch": 2911} {"train_loss": -24.86667251586914, "global_step": 241649, "epoch": 2911} {"train_loss": -25.189916610717773, "global_step": 241650, "epoch": 2911} {"train_loss": -25.161046981811523, "global_step": 241651, "epoch": 2911} {"train_loss": -24.759063720703125, "global_step": 241652, "epoch": 2911} {"train_loss": -24.832590103149414, "global_step": 241653, "epoch": 2911} {"train_loss": -25.16119956970215, "global_step": 241654, "epoch": 2911} {"train_loss": -25.37593650817871, "global_step": 241655, "epoch": 2911} {"train_loss": -25.53742027282715, "global_step": 241656, "epoch": 2911} {"train_loss": -24.932697296142578, "global_step": 241657, "epoch": 2911} {"train_loss": -25.216161727905273, "global_step": 241658, "epoch": 2911} {"train_loss": -25.08736228942871, "global_step": 241659, "epoch": 2911} {"train_loss": -24.9888973236084, "global_step": 241660, "epoch": 2911} {"train_loss": -24.875110626220703, "global_step": 241661, "epoch": 2911} {"train_loss": -25.129592895507812, "global_step": 241662, "epoch": 2911} {"train_loss": -25.42567253112793, "global_step": 241663, "epoch": 2911} {"train_loss": -25.1037654876709, "global_step": 241664, "epoch": 2911} {"train_loss": -25.090986251831055, "global_step": 241665, "epoch": 2911} {"train_loss": -25.078123092651367, "global_step": 241666, "epoch": 2911} {"train_loss": -24.833511352539062, "global_step": 241667, "epoch": 2911} {"train_loss": -24.49641227722168, "global_step": 241668, "epoch": 2911} {"train_loss": -24.32692527770996, "global_step": 241669, "epoch": 2911} {"train_loss": -24.34197425842285, "global_step": 241670, "epoch": 2911} {"train_loss": -24.48550033569336, "global_step": 241671, "epoch": 2911} {"train_loss": -24.33632469177246, "global_step": 241672, "epoch": 2911} {"train_loss": -24.936532974243164, "global_step": 241673, "epoch": 2911} {"train_loss": -24.472301483154297, "global_step": 241674, "epoch": 2911} {"train_loss": -24.258655548095703, "global_step": 241675, "epoch": 2911} {"train_loss": -24.622034072875977, "global_step": 241676, "epoch": 2911} {"train_loss": -24.939695358276367, "global_step": 241677, "epoch": 2911} {"train_loss": -24.54088592529297, "global_step": 241678, "epoch": 2911} {"train_loss": -24.716480255126953, "global_step": 241679, "epoch": 2911} {"train_loss": -24.87986183166504, "global_step": 241680, "epoch": 2911} {"train_loss": -24.720108032226562, "global_step": 241681, "epoch": 2911} {"train_loss": -24.988191604614258, "global_step": 241682, "epoch": 2911} {"train_loss": -24.61956787109375, "global_step": 241683, "epoch": 2911} {"train_loss": -24.61237907409668, "global_step": 241684, "epoch": 2911} {"train_loss": -25.023902893066406, "global_step": 241685, "epoch": 2911} {"train_loss": -24.808361053466797, "global_step": 241686, "epoch": 2911} {"train_loss": -24.801319122314453, "global_step": 241687, "epoch": 2911} {"train_loss": -24.86945343017578, "global_step": 241688, "epoch": 2911} {"train_loss": -24.710424423217773, "global_step": 241689, "epoch": 2911} {"train_loss": -24.77126121520996, "global_step": 241690, "epoch": 2911} {"train_loss": -24.980276107788086, "global_step": 241691, "epoch": 2911} {"train_loss": -25.078062057495117, "global_step": 241692, "epoch": 2911} {"train_loss": -24.843341827392578, "global_step": 241693, "epoch": 2911} {"train_loss": -25.074119567871094, "global_step": 241694, "epoch": 2911} {"train_loss": -24.79070054479392, "global_step": 241695, "epoch": 2911, "val_loss": 6742978.0} {"train_loss": -24.639484405517578, "global_step": 241696, "epoch": 2912} {"train_loss": -24.64171028137207, "global_step": 241697, "epoch": 2912} {"train_loss": -24.448883056640625, "global_step": 241698, "epoch": 2912} {"train_loss": -24.589519500732422, "global_step": 241699, "epoch": 2912} {"train_loss": -24.855648040771484, "global_step": 241700, "epoch": 2912} {"train_loss": -25.07168197631836, "global_step": 241701, "epoch": 2912} {"train_loss": -24.83778953552246, "global_step": 241702, "epoch": 2912} {"train_loss": -24.70131492614746, "global_step": 241703, "epoch": 2912} {"train_loss": -24.808435440063477, "global_step": 241704, "epoch": 2912} {"train_loss": -25.089323043823242, "global_step": 241705, "epoch": 2912} {"train_loss": -25.01239585876465, "global_step": 241706, "epoch": 2912} {"train_loss": -24.832639694213867, "global_step": 241707, "epoch": 2912} {"train_loss": -24.63117790222168, "global_step": 241708, "epoch": 2912} {"train_loss": -25.097625732421875, "global_step": 241709, "epoch": 2912} {"train_loss": -25.160602569580078, "global_step": 241710, "epoch": 2912} {"train_loss": -24.841083526611328, "global_step": 241711, "epoch": 2912} {"train_loss": -24.940433502197266, "global_step": 241712, "epoch": 2912} {"train_loss": -24.719318389892578, "global_step": 241713, "epoch": 2912} {"train_loss": -25.03173828125, "global_step": 241714, "epoch": 2912} {"train_loss": -24.970800399780273, "global_step": 241715, "epoch": 2912} {"train_loss": -24.912322998046875, "global_step": 241716, "epoch": 2912} {"train_loss": -25.266210556030273, "global_step": 241717, "epoch": 2912} {"train_loss": -24.451852798461914, "global_step": 241718, "epoch": 2912} {"train_loss": -25.058349609375, "global_step": 241719, "epoch": 2912} {"train_loss": -24.991666793823242, "global_step": 241720, "epoch": 2912} {"train_loss": -24.975065231323242, "global_step": 241721, "epoch": 2912} {"train_loss": -25.063312530517578, "global_step": 241722, "epoch": 2912} {"train_loss": -24.864803314208984, "global_step": 241723, "epoch": 2912} {"train_loss": -24.92099952697754, "global_step": 241724, "epoch": 2912} {"train_loss": -25.224794387817383, "global_step": 241725, "epoch": 2912} {"train_loss": -24.680078506469727, "global_step": 241726, "epoch": 2912} {"train_loss": -24.837242126464844, "global_step": 241727, "epoch": 2912} {"train_loss": -24.825990676879883, "global_step": 241728, "epoch": 2912} {"train_loss": -24.726701736450195, "global_step": 241729, "epoch": 2912} {"train_loss": -24.88309669494629, "global_step": 241730, "epoch": 2912} {"train_loss": -24.66542625427246, "global_step": 241731, "epoch": 2912} {"train_loss": -24.668630599975586, "global_step": 241732, "epoch": 2912} {"train_loss": -25.06427574157715, "global_step": 241733, "epoch": 2912} {"train_loss": -24.80658531188965, "global_step": 241734, "epoch": 2912} {"train_loss": -25.062044143676758, "global_step": 241735, "epoch": 2912} {"train_loss": -25.109384536743164, "global_step": 241736, "epoch": 2912} {"train_loss": -24.692228317260742, "global_step": 241737, "epoch": 2912} {"train_loss": -24.699390411376953, "global_step": 241738, "epoch": 2912} {"train_loss": -24.638315200805664, "global_step": 241739, "epoch": 2912} {"train_loss": -24.789228439331055, "global_step": 241740, "epoch": 2912} {"train_loss": -25.13982582092285, "global_step": 241741, "epoch": 2912} {"train_loss": -24.609580993652344, "global_step": 241742, "epoch": 2912} {"train_loss": -25.088735580444336, "global_step": 241743, "epoch": 2912} {"train_loss": -25.2031192779541, "global_step": 241744, "epoch": 2912} {"train_loss": -25.0277099609375, "global_step": 241745, "epoch": 2912} {"train_loss": -24.578157424926758, "global_step": 241746, "epoch": 2912} {"train_loss": -24.917139053344727, "global_step": 241747, "epoch": 2912} {"train_loss": -25.277708053588867, "global_step": 241748, "epoch": 2912} {"train_loss": -24.985355377197266, "global_step": 241749, "epoch": 2912} {"train_loss": -24.850000381469727, "global_step": 241750, "epoch": 2912} {"train_loss": -24.825775146484375, "global_step": 241751, "epoch": 2912} {"train_loss": -25.236228942871094, "global_step": 241752, "epoch": 2912} {"train_loss": -25.223474502563477, "global_step": 241753, "epoch": 2912} {"train_loss": -25.1925106048584, "global_step": 241754, "epoch": 2912} {"train_loss": -25.1643009185791, "global_step": 241755, "epoch": 2912} {"train_loss": -25.108339309692383, "global_step": 241756, "epoch": 2912} {"train_loss": -24.943439483642578, "global_step": 241757, "epoch": 2912} {"train_loss": -25.311498641967773, "global_step": 241758, "epoch": 2912} {"train_loss": -25.00260353088379, "global_step": 241759, "epoch": 2912} {"train_loss": -24.96738624572754, "global_step": 241760, "epoch": 2912} {"train_loss": -24.906665802001953, "global_step": 241761, "epoch": 2912} {"train_loss": -24.608495712280273, "global_step": 241762, "epoch": 2912} {"train_loss": -24.628671646118164, "global_step": 241763, "epoch": 2912} {"train_loss": -24.885791778564453, "global_step": 241764, "epoch": 2912} {"train_loss": -25.085195541381836, "global_step": 241765, "epoch": 2912} {"train_loss": -25.234455108642578, "global_step": 241766, "epoch": 2912} {"train_loss": -24.489601135253906, "global_step": 241767, "epoch": 2912} {"train_loss": -24.877056121826172, "global_step": 241768, "epoch": 2912} {"train_loss": -24.593332290649414, "global_step": 241769, "epoch": 2912} {"train_loss": -25.23353385925293, "global_step": 241770, "epoch": 2912} {"train_loss": -24.62619400024414, "global_step": 241771, "epoch": 2912} {"train_loss": -25.36209487915039, "global_step": 241772, "epoch": 2912} {"train_loss": -24.686752319335938, "global_step": 241773, "epoch": 2912} {"train_loss": -25.022960662841797, "global_step": 241774, "epoch": 2912} {"train_loss": -25.041187286376953, "global_step": 241775, "epoch": 2912} {"train_loss": -24.928258895874023, "global_step": 241776, "epoch": 2912} {"train_loss": -24.657133102416992, "global_step": 241777, "epoch": 2912} {"train_loss": -24.91061598996082, "global_step": 241778, "epoch": 2912, "val_loss": 6758503.0} {"train_loss": -24.370372772216797, "global_step": 241779, "epoch": 2913} {"train_loss": -24.50257682800293, "global_step": 241780, "epoch": 2913} {"train_loss": -24.35406494140625, "global_step": 241781, "epoch": 2913} {"train_loss": -24.282041549682617, "global_step": 241782, "epoch": 2913} {"train_loss": -24.40498161315918, "global_step": 241783, "epoch": 2913} {"train_loss": -24.344409942626953, "global_step": 241784, "epoch": 2913} {"train_loss": -24.48929786682129, "global_step": 241785, "epoch": 2913} {"train_loss": -25.271390914916992, "global_step": 241786, "epoch": 2913} {"train_loss": -25.24393081665039, "global_step": 241787, "epoch": 2913} {"train_loss": -24.264005661010742, "global_step": 241788, "epoch": 2913} {"train_loss": -24.372072219848633, "global_step": 241789, "epoch": 2913} {"train_loss": -24.67972755432129, "global_step": 241790, "epoch": 2913} {"train_loss": -24.6474666595459, "global_step": 241791, "epoch": 2913} {"train_loss": -24.43972396850586, "global_step": 241792, "epoch": 2913} {"train_loss": -24.963985443115234, "global_step": 241793, "epoch": 2913} {"train_loss": -24.77359390258789, "global_step": 241794, "epoch": 2913} {"train_loss": -24.934228897094727, "global_step": 241795, "epoch": 2913} {"train_loss": -24.664152145385742, "global_step": 241796, "epoch": 2913} {"train_loss": -24.378002166748047, "global_step": 241797, "epoch": 2913} {"train_loss": -24.912843704223633, "global_step": 241798, "epoch": 2913} {"train_loss": -24.900787353515625, "global_step": 241799, "epoch": 2913} {"train_loss": -24.692012786865234, "global_step": 241800, "epoch": 2913} {"train_loss": -25.10963249206543, "global_step": 241801, "epoch": 2913} {"train_loss": -24.46344757080078, "global_step": 241802, "epoch": 2913} {"train_loss": -24.964576721191406, "global_step": 241803, "epoch": 2913} {"train_loss": -24.6971492767334, "global_step": 241804, "epoch": 2913} {"train_loss": -24.579679489135742, "global_step": 241805, "epoch": 2913} {"train_loss": -24.514928817749023, "global_step": 241806, "epoch": 2913} {"train_loss": -24.87767791748047, "global_step": 241807, "epoch": 2913} {"train_loss": -24.64145278930664, "global_step": 241808, "epoch": 2913} {"train_loss": -24.698474884033203, "global_step": 241809, "epoch": 2913} {"train_loss": -24.629411697387695, "global_step": 241810, "epoch": 2913} {"train_loss": -24.831104278564453, "global_step": 241811, "epoch": 2913} {"train_loss": -24.51124382019043, "global_step": 241812, "epoch": 2913} {"train_loss": -24.963214874267578, "global_step": 241813, "epoch": 2913} {"train_loss": -24.67936134338379, "global_step": 241814, "epoch": 2913} {"train_loss": -24.41641616821289, "global_step": 241815, "epoch": 2913} {"train_loss": -25.065067291259766, "global_step": 241816, "epoch": 2913} {"train_loss": -25.15961265563965, "global_step": 241817, "epoch": 2913} {"train_loss": -25.017030715942383, "global_step": 241818, "epoch": 2913} {"train_loss": -24.47019386291504, "global_step": 241819, "epoch": 2913} {"train_loss": -24.959657669067383, "global_step": 241820, "epoch": 2913} {"train_loss": -24.689889907836914, "global_step": 241821, "epoch": 2913} {"train_loss": -24.955854415893555, "global_step": 241822, "epoch": 2913} {"train_loss": -24.84254264831543, "global_step": 241823, "epoch": 2913} {"train_loss": -25.030914306640625, "global_step": 241824, "epoch": 2913} {"train_loss": -25.449758529663086, "global_step": 241825, "epoch": 2913} {"train_loss": -24.662893295288086, "global_step": 241826, "epoch": 2913} {"train_loss": -25.03460693359375, "global_step": 241827, "epoch": 2913} {"train_loss": -25.11781883239746, "global_step": 241828, "epoch": 2913} {"train_loss": -24.584821701049805, "global_step": 241829, "epoch": 2913} {"train_loss": -24.825916290283203, "global_step": 241830, "epoch": 2913} {"train_loss": -24.96980094909668, "global_step": 241831, "epoch": 2913} {"train_loss": -24.864551544189453, "global_step": 241832, "epoch": 2913} {"train_loss": -24.84745216369629, "global_step": 241833, "epoch": 2913} {"train_loss": -24.809255599975586, "global_step": 241834, "epoch": 2913} {"train_loss": -24.872900009155273, "global_step": 241835, "epoch": 2913} {"train_loss": -25.124176025390625, "global_step": 241836, "epoch": 2913} {"train_loss": -24.655866622924805, "global_step": 241837, "epoch": 2913} {"train_loss": -24.809268951416016, "global_step": 241838, "epoch": 2913} {"train_loss": -24.888349533081055, "global_step": 241839, "epoch": 2913} {"train_loss": -25.024641036987305, "global_step": 241840, "epoch": 2913} {"train_loss": -24.72498893737793, "global_step": 241841, "epoch": 2913} {"train_loss": -24.7102108001709, "global_step": 241842, "epoch": 2913} {"train_loss": -24.964889526367188, "global_step": 241843, "epoch": 2913} {"train_loss": -25.071277618408203, "global_step": 241844, "epoch": 2913} {"train_loss": -25.043432235717773, "global_step": 241845, "epoch": 2913} {"train_loss": -25.055822372436523, "global_step": 241846, "epoch": 2913} {"train_loss": -25.194555282592773, "global_step": 241847, "epoch": 2913} {"train_loss": -24.849267959594727, "global_step": 241848, "epoch": 2913} {"train_loss": -24.713836669921875, "global_step": 241849, "epoch": 2913} {"train_loss": -25.027450561523438, "global_step": 241850, "epoch": 2913} {"train_loss": -25.043867111206055, "global_step": 241851, "epoch": 2913} {"train_loss": -25.19647789001465, "global_step": 241852, "epoch": 2913} {"train_loss": -24.945079803466797, "global_step": 241853, "epoch": 2913} {"train_loss": -24.862548828125, "global_step": 241854, "epoch": 2913} {"train_loss": -24.594806671142578, "global_step": 241855, "epoch": 2913} {"train_loss": -24.93400001525879, "global_step": 241856, "epoch": 2913} {"train_loss": -24.7447509765625, "global_step": 241857, "epoch": 2913} {"train_loss": -24.781108856201172, "global_step": 241858, "epoch": 2913} {"train_loss": -24.605939865112305, "global_step": 241859, "epoch": 2913} {"train_loss": -25.079086303710938, "global_step": 241860, "epoch": 2913} {"train_loss": -24.795558722622424, "global_step": 241861, "epoch": 2913, "val_loss": 6806526.0} {"train_loss": -24.741756439208984, "global_step": 241862, "epoch": 2914} {"train_loss": -23.87420082092285, "global_step": 241863, "epoch": 2914} {"train_loss": -24.458410263061523, "global_step": 241864, "epoch": 2914} {"train_loss": -24.10910987854004, "global_step": 241865, "epoch": 2914} {"train_loss": -24.370208740234375, "global_step": 241866, "epoch": 2914} {"train_loss": -24.52524757385254, "global_step": 241867, "epoch": 2914} {"train_loss": -24.680744171142578, "global_step": 241868, "epoch": 2914} {"train_loss": -24.830368041992188, "global_step": 241869, "epoch": 2914} {"train_loss": -24.5341796875, "global_step": 241870, "epoch": 2914} {"train_loss": -24.402326583862305, "global_step": 241871, "epoch": 2914} {"train_loss": -24.031469345092773, "global_step": 241872, "epoch": 2914} {"train_loss": -24.799360275268555, "global_step": 241873, "epoch": 2914} {"train_loss": -24.42475700378418, "global_step": 241874, "epoch": 2914} {"train_loss": -24.688587188720703, "global_step": 241875, "epoch": 2914} {"train_loss": -24.3149471282959, "global_step": 241876, "epoch": 2914} {"train_loss": -24.287534713745117, "global_step": 241877, "epoch": 2914} {"train_loss": -24.682010650634766, "global_step": 241878, "epoch": 2914} {"train_loss": -24.52882194519043, "global_step": 241879, "epoch": 2914} {"train_loss": -24.661531448364258, "global_step": 241880, "epoch": 2914} {"train_loss": -24.37200355529785, "global_step": 241881, "epoch": 2914} {"train_loss": -24.902246475219727, "global_step": 241882, "epoch": 2914} {"train_loss": -24.588945388793945, "global_step": 241883, "epoch": 2914} {"train_loss": -24.48618507385254, "global_step": 241884, "epoch": 2914} {"train_loss": -24.65479278564453, "global_step": 241885, "epoch": 2914} {"train_loss": -24.407896041870117, "global_step": 241886, "epoch": 2914} {"train_loss": -24.7772274017334, "global_step": 241887, "epoch": 2914} {"train_loss": -24.915800094604492, "global_step": 241888, "epoch": 2914} {"train_loss": -24.538253784179688, "global_step": 241889, "epoch": 2914} {"train_loss": -24.847171783447266, "global_step": 241890, "epoch": 2914} {"train_loss": -24.748794555664062, "global_step": 241891, "epoch": 2914} {"train_loss": -24.977827072143555, "global_step": 241892, "epoch": 2914} {"train_loss": -25.125314712524414, "global_step": 241893, "epoch": 2914} {"train_loss": -25.04707145690918, "global_step": 241894, "epoch": 2914} {"train_loss": -24.958803176879883, "global_step": 241895, "epoch": 2914} {"train_loss": -25.1896915435791, "global_step": 241896, "epoch": 2914} {"train_loss": -24.748111724853516, "global_step": 241897, "epoch": 2914} {"train_loss": -24.642858505249023, "global_step": 241898, "epoch": 2914} {"train_loss": -24.900793075561523, "global_step": 241899, "epoch": 2914} {"train_loss": -24.750904083251953, "global_step": 241900, "epoch": 2914} {"train_loss": -25.286935806274414, "global_step": 241901, "epoch": 2914} {"train_loss": -24.996423721313477, "global_step": 241902, "epoch": 2914} {"train_loss": -24.96044921875, "global_step": 241903, "epoch": 2914} {"train_loss": -25.155805587768555, "global_step": 241904, "epoch": 2914} {"train_loss": -24.796493530273438, "global_step": 241905, "epoch": 2914} {"train_loss": -24.726049423217773, "global_step": 241906, "epoch": 2914} {"train_loss": -24.927967071533203, "global_step": 241907, "epoch": 2914} {"train_loss": -25.16573143005371, "global_step": 241908, "epoch": 2914} {"train_loss": -24.949060440063477, "global_step": 241909, "epoch": 2914} {"train_loss": -25.03302574157715, "global_step": 241910, "epoch": 2914} {"train_loss": -24.965883255004883, "global_step": 241911, "epoch": 2914} {"train_loss": -24.897113800048828, "global_step": 241912, "epoch": 2914} {"train_loss": -24.849172592163086, "global_step": 241913, "epoch": 2914} {"train_loss": -24.69500160217285, "global_step": 241914, "epoch": 2914} {"train_loss": -25.066068649291992, "global_step": 241915, "epoch": 2914} {"train_loss": -25.092741012573242, "global_step": 241916, "epoch": 2914} {"train_loss": -24.489164352416992, "global_step": 241917, "epoch": 2914} {"train_loss": -24.796171188354492, "global_step": 241918, "epoch": 2914} {"train_loss": -24.748971939086914, "global_step": 241919, "epoch": 2914} {"train_loss": -24.869754791259766, "global_step": 241920, "epoch": 2914} {"train_loss": -24.870410919189453, "global_step": 241921, "epoch": 2914} {"train_loss": -24.477453231811523, "global_step": 241922, "epoch": 2914} {"train_loss": -24.914779663085938, "global_step": 241923, "epoch": 2914} {"train_loss": -25.19114112854004, "global_step": 241924, "epoch": 2914} {"train_loss": -24.600194931030273, "global_step": 241925, "epoch": 2914} {"train_loss": -24.9711856842041, "global_step": 241926, "epoch": 2914} {"train_loss": -24.813398361206055, "global_step": 241927, "epoch": 2914} {"train_loss": -24.954837799072266, "global_step": 241928, "epoch": 2914} {"train_loss": -25.192901611328125, "global_step": 241929, "epoch": 2914} {"train_loss": -25.164880752563477, "global_step": 241930, "epoch": 2914} {"train_loss": -24.923734664916992, "global_step": 241931, "epoch": 2914} {"train_loss": -24.812610626220703, "global_step": 241932, "epoch": 2914} {"train_loss": -24.867511749267578, "global_step": 241933, "epoch": 2914} {"train_loss": -25.008888244628906, "global_step": 241934, "epoch": 2914} {"train_loss": -24.968311309814453, "global_step": 241935, "epoch": 2914} {"train_loss": -24.88039207458496, "global_step": 241936, "epoch": 2914} {"train_loss": -25.45549964904785, "global_step": 241937, "epoch": 2914} {"train_loss": -25.059436798095703, "global_step": 241938, "epoch": 2914} {"train_loss": -24.66350555419922, "global_step": 241939, "epoch": 2914} {"train_loss": -24.80323600769043, "global_step": 241940, "epoch": 2914} {"train_loss": -25.111474990844727, "global_step": 241941, "epoch": 2914} {"train_loss": -25.006101608276367, "global_step": 241942, "epoch": 2914} {"train_loss": -24.87166404724121, "global_step": 241943, "epoch": 2914} {"train_loss": -24.795439111181054, "global_step": 241944, "epoch": 2914, "val_loss": 6686659.0} {"train_loss": -22.259662628173828, "global_step": 241945, "epoch": 2915} {"train_loss": -20.87628173828125, "global_step": 241946, "epoch": 2915} {"train_loss": -23.60920524597168, "global_step": 241947, "epoch": 2915} {"train_loss": -23.914396286010742, "global_step": 241948, "epoch": 2915} {"train_loss": -23.413312911987305, "global_step": 241949, "epoch": 2915} {"train_loss": -23.698150634765625, "global_step": 241950, "epoch": 2915} {"train_loss": -24.227842330932617, "global_step": 241951, "epoch": 2915} {"train_loss": -23.499483108520508, "global_step": 241952, "epoch": 2915} {"train_loss": -23.73587989807129, "global_step": 241953, "epoch": 2915} {"train_loss": -24.25678825378418, "global_step": 241954, "epoch": 2915} {"train_loss": -23.866867065429688, "global_step": 241955, "epoch": 2915} {"train_loss": -23.66901969909668, "global_step": 241956, "epoch": 2915} {"train_loss": -24.258342742919922, "global_step": 241957, "epoch": 2915} {"train_loss": -24.42484474182129, "global_step": 241958, "epoch": 2915} {"train_loss": -23.800525665283203, "global_step": 241959, "epoch": 2915} {"train_loss": -23.8383846282959, "global_step": 241960, "epoch": 2915} {"train_loss": -24.331153869628906, "global_step": 241961, "epoch": 2915} {"train_loss": -24.30133628845215, "global_step": 241962, "epoch": 2915} {"train_loss": -24.423269271850586, "global_step": 241963, "epoch": 2915} {"train_loss": -24.336856842041016, "global_step": 241964, "epoch": 2915} {"train_loss": -24.03152847290039, "global_step": 241965, "epoch": 2915} {"train_loss": -24.624116897583008, "global_step": 241966, "epoch": 2915} {"train_loss": -24.31369400024414, "global_step": 241967, "epoch": 2915} {"train_loss": -24.786178588867188, "global_step": 241968, "epoch": 2915} {"train_loss": -24.471139907836914, "global_step": 241969, "epoch": 2915} {"train_loss": -24.2053279876709, "global_step": 241970, "epoch": 2915} {"train_loss": -24.67237091064453, "global_step": 241971, "epoch": 2915} {"train_loss": -24.273643493652344, "global_step": 241972, "epoch": 2915} {"train_loss": -24.738855361938477, "global_step": 241973, "epoch": 2915} {"train_loss": -24.729291915893555, "global_step": 241974, "epoch": 2915} {"train_loss": -24.756696701049805, "global_step": 241975, "epoch": 2915} {"train_loss": -24.927640914916992, "global_step": 241976, "epoch": 2915} {"train_loss": -24.632831573486328, "global_step": 241977, "epoch": 2915} {"train_loss": -25.051565170288086, "global_step": 241978, "epoch": 2915} {"train_loss": -24.588396072387695, "global_step": 241979, "epoch": 2915} {"train_loss": -24.824703216552734, "global_step": 241980, "epoch": 2915} {"train_loss": -24.431304931640625, "global_step": 241981, "epoch": 2915} {"train_loss": -24.61869239807129, "global_step": 241982, "epoch": 2915} {"train_loss": -24.84206199645996, "global_step": 241983, "epoch": 2915} {"train_loss": -24.50678062438965, "global_step": 241984, "epoch": 2915} {"train_loss": -24.929340362548828, "global_step": 241985, "epoch": 2915} {"train_loss": -24.783584594726562, "global_step": 241986, "epoch": 2915} {"train_loss": -24.437414169311523, "global_step": 241987, "epoch": 2915} {"train_loss": -24.832056045532227, "global_step": 241988, "epoch": 2915} {"train_loss": -24.849828720092773, "global_step": 241989, "epoch": 2915} {"train_loss": -24.46364402770996, "global_step": 241990, "epoch": 2915} {"train_loss": -24.92344093322754, "global_step": 241991, "epoch": 2915} {"train_loss": -24.782262802124023, "global_step": 241992, "epoch": 2915} {"train_loss": -25.089462280273438, "global_step": 241993, "epoch": 2915} {"train_loss": -24.725101470947266, "global_step": 241994, "epoch": 2915} {"train_loss": -25.198720932006836, "global_step": 241995, "epoch": 2915} {"train_loss": -24.92669105529785, "global_step": 241996, "epoch": 2915} {"train_loss": -24.701623916625977, "global_step": 241997, "epoch": 2915} {"train_loss": -25.214784622192383, "global_step": 241998, "epoch": 2915} {"train_loss": -25.068540573120117, "global_step": 241999, "epoch": 2915} {"train_loss": -24.786893844604492, "global_step": 242000, "epoch": 2915} {"train_loss": -24.662277221679688, "global_step": 242001, "epoch": 2915} {"train_loss": -25.074758529663086, "global_step": 242002, "epoch": 2915} {"train_loss": -25.415481567382812, "global_step": 242003, "epoch": 2915} {"train_loss": -25.042646408081055, "global_step": 242004, "epoch": 2915} {"train_loss": -24.960901260375977, "global_step": 242005, "epoch": 2915} {"train_loss": -24.99692153930664, "global_step": 242006, "epoch": 2915} {"train_loss": -24.67763328552246, "global_step": 242007, "epoch": 2915} {"train_loss": -24.693750381469727, "global_step": 242008, "epoch": 2915} {"train_loss": -25.015512466430664, "global_step": 242009, "epoch": 2915} {"train_loss": -25.118446350097656, "global_step": 242010, "epoch": 2915} {"train_loss": -24.799829483032227, "global_step": 242011, "epoch": 2915} {"train_loss": -24.95172119140625, "global_step": 242012, "epoch": 2915} {"train_loss": -25.064828872680664, "global_step": 242013, "epoch": 2915} {"train_loss": -25.071958541870117, "global_step": 242014, "epoch": 2915} {"train_loss": -24.933340072631836, "global_step": 242015, "epoch": 2915} {"train_loss": -24.8482666015625, "global_step": 242016, "epoch": 2915} {"train_loss": -24.92569923400879, "global_step": 242017, "epoch": 2915} {"train_loss": -24.7613468170166, "global_step": 242018, "epoch": 2915} {"train_loss": -24.93798828125, "global_step": 242019, "epoch": 2915} {"train_loss": -24.702255249023438, "global_step": 242020, "epoch": 2915} {"train_loss": -24.92877769470215, "global_step": 242021, "epoch": 2915} {"train_loss": -24.983888626098633, "global_step": 242022, "epoch": 2915} {"train_loss": -25.168880462646484, "global_step": 242023, "epoch": 2915} {"train_loss": -24.7874755859375, "global_step": 242024, "epoch": 2915} {"train_loss": -25.110260009765625, "global_step": 242025, "epoch": 2915} {"train_loss": -25.035688400268555, "global_step": 242026, "epoch": 2915} {"train_loss": -24.565098911882885, "global_step": 242027, "epoch": 2915, "val_loss": 6731657.0} {"train_loss": -23.812963485717773, "global_step": 242028, "epoch": 2916} {"train_loss": -22.559404373168945, "global_step": 242029, "epoch": 2916} {"train_loss": -23.26594352722168, "global_step": 242030, "epoch": 2916} {"train_loss": -24.589025497436523, "global_step": 242031, "epoch": 2916} {"train_loss": -24.25452995300293, "global_step": 242032, "epoch": 2916} {"train_loss": -24.143505096435547, "global_step": 242033, "epoch": 2916} {"train_loss": -24.28933334350586, "global_step": 242034, "epoch": 2916} {"train_loss": -23.69068145751953, "global_step": 242035, "epoch": 2916} {"train_loss": -24.356599807739258, "global_step": 242036, "epoch": 2916} {"train_loss": -24.15097427368164, "global_step": 242037, "epoch": 2916} {"train_loss": -24.20907974243164, "global_step": 242038, "epoch": 2916} {"train_loss": -24.23185157775879, "global_step": 242039, "epoch": 2916} {"train_loss": -24.702985763549805, "global_step": 242040, "epoch": 2916} {"train_loss": -23.983230590820312, "global_step": 242041, "epoch": 2916} {"train_loss": -24.43228530883789, "global_step": 242042, "epoch": 2916} {"train_loss": -24.659439086914062, "global_step": 242043, "epoch": 2916} {"train_loss": -24.401941299438477, "global_step": 242044, "epoch": 2916} {"train_loss": -24.972763061523438, "global_step": 242045, "epoch": 2916} {"train_loss": -24.3964786529541, "global_step": 242046, "epoch": 2916} {"train_loss": -24.64223289489746, "global_step": 242047, "epoch": 2916} {"train_loss": -24.745512008666992, "global_step": 242048, "epoch": 2916} {"train_loss": -24.990636825561523, "global_step": 242049, "epoch": 2916} {"train_loss": -24.680639266967773, "global_step": 242050, "epoch": 2916} {"train_loss": -24.616146087646484, "global_step": 242051, "epoch": 2916} {"train_loss": -24.758268356323242, "global_step": 242052, "epoch": 2916} {"train_loss": -24.753583908081055, "global_step": 242053, "epoch": 2916} {"train_loss": -24.68889617919922, "global_step": 242054, "epoch": 2916} {"train_loss": -24.69801139831543, "global_step": 242055, "epoch": 2916} {"train_loss": -24.733047485351562, "global_step": 242056, "epoch": 2916} {"train_loss": -24.747180938720703, "global_step": 242057, "epoch": 2916} {"train_loss": -24.687166213989258, "global_step": 242058, "epoch": 2916} {"train_loss": -24.689401626586914, "global_step": 242059, "epoch": 2916} {"train_loss": -24.861682891845703, "global_step": 242060, "epoch": 2916} {"train_loss": -24.939666748046875, "global_step": 242061, "epoch": 2916} {"train_loss": -24.842981338500977, "global_step": 242062, "epoch": 2916} {"train_loss": -25.07777976989746, "global_step": 242063, "epoch": 2916} {"train_loss": -24.668411254882812, "global_step": 242064, "epoch": 2916} {"train_loss": -24.866222381591797, "global_step": 242065, "epoch": 2916} {"train_loss": -24.832029342651367, "global_step": 242066, "epoch": 2916} {"train_loss": -25.28679084777832, "global_step": 242067, "epoch": 2916} {"train_loss": -24.611970901489258, "global_step": 242068, "epoch": 2916} {"train_loss": -25.046417236328125, "global_step": 242069, "epoch": 2916} {"train_loss": -24.809572219848633, "global_step": 242070, "epoch": 2916} {"train_loss": -25.136178970336914, "global_step": 242071, "epoch": 2916} {"train_loss": -25.013254165649414, "global_step": 242072, "epoch": 2916} {"train_loss": -25.112056732177734, "global_step": 242073, "epoch": 2916} {"train_loss": -24.636356353759766, "global_step": 242074, "epoch": 2916} {"train_loss": -24.969627380371094, "global_step": 242075, "epoch": 2916} {"train_loss": -25.017322540283203, "global_step": 242076, "epoch": 2916} {"train_loss": -24.906639099121094, "global_step": 242077, "epoch": 2916} {"train_loss": -25.152036666870117, "global_step": 242078, "epoch": 2916} {"train_loss": -25.203580856323242, "global_step": 242079, "epoch": 2916} {"train_loss": -24.924137115478516, "global_step": 242080, "epoch": 2916} {"train_loss": -25.0648193359375, "global_step": 242081, "epoch": 2916} {"train_loss": -24.959915161132812, "global_step": 242082, "epoch": 2916} {"train_loss": -25.124906539916992, "global_step": 242083, "epoch": 2916} {"train_loss": -24.870283126831055, "global_step": 242084, "epoch": 2916} {"train_loss": -25.142141342163086, "global_step": 242085, "epoch": 2916} {"train_loss": -24.965181350708008, "global_step": 242086, "epoch": 2916} {"train_loss": -24.79580307006836, "global_step": 242087, "epoch": 2916} {"train_loss": -24.843482971191406, "global_step": 242088, "epoch": 2916} {"train_loss": -24.8198299407959, "global_step": 242089, "epoch": 2916} {"train_loss": -25.094697952270508, "global_step": 242090, "epoch": 2916} {"train_loss": -24.78987693786621, "global_step": 242091, "epoch": 2916} {"train_loss": -24.73328971862793, "global_step": 242092, "epoch": 2916} {"train_loss": -24.66838264465332, "global_step": 242093, "epoch": 2916} {"train_loss": -25.072359085083008, "global_step": 242094, "epoch": 2916} {"train_loss": -24.966209411621094, "global_step": 242095, "epoch": 2916} {"train_loss": -25.0787410736084, "global_step": 242096, "epoch": 2916} {"train_loss": -25.156890869140625, "global_step": 242097, "epoch": 2916} {"train_loss": -24.826738357543945, "global_step": 242098, "epoch": 2916} {"train_loss": -24.781620025634766, "global_step": 242099, "epoch": 2916} {"train_loss": -24.6993408203125, "global_step": 242100, "epoch": 2916} {"train_loss": -25.24658203125, "global_step": 242101, "epoch": 2916} {"train_loss": -24.823110580444336, "global_step": 242102, "epoch": 2916} {"train_loss": -25.224714279174805, "global_step": 242103, "epoch": 2916} {"train_loss": -25.207687377929688, "global_step": 242104, "epoch": 2916} {"train_loss": -24.675832748413086, "global_step": 242105, "epoch": 2916} {"train_loss": -25.339618682861328, "global_step": 242106, "epoch": 2916} {"train_loss": -24.909208297729492, "global_step": 242107, "epoch": 2916} {"train_loss": -25.12299156188965, "global_step": 242108, "epoch": 2916} {"train_loss": -24.837926864624023, "global_step": 242109, "epoch": 2916} {"train_loss": -24.736901317734315, "global_step": 242110, "epoch": 2916, "val_loss": 6783395.0} {"train_loss": -23.770828247070312, "global_step": 242111, "epoch": 2917} {"train_loss": -23.939966201782227, "global_step": 242112, "epoch": 2917} {"train_loss": -24.479623794555664, "global_step": 242113, "epoch": 2917} {"train_loss": -23.790647506713867, "global_step": 242114, "epoch": 2917} {"train_loss": -23.956485748291016, "global_step": 242115, "epoch": 2917} {"train_loss": -23.93440055847168, "global_step": 242116, "epoch": 2917} {"train_loss": -24.50996971130371, "global_step": 242117, "epoch": 2917} {"train_loss": -23.8277645111084, "global_step": 242118, "epoch": 2917} {"train_loss": -24.46489906311035, "global_step": 242119, "epoch": 2917} {"train_loss": -24.35401725769043, "global_step": 242120, "epoch": 2917} {"train_loss": -24.602842330932617, "global_step": 242121, "epoch": 2917} {"train_loss": -24.254898071289062, "global_step": 242122, "epoch": 2917} {"train_loss": -24.6074275970459, "global_step": 242123, "epoch": 2917} {"train_loss": -24.36296272277832, "global_step": 242124, "epoch": 2917} {"train_loss": -24.316984176635742, "global_step": 242125, "epoch": 2917} {"train_loss": -24.835952758789062, "global_step": 242126, "epoch": 2917} {"train_loss": -24.574634552001953, "global_step": 242127, "epoch": 2917} {"train_loss": -24.310823440551758, "global_step": 242128, "epoch": 2917} {"train_loss": -24.810016632080078, "global_step": 242129, "epoch": 2917} {"train_loss": -24.742727279663086, "global_step": 242130, "epoch": 2917} {"train_loss": -24.91440773010254, "global_step": 242131, "epoch": 2917} {"train_loss": -24.299129486083984, "global_step": 242132, "epoch": 2917} {"train_loss": -24.91585350036621, "global_step": 242133, "epoch": 2917} {"train_loss": -24.696271896362305, "global_step": 242134, "epoch": 2917} {"train_loss": -24.9379825592041, "global_step": 242135, "epoch": 2917} {"train_loss": -24.759225845336914, "global_step": 242136, "epoch": 2917} {"train_loss": -25.005292892456055, "global_step": 242137, "epoch": 2917} {"train_loss": -24.99225425720215, "global_step": 242138, "epoch": 2917} {"train_loss": -24.856399536132812, "global_step": 242139, "epoch": 2917} {"train_loss": -24.57309913635254, "global_step": 242140, "epoch": 2917} {"train_loss": -24.764020919799805, "global_step": 242141, "epoch": 2917} {"train_loss": -24.98773193359375, "global_step": 242142, "epoch": 2917} {"train_loss": -24.94161033630371, "global_step": 242143, "epoch": 2917} {"train_loss": -24.735525131225586, "global_step": 242144, "epoch": 2917} {"train_loss": -24.63935661315918, "global_step": 242145, "epoch": 2917} {"train_loss": -24.798246383666992, "global_step": 242146, "epoch": 2917} {"train_loss": -25.124359130859375, "global_step": 242147, "epoch": 2917} {"train_loss": -25.2767391204834, "global_step": 242148, "epoch": 2917} {"train_loss": -25.143768310546875, "global_step": 242149, "epoch": 2917} {"train_loss": -25.19129753112793, "global_step": 242150, "epoch": 2917} {"train_loss": -24.800037384033203, "global_step": 242151, "epoch": 2917} {"train_loss": -25.122211456298828, "global_step": 242152, "epoch": 2917} {"train_loss": -24.983957290649414, "global_step": 242153, "epoch": 2917} {"train_loss": -25.03772735595703, "global_step": 242154, "epoch": 2917} {"train_loss": -24.854896545410156, "global_step": 242155, "epoch": 2917} {"train_loss": -25.070398330688477, "global_step": 242156, "epoch": 2917} {"train_loss": -25.05011749267578, "global_step": 242157, "epoch": 2917} {"train_loss": -24.89303970336914, "global_step": 242158, "epoch": 2917} {"train_loss": -24.778120040893555, "global_step": 242159, "epoch": 2917} {"train_loss": -25.221332550048828, "global_step": 242160, "epoch": 2917} {"train_loss": -25.041603088378906, "global_step": 242161, "epoch": 2917} {"train_loss": -25.116605758666992, "global_step": 242162, "epoch": 2917} {"train_loss": -25.432268142700195, "global_step": 242163, "epoch": 2917} {"train_loss": -25.12773323059082, "global_step": 242164, "epoch": 2917} {"train_loss": -25.05428123474121, "global_step": 242165, "epoch": 2917} {"train_loss": -25.069242477416992, "global_step": 242166, "epoch": 2917} {"train_loss": -24.8573055267334, "global_step": 242167, "epoch": 2917} {"train_loss": -25.0116024017334, "global_step": 242168, "epoch": 2917} {"train_loss": -24.98280906677246, "global_step": 242169, "epoch": 2917} {"train_loss": -25.12275505065918, "global_step": 242170, "epoch": 2917} {"train_loss": -25.346044540405273, "global_step": 242171, "epoch": 2917} {"train_loss": -24.70499610900879, "global_step": 242172, "epoch": 2917} {"train_loss": -25.00473976135254, "global_step": 242173, "epoch": 2917} {"train_loss": -24.97925567626953, "global_step": 242174, "epoch": 2917} {"train_loss": -24.869115829467773, "global_step": 242175, "epoch": 2917} {"train_loss": -24.88794708251953, "global_step": 242176, "epoch": 2917} {"train_loss": -24.68897819519043, "global_step": 242177, "epoch": 2917} {"train_loss": -24.705841064453125, "global_step": 242178, "epoch": 2917} {"train_loss": -24.462997436523438, "global_step": 242179, "epoch": 2917} {"train_loss": -24.652950286865234, "global_step": 242180, "epoch": 2917} {"train_loss": -25.128402709960938, "global_step": 242181, "epoch": 2917} {"train_loss": -24.81673240661621, "global_step": 242182, "epoch": 2917} {"train_loss": -24.17113494873047, "global_step": 242183, "epoch": 2917} {"train_loss": -24.816850662231445, "global_step": 242184, "epoch": 2917} {"train_loss": -24.616085052490234, "global_step": 242185, "epoch": 2917} {"train_loss": -24.800390243530273, "global_step": 242186, "epoch": 2917} {"train_loss": -24.964969635009766, "global_step": 242187, "epoch": 2917} {"train_loss": -24.933382034301758, "global_step": 242188, "epoch": 2917} {"train_loss": -25.03314208984375, "global_step": 242189, "epoch": 2917} {"train_loss": -24.702917098999023, "global_step": 242190, "epoch": 2917} {"train_loss": -24.549062728881836, "global_step": 242191, "epoch": 2917} {"train_loss": -24.754114151000977, "global_step": 242192, "epoch": 2917} {"train_loss": -24.741812028080584, "global_step": 242193, "epoch": 2917, "val_loss": 6903427.0} {"train_loss": -24.53205680847168, "global_step": 242194, "epoch": 2918} {"train_loss": -24.76842498779297, "global_step": 242195, "epoch": 2918} {"train_loss": -24.76287078857422, "global_step": 242196, "epoch": 2918} {"train_loss": -24.852523803710938, "global_step": 242197, "epoch": 2918} {"train_loss": -24.4954891204834, "global_step": 242198, "epoch": 2918} {"train_loss": -24.772663116455078, "global_step": 242199, "epoch": 2918} {"train_loss": -24.313800811767578, "global_step": 242200, "epoch": 2918} {"train_loss": -24.872013092041016, "global_step": 242201, "epoch": 2918} {"train_loss": -24.780454635620117, "global_step": 242202, "epoch": 2918} {"train_loss": -24.853469848632812, "global_step": 242203, "epoch": 2918} {"train_loss": -24.286096572875977, "global_step": 242204, "epoch": 2918} {"train_loss": -24.833969116210938, "global_step": 242205, "epoch": 2918} {"train_loss": -24.579166412353516, "global_step": 242206, "epoch": 2918} {"train_loss": -24.730947494506836, "global_step": 242207, "epoch": 2918} {"train_loss": -24.599502563476562, "global_step": 242208, "epoch": 2918} {"train_loss": -25.127246856689453, "global_step": 242209, "epoch": 2918} {"train_loss": -24.769058227539062, "global_step": 242210, "epoch": 2918} {"train_loss": -25.19729995727539, "global_step": 242211, "epoch": 2918} {"train_loss": -25.443492889404297, "global_step": 242212, "epoch": 2918} {"train_loss": -25.189130783081055, "global_step": 242213, "epoch": 2918} {"train_loss": -25.058317184448242, "global_step": 242214, "epoch": 2918} {"train_loss": -25.039825439453125, "global_step": 242215, "epoch": 2918} {"train_loss": -24.791746139526367, "global_step": 242216, "epoch": 2918} {"train_loss": -24.67331886291504, "global_step": 242217, "epoch": 2918} {"train_loss": -25.34847068786621, "global_step": 242218, "epoch": 2918} {"train_loss": -25.058473587036133, "global_step": 242219, "epoch": 2918} {"train_loss": -25.092145919799805, "global_step": 242220, "epoch": 2918} {"train_loss": -24.83699607849121, "global_step": 242221, "epoch": 2918} {"train_loss": -24.801578521728516, "global_step": 242222, "epoch": 2918} {"train_loss": -24.545568466186523, "global_step": 242223, "epoch": 2918} {"train_loss": -24.854633331298828, "global_step": 242224, "epoch": 2918} {"train_loss": -25.38741111755371, "global_step": 242225, "epoch": 2918} {"train_loss": -24.731718063354492, "global_step": 242226, "epoch": 2918} {"train_loss": -24.64012336730957, "global_step": 242227, "epoch": 2918} {"train_loss": -24.88996696472168, "global_step": 242228, "epoch": 2918} {"train_loss": -25.372251510620117, "global_step": 242229, "epoch": 2918} {"train_loss": -24.648719787597656, "global_step": 242230, "epoch": 2918} {"train_loss": -24.760501861572266, "global_step": 242231, "epoch": 2918} {"train_loss": -25.01130485534668, "global_step": 242232, "epoch": 2918} {"train_loss": -24.841978073120117, "global_step": 242233, "epoch": 2918} {"train_loss": -24.534149169921875, "global_step": 242234, "epoch": 2918} {"train_loss": -25.00309181213379, "global_step": 242235, "epoch": 2918} {"train_loss": -24.520503997802734, "global_step": 242236, "epoch": 2918} {"train_loss": -24.6018123626709, "global_step": 242237, "epoch": 2918} {"train_loss": -24.898788452148438, "global_step": 242238, "epoch": 2918} {"train_loss": -25.10578727722168, "global_step": 242239, "epoch": 2918} {"train_loss": -24.907670974731445, "global_step": 242240, "epoch": 2918} {"train_loss": -25.168704986572266, "global_step": 242241, "epoch": 2918} {"train_loss": -24.78097915649414, "global_step": 242242, "epoch": 2918} {"train_loss": -24.66023826599121, "global_step": 242243, "epoch": 2918} {"train_loss": -24.72586441040039, "global_step": 242244, "epoch": 2918} {"train_loss": -24.828001022338867, "global_step": 242245, "epoch": 2918} {"train_loss": -25.131925582885742, "global_step": 242246, "epoch": 2918} {"train_loss": -24.59407615661621, "global_step": 242247, "epoch": 2918} {"train_loss": -24.829742431640625, "global_step": 242248, "epoch": 2918} {"train_loss": -24.813024520874023, "global_step": 242249, "epoch": 2918} {"train_loss": -24.945154190063477, "global_step": 242250, "epoch": 2918} {"train_loss": -24.79854393005371, "global_step": 242251, "epoch": 2918} {"train_loss": -25.12686538696289, "global_step": 242252, "epoch": 2918} {"train_loss": -24.78119468688965, "global_step": 242253, "epoch": 2918} {"train_loss": -25.196964263916016, "global_step": 242254, "epoch": 2918} {"train_loss": -25.027664184570312, "global_step": 242255, "epoch": 2918} {"train_loss": -25.080768585205078, "global_step": 242256, "epoch": 2918} {"train_loss": -24.35127830505371, "global_step": 242257, "epoch": 2918} {"train_loss": -24.769269943237305, "global_step": 242258, "epoch": 2918} {"train_loss": -24.888980865478516, "global_step": 242259, "epoch": 2918} {"train_loss": -25.091176986694336, "global_step": 242260, "epoch": 2918} {"train_loss": -24.9714412689209, "global_step": 242261, "epoch": 2918} {"train_loss": -24.71192741394043, "global_step": 242262, "epoch": 2918} {"train_loss": -24.737062454223633, "global_step": 242263, "epoch": 2918} {"train_loss": -25.268564224243164, "global_step": 242264, "epoch": 2918} {"train_loss": -24.906055450439453, "global_step": 242265, "epoch": 2918} {"train_loss": -25.33400535583496, "global_step": 242266, "epoch": 2918} {"train_loss": -24.482450485229492, "global_step": 242267, "epoch": 2918} {"train_loss": -25.090621948242188, "global_step": 242268, "epoch": 2918} {"train_loss": -24.719881057739258, "global_step": 242269, "epoch": 2918} {"train_loss": -24.747835159301758, "global_step": 242270, "epoch": 2918} {"train_loss": -24.754497528076172, "global_step": 242271, "epoch": 2918} {"train_loss": -25.255475997924805, "global_step": 242272, "epoch": 2918} {"train_loss": -24.908071517944336, "global_step": 242273, "epoch": 2918} {"train_loss": -25.172231674194336, "global_step": 242274, "epoch": 2918} {"train_loss": -24.96388816833496, "global_step": 242275, "epoch": 2918} {"train_loss": -24.86129707887948, "global_step": 242276, "epoch": 2918, "val_loss": 6870326.0} {"train_loss": -24.105093002319336, "global_step": 242277, "epoch": 2919} {"train_loss": -24.05963134765625, "global_step": 242278, "epoch": 2919} {"train_loss": -24.687063217163086, "global_step": 242279, "epoch": 2919} {"train_loss": -24.774614334106445, "global_step": 242280, "epoch": 2919} {"train_loss": -24.563940048217773, "global_step": 242281, "epoch": 2919} {"train_loss": -24.61850929260254, "global_step": 242282, "epoch": 2919} {"train_loss": -24.68756675720215, "global_step": 242283, "epoch": 2919} {"train_loss": -24.690282821655273, "global_step": 242284, "epoch": 2919} {"train_loss": -24.323856353759766, "global_step": 242285, "epoch": 2919} {"train_loss": -24.42945671081543, "global_step": 242286, "epoch": 2919} {"train_loss": -24.763906478881836, "global_step": 242287, "epoch": 2919} {"train_loss": -24.766016006469727, "global_step": 242288, "epoch": 2919} {"train_loss": -24.56020164489746, "global_step": 242289, "epoch": 2919} {"train_loss": -24.825214385986328, "global_step": 242290, "epoch": 2919} {"train_loss": -24.747976303100586, "global_step": 242291, "epoch": 2919} {"train_loss": -24.646825790405273, "global_step": 242292, "epoch": 2919} {"train_loss": -24.768613815307617, "global_step": 242293, "epoch": 2919} {"train_loss": -24.639806747436523, "global_step": 242294, "epoch": 2919} {"train_loss": -24.84082794189453, "global_step": 242295, "epoch": 2919} {"train_loss": -25.1345272064209, "global_step": 242296, "epoch": 2919} {"train_loss": -24.932331085205078, "global_step": 242297, "epoch": 2919} {"train_loss": -24.54813003540039, "global_step": 242298, "epoch": 2919} {"train_loss": -24.94038963317871, "global_step": 242299, "epoch": 2919} {"train_loss": -24.46003532409668, "global_step": 242300, "epoch": 2919} {"train_loss": -24.881746292114258, "global_step": 242301, "epoch": 2919} {"train_loss": -25.06501007080078, "global_step": 242302, "epoch": 2919} {"train_loss": -24.787683486938477, "global_step": 242303, "epoch": 2919} {"train_loss": -24.40679168701172, "global_step": 242304, "epoch": 2919} {"train_loss": -25.10125732421875, "global_step": 242305, "epoch": 2919} {"train_loss": -24.856679916381836, "global_step": 242306, "epoch": 2919} {"train_loss": -24.870607376098633, "global_step": 242307, "epoch": 2919} {"train_loss": -24.6428279876709, "global_step": 242308, "epoch": 2919} {"train_loss": -25.130069732666016, "global_step": 242309, "epoch": 2919} {"train_loss": -25.236968994140625, "global_step": 242310, "epoch": 2919} {"train_loss": -25.23838233947754, "global_step": 242311, "epoch": 2919} {"train_loss": -25.324939727783203, "global_step": 242312, "epoch": 2919} {"train_loss": -25.07456398010254, "global_step": 242313, "epoch": 2919} {"train_loss": -25.111801147460938, "global_step": 242314, "epoch": 2919} {"train_loss": -24.967792510986328, "global_step": 242315, "epoch": 2919} {"train_loss": -25.19385528564453, "global_step": 242316, "epoch": 2919} {"train_loss": -24.915843963623047, "global_step": 242317, "epoch": 2919} {"train_loss": -24.90778350830078, "global_step": 242318, "epoch": 2919} {"train_loss": -25.060171127319336, "global_step": 242319, "epoch": 2919} {"train_loss": -25.043943405151367, "global_step": 242320, "epoch": 2919} {"train_loss": -24.902387619018555, "global_step": 242321, "epoch": 2919} {"train_loss": -25.322050094604492, "global_step": 242322, "epoch": 2919} {"train_loss": -25.26741600036621, "global_step": 242323, "epoch": 2919} {"train_loss": -24.944725036621094, "global_step": 242324, "epoch": 2919} {"train_loss": -25.514280319213867, "global_step": 242325, "epoch": 2919} {"train_loss": -25.10979652404785, "global_step": 242326, "epoch": 2919} {"train_loss": -25.3021297454834, "global_step": 242327, "epoch": 2919} {"train_loss": -25.02722930908203, "global_step": 242328, "epoch": 2919} {"train_loss": -24.94158935546875, "global_step": 242329, "epoch": 2919} {"train_loss": -24.69658851623535, "global_step": 242330, "epoch": 2919} {"train_loss": -24.78511619567871, "global_step": 242331, "epoch": 2919} {"train_loss": -24.947607040405273, "global_step": 242332, "epoch": 2919} {"train_loss": -25.087329864501953, "global_step": 242333, "epoch": 2919} {"train_loss": -24.83247947692871, "global_step": 242334, "epoch": 2919} {"train_loss": -25.264822006225586, "global_step": 242335, "epoch": 2919} {"train_loss": -24.753856658935547, "global_step": 242336, "epoch": 2919} {"train_loss": -24.66575050354004, "global_step": 242337, "epoch": 2919} {"train_loss": -25.382863998413086, "global_step": 242338, "epoch": 2919} {"train_loss": -24.544490814208984, "global_step": 242339, "epoch": 2919} {"train_loss": -24.807178497314453, "global_step": 242340, "epoch": 2919} {"train_loss": -24.678380966186523, "global_step": 242341, "epoch": 2919} {"train_loss": -24.78937339782715, "global_step": 242342, "epoch": 2919} {"train_loss": -24.8184814453125, "global_step": 242343, "epoch": 2919} {"train_loss": -24.399738311767578, "global_step": 242344, "epoch": 2919} {"train_loss": -25.02402687072754, "global_step": 242345, "epoch": 2919} {"train_loss": -25.56122589111328, "global_step": 242346, "epoch": 2919} {"train_loss": -24.929113388061523, "global_step": 242347, "epoch": 2919} {"train_loss": -25.252206802368164, "global_step": 242348, "epoch": 2919} {"train_loss": -24.983808517456055, "global_step": 242349, "epoch": 2919} {"train_loss": -25.034420013427734, "global_step": 242350, "epoch": 2919} {"train_loss": -25.23591423034668, "global_step": 242351, "epoch": 2919} {"train_loss": -25.330352783203125, "global_step": 242352, "epoch": 2919} {"train_loss": -25.020292282104492, "global_step": 242353, "epoch": 2919} {"train_loss": -25.109634399414062, "global_step": 242354, "epoch": 2919} {"train_loss": -25.041757583618164, "global_step": 242355, "epoch": 2919} {"train_loss": -25.033782958984375, "global_step": 242356, "epoch": 2919} {"train_loss": -24.85684585571289, "global_step": 242357, "epoch": 2919} {"train_loss": -24.83701515197754, "global_step": 242358, "epoch": 2919} {"train_loss": -24.904425563582453, "global_step": 242359, "epoch": 2919, "val_loss": 6856722.5} {"train_loss": -24.856754302978516, "global_step": 242360, "epoch": 2920} {"train_loss": -24.470413208007812, "global_step": 242361, "epoch": 2920} {"train_loss": -24.737462997436523, "global_step": 242362, "epoch": 2920} {"train_loss": -24.469480514526367, "global_step": 242363, "epoch": 2920} {"train_loss": -25.10077667236328, "global_step": 242364, "epoch": 2920} {"train_loss": -24.18614959716797, "global_step": 242365, "epoch": 2920} {"train_loss": -23.599014282226562, "global_step": 242366, "epoch": 2920} {"train_loss": -24.347135543823242, "global_step": 242367, "epoch": 2920} {"train_loss": -24.183908462524414, "global_step": 242368, "epoch": 2920} {"train_loss": -24.77786636352539, "global_step": 242369, "epoch": 2920} {"train_loss": -24.51840591430664, "global_step": 242370, "epoch": 2920} {"train_loss": -24.6995849609375, "global_step": 242371, "epoch": 2920} {"train_loss": -24.74989891052246, "global_step": 242372, "epoch": 2920} {"train_loss": -24.603681564331055, "global_step": 242373, "epoch": 2920} {"train_loss": -24.69409942626953, "global_step": 242374, "epoch": 2920} {"train_loss": -25.02255630493164, "global_step": 242375, "epoch": 2920} {"train_loss": -24.62891960144043, "global_step": 242376, "epoch": 2920} {"train_loss": -24.64704704284668, "global_step": 242377, "epoch": 2920} {"train_loss": -25.02467918395996, "global_step": 242378, "epoch": 2920} {"train_loss": -24.951519012451172, "global_step": 242379, "epoch": 2920} {"train_loss": -24.588274002075195, "global_step": 242380, "epoch": 2920} {"train_loss": -25.02744483947754, "global_step": 242381, "epoch": 2920} {"train_loss": -24.573074340820312, "global_step": 242382, "epoch": 2920} {"train_loss": -24.975650787353516, "global_step": 242383, "epoch": 2920} {"train_loss": -24.726490020751953, "global_step": 242384, "epoch": 2920} {"train_loss": -24.572160720825195, "global_step": 242385, "epoch": 2920} {"train_loss": -24.712242126464844, "global_step": 242386, "epoch": 2920} {"train_loss": -24.748565673828125, "global_step": 242387, "epoch": 2920} {"train_loss": -24.88502311706543, "global_step": 242388, "epoch": 2920} {"train_loss": -24.85646629333496, "global_step": 242389, "epoch": 2920} {"train_loss": -24.744720458984375, "global_step": 242390, "epoch": 2920} {"train_loss": -24.76590919494629, "global_step": 242391, "epoch": 2920} {"train_loss": -24.91609001159668, "global_step": 242392, "epoch": 2920} {"train_loss": -25.03795623779297, "global_step": 242393, "epoch": 2920} {"train_loss": -25.241004943847656, "global_step": 242394, "epoch": 2920} {"train_loss": -25.290740966796875, "global_step": 242395, "epoch": 2920} {"train_loss": -25.073928833007812, "global_step": 242396, "epoch": 2920} {"train_loss": -24.75935173034668, "global_step": 242397, "epoch": 2920} {"train_loss": -25.17609405517578, "global_step": 242398, "epoch": 2920} {"train_loss": -24.95525550842285, "global_step": 242399, "epoch": 2920} {"train_loss": -24.668975830078125, "global_step": 242400, "epoch": 2920} {"train_loss": -25.125146865844727, "global_step": 242401, "epoch": 2920} {"train_loss": -24.867277145385742, "global_step": 242402, "epoch": 2920} {"train_loss": -24.87824821472168, "global_step": 242403, "epoch": 2920} {"train_loss": -24.96306800842285, "global_step": 242404, "epoch": 2920} {"train_loss": -24.95454978942871, "global_step": 242405, "epoch": 2920} {"train_loss": -25.07344627380371, "global_step": 242406, "epoch": 2920} {"train_loss": -25.00160789489746, "global_step": 242407, "epoch": 2920} {"train_loss": -24.848695755004883, "global_step": 242408, "epoch": 2920} {"train_loss": -25.374984741210938, "global_step": 242409, "epoch": 2920} {"train_loss": -25.119884490966797, "global_step": 242410, "epoch": 2920} {"train_loss": -24.745548248291016, "global_step": 242411, "epoch": 2920} {"train_loss": -25.048851013183594, "global_step": 242412, "epoch": 2920} {"train_loss": -25.36635398864746, "global_step": 242413, "epoch": 2920} {"train_loss": -24.93991470336914, "global_step": 242414, "epoch": 2920} {"train_loss": -24.495962142944336, "global_step": 242415, "epoch": 2920} {"train_loss": -25.146997451782227, "global_step": 242416, "epoch": 2920} {"train_loss": -25.33243179321289, "global_step": 242417, "epoch": 2920} {"train_loss": -25.042367935180664, "global_step": 242418, "epoch": 2920} {"train_loss": -24.5728702545166, "global_step": 242419, "epoch": 2920} {"train_loss": -25.085721969604492, "global_step": 242420, "epoch": 2920} {"train_loss": -24.77623176574707, "global_step": 242421, "epoch": 2920} {"train_loss": -25.216962814331055, "global_step": 242422, "epoch": 2920} {"train_loss": -24.759723663330078, "global_step": 242423, "epoch": 2920} {"train_loss": -25.092269897460938, "global_step": 242424, "epoch": 2920} {"train_loss": -25.43317985534668, "global_step": 242425, "epoch": 2920} {"train_loss": -24.769620895385742, "global_step": 242426, "epoch": 2920} {"train_loss": -24.919477462768555, "global_step": 242427, "epoch": 2920} {"train_loss": -25.10395050048828, "global_step": 242428, "epoch": 2920} {"train_loss": -24.686965942382812, "global_step": 242429, "epoch": 2920} {"train_loss": -24.885581970214844, "global_step": 242430, "epoch": 2920} {"train_loss": -24.971830368041992, "global_step": 242431, "epoch": 2920} {"train_loss": -24.760848999023438, "global_step": 242432, "epoch": 2920} {"train_loss": -24.706592559814453, "global_step": 242433, "epoch": 2920} {"train_loss": -25.207569122314453, "global_step": 242434, "epoch": 2920} {"train_loss": -24.812217712402344, "global_step": 242435, "epoch": 2920} {"train_loss": -24.916967391967773, "global_step": 242436, "epoch": 2920} {"train_loss": -25.02895736694336, "global_step": 242437, "epoch": 2920} {"train_loss": -24.949352264404297, "global_step": 242438, "epoch": 2920} {"train_loss": -25.12528419494629, "global_step": 242439, "epoch": 2920} {"train_loss": -25.116575241088867, "global_step": 242440, "epoch": 2920} {"train_loss": -25.23593521118164, "global_step": 242441, "epoch": 2920} {"train_loss": -24.858195890863257, "global_step": 242442, "epoch": 2920, "val_loss": 6779244.0} {"train_loss": -24.301315307617188, "global_step": 242443, "epoch": 2921} {"train_loss": -23.73563003540039, "global_step": 242444, "epoch": 2921} {"train_loss": -24.7347469329834, "global_step": 242445, "epoch": 2921} {"train_loss": -24.003339767456055, "global_step": 242446, "epoch": 2921} {"train_loss": -23.798999786376953, "global_step": 242447, "epoch": 2921} {"train_loss": -24.468046188354492, "global_step": 242448, "epoch": 2921} {"train_loss": -24.18471336364746, "global_step": 242449, "epoch": 2921} {"train_loss": -24.41203498840332, "global_step": 242450, "epoch": 2921} {"train_loss": -24.18271255493164, "global_step": 242451, "epoch": 2921} {"train_loss": -24.379581451416016, "global_step": 242452, "epoch": 2921} {"train_loss": -24.83884620666504, "global_step": 242453, "epoch": 2921} {"train_loss": -24.78408432006836, "global_step": 242454, "epoch": 2921} {"train_loss": -24.148880004882812, "global_step": 242455, "epoch": 2921} {"train_loss": -24.775897979736328, "global_step": 242456, "epoch": 2921} {"train_loss": -24.412900924682617, "global_step": 242457, "epoch": 2921} {"train_loss": -24.691984176635742, "global_step": 242458, "epoch": 2921} {"train_loss": -24.268821716308594, "global_step": 242459, "epoch": 2921} {"train_loss": -24.893068313598633, "global_step": 242460, "epoch": 2921} {"train_loss": -24.79926872253418, "global_step": 242461, "epoch": 2921} {"train_loss": -24.554534912109375, "global_step": 242462, "epoch": 2921} {"train_loss": -24.43161964416504, "global_step": 242463, "epoch": 2921} {"train_loss": -24.735824584960938, "global_step": 242464, "epoch": 2921} {"train_loss": -24.543506622314453, "global_step": 242465, "epoch": 2921} {"train_loss": -24.519393920898438, "global_step": 242466, "epoch": 2921} {"train_loss": -24.811269760131836, "global_step": 242467, "epoch": 2921} {"train_loss": -24.78455924987793, "global_step": 242468, "epoch": 2921} {"train_loss": -24.662439346313477, "global_step": 242469, "epoch": 2921} {"train_loss": -24.876426696777344, "global_step": 242470, "epoch": 2921} {"train_loss": -24.879913330078125, "global_step": 242471, "epoch": 2921} {"train_loss": -24.78387451171875, "global_step": 242472, "epoch": 2921} {"train_loss": -24.775218963623047, "global_step": 242473, "epoch": 2921} {"train_loss": -24.674976348876953, "global_step": 242474, "epoch": 2921} {"train_loss": -24.806211471557617, "global_step": 242475, "epoch": 2921} {"train_loss": -24.52642250061035, "global_step": 242476, "epoch": 2921} {"train_loss": -24.799406051635742, "global_step": 242477, "epoch": 2921} {"train_loss": -25.289640426635742, "global_step": 242478, "epoch": 2921} {"train_loss": -24.9791202545166, "global_step": 242479, "epoch": 2921} {"train_loss": -24.87626075744629, "global_step": 242480, "epoch": 2921} {"train_loss": -25.439207077026367, "global_step": 242481, "epoch": 2921} {"train_loss": -25.030811309814453, "global_step": 242482, "epoch": 2921} {"train_loss": -24.745290756225586, "global_step": 242483, "epoch": 2921} {"train_loss": -24.99567985534668, "global_step": 242484, "epoch": 2921} {"train_loss": -25.41717529296875, "global_step": 242485, "epoch": 2921} {"train_loss": -24.729040145874023, "global_step": 242486, "epoch": 2921} {"train_loss": -25.02522087097168, "global_step": 242487, "epoch": 2921} {"train_loss": -24.710052490234375, "global_step": 242488, "epoch": 2921} {"train_loss": -25.201414108276367, "global_step": 242489, "epoch": 2921} {"train_loss": -24.8719425201416, "global_step": 242490, "epoch": 2921} {"train_loss": -24.489669799804688, "global_step": 242491, "epoch": 2921} {"train_loss": -24.635568618774414, "global_step": 242492, "epoch": 2921} {"train_loss": -24.792083740234375, "global_step": 242493, "epoch": 2921} {"train_loss": -25.014307022094727, "global_step": 242494, "epoch": 2921} {"train_loss": -25.07162857055664, "global_step": 242495, "epoch": 2921} {"train_loss": -24.930191040039062, "global_step": 242496, "epoch": 2921} {"train_loss": -24.900419235229492, "global_step": 242497, "epoch": 2921} {"train_loss": -25.102954864501953, "global_step": 242498, "epoch": 2921} {"train_loss": -24.877599716186523, "global_step": 242499, "epoch": 2921} {"train_loss": -25.088836669921875, "global_step": 242500, "epoch": 2921} {"train_loss": -24.94711685180664, "global_step": 242501, "epoch": 2921} {"train_loss": -24.604570388793945, "global_step": 242502, "epoch": 2921} {"train_loss": -24.494674682617188, "global_step": 242503, "epoch": 2921} {"train_loss": -25.005008697509766, "global_step": 242504, "epoch": 2921} {"train_loss": -25.024728775024414, "global_step": 242505, "epoch": 2921} {"train_loss": -24.76030921936035, "global_step": 242506, "epoch": 2921} {"train_loss": -24.779495239257812, "global_step": 242507, "epoch": 2921} {"train_loss": -24.765478134155273, "global_step": 242508, "epoch": 2921} {"train_loss": -24.711078643798828, "global_step": 242509, "epoch": 2921} {"train_loss": -25.034475326538086, "global_step": 242510, "epoch": 2921} {"train_loss": -24.90421485900879, "global_step": 242511, "epoch": 2921} {"train_loss": -24.906957626342773, "global_step": 242512, "epoch": 2921} {"train_loss": -24.827062606811523, "global_step": 242513, "epoch": 2921} {"train_loss": -25.064672470092773, "global_step": 242514, "epoch": 2921} {"train_loss": -24.91744041442871, "global_step": 242515, "epoch": 2921} {"train_loss": -25.279752731323242, "global_step": 242516, "epoch": 2921} {"train_loss": -25.00379753112793, "global_step": 242517, "epoch": 2921} {"train_loss": -24.757728576660156, "global_step": 242518, "epoch": 2921} {"train_loss": -25.05415916442871, "global_step": 242519, "epoch": 2921} {"train_loss": -25.01603126525879, "global_step": 242520, "epoch": 2921} {"train_loss": -24.935914993286133, "global_step": 242521, "epoch": 2921} {"train_loss": -24.63425064086914, "global_step": 242522, "epoch": 2921} {"train_loss": -24.94435691833496, "global_step": 242523, "epoch": 2921} {"train_loss": -23.78728675842285, "global_step": 242524, "epoch": 2921} {"train_loss": -24.740249748689582, "global_step": 242525, "epoch": 2921, "val_loss": 6973564.0} {"train_loss": -22.769102096557617, "global_step": 242526, "epoch": 2922} {"train_loss": -24.03546142578125, "global_step": 242527, "epoch": 2922} {"train_loss": -23.885831832885742, "global_step": 242528, "epoch": 2922} {"train_loss": -23.6397647857666, "global_step": 242529, "epoch": 2922} {"train_loss": -23.603090286254883, "global_step": 242530, "epoch": 2922} {"train_loss": -23.66974449157715, "global_step": 242531, "epoch": 2922} {"train_loss": -23.749719619750977, "global_step": 242532, "epoch": 2922} {"train_loss": -23.88446044921875, "global_step": 242533, "epoch": 2922} {"train_loss": -23.84044075012207, "global_step": 242534, "epoch": 2922} {"train_loss": -23.931461334228516, "global_step": 242535, "epoch": 2922} {"train_loss": -23.85141944885254, "global_step": 242536, "epoch": 2922} {"train_loss": -23.729185104370117, "global_step": 242537, "epoch": 2922} {"train_loss": -24.203811645507812, "global_step": 242538, "epoch": 2922} {"train_loss": -24.154544830322266, "global_step": 242539, "epoch": 2922} {"train_loss": -23.92732810974121, "global_step": 242540, "epoch": 2922} {"train_loss": -24.17178726196289, "global_step": 242541, "epoch": 2922} {"train_loss": -24.382320404052734, "global_step": 242542, "epoch": 2922} {"train_loss": -24.20467185974121, "global_step": 242543, "epoch": 2922} {"train_loss": -24.6243953704834, "global_step": 242544, "epoch": 2922} {"train_loss": -24.2879695892334, "global_step": 242545, "epoch": 2922} {"train_loss": -24.146526336669922, "global_step": 242546, "epoch": 2922} {"train_loss": -24.46542739868164, "global_step": 242547, "epoch": 2922} {"train_loss": -24.637662887573242, "global_step": 242548, "epoch": 2922} {"train_loss": -24.65790367126465, "global_step": 242549, "epoch": 2922} {"train_loss": -24.473356246948242, "global_step": 242550, "epoch": 2922} {"train_loss": -24.207246780395508, "global_step": 242551, "epoch": 2922} {"train_loss": -24.492721557617188, "global_step": 242552, "epoch": 2922} {"train_loss": -24.633541107177734, "global_step": 242553, "epoch": 2922} {"train_loss": -24.78719139099121, "global_step": 242554, "epoch": 2922} {"train_loss": -24.50264549255371, "global_step": 242555, "epoch": 2922} {"train_loss": -24.55394172668457, "global_step": 242556, "epoch": 2922} {"train_loss": -24.488096237182617, "global_step": 242557, "epoch": 2922} {"train_loss": -24.973474502563477, "global_step": 242558, "epoch": 2922} {"train_loss": -24.630373001098633, "global_step": 242559, "epoch": 2922} {"train_loss": -24.747743606567383, "global_step": 242560, "epoch": 2922} {"train_loss": -24.854917526245117, "global_step": 242561, "epoch": 2922} {"train_loss": -24.858348846435547, "global_step": 242562, "epoch": 2922} {"train_loss": -25.006832122802734, "global_step": 242563, "epoch": 2922} {"train_loss": -24.687360763549805, "global_step": 242564, "epoch": 2922} {"train_loss": -25.056547164916992, "global_step": 242565, "epoch": 2922} {"train_loss": -24.954898834228516, "global_step": 242566, "epoch": 2922} {"train_loss": -24.672367095947266, "global_step": 242567, "epoch": 2922} {"train_loss": -24.627059936523438, "global_step": 242568, "epoch": 2922} {"train_loss": -24.980234146118164, "global_step": 242569, "epoch": 2922} {"train_loss": -24.803817749023438, "global_step": 242570, "epoch": 2922} {"train_loss": -25.032575607299805, "global_step": 242571, "epoch": 2922} {"train_loss": -24.91299057006836, "global_step": 242572, "epoch": 2922} {"train_loss": -24.661834716796875, "global_step": 242573, "epoch": 2922} {"train_loss": -25.117414474487305, "global_step": 242574, "epoch": 2922} {"train_loss": -24.776935577392578, "global_step": 242575, "epoch": 2922} {"train_loss": -25.1854305267334, "global_step": 242576, "epoch": 2922} {"train_loss": -25.00162124633789, "global_step": 242577, "epoch": 2922} {"train_loss": -24.93610191345215, "global_step": 242578, "epoch": 2922} {"train_loss": -24.95166015625, "global_step": 242579, "epoch": 2922} {"train_loss": -25.025522232055664, "global_step": 242580, "epoch": 2922} {"train_loss": -25.331329345703125, "global_step": 242581, "epoch": 2922} {"train_loss": -25.049530029296875, "global_step": 242582, "epoch": 2922} {"train_loss": -25.236804962158203, "global_step": 242583, "epoch": 2922} {"train_loss": -24.800344467163086, "global_step": 242584, "epoch": 2922} {"train_loss": -24.92418670654297, "global_step": 242585, "epoch": 2922} {"train_loss": -24.982778549194336, "global_step": 242586, "epoch": 2922} {"train_loss": -24.840965270996094, "global_step": 242587, "epoch": 2922} {"train_loss": -24.923322677612305, "global_step": 242588, "epoch": 2922} {"train_loss": -24.532718658447266, "global_step": 242589, "epoch": 2922} {"train_loss": -24.749126434326172, "global_step": 242590, "epoch": 2922} {"train_loss": -24.985824584960938, "global_step": 242591, "epoch": 2922} {"train_loss": -25.047183990478516, "global_step": 242592, "epoch": 2922} {"train_loss": -24.672449111938477, "global_step": 242593, "epoch": 2922} {"train_loss": -24.492630004882812, "global_step": 242594, "epoch": 2922} {"train_loss": -24.881772994995117, "global_step": 242595, "epoch": 2922} {"train_loss": -25.000213623046875, "global_step": 242596, "epoch": 2922} {"train_loss": -24.781200408935547, "global_step": 242597, "epoch": 2922} {"train_loss": -25.21957015991211, "global_step": 242598, "epoch": 2922} {"train_loss": -25.01869010925293, "global_step": 242599, "epoch": 2922} {"train_loss": -24.699710845947266, "global_step": 242600, "epoch": 2922} {"train_loss": -24.713720321655273, "global_step": 242601, "epoch": 2922} {"train_loss": -24.926652908325195, "global_step": 242602, "epoch": 2922} {"train_loss": -24.81471061706543, "global_step": 242603, "epoch": 2922} {"train_loss": -24.95774269104004, "global_step": 242604, "epoch": 2922} {"train_loss": -24.486173629760742, "global_step": 242605, "epoch": 2922} {"train_loss": -25.19351577758789, "global_step": 242606, "epoch": 2922} {"train_loss": -24.96648597717285, "global_step": 242607, "epoch": 2922} {"train_loss": -24.60915229981204, "global_step": 242608, "epoch": 2922, "val_loss": 6834553.0} {"train_loss": -24.636943817138672, "global_step": 242609, "epoch": 2923} {"train_loss": -24.062129974365234, "global_step": 242610, "epoch": 2923} {"train_loss": -24.405597686767578, "global_step": 242611, "epoch": 2923} {"train_loss": -24.410768508911133, "global_step": 242612, "epoch": 2923} {"train_loss": -24.534944534301758, "global_step": 242613, "epoch": 2923} {"train_loss": -24.456424713134766, "global_step": 242614, "epoch": 2923} {"train_loss": -24.56451416015625, "global_step": 242615, "epoch": 2923} {"train_loss": -24.82552146911621, "global_step": 242616, "epoch": 2923} {"train_loss": -24.73777198791504, "global_step": 242617, "epoch": 2923} {"train_loss": -24.605180740356445, "global_step": 242618, "epoch": 2923} {"train_loss": -24.702043533325195, "global_step": 242619, "epoch": 2923} {"train_loss": -24.71283721923828, "global_step": 242620, "epoch": 2923} {"train_loss": -24.968358993530273, "global_step": 242621, "epoch": 2923} {"train_loss": -24.876062393188477, "global_step": 242622, "epoch": 2923} {"train_loss": -24.533218383789062, "global_step": 242623, "epoch": 2923} {"train_loss": -24.621976852416992, "global_step": 242624, "epoch": 2923} {"train_loss": -24.998533248901367, "global_step": 242625, "epoch": 2923} {"train_loss": -24.858570098876953, "global_step": 242626, "epoch": 2923} {"train_loss": -24.81595230102539, "global_step": 242627, "epoch": 2923} {"train_loss": -24.56481170654297, "global_step": 242628, "epoch": 2923} {"train_loss": -24.704782485961914, "global_step": 242629, "epoch": 2923} {"train_loss": -24.63307762145996, "global_step": 242630, "epoch": 2923} {"train_loss": -24.60988426208496, "global_step": 242631, "epoch": 2923} {"train_loss": -24.672231674194336, "global_step": 242632, "epoch": 2923} {"train_loss": -24.682266235351562, "global_step": 242633, "epoch": 2923} {"train_loss": -24.932273864746094, "global_step": 242634, "epoch": 2923} {"train_loss": -24.625444412231445, "global_step": 242635, "epoch": 2923} {"train_loss": -24.86466407775879, "global_step": 242636, "epoch": 2923} {"train_loss": -25.131595611572266, "global_step": 242637, "epoch": 2923} {"train_loss": -24.80854606628418, "global_step": 242638, "epoch": 2923} {"train_loss": -25.035669326782227, "global_step": 242639, "epoch": 2923} {"train_loss": -24.98320960998535, "global_step": 242640, "epoch": 2923} {"train_loss": -25.1144962310791, "global_step": 242641, "epoch": 2923} {"train_loss": -24.915992736816406, "global_step": 242642, "epoch": 2923} {"train_loss": -25.041828155517578, "global_step": 242643, "epoch": 2923} {"train_loss": -24.68243980407715, "global_step": 242644, "epoch": 2923} {"train_loss": -25.042661666870117, "global_step": 242645, "epoch": 2923} {"train_loss": -25.014650344848633, "global_step": 242646, "epoch": 2923} {"train_loss": -24.6192569732666, "global_step": 242647, "epoch": 2923} {"train_loss": -24.62872886657715, "global_step": 242648, "epoch": 2923} {"train_loss": -24.953947067260742, "global_step": 242649, "epoch": 2923} {"train_loss": -24.565414428710938, "global_step": 242650, "epoch": 2923} {"train_loss": -24.596866607666016, "global_step": 242651, "epoch": 2923} {"train_loss": -24.872922897338867, "global_step": 242652, "epoch": 2923} {"train_loss": -24.633384704589844, "global_step": 242653, "epoch": 2923} {"train_loss": -24.61667823791504, "global_step": 242654, "epoch": 2923} {"train_loss": -24.832401275634766, "global_step": 242655, "epoch": 2923} {"train_loss": -24.489641189575195, "global_step": 242656, "epoch": 2923} {"train_loss": -24.88515281677246, "global_step": 242657, "epoch": 2923} {"train_loss": -24.926712036132812, "global_step": 242658, "epoch": 2923} {"train_loss": -24.626340866088867, "global_step": 242659, "epoch": 2923} {"train_loss": -24.87687873840332, "global_step": 242660, "epoch": 2923} {"train_loss": -25.05503273010254, "global_step": 242661, "epoch": 2923} {"train_loss": -25.133766174316406, "global_step": 242662, "epoch": 2923} {"train_loss": -24.91377830505371, "global_step": 242663, "epoch": 2923} {"train_loss": -25.182178497314453, "global_step": 242664, "epoch": 2923} {"train_loss": -24.949079513549805, "global_step": 242665, "epoch": 2923} {"train_loss": -25.084896087646484, "global_step": 242666, "epoch": 2923} {"train_loss": -24.711572647094727, "global_step": 242667, "epoch": 2923} {"train_loss": -25.112354278564453, "global_step": 242668, "epoch": 2923} {"train_loss": -25.047739028930664, "global_step": 242669, "epoch": 2923} {"train_loss": -24.762325286865234, "global_step": 242670, "epoch": 2923} {"train_loss": -25.308935165405273, "global_step": 242671, "epoch": 2923} {"train_loss": -25.103500366210938, "global_step": 242672, "epoch": 2923} {"train_loss": -25.014501571655273, "global_step": 242673, "epoch": 2923} {"train_loss": -25.353322982788086, "global_step": 242674, "epoch": 2923} {"train_loss": -24.678781509399414, "global_step": 242675, "epoch": 2923} {"train_loss": -25.06318473815918, "global_step": 242676, "epoch": 2923} {"train_loss": -25.190204620361328, "global_step": 242677, "epoch": 2923} {"train_loss": -25.09038543701172, "global_step": 242678, "epoch": 2923} {"train_loss": -25.472333908081055, "global_step": 242679, "epoch": 2923} {"train_loss": -25.039159774780273, "global_step": 242680, "epoch": 2923} {"train_loss": -24.76289939880371, "global_step": 242681, "epoch": 2923} {"train_loss": -25.180429458618164, "global_step": 242682, "epoch": 2923} {"train_loss": -24.666748046875, "global_step": 242683, "epoch": 2923} {"train_loss": -24.993295669555664, "global_step": 242684, "epoch": 2923} {"train_loss": -25.230045318603516, "global_step": 242685, "epoch": 2923} {"train_loss": -24.777002334594727, "global_step": 242686, "epoch": 2923} {"train_loss": -25.177906036376953, "global_step": 242687, "epoch": 2923} {"train_loss": -24.83519744873047, "global_step": 242688, "epoch": 2923} {"train_loss": -25.08050537109375, "global_step": 242689, "epoch": 2923} {"train_loss": -25.160001754760742, "global_step": 242690, "epoch": 2923} {"train_loss": -24.84222818857216, "global_step": 242691, "epoch": 2923, "val_loss": 6765477.0} {"train_loss": -24.355079650878906, "global_step": 242692, "epoch": 2924} {"train_loss": -24.632108688354492, "global_step": 242693, "epoch": 2924} {"train_loss": -25.128345489501953, "global_step": 242694, "epoch": 2924} {"train_loss": -24.45563316345215, "global_step": 242695, "epoch": 2924} {"train_loss": -25.01436424255371, "global_step": 242696, "epoch": 2924} {"train_loss": -24.434846878051758, "global_step": 242697, "epoch": 2924} {"train_loss": -24.752872467041016, "global_step": 242698, "epoch": 2924} {"train_loss": -24.493488311767578, "global_step": 242699, "epoch": 2924} {"train_loss": -24.399473190307617, "global_step": 242700, "epoch": 2924} {"train_loss": -24.710174560546875, "global_step": 242701, "epoch": 2924} {"train_loss": -24.477033615112305, "global_step": 242702, "epoch": 2924} {"train_loss": -24.760679244995117, "global_step": 242703, "epoch": 2924} {"train_loss": -24.734859466552734, "global_step": 242704, "epoch": 2924} {"train_loss": -24.983230590820312, "global_step": 242705, "epoch": 2924} {"train_loss": -24.61855125427246, "global_step": 242706, "epoch": 2924} {"train_loss": -24.960031509399414, "global_step": 242707, "epoch": 2924} {"train_loss": -25.13636589050293, "global_step": 242708, "epoch": 2924} {"train_loss": -25.200742721557617, "global_step": 242709, "epoch": 2924} {"train_loss": -24.52950096130371, "global_step": 242710, "epoch": 2924} {"train_loss": -24.968461990356445, "global_step": 242711, "epoch": 2924} {"train_loss": -24.788663864135742, "global_step": 242712, "epoch": 2924} {"train_loss": -24.849637985229492, "global_step": 242713, "epoch": 2924} {"train_loss": -24.61635398864746, "global_step": 242714, "epoch": 2924} {"train_loss": -24.80183219909668, "global_step": 242715, "epoch": 2924} {"train_loss": -24.880542755126953, "global_step": 242716, "epoch": 2924} {"train_loss": -24.71292495727539, "global_step": 242717, "epoch": 2924} {"train_loss": -24.478256225585938, "global_step": 242718, "epoch": 2924} {"train_loss": -24.678232192993164, "global_step": 242719, "epoch": 2924} {"train_loss": -24.622175216674805, "global_step": 242720, "epoch": 2924} {"train_loss": -25.174610137939453, "global_step": 242721, "epoch": 2924} {"train_loss": -24.84591293334961, "global_step": 242722, "epoch": 2924} {"train_loss": -24.796390533447266, "global_step": 242723, "epoch": 2924} {"train_loss": -24.860776901245117, "global_step": 242724, "epoch": 2924} {"train_loss": -24.8502140045166, "global_step": 242725, "epoch": 2924} {"train_loss": -24.705270767211914, "global_step": 242726, "epoch": 2924} {"train_loss": -25.037670135498047, "global_step": 242727, "epoch": 2924} {"train_loss": -24.765243530273438, "global_step": 242728, "epoch": 2924} {"train_loss": -24.79074478149414, "global_step": 242729, "epoch": 2924} {"train_loss": -25.097761154174805, "global_step": 242730, "epoch": 2924} {"train_loss": -25.230466842651367, "global_step": 242731, "epoch": 2924} {"train_loss": -25.113998413085938, "global_step": 242732, "epoch": 2924} {"train_loss": -25.099760055541992, "global_step": 242733, "epoch": 2924} {"train_loss": -25.33047866821289, "global_step": 242734, "epoch": 2924} {"train_loss": -24.753129959106445, "global_step": 242735, "epoch": 2924} {"train_loss": -24.99958610534668, "global_step": 242736, "epoch": 2924} {"train_loss": -25.63384437561035, "global_step": 242737, "epoch": 2924} {"train_loss": -24.917041778564453, "global_step": 242738, "epoch": 2924} {"train_loss": -25.05535888671875, "global_step": 242739, "epoch": 2924} {"train_loss": -25.1164493560791, "global_step": 242740, "epoch": 2924} {"train_loss": -25.050039291381836, "global_step": 242741, "epoch": 2924} {"train_loss": -24.842487335205078, "global_step": 242742, "epoch": 2924} {"train_loss": -25.068954467773438, "global_step": 242743, "epoch": 2924} {"train_loss": -24.925954818725586, "global_step": 242744, "epoch": 2924} {"train_loss": -24.716995239257812, "global_step": 242745, "epoch": 2924} {"train_loss": -25.22792625427246, "global_step": 242746, "epoch": 2924} {"train_loss": -24.816415786743164, "global_step": 242747, "epoch": 2924} {"train_loss": -25.368528366088867, "global_step": 242748, "epoch": 2924} {"train_loss": -24.921064376831055, "global_step": 242749, "epoch": 2924} {"train_loss": -24.813833236694336, "global_step": 242750, "epoch": 2924} {"train_loss": -24.94516372680664, "global_step": 242751, "epoch": 2924} {"train_loss": -24.96685218811035, "global_step": 242752, "epoch": 2924} {"train_loss": -24.989408493041992, "global_step": 242753, "epoch": 2924} {"train_loss": -24.68062400817871, "global_step": 242754, "epoch": 2924} {"train_loss": -24.62629508972168, "global_step": 242755, "epoch": 2924} {"train_loss": -24.788299560546875, "global_step": 242756, "epoch": 2924} {"train_loss": -24.78928565979004, "global_step": 242757, "epoch": 2924} {"train_loss": -24.837636947631836, "global_step": 242758, "epoch": 2924} {"train_loss": -24.517602920532227, "global_step": 242759, "epoch": 2924} {"train_loss": -24.798025131225586, "global_step": 242760, "epoch": 2924} {"train_loss": -24.592571258544922, "global_step": 242761, "epoch": 2924} {"train_loss": -24.884292602539062, "global_step": 242762, "epoch": 2924} {"train_loss": -24.726343154907227, "global_step": 242763, "epoch": 2924} {"train_loss": -24.506629943847656, "global_step": 242764, "epoch": 2924} {"train_loss": -24.547590255737305, "global_step": 242765, "epoch": 2924} {"train_loss": -24.695531845092773, "global_step": 242766, "epoch": 2924} {"train_loss": -24.71457290649414, "global_step": 242767, "epoch": 2924} {"train_loss": -24.62748146057129, "global_step": 242768, "epoch": 2924} {"train_loss": -24.612049102783203, "global_step": 242769, "epoch": 2924} {"train_loss": -24.7683162689209, "global_step": 242770, "epoch": 2924} {"train_loss": -24.6439151763916, "global_step": 242771, "epoch": 2924} {"train_loss": -24.875179290771484, "global_step": 242772, "epoch": 2924} {"train_loss": -25.449853897094727, "global_step": 242773, "epoch": 2924} {"train_loss": -24.829272787254975, "global_step": 242774, "epoch": 2924, "val_loss": 6760111.5} {"train_loss": -24.50335121154785, "global_step": 242775, "epoch": 2925} {"train_loss": -24.734745025634766, "global_step": 242776, "epoch": 2925} {"train_loss": -24.633054733276367, "global_step": 242777, "epoch": 2925} {"train_loss": -24.735279083251953, "global_step": 242778, "epoch": 2925} {"train_loss": -24.569229125976562, "global_step": 242779, "epoch": 2925} {"train_loss": -24.931230545043945, "global_step": 242780, "epoch": 2925} {"train_loss": -24.312353134155273, "global_step": 242781, "epoch": 2925} {"train_loss": -24.880807876586914, "global_step": 242782, "epoch": 2925} {"train_loss": -24.47980308532715, "global_step": 242783, "epoch": 2925} {"train_loss": -24.55256462097168, "global_step": 242784, "epoch": 2925} {"train_loss": -24.675262451171875, "global_step": 242785, "epoch": 2925} {"train_loss": -24.808984756469727, "global_step": 242786, "epoch": 2925} {"train_loss": -24.68548583984375, "global_step": 242787, "epoch": 2925} {"train_loss": -24.7718563079834, "global_step": 242788, "epoch": 2925} {"train_loss": -24.707456588745117, "global_step": 242789, "epoch": 2925} {"train_loss": -24.596464157104492, "global_step": 242790, "epoch": 2925} {"train_loss": -25.152135848999023, "global_step": 242791, "epoch": 2925} {"train_loss": -25.163482666015625, "global_step": 242792, "epoch": 2925} {"train_loss": -24.85552978515625, "global_step": 242793, "epoch": 2925} {"train_loss": -24.697195053100586, "global_step": 242794, "epoch": 2925} {"train_loss": -24.872333526611328, "global_step": 242795, "epoch": 2925} {"train_loss": -25.306501388549805, "global_step": 242796, "epoch": 2925} {"train_loss": -25.05451202392578, "global_step": 242797, "epoch": 2925} {"train_loss": -24.238821029663086, "global_step": 242798, "epoch": 2925} {"train_loss": -24.88032341003418, "global_step": 242799, "epoch": 2925} {"train_loss": -25.104259490966797, "global_step": 242800, "epoch": 2925} {"train_loss": -24.616500854492188, "global_step": 242801, "epoch": 2925} {"train_loss": -25.153030395507812, "global_step": 242802, "epoch": 2925} {"train_loss": -25.31064224243164, "global_step": 242803, "epoch": 2925} {"train_loss": -25.274078369140625, "global_step": 242804, "epoch": 2925} {"train_loss": -24.98497200012207, "global_step": 242805, "epoch": 2925} {"train_loss": -24.894140243530273, "global_step": 242806, "epoch": 2925} {"train_loss": -25.03956413269043, "global_step": 242807, "epoch": 2925} {"train_loss": -24.86759376525879, "global_step": 242808, "epoch": 2925} {"train_loss": -25.238399505615234, "global_step": 242809, "epoch": 2925} {"train_loss": -25.07740592956543, "global_step": 242810, "epoch": 2925} {"train_loss": -25.3255672454834, "global_step": 242811, "epoch": 2925} {"train_loss": -24.90321922302246, "global_step": 242812, "epoch": 2925} {"train_loss": -25.11189842224121, "global_step": 242813, "epoch": 2925} {"train_loss": -25.121023178100586, "global_step": 242814, "epoch": 2925} {"train_loss": -25.403165817260742, "global_step": 242815, "epoch": 2925} {"train_loss": -25.084392547607422, "global_step": 242816, "epoch": 2925} {"train_loss": -25.210996627807617, "global_step": 242817, "epoch": 2925} {"train_loss": -25.079893112182617, "global_step": 242818, "epoch": 2925} {"train_loss": -24.99419593811035, "global_step": 242819, "epoch": 2925} {"train_loss": -24.58033561706543, "global_step": 242820, "epoch": 2925} {"train_loss": -24.5003662109375, "global_step": 242821, "epoch": 2925} {"train_loss": -25.044816970825195, "global_step": 242822, "epoch": 2925} {"train_loss": -25.088459014892578, "global_step": 242823, "epoch": 2925} {"train_loss": -24.714853286743164, "global_step": 242824, "epoch": 2925} {"train_loss": -25.07076072692871, "global_step": 242825, "epoch": 2925} {"train_loss": -24.969621658325195, "global_step": 242826, "epoch": 2925} {"train_loss": -25.19290542602539, "global_step": 242827, "epoch": 2925} {"train_loss": -25.384611129760742, "global_step": 242828, "epoch": 2925} {"train_loss": -25.087970733642578, "global_step": 242829, "epoch": 2925} {"train_loss": -24.96822166442871, "global_step": 242830, "epoch": 2925} {"train_loss": -25.353178024291992, "global_step": 242831, "epoch": 2925} {"train_loss": -24.92758560180664, "global_step": 242832, "epoch": 2925} {"train_loss": -25.16072654724121, "global_step": 242833, "epoch": 2925} {"train_loss": -24.926694869995117, "global_step": 242834, "epoch": 2925} {"train_loss": -25.35108184814453, "global_step": 242835, "epoch": 2925} {"train_loss": -24.83161735534668, "global_step": 242836, "epoch": 2925} {"train_loss": -24.97027587890625, "global_step": 242837, "epoch": 2925} {"train_loss": -24.471586227416992, "global_step": 242838, "epoch": 2925} {"train_loss": -24.91999053955078, "global_step": 242839, "epoch": 2925} {"train_loss": -25.060482025146484, "global_step": 242840, "epoch": 2925} {"train_loss": -24.96119499206543, "global_step": 242841, "epoch": 2925} {"train_loss": -25.2818603515625, "global_step": 242842, "epoch": 2925} {"train_loss": -24.84821128845215, "global_step": 242843, "epoch": 2925} {"train_loss": -24.85017204284668, "global_step": 242844, "epoch": 2925} {"train_loss": -25.025951385498047, "global_step": 242845, "epoch": 2925} {"train_loss": -25.13724708557129, "global_step": 242846, "epoch": 2925} {"train_loss": -24.961097717285156, "global_step": 242847, "epoch": 2925} {"train_loss": -24.83349609375, "global_step": 242848, "epoch": 2925} {"train_loss": -24.834562301635742, "global_step": 242849, "epoch": 2925} {"train_loss": -24.990140914916992, "global_step": 242850, "epoch": 2925} {"train_loss": -24.971994400024414, "global_step": 242851, "epoch": 2925} {"train_loss": -24.835519790649414, "global_step": 242852, "epoch": 2925} {"train_loss": -25.143339157104492, "global_step": 242853, "epoch": 2925} {"train_loss": -24.687910079956055, "global_step": 242854, "epoch": 2925} {"train_loss": -24.983304977416992, "global_step": 242855, "epoch": 2925} {"train_loss": -24.811216354370117, "global_step": 242856, "epoch": 2925} {"train_loss": -24.91952792707696, "global_step": 242857, "epoch": 2925, "val_loss": 6852775.0} {"train_loss": -24.689146041870117, "global_step": 242858, "epoch": 2926} {"train_loss": -24.469228744506836, "global_step": 242859, "epoch": 2926} {"train_loss": -23.404027938842773, "global_step": 242860, "epoch": 2926} {"train_loss": -23.101329803466797, "global_step": 242861, "epoch": 2926} {"train_loss": -24.58388328552246, "global_step": 242862, "epoch": 2926} {"train_loss": -24.1392822265625, "global_step": 242863, "epoch": 2926} {"train_loss": -24.48251724243164, "global_step": 242864, "epoch": 2926} {"train_loss": -24.04071617126465, "global_step": 242865, "epoch": 2926} {"train_loss": -24.575759887695312, "global_step": 242866, "epoch": 2926} {"train_loss": -24.25553321838379, "global_step": 242867, "epoch": 2926} {"train_loss": -24.32895278930664, "global_step": 242868, "epoch": 2926} {"train_loss": -24.6875, "global_step": 242869, "epoch": 2926} {"train_loss": -24.869787216186523, "global_step": 242870, "epoch": 2926} {"train_loss": -24.436811447143555, "global_step": 242871, "epoch": 2926} {"train_loss": -24.414833068847656, "global_step": 242872, "epoch": 2926} {"train_loss": -24.56374168395996, "global_step": 242873, "epoch": 2926} {"train_loss": -24.20426368713379, "global_step": 242874, "epoch": 2926} {"train_loss": -24.716096878051758, "global_step": 242875, "epoch": 2926} {"train_loss": -24.37324333190918, "global_step": 242876, "epoch": 2926} {"train_loss": -24.57819366455078, "global_step": 242877, "epoch": 2926} {"train_loss": -24.916030883789062, "global_step": 242878, "epoch": 2926} {"train_loss": -24.90789222717285, "global_step": 242879, "epoch": 2926} {"train_loss": -24.758708953857422, "global_step": 242880, "epoch": 2926} {"train_loss": -24.892501831054688, "global_step": 242881, "epoch": 2926} {"train_loss": -24.416982650756836, "global_step": 242882, "epoch": 2926} {"train_loss": -24.759967803955078, "global_step": 242883, "epoch": 2926} {"train_loss": -24.744028091430664, "global_step": 242884, "epoch": 2926} {"train_loss": -24.99931526184082, "global_step": 242885, "epoch": 2926} {"train_loss": -24.916982650756836, "global_step": 242886, "epoch": 2926} {"train_loss": -24.69806671142578, "global_step": 242887, "epoch": 2926} {"train_loss": -24.74781608581543, "global_step": 242888, "epoch": 2926} {"train_loss": -24.567060470581055, "global_step": 242889, "epoch": 2926} {"train_loss": -24.59751319885254, "global_step": 242890, "epoch": 2926} {"train_loss": -24.551464080810547, "global_step": 242891, "epoch": 2926} {"train_loss": -24.93771743774414, "global_step": 242892, "epoch": 2926} {"train_loss": -24.60427474975586, "global_step": 242893, "epoch": 2926} {"train_loss": -24.800888061523438, "global_step": 242894, "epoch": 2926} {"train_loss": -25.025821685791016, "global_step": 242895, "epoch": 2926} {"train_loss": -25.055604934692383, "global_step": 242896, "epoch": 2926} {"train_loss": -24.8819522857666, "global_step": 242897, "epoch": 2926} {"train_loss": -24.777677536010742, "global_step": 242898, "epoch": 2926} {"train_loss": -24.99820899963379, "global_step": 242899, "epoch": 2926} {"train_loss": -25.07230567932129, "global_step": 242900, "epoch": 2926} {"train_loss": -25.014528274536133, "global_step": 242901, "epoch": 2926} {"train_loss": -25.261350631713867, "global_step": 242902, "epoch": 2926} {"train_loss": -24.992477416992188, "global_step": 242903, "epoch": 2926} {"train_loss": -25.256620407104492, "global_step": 242904, "epoch": 2926} {"train_loss": -25.066373825073242, "global_step": 242905, "epoch": 2926} {"train_loss": -24.966150283813477, "global_step": 242906, "epoch": 2926} {"train_loss": -25.026996612548828, "global_step": 242907, "epoch": 2926} {"train_loss": -24.941303253173828, "global_step": 242908, "epoch": 2926} {"train_loss": -24.980484008789062, "global_step": 242909, "epoch": 2926} {"train_loss": -25.141250610351562, "global_step": 242910, "epoch": 2926} {"train_loss": -25.04298973083496, "global_step": 242911, "epoch": 2926} {"train_loss": -25.110456466674805, "global_step": 242912, "epoch": 2926} {"train_loss": -25.070844650268555, "global_step": 242913, "epoch": 2926} {"train_loss": -25.100370407104492, "global_step": 242914, "epoch": 2926} {"train_loss": -25.380264282226562, "global_step": 242915, "epoch": 2926} {"train_loss": -25.141477584838867, "global_step": 242916, "epoch": 2926} {"train_loss": -24.99835777282715, "global_step": 242917, "epoch": 2926} {"train_loss": -25.134174346923828, "global_step": 242918, "epoch": 2926} {"train_loss": -24.828994750976562, "global_step": 242919, "epoch": 2926} {"train_loss": -24.949615478515625, "global_step": 242920, "epoch": 2926} {"train_loss": -24.650299072265625, "global_step": 242921, "epoch": 2926} {"train_loss": -25.30072784423828, "global_step": 242922, "epoch": 2926} {"train_loss": -24.73927879333496, "global_step": 242923, "epoch": 2926} {"train_loss": -24.99591636657715, "global_step": 242924, "epoch": 2926} {"train_loss": -24.584909439086914, "global_step": 242925, "epoch": 2926} {"train_loss": -24.573959350585938, "global_step": 242926, "epoch": 2926} {"train_loss": -23.968915939331055, "global_step": 242927, "epoch": 2926} {"train_loss": -23.970783233642578, "global_step": 242928, "epoch": 2926} {"train_loss": -25.204925537109375, "global_step": 242929, "epoch": 2926} {"train_loss": -24.795251846313477, "global_step": 242930, "epoch": 2926} {"train_loss": -23.807708740234375, "global_step": 242931, "epoch": 2926} {"train_loss": -24.453893661499023, "global_step": 242932, "epoch": 2926} {"train_loss": -24.840591430664062, "global_step": 242933, "epoch": 2926} {"train_loss": -24.206756591796875, "global_step": 242934, "epoch": 2926} {"train_loss": -24.629901885986328, "global_step": 242935, "epoch": 2926} {"train_loss": -25.08139419555664, "global_step": 242936, "epoch": 2926} {"train_loss": -24.1933650970459, "global_step": 242937, "epoch": 2926} {"train_loss": -24.5749568939209, "global_step": 242938, "epoch": 2926} {"train_loss": -24.796865463256836, "global_step": 242939, "epoch": 2926} {"train_loss": -24.70305348591632, "global_step": 242940, "epoch": 2926, "val_loss": 6901959.5} {"train_loss": -24.423377990722656, "global_step": 242941, "epoch": 2927} {"train_loss": -24.6475830078125, "global_step": 242942, "epoch": 2927} {"train_loss": -24.22247314453125, "global_step": 242943, "epoch": 2927} {"train_loss": -24.336320877075195, "global_step": 242944, "epoch": 2927} {"train_loss": -24.71550941467285, "global_step": 242945, "epoch": 2927} {"train_loss": -24.567808151245117, "global_step": 242946, "epoch": 2927} {"train_loss": -24.60788345336914, "global_step": 242947, "epoch": 2927} {"train_loss": -24.378747940063477, "global_step": 242948, "epoch": 2927} {"train_loss": -24.693572998046875, "global_step": 242949, "epoch": 2927} {"train_loss": -24.54046058654785, "global_step": 242950, "epoch": 2927} {"train_loss": -24.510936737060547, "global_step": 242951, "epoch": 2927} {"train_loss": -24.67555046081543, "global_step": 242952, "epoch": 2927} {"train_loss": -24.76816749572754, "global_step": 242953, "epoch": 2927} {"train_loss": -24.354394912719727, "global_step": 242954, "epoch": 2927} {"train_loss": -25.048738479614258, "global_step": 242955, "epoch": 2927} {"train_loss": -24.615453720092773, "global_step": 242956, "epoch": 2927} {"train_loss": -24.647611618041992, "global_step": 242957, "epoch": 2927} {"train_loss": -25.091413497924805, "global_step": 242958, "epoch": 2927} {"train_loss": -24.5966739654541, "global_step": 242959, "epoch": 2927} {"train_loss": -24.710851669311523, "global_step": 242960, "epoch": 2927} {"train_loss": -24.705459594726562, "global_step": 242961, "epoch": 2927} {"train_loss": -24.639957427978516, "global_step": 242962, "epoch": 2927} {"train_loss": -24.57785415649414, "global_step": 242963, "epoch": 2927} {"train_loss": -24.960956573486328, "global_step": 242964, "epoch": 2927} {"train_loss": -24.913536071777344, "global_step": 242965, "epoch": 2927} {"train_loss": -24.985252380371094, "global_step": 242966, "epoch": 2927} {"train_loss": -25.294788360595703, "global_step": 242967, "epoch": 2927} {"train_loss": -24.68408203125, "global_step": 242968, "epoch": 2927} {"train_loss": -24.894302368164062, "global_step": 242969, "epoch": 2927} {"train_loss": -24.749731063842773, "global_step": 242970, "epoch": 2927} {"train_loss": -24.740747451782227, "global_step": 242971, "epoch": 2927} {"train_loss": -24.34537124633789, "global_step": 242972, "epoch": 2927} {"train_loss": -24.754337310791016, "global_step": 242973, "epoch": 2927} {"train_loss": -25.174182891845703, "global_step": 242974, "epoch": 2927} {"train_loss": -25.076553344726562, "global_step": 242975, "epoch": 2927} {"train_loss": -24.850263595581055, "global_step": 242976, "epoch": 2927} {"train_loss": -24.703441619873047, "global_step": 242977, "epoch": 2927} {"train_loss": -24.895606994628906, "global_step": 242978, "epoch": 2927} {"train_loss": -24.828886032104492, "global_step": 242979, "epoch": 2927} {"train_loss": -24.710630416870117, "global_step": 242980, "epoch": 2927} {"train_loss": -24.714372634887695, "global_step": 242981, "epoch": 2927} {"train_loss": -24.77435874938965, "global_step": 242982, "epoch": 2927} {"train_loss": -25.162357330322266, "global_step": 242983, "epoch": 2927} {"train_loss": -24.846237182617188, "global_step": 242984, "epoch": 2927} {"train_loss": -25.218852996826172, "global_step": 242985, "epoch": 2927} {"train_loss": -24.710969924926758, "global_step": 242986, "epoch": 2927} {"train_loss": -25.469343185424805, "global_step": 242987, "epoch": 2927} {"train_loss": -25.097816467285156, "global_step": 242988, "epoch": 2927} {"train_loss": -25.0595645904541, "global_step": 242989, "epoch": 2927} {"train_loss": -25.220779418945312, "global_step": 242990, "epoch": 2927} {"train_loss": -25.02113914489746, "global_step": 242991, "epoch": 2927} {"train_loss": -25.05616569519043, "global_step": 242992, "epoch": 2927} {"train_loss": -25.0181827545166, "global_step": 242993, "epoch": 2927} {"train_loss": -24.759212493896484, "global_step": 242994, "epoch": 2927} {"train_loss": -25.042734146118164, "global_step": 242995, "epoch": 2927} {"train_loss": -25.110776901245117, "global_step": 242996, "epoch": 2927} {"train_loss": -25.10670280456543, "global_step": 242997, "epoch": 2927} {"train_loss": -24.756681442260742, "global_step": 242998, "epoch": 2927} {"train_loss": -25.34396743774414, "global_step": 242999, "epoch": 2927} {"train_loss": -24.854734420776367, "global_step": 243000, "epoch": 2927} {"train_loss": -24.88840103149414, "global_step": 243001, "epoch": 2927} {"train_loss": -24.828144073486328, "global_step": 243002, "epoch": 2927} {"train_loss": -24.989852905273438, "global_step": 243003, "epoch": 2927} {"train_loss": -24.967599868774414, "global_step": 243004, "epoch": 2927} {"train_loss": -24.70928955078125, "global_step": 243005, "epoch": 2927} {"train_loss": -25.20088768005371, "global_step": 243006, "epoch": 2927} {"train_loss": -24.856616973876953, "global_step": 243007, "epoch": 2927} {"train_loss": -25.032514572143555, "global_step": 243008, "epoch": 2927} {"train_loss": -25.170013427734375, "global_step": 243009, "epoch": 2927} {"train_loss": -24.730688095092773, "global_step": 243010, "epoch": 2927} {"train_loss": -24.97980499267578, "global_step": 243011, "epoch": 2927} {"train_loss": -24.830814361572266, "global_step": 243012, "epoch": 2927} {"train_loss": -24.7988338470459, "global_step": 243013, "epoch": 2927} {"train_loss": -24.748138427734375, "global_step": 243014, "epoch": 2927} {"train_loss": -24.849496841430664, "global_step": 243015, "epoch": 2927} {"train_loss": -24.890220642089844, "global_step": 243016, "epoch": 2927} {"train_loss": -24.84865379333496, "global_step": 243017, "epoch": 2927} {"train_loss": -24.815324783325195, "global_step": 243018, "epoch": 2927} {"train_loss": -24.870040893554688, "global_step": 243019, "epoch": 2927} {"train_loss": -24.946340560913086, "global_step": 243020, "epoch": 2927} {"train_loss": -25.23177146911621, "global_step": 243021, "epoch": 2927} {"train_loss": -24.830556869506836, "global_step": 243022, "epoch": 2927} {"train_loss": -24.842063352286097, "global_step": 243023, "epoch": 2927, "val_loss": 6890116.0} {"train_loss": -23.1326961517334, "global_step": 243024, "epoch": 2928} {"train_loss": -23.322711944580078, "global_step": 243025, "epoch": 2928} {"train_loss": -23.816396713256836, "global_step": 243026, "epoch": 2928} {"train_loss": -23.633020401000977, "global_step": 243027, "epoch": 2928} {"train_loss": -23.881866455078125, "global_step": 243028, "epoch": 2928} {"train_loss": -23.73993682861328, "global_step": 243029, "epoch": 2928} {"train_loss": -23.849143981933594, "global_step": 243030, "epoch": 2928} {"train_loss": -24.291879653930664, "global_step": 243031, "epoch": 2928} {"train_loss": -24.305908203125, "global_step": 243032, "epoch": 2928} {"train_loss": -24.70011329650879, "global_step": 243033, "epoch": 2928} {"train_loss": -24.51227378845215, "global_step": 243034, "epoch": 2928} {"train_loss": -24.355634689331055, "global_step": 243035, "epoch": 2928} {"train_loss": -24.347326278686523, "global_step": 243036, "epoch": 2928} {"train_loss": -24.404048919677734, "global_step": 243037, "epoch": 2928} {"train_loss": -24.2124080657959, "global_step": 243038, "epoch": 2928} {"train_loss": -24.39041519165039, "global_step": 243039, "epoch": 2928} {"train_loss": -24.514610290527344, "global_step": 243040, "epoch": 2928} {"train_loss": -24.4866886138916, "global_step": 243041, "epoch": 2928} {"train_loss": -24.49217414855957, "global_step": 243042, "epoch": 2928} {"train_loss": -24.511112213134766, "global_step": 243043, "epoch": 2928} {"train_loss": -24.393278121948242, "global_step": 243044, "epoch": 2928} {"train_loss": -24.444181442260742, "global_step": 243045, "epoch": 2928} {"train_loss": -24.560171127319336, "global_step": 243046, "epoch": 2928} {"train_loss": -24.53977394104004, "global_step": 243047, "epoch": 2928} {"train_loss": -24.867311477661133, "global_step": 243048, "epoch": 2928} {"train_loss": -24.790719985961914, "global_step": 243049, "epoch": 2928} {"train_loss": -24.858291625976562, "global_step": 243050, "epoch": 2928} {"train_loss": -25.05293846130371, "global_step": 243051, "epoch": 2928} {"train_loss": -24.357376098632812, "global_step": 243052, "epoch": 2928} {"train_loss": -24.97246742248535, "global_step": 243053, "epoch": 2928} {"train_loss": -24.820621490478516, "global_step": 243054, "epoch": 2928} {"train_loss": -25.023008346557617, "global_step": 243055, "epoch": 2928} {"train_loss": -24.307987213134766, "global_step": 243056, "epoch": 2928} {"train_loss": -25.102542877197266, "global_step": 243057, "epoch": 2928} {"train_loss": -24.513782501220703, "global_step": 243058, "epoch": 2928} {"train_loss": -25.134319305419922, "global_step": 243059, "epoch": 2928} {"train_loss": -24.886287689208984, "global_step": 243060, "epoch": 2928} {"train_loss": -24.891372680664062, "global_step": 243061, "epoch": 2928} {"train_loss": -24.863330841064453, "global_step": 243062, "epoch": 2928} {"train_loss": -24.331222534179688, "global_step": 243063, "epoch": 2928} {"train_loss": -24.418672561645508, "global_step": 243064, "epoch": 2928} {"train_loss": -24.75998878479004, "global_step": 243065, "epoch": 2928} {"train_loss": -24.672821044921875, "global_step": 243066, "epoch": 2928} {"train_loss": -24.719308853149414, "global_step": 243067, "epoch": 2928} {"train_loss": -24.634883880615234, "global_step": 243068, "epoch": 2928} {"train_loss": -25.038471221923828, "global_step": 243069, "epoch": 2928} {"train_loss": -24.52168846130371, "global_step": 243070, "epoch": 2928} {"train_loss": -24.81251335144043, "global_step": 243071, "epoch": 2928} {"train_loss": -25.02402687072754, "global_step": 243072, "epoch": 2928} {"train_loss": -25.0537166595459, "global_step": 243073, "epoch": 2928} {"train_loss": -24.793298721313477, "global_step": 243074, "epoch": 2928} {"train_loss": -25.102802276611328, "global_step": 243075, "epoch": 2928} {"train_loss": -24.810575485229492, "global_step": 243076, "epoch": 2928} {"train_loss": -24.684986114501953, "global_step": 243077, "epoch": 2928} {"train_loss": -25.09208106994629, "global_step": 243078, "epoch": 2928} {"train_loss": -25.098709106445312, "global_step": 243079, "epoch": 2928} {"train_loss": -24.712020874023438, "global_step": 243080, "epoch": 2928} {"train_loss": -25.058820724487305, "global_step": 243081, "epoch": 2928} {"train_loss": -25.055593490600586, "global_step": 243082, "epoch": 2928} {"train_loss": -25.346466064453125, "global_step": 243083, "epoch": 2928} {"train_loss": -25.489606857299805, "global_step": 243084, "epoch": 2928} {"train_loss": -25.04714584350586, "global_step": 243085, "epoch": 2928} {"train_loss": -24.859771728515625, "global_step": 243086, "epoch": 2928} {"train_loss": -25.069137573242188, "global_step": 243087, "epoch": 2928} {"train_loss": -25.02262306213379, "global_step": 243088, "epoch": 2928} {"train_loss": -25.210969924926758, "global_step": 243089, "epoch": 2928} {"train_loss": -25.23499870300293, "global_step": 243090, "epoch": 2928} {"train_loss": -25.157285690307617, "global_step": 243091, "epoch": 2928} {"train_loss": -24.460538864135742, "global_step": 243092, "epoch": 2928} {"train_loss": -24.59337043762207, "global_step": 243093, "epoch": 2928} {"train_loss": -24.803647994995117, "global_step": 243094, "epoch": 2928} {"train_loss": -25.026247024536133, "global_step": 243095, "epoch": 2928} {"train_loss": -24.97702980041504, "global_step": 243096, "epoch": 2928} {"train_loss": -24.59656524658203, "global_step": 243097, "epoch": 2928} {"train_loss": -24.75387191772461, "global_step": 243098, "epoch": 2928} {"train_loss": -25.079038619995117, "global_step": 243099, "epoch": 2928} {"train_loss": -24.9731388092041, "global_step": 243100, "epoch": 2928} {"train_loss": -25.039945602416992, "global_step": 243101, "epoch": 2928} {"train_loss": -24.97529411315918, "global_step": 243102, "epoch": 2928} {"train_loss": -25.027570724487305, "global_step": 243103, "epoch": 2928} {"train_loss": -25.174972534179688, "global_step": 243104, "epoch": 2928} {"train_loss": -25.02467155456543, "global_step": 243105, "epoch": 2928} {"train_loss": -24.678407002644366, "global_step": 243106, "epoch": 2928, "val_loss": 6831928.0} {"train_loss": -23.7574462890625, "global_step": 243107, "epoch": 2929} {"train_loss": -24.307218551635742, "global_step": 243108, "epoch": 2929} {"train_loss": -24.659223556518555, "global_step": 243109, "epoch": 2929} {"train_loss": -24.25140380859375, "global_step": 243110, "epoch": 2929} {"train_loss": -24.50958251953125, "global_step": 243111, "epoch": 2929} {"train_loss": -24.673702239990234, "global_step": 243112, "epoch": 2929} {"train_loss": -24.206584930419922, "global_step": 243113, "epoch": 2929} {"train_loss": -24.12338638305664, "global_step": 243114, "epoch": 2929} {"train_loss": -24.50009536743164, "global_step": 243115, "epoch": 2929} {"train_loss": -24.683073043823242, "global_step": 243116, "epoch": 2929} {"train_loss": -24.073272705078125, "global_step": 243117, "epoch": 2929} {"train_loss": -24.546350479125977, "global_step": 243118, "epoch": 2929} {"train_loss": -24.693952560424805, "global_step": 243119, "epoch": 2929} {"train_loss": -24.706520080566406, "global_step": 243120, "epoch": 2929} {"train_loss": -24.794147491455078, "global_step": 243121, "epoch": 2929} {"train_loss": -24.4653377532959, "global_step": 243122, "epoch": 2929} {"train_loss": -24.767560958862305, "global_step": 243123, "epoch": 2929} {"train_loss": -24.464773178100586, "global_step": 243124, "epoch": 2929} {"train_loss": -24.740026473999023, "global_step": 243125, "epoch": 2929} {"train_loss": -24.98470115661621, "global_step": 243126, "epoch": 2929} {"train_loss": -25.097949981689453, "global_step": 243127, "epoch": 2929} {"train_loss": -24.662160873413086, "global_step": 243128, "epoch": 2929} {"train_loss": -24.635299682617188, "global_step": 243129, "epoch": 2929} {"train_loss": -24.840341567993164, "global_step": 243130, "epoch": 2929} {"train_loss": -24.679824829101562, "global_step": 243131, "epoch": 2929} {"train_loss": -24.6866512298584, "global_step": 243132, "epoch": 2929} {"train_loss": -24.72614097595215, "global_step": 243133, "epoch": 2929} {"train_loss": -24.910062789916992, "global_step": 243134, "epoch": 2929} {"train_loss": -24.49495506286621, "global_step": 243135, "epoch": 2929} {"train_loss": -24.97220230102539, "global_step": 243136, "epoch": 2929} {"train_loss": -24.772174835205078, "global_step": 243137, "epoch": 2929} {"train_loss": -24.871530532836914, "global_step": 243138, "epoch": 2929} {"train_loss": -24.76345443725586, "global_step": 243139, "epoch": 2929} {"train_loss": -25.034875869750977, "global_step": 243140, "epoch": 2929} {"train_loss": -24.794313430786133, "global_step": 243141, "epoch": 2929} {"train_loss": -25.034345626831055, "global_step": 243142, "epoch": 2929} {"train_loss": -24.686416625976562, "global_step": 243143, "epoch": 2929} {"train_loss": -24.307462692260742, "global_step": 243144, "epoch": 2929} {"train_loss": -24.622268676757812, "global_step": 243145, "epoch": 2929} {"train_loss": -24.91415786743164, "global_step": 243146, "epoch": 2929} {"train_loss": -24.937726974487305, "global_step": 243147, "epoch": 2929} {"train_loss": -25.459409713745117, "global_step": 243148, "epoch": 2929} {"train_loss": -24.517736434936523, "global_step": 243149, "epoch": 2929} {"train_loss": -24.5681209564209, "global_step": 243150, "epoch": 2929} {"train_loss": -24.692779541015625, "global_step": 243151, "epoch": 2929} {"train_loss": -24.94646453857422, "global_step": 243152, "epoch": 2929} {"train_loss": -24.962202072143555, "global_step": 243153, "epoch": 2929} {"train_loss": -25.253026962280273, "global_step": 243154, "epoch": 2929} {"train_loss": -25.4035701751709, "global_step": 243155, "epoch": 2929} {"train_loss": -25.186155319213867, "global_step": 243156, "epoch": 2929} {"train_loss": -25.205625534057617, "global_step": 243157, "epoch": 2929} {"train_loss": -25.2628173828125, "global_step": 243158, "epoch": 2929} {"train_loss": -24.983121871948242, "global_step": 243159, "epoch": 2929} {"train_loss": -25.492422103881836, "global_step": 243160, "epoch": 2929} {"train_loss": -24.931903839111328, "global_step": 243161, "epoch": 2929} {"train_loss": -25.231359481811523, "global_step": 243162, "epoch": 2929} {"train_loss": -25.056354522705078, "global_step": 243163, "epoch": 2929} {"train_loss": -25.013208389282227, "global_step": 243164, "epoch": 2929} {"train_loss": -24.759136199951172, "global_step": 243165, "epoch": 2929} {"train_loss": -25.089868545532227, "global_step": 243166, "epoch": 2929} {"train_loss": -25.160755157470703, "global_step": 243167, "epoch": 2929} {"train_loss": -25.12067985534668, "global_step": 243168, "epoch": 2929} {"train_loss": -24.959814071655273, "global_step": 243169, "epoch": 2929} {"train_loss": -24.91541290283203, "global_step": 243170, "epoch": 2929} {"train_loss": -24.681760787963867, "global_step": 243171, "epoch": 2929} {"train_loss": -25.016220092773438, "global_step": 243172, "epoch": 2929} {"train_loss": -25.099903106689453, "global_step": 243173, "epoch": 2929} {"train_loss": -24.80704116821289, "global_step": 243174, "epoch": 2929} {"train_loss": -25.039648056030273, "global_step": 243175, "epoch": 2929} {"train_loss": -24.926538467407227, "global_step": 243176, "epoch": 2929} {"train_loss": -24.723180770874023, "global_step": 243177, "epoch": 2929} {"train_loss": -24.921655654907227, "global_step": 243178, "epoch": 2929} {"train_loss": -24.667036056518555, "global_step": 243179, "epoch": 2929} {"train_loss": -25.079526901245117, "global_step": 243180, "epoch": 2929} {"train_loss": -24.49375343322754, "global_step": 243181, "epoch": 2929} {"train_loss": -24.617603302001953, "global_step": 243182, "epoch": 2929} {"train_loss": -24.989749908447266, "global_step": 243183, "epoch": 2929} {"train_loss": -24.79323387145996, "global_step": 243184, "epoch": 2929} {"train_loss": -24.8115177154541, "global_step": 243185, "epoch": 2929} {"train_loss": -25.054649353027344, "global_step": 243186, "epoch": 2929} {"train_loss": -24.821226119995117, "global_step": 243187, "epoch": 2929} {"train_loss": -24.82465171813965, "global_step": 243188, "epoch": 2929} {"train_loss": -24.801742944372705, "global_step": 243189, "epoch": 2929, "val_loss": 6926006.0} {"train_loss": -24.153371810913086, "global_step": 243190, "epoch": 2930} {"train_loss": -23.9691219329834, "global_step": 243191, "epoch": 2930} {"train_loss": -24.108196258544922, "global_step": 243192, "epoch": 2930} {"train_loss": -24.488698959350586, "global_step": 243193, "epoch": 2930} {"train_loss": -24.014129638671875, "global_step": 243194, "epoch": 2930} {"train_loss": -24.281808853149414, "global_step": 243195, "epoch": 2930} {"train_loss": -24.7952880859375, "global_step": 243196, "epoch": 2930} {"train_loss": -23.958463668823242, "global_step": 243197, "epoch": 2930} {"train_loss": -23.704015731811523, "global_step": 243198, "epoch": 2930} {"train_loss": -24.222064971923828, "global_step": 243199, "epoch": 2930} {"train_loss": -24.577672958374023, "global_step": 243200, "epoch": 2930} {"train_loss": -24.62310791015625, "global_step": 243201, "epoch": 2930} {"train_loss": -24.200950622558594, "global_step": 243202, "epoch": 2930} {"train_loss": -24.175554275512695, "global_step": 243203, "epoch": 2930} {"train_loss": -24.289335250854492, "global_step": 243204, "epoch": 2930} {"train_loss": -24.2591495513916, "global_step": 243205, "epoch": 2930} {"train_loss": -24.471403121948242, "global_step": 243206, "epoch": 2930} {"train_loss": -23.9971866607666, "global_step": 243207, "epoch": 2930} {"train_loss": -24.427169799804688, "global_step": 243208, "epoch": 2930} {"train_loss": -24.697608947753906, "global_step": 243209, "epoch": 2930} {"train_loss": -24.503263473510742, "global_step": 243210, "epoch": 2930} {"train_loss": -24.572357177734375, "global_step": 243211, "epoch": 2930} {"train_loss": -24.64650535583496, "global_step": 243212, "epoch": 2930} {"train_loss": -24.863454818725586, "global_step": 243213, "epoch": 2930} {"train_loss": -24.533578872680664, "global_step": 243214, "epoch": 2930} {"train_loss": -24.81139373779297, "global_step": 243215, "epoch": 2930} {"train_loss": -24.869321823120117, "global_step": 243216, "epoch": 2930} {"train_loss": -24.66566276550293, "global_step": 243217, "epoch": 2930} {"train_loss": -25.174299240112305, "global_step": 243218, "epoch": 2930} {"train_loss": -24.6780948638916, "global_step": 243219, "epoch": 2930} {"train_loss": -24.70467185974121, "global_step": 243220, "epoch": 2930} {"train_loss": -24.895448684692383, "global_step": 243221, "epoch": 2930} {"train_loss": -24.661718368530273, "global_step": 243222, "epoch": 2930} {"train_loss": -24.771451950073242, "global_step": 243223, "epoch": 2930} {"train_loss": -25.06839942932129, "global_step": 243224, "epoch": 2930} {"train_loss": -24.623029708862305, "global_step": 243225, "epoch": 2930} {"train_loss": -25.283552169799805, "global_step": 243226, "epoch": 2930} {"train_loss": -24.6810359954834, "global_step": 243227, "epoch": 2930} {"train_loss": -24.71555519104004, "global_step": 243228, "epoch": 2930} {"train_loss": -25.302644729614258, "global_step": 243229, "epoch": 2930} {"train_loss": -24.595502853393555, "global_step": 243230, "epoch": 2930} {"train_loss": -24.783233642578125, "global_step": 243231, "epoch": 2930} {"train_loss": -25.165752410888672, "global_step": 243232, "epoch": 2930} {"train_loss": -25.02931785583496, "global_step": 243233, "epoch": 2930} {"train_loss": -25.312116622924805, "global_step": 243234, "epoch": 2930} {"train_loss": -25.050216674804688, "global_step": 243235, "epoch": 2930} {"train_loss": -24.981536865234375, "global_step": 243236, "epoch": 2930} {"train_loss": -24.764989852905273, "global_step": 243237, "epoch": 2930} {"train_loss": -25.280094146728516, "global_step": 243238, "epoch": 2930} {"train_loss": -24.967361450195312, "global_step": 243239, "epoch": 2930} {"train_loss": -25.114505767822266, "global_step": 243240, "epoch": 2930} {"train_loss": -25.4300537109375, "global_step": 243241, "epoch": 2930} {"train_loss": -25.05132484436035, "global_step": 243242, "epoch": 2930} {"train_loss": -25.357545852661133, "global_step": 243243, "epoch": 2930} {"train_loss": -24.889423370361328, "global_step": 243244, "epoch": 2930} {"train_loss": -25.032926559448242, "global_step": 243245, "epoch": 2930} {"train_loss": -25.311450958251953, "global_step": 243246, "epoch": 2930} {"train_loss": -24.06268882751465, "global_step": 243247, "epoch": 2930} {"train_loss": -24.638792037963867, "global_step": 243248, "epoch": 2930} {"train_loss": -25.14987564086914, "global_step": 243249, "epoch": 2930} {"train_loss": -25.352264404296875, "global_step": 243250, "epoch": 2930} {"train_loss": -25.030397415161133, "global_step": 243251, "epoch": 2930} {"train_loss": -24.673166275024414, "global_step": 243252, "epoch": 2930} {"train_loss": -24.542678833007812, "global_step": 243253, "epoch": 2930} {"train_loss": -24.782583236694336, "global_step": 243254, "epoch": 2930} {"train_loss": -25.13323211669922, "global_step": 243255, "epoch": 2930} {"train_loss": -25.00520133972168, "global_step": 243256, "epoch": 2930} {"train_loss": -24.919788360595703, "global_step": 243257, "epoch": 2930} {"train_loss": -24.855857849121094, "global_step": 243258, "epoch": 2930} {"train_loss": -24.7340145111084, "global_step": 243259, "epoch": 2930} {"train_loss": -25.157529830932617, "global_step": 243260, "epoch": 2930} {"train_loss": -24.831558227539062, "global_step": 243261, "epoch": 2930} {"train_loss": -24.60550308227539, "global_step": 243262, "epoch": 2930} {"train_loss": -24.978015899658203, "global_step": 243263, "epoch": 2930} {"train_loss": -24.616239547729492, "global_step": 243264, "epoch": 2930} {"train_loss": -24.505491256713867, "global_step": 243265, "epoch": 2930} {"train_loss": -24.923748016357422, "global_step": 243266, "epoch": 2930} {"train_loss": -24.8365478515625, "global_step": 243267, "epoch": 2930} {"train_loss": -24.148374557495117, "global_step": 243268, "epoch": 2930} {"train_loss": -25.046911239624023, "global_step": 243269, "epoch": 2930} {"train_loss": -25.194965362548828, "global_step": 243270, "epoch": 2930} {"train_loss": -24.568429946899414, "global_step": 243271, "epoch": 2930} {"train_loss": -24.72376124830131, "global_step": 243272, "epoch": 2930, "val_loss": 6803541.0} {"train_loss": -24.423480987548828, "global_step": 243273, "epoch": 2931} {"train_loss": -24.560226440429688, "global_step": 243274, "epoch": 2931} {"train_loss": -24.3070011138916, "global_step": 243275, "epoch": 2931} {"train_loss": -24.925771713256836, "global_step": 243276, "epoch": 2931} {"train_loss": -24.561391830444336, "global_step": 243277, "epoch": 2931} {"train_loss": -24.06314468383789, "global_step": 243278, "epoch": 2931} {"train_loss": -24.709848403930664, "global_step": 243279, "epoch": 2931} {"train_loss": -24.49774742126465, "global_step": 243280, "epoch": 2931} {"train_loss": -24.68008041381836, "global_step": 243281, "epoch": 2931} {"train_loss": -24.357860565185547, "global_step": 243282, "epoch": 2931} {"train_loss": -24.549171447753906, "global_step": 243283, "epoch": 2931} {"train_loss": -24.882476806640625, "global_step": 243284, "epoch": 2931} {"train_loss": -24.71283721923828, "global_step": 243285, "epoch": 2931} {"train_loss": -24.82681655883789, "global_step": 243286, "epoch": 2931} {"train_loss": -24.7537899017334, "global_step": 243287, "epoch": 2931} {"train_loss": -24.981943130493164, "global_step": 243288, "epoch": 2931} {"train_loss": -24.83485984802246, "global_step": 243289, "epoch": 2931} {"train_loss": -24.626005172729492, "global_step": 243290, "epoch": 2931} {"train_loss": -24.998308181762695, "global_step": 243291, "epoch": 2931} {"train_loss": -24.79108238220215, "global_step": 243292, "epoch": 2931} {"train_loss": -25.25935173034668, "global_step": 243293, "epoch": 2931} {"train_loss": -25.02941131591797, "global_step": 243294, "epoch": 2931} {"train_loss": -25.368955612182617, "global_step": 243295, "epoch": 2931} {"train_loss": -24.877676010131836, "global_step": 243296, "epoch": 2931} {"train_loss": -25.305606842041016, "global_step": 243297, "epoch": 2931} {"train_loss": -25.052709579467773, "global_step": 243298, "epoch": 2931} {"train_loss": -25.241384506225586, "global_step": 243299, "epoch": 2931} {"train_loss": -25.14234733581543, "global_step": 243300, "epoch": 2931} {"train_loss": -24.8336181640625, "global_step": 243301, "epoch": 2931} {"train_loss": -25.145004272460938, "global_step": 243302, "epoch": 2931} {"train_loss": -24.748937606811523, "global_step": 243303, "epoch": 2931} {"train_loss": -24.90214729309082, "global_step": 243304, "epoch": 2931} {"train_loss": -24.79926872253418, "global_step": 243305, "epoch": 2931} {"train_loss": -24.89676284790039, "global_step": 243306, "epoch": 2931} {"train_loss": -25.078344345092773, "global_step": 243307, "epoch": 2931} {"train_loss": -24.726179122924805, "global_step": 243308, "epoch": 2931} {"train_loss": -25.067373275756836, "global_step": 243309, "epoch": 2931} {"train_loss": -25.09585189819336, "global_step": 243310, "epoch": 2931} {"train_loss": -24.983583450317383, "global_step": 243311, "epoch": 2931} {"train_loss": -25.145397186279297, "global_step": 243312, "epoch": 2931} {"train_loss": -24.950393676757812, "global_step": 243313, "epoch": 2931} {"train_loss": -24.84137535095215, "global_step": 243314, "epoch": 2931} {"train_loss": -25.061861038208008, "global_step": 243315, "epoch": 2931} {"train_loss": -24.900968551635742, "global_step": 243316, "epoch": 2931} {"train_loss": -24.994613647460938, "global_step": 243317, "epoch": 2931} {"train_loss": -24.81580924987793, "global_step": 243318, "epoch": 2931} {"train_loss": -24.938701629638672, "global_step": 243319, "epoch": 2931} {"train_loss": -24.713333129882812, "global_step": 243320, "epoch": 2931} {"train_loss": -24.87660026550293, "global_step": 243321, "epoch": 2931} {"train_loss": -24.454181671142578, "global_step": 243322, "epoch": 2931} {"train_loss": -24.206378936767578, "global_step": 243323, "epoch": 2931} {"train_loss": -24.596712112426758, "global_step": 243324, "epoch": 2931} {"train_loss": -24.59213638305664, "global_step": 243325, "epoch": 2931} {"train_loss": -24.990127563476562, "global_step": 243326, "epoch": 2931} {"train_loss": -24.70597267150879, "global_step": 243327, "epoch": 2931} {"train_loss": -24.94264793395996, "global_step": 243328, "epoch": 2931} {"train_loss": -24.996854782104492, "global_step": 243329, "epoch": 2931} {"train_loss": -24.766010284423828, "global_step": 243330, "epoch": 2931} {"train_loss": -25.409320831298828, "global_step": 243331, "epoch": 2931} {"train_loss": -24.944807052612305, "global_step": 243332, "epoch": 2931} {"train_loss": -24.43295669555664, "global_step": 243333, "epoch": 2931} {"train_loss": -25.065183639526367, "global_step": 243334, "epoch": 2931} {"train_loss": -25.317081451416016, "global_step": 243335, "epoch": 2931} {"train_loss": -24.691953659057617, "global_step": 243336, "epoch": 2931} {"train_loss": -24.88031578063965, "global_step": 243337, "epoch": 2931} {"train_loss": -25.26409339904785, "global_step": 243338, "epoch": 2931} {"train_loss": -24.96012306213379, "global_step": 243339, "epoch": 2931} {"train_loss": -24.436635971069336, "global_step": 243340, "epoch": 2931} {"train_loss": -24.96974754333496, "global_step": 243341, "epoch": 2931} {"train_loss": -25.287809371948242, "global_step": 243342, "epoch": 2931} {"train_loss": -25.232807159423828, "global_step": 243343, "epoch": 2931} {"train_loss": -24.983617782592773, "global_step": 243344, "epoch": 2931} {"train_loss": -24.993131637573242, "global_step": 243345, "epoch": 2931} {"train_loss": -25.029455184936523, "global_step": 243346, "epoch": 2931} {"train_loss": -24.727331161499023, "global_step": 243347, "epoch": 2931} {"train_loss": -25.070621490478516, "global_step": 243348, "epoch": 2931} {"train_loss": -25.222043991088867, "global_step": 243349, "epoch": 2931} {"train_loss": -24.562454223632812, "global_step": 243350, "epoch": 2931} {"train_loss": -25.10964012145996, "global_step": 243351, "epoch": 2931} {"train_loss": -25.04302978515625, "global_step": 243352, "epoch": 2931} {"train_loss": -24.837045669555664, "global_step": 243353, "epoch": 2931} {"train_loss": -24.885074615478516, "global_step": 243354, "epoch": 2931} {"train_loss": -24.879094043409967, "global_step": 243355, "epoch": 2931, "val_loss": 6817826.0} {"train_loss": -23.543258666992188, "global_step": 243356, "epoch": 2932} {"train_loss": -23.898508071899414, "global_step": 243357, "epoch": 2932} {"train_loss": -23.874521255493164, "global_step": 243358, "epoch": 2932} {"train_loss": -23.991361618041992, "global_step": 243359, "epoch": 2932} {"train_loss": -24.323505401611328, "global_step": 243360, "epoch": 2932} {"train_loss": -24.14517593383789, "global_step": 243361, "epoch": 2932} {"train_loss": -24.449140548706055, "global_step": 243362, "epoch": 2932} {"train_loss": -24.094741821289062, "global_step": 243363, "epoch": 2932} {"train_loss": -24.38553237915039, "global_step": 243364, "epoch": 2932} {"train_loss": -24.37318992614746, "global_step": 243365, "epoch": 2932} {"train_loss": -24.3028564453125, "global_step": 243366, "epoch": 2932} {"train_loss": -24.661970138549805, "global_step": 243367, "epoch": 2932} {"train_loss": -24.17091941833496, "global_step": 243368, "epoch": 2932} {"train_loss": -24.259550094604492, "global_step": 243369, "epoch": 2932} {"train_loss": -24.176652908325195, "global_step": 243370, "epoch": 2932} {"train_loss": -24.297677993774414, "global_step": 243371, "epoch": 2932} {"train_loss": -24.272045135498047, "global_step": 243372, "epoch": 2932} {"train_loss": -24.42293357849121, "global_step": 243373, "epoch": 2932} {"train_loss": -24.646894454956055, "global_step": 243374, "epoch": 2932} {"train_loss": -24.63431167602539, "global_step": 243375, "epoch": 2932} {"train_loss": -24.432601928710938, "global_step": 243376, "epoch": 2932} {"train_loss": -24.5101318359375, "global_step": 243377, "epoch": 2932} {"train_loss": -24.2667236328125, "global_step": 243378, "epoch": 2932} {"train_loss": -24.61359214782715, "global_step": 243379, "epoch": 2932} {"train_loss": -24.394678115844727, "global_step": 243380, "epoch": 2932} {"train_loss": -24.556440353393555, "global_step": 243381, "epoch": 2932} {"train_loss": -24.669235229492188, "global_step": 243382, "epoch": 2932} {"train_loss": -24.886762619018555, "global_step": 243383, "epoch": 2932} {"train_loss": -24.678083419799805, "global_step": 243384, "epoch": 2932} {"train_loss": -24.721790313720703, "global_step": 243385, "epoch": 2932} {"train_loss": -24.531503677368164, "global_step": 243386, "epoch": 2932} {"train_loss": -24.754806518554688, "global_step": 243387, "epoch": 2932} {"train_loss": -24.59588623046875, "global_step": 243388, "epoch": 2932} {"train_loss": -24.72310447692871, "global_step": 243389, "epoch": 2932} {"train_loss": -24.683774948120117, "global_step": 243390, "epoch": 2932} {"train_loss": -25.153440475463867, "global_step": 243391, "epoch": 2932} {"train_loss": -24.942108154296875, "global_step": 243392, "epoch": 2932} {"train_loss": -25.04027557373047, "global_step": 243393, "epoch": 2932} {"train_loss": -24.970712661743164, "global_step": 243394, "epoch": 2932} {"train_loss": -24.850576400756836, "global_step": 243395, "epoch": 2932} {"train_loss": -25.22494888305664, "global_step": 243396, "epoch": 2932} {"train_loss": -25.03509521484375, "global_step": 243397, "epoch": 2932} {"train_loss": -24.782480239868164, "global_step": 243398, "epoch": 2932} {"train_loss": -24.47171401977539, "global_step": 243399, "epoch": 2932} {"train_loss": -25.031248092651367, "global_step": 243400, "epoch": 2932} {"train_loss": -25.15801429748535, "global_step": 243401, "epoch": 2932} {"train_loss": -24.878585815429688, "global_step": 243402, "epoch": 2932} {"train_loss": -24.639907836914062, "global_step": 243403, "epoch": 2932} {"train_loss": -25.038684844970703, "global_step": 243404, "epoch": 2932} {"train_loss": -24.87195587158203, "global_step": 243405, "epoch": 2932} {"train_loss": -24.795225143432617, "global_step": 243406, "epoch": 2932} {"train_loss": -25.1040096282959, "global_step": 243407, "epoch": 2932} {"train_loss": -24.854610443115234, "global_step": 243408, "epoch": 2932} {"train_loss": -24.84686851501465, "global_step": 243409, "epoch": 2932} {"train_loss": -25.056913375854492, "global_step": 243410, "epoch": 2932} {"train_loss": -24.945905685424805, "global_step": 243411, "epoch": 2932} {"train_loss": -24.522336959838867, "global_step": 243412, "epoch": 2932} {"train_loss": -25.075809478759766, "global_step": 243413, "epoch": 2932} {"train_loss": -25.053525924682617, "global_step": 243414, "epoch": 2932} {"train_loss": -25.31548500061035, "global_step": 243415, "epoch": 2932} {"train_loss": -25.081281661987305, "global_step": 243416, "epoch": 2932} {"train_loss": -25.3830623626709, "global_step": 243417, "epoch": 2932} {"train_loss": -25.214866638183594, "global_step": 243418, "epoch": 2932} {"train_loss": -25.074005126953125, "global_step": 243419, "epoch": 2932} {"train_loss": -25.135629653930664, "global_step": 243420, "epoch": 2932} {"train_loss": -24.831388473510742, "global_step": 243421, "epoch": 2932} {"train_loss": -24.88153648376465, "global_step": 243422, "epoch": 2932} {"train_loss": -24.924604415893555, "global_step": 243423, "epoch": 2932} {"train_loss": -24.983121871948242, "global_step": 243424, "epoch": 2932} {"train_loss": -24.893924713134766, "global_step": 243425, "epoch": 2932} {"train_loss": -25.208255767822266, "global_step": 243426, "epoch": 2932} {"train_loss": -24.92983055114746, "global_step": 243427, "epoch": 2932} {"train_loss": -25.034677505493164, "global_step": 243428, "epoch": 2932} {"train_loss": -24.772897720336914, "global_step": 243429, "epoch": 2932} {"train_loss": -24.854358673095703, "global_step": 243430, "epoch": 2932} {"train_loss": -24.65373420715332, "global_step": 243431, "epoch": 2932} {"train_loss": -25.200395584106445, "global_step": 243432, "epoch": 2932} {"train_loss": -24.952791213989258, "global_step": 243433, "epoch": 2932} {"train_loss": -24.904111862182617, "global_step": 243434, "epoch": 2932} {"train_loss": -25.189817428588867, "global_step": 243435, "epoch": 2932} {"train_loss": -24.566879272460938, "global_step": 243436, "epoch": 2932} {"train_loss": -24.408584594726562, "global_step": 243437, "epoch": 2932} {"train_loss": -24.719327995576055, "global_step": 243438, "epoch": 2932, "val_loss": 6905561.0} {"train_loss": -23.745153427124023, "global_step": 243439, "epoch": 2933} {"train_loss": -24.179311752319336, "global_step": 243440, "epoch": 2933} {"train_loss": -24.1113338470459, "global_step": 243441, "epoch": 2933} {"train_loss": -24.38661766052246, "global_step": 243442, "epoch": 2933} {"train_loss": -24.584306716918945, "global_step": 243443, "epoch": 2933} {"train_loss": -24.1373291015625, "global_step": 243444, "epoch": 2933} {"train_loss": -24.27690315246582, "global_step": 243445, "epoch": 2933} {"train_loss": -24.637121200561523, "global_step": 243446, "epoch": 2933} {"train_loss": -24.599029541015625, "global_step": 243447, "epoch": 2933} {"train_loss": -24.55925178527832, "global_step": 243448, "epoch": 2933} {"train_loss": -24.553861618041992, "global_step": 243449, "epoch": 2933} {"train_loss": -24.617050170898438, "global_step": 243450, "epoch": 2933} {"train_loss": -24.871784210205078, "global_step": 243451, "epoch": 2933} {"train_loss": -24.570539474487305, "global_step": 243452, "epoch": 2933} {"train_loss": -24.31415557861328, "global_step": 243453, "epoch": 2933} {"train_loss": -24.910747528076172, "global_step": 243454, "epoch": 2933} {"train_loss": -24.55303955078125, "global_step": 243455, "epoch": 2933} {"train_loss": -24.646411895751953, "global_step": 243456, "epoch": 2933} {"train_loss": -24.76114273071289, "global_step": 243457, "epoch": 2933} {"train_loss": -24.441242218017578, "global_step": 243458, "epoch": 2933} {"train_loss": -24.98982810974121, "global_step": 243459, "epoch": 2933} {"train_loss": -25.444385528564453, "global_step": 243460, "epoch": 2933} {"train_loss": -24.9233341217041, "global_step": 243461, "epoch": 2933} {"train_loss": -25.149795532226562, "global_step": 243462, "epoch": 2933} {"train_loss": -25.247549057006836, "global_step": 243463, "epoch": 2933} {"train_loss": -24.764543533325195, "global_step": 243464, "epoch": 2933} {"train_loss": -24.995981216430664, "global_step": 243465, "epoch": 2933} {"train_loss": -24.658918380737305, "global_step": 243466, "epoch": 2933} {"train_loss": -24.750728607177734, "global_step": 243467, "epoch": 2933} {"train_loss": -24.844350814819336, "global_step": 243468, "epoch": 2933} {"train_loss": -25.1232852935791, "global_step": 243469, "epoch": 2933} {"train_loss": -24.547815322875977, "global_step": 243470, "epoch": 2933} {"train_loss": -24.864721298217773, "global_step": 243471, "epoch": 2933} {"train_loss": -24.64558219909668, "global_step": 243472, "epoch": 2933} {"train_loss": -25.059494018554688, "global_step": 243473, "epoch": 2933} {"train_loss": -24.991064071655273, "global_step": 243474, "epoch": 2933} {"train_loss": -25.377927780151367, "global_step": 243475, "epoch": 2933} {"train_loss": -25.07771110534668, "global_step": 243476, "epoch": 2933} {"train_loss": -24.972854614257812, "global_step": 243477, "epoch": 2933} {"train_loss": -25.02432632446289, "global_step": 243478, "epoch": 2933} {"train_loss": -24.975183486938477, "global_step": 243479, "epoch": 2933} {"train_loss": -24.892303466796875, "global_step": 243480, "epoch": 2933} {"train_loss": -24.86158561706543, "global_step": 243481, "epoch": 2933} {"train_loss": -24.899656295776367, "global_step": 243482, "epoch": 2933} {"train_loss": -25.474584579467773, "global_step": 243483, "epoch": 2933} {"train_loss": -25.188522338867188, "global_step": 243484, "epoch": 2933} {"train_loss": -24.73921775817871, "global_step": 243485, "epoch": 2933} {"train_loss": -25.191160202026367, "global_step": 243486, "epoch": 2933} {"train_loss": -24.766040802001953, "global_step": 243487, "epoch": 2933} {"train_loss": -24.91806983947754, "global_step": 243488, "epoch": 2933} {"train_loss": -24.959861755371094, "global_step": 243489, "epoch": 2933} {"train_loss": -24.681608200073242, "global_step": 243490, "epoch": 2933} {"train_loss": -25.05084228515625, "global_step": 243491, "epoch": 2933} {"train_loss": -25.008121490478516, "global_step": 243492, "epoch": 2933} {"train_loss": -24.74867820739746, "global_step": 243493, "epoch": 2933} {"train_loss": -24.842302322387695, "global_step": 243494, "epoch": 2933} {"train_loss": -24.98056411743164, "global_step": 243495, "epoch": 2933} {"train_loss": -24.845632553100586, "global_step": 243496, "epoch": 2933} {"train_loss": -25.082944869995117, "global_step": 243497, "epoch": 2933} {"train_loss": -24.837461471557617, "global_step": 243498, "epoch": 2933} {"train_loss": -25.057849884033203, "global_step": 243499, "epoch": 2933} {"train_loss": -24.74579620361328, "global_step": 243500, "epoch": 2933} {"train_loss": -24.894149780273438, "global_step": 243501, "epoch": 2933} {"train_loss": -24.98240089416504, "global_step": 243502, "epoch": 2933} {"train_loss": -25.080717086791992, "global_step": 243503, "epoch": 2933} {"train_loss": -25.14133071899414, "global_step": 243504, "epoch": 2933} {"train_loss": -25.528966903686523, "global_step": 243505, "epoch": 2933} {"train_loss": -24.8560733795166, "global_step": 243506, "epoch": 2933} {"train_loss": -25.111719131469727, "global_step": 243507, "epoch": 2933} {"train_loss": -25.001880645751953, "global_step": 243508, "epoch": 2933} {"train_loss": -25.13907241821289, "global_step": 243509, "epoch": 2933} {"train_loss": -24.808883666992188, "global_step": 243510, "epoch": 2933} {"train_loss": -24.882862091064453, "global_step": 243511, "epoch": 2933} {"train_loss": -25.2893123626709, "global_step": 243512, "epoch": 2933} {"train_loss": -24.71103858947754, "global_step": 243513, "epoch": 2933} {"train_loss": -24.59779930114746, "global_step": 243514, "epoch": 2933} {"train_loss": -25.15130615234375, "global_step": 243515, "epoch": 2933} {"train_loss": -24.53258514404297, "global_step": 243516, "epoch": 2933} {"train_loss": -24.73122787475586, "global_step": 243517, "epoch": 2933} {"train_loss": -24.704833984375, "global_step": 243518, "epoch": 2933} {"train_loss": -24.676101684570312, "global_step": 243519, "epoch": 2933} {"train_loss": -24.637882232666016, "global_step": 243520, "epoch": 2933} {"train_loss": -24.831356117524297, "global_step": 243521, "epoch": 2933, "val_loss": 6800952.5} {"train_loss": -23.26633071899414, "global_step": 243522, "epoch": 2934} {"train_loss": -23.135271072387695, "global_step": 243523, "epoch": 2934} {"train_loss": -24.495954513549805, "global_step": 243524, "epoch": 2934} {"train_loss": -23.843982696533203, "global_step": 243525, "epoch": 2934} {"train_loss": -24.392436981201172, "global_step": 243526, "epoch": 2934} {"train_loss": -24.100351333618164, "global_step": 243527, "epoch": 2934} {"train_loss": -24.594633102416992, "global_step": 243528, "epoch": 2934} {"train_loss": -24.28183937072754, "global_step": 243529, "epoch": 2934} {"train_loss": -24.490753173828125, "global_step": 243530, "epoch": 2934} {"train_loss": -24.212385177612305, "global_step": 243531, "epoch": 2934} {"train_loss": -24.439071655273438, "global_step": 243532, "epoch": 2934} {"train_loss": -24.535297393798828, "global_step": 243533, "epoch": 2934} {"train_loss": -24.573835372924805, "global_step": 243534, "epoch": 2934} {"train_loss": -24.234088897705078, "global_step": 243535, "epoch": 2934} {"train_loss": -24.564695358276367, "global_step": 243536, "epoch": 2934} {"train_loss": -24.86899185180664, "global_step": 243537, "epoch": 2934} {"train_loss": -24.463960647583008, "global_step": 243538, "epoch": 2934} {"train_loss": -24.30417251586914, "global_step": 243539, "epoch": 2934} {"train_loss": -24.82004165649414, "global_step": 243540, "epoch": 2934} {"train_loss": -24.507078170776367, "global_step": 243541, "epoch": 2934} {"train_loss": -24.996658325195312, "global_step": 243542, "epoch": 2934} {"train_loss": -24.533105850219727, "global_step": 243543, "epoch": 2934} {"train_loss": -24.6900577545166, "global_step": 243544, "epoch": 2934} {"train_loss": -24.896297454833984, "global_step": 243545, "epoch": 2934} {"train_loss": -24.83196258544922, "global_step": 243546, "epoch": 2934} {"train_loss": -24.86328887939453, "global_step": 243547, "epoch": 2934} {"train_loss": -24.377944946289062, "global_step": 243548, "epoch": 2934} {"train_loss": -24.634384155273438, "global_step": 243549, "epoch": 2934} {"train_loss": -24.741605758666992, "global_step": 243550, "epoch": 2934} {"train_loss": -24.85886573791504, "global_step": 243551, "epoch": 2934} {"train_loss": -24.66705322265625, "global_step": 243552, "epoch": 2934} {"train_loss": -24.774187088012695, "global_step": 243553, "epoch": 2934} {"train_loss": -25.000690460205078, "global_step": 243554, "epoch": 2934} {"train_loss": -25.326889038085938, "global_step": 243555, "epoch": 2934} {"train_loss": -24.931495666503906, "global_step": 243556, "epoch": 2934} {"train_loss": -24.765172958374023, "global_step": 243557, "epoch": 2934} {"train_loss": -25.42131996154785, "global_step": 243558, "epoch": 2934} {"train_loss": -25.103900909423828, "global_step": 243559, "epoch": 2934} {"train_loss": -25.035018920898438, "global_step": 243560, "epoch": 2934} {"train_loss": -25.0728816986084, "global_step": 243561, "epoch": 2934} {"train_loss": -25.0196590423584, "global_step": 243562, "epoch": 2934} {"train_loss": -24.92213249206543, "global_step": 243563, "epoch": 2934} {"train_loss": -24.965045928955078, "global_step": 243564, "epoch": 2934} {"train_loss": -25.12088394165039, "global_step": 243565, "epoch": 2934} {"train_loss": -25.1296443939209, "global_step": 243566, "epoch": 2934} {"train_loss": -25.243566513061523, "global_step": 243567, "epoch": 2934} {"train_loss": -25.370668411254883, "global_step": 243568, "epoch": 2934} {"train_loss": -25.161603927612305, "global_step": 243569, "epoch": 2934} {"train_loss": -24.945640563964844, "global_step": 243570, "epoch": 2934} {"train_loss": -25.2425594329834, "global_step": 243571, "epoch": 2934} {"train_loss": -24.80402374267578, "global_step": 243572, "epoch": 2934} {"train_loss": -24.69065284729004, "global_step": 243573, "epoch": 2934} {"train_loss": -24.941709518432617, "global_step": 243574, "epoch": 2934} {"train_loss": -24.765329360961914, "global_step": 243575, "epoch": 2934} {"train_loss": -25.197526931762695, "global_step": 243576, "epoch": 2934} {"train_loss": -24.826562881469727, "global_step": 243577, "epoch": 2934} {"train_loss": -25.235815048217773, "global_step": 243578, "epoch": 2934} {"train_loss": -25.01924705505371, "global_step": 243579, "epoch": 2934} {"train_loss": -24.69968032836914, "global_step": 243580, "epoch": 2934} {"train_loss": -25.41499900817871, "global_step": 243581, "epoch": 2934} {"train_loss": -24.895009994506836, "global_step": 243582, "epoch": 2934} {"train_loss": -24.822433471679688, "global_step": 243583, "epoch": 2934} {"train_loss": -25.000259399414062, "global_step": 243584, "epoch": 2934} {"train_loss": -24.87714195251465, "global_step": 243585, "epoch": 2934} {"train_loss": -24.92987060546875, "global_step": 243586, "epoch": 2934} {"train_loss": -24.630577087402344, "global_step": 243587, "epoch": 2934} {"train_loss": -25.099491119384766, "global_step": 243588, "epoch": 2934} {"train_loss": -24.776538848876953, "global_step": 243589, "epoch": 2934} {"train_loss": -25.169565200805664, "global_step": 243590, "epoch": 2934} {"train_loss": -24.84905242919922, "global_step": 243591, "epoch": 2934} {"train_loss": -24.9908390045166, "global_step": 243592, "epoch": 2934} {"train_loss": -24.900360107421875, "global_step": 243593, "epoch": 2934} {"train_loss": -24.96190643310547, "global_step": 243594, "epoch": 2934} {"train_loss": -24.88501739501953, "global_step": 243595, "epoch": 2934} {"train_loss": -25.04960060119629, "global_step": 243596, "epoch": 2934} {"train_loss": -25.148792266845703, "global_step": 243597, "epoch": 2934} {"train_loss": -25.041088104248047, "global_step": 243598, "epoch": 2934} {"train_loss": -25.096120834350586, "global_step": 243599, "epoch": 2934} {"train_loss": -25.29302978515625, "global_step": 243600, "epoch": 2934} {"train_loss": -24.76214599609375, "global_step": 243601, "epoch": 2934} {"train_loss": -24.76097297668457, "global_step": 243602, "epoch": 2934} {"train_loss": -24.728483200073242, "global_step": 243603, "epoch": 2934} {"train_loss": -24.804284865597644, "global_step": 243604, "epoch": 2934, "val_loss": 6798936.0} {"train_loss": -23.921457290649414, "global_step": 243605, "epoch": 2935} {"train_loss": -23.232534408569336, "global_step": 243606, "epoch": 2935} {"train_loss": -22.85247802734375, "global_step": 243607, "epoch": 2935} {"train_loss": -22.751760482788086, "global_step": 243608, "epoch": 2935} {"train_loss": -23.572391510009766, "global_step": 243609, "epoch": 2935} {"train_loss": -23.385957717895508, "global_step": 243610, "epoch": 2935} {"train_loss": -23.489456176757812, "global_step": 243611, "epoch": 2935} {"train_loss": -23.492525100708008, "global_step": 243612, "epoch": 2935} {"train_loss": -22.98204231262207, "global_step": 243613, "epoch": 2935} {"train_loss": -24.041946411132812, "global_step": 243614, "epoch": 2935} {"train_loss": -23.77084732055664, "global_step": 243615, "epoch": 2935} {"train_loss": -23.893077850341797, "global_step": 243616, "epoch": 2935} {"train_loss": -23.759479522705078, "global_step": 243617, "epoch": 2935} {"train_loss": -24.17347526550293, "global_step": 243618, "epoch": 2935} {"train_loss": -24.206878662109375, "global_step": 243619, "epoch": 2935} {"train_loss": -24.210424423217773, "global_step": 243620, "epoch": 2935} {"train_loss": -23.857486724853516, "global_step": 243621, "epoch": 2935} {"train_loss": -24.243444442749023, "global_step": 243622, "epoch": 2935} {"train_loss": -24.30924415588379, "global_step": 243623, "epoch": 2935} {"train_loss": -23.721649169921875, "global_step": 243624, "epoch": 2935} {"train_loss": -24.197275161743164, "global_step": 243625, "epoch": 2935} {"train_loss": -23.990888595581055, "global_step": 243626, "epoch": 2935} {"train_loss": -23.473440170288086, "global_step": 243627, "epoch": 2935} {"train_loss": -24.254369735717773, "global_step": 243628, "epoch": 2935} {"train_loss": -24.925992965698242, "global_step": 243629, "epoch": 2935} {"train_loss": -24.755117416381836, "global_step": 243630, "epoch": 2935} {"train_loss": -24.442827224731445, "global_step": 243631, "epoch": 2935} {"train_loss": -24.555404663085938, "global_step": 243632, "epoch": 2935} {"train_loss": -24.441730499267578, "global_step": 243633, "epoch": 2935} {"train_loss": -24.601369857788086, "global_step": 243634, "epoch": 2935} {"train_loss": -24.58867645263672, "global_step": 243635, "epoch": 2935} {"train_loss": -24.68397331237793, "global_step": 243636, "epoch": 2935} {"train_loss": -24.496047973632812, "global_step": 243637, "epoch": 2935} {"train_loss": -24.4301815032959, "global_step": 243638, "epoch": 2935} {"train_loss": -24.69382095336914, "global_step": 243639, "epoch": 2935} {"train_loss": -24.68189811706543, "global_step": 243640, "epoch": 2935} {"train_loss": -24.673810958862305, "global_step": 243641, "epoch": 2935} {"train_loss": -24.88320541381836, "global_step": 243642, "epoch": 2935} {"train_loss": -24.591764450073242, "global_step": 243643, "epoch": 2935} {"train_loss": -24.563447952270508, "global_step": 243644, "epoch": 2935} {"train_loss": -24.67886734008789, "global_step": 243645, "epoch": 2935} {"train_loss": -24.699522018432617, "global_step": 243646, "epoch": 2935} {"train_loss": -24.49008560180664, "global_step": 243647, "epoch": 2935} {"train_loss": -24.875167846679688, "global_step": 243648, "epoch": 2935} {"train_loss": -24.95705795288086, "global_step": 243649, "epoch": 2935} {"train_loss": -24.748870849609375, "global_step": 243650, "epoch": 2935} {"train_loss": -24.742340087890625, "global_step": 243651, "epoch": 2935} {"train_loss": -24.979572296142578, "global_step": 243652, "epoch": 2935} {"train_loss": -24.892820358276367, "global_step": 243653, "epoch": 2935} {"train_loss": -24.936813354492188, "global_step": 243654, "epoch": 2935} {"train_loss": -24.72462272644043, "global_step": 243655, "epoch": 2935} {"train_loss": -24.809133529663086, "global_step": 243656, "epoch": 2935} {"train_loss": -24.92842674255371, "global_step": 243657, "epoch": 2935} {"train_loss": -24.982633590698242, "global_step": 243658, "epoch": 2935} {"train_loss": -25.056196212768555, "global_step": 243659, "epoch": 2935} {"train_loss": -24.743101119995117, "global_step": 243660, "epoch": 2935} {"train_loss": -24.831872940063477, "global_step": 243661, "epoch": 2935} {"train_loss": -24.927106857299805, "global_step": 243662, "epoch": 2935} {"train_loss": -24.93105125427246, "global_step": 243663, "epoch": 2935} {"train_loss": -24.915119171142578, "global_step": 243664, "epoch": 2935} {"train_loss": -25.133350372314453, "global_step": 243665, "epoch": 2935} {"train_loss": -25.162084579467773, "global_step": 243666, "epoch": 2935} {"train_loss": -24.814472198486328, "global_step": 243667, "epoch": 2935} {"train_loss": -25.063770294189453, "global_step": 243668, "epoch": 2935} {"train_loss": -24.474613189697266, "global_step": 243669, "epoch": 2935} {"train_loss": -25.128585815429688, "global_step": 243670, "epoch": 2935} {"train_loss": -25.269872665405273, "global_step": 243671, "epoch": 2935} {"train_loss": -24.96013832092285, "global_step": 243672, "epoch": 2935} {"train_loss": -25.641199111938477, "global_step": 243673, "epoch": 2935} {"train_loss": -24.79640769958496, "global_step": 243674, "epoch": 2935} {"train_loss": -25.348844528198242, "global_step": 243675, "epoch": 2935} {"train_loss": -24.99593162536621, "global_step": 243676, "epoch": 2935} {"train_loss": -25.09882164001465, "global_step": 243677, "epoch": 2935} {"train_loss": -25.265974044799805, "global_step": 243678, "epoch": 2935} {"train_loss": -25.06403160095215, "global_step": 243679, "epoch": 2935} {"train_loss": -25.594209671020508, "global_step": 243680, "epoch": 2935} {"train_loss": -25.00164222717285, "global_step": 243681, "epoch": 2935} {"train_loss": -25.357454299926758, "global_step": 243682, "epoch": 2935} {"train_loss": -25.096744537353516, "global_step": 243683, "epoch": 2935} {"train_loss": -24.948745727539062, "global_step": 243684, "epoch": 2935} {"train_loss": -25.474340438842773, "global_step": 243685, "epoch": 2935} {"train_loss": -24.84929847717285, "global_step": 243686, "epoch": 2935} {"train_loss": -24.550952038133, "global_step": 243687, "epoch": 2935, "val_loss": 6826384.0} {"train_loss": -24.614604949951172, "global_step": 243688, "epoch": 2936} {"train_loss": -24.846866607666016, "global_step": 243689, "epoch": 2936} {"train_loss": -24.281936645507812, "global_step": 243690, "epoch": 2936} {"train_loss": -24.31926727294922, "global_step": 243691, "epoch": 2936} {"train_loss": -25.11334228515625, "global_step": 243692, "epoch": 2936} {"train_loss": -25.27565574645996, "global_step": 243693, "epoch": 2936} {"train_loss": -24.798816680908203, "global_step": 243694, "epoch": 2936} {"train_loss": -24.939451217651367, "global_step": 243695, "epoch": 2936} {"train_loss": -24.7006778717041, "global_step": 243696, "epoch": 2936} {"train_loss": -24.5211238861084, "global_step": 243697, "epoch": 2936} {"train_loss": -24.96942138671875, "global_step": 243698, "epoch": 2936} {"train_loss": -24.653249740600586, "global_step": 243699, "epoch": 2936} {"train_loss": -24.792667388916016, "global_step": 243700, "epoch": 2936} {"train_loss": -25.106220245361328, "global_step": 243701, "epoch": 2936} {"train_loss": -24.735980987548828, "global_step": 243702, "epoch": 2936} {"train_loss": -24.918212890625, "global_step": 243703, "epoch": 2936} {"train_loss": -25.00806999206543, "global_step": 243704, "epoch": 2936} {"train_loss": -25.206829071044922, "global_step": 243705, "epoch": 2936} {"train_loss": -24.763395309448242, "global_step": 243706, "epoch": 2936} {"train_loss": -25.355012893676758, "global_step": 243707, "epoch": 2936} {"train_loss": -25.09714698791504, "global_step": 243708, "epoch": 2936} {"train_loss": -25.204605102539062, "global_step": 243709, "epoch": 2936} {"train_loss": -24.888593673706055, "global_step": 243710, "epoch": 2936} {"train_loss": -25.33717155456543, "global_step": 243711, "epoch": 2936} {"train_loss": -25.161046981811523, "global_step": 243712, "epoch": 2936} {"train_loss": -25.01808738708496, "global_step": 243713, "epoch": 2936} {"train_loss": -25.757078170776367, "global_step": 243714, "epoch": 2936} {"train_loss": -24.79353141784668, "global_step": 243715, "epoch": 2936} {"train_loss": -24.978296279907227, "global_step": 243716, "epoch": 2936} {"train_loss": -25.094879150390625, "global_step": 243717, "epoch": 2936} {"train_loss": -25.168306350708008, "global_step": 243718, "epoch": 2936} {"train_loss": -24.921707153320312, "global_step": 243719, "epoch": 2936} {"train_loss": -24.846235275268555, "global_step": 243720, "epoch": 2936} {"train_loss": -24.955595016479492, "global_step": 243721, "epoch": 2936} {"train_loss": -25.205364227294922, "global_step": 243722, "epoch": 2936} {"train_loss": -25.078296661376953, "global_step": 243723, "epoch": 2936} {"train_loss": -25.242998123168945, "global_step": 243724, "epoch": 2936} {"train_loss": -25.052074432373047, "global_step": 243725, "epoch": 2936} {"train_loss": -24.951709747314453, "global_step": 243726, "epoch": 2936} {"train_loss": -25.0858154296875, "global_step": 243727, "epoch": 2936} {"train_loss": -25.104612350463867, "global_step": 243728, "epoch": 2936} {"train_loss": -25.15570640563965, "global_step": 243729, "epoch": 2936} {"train_loss": -24.896711349487305, "global_step": 243730, "epoch": 2936} {"train_loss": -24.806142807006836, "global_step": 243731, "epoch": 2936} {"train_loss": -24.8655948638916, "global_step": 243732, "epoch": 2936} {"train_loss": -25.19771385192871, "global_step": 243733, "epoch": 2936} {"train_loss": -24.77498435974121, "global_step": 243734, "epoch": 2936} {"train_loss": -24.621755599975586, "global_step": 243735, "epoch": 2936} {"train_loss": -25.062177658081055, "global_step": 243736, "epoch": 2936} {"train_loss": -24.7831974029541, "global_step": 243737, "epoch": 2936} {"train_loss": -25.035680770874023, "global_step": 243738, "epoch": 2936} {"train_loss": -25.008848190307617, "global_step": 243739, "epoch": 2936} {"train_loss": -25.242536544799805, "global_step": 243740, "epoch": 2936} {"train_loss": -25.38787841796875, "global_step": 243741, "epoch": 2936} {"train_loss": -25.336748123168945, "global_step": 243742, "epoch": 2936} {"train_loss": -25.358619689941406, "global_step": 243743, "epoch": 2936} {"train_loss": -24.677614212036133, "global_step": 243744, "epoch": 2936} {"train_loss": -24.971879959106445, "global_step": 243745, "epoch": 2936} {"train_loss": -24.97586441040039, "global_step": 243746, "epoch": 2936} {"train_loss": -24.936283111572266, "global_step": 243747, "epoch": 2936} {"train_loss": -24.746152877807617, "global_step": 243748, "epoch": 2936} {"train_loss": -24.4107608795166, "global_step": 243749, "epoch": 2936} {"train_loss": -24.48503875732422, "global_step": 243750, "epoch": 2936} {"train_loss": -24.608814239501953, "global_step": 243751, "epoch": 2936} {"train_loss": -24.830833435058594, "global_step": 243752, "epoch": 2936} {"train_loss": -25.06683349609375, "global_step": 243753, "epoch": 2936} {"train_loss": -24.575223922729492, "global_step": 243754, "epoch": 2936} {"train_loss": -24.504602432250977, "global_step": 243755, "epoch": 2936} {"train_loss": -24.773157119750977, "global_step": 243756, "epoch": 2936} {"train_loss": -24.833831787109375, "global_step": 243757, "epoch": 2936} {"train_loss": -25.240585327148438, "global_step": 243758, "epoch": 2936} {"train_loss": -24.915836334228516, "global_step": 243759, "epoch": 2936} {"train_loss": -24.593597412109375, "global_step": 243760, "epoch": 2936} {"train_loss": -24.6009464263916, "global_step": 243761, "epoch": 2936} {"train_loss": -24.93984031677246, "global_step": 243762, "epoch": 2936} {"train_loss": -25.13037109375, "global_step": 243763, "epoch": 2936} {"train_loss": -24.496084213256836, "global_step": 243764, "epoch": 2936} {"train_loss": -24.634620666503906, "global_step": 243765, "epoch": 2936} {"train_loss": -24.83254051208496, "global_step": 243766, "epoch": 2936} {"train_loss": -25.087190628051758, "global_step": 243767, "epoch": 2936} {"train_loss": -25.14105796813965, "global_step": 243768, "epoch": 2936} {"train_loss": -24.832550048828125, "global_step": 243769, "epoch": 2936} {"train_loss": -24.903896998210126, "global_step": 243770, "epoch": 2936, "val_loss": 6800163.0} {"train_loss": -24.279850006103516, "global_step": 243771, "epoch": 2937} {"train_loss": -24.214509963989258, "global_step": 243772, "epoch": 2937} {"train_loss": -24.181941986083984, "global_step": 243773, "epoch": 2937} {"train_loss": -24.513229370117188, "global_step": 243774, "epoch": 2937} {"train_loss": -24.49640464782715, "global_step": 243775, "epoch": 2937} {"train_loss": -24.554731369018555, "global_step": 243776, "epoch": 2937} {"train_loss": -24.346193313598633, "global_step": 243777, "epoch": 2937} {"train_loss": -24.393741607666016, "global_step": 243778, "epoch": 2937} {"train_loss": -24.75851821899414, "global_step": 243779, "epoch": 2937} {"train_loss": -24.5903263092041, "global_step": 243780, "epoch": 2937} {"train_loss": -24.08284568786621, "global_step": 243781, "epoch": 2937} {"train_loss": -24.63209342956543, "global_step": 243782, "epoch": 2937} {"train_loss": -24.944318771362305, "global_step": 243783, "epoch": 2937} {"train_loss": -24.467409133911133, "global_step": 243784, "epoch": 2937} {"train_loss": -24.339256286621094, "global_step": 243785, "epoch": 2937} {"train_loss": -24.383258819580078, "global_step": 243786, "epoch": 2937} {"train_loss": -24.81471061706543, "global_step": 243787, "epoch": 2937} {"train_loss": -24.514822006225586, "global_step": 243788, "epoch": 2937} {"train_loss": -24.331377029418945, "global_step": 243789, "epoch": 2937} {"train_loss": -24.819637298583984, "global_step": 243790, "epoch": 2937} {"train_loss": -24.504262924194336, "global_step": 243791, "epoch": 2937} {"train_loss": -24.662872314453125, "global_step": 243792, "epoch": 2937} {"train_loss": -24.956207275390625, "global_step": 243793, "epoch": 2937} {"train_loss": -24.801450729370117, "global_step": 243794, "epoch": 2937} {"train_loss": -24.822803497314453, "global_step": 243795, "epoch": 2937} {"train_loss": -24.502328872680664, "global_step": 243796, "epoch": 2937} {"train_loss": -24.733871459960938, "global_step": 243797, "epoch": 2937} {"train_loss": -24.82068634033203, "global_step": 243798, "epoch": 2937} {"train_loss": -25.12958335876465, "global_step": 243799, "epoch": 2937} {"train_loss": -24.4962158203125, "global_step": 243800, "epoch": 2937} {"train_loss": -25.003406524658203, "global_step": 243801, "epoch": 2937} {"train_loss": -25.00833511352539, "global_step": 243802, "epoch": 2937} {"train_loss": -25.235916137695312, "global_step": 243803, "epoch": 2937} {"train_loss": -24.612098693847656, "global_step": 243804, "epoch": 2937} {"train_loss": -24.74491310119629, "global_step": 243805, "epoch": 2937} {"train_loss": -24.612751007080078, "global_step": 243806, "epoch": 2937} {"train_loss": -24.851659774780273, "global_step": 243807, "epoch": 2937} {"train_loss": -25.075220108032227, "global_step": 243808, "epoch": 2937} {"train_loss": -25.134618759155273, "global_step": 243809, "epoch": 2937} {"train_loss": -24.989450454711914, "global_step": 243810, "epoch": 2937} {"train_loss": -25.252670288085938, "global_step": 243811, "epoch": 2937} {"train_loss": -25.00596046447754, "global_step": 243812, "epoch": 2937} {"train_loss": -25.34151268005371, "global_step": 243813, "epoch": 2937} {"train_loss": -25.100746154785156, "global_step": 243814, "epoch": 2937} {"train_loss": -25.14468765258789, "global_step": 243815, "epoch": 2937} {"train_loss": -24.887298583984375, "global_step": 243816, "epoch": 2937} {"train_loss": -25.38800621032715, "global_step": 243817, "epoch": 2937} {"train_loss": -25.287784576416016, "global_step": 243818, "epoch": 2937} {"train_loss": -24.869930267333984, "global_step": 243819, "epoch": 2937} {"train_loss": -24.967914581298828, "global_step": 243820, "epoch": 2937} {"train_loss": -25.295454025268555, "global_step": 243821, "epoch": 2937} {"train_loss": -25.022632598876953, "global_step": 243822, "epoch": 2937} {"train_loss": -25.283912658691406, "global_step": 243823, "epoch": 2937} {"train_loss": -25.327898025512695, "global_step": 243824, "epoch": 2937} {"train_loss": -24.977401733398438, "global_step": 243825, "epoch": 2937} {"train_loss": -24.93580436706543, "global_step": 243826, "epoch": 2937} {"train_loss": -24.849483489990234, "global_step": 243827, "epoch": 2937} {"train_loss": -25.028030395507812, "global_step": 243828, "epoch": 2937} {"train_loss": -24.871740341186523, "global_step": 243829, "epoch": 2937} {"train_loss": -24.835947036743164, "global_step": 243830, "epoch": 2937} {"train_loss": -25.131996154785156, "global_step": 243831, "epoch": 2937} {"train_loss": -24.92287254333496, "global_step": 243832, "epoch": 2937} {"train_loss": -25.283344268798828, "global_step": 243833, "epoch": 2937} {"train_loss": -24.79197883605957, "global_step": 243834, "epoch": 2937} {"train_loss": -24.503883361816406, "global_step": 243835, "epoch": 2937} {"train_loss": -24.826322555541992, "global_step": 243836, "epoch": 2937} {"train_loss": -24.895584106445312, "global_step": 243837, "epoch": 2937} {"train_loss": -24.595640182495117, "global_step": 243838, "epoch": 2937} {"train_loss": -24.5306453704834, "global_step": 243839, "epoch": 2937} {"train_loss": -24.976186752319336, "global_step": 243840, "epoch": 2937} {"train_loss": -24.852371215820312, "global_step": 243841, "epoch": 2937} {"train_loss": -24.694969177246094, "global_step": 243842, "epoch": 2937} {"train_loss": -25.034664154052734, "global_step": 243843, "epoch": 2937} {"train_loss": -24.5379638671875, "global_step": 243844, "epoch": 2937} {"train_loss": -25.01328468322754, "global_step": 243845, "epoch": 2937} {"train_loss": -24.918188095092773, "global_step": 243846, "epoch": 2937} {"train_loss": -24.90532112121582, "global_step": 243847, "epoch": 2937} {"train_loss": -24.73924446105957, "global_step": 243848, "epoch": 2937} {"train_loss": -24.411245346069336, "global_step": 243849, "epoch": 2937} {"train_loss": -24.508039474487305, "global_step": 243850, "epoch": 2937} {"train_loss": -24.81536865234375, "global_step": 243851, "epoch": 2937} {"train_loss": -24.560941696166992, "global_step": 243852, "epoch": 2937} {"train_loss": -24.801326246146697, "global_step": 243853, "epoch": 2937, "val_loss": 6777511.0} {"train_loss": -25.15317726135254, "global_step": 243854, "epoch": 2938} {"train_loss": -24.340980529785156, "global_step": 243855, "epoch": 2938} {"train_loss": -24.560060501098633, "global_step": 243856, "epoch": 2938} {"train_loss": -24.45441436767578, "global_step": 243857, "epoch": 2938} {"train_loss": -24.742704391479492, "global_step": 243858, "epoch": 2938} {"train_loss": -24.49675750732422, "global_step": 243859, "epoch": 2938} {"train_loss": -24.642362594604492, "global_step": 243860, "epoch": 2938} {"train_loss": -24.650747299194336, "global_step": 243861, "epoch": 2938} {"train_loss": -24.973617553710938, "global_step": 243862, "epoch": 2938} {"train_loss": -24.4716739654541, "global_step": 243863, "epoch": 2938} {"train_loss": -24.915151596069336, "global_step": 243864, "epoch": 2938} {"train_loss": -24.656156539916992, "global_step": 243865, "epoch": 2938} {"train_loss": -25.21173095703125, "global_step": 243866, "epoch": 2938} {"train_loss": -24.61431312561035, "global_step": 243867, "epoch": 2938} {"train_loss": -24.20880126953125, "global_step": 243868, "epoch": 2938} {"train_loss": -24.891132354736328, "global_step": 243869, "epoch": 2938} {"train_loss": -24.973798751831055, "global_step": 243870, "epoch": 2938} {"train_loss": -24.580549240112305, "global_step": 243871, "epoch": 2938} {"train_loss": -24.27959632873535, "global_step": 243872, "epoch": 2938} {"train_loss": -24.758939743041992, "global_step": 243873, "epoch": 2938} {"train_loss": -24.512025833129883, "global_step": 243874, "epoch": 2938} {"train_loss": -24.803512573242188, "global_step": 243875, "epoch": 2938} {"train_loss": -24.720504760742188, "global_step": 243876, "epoch": 2938} {"train_loss": -25.14633560180664, "global_step": 243877, "epoch": 2938} {"train_loss": -24.9753475189209, "global_step": 243878, "epoch": 2938} {"train_loss": -24.661497116088867, "global_step": 243879, "epoch": 2938} {"train_loss": -24.97427749633789, "global_step": 243880, "epoch": 2938} {"train_loss": -25.0910701751709, "global_step": 243881, "epoch": 2938} {"train_loss": -24.437610626220703, "global_step": 243882, "epoch": 2938} {"train_loss": -25.340002059936523, "global_step": 243883, "epoch": 2938} {"train_loss": -24.94002342224121, "global_step": 243884, "epoch": 2938} {"train_loss": -24.806180953979492, "global_step": 243885, "epoch": 2938} {"train_loss": -24.885074615478516, "global_step": 243886, "epoch": 2938} {"train_loss": -25.291479110717773, "global_step": 243887, "epoch": 2938} {"train_loss": -24.69590187072754, "global_step": 243888, "epoch": 2938} {"train_loss": -25.31088638305664, "global_step": 243889, "epoch": 2938} {"train_loss": -25.233470916748047, "global_step": 243890, "epoch": 2938} {"train_loss": -25.191316604614258, "global_step": 243891, "epoch": 2938} {"train_loss": -25.195493698120117, "global_step": 243892, "epoch": 2938} {"train_loss": -24.943756103515625, "global_step": 243893, "epoch": 2938} {"train_loss": -25.29778480529785, "global_step": 243894, "epoch": 2938} {"train_loss": -24.91208267211914, "global_step": 243895, "epoch": 2938} {"train_loss": -25.180694580078125, "global_step": 243896, "epoch": 2938} {"train_loss": -24.739187240600586, "global_step": 243897, "epoch": 2938} {"train_loss": -25.138916015625, "global_step": 243898, "epoch": 2938} {"train_loss": -24.744762420654297, "global_step": 243899, "epoch": 2938} {"train_loss": -25.46454429626465, "global_step": 243900, "epoch": 2938} {"train_loss": -25.138431549072266, "global_step": 243901, "epoch": 2938} {"train_loss": -24.720792770385742, "global_step": 243902, "epoch": 2938} {"train_loss": -25.015045166015625, "global_step": 243903, "epoch": 2938} {"train_loss": -24.864059448242188, "global_step": 243904, "epoch": 2938} {"train_loss": -24.62300682067871, "global_step": 243905, "epoch": 2938} {"train_loss": -24.892179489135742, "global_step": 243906, "epoch": 2938} {"train_loss": -24.650854110717773, "global_step": 243907, "epoch": 2938} {"train_loss": -24.645423889160156, "global_step": 243908, "epoch": 2938} {"train_loss": -24.738962173461914, "global_step": 243909, "epoch": 2938} {"train_loss": -24.58565330505371, "global_step": 243910, "epoch": 2938} {"train_loss": -24.973215103149414, "global_step": 243911, "epoch": 2938} {"train_loss": -24.895689010620117, "global_step": 243912, "epoch": 2938} {"train_loss": -24.68528938293457, "global_step": 243913, "epoch": 2938} {"train_loss": -24.725927352905273, "global_step": 243914, "epoch": 2938} {"train_loss": -24.750717163085938, "global_step": 243915, "epoch": 2938} {"train_loss": -24.876956939697266, "global_step": 243916, "epoch": 2938} {"train_loss": -24.605472564697266, "global_step": 243917, "epoch": 2938} {"train_loss": -25.249832153320312, "global_step": 243918, "epoch": 2938} {"train_loss": -24.424800872802734, "global_step": 243919, "epoch": 2938} {"train_loss": -24.76317596435547, "global_step": 243920, "epoch": 2938} {"train_loss": -24.676725387573242, "global_step": 243921, "epoch": 2938} {"train_loss": -24.657316207885742, "global_step": 243922, "epoch": 2938} {"train_loss": -24.750837326049805, "global_step": 243923, "epoch": 2938} {"train_loss": -24.732084274291992, "global_step": 243924, "epoch": 2938} {"train_loss": -25.324365615844727, "global_step": 243925, "epoch": 2938} {"train_loss": -24.55609893798828, "global_step": 243926, "epoch": 2938} {"train_loss": -25.02826499938965, "global_step": 243927, "epoch": 2938} {"train_loss": -25.39182472229004, "global_step": 243928, "epoch": 2938} {"train_loss": -24.814420700073242, "global_step": 243929, "epoch": 2938} {"train_loss": -25.014707565307617, "global_step": 243930, "epoch": 2938} {"train_loss": -24.723560333251953, "global_step": 243931, "epoch": 2938} {"train_loss": -24.81754493713379, "global_step": 243932, "epoch": 2938} {"train_loss": -24.418920516967773, "global_step": 243933, "epoch": 2938} {"train_loss": -24.87690544128418, "global_step": 243934, "epoch": 2938} {"train_loss": -24.83946990966797, "global_step": 243935, "epoch": 2938} {"train_loss": -24.831797910023884, "global_step": 243936, "epoch": 2938, "val_loss": 6862792.0} {"train_loss": -24.421491622924805, "global_step": 243937, "epoch": 2939} {"train_loss": -24.458850860595703, "global_step": 243938, "epoch": 2939} {"train_loss": -24.43603515625, "global_step": 243939, "epoch": 2939} {"train_loss": -24.790027618408203, "global_step": 243940, "epoch": 2939} {"train_loss": -24.57508659362793, "global_step": 243941, "epoch": 2939} {"train_loss": -24.448955535888672, "global_step": 243942, "epoch": 2939} {"train_loss": -23.993417739868164, "global_step": 243943, "epoch": 2939} {"train_loss": -24.545703887939453, "global_step": 243944, "epoch": 2939} {"train_loss": -24.843219757080078, "global_step": 243945, "epoch": 2939} {"train_loss": -24.8139705657959, "global_step": 243946, "epoch": 2939} {"train_loss": -24.71918296813965, "global_step": 243947, "epoch": 2939} {"train_loss": -24.916730880737305, "global_step": 243948, "epoch": 2939} {"train_loss": -24.805580139160156, "global_step": 243949, "epoch": 2939} {"train_loss": -24.4876708984375, "global_step": 243950, "epoch": 2939} {"train_loss": -24.709623336791992, "global_step": 243951, "epoch": 2939} {"train_loss": -24.662572860717773, "global_step": 243952, "epoch": 2939} {"train_loss": -24.674924850463867, "global_step": 243953, "epoch": 2939} {"train_loss": -24.979761123657227, "global_step": 243954, "epoch": 2939} {"train_loss": -24.72011947631836, "global_step": 243955, "epoch": 2939} {"train_loss": -24.60030174255371, "global_step": 243956, "epoch": 2939} {"train_loss": -24.9958553314209, "global_step": 243957, "epoch": 2939} {"train_loss": -25.004491806030273, "global_step": 243958, "epoch": 2939} {"train_loss": -24.679838180541992, "global_step": 243959, "epoch": 2939} {"train_loss": -24.503366470336914, "global_step": 243960, "epoch": 2939} {"train_loss": -25.287166595458984, "global_step": 243961, "epoch": 2939} {"train_loss": -24.915327072143555, "global_step": 243962, "epoch": 2939} {"train_loss": -24.426496505737305, "global_step": 243963, "epoch": 2939} {"train_loss": -24.183759689331055, "global_step": 243964, "epoch": 2939} {"train_loss": -24.869295120239258, "global_step": 243965, "epoch": 2939} {"train_loss": -24.609296798706055, "global_step": 243966, "epoch": 2939} {"train_loss": -24.49677848815918, "global_step": 243967, "epoch": 2939} {"train_loss": -24.7371883392334, "global_step": 243968, "epoch": 2939} {"train_loss": -24.754575729370117, "global_step": 243969, "epoch": 2939} {"train_loss": -24.842802047729492, "global_step": 243970, "epoch": 2939} {"train_loss": -24.896591186523438, "global_step": 243971, "epoch": 2939} {"train_loss": -24.539356231689453, "global_step": 243972, "epoch": 2939} {"train_loss": -24.938011169433594, "global_step": 243973, "epoch": 2939} {"train_loss": -24.99127197265625, "global_step": 243974, "epoch": 2939} {"train_loss": -24.756122589111328, "global_step": 243975, "epoch": 2939} {"train_loss": -24.68454360961914, "global_step": 243976, "epoch": 2939} {"train_loss": -24.668493270874023, "global_step": 243977, "epoch": 2939} {"train_loss": -24.859872817993164, "global_step": 243978, "epoch": 2939} {"train_loss": -24.712528228759766, "global_step": 243979, "epoch": 2939} {"train_loss": -25.023391723632812, "global_step": 243980, "epoch": 2939} {"train_loss": -24.954788208007812, "global_step": 243981, "epoch": 2939} {"train_loss": -25.107484817504883, "global_step": 243982, "epoch": 2939} {"train_loss": -25.104557037353516, "global_step": 243983, "epoch": 2939} {"train_loss": -24.999319076538086, "global_step": 243984, "epoch": 2939} {"train_loss": -25.19550132751465, "global_step": 243985, "epoch": 2939} {"train_loss": -25.035160064697266, "global_step": 243986, "epoch": 2939} {"train_loss": -24.90374183654785, "global_step": 243987, "epoch": 2939} {"train_loss": -24.832468032836914, "global_step": 243988, "epoch": 2939} {"train_loss": -24.952802658081055, "global_step": 243989, "epoch": 2939} {"train_loss": -25.109617233276367, "global_step": 243990, "epoch": 2939} {"train_loss": -25.144540786743164, "global_step": 243991, "epoch": 2939} {"train_loss": -25.063081741333008, "global_step": 243992, "epoch": 2939} {"train_loss": -24.91728401184082, "global_step": 243993, "epoch": 2939} {"train_loss": -24.89954948425293, "global_step": 243994, "epoch": 2939} {"train_loss": -25.051456451416016, "global_step": 243995, "epoch": 2939} {"train_loss": -24.83084487915039, "global_step": 243996, "epoch": 2939} {"train_loss": -25.155670166015625, "global_step": 243997, "epoch": 2939} {"train_loss": -25.001209259033203, "global_step": 243998, "epoch": 2939} {"train_loss": -24.88077735900879, "global_step": 243999, "epoch": 2939} {"train_loss": -24.82602882385254, "global_step": 244000, "epoch": 2939} {"train_loss": -25.284984588623047, "global_step": 244001, "epoch": 2939} {"train_loss": -25.344396591186523, "global_step": 244002, "epoch": 2939} {"train_loss": -25.130521774291992, "global_step": 244003, "epoch": 2939} {"train_loss": -25.03858757019043, "global_step": 244004, "epoch": 2939} {"train_loss": -25.1771240234375, "global_step": 244005, "epoch": 2939} {"train_loss": -24.90691566467285, "global_step": 244006, "epoch": 2939} {"train_loss": -25.196943283081055, "global_step": 244007, "epoch": 2939} {"train_loss": -24.776580810546875, "global_step": 244008, "epoch": 2939} {"train_loss": -25.27398681640625, "global_step": 244009, "epoch": 2939} {"train_loss": -24.907453536987305, "global_step": 244010, "epoch": 2939} {"train_loss": -24.9133243560791, "global_step": 244011, "epoch": 2939} {"train_loss": -25.15817642211914, "global_step": 244012, "epoch": 2939} {"train_loss": -25.2967586517334, "global_step": 244013, "epoch": 2939} {"train_loss": -25.226606369018555, "global_step": 244014, "epoch": 2939} {"train_loss": -25.40968132019043, "global_step": 244015, "epoch": 2939} {"train_loss": -25.124217987060547, "global_step": 244016, "epoch": 2939} {"train_loss": -25.510799407958984, "global_step": 244017, "epoch": 2939} {"train_loss": -24.99431800842285, "global_step": 244018, "epoch": 2939} {"train_loss": -24.88285112955484, "global_step": 244019, "epoch": 2939, "val_loss": 6845570.5} {"train_loss": -24.437217712402344, "global_step": 244020, "epoch": 2940} {"train_loss": -23.70836639404297, "global_step": 244021, "epoch": 2940} {"train_loss": -24.250429153442383, "global_step": 244022, "epoch": 2940} {"train_loss": -23.285409927368164, "global_step": 244023, "epoch": 2940} {"train_loss": -22.90195655822754, "global_step": 244024, "epoch": 2940} {"train_loss": -23.822982788085938, "global_step": 244025, "epoch": 2940} {"train_loss": -24.10958480834961, "global_step": 244026, "epoch": 2940} {"train_loss": -23.97019386291504, "global_step": 244027, "epoch": 2940} {"train_loss": -24.509788513183594, "global_step": 244028, "epoch": 2940} {"train_loss": -24.32671546936035, "global_step": 244029, "epoch": 2940} {"train_loss": -24.520620346069336, "global_step": 244030, "epoch": 2940} {"train_loss": -24.82356834411621, "global_step": 244031, "epoch": 2940} {"train_loss": -24.531335830688477, "global_step": 244032, "epoch": 2940} {"train_loss": -24.378087997436523, "global_step": 244033, "epoch": 2940} {"train_loss": -24.50275993347168, "global_step": 244034, "epoch": 2940} {"train_loss": -24.66908073425293, "global_step": 244035, "epoch": 2940} {"train_loss": -24.67641258239746, "global_step": 244036, "epoch": 2940} {"train_loss": -24.704967498779297, "global_step": 244037, "epoch": 2940} {"train_loss": -24.27913475036621, "global_step": 244038, "epoch": 2940} {"train_loss": -24.63146209716797, "global_step": 244039, "epoch": 2940} {"train_loss": -24.449535369873047, "global_step": 244040, "epoch": 2940} {"train_loss": -24.7358455657959, "global_step": 244041, "epoch": 2940} {"train_loss": -24.913549423217773, "global_step": 244042, "epoch": 2940} {"train_loss": -24.8583927154541, "global_step": 244043, "epoch": 2940} {"train_loss": -24.61259651184082, "global_step": 244044, "epoch": 2940} {"train_loss": -24.87868309020996, "global_step": 244045, "epoch": 2940} {"train_loss": -24.69234848022461, "global_step": 244046, "epoch": 2940} {"train_loss": -24.861051559448242, "global_step": 244047, "epoch": 2940} {"train_loss": -24.691328048706055, "global_step": 244048, "epoch": 2940} {"train_loss": -24.785329818725586, "global_step": 244049, "epoch": 2940} {"train_loss": -24.874195098876953, "global_step": 244050, "epoch": 2940} {"train_loss": -24.671354293823242, "global_step": 244051, "epoch": 2940} {"train_loss": -24.97293472290039, "global_step": 244052, "epoch": 2940} {"train_loss": -25.049428939819336, "global_step": 244053, "epoch": 2940} {"train_loss": -24.7718505859375, "global_step": 244054, "epoch": 2940} {"train_loss": -24.862180709838867, "global_step": 244055, "epoch": 2940} {"train_loss": -25.292470932006836, "global_step": 244056, "epoch": 2940} {"train_loss": -25.03649139404297, "global_step": 244057, "epoch": 2940} {"train_loss": -25.076345443725586, "global_step": 244058, "epoch": 2940} {"train_loss": -25.07586097717285, "global_step": 244059, "epoch": 2940} {"train_loss": -24.601341247558594, "global_step": 244060, "epoch": 2940} {"train_loss": -24.746768951416016, "global_step": 244061, "epoch": 2940} {"train_loss": -25.111825942993164, "global_step": 244062, "epoch": 2940} {"train_loss": -24.974246978759766, "global_step": 244063, "epoch": 2940} {"train_loss": -25.163747787475586, "global_step": 244064, "epoch": 2940} {"train_loss": -25.104223251342773, "global_step": 244065, "epoch": 2940} {"train_loss": -24.982425689697266, "global_step": 244066, "epoch": 2940} {"train_loss": -25.053627014160156, "global_step": 244067, "epoch": 2940} {"train_loss": -25.35332679748535, "global_step": 244068, "epoch": 2940} {"train_loss": -25.30595588684082, "global_step": 244069, "epoch": 2940} {"train_loss": -25.074724197387695, "global_step": 244070, "epoch": 2940} {"train_loss": -25.204496383666992, "global_step": 244071, "epoch": 2940} {"train_loss": -25.259492874145508, "global_step": 244072, "epoch": 2940} {"train_loss": -25.151031494140625, "global_step": 244073, "epoch": 2940} {"train_loss": -25.055864334106445, "global_step": 244074, "epoch": 2940} {"train_loss": -25.319847106933594, "global_step": 244075, "epoch": 2940} {"train_loss": -24.877166748046875, "global_step": 244076, "epoch": 2940} {"train_loss": -24.98517417907715, "global_step": 244077, "epoch": 2940} {"train_loss": -24.715604782104492, "global_step": 244078, "epoch": 2940} {"train_loss": -24.608015060424805, "global_step": 244079, "epoch": 2940} {"train_loss": -24.608060836791992, "global_step": 244080, "epoch": 2940} {"train_loss": -23.948997497558594, "global_step": 244081, "epoch": 2940} {"train_loss": -23.94181251525879, "global_step": 244082, "epoch": 2940} {"train_loss": -23.7482967376709, "global_step": 244083, "epoch": 2940} {"train_loss": -24.421335220336914, "global_step": 244084, "epoch": 2940} {"train_loss": -24.785123825073242, "global_step": 244085, "epoch": 2940} {"train_loss": -24.575328826904297, "global_step": 244086, "epoch": 2940} {"train_loss": -24.7718563079834, "global_step": 244087, "epoch": 2940} {"train_loss": -25.21395492553711, "global_step": 244088, "epoch": 2940} {"train_loss": -24.605558395385742, "global_step": 244089, "epoch": 2940} {"train_loss": -24.175662994384766, "global_step": 244090, "epoch": 2940} {"train_loss": -24.30836296081543, "global_step": 244091, "epoch": 2940} {"train_loss": -24.75898551940918, "global_step": 244092, "epoch": 2940} {"train_loss": -24.910070419311523, "global_step": 244093, "epoch": 2940} {"train_loss": -25.027305603027344, "global_step": 244094, "epoch": 2940} {"train_loss": -24.424386978149414, "global_step": 244095, "epoch": 2940} {"train_loss": -24.851125717163086, "global_step": 244096, "epoch": 2940} {"train_loss": -24.53489112854004, "global_step": 244097, "epoch": 2940} {"train_loss": -24.884225845336914, "global_step": 244098, "epoch": 2940} {"train_loss": -25.083450317382812, "global_step": 244099, "epoch": 2940} {"train_loss": -25.234159469604492, "global_step": 244100, "epoch": 2940} {"train_loss": -24.960006713867188, "global_step": 244101, "epoch": 2940} {"train_loss": -24.69659040060388, "global_step": 244102, "epoch": 2940, "val_loss": 6791738.0} {"train_loss": -24.70890235900879, "global_step": 244103, "epoch": 2941} {"train_loss": -24.318876266479492, "global_step": 244104, "epoch": 2941} {"train_loss": -24.544645309448242, "global_step": 244105, "epoch": 2941} {"train_loss": -24.51617431640625, "global_step": 244106, "epoch": 2941} {"train_loss": -24.785823822021484, "global_step": 244107, "epoch": 2941} {"train_loss": -24.536855697631836, "global_step": 244108, "epoch": 2941} {"train_loss": -24.77910041809082, "global_step": 244109, "epoch": 2941} {"train_loss": -24.417322158813477, "global_step": 244110, "epoch": 2941} {"train_loss": -24.683713912963867, "global_step": 244111, "epoch": 2941} {"train_loss": -24.64899444580078, "global_step": 244112, "epoch": 2941} {"train_loss": -24.8041934967041, "global_step": 244113, "epoch": 2941} {"train_loss": -25.16187858581543, "global_step": 244114, "epoch": 2941} {"train_loss": -24.78865623474121, "global_step": 244115, "epoch": 2941} {"train_loss": -24.68134880065918, "global_step": 244116, "epoch": 2941} {"train_loss": -25.239370346069336, "global_step": 244117, "epoch": 2941} {"train_loss": -24.70686149597168, "global_step": 244118, "epoch": 2941} {"train_loss": -25.0838680267334, "global_step": 244119, "epoch": 2941} {"train_loss": -24.835569381713867, "global_step": 244120, "epoch": 2941} {"train_loss": -24.87055015563965, "global_step": 244121, "epoch": 2941} {"train_loss": -24.83024787902832, "global_step": 244122, "epoch": 2941} {"train_loss": -24.960134506225586, "global_step": 244123, "epoch": 2941} {"train_loss": -24.99578857421875, "global_step": 244124, "epoch": 2941} {"train_loss": -24.968442916870117, "global_step": 244125, "epoch": 2941} {"train_loss": -25.0551815032959, "global_step": 244126, "epoch": 2941} {"train_loss": -24.924169540405273, "global_step": 244127, "epoch": 2941} {"train_loss": -24.911592483520508, "global_step": 244128, "epoch": 2941} {"train_loss": -24.776826858520508, "global_step": 244129, "epoch": 2941} {"train_loss": -25.237592697143555, "global_step": 244130, "epoch": 2941} {"train_loss": -25.24401092529297, "global_step": 244131, "epoch": 2941} {"train_loss": -25.2041015625, "global_step": 244132, "epoch": 2941} {"train_loss": -24.950834274291992, "global_step": 244133, "epoch": 2941} {"train_loss": -24.855966567993164, "global_step": 244134, "epoch": 2941} {"train_loss": -25.01058006286621, "global_step": 244135, "epoch": 2941} {"train_loss": -24.86570167541504, "global_step": 244136, "epoch": 2941} {"train_loss": -25.12683868408203, "global_step": 244137, "epoch": 2941} {"train_loss": -25.23598289489746, "global_step": 244138, "epoch": 2941} {"train_loss": -24.954113006591797, "global_step": 244139, "epoch": 2941} {"train_loss": -24.472930908203125, "global_step": 244140, "epoch": 2941} {"train_loss": -25.159502029418945, "global_step": 244141, "epoch": 2941} {"train_loss": -24.777496337890625, "global_step": 244142, "epoch": 2941} {"train_loss": -24.940885543823242, "global_step": 244143, "epoch": 2941} {"train_loss": -25.00604820251465, "global_step": 244144, "epoch": 2941} {"train_loss": -25.064550399780273, "global_step": 244145, "epoch": 2941} {"train_loss": -24.65102195739746, "global_step": 244146, "epoch": 2941} {"train_loss": -25.031116485595703, "global_step": 244147, "epoch": 2941} {"train_loss": -24.72707176208496, "global_step": 244148, "epoch": 2941} {"train_loss": -24.891809463500977, "global_step": 244149, "epoch": 2941} {"train_loss": -24.4764461517334, "global_step": 244150, "epoch": 2941} {"train_loss": -25.14314842224121, "global_step": 244151, "epoch": 2941} {"train_loss": -24.795148849487305, "global_step": 244152, "epoch": 2941} {"train_loss": -24.820932388305664, "global_step": 244153, "epoch": 2941} {"train_loss": -25.005468368530273, "global_step": 244154, "epoch": 2941} {"train_loss": -24.824657440185547, "global_step": 244155, "epoch": 2941} {"train_loss": -25.01421356201172, "global_step": 244156, "epoch": 2941} {"train_loss": -25.041828155517578, "global_step": 244157, "epoch": 2941} {"train_loss": -25.16243553161621, "global_step": 244158, "epoch": 2941} {"train_loss": -24.69185447692871, "global_step": 244159, "epoch": 2941} {"train_loss": -24.525373458862305, "global_step": 244160, "epoch": 2941} {"train_loss": -24.70395851135254, "global_step": 244161, "epoch": 2941} {"train_loss": -24.97762107849121, "global_step": 244162, "epoch": 2941} {"train_loss": -24.57819938659668, "global_step": 244163, "epoch": 2941} {"train_loss": -24.948184967041016, "global_step": 244164, "epoch": 2941} {"train_loss": -24.797842025756836, "global_step": 244165, "epoch": 2941} {"train_loss": -24.889951705932617, "global_step": 244166, "epoch": 2941} {"train_loss": -24.592037200927734, "global_step": 244167, "epoch": 2941} {"train_loss": -24.811277389526367, "global_step": 244168, "epoch": 2941} {"train_loss": -25.372417449951172, "global_step": 244169, "epoch": 2941} {"train_loss": -25.072002410888672, "global_step": 244170, "epoch": 2941} {"train_loss": -24.77657127380371, "global_step": 244171, "epoch": 2941} {"train_loss": -24.967565536499023, "global_step": 244172, "epoch": 2941} {"train_loss": -25.092304229736328, "global_step": 244173, "epoch": 2941} {"train_loss": -24.8085880279541, "global_step": 244174, "epoch": 2941} {"train_loss": -25.213048934936523, "global_step": 244175, "epoch": 2941} {"train_loss": -24.8319091796875, "global_step": 244176, "epoch": 2941} {"train_loss": -24.916107177734375, "global_step": 244177, "epoch": 2941} {"train_loss": -24.81583595275879, "global_step": 244178, "epoch": 2941} {"train_loss": -25.010986328125, "global_step": 244179, "epoch": 2941} {"train_loss": -25.404300689697266, "global_step": 244180, "epoch": 2941} {"train_loss": -25.177968978881836, "global_step": 244181, "epoch": 2941} {"train_loss": -25.58517837524414, "global_step": 244182, "epoch": 2941} {"train_loss": -24.873868942260742, "global_step": 244183, "epoch": 2941} {"train_loss": -24.999881744384766, "global_step": 244184, "epoch": 2941} {"train_loss": -24.88430101325713, "global_step": 244185, "epoch": 2941, "val_loss": 6789989.0} {"train_loss": -24.437747955322266, "global_step": 244186, "epoch": 2942} {"train_loss": -24.19129180908203, "global_step": 244187, "epoch": 2942} {"train_loss": -24.6331844329834, "global_step": 244188, "epoch": 2942} {"train_loss": -24.543827056884766, "global_step": 244189, "epoch": 2942} {"train_loss": -24.486831665039062, "global_step": 244190, "epoch": 2942} {"train_loss": -24.491531372070312, "global_step": 244191, "epoch": 2942} {"train_loss": -24.81536102294922, "global_step": 244192, "epoch": 2942} {"train_loss": -25.109540939331055, "global_step": 244193, "epoch": 2942} {"train_loss": -24.440616607666016, "global_step": 244194, "epoch": 2942} {"train_loss": -24.64175033569336, "global_step": 244195, "epoch": 2942} {"train_loss": -24.753517150878906, "global_step": 244196, "epoch": 2942} {"train_loss": -24.525480270385742, "global_step": 244197, "epoch": 2942} {"train_loss": -24.97633171081543, "global_step": 244198, "epoch": 2942} {"train_loss": -24.554258346557617, "global_step": 244199, "epoch": 2942} {"train_loss": -24.804685592651367, "global_step": 244200, "epoch": 2942} {"train_loss": -24.57459831237793, "global_step": 244201, "epoch": 2942} {"train_loss": -24.6375789642334, "global_step": 244202, "epoch": 2942} {"train_loss": -24.741064071655273, "global_step": 244203, "epoch": 2942} {"train_loss": -24.632020950317383, "global_step": 244204, "epoch": 2942} {"train_loss": -24.849576950073242, "global_step": 244205, "epoch": 2942} {"train_loss": -25.014005661010742, "global_step": 244206, "epoch": 2942} {"train_loss": -24.89022445678711, "global_step": 244207, "epoch": 2942} {"train_loss": -25.23080062866211, "global_step": 244208, "epoch": 2942} {"train_loss": -24.740385055541992, "global_step": 244209, "epoch": 2942} {"train_loss": -24.696271896362305, "global_step": 244210, "epoch": 2942} {"train_loss": -24.929105758666992, "global_step": 244211, "epoch": 2942} {"train_loss": -25.280942916870117, "global_step": 244212, "epoch": 2942} {"train_loss": -25.329572677612305, "global_step": 244213, "epoch": 2942} {"train_loss": -25.07125473022461, "global_step": 244214, "epoch": 2942} {"train_loss": -24.818851470947266, "global_step": 244215, "epoch": 2942} {"train_loss": -25.10164451599121, "global_step": 244216, "epoch": 2942} {"train_loss": -25.074451446533203, "global_step": 244217, "epoch": 2942} {"train_loss": -24.96502685546875, "global_step": 244218, "epoch": 2942} {"train_loss": -25.242219924926758, "global_step": 244219, "epoch": 2942} {"train_loss": -24.989973068237305, "global_step": 244220, "epoch": 2942} {"train_loss": -24.669933319091797, "global_step": 244221, "epoch": 2942} {"train_loss": -25.02324676513672, "global_step": 244222, "epoch": 2942} {"train_loss": -25.132505416870117, "global_step": 244223, "epoch": 2942} {"train_loss": -25.456815719604492, "global_step": 244224, "epoch": 2942} {"train_loss": -25.00173568725586, "global_step": 244225, "epoch": 2942} {"train_loss": -25.098012924194336, "global_step": 244226, "epoch": 2942} {"train_loss": -24.625242233276367, "global_step": 244227, "epoch": 2942} {"train_loss": -25.163333892822266, "global_step": 244228, "epoch": 2942} {"train_loss": -25.243112564086914, "global_step": 244229, "epoch": 2942} {"train_loss": -24.827350616455078, "global_step": 244230, "epoch": 2942} {"train_loss": -25.197919845581055, "global_step": 244231, "epoch": 2942} {"train_loss": -25.256744384765625, "global_step": 244232, "epoch": 2942} {"train_loss": -25.35105323791504, "global_step": 244233, "epoch": 2942} {"train_loss": -24.85810661315918, "global_step": 244234, "epoch": 2942} {"train_loss": -25.28842544555664, "global_step": 244235, "epoch": 2942} {"train_loss": -24.98299217224121, "global_step": 244236, "epoch": 2942} {"train_loss": -24.875747680664062, "global_step": 244237, "epoch": 2942} {"train_loss": -24.885540008544922, "global_step": 244238, "epoch": 2942} {"train_loss": -25.041746139526367, "global_step": 244239, "epoch": 2942} {"train_loss": -25.231698989868164, "global_step": 244240, "epoch": 2942} {"train_loss": -24.94350814819336, "global_step": 244241, "epoch": 2942} {"train_loss": -25.013166427612305, "global_step": 244242, "epoch": 2942} {"train_loss": -24.82469940185547, "global_step": 244243, "epoch": 2942} {"train_loss": -25.182186126708984, "global_step": 244244, "epoch": 2942} {"train_loss": -24.671253204345703, "global_step": 244245, "epoch": 2942} {"train_loss": -25.031383514404297, "global_step": 244246, "epoch": 2942} {"train_loss": -25.115901947021484, "global_step": 244247, "epoch": 2942} {"train_loss": -25.19170570373535, "global_step": 244248, "epoch": 2942} {"train_loss": -24.464872360229492, "global_step": 244249, "epoch": 2942} {"train_loss": -24.79046058654785, "global_step": 244250, "epoch": 2942} {"train_loss": -24.64162826538086, "global_step": 244251, "epoch": 2942} {"train_loss": -24.961637496948242, "global_step": 244252, "epoch": 2942} {"train_loss": -24.41075897216797, "global_step": 244253, "epoch": 2942} {"train_loss": -24.51860237121582, "global_step": 244254, "epoch": 2942} {"train_loss": -24.45676040649414, "global_step": 244255, "epoch": 2942} {"train_loss": -24.526458740234375, "global_step": 244256, "epoch": 2942} {"train_loss": -24.69468116760254, "global_step": 244257, "epoch": 2942} {"train_loss": -24.405874252319336, "global_step": 244258, "epoch": 2942} {"train_loss": -24.532487869262695, "global_step": 244259, "epoch": 2942} {"train_loss": -24.30254554748535, "global_step": 244260, "epoch": 2942} {"train_loss": -24.188825607299805, "global_step": 244261, "epoch": 2942} {"train_loss": -24.284482955932617, "global_step": 244262, "epoch": 2942} {"train_loss": -24.663806915283203, "global_step": 244263, "epoch": 2942} {"train_loss": -24.260900497436523, "global_step": 244264, "epoch": 2942} {"train_loss": -24.90774917602539, "global_step": 244265, "epoch": 2942} {"train_loss": -25.181310653686523, "global_step": 244266, "epoch": 2942} {"train_loss": -24.822708129882812, "global_step": 244267, "epoch": 2942} {"train_loss": -24.830052249402886, "global_step": 244268, "epoch": 2942, "val_loss": 6799881.0} {"train_loss": -24.4920654296875, "global_step": 244269, "epoch": 2943} {"train_loss": -24.0266056060791, "global_step": 244270, "epoch": 2943} {"train_loss": -24.5211238861084, "global_step": 244271, "epoch": 2943} {"train_loss": -23.904497146606445, "global_step": 244272, "epoch": 2943} {"train_loss": -24.541446685791016, "global_step": 244273, "epoch": 2943} {"train_loss": -24.130842208862305, "global_step": 244274, "epoch": 2943} {"train_loss": -24.16761589050293, "global_step": 244275, "epoch": 2943} {"train_loss": -24.188119888305664, "global_step": 244276, "epoch": 2943} {"train_loss": -24.159170150756836, "global_step": 244277, "epoch": 2943} {"train_loss": -24.498064041137695, "global_step": 244278, "epoch": 2943} {"train_loss": -24.480798721313477, "global_step": 244279, "epoch": 2943} {"train_loss": -24.13813591003418, "global_step": 244280, "epoch": 2943} {"train_loss": -24.294164657592773, "global_step": 244281, "epoch": 2943} {"train_loss": -24.760669708251953, "global_step": 244282, "epoch": 2943} {"train_loss": -24.456483840942383, "global_step": 244283, "epoch": 2943} {"train_loss": -24.434967041015625, "global_step": 244284, "epoch": 2943} {"train_loss": -24.373550415039062, "global_step": 244285, "epoch": 2943} {"train_loss": -24.5130615234375, "global_step": 244286, "epoch": 2943} {"train_loss": -24.644189834594727, "global_step": 244287, "epoch": 2943} {"train_loss": -24.79138946533203, "global_step": 244288, "epoch": 2943} {"train_loss": -24.66238021850586, "global_step": 244289, "epoch": 2943} {"train_loss": -24.441410064697266, "global_step": 244290, "epoch": 2943} {"train_loss": -25.183643341064453, "global_step": 244291, "epoch": 2943} {"train_loss": -24.899158477783203, "global_step": 244292, "epoch": 2943} {"train_loss": -24.947643280029297, "global_step": 244293, "epoch": 2943} {"train_loss": -24.735082626342773, "global_step": 244294, "epoch": 2943} {"train_loss": -24.952909469604492, "global_step": 244295, "epoch": 2943} {"train_loss": -25.339990615844727, "global_step": 244296, "epoch": 2943} {"train_loss": -24.733922958374023, "global_step": 244297, "epoch": 2943} {"train_loss": -24.626789093017578, "global_step": 244298, "epoch": 2943} {"train_loss": -24.922529220581055, "global_step": 244299, "epoch": 2943} {"train_loss": -24.869413375854492, "global_step": 244300, "epoch": 2943} {"train_loss": -24.893009185791016, "global_step": 244301, "epoch": 2943} {"train_loss": -24.892749786376953, "global_step": 244302, "epoch": 2943} {"train_loss": -25.19952392578125, "global_step": 244303, "epoch": 2943} {"train_loss": -24.728124618530273, "global_step": 244304, "epoch": 2943} {"train_loss": -25.362281799316406, "global_step": 244305, "epoch": 2943} {"train_loss": -25.1489200592041, "global_step": 244306, "epoch": 2943} {"train_loss": -24.569080352783203, "global_step": 244307, "epoch": 2943} {"train_loss": -24.891117095947266, "global_step": 244308, "epoch": 2943} {"train_loss": -24.92511558532715, "global_step": 244309, "epoch": 2943} {"train_loss": -24.662893295288086, "global_step": 244310, "epoch": 2943} {"train_loss": -24.718833923339844, "global_step": 244311, "epoch": 2943} {"train_loss": -24.810205459594727, "global_step": 244312, "epoch": 2943} {"train_loss": -25.00824546813965, "global_step": 244313, "epoch": 2943} {"train_loss": -25.0059871673584, "global_step": 244314, "epoch": 2943} {"train_loss": -24.800540924072266, "global_step": 244315, "epoch": 2943} {"train_loss": -25.18105125427246, "global_step": 244316, "epoch": 2943} {"train_loss": -24.82389259338379, "global_step": 244317, "epoch": 2943} {"train_loss": -25.053316116333008, "global_step": 244318, "epoch": 2943} {"train_loss": -24.835264205932617, "global_step": 244319, "epoch": 2943} {"train_loss": -25.043991088867188, "global_step": 244320, "epoch": 2943} {"train_loss": -25.651996612548828, "global_step": 244321, "epoch": 2943} {"train_loss": -24.875967025756836, "global_step": 244322, "epoch": 2943} {"train_loss": -24.749998092651367, "global_step": 244323, "epoch": 2943} {"train_loss": -24.88982391357422, "global_step": 244324, "epoch": 2943} {"train_loss": -25.0367374420166, "global_step": 244325, "epoch": 2943} {"train_loss": -24.862329483032227, "global_step": 244326, "epoch": 2943} {"train_loss": -24.899734497070312, "global_step": 244327, "epoch": 2943} {"train_loss": -24.93100929260254, "global_step": 244328, "epoch": 2943} {"train_loss": -24.924036026000977, "global_step": 244329, "epoch": 2943} {"train_loss": -24.908363342285156, "global_step": 244330, "epoch": 2943} {"train_loss": -24.946273803710938, "global_step": 244331, "epoch": 2943} {"train_loss": -24.707727432250977, "global_step": 244332, "epoch": 2943} {"train_loss": -24.74735450744629, "global_step": 244333, "epoch": 2943} {"train_loss": -25.07413101196289, "global_step": 244334, "epoch": 2943} {"train_loss": -24.863027572631836, "global_step": 244335, "epoch": 2943} {"train_loss": -24.748722076416016, "global_step": 244336, "epoch": 2943} {"train_loss": -24.911544799804688, "global_step": 244337, "epoch": 2943} {"train_loss": -24.746780395507812, "global_step": 244338, "epoch": 2943} {"train_loss": -24.822093963623047, "global_step": 244339, "epoch": 2943} {"train_loss": -24.844863891601562, "global_step": 244340, "epoch": 2943} {"train_loss": -25.169109344482422, "global_step": 244341, "epoch": 2943} {"train_loss": -25.376514434814453, "global_step": 244342, "epoch": 2943} {"train_loss": -24.986101150512695, "global_step": 244343, "epoch": 2943} {"train_loss": -24.819129943847656, "global_step": 244344, "epoch": 2943} {"train_loss": -25.179523468017578, "global_step": 244345, "epoch": 2943} {"train_loss": -25.196592330932617, "global_step": 244346, "epoch": 2943} {"train_loss": -25.179956436157227, "global_step": 244347, "epoch": 2943} {"train_loss": -24.96837615966797, "global_step": 244348, "epoch": 2943} {"train_loss": -25.026559829711914, "global_step": 244349, "epoch": 2943} {"train_loss": -25.077795028686523, "global_step": 244350, "epoch": 2943} {"train_loss": -24.813959994948053, "global_step": 244351, "epoch": 2943, "val_loss": 6935499.5} {"train_loss": -24.864225387573242, "global_step": 244352, "epoch": 2944} {"train_loss": -24.611719131469727, "global_step": 244353, "epoch": 2944} {"train_loss": -24.594608306884766, "global_step": 244354, "epoch": 2944} {"train_loss": -24.626821517944336, "global_step": 244355, "epoch": 2944} {"train_loss": -24.661319732666016, "global_step": 244356, "epoch": 2944} {"train_loss": -23.888158798217773, "global_step": 244357, "epoch": 2944} {"train_loss": -24.38324737548828, "global_step": 244358, "epoch": 2944} {"train_loss": -24.65326499938965, "global_step": 244359, "epoch": 2944} {"train_loss": -24.55231475830078, "global_step": 244360, "epoch": 2944} {"train_loss": -24.703102111816406, "global_step": 244361, "epoch": 2944} {"train_loss": -24.334104537963867, "global_step": 244362, "epoch": 2944} {"train_loss": -24.688655853271484, "global_step": 244363, "epoch": 2944} {"train_loss": -24.460111618041992, "global_step": 244364, "epoch": 2944} {"train_loss": -24.378158569335938, "global_step": 244365, "epoch": 2944} {"train_loss": -24.77604103088379, "global_step": 244366, "epoch": 2944} {"train_loss": -24.723365783691406, "global_step": 244367, "epoch": 2944} {"train_loss": -24.496213912963867, "global_step": 244368, "epoch": 2944} {"train_loss": -24.75606346130371, "global_step": 244369, "epoch": 2944} {"train_loss": -25.31819725036621, "global_step": 244370, "epoch": 2944} {"train_loss": -24.83403205871582, "global_step": 244371, "epoch": 2944} {"train_loss": -25.250831604003906, "global_step": 244372, "epoch": 2944} {"train_loss": -24.46198081970215, "global_step": 244373, "epoch": 2944} {"train_loss": -25.192575454711914, "global_step": 244374, "epoch": 2944} {"train_loss": -25.1890926361084, "global_step": 244375, "epoch": 2944} {"train_loss": -24.64891815185547, "global_step": 244376, "epoch": 2944} {"train_loss": -24.519550323486328, "global_step": 244377, "epoch": 2944} {"train_loss": -24.962705612182617, "global_step": 244378, "epoch": 2944} {"train_loss": -24.711610794067383, "global_step": 244379, "epoch": 2944} {"train_loss": -24.903892517089844, "global_step": 244380, "epoch": 2944} {"train_loss": -24.903549194335938, "global_step": 244381, "epoch": 2944} {"train_loss": -24.88758659362793, "global_step": 244382, "epoch": 2944} {"train_loss": -25.079404830932617, "global_step": 244383, "epoch": 2944} {"train_loss": -25.16329002380371, "global_step": 244384, "epoch": 2944} {"train_loss": -25.169559478759766, "global_step": 244385, "epoch": 2944} {"train_loss": -25.176584243774414, "global_step": 244386, "epoch": 2944} {"train_loss": -24.810325622558594, "global_step": 244387, "epoch": 2944} {"train_loss": -24.887800216674805, "global_step": 244388, "epoch": 2944} {"train_loss": -24.529926300048828, "global_step": 244389, "epoch": 2944} {"train_loss": -24.909616470336914, "global_step": 244390, "epoch": 2944} {"train_loss": -24.90381622314453, "global_step": 244391, "epoch": 2944} {"train_loss": -24.818037033081055, "global_step": 244392, "epoch": 2944} {"train_loss": -24.76319122314453, "global_step": 244393, "epoch": 2944} {"train_loss": -24.894285202026367, "global_step": 244394, "epoch": 2944} {"train_loss": -24.813861846923828, "global_step": 244395, "epoch": 2944} {"train_loss": -24.910037994384766, "global_step": 244396, "epoch": 2944} {"train_loss": -25.20960807800293, "global_step": 244397, "epoch": 2944} {"train_loss": -24.972524642944336, "global_step": 244398, "epoch": 2944} {"train_loss": -25.160776138305664, "global_step": 244399, "epoch": 2944} {"train_loss": -25.199295043945312, "global_step": 244400, "epoch": 2944} {"train_loss": -25.135778427124023, "global_step": 244401, "epoch": 2944} {"train_loss": -25.1748104095459, "global_step": 244402, "epoch": 2944} {"train_loss": -24.636823654174805, "global_step": 244403, "epoch": 2944} {"train_loss": -24.787506103515625, "global_step": 244404, "epoch": 2944} {"train_loss": -25.105911254882812, "global_step": 244405, "epoch": 2944} {"train_loss": -24.682979583740234, "global_step": 244406, "epoch": 2944} {"train_loss": -24.589780807495117, "global_step": 244407, "epoch": 2944} {"train_loss": -25.006763458251953, "global_step": 244408, "epoch": 2944} {"train_loss": -25.12337303161621, "global_step": 244409, "epoch": 2944} {"train_loss": -24.84173583984375, "global_step": 244410, "epoch": 2944} {"train_loss": -24.982736587524414, "global_step": 244411, "epoch": 2944} {"train_loss": -24.939367294311523, "global_step": 244412, "epoch": 2944} {"train_loss": -25.039752960205078, "global_step": 244413, "epoch": 2944} {"train_loss": -25.079700469970703, "global_step": 244414, "epoch": 2944} {"train_loss": -25.32045555114746, "global_step": 244415, "epoch": 2944} {"train_loss": -24.83558464050293, "global_step": 244416, "epoch": 2944} {"train_loss": -25.308860778808594, "global_step": 244417, "epoch": 2944} {"train_loss": -25.34600067138672, "global_step": 244418, "epoch": 2944} {"train_loss": -25.00628089904785, "global_step": 244419, "epoch": 2944} {"train_loss": -25.429052352905273, "global_step": 244420, "epoch": 2944} {"train_loss": -25.011844635009766, "global_step": 244421, "epoch": 2944} {"train_loss": -24.97914695739746, "global_step": 244422, "epoch": 2944} {"train_loss": -25.09968376159668, "global_step": 244423, "epoch": 2944} {"train_loss": -25.119592666625977, "global_step": 244424, "epoch": 2944} {"train_loss": -25.223562240600586, "global_step": 244425, "epoch": 2944} {"train_loss": -25.158489227294922, "global_step": 244426, "epoch": 2944} {"train_loss": -25.187280654907227, "global_step": 244427, "epoch": 2944} {"train_loss": -24.818349838256836, "global_step": 244428, "epoch": 2944} {"train_loss": -25.342966079711914, "global_step": 244429, "epoch": 2944} {"train_loss": -25.095626831054688, "global_step": 244430, "epoch": 2944} {"train_loss": -24.60048484802246, "global_step": 244431, "epoch": 2944} {"train_loss": -24.742414474487305, "global_step": 244432, "epoch": 2944} {"train_loss": -24.862882614135742, "global_step": 244433, "epoch": 2944} {"train_loss": -24.891827962484705, "global_step": 244434, "epoch": 2944, "val_loss": 6776862.5} {"train_loss": -24.075082778930664, "global_step": 244435, "epoch": 2945} {"train_loss": -24.026161193847656, "global_step": 244436, "epoch": 2945} {"train_loss": -24.26654815673828, "global_step": 244437, "epoch": 2945} {"train_loss": -23.730993270874023, "global_step": 244438, "epoch": 2945} {"train_loss": -24.16761589050293, "global_step": 244439, "epoch": 2945} {"train_loss": -24.07257652282715, "global_step": 244440, "epoch": 2945} {"train_loss": -24.175922393798828, "global_step": 244441, "epoch": 2945} {"train_loss": -24.568449020385742, "global_step": 244442, "epoch": 2945} {"train_loss": -24.23797035217285, "global_step": 244443, "epoch": 2945} {"train_loss": -24.228473663330078, "global_step": 244444, "epoch": 2945} {"train_loss": -24.695165634155273, "global_step": 244445, "epoch": 2945} {"train_loss": -24.471027374267578, "global_step": 244446, "epoch": 2945} {"train_loss": -23.971418380737305, "global_step": 244447, "epoch": 2945} {"train_loss": -24.283233642578125, "global_step": 244448, "epoch": 2945} {"train_loss": -24.72891616821289, "global_step": 244449, "epoch": 2945} {"train_loss": -25.002798080444336, "global_step": 244450, "epoch": 2945} {"train_loss": -24.422863006591797, "global_step": 244451, "epoch": 2945} {"train_loss": -24.38434600830078, "global_step": 244452, "epoch": 2945} {"train_loss": -24.354646682739258, "global_step": 244453, "epoch": 2945} {"train_loss": -24.364145278930664, "global_step": 244454, "epoch": 2945} {"train_loss": -24.528776168823242, "global_step": 244455, "epoch": 2945} {"train_loss": -24.749881744384766, "global_step": 244456, "epoch": 2945} {"train_loss": -24.61349105834961, "global_step": 244457, "epoch": 2945} {"train_loss": -24.70954704284668, "global_step": 244458, "epoch": 2945} {"train_loss": -24.584135055541992, "global_step": 244459, "epoch": 2945} {"train_loss": -24.70000648498535, "global_step": 244460, "epoch": 2945} {"train_loss": -24.630651473999023, "global_step": 244461, "epoch": 2945} {"train_loss": -24.61099624633789, "global_step": 244462, "epoch": 2945} {"train_loss": -24.61182403564453, "global_step": 244463, "epoch": 2945} {"train_loss": -24.379657745361328, "global_step": 244464, "epoch": 2945} {"train_loss": -24.984708786010742, "global_step": 244465, "epoch": 2945} {"train_loss": -24.741085052490234, "global_step": 244466, "epoch": 2945} {"train_loss": -24.6773624420166, "global_step": 244467, "epoch": 2945} {"train_loss": -24.91957664489746, "global_step": 244468, "epoch": 2945} {"train_loss": -25.073123931884766, "global_step": 244469, "epoch": 2945} {"train_loss": -25.231443405151367, "global_step": 244470, "epoch": 2945} {"train_loss": -24.92105484008789, "global_step": 244471, "epoch": 2945} {"train_loss": -24.646589279174805, "global_step": 244472, "epoch": 2945} {"train_loss": -24.814102172851562, "global_step": 244473, "epoch": 2945} {"train_loss": -24.91284942626953, "global_step": 244474, "epoch": 2945} {"train_loss": -24.77249526977539, "global_step": 244475, "epoch": 2945} {"train_loss": -25.18217658996582, "global_step": 244476, "epoch": 2945} {"train_loss": -24.91924476623535, "global_step": 244477, "epoch": 2945} {"train_loss": -24.78481101989746, "global_step": 244478, "epoch": 2945} {"train_loss": -24.770254135131836, "global_step": 244479, "epoch": 2945} {"train_loss": -25.052419662475586, "global_step": 244480, "epoch": 2945} {"train_loss": -25.1683406829834, "global_step": 244481, "epoch": 2945} {"train_loss": -24.858779907226562, "global_step": 244482, "epoch": 2945} {"train_loss": -25.18729019165039, "global_step": 244483, "epoch": 2945} {"train_loss": -25.073833465576172, "global_step": 244484, "epoch": 2945} {"train_loss": -25.005287170410156, "global_step": 244485, "epoch": 2945} {"train_loss": -24.93754005432129, "global_step": 244486, "epoch": 2945} {"train_loss": -24.821531295776367, "global_step": 244487, "epoch": 2945} {"train_loss": -25.08968162536621, "global_step": 244488, "epoch": 2945} {"train_loss": -25.033695220947266, "global_step": 244489, "epoch": 2945} {"train_loss": -25.354734420776367, "global_step": 244490, "epoch": 2945} {"train_loss": -25.04859161376953, "global_step": 244491, "epoch": 2945} {"train_loss": -25.075429916381836, "global_step": 244492, "epoch": 2945} {"train_loss": -24.9718074798584, "global_step": 244493, "epoch": 2945} {"train_loss": -24.794940948486328, "global_step": 244494, "epoch": 2945} {"train_loss": -24.972618103027344, "global_step": 244495, "epoch": 2945} {"train_loss": -24.91486167907715, "global_step": 244496, "epoch": 2945} {"train_loss": -24.911542892456055, "global_step": 244497, "epoch": 2945} {"train_loss": -25.22195816040039, "global_step": 244498, "epoch": 2945} {"train_loss": -24.62747573852539, "global_step": 244499, "epoch": 2945} {"train_loss": -24.874614715576172, "global_step": 244500, "epoch": 2945} {"train_loss": -25.120813369750977, "global_step": 244501, "epoch": 2945} {"train_loss": -25.06172752380371, "global_step": 244502, "epoch": 2945} {"train_loss": -25.28403663635254, "global_step": 244503, "epoch": 2945} {"train_loss": -24.669572830200195, "global_step": 244504, "epoch": 2945} {"train_loss": -24.9422550201416, "global_step": 244505, "epoch": 2945} {"train_loss": -24.834487915039062, "global_step": 244506, "epoch": 2945} {"train_loss": -25.091779708862305, "global_step": 244507, "epoch": 2945} {"train_loss": -24.701322555541992, "global_step": 244508, "epoch": 2945} {"train_loss": -25.000350952148438, "global_step": 244509, "epoch": 2945} {"train_loss": -25.018775939941406, "global_step": 244510, "epoch": 2945} {"train_loss": -25.023115158081055, "global_step": 244511, "epoch": 2945} {"train_loss": -24.800384521484375, "global_step": 244512, "epoch": 2945} {"train_loss": -24.636655807495117, "global_step": 244513, "epoch": 2945} {"train_loss": -24.944412231445312, "global_step": 244514, "epoch": 2945} {"train_loss": -24.917945861816406, "global_step": 244515, "epoch": 2945} {"train_loss": -24.762319564819336, "global_step": 244516, "epoch": 2945} {"train_loss": -24.751733136464313, "global_step": 244517, "epoch": 2945, "val_loss": 6811821.5} {"train_loss": -24.833044052124023, "global_step": 244518, "epoch": 2946} {"train_loss": -24.783071517944336, "global_step": 244519, "epoch": 2946} {"train_loss": -24.42025375366211, "global_step": 244520, "epoch": 2946} {"train_loss": -24.424367904663086, "global_step": 244521, "epoch": 2946} {"train_loss": -24.333908081054688, "global_step": 244522, "epoch": 2946} {"train_loss": -24.708362579345703, "global_step": 244523, "epoch": 2946} {"train_loss": -24.653440475463867, "global_step": 244524, "epoch": 2946} {"train_loss": -24.591156005859375, "global_step": 244525, "epoch": 2946} {"train_loss": -24.56203269958496, "global_step": 244526, "epoch": 2946} {"train_loss": -24.39199447631836, "global_step": 244527, "epoch": 2946} {"train_loss": -24.828933715820312, "global_step": 244528, "epoch": 2946} {"train_loss": -24.67583656311035, "global_step": 244529, "epoch": 2946} {"train_loss": -24.535629272460938, "global_step": 244530, "epoch": 2946} {"train_loss": -24.608522415161133, "global_step": 244531, "epoch": 2946} {"train_loss": -24.63286590576172, "global_step": 244532, "epoch": 2946} {"train_loss": -24.48809242248535, "global_step": 244533, "epoch": 2946} {"train_loss": -24.50303840637207, "global_step": 244534, "epoch": 2946} {"train_loss": -24.751771926879883, "global_step": 244535, "epoch": 2946} {"train_loss": -24.89056968688965, "global_step": 244536, "epoch": 2946} {"train_loss": -24.927133560180664, "global_step": 244537, "epoch": 2946} {"train_loss": -24.968814849853516, "global_step": 244538, "epoch": 2946} {"train_loss": -24.841020584106445, "global_step": 244539, "epoch": 2946} {"train_loss": -24.95869255065918, "global_step": 244540, "epoch": 2946} {"train_loss": -24.477943420410156, "global_step": 244541, "epoch": 2946} {"train_loss": -24.706775665283203, "global_step": 244542, "epoch": 2946} {"train_loss": -25.10439109802246, "global_step": 244543, "epoch": 2946} {"train_loss": -24.771116256713867, "global_step": 244544, "epoch": 2946} {"train_loss": -25.10574722290039, "global_step": 244545, "epoch": 2946} {"train_loss": -24.76350975036621, "global_step": 244546, "epoch": 2946} {"train_loss": -24.88776969909668, "global_step": 244547, "epoch": 2946} {"train_loss": -24.942224502563477, "global_step": 244548, "epoch": 2946} {"train_loss": -25.121204376220703, "global_step": 244549, "epoch": 2946} {"train_loss": -24.68630027770996, "global_step": 244550, "epoch": 2946} {"train_loss": -24.779056549072266, "global_step": 244551, "epoch": 2946} {"train_loss": -24.899154663085938, "global_step": 244552, "epoch": 2946} {"train_loss": -24.955305099487305, "global_step": 244553, "epoch": 2946} {"train_loss": -25.11568832397461, "global_step": 244554, "epoch": 2946} {"train_loss": -24.879966735839844, "global_step": 244555, "epoch": 2946} {"train_loss": -25.03435707092285, "global_step": 244556, "epoch": 2946} {"train_loss": -24.536142349243164, "global_step": 244557, "epoch": 2946} {"train_loss": -24.85858154296875, "global_step": 244558, "epoch": 2946} {"train_loss": -24.89229965209961, "global_step": 244559, "epoch": 2946} {"train_loss": -24.825605392456055, "global_step": 244560, "epoch": 2946} {"train_loss": -25.11219596862793, "global_step": 244561, "epoch": 2946} {"train_loss": -24.983064651489258, "global_step": 244562, "epoch": 2946} {"train_loss": -25.15452766418457, "global_step": 244563, "epoch": 2946} {"train_loss": -25.325571060180664, "global_step": 244564, "epoch": 2946} {"train_loss": -25.642475128173828, "global_step": 244565, "epoch": 2946} {"train_loss": -25.19337272644043, "global_step": 244566, "epoch": 2946} {"train_loss": -25.35851287841797, "global_step": 244567, "epoch": 2946} {"train_loss": -24.925241470336914, "global_step": 244568, "epoch": 2946} {"train_loss": -24.91514778137207, "global_step": 244569, "epoch": 2946} {"train_loss": -24.826345443725586, "global_step": 244570, "epoch": 2946} {"train_loss": -25.02781867980957, "global_step": 244571, "epoch": 2946} {"train_loss": -24.993677139282227, "global_step": 244572, "epoch": 2946} {"train_loss": -25.24639892578125, "global_step": 244573, "epoch": 2946} {"train_loss": -25.122055053710938, "global_step": 244574, "epoch": 2946} {"train_loss": -25.218677520751953, "global_step": 244575, "epoch": 2946} {"train_loss": -24.999385833740234, "global_step": 244576, "epoch": 2946} {"train_loss": -25.41352653503418, "global_step": 244577, "epoch": 2946} {"train_loss": -24.994253158569336, "global_step": 244578, "epoch": 2946} {"train_loss": -24.943655014038086, "global_step": 244579, "epoch": 2946} {"train_loss": -25.254545211791992, "global_step": 244580, "epoch": 2946} {"train_loss": -24.92453956604004, "global_step": 244581, "epoch": 2946} {"train_loss": -24.832992553710938, "global_step": 244582, "epoch": 2946} {"train_loss": -25.133670806884766, "global_step": 244583, "epoch": 2946} {"train_loss": -24.83268165588379, "global_step": 244584, "epoch": 2946} {"train_loss": -25.123197555541992, "global_step": 244585, "epoch": 2946} {"train_loss": -25.136533737182617, "global_step": 244586, "epoch": 2946} {"train_loss": -25.006065368652344, "global_step": 244587, "epoch": 2946} {"train_loss": -24.457204818725586, "global_step": 244588, "epoch": 2946} {"train_loss": -24.902515411376953, "global_step": 244589, "epoch": 2946} {"train_loss": -25.14369773864746, "global_step": 244590, "epoch": 2946} {"train_loss": -25.01848793029785, "global_step": 244591, "epoch": 2946} {"train_loss": -24.907752990722656, "global_step": 244592, "epoch": 2946} {"train_loss": -25.094770431518555, "global_step": 244593, "epoch": 2946} {"train_loss": -24.62575340270996, "global_step": 244594, "epoch": 2946} {"train_loss": -24.55377197265625, "global_step": 244595, "epoch": 2946} {"train_loss": -24.801788330078125, "global_step": 244596, "epoch": 2946} {"train_loss": -25.053159713745117, "global_step": 244597, "epoch": 2946} {"train_loss": -24.662057876586914, "global_step": 244598, "epoch": 2946} {"train_loss": -24.943950653076172, "global_step": 244599, "epoch": 2946} {"train_loss": -24.900939573724585, "global_step": 244600, "epoch": 2946, "val_loss": 6943786.0} {"train_loss": -24.07729148864746, "global_step": 244601, "epoch": 2947} {"train_loss": -23.627490997314453, "global_step": 244602, "epoch": 2947} {"train_loss": -23.914215087890625, "global_step": 244603, "epoch": 2947} {"train_loss": -23.820188522338867, "global_step": 244604, "epoch": 2947} {"train_loss": -23.786592483520508, "global_step": 244605, "epoch": 2947} {"train_loss": -24.5714168548584, "global_step": 244606, "epoch": 2947} {"train_loss": -24.27692985534668, "global_step": 244607, "epoch": 2947} {"train_loss": -23.97885513305664, "global_step": 244608, "epoch": 2947} {"train_loss": -23.969379425048828, "global_step": 244609, "epoch": 2947} {"train_loss": -24.318450927734375, "global_step": 244610, "epoch": 2947} {"train_loss": -24.466354370117188, "global_step": 244611, "epoch": 2947} {"train_loss": -24.368310928344727, "global_step": 244612, "epoch": 2947} {"train_loss": -24.37710952758789, "global_step": 244613, "epoch": 2947} {"train_loss": -24.63749885559082, "global_step": 244614, "epoch": 2947} {"train_loss": -24.2810115814209, "global_step": 244615, "epoch": 2947} {"train_loss": -24.4973201751709, "global_step": 244616, "epoch": 2947} {"train_loss": -24.607084274291992, "global_step": 244617, "epoch": 2947} {"train_loss": -24.31807518005371, "global_step": 244618, "epoch": 2947} {"train_loss": -24.71097183227539, "global_step": 244619, "epoch": 2947} {"train_loss": -24.200361251831055, "global_step": 244620, "epoch": 2947} {"train_loss": -24.712247848510742, "global_step": 244621, "epoch": 2947} {"train_loss": -24.685712814331055, "global_step": 244622, "epoch": 2947} {"train_loss": -24.944828033447266, "global_step": 244623, "epoch": 2947} {"train_loss": -24.472932815551758, "global_step": 244624, "epoch": 2947} {"train_loss": -24.863853454589844, "global_step": 244625, "epoch": 2947} {"train_loss": -24.518308639526367, "global_step": 244626, "epoch": 2947} {"train_loss": -24.708829879760742, "global_step": 244627, "epoch": 2947} {"train_loss": -24.639541625976562, "global_step": 244628, "epoch": 2947} {"train_loss": -24.823387145996094, "global_step": 244629, "epoch": 2947} {"train_loss": -24.913328170776367, "global_step": 244630, "epoch": 2947} {"train_loss": -24.956541061401367, "global_step": 244631, "epoch": 2947} {"train_loss": -24.99928092956543, "global_step": 244632, "epoch": 2947} {"train_loss": -24.813573837280273, "global_step": 244633, "epoch": 2947} {"train_loss": -24.593473434448242, "global_step": 244634, "epoch": 2947} {"train_loss": -25.07111167907715, "global_step": 244635, "epoch": 2947} {"train_loss": -25.11385726928711, "global_step": 244636, "epoch": 2947} {"train_loss": -25.091453552246094, "global_step": 244637, "epoch": 2947} {"train_loss": -25.3319034576416, "global_step": 244638, "epoch": 2947} {"train_loss": -25.137771606445312, "global_step": 244639, "epoch": 2947} {"train_loss": -25.0130615234375, "global_step": 244640, "epoch": 2947} {"train_loss": -24.967863082885742, "global_step": 244641, "epoch": 2947} {"train_loss": -25.22804832458496, "global_step": 244642, "epoch": 2947} {"train_loss": -24.686826705932617, "global_step": 244643, "epoch": 2947} {"train_loss": -24.999942779541016, "global_step": 244644, "epoch": 2947} {"train_loss": -25.379392623901367, "global_step": 244645, "epoch": 2947} {"train_loss": -24.938459396362305, "global_step": 244646, "epoch": 2947} {"train_loss": -24.86807632446289, "global_step": 244647, "epoch": 2947} {"train_loss": -24.775766372680664, "global_step": 244648, "epoch": 2947} {"train_loss": -25.142179489135742, "global_step": 244649, "epoch": 2947} {"train_loss": -25.045272827148438, "global_step": 244650, "epoch": 2947} {"train_loss": -25.22786521911621, "global_step": 244651, "epoch": 2947} {"train_loss": -25.003320693969727, "global_step": 244652, "epoch": 2947} {"train_loss": -24.632415771484375, "global_step": 244653, "epoch": 2947} {"train_loss": -24.956287384033203, "global_step": 244654, "epoch": 2947} {"train_loss": -24.99366569519043, "global_step": 244655, "epoch": 2947} {"train_loss": -25.20941734313965, "global_step": 244656, "epoch": 2947} {"train_loss": -24.87470817565918, "global_step": 244657, "epoch": 2947} {"train_loss": -24.851123809814453, "global_step": 244658, "epoch": 2947} {"train_loss": -24.816158294677734, "global_step": 244659, "epoch": 2947} {"train_loss": -25.089242935180664, "global_step": 244660, "epoch": 2947} {"train_loss": -25.251571655273438, "global_step": 244661, "epoch": 2947} {"train_loss": -24.981985092163086, "global_step": 244662, "epoch": 2947} {"train_loss": -25.36017608642578, "global_step": 244663, "epoch": 2947} {"train_loss": -25.189878463745117, "global_step": 244664, "epoch": 2947} {"train_loss": -24.99997329711914, "global_step": 244665, "epoch": 2947} {"train_loss": -24.68903350830078, "global_step": 244666, "epoch": 2947} {"train_loss": -25.15193748474121, "global_step": 244667, "epoch": 2947} {"train_loss": -24.873226165771484, "global_step": 244668, "epoch": 2947} {"train_loss": -25.025938034057617, "global_step": 244669, "epoch": 2947} {"train_loss": -24.805208206176758, "global_step": 244670, "epoch": 2947} {"train_loss": -24.98394775390625, "global_step": 244671, "epoch": 2947} {"train_loss": -24.984052658081055, "global_step": 244672, "epoch": 2947} {"train_loss": -24.722883224487305, "global_step": 244673, "epoch": 2947} {"train_loss": -24.767135620117188, "global_step": 244674, "epoch": 2947} {"train_loss": -24.973800659179688, "global_step": 244675, "epoch": 2947} {"train_loss": -24.99928855895996, "global_step": 244676, "epoch": 2947} {"train_loss": -24.975406646728516, "global_step": 244677, "epoch": 2947} {"train_loss": -24.846668243408203, "global_step": 244678, "epoch": 2947} {"train_loss": -24.781524658203125, "global_step": 244679, "epoch": 2947} {"train_loss": -25.31964874267578, "global_step": 244680, "epoch": 2947} {"train_loss": -25.452558517456055, "global_step": 244681, "epoch": 2947} {"train_loss": -24.81975746154785, "global_step": 244682, "epoch": 2947} {"train_loss": -24.776416663663934, "global_step": 244683, "epoch": 2947, "val_loss": 6943094.0} {"train_loss": -24.625078201293945, "global_step": 244684, "epoch": 2948} {"train_loss": -24.146453857421875, "global_step": 244685, "epoch": 2948} {"train_loss": -24.75945472717285, "global_step": 244686, "epoch": 2948} {"train_loss": -24.415634155273438, "global_step": 244687, "epoch": 2948} {"train_loss": -24.097232818603516, "global_step": 244688, "epoch": 2948} {"train_loss": -24.159765243530273, "global_step": 244689, "epoch": 2948} {"train_loss": -24.934473037719727, "global_step": 244690, "epoch": 2948} {"train_loss": -24.681394577026367, "global_step": 244691, "epoch": 2948} {"train_loss": -24.730119705200195, "global_step": 244692, "epoch": 2948} {"train_loss": -24.695585250854492, "global_step": 244693, "epoch": 2948} {"train_loss": -24.76715087890625, "global_step": 244694, "epoch": 2948} {"train_loss": -24.72437858581543, "global_step": 244695, "epoch": 2948} {"train_loss": -24.78981590270996, "global_step": 244696, "epoch": 2948} {"train_loss": -25.05588722229004, "global_step": 244697, "epoch": 2948} {"train_loss": -24.566984176635742, "global_step": 244698, "epoch": 2948} {"train_loss": -24.788162231445312, "global_step": 244699, "epoch": 2948} {"train_loss": -25.162412643432617, "global_step": 244700, "epoch": 2948} {"train_loss": -24.7446231842041, "global_step": 244701, "epoch": 2948} {"train_loss": -24.748477935791016, "global_step": 244702, "epoch": 2948} {"train_loss": -24.726526260375977, "global_step": 244703, "epoch": 2948} {"train_loss": -25.041858673095703, "global_step": 244704, "epoch": 2948} {"train_loss": -24.863981246948242, "global_step": 244705, "epoch": 2948} {"train_loss": -24.66731071472168, "global_step": 244706, "epoch": 2948} {"train_loss": -24.61829948425293, "global_step": 244707, "epoch": 2948} {"train_loss": -24.774982452392578, "global_step": 244708, "epoch": 2948} {"train_loss": -25.004241943359375, "global_step": 244709, "epoch": 2948} {"train_loss": -25.281240463256836, "global_step": 244710, "epoch": 2948} {"train_loss": -24.665817260742188, "global_step": 244711, "epoch": 2948} {"train_loss": -24.829822540283203, "global_step": 244712, "epoch": 2948} {"train_loss": -24.838260650634766, "global_step": 244713, "epoch": 2948} {"train_loss": -25.392505645751953, "global_step": 244714, "epoch": 2948} {"train_loss": -24.7758731842041, "global_step": 244715, "epoch": 2948} {"train_loss": -24.93330955505371, "global_step": 244716, "epoch": 2948} {"train_loss": -25.201648712158203, "global_step": 244717, "epoch": 2948} {"train_loss": -25.182809829711914, "global_step": 244718, "epoch": 2948} {"train_loss": -25.07358169555664, "global_step": 244719, "epoch": 2948} {"train_loss": -24.892749786376953, "global_step": 244720, "epoch": 2948} {"train_loss": -25.101646423339844, "global_step": 244721, "epoch": 2948} {"train_loss": -24.811677932739258, "global_step": 244722, "epoch": 2948} {"train_loss": -24.9134521484375, "global_step": 244723, "epoch": 2948} {"train_loss": -24.812835693359375, "global_step": 244724, "epoch": 2948} {"train_loss": -25.112051010131836, "global_step": 244725, "epoch": 2948} {"train_loss": -24.963951110839844, "global_step": 244726, "epoch": 2948} {"train_loss": -24.979013442993164, "global_step": 244727, "epoch": 2948} {"train_loss": -25.391706466674805, "global_step": 244728, "epoch": 2948} {"train_loss": -24.897119522094727, "global_step": 244729, "epoch": 2948} {"train_loss": -25.025054931640625, "global_step": 244730, "epoch": 2948} {"train_loss": -25.00339126586914, "global_step": 244731, "epoch": 2948} {"train_loss": -25.35589027404785, "global_step": 244732, "epoch": 2948} {"train_loss": -25.01429557800293, "global_step": 244733, "epoch": 2948} {"train_loss": -25.28453254699707, "global_step": 244734, "epoch": 2948} {"train_loss": -25.379425048828125, "global_step": 244735, "epoch": 2948} {"train_loss": -24.871410369873047, "global_step": 244736, "epoch": 2948} {"train_loss": -25.22079849243164, "global_step": 244737, "epoch": 2948} {"train_loss": -24.911489486694336, "global_step": 244738, "epoch": 2948} {"train_loss": -24.909833908081055, "global_step": 244739, "epoch": 2948} {"train_loss": -25.586355209350586, "global_step": 244740, "epoch": 2948} {"train_loss": -25.194372177124023, "global_step": 244741, "epoch": 2948} {"train_loss": -25.393461227416992, "global_step": 244742, "epoch": 2948} {"train_loss": -24.312803268432617, "global_step": 244743, "epoch": 2948} {"train_loss": -24.083660125732422, "global_step": 244744, "epoch": 2948} {"train_loss": -24.4582576751709, "global_step": 244745, "epoch": 2948} {"train_loss": -24.425687789916992, "global_step": 244746, "epoch": 2948} {"train_loss": -24.513288497924805, "global_step": 244747, "epoch": 2948} {"train_loss": -24.451034545898438, "global_step": 244748, "epoch": 2948} {"train_loss": -24.61670684814453, "global_step": 244749, "epoch": 2948} {"train_loss": -24.669979095458984, "global_step": 244750, "epoch": 2948} {"train_loss": -24.767072677612305, "global_step": 244751, "epoch": 2948} {"train_loss": -24.987707138061523, "global_step": 244752, "epoch": 2948} {"train_loss": -24.7440242767334, "global_step": 244753, "epoch": 2948} {"train_loss": -24.939743041992188, "global_step": 244754, "epoch": 2948} {"train_loss": -24.969196319580078, "global_step": 244755, "epoch": 2948} {"train_loss": -24.836790084838867, "global_step": 244756, "epoch": 2948} {"train_loss": -24.686798095703125, "global_step": 244757, "epoch": 2948} {"train_loss": -24.840444564819336, "global_step": 244758, "epoch": 2948} {"train_loss": -25.000171661376953, "global_step": 244759, "epoch": 2948} {"train_loss": -24.273027420043945, "global_step": 244760, "epoch": 2948} {"train_loss": -24.76272964477539, "global_step": 244761, "epoch": 2948} {"train_loss": -24.868574142456055, "global_step": 244762, "epoch": 2948} {"train_loss": -24.802762985229492, "global_step": 244763, "epoch": 2948} {"train_loss": -24.993141174316406, "global_step": 244764, "epoch": 2948} {"train_loss": -25.05214500427246, "global_step": 244765, "epoch": 2948} {"train_loss": -24.842638268528216, "global_step": 244766, "epoch": 2948, "val_loss": 6746517.0} {"train_loss": -24.387853622436523, "global_step": 244767, "epoch": 2949} {"train_loss": -24.7847957611084, "global_step": 244768, "epoch": 2949} {"train_loss": -24.632476806640625, "global_step": 244769, "epoch": 2949} {"train_loss": -24.649656295776367, "global_step": 244770, "epoch": 2949} {"train_loss": -24.267255783081055, "global_step": 244771, "epoch": 2949} {"train_loss": -24.67197036743164, "global_step": 244772, "epoch": 2949} {"train_loss": -24.926427841186523, "global_step": 244773, "epoch": 2949} {"train_loss": -24.68195915222168, "global_step": 244774, "epoch": 2949} {"train_loss": -24.240070343017578, "global_step": 244775, "epoch": 2949} {"train_loss": -24.92975425720215, "global_step": 244776, "epoch": 2949} {"train_loss": -24.80457878112793, "global_step": 244777, "epoch": 2949} {"train_loss": -24.844409942626953, "global_step": 244778, "epoch": 2949} {"train_loss": -24.884733200073242, "global_step": 244779, "epoch": 2949} {"train_loss": -24.89191436767578, "global_step": 244780, "epoch": 2949} {"train_loss": -24.57391929626465, "global_step": 244781, "epoch": 2949} {"train_loss": -24.76289176940918, "global_step": 244782, "epoch": 2949} {"train_loss": -25.42275047302246, "global_step": 244783, "epoch": 2949} {"train_loss": -24.58026695251465, "global_step": 244784, "epoch": 2949} {"train_loss": -24.976125717163086, "global_step": 244785, "epoch": 2949} {"train_loss": -25.1258487701416, "global_step": 244786, "epoch": 2949} {"train_loss": -24.448575973510742, "global_step": 244787, "epoch": 2949} {"train_loss": -25.18163299560547, "global_step": 244788, "epoch": 2949} {"train_loss": -24.5532283782959, "global_step": 244789, "epoch": 2949} {"train_loss": -24.740703582763672, "global_step": 244790, "epoch": 2949} {"train_loss": -24.58742904663086, "global_step": 244791, "epoch": 2949} {"train_loss": -24.565811157226562, "global_step": 244792, "epoch": 2949} {"train_loss": -24.798025131225586, "global_step": 244793, "epoch": 2949} {"train_loss": -25.0715389251709, "global_step": 244794, "epoch": 2949} {"train_loss": -24.696094512939453, "global_step": 244795, "epoch": 2949} {"train_loss": -24.99297523498535, "global_step": 244796, "epoch": 2949} {"train_loss": -24.70298194885254, "global_step": 244797, "epoch": 2949} {"train_loss": -24.806989669799805, "global_step": 244798, "epoch": 2949} {"train_loss": -24.873493194580078, "global_step": 244799, "epoch": 2949} {"train_loss": -24.98141860961914, "global_step": 244800, "epoch": 2949} {"train_loss": -24.705915451049805, "global_step": 244801, "epoch": 2949} {"train_loss": -24.99446678161621, "global_step": 244802, "epoch": 2949} {"train_loss": -24.716230392456055, "global_step": 244803, "epoch": 2949} {"train_loss": -24.991830825805664, "global_step": 244804, "epoch": 2949} {"train_loss": -24.89525032043457, "global_step": 244805, "epoch": 2949} {"train_loss": -25.236682891845703, "global_step": 244806, "epoch": 2949} {"train_loss": -24.9660701751709, "global_step": 244807, "epoch": 2949} {"train_loss": -24.70859718322754, "global_step": 244808, "epoch": 2949} {"train_loss": -24.863075256347656, "global_step": 244809, "epoch": 2949} {"train_loss": -24.8969669342041, "global_step": 244810, "epoch": 2949} {"train_loss": -25.09414291381836, "global_step": 244811, "epoch": 2949} {"train_loss": -25.19251823425293, "global_step": 244812, "epoch": 2949} {"train_loss": -25.040464401245117, "global_step": 244813, "epoch": 2949} {"train_loss": -24.66449546813965, "global_step": 244814, "epoch": 2949} {"train_loss": -24.536710739135742, "global_step": 244815, "epoch": 2949} {"train_loss": -24.400861740112305, "global_step": 244816, "epoch": 2949} {"train_loss": -24.202604293823242, "global_step": 244817, "epoch": 2949} {"train_loss": -24.21927261352539, "global_step": 244818, "epoch": 2949} {"train_loss": -24.996313095092773, "global_step": 244819, "epoch": 2949} {"train_loss": -25.107019424438477, "global_step": 244820, "epoch": 2949} {"train_loss": -24.663284301757812, "global_step": 244821, "epoch": 2949} {"train_loss": -24.648427963256836, "global_step": 244822, "epoch": 2949} {"train_loss": -24.357406616210938, "global_step": 244823, "epoch": 2949} {"train_loss": -25.48133659362793, "global_step": 244824, "epoch": 2949} {"train_loss": -24.95975112915039, "global_step": 244825, "epoch": 2949} {"train_loss": -24.994356155395508, "global_step": 244826, "epoch": 2949} {"train_loss": -25.031078338623047, "global_step": 244827, "epoch": 2949} {"train_loss": -25.195219039916992, "global_step": 244828, "epoch": 2949} {"train_loss": -24.772811889648438, "global_step": 244829, "epoch": 2949} {"train_loss": -24.708585739135742, "global_step": 244830, "epoch": 2949} {"train_loss": -24.95985984802246, "global_step": 244831, "epoch": 2949} {"train_loss": -24.79078483581543, "global_step": 244832, "epoch": 2949} {"train_loss": -24.698036193847656, "global_step": 244833, "epoch": 2949} {"train_loss": -24.961994171142578, "global_step": 244834, "epoch": 2949} {"train_loss": -24.926198959350586, "global_step": 244835, "epoch": 2949} {"train_loss": -24.895305633544922, "global_step": 244836, "epoch": 2949} {"train_loss": -25.353315353393555, "global_step": 244837, "epoch": 2949} {"train_loss": -24.79681968688965, "global_step": 244838, "epoch": 2949} {"train_loss": -24.890548706054688, "global_step": 244839, "epoch": 2949} {"train_loss": -24.997770309448242, "global_step": 244840, "epoch": 2949} {"train_loss": -25.15513038635254, "global_step": 244841, "epoch": 2949} {"train_loss": -25.055557250976562, "global_step": 244842, "epoch": 2949} {"train_loss": -24.921884536743164, "global_step": 244843, "epoch": 2949} {"train_loss": -25.10433006286621, "global_step": 244844, "epoch": 2949} {"train_loss": -25.042875289916992, "global_step": 244845, "epoch": 2949} {"train_loss": -25.07111930847168, "global_step": 244846, "epoch": 2949} {"train_loss": -24.990921020507812, "global_step": 244847, "epoch": 2949} {"train_loss": -24.989490509033203, "global_step": 244848, "epoch": 2949} {"train_loss": -24.840470256575617, "global_step": 244849, "epoch": 2949, "val_loss": 6758871.0} {"train_loss": -24.648691177368164, "global_step": 244850, "epoch": 2950} {"train_loss": -24.72957420349121, "global_step": 244851, "epoch": 2950} {"train_loss": -24.582921981811523, "global_step": 244852, "epoch": 2950} {"train_loss": -24.91383934020996, "global_step": 244853, "epoch": 2950} {"train_loss": -24.447614669799805, "global_step": 244854, "epoch": 2950} {"train_loss": -24.31720733642578, "global_step": 244855, "epoch": 2950} {"train_loss": -24.755329132080078, "global_step": 244856, "epoch": 2950} {"train_loss": -24.704452514648438, "global_step": 244857, "epoch": 2950} {"train_loss": -24.89129066467285, "global_step": 244858, "epoch": 2950} {"train_loss": -24.79387092590332, "global_step": 244859, "epoch": 2950} {"train_loss": -24.65826988220215, "global_step": 244860, "epoch": 2950} {"train_loss": -24.64796257019043, "global_step": 244861, "epoch": 2950} {"train_loss": -24.859094619750977, "global_step": 244862, "epoch": 2950} {"train_loss": -25.32184410095215, "global_step": 244863, "epoch": 2950} {"train_loss": -24.94249725341797, "global_step": 244864, "epoch": 2950} {"train_loss": -24.784452438354492, "global_step": 244865, "epoch": 2950} {"train_loss": -24.66669273376465, "global_step": 244866, "epoch": 2950} {"train_loss": -25.250160217285156, "global_step": 244867, "epoch": 2950} {"train_loss": -24.95022201538086, "global_step": 244868, "epoch": 2950} {"train_loss": -24.759902954101562, "global_step": 244869, "epoch": 2950} {"train_loss": -24.866891860961914, "global_step": 244870, "epoch": 2950} {"train_loss": -24.654417037963867, "global_step": 244871, "epoch": 2950} {"train_loss": -24.359872817993164, "global_step": 244872, "epoch": 2950} {"train_loss": -24.508502960205078, "global_step": 244873, "epoch": 2950} {"train_loss": -25.139251708984375, "global_step": 244874, "epoch": 2950} {"train_loss": -24.788314819335938, "global_step": 244875, "epoch": 2950} {"train_loss": -24.706785202026367, "global_step": 244876, "epoch": 2950} {"train_loss": -25.085905075073242, "global_step": 244877, "epoch": 2950} {"train_loss": -24.766775131225586, "global_step": 244878, "epoch": 2950} {"train_loss": -25.04481315612793, "global_step": 244879, "epoch": 2950} {"train_loss": -24.80611228942871, "global_step": 244880, "epoch": 2950} {"train_loss": -25.10651206970215, "global_step": 244881, "epoch": 2950} {"train_loss": -25.234235763549805, "global_step": 244882, "epoch": 2950} {"train_loss": -24.95229148864746, "global_step": 244883, "epoch": 2950} {"train_loss": -24.799039840698242, "global_step": 244884, "epoch": 2950} {"train_loss": -25.176786422729492, "global_step": 244885, "epoch": 2950} {"train_loss": -25.157119750976562, "global_step": 244886, "epoch": 2950} {"train_loss": -25.07058334350586, "global_step": 244887, "epoch": 2950} {"train_loss": -24.97574234008789, "global_step": 244888, "epoch": 2950} {"train_loss": -24.98310661315918, "global_step": 244889, "epoch": 2950} {"train_loss": -24.924558639526367, "global_step": 244890, "epoch": 2950} {"train_loss": -24.729883193969727, "global_step": 244891, "epoch": 2950} {"train_loss": -25.220651626586914, "global_step": 244892, "epoch": 2950} {"train_loss": -24.735883712768555, "global_step": 244893, "epoch": 2950} {"train_loss": -24.800189971923828, "global_step": 244894, "epoch": 2950} {"train_loss": -24.599288940429688, "global_step": 244895, "epoch": 2950} {"train_loss": -25.117515563964844, "global_step": 244896, "epoch": 2950} {"train_loss": -24.856107711791992, "global_step": 244897, "epoch": 2950} {"train_loss": -24.6048641204834, "global_step": 244898, "epoch": 2950} {"train_loss": -25.143083572387695, "global_step": 244899, "epoch": 2950} {"train_loss": -24.861408233642578, "global_step": 244900, "epoch": 2950} {"train_loss": -25.02317237854004, "global_step": 244901, "epoch": 2950} {"train_loss": -24.95526695251465, "global_step": 244902, "epoch": 2950} {"train_loss": -24.79896354675293, "global_step": 244903, "epoch": 2950} {"train_loss": -25.112579345703125, "global_step": 244904, "epoch": 2950} {"train_loss": -24.76969337463379, "global_step": 244905, "epoch": 2950} {"train_loss": -25.035430908203125, "global_step": 244906, "epoch": 2950} {"train_loss": -25.345233917236328, "global_step": 244907, "epoch": 2950} {"train_loss": -25.13348388671875, "global_step": 244908, "epoch": 2950} {"train_loss": -24.9785213470459, "global_step": 244909, "epoch": 2950} {"train_loss": -25.123186111450195, "global_step": 244910, "epoch": 2950} {"train_loss": -25.309078216552734, "global_step": 244911, "epoch": 2950} {"train_loss": -24.656082153320312, "global_step": 244912, "epoch": 2950} {"train_loss": -24.813581466674805, "global_step": 244913, "epoch": 2950} {"train_loss": -25.279401779174805, "global_step": 244914, "epoch": 2950} {"train_loss": -25.19608497619629, "global_step": 244915, "epoch": 2950} {"train_loss": -25.026378631591797, "global_step": 244916, "epoch": 2950} {"train_loss": -24.76189613342285, "global_step": 244917, "epoch": 2950} {"train_loss": -24.830238342285156, "global_step": 244918, "epoch": 2950} {"train_loss": -25.03998565673828, "global_step": 244919, "epoch": 2950} {"train_loss": -25.14418601989746, "global_step": 244920, "epoch": 2950} {"train_loss": -24.82480812072754, "global_step": 244921, "epoch": 2950} {"train_loss": -25.409440994262695, "global_step": 244922, "epoch": 2950} {"train_loss": -25.143972396850586, "global_step": 244923, "epoch": 2950} {"train_loss": -24.67512321472168, "global_step": 244924, "epoch": 2950} {"train_loss": -24.92026710510254, "global_step": 244925, "epoch": 2950} {"train_loss": -24.834396362304688, "global_step": 244926, "epoch": 2950} {"train_loss": -25.266189575195312, "global_step": 244927, "epoch": 2950} {"train_loss": -24.930349349975586, "global_step": 244928, "epoch": 2950} {"train_loss": -25.042673110961914, "global_step": 244929, "epoch": 2950} {"train_loss": -24.89748191833496, "global_step": 244930, "epoch": 2950} {"train_loss": -24.89930534362793, "global_step": 244931, "epoch": 2950} {"train_loss": -24.892350644950408, "global_step": 244932, "epoch": 2950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6886341.0} {"train_loss": -24.287017822265625, "global_step": 244933, "epoch": 2951} {"train_loss": -23.968753814697266, "global_step": 244934, "epoch": 2951} {"train_loss": -23.772123336791992, "global_step": 244935, "epoch": 2951} {"train_loss": -24.245054244995117, "global_step": 244936, "epoch": 2951} {"train_loss": -24.4603328704834, "global_step": 244937, "epoch": 2951} {"train_loss": -23.99343490600586, "global_step": 244938, "epoch": 2951} {"train_loss": -23.956674575805664, "global_step": 244939, "epoch": 2951} {"train_loss": -24.448781967163086, "global_step": 244940, "epoch": 2951} {"train_loss": -23.9788761138916, "global_step": 244941, "epoch": 2951} {"train_loss": -24.499528884887695, "global_step": 244942, "epoch": 2951} {"train_loss": -24.479581832885742, "global_step": 244943, "epoch": 2951} {"train_loss": -24.39102554321289, "global_step": 244944, "epoch": 2951} {"train_loss": -24.353853225708008, "global_step": 244945, "epoch": 2951} {"train_loss": -24.321630477905273, "global_step": 244946, "epoch": 2951} {"train_loss": -24.446529388427734, "global_step": 244947, "epoch": 2951} {"train_loss": -24.45435905456543, "global_step": 244948, "epoch": 2951} {"train_loss": -24.46653175354004, "global_step": 244949, "epoch": 2951} {"train_loss": -24.60260009765625, "global_step": 244950, "epoch": 2951} {"train_loss": -24.908994674682617, "global_step": 244951, "epoch": 2951} {"train_loss": -24.458452224731445, "global_step": 244952, "epoch": 2951} {"train_loss": -24.712432861328125, "global_step": 244953, "epoch": 2951} {"train_loss": -24.628952026367188, "global_step": 244954, "epoch": 2951} {"train_loss": -24.834863662719727, "global_step": 244955, "epoch": 2951} {"train_loss": -24.892820358276367, "global_step": 244956, "epoch": 2951} {"train_loss": -24.842910766601562, "global_step": 244957, "epoch": 2951} {"train_loss": -25.21988296508789, "global_step": 244958, "epoch": 2951} {"train_loss": -24.551307678222656, "global_step": 244959, "epoch": 2951} {"train_loss": -24.884387969970703, "global_step": 244960, "epoch": 2951} {"train_loss": -24.935129165649414, "global_step": 244961, "epoch": 2951} {"train_loss": -24.822301864624023, "global_step": 244962, "epoch": 2951} {"train_loss": -24.52659797668457, "global_step": 244963, "epoch": 2951} {"train_loss": -25.096363067626953, "global_step": 244964, "epoch": 2951} {"train_loss": -25.056076049804688, "global_step": 244965, "epoch": 2951} {"train_loss": -25.280668258666992, "global_step": 244966, "epoch": 2951} {"train_loss": -24.807968139648438, "global_step": 244967, "epoch": 2951} {"train_loss": -25.289438247680664, "global_step": 244968, "epoch": 2951} {"train_loss": -25.12148094177246, "global_step": 244969, "epoch": 2951} {"train_loss": -24.969945907592773, "global_step": 244970, "epoch": 2951} {"train_loss": -24.878128051757812, "global_step": 244971, "epoch": 2951} {"train_loss": -25.6893253326416, "global_step": 244972, "epoch": 2951} {"train_loss": -25.04939842224121, "global_step": 244973, "epoch": 2951} {"train_loss": -24.920156478881836, "global_step": 244974, "epoch": 2951} {"train_loss": -25.194059371948242, "global_step": 244975, "epoch": 2951} {"train_loss": -24.92085075378418, "global_step": 244976, "epoch": 2951} {"train_loss": -24.829824447631836, "global_step": 244977, "epoch": 2951} {"train_loss": -24.690969467163086, "global_step": 244978, "epoch": 2951} {"train_loss": -24.357526779174805, "global_step": 244979, "epoch": 2951} {"train_loss": -24.86272621154785, "global_step": 244980, "epoch": 2951} {"train_loss": -25.18906593322754, "global_step": 244981, "epoch": 2951} {"train_loss": -25.00592613220215, "global_step": 244982, "epoch": 2951} {"train_loss": -24.553457260131836, "global_step": 244983, "epoch": 2951} {"train_loss": -24.605688095092773, "global_step": 244984, "epoch": 2951} {"train_loss": -25.033172607421875, "global_step": 244985, "epoch": 2951} {"train_loss": -24.865137100219727, "global_step": 244986, "epoch": 2951} {"train_loss": -24.8988037109375, "global_step": 244987, "epoch": 2951} {"train_loss": -25.145483016967773, "global_step": 244988, "epoch": 2951} {"train_loss": -24.79090690612793, "global_step": 244989, "epoch": 2951} {"train_loss": -25.148334503173828, "global_step": 244990, "epoch": 2951} {"train_loss": -24.89252281188965, "global_step": 244991, "epoch": 2951} {"train_loss": -24.902463912963867, "global_step": 244992, "epoch": 2951} {"train_loss": -25.35658836364746, "global_step": 244993, "epoch": 2951} {"train_loss": -25.061891555786133, "global_step": 244994, "epoch": 2951} {"train_loss": -25.147663116455078, "global_step": 244995, "epoch": 2951} {"train_loss": -25.124134063720703, "global_step": 244996, "epoch": 2951} {"train_loss": -24.96490478515625, "global_step": 244997, "epoch": 2951} {"train_loss": -24.684419631958008, "global_step": 244998, "epoch": 2951} {"train_loss": -25.171010971069336, "global_step": 244999, "epoch": 2951} {"train_loss": -25.12931251525879, "global_step": 245000, "epoch": 2951} {"train_loss": -24.997150421142578, "global_step": 245001, "epoch": 2951} {"train_loss": -25.3034610748291, "global_step": 245002, "epoch": 2951} {"train_loss": -24.801542282104492, "global_step": 245003, "epoch": 2951} {"train_loss": -24.969728469848633, "global_step": 245004, "epoch": 2951} {"train_loss": -25.153858184814453, "global_step": 245005, "epoch": 2951} {"train_loss": -25.2348690032959, "global_step": 245006, "epoch": 2951} {"train_loss": -24.840932846069336, "global_step": 245007, "epoch": 2951} {"train_loss": -25.162336349487305, "global_step": 245008, "epoch": 2951} {"train_loss": -25.084257125854492, "global_step": 245009, "epoch": 2951} {"train_loss": -24.969812393188477, "global_step": 245010, "epoch": 2951} {"train_loss": -25.090396881103516, "global_step": 245011, "epoch": 2951} {"train_loss": -25.09012222290039, "global_step": 245012, "epoch": 2951} {"train_loss": -25.06440544128418, "global_step": 245013, "epoch": 2951} {"train_loss": -25.034992218017578, "global_step": 245014, "epoch": 2951} {"train_loss": -24.815334411988776, "global_step": 245015, "epoch": 2951, "val_loss": 6847997.0} {"train_loss": -25.034948348999023, "global_step": 245016, "epoch": 2952} {"train_loss": -24.740636825561523, "global_step": 245017, "epoch": 2952} {"train_loss": -24.827556610107422, "global_step": 245018, "epoch": 2952} {"train_loss": -24.75305938720703, "global_step": 245019, "epoch": 2952} {"train_loss": -24.860301971435547, "global_step": 245020, "epoch": 2952} {"train_loss": -24.899429321289062, "global_step": 245021, "epoch": 2952} {"train_loss": -24.880245208740234, "global_step": 245022, "epoch": 2952} {"train_loss": -24.630844116210938, "global_step": 245023, "epoch": 2952} {"train_loss": -24.44574546813965, "global_step": 245024, "epoch": 2952} {"train_loss": -24.662588119506836, "global_step": 245025, "epoch": 2952} {"train_loss": -24.46318244934082, "global_step": 245026, "epoch": 2952} {"train_loss": -25.139554977416992, "global_step": 245027, "epoch": 2952} {"train_loss": -25.003543853759766, "global_step": 245028, "epoch": 2952} {"train_loss": -24.985654830932617, "global_step": 245029, "epoch": 2952} {"train_loss": -24.96245765686035, "global_step": 245030, "epoch": 2952} {"train_loss": -24.53590965270996, "global_step": 245031, "epoch": 2952} {"train_loss": -25.07569122314453, "global_step": 245032, "epoch": 2952} {"train_loss": -24.8090763092041, "global_step": 245033, "epoch": 2952} {"train_loss": -25.096057891845703, "global_step": 245034, "epoch": 2952} {"train_loss": -24.86911964416504, "global_step": 245035, "epoch": 2952} {"train_loss": -24.68060874938965, "global_step": 245036, "epoch": 2952} {"train_loss": -25.16129493713379, "global_step": 245037, "epoch": 2952} {"train_loss": -24.606748580932617, "global_step": 245038, "epoch": 2952} {"train_loss": -24.94001579284668, "global_step": 245039, "epoch": 2952} {"train_loss": -24.82686424255371, "global_step": 245040, "epoch": 2952} {"train_loss": -25.06252098083496, "global_step": 245041, "epoch": 2952} {"train_loss": -24.98583221435547, "global_step": 245042, "epoch": 2952} {"train_loss": -25.192115783691406, "global_step": 245043, "epoch": 2952} {"train_loss": -25.028356552124023, "global_step": 245044, "epoch": 2952} {"train_loss": -25.288131713867188, "global_step": 245045, "epoch": 2952} {"train_loss": -24.9388427734375, "global_step": 245046, "epoch": 2952} {"train_loss": -25.245580673217773, "global_step": 245047, "epoch": 2952} {"train_loss": -25.026657104492188, "global_step": 245048, "epoch": 2952} {"train_loss": -25.06199836730957, "global_step": 245049, "epoch": 2952} {"train_loss": -24.893171310424805, "global_step": 245050, "epoch": 2952} {"train_loss": -25.001981735229492, "global_step": 245051, "epoch": 2952} {"train_loss": -24.991214752197266, "global_step": 245052, "epoch": 2952} {"train_loss": -24.55077362060547, "global_step": 245053, "epoch": 2952} {"train_loss": -24.408185958862305, "global_step": 245054, "epoch": 2952} {"train_loss": -24.274368286132812, "global_step": 245055, "epoch": 2952} {"train_loss": -24.799854278564453, "global_step": 245056, "epoch": 2952} {"train_loss": -25.092666625976562, "global_step": 245057, "epoch": 2952} {"train_loss": -24.55299949645996, "global_step": 245058, "epoch": 2952} {"train_loss": -24.395700454711914, "global_step": 245059, "epoch": 2952} {"train_loss": -25.011137008666992, "global_step": 245060, "epoch": 2952} {"train_loss": -24.888071060180664, "global_step": 245061, "epoch": 2952} {"train_loss": -24.909320831298828, "global_step": 245062, "epoch": 2952} {"train_loss": -25.00948143005371, "global_step": 245063, "epoch": 2952} {"train_loss": -25.012866973876953, "global_step": 245064, "epoch": 2952} {"train_loss": -25.036602020263672, "global_step": 245065, "epoch": 2952} {"train_loss": -24.620264053344727, "global_step": 245066, "epoch": 2952} {"train_loss": -24.88986587524414, "global_step": 245067, "epoch": 2952} {"train_loss": -24.73629379272461, "global_step": 245068, "epoch": 2952} {"train_loss": -24.873510360717773, "global_step": 245069, "epoch": 2952} {"train_loss": -25.05924415588379, "global_step": 245070, "epoch": 2952} {"train_loss": -25.016010284423828, "global_step": 245071, "epoch": 2952} {"train_loss": -24.925983428955078, "global_step": 245072, "epoch": 2952} {"train_loss": -24.95994758605957, "global_step": 245073, "epoch": 2952} {"train_loss": -25.311254501342773, "global_step": 245074, "epoch": 2952} {"train_loss": -25.239521026611328, "global_step": 245075, "epoch": 2952} {"train_loss": -25.21100616455078, "global_step": 245076, "epoch": 2952} {"train_loss": -25.13189125061035, "global_step": 245077, "epoch": 2952} {"train_loss": -24.848424911499023, "global_step": 245078, "epoch": 2952} {"train_loss": -25.225473403930664, "global_step": 245079, "epoch": 2952} {"train_loss": -25.182973861694336, "global_step": 245080, "epoch": 2952} {"train_loss": -24.912418365478516, "global_step": 245081, "epoch": 2952} {"train_loss": -24.845703125, "global_step": 245082, "epoch": 2952} {"train_loss": -24.71278953552246, "global_step": 245083, "epoch": 2952} {"train_loss": -25.144498825073242, "global_step": 245084, "epoch": 2952} {"train_loss": -25.454051971435547, "global_step": 245085, "epoch": 2952} {"train_loss": -24.920387268066406, "global_step": 245086, "epoch": 2952} {"train_loss": -24.451204299926758, "global_step": 245087, "epoch": 2952} {"train_loss": -25.317182540893555, "global_step": 245088, "epoch": 2952} {"train_loss": -24.902034759521484, "global_step": 245089, "epoch": 2952} {"train_loss": -24.79170799255371, "global_step": 245090, "epoch": 2952} {"train_loss": -24.70920753479004, "global_step": 245091, "epoch": 2952} {"train_loss": -24.814697265625, "global_step": 245092, "epoch": 2952} {"train_loss": -25.0899658203125, "global_step": 245093, "epoch": 2952} {"train_loss": -24.87116813659668, "global_step": 245094, "epoch": 2952} {"train_loss": -24.736886978149414, "global_step": 245095, "epoch": 2952} {"train_loss": -24.884756088256836, "global_step": 245096, "epoch": 2952} {"train_loss": -25.287261962890625, "global_step": 245097, "epoch": 2952} {"train_loss": -24.8997241100633, "global_step": 245098, "epoch": 2952, "val_loss": 6834030.0} {"train_loss": -22.918500900268555, "global_step": 245099, "epoch": 2953} {"train_loss": -22.134267807006836, "global_step": 245100, "epoch": 2953} {"train_loss": -24.614967346191406, "global_step": 245101, "epoch": 2953} {"train_loss": -22.83244514465332, "global_step": 245102, "epoch": 2953} {"train_loss": -23.126523971557617, "global_step": 245103, "epoch": 2953} {"train_loss": -24.567419052124023, "global_step": 245104, "epoch": 2953} {"train_loss": -23.682058334350586, "global_step": 245105, "epoch": 2953} {"train_loss": -24.08661460876465, "global_step": 245106, "epoch": 2953} {"train_loss": -23.84040641784668, "global_step": 245107, "epoch": 2953} {"train_loss": -24.22749900817871, "global_step": 245108, "epoch": 2953} {"train_loss": -24.32164764404297, "global_step": 245109, "epoch": 2953} {"train_loss": -24.21270751953125, "global_step": 245110, "epoch": 2953} {"train_loss": -24.09950828552246, "global_step": 245111, "epoch": 2953} {"train_loss": -24.02253532409668, "global_step": 245112, "epoch": 2953} {"train_loss": -24.028600692749023, "global_step": 245113, "epoch": 2953} {"train_loss": -24.224485397338867, "global_step": 245114, "epoch": 2953} {"train_loss": -24.14632225036621, "global_step": 245115, "epoch": 2953} {"train_loss": -24.563091278076172, "global_step": 245116, "epoch": 2953} {"train_loss": -24.608579635620117, "global_step": 245117, "epoch": 2953} {"train_loss": -24.855484008789062, "global_step": 245118, "epoch": 2953} {"train_loss": -24.269086837768555, "global_step": 245119, "epoch": 2953} {"train_loss": -24.405202865600586, "global_step": 245120, "epoch": 2953} {"train_loss": -24.7242374420166, "global_step": 245121, "epoch": 2953} {"train_loss": -24.4938907623291, "global_step": 245122, "epoch": 2953} {"train_loss": -24.398117065429688, "global_step": 245123, "epoch": 2953} {"train_loss": -24.496997833251953, "global_step": 245124, "epoch": 2953} {"train_loss": -24.485061645507812, "global_step": 245125, "epoch": 2953} {"train_loss": -24.623037338256836, "global_step": 245126, "epoch": 2953} {"train_loss": -24.69817543029785, "global_step": 245127, "epoch": 2953} {"train_loss": -24.696481704711914, "global_step": 245128, "epoch": 2953} {"train_loss": -24.415483474731445, "global_step": 245129, "epoch": 2953} {"train_loss": -24.843475341796875, "global_step": 245130, "epoch": 2953} {"train_loss": -24.572757720947266, "global_step": 245131, "epoch": 2953} {"train_loss": -24.95914649963379, "global_step": 245132, "epoch": 2953} {"train_loss": -25.07797622680664, "global_step": 245133, "epoch": 2953} {"train_loss": -25.068273544311523, "global_step": 245134, "epoch": 2953} {"train_loss": -24.338525772094727, "global_step": 245135, "epoch": 2953} {"train_loss": -24.880191802978516, "global_step": 245136, "epoch": 2953} {"train_loss": -24.897390365600586, "global_step": 245137, "epoch": 2953} {"train_loss": -24.780668258666992, "global_step": 245138, "epoch": 2953} {"train_loss": -24.779747009277344, "global_step": 245139, "epoch": 2953} {"train_loss": -24.917722702026367, "global_step": 245140, "epoch": 2953} {"train_loss": -24.987695693969727, "global_step": 245141, "epoch": 2953} {"train_loss": -24.812589645385742, "global_step": 245142, "epoch": 2953} {"train_loss": -25.07892417907715, "global_step": 245143, "epoch": 2953} {"train_loss": -24.666658401489258, "global_step": 245144, "epoch": 2953} {"train_loss": -24.933807373046875, "global_step": 245145, "epoch": 2953} {"train_loss": -24.907636642456055, "global_step": 245146, "epoch": 2953} {"train_loss": -24.855031967163086, "global_step": 245147, "epoch": 2953} {"train_loss": -24.932153701782227, "global_step": 245148, "epoch": 2953} {"train_loss": -25.203136444091797, "global_step": 245149, "epoch": 2953} {"train_loss": -25.06045913696289, "global_step": 245150, "epoch": 2953} {"train_loss": -24.745227813720703, "global_step": 245151, "epoch": 2953} {"train_loss": -24.96364402770996, "global_step": 245152, "epoch": 2953} {"train_loss": -24.906736373901367, "global_step": 245153, "epoch": 2953} {"train_loss": -24.8507080078125, "global_step": 245154, "epoch": 2953} {"train_loss": -24.83988380432129, "global_step": 245155, "epoch": 2953} {"train_loss": -24.99360466003418, "global_step": 245156, "epoch": 2953} {"train_loss": -24.86237907409668, "global_step": 245157, "epoch": 2953} {"train_loss": -25.603918075561523, "global_step": 245158, "epoch": 2953} {"train_loss": -25.247121810913086, "global_step": 245159, "epoch": 2953} {"train_loss": -24.71124839782715, "global_step": 245160, "epoch": 2953} {"train_loss": -25.126052856445312, "global_step": 245161, "epoch": 2953} {"train_loss": -25.35099983215332, "global_step": 245162, "epoch": 2953} {"train_loss": -24.955230712890625, "global_step": 245163, "epoch": 2953} {"train_loss": -25.209854125976562, "global_step": 245164, "epoch": 2953} {"train_loss": -25.205049514770508, "global_step": 245165, "epoch": 2953} {"train_loss": -24.9623966217041, "global_step": 245166, "epoch": 2953} {"train_loss": -25.0902099609375, "global_step": 245167, "epoch": 2953} {"train_loss": -24.431013107299805, "global_step": 245168, "epoch": 2953} {"train_loss": -24.797489166259766, "global_step": 245169, "epoch": 2953} {"train_loss": -24.980318069458008, "global_step": 245170, "epoch": 2953} {"train_loss": -25.071640014648438, "global_step": 245171, "epoch": 2953} {"train_loss": -24.855161666870117, "global_step": 245172, "epoch": 2953} {"train_loss": -25.33193588256836, "global_step": 245173, "epoch": 2953} {"train_loss": -24.662267684936523, "global_step": 245174, "epoch": 2953} {"train_loss": -25.033517837524414, "global_step": 245175, "epoch": 2953} {"train_loss": -24.947181701660156, "global_step": 245176, "epoch": 2953} {"train_loss": -25.13770866394043, "global_step": 245177, "epoch": 2953} {"train_loss": -24.90306854248047, "global_step": 245178, "epoch": 2953} {"train_loss": -24.956247329711914, "global_step": 245179, "epoch": 2953} {"train_loss": -25.261045455932617, "global_step": 245180, "epoch": 2953} {"train_loss": -24.645970447953925, "global_step": 245181, "epoch": 2953, "val_loss": 7049125.0} {"train_loss": -23.5178279876709, "global_step": 245182, "epoch": 2954} {"train_loss": -23.96908950805664, "global_step": 245183, "epoch": 2954} {"train_loss": -23.91390037536621, "global_step": 245184, "epoch": 2954} {"train_loss": -24.477231979370117, "global_step": 245185, "epoch": 2954} {"train_loss": -24.191593170166016, "global_step": 245186, "epoch": 2954} {"train_loss": -24.063955307006836, "global_step": 245187, "epoch": 2954} {"train_loss": -24.53134536743164, "global_step": 245188, "epoch": 2954} {"train_loss": -24.38857650756836, "global_step": 245189, "epoch": 2954} {"train_loss": -24.315603256225586, "global_step": 245190, "epoch": 2954} {"train_loss": -24.225732803344727, "global_step": 245191, "epoch": 2954} {"train_loss": -24.701011657714844, "global_step": 245192, "epoch": 2954} {"train_loss": -24.12179183959961, "global_step": 245193, "epoch": 2954} {"train_loss": -24.431211471557617, "global_step": 245194, "epoch": 2954} {"train_loss": -24.615827560424805, "global_step": 245195, "epoch": 2954} {"train_loss": -25.11297607421875, "global_step": 245196, "epoch": 2954} {"train_loss": -24.701576232910156, "global_step": 245197, "epoch": 2954} {"train_loss": -24.7451114654541, "global_step": 245198, "epoch": 2954} {"train_loss": -24.732725143432617, "global_step": 245199, "epoch": 2954} {"train_loss": -24.81715965270996, "global_step": 245200, "epoch": 2954} {"train_loss": -24.593547821044922, "global_step": 245201, "epoch": 2954} {"train_loss": -24.7584171295166, "global_step": 245202, "epoch": 2954} {"train_loss": -24.720102310180664, "global_step": 245203, "epoch": 2954} {"train_loss": -24.941991806030273, "global_step": 245204, "epoch": 2954} {"train_loss": -24.780088424682617, "global_step": 245205, "epoch": 2954} {"train_loss": -24.4575252532959, "global_step": 245206, "epoch": 2954} {"train_loss": -25.129669189453125, "global_step": 245207, "epoch": 2954} {"train_loss": -24.643381118774414, "global_step": 245208, "epoch": 2954} {"train_loss": -24.694665908813477, "global_step": 245209, "epoch": 2954} {"train_loss": -24.729673385620117, "global_step": 245210, "epoch": 2954} {"train_loss": -24.36941909790039, "global_step": 245211, "epoch": 2954} {"train_loss": -25.094030380249023, "global_step": 245212, "epoch": 2954} {"train_loss": -24.88958168029785, "global_step": 245213, "epoch": 2954} {"train_loss": -24.929292678833008, "global_step": 245214, "epoch": 2954} {"train_loss": -24.797748565673828, "global_step": 245215, "epoch": 2954} {"train_loss": -24.794723510742188, "global_step": 245216, "epoch": 2954} {"train_loss": -24.626218795776367, "global_step": 245217, "epoch": 2954} {"train_loss": -24.856678009033203, "global_step": 245218, "epoch": 2954} {"train_loss": -25.299665451049805, "global_step": 245219, "epoch": 2954} {"train_loss": -25.059377670288086, "global_step": 245220, "epoch": 2954} {"train_loss": -24.831296920776367, "global_step": 245221, "epoch": 2954} {"train_loss": -24.948701858520508, "global_step": 245222, "epoch": 2954} {"train_loss": -25.33519172668457, "global_step": 245223, "epoch": 2954} {"train_loss": -24.81850242614746, "global_step": 245224, "epoch": 2954} {"train_loss": -24.542020797729492, "global_step": 245225, "epoch": 2954} {"train_loss": -24.854894638061523, "global_step": 245226, "epoch": 2954} {"train_loss": -24.792001724243164, "global_step": 245227, "epoch": 2954} {"train_loss": -24.96382713317871, "global_step": 245228, "epoch": 2954} {"train_loss": -25.153722763061523, "global_step": 245229, "epoch": 2954} {"train_loss": -24.791669845581055, "global_step": 245230, "epoch": 2954} {"train_loss": -24.977436065673828, "global_step": 245231, "epoch": 2954} {"train_loss": -24.877267837524414, "global_step": 245232, "epoch": 2954} {"train_loss": -24.828617095947266, "global_step": 245233, "epoch": 2954} {"train_loss": -24.735654830932617, "global_step": 245234, "epoch": 2954} {"train_loss": -24.947555541992188, "global_step": 245235, "epoch": 2954} {"train_loss": -24.7696533203125, "global_step": 245236, "epoch": 2954} {"train_loss": -24.8145751953125, "global_step": 245237, "epoch": 2954} {"train_loss": -25.538610458374023, "global_step": 245238, "epoch": 2954} {"train_loss": -24.86330223083496, "global_step": 245239, "epoch": 2954} {"train_loss": -25.196134567260742, "global_step": 245240, "epoch": 2954} {"train_loss": -24.485206604003906, "global_step": 245241, "epoch": 2954} {"train_loss": -25.091760635375977, "global_step": 245242, "epoch": 2954} {"train_loss": -24.860828399658203, "global_step": 245243, "epoch": 2954} {"train_loss": -24.996795654296875, "global_step": 245244, "epoch": 2954} {"train_loss": -24.99738883972168, "global_step": 245245, "epoch": 2954} {"train_loss": -25.088703155517578, "global_step": 245246, "epoch": 2954} {"train_loss": -24.842247009277344, "global_step": 245247, "epoch": 2954} {"train_loss": -25.2340030670166, "global_step": 245248, "epoch": 2954} {"train_loss": -24.885995864868164, "global_step": 245249, "epoch": 2954} {"train_loss": -24.681880950927734, "global_step": 245250, "epoch": 2954} {"train_loss": -25.044544219970703, "global_step": 245251, "epoch": 2954} {"train_loss": -24.9251766204834, "global_step": 245252, "epoch": 2954} {"train_loss": -24.93044662475586, "global_step": 245253, "epoch": 2954} {"train_loss": -25.07917594909668, "global_step": 245254, "epoch": 2954} {"train_loss": -24.918109893798828, "global_step": 245255, "epoch": 2954} {"train_loss": -25.19816017150879, "global_step": 245256, "epoch": 2954} {"train_loss": -24.805509567260742, "global_step": 245257, "epoch": 2954} {"train_loss": -25.02485466003418, "global_step": 245258, "epoch": 2954} {"train_loss": -24.993824005126953, "global_step": 245259, "epoch": 2954} {"train_loss": -25.106760025024414, "global_step": 245260, "epoch": 2954} {"train_loss": -25.207454681396484, "global_step": 245261, "epoch": 2954} {"train_loss": -25.255884170532227, "global_step": 245262, "epoch": 2954} {"train_loss": -24.440052032470703, "global_step": 245263, "epoch": 2954} {"train_loss": -24.793362950704182, "global_step": 245264, "epoch": 2954, "val_loss": 6769757.0} {"train_loss": -24.912263870239258, "global_step": 245265, "epoch": 2955} {"train_loss": -24.242361068725586, "global_step": 245266, "epoch": 2955} {"train_loss": -24.316539764404297, "global_step": 245267, "epoch": 2955} {"train_loss": -24.594114303588867, "global_step": 245268, "epoch": 2955} {"train_loss": -24.379058837890625, "global_step": 245269, "epoch": 2955} {"train_loss": -24.586477279663086, "global_step": 245270, "epoch": 2955} {"train_loss": -24.845794677734375, "global_step": 245271, "epoch": 2955} {"train_loss": -24.767078399658203, "global_step": 245272, "epoch": 2955} {"train_loss": -24.60684585571289, "global_step": 245273, "epoch": 2955} {"train_loss": -24.455856323242188, "global_step": 245274, "epoch": 2955} {"train_loss": -24.321796417236328, "global_step": 245275, "epoch": 2955} {"train_loss": -24.660762786865234, "global_step": 245276, "epoch": 2955} {"train_loss": -24.61676025390625, "global_step": 245277, "epoch": 2955} {"train_loss": -24.772043228149414, "global_step": 245278, "epoch": 2955} {"train_loss": -24.6162166595459, "global_step": 245279, "epoch": 2955} {"train_loss": -24.578664779663086, "global_step": 245280, "epoch": 2955} {"train_loss": -24.60062026977539, "global_step": 245281, "epoch": 2955} {"train_loss": -24.740814208984375, "global_step": 245282, "epoch": 2955} {"train_loss": -24.84522247314453, "global_step": 245283, "epoch": 2955} {"train_loss": -24.683956146240234, "global_step": 245284, "epoch": 2955} {"train_loss": -24.632966995239258, "global_step": 245285, "epoch": 2955} {"train_loss": -24.505367279052734, "global_step": 245286, "epoch": 2955} {"train_loss": -25.375268936157227, "global_step": 245287, "epoch": 2955} {"train_loss": -24.933185577392578, "global_step": 245288, "epoch": 2955} {"train_loss": -25.09929847717285, "global_step": 245289, "epoch": 2955} {"train_loss": -25.2439022064209, "global_step": 245290, "epoch": 2955} {"train_loss": -24.69987678527832, "global_step": 245291, "epoch": 2955} {"train_loss": -24.4084529876709, "global_step": 245292, "epoch": 2955} {"train_loss": -24.756061553955078, "global_step": 245293, "epoch": 2955} {"train_loss": -25.07936668395996, "global_step": 245294, "epoch": 2955} {"train_loss": -24.818023681640625, "global_step": 245295, "epoch": 2955} {"train_loss": -25.102170944213867, "global_step": 245296, "epoch": 2955} {"train_loss": -25.214588165283203, "global_step": 245297, "epoch": 2955} {"train_loss": -25.145973205566406, "global_step": 245298, "epoch": 2955} {"train_loss": -25.0391845703125, "global_step": 245299, "epoch": 2955} {"train_loss": -24.744752883911133, "global_step": 245300, "epoch": 2955} {"train_loss": -25.130517959594727, "global_step": 245301, "epoch": 2955} {"train_loss": -25.1623477935791, "global_step": 245302, "epoch": 2955} {"train_loss": -25.2086124420166, "global_step": 245303, "epoch": 2955} {"train_loss": -25.477476119995117, "global_step": 245304, "epoch": 2955} {"train_loss": -25.14510154724121, "global_step": 245305, "epoch": 2955} {"train_loss": -24.952207565307617, "global_step": 245306, "epoch": 2955} {"train_loss": -25.042253494262695, "global_step": 245307, "epoch": 2955} {"train_loss": -25.106658935546875, "global_step": 245308, "epoch": 2955} {"train_loss": -25.105377197265625, "global_step": 245309, "epoch": 2955} {"train_loss": -25.48085594177246, "global_step": 245310, "epoch": 2955} {"train_loss": -24.919647216796875, "global_step": 245311, "epoch": 2955} {"train_loss": -25.287296295166016, "global_step": 245312, "epoch": 2955} {"train_loss": -25.134296417236328, "global_step": 245313, "epoch": 2955} {"train_loss": -24.79104232788086, "global_step": 245314, "epoch": 2955} {"train_loss": -24.740509033203125, "global_step": 245315, "epoch": 2955} {"train_loss": -24.604248046875, "global_step": 245316, "epoch": 2955} {"train_loss": -24.553625106811523, "global_step": 245317, "epoch": 2955} {"train_loss": -24.995290756225586, "global_step": 245318, "epoch": 2955} {"train_loss": -25.010517120361328, "global_step": 245319, "epoch": 2955} {"train_loss": -25.004688262939453, "global_step": 245320, "epoch": 2955} {"train_loss": -24.770206451416016, "global_step": 245321, "epoch": 2955} {"train_loss": -24.335529327392578, "global_step": 245322, "epoch": 2955} {"train_loss": -24.60752296447754, "global_step": 245323, "epoch": 2955} {"train_loss": -25.115018844604492, "global_step": 245324, "epoch": 2955} {"train_loss": -24.066267013549805, "global_step": 245325, "epoch": 2955} {"train_loss": -24.908193588256836, "global_step": 245326, "epoch": 2955} {"train_loss": -24.32493019104004, "global_step": 245327, "epoch": 2955} {"train_loss": -24.958175659179688, "global_step": 245328, "epoch": 2955} {"train_loss": -24.574554443359375, "global_step": 245329, "epoch": 2955} {"train_loss": -24.451553344726562, "global_step": 245330, "epoch": 2955} {"train_loss": -24.63978385925293, "global_step": 245331, "epoch": 2955} {"train_loss": -24.608013153076172, "global_step": 245332, "epoch": 2955} {"train_loss": -24.49971580505371, "global_step": 245333, "epoch": 2955} {"train_loss": -24.308557510375977, "global_step": 245334, "epoch": 2955} {"train_loss": -24.495832443237305, "global_step": 245335, "epoch": 2955} {"train_loss": -24.447080612182617, "global_step": 245336, "epoch": 2955} {"train_loss": -24.40431022644043, "global_step": 245337, "epoch": 2955} {"train_loss": -24.410947799682617, "global_step": 245338, "epoch": 2955} {"train_loss": -24.861183166503906, "global_step": 245339, "epoch": 2955} {"train_loss": -24.813222885131836, "global_step": 245340, "epoch": 2955} {"train_loss": -24.676013946533203, "global_step": 245341, "epoch": 2955} {"train_loss": -24.373502731323242, "global_step": 245342, "epoch": 2955} {"train_loss": -24.956663131713867, "global_step": 245343, "epoch": 2955} {"train_loss": -24.676605224609375, "global_step": 245344, "epoch": 2955} {"train_loss": -24.9885311126709, "global_step": 245345, "epoch": 2955} {"train_loss": -25.16891098022461, "global_step": 245346, "epoch": 2955} {"train_loss": -24.792988145207783, "global_step": 245347, "epoch": 2955, "val_loss": 6742261.5} {"train_loss": -24.846725463867188, "global_step": 245348, "epoch": 2956} {"train_loss": -24.338960647583008, "global_step": 245349, "epoch": 2956} {"train_loss": -24.361886978149414, "global_step": 245350, "epoch": 2956} {"train_loss": -24.529096603393555, "global_step": 245351, "epoch": 2956} {"train_loss": -24.87662696838379, "global_step": 245352, "epoch": 2956} {"train_loss": -24.649499893188477, "global_step": 245353, "epoch": 2956} {"train_loss": -24.5107479095459, "global_step": 245354, "epoch": 2956} {"train_loss": -24.265363693237305, "global_step": 245355, "epoch": 2956} {"train_loss": -25.170679092407227, "global_step": 245356, "epoch": 2956} {"train_loss": -24.61781120300293, "global_step": 245357, "epoch": 2956} {"train_loss": -24.286291122436523, "global_step": 245358, "epoch": 2956} {"train_loss": -25.01144790649414, "global_step": 245359, "epoch": 2956} {"train_loss": -24.45503807067871, "global_step": 245360, "epoch": 2956} {"train_loss": -24.850576400756836, "global_step": 245361, "epoch": 2956} {"train_loss": -24.5501766204834, "global_step": 245362, "epoch": 2956} {"train_loss": -23.87425422668457, "global_step": 245363, "epoch": 2956} {"train_loss": -24.80802345275879, "global_step": 245364, "epoch": 2956} {"train_loss": -24.883657455444336, "global_step": 245365, "epoch": 2956} {"train_loss": -24.789621353149414, "global_step": 245366, "epoch": 2956} {"train_loss": -25.003244400024414, "global_step": 245367, "epoch": 2956} {"train_loss": -24.90608787536621, "global_step": 245368, "epoch": 2956} {"train_loss": -24.75668716430664, "global_step": 245369, "epoch": 2956} {"train_loss": -25.029783248901367, "global_step": 245370, "epoch": 2956} {"train_loss": -25.131608963012695, "global_step": 245371, "epoch": 2956} {"train_loss": -24.839895248413086, "global_step": 245372, "epoch": 2956} {"train_loss": -24.94422721862793, "global_step": 245373, "epoch": 2956} {"train_loss": -24.941665649414062, "global_step": 245374, "epoch": 2956} {"train_loss": -24.939067840576172, "global_step": 245375, "epoch": 2956} {"train_loss": -25.257360458374023, "global_step": 245376, "epoch": 2956} {"train_loss": -24.3607177734375, "global_step": 245377, "epoch": 2956} {"train_loss": -25.306983947753906, "global_step": 245378, "epoch": 2956} {"train_loss": -24.723262786865234, "global_step": 245379, "epoch": 2956} {"train_loss": -24.921781539916992, "global_step": 245380, "epoch": 2956} {"train_loss": -24.93268394470215, "global_step": 245381, "epoch": 2956} {"train_loss": -24.875532150268555, "global_step": 245382, "epoch": 2956} {"train_loss": -25.07061195373535, "global_step": 245383, "epoch": 2956} {"train_loss": -24.914226531982422, "global_step": 245384, "epoch": 2956} {"train_loss": -25.190021514892578, "global_step": 245385, "epoch": 2956} {"train_loss": -25.142423629760742, "global_step": 245386, "epoch": 2956} {"train_loss": -25.103801727294922, "global_step": 245387, "epoch": 2956} {"train_loss": -24.92396354675293, "global_step": 245388, "epoch": 2956} {"train_loss": -24.787004470825195, "global_step": 245389, "epoch": 2956} {"train_loss": -24.79804801940918, "global_step": 245390, "epoch": 2956} {"train_loss": -25.125137329101562, "global_step": 245391, "epoch": 2956} {"train_loss": -25.023752212524414, "global_step": 245392, "epoch": 2956} {"train_loss": -25.03504753112793, "global_step": 245393, "epoch": 2956} {"train_loss": -24.858240127563477, "global_step": 245394, "epoch": 2956} {"train_loss": -25.19228172302246, "global_step": 245395, "epoch": 2956} {"train_loss": -25.249710083007812, "global_step": 245396, "epoch": 2956} {"train_loss": -25.25485610961914, "global_step": 245397, "epoch": 2956} {"train_loss": -24.58964729309082, "global_step": 245398, "epoch": 2956} {"train_loss": -25.255109786987305, "global_step": 245399, "epoch": 2956} {"train_loss": -25.130577087402344, "global_step": 245400, "epoch": 2956} {"train_loss": -25.238794326782227, "global_step": 245401, "epoch": 2956} {"train_loss": -24.72320556640625, "global_step": 245402, "epoch": 2956} {"train_loss": -24.57986831665039, "global_step": 245403, "epoch": 2956} {"train_loss": -25.020671844482422, "global_step": 245404, "epoch": 2956} {"train_loss": -25.24458122253418, "global_step": 245405, "epoch": 2956} {"train_loss": -25.26089859008789, "global_step": 245406, "epoch": 2956} {"train_loss": -25.211973190307617, "global_step": 245407, "epoch": 2956} {"train_loss": -24.690702438354492, "global_step": 245408, "epoch": 2956} {"train_loss": -24.781112670898438, "global_step": 245409, "epoch": 2956} {"train_loss": -25.323474884033203, "global_step": 245410, "epoch": 2956} {"train_loss": -24.965730667114258, "global_step": 245411, "epoch": 2956} {"train_loss": -24.85944366455078, "global_step": 245412, "epoch": 2956} {"train_loss": -25.126585006713867, "global_step": 245413, "epoch": 2956} {"train_loss": -25.02034568786621, "global_step": 245414, "epoch": 2956} {"train_loss": -24.77996253967285, "global_step": 245415, "epoch": 2956} {"train_loss": -24.928604125976562, "global_step": 245416, "epoch": 2956} {"train_loss": -25.079687118530273, "global_step": 245417, "epoch": 2956} {"train_loss": -25.264028549194336, "global_step": 245418, "epoch": 2956} {"train_loss": -25.059629440307617, "global_step": 245419, "epoch": 2956} {"train_loss": -24.987619400024414, "global_step": 245420, "epoch": 2956} {"train_loss": -25.11907958984375, "global_step": 245421, "epoch": 2956} {"train_loss": -24.482372283935547, "global_step": 245422, "epoch": 2956} {"train_loss": -25.029504776000977, "global_step": 245423, "epoch": 2956} {"train_loss": -24.845502853393555, "global_step": 245424, "epoch": 2956} {"train_loss": -24.98287010192871, "global_step": 245425, "epoch": 2956} {"train_loss": -24.648181915283203, "global_step": 245426, "epoch": 2956} {"train_loss": -25.277441024780273, "global_step": 245427, "epoch": 2956} {"train_loss": -24.864824295043945, "global_step": 245428, "epoch": 2956} {"train_loss": -25.247451782226562, "global_step": 245429, "epoch": 2956} {"train_loss": -24.89876606952713, "global_step": 245430, "epoch": 2956, "val_loss": 6804871.0} {"train_loss": -24.306318283081055, "global_step": 245431, "epoch": 2957} {"train_loss": -24.236331939697266, "global_step": 245432, "epoch": 2957} {"train_loss": -24.596668243408203, "global_step": 245433, "epoch": 2957} {"train_loss": -24.32154655456543, "global_step": 245434, "epoch": 2957} {"train_loss": -24.676206588745117, "global_step": 245435, "epoch": 2957} {"train_loss": -24.626190185546875, "global_step": 245436, "epoch": 2957} {"train_loss": -24.747838973999023, "global_step": 245437, "epoch": 2957} {"train_loss": -24.914670944213867, "global_step": 245438, "epoch": 2957} {"train_loss": -24.399206161499023, "global_step": 245439, "epoch": 2957} {"train_loss": -24.795541763305664, "global_step": 245440, "epoch": 2957} {"train_loss": -24.947355270385742, "global_step": 245441, "epoch": 2957} {"train_loss": -24.610321044921875, "global_step": 245442, "epoch": 2957} {"train_loss": -24.948163986206055, "global_step": 245443, "epoch": 2957} {"train_loss": -24.678348541259766, "global_step": 245444, "epoch": 2957} {"train_loss": -25.050613403320312, "global_step": 245445, "epoch": 2957} {"train_loss": -24.16860580444336, "global_step": 245446, "epoch": 2957} {"train_loss": -24.276952743530273, "global_step": 245447, "epoch": 2957} {"train_loss": -24.74074363708496, "global_step": 245448, "epoch": 2957} {"train_loss": -24.582735061645508, "global_step": 245449, "epoch": 2957} {"train_loss": -24.833454132080078, "global_step": 245450, "epoch": 2957} {"train_loss": -24.769357681274414, "global_step": 245451, "epoch": 2957} {"train_loss": -24.74690055847168, "global_step": 245452, "epoch": 2957} {"train_loss": -25.1113224029541, "global_step": 245453, "epoch": 2957} {"train_loss": -24.57954978942871, "global_step": 245454, "epoch": 2957} {"train_loss": -24.307035446166992, "global_step": 245455, "epoch": 2957} {"train_loss": -24.64249610900879, "global_step": 245456, "epoch": 2957} {"train_loss": -24.07354736328125, "global_step": 245457, "epoch": 2957} {"train_loss": -24.90253257751465, "global_step": 245458, "epoch": 2957} {"train_loss": -24.55722999572754, "global_step": 245459, "epoch": 2957} {"train_loss": -24.842885971069336, "global_step": 245460, "epoch": 2957} {"train_loss": -25.27039909362793, "global_step": 245461, "epoch": 2957} {"train_loss": -25.209228515625, "global_step": 245462, "epoch": 2957} {"train_loss": -24.95638656616211, "global_step": 245463, "epoch": 2957} {"train_loss": -25.22517204284668, "global_step": 245464, "epoch": 2957} {"train_loss": -25.07049560546875, "global_step": 245465, "epoch": 2957} {"train_loss": -25.00774574279785, "global_step": 245466, "epoch": 2957} {"train_loss": -24.571298599243164, "global_step": 245467, "epoch": 2957} {"train_loss": -24.881872177124023, "global_step": 245468, "epoch": 2957} {"train_loss": -24.697696685791016, "global_step": 245469, "epoch": 2957} {"train_loss": -24.875835418701172, "global_step": 245470, "epoch": 2957} {"train_loss": -25.275833129882812, "global_step": 245471, "epoch": 2957} {"train_loss": -25.008235931396484, "global_step": 245472, "epoch": 2957} {"train_loss": -25.226491928100586, "global_step": 245473, "epoch": 2957} {"train_loss": -24.961994171142578, "global_step": 245474, "epoch": 2957} {"train_loss": -25.093597412109375, "global_step": 245475, "epoch": 2957} {"train_loss": -25.000646591186523, "global_step": 245476, "epoch": 2957} {"train_loss": -25.02956771850586, "global_step": 245477, "epoch": 2957} {"train_loss": -25.302593231201172, "global_step": 245478, "epoch": 2957} {"train_loss": -25.18036460876465, "global_step": 245479, "epoch": 2957} {"train_loss": -25.295196533203125, "global_step": 245480, "epoch": 2957} {"train_loss": -25.196426391601562, "global_step": 245481, "epoch": 2957} {"train_loss": -24.967695236206055, "global_step": 245482, "epoch": 2957} {"train_loss": -25.345815658569336, "global_step": 245483, "epoch": 2957} {"train_loss": -25.191558837890625, "global_step": 245484, "epoch": 2957} {"train_loss": -24.91840934753418, "global_step": 245485, "epoch": 2957} {"train_loss": -25.206113815307617, "global_step": 245486, "epoch": 2957} {"train_loss": -24.97474479675293, "global_step": 245487, "epoch": 2957} {"train_loss": -25.127229690551758, "global_step": 245488, "epoch": 2957} {"train_loss": -25.424728393554688, "global_step": 245489, "epoch": 2957} {"train_loss": -24.866741180419922, "global_step": 245490, "epoch": 2957} {"train_loss": -25.13114356994629, "global_step": 245491, "epoch": 2957} {"train_loss": -25.350271224975586, "global_step": 245492, "epoch": 2957} {"train_loss": -24.719465255737305, "global_step": 245493, "epoch": 2957} {"train_loss": -24.941068649291992, "global_step": 245494, "epoch": 2957} {"train_loss": -24.313663482666016, "global_step": 245495, "epoch": 2957} {"train_loss": -23.86429786682129, "global_step": 245496, "epoch": 2957} {"train_loss": -24.186859130859375, "global_step": 245497, "epoch": 2957} {"train_loss": -24.16328239440918, "global_step": 245498, "epoch": 2957} {"train_loss": -24.26881980895996, "global_step": 245499, "epoch": 2957} {"train_loss": -24.466154098510742, "global_step": 245500, "epoch": 2957} {"train_loss": -24.75094985961914, "global_step": 245501, "epoch": 2957} {"train_loss": -23.854764938354492, "global_step": 245502, "epoch": 2957} {"train_loss": -24.711225509643555, "global_step": 245503, "epoch": 2957} {"train_loss": -24.35257911682129, "global_step": 245504, "epoch": 2957} {"train_loss": -24.663265228271484, "global_step": 245505, "epoch": 2957} {"train_loss": -24.927881240844727, "global_step": 245506, "epoch": 2957} {"train_loss": -24.610849380493164, "global_step": 245507, "epoch": 2957} {"train_loss": -24.732845306396484, "global_step": 245508, "epoch": 2957} {"train_loss": -24.827512741088867, "global_step": 245509, "epoch": 2957} {"train_loss": -24.15032386779785, "global_step": 245510, "epoch": 2957} {"train_loss": -24.795148849487305, "global_step": 245511, "epoch": 2957} {"train_loss": -24.553110122680664, "global_step": 245512, "epoch": 2957} {"train_loss": -24.789304848176887, "global_step": 245513, "epoch": 2957, "val_loss": 6839256.0} {"train_loss": -24.537111282348633, "global_step": 245514, "epoch": 2958} {"train_loss": -24.468734741210938, "global_step": 245515, "epoch": 2958} {"train_loss": -24.320816040039062, "global_step": 245516, "epoch": 2958} {"train_loss": -24.640745162963867, "global_step": 245517, "epoch": 2958} {"train_loss": -24.154870986938477, "global_step": 245518, "epoch": 2958} {"train_loss": -24.470945358276367, "global_step": 245519, "epoch": 2958} {"train_loss": -24.46284294128418, "global_step": 245520, "epoch": 2958} {"train_loss": -24.274320602416992, "global_step": 245521, "epoch": 2958} {"train_loss": -24.813434600830078, "global_step": 245522, "epoch": 2958} {"train_loss": -24.310033798217773, "global_step": 245523, "epoch": 2958} {"train_loss": -24.90756607055664, "global_step": 245524, "epoch": 2958} {"train_loss": -25.064733505249023, "global_step": 245525, "epoch": 2958} {"train_loss": -24.774219512939453, "global_step": 245526, "epoch": 2958} {"train_loss": -24.845584869384766, "global_step": 245527, "epoch": 2958} {"train_loss": -24.59699821472168, "global_step": 245528, "epoch": 2958} {"train_loss": -24.795297622680664, "global_step": 245529, "epoch": 2958} {"train_loss": -24.995603561401367, "global_step": 245530, "epoch": 2958} {"train_loss": -24.68397331237793, "global_step": 245531, "epoch": 2958} {"train_loss": -24.844568252563477, "global_step": 245532, "epoch": 2958} {"train_loss": -24.693723678588867, "global_step": 245533, "epoch": 2958} {"train_loss": -24.442296981811523, "global_step": 245534, "epoch": 2958} {"train_loss": -25.010162353515625, "global_step": 245535, "epoch": 2958} {"train_loss": -25.114978790283203, "global_step": 245536, "epoch": 2958} {"train_loss": -25.308401107788086, "global_step": 245537, "epoch": 2958} {"train_loss": -24.728971481323242, "global_step": 245538, "epoch": 2958} {"train_loss": -24.546829223632812, "global_step": 245539, "epoch": 2958} {"train_loss": -24.99525260925293, "global_step": 245540, "epoch": 2958} {"train_loss": -25.024999618530273, "global_step": 245541, "epoch": 2958} {"train_loss": -25.14017105102539, "global_step": 245542, "epoch": 2958} {"train_loss": -24.95172882080078, "global_step": 245543, "epoch": 2958} {"train_loss": -24.62885856628418, "global_step": 245544, "epoch": 2958} {"train_loss": -25.282812118530273, "global_step": 245545, "epoch": 2958} {"train_loss": -25.282094955444336, "global_step": 245546, "epoch": 2958} {"train_loss": -24.77508544921875, "global_step": 245547, "epoch": 2958} {"train_loss": -24.994873046875, "global_step": 245548, "epoch": 2958} {"train_loss": -24.8985538482666, "global_step": 245549, "epoch": 2958} {"train_loss": -24.957075119018555, "global_step": 245550, "epoch": 2958} {"train_loss": -25.24259376525879, "global_step": 245551, "epoch": 2958} {"train_loss": -24.52658462524414, "global_step": 245552, "epoch": 2958} {"train_loss": -24.62605857849121, "global_step": 245553, "epoch": 2958} {"train_loss": -24.680795669555664, "global_step": 245554, "epoch": 2958} {"train_loss": -24.974899291992188, "global_step": 245555, "epoch": 2958} {"train_loss": -24.93596649169922, "global_step": 245556, "epoch": 2958} {"train_loss": -25.067977905273438, "global_step": 245557, "epoch": 2958} {"train_loss": -24.541669845581055, "global_step": 245558, "epoch": 2958} {"train_loss": -24.433908462524414, "global_step": 245559, "epoch": 2958} {"train_loss": -25.08955955505371, "global_step": 245560, "epoch": 2958} {"train_loss": -25.00287437438965, "global_step": 245561, "epoch": 2958} {"train_loss": -24.785350799560547, "global_step": 245562, "epoch": 2958} {"train_loss": -24.83125877380371, "global_step": 245563, "epoch": 2958} {"train_loss": -25.05708885192871, "global_step": 245564, "epoch": 2958} {"train_loss": -24.822677612304688, "global_step": 245565, "epoch": 2958} {"train_loss": -25.0237979888916, "global_step": 245566, "epoch": 2958} {"train_loss": -25.510311126708984, "global_step": 245567, "epoch": 2958} {"train_loss": -25.003612518310547, "global_step": 245568, "epoch": 2958} {"train_loss": -24.91407585144043, "global_step": 245569, "epoch": 2958} {"train_loss": -25.04277801513672, "global_step": 245570, "epoch": 2958} {"train_loss": -25.154098510742188, "global_step": 245571, "epoch": 2958} {"train_loss": -25.007253646850586, "global_step": 245572, "epoch": 2958} {"train_loss": -25.069612503051758, "global_step": 245573, "epoch": 2958} {"train_loss": -25.193952560424805, "global_step": 245574, "epoch": 2958} {"train_loss": -24.863515853881836, "global_step": 245575, "epoch": 2958} {"train_loss": -25.320383071899414, "global_step": 245576, "epoch": 2958} {"train_loss": -25.075809478759766, "global_step": 245577, "epoch": 2958} {"train_loss": -25.152982711791992, "global_step": 245578, "epoch": 2958} {"train_loss": -25.305837631225586, "global_step": 245579, "epoch": 2958} {"train_loss": -25.006656646728516, "global_step": 245580, "epoch": 2958} {"train_loss": -24.569074630737305, "global_step": 245581, "epoch": 2958} {"train_loss": -24.873214721679688, "global_step": 245582, "epoch": 2958} {"train_loss": -25.098602294921875, "global_step": 245583, "epoch": 2958} {"train_loss": -24.940338134765625, "global_step": 245584, "epoch": 2958} {"train_loss": -25.12433433532715, "global_step": 245585, "epoch": 2958} {"train_loss": -24.94086265563965, "global_step": 245586, "epoch": 2958} {"train_loss": -24.941308975219727, "global_step": 245587, "epoch": 2958} {"train_loss": -24.7947998046875, "global_step": 245588, "epoch": 2958} {"train_loss": -25.12860107421875, "global_step": 245589, "epoch": 2958} {"train_loss": -24.724342346191406, "global_step": 245590, "epoch": 2958} {"train_loss": -25.136930465698242, "global_step": 245591, "epoch": 2958} {"train_loss": -24.88470458984375, "global_step": 245592, "epoch": 2958} {"train_loss": -25.13628578186035, "global_step": 245593, "epoch": 2958} {"train_loss": -25.08150291442871, "global_step": 245594, "epoch": 2958} {"train_loss": -24.8275203704834, "global_step": 245595, "epoch": 2958} {"train_loss": -24.864141050591527, "global_step": 245596, "epoch": 2958, "val_loss": 6942293.0} {"train_loss": -24.104881286621094, "global_step": 245597, "epoch": 2959} {"train_loss": -24.075824737548828, "global_step": 245598, "epoch": 2959} {"train_loss": -24.26104736328125, "global_step": 245599, "epoch": 2959} {"train_loss": -24.62249755859375, "global_step": 245600, "epoch": 2959} {"train_loss": -24.379026412963867, "global_step": 245601, "epoch": 2959} {"train_loss": -24.42095375061035, "global_step": 245602, "epoch": 2959} {"train_loss": -24.607223510742188, "global_step": 245603, "epoch": 2959} {"train_loss": -24.627866744995117, "global_step": 245604, "epoch": 2959} {"train_loss": -24.6994686126709, "global_step": 245605, "epoch": 2959} {"train_loss": -24.664335250854492, "global_step": 245606, "epoch": 2959} {"train_loss": -24.833194732666016, "global_step": 245607, "epoch": 2959} {"train_loss": -25.003225326538086, "global_step": 245608, "epoch": 2959} {"train_loss": -24.69284439086914, "global_step": 245609, "epoch": 2959} {"train_loss": -25.023162841796875, "global_step": 245610, "epoch": 2959} {"train_loss": -24.93851089477539, "global_step": 245611, "epoch": 2959} {"train_loss": -25.0487003326416, "global_step": 245612, "epoch": 2959} {"train_loss": -24.683231353759766, "global_step": 245613, "epoch": 2959} {"train_loss": -25.20709800720215, "global_step": 245614, "epoch": 2959} {"train_loss": -24.790395736694336, "global_step": 245615, "epoch": 2959} {"train_loss": -25.116718292236328, "global_step": 245616, "epoch": 2959} {"train_loss": -24.61787986755371, "global_step": 245617, "epoch": 2959} {"train_loss": -25.274593353271484, "global_step": 245618, "epoch": 2959} {"train_loss": -24.779216766357422, "global_step": 245619, "epoch": 2959} {"train_loss": -25.10759735107422, "global_step": 245620, "epoch": 2959} {"train_loss": -24.708391189575195, "global_step": 245621, "epoch": 2959} {"train_loss": -24.696531295776367, "global_step": 245622, "epoch": 2959} {"train_loss": -24.812679290771484, "global_step": 245623, "epoch": 2959} {"train_loss": -25.03325080871582, "global_step": 245624, "epoch": 2959} {"train_loss": -24.930715560913086, "global_step": 245625, "epoch": 2959} {"train_loss": -24.931217193603516, "global_step": 245626, "epoch": 2959} {"train_loss": -25.044279098510742, "global_step": 245627, "epoch": 2959} {"train_loss": -24.94761085510254, "global_step": 245628, "epoch": 2959} {"train_loss": -24.88051414489746, "global_step": 245629, "epoch": 2959} {"train_loss": -24.652191162109375, "global_step": 245630, "epoch": 2959} {"train_loss": -24.951906204223633, "global_step": 245631, "epoch": 2959} {"train_loss": -24.875680923461914, "global_step": 245632, "epoch": 2959} {"train_loss": -24.89690589904785, "global_step": 245633, "epoch": 2959} {"train_loss": -24.837039947509766, "global_step": 245634, "epoch": 2959} {"train_loss": -24.902257919311523, "global_step": 245635, "epoch": 2959} {"train_loss": -25.291004180908203, "global_step": 245636, "epoch": 2959} {"train_loss": -25.273529052734375, "global_step": 245637, "epoch": 2959} {"train_loss": -24.967435836791992, "global_step": 245638, "epoch": 2959} {"train_loss": -25.2338924407959, "global_step": 245639, "epoch": 2959} {"train_loss": -24.83144760131836, "global_step": 245640, "epoch": 2959} {"train_loss": -24.96123695373535, "global_step": 245641, "epoch": 2959} {"train_loss": -25.17041015625, "global_step": 245642, "epoch": 2959} {"train_loss": -25.068891525268555, "global_step": 245643, "epoch": 2959} {"train_loss": -25.348203659057617, "global_step": 245644, "epoch": 2959} {"train_loss": -25.176937103271484, "global_step": 245645, "epoch": 2959} {"train_loss": -25.121461868286133, "global_step": 245646, "epoch": 2959} {"train_loss": -24.898962020874023, "global_step": 245647, "epoch": 2959} {"train_loss": -25.126544952392578, "global_step": 245648, "epoch": 2959} {"train_loss": -24.919967651367188, "global_step": 245649, "epoch": 2959} {"train_loss": -25.161773681640625, "global_step": 245650, "epoch": 2959} {"train_loss": -24.87236976623535, "global_step": 245651, "epoch": 2959} {"train_loss": -25.219533920288086, "global_step": 245652, "epoch": 2959} {"train_loss": -24.613327026367188, "global_step": 245653, "epoch": 2959} {"train_loss": -25.263275146484375, "global_step": 245654, "epoch": 2959} {"train_loss": -24.994626998901367, "global_step": 245655, "epoch": 2959} {"train_loss": -25.43812370300293, "global_step": 245656, "epoch": 2959} {"train_loss": -24.928808212280273, "global_step": 245657, "epoch": 2959} {"train_loss": -24.876577377319336, "global_step": 245658, "epoch": 2959} {"train_loss": -24.68732261657715, "global_step": 245659, "epoch": 2959} {"train_loss": -25.279300689697266, "global_step": 245660, "epoch": 2959} {"train_loss": -25.14366912841797, "global_step": 245661, "epoch": 2959} {"train_loss": -24.98331642150879, "global_step": 245662, "epoch": 2959} {"train_loss": -24.37391471862793, "global_step": 245663, "epoch": 2959} {"train_loss": -24.898229598999023, "global_step": 245664, "epoch": 2959} {"train_loss": -24.742717742919922, "global_step": 245665, "epoch": 2959} {"train_loss": -24.725200653076172, "global_step": 245666, "epoch": 2959} {"train_loss": -24.872318267822266, "global_step": 245667, "epoch": 2959} {"train_loss": -24.752227783203125, "global_step": 245668, "epoch": 2959} {"train_loss": -24.955219268798828, "global_step": 245669, "epoch": 2959} {"train_loss": -24.99310874938965, "global_step": 245670, "epoch": 2959} {"train_loss": -24.43825340270996, "global_step": 245671, "epoch": 2959} {"train_loss": -25.048294067382812, "global_step": 245672, "epoch": 2959} {"train_loss": -25.019187927246094, "global_step": 245673, "epoch": 2959} {"train_loss": -25.04794692993164, "global_step": 245674, "epoch": 2959} {"train_loss": -24.738208770751953, "global_step": 245675, "epoch": 2959} {"train_loss": -24.69944190979004, "global_step": 245676, "epoch": 2959} {"train_loss": -24.722400665283203, "global_step": 245677, "epoch": 2959} {"train_loss": -25.20966148376465, "global_step": 245678, "epoch": 2959} {"train_loss": -24.87741801250412, "global_step": 245679, "epoch": 2959, "val_loss": 6805629.0} {"train_loss": -23.973495483398438, "global_step": 245680, "epoch": 2960} {"train_loss": -23.566268920898438, "global_step": 245681, "epoch": 2960} {"train_loss": -24.591650009155273, "global_step": 245682, "epoch": 2960} {"train_loss": -24.00736427307129, "global_step": 245683, "epoch": 2960} {"train_loss": -24.254837036132812, "global_step": 245684, "epoch": 2960} {"train_loss": -24.128427505493164, "global_step": 245685, "epoch": 2960} {"train_loss": -23.972169876098633, "global_step": 245686, "epoch": 2960} {"train_loss": -23.811506271362305, "global_step": 245687, "epoch": 2960} {"train_loss": -24.489927291870117, "global_step": 245688, "epoch": 2960} {"train_loss": -24.552444458007812, "global_step": 245689, "epoch": 2960} {"train_loss": -24.67251968383789, "global_step": 245690, "epoch": 2960} {"train_loss": -24.69464111328125, "global_step": 245691, "epoch": 2960} {"train_loss": -24.274076461791992, "global_step": 245692, "epoch": 2960} {"train_loss": -24.675981521606445, "global_step": 245693, "epoch": 2960} {"train_loss": -24.61762046813965, "global_step": 245694, "epoch": 2960} {"train_loss": -24.811735153198242, "global_step": 245695, "epoch": 2960} {"train_loss": -24.808813095092773, "global_step": 245696, "epoch": 2960} {"train_loss": -24.905139923095703, "global_step": 245697, "epoch": 2960} {"train_loss": -24.777132034301758, "global_step": 245698, "epoch": 2960} {"train_loss": -25.153223037719727, "global_step": 245699, "epoch": 2960} {"train_loss": -24.716323852539062, "global_step": 245700, "epoch": 2960} {"train_loss": -24.985685348510742, "global_step": 245701, "epoch": 2960} {"train_loss": -25.021896362304688, "global_step": 245702, "epoch": 2960} {"train_loss": -25.166976928710938, "global_step": 245703, "epoch": 2960} {"train_loss": -24.685224533081055, "global_step": 245704, "epoch": 2960} {"train_loss": -24.577112197875977, "global_step": 245705, "epoch": 2960} {"train_loss": -24.6115779876709, "global_step": 245706, "epoch": 2960} {"train_loss": -24.731351852416992, "global_step": 245707, "epoch": 2960} {"train_loss": -25.062978744506836, "global_step": 245708, "epoch": 2960} {"train_loss": -24.989465713500977, "global_step": 245709, "epoch": 2960} {"train_loss": -24.81928825378418, "global_step": 245710, "epoch": 2960} {"train_loss": -24.71986961364746, "global_step": 245711, "epoch": 2960} {"train_loss": -24.908756256103516, "global_step": 245712, "epoch": 2960} {"train_loss": -25.541126251220703, "global_step": 245713, "epoch": 2960} {"train_loss": -24.96712303161621, "global_step": 245714, "epoch": 2960} {"train_loss": -24.977571487426758, "global_step": 245715, "epoch": 2960} {"train_loss": -25.0715274810791, "global_step": 245716, "epoch": 2960} {"train_loss": -25.046863555908203, "global_step": 245717, "epoch": 2960} {"train_loss": -24.849578857421875, "global_step": 245718, "epoch": 2960} {"train_loss": -25.07228660583496, "global_step": 245719, "epoch": 2960} {"train_loss": -24.55733299255371, "global_step": 245720, "epoch": 2960} {"train_loss": -24.768430709838867, "global_step": 245721, "epoch": 2960} {"train_loss": -25.306758880615234, "global_step": 245722, "epoch": 2960} {"train_loss": -25.155149459838867, "global_step": 245723, "epoch": 2960} {"train_loss": -24.5186767578125, "global_step": 245724, "epoch": 2960} {"train_loss": -24.911319732666016, "global_step": 245725, "epoch": 2960} {"train_loss": -25.37114715576172, "global_step": 245726, "epoch": 2960} {"train_loss": -24.958158493041992, "global_step": 245727, "epoch": 2960} {"train_loss": -25.1834774017334, "global_step": 245728, "epoch": 2960} {"train_loss": -25.162343978881836, "global_step": 245729, "epoch": 2960} {"train_loss": -25.435523986816406, "global_step": 245730, "epoch": 2960} {"train_loss": -25.406007766723633, "global_step": 245731, "epoch": 2960} {"train_loss": -25.350767135620117, "global_step": 245732, "epoch": 2960} {"train_loss": -25.431243896484375, "global_step": 245733, "epoch": 2960} {"train_loss": -24.92601776123047, "global_step": 245734, "epoch": 2960} {"train_loss": -25.28101348876953, "global_step": 245735, "epoch": 2960} {"train_loss": -25.439069747924805, "global_step": 245736, "epoch": 2960} {"train_loss": -25.13443374633789, "global_step": 245737, "epoch": 2960} {"train_loss": -24.789121627807617, "global_step": 245738, "epoch": 2960} {"train_loss": -24.945898056030273, "global_step": 245739, "epoch": 2960} {"train_loss": -25.228437423706055, "global_step": 245740, "epoch": 2960} {"train_loss": -24.99031639099121, "global_step": 245741, "epoch": 2960} {"train_loss": -25.108570098876953, "global_step": 245742, "epoch": 2960} {"train_loss": -25.0006160736084, "global_step": 245743, "epoch": 2960} {"train_loss": -24.92162322998047, "global_step": 245744, "epoch": 2960} {"train_loss": -25.065353393554688, "global_step": 245745, "epoch": 2960} {"train_loss": -25.364416122436523, "global_step": 245746, "epoch": 2960} {"train_loss": -24.9338436126709, "global_step": 245747, "epoch": 2960} {"train_loss": -24.591835021972656, "global_step": 245748, "epoch": 2960} {"train_loss": -24.43952751159668, "global_step": 245749, "epoch": 2960} {"train_loss": -24.220510482788086, "global_step": 245750, "epoch": 2960} {"train_loss": -24.727375030517578, "global_step": 245751, "epoch": 2960} {"train_loss": -25.100631713867188, "global_step": 245752, "epoch": 2960} {"train_loss": -24.924314498901367, "global_step": 245753, "epoch": 2960} {"train_loss": -24.55742073059082, "global_step": 245754, "epoch": 2960} {"train_loss": -25.1707706451416, "global_step": 245755, "epoch": 2960} {"train_loss": -25.042850494384766, "global_step": 245756, "epoch": 2960} {"train_loss": -24.482364654541016, "global_step": 245757, "epoch": 2960} {"train_loss": -24.609159469604492, "global_step": 245758, "epoch": 2960} {"train_loss": -24.85685157775879, "global_step": 245759, "epoch": 2960} {"train_loss": -24.673797607421875, "global_step": 245760, "epoch": 2960} {"train_loss": -25.068212509155273, "global_step": 245761, "epoch": 2960} {"train_loss": -24.84589859376471, "global_step": 245762, "epoch": 2960, "val_loss": 6989732.0} {"train_loss": -24.64021110534668, "global_step": 245763, "epoch": 2961} {"train_loss": -24.62040138244629, "global_step": 245764, "epoch": 2961} {"train_loss": -24.955551147460938, "global_step": 245765, "epoch": 2961} {"train_loss": -24.63028335571289, "global_step": 245766, "epoch": 2961} {"train_loss": -24.17487144470215, "global_step": 245767, "epoch": 2961} {"train_loss": -24.57158088684082, "global_step": 245768, "epoch": 2961} {"train_loss": -24.803070068359375, "global_step": 245769, "epoch": 2961} {"train_loss": -24.94561767578125, "global_step": 245770, "epoch": 2961} {"train_loss": -24.50814437866211, "global_step": 245771, "epoch": 2961} {"train_loss": -24.718549728393555, "global_step": 245772, "epoch": 2961} {"train_loss": -24.82832908630371, "global_step": 245773, "epoch": 2961} {"train_loss": -24.929487228393555, "global_step": 245774, "epoch": 2961} {"train_loss": -24.899534225463867, "global_step": 245775, "epoch": 2961} {"train_loss": -24.763303756713867, "global_step": 245776, "epoch": 2961} {"train_loss": -24.907766342163086, "global_step": 245777, "epoch": 2961} {"train_loss": -25.029264450073242, "global_step": 245778, "epoch": 2961} {"train_loss": -25.087326049804688, "global_step": 245779, "epoch": 2961} {"train_loss": -24.74561309814453, "global_step": 245780, "epoch": 2961} {"train_loss": -25.022682189941406, "global_step": 245781, "epoch": 2961} {"train_loss": -25.105655670166016, "global_step": 245782, "epoch": 2961} {"train_loss": -25.118907928466797, "global_step": 245783, "epoch": 2961} {"train_loss": -24.940000534057617, "global_step": 245784, "epoch": 2961} {"train_loss": -25.161819458007812, "global_step": 245785, "epoch": 2961} {"train_loss": -24.844362258911133, "global_step": 245786, "epoch": 2961} {"train_loss": -25.15036392211914, "global_step": 245787, "epoch": 2961} {"train_loss": -25.09041976928711, "global_step": 245788, "epoch": 2961} {"train_loss": -25.058198928833008, "global_step": 245789, "epoch": 2961} {"train_loss": -25.296985626220703, "global_step": 245790, "epoch": 2961} {"train_loss": -25.195497512817383, "global_step": 245791, "epoch": 2961} {"train_loss": -24.99705696105957, "global_step": 245792, "epoch": 2961} {"train_loss": -25.35986328125, "global_step": 245793, "epoch": 2961} {"train_loss": -24.91300392150879, "global_step": 245794, "epoch": 2961} {"train_loss": -25.037994384765625, "global_step": 245795, "epoch": 2961} {"train_loss": -25.321321487426758, "global_step": 245796, "epoch": 2961} {"train_loss": -24.985456466674805, "global_step": 245797, "epoch": 2961} {"train_loss": -25.45687484741211, "global_step": 245798, "epoch": 2961} {"train_loss": -25.188989639282227, "global_step": 245799, "epoch": 2961} {"train_loss": -25.017602920532227, "global_step": 245800, "epoch": 2961} {"train_loss": -24.949844360351562, "global_step": 245801, "epoch": 2961} {"train_loss": -24.811128616333008, "global_step": 245802, "epoch": 2961} {"train_loss": -25.128482818603516, "global_step": 245803, "epoch": 2961} {"train_loss": -25.011249542236328, "global_step": 245804, "epoch": 2961} {"train_loss": -24.68551254272461, "global_step": 245805, "epoch": 2961} {"train_loss": -24.6955623626709, "global_step": 245806, "epoch": 2961} {"train_loss": -24.376245498657227, "global_step": 245807, "epoch": 2961} {"train_loss": -25.077598571777344, "global_step": 245808, "epoch": 2961} {"train_loss": -24.5900936126709, "global_step": 245809, "epoch": 2961} {"train_loss": -24.563339233398438, "global_step": 245810, "epoch": 2961} {"train_loss": -24.890727996826172, "global_step": 245811, "epoch": 2961} {"train_loss": -24.706661224365234, "global_step": 245812, "epoch": 2961} {"train_loss": -24.574419021606445, "global_step": 245813, "epoch": 2961} {"train_loss": -24.81351661682129, "global_step": 245814, "epoch": 2961} {"train_loss": -24.71700096130371, "global_step": 245815, "epoch": 2961} {"train_loss": -24.907989501953125, "global_step": 245816, "epoch": 2961} {"train_loss": -24.83137321472168, "global_step": 245817, "epoch": 2961} {"train_loss": -24.3930721282959, "global_step": 245818, "epoch": 2961} {"train_loss": -24.964614868164062, "global_step": 245819, "epoch": 2961} {"train_loss": -24.509550094604492, "global_step": 245820, "epoch": 2961} {"train_loss": -24.943302154541016, "global_step": 245821, "epoch": 2961} {"train_loss": -25.09708595275879, "global_step": 245822, "epoch": 2961} {"train_loss": -25.140792846679688, "global_step": 245823, "epoch": 2961} {"train_loss": -24.683340072631836, "global_step": 245824, "epoch": 2961} {"train_loss": -24.7829647064209, "global_step": 245825, "epoch": 2961} {"train_loss": -24.93440818786621, "global_step": 245826, "epoch": 2961} {"train_loss": -25.298742294311523, "global_step": 245827, "epoch": 2961} {"train_loss": -25.240522384643555, "global_step": 245828, "epoch": 2961} {"train_loss": -24.74109649658203, "global_step": 245829, "epoch": 2961} {"train_loss": -24.88025665283203, "global_step": 245830, "epoch": 2961} {"train_loss": -24.929458618164062, "global_step": 245831, "epoch": 2961} {"train_loss": -24.59278678894043, "global_step": 245832, "epoch": 2961} {"train_loss": -25.068828582763672, "global_step": 245833, "epoch": 2961} {"train_loss": -24.881277084350586, "global_step": 245834, "epoch": 2961} {"train_loss": -25.17943000793457, "global_step": 245835, "epoch": 2961} {"train_loss": -25.1768856048584, "global_step": 245836, "epoch": 2961} {"train_loss": -25.209463119506836, "global_step": 245837, "epoch": 2961} {"train_loss": -25.30996322631836, "global_step": 245838, "epoch": 2961} {"train_loss": -24.34195327758789, "global_step": 245839, "epoch": 2961} {"train_loss": -24.936603546142578, "global_step": 245840, "epoch": 2961} {"train_loss": -25.06631851196289, "global_step": 245841, "epoch": 2961} {"train_loss": -24.87911033630371, "global_step": 245842, "epoch": 2961} {"train_loss": -25.015684127807617, "global_step": 245843, "epoch": 2961} {"train_loss": -25.20766258239746, "global_step": 245844, "epoch": 2961} {"train_loss": -24.908337673508978, "global_step": 245845, "epoch": 2961, "val_loss": 6745112.5} {"train_loss": -24.223217010498047, "global_step": 245846, "epoch": 2962} {"train_loss": -24.262441635131836, "global_step": 245847, "epoch": 2962} {"train_loss": -23.84381675720215, "global_step": 245848, "epoch": 2962} {"train_loss": -25.085189819335938, "global_step": 245849, "epoch": 2962} {"train_loss": -24.449216842651367, "global_step": 245850, "epoch": 2962} {"train_loss": -23.886682510375977, "global_step": 245851, "epoch": 2962} {"train_loss": -24.532512664794922, "global_step": 245852, "epoch": 2962} {"train_loss": -24.10999870300293, "global_step": 245853, "epoch": 2962} {"train_loss": -24.805618286132812, "global_step": 245854, "epoch": 2962} {"train_loss": -24.64659309387207, "global_step": 245855, "epoch": 2962} {"train_loss": -24.574342727661133, "global_step": 245856, "epoch": 2962} {"train_loss": -24.51386070251465, "global_step": 245857, "epoch": 2962} {"train_loss": -24.7790470123291, "global_step": 245858, "epoch": 2962} {"train_loss": -24.620756149291992, "global_step": 245859, "epoch": 2962} {"train_loss": -25.19361686706543, "global_step": 245860, "epoch": 2962} {"train_loss": -24.366779327392578, "global_step": 245861, "epoch": 2962} {"train_loss": -24.92782211303711, "global_step": 245862, "epoch": 2962} {"train_loss": -24.489065170288086, "global_step": 245863, "epoch": 2962} {"train_loss": -24.79522132873535, "global_step": 245864, "epoch": 2962} {"train_loss": -24.74686050415039, "global_step": 245865, "epoch": 2962} {"train_loss": -24.6661376953125, "global_step": 245866, "epoch": 2962} {"train_loss": -24.841989517211914, "global_step": 245867, "epoch": 2962} {"train_loss": -24.571367263793945, "global_step": 245868, "epoch": 2962} {"train_loss": -24.794281005859375, "global_step": 245869, "epoch": 2962} {"train_loss": -24.7430477142334, "global_step": 245870, "epoch": 2962} {"train_loss": -24.74885368347168, "global_step": 245871, "epoch": 2962} {"train_loss": -24.973737716674805, "global_step": 245872, "epoch": 2962} {"train_loss": -24.87984275817871, "global_step": 245873, "epoch": 2962} {"train_loss": -24.883380889892578, "global_step": 245874, "epoch": 2962} {"train_loss": -25.002099990844727, "global_step": 245875, "epoch": 2962} {"train_loss": -24.964574813842773, "global_step": 245876, "epoch": 2962} {"train_loss": -24.97892189025879, "global_step": 245877, "epoch": 2962} {"train_loss": -24.789548873901367, "global_step": 245878, "epoch": 2962} {"train_loss": -25.11720848083496, "global_step": 245879, "epoch": 2962} {"train_loss": -25.13276481628418, "global_step": 245880, "epoch": 2962} {"train_loss": -25.042814254760742, "global_step": 245881, "epoch": 2962} {"train_loss": -24.543745040893555, "global_step": 245882, "epoch": 2962} {"train_loss": -25.16090202331543, "global_step": 245883, "epoch": 2962} {"train_loss": -24.57234001159668, "global_step": 245884, "epoch": 2962} {"train_loss": -25.035444259643555, "global_step": 245885, "epoch": 2962} {"train_loss": -25.060373306274414, "global_step": 245886, "epoch": 2962} {"train_loss": -25.080411911010742, "global_step": 245887, "epoch": 2962} {"train_loss": -25.106910705566406, "global_step": 245888, "epoch": 2962} {"train_loss": -24.78607749938965, "global_step": 245889, "epoch": 2962} {"train_loss": -24.97395896911621, "global_step": 245890, "epoch": 2962} {"train_loss": -25.264516830444336, "global_step": 245891, "epoch": 2962} {"train_loss": -24.962095260620117, "global_step": 245892, "epoch": 2962} {"train_loss": -25.542098999023438, "global_step": 245893, "epoch": 2962} {"train_loss": -25.05586814880371, "global_step": 245894, "epoch": 2962} {"train_loss": -25.218353271484375, "global_step": 245895, "epoch": 2962} {"train_loss": -24.96739959716797, "global_step": 245896, "epoch": 2962} {"train_loss": -25.308645248413086, "global_step": 245897, "epoch": 2962} {"train_loss": -24.842798233032227, "global_step": 245898, "epoch": 2962} {"train_loss": -25.083707809448242, "global_step": 245899, "epoch": 2962} {"train_loss": -24.5445499420166, "global_step": 245900, "epoch": 2962} {"train_loss": -24.9359188079834, "global_step": 245901, "epoch": 2962} {"train_loss": -25.323291778564453, "global_step": 245902, "epoch": 2962} {"train_loss": -24.90959358215332, "global_step": 245903, "epoch": 2962} {"train_loss": -24.93604850769043, "global_step": 245904, "epoch": 2962} {"train_loss": -24.866012573242188, "global_step": 245905, "epoch": 2962} {"train_loss": -24.923324584960938, "global_step": 245906, "epoch": 2962} {"train_loss": -25.06534194946289, "global_step": 245907, "epoch": 2962} {"train_loss": -24.418842315673828, "global_step": 245908, "epoch": 2962} {"train_loss": -24.91046714782715, "global_step": 245909, "epoch": 2962} {"train_loss": -25.039770126342773, "global_step": 245910, "epoch": 2962} {"train_loss": -24.778676986694336, "global_step": 245911, "epoch": 2962} {"train_loss": -24.661725997924805, "global_step": 245912, "epoch": 2962} {"train_loss": -24.895734786987305, "global_step": 245913, "epoch": 2962} {"train_loss": -24.879541397094727, "global_step": 245914, "epoch": 2962} {"train_loss": -24.647445678710938, "global_step": 245915, "epoch": 2962} {"train_loss": -24.75611686706543, "global_step": 245916, "epoch": 2962} {"train_loss": -25.031930923461914, "global_step": 245917, "epoch": 2962} {"train_loss": -24.742490768432617, "global_step": 245918, "epoch": 2962} {"train_loss": -24.38115119934082, "global_step": 245919, "epoch": 2962} {"train_loss": -24.7829647064209, "global_step": 245920, "epoch": 2962} {"train_loss": -25.329256057739258, "global_step": 245921, "epoch": 2962} {"train_loss": -24.571420669555664, "global_step": 245922, "epoch": 2962} {"train_loss": -25.11200523376465, "global_step": 245923, "epoch": 2962} {"train_loss": -25.103361129760742, "global_step": 245924, "epoch": 2962} {"train_loss": -24.798608779907227, "global_step": 245925, "epoch": 2962} {"train_loss": -24.84761619567871, "global_step": 245926, "epoch": 2962} {"train_loss": -24.557044982910156, "global_step": 245927, "epoch": 2962} {"train_loss": -24.8152858320489, "global_step": 245928, "epoch": 2962, "val_loss": 6743582.0} {"train_loss": -24.566730499267578, "global_step": 245929, "epoch": 2963} {"train_loss": -24.57107925415039, "global_step": 245930, "epoch": 2963} {"train_loss": -24.735719680786133, "global_step": 245931, "epoch": 2963} {"train_loss": -24.006996154785156, "global_step": 245932, "epoch": 2963} {"train_loss": -24.564468383789062, "global_step": 245933, "epoch": 2963} {"train_loss": -24.442346572875977, "global_step": 245934, "epoch": 2963} {"train_loss": -24.325925827026367, "global_step": 245935, "epoch": 2963} {"train_loss": -24.426366806030273, "global_step": 245936, "epoch": 2963} {"train_loss": -24.641347885131836, "global_step": 245937, "epoch": 2963} {"train_loss": -24.69684410095215, "global_step": 245938, "epoch": 2963} {"train_loss": -24.832630157470703, "global_step": 245939, "epoch": 2963} {"train_loss": -24.475126266479492, "global_step": 245940, "epoch": 2963} {"train_loss": -24.629098892211914, "global_step": 245941, "epoch": 2963} {"train_loss": -24.553152084350586, "global_step": 245942, "epoch": 2963} {"train_loss": -24.820356369018555, "global_step": 245943, "epoch": 2963} {"train_loss": -24.629608154296875, "global_step": 245944, "epoch": 2963} {"train_loss": -24.593923568725586, "global_step": 245945, "epoch": 2963} {"train_loss": -24.743499755859375, "global_step": 245946, "epoch": 2963} {"train_loss": -24.930004119873047, "global_step": 245947, "epoch": 2963} {"train_loss": -25.107202529907227, "global_step": 245948, "epoch": 2963} {"train_loss": -24.916545867919922, "global_step": 245949, "epoch": 2963} {"train_loss": -24.769670486450195, "global_step": 245950, "epoch": 2963} {"train_loss": -24.765043258666992, "global_step": 245951, "epoch": 2963} {"train_loss": -24.84903907775879, "global_step": 245952, "epoch": 2963} {"train_loss": -24.77164649963379, "global_step": 245953, "epoch": 2963} {"train_loss": -24.709339141845703, "global_step": 245954, "epoch": 2963} {"train_loss": -24.9588680267334, "global_step": 245955, "epoch": 2963} {"train_loss": -24.818180084228516, "global_step": 245956, "epoch": 2963} {"train_loss": -25.31122398376465, "global_step": 245957, "epoch": 2963} {"train_loss": -25.289941787719727, "global_step": 245958, "epoch": 2963} {"train_loss": -24.878263473510742, "global_step": 245959, "epoch": 2963} {"train_loss": -25.07936668395996, "global_step": 245960, "epoch": 2963} {"train_loss": -25.05747413635254, "global_step": 245961, "epoch": 2963} {"train_loss": -25.2071590423584, "global_step": 245962, "epoch": 2963} {"train_loss": -25.14934730529785, "global_step": 245963, "epoch": 2963} {"train_loss": -25.13376808166504, "global_step": 245964, "epoch": 2963} {"train_loss": -24.685701370239258, "global_step": 245965, "epoch": 2963} {"train_loss": -25.02635955810547, "global_step": 245966, "epoch": 2963} {"train_loss": -24.9896297454834, "global_step": 245967, "epoch": 2963} {"train_loss": -25.126705169677734, "global_step": 245968, "epoch": 2963} {"train_loss": -25.08453941345215, "global_step": 245969, "epoch": 2963} {"train_loss": -25.298763275146484, "global_step": 245970, "epoch": 2963} {"train_loss": -25.2918643951416, "global_step": 245971, "epoch": 2963} {"train_loss": -25.28896141052246, "global_step": 245972, "epoch": 2963} {"train_loss": -25.172515869140625, "global_step": 245973, "epoch": 2963} {"train_loss": -24.76979637145996, "global_step": 245974, "epoch": 2963} {"train_loss": -24.390050888061523, "global_step": 245975, "epoch": 2963} {"train_loss": -24.557655334472656, "global_step": 245976, "epoch": 2963} {"train_loss": -24.159875869750977, "global_step": 245977, "epoch": 2963} {"train_loss": -24.17502784729004, "global_step": 245978, "epoch": 2963} {"train_loss": -24.30494499206543, "global_step": 245979, "epoch": 2963} {"train_loss": -25.023048400878906, "global_step": 245980, "epoch": 2963} {"train_loss": -25.139822006225586, "global_step": 245981, "epoch": 2963} {"train_loss": -24.809965133666992, "global_step": 245982, "epoch": 2963} {"train_loss": -25.205493927001953, "global_step": 245983, "epoch": 2963} {"train_loss": -24.75632667541504, "global_step": 245984, "epoch": 2963} {"train_loss": -24.57538414001465, "global_step": 245985, "epoch": 2963} {"train_loss": -24.74708366394043, "global_step": 245986, "epoch": 2963} {"train_loss": -24.935853958129883, "global_step": 245987, "epoch": 2963} {"train_loss": -24.841642379760742, "global_step": 245988, "epoch": 2963} {"train_loss": -24.707420349121094, "global_step": 245989, "epoch": 2963} {"train_loss": -25.009204864501953, "global_step": 245990, "epoch": 2963} {"train_loss": -24.89839744567871, "global_step": 245991, "epoch": 2963} {"train_loss": -25.124662399291992, "global_step": 245992, "epoch": 2963} {"train_loss": -24.906375885009766, "global_step": 245993, "epoch": 2963} {"train_loss": -24.97076416015625, "global_step": 245994, "epoch": 2963} {"train_loss": -24.73430824279785, "global_step": 245995, "epoch": 2963} {"train_loss": -24.80424690246582, "global_step": 245996, "epoch": 2963} {"train_loss": -25.126996994018555, "global_step": 245997, "epoch": 2963} {"train_loss": -24.87557029724121, "global_step": 245998, "epoch": 2963} {"train_loss": -24.86895751953125, "global_step": 245999, "epoch": 2963} {"train_loss": -24.93793296813965, "global_step": 246000, "epoch": 2963} {"train_loss": -25.09004783630371, "global_step": 246001, "epoch": 2963} {"train_loss": -25.34139060974121, "global_step": 246002, "epoch": 2963} {"train_loss": -24.987646102905273, "global_step": 246003, "epoch": 2963} {"train_loss": -24.768516540527344, "global_step": 246004, "epoch": 2963} {"train_loss": -25.119150161743164, "global_step": 246005, "epoch": 2963} {"train_loss": -25.26189422607422, "global_step": 246006, "epoch": 2963} {"train_loss": -25.531265258789062, "global_step": 246007, "epoch": 2963} {"train_loss": -24.954574584960938, "global_step": 246008, "epoch": 2963} {"train_loss": -25.135190963745117, "global_step": 246009, "epoch": 2963} {"train_loss": -24.711759567260742, "global_step": 246010, "epoch": 2963} {"train_loss": -24.863748803196184, "global_step": 246011, "epoch": 2963, "val_loss": 6856438.0} {"train_loss": -24.467483520507812, "global_step": 246012, "epoch": 2964} {"train_loss": -24.608230590820312, "global_step": 246013, "epoch": 2964} {"train_loss": -24.386005401611328, "global_step": 246014, "epoch": 2964} {"train_loss": -24.54359245300293, "global_step": 246015, "epoch": 2964} {"train_loss": -24.87207794189453, "global_step": 246016, "epoch": 2964} {"train_loss": -24.801776885986328, "global_step": 246017, "epoch": 2964} {"train_loss": -24.8543643951416, "global_step": 246018, "epoch": 2964} {"train_loss": -25.0445613861084, "global_step": 246019, "epoch": 2964} {"train_loss": -24.801837921142578, "global_step": 246020, "epoch": 2964} {"train_loss": -24.97132682800293, "global_step": 246021, "epoch": 2964} {"train_loss": -24.838552474975586, "global_step": 246022, "epoch": 2964} {"train_loss": -24.738100051879883, "global_step": 246023, "epoch": 2964} {"train_loss": -24.879304885864258, "global_step": 246024, "epoch": 2964} {"train_loss": -25.091352462768555, "global_step": 246025, "epoch": 2964} {"train_loss": -24.971845626831055, "global_step": 246026, "epoch": 2964} {"train_loss": -25.243528366088867, "global_step": 246027, "epoch": 2964} {"train_loss": -24.92508316040039, "global_step": 246028, "epoch": 2964} {"train_loss": -24.92082977294922, "global_step": 246029, "epoch": 2964} {"train_loss": -25.198711395263672, "global_step": 246030, "epoch": 2964} {"train_loss": -24.84535789489746, "global_step": 246031, "epoch": 2964} {"train_loss": -25.475513458251953, "global_step": 246032, "epoch": 2964} {"train_loss": -24.84787368774414, "global_step": 246033, "epoch": 2964} {"train_loss": -25.09059715270996, "global_step": 246034, "epoch": 2964} {"train_loss": -25.132062911987305, "global_step": 246035, "epoch": 2964} {"train_loss": -24.945730209350586, "global_step": 246036, "epoch": 2964} {"train_loss": -25.220184326171875, "global_step": 246037, "epoch": 2964} {"train_loss": -24.864364624023438, "global_step": 246038, "epoch": 2964} {"train_loss": -25.0847225189209, "global_step": 246039, "epoch": 2964} {"train_loss": -25.129146575927734, "global_step": 246040, "epoch": 2964} {"train_loss": -24.985239028930664, "global_step": 246041, "epoch": 2964} {"train_loss": -25.059972763061523, "global_step": 246042, "epoch": 2964} {"train_loss": -24.96438980102539, "global_step": 246043, "epoch": 2964} {"train_loss": -24.959598541259766, "global_step": 246044, "epoch": 2964} {"train_loss": -25.249109268188477, "global_step": 246045, "epoch": 2964} {"train_loss": -25.30111312866211, "global_step": 246046, "epoch": 2964} {"train_loss": -24.700347900390625, "global_step": 246047, "epoch": 2964} {"train_loss": -25.204248428344727, "global_step": 246048, "epoch": 2964} {"train_loss": -24.887922286987305, "global_step": 246049, "epoch": 2964} {"train_loss": -24.864160537719727, "global_step": 246050, "epoch": 2964} {"train_loss": -24.90260124206543, "global_step": 246051, "epoch": 2964} {"train_loss": -24.78293800354004, "global_step": 246052, "epoch": 2964} {"train_loss": -25.230236053466797, "global_step": 246053, "epoch": 2964} {"train_loss": -24.882347106933594, "global_step": 246054, "epoch": 2964} {"train_loss": -24.631183624267578, "global_step": 246055, "epoch": 2964} {"train_loss": -24.635133743286133, "global_step": 246056, "epoch": 2964} {"train_loss": -24.428390502929688, "global_step": 246057, "epoch": 2964} {"train_loss": -25.057544708251953, "global_step": 246058, "epoch": 2964} {"train_loss": -25.437456130981445, "global_step": 246059, "epoch": 2964} {"train_loss": -25.460643768310547, "global_step": 246060, "epoch": 2964} {"train_loss": -25.20153045654297, "global_step": 246061, "epoch": 2964} {"train_loss": -24.78183937072754, "global_step": 246062, "epoch": 2964} {"train_loss": -25.155029296875, "global_step": 246063, "epoch": 2964} {"train_loss": -25.045873641967773, "global_step": 246064, "epoch": 2964} {"train_loss": -25.06512451171875, "global_step": 246065, "epoch": 2964} {"train_loss": -25.17020606994629, "global_step": 246066, "epoch": 2964} {"train_loss": -25.28022575378418, "global_step": 246067, "epoch": 2964} {"train_loss": -25.09358787536621, "global_step": 246068, "epoch": 2964} {"train_loss": -24.879026412963867, "global_step": 246069, "epoch": 2964} {"train_loss": -24.845767974853516, "global_step": 246070, "epoch": 2964} {"train_loss": -25.018136978149414, "global_step": 246071, "epoch": 2964} {"train_loss": -24.885948181152344, "global_step": 246072, "epoch": 2964} {"train_loss": -25.18806266784668, "global_step": 246073, "epoch": 2964} {"train_loss": -24.897550582885742, "global_step": 246074, "epoch": 2964} {"train_loss": -24.815614700317383, "global_step": 246075, "epoch": 2964} {"train_loss": -25.354047775268555, "global_step": 246076, "epoch": 2964} {"train_loss": -24.776947021484375, "global_step": 246077, "epoch": 2964} {"train_loss": -25.161584854125977, "global_step": 246078, "epoch": 2964} {"train_loss": -24.64725112915039, "global_step": 246079, "epoch": 2964} {"train_loss": -24.99945831298828, "global_step": 246080, "epoch": 2964} {"train_loss": -24.707204818725586, "global_step": 246081, "epoch": 2964} {"train_loss": -25.127553939819336, "global_step": 246082, "epoch": 2964} {"train_loss": -24.90080451965332, "global_step": 246083, "epoch": 2964} {"train_loss": -24.967803955078125, "global_step": 246084, "epoch": 2964} {"train_loss": -24.885150909423828, "global_step": 246085, "epoch": 2964} {"train_loss": -24.777616500854492, "global_step": 246086, "epoch": 2964} {"train_loss": -24.67388343811035, "global_step": 246087, "epoch": 2964} {"train_loss": -25.30037498474121, "global_step": 246088, "epoch": 2964} {"train_loss": -25.034902572631836, "global_step": 246089, "epoch": 2964} {"train_loss": -25.270002365112305, "global_step": 246090, "epoch": 2964} {"train_loss": -25.21205711364746, "global_step": 246091, "epoch": 2964} {"train_loss": -24.89480972290039, "global_step": 246092, "epoch": 2964} {"train_loss": -24.899829864501953, "global_step": 246093, "epoch": 2964} {"train_loss": -24.954238202198443, "global_step": 246094, "epoch": 2964, "val_loss": 6834098.0} {"train_loss": -24.426462173461914, "global_step": 246095, "epoch": 2965} {"train_loss": -24.24169921875, "global_step": 246096, "epoch": 2965} {"train_loss": -24.340343475341797, "global_step": 246097, "epoch": 2965} {"train_loss": -24.409757614135742, "global_step": 246098, "epoch": 2965} {"train_loss": -24.703048706054688, "global_step": 246099, "epoch": 2965} {"train_loss": -24.803842544555664, "global_step": 246100, "epoch": 2965} {"train_loss": -24.691495895385742, "global_step": 246101, "epoch": 2965} {"train_loss": -24.47040557861328, "global_step": 246102, "epoch": 2965} {"train_loss": -24.612220764160156, "global_step": 246103, "epoch": 2965} {"train_loss": -24.428855895996094, "global_step": 246104, "epoch": 2965} {"train_loss": -24.829975128173828, "global_step": 246105, "epoch": 2965} {"train_loss": -24.57281494140625, "global_step": 246106, "epoch": 2965} {"train_loss": -24.711273193359375, "global_step": 246107, "epoch": 2965} {"train_loss": -24.649030685424805, "global_step": 246108, "epoch": 2965} {"train_loss": -24.964052200317383, "global_step": 246109, "epoch": 2965} {"train_loss": -24.74763298034668, "global_step": 246110, "epoch": 2965} {"train_loss": -24.943603515625, "global_step": 246111, "epoch": 2965} {"train_loss": -24.60694694519043, "global_step": 246112, "epoch": 2965} {"train_loss": -25.000343322753906, "global_step": 246113, "epoch": 2965} {"train_loss": -24.95667266845703, "global_step": 246114, "epoch": 2965} {"train_loss": -24.663755416870117, "global_step": 246115, "epoch": 2965} {"train_loss": -24.591293334960938, "global_step": 246116, "epoch": 2965} {"train_loss": -24.834630966186523, "global_step": 246117, "epoch": 2965} {"train_loss": -25.029144287109375, "global_step": 246118, "epoch": 2965} {"train_loss": -24.83534812927246, "global_step": 246119, "epoch": 2965} {"train_loss": -25.09197235107422, "global_step": 246120, "epoch": 2965} {"train_loss": -24.975263595581055, "global_step": 246121, "epoch": 2965} {"train_loss": -25.14447784423828, "global_step": 246122, "epoch": 2965} {"train_loss": -24.94183921813965, "global_step": 246123, "epoch": 2965} {"train_loss": -24.88204002380371, "global_step": 246124, "epoch": 2965} {"train_loss": -24.951345443725586, "global_step": 246125, "epoch": 2965} {"train_loss": -24.8026180267334, "global_step": 246126, "epoch": 2965} {"train_loss": -25.015859603881836, "global_step": 246127, "epoch": 2965} {"train_loss": -24.918088912963867, "global_step": 246128, "epoch": 2965} {"train_loss": -24.720508575439453, "global_step": 246129, "epoch": 2965} {"train_loss": -24.66815757751465, "global_step": 246130, "epoch": 2965} {"train_loss": -25.22059440612793, "global_step": 246131, "epoch": 2965} {"train_loss": -24.82554054260254, "global_step": 246132, "epoch": 2965} {"train_loss": -25.196165084838867, "global_step": 246133, "epoch": 2965} {"train_loss": -25.354618072509766, "global_step": 246134, "epoch": 2965} {"train_loss": -25.125131607055664, "global_step": 246135, "epoch": 2965} {"train_loss": -24.969520568847656, "global_step": 246136, "epoch": 2965} {"train_loss": -25.282983779907227, "global_step": 246137, "epoch": 2965} {"train_loss": -25.31659507751465, "global_step": 246138, "epoch": 2965} {"train_loss": -24.668365478515625, "global_step": 246139, "epoch": 2965} {"train_loss": -25.330718994140625, "global_step": 246140, "epoch": 2965} {"train_loss": -24.810062408447266, "global_step": 246141, "epoch": 2965} {"train_loss": -24.797382354736328, "global_step": 246142, "epoch": 2965} {"train_loss": -25.03621482849121, "global_step": 246143, "epoch": 2965} {"train_loss": -25.071908950805664, "global_step": 246144, "epoch": 2965} {"train_loss": -25.09347915649414, "global_step": 246145, "epoch": 2965} {"train_loss": -25.325307846069336, "global_step": 246146, "epoch": 2965} {"train_loss": -24.522476196289062, "global_step": 246147, "epoch": 2965} {"train_loss": -24.854297637939453, "global_step": 246148, "epoch": 2965} {"train_loss": -24.745281219482422, "global_step": 246149, "epoch": 2965} {"train_loss": -24.932376861572266, "global_step": 246150, "epoch": 2965} {"train_loss": -24.799217224121094, "global_step": 246151, "epoch": 2965} {"train_loss": -24.706022262573242, "global_step": 246152, "epoch": 2965} {"train_loss": -24.648042678833008, "global_step": 246153, "epoch": 2965} {"train_loss": -25.066617965698242, "global_step": 246154, "epoch": 2965} {"train_loss": -24.82771873474121, "global_step": 246155, "epoch": 2965} {"train_loss": -25.035242080688477, "global_step": 246156, "epoch": 2965} {"train_loss": -25.11049461364746, "global_step": 246157, "epoch": 2965} {"train_loss": -25.355112075805664, "global_step": 246158, "epoch": 2965} {"train_loss": -24.968976974487305, "global_step": 246159, "epoch": 2965} {"train_loss": -25.424030303955078, "global_step": 246160, "epoch": 2965} {"train_loss": -25.19416046142578, "global_step": 246161, "epoch": 2965} {"train_loss": -25.020925521850586, "global_step": 246162, "epoch": 2965} {"train_loss": -24.88367462158203, "global_step": 246163, "epoch": 2965} {"train_loss": -25.279144287109375, "global_step": 246164, "epoch": 2965} {"train_loss": -25.03962516784668, "global_step": 246165, "epoch": 2965} {"train_loss": -25.035749435424805, "global_step": 246166, "epoch": 2965} {"train_loss": -24.906309127807617, "global_step": 246167, "epoch": 2965} {"train_loss": -25.18426513671875, "global_step": 246168, "epoch": 2965} {"train_loss": -25.044864654541016, "global_step": 246169, "epoch": 2965} {"train_loss": -24.85373878479004, "global_step": 246170, "epoch": 2965} {"train_loss": -24.410446166992188, "global_step": 246171, "epoch": 2965} {"train_loss": -24.8326358795166, "global_step": 246172, "epoch": 2965} {"train_loss": -25.060529708862305, "global_step": 246173, "epoch": 2965} {"train_loss": -24.72633934020996, "global_step": 246174, "epoch": 2965} {"train_loss": -24.880014419555664, "global_step": 246175, "epoch": 2965} {"train_loss": -24.71116828918457, "global_step": 246176, "epoch": 2965} {"train_loss": -24.878055434629143, "global_step": 246177, "epoch": 2965, "val_loss": 6830484.0} {"train_loss": -24.599985122680664, "global_step": 246178, "epoch": 2966} {"train_loss": -24.486160278320312, "global_step": 246179, "epoch": 2966} {"train_loss": -25.05109977722168, "global_step": 246180, "epoch": 2966} {"train_loss": -24.789838790893555, "global_step": 246181, "epoch": 2966} {"train_loss": -25.007699966430664, "global_step": 246182, "epoch": 2966} {"train_loss": -24.14890480041504, "global_step": 246183, "epoch": 2966} {"train_loss": -24.56869125366211, "global_step": 246184, "epoch": 2966} {"train_loss": -24.6923828125, "global_step": 246185, "epoch": 2966} {"train_loss": -24.294614791870117, "global_step": 246186, "epoch": 2966} {"train_loss": -24.768131256103516, "global_step": 246187, "epoch": 2966} {"train_loss": -24.75998306274414, "global_step": 246188, "epoch": 2966} {"train_loss": -24.89571189880371, "global_step": 246189, "epoch": 2966} {"train_loss": -24.38941764831543, "global_step": 246190, "epoch": 2966} {"train_loss": -24.715497970581055, "global_step": 246191, "epoch": 2966} {"train_loss": -24.45058250427246, "global_step": 246192, "epoch": 2966} {"train_loss": -24.59370994567871, "global_step": 246193, "epoch": 2966} {"train_loss": -24.749420166015625, "global_step": 246194, "epoch": 2966} {"train_loss": -24.8316707611084, "global_step": 246195, "epoch": 2966} {"train_loss": -24.848867416381836, "global_step": 246196, "epoch": 2966} {"train_loss": -24.72491455078125, "global_step": 246197, "epoch": 2966} {"train_loss": -24.69205665588379, "global_step": 246198, "epoch": 2966} {"train_loss": -24.973508834838867, "global_step": 246199, "epoch": 2966} {"train_loss": -25.269033432006836, "global_step": 246200, "epoch": 2966} {"train_loss": -24.855850219726562, "global_step": 246201, "epoch": 2966} {"train_loss": -24.975788116455078, "global_step": 246202, "epoch": 2966} {"train_loss": -24.918622970581055, "global_step": 246203, "epoch": 2966} {"train_loss": -24.680227279663086, "global_step": 246204, "epoch": 2966} {"train_loss": -24.823257446289062, "global_step": 246205, "epoch": 2966} {"train_loss": -24.939611434936523, "global_step": 246206, "epoch": 2966} {"train_loss": -24.848966598510742, "global_step": 246207, "epoch": 2966} {"train_loss": -25.168134689331055, "global_step": 246208, "epoch": 2966} {"train_loss": -25.31842613220215, "global_step": 246209, "epoch": 2966} {"train_loss": -25.065317153930664, "global_step": 246210, "epoch": 2966} {"train_loss": -24.89046287536621, "global_step": 246211, "epoch": 2966} {"train_loss": -24.96491050720215, "global_step": 246212, "epoch": 2966} {"train_loss": -25.45368766784668, "global_step": 246213, "epoch": 2966} {"train_loss": -24.904048919677734, "global_step": 246214, "epoch": 2966} {"train_loss": -24.94516944885254, "global_step": 246215, "epoch": 2966} {"train_loss": -25.194334030151367, "global_step": 246216, "epoch": 2966} {"train_loss": -24.570850372314453, "global_step": 246217, "epoch": 2966} {"train_loss": -25.12746810913086, "global_step": 246218, "epoch": 2966} {"train_loss": -25.106201171875, "global_step": 246219, "epoch": 2966} {"train_loss": -25.233747482299805, "global_step": 246220, "epoch": 2966} {"train_loss": -25.105165481567383, "global_step": 246221, "epoch": 2966} {"train_loss": -25.230514526367188, "global_step": 246222, "epoch": 2966} {"train_loss": -25.068052291870117, "global_step": 246223, "epoch": 2966} {"train_loss": -25.10044288635254, "global_step": 246224, "epoch": 2966} {"train_loss": -25.268375396728516, "global_step": 246225, "epoch": 2966} {"train_loss": -25.038434982299805, "global_step": 246226, "epoch": 2966} {"train_loss": -24.3497257232666, "global_step": 246227, "epoch": 2966} {"train_loss": -24.3463077545166, "global_step": 246228, "epoch": 2966} {"train_loss": -23.954193115234375, "global_step": 246229, "epoch": 2966} {"train_loss": -24.054370880126953, "global_step": 246230, "epoch": 2966} {"train_loss": -24.732572555541992, "global_step": 246231, "epoch": 2966} {"train_loss": -24.518890380859375, "global_step": 246232, "epoch": 2966} {"train_loss": -23.695907592773438, "global_step": 246233, "epoch": 2966} {"train_loss": -24.056442260742188, "global_step": 246234, "epoch": 2966} {"train_loss": -24.853336334228516, "global_step": 246235, "epoch": 2966} {"train_loss": -24.527372360229492, "global_step": 246236, "epoch": 2966} {"train_loss": -24.718368530273438, "global_step": 246237, "epoch": 2966} {"train_loss": -24.305400848388672, "global_step": 246238, "epoch": 2966} {"train_loss": -24.42409324645996, "global_step": 246239, "epoch": 2966} {"train_loss": -24.623498916625977, "global_step": 246240, "epoch": 2966} {"train_loss": -23.81910514831543, "global_step": 246241, "epoch": 2966} {"train_loss": -24.720745086669922, "global_step": 246242, "epoch": 2966} {"train_loss": -24.419858932495117, "global_step": 246243, "epoch": 2966} {"train_loss": -24.63971519470215, "global_step": 246244, "epoch": 2966} {"train_loss": -24.7764949798584, "global_step": 246245, "epoch": 2966} {"train_loss": -24.241798400878906, "global_step": 246246, "epoch": 2966} {"train_loss": -24.702882766723633, "global_step": 246247, "epoch": 2966} {"train_loss": -24.583499908447266, "global_step": 246248, "epoch": 2966} {"train_loss": -24.893579483032227, "global_step": 246249, "epoch": 2966} {"train_loss": -24.58894157409668, "global_step": 246250, "epoch": 2966} {"train_loss": -24.40387725830078, "global_step": 246251, "epoch": 2966} {"train_loss": -24.418973922729492, "global_step": 246252, "epoch": 2966} {"train_loss": -24.92250633239746, "global_step": 246253, "epoch": 2966} {"train_loss": -24.60370445251465, "global_step": 246254, "epoch": 2966} {"train_loss": -24.58016586303711, "global_step": 246255, "epoch": 2966} {"train_loss": -24.570270538330078, "global_step": 246256, "epoch": 2966} {"train_loss": -24.58370590209961, "global_step": 246257, "epoch": 2966} {"train_loss": -24.96064567565918, "global_step": 246258, "epoch": 2966} {"train_loss": -24.746706008911133, "global_step": 246259, "epoch": 2966} {"train_loss": -24.72349665538374, "global_step": 246260, "epoch": 2966, "val_loss": 6987963.0} {"train_loss": -24.595285415649414, "global_step": 246261, "epoch": 2967} {"train_loss": -24.613698959350586, "global_step": 246262, "epoch": 2967} {"train_loss": -25.141061782836914, "global_step": 246263, "epoch": 2967} {"train_loss": -24.850717544555664, "global_step": 246264, "epoch": 2967} {"train_loss": -24.915021896362305, "global_step": 246265, "epoch": 2967} {"train_loss": -24.915058135986328, "global_step": 246266, "epoch": 2967} {"train_loss": -24.777360916137695, "global_step": 246267, "epoch": 2967} {"train_loss": -24.975570678710938, "global_step": 246268, "epoch": 2967} {"train_loss": -24.968372344970703, "global_step": 246269, "epoch": 2967} {"train_loss": -25.179941177368164, "global_step": 246270, "epoch": 2967} {"train_loss": -24.752328872680664, "global_step": 246271, "epoch": 2967} {"train_loss": -25.3233699798584, "global_step": 246272, "epoch": 2967} {"train_loss": -25.159164428710938, "global_step": 246273, "epoch": 2967} {"train_loss": -24.76204490661621, "global_step": 246274, "epoch": 2967} {"train_loss": -24.896940231323242, "global_step": 246275, "epoch": 2967} {"train_loss": -25.34232521057129, "global_step": 246276, "epoch": 2967} {"train_loss": -25.058246612548828, "global_step": 246277, "epoch": 2967} {"train_loss": -25.067371368408203, "global_step": 246278, "epoch": 2967} {"train_loss": -24.87038803100586, "global_step": 246279, "epoch": 2967} {"train_loss": -24.930234909057617, "global_step": 246280, "epoch": 2967} {"train_loss": -24.816125869750977, "global_step": 246281, "epoch": 2967} {"train_loss": -25.61577796936035, "global_step": 246282, "epoch": 2967} {"train_loss": -24.772979736328125, "global_step": 246283, "epoch": 2967} {"train_loss": -25.002952575683594, "global_step": 246284, "epoch": 2967} {"train_loss": -24.997013092041016, "global_step": 246285, "epoch": 2967} {"train_loss": -24.823633193969727, "global_step": 246286, "epoch": 2967} {"train_loss": -25.04117774963379, "global_step": 246287, "epoch": 2967} {"train_loss": -25.32306671142578, "global_step": 246288, "epoch": 2967} {"train_loss": -25.28224754333496, "global_step": 246289, "epoch": 2967} {"train_loss": -24.979917526245117, "global_step": 246290, "epoch": 2967} {"train_loss": -25.146657943725586, "global_step": 246291, "epoch": 2967} {"train_loss": -25.130308151245117, "global_step": 246292, "epoch": 2967} {"train_loss": -24.862485885620117, "global_step": 246293, "epoch": 2967} {"train_loss": -24.91707420349121, "global_step": 246294, "epoch": 2967} {"train_loss": -24.899572372436523, "global_step": 246295, "epoch": 2967} {"train_loss": -25.19464111328125, "global_step": 246296, "epoch": 2967} {"train_loss": -25.01860809326172, "global_step": 246297, "epoch": 2967} {"train_loss": -24.930072784423828, "global_step": 246298, "epoch": 2967} {"train_loss": -24.89642333984375, "global_step": 246299, "epoch": 2967} {"train_loss": -24.820585250854492, "global_step": 246300, "epoch": 2967} {"train_loss": -25.160062789916992, "global_step": 246301, "epoch": 2967} {"train_loss": -25.333023071289062, "global_step": 246302, "epoch": 2967} {"train_loss": -25.20891761779785, "global_step": 246303, "epoch": 2967} {"train_loss": -24.944866180419922, "global_step": 246304, "epoch": 2967} {"train_loss": -24.86588478088379, "global_step": 246305, "epoch": 2967} {"train_loss": -24.586637496948242, "global_step": 246306, "epoch": 2967} {"train_loss": -25.1922607421875, "global_step": 246307, "epoch": 2967} {"train_loss": -24.741479873657227, "global_step": 246308, "epoch": 2967} {"train_loss": -24.84372901916504, "global_step": 246309, "epoch": 2967} {"train_loss": -24.577119827270508, "global_step": 246310, "epoch": 2967} {"train_loss": -25.063867568969727, "global_step": 246311, "epoch": 2967} {"train_loss": -24.606918334960938, "global_step": 246312, "epoch": 2967} {"train_loss": -24.523046493530273, "global_step": 246313, "epoch": 2967} {"train_loss": -25.00723648071289, "global_step": 246314, "epoch": 2967} {"train_loss": -24.428918838500977, "global_step": 246315, "epoch": 2967} {"train_loss": -24.835607528686523, "global_step": 246316, "epoch": 2967} {"train_loss": -25.049880981445312, "global_step": 246317, "epoch": 2967} {"train_loss": -25.06542205810547, "global_step": 246318, "epoch": 2967} {"train_loss": -25.081602096557617, "global_step": 246319, "epoch": 2967} {"train_loss": -25.16370964050293, "global_step": 246320, "epoch": 2967} {"train_loss": -24.918123245239258, "global_step": 246321, "epoch": 2967} {"train_loss": -24.955503463745117, "global_step": 246322, "epoch": 2967} {"train_loss": -25.172115325927734, "global_step": 246323, "epoch": 2967} {"train_loss": -24.97769546508789, "global_step": 246324, "epoch": 2967} {"train_loss": -25.096616744995117, "global_step": 246325, "epoch": 2967} {"train_loss": -24.60346031188965, "global_step": 246326, "epoch": 2967} {"train_loss": -24.84433937072754, "global_step": 246327, "epoch": 2967} {"train_loss": -24.930973052978516, "global_step": 246328, "epoch": 2967} {"train_loss": -24.742834091186523, "global_step": 246329, "epoch": 2967} {"train_loss": -24.96892738342285, "global_step": 246330, "epoch": 2967} {"train_loss": -24.86774253845215, "global_step": 246331, "epoch": 2967} {"train_loss": -24.989818572998047, "global_step": 246332, "epoch": 2967} {"train_loss": -25.1733341217041, "global_step": 246333, "epoch": 2967} {"train_loss": -25.179462432861328, "global_step": 246334, "epoch": 2967} {"train_loss": -25.02430534362793, "global_step": 246335, "epoch": 2967} {"train_loss": -24.97572898864746, "global_step": 246336, "epoch": 2967} {"train_loss": -24.816699981689453, "global_step": 246337, "epoch": 2967} {"train_loss": -25.35280418395996, "global_step": 246338, "epoch": 2967} {"train_loss": -25.112167358398438, "global_step": 246339, "epoch": 2967} {"train_loss": -24.8817195892334, "global_step": 246340, "epoch": 2967} {"train_loss": -24.89546012878418, "global_step": 246341, "epoch": 2967} {"train_loss": -25.109956741333008, "global_step": 246342, "epoch": 2967} {"train_loss": -24.965658670448395, "global_step": 246343, "epoch": 2967, "val_loss": 6820191.0} {"train_loss": -25.07330322265625, "global_step": 246344, "epoch": 2968} {"train_loss": -24.23499870300293, "global_step": 246345, "epoch": 2968} {"train_loss": -24.481435775756836, "global_step": 246346, "epoch": 2968} {"train_loss": -24.093042373657227, "global_step": 246347, "epoch": 2968} {"train_loss": -24.460529327392578, "global_step": 246348, "epoch": 2968} {"train_loss": -24.98432731628418, "global_step": 246349, "epoch": 2968} {"train_loss": -24.523544311523438, "global_step": 246350, "epoch": 2968} {"train_loss": -24.810903549194336, "global_step": 246351, "epoch": 2968} {"train_loss": -24.8873348236084, "global_step": 246352, "epoch": 2968} {"train_loss": -24.68731117248535, "global_step": 246353, "epoch": 2968} {"train_loss": -24.700824737548828, "global_step": 246354, "epoch": 2968} {"train_loss": -24.824844360351562, "global_step": 246355, "epoch": 2968} {"train_loss": -25.01263427734375, "global_step": 246356, "epoch": 2968} {"train_loss": -24.656068801879883, "global_step": 246357, "epoch": 2968} {"train_loss": -24.899993896484375, "global_step": 246358, "epoch": 2968} {"train_loss": -24.75966453552246, "global_step": 246359, "epoch": 2968} {"train_loss": -24.960142135620117, "global_step": 246360, "epoch": 2968} {"train_loss": -24.937097549438477, "global_step": 246361, "epoch": 2968} {"train_loss": -25.13344383239746, "global_step": 246362, "epoch": 2968} {"train_loss": -24.890222549438477, "global_step": 246363, "epoch": 2968} {"train_loss": -25.06711196899414, "global_step": 246364, "epoch": 2968} {"train_loss": -24.743040084838867, "global_step": 246365, "epoch": 2968} {"train_loss": -24.99920654296875, "global_step": 246366, "epoch": 2968} {"train_loss": -24.904497146606445, "global_step": 246367, "epoch": 2968} {"train_loss": -24.936769485473633, "global_step": 246368, "epoch": 2968} {"train_loss": -25.05620574951172, "global_step": 246369, "epoch": 2968} {"train_loss": -24.892202377319336, "global_step": 246370, "epoch": 2968} {"train_loss": -25.02423667907715, "global_step": 246371, "epoch": 2968} {"train_loss": -25.059032440185547, "global_step": 246372, "epoch": 2968} {"train_loss": -24.941410064697266, "global_step": 246373, "epoch": 2968} {"train_loss": -25.256519317626953, "global_step": 246374, "epoch": 2968} {"train_loss": -24.60552215576172, "global_step": 246375, "epoch": 2968} {"train_loss": -24.691495895385742, "global_step": 246376, "epoch": 2968} {"train_loss": -24.8399658203125, "global_step": 246377, "epoch": 2968} {"train_loss": -25.07855796813965, "global_step": 246378, "epoch": 2968} {"train_loss": -24.9714412689209, "global_step": 246379, "epoch": 2968} {"train_loss": -25.066125869750977, "global_step": 246380, "epoch": 2968} {"train_loss": -25.1146240234375, "global_step": 246381, "epoch": 2968} {"train_loss": -25.008325576782227, "global_step": 246382, "epoch": 2968} {"train_loss": -24.92038345336914, "global_step": 246383, "epoch": 2968} {"train_loss": -25.31880760192871, "global_step": 246384, "epoch": 2968} {"train_loss": -24.66737174987793, "global_step": 246385, "epoch": 2968} {"train_loss": -24.75470542907715, "global_step": 246386, "epoch": 2968} {"train_loss": -25.45176887512207, "global_step": 246387, "epoch": 2968} {"train_loss": -25.094167709350586, "global_step": 246388, "epoch": 2968} {"train_loss": -24.66478729248047, "global_step": 246389, "epoch": 2968} {"train_loss": -25.20917320251465, "global_step": 246390, "epoch": 2968} {"train_loss": -25.26690673828125, "global_step": 246391, "epoch": 2968} {"train_loss": -24.876691818237305, "global_step": 246392, "epoch": 2968} {"train_loss": -25.00874137878418, "global_step": 246393, "epoch": 2968} {"train_loss": -24.723834991455078, "global_step": 246394, "epoch": 2968} {"train_loss": -25.036453247070312, "global_step": 246395, "epoch": 2968} {"train_loss": -25.193326950073242, "global_step": 246396, "epoch": 2968} {"train_loss": -24.837055206298828, "global_step": 246397, "epoch": 2968} {"train_loss": -25.207618713378906, "global_step": 246398, "epoch": 2968} {"train_loss": -25.236957550048828, "global_step": 246399, "epoch": 2968} {"train_loss": -25.144338607788086, "global_step": 246400, "epoch": 2968} {"train_loss": -25.042423248291016, "global_step": 246401, "epoch": 2968} {"train_loss": -25.03492546081543, "global_step": 246402, "epoch": 2968} {"train_loss": -25.25275230407715, "global_step": 246403, "epoch": 2968} {"train_loss": -24.83330726623535, "global_step": 246404, "epoch": 2968} {"train_loss": -24.951404571533203, "global_step": 246405, "epoch": 2968} {"train_loss": -24.628440856933594, "global_step": 246406, "epoch": 2968} {"train_loss": -25.28009796142578, "global_step": 246407, "epoch": 2968} {"train_loss": -25.208171844482422, "global_step": 246408, "epoch": 2968} {"train_loss": -24.924985885620117, "global_step": 246409, "epoch": 2968} {"train_loss": -24.8874454498291, "global_step": 246410, "epoch": 2968} {"train_loss": -25.141889572143555, "global_step": 246411, "epoch": 2968} {"train_loss": -24.907222747802734, "global_step": 246412, "epoch": 2968} {"train_loss": -25.230396270751953, "global_step": 246413, "epoch": 2968} {"train_loss": -25.040922164916992, "global_step": 246414, "epoch": 2968} {"train_loss": -25.25182342529297, "global_step": 246415, "epoch": 2968} {"train_loss": -25.153888702392578, "global_step": 246416, "epoch": 2968} {"train_loss": -24.91677474975586, "global_step": 246417, "epoch": 2968} {"train_loss": -24.999618530273438, "global_step": 246418, "epoch": 2968} {"train_loss": -25.308225631713867, "global_step": 246419, "epoch": 2968} {"train_loss": -25.38283348083496, "global_step": 246420, "epoch": 2968} {"train_loss": -25.01910972595215, "global_step": 246421, "epoch": 2968} {"train_loss": -25.41946792602539, "global_step": 246422, "epoch": 2968} {"train_loss": -25.255414962768555, "global_step": 246423, "epoch": 2968} {"train_loss": -25.147363662719727, "global_step": 246424, "epoch": 2968} {"train_loss": -25.516891479492188, "global_step": 246425, "epoch": 2968} {"train_loss": -24.95343343895602, "global_step": 246426, "epoch": 2968, "val_loss": 6734740.0} {"train_loss": -23.99115562438965, "global_step": 246427, "epoch": 2969} {"train_loss": -22.545856475830078, "global_step": 246428, "epoch": 2969} {"train_loss": -21.865217208862305, "global_step": 246429, "epoch": 2969} {"train_loss": -22.608125686645508, "global_step": 246430, "epoch": 2969} {"train_loss": -23.57143211364746, "global_step": 246431, "epoch": 2969} {"train_loss": -23.548282623291016, "global_step": 246432, "epoch": 2969} {"train_loss": -23.327838897705078, "global_step": 246433, "epoch": 2969} {"train_loss": -23.890094757080078, "global_step": 246434, "epoch": 2969} {"train_loss": -23.61166763305664, "global_step": 246435, "epoch": 2969} {"train_loss": -24.22755241394043, "global_step": 246436, "epoch": 2969} {"train_loss": -23.706457138061523, "global_step": 246437, "epoch": 2969} {"train_loss": -24.315067291259766, "global_step": 246438, "epoch": 2969} {"train_loss": -24.128097534179688, "global_step": 246439, "epoch": 2969} {"train_loss": -24.25812339782715, "global_step": 246440, "epoch": 2969} {"train_loss": -24.14154815673828, "global_step": 246441, "epoch": 2969} {"train_loss": -23.91203498840332, "global_step": 246442, "epoch": 2969} {"train_loss": -24.43025016784668, "global_step": 246443, "epoch": 2969} {"train_loss": -24.61125946044922, "global_step": 246444, "epoch": 2969} {"train_loss": -24.18767738342285, "global_step": 246445, "epoch": 2969} {"train_loss": -24.522022247314453, "global_step": 246446, "epoch": 2969} {"train_loss": -24.40907859802246, "global_step": 246447, "epoch": 2969} {"train_loss": -24.565597534179688, "global_step": 246448, "epoch": 2969} {"train_loss": -24.234495162963867, "global_step": 246449, "epoch": 2969} {"train_loss": -24.52448081970215, "global_step": 246450, "epoch": 2969} {"train_loss": -24.454458236694336, "global_step": 246451, "epoch": 2969} {"train_loss": -24.548431396484375, "global_step": 246452, "epoch": 2969} {"train_loss": -24.69140625, "global_step": 246453, "epoch": 2969} {"train_loss": -25.00935173034668, "global_step": 246454, "epoch": 2969} {"train_loss": -25.032062530517578, "global_step": 246455, "epoch": 2969} {"train_loss": -24.823898315429688, "global_step": 246456, "epoch": 2969} {"train_loss": -25.06496238708496, "global_step": 246457, "epoch": 2969} {"train_loss": -25.0208740234375, "global_step": 246458, "epoch": 2969} {"train_loss": -24.846494674682617, "global_step": 246459, "epoch": 2969} {"train_loss": -24.999027252197266, "global_step": 246460, "epoch": 2969} {"train_loss": -24.754138946533203, "global_step": 246461, "epoch": 2969} {"train_loss": -24.481149673461914, "global_step": 246462, "epoch": 2969} {"train_loss": -25.229110717773438, "global_step": 246463, "epoch": 2969} {"train_loss": -24.874746322631836, "global_step": 246464, "epoch": 2969} {"train_loss": -24.79619789123535, "global_step": 246465, "epoch": 2969} {"train_loss": -24.851964950561523, "global_step": 246466, "epoch": 2969} {"train_loss": -24.561120986938477, "global_step": 246467, "epoch": 2969} {"train_loss": -25.136022567749023, "global_step": 246468, "epoch": 2969} {"train_loss": -25.123327255249023, "global_step": 246469, "epoch": 2969} {"train_loss": -25.019710540771484, "global_step": 246470, "epoch": 2969} {"train_loss": -25.038414001464844, "global_step": 246471, "epoch": 2969} {"train_loss": -25.095144271850586, "global_step": 246472, "epoch": 2969} {"train_loss": -25.495351791381836, "global_step": 246473, "epoch": 2969} {"train_loss": -25.21193504333496, "global_step": 246474, "epoch": 2969} {"train_loss": -24.85048484802246, "global_step": 246475, "epoch": 2969} {"train_loss": -24.935956954956055, "global_step": 246476, "epoch": 2969} {"train_loss": -25.15730094909668, "global_step": 246477, "epoch": 2969} {"train_loss": -24.932558059692383, "global_step": 246478, "epoch": 2969} {"train_loss": -25.399850845336914, "global_step": 246479, "epoch": 2969} {"train_loss": -24.805944442749023, "global_step": 246480, "epoch": 2969} {"train_loss": -24.881052017211914, "global_step": 246481, "epoch": 2969} {"train_loss": -25.19405174255371, "global_step": 246482, "epoch": 2969} {"train_loss": -25.23307228088379, "global_step": 246483, "epoch": 2969} {"train_loss": -25.176301956176758, "global_step": 246484, "epoch": 2969} {"train_loss": -24.985456466674805, "global_step": 246485, "epoch": 2969} {"train_loss": -25.173234939575195, "global_step": 246486, "epoch": 2969} {"train_loss": -25.129186630249023, "global_step": 246487, "epoch": 2969} {"train_loss": -24.94061279296875, "global_step": 246488, "epoch": 2969} {"train_loss": -25.195880889892578, "global_step": 246489, "epoch": 2969} {"train_loss": -25.0352725982666, "global_step": 246490, "epoch": 2969} {"train_loss": -24.890714645385742, "global_step": 246491, "epoch": 2969} {"train_loss": -25.20963478088379, "global_step": 246492, "epoch": 2969} {"train_loss": -25.133472442626953, "global_step": 246493, "epoch": 2969} {"train_loss": -25.245853424072266, "global_step": 246494, "epoch": 2969} {"train_loss": -25.17436408996582, "global_step": 246495, "epoch": 2969} {"train_loss": -25.10761260986328, "global_step": 246496, "epoch": 2969} {"train_loss": -25.366188049316406, "global_step": 246497, "epoch": 2969} {"train_loss": -24.569116592407227, "global_step": 246498, "epoch": 2969} {"train_loss": -24.73302459716797, "global_step": 246499, "epoch": 2969} {"train_loss": -24.85797691345215, "global_step": 246500, "epoch": 2969} {"train_loss": -24.918169021606445, "global_step": 246501, "epoch": 2969} {"train_loss": -24.91257095336914, "global_step": 246502, "epoch": 2969} {"train_loss": -24.725616455078125, "global_step": 246503, "epoch": 2969} {"train_loss": -24.660398483276367, "global_step": 246504, "epoch": 2969} {"train_loss": -24.996530532836914, "global_step": 246505, "epoch": 2969} {"train_loss": -24.84229850769043, "global_step": 246506, "epoch": 2969} {"train_loss": -25.00787925720215, "global_step": 246507, "epoch": 2969} {"train_loss": -24.805952072143555, "global_step": 246508, "epoch": 2969} {"train_loss": -24.66393808571689, "global_step": 246509, "epoch": 2969, "val_loss": 7005949.5} {"train_loss": -24.584875106811523, "global_step": 246510, "epoch": 2970} {"train_loss": -25.061790466308594, "global_step": 246511, "epoch": 2970} {"train_loss": -24.44881248474121, "global_step": 246512, "epoch": 2970} {"train_loss": -24.50726890563965, "global_step": 246513, "epoch": 2970} {"train_loss": -24.631244659423828, "global_step": 246514, "epoch": 2970} {"train_loss": -24.58387565612793, "global_step": 246515, "epoch": 2970} {"train_loss": -24.6759033203125, "global_step": 246516, "epoch": 2970} {"train_loss": -24.193456649780273, "global_step": 246517, "epoch": 2970} {"train_loss": -24.660446166992188, "global_step": 246518, "epoch": 2970} {"train_loss": -24.346128463745117, "global_step": 246519, "epoch": 2970} {"train_loss": -24.64505958557129, "global_step": 246520, "epoch": 2970} {"train_loss": -24.346582412719727, "global_step": 246521, "epoch": 2970} {"train_loss": -25.06097984313965, "global_step": 246522, "epoch": 2970} {"train_loss": -24.44304847717285, "global_step": 246523, "epoch": 2970} {"train_loss": -24.461332321166992, "global_step": 246524, "epoch": 2970} {"train_loss": -24.82261085510254, "global_step": 246525, "epoch": 2970} {"train_loss": -25.003284454345703, "global_step": 246526, "epoch": 2970} {"train_loss": -24.052228927612305, "global_step": 246527, "epoch": 2970} {"train_loss": -24.972610473632812, "global_step": 246528, "epoch": 2970} {"train_loss": -24.240928649902344, "global_step": 246529, "epoch": 2970} {"train_loss": -25.06452751159668, "global_step": 246530, "epoch": 2970} {"train_loss": -24.609161376953125, "global_step": 246531, "epoch": 2970} {"train_loss": -25.132770538330078, "global_step": 246532, "epoch": 2970} {"train_loss": -24.848682403564453, "global_step": 246533, "epoch": 2970} {"train_loss": -24.719907760620117, "global_step": 246534, "epoch": 2970} {"train_loss": -24.71396255493164, "global_step": 246535, "epoch": 2970} {"train_loss": -24.898038864135742, "global_step": 246536, "epoch": 2970} {"train_loss": -24.943878173828125, "global_step": 246537, "epoch": 2970} {"train_loss": -25.078588485717773, "global_step": 246538, "epoch": 2970} {"train_loss": -24.83934211730957, "global_step": 246539, "epoch": 2970} {"train_loss": -24.700157165527344, "global_step": 246540, "epoch": 2970} {"train_loss": -24.938013076782227, "global_step": 246541, "epoch": 2970} {"train_loss": -24.91358757019043, "global_step": 246542, "epoch": 2970} {"train_loss": -25.00354766845703, "global_step": 246543, "epoch": 2970} {"train_loss": -24.85381317138672, "global_step": 246544, "epoch": 2970} {"train_loss": -25.289997100830078, "global_step": 246545, "epoch": 2970} {"train_loss": -24.780689239501953, "global_step": 246546, "epoch": 2970} {"train_loss": -24.877744674682617, "global_step": 246547, "epoch": 2970} {"train_loss": -25.001256942749023, "global_step": 246548, "epoch": 2970} {"train_loss": -25.016862869262695, "global_step": 246549, "epoch": 2970} {"train_loss": -25.159225463867188, "global_step": 246550, "epoch": 2970} {"train_loss": -25.241300582885742, "global_step": 246551, "epoch": 2970} {"train_loss": -24.975751876831055, "global_step": 246552, "epoch": 2970} {"train_loss": -25.397960662841797, "global_step": 246553, "epoch": 2970} {"train_loss": -25.057430267333984, "global_step": 246554, "epoch": 2970} {"train_loss": -24.76715660095215, "global_step": 246555, "epoch": 2970} {"train_loss": -25.162643432617188, "global_step": 246556, "epoch": 2970} {"train_loss": -25.08432388305664, "global_step": 246557, "epoch": 2970} {"train_loss": -24.86065673828125, "global_step": 246558, "epoch": 2970} {"train_loss": -24.506521224975586, "global_step": 246559, "epoch": 2970} {"train_loss": -25.189199447631836, "global_step": 246560, "epoch": 2970} {"train_loss": -24.995012283325195, "global_step": 246561, "epoch": 2970} {"train_loss": -24.905820846557617, "global_step": 246562, "epoch": 2970} {"train_loss": -24.805803298950195, "global_step": 246563, "epoch": 2970} {"train_loss": -25.203468322753906, "global_step": 246564, "epoch": 2970} {"train_loss": -24.57790184020996, "global_step": 246565, "epoch": 2970} {"train_loss": -24.423765182495117, "global_step": 246566, "epoch": 2970} {"train_loss": -24.887788772583008, "global_step": 246567, "epoch": 2970} {"train_loss": -25.105478286743164, "global_step": 246568, "epoch": 2970} {"train_loss": -24.34980583190918, "global_step": 246569, "epoch": 2970} {"train_loss": -24.15250015258789, "global_step": 246570, "epoch": 2970} {"train_loss": -24.959157943725586, "global_step": 246571, "epoch": 2970} {"train_loss": -24.296926498413086, "global_step": 246572, "epoch": 2970} {"train_loss": -25.006114959716797, "global_step": 246573, "epoch": 2970} {"train_loss": -24.845876693725586, "global_step": 246574, "epoch": 2970} {"train_loss": -24.594205856323242, "global_step": 246575, "epoch": 2970} {"train_loss": -24.76559829711914, "global_step": 246576, "epoch": 2970} {"train_loss": -25.118696212768555, "global_step": 246577, "epoch": 2970} {"train_loss": -24.606367111206055, "global_step": 246578, "epoch": 2970} {"train_loss": -24.705522537231445, "global_step": 246579, "epoch": 2970} {"train_loss": -24.80795669555664, "global_step": 246580, "epoch": 2970} {"train_loss": -24.82857322692871, "global_step": 246581, "epoch": 2970} {"train_loss": -24.569599151611328, "global_step": 246582, "epoch": 2970} {"train_loss": -24.80057716369629, "global_step": 246583, "epoch": 2970} {"train_loss": -24.938825607299805, "global_step": 246584, "epoch": 2970} {"train_loss": -24.891569137573242, "global_step": 246585, "epoch": 2970} {"train_loss": -24.694049835205078, "global_step": 246586, "epoch": 2970} {"train_loss": -24.9688777923584, "global_step": 246587, "epoch": 2970} {"train_loss": -25.184974670410156, "global_step": 246588, "epoch": 2970} {"train_loss": -24.968114852905273, "global_step": 246589, "epoch": 2970} {"train_loss": -25.250600814819336, "global_step": 246590, "epoch": 2970} {"train_loss": -24.893070220947266, "global_step": 246591, "epoch": 2970} {"train_loss": -24.814332226672803, "global_step": 246592, "epoch": 2970, "val_loss": 6770274.0} {"train_loss": -24.691024780273438, "global_step": 246593, "epoch": 2971} {"train_loss": -24.742046356201172, "global_step": 246594, "epoch": 2971} {"train_loss": -24.593164443969727, "global_step": 246595, "epoch": 2971} {"train_loss": -25.33690643310547, "global_step": 246596, "epoch": 2971} {"train_loss": -24.571252822875977, "global_step": 246597, "epoch": 2971} {"train_loss": -25.14125633239746, "global_step": 246598, "epoch": 2971} {"train_loss": -24.724027633666992, "global_step": 246599, "epoch": 2971} {"train_loss": -24.660184860229492, "global_step": 246600, "epoch": 2971} {"train_loss": -24.836977005004883, "global_step": 246601, "epoch": 2971} {"train_loss": -25.128952026367188, "global_step": 246602, "epoch": 2971} {"train_loss": -24.96982765197754, "global_step": 246603, "epoch": 2971} {"train_loss": -24.870779037475586, "global_step": 246604, "epoch": 2971} {"train_loss": -25.011587142944336, "global_step": 246605, "epoch": 2971} {"train_loss": -25.185102462768555, "global_step": 246606, "epoch": 2971} {"train_loss": -25.195131301879883, "global_step": 246607, "epoch": 2971} {"train_loss": -24.926023483276367, "global_step": 246608, "epoch": 2971} {"train_loss": -25.139646530151367, "global_step": 246609, "epoch": 2971} {"train_loss": -24.785707473754883, "global_step": 246610, "epoch": 2971} {"train_loss": -25.038619995117188, "global_step": 246611, "epoch": 2971} {"train_loss": -24.9923152923584, "global_step": 246612, "epoch": 2971} {"train_loss": -25.080196380615234, "global_step": 246613, "epoch": 2971} {"train_loss": -24.7882080078125, "global_step": 246614, "epoch": 2971} {"train_loss": -25.14471435546875, "global_step": 246615, "epoch": 2971} {"train_loss": -24.688840866088867, "global_step": 246616, "epoch": 2971} {"train_loss": -24.845678329467773, "global_step": 246617, "epoch": 2971} {"train_loss": -25.035858154296875, "global_step": 246618, "epoch": 2971} {"train_loss": -25.05805015563965, "global_step": 246619, "epoch": 2971} {"train_loss": -25.135793685913086, "global_step": 246620, "epoch": 2971} {"train_loss": -24.934202194213867, "global_step": 246621, "epoch": 2971} {"train_loss": -24.842077255249023, "global_step": 246622, "epoch": 2971} {"train_loss": -25.133373260498047, "global_step": 246623, "epoch": 2971} {"train_loss": -25.0616397857666, "global_step": 246624, "epoch": 2971} {"train_loss": -25.061567306518555, "global_step": 246625, "epoch": 2971} {"train_loss": -24.913955688476562, "global_step": 246626, "epoch": 2971} {"train_loss": -25.275959014892578, "global_step": 246627, "epoch": 2971} {"train_loss": -24.860570907592773, "global_step": 246628, "epoch": 2971} {"train_loss": -25.052906036376953, "global_step": 246629, "epoch": 2971} {"train_loss": -25.106168746948242, "global_step": 246630, "epoch": 2971} {"train_loss": -24.702783584594727, "global_step": 246631, "epoch": 2971} {"train_loss": -25.23814582824707, "global_step": 246632, "epoch": 2971} {"train_loss": -25.109827041625977, "global_step": 246633, "epoch": 2971} {"train_loss": -24.577960968017578, "global_step": 246634, "epoch": 2971} {"train_loss": -24.745986938476562, "global_step": 246635, "epoch": 2971} {"train_loss": -24.699848175048828, "global_step": 246636, "epoch": 2971} {"train_loss": -24.824438095092773, "global_step": 246637, "epoch": 2971} {"train_loss": -25.35542869567871, "global_step": 246638, "epoch": 2971} {"train_loss": -25.229246139526367, "global_step": 246639, "epoch": 2971} {"train_loss": -24.75655174255371, "global_step": 246640, "epoch": 2971} {"train_loss": -24.9955997467041, "global_step": 246641, "epoch": 2971} {"train_loss": -25.06800651550293, "global_step": 246642, "epoch": 2971} {"train_loss": -24.795547485351562, "global_step": 246643, "epoch": 2971} {"train_loss": -25.212566375732422, "global_step": 246644, "epoch": 2971} {"train_loss": -24.782445907592773, "global_step": 246645, "epoch": 2971} {"train_loss": -24.71697998046875, "global_step": 246646, "epoch": 2971} {"train_loss": -25.09149932861328, "global_step": 246647, "epoch": 2971} {"train_loss": -25.028757095336914, "global_step": 246648, "epoch": 2971} {"train_loss": -24.731698989868164, "global_step": 246649, "epoch": 2971} {"train_loss": -24.620553970336914, "global_step": 246650, "epoch": 2971} {"train_loss": -24.855510711669922, "global_step": 246651, "epoch": 2971} {"train_loss": -24.833833694458008, "global_step": 246652, "epoch": 2971} {"train_loss": -24.61445426940918, "global_step": 246653, "epoch": 2971} {"train_loss": -25.178075790405273, "global_step": 246654, "epoch": 2971} {"train_loss": -24.773666381835938, "global_step": 246655, "epoch": 2971} {"train_loss": -24.80521011352539, "global_step": 246656, "epoch": 2971} {"train_loss": -25.087024688720703, "global_step": 246657, "epoch": 2971} {"train_loss": -24.904769897460938, "global_step": 246658, "epoch": 2971} {"train_loss": -25.304025650024414, "global_step": 246659, "epoch": 2971} {"train_loss": -25.210519790649414, "global_step": 246660, "epoch": 2971} {"train_loss": -25.10308265686035, "global_step": 246661, "epoch": 2971} {"train_loss": -25.1839656829834, "global_step": 246662, "epoch": 2971} {"train_loss": -25.151355743408203, "global_step": 246663, "epoch": 2971} {"train_loss": -25.075424194335938, "global_step": 246664, "epoch": 2971} {"train_loss": -24.667043685913086, "global_step": 246665, "epoch": 2971} {"train_loss": -24.94251823425293, "global_step": 246666, "epoch": 2971} {"train_loss": -24.791547775268555, "global_step": 246667, "epoch": 2971} {"train_loss": -25.077728271484375, "global_step": 246668, "epoch": 2971} {"train_loss": -25.16914939880371, "global_step": 246669, "epoch": 2971} {"train_loss": -25.142154693603516, "global_step": 246670, "epoch": 2971} {"train_loss": -25.032817840576172, "global_step": 246671, "epoch": 2971} {"train_loss": -25.237470626831055, "global_step": 246672, "epoch": 2971} {"train_loss": -25.414052963256836, "global_step": 246673, "epoch": 2971} {"train_loss": -25.075864791870117, "global_step": 246674, "epoch": 2971} {"train_loss": -24.98894277825413, "global_step": 246675, "epoch": 2971, "val_loss": 6812602.5} {"train_loss": -24.840726852416992, "global_step": 246676, "epoch": 2972} {"train_loss": -24.64543342590332, "global_step": 246677, "epoch": 2972} {"train_loss": -24.8121337890625, "global_step": 246678, "epoch": 2972} {"train_loss": -25.060853958129883, "global_step": 246679, "epoch": 2972} {"train_loss": -25.02053451538086, "global_step": 246680, "epoch": 2972} {"train_loss": -24.823102951049805, "global_step": 246681, "epoch": 2972} {"train_loss": -25.113529205322266, "global_step": 246682, "epoch": 2972} {"train_loss": -25.209522247314453, "global_step": 246683, "epoch": 2972} {"train_loss": -24.82084083557129, "global_step": 246684, "epoch": 2972} {"train_loss": -25.011796951293945, "global_step": 246685, "epoch": 2972} {"train_loss": -24.72555923461914, "global_step": 246686, "epoch": 2972} {"train_loss": -25.124107360839844, "global_step": 246687, "epoch": 2972} {"train_loss": -25.052658081054688, "global_step": 246688, "epoch": 2972} {"train_loss": -25.12058448791504, "global_step": 246689, "epoch": 2972} {"train_loss": -24.90915298461914, "global_step": 246690, "epoch": 2972} {"train_loss": -25.125593185424805, "global_step": 246691, "epoch": 2972} {"train_loss": -24.881397247314453, "global_step": 246692, "epoch": 2972} {"train_loss": -24.942026138305664, "global_step": 246693, "epoch": 2972} {"train_loss": -24.837610244750977, "global_step": 246694, "epoch": 2972} {"train_loss": -24.93690299987793, "global_step": 246695, "epoch": 2972} {"train_loss": -24.92133140563965, "global_step": 246696, "epoch": 2972} {"train_loss": -25.055709838867188, "global_step": 246697, "epoch": 2972} {"train_loss": -24.978647232055664, "global_step": 246698, "epoch": 2972} {"train_loss": -25.014965057373047, "global_step": 246699, "epoch": 2972} {"train_loss": -24.780641555786133, "global_step": 246700, "epoch": 2972} {"train_loss": -24.648969650268555, "global_step": 246701, "epoch": 2972} {"train_loss": -24.784828186035156, "global_step": 246702, "epoch": 2972} {"train_loss": -24.492685317993164, "global_step": 246703, "epoch": 2972} {"train_loss": -24.627696990966797, "global_step": 246704, "epoch": 2972} {"train_loss": -25.17693519592285, "global_step": 246705, "epoch": 2972} {"train_loss": -25.04193687438965, "global_step": 246706, "epoch": 2972} {"train_loss": -24.813974380493164, "global_step": 246707, "epoch": 2972} {"train_loss": -24.770917892456055, "global_step": 246708, "epoch": 2972} {"train_loss": -24.864086151123047, "global_step": 246709, "epoch": 2972} {"train_loss": -24.64655876159668, "global_step": 246710, "epoch": 2972} {"train_loss": -24.787782669067383, "global_step": 246711, "epoch": 2972} {"train_loss": -24.785350799560547, "global_step": 246712, "epoch": 2972} {"train_loss": -24.708921432495117, "global_step": 246713, "epoch": 2972} {"train_loss": -25.236356735229492, "global_step": 246714, "epoch": 2972} {"train_loss": -25.065704345703125, "global_step": 246715, "epoch": 2972} {"train_loss": -25.199506759643555, "global_step": 246716, "epoch": 2972} {"train_loss": -24.94893455505371, "global_step": 246717, "epoch": 2972} {"train_loss": -24.95895767211914, "global_step": 246718, "epoch": 2972} {"train_loss": -24.89919090270996, "global_step": 246719, "epoch": 2972} {"train_loss": -24.921308517456055, "global_step": 246720, "epoch": 2972} {"train_loss": -24.962217330932617, "global_step": 246721, "epoch": 2972} {"train_loss": -25.03898048400879, "global_step": 246722, "epoch": 2972} {"train_loss": -25.043540954589844, "global_step": 246723, "epoch": 2972} {"train_loss": -24.74233627319336, "global_step": 246724, "epoch": 2972} {"train_loss": -24.891305923461914, "global_step": 246725, "epoch": 2972} {"train_loss": -25.010025024414062, "global_step": 246726, "epoch": 2972} {"train_loss": -25.38651466369629, "global_step": 246727, "epoch": 2972} {"train_loss": -25.15888786315918, "global_step": 246728, "epoch": 2972} {"train_loss": -25.11135482788086, "global_step": 246729, "epoch": 2972} {"train_loss": -24.749418258666992, "global_step": 246730, "epoch": 2972} {"train_loss": -25.091249465942383, "global_step": 246731, "epoch": 2972} {"train_loss": -24.939273834228516, "global_step": 246732, "epoch": 2972} {"train_loss": -24.940284729003906, "global_step": 246733, "epoch": 2972} {"train_loss": -24.815847396850586, "global_step": 246734, "epoch": 2972} {"train_loss": -24.961645126342773, "global_step": 246735, "epoch": 2972} {"train_loss": -25.316633224487305, "global_step": 246736, "epoch": 2972} {"train_loss": -24.66754722595215, "global_step": 246737, "epoch": 2972} {"train_loss": -24.811195373535156, "global_step": 246738, "epoch": 2972} {"train_loss": -25.093557357788086, "global_step": 246739, "epoch": 2972} {"train_loss": -25.050851821899414, "global_step": 246740, "epoch": 2972} {"train_loss": -25.455902099609375, "global_step": 246741, "epoch": 2972} {"train_loss": -24.766706466674805, "global_step": 246742, "epoch": 2972} {"train_loss": -24.887460708618164, "global_step": 246743, "epoch": 2972} {"train_loss": -25.165014266967773, "global_step": 246744, "epoch": 2972} {"train_loss": -25.431121826171875, "global_step": 246745, "epoch": 2972} {"train_loss": -24.854145050048828, "global_step": 246746, "epoch": 2972} {"train_loss": -24.855422973632812, "global_step": 246747, "epoch": 2972} {"train_loss": -25.085948944091797, "global_step": 246748, "epoch": 2972} {"train_loss": -25.057411193847656, "global_step": 246749, "epoch": 2972} {"train_loss": -25.1103515625, "global_step": 246750, "epoch": 2972} {"train_loss": -25.165264129638672, "global_step": 246751, "epoch": 2972} {"train_loss": -24.752553939819336, "global_step": 246752, "epoch": 2972} {"train_loss": -24.94780921936035, "global_step": 246753, "epoch": 2972} {"train_loss": -25.215633392333984, "global_step": 246754, "epoch": 2972} {"train_loss": -24.519948959350586, "global_step": 246755, "epoch": 2972} {"train_loss": -24.61913299560547, "global_step": 246756, "epoch": 2972} {"train_loss": -23.87504005432129, "global_step": 246757, "epoch": 2972} {"train_loss": -24.93345214659909, "global_step": 246758, "epoch": 2972, "val_loss": 6973487.0} {"train_loss": -24.079296112060547, "global_step": 246759, "epoch": 2973} {"train_loss": -23.4196720123291, "global_step": 246760, "epoch": 2973} {"train_loss": -24.378936767578125, "global_step": 246761, "epoch": 2973} {"train_loss": -24.24439811706543, "global_step": 246762, "epoch": 2973} {"train_loss": -24.06060218811035, "global_step": 246763, "epoch": 2973} {"train_loss": -24.321945190429688, "global_step": 246764, "epoch": 2973} {"train_loss": -24.289152145385742, "global_step": 246765, "epoch": 2973} {"train_loss": -24.06622886657715, "global_step": 246766, "epoch": 2973} {"train_loss": -24.32368278503418, "global_step": 246767, "epoch": 2973} {"train_loss": -24.35677146911621, "global_step": 246768, "epoch": 2973} {"train_loss": -24.671567916870117, "global_step": 246769, "epoch": 2973} {"train_loss": -24.19510269165039, "global_step": 246770, "epoch": 2973} {"train_loss": -24.38875389099121, "global_step": 246771, "epoch": 2973} {"train_loss": -24.24216079711914, "global_step": 246772, "epoch": 2973} {"train_loss": -24.557817459106445, "global_step": 246773, "epoch": 2973} {"train_loss": -24.495664596557617, "global_step": 246774, "epoch": 2973} {"train_loss": -24.405471801757812, "global_step": 246775, "epoch": 2973} {"train_loss": -24.34400749206543, "global_step": 246776, "epoch": 2973} {"train_loss": -24.55048179626465, "global_step": 246777, "epoch": 2973} {"train_loss": -24.5469970703125, "global_step": 246778, "epoch": 2973} {"train_loss": -24.885421752929688, "global_step": 246779, "epoch": 2973} {"train_loss": -24.623619079589844, "global_step": 246780, "epoch": 2973} {"train_loss": -24.537885665893555, "global_step": 246781, "epoch": 2973} {"train_loss": -24.70416831970215, "global_step": 246782, "epoch": 2973} {"train_loss": -24.397043228149414, "global_step": 246783, "epoch": 2973} {"train_loss": -24.47480583190918, "global_step": 246784, "epoch": 2973} {"train_loss": -24.68892478942871, "global_step": 246785, "epoch": 2973} {"train_loss": -24.622583389282227, "global_step": 246786, "epoch": 2973} {"train_loss": -24.646574020385742, "global_step": 246787, "epoch": 2973} {"train_loss": -24.98986053466797, "global_step": 246788, "epoch": 2973} {"train_loss": -24.627164840698242, "global_step": 246789, "epoch": 2973} {"train_loss": -24.865692138671875, "global_step": 246790, "epoch": 2973} {"train_loss": -25.16766357421875, "global_step": 246791, "epoch": 2973} {"train_loss": -24.875741958618164, "global_step": 246792, "epoch": 2973} {"train_loss": -24.914356231689453, "global_step": 246793, "epoch": 2973} {"train_loss": -25.532339096069336, "global_step": 246794, "epoch": 2973} {"train_loss": -24.963525772094727, "global_step": 246795, "epoch": 2973} {"train_loss": -25.259225845336914, "global_step": 246796, "epoch": 2973} {"train_loss": -24.978464126586914, "global_step": 246797, "epoch": 2973} {"train_loss": -25.119659423828125, "global_step": 246798, "epoch": 2973} {"train_loss": -24.98834228515625, "global_step": 246799, "epoch": 2973} {"train_loss": -24.613739013671875, "global_step": 246800, "epoch": 2973} {"train_loss": -25.03388786315918, "global_step": 246801, "epoch": 2973} {"train_loss": -25.317485809326172, "global_step": 246802, "epoch": 2973} {"train_loss": -24.98539161682129, "global_step": 246803, "epoch": 2973} {"train_loss": -24.911067962646484, "global_step": 246804, "epoch": 2973} {"train_loss": -25.20936393737793, "global_step": 246805, "epoch": 2973} {"train_loss": -25.225631713867188, "global_step": 246806, "epoch": 2973} {"train_loss": -25.032865524291992, "global_step": 246807, "epoch": 2973} {"train_loss": -24.961488723754883, "global_step": 246808, "epoch": 2973} {"train_loss": -24.80000114440918, "global_step": 246809, "epoch": 2973} {"train_loss": -25.24238395690918, "global_step": 246810, "epoch": 2973} {"train_loss": -24.9649600982666, "global_step": 246811, "epoch": 2973} {"train_loss": -24.638158798217773, "global_step": 246812, "epoch": 2973} {"train_loss": -24.992645263671875, "global_step": 246813, "epoch": 2973} {"train_loss": -24.634544372558594, "global_step": 246814, "epoch": 2973} {"train_loss": -24.951099395751953, "global_step": 246815, "epoch": 2973} {"train_loss": -25.210018157958984, "global_step": 246816, "epoch": 2973} {"train_loss": -24.41347312927246, "global_step": 246817, "epoch": 2973} {"train_loss": -25.06563377380371, "global_step": 246818, "epoch": 2973} {"train_loss": -25.04291343688965, "global_step": 246819, "epoch": 2973} {"train_loss": -24.785362243652344, "global_step": 246820, "epoch": 2973} {"train_loss": -24.530216217041016, "global_step": 246821, "epoch": 2973} {"train_loss": -24.91798973083496, "global_step": 246822, "epoch": 2973} {"train_loss": -24.545774459838867, "global_step": 246823, "epoch": 2973} {"train_loss": -25.056264877319336, "global_step": 246824, "epoch": 2973} {"train_loss": -24.593652725219727, "global_step": 246825, "epoch": 2973} {"train_loss": -24.4344425201416, "global_step": 246826, "epoch": 2973} {"train_loss": -24.956741333007812, "global_step": 246827, "epoch": 2973} {"train_loss": -24.65521240234375, "global_step": 246828, "epoch": 2973} {"train_loss": -25.006412506103516, "global_step": 246829, "epoch": 2973} {"train_loss": -25.251113891601562, "global_step": 246830, "epoch": 2973} {"train_loss": -24.474821090698242, "global_step": 246831, "epoch": 2973} {"train_loss": -24.838491439819336, "global_step": 246832, "epoch": 2973} {"train_loss": -25.00772476196289, "global_step": 246833, "epoch": 2973} {"train_loss": -24.89999771118164, "global_step": 246834, "epoch": 2973} {"train_loss": -24.975988388061523, "global_step": 246835, "epoch": 2973} {"train_loss": -24.889331817626953, "global_step": 246836, "epoch": 2973} {"train_loss": -24.716081619262695, "global_step": 246837, "epoch": 2973} {"train_loss": -24.766286849975586, "global_step": 246838, "epoch": 2973} {"train_loss": -24.86240577697754, "global_step": 246839, "epoch": 2973} {"train_loss": -24.84439468383789, "global_step": 246840, "epoch": 2973} {"train_loss": -24.724922318056404, "global_step": 246841, "epoch": 2973, "val_loss": 6777366.5} {"train_loss": -24.898582458496094, "global_step": 246842, "epoch": 2974} {"train_loss": -24.707040786743164, "global_step": 246843, "epoch": 2974} {"train_loss": -24.656766891479492, "global_step": 246844, "epoch": 2974} {"train_loss": -24.588966369628906, "global_step": 246845, "epoch": 2974} {"train_loss": -24.36729621887207, "global_step": 246846, "epoch": 2974} {"train_loss": -24.226654052734375, "global_step": 246847, "epoch": 2974} {"train_loss": -24.73004150390625, "global_step": 246848, "epoch": 2974} {"train_loss": -24.4268741607666, "global_step": 246849, "epoch": 2974} {"train_loss": -24.955854415893555, "global_step": 246850, "epoch": 2974} {"train_loss": -24.455657958984375, "global_step": 246851, "epoch": 2974} {"train_loss": -24.751611709594727, "global_step": 246852, "epoch": 2974} {"train_loss": -24.688764572143555, "global_step": 246853, "epoch": 2974} {"train_loss": -24.646900177001953, "global_step": 246854, "epoch": 2974} {"train_loss": -25.0374813079834, "global_step": 246855, "epoch": 2974} {"train_loss": -24.525175094604492, "global_step": 246856, "epoch": 2974} {"train_loss": -24.880146026611328, "global_step": 246857, "epoch": 2974} {"train_loss": -24.736175537109375, "global_step": 246858, "epoch": 2974} {"train_loss": -24.863161087036133, "global_step": 246859, "epoch": 2974} {"train_loss": -24.765033721923828, "global_step": 246860, "epoch": 2974} {"train_loss": -24.82448387145996, "global_step": 246861, "epoch": 2974} {"train_loss": -24.96929359436035, "global_step": 246862, "epoch": 2974} {"train_loss": -25.17549705505371, "global_step": 246863, "epoch": 2974} {"train_loss": -24.85493278503418, "global_step": 246864, "epoch": 2974} {"train_loss": -25.100629806518555, "global_step": 246865, "epoch": 2974} {"train_loss": -25.179731369018555, "global_step": 246866, "epoch": 2974} {"train_loss": -25.17835807800293, "global_step": 246867, "epoch": 2974} {"train_loss": -24.577978134155273, "global_step": 246868, "epoch": 2974} {"train_loss": -24.84616470336914, "global_step": 246869, "epoch": 2974} {"train_loss": -25.104551315307617, "global_step": 246870, "epoch": 2974} {"train_loss": -25.42983055114746, "global_step": 246871, "epoch": 2974} {"train_loss": -25.13020133972168, "global_step": 246872, "epoch": 2974} {"train_loss": -24.869413375854492, "global_step": 246873, "epoch": 2974} {"train_loss": -25.37591552734375, "global_step": 246874, "epoch": 2974} {"train_loss": -24.9437198638916, "global_step": 246875, "epoch": 2974} {"train_loss": -25.23420524597168, "global_step": 246876, "epoch": 2974} {"train_loss": -25.032203674316406, "global_step": 246877, "epoch": 2974} {"train_loss": -24.741174697875977, "global_step": 246878, "epoch": 2974} {"train_loss": -25.460920333862305, "global_step": 246879, "epoch": 2974} {"train_loss": -25.24592399597168, "global_step": 246880, "epoch": 2974} {"train_loss": -24.971832275390625, "global_step": 246881, "epoch": 2974} {"train_loss": -25.042495727539062, "global_step": 246882, "epoch": 2974} {"train_loss": -24.984045028686523, "global_step": 246883, "epoch": 2974} {"train_loss": -24.923385620117188, "global_step": 246884, "epoch": 2974} {"train_loss": -25.18113136291504, "global_step": 246885, "epoch": 2974} {"train_loss": -25.0667724609375, "global_step": 246886, "epoch": 2974} {"train_loss": -25.193424224853516, "global_step": 246887, "epoch": 2974} {"train_loss": -24.78175926208496, "global_step": 246888, "epoch": 2974} {"train_loss": -24.456518173217773, "global_step": 246889, "epoch": 2974} {"train_loss": -24.479568481445312, "global_step": 246890, "epoch": 2974} {"train_loss": -24.799806594848633, "global_step": 246891, "epoch": 2974} {"train_loss": -25.08745002746582, "global_step": 246892, "epoch": 2974} {"train_loss": -24.675748825073242, "global_step": 246893, "epoch": 2974} {"train_loss": -24.360881805419922, "global_step": 246894, "epoch": 2974} {"train_loss": -24.80864906311035, "global_step": 246895, "epoch": 2974} {"train_loss": -24.230010986328125, "global_step": 246896, "epoch": 2974} {"train_loss": -24.05729103088379, "global_step": 246897, "epoch": 2974} {"train_loss": -24.48733901977539, "global_step": 246898, "epoch": 2974} {"train_loss": -24.941694259643555, "global_step": 246899, "epoch": 2974} {"train_loss": -24.671602249145508, "global_step": 246900, "epoch": 2974} {"train_loss": -24.508344650268555, "global_step": 246901, "epoch": 2974} {"train_loss": -25.36614418029785, "global_step": 246902, "epoch": 2974} {"train_loss": -24.598581314086914, "global_step": 246903, "epoch": 2974} {"train_loss": -24.381071090698242, "global_step": 246904, "epoch": 2974} {"train_loss": -24.80872917175293, "global_step": 246905, "epoch": 2974} {"train_loss": -24.671064376831055, "global_step": 246906, "epoch": 2974} {"train_loss": -24.833465576171875, "global_step": 246907, "epoch": 2974} {"train_loss": -24.862890243530273, "global_step": 246908, "epoch": 2974} {"train_loss": -25.032608032226562, "global_step": 246909, "epoch": 2974} {"train_loss": -24.92152214050293, "global_step": 246910, "epoch": 2974} {"train_loss": -24.659332275390625, "global_step": 246911, "epoch": 2974} {"train_loss": -24.95313835144043, "global_step": 246912, "epoch": 2974} {"train_loss": -25.157012939453125, "global_step": 246913, "epoch": 2974} {"train_loss": -25.313215255737305, "global_step": 246914, "epoch": 2974} {"train_loss": -25.036375045776367, "global_step": 246915, "epoch": 2974} {"train_loss": -24.823339462280273, "global_step": 246916, "epoch": 2974} {"train_loss": -25.021879196166992, "global_step": 246917, "epoch": 2974} {"train_loss": -24.951692581176758, "global_step": 246918, "epoch": 2974} {"train_loss": -25.459800720214844, "global_step": 246919, "epoch": 2974} {"train_loss": -25.321380615234375, "global_step": 246920, "epoch": 2974} {"train_loss": -24.954931259155273, "global_step": 246921, "epoch": 2974} {"train_loss": -25.305688858032227, "global_step": 246922, "epoch": 2974} {"train_loss": -25.439489364624023, "global_step": 246923, "epoch": 2974} {"train_loss": -24.86175560089479, "global_step": 246924, "epoch": 2974, "val_loss": 6931533.0} {"train_loss": -25.00518798828125, "global_step": 246925, "epoch": 2975} {"train_loss": -24.657873153686523, "global_step": 246926, "epoch": 2975} {"train_loss": -24.7935733795166, "global_step": 246927, "epoch": 2975} {"train_loss": -24.64312171936035, "global_step": 246928, "epoch": 2975} {"train_loss": -25.178129196166992, "global_step": 246929, "epoch": 2975} {"train_loss": -25.402442932128906, "global_step": 246930, "epoch": 2975} {"train_loss": -24.288049697875977, "global_step": 246931, "epoch": 2975} {"train_loss": -24.89008140563965, "global_step": 246932, "epoch": 2975} {"train_loss": -24.75408363342285, "global_step": 246933, "epoch": 2975} {"train_loss": -24.789949417114258, "global_step": 246934, "epoch": 2975} {"train_loss": -24.976903915405273, "global_step": 246935, "epoch": 2975} {"train_loss": -24.94394302368164, "global_step": 246936, "epoch": 2975} {"train_loss": -24.737518310546875, "global_step": 246937, "epoch": 2975} {"train_loss": -24.837202072143555, "global_step": 246938, "epoch": 2975} {"train_loss": -24.661191940307617, "global_step": 246939, "epoch": 2975} {"train_loss": -24.4871826171875, "global_step": 246940, "epoch": 2975} {"train_loss": -24.82634925842285, "global_step": 246941, "epoch": 2975} {"train_loss": -24.737998962402344, "global_step": 246942, "epoch": 2975} {"train_loss": -25.282100677490234, "global_step": 246943, "epoch": 2975} {"train_loss": -24.95789909362793, "global_step": 246944, "epoch": 2975} {"train_loss": -24.567296981811523, "global_step": 246945, "epoch": 2975} {"train_loss": -24.599105834960938, "global_step": 246946, "epoch": 2975} {"train_loss": -24.901798248291016, "global_step": 246947, "epoch": 2975} {"train_loss": -24.83796501159668, "global_step": 246948, "epoch": 2975} {"train_loss": -25.122709274291992, "global_step": 246949, "epoch": 2975} {"train_loss": -24.93756675720215, "global_step": 246950, "epoch": 2975} {"train_loss": -24.954105377197266, "global_step": 246951, "epoch": 2975} {"train_loss": -24.741233825683594, "global_step": 246952, "epoch": 2975} {"train_loss": -24.98492431640625, "global_step": 246953, "epoch": 2975} {"train_loss": -25.010278701782227, "global_step": 246954, "epoch": 2975} {"train_loss": -25.02223014831543, "global_step": 246955, "epoch": 2975} {"train_loss": -25.238393783569336, "global_step": 246956, "epoch": 2975} {"train_loss": -24.482664108276367, "global_step": 246957, "epoch": 2975} {"train_loss": -24.598623275756836, "global_step": 246958, "epoch": 2975} {"train_loss": -25.205793380737305, "global_step": 246959, "epoch": 2975} {"train_loss": -25.21229362487793, "global_step": 246960, "epoch": 2975} {"train_loss": -25.089462280273438, "global_step": 246961, "epoch": 2975} {"train_loss": -25.383228302001953, "global_step": 246962, "epoch": 2975} {"train_loss": -25.119863510131836, "global_step": 246963, "epoch": 2975} {"train_loss": -25.395219802856445, "global_step": 246964, "epoch": 2975} {"train_loss": -25.093318939208984, "global_step": 246965, "epoch": 2975} {"train_loss": -24.8817195892334, "global_step": 246966, "epoch": 2975} {"train_loss": -24.966934204101562, "global_step": 246967, "epoch": 2975} {"train_loss": -25.08527946472168, "global_step": 246968, "epoch": 2975} {"train_loss": -25.018310546875, "global_step": 246969, "epoch": 2975} {"train_loss": -25.11197280883789, "global_step": 246970, "epoch": 2975} {"train_loss": -25.107425689697266, "global_step": 246971, "epoch": 2975} {"train_loss": -24.8535099029541, "global_step": 246972, "epoch": 2975} {"train_loss": -25.029449462890625, "global_step": 246973, "epoch": 2975} {"train_loss": -24.726741790771484, "global_step": 246974, "epoch": 2975} {"train_loss": -25.13453483581543, "global_step": 246975, "epoch": 2975} {"train_loss": -25.612060546875, "global_step": 246976, "epoch": 2975} {"train_loss": -25.148866653442383, "global_step": 246977, "epoch": 2975} {"train_loss": -25.08698272705078, "global_step": 246978, "epoch": 2975} {"train_loss": -25.221738815307617, "global_step": 246979, "epoch": 2975} {"train_loss": -24.971309661865234, "global_step": 246980, "epoch": 2975} {"train_loss": -25.11008071899414, "global_step": 246981, "epoch": 2975} {"train_loss": -24.827878952026367, "global_step": 246982, "epoch": 2975} {"train_loss": -25.15347671508789, "global_step": 246983, "epoch": 2975} {"train_loss": -24.87765884399414, "global_step": 246984, "epoch": 2975} {"train_loss": -25.21242332458496, "global_step": 246985, "epoch": 2975} {"train_loss": -25.139360427856445, "global_step": 246986, "epoch": 2975} {"train_loss": -24.916080474853516, "global_step": 246987, "epoch": 2975} {"train_loss": -24.958431243896484, "global_step": 246988, "epoch": 2975} {"train_loss": -25.32680320739746, "global_step": 246989, "epoch": 2975} {"train_loss": -24.726951599121094, "global_step": 246990, "epoch": 2975} {"train_loss": -25.147872924804688, "global_step": 246991, "epoch": 2975} {"train_loss": -24.88252067565918, "global_step": 246992, "epoch": 2975} {"train_loss": -24.954883575439453, "global_step": 246993, "epoch": 2975} {"train_loss": -24.99448013305664, "global_step": 246994, "epoch": 2975} {"train_loss": -24.617860794067383, "global_step": 246995, "epoch": 2975} {"train_loss": -24.879121780395508, "global_step": 246996, "epoch": 2975} {"train_loss": -24.699621200561523, "global_step": 246997, "epoch": 2975} {"train_loss": -25.08445930480957, "global_step": 246998, "epoch": 2975} {"train_loss": -25.0278263092041, "global_step": 246999, "epoch": 2975} {"train_loss": -24.84726333618164, "global_step": 247000, "epoch": 2975} {"train_loss": -24.84078025817871, "global_step": 247001, "epoch": 2975} {"train_loss": -25.06415367126465, "global_step": 247002, "epoch": 2975} {"train_loss": -24.618640899658203, "global_step": 247003, "epoch": 2975} {"train_loss": -24.841655731201172, "global_step": 247004, "epoch": 2975} {"train_loss": -25.229476928710938, "global_step": 247005, "epoch": 2975} {"train_loss": -25.108585357666016, "global_step": 247006, "epoch": 2975} {"train_loss": -24.96913289449301, "global_step": 247007, "epoch": 2975, "val_loss": 6753873.0} {"train_loss": -24.481489181518555, "global_step": 247008, "epoch": 2976} {"train_loss": -24.262277603149414, "global_step": 247009, "epoch": 2976} {"train_loss": -24.244529724121094, "global_step": 247010, "epoch": 2976} {"train_loss": -25.002023696899414, "global_step": 247011, "epoch": 2976} {"train_loss": -24.515716552734375, "global_step": 247012, "epoch": 2976} {"train_loss": -24.82477378845215, "global_step": 247013, "epoch": 2976} {"train_loss": -24.020889282226562, "global_step": 247014, "epoch": 2976} {"train_loss": -24.660629272460938, "global_step": 247015, "epoch": 2976} {"train_loss": -24.60346031188965, "global_step": 247016, "epoch": 2976} {"train_loss": -24.599210739135742, "global_step": 247017, "epoch": 2976} {"train_loss": -24.7793025970459, "global_step": 247018, "epoch": 2976} {"train_loss": -24.55777931213379, "global_step": 247019, "epoch": 2976} {"train_loss": -24.877761840820312, "global_step": 247020, "epoch": 2976} {"train_loss": -24.1711483001709, "global_step": 247021, "epoch": 2976} {"train_loss": -24.653318405151367, "global_step": 247022, "epoch": 2976} {"train_loss": -24.729333877563477, "global_step": 247023, "epoch": 2976} {"train_loss": -25.100317001342773, "global_step": 247024, "epoch": 2976} {"train_loss": -24.84006118774414, "global_step": 247025, "epoch": 2976} {"train_loss": -24.840930938720703, "global_step": 247026, "epoch": 2976} {"train_loss": -24.803647994995117, "global_step": 247027, "epoch": 2976} {"train_loss": -24.920711517333984, "global_step": 247028, "epoch": 2976} {"train_loss": -25.03135871887207, "global_step": 247029, "epoch": 2976} {"train_loss": -25.438385009765625, "global_step": 247030, "epoch": 2976} {"train_loss": -24.817596435546875, "global_step": 247031, "epoch": 2976} {"train_loss": -24.567001342773438, "global_step": 247032, "epoch": 2976} {"train_loss": -25.2905216217041, "global_step": 247033, "epoch": 2976} {"train_loss": -24.821874618530273, "global_step": 247034, "epoch": 2976} {"train_loss": -25.2142276763916, "global_step": 247035, "epoch": 2976} {"train_loss": -25.029247283935547, "global_step": 247036, "epoch": 2976} {"train_loss": -25.264551162719727, "global_step": 247037, "epoch": 2976} {"train_loss": -24.739608764648438, "global_step": 247038, "epoch": 2976} {"train_loss": -24.778085708618164, "global_step": 247039, "epoch": 2976} {"train_loss": -24.99049186706543, "global_step": 247040, "epoch": 2976} {"train_loss": -25.206985473632812, "global_step": 247041, "epoch": 2976} {"train_loss": -25.222183227539062, "global_step": 247042, "epoch": 2976} {"train_loss": -24.958953857421875, "global_step": 247043, "epoch": 2976} {"train_loss": -24.992904663085938, "global_step": 247044, "epoch": 2976} {"train_loss": -25.0964298248291, "global_step": 247045, "epoch": 2976} {"train_loss": -24.801177978515625, "global_step": 247046, "epoch": 2976} {"train_loss": -24.8662052154541, "global_step": 247047, "epoch": 2976} {"train_loss": -25.084312438964844, "global_step": 247048, "epoch": 2976} {"train_loss": -25.6557559967041, "global_step": 247049, "epoch": 2976} {"train_loss": -24.972028732299805, "global_step": 247050, "epoch": 2976} {"train_loss": -25.484769821166992, "global_step": 247051, "epoch": 2976} {"train_loss": -24.7388973236084, "global_step": 247052, "epoch": 2976} {"train_loss": -25.236051559448242, "global_step": 247053, "epoch": 2976} {"train_loss": -25.14858055114746, "global_step": 247054, "epoch": 2976} {"train_loss": -24.826213836669922, "global_step": 247055, "epoch": 2976} {"train_loss": -25.229063034057617, "global_step": 247056, "epoch": 2976} {"train_loss": -25.124839782714844, "global_step": 247057, "epoch": 2976} {"train_loss": -24.983295440673828, "global_step": 247058, "epoch": 2976} {"train_loss": -25.132612228393555, "global_step": 247059, "epoch": 2976} {"train_loss": -24.958942413330078, "global_step": 247060, "epoch": 2976} {"train_loss": -24.90372657775879, "global_step": 247061, "epoch": 2976} {"train_loss": -24.799070358276367, "global_step": 247062, "epoch": 2976} {"train_loss": -25.119239807128906, "global_step": 247063, "epoch": 2976} {"train_loss": -25.269563674926758, "global_step": 247064, "epoch": 2976} {"train_loss": -24.816307067871094, "global_step": 247065, "epoch": 2976} {"train_loss": -24.95338249206543, "global_step": 247066, "epoch": 2976} {"train_loss": -25.078754425048828, "global_step": 247067, "epoch": 2976} {"train_loss": -24.912059783935547, "global_step": 247068, "epoch": 2976} {"train_loss": -25.021081924438477, "global_step": 247069, "epoch": 2976} {"train_loss": -24.844402313232422, "global_step": 247070, "epoch": 2976} {"train_loss": -25.06260108947754, "global_step": 247071, "epoch": 2976} {"train_loss": -25.240049362182617, "global_step": 247072, "epoch": 2976} {"train_loss": -24.868364334106445, "global_step": 247073, "epoch": 2976} {"train_loss": -25.05129051208496, "global_step": 247074, "epoch": 2976} {"train_loss": -25.03627586364746, "global_step": 247075, "epoch": 2976} {"train_loss": -25.21367835998535, "global_step": 247076, "epoch": 2976} {"train_loss": -24.826093673706055, "global_step": 247077, "epoch": 2976} {"train_loss": -25.195096969604492, "global_step": 247078, "epoch": 2976} {"train_loss": -24.985645294189453, "global_step": 247079, "epoch": 2976} {"train_loss": -25.02057456970215, "global_step": 247080, "epoch": 2976} {"train_loss": -25.00340461730957, "global_step": 247081, "epoch": 2976} {"train_loss": -24.976070404052734, "global_step": 247082, "epoch": 2976} {"train_loss": -25.022113800048828, "global_step": 247083, "epoch": 2976} {"train_loss": -25.1785945892334, "global_step": 247084, "epoch": 2976} {"train_loss": -25.093891143798828, "global_step": 247085, "epoch": 2976} {"train_loss": -24.860376358032227, "global_step": 247086, "epoch": 2976} {"train_loss": -24.52399253845215, "global_step": 247087, "epoch": 2976} {"train_loss": -24.236486434936523, "global_step": 247088, "epoch": 2976} {"train_loss": -24.540027618408203, "global_step": 247089, "epoch": 2976} {"train_loss": -24.91520980467279, "global_step": 247090, "epoch": 2976, "val_loss": 6971491.0} {"train_loss": -21.606979370117188, "global_step": 247091, "epoch": 2977} {"train_loss": -24.069822311401367, "global_step": 247092, "epoch": 2977} {"train_loss": -22.569808959960938, "global_step": 247093, "epoch": 2977} {"train_loss": -23.12220573425293, "global_step": 247094, "epoch": 2977} {"train_loss": -22.25330924987793, "global_step": 247095, "epoch": 2977} {"train_loss": -24.06719970703125, "global_step": 247096, "epoch": 2977} {"train_loss": -23.116682052612305, "global_step": 247097, "epoch": 2977} {"train_loss": -23.50324821472168, "global_step": 247098, "epoch": 2977} {"train_loss": -23.818111419677734, "global_step": 247099, "epoch": 2977} {"train_loss": -23.286596298217773, "global_step": 247100, "epoch": 2977} {"train_loss": -23.10053825378418, "global_step": 247101, "epoch": 2977} {"train_loss": -23.833120346069336, "global_step": 247102, "epoch": 2977} {"train_loss": -23.592145919799805, "global_step": 247103, "epoch": 2977} {"train_loss": -23.919605255126953, "global_step": 247104, "epoch": 2977} {"train_loss": -24.21770477294922, "global_step": 247105, "epoch": 2977} {"train_loss": -24.120840072631836, "global_step": 247106, "epoch": 2977} {"train_loss": -24.270668029785156, "global_step": 247107, "epoch": 2977} {"train_loss": -23.89335823059082, "global_step": 247108, "epoch": 2977} {"train_loss": -23.831771850585938, "global_step": 247109, "epoch": 2977} {"train_loss": -23.956527709960938, "global_step": 247110, "epoch": 2977} {"train_loss": -23.95859146118164, "global_step": 247111, "epoch": 2977} {"train_loss": -24.366865158081055, "global_step": 247112, "epoch": 2977} {"train_loss": -24.18181800842285, "global_step": 247113, "epoch": 2977} {"train_loss": -24.100126266479492, "global_step": 247114, "epoch": 2977} {"train_loss": -24.442861557006836, "global_step": 247115, "epoch": 2977} {"train_loss": -24.169496536254883, "global_step": 247116, "epoch": 2977} {"train_loss": -24.605430603027344, "global_step": 247117, "epoch": 2977} {"train_loss": -24.63746452331543, "global_step": 247118, "epoch": 2977} {"train_loss": -24.380868911743164, "global_step": 247119, "epoch": 2977} {"train_loss": -24.064289093017578, "global_step": 247120, "epoch": 2977} {"train_loss": -24.048648834228516, "global_step": 247121, "epoch": 2977} {"train_loss": -24.689359664916992, "global_step": 247122, "epoch": 2977} {"train_loss": -24.263172149658203, "global_step": 247123, "epoch": 2977} {"train_loss": -24.553558349609375, "global_step": 247124, "epoch": 2977} {"train_loss": -24.687374114990234, "global_step": 247125, "epoch": 2977} {"train_loss": -24.400917053222656, "global_step": 247126, "epoch": 2977} {"train_loss": -24.709409713745117, "global_step": 247127, "epoch": 2977} {"train_loss": -24.414113998413086, "global_step": 247128, "epoch": 2977} {"train_loss": -24.67252540588379, "global_step": 247129, "epoch": 2977} {"train_loss": -24.597362518310547, "global_step": 247130, "epoch": 2977} {"train_loss": -24.601036071777344, "global_step": 247131, "epoch": 2977} {"train_loss": -24.41304588317871, "global_step": 247132, "epoch": 2977} {"train_loss": -24.832462310791016, "global_step": 247133, "epoch": 2977} {"train_loss": -24.47358512878418, "global_step": 247134, "epoch": 2977} {"train_loss": -25.040515899658203, "global_step": 247135, "epoch": 2977} {"train_loss": -24.506107330322266, "global_step": 247136, "epoch": 2977} {"train_loss": -24.288583755493164, "global_step": 247137, "epoch": 2977} {"train_loss": -24.895366668701172, "global_step": 247138, "epoch": 2977} {"train_loss": -24.764232635498047, "global_step": 247139, "epoch": 2977} {"train_loss": -25.028064727783203, "global_step": 247140, "epoch": 2977} {"train_loss": -24.70374870300293, "global_step": 247141, "epoch": 2977} {"train_loss": -24.685590744018555, "global_step": 247142, "epoch": 2977} {"train_loss": -24.934635162353516, "global_step": 247143, "epoch": 2977} {"train_loss": -25.1851749420166, "global_step": 247144, "epoch": 2977} {"train_loss": -24.80143165588379, "global_step": 247145, "epoch": 2977} {"train_loss": -25.11321258544922, "global_step": 247146, "epoch": 2977} {"train_loss": -24.810300827026367, "global_step": 247147, "epoch": 2977} {"train_loss": -24.8988037109375, "global_step": 247148, "epoch": 2977} {"train_loss": -24.78785514831543, "global_step": 247149, "epoch": 2977} {"train_loss": -25.391769409179688, "global_step": 247150, "epoch": 2977} {"train_loss": -25.015344619750977, "global_step": 247151, "epoch": 2977} {"train_loss": -25.264440536499023, "global_step": 247152, "epoch": 2977} {"train_loss": -25.004064559936523, "global_step": 247153, "epoch": 2977} {"train_loss": -24.808551788330078, "global_step": 247154, "epoch": 2977} {"train_loss": -25.290298461914062, "global_step": 247155, "epoch": 2977} {"train_loss": -24.76917839050293, "global_step": 247156, "epoch": 2977} {"train_loss": -24.941465377807617, "global_step": 247157, "epoch": 2977} {"train_loss": -24.635486602783203, "global_step": 247158, "epoch": 2977} {"train_loss": -24.816619873046875, "global_step": 247159, "epoch": 2977} {"train_loss": -24.82112693786621, "global_step": 247160, "epoch": 2977} {"train_loss": -25.225858688354492, "global_step": 247161, "epoch": 2977} {"train_loss": -24.833494186401367, "global_step": 247162, "epoch": 2977} {"train_loss": -24.742538452148438, "global_step": 247163, "epoch": 2977} {"train_loss": -25.073280334472656, "global_step": 247164, "epoch": 2977} {"train_loss": -25.041414260864258, "global_step": 247165, "epoch": 2977} {"train_loss": -25.041950225830078, "global_step": 247166, "epoch": 2977} {"train_loss": -24.966171264648438, "global_step": 247167, "epoch": 2977} {"train_loss": -25.177661895751953, "global_step": 247168, "epoch": 2977} {"train_loss": -24.92143440246582, "global_step": 247169, "epoch": 2977} {"train_loss": -24.666105270385742, "global_step": 247170, "epoch": 2977} {"train_loss": -24.773033142089844, "global_step": 247171, "epoch": 2977} {"train_loss": -24.786489486694336, "global_step": 247172, "epoch": 2977} {"train_loss": -24.431439066507732, "global_step": 247173, "epoch": 2977, "val_loss": 6895696.0} {"train_loss": -24.751604080200195, "global_step": 247174, "epoch": 2978} {"train_loss": -24.568952560424805, "global_step": 247175, "epoch": 2978} {"train_loss": -24.780925750732422, "global_step": 247176, "epoch": 2978} {"train_loss": -24.459272384643555, "global_step": 247177, "epoch": 2978} {"train_loss": -24.44888687133789, "global_step": 247178, "epoch": 2978} {"train_loss": -24.666654586791992, "global_step": 247179, "epoch": 2978} {"train_loss": -24.637710571289062, "global_step": 247180, "epoch": 2978} {"train_loss": -24.995527267456055, "global_step": 247181, "epoch": 2978} {"train_loss": -24.82672882080078, "global_step": 247182, "epoch": 2978} {"train_loss": -24.604066848754883, "global_step": 247183, "epoch": 2978} {"train_loss": -24.50843620300293, "global_step": 247184, "epoch": 2978} {"train_loss": -24.77320671081543, "global_step": 247185, "epoch": 2978} {"train_loss": -24.92241859436035, "global_step": 247186, "epoch": 2978} {"train_loss": -25.100942611694336, "global_step": 247187, "epoch": 2978} {"train_loss": -25.106576919555664, "global_step": 247188, "epoch": 2978} {"train_loss": -24.51877784729004, "global_step": 247189, "epoch": 2978} {"train_loss": -24.862125396728516, "global_step": 247190, "epoch": 2978} {"train_loss": -24.805089950561523, "global_step": 247191, "epoch": 2978} {"train_loss": -24.508804321289062, "global_step": 247192, "epoch": 2978} {"train_loss": -24.88581657409668, "global_step": 247193, "epoch": 2978} {"train_loss": -24.656940460205078, "global_step": 247194, "epoch": 2978} {"train_loss": -24.631210327148438, "global_step": 247195, "epoch": 2978} {"train_loss": -24.934762954711914, "global_step": 247196, "epoch": 2978} {"train_loss": -24.91290283203125, "global_step": 247197, "epoch": 2978} {"train_loss": -25.166738510131836, "global_step": 247198, "epoch": 2978} {"train_loss": -24.71900749206543, "global_step": 247199, "epoch": 2978} {"train_loss": -25.17262840270996, "global_step": 247200, "epoch": 2978} {"train_loss": -25.06002426147461, "global_step": 247201, "epoch": 2978} {"train_loss": -25.020748138427734, "global_step": 247202, "epoch": 2978} {"train_loss": -24.862499237060547, "global_step": 247203, "epoch": 2978} {"train_loss": -25.025516510009766, "global_step": 247204, "epoch": 2978} {"train_loss": -24.94911003112793, "global_step": 247205, "epoch": 2978} {"train_loss": -25.179203033447266, "global_step": 247206, "epoch": 2978} {"train_loss": -24.84517478942871, "global_step": 247207, "epoch": 2978} {"train_loss": -25.142736434936523, "global_step": 247208, "epoch": 2978} {"train_loss": -24.601749420166016, "global_step": 247209, "epoch": 2978} {"train_loss": -25.14112091064453, "global_step": 247210, "epoch": 2978} {"train_loss": -24.953638076782227, "global_step": 247211, "epoch": 2978} {"train_loss": -24.91006851196289, "global_step": 247212, "epoch": 2978} {"train_loss": -25.115171432495117, "global_step": 247213, "epoch": 2978} {"train_loss": -24.99031639099121, "global_step": 247214, "epoch": 2978} {"train_loss": -24.896621704101562, "global_step": 247215, "epoch": 2978} {"train_loss": -24.8756046295166, "global_step": 247216, "epoch": 2978} {"train_loss": -24.729110717773438, "global_step": 247217, "epoch": 2978} {"train_loss": -25.142576217651367, "global_step": 247218, "epoch": 2978} {"train_loss": -25.077978134155273, "global_step": 247219, "epoch": 2978} {"train_loss": -24.66305923461914, "global_step": 247220, "epoch": 2978} {"train_loss": -25.124046325683594, "global_step": 247221, "epoch": 2978} {"train_loss": -25.39715576171875, "global_step": 247222, "epoch": 2978} {"train_loss": -24.861818313598633, "global_step": 247223, "epoch": 2978} {"train_loss": -24.967193603515625, "global_step": 247224, "epoch": 2978} {"train_loss": -25.103153228759766, "global_step": 247225, "epoch": 2978} {"train_loss": -24.740896224975586, "global_step": 247226, "epoch": 2978} {"train_loss": -25.43364906311035, "global_step": 247227, "epoch": 2978} {"train_loss": -25.172943115234375, "global_step": 247228, "epoch": 2978} {"train_loss": -24.738000869750977, "global_step": 247229, "epoch": 2978} {"train_loss": -25.29851531982422, "global_step": 247230, "epoch": 2978} {"train_loss": -25.289838790893555, "global_step": 247231, "epoch": 2978} {"train_loss": -25.335004806518555, "global_step": 247232, "epoch": 2978} {"train_loss": -25.08579444885254, "global_step": 247233, "epoch": 2978} {"train_loss": -25.134904861450195, "global_step": 247234, "epoch": 2978} {"train_loss": -25.206174850463867, "global_step": 247235, "epoch": 2978} {"train_loss": -24.918842315673828, "global_step": 247236, "epoch": 2978} {"train_loss": -24.891042709350586, "global_step": 247237, "epoch": 2978} {"train_loss": -25.24518585205078, "global_step": 247238, "epoch": 2978} {"train_loss": -24.980440139770508, "global_step": 247239, "epoch": 2978} {"train_loss": -25.028711318969727, "global_step": 247240, "epoch": 2978} {"train_loss": -25.124422073364258, "global_step": 247241, "epoch": 2978} {"train_loss": -25.246768951416016, "global_step": 247242, "epoch": 2978} {"train_loss": -25.06634521484375, "global_step": 247243, "epoch": 2978} {"train_loss": -24.806516647338867, "global_step": 247244, "epoch": 2978} {"train_loss": -24.788795471191406, "global_step": 247245, "epoch": 2978} {"train_loss": -24.884654998779297, "global_step": 247246, "epoch": 2978} {"train_loss": -24.578784942626953, "global_step": 247247, "epoch": 2978} {"train_loss": -25.066120147705078, "global_step": 247248, "epoch": 2978} {"train_loss": -24.846527099609375, "global_step": 247249, "epoch": 2978} {"train_loss": -24.788602828979492, "global_step": 247250, "epoch": 2978} {"train_loss": -25.20086669921875, "global_step": 247251, "epoch": 2978} {"train_loss": -25.017499923706055, "global_step": 247252, "epoch": 2978} {"train_loss": -24.691272735595703, "global_step": 247253, "epoch": 2978} {"train_loss": -25.009672164916992, "global_step": 247254, "epoch": 2978} {"train_loss": -25.121572494506836, "global_step": 247255, "epoch": 2978} {"train_loss": -24.926002548401613, "global_step": 247256, "epoch": 2978, "val_loss": 6789093.0} {"train_loss": -24.97499656677246, "global_step": 247257, "epoch": 2979} {"train_loss": -24.516136169433594, "global_step": 247258, "epoch": 2979} {"train_loss": -24.902265548706055, "global_step": 247259, "epoch": 2979} {"train_loss": -24.65944480895996, "global_step": 247260, "epoch": 2979} {"train_loss": -24.590667724609375, "global_step": 247261, "epoch": 2979} {"train_loss": -24.425058364868164, "global_step": 247262, "epoch": 2979} {"train_loss": -24.54656410217285, "global_step": 247263, "epoch": 2979} {"train_loss": -24.57704734802246, "global_step": 247264, "epoch": 2979} {"train_loss": -24.925609588623047, "global_step": 247265, "epoch": 2979} {"train_loss": -24.941564559936523, "global_step": 247266, "epoch": 2979} {"train_loss": -25.043842315673828, "global_step": 247267, "epoch": 2979} {"train_loss": -24.965778350830078, "global_step": 247268, "epoch": 2979} {"train_loss": -25.21507453918457, "global_step": 247269, "epoch": 2979} {"train_loss": -24.816089630126953, "global_step": 247270, "epoch": 2979} {"train_loss": -25.020008087158203, "global_step": 247271, "epoch": 2979} {"train_loss": -24.759855270385742, "global_step": 247272, "epoch": 2979} {"train_loss": -24.706335067749023, "global_step": 247273, "epoch": 2979} {"train_loss": -24.811193466186523, "global_step": 247274, "epoch": 2979} {"train_loss": -25.291610717773438, "global_step": 247275, "epoch": 2979} {"train_loss": -24.99532127380371, "global_step": 247276, "epoch": 2979} {"train_loss": -24.955745697021484, "global_step": 247277, "epoch": 2979} {"train_loss": -25.024423599243164, "global_step": 247278, "epoch": 2979} {"train_loss": -25.2724609375, "global_step": 247279, "epoch": 2979} {"train_loss": -24.741443634033203, "global_step": 247280, "epoch": 2979} {"train_loss": -25.359710693359375, "global_step": 247281, "epoch": 2979} {"train_loss": -25.03722381591797, "global_step": 247282, "epoch": 2979} {"train_loss": -24.925785064697266, "global_step": 247283, "epoch": 2979} {"train_loss": -24.825355529785156, "global_step": 247284, "epoch": 2979} {"train_loss": -25.162858963012695, "global_step": 247285, "epoch": 2979} {"train_loss": -24.824268341064453, "global_step": 247286, "epoch": 2979} {"train_loss": -24.764705657958984, "global_step": 247287, "epoch": 2979} {"train_loss": -25.165924072265625, "global_step": 247288, "epoch": 2979} {"train_loss": -25.424535751342773, "global_step": 247289, "epoch": 2979} {"train_loss": -25.156274795532227, "global_step": 247290, "epoch": 2979} {"train_loss": -25.23099708557129, "global_step": 247291, "epoch": 2979} {"train_loss": -25.196969985961914, "global_step": 247292, "epoch": 2979} {"train_loss": -24.933204650878906, "global_step": 247293, "epoch": 2979} {"train_loss": -25.399085998535156, "global_step": 247294, "epoch": 2979} {"train_loss": -24.816408157348633, "global_step": 247295, "epoch": 2979} {"train_loss": -24.957748413085938, "global_step": 247296, "epoch": 2979} {"train_loss": -24.94573974609375, "global_step": 247297, "epoch": 2979} {"train_loss": -25.367027282714844, "global_step": 247298, "epoch": 2979} {"train_loss": -24.70302391052246, "global_step": 247299, "epoch": 2979} {"train_loss": -24.401853561401367, "global_step": 247300, "epoch": 2979} {"train_loss": -24.76605796813965, "global_step": 247301, "epoch": 2979} {"train_loss": -25.323551177978516, "global_step": 247302, "epoch": 2979} {"train_loss": -25.072959899902344, "global_step": 247303, "epoch": 2979} {"train_loss": -24.853384017944336, "global_step": 247304, "epoch": 2979} {"train_loss": -25.363832473754883, "global_step": 247305, "epoch": 2979} {"train_loss": -24.98674964904785, "global_step": 247306, "epoch": 2979} {"train_loss": -25.007221221923828, "global_step": 247307, "epoch": 2979} {"train_loss": -25.326940536499023, "global_step": 247308, "epoch": 2979} {"train_loss": -24.76926040649414, "global_step": 247309, "epoch": 2979} {"train_loss": -24.986595153808594, "global_step": 247310, "epoch": 2979} {"train_loss": -25.045522689819336, "global_step": 247311, "epoch": 2979} {"train_loss": -24.378271102905273, "global_step": 247312, "epoch": 2979} {"train_loss": -25.079912185668945, "global_step": 247313, "epoch": 2979} {"train_loss": -24.871824264526367, "global_step": 247314, "epoch": 2979} {"train_loss": -25.223400115966797, "global_step": 247315, "epoch": 2979} {"train_loss": -24.941028594970703, "global_step": 247316, "epoch": 2979} {"train_loss": -24.869230270385742, "global_step": 247317, "epoch": 2979} {"train_loss": -24.95734214782715, "global_step": 247318, "epoch": 2979} {"train_loss": -25.312305450439453, "global_step": 247319, "epoch": 2979} {"train_loss": -24.780902862548828, "global_step": 247320, "epoch": 2979} {"train_loss": -24.93475914001465, "global_step": 247321, "epoch": 2979} {"train_loss": -25.254858016967773, "global_step": 247322, "epoch": 2979} {"train_loss": -25.088150024414062, "global_step": 247323, "epoch": 2979} {"train_loss": -24.808605194091797, "global_step": 247324, "epoch": 2979} {"train_loss": -25.056203842163086, "global_step": 247325, "epoch": 2979} {"train_loss": -24.80249786376953, "global_step": 247326, "epoch": 2979} {"train_loss": -24.828205108642578, "global_step": 247327, "epoch": 2979} {"train_loss": -25.333126068115234, "global_step": 247328, "epoch": 2979} {"train_loss": -24.96424674987793, "global_step": 247329, "epoch": 2979} {"train_loss": -25.0230770111084, "global_step": 247330, "epoch": 2979} {"train_loss": -24.886655807495117, "global_step": 247331, "epoch": 2979} {"train_loss": -25.115610122680664, "global_step": 247332, "epoch": 2979} {"train_loss": -25.30678367614746, "global_step": 247333, "epoch": 2979} {"train_loss": -25.141813278198242, "global_step": 247334, "epoch": 2979} {"train_loss": -24.922443389892578, "global_step": 247335, "epoch": 2979} {"train_loss": -25.16636848449707, "global_step": 247336, "epoch": 2979} {"train_loss": -25.163721084594727, "global_step": 247337, "epoch": 2979} {"train_loss": -24.876188278198242, "global_step": 247338, "epoch": 2979} {"train_loss": -24.97697984166892, "global_step": 247339, "epoch": 2979, "val_loss": 6815291.5} {"train_loss": -25.06386375427246, "global_step": 247340, "epoch": 2980} {"train_loss": -24.889753341674805, "global_step": 247341, "epoch": 2980} {"train_loss": -24.90270233154297, "global_step": 247342, "epoch": 2980} {"train_loss": -24.631988525390625, "global_step": 247343, "epoch": 2980} {"train_loss": -24.497846603393555, "global_step": 247344, "epoch": 2980} {"train_loss": -25.013141632080078, "global_step": 247345, "epoch": 2980} {"train_loss": -24.46997833251953, "global_step": 247346, "epoch": 2980} {"train_loss": -24.95884132385254, "global_step": 247347, "epoch": 2980} {"train_loss": -24.99319839477539, "global_step": 247348, "epoch": 2980} {"train_loss": -24.677278518676758, "global_step": 247349, "epoch": 2980} {"train_loss": -24.764501571655273, "global_step": 247350, "epoch": 2980} {"train_loss": -24.86147117614746, "global_step": 247351, "epoch": 2980} {"train_loss": -24.539487838745117, "global_step": 247352, "epoch": 2980} {"train_loss": -24.772592544555664, "global_step": 247353, "epoch": 2980} {"train_loss": -24.9193058013916, "global_step": 247354, "epoch": 2980} {"train_loss": -25.140125274658203, "global_step": 247355, "epoch": 2980} {"train_loss": -25.038040161132812, "global_step": 247356, "epoch": 2980} {"train_loss": -25.14524269104004, "global_step": 247357, "epoch": 2980} {"train_loss": -24.884750366210938, "global_step": 247358, "epoch": 2980} {"train_loss": -24.6029109954834, "global_step": 247359, "epoch": 2980} {"train_loss": -24.892929077148438, "global_step": 247360, "epoch": 2980} {"train_loss": -24.968759536743164, "global_step": 247361, "epoch": 2980} {"train_loss": -24.841575622558594, "global_step": 247362, "epoch": 2980} {"train_loss": -24.97120475769043, "global_step": 247363, "epoch": 2980} {"train_loss": -25.2511043548584, "global_step": 247364, "epoch": 2980} {"train_loss": -24.840763092041016, "global_step": 247365, "epoch": 2980} {"train_loss": -25.14869499206543, "global_step": 247366, "epoch": 2980} {"train_loss": -25.21405029296875, "global_step": 247367, "epoch": 2980} {"train_loss": -24.923831939697266, "global_step": 247368, "epoch": 2980} {"train_loss": -25.443716049194336, "global_step": 247369, "epoch": 2980} {"train_loss": -24.732349395751953, "global_step": 247370, "epoch": 2980} {"train_loss": -24.667465209960938, "global_step": 247371, "epoch": 2980} {"train_loss": -25.033533096313477, "global_step": 247372, "epoch": 2980} {"train_loss": -24.870458602905273, "global_step": 247373, "epoch": 2980} {"train_loss": -25.100698471069336, "global_step": 247374, "epoch": 2980} {"train_loss": -24.691669464111328, "global_step": 247375, "epoch": 2980} {"train_loss": -25.2221622467041, "global_step": 247376, "epoch": 2980} {"train_loss": -25.03646469116211, "global_step": 247377, "epoch": 2980} {"train_loss": -25.376920700073242, "global_step": 247378, "epoch": 2980} {"train_loss": -25.069473266601562, "global_step": 247379, "epoch": 2980} {"train_loss": -24.676610946655273, "global_step": 247380, "epoch": 2980} {"train_loss": -24.729042053222656, "global_step": 247381, "epoch": 2980} {"train_loss": -25.173995971679688, "global_step": 247382, "epoch": 2980} {"train_loss": -24.667646408081055, "global_step": 247383, "epoch": 2980} {"train_loss": -24.921588897705078, "global_step": 247384, "epoch": 2980} {"train_loss": -24.739667892456055, "global_step": 247385, "epoch": 2980} {"train_loss": -25.13514518737793, "global_step": 247386, "epoch": 2980} {"train_loss": -25.05621910095215, "global_step": 247387, "epoch": 2980} {"train_loss": -24.60666847229004, "global_step": 247388, "epoch": 2980} {"train_loss": -25.07293128967285, "global_step": 247389, "epoch": 2980} {"train_loss": -25.031736373901367, "global_step": 247390, "epoch": 2980} {"train_loss": -25.286996841430664, "global_step": 247391, "epoch": 2980} {"train_loss": -24.977771759033203, "global_step": 247392, "epoch": 2980} {"train_loss": -24.861989974975586, "global_step": 247393, "epoch": 2980} {"train_loss": -25.123746871948242, "global_step": 247394, "epoch": 2980} {"train_loss": -24.975801467895508, "global_step": 247395, "epoch": 2980} {"train_loss": -25.077314376831055, "global_step": 247396, "epoch": 2980} {"train_loss": -24.65105628967285, "global_step": 247397, "epoch": 2980} {"train_loss": -23.592954635620117, "global_step": 247398, "epoch": 2980} {"train_loss": -23.78653335571289, "global_step": 247399, "epoch": 2980} {"train_loss": -24.404598236083984, "global_step": 247400, "epoch": 2980} {"train_loss": -24.920217514038086, "global_step": 247401, "epoch": 2980} {"train_loss": -24.395095825195312, "global_step": 247402, "epoch": 2980} {"train_loss": -24.569440841674805, "global_step": 247403, "epoch": 2980} {"train_loss": -24.750289916992188, "global_step": 247404, "epoch": 2980} {"train_loss": -24.76396369934082, "global_step": 247405, "epoch": 2980} {"train_loss": -24.69809341430664, "global_step": 247406, "epoch": 2980} {"train_loss": -24.81732749938965, "global_step": 247407, "epoch": 2980} {"train_loss": -24.847076416015625, "global_step": 247408, "epoch": 2980} {"train_loss": -24.650005340576172, "global_step": 247409, "epoch": 2980} {"train_loss": -24.577383041381836, "global_step": 247410, "epoch": 2980} {"train_loss": -24.66132926940918, "global_step": 247411, "epoch": 2980} {"train_loss": -24.839704513549805, "global_step": 247412, "epoch": 2980} {"train_loss": -24.81069564819336, "global_step": 247413, "epoch": 2980} {"train_loss": -25.1324462890625, "global_step": 247414, "epoch": 2980} {"train_loss": -24.657041549682617, "global_step": 247415, "epoch": 2980} {"train_loss": -25.248517990112305, "global_step": 247416, "epoch": 2980} {"train_loss": -24.99937629699707, "global_step": 247417, "epoch": 2980} {"train_loss": -25.014734268188477, "global_step": 247418, "epoch": 2980} {"train_loss": -24.765274047851562, "global_step": 247419, "epoch": 2980} {"train_loss": -25.052867889404297, "global_step": 247420, "epoch": 2980} {"train_loss": -25.12787437438965, "global_step": 247421, "epoch": 2980} {"train_loss": -24.88084832156997, "global_step": 247422, "epoch": 2980, "val_loss": 6975006.0} {"train_loss": -24.32588005065918, "global_step": 247423, "epoch": 2981} {"train_loss": -24.85088539123535, "global_step": 247424, "epoch": 2981} {"train_loss": -24.507421493530273, "global_step": 247425, "epoch": 2981} {"train_loss": -24.548620223999023, "global_step": 247426, "epoch": 2981} {"train_loss": -24.41575813293457, "global_step": 247427, "epoch": 2981} {"train_loss": -24.401193618774414, "global_step": 247428, "epoch": 2981} {"train_loss": -24.53616714477539, "global_step": 247429, "epoch": 2981} {"train_loss": -24.80409812927246, "global_step": 247430, "epoch": 2981} {"train_loss": -25.06290054321289, "global_step": 247431, "epoch": 2981} {"train_loss": -24.675790786743164, "global_step": 247432, "epoch": 2981} {"train_loss": -24.69036293029785, "global_step": 247433, "epoch": 2981} {"train_loss": -24.85322380065918, "global_step": 247434, "epoch": 2981} {"train_loss": -24.5799560546875, "global_step": 247435, "epoch": 2981} {"train_loss": -24.462467193603516, "global_step": 247436, "epoch": 2981} {"train_loss": -24.9724178314209, "global_step": 247437, "epoch": 2981} {"train_loss": -24.72480583190918, "global_step": 247438, "epoch": 2981} {"train_loss": -24.899803161621094, "global_step": 247439, "epoch": 2981} {"train_loss": -24.830184936523438, "global_step": 247440, "epoch": 2981} {"train_loss": -24.807851791381836, "global_step": 247441, "epoch": 2981} {"train_loss": -25.116207122802734, "global_step": 247442, "epoch": 2981} {"train_loss": -24.971054077148438, "global_step": 247443, "epoch": 2981} {"train_loss": -24.838077545166016, "global_step": 247444, "epoch": 2981} {"train_loss": -25.18480110168457, "global_step": 247445, "epoch": 2981} {"train_loss": -25.05537986755371, "global_step": 247446, "epoch": 2981} {"train_loss": -25.127817153930664, "global_step": 247447, "epoch": 2981} {"train_loss": -24.902456283569336, "global_step": 247448, "epoch": 2981} {"train_loss": -24.9957218170166, "global_step": 247449, "epoch": 2981} {"train_loss": -24.96478843688965, "global_step": 247450, "epoch": 2981} {"train_loss": -25.29713249206543, "global_step": 247451, "epoch": 2981} {"train_loss": -24.931350708007812, "global_step": 247452, "epoch": 2981} {"train_loss": -25.031452178955078, "global_step": 247453, "epoch": 2981} {"train_loss": -25.000308990478516, "global_step": 247454, "epoch": 2981} {"train_loss": -25.22626304626465, "global_step": 247455, "epoch": 2981} {"train_loss": -25.200122833251953, "global_step": 247456, "epoch": 2981} {"train_loss": -25.034284591674805, "global_step": 247457, "epoch": 2981} {"train_loss": -24.868091583251953, "global_step": 247458, "epoch": 2981} {"train_loss": -24.882389068603516, "global_step": 247459, "epoch": 2981} {"train_loss": -25.1536808013916, "global_step": 247460, "epoch": 2981} {"train_loss": -25.302677154541016, "global_step": 247461, "epoch": 2981} {"train_loss": -25.367353439331055, "global_step": 247462, "epoch": 2981} {"train_loss": -24.97336769104004, "global_step": 247463, "epoch": 2981} {"train_loss": -25.282344818115234, "global_step": 247464, "epoch": 2981} {"train_loss": -25.662460327148438, "global_step": 247465, "epoch": 2981} {"train_loss": -25.131916046142578, "global_step": 247466, "epoch": 2981} {"train_loss": -25.118017196655273, "global_step": 247467, "epoch": 2981} {"train_loss": -24.756765365600586, "global_step": 247468, "epoch": 2981} {"train_loss": -25.162723541259766, "global_step": 247469, "epoch": 2981} {"train_loss": -25.260822296142578, "global_step": 247470, "epoch": 2981} {"train_loss": -24.97576332092285, "global_step": 247471, "epoch": 2981} {"train_loss": -24.917600631713867, "global_step": 247472, "epoch": 2981} {"train_loss": -24.827062606811523, "global_step": 247473, "epoch": 2981} {"train_loss": -24.886642456054688, "global_step": 247474, "epoch": 2981} {"train_loss": -24.764896392822266, "global_step": 247475, "epoch": 2981} {"train_loss": -25.05453109741211, "global_step": 247476, "epoch": 2981} {"train_loss": -24.471437454223633, "global_step": 247477, "epoch": 2981} {"train_loss": -24.908559799194336, "global_step": 247478, "epoch": 2981} {"train_loss": -24.98792839050293, "global_step": 247479, "epoch": 2981} {"train_loss": -24.900190353393555, "global_step": 247480, "epoch": 2981} {"train_loss": -25.28928565979004, "global_step": 247481, "epoch": 2981} {"train_loss": -24.880590438842773, "global_step": 247482, "epoch": 2981} {"train_loss": -24.77191162109375, "global_step": 247483, "epoch": 2981} {"train_loss": -24.879064559936523, "global_step": 247484, "epoch": 2981} {"train_loss": -24.922346115112305, "global_step": 247485, "epoch": 2981} {"train_loss": -25.21147918701172, "global_step": 247486, "epoch": 2981} {"train_loss": -24.54922866821289, "global_step": 247487, "epoch": 2981} {"train_loss": -25.115259170532227, "global_step": 247488, "epoch": 2981} {"train_loss": -24.905675888061523, "global_step": 247489, "epoch": 2981} {"train_loss": -24.894906997680664, "global_step": 247490, "epoch": 2981} {"train_loss": -25.235647201538086, "global_step": 247491, "epoch": 2981} {"train_loss": -24.719511032104492, "global_step": 247492, "epoch": 2981} {"train_loss": -25.101652145385742, "global_step": 247493, "epoch": 2981} {"train_loss": -24.836477279663086, "global_step": 247494, "epoch": 2981} {"train_loss": -25.07660484313965, "global_step": 247495, "epoch": 2981} {"train_loss": -24.870328903198242, "global_step": 247496, "epoch": 2981} {"train_loss": -24.913005828857422, "global_step": 247497, "epoch": 2981} {"train_loss": -25.592573165893555, "global_step": 247498, "epoch": 2981} {"train_loss": -24.699796676635742, "global_step": 247499, "epoch": 2981} {"train_loss": -25.2785701751709, "global_step": 247500, "epoch": 2981} {"train_loss": -25.21568489074707, "global_step": 247501, "epoch": 2981} {"train_loss": -24.95622444152832, "global_step": 247502, "epoch": 2981} {"train_loss": -24.636194229125977, "global_step": 247503, "epoch": 2981} {"train_loss": -25.104276657104492, "global_step": 247504, "epoch": 2981} {"train_loss": -24.934347566351832, "global_step": 247505, "epoch": 2981, "val_loss": 6754038.0} {"train_loss": -24.6154842376709, "global_step": 247506, "epoch": 2982} {"train_loss": -24.37086296081543, "global_step": 247507, "epoch": 2982} {"train_loss": -25.10951805114746, "global_step": 247508, "epoch": 2982} {"train_loss": -24.91634750366211, "global_step": 247509, "epoch": 2982} {"train_loss": -24.279611587524414, "global_step": 247510, "epoch": 2982} {"train_loss": -24.660512924194336, "global_step": 247511, "epoch": 2982} {"train_loss": -24.524673461914062, "global_step": 247512, "epoch": 2982} {"train_loss": -24.712621688842773, "global_step": 247513, "epoch": 2982} {"train_loss": -25.008840560913086, "global_step": 247514, "epoch": 2982} {"train_loss": -25.033517837524414, "global_step": 247515, "epoch": 2982} {"train_loss": -24.496139526367188, "global_step": 247516, "epoch": 2982} {"train_loss": -25.30126953125, "global_step": 247517, "epoch": 2982} {"train_loss": -24.908031463623047, "global_step": 247518, "epoch": 2982} {"train_loss": -24.810091018676758, "global_step": 247519, "epoch": 2982} {"train_loss": -24.79581642150879, "global_step": 247520, "epoch": 2982} {"train_loss": -24.841638565063477, "global_step": 247521, "epoch": 2982} {"train_loss": -24.9726505279541, "global_step": 247522, "epoch": 2982} {"train_loss": -24.904993057250977, "global_step": 247523, "epoch": 2982} {"train_loss": -24.659563064575195, "global_step": 247524, "epoch": 2982} {"train_loss": -24.89352035522461, "global_step": 247525, "epoch": 2982} {"train_loss": -24.727920532226562, "global_step": 247526, "epoch": 2982} {"train_loss": -24.92458152770996, "global_step": 247527, "epoch": 2982} {"train_loss": -25.036367416381836, "global_step": 247528, "epoch": 2982} {"train_loss": -25.421722412109375, "global_step": 247529, "epoch": 2982} {"train_loss": -24.56551170349121, "global_step": 247530, "epoch": 2982} {"train_loss": -24.861820220947266, "global_step": 247531, "epoch": 2982} {"train_loss": -24.85481834411621, "global_step": 247532, "epoch": 2982} {"train_loss": -24.925586700439453, "global_step": 247533, "epoch": 2982} {"train_loss": -24.673458099365234, "global_step": 247534, "epoch": 2982} {"train_loss": -25.20205307006836, "global_step": 247535, "epoch": 2982} {"train_loss": -24.660964965820312, "global_step": 247536, "epoch": 2982} {"train_loss": -25.019784927368164, "global_step": 247537, "epoch": 2982} {"train_loss": -24.620899200439453, "global_step": 247538, "epoch": 2982} {"train_loss": -24.98237419128418, "global_step": 247539, "epoch": 2982} {"train_loss": -25.07489013671875, "global_step": 247540, "epoch": 2982} {"train_loss": -25.012935638427734, "global_step": 247541, "epoch": 2982} {"train_loss": -24.94577407836914, "global_step": 247542, "epoch": 2982} {"train_loss": -24.823871612548828, "global_step": 247543, "epoch": 2982} {"train_loss": -25.140012741088867, "global_step": 247544, "epoch": 2982} {"train_loss": -24.738126754760742, "global_step": 247545, "epoch": 2982} {"train_loss": -24.74007225036621, "global_step": 247546, "epoch": 2982} {"train_loss": -25.018598556518555, "global_step": 247547, "epoch": 2982} {"train_loss": -24.909101486206055, "global_step": 247548, "epoch": 2982} {"train_loss": -25.265594482421875, "global_step": 247549, "epoch": 2982} {"train_loss": -24.974458694458008, "global_step": 247550, "epoch": 2982} {"train_loss": -24.828771591186523, "global_step": 247551, "epoch": 2982} {"train_loss": -24.948406219482422, "global_step": 247552, "epoch": 2982} {"train_loss": -24.943729400634766, "global_step": 247553, "epoch": 2982} {"train_loss": -24.796186447143555, "global_step": 247554, "epoch": 2982} {"train_loss": -24.372217178344727, "global_step": 247555, "epoch": 2982} {"train_loss": -24.924179077148438, "global_step": 247556, "epoch": 2982} {"train_loss": -25.157384872436523, "global_step": 247557, "epoch": 2982} {"train_loss": -25.003665924072266, "global_step": 247558, "epoch": 2982} {"train_loss": -25.2453556060791, "global_step": 247559, "epoch": 2982} {"train_loss": -24.957178115844727, "global_step": 247560, "epoch": 2982} {"train_loss": -24.80374526977539, "global_step": 247561, "epoch": 2982} {"train_loss": -25.064544677734375, "global_step": 247562, "epoch": 2982} {"train_loss": -25.072229385375977, "global_step": 247563, "epoch": 2982} {"train_loss": -24.36601448059082, "global_step": 247564, "epoch": 2982} {"train_loss": -25.2918758392334, "global_step": 247565, "epoch": 2982} {"train_loss": -24.703840255737305, "global_step": 247566, "epoch": 2982} {"train_loss": -24.639427185058594, "global_step": 247567, "epoch": 2982} {"train_loss": -24.603479385375977, "global_step": 247568, "epoch": 2982} {"train_loss": -25.13620376586914, "global_step": 247569, "epoch": 2982} {"train_loss": -24.7788143157959, "global_step": 247570, "epoch": 2982} {"train_loss": -25.03537368774414, "global_step": 247571, "epoch": 2982} {"train_loss": -25.158544540405273, "global_step": 247572, "epoch": 2982} {"train_loss": -24.98310661315918, "global_step": 247573, "epoch": 2982} {"train_loss": -24.889219284057617, "global_step": 247574, "epoch": 2982} {"train_loss": -25.193557739257812, "global_step": 247575, "epoch": 2982} {"train_loss": -24.959579467773438, "global_step": 247576, "epoch": 2982} {"train_loss": -25.301136016845703, "global_step": 247577, "epoch": 2982} {"train_loss": -24.630428314208984, "global_step": 247578, "epoch": 2982} {"train_loss": -25.061506271362305, "global_step": 247579, "epoch": 2982} {"train_loss": -25.164291381835938, "global_step": 247580, "epoch": 2982} {"train_loss": -25.583534240722656, "global_step": 247581, "epoch": 2982} {"train_loss": -24.694366455078125, "global_step": 247582, "epoch": 2982} {"train_loss": -24.85416603088379, "global_step": 247583, "epoch": 2982} {"train_loss": -25.137344360351562, "global_step": 247584, "epoch": 2982} {"train_loss": -25.124332427978516, "global_step": 247585, "epoch": 2982} {"train_loss": -25.2199764251709, "global_step": 247586, "epoch": 2982} {"train_loss": -25.401092529296875, "global_step": 247587, "epoch": 2982} {"train_loss": -24.913496591958655, "global_step": 247588, "epoch": 2982, "val_loss": 6819986.0} {"train_loss": -24.97606658935547, "global_step": 247589, "epoch": 2983} {"train_loss": -24.85675048828125, "global_step": 247590, "epoch": 2983} {"train_loss": -25.049718856811523, "global_step": 247591, "epoch": 2983} {"train_loss": -24.965246200561523, "global_step": 247592, "epoch": 2983} {"train_loss": -24.893280029296875, "global_step": 247593, "epoch": 2983} {"train_loss": -25.13068962097168, "global_step": 247594, "epoch": 2983} {"train_loss": -24.915485382080078, "global_step": 247595, "epoch": 2983} {"train_loss": -24.853174209594727, "global_step": 247596, "epoch": 2983} {"train_loss": -24.956357955932617, "global_step": 247597, "epoch": 2983} {"train_loss": -24.984548568725586, "global_step": 247598, "epoch": 2983} {"train_loss": -25.14397621154785, "global_step": 247599, "epoch": 2983} {"train_loss": -24.967878341674805, "global_step": 247600, "epoch": 2983} {"train_loss": -24.968442916870117, "global_step": 247601, "epoch": 2983} {"train_loss": -24.76631736755371, "global_step": 247602, "epoch": 2983} {"train_loss": -25.032550811767578, "global_step": 247603, "epoch": 2983} {"train_loss": -25.022205352783203, "global_step": 247604, "epoch": 2983} {"train_loss": -25.159936904907227, "global_step": 247605, "epoch": 2983} {"train_loss": -25.14491081237793, "global_step": 247606, "epoch": 2983} {"train_loss": -25.01658058166504, "global_step": 247607, "epoch": 2983} {"train_loss": -24.980731964111328, "global_step": 247608, "epoch": 2983} {"train_loss": -24.941781997680664, "global_step": 247609, "epoch": 2983} {"train_loss": -25.07191276550293, "global_step": 247610, "epoch": 2983} {"train_loss": -25.47015380859375, "global_step": 247611, "epoch": 2983} {"train_loss": -25.02337074279785, "global_step": 247612, "epoch": 2983} {"train_loss": -25.208534240722656, "global_step": 247613, "epoch": 2983} {"train_loss": -24.903345108032227, "global_step": 247614, "epoch": 2983} {"train_loss": -24.97528839111328, "global_step": 247615, "epoch": 2983} {"train_loss": -25.16074562072754, "global_step": 247616, "epoch": 2983} {"train_loss": -24.953779220581055, "global_step": 247617, "epoch": 2983} {"train_loss": -24.567922592163086, "global_step": 247618, "epoch": 2983} {"train_loss": -25.008499145507812, "global_step": 247619, "epoch": 2983} {"train_loss": -24.504240036010742, "global_step": 247620, "epoch": 2983} {"train_loss": -24.902271270751953, "global_step": 247621, "epoch": 2983} {"train_loss": -24.983049392700195, "global_step": 247622, "epoch": 2983} {"train_loss": -25.1633358001709, "global_step": 247623, "epoch": 2983} {"train_loss": -24.551082611083984, "global_step": 247624, "epoch": 2983} {"train_loss": -24.960622787475586, "global_step": 247625, "epoch": 2983} {"train_loss": -24.617643356323242, "global_step": 247626, "epoch": 2983} {"train_loss": -24.70401382446289, "global_step": 247627, "epoch": 2983} {"train_loss": -24.862245559692383, "global_step": 247628, "epoch": 2983} {"train_loss": -24.66558265686035, "global_step": 247629, "epoch": 2983} {"train_loss": -24.426420211791992, "global_step": 247630, "epoch": 2983} {"train_loss": -24.37102508544922, "global_step": 247631, "epoch": 2983} {"train_loss": -25.010639190673828, "global_step": 247632, "epoch": 2983} {"train_loss": -24.546865463256836, "global_step": 247633, "epoch": 2983} {"train_loss": -24.540630340576172, "global_step": 247634, "epoch": 2983} {"train_loss": -25.04805564880371, "global_step": 247635, "epoch": 2983} {"train_loss": -24.609683990478516, "global_step": 247636, "epoch": 2983} {"train_loss": -25.047338485717773, "global_step": 247637, "epoch": 2983} {"train_loss": -24.971662521362305, "global_step": 247638, "epoch": 2983} {"train_loss": -24.82001495361328, "global_step": 247639, "epoch": 2983} {"train_loss": -25.05826759338379, "global_step": 247640, "epoch": 2983} {"train_loss": -24.69805908203125, "global_step": 247641, "epoch": 2983} {"train_loss": -24.981225967407227, "global_step": 247642, "epoch": 2983} {"train_loss": -25.014951705932617, "global_step": 247643, "epoch": 2983} {"train_loss": -24.673782348632812, "global_step": 247644, "epoch": 2983} {"train_loss": -25.192075729370117, "global_step": 247645, "epoch": 2983} {"train_loss": -24.89674949645996, "global_step": 247646, "epoch": 2983} {"train_loss": -25.052648544311523, "global_step": 247647, "epoch": 2983} {"train_loss": -24.94801902770996, "global_step": 247648, "epoch": 2983} {"train_loss": -24.96331024169922, "global_step": 247649, "epoch": 2983} {"train_loss": -25.10744857788086, "global_step": 247650, "epoch": 2983} {"train_loss": -25.14318084716797, "global_step": 247651, "epoch": 2983} {"train_loss": -25.282453536987305, "global_step": 247652, "epoch": 2983} {"train_loss": -24.983083724975586, "global_step": 247653, "epoch": 2983} {"train_loss": -25.382022857666016, "global_step": 247654, "epoch": 2983} {"train_loss": -25.275388717651367, "global_step": 247655, "epoch": 2983} {"train_loss": -24.872167587280273, "global_step": 247656, "epoch": 2983} {"train_loss": -25.235334396362305, "global_step": 247657, "epoch": 2983} {"train_loss": -24.764907836914062, "global_step": 247658, "epoch": 2983} {"train_loss": -25.339168548583984, "global_step": 247659, "epoch": 2983} {"train_loss": -24.909387588500977, "global_step": 247660, "epoch": 2983} {"train_loss": -25.051929473876953, "global_step": 247661, "epoch": 2983} {"train_loss": -24.928258895874023, "global_step": 247662, "epoch": 2983} {"train_loss": -25.54163932800293, "global_step": 247663, "epoch": 2983} {"train_loss": -25.38752555847168, "global_step": 247664, "epoch": 2983} {"train_loss": -25.062891006469727, "global_step": 247665, "epoch": 2983} {"train_loss": -25.262113571166992, "global_step": 247666, "epoch": 2983} {"train_loss": -25.234079360961914, "global_step": 247667, "epoch": 2983} {"train_loss": -25.330381393432617, "global_step": 247668, "epoch": 2983} {"train_loss": -24.800268173217773, "global_step": 247669, "epoch": 2983} {"train_loss": -25.188322067260742, "global_step": 247670, "epoch": 2983} {"train_loss": -24.987921450511518, "global_step": 247671, "epoch": 2983, "val_loss": 6917536.5} {"train_loss": -24.295286178588867, "global_step": 247672, "epoch": 2984} {"train_loss": -24.36800765991211, "global_step": 247673, "epoch": 2984} {"train_loss": -24.581281661987305, "global_step": 247674, "epoch": 2984} {"train_loss": -24.5761775970459, "global_step": 247675, "epoch": 2984} {"train_loss": -24.557302474975586, "global_step": 247676, "epoch": 2984} {"train_loss": -25.067672729492188, "global_step": 247677, "epoch": 2984} {"train_loss": -24.785215377807617, "global_step": 247678, "epoch": 2984} {"train_loss": -24.241300582885742, "global_step": 247679, "epoch": 2984} {"train_loss": -24.728229522705078, "global_step": 247680, "epoch": 2984} {"train_loss": -24.377744674682617, "global_step": 247681, "epoch": 2984} {"train_loss": -24.88237190246582, "global_step": 247682, "epoch": 2984} {"train_loss": -24.411848068237305, "global_step": 247683, "epoch": 2984} {"train_loss": -24.869504928588867, "global_step": 247684, "epoch": 2984} {"train_loss": -24.574466705322266, "global_step": 247685, "epoch": 2984} {"train_loss": -24.546613693237305, "global_step": 247686, "epoch": 2984} {"train_loss": -24.85184669494629, "global_step": 247687, "epoch": 2984} {"train_loss": -25.16341209411621, "global_step": 247688, "epoch": 2984} {"train_loss": -24.665958404541016, "global_step": 247689, "epoch": 2984} {"train_loss": -24.738012313842773, "global_step": 247690, "epoch": 2984} {"train_loss": -25.336891174316406, "global_step": 247691, "epoch": 2984} {"train_loss": -24.545486450195312, "global_step": 247692, "epoch": 2984} {"train_loss": -24.714651107788086, "global_step": 247693, "epoch": 2984} {"train_loss": -24.993576049804688, "global_step": 247694, "epoch": 2984} {"train_loss": -24.84612274169922, "global_step": 247695, "epoch": 2984} {"train_loss": -25.10440444946289, "global_step": 247696, "epoch": 2984} {"train_loss": -24.80828857421875, "global_step": 247697, "epoch": 2984} {"train_loss": -24.82052230834961, "global_step": 247698, "epoch": 2984} {"train_loss": -25.195585250854492, "global_step": 247699, "epoch": 2984} {"train_loss": -25.086828231811523, "global_step": 247700, "epoch": 2984} {"train_loss": -24.98727798461914, "global_step": 247701, "epoch": 2984} {"train_loss": -25.037906646728516, "global_step": 247702, "epoch": 2984} {"train_loss": -25.14864158630371, "global_step": 247703, "epoch": 2984} {"train_loss": -25.400339126586914, "global_step": 247704, "epoch": 2984} {"train_loss": -25.22678565979004, "global_step": 247705, "epoch": 2984} {"train_loss": -25.17475700378418, "global_step": 247706, "epoch": 2984} {"train_loss": -25.31882095336914, "global_step": 247707, "epoch": 2984} {"train_loss": -24.920480728149414, "global_step": 247708, "epoch": 2984} {"train_loss": -25.317487716674805, "global_step": 247709, "epoch": 2984} {"train_loss": -25.12213706970215, "global_step": 247710, "epoch": 2984} {"train_loss": -25.100677490234375, "global_step": 247711, "epoch": 2984} {"train_loss": -24.79183578491211, "global_step": 247712, "epoch": 2984} {"train_loss": -25.0838680267334, "global_step": 247713, "epoch": 2984} {"train_loss": -25.21320915222168, "global_step": 247714, "epoch": 2984} {"train_loss": -25.14321517944336, "global_step": 247715, "epoch": 2984} {"train_loss": -24.52117919921875, "global_step": 247716, "epoch": 2984} {"train_loss": -24.875829696655273, "global_step": 247717, "epoch": 2984} {"train_loss": -25.00815200805664, "global_step": 247718, "epoch": 2984} {"train_loss": -24.343969345092773, "global_step": 247719, "epoch": 2984} {"train_loss": -23.776126861572266, "global_step": 247720, "epoch": 2984} {"train_loss": -23.73666000366211, "global_step": 247721, "epoch": 2984} {"train_loss": -24.633764266967773, "global_step": 247722, "epoch": 2984} {"train_loss": -24.481109619140625, "global_step": 247723, "epoch": 2984} {"train_loss": -24.022823333740234, "global_step": 247724, "epoch": 2984} {"train_loss": -24.690427780151367, "global_step": 247725, "epoch": 2984} {"train_loss": -24.54811668395996, "global_step": 247726, "epoch": 2984} {"train_loss": -24.85526466369629, "global_step": 247727, "epoch": 2984} {"train_loss": -25.125293731689453, "global_step": 247728, "epoch": 2984} {"train_loss": -24.853178024291992, "global_step": 247729, "epoch": 2984} {"train_loss": -25.053176879882812, "global_step": 247730, "epoch": 2984} {"train_loss": -24.771625518798828, "global_step": 247731, "epoch": 2984} {"train_loss": -24.777185440063477, "global_step": 247732, "epoch": 2984} {"train_loss": -24.813756942749023, "global_step": 247733, "epoch": 2984} {"train_loss": -25.030349731445312, "global_step": 247734, "epoch": 2984} {"train_loss": -24.881929397583008, "global_step": 247735, "epoch": 2984} {"train_loss": -25.061819076538086, "global_step": 247736, "epoch": 2984} {"train_loss": -24.868457794189453, "global_step": 247737, "epoch": 2984} {"train_loss": -25.063976287841797, "global_step": 247738, "epoch": 2984} {"train_loss": -24.849323272705078, "global_step": 247739, "epoch": 2984} {"train_loss": -24.858339309692383, "global_step": 247740, "epoch": 2984} {"train_loss": -25.126962661743164, "global_step": 247741, "epoch": 2984} {"train_loss": -24.808740615844727, "global_step": 247742, "epoch": 2984} {"train_loss": -25.033782958984375, "global_step": 247743, "epoch": 2984} {"train_loss": -25.059553146362305, "global_step": 247744, "epoch": 2984} {"train_loss": -24.865100860595703, "global_step": 247745, "epoch": 2984} {"train_loss": -25.125022888183594, "global_step": 247746, "epoch": 2984} {"train_loss": -24.891647338867188, "global_step": 247747, "epoch": 2984} {"train_loss": -25.154104232788086, "global_step": 247748, "epoch": 2984} {"train_loss": -25.105321884155273, "global_step": 247749, "epoch": 2984} {"train_loss": -24.957799911499023, "global_step": 247750, "epoch": 2984} {"train_loss": -24.93848991394043, "global_step": 247751, "epoch": 2984} {"train_loss": -24.82231903076172, "global_step": 247752, "epoch": 2984} {"train_loss": -24.933469772338867, "global_step": 247753, "epoch": 2984} {"train_loss": -24.838733466274768, "global_step": 247754, "epoch": 2984, "val_loss": 6805534.0} {"train_loss": -23.366878509521484, "global_step": 247755, "epoch": 2985} {"train_loss": -23.934276580810547, "global_step": 247756, "epoch": 2985} {"train_loss": -23.78782081604004, "global_step": 247757, "epoch": 2985} {"train_loss": -24.33443832397461, "global_step": 247758, "epoch": 2985} {"train_loss": -23.9549617767334, "global_step": 247759, "epoch": 2985} {"train_loss": -23.98737144470215, "global_step": 247760, "epoch": 2985} {"train_loss": -24.15155601501465, "global_step": 247761, "epoch": 2985} {"train_loss": -24.020238876342773, "global_step": 247762, "epoch": 2985} {"train_loss": -24.391189575195312, "global_step": 247763, "epoch": 2985} {"train_loss": -24.144699096679688, "global_step": 247764, "epoch": 2985} {"train_loss": -24.401729583740234, "global_step": 247765, "epoch": 2985} {"train_loss": -24.761917114257812, "global_step": 247766, "epoch": 2985} {"train_loss": -24.680625915527344, "global_step": 247767, "epoch": 2985} {"train_loss": -24.787137985229492, "global_step": 247768, "epoch": 2985} {"train_loss": -24.644418716430664, "global_step": 247769, "epoch": 2985} {"train_loss": -24.2038631439209, "global_step": 247770, "epoch": 2985} {"train_loss": -24.55470848083496, "global_step": 247771, "epoch": 2985} {"train_loss": -24.577802658081055, "global_step": 247772, "epoch": 2985} {"train_loss": -24.627817153930664, "global_step": 247773, "epoch": 2985} {"train_loss": -24.946422576904297, "global_step": 247774, "epoch": 2985} {"train_loss": -25.103952407836914, "global_step": 247775, "epoch": 2985} {"train_loss": -24.814794540405273, "global_step": 247776, "epoch": 2985} {"train_loss": -24.525880813598633, "global_step": 247777, "epoch": 2985} {"train_loss": -24.6898136138916, "global_step": 247778, "epoch": 2985} {"train_loss": -24.860525131225586, "global_step": 247779, "epoch": 2985} {"train_loss": -24.856260299682617, "global_step": 247780, "epoch": 2985} {"train_loss": -24.66004753112793, "global_step": 247781, "epoch": 2985} {"train_loss": -25.20391845703125, "global_step": 247782, "epoch": 2985} {"train_loss": -24.789405822753906, "global_step": 247783, "epoch": 2985} {"train_loss": -24.971546173095703, "global_step": 247784, "epoch": 2985} {"train_loss": -24.879697799682617, "global_step": 247785, "epoch": 2985} {"train_loss": -24.740428924560547, "global_step": 247786, "epoch": 2985} {"train_loss": -25.21563148498535, "global_step": 247787, "epoch": 2985} {"train_loss": -24.883056640625, "global_step": 247788, "epoch": 2985} {"train_loss": -25.207544326782227, "global_step": 247789, "epoch": 2985} {"train_loss": -25.14739990234375, "global_step": 247790, "epoch": 2985} {"train_loss": -25.043228149414062, "global_step": 247791, "epoch": 2985} {"train_loss": -25.10744285583496, "global_step": 247792, "epoch": 2985} {"train_loss": -25.074344635009766, "global_step": 247793, "epoch": 2985} {"train_loss": -24.957021713256836, "global_step": 247794, "epoch": 2985} {"train_loss": -25.04515838623047, "global_step": 247795, "epoch": 2985} {"train_loss": -25.002836227416992, "global_step": 247796, "epoch": 2985} {"train_loss": -25.237903594970703, "global_step": 247797, "epoch": 2985} {"train_loss": -25.456478118896484, "global_step": 247798, "epoch": 2985} {"train_loss": -25.13630485534668, "global_step": 247799, "epoch": 2985} {"train_loss": -24.908491134643555, "global_step": 247800, "epoch": 2985} {"train_loss": -25.100309371948242, "global_step": 247801, "epoch": 2985} {"train_loss": -24.7644100189209, "global_step": 247802, "epoch": 2985} {"train_loss": -25.153106689453125, "global_step": 247803, "epoch": 2985} {"train_loss": -24.968399047851562, "global_step": 247804, "epoch": 2985} {"train_loss": -25.33803939819336, "global_step": 247805, "epoch": 2985} {"train_loss": -25.409692764282227, "global_step": 247806, "epoch": 2985} {"train_loss": -24.999597549438477, "global_step": 247807, "epoch": 2985} {"train_loss": -24.884469985961914, "global_step": 247808, "epoch": 2985} {"train_loss": -24.282119750976562, "global_step": 247809, "epoch": 2985} {"train_loss": -24.848508834838867, "global_step": 247810, "epoch": 2985} {"train_loss": -25.22638511657715, "global_step": 247811, "epoch": 2985} {"train_loss": -25.066486358642578, "global_step": 247812, "epoch": 2985} {"train_loss": -24.840686798095703, "global_step": 247813, "epoch": 2985} {"train_loss": -25.0075740814209, "global_step": 247814, "epoch": 2985} {"train_loss": -24.874448776245117, "global_step": 247815, "epoch": 2985} {"train_loss": -24.8970947265625, "global_step": 247816, "epoch": 2985} {"train_loss": -24.77554702758789, "global_step": 247817, "epoch": 2985} {"train_loss": -24.979013442993164, "global_step": 247818, "epoch": 2985} {"train_loss": -25.374929428100586, "global_step": 247819, "epoch": 2985} {"train_loss": -25.019519805908203, "global_step": 247820, "epoch": 2985} {"train_loss": -25.11081314086914, "global_step": 247821, "epoch": 2985} {"train_loss": -24.86551284790039, "global_step": 247822, "epoch": 2985} {"train_loss": -25.07647132873535, "global_step": 247823, "epoch": 2985} {"train_loss": -25.055734634399414, "global_step": 247824, "epoch": 2985} {"train_loss": -25.035186767578125, "global_step": 247825, "epoch": 2985} {"train_loss": -25.242671966552734, "global_step": 247826, "epoch": 2985} {"train_loss": -24.672407150268555, "global_step": 247827, "epoch": 2985} {"train_loss": -25.18893814086914, "global_step": 247828, "epoch": 2985} {"train_loss": -25.172407150268555, "global_step": 247829, "epoch": 2985} {"train_loss": -25.209089279174805, "global_step": 247830, "epoch": 2985} {"train_loss": -25.17092514038086, "global_step": 247831, "epoch": 2985} {"train_loss": -24.791227340698242, "global_step": 247832, "epoch": 2985} {"train_loss": -25.10933494567871, "global_step": 247833, "epoch": 2985} {"train_loss": -25.554981231689453, "global_step": 247834, "epoch": 2985} {"train_loss": -24.87457847595215, "global_step": 247835, "epoch": 2985} {"train_loss": -25.2888240814209, "global_step": 247836, "epoch": 2985} {"train_loss": -24.855275832026837, "global_step": 247837, "epoch": 2985, "val_loss": 6688036.0} {"train_loss": -23.861669540405273, "global_step": 247838, "epoch": 2986} {"train_loss": -24.137081146240234, "global_step": 247839, "epoch": 2986} {"train_loss": -23.958261489868164, "global_step": 247840, "epoch": 2986} {"train_loss": -24.32770347595215, "global_step": 247841, "epoch": 2986} {"train_loss": -24.015213012695312, "global_step": 247842, "epoch": 2986} {"train_loss": -23.54153060913086, "global_step": 247843, "epoch": 2986} {"train_loss": -24.003156661987305, "global_step": 247844, "epoch": 2986} {"train_loss": -24.628755569458008, "global_step": 247845, "epoch": 2986} {"train_loss": -24.166223526000977, "global_step": 247846, "epoch": 2986} {"train_loss": -24.05641746520996, "global_step": 247847, "epoch": 2986} {"train_loss": -24.302326202392578, "global_step": 247848, "epoch": 2986} {"train_loss": -24.192337036132812, "global_step": 247849, "epoch": 2986} {"train_loss": -24.101491928100586, "global_step": 247850, "epoch": 2986} {"train_loss": -24.338537216186523, "global_step": 247851, "epoch": 2986} {"train_loss": -24.463415145874023, "global_step": 247852, "epoch": 2986} {"train_loss": -24.25552749633789, "global_step": 247853, "epoch": 2986} {"train_loss": -24.58023452758789, "global_step": 247854, "epoch": 2986} {"train_loss": -24.89021873474121, "global_step": 247855, "epoch": 2986} {"train_loss": -24.598730087280273, "global_step": 247856, "epoch": 2986} {"train_loss": -24.424551010131836, "global_step": 247857, "epoch": 2986} {"train_loss": -24.388124465942383, "global_step": 247858, "epoch": 2986} {"train_loss": -24.644275665283203, "global_step": 247859, "epoch": 2986} {"train_loss": -24.48085594177246, "global_step": 247860, "epoch": 2986} {"train_loss": -24.703500747680664, "global_step": 247861, "epoch": 2986} {"train_loss": -25.011632919311523, "global_step": 247862, "epoch": 2986} {"train_loss": -24.82114601135254, "global_step": 247863, "epoch": 2986} {"train_loss": -24.759326934814453, "global_step": 247864, "epoch": 2986} {"train_loss": -25.07645034790039, "global_step": 247865, "epoch": 2986} {"train_loss": -24.8212947845459, "global_step": 247866, "epoch": 2986} {"train_loss": -24.916248321533203, "global_step": 247867, "epoch": 2986} {"train_loss": -24.940305709838867, "global_step": 247868, "epoch": 2986} {"train_loss": -24.855932235717773, "global_step": 247869, "epoch": 2986} {"train_loss": -24.86273193359375, "global_step": 247870, "epoch": 2986} {"train_loss": -24.72574234008789, "global_step": 247871, "epoch": 2986} {"train_loss": -25.06964111328125, "global_step": 247872, "epoch": 2986} {"train_loss": -24.912160873413086, "global_step": 247873, "epoch": 2986} {"train_loss": -24.66910171508789, "global_step": 247874, "epoch": 2986} {"train_loss": -24.98313331604004, "global_step": 247875, "epoch": 2986} {"train_loss": -24.93558120727539, "global_step": 247876, "epoch": 2986} {"train_loss": -25.15968132019043, "global_step": 247877, "epoch": 2986} {"train_loss": -25.273996353149414, "global_step": 247878, "epoch": 2986} {"train_loss": -25.087427139282227, "global_step": 247879, "epoch": 2986} {"train_loss": -25.196205139160156, "global_step": 247880, "epoch": 2986} {"train_loss": -25.46584701538086, "global_step": 247881, "epoch": 2986} {"train_loss": -25.331186294555664, "global_step": 247882, "epoch": 2986} {"train_loss": -25.178308486938477, "global_step": 247883, "epoch": 2986} {"train_loss": -25.31587028503418, "global_step": 247884, "epoch": 2986} {"train_loss": -25.405067443847656, "global_step": 247885, "epoch": 2986} {"train_loss": -24.726242065429688, "global_step": 247886, "epoch": 2986} {"train_loss": -25.043399810791016, "global_step": 247887, "epoch": 2986} {"train_loss": -24.940959930419922, "global_step": 247888, "epoch": 2986} {"train_loss": -24.74574851989746, "global_step": 247889, "epoch": 2986} {"train_loss": -25.225210189819336, "global_step": 247890, "epoch": 2986} {"train_loss": -25.013212203979492, "global_step": 247891, "epoch": 2986} {"train_loss": -24.950281143188477, "global_step": 247892, "epoch": 2986} {"train_loss": -25.11528968811035, "global_step": 247893, "epoch": 2986} {"train_loss": -25.157001495361328, "global_step": 247894, "epoch": 2986} {"train_loss": -25.3458309173584, "global_step": 247895, "epoch": 2986} {"train_loss": -25.036367416381836, "global_step": 247896, "epoch": 2986} {"train_loss": -24.955686569213867, "global_step": 247897, "epoch": 2986} {"train_loss": -25.34002685546875, "global_step": 247898, "epoch": 2986} {"train_loss": -24.989700317382812, "global_step": 247899, "epoch": 2986} {"train_loss": -25.263517379760742, "global_step": 247900, "epoch": 2986} {"train_loss": -24.779272079467773, "global_step": 247901, "epoch": 2986} {"train_loss": -24.91261863708496, "global_step": 247902, "epoch": 2986} {"train_loss": -24.631858825683594, "global_step": 247903, "epoch": 2986} {"train_loss": -25.14662742614746, "global_step": 247904, "epoch": 2986} {"train_loss": -25.244131088256836, "global_step": 247905, "epoch": 2986} {"train_loss": -24.823530197143555, "global_step": 247906, "epoch": 2986} {"train_loss": -25.042945861816406, "global_step": 247907, "epoch": 2986} {"train_loss": -24.90156364440918, "global_step": 247908, "epoch": 2986} {"train_loss": -24.825925827026367, "global_step": 247909, "epoch": 2986} {"train_loss": -25.195053100585938, "global_step": 247910, "epoch": 2986} {"train_loss": -24.818395614624023, "global_step": 247911, "epoch": 2986} {"train_loss": -25.166778564453125, "global_step": 247912, "epoch": 2986} {"train_loss": -25.166473388671875, "global_step": 247913, "epoch": 2986} {"train_loss": -24.88682746887207, "global_step": 247914, "epoch": 2986} {"train_loss": -24.94022560119629, "global_step": 247915, "epoch": 2986} {"train_loss": -24.9882869720459, "global_step": 247916, "epoch": 2986} {"train_loss": -25.18670654296875, "global_step": 247917, "epoch": 2986} {"train_loss": -25.046035766601562, "global_step": 247918, "epoch": 2986} {"train_loss": -24.489906311035156, "global_step": 247919, "epoch": 2986} {"train_loss": -24.81091451070395, "global_step": 247920, "epoch": 2986, "val_loss": 6854666.0} {"train_loss": -24.73331069946289, "global_step": 247921, "epoch": 2987} {"train_loss": -24.81080436706543, "global_step": 247922, "epoch": 2987} {"train_loss": -24.815017700195312, "global_step": 247923, "epoch": 2987} {"train_loss": -24.632633209228516, "global_step": 247924, "epoch": 2987} {"train_loss": -24.583446502685547, "global_step": 247925, "epoch": 2987} {"train_loss": -24.96537208557129, "global_step": 247926, "epoch": 2987} {"train_loss": -24.917381286621094, "global_step": 247927, "epoch": 2987} {"train_loss": -24.302309036254883, "global_step": 247928, "epoch": 2987} {"train_loss": -24.46259117126465, "global_step": 247929, "epoch": 2987} {"train_loss": -24.825408935546875, "global_step": 247930, "epoch": 2987} {"train_loss": -24.703710556030273, "global_step": 247931, "epoch": 2987} {"train_loss": -25.190603256225586, "global_step": 247932, "epoch": 2987} {"train_loss": -24.78329086303711, "global_step": 247933, "epoch": 2987} {"train_loss": -24.945743560791016, "global_step": 247934, "epoch": 2987} {"train_loss": -25.19388198852539, "global_step": 247935, "epoch": 2987} {"train_loss": -24.898374557495117, "global_step": 247936, "epoch": 2987} {"train_loss": -24.792407989501953, "global_step": 247937, "epoch": 2987} {"train_loss": -24.512939453125, "global_step": 247938, "epoch": 2987} {"train_loss": -25.32280158996582, "global_step": 247939, "epoch": 2987} {"train_loss": -24.94121742248535, "global_step": 247940, "epoch": 2987} {"train_loss": -25.057086944580078, "global_step": 247941, "epoch": 2987} {"train_loss": -24.931594848632812, "global_step": 247942, "epoch": 2987} {"train_loss": -24.749500274658203, "global_step": 247943, "epoch": 2987} {"train_loss": -24.906787872314453, "global_step": 247944, "epoch": 2987} {"train_loss": -24.66107177734375, "global_step": 247945, "epoch": 2987} {"train_loss": -25.192861557006836, "global_step": 247946, "epoch": 2987} {"train_loss": -24.94296646118164, "global_step": 247947, "epoch": 2987} {"train_loss": -25.029325485229492, "global_step": 247948, "epoch": 2987} {"train_loss": -24.923696517944336, "global_step": 247949, "epoch": 2987} {"train_loss": -25.110050201416016, "global_step": 247950, "epoch": 2987} {"train_loss": -25.239606857299805, "global_step": 247951, "epoch": 2987} {"train_loss": -25.060640335083008, "global_step": 247952, "epoch": 2987} {"train_loss": -25.13326072692871, "global_step": 247953, "epoch": 2987} {"train_loss": -25.00004005432129, "global_step": 247954, "epoch": 2987} {"train_loss": -24.948781967163086, "global_step": 247955, "epoch": 2987} {"train_loss": -25.315176010131836, "global_step": 247956, "epoch": 2987} {"train_loss": -25.27332878112793, "global_step": 247957, "epoch": 2987} {"train_loss": -25.16847038269043, "global_step": 247958, "epoch": 2987} {"train_loss": -25.056053161621094, "global_step": 247959, "epoch": 2987} {"train_loss": -25.023046493530273, "global_step": 247960, "epoch": 2987} {"train_loss": -24.853803634643555, "global_step": 247961, "epoch": 2987} {"train_loss": -25.161211013793945, "global_step": 247962, "epoch": 2987} {"train_loss": -24.891653060913086, "global_step": 247963, "epoch": 2987} {"train_loss": -24.741878509521484, "global_step": 247964, "epoch": 2987} {"train_loss": -24.73273468017578, "global_step": 247965, "epoch": 2987} {"train_loss": -24.995832443237305, "global_step": 247966, "epoch": 2987} {"train_loss": -25.015583038330078, "global_step": 247967, "epoch": 2987} {"train_loss": -25.137165069580078, "global_step": 247968, "epoch": 2987} {"train_loss": -24.84197425842285, "global_step": 247969, "epoch": 2987} {"train_loss": -24.868932723999023, "global_step": 247970, "epoch": 2987} {"train_loss": -25.246967315673828, "global_step": 247971, "epoch": 2987} {"train_loss": -24.975635528564453, "global_step": 247972, "epoch": 2987} {"train_loss": -24.561492919921875, "global_step": 247973, "epoch": 2987} {"train_loss": -24.434635162353516, "global_step": 247974, "epoch": 2987} {"train_loss": -24.990985870361328, "global_step": 247975, "epoch": 2987} {"train_loss": -25.13142204284668, "global_step": 247976, "epoch": 2987} {"train_loss": -24.77840232849121, "global_step": 247977, "epoch": 2987} {"train_loss": -24.87946128845215, "global_step": 247978, "epoch": 2987} {"train_loss": -24.946327209472656, "global_step": 247979, "epoch": 2987} {"train_loss": -24.932327270507812, "global_step": 247980, "epoch": 2987} {"train_loss": -24.89630699157715, "global_step": 247981, "epoch": 2987} {"train_loss": -24.855167388916016, "global_step": 247982, "epoch": 2987} {"train_loss": -25.037513732910156, "global_step": 247983, "epoch": 2987} {"train_loss": -25.404508590698242, "global_step": 247984, "epoch": 2987} {"train_loss": -24.94581413269043, "global_step": 247985, "epoch": 2987} {"train_loss": -24.866405487060547, "global_step": 247986, "epoch": 2987} {"train_loss": -25.536590576171875, "global_step": 247987, "epoch": 2987} {"train_loss": -25.111066818237305, "global_step": 247988, "epoch": 2987} {"train_loss": -25.006122589111328, "global_step": 247989, "epoch": 2987} {"train_loss": -25.141035079956055, "global_step": 247990, "epoch": 2987} {"train_loss": -25.40375518798828, "global_step": 247991, "epoch": 2987} {"train_loss": -24.90374183654785, "global_step": 247992, "epoch": 2987} {"train_loss": -24.916746139526367, "global_step": 247993, "epoch": 2987} {"train_loss": -24.906208038330078, "global_step": 247994, "epoch": 2987} {"train_loss": -25.733789443969727, "global_step": 247995, "epoch": 2987} {"train_loss": -24.79999351501465, "global_step": 247996, "epoch": 2987} {"train_loss": -24.789522171020508, "global_step": 247997, "epoch": 2987} {"train_loss": -25.47075843811035, "global_step": 247998, "epoch": 2987} {"train_loss": -25.004779815673828, "global_step": 247999, "epoch": 2987} {"train_loss": -24.70448875427246, "global_step": 248000, "epoch": 2987} {"train_loss": -25.256298065185547, "global_step": 248001, "epoch": 2987} {"train_loss": -24.980802536010742, "global_step": 248002, "epoch": 2987} {"train_loss": -24.95266199686441, "global_step": 248003, "epoch": 2987, "val_loss": 6771448.0} {"train_loss": -24.84840965270996, "global_step": 248004, "epoch": 2988} {"train_loss": -23.819711685180664, "global_step": 248005, "epoch": 2988} {"train_loss": -24.683727264404297, "global_step": 248006, "epoch": 2988} {"train_loss": -24.55667495727539, "global_step": 248007, "epoch": 2988} {"train_loss": -24.70784568786621, "global_step": 248008, "epoch": 2988} {"train_loss": -24.212507247924805, "global_step": 248009, "epoch": 2988} {"train_loss": -24.071340560913086, "global_step": 248010, "epoch": 2988} {"train_loss": -24.286645889282227, "global_step": 248011, "epoch": 2988} {"train_loss": -24.470462799072266, "global_step": 248012, "epoch": 2988} {"train_loss": -24.32956886291504, "global_step": 248013, "epoch": 2988} {"train_loss": -24.42191505432129, "global_step": 248014, "epoch": 2988} {"train_loss": -24.908252716064453, "global_step": 248015, "epoch": 2988} {"train_loss": -24.36856460571289, "global_step": 248016, "epoch": 2988} {"train_loss": -24.877222061157227, "global_step": 248017, "epoch": 2988} {"train_loss": -25.181169509887695, "global_step": 248018, "epoch": 2988} {"train_loss": -24.19451904296875, "global_step": 248019, "epoch": 2988} {"train_loss": -24.966876983642578, "global_step": 248020, "epoch": 2988} {"train_loss": -24.96089744567871, "global_step": 248021, "epoch": 2988} {"train_loss": -24.888389587402344, "global_step": 248022, "epoch": 2988} {"train_loss": -24.82985496520996, "global_step": 248023, "epoch": 2988} {"train_loss": -25.120100021362305, "global_step": 248024, "epoch": 2988} {"train_loss": -24.787033081054688, "global_step": 248025, "epoch": 2988} {"train_loss": -24.8690242767334, "global_step": 248026, "epoch": 2988} {"train_loss": -24.89776039123535, "global_step": 248027, "epoch": 2988} {"train_loss": -24.983179092407227, "global_step": 248028, "epoch": 2988} {"train_loss": -24.996318817138672, "global_step": 248029, "epoch": 2988} {"train_loss": -24.89491081237793, "global_step": 248030, "epoch": 2988} {"train_loss": -25.24753761291504, "global_step": 248031, "epoch": 2988} {"train_loss": -25.106985092163086, "global_step": 248032, "epoch": 2988} {"train_loss": -24.74470329284668, "global_step": 248033, "epoch": 2988} {"train_loss": -25.15852165222168, "global_step": 248034, "epoch": 2988} {"train_loss": -25.005102157592773, "global_step": 248035, "epoch": 2988} {"train_loss": -25.154109954833984, "global_step": 248036, "epoch": 2988} {"train_loss": -25.03386116027832, "global_step": 248037, "epoch": 2988} {"train_loss": -25.00434112548828, "global_step": 248038, "epoch": 2988} {"train_loss": -24.919509887695312, "global_step": 248039, "epoch": 2988} {"train_loss": -25.388010025024414, "global_step": 248040, "epoch": 2988} {"train_loss": -25.141843795776367, "global_step": 248041, "epoch": 2988} {"train_loss": -24.963659286499023, "global_step": 248042, "epoch": 2988} {"train_loss": -25.188438415527344, "global_step": 248043, "epoch": 2988} {"train_loss": -24.96845817565918, "global_step": 248044, "epoch": 2988} {"train_loss": -25.195592880249023, "global_step": 248045, "epoch": 2988} {"train_loss": -25.576343536376953, "global_step": 248046, "epoch": 2988} {"train_loss": -24.99763298034668, "global_step": 248047, "epoch": 2988} {"train_loss": -24.98359489440918, "global_step": 248048, "epoch": 2988} {"train_loss": -24.96550750732422, "global_step": 248049, "epoch": 2988} {"train_loss": -25.18807029724121, "global_step": 248050, "epoch": 2988} {"train_loss": -25.150161743164062, "global_step": 248051, "epoch": 2988} {"train_loss": -25.300514221191406, "global_step": 248052, "epoch": 2988} {"train_loss": -24.9999942779541, "global_step": 248053, "epoch": 2988} {"train_loss": -24.836111068725586, "global_step": 248054, "epoch": 2988} {"train_loss": -25.12417221069336, "global_step": 248055, "epoch": 2988} {"train_loss": -24.90711784362793, "global_step": 248056, "epoch": 2988} {"train_loss": -24.404712677001953, "global_step": 248057, "epoch": 2988} {"train_loss": -24.89168357849121, "global_step": 248058, "epoch": 2988} {"train_loss": -24.8719425201416, "global_step": 248059, "epoch": 2988} {"train_loss": -25.112045288085938, "global_step": 248060, "epoch": 2988} {"train_loss": -24.97146224975586, "global_step": 248061, "epoch": 2988} {"train_loss": -25.10577392578125, "global_step": 248062, "epoch": 2988} {"train_loss": -24.67164421081543, "global_step": 248063, "epoch": 2988} {"train_loss": -25.035079956054688, "global_step": 248064, "epoch": 2988} {"train_loss": -24.94302749633789, "global_step": 248065, "epoch": 2988} {"train_loss": -24.896217346191406, "global_step": 248066, "epoch": 2988} {"train_loss": -24.995283126831055, "global_step": 248067, "epoch": 2988} {"train_loss": -25.196136474609375, "global_step": 248068, "epoch": 2988} {"train_loss": -25.047189712524414, "global_step": 248069, "epoch": 2988} {"train_loss": -24.913589477539062, "global_step": 248070, "epoch": 2988} {"train_loss": -24.998321533203125, "global_step": 248071, "epoch": 2988} {"train_loss": -25.066381454467773, "global_step": 248072, "epoch": 2988} {"train_loss": -24.64563751220703, "global_step": 248073, "epoch": 2988} {"train_loss": -25.460662841796875, "global_step": 248074, "epoch": 2988} {"train_loss": -25.461984634399414, "global_step": 248075, "epoch": 2988} {"train_loss": -24.932727813720703, "global_step": 248076, "epoch": 2988} {"train_loss": -25.24139976501465, "global_step": 248077, "epoch": 2988} {"train_loss": -25.05018424987793, "global_step": 248078, "epoch": 2988} {"train_loss": -25.041654586791992, "global_step": 248079, "epoch": 2988} {"train_loss": -24.843250274658203, "global_step": 248080, "epoch": 2988} {"train_loss": -24.704326629638672, "global_step": 248081, "epoch": 2988} {"train_loss": -24.92640495300293, "global_step": 248082, "epoch": 2988} {"train_loss": -24.821605682373047, "global_step": 248083, "epoch": 2988} {"train_loss": -25.043649673461914, "global_step": 248084, "epoch": 2988} {"train_loss": -24.750608444213867, "global_step": 248085, "epoch": 2988} {"train_loss": -24.910198786172522, "global_step": 248086, "epoch": 2988, "val_loss": 6828678.5} {"train_loss": -23.93082046508789, "global_step": 248087, "epoch": 2989} {"train_loss": -24.18606948852539, "global_step": 248088, "epoch": 2989} {"train_loss": -24.100004196166992, "global_step": 248089, "epoch": 2989} {"train_loss": -24.357481002807617, "global_step": 248090, "epoch": 2989} {"train_loss": -24.813451766967773, "global_step": 248091, "epoch": 2989} {"train_loss": -23.91748046875, "global_step": 248092, "epoch": 2989} {"train_loss": -24.5562801361084, "global_step": 248093, "epoch": 2989} {"train_loss": -24.711374282836914, "global_step": 248094, "epoch": 2989} {"train_loss": -24.861379623413086, "global_step": 248095, "epoch": 2989} {"train_loss": -24.54975128173828, "global_step": 248096, "epoch": 2989} {"train_loss": -24.860214233398438, "global_step": 248097, "epoch": 2989} {"train_loss": -24.713991165161133, "global_step": 248098, "epoch": 2989} {"train_loss": -24.74806785583496, "global_step": 248099, "epoch": 2989} {"train_loss": -24.611051559448242, "global_step": 248100, "epoch": 2989} {"train_loss": -24.852706909179688, "global_step": 248101, "epoch": 2989} {"train_loss": -24.661409378051758, "global_step": 248102, "epoch": 2989} {"train_loss": -24.80861473083496, "global_step": 248103, "epoch": 2989} {"train_loss": -24.911657333374023, "global_step": 248104, "epoch": 2989} {"train_loss": -24.91060447692871, "global_step": 248105, "epoch": 2989} {"train_loss": -24.59722900390625, "global_step": 248106, "epoch": 2989} {"train_loss": -25.099197387695312, "global_step": 248107, "epoch": 2989} {"train_loss": -24.90083885192871, "global_step": 248108, "epoch": 2989} {"train_loss": -24.97101402282715, "global_step": 248109, "epoch": 2989} {"train_loss": -25.23348045349121, "global_step": 248110, "epoch": 2989} {"train_loss": -24.74283790588379, "global_step": 248111, "epoch": 2989} {"train_loss": -24.893945693969727, "global_step": 248112, "epoch": 2989} {"train_loss": -25.079374313354492, "global_step": 248113, "epoch": 2989} {"train_loss": -24.743640899658203, "global_step": 248114, "epoch": 2989} {"train_loss": -25.099950790405273, "global_step": 248115, "epoch": 2989} {"train_loss": -25.16206932067871, "global_step": 248116, "epoch": 2989} {"train_loss": -25.312829971313477, "global_step": 248117, "epoch": 2989} {"train_loss": -25.231992721557617, "global_step": 248118, "epoch": 2989} {"train_loss": -25.0826416015625, "global_step": 248119, "epoch": 2989} {"train_loss": -25.15323257446289, "global_step": 248120, "epoch": 2989} {"train_loss": -25.058040618896484, "global_step": 248121, "epoch": 2989} {"train_loss": -24.67630958557129, "global_step": 248122, "epoch": 2989} {"train_loss": -25.094419479370117, "global_step": 248123, "epoch": 2989} {"train_loss": -24.95366668701172, "global_step": 248124, "epoch": 2989} {"train_loss": -24.99900245666504, "global_step": 248125, "epoch": 2989} {"train_loss": -25.173622131347656, "global_step": 248126, "epoch": 2989} {"train_loss": -25.173431396484375, "global_step": 248127, "epoch": 2989} {"train_loss": -25.16555404663086, "global_step": 248128, "epoch": 2989} {"train_loss": -25.084890365600586, "global_step": 248129, "epoch": 2989} {"train_loss": -25.124448776245117, "global_step": 248130, "epoch": 2989} {"train_loss": -25.04401206970215, "global_step": 248131, "epoch": 2989} {"train_loss": -24.934650421142578, "global_step": 248132, "epoch": 2989} {"train_loss": -25.0714168548584, "global_step": 248133, "epoch": 2989} {"train_loss": -24.78976821899414, "global_step": 248134, "epoch": 2989} {"train_loss": -25.419681549072266, "global_step": 248135, "epoch": 2989} {"train_loss": -24.750694274902344, "global_step": 248136, "epoch": 2989} {"train_loss": -25.133520126342773, "global_step": 248137, "epoch": 2989} {"train_loss": -25.034521102905273, "global_step": 248138, "epoch": 2989} {"train_loss": -25.074600219726562, "global_step": 248139, "epoch": 2989} {"train_loss": -24.810688018798828, "global_step": 248140, "epoch": 2989} {"train_loss": -25.18840789794922, "global_step": 248141, "epoch": 2989} {"train_loss": -24.926679611206055, "global_step": 248142, "epoch": 2989} {"train_loss": -25.349613189697266, "global_step": 248143, "epoch": 2989} {"train_loss": -24.9033260345459, "global_step": 248144, "epoch": 2989} {"train_loss": -25.161413192749023, "global_step": 248145, "epoch": 2989} {"train_loss": -25.29088020324707, "global_step": 248146, "epoch": 2989} {"train_loss": -25.031391143798828, "global_step": 248147, "epoch": 2989} {"train_loss": -25.175519943237305, "global_step": 248148, "epoch": 2989} {"train_loss": -24.803651809692383, "global_step": 248149, "epoch": 2989} {"train_loss": -25.0020809173584, "global_step": 248150, "epoch": 2989} {"train_loss": -25.212711334228516, "global_step": 248151, "epoch": 2989} {"train_loss": -25.153921127319336, "global_step": 248152, "epoch": 2989} {"train_loss": -24.837162017822266, "global_step": 248153, "epoch": 2989} {"train_loss": -25.32744789123535, "global_step": 248154, "epoch": 2989} {"train_loss": -25.379364013671875, "global_step": 248155, "epoch": 2989} {"train_loss": -24.65933609008789, "global_step": 248156, "epoch": 2989} {"train_loss": -24.614145278930664, "global_step": 248157, "epoch": 2989} {"train_loss": -25.052396774291992, "global_step": 248158, "epoch": 2989} {"train_loss": -25.178438186645508, "global_step": 248159, "epoch": 2989} {"train_loss": -24.776769638061523, "global_step": 248160, "epoch": 2989} {"train_loss": -24.703908920288086, "global_step": 248161, "epoch": 2989} {"train_loss": -24.643747329711914, "global_step": 248162, "epoch": 2989} {"train_loss": -24.813940048217773, "global_step": 248163, "epoch": 2989} {"train_loss": -25.014427185058594, "global_step": 248164, "epoch": 2989} {"train_loss": -24.8365535736084, "global_step": 248165, "epoch": 2989} {"train_loss": -25.01306915283203, "global_step": 248166, "epoch": 2989} {"train_loss": -24.436988830566406, "global_step": 248167, "epoch": 2989} {"train_loss": -25.2437801361084, "global_step": 248168, "epoch": 2989} {"train_loss": -24.901048867099256, "global_step": 248169, "epoch": 2989, "val_loss": 6730610.0} {"train_loss": -24.793231964111328, "global_step": 248170, "epoch": 2990} {"train_loss": -24.514375686645508, "global_step": 248171, "epoch": 2990} {"train_loss": -24.639265060424805, "global_step": 248172, "epoch": 2990} {"train_loss": -24.424652099609375, "global_step": 248173, "epoch": 2990} {"train_loss": -24.595266342163086, "global_step": 248174, "epoch": 2990} {"train_loss": -24.47440528869629, "global_step": 248175, "epoch": 2990} {"train_loss": -24.581966400146484, "global_step": 248176, "epoch": 2990} {"train_loss": -24.6213436126709, "global_step": 248177, "epoch": 2990} {"train_loss": -24.68344497680664, "global_step": 248178, "epoch": 2990} {"train_loss": -24.65091896057129, "global_step": 248179, "epoch": 2990} {"train_loss": -25.026905059814453, "global_step": 248180, "epoch": 2990} {"train_loss": -24.9566707611084, "global_step": 248181, "epoch": 2990} {"train_loss": -24.548166275024414, "global_step": 248182, "epoch": 2990} {"train_loss": -24.643051147460938, "global_step": 248183, "epoch": 2990} {"train_loss": -24.721027374267578, "global_step": 248184, "epoch": 2990} {"train_loss": -25.000930786132812, "global_step": 248185, "epoch": 2990} {"train_loss": -24.715662002563477, "global_step": 248186, "epoch": 2990} {"train_loss": -24.5776309967041, "global_step": 248187, "epoch": 2990} {"train_loss": -25.390487670898438, "global_step": 248188, "epoch": 2990} {"train_loss": -24.9322566986084, "global_step": 248189, "epoch": 2990} {"train_loss": -24.552305221557617, "global_step": 248190, "epoch": 2990} {"train_loss": -24.985628128051758, "global_step": 248191, "epoch": 2990} {"train_loss": -24.61445426940918, "global_step": 248192, "epoch": 2990} {"train_loss": -24.789783477783203, "global_step": 248193, "epoch": 2990} {"train_loss": -24.838871002197266, "global_step": 248194, "epoch": 2990} {"train_loss": -24.87064552307129, "global_step": 248195, "epoch": 2990} {"train_loss": -25.10890769958496, "global_step": 248196, "epoch": 2990} {"train_loss": -25.174962997436523, "global_step": 248197, "epoch": 2990} {"train_loss": -24.85031509399414, "global_step": 248198, "epoch": 2990} {"train_loss": -24.970293045043945, "global_step": 248199, "epoch": 2990} {"train_loss": -25.16686248779297, "global_step": 248200, "epoch": 2990} {"train_loss": -25.047687530517578, "global_step": 248201, "epoch": 2990} {"train_loss": -24.753746032714844, "global_step": 248202, "epoch": 2990} {"train_loss": -24.922788619995117, "global_step": 248203, "epoch": 2990} {"train_loss": -24.89090347290039, "global_step": 248204, "epoch": 2990} {"train_loss": -25.08161735534668, "global_step": 248205, "epoch": 2990} {"train_loss": -24.89735221862793, "global_step": 248206, "epoch": 2990} {"train_loss": -24.87789535522461, "global_step": 248207, "epoch": 2990} {"train_loss": -24.985498428344727, "global_step": 248208, "epoch": 2990} {"train_loss": -25.281034469604492, "global_step": 248209, "epoch": 2990} {"train_loss": -24.74519157409668, "global_step": 248210, "epoch": 2990} {"train_loss": -24.67368507385254, "global_step": 248211, "epoch": 2990} {"train_loss": -24.983951568603516, "global_step": 248212, "epoch": 2990} {"train_loss": -25.026975631713867, "global_step": 248213, "epoch": 2990} {"train_loss": -25.26895523071289, "global_step": 248214, "epoch": 2990} {"train_loss": -25.400196075439453, "global_step": 248215, "epoch": 2990} {"train_loss": -25.01154899597168, "global_step": 248216, "epoch": 2990} {"train_loss": -24.928796768188477, "global_step": 248217, "epoch": 2990} {"train_loss": -24.939559936523438, "global_step": 248218, "epoch": 2990} {"train_loss": -25.1397762298584, "global_step": 248219, "epoch": 2990} {"train_loss": -24.883047103881836, "global_step": 248220, "epoch": 2990} {"train_loss": -25.210031509399414, "global_step": 248221, "epoch": 2990} {"train_loss": -24.946619033813477, "global_step": 248222, "epoch": 2990} {"train_loss": -25.194381713867188, "global_step": 248223, "epoch": 2990} {"train_loss": -25.279178619384766, "global_step": 248224, "epoch": 2990} {"train_loss": -25.23252296447754, "global_step": 248225, "epoch": 2990} {"train_loss": -25.076705932617188, "global_step": 248226, "epoch": 2990} {"train_loss": -24.79911231994629, "global_step": 248227, "epoch": 2990} {"train_loss": -25.295515060424805, "global_step": 248228, "epoch": 2990} {"train_loss": -24.957382202148438, "global_step": 248229, "epoch": 2990} {"train_loss": -24.92214012145996, "global_step": 248230, "epoch": 2990} {"train_loss": -24.93025779724121, "global_step": 248231, "epoch": 2990} {"train_loss": -25.017114639282227, "global_step": 248232, "epoch": 2990} {"train_loss": -25.000802993774414, "global_step": 248233, "epoch": 2990} {"train_loss": -24.952247619628906, "global_step": 248234, "epoch": 2990} {"train_loss": -25.34041404724121, "global_step": 248235, "epoch": 2990} {"train_loss": -25.12503433227539, "global_step": 248236, "epoch": 2990} {"train_loss": -24.3652400970459, "global_step": 248237, "epoch": 2990} {"train_loss": -23.700803756713867, "global_step": 248238, "epoch": 2990} {"train_loss": -24.47989845275879, "global_step": 248239, "epoch": 2990} {"train_loss": -24.972488403320312, "global_step": 248240, "epoch": 2990} {"train_loss": -25.04975700378418, "global_step": 248241, "epoch": 2990} {"train_loss": -24.53346061706543, "global_step": 248242, "epoch": 2990} {"train_loss": -24.744993209838867, "global_step": 248243, "epoch": 2990} {"train_loss": -25.437026977539062, "global_step": 248244, "epoch": 2990} {"train_loss": -24.781164169311523, "global_step": 248245, "epoch": 2990} {"train_loss": -24.92299461364746, "global_step": 248246, "epoch": 2990} {"train_loss": -24.73046112060547, "global_step": 248247, "epoch": 2990} {"train_loss": -25.209487915039062, "global_step": 248248, "epoch": 2990} {"train_loss": -25.026084899902344, "global_step": 248249, "epoch": 2990} {"train_loss": -24.781505584716797, "global_step": 248250, "epoch": 2990} {"train_loss": -24.888431549072266, "global_step": 248251, "epoch": 2990} {"train_loss": -24.899598615715302, "global_step": 248252, "epoch": 2990, "val_loss": 6748066.0} {"train_loss": -24.443012237548828, "global_step": 248253, "epoch": 2991} {"train_loss": -24.857240676879883, "global_step": 248254, "epoch": 2991} {"train_loss": -24.20823860168457, "global_step": 248255, "epoch": 2991} {"train_loss": -24.384016036987305, "global_step": 248256, "epoch": 2991} {"train_loss": -24.999807357788086, "global_step": 248257, "epoch": 2991} {"train_loss": -24.682392120361328, "global_step": 248258, "epoch": 2991} {"train_loss": -24.743406295776367, "global_step": 248259, "epoch": 2991} {"train_loss": -24.567808151245117, "global_step": 248260, "epoch": 2991} {"train_loss": -24.739728927612305, "global_step": 248261, "epoch": 2991} {"train_loss": -25.389354705810547, "global_step": 248262, "epoch": 2991} {"train_loss": -24.738882064819336, "global_step": 248263, "epoch": 2991} {"train_loss": -24.78369140625, "global_step": 248264, "epoch": 2991} {"train_loss": -24.883010864257812, "global_step": 248265, "epoch": 2991} {"train_loss": -24.989826202392578, "global_step": 248266, "epoch": 2991} {"train_loss": -25.07252311706543, "global_step": 248267, "epoch": 2991} {"train_loss": -24.868667602539062, "global_step": 248268, "epoch": 2991} {"train_loss": -24.856054306030273, "global_step": 248269, "epoch": 2991} {"train_loss": -24.940885543823242, "global_step": 248270, "epoch": 2991} {"train_loss": -25.189741134643555, "global_step": 248271, "epoch": 2991} {"train_loss": -24.81473159790039, "global_step": 248272, "epoch": 2991} {"train_loss": -25.15378761291504, "global_step": 248273, "epoch": 2991} {"train_loss": -25.00758171081543, "global_step": 248274, "epoch": 2991} {"train_loss": -24.941125869750977, "global_step": 248275, "epoch": 2991} {"train_loss": -24.938688278198242, "global_step": 248276, "epoch": 2991} {"train_loss": -25.001041412353516, "global_step": 248277, "epoch": 2991} {"train_loss": -25.133588790893555, "global_step": 248278, "epoch": 2991} {"train_loss": -25.37929344177246, "global_step": 248279, "epoch": 2991} {"train_loss": -24.52670669555664, "global_step": 248280, "epoch": 2991} {"train_loss": -25.017061233520508, "global_step": 248281, "epoch": 2991} {"train_loss": -25.26581382751465, "global_step": 248282, "epoch": 2991} {"train_loss": -24.98067855834961, "global_step": 248283, "epoch": 2991} {"train_loss": -24.709300994873047, "global_step": 248284, "epoch": 2991} {"train_loss": -24.844676971435547, "global_step": 248285, "epoch": 2991} {"train_loss": -24.73091697692871, "global_step": 248286, "epoch": 2991} {"train_loss": -25.05086326599121, "global_step": 248287, "epoch": 2991} {"train_loss": -24.618932723999023, "global_step": 248288, "epoch": 2991} {"train_loss": -25.091083526611328, "global_step": 248289, "epoch": 2991} {"train_loss": -25.174833297729492, "global_step": 248290, "epoch": 2991} {"train_loss": -24.988752365112305, "global_step": 248291, "epoch": 2991} {"train_loss": -25.01721954345703, "global_step": 248292, "epoch": 2991} {"train_loss": -25.119115829467773, "global_step": 248293, "epoch": 2991} {"train_loss": -25.385990142822266, "global_step": 248294, "epoch": 2991} {"train_loss": -24.84929847717285, "global_step": 248295, "epoch": 2991} {"train_loss": -25.160776138305664, "global_step": 248296, "epoch": 2991} {"train_loss": -25.156415939331055, "global_step": 248297, "epoch": 2991} {"train_loss": -25.2333984375, "global_step": 248298, "epoch": 2991} {"train_loss": -25.015470504760742, "global_step": 248299, "epoch": 2991} {"train_loss": -25.436904907226562, "global_step": 248300, "epoch": 2991} {"train_loss": -24.94675064086914, "global_step": 248301, "epoch": 2991} {"train_loss": -24.957063674926758, "global_step": 248302, "epoch": 2991} {"train_loss": -25.25836753845215, "global_step": 248303, "epoch": 2991} {"train_loss": -25.465240478515625, "global_step": 248304, "epoch": 2991} {"train_loss": -25.16180419921875, "global_step": 248305, "epoch": 2991} {"train_loss": -25.143741607666016, "global_step": 248306, "epoch": 2991} {"train_loss": -25.205663681030273, "global_step": 248307, "epoch": 2991} {"train_loss": -25.231889724731445, "global_step": 248308, "epoch": 2991} {"train_loss": -25.20522117614746, "global_step": 248309, "epoch": 2991} {"train_loss": -25.16815185546875, "global_step": 248310, "epoch": 2991} {"train_loss": -25.13418960571289, "global_step": 248311, "epoch": 2991} {"train_loss": -24.98750114440918, "global_step": 248312, "epoch": 2991} {"train_loss": -25.087995529174805, "global_step": 248313, "epoch": 2991} {"train_loss": -24.957712173461914, "global_step": 248314, "epoch": 2991} {"train_loss": -24.664260864257812, "global_step": 248315, "epoch": 2991} {"train_loss": -25.24786376953125, "global_step": 248316, "epoch": 2991} {"train_loss": -24.89303207397461, "global_step": 248317, "epoch": 2991} {"train_loss": -25.022798538208008, "global_step": 248318, "epoch": 2991} {"train_loss": -24.58106803894043, "global_step": 248319, "epoch": 2991} {"train_loss": -25.168210983276367, "global_step": 248320, "epoch": 2991} {"train_loss": -25.20969581604004, "global_step": 248321, "epoch": 2991} {"train_loss": -24.46390724182129, "global_step": 248322, "epoch": 2991} {"train_loss": -24.842004776000977, "global_step": 248323, "epoch": 2991} {"train_loss": -24.969715118408203, "global_step": 248324, "epoch": 2991} {"train_loss": -25.1326961517334, "global_step": 248325, "epoch": 2991} {"train_loss": -25.105728149414062, "global_step": 248326, "epoch": 2991} {"train_loss": -25.389175415039062, "global_step": 248327, "epoch": 2991} {"train_loss": -25.242990493774414, "global_step": 248328, "epoch": 2991} {"train_loss": -25.136756896972656, "global_step": 248329, "epoch": 2991} {"train_loss": -25.423664093017578, "global_step": 248330, "epoch": 2991} {"train_loss": -24.94367790222168, "global_step": 248331, "epoch": 2991} {"train_loss": -24.88285255432129, "global_step": 248332, "epoch": 2991} {"train_loss": -24.965442657470703, "global_step": 248333, "epoch": 2991} {"train_loss": -24.576751708984375, "global_step": 248334, "epoch": 2991} {"train_loss": -24.973187940666474, "global_step": 248335, "epoch": 2991, "val_loss": 6806841.0} {"train_loss": -24.076169967651367, "global_step": 248336, "epoch": 2992} {"train_loss": -23.77276039123535, "global_step": 248337, "epoch": 2992} {"train_loss": -24.1990966796875, "global_step": 248338, "epoch": 2992} {"train_loss": -24.02042579650879, "global_step": 248339, "epoch": 2992} {"train_loss": -24.34358787536621, "global_step": 248340, "epoch": 2992} {"train_loss": -23.938398361206055, "global_step": 248341, "epoch": 2992} {"train_loss": -24.2561092376709, "global_step": 248342, "epoch": 2992} {"train_loss": -24.50621223449707, "global_step": 248343, "epoch": 2992} {"train_loss": -24.037418365478516, "global_step": 248344, "epoch": 2992} {"train_loss": -24.59769058227539, "global_step": 248345, "epoch": 2992} {"train_loss": -24.239444732666016, "global_step": 248346, "epoch": 2992} {"train_loss": -24.426424026489258, "global_step": 248347, "epoch": 2992} {"train_loss": -24.484037399291992, "global_step": 248348, "epoch": 2992} {"train_loss": -24.413129806518555, "global_step": 248349, "epoch": 2992} {"train_loss": -24.352264404296875, "global_step": 248350, "epoch": 2992} {"train_loss": -24.701171875, "global_step": 248351, "epoch": 2992} {"train_loss": -24.603635787963867, "global_step": 248352, "epoch": 2992} {"train_loss": -24.539752960205078, "global_step": 248353, "epoch": 2992} {"train_loss": -24.47670555114746, "global_step": 248354, "epoch": 2992} {"train_loss": -24.695215225219727, "global_step": 248355, "epoch": 2992} {"train_loss": -24.8283634185791, "global_step": 248356, "epoch": 2992} {"train_loss": -25.038671493530273, "global_step": 248357, "epoch": 2992} {"train_loss": -24.99591636657715, "global_step": 248358, "epoch": 2992} {"train_loss": -24.686960220336914, "global_step": 248359, "epoch": 2992} {"train_loss": -24.836164474487305, "global_step": 248360, "epoch": 2992} {"train_loss": -25.025896072387695, "global_step": 248361, "epoch": 2992} {"train_loss": -25.106796264648438, "global_step": 248362, "epoch": 2992} {"train_loss": -25.348302841186523, "global_step": 248363, "epoch": 2992} {"train_loss": -24.646093368530273, "global_step": 248364, "epoch": 2992} {"train_loss": -24.857328414916992, "global_step": 248365, "epoch": 2992} {"train_loss": -25.134695053100586, "global_step": 248366, "epoch": 2992} {"train_loss": -25.13149642944336, "global_step": 248367, "epoch": 2992} {"train_loss": -24.999555587768555, "global_step": 248368, "epoch": 2992} {"train_loss": -25.115774154663086, "global_step": 248369, "epoch": 2992} {"train_loss": -25.05867576599121, "global_step": 248370, "epoch": 2992} {"train_loss": -25.17535972595215, "global_step": 248371, "epoch": 2992} {"train_loss": -24.91300392150879, "global_step": 248372, "epoch": 2992} {"train_loss": -24.975757598876953, "global_step": 248373, "epoch": 2992} {"train_loss": -24.87502098083496, "global_step": 248374, "epoch": 2992} {"train_loss": -24.871992111206055, "global_step": 248375, "epoch": 2992} {"train_loss": -24.941619873046875, "global_step": 248376, "epoch": 2992} {"train_loss": -24.97098159790039, "global_step": 248377, "epoch": 2992} {"train_loss": -25.020599365234375, "global_step": 248378, "epoch": 2992} {"train_loss": -25.366064071655273, "global_step": 248379, "epoch": 2992} {"train_loss": -24.722562789916992, "global_step": 248380, "epoch": 2992} {"train_loss": -25.186437606811523, "global_step": 248381, "epoch": 2992} {"train_loss": -24.76734161376953, "global_step": 248382, "epoch": 2992} {"train_loss": -25.025880813598633, "global_step": 248383, "epoch": 2992} {"train_loss": -25.157163619995117, "global_step": 248384, "epoch": 2992} {"train_loss": -25.091886520385742, "global_step": 248385, "epoch": 2992} {"train_loss": -24.69044303894043, "global_step": 248386, "epoch": 2992} {"train_loss": -24.930953979492188, "global_step": 248387, "epoch": 2992} {"train_loss": -25.248857498168945, "global_step": 248388, "epoch": 2992} {"train_loss": -24.772796630859375, "global_step": 248389, "epoch": 2992} {"train_loss": -24.7177734375, "global_step": 248390, "epoch": 2992} {"train_loss": -24.6639461517334, "global_step": 248391, "epoch": 2992} {"train_loss": -25.294208526611328, "global_step": 248392, "epoch": 2992} {"train_loss": -25.070453643798828, "global_step": 248393, "epoch": 2992} {"train_loss": -25.14438819885254, "global_step": 248394, "epoch": 2992} {"train_loss": -24.863101959228516, "global_step": 248395, "epoch": 2992} {"train_loss": -25.376657485961914, "global_step": 248396, "epoch": 2992} {"train_loss": -25.28006935119629, "global_step": 248397, "epoch": 2992} {"train_loss": -25.063344955444336, "global_step": 248398, "epoch": 2992} {"train_loss": -24.709197998046875, "global_step": 248399, "epoch": 2992} {"train_loss": -24.770061492919922, "global_step": 248400, "epoch": 2992} {"train_loss": -25.19083023071289, "global_step": 248401, "epoch": 2992} {"train_loss": -25.17445945739746, "global_step": 248402, "epoch": 2992} {"train_loss": -25.215381622314453, "global_step": 248403, "epoch": 2992} {"train_loss": -25.100360870361328, "global_step": 248404, "epoch": 2992} {"train_loss": -25.06256103515625, "global_step": 248405, "epoch": 2992} {"train_loss": -24.90467643737793, "global_step": 248406, "epoch": 2992} {"train_loss": -25.266345977783203, "global_step": 248407, "epoch": 2992} {"train_loss": -25.133310317993164, "global_step": 248408, "epoch": 2992} {"train_loss": -25.14607048034668, "global_step": 248409, "epoch": 2992} {"train_loss": -24.855165481567383, "global_step": 248410, "epoch": 2992} {"train_loss": -25.245407104492188, "global_step": 248411, "epoch": 2992} {"train_loss": -25.268844604492188, "global_step": 248412, "epoch": 2992} {"train_loss": -25.065401077270508, "global_step": 248413, "epoch": 2992} {"train_loss": -25.117475509643555, "global_step": 248414, "epoch": 2992} {"train_loss": -25.15813636779785, "global_step": 248415, "epoch": 2992} {"train_loss": -25.020299911499023, "global_step": 248416, "epoch": 2992} {"train_loss": -24.6878719329834, "global_step": 248417, "epoch": 2992} {"train_loss": -24.84563211647861, "global_step": 248418, "epoch": 2992, "val_loss": 6982126.0} {"train_loss": -24.313989639282227, "global_step": 248419, "epoch": 2993} {"train_loss": -23.71103286743164, "global_step": 248420, "epoch": 2993} {"train_loss": -23.87347412109375, "global_step": 248421, "epoch": 2993} {"train_loss": -23.958860397338867, "global_step": 248422, "epoch": 2993} {"train_loss": -24.321256637573242, "global_step": 248423, "epoch": 2993} {"train_loss": -23.224210739135742, "global_step": 248424, "epoch": 2993} {"train_loss": -24.41768455505371, "global_step": 248425, "epoch": 2993} {"train_loss": -24.200788497924805, "global_step": 248426, "epoch": 2993} {"train_loss": -24.56669044494629, "global_step": 248427, "epoch": 2993} {"train_loss": -24.142677307128906, "global_step": 248428, "epoch": 2993} {"train_loss": -24.19036293029785, "global_step": 248429, "epoch": 2993} {"train_loss": -24.726726531982422, "global_step": 248430, "epoch": 2993} {"train_loss": -24.467702865600586, "global_step": 248431, "epoch": 2993} {"train_loss": -24.623680114746094, "global_step": 248432, "epoch": 2993} {"train_loss": -24.080793380737305, "global_step": 248433, "epoch": 2993} {"train_loss": -24.6013126373291, "global_step": 248434, "epoch": 2993} {"train_loss": -24.37334632873535, "global_step": 248435, "epoch": 2993} {"train_loss": -24.401636123657227, "global_step": 248436, "epoch": 2993} {"train_loss": -24.4799747467041, "global_step": 248437, "epoch": 2993} {"train_loss": -24.49903106689453, "global_step": 248438, "epoch": 2993} {"train_loss": -24.355443954467773, "global_step": 248439, "epoch": 2993} {"train_loss": -24.73328971862793, "global_step": 248440, "epoch": 2993} {"train_loss": -24.877246856689453, "global_step": 248441, "epoch": 2993} {"train_loss": -24.826889038085938, "global_step": 248442, "epoch": 2993} {"train_loss": -24.918792724609375, "global_step": 248443, "epoch": 2993} {"train_loss": -24.983732223510742, "global_step": 248444, "epoch": 2993} {"train_loss": -24.396224975585938, "global_step": 248445, "epoch": 2993} {"train_loss": -24.990447998046875, "global_step": 248446, "epoch": 2993} {"train_loss": -24.789785385131836, "global_step": 248447, "epoch": 2993} {"train_loss": -24.979141235351562, "global_step": 248448, "epoch": 2993} {"train_loss": -24.969667434692383, "global_step": 248449, "epoch": 2993} {"train_loss": -24.78458023071289, "global_step": 248450, "epoch": 2993} {"train_loss": -24.916961669921875, "global_step": 248451, "epoch": 2993} {"train_loss": -24.647476196289062, "global_step": 248452, "epoch": 2993} {"train_loss": -25.055856704711914, "global_step": 248453, "epoch": 2993} {"train_loss": -24.910812377929688, "global_step": 248454, "epoch": 2993} {"train_loss": -24.982389450073242, "global_step": 248455, "epoch": 2993} {"train_loss": -24.84772300720215, "global_step": 248456, "epoch": 2993} {"train_loss": -25.31822395324707, "global_step": 248457, "epoch": 2993} {"train_loss": -25.08673667907715, "global_step": 248458, "epoch": 2993} {"train_loss": -24.955501556396484, "global_step": 248459, "epoch": 2993} {"train_loss": -24.93692398071289, "global_step": 248460, "epoch": 2993} {"train_loss": -25.077550888061523, "global_step": 248461, "epoch": 2993} {"train_loss": -25.29253387451172, "global_step": 248462, "epoch": 2993} {"train_loss": -25.081247329711914, "global_step": 248463, "epoch": 2993} {"train_loss": -25.07216453552246, "global_step": 248464, "epoch": 2993} {"train_loss": -25.106754302978516, "global_step": 248465, "epoch": 2993} {"train_loss": -25.069095611572266, "global_step": 248466, "epoch": 2993} {"train_loss": -24.9608097076416, "global_step": 248467, "epoch": 2993} {"train_loss": -24.49786949157715, "global_step": 248468, "epoch": 2993} {"train_loss": -24.429515838623047, "global_step": 248469, "epoch": 2993} {"train_loss": -24.9853572845459, "global_step": 248470, "epoch": 2993} {"train_loss": -24.79780387878418, "global_step": 248471, "epoch": 2993} {"train_loss": -24.41898536682129, "global_step": 248472, "epoch": 2993} {"train_loss": -24.361358642578125, "global_step": 248473, "epoch": 2993} {"train_loss": -25.085432052612305, "global_step": 248474, "epoch": 2993} {"train_loss": -24.713516235351562, "global_step": 248475, "epoch": 2993} {"train_loss": -25.142118453979492, "global_step": 248476, "epoch": 2993} {"train_loss": -24.893821716308594, "global_step": 248477, "epoch": 2993} {"train_loss": -24.8095703125, "global_step": 248478, "epoch": 2993} {"train_loss": -24.90252685546875, "global_step": 248479, "epoch": 2993} {"train_loss": -24.933504104614258, "global_step": 248480, "epoch": 2993} {"train_loss": -24.806272506713867, "global_step": 248481, "epoch": 2993} {"train_loss": -24.971296310424805, "global_step": 248482, "epoch": 2993} {"train_loss": -25.041685104370117, "global_step": 248483, "epoch": 2993} {"train_loss": -24.69282341003418, "global_step": 248484, "epoch": 2993} {"train_loss": -24.979801177978516, "global_step": 248485, "epoch": 2993} {"train_loss": -24.933231353759766, "global_step": 248486, "epoch": 2993} {"train_loss": -24.507017135620117, "global_step": 248487, "epoch": 2993} {"train_loss": -24.876544952392578, "global_step": 248488, "epoch": 2993} {"train_loss": -24.846187591552734, "global_step": 248489, "epoch": 2993} {"train_loss": -24.829015731811523, "global_step": 248490, "epoch": 2993} {"train_loss": -25.2380313873291, "global_step": 248491, "epoch": 2993} {"train_loss": -25.011371612548828, "global_step": 248492, "epoch": 2993} {"train_loss": -25.574392318725586, "global_step": 248493, "epoch": 2993} {"train_loss": -24.903623580932617, "global_step": 248494, "epoch": 2993} {"train_loss": -25.045989990234375, "global_step": 248495, "epoch": 2993} {"train_loss": -25.0678768157959, "global_step": 248496, "epoch": 2993} {"train_loss": -25.12894630432129, "global_step": 248497, "epoch": 2993} {"train_loss": -25.101802825927734, "global_step": 248498, "epoch": 2993} {"train_loss": -24.88018798828125, "global_step": 248499, "epoch": 2993} {"train_loss": -25.614364624023438, "global_step": 248500, "epoch": 2993} {"train_loss": -24.756693989397533, "global_step": 248501, "epoch": 2993, "val_loss": 6861645.0} {"train_loss": -24.27206039428711, "global_step": 248502, "epoch": 2994} {"train_loss": -23.525299072265625, "global_step": 248503, "epoch": 2994} {"train_loss": -23.42037010192871, "global_step": 248504, "epoch": 2994} {"train_loss": -24.47421646118164, "global_step": 248505, "epoch": 2994} {"train_loss": -24.506120681762695, "global_step": 248506, "epoch": 2994} {"train_loss": -24.19980239868164, "global_step": 248507, "epoch": 2994} {"train_loss": -24.273365020751953, "global_step": 248508, "epoch": 2994} {"train_loss": -24.56954574584961, "global_step": 248509, "epoch": 2994} {"train_loss": -24.340587615966797, "global_step": 248510, "epoch": 2994} {"train_loss": -24.584125518798828, "global_step": 248511, "epoch": 2994} {"train_loss": -24.173269271850586, "global_step": 248512, "epoch": 2994} {"train_loss": -24.041227340698242, "global_step": 248513, "epoch": 2994} {"train_loss": -24.92303466796875, "global_step": 248514, "epoch": 2994} {"train_loss": -24.477182388305664, "global_step": 248515, "epoch": 2994} {"train_loss": -24.478572845458984, "global_step": 248516, "epoch": 2994} {"train_loss": -24.520057678222656, "global_step": 248517, "epoch": 2994} {"train_loss": -24.39789581298828, "global_step": 248518, "epoch": 2994} {"train_loss": -24.445823669433594, "global_step": 248519, "epoch": 2994} {"train_loss": -25.019723892211914, "global_step": 248520, "epoch": 2994} {"train_loss": -24.69610595703125, "global_step": 248521, "epoch": 2994} {"train_loss": -24.69260597229004, "global_step": 248522, "epoch": 2994} {"train_loss": -24.294204711914062, "global_step": 248523, "epoch": 2994} {"train_loss": -24.994739532470703, "global_step": 248524, "epoch": 2994} {"train_loss": -24.65919303894043, "global_step": 248525, "epoch": 2994} {"train_loss": -25.038129806518555, "global_step": 248526, "epoch": 2994} {"train_loss": -24.657155990600586, "global_step": 248527, "epoch": 2994} {"train_loss": -24.96280860900879, "global_step": 248528, "epoch": 2994} {"train_loss": -24.994657516479492, "global_step": 248529, "epoch": 2994} {"train_loss": -24.583328247070312, "global_step": 248530, "epoch": 2994} {"train_loss": -24.640146255493164, "global_step": 248531, "epoch": 2994} {"train_loss": -24.946516036987305, "global_step": 248532, "epoch": 2994} {"train_loss": -25.054227828979492, "global_step": 248533, "epoch": 2994} {"train_loss": -24.88111686706543, "global_step": 248534, "epoch": 2994} {"train_loss": -25.224287033081055, "global_step": 248535, "epoch": 2994} {"train_loss": -25.154037475585938, "global_step": 248536, "epoch": 2994} {"train_loss": -24.969314575195312, "global_step": 248537, "epoch": 2994} {"train_loss": -25.009845733642578, "global_step": 248538, "epoch": 2994} {"train_loss": -24.85697364807129, "global_step": 248539, "epoch": 2994} {"train_loss": -25.13333511352539, "global_step": 248540, "epoch": 2994} {"train_loss": -24.79732322692871, "global_step": 248541, "epoch": 2994} {"train_loss": -25.13372802734375, "global_step": 248542, "epoch": 2994} {"train_loss": -25.126041412353516, "global_step": 248543, "epoch": 2994} {"train_loss": -25.07880210876465, "global_step": 248544, "epoch": 2994} {"train_loss": -25.082782745361328, "global_step": 248545, "epoch": 2994} {"train_loss": -25.114490509033203, "global_step": 248546, "epoch": 2994} {"train_loss": -25.28792381286621, "global_step": 248547, "epoch": 2994} {"train_loss": -25.32796287536621, "global_step": 248548, "epoch": 2994} {"train_loss": -25.090269088745117, "global_step": 248549, "epoch": 2994} {"train_loss": -25.108448028564453, "global_step": 248550, "epoch": 2994} {"train_loss": -25.259849548339844, "global_step": 248551, "epoch": 2994} {"train_loss": -25.22035026550293, "global_step": 248552, "epoch": 2994} {"train_loss": -24.8154296875, "global_step": 248553, "epoch": 2994} {"train_loss": -25.260929107666016, "global_step": 248554, "epoch": 2994} {"train_loss": -25.260160446166992, "global_step": 248555, "epoch": 2994} {"train_loss": -24.98383903503418, "global_step": 248556, "epoch": 2994} {"train_loss": -25.425378799438477, "global_step": 248557, "epoch": 2994} {"train_loss": -25.116003036499023, "global_step": 248558, "epoch": 2994} {"train_loss": -25.172561645507812, "global_step": 248559, "epoch": 2994} {"train_loss": -25.19989013671875, "global_step": 248560, "epoch": 2994} {"train_loss": -25.260602951049805, "global_step": 248561, "epoch": 2994} {"train_loss": -24.45631980895996, "global_step": 248562, "epoch": 2994} {"train_loss": -25.244855880737305, "global_step": 248563, "epoch": 2994} {"train_loss": -25.15421485900879, "global_step": 248564, "epoch": 2994} {"train_loss": -25.133291244506836, "global_step": 248565, "epoch": 2994} {"train_loss": -25.212369918823242, "global_step": 248566, "epoch": 2994} {"train_loss": -24.570337295532227, "global_step": 248567, "epoch": 2994} {"train_loss": -24.575252532958984, "global_step": 248568, "epoch": 2994} {"train_loss": -24.949600219726562, "global_step": 248569, "epoch": 2994} {"train_loss": -24.4085750579834, "global_step": 248570, "epoch": 2994} {"train_loss": -24.662961959838867, "global_step": 248571, "epoch": 2994} {"train_loss": -24.91097068786621, "global_step": 248572, "epoch": 2994} {"train_loss": -25.0974178314209, "global_step": 248573, "epoch": 2994} {"train_loss": -25.02878761291504, "global_step": 248574, "epoch": 2994} {"train_loss": -24.785858154296875, "global_step": 248575, "epoch": 2994} {"train_loss": -25.055374145507812, "global_step": 248576, "epoch": 2994} {"train_loss": -24.4895076751709, "global_step": 248577, "epoch": 2994} {"train_loss": -25.03750991821289, "global_step": 248578, "epoch": 2994} {"train_loss": -25.377992630004883, "global_step": 248579, "epoch": 2994} {"train_loss": -24.46908950805664, "global_step": 248580, "epoch": 2994} {"train_loss": -24.892362594604492, "global_step": 248581, "epoch": 2994} {"train_loss": -24.8365421295166, "global_step": 248582, "epoch": 2994} {"train_loss": -24.7205753326416, "global_step": 248583, "epoch": 2994} {"train_loss": -24.81117131336626, "global_step": 248584, "epoch": 2994, "val_loss": 6869717.0} {"train_loss": -24.372661590576172, "global_step": 248585, "epoch": 2995} {"train_loss": -24.62702751159668, "global_step": 248586, "epoch": 2995} {"train_loss": -24.410919189453125, "global_step": 248587, "epoch": 2995} {"train_loss": -24.834035873413086, "global_step": 248588, "epoch": 2995} {"train_loss": -25.144094467163086, "global_step": 248589, "epoch": 2995} {"train_loss": -25.14560317993164, "global_step": 248590, "epoch": 2995} {"train_loss": -24.877246856689453, "global_step": 248591, "epoch": 2995} {"train_loss": -24.889244079589844, "global_step": 248592, "epoch": 2995} {"train_loss": -24.68865966796875, "global_step": 248593, "epoch": 2995} {"train_loss": -25.133846282958984, "global_step": 248594, "epoch": 2995} {"train_loss": -25.02605438232422, "global_step": 248595, "epoch": 2995} {"train_loss": -25.1270809173584, "global_step": 248596, "epoch": 2995} {"train_loss": -24.87470054626465, "global_step": 248597, "epoch": 2995} {"train_loss": -25.199914932250977, "global_step": 248598, "epoch": 2995} {"train_loss": -24.760122299194336, "global_step": 248599, "epoch": 2995} {"train_loss": -24.814363479614258, "global_step": 248600, "epoch": 2995} {"train_loss": -25.09773063659668, "global_step": 248601, "epoch": 2995} {"train_loss": -24.961545944213867, "global_step": 248602, "epoch": 2995} {"train_loss": -25.37116813659668, "global_step": 248603, "epoch": 2995} {"train_loss": -25.134023666381836, "global_step": 248604, "epoch": 2995} {"train_loss": -24.908275604248047, "global_step": 248605, "epoch": 2995} {"train_loss": -25.055883407592773, "global_step": 248606, "epoch": 2995} {"train_loss": -24.916833877563477, "global_step": 248607, "epoch": 2995} {"train_loss": -25.105247497558594, "global_step": 248608, "epoch": 2995} {"train_loss": -24.998926162719727, "global_step": 248609, "epoch": 2995} {"train_loss": -24.75275230407715, "global_step": 248610, "epoch": 2995} {"train_loss": -25.39669418334961, "global_step": 248611, "epoch": 2995} {"train_loss": -25.228822708129883, "global_step": 248612, "epoch": 2995} {"train_loss": -24.980379104614258, "global_step": 248613, "epoch": 2995} {"train_loss": -25.429662704467773, "global_step": 248614, "epoch": 2995} {"train_loss": -25.258575439453125, "global_step": 248615, "epoch": 2995} {"train_loss": -25.227718353271484, "global_step": 248616, "epoch": 2995} {"train_loss": -25.18804931640625, "global_step": 248617, "epoch": 2995} {"train_loss": -25.221731185913086, "global_step": 248618, "epoch": 2995} {"train_loss": -25.185394287109375, "global_step": 248619, "epoch": 2995} {"train_loss": -24.99811363220215, "global_step": 248620, "epoch": 2995} {"train_loss": -25.08609962463379, "global_step": 248621, "epoch": 2995} {"train_loss": -25.395492553710938, "global_step": 248622, "epoch": 2995} {"train_loss": -25.29756736755371, "global_step": 248623, "epoch": 2995} {"train_loss": -25.176942825317383, "global_step": 248624, "epoch": 2995} {"train_loss": -25.39999771118164, "global_step": 248625, "epoch": 2995} {"train_loss": -24.994461059570312, "global_step": 248626, "epoch": 2995} {"train_loss": -24.994644165039062, "global_step": 248627, "epoch": 2995} {"train_loss": -24.96938133239746, "global_step": 248628, "epoch": 2995} {"train_loss": -25.33918571472168, "global_step": 248629, "epoch": 2995} {"train_loss": -25.10993003845215, "global_step": 248630, "epoch": 2995} {"train_loss": -25.123525619506836, "global_step": 248631, "epoch": 2995} {"train_loss": -25.11094856262207, "global_step": 248632, "epoch": 2995} {"train_loss": -24.581525802612305, "global_step": 248633, "epoch": 2995} {"train_loss": -24.24913787841797, "global_step": 248634, "epoch": 2995} {"train_loss": -24.277034759521484, "global_step": 248635, "epoch": 2995} {"train_loss": -24.88075065612793, "global_step": 248636, "epoch": 2995} {"train_loss": -24.908672332763672, "global_step": 248637, "epoch": 2995} {"train_loss": -24.902978897094727, "global_step": 248638, "epoch": 2995} {"train_loss": -24.742624282836914, "global_step": 248639, "epoch": 2995} {"train_loss": -25.029865264892578, "global_step": 248640, "epoch": 2995} {"train_loss": -25.10607147216797, "global_step": 248641, "epoch": 2995} {"train_loss": -24.984954833984375, "global_step": 248642, "epoch": 2995} {"train_loss": -24.773672103881836, "global_step": 248643, "epoch": 2995} {"train_loss": -24.96071434020996, "global_step": 248644, "epoch": 2995} {"train_loss": -24.941486358642578, "global_step": 248645, "epoch": 2995} {"train_loss": -24.54619026184082, "global_step": 248646, "epoch": 2995} {"train_loss": -24.937198638916016, "global_step": 248647, "epoch": 2995} {"train_loss": -25.094396591186523, "global_step": 248648, "epoch": 2995} {"train_loss": -24.903757095336914, "global_step": 248649, "epoch": 2995} {"train_loss": -24.66407012939453, "global_step": 248650, "epoch": 2995} {"train_loss": -25.088394165039062, "global_step": 248651, "epoch": 2995} {"train_loss": -25.09528350830078, "global_step": 248652, "epoch": 2995} {"train_loss": -24.81063461303711, "global_step": 248653, "epoch": 2995} {"train_loss": -25.076847076416016, "global_step": 248654, "epoch": 2995} {"train_loss": -25.184247970581055, "global_step": 248655, "epoch": 2995} {"train_loss": -24.967885971069336, "global_step": 248656, "epoch": 2995} {"train_loss": -25.123498916625977, "global_step": 248657, "epoch": 2995} {"train_loss": -24.85181999206543, "global_step": 248658, "epoch": 2995} {"train_loss": -25.060108184814453, "global_step": 248659, "epoch": 2995} {"train_loss": -25.06962776184082, "global_step": 248660, "epoch": 2995} {"train_loss": -25.155319213867188, "global_step": 248661, "epoch": 2995} {"train_loss": -24.842294692993164, "global_step": 248662, "epoch": 2995} {"train_loss": -24.797971725463867, "global_step": 248663, "epoch": 2995} {"train_loss": -25.021076202392578, "global_step": 248664, "epoch": 2995} {"train_loss": -25.217756271362305, "global_step": 248665, "epoch": 2995} {"train_loss": -24.970840454101562, "global_step": 248666, "epoch": 2995} {"train_loss": -25.003183985330974, "global_step": 248667, "epoch": 2995, "val_loss": 6817951.0} {"train_loss": -24.667984008789062, "global_step": 248668, "epoch": 2996} {"train_loss": -24.668792724609375, "global_step": 248669, "epoch": 2996} {"train_loss": -24.786331176757812, "global_step": 248670, "epoch": 2996} {"train_loss": -24.591882705688477, "global_step": 248671, "epoch": 2996} {"train_loss": -25.044158935546875, "global_step": 248672, "epoch": 2996} {"train_loss": -24.428823471069336, "global_step": 248673, "epoch": 2996} {"train_loss": -24.40363121032715, "global_step": 248674, "epoch": 2996} {"train_loss": -24.526384353637695, "global_step": 248675, "epoch": 2996} {"train_loss": -24.982160568237305, "global_step": 248676, "epoch": 2996} {"train_loss": -24.535959243774414, "global_step": 248677, "epoch": 2996} {"train_loss": -24.576047897338867, "global_step": 248678, "epoch": 2996} {"train_loss": -24.598356246948242, "global_step": 248679, "epoch": 2996} {"train_loss": -24.558584213256836, "global_step": 248680, "epoch": 2996} {"train_loss": -24.785886764526367, "global_step": 248681, "epoch": 2996} {"train_loss": -24.3983097076416, "global_step": 248682, "epoch": 2996} {"train_loss": -24.90006446838379, "global_step": 248683, "epoch": 2996} {"train_loss": -24.86756706237793, "global_step": 248684, "epoch": 2996} {"train_loss": -24.86871910095215, "global_step": 248685, "epoch": 2996} {"train_loss": -25.05398941040039, "global_step": 248686, "epoch": 2996} {"train_loss": -24.054792404174805, "global_step": 248687, "epoch": 2996} {"train_loss": -25.161043167114258, "global_step": 248688, "epoch": 2996} {"train_loss": -24.830665588378906, "global_step": 248689, "epoch": 2996} {"train_loss": -24.447477340698242, "global_step": 248690, "epoch": 2996} {"train_loss": -24.616374969482422, "global_step": 248691, "epoch": 2996} {"train_loss": -24.80031394958496, "global_step": 248692, "epoch": 2996} {"train_loss": -24.769826889038086, "global_step": 248693, "epoch": 2996} {"train_loss": -24.741384506225586, "global_step": 248694, "epoch": 2996} {"train_loss": -24.967002868652344, "global_step": 248695, "epoch": 2996} {"train_loss": -24.752344131469727, "global_step": 248696, "epoch": 2996} {"train_loss": -24.68503761291504, "global_step": 248697, "epoch": 2996} {"train_loss": -24.973011016845703, "global_step": 248698, "epoch": 2996} {"train_loss": -24.930837631225586, "global_step": 248699, "epoch": 2996} {"train_loss": -24.886232376098633, "global_step": 248700, "epoch": 2996} {"train_loss": -25.27142333984375, "global_step": 248701, "epoch": 2996} {"train_loss": -24.641122817993164, "global_step": 248702, "epoch": 2996} {"train_loss": -24.208776473999023, "global_step": 248703, "epoch": 2996} {"train_loss": -24.22693634033203, "global_step": 248704, "epoch": 2996} {"train_loss": -24.952857971191406, "global_step": 248705, "epoch": 2996} {"train_loss": -24.890954971313477, "global_step": 248706, "epoch": 2996} {"train_loss": -24.84352684020996, "global_step": 248707, "epoch": 2996} {"train_loss": -25.193363189697266, "global_step": 248708, "epoch": 2996} {"train_loss": -24.67978858947754, "global_step": 248709, "epoch": 2996} {"train_loss": -25.045564651489258, "global_step": 248710, "epoch": 2996} {"train_loss": -24.41204261779785, "global_step": 248711, "epoch": 2996} {"train_loss": -25.231903076171875, "global_step": 248712, "epoch": 2996} {"train_loss": -24.56793785095215, "global_step": 248713, "epoch": 2996} {"train_loss": -24.929872512817383, "global_step": 248714, "epoch": 2996} {"train_loss": -24.980365753173828, "global_step": 248715, "epoch": 2996} {"train_loss": -25.05866050720215, "global_step": 248716, "epoch": 2996} {"train_loss": -24.557584762573242, "global_step": 248717, "epoch": 2996} {"train_loss": -25.007797241210938, "global_step": 248718, "epoch": 2996} {"train_loss": -25.009801864624023, "global_step": 248719, "epoch": 2996} {"train_loss": -25.05209732055664, "global_step": 248720, "epoch": 2996} {"train_loss": -25.2500057220459, "global_step": 248721, "epoch": 2996} {"train_loss": -25.1878662109375, "global_step": 248722, "epoch": 2996} {"train_loss": -24.985626220703125, "global_step": 248723, "epoch": 2996} {"train_loss": -24.827518463134766, "global_step": 248724, "epoch": 2996} {"train_loss": -24.91526222229004, "global_step": 248725, "epoch": 2996} {"train_loss": -24.733327865600586, "global_step": 248726, "epoch": 2996} {"train_loss": -25.23557472229004, "global_step": 248727, "epoch": 2996} {"train_loss": -25.05267906188965, "global_step": 248728, "epoch": 2996} {"train_loss": -24.940067291259766, "global_step": 248729, "epoch": 2996} {"train_loss": -25.154430389404297, "global_step": 248730, "epoch": 2996} {"train_loss": -25.145124435424805, "global_step": 248731, "epoch": 2996} {"train_loss": -25.07984733581543, "global_step": 248732, "epoch": 2996} {"train_loss": -24.998281478881836, "global_step": 248733, "epoch": 2996} {"train_loss": -25.40097427368164, "global_step": 248734, "epoch": 2996} {"train_loss": -24.828632354736328, "global_step": 248735, "epoch": 2996} {"train_loss": -25.11581039428711, "global_step": 248736, "epoch": 2996} {"train_loss": -24.93549346923828, "global_step": 248737, "epoch": 2996} {"train_loss": -25.109251022338867, "global_step": 248738, "epoch": 2996} {"train_loss": -25.250608444213867, "global_step": 248739, "epoch": 2996} {"train_loss": -24.776330947875977, "global_step": 248740, "epoch": 2996} {"train_loss": -24.935178756713867, "global_step": 248741, "epoch": 2996} {"train_loss": -25.10383415222168, "global_step": 248742, "epoch": 2996} {"train_loss": -25.063894271850586, "global_step": 248743, "epoch": 2996} {"train_loss": -24.934946060180664, "global_step": 248744, "epoch": 2996} {"train_loss": -24.936073303222656, "global_step": 248745, "epoch": 2996} {"train_loss": -25.046262741088867, "global_step": 248746, "epoch": 2996} {"train_loss": -25.29347038269043, "global_step": 248747, "epoch": 2996} {"train_loss": -25.00033187866211, "global_step": 248748, "epoch": 2996} {"train_loss": -24.816112518310547, "global_step": 248749, "epoch": 2996} {"train_loss": -24.869078509778863, "global_step": 248750, "epoch": 2996, "val_loss": 6829493.0} {"train_loss": -24.846166610717773, "global_step": 248751, "epoch": 2997} {"train_loss": -24.941654205322266, "global_step": 248752, "epoch": 2997} {"train_loss": -24.374034881591797, "global_step": 248753, "epoch": 2997} {"train_loss": -24.996959686279297, "global_step": 248754, "epoch": 2997} {"train_loss": -24.90114402770996, "global_step": 248755, "epoch": 2997} {"train_loss": -24.743906021118164, "global_step": 248756, "epoch": 2997} {"train_loss": -24.79439926147461, "global_step": 248757, "epoch": 2997} {"train_loss": -25.172956466674805, "global_step": 248758, "epoch": 2997} {"train_loss": -24.63238525390625, "global_step": 248759, "epoch": 2997} {"train_loss": -25.063526153564453, "global_step": 248760, "epoch": 2997} {"train_loss": -25.183761596679688, "global_step": 248761, "epoch": 2997} {"train_loss": -24.828222274780273, "global_step": 248762, "epoch": 2997} {"train_loss": -24.485187530517578, "global_step": 248763, "epoch": 2997} {"train_loss": -25.049222946166992, "global_step": 248764, "epoch": 2997} {"train_loss": -24.657983779907227, "global_step": 248765, "epoch": 2997} {"train_loss": -24.69748878479004, "global_step": 248766, "epoch": 2997} {"train_loss": -24.98160743713379, "global_step": 248767, "epoch": 2997} {"train_loss": -25.011369705200195, "global_step": 248768, "epoch": 2997} {"train_loss": -24.745243072509766, "global_step": 248769, "epoch": 2997} {"train_loss": -25.49966049194336, "global_step": 248770, "epoch": 2997} {"train_loss": -24.974767684936523, "global_step": 248771, "epoch": 2997} {"train_loss": -24.777856826782227, "global_step": 248772, "epoch": 2997} {"train_loss": -25.141380310058594, "global_step": 248773, "epoch": 2997} {"train_loss": -24.838186264038086, "global_step": 248774, "epoch": 2997} {"train_loss": -25.13240623474121, "global_step": 248775, "epoch": 2997} {"train_loss": -25.10896110534668, "global_step": 248776, "epoch": 2997} {"train_loss": -25.01555633544922, "global_step": 248777, "epoch": 2997} {"train_loss": -24.877044677734375, "global_step": 248778, "epoch": 2997} {"train_loss": -25.587371826171875, "global_step": 248779, "epoch": 2997} {"train_loss": -25.215261459350586, "global_step": 248780, "epoch": 2997} {"train_loss": -25.179136276245117, "global_step": 248781, "epoch": 2997} {"train_loss": -25.202781677246094, "global_step": 248782, "epoch": 2997} {"train_loss": -25.1049861907959, "global_step": 248783, "epoch": 2997} {"train_loss": -24.964706420898438, "global_step": 248784, "epoch": 2997} {"train_loss": -25.481857299804688, "global_step": 248785, "epoch": 2997} {"train_loss": -25.226497650146484, "global_step": 248786, "epoch": 2997} {"train_loss": -24.95261001586914, "global_step": 248787, "epoch": 2997} {"train_loss": -24.902135848999023, "global_step": 248788, "epoch": 2997} {"train_loss": -24.861677169799805, "global_step": 248789, "epoch": 2997} {"train_loss": -24.970163345336914, "global_step": 248790, "epoch": 2997} {"train_loss": -24.856903076171875, "global_step": 248791, "epoch": 2997} {"train_loss": -24.869178771972656, "global_step": 248792, "epoch": 2997} {"train_loss": -25.01630401611328, "global_step": 248793, "epoch": 2997} {"train_loss": -24.887130737304688, "global_step": 248794, "epoch": 2997} {"train_loss": -25.089740753173828, "global_step": 248795, "epoch": 2997} {"train_loss": -25.308515548706055, "global_step": 248796, "epoch": 2997} {"train_loss": -25.114532470703125, "global_step": 248797, "epoch": 2997} {"train_loss": -24.907989501953125, "global_step": 248798, "epoch": 2997} {"train_loss": -25.103172302246094, "global_step": 248799, "epoch": 2997} {"train_loss": -24.932954788208008, "global_step": 248800, "epoch": 2997} {"train_loss": -25.30118751525879, "global_step": 248801, "epoch": 2997} {"train_loss": -25.367473602294922, "global_step": 248802, "epoch": 2997} {"train_loss": -24.961172103881836, "global_step": 248803, "epoch": 2997} {"train_loss": -24.82653045654297, "global_step": 248804, "epoch": 2997} {"train_loss": -24.846694946289062, "global_step": 248805, "epoch": 2997} {"train_loss": -24.9449520111084, "global_step": 248806, "epoch": 2997} {"train_loss": -25.15198516845703, "global_step": 248807, "epoch": 2997} {"train_loss": -25.282501220703125, "global_step": 248808, "epoch": 2997} {"train_loss": -25.064390182495117, "global_step": 248809, "epoch": 2997} {"train_loss": -25.017820358276367, "global_step": 248810, "epoch": 2997} {"train_loss": -24.660579681396484, "global_step": 248811, "epoch": 2997} {"train_loss": -24.93715476989746, "global_step": 248812, "epoch": 2997} {"train_loss": -25.16669273376465, "global_step": 248813, "epoch": 2997} {"train_loss": -24.7083683013916, "global_step": 248814, "epoch": 2997} {"train_loss": -25.066946029663086, "global_step": 248815, "epoch": 2997} {"train_loss": -24.703781127929688, "global_step": 248816, "epoch": 2997} {"train_loss": -24.801677703857422, "global_step": 248817, "epoch": 2997} {"train_loss": -24.86165428161621, "global_step": 248818, "epoch": 2997} {"train_loss": -24.84320640563965, "global_step": 248819, "epoch": 2997} {"train_loss": -24.7142276763916, "global_step": 248820, "epoch": 2997} {"train_loss": -25.135913848876953, "global_step": 248821, "epoch": 2997} {"train_loss": -24.92949676513672, "global_step": 248822, "epoch": 2997} {"train_loss": -24.9965877532959, "global_step": 248823, "epoch": 2997} {"train_loss": -25.169795989990234, "global_step": 248824, "epoch": 2997} {"train_loss": -25.058353424072266, "global_step": 248825, "epoch": 2997} {"train_loss": -25.190092086791992, "global_step": 248826, "epoch": 2997} {"train_loss": -24.992090225219727, "global_step": 248827, "epoch": 2997} {"train_loss": -25.285457611083984, "global_step": 248828, "epoch": 2997} {"train_loss": -25.431488037109375, "global_step": 248829, "epoch": 2997} {"train_loss": -24.97325325012207, "global_step": 248830, "epoch": 2997} {"train_loss": -25.283639907836914, "global_step": 248831, "epoch": 2997} {"train_loss": -25.364791870117188, "global_step": 248832, "epoch": 2997} {"train_loss": -25.00992616400661, "global_step": 248833, "epoch": 2997, "val_loss": 6907248.0} {"train_loss": -24.609384536743164, "global_step": 248834, "epoch": 2998} {"train_loss": -25.047292709350586, "global_step": 248835, "epoch": 2998} {"train_loss": -24.82493782043457, "global_step": 248836, "epoch": 2998} {"train_loss": -24.878707885742188, "global_step": 248837, "epoch": 2998} {"train_loss": -24.844818115234375, "global_step": 248838, "epoch": 2998} {"train_loss": -24.794504165649414, "global_step": 248839, "epoch": 2998} {"train_loss": -24.939035415649414, "global_step": 248840, "epoch": 2998} {"train_loss": -24.56818199157715, "global_step": 248841, "epoch": 2998} {"train_loss": -25.060644149780273, "global_step": 248842, "epoch": 2998} {"train_loss": -24.644371032714844, "global_step": 248843, "epoch": 2998} {"train_loss": -24.749103546142578, "global_step": 248844, "epoch": 2998} {"train_loss": -24.918899536132812, "global_step": 248845, "epoch": 2998} {"train_loss": -24.809125900268555, "global_step": 248846, "epoch": 2998} {"train_loss": -24.7601261138916, "global_step": 248847, "epoch": 2998} {"train_loss": -25.2025146484375, "global_step": 248848, "epoch": 2998} {"train_loss": -24.91566276550293, "global_step": 248849, "epoch": 2998} {"train_loss": -24.87490463256836, "global_step": 248850, "epoch": 2998} {"train_loss": -24.84522819519043, "global_step": 248851, "epoch": 2998} {"train_loss": -25.069576263427734, "global_step": 248852, "epoch": 2998} {"train_loss": -24.87165069580078, "global_step": 248853, "epoch": 2998} {"train_loss": -24.986804962158203, "global_step": 248854, "epoch": 2998} {"train_loss": -25.001962661743164, "global_step": 248855, "epoch": 2998} {"train_loss": -24.821674346923828, "global_step": 248856, "epoch": 2998} {"train_loss": -25.117650985717773, "global_step": 248857, "epoch": 2998} {"train_loss": -24.979406356811523, "global_step": 248858, "epoch": 2998} {"train_loss": -24.822174072265625, "global_step": 248859, "epoch": 2998} {"train_loss": -25.071884155273438, "global_step": 248860, "epoch": 2998} {"train_loss": -25.30069351196289, "global_step": 248861, "epoch": 2998} {"train_loss": -25.431177139282227, "global_step": 248862, "epoch": 2998} {"train_loss": -25.484596252441406, "global_step": 248863, "epoch": 2998} {"train_loss": -25.207908630371094, "global_step": 248864, "epoch": 2998} {"train_loss": -25.18011474609375, "global_step": 248865, "epoch": 2998} {"train_loss": -25.11395835876465, "global_step": 248866, "epoch": 2998} {"train_loss": -25.16478157043457, "global_step": 248867, "epoch": 2998} {"train_loss": -25.09160804748535, "global_step": 248868, "epoch": 2998} {"train_loss": -25.067529678344727, "global_step": 248869, "epoch": 2998} {"train_loss": -25.116361618041992, "global_step": 248870, "epoch": 2998} {"train_loss": -25.186878204345703, "global_step": 248871, "epoch": 2998} {"train_loss": -25.2871150970459, "global_step": 248872, "epoch": 2998} {"train_loss": -25.259586334228516, "global_step": 248873, "epoch": 2998} {"train_loss": -25.328475952148438, "global_step": 248874, "epoch": 2998} {"train_loss": -25.011808395385742, "global_step": 248875, "epoch": 2998} {"train_loss": -24.71965980529785, "global_step": 248876, "epoch": 2998} {"train_loss": -25.336217880249023, "global_step": 248877, "epoch": 2998} {"train_loss": -24.71912956237793, "global_step": 248878, "epoch": 2998} {"train_loss": -25.395715713500977, "global_step": 248879, "epoch": 2998} {"train_loss": -24.98256492614746, "global_step": 248880, "epoch": 2998} {"train_loss": -25.14325714111328, "global_step": 248881, "epoch": 2998} {"train_loss": -25.102466583251953, "global_step": 248882, "epoch": 2998} {"train_loss": -24.67537498474121, "global_step": 248883, "epoch": 2998} {"train_loss": -24.94660758972168, "global_step": 248884, "epoch": 2998} {"train_loss": -24.81537437438965, "global_step": 248885, "epoch": 2998} {"train_loss": -25.049680709838867, "global_step": 248886, "epoch": 2998} {"train_loss": -24.82501792907715, "global_step": 248887, "epoch": 2998} {"train_loss": -24.828847885131836, "global_step": 248888, "epoch": 2998} {"train_loss": -24.772390365600586, "global_step": 248889, "epoch": 2998} {"train_loss": -25.186065673828125, "global_step": 248890, "epoch": 2998} {"train_loss": -25.433704376220703, "global_step": 248891, "epoch": 2998} {"train_loss": -24.821687698364258, "global_step": 248892, "epoch": 2998} {"train_loss": -24.983592987060547, "global_step": 248893, "epoch": 2998} {"train_loss": -24.973602294921875, "global_step": 248894, "epoch": 2998} {"train_loss": -24.623485565185547, "global_step": 248895, "epoch": 2998} {"train_loss": -25.11881446838379, "global_step": 248896, "epoch": 2998} {"train_loss": -24.916240692138672, "global_step": 248897, "epoch": 2998} {"train_loss": -25.170223236083984, "global_step": 248898, "epoch": 2998} {"train_loss": -25.38726234436035, "global_step": 248899, "epoch": 2998} {"train_loss": -24.861486434936523, "global_step": 248900, "epoch": 2998} {"train_loss": -25.399627685546875, "global_step": 248901, "epoch": 2998} {"train_loss": -25.025222778320312, "global_step": 248902, "epoch": 2998} {"train_loss": -25.127471923828125, "global_step": 248903, "epoch": 2998} {"train_loss": -24.952733993530273, "global_step": 248904, "epoch": 2998} {"train_loss": -25.084192276000977, "global_step": 248905, "epoch": 2998} {"train_loss": -24.71197509765625, "global_step": 248906, "epoch": 2998} {"train_loss": -24.971790313720703, "global_step": 248907, "epoch": 2998} {"train_loss": -24.7634220123291, "global_step": 248908, "epoch": 2998} {"train_loss": -25.063379287719727, "global_step": 248909, "epoch": 2998} {"train_loss": -25.072265625, "global_step": 248910, "epoch": 2998} {"train_loss": -25.45249366760254, "global_step": 248911, "epoch": 2998} {"train_loss": -25.315357208251953, "global_step": 248912, "epoch": 2998} {"train_loss": -24.975797653198242, "global_step": 248913, "epoch": 2998} {"train_loss": -24.8523006439209, "global_step": 248914, "epoch": 2998} {"train_loss": -25.109695434570312, "global_step": 248915, "epoch": 2998} {"train_loss": -24.995432773268366, "global_step": 248916, "epoch": 2998, "val_loss": 6818987.0} {"train_loss": -24.720720291137695, "global_step": 248917, "epoch": 2999} {"train_loss": -24.77849769592285, "global_step": 248918, "epoch": 2999} {"train_loss": -24.88783073425293, "global_step": 248919, "epoch": 2999} {"train_loss": -25.187503814697266, "global_step": 248920, "epoch": 2999} {"train_loss": -24.48516082763672, "global_step": 248921, "epoch": 2999} {"train_loss": -24.642763137817383, "global_step": 248922, "epoch": 2999} {"train_loss": -24.95460319519043, "global_step": 248923, "epoch": 2999} {"train_loss": -24.269289016723633, "global_step": 248924, "epoch": 2999} {"train_loss": -24.548444747924805, "global_step": 248925, "epoch": 2999} {"train_loss": -24.999399185180664, "global_step": 248926, "epoch": 2999} {"train_loss": -24.977750778198242, "global_step": 248927, "epoch": 2999} {"train_loss": -24.748380661010742, "global_step": 248928, "epoch": 2999} {"train_loss": -24.585140228271484, "global_step": 248929, "epoch": 2999} {"train_loss": -24.827611923217773, "global_step": 248930, "epoch": 2999} {"train_loss": -25.06548309326172, "global_step": 248931, "epoch": 2999} {"train_loss": -24.673980712890625, "global_step": 248932, "epoch": 2999} {"train_loss": -24.83135414123535, "global_step": 248933, "epoch": 2999} {"train_loss": -24.989887237548828, "global_step": 248934, "epoch": 2999} {"train_loss": -24.875293731689453, "global_step": 248935, "epoch": 2999} {"train_loss": -24.722652435302734, "global_step": 248936, "epoch": 2999} {"train_loss": -24.605499267578125, "global_step": 248937, "epoch": 2999} {"train_loss": -24.85791778564453, "global_step": 248938, "epoch": 2999} {"train_loss": -24.2659912109375, "global_step": 248939, "epoch": 2999} {"train_loss": -24.942846298217773, "global_step": 248940, "epoch": 2999} {"train_loss": -24.684682846069336, "global_step": 248941, "epoch": 2999} {"train_loss": -24.881921768188477, "global_step": 248942, "epoch": 2999} {"train_loss": -25.116992950439453, "global_step": 248943, "epoch": 2999} {"train_loss": -24.827157974243164, "global_step": 248944, "epoch": 2999} {"train_loss": -24.872934341430664, "global_step": 248945, "epoch": 2999} {"train_loss": -24.456314086914062, "global_step": 248946, "epoch": 2999} {"train_loss": -24.983280181884766, "global_step": 248947, "epoch": 2999} {"train_loss": -24.88481330871582, "global_step": 248948, "epoch": 2999} {"train_loss": -24.877918243408203, "global_step": 248949, "epoch": 2999} {"train_loss": -24.936452865600586, "global_step": 248950, "epoch": 2999} {"train_loss": -24.963623046875, "global_step": 248951, "epoch": 2999} {"train_loss": -24.999744415283203, "global_step": 248952, "epoch": 2999} {"train_loss": -24.779926300048828, "global_step": 248953, "epoch": 2999} {"train_loss": -24.76474380493164, "global_step": 248954, "epoch": 2999} {"train_loss": -24.738218307495117, "global_step": 248955, "epoch": 2999} {"train_loss": -25.152769088745117, "global_step": 248956, "epoch": 2999} {"train_loss": -24.91315269470215, "global_step": 248957, "epoch": 2999} {"train_loss": -24.721698760986328, "global_step": 248958, "epoch": 2999} {"train_loss": -25.07209587097168, "global_step": 248959, "epoch": 2999} {"train_loss": -25.165363311767578, "global_step": 248960, "epoch": 2999} {"train_loss": -24.734222412109375, "global_step": 248961, "epoch": 2999} {"train_loss": -25.25773048400879, "global_step": 248962, "epoch": 2999} {"train_loss": -24.981693267822266, "global_step": 248963, "epoch": 2999} {"train_loss": -24.648284912109375, "global_step": 248964, "epoch": 2999} {"train_loss": -24.96285057067871, "global_step": 248965, "epoch": 2999} {"train_loss": -24.846637725830078, "global_step": 248966, "epoch": 2999} {"train_loss": -24.9364013671875, "global_step": 248967, "epoch": 2999} {"train_loss": -24.61745262145996, "global_step": 248968, "epoch": 2999} {"train_loss": -24.276611328125, "global_step": 248969, "epoch": 2999} {"train_loss": -25.058515548706055, "global_step": 248970, "epoch": 2999} {"train_loss": -25.292236328125, "global_step": 248971, "epoch": 2999} {"train_loss": -24.920438766479492, "global_step": 248972, "epoch": 2999} {"train_loss": -25.066516876220703, "global_step": 248973, "epoch": 2999} {"train_loss": -24.856969833374023, "global_step": 248974, "epoch": 2999} {"train_loss": -24.9081974029541, "global_step": 248975, "epoch": 2999} {"train_loss": -24.92464828491211, "global_step": 248976, "epoch": 2999} {"train_loss": -25.174945831298828, "global_step": 248977, "epoch": 2999} {"train_loss": -25.093908309936523, "global_step": 248978, "epoch": 2999} {"train_loss": -25.236875534057617, "global_step": 248979, "epoch": 2999} {"train_loss": -24.768821716308594, "global_step": 248980, "epoch": 2999} {"train_loss": -25.0214786529541, "global_step": 248981, "epoch": 2999} {"train_loss": -24.83807373046875, "global_step": 248982, "epoch": 2999} {"train_loss": -25.024377822875977, "global_step": 248983, "epoch": 2999} {"train_loss": -24.85377311706543, "global_step": 248984, "epoch": 2999} {"train_loss": -25.14676856994629, "global_step": 248985, "epoch": 2999} {"train_loss": -25.13263702392578, "global_step": 248986, "epoch": 2999} {"train_loss": -25.303085327148438, "global_step": 248987, "epoch": 2999} {"train_loss": -25.576980590820312, "global_step": 248988, "epoch": 2999} {"train_loss": -25.264354705810547, "global_step": 248989, "epoch": 2999} {"train_loss": -25.048931121826172, "global_step": 248990, "epoch": 2999} {"train_loss": -24.992612838745117, "global_step": 248991, "epoch": 2999} {"train_loss": -25.129638671875, "global_step": 248992, "epoch": 2999} {"train_loss": -25.23333168029785, "global_step": 248993, "epoch": 2999} {"train_loss": -24.817197799682617, "global_step": 248994, "epoch": 2999} {"train_loss": -25.300025939941406, "global_step": 248995, "epoch": 2999} {"train_loss": -25.17654800415039, "global_step": 248996, "epoch": 2999} {"train_loss": -25.507156372070312, "global_step": 248997, "epoch": 2999} {"train_loss": -24.437597274780273, "global_step": 248998, "epoch": 2999} {"train_loss": -24.90692407539092, "global_step": 248999, "epoch": 2999, "val_loss": 6973630.0} {"train_loss": -23.916208267211914, "global_step": 249000, "epoch": 3000} {"train_loss": -23.417606353759766, "global_step": 249001, "epoch": 3000} {"train_loss": -22.989181518554688, "global_step": 249002, "epoch": 3000} {"train_loss": -23.04034423828125, "global_step": 249003, "epoch": 3000} {"train_loss": -23.531085968017578, "global_step": 249004, "epoch": 3000} {"train_loss": -23.447772979736328, "global_step": 249005, "epoch": 3000} {"train_loss": -23.37851905822754, "global_step": 249006, "epoch": 3000} {"train_loss": -24.349912643432617, "global_step": 249007, "epoch": 3000} {"train_loss": -23.3641414642334, "global_step": 249008, "epoch": 3000} {"train_loss": -24.487628936767578, "global_step": 249009, "epoch": 3000} {"train_loss": -24.387304306030273, "global_step": 249010, "epoch": 3000} {"train_loss": -24.485965728759766, "global_step": 249011, "epoch": 3000} {"train_loss": -24.479154586791992, "global_step": 249012, "epoch": 3000} {"train_loss": -24.44527816772461, "global_step": 249013, "epoch": 3000} {"train_loss": -24.31172752380371, "global_step": 249014, "epoch": 3000} {"train_loss": -24.38275146484375, "global_step": 249015, "epoch": 3000} {"train_loss": -24.013792037963867, "global_step": 249016, "epoch": 3000} {"train_loss": -24.718046188354492, "global_step": 249017, "epoch": 3000} {"train_loss": -24.00185203552246, "global_step": 249018, "epoch": 3000} {"train_loss": -24.467134475708008, "global_step": 249019, "epoch": 3000} {"train_loss": -24.580669403076172, "global_step": 249020, "epoch": 3000} {"train_loss": -24.2523250579834, "global_step": 249021, "epoch": 3000} {"train_loss": -24.602840423583984, "global_step": 249022, "epoch": 3000} {"train_loss": -24.486572265625, "global_step": 249023, "epoch": 3000} {"train_loss": -24.98888397216797, "global_step": 249024, "epoch": 3000} {"train_loss": -24.299962997436523, "global_step": 249025, "epoch": 3000} {"train_loss": -24.52250099182129, "global_step": 249026, "epoch": 3000} {"train_loss": -24.597749710083008, "global_step": 249027, "epoch": 3000} {"train_loss": -24.475223541259766, "global_step": 249028, "epoch": 3000} {"train_loss": -25.230958938598633, "global_step": 249029, "epoch": 3000} {"train_loss": -24.753250122070312, "global_step": 249030, "epoch": 3000} {"train_loss": -24.907155990600586, "global_step": 249031, "epoch": 3000} {"train_loss": -24.87240982055664, "global_step": 249032, "epoch": 3000} {"train_loss": -24.580963134765625, "global_step": 249033, "epoch": 3000} {"train_loss": -24.692495346069336, "global_step": 249034, "epoch": 3000} {"train_loss": -25.0277042388916, "global_step": 249035, "epoch": 3000} {"train_loss": -25.270872116088867, "global_step": 249036, "epoch": 3000} {"train_loss": -24.717374801635742, "global_step": 249037, "epoch": 3000} {"train_loss": -24.84834861755371, "global_step": 249038, "epoch": 3000} {"train_loss": -24.99905776977539, "global_step": 249039, "epoch": 3000} {"train_loss": -25.304365158081055, "global_step": 249040, "epoch": 3000} {"train_loss": -25.003326416015625, "global_step": 249041, "epoch": 3000} {"train_loss": -25.02585220336914, "global_step": 249042, "epoch": 3000} {"train_loss": -24.869823455810547, "global_step": 249043, "epoch": 3000} {"train_loss": -25.13472557067871, "global_step": 249044, "epoch": 3000} {"train_loss": -25.143186569213867, "global_step": 249045, "epoch": 3000} {"train_loss": -25.10811996459961, "global_step": 249046, "epoch": 3000} {"train_loss": -24.985191345214844, "global_step": 249047, "epoch": 3000} {"train_loss": -25.55046272277832, "global_step": 249048, "epoch": 3000} {"train_loss": -25.313081741333008, "global_step": 249049, "epoch": 3000} {"train_loss": -25.203113555908203, "global_step": 249050, "epoch": 3000} {"train_loss": -25.050275802612305, "global_step": 249051, "epoch": 3000} {"train_loss": -25.465457916259766, "global_step": 249052, "epoch": 3000} {"train_loss": -24.92266273498535, "global_step": 249053, "epoch": 3000} {"train_loss": -25.154186248779297, "global_step": 249054, "epoch": 3000} {"train_loss": -25.190221786499023, "global_step": 249055, "epoch": 3000} {"train_loss": -24.94684410095215, "global_step": 249056, "epoch": 3000} {"train_loss": -25.130966186523438, "global_step": 249057, "epoch": 3000} {"train_loss": -24.89170265197754, "global_step": 249058, "epoch": 3000} {"train_loss": -25.059858322143555, "global_step": 249059, "epoch": 3000} {"train_loss": -25.085227966308594, "global_step": 249060, "epoch": 3000} {"train_loss": -25.100175857543945, "global_step": 249061, "epoch": 3000} {"train_loss": -25.320985794067383, "global_step": 249062, "epoch": 3000} {"train_loss": -25.23552894592285, "global_step": 249063, "epoch": 3000} {"train_loss": -25.1330509185791, "global_step": 249064, "epoch": 3000} {"train_loss": -24.90616226196289, "global_step": 249065, "epoch": 3000} {"train_loss": -25.356266021728516, "global_step": 249066, "epoch": 3000} {"train_loss": -24.606019973754883, "global_step": 249067, "epoch": 3000} {"train_loss": -25.237451553344727, "global_step": 249068, "epoch": 3000} {"train_loss": -25.156879425048828, "global_step": 249069, "epoch": 3000} {"train_loss": -24.628427505493164, "global_step": 249070, "epoch": 3000} {"train_loss": -24.88997459411621, "global_step": 249071, "epoch": 3000} {"train_loss": -25.081003189086914, "global_step": 249072, "epoch": 3000} {"train_loss": -24.805988311767578, "global_step": 249073, "epoch": 3000} {"train_loss": -25.02427101135254, "global_step": 249074, "epoch": 3000} {"train_loss": -25.3068790435791, "global_step": 249075, "epoch": 3000} {"train_loss": -24.955472946166992, "global_step": 249076, "epoch": 3000} {"train_loss": -25.293136596679688, "global_step": 249077, "epoch": 3000} {"train_loss": -25.1781005859375, "global_step": 249078, "epoch": 3000} {"train_loss": -24.8887882232666, "global_step": 249079, "epoch": 3000} {"train_loss": -24.721065521240234, "global_step": 249080, "epoch": 3000} {"train_loss": -24.515405654907227, "global_step": 249081, "epoch": 3000} {"train_loss": -24.722138209515307, "global_step": 249082, "epoch": 3000, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6807449.0} {"train_loss": -24.37298583984375, "global_step": 249083, "epoch": 3001} {"train_loss": -24.133535385131836, "global_step": 249084, "epoch": 3001} {"train_loss": -23.775070190429688, "global_step": 249085, "epoch": 3001} {"train_loss": -24.153854370117188, "global_step": 249086, "epoch": 3001} {"train_loss": -24.696807861328125, "global_step": 249087, "epoch": 3001} {"train_loss": -24.238828659057617, "global_step": 249088, "epoch": 3001} {"train_loss": -24.605743408203125, "global_step": 249089, "epoch": 3001} {"train_loss": -24.52120590209961, "global_step": 249090, "epoch": 3001} {"train_loss": -24.433605194091797, "global_step": 249091, "epoch": 3001} {"train_loss": -24.74224853515625, "global_step": 249092, "epoch": 3001} {"train_loss": -23.998878479003906, "global_step": 249093, "epoch": 3001} {"train_loss": -24.646604537963867, "global_step": 249094, "epoch": 3001} {"train_loss": -24.718791961669922, "global_step": 249095, "epoch": 3001} {"train_loss": -24.477262496948242, "global_step": 249096, "epoch": 3001} {"train_loss": -24.566856384277344, "global_step": 249097, "epoch": 3001} {"train_loss": -24.48892593383789, "global_step": 249098, "epoch": 3001} {"train_loss": -24.55360984802246, "global_step": 249099, "epoch": 3001} {"train_loss": -24.811506271362305, "global_step": 249100, "epoch": 3001} {"train_loss": -24.575956344604492, "global_step": 249101, "epoch": 3001} {"train_loss": -24.660898208618164, "global_step": 249102, "epoch": 3001} {"train_loss": -24.606538772583008, "global_step": 249103, "epoch": 3001} {"train_loss": -24.794851303100586, "global_step": 249104, "epoch": 3001} {"train_loss": -24.534503936767578, "global_step": 249105, "epoch": 3001} {"train_loss": -24.61810302734375, "global_step": 249106, "epoch": 3001} {"train_loss": -24.801010131835938, "global_step": 249107, "epoch": 3001} {"train_loss": -24.689748764038086, "global_step": 249108, "epoch": 3001} {"train_loss": -24.960630416870117, "global_step": 249109, "epoch": 3001} {"train_loss": -25.203094482421875, "global_step": 249110, "epoch": 3001} {"train_loss": -24.82720375061035, "global_step": 249111, "epoch": 3001} {"train_loss": -24.939817428588867, "global_step": 249112, "epoch": 3001} {"train_loss": -25.188823699951172, "global_step": 249113, "epoch": 3001} {"train_loss": -24.62619972229004, "global_step": 249114, "epoch": 3001} {"train_loss": -24.547399520874023, "global_step": 249115, "epoch": 3001} {"train_loss": -25.176462173461914, "global_step": 249116, "epoch": 3001} {"train_loss": -25.005584716796875, "global_step": 249117, "epoch": 3001} {"train_loss": -25.37908363342285, "global_step": 249118, "epoch": 3001} {"train_loss": -25.237548828125, "global_step": 249119, "epoch": 3001} {"train_loss": -25.357830047607422, "global_step": 249120, "epoch": 3001} {"train_loss": -24.8737735748291, "global_step": 249121, "epoch": 3001} {"train_loss": -24.955913543701172, "global_step": 249122, "epoch": 3001} {"train_loss": -25.341833114624023, "global_step": 249123, "epoch": 3001} {"train_loss": -25.474079132080078, "global_step": 249124, "epoch": 3001} {"train_loss": -25.12163734436035, "global_step": 249125, "epoch": 3001} {"train_loss": -25.367273330688477, "global_step": 249126, "epoch": 3001} {"train_loss": -25.538528442382812, "global_step": 249127, "epoch": 3001} {"train_loss": -25.32684898376465, "global_step": 249128, "epoch": 3001} {"train_loss": -25.194913864135742, "global_step": 249129, "epoch": 3001} {"train_loss": -25.11942481994629, "global_step": 249130, "epoch": 3001} {"train_loss": -25.333921432495117, "global_step": 249131, "epoch": 3001} {"train_loss": -25.2054500579834, "global_step": 249132, "epoch": 3001} {"train_loss": -24.917917251586914, "global_step": 249133, "epoch": 3001} {"train_loss": -25.17522621154785, "global_step": 249134, "epoch": 3001} {"train_loss": -25.076295852661133, "global_step": 249135, "epoch": 3001} {"train_loss": -24.44536781311035, "global_step": 249136, "epoch": 3001} {"train_loss": -23.971101760864258, "global_step": 249137, "epoch": 3001} {"train_loss": -23.745038986206055, "global_step": 249138, "epoch": 3001} {"train_loss": -24.266550064086914, "global_step": 249139, "epoch": 3001} {"train_loss": -24.74570655822754, "global_step": 249140, "epoch": 3001} {"train_loss": -24.51099967956543, "global_step": 249141, "epoch": 3001} {"train_loss": -24.493803024291992, "global_step": 249142, "epoch": 3001} {"train_loss": -25.006458282470703, "global_step": 249143, "epoch": 3001} {"train_loss": -24.782217025756836, "global_step": 249144, "epoch": 3001} {"train_loss": -24.455997467041016, "global_step": 249145, "epoch": 3001} {"train_loss": -25.17469596862793, "global_step": 249146, "epoch": 3001} {"train_loss": -24.705015182495117, "global_step": 249147, "epoch": 3001} {"train_loss": -24.619626998901367, "global_step": 249148, "epoch": 3001} {"train_loss": -25.002336502075195, "global_step": 249149, "epoch": 3001} {"train_loss": -24.810115814208984, "global_step": 249150, "epoch": 3001} {"train_loss": -24.81764030456543, "global_step": 249151, "epoch": 3001} {"train_loss": -24.818498611450195, "global_step": 249152, "epoch": 3001} {"train_loss": -25.23649024963379, "global_step": 249153, "epoch": 3001} {"train_loss": -24.671188354492188, "global_step": 249154, "epoch": 3001} {"train_loss": -25.00536346435547, "global_step": 249155, "epoch": 3001} {"train_loss": -25.155933380126953, "global_step": 249156, "epoch": 3001} {"train_loss": -25.042579650878906, "global_step": 249157, "epoch": 3001} {"train_loss": -24.65884017944336, "global_step": 249158, "epoch": 3001} {"train_loss": -24.799589157104492, "global_step": 249159, "epoch": 3001} {"train_loss": -25.073816299438477, "global_step": 249160, "epoch": 3001} {"train_loss": -25.329544067382812, "global_step": 249161, "epoch": 3001} {"train_loss": -25.025148391723633, "global_step": 249162, "epoch": 3001} {"train_loss": -25.24521827697754, "global_step": 249163, "epoch": 3001} {"train_loss": -25.388120651245117, "global_step": 249164, "epoch": 3001} {"train_loss": -24.810169564672265, "global_step": 249165, "epoch": 3001, "val_loss": 6846239.0} {"train_loss": -24.69341468811035, "global_step": 249166, "epoch": 3002} {"train_loss": -24.97629165649414, "global_step": 249167, "epoch": 3002} {"train_loss": -24.95863151550293, "global_step": 249168, "epoch": 3002} {"train_loss": -24.9985294342041, "global_step": 249169, "epoch": 3002} {"train_loss": -24.979089736938477, "global_step": 249170, "epoch": 3002} {"train_loss": -24.760421752929688, "global_step": 249171, "epoch": 3002} {"train_loss": -24.895044326782227, "global_step": 249172, "epoch": 3002} {"train_loss": -25.348325729370117, "global_step": 249173, "epoch": 3002} {"train_loss": -24.804977416992188, "global_step": 249174, "epoch": 3002} {"train_loss": -25.13459587097168, "global_step": 249175, "epoch": 3002} {"train_loss": -24.95745277404785, "global_step": 249176, "epoch": 3002} {"train_loss": -25.010663986206055, "global_step": 249177, "epoch": 3002} {"train_loss": -25.43634796142578, "global_step": 249178, "epoch": 3002} {"train_loss": -25.026273727416992, "global_step": 249179, "epoch": 3002} {"train_loss": -25.463787078857422, "global_step": 249180, "epoch": 3002} {"train_loss": -24.991762161254883, "global_step": 249181, "epoch": 3002} {"train_loss": -24.916696548461914, "global_step": 249182, "epoch": 3002} {"train_loss": -25.078649520874023, "global_step": 249183, "epoch": 3002} {"train_loss": -24.97899055480957, "global_step": 249184, "epoch": 3002} {"train_loss": -25.15591812133789, "global_step": 249185, "epoch": 3002} {"train_loss": -25.006372451782227, "global_step": 249186, "epoch": 3002} {"train_loss": -25.244640350341797, "global_step": 249187, "epoch": 3002} {"train_loss": -24.906497955322266, "global_step": 249188, "epoch": 3002} {"train_loss": -24.779020309448242, "global_step": 249189, "epoch": 3002} {"train_loss": -25.069095611572266, "global_step": 249190, "epoch": 3002} {"train_loss": -25.1180477142334, "global_step": 249191, "epoch": 3002} {"train_loss": -25.11402702331543, "global_step": 249192, "epoch": 3002} {"train_loss": -24.821880340576172, "global_step": 249193, "epoch": 3002} {"train_loss": -24.860876083374023, "global_step": 249194, "epoch": 3002} {"train_loss": -24.883920669555664, "global_step": 249195, "epoch": 3002} {"train_loss": -24.900903701782227, "global_step": 249196, "epoch": 3002} {"train_loss": -25.004230499267578, "global_step": 249197, "epoch": 3002} {"train_loss": -25.217920303344727, "global_step": 249198, "epoch": 3002} {"train_loss": -25.21095085144043, "global_step": 249199, "epoch": 3002} {"train_loss": -25.169513702392578, "global_step": 249200, "epoch": 3002} {"train_loss": -24.8406925201416, "global_step": 249201, "epoch": 3002} {"train_loss": -25.230920791625977, "global_step": 249202, "epoch": 3002} {"train_loss": -24.902124404907227, "global_step": 249203, "epoch": 3002} {"train_loss": -25.021778106689453, "global_step": 249204, "epoch": 3002} {"train_loss": -25.331491470336914, "global_step": 249205, "epoch": 3002} {"train_loss": -24.721054077148438, "global_step": 249206, "epoch": 3002} {"train_loss": -24.941253662109375, "global_step": 249207, "epoch": 3002} {"train_loss": -24.921110153198242, "global_step": 249208, "epoch": 3002} {"train_loss": -24.803678512573242, "global_step": 249209, "epoch": 3002} {"train_loss": -24.863393783569336, "global_step": 249210, "epoch": 3002} {"train_loss": -25.208539962768555, "global_step": 249211, "epoch": 3002} {"train_loss": -25.060606002807617, "global_step": 249212, "epoch": 3002} {"train_loss": -25.298383712768555, "global_step": 249213, "epoch": 3002} {"train_loss": -24.985965728759766, "global_step": 249214, "epoch": 3002} {"train_loss": -24.813261032104492, "global_step": 249215, "epoch": 3002} {"train_loss": -24.857446670532227, "global_step": 249216, "epoch": 3002} {"train_loss": -25.115631103515625, "global_step": 249217, "epoch": 3002} {"train_loss": -25.21333122253418, "global_step": 249218, "epoch": 3002} {"train_loss": -25.0233211517334, "global_step": 249219, "epoch": 3002} {"train_loss": -25.091690063476562, "global_step": 249220, "epoch": 3002} {"train_loss": -25.036527633666992, "global_step": 249221, "epoch": 3002} {"train_loss": -25.246000289916992, "global_step": 249222, "epoch": 3002} {"train_loss": -25.55186653137207, "global_step": 249223, "epoch": 3002} {"train_loss": -25.0933895111084, "global_step": 249224, "epoch": 3002} {"train_loss": -25.09853172302246, "global_step": 249225, "epoch": 3002} {"train_loss": -25.45396614074707, "global_step": 249226, "epoch": 3002} {"train_loss": -25.197343826293945, "global_step": 249227, "epoch": 3002} {"train_loss": -25.221872329711914, "global_step": 249228, "epoch": 3002} {"train_loss": -25.197879791259766, "global_step": 249229, "epoch": 3002} {"train_loss": -24.968162536621094, "global_step": 249230, "epoch": 3002} {"train_loss": -24.895761489868164, "global_step": 249231, "epoch": 3002} {"train_loss": -24.91617774963379, "global_step": 249232, "epoch": 3002} {"train_loss": -25.236675262451172, "global_step": 249233, "epoch": 3002} {"train_loss": -25.163806915283203, "global_step": 249234, "epoch": 3002} {"train_loss": -24.95502281188965, "global_step": 249235, "epoch": 3002} {"train_loss": -25.38553810119629, "global_step": 249236, "epoch": 3002} {"train_loss": -24.954221725463867, "global_step": 249237, "epoch": 3002} {"train_loss": -25.04767417907715, "global_step": 249238, "epoch": 3002} {"train_loss": -25.136621475219727, "global_step": 249239, "epoch": 3002} {"train_loss": -25.15924072265625, "global_step": 249240, "epoch": 3002} {"train_loss": -24.893625259399414, "global_step": 249241, "epoch": 3002} {"train_loss": -25.253732681274414, "global_step": 249242, "epoch": 3002} {"train_loss": -25.176326751708984, "global_step": 249243, "epoch": 3002} {"train_loss": -24.9635066986084, "global_step": 249244, "epoch": 3002} {"train_loss": -24.93257713317871, "global_step": 249245, "epoch": 3002} {"train_loss": -25.168119430541992, "global_step": 249246, "epoch": 3002} {"train_loss": -24.646390914916992, "global_step": 249247, "epoch": 3002} {"train_loss": -25.045410294130622, "global_step": 249248, "epoch": 3002, "val_loss": 6869158.5} {"train_loss": -23.959665298461914, "global_step": 249249, "epoch": 3003} {"train_loss": -23.764381408691406, "global_step": 249250, "epoch": 3003} {"train_loss": -24.28023338317871, "global_step": 249251, "epoch": 3003} {"train_loss": -23.581886291503906, "global_step": 249252, "epoch": 3003} {"train_loss": -23.982282638549805, "global_step": 249253, "epoch": 3003} {"train_loss": -24.536401748657227, "global_step": 249254, "epoch": 3003} {"train_loss": -24.369220733642578, "global_step": 249255, "epoch": 3003} {"train_loss": -24.255449295043945, "global_step": 249256, "epoch": 3003} {"train_loss": -24.230548858642578, "global_step": 249257, "epoch": 3003} {"train_loss": -24.662927627563477, "global_step": 249258, "epoch": 3003} {"train_loss": -24.1256103515625, "global_step": 249259, "epoch": 3003} {"train_loss": -24.200735092163086, "global_step": 249260, "epoch": 3003} {"train_loss": -24.299972534179688, "global_step": 249261, "epoch": 3003} {"train_loss": -24.621572494506836, "global_step": 249262, "epoch": 3003} {"train_loss": -24.519775390625, "global_step": 249263, "epoch": 3003} {"train_loss": -24.645891189575195, "global_step": 249264, "epoch": 3003} {"train_loss": -24.6599178314209, "global_step": 249265, "epoch": 3003} {"train_loss": -24.487438201904297, "global_step": 249266, "epoch": 3003} {"train_loss": -25.110708236694336, "global_step": 249267, "epoch": 3003} {"train_loss": -25.02642250061035, "global_step": 249268, "epoch": 3003} {"train_loss": -24.6375675201416, "global_step": 249269, "epoch": 3003} {"train_loss": -24.52645492553711, "global_step": 249270, "epoch": 3003} {"train_loss": -24.588903427124023, "global_step": 249271, "epoch": 3003} {"train_loss": -24.50002098083496, "global_step": 249272, "epoch": 3003} {"train_loss": -24.872434616088867, "global_step": 249273, "epoch": 3003} {"train_loss": -24.87979507446289, "global_step": 249274, "epoch": 3003} {"train_loss": -25.02760887145996, "global_step": 249275, "epoch": 3003} {"train_loss": -24.620254516601562, "global_step": 249276, "epoch": 3003} {"train_loss": -24.48818016052246, "global_step": 249277, "epoch": 3003} {"train_loss": -24.602771759033203, "global_step": 249278, "epoch": 3003} {"train_loss": -25.249326705932617, "global_step": 249279, "epoch": 3003} {"train_loss": -24.691532135009766, "global_step": 249280, "epoch": 3003} {"train_loss": -24.92591667175293, "global_step": 249281, "epoch": 3003} {"train_loss": -25.040346145629883, "global_step": 249282, "epoch": 3003} {"train_loss": -25.220884323120117, "global_step": 249283, "epoch": 3003} {"train_loss": -24.933027267456055, "global_step": 249284, "epoch": 3003} {"train_loss": -24.796117782592773, "global_step": 249285, "epoch": 3003} {"train_loss": -25.03769302368164, "global_step": 249286, "epoch": 3003} {"train_loss": -25.233671188354492, "global_step": 249287, "epoch": 3003} {"train_loss": -25.1353702545166, "global_step": 249288, "epoch": 3003} {"train_loss": -25.228286743164062, "global_step": 249289, "epoch": 3003} {"train_loss": -25.01789665222168, "global_step": 249290, "epoch": 3003} {"train_loss": -25.086671829223633, "global_step": 249291, "epoch": 3003} {"train_loss": -25.08010482788086, "global_step": 249292, "epoch": 3003} {"train_loss": -25.36219596862793, "global_step": 249293, "epoch": 3003} {"train_loss": -25.091827392578125, "global_step": 249294, "epoch": 3003} {"train_loss": -25.19822120666504, "global_step": 249295, "epoch": 3003} {"train_loss": -25.142343521118164, "global_step": 249296, "epoch": 3003} {"train_loss": -25.14706802368164, "global_step": 249297, "epoch": 3003} {"train_loss": -24.523542404174805, "global_step": 249298, "epoch": 3003} {"train_loss": -25.031538009643555, "global_step": 249299, "epoch": 3003} {"train_loss": -24.79030418395996, "global_step": 249300, "epoch": 3003} {"train_loss": -25.276823043823242, "global_step": 249301, "epoch": 3003} {"train_loss": -25.174959182739258, "global_step": 249302, "epoch": 3003} {"train_loss": -25.409149169921875, "global_step": 249303, "epoch": 3003} {"train_loss": -25.37798500061035, "global_step": 249304, "epoch": 3003} {"train_loss": -25.269153594970703, "global_step": 249305, "epoch": 3003} {"train_loss": -25.419248580932617, "global_step": 249306, "epoch": 3003} {"train_loss": -25.16619873046875, "global_step": 249307, "epoch": 3003} {"train_loss": -25.06650733947754, "global_step": 249308, "epoch": 3003} {"train_loss": -25.427051544189453, "global_step": 249309, "epoch": 3003} {"train_loss": -25.077423095703125, "global_step": 249310, "epoch": 3003} {"train_loss": -24.836746215820312, "global_step": 249311, "epoch": 3003} {"train_loss": -25.359771728515625, "global_step": 249312, "epoch": 3003} {"train_loss": -24.871854782104492, "global_step": 249313, "epoch": 3003} {"train_loss": -25.378089904785156, "global_step": 249314, "epoch": 3003} {"train_loss": -25.037267684936523, "global_step": 249315, "epoch": 3003} {"train_loss": -24.52020835876465, "global_step": 249316, "epoch": 3003} {"train_loss": -24.348114013671875, "global_step": 249317, "epoch": 3003} {"train_loss": -24.016555786132812, "global_step": 249318, "epoch": 3003} {"train_loss": -24.671628952026367, "global_step": 249319, "epoch": 3003} {"train_loss": -25.050275802612305, "global_step": 249320, "epoch": 3003} {"train_loss": -24.291868209838867, "global_step": 249321, "epoch": 3003} {"train_loss": -25.1359920501709, "global_step": 249322, "epoch": 3003} {"train_loss": -24.9066104888916, "global_step": 249323, "epoch": 3003} {"train_loss": -25.049911499023438, "global_step": 249324, "epoch": 3003} {"train_loss": -24.650800704956055, "global_step": 249325, "epoch": 3003} {"train_loss": -25.356842041015625, "global_step": 249326, "epoch": 3003} {"train_loss": -24.72620964050293, "global_step": 249327, "epoch": 3003} {"train_loss": -24.904739379882812, "global_step": 249328, "epoch": 3003} {"train_loss": -24.70564079284668, "global_step": 249329, "epoch": 3003} {"train_loss": -25.32154655456543, "global_step": 249330, "epoch": 3003} {"train_loss": -24.819558614707855, "global_step": 249331, "epoch": 3003, "val_loss": 6882861.5} {"train_loss": -25.128372192382812, "global_step": 249332, "epoch": 3004} {"train_loss": -24.73110008239746, "global_step": 249333, "epoch": 3004} {"train_loss": -25.198165893554688, "global_step": 249334, "epoch": 3004} {"train_loss": -25.10072898864746, "global_step": 249335, "epoch": 3004} {"train_loss": -25.00931167602539, "global_step": 249336, "epoch": 3004} {"train_loss": -24.702939987182617, "global_step": 249337, "epoch": 3004} {"train_loss": -25.318359375, "global_step": 249338, "epoch": 3004} {"train_loss": -25.007511138916016, "global_step": 249339, "epoch": 3004} {"train_loss": -24.9569149017334, "global_step": 249340, "epoch": 3004} {"train_loss": -24.54123878479004, "global_step": 249341, "epoch": 3004} {"train_loss": -24.47592544555664, "global_step": 249342, "epoch": 3004} {"train_loss": -24.736560821533203, "global_step": 249343, "epoch": 3004} {"train_loss": -24.66448211669922, "global_step": 249344, "epoch": 3004} {"train_loss": -24.928884506225586, "global_step": 249345, "epoch": 3004} {"train_loss": -25.266572952270508, "global_step": 249346, "epoch": 3004} {"train_loss": -25.284225463867188, "global_step": 249347, "epoch": 3004} {"train_loss": -24.69014549255371, "global_step": 249348, "epoch": 3004} {"train_loss": -24.84369468688965, "global_step": 249349, "epoch": 3004} {"train_loss": -24.924970626831055, "global_step": 249350, "epoch": 3004} {"train_loss": -25.139324188232422, "global_step": 249351, "epoch": 3004} {"train_loss": -24.978771209716797, "global_step": 249352, "epoch": 3004} {"train_loss": -25.171335220336914, "global_step": 249353, "epoch": 3004} {"train_loss": -24.632404327392578, "global_step": 249354, "epoch": 3004} {"train_loss": -25.318588256835938, "global_step": 249355, "epoch": 3004} {"train_loss": -24.982177734375, "global_step": 249356, "epoch": 3004} {"train_loss": -24.74161720275879, "global_step": 249357, "epoch": 3004} {"train_loss": -24.983186721801758, "global_step": 249358, "epoch": 3004} {"train_loss": -25.2192325592041, "global_step": 249359, "epoch": 3004} {"train_loss": -24.99022102355957, "global_step": 249360, "epoch": 3004} {"train_loss": -25.014753341674805, "global_step": 249361, "epoch": 3004} {"train_loss": -25.36783790588379, "global_step": 249362, "epoch": 3004} {"train_loss": -25.46068000793457, "global_step": 249363, "epoch": 3004} {"train_loss": -25.454580307006836, "global_step": 249364, "epoch": 3004} {"train_loss": -25.3472957611084, "global_step": 249365, "epoch": 3004} {"train_loss": -25.398975372314453, "global_step": 249366, "epoch": 3004} {"train_loss": -24.93589973449707, "global_step": 249367, "epoch": 3004} {"train_loss": -25.01421546936035, "global_step": 249368, "epoch": 3004} {"train_loss": -25.161983489990234, "global_step": 249369, "epoch": 3004} {"train_loss": -24.98744010925293, "global_step": 249370, "epoch": 3004} {"train_loss": -24.78652572631836, "global_step": 249371, "epoch": 3004} {"train_loss": -25.11732292175293, "global_step": 249372, "epoch": 3004} {"train_loss": -25.010086059570312, "global_step": 249373, "epoch": 3004} {"train_loss": -25.0366153717041, "global_step": 249374, "epoch": 3004} {"train_loss": -24.817724227905273, "global_step": 249375, "epoch": 3004} {"train_loss": -25.11754035949707, "global_step": 249376, "epoch": 3004} {"train_loss": -24.944345474243164, "global_step": 249377, "epoch": 3004} {"train_loss": -24.627365112304688, "global_step": 249378, "epoch": 3004} {"train_loss": -24.879011154174805, "global_step": 249379, "epoch": 3004} {"train_loss": -24.922086715698242, "global_step": 249380, "epoch": 3004} {"train_loss": -24.680448532104492, "global_step": 249381, "epoch": 3004} {"train_loss": -24.489654541015625, "global_step": 249382, "epoch": 3004} {"train_loss": -24.404531478881836, "global_step": 249383, "epoch": 3004} {"train_loss": -24.663433074951172, "global_step": 249384, "epoch": 3004} {"train_loss": -24.8436336517334, "global_step": 249385, "epoch": 3004} {"train_loss": -24.679664611816406, "global_step": 249386, "epoch": 3004} {"train_loss": -24.773975372314453, "global_step": 249387, "epoch": 3004} {"train_loss": -25.376876831054688, "global_step": 249388, "epoch": 3004} {"train_loss": -24.610261917114258, "global_step": 249389, "epoch": 3004} {"train_loss": -25.010974884033203, "global_step": 249390, "epoch": 3004} {"train_loss": -25.220901489257812, "global_step": 249391, "epoch": 3004} {"train_loss": -24.836502075195312, "global_step": 249392, "epoch": 3004} {"train_loss": -24.915719985961914, "global_step": 249393, "epoch": 3004} {"train_loss": -25.3568172454834, "global_step": 249394, "epoch": 3004} {"train_loss": -24.795856475830078, "global_step": 249395, "epoch": 3004} {"train_loss": -25.27925682067871, "global_step": 249396, "epoch": 3004} {"train_loss": -25.01359748840332, "global_step": 249397, "epoch": 3004} {"train_loss": -25.164052963256836, "global_step": 249398, "epoch": 3004} {"train_loss": -24.85672950744629, "global_step": 249399, "epoch": 3004} {"train_loss": -24.599689483642578, "global_step": 249400, "epoch": 3004} {"train_loss": -24.924177169799805, "global_step": 249401, "epoch": 3004} {"train_loss": -25.059396743774414, "global_step": 249402, "epoch": 3004} {"train_loss": -24.691801071166992, "global_step": 249403, "epoch": 3004} {"train_loss": -25.178274154663086, "global_step": 249404, "epoch": 3004} {"train_loss": -25.705768585205078, "global_step": 249405, "epoch": 3004} {"train_loss": -24.877145767211914, "global_step": 249406, "epoch": 3004} {"train_loss": -25.204824447631836, "global_step": 249407, "epoch": 3004} {"train_loss": -24.939420700073242, "global_step": 249408, "epoch": 3004} {"train_loss": -25.06539535522461, "global_step": 249409, "epoch": 3004} {"train_loss": -24.717748641967773, "global_step": 249410, "epoch": 3004} {"train_loss": -24.784814834594727, "global_step": 249411, "epoch": 3004} {"train_loss": -24.665311813354492, "global_step": 249412, "epoch": 3004} {"train_loss": -24.56886100769043, "global_step": 249413, "epoch": 3004} {"train_loss": -24.98176990646914, "global_step": 249414, "epoch": 3004, "val_loss": 6867259.0} {"train_loss": -24.150808334350586, "global_step": 249415, "epoch": 3005} {"train_loss": -24.53175163269043, "global_step": 249416, "epoch": 3005} {"train_loss": -23.836286544799805, "global_step": 249417, "epoch": 3005} {"train_loss": -24.789199829101562, "global_step": 249418, "epoch": 3005} {"train_loss": -24.49308204650879, "global_step": 249419, "epoch": 3005} {"train_loss": -24.255422592163086, "global_step": 249420, "epoch": 3005} {"train_loss": -24.30925178527832, "global_step": 249421, "epoch": 3005} {"train_loss": -24.428125381469727, "global_step": 249422, "epoch": 3005} {"train_loss": -24.34769058227539, "global_step": 249423, "epoch": 3005} {"train_loss": -24.633499145507812, "global_step": 249424, "epoch": 3005} {"train_loss": -24.820453643798828, "global_step": 249425, "epoch": 3005} {"train_loss": -24.5504207611084, "global_step": 249426, "epoch": 3005} {"train_loss": -24.851789474487305, "global_step": 249427, "epoch": 3005} {"train_loss": -24.357099533081055, "global_step": 249428, "epoch": 3005} {"train_loss": -24.71084976196289, "global_step": 249429, "epoch": 3005} {"train_loss": -24.187387466430664, "global_step": 249430, "epoch": 3005} {"train_loss": -24.65691566467285, "global_step": 249431, "epoch": 3005} {"train_loss": -24.8210506439209, "global_step": 249432, "epoch": 3005} {"train_loss": -24.43715476989746, "global_step": 249433, "epoch": 3005} {"train_loss": -24.5350341796875, "global_step": 249434, "epoch": 3005} {"train_loss": -24.62118911743164, "global_step": 249435, "epoch": 3005} {"train_loss": -24.77621078491211, "global_step": 249436, "epoch": 3005} {"train_loss": -25.10667610168457, "global_step": 249437, "epoch": 3005} {"train_loss": -24.839879989624023, "global_step": 249438, "epoch": 3005} {"train_loss": -25.078317642211914, "global_step": 249439, "epoch": 3005} {"train_loss": -24.631567001342773, "global_step": 249440, "epoch": 3005} {"train_loss": -24.923166275024414, "global_step": 249441, "epoch": 3005} {"train_loss": -24.45297622680664, "global_step": 249442, "epoch": 3005} {"train_loss": -24.725309371948242, "global_step": 249443, "epoch": 3005} {"train_loss": -24.964096069335938, "global_step": 249444, "epoch": 3005} {"train_loss": -25.00263023376465, "global_step": 249445, "epoch": 3005} {"train_loss": -24.507854461669922, "global_step": 249446, "epoch": 3005} {"train_loss": -25.38740348815918, "global_step": 249447, "epoch": 3005} {"train_loss": -24.941482543945312, "global_step": 249448, "epoch": 3005} {"train_loss": -24.98888397216797, "global_step": 249449, "epoch": 3005} {"train_loss": -25.233396530151367, "global_step": 249450, "epoch": 3005} {"train_loss": -24.858352661132812, "global_step": 249451, "epoch": 3005} {"train_loss": -25.093856811523438, "global_step": 249452, "epoch": 3005} {"train_loss": -24.90699005126953, "global_step": 249453, "epoch": 3005} {"train_loss": -25.156702041625977, "global_step": 249454, "epoch": 3005} {"train_loss": -25.137039184570312, "global_step": 249455, "epoch": 3005} {"train_loss": -24.772737503051758, "global_step": 249456, "epoch": 3005} {"train_loss": -25.037485122680664, "global_step": 249457, "epoch": 3005} {"train_loss": -25.111040115356445, "global_step": 249458, "epoch": 3005} {"train_loss": -25.24239730834961, "global_step": 249459, "epoch": 3005} {"train_loss": -25.308780670166016, "global_step": 249460, "epoch": 3005} {"train_loss": -25.1937313079834, "global_step": 249461, "epoch": 3005} {"train_loss": -25.12723159790039, "global_step": 249462, "epoch": 3005} {"train_loss": -25.18867301940918, "global_step": 249463, "epoch": 3005} {"train_loss": -25.413684844970703, "global_step": 249464, "epoch": 3005} {"train_loss": -25.328035354614258, "global_step": 249465, "epoch": 3005} {"train_loss": -24.903024673461914, "global_step": 249466, "epoch": 3005} {"train_loss": -25.028972625732422, "global_step": 249467, "epoch": 3005} {"train_loss": -25.1302490234375, "global_step": 249468, "epoch": 3005} {"train_loss": -25.223459243774414, "global_step": 249469, "epoch": 3005} {"train_loss": -25.17693519592285, "global_step": 249470, "epoch": 3005} {"train_loss": -24.9755916595459, "global_step": 249471, "epoch": 3005} {"train_loss": -25.391324996948242, "global_step": 249472, "epoch": 3005} {"train_loss": -25.04030418395996, "global_step": 249473, "epoch": 3005} {"train_loss": -25.425764083862305, "global_step": 249474, "epoch": 3005} {"train_loss": -25.081151962280273, "global_step": 249475, "epoch": 3005} {"train_loss": -25.294513702392578, "global_step": 249476, "epoch": 3005} {"train_loss": -24.890928268432617, "global_step": 249477, "epoch": 3005} {"train_loss": -25.074905395507812, "global_step": 249478, "epoch": 3005} {"train_loss": -24.631284713745117, "global_step": 249479, "epoch": 3005} {"train_loss": -24.48714256286621, "global_step": 249480, "epoch": 3005} {"train_loss": -24.814260482788086, "global_step": 249481, "epoch": 3005} {"train_loss": -25.222522735595703, "global_step": 249482, "epoch": 3005} {"train_loss": -24.6478271484375, "global_step": 249483, "epoch": 3005} {"train_loss": -24.206159591674805, "global_step": 249484, "epoch": 3005} {"train_loss": -24.953205108642578, "global_step": 249485, "epoch": 3005} {"train_loss": -24.708494186401367, "global_step": 249486, "epoch": 3005} {"train_loss": -24.64422035217285, "global_step": 249487, "epoch": 3005} {"train_loss": -24.980148315429688, "global_step": 249488, "epoch": 3005} {"train_loss": -24.396018981933594, "global_step": 249489, "epoch": 3005} {"train_loss": -24.455724716186523, "global_step": 249490, "epoch": 3005} {"train_loss": -24.719907760620117, "global_step": 249491, "epoch": 3005} {"train_loss": -24.442533493041992, "global_step": 249492, "epoch": 3005} {"train_loss": -24.93778419494629, "global_step": 249493, "epoch": 3005} {"train_loss": -24.795331954956055, "global_step": 249494, "epoch": 3005} {"train_loss": -24.433021545410156, "global_step": 249495, "epoch": 3005} {"train_loss": -24.970617294311523, "global_step": 249496, "epoch": 3005} {"train_loss": -24.83309853795063, "global_step": 249497, "epoch": 3005, "val_loss": 6759867.0} {"train_loss": -24.41425132751465, "global_step": 249498, "epoch": 3006} {"train_loss": -23.75337791442871, "global_step": 249499, "epoch": 3006} {"train_loss": -24.674100875854492, "global_step": 249500, "epoch": 3006} {"train_loss": -23.85668182373047, "global_step": 249501, "epoch": 3006} {"train_loss": -24.450347900390625, "global_step": 249502, "epoch": 3006} {"train_loss": -24.518369674682617, "global_step": 249503, "epoch": 3006} {"train_loss": -24.419092178344727, "global_step": 249504, "epoch": 3006} {"train_loss": -24.57394790649414, "global_step": 249505, "epoch": 3006} {"train_loss": -24.628860473632812, "global_step": 249506, "epoch": 3006} {"train_loss": -24.555673599243164, "global_step": 249507, "epoch": 3006} {"train_loss": -24.249921798706055, "global_step": 249508, "epoch": 3006} {"train_loss": -24.890953063964844, "global_step": 249509, "epoch": 3006} {"train_loss": -24.645326614379883, "global_step": 249510, "epoch": 3006} {"train_loss": -24.943111419677734, "global_step": 249511, "epoch": 3006} {"train_loss": -24.735387802124023, "global_step": 249512, "epoch": 3006} {"train_loss": -24.865676879882812, "global_step": 249513, "epoch": 3006} {"train_loss": -24.694425582885742, "global_step": 249514, "epoch": 3006} {"train_loss": -25.00355339050293, "global_step": 249515, "epoch": 3006} {"train_loss": -24.453275680541992, "global_step": 249516, "epoch": 3006} {"train_loss": -24.937593460083008, "global_step": 249517, "epoch": 3006} {"train_loss": -24.639997482299805, "global_step": 249518, "epoch": 3006} {"train_loss": -24.99005126953125, "global_step": 249519, "epoch": 3006} {"train_loss": -25.000328063964844, "global_step": 249520, "epoch": 3006} {"train_loss": -24.821134567260742, "global_step": 249521, "epoch": 3006} {"train_loss": -24.884531021118164, "global_step": 249522, "epoch": 3006} {"train_loss": -24.78855323791504, "global_step": 249523, "epoch": 3006} {"train_loss": -25.14935874938965, "global_step": 249524, "epoch": 3006} {"train_loss": -25.20760154724121, "global_step": 249525, "epoch": 3006} {"train_loss": -25.057891845703125, "global_step": 249526, "epoch": 3006} {"train_loss": -25.106481552124023, "global_step": 249527, "epoch": 3006} {"train_loss": -25.18863296508789, "global_step": 249528, "epoch": 3006} {"train_loss": -24.93861198425293, "global_step": 249529, "epoch": 3006} {"train_loss": -24.947879791259766, "global_step": 249530, "epoch": 3006} {"train_loss": -24.994447708129883, "global_step": 249531, "epoch": 3006} {"train_loss": -24.91828155517578, "global_step": 249532, "epoch": 3006} {"train_loss": -24.966629028320312, "global_step": 249533, "epoch": 3006} {"train_loss": -24.81353187561035, "global_step": 249534, "epoch": 3006} {"train_loss": -25.512380599975586, "global_step": 249535, "epoch": 3006} {"train_loss": -25.064680099487305, "global_step": 249536, "epoch": 3006} {"train_loss": -25.050451278686523, "global_step": 249537, "epoch": 3006} {"train_loss": -25.18924903869629, "global_step": 249538, "epoch": 3006} {"train_loss": -25.02168846130371, "global_step": 249539, "epoch": 3006} {"train_loss": -25.239717483520508, "global_step": 249540, "epoch": 3006} {"train_loss": -25.03274917602539, "global_step": 249541, "epoch": 3006} {"train_loss": -25.016000747680664, "global_step": 249542, "epoch": 3006} {"train_loss": -24.86652946472168, "global_step": 249543, "epoch": 3006} {"train_loss": -24.95845603942871, "global_step": 249544, "epoch": 3006} {"train_loss": -25.316579818725586, "global_step": 249545, "epoch": 3006} {"train_loss": -25.09051513671875, "global_step": 249546, "epoch": 3006} {"train_loss": -25.18383026123047, "global_step": 249547, "epoch": 3006} {"train_loss": -24.949695587158203, "global_step": 249548, "epoch": 3006} {"train_loss": -25.092361450195312, "global_step": 249549, "epoch": 3006} {"train_loss": -25.221012115478516, "global_step": 249550, "epoch": 3006} {"train_loss": -25.17864418029785, "global_step": 249551, "epoch": 3006} {"train_loss": -24.9368896484375, "global_step": 249552, "epoch": 3006} {"train_loss": -25.27474021911621, "global_step": 249553, "epoch": 3006} {"train_loss": -25.28951072692871, "global_step": 249554, "epoch": 3006} {"train_loss": -25.241153717041016, "global_step": 249555, "epoch": 3006} {"train_loss": -25.069822311401367, "global_step": 249556, "epoch": 3006} {"train_loss": -25.197965621948242, "global_step": 249557, "epoch": 3006} {"train_loss": -25.02100944519043, "global_step": 249558, "epoch": 3006} {"train_loss": -25.123065948486328, "global_step": 249559, "epoch": 3006} {"train_loss": -25.038694381713867, "global_step": 249560, "epoch": 3006} {"train_loss": -24.872705459594727, "global_step": 249561, "epoch": 3006} {"train_loss": -25.087024688720703, "global_step": 249562, "epoch": 3006} {"train_loss": -25.129560470581055, "global_step": 249563, "epoch": 3006} {"train_loss": -25.108516693115234, "global_step": 249564, "epoch": 3006} {"train_loss": -25.0509033203125, "global_step": 249565, "epoch": 3006} {"train_loss": -25.26978874206543, "global_step": 249566, "epoch": 3006} {"train_loss": -24.639169692993164, "global_step": 249567, "epoch": 3006} {"train_loss": -23.917434692382812, "global_step": 249568, "epoch": 3006} {"train_loss": -23.729141235351562, "global_step": 249569, "epoch": 3006} {"train_loss": -23.899852752685547, "global_step": 249570, "epoch": 3006} {"train_loss": -24.928659439086914, "global_step": 249571, "epoch": 3006} {"train_loss": -24.517972946166992, "global_step": 249572, "epoch": 3006} {"train_loss": -24.488306045532227, "global_step": 249573, "epoch": 3006} {"train_loss": -24.61237144470215, "global_step": 249574, "epoch": 3006} {"train_loss": -24.78700828552246, "global_step": 249575, "epoch": 3006} {"train_loss": -24.413732528686523, "global_step": 249576, "epoch": 3006} {"train_loss": -24.177581787109375, "global_step": 249577, "epoch": 3006} {"train_loss": -24.5627384185791, "global_step": 249578, "epoch": 3006} {"train_loss": -24.956098556518555, "global_step": 249579, "epoch": 3006} {"train_loss": -24.84621610986181, "global_step": 249580, "epoch": 3006, "val_loss": 6849403.0} {"train_loss": -23.59453582763672, "global_step": 249581, "epoch": 3007} {"train_loss": -24.119260787963867, "global_step": 249582, "epoch": 3007} {"train_loss": -24.290441513061523, "global_step": 249583, "epoch": 3007} {"train_loss": -24.445392608642578, "global_step": 249584, "epoch": 3007} {"train_loss": -23.715625762939453, "global_step": 249585, "epoch": 3007} {"train_loss": -24.63543128967285, "global_step": 249586, "epoch": 3007} {"train_loss": -24.24168586730957, "global_step": 249587, "epoch": 3007} {"train_loss": -24.680988311767578, "global_step": 249588, "epoch": 3007} {"train_loss": -23.908851623535156, "global_step": 249589, "epoch": 3007} {"train_loss": -24.995777130126953, "global_step": 249590, "epoch": 3007} {"train_loss": -24.071945190429688, "global_step": 249591, "epoch": 3007} {"train_loss": -24.631948471069336, "global_step": 249592, "epoch": 3007} {"train_loss": -24.33698844909668, "global_step": 249593, "epoch": 3007} {"train_loss": -24.538740158081055, "global_step": 249594, "epoch": 3007} {"train_loss": -24.24055290222168, "global_step": 249595, "epoch": 3007} {"train_loss": -24.49945640563965, "global_step": 249596, "epoch": 3007} {"train_loss": -24.665985107421875, "global_step": 249597, "epoch": 3007} {"train_loss": -24.967803955078125, "global_step": 249598, "epoch": 3007} {"train_loss": -24.683887481689453, "global_step": 249599, "epoch": 3007} {"train_loss": -24.983623504638672, "global_step": 249600, "epoch": 3007} {"train_loss": -24.83945655822754, "global_step": 249601, "epoch": 3007} {"train_loss": -24.536420822143555, "global_step": 249602, "epoch": 3007} {"train_loss": -24.902868270874023, "global_step": 249603, "epoch": 3007} {"train_loss": -24.488941192626953, "global_step": 249604, "epoch": 3007} {"train_loss": -24.83838653564453, "global_step": 249605, "epoch": 3007} {"train_loss": -25.210241317749023, "global_step": 249606, "epoch": 3007} {"train_loss": -25.0180721282959, "global_step": 249607, "epoch": 3007} {"train_loss": -24.675596237182617, "global_step": 249608, "epoch": 3007} {"train_loss": -24.7066650390625, "global_step": 249609, "epoch": 3007} {"train_loss": -24.71585464477539, "global_step": 249610, "epoch": 3007} {"train_loss": -25.289175033569336, "global_step": 249611, "epoch": 3007} {"train_loss": -24.923837661743164, "global_step": 249612, "epoch": 3007} {"train_loss": -25.110797882080078, "global_step": 249613, "epoch": 3007} {"train_loss": -25.189687728881836, "global_step": 249614, "epoch": 3007} {"train_loss": -24.71556282043457, "global_step": 249615, "epoch": 3007} {"train_loss": -25.127182006835938, "global_step": 249616, "epoch": 3007} {"train_loss": -24.78461456298828, "global_step": 249617, "epoch": 3007} {"train_loss": -24.91330909729004, "global_step": 249618, "epoch": 3007} {"train_loss": -25.15360450744629, "global_step": 249619, "epoch": 3007} {"train_loss": -25.137784957885742, "global_step": 249620, "epoch": 3007} {"train_loss": -24.894323348999023, "global_step": 249621, "epoch": 3007} {"train_loss": -25.24239158630371, "global_step": 249622, "epoch": 3007} {"train_loss": -24.83148193359375, "global_step": 249623, "epoch": 3007} {"train_loss": -25.09159278869629, "global_step": 249624, "epoch": 3007} {"train_loss": -25.203989028930664, "global_step": 249625, "epoch": 3007} {"train_loss": -25.09290885925293, "global_step": 249626, "epoch": 3007} {"train_loss": -25.120664596557617, "global_step": 249627, "epoch": 3007} {"train_loss": -24.80702018737793, "global_step": 249628, "epoch": 3007} {"train_loss": -24.69581413269043, "global_step": 249629, "epoch": 3007} {"train_loss": -25.078317642211914, "global_step": 249630, "epoch": 3007} {"train_loss": -25.187969207763672, "global_step": 249631, "epoch": 3007} {"train_loss": -25.234739303588867, "global_step": 249632, "epoch": 3007} {"train_loss": -24.737499237060547, "global_step": 249633, "epoch": 3007} {"train_loss": -24.888626098632812, "global_step": 249634, "epoch": 3007} {"train_loss": -24.341297149658203, "global_step": 249635, "epoch": 3007} {"train_loss": -24.57818603515625, "global_step": 249636, "epoch": 3007} {"train_loss": -24.73626136779785, "global_step": 249637, "epoch": 3007} {"train_loss": -24.644351959228516, "global_step": 249638, "epoch": 3007} {"train_loss": -24.729089736938477, "global_step": 249639, "epoch": 3007} {"train_loss": -24.98439598083496, "global_step": 249640, "epoch": 3007} {"train_loss": -24.653446197509766, "global_step": 249641, "epoch": 3007} {"train_loss": -24.776472091674805, "global_step": 249642, "epoch": 3007} {"train_loss": -25.048126220703125, "global_step": 249643, "epoch": 3007} {"train_loss": -24.775964736938477, "global_step": 249644, "epoch": 3007} {"train_loss": -24.66623878479004, "global_step": 249645, "epoch": 3007} {"train_loss": -24.370004653930664, "global_step": 249646, "epoch": 3007} {"train_loss": -24.86817741394043, "global_step": 249647, "epoch": 3007} {"train_loss": -25.23097801208496, "global_step": 249648, "epoch": 3007} {"train_loss": -24.9444637298584, "global_step": 249649, "epoch": 3007} {"train_loss": -24.92117691040039, "global_step": 249650, "epoch": 3007} {"train_loss": -24.80183982849121, "global_step": 249651, "epoch": 3007} {"train_loss": -24.901884078979492, "global_step": 249652, "epoch": 3007} {"train_loss": -24.967824935913086, "global_step": 249653, "epoch": 3007} {"train_loss": -24.852928161621094, "global_step": 249654, "epoch": 3007} {"train_loss": -25.00734519958496, "global_step": 249655, "epoch": 3007} {"train_loss": -24.970958709716797, "global_step": 249656, "epoch": 3007} {"train_loss": -25.11236000061035, "global_step": 249657, "epoch": 3007} {"train_loss": -25.19519805908203, "global_step": 249658, "epoch": 3007} {"train_loss": -24.831684112548828, "global_step": 249659, "epoch": 3007} {"train_loss": -25.35286521911621, "global_step": 249660, "epoch": 3007} {"train_loss": -24.8432559967041, "global_step": 249661, "epoch": 3007} {"train_loss": -24.9403133392334, "global_step": 249662, "epoch": 3007} {"train_loss": -24.80200648020549, "global_step": 249663, "epoch": 3007, "val_loss": 6794912.0} {"train_loss": -24.557737350463867, "global_step": 249664, "epoch": 3008} {"train_loss": -24.693920135498047, "global_step": 249665, "epoch": 3008} {"train_loss": -24.62368392944336, "global_step": 249666, "epoch": 3008} {"train_loss": -24.433258056640625, "global_step": 249667, "epoch": 3008} {"train_loss": -24.782501220703125, "global_step": 249668, "epoch": 3008} {"train_loss": -24.4912052154541, "global_step": 249669, "epoch": 3008} {"train_loss": -24.857080459594727, "global_step": 249670, "epoch": 3008} {"train_loss": -24.98126792907715, "global_step": 249671, "epoch": 3008} {"train_loss": -24.967954635620117, "global_step": 249672, "epoch": 3008} {"train_loss": -24.516834259033203, "global_step": 249673, "epoch": 3008} {"train_loss": -24.819982528686523, "global_step": 249674, "epoch": 3008} {"train_loss": -24.810871124267578, "global_step": 249675, "epoch": 3008} {"train_loss": -24.77324867248535, "global_step": 249676, "epoch": 3008} {"train_loss": -25.022445678710938, "global_step": 249677, "epoch": 3008} {"train_loss": -25.003095626831055, "global_step": 249678, "epoch": 3008} {"train_loss": -24.916364669799805, "global_step": 249679, "epoch": 3008} {"train_loss": -24.95937156677246, "global_step": 249680, "epoch": 3008} {"train_loss": -25.038633346557617, "global_step": 249681, "epoch": 3008} {"train_loss": -25.007675170898438, "global_step": 249682, "epoch": 3008} {"train_loss": -24.684690475463867, "global_step": 249683, "epoch": 3008} {"train_loss": -24.866172790527344, "global_step": 249684, "epoch": 3008} {"train_loss": -25.005001068115234, "global_step": 249685, "epoch": 3008} {"train_loss": -25.017581939697266, "global_step": 249686, "epoch": 3008} {"train_loss": -25.173871994018555, "global_step": 249687, "epoch": 3008} {"train_loss": -25.185640335083008, "global_step": 249688, "epoch": 3008} {"train_loss": -24.805490493774414, "global_step": 249689, "epoch": 3008} {"train_loss": -24.87789535522461, "global_step": 249690, "epoch": 3008} {"train_loss": -25.191076278686523, "global_step": 249691, "epoch": 3008} {"train_loss": -25.1395320892334, "global_step": 249692, "epoch": 3008} {"train_loss": -25.002033233642578, "global_step": 249693, "epoch": 3008} {"train_loss": -24.892475128173828, "global_step": 249694, "epoch": 3008} {"train_loss": -24.955453872680664, "global_step": 249695, "epoch": 3008} {"train_loss": -24.995019912719727, "global_step": 249696, "epoch": 3008} {"train_loss": -25.56816291809082, "global_step": 249697, "epoch": 3008} {"train_loss": -25.12912368774414, "global_step": 249698, "epoch": 3008} {"train_loss": -25.1129207611084, "global_step": 249699, "epoch": 3008} {"train_loss": -25.075830459594727, "global_step": 249700, "epoch": 3008} {"train_loss": -25.40736198425293, "global_step": 249701, "epoch": 3008} {"train_loss": -25.1351318359375, "global_step": 249702, "epoch": 3008} {"train_loss": -25.21744155883789, "global_step": 249703, "epoch": 3008} {"train_loss": -25.35244369506836, "global_step": 249704, "epoch": 3008} {"train_loss": -24.96820068359375, "global_step": 249705, "epoch": 3008} {"train_loss": -25.320913314819336, "global_step": 249706, "epoch": 3008} {"train_loss": -25.056711196899414, "global_step": 249707, "epoch": 3008} {"train_loss": -25.136566162109375, "global_step": 249708, "epoch": 3008} {"train_loss": -25.51005744934082, "global_step": 249709, "epoch": 3008} {"train_loss": -25.053634643554688, "global_step": 249710, "epoch": 3008} {"train_loss": -25.21356201171875, "global_step": 249711, "epoch": 3008} {"train_loss": -25.12877655029297, "global_step": 249712, "epoch": 3008} {"train_loss": -25.157793045043945, "global_step": 249713, "epoch": 3008} {"train_loss": -25.22918701171875, "global_step": 249714, "epoch": 3008} {"train_loss": -25.146772384643555, "global_step": 249715, "epoch": 3008} {"train_loss": -25.23528289794922, "global_step": 249716, "epoch": 3008} {"train_loss": -25.16139030456543, "global_step": 249717, "epoch": 3008} {"train_loss": -25.0854549407959, "global_step": 249718, "epoch": 3008} {"train_loss": -25.082338333129883, "global_step": 249719, "epoch": 3008} {"train_loss": -25.577253341674805, "global_step": 249720, "epoch": 3008} {"train_loss": -25.21040153503418, "global_step": 249721, "epoch": 3008} {"train_loss": -25.11893653869629, "global_step": 249722, "epoch": 3008} {"train_loss": -25.13323974609375, "global_step": 249723, "epoch": 3008} {"train_loss": -25.15580177307129, "global_step": 249724, "epoch": 3008} {"train_loss": -25.280927658081055, "global_step": 249725, "epoch": 3008} {"train_loss": -25.034635543823242, "global_step": 249726, "epoch": 3008} {"train_loss": -25.022130966186523, "global_step": 249727, "epoch": 3008} {"train_loss": -25.1320858001709, "global_step": 249728, "epoch": 3008} {"train_loss": -25.35650634765625, "global_step": 249729, "epoch": 3008} {"train_loss": -24.84378433227539, "global_step": 249730, "epoch": 3008} {"train_loss": -24.33377456665039, "global_step": 249731, "epoch": 3008} {"train_loss": -24.28948974609375, "global_step": 249732, "epoch": 3008} {"train_loss": -24.46306800842285, "global_step": 249733, "epoch": 3008} {"train_loss": -24.27144432067871, "global_step": 249734, "epoch": 3008} {"train_loss": -24.463075637817383, "global_step": 249735, "epoch": 3008} {"train_loss": -24.88381004333496, "global_step": 249736, "epoch": 3008} {"train_loss": -25.068134307861328, "global_step": 249737, "epoch": 3008} {"train_loss": -24.647335052490234, "global_step": 249738, "epoch": 3008} {"train_loss": -24.798460006713867, "global_step": 249739, "epoch": 3008} {"train_loss": -24.73540687561035, "global_step": 249740, "epoch": 3008} {"train_loss": -24.892982482910156, "global_step": 249741, "epoch": 3008} {"train_loss": -24.663599014282227, "global_step": 249742, "epoch": 3008} {"train_loss": -25.07758903503418, "global_step": 249743, "epoch": 3008} {"train_loss": -25.163942337036133, "global_step": 249744, "epoch": 3008} {"train_loss": -25.056821823120117, "global_step": 249745, "epoch": 3008} {"train_loss": -24.952076302953515, "global_step": 249746, "epoch": 3008, "val_loss": 6638009.0} {"train_loss": -24.61181640625, "global_step": 249747, "epoch": 3009} {"train_loss": -24.980205535888672, "global_step": 249748, "epoch": 3009} {"train_loss": -24.620908737182617, "global_step": 249749, "epoch": 3009} {"train_loss": -24.72515296936035, "global_step": 249750, "epoch": 3009} {"train_loss": -24.681516647338867, "global_step": 249751, "epoch": 3009} {"train_loss": -24.829328536987305, "global_step": 249752, "epoch": 3009} {"train_loss": -25.08234405517578, "global_step": 249753, "epoch": 3009} {"train_loss": -24.58875846862793, "global_step": 249754, "epoch": 3009} {"train_loss": -25.099960327148438, "global_step": 249755, "epoch": 3009} {"train_loss": -24.870685577392578, "global_step": 249756, "epoch": 3009} {"train_loss": -24.855966567993164, "global_step": 249757, "epoch": 3009} {"train_loss": -25.0297908782959, "global_step": 249758, "epoch": 3009} {"train_loss": -24.85997200012207, "global_step": 249759, "epoch": 3009} {"train_loss": -24.9571475982666, "global_step": 249760, "epoch": 3009} {"train_loss": -24.969816207885742, "global_step": 249761, "epoch": 3009} {"train_loss": -24.983642578125, "global_step": 249762, "epoch": 3009} {"train_loss": -25.218097686767578, "global_step": 249763, "epoch": 3009} {"train_loss": -24.869150161743164, "global_step": 249764, "epoch": 3009} {"train_loss": -24.906843185424805, "global_step": 249765, "epoch": 3009} {"train_loss": -25.31635856628418, "global_step": 249766, "epoch": 3009} {"train_loss": -24.825849533081055, "global_step": 249767, "epoch": 3009} {"train_loss": -25.46918296813965, "global_step": 249768, "epoch": 3009} {"train_loss": -24.95354652404785, "global_step": 249769, "epoch": 3009} {"train_loss": -25.00362205505371, "global_step": 249770, "epoch": 3009} {"train_loss": -25.208770751953125, "global_step": 249771, "epoch": 3009} {"train_loss": -25.327146530151367, "global_step": 249772, "epoch": 3009} {"train_loss": -25.11913299560547, "global_step": 249773, "epoch": 3009} {"train_loss": -25.035398483276367, "global_step": 249774, "epoch": 3009} {"train_loss": -25.209375381469727, "global_step": 249775, "epoch": 3009} {"train_loss": -25.044462203979492, "global_step": 249776, "epoch": 3009} {"train_loss": -25.16176414489746, "global_step": 249777, "epoch": 3009} {"train_loss": -24.984182357788086, "global_step": 249778, "epoch": 3009} {"train_loss": -25.10955047607422, "global_step": 249779, "epoch": 3009} {"train_loss": -25.330060958862305, "global_step": 249780, "epoch": 3009} {"train_loss": -25.278411865234375, "global_step": 249781, "epoch": 3009} {"train_loss": -25.097095489501953, "global_step": 249782, "epoch": 3009} {"train_loss": -25.185596466064453, "global_step": 249783, "epoch": 3009} {"train_loss": -25.11008071899414, "global_step": 249784, "epoch": 3009} {"train_loss": -25.234237670898438, "global_step": 249785, "epoch": 3009} {"train_loss": -24.861984252929688, "global_step": 249786, "epoch": 3009} {"train_loss": -24.82156753540039, "global_step": 249787, "epoch": 3009} {"train_loss": -25.38694190979004, "global_step": 249788, "epoch": 3009} {"train_loss": -25.134674072265625, "global_step": 249789, "epoch": 3009} {"train_loss": -25.22589683532715, "global_step": 249790, "epoch": 3009} {"train_loss": -25.133956909179688, "global_step": 249791, "epoch": 3009} {"train_loss": -24.927410125732422, "global_step": 249792, "epoch": 3009} {"train_loss": -25.293601989746094, "global_step": 249793, "epoch": 3009} {"train_loss": -24.61896324157715, "global_step": 249794, "epoch": 3009} {"train_loss": -24.823272705078125, "global_step": 249795, "epoch": 3009} {"train_loss": -24.921995162963867, "global_step": 249796, "epoch": 3009} {"train_loss": -25.447254180908203, "global_step": 249797, "epoch": 3009} {"train_loss": -24.804227828979492, "global_step": 249798, "epoch": 3009} {"train_loss": -24.81366729736328, "global_step": 249799, "epoch": 3009} {"train_loss": -24.91330909729004, "global_step": 249800, "epoch": 3009} {"train_loss": -25.096511840820312, "global_step": 249801, "epoch": 3009} {"train_loss": -25.197895050048828, "global_step": 249802, "epoch": 3009} {"train_loss": -24.897796630859375, "global_step": 249803, "epoch": 3009} {"train_loss": -25.36672019958496, "global_step": 249804, "epoch": 3009} {"train_loss": -24.635217666625977, "global_step": 249805, "epoch": 3009} {"train_loss": -24.940181732177734, "global_step": 249806, "epoch": 3009} {"train_loss": -24.75446891784668, "global_step": 249807, "epoch": 3009} {"train_loss": -25.188016891479492, "global_step": 249808, "epoch": 3009} {"train_loss": -25.239835739135742, "global_step": 249809, "epoch": 3009} {"train_loss": -25.001882553100586, "global_step": 249810, "epoch": 3009} {"train_loss": -25.186927795410156, "global_step": 249811, "epoch": 3009} {"train_loss": -25.433256149291992, "global_step": 249812, "epoch": 3009} {"train_loss": -25.42497444152832, "global_step": 249813, "epoch": 3009} {"train_loss": -25.21991539001465, "global_step": 249814, "epoch": 3009} {"train_loss": -24.999813079833984, "global_step": 249815, "epoch": 3009} {"train_loss": -25.150928497314453, "global_step": 249816, "epoch": 3009} {"train_loss": -25.021512985229492, "global_step": 249817, "epoch": 3009} {"train_loss": -25.277755737304688, "global_step": 249818, "epoch": 3009} {"train_loss": -25.143117904663086, "global_step": 249819, "epoch": 3009} {"train_loss": -25.104360580444336, "global_step": 249820, "epoch": 3009} {"train_loss": -25.315048217773438, "global_step": 249821, "epoch": 3009} {"train_loss": -25.037208557128906, "global_step": 249822, "epoch": 3009} {"train_loss": -25.2950496673584, "global_step": 249823, "epoch": 3009} {"train_loss": -25.318132400512695, "global_step": 249824, "epoch": 3009} {"train_loss": -25.22065544128418, "global_step": 249825, "epoch": 3009} {"train_loss": -25.191194534301758, "global_step": 249826, "epoch": 3009} {"train_loss": -25.283430099487305, "global_step": 249827, "epoch": 3009} {"train_loss": -24.952360153198242, "global_step": 249828, "epoch": 3009} {"train_loss": -25.06312043982816, "global_step": 249829, "epoch": 3009, "val_loss": 6817389.0} {"train_loss": -24.44057273864746, "global_step": 249830, "epoch": 3010} {"train_loss": -23.584217071533203, "global_step": 249831, "epoch": 3010} {"train_loss": -23.587480545043945, "global_step": 249832, "epoch": 3010} {"train_loss": -24.559301376342773, "global_step": 249833, "epoch": 3010} {"train_loss": -23.776498794555664, "global_step": 249834, "epoch": 3010} {"train_loss": -24.508275985717773, "global_step": 249835, "epoch": 3010} {"train_loss": -24.454605102539062, "global_step": 249836, "epoch": 3010} {"train_loss": -24.539474487304688, "global_step": 249837, "epoch": 3010} {"train_loss": -24.658132553100586, "global_step": 249838, "epoch": 3010} {"train_loss": -24.762502670288086, "global_step": 249839, "epoch": 3010} {"train_loss": -24.67641258239746, "global_step": 249840, "epoch": 3010} {"train_loss": -24.300975799560547, "global_step": 249841, "epoch": 3010} {"train_loss": -24.662918090820312, "global_step": 249842, "epoch": 3010} {"train_loss": -24.735082626342773, "global_step": 249843, "epoch": 3010} {"train_loss": -24.418899536132812, "global_step": 249844, "epoch": 3010} {"train_loss": -24.552715301513672, "global_step": 249845, "epoch": 3010} {"train_loss": -24.729398727416992, "global_step": 249846, "epoch": 3010} {"train_loss": -24.806625366210938, "global_step": 249847, "epoch": 3010} {"train_loss": -24.62433624267578, "global_step": 249848, "epoch": 3010} {"train_loss": -24.18482780456543, "global_step": 249849, "epoch": 3010} {"train_loss": -24.62774085998535, "global_step": 249850, "epoch": 3010} {"train_loss": -24.680402755737305, "global_step": 249851, "epoch": 3010} {"train_loss": -24.69869041442871, "global_step": 249852, "epoch": 3010} {"train_loss": -25.120969772338867, "global_step": 249853, "epoch": 3010} {"train_loss": -24.889638900756836, "global_step": 249854, "epoch": 3010} {"train_loss": -24.91394805908203, "global_step": 249855, "epoch": 3010} {"train_loss": -24.84991455078125, "global_step": 249856, "epoch": 3010} {"train_loss": -24.86714744567871, "global_step": 249857, "epoch": 3010} {"train_loss": -24.65338706970215, "global_step": 249858, "epoch": 3010} {"train_loss": -25.178152084350586, "global_step": 249859, "epoch": 3010} {"train_loss": -25.13844108581543, "global_step": 249860, "epoch": 3010} {"train_loss": -25.012475967407227, "global_step": 249861, "epoch": 3010} {"train_loss": -24.644411087036133, "global_step": 249862, "epoch": 3010} {"train_loss": -25.223325729370117, "global_step": 249863, "epoch": 3010} {"train_loss": -24.76949119567871, "global_step": 249864, "epoch": 3010} {"train_loss": -24.852964401245117, "global_step": 249865, "epoch": 3010} {"train_loss": -24.878461837768555, "global_step": 249866, "epoch": 3010} {"train_loss": -24.80425453186035, "global_step": 249867, "epoch": 3010} {"train_loss": -24.82259178161621, "global_step": 249868, "epoch": 3010} {"train_loss": -25.388547897338867, "global_step": 249869, "epoch": 3010} {"train_loss": -24.870882034301758, "global_step": 249870, "epoch": 3010} {"train_loss": -24.984516143798828, "global_step": 249871, "epoch": 3010} {"train_loss": -24.96270751953125, "global_step": 249872, "epoch": 3010} {"train_loss": -24.777257919311523, "global_step": 249873, "epoch": 3010} {"train_loss": -25.016149520874023, "global_step": 249874, "epoch": 3010} {"train_loss": -24.773666381835938, "global_step": 249875, "epoch": 3010} {"train_loss": -24.9531192779541, "global_step": 249876, "epoch": 3010} {"train_loss": -24.9508113861084, "global_step": 249877, "epoch": 3010} {"train_loss": -25.085615158081055, "global_step": 249878, "epoch": 3010} {"train_loss": -24.908864974975586, "global_step": 249879, "epoch": 3010} {"train_loss": -24.67207145690918, "global_step": 249880, "epoch": 3010} {"train_loss": -25.066131591796875, "global_step": 249881, "epoch": 3010} {"train_loss": -24.895782470703125, "global_step": 249882, "epoch": 3010} {"train_loss": -25.16397476196289, "global_step": 249883, "epoch": 3010} {"train_loss": -25.033981323242188, "global_step": 249884, "epoch": 3010} {"train_loss": -24.889911651611328, "global_step": 249885, "epoch": 3010} {"train_loss": -25.266633987426758, "global_step": 249886, "epoch": 3010} {"train_loss": -25.172136306762695, "global_step": 249887, "epoch": 3010} {"train_loss": -24.643783569335938, "global_step": 249888, "epoch": 3010} {"train_loss": -25.026870727539062, "global_step": 249889, "epoch": 3010} {"train_loss": -25.2855167388916, "global_step": 249890, "epoch": 3010} {"train_loss": -25.278217315673828, "global_step": 249891, "epoch": 3010} {"train_loss": -25.02756118774414, "global_step": 249892, "epoch": 3010} {"train_loss": -25.1054744720459, "global_step": 249893, "epoch": 3010} {"train_loss": -25.388031005859375, "global_step": 249894, "epoch": 3010} {"train_loss": -25.196779251098633, "global_step": 249895, "epoch": 3010} {"train_loss": -25.47002410888672, "global_step": 249896, "epoch": 3010} {"train_loss": -25.3189754486084, "global_step": 249897, "epoch": 3010} {"train_loss": -25.035770416259766, "global_step": 249898, "epoch": 3010} {"train_loss": -25.145645141601562, "global_step": 249899, "epoch": 3010} {"train_loss": -25.36741828918457, "global_step": 249900, "epoch": 3010} {"train_loss": -25.19964599609375, "global_step": 249901, "epoch": 3010} {"train_loss": -25.322790145874023, "global_step": 249902, "epoch": 3010} {"train_loss": -24.970754623413086, "global_step": 249903, "epoch": 3010} {"train_loss": -25.1795711517334, "global_step": 249904, "epoch": 3010} {"train_loss": -25.531538009643555, "global_step": 249905, "epoch": 3010} {"train_loss": -25.010622024536133, "global_step": 249906, "epoch": 3010} {"train_loss": -24.994903564453125, "global_step": 249907, "epoch": 3010} {"train_loss": -24.802515029907227, "global_step": 249908, "epoch": 3010} {"train_loss": -25.01747703552246, "global_step": 249909, "epoch": 3010} {"train_loss": -24.963422775268555, "global_step": 249910, "epoch": 3010} {"train_loss": -24.971446990966797, "global_step": 249911, "epoch": 3010} {"train_loss": -24.88198919181364, "global_step": 249912, "epoch": 3010, "val_loss": 6817260.0} {"train_loss": -24.56976890563965, "global_step": 249913, "epoch": 3011} {"train_loss": -24.06256675720215, "global_step": 249914, "epoch": 3011} {"train_loss": -24.593477249145508, "global_step": 249915, "epoch": 3011} {"train_loss": -24.374313354492188, "global_step": 249916, "epoch": 3011} {"train_loss": -24.67937660217285, "global_step": 249917, "epoch": 3011} {"train_loss": -24.70962905883789, "global_step": 249918, "epoch": 3011} {"train_loss": -24.359148025512695, "global_step": 249919, "epoch": 3011} {"train_loss": -24.626977920532227, "global_step": 249920, "epoch": 3011} {"train_loss": -24.56900405883789, "global_step": 249921, "epoch": 3011} {"train_loss": -24.280393600463867, "global_step": 249922, "epoch": 3011} {"train_loss": -24.94207191467285, "global_step": 249923, "epoch": 3011} {"train_loss": -24.801803588867188, "global_step": 249924, "epoch": 3011} {"train_loss": -24.724889755249023, "global_step": 249925, "epoch": 3011} {"train_loss": -24.441415786743164, "global_step": 249926, "epoch": 3011} {"train_loss": -25.0310115814209, "global_step": 249927, "epoch": 3011} {"train_loss": -24.662588119506836, "global_step": 249928, "epoch": 3011} {"train_loss": -24.410282135009766, "global_step": 249929, "epoch": 3011} {"train_loss": -24.874225616455078, "global_step": 249930, "epoch": 3011} {"train_loss": -24.59859848022461, "global_step": 249931, "epoch": 3011} {"train_loss": -24.71135139465332, "global_step": 249932, "epoch": 3011} {"train_loss": -24.86121940612793, "global_step": 249933, "epoch": 3011} {"train_loss": -24.9502010345459, "global_step": 249934, "epoch": 3011} {"train_loss": -25.054994583129883, "global_step": 249935, "epoch": 3011} {"train_loss": -24.675800323486328, "global_step": 249936, "epoch": 3011} {"train_loss": -24.99538803100586, "global_step": 249937, "epoch": 3011} {"train_loss": -24.657455444335938, "global_step": 249938, "epoch": 3011} {"train_loss": -24.864933013916016, "global_step": 249939, "epoch": 3011} {"train_loss": -24.559186935424805, "global_step": 249940, "epoch": 3011} {"train_loss": -24.930051803588867, "global_step": 249941, "epoch": 3011} {"train_loss": -24.82294273376465, "global_step": 249942, "epoch": 3011} {"train_loss": -25.12104606628418, "global_step": 249943, "epoch": 3011} {"train_loss": -25.14299964904785, "global_step": 249944, "epoch": 3011} {"train_loss": -24.600147247314453, "global_step": 249945, "epoch": 3011} {"train_loss": -25.137344360351562, "global_step": 249946, "epoch": 3011} {"train_loss": -25.125194549560547, "global_step": 249947, "epoch": 3011} {"train_loss": -25.150217056274414, "global_step": 249948, "epoch": 3011} {"train_loss": -24.663053512573242, "global_step": 249949, "epoch": 3011} {"train_loss": -25.157133102416992, "global_step": 249950, "epoch": 3011} {"train_loss": -25.12588119506836, "global_step": 249951, "epoch": 3011} {"train_loss": -25.087888717651367, "global_step": 249952, "epoch": 3011} {"train_loss": -25.16566276550293, "global_step": 249953, "epoch": 3011} {"train_loss": -25.059467315673828, "global_step": 249954, "epoch": 3011} {"train_loss": -25.209482192993164, "global_step": 249955, "epoch": 3011} {"train_loss": -25.25939178466797, "global_step": 249956, "epoch": 3011} {"train_loss": -25.122827529907227, "global_step": 249957, "epoch": 3011} {"train_loss": -25.1143798828125, "global_step": 249958, "epoch": 3011} {"train_loss": -25.07591438293457, "global_step": 249959, "epoch": 3011} {"train_loss": -25.214200973510742, "global_step": 249960, "epoch": 3011} {"train_loss": -24.815820693969727, "global_step": 249961, "epoch": 3011} {"train_loss": -25.399221420288086, "global_step": 249962, "epoch": 3011} {"train_loss": -25.073627471923828, "global_step": 249963, "epoch": 3011} {"train_loss": -25.168277740478516, "global_step": 249964, "epoch": 3011} {"train_loss": -24.691617965698242, "global_step": 249965, "epoch": 3011} {"train_loss": -25.028553009033203, "global_step": 249966, "epoch": 3011} {"train_loss": -25.094636917114258, "global_step": 249967, "epoch": 3011} {"train_loss": -25.26541519165039, "global_step": 249968, "epoch": 3011} {"train_loss": -24.96571159362793, "global_step": 249969, "epoch": 3011} {"train_loss": -25.112112045288086, "global_step": 249970, "epoch": 3011} {"train_loss": -25.310312271118164, "global_step": 249971, "epoch": 3011} {"train_loss": -25.244901657104492, "global_step": 249972, "epoch": 3011} {"train_loss": -24.904630661010742, "global_step": 249973, "epoch": 3011} {"train_loss": -25.0245361328125, "global_step": 249974, "epoch": 3011} {"train_loss": -24.35682487487793, "global_step": 249975, "epoch": 3011} {"train_loss": -25.13104248046875, "global_step": 249976, "epoch": 3011} {"train_loss": -25.12318229675293, "global_step": 249977, "epoch": 3011} {"train_loss": -24.666494369506836, "global_step": 249978, "epoch": 3011} {"train_loss": -24.724210739135742, "global_step": 249979, "epoch": 3011} {"train_loss": -24.930967330932617, "global_step": 249980, "epoch": 3011} {"train_loss": -25.336580276489258, "global_step": 249981, "epoch": 3011} {"train_loss": -25.004663467407227, "global_step": 249982, "epoch": 3011} {"train_loss": -25.071054458618164, "global_step": 249983, "epoch": 3011} {"train_loss": -24.6998291015625, "global_step": 249984, "epoch": 3011} {"train_loss": -25.131162643432617, "global_step": 249985, "epoch": 3011} {"train_loss": -25.09303855895996, "global_step": 249986, "epoch": 3011} {"train_loss": -25.353225708007812, "global_step": 249987, "epoch": 3011} {"train_loss": -24.96870231628418, "global_step": 249988, "epoch": 3011} {"train_loss": -25.047094345092773, "global_step": 249989, "epoch": 3011} {"train_loss": -25.11176109313965, "global_step": 249990, "epoch": 3011} {"train_loss": -24.99225425720215, "global_step": 249991, "epoch": 3011} {"train_loss": -24.76500701904297, "global_step": 249992, "epoch": 3011} {"train_loss": -24.874649047851562, "global_step": 249993, "epoch": 3011} {"train_loss": -25.09921646118164, "global_step": 249994, "epoch": 3011} {"train_loss": -24.901865602975867, "global_step": 249995, "epoch": 3011, "val_loss": 6777878.0} {"train_loss": -24.91010856628418, "global_step": 249996, "epoch": 3012} {"train_loss": -25.001266479492188, "global_step": 249997, "epoch": 3012} {"train_loss": -24.9725284576416, "global_step": 249998, "epoch": 3012} {"train_loss": -24.726041793823242, "global_step": 249999, "epoch": 3012} {"train_loss": -24.66887855529785, "global_step": 250000, "epoch": 3012} {"train_loss": -24.84449577331543, "global_step": 250001, "epoch": 3012} {"train_loss": -24.89814567565918, "global_step": 250002, "epoch": 3012} {"train_loss": -24.701101303100586, "global_step": 250003, "epoch": 3012} {"train_loss": -24.90726089477539, "global_step": 250004, "epoch": 3012} {"train_loss": -25.09088706970215, "global_step": 250005, "epoch": 3012} {"train_loss": -24.921768188476562, "global_step": 250006, "epoch": 3012} {"train_loss": -24.969751358032227, "global_step": 250007, "epoch": 3012} {"train_loss": -24.644865036010742, "global_step": 250008, "epoch": 3012} {"train_loss": -24.54122543334961, "global_step": 250009, "epoch": 3012} {"train_loss": -24.566848754882812, "global_step": 250010, "epoch": 3012} {"train_loss": -25.348440170288086, "global_step": 250011, "epoch": 3012} {"train_loss": -25.248136520385742, "global_step": 250012, "epoch": 3012} {"train_loss": -25.113086700439453, "global_step": 250013, "epoch": 3012} {"train_loss": -24.875553131103516, "global_step": 250014, "epoch": 3012} {"train_loss": -25.23243522644043, "global_step": 250015, "epoch": 3012} {"train_loss": -25.23933219909668, "global_step": 250016, "epoch": 3012} {"train_loss": -24.839048385620117, "global_step": 250017, "epoch": 3012} {"train_loss": -25.084218978881836, "global_step": 250018, "epoch": 3012} {"train_loss": -24.998645782470703, "global_step": 250019, "epoch": 3012} {"train_loss": -25.517066955566406, "global_step": 250020, "epoch": 3012} {"train_loss": -24.86628532409668, "global_step": 250021, "epoch": 3012} {"train_loss": -25.228073120117188, "global_step": 250022, "epoch": 3012} {"train_loss": -25.173202514648438, "global_step": 250023, "epoch": 3012} {"train_loss": -25.24100685119629, "global_step": 250024, "epoch": 3012} {"train_loss": -25.553531646728516, "global_step": 250025, "epoch": 3012} {"train_loss": -25.072132110595703, "global_step": 250026, "epoch": 3012} {"train_loss": -24.86895179748535, "global_step": 250027, "epoch": 3012} {"train_loss": -25.16172218322754, "global_step": 250028, "epoch": 3012} {"train_loss": -24.968835830688477, "global_step": 250029, "epoch": 3012} {"train_loss": -24.81195640563965, "global_step": 250030, "epoch": 3012} {"train_loss": -24.24384880065918, "global_step": 250031, "epoch": 3012} {"train_loss": -25.026519775390625, "global_step": 250032, "epoch": 3012} {"train_loss": -24.84978675842285, "global_step": 250033, "epoch": 3012} {"train_loss": -24.98310089111328, "global_step": 250034, "epoch": 3012} {"train_loss": -25.1785945892334, "global_step": 250035, "epoch": 3012} {"train_loss": -25.071008682250977, "global_step": 250036, "epoch": 3012} {"train_loss": -24.961111068725586, "global_step": 250037, "epoch": 3012} {"train_loss": -24.99591827392578, "global_step": 250038, "epoch": 3012} {"train_loss": -25.003009796142578, "global_step": 250039, "epoch": 3012} {"train_loss": -24.807952880859375, "global_step": 250040, "epoch": 3012} {"train_loss": -24.667579650878906, "global_step": 250041, "epoch": 3012} {"train_loss": -24.924488067626953, "global_step": 250042, "epoch": 3012} {"train_loss": -24.896865844726562, "global_step": 250043, "epoch": 3012} {"train_loss": -24.925731658935547, "global_step": 250044, "epoch": 3012} {"train_loss": -25.051158905029297, "global_step": 250045, "epoch": 3012} {"train_loss": -25.134300231933594, "global_step": 250046, "epoch": 3012} {"train_loss": -24.965229034423828, "global_step": 250047, "epoch": 3012} {"train_loss": -24.949005126953125, "global_step": 250048, "epoch": 3012} {"train_loss": -25.189294815063477, "global_step": 250049, "epoch": 3012} {"train_loss": -25.206857681274414, "global_step": 250050, "epoch": 3012} {"train_loss": -25.112089157104492, "global_step": 250051, "epoch": 3012} {"train_loss": -24.393001556396484, "global_step": 250052, "epoch": 3012} {"train_loss": -24.964414596557617, "global_step": 250053, "epoch": 3012} {"train_loss": -24.984512329101562, "global_step": 250054, "epoch": 3012} {"train_loss": -25.073848724365234, "global_step": 250055, "epoch": 3012} {"train_loss": -25.020797729492188, "global_step": 250056, "epoch": 3012} {"train_loss": -25.716552734375, "global_step": 250057, "epoch": 3012} {"train_loss": -24.908994674682617, "global_step": 250058, "epoch": 3012} {"train_loss": -25.362472534179688, "global_step": 250059, "epoch": 3012} {"train_loss": -25.29475975036621, "global_step": 250060, "epoch": 3012} {"train_loss": -24.878644943237305, "global_step": 250061, "epoch": 3012} {"train_loss": -25.11481285095215, "global_step": 250062, "epoch": 3012} {"train_loss": -25.07378578186035, "global_step": 250063, "epoch": 3012} {"train_loss": -25.459657669067383, "global_step": 250064, "epoch": 3012} {"train_loss": -25.12056541442871, "global_step": 250065, "epoch": 3012} {"train_loss": -25.059019088745117, "global_step": 250066, "epoch": 3012} {"train_loss": -25.0653133392334, "global_step": 250067, "epoch": 3012} {"train_loss": -25.314599990844727, "global_step": 250068, "epoch": 3012} {"train_loss": -24.723175048828125, "global_step": 250069, "epoch": 3012} {"train_loss": -25.038320541381836, "global_step": 250070, "epoch": 3012} {"train_loss": -25.4266300201416, "global_step": 250071, "epoch": 3012} {"train_loss": -24.85663414001465, "global_step": 250072, "epoch": 3012} {"train_loss": -25.197019577026367, "global_step": 250073, "epoch": 3012} {"train_loss": -25.01374626159668, "global_step": 250074, "epoch": 3012} {"train_loss": -24.73878288269043, "global_step": 250075, "epoch": 3012} {"train_loss": -25.39298439025879, "global_step": 250076, "epoch": 3012} {"train_loss": -25.154401779174805, "global_step": 250077, "epoch": 3012} {"train_loss": -25.01742098704878, "global_step": 250078, "epoch": 3012, "val_loss": 6825830.0} {"train_loss": -24.410036087036133, "global_step": 250079, "epoch": 3013} {"train_loss": -24.847885131835938, "global_step": 250080, "epoch": 3013} {"train_loss": -24.820770263671875, "global_step": 250081, "epoch": 3013} {"train_loss": -24.258981704711914, "global_step": 250082, "epoch": 3013} {"train_loss": -25.02988052368164, "global_step": 250083, "epoch": 3013} {"train_loss": -24.130680084228516, "global_step": 250084, "epoch": 3013} {"train_loss": -24.233495712280273, "global_step": 250085, "epoch": 3013} {"train_loss": -24.679428100585938, "global_step": 250086, "epoch": 3013} {"train_loss": -24.816326141357422, "global_step": 250087, "epoch": 3013} {"train_loss": -24.658695220947266, "global_step": 250088, "epoch": 3013} {"train_loss": -24.745641708374023, "global_step": 250089, "epoch": 3013} {"train_loss": -25.02337646484375, "global_step": 250090, "epoch": 3013} {"train_loss": -24.8531551361084, "global_step": 250091, "epoch": 3013} {"train_loss": -25.14492416381836, "global_step": 250092, "epoch": 3013} {"train_loss": -24.942752838134766, "global_step": 250093, "epoch": 3013} {"train_loss": -25.133466720581055, "global_step": 250094, "epoch": 3013} {"train_loss": -24.715490341186523, "global_step": 250095, "epoch": 3013} {"train_loss": -25.260007858276367, "global_step": 250096, "epoch": 3013} {"train_loss": -25.08217430114746, "global_step": 250097, "epoch": 3013} {"train_loss": -24.9769229888916, "global_step": 250098, "epoch": 3013} {"train_loss": -24.672277450561523, "global_step": 250099, "epoch": 3013} {"train_loss": -24.7841854095459, "global_step": 250100, "epoch": 3013} {"train_loss": -24.631711959838867, "global_step": 250101, "epoch": 3013} {"train_loss": -25.225313186645508, "global_step": 250102, "epoch": 3013} {"train_loss": -24.88482093811035, "global_step": 250103, "epoch": 3013} {"train_loss": -24.871015548706055, "global_step": 250104, "epoch": 3013} {"train_loss": -24.956579208374023, "global_step": 250105, "epoch": 3013} {"train_loss": -24.92177391052246, "global_step": 250106, "epoch": 3013} {"train_loss": -24.803346633911133, "global_step": 250107, "epoch": 3013} {"train_loss": -25.005203247070312, "global_step": 250108, "epoch": 3013} {"train_loss": -25.16205406188965, "global_step": 250109, "epoch": 3013} {"train_loss": -25.263782501220703, "global_step": 250110, "epoch": 3013} {"train_loss": -25.085161209106445, "global_step": 250111, "epoch": 3013} {"train_loss": -25.08106231689453, "global_step": 250112, "epoch": 3013} {"train_loss": -24.701292037963867, "global_step": 250113, "epoch": 3013} {"train_loss": -24.573068618774414, "global_step": 250114, "epoch": 3013} {"train_loss": -24.53687858581543, "global_step": 250115, "epoch": 3013} {"train_loss": -24.93472671508789, "global_step": 250116, "epoch": 3013} {"train_loss": -24.594486236572266, "global_step": 250117, "epoch": 3013} {"train_loss": -24.831941604614258, "global_step": 250118, "epoch": 3013} {"train_loss": -24.934804916381836, "global_step": 250119, "epoch": 3013} {"train_loss": -24.539094924926758, "global_step": 250120, "epoch": 3013} {"train_loss": -24.436758041381836, "global_step": 250121, "epoch": 3013} {"train_loss": -24.9404354095459, "global_step": 250122, "epoch": 3013} {"train_loss": -24.869565963745117, "global_step": 250123, "epoch": 3013} {"train_loss": -24.474075317382812, "global_step": 250124, "epoch": 3013} {"train_loss": -24.773916244506836, "global_step": 250125, "epoch": 3013} {"train_loss": -25.054187774658203, "global_step": 250126, "epoch": 3013} {"train_loss": -25.018503189086914, "global_step": 250127, "epoch": 3013} {"train_loss": -24.680978775024414, "global_step": 250128, "epoch": 3013} {"train_loss": -24.963016510009766, "global_step": 250129, "epoch": 3013} {"train_loss": -25.137065887451172, "global_step": 250130, "epoch": 3013} {"train_loss": -24.92476463317871, "global_step": 250131, "epoch": 3013} {"train_loss": -25.436975479125977, "global_step": 250132, "epoch": 3013} {"train_loss": -25.156192779541016, "global_step": 250133, "epoch": 3013} {"train_loss": -24.750492095947266, "global_step": 250134, "epoch": 3013} {"train_loss": -25.022680282592773, "global_step": 250135, "epoch": 3013} {"train_loss": -25.006338119506836, "global_step": 250136, "epoch": 3013} {"train_loss": -24.614151000976562, "global_step": 250137, "epoch": 3013} {"train_loss": -24.947656631469727, "global_step": 250138, "epoch": 3013} {"train_loss": -25.016401290893555, "global_step": 250139, "epoch": 3013} {"train_loss": -25.10638999938965, "global_step": 250140, "epoch": 3013} {"train_loss": -25.209930419921875, "global_step": 250141, "epoch": 3013} {"train_loss": -25.433202743530273, "global_step": 250142, "epoch": 3013} {"train_loss": -24.940610885620117, "global_step": 250143, "epoch": 3013} {"train_loss": -25.268484115600586, "global_step": 250144, "epoch": 3013} {"train_loss": -25.21489715576172, "global_step": 250145, "epoch": 3013} {"train_loss": -25.538389205932617, "global_step": 250146, "epoch": 3013} {"train_loss": -24.99661636352539, "global_step": 250147, "epoch": 3013} {"train_loss": -25.078571319580078, "global_step": 250148, "epoch": 3013} {"train_loss": -24.74873161315918, "global_step": 250149, "epoch": 3013} {"train_loss": -25.158920288085938, "global_step": 250150, "epoch": 3013} {"train_loss": -24.94600486755371, "global_step": 250151, "epoch": 3013} {"train_loss": -25.350372314453125, "global_step": 250152, "epoch": 3013} {"train_loss": -25.219074249267578, "global_step": 250153, "epoch": 3013} {"train_loss": -24.90589714050293, "global_step": 250154, "epoch": 3013} {"train_loss": -24.620805740356445, "global_step": 250155, "epoch": 3013} {"train_loss": -25.23891258239746, "global_step": 250156, "epoch": 3013} {"train_loss": -25.14139175415039, "global_step": 250157, "epoch": 3013} {"train_loss": -25.158903121948242, "global_step": 250158, "epoch": 3013} {"train_loss": -25.074951171875, "global_step": 250159, "epoch": 3013} {"train_loss": -24.722238540649414, "global_step": 250160, "epoch": 3013} {"train_loss": -24.91300863243011, "global_step": 250161, "epoch": 3013, "val_loss": 6831331.0} {"train_loss": -24.535009384155273, "global_step": 250162, "epoch": 3014} {"train_loss": -24.369510650634766, "global_step": 250163, "epoch": 3014} {"train_loss": -24.725847244262695, "global_step": 250164, "epoch": 3014} {"train_loss": -24.967870712280273, "global_step": 250165, "epoch": 3014} {"train_loss": -24.611841201782227, "global_step": 250166, "epoch": 3014} {"train_loss": -24.58085823059082, "global_step": 250167, "epoch": 3014} {"train_loss": -24.329084396362305, "global_step": 250168, "epoch": 3014} {"train_loss": -24.727840423583984, "global_step": 250169, "epoch": 3014} {"train_loss": -24.612207412719727, "global_step": 250170, "epoch": 3014} {"train_loss": -24.56041145324707, "global_step": 250171, "epoch": 3014} {"train_loss": -25.037023544311523, "global_step": 250172, "epoch": 3014} {"train_loss": -24.634254455566406, "global_step": 250173, "epoch": 3014} {"train_loss": -24.806228637695312, "global_step": 250174, "epoch": 3014} {"train_loss": -24.672353744506836, "global_step": 250175, "epoch": 3014} {"train_loss": -24.65007972717285, "global_step": 250176, "epoch": 3014} {"train_loss": -24.956289291381836, "global_step": 250177, "epoch": 3014} {"train_loss": -24.95101547241211, "global_step": 250178, "epoch": 3014} {"train_loss": -25.010534286499023, "global_step": 250179, "epoch": 3014} {"train_loss": -24.735265731811523, "global_step": 250180, "epoch": 3014} {"train_loss": -24.571264266967773, "global_step": 250181, "epoch": 3014} {"train_loss": -25.186431884765625, "global_step": 250182, "epoch": 3014} {"train_loss": -24.587757110595703, "global_step": 250183, "epoch": 3014} {"train_loss": -25.111434936523438, "global_step": 250184, "epoch": 3014} {"train_loss": -24.9030818939209, "global_step": 250185, "epoch": 3014} {"train_loss": -25.02654457092285, "global_step": 250186, "epoch": 3014} {"train_loss": -24.76776695251465, "global_step": 250187, "epoch": 3014} {"train_loss": -25.05251121520996, "global_step": 250188, "epoch": 3014} {"train_loss": -24.94061851501465, "global_step": 250189, "epoch": 3014} {"train_loss": -24.83820915222168, "global_step": 250190, "epoch": 3014} {"train_loss": -25.1173038482666, "global_step": 250191, "epoch": 3014} {"train_loss": -24.89794921875, "global_step": 250192, "epoch": 3014} {"train_loss": -25.073841094970703, "global_step": 250193, "epoch": 3014} {"train_loss": -25.01874351501465, "global_step": 250194, "epoch": 3014} {"train_loss": -25.1585693359375, "global_step": 250195, "epoch": 3014} {"train_loss": -25.444944381713867, "global_step": 250196, "epoch": 3014} {"train_loss": -24.870573043823242, "global_step": 250197, "epoch": 3014} {"train_loss": -24.94900894165039, "global_step": 250198, "epoch": 3014} {"train_loss": -25.226476669311523, "global_step": 250199, "epoch": 3014} {"train_loss": -25.347455978393555, "global_step": 250200, "epoch": 3014} {"train_loss": -25.464691162109375, "global_step": 250201, "epoch": 3014} {"train_loss": -25.129140853881836, "global_step": 250202, "epoch": 3014} {"train_loss": -25.158994674682617, "global_step": 250203, "epoch": 3014} {"train_loss": -25.321014404296875, "global_step": 250204, "epoch": 3014} {"train_loss": -25.151294708251953, "global_step": 250205, "epoch": 3014} {"train_loss": -25.058521270751953, "global_step": 250206, "epoch": 3014} {"train_loss": -25.19061851501465, "global_step": 250207, "epoch": 3014} {"train_loss": -25.080385208129883, "global_step": 250208, "epoch": 3014} {"train_loss": -25.050556182861328, "global_step": 250209, "epoch": 3014} {"train_loss": -24.836074829101562, "global_step": 250210, "epoch": 3014} {"train_loss": -25.484527587890625, "global_step": 250211, "epoch": 3014} {"train_loss": -25.32356071472168, "global_step": 250212, "epoch": 3014} {"train_loss": -25.145265579223633, "global_step": 250213, "epoch": 3014} {"train_loss": -24.435436248779297, "global_step": 250214, "epoch": 3014} {"train_loss": -24.97458839416504, "global_step": 250215, "epoch": 3014} {"train_loss": -25.541723251342773, "global_step": 250216, "epoch": 3014} {"train_loss": -25.48752212524414, "global_step": 250217, "epoch": 3014} {"train_loss": -24.68077278137207, "global_step": 250218, "epoch": 3014} {"train_loss": -25.44453239440918, "global_step": 250219, "epoch": 3014} {"train_loss": -24.95598793029785, "global_step": 250220, "epoch": 3014} {"train_loss": -24.516111373901367, "global_step": 250221, "epoch": 3014} {"train_loss": -24.502410888671875, "global_step": 250222, "epoch": 3014} {"train_loss": -24.41048240661621, "global_step": 250223, "epoch": 3014} {"train_loss": -24.691444396972656, "global_step": 250224, "epoch": 3014} {"train_loss": -24.640439987182617, "global_step": 250225, "epoch": 3014} {"train_loss": -24.385343551635742, "global_step": 250226, "epoch": 3014} {"train_loss": -24.6717586517334, "global_step": 250227, "epoch": 3014} {"train_loss": -24.460193634033203, "global_step": 250228, "epoch": 3014} {"train_loss": -24.991806030273438, "global_step": 250229, "epoch": 3014} {"train_loss": -24.454120635986328, "global_step": 250230, "epoch": 3014} {"train_loss": -24.1965389251709, "global_step": 250231, "epoch": 3014} {"train_loss": -25.015451431274414, "global_step": 250232, "epoch": 3014} {"train_loss": -24.993701934814453, "global_step": 250233, "epoch": 3014} {"train_loss": -25.05354118347168, "global_step": 250234, "epoch": 3014} {"train_loss": -24.70492172241211, "global_step": 250235, "epoch": 3014} {"train_loss": -24.96828842163086, "global_step": 250236, "epoch": 3014} {"train_loss": -25.022422790527344, "global_step": 250237, "epoch": 3014} {"train_loss": -24.62188148498535, "global_step": 250238, "epoch": 3014} {"train_loss": -24.71150779724121, "global_step": 250239, "epoch": 3014} {"train_loss": -24.629560470581055, "global_step": 250240, "epoch": 3014} {"train_loss": -25.114383697509766, "global_step": 250241, "epoch": 3014} {"train_loss": -24.576494216918945, "global_step": 250242, "epoch": 3014} {"train_loss": -24.917377471923828, "global_step": 250243, "epoch": 3014} {"train_loss": -24.91627725348415, "global_step": 250244, "epoch": 3014, "val_loss": 6926002.0} {"train_loss": -24.414793014526367, "global_step": 250245, "epoch": 3015} {"train_loss": -24.75267791748047, "global_step": 250246, "epoch": 3015} {"train_loss": -24.394580841064453, "global_step": 250247, "epoch": 3015} {"train_loss": -24.781875610351562, "global_step": 250248, "epoch": 3015} {"train_loss": -24.725587844848633, "global_step": 250249, "epoch": 3015} {"train_loss": -25.08394432067871, "global_step": 250250, "epoch": 3015} {"train_loss": -24.894479751586914, "global_step": 250251, "epoch": 3015} {"train_loss": -25.290380477905273, "global_step": 250252, "epoch": 3015} {"train_loss": -25.06866455078125, "global_step": 250253, "epoch": 3015} {"train_loss": -24.827768325805664, "global_step": 250254, "epoch": 3015} {"train_loss": -25.097692489624023, "global_step": 250255, "epoch": 3015} {"train_loss": -24.976337432861328, "global_step": 250256, "epoch": 3015} {"train_loss": -24.78563117980957, "global_step": 250257, "epoch": 3015} {"train_loss": -24.7021541595459, "global_step": 250258, "epoch": 3015} {"train_loss": -25.15744972229004, "global_step": 250259, "epoch": 3015} {"train_loss": -24.771799087524414, "global_step": 250260, "epoch": 3015} {"train_loss": -25.249074935913086, "global_step": 250261, "epoch": 3015} {"train_loss": -24.778470993041992, "global_step": 250262, "epoch": 3015} {"train_loss": -25.314088821411133, "global_step": 250263, "epoch": 3015} {"train_loss": -25.062864303588867, "global_step": 250264, "epoch": 3015} {"train_loss": -24.936182022094727, "global_step": 250265, "epoch": 3015} {"train_loss": -24.641965866088867, "global_step": 250266, "epoch": 3015} {"train_loss": -25.301298141479492, "global_step": 250267, "epoch": 3015} {"train_loss": -25.295974731445312, "global_step": 250268, "epoch": 3015} {"train_loss": -24.882265090942383, "global_step": 250269, "epoch": 3015} {"train_loss": -24.797061920166016, "global_step": 250270, "epoch": 3015} {"train_loss": -24.789949417114258, "global_step": 250271, "epoch": 3015} {"train_loss": -25.243770599365234, "global_step": 250272, "epoch": 3015} {"train_loss": -24.80274772644043, "global_step": 250273, "epoch": 3015} {"train_loss": -25.095388412475586, "global_step": 250274, "epoch": 3015} {"train_loss": -24.909143447875977, "global_step": 250275, "epoch": 3015} {"train_loss": -25.128997802734375, "global_step": 250276, "epoch": 3015} {"train_loss": -25.176984786987305, "global_step": 250277, "epoch": 3015} {"train_loss": -24.72087287902832, "global_step": 250278, "epoch": 3015} {"train_loss": -25.050596237182617, "global_step": 250279, "epoch": 3015} {"train_loss": -24.749176025390625, "global_step": 250280, "epoch": 3015} {"train_loss": -25.35140037536621, "global_step": 250281, "epoch": 3015} {"train_loss": -25.33030891418457, "global_step": 250282, "epoch": 3015} {"train_loss": -25.136280059814453, "global_step": 250283, "epoch": 3015} {"train_loss": -25.053056716918945, "global_step": 250284, "epoch": 3015} {"train_loss": -25.025407791137695, "global_step": 250285, "epoch": 3015} {"train_loss": -25.077489852905273, "global_step": 250286, "epoch": 3015} {"train_loss": -25.251632690429688, "global_step": 250287, "epoch": 3015} {"train_loss": -25.243574142456055, "global_step": 250288, "epoch": 3015} {"train_loss": -25.146268844604492, "global_step": 250289, "epoch": 3015} {"train_loss": -24.766708374023438, "global_step": 250290, "epoch": 3015} {"train_loss": -25.099712371826172, "global_step": 250291, "epoch": 3015} {"train_loss": -25.087369918823242, "global_step": 250292, "epoch": 3015} {"train_loss": -24.849124908447266, "global_step": 250293, "epoch": 3015} {"train_loss": -25.222158432006836, "global_step": 250294, "epoch": 3015} {"train_loss": -24.949634552001953, "global_step": 250295, "epoch": 3015} {"train_loss": -24.721891403198242, "global_step": 250296, "epoch": 3015} {"train_loss": -24.97089195251465, "global_step": 250297, "epoch": 3015} {"train_loss": -24.8796443939209, "global_step": 250298, "epoch": 3015} {"train_loss": -24.979032516479492, "global_step": 250299, "epoch": 3015} {"train_loss": -25.077199935913086, "global_step": 250300, "epoch": 3015} {"train_loss": -25.219846725463867, "global_step": 250301, "epoch": 3015} {"train_loss": -24.879919052124023, "global_step": 250302, "epoch": 3015} {"train_loss": -25.141942977905273, "global_step": 250303, "epoch": 3015} {"train_loss": -25.605955123901367, "global_step": 250304, "epoch": 3015} {"train_loss": -24.663339614868164, "global_step": 250305, "epoch": 3015} {"train_loss": -25.157102584838867, "global_step": 250306, "epoch": 3015} {"train_loss": -25.226783752441406, "global_step": 250307, "epoch": 3015} {"train_loss": -24.74942970275879, "global_step": 250308, "epoch": 3015} {"train_loss": -24.822402954101562, "global_step": 250309, "epoch": 3015} {"train_loss": -25.185216903686523, "global_step": 250310, "epoch": 3015} {"train_loss": -24.509023666381836, "global_step": 250311, "epoch": 3015} {"train_loss": -25.357343673706055, "global_step": 250312, "epoch": 3015} {"train_loss": -25.258609771728516, "global_step": 250313, "epoch": 3015} {"train_loss": -24.78536033630371, "global_step": 250314, "epoch": 3015} {"train_loss": -25.06577491760254, "global_step": 250315, "epoch": 3015} {"train_loss": -25.314504623413086, "global_step": 250316, "epoch": 3015} {"train_loss": -24.87705421447754, "global_step": 250317, "epoch": 3015} {"train_loss": -25.167070388793945, "global_step": 250318, "epoch": 3015} {"train_loss": -24.990476608276367, "global_step": 250319, "epoch": 3015} {"train_loss": -25.336891174316406, "global_step": 250320, "epoch": 3015} {"train_loss": -25.635913848876953, "global_step": 250321, "epoch": 3015} {"train_loss": -24.91239356994629, "global_step": 250322, "epoch": 3015} {"train_loss": -25.026700973510742, "global_step": 250323, "epoch": 3015} {"train_loss": -24.914464950561523, "global_step": 250324, "epoch": 3015} {"train_loss": -24.941251754760742, "global_step": 250325, "epoch": 3015} {"train_loss": -25.517362594604492, "global_step": 250326, "epoch": 3015} {"train_loss": -24.997683559555604, "global_step": 250327, "epoch": 3015, "val_loss": 6741789.0} {"train_loss": -24.58968734741211, "global_step": 250328, "epoch": 3016} {"train_loss": -24.535356521606445, "global_step": 250329, "epoch": 3016} {"train_loss": -24.814451217651367, "global_step": 250330, "epoch": 3016} {"train_loss": -24.53505516052246, "global_step": 250331, "epoch": 3016} {"train_loss": -24.276901245117188, "global_step": 250332, "epoch": 3016} {"train_loss": -24.806827545166016, "global_step": 250333, "epoch": 3016} {"train_loss": -25.012832641601562, "global_step": 250334, "epoch": 3016} {"train_loss": -25.036617279052734, "global_step": 250335, "epoch": 3016} {"train_loss": -24.375890731811523, "global_step": 250336, "epoch": 3016} {"train_loss": -25.187789916992188, "global_step": 250337, "epoch": 3016} {"train_loss": -24.52333641052246, "global_step": 250338, "epoch": 3016} {"train_loss": -24.761362075805664, "global_step": 250339, "epoch": 3016} {"train_loss": -24.88644790649414, "global_step": 250340, "epoch": 3016} {"train_loss": -24.69162368774414, "global_step": 250341, "epoch": 3016} {"train_loss": -24.785436630249023, "global_step": 250342, "epoch": 3016} {"train_loss": -25.004619598388672, "global_step": 250343, "epoch": 3016} {"train_loss": -24.754573822021484, "global_step": 250344, "epoch": 3016} {"train_loss": -25.040542602539062, "global_step": 250345, "epoch": 3016} {"train_loss": -25.047643661499023, "global_step": 250346, "epoch": 3016} {"train_loss": -24.939573287963867, "global_step": 250347, "epoch": 3016} {"train_loss": -24.96683692932129, "global_step": 250348, "epoch": 3016} {"train_loss": -25.076236724853516, "global_step": 250349, "epoch": 3016} {"train_loss": -24.8325252532959, "global_step": 250350, "epoch": 3016} {"train_loss": -25.03757095336914, "global_step": 250351, "epoch": 3016} {"train_loss": -24.825225830078125, "global_step": 250352, "epoch": 3016} {"train_loss": -24.691404342651367, "global_step": 250353, "epoch": 3016} {"train_loss": -25.102590560913086, "global_step": 250354, "epoch": 3016} {"train_loss": -25.266626358032227, "global_step": 250355, "epoch": 3016} {"train_loss": -25.000762939453125, "global_step": 250356, "epoch": 3016} {"train_loss": -24.951480865478516, "global_step": 250357, "epoch": 3016} {"train_loss": -25.17189598083496, "global_step": 250358, "epoch": 3016} {"train_loss": -24.846221923828125, "global_step": 250359, "epoch": 3016} {"train_loss": -24.901622772216797, "global_step": 250360, "epoch": 3016} {"train_loss": -25.110458374023438, "global_step": 250361, "epoch": 3016} {"train_loss": -24.59791374206543, "global_step": 250362, "epoch": 3016} {"train_loss": -25.25193977355957, "global_step": 250363, "epoch": 3016} {"train_loss": -24.971960067749023, "global_step": 250364, "epoch": 3016} {"train_loss": -24.88823127746582, "global_step": 250365, "epoch": 3016} {"train_loss": -24.966007232666016, "global_step": 250366, "epoch": 3016} {"train_loss": -25.19400978088379, "global_step": 250367, "epoch": 3016} {"train_loss": -25.277023315429688, "global_step": 250368, "epoch": 3016} {"train_loss": -24.898481369018555, "global_step": 250369, "epoch": 3016} {"train_loss": -25.0516414642334, "global_step": 250370, "epoch": 3016} {"train_loss": -25.007078170776367, "global_step": 250371, "epoch": 3016} {"train_loss": -25.20780372619629, "global_step": 250372, "epoch": 3016} {"train_loss": -24.990949630737305, "global_step": 250373, "epoch": 3016} {"train_loss": -25.42232894897461, "global_step": 250374, "epoch": 3016} {"train_loss": -25.239530563354492, "global_step": 250375, "epoch": 3016} {"train_loss": -24.67218589782715, "global_step": 250376, "epoch": 3016} {"train_loss": -25.141164779663086, "global_step": 250377, "epoch": 3016} {"train_loss": -25.011234283447266, "global_step": 250378, "epoch": 3016} {"train_loss": -24.91701889038086, "global_step": 250379, "epoch": 3016} {"train_loss": -24.52953338623047, "global_step": 250380, "epoch": 3016} {"train_loss": -25.099002838134766, "global_step": 250381, "epoch": 3016} {"train_loss": -25.129722595214844, "global_step": 250382, "epoch": 3016} {"train_loss": -24.84429359436035, "global_step": 250383, "epoch": 3016} {"train_loss": -24.793521881103516, "global_step": 250384, "epoch": 3016} {"train_loss": -25.315792083740234, "global_step": 250385, "epoch": 3016} {"train_loss": -25.122589111328125, "global_step": 250386, "epoch": 3016} {"train_loss": -24.815622329711914, "global_step": 250387, "epoch": 3016} {"train_loss": -24.848581314086914, "global_step": 250388, "epoch": 3016} {"train_loss": -25.3023738861084, "global_step": 250389, "epoch": 3016} {"train_loss": -25.503585815429688, "global_step": 250390, "epoch": 3016} {"train_loss": -25.326757431030273, "global_step": 250391, "epoch": 3016} {"train_loss": -24.51121711730957, "global_step": 250392, "epoch": 3016} {"train_loss": -24.971328735351562, "global_step": 250393, "epoch": 3016} {"train_loss": -25.086698532104492, "global_step": 250394, "epoch": 3016} {"train_loss": -25.16986656188965, "global_step": 250395, "epoch": 3016} {"train_loss": -25.424423217773438, "global_step": 250396, "epoch": 3016} {"train_loss": -24.78946304321289, "global_step": 250397, "epoch": 3016} {"train_loss": -24.831018447875977, "global_step": 250398, "epoch": 3016} {"train_loss": -24.895797729492188, "global_step": 250399, "epoch": 3016} {"train_loss": -25.0024356842041, "global_step": 250400, "epoch": 3016} {"train_loss": -25.028440475463867, "global_step": 250401, "epoch": 3016} {"train_loss": -25.250200271606445, "global_step": 250402, "epoch": 3016} {"train_loss": -25.272335052490234, "global_step": 250403, "epoch": 3016} {"train_loss": -24.68821907043457, "global_step": 250404, "epoch": 3016} {"train_loss": -24.849393844604492, "global_step": 250405, "epoch": 3016} {"train_loss": -25.155132293701172, "global_step": 250406, "epoch": 3016} {"train_loss": -24.772708892822266, "global_step": 250407, "epoch": 3016} {"train_loss": -24.94718360900879, "global_step": 250408, "epoch": 3016} {"train_loss": -25.237995147705078, "global_step": 250409, "epoch": 3016} {"train_loss": -24.946827417396637, "global_step": 250410, "epoch": 3016, "val_loss": 6826143.0} {"train_loss": -23.96035385131836, "global_step": 250411, "epoch": 3017} {"train_loss": -21.184354782104492, "global_step": 250412, "epoch": 3017} {"train_loss": -22.678110122680664, "global_step": 250413, "epoch": 3017} {"train_loss": -23.988983154296875, "global_step": 250414, "epoch": 3017} {"train_loss": -22.78968620300293, "global_step": 250415, "epoch": 3017} {"train_loss": -23.172489166259766, "global_step": 250416, "epoch": 3017} {"train_loss": -22.81502342224121, "global_step": 250417, "epoch": 3017} {"train_loss": -23.81111717224121, "global_step": 250418, "epoch": 3017} {"train_loss": -22.8085880279541, "global_step": 250419, "epoch": 3017} {"train_loss": -24.0356388092041, "global_step": 250420, "epoch": 3017} {"train_loss": -23.89376449584961, "global_step": 250421, "epoch": 3017} {"train_loss": -23.401029586791992, "global_step": 250422, "epoch": 3017} {"train_loss": -24.37603759765625, "global_step": 250423, "epoch": 3017} {"train_loss": -24.301204681396484, "global_step": 250424, "epoch": 3017} {"train_loss": -23.776084899902344, "global_step": 250425, "epoch": 3017} {"train_loss": -23.550113677978516, "global_step": 250426, "epoch": 3017} {"train_loss": -24.207813262939453, "global_step": 250427, "epoch": 3017} {"train_loss": -24.088354110717773, "global_step": 250428, "epoch": 3017} {"train_loss": -24.330326080322266, "global_step": 250429, "epoch": 3017} {"train_loss": -24.322219848632812, "global_step": 250430, "epoch": 3017} {"train_loss": -23.715560913085938, "global_step": 250431, "epoch": 3017} {"train_loss": -24.060285568237305, "global_step": 250432, "epoch": 3017} {"train_loss": -24.310544967651367, "global_step": 250433, "epoch": 3017} {"train_loss": -23.94573211669922, "global_step": 250434, "epoch": 3017} {"train_loss": -24.272703170776367, "global_step": 250435, "epoch": 3017} {"train_loss": -24.387714385986328, "global_step": 250436, "epoch": 3017} {"train_loss": -24.842161178588867, "global_step": 250437, "epoch": 3017} {"train_loss": -24.355690002441406, "global_step": 250438, "epoch": 3017} {"train_loss": -24.581830978393555, "global_step": 250439, "epoch": 3017} {"train_loss": -24.349735260009766, "global_step": 250440, "epoch": 3017} {"train_loss": -24.436513900756836, "global_step": 250441, "epoch": 3017} {"train_loss": -24.307350158691406, "global_step": 250442, "epoch": 3017} {"train_loss": -24.53230857849121, "global_step": 250443, "epoch": 3017} {"train_loss": -24.193893432617188, "global_step": 250444, "epoch": 3017} {"train_loss": -24.77728843688965, "global_step": 250445, "epoch": 3017} {"train_loss": -24.386701583862305, "global_step": 250446, "epoch": 3017} {"train_loss": -24.731525421142578, "global_step": 250447, "epoch": 3017} {"train_loss": -24.95086097717285, "global_step": 250448, "epoch": 3017} {"train_loss": -24.848508834838867, "global_step": 250449, "epoch": 3017} {"train_loss": -25.11033058166504, "global_step": 250450, "epoch": 3017} {"train_loss": -24.62238883972168, "global_step": 250451, "epoch": 3017} {"train_loss": -25.007131576538086, "global_step": 250452, "epoch": 3017} {"train_loss": -25.1558780670166, "global_step": 250453, "epoch": 3017} {"train_loss": -25.194053649902344, "global_step": 250454, "epoch": 3017} {"train_loss": -24.967721939086914, "global_step": 250455, "epoch": 3017} {"train_loss": -25.11244010925293, "global_step": 250456, "epoch": 3017} {"train_loss": -24.937755584716797, "global_step": 250457, "epoch": 3017} {"train_loss": -25.066495895385742, "global_step": 250458, "epoch": 3017} {"train_loss": -24.86639404296875, "global_step": 250459, "epoch": 3017} {"train_loss": -25.077199935913086, "global_step": 250460, "epoch": 3017} {"train_loss": -24.973403930664062, "global_step": 250461, "epoch": 3017} {"train_loss": -25.293615341186523, "global_step": 250462, "epoch": 3017} {"train_loss": -25.27366828918457, "global_step": 250463, "epoch": 3017} {"train_loss": -25.151227951049805, "global_step": 250464, "epoch": 3017} {"train_loss": -25.301654815673828, "global_step": 250465, "epoch": 3017} {"train_loss": -25.370107650756836, "global_step": 250466, "epoch": 3017} {"train_loss": -25.213428497314453, "global_step": 250467, "epoch": 3017} {"train_loss": -24.820451736450195, "global_step": 250468, "epoch": 3017} {"train_loss": -25.011682510375977, "global_step": 250469, "epoch": 3017} {"train_loss": -24.942031860351562, "global_step": 250470, "epoch": 3017} {"train_loss": -25.198400497436523, "global_step": 250471, "epoch": 3017} {"train_loss": -25.490707397460938, "global_step": 250472, "epoch": 3017} {"train_loss": -25.36720085144043, "global_step": 250473, "epoch": 3017} {"train_loss": -24.939367294311523, "global_step": 250474, "epoch": 3017} {"train_loss": -25.449560165405273, "global_step": 250475, "epoch": 3017} {"train_loss": -25.1392879486084, "global_step": 250476, "epoch": 3017} {"train_loss": -25.37253761291504, "global_step": 250477, "epoch": 3017} {"train_loss": -24.81148338317871, "global_step": 250478, "epoch": 3017} {"train_loss": -24.854267120361328, "global_step": 250479, "epoch": 3017} {"train_loss": -25.214092254638672, "global_step": 250480, "epoch": 3017} {"train_loss": -25.214046478271484, "global_step": 250481, "epoch": 3017} {"train_loss": -25.01151466369629, "global_step": 250482, "epoch": 3017} {"train_loss": -24.5424747467041, "global_step": 250483, "epoch": 3017} {"train_loss": -24.896896362304688, "global_step": 250484, "epoch": 3017} {"train_loss": -24.91836166381836, "global_step": 250485, "epoch": 3017} {"train_loss": -25.169645309448242, "global_step": 250486, "epoch": 3017} {"train_loss": -25.03668212890625, "global_step": 250487, "epoch": 3017} {"train_loss": -24.55446434020996, "global_step": 250488, "epoch": 3017} {"train_loss": -25.190017700195312, "global_step": 250489, "epoch": 3017} {"train_loss": -24.48489761352539, "global_step": 250490, "epoch": 3017} {"train_loss": -24.961164474487305, "global_step": 250491, "epoch": 3017} {"train_loss": -24.861581802368164, "global_step": 250492, "epoch": 3017} {"train_loss": -24.53208987684135, "global_step": 250493, "epoch": 3017, "val_loss": 6994961.0} {"train_loss": -24.826284408569336, "global_step": 250494, "epoch": 3018} {"train_loss": -24.59980583190918, "global_step": 250495, "epoch": 3018} {"train_loss": -24.881147384643555, "global_step": 250496, "epoch": 3018} {"train_loss": -24.491411209106445, "global_step": 250497, "epoch": 3018} {"train_loss": -25.023176193237305, "global_step": 250498, "epoch": 3018} {"train_loss": -24.48114013671875, "global_step": 250499, "epoch": 3018} {"train_loss": -25.063034057617188, "global_step": 250500, "epoch": 3018} {"train_loss": -24.963037490844727, "global_step": 250501, "epoch": 3018} {"train_loss": -24.879005432128906, "global_step": 250502, "epoch": 3018} {"train_loss": -24.95814323425293, "global_step": 250503, "epoch": 3018} {"train_loss": -25.158361434936523, "global_step": 250504, "epoch": 3018} {"train_loss": -25.014259338378906, "global_step": 250505, "epoch": 3018} {"train_loss": -25.223752975463867, "global_step": 250506, "epoch": 3018} {"train_loss": -24.643573760986328, "global_step": 250507, "epoch": 3018} {"train_loss": -25.197864532470703, "global_step": 250508, "epoch": 3018} {"train_loss": -25.182796478271484, "global_step": 250509, "epoch": 3018} {"train_loss": -25.169492721557617, "global_step": 250510, "epoch": 3018} {"train_loss": -24.987384796142578, "global_step": 250511, "epoch": 3018} {"train_loss": -24.784976959228516, "global_step": 250512, "epoch": 3018} {"train_loss": -24.91168975830078, "global_step": 250513, "epoch": 3018} {"train_loss": -25.057722091674805, "global_step": 250514, "epoch": 3018} {"train_loss": -25.13643455505371, "global_step": 250515, "epoch": 3018} {"train_loss": -25.157079696655273, "global_step": 250516, "epoch": 3018} {"train_loss": -25.139751434326172, "global_step": 250517, "epoch": 3018} {"train_loss": -25.11789321899414, "global_step": 250518, "epoch": 3018} {"train_loss": -24.901691436767578, "global_step": 250519, "epoch": 3018} {"train_loss": -24.793106079101562, "global_step": 250520, "epoch": 3018} {"train_loss": -24.862396240234375, "global_step": 250521, "epoch": 3018} {"train_loss": -25.191696166992188, "global_step": 250522, "epoch": 3018} {"train_loss": -24.93686294555664, "global_step": 250523, "epoch": 3018} {"train_loss": -25.28125762939453, "global_step": 250524, "epoch": 3018} {"train_loss": -25.255102157592773, "global_step": 250525, "epoch": 3018} {"train_loss": -24.698354721069336, "global_step": 250526, "epoch": 3018} {"train_loss": -24.842872619628906, "global_step": 250527, "epoch": 3018} {"train_loss": -25.376916885375977, "global_step": 250528, "epoch": 3018} {"train_loss": -25.056196212768555, "global_step": 250529, "epoch": 3018} {"train_loss": -24.76439094543457, "global_step": 250530, "epoch": 3018} {"train_loss": -24.97785758972168, "global_step": 250531, "epoch": 3018} {"train_loss": -25.33139991760254, "global_step": 250532, "epoch": 3018} {"train_loss": -25.583633422851562, "global_step": 250533, "epoch": 3018} {"train_loss": -25.156171798706055, "global_step": 250534, "epoch": 3018} {"train_loss": -25.041671752929688, "global_step": 250535, "epoch": 3018} {"train_loss": -25.151029586791992, "global_step": 250536, "epoch": 3018} {"train_loss": -24.931909561157227, "global_step": 250537, "epoch": 3018} {"train_loss": -25.072431564331055, "global_step": 250538, "epoch": 3018} {"train_loss": -25.240522384643555, "global_step": 250539, "epoch": 3018} {"train_loss": -25.122385025024414, "global_step": 250540, "epoch": 3018} {"train_loss": -24.986129760742188, "global_step": 250541, "epoch": 3018} {"train_loss": -24.576934814453125, "global_step": 250542, "epoch": 3018} {"train_loss": -25.006254196166992, "global_step": 250543, "epoch": 3018} {"train_loss": -24.774656295776367, "global_step": 250544, "epoch": 3018} {"train_loss": -24.917274475097656, "global_step": 250545, "epoch": 3018} {"train_loss": -25.030532836914062, "global_step": 250546, "epoch": 3018} {"train_loss": -25.133085250854492, "global_step": 250547, "epoch": 3018} {"train_loss": -24.865224838256836, "global_step": 250548, "epoch": 3018} {"train_loss": -25.241613388061523, "global_step": 250549, "epoch": 3018} {"train_loss": -25.187177658081055, "global_step": 250550, "epoch": 3018} {"train_loss": -25.056791305541992, "global_step": 250551, "epoch": 3018} {"train_loss": -24.87709617614746, "global_step": 250552, "epoch": 3018} {"train_loss": -25.37777328491211, "global_step": 250553, "epoch": 3018} {"train_loss": -25.368772506713867, "global_step": 250554, "epoch": 3018} {"train_loss": -25.4891300201416, "global_step": 250555, "epoch": 3018} {"train_loss": -25.033761978149414, "global_step": 250556, "epoch": 3018} {"train_loss": -25.117868423461914, "global_step": 250557, "epoch": 3018} {"train_loss": -24.76613426208496, "global_step": 250558, "epoch": 3018} {"train_loss": -25.330036163330078, "global_step": 250559, "epoch": 3018} {"train_loss": -25.041015625, "global_step": 250560, "epoch": 3018} {"train_loss": -25.055744171142578, "global_step": 250561, "epoch": 3018} {"train_loss": -24.996549606323242, "global_step": 250562, "epoch": 3018} {"train_loss": -25.148948669433594, "global_step": 250563, "epoch": 3018} {"train_loss": -25.171031951904297, "global_step": 250564, "epoch": 3018} {"train_loss": -25.11305809020996, "global_step": 250565, "epoch": 3018} {"train_loss": -24.98649024963379, "global_step": 250566, "epoch": 3018} {"train_loss": -24.694368362426758, "global_step": 250567, "epoch": 3018} {"train_loss": -25.27736473083496, "global_step": 250568, "epoch": 3018} {"train_loss": -25.2171573638916, "global_step": 250569, "epoch": 3018} {"train_loss": -24.54127311706543, "global_step": 250570, "epoch": 3018} {"train_loss": -24.957271575927734, "global_step": 250571, "epoch": 3018} {"train_loss": -24.893939971923828, "global_step": 250572, "epoch": 3018} {"train_loss": -24.458433151245117, "global_step": 250573, "epoch": 3018} {"train_loss": -24.253808975219727, "global_step": 250574, "epoch": 3018} {"train_loss": -24.084190368652344, "global_step": 250575, "epoch": 3018} {"train_loss": -24.98478340240846, "global_step": 250576, "epoch": 3018, "val_loss": 6872572.0} {"train_loss": -24.546628952026367, "global_step": 250577, "epoch": 3019} {"train_loss": -24.075428009033203, "global_step": 250578, "epoch": 3019} {"train_loss": -24.442564010620117, "global_step": 250579, "epoch": 3019} {"train_loss": -24.535858154296875, "global_step": 250580, "epoch": 3019} {"train_loss": -24.80271339416504, "global_step": 250581, "epoch": 3019} {"train_loss": -24.75885009765625, "global_step": 250582, "epoch": 3019} {"train_loss": -24.622467041015625, "global_step": 250583, "epoch": 3019} {"train_loss": -24.481603622436523, "global_step": 250584, "epoch": 3019} {"train_loss": -24.5606746673584, "global_step": 250585, "epoch": 3019} {"train_loss": -24.736454010009766, "global_step": 250586, "epoch": 3019} {"train_loss": -24.82037925720215, "global_step": 250587, "epoch": 3019} {"train_loss": -24.698511123657227, "global_step": 250588, "epoch": 3019} {"train_loss": -24.57091522216797, "global_step": 250589, "epoch": 3019} {"train_loss": -24.538894653320312, "global_step": 250590, "epoch": 3019} {"train_loss": -24.42629051208496, "global_step": 250591, "epoch": 3019} {"train_loss": -24.972204208374023, "global_step": 250592, "epoch": 3019} {"train_loss": -24.92631721496582, "global_step": 250593, "epoch": 3019} {"train_loss": -24.66697120666504, "global_step": 250594, "epoch": 3019} {"train_loss": -24.548072814941406, "global_step": 250595, "epoch": 3019} {"train_loss": -24.66204833984375, "global_step": 250596, "epoch": 3019} {"train_loss": -24.996747970581055, "global_step": 250597, "epoch": 3019} {"train_loss": -24.603179931640625, "global_step": 250598, "epoch": 3019} {"train_loss": -25.11454963684082, "global_step": 250599, "epoch": 3019} {"train_loss": -25.00494956970215, "global_step": 250600, "epoch": 3019} {"train_loss": -24.742603302001953, "global_step": 250601, "epoch": 3019} {"train_loss": -24.78632926940918, "global_step": 250602, "epoch": 3019} {"train_loss": -25.021451950073242, "global_step": 250603, "epoch": 3019} {"train_loss": -24.472379684448242, "global_step": 250604, "epoch": 3019} {"train_loss": -24.44660186767578, "global_step": 250605, "epoch": 3019} {"train_loss": -24.795074462890625, "global_step": 250606, "epoch": 3019} {"train_loss": -24.40571403503418, "global_step": 250607, "epoch": 3019} {"train_loss": -25.104780197143555, "global_step": 250608, "epoch": 3019} {"train_loss": -25.184728622436523, "global_step": 250609, "epoch": 3019} {"train_loss": -24.955928802490234, "global_step": 250610, "epoch": 3019} {"train_loss": -24.81151008605957, "global_step": 250611, "epoch": 3019} {"train_loss": -25.173221588134766, "global_step": 250612, "epoch": 3019} {"train_loss": -25.082134246826172, "global_step": 250613, "epoch": 3019} {"train_loss": -25.08211326599121, "global_step": 250614, "epoch": 3019} {"train_loss": -24.82454490661621, "global_step": 250615, "epoch": 3019} {"train_loss": -25.197599411010742, "global_step": 250616, "epoch": 3019} {"train_loss": -25.261173248291016, "global_step": 250617, "epoch": 3019} {"train_loss": -25.218189239501953, "global_step": 250618, "epoch": 3019} {"train_loss": -25.1306095123291, "global_step": 250619, "epoch": 3019} {"train_loss": -25.014617919921875, "global_step": 250620, "epoch": 3019} {"train_loss": -25.340015411376953, "global_step": 250621, "epoch": 3019} {"train_loss": -24.893945693969727, "global_step": 250622, "epoch": 3019} {"train_loss": -25.07844352722168, "global_step": 250623, "epoch": 3019} {"train_loss": -25.040029525756836, "global_step": 250624, "epoch": 3019} {"train_loss": -24.845609664916992, "global_step": 250625, "epoch": 3019} {"train_loss": -25.12863540649414, "global_step": 250626, "epoch": 3019} {"train_loss": -25.33478355407715, "global_step": 250627, "epoch": 3019} {"train_loss": -25.27416229248047, "global_step": 250628, "epoch": 3019} {"train_loss": -25.220016479492188, "global_step": 250629, "epoch": 3019} {"train_loss": -24.980924606323242, "global_step": 250630, "epoch": 3019} {"train_loss": -25.18378257751465, "global_step": 250631, "epoch": 3019} {"train_loss": -25.089702606201172, "global_step": 250632, "epoch": 3019} {"train_loss": -25.180957794189453, "global_step": 250633, "epoch": 3019} {"train_loss": -25.085494995117188, "global_step": 250634, "epoch": 3019} {"train_loss": -24.476760864257812, "global_step": 250635, "epoch": 3019} {"train_loss": -24.82163429260254, "global_step": 250636, "epoch": 3019} {"train_loss": -25.296384811401367, "global_step": 250637, "epoch": 3019} {"train_loss": -24.90471839904785, "global_step": 250638, "epoch": 3019} {"train_loss": -25.05779457092285, "global_step": 250639, "epoch": 3019} {"train_loss": -25.02062225341797, "global_step": 250640, "epoch": 3019} {"train_loss": -24.780994415283203, "global_step": 250641, "epoch": 3019} {"train_loss": -25.002290725708008, "global_step": 250642, "epoch": 3019} {"train_loss": -24.656476974487305, "global_step": 250643, "epoch": 3019} {"train_loss": -24.967300415039062, "global_step": 250644, "epoch": 3019} {"train_loss": -25.022689819335938, "global_step": 250645, "epoch": 3019} {"train_loss": -25.102161407470703, "global_step": 250646, "epoch": 3019} {"train_loss": -24.95432472229004, "global_step": 250647, "epoch": 3019} {"train_loss": -25.467992782592773, "global_step": 250648, "epoch": 3019} {"train_loss": -24.91709327697754, "global_step": 250649, "epoch": 3019} {"train_loss": -25.11671257019043, "global_step": 250650, "epoch": 3019} {"train_loss": -25.461536407470703, "global_step": 250651, "epoch": 3019} {"train_loss": -25.158124923706055, "global_step": 250652, "epoch": 3019} {"train_loss": -24.976484298706055, "global_step": 250653, "epoch": 3019} {"train_loss": -25.238622665405273, "global_step": 250654, "epoch": 3019} {"train_loss": -25.20685386657715, "global_step": 250655, "epoch": 3019} {"train_loss": -25.24875831604004, "global_step": 250656, "epoch": 3019} {"train_loss": -25.137441635131836, "global_step": 250657, "epoch": 3019} {"train_loss": -25.219440460205078, "global_step": 250658, "epoch": 3019} {"train_loss": -24.91666947789939, "global_step": 250659, "epoch": 3019, "val_loss": 6861581.5} {"train_loss": -24.333065032958984, "global_step": 250660, "epoch": 3020} {"train_loss": -24.204545974731445, "global_step": 250661, "epoch": 3020} {"train_loss": -24.640180587768555, "global_step": 250662, "epoch": 3020} {"train_loss": -24.846994400024414, "global_step": 250663, "epoch": 3020} {"train_loss": -24.78615379333496, "global_step": 250664, "epoch": 3020} {"train_loss": -24.42262840270996, "global_step": 250665, "epoch": 3020} {"train_loss": -24.610214233398438, "global_step": 250666, "epoch": 3020} {"train_loss": -24.836912155151367, "global_step": 250667, "epoch": 3020} {"train_loss": -24.82229995727539, "global_step": 250668, "epoch": 3020} {"train_loss": -24.93879508972168, "global_step": 250669, "epoch": 3020} {"train_loss": -24.7593994140625, "global_step": 250670, "epoch": 3020} {"train_loss": -24.459186553955078, "global_step": 250671, "epoch": 3020} {"train_loss": -24.70405387878418, "global_step": 250672, "epoch": 3020} {"train_loss": -24.74530029296875, "global_step": 250673, "epoch": 3020} {"train_loss": -24.638174057006836, "global_step": 250674, "epoch": 3020} {"train_loss": -24.400449752807617, "global_step": 250675, "epoch": 3020} {"train_loss": -24.728322982788086, "global_step": 250676, "epoch": 3020} {"train_loss": -24.815906524658203, "global_step": 250677, "epoch": 3020} {"train_loss": -24.51167106628418, "global_step": 250678, "epoch": 3020} {"train_loss": -24.284225463867188, "global_step": 250679, "epoch": 3020} {"train_loss": -24.858877182006836, "global_step": 250680, "epoch": 3020} {"train_loss": -24.687244415283203, "global_step": 250681, "epoch": 3020} {"train_loss": -24.877851486206055, "global_step": 250682, "epoch": 3020} {"train_loss": -24.41443634033203, "global_step": 250683, "epoch": 3020} {"train_loss": -24.947660446166992, "global_step": 250684, "epoch": 3020} {"train_loss": -24.882795333862305, "global_step": 250685, "epoch": 3020} {"train_loss": -24.227415084838867, "global_step": 250686, "epoch": 3020} {"train_loss": -24.813108444213867, "global_step": 250687, "epoch": 3020} {"train_loss": -25.162260055541992, "global_step": 250688, "epoch": 3020} {"train_loss": -24.677148818969727, "global_step": 250689, "epoch": 3020} {"train_loss": -24.948644638061523, "global_step": 250690, "epoch": 3020} {"train_loss": -24.558284759521484, "global_step": 250691, "epoch": 3020} {"train_loss": -24.961740493774414, "global_step": 250692, "epoch": 3020} {"train_loss": -25.1120662689209, "global_step": 250693, "epoch": 3020} {"train_loss": -25.224407196044922, "global_step": 250694, "epoch": 3020} {"train_loss": -25.25434684753418, "global_step": 250695, "epoch": 3020} {"train_loss": -24.7868709564209, "global_step": 250696, "epoch": 3020} {"train_loss": -24.88608169555664, "global_step": 250697, "epoch": 3020} {"train_loss": -24.949968338012695, "global_step": 250698, "epoch": 3020} {"train_loss": -24.672119140625, "global_step": 250699, "epoch": 3020} {"train_loss": -25.097028732299805, "global_step": 250700, "epoch": 3020} {"train_loss": -24.91206932067871, "global_step": 250701, "epoch": 3020} {"train_loss": -24.837467193603516, "global_step": 250702, "epoch": 3020} {"train_loss": -24.990764617919922, "global_step": 250703, "epoch": 3020} {"train_loss": -25.208446502685547, "global_step": 250704, "epoch": 3020} {"train_loss": -25.009435653686523, "global_step": 250705, "epoch": 3020} {"train_loss": -25.1741886138916, "global_step": 250706, "epoch": 3020} {"train_loss": -25.342208862304688, "global_step": 250707, "epoch": 3020} {"train_loss": -25.064199447631836, "global_step": 250708, "epoch": 3020} {"train_loss": -24.979705810546875, "global_step": 250709, "epoch": 3020} {"train_loss": -25.32118797302246, "global_step": 250710, "epoch": 3020} {"train_loss": -25.2511043548584, "global_step": 250711, "epoch": 3020} {"train_loss": -25.33894157409668, "global_step": 250712, "epoch": 3020} {"train_loss": -25.08647346496582, "global_step": 250713, "epoch": 3020} {"train_loss": -25.068361282348633, "global_step": 250714, "epoch": 3020} {"train_loss": -25.144901275634766, "global_step": 250715, "epoch": 3020} {"train_loss": -24.78897476196289, "global_step": 250716, "epoch": 3020} {"train_loss": -24.65229606628418, "global_step": 250717, "epoch": 3020} {"train_loss": -25.068347930908203, "global_step": 250718, "epoch": 3020} {"train_loss": -25.1256046295166, "global_step": 250719, "epoch": 3020} {"train_loss": -25.1247615814209, "global_step": 250720, "epoch": 3020} {"train_loss": -24.860090255737305, "global_step": 250721, "epoch": 3020} {"train_loss": -24.81998634338379, "global_step": 250722, "epoch": 3020} {"train_loss": -25.0728759765625, "global_step": 250723, "epoch": 3020} {"train_loss": -25.301578521728516, "global_step": 250724, "epoch": 3020} {"train_loss": -25.109556198120117, "global_step": 250725, "epoch": 3020} {"train_loss": -24.952539443969727, "global_step": 250726, "epoch": 3020} {"train_loss": -24.91050148010254, "global_step": 250727, "epoch": 3020} {"train_loss": -25.46384620666504, "global_step": 250728, "epoch": 3020} {"train_loss": -25.394439697265625, "global_step": 250729, "epoch": 3020} {"train_loss": -25.154041290283203, "global_step": 250730, "epoch": 3020} {"train_loss": -25.118392944335938, "global_step": 250731, "epoch": 3020} {"train_loss": -25.07952117919922, "global_step": 250732, "epoch": 3020} {"train_loss": -25.56075096130371, "global_step": 250733, "epoch": 3020} {"train_loss": -25.10091781616211, "global_step": 250734, "epoch": 3020} {"train_loss": -25.138391494750977, "global_step": 250735, "epoch": 3020} {"train_loss": -24.964523315429688, "global_step": 250736, "epoch": 3020} {"train_loss": -24.892276763916016, "global_step": 250737, "epoch": 3020} {"train_loss": -25.37529182434082, "global_step": 250738, "epoch": 3020} {"train_loss": -25.210477828979492, "global_step": 250739, "epoch": 3020} {"train_loss": -24.753087997436523, "global_step": 250740, "epoch": 3020} {"train_loss": -25.140607833862305, "global_step": 250741, "epoch": 3020} {"train_loss": -24.91202609510307, "global_step": 250742, "epoch": 3020, "val_loss": 6984865.0} {"train_loss": -24.5316162109375, "global_step": 250743, "epoch": 3021} {"train_loss": -24.675199508666992, "global_step": 250744, "epoch": 3021} {"train_loss": -24.822240829467773, "global_step": 250745, "epoch": 3021} {"train_loss": -24.88710594177246, "global_step": 250746, "epoch": 3021} {"train_loss": -25.018186569213867, "global_step": 250747, "epoch": 3021} {"train_loss": -24.75042724609375, "global_step": 250748, "epoch": 3021} {"train_loss": -24.60463523864746, "global_step": 250749, "epoch": 3021} {"train_loss": -24.820850372314453, "global_step": 250750, "epoch": 3021} {"train_loss": -25.299358367919922, "global_step": 250751, "epoch": 3021} {"train_loss": -25.077932357788086, "global_step": 250752, "epoch": 3021} {"train_loss": -24.877899169921875, "global_step": 250753, "epoch": 3021} {"train_loss": -24.871728897094727, "global_step": 250754, "epoch": 3021} {"train_loss": -25.312057495117188, "global_step": 250755, "epoch": 3021} {"train_loss": -25.03021812438965, "global_step": 250756, "epoch": 3021} {"train_loss": -24.75394630432129, "global_step": 250757, "epoch": 3021} {"train_loss": -24.771440505981445, "global_step": 250758, "epoch": 3021} {"train_loss": -25.093271255493164, "global_step": 250759, "epoch": 3021} {"train_loss": -25.033166885375977, "global_step": 250760, "epoch": 3021} {"train_loss": -24.704065322875977, "global_step": 250761, "epoch": 3021} {"train_loss": -25.10997200012207, "global_step": 250762, "epoch": 3021} {"train_loss": -24.968570709228516, "global_step": 250763, "epoch": 3021} {"train_loss": -24.90668296813965, "global_step": 250764, "epoch": 3021} {"train_loss": -25.031278610229492, "global_step": 250765, "epoch": 3021} {"train_loss": -25.29448890686035, "global_step": 250766, "epoch": 3021} {"train_loss": -25.06093978881836, "global_step": 250767, "epoch": 3021} {"train_loss": -24.920013427734375, "global_step": 250768, "epoch": 3021} {"train_loss": -25.36972999572754, "global_step": 250769, "epoch": 3021} {"train_loss": -25.03708839416504, "global_step": 250770, "epoch": 3021} {"train_loss": -25.21828842163086, "global_step": 250771, "epoch": 3021} {"train_loss": -25.010513305664062, "global_step": 250772, "epoch": 3021} {"train_loss": -25.049280166625977, "global_step": 250773, "epoch": 3021} {"train_loss": -24.845657348632812, "global_step": 250774, "epoch": 3021} {"train_loss": -24.90939712524414, "global_step": 250775, "epoch": 3021} {"train_loss": -25.08672523498535, "global_step": 250776, "epoch": 3021} {"train_loss": -25.03059959411621, "global_step": 250777, "epoch": 3021} {"train_loss": -25.095195770263672, "global_step": 250778, "epoch": 3021} {"train_loss": -25.26517105102539, "global_step": 250779, "epoch": 3021} {"train_loss": -25.149751663208008, "global_step": 250780, "epoch": 3021} {"train_loss": -24.793373107910156, "global_step": 250781, "epoch": 3021} {"train_loss": -25.384557723999023, "global_step": 250782, "epoch": 3021} {"train_loss": -24.8692569732666, "global_step": 250783, "epoch": 3021} {"train_loss": -24.89118003845215, "global_step": 250784, "epoch": 3021} {"train_loss": -25.25872802734375, "global_step": 250785, "epoch": 3021} {"train_loss": -24.731931686401367, "global_step": 250786, "epoch": 3021} {"train_loss": -25.382532119750977, "global_step": 250787, "epoch": 3021} {"train_loss": -25.149690628051758, "global_step": 250788, "epoch": 3021} {"train_loss": -25.30917739868164, "global_step": 250789, "epoch": 3021} {"train_loss": -24.98224449157715, "global_step": 250790, "epoch": 3021} {"train_loss": -25.351064682006836, "global_step": 250791, "epoch": 3021} {"train_loss": -25.096843719482422, "global_step": 250792, "epoch": 3021} {"train_loss": -24.779884338378906, "global_step": 250793, "epoch": 3021} {"train_loss": -25.191953659057617, "global_step": 250794, "epoch": 3021} {"train_loss": -25.490432739257812, "global_step": 250795, "epoch": 3021} {"train_loss": -25.260831832885742, "global_step": 250796, "epoch": 3021} {"train_loss": -24.829425811767578, "global_step": 250797, "epoch": 3021} {"train_loss": -25.22047996520996, "global_step": 250798, "epoch": 3021} {"train_loss": -24.846717834472656, "global_step": 250799, "epoch": 3021} {"train_loss": -24.904611587524414, "global_step": 250800, "epoch": 3021} {"train_loss": -25.10352897644043, "global_step": 250801, "epoch": 3021} {"train_loss": -25.075525283813477, "global_step": 250802, "epoch": 3021} {"train_loss": -24.85804557800293, "global_step": 250803, "epoch": 3021} {"train_loss": -24.986963272094727, "global_step": 250804, "epoch": 3021} {"train_loss": -24.660612106323242, "global_step": 250805, "epoch": 3021} {"train_loss": -25.038707733154297, "global_step": 250806, "epoch": 3021} {"train_loss": -25.18434715270996, "global_step": 250807, "epoch": 3021} {"train_loss": -25.257848739624023, "global_step": 250808, "epoch": 3021} {"train_loss": -25.286867141723633, "global_step": 250809, "epoch": 3021} {"train_loss": -25.319913864135742, "global_step": 250810, "epoch": 3021} {"train_loss": -25.338342666625977, "global_step": 250811, "epoch": 3021} {"train_loss": -25.12259292602539, "global_step": 250812, "epoch": 3021} {"train_loss": -25.154836654663086, "global_step": 250813, "epoch": 3021} {"train_loss": -25.1153621673584, "global_step": 250814, "epoch": 3021} {"train_loss": -24.71478843688965, "global_step": 250815, "epoch": 3021} {"train_loss": -25.26310157775879, "global_step": 250816, "epoch": 3021} {"train_loss": -25.148658752441406, "global_step": 250817, "epoch": 3021} {"train_loss": -25.119020462036133, "global_step": 250818, "epoch": 3021} {"train_loss": -25.26873779296875, "global_step": 250819, "epoch": 3021} {"train_loss": -24.91996955871582, "global_step": 250820, "epoch": 3021} {"train_loss": -25.067523956298828, "global_step": 250821, "epoch": 3021} {"train_loss": -24.920475006103516, "global_step": 250822, "epoch": 3021} {"train_loss": -25.68775749206543, "global_step": 250823, "epoch": 3021} {"train_loss": -25.3142032623291, "global_step": 250824, "epoch": 3021} {"train_loss": -25.065337054700738, "global_step": 250825, "epoch": 3021, "val_loss": 6948673.5} {"train_loss": -23.915618896484375, "global_step": 250826, "epoch": 3022} {"train_loss": -23.401451110839844, "global_step": 250827, "epoch": 3022} {"train_loss": -24.710189819335938, "global_step": 250828, "epoch": 3022} {"train_loss": -23.976716995239258, "global_step": 250829, "epoch": 3022} {"train_loss": -24.33465576171875, "global_step": 250830, "epoch": 3022} {"train_loss": -24.600509643554688, "global_step": 250831, "epoch": 3022} {"train_loss": -24.183626174926758, "global_step": 250832, "epoch": 3022} {"train_loss": -24.48400115966797, "global_step": 250833, "epoch": 3022} {"train_loss": -24.611291885375977, "global_step": 250834, "epoch": 3022} {"train_loss": -24.6423397064209, "global_step": 250835, "epoch": 3022} {"train_loss": -24.466772079467773, "global_step": 250836, "epoch": 3022} {"train_loss": -24.588340759277344, "global_step": 250837, "epoch": 3022} {"train_loss": -24.395721435546875, "global_step": 250838, "epoch": 3022} {"train_loss": -24.48323631286621, "global_step": 250839, "epoch": 3022} {"train_loss": -24.664737701416016, "global_step": 250840, "epoch": 3022} {"train_loss": -24.48457145690918, "global_step": 250841, "epoch": 3022} {"train_loss": -24.528318405151367, "global_step": 250842, "epoch": 3022} {"train_loss": -24.647357940673828, "global_step": 250843, "epoch": 3022} {"train_loss": -24.60320472717285, "global_step": 250844, "epoch": 3022} {"train_loss": -24.686586380004883, "global_step": 250845, "epoch": 3022} {"train_loss": -24.86252212524414, "global_step": 250846, "epoch": 3022} {"train_loss": -24.61078453063965, "global_step": 250847, "epoch": 3022} {"train_loss": -24.856861114501953, "global_step": 250848, "epoch": 3022} {"train_loss": -24.76472282409668, "global_step": 250849, "epoch": 3022} {"train_loss": -24.625490188598633, "global_step": 250850, "epoch": 3022} {"train_loss": -24.933914184570312, "global_step": 250851, "epoch": 3022} {"train_loss": -25.211088180541992, "global_step": 250852, "epoch": 3022} {"train_loss": -24.836288452148438, "global_step": 250853, "epoch": 3022} {"train_loss": -24.973438262939453, "global_step": 250854, "epoch": 3022} {"train_loss": -24.906274795532227, "global_step": 250855, "epoch": 3022} {"train_loss": -24.7268009185791, "global_step": 250856, "epoch": 3022} {"train_loss": -24.771787643432617, "global_step": 250857, "epoch": 3022} {"train_loss": -25.277393341064453, "global_step": 250858, "epoch": 3022} {"train_loss": -25.117996215820312, "global_step": 250859, "epoch": 3022} {"train_loss": -24.565092086791992, "global_step": 250860, "epoch": 3022} {"train_loss": -24.97340202331543, "global_step": 250861, "epoch": 3022} {"train_loss": -24.97859001159668, "global_step": 250862, "epoch": 3022} {"train_loss": -24.763235092163086, "global_step": 250863, "epoch": 3022} {"train_loss": -24.845075607299805, "global_step": 250864, "epoch": 3022} {"train_loss": -24.910079956054688, "global_step": 250865, "epoch": 3022} {"train_loss": -24.493040084838867, "global_step": 250866, "epoch": 3022} {"train_loss": -24.74771499633789, "global_step": 250867, "epoch": 3022} {"train_loss": -24.748470306396484, "global_step": 250868, "epoch": 3022} {"train_loss": -25.099613189697266, "global_step": 250869, "epoch": 3022} {"train_loss": -24.775836944580078, "global_step": 250870, "epoch": 3022} {"train_loss": -24.99844741821289, "global_step": 250871, "epoch": 3022} {"train_loss": -25.318708419799805, "global_step": 250872, "epoch": 3022} {"train_loss": -24.850727081298828, "global_step": 250873, "epoch": 3022} {"train_loss": -25.094419479370117, "global_step": 250874, "epoch": 3022} {"train_loss": -25.070804595947266, "global_step": 250875, "epoch": 3022} {"train_loss": -25.140247344970703, "global_step": 250876, "epoch": 3022} {"train_loss": -25.027542114257812, "global_step": 250877, "epoch": 3022} {"train_loss": -25.12035369873047, "global_step": 250878, "epoch": 3022} {"train_loss": -24.998611450195312, "global_step": 250879, "epoch": 3022} {"train_loss": -25.212209701538086, "global_step": 250880, "epoch": 3022} {"train_loss": -25.257572174072266, "global_step": 250881, "epoch": 3022} {"train_loss": -25.393814086914062, "global_step": 250882, "epoch": 3022} {"train_loss": -24.879819869995117, "global_step": 250883, "epoch": 3022} {"train_loss": -24.9864559173584, "global_step": 250884, "epoch": 3022} {"train_loss": -25.16243553161621, "global_step": 250885, "epoch": 3022} {"train_loss": -25.028493881225586, "global_step": 250886, "epoch": 3022} {"train_loss": -25.423688888549805, "global_step": 250887, "epoch": 3022} {"train_loss": -24.894752502441406, "global_step": 250888, "epoch": 3022} {"train_loss": -24.943416595458984, "global_step": 250889, "epoch": 3022} {"train_loss": -24.977949142456055, "global_step": 250890, "epoch": 3022} {"train_loss": -25.1231689453125, "global_step": 250891, "epoch": 3022} {"train_loss": -24.96845054626465, "global_step": 250892, "epoch": 3022} {"train_loss": -25.262537002563477, "global_step": 250893, "epoch": 3022} {"train_loss": -24.93282127380371, "global_step": 250894, "epoch": 3022} {"train_loss": -25.27737045288086, "global_step": 250895, "epoch": 3022} {"train_loss": -25.201818466186523, "global_step": 250896, "epoch": 3022} {"train_loss": -25.130910873413086, "global_step": 250897, "epoch": 3022} {"train_loss": -24.816129684448242, "global_step": 250898, "epoch": 3022} {"train_loss": -24.98750114440918, "global_step": 250899, "epoch": 3022} {"train_loss": -25.047021865844727, "global_step": 250900, "epoch": 3022} {"train_loss": -25.053525924682617, "global_step": 250901, "epoch": 3022} {"train_loss": -24.797428131103516, "global_step": 250902, "epoch": 3022} {"train_loss": -24.648040771484375, "global_step": 250903, "epoch": 3022} {"train_loss": -24.695375442504883, "global_step": 250904, "epoch": 3022} {"train_loss": -24.982213973999023, "global_step": 250905, "epoch": 3022} {"train_loss": -25.191190719604492, "global_step": 250906, "epoch": 3022} {"train_loss": -25.087011337280273, "global_step": 250907, "epoch": 3022} {"train_loss": -24.856981254485717, "global_step": 250908, "epoch": 3022, "val_loss": 6774768.0} {"train_loss": -24.7796630859375, "global_step": 250909, "epoch": 3023} {"train_loss": -24.749778747558594, "global_step": 250910, "epoch": 3023} {"train_loss": -24.7764949798584, "global_step": 250911, "epoch": 3023} {"train_loss": -24.508243560791016, "global_step": 250912, "epoch": 3023} {"train_loss": -24.305999755859375, "global_step": 250913, "epoch": 3023} {"train_loss": -24.8645076751709, "global_step": 250914, "epoch": 3023} {"train_loss": -25.092628479003906, "global_step": 250915, "epoch": 3023} {"train_loss": -24.975065231323242, "global_step": 250916, "epoch": 3023} {"train_loss": -24.795902252197266, "global_step": 250917, "epoch": 3023} {"train_loss": -25.03343391418457, "global_step": 250918, "epoch": 3023} {"train_loss": -24.82105827331543, "global_step": 250919, "epoch": 3023} {"train_loss": -24.74842643737793, "global_step": 250920, "epoch": 3023} {"train_loss": -24.778488159179688, "global_step": 250921, "epoch": 3023} {"train_loss": -25.237592697143555, "global_step": 250922, "epoch": 3023} {"train_loss": -24.847164154052734, "global_step": 250923, "epoch": 3023} {"train_loss": -24.992300033569336, "global_step": 250924, "epoch": 3023} {"train_loss": -24.637941360473633, "global_step": 250925, "epoch": 3023} {"train_loss": -25.096393585205078, "global_step": 250926, "epoch": 3023} {"train_loss": -24.924884796142578, "global_step": 250927, "epoch": 3023} {"train_loss": -24.88558006286621, "global_step": 250928, "epoch": 3023} {"train_loss": -24.90235710144043, "global_step": 250929, "epoch": 3023} {"train_loss": -25.06203269958496, "global_step": 250930, "epoch": 3023} {"train_loss": -24.806188583374023, "global_step": 250931, "epoch": 3023} {"train_loss": -25.128957748413086, "global_step": 250932, "epoch": 3023} {"train_loss": -24.6378231048584, "global_step": 250933, "epoch": 3023} {"train_loss": -25.099153518676758, "global_step": 250934, "epoch": 3023} {"train_loss": -25.25966453552246, "global_step": 250935, "epoch": 3023} {"train_loss": -24.936872482299805, "global_step": 250936, "epoch": 3023} {"train_loss": -24.938831329345703, "global_step": 250937, "epoch": 3023} {"train_loss": -24.879552841186523, "global_step": 250938, "epoch": 3023} {"train_loss": -25.13123893737793, "global_step": 250939, "epoch": 3023} {"train_loss": -25.034549713134766, "global_step": 250940, "epoch": 3023} {"train_loss": -25.509212493896484, "global_step": 250941, "epoch": 3023} {"train_loss": -24.85719871520996, "global_step": 250942, "epoch": 3023} {"train_loss": -25.1107234954834, "global_step": 250943, "epoch": 3023} {"train_loss": -24.842288970947266, "global_step": 250944, "epoch": 3023} {"train_loss": -24.976306915283203, "global_step": 250945, "epoch": 3023} {"train_loss": -24.94573974609375, "global_step": 250946, "epoch": 3023} {"train_loss": -25.060014724731445, "global_step": 250947, "epoch": 3023} {"train_loss": -25.144222259521484, "global_step": 250948, "epoch": 3023} {"train_loss": -24.738178253173828, "global_step": 250949, "epoch": 3023} {"train_loss": -25.118896484375, "global_step": 250950, "epoch": 3023} {"train_loss": -25.177783966064453, "global_step": 250951, "epoch": 3023} {"train_loss": -25.242212295532227, "global_step": 250952, "epoch": 3023} {"train_loss": -24.9920654296875, "global_step": 250953, "epoch": 3023} {"train_loss": -24.963947296142578, "global_step": 250954, "epoch": 3023} {"train_loss": -25.4073543548584, "global_step": 250955, "epoch": 3023} {"train_loss": -25.251890182495117, "global_step": 250956, "epoch": 3023} {"train_loss": -25.081829071044922, "global_step": 250957, "epoch": 3023} {"train_loss": -24.775432586669922, "global_step": 250958, "epoch": 3023} {"train_loss": -25.1840763092041, "global_step": 250959, "epoch": 3023} {"train_loss": -25.7452392578125, "global_step": 250960, "epoch": 3023} {"train_loss": -25.323545455932617, "global_step": 250961, "epoch": 3023} {"train_loss": -24.888437271118164, "global_step": 250962, "epoch": 3023} {"train_loss": -24.8967227935791, "global_step": 250963, "epoch": 3023} {"train_loss": -24.91360092163086, "global_step": 250964, "epoch": 3023} {"train_loss": -25.17719841003418, "global_step": 250965, "epoch": 3023} {"train_loss": -25.039630889892578, "global_step": 250966, "epoch": 3023} {"train_loss": -25.439029693603516, "global_step": 250967, "epoch": 3023} {"train_loss": -25.491313934326172, "global_step": 250968, "epoch": 3023} {"train_loss": -25.092639923095703, "global_step": 250969, "epoch": 3023} {"train_loss": -25.239652633666992, "global_step": 250970, "epoch": 3023} {"train_loss": -25.121505737304688, "global_step": 250971, "epoch": 3023} {"train_loss": -25.494232177734375, "global_step": 250972, "epoch": 3023} {"train_loss": -25.215042114257812, "global_step": 250973, "epoch": 3023} {"train_loss": -25.377939224243164, "global_step": 250974, "epoch": 3023} {"train_loss": -25.371259689331055, "global_step": 250975, "epoch": 3023} {"train_loss": -25.079362869262695, "global_step": 250976, "epoch": 3023} {"train_loss": -25.234207153320312, "global_step": 250977, "epoch": 3023} {"train_loss": -24.995052337646484, "global_step": 250978, "epoch": 3023} {"train_loss": -24.94789695739746, "global_step": 250979, "epoch": 3023} {"train_loss": -24.973005294799805, "global_step": 250980, "epoch": 3023} {"train_loss": -25.460254669189453, "global_step": 250981, "epoch": 3023} {"train_loss": -24.91627311706543, "global_step": 250982, "epoch": 3023} {"train_loss": -24.85830307006836, "global_step": 250983, "epoch": 3023} {"train_loss": -25.056608200073242, "global_step": 250984, "epoch": 3023} {"train_loss": -25.030126571655273, "global_step": 250985, "epoch": 3023} {"train_loss": -25.106800079345703, "global_step": 250986, "epoch": 3023} {"train_loss": -25.172630310058594, "global_step": 250987, "epoch": 3023} {"train_loss": -24.797183990478516, "global_step": 250988, "epoch": 3023} {"train_loss": -24.983304977416992, "global_step": 250989, "epoch": 3023} {"train_loss": -24.806482315063477, "global_step": 250990, "epoch": 3023} {"train_loss": -25.030978490071124, "global_step": 250991, "epoch": 3023, "val_loss": 6957905.0} {"train_loss": -24.0772762298584, "global_step": 250992, "epoch": 3024} {"train_loss": -24.186405181884766, "global_step": 250993, "epoch": 3024} {"train_loss": -23.68607521057129, "global_step": 250994, "epoch": 3024} {"train_loss": -24.800525665283203, "global_step": 250995, "epoch": 3024} {"train_loss": -23.856534957885742, "global_step": 250996, "epoch": 3024} {"train_loss": -24.375513076782227, "global_step": 250997, "epoch": 3024} {"train_loss": -24.43649673461914, "global_step": 250998, "epoch": 3024} {"train_loss": -24.149877548217773, "global_step": 250999, "epoch": 3024} {"train_loss": -24.061147689819336, "global_step": 251000, "epoch": 3024} {"train_loss": -24.427772521972656, "global_step": 251001, "epoch": 3024} {"train_loss": -24.525863647460938, "global_step": 251002, "epoch": 3024} {"train_loss": -24.502981185913086, "global_step": 251003, "epoch": 3024} {"train_loss": -24.699996948242188, "global_step": 251004, "epoch": 3024} {"train_loss": -25.082746505737305, "global_step": 251005, "epoch": 3024} {"train_loss": -24.497997283935547, "global_step": 251006, "epoch": 3024} {"train_loss": -24.56208610534668, "global_step": 251007, "epoch": 3024} {"train_loss": -24.480730056762695, "global_step": 251008, "epoch": 3024} {"train_loss": -24.648778915405273, "global_step": 251009, "epoch": 3024} {"train_loss": -24.74018669128418, "global_step": 251010, "epoch": 3024} {"train_loss": -24.605398178100586, "global_step": 251011, "epoch": 3024} {"train_loss": -24.822921752929688, "global_step": 251012, "epoch": 3024} {"train_loss": -24.502161026000977, "global_step": 251013, "epoch": 3024} {"train_loss": -24.656845092773438, "global_step": 251014, "epoch": 3024} {"train_loss": -24.89459800720215, "global_step": 251015, "epoch": 3024} {"train_loss": -24.75741958618164, "global_step": 251016, "epoch": 3024} {"train_loss": -24.8448429107666, "global_step": 251017, "epoch": 3024} {"train_loss": -24.608135223388672, "global_step": 251018, "epoch": 3024} {"train_loss": -24.75286865234375, "global_step": 251019, "epoch": 3024} {"train_loss": -24.832294464111328, "global_step": 251020, "epoch": 3024} {"train_loss": -24.769367218017578, "global_step": 251021, "epoch": 3024} {"train_loss": -25.081180572509766, "global_step": 251022, "epoch": 3024} {"train_loss": -24.87752342224121, "global_step": 251023, "epoch": 3024} {"train_loss": -24.811115264892578, "global_step": 251024, "epoch": 3024} {"train_loss": -25.449024200439453, "global_step": 251025, "epoch": 3024} {"train_loss": -24.979557037353516, "global_step": 251026, "epoch": 3024} {"train_loss": -24.988794326782227, "global_step": 251027, "epoch": 3024} {"train_loss": -25.069087982177734, "global_step": 251028, "epoch": 3024} {"train_loss": -24.887435913085938, "global_step": 251029, "epoch": 3024} {"train_loss": -24.847766876220703, "global_step": 251030, "epoch": 3024} {"train_loss": -25.072561264038086, "global_step": 251031, "epoch": 3024} {"train_loss": -25.032550811767578, "global_step": 251032, "epoch": 3024} {"train_loss": -25.176788330078125, "global_step": 251033, "epoch": 3024} {"train_loss": -24.893918991088867, "global_step": 251034, "epoch": 3024} {"train_loss": -24.746389389038086, "global_step": 251035, "epoch": 3024} {"train_loss": -24.732847213745117, "global_step": 251036, "epoch": 3024} {"train_loss": -25.2058048248291, "global_step": 251037, "epoch": 3024} {"train_loss": -24.920305252075195, "global_step": 251038, "epoch": 3024} {"train_loss": -25.230972290039062, "global_step": 251039, "epoch": 3024} {"train_loss": -25.194171905517578, "global_step": 251040, "epoch": 3024} {"train_loss": -24.633901596069336, "global_step": 251041, "epoch": 3024} {"train_loss": -25.224031448364258, "global_step": 251042, "epoch": 3024} {"train_loss": -24.84781837463379, "global_step": 251043, "epoch": 3024} {"train_loss": -25.094839096069336, "global_step": 251044, "epoch": 3024} {"train_loss": -25.130582809448242, "global_step": 251045, "epoch": 3024} {"train_loss": -24.64879608154297, "global_step": 251046, "epoch": 3024} {"train_loss": -24.885618209838867, "global_step": 251047, "epoch": 3024} {"train_loss": -25.416982650756836, "global_step": 251048, "epoch": 3024} {"train_loss": -25.089643478393555, "global_step": 251049, "epoch": 3024} {"train_loss": -25.112619400024414, "global_step": 251050, "epoch": 3024} {"train_loss": -25.03578758239746, "global_step": 251051, "epoch": 3024} {"train_loss": -24.996259689331055, "global_step": 251052, "epoch": 3024} {"train_loss": -25.160140991210938, "global_step": 251053, "epoch": 3024} {"train_loss": -24.728300094604492, "global_step": 251054, "epoch": 3024} {"train_loss": -24.91355323791504, "global_step": 251055, "epoch": 3024} {"train_loss": -25.294340133666992, "global_step": 251056, "epoch": 3024} {"train_loss": -25.237716674804688, "global_step": 251057, "epoch": 3024} {"train_loss": -24.81513786315918, "global_step": 251058, "epoch": 3024} {"train_loss": -24.333526611328125, "global_step": 251059, "epoch": 3024} {"train_loss": -24.579824447631836, "global_step": 251060, "epoch": 3024} {"train_loss": -24.42487144470215, "global_step": 251061, "epoch": 3024} {"train_loss": -25.15203094482422, "global_step": 251062, "epoch": 3024} {"train_loss": -24.973867416381836, "global_step": 251063, "epoch": 3024} {"train_loss": -25.001300811767578, "global_step": 251064, "epoch": 3024} {"train_loss": -25.151159286499023, "global_step": 251065, "epoch": 3024} {"train_loss": -24.392953872680664, "global_step": 251066, "epoch": 3024} {"train_loss": -24.94581413269043, "global_step": 251067, "epoch": 3024} {"train_loss": -24.96831512451172, "global_step": 251068, "epoch": 3024} {"train_loss": -24.879575729370117, "global_step": 251069, "epoch": 3024} {"train_loss": -25.20098114013672, "global_step": 251070, "epoch": 3024} {"train_loss": -25.010507583618164, "global_step": 251071, "epoch": 3024} {"train_loss": -24.437458038330078, "global_step": 251072, "epoch": 3024} {"train_loss": -24.906518936157227, "global_step": 251073, "epoch": 3024} {"train_loss": -24.812318709959467, "global_step": 251074, "epoch": 3024, "val_loss": 6890293.0} {"train_loss": -24.28798484802246, "global_step": 251075, "epoch": 3025} {"train_loss": -24.348615646362305, "global_step": 251076, "epoch": 3025} {"train_loss": -24.5615291595459, "global_step": 251077, "epoch": 3025} {"train_loss": -24.715940475463867, "global_step": 251078, "epoch": 3025} {"train_loss": -24.32177734375, "global_step": 251079, "epoch": 3025} {"train_loss": -24.665302276611328, "global_step": 251080, "epoch": 3025} {"train_loss": -24.568368911743164, "global_step": 251081, "epoch": 3025} {"train_loss": -24.281179428100586, "global_step": 251082, "epoch": 3025} {"train_loss": -24.70692253112793, "global_step": 251083, "epoch": 3025} {"train_loss": -24.84564781188965, "global_step": 251084, "epoch": 3025} {"train_loss": -24.689346313476562, "global_step": 251085, "epoch": 3025} {"train_loss": -25.110517501831055, "global_step": 251086, "epoch": 3025} {"train_loss": -24.791275024414062, "global_step": 251087, "epoch": 3025} {"train_loss": -24.758438110351562, "global_step": 251088, "epoch": 3025} {"train_loss": -25.3872127532959, "global_step": 251089, "epoch": 3025} {"train_loss": -25.162153244018555, "global_step": 251090, "epoch": 3025} {"train_loss": -24.827360153198242, "global_step": 251091, "epoch": 3025} {"train_loss": -24.87929344177246, "global_step": 251092, "epoch": 3025} {"train_loss": -24.89784049987793, "global_step": 251093, "epoch": 3025} {"train_loss": -24.91873550415039, "global_step": 251094, "epoch": 3025} {"train_loss": -24.68651008605957, "global_step": 251095, "epoch": 3025} {"train_loss": -24.904394149780273, "global_step": 251096, "epoch": 3025} {"train_loss": -25.03850746154785, "global_step": 251097, "epoch": 3025} {"train_loss": -25.103960037231445, "global_step": 251098, "epoch": 3025} {"train_loss": -25.027523040771484, "global_step": 251099, "epoch": 3025} {"train_loss": -24.759531021118164, "global_step": 251100, "epoch": 3025} {"train_loss": -25.187793731689453, "global_step": 251101, "epoch": 3025} {"train_loss": -24.573505401611328, "global_step": 251102, "epoch": 3025} {"train_loss": -25.164045333862305, "global_step": 251103, "epoch": 3025} {"train_loss": -25.402509689331055, "global_step": 251104, "epoch": 3025} {"train_loss": -25.221359252929688, "global_step": 251105, "epoch": 3025} {"train_loss": -25.172348022460938, "global_step": 251106, "epoch": 3025} {"train_loss": -25.64629554748535, "global_step": 251107, "epoch": 3025} {"train_loss": -25.330997467041016, "global_step": 251108, "epoch": 3025} {"train_loss": -24.824325561523438, "global_step": 251109, "epoch": 3025} {"train_loss": -24.88409996032715, "global_step": 251110, "epoch": 3025} {"train_loss": -24.715322494506836, "global_step": 251111, "epoch": 3025} {"train_loss": -24.9257755279541, "global_step": 251112, "epoch": 3025} {"train_loss": -25.308841705322266, "global_step": 251113, "epoch": 3025} {"train_loss": -24.844675064086914, "global_step": 251114, "epoch": 3025} {"train_loss": -25.28242301940918, "global_step": 251115, "epoch": 3025} {"train_loss": -25.431821823120117, "global_step": 251116, "epoch": 3025} {"train_loss": -25.178518295288086, "global_step": 251117, "epoch": 3025} {"train_loss": -24.95152473449707, "global_step": 251118, "epoch": 3025} {"train_loss": -25.388818740844727, "global_step": 251119, "epoch": 3025} {"train_loss": -24.98299789428711, "global_step": 251120, "epoch": 3025} {"train_loss": -25.040477752685547, "global_step": 251121, "epoch": 3025} {"train_loss": -25.29300880432129, "global_step": 251122, "epoch": 3025} {"train_loss": -24.951871871948242, "global_step": 251123, "epoch": 3025} {"train_loss": -24.942697525024414, "global_step": 251124, "epoch": 3025} {"train_loss": -25.161298751831055, "global_step": 251125, "epoch": 3025} {"train_loss": -24.726547241210938, "global_step": 251126, "epoch": 3025} {"train_loss": -24.9809627532959, "global_step": 251127, "epoch": 3025} {"train_loss": -24.729272842407227, "global_step": 251128, "epoch": 3025} {"train_loss": -24.962644577026367, "global_step": 251129, "epoch": 3025} {"train_loss": -24.84554100036621, "global_step": 251130, "epoch": 3025} {"train_loss": -25.302885055541992, "global_step": 251131, "epoch": 3025} {"train_loss": -25.365097045898438, "global_step": 251132, "epoch": 3025} {"train_loss": -25.12229347229004, "global_step": 251133, "epoch": 3025} {"train_loss": -25.112531661987305, "global_step": 251134, "epoch": 3025} {"train_loss": -25.1324520111084, "global_step": 251135, "epoch": 3025} {"train_loss": -25.100534439086914, "global_step": 251136, "epoch": 3025} {"train_loss": -25.26179313659668, "global_step": 251137, "epoch": 3025} {"train_loss": -25.048959732055664, "global_step": 251138, "epoch": 3025} {"train_loss": -25.31157112121582, "global_step": 251139, "epoch": 3025} {"train_loss": -24.98457908630371, "global_step": 251140, "epoch": 3025} {"train_loss": -25.137828826904297, "global_step": 251141, "epoch": 3025} {"train_loss": -24.79913902282715, "global_step": 251142, "epoch": 3025} {"train_loss": -25.042434692382812, "global_step": 251143, "epoch": 3025} {"train_loss": -24.896743774414062, "global_step": 251144, "epoch": 3025} {"train_loss": -25.056928634643555, "global_step": 251145, "epoch": 3025} {"train_loss": -25.1356258392334, "global_step": 251146, "epoch": 3025} {"train_loss": -24.839431762695312, "global_step": 251147, "epoch": 3025} {"train_loss": -24.908079147338867, "global_step": 251148, "epoch": 3025} {"train_loss": -24.993247985839844, "global_step": 251149, "epoch": 3025} {"train_loss": -25.16927146911621, "global_step": 251150, "epoch": 3025} {"train_loss": -25.298704147338867, "global_step": 251151, "epoch": 3025} {"train_loss": -25.143417358398438, "global_step": 251152, "epoch": 3025} {"train_loss": -25.376853942871094, "global_step": 251153, "epoch": 3025} {"train_loss": -25.11910057067871, "global_step": 251154, "epoch": 3025} {"train_loss": -24.915395736694336, "global_step": 251155, "epoch": 3025} {"train_loss": -24.859210968017578, "global_step": 251156, "epoch": 3025} {"train_loss": -24.98959575790957, "global_step": 251157, "epoch": 3025, "val_loss": 6975059.0} {"train_loss": -24.246795654296875, "global_step": 251158, "epoch": 3026} {"train_loss": -24.13321876525879, "global_step": 251159, "epoch": 3026} {"train_loss": -24.111907958984375, "global_step": 251160, "epoch": 3026} {"train_loss": -24.528650283813477, "global_step": 251161, "epoch": 3026} {"train_loss": -24.7531795501709, "global_step": 251162, "epoch": 3026} {"train_loss": -24.453964233398438, "global_step": 251163, "epoch": 3026} {"train_loss": -24.83835220336914, "global_step": 251164, "epoch": 3026} {"train_loss": -24.923288345336914, "global_step": 251165, "epoch": 3026} {"train_loss": -24.954669952392578, "global_step": 251166, "epoch": 3026} {"train_loss": -24.79804801940918, "global_step": 251167, "epoch": 3026} {"train_loss": -24.923860549926758, "global_step": 251168, "epoch": 3026} {"train_loss": -24.79850959777832, "global_step": 251169, "epoch": 3026} {"train_loss": -24.647598266601562, "global_step": 251170, "epoch": 3026} {"train_loss": -24.768888473510742, "global_step": 251171, "epoch": 3026} {"train_loss": -24.92820167541504, "global_step": 251172, "epoch": 3026} {"train_loss": -24.994428634643555, "global_step": 251173, "epoch": 3026} {"train_loss": -24.778106689453125, "global_step": 251174, "epoch": 3026} {"train_loss": -25.3215389251709, "global_step": 251175, "epoch": 3026} {"train_loss": -24.882692337036133, "global_step": 251176, "epoch": 3026} {"train_loss": -24.835546493530273, "global_step": 251177, "epoch": 3026} {"train_loss": -24.62982749938965, "global_step": 251178, "epoch": 3026} {"train_loss": -24.6694278717041, "global_step": 251179, "epoch": 3026} {"train_loss": -24.980504989624023, "global_step": 251180, "epoch": 3026} {"train_loss": -24.774524688720703, "global_step": 251181, "epoch": 3026} {"train_loss": -24.689306259155273, "global_step": 251182, "epoch": 3026} {"train_loss": -25.037548065185547, "global_step": 251183, "epoch": 3026} {"train_loss": -24.925827026367188, "global_step": 251184, "epoch": 3026} {"train_loss": -24.710453033447266, "global_step": 251185, "epoch": 3026} {"train_loss": -25.15646743774414, "global_step": 251186, "epoch": 3026} {"train_loss": -24.993906021118164, "global_step": 251187, "epoch": 3026} {"train_loss": -24.9017333984375, "global_step": 251188, "epoch": 3026} {"train_loss": -24.959440231323242, "global_step": 251189, "epoch": 3026} {"train_loss": -24.89457130432129, "global_step": 251190, "epoch": 3026} {"train_loss": -24.727235794067383, "global_step": 251191, "epoch": 3026} {"train_loss": -24.88967514038086, "global_step": 251192, "epoch": 3026} {"train_loss": -24.91721534729004, "global_step": 251193, "epoch": 3026} {"train_loss": -25.01190185546875, "global_step": 251194, "epoch": 3026} {"train_loss": -25.094894409179688, "global_step": 251195, "epoch": 3026} {"train_loss": -24.499521255493164, "global_step": 251196, "epoch": 3026} {"train_loss": -25.43105697631836, "global_step": 251197, "epoch": 3026} {"train_loss": -25.59590721130371, "global_step": 251198, "epoch": 3026} {"train_loss": -25.039884567260742, "global_step": 251199, "epoch": 3026} {"train_loss": -24.996564865112305, "global_step": 251200, "epoch": 3026} {"train_loss": -25.00873374938965, "global_step": 251201, "epoch": 3026} {"train_loss": -25.32566261291504, "global_step": 251202, "epoch": 3026} {"train_loss": -24.83763885498047, "global_step": 251203, "epoch": 3026} {"train_loss": -24.92872428894043, "global_step": 251204, "epoch": 3026} {"train_loss": -24.89791488647461, "global_step": 251205, "epoch": 3026} {"train_loss": -25.237886428833008, "global_step": 251206, "epoch": 3026} {"train_loss": -24.962596893310547, "global_step": 251207, "epoch": 3026} {"train_loss": -24.903636932373047, "global_step": 251208, "epoch": 3026} {"train_loss": -25.24045753479004, "global_step": 251209, "epoch": 3026} {"train_loss": -25.170541763305664, "global_step": 251210, "epoch": 3026} {"train_loss": -24.510221481323242, "global_step": 251211, "epoch": 3026} {"train_loss": -24.836782455444336, "global_step": 251212, "epoch": 3026} {"train_loss": -24.91993522644043, "global_step": 251213, "epoch": 3026} {"train_loss": -25.073974609375, "global_step": 251214, "epoch": 3026} {"train_loss": -24.898832321166992, "global_step": 251215, "epoch": 3026} {"train_loss": -25.033735275268555, "global_step": 251216, "epoch": 3026} {"train_loss": -24.719633102416992, "global_step": 251217, "epoch": 3026} {"train_loss": -24.696033477783203, "global_step": 251218, "epoch": 3026} {"train_loss": -25.091594696044922, "global_step": 251219, "epoch": 3026} {"train_loss": -24.770431518554688, "global_step": 251220, "epoch": 3026} {"train_loss": -24.956878662109375, "global_step": 251221, "epoch": 3026} {"train_loss": -25.25467872619629, "global_step": 251222, "epoch": 3026} {"train_loss": -24.747663497924805, "global_step": 251223, "epoch": 3026} {"train_loss": -24.836692810058594, "global_step": 251224, "epoch": 3026} {"train_loss": -25.342023849487305, "global_step": 251225, "epoch": 3026} {"train_loss": -25.099599838256836, "global_step": 251226, "epoch": 3026} {"train_loss": -24.98464012145996, "global_step": 251227, "epoch": 3026} {"train_loss": -25.013002395629883, "global_step": 251228, "epoch": 3026} {"train_loss": -24.87177848815918, "global_step": 251229, "epoch": 3026} {"train_loss": -24.889738082885742, "global_step": 251230, "epoch": 3026} {"train_loss": -24.879751205444336, "global_step": 251231, "epoch": 3026} {"train_loss": -24.977869033813477, "global_step": 251232, "epoch": 3026} {"train_loss": -25.08841323852539, "global_step": 251233, "epoch": 3026} {"train_loss": -25.218402862548828, "global_step": 251234, "epoch": 3026} {"train_loss": -25.0986385345459, "global_step": 251235, "epoch": 3026} {"train_loss": -24.972883224487305, "global_step": 251236, "epoch": 3026} {"train_loss": -25.375097274780273, "global_step": 251237, "epoch": 3026} {"train_loss": -25.264968872070312, "global_step": 251238, "epoch": 3026} {"train_loss": -24.474424362182617, "global_step": 251239, "epoch": 3026} {"train_loss": -24.919318371508496, "global_step": 251240, "epoch": 3026, "val_loss": 6951035.0} {"train_loss": -24.25807762145996, "global_step": 251241, "epoch": 3027} {"train_loss": -24.365535736083984, "global_step": 251242, "epoch": 3027} {"train_loss": -24.595064163208008, "global_step": 251243, "epoch": 3027} {"train_loss": -24.116384506225586, "global_step": 251244, "epoch": 3027} {"train_loss": -24.630483627319336, "global_step": 251245, "epoch": 3027} {"train_loss": -24.568899154663086, "global_step": 251246, "epoch": 3027} {"train_loss": -24.8508358001709, "global_step": 251247, "epoch": 3027} {"train_loss": -24.9154109954834, "global_step": 251248, "epoch": 3027} {"train_loss": -25.034215927124023, "global_step": 251249, "epoch": 3027} {"train_loss": -24.569782257080078, "global_step": 251250, "epoch": 3027} {"train_loss": -25.060163497924805, "global_step": 251251, "epoch": 3027} {"train_loss": -24.438709259033203, "global_step": 251252, "epoch": 3027} {"train_loss": -24.50587272644043, "global_step": 251253, "epoch": 3027} {"train_loss": -24.680194854736328, "global_step": 251254, "epoch": 3027} {"train_loss": -25.05530548095703, "global_step": 251255, "epoch": 3027} {"train_loss": -24.652843475341797, "global_step": 251256, "epoch": 3027} {"train_loss": -24.9774227142334, "global_step": 251257, "epoch": 3027} {"train_loss": -24.805261611938477, "global_step": 251258, "epoch": 3027} {"train_loss": -25.030622482299805, "global_step": 251259, "epoch": 3027} {"train_loss": -24.91126823425293, "global_step": 251260, "epoch": 3027} {"train_loss": -24.636728286743164, "global_step": 251261, "epoch": 3027} {"train_loss": -25.169692993164062, "global_step": 251262, "epoch": 3027} {"train_loss": -24.88690185546875, "global_step": 251263, "epoch": 3027} {"train_loss": -24.403034210205078, "global_step": 251264, "epoch": 3027} {"train_loss": -24.95699119567871, "global_step": 251265, "epoch": 3027} {"train_loss": -25.03925323486328, "global_step": 251266, "epoch": 3027} {"train_loss": -24.957712173461914, "global_step": 251267, "epoch": 3027} {"train_loss": -24.82559585571289, "global_step": 251268, "epoch": 3027} {"train_loss": -24.971364974975586, "global_step": 251269, "epoch": 3027} {"train_loss": -25.40577507019043, "global_step": 251270, "epoch": 3027} {"train_loss": -24.94345474243164, "global_step": 251271, "epoch": 3027} {"train_loss": -25.347314834594727, "global_step": 251272, "epoch": 3027} {"train_loss": -25.204864501953125, "global_step": 251273, "epoch": 3027} {"train_loss": -25.45846939086914, "global_step": 251274, "epoch": 3027} {"train_loss": -24.992080688476562, "global_step": 251275, "epoch": 3027} {"train_loss": -25.45734977722168, "global_step": 251276, "epoch": 3027} {"train_loss": -25.02855682373047, "global_step": 251277, "epoch": 3027} {"train_loss": -25.384519577026367, "global_step": 251278, "epoch": 3027} {"train_loss": -24.731582641601562, "global_step": 251279, "epoch": 3027} {"train_loss": -25.066486358642578, "global_step": 251280, "epoch": 3027} {"train_loss": -25.071420669555664, "global_step": 251281, "epoch": 3027} {"train_loss": -25.005821228027344, "global_step": 251282, "epoch": 3027} {"train_loss": -25.21772575378418, "global_step": 251283, "epoch": 3027} {"train_loss": -25.3536434173584, "global_step": 251284, "epoch": 3027} {"train_loss": -25.063892364501953, "global_step": 251285, "epoch": 3027} {"train_loss": -24.784835815429688, "global_step": 251286, "epoch": 3027} {"train_loss": -25.057767868041992, "global_step": 251287, "epoch": 3027} {"train_loss": -25.15028953552246, "global_step": 251288, "epoch": 3027} {"train_loss": -25.410703659057617, "global_step": 251289, "epoch": 3027} {"train_loss": -25.263160705566406, "global_step": 251290, "epoch": 3027} {"train_loss": -24.95508575439453, "global_step": 251291, "epoch": 3027} {"train_loss": -24.809539794921875, "global_step": 251292, "epoch": 3027} {"train_loss": -25.03607940673828, "global_step": 251293, "epoch": 3027} {"train_loss": -24.873441696166992, "global_step": 251294, "epoch": 3027} {"train_loss": -24.990201950073242, "global_step": 251295, "epoch": 3027} {"train_loss": -25.180377960205078, "global_step": 251296, "epoch": 3027} {"train_loss": -25.240694046020508, "global_step": 251297, "epoch": 3027} {"train_loss": -24.91756820678711, "global_step": 251298, "epoch": 3027} {"train_loss": -24.875553131103516, "global_step": 251299, "epoch": 3027} {"train_loss": -25.231769561767578, "global_step": 251300, "epoch": 3027} {"train_loss": -25.152053833007812, "global_step": 251301, "epoch": 3027} {"train_loss": -25.113927841186523, "global_step": 251302, "epoch": 3027} {"train_loss": -25.252187728881836, "global_step": 251303, "epoch": 3027} {"train_loss": -25.30510902404785, "global_step": 251304, "epoch": 3027} {"train_loss": -25.249088287353516, "global_step": 251305, "epoch": 3027} {"train_loss": -25.63648796081543, "global_step": 251306, "epoch": 3027} {"train_loss": -25.51954460144043, "global_step": 251307, "epoch": 3027} {"train_loss": -25.34113121032715, "global_step": 251308, "epoch": 3027} {"train_loss": -25.034385681152344, "global_step": 251309, "epoch": 3027} {"train_loss": -25.10504722595215, "global_step": 251310, "epoch": 3027} {"train_loss": -24.960052490234375, "global_step": 251311, "epoch": 3027} {"train_loss": -24.7447566986084, "global_step": 251312, "epoch": 3027} {"train_loss": -24.965835571289062, "global_step": 251313, "epoch": 3027} {"train_loss": -25.07305908203125, "global_step": 251314, "epoch": 3027} {"train_loss": -24.891952514648438, "global_step": 251315, "epoch": 3027} {"train_loss": -24.98284149169922, "global_step": 251316, "epoch": 3027} {"train_loss": -24.96848487854004, "global_step": 251317, "epoch": 3027} {"train_loss": -25.075481414794922, "global_step": 251318, "epoch": 3027} {"train_loss": -25.067604064941406, "global_step": 251319, "epoch": 3027} {"train_loss": -25.13776206970215, "global_step": 251320, "epoch": 3027} {"train_loss": -24.877042770385742, "global_step": 251321, "epoch": 3027} {"train_loss": -24.966703414916992, "global_step": 251322, "epoch": 3027} {"train_loss": -25.015943596161993, "global_step": 251323, "epoch": 3027, "val_loss": 6803420.0} {"train_loss": -24.01828384399414, "global_step": 251324, "epoch": 3028} {"train_loss": -24.278432846069336, "global_step": 251325, "epoch": 3028} {"train_loss": -24.785186767578125, "global_step": 251326, "epoch": 3028} {"train_loss": -24.6771183013916, "global_step": 251327, "epoch": 3028} {"train_loss": -24.675073623657227, "global_step": 251328, "epoch": 3028} {"train_loss": -24.659948348999023, "global_step": 251329, "epoch": 3028} {"train_loss": -24.761241912841797, "global_step": 251330, "epoch": 3028} {"train_loss": -24.543556213378906, "global_step": 251331, "epoch": 3028} {"train_loss": -24.827838897705078, "global_step": 251332, "epoch": 3028} {"train_loss": -24.940006256103516, "global_step": 251333, "epoch": 3028} {"train_loss": -24.652326583862305, "global_step": 251334, "epoch": 3028} {"train_loss": -24.77931022644043, "global_step": 251335, "epoch": 3028} {"train_loss": -25.208410263061523, "global_step": 251336, "epoch": 3028} {"train_loss": -24.66448211669922, "global_step": 251337, "epoch": 3028} {"train_loss": -24.654979705810547, "global_step": 251338, "epoch": 3028} {"train_loss": -24.405197143554688, "global_step": 251339, "epoch": 3028} {"train_loss": -24.24176597595215, "global_step": 251340, "epoch": 3028} {"train_loss": -24.535724639892578, "global_step": 251341, "epoch": 3028} {"train_loss": -24.843719482421875, "global_step": 251342, "epoch": 3028} {"train_loss": -24.970752716064453, "global_step": 251343, "epoch": 3028} {"train_loss": -24.66059684753418, "global_step": 251344, "epoch": 3028} {"train_loss": -25.045602798461914, "global_step": 251345, "epoch": 3028} {"train_loss": -24.841453552246094, "global_step": 251346, "epoch": 3028} {"train_loss": -25.159744262695312, "global_step": 251347, "epoch": 3028} {"train_loss": -24.545185089111328, "global_step": 251348, "epoch": 3028} {"train_loss": -24.96687889099121, "global_step": 251349, "epoch": 3028} {"train_loss": -24.8568115234375, "global_step": 251350, "epoch": 3028} {"train_loss": -24.93610954284668, "global_step": 251351, "epoch": 3028} {"train_loss": -24.846385955810547, "global_step": 251352, "epoch": 3028} {"train_loss": -25.11359977722168, "global_step": 251353, "epoch": 3028} {"train_loss": -24.878305435180664, "global_step": 251354, "epoch": 3028} {"train_loss": -24.68487548828125, "global_step": 251355, "epoch": 3028} {"train_loss": -24.906150817871094, "global_step": 251356, "epoch": 3028} {"train_loss": -24.793598175048828, "global_step": 251357, "epoch": 3028} {"train_loss": -25.10654067993164, "global_step": 251358, "epoch": 3028} {"train_loss": -25.04745864868164, "global_step": 251359, "epoch": 3028} {"train_loss": -24.83821678161621, "global_step": 251360, "epoch": 3028} {"train_loss": -24.942813873291016, "global_step": 251361, "epoch": 3028} {"train_loss": -24.95148277282715, "global_step": 251362, "epoch": 3028} {"train_loss": -25.022262573242188, "global_step": 251363, "epoch": 3028} {"train_loss": -24.93279266357422, "global_step": 251364, "epoch": 3028} {"train_loss": -24.85350799560547, "global_step": 251365, "epoch": 3028} {"train_loss": -24.75819969177246, "global_step": 251366, "epoch": 3028} {"train_loss": -25.176359176635742, "global_step": 251367, "epoch": 3028} {"train_loss": -25.07986831665039, "global_step": 251368, "epoch": 3028} {"train_loss": -25.05229949951172, "global_step": 251369, "epoch": 3028} {"train_loss": -25.220623016357422, "global_step": 251370, "epoch": 3028} {"train_loss": -25.280668258666992, "global_step": 251371, "epoch": 3028} {"train_loss": -25.16001319885254, "global_step": 251372, "epoch": 3028} {"train_loss": -25.272308349609375, "global_step": 251373, "epoch": 3028} {"train_loss": -24.870193481445312, "global_step": 251374, "epoch": 3028} {"train_loss": -25.399658203125, "global_step": 251375, "epoch": 3028} {"train_loss": -25.158248901367188, "global_step": 251376, "epoch": 3028} {"train_loss": -25.27144432067871, "global_step": 251377, "epoch": 3028} {"train_loss": -25.351247787475586, "global_step": 251378, "epoch": 3028} {"train_loss": -25.118961334228516, "global_step": 251379, "epoch": 3028} {"train_loss": -25.011938095092773, "global_step": 251380, "epoch": 3028} {"train_loss": -25.045595169067383, "global_step": 251381, "epoch": 3028} {"train_loss": -25.086589813232422, "global_step": 251382, "epoch": 3028} {"train_loss": -25.038867950439453, "global_step": 251383, "epoch": 3028} {"train_loss": -24.990753173828125, "global_step": 251384, "epoch": 3028} {"train_loss": -25.389535903930664, "global_step": 251385, "epoch": 3028} {"train_loss": -25.297399520874023, "global_step": 251386, "epoch": 3028} {"train_loss": -25.007688522338867, "global_step": 251387, "epoch": 3028} {"train_loss": -24.96953582763672, "global_step": 251388, "epoch": 3028} {"train_loss": -25.024070739746094, "global_step": 251389, "epoch": 3028} {"train_loss": -25.348392486572266, "global_step": 251390, "epoch": 3028} {"train_loss": -24.78359031677246, "global_step": 251391, "epoch": 3028} {"train_loss": -25.351924896240234, "global_step": 251392, "epoch": 3028} {"train_loss": -25.296688079833984, "global_step": 251393, "epoch": 3028} {"train_loss": -25.22321891784668, "global_step": 251394, "epoch": 3028} {"train_loss": -25.361331939697266, "global_step": 251395, "epoch": 3028} {"train_loss": -25.20755386352539, "global_step": 251396, "epoch": 3028} {"train_loss": -24.94117546081543, "global_step": 251397, "epoch": 3028} {"train_loss": -24.91316795349121, "global_step": 251398, "epoch": 3028} {"train_loss": -25.15325355529785, "global_step": 251399, "epoch": 3028} {"train_loss": -24.735668182373047, "global_step": 251400, "epoch": 3028} {"train_loss": -24.864835739135742, "global_step": 251401, "epoch": 3028} {"train_loss": -25.294601440429688, "global_step": 251402, "epoch": 3028} {"train_loss": -25.22585105895996, "global_step": 251403, "epoch": 3028} {"train_loss": -24.98452377319336, "global_step": 251404, "epoch": 3028} {"train_loss": -25.38693618774414, "global_step": 251405, "epoch": 3028} {"train_loss": -24.94909684054823, "global_step": 251406, "epoch": 3028, "val_loss": 6992180.0} {"train_loss": -23.99810791015625, "global_step": 251407, "epoch": 3029} {"train_loss": -24.43216896057129, "global_step": 251408, "epoch": 3029} {"train_loss": -24.33877944946289, "global_step": 251409, "epoch": 3029} {"train_loss": -24.138479232788086, "global_step": 251410, "epoch": 3029} {"train_loss": -24.19565773010254, "global_step": 251411, "epoch": 3029} {"train_loss": -23.964832305908203, "global_step": 251412, "epoch": 3029} {"train_loss": -24.643686294555664, "global_step": 251413, "epoch": 3029} {"train_loss": -24.23462677001953, "global_step": 251414, "epoch": 3029} {"train_loss": -24.459779739379883, "global_step": 251415, "epoch": 3029} {"train_loss": -23.876182556152344, "global_step": 251416, "epoch": 3029} {"train_loss": -23.95285415649414, "global_step": 251417, "epoch": 3029} {"train_loss": -24.732830047607422, "global_step": 251418, "epoch": 3029} {"train_loss": -24.258398056030273, "global_step": 251419, "epoch": 3029} {"train_loss": -24.320859909057617, "global_step": 251420, "epoch": 3029} {"train_loss": -24.824180603027344, "global_step": 251421, "epoch": 3029} {"train_loss": -24.84515380859375, "global_step": 251422, "epoch": 3029} {"train_loss": -24.280134201049805, "global_step": 251423, "epoch": 3029} {"train_loss": -24.77875518798828, "global_step": 251424, "epoch": 3029} {"train_loss": -24.63399314880371, "global_step": 251425, "epoch": 3029} {"train_loss": -24.750951766967773, "global_step": 251426, "epoch": 3029} {"train_loss": -24.78025245666504, "global_step": 251427, "epoch": 3029} {"train_loss": -24.803115844726562, "global_step": 251428, "epoch": 3029} {"train_loss": -24.69342613220215, "global_step": 251429, "epoch": 3029} {"train_loss": -24.653644561767578, "global_step": 251430, "epoch": 3029} {"train_loss": -24.986495971679688, "global_step": 251431, "epoch": 3029} {"train_loss": -24.91950035095215, "global_step": 251432, "epoch": 3029} {"train_loss": -24.62973976135254, "global_step": 251433, "epoch": 3029} {"train_loss": -24.975418090820312, "global_step": 251434, "epoch": 3029} {"train_loss": -24.874496459960938, "global_step": 251435, "epoch": 3029} {"train_loss": -25.22321891784668, "global_step": 251436, "epoch": 3029} {"train_loss": -24.944236755371094, "global_step": 251437, "epoch": 3029} {"train_loss": -25.039396286010742, "global_step": 251438, "epoch": 3029} {"train_loss": -24.92963218688965, "global_step": 251439, "epoch": 3029} {"train_loss": -24.984037399291992, "global_step": 251440, "epoch": 3029} {"train_loss": -25.07222557067871, "global_step": 251441, "epoch": 3029} {"train_loss": -25.100902557373047, "global_step": 251442, "epoch": 3029} {"train_loss": -25.19099235534668, "global_step": 251443, "epoch": 3029} {"train_loss": -25.22907066345215, "global_step": 251444, "epoch": 3029} {"train_loss": -24.776235580444336, "global_step": 251445, "epoch": 3029} {"train_loss": -25.511762619018555, "global_step": 251446, "epoch": 3029} {"train_loss": -25.148481369018555, "global_step": 251447, "epoch": 3029} {"train_loss": -25.54237174987793, "global_step": 251448, "epoch": 3029} {"train_loss": -25.329193115234375, "global_step": 251449, "epoch": 3029} {"train_loss": -25.225540161132812, "global_step": 251450, "epoch": 3029} {"train_loss": -24.82979393005371, "global_step": 251451, "epoch": 3029} {"train_loss": -24.783544540405273, "global_step": 251452, "epoch": 3029} {"train_loss": -24.71155548095703, "global_step": 251453, "epoch": 3029} {"train_loss": -25.109891891479492, "global_step": 251454, "epoch": 3029} {"train_loss": -25.291107177734375, "global_step": 251455, "epoch": 3029} {"train_loss": -24.991308212280273, "global_step": 251456, "epoch": 3029} {"train_loss": -25.184146881103516, "global_step": 251457, "epoch": 3029} {"train_loss": -24.848419189453125, "global_step": 251458, "epoch": 3029} {"train_loss": -25.11529541015625, "global_step": 251459, "epoch": 3029} {"train_loss": -24.955154418945312, "global_step": 251460, "epoch": 3029} {"train_loss": -24.71418571472168, "global_step": 251461, "epoch": 3029} {"train_loss": -25.231246948242188, "global_step": 251462, "epoch": 3029} {"train_loss": -25.132503509521484, "global_step": 251463, "epoch": 3029} {"train_loss": -24.7303409576416, "global_step": 251464, "epoch": 3029} {"train_loss": -25.11359214782715, "global_step": 251465, "epoch": 3029} {"train_loss": -25.014101028442383, "global_step": 251466, "epoch": 3029} {"train_loss": -24.93202018737793, "global_step": 251467, "epoch": 3029} {"train_loss": -24.931793212890625, "global_step": 251468, "epoch": 3029} {"train_loss": -25.101215362548828, "global_step": 251469, "epoch": 3029} {"train_loss": -25.019376754760742, "global_step": 251470, "epoch": 3029} {"train_loss": -25.19136619567871, "global_step": 251471, "epoch": 3029} {"train_loss": -25.01137351989746, "global_step": 251472, "epoch": 3029} {"train_loss": -25.175817489624023, "global_step": 251473, "epoch": 3029} {"train_loss": -25.19576072692871, "global_step": 251474, "epoch": 3029} {"train_loss": -25.056272506713867, "global_step": 251475, "epoch": 3029} {"train_loss": -24.951536178588867, "global_step": 251476, "epoch": 3029} {"train_loss": -24.9608097076416, "global_step": 251477, "epoch": 3029} {"train_loss": -25.142383575439453, "global_step": 251478, "epoch": 3029} {"train_loss": -25.104278564453125, "global_step": 251479, "epoch": 3029} {"train_loss": -25.196447372436523, "global_step": 251480, "epoch": 3029} {"train_loss": -25.031997680664062, "global_step": 251481, "epoch": 3029} {"train_loss": -24.92880630493164, "global_step": 251482, "epoch": 3029} {"train_loss": -24.888477325439453, "global_step": 251483, "epoch": 3029} {"train_loss": -25.188007354736328, "global_step": 251484, "epoch": 3029} {"train_loss": -25.087726593017578, "global_step": 251485, "epoch": 3029} {"train_loss": -25.258804321289062, "global_step": 251486, "epoch": 3029} {"train_loss": -25.026031494140625, "global_step": 251487, "epoch": 3029} {"train_loss": -24.977096557617188, "global_step": 251488, "epoch": 3029} {"train_loss": -24.881568770810784, "global_step": 251489, "epoch": 3029, "val_loss": 6814417.0} {"train_loss": -22.58791732788086, "global_step": 251490, "epoch": 3030} {"train_loss": -23.40997886657715, "global_step": 251491, "epoch": 3030} {"train_loss": -24.415281295776367, "global_step": 251492, "epoch": 3030} {"train_loss": -24.243946075439453, "global_step": 251493, "epoch": 3030} {"train_loss": -23.987672805786133, "global_step": 251494, "epoch": 3030} {"train_loss": -24.428909301757812, "global_step": 251495, "epoch": 3030} {"train_loss": -24.089452743530273, "global_step": 251496, "epoch": 3030} {"train_loss": -24.634782791137695, "global_step": 251497, "epoch": 3030} {"train_loss": -24.470993041992188, "global_step": 251498, "epoch": 3030} {"train_loss": -24.840124130249023, "global_step": 251499, "epoch": 3030} {"train_loss": -24.110074996948242, "global_step": 251500, "epoch": 3030} {"train_loss": -24.49934959411621, "global_step": 251501, "epoch": 3030} {"train_loss": -24.40105438232422, "global_step": 251502, "epoch": 3030} {"train_loss": -24.487674713134766, "global_step": 251503, "epoch": 3030} {"train_loss": -24.93916130065918, "global_step": 251504, "epoch": 3030} {"train_loss": -24.78688621520996, "global_step": 251505, "epoch": 3030} {"train_loss": -25.025270462036133, "global_step": 251506, "epoch": 3030} {"train_loss": -24.802093505859375, "global_step": 251507, "epoch": 3030} {"train_loss": -24.909183502197266, "global_step": 251508, "epoch": 3030} {"train_loss": -24.61051368713379, "global_step": 251509, "epoch": 3030} {"train_loss": -24.540197372436523, "global_step": 251510, "epoch": 3030} {"train_loss": -25.169660568237305, "global_step": 251511, "epoch": 3030} {"train_loss": -24.882389068603516, "global_step": 251512, "epoch": 3030} {"train_loss": -24.878671646118164, "global_step": 251513, "epoch": 3030} {"train_loss": -24.29863929748535, "global_step": 251514, "epoch": 3030} {"train_loss": -24.86661148071289, "global_step": 251515, "epoch": 3030} {"train_loss": -24.57401466369629, "global_step": 251516, "epoch": 3030} {"train_loss": -25.122358322143555, "global_step": 251517, "epoch": 3030} {"train_loss": -24.695632934570312, "global_step": 251518, "epoch": 3030} {"train_loss": -25.323699951171875, "global_step": 251519, "epoch": 3030} {"train_loss": -25.15492057800293, "global_step": 251520, "epoch": 3030} {"train_loss": -24.83266258239746, "global_step": 251521, "epoch": 3030} {"train_loss": -24.483524322509766, "global_step": 251522, "epoch": 3030} {"train_loss": -24.969085693359375, "global_step": 251523, "epoch": 3030} {"train_loss": -25.008459091186523, "global_step": 251524, "epoch": 3030} {"train_loss": -25.061019897460938, "global_step": 251525, "epoch": 3030} {"train_loss": -25.02004623413086, "global_step": 251526, "epoch": 3030} {"train_loss": -25.374013900756836, "global_step": 251527, "epoch": 3030} {"train_loss": -25.09942054748535, "global_step": 251528, "epoch": 3030} {"train_loss": -25.290075302124023, "global_step": 251529, "epoch": 3030} {"train_loss": -25.01039695739746, "global_step": 251530, "epoch": 3030} {"train_loss": -25.177143096923828, "global_step": 251531, "epoch": 3030} {"train_loss": -24.980024337768555, "global_step": 251532, "epoch": 3030} {"train_loss": -25.01534080505371, "global_step": 251533, "epoch": 3030} {"train_loss": -24.828144073486328, "global_step": 251534, "epoch": 3030} {"train_loss": -25.238056182861328, "global_step": 251535, "epoch": 3030} {"train_loss": -24.995290756225586, "global_step": 251536, "epoch": 3030} {"train_loss": -25.03253173828125, "global_step": 251537, "epoch": 3030} {"train_loss": -25.188879013061523, "global_step": 251538, "epoch": 3030} {"train_loss": -25.256845474243164, "global_step": 251539, "epoch": 3030} {"train_loss": -24.594465255737305, "global_step": 251540, "epoch": 3030} {"train_loss": -25.09718132019043, "global_step": 251541, "epoch": 3030} {"train_loss": -25.3427791595459, "global_step": 251542, "epoch": 3030} {"train_loss": -25.32883071899414, "global_step": 251543, "epoch": 3030} {"train_loss": -25.14524269104004, "global_step": 251544, "epoch": 3030} {"train_loss": -25.10943031311035, "global_step": 251545, "epoch": 3030} {"train_loss": -24.9239559173584, "global_step": 251546, "epoch": 3030} {"train_loss": -25.162582397460938, "global_step": 251547, "epoch": 3030} {"train_loss": -25.4017391204834, "global_step": 251548, "epoch": 3030} {"train_loss": -25.253686904907227, "global_step": 251549, "epoch": 3030} {"train_loss": -25.121381759643555, "global_step": 251550, "epoch": 3030} {"train_loss": -25.054601669311523, "global_step": 251551, "epoch": 3030} {"train_loss": -25.031633377075195, "global_step": 251552, "epoch": 3030} {"train_loss": -24.888938903808594, "global_step": 251553, "epoch": 3030} {"train_loss": -25.401960372924805, "global_step": 251554, "epoch": 3030} {"train_loss": -25.144718170166016, "global_step": 251555, "epoch": 3030} {"train_loss": -25.27555274963379, "global_step": 251556, "epoch": 3030} {"train_loss": -25.10958480834961, "global_step": 251557, "epoch": 3030} {"train_loss": -25.457151412963867, "global_step": 251558, "epoch": 3030} {"train_loss": -24.97585105895996, "global_step": 251559, "epoch": 3030} {"train_loss": -24.442594528198242, "global_step": 251560, "epoch": 3030} {"train_loss": -24.770292282104492, "global_step": 251561, "epoch": 3030} {"train_loss": -24.72463607788086, "global_step": 251562, "epoch": 3030} {"train_loss": -24.695560455322266, "global_step": 251563, "epoch": 3030} {"train_loss": -25.145038604736328, "global_step": 251564, "epoch": 3030} {"train_loss": -24.859024047851562, "global_step": 251565, "epoch": 3030} {"train_loss": -25.00636863708496, "global_step": 251566, "epoch": 3030} {"train_loss": -24.837369918823242, "global_step": 251567, "epoch": 3030} {"train_loss": -24.959949493408203, "global_step": 251568, "epoch": 3030} {"train_loss": -24.42171859741211, "global_step": 251569, "epoch": 3030} {"train_loss": -24.807249069213867, "global_step": 251570, "epoch": 3030} {"train_loss": -25.080352783203125, "global_step": 251571, "epoch": 3030} {"train_loss": -24.84425250593438, "global_step": 251572, "epoch": 3030, "val_loss": 6880273.0} {"train_loss": -23.967275619506836, "global_step": 251573, "epoch": 3031} {"train_loss": -23.946531295776367, "global_step": 251574, "epoch": 3031} {"train_loss": -24.764074325561523, "global_step": 251575, "epoch": 3031} {"train_loss": -23.020124435424805, "global_step": 251576, "epoch": 3031} {"train_loss": -23.682636260986328, "global_step": 251577, "epoch": 3031} {"train_loss": -24.79817771911621, "global_step": 251578, "epoch": 3031} {"train_loss": -24.373737335205078, "global_step": 251579, "epoch": 3031} {"train_loss": -24.768613815307617, "global_step": 251580, "epoch": 3031} {"train_loss": -24.367774963378906, "global_step": 251581, "epoch": 3031} {"train_loss": -24.37367057800293, "global_step": 251582, "epoch": 3031} {"train_loss": -23.874425888061523, "global_step": 251583, "epoch": 3031} {"train_loss": -24.677141189575195, "global_step": 251584, "epoch": 3031} {"train_loss": -24.448225021362305, "global_step": 251585, "epoch": 3031} {"train_loss": -24.462966918945312, "global_step": 251586, "epoch": 3031} {"train_loss": -24.585538864135742, "global_step": 251587, "epoch": 3031} {"train_loss": -24.70119285583496, "global_step": 251588, "epoch": 3031} {"train_loss": -24.737136840820312, "global_step": 251589, "epoch": 3031} {"train_loss": -24.672483444213867, "global_step": 251590, "epoch": 3031} {"train_loss": -25.080188751220703, "global_step": 251591, "epoch": 3031} {"train_loss": -24.623794555664062, "global_step": 251592, "epoch": 3031} {"train_loss": -24.619535446166992, "global_step": 251593, "epoch": 3031} {"train_loss": -24.75692367553711, "global_step": 251594, "epoch": 3031} {"train_loss": -24.86620330810547, "global_step": 251595, "epoch": 3031} {"train_loss": -24.812849044799805, "global_step": 251596, "epoch": 3031} {"train_loss": -24.917877197265625, "global_step": 251597, "epoch": 3031} {"train_loss": -24.917512893676758, "global_step": 251598, "epoch": 3031} {"train_loss": -25.268985748291016, "global_step": 251599, "epoch": 3031} {"train_loss": -25.01747703552246, "global_step": 251600, "epoch": 3031} {"train_loss": -24.783950805664062, "global_step": 251601, "epoch": 3031} {"train_loss": -24.88556480407715, "global_step": 251602, "epoch": 3031} {"train_loss": -24.83728790283203, "global_step": 251603, "epoch": 3031} {"train_loss": -25.135696411132812, "global_step": 251604, "epoch": 3031} {"train_loss": -25.212261199951172, "global_step": 251605, "epoch": 3031} {"train_loss": -24.853851318359375, "global_step": 251606, "epoch": 3031} {"train_loss": -25.175251007080078, "global_step": 251607, "epoch": 3031} {"train_loss": -25.19826316833496, "global_step": 251608, "epoch": 3031} {"train_loss": -24.9434757232666, "global_step": 251609, "epoch": 3031} {"train_loss": -24.909854888916016, "global_step": 251610, "epoch": 3031} {"train_loss": -25.16218376159668, "global_step": 251611, "epoch": 3031} {"train_loss": -25.097822189331055, "global_step": 251612, "epoch": 3031} {"train_loss": -25.199352264404297, "global_step": 251613, "epoch": 3031} {"train_loss": -25.303852081298828, "global_step": 251614, "epoch": 3031} {"train_loss": -25.036884307861328, "global_step": 251615, "epoch": 3031} {"train_loss": -24.817625045776367, "global_step": 251616, "epoch": 3031} {"train_loss": -24.86995506286621, "global_step": 251617, "epoch": 3031} {"train_loss": -25.084409713745117, "global_step": 251618, "epoch": 3031} {"train_loss": -24.971582412719727, "global_step": 251619, "epoch": 3031} {"train_loss": -25.276588439941406, "global_step": 251620, "epoch": 3031} {"train_loss": -24.836763381958008, "global_step": 251621, "epoch": 3031} {"train_loss": -25.064823150634766, "global_step": 251622, "epoch": 3031} {"train_loss": -25.027908325195312, "global_step": 251623, "epoch": 3031} {"train_loss": -25.346942901611328, "global_step": 251624, "epoch": 3031} {"train_loss": -25.136337280273438, "global_step": 251625, "epoch": 3031} {"train_loss": -25.0700626373291, "global_step": 251626, "epoch": 3031} {"train_loss": -25.097715377807617, "global_step": 251627, "epoch": 3031} {"train_loss": -24.925519943237305, "global_step": 251628, "epoch": 3031} {"train_loss": -24.59253692626953, "global_step": 251629, "epoch": 3031} {"train_loss": -25.283832550048828, "global_step": 251630, "epoch": 3031} {"train_loss": -25.02951431274414, "global_step": 251631, "epoch": 3031} {"train_loss": -24.8737850189209, "global_step": 251632, "epoch": 3031} {"train_loss": -25.3341121673584, "global_step": 251633, "epoch": 3031} {"train_loss": -25.7612247467041, "global_step": 251634, "epoch": 3031} {"train_loss": -24.528507232666016, "global_step": 251635, "epoch": 3031} {"train_loss": -24.981061935424805, "global_step": 251636, "epoch": 3031} {"train_loss": -25.09962272644043, "global_step": 251637, "epoch": 3031} {"train_loss": -24.89182472229004, "global_step": 251638, "epoch": 3031} {"train_loss": -25.32920265197754, "global_step": 251639, "epoch": 3031} {"train_loss": -25.15520668029785, "global_step": 251640, "epoch": 3031} {"train_loss": -24.57969093322754, "global_step": 251641, "epoch": 3031} {"train_loss": -24.992321014404297, "global_step": 251642, "epoch": 3031} {"train_loss": -25.10048484802246, "global_step": 251643, "epoch": 3031} {"train_loss": -24.683340072631836, "global_step": 251644, "epoch": 3031} {"train_loss": -24.558792114257812, "global_step": 251645, "epoch": 3031} {"train_loss": -24.984722137451172, "global_step": 251646, "epoch": 3031} {"train_loss": -24.857816696166992, "global_step": 251647, "epoch": 3031} {"train_loss": -24.5269832611084, "global_step": 251648, "epoch": 3031} {"train_loss": -24.906461715698242, "global_step": 251649, "epoch": 3031} {"train_loss": -24.96969985961914, "global_step": 251650, "epoch": 3031} {"train_loss": -25.006336212158203, "global_step": 251651, "epoch": 3031} {"train_loss": -25.35888671875, "global_step": 251652, "epoch": 3031} {"train_loss": -25.011640548706055, "global_step": 251653, "epoch": 3031} {"train_loss": -24.863798141479492, "global_step": 251654, "epoch": 3031} {"train_loss": -24.829421836209583, "global_step": 251655, "epoch": 3031, "val_loss": 6939395.5} {"train_loss": -23.717134475708008, "global_step": 251656, "epoch": 3032} {"train_loss": -24.903797149658203, "global_step": 251657, "epoch": 3032} {"train_loss": -23.60560417175293, "global_step": 251658, "epoch": 3032} {"train_loss": -24.1324405670166, "global_step": 251659, "epoch": 3032} {"train_loss": -24.506765365600586, "global_step": 251660, "epoch": 3032} {"train_loss": -24.247289657592773, "global_step": 251661, "epoch": 3032} {"train_loss": -24.523883819580078, "global_step": 251662, "epoch": 3032} {"train_loss": -24.319074630737305, "global_step": 251663, "epoch": 3032} {"train_loss": -24.25011444091797, "global_step": 251664, "epoch": 3032} {"train_loss": -24.51946449279785, "global_step": 251665, "epoch": 3032} {"train_loss": -24.750152587890625, "global_step": 251666, "epoch": 3032} {"train_loss": -24.729917526245117, "global_step": 251667, "epoch": 3032} {"train_loss": -24.970081329345703, "global_step": 251668, "epoch": 3032} {"train_loss": -24.506567001342773, "global_step": 251669, "epoch": 3032} {"train_loss": -24.64735221862793, "global_step": 251670, "epoch": 3032} {"train_loss": -24.674640655517578, "global_step": 251671, "epoch": 3032} {"train_loss": -24.834558486938477, "global_step": 251672, "epoch": 3032} {"train_loss": -24.429935455322266, "global_step": 251673, "epoch": 3032} {"train_loss": -25.16096305847168, "global_step": 251674, "epoch": 3032} {"train_loss": -24.586313247680664, "global_step": 251675, "epoch": 3032} {"train_loss": -24.525299072265625, "global_step": 251676, "epoch": 3032} {"train_loss": -24.80840301513672, "global_step": 251677, "epoch": 3032} {"train_loss": -25.319944381713867, "global_step": 251678, "epoch": 3032} {"train_loss": -24.719717025756836, "global_step": 251679, "epoch": 3032} {"train_loss": -25.25311851501465, "global_step": 251680, "epoch": 3032} {"train_loss": -24.669591903686523, "global_step": 251681, "epoch": 3032} {"train_loss": -24.739614486694336, "global_step": 251682, "epoch": 3032} {"train_loss": -24.43857765197754, "global_step": 251683, "epoch": 3032} {"train_loss": -25.015756607055664, "global_step": 251684, "epoch": 3032} {"train_loss": -24.952539443969727, "global_step": 251685, "epoch": 3032} {"train_loss": -25.08124351501465, "global_step": 251686, "epoch": 3032} {"train_loss": -25.143835067749023, "global_step": 251687, "epoch": 3032} {"train_loss": -24.85732650756836, "global_step": 251688, "epoch": 3032} {"train_loss": -25.46156120300293, "global_step": 251689, "epoch": 3032} {"train_loss": -25.29451560974121, "global_step": 251690, "epoch": 3032} {"train_loss": -24.70225715637207, "global_step": 251691, "epoch": 3032} {"train_loss": -24.919816970825195, "global_step": 251692, "epoch": 3032} {"train_loss": -25.189451217651367, "global_step": 251693, "epoch": 3032} {"train_loss": -24.53432273864746, "global_step": 251694, "epoch": 3032} {"train_loss": -24.880329132080078, "global_step": 251695, "epoch": 3032} {"train_loss": -25.415374755859375, "global_step": 251696, "epoch": 3032} {"train_loss": -25.03610610961914, "global_step": 251697, "epoch": 3032} {"train_loss": -25.315826416015625, "global_step": 251698, "epoch": 3032} {"train_loss": -25.02510643005371, "global_step": 251699, "epoch": 3032} {"train_loss": -24.97509765625, "global_step": 251700, "epoch": 3032} {"train_loss": -25.11751937866211, "global_step": 251701, "epoch": 3032} {"train_loss": -25.06476593017578, "global_step": 251702, "epoch": 3032} {"train_loss": -25.299352645874023, "global_step": 251703, "epoch": 3032} {"train_loss": -24.680524826049805, "global_step": 251704, "epoch": 3032} {"train_loss": -25.102018356323242, "global_step": 251705, "epoch": 3032} {"train_loss": -24.813108444213867, "global_step": 251706, "epoch": 3032} {"train_loss": -24.891403198242188, "global_step": 251707, "epoch": 3032} {"train_loss": -25.14383888244629, "global_step": 251708, "epoch": 3032} {"train_loss": -25.4838924407959, "global_step": 251709, "epoch": 3032} {"train_loss": -25.283571243286133, "global_step": 251710, "epoch": 3032} {"train_loss": -25.20635223388672, "global_step": 251711, "epoch": 3032} {"train_loss": -25.225616455078125, "global_step": 251712, "epoch": 3032} {"train_loss": -25.306974411010742, "global_step": 251713, "epoch": 3032} {"train_loss": -25.053537368774414, "global_step": 251714, "epoch": 3032} {"train_loss": -24.93575096130371, "global_step": 251715, "epoch": 3032} {"train_loss": -24.87301254272461, "global_step": 251716, "epoch": 3032} {"train_loss": -25.063600540161133, "global_step": 251717, "epoch": 3032} {"train_loss": -25.237468719482422, "global_step": 251718, "epoch": 3032} {"train_loss": -25.344083786010742, "global_step": 251719, "epoch": 3032} {"train_loss": -25.125333786010742, "global_step": 251720, "epoch": 3032} {"train_loss": -25.03999137878418, "global_step": 251721, "epoch": 3032} {"train_loss": -25.230545043945312, "global_step": 251722, "epoch": 3032} {"train_loss": -24.970722198486328, "global_step": 251723, "epoch": 3032} {"train_loss": -24.805313110351562, "global_step": 251724, "epoch": 3032} {"train_loss": -24.79197120666504, "global_step": 251725, "epoch": 3032} {"train_loss": -25.256332397460938, "global_step": 251726, "epoch": 3032} {"train_loss": -25.012571334838867, "global_step": 251727, "epoch": 3032} {"train_loss": -25.104223251342773, "global_step": 251728, "epoch": 3032} {"train_loss": -25.240442276000977, "global_step": 251729, "epoch": 3032} {"train_loss": -24.816390991210938, "global_step": 251730, "epoch": 3032} {"train_loss": -25.074325561523438, "global_step": 251731, "epoch": 3032} {"train_loss": -25.008291244506836, "global_step": 251732, "epoch": 3032} {"train_loss": -25.000669479370117, "global_step": 251733, "epoch": 3032} {"train_loss": -25.33707046508789, "global_step": 251734, "epoch": 3032} {"train_loss": -25.339956283569336, "global_step": 251735, "epoch": 3032} {"train_loss": -24.885103225708008, "global_step": 251736, "epoch": 3032} {"train_loss": -24.94032096862793, "global_step": 251737, "epoch": 3032} {"train_loss": -24.91120343035962, "global_step": 251738, "epoch": 3032, "val_loss": 6959406.0} {"train_loss": -25.1179256439209, "global_step": 251739, "epoch": 3033} {"train_loss": -24.31300926208496, "global_step": 251740, "epoch": 3033} {"train_loss": -24.366147994995117, "global_step": 251741, "epoch": 3033} {"train_loss": -25.136220932006836, "global_step": 251742, "epoch": 3033} {"train_loss": -25.243722915649414, "global_step": 251743, "epoch": 3033} {"train_loss": -24.585786819458008, "global_step": 251744, "epoch": 3033} {"train_loss": -24.55010414123535, "global_step": 251745, "epoch": 3033} {"train_loss": -25.198795318603516, "global_step": 251746, "epoch": 3033} {"train_loss": -24.5035400390625, "global_step": 251747, "epoch": 3033} {"train_loss": -24.80159568786621, "global_step": 251748, "epoch": 3033} {"train_loss": -24.785682678222656, "global_step": 251749, "epoch": 3033} {"train_loss": -24.865943908691406, "global_step": 251750, "epoch": 3033} {"train_loss": -24.919654846191406, "global_step": 251751, "epoch": 3033} {"train_loss": -24.679006576538086, "global_step": 251752, "epoch": 3033} {"train_loss": -25.069074630737305, "global_step": 251753, "epoch": 3033} {"train_loss": -25.056629180908203, "global_step": 251754, "epoch": 3033} {"train_loss": -25.016138076782227, "global_step": 251755, "epoch": 3033} {"train_loss": -25.022794723510742, "global_step": 251756, "epoch": 3033} {"train_loss": -24.968381881713867, "global_step": 251757, "epoch": 3033} {"train_loss": -24.996240615844727, "global_step": 251758, "epoch": 3033} {"train_loss": -24.92165756225586, "global_step": 251759, "epoch": 3033} {"train_loss": -24.84101676940918, "global_step": 251760, "epoch": 3033} {"train_loss": -24.846092224121094, "global_step": 251761, "epoch": 3033} {"train_loss": -24.711488723754883, "global_step": 251762, "epoch": 3033} {"train_loss": -24.734607696533203, "global_step": 251763, "epoch": 3033} {"train_loss": -24.940780639648438, "global_step": 251764, "epoch": 3033} {"train_loss": -24.817861557006836, "global_step": 251765, "epoch": 3033} {"train_loss": -25.4454402923584, "global_step": 251766, "epoch": 3033} {"train_loss": -25.099340438842773, "global_step": 251767, "epoch": 3033} {"train_loss": -25.059188842773438, "global_step": 251768, "epoch": 3033} {"train_loss": -25.021883010864258, "global_step": 251769, "epoch": 3033} {"train_loss": -25.49201011657715, "global_step": 251770, "epoch": 3033} {"train_loss": -25.314050674438477, "global_step": 251771, "epoch": 3033} {"train_loss": -25.01704216003418, "global_step": 251772, "epoch": 3033} {"train_loss": -25.128915786743164, "global_step": 251773, "epoch": 3033} {"train_loss": -25.120628356933594, "global_step": 251774, "epoch": 3033} {"train_loss": -25.34903335571289, "global_step": 251775, "epoch": 3033} {"train_loss": -24.92388343811035, "global_step": 251776, "epoch": 3033} {"train_loss": -24.85877799987793, "global_step": 251777, "epoch": 3033} {"train_loss": -24.84221839904785, "global_step": 251778, "epoch": 3033} {"train_loss": -25.179479598999023, "global_step": 251779, "epoch": 3033} {"train_loss": -24.888137817382812, "global_step": 251780, "epoch": 3033} {"train_loss": -25.113998413085938, "global_step": 251781, "epoch": 3033} {"train_loss": -24.750070571899414, "global_step": 251782, "epoch": 3033} {"train_loss": -25.073217391967773, "global_step": 251783, "epoch": 3033} {"train_loss": -25.227062225341797, "global_step": 251784, "epoch": 3033} {"train_loss": -24.960010528564453, "global_step": 251785, "epoch": 3033} {"train_loss": -24.88791847229004, "global_step": 251786, "epoch": 3033} {"train_loss": -25.234189987182617, "global_step": 251787, "epoch": 3033} {"train_loss": -25.33609390258789, "global_step": 251788, "epoch": 3033} {"train_loss": -24.68021011352539, "global_step": 251789, "epoch": 3033} {"train_loss": -24.855138778686523, "global_step": 251790, "epoch": 3033} {"train_loss": -25.043203353881836, "global_step": 251791, "epoch": 3033} {"train_loss": -24.9841365814209, "global_step": 251792, "epoch": 3033} {"train_loss": -24.961408615112305, "global_step": 251793, "epoch": 3033} {"train_loss": -25.069015502929688, "global_step": 251794, "epoch": 3033} {"train_loss": -24.748981475830078, "global_step": 251795, "epoch": 3033} {"train_loss": -25.080514907836914, "global_step": 251796, "epoch": 3033} {"train_loss": -24.92566680908203, "global_step": 251797, "epoch": 3033} {"train_loss": -24.89527702331543, "global_step": 251798, "epoch": 3033} {"train_loss": -25.10383415222168, "global_step": 251799, "epoch": 3033} {"train_loss": -24.517597198486328, "global_step": 251800, "epoch": 3033} {"train_loss": -24.661577224731445, "global_step": 251801, "epoch": 3033} {"train_loss": -25.051984786987305, "global_step": 251802, "epoch": 3033} {"train_loss": -24.94708824157715, "global_step": 251803, "epoch": 3033} {"train_loss": -24.923131942749023, "global_step": 251804, "epoch": 3033} {"train_loss": -24.853666305541992, "global_step": 251805, "epoch": 3033} {"train_loss": -25.010746002197266, "global_step": 251806, "epoch": 3033} {"train_loss": -24.96919822692871, "global_step": 251807, "epoch": 3033} {"train_loss": -24.99997329711914, "global_step": 251808, "epoch": 3033} {"train_loss": -24.972959518432617, "global_step": 251809, "epoch": 3033} {"train_loss": -24.958179473876953, "global_step": 251810, "epoch": 3033} {"train_loss": -25.02259635925293, "global_step": 251811, "epoch": 3033} {"train_loss": -25.11031150817871, "global_step": 251812, "epoch": 3033} {"train_loss": -24.836973190307617, "global_step": 251813, "epoch": 3033} {"train_loss": -24.911874771118164, "global_step": 251814, "epoch": 3033} {"train_loss": -25.16408348083496, "global_step": 251815, "epoch": 3033} {"train_loss": -25.29096031188965, "global_step": 251816, "epoch": 3033} {"train_loss": -25.335073471069336, "global_step": 251817, "epoch": 3033} {"train_loss": -25.05125617980957, "global_step": 251818, "epoch": 3033} {"train_loss": -25.153152465820312, "global_step": 251819, "epoch": 3033} {"train_loss": -24.999956130981445, "global_step": 251820, "epoch": 3033} {"train_loss": -24.983174795127777, "global_step": 251821, "epoch": 3033, "val_loss": 6763493.0} {"train_loss": -24.50157928466797, "global_step": 251822, "epoch": 3034} {"train_loss": -24.515172958374023, "global_step": 251823, "epoch": 3034} {"train_loss": -25.248985290527344, "global_step": 251824, "epoch": 3034} {"train_loss": -24.48333168029785, "global_step": 251825, "epoch": 3034} {"train_loss": -24.349328994750977, "global_step": 251826, "epoch": 3034} {"train_loss": -24.649471282958984, "global_step": 251827, "epoch": 3034} {"train_loss": -24.884580612182617, "global_step": 251828, "epoch": 3034} {"train_loss": -24.5411376953125, "global_step": 251829, "epoch": 3034} {"train_loss": -25.11057472229004, "global_step": 251830, "epoch": 3034} {"train_loss": -24.79530143737793, "global_step": 251831, "epoch": 3034} {"train_loss": -24.856657028198242, "global_step": 251832, "epoch": 3034} {"train_loss": -24.624210357666016, "global_step": 251833, "epoch": 3034} {"train_loss": -24.629323959350586, "global_step": 251834, "epoch": 3034} {"train_loss": -24.747547149658203, "global_step": 251835, "epoch": 3034} {"train_loss": -24.956260681152344, "global_step": 251836, "epoch": 3034} {"train_loss": -24.688308715820312, "global_step": 251837, "epoch": 3034} {"train_loss": -24.732559204101562, "global_step": 251838, "epoch": 3034} {"train_loss": -25.084171295166016, "global_step": 251839, "epoch": 3034} {"train_loss": -25.05704116821289, "global_step": 251840, "epoch": 3034} {"train_loss": -25.13201904296875, "global_step": 251841, "epoch": 3034} {"train_loss": -25.31732177734375, "global_step": 251842, "epoch": 3034} {"train_loss": -24.849395751953125, "global_step": 251843, "epoch": 3034} {"train_loss": -25.265504837036133, "global_step": 251844, "epoch": 3034} {"train_loss": -24.986534118652344, "global_step": 251845, "epoch": 3034} {"train_loss": -25.034208297729492, "global_step": 251846, "epoch": 3034} {"train_loss": -24.43082618713379, "global_step": 251847, "epoch": 3034} {"train_loss": -25.038969039916992, "global_step": 251848, "epoch": 3034} {"train_loss": -25.350433349609375, "global_step": 251849, "epoch": 3034} {"train_loss": -24.96309471130371, "global_step": 251850, "epoch": 3034} {"train_loss": -24.87754249572754, "global_step": 251851, "epoch": 3034} {"train_loss": -25.137950897216797, "global_step": 251852, "epoch": 3034} {"train_loss": -25.015714645385742, "global_step": 251853, "epoch": 3034} {"train_loss": -25.088462829589844, "global_step": 251854, "epoch": 3034} {"train_loss": -25.320371627807617, "global_step": 251855, "epoch": 3034} {"train_loss": -25.055246353149414, "global_step": 251856, "epoch": 3034} {"train_loss": -25.325891494750977, "global_step": 251857, "epoch": 3034} {"train_loss": -24.71735954284668, "global_step": 251858, "epoch": 3034} {"train_loss": -24.867355346679688, "global_step": 251859, "epoch": 3034} {"train_loss": -25.03740882873535, "global_step": 251860, "epoch": 3034} {"train_loss": -24.95371437072754, "global_step": 251861, "epoch": 3034} {"train_loss": -24.689041137695312, "global_step": 251862, "epoch": 3034} {"train_loss": -24.93716812133789, "global_step": 251863, "epoch": 3034} {"train_loss": -25.34001350402832, "global_step": 251864, "epoch": 3034} {"train_loss": -24.769657135009766, "global_step": 251865, "epoch": 3034} {"train_loss": -25.03142738342285, "global_step": 251866, "epoch": 3034} {"train_loss": -25.201448440551758, "global_step": 251867, "epoch": 3034} {"train_loss": -25.430253982543945, "global_step": 251868, "epoch": 3034} {"train_loss": -24.76293182373047, "global_step": 251869, "epoch": 3034} {"train_loss": -24.686689376831055, "global_step": 251870, "epoch": 3034} {"train_loss": -25.029455184936523, "global_step": 251871, "epoch": 3034} {"train_loss": -24.837177276611328, "global_step": 251872, "epoch": 3034} {"train_loss": -24.475975036621094, "global_step": 251873, "epoch": 3034} {"train_loss": -24.875577926635742, "global_step": 251874, "epoch": 3034} {"train_loss": -24.848148345947266, "global_step": 251875, "epoch": 3034} {"train_loss": -25.13290786743164, "global_step": 251876, "epoch": 3034} {"train_loss": -24.883787155151367, "global_step": 251877, "epoch": 3034} {"train_loss": -25.050779342651367, "global_step": 251878, "epoch": 3034} {"train_loss": -25.065587997436523, "global_step": 251879, "epoch": 3034} {"train_loss": -25.270397186279297, "global_step": 251880, "epoch": 3034} {"train_loss": -25.269376754760742, "global_step": 251881, "epoch": 3034} {"train_loss": -25.420583724975586, "global_step": 251882, "epoch": 3034} {"train_loss": -24.959949493408203, "global_step": 251883, "epoch": 3034} {"train_loss": -24.673933029174805, "global_step": 251884, "epoch": 3034} {"train_loss": -25.293466567993164, "global_step": 251885, "epoch": 3034} {"train_loss": -24.845809936523438, "global_step": 251886, "epoch": 3034} {"train_loss": -24.54445457458496, "global_step": 251887, "epoch": 3034} {"train_loss": -24.784011840820312, "global_step": 251888, "epoch": 3034} {"train_loss": -24.865697860717773, "global_step": 251889, "epoch": 3034} {"train_loss": -25.05573844909668, "global_step": 251890, "epoch": 3034} {"train_loss": -25.093900680541992, "global_step": 251891, "epoch": 3034} {"train_loss": -24.767051696777344, "global_step": 251892, "epoch": 3034} {"train_loss": -25.073902130126953, "global_step": 251893, "epoch": 3034} {"train_loss": -24.852807998657227, "global_step": 251894, "epoch": 3034} {"train_loss": -24.962265014648438, "global_step": 251895, "epoch": 3034} {"train_loss": -25.25645637512207, "global_step": 251896, "epoch": 3034} {"train_loss": -24.951826095581055, "global_step": 251897, "epoch": 3034} {"train_loss": -25.04389762878418, "global_step": 251898, "epoch": 3034} {"train_loss": -24.9903564453125, "global_step": 251899, "epoch": 3034} {"train_loss": -24.846786499023438, "global_step": 251900, "epoch": 3034} {"train_loss": -25.311660766601562, "global_step": 251901, "epoch": 3034} {"train_loss": -24.854446411132812, "global_step": 251902, "epoch": 3034} {"train_loss": -25.366994857788086, "global_step": 251903, "epoch": 3034} {"train_loss": -24.967173472944513, "global_step": 251904, "epoch": 3034, "val_loss": 6876427.0} {"train_loss": -24.344501495361328, "global_step": 251905, "epoch": 3035} {"train_loss": -23.421855926513672, "global_step": 251906, "epoch": 3035} {"train_loss": -24.29951286315918, "global_step": 251907, "epoch": 3035} {"train_loss": -24.50898551940918, "global_step": 251908, "epoch": 3035} {"train_loss": -23.86085319519043, "global_step": 251909, "epoch": 3035} {"train_loss": -24.385953903198242, "global_step": 251910, "epoch": 3035} {"train_loss": -24.236539840698242, "global_step": 251911, "epoch": 3035} {"train_loss": -23.973939895629883, "global_step": 251912, "epoch": 3035} {"train_loss": -24.496173858642578, "global_step": 251913, "epoch": 3035} {"train_loss": -24.241744995117188, "global_step": 251914, "epoch": 3035} {"train_loss": -24.508756637573242, "global_step": 251915, "epoch": 3035} {"train_loss": -24.56143569946289, "global_step": 251916, "epoch": 3035} {"train_loss": -24.607328414916992, "global_step": 251917, "epoch": 3035} {"train_loss": -24.713363647460938, "global_step": 251918, "epoch": 3035} {"train_loss": -24.518522262573242, "global_step": 251919, "epoch": 3035} {"train_loss": -24.631366729736328, "global_step": 251920, "epoch": 3035} {"train_loss": -24.866161346435547, "global_step": 251921, "epoch": 3035} {"train_loss": -24.258634567260742, "global_step": 251922, "epoch": 3035} {"train_loss": -24.85089683532715, "global_step": 251923, "epoch": 3035} {"train_loss": -24.554874420166016, "global_step": 251924, "epoch": 3035} {"train_loss": -24.6335506439209, "global_step": 251925, "epoch": 3035} {"train_loss": -24.999155044555664, "global_step": 251926, "epoch": 3035} {"train_loss": -24.805667877197266, "global_step": 251927, "epoch": 3035} {"train_loss": -25.027639389038086, "global_step": 251928, "epoch": 3035} {"train_loss": -24.716054916381836, "global_step": 251929, "epoch": 3035} {"train_loss": -24.933778762817383, "global_step": 251930, "epoch": 3035} {"train_loss": -24.619787216186523, "global_step": 251931, "epoch": 3035} {"train_loss": -24.982357025146484, "global_step": 251932, "epoch": 3035} {"train_loss": -24.765653610229492, "global_step": 251933, "epoch": 3035} {"train_loss": -25.06050682067871, "global_step": 251934, "epoch": 3035} {"train_loss": -25.07616424560547, "global_step": 251935, "epoch": 3035} {"train_loss": -24.52839469909668, "global_step": 251936, "epoch": 3035} {"train_loss": -25.13688087463379, "global_step": 251937, "epoch": 3035} {"train_loss": -25.370616912841797, "global_step": 251938, "epoch": 3035} {"train_loss": -24.984540939331055, "global_step": 251939, "epoch": 3035} {"train_loss": -25.339704513549805, "global_step": 251940, "epoch": 3035} {"train_loss": -24.966495513916016, "global_step": 251941, "epoch": 3035} {"train_loss": -25.069915771484375, "global_step": 251942, "epoch": 3035} {"train_loss": -24.948808670043945, "global_step": 251943, "epoch": 3035} {"train_loss": -25.222623825073242, "global_step": 251944, "epoch": 3035} {"train_loss": -25.091032028198242, "global_step": 251945, "epoch": 3035} {"train_loss": -25.231586456298828, "global_step": 251946, "epoch": 3035} {"train_loss": -24.94837760925293, "global_step": 251947, "epoch": 3035} {"train_loss": -25.143939971923828, "global_step": 251948, "epoch": 3035} {"train_loss": -25.1453800201416, "global_step": 251949, "epoch": 3035} {"train_loss": -25.333621978759766, "global_step": 251950, "epoch": 3035} {"train_loss": -25.2391300201416, "global_step": 251951, "epoch": 3035} {"train_loss": -24.53590202331543, "global_step": 251952, "epoch": 3035} {"train_loss": -25.079391479492188, "global_step": 251953, "epoch": 3035} {"train_loss": -24.878515243530273, "global_step": 251954, "epoch": 3035} {"train_loss": -25.29205322265625, "global_step": 251955, "epoch": 3035} {"train_loss": -25.288373947143555, "global_step": 251956, "epoch": 3035} {"train_loss": -25.303691864013672, "global_step": 251957, "epoch": 3035} {"train_loss": -25.252599716186523, "global_step": 251958, "epoch": 3035} {"train_loss": -25.014869689941406, "global_step": 251959, "epoch": 3035} {"train_loss": -24.93914794921875, "global_step": 251960, "epoch": 3035} {"train_loss": -25.013572692871094, "global_step": 251961, "epoch": 3035} {"train_loss": -24.051666259765625, "global_step": 251962, "epoch": 3035} {"train_loss": -24.581214904785156, "global_step": 251963, "epoch": 3035} {"train_loss": -24.79831886291504, "global_step": 251964, "epoch": 3035} {"train_loss": -25.154794692993164, "global_step": 251965, "epoch": 3035} {"train_loss": -24.887964248657227, "global_step": 251966, "epoch": 3035} {"train_loss": -25.02867889404297, "global_step": 251967, "epoch": 3035} {"train_loss": -24.783414840698242, "global_step": 251968, "epoch": 3035} {"train_loss": -24.794662475585938, "global_step": 251969, "epoch": 3035} {"train_loss": -25.370500564575195, "global_step": 251970, "epoch": 3035} {"train_loss": -24.781768798828125, "global_step": 251971, "epoch": 3035} {"train_loss": -25.21475601196289, "global_step": 251972, "epoch": 3035} {"train_loss": -24.965696334838867, "global_step": 251973, "epoch": 3035} {"train_loss": -25.293867111206055, "global_step": 251974, "epoch": 3035} {"train_loss": -24.84789276123047, "global_step": 251975, "epoch": 3035} {"train_loss": -24.847143173217773, "global_step": 251976, "epoch": 3035} {"train_loss": -24.782087326049805, "global_step": 251977, "epoch": 3035} {"train_loss": -25.2011661529541, "global_step": 251978, "epoch": 3035} {"train_loss": -25.253921508789062, "global_step": 251979, "epoch": 3035} {"train_loss": -24.944639205932617, "global_step": 251980, "epoch": 3035} {"train_loss": -24.952960968017578, "global_step": 251981, "epoch": 3035} {"train_loss": -25.090383529663086, "global_step": 251982, "epoch": 3035} {"train_loss": -24.917566299438477, "global_step": 251983, "epoch": 3035} {"train_loss": -25.278867721557617, "global_step": 251984, "epoch": 3035} {"train_loss": -24.720157623291016, "global_step": 251985, "epoch": 3035} {"train_loss": -25.021411895751953, "global_step": 251986, "epoch": 3035} {"train_loss": -24.87213587473674, "global_step": 251987, "epoch": 3035, "val_loss": 6974153.0} {"train_loss": -24.659719467163086, "global_step": 251988, "epoch": 3036} {"train_loss": -24.696401596069336, "global_step": 251989, "epoch": 3036} {"train_loss": -24.829975128173828, "global_step": 251990, "epoch": 3036} {"train_loss": -24.691612243652344, "global_step": 251991, "epoch": 3036} {"train_loss": -24.72071647644043, "global_step": 251992, "epoch": 3036} {"train_loss": -24.650007247924805, "global_step": 251993, "epoch": 3036} {"train_loss": -24.81418800354004, "global_step": 251994, "epoch": 3036} {"train_loss": -24.30592918395996, "global_step": 251995, "epoch": 3036} {"train_loss": -24.308073043823242, "global_step": 251996, "epoch": 3036} {"train_loss": -24.64438819885254, "global_step": 251997, "epoch": 3036} {"train_loss": -24.5002498626709, "global_step": 251998, "epoch": 3036} {"train_loss": -24.7325382232666, "global_step": 251999, "epoch": 3036} {"train_loss": -25.229921340942383, "global_step": 252000, "epoch": 3036} {"train_loss": -25.038330078125, "global_step": 252001, "epoch": 3036} {"train_loss": -24.29843521118164, "global_step": 252002, "epoch": 3036} {"train_loss": -25.288976669311523, "global_step": 252003, "epoch": 3036} {"train_loss": -25.135589599609375, "global_step": 252004, "epoch": 3036} {"train_loss": -24.704214096069336, "global_step": 252005, "epoch": 3036} {"train_loss": -24.899627685546875, "global_step": 252006, "epoch": 3036} {"train_loss": -24.76094627380371, "global_step": 252007, "epoch": 3036} {"train_loss": -24.729406356811523, "global_step": 252008, "epoch": 3036} {"train_loss": -24.837203979492188, "global_step": 252009, "epoch": 3036} {"train_loss": -24.75714683532715, "global_step": 252010, "epoch": 3036} {"train_loss": -24.890783309936523, "global_step": 252011, "epoch": 3036} {"train_loss": -24.85611343383789, "global_step": 252012, "epoch": 3036} {"train_loss": -25.008594512939453, "global_step": 252013, "epoch": 3036} {"train_loss": -24.755237579345703, "global_step": 252014, "epoch": 3036} {"train_loss": -24.802265167236328, "global_step": 252015, "epoch": 3036} {"train_loss": -25.205087661743164, "global_step": 252016, "epoch": 3036} {"train_loss": -25.144287109375, "global_step": 252017, "epoch": 3036} {"train_loss": -25.005786895751953, "global_step": 252018, "epoch": 3036} {"train_loss": -24.889379501342773, "global_step": 252019, "epoch": 3036} {"train_loss": -25.155399322509766, "global_step": 252020, "epoch": 3036} {"train_loss": -24.8680477142334, "global_step": 252021, "epoch": 3036} {"train_loss": -25.043766021728516, "global_step": 252022, "epoch": 3036} {"train_loss": -25.199176788330078, "global_step": 252023, "epoch": 3036} {"train_loss": -25.035524368286133, "global_step": 252024, "epoch": 3036} {"train_loss": -24.859155654907227, "global_step": 252025, "epoch": 3036} {"train_loss": -25.39133644104004, "global_step": 252026, "epoch": 3036} {"train_loss": -24.679197311401367, "global_step": 252027, "epoch": 3036} {"train_loss": -25.172733306884766, "global_step": 252028, "epoch": 3036} {"train_loss": -24.962799072265625, "global_step": 252029, "epoch": 3036} {"train_loss": -25.177473068237305, "global_step": 252030, "epoch": 3036} {"train_loss": -24.783124923706055, "global_step": 252031, "epoch": 3036} {"train_loss": -25.08613395690918, "global_step": 252032, "epoch": 3036} {"train_loss": -24.566104888916016, "global_step": 252033, "epoch": 3036} {"train_loss": -25.038188934326172, "global_step": 252034, "epoch": 3036} {"train_loss": -25.374849319458008, "global_step": 252035, "epoch": 3036} {"train_loss": -24.856473922729492, "global_step": 252036, "epoch": 3036} {"train_loss": -24.53522300720215, "global_step": 252037, "epoch": 3036} {"train_loss": -25.147993087768555, "global_step": 252038, "epoch": 3036} {"train_loss": -25.120206832885742, "global_step": 252039, "epoch": 3036} {"train_loss": -24.65681266784668, "global_step": 252040, "epoch": 3036} {"train_loss": -24.83883285522461, "global_step": 252041, "epoch": 3036} {"train_loss": -25.169588088989258, "global_step": 252042, "epoch": 3036} {"train_loss": -25.05866813659668, "global_step": 252043, "epoch": 3036} {"train_loss": -24.90639877319336, "global_step": 252044, "epoch": 3036} {"train_loss": -24.790685653686523, "global_step": 252045, "epoch": 3036} {"train_loss": -24.92601203918457, "global_step": 252046, "epoch": 3036} {"train_loss": -25.2345027923584, "global_step": 252047, "epoch": 3036} {"train_loss": -25.00614356994629, "global_step": 252048, "epoch": 3036} {"train_loss": -24.842212677001953, "global_step": 252049, "epoch": 3036} {"train_loss": -24.82485008239746, "global_step": 252050, "epoch": 3036} {"train_loss": -24.71443748474121, "global_step": 252051, "epoch": 3036} {"train_loss": -25.05841636657715, "global_step": 252052, "epoch": 3036} {"train_loss": -25.100980758666992, "global_step": 252053, "epoch": 3036} {"train_loss": -24.749103546142578, "global_step": 252054, "epoch": 3036} {"train_loss": -25.024993896484375, "global_step": 252055, "epoch": 3036} {"train_loss": -24.90143585205078, "global_step": 252056, "epoch": 3036} {"train_loss": -24.750919342041016, "global_step": 252057, "epoch": 3036} {"train_loss": -24.740774154663086, "global_step": 252058, "epoch": 3036} {"train_loss": -25.0446834564209, "global_step": 252059, "epoch": 3036} {"train_loss": -25.026762008666992, "global_step": 252060, "epoch": 3036} {"train_loss": -25.29483413696289, "global_step": 252061, "epoch": 3036} {"train_loss": -24.85967445373535, "global_step": 252062, "epoch": 3036} {"train_loss": -24.949350357055664, "global_step": 252063, "epoch": 3036} {"train_loss": -25.03656005859375, "global_step": 252064, "epoch": 3036} {"train_loss": -24.875450134277344, "global_step": 252065, "epoch": 3036} {"train_loss": -25.24495506286621, "global_step": 252066, "epoch": 3036} {"train_loss": -24.973495483398438, "global_step": 252067, "epoch": 3036} {"train_loss": -25.091459274291992, "global_step": 252068, "epoch": 3036} {"train_loss": -25.408538818359375, "global_step": 252069, "epoch": 3036} {"train_loss": -24.90815086824348, "global_step": 252070, "epoch": 3036, "val_loss": 6921373.5} {"train_loss": -24.79102897644043, "global_step": 252071, "epoch": 3037} {"train_loss": -24.400310516357422, "global_step": 252072, "epoch": 3037} {"train_loss": -24.531278610229492, "global_step": 252073, "epoch": 3037} {"train_loss": -24.780744552612305, "global_step": 252074, "epoch": 3037} {"train_loss": -24.110422134399414, "global_step": 252075, "epoch": 3037} {"train_loss": -24.275541305541992, "global_step": 252076, "epoch": 3037} {"train_loss": -24.70450782775879, "global_step": 252077, "epoch": 3037} {"train_loss": -24.2083740234375, "global_step": 252078, "epoch": 3037} {"train_loss": -24.65962791442871, "global_step": 252079, "epoch": 3037} {"train_loss": -24.695758819580078, "global_step": 252080, "epoch": 3037} {"train_loss": -24.620410919189453, "global_step": 252081, "epoch": 3037} {"train_loss": -24.436595916748047, "global_step": 252082, "epoch": 3037} {"train_loss": -24.618955612182617, "global_step": 252083, "epoch": 3037} {"train_loss": -24.900415420532227, "global_step": 252084, "epoch": 3037} {"train_loss": -25.0439510345459, "global_step": 252085, "epoch": 3037} {"train_loss": -24.862173080444336, "global_step": 252086, "epoch": 3037} {"train_loss": -24.885303497314453, "global_step": 252087, "epoch": 3037} {"train_loss": -24.73914909362793, "global_step": 252088, "epoch": 3037} {"train_loss": -24.75723648071289, "global_step": 252089, "epoch": 3037} {"train_loss": -24.847654342651367, "global_step": 252090, "epoch": 3037} {"train_loss": -24.80415153503418, "global_step": 252091, "epoch": 3037} {"train_loss": -24.905176162719727, "global_step": 252092, "epoch": 3037} {"train_loss": -25.090381622314453, "global_step": 252093, "epoch": 3037} {"train_loss": -25.170488357543945, "global_step": 252094, "epoch": 3037} {"train_loss": -24.697851181030273, "global_step": 252095, "epoch": 3037} {"train_loss": -24.751352310180664, "global_step": 252096, "epoch": 3037} {"train_loss": -25.4596004486084, "global_step": 252097, "epoch": 3037} {"train_loss": -24.819196701049805, "global_step": 252098, "epoch": 3037} {"train_loss": -24.926982879638672, "global_step": 252099, "epoch": 3037} {"train_loss": -24.92122459411621, "global_step": 252100, "epoch": 3037} {"train_loss": -25.071256637573242, "global_step": 252101, "epoch": 3037} {"train_loss": -25.036083221435547, "global_step": 252102, "epoch": 3037} {"train_loss": -25.31417465209961, "global_step": 252103, "epoch": 3037} {"train_loss": -25.250452041625977, "global_step": 252104, "epoch": 3037} {"train_loss": -25.22416877746582, "global_step": 252105, "epoch": 3037} {"train_loss": -25.38776206970215, "global_step": 252106, "epoch": 3037} {"train_loss": -25.404394149780273, "global_step": 252107, "epoch": 3037} {"train_loss": -24.761083602905273, "global_step": 252108, "epoch": 3037} {"train_loss": -24.91590690612793, "global_step": 252109, "epoch": 3037} {"train_loss": -24.81475257873535, "global_step": 252110, "epoch": 3037} {"train_loss": -25.14802360534668, "global_step": 252111, "epoch": 3037} {"train_loss": -24.9935302734375, "global_step": 252112, "epoch": 3037} {"train_loss": -24.840551376342773, "global_step": 252113, "epoch": 3037} {"train_loss": -24.995813369750977, "global_step": 252114, "epoch": 3037} {"train_loss": -25.056177139282227, "global_step": 252115, "epoch": 3037} {"train_loss": -25.312971115112305, "global_step": 252116, "epoch": 3037} {"train_loss": -24.81284523010254, "global_step": 252117, "epoch": 3037} {"train_loss": -25.324766159057617, "global_step": 252118, "epoch": 3037} {"train_loss": -25.34914779663086, "global_step": 252119, "epoch": 3037} {"train_loss": -25.003408432006836, "global_step": 252120, "epoch": 3037} {"train_loss": -24.966188430786133, "global_step": 252121, "epoch": 3037} {"train_loss": -24.737558364868164, "global_step": 252122, "epoch": 3037} {"train_loss": -25.257795333862305, "global_step": 252123, "epoch": 3037} {"train_loss": -25.047388076782227, "global_step": 252124, "epoch": 3037} {"train_loss": -25.27088737487793, "global_step": 252125, "epoch": 3037} {"train_loss": -24.860797882080078, "global_step": 252126, "epoch": 3037} {"train_loss": -25.283140182495117, "global_step": 252127, "epoch": 3037} {"train_loss": -25.537857055664062, "global_step": 252128, "epoch": 3037} {"train_loss": -25.052764892578125, "global_step": 252129, "epoch": 3037} {"train_loss": -25.14005470275879, "global_step": 252130, "epoch": 3037} {"train_loss": -25.284250259399414, "global_step": 252131, "epoch": 3037} {"train_loss": -25.330081939697266, "global_step": 252132, "epoch": 3037} {"train_loss": -25.001405715942383, "global_step": 252133, "epoch": 3037} {"train_loss": -25.17927360534668, "global_step": 252134, "epoch": 3037} {"train_loss": -24.79279899597168, "global_step": 252135, "epoch": 3037} {"train_loss": -24.70566177368164, "global_step": 252136, "epoch": 3037} {"train_loss": -24.375181198120117, "global_step": 252137, "epoch": 3037} {"train_loss": -24.70921516418457, "global_step": 252138, "epoch": 3037} {"train_loss": -24.586387634277344, "global_step": 252139, "epoch": 3037} {"train_loss": -25.104333877563477, "global_step": 252140, "epoch": 3037} {"train_loss": -25.06953239440918, "global_step": 252141, "epoch": 3037} {"train_loss": -24.943166732788086, "global_step": 252142, "epoch": 3037} {"train_loss": -24.94109344482422, "global_step": 252143, "epoch": 3037} {"train_loss": -25.130023956298828, "global_step": 252144, "epoch": 3037} {"train_loss": -24.882221221923828, "global_step": 252145, "epoch": 3037} {"train_loss": -24.989654541015625, "global_step": 252146, "epoch": 3037} {"train_loss": -25.030149459838867, "global_step": 252147, "epoch": 3037} {"train_loss": -25.123193740844727, "global_step": 252148, "epoch": 3037} {"train_loss": -24.72644805908203, "global_step": 252149, "epoch": 3037} {"train_loss": -25.307920455932617, "global_step": 252150, "epoch": 3037} {"train_loss": -24.65643310546875, "global_step": 252151, "epoch": 3037} {"train_loss": -25.094615936279297, "global_step": 252152, "epoch": 3037} {"train_loss": -24.95478848376906, "global_step": 252153, "epoch": 3037, "val_loss": 6677752.5} {"train_loss": -24.533336639404297, "global_step": 252154, "epoch": 3038} {"train_loss": -24.218976974487305, "global_step": 252155, "epoch": 3038} {"train_loss": -24.50703239440918, "global_step": 252156, "epoch": 3038} {"train_loss": -24.477468490600586, "global_step": 252157, "epoch": 3038} {"train_loss": -24.488136291503906, "global_step": 252158, "epoch": 3038} {"train_loss": -24.323211669921875, "global_step": 252159, "epoch": 3038} {"train_loss": -24.802000045776367, "global_step": 252160, "epoch": 3038} {"train_loss": -24.61836814880371, "global_step": 252161, "epoch": 3038} {"train_loss": -24.3831729888916, "global_step": 252162, "epoch": 3038} {"train_loss": -24.83966064453125, "global_step": 252163, "epoch": 3038} {"train_loss": -24.570919036865234, "global_step": 252164, "epoch": 3038} {"train_loss": -24.406286239624023, "global_step": 252165, "epoch": 3038} {"train_loss": -24.70346450805664, "global_step": 252166, "epoch": 3038} {"train_loss": -24.7114315032959, "global_step": 252167, "epoch": 3038} {"train_loss": -24.829330444335938, "global_step": 252168, "epoch": 3038} {"train_loss": -24.57503318786621, "global_step": 252169, "epoch": 3038} {"train_loss": -25.05205726623535, "global_step": 252170, "epoch": 3038} {"train_loss": -24.55409812927246, "global_step": 252171, "epoch": 3038} {"train_loss": -24.96382713317871, "global_step": 252172, "epoch": 3038} {"train_loss": -24.784500122070312, "global_step": 252173, "epoch": 3038} {"train_loss": -24.725366592407227, "global_step": 252174, "epoch": 3038} {"train_loss": -25.1444091796875, "global_step": 252175, "epoch": 3038} {"train_loss": -24.958757400512695, "global_step": 252176, "epoch": 3038} {"train_loss": -24.974470138549805, "global_step": 252177, "epoch": 3038} {"train_loss": -24.748498916625977, "global_step": 252178, "epoch": 3038} {"train_loss": -24.97910499572754, "global_step": 252179, "epoch": 3038} {"train_loss": -25.01642417907715, "global_step": 252180, "epoch": 3038} {"train_loss": -24.699209213256836, "global_step": 252181, "epoch": 3038} {"train_loss": -25.162620544433594, "global_step": 252182, "epoch": 3038} {"train_loss": -25.171463012695312, "global_step": 252183, "epoch": 3038} {"train_loss": -24.868371963500977, "global_step": 252184, "epoch": 3038} {"train_loss": -25.16032600402832, "global_step": 252185, "epoch": 3038} {"train_loss": -24.708654403686523, "global_step": 252186, "epoch": 3038} {"train_loss": -24.975881576538086, "global_step": 252187, "epoch": 3038} {"train_loss": -25.302597045898438, "global_step": 252188, "epoch": 3038} {"train_loss": -24.947128295898438, "global_step": 252189, "epoch": 3038} {"train_loss": -24.869144439697266, "global_step": 252190, "epoch": 3038} {"train_loss": -25.0919132232666, "global_step": 252191, "epoch": 3038} {"train_loss": -25.313098907470703, "global_step": 252192, "epoch": 3038} {"train_loss": -25.122196197509766, "global_step": 252193, "epoch": 3038} {"train_loss": -25.01156997680664, "global_step": 252194, "epoch": 3038} {"train_loss": -25.130796432495117, "global_step": 252195, "epoch": 3038} {"train_loss": -25.24824333190918, "global_step": 252196, "epoch": 3038} {"train_loss": -25.18747901916504, "global_step": 252197, "epoch": 3038} {"train_loss": -25.11618423461914, "global_step": 252198, "epoch": 3038} {"train_loss": -24.733362197875977, "global_step": 252199, "epoch": 3038} {"train_loss": -24.858448028564453, "global_step": 252200, "epoch": 3038} {"train_loss": -25.47182846069336, "global_step": 252201, "epoch": 3038} {"train_loss": -25.02459716796875, "global_step": 252202, "epoch": 3038} {"train_loss": -25.163686752319336, "global_step": 252203, "epoch": 3038} {"train_loss": -25.0806827545166, "global_step": 252204, "epoch": 3038} {"train_loss": -25.095218658447266, "global_step": 252205, "epoch": 3038} {"train_loss": -25.575550079345703, "global_step": 252206, "epoch": 3038} {"train_loss": -25.14253044128418, "global_step": 252207, "epoch": 3038} {"train_loss": -25.09491729736328, "global_step": 252208, "epoch": 3038} {"train_loss": -24.79282569885254, "global_step": 252209, "epoch": 3038} {"train_loss": -24.82496452331543, "global_step": 252210, "epoch": 3038} {"train_loss": -25.454618453979492, "global_step": 252211, "epoch": 3038} {"train_loss": -25.119403839111328, "global_step": 252212, "epoch": 3038} {"train_loss": -25.007125854492188, "global_step": 252213, "epoch": 3038} {"train_loss": -25.09632682800293, "global_step": 252214, "epoch": 3038} {"train_loss": -24.90663719177246, "global_step": 252215, "epoch": 3038} {"train_loss": -24.65439224243164, "global_step": 252216, "epoch": 3038} {"train_loss": -25.288084030151367, "global_step": 252217, "epoch": 3038} {"train_loss": -25.184341430664062, "global_step": 252218, "epoch": 3038} {"train_loss": -25.289535522460938, "global_step": 252219, "epoch": 3038} {"train_loss": -25.047840118408203, "global_step": 252220, "epoch": 3038} {"train_loss": -25.188379287719727, "global_step": 252221, "epoch": 3038} {"train_loss": -25.02070426940918, "global_step": 252222, "epoch": 3038} {"train_loss": -25.117328643798828, "global_step": 252223, "epoch": 3038} {"train_loss": -25.116971969604492, "global_step": 252224, "epoch": 3038} {"train_loss": -25.323240280151367, "global_step": 252225, "epoch": 3038} {"train_loss": -25.048561096191406, "global_step": 252226, "epoch": 3038} {"train_loss": -25.29606056213379, "global_step": 252227, "epoch": 3038} {"train_loss": -25.21038818359375, "global_step": 252228, "epoch": 3038} {"train_loss": -25.24513053894043, "global_step": 252229, "epoch": 3038} {"train_loss": -24.598941802978516, "global_step": 252230, "epoch": 3038} {"train_loss": -24.77754783630371, "global_step": 252231, "epoch": 3038} {"train_loss": -25.173114776611328, "global_step": 252232, "epoch": 3038} {"train_loss": -25.37479591369629, "global_step": 252233, "epoch": 3038} {"train_loss": -25.116979598999023, "global_step": 252234, "epoch": 3038} {"train_loss": -25.155187606811523, "global_step": 252235, "epoch": 3038} {"train_loss": -24.96199520524726, "global_step": 252236, "epoch": 3038, "val_loss": 6905621.5} {"train_loss": -24.418689727783203, "global_step": 252237, "epoch": 3039} {"train_loss": -24.06279945373535, "global_step": 252238, "epoch": 3039} {"train_loss": -24.81383514404297, "global_step": 252239, "epoch": 3039} {"train_loss": -24.209928512573242, "global_step": 252240, "epoch": 3039} {"train_loss": -24.579809188842773, "global_step": 252241, "epoch": 3039} {"train_loss": -24.982542037963867, "global_step": 252242, "epoch": 3039} {"train_loss": -24.52203941345215, "global_step": 252243, "epoch": 3039} {"train_loss": -24.649106979370117, "global_step": 252244, "epoch": 3039} {"train_loss": -24.819387435913086, "global_step": 252245, "epoch": 3039} {"train_loss": -24.873872756958008, "global_step": 252246, "epoch": 3039} {"train_loss": -24.592947006225586, "global_step": 252247, "epoch": 3039} {"train_loss": -24.885847091674805, "global_step": 252248, "epoch": 3039} {"train_loss": -24.85948944091797, "global_step": 252249, "epoch": 3039} {"train_loss": -24.75128746032715, "global_step": 252250, "epoch": 3039} {"train_loss": -24.97275733947754, "global_step": 252251, "epoch": 3039} {"train_loss": -25.011545181274414, "global_step": 252252, "epoch": 3039} {"train_loss": -24.974172592163086, "global_step": 252253, "epoch": 3039} {"train_loss": -24.960142135620117, "global_step": 252254, "epoch": 3039} {"train_loss": -24.747255325317383, "global_step": 252255, "epoch": 3039} {"train_loss": -24.940488815307617, "global_step": 252256, "epoch": 3039} {"train_loss": -24.55938720703125, "global_step": 252257, "epoch": 3039} {"train_loss": -24.91948890686035, "global_step": 252258, "epoch": 3039} {"train_loss": -25.02433204650879, "global_step": 252259, "epoch": 3039} {"train_loss": -25.10731315612793, "global_step": 252260, "epoch": 3039} {"train_loss": -24.69866180419922, "global_step": 252261, "epoch": 3039} {"train_loss": -24.876541137695312, "global_step": 252262, "epoch": 3039} {"train_loss": -25.364273071289062, "global_step": 252263, "epoch": 3039} {"train_loss": -25.190460205078125, "global_step": 252264, "epoch": 3039} {"train_loss": -25.12537956237793, "global_step": 252265, "epoch": 3039} {"train_loss": -25.11610984802246, "global_step": 252266, "epoch": 3039} {"train_loss": -25.03986930847168, "global_step": 252267, "epoch": 3039} {"train_loss": -25.113142013549805, "global_step": 252268, "epoch": 3039} {"train_loss": -25.49770164489746, "global_step": 252269, "epoch": 3039} {"train_loss": -25.3354434967041, "global_step": 252270, "epoch": 3039} {"train_loss": -25.086387634277344, "global_step": 252271, "epoch": 3039} {"train_loss": -25.295307159423828, "global_step": 252272, "epoch": 3039} {"train_loss": -24.9960994720459, "global_step": 252273, "epoch": 3039} {"train_loss": -24.92267608642578, "global_step": 252274, "epoch": 3039} {"train_loss": -24.760053634643555, "global_step": 252275, "epoch": 3039} {"train_loss": -25.12150001525879, "global_step": 252276, "epoch": 3039} {"train_loss": -25.368789672851562, "global_step": 252277, "epoch": 3039} {"train_loss": -24.951904296875, "global_step": 252278, "epoch": 3039} {"train_loss": -25.078927993774414, "global_step": 252279, "epoch": 3039} {"train_loss": -24.66353416442871, "global_step": 252280, "epoch": 3039} {"train_loss": -25.243228912353516, "global_step": 252281, "epoch": 3039} {"train_loss": -25.296972274780273, "global_step": 252282, "epoch": 3039} {"train_loss": -24.801233291625977, "global_step": 252283, "epoch": 3039} {"train_loss": -25.36552619934082, "global_step": 252284, "epoch": 3039} {"train_loss": -25.175838470458984, "global_step": 252285, "epoch": 3039} {"train_loss": -24.89734649658203, "global_step": 252286, "epoch": 3039} {"train_loss": -25.08295249938965, "global_step": 252287, "epoch": 3039} {"train_loss": -25.198535919189453, "global_step": 252288, "epoch": 3039} {"train_loss": -24.967321395874023, "global_step": 252289, "epoch": 3039} {"train_loss": -25.204504013061523, "global_step": 252290, "epoch": 3039} {"train_loss": -24.940738677978516, "global_step": 252291, "epoch": 3039} {"train_loss": -25.024852752685547, "global_step": 252292, "epoch": 3039} {"train_loss": -24.863262176513672, "global_step": 252293, "epoch": 3039} {"train_loss": -24.87528419494629, "global_step": 252294, "epoch": 3039} {"train_loss": -25.355958938598633, "global_step": 252295, "epoch": 3039} {"train_loss": -25.157123565673828, "global_step": 252296, "epoch": 3039} {"train_loss": -25.091293334960938, "global_step": 252297, "epoch": 3039} {"train_loss": -24.7716007232666, "global_step": 252298, "epoch": 3039} {"train_loss": -25.016345977783203, "global_step": 252299, "epoch": 3039} {"train_loss": -24.883684158325195, "global_step": 252300, "epoch": 3039} {"train_loss": -25.286975860595703, "global_step": 252301, "epoch": 3039} {"train_loss": -25.123777389526367, "global_step": 252302, "epoch": 3039} {"train_loss": -25.30672836303711, "global_step": 252303, "epoch": 3039} {"train_loss": -24.843969345092773, "global_step": 252304, "epoch": 3039} {"train_loss": -25.025577545166016, "global_step": 252305, "epoch": 3039} {"train_loss": -25.4431209564209, "global_step": 252306, "epoch": 3039} {"train_loss": -25.199018478393555, "global_step": 252307, "epoch": 3039} {"train_loss": -25.161161422729492, "global_step": 252308, "epoch": 3039} {"train_loss": -25.275163650512695, "global_step": 252309, "epoch": 3039} {"train_loss": -24.752347946166992, "global_step": 252310, "epoch": 3039} {"train_loss": -25.1729736328125, "global_step": 252311, "epoch": 3039} {"train_loss": -25.02848243713379, "global_step": 252312, "epoch": 3039} {"train_loss": -25.17165184020996, "global_step": 252313, "epoch": 3039} {"train_loss": -24.712234497070312, "global_step": 252314, "epoch": 3039} {"train_loss": -24.928791046142578, "global_step": 252315, "epoch": 3039} {"train_loss": -24.782154083251953, "global_step": 252316, "epoch": 3039} {"train_loss": -25.494335174560547, "global_step": 252317, "epoch": 3039} {"train_loss": -24.592975616455078, "global_step": 252318, "epoch": 3039} {"train_loss": -24.99706658972315, "global_step": 252319, "epoch": 3039, "val_loss": 6805896.0} {"train_loss": -23.73054313659668, "global_step": 252320, "epoch": 3040} {"train_loss": -24.409503936767578, "global_step": 252321, "epoch": 3040} {"train_loss": -24.386682510375977, "global_step": 252322, "epoch": 3040} {"train_loss": -24.328489303588867, "global_step": 252323, "epoch": 3040} {"train_loss": -24.343568801879883, "global_step": 252324, "epoch": 3040} {"train_loss": -24.57187843322754, "global_step": 252325, "epoch": 3040} {"train_loss": -24.725751876831055, "global_step": 252326, "epoch": 3040} {"train_loss": -24.32908058166504, "global_step": 252327, "epoch": 3040} {"train_loss": -24.302738189697266, "global_step": 252328, "epoch": 3040} {"train_loss": -24.633085250854492, "global_step": 252329, "epoch": 3040} {"train_loss": -24.265775680541992, "global_step": 252330, "epoch": 3040} {"train_loss": -24.562732696533203, "global_step": 252331, "epoch": 3040} {"train_loss": -24.50506019592285, "global_step": 252332, "epoch": 3040} {"train_loss": -24.77293586730957, "global_step": 252333, "epoch": 3040} {"train_loss": -24.8553524017334, "global_step": 252334, "epoch": 3040} {"train_loss": -24.473541259765625, "global_step": 252335, "epoch": 3040} {"train_loss": -24.686065673828125, "global_step": 252336, "epoch": 3040} {"train_loss": -24.94331169128418, "global_step": 252337, "epoch": 3040} {"train_loss": -24.52556610107422, "global_step": 252338, "epoch": 3040} {"train_loss": -24.620380401611328, "global_step": 252339, "epoch": 3040} {"train_loss": -25.160232543945312, "global_step": 252340, "epoch": 3040} {"train_loss": -24.75190544128418, "global_step": 252341, "epoch": 3040} {"train_loss": -24.540090560913086, "global_step": 252342, "epoch": 3040} {"train_loss": -24.49698829650879, "global_step": 252343, "epoch": 3040} {"train_loss": -24.785192489624023, "global_step": 252344, "epoch": 3040} {"train_loss": -24.829010009765625, "global_step": 252345, "epoch": 3040} {"train_loss": -25.057844161987305, "global_step": 252346, "epoch": 3040} {"train_loss": -24.88358497619629, "global_step": 252347, "epoch": 3040} {"train_loss": -24.956022262573242, "global_step": 252348, "epoch": 3040} {"train_loss": -24.88690948486328, "global_step": 252349, "epoch": 3040} {"train_loss": -24.86815643310547, "global_step": 252350, "epoch": 3040} {"train_loss": -24.724746704101562, "global_step": 252351, "epoch": 3040} {"train_loss": -24.93977928161621, "global_step": 252352, "epoch": 3040} {"train_loss": -25.121545791625977, "global_step": 252353, "epoch": 3040} {"train_loss": -24.817289352416992, "global_step": 252354, "epoch": 3040} {"train_loss": -24.945362091064453, "global_step": 252355, "epoch": 3040} {"train_loss": -25.0604248046875, "global_step": 252356, "epoch": 3040} {"train_loss": -25.02906608581543, "global_step": 252357, "epoch": 3040} {"train_loss": -25.178152084350586, "global_step": 252358, "epoch": 3040} {"train_loss": -25.14033317565918, "global_step": 252359, "epoch": 3040} {"train_loss": -25.078969955444336, "global_step": 252360, "epoch": 3040} {"train_loss": -25.247894287109375, "global_step": 252361, "epoch": 3040} {"train_loss": -25.324201583862305, "global_step": 252362, "epoch": 3040} {"train_loss": -25.085742950439453, "global_step": 252363, "epoch": 3040} {"train_loss": -25.584930419921875, "global_step": 252364, "epoch": 3040} {"train_loss": -25.02195930480957, "global_step": 252365, "epoch": 3040} {"train_loss": -25.09198760986328, "global_step": 252366, "epoch": 3040} {"train_loss": -25.313756942749023, "global_step": 252367, "epoch": 3040} {"train_loss": -24.960708618164062, "global_step": 252368, "epoch": 3040} {"train_loss": -25.537460327148438, "global_step": 252369, "epoch": 3040} {"train_loss": -25.25498390197754, "global_step": 252370, "epoch": 3040} {"train_loss": -25.19316864013672, "global_step": 252371, "epoch": 3040} {"train_loss": -24.72916603088379, "global_step": 252372, "epoch": 3040} {"train_loss": -24.631086349487305, "global_step": 252373, "epoch": 3040} {"train_loss": -25.046545028686523, "global_step": 252374, "epoch": 3040} {"train_loss": -25.023073196411133, "global_step": 252375, "epoch": 3040} {"train_loss": -25.03693962097168, "global_step": 252376, "epoch": 3040} {"train_loss": -24.63046646118164, "global_step": 252377, "epoch": 3040} {"train_loss": -24.990894317626953, "global_step": 252378, "epoch": 3040} {"train_loss": -24.935199737548828, "global_step": 252379, "epoch": 3040} {"train_loss": -24.831106185913086, "global_step": 252380, "epoch": 3040} {"train_loss": -25.163503646850586, "global_step": 252381, "epoch": 3040} {"train_loss": -24.89558219909668, "global_step": 252382, "epoch": 3040} {"train_loss": -25.22334861755371, "global_step": 252383, "epoch": 3040} {"train_loss": -25.209150314331055, "global_step": 252384, "epoch": 3040} {"train_loss": -25.07647132873535, "global_step": 252385, "epoch": 3040} {"train_loss": -25.463661193847656, "global_step": 252386, "epoch": 3040} {"train_loss": -25.4197940826416, "global_step": 252387, "epoch": 3040} {"train_loss": -25.0842227935791, "global_step": 252388, "epoch": 3040} {"train_loss": -25.20876693725586, "global_step": 252389, "epoch": 3040} {"train_loss": -25.118452072143555, "global_step": 252390, "epoch": 3040} {"train_loss": -24.57465171813965, "global_step": 252391, "epoch": 3040} {"train_loss": -24.980758666992188, "global_step": 252392, "epoch": 3040} {"train_loss": -25.053455352783203, "global_step": 252393, "epoch": 3040} {"train_loss": -25.118993759155273, "global_step": 252394, "epoch": 3040} {"train_loss": -25.206438064575195, "global_step": 252395, "epoch": 3040} {"train_loss": -25.15592384338379, "global_step": 252396, "epoch": 3040} {"train_loss": -24.921110153198242, "global_step": 252397, "epoch": 3040} {"train_loss": -25.089292526245117, "global_step": 252398, "epoch": 3040} {"train_loss": -25.13323974609375, "global_step": 252399, "epoch": 3040} {"train_loss": -24.785612106323242, "global_step": 252400, "epoch": 3040} {"train_loss": -25.18343162536621, "global_step": 252401, "epoch": 3040} {"train_loss": -24.904701669532134, "global_step": 252402, "epoch": 3040, "val_loss": 6857867.0} {"train_loss": -24.71302604675293, "global_step": 252403, "epoch": 3041} {"train_loss": -24.853843688964844, "global_step": 252404, "epoch": 3041} {"train_loss": -24.952560424804688, "global_step": 252405, "epoch": 3041} {"train_loss": -24.797252655029297, "global_step": 252406, "epoch": 3041} {"train_loss": -24.383087158203125, "global_step": 252407, "epoch": 3041} {"train_loss": -24.87748146057129, "global_step": 252408, "epoch": 3041} {"train_loss": -24.816003799438477, "global_step": 252409, "epoch": 3041} {"train_loss": -24.547183990478516, "global_step": 252410, "epoch": 3041} {"train_loss": -25.005624771118164, "global_step": 252411, "epoch": 3041} {"train_loss": -24.73221778869629, "global_step": 252412, "epoch": 3041} {"train_loss": -24.89767837524414, "global_step": 252413, "epoch": 3041} {"train_loss": -24.826047897338867, "global_step": 252414, "epoch": 3041} {"train_loss": -25.210424423217773, "global_step": 252415, "epoch": 3041} {"train_loss": -25.341642379760742, "global_step": 252416, "epoch": 3041} {"train_loss": -25.18602180480957, "global_step": 252417, "epoch": 3041} {"train_loss": -24.90654945373535, "global_step": 252418, "epoch": 3041} {"train_loss": -25.057506561279297, "global_step": 252419, "epoch": 3041} {"train_loss": -24.7857608795166, "global_step": 252420, "epoch": 3041} {"train_loss": -25.08392906188965, "global_step": 252421, "epoch": 3041} {"train_loss": -25.05280876159668, "global_step": 252422, "epoch": 3041} {"train_loss": -25.225584030151367, "global_step": 252423, "epoch": 3041} {"train_loss": -25.002817153930664, "global_step": 252424, "epoch": 3041} {"train_loss": -25.252290725708008, "global_step": 252425, "epoch": 3041} {"train_loss": -25.252552032470703, "global_step": 252426, "epoch": 3041} {"train_loss": -24.872068405151367, "global_step": 252427, "epoch": 3041} {"train_loss": -25.049213409423828, "global_step": 252428, "epoch": 3041} {"train_loss": -25.387975692749023, "global_step": 252429, "epoch": 3041} {"train_loss": -25.523515701293945, "global_step": 252430, "epoch": 3041} {"train_loss": -24.54654312133789, "global_step": 252431, "epoch": 3041} {"train_loss": -25.019804000854492, "global_step": 252432, "epoch": 3041} {"train_loss": -24.615434646606445, "global_step": 252433, "epoch": 3041} {"train_loss": -25.1069278717041, "global_step": 252434, "epoch": 3041} {"train_loss": -24.930036544799805, "global_step": 252435, "epoch": 3041} {"train_loss": -24.80413818359375, "global_step": 252436, "epoch": 3041} {"train_loss": -25.012670516967773, "global_step": 252437, "epoch": 3041} {"train_loss": -24.64853858947754, "global_step": 252438, "epoch": 3041} {"train_loss": -25.11608123779297, "global_step": 252439, "epoch": 3041} {"train_loss": -24.488052368164062, "global_step": 252440, "epoch": 3041} {"train_loss": -25.06812858581543, "global_step": 252441, "epoch": 3041} {"train_loss": -24.977144241333008, "global_step": 252442, "epoch": 3041} {"train_loss": -25.260629653930664, "global_step": 252443, "epoch": 3041} {"train_loss": -24.719425201416016, "global_step": 252444, "epoch": 3041} {"train_loss": -24.774015426635742, "global_step": 252445, "epoch": 3041} {"train_loss": -24.819360733032227, "global_step": 252446, "epoch": 3041} {"train_loss": -25.024534225463867, "global_step": 252447, "epoch": 3041} {"train_loss": -25.130090713500977, "global_step": 252448, "epoch": 3041} {"train_loss": -24.821386337280273, "global_step": 252449, "epoch": 3041} {"train_loss": -25.21857261657715, "global_step": 252450, "epoch": 3041} {"train_loss": -25.183135986328125, "global_step": 252451, "epoch": 3041} {"train_loss": -24.954023361206055, "global_step": 252452, "epoch": 3041} {"train_loss": -24.7972469329834, "global_step": 252453, "epoch": 3041} {"train_loss": -25.196857452392578, "global_step": 252454, "epoch": 3041} {"train_loss": -24.683231353759766, "global_step": 252455, "epoch": 3041} {"train_loss": -24.47224235534668, "global_step": 252456, "epoch": 3041} {"train_loss": -24.798093795776367, "global_step": 252457, "epoch": 3041} {"train_loss": -25.154081344604492, "global_step": 252458, "epoch": 3041} {"train_loss": -24.435184478759766, "global_step": 252459, "epoch": 3041} {"train_loss": -25.217525482177734, "global_step": 252460, "epoch": 3041} {"train_loss": -25.064207077026367, "global_step": 252461, "epoch": 3041} {"train_loss": -25.026355743408203, "global_step": 252462, "epoch": 3041} {"train_loss": -25.092626571655273, "global_step": 252463, "epoch": 3041} {"train_loss": -25.099157333374023, "global_step": 252464, "epoch": 3041} {"train_loss": -25.060590744018555, "global_step": 252465, "epoch": 3041} {"train_loss": -24.99258804321289, "global_step": 252466, "epoch": 3041} {"train_loss": -24.5835018157959, "global_step": 252467, "epoch": 3041} {"train_loss": -25.13277816772461, "global_step": 252468, "epoch": 3041} {"train_loss": -25.4272518157959, "global_step": 252469, "epoch": 3041} {"train_loss": -25.336362838745117, "global_step": 252470, "epoch": 3041} {"train_loss": -25.1638126373291, "global_step": 252471, "epoch": 3041} {"train_loss": -25.19146728515625, "global_step": 252472, "epoch": 3041} {"train_loss": -25.385028839111328, "global_step": 252473, "epoch": 3041} {"train_loss": -25.39584732055664, "global_step": 252474, "epoch": 3041} {"train_loss": -25.121902465820312, "global_step": 252475, "epoch": 3041} {"train_loss": -25.181598663330078, "global_step": 252476, "epoch": 3041} {"train_loss": -25.15326499938965, "global_step": 252477, "epoch": 3041} {"train_loss": -25.24648094177246, "global_step": 252478, "epoch": 3041} {"train_loss": -25.278284072875977, "global_step": 252479, "epoch": 3041} {"train_loss": -25.216053009033203, "global_step": 252480, "epoch": 3041} {"train_loss": -25.192508697509766, "global_step": 252481, "epoch": 3041} {"train_loss": -25.07858657836914, "global_step": 252482, "epoch": 3041} {"train_loss": -25.340604782104492, "global_step": 252483, "epoch": 3041} {"train_loss": -25.120054244995117, "global_step": 252484, "epoch": 3041} {"train_loss": -25.018568705363446, "global_step": 252485, "epoch": 3041, "val_loss": 6811102.0} {"train_loss": -24.618253707885742, "global_step": 252486, "epoch": 3042} {"train_loss": -25.142383575439453, "global_step": 252487, "epoch": 3042} {"train_loss": -24.905370712280273, "global_step": 252488, "epoch": 3042} {"train_loss": -25.198217391967773, "global_step": 252489, "epoch": 3042} {"train_loss": -24.720129013061523, "global_step": 252490, "epoch": 3042} {"train_loss": -25.034759521484375, "global_step": 252491, "epoch": 3042} {"train_loss": -24.569820404052734, "global_step": 252492, "epoch": 3042} {"train_loss": -24.87589454650879, "global_step": 252493, "epoch": 3042} {"train_loss": -24.15228271484375, "global_step": 252494, "epoch": 3042} {"train_loss": -23.81396484375, "global_step": 252495, "epoch": 3042} {"train_loss": -24.019439697265625, "global_step": 252496, "epoch": 3042} {"train_loss": -24.712217330932617, "global_step": 252497, "epoch": 3042} {"train_loss": -24.679590225219727, "global_step": 252498, "epoch": 3042} {"train_loss": -24.287429809570312, "global_step": 252499, "epoch": 3042} {"train_loss": -24.66377067565918, "global_step": 252500, "epoch": 3042} {"train_loss": -24.712621688842773, "global_step": 252501, "epoch": 3042} {"train_loss": -24.421422958374023, "global_step": 252502, "epoch": 3042} {"train_loss": -24.716999053955078, "global_step": 252503, "epoch": 3042} {"train_loss": -24.768964767456055, "global_step": 252504, "epoch": 3042} {"train_loss": -24.575027465820312, "global_step": 252505, "epoch": 3042} {"train_loss": -24.642656326293945, "global_step": 252506, "epoch": 3042} {"train_loss": -24.664640426635742, "global_step": 252507, "epoch": 3042} {"train_loss": -24.70531463623047, "global_step": 252508, "epoch": 3042} {"train_loss": -24.93817138671875, "global_step": 252509, "epoch": 3042} {"train_loss": -25.115835189819336, "global_step": 252510, "epoch": 3042} {"train_loss": -24.715085983276367, "global_step": 252511, "epoch": 3042} {"train_loss": -24.63125991821289, "global_step": 252512, "epoch": 3042} {"train_loss": -25.035757064819336, "global_step": 252513, "epoch": 3042} {"train_loss": -24.790380477905273, "global_step": 252514, "epoch": 3042} {"train_loss": -24.82242774963379, "global_step": 252515, "epoch": 3042} {"train_loss": -25.135862350463867, "global_step": 252516, "epoch": 3042} {"train_loss": -25.037561416625977, "global_step": 252517, "epoch": 3042} {"train_loss": -24.914371490478516, "global_step": 252518, "epoch": 3042} {"train_loss": -25.322065353393555, "global_step": 252519, "epoch": 3042} {"train_loss": -25.167964935302734, "global_step": 252520, "epoch": 3042} {"train_loss": -25.121259689331055, "global_step": 252521, "epoch": 3042} {"train_loss": -24.85220718383789, "global_step": 252522, "epoch": 3042} {"train_loss": -25.573226928710938, "global_step": 252523, "epoch": 3042} {"train_loss": -25.43562126159668, "global_step": 252524, "epoch": 3042} {"train_loss": -25.02932357788086, "global_step": 252525, "epoch": 3042} {"train_loss": -25.23780632019043, "global_step": 252526, "epoch": 3042} {"train_loss": -25.28694725036621, "global_step": 252527, "epoch": 3042} {"train_loss": -25.30293846130371, "global_step": 252528, "epoch": 3042} {"train_loss": -25.184730529785156, "global_step": 252529, "epoch": 3042} {"train_loss": -25.051694869995117, "global_step": 252530, "epoch": 3042} {"train_loss": -25.223880767822266, "global_step": 252531, "epoch": 3042} {"train_loss": -24.825870513916016, "global_step": 252532, "epoch": 3042} {"train_loss": -24.828750610351562, "global_step": 252533, "epoch": 3042} {"train_loss": -25.116138458251953, "global_step": 252534, "epoch": 3042} {"train_loss": -25.118545532226562, "global_step": 252535, "epoch": 3042} {"train_loss": -25.170169830322266, "global_step": 252536, "epoch": 3042} {"train_loss": -25.264972686767578, "global_step": 252537, "epoch": 3042} {"train_loss": -25.397598266601562, "global_step": 252538, "epoch": 3042} {"train_loss": -24.84929847717285, "global_step": 252539, "epoch": 3042} {"train_loss": -25.155942916870117, "global_step": 252540, "epoch": 3042} {"train_loss": -25.259098052978516, "global_step": 252541, "epoch": 3042} {"train_loss": -24.9678955078125, "global_step": 252542, "epoch": 3042} {"train_loss": -25.387609481811523, "global_step": 252543, "epoch": 3042} {"train_loss": -24.954448699951172, "global_step": 252544, "epoch": 3042} {"train_loss": -25.192228317260742, "global_step": 252545, "epoch": 3042} {"train_loss": -25.280832290649414, "global_step": 252546, "epoch": 3042} {"train_loss": -24.77396583557129, "global_step": 252547, "epoch": 3042} {"train_loss": -25.04062843322754, "global_step": 252548, "epoch": 3042} {"train_loss": -25.309600830078125, "global_step": 252549, "epoch": 3042} {"train_loss": -24.972171783447266, "global_step": 252550, "epoch": 3042} {"train_loss": -24.666913986206055, "global_step": 252551, "epoch": 3042} {"train_loss": -24.732873916625977, "global_step": 252552, "epoch": 3042} {"train_loss": -24.81351089477539, "global_step": 252553, "epoch": 3042} {"train_loss": -25.343427658081055, "global_step": 252554, "epoch": 3042} {"train_loss": -25.170297622680664, "global_step": 252555, "epoch": 3042} {"train_loss": -25.50228500366211, "global_step": 252556, "epoch": 3042} {"train_loss": -25.049732208251953, "global_step": 252557, "epoch": 3042} {"train_loss": -25.148874282836914, "global_step": 252558, "epoch": 3042} {"train_loss": -24.947141647338867, "global_step": 252559, "epoch": 3042} {"train_loss": -25.381149291992188, "global_step": 252560, "epoch": 3042} {"train_loss": -25.138290405273438, "global_step": 252561, "epoch": 3042} {"train_loss": -24.890426635742188, "global_step": 252562, "epoch": 3042} {"train_loss": -25.280624389648438, "global_step": 252563, "epoch": 3042} {"train_loss": -25.492168426513672, "global_step": 252564, "epoch": 3042} {"train_loss": -25.196332931518555, "global_step": 252565, "epoch": 3042} {"train_loss": -24.96987533569336, "global_step": 252566, "epoch": 3042} {"train_loss": -25.217161178588867, "global_step": 252567, "epoch": 3042} {"train_loss": -24.971707608326373, "global_step": 252568, "epoch": 3042, "val_loss": 6846518.0} {"train_loss": -24.8587646484375, "global_step": 252569, "epoch": 3043} {"train_loss": -24.383020401000977, "global_step": 252570, "epoch": 3043} {"train_loss": -24.264928817749023, "global_step": 252571, "epoch": 3043} {"train_loss": -24.612165451049805, "global_step": 252572, "epoch": 3043} {"train_loss": -24.469480514526367, "global_step": 252573, "epoch": 3043} {"train_loss": -24.538297653198242, "global_step": 252574, "epoch": 3043} {"train_loss": -24.422658920288086, "global_step": 252575, "epoch": 3043} {"train_loss": -24.48668098449707, "global_step": 252576, "epoch": 3043} {"train_loss": -24.836179733276367, "global_step": 252577, "epoch": 3043} {"train_loss": -24.741804122924805, "global_step": 252578, "epoch": 3043} {"train_loss": -24.35731315612793, "global_step": 252579, "epoch": 3043} {"train_loss": -24.716611862182617, "global_step": 252580, "epoch": 3043} {"train_loss": -24.57213020324707, "global_step": 252581, "epoch": 3043} {"train_loss": -24.667444229125977, "global_step": 252582, "epoch": 3043} {"train_loss": -24.79694175720215, "global_step": 252583, "epoch": 3043} {"train_loss": -24.088293075561523, "global_step": 252584, "epoch": 3043} {"train_loss": -24.530969619750977, "global_step": 252585, "epoch": 3043} {"train_loss": -24.624595642089844, "global_step": 252586, "epoch": 3043} {"train_loss": -24.467350006103516, "global_step": 252587, "epoch": 3043} {"train_loss": -24.726743698120117, "global_step": 252588, "epoch": 3043} {"train_loss": -24.56260871887207, "global_step": 252589, "epoch": 3043} {"train_loss": -24.941259384155273, "global_step": 252590, "epoch": 3043} {"train_loss": -25.191648483276367, "global_step": 252591, "epoch": 3043} {"train_loss": -24.61392593383789, "global_step": 252592, "epoch": 3043} {"train_loss": -24.872522354125977, "global_step": 252593, "epoch": 3043} {"train_loss": -25.069225311279297, "global_step": 252594, "epoch": 3043} {"train_loss": -24.455183029174805, "global_step": 252595, "epoch": 3043} {"train_loss": -24.947553634643555, "global_step": 252596, "epoch": 3043} {"train_loss": -24.70099449157715, "global_step": 252597, "epoch": 3043} {"train_loss": -24.84391212463379, "global_step": 252598, "epoch": 3043} {"train_loss": -24.903287887573242, "global_step": 252599, "epoch": 3043} {"train_loss": -24.91434097290039, "global_step": 252600, "epoch": 3043} {"train_loss": -24.6987247467041, "global_step": 252601, "epoch": 3043} {"train_loss": -24.972122192382812, "global_step": 252602, "epoch": 3043} {"train_loss": -24.93036460876465, "global_step": 252603, "epoch": 3043} {"train_loss": -25.30536460876465, "global_step": 252604, "epoch": 3043} {"train_loss": -24.97327995300293, "global_step": 252605, "epoch": 3043} {"train_loss": -25.066970825195312, "global_step": 252606, "epoch": 3043} {"train_loss": -24.908069610595703, "global_step": 252607, "epoch": 3043} {"train_loss": -24.996267318725586, "global_step": 252608, "epoch": 3043} {"train_loss": -25.267942428588867, "global_step": 252609, "epoch": 3043} {"train_loss": -24.523303985595703, "global_step": 252610, "epoch": 3043} {"train_loss": -24.9222469329834, "global_step": 252611, "epoch": 3043} {"train_loss": -24.873273849487305, "global_step": 252612, "epoch": 3043} {"train_loss": -25.159215927124023, "global_step": 252613, "epoch": 3043} {"train_loss": -24.57154083251953, "global_step": 252614, "epoch": 3043} {"train_loss": -25.06038475036621, "global_step": 252615, "epoch": 3043} {"train_loss": -25.2268009185791, "global_step": 252616, "epoch": 3043} {"train_loss": -24.971830368041992, "global_step": 252617, "epoch": 3043} {"train_loss": -24.7229061126709, "global_step": 252618, "epoch": 3043} {"train_loss": -24.713056564331055, "global_step": 252619, "epoch": 3043} {"train_loss": -24.85268783569336, "global_step": 252620, "epoch": 3043} {"train_loss": -25.02634048461914, "global_step": 252621, "epoch": 3043} {"train_loss": -25.273563385009766, "global_step": 252622, "epoch": 3043} {"train_loss": -25.078889846801758, "global_step": 252623, "epoch": 3043} {"train_loss": -25.17147445678711, "global_step": 252624, "epoch": 3043} {"train_loss": -24.585508346557617, "global_step": 252625, "epoch": 3043} {"train_loss": -25.0916805267334, "global_step": 252626, "epoch": 3043} {"train_loss": -24.9465389251709, "global_step": 252627, "epoch": 3043} {"train_loss": -24.961013793945312, "global_step": 252628, "epoch": 3043} {"train_loss": -25.181970596313477, "global_step": 252629, "epoch": 3043} {"train_loss": -24.819822311401367, "global_step": 252630, "epoch": 3043} {"train_loss": -25.384851455688477, "global_step": 252631, "epoch": 3043} {"train_loss": -24.66535758972168, "global_step": 252632, "epoch": 3043} {"train_loss": -25.050844192504883, "global_step": 252633, "epoch": 3043} {"train_loss": -24.99138832092285, "global_step": 252634, "epoch": 3043} {"train_loss": -24.68610954284668, "global_step": 252635, "epoch": 3043} {"train_loss": -24.71217155456543, "global_step": 252636, "epoch": 3043} {"train_loss": -24.707170486450195, "global_step": 252637, "epoch": 3043} {"train_loss": -25.256162643432617, "global_step": 252638, "epoch": 3043} {"train_loss": -24.90498924255371, "global_step": 252639, "epoch": 3043} {"train_loss": -25.268949508666992, "global_step": 252640, "epoch": 3043} {"train_loss": -25.605493545532227, "global_step": 252641, "epoch": 3043} {"train_loss": -25.3460750579834, "global_step": 252642, "epoch": 3043} {"train_loss": -25.27933120727539, "global_step": 252643, "epoch": 3043} {"train_loss": -25.101377487182617, "global_step": 252644, "epoch": 3043} {"train_loss": -24.994565963745117, "global_step": 252645, "epoch": 3043} {"train_loss": -25.049535751342773, "global_step": 252646, "epoch": 3043} {"train_loss": -25.66910743713379, "global_step": 252647, "epoch": 3043} {"train_loss": -25.168439865112305, "global_step": 252648, "epoch": 3043} {"train_loss": -25.062000274658203, "global_step": 252649, "epoch": 3043} {"train_loss": -24.81560516357422, "global_step": 252650, "epoch": 3043} {"train_loss": -24.8804335536727, "global_step": 252651, "epoch": 3043, "val_loss": 6880566.5} {"train_loss": -24.62736701965332, "global_step": 252652, "epoch": 3044} {"train_loss": -24.24662208557129, "global_step": 252653, "epoch": 3044} {"train_loss": -24.70911979675293, "global_step": 252654, "epoch": 3044} {"train_loss": -24.431669235229492, "global_step": 252655, "epoch": 3044} {"train_loss": -24.998132705688477, "global_step": 252656, "epoch": 3044} {"train_loss": -24.50752830505371, "global_step": 252657, "epoch": 3044} {"train_loss": -24.2576847076416, "global_step": 252658, "epoch": 3044} {"train_loss": -24.876203536987305, "global_step": 252659, "epoch": 3044} {"train_loss": -25.126041412353516, "global_step": 252660, "epoch": 3044} {"train_loss": -24.969894409179688, "global_step": 252661, "epoch": 3044} {"train_loss": -24.785524368286133, "global_step": 252662, "epoch": 3044} {"train_loss": -24.557693481445312, "global_step": 252663, "epoch": 3044} {"train_loss": -25.31427764892578, "global_step": 252664, "epoch": 3044} {"train_loss": -24.772993087768555, "global_step": 252665, "epoch": 3044} {"train_loss": -25.080419540405273, "global_step": 252666, "epoch": 3044} {"train_loss": -25.0432071685791, "global_step": 252667, "epoch": 3044} {"train_loss": -24.500064849853516, "global_step": 252668, "epoch": 3044} {"train_loss": -24.946857452392578, "global_step": 252669, "epoch": 3044} {"train_loss": -24.865034103393555, "global_step": 252670, "epoch": 3044} {"train_loss": -25.02510643005371, "global_step": 252671, "epoch": 3044} {"train_loss": -24.857580184936523, "global_step": 252672, "epoch": 3044} {"train_loss": -25.082059860229492, "global_step": 252673, "epoch": 3044} {"train_loss": -24.74825668334961, "global_step": 252674, "epoch": 3044} {"train_loss": -24.82918357849121, "global_step": 252675, "epoch": 3044} {"train_loss": -24.97223472595215, "global_step": 252676, "epoch": 3044} {"train_loss": -24.86387062072754, "global_step": 252677, "epoch": 3044} {"train_loss": -25.18311882019043, "global_step": 252678, "epoch": 3044} {"train_loss": -25.000064849853516, "global_step": 252679, "epoch": 3044} {"train_loss": -25.06244468688965, "global_step": 252680, "epoch": 3044} {"train_loss": -25.117727279663086, "global_step": 252681, "epoch": 3044} {"train_loss": -25.282230377197266, "global_step": 252682, "epoch": 3044} {"train_loss": -24.897974014282227, "global_step": 252683, "epoch": 3044} {"train_loss": -25.175399780273438, "global_step": 252684, "epoch": 3044} {"train_loss": -25.349225997924805, "global_step": 252685, "epoch": 3044} {"train_loss": -24.786746978759766, "global_step": 252686, "epoch": 3044} {"train_loss": -25.214191436767578, "global_step": 252687, "epoch": 3044} {"train_loss": -24.827163696289062, "global_step": 252688, "epoch": 3044} {"train_loss": -24.935171127319336, "global_step": 252689, "epoch": 3044} {"train_loss": -25.070905685424805, "global_step": 252690, "epoch": 3044} {"train_loss": -24.922536849975586, "global_step": 252691, "epoch": 3044} {"train_loss": -25.64939308166504, "global_step": 252692, "epoch": 3044} {"train_loss": -24.857187271118164, "global_step": 252693, "epoch": 3044} {"train_loss": -24.762802124023438, "global_step": 252694, "epoch": 3044} {"train_loss": -24.667325973510742, "global_step": 252695, "epoch": 3044} {"train_loss": -25.610004425048828, "global_step": 252696, "epoch": 3044} {"train_loss": -24.765348434448242, "global_step": 252697, "epoch": 3044} {"train_loss": -25.044692993164062, "global_step": 252698, "epoch": 3044} {"train_loss": -24.829994201660156, "global_step": 252699, "epoch": 3044} {"train_loss": -24.86415672302246, "global_step": 252700, "epoch": 3044} {"train_loss": -25.10590171813965, "global_step": 252701, "epoch": 3044} {"train_loss": -24.84688377380371, "global_step": 252702, "epoch": 3044} {"train_loss": -24.96542739868164, "global_step": 252703, "epoch": 3044} {"train_loss": -25.021921157836914, "global_step": 252704, "epoch": 3044} {"train_loss": -24.828327178955078, "global_step": 252705, "epoch": 3044} {"train_loss": -24.505802154541016, "global_step": 252706, "epoch": 3044} {"train_loss": -24.7786865234375, "global_step": 252707, "epoch": 3044} {"train_loss": -24.866575241088867, "global_step": 252708, "epoch": 3044} {"train_loss": -24.710840225219727, "global_step": 252709, "epoch": 3044} {"train_loss": -25.118436813354492, "global_step": 252710, "epoch": 3044} {"train_loss": -25.089651107788086, "global_step": 252711, "epoch": 3044} {"train_loss": -24.766687393188477, "global_step": 252712, "epoch": 3044} {"train_loss": -25.055309295654297, "global_step": 252713, "epoch": 3044} {"train_loss": -25.181324005126953, "global_step": 252714, "epoch": 3044} {"train_loss": -24.893945693969727, "global_step": 252715, "epoch": 3044} {"train_loss": -24.79532241821289, "global_step": 252716, "epoch": 3044} {"train_loss": -25.042795181274414, "global_step": 252717, "epoch": 3044} {"train_loss": -24.904722213745117, "global_step": 252718, "epoch": 3044} {"train_loss": -24.98727798461914, "global_step": 252719, "epoch": 3044} {"train_loss": -25.166776657104492, "global_step": 252720, "epoch": 3044} {"train_loss": -24.990474700927734, "global_step": 252721, "epoch": 3044} {"train_loss": -25.2558536529541, "global_step": 252722, "epoch": 3044} {"train_loss": -24.73586082458496, "global_step": 252723, "epoch": 3044} {"train_loss": -25.113452911376953, "global_step": 252724, "epoch": 3044} {"train_loss": -25.221792221069336, "global_step": 252725, "epoch": 3044} {"train_loss": -25.22749137878418, "global_step": 252726, "epoch": 3044} {"train_loss": -24.909704208374023, "global_step": 252727, "epoch": 3044} {"train_loss": -24.90570640563965, "global_step": 252728, "epoch": 3044} {"train_loss": -25.210721969604492, "global_step": 252729, "epoch": 3044} {"train_loss": -25.371240615844727, "global_step": 252730, "epoch": 3044} {"train_loss": -25.25470542907715, "global_step": 252731, "epoch": 3044} {"train_loss": -25.030712127685547, "global_step": 252732, "epoch": 3044} {"train_loss": -25.406471252441406, "global_step": 252733, "epoch": 3044} {"train_loss": -24.95167380643178, "global_step": 252734, "epoch": 3044, "val_loss": 6870970.0} {"train_loss": -24.75143051147461, "global_step": 252735, "epoch": 3045} {"train_loss": -24.775562286376953, "global_step": 252736, "epoch": 3045} {"train_loss": -24.55368995666504, "global_step": 252737, "epoch": 3045} {"train_loss": -24.77923583984375, "global_step": 252738, "epoch": 3045} {"train_loss": -24.45078468322754, "global_step": 252739, "epoch": 3045} {"train_loss": -24.259145736694336, "global_step": 252740, "epoch": 3045} {"train_loss": -24.491323471069336, "global_step": 252741, "epoch": 3045} {"train_loss": -24.977270126342773, "global_step": 252742, "epoch": 3045} {"train_loss": -24.373340606689453, "global_step": 252743, "epoch": 3045} {"train_loss": -24.813566207885742, "global_step": 252744, "epoch": 3045} {"train_loss": -24.96065330505371, "global_step": 252745, "epoch": 3045} {"train_loss": -24.44561195373535, "global_step": 252746, "epoch": 3045} {"train_loss": -24.799713134765625, "global_step": 252747, "epoch": 3045} {"train_loss": -24.610280990600586, "global_step": 252748, "epoch": 3045} {"train_loss": -24.87923812866211, "global_step": 252749, "epoch": 3045} {"train_loss": -24.86530876159668, "global_step": 252750, "epoch": 3045} {"train_loss": -25.096607208251953, "global_step": 252751, "epoch": 3045} {"train_loss": -25.01624870300293, "global_step": 252752, "epoch": 3045} {"train_loss": -24.5877628326416, "global_step": 252753, "epoch": 3045} {"train_loss": -25.13715171813965, "global_step": 252754, "epoch": 3045} {"train_loss": -25.08835220336914, "global_step": 252755, "epoch": 3045} {"train_loss": -24.777738571166992, "global_step": 252756, "epoch": 3045} {"train_loss": -25.062772750854492, "global_step": 252757, "epoch": 3045} {"train_loss": -25.19454002380371, "global_step": 252758, "epoch": 3045} {"train_loss": -25.35976219177246, "global_step": 252759, "epoch": 3045} {"train_loss": -25.140546798706055, "global_step": 252760, "epoch": 3045} {"train_loss": -25.431394577026367, "global_step": 252761, "epoch": 3045} {"train_loss": -25.21152114868164, "global_step": 252762, "epoch": 3045} {"train_loss": -24.9702091217041, "global_step": 252763, "epoch": 3045} {"train_loss": -25.04823875427246, "global_step": 252764, "epoch": 3045} {"train_loss": -25.218793869018555, "global_step": 252765, "epoch": 3045} {"train_loss": -24.98213768005371, "global_step": 252766, "epoch": 3045} {"train_loss": -24.705419540405273, "global_step": 252767, "epoch": 3045} {"train_loss": -25.24531364440918, "global_step": 252768, "epoch": 3045} {"train_loss": -25.19441795349121, "global_step": 252769, "epoch": 3045} {"train_loss": -25.14396095275879, "global_step": 252770, "epoch": 3045} {"train_loss": -25.02411460876465, "global_step": 252771, "epoch": 3045} {"train_loss": -25.096357345581055, "global_step": 252772, "epoch": 3045} {"train_loss": -25.149641036987305, "global_step": 252773, "epoch": 3045} {"train_loss": -25.19782829284668, "global_step": 252774, "epoch": 3045} {"train_loss": -24.90851593017578, "global_step": 252775, "epoch": 3045} {"train_loss": -25.35129737854004, "global_step": 252776, "epoch": 3045} {"train_loss": -25.166759490966797, "global_step": 252777, "epoch": 3045} {"train_loss": -24.718610763549805, "global_step": 252778, "epoch": 3045} {"train_loss": -25.155860900878906, "global_step": 252779, "epoch": 3045} {"train_loss": -25.368738174438477, "global_step": 252780, "epoch": 3045} {"train_loss": -24.984479904174805, "global_step": 252781, "epoch": 3045} {"train_loss": -24.768714904785156, "global_step": 252782, "epoch": 3045} {"train_loss": -24.719770431518555, "global_step": 252783, "epoch": 3045} {"train_loss": -25.02276039123535, "global_step": 252784, "epoch": 3045} {"train_loss": -25.0631160736084, "global_step": 252785, "epoch": 3045} {"train_loss": -24.94223976135254, "global_step": 252786, "epoch": 3045} {"train_loss": -25.113882064819336, "global_step": 252787, "epoch": 3045} {"train_loss": -25.196258544921875, "global_step": 252788, "epoch": 3045} {"train_loss": -24.999454498291016, "global_step": 252789, "epoch": 3045} {"train_loss": -25.463459014892578, "global_step": 252790, "epoch": 3045} {"train_loss": -25.09746551513672, "global_step": 252791, "epoch": 3045} {"train_loss": -24.8873348236084, "global_step": 252792, "epoch": 3045} {"train_loss": -25.204269409179688, "global_step": 252793, "epoch": 3045} {"train_loss": -24.988866806030273, "global_step": 252794, "epoch": 3045} {"train_loss": -25.003023147583008, "global_step": 252795, "epoch": 3045} {"train_loss": -24.76435089111328, "global_step": 252796, "epoch": 3045} {"train_loss": -25.124799728393555, "global_step": 252797, "epoch": 3045} {"train_loss": -25.004854202270508, "global_step": 252798, "epoch": 3045} {"train_loss": -24.8199520111084, "global_step": 252799, "epoch": 3045} {"train_loss": -25.286579132080078, "global_step": 252800, "epoch": 3045} {"train_loss": -24.785844802856445, "global_step": 252801, "epoch": 3045} {"train_loss": -25.175952911376953, "global_step": 252802, "epoch": 3045} {"train_loss": -25.181217193603516, "global_step": 252803, "epoch": 3045} {"train_loss": -25.146486282348633, "global_step": 252804, "epoch": 3045} {"train_loss": -25.182554244995117, "global_step": 252805, "epoch": 3045} {"train_loss": -25.390789031982422, "global_step": 252806, "epoch": 3045} {"train_loss": -25.118337631225586, "global_step": 252807, "epoch": 3045} {"train_loss": -25.375852584838867, "global_step": 252808, "epoch": 3045} {"train_loss": -25.36208152770996, "global_step": 252809, "epoch": 3045} {"train_loss": -25.02046775817871, "global_step": 252810, "epoch": 3045} {"train_loss": -24.629016876220703, "global_step": 252811, "epoch": 3045} {"train_loss": -24.87931251525879, "global_step": 252812, "epoch": 3045} {"train_loss": -25.297168731689453, "global_step": 252813, "epoch": 3045} {"train_loss": -25.13075828552246, "global_step": 252814, "epoch": 3045} {"train_loss": -25.256418228149414, "global_step": 252815, "epoch": 3045} {"train_loss": -25.35152816772461, "global_step": 252816, "epoch": 3045} {"train_loss": -25.0121881186244, "global_step": 252817, "epoch": 3045, "val_loss": 6952122.0} {"train_loss": -25.04930877685547, "global_step": 252818, "epoch": 3046} {"train_loss": -24.755760192871094, "global_step": 252819, "epoch": 3046} {"train_loss": -24.812782287597656, "global_step": 252820, "epoch": 3046} {"train_loss": -24.34107208251953, "global_step": 252821, "epoch": 3046} {"train_loss": -25.0015811920166, "global_step": 252822, "epoch": 3046} {"train_loss": -25.153013229370117, "global_step": 252823, "epoch": 3046} {"train_loss": -25.107688903808594, "global_step": 252824, "epoch": 3046} {"train_loss": -24.976032257080078, "global_step": 252825, "epoch": 3046} {"train_loss": -24.933456420898438, "global_step": 252826, "epoch": 3046} {"train_loss": -24.84891700744629, "global_step": 252827, "epoch": 3046} {"train_loss": -24.931364059448242, "global_step": 252828, "epoch": 3046} {"train_loss": -24.880741119384766, "global_step": 252829, "epoch": 3046} {"train_loss": -24.714479446411133, "global_step": 252830, "epoch": 3046} {"train_loss": -24.747379302978516, "global_step": 252831, "epoch": 3046} {"train_loss": -24.791318893432617, "global_step": 252832, "epoch": 3046} {"train_loss": -25.206775665283203, "global_step": 252833, "epoch": 3046} {"train_loss": -24.96100425720215, "global_step": 252834, "epoch": 3046} {"train_loss": -24.898237228393555, "global_step": 252835, "epoch": 3046} {"train_loss": -24.754552841186523, "global_step": 252836, "epoch": 3046} {"train_loss": -24.251205444335938, "global_step": 252837, "epoch": 3046} {"train_loss": -24.76584243774414, "global_step": 252838, "epoch": 3046} {"train_loss": -25.059764862060547, "global_step": 252839, "epoch": 3046} {"train_loss": -25.090429306030273, "global_step": 252840, "epoch": 3046} {"train_loss": -25.27878761291504, "global_step": 252841, "epoch": 3046} {"train_loss": -24.617300033569336, "global_step": 252842, "epoch": 3046} {"train_loss": -25.168516159057617, "global_step": 252843, "epoch": 3046} {"train_loss": -24.904796600341797, "global_step": 252844, "epoch": 3046} {"train_loss": -24.97614097595215, "global_step": 252845, "epoch": 3046} {"train_loss": -24.999042510986328, "global_step": 252846, "epoch": 3046} {"train_loss": -24.719778060913086, "global_step": 252847, "epoch": 3046} {"train_loss": -25.010496139526367, "global_step": 252848, "epoch": 3046} {"train_loss": -24.914335250854492, "global_step": 252849, "epoch": 3046} {"train_loss": -24.669477462768555, "global_step": 252850, "epoch": 3046} {"train_loss": -24.954614639282227, "global_step": 252851, "epoch": 3046} {"train_loss": -24.93906593322754, "global_step": 252852, "epoch": 3046} {"train_loss": -24.663137435913086, "global_step": 252853, "epoch": 3046} {"train_loss": -25.04499626159668, "global_step": 252854, "epoch": 3046} {"train_loss": -24.86802864074707, "global_step": 252855, "epoch": 3046} {"train_loss": -25.123376846313477, "global_step": 252856, "epoch": 3046} {"train_loss": -25.2197208404541, "global_step": 252857, "epoch": 3046} {"train_loss": -24.94382095336914, "global_step": 252858, "epoch": 3046} {"train_loss": -25.24176597595215, "global_step": 252859, "epoch": 3046} {"train_loss": -24.78022003173828, "global_step": 252860, "epoch": 3046} {"train_loss": -24.920612335205078, "global_step": 252861, "epoch": 3046} {"train_loss": -24.91827964782715, "global_step": 252862, "epoch": 3046} {"train_loss": -24.65042495727539, "global_step": 252863, "epoch": 3046} {"train_loss": -24.831729888916016, "global_step": 252864, "epoch": 3046} {"train_loss": -24.989225387573242, "global_step": 252865, "epoch": 3046} {"train_loss": -24.943803787231445, "global_step": 252866, "epoch": 3046} {"train_loss": -25.024839401245117, "global_step": 252867, "epoch": 3046} {"train_loss": -24.95114517211914, "global_step": 252868, "epoch": 3046} {"train_loss": -25.076108932495117, "global_step": 252869, "epoch": 3046} {"train_loss": -25.058109283447266, "global_step": 252870, "epoch": 3046} {"train_loss": -25.17693519592285, "global_step": 252871, "epoch": 3046} {"train_loss": -25.362144470214844, "global_step": 252872, "epoch": 3046} {"train_loss": -25.199235916137695, "global_step": 252873, "epoch": 3046} {"train_loss": -25.36050796508789, "global_step": 252874, "epoch": 3046} {"train_loss": -25.373580932617188, "global_step": 252875, "epoch": 3046} {"train_loss": -24.862035751342773, "global_step": 252876, "epoch": 3046} {"train_loss": -25.06867790222168, "global_step": 252877, "epoch": 3046} {"train_loss": -24.978158950805664, "global_step": 252878, "epoch": 3046} {"train_loss": -25.260704040527344, "global_step": 252879, "epoch": 3046} {"train_loss": -25.369413375854492, "global_step": 252880, "epoch": 3046} {"train_loss": -25.26786994934082, "global_step": 252881, "epoch": 3046} {"train_loss": -25.35542106628418, "global_step": 252882, "epoch": 3046} {"train_loss": -24.894174575805664, "global_step": 252883, "epoch": 3046} {"train_loss": -25.129220962524414, "global_step": 252884, "epoch": 3046} {"train_loss": -24.764205932617188, "global_step": 252885, "epoch": 3046} {"train_loss": -25.080448150634766, "global_step": 252886, "epoch": 3046} {"train_loss": -25.065380096435547, "global_step": 252887, "epoch": 3046} {"train_loss": -25.02033042907715, "global_step": 252888, "epoch": 3046} {"train_loss": -24.72481918334961, "global_step": 252889, "epoch": 3046} {"train_loss": -25.187829971313477, "global_step": 252890, "epoch": 3046} {"train_loss": -24.74677085876465, "global_step": 252891, "epoch": 3046} {"train_loss": -24.834108352661133, "global_step": 252892, "epoch": 3046} {"train_loss": -25.1829776763916, "global_step": 252893, "epoch": 3046} {"train_loss": -25.00211524963379, "global_step": 252894, "epoch": 3046} {"train_loss": -24.635515213012695, "global_step": 252895, "epoch": 3046} {"train_loss": -24.762577056884766, "global_step": 252896, "epoch": 3046} {"train_loss": -24.87339210510254, "global_step": 252897, "epoch": 3046} {"train_loss": -25.261831283569336, "global_step": 252898, "epoch": 3046} {"train_loss": -24.819089889526367, "global_step": 252899, "epoch": 3046} {"train_loss": -24.94558099953525, "global_step": 252900, "epoch": 3046, "val_loss": 6662362.0} {"train_loss": -24.43699073791504, "global_step": 252901, "epoch": 3047} {"train_loss": -24.141143798828125, "global_step": 252902, "epoch": 3047} {"train_loss": -24.943815231323242, "global_step": 252903, "epoch": 3047} {"train_loss": -24.105804443359375, "global_step": 252904, "epoch": 3047} {"train_loss": -24.728302001953125, "global_step": 252905, "epoch": 3047} {"train_loss": -24.333709716796875, "global_step": 252906, "epoch": 3047} {"train_loss": -24.36654281616211, "global_step": 252907, "epoch": 3047} {"train_loss": -24.284765243530273, "global_step": 252908, "epoch": 3047} {"train_loss": -24.383506774902344, "global_step": 252909, "epoch": 3047} {"train_loss": -24.646177291870117, "global_step": 252910, "epoch": 3047} {"train_loss": -24.669095993041992, "global_step": 252911, "epoch": 3047} {"train_loss": -24.158843994140625, "global_step": 252912, "epoch": 3047} {"train_loss": -24.83487319946289, "global_step": 252913, "epoch": 3047} {"train_loss": -24.63204002380371, "global_step": 252914, "epoch": 3047} {"train_loss": -24.27379608154297, "global_step": 252915, "epoch": 3047} {"train_loss": -24.919677734375, "global_step": 252916, "epoch": 3047} {"train_loss": -24.46066665649414, "global_step": 252917, "epoch": 3047} {"train_loss": -24.307565689086914, "global_step": 252918, "epoch": 3047} {"train_loss": -24.78190040588379, "global_step": 252919, "epoch": 3047} {"train_loss": -24.5049991607666, "global_step": 252920, "epoch": 3047} {"train_loss": -24.536088943481445, "global_step": 252921, "epoch": 3047} {"train_loss": -24.45759391784668, "global_step": 252922, "epoch": 3047} {"train_loss": -24.73242950439453, "global_step": 252923, "epoch": 3047} {"train_loss": -24.701932907104492, "global_step": 252924, "epoch": 3047} {"train_loss": -24.90789222717285, "global_step": 252925, "epoch": 3047} {"train_loss": -25.01150894165039, "global_step": 252926, "epoch": 3047} {"train_loss": -24.505674362182617, "global_step": 252927, "epoch": 3047} {"train_loss": -25.168582916259766, "global_step": 252928, "epoch": 3047} {"train_loss": -24.50115203857422, "global_step": 252929, "epoch": 3047} {"train_loss": -24.853654861450195, "global_step": 252930, "epoch": 3047} {"train_loss": -24.663789749145508, "global_step": 252931, "epoch": 3047} {"train_loss": -24.77042579650879, "global_step": 252932, "epoch": 3047} {"train_loss": -25.113988876342773, "global_step": 252933, "epoch": 3047} {"train_loss": -24.95656394958496, "global_step": 252934, "epoch": 3047} {"train_loss": -24.990591049194336, "global_step": 252935, "epoch": 3047} {"train_loss": -25.156675338745117, "global_step": 252936, "epoch": 3047} {"train_loss": -24.871370315551758, "global_step": 252937, "epoch": 3047} {"train_loss": -25.602087020874023, "global_step": 252938, "epoch": 3047} {"train_loss": -25.101781845092773, "global_step": 252939, "epoch": 3047} {"train_loss": -25.0330867767334, "global_step": 252940, "epoch": 3047} {"train_loss": -25.153833389282227, "global_step": 252941, "epoch": 3047} {"train_loss": -25.014379501342773, "global_step": 252942, "epoch": 3047} {"train_loss": -25.30245018005371, "global_step": 252943, "epoch": 3047} {"train_loss": -25.369140625, "global_step": 252944, "epoch": 3047} {"train_loss": -25.034523010253906, "global_step": 252945, "epoch": 3047} {"train_loss": -24.5603084564209, "global_step": 252946, "epoch": 3047} {"train_loss": -24.706096649169922, "global_step": 252947, "epoch": 3047} {"train_loss": -25.3513126373291, "global_step": 252948, "epoch": 3047} {"train_loss": -25.22829246520996, "global_step": 252949, "epoch": 3047} {"train_loss": -25.0092830657959, "global_step": 252950, "epoch": 3047} {"train_loss": -24.621307373046875, "global_step": 252951, "epoch": 3047} {"train_loss": -24.76784324645996, "global_step": 252952, "epoch": 3047} {"train_loss": -24.910724639892578, "global_step": 252953, "epoch": 3047} {"train_loss": -25.17927360534668, "global_step": 252954, "epoch": 3047} {"train_loss": -24.799034118652344, "global_step": 252955, "epoch": 3047} {"train_loss": -24.764318466186523, "global_step": 252956, "epoch": 3047} {"train_loss": -25.4950008392334, "global_step": 252957, "epoch": 3047} {"train_loss": -25.035612106323242, "global_step": 252958, "epoch": 3047} {"train_loss": -25.091049194335938, "global_step": 252959, "epoch": 3047} {"train_loss": -25.037296295166016, "global_step": 252960, "epoch": 3047} {"train_loss": -25.226118087768555, "global_step": 252961, "epoch": 3047} {"train_loss": -25.207338333129883, "global_step": 252962, "epoch": 3047} {"train_loss": -25.109893798828125, "global_step": 252963, "epoch": 3047} {"train_loss": -25.361032485961914, "global_step": 252964, "epoch": 3047} {"train_loss": -25.274381637573242, "global_step": 252965, "epoch": 3047} {"train_loss": -25.12409019470215, "global_step": 252966, "epoch": 3047} {"train_loss": -25.412931442260742, "global_step": 252967, "epoch": 3047} {"train_loss": -25.402170181274414, "global_step": 252968, "epoch": 3047} {"train_loss": -25.32054901123047, "global_step": 252969, "epoch": 3047} {"train_loss": -24.65972328186035, "global_step": 252970, "epoch": 3047} {"train_loss": -25.320140838623047, "global_step": 252971, "epoch": 3047} {"train_loss": -25.25231170654297, "global_step": 252972, "epoch": 3047} {"train_loss": -25.328079223632812, "global_step": 252973, "epoch": 3047} {"train_loss": -25.32803726196289, "global_step": 252974, "epoch": 3047} {"train_loss": -25.259584426879883, "global_step": 252975, "epoch": 3047} {"train_loss": -25.39603042602539, "global_step": 252976, "epoch": 3047} {"train_loss": -25.32149314880371, "global_step": 252977, "epoch": 3047} {"train_loss": -25.540159225463867, "global_step": 252978, "epoch": 3047} {"train_loss": -25.244770050048828, "global_step": 252979, "epoch": 3047} {"train_loss": -25.295276641845703, "global_step": 252980, "epoch": 3047} {"train_loss": -25.3289737701416, "global_step": 252981, "epoch": 3047} {"train_loss": -25.267105102539062, "global_step": 252982, "epoch": 3047} {"train_loss": -24.936162489006318, "global_step": 252983, "epoch": 3047, "val_loss": 6898545.0} {"train_loss": -24.452173233032227, "global_step": 252984, "epoch": 3048} {"train_loss": -24.381671905517578, "global_step": 252985, "epoch": 3048} {"train_loss": -24.630807876586914, "global_step": 252986, "epoch": 3048} {"train_loss": -24.333831787109375, "global_step": 252987, "epoch": 3048} {"train_loss": -24.665454864501953, "global_step": 252988, "epoch": 3048} {"train_loss": -24.04340362548828, "global_step": 252989, "epoch": 3048} {"train_loss": -24.657358169555664, "global_step": 252990, "epoch": 3048} {"train_loss": -24.242177963256836, "global_step": 252991, "epoch": 3048} {"train_loss": -24.7161808013916, "global_step": 252992, "epoch": 3048} {"train_loss": -24.656452178955078, "global_step": 252993, "epoch": 3048} {"train_loss": -24.96489906311035, "global_step": 252994, "epoch": 3048} {"train_loss": -24.68842887878418, "global_step": 252995, "epoch": 3048} {"train_loss": -24.531057357788086, "global_step": 252996, "epoch": 3048} {"train_loss": -25.113805770874023, "global_step": 252997, "epoch": 3048} {"train_loss": -24.455656051635742, "global_step": 252998, "epoch": 3048} {"train_loss": -24.72237777709961, "global_step": 252999, "epoch": 3048} {"train_loss": -24.853866577148438, "global_step": 253000, "epoch": 3048} {"train_loss": -24.612110137939453, "global_step": 253001, "epoch": 3048} {"train_loss": -24.806747436523438, "global_step": 253002, "epoch": 3048} {"train_loss": -24.884307861328125, "global_step": 253003, "epoch": 3048} {"train_loss": -24.88344383239746, "global_step": 253004, "epoch": 3048} {"train_loss": -25.053125381469727, "global_step": 253005, "epoch": 3048} {"train_loss": -24.79914665222168, "global_step": 253006, "epoch": 3048} {"train_loss": -24.58168601989746, "global_step": 253007, "epoch": 3048} {"train_loss": -25.035770416259766, "global_step": 253008, "epoch": 3048} {"train_loss": -25.15125846862793, "global_step": 253009, "epoch": 3048} {"train_loss": -24.744314193725586, "global_step": 253010, "epoch": 3048} {"train_loss": -24.783308029174805, "global_step": 253011, "epoch": 3048} {"train_loss": -25.111967086791992, "global_step": 253012, "epoch": 3048} {"train_loss": -24.913373947143555, "global_step": 253013, "epoch": 3048} {"train_loss": -24.883779525756836, "global_step": 253014, "epoch": 3048} {"train_loss": -25.368106842041016, "global_step": 253015, "epoch": 3048} {"train_loss": -25.154163360595703, "global_step": 253016, "epoch": 3048} {"train_loss": -25.296253204345703, "global_step": 253017, "epoch": 3048} {"train_loss": -24.940515518188477, "global_step": 253018, "epoch": 3048} {"train_loss": -25.024974822998047, "global_step": 253019, "epoch": 3048} {"train_loss": -25.171253204345703, "global_step": 253020, "epoch": 3048} {"train_loss": -25.290189743041992, "global_step": 253021, "epoch": 3048} {"train_loss": -25.223302841186523, "global_step": 253022, "epoch": 3048} {"train_loss": -25.124364852905273, "global_step": 253023, "epoch": 3048} {"train_loss": -25.074874877929688, "global_step": 253024, "epoch": 3048} {"train_loss": -25.05162811279297, "global_step": 253025, "epoch": 3048} {"train_loss": -25.16375160217285, "global_step": 253026, "epoch": 3048} {"train_loss": -25.129514694213867, "global_step": 253027, "epoch": 3048} {"train_loss": -24.833770751953125, "global_step": 253028, "epoch": 3048} {"train_loss": -25.01267433166504, "global_step": 253029, "epoch": 3048} {"train_loss": -25.312820434570312, "global_step": 253030, "epoch": 3048} {"train_loss": -25.21367073059082, "global_step": 253031, "epoch": 3048} {"train_loss": -25.35574722290039, "global_step": 253032, "epoch": 3048} {"train_loss": -24.9800968170166, "global_step": 253033, "epoch": 3048} {"train_loss": -25.184097290039062, "global_step": 253034, "epoch": 3048} {"train_loss": -25.16010284423828, "global_step": 253035, "epoch": 3048} {"train_loss": -25.271955490112305, "global_step": 253036, "epoch": 3048} {"train_loss": -25.515554428100586, "global_step": 253037, "epoch": 3048} {"train_loss": -25.006444931030273, "global_step": 253038, "epoch": 3048} {"train_loss": -24.869308471679688, "global_step": 253039, "epoch": 3048} {"train_loss": -25.010690689086914, "global_step": 253040, "epoch": 3048} {"train_loss": -25.103918075561523, "global_step": 253041, "epoch": 3048} {"train_loss": -24.999048233032227, "global_step": 253042, "epoch": 3048} {"train_loss": -25.22695541381836, "global_step": 253043, "epoch": 3048} {"train_loss": -25.167802810668945, "global_step": 253044, "epoch": 3048} {"train_loss": -25.20096206665039, "global_step": 253045, "epoch": 3048} {"train_loss": -25.09630584716797, "global_step": 253046, "epoch": 3048} {"train_loss": -25.105825424194336, "global_step": 253047, "epoch": 3048} {"train_loss": -24.89143943786621, "global_step": 253048, "epoch": 3048} {"train_loss": -25.044422149658203, "global_step": 253049, "epoch": 3048} {"train_loss": -25.392353057861328, "global_step": 253050, "epoch": 3048} {"train_loss": -25.157865524291992, "global_step": 253051, "epoch": 3048} {"train_loss": -25.265918731689453, "global_step": 253052, "epoch": 3048} {"train_loss": -24.913312911987305, "global_step": 253053, "epoch": 3048} {"train_loss": -25.192426681518555, "global_step": 253054, "epoch": 3048} {"train_loss": -25.111997604370117, "global_step": 253055, "epoch": 3048} {"train_loss": -24.61646842956543, "global_step": 253056, "epoch": 3048} {"train_loss": -25.11677360534668, "global_step": 253057, "epoch": 3048} {"train_loss": -25.17421531677246, "global_step": 253058, "epoch": 3048} {"train_loss": -24.96285057067871, "global_step": 253059, "epoch": 3048} {"train_loss": -25.071880340576172, "global_step": 253060, "epoch": 3048} {"train_loss": -25.113906860351562, "global_step": 253061, "epoch": 3048} {"train_loss": -25.23162269592285, "global_step": 253062, "epoch": 3048} {"train_loss": -25.229473114013672, "global_step": 253063, "epoch": 3048} {"train_loss": -25.234771728515625, "global_step": 253064, "epoch": 3048} {"train_loss": -25.154239654541016, "global_step": 253065, "epoch": 3048} {"train_loss": -24.983648575932147, "global_step": 253066, "epoch": 3048, "val_loss": 6779439.5} {"train_loss": -24.430845260620117, "global_step": 253067, "epoch": 3049} {"train_loss": -24.42841911315918, "global_step": 253068, "epoch": 3049} {"train_loss": -24.866952896118164, "global_step": 253069, "epoch": 3049} {"train_loss": -24.15045166015625, "global_step": 253070, "epoch": 3049} {"train_loss": -24.716890335083008, "global_step": 253071, "epoch": 3049} {"train_loss": -24.75520896911621, "global_step": 253072, "epoch": 3049} {"train_loss": -25.066457748413086, "global_step": 253073, "epoch": 3049} {"train_loss": -24.67987823486328, "global_step": 253074, "epoch": 3049} {"train_loss": -24.656320571899414, "global_step": 253075, "epoch": 3049} {"train_loss": -24.75383949279785, "global_step": 253076, "epoch": 3049} {"train_loss": -24.809904098510742, "global_step": 253077, "epoch": 3049} {"train_loss": -24.937742233276367, "global_step": 253078, "epoch": 3049} {"train_loss": -24.563379287719727, "global_step": 253079, "epoch": 3049} {"train_loss": -24.87055015563965, "global_step": 253080, "epoch": 3049} {"train_loss": -25.03915786743164, "global_step": 253081, "epoch": 3049} {"train_loss": -24.951868057250977, "global_step": 253082, "epoch": 3049} {"train_loss": -24.517656326293945, "global_step": 253083, "epoch": 3049} {"train_loss": -24.625812530517578, "global_step": 253084, "epoch": 3049} {"train_loss": -24.599397659301758, "global_step": 253085, "epoch": 3049} {"train_loss": -24.875398635864258, "global_step": 253086, "epoch": 3049} {"train_loss": -24.941091537475586, "global_step": 253087, "epoch": 3049} {"train_loss": -24.86865997314453, "global_step": 253088, "epoch": 3049} {"train_loss": -24.58814811706543, "global_step": 253089, "epoch": 3049} {"train_loss": -25.140165328979492, "global_step": 253090, "epoch": 3049} {"train_loss": -24.401811599731445, "global_step": 253091, "epoch": 3049} {"train_loss": -25.083894729614258, "global_step": 253092, "epoch": 3049} {"train_loss": -24.927480697631836, "global_step": 253093, "epoch": 3049} {"train_loss": -25.201414108276367, "global_step": 253094, "epoch": 3049} {"train_loss": -24.698589324951172, "global_step": 253095, "epoch": 3049} {"train_loss": -25.05484962463379, "global_step": 253096, "epoch": 3049} {"train_loss": -24.799039840698242, "global_step": 253097, "epoch": 3049} {"train_loss": -24.94960594177246, "global_step": 253098, "epoch": 3049} {"train_loss": -24.760770797729492, "global_step": 253099, "epoch": 3049} {"train_loss": -24.606063842773438, "global_step": 253100, "epoch": 3049} {"train_loss": -25.19459342956543, "global_step": 253101, "epoch": 3049} {"train_loss": -24.530181884765625, "global_step": 253102, "epoch": 3049} {"train_loss": -24.68654441833496, "global_step": 253103, "epoch": 3049} {"train_loss": -24.763568878173828, "global_step": 253104, "epoch": 3049} {"train_loss": -24.916181564331055, "global_step": 253105, "epoch": 3049} {"train_loss": -25.018112182617188, "global_step": 253106, "epoch": 3049} {"train_loss": -25.114362716674805, "global_step": 253107, "epoch": 3049} {"train_loss": -24.86052894592285, "global_step": 253108, "epoch": 3049} {"train_loss": -24.973588943481445, "global_step": 253109, "epoch": 3049} {"train_loss": -25.672128677368164, "global_step": 253110, "epoch": 3049} {"train_loss": -25.166038513183594, "global_step": 253111, "epoch": 3049} {"train_loss": -25.077213287353516, "global_step": 253112, "epoch": 3049} {"train_loss": -25.128536224365234, "global_step": 253113, "epoch": 3049} {"train_loss": -24.974891662597656, "global_step": 253114, "epoch": 3049} {"train_loss": -25.035791397094727, "global_step": 253115, "epoch": 3049} {"train_loss": -24.984935760498047, "global_step": 253116, "epoch": 3049} {"train_loss": -25.229328155517578, "global_step": 253117, "epoch": 3049} {"train_loss": -24.857418060302734, "global_step": 253118, "epoch": 3049} {"train_loss": -24.893360137939453, "global_step": 253119, "epoch": 3049} {"train_loss": -24.770124435424805, "global_step": 253120, "epoch": 3049} {"train_loss": -25.451074600219727, "global_step": 253121, "epoch": 3049} {"train_loss": -25.22503089904785, "global_step": 253122, "epoch": 3049} {"train_loss": -24.739110946655273, "global_step": 253123, "epoch": 3049} {"train_loss": -25.16090202331543, "global_step": 253124, "epoch": 3049} {"train_loss": -25.461124420166016, "global_step": 253125, "epoch": 3049} {"train_loss": -25.00380516052246, "global_step": 253126, "epoch": 3049} {"train_loss": -24.921934127807617, "global_step": 253127, "epoch": 3049} {"train_loss": -25.085874557495117, "global_step": 253128, "epoch": 3049} {"train_loss": -24.769704818725586, "global_step": 253129, "epoch": 3049} {"train_loss": -25.276769638061523, "global_step": 253130, "epoch": 3049} {"train_loss": -24.712106704711914, "global_step": 253131, "epoch": 3049} {"train_loss": -25.276885986328125, "global_step": 253132, "epoch": 3049} {"train_loss": -25.130277633666992, "global_step": 253133, "epoch": 3049} {"train_loss": -24.890756607055664, "global_step": 253134, "epoch": 3049} {"train_loss": -24.825428009033203, "global_step": 253135, "epoch": 3049} {"train_loss": -24.848073959350586, "global_step": 253136, "epoch": 3049} {"train_loss": -25.26104164123535, "global_step": 253137, "epoch": 3049} {"train_loss": -25.187549591064453, "global_step": 253138, "epoch": 3049} {"train_loss": -25.46095848083496, "global_step": 253139, "epoch": 3049} {"train_loss": -24.932300567626953, "global_step": 253140, "epoch": 3049} {"train_loss": -25.470232009887695, "global_step": 253141, "epoch": 3049} {"train_loss": -25.057218551635742, "global_step": 253142, "epoch": 3049} {"train_loss": -25.107641220092773, "global_step": 253143, "epoch": 3049} {"train_loss": -25.03993034362793, "global_step": 253144, "epoch": 3049} {"train_loss": -24.711801528930664, "global_step": 253145, "epoch": 3049} {"train_loss": -24.69772720336914, "global_step": 253146, "epoch": 3049} {"train_loss": -24.9383544921875, "global_step": 253147, "epoch": 3049} {"train_loss": -25.1661319732666, "global_step": 253148, "epoch": 3049} {"train_loss": -24.924387001129517, "global_step": 253149, "epoch": 3049, "val_loss": 6809941.0} {"train_loss": -24.02338981628418, "global_step": 253150, "epoch": 3050} {"train_loss": -23.52004623413086, "global_step": 253151, "epoch": 3050} {"train_loss": -24.580623626708984, "global_step": 253152, "epoch": 3050} {"train_loss": -23.906618118286133, "global_step": 253153, "epoch": 3050} {"train_loss": -23.825109481811523, "global_step": 253154, "epoch": 3050} {"train_loss": -24.202322006225586, "global_step": 253155, "epoch": 3050} {"train_loss": -24.57574462890625, "global_step": 253156, "epoch": 3050} {"train_loss": -24.51106834411621, "global_step": 253157, "epoch": 3050} {"train_loss": -24.486438751220703, "global_step": 253158, "epoch": 3050} {"train_loss": -24.608993530273438, "global_step": 253159, "epoch": 3050} {"train_loss": -25.175695419311523, "global_step": 253160, "epoch": 3050} {"train_loss": -24.89411735534668, "global_step": 253161, "epoch": 3050} {"train_loss": -24.41987419128418, "global_step": 253162, "epoch": 3050} {"train_loss": -24.966968536376953, "global_step": 253163, "epoch": 3050} {"train_loss": -24.7938289642334, "global_step": 253164, "epoch": 3050} {"train_loss": -24.74210548400879, "global_step": 253165, "epoch": 3050} {"train_loss": -24.875457763671875, "global_step": 253166, "epoch": 3050} {"train_loss": -24.900110244750977, "global_step": 253167, "epoch": 3050} {"train_loss": -24.381521224975586, "global_step": 253168, "epoch": 3050} {"train_loss": -24.855619430541992, "global_step": 253169, "epoch": 3050} {"train_loss": -24.662052154541016, "global_step": 253170, "epoch": 3050} {"train_loss": -24.640058517456055, "global_step": 253171, "epoch": 3050} {"train_loss": -24.787216186523438, "global_step": 253172, "epoch": 3050} {"train_loss": -24.737335205078125, "global_step": 253173, "epoch": 3050} {"train_loss": -24.83768081665039, "global_step": 253174, "epoch": 3050} {"train_loss": -24.881757736206055, "global_step": 253175, "epoch": 3050} {"train_loss": -25.103174209594727, "global_step": 253176, "epoch": 3050} {"train_loss": -24.998138427734375, "global_step": 253177, "epoch": 3050} {"train_loss": -24.720956802368164, "global_step": 253178, "epoch": 3050} {"train_loss": -24.95903205871582, "global_step": 253179, "epoch": 3050} {"train_loss": -24.6032657623291, "global_step": 253180, "epoch": 3050} {"train_loss": -24.8197078704834, "global_step": 253181, "epoch": 3050} {"train_loss": -24.987234115600586, "global_step": 253182, "epoch": 3050} {"train_loss": -24.9984073638916, "global_step": 253183, "epoch": 3050} {"train_loss": -24.643024444580078, "global_step": 253184, "epoch": 3050} {"train_loss": -25.035573959350586, "global_step": 253185, "epoch": 3050} {"train_loss": -24.956960678100586, "global_step": 253186, "epoch": 3050} {"train_loss": -24.73677635192871, "global_step": 253187, "epoch": 3050} {"train_loss": -24.619611740112305, "global_step": 253188, "epoch": 3050} {"train_loss": -24.789342880249023, "global_step": 253189, "epoch": 3050} {"train_loss": -24.946409225463867, "global_step": 253190, "epoch": 3050} {"train_loss": -24.994264602661133, "global_step": 253191, "epoch": 3050} {"train_loss": -25.229150772094727, "global_step": 253192, "epoch": 3050} {"train_loss": -24.779226303100586, "global_step": 253193, "epoch": 3050} {"train_loss": -24.88898277282715, "global_step": 253194, "epoch": 3050} {"train_loss": -24.977773666381836, "global_step": 253195, "epoch": 3050} {"train_loss": -25.292709350585938, "global_step": 253196, "epoch": 3050} {"train_loss": -25.11021614074707, "global_step": 253197, "epoch": 3050} {"train_loss": -25.018339157104492, "global_step": 253198, "epoch": 3050} {"train_loss": -25.367666244506836, "global_step": 253199, "epoch": 3050} {"train_loss": -24.909706115722656, "global_step": 253200, "epoch": 3050} {"train_loss": -25.392322540283203, "global_step": 253201, "epoch": 3050} {"train_loss": -25.1630859375, "global_step": 253202, "epoch": 3050} {"train_loss": -24.968637466430664, "global_step": 253203, "epoch": 3050} {"train_loss": -25.212020874023438, "global_step": 253204, "epoch": 3050} {"train_loss": -25.664997100830078, "global_step": 253205, "epoch": 3050} {"train_loss": -25.23518943786621, "global_step": 253206, "epoch": 3050} {"train_loss": -24.86890983581543, "global_step": 253207, "epoch": 3050} {"train_loss": -24.802366256713867, "global_step": 253208, "epoch": 3050} {"train_loss": -25.12516212463379, "global_step": 253209, "epoch": 3050} {"train_loss": -25.266630172729492, "global_step": 253210, "epoch": 3050} {"train_loss": -24.997148513793945, "global_step": 253211, "epoch": 3050} {"train_loss": -25.00630760192871, "global_step": 253212, "epoch": 3050} {"train_loss": -25.06692886352539, "global_step": 253213, "epoch": 3050} {"train_loss": -24.845102310180664, "global_step": 253214, "epoch": 3050} {"train_loss": -25.16477394104004, "global_step": 253215, "epoch": 3050} {"train_loss": -24.921571731567383, "global_step": 253216, "epoch": 3050} {"train_loss": -25.15376853942871, "global_step": 253217, "epoch": 3050} {"train_loss": -24.920011520385742, "global_step": 253218, "epoch": 3050} {"train_loss": -24.79990005493164, "global_step": 253219, "epoch": 3050} {"train_loss": -25.109291076660156, "global_step": 253220, "epoch": 3050} {"train_loss": -24.470014572143555, "global_step": 253221, "epoch": 3050} {"train_loss": -24.744226455688477, "global_step": 253222, "epoch": 3050} {"train_loss": -25.243192672729492, "global_step": 253223, "epoch": 3050} {"train_loss": -24.67537498474121, "global_step": 253224, "epoch": 3050} {"train_loss": -24.765249252319336, "global_step": 253225, "epoch": 3050} {"train_loss": -24.801559448242188, "global_step": 253226, "epoch": 3050} {"train_loss": -24.789474487304688, "global_step": 253227, "epoch": 3050} {"train_loss": -24.687835693359375, "global_step": 253228, "epoch": 3050} {"train_loss": -24.433998107910156, "global_step": 253229, "epoch": 3050} {"train_loss": -24.859481811523438, "global_step": 253230, "epoch": 3050} {"train_loss": -24.84515953063965, "global_step": 253231, "epoch": 3050} {"train_loss": -24.835944876613386, "global_step": 253232, "epoch": 3050, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6837170.0} {"train_loss": -24.224609375, "global_step": 253233, "epoch": 3051} {"train_loss": -24.53479766845703, "global_step": 253234, "epoch": 3051} {"train_loss": -24.4036808013916, "global_step": 253235, "epoch": 3051} {"train_loss": -24.43532371520996, "global_step": 253236, "epoch": 3051} {"train_loss": -24.474655151367188, "global_step": 253237, "epoch": 3051} {"train_loss": -24.53189468383789, "global_step": 253238, "epoch": 3051} {"train_loss": -24.796316146850586, "global_step": 253239, "epoch": 3051} {"train_loss": -24.776947021484375, "global_step": 253240, "epoch": 3051} {"train_loss": -24.60994529724121, "global_step": 253241, "epoch": 3051} {"train_loss": -24.78717613220215, "global_step": 253242, "epoch": 3051} {"train_loss": -24.569486618041992, "global_step": 253243, "epoch": 3051} {"train_loss": -24.874906539916992, "global_step": 253244, "epoch": 3051} {"train_loss": -24.804880142211914, "global_step": 253245, "epoch": 3051} {"train_loss": -24.876483917236328, "global_step": 253246, "epoch": 3051} {"train_loss": -24.47564125061035, "global_step": 253247, "epoch": 3051} {"train_loss": -24.565570831298828, "global_step": 253248, "epoch": 3051} {"train_loss": -25.057113647460938, "global_step": 253249, "epoch": 3051} {"train_loss": -24.70882225036621, "global_step": 253250, "epoch": 3051} {"train_loss": -25.257848739624023, "global_step": 253251, "epoch": 3051} {"train_loss": -25.098562240600586, "global_step": 253252, "epoch": 3051} {"train_loss": -24.824491500854492, "global_step": 253253, "epoch": 3051} {"train_loss": -24.696619033813477, "global_step": 253254, "epoch": 3051} {"train_loss": -24.72867202758789, "global_step": 253255, "epoch": 3051} {"train_loss": -25.111879348754883, "global_step": 253256, "epoch": 3051} {"train_loss": -25.204391479492188, "global_step": 253257, "epoch": 3051} {"train_loss": -24.80678939819336, "global_step": 253258, "epoch": 3051} {"train_loss": -25.18941879272461, "global_step": 253259, "epoch": 3051} {"train_loss": -25.003963470458984, "global_step": 253260, "epoch": 3051} {"train_loss": -25.079723358154297, "global_step": 253261, "epoch": 3051} {"train_loss": -25.184865951538086, "global_step": 253262, "epoch": 3051} {"train_loss": -25.189538955688477, "global_step": 253263, "epoch": 3051} {"train_loss": -24.803014755249023, "global_step": 253264, "epoch": 3051} {"train_loss": -25.079465866088867, "global_step": 253265, "epoch": 3051} {"train_loss": -25.353452682495117, "global_step": 253266, "epoch": 3051} {"train_loss": -25.035810470581055, "global_step": 253267, "epoch": 3051} {"train_loss": -24.973501205444336, "global_step": 253268, "epoch": 3051} {"train_loss": -24.849185943603516, "global_step": 253269, "epoch": 3051} {"train_loss": -25.163347244262695, "global_step": 253270, "epoch": 3051} {"train_loss": -25.046571731567383, "global_step": 253271, "epoch": 3051} {"train_loss": -25.295574188232422, "global_step": 253272, "epoch": 3051} {"train_loss": -25.054977416992188, "global_step": 253273, "epoch": 3051} {"train_loss": -25.420576095581055, "global_step": 253274, "epoch": 3051} {"train_loss": -25.031641006469727, "global_step": 253275, "epoch": 3051} {"train_loss": -25.11332130432129, "global_step": 253276, "epoch": 3051} {"train_loss": -25.241209030151367, "global_step": 253277, "epoch": 3051} {"train_loss": -24.98116111755371, "global_step": 253278, "epoch": 3051} {"train_loss": -25.126047134399414, "global_step": 253279, "epoch": 3051} {"train_loss": -24.998722076416016, "global_step": 253280, "epoch": 3051} {"train_loss": -24.578800201416016, "global_step": 253281, "epoch": 3051} {"train_loss": -25.16118812561035, "global_step": 253282, "epoch": 3051} {"train_loss": -24.935264587402344, "global_step": 253283, "epoch": 3051} {"train_loss": -25.35213279724121, "global_step": 253284, "epoch": 3051} {"train_loss": -24.981443405151367, "global_step": 253285, "epoch": 3051} {"train_loss": -25.04871940612793, "global_step": 253286, "epoch": 3051} {"train_loss": -25.316007614135742, "global_step": 253287, "epoch": 3051} {"train_loss": -25.129995346069336, "global_step": 253288, "epoch": 3051} {"train_loss": -25.33780860900879, "global_step": 253289, "epoch": 3051} {"train_loss": -24.921998977661133, "global_step": 253290, "epoch": 3051} {"train_loss": -24.866586685180664, "global_step": 253291, "epoch": 3051} {"train_loss": -24.74677848815918, "global_step": 253292, "epoch": 3051} {"train_loss": -25.303115844726562, "global_step": 253293, "epoch": 3051} {"train_loss": -25.174184799194336, "global_step": 253294, "epoch": 3051} {"train_loss": -24.888593673706055, "global_step": 253295, "epoch": 3051} {"train_loss": -24.87556266784668, "global_step": 253296, "epoch": 3051} {"train_loss": -25.288700103759766, "global_step": 253297, "epoch": 3051} {"train_loss": -25.192461013793945, "global_step": 253298, "epoch": 3051} {"train_loss": -25.304061889648438, "global_step": 253299, "epoch": 3051} {"train_loss": -25.21929931640625, "global_step": 253300, "epoch": 3051} {"train_loss": -24.89950942993164, "global_step": 253301, "epoch": 3051} {"train_loss": -24.761465072631836, "global_step": 253302, "epoch": 3051} {"train_loss": -25.213964462280273, "global_step": 253303, "epoch": 3051} {"train_loss": -25.109582901000977, "global_step": 253304, "epoch": 3051} {"train_loss": -25.283445358276367, "global_step": 253305, "epoch": 3051} {"train_loss": -25.134841918945312, "global_step": 253306, "epoch": 3051} {"train_loss": -24.632917404174805, "global_step": 253307, "epoch": 3051} {"train_loss": -24.84227180480957, "global_step": 253308, "epoch": 3051} {"train_loss": -24.935850143432617, "global_step": 253309, "epoch": 3051} {"train_loss": -25.393932342529297, "global_step": 253310, "epoch": 3051} {"train_loss": -25.215063095092773, "global_step": 253311, "epoch": 3051} {"train_loss": -25.1192569732666, "global_step": 253312, "epoch": 3051} {"train_loss": -25.360044479370117, "global_step": 253313, "epoch": 3051} {"train_loss": -25.10940933227539, "global_step": 253314, "epoch": 3051} {"train_loss": -24.95733688538333, "global_step": 253315, "epoch": 3051, "val_loss": 6820581.0} {"train_loss": -24.29607582092285, "global_step": 253316, "epoch": 3052} {"train_loss": -23.29193687438965, "global_step": 253317, "epoch": 3052} {"train_loss": -23.831424713134766, "global_step": 253318, "epoch": 3052} {"train_loss": -24.46414566040039, "global_step": 253319, "epoch": 3052} {"train_loss": -23.60302734375, "global_step": 253320, "epoch": 3052} {"train_loss": -24.29619789123535, "global_step": 253321, "epoch": 3052} {"train_loss": -24.078031539916992, "global_step": 253322, "epoch": 3052} {"train_loss": -24.197906494140625, "global_step": 253323, "epoch": 3052} {"train_loss": -24.067014694213867, "global_step": 253324, "epoch": 3052} {"train_loss": -24.06648063659668, "global_step": 253325, "epoch": 3052} {"train_loss": -24.37920570373535, "global_step": 253326, "epoch": 3052} {"train_loss": -24.60329246520996, "global_step": 253327, "epoch": 3052} {"train_loss": -24.35798454284668, "global_step": 253328, "epoch": 3052} {"train_loss": -24.005474090576172, "global_step": 253329, "epoch": 3052} {"train_loss": -24.822229385375977, "global_step": 253330, "epoch": 3052} {"train_loss": -24.668758392333984, "global_step": 253331, "epoch": 3052} {"train_loss": -24.50139808654785, "global_step": 253332, "epoch": 3052} {"train_loss": -24.47846031188965, "global_step": 253333, "epoch": 3052} {"train_loss": -24.53751564025879, "global_step": 253334, "epoch": 3052} {"train_loss": -24.956119537353516, "global_step": 253335, "epoch": 3052} {"train_loss": -24.521183013916016, "global_step": 253336, "epoch": 3052} {"train_loss": -25.1706600189209, "global_step": 253337, "epoch": 3052} {"train_loss": -24.701879501342773, "global_step": 253338, "epoch": 3052} {"train_loss": -24.65549087524414, "global_step": 253339, "epoch": 3052} {"train_loss": -24.956411361694336, "global_step": 253340, "epoch": 3052} {"train_loss": -24.84358787536621, "global_step": 253341, "epoch": 3052} {"train_loss": -24.788145065307617, "global_step": 253342, "epoch": 3052} {"train_loss": -24.79249382019043, "global_step": 253343, "epoch": 3052} {"train_loss": -24.69797134399414, "global_step": 253344, "epoch": 3052} {"train_loss": -25.233606338500977, "global_step": 253345, "epoch": 3052} {"train_loss": -25.235689163208008, "global_step": 253346, "epoch": 3052} {"train_loss": -25.4810791015625, "global_step": 253347, "epoch": 3052} {"train_loss": -24.845396041870117, "global_step": 253348, "epoch": 3052} {"train_loss": -24.967430114746094, "global_step": 253349, "epoch": 3052} {"train_loss": -24.902990341186523, "global_step": 253350, "epoch": 3052} {"train_loss": -25.015296936035156, "global_step": 253351, "epoch": 3052} {"train_loss": -24.90635108947754, "global_step": 253352, "epoch": 3052} {"train_loss": -25.260732650756836, "global_step": 253353, "epoch": 3052} {"train_loss": -25.092849731445312, "global_step": 253354, "epoch": 3052} {"train_loss": -24.871347427368164, "global_step": 253355, "epoch": 3052} {"train_loss": -24.961545944213867, "global_step": 253356, "epoch": 3052} {"train_loss": -25.25489616394043, "global_step": 253357, "epoch": 3052} {"train_loss": -25.26959800720215, "global_step": 253358, "epoch": 3052} {"train_loss": -25.1991024017334, "global_step": 253359, "epoch": 3052} {"train_loss": -25.424915313720703, "global_step": 253360, "epoch": 3052} {"train_loss": -25.415605545043945, "global_step": 253361, "epoch": 3052} {"train_loss": -25.01201820373535, "global_step": 253362, "epoch": 3052} {"train_loss": -25.52870750427246, "global_step": 253363, "epoch": 3052} {"train_loss": -25.20018768310547, "global_step": 253364, "epoch": 3052} {"train_loss": -24.90791130065918, "global_step": 253365, "epoch": 3052} {"train_loss": -25.03134536743164, "global_step": 253366, "epoch": 3052} {"train_loss": -24.972475051879883, "global_step": 253367, "epoch": 3052} {"train_loss": -25.127918243408203, "global_step": 253368, "epoch": 3052} {"train_loss": -25.188859939575195, "global_step": 253369, "epoch": 3052} {"train_loss": -24.901565551757812, "global_step": 253370, "epoch": 3052} {"train_loss": -25.022218704223633, "global_step": 253371, "epoch": 3052} {"train_loss": -24.781543731689453, "global_step": 253372, "epoch": 3052} {"train_loss": -24.967260360717773, "global_step": 253373, "epoch": 3052} {"train_loss": -25.235401153564453, "global_step": 253374, "epoch": 3052} {"train_loss": -25.15631103515625, "global_step": 253375, "epoch": 3052} {"train_loss": -25.184112548828125, "global_step": 253376, "epoch": 3052} {"train_loss": -25.715906143188477, "global_step": 253377, "epoch": 3052} {"train_loss": -24.72564697265625, "global_step": 253378, "epoch": 3052} {"train_loss": -25.459928512573242, "global_step": 253379, "epoch": 3052} {"train_loss": -24.915250778198242, "global_step": 253380, "epoch": 3052} {"train_loss": -24.55147933959961, "global_step": 253381, "epoch": 3052} {"train_loss": -25.239534378051758, "global_step": 253382, "epoch": 3052} {"train_loss": -25.01247215270996, "global_step": 253383, "epoch": 3052} {"train_loss": -24.96199607849121, "global_step": 253384, "epoch": 3052} {"train_loss": -24.906408309936523, "global_step": 253385, "epoch": 3052} {"train_loss": -25.254549026489258, "global_step": 253386, "epoch": 3052} {"train_loss": -24.958541870117188, "global_step": 253387, "epoch": 3052} {"train_loss": -24.839929580688477, "global_step": 253388, "epoch": 3052} {"train_loss": -24.817895889282227, "global_step": 253389, "epoch": 3052} {"train_loss": -24.815570831298828, "global_step": 253390, "epoch": 3052} {"train_loss": -25.000883102416992, "global_step": 253391, "epoch": 3052} {"train_loss": -24.66844940185547, "global_step": 253392, "epoch": 3052} {"train_loss": -25.113914489746094, "global_step": 253393, "epoch": 3052} {"train_loss": -24.9041805267334, "global_step": 253394, "epoch": 3052} {"train_loss": -24.908267974853516, "global_step": 253395, "epoch": 3052} {"train_loss": -25.122554779052734, "global_step": 253396, "epoch": 3052} {"train_loss": -24.689014434814453, "global_step": 253397, "epoch": 3052} {"train_loss": -24.844692758767003, "global_step": 253398, "epoch": 3052, "val_loss": 6855291.0} {"train_loss": -25.09969139099121, "global_step": 253399, "epoch": 3053} {"train_loss": -24.81644058227539, "global_step": 253400, "epoch": 3053} {"train_loss": -25.026456832885742, "global_step": 253401, "epoch": 3053} {"train_loss": -24.64955711364746, "global_step": 253402, "epoch": 3053} {"train_loss": -24.554351806640625, "global_step": 253403, "epoch": 3053} {"train_loss": -24.42403793334961, "global_step": 253404, "epoch": 3053} {"train_loss": -24.755664825439453, "global_step": 253405, "epoch": 3053} {"train_loss": -24.615671157836914, "global_step": 253406, "epoch": 3053} {"train_loss": -24.8797607421875, "global_step": 253407, "epoch": 3053} {"train_loss": -24.856468200683594, "global_step": 253408, "epoch": 3053} {"train_loss": -24.926633834838867, "global_step": 253409, "epoch": 3053} {"train_loss": -25.115951538085938, "global_step": 253410, "epoch": 3053} {"train_loss": -25.157339096069336, "global_step": 253411, "epoch": 3053} {"train_loss": -24.820215225219727, "global_step": 253412, "epoch": 3053} {"train_loss": -24.871307373046875, "global_step": 253413, "epoch": 3053} {"train_loss": -25.135547637939453, "global_step": 253414, "epoch": 3053} {"train_loss": -24.896484375, "global_step": 253415, "epoch": 3053} {"train_loss": -24.595245361328125, "global_step": 253416, "epoch": 3053} {"train_loss": -24.998945236206055, "global_step": 253417, "epoch": 3053} {"train_loss": -25.22323989868164, "global_step": 253418, "epoch": 3053} {"train_loss": -25.113561630249023, "global_step": 253419, "epoch": 3053} {"train_loss": -24.95145034790039, "global_step": 253420, "epoch": 3053} {"train_loss": -25.31224250793457, "global_step": 253421, "epoch": 3053} {"train_loss": -25.0631160736084, "global_step": 253422, "epoch": 3053} {"train_loss": -25.160757064819336, "global_step": 253423, "epoch": 3053} {"train_loss": -25.424259185791016, "global_step": 253424, "epoch": 3053} {"train_loss": -24.996719360351562, "global_step": 253425, "epoch": 3053} {"train_loss": -25.003040313720703, "global_step": 253426, "epoch": 3053} {"train_loss": -25.226242065429688, "global_step": 253427, "epoch": 3053} {"train_loss": -24.88910675048828, "global_step": 253428, "epoch": 3053} {"train_loss": -25.066390991210938, "global_step": 253429, "epoch": 3053} {"train_loss": -25.372264862060547, "global_step": 253430, "epoch": 3053} {"train_loss": -25.11092185974121, "global_step": 253431, "epoch": 3053} {"train_loss": -25.192472457885742, "global_step": 253432, "epoch": 3053} {"train_loss": -24.963285446166992, "global_step": 253433, "epoch": 3053} {"train_loss": -25.011260986328125, "global_step": 253434, "epoch": 3053} {"train_loss": -24.617300033569336, "global_step": 253435, "epoch": 3053} {"train_loss": -24.867834091186523, "global_step": 253436, "epoch": 3053} {"train_loss": -24.818117141723633, "global_step": 253437, "epoch": 3053} {"train_loss": -25.09177017211914, "global_step": 253438, "epoch": 3053} {"train_loss": -25.3397274017334, "global_step": 253439, "epoch": 3053} {"train_loss": -25.047788619995117, "global_step": 253440, "epoch": 3053} {"train_loss": -25.421070098876953, "global_step": 253441, "epoch": 3053} {"train_loss": -25.52033042907715, "global_step": 253442, "epoch": 3053} {"train_loss": -24.953718185424805, "global_step": 253443, "epoch": 3053} {"train_loss": -25.09865379333496, "global_step": 253444, "epoch": 3053} {"train_loss": -25.04678726196289, "global_step": 253445, "epoch": 3053} {"train_loss": -25.12047576904297, "global_step": 253446, "epoch": 3053} {"train_loss": -25.480472564697266, "global_step": 253447, "epoch": 3053} {"train_loss": -25.279621124267578, "global_step": 253448, "epoch": 3053} {"train_loss": -24.962390899658203, "global_step": 253449, "epoch": 3053} {"train_loss": -25.305587768554688, "global_step": 253450, "epoch": 3053} {"train_loss": -24.85384178161621, "global_step": 253451, "epoch": 3053} {"train_loss": -24.83322525024414, "global_step": 253452, "epoch": 3053} {"train_loss": -25.084304809570312, "global_step": 253453, "epoch": 3053} {"train_loss": -25.206409454345703, "global_step": 253454, "epoch": 3053} {"train_loss": -25.091421127319336, "global_step": 253455, "epoch": 3053} {"train_loss": -24.688161849975586, "global_step": 253456, "epoch": 3053} {"train_loss": -24.734954833984375, "global_step": 253457, "epoch": 3053} {"train_loss": -25.428647994995117, "global_step": 253458, "epoch": 3053} {"train_loss": -24.6175594329834, "global_step": 253459, "epoch": 3053} {"train_loss": -25.12590980529785, "global_step": 253460, "epoch": 3053} {"train_loss": -24.99700927734375, "global_step": 253461, "epoch": 3053} {"train_loss": -25.25459098815918, "global_step": 253462, "epoch": 3053} {"train_loss": -24.86281394958496, "global_step": 253463, "epoch": 3053} {"train_loss": -25.148025512695312, "global_step": 253464, "epoch": 3053} {"train_loss": -25.25699234008789, "global_step": 253465, "epoch": 3053} {"train_loss": -25.184934616088867, "global_step": 253466, "epoch": 3053} {"train_loss": -25.27126121520996, "global_step": 253467, "epoch": 3053} {"train_loss": -25.19877052307129, "global_step": 253468, "epoch": 3053} {"train_loss": -25.09649085998535, "global_step": 253469, "epoch": 3053} {"train_loss": -25.052270889282227, "global_step": 253470, "epoch": 3053} {"train_loss": -25.331838607788086, "global_step": 253471, "epoch": 3053} {"train_loss": -25.167850494384766, "global_step": 253472, "epoch": 3053} {"train_loss": -25.10560417175293, "global_step": 253473, "epoch": 3053} {"train_loss": -25.557432174682617, "global_step": 253474, "epoch": 3053} {"train_loss": -24.986770629882812, "global_step": 253475, "epoch": 3053} {"train_loss": -25.34103775024414, "global_step": 253476, "epoch": 3053} {"train_loss": -24.840042114257812, "global_step": 253477, "epoch": 3053} {"train_loss": -24.966976165771484, "global_step": 253478, "epoch": 3053} {"train_loss": -25.677663803100586, "global_step": 253479, "epoch": 3053} {"train_loss": -25.066574096679688, "global_step": 253480, "epoch": 3053} {"train_loss": -25.039834769375354, "global_step": 253481, "epoch": 3053, "val_loss": 6835342.0} {"train_loss": -24.784391403198242, "global_step": 253482, "epoch": 3054} {"train_loss": -24.141822814941406, "global_step": 253483, "epoch": 3054} {"train_loss": -24.45353126525879, "global_step": 253484, "epoch": 3054} {"train_loss": -24.549360275268555, "global_step": 253485, "epoch": 3054} {"train_loss": -24.16720962524414, "global_step": 253486, "epoch": 3054} {"train_loss": -24.547977447509766, "global_step": 253487, "epoch": 3054} {"train_loss": -24.74684715270996, "global_step": 253488, "epoch": 3054} {"train_loss": -24.600034713745117, "global_step": 253489, "epoch": 3054} {"train_loss": -24.564844131469727, "global_step": 253490, "epoch": 3054} {"train_loss": -24.514739990234375, "global_step": 253491, "epoch": 3054} {"train_loss": -24.78080940246582, "global_step": 253492, "epoch": 3054} {"train_loss": -24.56172752380371, "global_step": 253493, "epoch": 3054} {"train_loss": -24.97730827331543, "global_step": 253494, "epoch": 3054} {"train_loss": -24.689285278320312, "global_step": 253495, "epoch": 3054} {"train_loss": -24.817867279052734, "global_step": 253496, "epoch": 3054} {"train_loss": -24.892578125, "global_step": 253497, "epoch": 3054} {"train_loss": -24.776611328125, "global_step": 253498, "epoch": 3054} {"train_loss": -24.752206802368164, "global_step": 253499, "epoch": 3054} {"train_loss": -25.026525497436523, "global_step": 253500, "epoch": 3054} {"train_loss": -24.813278198242188, "global_step": 253501, "epoch": 3054} {"train_loss": -25.002161026000977, "global_step": 253502, "epoch": 3054} {"train_loss": -25.0076961517334, "global_step": 253503, "epoch": 3054} {"train_loss": -24.677339553833008, "global_step": 253504, "epoch": 3054} {"train_loss": -25.05529022216797, "global_step": 253505, "epoch": 3054} {"train_loss": -24.922748565673828, "global_step": 253506, "epoch": 3054} {"train_loss": -24.777936935424805, "global_step": 253507, "epoch": 3054} {"train_loss": -24.867603302001953, "global_step": 253508, "epoch": 3054} {"train_loss": -24.94632339477539, "global_step": 253509, "epoch": 3054} {"train_loss": -25.281982421875, "global_step": 253510, "epoch": 3054} {"train_loss": -24.734298706054688, "global_step": 253511, "epoch": 3054} {"train_loss": -24.87833023071289, "global_step": 253512, "epoch": 3054} {"train_loss": -24.906949996948242, "global_step": 253513, "epoch": 3054} {"train_loss": -25.613977432250977, "global_step": 253514, "epoch": 3054} {"train_loss": -25.329208374023438, "global_step": 253515, "epoch": 3054} {"train_loss": -25.319509506225586, "global_step": 253516, "epoch": 3054} {"train_loss": -25.096031188964844, "global_step": 253517, "epoch": 3054} {"train_loss": -25.01210594177246, "global_step": 253518, "epoch": 3054} {"train_loss": -25.005651473999023, "global_step": 253519, "epoch": 3054} {"train_loss": -25.548208236694336, "global_step": 253520, "epoch": 3054} {"train_loss": -24.999759674072266, "global_step": 253521, "epoch": 3054} {"train_loss": -25.007984161376953, "global_step": 253522, "epoch": 3054} {"train_loss": -25.098539352416992, "global_step": 253523, "epoch": 3054} {"train_loss": -24.792713165283203, "global_step": 253524, "epoch": 3054} {"train_loss": -24.784948348999023, "global_step": 253525, "epoch": 3054} {"train_loss": -24.92665672302246, "global_step": 253526, "epoch": 3054} {"train_loss": -25.270090103149414, "global_step": 253527, "epoch": 3054} {"train_loss": -25.05803871154785, "global_step": 253528, "epoch": 3054} {"train_loss": -24.88374137878418, "global_step": 253529, "epoch": 3054} {"train_loss": -25.18707847595215, "global_step": 253530, "epoch": 3054} {"train_loss": -25.24924659729004, "global_step": 253531, "epoch": 3054} {"train_loss": -25.1937313079834, "global_step": 253532, "epoch": 3054} {"train_loss": -25.24254035949707, "global_step": 253533, "epoch": 3054} {"train_loss": -25.249521255493164, "global_step": 253534, "epoch": 3054} {"train_loss": -25.106563568115234, "global_step": 253535, "epoch": 3054} {"train_loss": -25.188013076782227, "global_step": 253536, "epoch": 3054} {"train_loss": -25.203306198120117, "global_step": 253537, "epoch": 3054} {"train_loss": -24.322952270507812, "global_step": 253538, "epoch": 3054} {"train_loss": -25.129838943481445, "global_step": 253539, "epoch": 3054} {"train_loss": -25.191043853759766, "global_step": 253540, "epoch": 3054} {"train_loss": -25.400035858154297, "global_step": 253541, "epoch": 3054} {"train_loss": -25.238048553466797, "global_step": 253542, "epoch": 3054} {"train_loss": -24.82979393005371, "global_step": 253543, "epoch": 3054} {"train_loss": -25.181882858276367, "global_step": 253544, "epoch": 3054} {"train_loss": -25.40888214111328, "global_step": 253545, "epoch": 3054} {"train_loss": -24.92793846130371, "global_step": 253546, "epoch": 3054} {"train_loss": -25.16877555847168, "global_step": 253547, "epoch": 3054} {"train_loss": -25.305328369140625, "global_step": 253548, "epoch": 3054} {"train_loss": -25.103628158569336, "global_step": 253549, "epoch": 3054} {"train_loss": -25.273542404174805, "global_step": 253550, "epoch": 3054} {"train_loss": -25.20096206665039, "global_step": 253551, "epoch": 3054} {"train_loss": -25.60671043395996, "global_step": 253552, "epoch": 3054} {"train_loss": -25.286441802978516, "global_step": 253553, "epoch": 3054} {"train_loss": -25.457443237304688, "global_step": 253554, "epoch": 3054} {"train_loss": -25.193410873413086, "global_step": 253555, "epoch": 3054} {"train_loss": -24.900388717651367, "global_step": 253556, "epoch": 3054} {"train_loss": -24.797657012939453, "global_step": 253557, "epoch": 3054} {"train_loss": -24.321645736694336, "global_step": 253558, "epoch": 3054} {"train_loss": -24.86056900024414, "global_step": 253559, "epoch": 3054} {"train_loss": -25.290931701660156, "global_step": 253560, "epoch": 3054} {"train_loss": -24.698816299438477, "global_step": 253561, "epoch": 3054} {"train_loss": -24.710487365722656, "global_step": 253562, "epoch": 3054} {"train_loss": -24.700563430786133, "global_step": 253563, "epoch": 3054} {"train_loss": -24.963252791439196, "global_step": 253564, "epoch": 3054, "val_loss": 6876364.0} {"train_loss": -23.959186553955078, "global_step": 253565, "epoch": 3055} {"train_loss": -24.25318717956543, "global_step": 253566, "epoch": 3055} {"train_loss": -24.85481071472168, "global_step": 253567, "epoch": 3055} {"train_loss": -24.222196578979492, "global_step": 253568, "epoch": 3055} {"train_loss": -24.395835876464844, "global_step": 253569, "epoch": 3055} {"train_loss": -24.69534683227539, "global_step": 253570, "epoch": 3055} {"train_loss": -24.51142120361328, "global_step": 253571, "epoch": 3055} {"train_loss": -24.501220703125, "global_step": 253572, "epoch": 3055} {"train_loss": -24.67547607421875, "global_step": 253573, "epoch": 3055} {"train_loss": -24.611980438232422, "global_step": 253574, "epoch": 3055} {"train_loss": -24.723546981811523, "global_step": 253575, "epoch": 3055} {"train_loss": -24.70277976989746, "global_step": 253576, "epoch": 3055} {"train_loss": -24.732128143310547, "global_step": 253577, "epoch": 3055} {"train_loss": -24.62752342224121, "global_step": 253578, "epoch": 3055} {"train_loss": -24.585058212280273, "global_step": 253579, "epoch": 3055} {"train_loss": -24.62567710876465, "global_step": 253580, "epoch": 3055} {"train_loss": -24.8564510345459, "global_step": 253581, "epoch": 3055} {"train_loss": -24.657007217407227, "global_step": 253582, "epoch": 3055} {"train_loss": -25.004270553588867, "global_step": 253583, "epoch": 3055} {"train_loss": -24.837879180908203, "global_step": 253584, "epoch": 3055} {"train_loss": -25.124204635620117, "global_step": 253585, "epoch": 3055} {"train_loss": -24.953516006469727, "global_step": 253586, "epoch": 3055} {"train_loss": -25.2962703704834, "global_step": 253587, "epoch": 3055} {"train_loss": -25.097095489501953, "global_step": 253588, "epoch": 3055} {"train_loss": -25.2054500579834, "global_step": 253589, "epoch": 3055} {"train_loss": -24.972976684570312, "global_step": 253590, "epoch": 3055} {"train_loss": -25.178333282470703, "global_step": 253591, "epoch": 3055} {"train_loss": -25.280126571655273, "global_step": 253592, "epoch": 3055} {"train_loss": -24.858362197875977, "global_step": 253593, "epoch": 3055} {"train_loss": -25.33416748046875, "global_step": 253594, "epoch": 3055} {"train_loss": -25.208600997924805, "global_step": 253595, "epoch": 3055} {"train_loss": -25.181180953979492, "global_step": 253596, "epoch": 3055} {"train_loss": -24.99823570251465, "global_step": 253597, "epoch": 3055} {"train_loss": -25.186582565307617, "global_step": 253598, "epoch": 3055} {"train_loss": -25.315982818603516, "global_step": 253599, "epoch": 3055} {"train_loss": -25.3154296875, "global_step": 253600, "epoch": 3055} {"train_loss": -25.4619083404541, "global_step": 253601, "epoch": 3055} {"train_loss": -25.079835891723633, "global_step": 253602, "epoch": 3055} {"train_loss": -25.115610122680664, "global_step": 253603, "epoch": 3055} {"train_loss": -24.880361557006836, "global_step": 253604, "epoch": 3055} {"train_loss": -25.492340087890625, "global_step": 253605, "epoch": 3055} {"train_loss": -25.2930908203125, "global_step": 253606, "epoch": 3055} {"train_loss": -25.087387084960938, "global_step": 253607, "epoch": 3055} {"train_loss": -24.9405574798584, "global_step": 253608, "epoch": 3055} {"train_loss": -24.28253746032715, "global_step": 253609, "epoch": 3055} {"train_loss": -22.98138427734375, "global_step": 253610, "epoch": 3055} {"train_loss": -21.37596893310547, "global_step": 253611, "epoch": 3055} {"train_loss": -23.86366081237793, "global_step": 253612, "epoch": 3055} {"train_loss": -23.754919052124023, "global_step": 253613, "epoch": 3055} {"train_loss": -23.564573287963867, "global_step": 253614, "epoch": 3055} {"train_loss": -24.33536148071289, "global_step": 253615, "epoch": 3055} {"train_loss": -23.795169830322266, "global_step": 253616, "epoch": 3055} {"train_loss": -24.49152946472168, "global_step": 253617, "epoch": 3055} {"train_loss": -23.972883224487305, "global_step": 253618, "epoch": 3055} {"train_loss": -24.590316772460938, "global_step": 253619, "epoch": 3055} {"train_loss": -24.292177200317383, "global_step": 253620, "epoch": 3055} {"train_loss": -24.48065948486328, "global_step": 253621, "epoch": 3055} {"train_loss": -24.619665145874023, "global_step": 253622, "epoch": 3055} {"train_loss": -24.580059051513672, "global_step": 253623, "epoch": 3055} {"train_loss": -24.438873291015625, "global_step": 253624, "epoch": 3055} {"train_loss": -24.46209716796875, "global_step": 253625, "epoch": 3055} {"train_loss": -24.27210807800293, "global_step": 253626, "epoch": 3055} {"train_loss": -24.332595825195312, "global_step": 253627, "epoch": 3055} {"train_loss": -24.348224639892578, "global_step": 253628, "epoch": 3055} {"train_loss": -24.331302642822266, "global_step": 253629, "epoch": 3055} {"train_loss": -24.634811401367188, "global_step": 253630, "epoch": 3055} {"train_loss": -24.472537994384766, "global_step": 253631, "epoch": 3055} {"train_loss": -24.54656982421875, "global_step": 253632, "epoch": 3055} {"train_loss": -25.180959701538086, "global_step": 253633, "epoch": 3055} {"train_loss": -25.074987411499023, "global_step": 253634, "epoch": 3055} {"train_loss": -24.881492614746094, "global_step": 253635, "epoch": 3055} {"train_loss": -24.64753532409668, "global_step": 253636, "epoch": 3055} {"train_loss": -24.944873809814453, "global_step": 253637, "epoch": 3055} {"train_loss": -24.47698211669922, "global_step": 253638, "epoch": 3055} {"train_loss": -24.792072296142578, "global_step": 253639, "epoch": 3055} {"train_loss": -24.7589168548584, "global_step": 253640, "epoch": 3055} {"train_loss": -24.771942138671875, "global_step": 253641, "epoch": 3055} {"train_loss": -25.146743774414062, "global_step": 253642, "epoch": 3055} {"train_loss": -24.91468620300293, "global_step": 253643, "epoch": 3055} {"train_loss": -24.935441970825195, "global_step": 253644, "epoch": 3055} {"train_loss": -24.801088333129883, "global_step": 253645, "epoch": 3055} {"train_loss": -25.51339340209961, "global_step": 253646, "epoch": 3055} {"train_loss": -24.673361238226832, "global_step": 253647, "epoch": 3055, "val_loss": 6931636.0} {"train_loss": -24.490732192993164, "global_step": 253648, "epoch": 3056} {"train_loss": -24.795446395874023, "global_step": 253649, "epoch": 3056} {"train_loss": -24.912817001342773, "global_step": 253650, "epoch": 3056} {"train_loss": -24.5262508392334, "global_step": 253651, "epoch": 3056} {"train_loss": -24.75369644165039, "global_step": 253652, "epoch": 3056} {"train_loss": -24.407669067382812, "global_step": 253653, "epoch": 3056} {"train_loss": -24.519742965698242, "global_step": 253654, "epoch": 3056} {"train_loss": -24.77692222595215, "global_step": 253655, "epoch": 3056} {"train_loss": -25.02589988708496, "global_step": 253656, "epoch": 3056} {"train_loss": -24.516630172729492, "global_step": 253657, "epoch": 3056} {"train_loss": -24.909337997436523, "global_step": 253658, "epoch": 3056} {"train_loss": -25.03631591796875, "global_step": 253659, "epoch": 3056} {"train_loss": -24.786352157592773, "global_step": 253660, "epoch": 3056} {"train_loss": -24.97372055053711, "global_step": 253661, "epoch": 3056} {"train_loss": -24.850069046020508, "global_step": 253662, "epoch": 3056} {"train_loss": -25.179630279541016, "global_step": 253663, "epoch": 3056} {"train_loss": -24.926864624023438, "global_step": 253664, "epoch": 3056} {"train_loss": -25.080358505249023, "global_step": 253665, "epoch": 3056} {"train_loss": -24.947463989257812, "global_step": 253666, "epoch": 3056} {"train_loss": -24.932754516601562, "global_step": 253667, "epoch": 3056} {"train_loss": -25.301353454589844, "global_step": 253668, "epoch": 3056} {"train_loss": -24.661602020263672, "global_step": 253669, "epoch": 3056} {"train_loss": -24.702390670776367, "global_step": 253670, "epoch": 3056} {"train_loss": -24.958419799804688, "global_step": 253671, "epoch": 3056} {"train_loss": -25.336652755737305, "global_step": 253672, "epoch": 3056} {"train_loss": -25.38385581970215, "global_step": 253673, "epoch": 3056} {"train_loss": -24.91065216064453, "global_step": 253674, "epoch": 3056} {"train_loss": -25.34151268005371, "global_step": 253675, "epoch": 3056} {"train_loss": -24.956144332885742, "global_step": 253676, "epoch": 3056} {"train_loss": -25.231792449951172, "global_step": 253677, "epoch": 3056} {"train_loss": -25.34651756286621, "global_step": 253678, "epoch": 3056} {"train_loss": -25.363239288330078, "global_step": 253679, "epoch": 3056} {"train_loss": -25.242177963256836, "global_step": 253680, "epoch": 3056} {"train_loss": -25.017620086669922, "global_step": 253681, "epoch": 3056} {"train_loss": -25.141050338745117, "global_step": 253682, "epoch": 3056} {"train_loss": -25.03186798095703, "global_step": 253683, "epoch": 3056} {"train_loss": -25.029279708862305, "global_step": 253684, "epoch": 3056} {"train_loss": -25.167217254638672, "global_step": 253685, "epoch": 3056} {"train_loss": -24.8787841796875, "global_step": 253686, "epoch": 3056} {"train_loss": -25.068470001220703, "global_step": 253687, "epoch": 3056} {"train_loss": -25.162063598632812, "global_step": 253688, "epoch": 3056} {"train_loss": -25.440401077270508, "global_step": 253689, "epoch": 3056} {"train_loss": -25.11634635925293, "global_step": 253690, "epoch": 3056} {"train_loss": -25.039783477783203, "global_step": 253691, "epoch": 3056} {"train_loss": -25.259681701660156, "global_step": 253692, "epoch": 3056} {"train_loss": -24.95448112487793, "global_step": 253693, "epoch": 3056} {"train_loss": -25.12704086303711, "global_step": 253694, "epoch": 3056} {"train_loss": -24.787824630737305, "global_step": 253695, "epoch": 3056} {"train_loss": -25.293140411376953, "global_step": 253696, "epoch": 3056} {"train_loss": -24.888599395751953, "global_step": 253697, "epoch": 3056} {"train_loss": -25.156309127807617, "global_step": 253698, "epoch": 3056} {"train_loss": -25.002246856689453, "global_step": 253699, "epoch": 3056} {"train_loss": -25.246129989624023, "global_step": 253700, "epoch": 3056} {"train_loss": -25.244834899902344, "global_step": 253701, "epoch": 3056} {"train_loss": -24.925369262695312, "global_step": 253702, "epoch": 3056} {"train_loss": -25.357349395751953, "global_step": 253703, "epoch": 3056} {"train_loss": -25.23082733154297, "global_step": 253704, "epoch": 3056} {"train_loss": -24.97492790222168, "global_step": 253705, "epoch": 3056} {"train_loss": -25.354293823242188, "global_step": 253706, "epoch": 3056} {"train_loss": -25.305715560913086, "global_step": 253707, "epoch": 3056} {"train_loss": -25.21272087097168, "global_step": 253708, "epoch": 3056} {"train_loss": -25.198904037475586, "global_step": 253709, "epoch": 3056} {"train_loss": -25.261295318603516, "global_step": 253710, "epoch": 3056} {"train_loss": -25.121572494506836, "global_step": 253711, "epoch": 3056} {"train_loss": -25.2709903717041, "global_step": 253712, "epoch": 3056} {"train_loss": -25.26317024230957, "global_step": 253713, "epoch": 3056} {"train_loss": -25.041349411010742, "global_step": 253714, "epoch": 3056} {"train_loss": -25.3491268157959, "global_step": 253715, "epoch": 3056} {"train_loss": -24.665273666381836, "global_step": 253716, "epoch": 3056} {"train_loss": -25.35419273376465, "global_step": 253717, "epoch": 3056} {"train_loss": -25.062728881835938, "global_step": 253718, "epoch": 3056} {"train_loss": -25.088117599487305, "global_step": 253719, "epoch": 3056} {"train_loss": -25.366323471069336, "global_step": 253720, "epoch": 3056} {"train_loss": -24.677217483520508, "global_step": 253721, "epoch": 3056} {"train_loss": -24.93414306640625, "global_step": 253722, "epoch": 3056} {"train_loss": -24.899686813354492, "global_step": 253723, "epoch": 3056} {"train_loss": -24.928985595703125, "global_step": 253724, "epoch": 3056} {"train_loss": -24.884933471679688, "global_step": 253725, "epoch": 3056} {"train_loss": -24.679636001586914, "global_step": 253726, "epoch": 3056} {"train_loss": -25.38051986694336, "global_step": 253727, "epoch": 3056} {"train_loss": -25.088010787963867, "global_step": 253728, "epoch": 3056} {"train_loss": -24.66179656982422, "global_step": 253729, "epoch": 3056} {"train_loss": -25.048852897552123, "global_step": 253730, "epoch": 3056, "val_loss": 6977949.0} {"train_loss": -23.727645874023438, "global_step": 253731, "epoch": 3057} {"train_loss": -23.04304313659668, "global_step": 253732, "epoch": 3057} {"train_loss": -23.16648292541504, "global_step": 253733, "epoch": 3057} {"train_loss": -24.458471298217773, "global_step": 253734, "epoch": 3057} {"train_loss": -23.638216018676758, "global_step": 253735, "epoch": 3057} {"train_loss": -24.85055923461914, "global_step": 253736, "epoch": 3057} {"train_loss": -24.372207641601562, "global_step": 253737, "epoch": 3057} {"train_loss": -24.29546546936035, "global_step": 253738, "epoch": 3057} {"train_loss": -24.58499526977539, "global_step": 253739, "epoch": 3057} {"train_loss": -24.12623405456543, "global_step": 253740, "epoch": 3057} {"train_loss": -24.441997528076172, "global_step": 253741, "epoch": 3057} {"train_loss": -24.616321563720703, "global_step": 253742, "epoch": 3057} {"train_loss": -24.817243576049805, "global_step": 253743, "epoch": 3057} {"train_loss": -24.97242546081543, "global_step": 253744, "epoch": 3057} {"train_loss": -24.567228317260742, "global_step": 253745, "epoch": 3057} {"train_loss": -24.725778579711914, "global_step": 253746, "epoch": 3057} {"train_loss": -24.357473373413086, "global_step": 253747, "epoch": 3057} {"train_loss": -24.571413040161133, "global_step": 253748, "epoch": 3057} {"train_loss": -25.01932716369629, "global_step": 253749, "epoch": 3057} {"train_loss": -24.922040939331055, "global_step": 253750, "epoch": 3057} {"train_loss": -24.804458618164062, "global_step": 253751, "epoch": 3057} {"train_loss": -24.981842041015625, "global_step": 253752, "epoch": 3057} {"train_loss": -24.753297805786133, "global_step": 253753, "epoch": 3057} {"train_loss": -25.1099910736084, "global_step": 253754, "epoch": 3057} {"train_loss": -25.110822677612305, "global_step": 253755, "epoch": 3057} {"train_loss": -24.808441162109375, "global_step": 253756, "epoch": 3057} {"train_loss": -24.844314575195312, "global_step": 253757, "epoch": 3057} {"train_loss": -25.11227798461914, "global_step": 253758, "epoch": 3057} {"train_loss": -25.17425537109375, "global_step": 253759, "epoch": 3057} {"train_loss": -25.167062759399414, "global_step": 253760, "epoch": 3057} {"train_loss": -25.153654098510742, "global_step": 253761, "epoch": 3057} {"train_loss": -24.982765197753906, "global_step": 253762, "epoch": 3057} {"train_loss": -24.794605255126953, "global_step": 253763, "epoch": 3057} {"train_loss": -25.256338119506836, "global_step": 253764, "epoch": 3057} {"train_loss": -25.11575698852539, "global_step": 253765, "epoch": 3057} {"train_loss": -25.330060958862305, "global_step": 253766, "epoch": 3057} {"train_loss": -25.48752784729004, "global_step": 253767, "epoch": 3057} {"train_loss": -25.16822052001953, "global_step": 253768, "epoch": 3057} {"train_loss": -24.96164894104004, "global_step": 253769, "epoch": 3057} {"train_loss": -25.247055053710938, "global_step": 253770, "epoch": 3057} {"train_loss": -25.20075798034668, "global_step": 253771, "epoch": 3057} {"train_loss": -25.277341842651367, "global_step": 253772, "epoch": 3057} {"train_loss": -25.0214900970459, "global_step": 253773, "epoch": 3057} {"train_loss": -24.90032386779785, "global_step": 253774, "epoch": 3057} {"train_loss": -24.823129653930664, "global_step": 253775, "epoch": 3057} {"train_loss": -25.02799415588379, "global_step": 253776, "epoch": 3057} {"train_loss": -25.01877212524414, "global_step": 253777, "epoch": 3057} {"train_loss": -25.303752899169922, "global_step": 253778, "epoch": 3057} {"train_loss": -25.071975708007812, "global_step": 253779, "epoch": 3057} {"train_loss": -25.272197723388672, "global_step": 253780, "epoch": 3057} {"train_loss": -25.229843139648438, "global_step": 253781, "epoch": 3057} {"train_loss": -25.198368072509766, "global_step": 253782, "epoch": 3057} {"train_loss": -25.101797103881836, "global_step": 253783, "epoch": 3057} {"train_loss": -25.134695053100586, "global_step": 253784, "epoch": 3057} {"train_loss": -24.907766342163086, "global_step": 253785, "epoch": 3057} {"train_loss": -24.90163230895996, "global_step": 253786, "epoch": 3057} {"train_loss": -25.226591110229492, "global_step": 253787, "epoch": 3057} {"train_loss": -25.50901222229004, "global_step": 253788, "epoch": 3057} {"train_loss": -25.053640365600586, "global_step": 253789, "epoch": 3057} {"train_loss": -25.284997940063477, "global_step": 253790, "epoch": 3057} {"train_loss": -25.419355392456055, "global_step": 253791, "epoch": 3057} {"train_loss": -25.48353385925293, "global_step": 253792, "epoch": 3057} {"train_loss": -25.1451473236084, "global_step": 253793, "epoch": 3057} {"train_loss": -25.2492618560791, "global_step": 253794, "epoch": 3057} {"train_loss": -25.530330657958984, "global_step": 253795, "epoch": 3057} {"train_loss": -25.510181427001953, "global_step": 253796, "epoch": 3057} {"train_loss": -25.342233657836914, "global_step": 253797, "epoch": 3057} {"train_loss": -24.91834831237793, "global_step": 253798, "epoch": 3057} {"train_loss": -24.974010467529297, "global_step": 253799, "epoch": 3057} {"train_loss": -24.804777145385742, "global_step": 253800, "epoch": 3057} {"train_loss": -25.176923751831055, "global_step": 253801, "epoch": 3057} {"train_loss": -25.030248641967773, "global_step": 253802, "epoch": 3057} {"train_loss": -25.31789779663086, "global_step": 253803, "epoch": 3057} {"train_loss": -24.913721084594727, "global_step": 253804, "epoch": 3057} {"train_loss": -25.091379165649414, "global_step": 253805, "epoch": 3057} {"train_loss": -24.8985538482666, "global_step": 253806, "epoch": 3057} {"train_loss": -24.663312911987305, "global_step": 253807, "epoch": 3057} {"train_loss": -25.131267547607422, "global_step": 253808, "epoch": 3057} {"train_loss": -24.69582748413086, "global_step": 253809, "epoch": 3057} {"train_loss": -25.14388656616211, "global_step": 253810, "epoch": 3057} {"train_loss": -24.688018798828125, "global_step": 253811, "epoch": 3057} {"train_loss": -24.98048973083496, "global_step": 253812, "epoch": 3057} {"train_loss": -24.930413372545356, "global_step": 253813, "epoch": 3057, "val_loss": 6909201.5} {"train_loss": -24.109861373901367, "global_step": 253814, "epoch": 3058} {"train_loss": -24.253149032592773, "global_step": 253815, "epoch": 3058} {"train_loss": -24.620023727416992, "global_step": 253816, "epoch": 3058} {"train_loss": -24.271102905273438, "global_step": 253817, "epoch": 3058} {"train_loss": -24.363569259643555, "global_step": 253818, "epoch": 3058} {"train_loss": -24.220788955688477, "global_step": 253819, "epoch": 3058} {"train_loss": -24.57305145263672, "global_step": 253820, "epoch": 3058} {"train_loss": -24.434127807617188, "global_step": 253821, "epoch": 3058} {"train_loss": -24.3587589263916, "global_step": 253822, "epoch": 3058} {"train_loss": -24.824647903442383, "global_step": 253823, "epoch": 3058} {"train_loss": -24.447935104370117, "global_step": 253824, "epoch": 3058} {"train_loss": -24.61454200744629, "global_step": 253825, "epoch": 3058} {"train_loss": -24.830270767211914, "global_step": 253826, "epoch": 3058} {"train_loss": -24.782712936401367, "global_step": 253827, "epoch": 3058} {"train_loss": -24.955841064453125, "global_step": 253828, "epoch": 3058} {"train_loss": -24.721120834350586, "global_step": 253829, "epoch": 3058} {"train_loss": -24.693710327148438, "global_step": 253830, "epoch": 3058} {"train_loss": -24.84410285949707, "global_step": 253831, "epoch": 3058} {"train_loss": -24.86203384399414, "global_step": 253832, "epoch": 3058} {"train_loss": -24.63888931274414, "global_step": 253833, "epoch": 3058} {"train_loss": -25.063024520874023, "global_step": 253834, "epoch": 3058} {"train_loss": -24.594324111938477, "global_step": 253835, "epoch": 3058} {"train_loss": -24.692380905151367, "global_step": 253836, "epoch": 3058} {"train_loss": -25.161792755126953, "global_step": 253837, "epoch": 3058} {"train_loss": -25.089553833007812, "global_step": 253838, "epoch": 3058} {"train_loss": -25.234819412231445, "global_step": 253839, "epoch": 3058} {"train_loss": -25.083946228027344, "global_step": 253840, "epoch": 3058} {"train_loss": -25.133895874023438, "global_step": 253841, "epoch": 3058} {"train_loss": -24.932886123657227, "global_step": 253842, "epoch": 3058} {"train_loss": -25.097524642944336, "global_step": 253843, "epoch": 3058} {"train_loss": -25.133596420288086, "global_step": 253844, "epoch": 3058} {"train_loss": -25.242420196533203, "global_step": 253845, "epoch": 3058} {"train_loss": -25.0023250579834, "global_step": 253846, "epoch": 3058} {"train_loss": -24.99226951599121, "global_step": 253847, "epoch": 3058} {"train_loss": -25.218128204345703, "global_step": 253848, "epoch": 3058} {"train_loss": -25.063337326049805, "global_step": 253849, "epoch": 3058} {"train_loss": -24.936037063598633, "global_step": 253850, "epoch": 3058} {"train_loss": -25.117895126342773, "global_step": 253851, "epoch": 3058} {"train_loss": -24.823408126831055, "global_step": 253852, "epoch": 3058} {"train_loss": -25.142358779907227, "global_step": 253853, "epoch": 3058} {"train_loss": -25.5131893157959, "global_step": 253854, "epoch": 3058} {"train_loss": -25.036827087402344, "global_step": 253855, "epoch": 3058} {"train_loss": -25.42313575744629, "global_step": 253856, "epoch": 3058} {"train_loss": -25.24970245361328, "global_step": 253857, "epoch": 3058} {"train_loss": -25.412078857421875, "global_step": 253858, "epoch": 3058} {"train_loss": -25.085086822509766, "global_step": 253859, "epoch": 3058} {"train_loss": -25.018611907958984, "global_step": 253860, "epoch": 3058} {"train_loss": -25.31805992126465, "global_step": 253861, "epoch": 3058} {"train_loss": -25.170011520385742, "global_step": 253862, "epoch": 3058} {"train_loss": -24.6595516204834, "global_step": 253863, "epoch": 3058} {"train_loss": -24.74608612060547, "global_step": 253864, "epoch": 3058} {"train_loss": -25.190866470336914, "global_step": 253865, "epoch": 3058} {"train_loss": -25.204675674438477, "global_step": 253866, "epoch": 3058} {"train_loss": -24.92089080810547, "global_step": 253867, "epoch": 3058} {"train_loss": -24.54537010192871, "global_step": 253868, "epoch": 3058} {"train_loss": -25.25258445739746, "global_step": 253869, "epoch": 3058} {"train_loss": -24.905990600585938, "global_step": 253870, "epoch": 3058} {"train_loss": -25.1142635345459, "global_step": 253871, "epoch": 3058} {"train_loss": -25.139930725097656, "global_step": 253872, "epoch": 3058} {"train_loss": -24.787065505981445, "global_step": 253873, "epoch": 3058} {"train_loss": -24.98740005493164, "global_step": 253874, "epoch": 3058} {"train_loss": -25.291784286499023, "global_step": 253875, "epoch": 3058} {"train_loss": -25.422264099121094, "global_step": 253876, "epoch": 3058} {"train_loss": -24.525896072387695, "global_step": 253877, "epoch": 3058} {"train_loss": -24.792673110961914, "global_step": 253878, "epoch": 3058} {"train_loss": -25.1225643157959, "global_step": 253879, "epoch": 3058} {"train_loss": -24.997974395751953, "global_step": 253880, "epoch": 3058} {"train_loss": -24.94378089904785, "global_step": 253881, "epoch": 3058} {"train_loss": -24.804031372070312, "global_step": 253882, "epoch": 3058} {"train_loss": -25.225934982299805, "global_step": 253883, "epoch": 3058} {"train_loss": -25.0867977142334, "global_step": 253884, "epoch": 3058} {"train_loss": -25.472951889038086, "global_step": 253885, "epoch": 3058} {"train_loss": -25.197580337524414, "global_step": 253886, "epoch": 3058} {"train_loss": -25.283262252807617, "global_step": 253887, "epoch": 3058} {"train_loss": -25.11295509338379, "global_step": 253888, "epoch": 3058} {"train_loss": -25.43501853942871, "global_step": 253889, "epoch": 3058} {"train_loss": -25.034164428710938, "global_step": 253890, "epoch": 3058} {"train_loss": -25.170927047729492, "global_step": 253891, "epoch": 3058} {"train_loss": -25.160457611083984, "global_step": 253892, "epoch": 3058} {"train_loss": -25.35833740234375, "global_step": 253893, "epoch": 3058} {"train_loss": -24.78371810913086, "global_step": 253894, "epoch": 3058} {"train_loss": -24.922422409057617, "global_step": 253895, "epoch": 3058} {"train_loss": -24.94541880596115, "global_step": 253896, "epoch": 3058, "val_loss": 6882552.0} {"train_loss": -24.98395347595215, "global_step": 253897, "epoch": 3059} {"train_loss": -24.85655975341797, "global_step": 253898, "epoch": 3059} {"train_loss": -24.914392471313477, "global_step": 253899, "epoch": 3059} {"train_loss": -24.94330406188965, "global_step": 253900, "epoch": 3059} {"train_loss": -24.825193405151367, "global_step": 253901, "epoch": 3059} {"train_loss": -25.145429611206055, "global_step": 253902, "epoch": 3059} {"train_loss": -24.861637115478516, "global_step": 253903, "epoch": 3059} {"train_loss": -24.62264633178711, "global_step": 253904, "epoch": 3059} {"train_loss": -24.986831665039062, "global_step": 253905, "epoch": 3059} {"train_loss": -25.1517333984375, "global_step": 253906, "epoch": 3059} {"train_loss": -25.12699317932129, "global_step": 253907, "epoch": 3059} {"train_loss": -24.84295082092285, "global_step": 253908, "epoch": 3059} {"train_loss": -25.200956344604492, "global_step": 253909, "epoch": 3059} {"train_loss": -24.975357055664062, "global_step": 253910, "epoch": 3059} {"train_loss": -25.0438289642334, "global_step": 253911, "epoch": 3059} {"train_loss": -24.935863494873047, "global_step": 253912, "epoch": 3059} {"train_loss": -24.90358543395996, "global_step": 253913, "epoch": 3059} {"train_loss": -25.13868522644043, "global_step": 253914, "epoch": 3059} {"train_loss": -25.16839599609375, "global_step": 253915, "epoch": 3059} {"train_loss": -25.04500389099121, "global_step": 253916, "epoch": 3059} {"train_loss": -24.883819580078125, "global_step": 253917, "epoch": 3059} {"train_loss": -25.1937313079834, "global_step": 253918, "epoch": 3059} {"train_loss": -24.55118179321289, "global_step": 253919, "epoch": 3059} {"train_loss": -24.458759307861328, "global_step": 253920, "epoch": 3059} {"train_loss": -24.959915161132812, "global_step": 253921, "epoch": 3059} {"train_loss": -24.734811782836914, "global_step": 253922, "epoch": 3059} {"train_loss": -24.889678955078125, "global_step": 253923, "epoch": 3059} {"train_loss": -24.986677169799805, "global_step": 253924, "epoch": 3059} {"train_loss": -24.9584903717041, "global_step": 253925, "epoch": 3059} {"train_loss": -25.512908935546875, "global_step": 253926, "epoch": 3059} {"train_loss": -24.504526138305664, "global_step": 253927, "epoch": 3059} {"train_loss": -24.55104637145996, "global_step": 253928, "epoch": 3059} {"train_loss": -25.13418960571289, "global_step": 253929, "epoch": 3059} {"train_loss": -25.133638381958008, "global_step": 253930, "epoch": 3059} {"train_loss": -25.038166046142578, "global_step": 253931, "epoch": 3059} {"train_loss": -25.004669189453125, "global_step": 253932, "epoch": 3059} {"train_loss": -24.962173461914062, "global_step": 253933, "epoch": 3059} {"train_loss": -25.072797775268555, "global_step": 253934, "epoch": 3059} {"train_loss": -25.172550201416016, "global_step": 253935, "epoch": 3059} {"train_loss": -25.02313804626465, "global_step": 253936, "epoch": 3059} {"train_loss": -25.123926162719727, "global_step": 253937, "epoch": 3059} {"train_loss": -24.788236618041992, "global_step": 253938, "epoch": 3059} {"train_loss": -24.80158042907715, "global_step": 253939, "epoch": 3059} {"train_loss": -24.780019760131836, "global_step": 253940, "epoch": 3059} {"train_loss": -25.195131301879883, "global_step": 253941, "epoch": 3059} {"train_loss": -25.441850662231445, "global_step": 253942, "epoch": 3059} {"train_loss": -24.86702537536621, "global_step": 253943, "epoch": 3059} {"train_loss": -24.56631851196289, "global_step": 253944, "epoch": 3059} {"train_loss": -25.31475257873535, "global_step": 253945, "epoch": 3059} {"train_loss": -24.973468780517578, "global_step": 253946, "epoch": 3059} {"train_loss": -24.875783920288086, "global_step": 253947, "epoch": 3059} {"train_loss": -25.300662994384766, "global_step": 253948, "epoch": 3059} {"train_loss": -25.266464233398438, "global_step": 253949, "epoch": 3059} {"train_loss": -24.835901260375977, "global_step": 253950, "epoch": 3059} {"train_loss": -25.25568962097168, "global_step": 253951, "epoch": 3059} {"train_loss": -25.09028434753418, "global_step": 253952, "epoch": 3059} {"train_loss": -25.388395309448242, "global_step": 253953, "epoch": 3059} {"train_loss": -25.218313217163086, "global_step": 253954, "epoch": 3059} {"train_loss": -25.148283004760742, "global_step": 253955, "epoch": 3059} {"train_loss": -24.97740364074707, "global_step": 253956, "epoch": 3059} {"train_loss": -25.388410568237305, "global_step": 253957, "epoch": 3059} {"train_loss": -24.74464225769043, "global_step": 253958, "epoch": 3059} {"train_loss": -24.922346115112305, "global_step": 253959, "epoch": 3059} {"train_loss": -25.249195098876953, "global_step": 253960, "epoch": 3059} {"train_loss": -25.163068771362305, "global_step": 253961, "epoch": 3059} {"train_loss": -25.16742515563965, "global_step": 253962, "epoch": 3059} {"train_loss": -25.552587509155273, "global_step": 253963, "epoch": 3059} {"train_loss": -25.19434356689453, "global_step": 253964, "epoch": 3059} {"train_loss": -25.296375274658203, "global_step": 253965, "epoch": 3059} {"train_loss": -25.394437789916992, "global_step": 253966, "epoch": 3059} {"train_loss": -25.024076461791992, "global_step": 253967, "epoch": 3059} {"train_loss": -25.477140426635742, "global_step": 253968, "epoch": 3059} {"train_loss": -25.141233444213867, "global_step": 253969, "epoch": 3059} {"train_loss": -25.080976486206055, "global_step": 253970, "epoch": 3059} {"train_loss": -25.274669647216797, "global_step": 253971, "epoch": 3059} {"train_loss": -25.237939834594727, "global_step": 253972, "epoch": 3059} {"train_loss": -25.042707443237305, "global_step": 253973, "epoch": 3059} {"train_loss": -25.14063835144043, "global_step": 253974, "epoch": 3059} {"train_loss": -25.15203285217285, "global_step": 253975, "epoch": 3059} {"train_loss": -25.100793838500977, "global_step": 253976, "epoch": 3059} {"train_loss": -24.862228393554688, "global_step": 253977, "epoch": 3059} {"train_loss": -25.02010154724121, "global_step": 253978, "epoch": 3059} {"train_loss": -25.030418097254742, "global_step": 253979, "epoch": 3059, "val_loss": 6836063.0} {"train_loss": -24.8931941986084, "global_step": 253980, "epoch": 3060} {"train_loss": -24.117509841918945, "global_step": 253981, "epoch": 3060} {"train_loss": -24.750347137451172, "global_step": 253982, "epoch": 3060} {"train_loss": -24.64371681213379, "global_step": 253983, "epoch": 3060} {"train_loss": -24.6998348236084, "global_step": 253984, "epoch": 3060} {"train_loss": -24.262876510620117, "global_step": 253985, "epoch": 3060} {"train_loss": -25.27223014831543, "global_step": 253986, "epoch": 3060} {"train_loss": -24.55238151550293, "global_step": 253987, "epoch": 3060} {"train_loss": -24.74131202697754, "global_step": 253988, "epoch": 3060} {"train_loss": -24.71720314025879, "global_step": 253989, "epoch": 3060} {"train_loss": -24.929750442504883, "global_step": 253990, "epoch": 3060} {"train_loss": -24.661975860595703, "global_step": 253991, "epoch": 3060} {"train_loss": -24.88937759399414, "global_step": 253992, "epoch": 3060} {"train_loss": -24.57819175720215, "global_step": 253993, "epoch": 3060} {"train_loss": -24.582015991210938, "global_step": 253994, "epoch": 3060} {"train_loss": -24.947086334228516, "global_step": 253995, "epoch": 3060} {"train_loss": -24.628721237182617, "global_step": 253996, "epoch": 3060} {"train_loss": -25.001333236694336, "global_step": 253997, "epoch": 3060} {"train_loss": -24.677820205688477, "global_step": 253998, "epoch": 3060} {"train_loss": -24.648147583007812, "global_step": 253999, "epoch": 3060} {"train_loss": -24.866918563842773, "global_step": 254000, "epoch": 3060} {"train_loss": -24.78084373474121, "global_step": 254001, "epoch": 3060} {"train_loss": -25.200366973876953, "global_step": 254002, "epoch": 3060} {"train_loss": -25.120100021362305, "global_step": 254003, "epoch": 3060} {"train_loss": -24.825302124023438, "global_step": 254004, "epoch": 3060} {"train_loss": -24.64277458190918, "global_step": 254005, "epoch": 3060} {"train_loss": -24.973983764648438, "global_step": 254006, "epoch": 3060} {"train_loss": -24.81666374206543, "global_step": 254007, "epoch": 3060} {"train_loss": -24.836027145385742, "global_step": 254008, "epoch": 3060} {"train_loss": -25.094266891479492, "global_step": 254009, "epoch": 3060} {"train_loss": -25.020605087280273, "global_step": 254010, "epoch": 3060} {"train_loss": -24.791040420532227, "global_step": 254011, "epoch": 3060} {"train_loss": -24.929658889770508, "global_step": 254012, "epoch": 3060} {"train_loss": -25.18749237060547, "global_step": 254013, "epoch": 3060} {"train_loss": -25.036447525024414, "global_step": 254014, "epoch": 3060} {"train_loss": -25.221731185913086, "global_step": 254015, "epoch": 3060} {"train_loss": -25.078876495361328, "global_step": 254016, "epoch": 3060} {"train_loss": -25.166593551635742, "global_step": 254017, "epoch": 3060} {"train_loss": -24.988195419311523, "global_step": 254018, "epoch": 3060} {"train_loss": -25.15282440185547, "global_step": 254019, "epoch": 3060} {"train_loss": -25.190811157226562, "global_step": 254020, "epoch": 3060} {"train_loss": -25.089033126831055, "global_step": 254021, "epoch": 3060} {"train_loss": -24.960102081298828, "global_step": 254022, "epoch": 3060} {"train_loss": -25.16303825378418, "global_step": 254023, "epoch": 3060} {"train_loss": -24.96906089782715, "global_step": 254024, "epoch": 3060} {"train_loss": -25.349702835083008, "global_step": 254025, "epoch": 3060} {"train_loss": -25.13033103942871, "global_step": 254026, "epoch": 3060} {"train_loss": -25.124820709228516, "global_step": 254027, "epoch": 3060} {"train_loss": -25.20538330078125, "global_step": 254028, "epoch": 3060} {"train_loss": -24.735971450805664, "global_step": 254029, "epoch": 3060} {"train_loss": -24.97348976135254, "global_step": 254030, "epoch": 3060} {"train_loss": -25.074430465698242, "global_step": 254031, "epoch": 3060} {"train_loss": -24.877182006835938, "global_step": 254032, "epoch": 3060} {"train_loss": -24.640104293823242, "global_step": 254033, "epoch": 3060} {"train_loss": -24.448877334594727, "global_step": 254034, "epoch": 3060} {"train_loss": -24.712894439697266, "global_step": 254035, "epoch": 3060} {"train_loss": -24.865760803222656, "global_step": 254036, "epoch": 3060} {"train_loss": -24.590572357177734, "global_step": 254037, "epoch": 3060} {"train_loss": -25.35115623474121, "global_step": 254038, "epoch": 3060} {"train_loss": -24.88039779663086, "global_step": 254039, "epoch": 3060} {"train_loss": -25.190160751342773, "global_step": 254040, "epoch": 3060} {"train_loss": -24.958053588867188, "global_step": 254041, "epoch": 3060} {"train_loss": -24.708866119384766, "global_step": 254042, "epoch": 3060} {"train_loss": -24.712966918945312, "global_step": 254043, "epoch": 3060} {"train_loss": -25.036558151245117, "global_step": 254044, "epoch": 3060} {"train_loss": -25.217987060546875, "global_step": 254045, "epoch": 3060} {"train_loss": -25.226022720336914, "global_step": 254046, "epoch": 3060} {"train_loss": -24.950803756713867, "global_step": 254047, "epoch": 3060} {"train_loss": -24.830453872680664, "global_step": 254048, "epoch": 3060} {"train_loss": -24.98458480834961, "global_step": 254049, "epoch": 3060} {"train_loss": -24.922901153564453, "global_step": 254050, "epoch": 3060} {"train_loss": -24.857595443725586, "global_step": 254051, "epoch": 3060} {"train_loss": -25.177757263183594, "global_step": 254052, "epoch": 3060} {"train_loss": -25.329912185668945, "global_step": 254053, "epoch": 3060} {"train_loss": -25.359405517578125, "global_step": 254054, "epoch": 3060} {"train_loss": -25.034421920776367, "global_step": 254055, "epoch": 3060} {"train_loss": -25.28628921508789, "global_step": 254056, "epoch": 3060} {"train_loss": -24.74952507019043, "global_step": 254057, "epoch": 3060} {"train_loss": -25.119787216186523, "global_step": 254058, "epoch": 3060} {"train_loss": -25.271270751953125, "global_step": 254059, "epoch": 3060} {"train_loss": -25.360124588012695, "global_step": 254060, "epoch": 3060} {"train_loss": -24.94593620300293, "global_step": 254061, "epoch": 3060} {"train_loss": -24.916641304291876, "global_step": 254062, "epoch": 3060, "val_loss": 6980315.0} {"train_loss": -24.690338134765625, "global_step": 254063, "epoch": 3061} {"train_loss": -24.14626121520996, "global_step": 254064, "epoch": 3061} {"train_loss": -24.55777931213379, "global_step": 254065, "epoch": 3061} {"train_loss": -24.45539093017578, "global_step": 254066, "epoch": 3061} {"train_loss": -24.685684204101562, "global_step": 254067, "epoch": 3061} {"train_loss": -24.19693946838379, "global_step": 254068, "epoch": 3061} {"train_loss": -24.8142032623291, "global_step": 254069, "epoch": 3061} {"train_loss": -24.307861328125, "global_step": 254070, "epoch": 3061} {"train_loss": -24.39463233947754, "global_step": 254071, "epoch": 3061} {"train_loss": -24.79792594909668, "global_step": 254072, "epoch": 3061} {"train_loss": -24.4655704498291, "global_step": 254073, "epoch": 3061} {"train_loss": -24.643634796142578, "global_step": 254074, "epoch": 3061} {"train_loss": -25.087051391601562, "global_step": 254075, "epoch": 3061} {"train_loss": -24.930709838867188, "global_step": 254076, "epoch": 3061} {"train_loss": -24.441070556640625, "global_step": 254077, "epoch": 3061} {"train_loss": -24.735986709594727, "global_step": 254078, "epoch": 3061} {"train_loss": -24.766651153564453, "global_step": 254079, "epoch": 3061} {"train_loss": -25.120651245117188, "global_step": 254080, "epoch": 3061} {"train_loss": -24.797399520874023, "global_step": 254081, "epoch": 3061} {"train_loss": -24.665023803710938, "global_step": 254082, "epoch": 3061} {"train_loss": -24.423738479614258, "global_step": 254083, "epoch": 3061} {"train_loss": -24.92768669128418, "global_step": 254084, "epoch": 3061} {"train_loss": -25.07538414001465, "global_step": 254085, "epoch": 3061} {"train_loss": -24.663867950439453, "global_step": 254086, "epoch": 3061} {"train_loss": -25.206993103027344, "global_step": 254087, "epoch": 3061} {"train_loss": -24.72706413269043, "global_step": 254088, "epoch": 3061} {"train_loss": -24.5780086517334, "global_step": 254089, "epoch": 3061} {"train_loss": -24.927610397338867, "global_step": 254090, "epoch": 3061} {"train_loss": -24.77802085876465, "global_step": 254091, "epoch": 3061} {"train_loss": -25.383901596069336, "global_step": 254092, "epoch": 3061} {"train_loss": -24.984838485717773, "global_step": 254093, "epoch": 3061} {"train_loss": -24.737319946289062, "global_step": 254094, "epoch": 3061} {"train_loss": -24.972639083862305, "global_step": 254095, "epoch": 3061} {"train_loss": -24.89410400390625, "global_step": 254096, "epoch": 3061} {"train_loss": -24.970237731933594, "global_step": 254097, "epoch": 3061} {"train_loss": -24.6177921295166, "global_step": 254098, "epoch": 3061} {"train_loss": -24.906042098999023, "global_step": 254099, "epoch": 3061} {"train_loss": -24.854894638061523, "global_step": 254100, "epoch": 3061} {"train_loss": -24.962066650390625, "global_step": 254101, "epoch": 3061} {"train_loss": -24.895978927612305, "global_step": 254102, "epoch": 3061} {"train_loss": -24.867536544799805, "global_step": 254103, "epoch": 3061} {"train_loss": -24.764358520507812, "global_step": 254104, "epoch": 3061} {"train_loss": -25.17087173461914, "global_step": 254105, "epoch": 3061} {"train_loss": -24.84889030456543, "global_step": 254106, "epoch": 3061} {"train_loss": -25.3333740234375, "global_step": 254107, "epoch": 3061} {"train_loss": -25.04189109802246, "global_step": 254108, "epoch": 3061} {"train_loss": -24.7552547454834, "global_step": 254109, "epoch": 3061} {"train_loss": -25.141408920288086, "global_step": 254110, "epoch": 3061} {"train_loss": -24.935333251953125, "global_step": 254111, "epoch": 3061} {"train_loss": -25.171607971191406, "global_step": 254112, "epoch": 3061} {"train_loss": -25.34340476989746, "global_step": 254113, "epoch": 3061} {"train_loss": -24.8772029876709, "global_step": 254114, "epoch": 3061} {"train_loss": -24.860458374023438, "global_step": 254115, "epoch": 3061} {"train_loss": -25.107471466064453, "global_step": 254116, "epoch": 3061} {"train_loss": -24.918750762939453, "global_step": 254117, "epoch": 3061} {"train_loss": -25.549901962280273, "global_step": 254118, "epoch": 3061} {"train_loss": -24.96320915222168, "global_step": 254119, "epoch": 3061} {"train_loss": -25.341461181640625, "global_step": 254120, "epoch": 3061} {"train_loss": -25.19904136657715, "global_step": 254121, "epoch": 3061} {"train_loss": -25.36136245727539, "global_step": 254122, "epoch": 3061} {"train_loss": -25.127065658569336, "global_step": 254123, "epoch": 3061} {"train_loss": -24.53127098083496, "global_step": 254124, "epoch": 3061} {"train_loss": -24.822933197021484, "global_step": 254125, "epoch": 3061} {"train_loss": -24.501178741455078, "global_step": 254126, "epoch": 3061} {"train_loss": -24.66529655456543, "global_step": 254127, "epoch": 3061} {"train_loss": -25.11859703063965, "global_step": 254128, "epoch": 3061} {"train_loss": -24.76352310180664, "global_step": 254129, "epoch": 3061} {"train_loss": -24.65657615661621, "global_step": 254130, "epoch": 3061} {"train_loss": -24.900806427001953, "global_step": 254131, "epoch": 3061} {"train_loss": -24.65635108947754, "global_step": 254132, "epoch": 3061} {"train_loss": -24.719993591308594, "global_step": 254133, "epoch": 3061} {"train_loss": -24.875791549682617, "global_step": 254134, "epoch": 3061} {"train_loss": -24.895063400268555, "global_step": 254135, "epoch": 3061} {"train_loss": -24.741260528564453, "global_step": 254136, "epoch": 3061} {"train_loss": -25.017446517944336, "global_step": 254137, "epoch": 3061} {"train_loss": -24.99749755859375, "global_step": 254138, "epoch": 3061} {"train_loss": -25.02265167236328, "global_step": 254139, "epoch": 3061} {"train_loss": -25.01767349243164, "global_step": 254140, "epoch": 3061} {"train_loss": -24.865249633789062, "global_step": 254141, "epoch": 3061} {"train_loss": -24.576976776123047, "global_step": 254142, "epoch": 3061} {"train_loss": -25.070980072021484, "global_step": 254143, "epoch": 3061} {"train_loss": -24.906484603881836, "global_step": 254144, "epoch": 3061} {"train_loss": -24.836521746164344, "global_step": 254145, "epoch": 3061, "val_loss": 6818211.0} {"train_loss": -24.652280807495117, "global_step": 254146, "epoch": 3062} {"train_loss": -24.435733795166016, "global_step": 254147, "epoch": 3062} {"train_loss": -24.56903648376465, "global_step": 254148, "epoch": 3062} {"train_loss": -24.817325592041016, "global_step": 254149, "epoch": 3062} {"train_loss": -24.637971878051758, "global_step": 254150, "epoch": 3062} {"train_loss": -24.655208587646484, "global_step": 254151, "epoch": 3062} {"train_loss": -24.571186065673828, "global_step": 254152, "epoch": 3062} {"train_loss": -24.640731811523438, "global_step": 254153, "epoch": 3062} {"train_loss": -25.088577270507812, "global_step": 254154, "epoch": 3062} {"train_loss": -25.185148239135742, "global_step": 254155, "epoch": 3062} {"train_loss": -25.11885643005371, "global_step": 254156, "epoch": 3062} {"train_loss": -24.8354549407959, "global_step": 254157, "epoch": 3062} {"train_loss": -24.75713539123535, "global_step": 254158, "epoch": 3062} {"train_loss": -24.716821670532227, "global_step": 254159, "epoch": 3062} {"train_loss": -25.06175994873047, "global_step": 254160, "epoch": 3062} {"train_loss": -24.568756103515625, "global_step": 254161, "epoch": 3062} {"train_loss": -24.869718551635742, "global_step": 254162, "epoch": 3062} {"train_loss": -25.220977783203125, "global_step": 254163, "epoch": 3062} {"train_loss": -25.44913101196289, "global_step": 254164, "epoch": 3062} {"train_loss": -25.07950782775879, "global_step": 254165, "epoch": 3062} {"train_loss": -25.111011505126953, "global_step": 254166, "epoch": 3062} {"train_loss": -24.717573165893555, "global_step": 254167, "epoch": 3062} {"train_loss": -25.20124626159668, "global_step": 254168, "epoch": 3062} {"train_loss": -25.296293258666992, "global_step": 254169, "epoch": 3062} {"train_loss": -24.788715362548828, "global_step": 254170, "epoch": 3062} {"train_loss": -25.092788696289062, "global_step": 254171, "epoch": 3062} {"train_loss": -24.964651107788086, "global_step": 254172, "epoch": 3062} {"train_loss": -25.176883697509766, "global_step": 254173, "epoch": 3062} {"train_loss": -25.54058074951172, "global_step": 254174, "epoch": 3062} {"train_loss": -25.035070419311523, "global_step": 254175, "epoch": 3062} {"train_loss": -25.260351181030273, "global_step": 254176, "epoch": 3062} {"train_loss": -25.252164840698242, "global_step": 254177, "epoch": 3062} {"train_loss": -24.795089721679688, "global_step": 254178, "epoch": 3062} {"train_loss": -25.366971969604492, "global_step": 254179, "epoch": 3062} {"train_loss": -25.187744140625, "global_step": 254180, "epoch": 3062} {"train_loss": -25.10622215270996, "global_step": 254181, "epoch": 3062} {"train_loss": -24.930908203125, "global_step": 254182, "epoch": 3062} {"train_loss": -25.02674674987793, "global_step": 254183, "epoch": 3062} {"train_loss": -25.307342529296875, "global_step": 254184, "epoch": 3062} {"train_loss": -24.967885971069336, "global_step": 254185, "epoch": 3062} {"train_loss": -24.937883377075195, "global_step": 254186, "epoch": 3062} {"train_loss": -25.084020614624023, "global_step": 254187, "epoch": 3062} {"train_loss": -25.090707778930664, "global_step": 254188, "epoch": 3062} {"train_loss": -24.913665771484375, "global_step": 254189, "epoch": 3062} {"train_loss": -25.042390823364258, "global_step": 254190, "epoch": 3062} {"train_loss": -25.070653915405273, "global_step": 254191, "epoch": 3062} {"train_loss": -25.375898361206055, "global_step": 254192, "epoch": 3062} {"train_loss": -24.755966186523438, "global_step": 254193, "epoch": 3062} {"train_loss": -25.084020614624023, "global_step": 254194, "epoch": 3062} {"train_loss": -25.11762046813965, "global_step": 254195, "epoch": 3062} {"train_loss": -25.020978927612305, "global_step": 254196, "epoch": 3062} {"train_loss": -24.386579513549805, "global_step": 254197, "epoch": 3062} {"train_loss": -25.283781051635742, "global_step": 254198, "epoch": 3062} {"train_loss": -25.376371383666992, "global_step": 254199, "epoch": 3062} {"train_loss": -24.855833053588867, "global_step": 254200, "epoch": 3062} {"train_loss": -25.18623924255371, "global_step": 254201, "epoch": 3062} {"train_loss": -24.890907287597656, "global_step": 254202, "epoch": 3062} {"train_loss": -24.812360763549805, "global_step": 254203, "epoch": 3062} {"train_loss": -25.090682983398438, "global_step": 254204, "epoch": 3062} {"train_loss": -25.176353454589844, "global_step": 254205, "epoch": 3062} {"train_loss": -24.910951614379883, "global_step": 254206, "epoch": 3062} {"train_loss": -25.189661026000977, "global_step": 254207, "epoch": 3062} {"train_loss": -25.19544792175293, "global_step": 254208, "epoch": 3062} {"train_loss": -25.032917022705078, "global_step": 254209, "epoch": 3062} {"train_loss": -25.343997955322266, "global_step": 254210, "epoch": 3062} {"train_loss": -25.43592071533203, "global_step": 254211, "epoch": 3062} {"train_loss": -25.218399047851562, "global_step": 254212, "epoch": 3062} {"train_loss": -25.320783615112305, "global_step": 254213, "epoch": 3062} {"train_loss": -25.380067825317383, "global_step": 254214, "epoch": 3062} {"train_loss": -25.28696632385254, "global_step": 254215, "epoch": 3062} {"train_loss": -24.964038848876953, "global_step": 254216, "epoch": 3062} {"train_loss": -25.14177703857422, "global_step": 254217, "epoch": 3062} {"train_loss": -24.909912109375, "global_step": 254218, "epoch": 3062} {"train_loss": -24.956754684448242, "global_step": 254219, "epoch": 3062} {"train_loss": -25.011442184448242, "global_step": 254220, "epoch": 3062} {"train_loss": -24.942548751831055, "global_step": 254221, "epoch": 3062} {"train_loss": -25.3481502532959, "global_step": 254222, "epoch": 3062} {"train_loss": -25.218353271484375, "global_step": 254223, "epoch": 3062} {"train_loss": -24.971359252929688, "global_step": 254224, "epoch": 3062} {"train_loss": -25.218530654907227, "global_step": 254225, "epoch": 3062} {"train_loss": -25.02434730529785, "global_step": 254226, "epoch": 3062} {"train_loss": -24.802448272705078, "global_step": 254227, "epoch": 3062} {"train_loss": -25.045939870627528, "global_step": 254228, "epoch": 3062, "val_loss": 6886143.0} {"train_loss": -24.76266860961914, "global_step": 254229, "epoch": 3063} {"train_loss": -24.810108184814453, "global_step": 254230, "epoch": 3063} {"train_loss": -25.435636520385742, "global_step": 254231, "epoch": 3063} {"train_loss": -24.499588012695312, "global_step": 254232, "epoch": 3063} {"train_loss": -24.498088836669922, "global_step": 254233, "epoch": 3063} {"train_loss": -24.401180267333984, "global_step": 254234, "epoch": 3063} {"train_loss": -24.903057098388672, "global_step": 254235, "epoch": 3063} {"train_loss": -24.485015869140625, "global_step": 254236, "epoch": 3063} {"train_loss": -24.78585433959961, "global_step": 254237, "epoch": 3063} {"train_loss": -24.369842529296875, "global_step": 254238, "epoch": 3063} {"train_loss": -24.597925186157227, "global_step": 254239, "epoch": 3063} {"train_loss": -24.79446792602539, "global_step": 254240, "epoch": 3063} {"train_loss": -24.259334564208984, "global_step": 254241, "epoch": 3063} {"train_loss": -24.560285568237305, "global_step": 254242, "epoch": 3063} {"train_loss": -25.011011123657227, "global_step": 254243, "epoch": 3063} {"train_loss": -24.97153091430664, "global_step": 254244, "epoch": 3063} {"train_loss": -25.034751892089844, "global_step": 254245, "epoch": 3063} {"train_loss": -24.33817481994629, "global_step": 254246, "epoch": 3063} {"train_loss": -24.951223373413086, "global_step": 254247, "epoch": 3063} {"train_loss": -24.982032775878906, "global_step": 254248, "epoch": 3063} {"train_loss": -24.52225112915039, "global_step": 254249, "epoch": 3063} {"train_loss": -24.770326614379883, "global_step": 254250, "epoch": 3063} {"train_loss": -24.87092399597168, "global_step": 254251, "epoch": 3063} {"train_loss": -25.123014450073242, "global_step": 254252, "epoch": 3063} {"train_loss": -24.87379264831543, "global_step": 254253, "epoch": 3063} {"train_loss": -24.92722511291504, "global_step": 254254, "epoch": 3063} {"train_loss": -25.334190368652344, "global_step": 254255, "epoch": 3063} {"train_loss": -24.570756912231445, "global_step": 254256, "epoch": 3063} {"train_loss": -25.020740509033203, "global_step": 254257, "epoch": 3063} {"train_loss": -24.864221572875977, "global_step": 254258, "epoch": 3063} {"train_loss": -24.806604385375977, "global_step": 254259, "epoch": 3063} {"train_loss": -25.00833511352539, "global_step": 254260, "epoch": 3063} {"train_loss": -25.21607780456543, "global_step": 254261, "epoch": 3063} {"train_loss": -24.957260131835938, "global_step": 254262, "epoch": 3063} {"train_loss": -25.252315521240234, "global_step": 254263, "epoch": 3063} {"train_loss": -24.948410034179688, "global_step": 254264, "epoch": 3063} {"train_loss": -24.848148345947266, "global_step": 254265, "epoch": 3063} {"train_loss": -24.83975601196289, "global_step": 254266, "epoch": 3063} {"train_loss": -25.15549087524414, "global_step": 254267, "epoch": 3063} {"train_loss": -25.087722778320312, "global_step": 254268, "epoch": 3063} {"train_loss": -25.363805770874023, "global_step": 254269, "epoch": 3063} {"train_loss": -25.42413902282715, "global_step": 254270, "epoch": 3063} {"train_loss": -25.082691192626953, "global_step": 254271, "epoch": 3063} {"train_loss": -24.898786544799805, "global_step": 254272, "epoch": 3063} {"train_loss": -24.995372772216797, "global_step": 254273, "epoch": 3063} {"train_loss": -25.46071434020996, "global_step": 254274, "epoch": 3063} {"train_loss": -24.96625328063965, "global_step": 254275, "epoch": 3063} {"train_loss": -25.074575424194336, "global_step": 254276, "epoch": 3063} {"train_loss": -25.122844696044922, "global_step": 254277, "epoch": 3063} {"train_loss": -24.790603637695312, "global_step": 254278, "epoch": 3063} {"train_loss": -25.295984268188477, "global_step": 254279, "epoch": 3063} {"train_loss": -25.50206184387207, "global_step": 254280, "epoch": 3063} {"train_loss": -25.43766212463379, "global_step": 254281, "epoch": 3063} {"train_loss": -25.09261131286621, "global_step": 254282, "epoch": 3063} {"train_loss": -24.983633041381836, "global_step": 254283, "epoch": 3063} {"train_loss": -25.02519989013672, "global_step": 254284, "epoch": 3063} {"train_loss": -25.4935359954834, "global_step": 254285, "epoch": 3063} {"train_loss": -25.043659210205078, "global_step": 254286, "epoch": 3063} {"train_loss": -24.900989532470703, "global_step": 254287, "epoch": 3063} {"train_loss": -25.403547286987305, "global_step": 254288, "epoch": 3063} {"train_loss": -25.197111129760742, "global_step": 254289, "epoch": 3063} {"train_loss": -25.381549835205078, "global_step": 254290, "epoch": 3063} {"train_loss": -24.65879249572754, "global_step": 254291, "epoch": 3063} {"train_loss": -24.948511123657227, "global_step": 254292, "epoch": 3063} {"train_loss": -25.020612716674805, "global_step": 254293, "epoch": 3063} {"train_loss": -25.203947067260742, "global_step": 254294, "epoch": 3063} {"train_loss": -25.325611114501953, "global_step": 254295, "epoch": 3063} {"train_loss": -25.45649528503418, "global_step": 254296, "epoch": 3063} {"train_loss": -25.078445434570312, "global_step": 254297, "epoch": 3063} {"train_loss": -25.11728858947754, "global_step": 254298, "epoch": 3063} {"train_loss": -25.15613555908203, "global_step": 254299, "epoch": 3063} {"train_loss": -25.055150985717773, "global_step": 254300, "epoch": 3063} {"train_loss": -24.811859130859375, "global_step": 254301, "epoch": 3063} {"train_loss": -25.2246150970459, "global_step": 254302, "epoch": 3063} {"train_loss": -24.870271682739258, "global_step": 254303, "epoch": 3063} {"train_loss": -24.956953048706055, "global_step": 254304, "epoch": 3063} {"train_loss": -25.024633407592773, "global_step": 254305, "epoch": 3063} {"train_loss": -24.99066734313965, "global_step": 254306, "epoch": 3063} {"train_loss": -25.15604019165039, "global_step": 254307, "epoch": 3063} {"train_loss": -25.163589477539062, "global_step": 254308, "epoch": 3063} {"train_loss": -24.79383659362793, "global_step": 254309, "epoch": 3063} {"train_loss": -25.247289657592773, "global_step": 254310, "epoch": 3063} {"train_loss": -24.98907447723021, "global_step": 254311, "epoch": 3063, "val_loss": 6934319.0} {"train_loss": -24.52111053466797, "global_step": 254312, "epoch": 3064} {"train_loss": -24.494131088256836, "global_step": 254313, "epoch": 3064} {"train_loss": -24.758474349975586, "global_step": 254314, "epoch": 3064} {"train_loss": -24.277761459350586, "global_step": 254315, "epoch": 3064} {"train_loss": -24.4638671875, "global_step": 254316, "epoch": 3064} {"train_loss": -24.445064544677734, "global_step": 254317, "epoch": 3064} {"train_loss": -24.666824340820312, "global_step": 254318, "epoch": 3064} {"train_loss": -24.81153678894043, "global_step": 254319, "epoch": 3064} {"train_loss": -24.894412994384766, "global_step": 254320, "epoch": 3064} {"train_loss": -24.65781021118164, "global_step": 254321, "epoch": 3064} {"train_loss": -25.115503311157227, "global_step": 254322, "epoch": 3064} {"train_loss": -24.6262149810791, "global_step": 254323, "epoch": 3064} {"train_loss": -24.90166664123535, "global_step": 254324, "epoch": 3064} {"train_loss": -25.03072166442871, "global_step": 254325, "epoch": 3064} {"train_loss": -25.132997512817383, "global_step": 254326, "epoch": 3064} {"train_loss": -25.099140167236328, "global_step": 254327, "epoch": 3064} {"train_loss": -24.94683837890625, "global_step": 254328, "epoch": 3064} {"train_loss": -24.808502197265625, "global_step": 254329, "epoch": 3064} {"train_loss": -25.051572799682617, "global_step": 254330, "epoch": 3064} {"train_loss": -25.5023250579834, "global_step": 254331, "epoch": 3064} {"train_loss": -25.000476837158203, "global_step": 254332, "epoch": 3064} {"train_loss": -25.193361282348633, "global_step": 254333, "epoch": 3064} {"train_loss": -24.892892837524414, "global_step": 254334, "epoch": 3064} {"train_loss": -24.904754638671875, "global_step": 254335, "epoch": 3064} {"train_loss": -25.298320770263672, "global_step": 254336, "epoch": 3064} {"train_loss": -25.3746395111084, "global_step": 254337, "epoch": 3064} {"train_loss": -24.950977325439453, "global_step": 254338, "epoch": 3064} {"train_loss": -24.991697311401367, "global_step": 254339, "epoch": 3064} {"train_loss": -25.06049156188965, "global_step": 254340, "epoch": 3064} {"train_loss": -25.022611618041992, "global_step": 254341, "epoch": 3064} {"train_loss": -25.06764030456543, "global_step": 254342, "epoch": 3064} {"train_loss": -25.254304885864258, "global_step": 254343, "epoch": 3064} {"train_loss": -25.0089168548584, "global_step": 254344, "epoch": 3064} {"train_loss": -25.25294303894043, "global_step": 254345, "epoch": 3064} {"train_loss": -25.26165199279785, "global_step": 254346, "epoch": 3064} {"train_loss": -25.411426544189453, "global_step": 254347, "epoch": 3064} {"train_loss": -25.143129348754883, "global_step": 254348, "epoch": 3064} {"train_loss": -25.251407623291016, "global_step": 254349, "epoch": 3064} {"train_loss": -24.939218521118164, "global_step": 254350, "epoch": 3064} {"train_loss": -25.100324630737305, "global_step": 254351, "epoch": 3064} {"train_loss": -25.404905319213867, "global_step": 254352, "epoch": 3064} {"train_loss": -25.127222061157227, "global_step": 254353, "epoch": 3064} {"train_loss": -25.238805770874023, "global_step": 254354, "epoch": 3064} {"train_loss": -24.76133155822754, "global_step": 254355, "epoch": 3064} {"train_loss": -24.891159057617188, "global_step": 254356, "epoch": 3064} {"train_loss": -24.796579360961914, "global_step": 254357, "epoch": 3064} {"train_loss": -24.775121688842773, "global_step": 254358, "epoch": 3064} {"train_loss": -24.887319564819336, "global_step": 254359, "epoch": 3064} {"train_loss": -25.179487228393555, "global_step": 254360, "epoch": 3064} {"train_loss": -25.295047760009766, "global_step": 254361, "epoch": 3064} {"train_loss": -25.186437606811523, "global_step": 254362, "epoch": 3064} {"train_loss": -24.74432945251465, "global_step": 254363, "epoch": 3064} {"train_loss": -25.125370025634766, "global_step": 254364, "epoch": 3064} {"train_loss": -25.068103790283203, "global_step": 254365, "epoch": 3064} {"train_loss": -25.16286277770996, "global_step": 254366, "epoch": 3064} {"train_loss": -25.39011573791504, "global_step": 254367, "epoch": 3064} {"train_loss": -25.481922149658203, "global_step": 254368, "epoch": 3064} {"train_loss": -25.044330596923828, "global_step": 254369, "epoch": 3064} {"train_loss": -25.19898796081543, "global_step": 254370, "epoch": 3064} {"train_loss": -24.93731689453125, "global_step": 254371, "epoch": 3064} {"train_loss": -24.9945011138916, "global_step": 254372, "epoch": 3064} {"train_loss": -25.080595016479492, "global_step": 254373, "epoch": 3064} {"train_loss": -25.061241149902344, "global_step": 254374, "epoch": 3064} {"train_loss": -24.898916244506836, "global_step": 254375, "epoch": 3064} {"train_loss": -25.057010650634766, "global_step": 254376, "epoch": 3064} {"train_loss": -25.06861686706543, "global_step": 254377, "epoch": 3064} {"train_loss": -25.07021713256836, "global_step": 254378, "epoch": 3064} {"train_loss": -25.16017723083496, "global_step": 254379, "epoch": 3064} {"train_loss": -25.43935775756836, "global_step": 254380, "epoch": 3064} {"train_loss": -25.305038452148438, "global_step": 254381, "epoch": 3064} {"train_loss": -25.151199340820312, "global_step": 254382, "epoch": 3064} {"train_loss": -25.178693771362305, "global_step": 254383, "epoch": 3064} {"train_loss": -25.421537399291992, "global_step": 254384, "epoch": 3064} {"train_loss": -25.017087936401367, "global_step": 254385, "epoch": 3064} {"train_loss": -25.596332550048828, "global_step": 254386, "epoch": 3064} {"train_loss": -25.4500789642334, "global_step": 254387, "epoch": 3064} {"train_loss": -24.767026901245117, "global_step": 254388, "epoch": 3064} {"train_loss": -24.961469650268555, "global_step": 254389, "epoch": 3064} {"train_loss": -24.38002586364746, "global_step": 254390, "epoch": 3064} {"train_loss": -24.15350914001465, "global_step": 254391, "epoch": 3064} {"train_loss": -24.614641189575195, "global_step": 254392, "epoch": 3064} {"train_loss": -25.08941650390625, "global_step": 254393, "epoch": 3064} {"train_loss": -25.008440707103315, "global_step": 254394, "epoch": 3064, "val_loss": 6748661.0} {"train_loss": -24.061307907104492, "global_step": 254395, "epoch": 3065} {"train_loss": -24.180198669433594, "global_step": 254396, "epoch": 3065} {"train_loss": -24.085872650146484, "global_step": 254397, "epoch": 3065} {"train_loss": -24.2424259185791, "global_step": 254398, "epoch": 3065} {"train_loss": -24.641279220581055, "global_step": 254399, "epoch": 3065} {"train_loss": -24.15940284729004, "global_step": 254400, "epoch": 3065} {"train_loss": -24.42970848083496, "global_step": 254401, "epoch": 3065} {"train_loss": -24.435392379760742, "global_step": 254402, "epoch": 3065} {"train_loss": -24.515457153320312, "global_step": 254403, "epoch": 3065} {"train_loss": -24.80787467956543, "global_step": 254404, "epoch": 3065} {"train_loss": -24.428245544433594, "global_step": 254405, "epoch": 3065} {"train_loss": -24.81245994567871, "global_step": 254406, "epoch": 3065} {"train_loss": -24.553503036499023, "global_step": 254407, "epoch": 3065} {"train_loss": -24.642662048339844, "global_step": 254408, "epoch": 3065} {"train_loss": -24.372343063354492, "global_step": 254409, "epoch": 3065} {"train_loss": -24.41417121887207, "global_step": 254410, "epoch": 3065} {"train_loss": -24.59551239013672, "global_step": 254411, "epoch": 3065} {"train_loss": -24.902008056640625, "global_step": 254412, "epoch": 3065} {"train_loss": -24.820363998413086, "global_step": 254413, "epoch": 3065} {"train_loss": -24.58558464050293, "global_step": 254414, "epoch": 3065} {"train_loss": -24.618545532226562, "global_step": 254415, "epoch": 3065} {"train_loss": -25.0328426361084, "global_step": 254416, "epoch": 3065} {"train_loss": -24.7269344329834, "global_step": 254417, "epoch": 3065} {"train_loss": -24.524944305419922, "global_step": 254418, "epoch": 3065} {"train_loss": -24.5767879486084, "global_step": 254419, "epoch": 3065} {"train_loss": -25.37691307067871, "global_step": 254420, "epoch": 3065} {"train_loss": -25.07413101196289, "global_step": 254421, "epoch": 3065} {"train_loss": -25.05545425415039, "global_step": 254422, "epoch": 3065} {"train_loss": -25.2120361328125, "global_step": 254423, "epoch": 3065} {"train_loss": -25.215120315551758, "global_step": 254424, "epoch": 3065} {"train_loss": -24.929807662963867, "global_step": 254425, "epoch": 3065} {"train_loss": -24.954404830932617, "global_step": 254426, "epoch": 3065} {"train_loss": -25.149097442626953, "global_step": 254427, "epoch": 3065} {"train_loss": -25.23349380493164, "global_step": 254428, "epoch": 3065} {"train_loss": -25.321577072143555, "global_step": 254429, "epoch": 3065} {"train_loss": -25.13636016845703, "global_step": 254430, "epoch": 3065} {"train_loss": -25.15357780456543, "global_step": 254431, "epoch": 3065} {"train_loss": -24.757490158081055, "global_step": 254432, "epoch": 3065} {"train_loss": -25.087894439697266, "global_step": 254433, "epoch": 3065} {"train_loss": -25.38498306274414, "global_step": 254434, "epoch": 3065} {"train_loss": -25.343093872070312, "global_step": 254435, "epoch": 3065} {"train_loss": -25.588092803955078, "global_step": 254436, "epoch": 3065} {"train_loss": -25.3377685546875, "global_step": 254437, "epoch": 3065} {"train_loss": -25.19465446472168, "global_step": 254438, "epoch": 3065} {"train_loss": -25.076614379882812, "global_step": 254439, "epoch": 3065} {"train_loss": -25.212650299072266, "global_step": 254440, "epoch": 3065} {"train_loss": -25.037466049194336, "global_step": 254441, "epoch": 3065} {"train_loss": -25.4152774810791, "global_step": 254442, "epoch": 3065} {"train_loss": -25.093076705932617, "global_step": 254443, "epoch": 3065} {"train_loss": -25.56503677368164, "global_step": 254444, "epoch": 3065} {"train_loss": -25.170488357543945, "global_step": 254445, "epoch": 3065} {"train_loss": -25.36919593811035, "global_step": 254446, "epoch": 3065} {"train_loss": -25.252553939819336, "global_step": 254447, "epoch": 3065} {"train_loss": -25.216461181640625, "global_step": 254448, "epoch": 3065} {"train_loss": -24.777982711791992, "global_step": 254449, "epoch": 3065} {"train_loss": -24.645490646362305, "global_step": 254450, "epoch": 3065} {"train_loss": -24.961896896362305, "global_step": 254451, "epoch": 3065} {"train_loss": -24.847843170166016, "global_step": 254452, "epoch": 3065} {"train_loss": -24.827640533447266, "global_step": 254453, "epoch": 3065} {"train_loss": -25.356538772583008, "global_step": 254454, "epoch": 3065} {"train_loss": -25.294782638549805, "global_step": 254455, "epoch": 3065} {"train_loss": -25.184606552124023, "global_step": 254456, "epoch": 3065} {"train_loss": -25.063215255737305, "global_step": 254457, "epoch": 3065} {"train_loss": -25.30939292907715, "global_step": 254458, "epoch": 3065} {"train_loss": -25.288015365600586, "global_step": 254459, "epoch": 3065} {"train_loss": -25.163311004638672, "global_step": 254460, "epoch": 3065} {"train_loss": -25.19292640686035, "global_step": 254461, "epoch": 3065} {"train_loss": -25.076536178588867, "global_step": 254462, "epoch": 3065} {"train_loss": -25.088327407836914, "global_step": 254463, "epoch": 3065} {"train_loss": -25.22532844543457, "global_step": 254464, "epoch": 3065} {"train_loss": -25.09914779663086, "global_step": 254465, "epoch": 3065} {"train_loss": -25.27872085571289, "global_step": 254466, "epoch": 3065} {"train_loss": -24.975709915161133, "global_step": 254467, "epoch": 3065} {"train_loss": -25.015899658203125, "global_step": 254468, "epoch": 3065} {"train_loss": -25.423599243164062, "global_step": 254469, "epoch": 3065} {"train_loss": -25.300395965576172, "global_step": 254470, "epoch": 3065} {"train_loss": -25.226781845092773, "global_step": 254471, "epoch": 3065} {"train_loss": -25.05805778503418, "global_step": 254472, "epoch": 3065} {"train_loss": -25.125337600708008, "global_step": 254473, "epoch": 3065} {"train_loss": -25.095300674438477, "global_step": 254474, "epoch": 3065} {"train_loss": -25.59391975402832, "global_step": 254475, "epoch": 3065} {"train_loss": -25.561614990234375, "global_step": 254476, "epoch": 3065} {"train_loss": -24.99418428719762, "global_step": 254477, "epoch": 3065, "val_loss": 6929385.5} {"train_loss": -24.807987213134766, "global_step": 254478, "epoch": 3066} {"train_loss": -24.84033203125, "global_step": 254479, "epoch": 3066} {"train_loss": -24.71283721923828, "global_step": 254480, "epoch": 3066} {"train_loss": -24.982280731201172, "global_step": 254481, "epoch": 3066} {"train_loss": -24.799346923828125, "global_step": 254482, "epoch": 3066} {"train_loss": -24.868606567382812, "global_step": 254483, "epoch": 3066} {"train_loss": -25.167430877685547, "global_step": 254484, "epoch": 3066} {"train_loss": -24.875926971435547, "global_step": 254485, "epoch": 3066} {"train_loss": -25.09156608581543, "global_step": 254486, "epoch": 3066} {"train_loss": -25.003082275390625, "global_step": 254487, "epoch": 3066} {"train_loss": -24.962186813354492, "global_step": 254488, "epoch": 3066} {"train_loss": -25.12006950378418, "global_step": 254489, "epoch": 3066} {"train_loss": -25.06580924987793, "global_step": 254490, "epoch": 3066} {"train_loss": -24.911212921142578, "global_step": 254491, "epoch": 3066} {"train_loss": -25.00613784790039, "global_step": 254492, "epoch": 3066} {"train_loss": -25.358728408813477, "global_step": 254493, "epoch": 3066} {"train_loss": -25.1441707611084, "global_step": 254494, "epoch": 3066} {"train_loss": -25.230138778686523, "global_step": 254495, "epoch": 3066} {"train_loss": -25.375669479370117, "global_step": 254496, "epoch": 3066} {"train_loss": -25.250198364257812, "global_step": 254497, "epoch": 3066} {"train_loss": -24.995376586914062, "global_step": 254498, "epoch": 3066} {"train_loss": -24.774856567382812, "global_step": 254499, "epoch": 3066} {"train_loss": -25.276809692382812, "global_step": 254500, "epoch": 3066} {"train_loss": -25.307401657104492, "global_step": 254501, "epoch": 3066} {"train_loss": -25.164825439453125, "global_step": 254502, "epoch": 3066} {"train_loss": -25.156574249267578, "global_step": 254503, "epoch": 3066} {"train_loss": -25.049541473388672, "global_step": 254504, "epoch": 3066} {"train_loss": -25.306318283081055, "global_step": 254505, "epoch": 3066} {"train_loss": -25.149383544921875, "global_step": 254506, "epoch": 3066} {"train_loss": -25.305431365966797, "global_step": 254507, "epoch": 3066} {"train_loss": -25.162490844726562, "global_step": 254508, "epoch": 3066} {"train_loss": -25.320941925048828, "global_step": 254509, "epoch": 3066} {"train_loss": -25.02254295349121, "global_step": 254510, "epoch": 3066} {"train_loss": -24.840246200561523, "global_step": 254511, "epoch": 3066} {"train_loss": -25.376834869384766, "global_step": 254512, "epoch": 3066} {"train_loss": -24.861835479736328, "global_step": 254513, "epoch": 3066} {"train_loss": -25.387723922729492, "global_step": 254514, "epoch": 3066} {"train_loss": -25.290271759033203, "global_step": 254515, "epoch": 3066} {"train_loss": -25.077743530273438, "global_step": 254516, "epoch": 3066} {"train_loss": -25.099607467651367, "global_step": 254517, "epoch": 3066} {"train_loss": -25.31726837158203, "global_step": 254518, "epoch": 3066} {"train_loss": -25.080650329589844, "global_step": 254519, "epoch": 3066} {"train_loss": -25.085378646850586, "global_step": 254520, "epoch": 3066} {"train_loss": -24.74184226989746, "global_step": 254521, "epoch": 3066} {"train_loss": -25.277868270874023, "global_step": 254522, "epoch": 3066} {"train_loss": -24.991413116455078, "global_step": 254523, "epoch": 3066} {"train_loss": -25.437658309936523, "global_step": 254524, "epoch": 3066} {"train_loss": -25.120960235595703, "global_step": 254525, "epoch": 3066} {"train_loss": -25.24852752685547, "global_step": 254526, "epoch": 3066} {"train_loss": -25.17108154296875, "global_step": 254527, "epoch": 3066} {"train_loss": -24.924711227416992, "global_step": 254528, "epoch": 3066} {"train_loss": -25.39627456665039, "global_step": 254529, "epoch": 3066} {"train_loss": -24.952373504638672, "global_step": 254530, "epoch": 3066} {"train_loss": -24.9117488861084, "global_step": 254531, "epoch": 3066} {"train_loss": -24.732879638671875, "global_step": 254532, "epoch": 3066} {"train_loss": -24.851104736328125, "global_step": 254533, "epoch": 3066} {"train_loss": -25.435611724853516, "global_step": 254534, "epoch": 3066} {"train_loss": -25.14396095275879, "global_step": 254535, "epoch": 3066} {"train_loss": -24.809101104736328, "global_step": 254536, "epoch": 3066} {"train_loss": -24.827354431152344, "global_step": 254537, "epoch": 3066} {"train_loss": -24.92424774169922, "global_step": 254538, "epoch": 3066} {"train_loss": -24.75141716003418, "global_step": 254539, "epoch": 3066} {"train_loss": -24.975204467773438, "global_step": 254540, "epoch": 3066} {"train_loss": -24.939464569091797, "global_step": 254541, "epoch": 3066} {"train_loss": -25.012052536010742, "global_step": 254542, "epoch": 3066} {"train_loss": -25.080854415893555, "global_step": 254543, "epoch": 3066} {"train_loss": -24.9499454498291, "global_step": 254544, "epoch": 3066} {"train_loss": -24.898351669311523, "global_step": 254545, "epoch": 3066} {"train_loss": -24.871885299682617, "global_step": 254546, "epoch": 3066} {"train_loss": -24.108686447143555, "global_step": 254547, "epoch": 3066} {"train_loss": -24.500505447387695, "global_step": 254548, "epoch": 3066} {"train_loss": -24.677982330322266, "global_step": 254549, "epoch": 3066} {"train_loss": -24.815614700317383, "global_step": 254550, "epoch": 3066} {"train_loss": -25.01873207092285, "global_step": 254551, "epoch": 3066} {"train_loss": -24.982839584350586, "global_step": 254552, "epoch": 3066} {"train_loss": -24.88258171081543, "global_step": 254553, "epoch": 3066} {"train_loss": -24.9493408203125, "global_step": 254554, "epoch": 3066} {"train_loss": -25.036243438720703, "global_step": 254555, "epoch": 3066} {"train_loss": -24.969152450561523, "global_step": 254556, "epoch": 3066} {"train_loss": -24.945674896240234, "global_step": 254557, "epoch": 3066} {"train_loss": -25.02040672302246, "global_step": 254558, "epoch": 3066} {"train_loss": -25.00503158569336, "global_step": 254559, "epoch": 3066} {"train_loss": -25.025482591376246, "global_step": 254560, "epoch": 3066, "val_loss": 6954318.0} {"train_loss": -24.96792984008789, "global_step": 254561, "epoch": 3067} {"train_loss": -24.838598251342773, "global_step": 254562, "epoch": 3067} {"train_loss": -25.086788177490234, "global_step": 254563, "epoch": 3067} {"train_loss": -24.952869415283203, "global_step": 254564, "epoch": 3067} {"train_loss": -24.78227996826172, "global_step": 254565, "epoch": 3067} {"train_loss": -24.861251831054688, "global_step": 254566, "epoch": 3067} {"train_loss": -25.19832420349121, "global_step": 254567, "epoch": 3067} {"train_loss": -24.92975425720215, "global_step": 254568, "epoch": 3067} {"train_loss": -24.977216720581055, "global_step": 254569, "epoch": 3067} {"train_loss": -24.747217178344727, "global_step": 254570, "epoch": 3067} {"train_loss": -25.02760124206543, "global_step": 254571, "epoch": 3067} {"train_loss": -25.12467384338379, "global_step": 254572, "epoch": 3067} {"train_loss": -25.312707901000977, "global_step": 254573, "epoch": 3067} {"train_loss": -24.70242691040039, "global_step": 254574, "epoch": 3067} {"train_loss": -25.1616268157959, "global_step": 254575, "epoch": 3067} {"train_loss": -24.866125106811523, "global_step": 254576, "epoch": 3067} {"train_loss": -24.598854064941406, "global_step": 254577, "epoch": 3067} {"train_loss": -25.269285202026367, "global_step": 254578, "epoch": 3067} {"train_loss": -24.98440933227539, "global_step": 254579, "epoch": 3067} {"train_loss": -25.33562660217285, "global_step": 254580, "epoch": 3067} {"train_loss": -25.30014991760254, "global_step": 254581, "epoch": 3067} {"train_loss": -25.251462936401367, "global_step": 254582, "epoch": 3067} {"train_loss": -25.4913330078125, "global_step": 254583, "epoch": 3067} {"train_loss": -25.425556182861328, "global_step": 254584, "epoch": 3067} {"train_loss": -24.863922119140625, "global_step": 254585, "epoch": 3067} {"train_loss": -24.959068298339844, "global_step": 254586, "epoch": 3067} {"train_loss": -25.24427032470703, "global_step": 254587, "epoch": 3067} {"train_loss": -25.037019729614258, "global_step": 254588, "epoch": 3067} {"train_loss": -24.913724899291992, "global_step": 254589, "epoch": 3067} {"train_loss": -24.843137741088867, "global_step": 254590, "epoch": 3067} {"train_loss": -25.18720245361328, "global_step": 254591, "epoch": 3067} {"train_loss": -24.882041931152344, "global_step": 254592, "epoch": 3067} {"train_loss": -25.103933334350586, "global_step": 254593, "epoch": 3067} {"train_loss": -24.895109176635742, "global_step": 254594, "epoch": 3067} {"train_loss": -25.3275203704834, "global_step": 254595, "epoch": 3067} {"train_loss": -25.169843673706055, "global_step": 254596, "epoch": 3067} {"train_loss": -25.111623764038086, "global_step": 254597, "epoch": 3067} {"train_loss": -24.82672691345215, "global_step": 254598, "epoch": 3067} {"train_loss": -25.023595809936523, "global_step": 254599, "epoch": 3067} {"train_loss": -24.961111068725586, "global_step": 254600, "epoch": 3067} {"train_loss": -24.961400985717773, "global_step": 254601, "epoch": 3067} {"train_loss": -25.458099365234375, "global_step": 254602, "epoch": 3067} {"train_loss": -25.065481185913086, "global_step": 254603, "epoch": 3067} {"train_loss": -24.932222366333008, "global_step": 254604, "epoch": 3067} {"train_loss": -25.226783752441406, "global_step": 254605, "epoch": 3067} {"train_loss": -25.132381439208984, "global_step": 254606, "epoch": 3067} {"train_loss": -24.862716674804688, "global_step": 254607, "epoch": 3067} {"train_loss": -25.293516159057617, "global_step": 254608, "epoch": 3067} {"train_loss": -25.2091007232666, "global_step": 254609, "epoch": 3067} {"train_loss": -25.22307014465332, "global_step": 254610, "epoch": 3067} {"train_loss": -25.012210845947266, "global_step": 254611, "epoch": 3067} {"train_loss": -24.995624542236328, "global_step": 254612, "epoch": 3067} {"train_loss": -25.20998191833496, "global_step": 254613, "epoch": 3067} {"train_loss": -25.082660675048828, "global_step": 254614, "epoch": 3067} {"train_loss": -24.992725372314453, "global_step": 254615, "epoch": 3067} {"train_loss": -24.9404239654541, "global_step": 254616, "epoch": 3067} {"train_loss": -25.051986694335938, "global_step": 254617, "epoch": 3067} {"train_loss": -25.222009658813477, "global_step": 254618, "epoch": 3067} {"train_loss": -24.698810577392578, "global_step": 254619, "epoch": 3067} {"train_loss": -25.127490997314453, "global_step": 254620, "epoch": 3067} {"train_loss": -25.215608596801758, "global_step": 254621, "epoch": 3067} {"train_loss": -25.447134017944336, "global_step": 254622, "epoch": 3067} {"train_loss": -25.186351776123047, "global_step": 254623, "epoch": 3067} {"train_loss": -24.874937057495117, "global_step": 254624, "epoch": 3067} {"train_loss": -25.242033004760742, "global_step": 254625, "epoch": 3067} {"train_loss": -25.27223777770996, "global_step": 254626, "epoch": 3067} {"train_loss": -24.804433822631836, "global_step": 254627, "epoch": 3067} {"train_loss": -25.19913101196289, "global_step": 254628, "epoch": 3067} {"train_loss": -25.016088485717773, "global_step": 254629, "epoch": 3067} {"train_loss": -24.565166473388672, "global_step": 254630, "epoch": 3067} {"train_loss": -25.319690704345703, "global_step": 254631, "epoch": 3067} {"train_loss": -24.74505043029785, "global_step": 254632, "epoch": 3067} {"train_loss": -24.6844482421875, "global_step": 254633, "epoch": 3067} {"train_loss": -24.857158660888672, "global_step": 254634, "epoch": 3067} {"train_loss": -24.762296676635742, "global_step": 254635, "epoch": 3067} {"train_loss": -24.666263580322266, "global_step": 254636, "epoch": 3067} {"train_loss": -25.02552032470703, "global_step": 254637, "epoch": 3067} {"train_loss": -24.484102249145508, "global_step": 254638, "epoch": 3067} {"train_loss": -24.53537368774414, "global_step": 254639, "epoch": 3067} {"train_loss": -24.53434181213379, "global_step": 254640, "epoch": 3067} {"train_loss": -25.53402328491211, "global_step": 254641, "epoch": 3067} {"train_loss": -24.64278221130371, "global_step": 254642, "epoch": 3067} {"train_loss": -25.02584216106369, "global_step": 254643, "epoch": 3067, "val_loss": 6831450.0} {"train_loss": -24.198354721069336, "global_step": 254644, "epoch": 3068} {"train_loss": -24.75309181213379, "global_step": 254645, "epoch": 3068} {"train_loss": -24.548063278198242, "global_step": 254646, "epoch": 3068} {"train_loss": -24.653120040893555, "global_step": 254647, "epoch": 3068} {"train_loss": -24.975910186767578, "global_step": 254648, "epoch": 3068} {"train_loss": -24.24576187133789, "global_step": 254649, "epoch": 3068} {"train_loss": -24.455718994140625, "global_step": 254650, "epoch": 3068} {"train_loss": -25.08294677734375, "global_step": 254651, "epoch": 3068} {"train_loss": -24.582584381103516, "global_step": 254652, "epoch": 3068} {"train_loss": -25.036331176757812, "global_step": 254653, "epoch": 3068} {"train_loss": -25.02792739868164, "global_step": 254654, "epoch": 3068} {"train_loss": -24.746097564697266, "global_step": 254655, "epoch": 3068} {"train_loss": -24.576955795288086, "global_step": 254656, "epoch": 3068} {"train_loss": -25.008766174316406, "global_step": 254657, "epoch": 3068} {"train_loss": -24.7237606048584, "global_step": 254658, "epoch": 3068} {"train_loss": -24.946949005126953, "global_step": 254659, "epoch": 3068} {"train_loss": -24.98805809020996, "global_step": 254660, "epoch": 3068} {"train_loss": -24.942951202392578, "global_step": 254661, "epoch": 3068} {"train_loss": -25.03391456604004, "global_step": 254662, "epoch": 3068} {"train_loss": -24.971267700195312, "global_step": 254663, "epoch": 3068} {"train_loss": -24.999608993530273, "global_step": 254664, "epoch": 3068} {"train_loss": -25.11344337463379, "global_step": 254665, "epoch": 3068} {"train_loss": -24.915462493896484, "global_step": 254666, "epoch": 3068} {"train_loss": -24.89869499206543, "global_step": 254667, "epoch": 3068} {"train_loss": -24.8106746673584, "global_step": 254668, "epoch": 3068} {"train_loss": -25.042232513427734, "global_step": 254669, "epoch": 3068} {"train_loss": -24.974451065063477, "global_step": 254670, "epoch": 3068} {"train_loss": -25.179990768432617, "global_step": 254671, "epoch": 3068} {"train_loss": -25.55138397216797, "global_step": 254672, "epoch": 3068} {"train_loss": -24.84833335876465, "global_step": 254673, "epoch": 3068} {"train_loss": -25.269763946533203, "global_step": 254674, "epoch": 3068} {"train_loss": -25.07045555114746, "global_step": 254675, "epoch": 3068} {"train_loss": -25.52435302734375, "global_step": 254676, "epoch": 3068} {"train_loss": -25.03301429748535, "global_step": 254677, "epoch": 3068} {"train_loss": -25.488380432128906, "global_step": 254678, "epoch": 3068} {"train_loss": -25.096651077270508, "global_step": 254679, "epoch": 3068} {"train_loss": -25.211524963378906, "global_step": 254680, "epoch": 3068} {"train_loss": -25.042776107788086, "global_step": 254681, "epoch": 3068} {"train_loss": -25.4832706451416, "global_step": 254682, "epoch": 3068} {"train_loss": -24.835386276245117, "global_step": 254683, "epoch": 3068} {"train_loss": -24.93316078186035, "global_step": 254684, "epoch": 3068} {"train_loss": -25.0762996673584, "global_step": 254685, "epoch": 3068} {"train_loss": -25.005184173583984, "global_step": 254686, "epoch": 3068} {"train_loss": -25.135637283325195, "global_step": 254687, "epoch": 3068} {"train_loss": -25.240007400512695, "global_step": 254688, "epoch": 3068} {"train_loss": -25.25776481628418, "global_step": 254689, "epoch": 3068} {"train_loss": -24.993404388427734, "global_step": 254690, "epoch": 3068} {"train_loss": -25.176048278808594, "global_step": 254691, "epoch": 3068} {"train_loss": -25.289785385131836, "global_step": 254692, "epoch": 3068} {"train_loss": -25.144853591918945, "global_step": 254693, "epoch": 3068} {"train_loss": -25.35833168029785, "global_step": 254694, "epoch": 3068} {"train_loss": -25.34586524963379, "global_step": 254695, "epoch": 3068} {"train_loss": -25.3794002532959, "global_step": 254696, "epoch": 3068} {"train_loss": -24.83570671081543, "global_step": 254697, "epoch": 3068} {"train_loss": -25.077274322509766, "global_step": 254698, "epoch": 3068} {"train_loss": -25.18214225769043, "global_step": 254699, "epoch": 3068} {"train_loss": -24.995969772338867, "global_step": 254700, "epoch": 3068} {"train_loss": -24.930749893188477, "global_step": 254701, "epoch": 3068} {"train_loss": -25.3067569732666, "global_step": 254702, "epoch": 3068} {"train_loss": -25.207990646362305, "global_step": 254703, "epoch": 3068} {"train_loss": -25.3287410736084, "global_step": 254704, "epoch": 3068} {"train_loss": -25.047666549682617, "global_step": 254705, "epoch": 3068} {"train_loss": -25.01639747619629, "global_step": 254706, "epoch": 3068} {"train_loss": -24.876920700073242, "global_step": 254707, "epoch": 3068} {"train_loss": -25.09181022644043, "global_step": 254708, "epoch": 3068} {"train_loss": -25.097410202026367, "global_step": 254709, "epoch": 3068} {"train_loss": -25.26725196838379, "global_step": 254710, "epoch": 3068} {"train_loss": -24.94904136657715, "global_step": 254711, "epoch": 3068} {"train_loss": -24.561185836791992, "global_step": 254712, "epoch": 3068} {"train_loss": -24.37980842590332, "global_step": 254713, "epoch": 3068} {"train_loss": -24.907590866088867, "global_step": 254714, "epoch": 3068} {"train_loss": -24.8964786529541, "global_step": 254715, "epoch": 3068} {"train_loss": -25.14769172668457, "global_step": 254716, "epoch": 3068} {"train_loss": -25.202733993530273, "global_step": 254717, "epoch": 3068} {"train_loss": -24.860572814941406, "global_step": 254718, "epoch": 3068} {"train_loss": -24.947908401489258, "global_step": 254719, "epoch": 3068} {"train_loss": -25.05067253112793, "global_step": 254720, "epoch": 3068} {"train_loss": -25.03511619567871, "global_step": 254721, "epoch": 3068} {"train_loss": -25.267908096313477, "global_step": 254722, "epoch": 3068} {"train_loss": -24.910785675048828, "global_step": 254723, "epoch": 3068} {"train_loss": -24.504047393798828, "global_step": 254724, "epoch": 3068} {"train_loss": -24.742080688476562, "global_step": 254725, "epoch": 3068} {"train_loss": -25.013862334102033, "global_step": 254726, "epoch": 3068, "val_loss": 6744110.0} {"train_loss": -24.47772789001465, "global_step": 254727, "epoch": 3069} {"train_loss": -23.93820571899414, "global_step": 254728, "epoch": 3069} {"train_loss": -24.399057388305664, "global_step": 254729, "epoch": 3069} {"train_loss": -24.782079696655273, "global_step": 254730, "epoch": 3069} {"train_loss": -24.59393310546875, "global_step": 254731, "epoch": 3069} {"train_loss": -24.64089012145996, "global_step": 254732, "epoch": 3069} {"train_loss": -24.492923736572266, "global_step": 254733, "epoch": 3069} {"train_loss": -24.341787338256836, "global_step": 254734, "epoch": 3069} {"train_loss": -24.4559268951416, "global_step": 254735, "epoch": 3069} {"train_loss": -24.985151290893555, "global_step": 254736, "epoch": 3069} {"train_loss": -24.557294845581055, "global_step": 254737, "epoch": 3069} {"train_loss": -25.0360107421875, "global_step": 254738, "epoch": 3069} {"train_loss": -24.6825008392334, "global_step": 254739, "epoch": 3069} {"train_loss": -24.84904670715332, "global_step": 254740, "epoch": 3069} {"train_loss": -24.78643226623535, "global_step": 254741, "epoch": 3069} {"train_loss": -25.012939453125, "global_step": 254742, "epoch": 3069} {"train_loss": -24.9283390045166, "global_step": 254743, "epoch": 3069} {"train_loss": -24.89825439453125, "global_step": 254744, "epoch": 3069} {"train_loss": -25.056488037109375, "global_step": 254745, "epoch": 3069} {"train_loss": -24.944686889648438, "global_step": 254746, "epoch": 3069} {"train_loss": -25.05113983154297, "global_step": 254747, "epoch": 3069} {"train_loss": -25.161222457885742, "global_step": 254748, "epoch": 3069} {"train_loss": -25.22603988647461, "global_step": 254749, "epoch": 3069} {"train_loss": -25.21772003173828, "global_step": 254750, "epoch": 3069} {"train_loss": -24.98651123046875, "global_step": 254751, "epoch": 3069} {"train_loss": -25.497812271118164, "global_step": 254752, "epoch": 3069} {"train_loss": -24.821182250976562, "global_step": 254753, "epoch": 3069} {"train_loss": -25.42218589782715, "global_step": 254754, "epoch": 3069} {"train_loss": -25.062528610229492, "global_step": 254755, "epoch": 3069} {"train_loss": -25.231754302978516, "global_step": 254756, "epoch": 3069} {"train_loss": -25.211589813232422, "global_step": 254757, "epoch": 3069} {"train_loss": -25.112043380737305, "global_step": 254758, "epoch": 3069} {"train_loss": -25.150320053100586, "global_step": 254759, "epoch": 3069} {"train_loss": -25.03314971923828, "global_step": 254760, "epoch": 3069} {"train_loss": -24.773298263549805, "global_step": 254761, "epoch": 3069} {"train_loss": -24.977149963378906, "global_step": 254762, "epoch": 3069} {"train_loss": -25.1209659576416, "global_step": 254763, "epoch": 3069} {"train_loss": -25.3099365234375, "global_step": 254764, "epoch": 3069} {"train_loss": -25.243017196655273, "global_step": 254765, "epoch": 3069} {"train_loss": -25.41286849975586, "global_step": 254766, "epoch": 3069} {"train_loss": -25.38126564025879, "global_step": 254767, "epoch": 3069} {"train_loss": -25.52484130859375, "global_step": 254768, "epoch": 3069} {"train_loss": -25.225229263305664, "global_step": 254769, "epoch": 3069} {"train_loss": -25.22953224182129, "global_step": 254770, "epoch": 3069} {"train_loss": -25.405170440673828, "global_step": 254771, "epoch": 3069} {"train_loss": -25.367948532104492, "global_step": 254772, "epoch": 3069} {"train_loss": -25.04158592224121, "global_step": 254773, "epoch": 3069} {"train_loss": -24.564929962158203, "global_step": 254774, "epoch": 3069} {"train_loss": -24.020578384399414, "global_step": 254775, "epoch": 3069} {"train_loss": -23.826547622680664, "global_step": 254776, "epoch": 3069} {"train_loss": -24.34515380859375, "global_step": 254777, "epoch": 3069} {"train_loss": -24.51817512512207, "global_step": 254778, "epoch": 3069} {"train_loss": -24.45514678955078, "global_step": 254779, "epoch": 3069} {"train_loss": -24.62174415588379, "global_step": 254780, "epoch": 3069} {"train_loss": -24.604084014892578, "global_step": 254781, "epoch": 3069} {"train_loss": -24.6219482421875, "global_step": 254782, "epoch": 3069} {"train_loss": -24.607513427734375, "global_step": 254783, "epoch": 3069} {"train_loss": -24.846637725830078, "global_step": 254784, "epoch": 3069} {"train_loss": -24.79511070251465, "global_step": 254785, "epoch": 3069} {"train_loss": -24.30901336669922, "global_step": 254786, "epoch": 3069} {"train_loss": -24.68344497680664, "global_step": 254787, "epoch": 3069} {"train_loss": -24.870756149291992, "global_step": 254788, "epoch": 3069} {"train_loss": -24.83710289001465, "global_step": 254789, "epoch": 3069} {"train_loss": -25.089664459228516, "global_step": 254790, "epoch": 3069} {"train_loss": -24.870134353637695, "global_step": 254791, "epoch": 3069} {"train_loss": -25.071256637573242, "global_step": 254792, "epoch": 3069} {"train_loss": -25.005970001220703, "global_step": 254793, "epoch": 3069} {"train_loss": -24.734477996826172, "global_step": 254794, "epoch": 3069} {"train_loss": -24.956262588500977, "global_step": 254795, "epoch": 3069} {"train_loss": -25.179929733276367, "global_step": 254796, "epoch": 3069} {"train_loss": -25.028913497924805, "global_step": 254797, "epoch": 3069} {"train_loss": -25.06513023376465, "global_step": 254798, "epoch": 3069} {"train_loss": -24.893980026245117, "global_step": 254799, "epoch": 3069} {"train_loss": -25.155715942382812, "global_step": 254800, "epoch": 3069} {"train_loss": -25.047452926635742, "global_step": 254801, "epoch": 3069} {"train_loss": -25.285236358642578, "global_step": 254802, "epoch": 3069} {"train_loss": -25.53779411315918, "global_step": 254803, "epoch": 3069} {"train_loss": -24.808853149414062, "global_step": 254804, "epoch": 3069} {"train_loss": -24.9211483001709, "global_step": 254805, "epoch": 3069} {"train_loss": -25.059133529663086, "global_step": 254806, "epoch": 3069} {"train_loss": -24.8028621673584, "global_step": 254807, "epoch": 3069} {"train_loss": -24.95087242126465, "global_step": 254808, "epoch": 3069} {"train_loss": -24.91753518437765, "global_step": 254809, "epoch": 3069, "val_loss": 7013276.0} {"train_loss": -24.196866989135742, "global_step": 254810, "epoch": 3070} {"train_loss": -25.028287887573242, "global_step": 254811, "epoch": 3070} {"train_loss": -24.761962890625, "global_step": 254812, "epoch": 3070} {"train_loss": -24.53139305114746, "global_step": 254813, "epoch": 3070} {"train_loss": -24.604969024658203, "global_step": 254814, "epoch": 3070} {"train_loss": -24.971853256225586, "global_step": 254815, "epoch": 3070} {"train_loss": -24.79292106628418, "global_step": 254816, "epoch": 3070} {"train_loss": -24.50310707092285, "global_step": 254817, "epoch": 3070} {"train_loss": -25.246217727661133, "global_step": 254818, "epoch": 3070} {"train_loss": -24.423192977905273, "global_step": 254819, "epoch": 3070} {"train_loss": -24.71523094177246, "global_step": 254820, "epoch": 3070} {"train_loss": -24.618961334228516, "global_step": 254821, "epoch": 3070} {"train_loss": -24.271780014038086, "global_step": 254822, "epoch": 3070} {"train_loss": -24.827186584472656, "global_step": 254823, "epoch": 3070} {"train_loss": -25.07368278503418, "global_step": 254824, "epoch": 3070} {"train_loss": -24.85739517211914, "global_step": 254825, "epoch": 3070} {"train_loss": -24.896100997924805, "global_step": 254826, "epoch": 3070} {"train_loss": -24.709747314453125, "global_step": 254827, "epoch": 3070} {"train_loss": -24.790929794311523, "global_step": 254828, "epoch": 3070} {"train_loss": -24.781932830810547, "global_step": 254829, "epoch": 3070} {"train_loss": -24.58085060119629, "global_step": 254830, "epoch": 3070} {"train_loss": -24.696054458618164, "global_step": 254831, "epoch": 3070} {"train_loss": -25.06634521484375, "global_step": 254832, "epoch": 3070} {"train_loss": -24.955434799194336, "global_step": 254833, "epoch": 3070} {"train_loss": -24.895719528198242, "global_step": 254834, "epoch": 3070} {"train_loss": -25.147972106933594, "global_step": 254835, "epoch": 3070} {"train_loss": -24.854814529418945, "global_step": 254836, "epoch": 3070} {"train_loss": -24.965829849243164, "global_step": 254837, "epoch": 3070} {"train_loss": -24.955259323120117, "global_step": 254838, "epoch": 3070} {"train_loss": -24.816547393798828, "global_step": 254839, "epoch": 3070} {"train_loss": -25.575592041015625, "global_step": 254840, "epoch": 3070} {"train_loss": -24.78226661682129, "global_step": 254841, "epoch": 3070} {"train_loss": -25.236976623535156, "global_step": 254842, "epoch": 3070} {"train_loss": -25.42629051208496, "global_step": 254843, "epoch": 3070} {"train_loss": -25.137744903564453, "global_step": 254844, "epoch": 3070} {"train_loss": -25.233713150024414, "global_step": 254845, "epoch": 3070} {"train_loss": -25.313108444213867, "global_step": 254846, "epoch": 3070} {"train_loss": -24.895227432250977, "global_step": 254847, "epoch": 3070} {"train_loss": -25.137168884277344, "global_step": 254848, "epoch": 3070} {"train_loss": -25.23560333251953, "global_step": 254849, "epoch": 3070} {"train_loss": -25.5167293548584, "global_step": 254850, "epoch": 3070} {"train_loss": -25.388647079467773, "global_step": 254851, "epoch": 3070} {"train_loss": -24.994800567626953, "global_step": 254852, "epoch": 3070} {"train_loss": -25.11724090576172, "global_step": 254853, "epoch": 3070} {"train_loss": -24.939849853515625, "global_step": 254854, "epoch": 3070} {"train_loss": -25.60089683532715, "global_step": 254855, "epoch": 3070} {"train_loss": -25.010292053222656, "global_step": 254856, "epoch": 3070} {"train_loss": -24.966493606567383, "global_step": 254857, "epoch": 3070} {"train_loss": -25.150178909301758, "global_step": 254858, "epoch": 3070} {"train_loss": -25.45192527770996, "global_step": 254859, "epoch": 3070} {"train_loss": -25.053897857666016, "global_step": 254860, "epoch": 3070} {"train_loss": -25.46541976928711, "global_step": 254861, "epoch": 3070} {"train_loss": -25.292572021484375, "global_step": 254862, "epoch": 3070} {"train_loss": -25.202909469604492, "global_step": 254863, "epoch": 3070} {"train_loss": -25.233304977416992, "global_step": 254864, "epoch": 3070} {"train_loss": -25.061391830444336, "global_step": 254865, "epoch": 3070} {"train_loss": -25.182146072387695, "global_step": 254866, "epoch": 3070} {"train_loss": -24.707088470458984, "global_step": 254867, "epoch": 3070} {"train_loss": -25.040124893188477, "global_step": 254868, "epoch": 3070} {"train_loss": -24.80690574645996, "global_step": 254869, "epoch": 3070} {"train_loss": -24.520797729492188, "global_step": 254870, "epoch": 3070} {"train_loss": -24.938474655151367, "global_step": 254871, "epoch": 3070} {"train_loss": -24.549331665039062, "global_step": 254872, "epoch": 3070} {"train_loss": -24.62415885925293, "global_step": 254873, "epoch": 3070} {"train_loss": -24.562625885009766, "global_step": 254874, "epoch": 3070} {"train_loss": -24.750444412231445, "global_step": 254875, "epoch": 3070} {"train_loss": -25.17234992980957, "global_step": 254876, "epoch": 3070} {"train_loss": -25.103534698486328, "global_step": 254877, "epoch": 3070} {"train_loss": -25.181737899780273, "global_step": 254878, "epoch": 3070} {"train_loss": -24.942060470581055, "global_step": 254879, "epoch": 3070} {"train_loss": -24.907602310180664, "global_step": 254880, "epoch": 3070} {"train_loss": -24.95278549194336, "global_step": 254881, "epoch": 3070} {"train_loss": -25.133106231689453, "global_step": 254882, "epoch": 3070} {"train_loss": -24.984088897705078, "global_step": 254883, "epoch": 3070} {"train_loss": -25.237163543701172, "global_step": 254884, "epoch": 3070} {"train_loss": -25.48026466369629, "global_step": 254885, "epoch": 3070} {"train_loss": -24.960607528686523, "global_step": 254886, "epoch": 3070} {"train_loss": -25.087594985961914, "global_step": 254887, "epoch": 3070} {"train_loss": -25.070446014404297, "global_step": 254888, "epoch": 3070} {"train_loss": -24.981008529663086, "global_step": 254889, "epoch": 3070} {"train_loss": -24.886417388916016, "global_step": 254890, "epoch": 3070} {"train_loss": -24.890361785888672, "global_step": 254891, "epoch": 3070} {"train_loss": -24.95554128899632, "global_step": 254892, "epoch": 3070, "val_loss": 6972234.5} {"train_loss": -23.806285858154297, "global_step": 254893, "epoch": 3071} {"train_loss": -24.14841079711914, "global_step": 254894, "epoch": 3071} {"train_loss": -24.160049438476562, "global_step": 254895, "epoch": 3071} {"train_loss": -24.608373641967773, "global_step": 254896, "epoch": 3071} {"train_loss": -24.492992401123047, "global_step": 254897, "epoch": 3071} {"train_loss": -24.62017822265625, "global_step": 254898, "epoch": 3071} {"train_loss": -24.511274337768555, "global_step": 254899, "epoch": 3071} {"train_loss": -24.465742111206055, "global_step": 254900, "epoch": 3071} {"train_loss": -24.65182876586914, "global_step": 254901, "epoch": 3071} {"train_loss": -24.409988403320312, "global_step": 254902, "epoch": 3071} {"train_loss": -24.801382064819336, "global_step": 254903, "epoch": 3071} {"train_loss": -24.606433868408203, "global_step": 254904, "epoch": 3071} {"train_loss": -24.81422233581543, "global_step": 254905, "epoch": 3071} {"train_loss": -24.772014617919922, "global_step": 254906, "epoch": 3071} {"train_loss": -24.775053024291992, "global_step": 254907, "epoch": 3071} {"train_loss": -24.978551864624023, "global_step": 254908, "epoch": 3071} {"train_loss": -24.78074836730957, "global_step": 254909, "epoch": 3071} {"train_loss": -24.784421920776367, "global_step": 254910, "epoch": 3071} {"train_loss": -24.90850830078125, "global_step": 254911, "epoch": 3071} {"train_loss": -24.669677734375, "global_step": 254912, "epoch": 3071} {"train_loss": -24.641202926635742, "global_step": 254913, "epoch": 3071} {"train_loss": -25.100818634033203, "global_step": 254914, "epoch": 3071} {"train_loss": -25.13413429260254, "global_step": 254915, "epoch": 3071} {"train_loss": -25.145666122436523, "global_step": 254916, "epoch": 3071} {"train_loss": -25.09089469909668, "global_step": 254917, "epoch": 3071} {"train_loss": -25.37457847595215, "global_step": 254918, "epoch": 3071} {"train_loss": -25.26282501220703, "global_step": 254919, "epoch": 3071} {"train_loss": -25.052915573120117, "global_step": 254920, "epoch": 3071} {"train_loss": -24.82248306274414, "global_step": 254921, "epoch": 3071} {"train_loss": -24.663349151611328, "global_step": 254922, "epoch": 3071} {"train_loss": -24.74969482421875, "global_step": 254923, "epoch": 3071} {"train_loss": -25.147140502929688, "global_step": 254924, "epoch": 3071} {"train_loss": -25.136924743652344, "global_step": 254925, "epoch": 3071} {"train_loss": -25.081796646118164, "global_step": 254926, "epoch": 3071} {"train_loss": -24.731428146362305, "global_step": 254927, "epoch": 3071} {"train_loss": -25.06439208984375, "global_step": 254928, "epoch": 3071} {"train_loss": -25.109161376953125, "global_step": 254929, "epoch": 3071} {"train_loss": -25.390851974487305, "global_step": 254930, "epoch": 3071} {"train_loss": -25.372243881225586, "global_step": 254931, "epoch": 3071} {"train_loss": -24.949560165405273, "global_step": 254932, "epoch": 3071} {"train_loss": -24.977691650390625, "global_step": 254933, "epoch": 3071} {"train_loss": -25.339954376220703, "global_step": 254934, "epoch": 3071} {"train_loss": -25.071063995361328, "global_step": 254935, "epoch": 3071} {"train_loss": -25.100645065307617, "global_step": 254936, "epoch": 3071} {"train_loss": -25.35007095336914, "global_step": 254937, "epoch": 3071} {"train_loss": -24.94573211669922, "global_step": 254938, "epoch": 3071} {"train_loss": -25.3891544342041, "global_step": 254939, "epoch": 3071} {"train_loss": -25.013092041015625, "global_step": 254940, "epoch": 3071} {"train_loss": -25.276660919189453, "global_step": 254941, "epoch": 3071} {"train_loss": -25.10834312438965, "global_step": 254942, "epoch": 3071} {"train_loss": -25.22780418395996, "global_step": 254943, "epoch": 3071} {"train_loss": -25.21401023864746, "global_step": 254944, "epoch": 3071} {"train_loss": -25.553850173950195, "global_step": 254945, "epoch": 3071} {"train_loss": -25.39813232421875, "global_step": 254946, "epoch": 3071} {"train_loss": -24.72275733947754, "global_step": 254947, "epoch": 3071} {"train_loss": -24.777088165283203, "global_step": 254948, "epoch": 3071} {"train_loss": -25.1019229888916, "global_step": 254949, "epoch": 3071} {"train_loss": -25.573694229125977, "global_step": 254950, "epoch": 3071} {"train_loss": -25.08985137939453, "global_step": 254951, "epoch": 3071} {"train_loss": -25.159921646118164, "global_step": 254952, "epoch": 3071} {"train_loss": -25.068470001220703, "global_step": 254953, "epoch": 3071} {"train_loss": -25.062421798706055, "global_step": 254954, "epoch": 3071} {"train_loss": -25.05939292907715, "global_step": 254955, "epoch": 3071} {"train_loss": -24.93174171447754, "global_step": 254956, "epoch": 3071} {"train_loss": -24.90907859802246, "global_step": 254957, "epoch": 3071} {"train_loss": -25.166236877441406, "global_step": 254958, "epoch": 3071} {"train_loss": -25.010700225830078, "global_step": 254959, "epoch": 3071} {"train_loss": -24.756772994995117, "global_step": 254960, "epoch": 3071} {"train_loss": -25.0716495513916, "global_step": 254961, "epoch": 3071} {"train_loss": -25.32557487487793, "global_step": 254962, "epoch": 3071} {"train_loss": -25.1097412109375, "global_step": 254963, "epoch": 3071} {"train_loss": -25.15482521057129, "global_step": 254964, "epoch": 3071} {"train_loss": -25.228927612304688, "global_step": 254965, "epoch": 3071} {"train_loss": -25.462690353393555, "global_step": 254966, "epoch": 3071} {"train_loss": -25.168365478515625, "global_step": 254967, "epoch": 3071} {"train_loss": -25.29178237915039, "global_step": 254968, "epoch": 3071} {"train_loss": -25.22989273071289, "global_step": 254969, "epoch": 3071} {"train_loss": -24.996747970581055, "global_step": 254970, "epoch": 3071} {"train_loss": -25.00798797607422, "global_step": 254971, "epoch": 3071} {"train_loss": -25.356931686401367, "global_step": 254972, "epoch": 3071} {"train_loss": -25.36446189880371, "global_step": 254973, "epoch": 3071} {"train_loss": -25.2664794921875, "global_step": 254974, "epoch": 3071} {"train_loss": -24.982284706759167, "global_step": 254975, "epoch": 3071, "val_loss": 6869119.0} {"train_loss": -23.148344039916992, "global_step": 254976, "epoch": 3072} {"train_loss": -22.640066146850586, "global_step": 254977, "epoch": 3072} {"train_loss": -24.050222396850586, "global_step": 254978, "epoch": 3072} {"train_loss": -24.554685592651367, "global_step": 254979, "epoch": 3072} {"train_loss": -24.200414657592773, "global_step": 254980, "epoch": 3072} {"train_loss": -24.350305557250977, "global_step": 254981, "epoch": 3072} {"train_loss": -23.86231803894043, "global_step": 254982, "epoch": 3072} {"train_loss": -24.23215675354004, "global_step": 254983, "epoch": 3072} {"train_loss": -24.57132911682129, "global_step": 254984, "epoch": 3072} {"train_loss": -24.160537719726562, "global_step": 254985, "epoch": 3072} {"train_loss": -24.560287475585938, "global_step": 254986, "epoch": 3072} {"train_loss": -24.297653198242188, "global_step": 254987, "epoch": 3072} {"train_loss": -24.342321395874023, "global_step": 254988, "epoch": 3072} {"train_loss": -24.303516387939453, "global_step": 254989, "epoch": 3072} {"train_loss": -24.7562313079834, "global_step": 254990, "epoch": 3072} {"train_loss": -24.66084861755371, "global_step": 254991, "epoch": 3072} {"train_loss": -24.850549697875977, "global_step": 254992, "epoch": 3072} {"train_loss": -25.070585250854492, "global_step": 254993, "epoch": 3072} {"train_loss": -25.026586532592773, "global_step": 254994, "epoch": 3072} {"train_loss": -24.22530174255371, "global_step": 254995, "epoch": 3072} {"train_loss": -24.71689796447754, "global_step": 254996, "epoch": 3072} {"train_loss": -24.316267013549805, "global_step": 254997, "epoch": 3072} {"train_loss": -25.17510414123535, "global_step": 254998, "epoch": 3072} {"train_loss": -24.602680206298828, "global_step": 254999, "epoch": 3072} {"train_loss": -24.715322494506836, "global_step": 255000, "epoch": 3072} {"train_loss": -24.9000244140625, "global_step": 255001, "epoch": 3072} {"train_loss": -25.022754669189453, "global_step": 255002, "epoch": 3072} {"train_loss": -24.8049259185791, "global_step": 255003, "epoch": 3072} {"train_loss": -24.819486618041992, "global_step": 255004, "epoch": 3072} {"train_loss": -24.979454040527344, "global_step": 255005, "epoch": 3072} {"train_loss": -25.26618003845215, "global_step": 255006, "epoch": 3072} {"train_loss": -24.989015579223633, "global_step": 255007, "epoch": 3072} {"train_loss": -24.567882537841797, "global_step": 255008, "epoch": 3072} {"train_loss": -24.74119758605957, "global_step": 255009, "epoch": 3072} {"train_loss": -24.942062377929688, "global_step": 255010, "epoch": 3072} {"train_loss": -24.84324073791504, "global_step": 255011, "epoch": 3072} {"train_loss": -25.10909080505371, "global_step": 255012, "epoch": 3072} {"train_loss": -24.827146530151367, "global_step": 255013, "epoch": 3072} {"train_loss": -25.44276237487793, "global_step": 255014, "epoch": 3072} {"train_loss": -25.19339942932129, "global_step": 255015, "epoch": 3072} {"train_loss": -25.188852310180664, "global_step": 255016, "epoch": 3072} {"train_loss": -24.900711059570312, "global_step": 255017, "epoch": 3072} {"train_loss": -25.19797134399414, "global_step": 255018, "epoch": 3072} {"train_loss": -25.168508529663086, "global_step": 255019, "epoch": 3072} {"train_loss": -25.300769805908203, "global_step": 255020, "epoch": 3072} {"train_loss": -25.199556350708008, "global_step": 255021, "epoch": 3072} {"train_loss": -25.130041122436523, "global_step": 255022, "epoch": 3072} {"train_loss": -25.219070434570312, "global_step": 255023, "epoch": 3072} {"train_loss": -25.149465560913086, "global_step": 255024, "epoch": 3072} {"train_loss": -25.19419288635254, "global_step": 255025, "epoch": 3072} {"train_loss": -25.252716064453125, "global_step": 255026, "epoch": 3072} {"train_loss": -25.09266471862793, "global_step": 255027, "epoch": 3072} {"train_loss": -25.276350021362305, "global_step": 255028, "epoch": 3072} {"train_loss": -25.247526168823242, "global_step": 255029, "epoch": 3072} {"train_loss": -25.40166473388672, "global_step": 255030, "epoch": 3072} {"train_loss": -25.205047607421875, "global_step": 255031, "epoch": 3072} {"train_loss": -24.95364761352539, "global_step": 255032, "epoch": 3072} {"train_loss": -25.192703247070312, "global_step": 255033, "epoch": 3072} {"train_loss": -25.365751266479492, "global_step": 255034, "epoch": 3072} {"train_loss": -25.195608139038086, "global_step": 255035, "epoch": 3072} {"train_loss": -25.262195587158203, "global_step": 255036, "epoch": 3072} {"train_loss": -25.160415649414062, "global_step": 255037, "epoch": 3072} {"train_loss": -25.112274169921875, "global_step": 255038, "epoch": 3072} {"train_loss": -25.04286766052246, "global_step": 255039, "epoch": 3072} {"train_loss": -24.941797256469727, "global_step": 255040, "epoch": 3072} {"train_loss": -25.055891036987305, "global_step": 255041, "epoch": 3072} {"train_loss": -24.97054100036621, "global_step": 255042, "epoch": 3072} {"train_loss": -25.5231990814209, "global_step": 255043, "epoch": 3072} {"train_loss": -25.203474044799805, "global_step": 255044, "epoch": 3072} {"train_loss": -24.972030639648438, "global_step": 255045, "epoch": 3072} {"train_loss": -24.98224449157715, "global_step": 255046, "epoch": 3072} {"train_loss": -25.383543014526367, "global_step": 255047, "epoch": 3072} {"train_loss": -25.159265518188477, "global_step": 255048, "epoch": 3072} {"train_loss": -24.949871063232422, "global_step": 255049, "epoch": 3072} {"train_loss": -25.32740592956543, "global_step": 255050, "epoch": 3072} {"train_loss": -25.325971603393555, "global_step": 255051, "epoch": 3072} {"train_loss": -25.227991104125977, "global_step": 255052, "epoch": 3072} {"train_loss": -25.026824951171875, "global_step": 255053, "epoch": 3072} {"train_loss": -25.13002586364746, "global_step": 255054, "epoch": 3072} {"train_loss": -24.984268188476562, "global_step": 255055, "epoch": 3072} {"train_loss": -25.144075393676758, "global_step": 255056, "epoch": 3072} {"train_loss": -24.68208885192871, "global_step": 255057, "epoch": 3072} {"train_loss": -24.891708029321876, "global_step": 255058, "epoch": 3072, "val_loss": 6937710.0} {"train_loss": -24.166175842285156, "global_step": 255059, "epoch": 3073} {"train_loss": -23.96528434753418, "global_step": 255060, "epoch": 3073} {"train_loss": -24.365219116210938, "global_step": 255061, "epoch": 3073} {"train_loss": -25.093280792236328, "global_step": 255062, "epoch": 3073} {"train_loss": -24.571603775024414, "global_step": 255063, "epoch": 3073} {"train_loss": -24.705921173095703, "global_step": 255064, "epoch": 3073} {"train_loss": -24.702768325805664, "global_step": 255065, "epoch": 3073} {"train_loss": -25.03607749938965, "global_step": 255066, "epoch": 3073} {"train_loss": -24.71765899658203, "global_step": 255067, "epoch": 3073} {"train_loss": -24.746389389038086, "global_step": 255068, "epoch": 3073} {"train_loss": -25.03296661376953, "global_step": 255069, "epoch": 3073} {"train_loss": -24.785070419311523, "global_step": 255070, "epoch": 3073} {"train_loss": -25.025259017944336, "global_step": 255071, "epoch": 3073} {"train_loss": -25.014423370361328, "global_step": 255072, "epoch": 3073} {"train_loss": -25.07019805908203, "global_step": 255073, "epoch": 3073} {"train_loss": -25.301895141601562, "global_step": 255074, "epoch": 3073} {"train_loss": -24.987831115722656, "global_step": 255075, "epoch": 3073} {"train_loss": -25.051807403564453, "global_step": 255076, "epoch": 3073} {"train_loss": -25.046283721923828, "global_step": 255077, "epoch": 3073} {"train_loss": -24.991418838500977, "global_step": 255078, "epoch": 3073} {"train_loss": -25.034400939941406, "global_step": 255079, "epoch": 3073} {"train_loss": -25.19286346435547, "global_step": 255080, "epoch": 3073} {"train_loss": -24.994810104370117, "global_step": 255081, "epoch": 3073} {"train_loss": -25.18365478515625, "global_step": 255082, "epoch": 3073} {"train_loss": -25.030820846557617, "global_step": 255083, "epoch": 3073} {"train_loss": -25.39737319946289, "global_step": 255084, "epoch": 3073} {"train_loss": -25.43557357788086, "global_step": 255085, "epoch": 3073} {"train_loss": -25.190595626831055, "global_step": 255086, "epoch": 3073} {"train_loss": -25.18743896484375, "global_step": 255087, "epoch": 3073} {"train_loss": -25.328781127929688, "global_step": 255088, "epoch": 3073} {"train_loss": -25.435958862304688, "global_step": 255089, "epoch": 3073} {"train_loss": -25.299930572509766, "global_step": 255090, "epoch": 3073} {"train_loss": -24.93782615661621, "global_step": 255091, "epoch": 3073} {"train_loss": -25.277433395385742, "global_step": 255092, "epoch": 3073} {"train_loss": -24.976354598999023, "global_step": 255093, "epoch": 3073} {"train_loss": -25.04517936706543, "global_step": 255094, "epoch": 3073} {"train_loss": -25.104476928710938, "global_step": 255095, "epoch": 3073} {"train_loss": -25.42193031311035, "global_step": 255096, "epoch": 3073} {"train_loss": -25.34822654724121, "global_step": 255097, "epoch": 3073} {"train_loss": -25.282644271850586, "global_step": 255098, "epoch": 3073} {"train_loss": -24.65981101989746, "global_step": 255099, "epoch": 3073} {"train_loss": -24.805631637573242, "global_step": 255100, "epoch": 3073} {"train_loss": -24.835651397705078, "global_step": 255101, "epoch": 3073} {"train_loss": -25.150070190429688, "global_step": 255102, "epoch": 3073} {"train_loss": -25.350038528442383, "global_step": 255103, "epoch": 3073} {"train_loss": -24.627012252807617, "global_step": 255104, "epoch": 3073} {"train_loss": -24.917694091796875, "global_step": 255105, "epoch": 3073} {"train_loss": -25.055377960205078, "global_step": 255106, "epoch": 3073} {"train_loss": -25.14606285095215, "global_step": 255107, "epoch": 3073} {"train_loss": -24.683502197265625, "global_step": 255108, "epoch": 3073} {"train_loss": -24.5866641998291, "global_step": 255109, "epoch": 3073} {"train_loss": -24.867996215820312, "global_step": 255110, "epoch": 3073} {"train_loss": -24.95224380493164, "global_step": 255111, "epoch": 3073} {"train_loss": -25.065034866333008, "global_step": 255112, "epoch": 3073} {"train_loss": -24.792142868041992, "global_step": 255113, "epoch": 3073} {"train_loss": -24.914867401123047, "global_step": 255114, "epoch": 3073} {"train_loss": -25.27301025390625, "global_step": 255115, "epoch": 3073} {"train_loss": -24.684507369995117, "global_step": 255116, "epoch": 3073} {"train_loss": -25.274133682250977, "global_step": 255117, "epoch": 3073} {"train_loss": -25.0433349609375, "global_step": 255118, "epoch": 3073} {"train_loss": -25.170907974243164, "global_step": 255119, "epoch": 3073} {"train_loss": -25.180368423461914, "global_step": 255120, "epoch": 3073} {"train_loss": -25.21296501159668, "global_step": 255121, "epoch": 3073} {"train_loss": -25.0527400970459, "global_step": 255122, "epoch": 3073} {"train_loss": -25.0192813873291, "global_step": 255123, "epoch": 3073} {"train_loss": -25.483612060546875, "global_step": 255124, "epoch": 3073} {"train_loss": -25.157590866088867, "global_step": 255125, "epoch": 3073} {"train_loss": -24.935216903686523, "global_step": 255126, "epoch": 3073} {"train_loss": -25.11092185974121, "global_step": 255127, "epoch": 3073} {"train_loss": -25.540298461914062, "global_step": 255128, "epoch": 3073} {"train_loss": -25.275615692138672, "global_step": 255129, "epoch": 3073} {"train_loss": -24.68145751953125, "global_step": 255130, "epoch": 3073} {"train_loss": -25.283674240112305, "global_step": 255131, "epoch": 3073} {"train_loss": -25.152067184448242, "global_step": 255132, "epoch": 3073} {"train_loss": -24.60988426208496, "global_step": 255133, "epoch": 3073} {"train_loss": -24.615245819091797, "global_step": 255134, "epoch": 3073} {"train_loss": -25.05568504333496, "global_step": 255135, "epoch": 3073} {"train_loss": -24.82389259338379, "global_step": 255136, "epoch": 3073} {"train_loss": -25.066213607788086, "global_step": 255137, "epoch": 3073} {"train_loss": -25.017911911010742, "global_step": 255138, "epoch": 3073} {"train_loss": -25.22743034362793, "global_step": 255139, "epoch": 3073} {"train_loss": -25.087949752807617, "global_step": 255140, "epoch": 3073} {"train_loss": -25.022388412291747, "global_step": 255141, "epoch": 3073, "val_loss": 6895724.0} {"train_loss": -24.604711532592773, "global_step": 255142, "epoch": 3074} {"train_loss": -24.395475387573242, "global_step": 255143, "epoch": 3074} {"train_loss": -24.67009735107422, "global_step": 255144, "epoch": 3074} {"train_loss": -24.89533042907715, "global_step": 255145, "epoch": 3074} {"train_loss": -24.216089248657227, "global_step": 255146, "epoch": 3074} {"train_loss": -23.807111740112305, "global_step": 255147, "epoch": 3074} {"train_loss": -24.134855270385742, "global_step": 255148, "epoch": 3074} {"train_loss": -24.38191032409668, "global_step": 255149, "epoch": 3074} {"train_loss": -24.419998168945312, "global_step": 255150, "epoch": 3074} {"train_loss": -24.75054359436035, "global_step": 255151, "epoch": 3074} {"train_loss": -24.239458084106445, "global_step": 255152, "epoch": 3074} {"train_loss": -24.543319702148438, "global_step": 255153, "epoch": 3074} {"train_loss": -24.625598907470703, "global_step": 255154, "epoch": 3074} {"train_loss": -24.78558349609375, "global_step": 255155, "epoch": 3074} {"train_loss": -24.3399600982666, "global_step": 255156, "epoch": 3074} {"train_loss": -24.487995147705078, "global_step": 255157, "epoch": 3074} {"train_loss": -25.01032066345215, "global_step": 255158, "epoch": 3074} {"train_loss": -24.58588981628418, "global_step": 255159, "epoch": 3074} {"train_loss": -24.858800888061523, "global_step": 255160, "epoch": 3074} {"train_loss": -24.5407772064209, "global_step": 255161, "epoch": 3074} {"train_loss": -24.552845001220703, "global_step": 255162, "epoch": 3074} {"train_loss": -25.13633155822754, "global_step": 255163, "epoch": 3074} {"train_loss": -25.0650577545166, "global_step": 255164, "epoch": 3074} {"train_loss": -24.5957088470459, "global_step": 255165, "epoch": 3074} {"train_loss": -24.70047950744629, "global_step": 255166, "epoch": 3074} {"train_loss": -25.17793083190918, "global_step": 255167, "epoch": 3074} {"train_loss": -24.98612403869629, "global_step": 255168, "epoch": 3074} {"train_loss": -24.8931941986084, "global_step": 255169, "epoch": 3074} {"train_loss": -25.268774032592773, "global_step": 255170, "epoch": 3074} {"train_loss": -24.993494033813477, "global_step": 255171, "epoch": 3074} {"train_loss": -24.823232650756836, "global_step": 255172, "epoch": 3074} {"train_loss": -25.289703369140625, "global_step": 255173, "epoch": 3074} {"train_loss": -24.840866088867188, "global_step": 255174, "epoch": 3074} {"train_loss": -24.996906280517578, "global_step": 255175, "epoch": 3074} {"train_loss": -24.660367965698242, "global_step": 255176, "epoch": 3074} {"train_loss": -24.5882625579834, "global_step": 255177, "epoch": 3074} {"train_loss": -25.32450294494629, "global_step": 255178, "epoch": 3074} {"train_loss": -24.944629669189453, "global_step": 255179, "epoch": 3074} {"train_loss": -24.9744873046875, "global_step": 255180, "epoch": 3074} {"train_loss": -25.266616821289062, "global_step": 255181, "epoch": 3074} {"train_loss": -25.1870059967041, "global_step": 255182, "epoch": 3074} {"train_loss": -25.0745849609375, "global_step": 255183, "epoch": 3074} {"train_loss": -25.157119750976562, "global_step": 255184, "epoch": 3074} {"train_loss": -24.977323532104492, "global_step": 255185, "epoch": 3074} {"train_loss": -25.54010009765625, "global_step": 255186, "epoch": 3074} {"train_loss": -25.222890853881836, "global_step": 255187, "epoch": 3074} {"train_loss": -25.112340927124023, "global_step": 255188, "epoch": 3074} {"train_loss": -25.02530288696289, "global_step": 255189, "epoch": 3074} {"train_loss": -25.380151748657227, "global_step": 255190, "epoch": 3074} {"train_loss": -25.038869857788086, "global_step": 255191, "epoch": 3074} {"train_loss": -25.51143455505371, "global_step": 255192, "epoch": 3074} {"train_loss": -25.235675811767578, "global_step": 255193, "epoch": 3074} {"train_loss": -25.138219833374023, "global_step": 255194, "epoch": 3074} {"train_loss": -25.399845123291016, "global_step": 255195, "epoch": 3074} {"train_loss": -25.185598373413086, "global_step": 255196, "epoch": 3074} {"train_loss": -25.266576766967773, "global_step": 255197, "epoch": 3074} {"train_loss": -25.354633331298828, "global_step": 255198, "epoch": 3074} {"train_loss": -25.0203914642334, "global_step": 255199, "epoch": 3074} {"train_loss": -25.431859970092773, "global_step": 255200, "epoch": 3074} {"train_loss": -25.25111961364746, "global_step": 255201, "epoch": 3074} {"train_loss": -25.1532039642334, "global_step": 255202, "epoch": 3074} {"train_loss": -25.37028694152832, "global_step": 255203, "epoch": 3074} {"train_loss": -24.968671798706055, "global_step": 255204, "epoch": 3074} {"train_loss": -25.002914428710938, "global_step": 255205, "epoch": 3074} {"train_loss": -24.474834442138672, "global_step": 255206, "epoch": 3074} {"train_loss": -25.130678176879883, "global_step": 255207, "epoch": 3074} {"train_loss": -25.50556755065918, "global_step": 255208, "epoch": 3074} {"train_loss": -25.318801879882812, "global_step": 255209, "epoch": 3074} {"train_loss": -24.6133975982666, "global_step": 255210, "epoch": 3074} {"train_loss": -24.91582679748535, "global_step": 255211, "epoch": 3074} {"train_loss": -24.997344970703125, "global_step": 255212, "epoch": 3074} {"train_loss": -25.280675888061523, "global_step": 255213, "epoch": 3074} {"train_loss": -24.910764694213867, "global_step": 255214, "epoch": 3074} {"train_loss": -25.18800926208496, "global_step": 255215, "epoch": 3074} {"train_loss": -25.092702865600586, "global_step": 255216, "epoch": 3074} {"train_loss": -25.29463005065918, "global_step": 255217, "epoch": 3074} {"train_loss": -25.221084594726562, "global_step": 255218, "epoch": 3074} {"train_loss": -25.373716354370117, "global_step": 255219, "epoch": 3074} {"train_loss": -24.997390747070312, "global_step": 255220, "epoch": 3074} {"train_loss": -25.164030075073242, "global_step": 255221, "epoch": 3074} {"train_loss": -25.169408798217773, "global_step": 255222, "epoch": 3074} {"train_loss": -25.182178497314453, "global_step": 255223, "epoch": 3074} {"train_loss": -24.94250414744917, "global_step": 255224, "epoch": 3074, "val_loss": 6936246.0} {"train_loss": -25.325937271118164, "global_step": 255225, "epoch": 3075} {"train_loss": -24.856016159057617, "global_step": 255226, "epoch": 3075} {"train_loss": -25.3962345123291, "global_step": 255227, "epoch": 3075} {"train_loss": -25.513933181762695, "global_step": 255228, "epoch": 3075} {"train_loss": -25.044771194458008, "global_step": 255229, "epoch": 3075} {"train_loss": -25.189849853515625, "global_step": 255230, "epoch": 3075} {"train_loss": -25.109907150268555, "global_step": 255231, "epoch": 3075} {"train_loss": -24.764001846313477, "global_step": 255232, "epoch": 3075} {"train_loss": -25.28481101989746, "global_step": 255233, "epoch": 3075} {"train_loss": -25.008106231689453, "global_step": 255234, "epoch": 3075} {"train_loss": -25.015125274658203, "global_step": 255235, "epoch": 3075} {"train_loss": -24.837631225585938, "global_step": 255236, "epoch": 3075} {"train_loss": -24.70055389404297, "global_step": 255237, "epoch": 3075} {"train_loss": -25.258283615112305, "global_step": 255238, "epoch": 3075} {"train_loss": -24.972688674926758, "global_step": 255239, "epoch": 3075} {"train_loss": -25.131500244140625, "global_step": 255240, "epoch": 3075} {"train_loss": -24.93942642211914, "global_step": 255241, "epoch": 3075} {"train_loss": -24.795143127441406, "global_step": 255242, "epoch": 3075} {"train_loss": -25.261737823486328, "global_step": 255243, "epoch": 3075} {"train_loss": -25.385700225830078, "global_step": 255244, "epoch": 3075} {"train_loss": -25.494272232055664, "global_step": 255245, "epoch": 3075} {"train_loss": -25.214818954467773, "global_step": 255246, "epoch": 3075} {"train_loss": -25.28481674194336, "global_step": 255247, "epoch": 3075} {"train_loss": -24.880752563476562, "global_step": 255248, "epoch": 3075} {"train_loss": -24.702795028686523, "global_step": 255249, "epoch": 3075} {"train_loss": -24.932401657104492, "global_step": 255250, "epoch": 3075} {"train_loss": -25.250225067138672, "global_step": 255251, "epoch": 3075} {"train_loss": -25.202800750732422, "global_step": 255252, "epoch": 3075} {"train_loss": -25.314504623413086, "global_step": 255253, "epoch": 3075} {"train_loss": -25.284887313842773, "global_step": 255254, "epoch": 3075} {"train_loss": -25.400678634643555, "global_step": 255255, "epoch": 3075} {"train_loss": -25.246707916259766, "global_step": 255256, "epoch": 3075} {"train_loss": -25.085403442382812, "global_step": 255257, "epoch": 3075} {"train_loss": -25.29144859313965, "global_step": 255258, "epoch": 3075} {"train_loss": -25.152132034301758, "global_step": 255259, "epoch": 3075} {"train_loss": -25.000537872314453, "global_step": 255260, "epoch": 3075} {"train_loss": -25.21009635925293, "global_step": 255261, "epoch": 3075} {"train_loss": -25.642377853393555, "global_step": 255262, "epoch": 3075} {"train_loss": -25.27311134338379, "global_step": 255263, "epoch": 3075} {"train_loss": -24.768186569213867, "global_step": 255264, "epoch": 3075} {"train_loss": -24.766965866088867, "global_step": 255265, "epoch": 3075} {"train_loss": -25.034299850463867, "global_step": 255266, "epoch": 3075} {"train_loss": -25.271642684936523, "global_step": 255267, "epoch": 3075} {"train_loss": -25.182018280029297, "global_step": 255268, "epoch": 3075} {"train_loss": -25.14560317993164, "global_step": 255269, "epoch": 3075} {"train_loss": -24.772415161132812, "global_step": 255270, "epoch": 3075} {"train_loss": -25.098798751831055, "global_step": 255271, "epoch": 3075} {"train_loss": -25.113187789916992, "global_step": 255272, "epoch": 3075} {"train_loss": -25.089874267578125, "global_step": 255273, "epoch": 3075} {"train_loss": -25.12958526611328, "global_step": 255274, "epoch": 3075} {"train_loss": -24.85121726989746, "global_step": 255275, "epoch": 3075} {"train_loss": -24.562307357788086, "global_step": 255276, "epoch": 3075} {"train_loss": -24.965482711791992, "global_step": 255277, "epoch": 3075} {"train_loss": -25.286413192749023, "global_step": 255278, "epoch": 3075} {"train_loss": -25.12136459350586, "global_step": 255279, "epoch": 3075} {"train_loss": -24.818252563476562, "global_step": 255280, "epoch": 3075} {"train_loss": -25.08892250061035, "global_step": 255281, "epoch": 3075} {"train_loss": -25.122562408447266, "global_step": 255282, "epoch": 3075} {"train_loss": -25.208251953125, "global_step": 255283, "epoch": 3075} {"train_loss": -25.16199493408203, "global_step": 255284, "epoch": 3075} {"train_loss": -25.23365020751953, "global_step": 255285, "epoch": 3075} {"train_loss": -25.345937728881836, "global_step": 255286, "epoch": 3075} {"train_loss": -25.071630477905273, "global_step": 255287, "epoch": 3075} {"train_loss": -25.194250106811523, "global_step": 255288, "epoch": 3075} {"train_loss": -25.198911666870117, "global_step": 255289, "epoch": 3075} {"train_loss": -25.02714729309082, "global_step": 255290, "epoch": 3075} {"train_loss": -25.072622299194336, "global_step": 255291, "epoch": 3075} {"train_loss": -25.012636184692383, "global_step": 255292, "epoch": 3075} {"train_loss": -24.856403350830078, "global_step": 255293, "epoch": 3075} {"train_loss": -25.03095054626465, "global_step": 255294, "epoch": 3075} {"train_loss": -25.2008113861084, "global_step": 255295, "epoch": 3075} {"train_loss": -24.85296058654785, "global_step": 255296, "epoch": 3075} {"train_loss": -25.207916259765625, "global_step": 255297, "epoch": 3075} {"train_loss": -24.831281661987305, "global_step": 255298, "epoch": 3075} {"train_loss": -24.912704467773438, "global_step": 255299, "epoch": 3075} {"train_loss": -25.32636070251465, "global_step": 255300, "epoch": 3075} {"train_loss": -25.137161254882812, "global_step": 255301, "epoch": 3075} {"train_loss": -25.317670822143555, "global_step": 255302, "epoch": 3075} {"train_loss": -25.34507179260254, "global_step": 255303, "epoch": 3075} {"train_loss": -24.901966094970703, "global_step": 255304, "epoch": 3075} {"train_loss": -25.209308624267578, "global_step": 255305, "epoch": 3075} {"train_loss": -24.982074737548828, "global_step": 255306, "epoch": 3075} {"train_loss": -25.108011889170452, "global_step": 255307, "epoch": 3075, "val_loss": 6908614.0} {"train_loss": -24.310935974121094, "global_step": 255308, "epoch": 3076} {"train_loss": -24.612951278686523, "global_step": 255309, "epoch": 3076} {"train_loss": -24.184850692749023, "global_step": 255310, "epoch": 3076} {"train_loss": -24.521602630615234, "global_step": 255311, "epoch": 3076} {"train_loss": -24.587459564208984, "global_step": 255312, "epoch": 3076} {"train_loss": -24.291263580322266, "global_step": 255313, "epoch": 3076} {"train_loss": -23.922040939331055, "global_step": 255314, "epoch": 3076} {"train_loss": -24.747400283813477, "global_step": 255315, "epoch": 3076} {"train_loss": -24.495344161987305, "global_step": 255316, "epoch": 3076} {"train_loss": -24.135211944580078, "global_step": 255317, "epoch": 3076} {"train_loss": -24.731658935546875, "global_step": 255318, "epoch": 3076} {"train_loss": -24.395593643188477, "global_step": 255319, "epoch": 3076} {"train_loss": -24.592639923095703, "global_step": 255320, "epoch": 3076} {"train_loss": -24.84895896911621, "global_step": 255321, "epoch": 3076} {"train_loss": -24.603857040405273, "global_step": 255322, "epoch": 3076} {"train_loss": -24.380197525024414, "global_step": 255323, "epoch": 3076} {"train_loss": -24.586990356445312, "global_step": 255324, "epoch": 3076} {"train_loss": -24.857486724853516, "global_step": 255325, "epoch": 3076} {"train_loss": -24.72283935546875, "global_step": 255326, "epoch": 3076} {"train_loss": -24.436750411987305, "global_step": 255327, "epoch": 3076} {"train_loss": -25.02736473083496, "global_step": 255328, "epoch": 3076} {"train_loss": -24.985828399658203, "global_step": 255329, "epoch": 3076} {"train_loss": -24.87213706970215, "global_step": 255330, "epoch": 3076} {"train_loss": -25.01533317565918, "global_step": 255331, "epoch": 3076} {"train_loss": -25.066123962402344, "global_step": 255332, "epoch": 3076} {"train_loss": -25.21815299987793, "global_step": 255333, "epoch": 3076} {"train_loss": -24.784391403198242, "global_step": 255334, "epoch": 3076} {"train_loss": -25.092987060546875, "global_step": 255335, "epoch": 3076} {"train_loss": -25.004491806030273, "global_step": 255336, "epoch": 3076} {"train_loss": -24.506250381469727, "global_step": 255337, "epoch": 3076} {"train_loss": -24.776676177978516, "global_step": 255338, "epoch": 3076} {"train_loss": -25.236183166503906, "global_step": 255339, "epoch": 3076} {"train_loss": -25.350221633911133, "global_step": 255340, "epoch": 3076} {"train_loss": -25.092031478881836, "global_step": 255341, "epoch": 3076} {"train_loss": -24.730710983276367, "global_step": 255342, "epoch": 3076} {"train_loss": -25.540246963500977, "global_step": 255343, "epoch": 3076} {"train_loss": -25.001707077026367, "global_step": 255344, "epoch": 3076} {"train_loss": -25.206396102905273, "global_step": 255345, "epoch": 3076} {"train_loss": -25.590566635131836, "global_step": 255346, "epoch": 3076} {"train_loss": -25.245445251464844, "global_step": 255347, "epoch": 3076} {"train_loss": -25.182836532592773, "global_step": 255348, "epoch": 3076} {"train_loss": -24.883838653564453, "global_step": 255349, "epoch": 3076} {"train_loss": -25.322101593017578, "global_step": 255350, "epoch": 3076} {"train_loss": -25.585073471069336, "global_step": 255351, "epoch": 3076} {"train_loss": -25.40253257751465, "global_step": 255352, "epoch": 3076} {"train_loss": -25.11378288269043, "global_step": 255353, "epoch": 3076} {"train_loss": -25.214345932006836, "global_step": 255354, "epoch": 3076} {"train_loss": -25.559030532836914, "global_step": 255355, "epoch": 3076} {"train_loss": -25.408971786499023, "global_step": 255356, "epoch": 3076} {"train_loss": -25.203733444213867, "global_step": 255357, "epoch": 3076} {"train_loss": -25.134267807006836, "global_step": 255358, "epoch": 3076} {"train_loss": -25.626394271850586, "global_step": 255359, "epoch": 3076} {"train_loss": -25.170303344726562, "global_step": 255360, "epoch": 3076} {"train_loss": -24.936548233032227, "global_step": 255361, "epoch": 3076} {"train_loss": -25.45781898498535, "global_step": 255362, "epoch": 3076} {"train_loss": -25.302724838256836, "global_step": 255363, "epoch": 3076} {"train_loss": -25.35988426208496, "global_step": 255364, "epoch": 3076} {"train_loss": -24.849660873413086, "global_step": 255365, "epoch": 3076} {"train_loss": -25.02920913696289, "global_step": 255366, "epoch": 3076} {"train_loss": -25.011272430419922, "global_step": 255367, "epoch": 3076} {"train_loss": -25.164817810058594, "global_step": 255368, "epoch": 3076} {"train_loss": -25.204801559448242, "global_step": 255369, "epoch": 3076} {"train_loss": -25.148115158081055, "global_step": 255370, "epoch": 3076} {"train_loss": -24.99945068359375, "global_step": 255371, "epoch": 3076} {"train_loss": -25.163137435913086, "global_step": 255372, "epoch": 3076} {"train_loss": -25.326547622680664, "global_step": 255373, "epoch": 3076} {"train_loss": -25.039825439453125, "global_step": 255374, "epoch": 3076} {"train_loss": -24.951080322265625, "global_step": 255375, "epoch": 3076} {"train_loss": -24.974782943725586, "global_step": 255376, "epoch": 3076} {"train_loss": -24.83770179748535, "global_step": 255377, "epoch": 3076} {"train_loss": -24.948137283325195, "global_step": 255378, "epoch": 3076} {"train_loss": -25.34067726135254, "global_step": 255379, "epoch": 3076} {"train_loss": -25.088407516479492, "global_step": 255380, "epoch": 3076} {"train_loss": -25.184587478637695, "global_step": 255381, "epoch": 3076} {"train_loss": -25.57573890686035, "global_step": 255382, "epoch": 3076} {"train_loss": -24.877050399780273, "global_step": 255383, "epoch": 3076} {"train_loss": -24.971622467041016, "global_step": 255384, "epoch": 3076} {"train_loss": -24.886747360229492, "global_step": 255385, "epoch": 3076} {"train_loss": -24.972829818725586, "global_step": 255386, "epoch": 3076} {"train_loss": -25.002933502197266, "global_step": 255387, "epoch": 3076} {"train_loss": -25.481107711791992, "global_step": 255388, "epoch": 3076} {"train_loss": -25.07737159729004, "global_step": 255389, "epoch": 3076} {"train_loss": -24.98439724474068, "global_step": 255390, "epoch": 3076, "val_loss": 7157167.0} {"train_loss": -24.38149642944336, "global_step": 255391, "epoch": 3077} {"train_loss": -24.343387603759766, "global_step": 255392, "epoch": 3077} {"train_loss": -24.503339767456055, "global_step": 255393, "epoch": 3077} {"train_loss": -24.383438110351562, "global_step": 255394, "epoch": 3077} {"train_loss": -24.897140502929688, "global_step": 255395, "epoch": 3077} {"train_loss": -24.923242568969727, "global_step": 255396, "epoch": 3077} {"train_loss": -24.280517578125, "global_step": 255397, "epoch": 3077} {"train_loss": -24.971717834472656, "global_step": 255398, "epoch": 3077} {"train_loss": -24.65549087524414, "global_step": 255399, "epoch": 3077} {"train_loss": -24.429412841796875, "global_step": 255400, "epoch": 3077} {"train_loss": -24.265640258789062, "global_step": 255401, "epoch": 3077} {"train_loss": -24.921764373779297, "global_step": 255402, "epoch": 3077} {"train_loss": -24.251901626586914, "global_step": 255403, "epoch": 3077} {"train_loss": -24.87497329711914, "global_step": 255404, "epoch": 3077} {"train_loss": -24.745487213134766, "global_step": 255405, "epoch": 3077} {"train_loss": -24.675451278686523, "global_step": 255406, "epoch": 3077} {"train_loss": -24.43044090270996, "global_step": 255407, "epoch": 3077} {"train_loss": -24.413070678710938, "global_step": 255408, "epoch": 3077} {"train_loss": -24.764570236206055, "global_step": 255409, "epoch": 3077} {"train_loss": -24.55141258239746, "global_step": 255410, "epoch": 3077} {"train_loss": -25.051250457763672, "global_step": 255411, "epoch": 3077} {"train_loss": -24.938369750976562, "global_step": 255412, "epoch": 3077} {"train_loss": -24.712377548217773, "global_step": 255413, "epoch": 3077} {"train_loss": -24.755861282348633, "global_step": 255414, "epoch": 3077} {"train_loss": -24.9924373626709, "global_step": 255415, "epoch": 3077} {"train_loss": -24.922849655151367, "global_step": 255416, "epoch": 3077} {"train_loss": -24.8558406829834, "global_step": 255417, "epoch": 3077} {"train_loss": -25.096349716186523, "global_step": 255418, "epoch": 3077} {"train_loss": -25.040836334228516, "global_step": 255419, "epoch": 3077} {"train_loss": -24.84432029724121, "global_step": 255420, "epoch": 3077} {"train_loss": -24.8359375, "global_step": 255421, "epoch": 3077} {"train_loss": -25.139341354370117, "global_step": 255422, "epoch": 3077} {"train_loss": -25.11786651611328, "global_step": 255423, "epoch": 3077} {"train_loss": -25.146203994750977, "global_step": 255424, "epoch": 3077} {"train_loss": -24.955585479736328, "global_step": 255425, "epoch": 3077} {"train_loss": -25.044851303100586, "global_step": 255426, "epoch": 3077} {"train_loss": -25.201261520385742, "global_step": 255427, "epoch": 3077} {"train_loss": -25.16131591796875, "global_step": 255428, "epoch": 3077} {"train_loss": -25.32952117919922, "global_step": 255429, "epoch": 3077} {"train_loss": -25.226953506469727, "global_step": 255430, "epoch": 3077} {"train_loss": -25.079967498779297, "global_step": 255431, "epoch": 3077} {"train_loss": -25.468420028686523, "global_step": 255432, "epoch": 3077} {"train_loss": -25.04612922668457, "global_step": 255433, "epoch": 3077} {"train_loss": -25.242076873779297, "global_step": 255434, "epoch": 3077} {"train_loss": -24.756439208984375, "global_step": 255435, "epoch": 3077} {"train_loss": -25.13568687438965, "global_step": 255436, "epoch": 3077} {"train_loss": -25.366260528564453, "global_step": 255437, "epoch": 3077} {"train_loss": -25.48995018005371, "global_step": 255438, "epoch": 3077} {"train_loss": -25.159326553344727, "global_step": 255439, "epoch": 3077} {"train_loss": -25.4099063873291, "global_step": 255440, "epoch": 3077} {"train_loss": -25.257410049438477, "global_step": 255441, "epoch": 3077} {"train_loss": -25.4007511138916, "global_step": 255442, "epoch": 3077} {"train_loss": -24.70110511779785, "global_step": 255443, "epoch": 3077} {"train_loss": -25.490713119506836, "global_step": 255444, "epoch": 3077} {"train_loss": -25.092851638793945, "global_step": 255445, "epoch": 3077} {"train_loss": -24.9084529876709, "global_step": 255446, "epoch": 3077} {"train_loss": -25.001087188720703, "global_step": 255447, "epoch": 3077} {"train_loss": -25.223546981811523, "global_step": 255448, "epoch": 3077} {"train_loss": -24.914493560791016, "global_step": 255449, "epoch": 3077} {"train_loss": -25.025745391845703, "global_step": 255450, "epoch": 3077} {"train_loss": -24.940692901611328, "global_step": 255451, "epoch": 3077} {"train_loss": -25.192068099975586, "global_step": 255452, "epoch": 3077} {"train_loss": -25.17963218688965, "global_step": 255453, "epoch": 3077} {"train_loss": -24.65646743774414, "global_step": 255454, "epoch": 3077} {"train_loss": -24.810583114624023, "global_step": 255455, "epoch": 3077} {"train_loss": -25.00583267211914, "global_step": 255456, "epoch": 3077} {"train_loss": -24.349578857421875, "global_step": 255457, "epoch": 3077} {"train_loss": -24.96858787536621, "global_step": 255458, "epoch": 3077} {"train_loss": -24.924217224121094, "global_step": 255459, "epoch": 3077} {"train_loss": -25.213214874267578, "global_step": 255460, "epoch": 3077} {"train_loss": -24.96906089782715, "global_step": 255461, "epoch": 3077} {"train_loss": -24.947769165039062, "global_step": 255462, "epoch": 3077} {"train_loss": -24.868207931518555, "global_step": 255463, "epoch": 3077} {"train_loss": -24.816497802734375, "global_step": 255464, "epoch": 3077} {"train_loss": -24.67647361755371, "global_step": 255465, "epoch": 3077} {"train_loss": -25.153461456298828, "global_step": 255466, "epoch": 3077} {"train_loss": -25.17439079284668, "global_step": 255467, "epoch": 3077} {"train_loss": -24.82139015197754, "global_step": 255468, "epoch": 3077} {"train_loss": -24.894210815429688, "global_step": 255469, "epoch": 3077} {"train_loss": -25.373668670654297, "global_step": 255470, "epoch": 3077} {"train_loss": -25.11750602722168, "global_step": 255471, "epoch": 3077} {"train_loss": -24.824270248413086, "global_step": 255472, "epoch": 3077} {"train_loss": -24.933192999966174, "global_step": 255473, "epoch": 3077, "val_loss": 6838131.0} {"train_loss": -24.919750213623047, "global_step": 255474, "epoch": 3078} {"train_loss": -25.215200424194336, "global_step": 255475, "epoch": 3078} {"train_loss": -24.815214157104492, "global_step": 255476, "epoch": 3078} {"train_loss": -25.2587833404541, "global_step": 255477, "epoch": 3078} {"train_loss": -25.015430450439453, "global_step": 255478, "epoch": 3078} {"train_loss": -24.735933303833008, "global_step": 255479, "epoch": 3078} {"train_loss": -24.68515396118164, "global_step": 255480, "epoch": 3078} {"train_loss": -25.075260162353516, "global_step": 255481, "epoch": 3078} {"train_loss": -25.008878707885742, "global_step": 255482, "epoch": 3078} {"train_loss": -24.751392364501953, "global_step": 255483, "epoch": 3078} {"train_loss": -25.13492774963379, "global_step": 255484, "epoch": 3078} {"train_loss": -25.263769149780273, "global_step": 255485, "epoch": 3078} {"train_loss": -25.258209228515625, "global_step": 255486, "epoch": 3078} {"train_loss": -24.787185668945312, "global_step": 255487, "epoch": 3078} {"train_loss": -24.577836990356445, "global_step": 255488, "epoch": 3078} {"train_loss": -24.84854507446289, "global_step": 255489, "epoch": 3078} {"train_loss": -25.345294952392578, "global_step": 255490, "epoch": 3078} {"train_loss": -24.87533187866211, "global_step": 255491, "epoch": 3078} {"train_loss": -24.946081161499023, "global_step": 255492, "epoch": 3078} {"train_loss": -25.01296043395996, "global_step": 255493, "epoch": 3078} {"train_loss": -25.100637435913086, "global_step": 255494, "epoch": 3078} {"train_loss": -24.9141788482666, "global_step": 255495, "epoch": 3078} {"train_loss": -25.07716941833496, "global_step": 255496, "epoch": 3078} {"train_loss": -25.015003204345703, "global_step": 255497, "epoch": 3078} {"train_loss": -25.178287506103516, "global_step": 255498, "epoch": 3078} {"train_loss": -25.144929885864258, "global_step": 255499, "epoch": 3078} {"train_loss": -24.8582763671875, "global_step": 255500, "epoch": 3078} {"train_loss": -25.35062026977539, "global_step": 255501, "epoch": 3078} {"train_loss": -25.359861373901367, "global_step": 255502, "epoch": 3078} {"train_loss": -25.312143325805664, "global_step": 255503, "epoch": 3078} {"train_loss": -25.335556030273438, "global_step": 255504, "epoch": 3078} {"train_loss": -25.178237915039062, "global_step": 255505, "epoch": 3078} {"train_loss": -25.364688873291016, "global_step": 255506, "epoch": 3078} {"train_loss": -25.399208068847656, "global_step": 255507, "epoch": 3078} {"train_loss": -25.207124710083008, "global_step": 255508, "epoch": 3078} {"train_loss": -25.168798446655273, "global_step": 255509, "epoch": 3078} {"train_loss": -25.274307250976562, "global_step": 255510, "epoch": 3078} {"train_loss": -25.421127319335938, "global_step": 255511, "epoch": 3078} {"train_loss": -25.104867935180664, "global_step": 255512, "epoch": 3078} {"train_loss": -25.251401901245117, "global_step": 255513, "epoch": 3078} {"train_loss": -25.066539764404297, "global_step": 255514, "epoch": 3078} {"train_loss": -25.06583595275879, "global_step": 255515, "epoch": 3078} {"train_loss": -25.16167449951172, "global_step": 255516, "epoch": 3078} {"train_loss": -25.25215721130371, "global_step": 255517, "epoch": 3078} {"train_loss": -24.97508430480957, "global_step": 255518, "epoch": 3078} {"train_loss": -24.649545669555664, "global_step": 255519, "epoch": 3078} {"train_loss": -24.52030372619629, "global_step": 255520, "epoch": 3078} {"train_loss": -24.663482666015625, "global_step": 255521, "epoch": 3078} {"train_loss": -24.903554916381836, "global_step": 255522, "epoch": 3078} {"train_loss": -25.079389572143555, "global_step": 255523, "epoch": 3078} {"train_loss": -24.771656036376953, "global_step": 255524, "epoch": 3078} {"train_loss": -24.518463134765625, "global_step": 255525, "epoch": 3078} {"train_loss": -24.574243545532227, "global_step": 255526, "epoch": 3078} {"train_loss": -24.644168853759766, "global_step": 255527, "epoch": 3078} {"train_loss": -24.59105682373047, "global_step": 255528, "epoch": 3078} {"train_loss": -24.886146545410156, "global_step": 255529, "epoch": 3078} {"train_loss": -24.62497329711914, "global_step": 255530, "epoch": 3078} {"train_loss": -24.57623863220215, "global_step": 255531, "epoch": 3078} {"train_loss": -24.953781127929688, "global_step": 255532, "epoch": 3078} {"train_loss": -24.576650619506836, "global_step": 255533, "epoch": 3078} {"train_loss": -24.44597816467285, "global_step": 255534, "epoch": 3078} {"train_loss": -25.03724479675293, "global_step": 255535, "epoch": 3078} {"train_loss": -24.85544204711914, "global_step": 255536, "epoch": 3078} {"train_loss": -24.960180282592773, "global_step": 255537, "epoch": 3078} {"train_loss": -25.041929244995117, "global_step": 255538, "epoch": 3078} {"train_loss": -24.812122344970703, "global_step": 255539, "epoch": 3078} {"train_loss": -24.856027603149414, "global_step": 255540, "epoch": 3078} {"train_loss": -25.153295516967773, "global_step": 255541, "epoch": 3078} {"train_loss": -25.212820053100586, "global_step": 255542, "epoch": 3078} {"train_loss": -24.824411392211914, "global_step": 255543, "epoch": 3078} {"train_loss": -24.988296508789062, "global_step": 255544, "epoch": 3078} {"train_loss": -24.915878295898438, "global_step": 255545, "epoch": 3078} {"train_loss": -25.097410202026367, "global_step": 255546, "epoch": 3078} {"train_loss": -24.9072265625, "global_step": 255547, "epoch": 3078} {"train_loss": -25.073556900024414, "global_step": 255548, "epoch": 3078} {"train_loss": -25.05396842956543, "global_step": 255549, "epoch": 3078} {"train_loss": -25.22743797302246, "global_step": 255550, "epoch": 3078} {"train_loss": -25.011978149414062, "global_step": 255551, "epoch": 3078} {"train_loss": -24.960081100463867, "global_step": 255552, "epoch": 3078} {"train_loss": -25.207969665527344, "global_step": 255553, "epoch": 3078} {"train_loss": -25.15018081665039, "global_step": 255554, "epoch": 3078} {"train_loss": -25.130544662475586, "global_step": 255555, "epoch": 3078} {"train_loss": -24.99275216711573, "global_step": 255556, "epoch": 3078, "val_loss": 6855777.0} {"train_loss": -24.344396591186523, "global_step": 255557, "epoch": 3079} {"train_loss": -24.776052474975586, "global_step": 255558, "epoch": 3079} {"train_loss": -24.651464462280273, "global_step": 255559, "epoch": 3079} {"train_loss": -24.59254264831543, "global_step": 255560, "epoch": 3079} {"train_loss": -24.88777732849121, "global_step": 255561, "epoch": 3079} {"train_loss": -24.777851104736328, "global_step": 255562, "epoch": 3079} {"train_loss": -24.808103561401367, "global_step": 255563, "epoch": 3079} {"train_loss": -24.783212661743164, "global_step": 255564, "epoch": 3079} {"train_loss": -25.044723510742188, "global_step": 255565, "epoch": 3079} {"train_loss": -25.0648250579834, "global_step": 255566, "epoch": 3079} {"train_loss": -24.99432945251465, "global_step": 255567, "epoch": 3079} {"train_loss": -24.88547134399414, "global_step": 255568, "epoch": 3079} {"train_loss": -24.5367488861084, "global_step": 255569, "epoch": 3079} {"train_loss": -24.046873092651367, "global_step": 255570, "epoch": 3079} {"train_loss": -24.787084579467773, "global_step": 255571, "epoch": 3079} {"train_loss": -25.11885643005371, "global_step": 255572, "epoch": 3079} {"train_loss": -24.608701705932617, "global_step": 255573, "epoch": 3079} {"train_loss": -24.50359535217285, "global_step": 255574, "epoch": 3079} {"train_loss": -25.0388240814209, "global_step": 255575, "epoch": 3079} {"train_loss": -25.111682891845703, "global_step": 255576, "epoch": 3079} {"train_loss": -24.88925552368164, "global_step": 255577, "epoch": 3079} {"train_loss": -24.736085891723633, "global_step": 255578, "epoch": 3079} {"train_loss": -24.966249465942383, "global_step": 255579, "epoch": 3079} {"train_loss": -24.84050941467285, "global_step": 255580, "epoch": 3079} {"train_loss": -25.20992088317871, "global_step": 255581, "epoch": 3079} {"train_loss": -25.10544204711914, "global_step": 255582, "epoch": 3079} {"train_loss": -25.315458297729492, "global_step": 255583, "epoch": 3079} {"train_loss": -24.93238067626953, "global_step": 255584, "epoch": 3079} {"train_loss": -25.046180725097656, "global_step": 255585, "epoch": 3079} {"train_loss": -25.01331901550293, "global_step": 255586, "epoch": 3079} {"train_loss": -24.877111434936523, "global_step": 255587, "epoch": 3079} {"train_loss": -25.345670700073242, "global_step": 255588, "epoch": 3079} {"train_loss": -25.66969108581543, "global_step": 255589, "epoch": 3079} {"train_loss": -25.326261520385742, "global_step": 255590, "epoch": 3079} {"train_loss": -25.125600814819336, "global_step": 255591, "epoch": 3079} {"train_loss": -25.458450317382812, "global_step": 255592, "epoch": 3079} {"train_loss": -25.314908981323242, "global_step": 255593, "epoch": 3079} {"train_loss": -25.41095542907715, "global_step": 255594, "epoch": 3079} {"train_loss": -25.013490676879883, "global_step": 255595, "epoch": 3079} {"train_loss": -25.568843841552734, "global_step": 255596, "epoch": 3079} {"train_loss": -25.010665893554688, "global_step": 255597, "epoch": 3079} {"train_loss": -25.267438888549805, "global_step": 255598, "epoch": 3079} {"train_loss": -24.902812957763672, "global_step": 255599, "epoch": 3079} {"train_loss": -25.127790451049805, "global_step": 255600, "epoch": 3079} {"train_loss": -25.127086639404297, "global_step": 255601, "epoch": 3079} {"train_loss": -24.95467185974121, "global_step": 255602, "epoch": 3079} {"train_loss": -25.356077194213867, "global_step": 255603, "epoch": 3079} {"train_loss": -25.308822631835938, "global_step": 255604, "epoch": 3079} {"train_loss": -25.423105239868164, "global_step": 255605, "epoch": 3079} {"train_loss": -24.85943603515625, "global_step": 255606, "epoch": 3079} {"train_loss": -25.092496871948242, "global_step": 255607, "epoch": 3079} {"train_loss": -25.500947952270508, "global_step": 255608, "epoch": 3079} {"train_loss": -25.427719116210938, "global_step": 255609, "epoch": 3079} {"train_loss": -25.15497589111328, "global_step": 255610, "epoch": 3079} {"train_loss": -25.261960983276367, "global_step": 255611, "epoch": 3079} {"train_loss": -25.511825561523438, "global_step": 255612, "epoch": 3079} {"train_loss": -25.64890480041504, "global_step": 255613, "epoch": 3079} {"train_loss": -25.6698055267334, "global_step": 255614, "epoch": 3079} {"train_loss": -25.190122604370117, "global_step": 255615, "epoch": 3079} {"train_loss": -25.18282127380371, "global_step": 255616, "epoch": 3079} {"train_loss": -24.689590454101562, "global_step": 255617, "epoch": 3079} {"train_loss": -24.560150146484375, "global_step": 255618, "epoch": 3079} {"train_loss": -24.89972496032715, "global_step": 255619, "epoch": 3079} {"train_loss": -25.2489070892334, "global_step": 255620, "epoch": 3079} {"train_loss": -24.994245529174805, "global_step": 255621, "epoch": 3079} {"train_loss": -25.1893310546875, "global_step": 255622, "epoch": 3079} {"train_loss": -24.730667114257812, "global_step": 255623, "epoch": 3079} {"train_loss": -25.246891021728516, "global_step": 255624, "epoch": 3079} {"train_loss": -24.903993606567383, "global_step": 255625, "epoch": 3079} {"train_loss": -25.13127899169922, "global_step": 255626, "epoch": 3079} {"train_loss": -24.8882999420166, "global_step": 255627, "epoch": 3079} {"train_loss": -24.763425827026367, "global_step": 255628, "epoch": 3079} {"train_loss": -25.1043701171875, "global_step": 255629, "epoch": 3079} {"train_loss": -25.01190185546875, "global_step": 255630, "epoch": 3079} {"train_loss": -24.847517013549805, "global_step": 255631, "epoch": 3079} {"train_loss": -24.8669490814209, "global_step": 255632, "epoch": 3079} {"train_loss": -24.9752254486084, "global_step": 255633, "epoch": 3079} {"train_loss": -24.513700485229492, "global_step": 255634, "epoch": 3079} {"train_loss": -24.951866149902344, "global_step": 255635, "epoch": 3079} {"train_loss": -25.20543670654297, "global_step": 255636, "epoch": 3079} {"train_loss": -24.715967178344727, "global_step": 255637, "epoch": 3079} {"train_loss": -24.843481063842773, "global_step": 255638, "epoch": 3079} {"train_loss": -25.016541883169886, "global_step": 255639, "epoch": 3079, "val_loss": 6863550.0} {"train_loss": -24.37581443786621, "global_step": 255640, "epoch": 3080} {"train_loss": -24.77765655517578, "global_step": 255641, "epoch": 3080} {"train_loss": -24.685230255126953, "global_step": 255642, "epoch": 3080} {"train_loss": -25.028244018554688, "global_step": 255643, "epoch": 3080} {"train_loss": -24.963050842285156, "global_step": 255644, "epoch": 3080} {"train_loss": -24.962621688842773, "global_step": 255645, "epoch": 3080} {"train_loss": -25.034101486206055, "global_step": 255646, "epoch": 3080} {"train_loss": -25.01321792602539, "global_step": 255647, "epoch": 3080} {"train_loss": -24.752368927001953, "global_step": 255648, "epoch": 3080} {"train_loss": -24.896713256835938, "global_step": 255649, "epoch": 3080} {"train_loss": -25.053089141845703, "global_step": 255650, "epoch": 3080} {"train_loss": -25.103445053100586, "global_step": 255651, "epoch": 3080} {"train_loss": -24.87462615966797, "global_step": 255652, "epoch": 3080} {"train_loss": -25.00282859802246, "global_step": 255653, "epoch": 3080} {"train_loss": -25.18147087097168, "global_step": 255654, "epoch": 3080} {"train_loss": -25.000429153442383, "global_step": 255655, "epoch": 3080} {"train_loss": -24.98517417907715, "global_step": 255656, "epoch": 3080} {"train_loss": -25.084165573120117, "global_step": 255657, "epoch": 3080} {"train_loss": -24.991634368896484, "global_step": 255658, "epoch": 3080} {"train_loss": -25.13191032409668, "global_step": 255659, "epoch": 3080} {"train_loss": -25.15522003173828, "global_step": 255660, "epoch": 3080} {"train_loss": -24.977914810180664, "global_step": 255661, "epoch": 3080} {"train_loss": -25.077835083007812, "global_step": 255662, "epoch": 3080} {"train_loss": -25.12764549255371, "global_step": 255663, "epoch": 3080} {"train_loss": -24.989572525024414, "global_step": 255664, "epoch": 3080} {"train_loss": -25.127511978149414, "global_step": 255665, "epoch": 3080} {"train_loss": -24.88649559020996, "global_step": 255666, "epoch": 3080} {"train_loss": -24.698877334594727, "global_step": 255667, "epoch": 3080} {"train_loss": -24.958890914916992, "global_step": 255668, "epoch": 3080} {"train_loss": -24.70808982849121, "global_step": 255669, "epoch": 3080} {"train_loss": -24.75765037536621, "global_step": 255670, "epoch": 3080} {"train_loss": -25.06007194519043, "global_step": 255671, "epoch": 3080} {"train_loss": -25.093290328979492, "global_step": 255672, "epoch": 3080} {"train_loss": -24.975046157836914, "global_step": 255673, "epoch": 3080} {"train_loss": -25.06589126586914, "global_step": 255674, "epoch": 3080} {"train_loss": -25.412626266479492, "global_step": 255675, "epoch": 3080} {"train_loss": -24.764827728271484, "global_step": 255676, "epoch": 3080} {"train_loss": -25.308683395385742, "global_step": 255677, "epoch": 3080} {"train_loss": -25.17840003967285, "global_step": 255678, "epoch": 3080} {"train_loss": -24.93537712097168, "global_step": 255679, "epoch": 3080} {"train_loss": -25.03523826599121, "global_step": 255680, "epoch": 3080} {"train_loss": -25.30866241455078, "global_step": 255681, "epoch": 3080} {"train_loss": -25.151960372924805, "global_step": 255682, "epoch": 3080} {"train_loss": -24.982566833496094, "global_step": 255683, "epoch": 3080} {"train_loss": -24.968448638916016, "global_step": 255684, "epoch": 3080} {"train_loss": -25.18726921081543, "global_step": 255685, "epoch": 3080} {"train_loss": -25.199127197265625, "global_step": 255686, "epoch": 3080} {"train_loss": -24.968393325805664, "global_step": 255687, "epoch": 3080} {"train_loss": -24.884557723999023, "global_step": 255688, "epoch": 3080} {"train_loss": -25.207088470458984, "global_step": 255689, "epoch": 3080} {"train_loss": -24.939207077026367, "global_step": 255690, "epoch": 3080} {"train_loss": -24.971572875976562, "global_step": 255691, "epoch": 3080} {"train_loss": -25.326366424560547, "global_step": 255692, "epoch": 3080} {"train_loss": -24.943185806274414, "global_step": 255693, "epoch": 3080} {"train_loss": -25.292205810546875, "global_step": 255694, "epoch": 3080} {"train_loss": -25.010303497314453, "global_step": 255695, "epoch": 3080} {"train_loss": -25.355056762695312, "global_step": 255696, "epoch": 3080} {"train_loss": -25.218740463256836, "global_step": 255697, "epoch": 3080} {"train_loss": -25.05584144592285, "global_step": 255698, "epoch": 3080} {"train_loss": -25.109539031982422, "global_step": 255699, "epoch": 3080} {"train_loss": -25.288503646850586, "global_step": 255700, "epoch": 3080} {"train_loss": -25.325632095336914, "global_step": 255701, "epoch": 3080} {"train_loss": -24.971723556518555, "global_step": 255702, "epoch": 3080} {"train_loss": -24.889463424682617, "global_step": 255703, "epoch": 3080} {"train_loss": -24.5871639251709, "global_step": 255704, "epoch": 3080} {"train_loss": -24.627531051635742, "global_step": 255705, "epoch": 3080} {"train_loss": -25.441240310668945, "global_step": 255706, "epoch": 3080} {"train_loss": -24.7374210357666, "global_step": 255707, "epoch": 3080} {"train_loss": -24.406885147094727, "global_step": 255708, "epoch": 3080} {"train_loss": -24.903573989868164, "global_step": 255709, "epoch": 3080} {"train_loss": -24.565439224243164, "global_step": 255710, "epoch": 3080} {"train_loss": -24.998300552368164, "global_step": 255711, "epoch": 3080} {"train_loss": -24.32205581665039, "global_step": 255712, "epoch": 3080} {"train_loss": -24.975202560424805, "global_step": 255713, "epoch": 3080} {"train_loss": -24.265806198120117, "global_step": 255714, "epoch": 3080} {"train_loss": -24.568246841430664, "global_step": 255715, "epoch": 3080} {"train_loss": -25.09363555908203, "global_step": 255716, "epoch": 3080} {"train_loss": -24.966184616088867, "global_step": 255717, "epoch": 3080} {"train_loss": -24.625837326049805, "global_step": 255718, "epoch": 3080} {"train_loss": -24.903013229370117, "global_step": 255719, "epoch": 3080} {"train_loss": -24.819629669189453, "global_step": 255720, "epoch": 3080} {"train_loss": -24.656452178955078, "global_step": 255721, "epoch": 3080} {"train_loss": -24.97892476277179, "global_step": 255722, "epoch": 3080, "val_loss": 7019551.0} {"train_loss": -24.421873092651367, "global_step": 255723, "epoch": 3081} {"train_loss": -24.467140197753906, "global_step": 255724, "epoch": 3081} {"train_loss": -24.47515869140625, "global_step": 255725, "epoch": 3081} {"train_loss": -24.379352569580078, "global_step": 255726, "epoch": 3081} {"train_loss": -24.56602668762207, "global_step": 255727, "epoch": 3081} {"train_loss": -24.324951171875, "global_step": 255728, "epoch": 3081} {"train_loss": -24.486133575439453, "global_step": 255729, "epoch": 3081} {"train_loss": -24.805078506469727, "global_step": 255730, "epoch": 3081} {"train_loss": -24.66366958618164, "global_step": 255731, "epoch": 3081} {"train_loss": -24.254791259765625, "global_step": 255732, "epoch": 3081} {"train_loss": -24.602710723876953, "global_step": 255733, "epoch": 3081} {"train_loss": -25.13429832458496, "global_step": 255734, "epoch": 3081} {"train_loss": -24.987201690673828, "global_step": 255735, "epoch": 3081} {"train_loss": -24.668203353881836, "global_step": 255736, "epoch": 3081} {"train_loss": -25.01205062866211, "global_step": 255737, "epoch": 3081} {"train_loss": -24.721033096313477, "global_step": 255738, "epoch": 3081} {"train_loss": -24.361326217651367, "global_step": 255739, "epoch": 3081} {"train_loss": -24.859521865844727, "global_step": 255740, "epoch": 3081} {"train_loss": -24.713621139526367, "global_step": 255741, "epoch": 3081} {"train_loss": -24.957101821899414, "global_step": 255742, "epoch": 3081} {"train_loss": -24.58523941040039, "global_step": 255743, "epoch": 3081} {"train_loss": -25.14236068725586, "global_step": 255744, "epoch": 3081} {"train_loss": -25.138263702392578, "global_step": 255745, "epoch": 3081} {"train_loss": -25.086654663085938, "global_step": 255746, "epoch": 3081} {"train_loss": -24.987804412841797, "global_step": 255747, "epoch": 3081} {"train_loss": -24.792394638061523, "global_step": 255748, "epoch": 3081} {"train_loss": -24.939773559570312, "global_step": 255749, "epoch": 3081} {"train_loss": -25.061859130859375, "global_step": 255750, "epoch": 3081} {"train_loss": -24.918798446655273, "global_step": 255751, "epoch": 3081} {"train_loss": -24.873943328857422, "global_step": 255752, "epoch": 3081} {"train_loss": -25.321544647216797, "global_step": 255753, "epoch": 3081} {"train_loss": -25.34720230102539, "global_step": 255754, "epoch": 3081} {"train_loss": -24.80535125732422, "global_step": 255755, "epoch": 3081} {"train_loss": -25.32039451599121, "global_step": 255756, "epoch": 3081} {"train_loss": -25.349843978881836, "global_step": 255757, "epoch": 3081} {"train_loss": -24.990610122680664, "global_step": 255758, "epoch": 3081} {"train_loss": -25.27925682067871, "global_step": 255759, "epoch": 3081} {"train_loss": -24.927396774291992, "global_step": 255760, "epoch": 3081} {"train_loss": -25.081636428833008, "global_step": 255761, "epoch": 3081} {"train_loss": -25.435110092163086, "global_step": 255762, "epoch": 3081} {"train_loss": -24.980844497680664, "global_step": 255763, "epoch": 3081} {"train_loss": -25.01848793029785, "global_step": 255764, "epoch": 3081} {"train_loss": -25.427173614501953, "global_step": 255765, "epoch": 3081} {"train_loss": -25.245868682861328, "global_step": 255766, "epoch": 3081} {"train_loss": -24.693714141845703, "global_step": 255767, "epoch": 3081} {"train_loss": -24.880050659179688, "global_step": 255768, "epoch": 3081} {"train_loss": -24.750600814819336, "global_step": 255769, "epoch": 3081} {"train_loss": -24.961767196655273, "global_step": 255770, "epoch": 3081} {"train_loss": -25.110595703125, "global_step": 255771, "epoch": 3081} {"train_loss": -25.054153442382812, "global_step": 255772, "epoch": 3081} {"train_loss": -25.440587997436523, "global_step": 255773, "epoch": 3081} {"train_loss": -25.102060317993164, "global_step": 255774, "epoch": 3081} {"train_loss": -25.073577880859375, "global_step": 255775, "epoch": 3081} {"train_loss": -25.15253257751465, "global_step": 255776, "epoch": 3081} {"train_loss": -25.036338806152344, "global_step": 255777, "epoch": 3081} {"train_loss": -24.802047729492188, "global_step": 255778, "epoch": 3081} {"train_loss": -24.840749740600586, "global_step": 255779, "epoch": 3081} {"train_loss": -25.212295532226562, "global_step": 255780, "epoch": 3081} {"train_loss": -24.67299461364746, "global_step": 255781, "epoch": 3081} {"train_loss": -25.174707412719727, "global_step": 255782, "epoch": 3081} {"train_loss": -24.968948364257812, "global_step": 255783, "epoch": 3081} {"train_loss": -24.808759689331055, "global_step": 255784, "epoch": 3081} {"train_loss": -25.28170394897461, "global_step": 255785, "epoch": 3081} {"train_loss": -25.011564254760742, "global_step": 255786, "epoch": 3081} {"train_loss": -25.019079208374023, "global_step": 255787, "epoch": 3081} {"train_loss": -25.087039947509766, "global_step": 255788, "epoch": 3081} {"train_loss": -25.331449508666992, "global_step": 255789, "epoch": 3081} {"train_loss": -25.017122268676758, "global_step": 255790, "epoch": 3081} {"train_loss": -24.798917770385742, "global_step": 255791, "epoch": 3081} {"train_loss": -25.229206085205078, "global_step": 255792, "epoch": 3081} {"train_loss": -25.37105369567871, "global_step": 255793, "epoch": 3081} {"train_loss": -25.39290428161621, "global_step": 255794, "epoch": 3081} {"train_loss": -25.173511505126953, "global_step": 255795, "epoch": 3081} {"train_loss": -24.854787826538086, "global_step": 255796, "epoch": 3081} {"train_loss": -25.040184020996094, "global_step": 255797, "epoch": 3081} {"train_loss": -25.158445358276367, "global_step": 255798, "epoch": 3081} {"train_loss": -25.10846519470215, "global_step": 255799, "epoch": 3081} {"train_loss": -25.482688903808594, "global_step": 255800, "epoch": 3081} {"train_loss": -25.198392868041992, "global_step": 255801, "epoch": 3081} {"train_loss": -25.501880645751953, "global_step": 255802, "epoch": 3081} {"train_loss": -25.00740623474121, "global_step": 255803, "epoch": 3081} {"train_loss": -25.15602684020996, "global_step": 255804, "epoch": 3081} {"train_loss": -24.98699647834502, "global_step": 255805, "epoch": 3081, "val_loss": 6853865.5} {"train_loss": -24.47022247314453, "global_step": 255806, "epoch": 3082} {"train_loss": -24.401273727416992, "global_step": 255807, "epoch": 3082} {"train_loss": -24.558109283447266, "global_step": 255808, "epoch": 3082} {"train_loss": -24.636831283569336, "global_step": 255809, "epoch": 3082} {"train_loss": -24.690563201904297, "global_step": 255810, "epoch": 3082} {"train_loss": -24.665149688720703, "global_step": 255811, "epoch": 3082} {"train_loss": -24.98139762878418, "global_step": 255812, "epoch": 3082} {"train_loss": -25.018274307250977, "global_step": 255813, "epoch": 3082} {"train_loss": -24.51026725769043, "global_step": 255814, "epoch": 3082} {"train_loss": -24.360702514648438, "global_step": 255815, "epoch": 3082} {"train_loss": -25.228315353393555, "global_step": 255816, "epoch": 3082} {"train_loss": -24.588422775268555, "global_step": 255817, "epoch": 3082} {"train_loss": -24.440185546875, "global_step": 255818, "epoch": 3082} {"train_loss": -24.938709259033203, "global_step": 255819, "epoch": 3082} {"train_loss": -24.878286361694336, "global_step": 255820, "epoch": 3082} {"train_loss": -24.481985092163086, "global_step": 255821, "epoch": 3082} {"train_loss": -24.42658233642578, "global_step": 255822, "epoch": 3082} {"train_loss": -24.698827743530273, "global_step": 255823, "epoch": 3082} {"train_loss": -24.55451011657715, "global_step": 255824, "epoch": 3082} {"train_loss": -24.90555763244629, "global_step": 255825, "epoch": 3082} {"train_loss": -24.879560470581055, "global_step": 255826, "epoch": 3082} {"train_loss": -24.66486930847168, "global_step": 255827, "epoch": 3082} {"train_loss": -24.976057052612305, "global_step": 255828, "epoch": 3082} {"train_loss": -24.567930221557617, "global_step": 255829, "epoch": 3082} {"train_loss": -24.69483184814453, "global_step": 255830, "epoch": 3082} {"train_loss": -24.771682739257812, "global_step": 255831, "epoch": 3082} {"train_loss": -25.018325805664062, "global_step": 255832, "epoch": 3082} {"train_loss": -24.632169723510742, "global_step": 255833, "epoch": 3082} {"train_loss": -25.339956283569336, "global_step": 255834, "epoch": 3082} {"train_loss": -24.9179744720459, "global_step": 255835, "epoch": 3082} {"train_loss": -25.1771297454834, "global_step": 255836, "epoch": 3082} {"train_loss": -24.99873161315918, "global_step": 255837, "epoch": 3082} {"train_loss": -25.544456481933594, "global_step": 255838, "epoch": 3082} {"train_loss": -25.137287139892578, "global_step": 255839, "epoch": 3082} {"train_loss": -25.237411499023438, "global_step": 255840, "epoch": 3082} {"train_loss": -24.84113311767578, "global_step": 255841, "epoch": 3082} {"train_loss": -25.043935775756836, "global_step": 255842, "epoch": 3082} {"train_loss": -25.37839126586914, "global_step": 255843, "epoch": 3082} {"train_loss": -25.324878692626953, "global_step": 255844, "epoch": 3082} {"train_loss": -25.155080795288086, "global_step": 255845, "epoch": 3082} {"train_loss": -24.815982818603516, "global_step": 255846, "epoch": 3082} {"train_loss": -25.078540802001953, "global_step": 255847, "epoch": 3082} {"train_loss": -25.245403289794922, "global_step": 255848, "epoch": 3082} {"train_loss": -24.998151779174805, "global_step": 255849, "epoch": 3082} {"train_loss": -25.180200576782227, "global_step": 255850, "epoch": 3082} {"train_loss": -24.949148178100586, "global_step": 255851, "epoch": 3082} {"train_loss": -25.145273208618164, "global_step": 255852, "epoch": 3082} {"train_loss": -24.98583984375, "global_step": 255853, "epoch": 3082} {"train_loss": -25.22486686706543, "global_step": 255854, "epoch": 3082} {"train_loss": -25.08748435974121, "global_step": 255855, "epoch": 3082} {"train_loss": -24.767709732055664, "global_step": 255856, "epoch": 3082} {"train_loss": -24.791709899902344, "global_step": 255857, "epoch": 3082} {"train_loss": -24.6037540435791, "global_step": 255858, "epoch": 3082} {"train_loss": -23.92777442932129, "global_step": 255859, "epoch": 3082} {"train_loss": -24.033248901367188, "global_step": 255860, "epoch": 3082} {"train_loss": -24.871610641479492, "global_step": 255861, "epoch": 3082} {"train_loss": -24.929798126220703, "global_step": 255862, "epoch": 3082} {"train_loss": -25.059961318969727, "global_step": 255863, "epoch": 3082} {"train_loss": -24.236919403076172, "global_step": 255864, "epoch": 3082} {"train_loss": -24.396703720092773, "global_step": 255865, "epoch": 3082} {"train_loss": -24.6160888671875, "global_step": 255866, "epoch": 3082} {"train_loss": -24.611297607421875, "global_step": 255867, "epoch": 3082} {"train_loss": -24.557876586914062, "global_step": 255868, "epoch": 3082} {"train_loss": -24.612401962280273, "global_step": 255869, "epoch": 3082} {"train_loss": -24.683996200561523, "global_step": 255870, "epoch": 3082} {"train_loss": -24.853973388671875, "global_step": 255871, "epoch": 3082} {"train_loss": -24.709598541259766, "global_step": 255872, "epoch": 3082} {"train_loss": -24.93678855895996, "global_step": 255873, "epoch": 3082} {"train_loss": -24.647443771362305, "global_step": 255874, "epoch": 3082} {"train_loss": -24.894994735717773, "global_step": 255875, "epoch": 3082} {"train_loss": -24.88400650024414, "global_step": 255876, "epoch": 3082} {"train_loss": -24.930103302001953, "global_step": 255877, "epoch": 3082} {"train_loss": -24.73361587524414, "global_step": 255878, "epoch": 3082} {"train_loss": -25.09271240234375, "global_step": 255879, "epoch": 3082} {"train_loss": -24.906599044799805, "global_step": 255880, "epoch": 3082} {"train_loss": -24.935306549072266, "global_step": 255881, "epoch": 3082} {"train_loss": -24.721668243408203, "global_step": 255882, "epoch": 3082} {"train_loss": -24.41988182067871, "global_step": 255883, "epoch": 3082} {"train_loss": -24.629281997680664, "global_step": 255884, "epoch": 3082} {"train_loss": -24.737783432006836, "global_step": 255885, "epoch": 3082} {"train_loss": -24.890079498291016, "global_step": 255886, "epoch": 3082} {"train_loss": -25.13907814025879, "global_step": 255887, "epoch": 3082} {"train_loss": -24.832040786743164, "global_step": 255888, "epoch": 3082, "val_loss": 6826750.0} {"train_loss": -24.445775985717773, "global_step": 255889, "epoch": 3083} {"train_loss": -24.589033126831055, "global_step": 255890, "epoch": 3083} {"train_loss": -24.980201721191406, "global_step": 255891, "epoch": 3083} {"train_loss": -24.6041259765625, "global_step": 255892, "epoch": 3083} {"train_loss": -24.834075927734375, "global_step": 255893, "epoch": 3083} {"train_loss": -24.410741806030273, "global_step": 255894, "epoch": 3083} {"train_loss": -24.3856201171875, "global_step": 255895, "epoch": 3083} {"train_loss": -24.760671615600586, "global_step": 255896, "epoch": 3083} {"train_loss": -25.001386642456055, "global_step": 255897, "epoch": 3083} {"train_loss": -25.102882385253906, "global_step": 255898, "epoch": 3083} {"train_loss": -25.282331466674805, "global_step": 255899, "epoch": 3083} {"train_loss": -25.038990020751953, "global_step": 255900, "epoch": 3083} {"train_loss": -24.99293327331543, "global_step": 255901, "epoch": 3083} {"train_loss": -24.951908111572266, "global_step": 255902, "epoch": 3083} {"train_loss": -24.979013442993164, "global_step": 255903, "epoch": 3083} {"train_loss": -24.96003532409668, "global_step": 255904, "epoch": 3083} {"train_loss": -24.923307418823242, "global_step": 255905, "epoch": 3083} {"train_loss": -25.275720596313477, "global_step": 255906, "epoch": 3083} {"train_loss": -25.121356964111328, "global_step": 255907, "epoch": 3083} {"train_loss": -24.907197952270508, "global_step": 255908, "epoch": 3083} {"train_loss": -25.24011993408203, "global_step": 255909, "epoch": 3083} {"train_loss": -25.274372100830078, "global_step": 255910, "epoch": 3083} {"train_loss": -25.006778717041016, "global_step": 255911, "epoch": 3083} {"train_loss": -24.81184959411621, "global_step": 255912, "epoch": 3083} {"train_loss": -25.298398971557617, "global_step": 255913, "epoch": 3083} {"train_loss": -25.061521530151367, "global_step": 255914, "epoch": 3083} {"train_loss": -25.217910766601562, "global_step": 255915, "epoch": 3083} {"train_loss": -25.420743942260742, "global_step": 255916, "epoch": 3083} {"train_loss": -24.889888763427734, "global_step": 255917, "epoch": 3083} {"train_loss": -25.45207977294922, "global_step": 255918, "epoch": 3083} {"train_loss": -25.071125030517578, "global_step": 255919, "epoch": 3083} {"train_loss": -24.888111114501953, "global_step": 255920, "epoch": 3083} {"train_loss": -25.09554100036621, "global_step": 255921, "epoch": 3083} {"train_loss": -25.520389556884766, "global_step": 255922, "epoch": 3083} {"train_loss": -25.31196403503418, "global_step": 255923, "epoch": 3083} {"train_loss": -25.255224227905273, "global_step": 255924, "epoch": 3083} {"train_loss": -24.87544059753418, "global_step": 255925, "epoch": 3083} {"train_loss": -24.85525894165039, "global_step": 255926, "epoch": 3083} {"train_loss": -24.56571388244629, "global_step": 255927, "epoch": 3083} {"train_loss": -25.58083152770996, "global_step": 255928, "epoch": 3083} {"train_loss": -25.381492614746094, "global_step": 255929, "epoch": 3083} {"train_loss": -24.997602462768555, "global_step": 255930, "epoch": 3083} {"train_loss": -24.786022186279297, "global_step": 255931, "epoch": 3083} {"train_loss": -25.281173706054688, "global_step": 255932, "epoch": 3083} {"train_loss": -25.014892578125, "global_step": 255933, "epoch": 3083} {"train_loss": -24.742591857910156, "global_step": 255934, "epoch": 3083} {"train_loss": -25.241256713867188, "global_step": 255935, "epoch": 3083} {"train_loss": -24.990650177001953, "global_step": 255936, "epoch": 3083} {"train_loss": -24.978809356689453, "global_step": 255937, "epoch": 3083} {"train_loss": -25.263587951660156, "global_step": 255938, "epoch": 3083} {"train_loss": -25.120634078979492, "global_step": 255939, "epoch": 3083} {"train_loss": -25.322324752807617, "global_step": 255940, "epoch": 3083} {"train_loss": -24.833850860595703, "global_step": 255941, "epoch": 3083} {"train_loss": -25.5871639251709, "global_step": 255942, "epoch": 3083} {"train_loss": -25.006046295166016, "global_step": 255943, "epoch": 3083} {"train_loss": -25.2166748046875, "global_step": 255944, "epoch": 3083} {"train_loss": -25.051420211791992, "global_step": 255945, "epoch": 3083} {"train_loss": -25.220300674438477, "global_step": 255946, "epoch": 3083} {"train_loss": -25.073200225830078, "global_step": 255947, "epoch": 3083} {"train_loss": -25.329313278198242, "global_step": 255948, "epoch": 3083} {"train_loss": -24.894163131713867, "global_step": 255949, "epoch": 3083} {"train_loss": -25.10062026977539, "global_step": 255950, "epoch": 3083} {"train_loss": -25.0252742767334, "global_step": 255951, "epoch": 3083} {"train_loss": -25.12353515625, "global_step": 255952, "epoch": 3083} {"train_loss": -25.415998458862305, "global_step": 255953, "epoch": 3083} {"train_loss": -25.360044479370117, "global_step": 255954, "epoch": 3083} {"train_loss": -25.3216609954834, "global_step": 255955, "epoch": 3083} {"train_loss": -25.196035385131836, "global_step": 255956, "epoch": 3083} {"train_loss": -25.49696922302246, "global_step": 255957, "epoch": 3083} {"train_loss": -25.087308883666992, "global_step": 255958, "epoch": 3083} {"train_loss": -25.54633140563965, "global_step": 255959, "epoch": 3083} {"train_loss": -25.38337516784668, "global_step": 255960, "epoch": 3083} {"train_loss": -25.31707191467285, "global_step": 255961, "epoch": 3083} {"train_loss": -25.156906127929688, "global_step": 255962, "epoch": 3083} {"train_loss": -25.364906311035156, "global_step": 255963, "epoch": 3083} {"train_loss": -25.09490394592285, "global_step": 255964, "epoch": 3083} {"train_loss": -24.971302032470703, "global_step": 255965, "epoch": 3083} {"train_loss": -25.25815200805664, "global_step": 255966, "epoch": 3083} {"train_loss": -25.122896194458008, "global_step": 255967, "epoch": 3083} {"train_loss": -25.570650100708008, "global_step": 255968, "epoch": 3083} {"train_loss": -25.429777145385742, "global_step": 255969, "epoch": 3083} {"train_loss": -25.628437042236328, "global_step": 255970, "epoch": 3083} {"train_loss": -25.106288932892213, "global_step": 255971, "epoch": 3083, "val_loss": 6840865.0} {"train_loss": -24.6156063079834, "global_step": 255972, "epoch": 3084} {"train_loss": -24.73808479309082, "global_step": 255973, "epoch": 3084} {"train_loss": -24.938854217529297, "global_step": 255974, "epoch": 3084} {"train_loss": -24.467275619506836, "global_step": 255975, "epoch": 3084} {"train_loss": -24.261842727661133, "global_step": 255976, "epoch": 3084} {"train_loss": -24.883848190307617, "global_step": 255977, "epoch": 3084} {"train_loss": -24.556608200073242, "global_step": 255978, "epoch": 3084} {"train_loss": -24.838058471679688, "global_step": 255979, "epoch": 3084} {"train_loss": -24.877059936523438, "global_step": 255980, "epoch": 3084} {"train_loss": -24.970548629760742, "global_step": 255981, "epoch": 3084} {"train_loss": -24.85013198852539, "global_step": 255982, "epoch": 3084} {"train_loss": -24.784372329711914, "global_step": 255983, "epoch": 3084} {"train_loss": -24.85470962524414, "global_step": 255984, "epoch": 3084} {"train_loss": -24.76252555847168, "global_step": 255985, "epoch": 3084} {"train_loss": -24.454965591430664, "global_step": 255986, "epoch": 3084} {"train_loss": -25.049957275390625, "global_step": 255987, "epoch": 3084} {"train_loss": -24.744123458862305, "global_step": 255988, "epoch": 3084} {"train_loss": -24.706422805786133, "global_step": 255989, "epoch": 3084} {"train_loss": -24.801244735717773, "global_step": 255990, "epoch": 3084} {"train_loss": -25.06875991821289, "global_step": 255991, "epoch": 3084} {"train_loss": -24.850128173828125, "global_step": 255992, "epoch": 3084} {"train_loss": -24.423513412475586, "global_step": 255993, "epoch": 3084} {"train_loss": -25.137609481811523, "global_step": 255994, "epoch": 3084} {"train_loss": -24.805524826049805, "global_step": 255995, "epoch": 3084} {"train_loss": -24.387399673461914, "global_step": 255996, "epoch": 3084} {"train_loss": -24.843069076538086, "global_step": 255997, "epoch": 3084} {"train_loss": -24.61844825744629, "global_step": 255998, "epoch": 3084} {"train_loss": -25.194318771362305, "global_step": 255999, "epoch": 3084} {"train_loss": -25.18659019470215, "global_step": 256000, "epoch": 3084} {"train_loss": -25.131311416625977, "global_step": 256001, "epoch": 3084} {"train_loss": -25.118091583251953, "global_step": 256002, "epoch": 3084} {"train_loss": -24.927200317382812, "global_step": 256003, "epoch": 3084} {"train_loss": -25.18122673034668, "global_step": 256004, "epoch": 3084} {"train_loss": -24.909500122070312, "global_step": 256005, "epoch": 3084} {"train_loss": -24.955514907836914, "global_step": 256006, "epoch": 3084} {"train_loss": -25.39703941345215, "global_step": 256007, "epoch": 3084} {"train_loss": -25.43053436279297, "global_step": 256008, "epoch": 3084} {"train_loss": -25.19000816345215, "global_step": 256009, "epoch": 3084} {"train_loss": -25.180002212524414, "global_step": 256010, "epoch": 3084} {"train_loss": -25.592132568359375, "global_step": 256011, "epoch": 3084} {"train_loss": -25.563993453979492, "global_step": 256012, "epoch": 3084} {"train_loss": -25.331632614135742, "global_step": 256013, "epoch": 3084} {"train_loss": -25.275205612182617, "global_step": 256014, "epoch": 3084} {"train_loss": -25.388463973999023, "global_step": 256015, "epoch": 3084} {"train_loss": -25.351221084594727, "global_step": 256016, "epoch": 3084} {"train_loss": -25.33740234375, "global_step": 256017, "epoch": 3084} {"train_loss": -25.36237907409668, "global_step": 256018, "epoch": 3084} {"train_loss": -25.6242733001709, "global_step": 256019, "epoch": 3084} {"train_loss": -25.171478271484375, "global_step": 256020, "epoch": 3084} {"train_loss": -24.96146011352539, "global_step": 256021, "epoch": 3084} {"train_loss": -25.057666778564453, "global_step": 256022, "epoch": 3084} {"train_loss": -25.11745262145996, "global_step": 256023, "epoch": 3084} {"train_loss": -25.283370971679688, "global_step": 256024, "epoch": 3084} {"train_loss": -25.00510597229004, "global_step": 256025, "epoch": 3084} {"train_loss": -24.7195987701416, "global_step": 256026, "epoch": 3084} {"train_loss": -24.878644943237305, "global_step": 256027, "epoch": 3084} {"train_loss": -24.942371368408203, "global_step": 256028, "epoch": 3084} {"train_loss": -25.14219093322754, "global_step": 256029, "epoch": 3084} {"train_loss": -24.8117733001709, "global_step": 256030, "epoch": 3084} {"train_loss": -25.05961799621582, "global_step": 256031, "epoch": 3084} {"train_loss": -25.271541595458984, "global_step": 256032, "epoch": 3084} {"train_loss": -25.256715774536133, "global_step": 256033, "epoch": 3084} {"train_loss": -25.00527000427246, "global_step": 256034, "epoch": 3084} {"train_loss": -25.25516128540039, "global_step": 256035, "epoch": 3084} {"train_loss": -24.9354190826416, "global_step": 256036, "epoch": 3084} {"train_loss": -25.294301986694336, "global_step": 256037, "epoch": 3084} {"train_loss": -25.11878776550293, "global_step": 256038, "epoch": 3084} {"train_loss": -25.00969696044922, "global_step": 256039, "epoch": 3084} {"train_loss": -25.3145809173584, "global_step": 256040, "epoch": 3084} {"train_loss": -25.25572967529297, "global_step": 256041, "epoch": 3084} {"train_loss": -25.177932739257812, "global_step": 256042, "epoch": 3084} {"train_loss": -25.241132736206055, "global_step": 256043, "epoch": 3084} {"train_loss": -24.967966079711914, "global_step": 256044, "epoch": 3084} {"train_loss": -24.89459800720215, "global_step": 256045, "epoch": 3084} {"train_loss": -25.140146255493164, "global_step": 256046, "epoch": 3084} {"train_loss": -24.999614715576172, "global_step": 256047, "epoch": 3084} {"train_loss": -24.93141746520996, "global_step": 256048, "epoch": 3084} {"train_loss": -24.415006637573242, "global_step": 256049, "epoch": 3084} {"train_loss": -24.24513053894043, "global_step": 256050, "epoch": 3084} {"train_loss": -24.64678192138672, "global_step": 256051, "epoch": 3084} {"train_loss": -25.036441802978516, "global_step": 256052, "epoch": 3084} {"train_loss": -24.875812530517578, "global_step": 256053, "epoch": 3084} {"train_loss": -25.001527372613012, "global_step": 256054, "epoch": 3084, "val_loss": 7124340.0} {"train_loss": -23.627164840698242, "global_step": 256055, "epoch": 3085} {"train_loss": -24.38400650024414, "global_step": 256056, "epoch": 3085} {"train_loss": -24.303394317626953, "global_step": 256057, "epoch": 3085} {"train_loss": -23.989517211914062, "global_step": 256058, "epoch": 3085} {"train_loss": -24.02018928527832, "global_step": 256059, "epoch": 3085} {"train_loss": -24.236454010009766, "global_step": 256060, "epoch": 3085} {"train_loss": -24.250778198242188, "global_step": 256061, "epoch": 3085} {"train_loss": -23.956748962402344, "global_step": 256062, "epoch": 3085} {"train_loss": -24.6051025390625, "global_step": 256063, "epoch": 3085} {"train_loss": -24.488428115844727, "global_step": 256064, "epoch": 3085} {"train_loss": -24.328523635864258, "global_step": 256065, "epoch": 3085} {"train_loss": -24.651424407958984, "global_step": 256066, "epoch": 3085} {"train_loss": -24.63947868347168, "global_step": 256067, "epoch": 3085} {"train_loss": -24.557886123657227, "global_step": 256068, "epoch": 3085} {"train_loss": -24.441741943359375, "global_step": 256069, "epoch": 3085} {"train_loss": -24.638166427612305, "global_step": 256070, "epoch": 3085} {"train_loss": -24.791107177734375, "global_step": 256071, "epoch": 3085} {"train_loss": -24.719257354736328, "global_step": 256072, "epoch": 3085} {"train_loss": -25.148113250732422, "global_step": 256073, "epoch": 3085} {"train_loss": -24.75690269470215, "global_step": 256074, "epoch": 3085} {"train_loss": -24.775508880615234, "global_step": 256075, "epoch": 3085} {"train_loss": -24.760711669921875, "global_step": 256076, "epoch": 3085} {"train_loss": -25.233861923217773, "global_step": 256077, "epoch": 3085} {"train_loss": -25.02647590637207, "global_step": 256078, "epoch": 3085} {"train_loss": -24.827146530151367, "global_step": 256079, "epoch": 3085} {"train_loss": -24.767305374145508, "global_step": 256080, "epoch": 3085} {"train_loss": -24.842618942260742, "global_step": 256081, "epoch": 3085} {"train_loss": -25.092554092407227, "global_step": 256082, "epoch": 3085} {"train_loss": -25.060911178588867, "global_step": 256083, "epoch": 3085} {"train_loss": -24.923337936401367, "global_step": 256084, "epoch": 3085} {"train_loss": -25.343175888061523, "global_step": 256085, "epoch": 3085} {"train_loss": -25.172178268432617, "global_step": 256086, "epoch": 3085} {"train_loss": -24.94322967529297, "global_step": 256087, "epoch": 3085} {"train_loss": -25.3630313873291, "global_step": 256088, "epoch": 3085} {"train_loss": -25.23731803894043, "global_step": 256089, "epoch": 3085} {"train_loss": -25.278644561767578, "global_step": 256090, "epoch": 3085} {"train_loss": -25.261924743652344, "global_step": 256091, "epoch": 3085} {"train_loss": -25.2836971282959, "global_step": 256092, "epoch": 3085} {"train_loss": -25.077245712280273, "global_step": 256093, "epoch": 3085} {"train_loss": -25.259082794189453, "global_step": 256094, "epoch": 3085} {"train_loss": -25.087827682495117, "global_step": 256095, "epoch": 3085} {"train_loss": -24.952085494995117, "global_step": 256096, "epoch": 3085} {"train_loss": -25.295490264892578, "global_step": 256097, "epoch": 3085} {"train_loss": -25.031789779663086, "global_step": 256098, "epoch": 3085} {"train_loss": -25.447599411010742, "global_step": 256099, "epoch": 3085} {"train_loss": -24.986570358276367, "global_step": 256100, "epoch": 3085} {"train_loss": -24.962961196899414, "global_step": 256101, "epoch": 3085} {"train_loss": -25.00409507751465, "global_step": 256102, "epoch": 3085} {"train_loss": -25.114866256713867, "global_step": 256103, "epoch": 3085} {"train_loss": -24.90968132019043, "global_step": 256104, "epoch": 3085} {"train_loss": -25.001440048217773, "global_step": 256105, "epoch": 3085} {"train_loss": -24.951356887817383, "global_step": 256106, "epoch": 3085} {"train_loss": -24.838613510131836, "global_step": 256107, "epoch": 3085} {"train_loss": -25.21824073791504, "global_step": 256108, "epoch": 3085} {"train_loss": -24.81270408630371, "global_step": 256109, "epoch": 3085} {"train_loss": -24.99030876159668, "global_step": 256110, "epoch": 3085} {"train_loss": -25.495147705078125, "global_step": 256111, "epoch": 3085} {"train_loss": -25.080747604370117, "global_step": 256112, "epoch": 3085} {"train_loss": -25.335933685302734, "global_step": 256113, "epoch": 3085} {"train_loss": -25.47464942932129, "global_step": 256114, "epoch": 3085} {"train_loss": -24.98341941833496, "global_step": 256115, "epoch": 3085} {"train_loss": -25.292903900146484, "global_step": 256116, "epoch": 3085} {"train_loss": -25.086610794067383, "global_step": 256117, "epoch": 3085} {"train_loss": -25.477291107177734, "global_step": 256118, "epoch": 3085} {"train_loss": -25.392345428466797, "global_step": 256119, "epoch": 3085} {"train_loss": -24.939722061157227, "global_step": 256120, "epoch": 3085} {"train_loss": -24.89954376220703, "global_step": 256121, "epoch": 3085} {"train_loss": -25.459150314331055, "global_step": 256122, "epoch": 3085} {"train_loss": -24.967100143432617, "global_step": 256123, "epoch": 3085} {"train_loss": -25.143352508544922, "global_step": 256124, "epoch": 3085} {"train_loss": -25.271408081054688, "global_step": 256125, "epoch": 3085} {"train_loss": -25.29880714416504, "global_step": 256126, "epoch": 3085} {"train_loss": -25.55091667175293, "global_step": 256127, "epoch": 3085} {"train_loss": -25.07175064086914, "global_step": 256128, "epoch": 3085} {"train_loss": -25.40060043334961, "global_step": 256129, "epoch": 3085} {"train_loss": -24.778818130493164, "global_step": 256130, "epoch": 3085} {"train_loss": -25.29720687866211, "global_step": 256131, "epoch": 3085} {"train_loss": -25.253103256225586, "global_step": 256132, "epoch": 3085} {"train_loss": -24.958791732788086, "global_step": 256133, "epoch": 3085} {"train_loss": -24.943973541259766, "global_step": 256134, "epoch": 3085} {"train_loss": -25.205257415771484, "global_step": 256135, "epoch": 3085} {"train_loss": -25.0551815032959, "global_step": 256136, "epoch": 3085} {"train_loss": -24.942433598529863, "global_step": 256137, "epoch": 3085, "val_loss": 6880660.0} {"train_loss": -22.32929801940918, "global_step": 256138, "epoch": 3086} {"train_loss": -22.4091854095459, "global_step": 256139, "epoch": 3086} {"train_loss": -23.60055160522461, "global_step": 256140, "epoch": 3086} {"train_loss": -23.015838623046875, "global_step": 256141, "epoch": 3086} {"train_loss": -23.791532516479492, "global_step": 256142, "epoch": 3086} {"train_loss": -23.898601531982422, "global_step": 256143, "epoch": 3086} {"train_loss": -23.655912399291992, "global_step": 256144, "epoch": 3086} {"train_loss": -24.499601364135742, "global_step": 256145, "epoch": 3086} {"train_loss": -24.066192626953125, "global_step": 256146, "epoch": 3086} {"train_loss": -24.26247215270996, "global_step": 256147, "epoch": 3086} {"train_loss": -24.231313705444336, "global_step": 256148, "epoch": 3086} {"train_loss": -24.118207931518555, "global_step": 256149, "epoch": 3086} {"train_loss": -24.43985366821289, "global_step": 256150, "epoch": 3086} {"train_loss": -24.58265495300293, "global_step": 256151, "epoch": 3086} {"train_loss": -24.324796676635742, "global_step": 256152, "epoch": 3086} {"train_loss": -24.385696411132812, "global_step": 256153, "epoch": 3086} {"train_loss": -24.521862030029297, "global_step": 256154, "epoch": 3086} {"train_loss": -24.46834945678711, "global_step": 256155, "epoch": 3086} {"train_loss": -24.292505264282227, "global_step": 256156, "epoch": 3086} {"train_loss": -24.108627319335938, "global_step": 256157, "epoch": 3086} {"train_loss": -24.517988204956055, "global_step": 256158, "epoch": 3086} {"train_loss": -24.5907039642334, "global_step": 256159, "epoch": 3086} {"train_loss": -24.886323928833008, "global_step": 256160, "epoch": 3086} {"train_loss": -24.783729553222656, "global_step": 256161, "epoch": 3086} {"train_loss": -24.811140060424805, "global_step": 256162, "epoch": 3086} {"train_loss": -24.605693817138672, "global_step": 256163, "epoch": 3086} {"train_loss": -24.404672622680664, "global_step": 256164, "epoch": 3086} {"train_loss": -24.898496627807617, "global_step": 256165, "epoch": 3086} {"train_loss": -24.638280868530273, "global_step": 256166, "epoch": 3086} {"train_loss": -24.807340621948242, "global_step": 256167, "epoch": 3086} {"train_loss": -24.864721298217773, "global_step": 256168, "epoch": 3086} {"train_loss": -24.959558486938477, "global_step": 256169, "epoch": 3086} {"train_loss": -25.001388549804688, "global_step": 256170, "epoch": 3086} {"train_loss": -24.940549850463867, "global_step": 256171, "epoch": 3086} {"train_loss": -24.966215133666992, "global_step": 256172, "epoch": 3086} {"train_loss": -25.055248260498047, "global_step": 256173, "epoch": 3086} {"train_loss": -24.889690399169922, "global_step": 256174, "epoch": 3086} {"train_loss": -25.1633243560791, "global_step": 256175, "epoch": 3086} {"train_loss": -25.108722686767578, "global_step": 256176, "epoch": 3086} {"train_loss": -24.994979858398438, "global_step": 256177, "epoch": 3086} {"train_loss": -25.331279754638672, "global_step": 256178, "epoch": 3086} {"train_loss": -25.241880416870117, "global_step": 256179, "epoch": 3086} {"train_loss": -25.102140426635742, "global_step": 256180, "epoch": 3086} {"train_loss": -25.35870933532715, "global_step": 256181, "epoch": 3086} {"train_loss": -25.455875396728516, "global_step": 256182, "epoch": 3086} {"train_loss": -25.191579818725586, "global_step": 256183, "epoch": 3086} {"train_loss": -24.959089279174805, "global_step": 256184, "epoch": 3086} {"train_loss": -25.19917869567871, "global_step": 256185, "epoch": 3086} {"train_loss": -25.296415328979492, "global_step": 256186, "epoch": 3086} {"train_loss": -24.986095428466797, "global_step": 256187, "epoch": 3086} {"train_loss": -25.38051986694336, "global_step": 256188, "epoch": 3086} {"train_loss": -25.13400650024414, "global_step": 256189, "epoch": 3086} {"train_loss": -25.150074005126953, "global_step": 256190, "epoch": 3086} {"train_loss": -25.253202438354492, "global_step": 256191, "epoch": 3086} {"train_loss": -25.244516372680664, "global_step": 256192, "epoch": 3086} {"train_loss": -25.154172897338867, "global_step": 256193, "epoch": 3086} {"train_loss": -25.28468132019043, "global_step": 256194, "epoch": 3086} {"train_loss": -25.288475036621094, "global_step": 256195, "epoch": 3086} {"train_loss": -25.042083740234375, "global_step": 256196, "epoch": 3086} {"train_loss": -25.13607406616211, "global_step": 256197, "epoch": 3086} {"train_loss": -25.145523071289062, "global_step": 256198, "epoch": 3086} {"train_loss": -25.04825210571289, "global_step": 256199, "epoch": 3086} {"train_loss": -25.33522605895996, "global_step": 256200, "epoch": 3086} {"train_loss": -25.33380699157715, "global_step": 256201, "epoch": 3086} {"train_loss": -25.193767547607422, "global_step": 256202, "epoch": 3086} {"train_loss": -25.350133895874023, "global_step": 256203, "epoch": 3086} {"train_loss": -25.082826614379883, "global_step": 256204, "epoch": 3086} {"train_loss": -25.178234100341797, "global_step": 256205, "epoch": 3086} {"train_loss": -25.524389266967773, "global_step": 256206, "epoch": 3086} {"train_loss": -25.1242618560791, "global_step": 256207, "epoch": 3086} {"train_loss": -25.318004608154297, "global_step": 256208, "epoch": 3086} {"train_loss": -24.865541458129883, "global_step": 256209, "epoch": 3086} {"train_loss": -25.4315242767334, "global_step": 256210, "epoch": 3086} {"train_loss": -25.21784019470215, "global_step": 256211, "epoch": 3086} {"train_loss": -24.978940963745117, "global_step": 256212, "epoch": 3086} {"train_loss": -25.034284591674805, "global_step": 256213, "epoch": 3086} {"train_loss": -25.19131851196289, "global_step": 256214, "epoch": 3086} {"train_loss": -25.15691566467285, "global_step": 256215, "epoch": 3086} {"train_loss": -25.239471435546875, "global_step": 256216, "epoch": 3086} {"train_loss": -25.540721893310547, "global_step": 256217, "epoch": 3086} {"train_loss": -25.176111221313477, "global_step": 256218, "epoch": 3086} {"train_loss": -25.438154220581055, "global_step": 256219, "epoch": 3086} {"train_loss": -24.840572426118047, "global_step": 256220, "epoch": 3086, "val_loss": 6822148.0} {"train_loss": -24.042726516723633, "global_step": 256221, "epoch": 3087} {"train_loss": -24.237125396728516, "global_step": 256222, "epoch": 3087} {"train_loss": -24.0018310546875, "global_step": 256223, "epoch": 3087} {"train_loss": -24.84621238708496, "global_step": 256224, "epoch": 3087} {"train_loss": -24.27729606628418, "global_step": 256225, "epoch": 3087} {"train_loss": -23.858301162719727, "global_step": 256226, "epoch": 3087} {"train_loss": -24.491552352905273, "global_step": 256227, "epoch": 3087} {"train_loss": -24.718647003173828, "global_step": 256228, "epoch": 3087} {"train_loss": -24.43613052368164, "global_step": 256229, "epoch": 3087} {"train_loss": -24.619403839111328, "global_step": 256230, "epoch": 3087} {"train_loss": -24.648115158081055, "global_step": 256231, "epoch": 3087} {"train_loss": -24.693788528442383, "global_step": 256232, "epoch": 3087} {"train_loss": -24.884265899658203, "global_step": 256233, "epoch": 3087} {"train_loss": -24.90813446044922, "global_step": 256234, "epoch": 3087} {"train_loss": -24.618738174438477, "global_step": 256235, "epoch": 3087} {"train_loss": -24.686279296875, "global_step": 256236, "epoch": 3087} {"train_loss": -24.689970016479492, "global_step": 256237, "epoch": 3087} {"train_loss": -24.8901424407959, "global_step": 256238, "epoch": 3087} {"train_loss": -24.791929244995117, "global_step": 256239, "epoch": 3087} {"train_loss": -25.02435874938965, "global_step": 256240, "epoch": 3087} {"train_loss": -25.30649185180664, "global_step": 256241, "epoch": 3087} {"train_loss": -24.832326889038086, "global_step": 256242, "epoch": 3087} {"train_loss": -25.05929946899414, "global_step": 256243, "epoch": 3087} {"train_loss": -24.87397575378418, "global_step": 256244, "epoch": 3087} {"train_loss": -25.0589656829834, "global_step": 256245, "epoch": 3087} {"train_loss": -25.40437126159668, "global_step": 256246, "epoch": 3087} {"train_loss": -25.061603546142578, "global_step": 256247, "epoch": 3087} {"train_loss": -24.8015193939209, "global_step": 256248, "epoch": 3087} {"train_loss": -24.97562026977539, "global_step": 256249, "epoch": 3087} {"train_loss": -24.802459716796875, "global_step": 256250, "epoch": 3087} {"train_loss": -25.2393856048584, "global_step": 256251, "epoch": 3087} {"train_loss": -25.319061279296875, "global_step": 256252, "epoch": 3087} {"train_loss": -25.084325790405273, "global_step": 256253, "epoch": 3087} {"train_loss": -25.15321922302246, "global_step": 256254, "epoch": 3087} {"train_loss": -25.37482261657715, "global_step": 256255, "epoch": 3087} {"train_loss": -25.195388793945312, "global_step": 256256, "epoch": 3087} {"train_loss": -25.282041549682617, "global_step": 256257, "epoch": 3087} {"train_loss": -25.307355880737305, "global_step": 256258, "epoch": 3087} {"train_loss": -25.226911544799805, "global_step": 256259, "epoch": 3087} {"train_loss": -25.020286560058594, "global_step": 256260, "epoch": 3087} {"train_loss": -25.36756706237793, "global_step": 256261, "epoch": 3087} {"train_loss": -25.394775390625, "global_step": 256262, "epoch": 3087} {"train_loss": -25.183425903320312, "global_step": 256263, "epoch": 3087} {"train_loss": -25.194698333740234, "global_step": 256264, "epoch": 3087} {"train_loss": -25.309839248657227, "global_step": 256265, "epoch": 3087} {"train_loss": -24.74338150024414, "global_step": 256266, "epoch": 3087} {"train_loss": -25.157886505126953, "global_step": 256267, "epoch": 3087} {"train_loss": -25.136091232299805, "global_step": 256268, "epoch": 3087} {"train_loss": -25.059770584106445, "global_step": 256269, "epoch": 3087} {"train_loss": -25.37502670288086, "global_step": 256270, "epoch": 3087} {"train_loss": -25.697168350219727, "global_step": 256271, "epoch": 3087} {"train_loss": -25.223800659179688, "global_step": 256272, "epoch": 3087} {"train_loss": -25.30940055847168, "global_step": 256273, "epoch": 3087} {"train_loss": -24.746191024780273, "global_step": 256274, "epoch": 3087} {"train_loss": -25.010169982910156, "global_step": 256275, "epoch": 3087} {"train_loss": -25.310699462890625, "global_step": 256276, "epoch": 3087} {"train_loss": -24.662689208984375, "global_step": 256277, "epoch": 3087} {"train_loss": -24.880346298217773, "global_step": 256278, "epoch": 3087} {"train_loss": -25.199066162109375, "global_step": 256279, "epoch": 3087} {"train_loss": -25.124631881713867, "global_step": 256280, "epoch": 3087} {"train_loss": -25.030784606933594, "global_step": 256281, "epoch": 3087} {"train_loss": -25.226396560668945, "global_step": 256282, "epoch": 3087} {"train_loss": -24.91250991821289, "global_step": 256283, "epoch": 3087} {"train_loss": -24.820913314819336, "global_step": 256284, "epoch": 3087} {"train_loss": -24.903812408447266, "global_step": 256285, "epoch": 3087} {"train_loss": -25.0872859954834, "global_step": 256286, "epoch": 3087} {"train_loss": -24.92831802368164, "global_step": 256287, "epoch": 3087} {"train_loss": -25.42714500427246, "global_step": 256288, "epoch": 3087} {"train_loss": -24.864126205444336, "global_step": 256289, "epoch": 3087} {"train_loss": -24.843313217163086, "global_step": 256290, "epoch": 3087} {"train_loss": -25.457782745361328, "global_step": 256291, "epoch": 3087} {"train_loss": -25.244647979736328, "global_step": 256292, "epoch": 3087} {"train_loss": -24.92591667175293, "global_step": 256293, "epoch": 3087} {"train_loss": -25.029844284057617, "global_step": 256294, "epoch": 3087} {"train_loss": -24.99358558654785, "global_step": 256295, "epoch": 3087} {"train_loss": -25.21181297302246, "global_step": 256296, "epoch": 3087} {"train_loss": -24.836742401123047, "global_step": 256297, "epoch": 3087} {"train_loss": -24.89052391052246, "global_step": 256298, "epoch": 3087} {"train_loss": -24.875024795532227, "global_step": 256299, "epoch": 3087} {"train_loss": -25.197690963745117, "global_step": 256300, "epoch": 3087} {"train_loss": -25.261716842651367, "global_step": 256301, "epoch": 3087} {"train_loss": -25.219404220581055, "global_step": 256302, "epoch": 3087} {"train_loss": -24.994421189089856, "global_step": 256303, "epoch": 3087, "val_loss": 6910381.0} {"train_loss": -24.421201705932617, "global_step": 256304, "epoch": 3088} {"train_loss": -24.705974578857422, "global_step": 256305, "epoch": 3088} {"train_loss": -24.737567901611328, "global_step": 256306, "epoch": 3088} {"train_loss": -24.39107322692871, "global_step": 256307, "epoch": 3088} {"train_loss": -24.904205322265625, "global_step": 256308, "epoch": 3088} {"train_loss": -24.68174171447754, "global_step": 256309, "epoch": 3088} {"train_loss": -24.551513671875, "global_step": 256310, "epoch": 3088} {"train_loss": -24.80280113220215, "global_step": 256311, "epoch": 3088} {"train_loss": -24.918106079101562, "global_step": 256312, "epoch": 3088} {"train_loss": -24.586624145507812, "global_step": 256313, "epoch": 3088} {"train_loss": -24.918119430541992, "global_step": 256314, "epoch": 3088} {"train_loss": -25.06583595275879, "global_step": 256315, "epoch": 3088} {"train_loss": -25.056171417236328, "global_step": 256316, "epoch": 3088} {"train_loss": -24.9833927154541, "global_step": 256317, "epoch": 3088} {"train_loss": -24.96486473083496, "global_step": 256318, "epoch": 3088} {"train_loss": -25.147626876831055, "global_step": 256319, "epoch": 3088} {"train_loss": -24.52772331237793, "global_step": 256320, "epoch": 3088} {"train_loss": -24.655284881591797, "global_step": 256321, "epoch": 3088} {"train_loss": -24.529701232910156, "global_step": 256322, "epoch": 3088} {"train_loss": -24.971179962158203, "global_step": 256323, "epoch": 3088} {"train_loss": -24.813663482666016, "global_step": 256324, "epoch": 3088} {"train_loss": -25.096715927124023, "global_step": 256325, "epoch": 3088} {"train_loss": -24.929248809814453, "global_step": 256326, "epoch": 3088} {"train_loss": -25.04884910583496, "global_step": 256327, "epoch": 3088} {"train_loss": -25.292388916015625, "global_step": 256328, "epoch": 3088} {"train_loss": -25.264755249023438, "global_step": 256329, "epoch": 3088} {"train_loss": -25.12672233581543, "global_step": 256330, "epoch": 3088} {"train_loss": -24.871938705444336, "global_step": 256331, "epoch": 3088} {"train_loss": -25.23548698425293, "global_step": 256332, "epoch": 3088} {"train_loss": -25.244857788085938, "global_step": 256333, "epoch": 3088} {"train_loss": -24.91360855102539, "global_step": 256334, "epoch": 3088} {"train_loss": -25.07378578186035, "global_step": 256335, "epoch": 3088} {"train_loss": -25.017560958862305, "global_step": 256336, "epoch": 3088} {"train_loss": -25.09488296508789, "global_step": 256337, "epoch": 3088} {"train_loss": -25.261281967163086, "global_step": 256338, "epoch": 3088} {"train_loss": -25.2723331451416, "global_step": 256339, "epoch": 3088} {"train_loss": -25.518569946289062, "global_step": 256340, "epoch": 3088} {"train_loss": -24.996274948120117, "global_step": 256341, "epoch": 3088} {"train_loss": -25.34186363220215, "global_step": 256342, "epoch": 3088} {"train_loss": -25.1983699798584, "global_step": 256343, "epoch": 3088} {"train_loss": -25.224971771240234, "global_step": 256344, "epoch": 3088} {"train_loss": -25.232126235961914, "global_step": 256345, "epoch": 3088} {"train_loss": -25.087453842163086, "global_step": 256346, "epoch": 3088} {"train_loss": -25.240127563476562, "global_step": 256347, "epoch": 3088} {"train_loss": -24.776145935058594, "global_step": 256348, "epoch": 3088} {"train_loss": -25.011322021484375, "global_step": 256349, "epoch": 3088} {"train_loss": -25.520727157592773, "global_step": 256350, "epoch": 3088} {"train_loss": -25.05942153930664, "global_step": 256351, "epoch": 3088} {"train_loss": -24.871957778930664, "global_step": 256352, "epoch": 3088} {"train_loss": -24.979154586791992, "global_step": 256353, "epoch": 3088} {"train_loss": -25.480499267578125, "global_step": 256354, "epoch": 3088} {"train_loss": -25.069091796875, "global_step": 256355, "epoch": 3088} {"train_loss": -25.243518829345703, "global_step": 256356, "epoch": 3088} {"train_loss": -24.973072052001953, "global_step": 256357, "epoch": 3088} {"train_loss": -25.279436111450195, "global_step": 256358, "epoch": 3088} {"train_loss": -24.859132766723633, "global_step": 256359, "epoch": 3088} {"train_loss": -25.034948348999023, "global_step": 256360, "epoch": 3088} {"train_loss": -25.05214500427246, "global_step": 256361, "epoch": 3088} {"train_loss": -25.081663131713867, "global_step": 256362, "epoch": 3088} {"train_loss": -25.410642623901367, "global_step": 256363, "epoch": 3088} {"train_loss": -24.94257926940918, "global_step": 256364, "epoch": 3088} {"train_loss": -25.563861846923828, "global_step": 256365, "epoch": 3088} {"train_loss": -25.682147979736328, "global_step": 256366, "epoch": 3088} {"train_loss": -25.216888427734375, "global_step": 256367, "epoch": 3088} {"train_loss": -25.3350887298584, "global_step": 256368, "epoch": 3088} {"train_loss": -25.103811264038086, "global_step": 256369, "epoch": 3088} {"train_loss": -25.056455612182617, "global_step": 256370, "epoch": 3088} {"train_loss": -25.369937896728516, "global_step": 256371, "epoch": 3088} {"train_loss": -25.324121475219727, "global_step": 256372, "epoch": 3088} {"train_loss": -24.82411766052246, "global_step": 256373, "epoch": 3088} {"train_loss": -25.033933639526367, "global_step": 256374, "epoch": 3088} {"train_loss": -25.44797134399414, "global_step": 256375, "epoch": 3088} {"train_loss": -25.233694076538086, "global_step": 256376, "epoch": 3088} {"train_loss": -25.3444766998291, "global_step": 256377, "epoch": 3088} {"train_loss": -24.765775680541992, "global_step": 256378, "epoch": 3088} {"train_loss": -24.963014602661133, "global_step": 256379, "epoch": 3088} {"train_loss": -24.70118522644043, "global_step": 256380, "epoch": 3088} {"train_loss": -25.20711898803711, "global_step": 256381, "epoch": 3088} {"train_loss": -25.17841339111328, "global_step": 256382, "epoch": 3088} {"train_loss": -25.03351402282715, "global_step": 256383, "epoch": 3088} {"train_loss": -25.038007736206055, "global_step": 256384, "epoch": 3088} {"train_loss": -25.288251876831055, "global_step": 256385, "epoch": 3088} {"train_loss": -25.065965330744366, "global_step": 256386, "epoch": 3088, "val_loss": 6894761.0} {"train_loss": -24.636638641357422, "global_step": 256387, "epoch": 3089} {"train_loss": -23.946075439453125, "global_step": 256388, "epoch": 3089} {"train_loss": -24.435672760009766, "global_step": 256389, "epoch": 3089} {"train_loss": -24.668691635131836, "global_step": 256390, "epoch": 3089} {"train_loss": -24.740461349487305, "global_step": 256391, "epoch": 3089} {"train_loss": -24.844831466674805, "global_step": 256392, "epoch": 3089} {"train_loss": -25.08243751525879, "global_step": 256393, "epoch": 3089} {"train_loss": -24.797765731811523, "global_step": 256394, "epoch": 3089} {"train_loss": -24.833662033081055, "global_step": 256395, "epoch": 3089} {"train_loss": -24.893512725830078, "global_step": 256396, "epoch": 3089} {"train_loss": -24.803787231445312, "global_step": 256397, "epoch": 3089} {"train_loss": -24.81093978881836, "global_step": 256398, "epoch": 3089} {"train_loss": -25.32062530517578, "global_step": 256399, "epoch": 3089} {"train_loss": -25.395679473876953, "global_step": 256400, "epoch": 3089} {"train_loss": -25.23696517944336, "global_step": 256401, "epoch": 3089} {"train_loss": -25.096715927124023, "global_step": 256402, "epoch": 3089} {"train_loss": -24.78006362915039, "global_step": 256403, "epoch": 3089} {"train_loss": -25.31319236755371, "global_step": 256404, "epoch": 3089} {"train_loss": -24.6627197265625, "global_step": 256405, "epoch": 3089} {"train_loss": -24.78704833984375, "global_step": 256406, "epoch": 3089} {"train_loss": -24.827783584594727, "global_step": 256407, "epoch": 3089} {"train_loss": -24.852766036987305, "global_step": 256408, "epoch": 3089} {"train_loss": -25.333646774291992, "global_step": 256409, "epoch": 3089} {"train_loss": -24.97443199157715, "global_step": 256410, "epoch": 3089} {"train_loss": -25.168460845947266, "global_step": 256411, "epoch": 3089} {"train_loss": -25.00237274169922, "global_step": 256412, "epoch": 3089} {"train_loss": -24.674442291259766, "global_step": 256413, "epoch": 3089} {"train_loss": -25.072782516479492, "global_step": 256414, "epoch": 3089} {"train_loss": -25.087482452392578, "global_step": 256415, "epoch": 3089} {"train_loss": -25.29891014099121, "global_step": 256416, "epoch": 3089} {"train_loss": -25.099294662475586, "global_step": 256417, "epoch": 3089} {"train_loss": -25.51962661743164, "global_step": 256418, "epoch": 3089} {"train_loss": -25.358779907226562, "global_step": 256419, "epoch": 3089} {"train_loss": -25.600753784179688, "global_step": 256420, "epoch": 3089} {"train_loss": -25.48334503173828, "global_step": 256421, "epoch": 3089} {"train_loss": -25.023157119750977, "global_step": 256422, "epoch": 3089} {"train_loss": -25.15703773498535, "global_step": 256423, "epoch": 3089} {"train_loss": -25.14316177368164, "global_step": 256424, "epoch": 3089} {"train_loss": -25.610334396362305, "global_step": 256425, "epoch": 3089} {"train_loss": -25.478132247924805, "global_step": 256426, "epoch": 3089} {"train_loss": -25.014707565307617, "global_step": 256427, "epoch": 3089} {"train_loss": -25.161163330078125, "global_step": 256428, "epoch": 3089} {"train_loss": -25.12627410888672, "global_step": 256429, "epoch": 3089} {"train_loss": -25.1202335357666, "global_step": 256430, "epoch": 3089} {"train_loss": -25.2082462310791, "global_step": 256431, "epoch": 3089} {"train_loss": -25.216175079345703, "global_step": 256432, "epoch": 3089} {"train_loss": -25.352935791015625, "global_step": 256433, "epoch": 3089} {"train_loss": -25.11867332458496, "global_step": 256434, "epoch": 3089} {"train_loss": -25.315587997436523, "global_step": 256435, "epoch": 3089} {"train_loss": -25.267786026000977, "global_step": 256436, "epoch": 3089} {"train_loss": -25.482379913330078, "global_step": 256437, "epoch": 3089} {"train_loss": -25.13541030883789, "global_step": 256438, "epoch": 3089} {"train_loss": -25.345388412475586, "global_step": 256439, "epoch": 3089} {"train_loss": -24.89748191833496, "global_step": 256440, "epoch": 3089} {"train_loss": -25.394699096679688, "global_step": 256441, "epoch": 3089} {"train_loss": -25.165590286254883, "global_step": 256442, "epoch": 3089} {"train_loss": -25.241153717041016, "global_step": 256443, "epoch": 3089} {"train_loss": -24.98452377319336, "global_step": 256444, "epoch": 3089} {"train_loss": -25.176115036010742, "global_step": 256445, "epoch": 3089} {"train_loss": -25.316884994506836, "global_step": 256446, "epoch": 3089} {"train_loss": -25.22393226623535, "global_step": 256447, "epoch": 3089} {"train_loss": -25.20169448852539, "global_step": 256448, "epoch": 3089} {"train_loss": -25.46736717224121, "global_step": 256449, "epoch": 3089} {"train_loss": -25.257246017456055, "global_step": 256450, "epoch": 3089} {"train_loss": -25.18857765197754, "global_step": 256451, "epoch": 3089} {"train_loss": -25.162799835205078, "global_step": 256452, "epoch": 3089} {"train_loss": -25.14491844177246, "global_step": 256453, "epoch": 3089} {"train_loss": -24.916799545288086, "global_step": 256454, "epoch": 3089} {"train_loss": -25.30829429626465, "global_step": 256455, "epoch": 3089} {"train_loss": -25.247671127319336, "global_step": 256456, "epoch": 3089} {"train_loss": -24.8961238861084, "global_step": 256457, "epoch": 3089} {"train_loss": -24.607492446899414, "global_step": 256458, "epoch": 3089} {"train_loss": -25.069684982299805, "global_step": 256459, "epoch": 3089} {"train_loss": -25.3632755279541, "global_step": 256460, "epoch": 3089} {"train_loss": -25.141090393066406, "global_step": 256461, "epoch": 3089} {"train_loss": -24.754932403564453, "global_step": 256462, "epoch": 3089} {"train_loss": -24.601205825805664, "global_step": 256463, "epoch": 3089} {"train_loss": -25.007932662963867, "global_step": 256464, "epoch": 3089} {"train_loss": -25.07501792907715, "global_step": 256465, "epoch": 3089} {"train_loss": -24.834369659423828, "global_step": 256466, "epoch": 3089} {"train_loss": -24.844226837158203, "global_step": 256467, "epoch": 3089} {"train_loss": -25.121997833251953, "global_step": 256468, "epoch": 3089} {"train_loss": -25.087268622524768, "global_step": 256469, "epoch": 3089, "val_loss": 6942664.5} {"train_loss": -24.72829246520996, "global_step": 256470, "epoch": 3090} {"train_loss": -24.649860382080078, "global_step": 256471, "epoch": 3090} {"train_loss": -24.59682273864746, "global_step": 256472, "epoch": 3090} {"train_loss": -24.662456512451172, "global_step": 256473, "epoch": 3090} {"train_loss": -24.533716201782227, "global_step": 256474, "epoch": 3090} {"train_loss": -24.590559005737305, "global_step": 256475, "epoch": 3090} {"train_loss": -24.45795249938965, "global_step": 256476, "epoch": 3090} {"train_loss": -24.47466468811035, "global_step": 256477, "epoch": 3090} {"train_loss": -24.667713165283203, "global_step": 256478, "epoch": 3090} {"train_loss": -24.51901626586914, "global_step": 256479, "epoch": 3090} {"train_loss": -24.212003707885742, "global_step": 256480, "epoch": 3090} {"train_loss": -24.475507736206055, "global_step": 256481, "epoch": 3090} {"train_loss": -24.56460189819336, "global_step": 256482, "epoch": 3090} {"train_loss": -25.050140380859375, "global_step": 256483, "epoch": 3090} {"train_loss": -24.474863052368164, "global_step": 256484, "epoch": 3090} {"train_loss": -24.942096710205078, "global_step": 256485, "epoch": 3090} {"train_loss": -24.579877853393555, "global_step": 256486, "epoch": 3090} {"train_loss": -24.864383697509766, "global_step": 256487, "epoch": 3090} {"train_loss": -24.651945114135742, "global_step": 256488, "epoch": 3090} {"train_loss": -25.176416397094727, "global_step": 256489, "epoch": 3090} {"train_loss": -25.171985626220703, "global_step": 256490, "epoch": 3090} {"train_loss": -24.883703231811523, "global_step": 256491, "epoch": 3090} {"train_loss": -24.877710342407227, "global_step": 256492, "epoch": 3090} {"train_loss": -24.831417083740234, "global_step": 256493, "epoch": 3090} {"train_loss": -24.850122451782227, "global_step": 256494, "epoch": 3090} {"train_loss": -24.765600204467773, "global_step": 256495, "epoch": 3090} {"train_loss": -24.829702377319336, "global_step": 256496, "epoch": 3090} {"train_loss": -24.88295555114746, "global_step": 256497, "epoch": 3090} {"train_loss": -24.826536178588867, "global_step": 256498, "epoch": 3090} {"train_loss": -25.5247859954834, "global_step": 256499, "epoch": 3090} {"train_loss": -24.89740562438965, "global_step": 256500, "epoch": 3090} {"train_loss": -25.421892166137695, "global_step": 256501, "epoch": 3090} {"train_loss": -25.005155563354492, "global_step": 256502, "epoch": 3090} {"train_loss": -25.072107315063477, "global_step": 256503, "epoch": 3090} {"train_loss": -25.235153198242188, "global_step": 256504, "epoch": 3090} {"train_loss": -25.304513931274414, "global_step": 256505, "epoch": 3090} {"train_loss": -24.924331665039062, "global_step": 256506, "epoch": 3090} {"train_loss": -25.700027465820312, "global_step": 256507, "epoch": 3090} {"train_loss": -25.182903289794922, "global_step": 256508, "epoch": 3090} {"train_loss": -25.272382736206055, "global_step": 256509, "epoch": 3090} {"train_loss": -25.0623836517334, "global_step": 256510, "epoch": 3090} {"train_loss": -25.75111198425293, "global_step": 256511, "epoch": 3090} {"train_loss": -25.347213745117188, "global_step": 256512, "epoch": 3090} {"train_loss": -25.25058364868164, "global_step": 256513, "epoch": 3090} {"train_loss": -24.988876342773438, "global_step": 256514, "epoch": 3090} {"train_loss": -25.38833999633789, "global_step": 256515, "epoch": 3090} {"train_loss": -24.9729061126709, "global_step": 256516, "epoch": 3090} {"train_loss": -25.035032272338867, "global_step": 256517, "epoch": 3090} {"train_loss": -25.175939559936523, "global_step": 256518, "epoch": 3090} {"train_loss": -25.330081939697266, "global_step": 256519, "epoch": 3090} {"train_loss": -25.43762969970703, "global_step": 256520, "epoch": 3090} {"train_loss": -25.12926483154297, "global_step": 256521, "epoch": 3090} {"train_loss": -25.108083724975586, "global_step": 256522, "epoch": 3090} {"train_loss": -24.959840774536133, "global_step": 256523, "epoch": 3090} {"train_loss": -24.929397583007812, "global_step": 256524, "epoch": 3090} {"train_loss": -25.31252098083496, "global_step": 256525, "epoch": 3090} {"train_loss": -25.360044479370117, "global_step": 256526, "epoch": 3090} {"train_loss": -24.78169059753418, "global_step": 256527, "epoch": 3090} {"train_loss": -25.02378273010254, "global_step": 256528, "epoch": 3090} {"train_loss": -25.402067184448242, "global_step": 256529, "epoch": 3090} {"train_loss": -25.220691680908203, "global_step": 256530, "epoch": 3090} {"train_loss": -24.912443161010742, "global_step": 256531, "epoch": 3090} {"train_loss": -25.385812759399414, "global_step": 256532, "epoch": 3090} {"train_loss": -25.19223976135254, "global_step": 256533, "epoch": 3090} {"train_loss": -24.836652755737305, "global_step": 256534, "epoch": 3090} {"train_loss": -25.17925453186035, "global_step": 256535, "epoch": 3090} {"train_loss": -24.73617935180664, "global_step": 256536, "epoch": 3090} {"train_loss": -25.261878967285156, "global_step": 256537, "epoch": 3090} {"train_loss": -24.59919548034668, "global_step": 256538, "epoch": 3090} {"train_loss": -24.790756225585938, "global_step": 256539, "epoch": 3090} {"train_loss": -25.06519317626953, "global_step": 256540, "epoch": 3090} {"train_loss": -25.102170944213867, "global_step": 256541, "epoch": 3090} {"train_loss": -25.403600692749023, "global_step": 256542, "epoch": 3090} {"train_loss": -25.092893600463867, "global_step": 256543, "epoch": 3090} {"train_loss": -24.769289016723633, "global_step": 256544, "epoch": 3090} {"train_loss": -24.812841415405273, "global_step": 256545, "epoch": 3090} {"train_loss": -25.01012420654297, "global_step": 256546, "epoch": 3090} {"train_loss": -25.0455379486084, "global_step": 256547, "epoch": 3090} {"train_loss": -25.220178604125977, "global_step": 256548, "epoch": 3090} {"train_loss": -24.798519134521484, "global_step": 256549, "epoch": 3090} {"train_loss": -25.158063888549805, "global_step": 256550, "epoch": 3090} {"train_loss": -24.813232421875, "global_step": 256551, "epoch": 3090} {"train_loss": -24.963876632322748, "global_step": 256552, "epoch": 3090, "val_loss": 6870687.5} {"train_loss": -24.609033584594727, "global_step": 256553, "epoch": 3091} {"train_loss": -24.506244659423828, "global_step": 256554, "epoch": 3091} {"train_loss": -25.01283073425293, "global_step": 256555, "epoch": 3091} {"train_loss": -24.88393211364746, "global_step": 256556, "epoch": 3091} {"train_loss": -24.67677116394043, "global_step": 256557, "epoch": 3091} {"train_loss": -24.917377471923828, "global_step": 256558, "epoch": 3091} {"train_loss": -24.915546417236328, "global_step": 256559, "epoch": 3091} {"train_loss": -24.401655197143555, "global_step": 256560, "epoch": 3091} {"train_loss": -24.782833099365234, "global_step": 256561, "epoch": 3091} {"train_loss": -25.26834487915039, "global_step": 256562, "epoch": 3091} {"train_loss": -24.656570434570312, "global_step": 256563, "epoch": 3091} {"train_loss": -24.893095016479492, "global_step": 256564, "epoch": 3091} {"train_loss": -25.102066040039062, "global_step": 256565, "epoch": 3091} {"train_loss": -25.135604858398438, "global_step": 256566, "epoch": 3091} {"train_loss": -25.050521850585938, "global_step": 256567, "epoch": 3091} {"train_loss": -24.66942024230957, "global_step": 256568, "epoch": 3091} {"train_loss": -25.194204330444336, "global_step": 256569, "epoch": 3091} {"train_loss": -25.231595993041992, "global_step": 256570, "epoch": 3091} {"train_loss": -24.767602920532227, "global_step": 256571, "epoch": 3091} {"train_loss": -24.86211395263672, "global_step": 256572, "epoch": 3091} {"train_loss": -25.23813819885254, "global_step": 256573, "epoch": 3091} {"train_loss": -25.080703735351562, "global_step": 256574, "epoch": 3091} {"train_loss": -25.12165069580078, "global_step": 256575, "epoch": 3091} {"train_loss": -24.78807830810547, "global_step": 256576, "epoch": 3091} {"train_loss": -25.141759872436523, "global_step": 256577, "epoch": 3091} {"train_loss": -24.91873550415039, "global_step": 256578, "epoch": 3091} {"train_loss": -24.981613159179688, "global_step": 256579, "epoch": 3091} {"train_loss": -25.343856811523438, "global_step": 256580, "epoch": 3091} {"train_loss": -25.159265518188477, "global_step": 256581, "epoch": 3091} {"train_loss": -25.020795822143555, "global_step": 256582, "epoch": 3091} {"train_loss": -25.250455856323242, "global_step": 256583, "epoch": 3091} {"train_loss": -25.141834259033203, "global_step": 256584, "epoch": 3091} {"train_loss": -25.129133224487305, "global_step": 256585, "epoch": 3091} {"train_loss": -25.021373748779297, "global_step": 256586, "epoch": 3091} {"train_loss": -24.934904098510742, "global_step": 256587, "epoch": 3091} {"train_loss": -24.750362396240234, "global_step": 256588, "epoch": 3091} {"train_loss": -25.063329696655273, "global_step": 256589, "epoch": 3091} {"train_loss": -25.502363204956055, "global_step": 256590, "epoch": 3091} {"train_loss": -25.204030990600586, "global_step": 256591, "epoch": 3091} {"train_loss": -25.495725631713867, "global_step": 256592, "epoch": 3091} {"train_loss": -25.135587692260742, "global_step": 256593, "epoch": 3091} {"train_loss": -25.103206634521484, "global_step": 256594, "epoch": 3091} {"train_loss": -25.25644874572754, "global_step": 256595, "epoch": 3091} {"train_loss": -25.2705135345459, "global_step": 256596, "epoch": 3091} {"train_loss": -25.096525192260742, "global_step": 256597, "epoch": 3091} {"train_loss": -25.366811752319336, "global_step": 256598, "epoch": 3091} {"train_loss": -24.705398559570312, "global_step": 256599, "epoch": 3091} {"train_loss": -24.92327880859375, "global_step": 256600, "epoch": 3091} {"train_loss": -24.79535484313965, "global_step": 256601, "epoch": 3091} {"train_loss": -24.4097900390625, "global_step": 256602, "epoch": 3091} {"train_loss": -24.353731155395508, "global_step": 256603, "epoch": 3091} {"train_loss": -25.019901275634766, "global_step": 256604, "epoch": 3091} {"train_loss": -24.684707641601562, "global_step": 256605, "epoch": 3091} {"train_loss": -24.299150466918945, "global_step": 256606, "epoch": 3091} {"train_loss": -24.864612579345703, "global_step": 256607, "epoch": 3091} {"train_loss": -24.68125343322754, "global_step": 256608, "epoch": 3091} {"train_loss": -24.802593231201172, "global_step": 256609, "epoch": 3091} {"train_loss": -24.519067764282227, "global_step": 256610, "epoch": 3091} {"train_loss": -24.66679573059082, "global_step": 256611, "epoch": 3091} {"train_loss": -24.699350357055664, "global_step": 256612, "epoch": 3091} {"train_loss": -24.665040969848633, "global_step": 256613, "epoch": 3091} {"train_loss": -24.883691787719727, "global_step": 256614, "epoch": 3091} {"train_loss": -25.06340789794922, "global_step": 256615, "epoch": 3091} {"train_loss": -24.438352584838867, "global_step": 256616, "epoch": 3091} {"train_loss": -24.934680938720703, "global_step": 256617, "epoch": 3091} {"train_loss": -24.786596298217773, "global_step": 256618, "epoch": 3091} {"train_loss": -24.799606323242188, "global_step": 256619, "epoch": 3091} {"train_loss": -25.134662628173828, "global_step": 256620, "epoch": 3091} {"train_loss": -24.72282600402832, "global_step": 256621, "epoch": 3091} {"train_loss": -24.81840705871582, "global_step": 256622, "epoch": 3091} {"train_loss": -24.991687774658203, "global_step": 256623, "epoch": 3091} {"train_loss": -24.86197853088379, "global_step": 256624, "epoch": 3091} {"train_loss": -25.189786911010742, "global_step": 256625, "epoch": 3091} {"train_loss": -25.21169090270996, "global_step": 256626, "epoch": 3091} {"train_loss": -25.24430274963379, "global_step": 256627, "epoch": 3091} {"train_loss": -24.93138313293457, "global_step": 256628, "epoch": 3091} {"train_loss": -25.193771362304688, "global_step": 256629, "epoch": 3091} {"train_loss": -24.68939208984375, "global_step": 256630, "epoch": 3091} {"train_loss": -25.19443130493164, "global_step": 256631, "epoch": 3091} {"train_loss": -25.027847290039062, "global_step": 256632, "epoch": 3091} {"train_loss": -24.98250389099121, "global_step": 256633, "epoch": 3091} {"train_loss": -25.141386032104492, "global_step": 256634, "epoch": 3091} {"train_loss": -24.949377473578394, "global_step": 256635, "epoch": 3091, "val_loss": 6944232.5} {"train_loss": -24.224857330322266, "global_step": 256636, "epoch": 3092} {"train_loss": -24.533926010131836, "global_step": 256637, "epoch": 3092} {"train_loss": -24.481489181518555, "global_step": 256638, "epoch": 3092} {"train_loss": -24.8988094329834, "global_step": 256639, "epoch": 3092} {"train_loss": -24.672048568725586, "global_step": 256640, "epoch": 3092} {"train_loss": -24.703449249267578, "global_step": 256641, "epoch": 3092} {"train_loss": -24.69493865966797, "global_step": 256642, "epoch": 3092} {"train_loss": -24.84010887145996, "global_step": 256643, "epoch": 3092} {"train_loss": -25.252553939819336, "global_step": 256644, "epoch": 3092} {"train_loss": -24.7707576751709, "global_step": 256645, "epoch": 3092} {"train_loss": -24.902196884155273, "global_step": 256646, "epoch": 3092} {"train_loss": -24.714780807495117, "global_step": 256647, "epoch": 3092} {"train_loss": -25.178104400634766, "global_step": 256648, "epoch": 3092} {"train_loss": -24.720144271850586, "global_step": 256649, "epoch": 3092} {"train_loss": -24.981142044067383, "global_step": 256650, "epoch": 3092} {"train_loss": -24.86116600036621, "global_step": 256651, "epoch": 3092} {"train_loss": -25.0893611907959, "global_step": 256652, "epoch": 3092} {"train_loss": -24.663421630859375, "global_step": 256653, "epoch": 3092} {"train_loss": -24.64253807067871, "global_step": 256654, "epoch": 3092} {"train_loss": -25.368261337280273, "global_step": 256655, "epoch": 3092} {"train_loss": -25.143415451049805, "global_step": 256656, "epoch": 3092} {"train_loss": -25.373010635375977, "global_step": 256657, "epoch": 3092} {"train_loss": -24.669795989990234, "global_step": 256658, "epoch": 3092} {"train_loss": -24.923131942749023, "global_step": 256659, "epoch": 3092} {"train_loss": -24.926334381103516, "global_step": 256660, "epoch": 3092} {"train_loss": -24.822433471679688, "global_step": 256661, "epoch": 3092} {"train_loss": -25.1301326751709, "global_step": 256662, "epoch": 3092} {"train_loss": -25.002199172973633, "global_step": 256663, "epoch": 3092} {"train_loss": -25.087501525878906, "global_step": 256664, "epoch": 3092} {"train_loss": -25.253202438354492, "global_step": 256665, "epoch": 3092} {"train_loss": -25.055078506469727, "global_step": 256666, "epoch": 3092} {"train_loss": -25.150789260864258, "global_step": 256667, "epoch": 3092} {"train_loss": -25.287622451782227, "global_step": 256668, "epoch": 3092} {"train_loss": -25.174518585205078, "global_step": 256669, "epoch": 3092} {"train_loss": -24.769699096679688, "global_step": 256670, "epoch": 3092} {"train_loss": -25.031888961791992, "global_step": 256671, "epoch": 3092} {"train_loss": -25.0659122467041, "global_step": 256672, "epoch": 3092} {"train_loss": -25.716602325439453, "global_step": 256673, "epoch": 3092} {"train_loss": -25.30689811706543, "global_step": 256674, "epoch": 3092} {"train_loss": -25.113969802856445, "global_step": 256675, "epoch": 3092} {"train_loss": -24.97401237487793, "global_step": 256676, "epoch": 3092} {"train_loss": -25.081010818481445, "global_step": 256677, "epoch": 3092} {"train_loss": -25.229183197021484, "global_step": 256678, "epoch": 3092} {"train_loss": -24.987804412841797, "global_step": 256679, "epoch": 3092} {"train_loss": -24.93276023864746, "global_step": 256680, "epoch": 3092} {"train_loss": -25.027557373046875, "global_step": 256681, "epoch": 3092} {"train_loss": -25.036209106445312, "global_step": 256682, "epoch": 3092} {"train_loss": -25.11652946472168, "global_step": 256683, "epoch": 3092} {"train_loss": -25.028213500976562, "global_step": 256684, "epoch": 3092} {"train_loss": -24.72035789489746, "global_step": 256685, "epoch": 3092} {"train_loss": -24.802749633789062, "global_step": 256686, "epoch": 3092} {"train_loss": -24.886377334594727, "global_step": 256687, "epoch": 3092} {"train_loss": -24.953413009643555, "global_step": 256688, "epoch": 3092} {"train_loss": -25.441375732421875, "global_step": 256689, "epoch": 3092} {"train_loss": -25.02716636657715, "global_step": 256690, "epoch": 3092} {"train_loss": -25.130502700805664, "global_step": 256691, "epoch": 3092} {"train_loss": -25.269277572631836, "global_step": 256692, "epoch": 3092} {"train_loss": -25.05913734436035, "global_step": 256693, "epoch": 3092} {"train_loss": -25.319183349609375, "global_step": 256694, "epoch": 3092} {"train_loss": -25.19001579284668, "global_step": 256695, "epoch": 3092} {"train_loss": -25.5137996673584, "global_step": 256696, "epoch": 3092} {"train_loss": -25.163970947265625, "global_step": 256697, "epoch": 3092} {"train_loss": -24.93498992919922, "global_step": 256698, "epoch": 3092} {"train_loss": -25.126157760620117, "global_step": 256699, "epoch": 3092} {"train_loss": -25.281330108642578, "global_step": 256700, "epoch": 3092} {"train_loss": -25.39324951171875, "global_step": 256701, "epoch": 3092} {"train_loss": -25.779315948486328, "global_step": 256702, "epoch": 3092} {"train_loss": -25.319974899291992, "global_step": 256703, "epoch": 3092} {"train_loss": -25.01905632019043, "global_step": 256704, "epoch": 3092} {"train_loss": -25.31985855102539, "global_step": 256705, "epoch": 3092} {"train_loss": -25.15865135192871, "global_step": 256706, "epoch": 3092} {"train_loss": -25.343297958374023, "global_step": 256707, "epoch": 3092} {"train_loss": -25.289770126342773, "global_step": 256708, "epoch": 3092} {"train_loss": -25.103315353393555, "global_step": 256709, "epoch": 3092} {"train_loss": -25.000883102416992, "global_step": 256710, "epoch": 3092} {"train_loss": -25.28279685974121, "global_step": 256711, "epoch": 3092} {"train_loss": -25.071664810180664, "global_step": 256712, "epoch": 3092} {"train_loss": -24.975324630737305, "global_step": 256713, "epoch": 3092} {"train_loss": -25.170618057250977, "global_step": 256714, "epoch": 3092} {"train_loss": -25.246702194213867, "global_step": 256715, "epoch": 3092} {"train_loss": -25.274686813354492, "global_step": 256716, "epoch": 3092} {"train_loss": -25.3651065826416, "global_step": 256717, "epoch": 3092} {"train_loss": -25.070348234061736, "global_step": 256718, "epoch": 3092, "val_loss": 6916289.0} {"train_loss": -24.29640769958496, "global_step": 256719, "epoch": 3093} {"train_loss": -23.967687606811523, "global_step": 256720, "epoch": 3093} {"train_loss": -23.709306716918945, "global_step": 256721, "epoch": 3093} {"train_loss": -24.609392166137695, "global_step": 256722, "epoch": 3093} {"train_loss": -24.819143295288086, "global_step": 256723, "epoch": 3093} {"train_loss": -24.052610397338867, "global_step": 256724, "epoch": 3093} {"train_loss": -24.412866592407227, "global_step": 256725, "epoch": 3093} {"train_loss": -24.36453628540039, "global_step": 256726, "epoch": 3093} {"train_loss": -24.041711807250977, "global_step": 256727, "epoch": 3093} {"train_loss": -24.71420669555664, "global_step": 256728, "epoch": 3093} {"train_loss": -24.552658081054688, "global_step": 256729, "epoch": 3093} {"train_loss": -24.605270385742188, "global_step": 256730, "epoch": 3093} {"train_loss": -24.928062438964844, "global_step": 256731, "epoch": 3093} {"train_loss": -24.899856567382812, "global_step": 256732, "epoch": 3093} {"train_loss": -24.41872215270996, "global_step": 256733, "epoch": 3093} {"train_loss": -24.971317291259766, "global_step": 256734, "epoch": 3093} {"train_loss": -24.70786476135254, "global_step": 256735, "epoch": 3093} {"train_loss": -25.035232543945312, "global_step": 256736, "epoch": 3093} {"train_loss": -24.859045028686523, "global_step": 256737, "epoch": 3093} {"train_loss": -24.703229904174805, "global_step": 256738, "epoch": 3093} {"train_loss": -24.643217086791992, "global_step": 256739, "epoch": 3093} {"train_loss": -25.28642463684082, "global_step": 256740, "epoch": 3093} {"train_loss": -24.830307006835938, "global_step": 256741, "epoch": 3093} {"train_loss": -24.70247459411621, "global_step": 256742, "epoch": 3093} {"train_loss": -25.060684204101562, "global_step": 256743, "epoch": 3093} {"train_loss": -24.726703643798828, "global_step": 256744, "epoch": 3093} {"train_loss": -24.948467254638672, "global_step": 256745, "epoch": 3093} {"train_loss": -25.207456588745117, "global_step": 256746, "epoch": 3093} {"train_loss": -25.304489135742188, "global_step": 256747, "epoch": 3093} {"train_loss": -25.183887481689453, "global_step": 256748, "epoch": 3093} {"train_loss": -24.798009872436523, "global_step": 256749, "epoch": 3093} {"train_loss": -25.060726165771484, "global_step": 256750, "epoch": 3093} {"train_loss": -25.102514266967773, "global_step": 256751, "epoch": 3093} {"train_loss": -25.335525512695312, "global_step": 256752, "epoch": 3093} {"train_loss": -25.31592559814453, "global_step": 256753, "epoch": 3093} {"train_loss": -25.162275314331055, "global_step": 256754, "epoch": 3093} {"train_loss": -25.34037208557129, "global_step": 256755, "epoch": 3093} {"train_loss": -25.020963668823242, "global_step": 256756, "epoch": 3093} {"train_loss": -25.270801544189453, "global_step": 256757, "epoch": 3093} {"train_loss": -25.644269943237305, "global_step": 256758, "epoch": 3093} {"train_loss": -25.071443557739258, "global_step": 256759, "epoch": 3093} {"train_loss": -25.496356964111328, "global_step": 256760, "epoch": 3093} {"train_loss": -25.211355209350586, "global_step": 256761, "epoch": 3093} {"train_loss": -25.303922653198242, "global_step": 256762, "epoch": 3093} {"train_loss": -25.051891326904297, "global_step": 256763, "epoch": 3093} {"train_loss": -24.973674774169922, "global_step": 256764, "epoch": 3093} {"train_loss": -25.6771297454834, "global_step": 256765, "epoch": 3093} {"train_loss": -25.224124908447266, "global_step": 256766, "epoch": 3093} {"train_loss": -25.067432403564453, "global_step": 256767, "epoch": 3093} {"train_loss": -25.309080123901367, "global_step": 256768, "epoch": 3093} {"train_loss": -25.550092697143555, "global_step": 256769, "epoch": 3093} {"train_loss": -25.150409698486328, "global_step": 256770, "epoch": 3093} {"train_loss": -25.350290298461914, "global_step": 256771, "epoch": 3093} {"train_loss": -25.106740951538086, "global_step": 256772, "epoch": 3093} {"train_loss": -25.52998161315918, "global_step": 256773, "epoch": 3093} {"train_loss": -25.095233917236328, "global_step": 256774, "epoch": 3093} {"train_loss": -25.491539001464844, "global_step": 256775, "epoch": 3093} {"train_loss": -25.376604080200195, "global_step": 256776, "epoch": 3093} {"train_loss": -25.41400909423828, "global_step": 256777, "epoch": 3093} {"train_loss": -25.329696655273438, "global_step": 256778, "epoch": 3093} {"train_loss": -25.40997314453125, "global_step": 256779, "epoch": 3093} {"train_loss": -25.552167892456055, "global_step": 256780, "epoch": 3093} {"train_loss": -25.1136417388916, "global_step": 256781, "epoch": 3093} {"train_loss": -25.055133819580078, "global_step": 256782, "epoch": 3093} {"train_loss": -25.039505004882812, "global_step": 256783, "epoch": 3093} {"train_loss": -24.895191192626953, "global_step": 256784, "epoch": 3093} {"train_loss": -25.65289306640625, "global_step": 256785, "epoch": 3093} {"train_loss": -25.2006893157959, "global_step": 256786, "epoch": 3093} {"train_loss": -25.40471076965332, "global_step": 256787, "epoch": 3093} {"train_loss": -25.279356002807617, "global_step": 256788, "epoch": 3093} {"train_loss": -25.521699905395508, "global_step": 256789, "epoch": 3093} {"train_loss": -25.046232223510742, "global_step": 256790, "epoch": 3093} {"train_loss": -25.08917236328125, "global_step": 256791, "epoch": 3093} {"train_loss": -25.319162368774414, "global_step": 256792, "epoch": 3093} {"train_loss": -25.115880966186523, "global_step": 256793, "epoch": 3093} {"train_loss": -24.829999923706055, "global_step": 256794, "epoch": 3093} {"train_loss": -25.261615753173828, "global_step": 256795, "epoch": 3093} {"train_loss": -24.7572078704834, "global_step": 256796, "epoch": 3093} {"train_loss": -24.94725799560547, "global_step": 256797, "epoch": 3093} {"train_loss": -25.2130069732666, "global_step": 256798, "epoch": 3093} {"train_loss": -25.1661434173584, "global_step": 256799, "epoch": 3093} {"train_loss": -25.182952880859375, "global_step": 256800, "epoch": 3093} {"train_loss": -25.022941451474846, "global_step": 256801, "epoch": 3093, "val_loss": 7073016.5} {"train_loss": -24.92806053161621, "global_step": 256802, "epoch": 3094} {"train_loss": -25.200668334960938, "global_step": 256803, "epoch": 3094} {"train_loss": -24.75534439086914, "global_step": 256804, "epoch": 3094} {"train_loss": -24.71413230895996, "global_step": 256805, "epoch": 3094} {"train_loss": -24.61187171936035, "global_step": 256806, "epoch": 3094} {"train_loss": -25.102359771728516, "global_step": 256807, "epoch": 3094} {"train_loss": -24.440771102905273, "global_step": 256808, "epoch": 3094} {"train_loss": -24.955095291137695, "global_step": 256809, "epoch": 3094} {"train_loss": -24.81052017211914, "global_step": 256810, "epoch": 3094} {"train_loss": -24.818601608276367, "global_step": 256811, "epoch": 3094} {"train_loss": -24.8603572845459, "global_step": 256812, "epoch": 3094} {"train_loss": -24.835712432861328, "global_step": 256813, "epoch": 3094} {"train_loss": -25.090787887573242, "global_step": 256814, "epoch": 3094} {"train_loss": -24.641357421875, "global_step": 256815, "epoch": 3094} {"train_loss": -24.82008934020996, "global_step": 256816, "epoch": 3094} {"train_loss": -24.72515869140625, "global_step": 256817, "epoch": 3094} {"train_loss": -24.93812370300293, "global_step": 256818, "epoch": 3094} {"train_loss": -25.0346622467041, "global_step": 256819, "epoch": 3094} {"train_loss": -25.092771530151367, "global_step": 256820, "epoch": 3094} {"train_loss": -24.974206924438477, "global_step": 256821, "epoch": 3094} {"train_loss": -25.03239631652832, "global_step": 256822, "epoch": 3094} {"train_loss": -24.782434463500977, "global_step": 256823, "epoch": 3094} {"train_loss": -24.932086944580078, "global_step": 256824, "epoch": 3094} {"train_loss": -24.93305015563965, "global_step": 256825, "epoch": 3094} {"train_loss": -24.873395919799805, "global_step": 256826, "epoch": 3094} {"train_loss": -25.25170135498047, "global_step": 256827, "epoch": 3094} {"train_loss": -24.556638717651367, "global_step": 256828, "epoch": 3094} {"train_loss": -25.241195678710938, "global_step": 256829, "epoch": 3094} {"train_loss": -24.872468948364258, "global_step": 256830, "epoch": 3094} {"train_loss": -25.045610427856445, "global_step": 256831, "epoch": 3094} {"train_loss": -25.215360641479492, "global_step": 256832, "epoch": 3094} {"train_loss": -24.957082748413086, "global_step": 256833, "epoch": 3094} {"train_loss": -24.861621856689453, "global_step": 256834, "epoch": 3094} {"train_loss": -25.539026260375977, "global_step": 256835, "epoch": 3094} {"train_loss": -25.2104549407959, "global_step": 256836, "epoch": 3094} {"train_loss": -25.10477066040039, "global_step": 256837, "epoch": 3094} {"train_loss": -24.94083595275879, "global_step": 256838, "epoch": 3094} {"train_loss": -25.34712791442871, "global_step": 256839, "epoch": 3094} {"train_loss": -25.24333953857422, "global_step": 256840, "epoch": 3094} {"train_loss": -25.190671920776367, "global_step": 256841, "epoch": 3094} {"train_loss": -24.819028854370117, "global_step": 256842, "epoch": 3094} {"train_loss": -25.16436767578125, "global_step": 256843, "epoch": 3094} {"train_loss": -25.206205368041992, "global_step": 256844, "epoch": 3094} {"train_loss": -25.1275691986084, "global_step": 256845, "epoch": 3094} {"train_loss": -25.071292877197266, "global_step": 256846, "epoch": 3094} {"train_loss": -25.117013931274414, "global_step": 256847, "epoch": 3094} {"train_loss": -24.89166831970215, "global_step": 256848, "epoch": 3094} {"train_loss": -25.406057357788086, "global_step": 256849, "epoch": 3094} {"train_loss": -25.238576889038086, "global_step": 256850, "epoch": 3094} {"train_loss": -24.861557006835938, "global_step": 256851, "epoch": 3094} {"train_loss": -25.372591018676758, "global_step": 256852, "epoch": 3094} {"train_loss": -24.699932098388672, "global_step": 256853, "epoch": 3094} {"train_loss": -25.153825759887695, "global_step": 256854, "epoch": 3094} {"train_loss": -25.0665283203125, "global_step": 256855, "epoch": 3094} {"train_loss": -25.055984497070312, "global_step": 256856, "epoch": 3094} {"train_loss": -25.10713768005371, "global_step": 256857, "epoch": 3094} {"train_loss": -24.578596115112305, "global_step": 256858, "epoch": 3094} {"train_loss": -24.815027236938477, "global_step": 256859, "epoch": 3094} {"train_loss": -25.339109420776367, "global_step": 256860, "epoch": 3094} {"train_loss": -24.936155319213867, "global_step": 256861, "epoch": 3094} {"train_loss": -24.62920570373535, "global_step": 256862, "epoch": 3094} {"train_loss": -25.448150634765625, "global_step": 256863, "epoch": 3094} {"train_loss": -24.465869903564453, "global_step": 256864, "epoch": 3094} {"train_loss": -24.618885040283203, "global_step": 256865, "epoch": 3094} {"train_loss": -24.997360229492188, "global_step": 256866, "epoch": 3094} {"train_loss": -25.48374366760254, "global_step": 256867, "epoch": 3094} {"train_loss": -25.16631507873535, "global_step": 256868, "epoch": 3094} {"train_loss": -25.266775131225586, "global_step": 256869, "epoch": 3094} {"train_loss": -25.184200286865234, "global_step": 256870, "epoch": 3094} {"train_loss": -25.18781852722168, "global_step": 256871, "epoch": 3094} {"train_loss": -25.412235260009766, "global_step": 256872, "epoch": 3094} {"train_loss": -25.0604305267334, "global_step": 256873, "epoch": 3094} {"train_loss": -25.229629516601562, "global_step": 256874, "epoch": 3094} {"train_loss": -25.38074493408203, "global_step": 256875, "epoch": 3094} {"train_loss": -25.126325607299805, "global_step": 256876, "epoch": 3094} {"train_loss": -25.126949310302734, "global_step": 256877, "epoch": 3094} {"train_loss": -25.103492736816406, "global_step": 256878, "epoch": 3094} {"train_loss": -24.809751510620117, "global_step": 256879, "epoch": 3094} {"train_loss": -25.121381759643555, "global_step": 256880, "epoch": 3094} {"train_loss": -24.934017181396484, "global_step": 256881, "epoch": 3094} {"train_loss": -24.837743759155273, "global_step": 256882, "epoch": 3094} {"train_loss": -24.792848587036133, "global_step": 256883, "epoch": 3094} {"train_loss": -25.024175735841315, "global_step": 256884, "epoch": 3094, "val_loss": 6932461.0} {"train_loss": -24.436010360717773, "global_step": 256885, "epoch": 3095} {"train_loss": -24.708776473999023, "global_step": 256886, "epoch": 3095} {"train_loss": -24.05940818786621, "global_step": 256887, "epoch": 3095} {"train_loss": -22.861318588256836, "global_step": 256888, "epoch": 3095} {"train_loss": -23.898731231689453, "global_step": 256889, "epoch": 3095} {"train_loss": -23.894025802612305, "global_step": 256890, "epoch": 3095} {"train_loss": -24.597126007080078, "global_step": 256891, "epoch": 3095} {"train_loss": -23.81732940673828, "global_step": 256892, "epoch": 3095} {"train_loss": -24.93007469177246, "global_step": 256893, "epoch": 3095} {"train_loss": -24.39173126220703, "global_step": 256894, "epoch": 3095} {"train_loss": -24.268447875976562, "global_step": 256895, "epoch": 3095} {"train_loss": -24.535545349121094, "global_step": 256896, "epoch": 3095} {"train_loss": -25.10074234008789, "global_step": 256897, "epoch": 3095} {"train_loss": -24.291715621948242, "global_step": 256898, "epoch": 3095} {"train_loss": -24.561851501464844, "global_step": 256899, "epoch": 3095} {"train_loss": -24.98261070251465, "global_step": 256900, "epoch": 3095} {"train_loss": -24.6445255279541, "global_step": 256901, "epoch": 3095} {"train_loss": -25.27921485900879, "global_step": 256902, "epoch": 3095} {"train_loss": -24.592199325561523, "global_step": 256903, "epoch": 3095} {"train_loss": -24.737117767333984, "global_step": 256904, "epoch": 3095} {"train_loss": -24.768360137939453, "global_step": 256905, "epoch": 3095} {"train_loss": -24.443567276000977, "global_step": 256906, "epoch": 3095} {"train_loss": -24.496530532836914, "global_step": 256907, "epoch": 3095} {"train_loss": -24.82234001159668, "global_step": 256908, "epoch": 3095} {"train_loss": -24.664220809936523, "global_step": 256909, "epoch": 3095} {"train_loss": -24.422256469726562, "global_step": 256910, "epoch": 3095} {"train_loss": -25.245786666870117, "global_step": 256911, "epoch": 3095} {"train_loss": -24.80744171142578, "global_step": 256912, "epoch": 3095} {"train_loss": -24.76690101623535, "global_step": 256913, "epoch": 3095} {"train_loss": -24.851903915405273, "global_step": 256914, "epoch": 3095} {"train_loss": -24.669179916381836, "global_step": 256915, "epoch": 3095} {"train_loss": -24.85157585144043, "global_step": 256916, "epoch": 3095} {"train_loss": -24.924665451049805, "global_step": 256917, "epoch": 3095} {"train_loss": -25.01789665222168, "global_step": 256918, "epoch": 3095} {"train_loss": -25.01417350769043, "global_step": 256919, "epoch": 3095} {"train_loss": -24.63804054260254, "global_step": 256920, "epoch": 3095} {"train_loss": -24.712440490722656, "global_step": 256921, "epoch": 3095} {"train_loss": -25.264118194580078, "global_step": 256922, "epoch": 3095} {"train_loss": -24.8234806060791, "global_step": 256923, "epoch": 3095} {"train_loss": -24.898487091064453, "global_step": 256924, "epoch": 3095} {"train_loss": -24.691307067871094, "global_step": 256925, "epoch": 3095} {"train_loss": -25.01279067993164, "global_step": 256926, "epoch": 3095} {"train_loss": -25.5068359375, "global_step": 256927, "epoch": 3095} {"train_loss": -25.39409637451172, "global_step": 256928, "epoch": 3095} {"train_loss": -25.470041275024414, "global_step": 256929, "epoch": 3095} {"train_loss": -25.12617301940918, "global_step": 256930, "epoch": 3095} {"train_loss": -25.496288299560547, "global_step": 256931, "epoch": 3095} {"train_loss": -25.28189468383789, "global_step": 256932, "epoch": 3095} {"train_loss": -25.221206665039062, "global_step": 256933, "epoch": 3095} {"train_loss": -25.042428970336914, "global_step": 256934, "epoch": 3095} {"train_loss": -25.295063018798828, "global_step": 256935, "epoch": 3095} {"train_loss": -25.289104461669922, "global_step": 256936, "epoch": 3095} {"train_loss": -25.082124710083008, "global_step": 256937, "epoch": 3095} {"train_loss": -25.111032485961914, "global_step": 256938, "epoch": 3095} {"train_loss": -24.680593490600586, "global_step": 256939, "epoch": 3095} {"train_loss": -24.371599197387695, "global_step": 256940, "epoch": 3095} {"train_loss": -24.62394142150879, "global_step": 256941, "epoch": 3095} {"train_loss": -25.142684936523438, "global_step": 256942, "epoch": 3095} {"train_loss": -24.8791561126709, "global_step": 256943, "epoch": 3095} {"train_loss": -24.584707260131836, "global_step": 256944, "epoch": 3095} {"train_loss": -25.316415786743164, "global_step": 256945, "epoch": 3095} {"train_loss": -25.035123825073242, "global_step": 256946, "epoch": 3095} {"train_loss": -25.295129776000977, "global_step": 256947, "epoch": 3095} {"train_loss": -24.959562301635742, "global_step": 256948, "epoch": 3095} {"train_loss": -25.03074073791504, "global_step": 256949, "epoch": 3095} {"train_loss": -24.863422393798828, "global_step": 256950, "epoch": 3095} {"train_loss": -25.12415885925293, "global_step": 256951, "epoch": 3095} {"train_loss": -24.998004913330078, "global_step": 256952, "epoch": 3095} {"train_loss": -25.11334228515625, "global_step": 256953, "epoch": 3095} {"train_loss": -25.224424362182617, "global_step": 256954, "epoch": 3095} {"train_loss": -25.092546463012695, "global_step": 256955, "epoch": 3095} {"train_loss": -24.81906509399414, "global_step": 256956, "epoch": 3095} {"train_loss": -24.706361770629883, "global_step": 256957, "epoch": 3095} {"train_loss": -25.166444778442383, "global_step": 256958, "epoch": 3095} {"train_loss": -24.833078384399414, "global_step": 256959, "epoch": 3095} {"train_loss": -25.169946670532227, "global_step": 256960, "epoch": 3095} {"train_loss": -25.059247970581055, "global_step": 256961, "epoch": 3095} {"train_loss": -25.169921875, "global_step": 256962, "epoch": 3095} {"train_loss": -24.782079696655273, "global_step": 256963, "epoch": 3095} {"train_loss": -25.397171020507812, "global_step": 256964, "epoch": 3095} {"train_loss": -25.36537742614746, "global_step": 256965, "epoch": 3095} {"train_loss": -24.93436622619629, "global_step": 256966, "epoch": 3095} {"train_loss": -24.855066644140038, "global_step": 256967, "epoch": 3095, "val_loss": 6801174.0} {"train_loss": -24.76117515563965, "global_step": 256968, "epoch": 3096} {"train_loss": -25.0139217376709, "global_step": 256969, "epoch": 3096} {"train_loss": -24.86614227294922, "global_step": 256970, "epoch": 3096} {"train_loss": -24.788854598999023, "global_step": 256971, "epoch": 3096} {"train_loss": -24.722257614135742, "global_step": 256972, "epoch": 3096} {"train_loss": -24.833358764648438, "global_step": 256973, "epoch": 3096} {"train_loss": -24.829397201538086, "global_step": 256974, "epoch": 3096} {"train_loss": -24.91151237487793, "global_step": 256975, "epoch": 3096} {"train_loss": -24.116674423217773, "global_step": 256976, "epoch": 3096} {"train_loss": -25.061464309692383, "global_step": 256977, "epoch": 3096} {"train_loss": -24.639068603515625, "global_step": 256978, "epoch": 3096} {"train_loss": -25.037458419799805, "global_step": 256979, "epoch": 3096} {"train_loss": -24.60923957824707, "global_step": 256980, "epoch": 3096} {"train_loss": -25.19612693786621, "global_step": 256981, "epoch": 3096} {"train_loss": -24.707015991210938, "global_step": 256982, "epoch": 3096} {"train_loss": -24.989913940429688, "global_step": 256983, "epoch": 3096} {"train_loss": -24.871665954589844, "global_step": 256984, "epoch": 3096} {"train_loss": -24.628482818603516, "global_step": 256985, "epoch": 3096} {"train_loss": -25.323043823242188, "global_step": 256986, "epoch": 3096} {"train_loss": -24.860055923461914, "global_step": 256987, "epoch": 3096} {"train_loss": -25.32733726501465, "global_step": 256988, "epoch": 3096} {"train_loss": -24.710296630859375, "global_step": 256989, "epoch": 3096} {"train_loss": -24.91303062438965, "global_step": 256990, "epoch": 3096} {"train_loss": -24.608642578125, "global_step": 256991, "epoch": 3096} {"train_loss": -25.141239166259766, "global_step": 256992, "epoch": 3096} {"train_loss": -24.94365882873535, "global_step": 256993, "epoch": 3096} {"train_loss": -24.973468780517578, "global_step": 256994, "epoch": 3096} {"train_loss": -24.888778686523438, "global_step": 256995, "epoch": 3096} {"train_loss": -25.306066513061523, "global_step": 256996, "epoch": 3096} {"train_loss": -25.22067642211914, "global_step": 256997, "epoch": 3096} {"train_loss": -24.929044723510742, "global_step": 256998, "epoch": 3096} {"train_loss": -25.075305938720703, "global_step": 256999, "epoch": 3096} {"train_loss": -24.980966567993164, "global_step": 257000, "epoch": 3096} {"train_loss": -25.37228775024414, "global_step": 257001, "epoch": 3096} {"train_loss": -24.91395378112793, "global_step": 257002, "epoch": 3096} {"train_loss": -25.23493003845215, "global_step": 257003, "epoch": 3096} {"train_loss": -25.000593185424805, "global_step": 257004, "epoch": 3096} {"train_loss": -24.97972297668457, "global_step": 257005, "epoch": 3096} {"train_loss": -25.467422485351562, "global_step": 257006, "epoch": 3096} {"train_loss": -25.036792755126953, "global_step": 257007, "epoch": 3096} {"train_loss": -25.28263282775879, "global_step": 257008, "epoch": 3096} {"train_loss": -24.9918155670166, "global_step": 257009, "epoch": 3096} {"train_loss": -25.209545135498047, "global_step": 257010, "epoch": 3096} {"train_loss": -25.347257614135742, "global_step": 257011, "epoch": 3096} {"train_loss": -25.1038875579834, "global_step": 257012, "epoch": 3096} {"train_loss": -25.158954620361328, "global_step": 257013, "epoch": 3096} {"train_loss": -25.098480224609375, "global_step": 257014, "epoch": 3096} {"train_loss": -24.97296142578125, "global_step": 257015, "epoch": 3096} {"train_loss": -25.013885498046875, "global_step": 257016, "epoch": 3096} {"train_loss": -25.359256744384766, "global_step": 257017, "epoch": 3096} {"train_loss": -24.92827796936035, "global_step": 257018, "epoch": 3096} {"train_loss": -25.0982723236084, "global_step": 257019, "epoch": 3096} {"train_loss": -25.43096923828125, "global_step": 257020, "epoch": 3096} {"train_loss": -25.621572494506836, "global_step": 257021, "epoch": 3096} {"train_loss": -25.102413177490234, "global_step": 257022, "epoch": 3096} {"train_loss": -25.60828971862793, "global_step": 257023, "epoch": 3096} {"train_loss": -25.142385482788086, "global_step": 257024, "epoch": 3096} {"train_loss": -25.014219284057617, "global_step": 257025, "epoch": 3096} {"train_loss": -25.14227294921875, "global_step": 257026, "epoch": 3096} {"train_loss": -25.22755241394043, "global_step": 257027, "epoch": 3096} {"train_loss": -25.62906837463379, "global_step": 257028, "epoch": 3096} {"train_loss": -25.344505310058594, "global_step": 257029, "epoch": 3096} {"train_loss": -25.40682029724121, "global_step": 257030, "epoch": 3096} {"train_loss": -25.45134162902832, "global_step": 257031, "epoch": 3096} {"train_loss": -25.175718307495117, "global_step": 257032, "epoch": 3096} {"train_loss": -25.440448760986328, "global_step": 257033, "epoch": 3096} {"train_loss": -25.27783203125, "global_step": 257034, "epoch": 3096} {"train_loss": -25.602872848510742, "global_step": 257035, "epoch": 3096} {"train_loss": -25.44986343383789, "global_step": 257036, "epoch": 3096} {"train_loss": -25.061843872070312, "global_step": 257037, "epoch": 3096} {"train_loss": -24.40005874633789, "global_step": 257038, "epoch": 3096} {"train_loss": -24.103294372558594, "global_step": 257039, "epoch": 3096} {"train_loss": -24.081668853759766, "global_step": 257040, "epoch": 3096} {"train_loss": -24.26386070251465, "global_step": 257041, "epoch": 3096} {"train_loss": -25.0277099609375, "global_step": 257042, "epoch": 3096} {"train_loss": -24.279367446899414, "global_step": 257043, "epoch": 3096} {"train_loss": -25.19832420349121, "global_step": 257044, "epoch": 3096} {"train_loss": -24.833473205566406, "global_step": 257045, "epoch": 3096} {"train_loss": -24.82712173461914, "global_step": 257046, "epoch": 3096} {"train_loss": -24.50652503967285, "global_step": 257047, "epoch": 3096} {"train_loss": -24.833131790161133, "global_step": 257048, "epoch": 3096} {"train_loss": -24.94392204284668, "global_step": 257049, "epoch": 3096} {"train_loss": -25.0128242538636, "global_step": 257050, "epoch": 3096, "val_loss": 6792092.0} {"train_loss": -24.203231811523438, "global_step": 257051, "epoch": 3097} {"train_loss": -24.33283042907715, "global_step": 257052, "epoch": 3097} {"train_loss": -24.129236221313477, "global_step": 257053, "epoch": 3097} {"train_loss": -24.637144088745117, "global_step": 257054, "epoch": 3097} {"train_loss": -24.584074020385742, "global_step": 257055, "epoch": 3097} {"train_loss": -24.53551483154297, "global_step": 257056, "epoch": 3097} {"train_loss": -24.48003578186035, "global_step": 257057, "epoch": 3097} {"train_loss": -25.373319625854492, "global_step": 257058, "epoch": 3097} {"train_loss": -24.399986267089844, "global_step": 257059, "epoch": 3097} {"train_loss": -24.65333366394043, "global_step": 257060, "epoch": 3097} {"train_loss": -24.492721557617188, "global_step": 257061, "epoch": 3097} {"train_loss": -24.924047470092773, "global_step": 257062, "epoch": 3097} {"train_loss": -24.66630744934082, "global_step": 257063, "epoch": 3097} {"train_loss": -24.828657150268555, "global_step": 257064, "epoch": 3097} {"train_loss": -24.923612594604492, "global_step": 257065, "epoch": 3097} {"train_loss": -24.943422317504883, "global_step": 257066, "epoch": 3097} {"train_loss": -24.763586044311523, "global_step": 257067, "epoch": 3097} {"train_loss": -24.47579002380371, "global_step": 257068, "epoch": 3097} {"train_loss": -24.989639282226562, "global_step": 257069, "epoch": 3097} {"train_loss": -24.88291358947754, "global_step": 257070, "epoch": 3097} {"train_loss": -24.742780685424805, "global_step": 257071, "epoch": 3097} {"train_loss": -24.74537467956543, "global_step": 257072, "epoch": 3097} {"train_loss": -24.436702728271484, "global_step": 257073, "epoch": 3097} {"train_loss": -24.914443969726562, "global_step": 257074, "epoch": 3097} {"train_loss": -24.810720443725586, "global_step": 257075, "epoch": 3097} {"train_loss": -25.415925979614258, "global_step": 257076, "epoch": 3097} {"train_loss": -24.781110763549805, "global_step": 257077, "epoch": 3097} {"train_loss": -25.260868072509766, "global_step": 257078, "epoch": 3097} {"train_loss": -25.04963493347168, "global_step": 257079, "epoch": 3097} {"train_loss": -25.5184326171875, "global_step": 257080, "epoch": 3097} {"train_loss": -25.40081024169922, "global_step": 257081, "epoch": 3097} {"train_loss": -25.145118713378906, "global_step": 257082, "epoch": 3097} {"train_loss": -25.393661499023438, "global_step": 257083, "epoch": 3097} {"train_loss": -25.106292724609375, "global_step": 257084, "epoch": 3097} {"train_loss": -25.155895233154297, "global_step": 257085, "epoch": 3097} {"train_loss": -25.38121795654297, "global_step": 257086, "epoch": 3097} {"train_loss": -25.640640258789062, "global_step": 257087, "epoch": 3097} {"train_loss": -24.983238220214844, "global_step": 257088, "epoch": 3097} {"train_loss": -25.208494186401367, "global_step": 257089, "epoch": 3097} {"train_loss": -25.266416549682617, "global_step": 257090, "epoch": 3097} {"train_loss": -24.859695434570312, "global_step": 257091, "epoch": 3097} {"train_loss": -25.21761131286621, "global_step": 257092, "epoch": 3097} {"train_loss": -25.154829025268555, "global_step": 257093, "epoch": 3097} {"train_loss": -24.938627243041992, "global_step": 257094, "epoch": 3097} {"train_loss": -24.91362190246582, "global_step": 257095, "epoch": 3097} {"train_loss": -25.0858097076416, "global_step": 257096, "epoch": 3097} {"train_loss": -25.095060348510742, "global_step": 257097, "epoch": 3097} {"train_loss": -24.935062408447266, "global_step": 257098, "epoch": 3097} {"train_loss": -25.3001766204834, "global_step": 257099, "epoch": 3097} {"train_loss": -25.433313369750977, "global_step": 257100, "epoch": 3097} {"train_loss": -25.126632690429688, "global_step": 257101, "epoch": 3097} {"train_loss": -24.96942710876465, "global_step": 257102, "epoch": 3097} {"train_loss": -24.927488327026367, "global_step": 257103, "epoch": 3097} {"train_loss": -24.732227325439453, "global_step": 257104, "epoch": 3097} {"train_loss": -25.30402183532715, "global_step": 257105, "epoch": 3097} {"train_loss": -25.492464065551758, "global_step": 257106, "epoch": 3097} {"train_loss": -24.971242904663086, "global_step": 257107, "epoch": 3097} {"train_loss": -24.834611892700195, "global_step": 257108, "epoch": 3097} {"train_loss": -25.09299087524414, "global_step": 257109, "epoch": 3097} {"train_loss": -25.053234100341797, "global_step": 257110, "epoch": 3097} {"train_loss": -24.980924606323242, "global_step": 257111, "epoch": 3097} {"train_loss": -25.175329208374023, "global_step": 257112, "epoch": 3097} {"train_loss": -25.2640438079834, "global_step": 257113, "epoch": 3097} {"train_loss": -24.70921516418457, "global_step": 257114, "epoch": 3097} {"train_loss": -25.049795150756836, "global_step": 257115, "epoch": 3097} {"train_loss": -25.00665283203125, "global_step": 257116, "epoch": 3097} {"train_loss": -24.85595703125, "global_step": 257117, "epoch": 3097} {"train_loss": -25.29762077331543, "global_step": 257118, "epoch": 3097} {"train_loss": -25.62241554260254, "global_step": 257119, "epoch": 3097} {"train_loss": -25.09783935546875, "global_step": 257120, "epoch": 3097} {"train_loss": -25.481565475463867, "global_step": 257121, "epoch": 3097} {"train_loss": -25.30904197692871, "global_step": 257122, "epoch": 3097} {"train_loss": -24.82662010192871, "global_step": 257123, "epoch": 3097} {"train_loss": -25.182315826416016, "global_step": 257124, "epoch": 3097} {"train_loss": -25.077314376831055, "global_step": 257125, "epoch": 3097} {"train_loss": -25.123159408569336, "global_step": 257126, "epoch": 3097} {"train_loss": -25.238386154174805, "global_step": 257127, "epoch": 3097} {"train_loss": -25.470142364501953, "global_step": 257128, "epoch": 3097} {"train_loss": -25.335216522216797, "global_step": 257129, "epoch": 3097} {"train_loss": -25.37424087524414, "global_step": 257130, "epoch": 3097} {"train_loss": -25.516263961791992, "global_step": 257131, "epoch": 3097} {"train_loss": -25.104496002197266, "global_step": 257132, "epoch": 3097} {"train_loss": -25.017565784684148, "global_step": 257133, "epoch": 3097, "val_loss": 6869283.0} {"train_loss": -24.92051124572754, "global_step": 257134, "epoch": 3098} {"train_loss": -25.033273696899414, "global_step": 257135, "epoch": 3098} {"train_loss": -24.653894424438477, "global_step": 257136, "epoch": 3098} {"train_loss": -24.919692993164062, "global_step": 257137, "epoch": 3098} {"train_loss": -24.98002815246582, "global_step": 257138, "epoch": 3098} {"train_loss": -25.010086059570312, "global_step": 257139, "epoch": 3098} {"train_loss": -24.56798553466797, "global_step": 257140, "epoch": 3098} {"train_loss": -24.596576690673828, "global_step": 257141, "epoch": 3098} {"train_loss": -24.850706100463867, "global_step": 257142, "epoch": 3098} {"train_loss": -24.84354591369629, "global_step": 257143, "epoch": 3098} {"train_loss": -24.925384521484375, "global_step": 257144, "epoch": 3098} {"train_loss": -24.883914947509766, "global_step": 257145, "epoch": 3098} {"train_loss": -24.963314056396484, "global_step": 257146, "epoch": 3098} {"train_loss": -24.919754028320312, "global_step": 257147, "epoch": 3098} {"train_loss": -25.370939254760742, "global_step": 257148, "epoch": 3098} {"train_loss": -25.023527145385742, "global_step": 257149, "epoch": 3098} {"train_loss": -24.95697593688965, "global_step": 257150, "epoch": 3098} {"train_loss": -25.37468910217285, "global_step": 257151, "epoch": 3098} {"train_loss": -24.954431533813477, "global_step": 257152, "epoch": 3098} {"train_loss": -24.97784996032715, "global_step": 257153, "epoch": 3098} {"train_loss": -25.490625381469727, "global_step": 257154, "epoch": 3098} {"train_loss": -24.870311737060547, "global_step": 257155, "epoch": 3098} {"train_loss": -24.933382034301758, "global_step": 257156, "epoch": 3098} {"train_loss": -25.281949996948242, "global_step": 257157, "epoch": 3098} {"train_loss": -25.158472061157227, "global_step": 257158, "epoch": 3098} {"train_loss": -25.13544273376465, "global_step": 257159, "epoch": 3098} {"train_loss": -25.216062545776367, "global_step": 257160, "epoch": 3098} {"train_loss": -25.149280548095703, "global_step": 257161, "epoch": 3098} {"train_loss": -24.76459503173828, "global_step": 257162, "epoch": 3098} {"train_loss": -25.165815353393555, "global_step": 257163, "epoch": 3098} {"train_loss": -25.05653190612793, "global_step": 257164, "epoch": 3098} {"train_loss": -24.600727081298828, "global_step": 257165, "epoch": 3098} {"train_loss": -24.9633846282959, "global_step": 257166, "epoch": 3098} {"train_loss": -25.006887435913086, "global_step": 257167, "epoch": 3098} {"train_loss": -25.045774459838867, "global_step": 257168, "epoch": 3098} {"train_loss": -25.362836837768555, "global_step": 257169, "epoch": 3098} {"train_loss": -24.872276306152344, "global_step": 257170, "epoch": 3098} {"train_loss": -25.49495506286621, "global_step": 257171, "epoch": 3098} {"train_loss": -24.96783447265625, "global_step": 257172, "epoch": 3098} {"train_loss": -25.08152198791504, "global_step": 257173, "epoch": 3098} {"train_loss": -24.840421676635742, "global_step": 257174, "epoch": 3098} {"train_loss": -25.419729232788086, "global_step": 257175, "epoch": 3098} {"train_loss": -24.818174362182617, "global_step": 257176, "epoch": 3098} {"train_loss": -25.049396514892578, "global_step": 257177, "epoch": 3098} {"train_loss": -25.078022003173828, "global_step": 257178, "epoch": 3098} {"train_loss": -25.07931900024414, "global_step": 257179, "epoch": 3098} {"train_loss": -25.427335739135742, "global_step": 257180, "epoch": 3098} {"train_loss": -24.975452423095703, "global_step": 257181, "epoch": 3098} {"train_loss": -25.137205123901367, "global_step": 257182, "epoch": 3098} {"train_loss": -25.416296005249023, "global_step": 257183, "epoch": 3098} {"train_loss": -25.35072898864746, "global_step": 257184, "epoch": 3098} {"train_loss": -24.95499610900879, "global_step": 257185, "epoch": 3098} {"train_loss": -25.104629516601562, "global_step": 257186, "epoch": 3098} {"train_loss": -25.123886108398438, "global_step": 257187, "epoch": 3098} {"train_loss": -24.902616500854492, "global_step": 257188, "epoch": 3098} {"train_loss": -25.3509578704834, "global_step": 257189, "epoch": 3098} {"train_loss": -25.010496139526367, "global_step": 257190, "epoch": 3098} {"train_loss": -25.342670440673828, "global_step": 257191, "epoch": 3098} {"train_loss": -25.343252182006836, "global_step": 257192, "epoch": 3098} {"train_loss": -25.3701114654541, "global_step": 257193, "epoch": 3098} {"train_loss": -25.067869186401367, "global_step": 257194, "epoch": 3098} {"train_loss": -25.162811279296875, "global_step": 257195, "epoch": 3098} {"train_loss": -25.01008415222168, "global_step": 257196, "epoch": 3098} {"train_loss": -24.981346130371094, "global_step": 257197, "epoch": 3098} {"train_loss": -25.080204010009766, "global_step": 257198, "epoch": 3098} {"train_loss": -25.086151123046875, "global_step": 257199, "epoch": 3098} {"train_loss": -25.30125617980957, "global_step": 257200, "epoch": 3098} {"train_loss": -25.164627075195312, "global_step": 257201, "epoch": 3098} {"train_loss": -24.973793029785156, "global_step": 257202, "epoch": 3098} {"train_loss": -25.02908706665039, "global_step": 257203, "epoch": 3098} {"train_loss": -25.218421936035156, "global_step": 257204, "epoch": 3098} {"train_loss": -24.994205474853516, "global_step": 257205, "epoch": 3098} {"train_loss": -25.296142578125, "global_step": 257206, "epoch": 3098} {"train_loss": -25.086217880249023, "global_step": 257207, "epoch": 3098} {"train_loss": -25.042882919311523, "global_step": 257208, "epoch": 3098} {"train_loss": -25.354732513427734, "global_step": 257209, "epoch": 3098} {"train_loss": -24.92408561706543, "global_step": 257210, "epoch": 3098} {"train_loss": -25.431970596313477, "global_step": 257211, "epoch": 3098} {"train_loss": -25.448896408081055, "global_step": 257212, "epoch": 3098} {"train_loss": -25.565515518188477, "global_step": 257213, "epoch": 3098} {"train_loss": -25.530942916870117, "global_step": 257214, "epoch": 3098} {"train_loss": -25.3415470123291, "global_step": 257215, "epoch": 3098} {"train_loss": -25.08870533862746, "global_step": 257216, "epoch": 3098, "val_loss": 6944864.5} {"train_loss": -25.100448608398438, "global_step": 257217, "epoch": 3099} {"train_loss": -24.06285285949707, "global_step": 257218, "epoch": 3099} {"train_loss": -24.985591888427734, "global_step": 257219, "epoch": 3099} {"train_loss": -24.750110626220703, "global_step": 257220, "epoch": 3099} {"train_loss": -24.545637130737305, "global_step": 257221, "epoch": 3099} {"train_loss": -24.428308486938477, "global_step": 257222, "epoch": 3099} {"train_loss": -24.642555236816406, "global_step": 257223, "epoch": 3099} {"train_loss": -24.890247344970703, "global_step": 257224, "epoch": 3099} {"train_loss": -24.662220001220703, "global_step": 257225, "epoch": 3099} {"train_loss": -24.979450225830078, "global_step": 257226, "epoch": 3099} {"train_loss": -25.017148971557617, "global_step": 257227, "epoch": 3099} {"train_loss": -24.78230857849121, "global_step": 257228, "epoch": 3099} {"train_loss": -25.089622497558594, "global_step": 257229, "epoch": 3099} {"train_loss": -24.813642501831055, "global_step": 257230, "epoch": 3099} {"train_loss": -24.51068687438965, "global_step": 257231, "epoch": 3099} {"train_loss": -25.177001953125, "global_step": 257232, "epoch": 3099} {"train_loss": -24.940109252929688, "global_step": 257233, "epoch": 3099} {"train_loss": -24.409849166870117, "global_step": 257234, "epoch": 3099} {"train_loss": -24.802371978759766, "global_step": 257235, "epoch": 3099} {"train_loss": -25.305753707885742, "global_step": 257236, "epoch": 3099} {"train_loss": -24.941394805908203, "global_step": 257237, "epoch": 3099} {"train_loss": -24.93184471130371, "global_step": 257238, "epoch": 3099} {"train_loss": -25.15260124206543, "global_step": 257239, "epoch": 3099} {"train_loss": -25.177663803100586, "global_step": 257240, "epoch": 3099} {"train_loss": -25.09810447692871, "global_step": 257241, "epoch": 3099} {"train_loss": -25.133991241455078, "global_step": 257242, "epoch": 3099} {"train_loss": -25.209806442260742, "global_step": 257243, "epoch": 3099} {"train_loss": -25.39873504638672, "global_step": 257244, "epoch": 3099} {"train_loss": -25.234922409057617, "global_step": 257245, "epoch": 3099} {"train_loss": -25.33400535583496, "global_step": 257246, "epoch": 3099} {"train_loss": -25.045513153076172, "global_step": 257247, "epoch": 3099} {"train_loss": -24.84969139099121, "global_step": 257248, "epoch": 3099} {"train_loss": -25.047462463378906, "global_step": 257249, "epoch": 3099} {"train_loss": -25.37298583984375, "global_step": 257250, "epoch": 3099} {"train_loss": -25.581098556518555, "global_step": 257251, "epoch": 3099} {"train_loss": -24.951719284057617, "global_step": 257252, "epoch": 3099} {"train_loss": -25.02033042907715, "global_step": 257253, "epoch": 3099} {"train_loss": -25.002653121948242, "global_step": 257254, "epoch": 3099} {"train_loss": -25.37554359436035, "global_step": 257255, "epoch": 3099} {"train_loss": -24.936864852905273, "global_step": 257256, "epoch": 3099} {"train_loss": -24.9824161529541, "global_step": 257257, "epoch": 3099} {"train_loss": -25.177732467651367, "global_step": 257258, "epoch": 3099} {"train_loss": -25.13490867614746, "global_step": 257259, "epoch": 3099} {"train_loss": -25.343870162963867, "global_step": 257260, "epoch": 3099} {"train_loss": -25.111406326293945, "global_step": 257261, "epoch": 3099} {"train_loss": -25.522695541381836, "global_step": 257262, "epoch": 3099} {"train_loss": -25.440204620361328, "global_step": 257263, "epoch": 3099} {"train_loss": -25.319499969482422, "global_step": 257264, "epoch": 3099} {"train_loss": -25.342641830444336, "global_step": 257265, "epoch": 3099} {"train_loss": -25.33294105529785, "global_step": 257266, "epoch": 3099} {"train_loss": -25.219322204589844, "global_step": 257267, "epoch": 3099} {"train_loss": -25.61834716796875, "global_step": 257268, "epoch": 3099} {"train_loss": -25.23225975036621, "global_step": 257269, "epoch": 3099} {"train_loss": -25.153179168701172, "global_step": 257270, "epoch": 3099} {"train_loss": -25.553762435913086, "global_step": 257271, "epoch": 3099} {"train_loss": -24.739648818969727, "global_step": 257272, "epoch": 3099} {"train_loss": -24.976511001586914, "global_step": 257273, "epoch": 3099} {"train_loss": -25.022932052612305, "global_step": 257274, "epoch": 3099} {"train_loss": -25.062795639038086, "global_step": 257275, "epoch": 3099} {"train_loss": -25.027772903442383, "global_step": 257276, "epoch": 3099} {"train_loss": -25.26234245300293, "global_step": 257277, "epoch": 3099} {"train_loss": -25.120807647705078, "global_step": 257278, "epoch": 3099} {"train_loss": -25.271635055541992, "global_step": 257279, "epoch": 3099} {"train_loss": -25.31924819946289, "global_step": 257280, "epoch": 3099} {"train_loss": -24.970388412475586, "global_step": 257281, "epoch": 3099} {"train_loss": -24.890487670898438, "global_step": 257282, "epoch": 3099} {"train_loss": -24.98356819152832, "global_step": 257283, "epoch": 3099} {"train_loss": -25.180484771728516, "global_step": 257284, "epoch": 3099} {"train_loss": -25.513917922973633, "global_step": 257285, "epoch": 3099} {"train_loss": -25.45015525817871, "global_step": 257286, "epoch": 3099} {"train_loss": -25.023822784423828, "global_step": 257287, "epoch": 3099} {"train_loss": -24.933149337768555, "global_step": 257288, "epoch": 3099} {"train_loss": -25.55567169189453, "global_step": 257289, "epoch": 3099} {"train_loss": -25.185266494750977, "global_step": 257290, "epoch": 3099} {"train_loss": -25.106821060180664, "global_step": 257291, "epoch": 3099} {"train_loss": -25.610158920288086, "global_step": 257292, "epoch": 3099} {"train_loss": -25.231473922729492, "global_step": 257293, "epoch": 3099} {"train_loss": -25.111738204956055, "global_step": 257294, "epoch": 3099} {"train_loss": -25.335519790649414, "global_step": 257295, "epoch": 3099} {"train_loss": -25.147485733032227, "global_step": 257296, "epoch": 3099} {"train_loss": -25.4628849029541, "global_step": 257297, "epoch": 3099} {"train_loss": -25.564777374267578, "global_step": 257298, "epoch": 3099} {"train_loss": -25.103910928749176, "global_step": 257299, "epoch": 3099, "val_loss": 6890089.5} {"train_loss": -24.277883529663086, "global_step": 257300, "epoch": 3100} {"train_loss": -23.779306411743164, "global_step": 257301, "epoch": 3100} {"train_loss": -24.294729232788086, "global_step": 257302, "epoch": 3100} {"train_loss": -24.857839584350586, "global_step": 257303, "epoch": 3100} {"train_loss": -24.41097068786621, "global_step": 257304, "epoch": 3100} {"train_loss": -24.341642379760742, "global_step": 257305, "epoch": 3100} {"train_loss": -24.931547164916992, "global_step": 257306, "epoch": 3100} {"train_loss": -24.336570739746094, "global_step": 257307, "epoch": 3100} {"train_loss": -24.876739501953125, "global_step": 257308, "epoch": 3100} {"train_loss": -24.568265914916992, "global_step": 257309, "epoch": 3100} {"train_loss": -24.800870895385742, "global_step": 257310, "epoch": 3100} {"train_loss": -24.514089584350586, "global_step": 257311, "epoch": 3100} {"train_loss": -24.97381019592285, "global_step": 257312, "epoch": 3100} {"train_loss": -24.964149475097656, "global_step": 257313, "epoch": 3100} {"train_loss": -24.640625, "global_step": 257314, "epoch": 3100} {"train_loss": -25.125741958618164, "global_step": 257315, "epoch": 3100} {"train_loss": -24.982908248901367, "global_step": 257316, "epoch": 3100} {"train_loss": -25.344709396362305, "global_step": 257317, "epoch": 3100} {"train_loss": -25.085580825805664, "global_step": 257318, "epoch": 3100} {"train_loss": -25.172677993774414, "global_step": 257319, "epoch": 3100} {"train_loss": -24.9991397857666, "global_step": 257320, "epoch": 3100} {"train_loss": -24.892744064331055, "global_step": 257321, "epoch": 3100} {"train_loss": -25.046981811523438, "global_step": 257322, "epoch": 3100} {"train_loss": -24.883987426757812, "global_step": 257323, "epoch": 3100} {"train_loss": -24.901830673217773, "global_step": 257324, "epoch": 3100} {"train_loss": -25.007177352905273, "global_step": 257325, "epoch": 3100} {"train_loss": -25.17986488342285, "global_step": 257326, "epoch": 3100} {"train_loss": -24.883380889892578, "global_step": 257327, "epoch": 3100} {"train_loss": -25.1879940032959, "global_step": 257328, "epoch": 3100} {"train_loss": -25.0263729095459, "global_step": 257329, "epoch": 3100} {"train_loss": -24.951948165893555, "global_step": 257330, "epoch": 3100} {"train_loss": -25.233190536499023, "global_step": 257331, "epoch": 3100} {"train_loss": -25.119138717651367, "global_step": 257332, "epoch": 3100} {"train_loss": -25.15610694885254, "global_step": 257333, "epoch": 3100} {"train_loss": -25.058744430541992, "global_step": 257334, "epoch": 3100} {"train_loss": -24.918800354003906, "global_step": 257335, "epoch": 3100} {"train_loss": -24.962417602539062, "global_step": 257336, "epoch": 3100} {"train_loss": -25.1978702545166, "global_step": 257337, "epoch": 3100} {"train_loss": -25.164823532104492, "global_step": 257338, "epoch": 3100} {"train_loss": -25.046157836914062, "global_step": 257339, "epoch": 3100} {"train_loss": -25.31147575378418, "global_step": 257340, "epoch": 3100} {"train_loss": -25.36025619506836, "global_step": 257341, "epoch": 3100} {"train_loss": -25.207902908325195, "global_step": 257342, "epoch": 3100} {"train_loss": -25.434772491455078, "global_step": 257343, "epoch": 3100} {"train_loss": -25.012521743774414, "global_step": 257344, "epoch": 3100} {"train_loss": -25.529571533203125, "global_step": 257345, "epoch": 3100} {"train_loss": -25.633071899414062, "global_step": 257346, "epoch": 3100} {"train_loss": -25.426273345947266, "global_step": 257347, "epoch": 3100} {"train_loss": -25.165559768676758, "global_step": 257348, "epoch": 3100} {"train_loss": -25.31282615661621, "global_step": 257349, "epoch": 3100} {"train_loss": -25.311975479125977, "global_step": 257350, "epoch": 3100} {"train_loss": -25.31290054321289, "global_step": 257351, "epoch": 3100} {"train_loss": -25.080860137939453, "global_step": 257352, "epoch": 3100} {"train_loss": -25.228118896484375, "global_step": 257353, "epoch": 3100} {"train_loss": -25.025989532470703, "global_step": 257354, "epoch": 3100} {"train_loss": -25.17465591430664, "global_step": 257355, "epoch": 3100} {"train_loss": -24.829801559448242, "global_step": 257356, "epoch": 3100} {"train_loss": -25.48842430114746, "global_step": 257357, "epoch": 3100} {"train_loss": -25.03359031677246, "global_step": 257358, "epoch": 3100} {"train_loss": -25.561132431030273, "global_step": 257359, "epoch": 3100} {"train_loss": -24.927011489868164, "global_step": 257360, "epoch": 3100} {"train_loss": -25.067548751831055, "global_step": 257361, "epoch": 3100} {"train_loss": -24.60540771484375, "global_step": 257362, "epoch": 3100} {"train_loss": -24.707237243652344, "global_step": 257363, "epoch": 3100} {"train_loss": -24.304641723632812, "global_step": 257364, "epoch": 3100} {"train_loss": -24.075918197631836, "global_step": 257365, "epoch": 3100} {"train_loss": -23.896015167236328, "global_step": 257366, "epoch": 3100} {"train_loss": -24.97633171081543, "global_step": 257367, "epoch": 3100} {"train_loss": -25.08924674987793, "global_step": 257368, "epoch": 3100} {"train_loss": -24.957860946655273, "global_step": 257369, "epoch": 3100} {"train_loss": -24.960941314697266, "global_step": 257370, "epoch": 3100} {"train_loss": -24.67072868347168, "global_step": 257371, "epoch": 3100} {"train_loss": -25.07610511779785, "global_step": 257372, "epoch": 3100} {"train_loss": -25.225439071655273, "global_step": 257373, "epoch": 3100} {"train_loss": -25.25504493713379, "global_step": 257374, "epoch": 3100} {"train_loss": -25.03084373474121, "global_step": 257375, "epoch": 3100} {"train_loss": -25.314828872680664, "global_step": 257376, "epoch": 3100} {"train_loss": -25.092426300048828, "global_step": 257377, "epoch": 3100} {"train_loss": -24.78157615661621, "global_step": 257378, "epoch": 3100} {"train_loss": -25.021848678588867, "global_step": 257379, "epoch": 3100} {"train_loss": -25.086444854736328, "global_step": 257380, "epoch": 3100} {"train_loss": -25.010364532470703, "global_step": 257381, "epoch": 3100} {"train_loss": -24.983727995171606, "global_step": 257382, "epoch": 3100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6901887.5} {"train_loss": -24.788867950439453, "global_step": 257383, "epoch": 3101} {"train_loss": -24.802621841430664, "global_step": 257384, "epoch": 3101} {"train_loss": -24.709217071533203, "global_step": 257385, "epoch": 3101} {"train_loss": -25.070608139038086, "global_step": 257386, "epoch": 3101} {"train_loss": -24.577238082885742, "global_step": 257387, "epoch": 3101} {"train_loss": -24.586835861206055, "global_step": 257388, "epoch": 3101} {"train_loss": -24.59529685974121, "global_step": 257389, "epoch": 3101} {"train_loss": -24.451017379760742, "global_step": 257390, "epoch": 3101} {"train_loss": -24.673629760742188, "global_step": 257391, "epoch": 3101} {"train_loss": -24.537799835205078, "global_step": 257392, "epoch": 3101} {"train_loss": -24.690385818481445, "global_step": 257393, "epoch": 3101} {"train_loss": -24.540124893188477, "global_step": 257394, "epoch": 3101} {"train_loss": -25.165538787841797, "global_step": 257395, "epoch": 3101} {"train_loss": -25.002614974975586, "global_step": 257396, "epoch": 3101} {"train_loss": -24.969385147094727, "global_step": 257397, "epoch": 3101} {"train_loss": -24.99277114868164, "global_step": 257398, "epoch": 3101} {"train_loss": -24.619794845581055, "global_step": 257399, "epoch": 3101} {"train_loss": -25.129791259765625, "global_step": 257400, "epoch": 3101} {"train_loss": -25.21234130859375, "global_step": 257401, "epoch": 3101} {"train_loss": -25.392414093017578, "global_step": 257402, "epoch": 3101} {"train_loss": -25.27695083618164, "global_step": 257403, "epoch": 3101} {"train_loss": -25.12994384765625, "global_step": 257404, "epoch": 3101} {"train_loss": -24.980356216430664, "global_step": 257405, "epoch": 3101} {"train_loss": -24.85291862487793, "global_step": 257406, "epoch": 3101} {"train_loss": -25.54633903503418, "global_step": 257407, "epoch": 3101} {"train_loss": -25.198461532592773, "global_step": 257408, "epoch": 3101} {"train_loss": -25.240575790405273, "global_step": 257409, "epoch": 3101} {"train_loss": -25.230253219604492, "global_step": 257410, "epoch": 3101} {"train_loss": -25.111143112182617, "global_step": 257411, "epoch": 3101} {"train_loss": -25.118152618408203, "global_step": 257412, "epoch": 3101} {"train_loss": -25.09967613220215, "global_step": 257413, "epoch": 3101} {"train_loss": -25.181798934936523, "global_step": 257414, "epoch": 3101} {"train_loss": -25.050291061401367, "global_step": 257415, "epoch": 3101} {"train_loss": -25.353961944580078, "global_step": 257416, "epoch": 3101} {"train_loss": -25.278053283691406, "global_step": 257417, "epoch": 3101} {"train_loss": -25.25848960876465, "global_step": 257418, "epoch": 3101} {"train_loss": -25.57625389099121, "global_step": 257419, "epoch": 3101} {"train_loss": -25.365291595458984, "global_step": 257420, "epoch": 3101} {"train_loss": -25.59625816345215, "global_step": 257421, "epoch": 3101} {"train_loss": -25.456825256347656, "global_step": 257422, "epoch": 3101} {"train_loss": -25.6182918548584, "global_step": 257423, "epoch": 3101} {"train_loss": -25.125534057617188, "global_step": 257424, "epoch": 3101} {"train_loss": -25.33504295349121, "global_step": 257425, "epoch": 3101} {"train_loss": -25.2701473236084, "global_step": 257426, "epoch": 3101} {"train_loss": -25.525300979614258, "global_step": 257427, "epoch": 3101} {"train_loss": -24.94746971130371, "global_step": 257428, "epoch": 3101} {"train_loss": -24.963703155517578, "global_step": 257429, "epoch": 3101} {"train_loss": -25.3720645904541, "global_step": 257430, "epoch": 3101} {"train_loss": -25.015905380249023, "global_step": 257431, "epoch": 3101} {"train_loss": -25.155603408813477, "global_step": 257432, "epoch": 3101} {"train_loss": -25.463581085205078, "global_step": 257433, "epoch": 3101} {"train_loss": -25.141096115112305, "global_step": 257434, "epoch": 3101} {"train_loss": -24.815771102905273, "global_step": 257435, "epoch": 3101} {"train_loss": -25.209888458251953, "global_step": 257436, "epoch": 3101} {"train_loss": -25.033843994140625, "global_step": 257437, "epoch": 3101} {"train_loss": -25.033504486083984, "global_step": 257438, "epoch": 3101} {"train_loss": -24.843053817749023, "global_step": 257439, "epoch": 3101} {"train_loss": -25.069005966186523, "global_step": 257440, "epoch": 3101} {"train_loss": -25.578691482543945, "global_step": 257441, "epoch": 3101} {"train_loss": -25.11394500732422, "global_step": 257442, "epoch": 3101} {"train_loss": -24.556079864501953, "global_step": 257443, "epoch": 3101} {"train_loss": -24.526147842407227, "global_step": 257444, "epoch": 3101} {"train_loss": -25.1895751953125, "global_step": 257445, "epoch": 3101} {"train_loss": -24.99639892578125, "global_step": 257446, "epoch": 3101} {"train_loss": -25.10850715637207, "global_step": 257447, "epoch": 3101} {"train_loss": -24.900136947631836, "global_step": 257448, "epoch": 3101} {"train_loss": -25.47809410095215, "global_step": 257449, "epoch": 3101} {"train_loss": -25.1564884185791, "global_step": 257450, "epoch": 3101} {"train_loss": -25.137062072753906, "global_step": 257451, "epoch": 3101} {"train_loss": -25.018014907836914, "global_step": 257452, "epoch": 3101} {"train_loss": -25.220579147338867, "global_step": 257453, "epoch": 3101} {"train_loss": -25.099018096923828, "global_step": 257454, "epoch": 3101} {"train_loss": -24.851131439208984, "global_step": 257455, "epoch": 3101} {"train_loss": -25.19893455505371, "global_step": 257456, "epoch": 3101} {"train_loss": -24.988380432128906, "global_step": 257457, "epoch": 3101} {"train_loss": -25.04648208618164, "global_step": 257458, "epoch": 3101} {"train_loss": -25.110544204711914, "global_step": 257459, "epoch": 3101} {"train_loss": -25.254592895507812, "global_step": 257460, "epoch": 3101} {"train_loss": -25.305322647094727, "global_step": 257461, "epoch": 3101} {"train_loss": -25.26397132873535, "global_step": 257462, "epoch": 3101} {"train_loss": -25.09649658203125, "global_step": 257463, "epoch": 3101} {"train_loss": -25.19076919555664, "global_step": 257464, "epoch": 3101} {"train_loss": -25.05652073779738, "global_step": 257465, "epoch": 3101, "val_loss": 6991785.0} {"train_loss": -23.718000411987305, "global_step": 257466, "epoch": 3102} {"train_loss": -22.354026794433594, "global_step": 257467, "epoch": 3102} {"train_loss": -23.764312744140625, "global_step": 257468, "epoch": 3102} {"train_loss": -24.90992546081543, "global_step": 257469, "epoch": 3102} {"train_loss": -23.38547706604004, "global_step": 257470, "epoch": 3102} {"train_loss": -24.229381561279297, "global_step": 257471, "epoch": 3102} {"train_loss": -23.991531372070312, "global_step": 257472, "epoch": 3102} {"train_loss": -24.3001766204834, "global_step": 257473, "epoch": 3102} {"train_loss": -24.30596160888672, "global_step": 257474, "epoch": 3102} {"train_loss": -24.48231315612793, "global_step": 257475, "epoch": 3102} {"train_loss": -24.167587280273438, "global_step": 257476, "epoch": 3102} {"train_loss": -24.872989654541016, "global_step": 257477, "epoch": 3102} {"train_loss": -24.667266845703125, "global_step": 257478, "epoch": 3102} {"train_loss": -24.668413162231445, "global_step": 257479, "epoch": 3102} {"train_loss": -24.40484046936035, "global_step": 257480, "epoch": 3102} {"train_loss": -24.34222412109375, "global_step": 257481, "epoch": 3102} {"train_loss": -24.407690048217773, "global_step": 257482, "epoch": 3102} {"train_loss": -24.773202896118164, "global_step": 257483, "epoch": 3102} {"train_loss": -24.3819522857666, "global_step": 257484, "epoch": 3102} {"train_loss": -24.689393997192383, "global_step": 257485, "epoch": 3102} {"train_loss": -24.647180557250977, "global_step": 257486, "epoch": 3102} {"train_loss": -24.579919815063477, "global_step": 257487, "epoch": 3102} {"train_loss": -24.622638702392578, "global_step": 257488, "epoch": 3102} {"train_loss": -24.641687393188477, "global_step": 257489, "epoch": 3102} {"train_loss": -24.724529266357422, "global_step": 257490, "epoch": 3102} {"train_loss": -24.73658561706543, "global_step": 257491, "epoch": 3102} {"train_loss": -24.716123580932617, "global_step": 257492, "epoch": 3102} {"train_loss": -24.992799758911133, "global_step": 257493, "epoch": 3102} {"train_loss": -24.999753952026367, "global_step": 257494, "epoch": 3102} {"train_loss": -25.001848220825195, "global_step": 257495, "epoch": 3102} {"train_loss": -24.847734451293945, "global_step": 257496, "epoch": 3102} {"train_loss": -24.741994857788086, "global_step": 257497, "epoch": 3102} {"train_loss": -25.125747680664062, "global_step": 257498, "epoch": 3102} {"train_loss": -25.5113525390625, "global_step": 257499, "epoch": 3102} {"train_loss": -25.383079528808594, "global_step": 257500, "epoch": 3102} {"train_loss": -24.99005889892578, "global_step": 257501, "epoch": 3102} {"train_loss": -25.03093910217285, "global_step": 257502, "epoch": 3102} {"train_loss": -24.843048095703125, "global_step": 257503, "epoch": 3102} {"train_loss": -25.03270721435547, "global_step": 257504, "epoch": 3102} {"train_loss": -25.346235275268555, "global_step": 257505, "epoch": 3102} {"train_loss": -25.150598526000977, "global_step": 257506, "epoch": 3102} {"train_loss": -25.163593292236328, "global_step": 257507, "epoch": 3102} {"train_loss": -25.302785873413086, "global_step": 257508, "epoch": 3102} {"train_loss": -25.240859985351562, "global_step": 257509, "epoch": 3102} {"train_loss": -25.239501953125, "global_step": 257510, "epoch": 3102} {"train_loss": -25.071224212646484, "global_step": 257511, "epoch": 3102} {"train_loss": -24.978731155395508, "global_step": 257512, "epoch": 3102} {"train_loss": -25.6363468170166, "global_step": 257513, "epoch": 3102} {"train_loss": -25.283021926879883, "global_step": 257514, "epoch": 3102} {"train_loss": -25.420913696289062, "global_step": 257515, "epoch": 3102} {"train_loss": -25.601547241210938, "global_step": 257516, "epoch": 3102} {"train_loss": -24.98651695251465, "global_step": 257517, "epoch": 3102} {"train_loss": -25.296649932861328, "global_step": 257518, "epoch": 3102} {"train_loss": -24.777801513671875, "global_step": 257519, "epoch": 3102} {"train_loss": -25.235116958618164, "global_step": 257520, "epoch": 3102} {"train_loss": -25.1187801361084, "global_step": 257521, "epoch": 3102} {"train_loss": -24.93672752380371, "global_step": 257522, "epoch": 3102} {"train_loss": -24.861560821533203, "global_step": 257523, "epoch": 3102} {"train_loss": -25.46918487548828, "global_step": 257524, "epoch": 3102} {"train_loss": -25.539596557617188, "global_step": 257525, "epoch": 3102} {"train_loss": -25.212934494018555, "global_step": 257526, "epoch": 3102} {"train_loss": -24.94853401184082, "global_step": 257527, "epoch": 3102} {"train_loss": -25.14019012451172, "global_step": 257528, "epoch": 3102} {"train_loss": -24.626676559448242, "global_step": 257529, "epoch": 3102} {"train_loss": -24.962966918945312, "global_step": 257530, "epoch": 3102} {"train_loss": -24.945714950561523, "global_step": 257531, "epoch": 3102} {"train_loss": -25.374038696289062, "global_step": 257532, "epoch": 3102} {"train_loss": -25.179630279541016, "global_step": 257533, "epoch": 3102} {"train_loss": -25.12778663635254, "global_step": 257534, "epoch": 3102} {"train_loss": -24.9107723236084, "global_step": 257535, "epoch": 3102} {"train_loss": -25.195531845092773, "global_step": 257536, "epoch": 3102} {"train_loss": -25.16697120666504, "global_step": 257537, "epoch": 3102} {"train_loss": -25.27260398864746, "global_step": 257538, "epoch": 3102} {"train_loss": -24.92705535888672, "global_step": 257539, "epoch": 3102} {"train_loss": -25.145374298095703, "global_step": 257540, "epoch": 3102} {"train_loss": -25.151073455810547, "global_step": 257541, "epoch": 3102} {"train_loss": -24.947223663330078, "global_step": 257542, "epoch": 3102} {"train_loss": -25.168527603149414, "global_step": 257543, "epoch": 3102} {"train_loss": -24.987823486328125, "global_step": 257544, "epoch": 3102} {"train_loss": -24.633331298828125, "global_step": 257545, "epoch": 3102} {"train_loss": -25.179946899414062, "global_step": 257546, "epoch": 3102} {"train_loss": -25.286331176757812, "global_step": 257547, "epoch": 3102} {"train_loss": -24.87148466454931, "global_step": 257548, "epoch": 3102, "val_loss": 6833155.0} {"train_loss": -25.157461166381836, "global_step": 257549, "epoch": 3103} {"train_loss": -24.838716506958008, "global_step": 257550, "epoch": 3103} {"train_loss": -24.59978675842285, "global_step": 257551, "epoch": 3103} {"train_loss": -25.04269790649414, "global_step": 257552, "epoch": 3103} {"train_loss": -24.969970703125, "global_step": 257553, "epoch": 3103} {"train_loss": -25.12250328063965, "global_step": 257554, "epoch": 3103} {"train_loss": -25.12900733947754, "global_step": 257555, "epoch": 3103} {"train_loss": -24.6295108795166, "global_step": 257556, "epoch": 3103} {"train_loss": -24.7114315032959, "global_step": 257557, "epoch": 3103} {"train_loss": -25.095245361328125, "global_step": 257558, "epoch": 3103} {"train_loss": -24.81586265563965, "global_step": 257559, "epoch": 3103} {"train_loss": -25.164169311523438, "global_step": 257560, "epoch": 3103} {"train_loss": -25.048898696899414, "global_step": 257561, "epoch": 3103} {"train_loss": -25.376632690429688, "global_step": 257562, "epoch": 3103} {"train_loss": -25.376718521118164, "global_step": 257563, "epoch": 3103} {"train_loss": -24.954660415649414, "global_step": 257564, "epoch": 3103} {"train_loss": -24.719236373901367, "global_step": 257565, "epoch": 3103} {"train_loss": -25.644956588745117, "global_step": 257566, "epoch": 3103} {"train_loss": -25.10023307800293, "global_step": 257567, "epoch": 3103} {"train_loss": -25.092639923095703, "global_step": 257568, "epoch": 3103} {"train_loss": -25.276708602905273, "global_step": 257569, "epoch": 3103} {"train_loss": -25.177892684936523, "global_step": 257570, "epoch": 3103} {"train_loss": -25.183557510375977, "global_step": 257571, "epoch": 3103} {"train_loss": -25.253881454467773, "global_step": 257572, "epoch": 3103} {"train_loss": -25.04810905456543, "global_step": 257573, "epoch": 3103} {"train_loss": -25.08550453186035, "global_step": 257574, "epoch": 3103} {"train_loss": -25.039737701416016, "global_step": 257575, "epoch": 3103} {"train_loss": -25.47446060180664, "global_step": 257576, "epoch": 3103} {"train_loss": -24.798954010009766, "global_step": 257577, "epoch": 3103} {"train_loss": -25.334455490112305, "global_step": 257578, "epoch": 3103} {"train_loss": -24.930761337280273, "global_step": 257579, "epoch": 3103} {"train_loss": -25.30531883239746, "global_step": 257580, "epoch": 3103} {"train_loss": -24.829837799072266, "global_step": 257581, "epoch": 3103} {"train_loss": -25.122465133666992, "global_step": 257582, "epoch": 3103} {"train_loss": -25.268320083618164, "global_step": 257583, "epoch": 3103} {"train_loss": -25.341232299804688, "global_step": 257584, "epoch": 3103} {"train_loss": -25.280675888061523, "global_step": 257585, "epoch": 3103} {"train_loss": -25.373458862304688, "global_step": 257586, "epoch": 3103} {"train_loss": -25.25469970703125, "global_step": 257587, "epoch": 3103} {"train_loss": -25.30423927307129, "global_step": 257588, "epoch": 3103} {"train_loss": -25.06793212890625, "global_step": 257589, "epoch": 3103} {"train_loss": -25.347095489501953, "global_step": 257590, "epoch": 3103} {"train_loss": -25.131460189819336, "global_step": 257591, "epoch": 3103} {"train_loss": -25.332624435424805, "global_step": 257592, "epoch": 3103} {"train_loss": -25.238744735717773, "global_step": 257593, "epoch": 3103} {"train_loss": -25.203596115112305, "global_step": 257594, "epoch": 3103} {"train_loss": -25.387704849243164, "global_step": 257595, "epoch": 3103} {"train_loss": -25.234844207763672, "global_step": 257596, "epoch": 3103} {"train_loss": -25.238426208496094, "global_step": 257597, "epoch": 3103} {"train_loss": -25.215864181518555, "global_step": 257598, "epoch": 3103} {"train_loss": -25.28230094909668, "global_step": 257599, "epoch": 3103} {"train_loss": -25.561140060424805, "global_step": 257600, "epoch": 3103} {"train_loss": -24.7753849029541, "global_step": 257601, "epoch": 3103} {"train_loss": -25.012243270874023, "global_step": 257602, "epoch": 3103} {"train_loss": -25.69891929626465, "global_step": 257603, "epoch": 3103} {"train_loss": -25.327192306518555, "global_step": 257604, "epoch": 3103} {"train_loss": -25.230703353881836, "global_step": 257605, "epoch": 3103} {"train_loss": -25.252685546875, "global_step": 257606, "epoch": 3103} {"train_loss": -25.367284774780273, "global_step": 257607, "epoch": 3103} {"train_loss": -25.13126564025879, "global_step": 257608, "epoch": 3103} {"train_loss": -25.428251266479492, "global_step": 257609, "epoch": 3103} {"train_loss": -25.01518440246582, "global_step": 257610, "epoch": 3103} {"train_loss": -25.2878360748291, "global_step": 257611, "epoch": 3103} {"train_loss": -25.23040771484375, "global_step": 257612, "epoch": 3103} {"train_loss": -25.483169555664062, "global_step": 257613, "epoch": 3103} {"train_loss": -25.209680557250977, "global_step": 257614, "epoch": 3103} {"train_loss": -25.626489639282227, "global_step": 257615, "epoch": 3103} {"train_loss": -25.02448844909668, "global_step": 257616, "epoch": 3103} {"train_loss": -25.338775634765625, "global_step": 257617, "epoch": 3103} {"train_loss": -25.56435203552246, "global_step": 257618, "epoch": 3103} {"train_loss": -25.234895706176758, "global_step": 257619, "epoch": 3103} {"train_loss": -24.695831298828125, "global_step": 257620, "epoch": 3103} {"train_loss": -24.06060028076172, "global_step": 257621, "epoch": 3103} {"train_loss": -23.477500915527344, "global_step": 257622, "epoch": 3103} {"train_loss": -24.44999885559082, "global_step": 257623, "epoch": 3103} {"train_loss": -25.193140029907227, "global_step": 257624, "epoch": 3103} {"train_loss": -24.836050033569336, "global_step": 257625, "epoch": 3103} {"train_loss": -24.655887603759766, "global_step": 257626, "epoch": 3103} {"train_loss": -24.676599502563477, "global_step": 257627, "epoch": 3103} {"train_loss": -24.31085777282715, "global_step": 257628, "epoch": 3103} {"train_loss": -24.71746063232422, "global_step": 257629, "epoch": 3103} {"train_loss": -24.49253273010254, "global_step": 257630, "epoch": 3103} {"train_loss": -25.090328974896167, "global_step": 257631, "epoch": 3103, "val_loss": 7054667.5} {"train_loss": -22.896642684936523, "global_step": 257632, "epoch": 3104} {"train_loss": -22.611820220947266, "global_step": 257633, "epoch": 3104} {"train_loss": -23.16415786743164, "global_step": 257634, "epoch": 3104} {"train_loss": -23.637170791625977, "global_step": 257635, "epoch": 3104} {"train_loss": -23.860074996948242, "global_step": 257636, "epoch": 3104} {"train_loss": -24.144346237182617, "global_step": 257637, "epoch": 3104} {"train_loss": -24.10725975036621, "global_step": 257638, "epoch": 3104} {"train_loss": -23.839845657348633, "global_step": 257639, "epoch": 3104} {"train_loss": -24.547300338745117, "global_step": 257640, "epoch": 3104} {"train_loss": -24.134695053100586, "global_step": 257641, "epoch": 3104} {"train_loss": -24.429304122924805, "global_step": 257642, "epoch": 3104} {"train_loss": -24.60109519958496, "global_step": 257643, "epoch": 3104} {"train_loss": -24.386442184448242, "global_step": 257644, "epoch": 3104} {"train_loss": -24.330495834350586, "global_step": 257645, "epoch": 3104} {"train_loss": -24.66302490234375, "global_step": 257646, "epoch": 3104} {"train_loss": -24.38568115234375, "global_step": 257647, "epoch": 3104} {"train_loss": -24.586292266845703, "global_step": 257648, "epoch": 3104} {"train_loss": -24.532968521118164, "global_step": 257649, "epoch": 3104} {"train_loss": -24.599252700805664, "global_step": 257650, "epoch": 3104} {"train_loss": -24.813650131225586, "global_step": 257651, "epoch": 3104} {"train_loss": -24.677406311035156, "global_step": 257652, "epoch": 3104} {"train_loss": -24.787734985351562, "global_step": 257653, "epoch": 3104} {"train_loss": -24.725854873657227, "global_step": 257654, "epoch": 3104} {"train_loss": -25.09009552001953, "global_step": 257655, "epoch": 3104} {"train_loss": -24.932254791259766, "global_step": 257656, "epoch": 3104} {"train_loss": -24.874038696289062, "global_step": 257657, "epoch": 3104} {"train_loss": -24.957962036132812, "global_step": 257658, "epoch": 3104} {"train_loss": -24.863140106201172, "global_step": 257659, "epoch": 3104} {"train_loss": -24.8115234375, "global_step": 257660, "epoch": 3104} {"train_loss": -25.084394454956055, "global_step": 257661, "epoch": 3104} {"train_loss": -25.030426025390625, "global_step": 257662, "epoch": 3104} {"train_loss": -24.799665451049805, "global_step": 257663, "epoch": 3104} {"train_loss": -24.809614181518555, "global_step": 257664, "epoch": 3104} {"train_loss": -24.957897186279297, "global_step": 257665, "epoch": 3104} {"train_loss": -25.092443466186523, "global_step": 257666, "epoch": 3104} {"train_loss": -24.922740936279297, "global_step": 257667, "epoch": 3104} {"train_loss": -25.252580642700195, "global_step": 257668, "epoch": 3104} {"train_loss": -25.104934692382812, "global_step": 257669, "epoch": 3104} {"train_loss": -25.118925094604492, "global_step": 257670, "epoch": 3104} {"train_loss": -24.861188888549805, "global_step": 257671, "epoch": 3104} {"train_loss": -25.19896125793457, "global_step": 257672, "epoch": 3104} {"train_loss": -24.99519157409668, "global_step": 257673, "epoch": 3104} {"train_loss": -25.07052230834961, "global_step": 257674, "epoch": 3104} {"train_loss": -25.315048217773438, "global_step": 257675, "epoch": 3104} {"train_loss": -25.35220718383789, "global_step": 257676, "epoch": 3104} {"train_loss": -25.373409271240234, "global_step": 257677, "epoch": 3104} {"train_loss": -24.851621627807617, "global_step": 257678, "epoch": 3104} {"train_loss": -24.94930076599121, "global_step": 257679, "epoch": 3104} {"train_loss": -25.312856674194336, "global_step": 257680, "epoch": 3104} {"train_loss": -25.388046264648438, "global_step": 257681, "epoch": 3104} {"train_loss": -25.642118453979492, "global_step": 257682, "epoch": 3104} {"train_loss": -25.0715389251709, "global_step": 257683, "epoch": 3104} {"train_loss": -25.12799072265625, "global_step": 257684, "epoch": 3104} {"train_loss": -25.114774703979492, "global_step": 257685, "epoch": 3104} {"train_loss": -25.23481559753418, "global_step": 257686, "epoch": 3104} {"train_loss": -25.004501342773438, "global_step": 257687, "epoch": 3104} {"train_loss": -25.418411254882812, "global_step": 257688, "epoch": 3104} {"train_loss": -25.121442794799805, "global_step": 257689, "epoch": 3104} {"train_loss": -25.141925811767578, "global_step": 257690, "epoch": 3104} {"train_loss": -25.227508544921875, "global_step": 257691, "epoch": 3104} {"train_loss": -24.842185974121094, "global_step": 257692, "epoch": 3104} {"train_loss": -24.795942306518555, "global_step": 257693, "epoch": 3104} {"train_loss": -24.699338912963867, "global_step": 257694, "epoch": 3104} {"train_loss": -25.172758102416992, "global_step": 257695, "epoch": 3104} {"train_loss": -25.01337242126465, "global_step": 257696, "epoch": 3104} {"train_loss": -24.93377113342285, "global_step": 257697, "epoch": 3104} {"train_loss": -25.303756713867188, "global_step": 257698, "epoch": 3104} {"train_loss": -25.200841903686523, "global_step": 257699, "epoch": 3104} {"train_loss": -25.077341079711914, "global_step": 257700, "epoch": 3104} {"train_loss": -25.038532257080078, "global_step": 257701, "epoch": 3104} {"train_loss": -25.35973358154297, "global_step": 257702, "epoch": 3104} {"train_loss": -24.80900001525879, "global_step": 257703, "epoch": 3104} {"train_loss": -24.99573516845703, "global_step": 257704, "epoch": 3104} {"train_loss": -25.140615463256836, "global_step": 257705, "epoch": 3104} {"train_loss": -24.577484130859375, "global_step": 257706, "epoch": 3104} {"train_loss": -24.906431198120117, "global_step": 257707, "epoch": 3104} {"train_loss": -25.05483055114746, "global_step": 257708, "epoch": 3104} {"train_loss": -25.204267501831055, "global_step": 257709, "epoch": 3104} {"train_loss": -24.916950225830078, "global_step": 257710, "epoch": 3104} {"train_loss": -25.131389617919922, "global_step": 257711, "epoch": 3104} {"train_loss": -25.125263214111328, "global_step": 257712, "epoch": 3104} {"train_loss": -25.036672592163086, "global_step": 257713, "epoch": 3104} {"train_loss": -24.829478849847632, "global_step": 257714, "epoch": 3104, "val_loss": 6784245.0} {"train_loss": -25.174564361572266, "global_step": 257715, "epoch": 3105} {"train_loss": -24.897504806518555, "global_step": 257716, "epoch": 3105} {"train_loss": -24.97113037109375, "global_step": 257717, "epoch": 3105} {"train_loss": -24.35312843322754, "global_step": 257718, "epoch": 3105} {"train_loss": -24.996728897094727, "global_step": 257719, "epoch": 3105} {"train_loss": -24.833375930786133, "global_step": 257720, "epoch": 3105} {"train_loss": -24.69784927368164, "global_step": 257721, "epoch": 3105} {"train_loss": -24.6712589263916, "global_step": 257722, "epoch": 3105} {"train_loss": -24.734146118164062, "global_step": 257723, "epoch": 3105} {"train_loss": -24.916900634765625, "global_step": 257724, "epoch": 3105} {"train_loss": -24.629621505737305, "global_step": 257725, "epoch": 3105} {"train_loss": -24.689001083374023, "global_step": 257726, "epoch": 3105} {"train_loss": -25.065990447998047, "global_step": 257727, "epoch": 3105} {"train_loss": -24.864133834838867, "global_step": 257728, "epoch": 3105} {"train_loss": -24.84737205505371, "global_step": 257729, "epoch": 3105} {"train_loss": -25.133520126342773, "global_step": 257730, "epoch": 3105} {"train_loss": -25.018680572509766, "global_step": 257731, "epoch": 3105} {"train_loss": -25.090879440307617, "global_step": 257732, "epoch": 3105} {"train_loss": -24.88819694519043, "global_step": 257733, "epoch": 3105} {"train_loss": -25.14272689819336, "global_step": 257734, "epoch": 3105} {"train_loss": -24.97309684753418, "global_step": 257735, "epoch": 3105} {"train_loss": -25.165536880493164, "global_step": 257736, "epoch": 3105} {"train_loss": -24.845548629760742, "global_step": 257737, "epoch": 3105} {"train_loss": -25.14727783203125, "global_step": 257738, "epoch": 3105} {"train_loss": -24.994770050048828, "global_step": 257739, "epoch": 3105} {"train_loss": -25.3394775390625, "global_step": 257740, "epoch": 3105} {"train_loss": -25.198211669921875, "global_step": 257741, "epoch": 3105} {"train_loss": -24.830585479736328, "global_step": 257742, "epoch": 3105} {"train_loss": -25.089920043945312, "global_step": 257743, "epoch": 3105} {"train_loss": -24.921825408935547, "global_step": 257744, "epoch": 3105} {"train_loss": -25.346038818359375, "global_step": 257745, "epoch": 3105} {"train_loss": -25.553333282470703, "global_step": 257746, "epoch": 3105} {"train_loss": -25.237876892089844, "global_step": 257747, "epoch": 3105} {"train_loss": -25.27761459350586, "global_step": 257748, "epoch": 3105} {"train_loss": -25.289487838745117, "global_step": 257749, "epoch": 3105} {"train_loss": -25.227407455444336, "global_step": 257750, "epoch": 3105} {"train_loss": -25.10525131225586, "global_step": 257751, "epoch": 3105} {"train_loss": -25.315622329711914, "global_step": 257752, "epoch": 3105} {"train_loss": -25.087749481201172, "global_step": 257753, "epoch": 3105} {"train_loss": -25.372879028320312, "global_step": 257754, "epoch": 3105} {"train_loss": -24.748271942138672, "global_step": 257755, "epoch": 3105} {"train_loss": -25.261438369750977, "global_step": 257756, "epoch": 3105} {"train_loss": -25.34967803955078, "global_step": 257757, "epoch": 3105} {"train_loss": -25.192325592041016, "global_step": 257758, "epoch": 3105} {"train_loss": -25.217941284179688, "global_step": 257759, "epoch": 3105} {"train_loss": -25.0015869140625, "global_step": 257760, "epoch": 3105} {"train_loss": -25.18532943725586, "global_step": 257761, "epoch": 3105} {"train_loss": -25.18259048461914, "global_step": 257762, "epoch": 3105} {"train_loss": -25.46675682067871, "global_step": 257763, "epoch": 3105} {"train_loss": -25.125457763671875, "global_step": 257764, "epoch": 3105} {"train_loss": -24.592533111572266, "global_step": 257765, "epoch": 3105} {"train_loss": -25.39674186706543, "global_step": 257766, "epoch": 3105} {"train_loss": -24.686599731445312, "global_step": 257767, "epoch": 3105} {"train_loss": -24.513715744018555, "global_step": 257768, "epoch": 3105} {"train_loss": -24.748083114624023, "global_step": 257769, "epoch": 3105} {"train_loss": -24.894193649291992, "global_step": 257770, "epoch": 3105} {"train_loss": -24.90279769897461, "global_step": 257771, "epoch": 3105} {"train_loss": -24.954315185546875, "global_step": 257772, "epoch": 3105} {"train_loss": -25.175914764404297, "global_step": 257773, "epoch": 3105} {"train_loss": -25.297893524169922, "global_step": 257774, "epoch": 3105} {"train_loss": -24.625957489013672, "global_step": 257775, "epoch": 3105} {"train_loss": -25.17203712463379, "global_step": 257776, "epoch": 3105} {"train_loss": -24.908096313476562, "global_step": 257777, "epoch": 3105} {"train_loss": -25.10389518737793, "global_step": 257778, "epoch": 3105} {"train_loss": -25.061498641967773, "global_step": 257779, "epoch": 3105} {"train_loss": -24.927953720092773, "global_step": 257780, "epoch": 3105} {"train_loss": -25.03142738342285, "global_step": 257781, "epoch": 3105} {"train_loss": -24.858774185180664, "global_step": 257782, "epoch": 3105} {"train_loss": -24.91328239440918, "global_step": 257783, "epoch": 3105} {"train_loss": -24.799884796142578, "global_step": 257784, "epoch": 3105} {"train_loss": -25.244155883789062, "global_step": 257785, "epoch": 3105} {"train_loss": -25.253934860229492, "global_step": 257786, "epoch": 3105} {"train_loss": -25.13104820251465, "global_step": 257787, "epoch": 3105} {"train_loss": -25.065427780151367, "global_step": 257788, "epoch": 3105} {"train_loss": -25.284515380859375, "global_step": 257789, "epoch": 3105} {"train_loss": -25.11760902404785, "global_step": 257790, "epoch": 3105} {"train_loss": -25.08466148376465, "global_step": 257791, "epoch": 3105} {"train_loss": -25.191930770874023, "global_step": 257792, "epoch": 3105} {"train_loss": -24.845489501953125, "global_step": 257793, "epoch": 3105} {"train_loss": -25.017484664916992, "global_step": 257794, "epoch": 3105} {"train_loss": -24.746124267578125, "global_step": 257795, "epoch": 3105} {"train_loss": -24.884347915649414, "global_step": 257796, "epoch": 3105} {"train_loss": -25.015806565801782, "global_step": 257797, "epoch": 3105, "val_loss": 6913807.0} {"train_loss": -24.676076889038086, "global_step": 257798, "epoch": 3106} {"train_loss": -24.62318992614746, "global_step": 257799, "epoch": 3106} {"train_loss": -24.55647850036621, "global_step": 257800, "epoch": 3106} {"train_loss": -24.86117935180664, "global_step": 257801, "epoch": 3106} {"train_loss": -24.295433044433594, "global_step": 257802, "epoch": 3106} {"train_loss": -24.06146240234375, "global_step": 257803, "epoch": 3106} {"train_loss": -24.909814834594727, "global_step": 257804, "epoch": 3106} {"train_loss": -24.676122665405273, "global_step": 257805, "epoch": 3106} {"train_loss": -24.007795333862305, "global_step": 257806, "epoch": 3106} {"train_loss": -24.78152084350586, "global_step": 257807, "epoch": 3106} {"train_loss": -24.49068260192871, "global_step": 257808, "epoch": 3106} {"train_loss": -25.07535743713379, "global_step": 257809, "epoch": 3106} {"train_loss": -25.083438873291016, "global_step": 257810, "epoch": 3106} {"train_loss": -24.53522300720215, "global_step": 257811, "epoch": 3106} {"train_loss": -25.032968521118164, "global_step": 257812, "epoch": 3106} {"train_loss": -24.81719970703125, "global_step": 257813, "epoch": 3106} {"train_loss": -25.030807495117188, "global_step": 257814, "epoch": 3106} {"train_loss": -24.847003936767578, "global_step": 257815, "epoch": 3106} {"train_loss": -24.8407039642334, "global_step": 257816, "epoch": 3106} {"train_loss": -25.023466110229492, "global_step": 257817, "epoch": 3106} {"train_loss": -25.00188636779785, "global_step": 257818, "epoch": 3106} {"train_loss": -25.08350944519043, "global_step": 257819, "epoch": 3106} {"train_loss": -25.503477096557617, "global_step": 257820, "epoch": 3106} {"train_loss": -25.063060760498047, "global_step": 257821, "epoch": 3106} {"train_loss": -25.5201358795166, "global_step": 257822, "epoch": 3106} {"train_loss": -24.74159812927246, "global_step": 257823, "epoch": 3106} {"train_loss": -25.156524658203125, "global_step": 257824, "epoch": 3106} {"train_loss": -25.385244369506836, "global_step": 257825, "epoch": 3106} {"train_loss": -24.64027214050293, "global_step": 257826, "epoch": 3106} {"train_loss": -25.19746971130371, "global_step": 257827, "epoch": 3106} {"train_loss": -25.228174209594727, "global_step": 257828, "epoch": 3106} {"train_loss": -25.308324813842773, "global_step": 257829, "epoch": 3106} {"train_loss": -24.943058013916016, "global_step": 257830, "epoch": 3106} {"train_loss": -25.134178161621094, "global_step": 257831, "epoch": 3106} {"train_loss": -25.1402587890625, "global_step": 257832, "epoch": 3106} {"train_loss": -25.33600425720215, "global_step": 257833, "epoch": 3106} {"train_loss": -24.918439865112305, "global_step": 257834, "epoch": 3106} {"train_loss": -25.053409576416016, "global_step": 257835, "epoch": 3106} {"train_loss": -25.172443389892578, "global_step": 257836, "epoch": 3106} {"train_loss": -25.368450164794922, "global_step": 257837, "epoch": 3106} {"train_loss": -24.92762565612793, "global_step": 257838, "epoch": 3106} {"train_loss": -25.372989654541016, "global_step": 257839, "epoch": 3106} {"train_loss": -24.91189956665039, "global_step": 257840, "epoch": 3106} {"train_loss": -25.254865646362305, "global_step": 257841, "epoch": 3106} {"train_loss": -25.173131942749023, "global_step": 257842, "epoch": 3106} {"train_loss": -25.515975952148438, "global_step": 257843, "epoch": 3106} {"train_loss": -25.45556640625, "global_step": 257844, "epoch": 3106} {"train_loss": -25.17995262145996, "global_step": 257845, "epoch": 3106} {"train_loss": -25.387130737304688, "global_step": 257846, "epoch": 3106} {"train_loss": -25.07911491394043, "global_step": 257847, "epoch": 3106} {"train_loss": -25.423114776611328, "global_step": 257848, "epoch": 3106} {"train_loss": -25.38654327392578, "global_step": 257849, "epoch": 3106} {"train_loss": -25.213285446166992, "global_step": 257850, "epoch": 3106} {"train_loss": -24.936670303344727, "global_step": 257851, "epoch": 3106} {"train_loss": -25.301469802856445, "global_step": 257852, "epoch": 3106} {"train_loss": -25.01325035095215, "global_step": 257853, "epoch": 3106} {"train_loss": -25.529905319213867, "global_step": 257854, "epoch": 3106} {"train_loss": -25.164335250854492, "global_step": 257855, "epoch": 3106} {"train_loss": -25.101465225219727, "global_step": 257856, "epoch": 3106} {"train_loss": -25.272035598754883, "global_step": 257857, "epoch": 3106} {"train_loss": -25.209253311157227, "global_step": 257858, "epoch": 3106} {"train_loss": -25.062292098999023, "global_step": 257859, "epoch": 3106} {"train_loss": -25.55782127380371, "global_step": 257860, "epoch": 3106} {"train_loss": -25.185108184814453, "global_step": 257861, "epoch": 3106} {"train_loss": -25.380834579467773, "global_step": 257862, "epoch": 3106} {"train_loss": -25.154632568359375, "global_step": 257863, "epoch": 3106} {"train_loss": -24.811199188232422, "global_step": 257864, "epoch": 3106} {"train_loss": -24.80695915222168, "global_step": 257865, "epoch": 3106} {"train_loss": -24.618925094604492, "global_step": 257866, "epoch": 3106} {"train_loss": -25.14832878112793, "global_step": 257867, "epoch": 3106} {"train_loss": -24.9565372467041, "global_step": 257868, "epoch": 3106} {"train_loss": -25.006542205810547, "global_step": 257869, "epoch": 3106} {"train_loss": -24.964466094970703, "global_step": 257870, "epoch": 3106} {"train_loss": -25.02578353881836, "global_step": 257871, "epoch": 3106} {"train_loss": -24.756494522094727, "global_step": 257872, "epoch": 3106} {"train_loss": -24.99276351928711, "global_step": 257873, "epoch": 3106} {"train_loss": -24.82756996154785, "global_step": 257874, "epoch": 3106} {"train_loss": -25.145605087280273, "global_step": 257875, "epoch": 3106} {"train_loss": -25.270614624023438, "global_step": 257876, "epoch": 3106} {"train_loss": -24.94306755065918, "global_step": 257877, "epoch": 3106} {"train_loss": -25.252546310424805, "global_step": 257878, "epoch": 3106} {"train_loss": -25.441120147705078, "global_step": 257879, "epoch": 3106} {"train_loss": -25.048363995839313, "global_step": 257880, "epoch": 3106, "val_loss": 6927352.0} {"train_loss": -24.687768936157227, "global_step": 257881, "epoch": 3107} {"train_loss": -24.97938346862793, "global_step": 257882, "epoch": 3107} {"train_loss": -24.981393814086914, "global_step": 257883, "epoch": 3107} {"train_loss": -24.912294387817383, "global_step": 257884, "epoch": 3107} {"train_loss": -25.16061782836914, "global_step": 257885, "epoch": 3107} {"train_loss": -25.086441040039062, "global_step": 257886, "epoch": 3107} {"train_loss": -24.929182052612305, "global_step": 257887, "epoch": 3107} {"train_loss": -24.819988250732422, "global_step": 257888, "epoch": 3107} {"train_loss": -25.145828247070312, "global_step": 257889, "epoch": 3107} {"train_loss": -24.7742862701416, "global_step": 257890, "epoch": 3107} {"train_loss": -24.853759765625, "global_step": 257891, "epoch": 3107} {"train_loss": -25.152359008789062, "global_step": 257892, "epoch": 3107} {"train_loss": -24.93747901916504, "global_step": 257893, "epoch": 3107} {"train_loss": -24.841373443603516, "global_step": 257894, "epoch": 3107} {"train_loss": -24.994691848754883, "global_step": 257895, "epoch": 3107} {"train_loss": -24.911672592163086, "global_step": 257896, "epoch": 3107} {"train_loss": -24.92041778564453, "global_step": 257897, "epoch": 3107} {"train_loss": -25.01595115661621, "global_step": 257898, "epoch": 3107} {"train_loss": -25.333295822143555, "global_step": 257899, "epoch": 3107} {"train_loss": -25.301435470581055, "global_step": 257900, "epoch": 3107} {"train_loss": -24.860885620117188, "global_step": 257901, "epoch": 3107} {"train_loss": -25.26447868347168, "global_step": 257902, "epoch": 3107} {"train_loss": -25.246484756469727, "global_step": 257903, "epoch": 3107} {"train_loss": -24.99677848815918, "global_step": 257904, "epoch": 3107} {"train_loss": -25.30400848388672, "global_step": 257905, "epoch": 3107} {"train_loss": -25.0815486907959, "global_step": 257906, "epoch": 3107} {"train_loss": -25.160648345947266, "global_step": 257907, "epoch": 3107} {"train_loss": -24.900182723999023, "global_step": 257908, "epoch": 3107} {"train_loss": -25.332645416259766, "global_step": 257909, "epoch": 3107} {"train_loss": -25.2641544342041, "global_step": 257910, "epoch": 3107} {"train_loss": -24.7806453704834, "global_step": 257911, "epoch": 3107} {"train_loss": -25.222963333129883, "global_step": 257912, "epoch": 3107} {"train_loss": -25.246335983276367, "global_step": 257913, "epoch": 3107} {"train_loss": -25.029233932495117, "global_step": 257914, "epoch": 3107} {"train_loss": -25.12261962890625, "global_step": 257915, "epoch": 3107} {"train_loss": -24.97789192199707, "global_step": 257916, "epoch": 3107} {"train_loss": -25.392133712768555, "global_step": 257917, "epoch": 3107} {"train_loss": -25.047250747680664, "global_step": 257918, "epoch": 3107} {"train_loss": -24.73894691467285, "global_step": 257919, "epoch": 3107} {"train_loss": -25.09787940979004, "global_step": 257920, "epoch": 3107} {"train_loss": -24.87972068786621, "global_step": 257921, "epoch": 3107} {"train_loss": -25.161455154418945, "global_step": 257922, "epoch": 3107} {"train_loss": -24.917774200439453, "global_step": 257923, "epoch": 3107} {"train_loss": -24.970474243164062, "global_step": 257924, "epoch": 3107} {"train_loss": -24.64084243774414, "global_step": 257925, "epoch": 3107} {"train_loss": -25.157020568847656, "global_step": 257926, "epoch": 3107} {"train_loss": -25.090368270874023, "global_step": 257927, "epoch": 3107} {"train_loss": -25.124975204467773, "global_step": 257928, "epoch": 3107} {"train_loss": -24.778257369995117, "global_step": 257929, "epoch": 3107} {"train_loss": -25.229406356811523, "global_step": 257930, "epoch": 3107} {"train_loss": -24.804121017456055, "global_step": 257931, "epoch": 3107} {"train_loss": -25.003854751586914, "global_step": 257932, "epoch": 3107} {"train_loss": -25.005386352539062, "global_step": 257933, "epoch": 3107} {"train_loss": -25.455419540405273, "global_step": 257934, "epoch": 3107} {"train_loss": -25.291704177856445, "global_step": 257935, "epoch": 3107} {"train_loss": -25.170650482177734, "global_step": 257936, "epoch": 3107} {"train_loss": -25.058359146118164, "global_step": 257937, "epoch": 3107} {"train_loss": -25.192106246948242, "global_step": 257938, "epoch": 3107} {"train_loss": -24.6044979095459, "global_step": 257939, "epoch": 3107} {"train_loss": -25.00029945373535, "global_step": 257940, "epoch": 3107} {"train_loss": -24.815105438232422, "global_step": 257941, "epoch": 3107} {"train_loss": -24.94692039489746, "global_step": 257942, "epoch": 3107} {"train_loss": -24.877195358276367, "global_step": 257943, "epoch": 3107} {"train_loss": -25.179670333862305, "global_step": 257944, "epoch": 3107} {"train_loss": -24.637319564819336, "global_step": 257945, "epoch": 3107} {"train_loss": -25.473478317260742, "global_step": 257946, "epoch": 3107} {"train_loss": -24.986982345581055, "global_step": 257947, "epoch": 3107} {"train_loss": -25.234907150268555, "global_step": 257948, "epoch": 3107} {"train_loss": -25.04017448425293, "global_step": 257949, "epoch": 3107} {"train_loss": -25.12933921813965, "global_step": 257950, "epoch": 3107} {"train_loss": -24.695158004760742, "global_step": 257951, "epoch": 3107} {"train_loss": -25.148475646972656, "global_step": 257952, "epoch": 3107} {"train_loss": -25.396760940551758, "global_step": 257953, "epoch": 3107} {"train_loss": -25.02024269104004, "global_step": 257954, "epoch": 3107} {"train_loss": -25.23390769958496, "global_step": 257955, "epoch": 3107} {"train_loss": -25.255874633789062, "global_step": 257956, "epoch": 3107} {"train_loss": -24.97610855102539, "global_step": 257957, "epoch": 3107} {"train_loss": -25.151803970336914, "global_step": 257958, "epoch": 3107} {"train_loss": -25.301376342773438, "global_step": 257959, "epoch": 3107} {"train_loss": -24.928882598876953, "global_step": 257960, "epoch": 3107} {"train_loss": -25.289304733276367, "global_step": 257961, "epoch": 3107} {"train_loss": -25.083757400512695, "global_step": 257962, "epoch": 3107} {"train_loss": -25.06973199959261, "global_step": 257963, "epoch": 3107, "val_loss": 6883070.0} {"train_loss": -24.73750877380371, "global_step": 257964, "epoch": 3108} {"train_loss": -24.502370834350586, "global_step": 257965, "epoch": 3108} {"train_loss": -24.050485610961914, "global_step": 257966, "epoch": 3108} {"train_loss": -24.60371971130371, "global_step": 257967, "epoch": 3108} {"train_loss": -25.187393188476562, "global_step": 257968, "epoch": 3108} {"train_loss": -24.348661422729492, "global_step": 257969, "epoch": 3108} {"train_loss": -24.62015151977539, "global_step": 257970, "epoch": 3108} {"train_loss": -24.756107330322266, "global_step": 257971, "epoch": 3108} {"train_loss": -24.883588790893555, "global_step": 257972, "epoch": 3108} {"train_loss": -24.942304611206055, "global_step": 257973, "epoch": 3108} {"train_loss": -25.164426803588867, "global_step": 257974, "epoch": 3108} {"train_loss": -25.16966438293457, "global_step": 257975, "epoch": 3108} {"train_loss": -25.130741119384766, "global_step": 257976, "epoch": 3108} {"train_loss": -25.20442008972168, "global_step": 257977, "epoch": 3108} {"train_loss": -25.053579330444336, "global_step": 257978, "epoch": 3108} {"train_loss": -25.18499183654785, "global_step": 257979, "epoch": 3108} {"train_loss": -25.07048988342285, "global_step": 257980, "epoch": 3108} {"train_loss": -24.999975204467773, "global_step": 257981, "epoch": 3108} {"train_loss": -25.555891036987305, "global_step": 257982, "epoch": 3108} {"train_loss": -25.29539680480957, "global_step": 257983, "epoch": 3108} {"train_loss": -25.01718521118164, "global_step": 257984, "epoch": 3108} {"train_loss": -25.1097354888916, "global_step": 257985, "epoch": 3108} {"train_loss": -25.510589599609375, "global_step": 257986, "epoch": 3108} {"train_loss": -25.23551368713379, "global_step": 257987, "epoch": 3108} {"train_loss": -25.13875961303711, "global_step": 257988, "epoch": 3108} {"train_loss": -24.886491775512695, "global_step": 257989, "epoch": 3108} {"train_loss": -25.11118507385254, "global_step": 257990, "epoch": 3108} {"train_loss": -24.95448875427246, "global_step": 257991, "epoch": 3108} {"train_loss": -25.626407623291016, "global_step": 257992, "epoch": 3108} {"train_loss": -24.911544799804688, "global_step": 257993, "epoch": 3108} {"train_loss": -24.832897186279297, "global_step": 257994, "epoch": 3108} {"train_loss": -25.447818756103516, "global_step": 257995, "epoch": 3108} {"train_loss": -25.56743621826172, "global_step": 257996, "epoch": 3108} {"train_loss": -25.36679458618164, "global_step": 257997, "epoch": 3108} {"train_loss": -25.387760162353516, "global_step": 257998, "epoch": 3108} {"train_loss": -25.085142135620117, "global_step": 257999, "epoch": 3108} {"train_loss": -25.038700103759766, "global_step": 258000, "epoch": 3108} {"train_loss": -25.146224975585938, "global_step": 258001, "epoch": 3108} {"train_loss": -24.819766998291016, "global_step": 258002, "epoch": 3108} {"train_loss": -24.789648056030273, "global_step": 258003, "epoch": 3108} {"train_loss": -25.07087516784668, "global_step": 258004, "epoch": 3108} {"train_loss": -24.881649017333984, "global_step": 258005, "epoch": 3108} {"train_loss": -24.862695693969727, "global_step": 258006, "epoch": 3108} {"train_loss": -24.90787696838379, "global_step": 258007, "epoch": 3108} {"train_loss": -25.070219039916992, "global_step": 258008, "epoch": 3108} {"train_loss": -25.23658561706543, "global_step": 258009, "epoch": 3108} {"train_loss": -25.01806640625, "global_step": 258010, "epoch": 3108} {"train_loss": -25.088563919067383, "global_step": 258011, "epoch": 3108} {"train_loss": -24.689990997314453, "global_step": 258012, "epoch": 3108} {"train_loss": -24.933490753173828, "global_step": 258013, "epoch": 3108} {"train_loss": -24.892436981201172, "global_step": 258014, "epoch": 3108} {"train_loss": -25.212236404418945, "global_step": 258015, "epoch": 3108} {"train_loss": -25.08994483947754, "global_step": 258016, "epoch": 3108} {"train_loss": -25.644824981689453, "global_step": 258017, "epoch": 3108} {"train_loss": -24.902029037475586, "global_step": 258018, "epoch": 3108} {"train_loss": -25.075647354125977, "global_step": 258019, "epoch": 3108} {"train_loss": -25.295053482055664, "global_step": 258020, "epoch": 3108} {"train_loss": -25.166303634643555, "global_step": 258021, "epoch": 3108} {"train_loss": -25.26064109802246, "global_step": 258022, "epoch": 3108} {"train_loss": -25.31618309020996, "global_step": 258023, "epoch": 3108} {"train_loss": -25.06724739074707, "global_step": 258024, "epoch": 3108} {"train_loss": -25.191192626953125, "global_step": 258025, "epoch": 3108} {"train_loss": -25.58564567565918, "global_step": 258026, "epoch": 3108} {"train_loss": -25.248886108398438, "global_step": 258027, "epoch": 3108} {"train_loss": -25.4387264251709, "global_step": 258028, "epoch": 3108} {"train_loss": -25.223783493041992, "global_step": 258029, "epoch": 3108} {"train_loss": -25.184919357299805, "global_step": 258030, "epoch": 3108} {"train_loss": -24.974321365356445, "global_step": 258031, "epoch": 3108} {"train_loss": -25.145559310913086, "global_step": 258032, "epoch": 3108} {"train_loss": -25.016881942749023, "global_step": 258033, "epoch": 3108} {"train_loss": -25.071374893188477, "global_step": 258034, "epoch": 3108} {"train_loss": -25.249038696289062, "global_step": 258035, "epoch": 3108} {"train_loss": -25.172649383544922, "global_step": 258036, "epoch": 3108} {"train_loss": -25.316116333007812, "global_step": 258037, "epoch": 3108} {"train_loss": -25.087568283081055, "global_step": 258038, "epoch": 3108} {"train_loss": -24.86497688293457, "global_step": 258039, "epoch": 3108} {"train_loss": -24.976964950561523, "global_step": 258040, "epoch": 3108} {"train_loss": -25.254718780517578, "global_step": 258041, "epoch": 3108} {"train_loss": -25.278156280517578, "global_step": 258042, "epoch": 3108} {"train_loss": -25.189420700073242, "global_step": 258043, "epoch": 3108} {"train_loss": -24.90431785583496, "global_step": 258044, "epoch": 3108} {"train_loss": -24.980932235717773, "global_step": 258045, "epoch": 3108} {"train_loss": -25.08581271803523, "global_step": 258046, "epoch": 3108, "val_loss": 6815331.0} {"train_loss": -24.990869522094727, "global_step": 258047, "epoch": 3109} {"train_loss": -24.917173385620117, "global_step": 258048, "epoch": 3109} {"train_loss": -25.043752670288086, "global_step": 258049, "epoch": 3109} {"train_loss": -25.246326446533203, "global_step": 258050, "epoch": 3109} {"train_loss": -24.822416305541992, "global_step": 258051, "epoch": 3109} {"train_loss": -25.32528305053711, "global_step": 258052, "epoch": 3109} {"train_loss": -24.7329158782959, "global_step": 258053, "epoch": 3109} {"train_loss": -24.810964584350586, "global_step": 258054, "epoch": 3109} {"train_loss": -24.848648071289062, "global_step": 258055, "epoch": 3109} {"train_loss": -25.04740333557129, "global_step": 258056, "epoch": 3109} {"train_loss": -25.195566177368164, "global_step": 258057, "epoch": 3109} {"train_loss": -25.177030563354492, "global_step": 258058, "epoch": 3109} {"train_loss": -25.0393009185791, "global_step": 258059, "epoch": 3109} {"train_loss": -24.787221908569336, "global_step": 258060, "epoch": 3109} {"train_loss": -24.901975631713867, "global_step": 258061, "epoch": 3109} {"train_loss": -24.98097038269043, "global_step": 258062, "epoch": 3109} {"train_loss": -25.203760147094727, "global_step": 258063, "epoch": 3109} {"train_loss": -24.95415687561035, "global_step": 258064, "epoch": 3109} {"train_loss": -25.014556884765625, "global_step": 258065, "epoch": 3109} {"train_loss": -25.3489933013916, "global_step": 258066, "epoch": 3109} {"train_loss": -24.96559715270996, "global_step": 258067, "epoch": 3109} {"train_loss": -25.156787872314453, "global_step": 258068, "epoch": 3109} {"train_loss": -25.0241641998291, "global_step": 258069, "epoch": 3109} {"train_loss": -25.005632400512695, "global_step": 258070, "epoch": 3109} {"train_loss": -25.092470169067383, "global_step": 258071, "epoch": 3109} {"train_loss": -25.576574325561523, "global_step": 258072, "epoch": 3109} {"train_loss": -25.479068756103516, "global_step": 258073, "epoch": 3109} {"train_loss": -25.43754005432129, "global_step": 258074, "epoch": 3109} {"train_loss": -25.36857032775879, "global_step": 258075, "epoch": 3109} {"train_loss": -25.421131134033203, "global_step": 258076, "epoch": 3109} {"train_loss": -24.835891723632812, "global_step": 258077, "epoch": 3109} {"train_loss": -25.18345069885254, "global_step": 258078, "epoch": 3109} {"train_loss": -24.82991600036621, "global_step": 258079, "epoch": 3109} {"train_loss": -25.528615951538086, "global_step": 258080, "epoch": 3109} {"train_loss": -25.402685165405273, "global_step": 258081, "epoch": 3109} {"train_loss": -25.11094093322754, "global_step": 258082, "epoch": 3109} {"train_loss": -25.07722282409668, "global_step": 258083, "epoch": 3109} {"train_loss": -25.300514221191406, "global_step": 258084, "epoch": 3109} {"train_loss": -24.749006271362305, "global_step": 258085, "epoch": 3109} {"train_loss": -24.99061393737793, "global_step": 258086, "epoch": 3109} {"train_loss": -25.3392391204834, "global_step": 258087, "epoch": 3109} {"train_loss": -24.861642837524414, "global_step": 258088, "epoch": 3109} {"train_loss": -25.217924118041992, "global_step": 258089, "epoch": 3109} {"train_loss": -25.017763137817383, "global_step": 258090, "epoch": 3109} {"train_loss": -24.772857666015625, "global_step": 258091, "epoch": 3109} {"train_loss": -24.787734985351562, "global_step": 258092, "epoch": 3109} {"train_loss": -24.87799644470215, "global_step": 258093, "epoch": 3109} {"train_loss": -24.87775993347168, "global_step": 258094, "epoch": 3109} {"train_loss": -24.73396873474121, "global_step": 258095, "epoch": 3109} {"train_loss": -25.20108413696289, "global_step": 258096, "epoch": 3109} {"train_loss": -24.905986785888672, "global_step": 258097, "epoch": 3109} {"train_loss": -24.74370765686035, "global_step": 258098, "epoch": 3109} {"train_loss": -25.056833267211914, "global_step": 258099, "epoch": 3109} {"train_loss": -24.897541046142578, "global_step": 258100, "epoch": 3109} {"train_loss": -24.722206115722656, "global_step": 258101, "epoch": 3109} {"train_loss": -25.03763771057129, "global_step": 258102, "epoch": 3109} {"train_loss": -25.086332321166992, "global_step": 258103, "epoch": 3109} {"train_loss": -25.050783157348633, "global_step": 258104, "epoch": 3109} {"train_loss": -24.84565544128418, "global_step": 258105, "epoch": 3109} {"train_loss": -25.016672134399414, "global_step": 258106, "epoch": 3109} {"train_loss": -25.188982009887695, "global_step": 258107, "epoch": 3109} {"train_loss": -25.27179718017578, "global_step": 258108, "epoch": 3109} {"train_loss": -25.064620971679688, "global_step": 258109, "epoch": 3109} {"train_loss": -25.291765213012695, "global_step": 258110, "epoch": 3109} {"train_loss": -25.24947166442871, "global_step": 258111, "epoch": 3109} {"train_loss": -25.014375686645508, "global_step": 258112, "epoch": 3109} {"train_loss": -25.141050338745117, "global_step": 258113, "epoch": 3109} {"train_loss": -25.07944679260254, "global_step": 258114, "epoch": 3109} {"train_loss": -25.378992080688477, "global_step": 258115, "epoch": 3109} {"train_loss": -25.121906280517578, "global_step": 258116, "epoch": 3109} {"train_loss": -25.396291732788086, "global_step": 258117, "epoch": 3109} {"train_loss": -25.156919479370117, "global_step": 258118, "epoch": 3109} {"train_loss": -25.24896812438965, "global_step": 258119, "epoch": 3109} {"train_loss": -25.3155460357666, "global_step": 258120, "epoch": 3109} {"train_loss": -25.116073608398438, "global_step": 258121, "epoch": 3109} {"train_loss": -25.565427780151367, "global_step": 258122, "epoch": 3109} {"train_loss": -25.11049461364746, "global_step": 258123, "epoch": 3109} {"train_loss": -24.712976455688477, "global_step": 258124, "epoch": 3109} {"train_loss": -25.321107864379883, "global_step": 258125, "epoch": 3109} {"train_loss": -24.93410301208496, "global_step": 258126, "epoch": 3109} {"train_loss": -25.528566360473633, "global_step": 258127, "epoch": 3109} {"train_loss": -25.04334831237793, "global_step": 258128, "epoch": 3109} {"train_loss": -25.094468748713116, "global_step": 258129, "epoch": 3109, "val_loss": 6852154.0} {"train_loss": -23.90765953063965, "global_step": 258130, "epoch": 3110} {"train_loss": -23.200185775756836, "global_step": 258131, "epoch": 3110} {"train_loss": -23.42624282836914, "global_step": 258132, "epoch": 3110} {"train_loss": -24.588842391967773, "global_step": 258133, "epoch": 3110} {"train_loss": -23.57204246520996, "global_step": 258134, "epoch": 3110} {"train_loss": -24.137807846069336, "global_step": 258135, "epoch": 3110} {"train_loss": -23.932844161987305, "global_step": 258136, "epoch": 3110} {"train_loss": -24.113327026367188, "global_step": 258137, "epoch": 3110} {"train_loss": -24.458805084228516, "global_step": 258138, "epoch": 3110} {"train_loss": -24.637136459350586, "global_step": 258139, "epoch": 3110} {"train_loss": -24.406692504882812, "global_step": 258140, "epoch": 3110} {"train_loss": -24.14693832397461, "global_step": 258141, "epoch": 3110} {"train_loss": -24.59381675720215, "global_step": 258142, "epoch": 3110} {"train_loss": -24.32077980041504, "global_step": 258143, "epoch": 3110} {"train_loss": -24.617755889892578, "global_step": 258144, "epoch": 3110} {"train_loss": -24.930767059326172, "global_step": 258145, "epoch": 3110} {"train_loss": -24.163984298706055, "global_step": 258146, "epoch": 3110} {"train_loss": -24.879140853881836, "global_step": 258147, "epoch": 3110} {"train_loss": -24.96039390563965, "global_step": 258148, "epoch": 3110} {"train_loss": -24.855390548706055, "global_step": 258149, "epoch": 3110} {"train_loss": -25.032072067260742, "global_step": 258150, "epoch": 3110} {"train_loss": -24.671283721923828, "global_step": 258151, "epoch": 3110} {"train_loss": -25.235668182373047, "global_step": 258152, "epoch": 3110} {"train_loss": -24.7077579498291, "global_step": 258153, "epoch": 3110} {"train_loss": -25.07890510559082, "global_step": 258154, "epoch": 3110} {"train_loss": -24.668682098388672, "global_step": 258155, "epoch": 3110} {"train_loss": -24.793874740600586, "global_step": 258156, "epoch": 3110} {"train_loss": -24.99888801574707, "global_step": 258157, "epoch": 3110} {"train_loss": -24.86361312866211, "global_step": 258158, "epoch": 3110} {"train_loss": -25.068384170532227, "global_step": 258159, "epoch": 3110} {"train_loss": -25.158592224121094, "global_step": 258160, "epoch": 3110} {"train_loss": -24.977075576782227, "global_step": 258161, "epoch": 3110} {"train_loss": -25.6458797454834, "global_step": 258162, "epoch": 3110} {"train_loss": -25.039072036743164, "global_step": 258163, "epoch": 3110} {"train_loss": -25.143375396728516, "global_step": 258164, "epoch": 3110} {"train_loss": -24.87906837463379, "global_step": 258165, "epoch": 3110} {"train_loss": -25.124771118164062, "global_step": 258166, "epoch": 3110} {"train_loss": -25.34519386291504, "global_step": 258167, "epoch": 3110} {"train_loss": -25.293546676635742, "global_step": 258168, "epoch": 3110} {"train_loss": -25.15827751159668, "global_step": 258169, "epoch": 3110} {"train_loss": -25.30665397644043, "global_step": 258170, "epoch": 3110} {"train_loss": -24.950027465820312, "global_step": 258171, "epoch": 3110} {"train_loss": -25.17901611328125, "global_step": 258172, "epoch": 3110} {"train_loss": -25.204591751098633, "global_step": 258173, "epoch": 3110} {"train_loss": -25.109821319580078, "global_step": 258174, "epoch": 3110} {"train_loss": -25.239551544189453, "global_step": 258175, "epoch": 3110} {"train_loss": -25.087915420532227, "global_step": 258176, "epoch": 3110} {"train_loss": -25.20147132873535, "global_step": 258177, "epoch": 3110} {"train_loss": -25.57427406311035, "global_step": 258178, "epoch": 3110} {"train_loss": -25.001625061035156, "global_step": 258179, "epoch": 3110} {"train_loss": -25.40427589416504, "global_step": 258180, "epoch": 3110} {"train_loss": -25.11237907409668, "global_step": 258181, "epoch": 3110} {"train_loss": -25.22977638244629, "global_step": 258182, "epoch": 3110} {"train_loss": -25.142757415771484, "global_step": 258183, "epoch": 3110} {"train_loss": -25.32785987854004, "global_step": 258184, "epoch": 3110} {"train_loss": -25.605560302734375, "global_step": 258185, "epoch": 3110} {"train_loss": -25.189773559570312, "global_step": 258186, "epoch": 3110} {"train_loss": -25.406171798706055, "global_step": 258187, "epoch": 3110} {"train_loss": -25.269947052001953, "global_step": 258188, "epoch": 3110} {"train_loss": -25.109529495239258, "global_step": 258189, "epoch": 3110} {"train_loss": -25.350858688354492, "global_step": 258190, "epoch": 3110} {"train_loss": -25.097684860229492, "global_step": 258191, "epoch": 3110} {"train_loss": -25.51491355895996, "global_step": 258192, "epoch": 3110} {"train_loss": -25.2453670501709, "global_step": 258193, "epoch": 3110} {"train_loss": -25.36831283569336, "global_step": 258194, "epoch": 3110} {"train_loss": -24.9615478515625, "global_step": 258195, "epoch": 3110} {"train_loss": -24.994552612304688, "global_step": 258196, "epoch": 3110} {"train_loss": -24.36876106262207, "global_step": 258197, "epoch": 3110} {"train_loss": -24.706340789794922, "global_step": 258198, "epoch": 3110} {"train_loss": -24.76974868774414, "global_step": 258199, "epoch": 3110} {"train_loss": -25.09061050415039, "global_step": 258200, "epoch": 3110} {"train_loss": -25.16022491455078, "global_step": 258201, "epoch": 3110} {"train_loss": -25.343257904052734, "global_step": 258202, "epoch": 3110} {"train_loss": -24.364315032958984, "global_step": 258203, "epoch": 3110} {"train_loss": -24.797651290893555, "global_step": 258204, "epoch": 3110} {"train_loss": -25.55982208251953, "global_step": 258205, "epoch": 3110} {"train_loss": -24.755443572998047, "global_step": 258206, "epoch": 3110} {"train_loss": -24.965625762939453, "global_step": 258207, "epoch": 3110} {"train_loss": -24.65077781677246, "global_step": 258208, "epoch": 3110} {"train_loss": -24.762556076049805, "global_step": 258209, "epoch": 3110} {"train_loss": -25.191579818725586, "global_step": 258210, "epoch": 3110} {"train_loss": -24.78064727783203, "global_step": 258211, "epoch": 3110} {"train_loss": -24.911829845014825, "global_step": 258212, "epoch": 3110, "val_loss": 6926574.0} {"train_loss": -24.96534538269043, "global_step": 258213, "epoch": 3111} {"train_loss": -24.511638641357422, "global_step": 258214, "epoch": 3111} {"train_loss": -24.679582595825195, "global_step": 258215, "epoch": 3111} {"train_loss": -24.724348068237305, "global_step": 258216, "epoch": 3111} {"train_loss": -24.745391845703125, "global_step": 258217, "epoch": 3111} {"train_loss": -24.851642608642578, "global_step": 258218, "epoch": 3111} {"train_loss": -24.719928741455078, "global_step": 258219, "epoch": 3111} {"train_loss": -24.885501861572266, "global_step": 258220, "epoch": 3111} {"train_loss": -24.5213680267334, "global_step": 258221, "epoch": 3111} {"train_loss": -25.07136344909668, "global_step": 258222, "epoch": 3111} {"train_loss": -24.578393936157227, "global_step": 258223, "epoch": 3111} {"train_loss": -24.487850189208984, "global_step": 258224, "epoch": 3111} {"train_loss": -24.737812042236328, "global_step": 258225, "epoch": 3111} {"train_loss": -24.98322105407715, "global_step": 258226, "epoch": 3111} {"train_loss": -25.015869140625, "global_step": 258227, "epoch": 3111} {"train_loss": -24.853376388549805, "global_step": 258228, "epoch": 3111} {"train_loss": -25.046361923217773, "global_step": 258229, "epoch": 3111} {"train_loss": -24.816537857055664, "global_step": 258230, "epoch": 3111} {"train_loss": -25.052154541015625, "global_step": 258231, "epoch": 3111} {"train_loss": -25.125329971313477, "global_step": 258232, "epoch": 3111} {"train_loss": -24.97178077697754, "global_step": 258233, "epoch": 3111} {"train_loss": -25.018707275390625, "global_step": 258234, "epoch": 3111} {"train_loss": -25.043643951416016, "global_step": 258235, "epoch": 3111} {"train_loss": -25.110595703125, "global_step": 258236, "epoch": 3111} {"train_loss": -24.62034034729004, "global_step": 258237, "epoch": 3111} {"train_loss": -25.148319244384766, "global_step": 258238, "epoch": 3111} {"train_loss": -25.341354370117188, "global_step": 258239, "epoch": 3111} {"train_loss": -25.239486694335938, "global_step": 258240, "epoch": 3111} {"train_loss": -25.004331588745117, "global_step": 258241, "epoch": 3111} {"train_loss": -25.314558029174805, "global_step": 258242, "epoch": 3111} {"train_loss": -25.24384307861328, "global_step": 258243, "epoch": 3111} {"train_loss": -25.33902931213379, "global_step": 258244, "epoch": 3111} {"train_loss": -25.455842971801758, "global_step": 258245, "epoch": 3111} {"train_loss": -25.47027015686035, "global_step": 258246, "epoch": 3111} {"train_loss": -25.196012496948242, "global_step": 258247, "epoch": 3111} {"train_loss": -25.312633514404297, "global_step": 258248, "epoch": 3111} {"train_loss": -25.484113693237305, "global_step": 258249, "epoch": 3111} {"train_loss": -25.167816162109375, "global_step": 258250, "epoch": 3111} {"train_loss": -25.62113380432129, "global_step": 258251, "epoch": 3111} {"train_loss": -25.114953994750977, "global_step": 258252, "epoch": 3111} {"train_loss": -25.346298217773438, "global_step": 258253, "epoch": 3111} {"train_loss": -25.455976486206055, "global_step": 258254, "epoch": 3111} {"train_loss": -25.231822967529297, "global_step": 258255, "epoch": 3111} {"train_loss": -25.198518753051758, "global_step": 258256, "epoch": 3111} {"train_loss": -25.487468719482422, "global_step": 258257, "epoch": 3111} {"train_loss": -25.125513076782227, "global_step": 258258, "epoch": 3111} {"train_loss": -25.117691040039062, "global_step": 258259, "epoch": 3111} {"train_loss": -25.178081512451172, "global_step": 258260, "epoch": 3111} {"train_loss": -25.213769912719727, "global_step": 258261, "epoch": 3111} {"train_loss": -25.339282989501953, "global_step": 258262, "epoch": 3111} {"train_loss": -25.30068016052246, "global_step": 258263, "epoch": 3111} {"train_loss": -24.86934471130371, "global_step": 258264, "epoch": 3111} {"train_loss": -25.24619483947754, "global_step": 258265, "epoch": 3111} {"train_loss": -25.233013153076172, "global_step": 258266, "epoch": 3111} {"train_loss": -25.31972312927246, "global_step": 258267, "epoch": 3111} {"train_loss": -25.573240280151367, "global_step": 258268, "epoch": 3111} {"train_loss": -25.46653175354004, "global_step": 258269, "epoch": 3111} {"train_loss": -25.014333724975586, "global_step": 258270, "epoch": 3111} {"train_loss": -24.933380126953125, "global_step": 258271, "epoch": 3111} {"train_loss": -25.090415954589844, "global_step": 258272, "epoch": 3111} {"train_loss": -25.015731811523438, "global_step": 258273, "epoch": 3111} {"train_loss": -25.080949783325195, "global_step": 258274, "epoch": 3111} {"train_loss": -25.26578140258789, "global_step": 258275, "epoch": 3111} {"train_loss": -24.958059310913086, "global_step": 258276, "epoch": 3111} {"train_loss": -25.390182495117188, "global_step": 258277, "epoch": 3111} {"train_loss": -25.432523727416992, "global_step": 258278, "epoch": 3111} {"train_loss": -25.290420532226562, "global_step": 258279, "epoch": 3111} {"train_loss": -25.067428588867188, "global_step": 258280, "epoch": 3111} {"train_loss": -25.08167839050293, "global_step": 258281, "epoch": 3111} {"train_loss": -25.419452667236328, "global_step": 258282, "epoch": 3111} {"train_loss": -25.30307960510254, "global_step": 258283, "epoch": 3111} {"train_loss": -25.445287704467773, "global_step": 258284, "epoch": 3111} {"train_loss": -25.259592056274414, "global_step": 258285, "epoch": 3111} {"train_loss": -24.992456436157227, "global_step": 258286, "epoch": 3111} {"train_loss": -24.9834041595459, "global_step": 258287, "epoch": 3111} {"train_loss": -25.205995559692383, "global_step": 258288, "epoch": 3111} {"train_loss": -25.271041870117188, "global_step": 258289, "epoch": 3111} {"train_loss": -24.689786911010742, "global_step": 258290, "epoch": 3111} {"train_loss": -24.469541549682617, "global_step": 258291, "epoch": 3111} {"train_loss": -24.59859275817871, "global_step": 258292, "epoch": 3111} {"train_loss": -25.094303131103516, "global_step": 258293, "epoch": 3111} {"train_loss": -25.0557804107666, "global_step": 258294, "epoch": 3111} {"train_loss": -25.08514523793416, "global_step": 258295, "epoch": 3111, "val_loss": 6838504.0} {"train_loss": -25.03145408630371, "global_step": 258296, "epoch": 3112} {"train_loss": -24.401430130004883, "global_step": 258297, "epoch": 3112} {"train_loss": -24.662378311157227, "global_step": 258298, "epoch": 3112} {"train_loss": -24.543235778808594, "global_step": 258299, "epoch": 3112} {"train_loss": -24.343435287475586, "global_step": 258300, "epoch": 3112} {"train_loss": -24.47684669494629, "global_step": 258301, "epoch": 3112} {"train_loss": -24.874948501586914, "global_step": 258302, "epoch": 3112} {"train_loss": -24.326265335083008, "global_step": 258303, "epoch": 3112} {"train_loss": -24.9085636138916, "global_step": 258304, "epoch": 3112} {"train_loss": -24.28670310974121, "global_step": 258305, "epoch": 3112} {"train_loss": -24.6876220703125, "global_step": 258306, "epoch": 3112} {"train_loss": -24.82767677307129, "global_step": 258307, "epoch": 3112} {"train_loss": -24.570648193359375, "global_step": 258308, "epoch": 3112} {"train_loss": -24.72706413269043, "global_step": 258309, "epoch": 3112} {"train_loss": -24.90858268737793, "global_step": 258310, "epoch": 3112} {"train_loss": -24.84578514099121, "global_step": 258311, "epoch": 3112} {"train_loss": -25.06351661682129, "global_step": 258312, "epoch": 3112} {"train_loss": -24.616870880126953, "global_step": 258313, "epoch": 3112} {"train_loss": -24.952924728393555, "global_step": 258314, "epoch": 3112} {"train_loss": -24.9244384765625, "global_step": 258315, "epoch": 3112} {"train_loss": -24.507543563842773, "global_step": 258316, "epoch": 3112} {"train_loss": -25.300138473510742, "global_step": 258317, "epoch": 3112} {"train_loss": -25.120481491088867, "global_step": 258318, "epoch": 3112} {"train_loss": -25.039968490600586, "global_step": 258319, "epoch": 3112} {"train_loss": -24.791311264038086, "global_step": 258320, "epoch": 3112} {"train_loss": -24.730039596557617, "global_step": 258321, "epoch": 3112} {"train_loss": -24.65154457092285, "global_step": 258322, "epoch": 3112} {"train_loss": -25.064603805541992, "global_step": 258323, "epoch": 3112} {"train_loss": -24.89021873474121, "global_step": 258324, "epoch": 3112} {"train_loss": -25.135175704956055, "global_step": 258325, "epoch": 3112} {"train_loss": -25.400135040283203, "global_step": 258326, "epoch": 3112} {"train_loss": -25.099689483642578, "global_step": 258327, "epoch": 3112} {"train_loss": -24.863378524780273, "global_step": 258328, "epoch": 3112} {"train_loss": -25.276662826538086, "global_step": 258329, "epoch": 3112} {"train_loss": -25.29401206970215, "global_step": 258330, "epoch": 3112} {"train_loss": -24.79585838317871, "global_step": 258331, "epoch": 3112} {"train_loss": -25.207807540893555, "global_step": 258332, "epoch": 3112} {"train_loss": -24.66463279724121, "global_step": 258333, "epoch": 3112} {"train_loss": -25.235660552978516, "global_step": 258334, "epoch": 3112} {"train_loss": -25.196090698242188, "global_step": 258335, "epoch": 3112} {"train_loss": -25.125425338745117, "global_step": 258336, "epoch": 3112} {"train_loss": -24.88101577758789, "global_step": 258337, "epoch": 3112} {"train_loss": -25.347103118896484, "global_step": 258338, "epoch": 3112} {"train_loss": -24.661396026611328, "global_step": 258339, "epoch": 3112} {"train_loss": -25.252460479736328, "global_step": 258340, "epoch": 3112} {"train_loss": -24.853178024291992, "global_step": 258341, "epoch": 3112} {"train_loss": -25.241994857788086, "global_step": 258342, "epoch": 3112} {"train_loss": -24.978260040283203, "global_step": 258343, "epoch": 3112} {"train_loss": -24.809093475341797, "global_step": 258344, "epoch": 3112} {"train_loss": -25.304121017456055, "global_step": 258345, "epoch": 3112} {"train_loss": -24.87911033630371, "global_step": 258346, "epoch": 3112} {"train_loss": -24.727649688720703, "global_step": 258347, "epoch": 3112} {"train_loss": -25.095251083374023, "global_step": 258348, "epoch": 3112} {"train_loss": -24.9431095123291, "global_step": 258349, "epoch": 3112} {"train_loss": -25.190319061279297, "global_step": 258350, "epoch": 3112} {"train_loss": -25.11472511291504, "global_step": 258351, "epoch": 3112} {"train_loss": -25.237401962280273, "global_step": 258352, "epoch": 3112} {"train_loss": -24.85495948791504, "global_step": 258353, "epoch": 3112} {"train_loss": -24.997190475463867, "global_step": 258354, "epoch": 3112} {"train_loss": -25.155553817749023, "global_step": 258355, "epoch": 3112} {"train_loss": -25.274877548217773, "global_step": 258356, "epoch": 3112} {"train_loss": -25.30455207824707, "global_step": 258357, "epoch": 3112} {"train_loss": -24.912378311157227, "global_step": 258358, "epoch": 3112} {"train_loss": -25.167003631591797, "global_step": 258359, "epoch": 3112} {"train_loss": -25.617456436157227, "global_step": 258360, "epoch": 3112} {"train_loss": -25.240962982177734, "global_step": 258361, "epoch": 3112} {"train_loss": -24.916147232055664, "global_step": 258362, "epoch": 3112} {"train_loss": -25.009458541870117, "global_step": 258363, "epoch": 3112} {"train_loss": -25.472280502319336, "global_step": 258364, "epoch": 3112} {"train_loss": -25.335418701171875, "global_step": 258365, "epoch": 3112} {"train_loss": -24.905134201049805, "global_step": 258366, "epoch": 3112} {"train_loss": -25.039630889892578, "global_step": 258367, "epoch": 3112} {"train_loss": -25.230382919311523, "global_step": 258368, "epoch": 3112} {"train_loss": -25.609296798706055, "global_step": 258369, "epoch": 3112} {"train_loss": -25.19917106628418, "global_step": 258370, "epoch": 3112} {"train_loss": -25.376840591430664, "global_step": 258371, "epoch": 3112} {"train_loss": -25.39520263671875, "global_step": 258372, "epoch": 3112} {"train_loss": -25.329374313354492, "global_step": 258373, "epoch": 3112} {"train_loss": -25.419963836669922, "global_step": 258374, "epoch": 3112} {"train_loss": -25.142858505249023, "global_step": 258375, "epoch": 3112} {"train_loss": -25.139686584472656, "global_step": 258376, "epoch": 3112} {"train_loss": -25.14564323425293, "global_step": 258377, "epoch": 3112} {"train_loss": -25.003336205539934, "global_step": 258378, "epoch": 3112, "val_loss": 6824832.5} {"train_loss": -24.73024559020996, "global_step": 258379, "epoch": 3113} {"train_loss": -24.72309112548828, "global_step": 258380, "epoch": 3113} {"train_loss": -25.124059677124023, "global_step": 258381, "epoch": 3113} {"train_loss": -24.898151397705078, "global_step": 258382, "epoch": 3113} {"train_loss": -24.452367782592773, "global_step": 258383, "epoch": 3113} {"train_loss": -24.89398765563965, "global_step": 258384, "epoch": 3113} {"train_loss": -24.715036392211914, "global_step": 258385, "epoch": 3113} {"train_loss": -24.89855194091797, "global_step": 258386, "epoch": 3113} {"train_loss": -25.115163803100586, "global_step": 258387, "epoch": 3113} {"train_loss": -24.476919174194336, "global_step": 258388, "epoch": 3113} {"train_loss": -24.877578735351562, "global_step": 258389, "epoch": 3113} {"train_loss": -24.747129440307617, "global_step": 258390, "epoch": 3113} {"train_loss": -24.742422103881836, "global_step": 258391, "epoch": 3113} {"train_loss": -24.944929122924805, "global_step": 258392, "epoch": 3113} {"train_loss": -24.729373931884766, "global_step": 258393, "epoch": 3113} {"train_loss": -24.64293098449707, "global_step": 258394, "epoch": 3113} {"train_loss": -24.9859619140625, "global_step": 258395, "epoch": 3113} {"train_loss": -24.77939796447754, "global_step": 258396, "epoch": 3113} {"train_loss": -24.97963523864746, "global_step": 258397, "epoch": 3113} {"train_loss": -25.086843490600586, "global_step": 258398, "epoch": 3113} {"train_loss": -25.062877655029297, "global_step": 258399, "epoch": 3113} {"train_loss": -25.070480346679688, "global_step": 258400, "epoch": 3113} {"train_loss": -24.935216903686523, "global_step": 258401, "epoch": 3113} {"train_loss": -24.89716148376465, "global_step": 258402, "epoch": 3113} {"train_loss": -25.184690475463867, "global_step": 258403, "epoch": 3113} {"train_loss": -25.086109161376953, "global_step": 258404, "epoch": 3113} {"train_loss": -25.37717628479004, "global_step": 258405, "epoch": 3113} {"train_loss": -25.006149291992188, "global_step": 258406, "epoch": 3113} {"train_loss": -24.98775291442871, "global_step": 258407, "epoch": 3113} {"train_loss": -24.94795799255371, "global_step": 258408, "epoch": 3113} {"train_loss": -25.01067543029785, "global_step": 258409, "epoch": 3113} {"train_loss": -24.94623374938965, "global_step": 258410, "epoch": 3113} {"train_loss": -25.32517433166504, "global_step": 258411, "epoch": 3113} {"train_loss": -25.13100242614746, "global_step": 258412, "epoch": 3113} {"train_loss": -24.946786880493164, "global_step": 258413, "epoch": 3113} {"train_loss": -25.160709381103516, "global_step": 258414, "epoch": 3113} {"train_loss": -25.122638702392578, "global_step": 258415, "epoch": 3113} {"train_loss": -25.287107467651367, "global_step": 258416, "epoch": 3113} {"train_loss": -24.97734832763672, "global_step": 258417, "epoch": 3113} {"train_loss": -25.35744285583496, "global_step": 258418, "epoch": 3113} {"train_loss": -25.1837215423584, "global_step": 258419, "epoch": 3113} {"train_loss": -25.6899356842041, "global_step": 258420, "epoch": 3113} {"train_loss": -25.14381980895996, "global_step": 258421, "epoch": 3113} {"train_loss": -25.06870460510254, "global_step": 258422, "epoch": 3113} {"train_loss": -25.0683650970459, "global_step": 258423, "epoch": 3113} {"train_loss": -25.361671447753906, "global_step": 258424, "epoch": 3113} {"train_loss": -25.042463302612305, "global_step": 258425, "epoch": 3113} {"train_loss": -25.612340927124023, "global_step": 258426, "epoch": 3113} {"train_loss": -25.116357803344727, "global_step": 258427, "epoch": 3113} {"train_loss": -25.673877716064453, "global_step": 258428, "epoch": 3113} {"train_loss": -25.18364143371582, "global_step": 258429, "epoch": 3113} {"train_loss": -24.532180786132812, "global_step": 258430, "epoch": 3113} {"train_loss": -24.95216178894043, "global_step": 258431, "epoch": 3113} {"train_loss": -25.459915161132812, "global_step": 258432, "epoch": 3113} {"train_loss": -25.142797470092773, "global_step": 258433, "epoch": 3113} {"train_loss": -25.01059341430664, "global_step": 258434, "epoch": 3113} {"train_loss": -25.014280319213867, "global_step": 258435, "epoch": 3113} {"train_loss": -24.909534454345703, "global_step": 258436, "epoch": 3113} {"train_loss": -24.189138412475586, "global_step": 258437, "epoch": 3113} {"train_loss": -24.785009384155273, "global_step": 258438, "epoch": 3113} {"train_loss": -24.808286666870117, "global_step": 258439, "epoch": 3113} {"train_loss": -24.831544876098633, "global_step": 258440, "epoch": 3113} {"train_loss": -24.927759170532227, "global_step": 258441, "epoch": 3113} {"train_loss": -25.429197311401367, "global_step": 258442, "epoch": 3113} {"train_loss": -24.63081169128418, "global_step": 258443, "epoch": 3113} {"train_loss": -24.848459243774414, "global_step": 258444, "epoch": 3113} {"train_loss": -25.099536895751953, "global_step": 258445, "epoch": 3113} {"train_loss": -24.89980125427246, "global_step": 258446, "epoch": 3113} {"train_loss": -24.887012481689453, "global_step": 258447, "epoch": 3113} {"train_loss": -25.038183212280273, "global_step": 258448, "epoch": 3113} {"train_loss": -25.057937622070312, "global_step": 258449, "epoch": 3113} {"train_loss": -25.066028594970703, "global_step": 258450, "epoch": 3113} {"train_loss": -25.130834579467773, "global_step": 258451, "epoch": 3113} {"train_loss": -24.976125717163086, "global_step": 258452, "epoch": 3113} {"train_loss": -24.8872013092041, "global_step": 258453, "epoch": 3113} {"train_loss": -24.876981735229492, "global_step": 258454, "epoch": 3113} {"train_loss": -24.77768898010254, "global_step": 258455, "epoch": 3113} {"train_loss": -25.07396697998047, "global_step": 258456, "epoch": 3113} {"train_loss": -25.05868911743164, "global_step": 258457, "epoch": 3113} {"train_loss": -25.2531795501709, "global_step": 258458, "epoch": 3113} {"train_loss": -25.093046188354492, "global_step": 258459, "epoch": 3113} {"train_loss": -24.593555450439453, "global_step": 258460, "epoch": 3113} {"train_loss": -25.017353103821534, "global_step": 258461, "epoch": 3113, "val_loss": 6864417.0} {"train_loss": -24.822660446166992, "global_step": 258462, "epoch": 3114} {"train_loss": -24.98109245300293, "global_step": 258463, "epoch": 3114} {"train_loss": -24.510311126708984, "global_step": 258464, "epoch": 3114} {"train_loss": -25.014394760131836, "global_step": 258465, "epoch": 3114} {"train_loss": -24.778640747070312, "global_step": 258466, "epoch": 3114} {"train_loss": -24.59623146057129, "global_step": 258467, "epoch": 3114} {"train_loss": -24.93952751159668, "global_step": 258468, "epoch": 3114} {"train_loss": -24.984434127807617, "global_step": 258469, "epoch": 3114} {"train_loss": -24.9932804107666, "global_step": 258470, "epoch": 3114} {"train_loss": -24.911060333251953, "global_step": 258471, "epoch": 3114} {"train_loss": -25.051618576049805, "global_step": 258472, "epoch": 3114} {"train_loss": -25.081361770629883, "global_step": 258473, "epoch": 3114} {"train_loss": -25.1494140625, "global_step": 258474, "epoch": 3114} {"train_loss": -24.887094497680664, "global_step": 258475, "epoch": 3114} {"train_loss": -24.849964141845703, "global_step": 258476, "epoch": 3114} {"train_loss": -24.98679542541504, "global_step": 258477, "epoch": 3114} {"train_loss": -25.0970401763916, "global_step": 258478, "epoch": 3114} {"train_loss": -25.06096839904785, "global_step": 258479, "epoch": 3114} {"train_loss": -24.89254379272461, "global_step": 258480, "epoch": 3114} {"train_loss": -24.81903648376465, "global_step": 258481, "epoch": 3114} {"train_loss": -25.180953979492188, "global_step": 258482, "epoch": 3114} {"train_loss": -24.9822940826416, "global_step": 258483, "epoch": 3114} {"train_loss": -25.215023040771484, "global_step": 258484, "epoch": 3114} {"train_loss": -25.32477378845215, "global_step": 258485, "epoch": 3114} {"train_loss": -25.2391414642334, "global_step": 258486, "epoch": 3114} {"train_loss": -25.3605899810791, "global_step": 258487, "epoch": 3114} {"train_loss": -25.49982261657715, "global_step": 258488, "epoch": 3114} {"train_loss": -25.33856201171875, "global_step": 258489, "epoch": 3114} {"train_loss": -25.120908737182617, "global_step": 258490, "epoch": 3114} {"train_loss": -25.28169059753418, "global_step": 258491, "epoch": 3114} {"train_loss": -25.224620819091797, "global_step": 258492, "epoch": 3114} {"train_loss": -25.1160945892334, "global_step": 258493, "epoch": 3114} {"train_loss": -25.271894454956055, "global_step": 258494, "epoch": 3114} {"train_loss": -25.28351402282715, "global_step": 258495, "epoch": 3114} {"train_loss": -25.611007690429688, "global_step": 258496, "epoch": 3114} {"train_loss": -25.236957550048828, "global_step": 258497, "epoch": 3114} {"train_loss": -25.27499771118164, "global_step": 258498, "epoch": 3114} {"train_loss": -25.11359214782715, "global_step": 258499, "epoch": 3114} {"train_loss": -25.169525146484375, "global_step": 258500, "epoch": 3114} {"train_loss": -25.390554428100586, "global_step": 258501, "epoch": 3114} {"train_loss": -25.229049682617188, "global_step": 258502, "epoch": 3114} {"train_loss": -25.401350021362305, "global_step": 258503, "epoch": 3114} {"train_loss": -25.261430740356445, "global_step": 258504, "epoch": 3114} {"train_loss": -25.465871810913086, "global_step": 258505, "epoch": 3114} {"train_loss": -24.784765243530273, "global_step": 258506, "epoch": 3114} {"train_loss": -24.989355087280273, "global_step": 258507, "epoch": 3114} {"train_loss": -24.924427032470703, "global_step": 258508, "epoch": 3114} {"train_loss": -25.216175079345703, "global_step": 258509, "epoch": 3114} {"train_loss": -25.032052993774414, "global_step": 258510, "epoch": 3114} {"train_loss": -24.93913459777832, "global_step": 258511, "epoch": 3114} {"train_loss": -25.107698440551758, "global_step": 258512, "epoch": 3114} {"train_loss": -25.536760330200195, "global_step": 258513, "epoch": 3114} {"train_loss": -24.686925888061523, "global_step": 258514, "epoch": 3114} {"train_loss": -24.878089904785156, "global_step": 258515, "epoch": 3114} {"train_loss": -25.117647171020508, "global_step": 258516, "epoch": 3114} {"train_loss": -24.79551887512207, "global_step": 258517, "epoch": 3114} {"train_loss": -24.81934928894043, "global_step": 258518, "epoch": 3114} {"train_loss": -25.196622848510742, "global_step": 258519, "epoch": 3114} {"train_loss": -24.89813232421875, "global_step": 258520, "epoch": 3114} {"train_loss": -25.044248580932617, "global_step": 258521, "epoch": 3114} {"train_loss": -24.70245933532715, "global_step": 258522, "epoch": 3114} {"train_loss": -25.571765899658203, "global_step": 258523, "epoch": 3114} {"train_loss": -25.074857711791992, "global_step": 258524, "epoch": 3114} {"train_loss": -25.29525375366211, "global_step": 258525, "epoch": 3114} {"train_loss": -25.099355697631836, "global_step": 258526, "epoch": 3114} {"train_loss": -25.23349380493164, "global_step": 258527, "epoch": 3114} {"train_loss": -25.395490646362305, "global_step": 258528, "epoch": 3114} {"train_loss": -25.069501876831055, "global_step": 258529, "epoch": 3114} {"train_loss": -25.55503273010254, "global_step": 258530, "epoch": 3114} {"train_loss": -24.913848876953125, "global_step": 258531, "epoch": 3114} {"train_loss": -25.304943084716797, "global_step": 258532, "epoch": 3114} {"train_loss": -25.599369049072266, "global_step": 258533, "epoch": 3114} {"train_loss": -25.02056884765625, "global_step": 258534, "epoch": 3114} {"train_loss": -25.19013786315918, "global_step": 258535, "epoch": 3114} {"train_loss": -24.74795913696289, "global_step": 258536, "epoch": 3114} {"train_loss": -25.083938598632812, "global_step": 258537, "epoch": 3114} {"train_loss": -25.011615753173828, "global_step": 258538, "epoch": 3114} {"train_loss": -24.7238712310791, "global_step": 258539, "epoch": 3114} {"train_loss": -25.008420944213867, "global_step": 258540, "epoch": 3114} {"train_loss": -25.265186309814453, "global_step": 258541, "epoch": 3114} {"train_loss": -25.04316520690918, "global_step": 258542, "epoch": 3114} {"train_loss": -25.0044002532959, "global_step": 258543, "epoch": 3114} {"train_loss": -25.1086563432073, "global_step": 258544, "epoch": 3114, "val_loss": 6831557.0} {"train_loss": -24.864988327026367, "global_step": 258545, "epoch": 3115} {"train_loss": -24.649627685546875, "global_step": 258546, "epoch": 3115} {"train_loss": -24.862171173095703, "global_step": 258547, "epoch": 3115} {"train_loss": -24.476791381835938, "global_step": 258548, "epoch": 3115} {"train_loss": -25.108911514282227, "global_step": 258549, "epoch": 3115} {"train_loss": -24.51544761657715, "global_step": 258550, "epoch": 3115} {"train_loss": -25.131366729736328, "global_step": 258551, "epoch": 3115} {"train_loss": -24.96357536315918, "global_step": 258552, "epoch": 3115} {"train_loss": -24.69053077697754, "global_step": 258553, "epoch": 3115} {"train_loss": -24.649213790893555, "global_step": 258554, "epoch": 3115} {"train_loss": -25.149023056030273, "global_step": 258555, "epoch": 3115} {"train_loss": -24.99160385131836, "global_step": 258556, "epoch": 3115} {"train_loss": -25.194660186767578, "global_step": 258557, "epoch": 3115} {"train_loss": -25.17544937133789, "global_step": 258558, "epoch": 3115} {"train_loss": -24.88300895690918, "global_step": 258559, "epoch": 3115} {"train_loss": -24.977445602416992, "global_step": 258560, "epoch": 3115} {"train_loss": -25.254194259643555, "global_step": 258561, "epoch": 3115} {"train_loss": -25.13532066345215, "global_step": 258562, "epoch": 3115} {"train_loss": -25.127134323120117, "global_step": 258563, "epoch": 3115} {"train_loss": -24.964557647705078, "global_step": 258564, "epoch": 3115} {"train_loss": -25.097951889038086, "global_step": 258565, "epoch": 3115} {"train_loss": -25.237659454345703, "global_step": 258566, "epoch": 3115} {"train_loss": -24.862228393554688, "global_step": 258567, "epoch": 3115} {"train_loss": -25.047637939453125, "global_step": 258568, "epoch": 3115} {"train_loss": -24.932992935180664, "global_step": 258569, "epoch": 3115} {"train_loss": -24.66170883178711, "global_step": 258570, "epoch": 3115} {"train_loss": -25.03687858581543, "global_step": 258571, "epoch": 3115} {"train_loss": -25.060333251953125, "global_step": 258572, "epoch": 3115} {"train_loss": -25.14078140258789, "global_step": 258573, "epoch": 3115} {"train_loss": -25.389801025390625, "global_step": 258574, "epoch": 3115} {"train_loss": -25.104150772094727, "global_step": 258575, "epoch": 3115} {"train_loss": -25.339521408081055, "global_step": 258576, "epoch": 3115} {"train_loss": -24.962263107299805, "global_step": 258577, "epoch": 3115} {"train_loss": -25.200578689575195, "global_step": 258578, "epoch": 3115} {"train_loss": -25.14239501953125, "global_step": 258579, "epoch": 3115} {"train_loss": -25.16313362121582, "global_step": 258580, "epoch": 3115} {"train_loss": -24.892770767211914, "global_step": 258581, "epoch": 3115} {"train_loss": -25.324806213378906, "global_step": 258582, "epoch": 3115} {"train_loss": -25.15305519104004, "global_step": 258583, "epoch": 3115} {"train_loss": -25.175302505493164, "global_step": 258584, "epoch": 3115} {"train_loss": -25.148345947265625, "global_step": 258585, "epoch": 3115} {"train_loss": -25.035938262939453, "global_step": 258586, "epoch": 3115} {"train_loss": -25.131290435791016, "global_step": 258587, "epoch": 3115} {"train_loss": -25.25260353088379, "global_step": 258588, "epoch": 3115} {"train_loss": -25.113941192626953, "global_step": 258589, "epoch": 3115} {"train_loss": -25.025482177734375, "global_step": 258590, "epoch": 3115} {"train_loss": -24.88515281677246, "global_step": 258591, "epoch": 3115} {"train_loss": -25.04432487487793, "global_step": 258592, "epoch": 3115} {"train_loss": -25.158803939819336, "global_step": 258593, "epoch": 3115} {"train_loss": -25.141788482666016, "global_step": 258594, "epoch": 3115} {"train_loss": -25.151662826538086, "global_step": 258595, "epoch": 3115} {"train_loss": -25.3887939453125, "global_step": 258596, "epoch": 3115} {"train_loss": -25.41029167175293, "global_step": 258597, "epoch": 3115} {"train_loss": -25.059246063232422, "global_step": 258598, "epoch": 3115} {"train_loss": -25.166006088256836, "global_step": 258599, "epoch": 3115} {"train_loss": -25.200559616088867, "global_step": 258600, "epoch": 3115} {"train_loss": -25.30303955078125, "global_step": 258601, "epoch": 3115} {"train_loss": -24.848840713500977, "global_step": 258602, "epoch": 3115} {"train_loss": -24.766468048095703, "global_step": 258603, "epoch": 3115} {"train_loss": -25.220388412475586, "global_step": 258604, "epoch": 3115} {"train_loss": -25.0369930267334, "global_step": 258605, "epoch": 3115} {"train_loss": -25.193496704101562, "global_step": 258606, "epoch": 3115} {"train_loss": -25.143186569213867, "global_step": 258607, "epoch": 3115} {"train_loss": -25.420211791992188, "global_step": 258608, "epoch": 3115} {"train_loss": -24.765464782714844, "global_step": 258609, "epoch": 3115} {"train_loss": -25.143823623657227, "global_step": 258610, "epoch": 3115} {"train_loss": -25.52686882019043, "global_step": 258611, "epoch": 3115} {"train_loss": -25.452985763549805, "global_step": 258612, "epoch": 3115} {"train_loss": -25.326452255249023, "global_step": 258613, "epoch": 3115} {"train_loss": -24.81222915649414, "global_step": 258614, "epoch": 3115} {"train_loss": -24.790668487548828, "global_step": 258615, "epoch": 3115} {"train_loss": -25.095914840698242, "global_step": 258616, "epoch": 3115} {"train_loss": -25.063037872314453, "global_step": 258617, "epoch": 3115} {"train_loss": -25.24335289001465, "global_step": 258618, "epoch": 3115} {"train_loss": -25.225290298461914, "global_step": 258619, "epoch": 3115} {"train_loss": -25.270761489868164, "global_step": 258620, "epoch": 3115} {"train_loss": -25.096603393554688, "global_step": 258621, "epoch": 3115} {"train_loss": -25.142383575439453, "global_step": 258622, "epoch": 3115} {"train_loss": -25.06549835205078, "global_step": 258623, "epoch": 3115} {"train_loss": -25.1090030670166, "global_step": 258624, "epoch": 3115} {"train_loss": -25.25275230407715, "global_step": 258625, "epoch": 3115} {"train_loss": -25.8505859375, "global_step": 258626, "epoch": 3115} {"train_loss": -25.07015003066465, "global_step": 258627, "epoch": 3115, "val_loss": 6874298.0} {"train_loss": -24.895490646362305, "global_step": 258628, "epoch": 3116} {"train_loss": -24.66289710998535, "global_step": 258629, "epoch": 3116} {"train_loss": -24.85287857055664, "global_step": 258630, "epoch": 3116} {"train_loss": -24.403629302978516, "global_step": 258631, "epoch": 3116} {"train_loss": -24.755685806274414, "global_step": 258632, "epoch": 3116} {"train_loss": -24.996137619018555, "global_step": 258633, "epoch": 3116} {"train_loss": -24.934885025024414, "global_step": 258634, "epoch": 3116} {"train_loss": -24.75945281982422, "global_step": 258635, "epoch": 3116} {"train_loss": -24.62413215637207, "global_step": 258636, "epoch": 3116} {"train_loss": -25.086050033569336, "global_step": 258637, "epoch": 3116} {"train_loss": -25.130521774291992, "global_step": 258638, "epoch": 3116} {"train_loss": -24.88836669921875, "global_step": 258639, "epoch": 3116} {"train_loss": -24.740543365478516, "global_step": 258640, "epoch": 3116} {"train_loss": -24.750356674194336, "global_step": 258641, "epoch": 3116} {"train_loss": -25.156782150268555, "global_step": 258642, "epoch": 3116} {"train_loss": -25.095443725585938, "global_step": 258643, "epoch": 3116} {"train_loss": -25.27045249938965, "global_step": 258644, "epoch": 3116} {"train_loss": -24.89318084716797, "global_step": 258645, "epoch": 3116} {"train_loss": -25.163434982299805, "global_step": 258646, "epoch": 3116} {"train_loss": -25.21312141418457, "global_step": 258647, "epoch": 3116} {"train_loss": -25.00790786743164, "global_step": 258648, "epoch": 3116} {"train_loss": -25.18381118774414, "global_step": 258649, "epoch": 3116} {"train_loss": -25.2128849029541, "global_step": 258650, "epoch": 3116} {"train_loss": -25.135986328125, "global_step": 258651, "epoch": 3116} {"train_loss": -25.283124923706055, "global_step": 258652, "epoch": 3116} {"train_loss": -25.396543502807617, "global_step": 258653, "epoch": 3116} {"train_loss": -25.331113815307617, "global_step": 258654, "epoch": 3116} {"train_loss": -25.338838577270508, "global_step": 258655, "epoch": 3116} {"train_loss": -24.926328659057617, "global_step": 258656, "epoch": 3116} {"train_loss": -25.108678817749023, "global_step": 258657, "epoch": 3116} {"train_loss": -25.16461753845215, "global_step": 258658, "epoch": 3116} {"train_loss": -25.37701988220215, "global_step": 258659, "epoch": 3116} {"train_loss": -25.326889038085938, "global_step": 258660, "epoch": 3116} {"train_loss": -24.980981826782227, "global_step": 258661, "epoch": 3116} {"train_loss": -25.125137329101562, "global_step": 258662, "epoch": 3116} {"train_loss": -25.4075984954834, "global_step": 258663, "epoch": 3116} {"train_loss": -25.235422134399414, "global_step": 258664, "epoch": 3116} {"train_loss": -24.674230575561523, "global_step": 258665, "epoch": 3116} {"train_loss": -24.876842498779297, "global_step": 258666, "epoch": 3116} {"train_loss": -25.554426193237305, "global_step": 258667, "epoch": 3116} {"train_loss": -25.08359718322754, "global_step": 258668, "epoch": 3116} {"train_loss": -25.336231231689453, "global_step": 258669, "epoch": 3116} {"train_loss": -24.819272994995117, "global_step": 258670, "epoch": 3116} {"train_loss": -25.310657501220703, "global_step": 258671, "epoch": 3116} {"train_loss": -25.00057029724121, "global_step": 258672, "epoch": 3116} {"train_loss": -24.4800968170166, "global_step": 258673, "epoch": 3116} {"train_loss": -25.013654708862305, "global_step": 258674, "epoch": 3116} {"train_loss": -25.291006088256836, "global_step": 258675, "epoch": 3116} {"train_loss": -25.122692108154297, "global_step": 258676, "epoch": 3116} {"train_loss": -25.14196014404297, "global_step": 258677, "epoch": 3116} {"train_loss": -25.14534568786621, "global_step": 258678, "epoch": 3116} {"train_loss": -25.051197052001953, "global_step": 258679, "epoch": 3116} {"train_loss": -25.15909194946289, "global_step": 258680, "epoch": 3116} {"train_loss": -24.787940979003906, "global_step": 258681, "epoch": 3116} {"train_loss": -25.030969619750977, "global_step": 258682, "epoch": 3116} {"train_loss": -25.027984619140625, "global_step": 258683, "epoch": 3116} {"train_loss": -25.493114471435547, "global_step": 258684, "epoch": 3116} {"train_loss": -25.359479904174805, "global_step": 258685, "epoch": 3116} {"train_loss": -25.144485473632812, "global_step": 258686, "epoch": 3116} {"train_loss": -25.2169132232666, "global_step": 258687, "epoch": 3116} {"train_loss": -25.27381706237793, "global_step": 258688, "epoch": 3116} {"train_loss": -25.629653930664062, "global_step": 258689, "epoch": 3116} {"train_loss": -25.047748565673828, "global_step": 258690, "epoch": 3116} {"train_loss": -24.98880386352539, "global_step": 258691, "epoch": 3116} {"train_loss": -25.221506118774414, "global_step": 258692, "epoch": 3116} {"train_loss": -24.768234252929688, "global_step": 258693, "epoch": 3116} {"train_loss": -25.263214111328125, "global_step": 258694, "epoch": 3116} {"train_loss": -25.268430709838867, "global_step": 258695, "epoch": 3116} {"train_loss": -24.947904586791992, "global_step": 258696, "epoch": 3116} {"train_loss": -25.178647994995117, "global_step": 258697, "epoch": 3116} {"train_loss": -25.044506072998047, "global_step": 258698, "epoch": 3116} {"train_loss": -24.896169662475586, "global_step": 258699, "epoch": 3116} {"train_loss": -25.42559242248535, "global_step": 258700, "epoch": 3116} {"train_loss": -24.888425827026367, "global_step": 258701, "epoch": 3116} {"train_loss": -25.4399356842041, "global_step": 258702, "epoch": 3116} {"train_loss": -25.058975219726562, "global_step": 258703, "epoch": 3116} {"train_loss": -25.120624542236328, "global_step": 258704, "epoch": 3116} {"train_loss": -25.270009994506836, "global_step": 258705, "epoch": 3116} {"train_loss": -24.8903865814209, "global_step": 258706, "epoch": 3116} {"train_loss": -25.36288070678711, "global_step": 258707, "epoch": 3116} {"train_loss": -25.463844299316406, "global_step": 258708, "epoch": 3116} {"train_loss": -24.94721031188965, "global_step": 258709, "epoch": 3116} {"train_loss": -25.080439027533473, "global_step": 258710, "epoch": 3116, "val_loss": 6858125.0} {"train_loss": -24.67436408996582, "global_step": 258711, "epoch": 3117} {"train_loss": -24.666015625, "global_step": 258712, "epoch": 3117} {"train_loss": -24.702871322631836, "global_step": 258713, "epoch": 3117} {"train_loss": -24.64039421081543, "global_step": 258714, "epoch": 3117} {"train_loss": -24.460289001464844, "global_step": 258715, "epoch": 3117} {"train_loss": -24.516952514648438, "global_step": 258716, "epoch": 3117} {"train_loss": -24.527353286743164, "global_step": 258717, "epoch": 3117} {"train_loss": -24.997901916503906, "global_step": 258718, "epoch": 3117} {"train_loss": -24.15549087524414, "global_step": 258719, "epoch": 3117} {"train_loss": -24.6679630279541, "global_step": 258720, "epoch": 3117} {"train_loss": -24.806547164916992, "global_step": 258721, "epoch": 3117} {"train_loss": -24.7424373626709, "global_step": 258722, "epoch": 3117} {"train_loss": -24.777206420898438, "global_step": 258723, "epoch": 3117} {"train_loss": -24.63711929321289, "global_step": 258724, "epoch": 3117} {"train_loss": -25.072492599487305, "global_step": 258725, "epoch": 3117} {"train_loss": -24.869354248046875, "global_step": 258726, "epoch": 3117} {"train_loss": -24.65399932861328, "global_step": 258727, "epoch": 3117} {"train_loss": -24.93289566040039, "global_step": 258728, "epoch": 3117} {"train_loss": -24.666624069213867, "global_step": 258729, "epoch": 3117} {"train_loss": -25.104248046875, "global_step": 258730, "epoch": 3117} {"train_loss": -24.77192497253418, "global_step": 258731, "epoch": 3117} {"train_loss": -25.039844512939453, "global_step": 258732, "epoch": 3117} {"train_loss": -24.982099533081055, "global_step": 258733, "epoch": 3117} {"train_loss": -24.890365600585938, "global_step": 258734, "epoch": 3117} {"train_loss": -25.345895767211914, "global_step": 258735, "epoch": 3117} {"train_loss": -25.242399215698242, "global_step": 258736, "epoch": 3117} {"train_loss": -25.19275665283203, "global_step": 258737, "epoch": 3117} {"train_loss": -25.281221389770508, "global_step": 258738, "epoch": 3117} {"train_loss": -25.24821662902832, "global_step": 258739, "epoch": 3117} {"train_loss": -25.319149017333984, "global_step": 258740, "epoch": 3117} {"train_loss": -24.941282272338867, "global_step": 258741, "epoch": 3117} {"train_loss": -25.208372116088867, "global_step": 258742, "epoch": 3117} {"train_loss": -25.339757919311523, "global_step": 258743, "epoch": 3117} {"train_loss": -24.868640899658203, "global_step": 258744, "epoch": 3117} {"train_loss": -24.943525314331055, "global_step": 258745, "epoch": 3117} {"train_loss": -25.559829711914062, "global_step": 258746, "epoch": 3117} {"train_loss": -25.508398056030273, "global_step": 258747, "epoch": 3117} {"train_loss": -25.49472999572754, "global_step": 258748, "epoch": 3117} {"train_loss": -25.323347091674805, "global_step": 258749, "epoch": 3117} {"train_loss": -25.536523818969727, "global_step": 258750, "epoch": 3117} {"train_loss": -25.305011749267578, "global_step": 258751, "epoch": 3117} {"train_loss": -25.142757415771484, "global_step": 258752, "epoch": 3117} {"train_loss": -25.26641082763672, "global_step": 258753, "epoch": 3117} {"train_loss": -25.396020889282227, "global_step": 258754, "epoch": 3117} {"train_loss": -25.056509017944336, "global_step": 258755, "epoch": 3117} {"train_loss": -25.173044204711914, "global_step": 258756, "epoch": 3117} {"train_loss": -25.230976104736328, "global_step": 258757, "epoch": 3117} {"train_loss": -25.20491600036621, "global_step": 258758, "epoch": 3117} {"train_loss": -25.2224178314209, "global_step": 258759, "epoch": 3117} {"train_loss": -24.99239730834961, "global_step": 258760, "epoch": 3117} {"train_loss": -25.283851623535156, "global_step": 258761, "epoch": 3117} {"train_loss": -25.1517333984375, "global_step": 258762, "epoch": 3117} {"train_loss": -24.97340202331543, "global_step": 258763, "epoch": 3117} {"train_loss": -25.064058303833008, "global_step": 258764, "epoch": 3117} {"train_loss": -25.34037971496582, "global_step": 258765, "epoch": 3117} {"train_loss": -25.28875732421875, "global_step": 258766, "epoch": 3117} {"train_loss": -25.07731056213379, "global_step": 258767, "epoch": 3117} {"train_loss": -25.377084732055664, "global_step": 258768, "epoch": 3117} {"train_loss": -25.253156661987305, "global_step": 258769, "epoch": 3117} {"train_loss": -25.273059844970703, "global_step": 258770, "epoch": 3117} {"train_loss": -24.958940505981445, "global_step": 258771, "epoch": 3117} {"train_loss": -25.16979217529297, "global_step": 258772, "epoch": 3117} {"train_loss": -25.053558349609375, "global_step": 258773, "epoch": 3117} {"train_loss": -25.455190658569336, "global_step": 258774, "epoch": 3117} {"train_loss": -25.09417724609375, "global_step": 258775, "epoch": 3117} {"train_loss": -25.20235252380371, "global_step": 258776, "epoch": 3117} {"train_loss": -24.806304931640625, "global_step": 258777, "epoch": 3117} {"train_loss": -24.539730072021484, "global_step": 258778, "epoch": 3117} {"train_loss": -25.214155197143555, "global_step": 258779, "epoch": 3117} {"train_loss": -25.40696144104004, "global_step": 258780, "epoch": 3117} {"train_loss": -25.07858657836914, "global_step": 258781, "epoch": 3117} {"train_loss": -25.107465744018555, "global_step": 258782, "epoch": 3117} {"train_loss": -24.872791290283203, "global_step": 258783, "epoch": 3117} {"train_loss": -25.070297241210938, "global_step": 258784, "epoch": 3117} {"train_loss": -25.2012996673584, "global_step": 258785, "epoch": 3117} {"train_loss": -25.293174743652344, "global_step": 258786, "epoch": 3117} {"train_loss": -25.087087631225586, "global_step": 258787, "epoch": 3117} {"train_loss": -25.66901969909668, "global_step": 258788, "epoch": 3117} {"train_loss": -24.913305282592773, "global_step": 258789, "epoch": 3117} {"train_loss": -25.088804244995117, "global_step": 258790, "epoch": 3117} {"train_loss": -24.79221534729004, "global_step": 258791, "epoch": 3117} {"train_loss": -24.987375259399414, "global_step": 258792, "epoch": 3117} {"train_loss": -25.055358863738647, "global_step": 258793, "epoch": 3117, "val_loss": 6857640.0} {"train_loss": -24.684383392333984, "global_step": 258794, "epoch": 3118} {"train_loss": -24.74811363220215, "global_step": 258795, "epoch": 3118} {"train_loss": -24.997472763061523, "global_step": 258796, "epoch": 3118} {"train_loss": -24.48383903503418, "global_step": 258797, "epoch": 3118} {"train_loss": -24.01447296142578, "global_step": 258798, "epoch": 3118} {"train_loss": -24.188142776489258, "global_step": 258799, "epoch": 3118} {"train_loss": -24.52187728881836, "global_step": 258800, "epoch": 3118} {"train_loss": -24.707229614257812, "global_step": 258801, "epoch": 3118} {"train_loss": -24.778799057006836, "global_step": 258802, "epoch": 3118} {"train_loss": -24.56971549987793, "global_step": 258803, "epoch": 3118} {"train_loss": -24.588218688964844, "global_step": 258804, "epoch": 3118} {"train_loss": -24.7720890045166, "global_step": 258805, "epoch": 3118} {"train_loss": -25.00166130065918, "global_step": 258806, "epoch": 3118} {"train_loss": -24.651269912719727, "global_step": 258807, "epoch": 3118} {"train_loss": -24.708871841430664, "global_step": 258808, "epoch": 3118} {"train_loss": -24.778305053710938, "global_step": 258809, "epoch": 3118} {"train_loss": -24.827411651611328, "global_step": 258810, "epoch": 3118} {"train_loss": -24.774089813232422, "global_step": 258811, "epoch": 3118} {"train_loss": -25.208154678344727, "global_step": 258812, "epoch": 3118} {"train_loss": -24.585111618041992, "global_step": 258813, "epoch": 3118} {"train_loss": -25.05267333984375, "global_step": 258814, "epoch": 3118} {"train_loss": -24.998592376708984, "global_step": 258815, "epoch": 3118} {"train_loss": -25.409162521362305, "global_step": 258816, "epoch": 3118} {"train_loss": -24.993528366088867, "global_step": 258817, "epoch": 3118} {"train_loss": -24.9846248626709, "global_step": 258818, "epoch": 3118} {"train_loss": -24.98577308654785, "global_step": 258819, "epoch": 3118} {"train_loss": -24.98286247253418, "global_step": 258820, "epoch": 3118} {"train_loss": -24.769994735717773, "global_step": 258821, "epoch": 3118} {"train_loss": -25.034793853759766, "global_step": 258822, "epoch": 3118} {"train_loss": -25.43037223815918, "global_step": 258823, "epoch": 3118} {"train_loss": -25.417808532714844, "global_step": 258824, "epoch": 3118} {"train_loss": -25.093297958374023, "global_step": 258825, "epoch": 3118} {"train_loss": -24.954240798950195, "global_step": 258826, "epoch": 3118} {"train_loss": -25.353322982788086, "global_step": 258827, "epoch": 3118} {"train_loss": -25.210407257080078, "global_step": 258828, "epoch": 3118} {"train_loss": -25.16255760192871, "global_step": 258829, "epoch": 3118} {"train_loss": -24.896474838256836, "global_step": 258830, "epoch": 3118} {"train_loss": -25.402753829956055, "global_step": 258831, "epoch": 3118} {"train_loss": -25.292219161987305, "global_step": 258832, "epoch": 3118} {"train_loss": -24.938688278198242, "global_step": 258833, "epoch": 3118} {"train_loss": -25.010290145874023, "global_step": 258834, "epoch": 3118} {"train_loss": -25.159875869750977, "global_step": 258835, "epoch": 3118} {"train_loss": -24.9150390625, "global_step": 258836, "epoch": 3118} {"train_loss": -25.015010833740234, "global_step": 258837, "epoch": 3118} {"train_loss": -24.807390213012695, "global_step": 258838, "epoch": 3118} {"train_loss": -25.260833740234375, "global_step": 258839, "epoch": 3118} {"train_loss": -25.459455490112305, "global_step": 258840, "epoch": 3118} {"train_loss": -24.873273849487305, "global_step": 258841, "epoch": 3118} {"train_loss": -25.176786422729492, "global_step": 258842, "epoch": 3118} {"train_loss": -25.23365020751953, "global_step": 258843, "epoch": 3118} {"train_loss": -25.25177574157715, "global_step": 258844, "epoch": 3118} {"train_loss": -25.155187606811523, "global_step": 258845, "epoch": 3118} {"train_loss": -25.223909378051758, "global_step": 258846, "epoch": 3118} {"train_loss": -25.22723960876465, "global_step": 258847, "epoch": 3118} {"train_loss": -25.259540557861328, "global_step": 258848, "epoch": 3118} {"train_loss": -25.207168579101562, "global_step": 258849, "epoch": 3118} {"train_loss": -25.285924911499023, "global_step": 258850, "epoch": 3118} {"train_loss": -25.307397842407227, "global_step": 258851, "epoch": 3118} {"train_loss": -24.604337692260742, "global_step": 258852, "epoch": 3118} {"train_loss": -25.269115447998047, "global_step": 258853, "epoch": 3118} {"train_loss": -25.123762130737305, "global_step": 258854, "epoch": 3118} {"train_loss": -25.38531494140625, "global_step": 258855, "epoch": 3118} {"train_loss": -24.71430778503418, "global_step": 258856, "epoch": 3118} {"train_loss": -25.547666549682617, "global_step": 258857, "epoch": 3118} {"train_loss": -24.884872436523438, "global_step": 258858, "epoch": 3118} {"train_loss": -25.445402145385742, "global_step": 258859, "epoch": 3118} {"train_loss": -25.536026000976562, "global_step": 258860, "epoch": 3118} {"train_loss": -25.263242721557617, "global_step": 258861, "epoch": 3118} {"train_loss": -24.986791610717773, "global_step": 258862, "epoch": 3118} {"train_loss": -25.27149200439453, "global_step": 258863, "epoch": 3118} {"train_loss": -25.653705596923828, "global_step": 258864, "epoch": 3118} {"train_loss": -25.27773666381836, "global_step": 258865, "epoch": 3118} {"train_loss": -25.34898567199707, "global_step": 258866, "epoch": 3118} {"train_loss": -25.135969161987305, "global_step": 258867, "epoch": 3118} {"train_loss": -25.187891006469727, "global_step": 258868, "epoch": 3118} {"train_loss": -25.00470542907715, "global_step": 258869, "epoch": 3118} {"train_loss": -25.192655563354492, "global_step": 258870, "epoch": 3118} {"train_loss": -25.18605613708496, "global_step": 258871, "epoch": 3118} {"train_loss": -24.75804328918457, "global_step": 258872, "epoch": 3118} {"train_loss": -24.61656379699707, "global_step": 258873, "epoch": 3118} {"train_loss": -25.296987533569336, "global_step": 258874, "epoch": 3118} {"train_loss": -25.37411117553711, "global_step": 258875, "epoch": 3118} {"train_loss": -25.039685099957936, "global_step": 258876, "epoch": 3118, "val_loss": 6820474.0} {"train_loss": -24.815608978271484, "global_step": 258877, "epoch": 3119} {"train_loss": -24.87856674194336, "global_step": 258878, "epoch": 3119} {"train_loss": -24.78622817993164, "global_step": 258879, "epoch": 3119} {"train_loss": -24.990732192993164, "global_step": 258880, "epoch": 3119} {"train_loss": -25.10207176208496, "global_step": 258881, "epoch": 3119} {"train_loss": -25.26728630065918, "global_step": 258882, "epoch": 3119} {"train_loss": -25.23536491394043, "global_step": 258883, "epoch": 3119} {"train_loss": -24.925086975097656, "global_step": 258884, "epoch": 3119} {"train_loss": -25.342405319213867, "global_step": 258885, "epoch": 3119} {"train_loss": -25.461095809936523, "global_step": 258886, "epoch": 3119} {"train_loss": -25.137296676635742, "global_step": 258887, "epoch": 3119} {"train_loss": -25.052968978881836, "global_step": 258888, "epoch": 3119} {"train_loss": -25.081174850463867, "global_step": 258889, "epoch": 3119} {"train_loss": -25.14223289489746, "global_step": 258890, "epoch": 3119} {"train_loss": -24.72601318359375, "global_step": 258891, "epoch": 3119} {"train_loss": -25.3946533203125, "global_step": 258892, "epoch": 3119} {"train_loss": -25.1110782623291, "global_step": 258893, "epoch": 3119} {"train_loss": -25.101348876953125, "global_step": 258894, "epoch": 3119} {"train_loss": -25.06184959411621, "global_step": 258895, "epoch": 3119} {"train_loss": -25.1582088470459, "global_step": 258896, "epoch": 3119} {"train_loss": -25.11332893371582, "global_step": 258897, "epoch": 3119} {"train_loss": -25.141019821166992, "global_step": 258898, "epoch": 3119} {"train_loss": -25.465566635131836, "global_step": 258899, "epoch": 3119} {"train_loss": -25.282135009765625, "global_step": 258900, "epoch": 3119} {"train_loss": -24.893962860107422, "global_step": 258901, "epoch": 3119} {"train_loss": -25.09596061706543, "global_step": 258902, "epoch": 3119} {"train_loss": -24.906980514526367, "global_step": 258903, "epoch": 3119} {"train_loss": -24.97224235534668, "global_step": 258904, "epoch": 3119} {"train_loss": -25.16057777404785, "global_step": 258905, "epoch": 3119} {"train_loss": -25.162220001220703, "global_step": 258906, "epoch": 3119} {"train_loss": -25.397018432617188, "global_step": 258907, "epoch": 3119} {"train_loss": -25.103796005249023, "global_step": 258908, "epoch": 3119} {"train_loss": -25.057600021362305, "global_step": 258909, "epoch": 3119} {"train_loss": -25.277000427246094, "global_step": 258910, "epoch": 3119} {"train_loss": -25.152315139770508, "global_step": 258911, "epoch": 3119} {"train_loss": -25.315824508666992, "global_step": 258912, "epoch": 3119} {"train_loss": -25.047269821166992, "global_step": 258913, "epoch": 3119} {"train_loss": -25.241243362426758, "global_step": 258914, "epoch": 3119} {"train_loss": -25.93145751953125, "global_step": 258915, "epoch": 3119} {"train_loss": -24.750263214111328, "global_step": 258916, "epoch": 3119} {"train_loss": -25.037736892700195, "global_step": 258917, "epoch": 3119} {"train_loss": -25.020723342895508, "global_step": 258918, "epoch": 3119} {"train_loss": -24.851398468017578, "global_step": 258919, "epoch": 3119} {"train_loss": -25.187421798706055, "global_step": 258920, "epoch": 3119} {"train_loss": -25.306549072265625, "global_step": 258921, "epoch": 3119} {"train_loss": -25.26763153076172, "global_step": 258922, "epoch": 3119} {"train_loss": -25.3193416595459, "global_step": 258923, "epoch": 3119} {"train_loss": -25.515962600708008, "global_step": 258924, "epoch": 3119} {"train_loss": -25.024560928344727, "global_step": 258925, "epoch": 3119} {"train_loss": -25.225465774536133, "global_step": 258926, "epoch": 3119} {"train_loss": -25.169858932495117, "global_step": 258927, "epoch": 3119} {"train_loss": -25.44670295715332, "global_step": 258928, "epoch": 3119} {"train_loss": -24.973796844482422, "global_step": 258929, "epoch": 3119} {"train_loss": -25.216821670532227, "global_step": 258930, "epoch": 3119} {"train_loss": -25.250844955444336, "global_step": 258931, "epoch": 3119} {"train_loss": -25.287412643432617, "global_step": 258932, "epoch": 3119} {"train_loss": -24.982744216918945, "global_step": 258933, "epoch": 3119} {"train_loss": -25.37853240966797, "global_step": 258934, "epoch": 3119} {"train_loss": -24.97542381286621, "global_step": 258935, "epoch": 3119} {"train_loss": -25.260068893432617, "global_step": 258936, "epoch": 3119} {"train_loss": -25.33719825744629, "global_step": 258937, "epoch": 3119} {"train_loss": -25.272184371948242, "global_step": 258938, "epoch": 3119} {"train_loss": -25.010313034057617, "global_step": 258939, "epoch": 3119} {"train_loss": -24.89544105529785, "global_step": 258940, "epoch": 3119} {"train_loss": -25.096834182739258, "global_step": 258941, "epoch": 3119} {"train_loss": -25.201034545898438, "global_step": 258942, "epoch": 3119} {"train_loss": -25.303525924682617, "global_step": 258943, "epoch": 3119} {"train_loss": -25.250707626342773, "global_step": 258944, "epoch": 3119} {"train_loss": -25.4310359954834, "global_step": 258945, "epoch": 3119} {"train_loss": -25.21577262878418, "global_step": 258946, "epoch": 3119} {"train_loss": -24.882287979125977, "global_step": 258947, "epoch": 3119} {"train_loss": -25.184873580932617, "global_step": 258948, "epoch": 3119} {"train_loss": -25.32846450805664, "global_step": 258949, "epoch": 3119} {"train_loss": -25.234098434448242, "global_step": 258950, "epoch": 3119} {"train_loss": -25.325969696044922, "global_step": 258951, "epoch": 3119} {"train_loss": -25.15492820739746, "global_step": 258952, "epoch": 3119} {"train_loss": -24.894107818603516, "global_step": 258953, "epoch": 3119} {"train_loss": -25.405935287475586, "global_step": 258954, "epoch": 3119} {"train_loss": -24.88311195373535, "global_step": 258955, "epoch": 3119} {"train_loss": -25.260236740112305, "global_step": 258956, "epoch": 3119} {"train_loss": -25.358335494995117, "global_step": 258957, "epoch": 3119} {"train_loss": -25.21390724182129, "global_step": 258958, "epoch": 3119} {"train_loss": -25.15811894887901, "global_step": 258959, "epoch": 3119, "val_loss": 6819520.0} {"train_loss": -24.619094848632812, "global_step": 258960, "epoch": 3120} {"train_loss": -24.945226669311523, "global_step": 258961, "epoch": 3120} {"train_loss": -25.06095314025879, "global_step": 258962, "epoch": 3120} {"train_loss": -24.64266014099121, "global_step": 258963, "epoch": 3120} {"train_loss": -24.523466110229492, "global_step": 258964, "epoch": 3120} {"train_loss": -24.689477920532227, "global_step": 258965, "epoch": 3120} {"train_loss": -24.664106369018555, "global_step": 258966, "epoch": 3120} {"train_loss": -24.388744354248047, "global_step": 258967, "epoch": 3120} {"train_loss": -24.796518325805664, "global_step": 258968, "epoch": 3120} {"train_loss": -24.72570037841797, "global_step": 258969, "epoch": 3120} {"train_loss": -24.48331642150879, "global_step": 258970, "epoch": 3120} {"train_loss": -24.975448608398438, "global_step": 258971, "epoch": 3120} {"train_loss": -24.70082664489746, "global_step": 258972, "epoch": 3120} {"train_loss": -25.127012252807617, "global_step": 258973, "epoch": 3120} {"train_loss": -24.836124420166016, "global_step": 258974, "epoch": 3120} {"train_loss": -24.714536666870117, "global_step": 258975, "epoch": 3120} {"train_loss": -24.591442108154297, "global_step": 258976, "epoch": 3120} {"train_loss": -25.15995216369629, "global_step": 258977, "epoch": 3120} {"train_loss": -25.017621994018555, "global_step": 258978, "epoch": 3120} {"train_loss": -25.150348663330078, "global_step": 258979, "epoch": 3120} {"train_loss": -24.92494010925293, "global_step": 258980, "epoch": 3120} {"train_loss": -24.9348201751709, "global_step": 258981, "epoch": 3120} {"train_loss": -25.23301887512207, "global_step": 258982, "epoch": 3120} {"train_loss": -25.100004196166992, "global_step": 258983, "epoch": 3120} {"train_loss": -25.377321243286133, "global_step": 258984, "epoch": 3120} {"train_loss": -24.986175537109375, "global_step": 258985, "epoch": 3120} {"train_loss": -25.060216903686523, "global_step": 258986, "epoch": 3120} {"train_loss": -24.94275665283203, "global_step": 258987, "epoch": 3120} {"train_loss": -25.03899383544922, "global_step": 258988, "epoch": 3120} {"train_loss": -25.2294979095459, "global_step": 258989, "epoch": 3120} {"train_loss": -25.00567054748535, "global_step": 258990, "epoch": 3120} {"train_loss": -25.108291625976562, "global_step": 258991, "epoch": 3120} {"train_loss": -24.963088989257812, "global_step": 258992, "epoch": 3120} {"train_loss": -24.709739685058594, "global_step": 258993, "epoch": 3120} {"train_loss": -25.189313888549805, "global_step": 258994, "epoch": 3120} {"train_loss": -25.098203659057617, "global_step": 258995, "epoch": 3120} {"train_loss": -25.248952865600586, "global_step": 258996, "epoch": 3120} {"train_loss": -25.042118072509766, "global_step": 258997, "epoch": 3120} {"train_loss": -24.854633331298828, "global_step": 258998, "epoch": 3120} {"train_loss": -25.432971954345703, "global_step": 258999, "epoch": 3120} {"train_loss": -24.980926513671875, "global_step": 259000, "epoch": 3120} {"train_loss": -25.035608291625977, "global_step": 259001, "epoch": 3120} {"train_loss": -25.194957733154297, "global_step": 259002, "epoch": 3120} {"train_loss": -24.955413818359375, "global_step": 259003, "epoch": 3120} {"train_loss": -25.4000244140625, "global_step": 259004, "epoch": 3120} {"train_loss": -25.144834518432617, "global_step": 259005, "epoch": 3120} {"train_loss": -24.745620727539062, "global_step": 259006, "epoch": 3120} {"train_loss": -25.248790740966797, "global_step": 259007, "epoch": 3120} {"train_loss": -25.028823852539062, "global_step": 259008, "epoch": 3120} {"train_loss": -25.419248580932617, "global_step": 259009, "epoch": 3120} {"train_loss": -25.250770568847656, "global_step": 259010, "epoch": 3120} {"train_loss": -25.25251579284668, "global_step": 259011, "epoch": 3120} {"train_loss": -24.951921463012695, "global_step": 259012, "epoch": 3120} {"train_loss": -24.81017303466797, "global_step": 259013, "epoch": 3120} {"train_loss": -25.37843894958496, "global_step": 259014, "epoch": 3120} {"train_loss": -25.06407356262207, "global_step": 259015, "epoch": 3120} {"train_loss": -24.941648483276367, "global_step": 259016, "epoch": 3120} {"train_loss": -24.66855239868164, "global_step": 259017, "epoch": 3120} {"train_loss": -25.050119400024414, "global_step": 259018, "epoch": 3120} {"train_loss": -25.133047103881836, "global_step": 259019, "epoch": 3120} {"train_loss": -25.190698623657227, "global_step": 259020, "epoch": 3120} {"train_loss": -25.328584671020508, "global_step": 259021, "epoch": 3120} {"train_loss": -25.096866607666016, "global_step": 259022, "epoch": 3120} {"train_loss": -25.44631576538086, "global_step": 259023, "epoch": 3120} {"train_loss": -25.144790649414062, "global_step": 259024, "epoch": 3120} {"train_loss": -25.174278259277344, "global_step": 259025, "epoch": 3120} {"train_loss": -25.21392822265625, "global_step": 259026, "epoch": 3120} {"train_loss": -25.05914878845215, "global_step": 259027, "epoch": 3120} {"train_loss": -25.147974014282227, "global_step": 259028, "epoch": 3120} {"train_loss": -25.114938735961914, "global_step": 259029, "epoch": 3120} {"train_loss": -24.976043701171875, "global_step": 259030, "epoch": 3120} {"train_loss": -24.925392150878906, "global_step": 259031, "epoch": 3120} {"train_loss": -24.991044998168945, "global_step": 259032, "epoch": 3120} {"train_loss": -25.10271644592285, "global_step": 259033, "epoch": 3120} {"train_loss": -25.24586296081543, "global_step": 259034, "epoch": 3120} {"train_loss": -24.854978561401367, "global_step": 259035, "epoch": 3120} {"train_loss": -24.739370346069336, "global_step": 259036, "epoch": 3120} {"train_loss": -24.58429527282715, "global_step": 259037, "epoch": 3120} {"train_loss": -25.369516372680664, "global_step": 259038, "epoch": 3120} {"train_loss": -24.79644775390625, "global_step": 259039, "epoch": 3120} {"train_loss": -24.42337989807129, "global_step": 259040, "epoch": 3120} {"train_loss": -25.032028198242188, "global_step": 259041, "epoch": 3120} {"train_loss": -25.003854016223585, "global_step": 259042, "epoch": 3120, "val_loss": 6954425.0} {"train_loss": -24.558225631713867, "global_step": 259043, "epoch": 3121} {"train_loss": -24.888919830322266, "global_step": 259044, "epoch": 3121} {"train_loss": -24.925777435302734, "global_step": 259045, "epoch": 3121} {"train_loss": -24.73322105407715, "global_step": 259046, "epoch": 3121} {"train_loss": -24.750995635986328, "global_step": 259047, "epoch": 3121} {"train_loss": -24.72585678100586, "global_step": 259048, "epoch": 3121} {"train_loss": -24.851970672607422, "global_step": 259049, "epoch": 3121} {"train_loss": -24.72882080078125, "global_step": 259050, "epoch": 3121} {"train_loss": -24.492374420166016, "global_step": 259051, "epoch": 3121} {"train_loss": -25.301101684570312, "global_step": 259052, "epoch": 3121} {"train_loss": -24.64766502380371, "global_step": 259053, "epoch": 3121} {"train_loss": -24.665542602539062, "global_step": 259054, "epoch": 3121} {"train_loss": -25.146970748901367, "global_step": 259055, "epoch": 3121} {"train_loss": -24.960556030273438, "global_step": 259056, "epoch": 3121} {"train_loss": -24.858423233032227, "global_step": 259057, "epoch": 3121} {"train_loss": -24.76558494567871, "global_step": 259058, "epoch": 3121} {"train_loss": -25.011037826538086, "global_step": 259059, "epoch": 3121} {"train_loss": -25.546314239501953, "global_step": 259060, "epoch": 3121} {"train_loss": -25.253738403320312, "global_step": 259061, "epoch": 3121} {"train_loss": -24.901201248168945, "global_step": 259062, "epoch": 3121} {"train_loss": -25.03127098083496, "global_step": 259063, "epoch": 3121} {"train_loss": -24.986507415771484, "global_step": 259064, "epoch": 3121} {"train_loss": -25.250471115112305, "global_step": 259065, "epoch": 3121} {"train_loss": -25.060672760009766, "global_step": 259066, "epoch": 3121} {"train_loss": -25.080381393432617, "global_step": 259067, "epoch": 3121} {"train_loss": -25.34067153930664, "global_step": 259068, "epoch": 3121} {"train_loss": -25.006271362304688, "global_step": 259069, "epoch": 3121} {"train_loss": -24.849727630615234, "global_step": 259070, "epoch": 3121} {"train_loss": -24.955053329467773, "global_step": 259071, "epoch": 3121} {"train_loss": -25.318307876586914, "global_step": 259072, "epoch": 3121} {"train_loss": -25.241392135620117, "global_step": 259073, "epoch": 3121} {"train_loss": -25.633380889892578, "global_step": 259074, "epoch": 3121} {"train_loss": -25.29685401916504, "global_step": 259075, "epoch": 3121} {"train_loss": -25.33982276916504, "global_step": 259076, "epoch": 3121} {"train_loss": -25.54441261291504, "global_step": 259077, "epoch": 3121} {"train_loss": -25.122142791748047, "global_step": 259078, "epoch": 3121} {"train_loss": -24.914691925048828, "global_step": 259079, "epoch": 3121} {"train_loss": -25.222726821899414, "global_step": 259080, "epoch": 3121} {"train_loss": -25.58745002746582, "global_step": 259081, "epoch": 3121} {"train_loss": -25.107196807861328, "global_step": 259082, "epoch": 3121} {"train_loss": -25.3437557220459, "global_step": 259083, "epoch": 3121} {"train_loss": -25.06217384338379, "global_step": 259084, "epoch": 3121} {"train_loss": -25.20832061767578, "global_step": 259085, "epoch": 3121} {"train_loss": -25.299856185913086, "global_step": 259086, "epoch": 3121} {"train_loss": -25.4019832611084, "global_step": 259087, "epoch": 3121} {"train_loss": -25.290433883666992, "global_step": 259088, "epoch": 3121} {"train_loss": -25.24131965637207, "global_step": 259089, "epoch": 3121} {"train_loss": -25.169050216674805, "global_step": 259090, "epoch": 3121} {"train_loss": -25.07503318786621, "global_step": 259091, "epoch": 3121} {"train_loss": -24.639389038085938, "global_step": 259092, "epoch": 3121} {"train_loss": -24.692047119140625, "global_step": 259093, "epoch": 3121} {"train_loss": -24.205276489257812, "global_step": 259094, "epoch": 3121} {"train_loss": -24.398542404174805, "global_step": 259095, "epoch": 3121} {"train_loss": -25.0969295501709, "global_step": 259096, "epoch": 3121} {"train_loss": -24.9176082611084, "global_step": 259097, "epoch": 3121} {"train_loss": -24.856603622436523, "global_step": 259098, "epoch": 3121} {"train_loss": -24.98046875, "global_step": 259099, "epoch": 3121} {"train_loss": -24.720584869384766, "global_step": 259100, "epoch": 3121} {"train_loss": -25.170564651489258, "global_step": 259101, "epoch": 3121} {"train_loss": -24.9567928314209, "global_step": 259102, "epoch": 3121} {"train_loss": -24.776037216186523, "global_step": 259103, "epoch": 3121} {"train_loss": -24.706310272216797, "global_step": 259104, "epoch": 3121} {"train_loss": -24.580429077148438, "global_step": 259105, "epoch": 3121} {"train_loss": -25.3146915435791, "global_step": 259106, "epoch": 3121} {"train_loss": -24.61128807067871, "global_step": 259107, "epoch": 3121} {"train_loss": -25.43622398376465, "global_step": 259108, "epoch": 3121} {"train_loss": -24.932308197021484, "global_step": 259109, "epoch": 3121} {"train_loss": -25.11336326599121, "global_step": 259110, "epoch": 3121} {"train_loss": -25.041807174682617, "global_step": 259111, "epoch": 3121} {"train_loss": -25.04058265686035, "global_step": 259112, "epoch": 3121} {"train_loss": -25.36643409729004, "global_step": 259113, "epoch": 3121} {"train_loss": -25.2310733795166, "global_step": 259114, "epoch": 3121} {"train_loss": -24.67274284362793, "global_step": 259115, "epoch": 3121} {"train_loss": -25.11098289489746, "global_step": 259116, "epoch": 3121} {"train_loss": -25.056806564331055, "global_step": 259117, "epoch": 3121} {"train_loss": -25.333499908447266, "global_step": 259118, "epoch": 3121} {"train_loss": -25.08963966369629, "global_step": 259119, "epoch": 3121} {"train_loss": -25.407941818237305, "global_step": 259120, "epoch": 3121} {"train_loss": -25.000568389892578, "global_step": 259121, "epoch": 3121} {"train_loss": -25.213825225830078, "global_step": 259122, "epoch": 3121} {"train_loss": -25.368757247924805, "global_step": 259123, "epoch": 3121} {"train_loss": -25.009292602539062, "global_step": 259124, "epoch": 3121} {"train_loss": -25.04340185602027, "global_step": 259125, "epoch": 3121, "val_loss": 6860376.0} {"train_loss": -24.113718032836914, "global_step": 259126, "epoch": 3122} {"train_loss": -24.30190658569336, "global_step": 259127, "epoch": 3122} {"train_loss": -24.4635009765625, "global_step": 259128, "epoch": 3122} {"train_loss": -24.89033317565918, "global_step": 259129, "epoch": 3122} {"train_loss": -24.864564895629883, "global_step": 259130, "epoch": 3122} {"train_loss": -24.745664596557617, "global_step": 259131, "epoch": 3122} {"train_loss": -24.81978416442871, "global_step": 259132, "epoch": 3122} {"train_loss": -23.960559844970703, "global_step": 259133, "epoch": 3122} {"train_loss": -24.72533416748047, "global_step": 259134, "epoch": 3122} {"train_loss": -24.66238784790039, "global_step": 259135, "epoch": 3122} {"train_loss": -24.398120880126953, "global_step": 259136, "epoch": 3122} {"train_loss": -24.840789794921875, "global_step": 259137, "epoch": 3122} {"train_loss": -24.640216827392578, "global_step": 259138, "epoch": 3122} {"train_loss": -24.937955856323242, "global_step": 259139, "epoch": 3122} {"train_loss": -24.83168601989746, "global_step": 259140, "epoch": 3122} {"train_loss": -25.24147605895996, "global_step": 259141, "epoch": 3122} {"train_loss": -24.80592155456543, "global_step": 259142, "epoch": 3122} {"train_loss": -25.14265251159668, "global_step": 259143, "epoch": 3122} {"train_loss": -24.601520538330078, "global_step": 259144, "epoch": 3122} {"train_loss": -24.742111206054688, "global_step": 259145, "epoch": 3122} {"train_loss": -24.93025016784668, "global_step": 259146, "epoch": 3122} {"train_loss": -24.573652267456055, "global_step": 259147, "epoch": 3122} {"train_loss": -24.721830368041992, "global_step": 259148, "epoch": 3122} {"train_loss": -25.083372116088867, "global_step": 259149, "epoch": 3122} {"train_loss": -25.103487014770508, "global_step": 259150, "epoch": 3122} {"train_loss": -25.010786056518555, "global_step": 259151, "epoch": 3122} {"train_loss": -25.292593002319336, "global_step": 259152, "epoch": 3122} {"train_loss": -25.215024948120117, "global_step": 259153, "epoch": 3122} {"train_loss": -25.068769454956055, "global_step": 259154, "epoch": 3122} {"train_loss": -25.080907821655273, "global_step": 259155, "epoch": 3122} {"train_loss": -24.896976470947266, "global_step": 259156, "epoch": 3122} {"train_loss": -24.819799423217773, "global_step": 259157, "epoch": 3122} {"train_loss": -25.319421768188477, "global_step": 259158, "epoch": 3122} {"train_loss": -24.99627113342285, "global_step": 259159, "epoch": 3122} {"train_loss": -24.721923828125, "global_step": 259160, "epoch": 3122} {"train_loss": -25.42732048034668, "global_step": 259161, "epoch": 3122} {"train_loss": -25.27939224243164, "global_step": 259162, "epoch": 3122} {"train_loss": -25.096500396728516, "global_step": 259163, "epoch": 3122} {"train_loss": -24.9910831451416, "global_step": 259164, "epoch": 3122} {"train_loss": -24.912321090698242, "global_step": 259165, "epoch": 3122} {"train_loss": -25.097177505493164, "global_step": 259166, "epoch": 3122} {"train_loss": -24.95982551574707, "global_step": 259167, "epoch": 3122} {"train_loss": -25.090225219726562, "global_step": 259168, "epoch": 3122} {"train_loss": -24.84079360961914, "global_step": 259169, "epoch": 3122} {"train_loss": -24.86932945251465, "global_step": 259170, "epoch": 3122} {"train_loss": -25.27750015258789, "global_step": 259171, "epoch": 3122} {"train_loss": -25.078821182250977, "global_step": 259172, "epoch": 3122} {"train_loss": -24.711334228515625, "global_step": 259173, "epoch": 3122} {"train_loss": -25.135746002197266, "global_step": 259174, "epoch": 3122} {"train_loss": -25.318614959716797, "global_step": 259175, "epoch": 3122} {"train_loss": -24.908035278320312, "global_step": 259176, "epoch": 3122} {"train_loss": -25.06867790222168, "global_step": 259177, "epoch": 3122} {"train_loss": -24.6981201171875, "global_step": 259178, "epoch": 3122} {"train_loss": -25.070249557495117, "global_step": 259179, "epoch": 3122} {"train_loss": -25.65058708190918, "global_step": 259180, "epoch": 3122} {"train_loss": -25.265653610229492, "global_step": 259181, "epoch": 3122} {"train_loss": -25.261444091796875, "global_step": 259182, "epoch": 3122} {"train_loss": -24.978418350219727, "global_step": 259183, "epoch": 3122} {"train_loss": -25.06180191040039, "global_step": 259184, "epoch": 3122} {"train_loss": -24.84714126586914, "global_step": 259185, "epoch": 3122} {"train_loss": -24.937849044799805, "global_step": 259186, "epoch": 3122} {"train_loss": -24.94769859313965, "global_step": 259187, "epoch": 3122} {"train_loss": -24.920995712280273, "global_step": 259188, "epoch": 3122} {"train_loss": -24.800491333007812, "global_step": 259189, "epoch": 3122} {"train_loss": -25.22774887084961, "global_step": 259190, "epoch": 3122} {"train_loss": -25.150728225708008, "global_step": 259191, "epoch": 3122} {"train_loss": -25.301288604736328, "global_step": 259192, "epoch": 3122} {"train_loss": -25.117801666259766, "global_step": 259193, "epoch": 3122} {"train_loss": -25.423795700073242, "global_step": 259194, "epoch": 3122} {"train_loss": -25.160188674926758, "global_step": 259195, "epoch": 3122} {"train_loss": -25.26729393005371, "global_step": 259196, "epoch": 3122} {"train_loss": -25.169748306274414, "global_step": 259197, "epoch": 3122} {"train_loss": -25.36481475830078, "global_step": 259198, "epoch": 3122} {"train_loss": -25.11640167236328, "global_step": 259199, "epoch": 3122} {"train_loss": -25.215377807617188, "global_step": 259200, "epoch": 3122} {"train_loss": -25.246234893798828, "global_step": 259201, "epoch": 3122} {"train_loss": -25.397205352783203, "global_step": 259202, "epoch": 3122} {"train_loss": -25.11016273498535, "global_step": 259203, "epoch": 3122} {"train_loss": -25.275266647338867, "global_step": 259204, "epoch": 3122} {"train_loss": -24.872549057006836, "global_step": 259205, "epoch": 3122} {"train_loss": -25.200925827026367, "global_step": 259206, "epoch": 3122} {"train_loss": -25.243619918823242, "global_step": 259207, "epoch": 3122} {"train_loss": -24.988002570278674, "global_step": 259208, "epoch": 3122, "val_loss": 6961104.0} {"train_loss": -24.2130069732666, "global_step": 259209, "epoch": 3123} {"train_loss": -23.239728927612305, "global_step": 259210, "epoch": 3123} {"train_loss": -24.212011337280273, "global_step": 259211, "epoch": 3123} {"train_loss": -23.39888572692871, "global_step": 259212, "epoch": 3123} {"train_loss": -24.255956649780273, "global_step": 259213, "epoch": 3123} {"train_loss": -23.760622024536133, "global_step": 259214, "epoch": 3123} {"train_loss": -24.25404930114746, "global_step": 259215, "epoch": 3123} {"train_loss": -23.993606567382812, "global_step": 259216, "epoch": 3123} {"train_loss": -24.367027282714844, "global_step": 259217, "epoch": 3123} {"train_loss": -24.28417205810547, "global_step": 259218, "epoch": 3123} {"train_loss": -24.18927764892578, "global_step": 259219, "epoch": 3123} {"train_loss": -24.389944076538086, "global_step": 259220, "epoch": 3123} {"train_loss": -24.672834396362305, "global_step": 259221, "epoch": 3123} {"train_loss": -24.3023681640625, "global_step": 259222, "epoch": 3123} {"train_loss": -24.111665725708008, "global_step": 259223, "epoch": 3123} {"train_loss": -24.50782585144043, "global_step": 259224, "epoch": 3123} {"train_loss": -24.45001792907715, "global_step": 259225, "epoch": 3123} {"train_loss": -24.639463424682617, "global_step": 259226, "epoch": 3123} {"train_loss": -24.811386108398438, "global_step": 259227, "epoch": 3123} {"train_loss": -24.601890563964844, "global_step": 259228, "epoch": 3123} {"train_loss": -24.92702865600586, "global_step": 259229, "epoch": 3123} {"train_loss": -24.55104637145996, "global_step": 259230, "epoch": 3123} {"train_loss": -24.6109561920166, "global_step": 259231, "epoch": 3123} {"train_loss": -24.699831008911133, "global_step": 259232, "epoch": 3123} {"train_loss": -24.92225456237793, "global_step": 259233, "epoch": 3123} {"train_loss": -24.564697265625, "global_step": 259234, "epoch": 3123} {"train_loss": -24.885900497436523, "global_step": 259235, "epoch": 3123} {"train_loss": -24.938390731811523, "global_step": 259236, "epoch": 3123} {"train_loss": -24.75189781188965, "global_step": 259237, "epoch": 3123} {"train_loss": -24.721940994262695, "global_step": 259238, "epoch": 3123} {"train_loss": -25.003713607788086, "global_step": 259239, "epoch": 3123} {"train_loss": -25.017847061157227, "global_step": 259240, "epoch": 3123} {"train_loss": -24.95204734802246, "global_step": 259241, "epoch": 3123} {"train_loss": -25.064544677734375, "global_step": 259242, "epoch": 3123} {"train_loss": -24.804367065429688, "global_step": 259243, "epoch": 3123} {"train_loss": -24.97992706298828, "global_step": 259244, "epoch": 3123} {"train_loss": -24.907764434814453, "global_step": 259245, "epoch": 3123} {"train_loss": -24.99492645263672, "global_step": 259246, "epoch": 3123} {"train_loss": -24.9801025390625, "global_step": 259247, "epoch": 3123} {"train_loss": -24.8237361907959, "global_step": 259248, "epoch": 3123} {"train_loss": -25.068002700805664, "global_step": 259249, "epoch": 3123} {"train_loss": -24.936857223510742, "global_step": 259250, "epoch": 3123} {"train_loss": -25.836627960205078, "global_step": 259251, "epoch": 3123} {"train_loss": -24.931303024291992, "global_step": 259252, "epoch": 3123} {"train_loss": -25.0053653717041, "global_step": 259253, "epoch": 3123} {"train_loss": -25.19087028503418, "global_step": 259254, "epoch": 3123} {"train_loss": -25.220884323120117, "global_step": 259255, "epoch": 3123} {"train_loss": -25.55048179626465, "global_step": 259256, "epoch": 3123} {"train_loss": -24.85079574584961, "global_step": 259257, "epoch": 3123} {"train_loss": -24.7622127532959, "global_step": 259258, "epoch": 3123} {"train_loss": -25.272985458374023, "global_step": 259259, "epoch": 3123} {"train_loss": -25.3471622467041, "global_step": 259260, "epoch": 3123} {"train_loss": -25.325271606445312, "global_step": 259261, "epoch": 3123} {"train_loss": -25.261463165283203, "global_step": 259262, "epoch": 3123} {"train_loss": -25.03585433959961, "global_step": 259263, "epoch": 3123} {"train_loss": -25.483875274658203, "global_step": 259264, "epoch": 3123} {"train_loss": -25.175369262695312, "global_step": 259265, "epoch": 3123} {"train_loss": -25.129684448242188, "global_step": 259266, "epoch": 3123} {"train_loss": -25.333471298217773, "global_step": 259267, "epoch": 3123} {"train_loss": -25.066898345947266, "global_step": 259268, "epoch": 3123} {"train_loss": -25.123395919799805, "global_step": 259269, "epoch": 3123} {"train_loss": -25.251220703125, "global_step": 259270, "epoch": 3123} {"train_loss": -24.935409545898438, "global_step": 259271, "epoch": 3123} {"train_loss": -25.32413101196289, "global_step": 259272, "epoch": 3123} {"train_loss": -25.174589157104492, "global_step": 259273, "epoch": 3123} {"train_loss": -25.254003524780273, "global_step": 259274, "epoch": 3123} {"train_loss": -25.15007972717285, "global_step": 259275, "epoch": 3123} {"train_loss": -25.516338348388672, "global_step": 259276, "epoch": 3123} {"train_loss": -24.918981552124023, "global_step": 259277, "epoch": 3123} {"train_loss": -25.196332931518555, "global_step": 259278, "epoch": 3123} {"train_loss": -25.127267837524414, "global_step": 259279, "epoch": 3123} {"train_loss": -25.38063621520996, "global_step": 259280, "epoch": 3123} {"train_loss": -25.209108352661133, "global_step": 259281, "epoch": 3123} {"train_loss": -24.94915008544922, "global_step": 259282, "epoch": 3123} {"train_loss": -25.188600540161133, "global_step": 259283, "epoch": 3123} {"train_loss": -25.317890167236328, "global_step": 259284, "epoch": 3123} {"train_loss": -25.473875045776367, "global_step": 259285, "epoch": 3123} {"train_loss": -24.926572799682617, "global_step": 259286, "epoch": 3123} {"train_loss": -24.932226181030273, "global_step": 259287, "epoch": 3123} {"train_loss": -25.518234252929688, "global_step": 259288, "epoch": 3123} {"train_loss": -25.167280197143555, "global_step": 259289, "epoch": 3123} {"train_loss": -24.81482696533203, "global_step": 259290, "epoch": 3123} {"train_loss": -24.882875166743634, "global_step": 259291, "epoch": 3123, "val_loss": 7005389.0} {"train_loss": -24.751874923706055, "global_step": 259292, "epoch": 3124} {"train_loss": -25.209125518798828, "global_step": 259293, "epoch": 3124} {"train_loss": -24.914981842041016, "global_step": 259294, "epoch": 3124} {"train_loss": -24.3378849029541, "global_step": 259295, "epoch": 3124} {"train_loss": -24.232553482055664, "global_step": 259296, "epoch": 3124} {"train_loss": -24.133535385131836, "global_step": 259297, "epoch": 3124} {"train_loss": -24.23335838317871, "global_step": 259298, "epoch": 3124} {"train_loss": -24.790136337280273, "global_step": 259299, "epoch": 3124} {"train_loss": -24.58148193359375, "global_step": 259300, "epoch": 3124} {"train_loss": -24.061426162719727, "global_step": 259301, "epoch": 3124} {"train_loss": -24.23964500427246, "global_step": 259302, "epoch": 3124} {"train_loss": -24.423913955688477, "global_step": 259303, "epoch": 3124} {"train_loss": -24.040231704711914, "global_step": 259304, "epoch": 3124} {"train_loss": -23.96380043029785, "global_step": 259305, "epoch": 3124} {"train_loss": -24.825475692749023, "global_step": 259306, "epoch": 3124} {"train_loss": -24.542972564697266, "global_step": 259307, "epoch": 3124} {"train_loss": -25.114286422729492, "global_step": 259308, "epoch": 3124} {"train_loss": -24.2865047454834, "global_step": 259309, "epoch": 3124} {"train_loss": -24.236919403076172, "global_step": 259310, "epoch": 3124} {"train_loss": -24.493762969970703, "global_step": 259311, "epoch": 3124} {"train_loss": -24.83540153503418, "global_step": 259312, "epoch": 3124} {"train_loss": -24.58721351623535, "global_step": 259313, "epoch": 3124} {"train_loss": -24.6117000579834, "global_step": 259314, "epoch": 3124} {"train_loss": -25.071264266967773, "global_step": 259315, "epoch": 3124} {"train_loss": -24.70263671875, "global_step": 259316, "epoch": 3124} {"train_loss": -25.40119743347168, "global_step": 259317, "epoch": 3124} {"train_loss": -25.221235275268555, "global_step": 259318, "epoch": 3124} {"train_loss": -25.141357421875, "global_step": 259319, "epoch": 3124} {"train_loss": -25.019956588745117, "global_step": 259320, "epoch": 3124} {"train_loss": -25.183454513549805, "global_step": 259321, "epoch": 3124} {"train_loss": -25.291128158569336, "global_step": 259322, "epoch": 3124} {"train_loss": -25.01875114440918, "global_step": 259323, "epoch": 3124} {"train_loss": -24.90198516845703, "global_step": 259324, "epoch": 3124} {"train_loss": -24.829391479492188, "global_step": 259325, "epoch": 3124} {"train_loss": -25.146499633789062, "global_step": 259326, "epoch": 3124} {"train_loss": -24.984167098999023, "global_step": 259327, "epoch": 3124} {"train_loss": -24.844709396362305, "global_step": 259328, "epoch": 3124} {"train_loss": -25.233076095581055, "global_step": 259329, "epoch": 3124} {"train_loss": -25.176002502441406, "global_step": 259330, "epoch": 3124} {"train_loss": -25.2033748626709, "global_step": 259331, "epoch": 3124} {"train_loss": -24.92988395690918, "global_step": 259332, "epoch": 3124} {"train_loss": -25.28350257873535, "global_step": 259333, "epoch": 3124} {"train_loss": -25.226165771484375, "global_step": 259334, "epoch": 3124} {"train_loss": -25.12147331237793, "global_step": 259335, "epoch": 3124} {"train_loss": -25.3757381439209, "global_step": 259336, "epoch": 3124} {"train_loss": -25.226415634155273, "global_step": 259337, "epoch": 3124} {"train_loss": -25.066373825073242, "global_step": 259338, "epoch": 3124} {"train_loss": -25.13136100769043, "global_step": 259339, "epoch": 3124} {"train_loss": -25.248554229736328, "global_step": 259340, "epoch": 3124} {"train_loss": -25.767852783203125, "global_step": 259341, "epoch": 3124} {"train_loss": -25.136274337768555, "global_step": 259342, "epoch": 3124} {"train_loss": -25.162931442260742, "global_step": 259343, "epoch": 3124} {"train_loss": -25.188695907592773, "global_step": 259344, "epoch": 3124} {"train_loss": -25.204999923706055, "global_step": 259345, "epoch": 3124} {"train_loss": -25.11952781677246, "global_step": 259346, "epoch": 3124} {"train_loss": -25.156208038330078, "global_step": 259347, "epoch": 3124} {"train_loss": -25.075653076171875, "global_step": 259348, "epoch": 3124} {"train_loss": -25.116207122802734, "global_step": 259349, "epoch": 3124} {"train_loss": -25.205522537231445, "global_step": 259350, "epoch": 3124} {"train_loss": -25.167226791381836, "global_step": 259351, "epoch": 3124} {"train_loss": -25.01383399963379, "global_step": 259352, "epoch": 3124} {"train_loss": -25.56529998779297, "global_step": 259353, "epoch": 3124} {"train_loss": -25.212434768676758, "global_step": 259354, "epoch": 3124} {"train_loss": -24.96004295349121, "global_step": 259355, "epoch": 3124} {"train_loss": -24.923126220703125, "global_step": 259356, "epoch": 3124} {"train_loss": -25.02039909362793, "global_step": 259357, "epoch": 3124} {"train_loss": -24.882400512695312, "global_step": 259358, "epoch": 3124} {"train_loss": -25.473251342773438, "global_step": 259359, "epoch": 3124} {"train_loss": -25.17383575439453, "global_step": 259360, "epoch": 3124} {"train_loss": -25.204273223876953, "global_step": 259361, "epoch": 3124} {"train_loss": -24.8508358001709, "global_step": 259362, "epoch": 3124} {"train_loss": -25.44603157043457, "global_step": 259363, "epoch": 3124} {"train_loss": -25.04947853088379, "global_step": 259364, "epoch": 3124} {"train_loss": -25.43841552734375, "global_step": 259365, "epoch": 3124} {"train_loss": -25.24285316467285, "global_step": 259366, "epoch": 3124} {"train_loss": -25.201549530029297, "global_step": 259367, "epoch": 3124} {"train_loss": -24.587432861328125, "global_step": 259368, "epoch": 3124} {"train_loss": -24.719953536987305, "global_step": 259369, "epoch": 3124} {"train_loss": -25.102691650390625, "global_step": 259370, "epoch": 3124} {"train_loss": -25.006261825561523, "global_step": 259371, "epoch": 3124} {"train_loss": -24.914453506469727, "global_step": 259372, "epoch": 3124} {"train_loss": -24.98525047302246, "global_step": 259373, "epoch": 3124} {"train_loss": -24.95659878742264, "global_step": 259374, "epoch": 3124, "val_loss": 6899466.0} {"train_loss": -24.7365779876709, "global_step": 259375, "epoch": 3125} {"train_loss": -24.422204971313477, "global_step": 259376, "epoch": 3125} {"train_loss": -24.913700103759766, "global_step": 259377, "epoch": 3125} {"train_loss": -24.582380294799805, "global_step": 259378, "epoch": 3125} {"train_loss": -24.63273048400879, "global_step": 259379, "epoch": 3125} {"train_loss": -24.790929794311523, "global_step": 259380, "epoch": 3125} {"train_loss": -24.894521713256836, "global_step": 259381, "epoch": 3125} {"train_loss": -24.85054588317871, "global_step": 259382, "epoch": 3125} {"train_loss": -24.896305084228516, "global_step": 259383, "epoch": 3125} {"train_loss": -24.882427215576172, "global_step": 259384, "epoch": 3125} {"train_loss": -25.01017951965332, "global_step": 259385, "epoch": 3125} {"train_loss": -24.547256469726562, "global_step": 259386, "epoch": 3125} {"train_loss": -24.650848388671875, "global_step": 259387, "epoch": 3125} {"train_loss": -25.122426986694336, "global_step": 259388, "epoch": 3125} {"train_loss": -24.92578125, "global_step": 259389, "epoch": 3125} {"train_loss": -24.80803871154785, "global_step": 259390, "epoch": 3125} {"train_loss": -25.00151252746582, "global_step": 259391, "epoch": 3125} {"train_loss": -25.073286056518555, "global_step": 259392, "epoch": 3125} {"train_loss": -25.270160675048828, "global_step": 259393, "epoch": 3125} {"train_loss": -25.251672744750977, "global_step": 259394, "epoch": 3125} {"train_loss": -24.889114379882812, "global_step": 259395, "epoch": 3125} {"train_loss": -24.740737915039062, "global_step": 259396, "epoch": 3125} {"train_loss": -25.37869644165039, "global_step": 259397, "epoch": 3125} {"train_loss": -25.031719207763672, "global_step": 259398, "epoch": 3125} {"train_loss": -25.142595291137695, "global_step": 259399, "epoch": 3125} {"train_loss": -24.990402221679688, "global_step": 259400, "epoch": 3125} {"train_loss": -24.904794692993164, "global_step": 259401, "epoch": 3125} {"train_loss": -24.828031539916992, "global_step": 259402, "epoch": 3125} {"train_loss": -25.225116729736328, "global_step": 259403, "epoch": 3125} {"train_loss": -25.402042388916016, "global_step": 259404, "epoch": 3125} {"train_loss": -25.16071891784668, "global_step": 259405, "epoch": 3125} {"train_loss": -24.959980010986328, "global_step": 259406, "epoch": 3125} {"train_loss": -25.202199935913086, "global_step": 259407, "epoch": 3125} {"train_loss": -25.329946517944336, "global_step": 259408, "epoch": 3125} {"train_loss": -25.580873489379883, "global_step": 259409, "epoch": 3125} {"train_loss": -25.0103816986084, "global_step": 259410, "epoch": 3125} {"train_loss": -25.557811737060547, "global_step": 259411, "epoch": 3125} {"train_loss": -25.232528686523438, "global_step": 259412, "epoch": 3125} {"train_loss": -25.469106674194336, "global_step": 259413, "epoch": 3125} {"train_loss": -25.18242835998535, "global_step": 259414, "epoch": 3125} {"train_loss": -25.62660026550293, "global_step": 259415, "epoch": 3125} {"train_loss": -25.638532638549805, "global_step": 259416, "epoch": 3125} {"train_loss": -25.485246658325195, "global_step": 259417, "epoch": 3125} {"train_loss": -25.43150520324707, "global_step": 259418, "epoch": 3125} {"train_loss": -25.533920288085938, "global_step": 259419, "epoch": 3125} {"train_loss": -24.651676177978516, "global_step": 259420, "epoch": 3125} {"train_loss": -24.537145614624023, "global_step": 259421, "epoch": 3125} {"train_loss": -25.43561363220215, "global_step": 259422, "epoch": 3125} {"train_loss": -25.207639694213867, "global_step": 259423, "epoch": 3125} {"train_loss": -25.012954711914062, "global_step": 259424, "epoch": 3125} {"train_loss": -24.645397186279297, "global_step": 259425, "epoch": 3125} {"train_loss": -25.218896865844727, "global_step": 259426, "epoch": 3125} {"train_loss": -24.894920349121094, "global_step": 259427, "epoch": 3125} {"train_loss": -25.023508071899414, "global_step": 259428, "epoch": 3125} {"train_loss": -25.513402938842773, "global_step": 259429, "epoch": 3125} {"train_loss": -25.185705184936523, "global_step": 259430, "epoch": 3125} {"train_loss": -25.445463180541992, "global_step": 259431, "epoch": 3125} {"train_loss": -25.102455139160156, "global_step": 259432, "epoch": 3125} {"train_loss": -25.01325798034668, "global_step": 259433, "epoch": 3125} {"train_loss": -24.653512954711914, "global_step": 259434, "epoch": 3125} {"train_loss": -25.11092185974121, "global_step": 259435, "epoch": 3125} {"train_loss": -25.121652603149414, "global_step": 259436, "epoch": 3125} {"train_loss": -24.541067123413086, "global_step": 259437, "epoch": 3125} {"train_loss": -25.26727867126465, "global_step": 259438, "epoch": 3125} {"train_loss": -24.83925437927246, "global_step": 259439, "epoch": 3125} {"train_loss": -25.426437377929688, "global_step": 259440, "epoch": 3125} {"train_loss": -25.33330726623535, "global_step": 259441, "epoch": 3125} {"train_loss": -24.956809997558594, "global_step": 259442, "epoch": 3125} {"train_loss": -25.26190185546875, "global_step": 259443, "epoch": 3125} {"train_loss": -25.334325790405273, "global_step": 259444, "epoch": 3125} {"train_loss": -24.975019454956055, "global_step": 259445, "epoch": 3125} {"train_loss": -25.447599411010742, "global_step": 259446, "epoch": 3125} {"train_loss": -25.47048568725586, "global_step": 259447, "epoch": 3125} {"train_loss": -25.19479751586914, "global_step": 259448, "epoch": 3125} {"train_loss": -24.92685890197754, "global_step": 259449, "epoch": 3125} {"train_loss": -24.995065689086914, "global_step": 259450, "epoch": 3125} {"train_loss": -24.986623764038086, "global_step": 259451, "epoch": 3125} {"train_loss": -25.029491424560547, "global_step": 259452, "epoch": 3125} {"train_loss": -25.15253448486328, "global_step": 259453, "epoch": 3125} {"train_loss": -25.152585983276367, "global_step": 259454, "epoch": 3125} {"train_loss": -25.393335342407227, "global_step": 259455, "epoch": 3125} {"train_loss": -25.22612953186035, "global_step": 259456, "epoch": 3125} {"train_loss": -25.087871873235127, "global_step": 259457, "epoch": 3125, "val_loss": 6873026.0} {"train_loss": -25.170883178710938, "global_step": 259458, "epoch": 3126} {"train_loss": -25.158864974975586, "global_step": 259459, "epoch": 3126} {"train_loss": -25.061450958251953, "global_step": 259460, "epoch": 3126} {"train_loss": -25.224639892578125, "global_step": 259461, "epoch": 3126} {"train_loss": -24.70400047302246, "global_step": 259462, "epoch": 3126} {"train_loss": -24.779813766479492, "global_step": 259463, "epoch": 3126} {"train_loss": -25.0709285736084, "global_step": 259464, "epoch": 3126} {"train_loss": -25.03778648376465, "global_step": 259465, "epoch": 3126} {"train_loss": -25.252798080444336, "global_step": 259466, "epoch": 3126} {"train_loss": -25.113285064697266, "global_step": 259467, "epoch": 3126} {"train_loss": -24.972061157226562, "global_step": 259468, "epoch": 3126} {"train_loss": -25.478479385375977, "global_step": 259469, "epoch": 3126} {"train_loss": -24.959943771362305, "global_step": 259470, "epoch": 3126} {"train_loss": -25.39531898498535, "global_step": 259471, "epoch": 3126} {"train_loss": -25.146799087524414, "global_step": 259472, "epoch": 3126} {"train_loss": -25.010723114013672, "global_step": 259473, "epoch": 3126} {"train_loss": -25.012006759643555, "global_step": 259474, "epoch": 3126} {"train_loss": -25.13041114807129, "global_step": 259475, "epoch": 3126} {"train_loss": -25.0296573638916, "global_step": 259476, "epoch": 3126} {"train_loss": -25.20693588256836, "global_step": 259477, "epoch": 3126} {"train_loss": -24.82000160217285, "global_step": 259478, "epoch": 3126} {"train_loss": -24.85342788696289, "global_step": 259479, "epoch": 3126} {"train_loss": -25.28010368347168, "global_step": 259480, "epoch": 3126} {"train_loss": -24.862951278686523, "global_step": 259481, "epoch": 3126} {"train_loss": -25.087600708007812, "global_step": 259482, "epoch": 3126} {"train_loss": -25.362680435180664, "global_step": 259483, "epoch": 3126} {"train_loss": -25.11370086669922, "global_step": 259484, "epoch": 3126} {"train_loss": -25.318845748901367, "global_step": 259485, "epoch": 3126} {"train_loss": -24.89692497253418, "global_step": 259486, "epoch": 3126} {"train_loss": -25.05356216430664, "global_step": 259487, "epoch": 3126} {"train_loss": -24.949481964111328, "global_step": 259488, "epoch": 3126} {"train_loss": -25.223474502563477, "global_step": 259489, "epoch": 3126} {"train_loss": -25.243314743041992, "global_step": 259490, "epoch": 3126} {"train_loss": -25.271392822265625, "global_step": 259491, "epoch": 3126} {"train_loss": -25.387622833251953, "global_step": 259492, "epoch": 3126} {"train_loss": -25.07198715209961, "global_step": 259493, "epoch": 3126} {"train_loss": -25.6512393951416, "global_step": 259494, "epoch": 3126} {"train_loss": -25.27029800415039, "global_step": 259495, "epoch": 3126} {"train_loss": -25.416248321533203, "global_step": 259496, "epoch": 3126} {"train_loss": -25.36116600036621, "global_step": 259497, "epoch": 3126} {"train_loss": -25.627853393554688, "global_step": 259498, "epoch": 3126} {"train_loss": -25.502330780029297, "global_step": 259499, "epoch": 3126} {"train_loss": -25.177648544311523, "global_step": 259500, "epoch": 3126} {"train_loss": -25.185361862182617, "global_step": 259501, "epoch": 3126} {"train_loss": -25.0985164642334, "global_step": 259502, "epoch": 3126} {"train_loss": -25.156667709350586, "global_step": 259503, "epoch": 3126} {"train_loss": -25.43259048461914, "global_step": 259504, "epoch": 3126} {"train_loss": -25.456661224365234, "global_step": 259505, "epoch": 3126} {"train_loss": -25.50806999206543, "global_step": 259506, "epoch": 3126} {"train_loss": -25.15639305114746, "global_step": 259507, "epoch": 3126} {"train_loss": -25.33315086364746, "global_step": 259508, "epoch": 3126} {"train_loss": -25.60239028930664, "global_step": 259509, "epoch": 3126} {"train_loss": -25.058801651000977, "global_step": 259510, "epoch": 3126} {"train_loss": -25.136585235595703, "global_step": 259511, "epoch": 3126} {"train_loss": -25.11219596862793, "global_step": 259512, "epoch": 3126} {"train_loss": -25.441091537475586, "global_step": 259513, "epoch": 3126} {"train_loss": -25.353975296020508, "global_step": 259514, "epoch": 3126} {"train_loss": -25.232385635375977, "global_step": 259515, "epoch": 3126} {"train_loss": -25.184541702270508, "global_step": 259516, "epoch": 3126} {"train_loss": -25.605398178100586, "global_step": 259517, "epoch": 3126} {"train_loss": -25.231847763061523, "global_step": 259518, "epoch": 3126} {"train_loss": -25.373594284057617, "global_step": 259519, "epoch": 3126} {"train_loss": -25.548887252807617, "global_step": 259520, "epoch": 3126} {"train_loss": -25.1651668548584, "global_step": 259521, "epoch": 3126} {"train_loss": -25.520902633666992, "global_step": 259522, "epoch": 3126} {"train_loss": -25.13294792175293, "global_step": 259523, "epoch": 3126} {"train_loss": -24.884958267211914, "global_step": 259524, "epoch": 3126} {"train_loss": -24.54825782775879, "global_step": 259525, "epoch": 3126} {"train_loss": -23.976652145385742, "global_step": 259526, "epoch": 3126} {"train_loss": -23.630115509033203, "global_step": 259527, "epoch": 3126} {"train_loss": -24.059717178344727, "global_step": 259528, "epoch": 3126} {"train_loss": -23.414304733276367, "global_step": 259529, "epoch": 3126} {"train_loss": -24.506372451782227, "global_step": 259530, "epoch": 3126} {"train_loss": -24.728731155395508, "global_step": 259531, "epoch": 3126} {"train_loss": -24.426105499267578, "global_step": 259532, "epoch": 3126} {"train_loss": -24.6147518157959, "global_step": 259533, "epoch": 3126} {"train_loss": -24.85353660583496, "global_step": 259534, "epoch": 3126} {"train_loss": -24.254261016845703, "global_step": 259535, "epoch": 3126} {"train_loss": -24.714155197143555, "global_step": 259536, "epoch": 3126} {"train_loss": -24.760589599609375, "global_step": 259537, "epoch": 3126} {"train_loss": -24.859500885009766, "global_step": 259538, "epoch": 3126} {"train_loss": -24.871593475341797, "global_step": 259539, "epoch": 3126} {"train_loss": -25.074234767132495, "global_step": 259540, "epoch": 3126, "val_loss": 6949112.0} {"train_loss": -24.495771408081055, "global_step": 259541, "epoch": 3127} {"train_loss": -24.185035705566406, "global_step": 259542, "epoch": 3127} {"train_loss": -24.3404598236084, "global_step": 259543, "epoch": 3127} {"train_loss": -24.92921257019043, "global_step": 259544, "epoch": 3127} {"train_loss": -24.9229679107666, "global_step": 259545, "epoch": 3127} {"train_loss": -24.624866485595703, "global_step": 259546, "epoch": 3127} {"train_loss": -24.905534744262695, "global_step": 259547, "epoch": 3127} {"train_loss": -24.931840896606445, "global_step": 259548, "epoch": 3127} {"train_loss": -24.94717788696289, "global_step": 259549, "epoch": 3127} {"train_loss": -24.73075294494629, "global_step": 259550, "epoch": 3127} {"train_loss": -24.360212326049805, "global_step": 259551, "epoch": 3127} {"train_loss": -24.891359329223633, "global_step": 259552, "epoch": 3127} {"train_loss": -25.000457763671875, "global_step": 259553, "epoch": 3127} {"train_loss": -24.58169937133789, "global_step": 259554, "epoch": 3127} {"train_loss": -24.848461151123047, "global_step": 259555, "epoch": 3127} {"train_loss": -24.90059471130371, "global_step": 259556, "epoch": 3127} {"train_loss": -25.068023681640625, "global_step": 259557, "epoch": 3127} {"train_loss": -24.844449996948242, "global_step": 259558, "epoch": 3127} {"train_loss": -24.84983253479004, "global_step": 259559, "epoch": 3127} {"train_loss": -24.821502685546875, "global_step": 259560, "epoch": 3127} {"train_loss": -25.07808494567871, "global_step": 259561, "epoch": 3127} {"train_loss": -24.95307731628418, "global_step": 259562, "epoch": 3127} {"train_loss": -25.123615264892578, "global_step": 259563, "epoch": 3127} {"train_loss": -25.00066566467285, "global_step": 259564, "epoch": 3127} {"train_loss": -25.23426628112793, "global_step": 259565, "epoch": 3127} {"train_loss": -25.156513214111328, "global_step": 259566, "epoch": 3127} {"train_loss": -24.811857223510742, "global_step": 259567, "epoch": 3127} {"train_loss": -24.984394073486328, "global_step": 259568, "epoch": 3127} {"train_loss": -25.468175888061523, "global_step": 259569, "epoch": 3127} {"train_loss": -25.02530860900879, "global_step": 259570, "epoch": 3127} {"train_loss": -25.566431045532227, "global_step": 259571, "epoch": 3127} {"train_loss": -25.044601440429688, "global_step": 259572, "epoch": 3127} {"train_loss": -25.157752990722656, "global_step": 259573, "epoch": 3127} {"train_loss": -25.33745765686035, "global_step": 259574, "epoch": 3127} {"train_loss": -25.639699935913086, "global_step": 259575, "epoch": 3127} {"train_loss": -25.219741821289062, "global_step": 259576, "epoch": 3127} {"train_loss": -24.92691421508789, "global_step": 259577, "epoch": 3127} {"train_loss": -24.854835510253906, "global_step": 259578, "epoch": 3127} {"train_loss": -24.87271499633789, "global_step": 259579, "epoch": 3127} {"train_loss": -25.193845748901367, "global_step": 259580, "epoch": 3127} {"train_loss": -24.6983585357666, "global_step": 259581, "epoch": 3127} {"train_loss": -24.17331314086914, "global_step": 259582, "epoch": 3127} {"train_loss": -24.246234893798828, "global_step": 259583, "epoch": 3127} {"train_loss": -24.67037010192871, "global_step": 259584, "epoch": 3127} {"train_loss": -24.57642936706543, "global_step": 259585, "epoch": 3127} {"train_loss": -25.177000045776367, "global_step": 259586, "epoch": 3127} {"train_loss": -24.737607955932617, "global_step": 259587, "epoch": 3127} {"train_loss": -25.205907821655273, "global_step": 259588, "epoch": 3127} {"train_loss": -24.552690505981445, "global_step": 259589, "epoch": 3127} {"train_loss": -25.09571647644043, "global_step": 259590, "epoch": 3127} {"train_loss": -24.934677124023438, "global_step": 259591, "epoch": 3127} {"train_loss": -24.825937271118164, "global_step": 259592, "epoch": 3127} {"train_loss": -25.022520065307617, "global_step": 259593, "epoch": 3127} {"train_loss": -25.081571578979492, "global_step": 259594, "epoch": 3127} {"train_loss": -24.747406005859375, "global_step": 259595, "epoch": 3127} {"train_loss": -25.444929122924805, "global_step": 259596, "epoch": 3127} {"train_loss": -24.890077590942383, "global_step": 259597, "epoch": 3127} {"train_loss": -24.912824630737305, "global_step": 259598, "epoch": 3127} {"train_loss": -25.078861236572266, "global_step": 259599, "epoch": 3127} {"train_loss": -24.969575881958008, "global_step": 259600, "epoch": 3127} {"train_loss": -25.073755264282227, "global_step": 259601, "epoch": 3127} {"train_loss": -25.222095489501953, "global_step": 259602, "epoch": 3127} {"train_loss": -25.06688117980957, "global_step": 259603, "epoch": 3127} {"train_loss": -25.26988983154297, "global_step": 259604, "epoch": 3127} {"train_loss": -25.19034194946289, "global_step": 259605, "epoch": 3127} {"train_loss": -25.184337615966797, "global_step": 259606, "epoch": 3127} {"train_loss": -25.196130752563477, "global_step": 259607, "epoch": 3127} {"train_loss": -25.264602661132812, "global_step": 259608, "epoch": 3127} {"train_loss": -25.050783157348633, "global_step": 259609, "epoch": 3127} {"train_loss": -25.05632781982422, "global_step": 259610, "epoch": 3127} {"train_loss": -25.218368530273438, "global_step": 259611, "epoch": 3127} {"train_loss": -25.259628295898438, "global_step": 259612, "epoch": 3127} {"train_loss": -25.134775161743164, "global_step": 259613, "epoch": 3127} {"train_loss": -24.6932373046875, "global_step": 259614, "epoch": 3127} {"train_loss": -25.525108337402344, "global_step": 259615, "epoch": 3127} {"train_loss": -25.040952682495117, "global_step": 259616, "epoch": 3127} {"train_loss": -24.91556167602539, "global_step": 259617, "epoch": 3127} {"train_loss": -25.289031982421875, "global_step": 259618, "epoch": 3127} {"train_loss": -25.08762550354004, "global_step": 259619, "epoch": 3127} {"train_loss": -25.247894287109375, "global_step": 259620, "epoch": 3127} {"train_loss": -25.260591506958008, "global_step": 259621, "epoch": 3127} {"train_loss": -25.432178497314453, "global_step": 259622, "epoch": 3127} {"train_loss": -24.985057417168676, "global_step": 259623, "epoch": 3127, "val_loss": 6973666.5} {"train_loss": -25.11079978942871, "global_step": 259624, "epoch": 3128} {"train_loss": -24.546703338623047, "global_step": 259625, "epoch": 3128} {"train_loss": -24.72063636779785, "global_step": 259626, "epoch": 3128} {"train_loss": -24.977750778198242, "global_step": 259627, "epoch": 3128} {"train_loss": -24.94438934326172, "global_step": 259628, "epoch": 3128} {"train_loss": -24.358491897583008, "global_step": 259629, "epoch": 3128} {"train_loss": -24.7780818939209, "global_step": 259630, "epoch": 3128} {"train_loss": -24.846723556518555, "global_step": 259631, "epoch": 3128} {"train_loss": -24.405942916870117, "global_step": 259632, "epoch": 3128} {"train_loss": -24.71750259399414, "global_step": 259633, "epoch": 3128} {"train_loss": -24.4631404876709, "global_step": 259634, "epoch": 3128} {"train_loss": -25.193744659423828, "global_step": 259635, "epoch": 3128} {"train_loss": -24.988872528076172, "global_step": 259636, "epoch": 3128} {"train_loss": -25.378313064575195, "global_step": 259637, "epoch": 3128} {"train_loss": -24.866804122924805, "global_step": 259638, "epoch": 3128} {"train_loss": -25.004152297973633, "global_step": 259639, "epoch": 3128} {"train_loss": -24.942014694213867, "global_step": 259640, "epoch": 3128} {"train_loss": -25.139963150024414, "global_step": 259641, "epoch": 3128} {"train_loss": -25.220090866088867, "global_step": 259642, "epoch": 3128} {"train_loss": -25.124469757080078, "global_step": 259643, "epoch": 3128} {"train_loss": -25.118188858032227, "global_step": 259644, "epoch": 3128} {"train_loss": -25.36500358581543, "global_step": 259645, "epoch": 3128} {"train_loss": -24.772321701049805, "global_step": 259646, "epoch": 3128} {"train_loss": -25.039186477661133, "global_step": 259647, "epoch": 3128} {"train_loss": -25.201091766357422, "global_step": 259648, "epoch": 3128} {"train_loss": -25.281044006347656, "global_step": 259649, "epoch": 3128} {"train_loss": -25.428375244140625, "global_step": 259650, "epoch": 3128} {"train_loss": -25.265979766845703, "global_step": 259651, "epoch": 3128} {"train_loss": -25.10614013671875, "global_step": 259652, "epoch": 3128} {"train_loss": -25.28119468688965, "global_step": 259653, "epoch": 3128} {"train_loss": -25.213361740112305, "global_step": 259654, "epoch": 3128} {"train_loss": -25.35809898376465, "global_step": 259655, "epoch": 3128} {"train_loss": -24.885435104370117, "global_step": 259656, "epoch": 3128} {"train_loss": -25.41370964050293, "global_step": 259657, "epoch": 3128} {"train_loss": -25.694604873657227, "global_step": 259658, "epoch": 3128} {"train_loss": -25.550405502319336, "global_step": 259659, "epoch": 3128} {"train_loss": -25.497196197509766, "global_step": 259660, "epoch": 3128} {"train_loss": -25.244802474975586, "global_step": 259661, "epoch": 3128} {"train_loss": -24.982370376586914, "global_step": 259662, "epoch": 3128} {"train_loss": -25.10076904296875, "global_step": 259663, "epoch": 3128} {"train_loss": -24.964468002319336, "global_step": 259664, "epoch": 3128} {"train_loss": -25.01190757751465, "global_step": 259665, "epoch": 3128} {"train_loss": -25.077529907226562, "global_step": 259666, "epoch": 3128} {"train_loss": -25.410200119018555, "global_step": 259667, "epoch": 3128} {"train_loss": -25.449005126953125, "global_step": 259668, "epoch": 3128} {"train_loss": -24.80043601989746, "global_step": 259669, "epoch": 3128} {"train_loss": -25.01930046081543, "global_step": 259670, "epoch": 3128} {"train_loss": -25.08504295349121, "global_step": 259671, "epoch": 3128} {"train_loss": -25.045591354370117, "global_step": 259672, "epoch": 3128} {"train_loss": -25.23836898803711, "global_step": 259673, "epoch": 3128} {"train_loss": -25.215787887573242, "global_step": 259674, "epoch": 3128} {"train_loss": -25.05769157409668, "global_step": 259675, "epoch": 3128} {"train_loss": -25.173086166381836, "global_step": 259676, "epoch": 3128} {"train_loss": -25.209226608276367, "global_step": 259677, "epoch": 3128} {"train_loss": -25.01717185974121, "global_step": 259678, "epoch": 3128} {"train_loss": -25.203018188476562, "global_step": 259679, "epoch": 3128} {"train_loss": -24.987424850463867, "global_step": 259680, "epoch": 3128} {"train_loss": -24.894927978515625, "global_step": 259681, "epoch": 3128} {"train_loss": -25.31275177001953, "global_step": 259682, "epoch": 3128} {"train_loss": -25.103017807006836, "global_step": 259683, "epoch": 3128} {"train_loss": -25.170629501342773, "global_step": 259684, "epoch": 3128} {"train_loss": -25.055912017822266, "global_step": 259685, "epoch": 3128} {"train_loss": -24.987546920776367, "global_step": 259686, "epoch": 3128} {"train_loss": -25.17469596862793, "global_step": 259687, "epoch": 3128} {"train_loss": -24.811368942260742, "global_step": 259688, "epoch": 3128} {"train_loss": -25.111303329467773, "global_step": 259689, "epoch": 3128} {"train_loss": -25.37190818786621, "global_step": 259690, "epoch": 3128} {"train_loss": -25.117393493652344, "global_step": 259691, "epoch": 3128} {"train_loss": -25.296382904052734, "global_step": 259692, "epoch": 3128} {"train_loss": -25.199146270751953, "global_step": 259693, "epoch": 3128} {"train_loss": -25.167747497558594, "global_step": 259694, "epoch": 3128} {"train_loss": -25.543516159057617, "global_step": 259695, "epoch": 3128} {"train_loss": -25.20650863647461, "global_step": 259696, "epoch": 3128} {"train_loss": -25.040321350097656, "global_step": 259697, "epoch": 3128} {"train_loss": -24.86348533630371, "global_step": 259698, "epoch": 3128} {"train_loss": -24.934141159057617, "global_step": 259699, "epoch": 3128} {"train_loss": -24.98811912536621, "global_step": 259700, "epoch": 3128} {"train_loss": -25.255168914794922, "global_step": 259701, "epoch": 3128} {"train_loss": -25.328519821166992, "global_step": 259702, "epoch": 3128} {"train_loss": -25.137004852294922, "global_step": 259703, "epoch": 3128} {"train_loss": -25.400299072265625, "global_step": 259704, "epoch": 3128} {"train_loss": -25.15718650817871, "global_step": 259705, "epoch": 3128} {"train_loss": -25.107869274644965, "global_step": 259706, "epoch": 3128, "val_loss": 6840460.0} {"train_loss": -24.808837890625, "global_step": 259707, "epoch": 3129} {"train_loss": -24.576480865478516, "global_step": 259708, "epoch": 3129} {"train_loss": -25.01759910583496, "global_step": 259709, "epoch": 3129} {"train_loss": -23.67226219177246, "global_step": 259710, "epoch": 3129} {"train_loss": -23.927011489868164, "global_step": 259711, "epoch": 3129} {"train_loss": -24.353750228881836, "global_step": 259712, "epoch": 3129} {"train_loss": -25.091766357421875, "global_step": 259713, "epoch": 3129} {"train_loss": -24.5299129486084, "global_step": 259714, "epoch": 3129} {"train_loss": -25.090574264526367, "global_step": 259715, "epoch": 3129} {"train_loss": -24.687965393066406, "global_step": 259716, "epoch": 3129} {"train_loss": -25.150171279907227, "global_step": 259717, "epoch": 3129} {"train_loss": -24.959163665771484, "global_step": 259718, "epoch": 3129} {"train_loss": -24.970382690429688, "global_step": 259719, "epoch": 3129} {"train_loss": -24.912214279174805, "global_step": 259720, "epoch": 3129} {"train_loss": -25.20122718811035, "global_step": 259721, "epoch": 3129} {"train_loss": -25.006210327148438, "global_step": 259722, "epoch": 3129} {"train_loss": -24.323375701904297, "global_step": 259723, "epoch": 3129} {"train_loss": -25.11737632751465, "global_step": 259724, "epoch": 3129} {"train_loss": -25.100269317626953, "global_step": 259725, "epoch": 3129} {"train_loss": -24.70411491394043, "global_step": 259726, "epoch": 3129} {"train_loss": -25.047439575195312, "global_step": 259727, "epoch": 3129} {"train_loss": -25.116342544555664, "global_step": 259728, "epoch": 3129} {"train_loss": -25.087255477905273, "global_step": 259729, "epoch": 3129} {"train_loss": -25.03383445739746, "global_step": 259730, "epoch": 3129} {"train_loss": -24.820459365844727, "global_step": 259731, "epoch": 3129} {"train_loss": -24.939870834350586, "global_step": 259732, "epoch": 3129} {"train_loss": -25.331098556518555, "global_step": 259733, "epoch": 3129} {"train_loss": -25.020429611206055, "global_step": 259734, "epoch": 3129} {"train_loss": -25.2902774810791, "global_step": 259735, "epoch": 3129} {"train_loss": -24.890871047973633, "global_step": 259736, "epoch": 3129} {"train_loss": -25.110559463500977, "global_step": 259737, "epoch": 3129} {"train_loss": -24.827726364135742, "global_step": 259738, "epoch": 3129} {"train_loss": -24.85883140563965, "global_step": 259739, "epoch": 3129} {"train_loss": -24.87202262878418, "global_step": 259740, "epoch": 3129} {"train_loss": -25.218765258789062, "global_step": 259741, "epoch": 3129} {"train_loss": -25.2274227142334, "global_step": 259742, "epoch": 3129} {"train_loss": -25.20985221862793, "global_step": 259743, "epoch": 3129} {"train_loss": -25.259044647216797, "global_step": 259744, "epoch": 3129} {"train_loss": -24.901195526123047, "global_step": 259745, "epoch": 3129} {"train_loss": -24.97479248046875, "global_step": 259746, "epoch": 3129} {"train_loss": -25.3924503326416, "global_step": 259747, "epoch": 3129} {"train_loss": -25.130138397216797, "global_step": 259748, "epoch": 3129} {"train_loss": -24.9770565032959, "global_step": 259749, "epoch": 3129} {"train_loss": -25.064260482788086, "global_step": 259750, "epoch": 3129} {"train_loss": -25.226102828979492, "global_step": 259751, "epoch": 3129} {"train_loss": -25.330707550048828, "global_step": 259752, "epoch": 3129} {"train_loss": -24.951583862304688, "global_step": 259753, "epoch": 3129} {"train_loss": -25.07340431213379, "global_step": 259754, "epoch": 3129} {"train_loss": -24.966354370117188, "global_step": 259755, "epoch": 3129} {"train_loss": -25.360227584838867, "global_step": 259756, "epoch": 3129} {"train_loss": -25.175975799560547, "global_step": 259757, "epoch": 3129} {"train_loss": -25.1393985748291, "global_step": 259758, "epoch": 3129} {"train_loss": -25.04890251159668, "global_step": 259759, "epoch": 3129} {"train_loss": -25.226957321166992, "global_step": 259760, "epoch": 3129} {"train_loss": -25.250802993774414, "global_step": 259761, "epoch": 3129} {"train_loss": -25.1716251373291, "global_step": 259762, "epoch": 3129} {"train_loss": -25.275571823120117, "global_step": 259763, "epoch": 3129} {"train_loss": -25.665674209594727, "global_step": 259764, "epoch": 3129} {"train_loss": -25.289243698120117, "global_step": 259765, "epoch": 3129} {"train_loss": -25.240985870361328, "global_step": 259766, "epoch": 3129} {"train_loss": -25.38579750061035, "global_step": 259767, "epoch": 3129} {"train_loss": -25.179601669311523, "global_step": 259768, "epoch": 3129} {"train_loss": -24.96046257019043, "global_step": 259769, "epoch": 3129} {"train_loss": -25.361221313476562, "global_step": 259770, "epoch": 3129} {"train_loss": -25.202007293701172, "global_step": 259771, "epoch": 3129} {"train_loss": -25.539993286132812, "global_step": 259772, "epoch": 3129} {"train_loss": -25.283523559570312, "global_step": 259773, "epoch": 3129} {"train_loss": -25.931013107299805, "global_step": 259774, "epoch": 3129} {"train_loss": -24.97524642944336, "global_step": 259775, "epoch": 3129} {"train_loss": -24.988523483276367, "global_step": 259776, "epoch": 3129} {"train_loss": -25.092519760131836, "global_step": 259777, "epoch": 3129} {"train_loss": -25.682117462158203, "global_step": 259778, "epoch": 3129} {"train_loss": -25.511531829833984, "global_step": 259779, "epoch": 3129} {"train_loss": -25.557497024536133, "global_step": 259780, "epoch": 3129} {"train_loss": -25.001911163330078, "global_step": 259781, "epoch": 3129} {"train_loss": -25.238271713256836, "global_step": 259782, "epoch": 3129} {"train_loss": -25.31514549255371, "global_step": 259783, "epoch": 3129} {"train_loss": -25.22765350341797, "global_step": 259784, "epoch": 3129} {"train_loss": -25.26527976989746, "global_step": 259785, "epoch": 3129} {"train_loss": -24.8785343170166, "global_step": 259786, "epoch": 3129} {"train_loss": -25.159727096557617, "global_step": 259787, "epoch": 3129} {"train_loss": -25.442901611328125, "global_step": 259788, "epoch": 3129} {"train_loss": -25.066727396953535, "global_step": 259789, "epoch": 3129, "val_loss": 6882766.0} {"train_loss": -24.95612907409668, "global_step": 259790, "epoch": 3130} {"train_loss": -24.423091888427734, "global_step": 259791, "epoch": 3130} {"train_loss": -23.660539627075195, "global_step": 259792, "epoch": 3130} {"train_loss": -23.901445388793945, "global_step": 259793, "epoch": 3130} {"train_loss": -24.358186721801758, "global_step": 259794, "epoch": 3130} {"train_loss": -24.658374786376953, "global_step": 259795, "epoch": 3130} {"train_loss": -24.442541122436523, "global_step": 259796, "epoch": 3130} {"train_loss": -24.725372314453125, "global_step": 259797, "epoch": 3130} {"train_loss": -24.436559677124023, "global_step": 259798, "epoch": 3130} {"train_loss": -24.6614933013916, "global_step": 259799, "epoch": 3130} {"train_loss": -24.908498764038086, "global_step": 259800, "epoch": 3130} {"train_loss": -24.405344009399414, "global_step": 259801, "epoch": 3130} {"train_loss": -24.901254653930664, "global_step": 259802, "epoch": 3130} {"train_loss": -24.3951358795166, "global_step": 259803, "epoch": 3130} {"train_loss": -25.092060089111328, "global_step": 259804, "epoch": 3130} {"train_loss": -25.125934600830078, "global_step": 259805, "epoch": 3130} {"train_loss": -24.517118453979492, "global_step": 259806, "epoch": 3130} {"train_loss": -24.726823806762695, "global_step": 259807, "epoch": 3130} {"train_loss": -25.17817497253418, "global_step": 259808, "epoch": 3130} {"train_loss": -24.794076919555664, "global_step": 259809, "epoch": 3130} {"train_loss": -24.934467315673828, "global_step": 259810, "epoch": 3130} {"train_loss": -24.700674057006836, "global_step": 259811, "epoch": 3130} {"train_loss": -24.715072631835938, "global_step": 259812, "epoch": 3130} {"train_loss": -24.79292869567871, "global_step": 259813, "epoch": 3130} {"train_loss": -25.147266387939453, "global_step": 259814, "epoch": 3130} {"train_loss": -24.78061866760254, "global_step": 259815, "epoch": 3130} {"train_loss": -24.96310806274414, "global_step": 259816, "epoch": 3130} {"train_loss": -24.968698501586914, "global_step": 259817, "epoch": 3130} {"train_loss": -24.972455978393555, "global_step": 259818, "epoch": 3130} {"train_loss": -25.205793380737305, "global_step": 259819, "epoch": 3130} {"train_loss": -25.35964012145996, "global_step": 259820, "epoch": 3130} {"train_loss": -24.81985855102539, "global_step": 259821, "epoch": 3130} {"train_loss": -25.276092529296875, "global_step": 259822, "epoch": 3130} {"train_loss": -25.7432804107666, "global_step": 259823, "epoch": 3130} {"train_loss": -25.249652862548828, "global_step": 259824, "epoch": 3130} {"train_loss": -25.363052368164062, "global_step": 259825, "epoch": 3130} {"train_loss": -25.126840591430664, "global_step": 259826, "epoch": 3130} {"train_loss": -24.853200912475586, "global_step": 259827, "epoch": 3130} {"train_loss": -24.811063766479492, "global_step": 259828, "epoch": 3130} {"train_loss": -25.03949546813965, "global_step": 259829, "epoch": 3130} {"train_loss": -25.08313751220703, "global_step": 259830, "epoch": 3130} {"train_loss": -25.0880069732666, "global_step": 259831, "epoch": 3130} {"train_loss": -24.97701072692871, "global_step": 259832, "epoch": 3130} {"train_loss": -25.626773834228516, "global_step": 259833, "epoch": 3130} {"train_loss": -25.55922508239746, "global_step": 259834, "epoch": 3130} {"train_loss": -24.866029739379883, "global_step": 259835, "epoch": 3130} {"train_loss": -25.11318016052246, "global_step": 259836, "epoch": 3130} {"train_loss": -24.93906021118164, "global_step": 259837, "epoch": 3130} {"train_loss": -25.411752700805664, "global_step": 259838, "epoch": 3130} {"train_loss": -25.0423641204834, "global_step": 259839, "epoch": 3130} {"train_loss": -25.40351676940918, "global_step": 259840, "epoch": 3130} {"train_loss": -25.07012367248535, "global_step": 259841, "epoch": 3130} {"train_loss": -25.31199836730957, "global_step": 259842, "epoch": 3130} {"train_loss": -25.308380126953125, "global_step": 259843, "epoch": 3130} {"train_loss": -25.02742576599121, "global_step": 259844, "epoch": 3130} {"train_loss": -25.455764770507812, "global_step": 259845, "epoch": 3130} {"train_loss": -25.058685302734375, "global_step": 259846, "epoch": 3130} {"train_loss": -25.585973739624023, "global_step": 259847, "epoch": 3130} {"train_loss": -25.514799118041992, "global_step": 259848, "epoch": 3130} {"train_loss": -25.143064498901367, "global_step": 259849, "epoch": 3130} {"train_loss": -25.228178024291992, "global_step": 259850, "epoch": 3130} {"train_loss": -25.565143585205078, "global_step": 259851, "epoch": 3130} {"train_loss": -25.501432418823242, "global_step": 259852, "epoch": 3130} {"train_loss": -25.051969528198242, "global_step": 259853, "epoch": 3130} {"train_loss": -25.267301559448242, "global_step": 259854, "epoch": 3130} {"train_loss": -25.005783081054688, "global_step": 259855, "epoch": 3130} {"train_loss": -25.061731338500977, "global_step": 259856, "epoch": 3130} {"train_loss": -25.155471801757812, "global_step": 259857, "epoch": 3130} {"train_loss": -25.153331756591797, "global_step": 259858, "epoch": 3130} {"train_loss": -25.55213165283203, "global_step": 259859, "epoch": 3130} {"train_loss": -25.39809226989746, "global_step": 259860, "epoch": 3130} {"train_loss": -24.925498962402344, "global_step": 259861, "epoch": 3130} {"train_loss": -25.110647201538086, "global_step": 259862, "epoch": 3130} {"train_loss": -25.144296646118164, "global_step": 259863, "epoch": 3130} {"train_loss": -24.886133193969727, "global_step": 259864, "epoch": 3130} {"train_loss": -25.329248428344727, "global_step": 259865, "epoch": 3130} {"train_loss": -24.77402114868164, "global_step": 259866, "epoch": 3130} {"train_loss": -25.41213035583496, "global_step": 259867, "epoch": 3130} {"train_loss": -25.012344360351562, "global_step": 259868, "epoch": 3130} {"train_loss": -25.20721435546875, "global_step": 259869, "epoch": 3130} {"train_loss": -24.78282928466797, "global_step": 259870, "epoch": 3130} {"train_loss": -25.06637954711914, "global_step": 259871, "epoch": 3130} {"train_loss": -25.030063100607997, "global_step": 259872, "epoch": 3130, "val_loss": 6893890.0} {"train_loss": -22.990262985229492, "global_step": 259873, "epoch": 3131} {"train_loss": -24.128143310546875, "global_step": 259874, "epoch": 3131} {"train_loss": -24.196701049804688, "global_step": 259875, "epoch": 3131} {"train_loss": -23.934961318969727, "global_step": 259876, "epoch": 3131} {"train_loss": -24.250314712524414, "global_step": 259877, "epoch": 3131} {"train_loss": -23.78364372253418, "global_step": 259878, "epoch": 3131} {"train_loss": -24.46463394165039, "global_step": 259879, "epoch": 3131} {"train_loss": -24.185291290283203, "global_step": 259880, "epoch": 3131} {"train_loss": -24.595075607299805, "global_step": 259881, "epoch": 3131} {"train_loss": -24.214920043945312, "global_step": 259882, "epoch": 3131} {"train_loss": -24.494569778442383, "global_step": 259883, "epoch": 3131} {"train_loss": -24.2288875579834, "global_step": 259884, "epoch": 3131} {"train_loss": -24.477357864379883, "global_step": 259885, "epoch": 3131} {"train_loss": -24.521379470825195, "global_step": 259886, "epoch": 3131} {"train_loss": -24.87004280090332, "global_step": 259887, "epoch": 3131} {"train_loss": -24.68848419189453, "global_step": 259888, "epoch": 3131} {"train_loss": -24.82884407043457, "global_step": 259889, "epoch": 3131} {"train_loss": -24.610692977905273, "global_step": 259890, "epoch": 3131} {"train_loss": -24.484283447265625, "global_step": 259891, "epoch": 3131} {"train_loss": -24.606870651245117, "global_step": 259892, "epoch": 3131} {"train_loss": -24.62509536743164, "global_step": 259893, "epoch": 3131} {"train_loss": -24.976896286010742, "global_step": 259894, "epoch": 3131} {"train_loss": -24.971193313598633, "global_step": 259895, "epoch": 3131} {"train_loss": -24.96306800842285, "global_step": 259896, "epoch": 3131} {"train_loss": -24.737932205200195, "global_step": 259897, "epoch": 3131} {"train_loss": -25.083139419555664, "global_step": 259898, "epoch": 3131} {"train_loss": -24.96817398071289, "global_step": 259899, "epoch": 3131} {"train_loss": -25.4200496673584, "global_step": 259900, "epoch": 3131} {"train_loss": -24.990970611572266, "global_step": 259901, "epoch": 3131} {"train_loss": -24.885587692260742, "global_step": 259902, "epoch": 3131} {"train_loss": -24.844480514526367, "global_step": 259903, "epoch": 3131} {"train_loss": -24.849119186401367, "global_step": 259904, "epoch": 3131} {"train_loss": -25.05508804321289, "global_step": 259905, "epoch": 3131} {"train_loss": -25.033294677734375, "global_step": 259906, "epoch": 3131} {"train_loss": -25.233657836914062, "global_step": 259907, "epoch": 3131} {"train_loss": -25.376489639282227, "global_step": 259908, "epoch": 3131} {"train_loss": -25.28258514404297, "global_step": 259909, "epoch": 3131} {"train_loss": -25.249677658081055, "global_step": 259910, "epoch": 3131} {"train_loss": -25.322473526000977, "global_step": 259911, "epoch": 3131} {"train_loss": -24.805633544921875, "global_step": 259912, "epoch": 3131} {"train_loss": -25.261327743530273, "global_step": 259913, "epoch": 3131} {"train_loss": -24.933439254760742, "global_step": 259914, "epoch": 3131} {"train_loss": -25.46138572692871, "global_step": 259915, "epoch": 3131} {"train_loss": -25.33064079284668, "global_step": 259916, "epoch": 3131} {"train_loss": -24.942413330078125, "global_step": 259917, "epoch": 3131} {"train_loss": -24.869857788085938, "global_step": 259918, "epoch": 3131} {"train_loss": -25.057016372680664, "global_step": 259919, "epoch": 3131} {"train_loss": -25.364124298095703, "global_step": 259920, "epoch": 3131} {"train_loss": -25.24481773376465, "global_step": 259921, "epoch": 3131} {"train_loss": -25.29713249206543, "global_step": 259922, "epoch": 3131} {"train_loss": -25.089269638061523, "global_step": 259923, "epoch": 3131} {"train_loss": -25.261640548706055, "global_step": 259924, "epoch": 3131} {"train_loss": -24.990917205810547, "global_step": 259925, "epoch": 3131} {"train_loss": -25.55744171142578, "global_step": 259926, "epoch": 3131} {"train_loss": -25.692419052124023, "global_step": 259927, "epoch": 3131} {"train_loss": -25.06119728088379, "global_step": 259928, "epoch": 3131} {"train_loss": -25.285449981689453, "global_step": 259929, "epoch": 3131} {"train_loss": -25.085718154907227, "global_step": 259930, "epoch": 3131} {"train_loss": -25.21189308166504, "global_step": 259931, "epoch": 3131} {"train_loss": -25.273029327392578, "global_step": 259932, "epoch": 3131} {"train_loss": -25.434186935424805, "global_step": 259933, "epoch": 3131} {"train_loss": -25.29525375366211, "global_step": 259934, "epoch": 3131} {"train_loss": -25.46650505065918, "global_step": 259935, "epoch": 3131} {"train_loss": -25.4569034576416, "global_step": 259936, "epoch": 3131} {"train_loss": -25.085477828979492, "global_step": 259937, "epoch": 3131} {"train_loss": -25.570913314819336, "global_step": 259938, "epoch": 3131} {"train_loss": -24.807870864868164, "global_step": 259939, "epoch": 3131} {"train_loss": -25.036657333374023, "global_step": 259940, "epoch": 3131} {"train_loss": -25.012271881103516, "global_step": 259941, "epoch": 3131} {"train_loss": -25.06041145324707, "global_step": 259942, "epoch": 3131} {"train_loss": -24.527271270751953, "global_step": 259943, "epoch": 3131} {"train_loss": -24.5439395904541, "global_step": 259944, "epoch": 3131} {"train_loss": -25.18580436706543, "global_step": 259945, "epoch": 3131} {"train_loss": -25.2900447845459, "global_step": 259946, "epoch": 3131} {"train_loss": -25.484878540039062, "global_step": 259947, "epoch": 3131} {"train_loss": -24.896013259887695, "global_step": 259948, "epoch": 3131} {"train_loss": -25.081663131713867, "global_step": 259949, "epoch": 3131} {"train_loss": -25.18024253845215, "global_step": 259950, "epoch": 3131} {"train_loss": -24.85929298400879, "global_step": 259951, "epoch": 3131} {"train_loss": -25.047771453857422, "global_step": 259952, "epoch": 3131} {"train_loss": -25.417118072509766, "global_step": 259953, "epoch": 3131} {"train_loss": -25.08632469177246, "global_step": 259954, "epoch": 3131} {"train_loss": -24.913697461047803, "global_step": 259955, "epoch": 3131, "val_loss": 6895849.0} {"train_loss": -24.32354164123535, "global_step": 259956, "epoch": 3132} {"train_loss": -23.562599182128906, "global_step": 259957, "epoch": 3132} {"train_loss": -24.26417350769043, "global_step": 259958, "epoch": 3132} {"train_loss": -24.94562339782715, "global_step": 259959, "epoch": 3132} {"train_loss": -24.4766845703125, "global_step": 259960, "epoch": 3132} {"train_loss": -24.468473434448242, "global_step": 259961, "epoch": 3132} {"train_loss": -24.70429801940918, "global_step": 259962, "epoch": 3132} {"train_loss": -24.8531551361084, "global_step": 259963, "epoch": 3132} {"train_loss": -24.462711334228516, "global_step": 259964, "epoch": 3132} {"train_loss": -24.846643447875977, "global_step": 259965, "epoch": 3132} {"train_loss": -24.8165283203125, "global_step": 259966, "epoch": 3132} {"train_loss": -25.0201473236084, "global_step": 259967, "epoch": 3132} {"train_loss": -24.747900009155273, "global_step": 259968, "epoch": 3132} {"train_loss": -24.71870994567871, "global_step": 259969, "epoch": 3132} {"train_loss": -24.892587661743164, "global_step": 259970, "epoch": 3132} {"train_loss": -24.8642635345459, "global_step": 259971, "epoch": 3132} {"train_loss": -24.698822021484375, "global_step": 259972, "epoch": 3132} {"train_loss": -24.9628963470459, "global_step": 259973, "epoch": 3132} {"train_loss": -24.993576049804688, "global_step": 259974, "epoch": 3132} {"train_loss": -24.85584831237793, "global_step": 259975, "epoch": 3132} {"train_loss": -25.028583526611328, "global_step": 259976, "epoch": 3132} {"train_loss": -24.961894989013672, "global_step": 259977, "epoch": 3132} {"train_loss": -25.181427001953125, "global_step": 259978, "epoch": 3132} {"train_loss": -25.501474380493164, "global_step": 259979, "epoch": 3132} {"train_loss": -25.00809669494629, "global_step": 259980, "epoch": 3132} {"train_loss": -25.066801071166992, "global_step": 259981, "epoch": 3132} {"train_loss": -25.318941116333008, "global_step": 259982, "epoch": 3132} {"train_loss": -25.5566349029541, "global_step": 259983, "epoch": 3132} {"train_loss": -25.11762046813965, "global_step": 259984, "epoch": 3132} {"train_loss": -25.059852600097656, "global_step": 259985, "epoch": 3132} {"train_loss": -25.093708038330078, "global_step": 259986, "epoch": 3132} {"train_loss": -25.357702255249023, "global_step": 259987, "epoch": 3132} {"train_loss": -25.227567672729492, "global_step": 259988, "epoch": 3132} {"train_loss": -25.187604904174805, "global_step": 259989, "epoch": 3132} {"train_loss": -25.200809478759766, "global_step": 259990, "epoch": 3132} {"train_loss": -25.111839294433594, "global_step": 259991, "epoch": 3132} {"train_loss": -25.346723556518555, "global_step": 259992, "epoch": 3132} {"train_loss": -25.061677932739258, "global_step": 259993, "epoch": 3132} {"train_loss": -25.039796829223633, "global_step": 259994, "epoch": 3132} {"train_loss": -24.952138900756836, "global_step": 259995, "epoch": 3132} {"train_loss": -25.237071990966797, "global_step": 259996, "epoch": 3132} {"train_loss": -25.175989151000977, "global_step": 259997, "epoch": 3132} {"train_loss": -25.357553482055664, "global_step": 259998, "epoch": 3132} {"train_loss": -25.296598434448242, "global_step": 259999, "epoch": 3132} {"train_loss": -25.446287155151367, "global_step": 260000, "epoch": 3132} {"train_loss": -25.157617568969727, "global_step": 260001, "epoch": 3132} {"train_loss": -25.531606674194336, "global_step": 260002, "epoch": 3132} {"train_loss": -25.091630935668945, "global_step": 260003, "epoch": 3132} {"train_loss": -25.121408462524414, "global_step": 260004, "epoch": 3132} {"train_loss": -25.465635299682617, "global_step": 260005, "epoch": 3132} {"train_loss": -25.174198150634766, "global_step": 260006, "epoch": 3132} {"train_loss": -25.193510055541992, "global_step": 260007, "epoch": 3132} {"train_loss": -25.383625030517578, "global_step": 260008, "epoch": 3132} {"train_loss": -25.336196899414062, "global_step": 260009, "epoch": 3132} {"train_loss": -25.115432739257812, "global_step": 260010, "epoch": 3132} {"train_loss": -25.6002254486084, "global_step": 260011, "epoch": 3132} {"train_loss": -24.73402214050293, "global_step": 260012, "epoch": 3132} {"train_loss": -24.83318328857422, "global_step": 260013, "epoch": 3132} {"train_loss": -24.256711959838867, "global_step": 260014, "epoch": 3132} {"train_loss": -24.275732040405273, "global_step": 260015, "epoch": 3132} {"train_loss": -24.54615592956543, "global_step": 260016, "epoch": 3132} {"train_loss": -24.97783088684082, "global_step": 260017, "epoch": 3132} {"train_loss": -24.954553604125977, "global_step": 260018, "epoch": 3132} {"train_loss": -25.070594787597656, "global_step": 260019, "epoch": 3132} {"train_loss": -25.299959182739258, "global_step": 260020, "epoch": 3132} {"train_loss": -24.908634185791016, "global_step": 260021, "epoch": 3132} {"train_loss": -25.325841903686523, "global_step": 260022, "epoch": 3132} {"train_loss": -24.94447898864746, "global_step": 260023, "epoch": 3132} {"train_loss": -25.464599609375, "global_step": 260024, "epoch": 3132} {"train_loss": -24.916650772094727, "global_step": 260025, "epoch": 3132} {"train_loss": -25.46418571472168, "global_step": 260026, "epoch": 3132} {"train_loss": -24.708301544189453, "global_step": 260027, "epoch": 3132} {"train_loss": -25.331317901611328, "global_step": 260028, "epoch": 3132} {"train_loss": -24.92177391052246, "global_step": 260029, "epoch": 3132} {"train_loss": -25.467514038085938, "global_step": 260030, "epoch": 3132} {"train_loss": -25.07075309753418, "global_step": 260031, "epoch": 3132} {"train_loss": -25.162124633789062, "global_step": 260032, "epoch": 3132} {"train_loss": -25.283405303955078, "global_step": 260033, "epoch": 3132} {"train_loss": -25.06060028076172, "global_step": 260034, "epoch": 3132} {"train_loss": -25.108976364135742, "global_step": 260035, "epoch": 3132} {"train_loss": -24.933317184448242, "global_step": 260036, "epoch": 3132} {"train_loss": -25.333425521850586, "global_step": 260037, "epoch": 3132} {"train_loss": -25.03312770429864, "global_step": 260038, "epoch": 3132, "val_loss": 7013476.0} {"train_loss": -24.91535758972168, "global_step": 260039, "epoch": 3133} {"train_loss": -24.860567092895508, "global_step": 260040, "epoch": 3133} {"train_loss": -25.160329818725586, "global_step": 260041, "epoch": 3133} {"train_loss": -24.94593620300293, "global_step": 260042, "epoch": 3133} {"train_loss": -24.800935745239258, "global_step": 260043, "epoch": 3133} {"train_loss": -24.98456382751465, "global_step": 260044, "epoch": 3133} {"train_loss": -24.94410514831543, "global_step": 260045, "epoch": 3133} {"train_loss": -24.87152671813965, "global_step": 260046, "epoch": 3133} {"train_loss": -24.948034286499023, "global_step": 260047, "epoch": 3133} {"train_loss": -25.18216896057129, "global_step": 260048, "epoch": 3133} {"train_loss": -25.047269821166992, "global_step": 260049, "epoch": 3133} {"train_loss": -25.457395553588867, "global_step": 260050, "epoch": 3133} {"train_loss": -25.1475887298584, "global_step": 260051, "epoch": 3133} {"train_loss": -24.8581600189209, "global_step": 260052, "epoch": 3133} {"train_loss": -25.113508224487305, "global_step": 260053, "epoch": 3133} {"train_loss": -25.1107120513916, "global_step": 260054, "epoch": 3133} {"train_loss": -24.734756469726562, "global_step": 260055, "epoch": 3133} {"train_loss": -25.114831924438477, "global_step": 260056, "epoch": 3133} {"train_loss": -25.09161376953125, "global_step": 260057, "epoch": 3133} {"train_loss": -25.221311569213867, "global_step": 260058, "epoch": 3133} {"train_loss": -25.206418991088867, "global_step": 260059, "epoch": 3133} {"train_loss": -25.31684112548828, "global_step": 260060, "epoch": 3133} {"train_loss": -25.424680709838867, "global_step": 260061, "epoch": 3133} {"train_loss": -25.16720962524414, "global_step": 260062, "epoch": 3133} {"train_loss": -25.212345123291016, "global_step": 260063, "epoch": 3133} {"train_loss": -25.055938720703125, "global_step": 260064, "epoch": 3133} {"train_loss": -25.329151153564453, "global_step": 260065, "epoch": 3133} {"train_loss": -25.049802780151367, "global_step": 260066, "epoch": 3133} {"train_loss": -25.645221710205078, "global_step": 260067, "epoch": 3133} {"train_loss": -25.07137107849121, "global_step": 260068, "epoch": 3133} {"train_loss": -25.20870018005371, "global_step": 260069, "epoch": 3133} {"train_loss": -25.052968978881836, "global_step": 260070, "epoch": 3133} {"train_loss": -25.124448776245117, "global_step": 260071, "epoch": 3133} {"train_loss": -25.08283042907715, "global_step": 260072, "epoch": 3133} {"train_loss": -25.277982711791992, "global_step": 260073, "epoch": 3133} {"train_loss": -25.322004318237305, "global_step": 260074, "epoch": 3133} {"train_loss": -25.283124923706055, "global_step": 260075, "epoch": 3133} {"train_loss": -24.99879264831543, "global_step": 260076, "epoch": 3133} {"train_loss": -25.490314483642578, "global_step": 260077, "epoch": 3133} {"train_loss": -25.248910903930664, "global_step": 260078, "epoch": 3133} {"train_loss": -25.643644332885742, "global_step": 260079, "epoch": 3133} {"train_loss": -25.27821922302246, "global_step": 260080, "epoch": 3133} {"train_loss": -25.27452278137207, "global_step": 260081, "epoch": 3133} {"train_loss": -25.244281768798828, "global_step": 260082, "epoch": 3133} {"train_loss": -25.578046798706055, "global_step": 260083, "epoch": 3133} {"train_loss": -25.31348419189453, "global_step": 260084, "epoch": 3133} {"train_loss": -25.533180236816406, "global_step": 260085, "epoch": 3133} {"train_loss": -25.39952850341797, "global_step": 260086, "epoch": 3133} {"train_loss": -25.483078002929688, "global_step": 260087, "epoch": 3133} {"train_loss": -25.091495513916016, "global_step": 260088, "epoch": 3133} {"train_loss": -25.063329696655273, "global_step": 260089, "epoch": 3133} {"train_loss": -25.373615264892578, "global_step": 260090, "epoch": 3133} {"train_loss": -25.75319480895996, "global_step": 260091, "epoch": 3133} {"train_loss": -25.34089469909668, "global_step": 260092, "epoch": 3133} {"train_loss": -25.363245010375977, "global_step": 260093, "epoch": 3133} {"train_loss": -25.30218505859375, "global_step": 260094, "epoch": 3133} {"train_loss": -25.2393741607666, "global_step": 260095, "epoch": 3133} {"train_loss": -25.114728927612305, "global_step": 260096, "epoch": 3133} {"train_loss": -25.139875411987305, "global_step": 260097, "epoch": 3133} {"train_loss": -25.344451904296875, "global_step": 260098, "epoch": 3133} {"train_loss": -25.20173454284668, "global_step": 260099, "epoch": 3133} {"train_loss": -24.683074951171875, "global_step": 260100, "epoch": 3133} {"train_loss": -24.433792114257812, "global_step": 260101, "epoch": 3133} {"train_loss": -24.172948837280273, "global_step": 260102, "epoch": 3133} {"train_loss": -24.5833683013916, "global_step": 260103, "epoch": 3133} {"train_loss": -25.02475357055664, "global_step": 260104, "epoch": 3133} {"train_loss": -24.996191024780273, "global_step": 260105, "epoch": 3133} {"train_loss": -24.848989486694336, "global_step": 260106, "epoch": 3133} {"train_loss": -24.70369529724121, "global_step": 260107, "epoch": 3133} {"train_loss": -24.792606353759766, "global_step": 260108, "epoch": 3133} {"train_loss": -24.961660385131836, "global_step": 260109, "epoch": 3133} {"train_loss": -24.36861228942871, "global_step": 260110, "epoch": 3133} {"train_loss": -24.943532943725586, "global_step": 260111, "epoch": 3133} {"train_loss": -25.096988677978516, "global_step": 260112, "epoch": 3133} {"train_loss": -25.093244552612305, "global_step": 260113, "epoch": 3133} {"train_loss": -25.232439041137695, "global_step": 260114, "epoch": 3133} {"train_loss": -25.03641128540039, "global_step": 260115, "epoch": 3133} {"train_loss": -25.150089263916016, "global_step": 260116, "epoch": 3133} {"train_loss": -25.081979751586914, "global_step": 260117, "epoch": 3133} {"train_loss": -25.06672477722168, "global_step": 260118, "epoch": 3133} {"train_loss": -24.82730484008789, "global_step": 260119, "epoch": 3133} {"train_loss": -24.873899459838867, "global_step": 260120, "epoch": 3133} {"train_loss": -25.118881018765002, "global_step": 260121, "epoch": 3133, "val_loss": 6939639.0} {"train_loss": -25.12742805480957, "global_step": 260122, "epoch": 3134} {"train_loss": -25.140037536621094, "global_step": 260123, "epoch": 3134} {"train_loss": -25.104145050048828, "global_step": 260124, "epoch": 3134} {"train_loss": -25.015403747558594, "global_step": 260125, "epoch": 3134} {"train_loss": -24.919233322143555, "global_step": 260126, "epoch": 3134} {"train_loss": -24.996896743774414, "global_step": 260127, "epoch": 3134} {"train_loss": -24.778301239013672, "global_step": 260128, "epoch": 3134} {"train_loss": -24.847137451171875, "global_step": 260129, "epoch": 3134} {"train_loss": -25.25849151611328, "global_step": 260130, "epoch": 3134} {"train_loss": -24.733802795410156, "global_step": 260131, "epoch": 3134} {"train_loss": -25.032175064086914, "global_step": 260132, "epoch": 3134} {"train_loss": -24.950956344604492, "global_step": 260133, "epoch": 3134} {"train_loss": -24.9536075592041, "global_step": 260134, "epoch": 3134} {"train_loss": -25.23896598815918, "global_step": 260135, "epoch": 3134} {"train_loss": -25.306276321411133, "global_step": 260136, "epoch": 3134} {"train_loss": -25.411060333251953, "global_step": 260137, "epoch": 3134} {"train_loss": -25.105310440063477, "global_step": 260138, "epoch": 3134} {"train_loss": -24.79199981689453, "global_step": 260139, "epoch": 3134} {"train_loss": -25.134408950805664, "global_step": 260140, "epoch": 3134} {"train_loss": -25.352079391479492, "global_step": 260141, "epoch": 3134} {"train_loss": -25.129613876342773, "global_step": 260142, "epoch": 3134} {"train_loss": -24.54242706298828, "global_step": 260143, "epoch": 3134} {"train_loss": -24.827796936035156, "global_step": 260144, "epoch": 3134} {"train_loss": -25.19830894470215, "global_step": 260145, "epoch": 3134} {"train_loss": -25.162240982055664, "global_step": 260146, "epoch": 3134} {"train_loss": -25.06500244140625, "global_step": 260147, "epoch": 3134} {"train_loss": -25.036338806152344, "global_step": 260148, "epoch": 3134} {"train_loss": -25.113805770874023, "global_step": 260149, "epoch": 3134} {"train_loss": -25.4764347076416, "global_step": 260150, "epoch": 3134} {"train_loss": -24.805715560913086, "global_step": 260151, "epoch": 3134} {"train_loss": -25.024890899658203, "global_step": 260152, "epoch": 3134} {"train_loss": -25.361499786376953, "global_step": 260153, "epoch": 3134} {"train_loss": -25.32270622253418, "global_step": 260154, "epoch": 3134} {"train_loss": -25.197208404541016, "global_step": 260155, "epoch": 3134} {"train_loss": -24.809988021850586, "global_step": 260156, "epoch": 3134} {"train_loss": -25.24382781982422, "global_step": 260157, "epoch": 3134} {"train_loss": -25.0367374420166, "global_step": 260158, "epoch": 3134} {"train_loss": -24.94093894958496, "global_step": 260159, "epoch": 3134} {"train_loss": -25.089902877807617, "global_step": 260160, "epoch": 3134} {"train_loss": -25.099332809448242, "global_step": 260161, "epoch": 3134} {"train_loss": -25.149993896484375, "global_step": 260162, "epoch": 3134} {"train_loss": -25.47739601135254, "global_step": 260163, "epoch": 3134} {"train_loss": -25.261493682861328, "global_step": 260164, "epoch": 3134} {"train_loss": -25.226388931274414, "global_step": 260165, "epoch": 3134} {"train_loss": -25.07200813293457, "global_step": 260166, "epoch": 3134} {"train_loss": -25.475839614868164, "global_step": 260167, "epoch": 3134} {"train_loss": -25.36602783203125, "global_step": 260168, "epoch": 3134} {"train_loss": -25.28339385986328, "global_step": 260169, "epoch": 3134} {"train_loss": -25.367467880249023, "global_step": 260170, "epoch": 3134} {"train_loss": -25.264225006103516, "global_step": 260171, "epoch": 3134} {"train_loss": -25.0931453704834, "global_step": 260172, "epoch": 3134} {"train_loss": -25.28325843811035, "global_step": 260173, "epoch": 3134} {"train_loss": -25.3569278717041, "global_step": 260174, "epoch": 3134} {"train_loss": -25.058460235595703, "global_step": 260175, "epoch": 3134} {"train_loss": -25.03193473815918, "global_step": 260176, "epoch": 3134} {"train_loss": -25.322784423828125, "global_step": 260177, "epoch": 3134} {"train_loss": -25.234394073486328, "global_step": 260178, "epoch": 3134} {"train_loss": -25.45371437072754, "global_step": 260179, "epoch": 3134} {"train_loss": -24.967554092407227, "global_step": 260180, "epoch": 3134} {"train_loss": -25.19191551208496, "global_step": 260181, "epoch": 3134} {"train_loss": -25.08998680114746, "global_step": 260182, "epoch": 3134} {"train_loss": -25.187536239624023, "global_step": 260183, "epoch": 3134} {"train_loss": -25.16470718383789, "global_step": 260184, "epoch": 3134} {"train_loss": -24.936491012573242, "global_step": 260185, "epoch": 3134} {"train_loss": -25.523029327392578, "global_step": 260186, "epoch": 3134} {"train_loss": -25.31313133239746, "global_step": 260187, "epoch": 3134} {"train_loss": -25.511016845703125, "global_step": 260188, "epoch": 3134} {"train_loss": -25.6792049407959, "global_step": 260189, "epoch": 3134} {"train_loss": -25.137914657592773, "global_step": 260190, "epoch": 3134} {"train_loss": -25.23342514038086, "global_step": 260191, "epoch": 3134} {"train_loss": -25.45552635192871, "global_step": 260192, "epoch": 3134} {"train_loss": -25.3184871673584, "global_step": 260193, "epoch": 3134} {"train_loss": -25.15937042236328, "global_step": 260194, "epoch": 3134} {"train_loss": -24.825469970703125, "global_step": 260195, "epoch": 3134} {"train_loss": -25.051374435424805, "global_step": 260196, "epoch": 3134} {"train_loss": -25.053239822387695, "global_step": 260197, "epoch": 3134} {"train_loss": -24.88933753967285, "global_step": 260198, "epoch": 3134} {"train_loss": -25.300451278686523, "global_step": 260199, "epoch": 3134} {"train_loss": -25.007904052734375, "global_step": 260200, "epoch": 3134} {"train_loss": -24.933759689331055, "global_step": 260201, "epoch": 3134} {"train_loss": -25.423147201538086, "global_step": 260202, "epoch": 3134} {"train_loss": -25.222503662109375, "global_step": 260203, "epoch": 3134} {"train_loss": -25.15155808322401, "global_step": 260204, "epoch": 3134, "val_loss": 6812358.0} {"train_loss": -24.51753044128418, "global_step": 260205, "epoch": 3135} {"train_loss": -24.7833194732666, "global_step": 260206, "epoch": 3135} {"train_loss": -24.526071548461914, "global_step": 260207, "epoch": 3135} {"train_loss": -24.376502990722656, "global_step": 260208, "epoch": 3135} {"train_loss": -25.06900405883789, "global_step": 260209, "epoch": 3135} {"train_loss": -24.537931442260742, "global_step": 260210, "epoch": 3135} {"train_loss": -24.227670669555664, "global_step": 260211, "epoch": 3135} {"train_loss": -25.074377059936523, "global_step": 260212, "epoch": 3135} {"train_loss": -24.634275436401367, "global_step": 260213, "epoch": 3135} {"train_loss": -24.956073760986328, "global_step": 260214, "epoch": 3135} {"train_loss": -24.620716094970703, "global_step": 260215, "epoch": 3135} {"train_loss": -25.023250579833984, "global_step": 260216, "epoch": 3135} {"train_loss": -25.182710647583008, "global_step": 260217, "epoch": 3135} {"train_loss": -25.19080352783203, "global_step": 260218, "epoch": 3135} {"train_loss": -24.95631217956543, "global_step": 260219, "epoch": 3135} {"train_loss": -24.533700942993164, "global_step": 260220, "epoch": 3135} {"train_loss": -25.247135162353516, "global_step": 260221, "epoch": 3135} {"train_loss": -24.9621639251709, "global_step": 260222, "epoch": 3135} {"train_loss": -24.712162017822266, "global_step": 260223, "epoch": 3135} {"train_loss": -25.15450096130371, "global_step": 260224, "epoch": 3135} {"train_loss": -24.501943588256836, "global_step": 260225, "epoch": 3135} {"train_loss": -25.127838134765625, "global_step": 260226, "epoch": 3135} {"train_loss": -24.887502670288086, "global_step": 260227, "epoch": 3135} {"train_loss": -24.95912742614746, "global_step": 260228, "epoch": 3135} {"train_loss": -24.770933151245117, "global_step": 260229, "epoch": 3135} {"train_loss": -25.001272201538086, "global_step": 260230, "epoch": 3135} {"train_loss": -24.830909729003906, "global_step": 260231, "epoch": 3135} {"train_loss": -25.05132293701172, "global_step": 260232, "epoch": 3135} {"train_loss": -25.39436149597168, "global_step": 260233, "epoch": 3135} {"train_loss": -24.986169815063477, "global_step": 260234, "epoch": 3135} {"train_loss": -25.055007934570312, "global_step": 260235, "epoch": 3135} {"train_loss": -24.829137802124023, "global_step": 260236, "epoch": 3135} {"train_loss": -25.10573387145996, "global_step": 260237, "epoch": 3135} {"train_loss": -25.316104888916016, "global_step": 260238, "epoch": 3135} {"train_loss": -25.449132919311523, "global_step": 260239, "epoch": 3135} {"train_loss": -25.20104217529297, "global_step": 260240, "epoch": 3135} {"train_loss": -24.95064926147461, "global_step": 260241, "epoch": 3135} {"train_loss": -25.32618522644043, "global_step": 260242, "epoch": 3135} {"train_loss": -24.850067138671875, "global_step": 260243, "epoch": 3135} {"train_loss": -25.12166976928711, "global_step": 260244, "epoch": 3135} {"train_loss": -25.133636474609375, "global_step": 260245, "epoch": 3135} {"train_loss": -24.83642578125, "global_step": 260246, "epoch": 3135} {"train_loss": -25.020065307617188, "global_step": 260247, "epoch": 3135} {"train_loss": -25.404949188232422, "global_step": 260248, "epoch": 3135} {"train_loss": -25.11777687072754, "global_step": 260249, "epoch": 3135} {"train_loss": -25.3538818359375, "global_step": 260250, "epoch": 3135} {"train_loss": -25.093420028686523, "global_step": 260251, "epoch": 3135} {"train_loss": -25.519622802734375, "global_step": 260252, "epoch": 3135} {"train_loss": -25.2408390045166, "global_step": 260253, "epoch": 3135} {"train_loss": -25.48557472229004, "global_step": 260254, "epoch": 3135} {"train_loss": -24.5986328125, "global_step": 260255, "epoch": 3135} {"train_loss": -25.078672409057617, "global_step": 260256, "epoch": 3135} {"train_loss": -25.08928108215332, "global_step": 260257, "epoch": 3135} {"train_loss": -25.27252960205078, "global_step": 260258, "epoch": 3135} {"train_loss": -24.796344757080078, "global_step": 260259, "epoch": 3135} {"train_loss": -25.033782958984375, "global_step": 260260, "epoch": 3135} {"train_loss": -25.151517868041992, "global_step": 260261, "epoch": 3135} {"train_loss": -25.640552520751953, "global_step": 260262, "epoch": 3135} {"train_loss": -25.406978607177734, "global_step": 260263, "epoch": 3135} {"train_loss": -24.80374526977539, "global_step": 260264, "epoch": 3135} {"train_loss": -24.900680541992188, "global_step": 260265, "epoch": 3135} {"train_loss": -25.1865291595459, "global_step": 260266, "epoch": 3135} {"train_loss": -24.72585678100586, "global_step": 260267, "epoch": 3135} {"train_loss": -24.868595123291016, "global_step": 260268, "epoch": 3135} {"train_loss": -25.012346267700195, "global_step": 260269, "epoch": 3135} {"train_loss": -25.25661277770996, "global_step": 260270, "epoch": 3135} {"train_loss": -25.234914779663086, "global_step": 260271, "epoch": 3135} {"train_loss": -25.058935165405273, "global_step": 260272, "epoch": 3135} {"train_loss": -25.404733657836914, "global_step": 260273, "epoch": 3135} {"train_loss": -25.15887451171875, "global_step": 260274, "epoch": 3135} {"train_loss": -25.32863426208496, "global_step": 260275, "epoch": 3135} {"train_loss": -25.42301368713379, "global_step": 260276, "epoch": 3135} {"train_loss": -25.57891845703125, "global_step": 260277, "epoch": 3135} {"train_loss": -25.081724166870117, "global_step": 260278, "epoch": 3135} {"train_loss": -25.266324996948242, "global_step": 260279, "epoch": 3135} {"train_loss": -25.210500717163086, "global_step": 260280, "epoch": 3135} {"train_loss": -25.0293025970459, "global_step": 260281, "epoch": 3135} {"train_loss": -25.27898597717285, "global_step": 260282, "epoch": 3135} {"train_loss": -25.38112449645996, "global_step": 260283, "epoch": 3135} {"train_loss": -24.91499900817871, "global_step": 260284, "epoch": 3135} {"train_loss": -24.981597900390625, "global_step": 260285, "epoch": 3135} {"train_loss": -25.11839485168457, "global_step": 260286, "epoch": 3135} {"train_loss": -25.066246308476092, "global_step": 260287, "epoch": 3135, "val_loss": 6961687.0} {"train_loss": -23.701353073120117, "global_step": 260288, "epoch": 3136} {"train_loss": -23.259164810180664, "global_step": 260289, "epoch": 3136} {"train_loss": -23.824975967407227, "global_step": 260290, "epoch": 3136} {"train_loss": -24.229232788085938, "global_step": 260291, "epoch": 3136} {"train_loss": -24.054351806640625, "global_step": 260292, "epoch": 3136} {"train_loss": -23.949981689453125, "global_step": 260293, "epoch": 3136} {"train_loss": -24.33728790283203, "global_step": 260294, "epoch": 3136} {"train_loss": -24.213037490844727, "global_step": 260295, "epoch": 3136} {"train_loss": -24.90039825439453, "global_step": 260296, "epoch": 3136} {"train_loss": -23.51067543029785, "global_step": 260297, "epoch": 3136} {"train_loss": -24.479969024658203, "global_step": 260298, "epoch": 3136} {"train_loss": -24.71714973449707, "global_step": 260299, "epoch": 3136} {"train_loss": -24.2509708404541, "global_step": 260300, "epoch": 3136} {"train_loss": -24.411354064941406, "global_step": 260301, "epoch": 3136} {"train_loss": -24.949275970458984, "global_step": 260302, "epoch": 3136} {"train_loss": -24.514148712158203, "global_step": 260303, "epoch": 3136} {"train_loss": -24.45362663269043, "global_step": 260304, "epoch": 3136} {"train_loss": -24.714401245117188, "global_step": 260305, "epoch": 3136} {"train_loss": -24.900569915771484, "global_step": 260306, "epoch": 3136} {"train_loss": -24.6346492767334, "global_step": 260307, "epoch": 3136} {"train_loss": -24.890775680541992, "global_step": 260308, "epoch": 3136} {"train_loss": -24.73844337463379, "global_step": 260309, "epoch": 3136} {"train_loss": -24.73777198791504, "global_step": 260310, "epoch": 3136} {"train_loss": -25.034019470214844, "global_step": 260311, "epoch": 3136} {"train_loss": -24.86917495727539, "global_step": 260312, "epoch": 3136} {"train_loss": -24.907367706298828, "global_step": 260313, "epoch": 3136} {"train_loss": -25.0051212310791, "global_step": 260314, "epoch": 3136} {"train_loss": -24.902467727661133, "global_step": 260315, "epoch": 3136} {"train_loss": -25.08493995666504, "global_step": 260316, "epoch": 3136} {"train_loss": -25.150205612182617, "global_step": 260317, "epoch": 3136} {"train_loss": -25.136280059814453, "global_step": 260318, "epoch": 3136} {"train_loss": -24.942529678344727, "global_step": 260319, "epoch": 3136} {"train_loss": -25.274520874023438, "global_step": 260320, "epoch": 3136} {"train_loss": -24.969985961914062, "global_step": 260321, "epoch": 3136} {"train_loss": -25.252302169799805, "global_step": 260322, "epoch": 3136} {"train_loss": -25.355012893676758, "global_step": 260323, "epoch": 3136} {"train_loss": -25.25482940673828, "global_step": 260324, "epoch": 3136} {"train_loss": -25.37403678894043, "global_step": 260325, "epoch": 3136} {"train_loss": -25.162967681884766, "global_step": 260326, "epoch": 3136} {"train_loss": -25.159042358398438, "global_step": 260327, "epoch": 3136} {"train_loss": -25.097135543823242, "global_step": 260328, "epoch": 3136} {"train_loss": -25.353351593017578, "global_step": 260329, "epoch": 3136} {"train_loss": -25.3515625, "global_step": 260330, "epoch": 3136} {"train_loss": -25.0303897857666, "global_step": 260331, "epoch": 3136} {"train_loss": -24.882658004760742, "global_step": 260332, "epoch": 3136} {"train_loss": -25.062437057495117, "global_step": 260333, "epoch": 3136} {"train_loss": -25.199935913085938, "global_step": 260334, "epoch": 3136} {"train_loss": -25.271390914916992, "global_step": 260335, "epoch": 3136} {"train_loss": -25.03363800048828, "global_step": 260336, "epoch": 3136} {"train_loss": -24.642683029174805, "global_step": 260337, "epoch": 3136} {"train_loss": -25.5019588470459, "global_step": 260338, "epoch": 3136} {"train_loss": -25.275196075439453, "global_step": 260339, "epoch": 3136} {"train_loss": -25.359943389892578, "global_step": 260340, "epoch": 3136} {"train_loss": -25.258024215698242, "global_step": 260341, "epoch": 3136} {"train_loss": -25.199081420898438, "global_step": 260342, "epoch": 3136} {"train_loss": -25.055068969726562, "global_step": 260343, "epoch": 3136} {"train_loss": -25.11276626586914, "global_step": 260344, "epoch": 3136} {"train_loss": -25.00946617126465, "global_step": 260345, "epoch": 3136} {"train_loss": -25.169153213500977, "global_step": 260346, "epoch": 3136} {"train_loss": -25.2868709564209, "global_step": 260347, "epoch": 3136} {"train_loss": -24.867965698242188, "global_step": 260348, "epoch": 3136} {"train_loss": -25.44605827331543, "global_step": 260349, "epoch": 3136} {"train_loss": -25.163068771362305, "global_step": 260350, "epoch": 3136} {"train_loss": -25.172643661499023, "global_step": 260351, "epoch": 3136} {"train_loss": -25.176055908203125, "global_step": 260352, "epoch": 3136} {"train_loss": -25.155155181884766, "global_step": 260353, "epoch": 3136} {"train_loss": -25.17683219909668, "global_step": 260354, "epoch": 3136} {"train_loss": -25.11490821838379, "global_step": 260355, "epoch": 3136} {"train_loss": -25.262182235717773, "global_step": 260356, "epoch": 3136} {"train_loss": -25.229202270507812, "global_step": 260357, "epoch": 3136} {"train_loss": -25.12057113647461, "global_step": 260358, "epoch": 3136} {"train_loss": -25.414161682128906, "global_step": 260359, "epoch": 3136} {"train_loss": -25.33003044128418, "global_step": 260360, "epoch": 3136} {"train_loss": -25.176681518554688, "global_step": 260361, "epoch": 3136} {"train_loss": -25.129074096679688, "global_step": 260362, "epoch": 3136} {"train_loss": -25.290428161621094, "global_step": 260363, "epoch": 3136} {"train_loss": -25.092111587524414, "global_step": 260364, "epoch": 3136} {"train_loss": -25.23552894592285, "global_step": 260365, "epoch": 3136} {"train_loss": -25.16934585571289, "global_step": 260366, "epoch": 3136} {"train_loss": -25.369577407836914, "global_step": 260367, "epoch": 3136} {"train_loss": -25.37605094909668, "global_step": 260368, "epoch": 3136} {"train_loss": -25.20144271850586, "global_step": 260369, "epoch": 3136} {"train_loss": -24.931016990937383, "global_step": 260370, "epoch": 3136, "val_loss": 7140033.0} {"train_loss": -24.37151527404785, "global_step": 260371, "epoch": 3137} {"train_loss": -23.525976181030273, "global_step": 260372, "epoch": 3137} {"train_loss": -24.67440414428711, "global_step": 260373, "epoch": 3137} {"train_loss": -24.600793838500977, "global_step": 260374, "epoch": 3137} {"train_loss": -25.2752685546875, "global_step": 260375, "epoch": 3137} {"train_loss": -24.869871139526367, "global_step": 260376, "epoch": 3137} {"train_loss": -24.84372329711914, "global_step": 260377, "epoch": 3137} {"train_loss": -25.32383155822754, "global_step": 260378, "epoch": 3137} {"train_loss": -25.030942916870117, "global_step": 260379, "epoch": 3137} {"train_loss": -24.715909957885742, "global_step": 260380, "epoch": 3137} {"train_loss": -25.17742919921875, "global_step": 260381, "epoch": 3137} {"train_loss": -24.66035270690918, "global_step": 260382, "epoch": 3137} {"train_loss": -24.800107955932617, "global_step": 260383, "epoch": 3137} {"train_loss": -24.519332885742188, "global_step": 260384, "epoch": 3137} {"train_loss": -25.130863189697266, "global_step": 260385, "epoch": 3137} {"train_loss": -25.1114501953125, "global_step": 260386, "epoch": 3137} {"train_loss": -24.91013526916504, "global_step": 260387, "epoch": 3137} {"train_loss": -25.286548614501953, "global_step": 260388, "epoch": 3137} {"train_loss": -25.302997589111328, "global_step": 260389, "epoch": 3137} {"train_loss": -24.957366943359375, "global_step": 260390, "epoch": 3137} {"train_loss": -24.67473793029785, "global_step": 260391, "epoch": 3137} {"train_loss": -24.83221435546875, "global_step": 260392, "epoch": 3137} {"train_loss": -25.045726776123047, "global_step": 260393, "epoch": 3137} {"train_loss": -24.87135887145996, "global_step": 260394, "epoch": 3137} {"train_loss": -25.27332305908203, "global_step": 260395, "epoch": 3137} {"train_loss": -25.206501007080078, "global_step": 260396, "epoch": 3137} {"train_loss": -25.07976722717285, "global_step": 260397, "epoch": 3137} {"train_loss": -25.131290435791016, "global_step": 260398, "epoch": 3137} {"train_loss": -25.15582275390625, "global_step": 260399, "epoch": 3137} {"train_loss": -25.1910457611084, "global_step": 260400, "epoch": 3137} {"train_loss": -25.637609481811523, "global_step": 260401, "epoch": 3137} {"train_loss": -25.4002628326416, "global_step": 260402, "epoch": 3137} {"train_loss": -25.313749313354492, "global_step": 260403, "epoch": 3137} {"train_loss": -25.3837890625, "global_step": 260404, "epoch": 3137} {"train_loss": -25.27680778503418, "global_step": 260405, "epoch": 3137} {"train_loss": -25.312923431396484, "global_step": 260406, "epoch": 3137} {"train_loss": -25.001325607299805, "global_step": 260407, "epoch": 3137} {"train_loss": -24.87405014038086, "global_step": 260408, "epoch": 3137} {"train_loss": -25.1097412109375, "global_step": 260409, "epoch": 3137} {"train_loss": -25.15596580505371, "global_step": 260410, "epoch": 3137} {"train_loss": -25.039426803588867, "global_step": 260411, "epoch": 3137} {"train_loss": -25.37935447692871, "global_step": 260412, "epoch": 3137} {"train_loss": -25.348474502563477, "global_step": 260413, "epoch": 3137} {"train_loss": -25.139432907104492, "global_step": 260414, "epoch": 3137} {"train_loss": -25.385196685791016, "global_step": 260415, "epoch": 3137} {"train_loss": -25.387277603149414, "global_step": 260416, "epoch": 3137} {"train_loss": -25.749937057495117, "global_step": 260417, "epoch": 3137} {"train_loss": -25.085861206054688, "global_step": 260418, "epoch": 3137} {"train_loss": -25.428808212280273, "global_step": 260419, "epoch": 3137} {"train_loss": -25.027341842651367, "global_step": 260420, "epoch": 3137} {"train_loss": -25.66364097595215, "global_step": 260421, "epoch": 3137} {"train_loss": -24.851516723632812, "global_step": 260422, "epoch": 3137} {"train_loss": -25.086660385131836, "global_step": 260423, "epoch": 3137} {"train_loss": -25.042722702026367, "global_step": 260424, "epoch": 3137} {"train_loss": -25.404701232910156, "global_step": 260425, "epoch": 3137} {"train_loss": -25.589275360107422, "global_step": 260426, "epoch": 3137} {"train_loss": -25.39845085144043, "global_step": 260427, "epoch": 3137} {"train_loss": -25.103139877319336, "global_step": 260428, "epoch": 3137} {"train_loss": -25.21463394165039, "global_step": 260429, "epoch": 3137} {"train_loss": -25.425634384155273, "global_step": 260430, "epoch": 3137} {"train_loss": -25.115217208862305, "global_step": 260431, "epoch": 3137} {"train_loss": -25.598608016967773, "global_step": 260432, "epoch": 3137} {"train_loss": -25.56130027770996, "global_step": 260433, "epoch": 3137} {"train_loss": -25.442930221557617, "global_step": 260434, "epoch": 3137} {"train_loss": -25.51889419555664, "global_step": 260435, "epoch": 3137} {"train_loss": -25.338773727416992, "global_step": 260436, "epoch": 3137} {"train_loss": -25.092283248901367, "global_step": 260437, "epoch": 3137} {"train_loss": -24.974143981933594, "global_step": 260438, "epoch": 3137} {"train_loss": -25.31337547302246, "global_step": 260439, "epoch": 3137} {"train_loss": -24.972341537475586, "global_step": 260440, "epoch": 3137} {"train_loss": -24.959182739257812, "global_step": 260441, "epoch": 3137} {"train_loss": -25.398584365844727, "global_step": 260442, "epoch": 3137} {"train_loss": -25.236722946166992, "global_step": 260443, "epoch": 3137} {"train_loss": -25.122480392456055, "global_step": 260444, "epoch": 3137} {"train_loss": -25.221607208251953, "global_step": 260445, "epoch": 3137} {"train_loss": -25.42753791809082, "global_step": 260446, "epoch": 3137} {"train_loss": -25.158950805664062, "global_step": 260447, "epoch": 3137} {"train_loss": -25.284595489501953, "global_step": 260448, "epoch": 3137} {"train_loss": -25.00213623046875, "global_step": 260449, "epoch": 3137} {"train_loss": -25.189802169799805, "global_step": 260450, "epoch": 3137} {"train_loss": -25.05479621887207, "global_step": 260451, "epoch": 3137} {"train_loss": -25.197362899780273, "global_step": 260452, "epoch": 3137} {"train_loss": -25.1314083926649, "global_step": 260453, "epoch": 3137, "val_loss": 6995989.0} {"train_loss": -24.501176834106445, "global_step": 260454, "epoch": 3138} {"train_loss": -25.2286434173584, "global_step": 260455, "epoch": 3138} {"train_loss": -25.18528938293457, "global_step": 260456, "epoch": 3138} {"train_loss": -25.002103805541992, "global_step": 260457, "epoch": 3138} {"train_loss": -24.701873779296875, "global_step": 260458, "epoch": 3138} {"train_loss": -24.730226516723633, "global_step": 260459, "epoch": 3138} {"train_loss": -25.224924087524414, "global_step": 260460, "epoch": 3138} {"train_loss": -24.87807273864746, "global_step": 260461, "epoch": 3138} {"train_loss": -25.1381778717041, "global_step": 260462, "epoch": 3138} {"train_loss": -24.78143882751465, "global_step": 260463, "epoch": 3138} {"train_loss": -25.173410415649414, "global_step": 260464, "epoch": 3138} {"train_loss": -25.032814025878906, "global_step": 260465, "epoch": 3138} {"train_loss": -25.1439151763916, "global_step": 260466, "epoch": 3138} {"train_loss": -25.282468795776367, "global_step": 260467, "epoch": 3138} {"train_loss": -24.835599899291992, "global_step": 260468, "epoch": 3138} {"train_loss": -25.01943016052246, "global_step": 260469, "epoch": 3138} {"train_loss": -25.32013702392578, "global_step": 260470, "epoch": 3138} {"train_loss": -25.13734245300293, "global_step": 260471, "epoch": 3138} {"train_loss": -25.258424758911133, "global_step": 260472, "epoch": 3138} {"train_loss": -24.686796188354492, "global_step": 260473, "epoch": 3138} {"train_loss": -25.5364990234375, "global_step": 260474, "epoch": 3138} {"train_loss": -25.38568687438965, "global_step": 260475, "epoch": 3138} {"train_loss": -25.03194236755371, "global_step": 260476, "epoch": 3138} {"train_loss": -25.488262176513672, "global_step": 260477, "epoch": 3138} {"train_loss": -24.940610885620117, "global_step": 260478, "epoch": 3138} {"train_loss": -25.607501983642578, "global_step": 260479, "epoch": 3138} {"train_loss": -25.3179988861084, "global_step": 260480, "epoch": 3138} {"train_loss": -25.435400009155273, "global_step": 260481, "epoch": 3138} {"train_loss": -24.942861557006836, "global_step": 260482, "epoch": 3138} {"train_loss": -25.434873580932617, "global_step": 260483, "epoch": 3138} {"train_loss": -25.14101219177246, "global_step": 260484, "epoch": 3138} {"train_loss": -25.12874412536621, "global_step": 260485, "epoch": 3138} {"train_loss": -25.35963249206543, "global_step": 260486, "epoch": 3138} {"train_loss": -24.9383602142334, "global_step": 260487, "epoch": 3138} {"train_loss": -25.361804962158203, "global_step": 260488, "epoch": 3138} {"train_loss": -25.0788516998291, "global_step": 260489, "epoch": 3138} {"train_loss": -25.0203800201416, "global_step": 260490, "epoch": 3138} {"train_loss": -24.898561477661133, "global_step": 260491, "epoch": 3138} {"train_loss": -25.078054428100586, "global_step": 260492, "epoch": 3138} {"train_loss": -24.914188385009766, "global_step": 260493, "epoch": 3138} {"train_loss": -25.321937561035156, "global_step": 260494, "epoch": 3138} {"train_loss": -25.67841148376465, "global_step": 260495, "epoch": 3138} {"train_loss": -25.073781967163086, "global_step": 260496, "epoch": 3138} {"train_loss": -25.35248565673828, "global_step": 260497, "epoch": 3138} {"train_loss": -25.27843475341797, "global_step": 260498, "epoch": 3138} {"train_loss": -25.416654586791992, "global_step": 260499, "epoch": 3138} {"train_loss": -24.884992599487305, "global_step": 260500, "epoch": 3138} {"train_loss": -25.34303092956543, "global_step": 260501, "epoch": 3138} {"train_loss": -25.40252685546875, "global_step": 260502, "epoch": 3138} {"train_loss": -25.3364200592041, "global_step": 260503, "epoch": 3138} {"train_loss": -25.22469139099121, "global_step": 260504, "epoch": 3138} {"train_loss": -25.100849151611328, "global_step": 260505, "epoch": 3138} {"train_loss": -25.35849952697754, "global_step": 260506, "epoch": 3138} {"train_loss": -25.232885360717773, "global_step": 260507, "epoch": 3138} {"train_loss": -25.310115814208984, "global_step": 260508, "epoch": 3138} {"train_loss": -25.18882942199707, "global_step": 260509, "epoch": 3138} {"train_loss": -25.079370498657227, "global_step": 260510, "epoch": 3138} {"train_loss": -25.059432983398438, "global_step": 260511, "epoch": 3138} {"train_loss": -25.121505737304688, "global_step": 260512, "epoch": 3138} {"train_loss": -25.269100189208984, "global_step": 260513, "epoch": 3138} {"train_loss": -25.37667465209961, "global_step": 260514, "epoch": 3138} {"train_loss": -25.75261878967285, "global_step": 260515, "epoch": 3138} {"train_loss": -25.170015335083008, "global_step": 260516, "epoch": 3138} {"train_loss": -25.066328048706055, "global_step": 260517, "epoch": 3138} {"train_loss": -25.09779930114746, "global_step": 260518, "epoch": 3138} {"train_loss": -25.228635787963867, "global_step": 260519, "epoch": 3138} {"train_loss": -24.7742862701416, "global_step": 260520, "epoch": 3138} {"train_loss": -25.11970329284668, "global_step": 260521, "epoch": 3138} {"train_loss": -24.880783081054688, "global_step": 260522, "epoch": 3138} {"train_loss": -24.934112548828125, "global_step": 260523, "epoch": 3138} {"train_loss": -24.533597946166992, "global_step": 260524, "epoch": 3138} {"train_loss": -25.08877944946289, "global_step": 260525, "epoch": 3138} {"train_loss": -25.10442543029785, "global_step": 260526, "epoch": 3138} {"train_loss": -25.168502807617188, "global_step": 260527, "epoch": 3138} {"train_loss": -25.32431411743164, "global_step": 260528, "epoch": 3138} {"train_loss": -25.083852767944336, "global_step": 260529, "epoch": 3138} {"train_loss": -25.116783142089844, "global_step": 260530, "epoch": 3138} {"train_loss": -24.837158203125, "global_step": 260531, "epoch": 3138} {"train_loss": -24.771835327148438, "global_step": 260532, "epoch": 3138} {"train_loss": -25.219314575195312, "global_step": 260533, "epoch": 3138} {"train_loss": -24.915847778320312, "global_step": 260534, "epoch": 3138} {"train_loss": -24.62541389465332, "global_step": 260535, "epoch": 3138} {"train_loss": -25.127959079053028, "global_step": 260536, "epoch": 3138, "val_loss": 6999095.0} {"train_loss": -24.78104591369629, "global_step": 260537, "epoch": 3139} {"train_loss": -24.535797119140625, "global_step": 260538, "epoch": 3139} {"train_loss": -23.96528434753418, "global_step": 260539, "epoch": 3139} {"train_loss": -24.264545440673828, "global_step": 260540, "epoch": 3139} {"train_loss": -24.8912410736084, "global_step": 260541, "epoch": 3139} {"train_loss": -24.72743797302246, "global_step": 260542, "epoch": 3139} {"train_loss": -24.313079833984375, "global_step": 260543, "epoch": 3139} {"train_loss": -24.41190528869629, "global_step": 260544, "epoch": 3139} {"train_loss": -24.789438247680664, "global_step": 260545, "epoch": 3139} {"train_loss": -24.623756408691406, "global_step": 260546, "epoch": 3139} {"train_loss": -24.854385375976562, "global_step": 260547, "epoch": 3139} {"train_loss": -24.813352584838867, "global_step": 260548, "epoch": 3139} {"train_loss": -25.06647300720215, "global_step": 260549, "epoch": 3139} {"train_loss": -24.686063766479492, "global_step": 260550, "epoch": 3139} {"train_loss": -25.048765182495117, "global_step": 260551, "epoch": 3139} {"train_loss": -25.06908416748047, "global_step": 260552, "epoch": 3139} {"train_loss": -24.920202255249023, "global_step": 260553, "epoch": 3139} {"train_loss": -25.035614013671875, "global_step": 260554, "epoch": 3139} {"train_loss": -24.987943649291992, "global_step": 260555, "epoch": 3139} {"train_loss": -25.333477020263672, "global_step": 260556, "epoch": 3139} {"train_loss": -25.1192626953125, "global_step": 260557, "epoch": 3139} {"train_loss": -24.782459259033203, "global_step": 260558, "epoch": 3139} {"train_loss": -24.888269424438477, "global_step": 260559, "epoch": 3139} {"train_loss": -24.791433334350586, "global_step": 260560, "epoch": 3139} {"train_loss": -25.54884147644043, "global_step": 260561, "epoch": 3139} {"train_loss": -25.185810089111328, "global_step": 260562, "epoch": 3139} {"train_loss": -25.474973678588867, "global_step": 260563, "epoch": 3139} {"train_loss": -25.418317794799805, "global_step": 260564, "epoch": 3139} {"train_loss": -25.333269119262695, "global_step": 260565, "epoch": 3139} {"train_loss": -25.00782585144043, "global_step": 260566, "epoch": 3139} {"train_loss": -25.10685157775879, "global_step": 260567, "epoch": 3139} {"train_loss": -25.314542770385742, "global_step": 260568, "epoch": 3139} {"train_loss": -25.28611183166504, "global_step": 260569, "epoch": 3139} {"train_loss": -25.14105224609375, "global_step": 260570, "epoch": 3139} {"train_loss": -25.29634666442871, "global_step": 260571, "epoch": 3139} {"train_loss": -25.156879425048828, "global_step": 260572, "epoch": 3139} {"train_loss": -25.24598503112793, "global_step": 260573, "epoch": 3139} {"train_loss": -25.187850952148438, "global_step": 260574, "epoch": 3139} {"train_loss": -25.311782836914062, "global_step": 260575, "epoch": 3139} {"train_loss": -25.297061920166016, "global_step": 260576, "epoch": 3139} {"train_loss": -25.888879776000977, "global_step": 260577, "epoch": 3139} {"train_loss": -24.862197875976562, "global_step": 260578, "epoch": 3139} {"train_loss": -25.244089126586914, "global_step": 260579, "epoch": 3139} {"train_loss": -25.41299819946289, "global_step": 260580, "epoch": 3139} {"train_loss": -24.959457397460938, "global_step": 260581, "epoch": 3139} {"train_loss": -25.52138328552246, "global_step": 260582, "epoch": 3139} {"train_loss": -25.111066818237305, "global_step": 260583, "epoch": 3139} {"train_loss": -24.886030197143555, "global_step": 260584, "epoch": 3139} {"train_loss": -25.293354034423828, "global_step": 260585, "epoch": 3139} {"train_loss": -25.260316848754883, "global_step": 260586, "epoch": 3139} {"train_loss": -25.466611862182617, "global_step": 260587, "epoch": 3139} {"train_loss": -25.232086181640625, "global_step": 260588, "epoch": 3139} {"train_loss": -25.20961570739746, "global_step": 260589, "epoch": 3139} {"train_loss": -25.562856674194336, "global_step": 260590, "epoch": 3139} {"train_loss": -25.237064361572266, "global_step": 260591, "epoch": 3139} {"train_loss": -25.093366622924805, "global_step": 260592, "epoch": 3139} {"train_loss": -25.276962280273438, "global_step": 260593, "epoch": 3139} {"train_loss": -25.248769760131836, "global_step": 260594, "epoch": 3139} {"train_loss": -25.368925094604492, "global_step": 260595, "epoch": 3139} {"train_loss": -25.287351608276367, "global_step": 260596, "epoch": 3139} {"train_loss": -25.319257736206055, "global_step": 260597, "epoch": 3139} {"train_loss": -24.968753814697266, "global_step": 260598, "epoch": 3139} {"train_loss": -25.53826332092285, "global_step": 260599, "epoch": 3139} {"train_loss": -25.106008529663086, "global_step": 260600, "epoch": 3139} {"train_loss": -24.929407119750977, "global_step": 260601, "epoch": 3139} {"train_loss": -25.16043472290039, "global_step": 260602, "epoch": 3139} {"train_loss": -24.736942291259766, "global_step": 260603, "epoch": 3139} {"train_loss": -25.038930892944336, "global_step": 260604, "epoch": 3139} {"train_loss": -24.710973739624023, "global_step": 260605, "epoch": 3139} {"train_loss": -24.371091842651367, "global_step": 260606, "epoch": 3139} {"train_loss": -24.948589324951172, "global_step": 260607, "epoch": 3139} {"train_loss": -25.335128784179688, "global_step": 260608, "epoch": 3139} {"train_loss": -24.998762130737305, "global_step": 260609, "epoch": 3139} {"train_loss": -24.804309844970703, "global_step": 260610, "epoch": 3139} {"train_loss": -24.86918067932129, "global_step": 260611, "epoch": 3139} {"train_loss": -24.797649383544922, "global_step": 260612, "epoch": 3139} {"train_loss": -25.1865234375, "global_step": 260613, "epoch": 3139} {"train_loss": -24.69477653503418, "global_step": 260614, "epoch": 3139} {"train_loss": -24.99982452392578, "global_step": 260615, "epoch": 3139} {"train_loss": -25.257959365844727, "global_step": 260616, "epoch": 3139} {"train_loss": -24.98438262939453, "global_step": 260617, "epoch": 3139} {"train_loss": -24.85707664489746, "global_step": 260618, "epoch": 3139} {"train_loss": -25.047834695103656, "global_step": 260619, "epoch": 3139, "val_loss": 6925253.0} {"train_loss": -24.874605178833008, "global_step": 260620, "epoch": 3140} {"train_loss": -24.68983268737793, "global_step": 260621, "epoch": 3140} {"train_loss": -24.643798828125, "global_step": 260622, "epoch": 3140} {"train_loss": -24.883909225463867, "global_step": 260623, "epoch": 3140} {"train_loss": -24.60491371154785, "global_step": 260624, "epoch": 3140} {"train_loss": -24.872697830200195, "global_step": 260625, "epoch": 3140} {"train_loss": -24.47237205505371, "global_step": 260626, "epoch": 3140} {"train_loss": -24.59256362915039, "global_step": 260627, "epoch": 3140} {"train_loss": -24.92946434020996, "global_step": 260628, "epoch": 3140} {"train_loss": -24.797658920288086, "global_step": 260629, "epoch": 3140} {"train_loss": -24.88894271850586, "global_step": 260630, "epoch": 3140} {"train_loss": -25.226728439331055, "global_step": 260631, "epoch": 3140} {"train_loss": -25.076936721801758, "global_step": 260632, "epoch": 3140} {"train_loss": -24.696365356445312, "global_step": 260633, "epoch": 3140} {"train_loss": -24.919391632080078, "global_step": 260634, "epoch": 3140} {"train_loss": -25.191776275634766, "global_step": 260635, "epoch": 3140} {"train_loss": -25.12642478942871, "global_step": 260636, "epoch": 3140} {"train_loss": -24.934032440185547, "global_step": 260637, "epoch": 3140} {"train_loss": -24.87153434753418, "global_step": 260638, "epoch": 3140} {"train_loss": -24.93715476989746, "global_step": 260639, "epoch": 3140} {"train_loss": -25.190473556518555, "global_step": 260640, "epoch": 3140} {"train_loss": -24.889297485351562, "global_step": 260641, "epoch": 3140} {"train_loss": -25.128019332885742, "global_step": 260642, "epoch": 3140} {"train_loss": -25.108755111694336, "global_step": 260643, "epoch": 3140} {"train_loss": -25.13108253479004, "global_step": 260644, "epoch": 3140} {"train_loss": -25.244199752807617, "global_step": 260645, "epoch": 3140} {"train_loss": -25.223907470703125, "global_step": 260646, "epoch": 3140} {"train_loss": -25.332427978515625, "global_step": 260647, "epoch": 3140} {"train_loss": -25.140928268432617, "global_step": 260648, "epoch": 3140} {"train_loss": -24.986108779907227, "global_step": 260649, "epoch": 3140} {"train_loss": -25.018705368041992, "global_step": 260650, "epoch": 3140} {"train_loss": -24.965591430664062, "global_step": 260651, "epoch": 3140} {"train_loss": -25.0674991607666, "global_step": 260652, "epoch": 3140} {"train_loss": -25.4453067779541, "global_step": 260653, "epoch": 3140} {"train_loss": -25.047292709350586, "global_step": 260654, "epoch": 3140} {"train_loss": -25.406103134155273, "global_step": 260655, "epoch": 3140} {"train_loss": -24.919363021850586, "global_step": 260656, "epoch": 3140} {"train_loss": -25.575719833374023, "global_step": 260657, "epoch": 3140} {"train_loss": -25.476720809936523, "global_step": 260658, "epoch": 3140} {"train_loss": -25.03550148010254, "global_step": 260659, "epoch": 3140} {"train_loss": -25.361042022705078, "global_step": 260660, "epoch": 3140} {"train_loss": -25.215866088867188, "global_step": 260661, "epoch": 3140} {"train_loss": -25.03890609741211, "global_step": 260662, "epoch": 3140} {"train_loss": -25.104663848876953, "global_step": 260663, "epoch": 3140} {"train_loss": -25.123428344726562, "global_step": 260664, "epoch": 3140} {"train_loss": -25.064760208129883, "global_step": 260665, "epoch": 3140} {"train_loss": -25.454130172729492, "global_step": 260666, "epoch": 3140} {"train_loss": -24.96479606628418, "global_step": 260667, "epoch": 3140} {"train_loss": -25.60310935974121, "global_step": 260668, "epoch": 3140} {"train_loss": -25.170475006103516, "global_step": 260669, "epoch": 3140} {"train_loss": -25.126712799072266, "global_step": 260670, "epoch": 3140} {"train_loss": -25.463560104370117, "global_step": 260671, "epoch": 3140} {"train_loss": -25.2515869140625, "global_step": 260672, "epoch": 3140} {"train_loss": -24.972410202026367, "global_step": 260673, "epoch": 3140} {"train_loss": -25.285022735595703, "global_step": 260674, "epoch": 3140} {"train_loss": -25.284902572631836, "global_step": 260675, "epoch": 3140} {"train_loss": -25.281553268432617, "global_step": 260676, "epoch": 3140} {"train_loss": -25.25373649597168, "global_step": 260677, "epoch": 3140} {"train_loss": -25.298181533813477, "global_step": 260678, "epoch": 3140} {"train_loss": -25.33995246887207, "global_step": 260679, "epoch": 3140} {"train_loss": -24.39678955078125, "global_step": 260680, "epoch": 3140} {"train_loss": -24.36395835876465, "global_step": 260681, "epoch": 3140} {"train_loss": -25.00068473815918, "global_step": 260682, "epoch": 3140} {"train_loss": -24.88234519958496, "global_step": 260683, "epoch": 3140} {"train_loss": -25.060007095336914, "global_step": 260684, "epoch": 3140} {"train_loss": -24.865652084350586, "global_step": 260685, "epoch": 3140} {"train_loss": -24.775285720825195, "global_step": 260686, "epoch": 3140} {"train_loss": -25.007505416870117, "global_step": 260687, "epoch": 3140} {"train_loss": -24.923200607299805, "global_step": 260688, "epoch": 3140} {"train_loss": -24.518436431884766, "global_step": 260689, "epoch": 3140} {"train_loss": -24.794570922851562, "global_step": 260690, "epoch": 3140} {"train_loss": -24.8195858001709, "global_step": 260691, "epoch": 3140} {"train_loss": -24.508981704711914, "global_step": 260692, "epoch": 3140} {"train_loss": -25.35753059387207, "global_step": 260693, "epoch": 3140} {"train_loss": -25.029813766479492, "global_step": 260694, "epoch": 3140} {"train_loss": -25.182905197143555, "global_step": 260695, "epoch": 3140} {"train_loss": -25.05470085144043, "global_step": 260696, "epoch": 3140} {"train_loss": -25.139638900756836, "global_step": 260697, "epoch": 3140} {"train_loss": -25.030410766601562, "global_step": 260698, "epoch": 3140} {"train_loss": -25.129901885986328, "global_step": 260699, "epoch": 3140} {"train_loss": -25.11115074157715, "global_step": 260700, "epoch": 3140} {"train_loss": -25.34482765197754, "global_step": 260701, "epoch": 3140} {"train_loss": -25.04720292608422, "global_step": 260702, "epoch": 3140, "val_loss": 7016247.0} {"train_loss": -24.76216697692871, "global_step": 260703, "epoch": 3141} {"train_loss": -25.12265968322754, "global_step": 260704, "epoch": 3141} {"train_loss": -25.097013473510742, "global_step": 260705, "epoch": 3141} {"train_loss": -24.68951416015625, "global_step": 260706, "epoch": 3141} {"train_loss": -24.9628963470459, "global_step": 260707, "epoch": 3141} {"train_loss": -24.790882110595703, "global_step": 260708, "epoch": 3141} {"train_loss": -25.16252326965332, "global_step": 260709, "epoch": 3141} {"train_loss": -25.08732795715332, "global_step": 260710, "epoch": 3141} {"train_loss": -24.973636627197266, "global_step": 260711, "epoch": 3141} {"train_loss": -25.1335391998291, "global_step": 260712, "epoch": 3141} {"train_loss": -25.14234161376953, "global_step": 260713, "epoch": 3141} {"train_loss": -24.674394607543945, "global_step": 260714, "epoch": 3141} {"train_loss": -25.213825225830078, "global_step": 260715, "epoch": 3141} {"train_loss": -25.34169578552246, "global_step": 260716, "epoch": 3141} {"train_loss": -24.951642990112305, "global_step": 260717, "epoch": 3141} {"train_loss": -25.036285400390625, "global_step": 260718, "epoch": 3141} {"train_loss": -25.354318618774414, "global_step": 260719, "epoch": 3141} {"train_loss": -24.942228317260742, "global_step": 260720, "epoch": 3141} {"train_loss": -24.917987823486328, "global_step": 260721, "epoch": 3141} {"train_loss": -24.941946029663086, "global_step": 260722, "epoch": 3141} {"train_loss": -25.395681381225586, "global_step": 260723, "epoch": 3141} {"train_loss": -25.514053344726562, "global_step": 260724, "epoch": 3141} {"train_loss": -24.95253562927246, "global_step": 260725, "epoch": 3141} {"train_loss": -25.141172409057617, "global_step": 260726, "epoch": 3141} {"train_loss": -25.209701538085938, "global_step": 260727, "epoch": 3141} {"train_loss": -25.365224838256836, "global_step": 260728, "epoch": 3141} {"train_loss": -25.1667537689209, "global_step": 260729, "epoch": 3141} {"train_loss": -25.418745040893555, "global_step": 260730, "epoch": 3141} {"train_loss": -25.18060874938965, "global_step": 260731, "epoch": 3141} {"train_loss": -25.45104217529297, "global_step": 260732, "epoch": 3141} {"train_loss": -25.47560691833496, "global_step": 260733, "epoch": 3141} {"train_loss": -25.471128463745117, "global_step": 260734, "epoch": 3141} {"train_loss": -25.361114501953125, "global_step": 260735, "epoch": 3141} {"train_loss": -25.13262939453125, "global_step": 260736, "epoch": 3141} {"train_loss": -25.275556564331055, "global_step": 260737, "epoch": 3141} {"train_loss": -25.132810592651367, "global_step": 260738, "epoch": 3141} {"train_loss": -25.030746459960938, "global_step": 260739, "epoch": 3141} {"train_loss": -25.166181564331055, "global_step": 260740, "epoch": 3141} {"train_loss": -25.413022994995117, "global_step": 260741, "epoch": 3141} {"train_loss": -25.619979858398438, "global_step": 260742, "epoch": 3141} {"train_loss": -25.633352279663086, "global_step": 260743, "epoch": 3141} {"train_loss": -25.07605743408203, "global_step": 260744, "epoch": 3141} {"train_loss": -25.32217025756836, "global_step": 260745, "epoch": 3141} {"train_loss": -25.509408950805664, "global_step": 260746, "epoch": 3141} {"train_loss": -25.6275634765625, "global_step": 260747, "epoch": 3141} {"train_loss": -25.564496994018555, "global_step": 260748, "epoch": 3141} {"train_loss": -25.392772674560547, "global_step": 260749, "epoch": 3141} {"train_loss": -25.191333770751953, "global_step": 260750, "epoch": 3141} {"train_loss": -25.46495246887207, "global_step": 260751, "epoch": 3141} {"train_loss": -25.043663024902344, "global_step": 260752, "epoch": 3141} {"train_loss": -24.645254135131836, "global_step": 260753, "epoch": 3141} {"train_loss": -24.88808822631836, "global_step": 260754, "epoch": 3141} {"train_loss": -25.194595336914062, "global_step": 260755, "epoch": 3141} {"train_loss": -24.98404312133789, "global_step": 260756, "epoch": 3141} {"train_loss": -25.103126525878906, "global_step": 260757, "epoch": 3141} {"train_loss": -24.88227653503418, "global_step": 260758, "epoch": 3141} {"train_loss": -25.09172821044922, "global_step": 260759, "epoch": 3141} {"train_loss": -25.69707679748535, "global_step": 260760, "epoch": 3141} {"train_loss": -25.163211822509766, "global_step": 260761, "epoch": 3141} {"train_loss": -25.033933639526367, "global_step": 260762, "epoch": 3141} {"train_loss": -25.102590560913086, "global_step": 260763, "epoch": 3141} {"train_loss": -25.373119354248047, "global_step": 260764, "epoch": 3141} {"train_loss": -25.339540481567383, "global_step": 260765, "epoch": 3141} {"train_loss": -25.232196807861328, "global_step": 260766, "epoch": 3141} {"train_loss": -25.084768295288086, "global_step": 260767, "epoch": 3141} {"train_loss": -25.203622817993164, "global_step": 260768, "epoch": 3141} {"train_loss": -25.063785552978516, "global_step": 260769, "epoch": 3141} {"train_loss": -25.505971908569336, "global_step": 260770, "epoch": 3141} {"train_loss": -25.03059196472168, "global_step": 260771, "epoch": 3141} {"train_loss": -25.296796798706055, "global_step": 260772, "epoch": 3141} {"train_loss": -24.67194938659668, "global_step": 260773, "epoch": 3141} {"train_loss": -25.057645797729492, "global_step": 260774, "epoch": 3141} {"train_loss": -25.185758590698242, "global_step": 260775, "epoch": 3141} {"train_loss": -25.24576759338379, "global_step": 260776, "epoch": 3141} {"train_loss": -24.927398681640625, "global_step": 260777, "epoch": 3141} {"train_loss": -25.373788833618164, "global_step": 260778, "epoch": 3141} {"train_loss": -25.424732208251953, "global_step": 260779, "epoch": 3141} {"train_loss": -24.822847366333008, "global_step": 260780, "epoch": 3141} {"train_loss": -25.503786087036133, "global_step": 260781, "epoch": 3141} {"train_loss": -25.690052032470703, "global_step": 260782, "epoch": 3141} {"train_loss": -25.26782989501953, "global_step": 260783, "epoch": 3141} {"train_loss": -25.12406349182129, "global_step": 260784, "epoch": 3141} {"train_loss": -25.181770807289215, "global_step": 260785, "epoch": 3141, "val_loss": 6968860.0} {"train_loss": -23.313512802124023, "global_step": 260786, "epoch": 3142} {"train_loss": -24.164764404296875, "global_step": 260787, "epoch": 3142} {"train_loss": -24.52849578857422, "global_step": 260788, "epoch": 3142} {"train_loss": -23.70529556274414, "global_step": 260789, "epoch": 3142} {"train_loss": -24.14728355407715, "global_step": 260790, "epoch": 3142} {"train_loss": -23.977277755737305, "global_step": 260791, "epoch": 3142} {"train_loss": -24.55047607421875, "global_step": 260792, "epoch": 3142} {"train_loss": -24.447891235351562, "global_step": 260793, "epoch": 3142} {"train_loss": -24.41962242126465, "global_step": 260794, "epoch": 3142} {"train_loss": -24.753149032592773, "global_step": 260795, "epoch": 3142} {"train_loss": -24.771677017211914, "global_step": 260796, "epoch": 3142} {"train_loss": -24.415693283081055, "global_step": 260797, "epoch": 3142} {"train_loss": -24.658716201782227, "global_step": 260798, "epoch": 3142} {"train_loss": -24.439916610717773, "global_step": 260799, "epoch": 3142} {"train_loss": -24.47589683532715, "global_step": 260800, "epoch": 3142} {"train_loss": -24.489267349243164, "global_step": 260801, "epoch": 3142} {"train_loss": -24.548261642456055, "global_step": 260802, "epoch": 3142} {"train_loss": -24.6428279876709, "global_step": 260803, "epoch": 3142} {"train_loss": -24.890216827392578, "global_step": 260804, "epoch": 3142} {"train_loss": -25.047277450561523, "global_step": 260805, "epoch": 3142} {"train_loss": -25.067880630493164, "global_step": 260806, "epoch": 3142} {"train_loss": -25.038888931274414, "global_step": 260807, "epoch": 3142} {"train_loss": -24.80437660217285, "global_step": 260808, "epoch": 3142} {"train_loss": -24.92633056640625, "global_step": 260809, "epoch": 3142} {"train_loss": -25.101163864135742, "global_step": 260810, "epoch": 3142} {"train_loss": -24.655948638916016, "global_step": 260811, "epoch": 3142} {"train_loss": -25.039594650268555, "global_step": 260812, "epoch": 3142} {"train_loss": -24.82415199279785, "global_step": 260813, "epoch": 3142} {"train_loss": -24.737974166870117, "global_step": 260814, "epoch": 3142} {"train_loss": -25.27079200744629, "global_step": 260815, "epoch": 3142} {"train_loss": -24.88020896911621, "global_step": 260816, "epoch": 3142} {"train_loss": -25.048954010009766, "global_step": 260817, "epoch": 3142} {"train_loss": -24.946502685546875, "global_step": 260818, "epoch": 3142} {"train_loss": -24.76578140258789, "global_step": 260819, "epoch": 3142} {"train_loss": -25.13964080810547, "global_step": 260820, "epoch": 3142} {"train_loss": -25.30585289001465, "global_step": 260821, "epoch": 3142} {"train_loss": -25.304685592651367, "global_step": 260822, "epoch": 3142} {"train_loss": -24.87706756591797, "global_step": 260823, "epoch": 3142} {"train_loss": -25.156538009643555, "global_step": 260824, "epoch": 3142} {"train_loss": -25.551898956298828, "global_step": 260825, "epoch": 3142} {"train_loss": -25.47649574279785, "global_step": 260826, "epoch": 3142} {"train_loss": -25.285512924194336, "global_step": 260827, "epoch": 3142} {"train_loss": -25.50351333618164, "global_step": 260828, "epoch": 3142} {"train_loss": -25.105100631713867, "global_step": 260829, "epoch": 3142} {"train_loss": -25.498075485229492, "global_step": 260830, "epoch": 3142} {"train_loss": -25.202295303344727, "global_step": 260831, "epoch": 3142} {"train_loss": -25.15015983581543, "global_step": 260832, "epoch": 3142} {"train_loss": -24.963775634765625, "global_step": 260833, "epoch": 3142} {"train_loss": -25.13458251953125, "global_step": 260834, "epoch": 3142} {"train_loss": -25.417789459228516, "global_step": 260835, "epoch": 3142} {"train_loss": -25.198801040649414, "global_step": 260836, "epoch": 3142} {"train_loss": -25.173770904541016, "global_step": 260837, "epoch": 3142} {"train_loss": -24.83982276916504, "global_step": 260838, "epoch": 3142} {"train_loss": -25.084218978881836, "global_step": 260839, "epoch": 3142} {"train_loss": -24.855031967163086, "global_step": 260840, "epoch": 3142} {"train_loss": -25.319150924682617, "global_step": 260841, "epoch": 3142} {"train_loss": -24.969343185424805, "global_step": 260842, "epoch": 3142} {"train_loss": -25.30536460876465, "global_step": 260843, "epoch": 3142} {"train_loss": -25.352880477905273, "global_step": 260844, "epoch": 3142} {"train_loss": -24.939537048339844, "global_step": 260845, "epoch": 3142} {"train_loss": -25.332809448242188, "global_step": 260846, "epoch": 3142} {"train_loss": -25.017160415649414, "global_step": 260847, "epoch": 3142} {"train_loss": -25.137939453125, "global_step": 260848, "epoch": 3142} {"train_loss": -24.3741512298584, "global_step": 260849, "epoch": 3142} {"train_loss": -24.870161056518555, "global_step": 260850, "epoch": 3142} {"train_loss": -25.005924224853516, "global_step": 260851, "epoch": 3142} {"train_loss": -24.978046417236328, "global_step": 260852, "epoch": 3142} {"train_loss": -25.102521896362305, "global_step": 260853, "epoch": 3142} {"train_loss": -25.112401962280273, "global_step": 260854, "epoch": 3142} {"train_loss": -25.336746215820312, "global_step": 260855, "epoch": 3142} {"train_loss": -24.71477699279785, "global_step": 260856, "epoch": 3142} {"train_loss": -24.793567657470703, "global_step": 260857, "epoch": 3142} {"train_loss": -25.061187744140625, "global_step": 260858, "epoch": 3142} {"train_loss": -25.16080093383789, "global_step": 260859, "epoch": 3142} {"train_loss": -25.381811141967773, "global_step": 260860, "epoch": 3142} {"train_loss": -24.81304168701172, "global_step": 260861, "epoch": 3142} {"train_loss": -24.841867446899414, "global_step": 260862, "epoch": 3142} {"train_loss": -24.97266960144043, "global_step": 260863, "epoch": 3142} {"train_loss": -25.271265029907227, "global_step": 260864, "epoch": 3142} {"train_loss": -25.224395751953125, "global_step": 260865, "epoch": 3142} {"train_loss": -25.192108154296875, "global_step": 260866, "epoch": 3142} {"train_loss": -25.003690719604492, "global_step": 260867, "epoch": 3142} {"train_loss": -24.922527313232422, "global_step": 260868, "epoch": 3142, "val_loss": 6908880.0} {"train_loss": -23.459012985229492, "global_step": 260869, "epoch": 3143} {"train_loss": -23.772109985351562, "global_step": 260870, "epoch": 3143} {"train_loss": -24.861526489257812, "global_step": 260871, "epoch": 3143} {"train_loss": -24.657520294189453, "global_step": 260872, "epoch": 3143} {"train_loss": -25.23488426208496, "global_step": 260873, "epoch": 3143} {"train_loss": -24.225427627563477, "global_step": 260874, "epoch": 3143} {"train_loss": -24.52565574645996, "global_step": 260875, "epoch": 3143} {"train_loss": -24.69150161743164, "global_step": 260876, "epoch": 3143} {"train_loss": -24.6274471282959, "global_step": 260877, "epoch": 3143} {"train_loss": -24.540359497070312, "global_step": 260878, "epoch": 3143} {"train_loss": -25.0423583984375, "global_step": 260879, "epoch": 3143} {"train_loss": -24.970264434814453, "global_step": 260880, "epoch": 3143} {"train_loss": -24.703128814697266, "global_step": 260881, "epoch": 3143} {"train_loss": -24.621810913085938, "global_step": 260882, "epoch": 3143} {"train_loss": -25.2907772064209, "global_step": 260883, "epoch": 3143} {"train_loss": -24.927791595458984, "global_step": 260884, "epoch": 3143} {"train_loss": -25.276458740234375, "global_step": 260885, "epoch": 3143} {"train_loss": -25.1864013671875, "global_step": 260886, "epoch": 3143} {"train_loss": -24.69147300720215, "global_step": 260887, "epoch": 3143} {"train_loss": -25.09480094909668, "global_step": 260888, "epoch": 3143} {"train_loss": -25.212657928466797, "global_step": 260889, "epoch": 3143} {"train_loss": -24.71209144592285, "global_step": 260890, "epoch": 3143} {"train_loss": -25.236276626586914, "global_step": 260891, "epoch": 3143} {"train_loss": -24.831235885620117, "global_step": 260892, "epoch": 3143} {"train_loss": -25.04363441467285, "global_step": 260893, "epoch": 3143} {"train_loss": -24.83240509033203, "global_step": 260894, "epoch": 3143} {"train_loss": -25.538299560546875, "global_step": 260895, "epoch": 3143} {"train_loss": -24.818073272705078, "global_step": 260896, "epoch": 3143} {"train_loss": -25.314985275268555, "global_step": 260897, "epoch": 3143} {"train_loss": -25.085920333862305, "global_step": 260898, "epoch": 3143} {"train_loss": -25.326370239257812, "global_step": 260899, "epoch": 3143} {"train_loss": -25.01506996154785, "global_step": 260900, "epoch": 3143} {"train_loss": -25.325408935546875, "global_step": 260901, "epoch": 3143} {"train_loss": -24.73769187927246, "global_step": 260902, "epoch": 3143} {"train_loss": -25.187559127807617, "global_step": 260903, "epoch": 3143} {"train_loss": -25.146345138549805, "global_step": 260904, "epoch": 3143} {"train_loss": -25.250940322875977, "global_step": 260905, "epoch": 3143} {"train_loss": -25.140823364257812, "global_step": 260906, "epoch": 3143} {"train_loss": -25.3765869140625, "global_step": 260907, "epoch": 3143} {"train_loss": -25.056865692138672, "global_step": 260908, "epoch": 3143} {"train_loss": -25.02308464050293, "global_step": 260909, "epoch": 3143} {"train_loss": -25.358753204345703, "global_step": 260910, "epoch": 3143} {"train_loss": -25.04619598388672, "global_step": 260911, "epoch": 3143} {"train_loss": -25.205554962158203, "global_step": 260912, "epoch": 3143} {"train_loss": -25.193527221679688, "global_step": 260913, "epoch": 3143} {"train_loss": -25.360675811767578, "global_step": 260914, "epoch": 3143} {"train_loss": -25.1607666015625, "global_step": 260915, "epoch": 3143} {"train_loss": -25.373762130737305, "global_step": 260916, "epoch": 3143} {"train_loss": -25.580224990844727, "global_step": 260917, "epoch": 3143} {"train_loss": -25.50713539123535, "global_step": 260918, "epoch": 3143} {"train_loss": -25.120426177978516, "global_step": 260919, "epoch": 3143} {"train_loss": -25.198205947875977, "global_step": 260920, "epoch": 3143} {"train_loss": -25.124908447265625, "global_step": 260921, "epoch": 3143} {"train_loss": -24.860349655151367, "global_step": 260922, "epoch": 3143} {"train_loss": -25.076169967651367, "global_step": 260923, "epoch": 3143} {"train_loss": -24.916202545166016, "global_step": 260924, "epoch": 3143} {"train_loss": -24.8597469329834, "global_step": 260925, "epoch": 3143} {"train_loss": -25.422388076782227, "global_step": 260926, "epoch": 3143} {"train_loss": -25.112091064453125, "global_step": 260927, "epoch": 3143} {"train_loss": -24.937467575073242, "global_step": 260928, "epoch": 3143} {"train_loss": -24.928022384643555, "global_step": 260929, "epoch": 3143} {"train_loss": -25.106918334960938, "global_step": 260930, "epoch": 3143} {"train_loss": -25.257963180541992, "global_step": 260931, "epoch": 3143} {"train_loss": -25.497634887695312, "global_step": 260932, "epoch": 3143} {"train_loss": -25.167675018310547, "global_step": 260933, "epoch": 3143} {"train_loss": -25.08220863342285, "global_step": 260934, "epoch": 3143} {"train_loss": -25.25836753845215, "global_step": 260935, "epoch": 3143} {"train_loss": -25.07374382019043, "global_step": 260936, "epoch": 3143} {"train_loss": -25.206974029541016, "global_step": 260937, "epoch": 3143} {"train_loss": -25.47530174255371, "global_step": 260938, "epoch": 3143} {"train_loss": -25.166147232055664, "global_step": 260939, "epoch": 3143} {"train_loss": -24.683332443237305, "global_step": 260940, "epoch": 3143} {"train_loss": -24.8969783782959, "global_step": 260941, "epoch": 3143} {"train_loss": -25.224872589111328, "global_step": 260942, "epoch": 3143} {"train_loss": -25.249967575073242, "global_step": 260943, "epoch": 3143} {"train_loss": -25.218852996826172, "global_step": 260944, "epoch": 3143} {"train_loss": -25.189037322998047, "global_step": 260945, "epoch": 3143} {"train_loss": -25.236141204833984, "global_step": 260946, "epoch": 3143} {"train_loss": -24.742630004882812, "global_step": 260947, "epoch": 3143} {"train_loss": -25.066389083862305, "global_step": 260948, "epoch": 3143} {"train_loss": -25.208751678466797, "global_step": 260949, "epoch": 3143} {"train_loss": -25.114185333251953, "global_step": 260950, "epoch": 3143} {"train_loss": -25.030470652752612, "global_step": 260951, "epoch": 3143, "val_loss": 6825511.0} {"train_loss": -23.972227096557617, "global_step": 260952, "epoch": 3144} {"train_loss": -24.844013214111328, "global_step": 260953, "epoch": 3144} {"train_loss": -24.932743072509766, "global_step": 260954, "epoch": 3144} {"train_loss": -23.890703201293945, "global_step": 260955, "epoch": 3144} {"train_loss": -25.00506591796875, "global_step": 260956, "epoch": 3144} {"train_loss": -24.561288833618164, "global_step": 260957, "epoch": 3144} {"train_loss": -24.645830154418945, "global_step": 260958, "epoch": 3144} {"train_loss": -25.10209846496582, "global_step": 260959, "epoch": 3144} {"train_loss": -24.711774826049805, "global_step": 260960, "epoch": 3144} {"train_loss": -24.572458267211914, "global_step": 260961, "epoch": 3144} {"train_loss": -24.783689498901367, "global_step": 260962, "epoch": 3144} {"train_loss": -24.891321182250977, "global_step": 260963, "epoch": 3144} {"train_loss": -24.54206657409668, "global_step": 260964, "epoch": 3144} {"train_loss": -24.851919174194336, "global_step": 260965, "epoch": 3144} {"train_loss": -24.569746017456055, "global_step": 260966, "epoch": 3144} {"train_loss": -25.490833282470703, "global_step": 260967, "epoch": 3144} {"train_loss": -25.266992568969727, "global_step": 260968, "epoch": 3144} {"train_loss": -24.882986068725586, "global_step": 260969, "epoch": 3144} {"train_loss": -25.132678985595703, "global_step": 260970, "epoch": 3144} {"train_loss": -25.085742950439453, "global_step": 260971, "epoch": 3144} {"train_loss": -25.116270065307617, "global_step": 260972, "epoch": 3144} {"train_loss": -24.658044815063477, "global_step": 260973, "epoch": 3144} {"train_loss": -25.408864974975586, "global_step": 260974, "epoch": 3144} {"train_loss": -25.379117965698242, "global_step": 260975, "epoch": 3144} {"train_loss": -24.819387435913086, "global_step": 260976, "epoch": 3144} {"train_loss": -25.224197387695312, "global_step": 260977, "epoch": 3144} {"train_loss": -25.245208740234375, "global_step": 260978, "epoch": 3144} {"train_loss": -25.47159194946289, "global_step": 260979, "epoch": 3144} {"train_loss": -25.01136589050293, "global_step": 260980, "epoch": 3144} {"train_loss": -25.134260177612305, "global_step": 260981, "epoch": 3144} {"train_loss": -25.135385513305664, "global_step": 260982, "epoch": 3144} {"train_loss": -25.2031307220459, "global_step": 260983, "epoch": 3144} {"train_loss": -25.439313888549805, "global_step": 260984, "epoch": 3144} {"train_loss": -25.24925994873047, "global_step": 260985, "epoch": 3144} {"train_loss": -25.273681640625, "global_step": 260986, "epoch": 3144} {"train_loss": -25.33539390563965, "global_step": 260987, "epoch": 3144} {"train_loss": -25.51751136779785, "global_step": 260988, "epoch": 3144} {"train_loss": -25.30728530883789, "global_step": 260989, "epoch": 3144} {"train_loss": -25.245023727416992, "global_step": 260990, "epoch": 3144} {"train_loss": -25.2569522857666, "global_step": 260991, "epoch": 3144} {"train_loss": -25.52684783935547, "global_step": 260992, "epoch": 3144} {"train_loss": -25.3732852935791, "global_step": 260993, "epoch": 3144} {"train_loss": -25.215227127075195, "global_step": 260994, "epoch": 3144} {"train_loss": -25.633886337280273, "global_step": 260995, "epoch": 3144} {"train_loss": -24.924686431884766, "global_step": 260996, "epoch": 3144} {"train_loss": -25.54445457458496, "global_step": 260997, "epoch": 3144} {"train_loss": -24.9602108001709, "global_step": 260998, "epoch": 3144} {"train_loss": -25.065942764282227, "global_step": 260999, "epoch": 3144} {"train_loss": -25.415002822875977, "global_step": 261000, "epoch": 3144} {"train_loss": -25.311254501342773, "global_step": 261001, "epoch": 3144} {"train_loss": -25.061918258666992, "global_step": 261002, "epoch": 3144} {"train_loss": -24.819889068603516, "global_step": 261003, "epoch": 3144} {"train_loss": -24.726741790771484, "global_step": 261004, "epoch": 3144} {"train_loss": -25.00286865234375, "global_step": 261005, "epoch": 3144} {"train_loss": -24.86175537109375, "global_step": 261006, "epoch": 3144} {"train_loss": -25.512434005737305, "global_step": 261007, "epoch": 3144} {"train_loss": -25.032176971435547, "global_step": 261008, "epoch": 3144} {"train_loss": -24.71626853942871, "global_step": 261009, "epoch": 3144} {"train_loss": -25.330503463745117, "global_step": 261010, "epoch": 3144} {"train_loss": -24.97210693359375, "global_step": 261011, "epoch": 3144} {"train_loss": -24.779544830322266, "global_step": 261012, "epoch": 3144} {"train_loss": -25.15895652770996, "global_step": 261013, "epoch": 3144} {"train_loss": -25.106992721557617, "global_step": 261014, "epoch": 3144} {"train_loss": -24.898109436035156, "global_step": 261015, "epoch": 3144} {"train_loss": -25.084396362304688, "global_step": 261016, "epoch": 3144} {"train_loss": -25.114667892456055, "global_step": 261017, "epoch": 3144} {"train_loss": -24.943449020385742, "global_step": 261018, "epoch": 3144} {"train_loss": -24.817005157470703, "global_step": 261019, "epoch": 3144} {"train_loss": -24.850324630737305, "global_step": 261020, "epoch": 3144} {"train_loss": -25.027353286743164, "global_step": 261021, "epoch": 3144} {"train_loss": -25.07356071472168, "global_step": 261022, "epoch": 3144} {"train_loss": -25.152973175048828, "global_step": 261023, "epoch": 3144} {"train_loss": -24.979246139526367, "global_step": 261024, "epoch": 3144} {"train_loss": -25.1066837310791, "global_step": 261025, "epoch": 3144} {"train_loss": -25.3080997467041, "global_step": 261026, "epoch": 3144} {"train_loss": -25.17612075805664, "global_step": 261027, "epoch": 3144} {"train_loss": -24.98417854309082, "global_step": 261028, "epoch": 3144} {"train_loss": -24.93167495727539, "global_step": 261029, "epoch": 3144} {"train_loss": -24.83916664123535, "global_step": 261030, "epoch": 3144} {"train_loss": -25.26336669921875, "global_step": 261031, "epoch": 3144} {"train_loss": -25.04733657836914, "global_step": 261032, "epoch": 3144} {"train_loss": -25.12347984313965, "global_step": 261033, "epoch": 3144} {"train_loss": -25.034812582544532, "global_step": 261034, "epoch": 3144, "val_loss": 6986127.0} {"train_loss": -24.570362091064453, "global_step": 261035, "epoch": 3145} {"train_loss": -24.347700119018555, "global_step": 261036, "epoch": 3145} {"train_loss": -24.52997398376465, "global_step": 261037, "epoch": 3145} {"train_loss": -24.35579490661621, "global_step": 261038, "epoch": 3145} {"train_loss": -24.532804489135742, "global_step": 261039, "epoch": 3145} {"train_loss": -24.81574058532715, "global_step": 261040, "epoch": 3145} {"train_loss": -24.458763122558594, "global_step": 261041, "epoch": 3145} {"train_loss": -24.899246215820312, "global_step": 261042, "epoch": 3145} {"train_loss": -24.838884353637695, "global_step": 261043, "epoch": 3145} {"train_loss": -24.614355087280273, "global_step": 261044, "epoch": 3145} {"train_loss": -24.77212142944336, "global_step": 261045, "epoch": 3145} {"train_loss": -24.660520553588867, "global_step": 261046, "epoch": 3145} {"train_loss": -24.823104858398438, "global_step": 261047, "epoch": 3145} {"train_loss": -24.819774627685547, "global_step": 261048, "epoch": 3145} {"train_loss": -24.671222686767578, "global_step": 261049, "epoch": 3145} {"train_loss": -25.30241584777832, "global_step": 261050, "epoch": 3145} {"train_loss": -25.05443572998047, "global_step": 261051, "epoch": 3145} {"train_loss": -24.803543090820312, "global_step": 261052, "epoch": 3145} {"train_loss": -25.226322174072266, "global_step": 261053, "epoch": 3145} {"train_loss": -25.043943405151367, "global_step": 261054, "epoch": 3145} {"train_loss": -24.844812393188477, "global_step": 261055, "epoch": 3145} {"train_loss": -25.269861221313477, "global_step": 261056, "epoch": 3145} {"train_loss": -25.035751342773438, "global_step": 261057, "epoch": 3145} {"train_loss": -25.149442672729492, "global_step": 261058, "epoch": 3145} {"train_loss": -25.634632110595703, "global_step": 261059, "epoch": 3145} {"train_loss": -25.065439224243164, "global_step": 261060, "epoch": 3145} {"train_loss": -25.174875259399414, "global_step": 261061, "epoch": 3145} {"train_loss": -25.30064582824707, "global_step": 261062, "epoch": 3145} {"train_loss": -25.01058006286621, "global_step": 261063, "epoch": 3145} {"train_loss": -25.46539306640625, "global_step": 261064, "epoch": 3145} {"train_loss": -25.011608123779297, "global_step": 261065, "epoch": 3145} {"train_loss": -25.190425872802734, "global_step": 261066, "epoch": 3145} {"train_loss": -25.231393814086914, "global_step": 261067, "epoch": 3145} {"train_loss": -25.526166915893555, "global_step": 261068, "epoch": 3145} {"train_loss": -25.07082748413086, "global_step": 261069, "epoch": 3145} {"train_loss": -25.529247283935547, "global_step": 261070, "epoch": 3145} {"train_loss": -24.890945434570312, "global_step": 261071, "epoch": 3145} {"train_loss": -25.474536895751953, "global_step": 261072, "epoch": 3145} {"train_loss": -25.23639488220215, "global_step": 261073, "epoch": 3145} {"train_loss": -25.62196922302246, "global_step": 261074, "epoch": 3145} {"train_loss": -25.10872459411621, "global_step": 261075, "epoch": 3145} {"train_loss": -25.323476791381836, "global_step": 261076, "epoch": 3145} {"train_loss": -25.56757926940918, "global_step": 261077, "epoch": 3145} {"train_loss": -25.131332397460938, "global_step": 261078, "epoch": 3145} {"train_loss": -25.1291446685791, "global_step": 261079, "epoch": 3145} {"train_loss": -25.590238571166992, "global_step": 261080, "epoch": 3145} {"train_loss": -25.1569881439209, "global_step": 261081, "epoch": 3145} {"train_loss": -25.6502742767334, "global_step": 261082, "epoch": 3145} {"train_loss": -25.364383697509766, "global_step": 261083, "epoch": 3145} {"train_loss": -25.34091567993164, "global_step": 261084, "epoch": 3145} {"train_loss": -24.731184005737305, "global_step": 261085, "epoch": 3145} {"train_loss": -24.914762496948242, "global_step": 261086, "epoch": 3145} {"train_loss": -25.108844757080078, "global_step": 261087, "epoch": 3145} {"train_loss": -25.225027084350586, "global_step": 261088, "epoch": 3145} {"train_loss": -25.3443660736084, "global_step": 261089, "epoch": 3145} {"train_loss": -25.409015655517578, "global_step": 261090, "epoch": 3145} {"train_loss": -25.260238647460938, "global_step": 261091, "epoch": 3145} {"train_loss": -25.25177764892578, "global_step": 261092, "epoch": 3145} {"train_loss": -25.531335830688477, "global_step": 261093, "epoch": 3145} {"train_loss": -25.187702178955078, "global_step": 261094, "epoch": 3145} {"train_loss": -25.2380428314209, "global_step": 261095, "epoch": 3145} {"train_loss": -25.45415496826172, "global_step": 261096, "epoch": 3145} {"train_loss": -25.398588180541992, "global_step": 261097, "epoch": 3145} {"train_loss": -25.329288482666016, "global_step": 261098, "epoch": 3145} {"train_loss": -25.73553466796875, "global_step": 261099, "epoch": 3145} {"train_loss": -25.17327308654785, "global_step": 261100, "epoch": 3145} {"train_loss": -25.359390258789062, "global_step": 261101, "epoch": 3145} {"train_loss": -25.227298736572266, "global_step": 261102, "epoch": 3145} {"train_loss": -25.411428451538086, "global_step": 261103, "epoch": 3145} {"train_loss": -25.46245574951172, "global_step": 261104, "epoch": 3145} {"train_loss": -25.286054611206055, "global_step": 261105, "epoch": 3145} {"train_loss": -25.017724990844727, "global_step": 261106, "epoch": 3145} {"train_loss": -25.064725875854492, "global_step": 261107, "epoch": 3145} {"train_loss": -25.094181060791016, "global_step": 261108, "epoch": 3145} {"train_loss": -25.499326705932617, "global_step": 261109, "epoch": 3145} {"train_loss": -24.853479385375977, "global_step": 261110, "epoch": 3145} {"train_loss": -24.822635650634766, "global_step": 261111, "epoch": 3145} {"train_loss": -25.051015853881836, "global_step": 261112, "epoch": 3145} {"train_loss": -25.537099838256836, "global_step": 261113, "epoch": 3145} {"train_loss": -24.867895126342773, "global_step": 261114, "epoch": 3145} {"train_loss": -24.94656753540039, "global_step": 261115, "epoch": 3145} {"train_loss": -24.178970336914062, "global_step": 261116, "epoch": 3145} {"train_loss": -25.113629536456372, "global_step": 261117, "epoch": 3145, "val_loss": 6890095.0} {"train_loss": -24.772506713867188, "global_step": 261118, "epoch": 3146} {"train_loss": -23.75751304626465, "global_step": 261119, "epoch": 3146} {"train_loss": -23.977102279663086, "global_step": 261120, "epoch": 3146} {"train_loss": -24.49350357055664, "global_step": 261121, "epoch": 3146} {"train_loss": -23.693004608154297, "global_step": 261122, "epoch": 3146} {"train_loss": -24.702280044555664, "global_step": 261123, "epoch": 3146} {"train_loss": -23.883014678955078, "global_step": 261124, "epoch": 3146} {"train_loss": -23.502439498901367, "global_step": 261125, "epoch": 3146} {"train_loss": -24.15155601501465, "global_step": 261126, "epoch": 3146} {"train_loss": -23.860986709594727, "global_step": 261127, "epoch": 3146} {"train_loss": -24.383481979370117, "global_step": 261128, "epoch": 3146} {"train_loss": -24.212757110595703, "global_step": 261129, "epoch": 3146} {"train_loss": -24.387365341186523, "global_step": 261130, "epoch": 3146} {"train_loss": -24.168746948242188, "global_step": 261131, "epoch": 3146} {"train_loss": -24.163854598999023, "global_step": 261132, "epoch": 3146} {"train_loss": -24.301593780517578, "global_step": 261133, "epoch": 3146} {"train_loss": -24.514053344726562, "global_step": 261134, "epoch": 3146} {"train_loss": -24.59076499938965, "global_step": 261135, "epoch": 3146} {"train_loss": -24.60028648376465, "global_step": 261136, "epoch": 3146} {"train_loss": -24.299325942993164, "global_step": 261137, "epoch": 3146} {"train_loss": -24.334150314331055, "global_step": 261138, "epoch": 3146} {"train_loss": -24.690893173217773, "global_step": 261139, "epoch": 3146} {"train_loss": -24.680631637573242, "global_step": 261140, "epoch": 3146} {"train_loss": -24.74208641052246, "global_step": 261141, "epoch": 3146} {"train_loss": -24.361013412475586, "global_step": 261142, "epoch": 3146} {"train_loss": -24.76998519897461, "global_step": 261143, "epoch": 3146} {"train_loss": -24.900606155395508, "global_step": 261144, "epoch": 3146} {"train_loss": -24.524381637573242, "global_step": 261145, "epoch": 3146} {"train_loss": -25.08660888671875, "global_step": 261146, "epoch": 3146} {"train_loss": -25.095598220825195, "global_step": 261147, "epoch": 3146} {"train_loss": -24.952579498291016, "global_step": 261148, "epoch": 3146} {"train_loss": -24.847461700439453, "global_step": 261149, "epoch": 3146} {"train_loss": -24.751237869262695, "global_step": 261150, "epoch": 3146} {"train_loss": -25.142040252685547, "global_step": 261151, "epoch": 3146} {"train_loss": -25.132856369018555, "global_step": 261152, "epoch": 3146} {"train_loss": -25.10662078857422, "global_step": 261153, "epoch": 3146} {"train_loss": -25.03632354736328, "global_step": 261154, "epoch": 3146} {"train_loss": -25.260711669921875, "global_step": 261155, "epoch": 3146} {"train_loss": -25.171972274780273, "global_step": 261156, "epoch": 3146} {"train_loss": -25.165719985961914, "global_step": 261157, "epoch": 3146} {"train_loss": -25.206289291381836, "global_step": 261158, "epoch": 3146} {"train_loss": -25.206378936767578, "global_step": 261159, "epoch": 3146} {"train_loss": -25.065845489501953, "global_step": 261160, "epoch": 3146} {"train_loss": -25.323972702026367, "global_step": 261161, "epoch": 3146} {"train_loss": -25.05684471130371, "global_step": 261162, "epoch": 3146} {"train_loss": -25.38925552368164, "global_step": 261163, "epoch": 3146} {"train_loss": -25.503721237182617, "global_step": 261164, "epoch": 3146} {"train_loss": -25.308120727539062, "global_step": 261165, "epoch": 3146} {"train_loss": -25.06354331970215, "global_step": 261166, "epoch": 3146} {"train_loss": -25.46894645690918, "global_step": 261167, "epoch": 3146} {"train_loss": -25.47722053527832, "global_step": 261168, "epoch": 3146} {"train_loss": -25.072649002075195, "global_step": 261169, "epoch": 3146} {"train_loss": -25.517528533935547, "global_step": 261170, "epoch": 3146} {"train_loss": -25.014358520507812, "global_step": 261171, "epoch": 3146} {"train_loss": -25.535140991210938, "global_step": 261172, "epoch": 3146} {"train_loss": -25.2087459564209, "global_step": 261173, "epoch": 3146} {"train_loss": -25.296768188476562, "global_step": 261174, "epoch": 3146} {"train_loss": -25.499439239501953, "global_step": 261175, "epoch": 3146} {"train_loss": -24.92231559753418, "global_step": 261176, "epoch": 3146} {"train_loss": -25.204429626464844, "global_step": 261177, "epoch": 3146} {"train_loss": -25.118427276611328, "global_step": 261178, "epoch": 3146} {"train_loss": -25.42072105407715, "global_step": 261179, "epoch": 3146} {"train_loss": -24.863605499267578, "global_step": 261180, "epoch": 3146} {"train_loss": -25.212936401367188, "global_step": 261181, "epoch": 3146} {"train_loss": -24.66044044494629, "global_step": 261182, "epoch": 3146} {"train_loss": -25.193466186523438, "global_step": 261183, "epoch": 3146} {"train_loss": -25.001840591430664, "global_step": 261184, "epoch": 3146} {"train_loss": -25.13519859313965, "global_step": 261185, "epoch": 3146} {"train_loss": -24.904401779174805, "global_step": 261186, "epoch": 3146} {"train_loss": -25.34571647644043, "global_step": 261187, "epoch": 3146} {"train_loss": -25.10102653503418, "global_step": 261188, "epoch": 3146} {"train_loss": -25.36969566345215, "global_step": 261189, "epoch": 3146} {"train_loss": -25.21217918395996, "global_step": 261190, "epoch": 3146} {"train_loss": -24.983190536499023, "global_step": 261191, "epoch": 3146} {"train_loss": -25.31340217590332, "global_step": 261192, "epoch": 3146} {"train_loss": -25.29636001586914, "global_step": 261193, "epoch": 3146} {"train_loss": -25.181915283203125, "global_step": 261194, "epoch": 3146} {"train_loss": -25.32073974609375, "global_step": 261195, "epoch": 3146} {"train_loss": -25.26460838317871, "global_step": 261196, "epoch": 3146} {"train_loss": -25.146886825561523, "global_step": 261197, "epoch": 3146} {"train_loss": -24.762252807617188, "global_step": 261198, "epoch": 3146} {"train_loss": -25.58097267150879, "global_step": 261199, "epoch": 3146} {"train_loss": -24.87874228695789, "global_step": 261200, "epoch": 3146, "val_loss": 6971149.0} {"train_loss": -24.68172264099121, "global_step": 261201, "epoch": 3147} {"train_loss": -24.518945693969727, "global_step": 261202, "epoch": 3147} {"train_loss": -24.602636337280273, "global_step": 261203, "epoch": 3147} {"train_loss": -24.091825485229492, "global_step": 261204, "epoch": 3147} {"train_loss": -23.907546997070312, "global_step": 261205, "epoch": 3147} {"train_loss": -24.706571578979492, "global_step": 261206, "epoch": 3147} {"train_loss": -24.856250762939453, "global_step": 261207, "epoch": 3147} {"train_loss": -24.231578826904297, "global_step": 261208, "epoch": 3147} {"train_loss": -24.7763729095459, "global_step": 261209, "epoch": 3147} {"train_loss": -24.44437026977539, "global_step": 261210, "epoch": 3147} {"train_loss": -24.403488159179688, "global_step": 261211, "epoch": 3147} {"train_loss": -24.95762062072754, "global_step": 261212, "epoch": 3147} {"train_loss": -24.651334762573242, "global_step": 261213, "epoch": 3147} {"train_loss": -24.780866622924805, "global_step": 261214, "epoch": 3147} {"train_loss": -25.01955795288086, "global_step": 261215, "epoch": 3147} {"train_loss": -24.564584732055664, "global_step": 261216, "epoch": 3147} {"train_loss": -25.440326690673828, "global_step": 261217, "epoch": 3147} {"train_loss": -25.043203353881836, "global_step": 261218, "epoch": 3147} {"train_loss": -25.158445358276367, "global_step": 261219, "epoch": 3147} {"train_loss": -24.93421745300293, "global_step": 261220, "epoch": 3147} {"train_loss": -25.063007354736328, "global_step": 261221, "epoch": 3147} {"train_loss": -25.048816680908203, "global_step": 261222, "epoch": 3147} {"train_loss": -24.843515396118164, "global_step": 261223, "epoch": 3147} {"train_loss": -25.49022674560547, "global_step": 261224, "epoch": 3147} {"train_loss": -24.54265785217285, "global_step": 261225, "epoch": 3147} {"train_loss": -24.9442138671875, "global_step": 261226, "epoch": 3147} {"train_loss": -25.232742309570312, "global_step": 261227, "epoch": 3147} {"train_loss": -25.338144302368164, "global_step": 261228, "epoch": 3147} {"train_loss": -25.260854721069336, "global_step": 261229, "epoch": 3147} {"train_loss": -25.154218673706055, "global_step": 261230, "epoch": 3147} {"train_loss": -25.269817352294922, "global_step": 261231, "epoch": 3147} {"train_loss": -25.33286476135254, "global_step": 261232, "epoch": 3147} {"train_loss": -25.24281883239746, "global_step": 261233, "epoch": 3147} {"train_loss": -24.990123748779297, "global_step": 261234, "epoch": 3147} {"train_loss": -25.46417808532715, "global_step": 261235, "epoch": 3147} {"train_loss": -24.948423385620117, "global_step": 261236, "epoch": 3147} {"train_loss": -25.208528518676758, "global_step": 261237, "epoch": 3147} {"train_loss": -25.276859283447266, "global_step": 261238, "epoch": 3147} {"train_loss": -25.4190731048584, "global_step": 261239, "epoch": 3147} {"train_loss": -25.157556533813477, "global_step": 261240, "epoch": 3147} {"train_loss": -25.240102767944336, "global_step": 261241, "epoch": 3147} {"train_loss": -25.161874771118164, "global_step": 261242, "epoch": 3147} {"train_loss": -25.539173126220703, "global_step": 261243, "epoch": 3147} {"train_loss": -25.390539169311523, "global_step": 261244, "epoch": 3147} {"train_loss": -25.364368438720703, "global_step": 261245, "epoch": 3147} {"train_loss": -25.714035034179688, "global_step": 261246, "epoch": 3147} {"train_loss": -25.427213668823242, "global_step": 261247, "epoch": 3147} {"train_loss": -25.1033992767334, "global_step": 261248, "epoch": 3147} {"train_loss": -25.127918243408203, "global_step": 261249, "epoch": 3147} {"train_loss": -25.29034996032715, "global_step": 261250, "epoch": 3147} {"train_loss": -25.2357177734375, "global_step": 261251, "epoch": 3147} {"train_loss": -25.558517456054688, "global_step": 261252, "epoch": 3147} {"train_loss": -25.161968231201172, "global_step": 261253, "epoch": 3147} {"train_loss": -25.357511520385742, "global_step": 261254, "epoch": 3147} {"train_loss": -25.228025436401367, "global_step": 261255, "epoch": 3147} {"train_loss": -25.269359588623047, "global_step": 261256, "epoch": 3147} {"train_loss": -24.853940963745117, "global_step": 261257, "epoch": 3147} {"train_loss": -25.2037410736084, "global_step": 261258, "epoch": 3147} {"train_loss": -25.30560874938965, "global_step": 261259, "epoch": 3147} {"train_loss": -25.098485946655273, "global_step": 261260, "epoch": 3147} {"train_loss": -25.151111602783203, "global_step": 261261, "epoch": 3147} {"train_loss": -25.20829963684082, "global_step": 261262, "epoch": 3147} {"train_loss": -25.127058029174805, "global_step": 261263, "epoch": 3147} {"train_loss": -25.128694534301758, "global_step": 261264, "epoch": 3147} {"train_loss": -25.439922332763672, "global_step": 261265, "epoch": 3147} {"train_loss": -25.513336181640625, "global_step": 261266, "epoch": 3147} {"train_loss": -25.17894172668457, "global_step": 261267, "epoch": 3147} {"train_loss": -25.408533096313477, "global_step": 261268, "epoch": 3147} {"train_loss": -25.380449295043945, "global_step": 261269, "epoch": 3147} {"train_loss": -25.51175308227539, "global_step": 261270, "epoch": 3147} {"train_loss": -25.315954208374023, "global_step": 261271, "epoch": 3147} {"train_loss": -25.26721954345703, "global_step": 261272, "epoch": 3147} {"train_loss": -25.17514991760254, "global_step": 261273, "epoch": 3147} {"train_loss": -25.02839469909668, "global_step": 261274, "epoch": 3147} {"train_loss": -24.78314781188965, "global_step": 261275, "epoch": 3147} {"train_loss": -24.879240036010742, "global_step": 261276, "epoch": 3147} {"train_loss": -25.27826690673828, "global_step": 261277, "epoch": 3147} {"train_loss": -25.019027709960938, "global_step": 261278, "epoch": 3147} {"train_loss": -24.566762924194336, "global_step": 261279, "epoch": 3147} {"train_loss": -25.195810317993164, "global_step": 261280, "epoch": 3147} {"train_loss": -25.28458595275879, "global_step": 261281, "epoch": 3147} {"train_loss": -24.842208862304688, "global_step": 261282, "epoch": 3147} {"train_loss": -25.07469149669969, "global_step": 261283, "epoch": 3147, "val_loss": 6953745.5} {"train_loss": -24.766895294189453, "global_step": 261284, "epoch": 3148} {"train_loss": -24.952438354492188, "global_step": 261285, "epoch": 3148} {"train_loss": -24.212364196777344, "global_step": 261286, "epoch": 3148} {"train_loss": -24.350027084350586, "global_step": 261287, "epoch": 3148} {"train_loss": -24.65022087097168, "global_step": 261288, "epoch": 3148} {"train_loss": -24.613910675048828, "global_step": 261289, "epoch": 3148} {"train_loss": -24.20347023010254, "global_step": 261290, "epoch": 3148} {"train_loss": -24.454519271850586, "global_step": 261291, "epoch": 3148} {"train_loss": -24.595428466796875, "global_step": 261292, "epoch": 3148} {"train_loss": -24.716459274291992, "global_step": 261293, "epoch": 3148} {"train_loss": -24.762237548828125, "global_step": 261294, "epoch": 3148} {"train_loss": -24.493711471557617, "global_step": 261295, "epoch": 3148} {"train_loss": -24.41434097290039, "global_step": 261296, "epoch": 3148} {"train_loss": -24.453413009643555, "global_step": 261297, "epoch": 3148} {"train_loss": -24.437297821044922, "global_step": 261298, "epoch": 3148} {"train_loss": -24.594486236572266, "global_step": 261299, "epoch": 3148} {"train_loss": -24.6879940032959, "global_step": 261300, "epoch": 3148} {"train_loss": -24.842737197875977, "global_step": 261301, "epoch": 3148} {"train_loss": -24.877979278564453, "global_step": 261302, "epoch": 3148} {"train_loss": -24.77424430847168, "global_step": 261303, "epoch": 3148} {"train_loss": -24.874330520629883, "global_step": 261304, "epoch": 3148} {"train_loss": -25.058446884155273, "global_step": 261305, "epoch": 3148} {"train_loss": -24.95454216003418, "global_step": 261306, "epoch": 3148} {"train_loss": -25.11672019958496, "global_step": 261307, "epoch": 3148} {"train_loss": -25.08270263671875, "global_step": 261308, "epoch": 3148} {"train_loss": -24.49782943725586, "global_step": 261309, "epoch": 3148} {"train_loss": -25.294713973999023, "global_step": 261310, "epoch": 3148} {"train_loss": -25.320589065551758, "global_step": 261311, "epoch": 3148} {"train_loss": -25.106502532958984, "global_step": 261312, "epoch": 3148} {"train_loss": -25.02156639099121, "global_step": 261313, "epoch": 3148} {"train_loss": -25.288578033447266, "global_step": 261314, "epoch": 3148} {"train_loss": -25.225034713745117, "global_step": 261315, "epoch": 3148} {"train_loss": -24.97791862487793, "global_step": 261316, "epoch": 3148} {"train_loss": -25.47443962097168, "global_step": 261317, "epoch": 3148} {"train_loss": -25.415172576904297, "global_step": 261318, "epoch": 3148} {"train_loss": -25.323911666870117, "global_step": 261319, "epoch": 3148} {"train_loss": -24.88307762145996, "global_step": 261320, "epoch": 3148} {"train_loss": -25.22165870666504, "global_step": 261321, "epoch": 3148} {"train_loss": -25.141605377197266, "global_step": 261322, "epoch": 3148} {"train_loss": -25.435562133789062, "global_step": 261323, "epoch": 3148} {"train_loss": -25.290557861328125, "global_step": 261324, "epoch": 3148} {"train_loss": -25.31132698059082, "global_step": 261325, "epoch": 3148} {"train_loss": -25.35550880432129, "global_step": 261326, "epoch": 3148} {"train_loss": -25.370901107788086, "global_step": 261327, "epoch": 3148} {"train_loss": -25.107315063476562, "global_step": 261328, "epoch": 3148} {"train_loss": -25.215940475463867, "global_step": 261329, "epoch": 3148} {"train_loss": -25.208465576171875, "global_step": 261330, "epoch": 3148} {"train_loss": -25.314186096191406, "global_step": 261331, "epoch": 3148} {"train_loss": -25.06654167175293, "global_step": 261332, "epoch": 3148} {"train_loss": -25.0921688079834, "global_step": 261333, "epoch": 3148} {"train_loss": -25.198806762695312, "global_step": 261334, "epoch": 3148} {"train_loss": -25.059247970581055, "global_step": 261335, "epoch": 3148} {"train_loss": -25.045690536499023, "global_step": 261336, "epoch": 3148} {"train_loss": -25.231473922729492, "global_step": 261337, "epoch": 3148} {"train_loss": -25.2598819732666, "global_step": 261338, "epoch": 3148} {"train_loss": -25.369474411010742, "global_step": 261339, "epoch": 3148} {"train_loss": -25.326868057250977, "global_step": 261340, "epoch": 3148} {"train_loss": -25.064533233642578, "global_step": 261341, "epoch": 3148} {"train_loss": -24.971694946289062, "global_step": 261342, "epoch": 3148} {"train_loss": -25.317890167236328, "global_step": 261343, "epoch": 3148} {"train_loss": -25.080034255981445, "global_step": 261344, "epoch": 3148} {"train_loss": -25.531904220581055, "global_step": 261345, "epoch": 3148} {"train_loss": -25.193832397460938, "global_step": 261346, "epoch": 3148} {"train_loss": -25.270923614501953, "global_step": 261347, "epoch": 3148} {"train_loss": -25.57010841369629, "global_step": 261348, "epoch": 3148} {"train_loss": -25.056900024414062, "global_step": 261349, "epoch": 3148} {"train_loss": -25.18385124206543, "global_step": 261350, "epoch": 3148} {"train_loss": -24.910558700561523, "global_step": 261351, "epoch": 3148} {"train_loss": -25.577123641967773, "global_step": 261352, "epoch": 3148} {"train_loss": -25.26944923400879, "global_step": 261353, "epoch": 3148} {"train_loss": -25.072214126586914, "global_step": 261354, "epoch": 3148} {"train_loss": -25.41777992248535, "global_step": 261355, "epoch": 3148} {"train_loss": -24.815675735473633, "global_step": 261356, "epoch": 3148} {"train_loss": -25.715717315673828, "global_step": 261357, "epoch": 3148} {"train_loss": -25.333772659301758, "global_step": 261358, "epoch": 3148} {"train_loss": -25.189224243164062, "global_step": 261359, "epoch": 3148} {"train_loss": -25.43398094177246, "global_step": 261360, "epoch": 3148} {"train_loss": -24.81903076171875, "global_step": 261361, "epoch": 3148} {"train_loss": -25.7049560546875, "global_step": 261362, "epoch": 3148} {"train_loss": -25.382165908813477, "global_step": 261363, "epoch": 3148} {"train_loss": -25.35038185119629, "global_step": 261364, "epoch": 3148} {"train_loss": -25.260482788085938, "global_step": 261365, "epoch": 3148} {"train_loss": -25.061245355261377, "global_step": 261366, "epoch": 3148, "val_loss": 6759413.0} {"train_loss": -24.07865333557129, "global_step": 261367, "epoch": 3149} {"train_loss": -23.942419052124023, "global_step": 261368, "epoch": 3149} {"train_loss": -23.20545768737793, "global_step": 261369, "epoch": 3149} {"train_loss": -22.653900146484375, "global_step": 261370, "epoch": 3149} {"train_loss": -24.378353118896484, "global_step": 261371, "epoch": 3149} {"train_loss": -23.590898513793945, "global_step": 261372, "epoch": 3149} {"train_loss": -23.425931930541992, "global_step": 261373, "epoch": 3149} {"train_loss": -23.98935890197754, "global_step": 261374, "epoch": 3149} {"train_loss": -24.233739852905273, "global_step": 261375, "epoch": 3149} {"train_loss": -24.075746536254883, "global_step": 261376, "epoch": 3149} {"train_loss": -24.532978057861328, "global_step": 261377, "epoch": 3149} {"train_loss": -24.530004501342773, "global_step": 261378, "epoch": 3149} {"train_loss": -24.312931060791016, "global_step": 261379, "epoch": 3149} {"train_loss": -24.681360244750977, "global_step": 261380, "epoch": 3149} {"train_loss": -24.431032180786133, "global_step": 261381, "epoch": 3149} {"train_loss": -24.713022232055664, "global_step": 261382, "epoch": 3149} {"train_loss": -24.91233253479004, "global_step": 261383, "epoch": 3149} {"train_loss": -24.74873161315918, "global_step": 261384, "epoch": 3149} {"train_loss": -24.356454849243164, "global_step": 261385, "epoch": 3149} {"train_loss": -24.662363052368164, "global_step": 261386, "epoch": 3149} {"train_loss": -24.300193786621094, "global_step": 261387, "epoch": 3149} {"train_loss": -24.638408660888672, "global_step": 261388, "epoch": 3149} {"train_loss": -24.607696533203125, "global_step": 261389, "epoch": 3149} {"train_loss": -24.383878707885742, "global_step": 261390, "epoch": 3149} {"train_loss": -25.04786491394043, "global_step": 261391, "epoch": 3149} {"train_loss": -24.608713150024414, "global_step": 261392, "epoch": 3149} {"train_loss": -24.923755645751953, "global_step": 261393, "epoch": 3149} {"train_loss": -24.711444854736328, "global_step": 261394, "epoch": 3149} {"train_loss": -24.844411849975586, "global_step": 261395, "epoch": 3149} {"train_loss": -25.085891723632812, "global_step": 261396, "epoch": 3149} {"train_loss": -25.312744140625, "global_step": 261397, "epoch": 3149} {"train_loss": -24.846702575683594, "global_step": 261398, "epoch": 3149} {"train_loss": -24.758983612060547, "global_step": 261399, "epoch": 3149} {"train_loss": -25.030906677246094, "global_step": 261400, "epoch": 3149} {"train_loss": -24.819921493530273, "global_step": 261401, "epoch": 3149} {"train_loss": -24.83266258239746, "global_step": 261402, "epoch": 3149} {"train_loss": -24.602724075317383, "global_step": 261403, "epoch": 3149} {"train_loss": -25.26735496520996, "global_step": 261404, "epoch": 3149} {"train_loss": -25.099706649780273, "global_step": 261405, "epoch": 3149} {"train_loss": -24.635761260986328, "global_step": 261406, "epoch": 3149} {"train_loss": -24.869558334350586, "global_step": 261407, "epoch": 3149} {"train_loss": -25.0902042388916, "global_step": 261408, "epoch": 3149} {"train_loss": -25.154356002807617, "global_step": 261409, "epoch": 3149} {"train_loss": -24.945968627929688, "global_step": 261410, "epoch": 3149} {"train_loss": -25.433603286743164, "global_step": 261411, "epoch": 3149} {"train_loss": -25.129758834838867, "global_step": 261412, "epoch": 3149} {"train_loss": -24.88434410095215, "global_step": 261413, "epoch": 3149} {"train_loss": -25.381277084350586, "global_step": 261414, "epoch": 3149} {"train_loss": -25.21636390686035, "global_step": 261415, "epoch": 3149} {"train_loss": -25.08281898498535, "global_step": 261416, "epoch": 3149} {"train_loss": -25.21974754333496, "global_step": 261417, "epoch": 3149} {"train_loss": -24.96124839782715, "global_step": 261418, "epoch": 3149} {"train_loss": -25.304628372192383, "global_step": 261419, "epoch": 3149} {"train_loss": -24.913373947143555, "global_step": 261420, "epoch": 3149} {"train_loss": -24.951663970947266, "global_step": 261421, "epoch": 3149} {"train_loss": -25.42560577392578, "global_step": 261422, "epoch": 3149} {"train_loss": -24.85065269470215, "global_step": 261423, "epoch": 3149} {"train_loss": -24.936498641967773, "global_step": 261424, "epoch": 3149} {"train_loss": -25.22897720336914, "global_step": 261425, "epoch": 3149} {"train_loss": -24.652067184448242, "global_step": 261426, "epoch": 3149} {"train_loss": -25.239368438720703, "global_step": 261427, "epoch": 3149} {"train_loss": -25.18714714050293, "global_step": 261428, "epoch": 3149} {"train_loss": -25.44202995300293, "global_step": 261429, "epoch": 3149} {"train_loss": -25.165433883666992, "global_step": 261430, "epoch": 3149} {"train_loss": -25.147703170776367, "global_step": 261431, "epoch": 3149} {"train_loss": -24.95325469970703, "global_step": 261432, "epoch": 3149} {"train_loss": -25.033004760742188, "global_step": 261433, "epoch": 3149} {"train_loss": -25.06319236755371, "global_step": 261434, "epoch": 3149} {"train_loss": -25.45278549194336, "global_step": 261435, "epoch": 3149} {"train_loss": -24.817859649658203, "global_step": 261436, "epoch": 3149} {"train_loss": -25.02017593383789, "global_step": 261437, "epoch": 3149} {"train_loss": -24.714466094970703, "global_step": 261438, "epoch": 3149} {"train_loss": -25.219331741333008, "global_step": 261439, "epoch": 3149} {"train_loss": -25.31709098815918, "global_step": 261440, "epoch": 3149} {"train_loss": -25.303070068359375, "global_step": 261441, "epoch": 3149} {"train_loss": -25.371437072753906, "global_step": 261442, "epoch": 3149} {"train_loss": -25.225189208984375, "global_step": 261443, "epoch": 3149} {"train_loss": -24.877477645874023, "global_step": 261444, "epoch": 3149} {"train_loss": -25.088245391845703, "global_step": 261445, "epoch": 3149} {"train_loss": -25.147748947143555, "global_step": 261446, "epoch": 3149} {"train_loss": -25.28596305847168, "global_step": 261447, "epoch": 3149} {"train_loss": -25.168806076049805, "global_step": 261448, "epoch": 3149} {"train_loss": -24.79084099918963, "global_step": 261449, "epoch": 3149, "val_loss": 6881517.0} {"train_loss": -22.919553756713867, "global_step": 261450, "epoch": 3150} {"train_loss": -23.84141731262207, "global_step": 261451, "epoch": 3150} {"train_loss": -23.156286239624023, "global_step": 261452, "epoch": 3150} {"train_loss": -24.042890548706055, "global_step": 261453, "epoch": 3150} {"train_loss": -23.54705047607422, "global_step": 261454, "epoch": 3150} {"train_loss": -23.866186141967773, "global_step": 261455, "epoch": 3150} {"train_loss": -23.90276336669922, "global_step": 261456, "epoch": 3150} {"train_loss": -24.08575439453125, "global_step": 261457, "epoch": 3150} {"train_loss": -24.096752166748047, "global_step": 261458, "epoch": 3150} {"train_loss": -24.337299346923828, "global_step": 261459, "epoch": 3150} {"train_loss": -24.84132194519043, "global_step": 261460, "epoch": 3150} {"train_loss": -24.143600463867188, "global_step": 261461, "epoch": 3150} {"train_loss": -24.646636962890625, "global_step": 261462, "epoch": 3150} {"train_loss": -24.61345100402832, "global_step": 261463, "epoch": 3150} {"train_loss": -24.715829849243164, "global_step": 261464, "epoch": 3150} {"train_loss": -24.826171875, "global_step": 261465, "epoch": 3150} {"train_loss": -24.42078971862793, "global_step": 261466, "epoch": 3150} {"train_loss": -24.696115493774414, "global_step": 261467, "epoch": 3150} {"train_loss": -24.92708969116211, "global_step": 261468, "epoch": 3150} {"train_loss": -24.446561813354492, "global_step": 261469, "epoch": 3150} {"train_loss": -24.724374771118164, "global_step": 261470, "epoch": 3150} {"train_loss": -24.422414779663086, "global_step": 261471, "epoch": 3150} {"train_loss": -24.80995750427246, "global_step": 261472, "epoch": 3150} {"train_loss": -24.709304809570312, "global_step": 261473, "epoch": 3150} {"train_loss": -24.652490615844727, "global_step": 261474, "epoch": 3150} {"train_loss": -24.943931579589844, "global_step": 261475, "epoch": 3150} {"train_loss": -24.839279174804688, "global_step": 261476, "epoch": 3150} {"train_loss": -24.89803123474121, "global_step": 261477, "epoch": 3150} {"train_loss": -25.129907608032227, "global_step": 261478, "epoch": 3150} {"train_loss": -25.191564559936523, "global_step": 261479, "epoch": 3150} {"train_loss": -24.985082626342773, "global_step": 261480, "epoch": 3150} {"train_loss": -25.1015682220459, "global_step": 261481, "epoch": 3150} {"train_loss": -25.343603134155273, "global_step": 261482, "epoch": 3150} {"train_loss": -24.76210594177246, "global_step": 261483, "epoch": 3150} {"train_loss": -25.011865615844727, "global_step": 261484, "epoch": 3150} {"train_loss": -25.094064712524414, "global_step": 261485, "epoch": 3150} {"train_loss": -25.296167373657227, "global_step": 261486, "epoch": 3150} {"train_loss": -25.359893798828125, "global_step": 261487, "epoch": 3150} {"train_loss": -25.32957649230957, "global_step": 261488, "epoch": 3150} {"train_loss": -25.284292221069336, "global_step": 261489, "epoch": 3150} {"train_loss": -24.703981399536133, "global_step": 261490, "epoch": 3150} {"train_loss": -25.46862030029297, "global_step": 261491, "epoch": 3150} {"train_loss": -24.79822540283203, "global_step": 261492, "epoch": 3150} {"train_loss": -24.98758888244629, "global_step": 261493, "epoch": 3150} {"train_loss": -25.322336196899414, "global_step": 261494, "epoch": 3150} {"train_loss": -24.77790641784668, "global_step": 261495, "epoch": 3150} {"train_loss": -25.421594619750977, "global_step": 261496, "epoch": 3150} {"train_loss": -25.08704948425293, "global_step": 261497, "epoch": 3150} {"train_loss": -25.024799346923828, "global_step": 261498, "epoch": 3150} {"train_loss": -24.788253784179688, "global_step": 261499, "epoch": 3150} {"train_loss": -25.305715560913086, "global_step": 261500, "epoch": 3150} {"train_loss": -25.311857223510742, "global_step": 261501, "epoch": 3150} {"train_loss": -25.06363868713379, "global_step": 261502, "epoch": 3150} {"train_loss": -25.211231231689453, "global_step": 261503, "epoch": 3150} {"train_loss": -25.205764770507812, "global_step": 261504, "epoch": 3150} {"train_loss": -25.0707950592041, "global_step": 261505, "epoch": 3150} {"train_loss": -25.654876708984375, "global_step": 261506, "epoch": 3150} {"train_loss": -25.4689998626709, "global_step": 261507, "epoch": 3150} {"train_loss": -25.204483032226562, "global_step": 261508, "epoch": 3150} {"train_loss": -25.37281608581543, "global_step": 261509, "epoch": 3150} {"train_loss": -25.0764217376709, "global_step": 261510, "epoch": 3150} {"train_loss": -24.81610679626465, "global_step": 261511, "epoch": 3150} {"train_loss": -24.878822326660156, "global_step": 261512, "epoch": 3150} {"train_loss": -25.455320358276367, "global_step": 261513, "epoch": 3150} {"train_loss": -25.09867286682129, "global_step": 261514, "epoch": 3150} {"train_loss": -25.22159767150879, "global_step": 261515, "epoch": 3150} {"train_loss": -24.73068618774414, "global_step": 261516, "epoch": 3150} {"train_loss": -25.274120330810547, "global_step": 261517, "epoch": 3150} {"train_loss": -25.024932861328125, "global_step": 261518, "epoch": 3150} {"train_loss": -24.79549217224121, "global_step": 261519, "epoch": 3150} {"train_loss": -25.0416316986084, "global_step": 261520, "epoch": 3150} {"train_loss": -25.445905685424805, "global_step": 261521, "epoch": 3150} {"train_loss": -25.34323501586914, "global_step": 261522, "epoch": 3150} {"train_loss": -25.635725021362305, "global_step": 261523, "epoch": 3150} {"train_loss": -25.235570907592773, "global_step": 261524, "epoch": 3150} {"train_loss": -25.1423282623291, "global_step": 261525, "epoch": 3150} {"train_loss": -25.268640518188477, "global_step": 261526, "epoch": 3150} {"train_loss": -25.29811668395996, "global_step": 261527, "epoch": 3150} {"train_loss": -25.103334426879883, "global_step": 261528, "epoch": 3150} {"train_loss": -25.08942985534668, "global_step": 261529, "epoch": 3150} {"train_loss": -25.67396354675293, "global_step": 261530, "epoch": 3150} {"train_loss": -24.99047088623047, "global_step": 261531, "epoch": 3150} {"train_loss": -24.8882277155497, "global_step": 261532, "epoch": 3150, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 7070764.0} {"train_loss": -25.264806747436523, "global_step": 261533, "epoch": 3151} {"train_loss": -25.010778427124023, "global_step": 261534, "epoch": 3151} {"train_loss": -24.984106063842773, "global_step": 261535, "epoch": 3151} {"train_loss": -25.250059127807617, "global_step": 261536, "epoch": 3151} {"train_loss": -25.316497802734375, "global_step": 261537, "epoch": 3151} {"train_loss": -25.04168701171875, "global_step": 261538, "epoch": 3151} {"train_loss": -25.46858024597168, "global_step": 261539, "epoch": 3151} {"train_loss": -25.171506881713867, "global_step": 261540, "epoch": 3151} {"train_loss": -25.241737365722656, "global_step": 261541, "epoch": 3151} {"train_loss": -25.272146224975586, "global_step": 261542, "epoch": 3151} {"train_loss": -25.263032913208008, "global_step": 261543, "epoch": 3151} {"train_loss": -24.687213897705078, "global_step": 261544, "epoch": 3151} {"train_loss": -25.055438995361328, "global_step": 261545, "epoch": 3151} {"train_loss": -25.456491470336914, "global_step": 261546, "epoch": 3151} {"train_loss": -24.926868438720703, "global_step": 261547, "epoch": 3151} {"train_loss": -24.93532371520996, "global_step": 261548, "epoch": 3151} {"train_loss": -25.417280197143555, "global_step": 261549, "epoch": 3151} {"train_loss": -25.46722412109375, "global_step": 261550, "epoch": 3151} {"train_loss": -25.145462036132812, "global_step": 261551, "epoch": 3151} {"train_loss": -24.89286231994629, "global_step": 261552, "epoch": 3151} {"train_loss": -24.841161727905273, "global_step": 261553, "epoch": 3151} {"train_loss": -25.382116317749023, "global_step": 261554, "epoch": 3151} {"train_loss": -25.33737564086914, "global_step": 261555, "epoch": 3151} {"train_loss": -24.50132179260254, "global_step": 261556, "epoch": 3151} {"train_loss": -25.387928009033203, "global_step": 261557, "epoch": 3151} {"train_loss": -24.869171142578125, "global_step": 261558, "epoch": 3151} {"train_loss": -25.237070083618164, "global_step": 261559, "epoch": 3151} {"train_loss": -25.399154663085938, "global_step": 261560, "epoch": 3151} {"train_loss": -25.161945343017578, "global_step": 261561, "epoch": 3151} {"train_loss": -25.32110595703125, "global_step": 261562, "epoch": 3151} {"train_loss": -24.928163528442383, "global_step": 261563, "epoch": 3151} {"train_loss": -25.157121658325195, "global_step": 261564, "epoch": 3151} {"train_loss": -25.32621955871582, "global_step": 261565, "epoch": 3151} {"train_loss": -25.258394241333008, "global_step": 261566, "epoch": 3151} {"train_loss": -25.256406784057617, "global_step": 261567, "epoch": 3151} {"train_loss": -24.7943058013916, "global_step": 261568, "epoch": 3151} {"train_loss": -25.051401138305664, "global_step": 261569, "epoch": 3151} {"train_loss": -25.27144432067871, "global_step": 261570, "epoch": 3151} {"train_loss": -25.216449737548828, "global_step": 261571, "epoch": 3151} {"train_loss": -25.155080795288086, "global_step": 261572, "epoch": 3151} {"train_loss": -25.479005813598633, "global_step": 261573, "epoch": 3151} {"train_loss": -25.3698787689209, "global_step": 261574, "epoch": 3151} {"train_loss": -25.390714645385742, "global_step": 261575, "epoch": 3151} {"train_loss": -25.25522804260254, "global_step": 261576, "epoch": 3151} {"train_loss": -25.52742576599121, "global_step": 261577, "epoch": 3151} {"train_loss": -25.20586585998535, "global_step": 261578, "epoch": 3151} {"train_loss": -25.187170028686523, "global_step": 261579, "epoch": 3151} {"train_loss": -25.041234970092773, "global_step": 261580, "epoch": 3151} {"train_loss": -25.002546310424805, "global_step": 261581, "epoch": 3151} {"train_loss": -25.33762550354004, "global_step": 261582, "epoch": 3151} {"train_loss": -25.501728057861328, "global_step": 261583, "epoch": 3151} {"train_loss": -25.163785934448242, "global_step": 261584, "epoch": 3151} {"train_loss": -25.409761428833008, "global_step": 261585, "epoch": 3151} {"train_loss": -25.1022891998291, "global_step": 261586, "epoch": 3151} {"train_loss": -24.978660583496094, "global_step": 261587, "epoch": 3151} {"train_loss": -25.447616577148438, "global_step": 261588, "epoch": 3151} {"train_loss": -25.467321395874023, "global_step": 261589, "epoch": 3151} {"train_loss": -25.342432022094727, "global_step": 261590, "epoch": 3151} {"train_loss": -25.244033813476562, "global_step": 261591, "epoch": 3151} {"train_loss": -25.129487991333008, "global_step": 261592, "epoch": 3151} {"train_loss": -25.39961051940918, "global_step": 261593, "epoch": 3151} {"train_loss": -25.32826805114746, "global_step": 261594, "epoch": 3151} {"train_loss": -25.456024169921875, "global_step": 261595, "epoch": 3151} {"train_loss": -25.12563133239746, "global_step": 261596, "epoch": 3151} {"train_loss": -25.143814086914062, "global_step": 261597, "epoch": 3151} {"train_loss": -24.968887329101562, "global_step": 261598, "epoch": 3151} {"train_loss": -25.01631736755371, "global_step": 261599, "epoch": 3151} {"train_loss": -24.81184196472168, "global_step": 261600, "epoch": 3151} {"train_loss": -25.497018814086914, "global_step": 261601, "epoch": 3151} {"train_loss": -24.719491958618164, "global_step": 261602, "epoch": 3151} {"train_loss": -24.913034439086914, "global_step": 261603, "epoch": 3151} {"train_loss": -24.898578643798828, "global_step": 261604, "epoch": 3151} {"train_loss": -24.917255401611328, "global_step": 261605, "epoch": 3151} {"train_loss": -24.651945114135742, "global_step": 261606, "epoch": 3151} {"train_loss": -24.703689575195312, "global_step": 261607, "epoch": 3151} {"train_loss": -25.338632583618164, "global_step": 261608, "epoch": 3151} {"train_loss": -25.255069732666016, "global_step": 261609, "epoch": 3151} {"train_loss": -25.15276527404785, "global_step": 261610, "epoch": 3151} {"train_loss": -25.297468185424805, "global_step": 261611, "epoch": 3151} {"train_loss": -25.43684196472168, "global_step": 261612, "epoch": 3151} {"train_loss": -25.460140228271484, "global_step": 261613, "epoch": 3151} {"train_loss": -25.26637840270996, "global_step": 261614, "epoch": 3151} {"train_loss": -25.16665612645896, "global_step": 261615, "epoch": 3151, "val_loss": 6894378.0} {"train_loss": -25.129133224487305, "global_step": 261616, "epoch": 3152} {"train_loss": -25.15431022644043, "global_step": 261617, "epoch": 3152} {"train_loss": -25.003808975219727, "global_step": 261618, "epoch": 3152} {"train_loss": -25.401878356933594, "global_step": 261619, "epoch": 3152} {"train_loss": -25.036182403564453, "global_step": 261620, "epoch": 3152} {"train_loss": -24.96674156188965, "global_step": 261621, "epoch": 3152} {"train_loss": -25.05774688720703, "global_step": 261622, "epoch": 3152} {"train_loss": -25.002784729003906, "global_step": 261623, "epoch": 3152} {"train_loss": -25.47784423828125, "global_step": 261624, "epoch": 3152} {"train_loss": -24.63774299621582, "global_step": 261625, "epoch": 3152} {"train_loss": -24.988916397094727, "global_step": 261626, "epoch": 3152} {"train_loss": -25.12384605407715, "global_step": 261627, "epoch": 3152} {"train_loss": -25.312515258789062, "global_step": 261628, "epoch": 3152} {"train_loss": -25.552093505859375, "global_step": 261629, "epoch": 3152} {"train_loss": -25.28436851501465, "global_step": 261630, "epoch": 3152} {"train_loss": -24.806501388549805, "global_step": 261631, "epoch": 3152} {"train_loss": -25.284215927124023, "global_step": 261632, "epoch": 3152} {"train_loss": -25.516311645507812, "global_step": 261633, "epoch": 3152} {"train_loss": -24.992177963256836, "global_step": 261634, "epoch": 3152} {"train_loss": -24.939085006713867, "global_step": 261635, "epoch": 3152} {"train_loss": -24.914499282836914, "global_step": 261636, "epoch": 3152} {"train_loss": -24.874975204467773, "global_step": 261637, "epoch": 3152} {"train_loss": -24.88259506225586, "global_step": 261638, "epoch": 3152} {"train_loss": -25.292932510375977, "global_step": 261639, "epoch": 3152} {"train_loss": -25.33614158630371, "global_step": 261640, "epoch": 3152} {"train_loss": -25.516681671142578, "global_step": 261641, "epoch": 3152} {"train_loss": -24.982364654541016, "global_step": 261642, "epoch": 3152} {"train_loss": -25.32101821899414, "global_step": 261643, "epoch": 3152} {"train_loss": -25.33746910095215, "global_step": 261644, "epoch": 3152} {"train_loss": -25.365447998046875, "global_step": 261645, "epoch": 3152} {"train_loss": -25.033227920532227, "global_step": 261646, "epoch": 3152} {"train_loss": -25.29878807067871, "global_step": 261647, "epoch": 3152} {"train_loss": -25.079504013061523, "global_step": 261648, "epoch": 3152} {"train_loss": -25.287017822265625, "global_step": 261649, "epoch": 3152} {"train_loss": -25.25568962097168, "global_step": 261650, "epoch": 3152} {"train_loss": -25.078571319580078, "global_step": 261651, "epoch": 3152} {"train_loss": -25.207046508789062, "global_step": 261652, "epoch": 3152} {"train_loss": -24.872947692871094, "global_step": 261653, "epoch": 3152} {"train_loss": -25.291542053222656, "global_step": 261654, "epoch": 3152} {"train_loss": -25.157480239868164, "global_step": 261655, "epoch": 3152} {"train_loss": -25.0246639251709, "global_step": 261656, "epoch": 3152} {"train_loss": -25.198352813720703, "global_step": 261657, "epoch": 3152} {"train_loss": -25.292020797729492, "global_step": 261658, "epoch": 3152} {"train_loss": -25.280996322631836, "global_step": 261659, "epoch": 3152} {"train_loss": -25.278085708618164, "global_step": 261660, "epoch": 3152} {"train_loss": -25.27997398376465, "global_step": 261661, "epoch": 3152} {"train_loss": -25.441421508789062, "global_step": 261662, "epoch": 3152} {"train_loss": -25.60520362854004, "global_step": 261663, "epoch": 3152} {"train_loss": -25.111047744750977, "global_step": 261664, "epoch": 3152} {"train_loss": -25.50822639465332, "global_step": 261665, "epoch": 3152} {"train_loss": -25.300756454467773, "global_step": 261666, "epoch": 3152} {"train_loss": -25.361242294311523, "global_step": 261667, "epoch": 3152} {"train_loss": -25.21382713317871, "global_step": 261668, "epoch": 3152} {"train_loss": -25.000709533691406, "global_step": 261669, "epoch": 3152} {"train_loss": -24.95404624938965, "global_step": 261670, "epoch": 3152} {"train_loss": -25.332677841186523, "global_step": 261671, "epoch": 3152} {"train_loss": -25.406240463256836, "global_step": 261672, "epoch": 3152} {"train_loss": -25.620807647705078, "global_step": 261673, "epoch": 3152} {"train_loss": -25.205347061157227, "global_step": 261674, "epoch": 3152} {"train_loss": -25.203031539916992, "global_step": 261675, "epoch": 3152} {"train_loss": -25.470945358276367, "global_step": 261676, "epoch": 3152} {"train_loss": -25.20418930053711, "global_step": 261677, "epoch": 3152} {"train_loss": -25.245269775390625, "global_step": 261678, "epoch": 3152} {"train_loss": -25.471267700195312, "global_step": 261679, "epoch": 3152} {"train_loss": -25.188993453979492, "global_step": 261680, "epoch": 3152} {"train_loss": -25.31416893005371, "global_step": 261681, "epoch": 3152} {"train_loss": -24.89349937438965, "global_step": 261682, "epoch": 3152} {"train_loss": -24.740564346313477, "global_step": 261683, "epoch": 3152} {"train_loss": -24.955982208251953, "global_step": 261684, "epoch": 3152} {"train_loss": -25.11866569519043, "global_step": 261685, "epoch": 3152} {"train_loss": -24.833406448364258, "global_step": 261686, "epoch": 3152} {"train_loss": -24.980276107788086, "global_step": 261687, "epoch": 3152} {"train_loss": -25.19610595703125, "global_step": 261688, "epoch": 3152} {"train_loss": -24.897119522094727, "global_step": 261689, "epoch": 3152} {"train_loss": -24.980871200561523, "global_step": 261690, "epoch": 3152} {"train_loss": -25.235933303833008, "global_step": 261691, "epoch": 3152} {"train_loss": -25.074365615844727, "global_step": 261692, "epoch": 3152} {"train_loss": -25.137155532836914, "global_step": 261693, "epoch": 3152} {"train_loss": -24.857040405273438, "global_step": 261694, "epoch": 3152} {"train_loss": -24.885833740234375, "global_step": 261695, "epoch": 3152} {"train_loss": -24.74129295349121, "global_step": 261696, "epoch": 3152} {"train_loss": -25.305917739868164, "global_step": 261697, "epoch": 3152} {"train_loss": -25.172053325607116, "global_step": 261698, "epoch": 3152, "val_loss": 6809619.0} {"train_loss": -24.940420150756836, "global_step": 261699, "epoch": 3153} {"train_loss": -24.682514190673828, "global_step": 261700, "epoch": 3153} {"train_loss": -24.879165649414062, "global_step": 261701, "epoch": 3153} {"train_loss": -24.690046310424805, "global_step": 261702, "epoch": 3153} {"train_loss": -24.49071502685547, "global_step": 261703, "epoch": 3153} {"train_loss": -24.525150299072266, "global_step": 261704, "epoch": 3153} {"train_loss": -24.530380249023438, "global_step": 261705, "epoch": 3153} {"train_loss": -24.6044921875, "global_step": 261706, "epoch": 3153} {"train_loss": -24.579893112182617, "global_step": 261707, "epoch": 3153} {"train_loss": -24.66792106628418, "global_step": 261708, "epoch": 3153} {"train_loss": -24.33733558654785, "global_step": 261709, "epoch": 3153} {"train_loss": -24.61689567565918, "global_step": 261710, "epoch": 3153} {"train_loss": -24.693944931030273, "global_step": 261711, "epoch": 3153} {"train_loss": -24.980087280273438, "global_step": 261712, "epoch": 3153} {"train_loss": -24.33500862121582, "global_step": 261713, "epoch": 3153} {"train_loss": -24.444480895996094, "global_step": 261714, "epoch": 3153} {"train_loss": -24.706127166748047, "global_step": 261715, "epoch": 3153} {"train_loss": -24.747655868530273, "global_step": 261716, "epoch": 3153} {"train_loss": -24.97135353088379, "global_step": 261717, "epoch": 3153} {"train_loss": -24.970380783081055, "global_step": 261718, "epoch": 3153} {"train_loss": -24.815412521362305, "global_step": 261719, "epoch": 3153} {"train_loss": -25.015268325805664, "global_step": 261720, "epoch": 3153} {"train_loss": -25.396656036376953, "global_step": 261721, "epoch": 3153} {"train_loss": -25.193241119384766, "global_step": 261722, "epoch": 3153} {"train_loss": -25.274999618530273, "global_step": 261723, "epoch": 3153} {"train_loss": -25.423654556274414, "global_step": 261724, "epoch": 3153} {"train_loss": -25.179838180541992, "global_step": 261725, "epoch": 3153} {"train_loss": -25.063440322875977, "global_step": 261726, "epoch": 3153} {"train_loss": -25.09366798400879, "global_step": 261727, "epoch": 3153} {"train_loss": -24.784006118774414, "global_step": 261728, "epoch": 3153} {"train_loss": -25.044706344604492, "global_step": 261729, "epoch": 3153} {"train_loss": -25.153274536132812, "global_step": 261730, "epoch": 3153} {"train_loss": -25.26272201538086, "global_step": 261731, "epoch": 3153} {"train_loss": -25.64971351623535, "global_step": 261732, "epoch": 3153} {"train_loss": -25.38152503967285, "global_step": 261733, "epoch": 3153} {"train_loss": -25.56438636779785, "global_step": 261734, "epoch": 3153} {"train_loss": -25.842010498046875, "global_step": 261735, "epoch": 3153} {"train_loss": -25.623083114624023, "global_step": 261736, "epoch": 3153} {"train_loss": -25.13227653503418, "global_step": 261737, "epoch": 3153} {"train_loss": -25.17896842956543, "global_step": 261738, "epoch": 3153} {"train_loss": -24.924985885620117, "global_step": 261739, "epoch": 3153} {"train_loss": -24.40502166748047, "global_step": 261740, "epoch": 3153} {"train_loss": -24.915639877319336, "global_step": 261741, "epoch": 3153} {"train_loss": -24.894697189331055, "global_step": 261742, "epoch": 3153} {"train_loss": -25.105993270874023, "global_step": 261743, "epoch": 3153} {"train_loss": -25.09328842163086, "global_step": 261744, "epoch": 3153} {"train_loss": -25.260337829589844, "global_step": 261745, "epoch": 3153} {"train_loss": -25.017560958862305, "global_step": 261746, "epoch": 3153} {"train_loss": -25.130857467651367, "global_step": 261747, "epoch": 3153} {"train_loss": -25.236772537231445, "global_step": 261748, "epoch": 3153} {"train_loss": -24.98550796508789, "global_step": 261749, "epoch": 3153} {"train_loss": -25.13151741027832, "global_step": 261750, "epoch": 3153} {"train_loss": -24.800378799438477, "global_step": 261751, "epoch": 3153} {"train_loss": -24.865440368652344, "global_step": 261752, "epoch": 3153} {"train_loss": -24.782638549804688, "global_step": 261753, "epoch": 3153} {"train_loss": -24.03302764892578, "global_step": 261754, "epoch": 3153} {"train_loss": -25.16651725769043, "global_step": 261755, "epoch": 3153} {"train_loss": -25.0463809967041, "global_step": 261756, "epoch": 3153} {"train_loss": -24.93415069580078, "global_step": 261757, "epoch": 3153} {"train_loss": -24.97420310974121, "global_step": 261758, "epoch": 3153} {"train_loss": -24.922266006469727, "global_step": 261759, "epoch": 3153} {"train_loss": -25.01453971862793, "global_step": 261760, "epoch": 3153} {"train_loss": -25.356599807739258, "global_step": 261761, "epoch": 3153} {"train_loss": -24.720478057861328, "global_step": 261762, "epoch": 3153} {"train_loss": -25.213293075561523, "global_step": 261763, "epoch": 3153} {"train_loss": -25.102949142456055, "global_step": 261764, "epoch": 3153} {"train_loss": -25.0421199798584, "global_step": 261765, "epoch": 3153} {"train_loss": -25.550661087036133, "global_step": 261766, "epoch": 3153} {"train_loss": -25.177305221557617, "global_step": 261767, "epoch": 3153} {"train_loss": -25.26717185974121, "global_step": 261768, "epoch": 3153} {"train_loss": -25.13227081298828, "global_step": 261769, "epoch": 3153} {"train_loss": -25.0921573638916, "global_step": 261770, "epoch": 3153} {"train_loss": -25.025787353515625, "global_step": 261771, "epoch": 3153} {"train_loss": -24.915908813476562, "global_step": 261772, "epoch": 3153} {"train_loss": -25.271652221679688, "global_step": 261773, "epoch": 3153} {"train_loss": -25.574682235717773, "global_step": 261774, "epoch": 3153} {"train_loss": -25.368318557739258, "global_step": 261775, "epoch": 3153} {"train_loss": -24.756925582885742, "global_step": 261776, "epoch": 3153} {"train_loss": -25.199365615844727, "global_step": 261777, "epoch": 3153} {"train_loss": -25.15656089782715, "global_step": 261778, "epoch": 3153} {"train_loss": -25.49017333984375, "global_step": 261779, "epoch": 3153} {"train_loss": -25.34332847595215, "global_step": 261780, "epoch": 3153} {"train_loss": -25.02388496858528, "global_step": 261781, "epoch": 3153, "val_loss": 6890095.0} {"train_loss": -24.88937759399414, "global_step": 261782, "epoch": 3154} {"train_loss": -25.007600784301758, "global_step": 261783, "epoch": 3154} {"train_loss": -24.795202255249023, "global_step": 261784, "epoch": 3154} {"train_loss": -24.523832321166992, "global_step": 261785, "epoch": 3154} {"train_loss": -24.627765655517578, "global_step": 261786, "epoch": 3154} {"train_loss": -24.68849754333496, "global_step": 261787, "epoch": 3154} {"train_loss": -24.521860122680664, "global_step": 261788, "epoch": 3154} {"train_loss": -24.801816940307617, "global_step": 261789, "epoch": 3154} {"train_loss": -24.920455932617188, "global_step": 261790, "epoch": 3154} {"train_loss": -25.318193435668945, "global_step": 261791, "epoch": 3154} {"train_loss": -25.2825927734375, "global_step": 261792, "epoch": 3154} {"train_loss": -24.673656463623047, "global_step": 261793, "epoch": 3154} {"train_loss": -25.040943145751953, "global_step": 261794, "epoch": 3154} {"train_loss": -25.123701095581055, "global_step": 261795, "epoch": 3154} {"train_loss": -25.25787353515625, "global_step": 261796, "epoch": 3154} {"train_loss": -25.24555015563965, "global_step": 261797, "epoch": 3154} {"train_loss": -25.34747886657715, "global_step": 261798, "epoch": 3154} {"train_loss": -25.271902084350586, "global_step": 261799, "epoch": 3154} {"train_loss": -25.303363800048828, "global_step": 261800, "epoch": 3154} {"train_loss": -25.279970169067383, "global_step": 261801, "epoch": 3154} {"train_loss": -24.97201919555664, "global_step": 261802, "epoch": 3154} {"train_loss": -25.012277603149414, "global_step": 261803, "epoch": 3154} {"train_loss": -25.378250122070312, "global_step": 261804, "epoch": 3154} {"train_loss": -25.207300186157227, "global_step": 261805, "epoch": 3154} {"train_loss": -25.189115524291992, "global_step": 261806, "epoch": 3154} {"train_loss": -25.19571304321289, "global_step": 261807, "epoch": 3154} {"train_loss": -25.35585594177246, "global_step": 261808, "epoch": 3154} {"train_loss": -25.08588218688965, "global_step": 261809, "epoch": 3154} {"train_loss": -25.392271041870117, "global_step": 261810, "epoch": 3154} {"train_loss": -25.184173583984375, "global_step": 261811, "epoch": 3154} {"train_loss": -25.393699645996094, "global_step": 261812, "epoch": 3154} {"train_loss": -25.001480102539062, "global_step": 261813, "epoch": 3154} {"train_loss": -25.064163208007812, "global_step": 261814, "epoch": 3154} {"train_loss": -25.371875762939453, "global_step": 261815, "epoch": 3154} {"train_loss": -25.40981101989746, "global_step": 261816, "epoch": 3154} {"train_loss": -25.200218200683594, "global_step": 261817, "epoch": 3154} {"train_loss": -25.329214096069336, "global_step": 261818, "epoch": 3154} {"train_loss": -25.196439743041992, "global_step": 261819, "epoch": 3154} {"train_loss": -25.27545166015625, "global_step": 261820, "epoch": 3154} {"train_loss": -25.183950424194336, "global_step": 261821, "epoch": 3154} {"train_loss": -25.381025314331055, "global_step": 261822, "epoch": 3154} {"train_loss": -25.405078887939453, "global_step": 261823, "epoch": 3154} {"train_loss": -25.071779251098633, "global_step": 261824, "epoch": 3154} {"train_loss": -25.0545654296875, "global_step": 261825, "epoch": 3154} {"train_loss": -25.502309799194336, "global_step": 261826, "epoch": 3154} {"train_loss": -25.12786293029785, "global_step": 261827, "epoch": 3154} {"train_loss": -25.040205001831055, "global_step": 261828, "epoch": 3154} {"train_loss": -25.35281753540039, "global_step": 261829, "epoch": 3154} {"train_loss": -24.983304977416992, "global_step": 261830, "epoch": 3154} {"train_loss": -25.215194702148438, "global_step": 261831, "epoch": 3154} {"train_loss": -25.165029525756836, "global_step": 261832, "epoch": 3154} {"train_loss": -25.04646873474121, "global_step": 261833, "epoch": 3154} {"train_loss": -25.211166381835938, "global_step": 261834, "epoch": 3154} {"train_loss": -24.55377769470215, "global_step": 261835, "epoch": 3154} {"train_loss": -25.089744567871094, "global_step": 261836, "epoch": 3154} {"train_loss": -24.98829460144043, "global_step": 261837, "epoch": 3154} {"train_loss": -25.607385635375977, "global_step": 261838, "epoch": 3154} {"train_loss": -24.93491554260254, "global_step": 261839, "epoch": 3154} {"train_loss": -24.844831466674805, "global_step": 261840, "epoch": 3154} {"train_loss": -25.25153160095215, "global_step": 261841, "epoch": 3154} {"train_loss": -25.09278106689453, "global_step": 261842, "epoch": 3154} {"train_loss": -24.72623634338379, "global_step": 261843, "epoch": 3154} {"train_loss": -25.10963249206543, "global_step": 261844, "epoch": 3154} {"train_loss": -25.34661293029785, "global_step": 261845, "epoch": 3154} {"train_loss": -24.876964569091797, "global_step": 261846, "epoch": 3154} {"train_loss": -25.000511169433594, "global_step": 261847, "epoch": 3154} {"train_loss": -24.96393585205078, "global_step": 261848, "epoch": 3154} {"train_loss": -25.35199546813965, "global_step": 261849, "epoch": 3154} {"train_loss": -25.12419891357422, "global_step": 261850, "epoch": 3154} {"train_loss": -24.881643295288086, "global_step": 261851, "epoch": 3154} {"train_loss": -25.24400520324707, "global_step": 261852, "epoch": 3154} {"train_loss": -25.369638442993164, "global_step": 261853, "epoch": 3154} {"train_loss": -25.137191772460938, "global_step": 261854, "epoch": 3154} {"train_loss": -25.63655662536621, "global_step": 261855, "epoch": 3154} {"train_loss": -25.347986221313477, "global_step": 261856, "epoch": 3154} {"train_loss": -25.109704971313477, "global_step": 261857, "epoch": 3154} {"train_loss": -25.49258804321289, "global_step": 261858, "epoch": 3154} {"train_loss": -25.22328758239746, "global_step": 261859, "epoch": 3154} {"train_loss": -24.9903621673584, "global_step": 261860, "epoch": 3154} {"train_loss": -25.451337814331055, "global_step": 261861, "epoch": 3154} {"train_loss": -25.291486740112305, "global_step": 261862, "epoch": 3154} {"train_loss": -25.475841522216797, "global_step": 261863, "epoch": 3154} {"train_loss": -25.14394199417298, "global_step": 261864, "epoch": 3154, "val_loss": 6882581.0} {"train_loss": -24.792150497436523, "global_step": 261865, "epoch": 3155} {"train_loss": -23.679540634155273, "global_step": 261866, "epoch": 3155} {"train_loss": -24.367467880249023, "global_step": 261867, "epoch": 3155} {"train_loss": -24.171710968017578, "global_step": 261868, "epoch": 3155} {"train_loss": -24.507749557495117, "global_step": 261869, "epoch": 3155} {"train_loss": -23.705142974853516, "global_step": 261870, "epoch": 3155} {"train_loss": -24.947050094604492, "global_step": 261871, "epoch": 3155} {"train_loss": -24.3407039642334, "global_step": 261872, "epoch": 3155} {"train_loss": -24.3797550201416, "global_step": 261873, "epoch": 3155} {"train_loss": -24.58860206604004, "global_step": 261874, "epoch": 3155} {"train_loss": -24.77242088317871, "global_step": 261875, "epoch": 3155} {"train_loss": -24.790557861328125, "global_step": 261876, "epoch": 3155} {"train_loss": -24.758581161499023, "global_step": 261877, "epoch": 3155} {"train_loss": -24.7617130279541, "global_step": 261878, "epoch": 3155} {"train_loss": -24.810882568359375, "global_step": 261879, "epoch": 3155} {"train_loss": -24.656803131103516, "global_step": 261880, "epoch": 3155} {"train_loss": -24.674163818359375, "global_step": 261881, "epoch": 3155} {"train_loss": -24.699058532714844, "global_step": 261882, "epoch": 3155} {"train_loss": -24.98505973815918, "global_step": 261883, "epoch": 3155} {"train_loss": -24.898807525634766, "global_step": 261884, "epoch": 3155} {"train_loss": -24.958621978759766, "global_step": 261885, "epoch": 3155} {"train_loss": -24.764225006103516, "global_step": 261886, "epoch": 3155} {"train_loss": -25.172494888305664, "global_step": 261887, "epoch": 3155} {"train_loss": -25.049406051635742, "global_step": 261888, "epoch": 3155} {"train_loss": -25.237001419067383, "global_step": 261889, "epoch": 3155} {"train_loss": -25.028736114501953, "global_step": 261890, "epoch": 3155} {"train_loss": -24.9199275970459, "global_step": 261891, "epoch": 3155} {"train_loss": -25.331424713134766, "global_step": 261892, "epoch": 3155} {"train_loss": -25.00014305114746, "global_step": 261893, "epoch": 3155} {"train_loss": -25.122135162353516, "global_step": 261894, "epoch": 3155} {"train_loss": -25.22171974182129, "global_step": 261895, "epoch": 3155} {"train_loss": -25.32881736755371, "global_step": 261896, "epoch": 3155} {"train_loss": -24.870309829711914, "global_step": 261897, "epoch": 3155} {"train_loss": -25.398130416870117, "global_step": 261898, "epoch": 3155} {"train_loss": -25.185346603393555, "global_step": 261899, "epoch": 3155} {"train_loss": -25.6068172454834, "global_step": 261900, "epoch": 3155} {"train_loss": -25.18317222595215, "global_step": 261901, "epoch": 3155} {"train_loss": -25.48646354675293, "global_step": 261902, "epoch": 3155} {"train_loss": -25.210294723510742, "global_step": 261903, "epoch": 3155} {"train_loss": -25.005943298339844, "global_step": 261904, "epoch": 3155} {"train_loss": -25.449726104736328, "global_step": 261905, "epoch": 3155} {"train_loss": -25.120206832885742, "global_step": 261906, "epoch": 3155} {"train_loss": -25.61295509338379, "global_step": 261907, "epoch": 3155} {"train_loss": -25.551259994506836, "global_step": 261908, "epoch": 3155} {"train_loss": -25.582962036132812, "global_step": 261909, "epoch": 3155} {"train_loss": -25.65665054321289, "global_step": 261910, "epoch": 3155} {"train_loss": -25.014616012573242, "global_step": 261911, "epoch": 3155} {"train_loss": -24.963773727416992, "global_step": 261912, "epoch": 3155} {"train_loss": -24.80804443359375, "global_step": 261913, "epoch": 3155} {"train_loss": -25.66016960144043, "global_step": 261914, "epoch": 3155} {"train_loss": -25.297115325927734, "global_step": 261915, "epoch": 3155} {"train_loss": -25.14386558532715, "global_step": 261916, "epoch": 3155} {"train_loss": -25.13812828063965, "global_step": 261917, "epoch": 3155} {"train_loss": -24.944849014282227, "global_step": 261918, "epoch": 3155} {"train_loss": -25.44189453125, "global_step": 261919, "epoch": 3155} {"train_loss": -25.263755798339844, "global_step": 261920, "epoch": 3155} {"train_loss": -24.917049407958984, "global_step": 261921, "epoch": 3155} {"train_loss": -24.935760498046875, "global_step": 261922, "epoch": 3155} {"train_loss": -25.691532135009766, "global_step": 261923, "epoch": 3155} {"train_loss": -25.14998435974121, "global_step": 261924, "epoch": 3155} {"train_loss": -24.94684410095215, "global_step": 261925, "epoch": 3155} {"train_loss": -25.061145782470703, "global_step": 261926, "epoch": 3155} {"train_loss": -25.1455135345459, "global_step": 261927, "epoch": 3155} {"train_loss": -25.0018253326416, "global_step": 261928, "epoch": 3155} {"train_loss": -24.97406578063965, "global_step": 261929, "epoch": 3155} {"train_loss": -25.246078491210938, "global_step": 261930, "epoch": 3155} {"train_loss": -25.10471534729004, "global_step": 261931, "epoch": 3155} {"train_loss": -24.718313217163086, "global_step": 261932, "epoch": 3155} {"train_loss": -25.579198837280273, "global_step": 261933, "epoch": 3155} {"train_loss": -25.272829055786133, "global_step": 261934, "epoch": 3155} {"train_loss": -25.24574851989746, "global_step": 261935, "epoch": 3155} {"train_loss": -24.94931411743164, "global_step": 261936, "epoch": 3155} {"train_loss": -24.749887466430664, "global_step": 261937, "epoch": 3155} {"train_loss": -24.63344383239746, "global_step": 261938, "epoch": 3155} {"train_loss": -25.207792282104492, "global_step": 261939, "epoch": 3155} {"train_loss": -25.34866714477539, "global_step": 261940, "epoch": 3155} {"train_loss": -24.967710494995117, "global_step": 261941, "epoch": 3155} {"train_loss": -25.070781707763672, "global_step": 261942, "epoch": 3155} {"train_loss": -25.547534942626953, "global_step": 261943, "epoch": 3155} {"train_loss": -25.113122940063477, "global_step": 261944, "epoch": 3155} {"train_loss": -25.14603042602539, "global_step": 261945, "epoch": 3155} {"train_loss": -25.39410972595215, "global_step": 261946, "epoch": 3155} {"train_loss": -25.035316972847443, "global_step": 261947, "epoch": 3155, "val_loss": 6995358.5} {"train_loss": -24.78315544128418, "global_step": 261948, "epoch": 3156} {"train_loss": -24.950952529907227, "global_step": 261949, "epoch": 3156} {"train_loss": -24.83734703063965, "global_step": 261950, "epoch": 3156} {"train_loss": -24.747116088867188, "global_step": 261951, "epoch": 3156} {"train_loss": -25.2772274017334, "global_step": 261952, "epoch": 3156} {"train_loss": -25.2667236328125, "global_step": 261953, "epoch": 3156} {"train_loss": -24.842557907104492, "global_step": 261954, "epoch": 3156} {"train_loss": -25.107574462890625, "global_step": 261955, "epoch": 3156} {"train_loss": -25.406789779663086, "global_step": 261956, "epoch": 3156} {"train_loss": -25.2514705657959, "global_step": 261957, "epoch": 3156} {"train_loss": -25.098764419555664, "global_step": 261958, "epoch": 3156} {"train_loss": -25.21143341064453, "global_step": 261959, "epoch": 3156} {"train_loss": -25.219013214111328, "global_step": 261960, "epoch": 3156} {"train_loss": -25.207927703857422, "global_step": 261961, "epoch": 3156} {"train_loss": -25.533639907836914, "global_step": 261962, "epoch": 3156} {"train_loss": -24.89652442932129, "global_step": 261963, "epoch": 3156} {"train_loss": -25.26984977722168, "global_step": 261964, "epoch": 3156} {"train_loss": -25.253015518188477, "global_step": 261965, "epoch": 3156} {"train_loss": -25.29288673400879, "global_step": 261966, "epoch": 3156} {"train_loss": -25.33857536315918, "global_step": 261967, "epoch": 3156} {"train_loss": -25.047910690307617, "global_step": 261968, "epoch": 3156} {"train_loss": -25.178030014038086, "global_step": 261969, "epoch": 3156} {"train_loss": -25.262964248657227, "global_step": 261970, "epoch": 3156} {"train_loss": -25.114547729492188, "global_step": 261971, "epoch": 3156} {"train_loss": -25.275285720825195, "global_step": 261972, "epoch": 3156} {"train_loss": -24.83450698852539, "global_step": 261973, "epoch": 3156} {"train_loss": -24.893325805664062, "global_step": 261974, "epoch": 3156} {"train_loss": -25.13873291015625, "global_step": 261975, "epoch": 3156} {"train_loss": -25.448699951171875, "global_step": 261976, "epoch": 3156} {"train_loss": -25.448408126831055, "global_step": 261977, "epoch": 3156} {"train_loss": -25.521135330200195, "global_step": 261978, "epoch": 3156} {"train_loss": -25.25666618347168, "global_step": 261979, "epoch": 3156} {"train_loss": -24.991260528564453, "global_step": 261980, "epoch": 3156} {"train_loss": -25.354398727416992, "global_step": 261981, "epoch": 3156} {"train_loss": -25.131114959716797, "global_step": 261982, "epoch": 3156} {"train_loss": -25.482563018798828, "global_step": 261983, "epoch": 3156} {"train_loss": -25.760910034179688, "global_step": 261984, "epoch": 3156} {"train_loss": -25.20026969909668, "global_step": 261985, "epoch": 3156} {"train_loss": -25.2227725982666, "global_step": 261986, "epoch": 3156} {"train_loss": -25.687414169311523, "global_step": 261987, "epoch": 3156} {"train_loss": -25.03521728515625, "global_step": 261988, "epoch": 3156} {"train_loss": -25.026941299438477, "global_step": 261989, "epoch": 3156} {"train_loss": -25.18971061706543, "global_step": 261990, "epoch": 3156} {"train_loss": -24.93106460571289, "global_step": 261991, "epoch": 3156} {"train_loss": -25.291711807250977, "global_step": 261992, "epoch": 3156} {"train_loss": -24.995405197143555, "global_step": 261993, "epoch": 3156} {"train_loss": -25.66362953186035, "global_step": 261994, "epoch": 3156} {"train_loss": -25.369436264038086, "global_step": 261995, "epoch": 3156} {"train_loss": -25.0252742767334, "global_step": 261996, "epoch": 3156} {"train_loss": -25.064260482788086, "global_step": 261997, "epoch": 3156} {"train_loss": -25.31439781188965, "global_step": 261998, "epoch": 3156} {"train_loss": -25.058515548706055, "global_step": 261999, "epoch": 3156} {"train_loss": -25.164770126342773, "global_step": 262000, "epoch": 3156} {"train_loss": -25.032989501953125, "global_step": 262001, "epoch": 3156} {"train_loss": -24.950204849243164, "global_step": 262002, "epoch": 3156} {"train_loss": -25.314647674560547, "global_step": 262003, "epoch": 3156} {"train_loss": -25.305763244628906, "global_step": 262004, "epoch": 3156} {"train_loss": -25.310688018798828, "global_step": 262005, "epoch": 3156} {"train_loss": -25.20191764831543, "global_step": 262006, "epoch": 3156} {"train_loss": -25.255807876586914, "global_step": 262007, "epoch": 3156} {"train_loss": -24.423259735107422, "global_step": 262008, "epoch": 3156} {"train_loss": -25.183256149291992, "global_step": 262009, "epoch": 3156} {"train_loss": -25.228918075561523, "global_step": 262010, "epoch": 3156} {"train_loss": -25.342884063720703, "global_step": 262011, "epoch": 3156} {"train_loss": -24.889787673950195, "global_step": 262012, "epoch": 3156} {"train_loss": -24.855085372924805, "global_step": 262013, "epoch": 3156} {"train_loss": -25.37282371520996, "global_step": 262014, "epoch": 3156} {"train_loss": -25.486845016479492, "global_step": 262015, "epoch": 3156} {"train_loss": -25.115888595581055, "global_step": 262016, "epoch": 3156} {"train_loss": -25.1606388092041, "global_step": 262017, "epoch": 3156} {"train_loss": -24.71060562133789, "global_step": 262018, "epoch": 3156} {"train_loss": -25.228071212768555, "global_step": 262019, "epoch": 3156} {"train_loss": -25.255847930908203, "global_step": 262020, "epoch": 3156} {"train_loss": -25.081811904907227, "global_step": 262021, "epoch": 3156} {"train_loss": -25.13608741760254, "global_step": 262022, "epoch": 3156} {"train_loss": -25.049102783203125, "global_step": 262023, "epoch": 3156} {"train_loss": -25.472349166870117, "global_step": 262024, "epoch": 3156} {"train_loss": -25.207752227783203, "global_step": 262025, "epoch": 3156} {"train_loss": -24.993242263793945, "global_step": 262026, "epoch": 3156} {"train_loss": -25.47553253173828, "global_step": 262027, "epoch": 3156} {"train_loss": -25.18024444580078, "global_step": 262028, "epoch": 3156} {"train_loss": -25.352407455444336, "global_step": 262029, "epoch": 3156} {"train_loss": -25.152414505740246, "global_step": 262030, "epoch": 3156, "val_loss": 6844633.0} {"train_loss": -22.665475845336914, "global_step": 262031, "epoch": 3157} {"train_loss": -21.815847396850586, "global_step": 262032, "epoch": 3157} {"train_loss": -24.149032592773438, "global_step": 262033, "epoch": 3157} {"train_loss": -24.472976684570312, "global_step": 262034, "epoch": 3157} {"train_loss": -23.434995651245117, "global_step": 262035, "epoch": 3157} {"train_loss": -24.546476364135742, "global_step": 262036, "epoch": 3157} {"train_loss": -24.41946792602539, "global_step": 262037, "epoch": 3157} {"train_loss": -24.663610458374023, "global_step": 262038, "epoch": 3157} {"train_loss": -24.202146530151367, "global_step": 262039, "epoch": 3157} {"train_loss": -24.64076805114746, "global_step": 262040, "epoch": 3157} {"train_loss": -24.421648025512695, "global_step": 262041, "epoch": 3157} {"train_loss": -24.588205337524414, "global_step": 262042, "epoch": 3157} {"train_loss": -24.336406707763672, "global_step": 262043, "epoch": 3157} {"train_loss": -24.491308212280273, "global_step": 262044, "epoch": 3157} {"train_loss": -24.71281623840332, "global_step": 262045, "epoch": 3157} {"train_loss": -24.92054557800293, "global_step": 262046, "epoch": 3157} {"train_loss": -24.874082565307617, "global_step": 262047, "epoch": 3157} {"train_loss": -24.905887603759766, "global_step": 262048, "epoch": 3157} {"train_loss": -24.39138412475586, "global_step": 262049, "epoch": 3157} {"train_loss": -24.8540096282959, "global_step": 262050, "epoch": 3157} {"train_loss": -24.60378074645996, "global_step": 262051, "epoch": 3157} {"train_loss": -24.858173370361328, "global_step": 262052, "epoch": 3157} {"train_loss": -25.08306884765625, "global_step": 262053, "epoch": 3157} {"train_loss": -24.635786056518555, "global_step": 262054, "epoch": 3157} {"train_loss": -24.940637588500977, "global_step": 262055, "epoch": 3157} {"train_loss": -24.882598876953125, "global_step": 262056, "epoch": 3157} {"train_loss": -25.136859893798828, "global_step": 262057, "epoch": 3157} {"train_loss": -24.701284408569336, "global_step": 262058, "epoch": 3157} {"train_loss": -25.021408081054688, "global_step": 262059, "epoch": 3157} {"train_loss": -24.81232261657715, "global_step": 262060, "epoch": 3157} {"train_loss": -25.295379638671875, "global_step": 262061, "epoch": 3157} {"train_loss": -25.118518829345703, "global_step": 262062, "epoch": 3157} {"train_loss": -25.084571838378906, "global_step": 262063, "epoch": 3157} {"train_loss": -25.418607711791992, "global_step": 262064, "epoch": 3157} {"train_loss": -25.36981201171875, "global_step": 262065, "epoch": 3157} {"train_loss": -25.033109664916992, "global_step": 262066, "epoch": 3157} {"train_loss": -24.96259880065918, "global_step": 262067, "epoch": 3157} {"train_loss": -25.36666488647461, "global_step": 262068, "epoch": 3157} {"train_loss": -25.14208984375, "global_step": 262069, "epoch": 3157} {"train_loss": -25.362470626831055, "global_step": 262070, "epoch": 3157} {"train_loss": -25.051559448242188, "global_step": 262071, "epoch": 3157} {"train_loss": -25.170087814331055, "global_step": 262072, "epoch": 3157} {"train_loss": -25.266101837158203, "global_step": 262073, "epoch": 3157} {"train_loss": -25.00532341003418, "global_step": 262074, "epoch": 3157} {"train_loss": -24.741783142089844, "global_step": 262075, "epoch": 3157} {"train_loss": -25.104894638061523, "global_step": 262076, "epoch": 3157} {"train_loss": -25.128732681274414, "global_step": 262077, "epoch": 3157} {"train_loss": -25.34168815612793, "global_step": 262078, "epoch": 3157} {"train_loss": -25.048038482666016, "global_step": 262079, "epoch": 3157} {"train_loss": -25.31250762939453, "global_step": 262080, "epoch": 3157} {"train_loss": -25.247480392456055, "global_step": 262081, "epoch": 3157} {"train_loss": -24.968246459960938, "global_step": 262082, "epoch": 3157} {"train_loss": -25.159202575683594, "global_step": 262083, "epoch": 3157} {"train_loss": -25.087289810180664, "global_step": 262084, "epoch": 3157} {"train_loss": -25.226810455322266, "global_step": 262085, "epoch": 3157} {"train_loss": -25.118270874023438, "global_step": 262086, "epoch": 3157} {"train_loss": -25.23642921447754, "global_step": 262087, "epoch": 3157} {"train_loss": -25.13636016845703, "global_step": 262088, "epoch": 3157} {"train_loss": -25.618616104125977, "global_step": 262089, "epoch": 3157} {"train_loss": -25.092269897460938, "global_step": 262090, "epoch": 3157} {"train_loss": -25.17838478088379, "global_step": 262091, "epoch": 3157} {"train_loss": -25.115747451782227, "global_step": 262092, "epoch": 3157} {"train_loss": -25.374479293823242, "global_step": 262093, "epoch": 3157} {"train_loss": -25.373218536376953, "global_step": 262094, "epoch": 3157} {"train_loss": -24.9301815032959, "global_step": 262095, "epoch": 3157} {"train_loss": -25.13502311706543, "global_step": 262096, "epoch": 3157} {"train_loss": -25.46195411682129, "global_step": 262097, "epoch": 3157} {"train_loss": -25.134668350219727, "global_step": 262098, "epoch": 3157} {"train_loss": -24.786069869995117, "global_step": 262099, "epoch": 3157} {"train_loss": -25.585922241210938, "global_step": 262100, "epoch": 3157} {"train_loss": -24.981082916259766, "global_step": 262101, "epoch": 3157} {"train_loss": -24.82075309753418, "global_step": 262102, "epoch": 3157} {"train_loss": -25.210485458374023, "global_step": 262103, "epoch": 3157} {"train_loss": -25.255170822143555, "global_step": 262104, "epoch": 3157} {"train_loss": -25.154531478881836, "global_step": 262105, "epoch": 3157} {"train_loss": -24.98101234436035, "global_step": 262106, "epoch": 3157} {"train_loss": -25.44605827331543, "global_step": 262107, "epoch": 3157} {"train_loss": -25.345081329345703, "global_step": 262108, "epoch": 3157} {"train_loss": -25.429845809936523, "global_step": 262109, "epoch": 3157} {"train_loss": -25.33692741394043, "global_step": 262110, "epoch": 3157} {"train_loss": -24.999082565307617, "global_step": 262111, "epoch": 3157} {"train_loss": -24.999013900756836, "global_step": 262112, "epoch": 3157} {"train_loss": -24.89081194314612, "global_step": 262113, "epoch": 3157, "val_loss": 6949748.0} {"train_loss": -24.38421058654785, "global_step": 262114, "epoch": 3158} {"train_loss": -23.5544490814209, "global_step": 262115, "epoch": 3158} {"train_loss": -23.73294448852539, "global_step": 262116, "epoch": 3158} {"train_loss": -25.022563934326172, "global_step": 262117, "epoch": 3158} {"train_loss": -24.644227981567383, "global_step": 262118, "epoch": 3158} {"train_loss": -24.994794845581055, "global_step": 262119, "epoch": 3158} {"train_loss": -25.080846786499023, "global_step": 262120, "epoch": 3158} {"train_loss": -24.969356536865234, "global_step": 262121, "epoch": 3158} {"train_loss": -25.0914249420166, "global_step": 262122, "epoch": 3158} {"train_loss": -24.753376007080078, "global_step": 262123, "epoch": 3158} {"train_loss": -24.775146484375, "global_step": 262124, "epoch": 3158} {"train_loss": -25.150806427001953, "global_step": 262125, "epoch": 3158} {"train_loss": -25.290279388427734, "global_step": 262126, "epoch": 3158} {"train_loss": -25.211027145385742, "global_step": 262127, "epoch": 3158} {"train_loss": -24.873504638671875, "global_step": 262128, "epoch": 3158} {"train_loss": -24.741744995117188, "global_step": 262129, "epoch": 3158} {"train_loss": -25.00726318359375, "global_step": 262130, "epoch": 3158} {"train_loss": -25.012439727783203, "global_step": 262131, "epoch": 3158} {"train_loss": -24.974807739257812, "global_step": 262132, "epoch": 3158} {"train_loss": -25.114572525024414, "global_step": 262133, "epoch": 3158} {"train_loss": -25.278488159179688, "global_step": 262134, "epoch": 3158} {"train_loss": -25.203744888305664, "global_step": 262135, "epoch": 3158} {"train_loss": -25.19589614868164, "global_step": 262136, "epoch": 3158} {"train_loss": -25.201993942260742, "global_step": 262137, "epoch": 3158} {"train_loss": -25.347286224365234, "global_step": 262138, "epoch": 3158} {"train_loss": -25.274168014526367, "global_step": 262139, "epoch": 3158} {"train_loss": -25.334638595581055, "global_step": 262140, "epoch": 3158} {"train_loss": -24.708419799804688, "global_step": 262141, "epoch": 3158} {"train_loss": -25.18243980407715, "global_step": 262142, "epoch": 3158} {"train_loss": -25.04911231994629, "global_step": 262143, "epoch": 3158} {"train_loss": -25.121952056884766, "global_step": 262144, "epoch": 3158} {"train_loss": -25.2506103515625, "global_step": 262145, "epoch": 3158} {"train_loss": -25.144128799438477, "global_step": 262146, "epoch": 3158} {"train_loss": -25.244565963745117, "global_step": 262147, "epoch": 3158} {"train_loss": -25.246540069580078, "global_step": 262148, "epoch": 3158} {"train_loss": -25.158918380737305, "global_step": 262149, "epoch": 3158} {"train_loss": -25.125120162963867, "global_step": 262150, "epoch": 3158} {"train_loss": -25.23811912536621, "global_step": 262151, "epoch": 3158} {"train_loss": -25.257421493530273, "global_step": 262152, "epoch": 3158} {"train_loss": -25.385900497436523, "global_step": 262153, "epoch": 3158} {"train_loss": -25.62112808227539, "global_step": 262154, "epoch": 3158} {"train_loss": -25.122661590576172, "global_step": 262155, "epoch": 3158} {"train_loss": -25.389524459838867, "global_step": 262156, "epoch": 3158} {"train_loss": -25.225452423095703, "global_step": 262157, "epoch": 3158} {"train_loss": -25.387985229492188, "global_step": 262158, "epoch": 3158} {"train_loss": -25.09515380859375, "global_step": 262159, "epoch": 3158} {"train_loss": -25.38848304748535, "global_step": 262160, "epoch": 3158} {"train_loss": -24.8995361328125, "global_step": 262161, "epoch": 3158} {"train_loss": -24.71210479736328, "global_step": 262162, "epoch": 3158} {"train_loss": -25.37223243713379, "global_step": 262163, "epoch": 3158} {"train_loss": -25.341291427612305, "global_step": 262164, "epoch": 3158} {"train_loss": -25.168176651000977, "global_step": 262165, "epoch": 3158} {"train_loss": -24.78790283203125, "global_step": 262166, "epoch": 3158} {"train_loss": -24.863000869750977, "global_step": 262167, "epoch": 3158} {"train_loss": -24.966100692749023, "global_step": 262168, "epoch": 3158} {"train_loss": -24.91499137878418, "global_step": 262169, "epoch": 3158} {"train_loss": -24.66518211364746, "global_step": 262170, "epoch": 3158} {"train_loss": -25.119840621948242, "global_step": 262171, "epoch": 3158} {"train_loss": -25.041397094726562, "global_step": 262172, "epoch": 3158} {"train_loss": -25.189565658569336, "global_step": 262173, "epoch": 3158} {"train_loss": -25.017969131469727, "global_step": 262174, "epoch": 3158} {"train_loss": -25.0709228515625, "global_step": 262175, "epoch": 3158} {"train_loss": -24.59893798828125, "global_step": 262176, "epoch": 3158} {"train_loss": -24.86824607849121, "global_step": 262177, "epoch": 3158} {"train_loss": -24.945600509643555, "global_step": 262178, "epoch": 3158} {"train_loss": -25.295391082763672, "global_step": 262179, "epoch": 3158} {"train_loss": -25.284793853759766, "global_step": 262180, "epoch": 3158} {"train_loss": -25.27320671081543, "global_step": 262181, "epoch": 3158} {"train_loss": -25.036396026611328, "global_step": 262182, "epoch": 3158} {"train_loss": -25.06976890563965, "global_step": 262183, "epoch": 3158} {"train_loss": -24.953577041625977, "global_step": 262184, "epoch": 3158} {"train_loss": -25.318756103515625, "global_step": 262185, "epoch": 3158} {"train_loss": -25.413658142089844, "global_step": 262186, "epoch": 3158} {"train_loss": -25.176984786987305, "global_step": 262187, "epoch": 3158} {"train_loss": -25.002294540405273, "global_step": 262188, "epoch": 3158} {"train_loss": -25.148080825805664, "global_step": 262189, "epoch": 3158} {"train_loss": -25.069629669189453, "global_step": 262190, "epoch": 3158} {"train_loss": -25.593530654907227, "global_step": 262191, "epoch": 3158} {"train_loss": -25.147991180419922, "global_step": 262192, "epoch": 3158} {"train_loss": -25.2724666595459, "global_step": 262193, "epoch": 3158} {"train_loss": -24.921314239501953, "global_step": 262194, "epoch": 3158} {"train_loss": -25.003650665283203, "global_step": 262195, "epoch": 3158} {"train_loss": -25.047665860279498, "global_step": 262196, "epoch": 3158, "val_loss": 6937461.5} {"train_loss": -24.465913772583008, "global_step": 262197, "epoch": 3159} {"train_loss": -24.127506256103516, "global_step": 262198, "epoch": 3159} {"train_loss": -24.96902847290039, "global_step": 262199, "epoch": 3159} {"train_loss": -24.470666885375977, "global_step": 262200, "epoch": 3159} {"train_loss": -24.582176208496094, "global_step": 262201, "epoch": 3159} {"train_loss": -24.86080551147461, "global_step": 262202, "epoch": 3159} {"train_loss": -24.938268661499023, "global_step": 262203, "epoch": 3159} {"train_loss": -24.986791610717773, "global_step": 262204, "epoch": 3159} {"train_loss": -24.657434463500977, "global_step": 262205, "epoch": 3159} {"train_loss": -24.620450973510742, "global_step": 262206, "epoch": 3159} {"train_loss": -25.175622940063477, "global_step": 262207, "epoch": 3159} {"train_loss": -24.38873863220215, "global_step": 262208, "epoch": 3159} {"train_loss": -24.882728576660156, "global_step": 262209, "epoch": 3159} {"train_loss": -25.231679916381836, "global_step": 262210, "epoch": 3159} {"train_loss": -24.63229751586914, "global_step": 262211, "epoch": 3159} {"train_loss": -24.516019821166992, "global_step": 262212, "epoch": 3159} {"train_loss": -24.64438247680664, "global_step": 262213, "epoch": 3159} {"train_loss": -24.789207458496094, "global_step": 262214, "epoch": 3159} {"train_loss": -24.874771118164062, "global_step": 262215, "epoch": 3159} {"train_loss": -24.99897003173828, "global_step": 262216, "epoch": 3159} {"train_loss": -25.157480239868164, "global_step": 262217, "epoch": 3159} {"train_loss": -24.707733154296875, "global_step": 262218, "epoch": 3159} {"train_loss": -25.11539649963379, "global_step": 262219, "epoch": 3159} {"train_loss": -24.760128021240234, "global_step": 262220, "epoch": 3159} {"train_loss": -25.420047760009766, "global_step": 262221, "epoch": 3159} {"train_loss": -25.16627311706543, "global_step": 262222, "epoch": 3159} {"train_loss": -25.42626190185547, "global_step": 262223, "epoch": 3159} {"train_loss": -25.16428565979004, "global_step": 262224, "epoch": 3159} {"train_loss": -25.010391235351562, "global_step": 262225, "epoch": 3159} {"train_loss": -25.244142532348633, "global_step": 262226, "epoch": 3159} {"train_loss": -25.029085159301758, "global_step": 262227, "epoch": 3159} {"train_loss": -25.159072875976562, "global_step": 262228, "epoch": 3159} {"train_loss": -25.308156967163086, "global_step": 262229, "epoch": 3159} {"train_loss": -25.255338668823242, "global_step": 262230, "epoch": 3159} {"train_loss": -25.379446029663086, "global_step": 262231, "epoch": 3159} {"train_loss": -25.446744918823242, "global_step": 262232, "epoch": 3159} {"train_loss": -24.87030601501465, "global_step": 262233, "epoch": 3159} {"train_loss": -25.33201026916504, "global_step": 262234, "epoch": 3159} {"train_loss": -25.102415084838867, "global_step": 262235, "epoch": 3159} {"train_loss": -25.449357986450195, "global_step": 262236, "epoch": 3159} {"train_loss": -25.223941802978516, "global_step": 262237, "epoch": 3159} {"train_loss": -25.092086791992188, "global_step": 262238, "epoch": 3159} {"train_loss": -25.375356674194336, "global_step": 262239, "epoch": 3159} {"train_loss": -25.48434829711914, "global_step": 262240, "epoch": 3159} {"train_loss": -25.48647117614746, "global_step": 262241, "epoch": 3159} {"train_loss": -25.252212524414062, "global_step": 262242, "epoch": 3159} {"train_loss": -25.06119155883789, "global_step": 262243, "epoch": 3159} {"train_loss": -25.331340789794922, "global_step": 262244, "epoch": 3159} {"train_loss": -25.644678115844727, "global_step": 262245, "epoch": 3159} {"train_loss": -24.968976974487305, "global_step": 262246, "epoch": 3159} {"train_loss": -25.327505111694336, "global_step": 262247, "epoch": 3159} {"train_loss": -25.34714126586914, "global_step": 262248, "epoch": 3159} {"train_loss": -25.437833786010742, "global_step": 262249, "epoch": 3159} {"train_loss": -25.479511260986328, "global_step": 262250, "epoch": 3159} {"train_loss": -25.524738311767578, "global_step": 262251, "epoch": 3159} {"train_loss": -25.354782104492188, "global_step": 262252, "epoch": 3159} {"train_loss": -25.632848739624023, "global_step": 262253, "epoch": 3159} {"train_loss": -25.214269638061523, "global_step": 262254, "epoch": 3159} {"train_loss": -25.30878257751465, "global_step": 262255, "epoch": 3159} {"train_loss": -25.140005111694336, "global_step": 262256, "epoch": 3159} {"train_loss": -25.29353904724121, "global_step": 262257, "epoch": 3159} {"train_loss": -25.18851089477539, "global_step": 262258, "epoch": 3159} {"train_loss": -24.960134506225586, "global_step": 262259, "epoch": 3159} {"train_loss": -25.105384826660156, "global_step": 262260, "epoch": 3159} {"train_loss": -25.279203414916992, "global_step": 262261, "epoch": 3159} {"train_loss": -25.157379150390625, "global_step": 262262, "epoch": 3159} {"train_loss": -25.34897232055664, "global_step": 262263, "epoch": 3159} {"train_loss": -24.787357330322266, "global_step": 262264, "epoch": 3159} {"train_loss": -25.177490234375, "global_step": 262265, "epoch": 3159} {"train_loss": -25.095783233642578, "global_step": 262266, "epoch": 3159} {"train_loss": -25.277570724487305, "global_step": 262267, "epoch": 3159} {"train_loss": -25.26643943786621, "global_step": 262268, "epoch": 3159} {"train_loss": -25.105472564697266, "global_step": 262269, "epoch": 3159} {"train_loss": -24.930675506591797, "global_step": 262270, "epoch": 3159} {"train_loss": -25.074193954467773, "global_step": 262271, "epoch": 3159} {"train_loss": -25.528226852416992, "global_step": 262272, "epoch": 3159} {"train_loss": -24.886159896850586, "global_step": 262273, "epoch": 3159} {"train_loss": -24.582765579223633, "global_step": 262274, "epoch": 3159} {"train_loss": -25.161346435546875, "global_step": 262275, "epoch": 3159} {"train_loss": -25.23798942565918, "global_step": 262276, "epoch": 3159} {"train_loss": -24.94437026977539, "global_step": 262277, "epoch": 3159} {"train_loss": -25.460132598876953, "global_step": 262278, "epoch": 3159} {"train_loss": -25.09496886471668, "global_step": 262279, "epoch": 3159, "val_loss": 6847250.0} {"train_loss": -24.54585838317871, "global_step": 262280, "epoch": 3160} {"train_loss": -24.821298599243164, "global_step": 262281, "epoch": 3160} {"train_loss": -25.072607040405273, "global_step": 262282, "epoch": 3160} {"train_loss": -24.934661865234375, "global_step": 262283, "epoch": 3160} {"train_loss": -25.09221649169922, "global_step": 262284, "epoch": 3160} {"train_loss": -25.155502319335938, "global_step": 262285, "epoch": 3160} {"train_loss": -25.160045623779297, "global_step": 262286, "epoch": 3160} {"train_loss": -24.8251895904541, "global_step": 262287, "epoch": 3160} {"train_loss": -24.910011291503906, "global_step": 262288, "epoch": 3160} {"train_loss": -25.301925659179688, "global_step": 262289, "epoch": 3160} {"train_loss": -25.24560546875, "global_step": 262290, "epoch": 3160} {"train_loss": -25.370481491088867, "global_step": 262291, "epoch": 3160} {"train_loss": -24.946935653686523, "global_step": 262292, "epoch": 3160} {"train_loss": -25.115005493164062, "global_step": 262293, "epoch": 3160} {"train_loss": -24.98367691040039, "global_step": 262294, "epoch": 3160} {"train_loss": -25.34096336364746, "global_step": 262295, "epoch": 3160} {"train_loss": -25.41584587097168, "global_step": 262296, "epoch": 3160} {"train_loss": -25.356582641601562, "global_step": 262297, "epoch": 3160} {"train_loss": -25.17864990234375, "global_step": 262298, "epoch": 3160} {"train_loss": -25.372201919555664, "global_step": 262299, "epoch": 3160} {"train_loss": -25.311174392700195, "global_step": 262300, "epoch": 3160} {"train_loss": -25.094274520874023, "global_step": 262301, "epoch": 3160} {"train_loss": -25.26865577697754, "global_step": 262302, "epoch": 3160} {"train_loss": -25.372705459594727, "global_step": 262303, "epoch": 3160} {"train_loss": -25.16822624206543, "global_step": 262304, "epoch": 3160} {"train_loss": -25.189706802368164, "global_step": 262305, "epoch": 3160} {"train_loss": -25.253787994384766, "global_step": 262306, "epoch": 3160} {"train_loss": -25.372190475463867, "global_step": 262307, "epoch": 3160} {"train_loss": -25.473417282104492, "global_step": 262308, "epoch": 3160} {"train_loss": -24.965824127197266, "global_step": 262309, "epoch": 3160} {"train_loss": -25.42887306213379, "global_step": 262310, "epoch": 3160} {"train_loss": -25.16794776916504, "global_step": 262311, "epoch": 3160} {"train_loss": -25.308835983276367, "global_step": 262312, "epoch": 3160} {"train_loss": -24.953500747680664, "global_step": 262313, "epoch": 3160} {"train_loss": -25.332508087158203, "global_step": 262314, "epoch": 3160} {"train_loss": -25.112470626831055, "global_step": 262315, "epoch": 3160} {"train_loss": -25.238405227661133, "global_step": 262316, "epoch": 3160} {"train_loss": -25.391767501831055, "global_step": 262317, "epoch": 3160} {"train_loss": -25.297971725463867, "global_step": 262318, "epoch": 3160} {"train_loss": -25.198881149291992, "global_step": 262319, "epoch": 3160} {"train_loss": -25.201993942260742, "global_step": 262320, "epoch": 3160} {"train_loss": -25.09349822998047, "global_step": 262321, "epoch": 3160} {"train_loss": -25.336589813232422, "global_step": 262322, "epoch": 3160} {"train_loss": -25.405548095703125, "global_step": 262323, "epoch": 3160} {"train_loss": -25.404741287231445, "global_step": 262324, "epoch": 3160} {"train_loss": -25.487104415893555, "global_step": 262325, "epoch": 3160} {"train_loss": -25.17181968688965, "global_step": 262326, "epoch": 3160} {"train_loss": -25.325136184692383, "global_step": 262327, "epoch": 3160} {"train_loss": -25.095104217529297, "global_step": 262328, "epoch": 3160} {"train_loss": -25.187026977539062, "global_step": 262329, "epoch": 3160} {"train_loss": -25.620386123657227, "global_step": 262330, "epoch": 3160} {"train_loss": -25.620746612548828, "global_step": 262331, "epoch": 3160} {"train_loss": -25.274442672729492, "global_step": 262332, "epoch": 3160} {"train_loss": -25.565200805664062, "global_step": 262333, "epoch": 3160} {"train_loss": -25.384857177734375, "global_step": 262334, "epoch": 3160} {"train_loss": -24.762805938720703, "global_step": 262335, "epoch": 3160} {"train_loss": -24.711286544799805, "global_step": 262336, "epoch": 3160} {"train_loss": -24.952512741088867, "global_step": 262337, "epoch": 3160} {"train_loss": -25.228158950805664, "global_step": 262338, "epoch": 3160} {"train_loss": -25.140832901000977, "global_step": 262339, "epoch": 3160} {"train_loss": -25.228105545043945, "global_step": 262340, "epoch": 3160} {"train_loss": -25.300790786743164, "global_step": 262341, "epoch": 3160} {"train_loss": -24.6392879486084, "global_step": 262342, "epoch": 3160} {"train_loss": -24.809553146362305, "global_step": 262343, "epoch": 3160} {"train_loss": -25.172653198242188, "global_step": 262344, "epoch": 3160} {"train_loss": -24.888320922851562, "global_step": 262345, "epoch": 3160} {"train_loss": -24.916759490966797, "global_step": 262346, "epoch": 3160} {"train_loss": -25.384592056274414, "global_step": 262347, "epoch": 3160} {"train_loss": -25.253116607666016, "global_step": 262348, "epoch": 3160} {"train_loss": -25.01907730102539, "global_step": 262349, "epoch": 3160} {"train_loss": -25.108081817626953, "global_step": 262350, "epoch": 3160} {"train_loss": -25.099409103393555, "global_step": 262351, "epoch": 3160} {"train_loss": -25.498638153076172, "global_step": 262352, "epoch": 3160} {"train_loss": -25.09518814086914, "global_step": 262353, "epoch": 3160} {"train_loss": -25.31633949279785, "global_step": 262354, "epoch": 3160} {"train_loss": -25.16434669494629, "global_step": 262355, "epoch": 3160} {"train_loss": -25.094491958618164, "global_step": 262356, "epoch": 3160} {"train_loss": -25.143634796142578, "global_step": 262357, "epoch": 3160} {"train_loss": -25.307674407958984, "global_step": 262358, "epoch": 3160} {"train_loss": -25.37894630432129, "global_step": 262359, "epoch": 3160} {"train_loss": -25.243253707885742, "global_step": 262360, "epoch": 3160} {"train_loss": -25.15934181213379, "global_step": 262361, "epoch": 3160} {"train_loss": -25.186505076396895, "global_step": 262362, "epoch": 3160, "val_loss": 6924055.0} {"train_loss": -24.27301597595215, "global_step": 262363, "epoch": 3161} {"train_loss": -24.745859146118164, "global_step": 262364, "epoch": 3161} {"train_loss": -24.28889274597168, "global_step": 262365, "epoch": 3161} {"train_loss": -24.702207565307617, "global_step": 262366, "epoch": 3161} {"train_loss": -23.79970359802246, "global_step": 262367, "epoch": 3161} {"train_loss": -24.918331146240234, "global_step": 262368, "epoch": 3161} {"train_loss": -24.86859130859375, "global_step": 262369, "epoch": 3161} {"train_loss": -24.689542770385742, "global_step": 262370, "epoch": 3161} {"train_loss": -24.840606689453125, "global_step": 262371, "epoch": 3161} {"train_loss": -24.83279800415039, "global_step": 262372, "epoch": 3161} {"train_loss": -24.9027099609375, "global_step": 262373, "epoch": 3161} {"train_loss": -24.664926528930664, "global_step": 262374, "epoch": 3161} {"train_loss": -24.877782821655273, "global_step": 262375, "epoch": 3161} {"train_loss": -24.955495834350586, "global_step": 262376, "epoch": 3161} {"train_loss": -25.131853103637695, "global_step": 262377, "epoch": 3161} {"train_loss": -24.84840202331543, "global_step": 262378, "epoch": 3161} {"train_loss": -24.991058349609375, "global_step": 262379, "epoch": 3161} {"train_loss": -24.696435928344727, "global_step": 262380, "epoch": 3161} {"train_loss": -24.9998779296875, "global_step": 262381, "epoch": 3161} {"train_loss": -24.988895416259766, "global_step": 262382, "epoch": 3161} {"train_loss": -24.994304656982422, "global_step": 262383, "epoch": 3161} {"train_loss": -24.998666763305664, "global_step": 262384, "epoch": 3161} {"train_loss": -24.918567657470703, "global_step": 262385, "epoch": 3161} {"train_loss": -24.931425094604492, "global_step": 262386, "epoch": 3161} {"train_loss": -25.177093505859375, "global_step": 262387, "epoch": 3161} {"train_loss": -25.05622100830078, "global_step": 262388, "epoch": 3161} {"train_loss": -25.481069564819336, "global_step": 262389, "epoch": 3161} {"train_loss": -25.10577964782715, "global_step": 262390, "epoch": 3161} {"train_loss": -25.181474685668945, "global_step": 262391, "epoch": 3161} {"train_loss": -25.24371910095215, "global_step": 262392, "epoch": 3161} {"train_loss": -25.382572174072266, "global_step": 262393, "epoch": 3161} {"train_loss": -25.491348266601562, "global_step": 262394, "epoch": 3161} {"train_loss": -24.925033569335938, "global_step": 262395, "epoch": 3161} {"train_loss": -25.179201126098633, "global_step": 262396, "epoch": 3161} {"train_loss": -25.12409019470215, "global_step": 262397, "epoch": 3161} {"train_loss": -25.166746139526367, "global_step": 262398, "epoch": 3161} {"train_loss": -24.951017379760742, "global_step": 262399, "epoch": 3161} {"train_loss": -25.267454147338867, "global_step": 262400, "epoch": 3161} {"train_loss": -25.167251586914062, "global_step": 262401, "epoch": 3161} {"train_loss": -25.4007625579834, "global_step": 262402, "epoch": 3161} {"train_loss": -25.33198356628418, "global_step": 262403, "epoch": 3161} {"train_loss": -25.635900497436523, "global_step": 262404, "epoch": 3161} {"train_loss": -25.151342391967773, "global_step": 262405, "epoch": 3161} {"train_loss": -25.099262237548828, "global_step": 262406, "epoch": 3161} {"train_loss": -25.310007095336914, "global_step": 262407, "epoch": 3161} {"train_loss": -25.397125244140625, "global_step": 262408, "epoch": 3161} {"train_loss": -25.292221069335938, "global_step": 262409, "epoch": 3161} {"train_loss": -25.57508659362793, "global_step": 262410, "epoch": 3161} {"train_loss": -25.98748779296875, "global_step": 262411, "epoch": 3161} {"train_loss": -25.17451286315918, "global_step": 262412, "epoch": 3161} {"train_loss": -25.4611759185791, "global_step": 262413, "epoch": 3161} {"train_loss": -25.317405700683594, "global_step": 262414, "epoch": 3161} {"train_loss": -24.904394149780273, "global_step": 262415, "epoch": 3161} {"train_loss": -25.05301284790039, "global_step": 262416, "epoch": 3161} {"train_loss": -25.748411178588867, "global_step": 262417, "epoch": 3161} {"train_loss": -25.17410659790039, "global_step": 262418, "epoch": 3161} {"train_loss": -24.797788619995117, "global_step": 262419, "epoch": 3161} {"train_loss": -25.080907821655273, "global_step": 262420, "epoch": 3161} {"train_loss": -25.10902214050293, "global_step": 262421, "epoch": 3161} {"train_loss": -24.693662643432617, "global_step": 262422, "epoch": 3161} {"train_loss": -24.783279418945312, "global_step": 262423, "epoch": 3161} {"train_loss": -24.602794647216797, "global_step": 262424, "epoch": 3161} {"train_loss": -25.288471221923828, "global_step": 262425, "epoch": 3161} {"train_loss": -25.09857177734375, "global_step": 262426, "epoch": 3161} {"train_loss": -24.993261337280273, "global_step": 262427, "epoch": 3161} {"train_loss": -24.825103759765625, "global_step": 262428, "epoch": 3161} {"train_loss": -25.167638778686523, "global_step": 262429, "epoch": 3161} {"train_loss": -25.104698181152344, "global_step": 262430, "epoch": 3161} {"train_loss": -25.488378524780273, "global_step": 262431, "epoch": 3161} {"train_loss": -25.206541061401367, "global_step": 262432, "epoch": 3161} {"train_loss": -25.08848762512207, "global_step": 262433, "epoch": 3161} {"train_loss": -25.02671241760254, "global_step": 262434, "epoch": 3161} {"train_loss": -24.910024642944336, "global_step": 262435, "epoch": 3161} {"train_loss": -24.860401153564453, "global_step": 262436, "epoch": 3161} {"train_loss": -25.286359786987305, "global_step": 262437, "epoch": 3161} {"train_loss": -25.357690811157227, "global_step": 262438, "epoch": 3161} {"train_loss": -25.4637451171875, "global_step": 262439, "epoch": 3161} {"train_loss": -25.6210880279541, "global_step": 262440, "epoch": 3161} {"train_loss": -25.2309627532959, "global_step": 262441, "epoch": 3161} {"train_loss": -25.412458419799805, "global_step": 262442, "epoch": 3161} {"train_loss": -25.2666072845459, "global_step": 262443, "epoch": 3161} {"train_loss": -25.359046936035156, "global_step": 262444, "epoch": 3161} {"train_loss": -25.08210421183023, "global_step": 262445, "epoch": 3161, "val_loss": 6876165.0} {"train_loss": -24.86894989013672, "global_step": 262446, "epoch": 3162} {"train_loss": -24.949172973632812, "global_step": 262447, "epoch": 3162} {"train_loss": -24.698589324951172, "global_step": 262448, "epoch": 3162} {"train_loss": -25.012575149536133, "global_step": 262449, "epoch": 3162} {"train_loss": -24.974885940551758, "global_step": 262450, "epoch": 3162} {"train_loss": -24.775400161743164, "global_step": 262451, "epoch": 3162} {"train_loss": -25.305912017822266, "global_step": 262452, "epoch": 3162} {"train_loss": -24.918411254882812, "global_step": 262453, "epoch": 3162} {"train_loss": -25.390871047973633, "global_step": 262454, "epoch": 3162} {"train_loss": -24.834142684936523, "global_step": 262455, "epoch": 3162} {"train_loss": -25.160903930664062, "global_step": 262456, "epoch": 3162} {"train_loss": -24.74332618713379, "global_step": 262457, "epoch": 3162} {"train_loss": -25.054296493530273, "global_step": 262458, "epoch": 3162} {"train_loss": -24.817642211914062, "global_step": 262459, "epoch": 3162} {"train_loss": -24.89570426940918, "global_step": 262460, "epoch": 3162} {"train_loss": -25.434600830078125, "global_step": 262461, "epoch": 3162} {"train_loss": -25.200809478759766, "global_step": 262462, "epoch": 3162} {"train_loss": -25.2857608795166, "global_step": 262463, "epoch": 3162} {"train_loss": -25.247591018676758, "global_step": 262464, "epoch": 3162} {"train_loss": -25.265270233154297, "global_step": 262465, "epoch": 3162} {"train_loss": -25.21131706237793, "global_step": 262466, "epoch": 3162} {"train_loss": -25.00715446472168, "global_step": 262467, "epoch": 3162} {"train_loss": -25.168792724609375, "global_step": 262468, "epoch": 3162} {"train_loss": -25.16194725036621, "global_step": 262469, "epoch": 3162} {"train_loss": -25.0237979888916, "global_step": 262470, "epoch": 3162} {"train_loss": -25.378265380859375, "global_step": 262471, "epoch": 3162} {"train_loss": -24.920745849609375, "global_step": 262472, "epoch": 3162} {"train_loss": -25.333478927612305, "global_step": 262473, "epoch": 3162} {"train_loss": -24.93263053894043, "global_step": 262474, "epoch": 3162} {"train_loss": -25.061038970947266, "global_step": 262475, "epoch": 3162} {"train_loss": -25.442371368408203, "global_step": 262476, "epoch": 3162} {"train_loss": -25.213184356689453, "global_step": 262477, "epoch": 3162} {"train_loss": -25.40365982055664, "global_step": 262478, "epoch": 3162} {"train_loss": -25.520099639892578, "global_step": 262479, "epoch": 3162} {"train_loss": -24.831501007080078, "global_step": 262480, "epoch": 3162} {"train_loss": -25.40976905822754, "global_step": 262481, "epoch": 3162} {"train_loss": -25.11510467529297, "global_step": 262482, "epoch": 3162} {"train_loss": -24.799823760986328, "global_step": 262483, "epoch": 3162} {"train_loss": -25.369260787963867, "global_step": 262484, "epoch": 3162} {"train_loss": -25.774988174438477, "global_step": 262485, "epoch": 3162} {"train_loss": -25.27959442138672, "global_step": 262486, "epoch": 3162} {"train_loss": -25.29440689086914, "global_step": 262487, "epoch": 3162} {"train_loss": -25.287038803100586, "global_step": 262488, "epoch": 3162} {"train_loss": -25.164133071899414, "global_step": 262489, "epoch": 3162} {"train_loss": -25.08517074584961, "global_step": 262490, "epoch": 3162} {"train_loss": -25.276540756225586, "global_step": 262491, "epoch": 3162} {"train_loss": -25.195486068725586, "global_step": 262492, "epoch": 3162} {"train_loss": -25.2304630279541, "global_step": 262493, "epoch": 3162} {"train_loss": -25.251638412475586, "global_step": 262494, "epoch": 3162} {"train_loss": -25.169511795043945, "global_step": 262495, "epoch": 3162} {"train_loss": -24.87628173828125, "global_step": 262496, "epoch": 3162} {"train_loss": -25.327045440673828, "global_step": 262497, "epoch": 3162} {"train_loss": -25.26759147644043, "global_step": 262498, "epoch": 3162} {"train_loss": -25.256671905517578, "global_step": 262499, "epoch": 3162} {"train_loss": -25.17999839782715, "global_step": 262500, "epoch": 3162} {"train_loss": -24.935922622680664, "global_step": 262501, "epoch": 3162} {"train_loss": -25.40009117126465, "global_step": 262502, "epoch": 3162} {"train_loss": -25.246509552001953, "global_step": 262503, "epoch": 3162} {"train_loss": -24.991907119750977, "global_step": 262504, "epoch": 3162} {"train_loss": -25.239744186401367, "global_step": 262505, "epoch": 3162} {"train_loss": -25.323060989379883, "global_step": 262506, "epoch": 3162} {"train_loss": -25.068750381469727, "global_step": 262507, "epoch": 3162} {"train_loss": -25.280710220336914, "global_step": 262508, "epoch": 3162} {"train_loss": -24.96979331970215, "global_step": 262509, "epoch": 3162} {"train_loss": -25.264760971069336, "global_step": 262510, "epoch": 3162} {"train_loss": -25.33526039123535, "global_step": 262511, "epoch": 3162} {"train_loss": -25.153432846069336, "global_step": 262512, "epoch": 3162} {"train_loss": -25.21038246154785, "global_step": 262513, "epoch": 3162} {"train_loss": -25.21467399597168, "global_step": 262514, "epoch": 3162} {"train_loss": -25.32547378540039, "global_step": 262515, "epoch": 3162} {"train_loss": -25.547958374023438, "global_step": 262516, "epoch": 3162} {"train_loss": -25.25801658630371, "global_step": 262517, "epoch": 3162} {"train_loss": -24.919479370117188, "global_step": 262518, "epoch": 3162} {"train_loss": -25.402769088745117, "global_step": 262519, "epoch": 3162} {"train_loss": -24.92654800415039, "global_step": 262520, "epoch": 3162} {"train_loss": -25.090450286865234, "global_step": 262521, "epoch": 3162} {"train_loss": -24.982080459594727, "global_step": 262522, "epoch": 3162} {"train_loss": -25.051889419555664, "global_step": 262523, "epoch": 3162} {"train_loss": -25.1788272857666, "global_step": 262524, "epoch": 3162} {"train_loss": -25.35167694091797, "global_step": 262525, "epoch": 3162} {"train_loss": -24.85310935974121, "global_step": 262526, "epoch": 3162} {"train_loss": -25.20492935180664, "global_step": 262527, "epoch": 3162} {"train_loss": -25.154134704406005, "global_step": 262528, "epoch": 3162, "val_loss": 6965113.0} {"train_loss": -24.904586791992188, "global_step": 262529, "epoch": 3163} {"train_loss": -24.93678855895996, "global_step": 262530, "epoch": 3163} {"train_loss": -24.97771644592285, "global_step": 262531, "epoch": 3163} {"train_loss": -25.320863723754883, "global_step": 262532, "epoch": 3163} {"train_loss": -25.228546142578125, "global_step": 262533, "epoch": 3163} {"train_loss": -24.874441146850586, "global_step": 262534, "epoch": 3163} {"train_loss": -25.405588150024414, "global_step": 262535, "epoch": 3163} {"train_loss": -24.806949615478516, "global_step": 262536, "epoch": 3163} {"train_loss": -24.972633361816406, "global_step": 262537, "epoch": 3163} {"train_loss": -25.236236572265625, "global_step": 262538, "epoch": 3163} {"train_loss": -24.725341796875, "global_step": 262539, "epoch": 3163} {"train_loss": -25.21079444885254, "global_step": 262540, "epoch": 3163} {"train_loss": -25.143798828125, "global_step": 262541, "epoch": 3163} {"train_loss": -24.88006019592285, "global_step": 262542, "epoch": 3163} {"train_loss": -25.2590274810791, "global_step": 262543, "epoch": 3163} {"train_loss": -25.421979904174805, "global_step": 262544, "epoch": 3163} {"train_loss": -24.957412719726562, "global_step": 262545, "epoch": 3163} {"train_loss": -24.907011032104492, "global_step": 262546, "epoch": 3163} {"train_loss": -24.924962997436523, "global_step": 262547, "epoch": 3163} {"train_loss": -25.2475528717041, "global_step": 262548, "epoch": 3163} {"train_loss": -24.698705673217773, "global_step": 262549, "epoch": 3163} {"train_loss": -24.610889434814453, "global_step": 262550, "epoch": 3163} {"train_loss": -25.1069278717041, "global_step": 262551, "epoch": 3163} {"train_loss": -24.901687622070312, "global_step": 262552, "epoch": 3163} {"train_loss": -24.78451919555664, "global_step": 262553, "epoch": 3163} {"train_loss": -24.84341049194336, "global_step": 262554, "epoch": 3163} {"train_loss": -24.863943099975586, "global_step": 262555, "epoch": 3163} {"train_loss": -24.7860164642334, "global_step": 262556, "epoch": 3163} {"train_loss": -25.189640045166016, "global_step": 262557, "epoch": 3163} {"train_loss": -25.145017623901367, "global_step": 262558, "epoch": 3163} {"train_loss": -24.935117721557617, "global_step": 262559, "epoch": 3163} {"train_loss": -25.29722785949707, "global_step": 262560, "epoch": 3163} {"train_loss": -25.20515251159668, "global_step": 262561, "epoch": 3163} {"train_loss": -25.00481414794922, "global_step": 262562, "epoch": 3163} {"train_loss": -25.08304786682129, "global_step": 262563, "epoch": 3163} {"train_loss": -25.288320541381836, "global_step": 262564, "epoch": 3163} {"train_loss": -25.21205711364746, "global_step": 262565, "epoch": 3163} {"train_loss": -25.266681671142578, "global_step": 262566, "epoch": 3163} {"train_loss": -25.1019344329834, "global_step": 262567, "epoch": 3163} {"train_loss": -25.417598724365234, "global_step": 262568, "epoch": 3163} {"train_loss": -24.89565086364746, "global_step": 262569, "epoch": 3163} {"train_loss": -25.195087432861328, "global_step": 262570, "epoch": 3163} {"train_loss": -25.134206771850586, "global_step": 262571, "epoch": 3163} {"train_loss": -25.02865982055664, "global_step": 262572, "epoch": 3163} {"train_loss": -25.256567001342773, "global_step": 262573, "epoch": 3163} {"train_loss": -25.121963500976562, "global_step": 262574, "epoch": 3163} {"train_loss": -25.3231143951416, "global_step": 262575, "epoch": 3163} {"train_loss": -25.056041717529297, "global_step": 262576, "epoch": 3163} {"train_loss": -25.147253036499023, "global_step": 262577, "epoch": 3163} {"train_loss": -25.003713607788086, "global_step": 262578, "epoch": 3163} {"train_loss": -25.21197509765625, "global_step": 262579, "epoch": 3163} {"train_loss": -25.158061981201172, "global_step": 262580, "epoch": 3163} {"train_loss": -25.759933471679688, "global_step": 262581, "epoch": 3163} {"train_loss": -25.307300567626953, "global_step": 262582, "epoch": 3163} {"train_loss": -25.217010498046875, "global_step": 262583, "epoch": 3163} {"train_loss": -25.053081512451172, "global_step": 262584, "epoch": 3163} {"train_loss": -25.189619064331055, "global_step": 262585, "epoch": 3163} {"train_loss": -25.579633712768555, "global_step": 262586, "epoch": 3163} {"train_loss": -25.486482620239258, "global_step": 262587, "epoch": 3163} {"train_loss": -25.024354934692383, "global_step": 262588, "epoch": 3163} {"train_loss": -25.651172637939453, "global_step": 262589, "epoch": 3163} {"train_loss": -25.274648666381836, "global_step": 262590, "epoch": 3163} {"train_loss": -25.33842658996582, "global_step": 262591, "epoch": 3163} {"train_loss": -25.498889923095703, "global_step": 262592, "epoch": 3163} {"train_loss": -25.338972091674805, "global_step": 262593, "epoch": 3163} {"train_loss": -24.957015991210938, "global_step": 262594, "epoch": 3163} {"train_loss": -25.261585235595703, "global_step": 262595, "epoch": 3163} {"train_loss": -25.35605812072754, "global_step": 262596, "epoch": 3163} {"train_loss": -25.471832275390625, "global_step": 262597, "epoch": 3163} {"train_loss": -24.923879623413086, "global_step": 262598, "epoch": 3163} {"train_loss": -24.962305068969727, "global_step": 262599, "epoch": 3163} {"train_loss": -24.800180435180664, "global_step": 262600, "epoch": 3163} {"train_loss": -25.088180541992188, "global_step": 262601, "epoch": 3163} {"train_loss": -25.000120162963867, "global_step": 262602, "epoch": 3163} {"train_loss": -25.41179656982422, "global_step": 262603, "epoch": 3163} {"train_loss": -25.64849281311035, "global_step": 262604, "epoch": 3163} {"train_loss": -25.511320114135742, "global_step": 262605, "epoch": 3163} {"train_loss": -25.127222061157227, "global_step": 262606, "epoch": 3163} {"train_loss": -25.45721435546875, "global_step": 262607, "epoch": 3163} {"train_loss": -25.110149383544922, "global_step": 262608, "epoch": 3163} {"train_loss": -25.68741226196289, "global_step": 262609, "epoch": 3163} {"train_loss": -24.95859718322754, "global_step": 262610, "epoch": 3163} {"train_loss": -25.153345843395556, "global_step": 262611, "epoch": 3163, "val_loss": 6907329.5} {"train_loss": -23.848257064819336, "global_step": 262612, "epoch": 3164} {"train_loss": -24.65750503540039, "global_step": 262613, "epoch": 3164} {"train_loss": -24.695632934570312, "global_step": 262614, "epoch": 3164} {"train_loss": -24.399494171142578, "global_step": 262615, "epoch": 3164} {"train_loss": -24.7757625579834, "global_step": 262616, "epoch": 3164} {"train_loss": -24.79722023010254, "global_step": 262617, "epoch": 3164} {"train_loss": -24.54924774169922, "global_step": 262618, "epoch": 3164} {"train_loss": -24.711271286010742, "global_step": 262619, "epoch": 3164} {"train_loss": -24.669553756713867, "global_step": 262620, "epoch": 3164} {"train_loss": -24.836444854736328, "global_step": 262621, "epoch": 3164} {"train_loss": -24.63910484313965, "global_step": 262622, "epoch": 3164} {"train_loss": -25.074995040893555, "global_step": 262623, "epoch": 3164} {"train_loss": -24.77223014831543, "global_step": 262624, "epoch": 3164} {"train_loss": -25.055965423583984, "global_step": 262625, "epoch": 3164} {"train_loss": -24.928075790405273, "global_step": 262626, "epoch": 3164} {"train_loss": -24.7432861328125, "global_step": 262627, "epoch": 3164} {"train_loss": -24.67780876159668, "global_step": 262628, "epoch": 3164} {"train_loss": -24.761930465698242, "global_step": 262629, "epoch": 3164} {"train_loss": -25.082616806030273, "global_step": 262630, "epoch": 3164} {"train_loss": -25.073617935180664, "global_step": 262631, "epoch": 3164} {"train_loss": -25.303619384765625, "global_step": 262632, "epoch": 3164} {"train_loss": -25.019620895385742, "global_step": 262633, "epoch": 3164} {"train_loss": -25.009525299072266, "global_step": 262634, "epoch": 3164} {"train_loss": -25.102764129638672, "global_step": 262635, "epoch": 3164} {"train_loss": -24.840593338012695, "global_step": 262636, "epoch": 3164} {"train_loss": -24.99704933166504, "global_step": 262637, "epoch": 3164} {"train_loss": -25.241878509521484, "global_step": 262638, "epoch": 3164} {"train_loss": -24.938573837280273, "global_step": 262639, "epoch": 3164} {"train_loss": -25.138750076293945, "global_step": 262640, "epoch": 3164} {"train_loss": -24.693571090698242, "global_step": 262641, "epoch": 3164} {"train_loss": -25.190570831298828, "global_step": 262642, "epoch": 3164} {"train_loss": -25.043243408203125, "global_step": 262643, "epoch": 3164} {"train_loss": -25.213224411010742, "global_step": 262644, "epoch": 3164} {"train_loss": -25.249296188354492, "global_step": 262645, "epoch": 3164} {"train_loss": -24.72257423400879, "global_step": 262646, "epoch": 3164} {"train_loss": -25.224512100219727, "global_step": 262647, "epoch": 3164} {"train_loss": -25.188552856445312, "global_step": 262648, "epoch": 3164} {"train_loss": -25.35794448852539, "global_step": 262649, "epoch": 3164} {"train_loss": -25.022903442382812, "global_step": 262650, "epoch": 3164} {"train_loss": -25.377302169799805, "global_step": 262651, "epoch": 3164} {"train_loss": -25.158363342285156, "global_step": 262652, "epoch": 3164} {"train_loss": -25.192855834960938, "global_step": 262653, "epoch": 3164} {"train_loss": -25.452199935913086, "global_step": 262654, "epoch": 3164} {"train_loss": -25.793964385986328, "global_step": 262655, "epoch": 3164} {"train_loss": -25.4815616607666, "global_step": 262656, "epoch": 3164} {"train_loss": -25.391294479370117, "global_step": 262657, "epoch": 3164} {"train_loss": -25.33619499206543, "global_step": 262658, "epoch": 3164} {"train_loss": -25.108427047729492, "global_step": 262659, "epoch": 3164} {"train_loss": -25.419111251831055, "global_step": 262660, "epoch": 3164} {"train_loss": -25.175399780273438, "global_step": 262661, "epoch": 3164} {"train_loss": -25.10069465637207, "global_step": 262662, "epoch": 3164} {"train_loss": -25.394149780273438, "global_step": 262663, "epoch": 3164} {"train_loss": -25.45353889465332, "global_step": 262664, "epoch": 3164} {"train_loss": -24.9091854095459, "global_step": 262665, "epoch": 3164} {"train_loss": -25.11758804321289, "global_step": 262666, "epoch": 3164} {"train_loss": -25.288740158081055, "global_step": 262667, "epoch": 3164} {"train_loss": -25.081174850463867, "global_step": 262668, "epoch": 3164} {"train_loss": -24.873769760131836, "global_step": 262669, "epoch": 3164} {"train_loss": -25.186277389526367, "global_step": 262670, "epoch": 3164} {"train_loss": -25.04571533203125, "global_step": 262671, "epoch": 3164} {"train_loss": -24.695283889770508, "global_step": 262672, "epoch": 3164} {"train_loss": -24.3811092376709, "global_step": 262673, "epoch": 3164} {"train_loss": -24.462602615356445, "global_step": 262674, "epoch": 3164} {"train_loss": -24.90236473083496, "global_step": 262675, "epoch": 3164} {"train_loss": -24.629995346069336, "global_step": 262676, "epoch": 3164} {"train_loss": -25.236103057861328, "global_step": 262677, "epoch": 3164} {"train_loss": -24.987201690673828, "global_step": 262678, "epoch": 3164} {"train_loss": -25.131017684936523, "global_step": 262679, "epoch": 3164} {"train_loss": -25.140615463256836, "global_step": 262680, "epoch": 3164} {"train_loss": -25.04120445251465, "global_step": 262681, "epoch": 3164} {"train_loss": -25.063528060913086, "global_step": 262682, "epoch": 3164} {"train_loss": -25.660327911376953, "global_step": 262683, "epoch": 3164} {"train_loss": -25.099180221557617, "global_step": 262684, "epoch": 3164} {"train_loss": -25.27130699157715, "global_step": 262685, "epoch": 3164} {"train_loss": -25.558008193969727, "global_step": 262686, "epoch": 3164} {"train_loss": -25.18064308166504, "global_step": 262687, "epoch": 3164} {"train_loss": -25.59873390197754, "global_step": 262688, "epoch": 3164} {"train_loss": -25.284374237060547, "global_step": 262689, "epoch": 3164} {"train_loss": -25.192075729370117, "global_step": 262690, "epoch": 3164} {"train_loss": -25.447229385375977, "global_step": 262691, "epoch": 3164} {"train_loss": -25.13374137878418, "global_step": 262692, "epoch": 3164} {"train_loss": -24.934024810791016, "global_step": 262693, "epoch": 3164} {"train_loss": -25.04802975022649, "global_step": 262694, "epoch": 3164, "val_loss": 7038459.5} {"train_loss": -24.915143966674805, "global_step": 262695, "epoch": 3165} {"train_loss": -25.40288734436035, "global_step": 262696, "epoch": 3165} {"train_loss": -24.820484161376953, "global_step": 262697, "epoch": 3165} {"train_loss": -25.260345458984375, "global_step": 262698, "epoch": 3165} {"train_loss": -25.046710968017578, "global_step": 262699, "epoch": 3165} {"train_loss": -24.668794631958008, "global_step": 262700, "epoch": 3165} {"train_loss": -25.169456481933594, "global_step": 262701, "epoch": 3165} {"train_loss": -25.083295822143555, "global_step": 262702, "epoch": 3165} {"train_loss": -25.13883399963379, "global_step": 262703, "epoch": 3165} {"train_loss": -25.251861572265625, "global_step": 262704, "epoch": 3165} {"train_loss": -25.139699935913086, "global_step": 262705, "epoch": 3165} {"train_loss": -25.379316329956055, "global_step": 262706, "epoch": 3165} {"train_loss": -25.2595272064209, "global_step": 262707, "epoch": 3165} {"train_loss": -25.294187545776367, "global_step": 262708, "epoch": 3165} {"train_loss": -25.39438819885254, "global_step": 262709, "epoch": 3165} {"train_loss": -25.215078353881836, "global_step": 262710, "epoch": 3165} {"train_loss": -25.250768661499023, "global_step": 262711, "epoch": 3165} {"train_loss": -25.340490341186523, "global_step": 262712, "epoch": 3165} {"train_loss": -25.206083297729492, "global_step": 262713, "epoch": 3165} {"train_loss": -24.639328002929688, "global_step": 262714, "epoch": 3165} {"train_loss": -24.926223754882812, "global_step": 262715, "epoch": 3165} {"train_loss": -25.063745498657227, "global_step": 262716, "epoch": 3165} {"train_loss": -25.09854507446289, "global_step": 262717, "epoch": 3165} {"train_loss": -24.9876708984375, "global_step": 262718, "epoch": 3165} {"train_loss": -25.18900489807129, "global_step": 262719, "epoch": 3165} {"train_loss": -24.963348388671875, "global_step": 262720, "epoch": 3165} {"train_loss": -25.328474044799805, "global_step": 262721, "epoch": 3165} {"train_loss": -25.20253562927246, "global_step": 262722, "epoch": 3165} {"train_loss": -25.115835189819336, "global_step": 262723, "epoch": 3165} {"train_loss": -25.38327980041504, "global_step": 262724, "epoch": 3165} {"train_loss": -24.989187240600586, "global_step": 262725, "epoch": 3165} {"train_loss": -25.40180015563965, "global_step": 262726, "epoch": 3165} {"train_loss": -25.30280113220215, "global_step": 262727, "epoch": 3165} {"train_loss": -25.143627166748047, "global_step": 262728, "epoch": 3165} {"train_loss": -25.15130615234375, "global_step": 262729, "epoch": 3165} {"train_loss": -25.21392059326172, "global_step": 262730, "epoch": 3165} {"train_loss": -25.175241470336914, "global_step": 262731, "epoch": 3165} {"train_loss": -25.170957565307617, "global_step": 262732, "epoch": 3165} {"train_loss": -25.16694450378418, "global_step": 262733, "epoch": 3165} {"train_loss": -25.50690269470215, "global_step": 262734, "epoch": 3165} {"train_loss": -25.134552001953125, "global_step": 262735, "epoch": 3165} {"train_loss": -25.01829719543457, "global_step": 262736, "epoch": 3165} {"train_loss": -24.799264907836914, "global_step": 262737, "epoch": 3165} {"train_loss": -25.271495819091797, "global_step": 262738, "epoch": 3165} {"train_loss": -25.325660705566406, "global_step": 262739, "epoch": 3165} {"train_loss": -25.055753707885742, "global_step": 262740, "epoch": 3165} {"train_loss": -25.253751754760742, "global_step": 262741, "epoch": 3165} {"train_loss": -24.924747467041016, "global_step": 262742, "epoch": 3165} {"train_loss": -25.412126541137695, "global_step": 262743, "epoch": 3165} {"train_loss": -25.51987075805664, "global_step": 262744, "epoch": 3165} {"train_loss": -25.28749656677246, "global_step": 262745, "epoch": 3165} {"train_loss": -25.145898818969727, "global_step": 262746, "epoch": 3165} {"train_loss": -25.757471084594727, "global_step": 262747, "epoch": 3165} {"train_loss": -25.3670597076416, "global_step": 262748, "epoch": 3165} {"train_loss": -25.115543365478516, "global_step": 262749, "epoch": 3165} {"train_loss": -25.099573135375977, "global_step": 262750, "epoch": 3165} {"train_loss": -25.228912353515625, "global_step": 262751, "epoch": 3165} {"train_loss": -25.04842758178711, "global_step": 262752, "epoch": 3165} {"train_loss": -25.14216423034668, "global_step": 262753, "epoch": 3165} {"train_loss": -25.186683654785156, "global_step": 262754, "epoch": 3165} {"train_loss": -25.095232009887695, "global_step": 262755, "epoch": 3165} {"train_loss": -25.423276901245117, "global_step": 262756, "epoch": 3165} {"train_loss": -25.290481567382812, "global_step": 262757, "epoch": 3165} {"train_loss": -25.11865997314453, "global_step": 262758, "epoch": 3165} {"train_loss": -25.239742279052734, "global_step": 262759, "epoch": 3165} {"train_loss": -25.110322952270508, "global_step": 262760, "epoch": 3165} {"train_loss": -25.3464298248291, "global_step": 262761, "epoch": 3165} {"train_loss": -25.161781311035156, "global_step": 262762, "epoch": 3165} {"train_loss": -25.386459350585938, "global_step": 262763, "epoch": 3165} {"train_loss": -25.150907516479492, "global_step": 262764, "epoch": 3165} {"train_loss": -25.215646743774414, "global_step": 262765, "epoch": 3165} {"train_loss": -24.89800262451172, "global_step": 262766, "epoch": 3165} {"train_loss": -24.89920425415039, "global_step": 262767, "epoch": 3165} {"train_loss": -25.02275848388672, "global_step": 262768, "epoch": 3165} {"train_loss": -24.657054901123047, "global_step": 262769, "epoch": 3165} {"train_loss": -25.160995483398438, "global_step": 262770, "epoch": 3165} {"train_loss": -24.944570541381836, "global_step": 262771, "epoch": 3165} {"train_loss": -25.25710105895996, "global_step": 262772, "epoch": 3165} {"train_loss": -24.945236206054688, "global_step": 262773, "epoch": 3165} {"train_loss": -24.888830184936523, "global_step": 262774, "epoch": 3165} {"train_loss": -25.027759552001953, "global_step": 262775, "epoch": 3165} {"train_loss": -24.483198165893555, "global_step": 262776, "epoch": 3165} {"train_loss": -25.150084093392614, "global_step": 262777, "epoch": 3165, "val_loss": 7047051.0} {"train_loss": -24.330307006835938, "global_step": 262778, "epoch": 3166} {"train_loss": -24.462078094482422, "global_step": 262779, "epoch": 3166} {"train_loss": -24.473215103149414, "global_step": 262780, "epoch": 3166} {"train_loss": -23.53253936767578, "global_step": 262781, "epoch": 3166} {"train_loss": -23.54865074157715, "global_step": 262782, "epoch": 3166} {"train_loss": -24.41826629638672, "global_step": 262783, "epoch": 3166} {"train_loss": -24.257001876831055, "global_step": 262784, "epoch": 3166} {"train_loss": -24.389310836791992, "global_step": 262785, "epoch": 3166} {"train_loss": -24.7946834564209, "global_step": 262786, "epoch": 3166} {"train_loss": -24.51909065246582, "global_step": 262787, "epoch": 3166} {"train_loss": -24.556798934936523, "global_step": 262788, "epoch": 3166} {"train_loss": -24.350072860717773, "global_step": 262789, "epoch": 3166} {"train_loss": -24.73905372619629, "global_step": 262790, "epoch": 3166} {"train_loss": -24.686023712158203, "global_step": 262791, "epoch": 3166} {"train_loss": -24.773984909057617, "global_step": 262792, "epoch": 3166} {"train_loss": -24.39021873474121, "global_step": 262793, "epoch": 3166} {"train_loss": -25.058841705322266, "global_step": 262794, "epoch": 3166} {"train_loss": -25.0811824798584, "global_step": 262795, "epoch": 3166} {"train_loss": -25.152393341064453, "global_step": 262796, "epoch": 3166} {"train_loss": -25.26527976989746, "global_step": 262797, "epoch": 3166} {"train_loss": -24.826068878173828, "global_step": 262798, "epoch": 3166} {"train_loss": -24.731826782226562, "global_step": 262799, "epoch": 3166} {"train_loss": -25.09343719482422, "global_step": 262800, "epoch": 3166} {"train_loss": -25.099313735961914, "global_step": 262801, "epoch": 3166} {"train_loss": -25.13141632080078, "global_step": 262802, "epoch": 3166} {"train_loss": -25.095949172973633, "global_step": 262803, "epoch": 3166} {"train_loss": -24.882980346679688, "global_step": 262804, "epoch": 3166} {"train_loss": -25.21526527404785, "global_step": 262805, "epoch": 3166} {"train_loss": -25.235153198242188, "global_step": 262806, "epoch": 3166} {"train_loss": -25.123573303222656, "global_step": 262807, "epoch": 3166} {"train_loss": -25.204975128173828, "global_step": 262808, "epoch": 3166} {"train_loss": -25.23439598083496, "global_step": 262809, "epoch": 3166} {"train_loss": -25.173254013061523, "global_step": 262810, "epoch": 3166} {"train_loss": -25.01034927368164, "global_step": 262811, "epoch": 3166} {"train_loss": -25.435766220092773, "global_step": 262812, "epoch": 3166} {"train_loss": -24.893627166748047, "global_step": 262813, "epoch": 3166} {"train_loss": -24.79233741760254, "global_step": 262814, "epoch": 3166} {"train_loss": -25.229902267456055, "global_step": 262815, "epoch": 3166} {"train_loss": -25.329416275024414, "global_step": 262816, "epoch": 3166} {"train_loss": -25.1711483001709, "global_step": 262817, "epoch": 3166} {"train_loss": -25.3501033782959, "global_step": 262818, "epoch": 3166} {"train_loss": -25.286314010620117, "global_step": 262819, "epoch": 3166} {"train_loss": -24.941219329833984, "global_step": 262820, "epoch": 3166} {"train_loss": -25.488983154296875, "global_step": 262821, "epoch": 3166} {"train_loss": -25.561704635620117, "global_step": 262822, "epoch": 3166} {"train_loss": -25.080265045166016, "global_step": 262823, "epoch": 3166} {"train_loss": -25.29083251953125, "global_step": 262824, "epoch": 3166} {"train_loss": -25.283340454101562, "global_step": 262825, "epoch": 3166} {"train_loss": -25.11240005493164, "global_step": 262826, "epoch": 3166} {"train_loss": -24.885190963745117, "global_step": 262827, "epoch": 3166} {"train_loss": -24.83978843688965, "global_step": 262828, "epoch": 3166} {"train_loss": -24.852365493774414, "global_step": 262829, "epoch": 3166} {"train_loss": -25.325326919555664, "global_step": 262830, "epoch": 3166} {"train_loss": -25.32938575744629, "global_step": 262831, "epoch": 3166} {"train_loss": -25.213895797729492, "global_step": 262832, "epoch": 3166} {"train_loss": -25.097705841064453, "global_step": 262833, "epoch": 3166} {"train_loss": -25.351470947265625, "global_step": 262834, "epoch": 3166} {"train_loss": -25.40341567993164, "global_step": 262835, "epoch": 3166} {"train_loss": -25.298465728759766, "global_step": 262836, "epoch": 3166} {"train_loss": -24.995756149291992, "global_step": 262837, "epoch": 3166} {"train_loss": -25.277557373046875, "global_step": 262838, "epoch": 3166} {"train_loss": -25.15787124633789, "global_step": 262839, "epoch": 3166} {"train_loss": -25.2058162689209, "global_step": 262840, "epoch": 3166} {"train_loss": -25.204532623291016, "global_step": 262841, "epoch": 3166} {"train_loss": -25.434097290039062, "global_step": 262842, "epoch": 3166} {"train_loss": -25.318248748779297, "global_step": 262843, "epoch": 3166} {"train_loss": -25.484174728393555, "global_step": 262844, "epoch": 3166} {"train_loss": -25.015634536743164, "global_step": 262845, "epoch": 3166} {"train_loss": -25.713293075561523, "global_step": 262846, "epoch": 3166} {"train_loss": -25.148527145385742, "global_step": 262847, "epoch": 3166} {"train_loss": -25.029071807861328, "global_step": 262848, "epoch": 3166} {"train_loss": -25.48533058166504, "global_step": 262849, "epoch": 3166} {"train_loss": -25.200605392456055, "global_step": 262850, "epoch": 3166} {"train_loss": -25.092802047729492, "global_step": 262851, "epoch": 3166} {"train_loss": -25.55828857421875, "global_step": 262852, "epoch": 3166} {"train_loss": -25.257450103759766, "global_step": 262853, "epoch": 3166} {"train_loss": -25.103649139404297, "global_step": 262854, "epoch": 3166} {"train_loss": -25.240480422973633, "global_step": 262855, "epoch": 3166} {"train_loss": -25.172975540161133, "global_step": 262856, "epoch": 3166} {"train_loss": -24.967985153198242, "global_step": 262857, "epoch": 3166} {"train_loss": -25.149415969848633, "global_step": 262858, "epoch": 3166} {"train_loss": -25.283742904663086, "global_step": 262859, "epoch": 3166} {"train_loss": -25.027213062148498, "global_step": 262860, "epoch": 3166, "val_loss": 7028404.0} {"train_loss": -24.282804489135742, "global_step": 262861, "epoch": 3167} {"train_loss": -22.132814407348633, "global_step": 262862, "epoch": 3167} {"train_loss": -23.79834747314453, "global_step": 262863, "epoch": 3167} {"train_loss": -23.777551651000977, "global_step": 262864, "epoch": 3167} {"train_loss": -23.877117156982422, "global_step": 262865, "epoch": 3167} {"train_loss": -23.619068145751953, "global_step": 262866, "epoch": 3167} {"train_loss": -23.83358383178711, "global_step": 262867, "epoch": 3167} {"train_loss": -24.112407684326172, "global_step": 262868, "epoch": 3167} {"train_loss": -23.63538932800293, "global_step": 262869, "epoch": 3167} {"train_loss": -24.425844192504883, "global_step": 262870, "epoch": 3167} {"train_loss": -24.140254974365234, "global_step": 262871, "epoch": 3167} {"train_loss": -24.03426170349121, "global_step": 262872, "epoch": 3167} {"train_loss": -24.027387619018555, "global_step": 262873, "epoch": 3167} {"train_loss": -24.645191192626953, "global_step": 262874, "epoch": 3167} {"train_loss": -24.070398330688477, "global_step": 262875, "epoch": 3167} {"train_loss": -24.277021408081055, "global_step": 262876, "epoch": 3167} {"train_loss": -24.25836753845215, "global_step": 262877, "epoch": 3167} {"train_loss": -24.67873191833496, "global_step": 262878, "epoch": 3167} {"train_loss": -24.22720718383789, "global_step": 262879, "epoch": 3167} {"train_loss": -24.434377670288086, "global_step": 262880, "epoch": 3167} {"train_loss": -24.20332908630371, "global_step": 262881, "epoch": 3167} {"train_loss": -24.503793716430664, "global_step": 262882, "epoch": 3167} {"train_loss": -24.79952049255371, "global_step": 262883, "epoch": 3167} {"train_loss": -24.44061851501465, "global_step": 262884, "epoch": 3167} {"train_loss": -24.621854782104492, "global_step": 262885, "epoch": 3167} {"train_loss": -24.737369537353516, "global_step": 262886, "epoch": 3167} {"train_loss": -24.548192977905273, "global_step": 262887, "epoch": 3167} {"train_loss": -24.90291404724121, "global_step": 262888, "epoch": 3167} {"train_loss": -24.868528366088867, "global_step": 262889, "epoch": 3167} {"train_loss": -25.159013748168945, "global_step": 262890, "epoch": 3167} {"train_loss": -24.75174331665039, "global_step": 262891, "epoch": 3167} {"train_loss": -25.271255493164062, "global_step": 262892, "epoch": 3167} {"train_loss": -24.73038101196289, "global_step": 262893, "epoch": 3167} {"train_loss": -24.806367874145508, "global_step": 262894, "epoch": 3167} {"train_loss": -24.80948257446289, "global_step": 262895, "epoch": 3167} {"train_loss": -24.876005172729492, "global_step": 262896, "epoch": 3167} {"train_loss": -25.20540428161621, "global_step": 262897, "epoch": 3167} {"train_loss": -25.233495712280273, "global_step": 262898, "epoch": 3167} {"train_loss": -25.365554809570312, "global_step": 262899, "epoch": 3167} {"train_loss": -24.83167266845703, "global_step": 262900, "epoch": 3167} {"train_loss": -25.563756942749023, "global_step": 262901, "epoch": 3167} {"train_loss": -24.872358322143555, "global_step": 262902, "epoch": 3167} {"train_loss": -25.35794448852539, "global_step": 262903, "epoch": 3167} {"train_loss": -25.19647216796875, "global_step": 262904, "epoch": 3167} {"train_loss": -25.14438247680664, "global_step": 262905, "epoch": 3167} {"train_loss": -25.152570724487305, "global_step": 262906, "epoch": 3167} {"train_loss": -25.46870231628418, "global_step": 262907, "epoch": 3167} {"train_loss": -25.40688705444336, "global_step": 262908, "epoch": 3167} {"train_loss": -25.213300704956055, "global_step": 262909, "epoch": 3167} {"train_loss": -25.24818992614746, "global_step": 262910, "epoch": 3167} {"train_loss": -25.008684158325195, "global_step": 262911, "epoch": 3167} {"train_loss": -25.441125869750977, "global_step": 262912, "epoch": 3167} {"train_loss": -25.225210189819336, "global_step": 262913, "epoch": 3167} {"train_loss": -25.5496883392334, "global_step": 262914, "epoch": 3167} {"train_loss": -25.237030029296875, "global_step": 262915, "epoch": 3167} {"train_loss": -25.578458786010742, "global_step": 262916, "epoch": 3167} {"train_loss": -25.188627243041992, "global_step": 262917, "epoch": 3167} {"train_loss": -24.928998947143555, "global_step": 262918, "epoch": 3167} {"train_loss": -25.244211196899414, "global_step": 262919, "epoch": 3167} {"train_loss": -25.717260360717773, "global_step": 262920, "epoch": 3167} {"train_loss": -25.141035079956055, "global_step": 262921, "epoch": 3167} {"train_loss": -25.196866989135742, "global_step": 262922, "epoch": 3167} {"train_loss": -25.63325309753418, "global_step": 262923, "epoch": 3167} {"train_loss": -25.287851333618164, "global_step": 262924, "epoch": 3167} {"train_loss": -25.695480346679688, "global_step": 262925, "epoch": 3167} {"train_loss": -25.15452766418457, "global_step": 262926, "epoch": 3167} {"train_loss": -25.417194366455078, "global_step": 262927, "epoch": 3167} {"train_loss": -25.071317672729492, "global_step": 262928, "epoch": 3167} {"train_loss": -25.161542892456055, "global_step": 262929, "epoch": 3167} {"train_loss": -25.656030654907227, "global_step": 262930, "epoch": 3167} {"train_loss": -25.565937042236328, "global_step": 262931, "epoch": 3167} {"train_loss": -25.364965438842773, "global_step": 262932, "epoch": 3167} {"train_loss": -25.20736312866211, "global_step": 262933, "epoch": 3167} {"train_loss": -25.200963973999023, "global_step": 262934, "epoch": 3167} {"train_loss": -25.364164352416992, "global_step": 262935, "epoch": 3167} {"train_loss": -25.301713943481445, "global_step": 262936, "epoch": 3167} {"train_loss": -25.32952308654785, "global_step": 262937, "epoch": 3167} {"train_loss": -25.055627822875977, "global_step": 262938, "epoch": 3167} {"train_loss": -24.99211883544922, "global_step": 262939, "epoch": 3167} {"train_loss": -25.131738662719727, "global_step": 262940, "epoch": 3167} {"train_loss": -25.260116577148438, "global_step": 262941, "epoch": 3167} {"train_loss": -25.18105125427246, "global_step": 262942, "epoch": 3167} {"train_loss": -24.881832720285438, "global_step": 262943, "epoch": 3167, "val_loss": 6866113.0} {"train_loss": -24.69693374633789, "global_step": 262944, "epoch": 3168} {"train_loss": -24.065486907958984, "global_step": 262945, "epoch": 3168} {"train_loss": -24.513750076293945, "global_step": 262946, "epoch": 3168} {"train_loss": -24.23493766784668, "global_step": 262947, "epoch": 3168} {"train_loss": -24.909801483154297, "global_step": 262948, "epoch": 3168} {"train_loss": -24.664642333984375, "global_step": 262949, "epoch": 3168} {"train_loss": -24.33192253112793, "global_step": 262950, "epoch": 3168} {"train_loss": -24.47481918334961, "global_step": 262951, "epoch": 3168} {"train_loss": -24.543807983398438, "global_step": 262952, "epoch": 3168} {"train_loss": -24.8445987701416, "global_step": 262953, "epoch": 3168} {"train_loss": -24.93427085876465, "global_step": 262954, "epoch": 3168} {"train_loss": -24.472352981567383, "global_step": 262955, "epoch": 3168} {"train_loss": -24.79292869567871, "global_step": 262956, "epoch": 3168} {"train_loss": -24.807104110717773, "global_step": 262957, "epoch": 3168} {"train_loss": -24.53647232055664, "global_step": 262958, "epoch": 3168} {"train_loss": -24.91990089416504, "global_step": 262959, "epoch": 3168} {"train_loss": -24.908185958862305, "global_step": 262960, "epoch": 3168} {"train_loss": -24.753908157348633, "global_step": 262961, "epoch": 3168} {"train_loss": -24.87917137145996, "global_step": 262962, "epoch": 3168} {"train_loss": -24.90159034729004, "global_step": 262963, "epoch": 3168} {"train_loss": -24.886255264282227, "global_step": 262964, "epoch": 3168} {"train_loss": -24.869232177734375, "global_step": 262965, "epoch": 3168} {"train_loss": -24.734819412231445, "global_step": 262966, "epoch": 3168} {"train_loss": -24.63319206237793, "global_step": 262967, "epoch": 3168} {"train_loss": -25.01082420349121, "global_step": 262968, "epoch": 3168} {"train_loss": -25.0759220123291, "global_step": 262969, "epoch": 3168} {"train_loss": -24.848600387573242, "global_step": 262970, "epoch": 3168} {"train_loss": -25.252897262573242, "global_step": 262971, "epoch": 3168} {"train_loss": -24.979673385620117, "global_step": 262972, "epoch": 3168} {"train_loss": -25.258764266967773, "global_step": 262973, "epoch": 3168} {"train_loss": -24.945775985717773, "global_step": 262974, "epoch": 3168} {"train_loss": -25.202198028564453, "global_step": 262975, "epoch": 3168} {"train_loss": -25.075098037719727, "global_step": 262976, "epoch": 3168} {"train_loss": -25.27619743347168, "global_step": 262977, "epoch": 3168} {"train_loss": -25.492643356323242, "global_step": 262978, "epoch": 3168} {"train_loss": -25.355031967163086, "global_step": 262979, "epoch": 3168} {"train_loss": -25.496496200561523, "global_step": 262980, "epoch": 3168} {"train_loss": -24.882492065429688, "global_step": 262981, "epoch": 3168} {"train_loss": -24.84871482849121, "global_step": 262982, "epoch": 3168} {"train_loss": -25.367279052734375, "global_step": 262983, "epoch": 3168} {"train_loss": -25.124591827392578, "global_step": 262984, "epoch": 3168} {"train_loss": -25.338306427001953, "global_step": 262985, "epoch": 3168} {"train_loss": -24.939138412475586, "global_step": 262986, "epoch": 3168} {"train_loss": -24.94740104675293, "global_step": 262987, "epoch": 3168} {"train_loss": -25.14055824279785, "global_step": 262988, "epoch": 3168} {"train_loss": -25.420612335205078, "global_step": 262989, "epoch": 3168} {"train_loss": -25.13991355895996, "global_step": 262990, "epoch": 3168} {"train_loss": -25.33248519897461, "global_step": 262991, "epoch": 3168} {"train_loss": -25.334199905395508, "global_step": 262992, "epoch": 3168} {"train_loss": -25.552785873413086, "global_step": 262993, "epoch": 3168} {"train_loss": -25.345355987548828, "global_step": 262994, "epoch": 3168} {"train_loss": -24.855066299438477, "global_step": 262995, "epoch": 3168} {"train_loss": -25.05977439880371, "global_step": 262996, "epoch": 3168} {"train_loss": -25.183454513549805, "global_step": 262997, "epoch": 3168} {"train_loss": -25.657276153564453, "global_step": 262998, "epoch": 3168} {"train_loss": -25.337369918823242, "global_step": 262999, "epoch": 3168} {"train_loss": -25.40447425842285, "global_step": 263000, "epoch": 3168} {"train_loss": -25.304542541503906, "global_step": 263001, "epoch": 3168} {"train_loss": -25.225467681884766, "global_step": 263002, "epoch": 3168} {"train_loss": -25.719221115112305, "global_step": 263003, "epoch": 3168} {"train_loss": -25.31328773498535, "global_step": 263004, "epoch": 3168} {"train_loss": -25.300342559814453, "global_step": 263005, "epoch": 3168} {"train_loss": -25.4913272857666, "global_step": 263006, "epoch": 3168} {"train_loss": -24.839109420776367, "global_step": 263007, "epoch": 3168} {"train_loss": -25.093961715698242, "global_step": 263008, "epoch": 3168} {"train_loss": -24.775693893432617, "global_step": 263009, "epoch": 3168} {"train_loss": -23.88545799255371, "global_step": 263010, "epoch": 3168} {"train_loss": -24.389299392700195, "global_step": 263011, "epoch": 3168} {"train_loss": -25.055578231811523, "global_step": 263012, "epoch": 3168} {"train_loss": -25.01885414123535, "global_step": 263013, "epoch": 3168} {"train_loss": -24.681772232055664, "global_step": 263014, "epoch": 3168} {"train_loss": -24.811397552490234, "global_step": 263015, "epoch": 3168} {"train_loss": -25.28078269958496, "global_step": 263016, "epoch": 3168} {"train_loss": -24.909746170043945, "global_step": 263017, "epoch": 3168} {"train_loss": -25.078893661499023, "global_step": 263018, "epoch": 3168} {"train_loss": -25.201826095581055, "global_step": 263019, "epoch": 3168} {"train_loss": -25.10988998413086, "global_step": 263020, "epoch": 3168} {"train_loss": -25.18134880065918, "global_step": 263021, "epoch": 3168} {"train_loss": -25.431873321533203, "global_step": 263022, "epoch": 3168} {"train_loss": -25.065412521362305, "global_step": 263023, "epoch": 3168} {"train_loss": -24.86019515991211, "global_step": 263024, "epoch": 3168} {"train_loss": -25.111740112304688, "global_step": 263025, "epoch": 3168} {"train_loss": -24.99690228197948, "global_step": 263026, "epoch": 3168, "val_loss": 6995456.0} {"train_loss": -24.95953369140625, "global_step": 263027, "epoch": 3169} {"train_loss": -25.032649993896484, "global_step": 263028, "epoch": 3169} {"train_loss": -25.000446319580078, "global_step": 263029, "epoch": 3169} {"train_loss": -24.412586212158203, "global_step": 263030, "epoch": 3169} {"train_loss": -25.038818359375, "global_step": 263031, "epoch": 3169} {"train_loss": -24.839157104492188, "global_step": 263032, "epoch": 3169} {"train_loss": -25.0528507232666, "global_step": 263033, "epoch": 3169} {"train_loss": -24.78985595703125, "global_step": 263034, "epoch": 3169} {"train_loss": -24.87649917602539, "global_step": 263035, "epoch": 3169} {"train_loss": -25.12116050720215, "global_step": 263036, "epoch": 3169} {"train_loss": -25.1613826751709, "global_step": 263037, "epoch": 3169} {"train_loss": -24.82187271118164, "global_step": 263038, "epoch": 3169} {"train_loss": -25.288917541503906, "global_step": 263039, "epoch": 3169} {"train_loss": -25.306650161743164, "global_step": 263040, "epoch": 3169} {"train_loss": -24.73032569885254, "global_step": 263041, "epoch": 3169} {"train_loss": -24.86111068725586, "global_step": 263042, "epoch": 3169} {"train_loss": -25.212820053100586, "global_step": 263043, "epoch": 3169} {"train_loss": -25.510324478149414, "global_step": 263044, "epoch": 3169} {"train_loss": -24.69729995727539, "global_step": 263045, "epoch": 3169} {"train_loss": -25.0798282623291, "global_step": 263046, "epoch": 3169} {"train_loss": -25.364288330078125, "global_step": 263047, "epoch": 3169} {"train_loss": -25.085474014282227, "global_step": 263048, "epoch": 3169} {"train_loss": -25.092771530151367, "global_step": 263049, "epoch": 3169} {"train_loss": -24.894271850585938, "global_step": 263050, "epoch": 3169} {"train_loss": -25.241971969604492, "global_step": 263051, "epoch": 3169} {"train_loss": -25.096824645996094, "global_step": 263052, "epoch": 3169} {"train_loss": -25.27039909362793, "global_step": 263053, "epoch": 3169} {"train_loss": -25.26222038269043, "global_step": 263054, "epoch": 3169} {"train_loss": -25.29204559326172, "global_step": 263055, "epoch": 3169} {"train_loss": -25.2710018157959, "global_step": 263056, "epoch": 3169} {"train_loss": -25.679956436157227, "global_step": 263057, "epoch": 3169} {"train_loss": -25.34043312072754, "global_step": 263058, "epoch": 3169} {"train_loss": -25.182130813598633, "global_step": 263059, "epoch": 3169} {"train_loss": -24.90302276611328, "global_step": 263060, "epoch": 3169} {"train_loss": -25.3270320892334, "global_step": 263061, "epoch": 3169} {"train_loss": -24.850984573364258, "global_step": 263062, "epoch": 3169} {"train_loss": -25.148008346557617, "global_step": 263063, "epoch": 3169} {"train_loss": -25.37709617614746, "global_step": 263064, "epoch": 3169} {"train_loss": -25.04204750061035, "global_step": 263065, "epoch": 3169} {"train_loss": -25.060400009155273, "global_step": 263066, "epoch": 3169} {"train_loss": -25.287843704223633, "global_step": 263067, "epoch": 3169} {"train_loss": -25.20487403869629, "global_step": 263068, "epoch": 3169} {"train_loss": -25.348546981811523, "global_step": 263069, "epoch": 3169} {"train_loss": -25.511886596679688, "global_step": 263070, "epoch": 3169} {"train_loss": -25.067846298217773, "global_step": 263071, "epoch": 3169} {"train_loss": -25.351369857788086, "global_step": 263072, "epoch": 3169} {"train_loss": -25.675073623657227, "global_step": 263073, "epoch": 3169} {"train_loss": -25.090375900268555, "global_step": 263074, "epoch": 3169} {"train_loss": -25.27412986755371, "global_step": 263075, "epoch": 3169} {"train_loss": -25.57056427001953, "global_step": 263076, "epoch": 3169} {"train_loss": -25.523298263549805, "global_step": 263077, "epoch": 3169} {"train_loss": -25.115802764892578, "global_step": 263078, "epoch": 3169} {"train_loss": -24.98097801208496, "global_step": 263079, "epoch": 3169} {"train_loss": -24.899810791015625, "global_step": 263080, "epoch": 3169} {"train_loss": -24.332687377929688, "global_step": 263081, "epoch": 3169} {"train_loss": -25.00922203063965, "global_step": 263082, "epoch": 3169} {"train_loss": -25.624143600463867, "global_step": 263083, "epoch": 3169} {"train_loss": -24.876157760620117, "global_step": 263084, "epoch": 3169} {"train_loss": -25.11391830444336, "global_step": 263085, "epoch": 3169} {"train_loss": -25.31448745727539, "global_step": 263086, "epoch": 3169} {"train_loss": -25.16176986694336, "global_step": 263087, "epoch": 3169} {"train_loss": -24.982425689697266, "global_step": 263088, "epoch": 3169} {"train_loss": -25.07586097717285, "global_step": 263089, "epoch": 3169} {"train_loss": -25.066078186035156, "global_step": 263090, "epoch": 3169} {"train_loss": -25.16396141052246, "global_step": 263091, "epoch": 3169} {"train_loss": -25.121496200561523, "global_step": 263092, "epoch": 3169} {"train_loss": -25.016569137573242, "global_step": 263093, "epoch": 3169} {"train_loss": -25.287565231323242, "global_step": 263094, "epoch": 3169} {"train_loss": -25.366086959838867, "global_step": 263095, "epoch": 3169} {"train_loss": -25.581497192382812, "global_step": 263096, "epoch": 3169} {"train_loss": -25.47109031677246, "global_step": 263097, "epoch": 3169} {"train_loss": -25.169736862182617, "global_step": 263098, "epoch": 3169} {"train_loss": -25.106945037841797, "global_step": 263099, "epoch": 3169} {"train_loss": -25.203962326049805, "global_step": 263100, "epoch": 3169} {"train_loss": -25.31321907043457, "global_step": 263101, "epoch": 3169} {"train_loss": -25.20526695251465, "global_step": 263102, "epoch": 3169} {"train_loss": -25.211078643798828, "global_step": 263103, "epoch": 3169} {"train_loss": -25.332191467285156, "global_step": 263104, "epoch": 3169} {"train_loss": -25.077051162719727, "global_step": 263105, "epoch": 3169} {"train_loss": -25.271574020385742, "global_step": 263106, "epoch": 3169} {"train_loss": -25.34614372253418, "global_step": 263107, "epoch": 3169} {"train_loss": -25.523609161376953, "global_step": 263108, "epoch": 3169} {"train_loss": -25.1592639325613, "global_step": 263109, "epoch": 3169, "val_loss": 7081049.5} {"train_loss": -24.80833625793457, "global_step": 263110, "epoch": 3170} {"train_loss": -25.13844108581543, "global_step": 263111, "epoch": 3170} {"train_loss": -25.14472770690918, "global_step": 263112, "epoch": 3170} {"train_loss": -24.844633102416992, "global_step": 263113, "epoch": 3170} {"train_loss": -25.04628562927246, "global_step": 263114, "epoch": 3170} {"train_loss": -25.427793502807617, "global_step": 263115, "epoch": 3170} {"train_loss": -25.20018768310547, "global_step": 263116, "epoch": 3170} {"train_loss": -25.0280704498291, "global_step": 263117, "epoch": 3170} {"train_loss": -25.07233428955078, "global_step": 263118, "epoch": 3170} {"train_loss": -25.007837295532227, "global_step": 263119, "epoch": 3170} {"train_loss": -25.33121109008789, "global_step": 263120, "epoch": 3170} {"train_loss": -25.3049373626709, "global_step": 263121, "epoch": 3170} {"train_loss": -25.20583152770996, "global_step": 263122, "epoch": 3170} {"train_loss": -24.61772346496582, "global_step": 263123, "epoch": 3170} {"train_loss": -25.18039894104004, "global_step": 263124, "epoch": 3170} {"train_loss": -25.198078155517578, "global_step": 263125, "epoch": 3170} {"train_loss": -25.063871383666992, "global_step": 263126, "epoch": 3170} {"train_loss": -25.127824783325195, "global_step": 263127, "epoch": 3170} {"train_loss": -25.40514373779297, "global_step": 263128, "epoch": 3170} {"train_loss": -25.301448822021484, "global_step": 263129, "epoch": 3170} {"train_loss": -25.06760025024414, "global_step": 263130, "epoch": 3170} {"train_loss": -25.271093368530273, "global_step": 263131, "epoch": 3170} {"train_loss": -25.08211326599121, "global_step": 263132, "epoch": 3170} {"train_loss": -25.11519432067871, "global_step": 263133, "epoch": 3170} {"train_loss": -25.09454345703125, "global_step": 263134, "epoch": 3170} {"train_loss": -25.48639488220215, "global_step": 263135, "epoch": 3170} {"train_loss": -25.25418472290039, "global_step": 263136, "epoch": 3170} {"train_loss": -25.057832717895508, "global_step": 263137, "epoch": 3170} {"train_loss": -25.385852813720703, "global_step": 263138, "epoch": 3170} {"train_loss": -25.098997116088867, "global_step": 263139, "epoch": 3170} {"train_loss": -25.1005916595459, "global_step": 263140, "epoch": 3170} {"train_loss": -24.867528915405273, "global_step": 263141, "epoch": 3170} {"train_loss": -25.07146644592285, "global_step": 263142, "epoch": 3170} {"train_loss": -25.32478141784668, "global_step": 263143, "epoch": 3170} {"train_loss": -24.89678192138672, "global_step": 263144, "epoch": 3170} {"train_loss": -25.346994400024414, "global_step": 263145, "epoch": 3170} {"train_loss": -25.263654708862305, "global_step": 263146, "epoch": 3170} {"train_loss": -24.893531799316406, "global_step": 263147, "epoch": 3170} {"train_loss": -24.993459701538086, "global_step": 263148, "epoch": 3170} {"train_loss": -25.297536849975586, "global_step": 263149, "epoch": 3170} {"train_loss": -25.126083374023438, "global_step": 263150, "epoch": 3170} {"train_loss": -25.41571617126465, "global_step": 263151, "epoch": 3170} {"train_loss": -25.472082138061523, "global_step": 263152, "epoch": 3170} {"train_loss": -25.185123443603516, "global_step": 263153, "epoch": 3170} {"train_loss": -25.559646606445312, "global_step": 263154, "epoch": 3170} {"train_loss": -25.37129020690918, "global_step": 263155, "epoch": 3170} {"train_loss": -25.61232566833496, "global_step": 263156, "epoch": 3170} {"train_loss": -25.14983558654785, "global_step": 263157, "epoch": 3170} {"train_loss": -25.111059188842773, "global_step": 263158, "epoch": 3170} {"train_loss": -25.372343063354492, "global_step": 263159, "epoch": 3170} {"train_loss": -25.233924865722656, "global_step": 263160, "epoch": 3170} {"train_loss": -25.41395378112793, "global_step": 263161, "epoch": 3170} {"train_loss": -25.2984619140625, "global_step": 263162, "epoch": 3170} {"train_loss": -25.36601448059082, "global_step": 263163, "epoch": 3170} {"train_loss": -24.99128532409668, "global_step": 263164, "epoch": 3170} {"train_loss": -25.411231994628906, "global_step": 263165, "epoch": 3170} {"train_loss": -25.386123657226562, "global_step": 263166, "epoch": 3170} {"train_loss": -25.82154655456543, "global_step": 263167, "epoch": 3170} {"train_loss": -25.19293785095215, "global_step": 263168, "epoch": 3170} {"train_loss": -25.245609283447266, "global_step": 263169, "epoch": 3170} {"train_loss": -25.169340133666992, "global_step": 263170, "epoch": 3170} {"train_loss": -25.081743240356445, "global_step": 263171, "epoch": 3170} {"train_loss": -25.19783592224121, "global_step": 263172, "epoch": 3170} {"train_loss": -25.032100677490234, "global_step": 263173, "epoch": 3170} {"train_loss": -24.80387306213379, "global_step": 263174, "epoch": 3170} {"train_loss": -25.07349967956543, "global_step": 263175, "epoch": 3170} {"train_loss": -25.03839683532715, "global_step": 263176, "epoch": 3170} {"train_loss": -24.918771743774414, "global_step": 263177, "epoch": 3170} {"train_loss": -25.26303482055664, "global_step": 263178, "epoch": 3170} {"train_loss": -25.241199493408203, "global_step": 263179, "epoch": 3170} {"train_loss": -24.917312622070312, "global_step": 263180, "epoch": 3170} {"train_loss": -25.28139877319336, "global_step": 263181, "epoch": 3170} {"train_loss": -25.126419067382812, "global_step": 263182, "epoch": 3170} {"train_loss": -25.12449073791504, "global_step": 263183, "epoch": 3170} {"train_loss": -25.23429298400879, "global_step": 263184, "epoch": 3170} {"train_loss": -25.38521385192871, "global_step": 263185, "epoch": 3170} {"train_loss": -25.11628532409668, "global_step": 263186, "epoch": 3170} {"train_loss": -25.016550064086914, "global_step": 263187, "epoch": 3170} {"train_loss": -25.064620971679688, "global_step": 263188, "epoch": 3170} {"train_loss": -25.220670700073242, "global_step": 263189, "epoch": 3170} {"train_loss": -24.982412338256836, "global_step": 263190, "epoch": 3170} {"train_loss": -24.945960998535156, "global_step": 263191, "epoch": 3170} {"train_loss": -25.173326676150403, "global_step": 263192, "epoch": 3170, "val_loss": 6893292.0} {"train_loss": -24.47269630432129, "global_step": 263193, "epoch": 3171} {"train_loss": -23.83331871032715, "global_step": 263194, "epoch": 3171} {"train_loss": -23.690855026245117, "global_step": 263195, "epoch": 3171} {"train_loss": -23.822429656982422, "global_step": 263196, "epoch": 3171} {"train_loss": -24.11058235168457, "global_step": 263197, "epoch": 3171} {"train_loss": -23.875547409057617, "global_step": 263198, "epoch": 3171} {"train_loss": -24.24628448486328, "global_step": 263199, "epoch": 3171} {"train_loss": -24.6326904296875, "global_step": 263200, "epoch": 3171} {"train_loss": -24.22260856628418, "global_step": 263201, "epoch": 3171} {"train_loss": -24.55524253845215, "global_step": 263202, "epoch": 3171} {"train_loss": -23.758602142333984, "global_step": 263203, "epoch": 3171} {"train_loss": -24.67070960998535, "global_step": 263204, "epoch": 3171} {"train_loss": -24.173709869384766, "global_step": 263205, "epoch": 3171} {"train_loss": -24.6378173828125, "global_step": 263206, "epoch": 3171} {"train_loss": -24.64771842956543, "global_step": 263207, "epoch": 3171} {"train_loss": -24.750885009765625, "global_step": 263208, "epoch": 3171} {"train_loss": -24.785093307495117, "global_step": 263209, "epoch": 3171} {"train_loss": -24.62354278564453, "global_step": 263210, "epoch": 3171} {"train_loss": -25.011709213256836, "global_step": 263211, "epoch": 3171} {"train_loss": -23.759748458862305, "global_step": 263212, "epoch": 3171} {"train_loss": -24.931385040283203, "global_step": 263213, "epoch": 3171} {"train_loss": -24.912839889526367, "global_step": 263214, "epoch": 3171} {"train_loss": -24.59735107421875, "global_step": 263215, "epoch": 3171} {"train_loss": -24.79401969909668, "global_step": 263216, "epoch": 3171} {"train_loss": -24.74384117126465, "global_step": 263217, "epoch": 3171} {"train_loss": -24.830602645874023, "global_step": 263218, "epoch": 3171} {"train_loss": -24.53558349609375, "global_step": 263219, "epoch": 3171} {"train_loss": -24.96915626525879, "global_step": 263220, "epoch": 3171} {"train_loss": -24.993789672851562, "global_step": 263221, "epoch": 3171} {"train_loss": -24.625967025756836, "global_step": 263222, "epoch": 3171} {"train_loss": -24.83709716796875, "global_step": 263223, "epoch": 3171} {"train_loss": -24.835683822631836, "global_step": 263224, "epoch": 3171} {"train_loss": -25.082515716552734, "global_step": 263225, "epoch": 3171} {"train_loss": -25.03492546081543, "global_step": 263226, "epoch": 3171} {"train_loss": -25.361806869506836, "global_step": 263227, "epoch": 3171} {"train_loss": -25.17984390258789, "global_step": 263228, "epoch": 3171} {"train_loss": -24.979877471923828, "global_step": 263229, "epoch": 3171} {"train_loss": -24.878387451171875, "global_step": 263230, "epoch": 3171} {"train_loss": -25.07289695739746, "global_step": 263231, "epoch": 3171} {"train_loss": -25.025028228759766, "global_step": 263232, "epoch": 3171} {"train_loss": -25.01854133605957, "global_step": 263233, "epoch": 3171} {"train_loss": -25.320531845092773, "global_step": 263234, "epoch": 3171} {"train_loss": -24.808652877807617, "global_step": 263235, "epoch": 3171} {"train_loss": -25.157480239868164, "global_step": 263236, "epoch": 3171} {"train_loss": -25.604721069335938, "global_step": 263237, "epoch": 3171} {"train_loss": -25.17713737487793, "global_step": 263238, "epoch": 3171} {"train_loss": -25.38373565673828, "global_step": 263239, "epoch": 3171} {"train_loss": -25.485435485839844, "global_step": 263240, "epoch": 3171} {"train_loss": -25.162389755249023, "global_step": 263241, "epoch": 3171} {"train_loss": -25.137418746948242, "global_step": 263242, "epoch": 3171} {"train_loss": -25.175518035888672, "global_step": 263243, "epoch": 3171} {"train_loss": -25.66834831237793, "global_step": 263244, "epoch": 3171} {"train_loss": -25.62744140625, "global_step": 263245, "epoch": 3171} {"train_loss": -25.341459274291992, "global_step": 263246, "epoch": 3171} {"train_loss": -25.402313232421875, "global_step": 263247, "epoch": 3171} {"train_loss": -25.34419822692871, "global_step": 263248, "epoch": 3171} {"train_loss": -25.46297264099121, "global_step": 263249, "epoch": 3171} {"train_loss": -25.350299835205078, "global_step": 263250, "epoch": 3171} {"train_loss": -25.48348045349121, "global_step": 263251, "epoch": 3171} {"train_loss": -25.319665908813477, "global_step": 263252, "epoch": 3171} {"train_loss": -25.424602508544922, "global_step": 263253, "epoch": 3171} {"train_loss": -25.323562622070312, "global_step": 263254, "epoch": 3171} {"train_loss": -25.297727584838867, "global_step": 263255, "epoch": 3171} {"train_loss": -25.35053062438965, "global_step": 263256, "epoch": 3171} {"train_loss": -25.28348731994629, "global_step": 263257, "epoch": 3171} {"train_loss": -25.147573471069336, "global_step": 263258, "epoch": 3171} {"train_loss": -25.3239688873291, "global_step": 263259, "epoch": 3171} {"train_loss": -25.598875045776367, "global_step": 263260, "epoch": 3171} {"train_loss": -25.15118408203125, "global_step": 263261, "epoch": 3171} {"train_loss": -24.75665855407715, "global_step": 263262, "epoch": 3171} {"train_loss": -24.469924926757812, "global_step": 263263, "epoch": 3171} {"train_loss": -25.13874626159668, "global_step": 263264, "epoch": 3171} {"train_loss": -24.85233497619629, "global_step": 263265, "epoch": 3171} {"train_loss": -23.926706314086914, "global_step": 263266, "epoch": 3171} {"train_loss": -24.407873153686523, "global_step": 263267, "epoch": 3171} {"train_loss": -24.84333610534668, "global_step": 263268, "epoch": 3171} {"train_loss": -24.535799026489258, "global_step": 263269, "epoch": 3171} {"train_loss": -24.885263442993164, "global_step": 263270, "epoch": 3171} {"train_loss": -24.95650291442871, "global_step": 263271, "epoch": 3171} {"train_loss": -25.025793075561523, "global_step": 263272, "epoch": 3171} {"train_loss": -25.1964054107666, "global_step": 263273, "epoch": 3171} {"train_loss": -25.05470085144043, "global_step": 263274, "epoch": 3171} {"train_loss": -24.880671880331384, "global_step": 263275, "epoch": 3171, "val_loss": 7073198.0} {"train_loss": -24.260812759399414, "global_step": 263276, "epoch": 3172} {"train_loss": -24.12898063659668, "global_step": 263277, "epoch": 3172} {"train_loss": -24.575422286987305, "global_step": 263278, "epoch": 3172} {"train_loss": -24.3961124420166, "global_step": 263279, "epoch": 3172} {"train_loss": -23.94734001159668, "global_step": 263280, "epoch": 3172} {"train_loss": -24.397525787353516, "global_step": 263281, "epoch": 3172} {"train_loss": -24.220691680908203, "global_step": 263282, "epoch": 3172} {"train_loss": -24.222211837768555, "global_step": 263283, "epoch": 3172} {"train_loss": -24.593900680541992, "global_step": 263284, "epoch": 3172} {"train_loss": -24.643590927124023, "global_step": 263285, "epoch": 3172} {"train_loss": -24.74540138244629, "global_step": 263286, "epoch": 3172} {"train_loss": -24.8653621673584, "global_step": 263287, "epoch": 3172} {"train_loss": -24.991626739501953, "global_step": 263288, "epoch": 3172} {"train_loss": -24.591190338134766, "global_step": 263289, "epoch": 3172} {"train_loss": -24.876876831054688, "global_step": 263290, "epoch": 3172} {"train_loss": -24.9918155670166, "global_step": 263291, "epoch": 3172} {"train_loss": -24.81770896911621, "global_step": 263292, "epoch": 3172} {"train_loss": -25.343429565429688, "global_step": 263293, "epoch": 3172} {"train_loss": -24.989416122436523, "global_step": 263294, "epoch": 3172} {"train_loss": -25.2191219329834, "global_step": 263295, "epoch": 3172} {"train_loss": -24.895938873291016, "global_step": 263296, "epoch": 3172} {"train_loss": -24.827661514282227, "global_step": 263297, "epoch": 3172} {"train_loss": -25.14642333984375, "global_step": 263298, "epoch": 3172} {"train_loss": -24.690807342529297, "global_step": 263299, "epoch": 3172} {"train_loss": -25.50320816040039, "global_step": 263300, "epoch": 3172} {"train_loss": -25.164159774780273, "global_step": 263301, "epoch": 3172} {"train_loss": -24.992338180541992, "global_step": 263302, "epoch": 3172} {"train_loss": -25.308141708374023, "global_step": 263303, "epoch": 3172} {"train_loss": -25.014320373535156, "global_step": 263304, "epoch": 3172} {"train_loss": -25.2994441986084, "global_step": 263305, "epoch": 3172} {"train_loss": -25.217622756958008, "global_step": 263306, "epoch": 3172} {"train_loss": -25.152690887451172, "global_step": 263307, "epoch": 3172} {"train_loss": -24.94849967956543, "global_step": 263308, "epoch": 3172} {"train_loss": -25.014219284057617, "global_step": 263309, "epoch": 3172} {"train_loss": -25.155994415283203, "global_step": 263310, "epoch": 3172} {"train_loss": -25.302793502807617, "global_step": 263311, "epoch": 3172} {"train_loss": -25.253143310546875, "global_step": 263312, "epoch": 3172} {"train_loss": -25.121997833251953, "global_step": 263313, "epoch": 3172} {"train_loss": -25.345844268798828, "global_step": 263314, "epoch": 3172} {"train_loss": -25.254199981689453, "global_step": 263315, "epoch": 3172} {"train_loss": -25.006591796875, "global_step": 263316, "epoch": 3172} {"train_loss": -25.577375411987305, "global_step": 263317, "epoch": 3172} {"train_loss": -25.20237922668457, "global_step": 263318, "epoch": 3172} {"train_loss": -25.350351333618164, "global_step": 263319, "epoch": 3172} {"train_loss": -25.261808395385742, "global_step": 263320, "epoch": 3172} {"train_loss": -25.12518310546875, "global_step": 263321, "epoch": 3172} {"train_loss": -25.326658248901367, "global_step": 263322, "epoch": 3172} {"train_loss": -25.5695858001709, "global_step": 263323, "epoch": 3172} {"train_loss": -24.76590347290039, "global_step": 263324, "epoch": 3172} {"train_loss": -25.323490142822266, "global_step": 263325, "epoch": 3172} {"train_loss": -25.45879554748535, "global_step": 263326, "epoch": 3172} {"train_loss": -24.840192794799805, "global_step": 263327, "epoch": 3172} {"train_loss": -25.270803451538086, "global_step": 263328, "epoch": 3172} {"train_loss": -25.08028221130371, "global_step": 263329, "epoch": 3172} {"train_loss": -25.118452072143555, "global_step": 263330, "epoch": 3172} {"train_loss": -24.947858810424805, "global_step": 263331, "epoch": 3172} {"train_loss": -24.678205490112305, "global_step": 263332, "epoch": 3172} {"train_loss": -25.257457733154297, "global_step": 263333, "epoch": 3172} {"train_loss": -24.87288475036621, "global_step": 263334, "epoch": 3172} {"train_loss": -24.789724349975586, "global_step": 263335, "epoch": 3172} {"train_loss": -25.07791519165039, "global_step": 263336, "epoch": 3172} {"train_loss": -25.123947143554688, "global_step": 263337, "epoch": 3172} {"train_loss": -25.114439010620117, "global_step": 263338, "epoch": 3172} {"train_loss": -25.358078002929688, "global_step": 263339, "epoch": 3172} {"train_loss": -24.856945037841797, "global_step": 263340, "epoch": 3172} {"train_loss": -25.13949966430664, "global_step": 263341, "epoch": 3172} {"train_loss": -24.77556610107422, "global_step": 263342, "epoch": 3172} {"train_loss": -24.771114349365234, "global_step": 263343, "epoch": 3172} {"train_loss": -25.28431510925293, "global_step": 263344, "epoch": 3172} {"train_loss": -24.85495948791504, "global_step": 263345, "epoch": 3172} {"train_loss": -24.886310577392578, "global_step": 263346, "epoch": 3172} {"train_loss": -24.807126998901367, "global_step": 263347, "epoch": 3172} {"train_loss": -25.139799118041992, "global_step": 263348, "epoch": 3172} {"train_loss": -24.989795684814453, "global_step": 263349, "epoch": 3172} {"train_loss": -25.48665428161621, "global_step": 263350, "epoch": 3172} {"train_loss": -25.101932525634766, "global_step": 263351, "epoch": 3172} {"train_loss": -25.317075729370117, "global_step": 263352, "epoch": 3172} {"train_loss": -25.103492736816406, "global_step": 263353, "epoch": 3172} {"train_loss": -25.13186264038086, "global_step": 263354, "epoch": 3172} {"train_loss": -25.382366180419922, "global_step": 263355, "epoch": 3172} {"train_loss": -25.120222091674805, "global_step": 263356, "epoch": 3172} {"train_loss": -25.232818603515625, "global_step": 263357, "epoch": 3172} {"train_loss": -25.023209675248847, "global_step": 263358, "epoch": 3172, "val_loss": 6833060.0} {"train_loss": -24.7575626373291, "global_step": 263359, "epoch": 3173} {"train_loss": -25.077817916870117, "global_step": 263360, "epoch": 3173} {"train_loss": -24.717056274414062, "global_step": 263361, "epoch": 3173} {"train_loss": -24.94662094116211, "global_step": 263362, "epoch": 3173} {"train_loss": -24.915023803710938, "global_step": 263363, "epoch": 3173} {"train_loss": -24.779438018798828, "global_step": 263364, "epoch": 3173} {"train_loss": -25.11408805847168, "global_step": 263365, "epoch": 3173} {"train_loss": -25.055952072143555, "global_step": 263366, "epoch": 3173} {"train_loss": -25.313566207885742, "global_step": 263367, "epoch": 3173} {"train_loss": -25.085067749023438, "global_step": 263368, "epoch": 3173} {"train_loss": -25.1591796875, "global_step": 263369, "epoch": 3173} {"train_loss": -24.90431022644043, "global_step": 263370, "epoch": 3173} {"train_loss": -25.001312255859375, "global_step": 263371, "epoch": 3173} {"train_loss": -24.98365592956543, "global_step": 263372, "epoch": 3173} {"train_loss": -24.819137573242188, "global_step": 263373, "epoch": 3173} {"train_loss": -25.201967239379883, "global_step": 263374, "epoch": 3173} {"train_loss": -25.0979061126709, "global_step": 263375, "epoch": 3173} {"train_loss": -24.92075538635254, "global_step": 263376, "epoch": 3173} {"train_loss": -24.935514450073242, "global_step": 263377, "epoch": 3173} {"train_loss": -25.4808406829834, "global_step": 263378, "epoch": 3173} {"train_loss": -25.515960693359375, "global_step": 263379, "epoch": 3173} {"train_loss": -24.9442195892334, "global_step": 263380, "epoch": 3173} {"train_loss": -25.384143829345703, "global_step": 263381, "epoch": 3173} {"train_loss": -24.996549606323242, "global_step": 263382, "epoch": 3173} {"train_loss": -25.1628360748291, "global_step": 263383, "epoch": 3173} {"train_loss": -25.41458511352539, "global_step": 263384, "epoch": 3173} {"train_loss": -25.330589294433594, "global_step": 263385, "epoch": 3173} {"train_loss": -25.293338775634766, "global_step": 263386, "epoch": 3173} {"train_loss": -24.958452224731445, "global_step": 263387, "epoch": 3173} {"train_loss": -24.829086303710938, "global_step": 263388, "epoch": 3173} {"train_loss": -25.297964096069336, "global_step": 263389, "epoch": 3173} {"train_loss": -25.305540084838867, "global_step": 263390, "epoch": 3173} {"train_loss": -25.03701400756836, "global_step": 263391, "epoch": 3173} {"train_loss": -24.882402420043945, "global_step": 263392, "epoch": 3173} {"train_loss": -25.02908706665039, "global_step": 263393, "epoch": 3173} {"train_loss": -25.128265380859375, "global_step": 263394, "epoch": 3173} {"train_loss": -25.114301681518555, "global_step": 263395, "epoch": 3173} {"train_loss": -25.050931930541992, "global_step": 263396, "epoch": 3173} {"train_loss": -25.487415313720703, "global_step": 263397, "epoch": 3173} {"train_loss": -25.64357566833496, "global_step": 263398, "epoch": 3173} {"train_loss": -25.186704635620117, "global_step": 263399, "epoch": 3173} {"train_loss": -24.954774856567383, "global_step": 263400, "epoch": 3173} {"train_loss": -25.325037002563477, "global_step": 263401, "epoch": 3173} {"train_loss": -25.10608673095703, "global_step": 263402, "epoch": 3173} {"train_loss": -25.048765182495117, "global_step": 263403, "epoch": 3173} {"train_loss": -25.151538848876953, "global_step": 263404, "epoch": 3173} {"train_loss": -25.11787223815918, "global_step": 263405, "epoch": 3173} {"train_loss": -25.171283721923828, "global_step": 263406, "epoch": 3173} {"train_loss": -25.283884048461914, "global_step": 263407, "epoch": 3173} {"train_loss": -25.104450225830078, "global_step": 263408, "epoch": 3173} {"train_loss": -24.895849227905273, "global_step": 263409, "epoch": 3173} {"train_loss": -25.095197677612305, "global_step": 263410, "epoch": 3173} {"train_loss": -25.074203491210938, "global_step": 263411, "epoch": 3173} {"train_loss": -25.557443618774414, "global_step": 263412, "epoch": 3173} {"train_loss": -25.132688522338867, "global_step": 263413, "epoch": 3173} {"train_loss": -25.35219383239746, "global_step": 263414, "epoch": 3173} {"train_loss": -25.210840225219727, "global_step": 263415, "epoch": 3173} {"train_loss": -25.50886344909668, "global_step": 263416, "epoch": 3173} {"train_loss": -25.58683204650879, "global_step": 263417, "epoch": 3173} {"train_loss": -25.135955810546875, "global_step": 263418, "epoch": 3173} {"train_loss": -25.222530364990234, "global_step": 263419, "epoch": 3173} {"train_loss": -25.23689842224121, "global_step": 263420, "epoch": 3173} {"train_loss": -25.158004760742188, "global_step": 263421, "epoch": 3173} {"train_loss": -25.307077407836914, "global_step": 263422, "epoch": 3173} {"train_loss": -25.306304931640625, "global_step": 263423, "epoch": 3173} {"train_loss": -24.955854415893555, "global_step": 263424, "epoch": 3173} {"train_loss": -25.5257568359375, "global_step": 263425, "epoch": 3173} {"train_loss": -25.34819984436035, "global_step": 263426, "epoch": 3173} {"train_loss": -25.27280044555664, "global_step": 263427, "epoch": 3173} {"train_loss": -24.7424373626709, "global_step": 263428, "epoch": 3173} {"train_loss": -25.399261474609375, "global_step": 263429, "epoch": 3173} {"train_loss": -25.275060653686523, "global_step": 263430, "epoch": 3173} {"train_loss": -25.49234390258789, "global_step": 263431, "epoch": 3173} {"train_loss": -24.59980583190918, "global_step": 263432, "epoch": 3173} {"train_loss": -25.27489471435547, "global_step": 263433, "epoch": 3173} {"train_loss": -24.72442626953125, "global_step": 263434, "epoch": 3173} {"train_loss": -24.845359802246094, "global_step": 263435, "epoch": 3173} {"train_loss": -24.972869873046875, "global_step": 263436, "epoch": 3173} {"train_loss": -25.13461685180664, "global_step": 263437, "epoch": 3173} {"train_loss": -24.788373947143555, "global_step": 263438, "epoch": 3173} {"train_loss": -25.094125747680664, "global_step": 263439, "epoch": 3173} {"train_loss": -25.448484420776367, "global_step": 263440, "epoch": 3173} {"train_loss": -25.149943041514202, "global_step": 263441, "epoch": 3173, "val_loss": 7134983.5} {"train_loss": -24.522449493408203, "global_step": 263442, "epoch": 3174} {"train_loss": -24.57752799987793, "global_step": 263443, "epoch": 3174} {"train_loss": -24.861379623413086, "global_step": 263444, "epoch": 3174} {"train_loss": -24.6462345123291, "global_step": 263445, "epoch": 3174} {"train_loss": -24.763446807861328, "global_step": 263446, "epoch": 3174} {"train_loss": -24.731536865234375, "global_step": 263447, "epoch": 3174} {"train_loss": -24.637235641479492, "global_step": 263448, "epoch": 3174} {"train_loss": -24.895307540893555, "global_step": 263449, "epoch": 3174} {"train_loss": -25.208227157592773, "global_step": 263450, "epoch": 3174} {"train_loss": -24.714595794677734, "global_step": 263451, "epoch": 3174} {"train_loss": -24.670867919921875, "global_step": 263452, "epoch": 3174} {"train_loss": -25.311145782470703, "global_step": 263453, "epoch": 3174} {"train_loss": -25.20902442932129, "global_step": 263454, "epoch": 3174} {"train_loss": -25.030912399291992, "global_step": 263455, "epoch": 3174} {"train_loss": -24.961427688598633, "global_step": 263456, "epoch": 3174} {"train_loss": -25.237003326416016, "global_step": 263457, "epoch": 3174} {"train_loss": -25.159658432006836, "global_step": 263458, "epoch": 3174} {"train_loss": -24.89651870727539, "global_step": 263459, "epoch": 3174} {"train_loss": -24.973745346069336, "global_step": 263460, "epoch": 3174} {"train_loss": -25.0584659576416, "global_step": 263461, "epoch": 3174} {"train_loss": -25.361562728881836, "global_step": 263462, "epoch": 3174} {"train_loss": -25.377174377441406, "global_step": 263463, "epoch": 3174} {"train_loss": -25.050033569335938, "global_step": 263464, "epoch": 3174} {"train_loss": -25.086164474487305, "global_step": 263465, "epoch": 3174} {"train_loss": -25.408903121948242, "global_step": 263466, "epoch": 3174} {"train_loss": -25.052637100219727, "global_step": 263467, "epoch": 3174} {"train_loss": -25.393726348876953, "global_step": 263468, "epoch": 3174} {"train_loss": -25.257465362548828, "global_step": 263469, "epoch": 3174} {"train_loss": -25.17344856262207, "global_step": 263470, "epoch": 3174} {"train_loss": -25.21172523498535, "global_step": 263471, "epoch": 3174} {"train_loss": -24.912940979003906, "global_step": 263472, "epoch": 3174} {"train_loss": -24.842512130737305, "global_step": 263473, "epoch": 3174} {"train_loss": -25.189844131469727, "global_step": 263474, "epoch": 3174} {"train_loss": -25.49050521850586, "global_step": 263475, "epoch": 3174} {"train_loss": -25.402015686035156, "global_step": 263476, "epoch": 3174} {"train_loss": -25.217082977294922, "global_step": 263477, "epoch": 3174} {"train_loss": -25.309751510620117, "global_step": 263478, "epoch": 3174} {"train_loss": -24.97095489501953, "global_step": 263479, "epoch": 3174} {"train_loss": -25.33164405822754, "global_step": 263480, "epoch": 3174} {"train_loss": -25.162084579467773, "global_step": 263481, "epoch": 3174} {"train_loss": -25.360864639282227, "global_step": 263482, "epoch": 3174} {"train_loss": -25.306459426879883, "global_step": 263483, "epoch": 3174} {"train_loss": -25.304563522338867, "global_step": 263484, "epoch": 3174} {"train_loss": -25.51140594482422, "global_step": 263485, "epoch": 3174} {"train_loss": -25.50971031188965, "global_step": 263486, "epoch": 3174} {"train_loss": -25.330642700195312, "global_step": 263487, "epoch": 3174} {"train_loss": -24.713638305664062, "global_step": 263488, "epoch": 3174} {"train_loss": -24.545392990112305, "global_step": 263489, "epoch": 3174} {"train_loss": -25.056198120117188, "global_step": 263490, "epoch": 3174} {"train_loss": -25.13878059387207, "global_step": 263491, "epoch": 3174} {"train_loss": -25.11865234375, "global_step": 263492, "epoch": 3174} {"train_loss": -25.56801414489746, "global_step": 263493, "epoch": 3174} {"train_loss": -25.39442253112793, "global_step": 263494, "epoch": 3174} {"train_loss": -24.797809600830078, "global_step": 263495, "epoch": 3174} {"train_loss": -24.910818099975586, "global_step": 263496, "epoch": 3174} {"train_loss": -25.24717140197754, "global_step": 263497, "epoch": 3174} {"train_loss": -25.47264862060547, "global_step": 263498, "epoch": 3174} {"train_loss": -25.27444839477539, "global_step": 263499, "epoch": 3174} {"train_loss": -25.549707412719727, "global_step": 263500, "epoch": 3174} {"train_loss": -25.39487648010254, "global_step": 263501, "epoch": 3174} {"train_loss": -25.32355308532715, "global_step": 263502, "epoch": 3174} {"train_loss": -25.273605346679688, "global_step": 263503, "epoch": 3174} {"train_loss": -25.306400299072266, "global_step": 263504, "epoch": 3174} {"train_loss": -25.06572914123535, "global_step": 263505, "epoch": 3174} {"train_loss": -25.276243209838867, "global_step": 263506, "epoch": 3174} {"train_loss": -25.217205047607422, "global_step": 263507, "epoch": 3174} {"train_loss": -25.35951805114746, "global_step": 263508, "epoch": 3174} {"train_loss": -25.293272018432617, "global_step": 263509, "epoch": 3174} {"train_loss": -25.017847061157227, "global_step": 263510, "epoch": 3174} {"train_loss": -25.455472946166992, "global_step": 263511, "epoch": 3174} {"train_loss": -25.376131057739258, "global_step": 263512, "epoch": 3174} {"train_loss": -25.456275939941406, "global_step": 263513, "epoch": 3174} {"train_loss": -25.318479537963867, "global_step": 263514, "epoch": 3174} {"train_loss": -25.582666397094727, "global_step": 263515, "epoch": 3174} {"train_loss": -25.125322341918945, "global_step": 263516, "epoch": 3174} {"train_loss": -25.150846481323242, "global_step": 263517, "epoch": 3174} {"train_loss": -25.23529815673828, "global_step": 263518, "epoch": 3174} {"train_loss": -24.762187957763672, "global_step": 263519, "epoch": 3174} {"train_loss": -25.34990882873535, "global_step": 263520, "epoch": 3174} {"train_loss": -25.255481719970703, "global_step": 263521, "epoch": 3174} {"train_loss": -24.751113891601562, "global_step": 263522, "epoch": 3174} {"train_loss": -25.021421432495117, "global_step": 263523, "epoch": 3174} {"train_loss": -25.141611237123787, "global_step": 263524, "epoch": 3174, "val_loss": 6904973.0} {"train_loss": -24.8143310546875, "global_step": 263525, "epoch": 3175} {"train_loss": -24.5095272064209, "global_step": 263526, "epoch": 3175} {"train_loss": -24.993696212768555, "global_step": 263527, "epoch": 3175} {"train_loss": -24.87501335144043, "global_step": 263528, "epoch": 3175} {"train_loss": -24.385814666748047, "global_step": 263529, "epoch": 3175} {"train_loss": -24.236169815063477, "global_step": 263530, "epoch": 3175} {"train_loss": -24.39229393005371, "global_step": 263531, "epoch": 3175} {"train_loss": -24.805904388427734, "global_step": 263532, "epoch": 3175} {"train_loss": -24.5075740814209, "global_step": 263533, "epoch": 3175} {"train_loss": -24.558164596557617, "global_step": 263534, "epoch": 3175} {"train_loss": -24.781585693359375, "global_step": 263535, "epoch": 3175} {"train_loss": -24.867231369018555, "global_step": 263536, "epoch": 3175} {"train_loss": -24.734256744384766, "global_step": 263537, "epoch": 3175} {"train_loss": -24.338788986206055, "global_step": 263538, "epoch": 3175} {"train_loss": -24.509952545166016, "global_step": 263539, "epoch": 3175} {"train_loss": -24.710107803344727, "global_step": 263540, "epoch": 3175} {"train_loss": -24.48465919494629, "global_step": 263541, "epoch": 3175} {"train_loss": -24.45888328552246, "global_step": 263542, "epoch": 3175} {"train_loss": -24.561599731445312, "global_step": 263543, "epoch": 3175} {"train_loss": -24.7388973236084, "global_step": 263544, "epoch": 3175} {"train_loss": -24.695941925048828, "global_step": 263545, "epoch": 3175} {"train_loss": -24.741567611694336, "global_step": 263546, "epoch": 3175} {"train_loss": -24.97132682800293, "global_step": 263547, "epoch": 3175} {"train_loss": -25.00257682800293, "global_step": 263548, "epoch": 3175} {"train_loss": -25.019153594970703, "global_step": 263549, "epoch": 3175} {"train_loss": -24.98050308227539, "global_step": 263550, "epoch": 3175} {"train_loss": -25.33223533630371, "global_step": 263551, "epoch": 3175} {"train_loss": -25.21290397644043, "global_step": 263552, "epoch": 3175} {"train_loss": -25.060163497924805, "global_step": 263553, "epoch": 3175} {"train_loss": -25.156991958618164, "global_step": 263554, "epoch": 3175} {"train_loss": -25.146560668945312, "global_step": 263555, "epoch": 3175} {"train_loss": -25.112058639526367, "global_step": 263556, "epoch": 3175} {"train_loss": -25.146472930908203, "global_step": 263557, "epoch": 3175} {"train_loss": -25.205354690551758, "global_step": 263558, "epoch": 3175} {"train_loss": -25.30864143371582, "global_step": 263559, "epoch": 3175} {"train_loss": -25.175933837890625, "global_step": 263560, "epoch": 3175} {"train_loss": -25.27029037475586, "global_step": 263561, "epoch": 3175} {"train_loss": -25.1492977142334, "global_step": 263562, "epoch": 3175} {"train_loss": -25.244375228881836, "global_step": 263563, "epoch": 3175} {"train_loss": -25.020383834838867, "global_step": 263564, "epoch": 3175} {"train_loss": -25.151823043823242, "global_step": 263565, "epoch": 3175} {"train_loss": -25.10615348815918, "global_step": 263566, "epoch": 3175} {"train_loss": -25.558265686035156, "global_step": 263567, "epoch": 3175} {"train_loss": -25.06838035583496, "global_step": 263568, "epoch": 3175} {"train_loss": -25.357192993164062, "global_step": 263569, "epoch": 3175} {"train_loss": -25.320327758789062, "global_step": 263570, "epoch": 3175} {"train_loss": -25.342111587524414, "global_step": 263571, "epoch": 3175} {"train_loss": -25.236343383789062, "global_step": 263572, "epoch": 3175} {"train_loss": -25.272483825683594, "global_step": 263573, "epoch": 3175} {"train_loss": -25.10581398010254, "global_step": 263574, "epoch": 3175} {"train_loss": -25.404207229614258, "global_step": 263575, "epoch": 3175} {"train_loss": -24.95331573486328, "global_step": 263576, "epoch": 3175} {"train_loss": -25.245277404785156, "global_step": 263577, "epoch": 3175} {"train_loss": -25.52845573425293, "global_step": 263578, "epoch": 3175} {"train_loss": -25.153221130371094, "global_step": 263579, "epoch": 3175} {"train_loss": -25.47871971130371, "global_step": 263580, "epoch": 3175} {"train_loss": -25.359703063964844, "global_step": 263581, "epoch": 3175} {"train_loss": -24.927082061767578, "global_step": 263582, "epoch": 3175} {"train_loss": -25.008630752563477, "global_step": 263583, "epoch": 3175} {"train_loss": -25.6484375, "global_step": 263584, "epoch": 3175} {"train_loss": -25.048908233642578, "global_step": 263585, "epoch": 3175} {"train_loss": -24.804052352905273, "global_step": 263586, "epoch": 3175} {"train_loss": -25.57086753845215, "global_step": 263587, "epoch": 3175} {"train_loss": -25.208580017089844, "global_step": 263588, "epoch": 3175} {"train_loss": -25.406253814697266, "global_step": 263589, "epoch": 3175} {"train_loss": -25.183149337768555, "global_step": 263590, "epoch": 3175} {"train_loss": -24.915441513061523, "global_step": 263591, "epoch": 3175} {"train_loss": -25.193843841552734, "global_step": 263592, "epoch": 3175} {"train_loss": -25.071575164794922, "global_step": 263593, "epoch": 3175} {"train_loss": -25.164775848388672, "global_step": 263594, "epoch": 3175} {"train_loss": -25.160400390625, "global_step": 263595, "epoch": 3175} {"train_loss": -25.212148666381836, "global_step": 263596, "epoch": 3175} {"train_loss": -25.341373443603516, "global_step": 263597, "epoch": 3175} {"train_loss": -25.143943786621094, "global_step": 263598, "epoch": 3175} {"train_loss": -24.934703826904297, "global_step": 263599, "epoch": 3175} {"train_loss": -25.313064575195312, "global_step": 263600, "epoch": 3175} {"train_loss": -25.081329345703125, "global_step": 263601, "epoch": 3175} {"train_loss": -25.51972770690918, "global_step": 263602, "epoch": 3175} {"train_loss": -25.581005096435547, "global_step": 263603, "epoch": 3175} {"train_loss": -25.20576286315918, "global_step": 263604, "epoch": 3175} {"train_loss": -25.418245315551758, "global_step": 263605, "epoch": 3175} {"train_loss": -25.40314483642578, "global_step": 263606, "epoch": 3175} {"train_loss": -25.035811757466877, "global_step": 263607, "epoch": 3175, "val_loss": 6913457.0} {"train_loss": -24.595306396484375, "global_step": 263608, "epoch": 3176} {"train_loss": -24.890165328979492, "global_step": 263609, "epoch": 3176} {"train_loss": -24.330188751220703, "global_step": 263610, "epoch": 3176} {"train_loss": -24.706045150756836, "global_step": 263611, "epoch": 3176} {"train_loss": -24.680654525756836, "global_step": 263612, "epoch": 3176} {"train_loss": -24.917667388916016, "global_step": 263613, "epoch": 3176} {"train_loss": -25.53438949584961, "global_step": 263614, "epoch": 3176} {"train_loss": -24.97824478149414, "global_step": 263615, "epoch": 3176} {"train_loss": -24.344179153442383, "global_step": 263616, "epoch": 3176} {"train_loss": -25.20400619506836, "global_step": 263617, "epoch": 3176} {"train_loss": -24.49045753479004, "global_step": 263618, "epoch": 3176} {"train_loss": -24.91676139831543, "global_step": 263619, "epoch": 3176} {"train_loss": -25.240562438964844, "global_step": 263620, "epoch": 3176} {"train_loss": -25.142086029052734, "global_step": 263621, "epoch": 3176} {"train_loss": -24.931472778320312, "global_step": 263622, "epoch": 3176} {"train_loss": -25.160131454467773, "global_step": 263623, "epoch": 3176} {"train_loss": -24.99666404724121, "global_step": 263624, "epoch": 3176} {"train_loss": -24.809019088745117, "global_step": 263625, "epoch": 3176} {"train_loss": -24.913923263549805, "global_step": 263626, "epoch": 3176} {"train_loss": -24.961267471313477, "global_step": 263627, "epoch": 3176} {"train_loss": -25.41455841064453, "global_step": 263628, "epoch": 3176} {"train_loss": -24.868818283081055, "global_step": 263629, "epoch": 3176} {"train_loss": -25.297182083129883, "global_step": 263630, "epoch": 3176} {"train_loss": -25.42902946472168, "global_step": 263631, "epoch": 3176} {"train_loss": -25.329084396362305, "global_step": 263632, "epoch": 3176} {"train_loss": -24.98366928100586, "global_step": 263633, "epoch": 3176} {"train_loss": -25.33562469482422, "global_step": 263634, "epoch": 3176} {"train_loss": -25.01654624938965, "global_step": 263635, "epoch": 3176} {"train_loss": -24.81184196472168, "global_step": 263636, "epoch": 3176} {"train_loss": -25.050321578979492, "global_step": 263637, "epoch": 3176} {"train_loss": -25.321334838867188, "global_step": 263638, "epoch": 3176} {"train_loss": -25.491174697875977, "global_step": 263639, "epoch": 3176} {"train_loss": -25.298128128051758, "global_step": 263640, "epoch": 3176} {"train_loss": -25.179868698120117, "global_step": 263641, "epoch": 3176} {"train_loss": -25.24595832824707, "global_step": 263642, "epoch": 3176} {"train_loss": -25.53854751586914, "global_step": 263643, "epoch": 3176} {"train_loss": -24.83325958251953, "global_step": 263644, "epoch": 3176} {"train_loss": -24.973346710205078, "global_step": 263645, "epoch": 3176} {"train_loss": -25.745014190673828, "global_step": 263646, "epoch": 3176} {"train_loss": -25.181167602539062, "global_step": 263647, "epoch": 3176} {"train_loss": -25.508548736572266, "global_step": 263648, "epoch": 3176} {"train_loss": -25.387773513793945, "global_step": 263649, "epoch": 3176} {"train_loss": -25.070533752441406, "global_step": 263650, "epoch": 3176} {"train_loss": -25.551694869995117, "global_step": 263651, "epoch": 3176} {"train_loss": -25.340145111083984, "global_step": 263652, "epoch": 3176} {"train_loss": -25.257863998413086, "global_step": 263653, "epoch": 3176} {"train_loss": -25.3685302734375, "global_step": 263654, "epoch": 3176} {"train_loss": -25.16258430480957, "global_step": 263655, "epoch": 3176} {"train_loss": -25.109100341796875, "global_step": 263656, "epoch": 3176} {"train_loss": -25.33717155456543, "global_step": 263657, "epoch": 3176} {"train_loss": -25.30792808532715, "global_step": 263658, "epoch": 3176} {"train_loss": -25.518280029296875, "global_step": 263659, "epoch": 3176} {"train_loss": -25.483142852783203, "global_step": 263660, "epoch": 3176} {"train_loss": -25.07187271118164, "global_step": 263661, "epoch": 3176} {"train_loss": -24.891530990600586, "global_step": 263662, "epoch": 3176} {"train_loss": -24.724014282226562, "global_step": 263663, "epoch": 3176} {"train_loss": -25.3280029296875, "global_step": 263664, "epoch": 3176} {"train_loss": -25.072805404663086, "global_step": 263665, "epoch": 3176} {"train_loss": -24.893489837646484, "global_step": 263666, "epoch": 3176} {"train_loss": -25.64630699157715, "global_step": 263667, "epoch": 3176} {"train_loss": -25.159069061279297, "global_step": 263668, "epoch": 3176} {"train_loss": -25.113525390625, "global_step": 263669, "epoch": 3176} {"train_loss": -25.399574279785156, "global_step": 263670, "epoch": 3176} {"train_loss": -25.641305923461914, "global_step": 263671, "epoch": 3176} {"train_loss": -24.801925659179688, "global_step": 263672, "epoch": 3176} {"train_loss": -24.977088928222656, "global_step": 263673, "epoch": 3176} {"train_loss": -25.2398738861084, "global_step": 263674, "epoch": 3176} {"train_loss": -25.328144073486328, "global_step": 263675, "epoch": 3176} {"train_loss": -25.212034225463867, "global_step": 263676, "epoch": 3176} {"train_loss": -25.53814697265625, "global_step": 263677, "epoch": 3176} {"train_loss": -25.219511032104492, "global_step": 263678, "epoch": 3176} {"train_loss": -25.520902633666992, "global_step": 263679, "epoch": 3176} {"train_loss": -25.208881378173828, "global_step": 263680, "epoch": 3176} {"train_loss": -25.306753158569336, "global_step": 263681, "epoch": 3176} {"train_loss": -24.99422264099121, "global_step": 263682, "epoch": 3176} {"train_loss": -25.165884017944336, "global_step": 263683, "epoch": 3176} {"train_loss": -25.348894119262695, "global_step": 263684, "epoch": 3176} {"train_loss": -25.536060333251953, "global_step": 263685, "epoch": 3176} {"train_loss": -25.25612449645996, "global_step": 263686, "epoch": 3176} {"train_loss": -25.173202514648438, "global_step": 263687, "epoch": 3176} {"train_loss": -25.341312408447266, "global_step": 263688, "epoch": 3176} {"train_loss": -25.340478897094727, "global_step": 263689, "epoch": 3176} {"train_loss": -25.15267110158162, "global_step": 263690, "epoch": 3176, "val_loss": 6915619.0} {"train_loss": -24.913578033447266, "global_step": 263691, "epoch": 3177} {"train_loss": -24.771949768066406, "global_step": 263692, "epoch": 3177} {"train_loss": -24.39891815185547, "global_step": 263693, "epoch": 3177} {"train_loss": -24.693328857421875, "global_step": 263694, "epoch": 3177} {"train_loss": -24.627033233642578, "global_step": 263695, "epoch": 3177} {"train_loss": -24.48616600036621, "global_step": 263696, "epoch": 3177} {"train_loss": -24.922439575195312, "global_step": 263697, "epoch": 3177} {"train_loss": -24.724897384643555, "global_step": 263698, "epoch": 3177} {"train_loss": -25.02971839904785, "global_step": 263699, "epoch": 3177} {"train_loss": -24.967981338500977, "global_step": 263700, "epoch": 3177} {"train_loss": -24.74191665649414, "global_step": 263701, "epoch": 3177} {"train_loss": -25.01180076599121, "global_step": 263702, "epoch": 3177} {"train_loss": -24.816822052001953, "global_step": 263703, "epoch": 3177} {"train_loss": -25.41400718688965, "global_step": 263704, "epoch": 3177} {"train_loss": -24.805145263671875, "global_step": 263705, "epoch": 3177} {"train_loss": -24.77130699157715, "global_step": 263706, "epoch": 3177} {"train_loss": -25.147659301757812, "global_step": 263707, "epoch": 3177} {"train_loss": -25.02496910095215, "global_step": 263708, "epoch": 3177} {"train_loss": -25.370227813720703, "global_step": 263709, "epoch": 3177} {"train_loss": -24.938995361328125, "global_step": 263710, "epoch": 3177} {"train_loss": -25.044397354125977, "global_step": 263711, "epoch": 3177} {"train_loss": -24.964651107788086, "global_step": 263712, "epoch": 3177} {"train_loss": -24.944055557250977, "global_step": 263713, "epoch": 3177} {"train_loss": -25.317832946777344, "global_step": 263714, "epoch": 3177} {"train_loss": -25.384708404541016, "global_step": 263715, "epoch": 3177} {"train_loss": -25.196548461914062, "global_step": 263716, "epoch": 3177} {"train_loss": -25.166194915771484, "global_step": 263717, "epoch": 3177} {"train_loss": -25.4536075592041, "global_step": 263718, "epoch": 3177} {"train_loss": -25.37701988220215, "global_step": 263719, "epoch": 3177} {"train_loss": -25.183429718017578, "global_step": 263720, "epoch": 3177} {"train_loss": -25.485708236694336, "global_step": 263721, "epoch": 3177} {"train_loss": -25.278518676757812, "global_step": 263722, "epoch": 3177} {"train_loss": -25.107046127319336, "global_step": 263723, "epoch": 3177} {"train_loss": -25.276304244995117, "global_step": 263724, "epoch": 3177} {"train_loss": -25.279794692993164, "global_step": 263725, "epoch": 3177} {"train_loss": -25.54085350036621, "global_step": 263726, "epoch": 3177} {"train_loss": -25.424293518066406, "global_step": 263727, "epoch": 3177} {"train_loss": -24.829086303710938, "global_step": 263728, "epoch": 3177} {"train_loss": -25.325525283813477, "global_step": 263729, "epoch": 3177} {"train_loss": -25.260372161865234, "global_step": 263730, "epoch": 3177} {"train_loss": -25.116491317749023, "global_step": 263731, "epoch": 3177} {"train_loss": -25.050573348999023, "global_step": 263732, "epoch": 3177} {"train_loss": -25.233570098876953, "global_step": 263733, "epoch": 3177} {"train_loss": -24.945356369018555, "global_step": 263734, "epoch": 3177} {"train_loss": -24.754104614257812, "global_step": 263735, "epoch": 3177} {"train_loss": -24.940536499023438, "global_step": 263736, "epoch": 3177} {"train_loss": -25.172719955444336, "global_step": 263737, "epoch": 3177} {"train_loss": -25.088748931884766, "global_step": 263738, "epoch": 3177} {"train_loss": -25.23811149597168, "global_step": 263739, "epoch": 3177} {"train_loss": -24.99225425720215, "global_step": 263740, "epoch": 3177} {"train_loss": -24.99135398864746, "global_step": 263741, "epoch": 3177} {"train_loss": -25.2977294921875, "global_step": 263742, "epoch": 3177} {"train_loss": -25.108091354370117, "global_step": 263743, "epoch": 3177} {"train_loss": -25.216318130493164, "global_step": 263744, "epoch": 3177} {"train_loss": -25.069793701171875, "global_step": 263745, "epoch": 3177} {"train_loss": -25.317768096923828, "global_step": 263746, "epoch": 3177} {"train_loss": -25.325767517089844, "global_step": 263747, "epoch": 3177} {"train_loss": -25.317066192626953, "global_step": 263748, "epoch": 3177} {"train_loss": -25.199344635009766, "global_step": 263749, "epoch": 3177} {"train_loss": -25.60441017150879, "global_step": 263750, "epoch": 3177} {"train_loss": -25.182931900024414, "global_step": 263751, "epoch": 3177} {"train_loss": -24.813833236694336, "global_step": 263752, "epoch": 3177} {"train_loss": -25.097883224487305, "global_step": 263753, "epoch": 3177} {"train_loss": -24.986873626708984, "global_step": 263754, "epoch": 3177} {"train_loss": -25.320032119750977, "global_step": 263755, "epoch": 3177} {"train_loss": -25.363906860351562, "global_step": 263756, "epoch": 3177} {"train_loss": -25.134000778198242, "global_step": 263757, "epoch": 3177} {"train_loss": -25.347415924072266, "global_step": 263758, "epoch": 3177} {"train_loss": -25.581708908081055, "global_step": 263759, "epoch": 3177} {"train_loss": -25.331357955932617, "global_step": 263760, "epoch": 3177} {"train_loss": -25.297698974609375, "global_step": 263761, "epoch": 3177} {"train_loss": -25.171707153320312, "global_step": 263762, "epoch": 3177} {"train_loss": -25.15478515625, "global_step": 263763, "epoch": 3177} {"train_loss": -25.45660400390625, "global_step": 263764, "epoch": 3177} {"train_loss": -25.08109474182129, "global_step": 263765, "epoch": 3177} {"train_loss": -25.274246215820312, "global_step": 263766, "epoch": 3177} {"train_loss": -25.362411499023438, "global_step": 263767, "epoch": 3177} {"train_loss": -25.016759872436523, "global_step": 263768, "epoch": 3177} {"train_loss": -25.40988540649414, "global_step": 263769, "epoch": 3177} {"train_loss": -25.67719078063965, "global_step": 263770, "epoch": 3177} {"train_loss": -25.431869506835938, "global_step": 263771, "epoch": 3177} {"train_loss": -25.57328224182129, "global_step": 263772, "epoch": 3177} {"train_loss": -25.160149746630566, "global_step": 263773, "epoch": 3177, "val_loss": 6930981.0} {"train_loss": -25.05805778503418, "global_step": 263774, "epoch": 3178} {"train_loss": -24.775012969970703, "global_step": 263775, "epoch": 3178} {"train_loss": -25.025794982910156, "global_step": 263776, "epoch": 3178} {"train_loss": -24.890100479125977, "global_step": 263777, "epoch": 3178} {"train_loss": -25.257047653198242, "global_step": 263778, "epoch": 3178} {"train_loss": -24.84467887878418, "global_step": 263779, "epoch": 3178} {"train_loss": -24.22565269470215, "global_step": 263780, "epoch": 3178} {"train_loss": -24.15334129333496, "global_step": 263781, "epoch": 3178} {"train_loss": -23.590421676635742, "global_step": 263782, "epoch": 3178} {"train_loss": -24.40081214904785, "global_step": 263783, "epoch": 3178} {"train_loss": -24.99555778503418, "global_step": 263784, "epoch": 3178} {"train_loss": -24.442947387695312, "global_step": 263785, "epoch": 3178} {"train_loss": -24.404088973999023, "global_step": 263786, "epoch": 3178} {"train_loss": -24.484500885009766, "global_step": 263787, "epoch": 3178} {"train_loss": -25.225454330444336, "global_step": 263788, "epoch": 3178} {"train_loss": -24.2728214263916, "global_step": 263789, "epoch": 3178} {"train_loss": -24.906620025634766, "global_step": 263790, "epoch": 3178} {"train_loss": -24.710655212402344, "global_step": 263791, "epoch": 3178} {"train_loss": -24.8449764251709, "global_step": 263792, "epoch": 3178} {"train_loss": -25.069719314575195, "global_step": 263793, "epoch": 3178} {"train_loss": -24.579742431640625, "global_step": 263794, "epoch": 3178} {"train_loss": -24.655080795288086, "global_step": 263795, "epoch": 3178} {"train_loss": -24.87958335876465, "global_step": 263796, "epoch": 3178} {"train_loss": -25.1254940032959, "global_step": 263797, "epoch": 3178} {"train_loss": -25.193687438964844, "global_step": 263798, "epoch": 3178} {"train_loss": -24.964040756225586, "global_step": 263799, "epoch": 3178} {"train_loss": -24.52182388305664, "global_step": 263800, "epoch": 3178} {"train_loss": -25.076263427734375, "global_step": 263801, "epoch": 3178} {"train_loss": -25.28290367126465, "global_step": 263802, "epoch": 3178} {"train_loss": -25.048059463500977, "global_step": 263803, "epoch": 3178} {"train_loss": -25.183364868164062, "global_step": 263804, "epoch": 3178} {"train_loss": -25.050708770751953, "global_step": 263805, "epoch": 3178} {"train_loss": -24.960105895996094, "global_step": 263806, "epoch": 3178} {"train_loss": -25.10477066040039, "global_step": 263807, "epoch": 3178} {"train_loss": -25.174192428588867, "global_step": 263808, "epoch": 3178} {"train_loss": -24.983930587768555, "global_step": 263809, "epoch": 3178} {"train_loss": -25.252538681030273, "global_step": 263810, "epoch": 3178} {"train_loss": -25.208267211914062, "global_step": 263811, "epoch": 3178} {"train_loss": -25.00391387939453, "global_step": 263812, "epoch": 3178} {"train_loss": -25.256589889526367, "global_step": 263813, "epoch": 3178} {"train_loss": -25.518606185913086, "global_step": 263814, "epoch": 3178} {"train_loss": -24.830989837646484, "global_step": 263815, "epoch": 3178} {"train_loss": -25.476743698120117, "global_step": 263816, "epoch": 3178} {"train_loss": -25.139127731323242, "global_step": 263817, "epoch": 3178} {"train_loss": -25.320632934570312, "global_step": 263818, "epoch": 3178} {"train_loss": -25.264318466186523, "global_step": 263819, "epoch": 3178} {"train_loss": -24.88387680053711, "global_step": 263820, "epoch": 3178} {"train_loss": -25.268381118774414, "global_step": 263821, "epoch": 3178} {"train_loss": -25.09404182434082, "global_step": 263822, "epoch": 3178} {"train_loss": -25.19824981689453, "global_step": 263823, "epoch": 3178} {"train_loss": -25.25673484802246, "global_step": 263824, "epoch": 3178} {"train_loss": -24.984262466430664, "global_step": 263825, "epoch": 3178} {"train_loss": -25.26850128173828, "global_step": 263826, "epoch": 3178} {"train_loss": -25.340925216674805, "global_step": 263827, "epoch": 3178} {"train_loss": -25.687448501586914, "global_step": 263828, "epoch": 3178} {"train_loss": -25.52150535583496, "global_step": 263829, "epoch": 3178} {"train_loss": -25.590227127075195, "global_step": 263830, "epoch": 3178} {"train_loss": -25.614063262939453, "global_step": 263831, "epoch": 3178} {"train_loss": -25.252235412597656, "global_step": 263832, "epoch": 3178} {"train_loss": -25.375001907348633, "global_step": 263833, "epoch": 3178} {"train_loss": -25.103412628173828, "global_step": 263834, "epoch": 3178} {"train_loss": -25.148822784423828, "global_step": 263835, "epoch": 3178} {"train_loss": -25.245473861694336, "global_step": 263836, "epoch": 3178} {"train_loss": -25.438989639282227, "global_step": 263837, "epoch": 3178} {"train_loss": -25.237417221069336, "global_step": 263838, "epoch": 3178} {"train_loss": -25.474884033203125, "global_step": 263839, "epoch": 3178} {"train_loss": -25.23044204711914, "global_step": 263840, "epoch": 3178} {"train_loss": -25.064401626586914, "global_step": 263841, "epoch": 3178} {"train_loss": -25.148813247680664, "global_step": 263842, "epoch": 3178} {"train_loss": -25.20057487487793, "global_step": 263843, "epoch": 3178} {"train_loss": -24.977243423461914, "global_step": 263844, "epoch": 3178} {"train_loss": -25.16963005065918, "global_step": 263845, "epoch": 3178} {"train_loss": -25.189401626586914, "global_step": 263846, "epoch": 3178} {"train_loss": -25.100845336914062, "global_step": 263847, "epoch": 3178} {"train_loss": -25.142873764038086, "global_step": 263848, "epoch": 3178} {"train_loss": -25.31475257873535, "global_step": 263849, "epoch": 3178} {"train_loss": -25.192487716674805, "global_step": 263850, "epoch": 3178} {"train_loss": -25.540376663208008, "global_step": 263851, "epoch": 3178} {"train_loss": -25.268354415893555, "global_step": 263852, "epoch": 3178} {"train_loss": -25.09427833557129, "global_step": 263853, "epoch": 3178} {"train_loss": -24.780323028564453, "global_step": 263854, "epoch": 3178} {"train_loss": -25.10700798034668, "global_step": 263855, "epoch": 3178} {"train_loss": -25.067635869405354, "global_step": 263856, "epoch": 3178, "val_loss": 6975068.0} {"train_loss": -24.098684310913086, "global_step": 263857, "epoch": 3179} {"train_loss": -24.262786865234375, "global_step": 263858, "epoch": 3179} {"train_loss": -23.49445152282715, "global_step": 263859, "epoch": 3179} {"train_loss": -24.294347763061523, "global_step": 263860, "epoch": 3179} {"train_loss": -23.727231979370117, "global_step": 263861, "epoch": 3179} {"train_loss": -24.035776138305664, "global_step": 263862, "epoch": 3179} {"train_loss": -23.56793212890625, "global_step": 263863, "epoch": 3179} {"train_loss": -24.43692398071289, "global_step": 263864, "epoch": 3179} {"train_loss": -24.236494064331055, "global_step": 263865, "epoch": 3179} {"train_loss": -23.9442081451416, "global_step": 263866, "epoch": 3179} {"train_loss": -24.10761070251465, "global_step": 263867, "epoch": 3179} {"train_loss": -24.35889434814453, "global_step": 263868, "epoch": 3179} {"train_loss": -24.160037994384766, "global_step": 263869, "epoch": 3179} {"train_loss": -24.568422317504883, "global_step": 263870, "epoch": 3179} {"train_loss": -25.054197311401367, "global_step": 263871, "epoch": 3179} {"train_loss": -24.355802536010742, "global_step": 263872, "epoch": 3179} {"train_loss": -24.62033462524414, "global_step": 263873, "epoch": 3179} {"train_loss": -24.63727378845215, "global_step": 263874, "epoch": 3179} {"train_loss": -24.49774169921875, "global_step": 263875, "epoch": 3179} {"train_loss": -24.597898483276367, "global_step": 263876, "epoch": 3179} {"train_loss": -24.8016300201416, "global_step": 263877, "epoch": 3179} {"train_loss": -25.164710998535156, "global_step": 263878, "epoch": 3179} {"train_loss": -24.938966751098633, "global_step": 263879, "epoch": 3179} {"train_loss": -24.87172508239746, "global_step": 263880, "epoch": 3179} {"train_loss": -24.94856071472168, "global_step": 263881, "epoch": 3179} {"train_loss": -24.688709259033203, "global_step": 263882, "epoch": 3179} {"train_loss": -24.86017417907715, "global_step": 263883, "epoch": 3179} {"train_loss": -24.817480087280273, "global_step": 263884, "epoch": 3179} {"train_loss": -24.981008529663086, "global_step": 263885, "epoch": 3179} {"train_loss": -24.971603393554688, "global_step": 263886, "epoch": 3179} {"train_loss": -25.196910858154297, "global_step": 263887, "epoch": 3179} {"train_loss": -24.95808982849121, "global_step": 263888, "epoch": 3179} {"train_loss": -25.029071807861328, "global_step": 263889, "epoch": 3179} {"train_loss": -25.127588272094727, "global_step": 263890, "epoch": 3179} {"train_loss": -25.132474899291992, "global_step": 263891, "epoch": 3179} {"train_loss": -25.24167823791504, "global_step": 263892, "epoch": 3179} {"train_loss": -25.2227783203125, "global_step": 263893, "epoch": 3179} {"train_loss": -25.221378326416016, "global_step": 263894, "epoch": 3179} {"train_loss": -25.236547470092773, "global_step": 263895, "epoch": 3179} {"train_loss": -25.172712326049805, "global_step": 263896, "epoch": 3179} {"train_loss": -25.101505279541016, "global_step": 263897, "epoch": 3179} {"train_loss": -25.28083610534668, "global_step": 263898, "epoch": 3179} {"train_loss": -25.201108932495117, "global_step": 263899, "epoch": 3179} {"train_loss": -25.095260620117188, "global_step": 263900, "epoch": 3179} {"train_loss": -25.3037052154541, "global_step": 263901, "epoch": 3179} {"train_loss": -24.944202423095703, "global_step": 263902, "epoch": 3179} {"train_loss": -25.22520637512207, "global_step": 263903, "epoch": 3179} {"train_loss": -25.321744918823242, "global_step": 263904, "epoch": 3179} {"train_loss": -25.125198364257812, "global_step": 263905, "epoch": 3179} {"train_loss": -25.22281265258789, "global_step": 263906, "epoch": 3179} {"train_loss": -25.281679153442383, "global_step": 263907, "epoch": 3179} {"train_loss": -25.065656661987305, "global_step": 263908, "epoch": 3179} {"train_loss": -25.209447860717773, "global_step": 263909, "epoch": 3179} {"train_loss": -25.1856746673584, "global_step": 263910, "epoch": 3179} {"train_loss": -25.388219833374023, "global_step": 263911, "epoch": 3179} {"train_loss": -25.25038719177246, "global_step": 263912, "epoch": 3179} {"train_loss": -25.012807846069336, "global_step": 263913, "epoch": 3179} {"train_loss": -24.97475242614746, "global_step": 263914, "epoch": 3179} {"train_loss": -24.95572853088379, "global_step": 263915, "epoch": 3179} {"train_loss": -24.97603416442871, "global_step": 263916, "epoch": 3179} {"train_loss": -24.907861709594727, "global_step": 263917, "epoch": 3179} {"train_loss": -24.849897384643555, "global_step": 263918, "epoch": 3179} {"train_loss": -24.82381248474121, "global_step": 263919, "epoch": 3179} {"train_loss": -25.0350399017334, "global_step": 263920, "epoch": 3179} {"train_loss": -25.038713455200195, "global_step": 263921, "epoch": 3179} {"train_loss": -25.1016845703125, "global_step": 263922, "epoch": 3179} {"train_loss": -24.935697555541992, "global_step": 263923, "epoch": 3179} {"train_loss": -25.64569091796875, "global_step": 263924, "epoch": 3179} {"train_loss": -25.208444595336914, "global_step": 263925, "epoch": 3179} {"train_loss": -25.323040008544922, "global_step": 263926, "epoch": 3179} {"train_loss": -25.108137130737305, "global_step": 263927, "epoch": 3179} {"train_loss": -25.39032554626465, "global_step": 263928, "epoch": 3179} {"train_loss": -25.286619186401367, "global_step": 263929, "epoch": 3179} {"train_loss": -25.14231300354004, "global_step": 263930, "epoch": 3179} {"train_loss": -25.42683982849121, "global_step": 263931, "epoch": 3179} {"train_loss": -25.397520065307617, "global_step": 263932, "epoch": 3179} {"train_loss": -25.214439392089844, "global_step": 263933, "epoch": 3179} {"train_loss": -25.67473793029785, "global_step": 263934, "epoch": 3179} {"train_loss": -25.505102157592773, "global_step": 263935, "epoch": 3179} {"train_loss": -25.104942321777344, "global_step": 263936, "epoch": 3179} {"train_loss": -25.137388229370117, "global_step": 263937, "epoch": 3179} {"train_loss": -25.17149543762207, "global_step": 263938, "epoch": 3179} {"train_loss": -24.935394447970104, "global_step": 263939, "epoch": 3179, "val_loss": 6890866.0} {"train_loss": -24.31655502319336, "global_step": 263940, "epoch": 3180} {"train_loss": -24.629968643188477, "global_step": 263941, "epoch": 3180} {"train_loss": -24.880346298217773, "global_step": 263942, "epoch": 3180} {"train_loss": -24.035207748413086, "global_step": 263943, "epoch": 3180} {"train_loss": -24.61245346069336, "global_step": 263944, "epoch": 3180} {"train_loss": -25.098756790161133, "global_step": 263945, "epoch": 3180} {"train_loss": -24.116533279418945, "global_step": 263946, "epoch": 3180} {"train_loss": -24.56316566467285, "global_step": 263947, "epoch": 3180} {"train_loss": -24.493335723876953, "global_step": 263948, "epoch": 3180} {"train_loss": -24.672128677368164, "global_step": 263949, "epoch": 3180} {"train_loss": -24.916000366210938, "global_step": 263950, "epoch": 3180} {"train_loss": -25.018077850341797, "global_step": 263951, "epoch": 3180} {"train_loss": -24.4426326751709, "global_step": 263952, "epoch": 3180} {"train_loss": -25.155195236206055, "global_step": 263953, "epoch": 3180} {"train_loss": -24.578765869140625, "global_step": 263954, "epoch": 3180} {"train_loss": -24.938968658447266, "global_step": 263955, "epoch": 3180} {"train_loss": -24.632200241088867, "global_step": 263956, "epoch": 3180} {"train_loss": -24.93951416015625, "global_step": 263957, "epoch": 3180} {"train_loss": -24.67586326599121, "global_step": 263958, "epoch": 3180} {"train_loss": -25.162031173706055, "global_step": 263959, "epoch": 3180} {"train_loss": -25.157390594482422, "global_step": 263960, "epoch": 3180} {"train_loss": -25.283777236938477, "global_step": 263961, "epoch": 3180} {"train_loss": -25.008033752441406, "global_step": 263962, "epoch": 3180} {"train_loss": -25.33456039428711, "global_step": 263963, "epoch": 3180} {"train_loss": -24.812898635864258, "global_step": 263964, "epoch": 3180} {"train_loss": -25.256559371948242, "global_step": 263965, "epoch": 3180} {"train_loss": -25.00132942199707, "global_step": 263966, "epoch": 3180} {"train_loss": -25.491714477539062, "global_step": 263967, "epoch": 3180} {"train_loss": -24.83378028869629, "global_step": 263968, "epoch": 3180} {"train_loss": -25.353666305541992, "global_step": 263969, "epoch": 3180} {"train_loss": -25.357038497924805, "global_step": 263970, "epoch": 3180} {"train_loss": -25.302249908447266, "global_step": 263971, "epoch": 3180} {"train_loss": -24.819787979125977, "global_step": 263972, "epoch": 3180} {"train_loss": -25.16700553894043, "global_step": 263973, "epoch": 3180} {"train_loss": -25.27971649169922, "global_step": 263974, "epoch": 3180} {"train_loss": -25.321584701538086, "global_step": 263975, "epoch": 3180} {"train_loss": -25.34950065612793, "global_step": 263976, "epoch": 3180} {"train_loss": -25.56843376159668, "global_step": 263977, "epoch": 3180} {"train_loss": -25.2473201751709, "global_step": 263978, "epoch": 3180} {"train_loss": -25.05482292175293, "global_step": 263979, "epoch": 3180} {"train_loss": -25.422374725341797, "global_step": 263980, "epoch": 3180} {"train_loss": -25.322303771972656, "global_step": 263981, "epoch": 3180} {"train_loss": -25.5114803314209, "global_step": 263982, "epoch": 3180} {"train_loss": -25.06381607055664, "global_step": 263983, "epoch": 3180} {"train_loss": -25.1158447265625, "global_step": 263984, "epoch": 3180} {"train_loss": -25.3228816986084, "global_step": 263985, "epoch": 3180} {"train_loss": -25.5396785736084, "global_step": 263986, "epoch": 3180} {"train_loss": -25.58810806274414, "global_step": 263987, "epoch": 3180} {"train_loss": -25.397130966186523, "global_step": 263988, "epoch": 3180} {"train_loss": -25.459766387939453, "global_step": 263989, "epoch": 3180} {"train_loss": -25.237812042236328, "global_step": 263990, "epoch": 3180} {"train_loss": -25.039220809936523, "global_step": 263991, "epoch": 3180} {"train_loss": -25.125690460205078, "global_step": 263992, "epoch": 3180} {"train_loss": -25.281301498413086, "global_step": 263993, "epoch": 3180} {"train_loss": -25.370576858520508, "global_step": 263994, "epoch": 3180} {"train_loss": -24.628812789916992, "global_step": 263995, "epoch": 3180} {"train_loss": -25.407352447509766, "global_step": 263996, "epoch": 3180} {"train_loss": -25.219221115112305, "global_step": 263997, "epoch": 3180} {"train_loss": -25.245765686035156, "global_step": 263998, "epoch": 3180} {"train_loss": -24.97641944885254, "global_step": 263999, "epoch": 3180} {"train_loss": -25.1431941986084, "global_step": 264000, "epoch": 3180} {"train_loss": -25.222610473632812, "global_step": 264001, "epoch": 3180} {"train_loss": -24.932470321655273, "global_step": 264002, "epoch": 3180} {"train_loss": -25.103046417236328, "global_step": 264003, "epoch": 3180} {"train_loss": -25.262632369995117, "global_step": 264004, "epoch": 3180} {"train_loss": -25.0335750579834, "global_step": 264005, "epoch": 3180} {"train_loss": -25.24789810180664, "global_step": 264006, "epoch": 3180} {"train_loss": -24.869333267211914, "global_step": 264007, "epoch": 3180} {"train_loss": -25.263463973999023, "global_step": 264008, "epoch": 3180} {"train_loss": -25.327402114868164, "global_step": 264009, "epoch": 3180} {"train_loss": -24.734220504760742, "global_step": 264010, "epoch": 3180} {"train_loss": -25.269001007080078, "global_step": 264011, "epoch": 3180} {"train_loss": -25.213754653930664, "global_step": 264012, "epoch": 3180} {"train_loss": -25.47648048400879, "global_step": 264013, "epoch": 3180} {"train_loss": -24.791410446166992, "global_step": 264014, "epoch": 3180} {"train_loss": -24.936521530151367, "global_step": 264015, "epoch": 3180} {"train_loss": -25.17633056640625, "global_step": 264016, "epoch": 3180} {"train_loss": -25.392942428588867, "global_step": 264017, "epoch": 3180} {"train_loss": -25.289817810058594, "global_step": 264018, "epoch": 3180} {"train_loss": -25.674591064453125, "global_step": 264019, "epoch": 3180} {"train_loss": -25.48383140563965, "global_step": 264020, "epoch": 3180} {"train_loss": -25.19367790222168, "global_step": 264021, "epoch": 3180} {"train_loss": -25.112189878900367, "global_step": 264022, "epoch": 3180, "val_loss": 6975671.0} {"train_loss": -24.286418914794922, "global_step": 264023, "epoch": 3181} {"train_loss": -24.538854598999023, "global_step": 264024, "epoch": 3181} {"train_loss": -24.854114532470703, "global_step": 264025, "epoch": 3181} {"train_loss": -25.154321670532227, "global_step": 264026, "epoch": 3181} {"train_loss": -24.617420196533203, "global_step": 264027, "epoch": 3181} {"train_loss": -25.010854721069336, "global_step": 264028, "epoch": 3181} {"train_loss": -25.162105560302734, "global_step": 264029, "epoch": 3181} {"train_loss": -24.69080924987793, "global_step": 264030, "epoch": 3181} {"train_loss": -25.3111515045166, "global_step": 264031, "epoch": 3181} {"train_loss": -24.73555564880371, "global_step": 264032, "epoch": 3181} {"train_loss": -24.969532012939453, "global_step": 264033, "epoch": 3181} {"train_loss": -24.599889755249023, "global_step": 264034, "epoch": 3181} {"train_loss": -24.860376358032227, "global_step": 264035, "epoch": 3181} {"train_loss": -24.615386962890625, "global_step": 264036, "epoch": 3181} {"train_loss": -24.63863754272461, "global_step": 264037, "epoch": 3181} {"train_loss": -24.773757934570312, "global_step": 264038, "epoch": 3181} {"train_loss": -24.96096420288086, "global_step": 264039, "epoch": 3181} {"train_loss": -24.624353408813477, "global_step": 264040, "epoch": 3181} {"train_loss": -24.757070541381836, "global_step": 264041, "epoch": 3181} {"train_loss": -24.537065505981445, "global_step": 264042, "epoch": 3181} {"train_loss": -24.8574275970459, "global_step": 264043, "epoch": 3181} {"train_loss": -24.781614303588867, "global_step": 264044, "epoch": 3181} {"train_loss": -24.65239906311035, "global_step": 264045, "epoch": 3181} {"train_loss": -24.761457443237305, "global_step": 264046, "epoch": 3181} {"train_loss": -24.935138702392578, "global_step": 264047, "epoch": 3181} {"train_loss": -25.12763786315918, "global_step": 264048, "epoch": 3181} {"train_loss": -25.190269470214844, "global_step": 264049, "epoch": 3181} {"train_loss": -24.648805618286133, "global_step": 264050, "epoch": 3181} {"train_loss": -25.233427047729492, "global_step": 264051, "epoch": 3181} {"train_loss": -25.083984375, "global_step": 264052, "epoch": 3181} {"train_loss": -25.38083839416504, "global_step": 264053, "epoch": 3181} {"train_loss": -25.000097274780273, "global_step": 264054, "epoch": 3181} {"train_loss": -25.021467208862305, "global_step": 264055, "epoch": 3181} {"train_loss": -25.14596939086914, "global_step": 264056, "epoch": 3181} {"train_loss": -25.535863876342773, "global_step": 264057, "epoch": 3181} {"train_loss": -25.135499954223633, "global_step": 264058, "epoch": 3181} {"train_loss": -25.209529876708984, "global_step": 264059, "epoch": 3181} {"train_loss": -25.3024959564209, "global_step": 264060, "epoch": 3181} {"train_loss": -24.989469528198242, "global_step": 264061, "epoch": 3181} {"train_loss": -25.06959342956543, "global_step": 264062, "epoch": 3181} {"train_loss": -25.291339874267578, "global_step": 264063, "epoch": 3181} {"train_loss": -25.223249435424805, "global_step": 264064, "epoch": 3181} {"train_loss": -25.23543357849121, "global_step": 264065, "epoch": 3181} {"train_loss": -25.332151412963867, "global_step": 264066, "epoch": 3181} {"train_loss": -24.987730026245117, "global_step": 264067, "epoch": 3181} {"train_loss": -25.09418296813965, "global_step": 264068, "epoch": 3181} {"train_loss": -25.156007766723633, "global_step": 264069, "epoch": 3181} {"train_loss": -25.042083740234375, "global_step": 264070, "epoch": 3181} {"train_loss": -25.186338424682617, "global_step": 264071, "epoch": 3181} {"train_loss": -24.932836532592773, "global_step": 264072, "epoch": 3181} {"train_loss": -24.951889038085938, "global_step": 264073, "epoch": 3181} {"train_loss": -25.228052139282227, "global_step": 264074, "epoch": 3181} {"train_loss": -25.377307891845703, "global_step": 264075, "epoch": 3181} {"train_loss": -25.407562255859375, "global_step": 264076, "epoch": 3181} {"train_loss": -25.287839889526367, "global_step": 264077, "epoch": 3181} {"train_loss": -25.399765014648438, "global_step": 264078, "epoch": 3181} {"train_loss": -25.341922760009766, "global_step": 264079, "epoch": 3181} {"train_loss": -24.85383415222168, "global_step": 264080, "epoch": 3181} {"train_loss": -25.230499267578125, "global_step": 264081, "epoch": 3181} {"train_loss": -25.24395751953125, "global_step": 264082, "epoch": 3181} {"train_loss": -25.184524536132812, "global_step": 264083, "epoch": 3181} {"train_loss": -24.975522994995117, "global_step": 264084, "epoch": 3181} {"train_loss": -25.066715240478516, "global_step": 264085, "epoch": 3181} {"train_loss": -25.280961990356445, "global_step": 264086, "epoch": 3181} {"train_loss": -25.60529136657715, "global_step": 264087, "epoch": 3181} {"train_loss": -25.634634017944336, "global_step": 264088, "epoch": 3181} {"train_loss": -25.34639549255371, "global_step": 264089, "epoch": 3181} {"train_loss": -25.464710235595703, "global_step": 264090, "epoch": 3181} {"train_loss": -25.44727897644043, "global_step": 264091, "epoch": 3181} {"train_loss": -25.166051864624023, "global_step": 264092, "epoch": 3181} {"train_loss": -24.96685028076172, "global_step": 264093, "epoch": 3181} {"train_loss": -25.425376892089844, "global_step": 264094, "epoch": 3181} {"train_loss": -25.291603088378906, "global_step": 264095, "epoch": 3181} {"train_loss": -25.79707145690918, "global_step": 264096, "epoch": 3181} {"train_loss": -24.936614990234375, "global_step": 264097, "epoch": 3181} {"train_loss": -25.30208396911621, "global_step": 264098, "epoch": 3181} {"train_loss": -25.377914428710938, "global_step": 264099, "epoch": 3181} {"train_loss": -25.57757568359375, "global_step": 264100, "epoch": 3181} {"train_loss": -25.09440040588379, "global_step": 264101, "epoch": 3181} {"train_loss": -25.703845977783203, "global_step": 264102, "epoch": 3181} {"train_loss": -25.20887565612793, "global_step": 264103, "epoch": 3181} {"train_loss": -25.097671508789062, "global_step": 264104, "epoch": 3181} {"train_loss": -25.087630191481257, "global_step": 264105, "epoch": 3181, "val_loss": 6952331.0} {"train_loss": -25.080278396606445, "global_step": 264106, "epoch": 3182} {"train_loss": -24.501787185668945, "global_step": 264107, "epoch": 3182} {"train_loss": -24.580854415893555, "global_step": 264108, "epoch": 3182} {"train_loss": -24.797019958496094, "global_step": 264109, "epoch": 3182} {"train_loss": -25.059173583984375, "global_step": 264110, "epoch": 3182} {"train_loss": -24.49872398376465, "global_step": 264111, "epoch": 3182} {"train_loss": -24.5968074798584, "global_step": 264112, "epoch": 3182} {"train_loss": -25.16084861755371, "global_step": 264113, "epoch": 3182} {"train_loss": -24.82749366760254, "global_step": 264114, "epoch": 3182} {"train_loss": -24.803016662597656, "global_step": 264115, "epoch": 3182} {"train_loss": -24.64896583557129, "global_step": 264116, "epoch": 3182} {"train_loss": -25.040084838867188, "global_step": 264117, "epoch": 3182} {"train_loss": -24.771045684814453, "global_step": 264118, "epoch": 3182} {"train_loss": -25.157089233398438, "global_step": 264119, "epoch": 3182} {"train_loss": -25.015974044799805, "global_step": 264120, "epoch": 3182} {"train_loss": -25.3082332611084, "global_step": 264121, "epoch": 3182} {"train_loss": -24.964473724365234, "global_step": 264122, "epoch": 3182} {"train_loss": -25.228994369506836, "global_step": 264123, "epoch": 3182} {"train_loss": -25.071870803833008, "global_step": 264124, "epoch": 3182} {"train_loss": -25.485294342041016, "global_step": 264125, "epoch": 3182} {"train_loss": -24.7844295501709, "global_step": 264126, "epoch": 3182} {"train_loss": -25.210859298706055, "global_step": 264127, "epoch": 3182} {"train_loss": -25.0739803314209, "global_step": 264128, "epoch": 3182} {"train_loss": -25.149871826171875, "global_step": 264129, "epoch": 3182} {"train_loss": -25.043594360351562, "global_step": 264130, "epoch": 3182} {"train_loss": -25.268781661987305, "global_step": 264131, "epoch": 3182} {"train_loss": -25.21341896057129, "global_step": 264132, "epoch": 3182} {"train_loss": -25.307098388671875, "global_step": 264133, "epoch": 3182} {"train_loss": -25.18149185180664, "global_step": 264134, "epoch": 3182} {"train_loss": -25.340517044067383, "global_step": 264135, "epoch": 3182} {"train_loss": -25.18899154663086, "global_step": 264136, "epoch": 3182} {"train_loss": -25.338632583618164, "global_step": 264137, "epoch": 3182} {"train_loss": -25.034814834594727, "global_step": 264138, "epoch": 3182} {"train_loss": -24.57964515686035, "global_step": 264139, "epoch": 3182} {"train_loss": -24.999326705932617, "global_step": 264140, "epoch": 3182} {"train_loss": -25.120607376098633, "global_step": 264141, "epoch": 3182} {"train_loss": -25.15017318725586, "global_step": 264142, "epoch": 3182} {"train_loss": -25.1532039642334, "global_step": 264143, "epoch": 3182} {"train_loss": -25.505170822143555, "global_step": 264144, "epoch": 3182} {"train_loss": -25.00607681274414, "global_step": 264145, "epoch": 3182} {"train_loss": -24.936243057250977, "global_step": 264146, "epoch": 3182} {"train_loss": -24.920316696166992, "global_step": 264147, "epoch": 3182} {"train_loss": -25.433963775634766, "global_step": 264148, "epoch": 3182} {"train_loss": -25.210432052612305, "global_step": 264149, "epoch": 3182} {"train_loss": -25.201374053955078, "global_step": 264150, "epoch": 3182} {"train_loss": -25.151458740234375, "global_step": 264151, "epoch": 3182} {"train_loss": -25.127349853515625, "global_step": 264152, "epoch": 3182} {"train_loss": -25.457752227783203, "global_step": 264153, "epoch": 3182} {"train_loss": -25.36593246459961, "global_step": 264154, "epoch": 3182} {"train_loss": -25.298608779907227, "global_step": 264155, "epoch": 3182} {"train_loss": -25.177125930786133, "global_step": 264156, "epoch": 3182} {"train_loss": -25.17837142944336, "global_step": 264157, "epoch": 3182} {"train_loss": -25.50322151184082, "global_step": 264158, "epoch": 3182} {"train_loss": -24.8976993560791, "global_step": 264159, "epoch": 3182} {"train_loss": -25.07790184020996, "global_step": 264160, "epoch": 3182} {"train_loss": -25.14105224609375, "global_step": 264161, "epoch": 3182} {"train_loss": -25.440515518188477, "global_step": 264162, "epoch": 3182} {"train_loss": -25.545814514160156, "global_step": 264163, "epoch": 3182} {"train_loss": -25.313705444335938, "global_step": 264164, "epoch": 3182} {"train_loss": -25.589378356933594, "global_step": 264165, "epoch": 3182} {"train_loss": -24.923171997070312, "global_step": 264166, "epoch": 3182} {"train_loss": -25.381467819213867, "global_step": 264167, "epoch": 3182} {"train_loss": -25.179637908935547, "global_step": 264168, "epoch": 3182} {"train_loss": -24.992483139038086, "global_step": 264169, "epoch": 3182} {"train_loss": -25.436731338500977, "global_step": 264170, "epoch": 3182} {"train_loss": -24.973682403564453, "global_step": 264171, "epoch": 3182} {"train_loss": -24.549787521362305, "global_step": 264172, "epoch": 3182} {"train_loss": -24.812259674072266, "global_step": 264173, "epoch": 3182} {"train_loss": -24.74547576904297, "global_step": 264174, "epoch": 3182} {"train_loss": -24.923715591430664, "global_step": 264175, "epoch": 3182} {"train_loss": -25.466672897338867, "global_step": 264176, "epoch": 3182} {"train_loss": -25.10095977783203, "global_step": 264177, "epoch": 3182} {"train_loss": -25.104774475097656, "global_step": 264178, "epoch": 3182} {"train_loss": -24.942785263061523, "global_step": 264179, "epoch": 3182} {"train_loss": -25.233837127685547, "global_step": 264180, "epoch": 3182} {"train_loss": -24.669715881347656, "global_step": 264181, "epoch": 3182} {"train_loss": -25.152111053466797, "global_step": 264182, "epoch": 3182} {"train_loss": -24.901264190673828, "global_step": 264183, "epoch": 3182} {"train_loss": -25.014785766601562, "global_step": 264184, "epoch": 3182} {"train_loss": -25.60867691040039, "global_step": 264185, "epoch": 3182} {"train_loss": -24.87654685974121, "global_step": 264186, "epoch": 3182} {"train_loss": -25.24326515197754, "global_step": 264187, "epoch": 3182} {"train_loss": -25.108208506940358, "global_step": 264188, "epoch": 3182, "val_loss": 6965280.0} {"train_loss": -24.787147521972656, "global_step": 264189, "epoch": 3183} {"train_loss": -25.012611389160156, "global_step": 264190, "epoch": 3183} {"train_loss": -24.551008224487305, "global_step": 264191, "epoch": 3183} {"train_loss": -25.23285675048828, "global_step": 264192, "epoch": 3183} {"train_loss": -24.8212833404541, "global_step": 264193, "epoch": 3183} {"train_loss": -24.907154083251953, "global_step": 264194, "epoch": 3183} {"train_loss": -24.980512619018555, "global_step": 264195, "epoch": 3183} {"train_loss": -25.11533546447754, "global_step": 264196, "epoch": 3183} {"train_loss": -24.77010154724121, "global_step": 264197, "epoch": 3183} {"train_loss": -24.54248046875, "global_step": 264198, "epoch": 3183} {"train_loss": -24.79842185974121, "global_step": 264199, "epoch": 3183} {"train_loss": -24.602710723876953, "global_step": 264200, "epoch": 3183} {"train_loss": -25.39569664001465, "global_step": 264201, "epoch": 3183} {"train_loss": -25.081762313842773, "global_step": 264202, "epoch": 3183} {"train_loss": -24.527156829833984, "global_step": 264203, "epoch": 3183} {"train_loss": -25.074453353881836, "global_step": 264204, "epoch": 3183} {"train_loss": -25.165964126586914, "global_step": 264205, "epoch": 3183} {"train_loss": -24.936323165893555, "global_step": 264206, "epoch": 3183} {"train_loss": -25.090999603271484, "global_step": 264207, "epoch": 3183} {"train_loss": -25.283428192138672, "global_step": 264208, "epoch": 3183} {"train_loss": -25.29359245300293, "global_step": 264209, "epoch": 3183} {"train_loss": -25.09246826171875, "global_step": 264210, "epoch": 3183} {"train_loss": -25.268625259399414, "global_step": 264211, "epoch": 3183} {"train_loss": -25.36069107055664, "global_step": 264212, "epoch": 3183} {"train_loss": -25.24447250366211, "global_step": 264213, "epoch": 3183} {"train_loss": -25.39322853088379, "global_step": 264214, "epoch": 3183} {"train_loss": -25.113523483276367, "global_step": 264215, "epoch": 3183} {"train_loss": -25.266141891479492, "global_step": 264216, "epoch": 3183} {"train_loss": -25.42142105102539, "global_step": 264217, "epoch": 3183} {"train_loss": -25.380224227905273, "global_step": 264218, "epoch": 3183} {"train_loss": -25.210834503173828, "global_step": 264219, "epoch": 3183} {"train_loss": -25.068431854248047, "global_step": 264220, "epoch": 3183} {"train_loss": -25.385196685791016, "global_step": 264221, "epoch": 3183} {"train_loss": -25.442420959472656, "global_step": 264222, "epoch": 3183} {"train_loss": -25.213890075683594, "global_step": 264223, "epoch": 3183} {"train_loss": -25.39414405822754, "global_step": 264224, "epoch": 3183} {"train_loss": -25.23085594177246, "global_step": 264225, "epoch": 3183} {"train_loss": -25.423452377319336, "global_step": 264226, "epoch": 3183} {"train_loss": -25.337800979614258, "global_step": 264227, "epoch": 3183} {"train_loss": -25.388444900512695, "global_step": 264228, "epoch": 3183} {"train_loss": -26.049915313720703, "global_step": 264229, "epoch": 3183} {"train_loss": -25.403406143188477, "global_step": 264230, "epoch": 3183} {"train_loss": -25.67327308654785, "global_step": 264231, "epoch": 3183} {"train_loss": -25.64011001586914, "global_step": 264232, "epoch": 3183} {"train_loss": -25.12981605529785, "global_step": 264233, "epoch": 3183} {"train_loss": -25.398029327392578, "global_step": 264234, "epoch": 3183} {"train_loss": -25.412378311157227, "global_step": 264235, "epoch": 3183} {"train_loss": -25.53862953186035, "global_step": 264236, "epoch": 3183} {"train_loss": -25.339725494384766, "global_step": 264237, "epoch": 3183} {"train_loss": -25.372596740722656, "global_step": 264238, "epoch": 3183} {"train_loss": -25.5716609954834, "global_step": 264239, "epoch": 3183} {"train_loss": -25.128376007080078, "global_step": 264240, "epoch": 3183} {"train_loss": -25.3113956451416, "global_step": 264241, "epoch": 3183} {"train_loss": -24.770334243774414, "global_step": 264242, "epoch": 3183} {"train_loss": -25.154577255249023, "global_step": 264243, "epoch": 3183} {"train_loss": -24.95789337158203, "global_step": 264244, "epoch": 3183} {"train_loss": -24.68092918395996, "global_step": 264245, "epoch": 3183} {"train_loss": -24.777769088745117, "global_step": 264246, "epoch": 3183} {"train_loss": -24.972585678100586, "global_step": 264247, "epoch": 3183} {"train_loss": -25.1075439453125, "global_step": 264248, "epoch": 3183} {"train_loss": -25.076642990112305, "global_step": 264249, "epoch": 3183} {"train_loss": -24.800949096679688, "global_step": 264250, "epoch": 3183} {"train_loss": -25.458526611328125, "global_step": 264251, "epoch": 3183} {"train_loss": -25.06024169921875, "global_step": 264252, "epoch": 3183} {"train_loss": -24.99452781677246, "global_step": 264253, "epoch": 3183} {"train_loss": -25.314407348632812, "global_step": 264254, "epoch": 3183} {"train_loss": -25.036396026611328, "global_step": 264255, "epoch": 3183} {"train_loss": -25.107206344604492, "global_step": 264256, "epoch": 3183} {"train_loss": -24.947736740112305, "global_step": 264257, "epoch": 3183} {"train_loss": -25.32760238647461, "global_step": 264258, "epoch": 3183} {"train_loss": -25.10679054260254, "global_step": 264259, "epoch": 3183} {"train_loss": -25.39277458190918, "global_step": 264260, "epoch": 3183} {"train_loss": -25.05072593688965, "global_step": 264261, "epoch": 3183} {"train_loss": -24.818527221679688, "global_step": 264262, "epoch": 3183} {"train_loss": -25.423887252807617, "global_step": 264263, "epoch": 3183} {"train_loss": -25.028940200805664, "global_step": 264264, "epoch": 3183} {"train_loss": -25.18300437927246, "global_step": 264265, "epoch": 3183} {"train_loss": -25.37274742126465, "global_step": 264266, "epoch": 3183} {"train_loss": -25.121028900146484, "global_step": 264267, "epoch": 3183} {"train_loss": -25.468263626098633, "global_step": 264268, "epoch": 3183} {"train_loss": -24.9974422454834, "global_step": 264269, "epoch": 3183} {"train_loss": -25.219457626342773, "global_step": 264270, "epoch": 3183} {"train_loss": -25.15650737716491, "global_step": 264271, "epoch": 3183, "val_loss": 6875742.0} {"train_loss": -25.12339210510254, "global_step": 264272, "epoch": 3184} {"train_loss": -25.253934860229492, "global_step": 264273, "epoch": 3184} {"train_loss": -25.101516723632812, "global_step": 264274, "epoch": 3184} {"train_loss": -25.17929458618164, "global_step": 264275, "epoch": 3184} {"train_loss": -25.288204193115234, "global_step": 264276, "epoch": 3184} {"train_loss": -25.039371490478516, "global_step": 264277, "epoch": 3184} {"train_loss": -24.87271499633789, "global_step": 264278, "epoch": 3184} {"train_loss": -25.584976196289062, "global_step": 264279, "epoch": 3184} {"train_loss": -25.322219848632812, "global_step": 264280, "epoch": 3184} {"train_loss": -25.270517349243164, "global_step": 264281, "epoch": 3184} {"train_loss": -25.326749801635742, "global_step": 264282, "epoch": 3184} {"train_loss": -24.931598663330078, "global_step": 264283, "epoch": 3184} {"train_loss": -25.179553985595703, "global_step": 264284, "epoch": 3184} {"train_loss": -25.288114547729492, "global_step": 264285, "epoch": 3184} {"train_loss": -24.913806915283203, "global_step": 264286, "epoch": 3184} {"train_loss": -25.18869400024414, "global_step": 264287, "epoch": 3184} {"train_loss": -24.929494857788086, "global_step": 264288, "epoch": 3184} {"train_loss": -25.00048065185547, "global_step": 264289, "epoch": 3184} {"train_loss": -25.16162109375, "global_step": 264290, "epoch": 3184} {"train_loss": -25.1917667388916, "global_step": 264291, "epoch": 3184} {"train_loss": -25.56501579284668, "global_step": 264292, "epoch": 3184} {"train_loss": -24.92359733581543, "global_step": 264293, "epoch": 3184} {"train_loss": -25.242643356323242, "global_step": 264294, "epoch": 3184} {"train_loss": -24.884855270385742, "global_step": 264295, "epoch": 3184} {"train_loss": -25.162704467773438, "global_step": 264296, "epoch": 3184} {"train_loss": -25.116905212402344, "global_step": 264297, "epoch": 3184} {"train_loss": -24.994138717651367, "global_step": 264298, "epoch": 3184} {"train_loss": -25.219995498657227, "global_step": 264299, "epoch": 3184} {"train_loss": -25.305171966552734, "global_step": 264300, "epoch": 3184} {"train_loss": -25.148479461669922, "global_step": 264301, "epoch": 3184} {"train_loss": -25.17313575744629, "global_step": 264302, "epoch": 3184} {"train_loss": -25.033414840698242, "global_step": 264303, "epoch": 3184} {"train_loss": -25.094629287719727, "global_step": 264304, "epoch": 3184} {"train_loss": -25.04658317565918, "global_step": 264305, "epoch": 3184} {"train_loss": -25.050806045532227, "global_step": 264306, "epoch": 3184} {"train_loss": -25.335378646850586, "global_step": 264307, "epoch": 3184} {"train_loss": -25.368934631347656, "global_step": 264308, "epoch": 3184} {"train_loss": -25.36448097229004, "global_step": 264309, "epoch": 3184} {"train_loss": -25.48780632019043, "global_step": 264310, "epoch": 3184} {"train_loss": -25.166461944580078, "global_step": 264311, "epoch": 3184} {"train_loss": -25.36199188232422, "global_step": 264312, "epoch": 3184} {"train_loss": -25.473529815673828, "global_step": 264313, "epoch": 3184} {"train_loss": -24.964298248291016, "global_step": 264314, "epoch": 3184} {"train_loss": -25.8772029876709, "global_step": 264315, "epoch": 3184} {"train_loss": -25.7121639251709, "global_step": 264316, "epoch": 3184} {"train_loss": -25.11429786682129, "global_step": 264317, "epoch": 3184} {"train_loss": -25.427974700927734, "global_step": 264318, "epoch": 3184} {"train_loss": -25.158658981323242, "global_step": 264319, "epoch": 3184} {"train_loss": -25.071012496948242, "global_step": 264320, "epoch": 3184} {"train_loss": -25.31808090209961, "global_step": 264321, "epoch": 3184} {"train_loss": -25.12106704711914, "global_step": 264322, "epoch": 3184} {"train_loss": -24.40040397644043, "global_step": 264323, "epoch": 3184} {"train_loss": -24.697021484375, "global_step": 264324, "epoch": 3184} {"train_loss": -25.047353744506836, "global_step": 264325, "epoch": 3184} {"train_loss": -25.020421981811523, "global_step": 264326, "epoch": 3184} {"train_loss": -24.79655647277832, "global_step": 264327, "epoch": 3184} {"train_loss": -25.042646408081055, "global_step": 264328, "epoch": 3184} {"train_loss": -25.113710403442383, "global_step": 264329, "epoch": 3184} {"train_loss": -25.29070472717285, "global_step": 264330, "epoch": 3184} {"train_loss": -25.25845718383789, "global_step": 264331, "epoch": 3184} {"train_loss": -25.348968505859375, "global_step": 264332, "epoch": 3184} {"train_loss": -25.3159236907959, "global_step": 264333, "epoch": 3184} {"train_loss": -25.0889835357666, "global_step": 264334, "epoch": 3184} {"train_loss": -25.444583892822266, "global_step": 264335, "epoch": 3184} {"train_loss": -25.355960845947266, "global_step": 264336, "epoch": 3184} {"train_loss": -25.308551788330078, "global_step": 264337, "epoch": 3184} {"train_loss": -25.09811782836914, "global_step": 264338, "epoch": 3184} {"train_loss": -25.18852996826172, "global_step": 264339, "epoch": 3184} {"train_loss": -25.6965274810791, "global_step": 264340, "epoch": 3184} {"train_loss": -25.355316162109375, "global_step": 264341, "epoch": 3184} {"train_loss": -25.08623695373535, "global_step": 264342, "epoch": 3184} {"train_loss": -24.58595848083496, "global_step": 264343, "epoch": 3184} {"train_loss": -24.83281898498535, "global_step": 264344, "epoch": 3184} {"train_loss": -24.49029541015625, "global_step": 264345, "epoch": 3184} {"train_loss": -24.125289916992188, "global_step": 264346, "epoch": 3184} {"train_loss": -24.082128524780273, "global_step": 264347, "epoch": 3184} {"train_loss": -24.33576774597168, "global_step": 264348, "epoch": 3184} {"train_loss": -25.20100212097168, "global_step": 264349, "epoch": 3184} {"train_loss": -24.96356773376465, "global_step": 264350, "epoch": 3184} {"train_loss": -25.280187606811523, "global_step": 264351, "epoch": 3184} {"train_loss": -25.053396224975586, "global_step": 264352, "epoch": 3184} {"train_loss": -24.950092315673828, "global_step": 264353, "epoch": 3184} {"train_loss": -25.135279850787427, "global_step": 264354, "epoch": 3184, "val_loss": 7002153.0} {"train_loss": -24.17426872253418, "global_step": 264355, "epoch": 3185} {"train_loss": -24.643768310546875, "global_step": 264356, "epoch": 3185} {"train_loss": -24.446292877197266, "global_step": 264357, "epoch": 3185} {"train_loss": -24.73586082458496, "global_step": 264358, "epoch": 3185} {"train_loss": -24.46732521057129, "global_step": 264359, "epoch": 3185} {"train_loss": -24.507505416870117, "global_step": 264360, "epoch": 3185} {"train_loss": -24.710172653198242, "global_step": 264361, "epoch": 3185} {"train_loss": -24.46156883239746, "global_step": 264362, "epoch": 3185} {"train_loss": -24.672208786010742, "global_step": 264363, "epoch": 3185} {"train_loss": -24.505178451538086, "global_step": 264364, "epoch": 3185} {"train_loss": -24.637741088867188, "global_step": 264365, "epoch": 3185} {"train_loss": -24.845279693603516, "global_step": 264366, "epoch": 3185} {"train_loss": -24.723005294799805, "global_step": 264367, "epoch": 3185} {"train_loss": -24.784536361694336, "global_step": 264368, "epoch": 3185} {"train_loss": -24.45998191833496, "global_step": 264369, "epoch": 3185} {"train_loss": -24.900266647338867, "global_step": 264370, "epoch": 3185} {"train_loss": -24.672697067260742, "global_step": 264371, "epoch": 3185} {"train_loss": -24.692148208618164, "global_step": 264372, "epoch": 3185} {"train_loss": -24.73368263244629, "global_step": 264373, "epoch": 3185} {"train_loss": -24.550857543945312, "global_step": 264374, "epoch": 3185} {"train_loss": -25.1689453125, "global_step": 264375, "epoch": 3185} {"train_loss": -24.646377563476562, "global_step": 264376, "epoch": 3185} {"train_loss": -24.626684188842773, "global_step": 264377, "epoch": 3185} {"train_loss": -24.83112144470215, "global_step": 264378, "epoch": 3185} {"train_loss": -25.24452018737793, "global_step": 264379, "epoch": 3185} {"train_loss": -25.243412017822266, "global_step": 264380, "epoch": 3185} {"train_loss": -24.981563568115234, "global_step": 264381, "epoch": 3185} {"train_loss": -24.980487823486328, "global_step": 264382, "epoch": 3185} {"train_loss": -25.248931884765625, "global_step": 264383, "epoch": 3185} {"train_loss": -25.284753799438477, "global_step": 264384, "epoch": 3185} {"train_loss": -25.396589279174805, "global_step": 264385, "epoch": 3185} {"train_loss": -25.287399291992188, "global_step": 264386, "epoch": 3185} {"train_loss": -25.245014190673828, "global_step": 264387, "epoch": 3185} {"train_loss": -25.29274559020996, "global_step": 264388, "epoch": 3185} {"train_loss": -24.978515625, "global_step": 264389, "epoch": 3185} {"train_loss": -25.345556259155273, "global_step": 264390, "epoch": 3185} {"train_loss": -25.424030303955078, "global_step": 264391, "epoch": 3185} {"train_loss": -24.926593780517578, "global_step": 264392, "epoch": 3185} {"train_loss": -25.0454158782959, "global_step": 264393, "epoch": 3185} {"train_loss": -25.055648803710938, "global_step": 264394, "epoch": 3185} {"train_loss": -25.07478904724121, "global_step": 264395, "epoch": 3185} {"train_loss": -25.090030670166016, "global_step": 264396, "epoch": 3185} {"train_loss": -25.350004196166992, "global_step": 264397, "epoch": 3185} {"train_loss": -25.126392364501953, "global_step": 264398, "epoch": 3185} {"train_loss": -25.583059310913086, "global_step": 264399, "epoch": 3185} {"train_loss": -25.39228630065918, "global_step": 264400, "epoch": 3185} {"train_loss": -25.322301864624023, "global_step": 264401, "epoch": 3185} {"train_loss": -25.279705047607422, "global_step": 264402, "epoch": 3185} {"train_loss": -25.57317352294922, "global_step": 264403, "epoch": 3185} {"train_loss": -25.135778427124023, "global_step": 264404, "epoch": 3185} {"train_loss": -25.092187881469727, "global_step": 264405, "epoch": 3185} {"train_loss": -25.157657623291016, "global_step": 264406, "epoch": 3185} {"train_loss": -25.426462173461914, "global_step": 264407, "epoch": 3185} {"train_loss": -25.219358444213867, "global_step": 264408, "epoch": 3185} {"train_loss": -25.16506004333496, "global_step": 264409, "epoch": 3185} {"train_loss": -25.33902931213379, "global_step": 264410, "epoch": 3185} {"train_loss": -25.401611328125, "global_step": 264411, "epoch": 3185} {"train_loss": -25.15863037109375, "global_step": 264412, "epoch": 3185} {"train_loss": -25.27899169921875, "global_step": 264413, "epoch": 3185} {"train_loss": -25.327293395996094, "global_step": 264414, "epoch": 3185} {"train_loss": -25.42819595336914, "global_step": 264415, "epoch": 3185} {"train_loss": -25.121166229248047, "global_step": 264416, "epoch": 3185} {"train_loss": -25.670148849487305, "global_step": 264417, "epoch": 3185} {"train_loss": -25.51043128967285, "global_step": 264418, "epoch": 3185} {"train_loss": -25.287458419799805, "global_step": 264419, "epoch": 3185} {"train_loss": -24.92939567565918, "global_step": 264420, "epoch": 3185} {"train_loss": -25.132688522338867, "global_step": 264421, "epoch": 3185} {"train_loss": -24.884735107421875, "global_step": 264422, "epoch": 3185} {"train_loss": -25.404172897338867, "global_step": 264423, "epoch": 3185} {"train_loss": -25.37006187438965, "global_step": 264424, "epoch": 3185} {"train_loss": -24.989669799804688, "global_step": 264425, "epoch": 3185} {"train_loss": -25.13882064819336, "global_step": 264426, "epoch": 3185} {"train_loss": -24.808029174804688, "global_step": 264427, "epoch": 3185} {"train_loss": -25.139617919921875, "global_step": 264428, "epoch": 3185} {"train_loss": -24.992467880249023, "global_step": 264429, "epoch": 3185} {"train_loss": -24.835107803344727, "global_step": 264430, "epoch": 3185} {"train_loss": -25.139219284057617, "global_step": 264431, "epoch": 3185} {"train_loss": -24.98128890991211, "global_step": 264432, "epoch": 3185} {"train_loss": -25.071744918823242, "global_step": 264433, "epoch": 3185} {"train_loss": -24.849456787109375, "global_step": 264434, "epoch": 3185} {"train_loss": -24.984819412231445, "global_step": 264435, "epoch": 3185} {"train_loss": -24.964872360229492, "global_step": 264436, "epoch": 3185} {"train_loss": -25.016005113900427, "global_step": 264437, "epoch": 3185, "val_loss": 6942042.0} {"train_loss": -22.999006271362305, "global_step": 264438, "epoch": 3186} {"train_loss": -22.592227935791016, "global_step": 264439, "epoch": 3186} {"train_loss": -23.462997436523438, "global_step": 264440, "epoch": 3186} {"train_loss": -23.061176300048828, "global_step": 264441, "epoch": 3186} {"train_loss": -23.02461814880371, "global_step": 264442, "epoch": 3186} {"train_loss": -23.708547592163086, "global_step": 264443, "epoch": 3186} {"train_loss": -23.61166763305664, "global_step": 264444, "epoch": 3186} {"train_loss": -23.527544021606445, "global_step": 264445, "epoch": 3186} {"train_loss": -23.512351989746094, "global_step": 264446, "epoch": 3186} {"train_loss": -23.965837478637695, "global_step": 264447, "epoch": 3186} {"train_loss": -23.89221954345703, "global_step": 264448, "epoch": 3186} {"train_loss": -23.96742820739746, "global_step": 264449, "epoch": 3186} {"train_loss": -23.9189395904541, "global_step": 264450, "epoch": 3186} {"train_loss": -23.836912155151367, "global_step": 264451, "epoch": 3186} {"train_loss": -23.90895652770996, "global_step": 264452, "epoch": 3186} {"train_loss": -24.032766342163086, "global_step": 264453, "epoch": 3186} {"train_loss": -24.61060905456543, "global_step": 264454, "epoch": 3186} {"train_loss": -24.079544067382812, "global_step": 264455, "epoch": 3186} {"train_loss": -24.183168411254883, "global_step": 264456, "epoch": 3186} {"train_loss": -24.005502700805664, "global_step": 264457, "epoch": 3186} {"train_loss": -24.336631774902344, "global_step": 264458, "epoch": 3186} {"train_loss": -24.099308013916016, "global_step": 264459, "epoch": 3186} {"train_loss": -24.568634033203125, "global_step": 264460, "epoch": 3186} {"train_loss": -24.376752853393555, "global_step": 264461, "epoch": 3186} {"train_loss": -24.42063331604004, "global_step": 264462, "epoch": 3186} {"train_loss": -24.654499053955078, "global_step": 264463, "epoch": 3186} {"train_loss": -24.325342178344727, "global_step": 264464, "epoch": 3186} {"train_loss": -24.591455459594727, "global_step": 264465, "epoch": 3186} {"train_loss": -24.546476364135742, "global_step": 264466, "epoch": 3186} {"train_loss": -24.51691436767578, "global_step": 264467, "epoch": 3186} {"train_loss": -24.59758758544922, "global_step": 264468, "epoch": 3186} {"train_loss": -24.542856216430664, "global_step": 264469, "epoch": 3186} {"train_loss": -24.814847946166992, "global_step": 264470, "epoch": 3186} {"train_loss": -24.672361373901367, "global_step": 264471, "epoch": 3186} {"train_loss": -24.693029403686523, "global_step": 264472, "epoch": 3186} {"train_loss": -25.136844635009766, "global_step": 264473, "epoch": 3186} {"train_loss": -24.976411819458008, "global_step": 264474, "epoch": 3186} {"train_loss": -25.16468620300293, "global_step": 264475, "epoch": 3186} {"train_loss": -24.85965919494629, "global_step": 264476, "epoch": 3186} {"train_loss": -25.056997299194336, "global_step": 264477, "epoch": 3186} {"train_loss": -24.971044540405273, "global_step": 264478, "epoch": 3186} {"train_loss": -25.025720596313477, "global_step": 264479, "epoch": 3186} {"train_loss": -24.906494140625, "global_step": 264480, "epoch": 3186} {"train_loss": -25.068662643432617, "global_step": 264481, "epoch": 3186} {"train_loss": -24.985071182250977, "global_step": 264482, "epoch": 3186} {"train_loss": -25.0379695892334, "global_step": 264483, "epoch": 3186} {"train_loss": -24.839242935180664, "global_step": 264484, "epoch": 3186} {"train_loss": -25.162845611572266, "global_step": 264485, "epoch": 3186} {"train_loss": -25.130603790283203, "global_step": 264486, "epoch": 3186} {"train_loss": -25.281091690063477, "global_step": 264487, "epoch": 3186} {"train_loss": -25.28571891784668, "global_step": 264488, "epoch": 3186} {"train_loss": -25.007160186767578, "global_step": 264489, "epoch": 3186} {"train_loss": -25.044363021850586, "global_step": 264490, "epoch": 3186} {"train_loss": -25.2562198638916, "global_step": 264491, "epoch": 3186} {"train_loss": -25.115829467773438, "global_step": 264492, "epoch": 3186} {"train_loss": -25.073328018188477, "global_step": 264493, "epoch": 3186} {"train_loss": -24.89915657043457, "global_step": 264494, "epoch": 3186} {"train_loss": -25.119831085205078, "global_step": 264495, "epoch": 3186} {"train_loss": -24.69023895263672, "global_step": 264496, "epoch": 3186} {"train_loss": -25.06414031982422, "global_step": 264497, "epoch": 3186} {"train_loss": -25.315155029296875, "global_step": 264498, "epoch": 3186} {"train_loss": -25.343896865844727, "global_step": 264499, "epoch": 3186} {"train_loss": -25.111608505249023, "global_step": 264500, "epoch": 3186} {"train_loss": -25.502426147460938, "global_step": 264501, "epoch": 3186} {"train_loss": -25.17536163330078, "global_step": 264502, "epoch": 3186} {"train_loss": -24.7432918548584, "global_step": 264503, "epoch": 3186} {"train_loss": -24.7417049407959, "global_step": 264504, "epoch": 3186} {"train_loss": -25.25136375427246, "global_step": 264505, "epoch": 3186} {"train_loss": -25.272096633911133, "global_step": 264506, "epoch": 3186} {"train_loss": -25.094409942626953, "global_step": 264507, "epoch": 3186} {"train_loss": -25.120746612548828, "global_step": 264508, "epoch": 3186} {"train_loss": -25.385683059692383, "global_step": 264509, "epoch": 3186} {"train_loss": -25.182992935180664, "global_step": 264510, "epoch": 3186} {"train_loss": -25.32868194580078, "global_step": 264511, "epoch": 3186} {"train_loss": -25.13505744934082, "global_step": 264512, "epoch": 3186} {"train_loss": -24.813932418823242, "global_step": 264513, "epoch": 3186} {"train_loss": -25.242300033569336, "global_step": 264514, "epoch": 3186} {"train_loss": -25.13704490661621, "global_step": 264515, "epoch": 3186} {"train_loss": -24.997283935546875, "global_step": 264516, "epoch": 3186} {"train_loss": -25.25901222229004, "global_step": 264517, "epoch": 3186} {"train_loss": -25.318891525268555, "global_step": 264518, "epoch": 3186} {"train_loss": -25.211639404296875, "global_step": 264519, "epoch": 3186} {"train_loss": -24.659958621105517, "global_step": 264520, "epoch": 3186, "val_loss": 6854259.5} {"train_loss": -24.152795791625977, "global_step": 264521, "epoch": 3187} {"train_loss": -24.044050216674805, "global_step": 264522, "epoch": 3187} {"train_loss": -24.174346923828125, "global_step": 264523, "epoch": 3187} {"train_loss": -24.656423568725586, "global_step": 264524, "epoch": 3187} {"train_loss": -24.47847557067871, "global_step": 264525, "epoch": 3187} {"train_loss": -25.276779174804688, "global_step": 264526, "epoch": 3187} {"train_loss": -24.436845779418945, "global_step": 264527, "epoch": 3187} {"train_loss": -25.25046730041504, "global_step": 264528, "epoch": 3187} {"train_loss": -24.66777992248535, "global_step": 264529, "epoch": 3187} {"train_loss": -24.76643943786621, "global_step": 264530, "epoch": 3187} {"train_loss": -24.581581115722656, "global_step": 264531, "epoch": 3187} {"train_loss": -24.857038497924805, "global_step": 264532, "epoch": 3187} {"train_loss": -24.408761978149414, "global_step": 264533, "epoch": 3187} {"train_loss": -24.75725746154785, "global_step": 264534, "epoch": 3187} {"train_loss": -24.683013916015625, "global_step": 264535, "epoch": 3187} {"train_loss": -24.69287109375, "global_step": 264536, "epoch": 3187} {"train_loss": -24.7346134185791, "global_step": 264537, "epoch": 3187} {"train_loss": -24.922691345214844, "global_step": 264538, "epoch": 3187} {"train_loss": -25.14420509338379, "global_step": 264539, "epoch": 3187} {"train_loss": -25.076501846313477, "global_step": 264540, "epoch": 3187} {"train_loss": -25.074926376342773, "global_step": 264541, "epoch": 3187} {"train_loss": -25.056472778320312, "global_step": 264542, "epoch": 3187} {"train_loss": -25.019344329833984, "global_step": 264543, "epoch": 3187} {"train_loss": -25.018863677978516, "global_step": 264544, "epoch": 3187} {"train_loss": -24.965442657470703, "global_step": 264545, "epoch": 3187} {"train_loss": -25.004064559936523, "global_step": 264546, "epoch": 3187} {"train_loss": -24.97907257080078, "global_step": 264547, "epoch": 3187} {"train_loss": -24.7961483001709, "global_step": 264548, "epoch": 3187} {"train_loss": -24.874832153320312, "global_step": 264549, "epoch": 3187} {"train_loss": -25.27520751953125, "global_step": 264550, "epoch": 3187} {"train_loss": -25.641620635986328, "global_step": 264551, "epoch": 3187} {"train_loss": -25.197765350341797, "global_step": 264552, "epoch": 3187} {"train_loss": -25.3729248046875, "global_step": 264553, "epoch": 3187} {"train_loss": -25.114614486694336, "global_step": 264554, "epoch": 3187} {"train_loss": -25.100622177124023, "global_step": 264555, "epoch": 3187} {"train_loss": -24.836118698120117, "global_step": 264556, "epoch": 3187} {"train_loss": -25.25092315673828, "global_step": 264557, "epoch": 3187} {"train_loss": -25.540048599243164, "global_step": 264558, "epoch": 3187} {"train_loss": -25.25208854675293, "global_step": 264559, "epoch": 3187} {"train_loss": -25.391443252563477, "global_step": 264560, "epoch": 3187} {"train_loss": -25.53624153137207, "global_step": 264561, "epoch": 3187} {"train_loss": -25.424283981323242, "global_step": 264562, "epoch": 3187} {"train_loss": -25.198421478271484, "global_step": 264563, "epoch": 3187} {"train_loss": -25.41328239440918, "global_step": 264564, "epoch": 3187} {"train_loss": -25.369277954101562, "global_step": 264565, "epoch": 3187} {"train_loss": -25.550373077392578, "global_step": 264566, "epoch": 3187} {"train_loss": -25.391103744506836, "global_step": 264567, "epoch": 3187} {"train_loss": -25.250141143798828, "global_step": 264568, "epoch": 3187} {"train_loss": -25.311433792114258, "global_step": 264569, "epoch": 3187} {"train_loss": -25.159311294555664, "global_step": 264570, "epoch": 3187} {"train_loss": -25.51624870300293, "global_step": 264571, "epoch": 3187} {"train_loss": -25.275964736938477, "global_step": 264572, "epoch": 3187} {"train_loss": -25.40106964111328, "global_step": 264573, "epoch": 3187} {"train_loss": -25.09308624267578, "global_step": 264574, "epoch": 3187} {"train_loss": -25.187942504882812, "global_step": 264575, "epoch": 3187} {"train_loss": -25.488666534423828, "global_step": 264576, "epoch": 3187} {"train_loss": -24.855314254760742, "global_step": 264577, "epoch": 3187} {"train_loss": -25.21453285217285, "global_step": 264578, "epoch": 3187} {"train_loss": -24.65016746520996, "global_step": 264579, "epoch": 3187} {"train_loss": -25.38755989074707, "global_step": 264580, "epoch": 3187} {"train_loss": -25.25784683227539, "global_step": 264581, "epoch": 3187} {"train_loss": -24.955673217773438, "global_step": 264582, "epoch": 3187} {"train_loss": -25.071090698242188, "global_step": 264583, "epoch": 3187} {"train_loss": -25.203229904174805, "global_step": 264584, "epoch": 3187} {"train_loss": -24.952430725097656, "global_step": 264585, "epoch": 3187} {"train_loss": -25.078781127929688, "global_step": 264586, "epoch": 3187} {"train_loss": -25.106504440307617, "global_step": 264587, "epoch": 3187} {"train_loss": -25.179428100585938, "global_step": 264588, "epoch": 3187} {"train_loss": -25.32391929626465, "global_step": 264589, "epoch": 3187} {"train_loss": -25.044097900390625, "global_step": 264590, "epoch": 3187} {"train_loss": -24.630664825439453, "global_step": 264591, "epoch": 3187} {"train_loss": -25.17959976196289, "global_step": 264592, "epoch": 3187} {"train_loss": -24.91973304748535, "global_step": 264593, "epoch": 3187} {"train_loss": -25.095680236816406, "global_step": 264594, "epoch": 3187} {"train_loss": -25.352436065673828, "global_step": 264595, "epoch": 3187} {"train_loss": -24.73894691467285, "global_step": 264596, "epoch": 3187} {"train_loss": -25.093067169189453, "global_step": 264597, "epoch": 3187} {"train_loss": -25.06287956237793, "global_step": 264598, "epoch": 3187} {"train_loss": -24.727252960205078, "global_step": 264599, "epoch": 3187} {"train_loss": -25.116544723510742, "global_step": 264600, "epoch": 3187} {"train_loss": -25.35389518737793, "global_step": 264601, "epoch": 3187} {"train_loss": -25.4840030670166, "global_step": 264602, "epoch": 3187} {"train_loss": -25.058554293161414, "global_step": 264603, "epoch": 3187, "val_loss": 6880615.0} {"train_loss": -25.170072555541992, "global_step": 264604, "epoch": 3188} {"train_loss": -24.761432647705078, "global_step": 264605, "epoch": 3188} {"train_loss": -24.91078758239746, "global_step": 264606, "epoch": 3188} {"train_loss": -25.066970825195312, "global_step": 264607, "epoch": 3188} {"train_loss": -25.331798553466797, "global_step": 264608, "epoch": 3188} {"train_loss": -25.06330680847168, "global_step": 264609, "epoch": 3188} {"train_loss": -25.17117691040039, "global_step": 264610, "epoch": 3188} {"train_loss": -24.881423950195312, "global_step": 264611, "epoch": 3188} {"train_loss": -25.05108070373535, "global_step": 264612, "epoch": 3188} {"train_loss": -24.527048110961914, "global_step": 264613, "epoch": 3188} {"train_loss": -24.462406158447266, "global_step": 264614, "epoch": 3188} {"train_loss": -24.849838256835938, "global_step": 264615, "epoch": 3188} {"train_loss": -25.278284072875977, "global_step": 264616, "epoch": 3188} {"train_loss": -24.610017776489258, "global_step": 264617, "epoch": 3188} {"train_loss": -24.8095703125, "global_step": 264618, "epoch": 3188} {"train_loss": -24.81130027770996, "global_step": 264619, "epoch": 3188} {"train_loss": -24.990036010742188, "global_step": 264620, "epoch": 3188} {"train_loss": -25.080900192260742, "global_step": 264621, "epoch": 3188} {"train_loss": -24.4401798248291, "global_step": 264622, "epoch": 3188} {"train_loss": -24.58429527282715, "global_step": 264623, "epoch": 3188} {"train_loss": -25.018070220947266, "global_step": 264624, "epoch": 3188} {"train_loss": -24.829309463500977, "global_step": 264625, "epoch": 3188} {"train_loss": -25.09477424621582, "global_step": 264626, "epoch": 3188} {"train_loss": -24.91560173034668, "global_step": 264627, "epoch": 3188} {"train_loss": -25.23243522644043, "global_step": 264628, "epoch": 3188} {"train_loss": -25.154653549194336, "global_step": 264629, "epoch": 3188} {"train_loss": -25.10898780822754, "global_step": 264630, "epoch": 3188} {"train_loss": -25.025915145874023, "global_step": 264631, "epoch": 3188} {"train_loss": -25.349544525146484, "global_step": 264632, "epoch": 3188} {"train_loss": -25.13104248046875, "global_step": 264633, "epoch": 3188} {"train_loss": -25.167192459106445, "global_step": 264634, "epoch": 3188} {"train_loss": -25.130258560180664, "global_step": 264635, "epoch": 3188} {"train_loss": -25.17584228515625, "global_step": 264636, "epoch": 3188} {"train_loss": -25.174549102783203, "global_step": 264637, "epoch": 3188} {"train_loss": -25.0318660736084, "global_step": 264638, "epoch": 3188} {"train_loss": -25.44364356994629, "global_step": 264639, "epoch": 3188} {"train_loss": -25.313201904296875, "global_step": 264640, "epoch": 3188} {"train_loss": -25.028928756713867, "global_step": 264641, "epoch": 3188} {"train_loss": -25.081815719604492, "global_step": 264642, "epoch": 3188} {"train_loss": -25.159469604492188, "global_step": 264643, "epoch": 3188} {"train_loss": -24.791452407836914, "global_step": 264644, "epoch": 3188} {"train_loss": -25.162033081054688, "global_step": 264645, "epoch": 3188} {"train_loss": -25.321645736694336, "global_step": 264646, "epoch": 3188} {"train_loss": -25.496259689331055, "global_step": 264647, "epoch": 3188} {"train_loss": -25.11970329284668, "global_step": 264648, "epoch": 3188} {"train_loss": -25.640583038330078, "global_step": 264649, "epoch": 3188} {"train_loss": -25.442310333251953, "global_step": 264650, "epoch": 3188} {"train_loss": -25.204233169555664, "global_step": 264651, "epoch": 3188} {"train_loss": -25.433021545410156, "global_step": 264652, "epoch": 3188} {"train_loss": -25.46352195739746, "global_step": 264653, "epoch": 3188} {"train_loss": -25.24764633178711, "global_step": 264654, "epoch": 3188} {"train_loss": -25.530691146850586, "global_step": 264655, "epoch": 3188} {"train_loss": -25.272537231445312, "global_step": 264656, "epoch": 3188} {"train_loss": -25.358577728271484, "global_step": 264657, "epoch": 3188} {"train_loss": -25.523527145385742, "global_step": 264658, "epoch": 3188} {"train_loss": -25.13960838317871, "global_step": 264659, "epoch": 3188} {"train_loss": -25.258121490478516, "global_step": 264660, "epoch": 3188} {"train_loss": -25.371723175048828, "global_step": 264661, "epoch": 3188} {"train_loss": -25.513837814331055, "global_step": 264662, "epoch": 3188} {"train_loss": -25.002721786499023, "global_step": 264663, "epoch": 3188} {"train_loss": -25.43086814880371, "global_step": 264664, "epoch": 3188} {"train_loss": -25.359600067138672, "global_step": 264665, "epoch": 3188} {"train_loss": -25.432199478149414, "global_step": 264666, "epoch": 3188} {"train_loss": -25.488697052001953, "global_step": 264667, "epoch": 3188} {"train_loss": -25.13857078552246, "global_step": 264668, "epoch": 3188} {"train_loss": -24.77967071533203, "global_step": 264669, "epoch": 3188} {"train_loss": -24.730581283569336, "global_step": 264670, "epoch": 3188} {"train_loss": -25.247669219970703, "global_step": 264671, "epoch": 3188} {"train_loss": -24.99094581604004, "global_step": 264672, "epoch": 3188} {"train_loss": -24.809873580932617, "global_step": 264673, "epoch": 3188} {"train_loss": -25.490005493164062, "global_step": 264674, "epoch": 3188} {"train_loss": -24.954151153564453, "global_step": 264675, "epoch": 3188} {"train_loss": -25.058774948120117, "global_step": 264676, "epoch": 3188} {"train_loss": -24.97714614868164, "global_step": 264677, "epoch": 3188} {"train_loss": -25.21180534362793, "global_step": 264678, "epoch": 3188} {"train_loss": -24.800214767456055, "global_step": 264679, "epoch": 3188} {"train_loss": -25.279447555541992, "global_step": 264680, "epoch": 3188} {"train_loss": -24.95313835144043, "global_step": 264681, "epoch": 3188} {"train_loss": -25.27259635925293, "global_step": 264682, "epoch": 3188} {"train_loss": -25.144062042236328, "global_step": 264683, "epoch": 3188} {"train_loss": -25.087080001831055, "global_step": 264684, "epoch": 3188} {"train_loss": -25.446231842041016, "global_step": 264685, "epoch": 3188} {"train_loss": -25.11326645081302, "global_step": 264686, "epoch": 3188, "val_loss": 6835792.5} {"train_loss": -24.280879974365234, "global_step": 264687, "epoch": 3189} {"train_loss": -24.219709396362305, "global_step": 264688, "epoch": 3189} {"train_loss": -24.812875747680664, "global_step": 264689, "epoch": 3189} {"train_loss": -24.74588966369629, "global_step": 264690, "epoch": 3189} {"train_loss": -24.521900177001953, "global_step": 264691, "epoch": 3189} {"train_loss": -24.539400100708008, "global_step": 264692, "epoch": 3189} {"train_loss": -24.35951042175293, "global_step": 264693, "epoch": 3189} {"train_loss": -24.30691909790039, "global_step": 264694, "epoch": 3189} {"train_loss": -24.475772857666016, "global_step": 264695, "epoch": 3189} {"train_loss": -24.893770217895508, "global_step": 264696, "epoch": 3189} {"train_loss": -24.1853084564209, "global_step": 264697, "epoch": 3189} {"train_loss": -24.84857749938965, "global_step": 264698, "epoch": 3189} {"train_loss": -24.754255294799805, "global_step": 264699, "epoch": 3189} {"train_loss": -24.873950958251953, "global_step": 264700, "epoch": 3189} {"train_loss": -24.469629287719727, "global_step": 264701, "epoch": 3189} {"train_loss": -24.630691528320312, "global_step": 264702, "epoch": 3189} {"train_loss": -25.073820114135742, "global_step": 264703, "epoch": 3189} {"train_loss": -24.941387176513672, "global_step": 264704, "epoch": 3189} {"train_loss": -24.694324493408203, "global_step": 264705, "epoch": 3189} {"train_loss": -24.612340927124023, "global_step": 264706, "epoch": 3189} {"train_loss": -24.818708419799805, "global_step": 264707, "epoch": 3189} {"train_loss": -25.065872192382812, "global_step": 264708, "epoch": 3189} {"train_loss": -25.40396499633789, "global_step": 264709, "epoch": 3189} {"train_loss": -25.02522850036621, "global_step": 264710, "epoch": 3189} {"train_loss": -25.079816818237305, "global_step": 264711, "epoch": 3189} {"train_loss": -25.053844451904297, "global_step": 264712, "epoch": 3189} {"train_loss": -24.85874366760254, "global_step": 264713, "epoch": 3189} {"train_loss": -25.116321563720703, "global_step": 264714, "epoch": 3189} {"train_loss": -24.800519943237305, "global_step": 264715, "epoch": 3189} {"train_loss": -25.34956932067871, "global_step": 264716, "epoch": 3189} {"train_loss": -25.385452270507812, "global_step": 264717, "epoch": 3189} {"train_loss": -25.026090621948242, "global_step": 264718, "epoch": 3189} {"train_loss": -25.294830322265625, "global_step": 264719, "epoch": 3189} {"train_loss": -25.30290412902832, "global_step": 264720, "epoch": 3189} {"train_loss": -25.04315757751465, "global_step": 264721, "epoch": 3189} {"train_loss": -25.11608123779297, "global_step": 264722, "epoch": 3189} {"train_loss": -25.2730770111084, "global_step": 264723, "epoch": 3189} {"train_loss": -25.307153701782227, "global_step": 264724, "epoch": 3189} {"train_loss": -25.12229347229004, "global_step": 264725, "epoch": 3189} {"train_loss": -24.97882843017578, "global_step": 264726, "epoch": 3189} {"train_loss": -25.3719425201416, "global_step": 264727, "epoch": 3189} {"train_loss": -25.40728759765625, "global_step": 264728, "epoch": 3189} {"train_loss": -25.148122787475586, "global_step": 264729, "epoch": 3189} {"train_loss": -25.237213134765625, "global_step": 264730, "epoch": 3189} {"train_loss": -25.473085403442383, "global_step": 264731, "epoch": 3189} {"train_loss": -25.150774002075195, "global_step": 264732, "epoch": 3189} {"train_loss": -25.33461570739746, "global_step": 264733, "epoch": 3189} {"train_loss": -25.207265853881836, "global_step": 264734, "epoch": 3189} {"train_loss": -25.12917137145996, "global_step": 264735, "epoch": 3189} {"train_loss": -25.48211669921875, "global_step": 264736, "epoch": 3189} {"train_loss": -25.166227340698242, "global_step": 264737, "epoch": 3189} {"train_loss": -25.51525115966797, "global_step": 264738, "epoch": 3189} {"train_loss": -25.198841094970703, "global_step": 264739, "epoch": 3189} {"train_loss": -25.129749298095703, "global_step": 264740, "epoch": 3189} {"train_loss": -25.87761878967285, "global_step": 264741, "epoch": 3189} {"train_loss": -25.448991775512695, "global_step": 264742, "epoch": 3189} {"train_loss": -25.473434448242188, "global_step": 264743, "epoch": 3189} {"train_loss": -25.52670669555664, "global_step": 264744, "epoch": 3189} {"train_loss": -25.347606658935547, "global_step": 264745, "epoch": 3189} {"train_loss": -25.507770538330078, "global_step": 264746, "epoch": 3189} {"train_loss": -25.4166259765625, "global_step": 264747, "epoch": 3189} {"train_loss": -25.291250228881836, "global_step": 264748, "epoch": 3189} {"train_loss": -25.248151779174805, "global_step": 264749, "epoch": 3189} {"train_loss": -25.56236457824707, "global_step": 264750, "epoch": 3189} {"train_loss": -25.223440170288086, "global_step": 264751, "epoch": 3189} {"train_loss": -25.420621871948242, "global_step": 264752, "epoch": 3189} {"train_loss": -25.219045639038086, "global_step": 264753, "epoch": 3189} {"train_loss": -25.38278579711914, "global_step": 264754, "epoch": 3189} {"train_loss": -25.30230140686035, "global_step": 264755, "epoch": 3189} {"train_loss": -25.132246017456055, "global_step": 264756, "epoch": 3189} {"train_loss": -25.043962478637695, "global_step": 264757, "epoch": 3189} {"train_loss": -24.74616813659668, "global_step": 264758, "epoch": 3189} {"train_loss": -25.092031478881836, "global_step": 264759, "epoch": 3189} {"train_loss": -25.555957794189453, "global_step": 264760, "epoch": 3189} {"train_loss": -25.3348445892334, "global_step": 264761, "epoch": 3189} {"train_loss": -24.51962661743164, "global_step": 264762, "epoch": 3189} {"train_loss": -24.65744400024414, "global_step": 264763, "epoch": 3189} {"train_loss": -25.09992790222168, "global_step": 264764, "epoch": 3189} {"train_loss": -25.03972625732422, "global_step": 264765, "epoch": 3189} {"train_loss": -24.479145050048828, "global_step": 264766, "epoch": 3189} {"train_loss": -25.070737838745117, "global_step": 264767, "epoch": 3189} {"train_loss": -24.661937713623047, "global_step": 264768, "epoch": 3189} {"train_loss": -25.04087528550481, "global_step": 264769, "epoch": 3189, "val_loss": 6842141.0} {"train_loss": -24.341018676757812, "global_step": 264770, "epoch": 3190} {"train_loss": -22.863798141479492, "global_step": 264771, "epoch": 3190} {"train_loss": -24.428247451782227, "global_step": 264772, "epoch": 3190} {"train_loss": -23.83711051940918, "global_step": 264773, "epoch": 3190} {"train_loss": -24.587026596069336, "global_step": 264774, "epoch": 3190} {"train_loss": -23.974477767944336, "global_step": 264775, "epoch": 3190} {"train_loss": -24.37213134765625, "global_step": 264776, "epoch": 3190} {"train_loss": -24.579639434814453, "global_step": 264777, "epoch": 3190} {"train_loss": -24.62908935546875, "global_step": 264778, "epoch": 3190} {"train_loss": -24.085988998413086, "global_step": 264779, "epoch": 3190} {"train_loss": -24.965560913085938, "global_step": 264780, "epoch": 3190} {"train_loss": -24.562606811523438, "global_step": 264781, "epoch": 3190} {"train_loss": -24.57752799987793, "global_step": 264782, "epoch": 3190} {"train_loss": -24.636194229125977, "global_step": 264783, "epoch": 3190} {"train_loss": -25.01612091064453, "global_step": 264784, "epoch": 3190} {"train_loss": -24.912628173828125, "global_step": 264785, "epoch": 3190} {"train_loss": -24.925220489501953, "global_step": 264786, "epoch": 3190} {"train_loss": -24.970365524291992, "global_step": 264787, "epoch": 3190} {"train_loss": -24.374675750732422, "global_step": 264788, "epoch": 3190} {"train_loss": -25.130346298217773, "global_step": 264789, "epoch": 3190} {"train_loss": -24.717924118041992, "global_step": 264790, "epoch": 3190} {"train_loss": -24.81804847717285, "global_step": 264791, "epoch": 3190} {"train_loss": -25.024259567260742, "global_step": 264792, "epoch": 3190} {"train_loss": -25.089609146118164, "global_step": 264793, "epoch": 3190} {"train_loss": -25.253393173217773, "global_step": 264794, "epoch": 3190} {"train_loss": -25.012399673461914, "global_step": 264795, "epoch": 3190} {"train_loss": -24.914228439331055, "global_step": 264796, "epoch": 3190} {"train_loss": -24.92667007446289, "global_step": 264797, "epoch": 3190} {"train_loss": -25.02571678161621, "global_step": 264798, "epoch": 3190} {"train_loss": -24.770612716674805, "global_step": 264799, "epoch": 3190} {"train_loss": -25.276403427124023, "global_step": 264800, "epoch": 3190} {"train_loss": -25.215335845947266, "global_step": 264801, "epoch": 3190} {"train_loss": -25.302663803100586, "global_step": 264802, "epoch": 3190} {"train_loss": -25.1036319732666, "global_step": 264803, "epoch": 3190} {"train_loss": -25.021146774291992, "global_step": 264804, "epoch": 3190} {"train_loss": -24.97951316833496, "global_step": 264805, "epoch": 3190} {"train_loss": -25.36863136291504, "global_step": 264806, "epoch": 3190} {"train_loss": -25.25138282775879, "global_step": 264807, "epoch": 3190} {"train_loss": -24.92197036743164, "global_step": 264808, "epoch": 3190} {"train_loss": -25.27469253540039, "global_step": 264809, "epoch": 3190} {"train_loss": -25.564085006713867, "global_step": 264810, "epoch": 3190} {"train_loss": -25.157690048217773, "global_step": 264811, "epoch": 3190} {"train_loss": -24.991785049438477, "global_step": 264812, "epoch": 3190} {"train_loss": -25.003278732299805, "global_step": 264813, "epoch": 3190} {"train_loss": -25.419950485229492, "global_step": 264814, "epoch": 3190} {"train_loss": -25.46870994567871, "global_step": 264815, "epoch": 3190} {"train_loss": -25.197574615478516, "global_step": 264816, "epoch": 3190} {"train_loss": -25.35223388671875, "global_step": 264817, "epoch": 3190} {"train_loss": -25.220075607299805, "global_step": 264818, "epoch": 3190} {"train_loss": -25.199304580688477, "global_step": 264819, "epoch": 3190} {"train_loss": -25.71693229675293, "global_step": 264820, "epoch": 3190} {"train_loss": -25.295047760009766, "global_step": 264821, "epoch": 3190} {"train_loss": -25.593143463134766, "global_step": 264822, "epoch": 3190} {"train_loss": -24.955041885375977, "global_step": 264823, "epoch": 3190} {"train_loss": -25.25084686279297, "global_step": 264824, "epoch": 3190} {"train_loss": -25.181921005249023, "global_step": 264825, "epoch": 3190} {"train_loss": -25.25609588623047, "global_step": 264826, "epoch": 3190} {"train_loss": -24.670202255249023, "global_step": 264827, "epoch": 3190} {"train_loss": -24.83628273010254, "global_step": 264828, "epoch": 3190} {"train_loss": -24.820478439331055, "global_step": 264829, "epoch": 3190} {"train_loss": -25.19901466369629, "global_step": 264830, "epoch": 3190} {"train_loss": -25.18361473083496, "global_step": 264831, "epoch": 3190} {"train_loss": -25.091787338256836, "global_step": 264832, "epoch": 3190} {"train_loss": -25.15912437438965, "global_step": 264833, "epoch": 3190} {"train_loss": -25.431121826171875, "global_step": 264834, "epoch": 3190} {"train_loss": -25.104421615600586, "global_step": 264835, "epoch": 3190} {"train_loss": -24.393930435180664, "global_step": 264836, "epoch": 3190} {"train_loss": -25.18608856201172, "global_step": 264837, "epoch": 3190} {"train_loss": -24.96200942993164, "global_step": 264838, "epoch": 3190} {"train_loss": -25.393003463745117, "global_step": 264839, "epoch": 3190} {"train_loss": -25.339096069335938, "global_step": 264840, "epoch": 3190} {"train_loss": -25.45821762084961, "global_step": 264841, "epoch": 3190} {"train_loss": -25.09482765197754, "global_step": 264842, "epoch": 3190} {"train_loss": -25.538694381713867, "global_step": 264843, "epoch": 3190} {"train_loss": -24.9517879486084, "global_step": 264844, "epoch": 3190} {"train_loss": -25.189146041870117, "global_step": 264845, "epoch": 3190} {"train_loss": -25.299570083618164, "global_step": 264846, "epoch": 3190} {"train_loss": -25.18663787841797, "global_step": 264847, "epoch": 3190} {"train_loss": -25.57129669189453, "global_step": 264848, "epoch": 3190} {"train_loss": -25.642120361328125, "global_step": 264849, "epoch": 3190} {"train_loss": -25.039060592651367, "global_step": 264850, "epoch": 3190} {"train_loss": -25.607776641845703, "global_step": 264851, "epoch": 3190} {"train_loss": -24.995760009949464, "global_step": 264852, "epoch": 3190, "val_loss": 7037634.0} {"train_loss": -24.118131637573242, "global_step": 264853, "epoch": 3191} {"train_loss": -23.838151931762695, "global_step": 264854, "epoch": 3191} {"train_loss": -24.621984481811523, "global_step": 264855, "epoch": 3191} {"train_loss": -24.289464950561523, "global_step": 264856, "epoch": 3191} {"train_loss": -24.075056076049805, "global_step": 264857, "epoch": 3191} {"train_loss": -24.527332305908203, "global_step": 264858, "epoch": 3191} {"train_loss": -23.865537643432617, "global_step": 264859, "epoch": 3191} {"train_loss": -24.68253517150879, "global_step": 264860, "epoch": 3191} {"train_loss": -24.640493392944336, "global_step": 264861, "epoch": 3191} {"train_loss": -24.712751388549805, "global_step": 264862, "epoch": 3191} {"train_loss": -24.555315017700195, "global_step": 264863, "epoch": 3191} {"train_loss": -24.558164596557617, "global_step": 264864, "epoch": 3191} {"train_loss": -24.820293426513672, "global_step": 264865, "epoch": 3191} {"train_loss": -24.994953155517578, "global_step": 264866, "epoch": 3191} {"train_loss": -24.5377140045166, "global_step": 264867, "epoch": 3191} {"train_loss": -24.768774032592773, "global_step": 264868, "epoch": 3191} {"train_loss": -24.473440170288086, "global_step": 264869, "epoch": 3191} {"train_loss": -25.101205825805664, "global_step": 264870, "epoch": 3191} {"train_loss": -24.874433517456055, "global_step": 264871, "epoch": 3191} {"train_loss": -24.646631240844727, "global_step": 264872, "epoch": 3191} {"train_loss": -24.72875213623047, "global_step": 264873, "epoch": 3191} {"train_loss": -24.726606369018555, "global_step": 264874, "epoch": 3191} {"train_loss": -25.015504837036133, "global_step": 264875, "epoch": 3191} {"train_loss": -24.797216415405273, "global_step": 264876, "epoch": 3191} {"train_loss": -24.847078323364258, "global_step": 264877, "epoch": 3191} {"train_loss": -24.803003311157227, "global_step": 264878, "epoch": 3191} {"train_loss": -24.705923080444336, "global_step": 264879, "epoch": 3191} {"train_loss": -25.355222702026367, "global_step": 264880, "epoch": 3191} {"train_loss": -24.960933685302734, "global_step": 264881, "epoch": 3191} {"train_loss": -24.8637638092041, "global_step": 264882, "epoch": 3191} {"train_loss": -24.656644821166992, "global_step": 264883, "epoch": 3191} {"train_loss": -24.665334701538086, "global_step": 264884, "epoch": 3191} {"train_loss": -24.947656631469727, "global_step": 264885, "epoch": 3191} {"train_loss": -24.99783706665039, "global_step": 264886, "epoch": 3191} {"train_loss": -24.87403678894043, "global_step": 264887, "epoch": 3191} {"train_loss": -24.903593063354492, "global_step": 264888, "epoch": 3191} {"train_loss": -25.017499923706055, "global_step": 264889, "epoch": 3191} {"train_loss": -25.32857894897461, "global_step": 264890, "epoch": 3191} {"train_loss": -25.220680236816406, "global_step": 264891, "epoch": 3191} {"train_loss": -25.191356658935547, "global_step": 264892, "epoch": 3191} {"train_loss": -25.374794006347656, "global_step": 264893, "epoch": 3191} {"train_loss": -25.120676040649414, "global_step": 264894, "epoch": 3191} {"train_loss": -24.964937210083008, "global_step": 264895, "epoch": 3191} {"train_loss": -25.1755313873291, "global_step": 264896, "epoch": 3191} {"train_loss": -25.152509689331055, "global_step": 264897, "epoch": 3191} {"train_loss": -25.04328727722168, "global_step": 264898, "epoch": 3191} {"train_loss": -25.115856170654297, "global_step": 264899, "epoch": 3191} {"train_loss": -25.499710083007812, "global_step": 264900, "epoch": 3191} {"train_loss": -25.319225311279297, "global_step": 264901, "epoch": 3191} {"train_loss": -24.8625545501709, "global_step": 264902, "epoch": 3191} {"train_loss": -25.170785903930664, "global_step": 264903, "epoch": 3191} {"train_loss": -25.0229549407959, "global_step": 264904, "epoch": 3191} {"train_loss": -25.02332305908203, "global_step": 264905, "epoch": 3191} {"train_loss": -25.21990966796875, "global_step": 264906, "epoch": 3191} {"train_loss": -25.57597541809082, "global_step": 264907, "epoch": 3191} {"train_loss": -25.245235443115234, "global_step": 264908, "epoch": 3191} {"train_loss": -25.197534561157227, "global_step": 264909, "epoch": 3191} {"train_loss": -25.06583023071289, "global_step": 264910, "epoch": 3191} {"train_loss": -25.271713256835938, "global_step": 264911, "epoch": 3191} {"train_loss": -24.968730926513672, "global_step": 264912, "epoch": 3191} {"train_loss": -25.141130447387695, "global_step": 264913, "epoch": 3191} {"train_loss": -25.248563766479492, "global_step": 264914, "epoch": 3191} {"train_loss": -25.015050888061523, "global_step": 264915, "epoch": 3191} {"train_loss": -25.36695671081543, "global_step": 264916, "epoch": 3191} {"train_loss": -25.57698631286621, "global_step": 264917, "epoch": 3191} {"train_loss": -25.110807418823242, "global_step": 264918, "epoch": 3191} {"train_loss": -24.79182243347168, "global_step": 264919, "epoch": 3191} {"train_loss": -24.7921142578125, "global_step": 264920, "epoch": 3191} {"train_loss": -25.20845603942871, "global_step": 264921, "epoch": 3191} {"train_loss": -25.13004493713379, "global_step": 264922, "epoch": 3191} {"train_loss": -24.86237907409668, "global_step": 264923, "epoch": 3191} {"train_loss": -25.184789657592773, "global_step": 264924, "epoch": 3191} {"train_loss": -25.14728355407715, "global_step": 264925, "epoch": 3191} {"train_loss": -25.167327880859375, "global_step": 264926, "epoch": 3191} {"train_loss": -24.9401912689209, "global_step": 264927, "epoch": 3191} {"train_loss": -25.08083152770996, "global_step": 264928, "epoch": 3191} {"train_loss": -25.40532875061035, "global_step": 264929, "epoch": 3191} {"train_loss": -25.3253116607666, "global_step": 264930, "epoch": 3191} {"train_loss": -25.021257400512695, "global_step": 264931, "epoch": 3191} {"train_loss": -25.08319854736328, "global_step": 264932, "epoch": 3191} {"train_loss": -25.476560592651367, "global_step": 264933, "epoch": 3191} {"train_loss": -25.370506286621094, "global_step": 264934, "epoch": 3191} {"train_loss": -24.94744048061141, "global_step": 264935, "epoch": 3191, "val_loss": 7024540.0} {"train_loss": -24.92767906188965, "global_step": 264936, "epoch": 3192} {"train_loss": -24.06140899658203, "global_step": 264937, "epoch": 3192} {"train_loss": -24.943130493164062, "global_step": 264938, "epoch": 3192} {"train_loss": -24.610219955444336, "global_step": 264939, "epoch": 3192} {"train_loss": -24.6653995513916, "global_step": 264940, "epoch": 3192} {"train_loss": -25.202390670776367, "global_step": 264941, "epoch": 3192} {"train_loss": -24.41993522644043, "global_step": 264942, "epoch": 3192} {"train_loss": -24.774978637695312, "global_step": 264943, "epoch": 3192} {"train_loss": -24.932453155517578, "global_step": 264944, "epoch": 3192} {"train_loss": -24.66287612915039, "global_step": 264945, "epoch": 3192} {"train_loss": -24.76680564880371, "global_step": 264946, "epoch": 3192} {"train_loss": -25.082515716552734, "global_step": 264947, "epoch": 3192} {"train_loss": -24.907453536987305, "global_step": 264948, "epoch": 3192} {"train_loss": -24.926563262939453, "global_step": 264949, "epoch": 3192} {"train_loss": -24.841175079345703, "global_step": 264950, "epoch": 3192} {"train_loss": -25.351484298706055, "global_step": 264951, "epoch": 3192} {"train_loss": -24.923128128051758, "global_step": 264952, "epoch": 3192} {"train_loss": -25.069196701049805, "global_step": 264953, "epoch": 3192} {"train_loss": -25.600372314453125, "global_step": 264954, "epoch": 3192} {"train_loss": -24.83249855041504, "global_step": 264955, "epoch": 3192} {"train_loss": -24.958524703979492, "global_step": 264956, "epoch": 3192} {"train_loss": -25.03374671936035, "global_step": 264957, "epoch": 3192} {"train_loss": -25.506824493408203, "global_step": 264958, "epoch": 3192} {"train_loss": -25.148344039916992, "global_step": 264959, "epoch": 3192} {"train_loss": -25.122140884399414, "global_step": 264960, "epoch": 3192} {"train_loss": -25.602100372314453, "global_step": 264961, "epoch": 3192} {"train_loss": -25.418004989624023, "global_step": 264962, "epoch": 3192} {"train_loss": -25.14143943786621, "global_step": 264963, "epoch": 3192} {"train_loss": -25.48919677734375, "global_step": 264964, "epoch": 3192} {"train_loss": -25.268117904663086, "global_step": 264965, "epoch": 3192} {"train_loss": -25.293176651000977, "global_step": 264966, "epoch": 3192} {"train_loss": -24.745786666870117, "global_step": 264967, "epoch": 3192} {"train_loss": -24.950239181518555, "global_step": 264968, "epoch": 3192} {"train_loss": -25.22287940979004, "global_step": 264969, "epoch": 3192} {"train_loss": -25.176239013671875, "global_step": 264970, "epoch": 3192} {"train_loss": -25.414213180541992, "global_step": 264971, "epoch": 3192} {"train_loss": -25.372385025024414, "global_step": 264972, "epoch": 3192} {"train_loss": -25.187618255615234, "global_step": 264973, "epoch": 3192} {"train_loss": -25.582860946655273, "global_step": 264974, "epoch": 3192} {"train_loss": -24.713003158569336, "global_step": 264975, "epoch": 3192} {"train_loss": -25.38671875, "global_step": 264976, "epoch": 3192} {"train_loss": -25.273168563842773, "global_step": 264977, "epoch": 3192} {"train_loss": -25.62664794921875, "global_step": 264978, "epoch": 3192} {"train_loss": -25.20826530456543, "global_step": 264979, "epoch": 3192} {"train_loss": -25.293996810913086, "global_step": 264980, "epoch": 3192} {"train_loss": -25.159215927124023, "global_step": 264981, "epoch": 3192} {"train_loss": -24.991254806518555, "global_step": 264982, "epoch": 3192} {"train_loss": -25.720930099487305, "global_step": 264983, "epoch": 3192} {"train_loss": -24.907085418701172, "global_step": 264984, "epoch": 3192} {"train_loss": -25.327713012695312, "global_step": 264985, "epoch": 3192} {"train_loss": -25.393415451049805, "global_step": 264986, "epoch": 3192} {"train_loss": -25.369478225708008, "global_step": 264987, "epoch": 3192} {"train_loss": -25.49881935119629, "global_step": 264988, "epoch": 3192} {"train_loss": -25.194814682006836, "global_step": 264989, "epoch": 3192} {"train_loss": -25.548782348632812, "global_step": 264990, "epoch": 3192} {"train_loss": -25.343351364135742, "global_step": 264991, "epoch": 3192} {"train_loss": -24.97770118713379, "global_step": 264992, "epoch": 3192} {"train_loss": -25.32582664489746, "global_step": 264993, "epoch": 3192} {"train_loss": -25.301183700561523, "global_step": 264994, "epoch": 3192} {"train_loss": -25.1602840423584, "global_step": 264995, "epoch": 3192} {"train_loss": -25.10296630859375, "global_step": 264996, "epoch": 3192} {"train_loss": -25.134876251220703, "global_step": 264997, "epoch": 3192} {"train_loss": -25.143430709838867, "global_step": 264998, "epoch": 3192} {"train_loss": -24.867136001586914, "global_step": 264999, "epoch": 3192} {"train_loss": -25.09803581237793, "global_step": 265000, "epoch": 3192} {"train_loss": -24.960012435913086, "global_step": 265001, "epoch": 3192} {"train_loss": -25.166336059570312, "global_step": 265002, "epoch": 3192} {"train_loss": -25.12892723083496, "global_step": 265003, "epoch": 3192} {"train_loss": -25.28936195373535, "global_step": 265004, "epoch": 3192} {"train_loss": -24.957796096801758, "global_step": 265005, "epoch": 3192} {"train_loss": -25.06492042541504, "global_step": 265006, "epoch": 3192} {"train_loss": -25.482816696166992, "global_step": 265007, "epoch": 3192} {"train_loss": -25.311201095581055, "global_step": 265008, "epoch": 3192} {"train_loss": -25.46001434326172, "global_step": 265009, "epoch": 3192} {"train_loss": -24.877891540527344, "global_step": 265010, "epoch": 3192} {"train_loss": -24.94141387939453, "global_step": 265011, "epoch": 3192} {"train_loss": -25.226287841796875, "global_step": 265012, "epoch": 3192} {"train_loss": -25.338171005249023, "global_step": 265013, "epoch": 3192} {"train_loss": -25.12502098083496, "global_step": 265014, "epoch": 3192} {"train_loss": -25.270675659179688, "global_step": 265015, "epoch": 3192} {"train_loss": -25.05585289001465, "global_step": 265016, "epoch": 3192} {"train_loss": -24.960819244384766, "global_step": 265017, "epoch": 3192} {"train_loss": -25.13732581540763, "global_step": 265018, "epoch": 3192, "val_loss": 6979789.0} {"train_loss": -24.73876190185547, "global_step": 265019, "epoch": 3193} {"train_loss": -24.97820281982422, "global_step": 265020, "epoch": 3193} {"train_loss": -24.7611141204834, "global_step": 265021, "epoch": 3193} {"train_loss": -24.61164093017578, "global_step": 265022, "epoch": 3193} {"train_loss": -24.403852462768555, "global_step": 265023, "epoch": 3193} {"train_loss": -24.858869552612305, "global_step": 265024, "epoch": 3193} {"train_loss": -24.912927627563477, "global_step": 265025, "epoch": 3193} {"train_loss": -24.790149688720703, "global_step": 265026, "epoch": 3193} {"train_loss": -25.14767837524414, "global_step": 265027, "epoch": 3193} {"train_loss": -24.768199920654297, "global_step": 265028, "epoch": 3193} {"train_loss": -24.692928314208984, "global_step": 265029, "epoch": 3193} {"train_loss": -24.92850685119629, "global_step": 265030, "epoch": 3193} {"train_loss": -24.755765914916992, "global_step": 265031, "epoch": 3193} {"train_loss": -24.87446403503418, "global_step": 265032, "epoch": 3193} {"train_loss": -24.868087768554688, "global_step": 265033, "epoch": 3193} {"train_loss": -25.41919708251953, "global_step": 265034, "epoch": 3193} {"train_loss": -25.056598663330078, "global_step": 265035, "epoch": 3193} {"train_loss": -24.73368263244629, "global_step": 265036, "epoch": 3193} {"train_loss": -25.334836959838867, "global_step": 265037, "epoch": 3193} {"train_loss": -25.25796890258789, "global_step": 265038, "epoch": 3193} {"train_loss": -24.72672462463379, "global_step": 265039, "epoch": 3193} {"train_loss": -24.815265655517578, "global_step": 265040, "epoch": 3193} {"train_loss": -25.02928924560547, "global_step": 265041, "epoch": 3193} {"train_loss": -25.184894561767578, "global_step": 265042, "epoch": 3193} {"train_loss": -24.6368465423584, "global_step": 265043, "epoch": 3193} {"train_loss": -25.326248168945312, "global_step": 265044, "epoch": 3193} {"train_loss": -25.365753173828125, "global_step": 265045, "epoch": 3193} {"train_loss": -25.652387619018555, "global_step": 265046, "epoch": 3193} {"train_loss": -25.227636337280273, "global_step": 265047, "epoch": 3193} {"train_loss": -25.183496475219727, "global_step": 265048, "epoch": 3193} {"train_loss": -25.141891479492188, "global_step": 265049, "epoch": 3193} {"train_loss": -25.445602416992188, "global_step": 265050, "epoch": 3193} {"train_loss": -25.03828239440918, "global_step": 265051, "epoch": 3193} {"train_loss": -25.318021774291992, "global_step": 265052, "epoch": 3193} {"train_loss": -25.35859489440918, "global_step": 265053, "epoch": 3193} {"train_loss": -25.08368682861328, "global_step": 265054, "epoch": 3193} {"train_loss": -25.133155822753906, "global_step": 265055, "epoch": 3193} {"train_loss": -25.478363037109375, "global_step": 265056, "epoch": 3193} {"train_loss": -25.47468376159668, "global_step": 265057, "epoch": 3193} {"train_loss": -25.410755157470703, "global_step": 265058, "epoch": 3193} {"train_loss": -25.389389038085938, "global_step": 265059, "epoch": 3193} {"train_loss": -25.59457015991211, "global_step": 265060, "epoch": 3193} {"train_loss": -25.86603355407715, "global_step": 265061, "epoch": 3193} {"train_loss": -25.522703170776367, "global_step": 265062, "epoch": 3193} {"train_loss": -25.453947067260742, "global_step": 265063, "epoch": 3193} {"train_loss": -25.074674606323242, "global_step": 265064, "epoch": 3193} {"train_loss": -25.179716110229492, "global_step": 265065, "epoch": 3193} {"train_loss": -25.11053466796875, "global_step": 265066, "epoch": 3193} {"train_loss": -25.149824142456055, "global_step": 265067, "epoch": 3193} {"train_loss": -25.216190338134766, "global_step": 265068, "epoch": 3193} {"train_loss": -25.172908782958984, "global_step": 265069, "epoch": 3193} {"train_loss": -24.795604705810547, "global_step": 265070, "epoch": 3193} {"train_loss": -24.853918075561523, "global_step": 265071, "epoch": 3193} {"train_loss": -25.347883224487305, "global_step": 265072, "epoch": 3193} {"train_loss": -25.103565216064453, "global_step": 265073, "epoch": 3193} {"train_loss": -24.90040397644043, "global_step": 265074, "epoch": 3193} {"train_loss": -25.23350715637207, "global_step": 265075, "epoch": 3193} {"train_loss": -25.383756637573242, "global_step": 265076, "epoch": 3193} {"train_loss": -24.868539810180664, "global_step": 265077, "epoch": 3193} {"train_loss": -25.521223068237305, "global_step": 265078, "epoch": 3193} {"train_loss": -25.216787338256836, "global_step": 265079, "epoch": 3193} {"train_loss": -25.420562744140625, "global_step": 265080, "epoch": 3193} {"train_loss": -25.255084991455078, "global_step": 265081, "epoch": 3193} {"train_loss": -25.569705963134766, "global_step": 265082, "epoch": 3193} {"train_loss": -25.11847496032715, "global_step": 265083, "epoch": 3193} {"train_loss": -25.340246200561523, "global_step": 265084, "epoch": 3193} {"train_loss": -25.34792137145996, "global_step": 265085, "epoch": 3193} {"train_loss": -25.153478622436523, "global_step": 265086, "epoch": 3193} {"train_loss": -25.10342788696289, "global_step": 265087, "epoch": 3193} {"train_loss": -25.073148727416992, "global_step": 265088, "epoch": 3193} {"train_loss": -24.987272262573242, "global_step": 265089, "epoch": 3193} {"train_loss": -24.97887420654297, "global_step": 265090, "epoch": 3193} {"train_loss": -25.192489624023438, "global_step": 265091, "epoch": 3193} {"train_loss": -24.89354705810547, "global_step": 265092, "epoch": 3193} {"train_loss": -25.39291763305664, "global_step": 265093, "epoch": 3193} {"train_loss": -25.091615676879883, "global_step": 265094, "epoch": 3193} {"train_loss": -25.632160186767578, "global_step": 265095, "epoch": 3193} {"train_loss": -25.002845764160156, "global_step": 265096, "epoch": 3193} {"train_loss": -25.34209632873535, "global_step": 265097, "epoch": 3193} {"train_loss": -25.466306686401367, "global_step": 265098, "epoch": 3193} {"train_loss": -25.29170036315918, "global_step": 265099, "epoch": 3193} {"train_loss": -25.123706817626953, "global_step": 265100, "epoch": 3193} {"train_loss": -25.141373944569782, "global_step": 265101, "epoch": 3193, "val_loss": 6909259.0} {"train_loss": -24.71754264831543, "global_step": 265102, "epoch": 3194} {"train_loss": -24.867053985595703, "global_step": 265103, "epoch": 3194} {"train_loss": -25.078540802001953, "global_step": 265104, "epoch": 3194} {"train_loss": -24.9971923828125, "global_step": 265105, "epoch": 3194} {"train_loss": -24.8229923248291, "global_step": 265106, "epoch": 3194} {"train_loss": -24.928394317626953, "global_step": 265107, "epoch": 3194} {"train_loss": -25.0373477935791, "global_step": 265108, "epoch": 3194} {"train_loss": -24.936777114868164, "global_step": 265109, "epoch": 3194} {"train_loss": -24.549219131469727, "global_step": 265110, "epoch": 3194} {"train_loss": -24.92496109008789, "global_step": 265111, "epoch": 3194} {"train_loss": -25.25215721130371, "global_step": 265112, "epoch": 3194} {"train_loss": -25.106895446777344, "global_step": 265113, "epoch": 3194} {"train_loss": -25.248493194580078, "global_step": 265114, "epoch": 3194} {"train_loss": -25.029937744140625, "global_step": 265115, "epoch": 3194} {"train_loss": -25.291751861572266, "global_step": 265116, "epoch": 3194} {"train_loss": -25.063785552978516, "global_step": 265117, "epoch": 3194} {"train_loss": -24.95803451538086, "global_step": 265118, "epoch": 3194} {"train_loss": -25.012388229370117, "global_step": 265119, "epoch": 3194} {"train_loss": -25.192262649536133, "global_step": 265120, "epoch": 3194} {"train_loss": -25.23422622680664, "global_step": 265121, "epoch": 3194} {"train_loss": -25.037595748901367, "global_step": 265122, "epoch": 3194} {"train_loss": -25.291677474975586, "global_step": 265123, "epoch": 3194} {"train_loss": -25.064313888549805, "global_step": 265124, "epoch": 3194} {"train_loss": -25.03142738342285, "global_step": 265125, "epoch": 3194} {"train_loss": -24.760345458984375, "global_step": 265126, "epoch": 3194} {"train_loss": -25.078353881835938, "global_step": 265127, "epoch": 3194} {"train_loss": -25.229406356811523, "global_step": 265128, "epoch": 3194} {"train_loss": -25.26224708557129, "global_step": 265129, "epoch": 3194} {"train_loss": -24.804014205932617, "global_step": 265130, "epoch": 3194} {"train_loss": -24.864774703979492, "global_step": 265131, "epoch": 3194} {"train_loss": -25.390947341918945, "global_step": 265132, "epoch": 3194} {"train_loss": -25.265600204467773, "global_step": 265133, "epoch": 3194} {"train_loss": -25.17478370666504, "global_step": 265134, "epoch": 3194} {"train_loss": -25.597379684448242, "global_step": 265135, "epoch": 3194} {"train_loss": -25.275741577148438, "global_step": 265136, "epoch": 3194} {"train_loss": -25.32273292541504, "global_step": 265137, "epoch": 3194} {"train_loss": -25.20608901977539, "global_step": 265138, "epoch": 3194} {"train_loss": -25.304471969604492, "global_step": 265139, "epoch": 3194} {"train_loss": -25.421422958374023, "global_step": 265140, "epoch": 3194} {"train_loss": -25.35828399658203, "global_step": 265141, "epoch": 3194} {"train_loss": -25.563034057617188, "global_step": 265142, "epoch": 3194} {"train_loss": -25.369308471679688, "global_step": 265143, "epoch": 3194} {"train_loss": -25.144994735717773, "global_step": 265144, "epoch": 3194} {"train_loss": -25.149084091186523, "global_step": 265145, "epoch": 3194} {"train_loss": -24.66598129272461, "global_step": 265146, "epoch": 3194} {"train_loss": -24.05924415588379, "global_step": 265147, "epoch": 3194} {"train_loss": -23.992355346679688, "global_step": 265148, "epoch": 3194} {"train_loss": -25.29608726501465, "global_step": 265149, "epoch": 3194} {"train_loss": -24.584609985351562, "global_step": 265150, "epoch": 3194} {"train_loss": -24.82578468322754, "global_step": 265151, "epoch": 3194} {"train_loss": -24.55631446838379, "global_step": 265152, "epoch": 3194} {"train_loss": -25.016860961914062, "global_step": 265153, "epoch": 3194} {"train_loss": -24.492942810058594, "global_step": 265154, "epoch": 3194} {"train_loss": -24.8408203125, "global_step": 265155, "epoch": 3194} {"train_loss": -24.682523727416992, "global_step": 265156, "epoch": 3194} {"train_loss": -24.439001083374023, "global_step": 265157, "epoch": 3194} {"train_loss": -24.774335861206055, "global_step": 265158, "epoch": 3194} {"train_loss": -24.621017456054688, "global_step": 265159, "epoch": 3194} {"train_loss": -25.073698043823242, "global_step": 265160, "epoch": 3194} {"train_loss": -24.384050369262695, "global_step": 265161, "epoch": 3194} {"train_loss": -24.445798873901367, "global_step": 265162, "epoch": 3194} {"train_loss": -25.07547950744629, "global_step": 265163, "epoch": 3194} {"train_loss": -24.354297637939453, "global_step": 265164, "epoch": 3194} {"train_loss": -25.31140899658203, "global_step": 265165, "epoch": 3194} {"train_loss": -24.934019088745117, "global_step": 265166, "epoch": 3194} {"train_loss": -25.052274703979492, "global_step": 265167, "epoch": 3194} {"train_loss": -25.06890869140625, "global_step": 265168, "epoch": 3194} {"train_loss": -25.065929412841797, "global_step": 265169, "epoch": 3194} {"train_loss": -24.850341796875, "global_step": 265170, "epoch": 3194} {"train_loss": -25.458555221557617, "global_step": 265171, "epoch": 3194} {"train_loss": -25.020139694213867, "global_step": 265172, "epoch": 3194} {"train_loss": -25.37131118774414, "global_step": 265173, "epoch": 3194} {"train_loss": -24.743640899658203, "global_step": 265174, "epoch": 3194} {"train_loss": -25.200544357299805, "global_step": 265175, "epoch": 3194} {"train_loss": -24.83052635192871, "global_step": 265176, "epoch": 3194} {"train_loss": -25.23756980895996, "global_step": 265177, "epoch": 3194} {"train_loss": -25.065372467041016, "global_step": 265178, "epoch": 3194} {"train_loss": -25.262174606323242, "global_step": 265179, "epoch": 3194} {"train_loss": -25.048429489135742, "global_step": 265180, "epoch": 3194} {"train_loss": -25.269947052001953, "global_step": 265181, "epoch": 3194} {"train_loss": -25.276050567626953, "global_step": 265182, "epoch": 3194} {"train_loss": -25.548519134521484, "global_step": 265183, "epoch": 3194} {"train_loss": -25.010310437305865, "global_step": 265184, "epoch": 3194, "val_loss": 6962177.0} {"train_loss": -24.58645248413086, "global_step": 265185, "epoch": 3195} {"train_loss": -24.09793472290039, "global_step": 265186, "epoch": 3195} {"train_loss": -24.62395477294922, "global_step": 265187, "epoch": 3195} {"train_loss": -24.764034271240234, "global_step": 265188, "epoch": 3195} {"train_loss": -24.670625686645508, "global_step": 265189, "epoch": 3195} {"train_loss": -25.023740768432617, "global_step": 265190, "epoch": 3195} {"train_loss": -24.8654842376709, "global_step": 265191, "epoch": 3195} {"train_loss": -25.014883041381836, "global_step": 265192, "epoch": 3195} {"train_loss": -24.81492805480957, "global_step": 265193, "epoch": 3195} {"train_loss": -25.09218978881836, "global_step": 265194, "epoch": 3195} {"train_loss": -24.9898738861084, "global_step": 265195, "epoch": 3195} {"train_loss": -25.00825309753418, "global_step": 265196, "epoch": 3195} {"train_loss": -24.805789947509766, "global_step": 265197, "epoch": 3195} {"train_loss": -25.161848068237305, "global_step": 265198, "epoch": 3195} {"train_loss": -25.26252555847168, "global_step": 265199, "epoch": 3195} {"train_loss": -25.082189559936523, "global_step": 265200, "epoch": 3195} {"train_loss": -25.1912784576416, "global_step": 265201, "epoch": 3195} {"train_loss": -25.123626708984375, "global_step": 265202, "epoch": 3195} {"train_loss": -25.273618698120117, "global_step": 265203, "epoch": 3195} {"train_loss": -25.541906356811523, "global_step": 265204, "epoch": 3195} {"train_loss": -25.090126037597656, "global_step": 265205, "epoch": 3195} {"train_loss": -25.082168579101562, "global_step": 265206, "epoch": 3195} {"train_loss": -25.085599899291992, "global_step": 265207, "epoch": 3195} {"train_loss": -25.30457878112793, "global_step": 265208, "epoch": 3195} {"train_loss": -25.54831886291504, "global_step": 265209, "epoch": 3195} {"train_loss": -24.915647506713867, "global_step": 265210, "epoch": 3195} {"train_loss": -25.398542404174805, "global_step": 265211, "epoch": 3195} {"train_loss": -25.414810180664062, "global_step": 265212, "epoch": 3195} {"train_loss": -25.657154083251953, "global_step": 265213, "epoch": 3195} {"train_loss": -25.31776237487793, "global_step": 265214, "epoch": 3195} {"train_loss": -25.647680282592773, "global_step": 265215, "epoch": 3195} {"train_loss": -25.23773193359375, "global_step": 265216, "epoch": 3195} {"train_loss": -25.060468673706055, "global_step": 265217, "epoch": 3195} {"train_loss": -25.099985122680664, "global_step": 265218, "epoch": 3195} {"train_loss": -25.384611129760742, "global_step": 265219, "epoch": 3195} {"train_loss": -24.913801193237305, "global_step": 265220, "epoch": 3195} {"train_loss": -25.47175407409668, "global_step": 265221, "epoch": 3195} {"train_loss": -25.335987091064453, "global_step": 265222, "epoch": 3195} {"train_loss": -25.214906692504883, "global_step": 265223, "epoch": 3195} {"train_loss": -25.41815185546875, "global_step": 265224, "epoch": 3195} {"train_loss": -25.129608154296875, "global_step": 265225, "epoch": 3195} {"train_loss": -24.913284301757812, "global_step": 265226, "epoch": 3195} {"train_loss": -25.194135665893555, "global_step": 265227, "epoch": 3195} {"train_loss": -25.168981552124023, "global_step": 265228, "epoch": 3195} {"train_loss": -25.13335418701172, "global_step": 265229, "epoch": 3195} {"train_loss": -25.4526424407959, "global_step": 265230, "epoch": 3195} {"train_loss": -25.499053955078125, "global_step": 265231, "epoch": 3195} {"train_loss": -25.171802520751953, "global_step": 265232, "epoch": 3195} {"train_loss": -25.05855369567871, "global_step": 265233, "epoch": 3195} {"train_loss": -25.7883243560791, "global_step": 265234, "epoch": 3195} {"train_loss": -25.231321334838867, "global_step": 265235, "epoch": 3195} {"train_loss": -25.219871520996094, "global_step": 265236, "epoch": 3195} {"train_loss": -25.00878143310547, "global_step": 265237, "epoch": 3195} {"train_loss": -25.403167724609375, "global_step": 265238, "epoch": 3195} {"train_loss": -25.06366539001465, "global_step": 265239, "epoch": 3195} {"train_loss": -25.1177978515625, "global_step": 265240, "epoch": 3195} {"train_loss": -25.408973693847656, "global_step": 265241, "epoch": 3195} {"train_loss": -24.897287368774414, "global_step": 265242, "epoch": 3195} {"train_loss": -24.995397567749023, "global_step": 265243, "epoch": 3195} {"train_loss": -25.022533416748047, "global_step": 265244, "epoch": 3195} {"train_loss": -25.63758659362793, "global_step": 265245, "epoch": 3195} {"train_loss": -24.901113510131836, "global_step": 265246, "epoch": 3195} {"train_loss": -25.09113121032715, "global_step": 265247, "epoch": 3195} {"train_loss": -25.25849723815918, "global_step": 265248, "epoch": 3195} {"train_loss": -25.124181747436523, "global_step": 265249, "epoch": 3195} {"train_loss": -25.140066146850586, "global_step": 265250, "epoch": 3195} {"train_loss": -25.01168441772461, "global_step": 265251, "epoch": 3195} {"train_loss": -25.188297271728516, "global_step": 265252, "epoch": 3195} {"train_loss": -25.5075740814209, "global_step": 265253, "epoch": 3195} {"train_loss": -25.21014976501465, "global_step": 265254, "epoch": 3195} {"train_loss": -25.130168914794922, "global_step": 265255, "epoch": 3195} {"train_loss": -25.07694435119629, "global_step": 265256, "epoch": 3195} {"train_loss": -25.455617904663086, "global_step": 265257, "epoch": 3195} {"train_loss": -25.65456199645996, "global_step": 265258, "epoch": 3195} {"train_loss": -25.230131149291992, "global_step": 265259, "epoch": 3195} {"train_loss": -25.61151123046875, "global_step": 265260, "epoch": 3195} {"train_loss": -25.02128028869629, "global_step": 265261, "epoch": 3195} {"train_loss": -25.283987045288086, "global_step": 265262, "epoch": 3195} {"train_loss": -25.099077224731445, "global_step": 265263, "epoch": 3195} {"train_loss": -25.657346725463867, "global_step": 265264, "epoch": 3195} {"train_loss": -25.259977340698242, "global_step": 265265, "epoch": 3195} {"train_loss": -25.16196632385254, "global_step": 265266, "epoch": 3195} {"train_loss": -25.168972819684498, "global_step": 265267, "epoch": 3195, "val_loss": 6942898.0} {"train_loss": -24.583969116210938, "global_step": 265268, "epoch": 3196} {"train_loss": -25.365589141845703, "global_step": 265269, "epoch": 3196} {"train_loss": -24.783823013305664, "global_step": 265270, "epoch": 3196} {"train_loss": -24.937345504760742, "global_step": 265271, "epoch": 3196} {"train_loss": -25.092649459838867, "global_step": 265272, "epoch": 3196} {"train_loss": -24.256818771362305, "global_step": 265273, "epoch": 3196} {"train_loss": -24.93958854675293, "global_step": 265274, "epoch": 3196} {"train_loss": -24.744373321533203, "global_step": 265275, "epoch": 3196} {"train_loss": -25.042043685913086, "global_step": 265276, "epoch": 3196} {"train_loss": -25.02141761779785, "global_step": 265277, "epoch": 3196} {"train_loss": -25.12593650817871, "global_step": 265278, "epoch": 3196} {"train_loss": -25.27017593383789, "global_step": 265279, "epoch": 3196} {"train_loss": -25.186084747314453, "global_step": 265280, "epoch": 3196} {"train_loss": -24.929439544677734, "global_step": 265281, "epoch": 3196} {"train_loss": -25.085193634033203, "global_step": 265282, "epoch": 3196} {"train_loss": -25.09625816345215, "global_step": 265283, "epoch": 3196} {"train_loss": -25.36685562133789, "global_step": 265284, "epoch": 3196} {"train_loss": -25.095264434814453, "global_step": 265285, "epoch": 3196} {"train_loss": -24.936426162719727, "global_step": 265286, "epoch": 3196} {"train_loss": -24.779495239257812, "global_step": 265287, "epoch": 3196} {"train_loss": -25.8067626953125, "global_step": 265288, "epoch": 3196} {"train_loss": -25.09760093688965, "global_step": 265289, "epoch": 3196} {"train_loss": -24.97254753112793, "global_step": 265290, "epoch": 3196} {"train_loss": -25.04128646850586, "global_step": 265291, "epoch": 3196} {"train_loss": -24.976654052734375, "global_step": 265292, "epoch": 3196} {"train_loss": -25.23107147216797, "global_step": 265293, "epoch": 3196} {"train_loss": -24.96847915649414, "global_step": 265294, "epoch": 3196} {"train_loss": -25.431724548339844, "global_step": 265295, "epoch": 3196} {"train_loss": -24.963924407958984, "global_step": 265296, "epoch": 3196} {"train_loss": -25.359479904174805, "global_step": 265297, "epoch": 3196} {"train_loss": -25.206140518188477, "global_step": 265298, "epoch": 3196} {"train_loss": -25.685016632080078, "global_step": 265299, "epoch": 3196} {"train_loss": -25.2493839263916, "global_step": 265300, "epoch": 3196} {"train_loss": -24.896026611328125, "global_step": 265301, "epoch": 3196} {"train_loss": -25.50946044921875, "global_step": 265302, "epoch": 3196} {"train_loss": -25.416635513305664, "global_step": 265303, "epoch": 3196} {"train_loss": -25.493497848510742, "global_step": 265304, "epoch": 3196} {"train_loss": -25.07383918762207, "global_step": 265305, "epoch": 3196} {"train_loss": -25.23685073852539, "global_step": 265306, "epoch": 3196} {"train_loss": -25.38975715637207, "global_step": 265307, "epoch": 3196} {"train_loss": -25.16974449157715, "global_step": 265308, "epoch": 3196} {"train_loss": -25.020116806030273, "global_step": 265309, "epoch": 3196} {"train_loss": -24.94359016418457, "global_step": 265310, "epoch": 3196} {"train_loss": -25.460309982299805, "global_step": 265311, "epoch": 3196} {"train_loss": -24.999059677124023, "global_step": 265312, "epoch": 3196} {"train_loss": -24.99411964416504, "global_step": 265313, "epoch": 3196} {"train_loss": -24.8752384185791, "global_step": 265314, "epoch": 3196} {"train_loss": -24.858381271362305, "global_step": 265315, "epoch": 3196} {"train_loss": -25.381799697875977, "global_step": 265316, "epoch": 3196} {"train_loss": -24.852069854736328, "global_step": 265317, "epoch": 3196} {"train_loss": -25.422473907470703, "global_step": 265318, "epoch": 3196} {"train_loss": -25.452770233154297, "global_step": 265319, "epoch": 3196} {"train_loss": -25.794397354125977, "global_step": 265320, "epoch": 3196} {"train_loss": -24.807621002197266, "global_step": 265321, "epoch": 3196} {"train_loss": -25.216257095336914, "global_step": 265322, "epoch": 3196} {"train_loss": -25.381254196166992, "global_step": 265323, "epoch": 3196} {"train_loss": -25.5518856048584, "global_step": 265324, "epoch": 3196} {"train_loss": -25.228124618530273, "global_step": 265325, "epoch": 3196} {"train_loss": -25.429828643798828, "global_step": 265326, "epoch": 3196} {"train_loss": -24.973617553710938, "global_step": 265327, "epoch": 3196} {"train_loss": -25.051082611083984, "global_step": 265328, "epoch": 3196} {"train_loss": -25.06597328186035, "global_step": 265329, "epoch": 3196} {"train_loss": -25.331403732299805, "global_step": 265330, "epoch": 3196} {"train_loss": -25.067604064941406, "global_step": 265331, "epoch": 3196} {"train_loss": -25.314340591430664, "global_step": 265332, "epoch": 3196} {"train_loss": -25.26408576965332, "global_step": 265333, "epoch": 3196} {"train_loss": -25.42451286315918, "global_step": 265334, "epoch": 3196} {"train_loss": -25.638437271118164, "global_step": 265335, "epoch": 3196} {"train_loss": -25.564329147338867, "global_step": 265336, "epoch": 3196} {"train_loss": -25.647708892822266, "global_step": 265337, "epoch": 3196} {"train_loss": -25.2563533782959, "global_step": 265338, "epoch": 3196} {"train_loss": -25.587106704711914, "global_step": 265339, "epoch": 3196} {"train_loss": -25.469690322875977, "global_step": 265340, "epoch": 3196} {"train_loss": -25.244924545288086, "global_step": 265341, "epoch": 3196} {"train_loss": -25.387649536132812, "global_step": 265342, "epoch": 3196} {"train_loss": -25.459394454956055, "global_step": 265343, "epoch": 3196} {"train_loss": -25.056915283203125, "global_step": 265344, "epoch": 3196} {"train_loss": -25.42758560180664, "global_step": 265345, "epoch": 3196} {"train_loss": -25.264328002929688, "global_step": 265346, "epoch": 3196} {"train_loss": -25.2905330657959, "global_step": 265347, "epoch": 3196} {"train_loss": -24.558752059936523, "global_step": 265348, "epoch": 3196} {"train_loss": -23.50393295288086, "global_step": 265349, "epoch": 3196} {"train_loss": -25.15149139496217, "global_step": 265350, "epoch": 3196, "val_loss": 7108804.0} {"train_loss": -24.038223266601562, "global_step": 265351, "epoch": 3197} {"train_loss": -21.90806770324707, "global_step": 265352, "epoch": 3197} {"train_loss": -23.723968505859375, "global_step": 265353, "epoch": 3197} {"train_loss": -22.751741409301758, "global_step": 265354, "epoch": 3197} {"train_loss": -23.11075210571289, "global_step": 265355, "epoch": 3197} {"train_loss": -23.764371871948242, "global_step": 265356, "epoch": 3197} {"train_loss": -23.6680965423584, "global_step": 265357, "epoch": 3197} {"train_loss": -23.580745697021484, "global_step": 265358, "epoch": 3197} {"train_loss": -24.030324935913086, "global_step": 265359, "epoch": 3197} {"train_loss": -23.948257446289062, "global_step": 265360, "epoch": 3197} {"train_loss": -23.98666763305664, "global_step": 265361, "epoch": 3197} {"train_loss": -24.544843673706055, "global_step": 265362, "epoch": 3197} {"train_loss": -24.271512985229492, "global_step": 265363, "epoch": 3197} {"train_loss": -24.496158599853516, "global_step": 265364, "epoch": 3197} {"train_loss": -24.49602699279785, "global_step": 265365, "epoch": 3197} {"train_loss": -24.345884323120117, "global_step": 265366, "epoch": 3197} {"train_loss": -24.52235221862793, "global_step": 265367, "epoch": 3197} {"train_loss": -24.475584030151367, "global_step": 265368, "epoch": 3197} {"train_loss": -24.60321807861328, "global_step": 265369, "epoch": 3197} {"train_loss": -24.47389030456543, "global_step": 265370, "epoch": 3197} {"train_loss": -24.845869064331055, "global_step": 265371, "epoch": 3197} {"train_loss": -24.58210563659668, "global_step": 265372, "epoch": 3197} {"train_loss": -24.789794921875, "global_step": 265373, "epoch": 3197} {"train_loss": -24.596189498901367, "global_step": 265374, "epoch": 3197} {"train_loss": -24.67937469482422, "global_step": 265375, "epoch": 3197} {"train_loss": -24.8179874420166, "global_step": 265376, "epoch": 3197} {"train_loss": -24.570180892944336, "global_step": 265377, "epoch": 3197} {"train_loss": -24.629928588867188, "global_step": 265378, "epoch": 3197} {"train_loss": -25.206558227539062, "global_step": 265379, "epoch": 3197} {"train_loss": -25.091745376586914, "global_step": 265380, "epoch": 3197} {"train_loss": -24.88563346862793, "global_step": 265381, "epoch": 3197} {"train_loss": -24.703792572021484, "global_step": 265382, "epoch": 3197} {"train_loss": -25.106277465820312, "global_step": 265383, "epoch": 3197} {"train_loss": -24.48615837097168, "global_step": 265384, "epoch": 3197} {"train_loss": -25.003623962402344, "global_step": 265385, "epoch": 3197} {"train_loss": -24.94571876525879, "global_step": 265386, "epoch": 3197} {"train_loss": -25.130535125732422, "global_step": 265387, "epoch": 3197} {"train_loss": -25.176681518554688, "global_step": 265388, "epoch": 3197} {"train_loss": -25.089279174804688, "global_step": 265389, "epoch": 3197} {"train_loss": -25.377046585083008, "global_step": 265390, "epoch": 3197} {"train_loss": -25.387256622314453, "global_step": 265391, "epoch": 3197} {"train_loss": -25.421567916870117, "global_step": 265392, "epoch": 3197} {"train_loss": -25.008316040039062, "global_step": 265393, "epoch": 3197} {"train_loss": -25.12118911743164, "global_step": 265394, "epoch": 3197} {"train_loss": -25.498859405517578, "global_step": 265395, "epoch": 3197} {"train_loss": -25.412456512451172, "global_step": 265396, "epoch": 3197} {"train_loss": -25.50020980834961, "global_step": 265397, "epoch": 3197} {"train_loss": -25.3696346282959, "global_step": 265398, "epoch": 3197} {"train_loss": -25.34377098083496, "global_step": 265399, "epoch": 3197} {"train_loss": -25.448314666748047, "global_step": 265400, "epoch": 3197} {"train_loss": -25.280630111694336, "global_step": 265401, "epoch": 3197} {"train_loss": -25.281217575073242, "global_step": 265402, "epoch": 3197} {"train_loss": -25.167728424072266, "global_step": 265403, "epoch": 3197} {"train_loss": -25.377395629882812, "global_step": 265404, "epoch": 3197} {"train_loss": -25.02237892150879, "global_step": 265405, "epoch": 3197} {"train_loss": -24.8710994720459, "global_step": 265406, "epoch": 3197} {"train_loss": -25.337688446044922, "global_step": 265407, "epoch": 3197} {"train_loss": -25.367881774902344, "global_step": 265408, "epoch": 3197} {"train_loss": -25.37849998474121, "global_step": 265409, "epoch": 3197} {"train_loss": -25.142934799194336, "global_step": 265410, "epoch": 3197} {"train_loss": -25.214380264282227, "global_step": 265411, "epoch": 3197} {"train_loss": -25.157453536987305, "global_step": 265412, "epoch": 3197} {"train_loss": -25.290231704711914, "global_step": 265413, "epoch": 3197} {"train_loss": -25.182798385620117, "global_step": 265414, "epoch": 3197} {"train_loss": -25.54996109008789, "global_step": 265415, "epoch": 3197} {"train_loss": -25.36579704284668, "global_step": 265416, "epoch": 3197} {"train_loss": -25.398517608642578, "global_step": 265417, "epoch": 3197} {"train_loss": -25.492263793945312, "global_step": 265418, "epoch": 3197} {"train_loss": -25.850589752197266, "global_step": 265419, "epoch": 3197} {"train_loss": -25.20493507385254, "global_step": 265420, "epoch": 3197} {"train_loss": -25.157312393188477, "global_step": 265421, "epoch": 3197} {"train_loss": -25.233335494995117, "global_step": 265422, "epoch": 3197} {"train_loss": -25.387266159057617, "global_step": 265423, "epoch": 3197} {"train_loss": -25.226781845092773, "global_step": 265424, "epoch": 3197} {"train_loss": -25.47784996032715, "global_step": 265425, "epoch": 3197} {"train_loss": -25.19818115234375, "global_step": 265426, "epoch": 3197} {"train_loss": -25.58273696899414, "global_step": 265427, "epoch": 3197} {"train_loss": -25.10738182067871, "global_step": 265428, "epoch": 3197} {"train_loss": -25.33103370666504, "global_step": 265429, "epoch": 3197} {"train_loss": -24.98876190185547, "global_step": 265430, "epoch": 3197} {"train_loss": -25.327533721923828, "global_step": 265431, "epoch": 3197} {"train_loss": -25.178569793701172, "global_step": 265432, "epoch": 3197} {"train_loss": -24.87792366671275, "global_step": 265433, "epoch": 3197, "val_loss": 6968984.0} {"train_loss": -24.192840576171875, "global_step": 265434, "epoch": 3198} {"train_loss": -20.8199405670166, "global_step": 265435, "epoch": 3198} {"train_loss": -22.657560348510742, "global_step": 265436, "epoch": 3198} {"train_loss": -24.179763793945312, "global_step": 265437, "epoch": 3198} {"train_loss": -23.646581649780273, "global_step": 265438, "epoch": 3198} {"train_loss": -23.872167587280273, "global_step": 265439, "epoch": 3198} {"train_loss": -24.459447860717773, "global_step": 265440, "epoch": 3198} {"train_loss": -23.75653648376465, "global_step": 265441, "epoch": 3198} {"train_loss": -24.344297409057617, "global_step": 265442, "epoch": 3198} {"train_loss": -23.735187530517578, "global_step": 265443, "epoch": 3198} {"train_loss": -24.457727432250977, "global_step": 265444, "epoch": 3198} {"train_loss": -24.39433479309082, "global_step": 265445, "epoch": 3198} {"train_loss": -24.506345748901367, "global_step": 265446, "epoch": 3198} {"train_loss": -24.137556076049805, "global_step": 265447, "epoch": 3198} {"train_loss": -24.72735023498535, "global_step": 265448, "epoch": 3198} {"train_loss": -24.66281509399414, "global_step": 265449, "epoch": 3198} {"train_loss": -24.395902633666992, "global_step": 265450, "epoch": 3198} {"train_loss": -24.73213005065918, "global_step": 265451, "epoch": 3198} {"train_loss": -24.71319580078125, "global_step": 265452, "epoch": 3198} {"train_loss": -24.5285701751709, "global_step": 265453, "epoch": 3198} {"train_loss": -24.507465362548828, "global_step": 265454, "epoch": 3198} {"train_loss": -25.00528335571289, "global_step": 265455, "epoch": 3198} {"train_loss": -24.643056869506836, "global_step": 265456, "epoch": 3198} {"train_loss": -24.772207260131836, "global_step": 265457, "epoch": 3198} {"train_loss": -24.678268432617188, "global_step": 265458, "epoch": 3198} {"train_loss": -25.37505531311035, "global_step": 265459, "epoch": 3198} {"train_loss": -24.768909454345703, "global_step": 265460, "epoch": 3198} {"train_loss": -25.05301284790039, "global_step": 265461, "epoch": 3198} {"train_loss": -24.859472274780273, "global_step": 265462, "epoch": 3198} {"train_loss": -24.794879913330078, "global_step": 265463, "epoch": 3198} {"train_loss": -24.870981216430664, "global_step": 265464, "epoch": 3198} {"train_loss": -24.914417266845703, "global_step": 265465, "epoch": 3198} {"train_loss": -24.932897567749023, "global_step": 265466, "epoch": 3198} {"train_loss": -24.835824966430664, "global_step": 265467, "epoch": 3198} {"train_loss": -24.785390853881836, "global_step": 265468, "epoch": 3198} {"train_loss": -25.261640548706055, "global_step": 265469, "epoch": 3198} {"train_loss": -25.02676010131836, "global_step": 265470, "epoch": 3198} {"train_loss": -25.09536361694336, "global_step": 265471, "epoch": 3198} {"train_loss": -25.17072296142578, "global_step": 265472, "epoch": 3198} {"train_loss": -25.389484405517578, "global_step": 265473, "epoch": 3198} {"train_loss": -25.451231002807617, "global_step": 265474, "epoch": 3198} {"train_loss": -25.168197631835938, "global_step": 265475, "epoch": 3198} {"train_loss": -25.049715042114258, "global_step": 265476, "epoch": 3198} {"train_loss": -25.323148727416992, "global_step": 265477, "epoch": 3198} {"train_loss": -25.305404663085938, "global_step": 265478, "epoch": 3198} {"train_loss": -25.334218978881836, "global_step": 265479, "epoch": 3198} {"train_loss": -25.202871322631836, "global_step": 265480, "epoch": 3198} {"train_loss": -25.354101181030273, "global_step": 265481, "epoch": 3198} {"train_loss": -25.626712799072266, "global_step": 265482, "epoch": 3198} {"train_loss": -25.206811904907227, "global_step": 265483, "epoch": 3198} {"train_loss": -25.330537796020508, "global_step": 265484, "epoch": 3198} {"train_loss": -25.38287353515625, "global_step": 265485, "epoch": 3198} {"train_loss": -25.375944137573242, "global_step": 265486, "epoch": 3198} {"train_loss": -25.131488800048828, "global_step": 265487, "epoch": 3198} {"train_loss": -25.48206901550293, "global_step": 265488, "epoch": 3198} {"train_loss": -25.206212997436523, "global_step": 265489, "epoch": 3198} {"train_loss": -25.12505531311035, "global_step": 265490, "epoch": 3198} {"train_loss": -25.30586051940918, "global_step": 265491, "epoch": 3198} {"train_loss": -25.325241088867188, "global_step": 265492, "epoch": 3198} {"train_loss": -25.436262130737305, "global_step": 265493, "epoch": 3198} {"train_loss": -25.180604934692383, "global_step": 265494, "epoch": 3198} {"train_loss": -25.418508529663086, "global_step": 265495, "epoch": 3198} {"train_loss": -25.150428771972656, "global_step": 265496, "epoch": 3198} {"train_loss": -25.37993812561035, "global_step": 265497, "epoch": 3198} {"train_loss": -25.17649269104004, "global_step": 265498, "epoch": 3198} {"train_loss": -25.519861221313477, "global_step": 265499, "epoch": 3198} {"train_loss": -25.632232666015625, "global_step": 265500, "epoch": 3198} {"train_loss": -25.10350227355957, "global_step": 265501, "epoch": 3198} {"train_loss": -25.249656677246094, "global_step": 265502, "epoch": 3198} {"train_loss": -25.516433715820312, "global_step": 265503, "epoch": 3198} {"train_loss": -25.511804580688477, "global_step": 265504, "epoch": 3198} {"train_loss": -25.345273971557617, "global_step": 265505, "epoch": 3198} {"train_loss": -25.506500244140625, "global_step": 265506, "epoch": 3198} {"train_loss": -25.123004913330078, "global_step": 265507, "epoch": 3198} {"train_loss": -25.671361923217773, "global_step": 265508, "epoch": 3198} {"train_loss": -25.256582260131836, "global_step": 265509, "epoch": 3198} {"train_loss": -25.520706176757812, "global_step": 265510, "epoch": 3198} {"train_loss": -25.575117111206055, "global_step": 265511, "epoch": 3198} {"train_loss": -25.366880416870117, "global_step": 265512, "epoch": 3198} {"train_loss": -25.72564125061035, "global_step": 265513, "epoch": 3198} {"train_loss": -25.0928897857666, "global_step": 265514, "epoch": 3198} {"train_loss": -25.14385986328125, "global_step": 265515, "epoch": 3198} {"train_loss": -24.92876337809735, "global_step": 265516, "epoch": 3198, "val_loss": 6970789.0} {"train_loss": -24.49567222595215, "global_step": 265517, "epoch": 3199} {"train_loss": -23.655378341674805, "global_step": 265518, "epoch": 3199} {"train_loss": -23.87955093383789, "global_step": 265519, "epoch": 3199} {"train_loss": -24.602176666259766, "global_step": 265520, "epoch": 3199} {"train_loss": -24.496540069580078, "global_step": 265521, "epoch": 3199} {"train_loss": -23.59247398376465, "global_step": 265522, "epoch": 3199} {"train_loss": -24.91089630126953, "global_step": 265523, "epoch": 3199} {"train_loss": -24.89423179626465, "global_step": 265524, "epoch": 3199} {"train_loss": -24.83164405822754, "global_step": 265525, "epoch": 3199} {"train_loss": -24.82691764831543, "global_step": 265526, "epoch": 3199} {"train_loss": -25.213665008544922, "global_step": 265527, "epoch": 3199} {"train_loss": -24.83176040649414, "global_step": 265528, "epoch": 3199} {"train_loss": -24.74228858947754, "global_step": 265529, "epoch": 3199} {"train_loss": -24.7210636138916, "global_step": 265530, "epoch": 3199} {"train_loss": -24.94258689880371, "global_step": 265531, "epoch": 3199} {"train_loss": -24.635663986206055, "global_step": 265532, "epoch": 3199} {"train_loss": -24.928014755249023, "global_step": 265533, "epoch": 3199} {"train_loss": -25.169605255126953, "global_step": 265534, "epoch": 3199} {"train_loss": -24.99879264831543, "global_step": 265535, "epoch": 3199} {"train_loss": -24.901376724243164, "global_step": 265536, "epoch": 3199} {"train_loss": -24.804874420166016, "global_step": 265537, "epoch": 3199} {"train_loss": -25.110370635986328, "global_step": 265538, "epoch": 3199} {"train_loss": -25.2138729095459, "global_step": 265539, "epoch": 3199} {"train_loss": -24.77086067199707, "global_step": 265540, "epoch": 3199} {"train_loss": -25.003849029541016, "global_step": 265541, "epoch": 3199} {"train_loss": -25.245458602905273, "global_step": 265542, "epoch": 3199} {"train_loss": -25.073209762573242, "global_step": 265543, "epoch": 3199} {"train_loss": -24.843856811523438, "global_step": 265544, "epoch": 3199} {"train_loss": -25.265132904052734, "global_step": 265545, "epoch": 3199} {"train_loss": -24.951351165771484, "global_step": 265546, "epoch": 3199} {"train_loss": -25.279508590698242, "global_step": 265547, "epoch": 3199} {"train_loss": -25.0609073638916, "global_step": 265548, "epoch": 3199} {"train_loss": -25.254535675048828, "global_step": 265549, "epoch": 3199} {"train_loss": -25.181570053100586, "global_step": 265550, "epoch": 3199} {"train_loss": -25.128931045532227, "global_step": 265551, "epoch": 3199} {"train_loss": -25.118961334228516, "global_step": 265552, "epoch": 3199} {"train_loss": -25.22870445251465, "global_step": 265553, "epoch": 3199} {"train_loss": -25.096511840820312, "global_step": 265554, "epoch": 3199} {"train_loss": -25.206602096557617, "global_step": 265555, "epoch": 3199} {"train_loss": -25.155176162719727, "global_step": 265556, "epoch": 3199} {"train_loss": -25.441312789916992, "global_step": 265557, "epoch": 3199} {"train_loss": -25.35186195373535, "global_step": 265558, "epoch": 3199} {"train_loss": -25.686920166015625, "global_step": 265559, "epoch": 3199} {"train_loss": -25.316059112548828, "global_step": 265560, "epoch": 3199} {"train_loss": -25.697912216186523, "global_step": 265561, "epoch": 3199} {"train_loss": -25.461477279663086, "global_step": 265562, "epoch": 3199} {"train_loss": -25.48126792907715, "global_step": 265563, "epoch": 3199} {"train_loss": -25.231136322021484, "global_step": 265564, "epoch": 3199} {"train_loss": -25.676620483398438, "global_step": 265565, "epoch": 3199} {"train_loss": -25.727163314819336, "global_step": 265566, "epoch": 3199} {"train_loss": -25.36627197265625, "global_step": 265567, "epoch": 3199} {"train_loss": -25.655298233032227, "global_step": 265568, "epoch": 3199} {"train_loss": -25.383899688720703, "global_step": 265569, "epoch": 3199} {"train_loss": -25.654163360595703, "global_step": 265570, "epoch": 3199} {"train_loss": -25.451303482055664, "global_step": 265571, "epoch": 3199} {"train_loss": -25.563617706298828, "global_step": 265572, "epoch": 3199} {"train_loss": -25.520153045654297, "global_step": 265573, "epoch": 3199} {"train_loss": -25.763784408569336, "global_step": 265574, "epoch": 3199} {"train_loss": -24.90745735168457, "global_step": 265575, "epoch": 3199} {"train_loss": -25.078603744506836, "global_step": 265576, "epoch": 3199} {"train_loss": -24.952260971069336, "global_step": 265577, "epoch": 3199} {"train_loss": -25.22678565979004, "global_step": 265578, "epoch": 3199} {"train_loss": -24.982120513916016, "global_step": 265579, "epoch": 3199} {"train_loss": -24.9517822265625, "global_step": 265580, "epoch": 3199} {"train_loss": -25.382858276367188, "global_step": 265581, "epoch": 3199} {"train_loss": -25.46986961364746, "global_step": 265582, "epoch": 3199} {"train_loss": -25.357013702392578, "global_step": 265583, "epoch": 3199} {"train_loss": -25.35300064086914, "global_step": 265584, "epoch": 3199} {"train_loss": -24.966310501098633, "global_step": 265585, "epoch": 3199} {"train_loss": -25.3883056640625, "global_step": 265586, "epoch": 3199} {"train_loss": -25.203128814697266, "global_step": 265587, "epoch": 3199} {"train_loss": -25.006492614746094, "global_step": 265588, "epoch": 3199} {"train_loss": -25.136465072631836, "global_step": 265589, "epoch": 3199} {"train_loss": -25.430221557617188, "global_step": 265590, "epoch": 3199} {"train_loss": -25.137357711791992, "global_step": 265591, "epoch": 3199} {"train_loss": -25.32867431640625, "global_step": 265592, "epoch": 3199} {"train_loss": -25.147615432739258, "global_step": 265593, "epoch": 3199} {"train_loss": -25.409727096557617, "global_step": 265594, "epoch": 3199} {"train_loss": -25.274904251098633, "global_step": 265595, "epoch": 3199} {"train_loss": -25.084623336791992, "global_step": 265596, "epoch": 3199} {"train_loss": -25.109254837036133, "global_step": 265597, "epoch": 3199} {"train_loss": -25.197681427001953, "global_step": 265598, "epoch": 3199} {"train_loss": -25.126842200037945, "global_step": 265599, "epoch": 3199, "val_loss": 6914345.0} {"train_loss": -25.14312171936035, "global_step": 265600, "epoch": 3200} {"train_loss": -24.79095458984375, "global_step": 265601, "epoch": 3200} {"train_loss": -25.257667541503906, "global_step": 265602, "epoch": 3200} {"train_loss": -25.098125457763672, "global_step": 265603, "epoch": 3200} {"train_loss": -24.521753311157227, "global_step": 265604, "epoch": 3200} {"train_loss": -25.29131317138672, "global_step": 265605, "epoch": 3200} {"train_loss": -25.505292892456055, "global_step": 265606, "epoch": 3200} {"train_loss": -25.096149444580078, "global_step": 265607, "epoch": 3200} {"train_loss": -25.04291343688965, "global_step": 265608, "epoch": 3200} {"train_loss": -25.067350387573242, "global_step": 265609, "epoch": 3200} {"train_loss": -24.8776798248291, "global_step": 265610, "epoch": 3200} {"train_loss": -25.662256240844727, "global_step": 265611, "epoch": 3200} {"train_loss": -25.308521270751953, "global_step": 265612, "epoch": 3200} {"train_loss": -25.0722713470459, "global_step": 265613, "epoch": 3200} {"train_loss": -24.864389419555664, "global_step": 265614, "epoch": 3200} {"train_loss": -25.084735870361328, "global_step": 265615, "epoch": 3200} {"train_loss": -25.160659790039062, "global_step": 265616, "epoch": 3200} {"train_loss": -24.880002975463867, "global_step": 265617, "epoch": 3200} {"train_loss": -25.4307918548584, "global_step": 265618, "epoch": 3200} {"train_loss": -25.299442291259766, "global_step": 265619, "epoch": 3200} {"train_loss": -25.1093807220459, "global_step": 265620, "epoch": 3200} {"train_loss": -25.29216194152832, "global_step": 265621, "epoch": 3200} {"train_loss": -25.763992309570312, "global_step": 265622, "epoch": 3200} {"train_loss": -25.17743492126465, "global_step": 265623, "epoch": 3200} {"train_loss": -25.359970092773438, "global_step": 265624, "epoch": 3200} {"train_loss": -24.950952529907227, "global_step": 265625, "epoch": 3200} {"train_loss": -25.042465209960938, "global_step": 265626, "epoch": 3200} {"train_loss": -25.39051628112793, "global_step": 265627, "epoch": 3200} {"train_loss": -25.046506881713867, "global_step": 265628, "epoch": 3200} {"train_loss": -25.191030502319336, "global_step": 265629, "epoch": 3200} {"train_loss": -25.428741455078125, "global_step": 265630, "epoch": 3200} {"train_loss": -25.3377742767334, "global_step": 265631, "epoch": 3200} {"train_loss": -25.62764549255371, "global_step": 265632, "epoch": 3200} {"train_loss": -25.52460289001465, "global_step": 265633, "epoch": 3200} {"train_loss": -25.5841064453125, "global_step": 265634, "epoch": 3200} {"train_loss": -25.249916076660156, "global_step": 265635, "epoch": 3200} {"train_loss": -25.068038940429688, "global_step": 265636, "epoch": 3200} {"train_loss": -25.64198875427246, "global_step": 265637, "epoch": 3200} {"train_loss": -25.444046020507812, "global_step": 265638, "epoch": 3200} {"train_loss": -24.884674072265625, "global_step": 265639, "epoch": 3200} {"train_loss": -25.537412643432617, "global_step": 265640, "epoch": 3200} {"train_loss": -25.1649227142334, "global_step": 265641, "epoch": 3200} {"train_loss": -25.132720947265625, "global_step": 265642, "epoch": 3200} {"train_loss": -24.97262954711914, "global_step": 265643, "epoch": 3200} {"train_loss": -25.272836685180664, "global_step": 265644, "epoch": 3200} {"train_loss": -25.254728317260742, "global_step": 265645, "epoch": 3200} {"train_loss": -24.887453079223633, "global_step": 265646, "epoch": 3200} {"train_loss": -24.4329891204834, "global_step": 265647, "epoch": 3200} {"train_loss": -25.17299461364746, "global_step": 265648, "epoch": 3200} {"train_loss": -25.218137741088867, "global_step": 265649, "epoch": 3200} {"train_loss": -25.122114181518555, "global_step": 265650, "epoch": 3200} {"train_loss": -24.549381256103516, "global_step": 265651, "epoch": 3200} {"train_loss": -25.124021530151367, "global_step": 265652, "epoch": 3200} {"train_loss": -25.17188262939453, "global_step": 265653, "epoch": 3200} {"train_loss": -25.222135543823242, "global_step": 265654, "epoch": 3200} {"train_loss": -24.97602653503418, "global_step": 265655, "epoch": 3200} {"train_loss": -25.36524200439453, "global_step": 265656, "epoch": 3200} {"train_loss": -24.334970474243164, "global_step": 265657, "epoch": 3200} {"train_loss": -24.63806915283203, "global_step": 265658, "epoch": 3200} {"train_loss": -24.79422950744629, "global_step": 265659, "epoch": 3200} {"train_loss": -24.757429122924805, "global_step": 265660, "epoch": 3200} {"train_loss": -24.841135025024414, "global_step": 265661, "epoch": 3200} {"train_loss": -25.437602996826172, "global_step": 265662, "epoch": 3200} {"train_loss": -24.87944984436035, "global_step": 265663, "epoch": 3200} {"train_loss": -25.16712760925293, "global_step": 265664, "epoch": 3200} {"train_loss": -24.9998722076416, "global_step": 265665, "epoch": 3200} {"train_loss": -25.1614990234375, "global_step": 265666, "epoch": 3200} {"train_loss": -25.148300170898438, "global_step": 265667, "epoch": 3200} {"train_loss": -25.03236198425293, "global_step": 265668, "epoch": 3200} {"train_loss": -25.2756290435791, "global_step": 265669, "epoch": 3200} {"train_loss": -25.294527053833008, "global_step": 265670, "epoch": 3200} {"train_loss": -24.957929611206055, "global_step": 265671, "epoch": 3200} {"train_loss": -25.079687118530273, "global_step": 265672, "epoch": 3200} {"train_loss": -25.158620834350586, "global_step": 265673, "epoch": 3200} {"train_loss": -25.248044967651367, "global_step": 265674, "epoch": 3200} {"train_loss": -25.284164428710938, "global_step": 265675, "epoch": 3200} {"train_loss": -25.248531341552734, "global_step": 265676, "epoch": 3200} {"train_loss": -25.482975006103516, "global_step": 265677, "epoch": 3200} {"train_loss": -25.45162010192871, "global_step": 265678, "epoch": 3200} {"train_loss": -25.458765029907227, "global_step": 265679, "epoch": 3200} {"train_loss": -25.444400787353516, "global_step": 265680, "epoch": 3200} {"train_loss": -25.289316177368164, "global_step": 265681, "epoch": 3200} {"train_loss": -25.148894643209065, "global_step": 265682, "epoch": 3200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6931283.0} {"train_loss": -24.26117515563965, "global_step": 265683, "epoch": 3201} {"train_loss": -24.837278366088867, "global_step": 265684, "epoch": 3201} {"train_loss": -24.745176315307617, "global_step": 265685, "epoch": 3201} {"train_loss": -24.636734008789062, "global_step": 265686, "epoch": 3201} {"train_loss": -24.842016220092773, "global_step": 265687, "epoch": 3201} {"train_loss": -24.864288330078125, "global_step": 265688, "epoch": 3201} {"train_loss": -24.705753326416016, "global_step": 265689, "epoch": 3201} {"train_loss": -24.872926712036133, "global_step": 265690, "epoch": 3201} {"train_loss": -25.444263458251953, "global_step": 265691, "epoch": 3201} {"train_loss": -24.727252960205078, "global_step": 265692, "epoch": 3201} {"train_loss": -24.929738998413086, "global_step": 265693, "epoch": 3201} {"train_loss": -25.215415954589844, "global_step": 265694, "epoch": 3201} {"train_loss": -25.360111236572266, "global_step": 265695, "epoch": 3201} {"train_loss": -25.41034698486328, "global_step": 265696, "epoch": 3201} {"train_loss": -24.959253311157227, "global_step": 265697, "epoch": 3201} {"train_loss": -24.9677791595459, "global_step": 265698, "epoch": 3201} {"train_loss": -25.101322174072266, "global_step": 265699, "epoch": 3201} {"train_loss": -24.846263885498047, "global_step": 265700, "epoch": 3201} {"train_loss": -24.81580924987793, "global_step": 265701, "epoch": 3201} {"train_loss": -25.302013397216797, "global_step": 265702, "epoch": 3201} {"train_loss": -25.248952865600586, "global_step": 265703, "epoch": 3201} {"train_loss": -25.519393920898438, "global_step": 265704, "epoch": 3201} {"train_loss": -25.389652252197266, "global_step": 265705, "epoch": 3201} {"train_loss": -25.17705726623535, "global_step": 265706, "epoch": 3201} {"train_loss": -25.09522819519043, "global_step": 265707, "epoch": 3201} {"train_loss": -25.065092086791992, "global_step": 265708, "epoch": 3201} {"train_loss": -25.044767379760742, "global_step": 265709, "epoch": 3201} {"train_loss": -25.02860450744629, "global_step": 265710, "epoch": 3201} {"train_loss": -25.326099395751953, "global_step": 265711, "epoch": 3201} {"train_loss": -25.171052932739258, "global_step": 265712, "epoch": 3201} {"train_loss": -25.630023956298828, "global_step": 265713, "epoch": 3201} {"train_loss": -25.514720916748047, "global_step": 265714, "epoch": 3201} {"train_loss": -25.292011260986328, "global_step": 265715, "epoch": 3201} {"train_loss": -25.53912925720215, "global_step": 265716, "epoch": 3201} {"train_loss": -25.525146484375, "global_step": 265717, "epoch": 3201} {"train_loss": -25.21541404724121, "global_step": 265718, "epoch": 3201} {"train_loss": -25.205175399780273, "global_step": 265719, "epoch": 3201} {"train_loss": -24.959592819213867, "global_step": 265720, "epoch": 3201} {"train_loss": -25.248334884643555, "global_step": 265721, "epoch": 3201} {"train_loss": -25.088438034057617, "global_step": 265722, "epoch": 3201} {"train_loss": -25.67543601989746, "global_step": 265723, "epoch": 3201} {"train_loss": -25.2851505279541, "global_step": 265724, "epoch": 3201} {"train_loss": -25.347856521606445, "global_step": 265725, "epoch": 3201} {"train_loss": -25.653589248657227, "global_step": 265726, "epoch": 3201} {"train_loss": -25.079219818115234, "global_step": 265727, "epoch": 3201} {"train_loss": -25.383014678955078, "global_step": 265728, "epoch": 3201} {"train_loss": -25.097061157226562, "global_step": 265729, "epoch": 3201} {"train_loss": -25.460195541381836, "global_step": 265730, "epoch": 3201} {"train_loss": -24.998910903930664, "global_step": 265731, "epoch": 3201} {"train_loss": -25.049755096435547, "global_step": 265732, "epoch": 3201} {"train_loss": -25.055387496948242, "global_step": 265733, "epoch": 3201} {"train_loss": -25.04423713684082, "global_step": 265734, "epoch": 3201} {"train_loss": -25.074748992919922, "global_step": 265735, "epoch": 3201} {"train_loss": -24.90593910217285, "global_step": 265736, "epoch": 3201} {"train_loss": -25.052875518798828, "global_step": 265737, "epoch": 3201} {"train_loss": -25.25284767150879, "global_step": 265738, "epoch": 3201} {"train_loss": -25.45867347717285, "global_step": 265739, "epoch": 3201} {"train_loss": -25.088529586791992, "global_step": 265740, "epoch": 3201} {"train_loss": -24.791671752929688, "global_step": 265741, "epoch": 3201} {"train_loss": -25.077878952026367, "global_step": 265742, "epoch": 3201} {"train_loss": -25.251911163330078, "global_step": 265743, "epoch": 3201} {"train_loss": -25.25362205505371, "global_step": 265744, "epoch": 3201} {"train_loss": -25.052770614624023, "global_step": 265745, "epoch": 3201} {"train_loss": -24.839420318603516, "global_step": 265746, "epoch": 3201} {"train_loss": -24.852521896362305, "global_step": 265747, "epoch": 3201} {"train_loss": -25.263967514038086, "global_step": 265748, "epoch": 3201} {"train_loss": -25.253263473510742, "global_step": 265749, "epoch": 3201} {"train_loss": -25.25416374206543, "global_step": 265750, "epoch": 3201} {"train_loss": -25.282129287719727, "global_step": 265751, "epoch": 3201} {"train_loss": -25.421091079711914, "global_step": 265752, "epoch": 3201} {"train_loss": -25.050540924072266, "global_step": 265753, "epoch": 3201} {"train_loss": -25.60662841796875, "global_step": 265754, "epoch": 3201} {"train_loss": -25.10872459411621, "global_step": 265755, "epoch": 3201} {"train_loss": -25.34406280517578, "global_step": 265756, "epoch": 3201} {"train_loss": -25.476491928100586, "global_step": 265757, "epoch": 3201} {"train_loss": -25.522180557250977, "global_step": 265758, "epoch": 3201} {"train_loss": -25.492795944213867, "global_step": 265759, "epoch": 3201} {"train_loss": -25.518476486206055, "global_step": 265760, "epoch": 3201} {"train_loss": -25.351118087768555, "global_step": 265761, "epoch": 3201} {"train_loss": -25.105112075805664, "global_step": 265762, "epoch": 3201} {"train_loss": -25.3291015625, "global_step": 265763, "epoch": 3201} {"train_loss": -25.26371955871582, "global_step": 265764, "epoch": 3201} {"train_loss": -25.19555406685335, "global_step": 265765, "epoch": 3201, "val_loss": 6993674.0} {"train_loss": -24.400501251220703, "global_step": 265766, "epoch": 3202} {"train_loss": -24.77508544921875, "global_step": 265767, "epoch": 3202} {"train_loss": -24.531415939331055, "global_step": 265768, "epoch": 3202} {"train_loss": -25.11952018737793, "global_step": 265769, "epoch": 3202} {"train_loss": -24.168685913085938, "global_step": 265770, "epoch": 3202} {"train_loss": -24.814117431640625, "global_step": 265771, "epoch": 3202} {"train_loss": -25.153310775756836, "global_step": 265772, "epoch": 3202} {"train_loss": -24.79756736755371, "global_step": 265773, "epoch": 3202} {"train_loss": -24.456645965576172, "global_step": 265774, "epoch": 3202} {"train_loss": -25.109615325927734, "global_step": 265775, "epoch": 3202} {"train_loss": -24.91096305847168, "global_step": 265776, "epoch": 3202} {"train_loss": -24.754369735717773, "global_step": 265777, "epoch": 3202} {"train_loss": -24.930938720703125, "global_step": 265778, "epoch": 3202} {"train_loss": -25.166391372680664, "global_step": 265779, "epoch": 3202} {"train_loss": -25.09864616394043, "global_step": 265780, "epoch": 3202} {"train_loss": -24.90822410583496, "global_step": 265781, "epoch": 3202} {"train_loss": -25.013303756713867, "global_step": 265782, "epoch": 3202} {"train_loss": -24.899887084960938, "global_step": 265783, "epoch": 3202} {"train_loss": -25.204212188720703, "global_step": 265784, "epoch": 3202} {"train_loss": -24.814123153686523, "global_step": 265785, "epoch": 3202} {"train_loss": -24.991777420043945, "global_step": 265786, "epoch": 3202} {"train_loss": -25.07861328125, "global_step": 265787, "epoch": 3202} {"train_loss": -25.42881202697754, "global_step": 265788, "epoch": 3202} {"train_loss": -25.112937927246094, "global_step": 265789, "epoch": 3202} {"train_loss": -25.38886833190918, "global_step": 265790, "epoch": 3202} {"train_loss": -25.34751319885254, "global_step": 265791, "epoch": 3202} {"train_loss": -25.25824546813965, "global_step": 265792, "epoch": 3202} {"train_loss": -25.374679565429688, "global_step": 265793, "epoch": 3202} {"train_loss": -25.29547691345215, "global_step": 265794, "epoch": 3202} {"train_loss": -25.372739791870117, "global_step": 265795, "epoch": 3202} {"train_loss": -24.97328758239746, "global_step": 265796, "epoch": 3202} {"train_loss": -25.534250259399414, "global_step": 265797, "epoch": 3202} {"train_loss": -25.198915481567383, "global_step": 265798, "epoch": 3202} {"train_loss": -25.244281768798828, "global_step": 265799, "epoch": 3202} {"train_loss": -25.132953643798828, "global_step": 265800, "epoch": 3202} {"train_loss": -25.316686630249023, "global_step": 265801, "epoch": 3202} {"train_loss": -25.50933265686035, "global_step": 265802, "epoch": 3202} {"train_loss": -25.23007583618164, "global_step": 265803, "epoch": 3202} {"train_loss": -25.34065055847168, "global_step": 265804, "epoch": 3202} {"train_loss": -25.222185134887695, "global_step": 265805, "epoch": 3202} {"train_loss": -25.47584342956543, "global_step": 265806, "epoch": 3202} {"train_loss": -24.72957992553711, "global_step": 265807, "epoch": 3202} {"train_loss": -25.355907440185547, "global_step": 265808, "epoch": 3202} {"train_loss": -25.269227981567383, "global_step": 265809, "epoch": 3202} {"train_loss": -25.73060417175293, "global_step": 265810, "epoch": 3202} {"train_loss": -25.45020866394043, "global_step": 265811, "epoch": 3202} {"train_loss": -25.423994064331055, "global_step": 265812, "epoch": 3202} {"train_loss": -25.073719024658203, "global_step": 265813, "epoch": 3202} {"train_loss": -25.548791885375977, "global_step": 265814, "epoch": 3202} {"train_loss": -25.216163635253906, "global_step": 265815, "epoch": 3202} {"train_loss": -25.277334213256836, "global_step": 265816, "epoch": 3202} {"train_loss": -25.187314987182617, "global_step": 265817, "epoch": 3202} {"train_loss": -25.207901000976562, "global_step": 265818, "epoch": 3202} {"train_loss": -25.171463012695312, "global_step": 265819, "epoch": 3202} {"train_loss": -24.80170249938965, "global_step": 265820, "epoch": 3202} {"train_loss": -25.446786880493164, "global_step": 265821, "epoch": 3202} {"train_loss": -25.1214656829834, "global_step": 265822, "epoch": 3202} {"train_loss": -25.3413143157959, "global_step": 265823, "epoch": 3202} {"train_loss": -25.212255477905273, "global_step": 265824, "epoch": 3202} {"train_loss": -25.133434295654297, "global_step": 265825, "epoch": 3202} {"train_loss": -25.293838500976562, "global_step": 265826, "epoch": 3202} {"train_loss": -25.19068717956543, "global_step": 265827, "epoch": 3202} {"train_loss": -25.2880916595459, "global_step": 265828, "epoch": 3202} {"train_loss": -25.22603988647461, "global_step": 265829, "epoch": 3202} {"train_loss": -25.13918113708496, "global_step": 265830, "epoch": 3202} {"train_loss": -25.09347915649414, "global_step": 265831, "epoch": 3202} {"train_loss": -24.78334617614746, "global_step": 265832, "epoch": 3202} {"train_loss": -25.23444175720215, "global_step": 265833, "epoch": 3202} {"train_loss": -25.185476303100586, "global_step": 265834, "epoch": 3202} {"train_loss": -25.21223258972168, "global_step": 265835, "epoch": 3202} {"train_loss": -25.41314697265625, "global_step": 265836, "epoch": 3202} {"train_loss": -24.8483829498291, "global_step": 265837, "epoch": 3202} {"train_loss": -25.46347999572754, "global_step": 265838, "epoch": 3202} {"train_loss": -25.361806869506836, "global_step": 265839, "epoch": 3202} {"train_loss": -25.303647994995117, "global_step": 265840, "epoch": 3202} {"train_loss": -24.947132110595703, "global_step": 265841, "epoch": 3202} {"train_loss": -25.237199783325195, "global_step": 265842, "epoch": 3202} {"train_loss": -25.382205963134766, "global_step": 265843, "epoch": 3202} {"train_loss": -25.16817283630371, "global_step": 265844, "epoch": 3202} {"train_loss": -25.218664169311523, "global_step": 265845, "epoch": 3202} {"train_loss": -24.87799072265625, "global_step": 265846, "epoch": 3202} {"train_loss": -25.278417587280273, "global_step": 265847, "epoch": 3202} {"train_loss": -25.133953301303357, "global_step": 265848, "epoch": 3202, "val_loss": 7076737.0} {"train_loss": -24.40130043029785, "global_step": 265849, "epoch": 3203} {"train_loss": -24.87982749938965, "global_step": 265850, "epoch": 3203} {"train_loss": -24.624692916870117, "global_step": 265851, "epoch": 3203} {"train_loss": -24.937774658203125, "global_step": 265852, "epoch": 3203} {"train_loss": -24.366727828979492, "global_step": 265853, "epoch": 3203} {"train_loss": -24.587467193603516, "global_step": 265854, "epoch": 3203} {"train_loss": -24.647438049316406, "global_step": 265855, "epoch": 3203} {"train_loss": -24.877395629882812, "global_step": 265856, "epoch": 3203} {"train_loss": -25.1494083404541, "global_step": 265857, "epoch": 3203} {"train_loss": -25.060335159301758, "global_step": 265858, "epoch": 3203} {"train_loss": -24.892332077026367, "global_step": 265859, "epoch": 3203} {"train_loss": -24.925373077392578, "global_step": 265860, "epoch": 3203} {"train_loss": -24.962215423583984, "global_step": 265861, "epoch": 3203} {"train_loss": -24.722864151000977, "global_step": 265862, "epoch": 3203} {"train_loss": -24.873334884643555, "global_step": 265863, "epoch": 3203} {"train_loss": -25.020841598510742, "global_step": 265864, "epoch": 3203} {"train_loss": -25.218639373779297, "global_step": 265865, "epoch": 3203} {"train_loss": -24.882205963134766, "global_step": 265866, "epoch": 3203} {"train_loss": -24.984485626220703, "global_step": 265867, "epoch": 3203} {"train_loss": -25.56122398376465, "global_step": 265868, "epoch": 3203} {"train_loss": -25.185510635375977, "global_step": 265869, "epoch": 3203} {"train_loss": -24.933523178100586, "global_step": 265870, "epoch": 3203} {"train_loss": -24.918991088867188, "global_step": 265871, "epoch": 3203} {"train_loss": -24.81064796447754, "global_step": 265872, "epoch": 3203} {"train_loss": -25.123937606811523, "global_step": 265873, "epoch": 3203} {"train_loss": -25.251705169677734, "global_step": 265874, "epoch": 3203} {"train_loss": -25.07027816772461, "global_step": 265875, "epoch": 3203} {"train_loss": -25.162006378173828, "global_step": 265876, "epoch": 3203} {"train_loss": -25.212453842163086, "global_step": 265877, "epoch": 3203} {"train_loss": -25.622968673706055, "global_step": 265878, "epoch": 3203} {"train_loss": -25.41266632080078, "global_step": 265879, "epoch": 3203} {"train_loss": -25.21619987487793, "global_step": 265880, "epoch": 3203} {"train_loss": -25.529870986938477, "global_step": 265881, "epoch": 3203} {"train_loss": -25.41378402709961, "global_step": 265882, "epoch": 3203} {"train_loss": -25.045988082885742, "global_step": 265883, "epoch": 3203} {"train_loss": -25.07210922241211, "global_step": 265884, "epoch": 3203} {"train_loss": -25.46736717224121, "global_step": 265885, "epoch": 3203} {"train_loss": -25.13031005859375, "global_step": 265886, "epoch": 3203} {"train_loss": -25.73687171936035, "global_step": 265887, "epoch": 3203} {"train_loss": -25.18456268310547, "global_step": 265888, "epoch": 3203} {"train_loss": -25.239099502563477, "global_step": 265889, "epoch": 3203} {"train_loss": -25.24106788635254, "global_step": 265890, "epoch": 3203} {"train_loss": -25.126956939697266, "global_step": 265891, "epoch": 3203} {"train_loss": -25.315553665161133, "global_step": 265892, "epoch": 3203} {"train_loss": -25.71820640563965, "global_step": 265893, "epoch": 3203} {"train_loss": -25.351926803588867, "global_step": 265894, "epoch": 3203} {"train_loss": -25.037817001342773, "global_step": 265895, "epoch": 3203} {"train_loss": -25.158063888549805, "global_step": 265896, "epoch": 3203} {"train_loss": -25.183704376220703, "global_step": 265897, "epoch": 3203} {"train_loss": -24.801671981811523, "global_step": 265898, "epoch": 3203} {"train_loss": -25.168935775756836, "global_step": 265899, "epoch": 3203} {"train_loss": -25.003429412841797, "global_step": 265900, "epoch": 3203} {"train_loss": -24.8302059173584, "global_step": 265901, "epoch": 3203} {"train_loss": -24.684162139892578, "global_step": 265902, "epoch": 3203} {"train_loss": -24.927783966064453, "global_step": 265903, "epoch": 3203} {"train_loss": -25.551227569580078, "global_step": 265904, "epoch": 3203} {"train_loss": -25.18208885192871, "global_step": 265905, "epoch": 3203} {"train_loss": -24.883941650390625, "global_step": 265906, "epoch": 3203} {"train_loss": -24.816965103149414, "global_step": 265907, "epoch": 3203} {"train_loss": -24.622222900390625, "global_step": 265908, "epoch": 3203} {"train_loss": -25.434926986694336, "global_step": 265909, "epoch": 3203} {"train_loss": -25.01801109313965, "global_step": 265910, "epoch": 3203} {"train_loss": -24.795166015625, "global_step": 265911, "epoch": 3203} {"train_loss": -25.1862850189209, "global_step": 265912, "epoch": 3203} {"train_loss": -25.537900924682617, "global_step": 265913, "epoch": 3203} {"train_loss": -25.3715877532959, "global_step": 265914, "epoch": 3203} {"train_loss": -25.343345642089844, "global_step": 265915, "epoch": 3203} {"train_loss": -24.893178939819336, "global_step": 265916, "epoch": 3203} {"train_loss": -25.00682258605957, "global_step": 265917, "epoch": 3203} {"train_loss": -25.339025497436523, "global_step": 265918, "epoch": 3203} {"train_loss": -25.23719596862793, "global_step": 265919, "epoch": 3203} {"train_loss": -25.479923248291016, "global_step": 265920, "epoch": 3203} {"train_loss": -24.841567993164062, "global_step": 265921, "epoch": 3203} {"train_loss": -25.650548934936523, "global_step": 265922, "epoch": 3203} {"train_loss": -25.2622013092041, "global_step": 265923, "epoch": 3203} {"train_loss": -25.466922760009766, "global_step": 265924, "epoch": 3203} {"train_loss": -25.446712493896484, "global_step": 265925, "epoch": 3203} {"train_loss": -25.53041648864746, "global_step": 265926, "epoch": 3203} {"train_loss": -25.05858039855957, "global_step": 265927, "epoch": 3203} {"train_loss": -25.902374267578125, "global_step": 265928, "epoch": 3203} {"train_loss": -25.03542137145996, "global_step": 265929, "epoch": 3203} {"train_loss": -25.257177352905273, "global_step": 265930, "epoch": 3203} {"train_loss": -25.12628387543092, "global_step": 265931, "epoch": 3203, "val_loss": 6815255.0} {"train_loss": -24.44025230407715, "global_step": 265932, "epoch": 3204} {"train_loss": -24.23646354675293, "global_step": 265933, "epoch": 3204} {"train_loss": -24.647558212280273, "global_step": 265934, "epoch": 3204} {"train_loss": -24.77131462097168, "global_step": 265935, "epoch": 3204} {"train_loss": -24.456539154052734, "global_step": 265936, "epoch": 3204} {"train_loss": -24.687870025634766, "global_step": 265937, "epoch": 3204} {"train_loss": -25.15094757080078, "global_step": 265938, "epoch": 3204} {"train_loss": -24.862825393676758, "global_step": 265939, "epoch": 3204} {"train_loss": -24.74067497253418, "global_step": 265940, "epoch": 3204} {"train_loss": -25.251523971557617, "global_step": 265941, "epoch": 3204} {"train_loss": -24.820632934570312, "global_step": 265942, "epoch": 3204} {"train_loss": -25.107254028320312, "global_step": 265943, "epoch": 3204} {"train_loss": -24.819217681884766, "global_step": 265944, "epoch": 3204} {"train_loss": -25.02664566040039, "global_step": 265945, "epoch": 3204} {"train_loss": -25.1906681060791, "global_step": 265946, "epoch": 3204} {"train_loss": -24.475614547729492, "global_step": 265947, "epoch": 3204} {"train_loss": -25.323637008666992, "global_step": 265948, "epoch": 3204} {"train_loss": -24.8681640625, "global_step": 265949, "epoch": 3204} {"train_loss": -24.817880630493164, "global_step": 265950, "epoch": 3204} {"train_loss": -25.39838218688965, "global_step": 265951, "epoch": 3204} {"train_loss": -25.289575576782227, "global_step": 265952, "epoch": 3204} {"train_loss": -25.141550064086914, "global_step": 265953, "epoch": 3204} {"train_loss": -24.66817855834961, "global_step": 265954, "epoch": 3204} {"train_loss": -25.17144203186035, "global_step": 265955, "epoch": 3204} {"train_loss": -25.187986373901367, "global_step": 265956, "epoch": 3204} {"train_loss": -24.961469650268555, "global_step": 265957, "epoch": 3204} {"train_loss": -25.20660972595215, "global_step": 265958, "epoch": 3204} {"train_loss": -25.400495529174805, "global_step": 265959, "epoch": 3204} {"train_loss": -25.165271759033203, "global_step": 265960, "epoch": 3204} {"train_loss": -25.197031021118164, "global_step": 265961, "epoch": 3204} {"train_loss": -25.232032775878906, "global_step": 265962, "epoch": 3204} {"train_loss": -25.262516021728516, "global_step": 265963, "epoch": 3204} {"train_loss": -25.21967124938965, "global_step": 265964, "epoch": 3204} {"train_loss": -24.8878116607666, "global_step": 265965, "epoch": 3204} {"train_loss": -24.919851303100586, "global_step": 265966, "epoch": 3204} {"train_loss": -25.520694732666016, "global_step": 265967, "epoch": 3204} {"train_loss": -24.992525100708008, "global_step": 265968, "epoch": 3204} {"train_loss": -25.11751365661621, "global_step": 265969, "epoch": 3204} {"train_loss": -25.10724449157715, "global_step": 265970, "epoch": 3204} {"train_loss": -25.309823989868164, "global_step": 265971, "epoch": 3204} {"train_loss": -25.504316329956055, "global_step": 265972, "epoch": 3204} {"train_loss": -25.010183334350586, "global_step": 265973, "epoch": 3204} {"train_loss": -25.262907028198242, "global_step": 265974, "epoch": 3204} {"train_loss": -25.367841720581055, "global_step": 265975, "epoch": 3204} {"train_loss": -25.479625701904297, "global_step": 265976, "epoch": 3204} {"train_loss": -25.521656036376953, "global_step": 265977, "epoch": 3204} {"train_loss": -25.350078582763672, "global_step": 265978, "epoch": 3204} {"train_loss": -25.289880752563477, "global_step": 265979, "epoch": 3204} {"train_loss": -25.402585983276367, "global_step": 265980, "epoch": 3204} {"train_loss": -25.88689613342285, "global_step": 265981, "epoch": 3204} {"train_loss": -25.32575035095215, "global_step": 265982, "epoch": 3204} {"train_loss": -25.37862205505371, "global_step": 265983, "epoch": 3204} {"train_loss": -24.848798751831055, "global_step": 265984, "epoch": 3204} {"train_loss": -25.160539627075195, "global_step": 265985, "epoch": 3204} {"train_loss": -25.007476806640625, "global_step": 265986, "epoch": 3204} {"train_loss": -24.996484756469727, "global_step": 265987, "epoch": 3204} {"train_loss": -24.91237449645996, "global_step": 265988, "epoch": 3204} {"train_loss": -25.252973556518555, "global_step": 265989, "epoch": 3204} {"train_loss": -25.5297794342041, "global_step": 265990, "epoch": 3204} {"train_loss": -25.370935440063477, "global_step": 265991, "epoch": 3204} {"train_loss": -24.774784088134766, "global_step": 265992, "epoch": 3204} {"train_loss": -25.33000373840332, "global_step": 265993, "epoch": 3204} {"train_loss": -25.245893478393555, "global_step": 265994, "epoch": 3204} {"train_loss": -25.272262573242188, "global_step": 265995, "epoch": 3204} {"train_loss": -25.041162490844727, "global_step": 265996, "epoch": 3204} {"train_loss": -25.076435089111328, "global_step": 265997, "epoch": 3204} {"train_loss": -24.967721939086914, "global_step": 265998, "epoch": 3204} {"train_loss": -25.36908531188965, "global_step": 265999, "epoch": 3204} {"train_loss": -25.531553268432617, "global_step": 266000, "epoch": 3204} {"train_loss": -25.20761489868164, "global_step": 266001, "epoch": 3204} {"train_loss": -25.2265682220459, "global_step": 266002, "epoch": 3204} {"train_loss": -25.00802993774414, "global_step": 266003, "epoch": 3204} {"train_loss": -24.90468406677246, "global_step": 266004, "epoch": 3204} {"train_loss": -25.26616859436035, "global_step": 266005, "epoch": 3204} {"train_loss": -25.49464225769043, "global_step": 266006, "epoch": 3204} {"train_loss": -25.24861717224121, "global_step": 266007, "epoch": 3204} {"train_loss": -25.318038940429688, "global_step": 266008, "epoch": 3204} {"train_loss": -24.948450088500977, "global_step": 266009, "epoch": 3204} {"train_loss": -25.402511596679688, "global_step": 266010, "epoch": 3204} {"train_loss": -25.454442977905273, "global_step": 266011, "epoch": 3204} {"train_loss": -25.38563346862793, "global_step": 266012, "epoch": 3204} {"train_loss": -24.975942611694336, "global_step": 266013, "epoch": 3204} {"train_loss": -25.13236055029444, "global_step": 266014, "epoch": 3204, "val_loss": 6846558.0} {"train_loss": -24.66130828857422, "global_step": 266015, "epoch": 3205} {"train_loss": -25.00653839111328, "global_step": 266016, "epoch": 3205} {"train_loss": -24.8969783782959, "global_step": 266017, "epoch": 3205} {"train_loss": -25.06073570251465, "global_step": 266018, "epoch": 3205} {"train_loss": -24.876628875732422, "global_step": 266019, "epoch": 3205} {"train_loss": -24.95634651184082, "global_step": 266020, "epoch": 3205} {"train_loss": -25.129684448242188, "global_step": 266021, "epoch": 3205} {"train_loss": -25.44354820251465, "global_step": 266022, "epoch": 3205} {"train_loss": -24.921009063720703, "global_step": 266023, "epoch": 3205} {"train_loss": -25.214693069458008, "global_step": 266024, "epoch": 3205} {"train_loss": -24.969852447509766, "global_step": 266025, "epoch": 3205} {"train_loss": -25.017608642578125, "global_step": 266026, "epoch": 3205} {"train_loss": -25.20513916015625, "global_step": 266027, "epoch": 3205} {"train_loss": -25.14482307434082, "global_step": 266028, "epoch": 3205} {"train_loss": -25.168962478637695, "global_step": 266029, "epoch": 3205} {"train_loss": -25.460540771484375, "global_step": 266030, "epoch": 3205} {"train_loss": -25.342639923095703, "global_step": 266031, "epoch": 3205} {"train_loss": -25.39560890197754, "global_step": 266032, "epoch": 3205} {"train_loss": -25.192899703979492, "global_step": 266033, "epoch": 3205} {"train_loss": -25.112892150878906, "global_step": 266034, "epoch": 3205} {"train_loss": -25.024587631225586, "global_step": 266035, "epoch": 3205} {"train_loss": -25.141151428222656, "global_step": 266036, "epoch": 3205} {"train_loss": -25.357236862182617, "global_step": 266037, "epoch": 3205} {"train_loss": -25.21405601501465, "global_step": 266038, "epoch": 3205} {"train_loss": -25.42959976196289, "global_step": 266039, "epoch": 3205} {"train_loss": -25.140628814697266, "global_step": 266040, "epoch": 3205} {"train_loss": -25.369794845581055, "global_step": 266041, "epoch": 3205} {"train_loss": -25.635395050048828, "global_step": 266042, "epoch": 3205} {"train_loss": -25.649829864501953, "global_step": 266043, "epoch": 3205} {"train_loss": -25.105133056640625, "global_step": 266044, "epoch": 3205} {"train_loss": -25.082048416137695, "global_step": 266045, "epoch": 3205} {"train_loss": -25.230716705322266, "global_step": 266046, "epoch": 3205} {"train_loss": -24.980159759521484, "global_step": 266047, "epoch": 3205} {"train_loss": -25.310895919799805, "global_step": 266048, "epoch": 3205} {"train_loss": -25.316619873046875, "global_step": 266049, "epoch": 3205} {"train_loss": -25.527692794799805, "global_step": 266050, "epoch": 3205} {"train_loss": -25.508604049682617, "global_step": 266051, "epoch": 3205} {"train_loss": -25.02056312561035, "global_step": 266052, "epoch": 3205} {"train_loss": -25.35638999938965, "global_step": 266053, "epoch": 3205} {"train_loss": -25.40549087524414, "global_step": 266054, "epoch": 3205} {"train_loss": -25.341554641723633, "global_step": 266055, "epoch": 3205} {"train_loss": -25.34491539001465, "global_step": 266056, "epoch": 3205} {"train_loss": -25.429365158081055, "global_step": 266057, "epoch": 3205} {"train_loss": -25.254175186157227, "global_step": 266058, "epoch": 3205} {"train_loss": -24.99238395690918, "global_step": 266059, "epoch": 3205} {"train_loss": -25.309856414794922, "global_step": 266060, "epoch": 3205} {"train_loss": -25.290863037109375, "global_step": 266061, "epoch": 3205} {"train_loss": -25.218338012695312, "global_step": 266062, "epoch": 3205} {"train_loss": -25.576045989990234, "global_step": 266063, "epoch": 3205} {"train_loss": -25.44390869140625, "global_step": 266064, "epoch": 3205} {"train_loss": -25.042409896850586, "global_step": 266065, "epoch": 3205} {"train_loss": -25.383176803588867, "global_step": 266066, "epoch": 3205} {"train_loss": -25.07851791381836, "global_step": 266067, "epoch": 3205} {"train_loss": -25.61615562438965, "global_step": 266068, "epoch": 3205} {"train_loss": -25.042890548706055, "global_step": 266069, "epoch": 3205} {"train_loss": -25.107345581054688, "global_step": 266070, "epoch": 3205} {"train_loss": -25.32377052307129, "global_step": 266071, "epoch": 3205} {"train_loss": -25.456533432006836, "global_step": 266072, "epoch": 3205} {"train_loss": -25.206939697265625, "global_step": 266073, "epoch": 3205} {"train_loss": -25.44254493713379, "global_step": 266074, "epoch": 3205} {"train_loss": -25.191673278808594, "global_step": 266075, "epoch": 3205} {"train_loss": -25.483266830444336, "global_step": 266076, "epoch": 3205} {"train_loss": -25.45772361755371, "global_step": 266077, "epoch": 3205} {"train_loss": -25.557340621948242, "global_step": 266078, "epoch": 3205} {"train_loss": -25.26643943786621, "global_step": 266079, "epoch": 3205} {"train_loss": -25.297731399536133, "global_step": 266080, "epoch": 3205} {"train_loss": -25.20408058166504, "global_step": 266081, "epoch": 3205} {"train_loss": -24.788415908813477, "global_step": 266082, "epoch": 3205} {"train_loss": -24.881229400634766, "global_step": 266083, "epoch": 3205} {"train_loss": -25.62824821472168, "global_step": 266084, "epoch": 3205} {"train_loss": -25.702993392944336, "global_step": 266085, "epoch": 3205} {"train_loss": -25.239931106567383, "global_step": 266086, "epoch": 3205} {"train_loss": -25.288700103759766, "global_step": 266087, "epoch": 3205} {"train_loss": -25.162572860717773, "global_step": 266088, "epoch": 3205} {"train_loss": -25.483972549438477, "global_step": 266089, "epoch": 3205} {"train_loss": -25.24904441833496, "global_step": 266090, "epoch": 3205} {"train_loss": -25.1862850189209, "global_step": 266091, "epoch": 3205} {"train_loss": -25.18307876586914, "global_step": 266092, "epoch": 3205} {"train_loss": -24.972509384155273, "global_step": 266093, "epoch": 3205} {"train_loss": -25.7021484375, "global_step": 266094, "epoch": 3205} {"train_loss": -25.246854782104492, "global_step": 266095, "epoch": 3205} {"train_loss": -24.949716567993164, "global_step": 266096, "epoch": 3205} {"train_loss": -25.237420599144624, "global_step": 266097, "epoch": 3205, "val_loss": 6941924.0} {"train_loss": -25.174177169799805, "global_step": 266098, "epoch": 3206} {"train_loss": -24.968042373657227, "global_step": 266099, "epoch": 3206} {"train_loss": -25.16264533996582, "global_step": 266100, "epoch": 3206} {"train_loss": -25.043622970581055, "global_step": 266101, "epoch": 3206} {"train_loss": -24.837926864624023, "global_step": 266102, "epoch": 3206} {"train_loss": -25.255178451538086, "global_step": 266103, "epoch": 3206} {"train_loss": -25.017120361328125, "global_step": 266104, "epoch": 3206} {"train_loss": -25.594411849975586, "global_step": 266105, "epoch": 3206} {"train_loss": -25.313663482666016, "global_step": 266106, "epoch": 3206} {"train_loss": -25.065826416015625, "global_step": 266107, "epoch": 3206} {"train_loss": -25.194738388061523, "global_step": 266108, "epoch": 3206} {"train_loss": -25.399864196777344, "global_step": 266109, "epoch": 3206} {"train_loss": -25.503929138183594, "global_step": 266110, "epoch": 3206} {"train_loss": -25.100797653198242, "global_step": 266111, "epoch": 3206} {"train_loss": -25.125823974609375, "global_step": 266112, "epoch": 3206} {"train_loss": -25.110807418823242, "global_step": 266113, "epoch": 3206} {"train_loss": -25.333568572998047, "global_step": 266114, "epoch": 3206} {"train_loss": -25.254751205444336, "global_step": 266115, "epoch": 3206} {"train_loss": -25.06370735168457, "global_step": 266116, "epoch": 3206} {"train_loss": -25.235929489135742, "global_step": 266117, "epoch": 3206} {"train_loss": -25.25501823425293, "global_step": 266118, "epoch": 3206} {"train_loss": -25.383621215820312, "global_step": 266119, "epoch": 3206} {"train_loss": -24.725997924804688, "global_step": 266120, "epoch": 3206} {"train_loss": -24.646902084350586, "global_step": 266121, "epoch": 3206} {"train_loss": -25.24903678894043, "global_step": 266122, "epoch": 3206} {"train_loss": -25.267200469970703, "global_step": 266123, "epoch": 3206} {"train_loss": -24.848363876342773, "global_step": 266124, "epoch": 3206} {"train_loss": -25.229963302612305, "global_step": 266125, "epoch": 3206} {"train_loss": -25.195615768432617, "global_step": 266126, "epoch": 3206} {"train_loss": -24.81000518798828, "global_step": 266127, "epoch": 3206} {"train_loss": -25.446500778198242, "global_step": 266128, "epoch": 3206} {"train_loss": -25.451797485351562, "global_step": 266129, "epoch": 3206} {"train_loss": -25.33613395690918, "global_step": 266130, "epoch": 3206} {"train_loss": -25.153976440429688, "global_step": 266131, "epoch": 3206} {"train_loss": -25.018178939819336, "global_step": 266132, "epoch": 3206} {"train_loss": -25.141307830810547, "global_step": 266133, "epoch": 3206} {"train_loss": -25.342618942260742, "global_step": 266134, "epoch": 3206} {"train_loss": -25.22269058227539, "global_step": 266135, "epoch": 3206} {"train_loss": -25.002065658569336, "global_step": 266136, "epoch": 3206} {"train_loss": -25.69663429260254, "global_step": 266137, "epoch": 3206} {"train_loss": -25.4744815826416, "global_step": 266138, "epoch": 3206} {"train_loss": -25.605682373046875, "global_step": 266139, "epoch": 3206} {"train_loss": -25.520193099975586, "global_step": 266140, "epoch": 3206} {"train_loss": -25.497846603393555, "global_step": 266141, "epoch": 3206} {"train_loss": -25.43600845336914, "global_step": 266142, "epoch": 3206} {"train_loss": -25.571142196655273, "global_step": 266143, "epoch": 3206} {"train_loss": -25.19746971130371, "global_step": 266144, "epoch": 3206} {"train_loss": -25.442373275756836, "global_step": 266145, "epoch": 3206} {"train_loss": -24.956396102905273, "global_step": 266146, "epoch": 3206} {"train_loss": -25.409252166748047, "global_step": 266147, "epoch": 3206} {"train_loss": -25.08802604675293, "global_step": 266148, "epoch": 3206} {"train_loss": -25.192880630493164, "global_step": 266149, "epoch": 3206} {"train_loss": -25.27567481994629, "global_step": 266150, "epoch": 3206} {"train_loss": -24.96083641052246, "global_step": 266151, "epoch": 3206} {"train_loss": -25.300941467285156, "global_step": 266152, "epoch": 3206} {"train_loss": -25.355642318725586, "global_step": 266153, "epoch": 3206} {"train_loss": -25.329397201538086, "global_step": 266154, "epoch": 3206} {"train_loss": -25.320281982421875, "global_step": 266155, "epoch": 3206} {"train_loss": -24.87957000732422, "global_step": 266156, "epoch": 3206} {"train_loss": -24.971546173095703, "global_step": 266157, "epoch": 3206} {"train_loss": -25.429275512695312, "global_step": 266158, "epoch": 3206} {"train_loss": -25.099706649780273, "global_step": 266159, "epoch": 3206} {"train_loss": -25.02578353881836, "global_step": 266160, "epoch": 3206} {"train_loss": -24.90545082092285, "global_step": 266161, "epoch": 3206} {"train_loss": -25.071714401245117, "global_step": 266162, "epoch": 3206} {"train_loss": -24.854907989501953, "global_step": 266163, "epoch": 3206} {"train_loss": -24.59153175354004, "global_step": 266164, "epoch": 3206} {"train_loss": -24.749481201171875, "global_step": 266165, "epoch": 3206} {"train_loss": -25.14015007019043, "global_step": 266166, "epoch": 3206} {"train_loss": -25.14166259765625, "global_step": 266167, "epoch": 3206} {"train_loss": -25.208200454711914, "global_step": 266168, "epoch": 3206} {"train_loss": -25.225723266601562, "global_step": 266169, "epoch": 3206} {"train_loss": -25.046049118041992, "global_step": 266170, "epoch": 3206} {"train_loss": -25.560590744018555, "global_step": 266171, "epoch": 3206} {"train_loss": -25.330562591552734, "global_step": 266172, "epoch": 3206} {"train_loss": -24.985187530517578, "global_step": 266173, "epoch": 3206} {"train_loss": -25.117938995361328, "global_step": 266174, "epoch": 3206} {"train_loss": -25.004209518432617, "global_step": 266175, "epoch": 3206} {"train_loss": -25.920745849609375, "global_step": 266176, "epoch": 3206} {"train_loss": -25.281822204589844, "global_step": 266177, "epoch": 3206} {"train_loss": -25.409648895263672, "global_step": 266178, "epoch": 3206} {"train_loss": -25.707319259643555, "global_step": 266179, "epoch": 3206} {"train_loss": -25.195855037275567, "global_step": 266180, "epoch": 3206, "val_loss": 6939765.5} {"train_loss": -24.70826530456543, "global_step": 266181, "epoch": 3207} {"train_loss": -24.766529083251953, "global_step": 266182, "epoch": 3207} {"train_loss": -24.636159896850586, "global_step": 266183, "epoch": 3207} {"train_loss": -24.780622482299805, "global_step": 266184, "epoch": 3207} {"train_loss": -25.147415161132812, "global_step": 266185, "epoch": 3207} {"train_loss": -25.058347702026367, "global_step": 266186, "epoch": 3207} {"train_loss": -24.385013580322266, "global_step": 266187, "epoch": 3207} {"train_loss": -25.301868438720703, "global_step": 266188, "epoch": 3207} {"train_loss": -24.814434051513672, "global_step": 266189, "epoch": 3207} {"train_loss": -24.621173858642578, "global_step": 266190, "epoch": 3207} {"train_loss": -25.233579635620117, "global_step": 266191, "epoch": 3207} {"train_loss": -24.866790771484375, "global_step": 266192, "epoch": 3207} {"train_loss": -24.940828323364258, "global_step": 266193, "epoch": 3207} {"train_loss": -24.848596572875977, "global_step": 266194, "epoch": 3207} {"train_loss": -24.78053092956543, "global_step": 266195, "epoch": 3207} {"train_loss": -25.40659523010254, "global_step": 266196, "epoch": 3207} {"train_loss": -25.17215919494629, "global_step": 266197, "epoch": 3207} {"train_loss": -25.04637336730957, "global_step": 266198, "epoch": 3207} {"train_loss": -25.42144012451172, "global_step": 266199, "epoch": 3207} {"train_loss": -25.180038452148438, "global_step": 266200, "epoch": 3207} {"train_loss": -25.388696670532227, "global_step": 266201, "epoch": 3207} {"train_loss": -25.743255615234375, "global_step": 266202, "epoch": 3207} {"train_loss": -25.175268173217773, "global_step": 266203, "epoch": 3207} {"train_loss": -25.320301055908203, "global_step": 266204, "epoch": 3207} {"train_loss": -25.086532592773438, "global_step": 266205, "epoch": 3207} {"train_loss": -25.00551414489746, "global_step": 266206, "epoch": 3207} {"train_loss": -25.12398338317871, "global_step": 266207, "epoch": 3207} {"train_loss": -25.278766632080078, "global_step": 266208, "epoch": 3207} {"train_loss": -25.583480834960938, "global_step": 266209, "epoch": 3207} {"train_loss": -25.53363609313965, "global_step": 266210, "epoch": 3207} {"train_loss": -25.222475051879883, "global_step": 266211, "epoch": 3207} {"train_loss": -25.041044235229492, "global_step": 266212, "epoch": 3207} {"train_loss": -25.192792892456055, "global_step": 266213, "epoch": 3207} {"train_loss": -25.153446197509766, "global_step": 266214, "epoch": 3207} {"train_loss": -24.944822311401367, "global_step": 266215, "epoch": 3207} {"train_loss": -25.246143341064453, "global_step": 266216, "epoch": 3207} {"train_loss": -25.675384521484375, "global_step": 266217, "epoch": 3207} {"train_loss": -25.443878173828125, "global_step": 266218, "epoch": 3207} {"train_loss": -25.094228744506836, "global_step": 266219, "epoch": 3207} {"train_loss": -25.017927169799805, "global_step": 266220, "epoch": 3207} {"train_loss": -25.665359497070312, "global_step": 266221, "epoch": 3207} {"train_loss": -25.48992919921875, "global_step": 266222, "epoch": 3207} {"train_loss": -25.366201400756836, "global_step": 266223, "epoch": 3207} {"train_loss": -25.672285079956055, "global_step": 266224, "epoch": 3207} {"train_loss": -25.361480712890625, "global_step": 266225, "epoch": 3207} {"train_loss": -25.134092330932617, "global_step": 266226, "epoch": 3207} {"train_loss": -25.269346237182617, "global_step": 266227, "epoch": 3207} {"train_loss": -25.104684829711914, "global_step": 266228, "epoch": 3207} {"train_loss": -25.658828735351562, "global_step": 266229, "epoch": 3207} {"train_loss": -25.401397705078125, "global_step": 266230, "epoch": 3207} {"train_loss": -25.3574275970459, "global_step": 266231, "epoch": 3207} {"train_loss": -25.22830581665039, "global_step": 266232, "epoch": 3207} {"train_loss": -25.499845504760742, "global_step": 266233, "epoch": 3207} {"train_loss": -25.357484817504883, "global_step": 266234, "epoch": 3207} {"train_loss": -25.614383697509766, "global_step": 266235, "epoch": 3207} {"train_loss": -24.918508529663086, "global_step": 266236, "epoch": 3207} {"train_loss": -25.219655990600586, "global_step": 266237, "epoch": 3207} {"train_loss": -24.935152053833008, "global_step": 266238, "epoch": 3207} {"train_loss": -24.424039840698242, "global_step": 266239, "epoch": 3207} {"train_loss": -24.751739501953125, "global_step": 266240, "epoch": 3207} {"train_loss": -24.7875919342041, "global_step": 266241, "epoch": 3207} {"train_loss": -25.035905838012695, "global_step": 266242, "epoch": 3207} {"train_loss": -24.7978515625, "global_step": 266243, "epoch": 3207} {"train_loss": -25.067590713500977, "global_step": 266244, "epoch": 3207} {"train_loss": -25.002119064331055, "global_step": 266245, "epoch": 3207} {"train_loss": -25.3693790435791, "global_step": 266246, "epoch": 3207} {"train_loss": -25.127307891845703, "global_step": 266247, "epoch": 3207} {"train_loss": -25.280147552490234, "global_step": 266248, "epoch": 3207} {"train_loss": -24.999914169311523, "global_step": 266249, "epoch": 3207} {"train_loss": -24.992460250854492, "global_step": 266250, "epoch": 3207} {"train_loss": -25.405242919921875, "global_step": 266251, "epoch": 3207} {"train_loss": -25.539716720581055, "global_step": 266252, "epoch": 3207} {"train_loss": -24.807571411132812, "global_step": 266253, "epoch": 3207} {"train_loss": -25.268598556518555, "global_step": 266254, "epoch": 3207} {"train_loss": -24.97491455078125, "global_step": 266255, "epoch": 3207} {"train_loss": -25.399229049682617, "global_step": 266256, "epoch": 3207} {"train_loss": -25.161741256713867, "global_step": 266257, "epoch": 3207} {"train_loss": -25.239049911499023, "global_step": 266258, "epoch": 3207} {"train_loss": -25.34796142578125, "global_step": 266259, "epoch": 3207} {"train_loss": -25.03022575378418, "global_step": 266260, "epoch": 3207} {"train_loss": -25.18533706665039, "global_step": 266261, "epoch": 3207} {"train_loss": -24.7933349609375, "global_step": 266262, "epoch": 3207} {"train_loss": -25.150841356760047, "global_step": 266263, "epoch": 3207, "val_loss": 6883954.0} {"train_loss": -24.9553279876709, "global_step": 266264, "epoch": 3208} {"train_loss": -24.78173828125, "global_step": 266265, "epoch": 3208} {"train_loss": -25.0384578704834, "global_step": 266266, "epoch": 3208} {"train_loss": -25.003141403198242, "global_step": 266267, "epoch": 3208} {"train_loss": -25.058456420898438, "global_step": 266268, "epoch": 3208} {"train_loss": -24.788564682006836, "global_step": 266269, "epoch": 3208} {"train_loss": -24.570022583007812, "global_step": 266270, "epoch": 3208} {"train_loss": -24.69675636291504, "global_step": 266271, "epoch": 3208} {"train_loss": -24.869169235229492, "global_step": 266272, "epoch": 3208} {"train_loss": -25.000513076782227, "global_step": 266273, "epoch": 3208} {"train_loss": -25.199703216552734, "global_step": 266274, "epoch": 3208} {"train_loss": -25.44656753540039, "global_step": 266275, "epoch": 3208} {"train_loss": -24.825740814208984, "global_step": 266276, "epoch": 3208} {"train_loss": -25.27518653869629, "global_step": 266277, "epoch": 3208} {"train_loss": -25.188518524169922, "global_step": 266278, "epoch": 3208} {"train_loss": -25.18123435974121, "global_step": 266279, "epoch": 3208} {"train_loss": -25.23526382446289, "global_step": 266280, "epoch": 3208} {"train_loss": -25.17482566833496, "global_step": 266281, "epoch": 3208} {"train_loss": -25.212839126586914, "global_step": 266282, "epoch": 3208} {"train_loss": -25.204172134399414, "global_step": 266283, "epoch": 3208} {"train_loss": -25.38825798034668, "global_step": 266284, "epoch": 3208} {"train_loss": -24.97988510131836, "global_step": 266285, "epoch": 3208} {"train_loss": -25.40424919128418, "global_step": 266286, "epoch": 3208} {"train_loss": -25.217348098754883, "global_step": 266287, "epoch": 3208} {"train_loss": -25.12921714782715, "global_step": 266288, "epoch": 3208} {"train_loss": -25.25374984741211, "global_step": 266289, "epoch": 3208} {"train_loss": -25.31995964050293, "global_step": 266290, "epoch": 3208} {"train_loss": -25.242862701416016, "global_step": 266291, "epoch": 3208} {"train_loss": -24.99358558654785, "global_step": 266292, "epoch": 3208} {"train_loss": -25.254932403564453, "global_step": 266293, "epoch": 3208} {"train_loss": -25.462778091430664, "global_step": 266294, "epoch": 3208} {"train_loss": -25.30533790588379, "global_step": 266295, "epoch": 3208} {"train_loss": -25.381031036376953, "global_step": 266296, "epoch": 3208} {"train_loss": -25.409128189086914, "global_step": 266297, "epoch": 3208} {"train_loss": -25.4285945892334, "global_step": 266298, "epoch": 3208} {"train_loss": -25.20591926574707, "global_step": 266299, "epoch": 3208} {"train_loss": -25.14748764038086, "global_step": 266300, "epoch": 3208} {"train_loss": -25.23909568786621, "global_step": 266301, "epoch": 3208} {"train_loss": -25.42831802368164, "global_step": 266302, "epoch": 3208} {"train_loss": -25.500940322875977, "global_step": 266303, "epoch": 3208} {"train_loss": -25.519556045532227, "global_step": 266304, "epoch": 3208} {"train_loss": -25.38239097595215, "global_step": 266305, "epoch": 3208} {"train_loss": -25.535829544067383, "global_step": 266306, "epoch": 3208} {"train_loss": -25.22384262084961, "global_step": 266307, "epoch": 3208} {"train_loss": -25.078584671020508, "global_step": 266308, "epoch": 3208} {"train_loss": -25.383520126342773, "global_step": 266309, "epoch": 3208} {"train_loss": -25.244510650634766, "global_step": 266310, "epoch": 3208} {"train_loss": -25.575220108032227, "global_step": 266311, "epoch": 3208} {"train_loss": -25.492780685424805, "global_step": 266312, "epoch": 3208} {"train_loss": -25.461566925048828, "global_step": 266313, "epoch": 3208} {"train_loss": -25.36985206604004, "global_step": 266314, "epoch": 3208} {"train_loss": -25.014724731445312, "global_step": 266315, "epoch": 3208} {"train_loss": -24.72993278503418, "global_step": 266316, "epoch": 3208} {"train_loss": -24.966835021972656, "global_step": 266317, "epoch": 3208} {"train_loss": -24.462757110595703, "global_step": 266318, "epoch": 3208} {"train_loss": -24.333242416381836, "global_step": 266319, "epoch": 3208} {"train_loss": -24.33639907836914, "global_step": 266320, "epoch": 3208} {"train_loss": -25.210397720336914, "global_step": 266321, "epoch": 3208} {"train_loss": -24.181745529174805, "global_step": 266322, "epoch": 3208} {"train_loss": -24.788848876953125, "global_step": 266323, "epoch": 3208} {"train_loss": -24.952838897705078, "global_step": 266324, "epoch": 3208} {"train_loss": -24.437196731567383, "global_step": 266325, "epoch": 3208} {"train_loss": -24.53656005859375, "global_step": 266326, "epoch": 3208} {"train_loss": -24.90070915222168, "global_step": 266327, "epoch": 3208} {"train_loss": -25.018783569335938, "global_step": 266328, "epoch": 3208} {"train_loss": -24.899673461914062, "global_step": 266329, "epoch": 3208} {"train_loss": -25.095029830932617, "global_step": 266330, "epoch": 3208} {"train_loss": -25.215879440307617, "global_step": 266331, "epoch": 3208} {"train_loss": -24.846792221069336, "global_step": 266332, "epoch": 3208} {"train_loss": -24.673669815063477, "global_step": 266333, "epoch": 3208} {"train_loss": -25.035371780395508, "global_step": 266334, "epoch": 3208} {"train_loss": -25.119659423828125, "global_step": 266335, "epoch": 3208} {"train_loss": -25.206125259399414, "global_step": 266336, "epoch": 3208} {"train_loss": -24.897878646850586, "global_step": 266337, "epoch": 3208} {"train_loss": -25.07512092590332, "global_step": 266338, "epoch": 3208} {"train_loss": -25.26055908203125, "global_step": 266339, "epoch": 3208} {"train_loss": -25.254165649414062, "global_step": 266340, "epoch": 3208} {"train_loss": -25.264129638671875, "global_step": 266341, "epoch": 3208} {"train_loss": -25.45273780822754, "global_step": 266342, "epoch": 3208} {"train_loss": -25.03313446044922, "global_step": 266343, "epoch": 3208} {"train_loss": -25.436193466186523, "global_step": 266344, "epoch": 3208} {"train_loss": -24.969465255737305, "global_step": 266345, "epoch": 3208} {"train_loss": -25.08604330039886, "global_step": 266346, "epoch": 3208, "val_loss": 6986019.5} {"train_loss": -24.349546432495117, "global_step": 266347, "epoch": 3209} {"train_loss": -24.75579261779785, "global_step": 266348, "epoch": 3209} {"train_loss": -24.917293548583984, "global_step": 266349, "epoch": 3209} {"train_loss": -25.20992088317871, "global_step": 266350, "epoch": 3209} {"train_loss": -24.98141098022461, "global_step": 266351, "epoch": 3209} {"train_loss": -24.305234909057617, "global_step": 266352, "epoch": 3209} {"train_loss": -25.03403663635254, "global_step": 266353, "epoch": 3209} {"train_loss": -25.12369155883789, "global_step": 266354, "epoch": 3209} {"train_loss": -24.99728775024414, "global_step": 266355, "epoch": 3209} {"train_loss": -25.094236373901367, "global_step": 266356, "epoch": 3209} {"train_loss": -24.793386459350586, "global_step": 266357, "epoch": 3209} {"train_loss": -24.67620277404785, "global_step": 266358, "epoch": 3209} {"train_loss": -24.7801570892334, "global_step": 266359, "epoch": 3209} {"train_loss": -24.757665634155273, "global_step": 266360, "epoch": 3209} {"train_loss": -25.001659393310547, "global_step": 266361, "epoch": 3209} {"train_loss": -24.354339599609375, "global_step": 266362, "epoch": 3209} {"train_loss": -25.067136764526367, "global_step": 266363, "epoch": 3209} {"train_loss": -24.641138076782227, "global_step": 266364, "epoch": 3209} {"train_loss": -24.582290649414062, "global_step": 266365, "epoch": 3209} {"train_loss": -24.92864990234375, "global_step": 266366, "epoch": 3209} {"train_loss": -24.980915069580078, "global_step": 266367, "epoch": 3209} {"train_loss": -25.04640007019043, "global_step": 266368, "epoch": 3209} {"train_loss": -25.151525497436523, "global_step": 266369, "epoch": 3209} {"train_loss": -25.083576202392578, "global_step": 266370, "epoch": 3209} {"train_loss": -25.071744918823242, "global_step": 266371, "epoch": 3209} {"train_loss": -25.048063278198242, "global_step": 266372, "epoch": 3209} {"train_loss": -25.15998649597168, "global_step": 266373, "epoch": 3209} {"train_loss": -25.20882225036621, "global_step": 266374, "epoch": 3209} {"train_loss": -25.179697036743164, "global_step": 266375, "epoch": 3209} {"train_loss": -25.191307067871094, "global_step": 266376, "epoch": 3209} {"train_loss": -24.936859130859375, "global_step": 266377, "epoch": 3209} {"train_loss": -24.941951751708984, "global_step": 266378, "epoch": 3209} {"train_loss": -24.863489151000977, "global_step": 266379, "epoch": 3209} {"train_loss": -25.07880210876465, "global_step": 266380, "epoch": 3209} {"train_loss": -25.3310489654541, "global_step": 266381, "epoch": 3209} {"train_loss": -25.37407112121582, "global_step": 266382, "epoch": 3209} {"train_loss": -25.415996551513672, "global_step": 266383, "epoch": 3209} {"train_loss": -25.163288116455078, "global_step": 266384, "epoch": 3209} {"train_loss": -25.552183151245117, "global_step": 266385, "epoch": 3209} {"train_loss": -25.434782028198242, "global_step": 266386, "epoch": 3209} {"train_loss": -25.170578002929688, "global_step": 266387, "epoch": 3209} {"train_loss": -25.474842071533203, "global_step": 266388, "epoch": 3209} {"train_loss": -25.41128921508789, "global_step": 266389, "epoch": 3209} {"train_loss": -25.24428367614746, "global_step": 266390, "epoch": 3209} {"train_loss": -25.220115661621094, "global_step": 266391, "epoch": 3209} {"train_loss": -25.404951095581055, "global_step": 266392, "epoch": 3209} {"train_loss": -24.956018447875977, "global_step": 266393, "epoch": 3209} {"train_loss": -25.29258155822754, "global_step": 266394, "epoch": 3209} {"train_loss": -25.399932861328125, "global_step": 266395, "epoch": 3209} {"train_loss": -25.21224021911621, "global_step": 266396, "epoch": 3209} {"train_loss": -25.455795288085938, "global_step": 266397, "epoch": 3209} {"train_loss": -25.328601837158203, "global_step": 266398, "epoch": 3209} {"train_loss": -25.108640670776367, "global_step": 266399, "epoch": 3209} {"train_loss": -25.83534049987793, "global_step": 266400, "epoch": 3209} {"train_loss": -25.53306007385254, "global_step": 266401, "epoch": 3209} {"train_loss": -25.462661743164062, "global_step": 266402, "epoch": 3209} {"train_loss": -25.566999435424805, "global_step": 266403, "epoch": 3209} {"train_loss": -25.174968719482422, "global_step": 266404, "epoch": 3209} {"train_loss": -25.139785766601562, "global_step": 266405, "epoch": 3209} {"train_loss": -24.895954132080078, "global_step": 266406, "epoch": 3209} {"train_loss": -25.13179588317871, "global_step": 266407, "epoch": 3209} {"train_loss": -25.500370025634766, "global_step": 266408, "epoch": 3209} {"train_loss": -25.21246910095215, "global_step": 266409, "epoch": 3209} {"train_loss": -25.572309494018555, "global_step": 266410, "epoch": 3209} {"train_loss": -25.581106185913086, "global_step": 266411, "epoch": 3209} {"train_loss": -25.86261558532715, "global_step": 266412, "epoch": 3209} {"train_loss": -25.090856552124023, "global_step": 266413, "epoch": 3209} {"train_loss": -24.633953094482422, "global_step": 266414, "epoch": 3209} {"train_loss": -24.646108627319336, "global_step": 266415, "epoch": 3209} {"train_loss": -24.53419303894043, "global_step": 266416, "epoch": 3209} {"train_loss": -25.196218490600586, "global_step": 266417, "epoch": 3209} {"train_loss": -24.8321533203125, "global_step": 266418, "epoch": 3209} {"train_loss": -25.325048446655273, "global_step": 266419, "epoch": 3209} {"train_loss": -24.963958740234375, "global_step": 266420, "epoch": 3209} {"train_loss": -25.200326919555664, "global_step": 266421, "epoch": 3209} {"train_loss": -25.450387954711914, "global_step": 266422, "epoch": 3209} {"train_loss": -25.255149841308594, "global_step": 266423, "epoch": 3209} {"train_loss": -25.020389556884766, "global_step": 266424, "epoch": 3209} {"train_loss": -25.374126434326172, "global_step": 266425, "epoch": 3209} {"train_loss": -25.0844783782959, "global_step": 266426, "epoch": 3209} {"train_loss": -25.34633445739746, "global_step": 266427, "epoch": 3209} {"train_loss": -25.23406982421875, "global_step": 266428, "epoch": 3209} {"train_loss": -25.12102395942412, "global_step": 266429, "epoch": 3209, "val_loss": 6987167.5} {"train_loss": -23.560789108276367, "global_step": 266430, "epoch": 3210} {"train_loss": -24.783884048461914, "global_step": 266431, "epoch": 3210} {"train_loss": -24.730436325073242, "global_step": 266432, "epoch": 3210} {"train_loss": -24.088668823242188, "global_step": 266433, "epoch": 3210} {"train_loss": -24.747589111328125, "global_step": 266434, "epoch": 3210} {"train_loss": -24.51167106628418, "global_step": 266435, "epoch": 3210} {"train_loss": -24.47902488708496, "global_step": 266436, "epoch": 3210} {"train_loss": -24.511205673217773, "global_step": 266437, "epoch": 3210} {"train_loss": -24.78597068786621, "global_step": 266438, "epoch": 3210} {"train_loss": -24.333494186401367, "global_step": 266439, "epoch": 3210} {"train_loss": -24.95790672302246, "global_step": 266440, "epoch": 3210} {"train_loss": -25.045209884643555, "global_step": 266441, "epoch": 3210} {"train_loss": -24.85283851623535, "global_step": 266442, "epoch": 3210} {"train_loss": -24.693679809570312, "global_step": 266443, "epoch": 3210} {"train_loss": -24.954835891723633, "global_step": 266444, "epoch": 3210} {"train_loss": -25.17172622680664, "global_step": 266445, "epoch": 3210} {"train_loss": -24.961576461791992, "global_step": 266446, "epoch": 3210} {"train_loss": -24.926488876342773, "global_step": 266447, "epoch": 3210} {"train_loss": -25.111263275146484, "global_step": 266448, "epoch": 3210} {"train_loss": -24.62070083618164, "global_step": 266449, "epoch": 3210} {"train_loss": -25.08682632446289, "global_step": 266450, "epoch": 3210} {"train_loss": -24.757715225219727, "global_step": 266451, "epoch": 3210} {"train_loss": -24.98200225830078, "global_step": 266452, "epoch": 3210} {"train_loss": -24.742740631103516, "global_step": 266453, "epoch": 3210} {"train_loss": -24.94502830505371, "global_step": 266454, "epoch": 3210} {"train_loss": -25.30242347717285, "global_step": 266455, "epoch": 3210} {"train_loss": -25.419198989868164, "global_step": 266456, "epoch": 3210} {"train_loss": -24.981470108032227, "global_step": 266457, "epoch": 3210} {"train_loss": -25.327545166015625, "global_step": 266458, "epoch": 3210} {"train_loss": -24.850112915039062, "global_step": 266459, "epoch": 3210} {"train_loss": -25.165205001831055, "global_step": 266460, "epoch": 3210} {"train_loss": -25.171466827392578, "global_step": 266461, "epoch": 3210} {"train_loss": -25.249418258666992, "global_step": 266462, "epoch": 3210} {"train_loss": -25.102752685546875, "global_step": 266463, "epoch": 3210} {"train_loss": -25.239521026611328, "global_step": 266464, "epoch": 3210} {"train_loss": -25.12751579284668, "global_step": 266465, "epoch": 3210} {"train_loss": -25.20454978942871, "global_step": 266466, "epoch": 3210} {"train_loss": -24.99195671081543, "global_step": 266467, "epoch": 3210} {"train_loss": -24.863967895507812, "global_step": 266468, "epoch": 3210} {"train_loss": -25.285202026367188, "global_step": 266469, "epoch": 3210} {"train_loss": -24.917770385742188, "global_step": 266470, "epoch": 3210} {"train_loss": -24.7816219329834, "global_step": 266471, "epoch": 3210} {"train_loss": -25.148033142089844, "global_step": 266472, "epoch": 3210} {"train_loss": -24.90452003479004, "global_step": 266473, "epoch": 3210} {"train_loss": -25.06451416015625, "global_step": 266474, "epoch": 3210} {"train_loss": -24.889318466186523, "global_step": 266475, "epoch": 3210} {"train_loss": -25.162158966064453, "global_step": 266476, "epoch": 3210} {"train_loss": -25.304859161376953, "global_step": 266477, "epoch": 3210} {"train_loss": -25.032974243164062, "global_step": 266478, "epoch": 3210} {"train_loss": -25.227188110351562, "global_step": 266479, "epoch": 3210} {"train_loss": -25.348554611206055, "global_step": 266480, "epoch": 3210} {"train_loss": -25.007762908935547, "global_step": 266481, "epoch": 3210} {"train_loss": -25.24942970275879, "global_step": 266482, "epoch": 3210} {"train_loss": -25.434680938720703, "global_step": 266483, "epoch": 3210} {"train_loss": -25.441238403320312, "global_step": 266484, "epoch": 3210} {"train_loss": -25.111860275268555, "global_step": 266485, "epoch": 3210} {"train_loss": -25.305936813354492, "global_step": 266486, "epoch": 3210} {"train_loss": -25.040475845336914, "global_step": 266487, "epoch": 3210} {"train_loss": -24.959598541259766, "global_step": 266488, "epoch": 3210} {"train_loss": -25.28986167907715, "global_step": 266489, "epoch": 3210} {"train_loss": -25.465890884399414, "global_step": 266490, "epoch": 3210} {"train_loss": -25.40087890625, "global_step": 266491, "epoch": 3210} {"train_loss": -25.16562843322754, "global_step": 266492, "epoch": 3210} {"train_loss": -25.3925838470459, "global_step": 266493, "epoch": 3210} {"train_loss": -25.471006393432617, "global_step": 266494, "epoch": 3210} {"train_loss": -25.49532699584961, "global_step": 266495, "epoch": 3210} {"train_loss": -25.29555320739746, "global_step": 266496, "epoch": 3210} {"train_loss": -25.305402755737305, "global_step": 266497, "epoch": 3210} {"train_loss": -25.806659698486328, "global_step": 266498, "epoch": 3210} {"train_loss": -25.383329391479492, "global_step": 266499, "epoch": 3210} {"train_loss": -25.30259132385254, "global_step": 266500, "epoch": 3210} {"train_loss": -25.44890022277832, "global_step": 266501, "epoch": 3210} {"train_loss": -25.561548233032227, "global_step": 266502, "epoch": 3210} {"train_loss": -25.544879913330078, "global_step": 266503, "epoch": 3210} {"train_loss": -25.44260597229004, "global_step": 266504, "epoch": 3210} {"train_loss": -24.922143936157227, "global_step": 266505, "epoch": 3210} {"train_loss": -25.424482345581055, "global_step": 266506, "epoch": 3210} {"train_loss": -24.926557540893555, "global_step": 266507, "epoch": 3210} {"train_loss": -25.162017822265625, "global_step": 266508, "epoch": 3210} {"train_loss": -25.142276763916016, "global_step": 266509, "epoch": 3210} {"train_loss": -25.307897567749023, "global_step": 266510, "epoch": 3210} {"train_loss": -25.354537963867188, "global_step": 266511, "epoch": 3210} {"train_loss": -25.061297612017896, "global_step": 266512, "epoch": 3210, "val_loss": 6907702.0} {"train_loss": -24.841293334960938, "global_step": 266513, "epoch": 3211} {"train_loss": -24.46123695373535, "global_step": 266514, "epoch": 3211} {"train_loss": -23.99736976623535, "global_step": 266515, "epoch": 3211} {"train_loss": -24.805246353149414, "global_step": 266516, "epoch": 3211} {"train_loss": -24.866491317749023, "global_step": 266517, "epoch": 3211} {"train_loss": -24.66121482849121, "global_step": 266518, "epoch": 3211} {"train_loss": -24.624130249023438, "global_step": 266519, "epoch": 3211} {"train_loss": -24.749637603759766, "global_step": 266520, "epoch": 3211} {"train_loss": -25.151607513427734, "global_step": 266521, "epoch": 3211} {"train_loss": -24.964704513549805, "global_step": 266522, "epoch": 3211} {"train_loss": -24.8904972076416, "global_step": 266523, "epoch": 3211} {"train_loss": -24.929370880126953, "global_step": 266524, "epoch": 3211} {"train_loss": -24.723356246948242, "global_step": 266525, "epoch": 3211} {"train_loss": -24.78997230529785, "global_step": 266526, "epoch": 3211} {"train_loss": -24.2637882232666, "global_step": 266527, "epoch": 3211} {"train_loss": -24.719221115112305, "global_step": 266528, "epoch": 3211} {"train_loss": -25.15060806274414, "global_step": 266529, "epoch": 3211} {"train_loss": -25.287973403930664, "global_step": 266530, "epoch": 3211} {"train_loss": -24.945735931396484, "global_step": 266531, "epoch": 3211} {"train_loss": -25.176319122314453, "global_step": 266532, "epoch": 3211} {"train_loss": -24.9456787109375, "global_step": 266533, "epoch": 3211} {"train_loss": -25.328279495239258, "global_step": 266534, "epoch": 3211} {"train_loss": -25.06990623474121, "global_step": 266535, "epoch": 3211} {"train_loss": -25.15253257751465, "global_step": 266536, "epoch": 3211} {"train_loss": -25.016263961791992, "global_step": 266537, "epoch": 3211} {"train_loss": -24.92084312438965, "global_step": 266538, "epoch": 3211} {"train_loss": -25.01301383972168, "global_step": 266539, "epoch": 3211} {"train_loss": -25.386198043823242, "global_step": 266540, "epoch": 3211} {"train_loss": -25.10735511779785, "global_step": 266541, "epoch": 3211} {"train_loss": -25.353256225585938, "global_step": 266542, "epoch": 3211} {"train_loss": -25.18604850769043, "global_step": 266543, "epoch": 3211} {"train_loss": -25.144216537475586, "global_step": 266544, "epoch": 3211} {"train_loss": -25.679723739624023, "global_step": 266545, "epoch": 3211} {"train_loss": -24.73183250427246, "global_step": 266546, "epoch": 3211} {"train_loss": -25.588430404663086, "global_step": 266547, "epoch": 3211} {"train_loss": -25.3399715423584, "global_step": 266548, "epoch": 3211} {"train_loss": -25.157958984375, "global_step": 266549, "epoch": 3211} {"train_loss": -24.826251983642578, "global_step": 266550, "epoch": 3211} {"train_loss": -25.395795822143555, "global_step": 266551, "epoch": 3211} {"train_loss": -25.54941177368164, "global_step": 266552, "epoch": 3211} {"train_loss": -25.25954246520996, "global_step": 266553, "epoch": 3211} {"train_loss": -25.46931266784668, "global_step": 266554, "epoch": 3211} {"train_loss": -25.415510177612305, "global_step": 266555, "epoch": 3211} {"train_loss": -25.293560028076172, "global_step": 266556, "epoch": 3211} {"train_loss": -25.213117599487305, "global_step": 266557, "epoch": 3211} {"train_loss": -25.205839157104492, "global_step": 266558, "epoch": 3211} {"train_loss": -25.720380783081055, "global_step": 266559, "epoch": 3211} {"train_loss": -25.368680953979492, "global_step": 266560, "epoch": 3211} {"train_loss": -25.317829132080078, "global_step": 266561, "epoch": 3211} {"train_loss": -25.538562774658203, "global_step": 266562, "epoch": 3211} {"train_loss": -25.423017501831055, "global_step": 266563, "epoch": 3211} {"train_loss": -25.946752548217773, "global_step": 266564, "epoch": 3211} {"train_loss": -25.244802474975586, "global_step": 266565, "epoch": 3211} {"train_loss": -25.490009307861328, "global_step": 266566, "epoch": 3211} {"train_loss": -25.32143211364746, "global_step": 266567, "epoch": 3211} {"train_loss": -25.145917892456055, "global_step": 266568, "epoch": 3211} {"train_loss": -25.25355339050293, "global_step": 266569, "epoch": 3211} {"train_loss": -25.559879302978516, "global_step": 266570, "epoch": 3211} {"train_loss": -25.487201690673828, "global_step": 266571, "epoch": 3211} {"train_loss": -25.1770076751709, "global_step": 266572, "epoch": 3211} {"train_loss": -25.53002166748047, "global_step": 266573, "epoch": 3211} {"train_loss": -25.664417266845703, "global_step": 266574, "epoch": 3211} {"train_loss": -25.563262939453125, "global_step": 266575, "epoch": 3211} {"train_loss": -25.271804809570312, "global_step": 266576, "epoch": 3211} {"train_loss": -25.300777435302734, "global_step": 266577, "epoch": 3211} {"train_loss": -25.49131202697754, "global_step": 266578, "epoch": 3211} {"train_loss": -25.29747200012207, "global_step": 266579, "epoch": 3211} {"train_loss": -24.937088012695312, "global_step": 266580, "epoch": 3211} {"train_loss": -25.3708438873291, "global_step": 266581, "epoch": 3211} {"train_loss": -25.046966552734375, "global_step": 266582, "epoch": 3211} {"train_loss": -25.03675651550293, "global_step": 266583, "epoch": 3211} {"train_loss": -25.29779624938965, "global_step": 266584, "epoch": 3211} {"train_loss": -25.14324378967285, "global_step": 266585, "epoch": 3211} {"train_loss": -25.253427505493164, "global_step": 266586, "epoch": 3211} {"train_loss": -25.436487197875977, "global_step": 266587, "epoch": 3211} {"train_loss": -25.2974853515625, "global_step": 266588, "epoch": 3211} {"train_loss": -24.94471549987793, "global_step": 266589, "epoch": 3211} {"train_loss": -25.621307373046875, "global_step": 266590, "epoch": 3211} {"train_loss": -25.16795539855957, "global_step": 266591, "epoch": 3211} {"train_loss": -25.592382431030273, "global_step": 266592, "epoch": 3211} {"train_loss": -25.152463912963867, "global_step": 266593, "epoch": 3211} {"train_loss": -25.496686935424805, "global_step": 266594, "epoch": 3211} {"train_loss": -25.180088112153204, "global_step": 266595, "epoch": 3211, "val_loss": 7045628.0} {"train_loss": -24.78737449645996, "global_step": 266596, "epoch": 3212} {"train_loss": -24.645742416381836, "global_step": 266597, "epoch": 3212} {"train_loss": -25.128793716430664, "global_step": 266598, "epoch": 3212} {"train_loss": -25.40395164489746, "global_step": 266599, "epoch": 3212} {"train_loss": -24.936447143554688, "global_step": 266600, "epoch": 3212} {"train_loss": -24.965574264526367, "global_step": 266601, "epoch": 3212} {"train_loss": -25.103879928588867, "global_step": 266602, "epoch": 3212} {"train_loss": -25.470890045166016, "global_step": 266603, "epoch": 3212} {"train_loss": -25.136001586914062, "global_step": 266604, "epoch": 3212} {"train_loss": -25.131549835205078, "global_step": 266605, "epoch": 3212} {"train_loss": -25.42578125, "global_step": 266606, "epoch": 3212} {"train_loss": -24.878549575805664, "global_step": 266607, "epoch": 3212} {"train_loss": -25.165708541870117, "global_step": 266608, "epoch": 3212} {"train_loss": -25.078323364257812, "global_step": 266609, "epoch": 3212} {"train_loss": -25.548093795776367, "global_step": 266610, "epoch": 3212} {"train_loss": -24.67757797241211, "global_step": 266611, "epoch": 3212} {"train_loss": -25.282724380493164, "global_step": 266612, "epoch": 3212} {"train_loss": -25.59956169128418, "global_step": 266613, "epoch": 3212} {"train_loss": -25.2449893951416, "global_step": 266614, "epoch": 3212} {"train_loss": -25.469263076782227, "global_step": 266615, "epoch": 3212} {"train_loss": -25.5250244140625, "global_step": 266616, "epoch": 3212} {"train_loss": -25.3104190826416, "global_step": 266617, "epoch": 3212} {"train_loss": -25.082874298095703, "global_step": 266618, "epoch": 3212} {"train_loss": -25.451021194458008, "global_step": 266619, "epoch": 3212} {"train_loss": -25.322053909301758, "global_step": 266620, "epoch": 3212} {"train_loss": -25.407743453979492, "global_step": 266621, "epoch": 3212} {"train_loss": -25.16588592529297, "global_step": 266622, "epoch": 3212} {"train_loss": -25.382783889770508, "global_step": 266623, "epoch": 3212} {"train_loss": -25.46063804626465, "global_step": 266624, "epoch": 3212} {"train_loss": -25.45069694519043, "global_step": 266625, "epoch": 3212} {"train_loss": -25.294830322265625, "global_step": 266626, "epoch": 3212} {"train_loss": -25.3070011138916, "global_step": 266627, "epoch": 3212} {"train_loss": -25.19477081298828, "global_step": 266628, "epoch": 3212} {"train_loss": -25.30299949645996, "global_step": 266629, "epoch": 3212} {"train_loss": -25.627843856811523, "global_step": 266630, "epoch": 3212} {"train_loss": -25.117664337158203, "global_step": 266631, "epoch": 3212} {"train_loss": -25.77967643737793, "global_step": 266632, "epoch": 3212} {"train_loss": -25.138654708862305, "global_step": 266633, "epoch": 3212} {"train_loss": -25.132930755615234, "global_step": 266634, "epoch": 3212} {"train_loss": -25.531404495239258, "global_step": 266635, "epoch": 3212} {"train_loss": -25.214200973510742, "global_step": 266636, "epoch": 3212} {"train_loss": -25.599138259887695, "global_step": 266637, "epoch": 3212} {"train_loss": -25.11152458190918, "global_step": 266638, "epoch": 3212} {"train_loss": -25.483097076416016, "global_step": 266639, "epoch": 3212} {"train_loss": -25.49300193786621, "global_step": 266640, "epoch": 3212} {"train_loss": -25.320981979370117, "global_step": 266641, "epoch": 3212} {"train_loss": -25.0241756439209, "global_step": 266642, "epoch": 3212} {"train_loss": -25.25186538696289, "global_step": 266643, "epoch": 3212} {"train_loss": -25.415420532226562, "global_step": 266644, "epoch": 3212} {"train_loss": -25.216506958007812, "global_step": 266645, "epoch": 3212} {"train_loss": -25.097192764282227, "global_step": 266646, "epoch": 3212} {"train_loss": -24.887435913085938, "global_step": 266647, "epoch": 3212} {"train_loss": -24.92386817932129, "global_step": 266648, "epoch": 3212} {"train_loss": -23.778223037719727, "global_step": 266649, "epoch": 3212} {"train_loss": -22.24167251586914, "global_step": 266650, "epoch": 3212} {"train_loss": -22.71919822692871, "global_step": 266651, "epoch": 3212} {"train_loss": -24.00567626953125, "global_step": 266652, "epoch": 3212} {"train_loss": -25.019697189331055, "global_step": 266653, "epoch": 3212} {"train_loss": -24.30987548828125, "global_step": 266654, "epoch": 3212} {"train_loss": -24.563404083251953, "global_step": 266655, "epoch": 3212} {"train_loss": -24.604639053344727, "global_step": 266656, "epoch": 3212} {"train_loss": -24.919029235839844, "global_step": 266657, "epoch": 3212} {"train_loss": -24.623687744140625, "global_step": 266658, "epoch": 3212} {"train_loss": -24.59146499633789, "global_step": 266659, "epoch": 3212} {"train_loss": -24.643436431884766, "global_step": 266660, "epoch": 3212} {"train_loss": -24.50124740600586, "global_step": 266661, "epoch": 3212} {"train_loss": -25.233457565307617, "global_step": 266662, "epoch": 3212} {"train_loss": -24.98270606994629, "global_step": 266663, "epoch": 3212} {"train_loss": -24.91710090637207, "global_step": 266664, "epoch": 3212} {"train_loss": -24.986988067626953, "global_step": 266665, "epoch": 3212} {"train_loss": -25.165193557739258, "global_step": 266666, "epoch": 3212} {"train_loss": -24.747934341430664, "global_step": 266667, "epoch": 3212} {"train_loss": -24.584272384643555, "global_step": 266668, "epoch": 3212} {"train_loss": -25.03693962097168, "global_step": 266669, "epoch": 3212} {"train_loss": -25.018064498901367, "global_step": 266670, "epoch": 3212} {"train_loss": -24.959400177001953, "global_step": 266671, "epoch": 3212} {"train_loss": -24.96512794494629, "global_step": 266672, "epoch": 3212} {"train_loss": -25.075178146362305, "global_step": 266673, "epoch": 3212} {"train_loss": -24.740108489990234, "global_step": 266674, "epoch": 3212} {"train_loss": -25.00211524963379, "global_step": 266675, "epoch": 3212} {"train_loss": -25.245832443237305, "global_step": 266676, "epoch": 3212} {"train_loss": -24.746427536010742, "global_step": 266677, "epoch": 3212} {"train_loss": -25.02372732507177, "global_step": 266678, "epoch": 3212, "val_loss": 6968793.0} {"train_loss": -24.644987106323242, "global_step": 266679, "epoch": 3213} {"train_loss": -24.529823303222656, "global_step": 266680, "epoch": 3213} {"train_loss": -24.721721649169922, "global_step": 266681, "epoch": 3213} {"train_loss": -25.400344848632812, "global_step": 266682, "epoch": 3213} {"train_loss": -24.41407585144043, "global_step": 266683, "epoch": 3213} {"train_loss": -24.73423957824707, "global_step": 266684, "epoch": 3213} {"train_loss": -24.66716957092285, "global_step": 266685, "epoch": 3213} {"train_loss": -24.605894088745117, "global_step": 266686, "epoch": 3213} {"train_loss": -25.13274383544922, "global_step": 266687, "epoch": 3213} {"train_loss": -25.020092010498047, "global_step": 266688, "epoch": 3213} {"train_loss": -24.906728744506836, "global_step": 266689, "epoch": 3213} {"train_loss": -25.00264549255371, "global_step": 266690, "epoch": 3213} {"train_loss": -24.892658233642578, "global_step": 266691, "epoch": 3213} {"train_loss": -25.072839736938477, "global_step": 266692, "epoch": 3213} {"train_loss": -25.15274429321289, "global_step": 266693, "epoch": 3213} {"train_loss": -25.254980087280273, "global_step": 266694, "epoch": 3213} {"train_loss": -24.946073532104492, "global_step": 266695, "epoch": 3213} {"train_loss": -25.346256256103516, "global_step": 266696, "epoch": 3213} {"train_loss": -25.126401901245117, "global_step": 266697, "epoch": 3213} {"train_loss": -25.266632080078125, "global_step": 266698, "epoch": 3213} {"train_loss": -24.913400650024414, "global_step": 266699, "epoch": 3213} {"train_loss": -25.342437744140625, "global_step": 266700, "epoch": 3213} {"train_loss": -25.165815353393555, "global_step": 266701, "epoch": 3213} {"train_loss": -25.168987274169922, "global_step": 266702, "epoch": 3213} {"train_loss": -24.5712947845459, "global_step": 266703, "epoch": 3213} {"train_loss": -25.016815185546875, "global_step": 266704, "epoch": 3213} {"train_loss": -25.282133102416992, "global_step": 266705, "epoch": 3213} {"train_loss": -25.089385986328125, "global_step": 266706, "epoch": 3213} {"train_loss": -25.18418312072754, "global_step": 266707, "epoch": 3213} {"train_loss": -25.268949508666992, "global_step": 266708, "epoch": 3213} {"train_loss": -25.127798080444336, "global_step": 266709, "epoch": 3213} {"train_loss": -25.435949325561523, "global_step": 266710, "epoch": 3213} {"train_loss": -25.29096794128418, "global_step": 266711, "epoch": 3213} {"train_loss": -25.14436149597168, "global_step": 266712, "epoch": 3213} {"train_loss": -25.167715072631836, "global_step": 266713, "epoch": 3213} {"train_loss": -25.024160385131836, "global_step": 266714, "epoch": 3213} {"train_loss": -25.086088180541992, "global_step": 266715, "epoch": 3213} {"train_loss": -25.724884033203125, "global_step": 266716, "epoch": 3213} {"train_loss": -24.9531307220459, "global_step": 266717, "epoch": 3213} {"train_loss": -25.488895416259766, "global_step": 266718, "epoch": 3213} {"train_loss": -24.947071075439453, "global_step": 266719, "epoch": 3213} {"train_loss": -24.84062385559082, "global_step": 266720, "epoch": 3213} {"train_loss": -25.201215744018555, "global_step": 266721, "epoch": 3213} {"train_loss": -25.294605255126953, "global_step": 266722, "epoch": 3213} {"train_loss": -25.50129508972168, "global_step": 266723, "epoch": 3213} {"train_loss": -25.800443649291992, "global_step": 266724, "epoch": 3213} {"train_loss": -25.36376953125, "global_step": 266725, "epoch": 3213} {"train_loss": -25.39215660095215, "global_step": 266726, "epoch": 3213} {"train_loss": -25.411436080932617, "global_step": 266727, "epoch": 3213} {"train_loss": -25.421903610229492, "global_step": 266728, "epoch": 3213} {"train_loss": -25.240341186523438, "global_step": 266729, "epoch": 3213} {"train_loss": -25.332815170288086, "global_step": 266730, "epoch": 3213} {"train_loss": -25.269811630249023, "global_step": 266731, "epoch": 3213} {"train_loss": -25.4846248626709, "global_step": 266732, "epoch": 3213} {"train_loss": -25.214025497436523, "global_step": 266733, "epoch": 3213} {"train_loss": -25.6095027923584, "global_step": 266734, "epoch": 3213} {"train_loss": -25.205472946166992, "global_step": 266735, "epoch": 3213} {"train_loss": -25.333581924438477, "global_step": 266736, "epoch": 3213} {"train_loss": -25.034156799316406, "global_step": 266737, "epoch": 3213} {"train_loss": -24.999313354492188, "global_step": 266738, "epoch": 3213} {"train_loss": -25.451059341430664, "global_step": 266739, "epoch": 3213} {"train_loss": -25.43361473083496, "global_step": 266740, "epoch": 3213} {"train_loss": -25.25360107421875, "global_step": 266741, "epoch": 3213} {"train_loss": -25.336294174194336, "global_step": 266742, "epoch": 3213} {"train_loss": -25.277753829956055, "global_step": 266743, "epoch": 3213} {"train_loss": -25.379579544067383, "global_step": 266744, "epoch": 3213} {"train_loss": -25.399906158447266, "global_step": 266745, "epoch": 3213} {"train_loss": -25.45289421081543, "global_step": 266746, "epoch": 3213} {"train_loss": -25.218263626098633, "global_step": 266747, "epoch": 3213} {"train_loss": -24.970670700073242, "global_step": 266748, "epoch": 3213} {"train_loss": -25.1513614654541, "global_step": 266749, "epoch": 3213} {"train_loss": -25.33856773376465, "global_step": 266750, "epoch": 3213} {"train_loss": -25.562299728393555, "global_step": 266751, "epoch": 3213} {"train_loss": -25.09552574157715, "global_step": 266752, "epoch": 3213} {"train_loss": -25.3463191986084, "global_step": 266753, "epoch": 3213} {"train_loss": -25.098962783813477, "global_step": 266754, "epoch": 3213} {"train_loss": -25.627912521362305, "global_step": 266755, "epoch": 3213} {"train_loss": -25.302703857421875, "global_step": 266756, "epoch": 3213} {"train_loss": -25.09030532836914, "global_step": 266757, "epoch": 3213} {"train_loss": -25.065250396728516, "global_step": 266758, "epoch": 3213} {"train_loss": -25.38850975036621, "global_step": 266759, "epoch": 3213} {"train_loss": -25.332944869995117, "global_step": 266760, "epoch": 3213} {"train_loss": -25.176940366446253, "global_step": 266761, "epoch": 3213, "val_loss": 7014516.0} {"train_loss": -22.898099899291992, "global_step": 266762, "epoch": 3214} {"train_loss": -22.391990661621094, "global_step": 266763, "epoch": 3214} {"train_loss": -24.490903854370117, "global_step": 266764, "epoch": 3214} {"train_loss": -24.04743003845215, "global_step": 266765, "epoch": 3214} {"train_loss": -24.412790298461914, "global_step": 266766, "epoch": 3214} {"train_loss": -24.618560791015625, "global_step": 266767, "epoch": 3214} {"train_loss": -24.363330841064453, "global_step": 266768, "epoch": 3214} {"train_loss": -24.492834091186523, "global_step": 266769, "epoch": 3214} {"train_loss": -24.907543182373047, "global_step": 266770, "epoch": 3214} {"train_loss": -24.83575439453125, "global_step": 266771, "epoch": 3214} {"train_loss": -24.532983779907227, "global_step": 266772, "epoch": 3214} {"train_loss": -24.545957565307617, "global_step": 266773, "epoch": 3214} {"train_loss": -24.648950576782227, "global_step": 266774, "epoch": 3214} {"train_loss": -24.625898361206055, "global_step": 266775, "epoch": 3214} {"train_loss": -24.574636459350586, "global_step": 266776, "epoch": 3214} {"train_loss": -24.585500717163086, "global_step": 266777, "epoch": 3214} {"train_loss": -24.82382583618164, "global_step": 266778, "epoch": 3214} {"train_loss": -24.786481857299805, "global_step": 266779, "epoch": 3214} {"train_loss": -24.828571319580078, "global_step": 266780, "epoch": 3214} {"train_loss": -24.846899032592773, "global_step": 266781, "epoch": 3214} {"train_loss": -25.26430320739746, "global_step": 266782, "epoch": 3214} {"train_loss": -25.031494140625, "global_step": 266783, "epoch": 3214} {"train_loss": -25.274656295776367, "global_step": 266784, "epoch": 3214} {"train_loss": -25.003612518310547, "global_step": 266785, "epoch": 3214} {"train_loss": -24.690765380859375, "global_step": 266786, "epoch": 3214} {"train_loss": -25.281522750854492, "global_step": 266787, "epoch": 3214} {"train_loss": -25.17241668701172, "global_step": 266788, "epoch": 3214} {"train_loss": -25.513458251953125, "global_step": 266789, "epoch": 3214} {"train_loss": -25.362995147705078, "global_step": 266790, "epoch": 3214} {"train_loss": -25.160877227783203, "global_step": 266791, "epoch": 3214} {"train_loss": -25.55971336364746, "global_step": 266792, "epoch": 3214} {"train_loss": -25.21510124206543, "global_step": 266793, "epoch": 3214} {"train_loss": -25.268903732299805, "global_step": 266794, "epoch": 3214} {"train_loss": -25.422391891479492, "global_step": 266795, "epoch": 3214} {"train_loss": -25.379987716674805, "global_step": 266796, "epoch": 3214} {"train_loss": -25.28397560119629, "global_step": 266797, "epoch": 3214} {"train_loss": -25.094388961791992, "global_step": 266798, "epoch": 3214} {"train_loss": -25.454843521118164, "global_step": 266799, "epoch": 3214} {"train_loss": -25.40996742248535, "global_step": 266800, "epoch": 3214} {"train_loss": -25.32988739013672, "global_step": 266801, "epoch": 3214} {"train_loss": -25.694355010986328, "global_step": 266802, "epoch": 3214} {"train_loss": -25.40215301513672, "global_step": 266803, "epoch": 3214} {"train_loss": -25.3465518951416, "global_step": 266804, "epoch": 3214} {"train_loss": -25.343612670898438, "global_step": 266805, "epoch": 3214} {"train_loss": -25.35328483581543, "global_step": 266806, "epoch": 3214} {"train_loss": -25.190689086914062, "global_step": 266807, "epoch": 3214} {"train_loss": -25.110153198242188, "global_step": 266808, "epoch": 3214} {"train_loss": -25.212675094604492, "global_step": 266809, "epoch": 3214} {"train_loss": -25.2012996673584, "global_step": 266810, "epoch": 3214} {"train_loss": -25.416107177734375, "global_step": 266811, "epoch": 3214} {"train_loss": -25.421106338500977, "global_step": 266812, "epoch": 3214} {"train_loss": -25.00508689880371, "global_step": 266813, "epoch": 3214} {"train_loss": -25.288990020751953, "global_step": 266814, "epoch": 3214} {"train_loss": -25.31429100036621, "global_step": 266815, "epoch": 3214} {"train_loss": -25.387189865112305, "global_step": 266816, "epoch": 3214} {"train_loss": -25.244836807250977, "global_step": 266817, "epoch": 3214} {"train_loss": -25.227039337158203, "global_step": 266818, "epoch": 3214} {"train_loss": -25.389062881469727, "global_step": 266819, "epoch": 3214} {"train_loss": -24.956247329711914, "global_step": 266820, "epoch": 3214} {"train_loss": -24.56817054748535, "global_step": 266821, "epoch": 3214} {"train_loss": -24.640478134155273, "global_step": 266822, "epoch": 3214} {"train_loss": -24.750648498535156, "global_step": 266823, "epoch": 3214} {"train_loss": -24.870630264282227, "global_step": 266824, "epoch": 3214} {"train_loss": -25.409076690673828, "global_step": 266825, "epoch": 3214} {"train_loss": -24.778364181518555, "global_step": 266826, "epoch": 3214} {"train_loss": -24.879404067993164, "global_step": 266827, "epoch": 3214} {"train_loss": -24.900793075561523, "global_step": 266828, "epoch": 3214} {"train_loss": -25.129079818725586, "global_step": 266829, "epoch": 3214} {"train_loss": -24.92670249938965, "global_step": 266830, "epoch": 3214} {"train_loss": -25.031766891479492, "global_step": 266831, "epoch": 3214} {"train_loss": -25.141103744506836, "global_step": 266832, "epoch": 3214} {"train_loss": -24.984298706054688, "global_step": 266833, "epoch": 3214} {"train_loss": -24.917577743530273, "global_step": 266834, "epoch": 3214} {"train_loss": -24.905668258666992, "global_step": 266835, "epoch": 3214} {"train_loss": -24.911142349243164, "global_step": 266836, "epoch": 3214} {"train_loss": -24.99873924255371, "global_step": 266837, "epoch": 3214} {"train_loss": -24.931936264038086, "global_step": 266838, "epoch": 3214} {"train_loss": -25.307842254638672, "global_step": 266839, "epoch": 3214} {"train_loss": -25.113218307495117, "global_step": 266840, "epoch": 3214} {"train_loss": -24.889768600463867, "global_step": 266841, "epoch": 3214} {"train_loss": -25.292129516601562, "global_step": 266842, "epoch": 3214} {"train_loss": -25.223752975463867, "global_step": 266843, "epoch": 3214} {"train_loss": -25.000429911785815, "global_step": 266844, "epoch": 3214, "val_loss": 6902574.0} {"train_loss": -25.031190872192383, "global_step": 266845, "epoch": 3215} {"train_loss": -24.5883846282959, "global_step": 266846, "epoch": 3215} {"train_loss": -25.273059844970703, "global_step": 266847, "epoch": 3215} {"train_loss": -24.572080612182617, "global_step": 266848, "epoch": 3215} {"train_loss": -24.7218074798584, "global_step": 266849, "epoch": 3215} {"train_loss": -24.50420570373535, "global_step": 266850, "epoch": 3215} {"train_loss": -24.63381004333496, "global_step": 266851, "epoch": 3215} {"train_loss": -24.79023551940918, "global_step": 266852, "epoch": 3215} {"train_loss": -25.529878616333008, "global_step": 266853, "epoch": 3215} {"train_loss": -25.443811416625977, "global_step": 266854, "epoch": 3215} {"train_loss": -25.544343948364258, "global_step": 266855, "epoch": 3215} {"train_loss": -25.04204750061035, "global_step": 266856, "epoch": 3215} {"train_loss": -25.014591217041016, "global_step": 266857, "epoch": 3215} {"train_loss": -25.069496154785156, "global_step": 266858, "epoch": 3215} {"train_loss": -24.994983673095703, "global_step": 266859, "epoch": 3215} {"train_loss": -25.277677536010742, "global_step": 266860, "epoch": 3215} {"train_loss": -25.257272720336914, "global_step": 266861, "epoch": 3215} {"train_loss": -25.19207763671875, "global_step": 266862, "epoch": 3215} {"train_loss": -25.213165283203125, "global_step": 266863, "epoch": 3215} {"train_loss": -25.46669578552246, "global_step": 266864, "epoch": 3215} {"train_loss": -25.089130401611328, "global_step": 266865, "epoch": 3215} {"train_loss": -25.77619743347168, "global_step": 266866, "epoch": 3215} {"train_loss": -25.58601188659668, "global_step": 266867, "epoch": 3215} {"train_loss": -25.02341651916504, "global_step": 266868, "epoch": 3215} {"train_loss": -25.232168197631836, "global_step": 266869, "epoch": 3215} {"train_loss": -25.266515731811523, "global_step": 266870, "epoch": 3215} {"train_loss": -25.091018676757812, "global_step": 266871, "epoch": 3215} {"train_loss": -25.373197555541992, "global_step": 266872, "epoch": 3215} {"train_loss": -25.220413208007812, "global_step": 266873, "epoch": 3215} {"train_loss": -24.580820083618164, "global_step": 266874, "epoch": 3215} {"train_loss": -25.05218505859375, "global_step": 266875, "epoch": 3215} {"train_loss": -24.99769401550293, "global_step": 266876, "epoch": 3215} {"train_loss": -24.94439697265625, "global_step": 266877, "epoch": 3215} {"train_loss": -24.836782455444336, "global_step": 266878, "epoch": 3215} {"train_loss": -25.244434356689453, "global_step": 266879, "epoch": 3215} {"train_loss": -25.037519454956055, "global_step": 266880, "epoch": 3215} {"train_loss": -25.155517578125, "global_step": 266881, "epoch": 3215} {"train_loss": -25.174787521362305, "global_step": 266882, "epoch": 3215} {"train_loss": -25.44908332824707, "global_step": 266883, "epoch": 3215} {"train_loss": -25.178293228149414, "global_step": 266884, "epoch": 3215} {"train_loss": -25.250242233276367, "global_step": 266885, "epoch": 3215} {"train_loss": -25.407337188720703, "global_step": 266886, "epoch": 3215} {"train_loss": -25.0999755859375, "global_step": 266887, "epoch": 3215} {"train_loss": -25.48114585876465, "global_step": 266888, "epoch": 3215} {"train_loss": -25.285860061645508, "global_step": 266889, "epoch": 3215} {"train_loss": -25.18243980407715, "global_step": 266890, "epoch": 3215} {"train_loss": -25.45734405517578, "global_step": 266891, "epoch": 3215} {"train_loss": -25.332015991210938, "global_step": 266892, "epoch": 3215} {"train_loss": -25.529394149780273, "global_step": 266893, "epoch": 3215} {"train_loss": -25.685617446899414, "global_step": 266894, "epoch": 3215} {"train_loss": -25.160593032836914, "global_step": 266895, "epoch": 3215} {"train_loss": -25.241769790649414, "global_step": 266896, "epoch": 3215} {"train_loss": -24.95198631286621, "global_step": 266897, "epoch": 3215} {"train_loss": -25.50180435180664, "global_step": 266898, "epoch": 3215} {"train_loss": -25.448749542236328, "global_step": 266899, "epoch": 3215} {"train_loss": -25.246936798095703, "global_step": 266900, "epoch": 3215} {"train_loss": -24.954933166503906, "global_step": 266901, "epoch": 3215} {"train_loss": -25.379535675048828, "global_step": 266902, "epoch": 3215} {"train_loss": -25.656982421875, "global_step": 266903, "epoch": 3215} {"train_loss": -25.650976181030273, "global_step": 266904, "epoch": 3215} {"train_loss": -25.224889755249023, "global_step": 266905, "epoch": 3215} {"train_loss": -25.54143524169922, "global_step": 266906, "epoch": 3215} {"train_loss": -25.502674102783203, "global_step": 266907, "epoch": 3215} {"train_loss": -25.465505599975586, "global_step": 266908, "epoch": 3215} {"train_loss": -25.282516479492188, "global_step": 266909, "epoch": 3215} {"train_loss": -25.262235641479492, "global_step": 266910, "epoch": 3215} {"train_loss": -25.49702262878418, "global_step": 266911, "epoch": 3215} {"train_loss": -25.486942291259766, "global_step": 266912, "epoch": 3215} {"train_loss": -25.519546508789062, "global_step": 266913, "epoch": 3215} {"train_loss": -25.648706436157227, "global_step": 266914, "epoch": 3215} {"train_loss": -25.356094360351562, "global_step": 266915, "epoch": 3215} {"train_loss": -25.31845474243164, "global_step": 266916, "epoch": 3215} {"train_loss": -25.87664794921875, "global_step": 266917, "epoch": 3215} {"train_loss": -25.313146591186523, "global_step": 266918, "epoch": 3215} {"train_loss": -24.91509437561035, "global_step": 266919, "epoch": 3215} {"train_loss": -25.614410400390625, "global_step": 266920, "epoch": 3215} {"train_loss": -25.358102798461914, "global_step": 266921, "epoch": 3215} {"train_loss": -24.598529815673828, "global_step": 266922, "epoch": 3215} {"train_loss": -25.246017456054688, "global_step": 266923, "epoch": 3215} {"train_loss": -25.261255264282227, "global_step": 266924, "epoch": 3215} {"train_loss": -25.54023551940918, "global_step": 266925, "epoch": 3215} {"train_loss": -25.078908920288086, "global_step": 266926, "epoch": 3215} {"train_loss": -25.239082474306404, "global_step": 266927, "epoch": 3215, "val_loss": 6922887.0} {"train_loss": -25.011999130249023, "global_step": 266928, "epoch": 3216} {"train_loss": -24.900365829467773, "global_step": 266929, "epoch": 3216} {"train_loss": -24.88405418395996, "global_step": 266930, "epoch": 3216} {"train_loss": -24.735971450805664, "global_step": 266931, "epoch": 3216} {"train_loss": -24.885244369506836, "global_step": 266932, "epoch": 3216} {"train_loss": -24.870115280151367, "global_step": 266933, "epoch": 3216} {"train_loss": -24.72773551940918, "global_step": 266934, "epoch": 3216} {"train_loss": -24.8489933013916, "global_step": 266935, "epoch": 3216} {"train_loss": -24.76800537109375, "global_step": 266936, "epoch": 3216} {"train_loss": -24.784048080444336, "global_step": 266937, "epoch": 3216} {"train_loss": -25.001590728759766, "global_step": 266938, "epoch": 3216} {"train_loss": -25.00537109375, "global_step": 266939, "epoch": 3216} {"train_loss": -25.142353057861328, "global_step": 266940, "epoch": 3216} {"train_loss": -25.449073791503906, "global_step": 266941, "epoch": 3216} {"train_loss": -24.958959579467773, "global_step": 266942, "epoch": 3216} {"train_loss": -25.383817672729492, "global_step": 266943, "epoch": 3216} {"train_loss": -25.442642211914062, "global_step": 266944, "epoch": 3216} {"train_loss": -25.274953842163086, "global_step": 266945, "epoch": 3216} {"train_loss": -25.143491744995117, "global_step": 266946, "epoch": 3216} {"train_loss": -25.078237533569336, "global_step": 266947, "epoch": 3216} {"train_loss": -25.145536422729492, "global_step": 266948, "epoch": 3216} {"train_loss": -25.60797119140625, "global_step": 266949, "epoch": 3216} {"train_loss": -25.35801124572754, "global_step": 266950, "epoch": 3216} {"train_loss": -25.393625259399414, "global_step": 266951, "epoch": 3216} {"train_loss": -25.08724594116211, "global_step": 266952, "epoch": 3216} {"train_loss": -25.324613571166992, "global_step": 266953, "epoch": 3216} {"train_loss": -25.30686378479004, "global_step": 266954, "epoch": 3216} {"train_loss": -25.460590362548828, "global_step": 266955, "epoch": 3216} {"train_loss": -25.521320343017578, "global_step": 266956, "epoch": 3216} {"train_loss": -25.094465255737305, "global_step": 266957, "epoch": 3216} {"train_loss": -25.187179565429688, "global_step": 266958, "epoch": 3216} {"train_loss": -25.28653907775879, "global_step": 266959, "epoch": 3216} {"train_loss": -24.954328536987305, "global_step": 266960, "epoch": 3216} {"train_loss": -25.2291316986084, "global_step": 266961, "epoch": 3216} {"train_loss": -25.391334533691406, "global_step": 266962, "epoch": 3216} {"train_loss": -25.12276268005371, "global_step": 266963, "epoch": 3216} {"train_loss": -25.564682006835938, "global_step": 266964, "epoch": 3216} {"train_loss": -25.24142837524414, "global_step": 266965, "epoch": 3216} {"train_loss": -25.1727352142334, "global_step": 266966, "epoch": 3216} {"train_loss": -24.866960525512695, "global_step": 266967, "epoch": 3216} {"train_loss": -25.308002471923828, "global_step": 266968, "epoch": 3216} {"train_loss": -25.226242065429688, "global_step": 266969, "epoch": 3216} {"train_loss": -25.06788444519043, "global_step": 266970, "epoch": 3216} {"train_loss": -25.250391006469727, "global_step": 266971, "epoch": 3216} {"train_loss": -25.602664947509766, "global_step": 266972, "epoch": 3216} {"train_loss": -24.886062622070312, "global_step": 266973, "epoch": 3216} {"train_loss": -25.561939239501953, "global_step": 266974, "epoch": 3216} {"train_loss": -25.70319938659668, "global_step": 266975, "epoch": 3216} {"train_loss": -25.43576431274414, "global_step": 266976, "epoch": 3216} {"train_loss": -25.258176803588867, "global_step": 266977, "epoch": 3216} {"train_loss": -25.52480125427246, "global_step": 266978, "epoch": 3216} {"train_loss": -25.326879501342773, "global_step": 266979, "epoch": 3216} {"train_loss": -25.294830322265625, "global_step": 266980, "epoch": 3216} {"train_loss": -25.072050094604492, "global_step": 266981, "epoch": 3216} {"train_loss": -25.43672752380371, "global_step": 266982, "epoch": 3216} {"train_loss": -24.98599624633789, "global_step": 266983, "epoch": 3216} {"train_loss": -25.74322509765625, "global_step": 266984, "epoch": 3216} {"train_loss": -24.851207733154297, "global_step": 266985, "epoch": 3216} {"train_loss": -24.48969078063965, "global_step": 266986, "epoch": 3216} {"train_loss": -24.513242721557617, "global_step": 266987, "epoch": 3216} {"train_loss": -25.272424697875977, "global_step": 266988, "epoch": 3216} {"train_loss": -25.118968963623047, "global_step": 266989, "epoch": 3216} {"train_loss": -24.77829360961914, "global_step": 266990, "epoch": 3216} {"train_loss": -25.09016227722168, "global_step": 266991, "epoch": 3216} {"train_loss": -25.286245346069336, "global_step": 266992, "epoch": 3216} {"train_loss": -24.69134521484375, "global_step": 266993, "epoch": 3216} {"train_loss": -24.874195098876953, "global_step": 266994, "epoch": 3216} {"train_loss": -25.014596939086914, "global_step": 266995, "epoch": 3216} {"train_loss": -24.800811767578125, "global_step": 266996, "epoch": 3216} {"train_loss": -24.782262802124023, "global_step": 266997, "epoch": 3216} {"train_loss": -24.526601791381836, "global_step": 266998, "epoch": 3216} {"train_loss": -24.995792388916016, "global_step": 266999, "epoch": 3216} {"train_loss": -25.115966796875, "global_step": 267000, "epoch": 3216} {"train_loss": -25.219593048095703, "global_step": 267001, "epoch": 3216} {"train_loss": -24.820308685302734, "global_step": 267002, "epoch": 3216} {"train_loss": -25.13132667541504, "global_step": 267003, "epoch": 3216} {"train_loss": -24.929641723632812, "global_step": 267004, "epoch": 3216} {"train_loss": -25.035053253173828, "global_step": 267005, "epoch": 3216} {"train_loss": -25.527265548706055, "global_step": 267006, "epoch": 3216} {"train_loss": -25.173795700073242, "global_step": 267007, "epoch": 3216} {"train_loss": -25.246225357055664, "global_step": 267008, "epoch": 3216} {"train_loss": -25.056541442871094, "global_step": 267009, "epoch": 3216} {"train_loss": -25.123622388724822, "global_step": 267010, "epoch": 3216, "val_loss": 6988976.5} {"train_loss": -24.6438045501709, "global_step": 267011, "epoch": 3217} {"train_loss": -24.78675079345703, "global_step": 267012, "epoch": 3217} {"train_loss": -24.831979751586914, "global_step": 267013, "epoch": 3217} {"train_loss": -25.133115768432617, "global_step": 267014, "epoch": 3217} {"train_loss": -24.863311767578125, "global_step": 267015, "epoch": 3217} {"train_loss": -25.31488609313965, "global_step": 267016, "epoch": 3217} {"train_loss": -24.931289672851562, "global_step": 267017, "epoch": 3217} {"train_loss": -25.137388229370117, "global_step": 267018, "epoch": 3217} {"train_loss": -24.89869499206543, "global_step": 267019, "epoch": 3217} {"train_loss": -24.990854263305664, "global_step": 267020, "epoch": 3217} {"train_loss": -24.885068893432617, "global_step": 267021, "epoch": 3217} {"train_loss": -25.285541534423828, "global_step": 267022, "epoch": 3217} {"train_loss": -25.197629928588867, "global_step": 267023, "epoch": 3217} {"train_loss": -24.816387176513672, "global_step": 267024, "epoch": 3217} {"train_loss": -25.211109161376953, "global_step": 267025, "epoch": 3217} {"train_loss": -24.89655113220215, "global_step": 267026, "epoch": 3217} {"train_loss": -25.08023452758789, "global_step": 267027, "epoch": 3217} {"train_loss": -24.95359230041504, "global_step": 267028, "epoch": 3217} {"train_loss": -24.972753524780273, "global_step": 267029, "epoch": 3217} {"train_loss": -25.34417724609375, "global_step": 267030, "epoch": 3217} {"train_loss": -25.10768699645996, "global_step": 267031, "epoch": 3217} {"train_loss": -25.340700149536133, "global_step": 267032, "epoch": 3217} {"train_loss": -25.027055740356445, "global_step": 267033, "epoch": 3217} {"train_loss": -25.249706268310547, "global_step": 267034, "epoch": 3217} {"train_loss": -24.988367080688477, "global_step": 267035, "epoch": 3217} {"train_loss": -25.500762939453125, "global_step": 267036, "epoch": 3217} {"train_loss": -25.287277221679688, "global_step": 267037, "epoch": 3217} {"train_loss": -25.106252670288086, "global_step": 267038, "epoch": 3217} {"train_loss": -25.488746643066406, "global_step": 267039, "epoch": 3217} {"train_loss": -25.129419326782227, "global_step": 267040, "epoch": 3217} {"train_loss": -25.418441772460938, "global_step": 267041, "epoch": 3217} {"train_loss": -25.429685592651367, "global_step": 267042, "epoch": 3217} {"train_loss": -25.3075008392334, "global_step": 267043, "epoch": 3217} {"train_loss": -25.433048248291016, "global_step": 267044, "epoch": 3217} {"train_loss": -25.157812118530273, "global_step": 267045, "epoch": 3217} {"train_loss": -25.604440689086914, "global_step": 267046, "epoch": 3217} {"train_loss": -25.279600143432617, "global_step": 267047, "epoch": 3217} {"train_loss": -25.345287322998047, "global_step": 267048, "epoch": 3217} {"train_loss": -25.538724899291992, "global_step": 267049, "epoch": 3217} {"train_loss": -25.28262710571289, "global_step": 267050, "epoch": 3217} {"train_loss": -25.007030487060547, "global_step": 267051, "epoch": 3217} {"train_loss": -25.05758285522461, "global_step": 267052, "epoch": 3217} {"train_loss": -25.175079345703125, "global_step": 267053, "epoch": 3217} {"train_loss": -25.111230850219727, "global_step": 267054, "epoch": 3217} {"train_loss": -25.360700607299805, "global_step": 267055, "epoch": 3217} {"train_loss": -25.330610275268555, "global_step": 267056, "epoch": 3217} {"train_loss": -25.119794845581055, "global_step": 267057, "epoch": 3217} {"train_loss": -24.605669021606445, "global_step": 267058, "epoch": 3217} {"train_loss": -25.289342880249023, "global_step": 267059, "epoch": 3217} {"train_loss": -25.274457931518555, "global_step": 267060, "epoch": 3217} {"train_loss": -25.04336929321289, "global_step": 267061, "epoch": 3217} {"train_loss": -24.942853927612305, "global_step": 267062, "epoch": 3217} {"train_loss": -25.04644775390625, "global_step": 267063, "epoch": 3217} {"train_loss": -25.223047256469727, "global_step": 267064, "epoch": 3217} {"train_loss": -25.30810546875, "global_step": 267065, "epoch": 3217} {"train_loss": -25.520694732666016, "global_step": 267066, "epoch": 3217} {"train_loss": -25.128890991210938, "global_step": 267067, "epoch": 3217} {"train_loss": -25.493144989013672, "global_step": 267068, "epoch": 3217} {"train_loss": -25.575796127319336, "global_step": 267069, "epoch": 3217} {"train_loss": -25.3072566986084, "global_step": 267070, "epoch": 3217} {"train_loss": -24.8388614654541, "global_step": 267071, "epoch": 3217} {"train_loss": -25.035429000854492, "global_step": 267072, "epoch": 3217} {"train_loss": -25.02440643310547, "global_step": 267073, "epoch": 3217} {"train_loss": -25.07034683227539, "global_step": 267074, "epoch": 3217} {"train_loss": -24.87892723083496, "global_step": 267075, "epoch": 3217} {"train_loss": -25.254737854003906, "global_step": 267076, "epoch": 3217} {"train_loss": -24.921993255615234, "global_step": 267077, "epoch": 3217} {"train_loss": -25.02313232421875, "global_step": 267078, "epoch": 3217} {"train_loss": -25.63187026977539, "global_step": 267079, "epoch": 3217} {"train_loss": -25.348745346069336, "global_step": 267080, "epoch": 3217} {"train_loss": -25.089262008666992, "global_step": 267081, "epoch": 3217} {"train_loss": -25.410634994506836, "global_step": 267082, "epoch": 3217} {"train_loss": -25.086868286132812, "global_step": 267083, "epoch": 3217} {"train_loss": -25.53493309020996, "global_step": 267084, "epoch": 3217} {"train_loss": -25.29762840270996, "global_step": 267085, "epoch": 3217} {"train_loss": -25.086740493774414, "global_step": 267086, "epoch": 3217} {"train_loss": -24.970157623291016, "global_step": 267087, "epoch": 3217} {"train_loss": -25.287315368652344, "global_step": 267088, "epoch": 3217} {"train_loss": -24.939058303833008, "global_step": 267089, "epoch": 3217} {"train_loss": -25.277353286743164, "global_step": 267090, "epoch": 3217} {"train_loss": -25.30108070373535, "global_step": 267091, "epoch": 3217} {"train_loss": -25.416584014892578, "global_step": 267092, "epoch": 3217} {"train_loss": -25.163043562188207, "global_step": 267093, "epoch": 3217, "val_loss": 6901896.0} {"train_loss": -24.88457679748535, "global_step": 267094, "epoch": 3218} {"train_loss": -25.009939193725586, "global_step": 267095, "epoch": 3218} {"train_loss": -24.389789581298828, "global_step": 267096, "epoch": 3218} {"train_loss": -25.068191528320312, "global_step": 267097, "epoch": 3218} {"train_loss": -24.738130569458008, "global_step": 267098, "epoch": 3218} {"train_loss": -24.933141708374023, "global_step": 267099, "epoch": 3218} {"train_loss": -24.80201530456543, "global_step": 267100, "epoch": 3218} {"train_loss": -24.739959716796875, "global_step": 267101, "epoch": 3218} {"train_loss": -24.946569442749023, "global_step": 267102, "epoch": 3218} {"train_loss": -24.71826171875, "global_step": 267103, "epoch": 3218} {"train_loss": -25.12691879272461, "global_step": 267104, "epoch": 3218} {"train_loss": -24.972549438476562, "global_step": 267105, "epoch": 3218} {"train_loss": -25.27518081665039, "global_step": 267106, "epoch": 3218} {"train_loss": -24.71491813659668, "global_step": 267107, "epoch": 3218} {"train_loss": -24.717304229736328, "global_step": 267108, "epoch": 3218} {"train_loss": -25.03606605529785, "global_step": 267109, "epoch": 3218} {"train_loss": -24.711191177368164, "global_step": 267110, "epoch": 3218} {"train_loss": -24.960607528686523, "global_step": 267111, "epoch": 3218} {"train_loss": -24.95033836364746, "global_step": 267112, "epoch": 3218} {"train_loss": -25.129730224609375, "global_step": 267113, "epoch": 3218} {"train_loss": -25.1920223236084, "global_step": 267114, "epoch": 3218} {"train_loss": -25.12904167175293, "global_step": 267115, "epoch": 3218} {"train_loss": -25.093229293823242, "global_step": 267116, "epoch": 3218} {"train_loss": -24.967126846313477, "global_step": 267117, "epoch": 3218} {"train_loss": -24.884361267089844, "global_step": 267118, "epoch": 3218} {"train_loss": -25.270612716674805, "global_step": 267119, "epoch": 3218} {"train_loss": -25.51524543762207, "global_step": 267120, "epoch": 3218} {"train_loss": -25.029399871826172, "global_step": 267121, "epoch": 3218} {"train_loss": -24.687992095947266, "global_step": 267122, "epoch": 3218} {"train_loss": -25.51624870300293, "global_step": 267123, "epoch": 3218} {"train_loss": -25.412199020385742, "global_step": 267124, "epoch": 3218} {"train_loss": -25.19618034362793, "global_step": 267125, "epoch": 3218} {"train_loss": -24.91633415222168, "global_step": 267126, "epoch": 3218} {"train_loss": -25.03824234008789, "global_step": 267127, "epoch": 3218} {"train_loss": -25.320722579956055, "global_step": 267128, "epoch": 3218} {"train_loss": -25.366989135742188, "global_step": 267129, "epoch": 3218} {"train_loss": -24.89864158630371, "global_step": 267130, "epoch": 3218} {"train_loss": -25.2154598236084, "global_step": 267131, "epoch": 3218} {"train_loss": -25.17217445373535, "global_step": 267132, "epoch": 3218} {"train_loss": -24.961620330810547, "global_step": 267133, "epoch": 3218} {"train_loss": -25.125669479370117, "global_step": 267134, "epoch": 3218} {"train_loss": -25.353010177612305, "global_step": 267135, "epoch": 3218} {"train_loss": -25.470312118530273, "global_step": 267136, "epoch": 3218} {"train_loss": -24.940078735351562, "global_step": 267137, "epoch": 3218} {"train_loss": -25.54551124572754, "global_step": 267138, "epoch": 3218} {"train_loss": -24.75599479675293, "global_step": 267139, "epoch": 3218} {"train_loss": -25.464614868164062, "global_step": 267140, "epoch": 3218} {"train_loss": -24.99356460571289, "global_step": 267141, "epoch": 3218} {"train_loss": -25.205596923828125, "global_step": 267142, "epoch": 3218} {"train_loss": -24.909765243530273, "global_step": 267143, "epoch": 3218} {"train_loss": -25.34344482421875, "global_step": 267144, "epoch": 3218} {"train_loss": -24.940370559692383, "global_step": 267145, "epoch": 3218} {"train_loss": -25.339065551757812, "global_step": 267146, "epoch": 3218} {"train_loss": -25.1494140625, "global_step": 267147, "epoch": 3218} {"train_loss": -25.584932327270508, "global_step": 267148, "epoch": 3218} {"train_loss": -25.248010635375977, "global_step": 267149, "epoch": 3218} {"train_loss": -25.445180892944336, "global_step": 267150, "epoch": 3218} {"train_loss": -25.655048370361328, "global_step": 267151, "epoch": 3218} {"train_loss": -25.168466567993164, "global_step": 267152, "epoch": 3218} {"train_loss": -25.5308837890625, "global_step": 267153, "epoch": 3218} {"train_loss": -25.59815216064453, "global_step": 267154, "epoch": 3218} {"train_loss": -25.334623336791992, "global_step": 267155, "epoch": 3218} {"train_loss": -25.05695343017578, "global_step": 267156, "epoch": 3218} {"train_loss": -25.57086753845215, "global_step": 267157, "epoch": 3218} {"train_loss": -25.355453491210938, "global_step": 267158, "epoch": 3218} {"train_loss": -25.30698013305664, "global_step": 267159, "epoch": 3218} {"train_loss": -25.20034408569336, "global_step": 267160, "epoch": 3218} {"train_loss": -25.736175537109375, "global_step": 267161, "epoch": 3218} {"train_loss": -25.0057315826416, "global_step": 267162, "epoch": 3218} {"train_loss": -25.287994384765625, "global_step": 267163, "epoch": 3218} {"train_loss": -25.21388053894043, "global_step": 267164, "epoch": 3218} {"train_loss": -25.034475326538086, "global_step": 267165, "epoch": 3218} {"train_loss": -25.019073486328125, "global_step": 267166, "epoch": 3218} {"train_loss": -25.550243377685547, "global_step": 267167, "epoch": 3218} {"train_loss": -24.788055419921875, "global_step": 267168, "epoch": 3218} {"train_loss": -25.039216995239258, "global_step": 267169, "epoch": 3218} {"train_loss": -25.4035701751709, "global_step": 267170, "epoch": 3218} {"train_loss": -25.364105224609375, "global_step": 267171, "epoch": 3218} {"train_loss": -25.042490005493164, "global_step": 267172, "epoch": 3218} {"train_loss": -25.01854133605957, "global_step": 267173, "epoch": 3218} {"train_loss": -25.513349533081055, "global_step": 267174, "epoch": 3218} {"train_loss": -25.27738380432129, "global_step": 267175, "epoch": 3218} {"train_loss": -25.146632941372424, "global_step": 267176, "epoch": 3218, "val_loss": 7001479.0} {"train_loss": -24.259370803833008, "global_step": 267177, "epoch": 3219} {"train_loss": -23.533370971679688, "global_step": 267178, "epoch": 3219} {"train_loss": -24.234460830688477, "global_step": 267179, "epoch": 3219} {"train_loss": -24.082914352416992, "global_step": 267180, "epoch": 3219} {"train_loss": -24.31971549987793, "global_step": 267181, "epoch": 3219} {"train_loss": -24.27252769470215, "global_step": 267182, "epoch": 3219} {"train_loss": -24.34619140625, "global_step": 267183, "epoch": 3219} {"train_loss": -24.268115997314453, "global_step": 267184, "epoch": 3219} {"train_loss": -24.453222274780273, "global_step": 267185, "epoch": 3219} {"train_loss": -24.798574447631836, "global_step": 267186, "epoch": 3219} {"train_loss": -24.556747436523438, "global_step": 267187, "epoch": 3219} {"train_loss": -24.634618759155273, "global_step": 267188, "epoch": 3219} {"train_loss": -24.575658798217773, "global_step": 267189, "epoch": 3219} {"train_loss": -24.74880027770996, "global_step": 267190, "epoch": 3219} {"train_loss": -25.021852493286133, "global_step": 267191, "epoch": 3219} {"train_loss": -24.68723487854004, "global_step": 267192, "epoch": 3219} {"train_loss": -24.885160446166992, "global_step": 267193, "epoch": 3219} {"train_loss": -24.739717483520508, "global_step": 267194, "epoch": 3219} {"train_loss": -24.481689453125, "global_step": 267195, "epoch": 3219} {"train_loss": -24.801013946533203, "global_step": 267196, "epoch": 3219} {"train_loss": -24.902267456054688, "global_step": 267197, "epoch": 3219} {"train_loss": -25.102649688720703, "global_step": 267198, "epoch": 3219} {"train_loss": -25.424373626708984, "global_step": 267199, "epoch": 3219} {"train_loss": -24.545074462890625, "global_step": 267200, "epoch": 3219} {"train_loss": -24.896703720092773, "global_step": 267201, "epoch": 3219} {"train_loss": -25.21708869934082, "global_step": 267202, "epoch": 3219} {"train_loss": -24.977466583251953, "global_step": 267203, "epoch": 3219} {"train_loss": -24.915267944335938, "global_step": 267204, "epoch": 3219} {"train_loss": -24.81214714050293, "global_step": 267205, "epoch": 3219} {"train_loss": -25.206323623657227, "global_step": 267206, "epoch": 3219} {"train_loss": -25.054035186767578, "global_step": 267207, "epoch": 3219} {"train_loss": -24.880443572998047, "global_step": 267208, "epoch": 3219} {"train_loss": -25.230253219604492, "global_step": 267209, "epoch": 3219} {"train_loss": -25.0216007232666, "global_step": 267210, "epoch": 3219} {"train_loss": -24.737850189208984, "global_step": 267211, "epoch": 3219} {"train_loss": -25.34761619567871, "global_step": 267212, "epoch": 3219} {"train_loss": -25.083112716674805, "global_step": 267213, "epoch": 3219} {"train_loss": -25.065570831298828, "global_step": 267214, "epoch": 3219} {"train_loss": -25.4730281829834, "global_step": 267215, "epoch": 3219} {"train_loss": -24.922603607177734, "global_step": 267216, "epoch": 3219} {"train_loss": -25.35829734802246, "global_step": 267217, "epoch": 3219} {"train_loss": -25.243947982788086, "global_step": 267218, "epoch": 3219} {"train_loss": -25.545499801635742, "global_step": 267219, "epoch": 3219} {"train_loss": -25.343738555908203, "global_step": 267220, "epoch": 3219} {"train_loss": -25.200918197631836, "global_step": 267221, "epoch": 3219} {"train_loss": -25.410497665405273, "global_step": 267222, "epoch": 3219} {"train_loss": -25.209537506103516, "global_step": 267223, "epoch": 3219} {"train_loss": -24.905929565429688, "global_step": 267224, "epoch": 3219} {"train_loss": -25.350858688354492, "global_step": 267225, "epoch": 3219} {"train_loss": -24.968503952026367, "global_step": 267226, "epoch": 3219} {"train_loss": -25.09169578552246, "global_step": 267227, "epoch": 3219} {"train_loss": -25.158376693725586, "global_step": 267228, "epoch": 3219} {"train_loss": -25.226520538330078, "global_step": 267229, "epoch": 3219} {"train_loss": -25.13275718688965, "global_step": 267230, "epoch": 3219} {"train_loss": -25.122556686401367, "global_step": 267231, "epoch": 3219} {"train_loss": -25.2989559173584, "global_step": 267232, "epoch": 3219} {"train_loss": -25.470590591430664, "global_step": 267233, "epoch": 3219} {"train_loss": -25.06264305114746, "global_step": 267234, "epoch": 3219} {"train_loss": -25.670495986938477, "global_step": 267235, "epoch": 3219} {"train_loss": -25.312925338745117, "global_step": 267236, "epoch": 3219} {"train_loss": -25.418853759765625, "global_step": 267237, "epoch": 3219} {"train_loss": -25.620176315307617, "global_step": 267238, "epoch": 3219} {"train_loss": -25.44801139831543, "global_step": 267239, "epoch": 3219} {"train_loss": -25.140810012817383, "global_step": 267240, "epoch": 3219} {"train_loss": -25.197717666625977, "global_step": 267241, "epoch": 3219} {"train_loss": -25.286115646362305, "global_step": 267242, "epoch": 3219} {"train_loss": -25.42527198791504, "global_step": 267243, "epoch": 3219} {"train_loss": -25.08860969543457, "global_step": 267244, "epoch": 3219} {"train_loss": -25.35271644592285, "global_step": 267245, "epoch": 3219} {"train_loss": -25.56166648864746, "global_step": 267246, "epoch": 3219} {"train_loss": -25.031103134155273, "global_step": 267247, "epoch": 3219} {"train_loss": -24.78927993774414, "global_step": 267248, "epoch": 3219} {"train_loss": -25.04952049255371, "global_step": 267249, "epoch": 3219} {"train_loss": -25.39257049560547, "global_step": 267250, "epoch": 3219} {"train_loss": -25.18439292907715, "global_step": 267251, "epoch": 3219} {"train_loss": -25.525876998901367, "global_step": 267252, "epoch": 3219} {"train_loss": -25.527647018432617, "global_step": 267253, "epoch": 3219} {"train_loss": -25.50123405456543, "global_step": 267254, "epoch": 3219} {"train_loss": -25.20338249206543, "global_step": 267255, "epoch": 3219} {"train_loss": -25.246816635131836, "global_step": 267256, "epoch": 3219} {"train_loss": -25.415109634399414, "global_step": 267257, "epoch": 3219} {"train_loss": -25.330793380737305, "global_step": 267258, "epoch": 3219} {"train_loss": -25.027606596429663, "global_step": 267259, "epoch": 3219, "val_loss": 6975683.5} {"train_loss": -25.35084342956543, "global_step": 267260, "epoch": 3220} {"train_loss": -25.110252380371094, "global_step": 267261, "epoch": 3220} {"train_loss": -24.749826431274414, "global_step": 267262, "epoch": 3220} {"train_loss": -24.313535690307617, "global_step": 267263, "epoch": 3220} {"train_loss": -24.600969314575195, "global_step": 267264, "epoch": 3220} {"train_loss": -25.109495162963867, "global_step": 267265, "epoch": 3220} {"train_loss": -24.9323787689209, "global_step": 267266, "epoch": 3220} {"train_loss": -25.102550506591797, "global_step": 267267, "epoch": 3220} {"train_loss": -24.797616958618164, "global_step": 267268, "epoch": 3220} {"train_loss": -24.86480140686035, "global_step": 267269, "epoch": 3220} {"train_loss": -25.248525619506836, "global_step": 267270, "epoch": 3220} {"train_loss": -25.20737075805664, "global_step": 267271, "epoch": 3220} {"train_loss": -24.825647354125977, "global_step": 267272, "epoch": 3220} {"train_loss": -25.06033706665039, "global_step": 267273, "epoch": 3220} {"train_loss": -24.797286987304688, "global_step": 267274, "epoch": 3220} {"train_loss": -25.141620635986328, "global_step": 267275, "epoch": 3220} {"train_loss": -25.152587890625, "global_step": 267276, "epoch": 3220} {"train_loss": -25.63811683654785, "global_step": 267277, "epoch": 3220} {"train_loss": -25.234540939331055, "global_step": 267278, "epoch": 3220} {"train_loss": -25.06523323059082, "global_step": 267279, "epoch": 3220} {"train_loss": -25.541547775268555, "global_step": 267280, "epoch": 3220} {"train_loss": -24.981199264526367, "global_step": 267281, "epoch": 3220} {"train_loss": -25.300989151000977, "global_step": 267282, "epoch": 3220} {"train_loss": -25.314958572387695, "global_step": 267283, "epoch": 3220} {"train_loss": -25.527481079101562, "global_step": 267284, "epoch": 3220} {"train_loss": -25.24781608581543, "global_step": 267285, "epoch": 3220} {"train_loss": -25.602033615112305, "global_step": 267286, "epoch": 3220} {"train_loss": -25.20930290222168, "global_step": 267287, "epoch": 3220} {"train_loss": -25.096399307250977, "global_step": 267288, "epoch": 3220} {"train_loss": -25.493146896362305, "global_step": 267289, "epoch": 3220} {"train_loss": -25.262441635131836, "global_step": 267290, "epoch": 3220} {"train_loss": -25.076318740844727, "global_step": 267291, "epoch": 3220} {"train_loss": -25.253307342529297, "global_step": 267292, "epoch": 3220} {"train_loss": -25.6103515625, "global_step": 267293, "epoch": 3220} {"train_loss": -25.025869369506836, "global_step": 267294, "epoch": 3220} {"train_loss": -25.541851043701172, "global_step": 267295, "epoch": 3220} {"train_loss": -25.53986930847168, "global_step": 267296, "epoch": 3220} {"train_loss": -25.41434669494629, "global_step": 267297, "epoch": 3220} {"train_loss": -25.18930435180664, "global_step": 267298, "epoch": 3220} {"train_loss": -25.351346969604492, "global_step": 267299, "epoch": 3220} {"train_loss": -24.886056900024414, "global_step": 267300, "epoch": 3220} {"train_loss": -25.585693359375, "global_step": 267301, "epoch": 3220} {"train_loss": -25.460851669311523, "global_step": 267302, "epoch": 3220} {"train_loss": -25.1912784576416, "global_step": 267303, "epoch": 3220} {"train_loss": -25.41663932800293, "global_step": 267304, "epoch": 3220} {"train_loss": -25.726913452148438, "global_step": 267305, "epoch": 3220} {"train_loss": -25.29230308532715, "global_step": 267306, "epoch": 3220} {"train_loss": -25.126195907592773, "global_step": 267307, "epoch": 3220} {"train_loss": -25.16571617126465, "global_step": 267308, "epoch": 3220} {"train_loss": -25.591535568237305, "global_step": 267309, "epoch": 3220} {"train_loss": -25.232833862304688, "global_step": 267310, "epoch": 3220} {"train_loss": -25.33323860168457, "global_step": 267311, "epoch": 3220} {"train_loss": -25.34406089782715, "global_step": 267312, "epoch": 3220} {"train_loss": -25.186716079711914, "global_step": 267313, "epoch": 3220} {"train_loss": -24.860376358032227, "global_step": 267314, "epoch": 3220} {"train_loss": -25.394609451293945, "global_step": 267315, "epoch": 3220} {"train_loss": -25.490402221679688, "global_step": 267316, "epoch": 3220} {"train_loss": -25.31218719482422, "global_step": 267317, "epoch": 3220} {"train_loss": -25.08694076538086, "global_step": 267318, "epoch": 3220} {"train_loss": -25.2669734954834, "global_step": 267319, "epoch": 3220} {"train_loss": -25.499900817871094, "global_step": 267320, "epoch": 3220} {"train_loss": -24.814678192138672, "global_step": 267321, "epoch": 3220} {"train_loss": -24.92750358581543, "global_step": 267322, "epoch": 3220} {"train_loss": -25.132612228393555, "global_step": 267323, "epoch": 3220} {"train_loss": -24.970291137695312, "global_step": 267324, "epoch": 3220} {"train_loss": -25.41158103942871, "global_step": 267325, "epoch": 3220} {"train_loss": -24.692880630493164, "global_step": 267326, "epoch": 3220} {"train_loss": -25.04579734802246, "global_step": 267327, "epoch": 3220} {"train_loss": -25.313098907470703, "global_step": 267328, "epoch": 3220} {"train_loss": -25.002342224121094, "global_step": 267329, "epoch": 3220} {"train_loss": -25.02985382080078, "global_step": 267330, "epoch": 3220} {"train_loss": -25.08197593688965, "global_step": 267331, "epoch": 3220} {"train_loss": -25.511898040771484, "global_step": 267332, "epoch": 3220} {"train_loss": -25.141756057739258, "global_step": 267333, "epoch": 3220} {"train_loss": -25.43550682067871, "global_step": 267334, "epoch": 3220} {"train_loss": -25.457698822021484, "global_step": 267335, "epoch": 3220} {"train_loss": -25.058330535888672, "global_step": 267336, "epoch": 3220} {"train_loss": -24.983619689941406, "global_step": 267337, "epoch": 3220} {"train_loss": -24.749074935913086, "global_step": 267338, "epoch": 3220} {"train_loss": -25.022192001342773, "global_step": 267339, "epoch": 3220} {"train_loss": -25.346593856811523, "global_step": 267340, "epoch": 3220} {"train_loss": -25.359806060791016, "global_step": 267341, "epoch": 3220} {"train_loss": -25.199886046260236, "global_step": 267342, "epoch": 3220, "val_loss": 6917782.5} {"train_loss": -24.795101165771484, "global_step": 267343, "epoch": 3221} {"train_loss": -24.7512149810791, "global_step": 267344, "epoch": 3221} {"train_loss": -24.9484920501709, "global_step": 267345, "epoch": 3221} {"train_loss": -24.80914878845215, "global_step": 267346, "epoch": 3221} {"train_loss": -24.2952880859375, "global_step": 267347, "epoch": 3221} {"train_loss": -24.4360408782959, "global_step": 267348, "epoch": 3221} {"train_loss": -24.5720272064209, "global_step": 267349, "epoch": 3221} {"train_loss": -24.88347816467285, "global_step": 267350, "epoch": 3221} {"train_loss": -24.920873641967773, "global_step": 267351, "epoch": 3221} {"train_loss": -24.487293243408203, "global_step": 267352, "epoch": 3221} {"train_loss": -24.389270782470703, "global_step": 267353, "epoch": 3221} {"train_loss": -25.016752243041992, "global_step": 267354, "epoch": 3221} {"train_loss": -24.90999984741211, "global_step": 267355, "epoch": 3221} {"train_loss": -25.030902862548828, "global_step": 267356, "epoch": 3221} {"train_loss": -24.97234535217285, "global_step": 267357, "epoch": 3221} {"train_loss": -24.76087760925293, "global_step": 267358, "epoch": 3221} {"train_loss": -25.066877365112305, "global_step": 267359, "epoch": 3221} {"train_loss": -24.71820068359375, "global_step": 267360, "epoch": 3221} {"train_loss": -25.100088119506836, "global_step": 267361, "epoch": 3221} {"train_loss": -25.220121383666992, "global_step": 267362, "epoch": 3221} {"train_loss": -25.11819076538086, "global_step": 267363, "epoch": 3221} {"train_loss": -25.146900177001953, "global_step": 267364, "epoch": 3221} {"train_loss": -25.092370986938477, "global_step": 267365, "epoch": 3221} {"train_loss": -24.88639259338379, "global_step": 267366, "epoch": 3221} {"train_loss": -25.152738571166992, "global_step": 267367, "epoch": 3221} {"train_loss": -24.950332641601562, "global_step": 267368, "epoch": 3221} {"train_loss": -25.292722702026367, "global_step": 267369, "epoch": 3221} {"train_loss": -25.24201011657715, "global_step": 267370, "epoch": 3221} {"train_loss": -25.2095890045166, "global_step": 267371, "epoch": 3221} {"train_loss": -25.36736488342285, "global_step": 267372, "epoch": 3221} {"train_loss": -25.40804100036621, "global_step": 267373, "epoch": 3221} {"train_loss": -25.089338302612305, "global_step": 267374, "epoch": 3221} {"train_loss": -25.17891502380371, "global_step": 267375, "epoch": 3221} {"train_loss": -25.29615592956543, "global_step": 267376, "epoch": 3221} {"train_loss": -25.322004318237305, "global_step": 267377, "epoch": 3221} {"train_loss": -25.442447662353516, "global_step": 267378, "epoch": 3221} {"train_loss": -25.599014282226562, "global_step": 267379, "epoch": 3221} {"train_loss": -25.08900260925293, "global_step": 267380, "epoch": 3221} {"train_loss": -24.95243263244629, "global_step": 267381, "epoch": 3221} {"train_loss": -25.39434242248535, "global_step": 267382, "epoch": 3221} {"train_loss": -25.39387321472168, "global_step": 267383, "epoch": 3221} {"train_loss": -25.44327735900879, "global_step": 267384, "epoch": 3221} {"train_loss": -25.480030059814453, "global_step": 267385, "epoch": 3221} {"train_loss": -25.135652542114258, "global_step": 267386, "epoch": 3221} {"train_loss": -25.435678482055664, "global_step": 267387, "epoch": 3221} {"train_loss": -25.17885971069336, "global_step": 267388, "epoch": 3221} {"train_loss": -25.22258186340332, "global_step": 267389, "epoch": 3221} {"train_loss": -25.597578048706055, "global_step": 267390, "epoch": 3221} {"train_loss": -25.801990509033203, "global_step": 267391, "epoch": 3221} {"train_loss": -25.30193328857422, "global_step": 267392, "epoch": 3221} {"train_loss": -25.37647819519043, "global_step": 267393, "epoch": 3221} {"train_loss": -25.0535945892334, "global_step": 267394, "epoch": 3221} {"train_loss": -25.87742042541504, "global_step": 267395, "epoch": 3221} {"train_loss": -25.306455612182617, "global_step": 267396, "epoch": 3221} {"train_loss": -25.47817039489746, "global_step": 267397, "epoch": 3221} {"train_loss": -25.608861923217773, "global_step": 267398, "epoch": 3221} {"train_loss": -25.24451446533203, "global_step": 267399, "epoch": 3221} {"train_loss": -25.567180633544922, "global_step": 267400, "epoch": 3221} {"train_loss": -25.319013595581055, "global_step": 267401, "epoch": 3221} {"train_loss": -25.33451271057129, "global_step": 267402, "epoch": 3221} {"train_loss": -25.384777069091797, "global_step": 267403, "epoch": 3221} {"train_loss": -25.149396896362305, "global_step": 267404, "epoch": 3221} {"train_loss": -25.481853485107422, "global_step": 267405, "epoch": 3221} {"train_loss": -25.08951759338379, "global_step": 267406, "epoch": 3221} {"train_loss": -25.0922908782959, "global_step": 267407, "epoch": 3221} {"train_loss": -24.759593963623047, "global_step": 267408, "epoch": 3221} {"train_loss": -25.220109939575195, "global_step": 267409, "epoch": 3221} {"train_loss": -25.133529663085938, "global_step": 267410, "epoch": 3221} {"train_loss": -25.005971908569336, "global_step": 267411, "epoch": 3221} {"train_loss": -25.219745635986328, "global_step": 267412, "epoch": 3221} {"train_loss": -25.504878997802734, "global_step": 267413, "epoch": 3221} {"train_loss": -24.640520095825195, "global_step": 267414, "epoch": 3221} {"train_loss": -25.26235580444336, "global_step": 267415, "epoch": 3221} {"train_loss": -25.250621795654297, "global_step": 267416, "epoch": 3221} {"train_loss": -25.262222290039062, "global_step": 267417, "epoch": 3221} {"train_loss": -25.441747665405273, "global_step": 267418, "epoch": 3221} {"train_loss": -25.11582374572754, "global_step": 267419, "epoch": 3221} {"train_loss": -25.10338592529297, "global_step": 267420, "epoch": 3221} {"train_loss": -24.92417335510254, "global_step": 267421, "epoch": 3221} {"train_loss": -25.138025283813477, "global_step": 267422, "epoch": 3221} {"train_loss": -25.341169357299805, "global_step": 267423, "epoch": 3221} {"train_loss": -25.234251022338867, "global_step": 267424, "epoch": 3221} {"train_loss": -25.15950067359281, "global_step": 267425, "epoch": 3221, "val_loss": 6950368.5} {"train_loss": -25.081274032592773, "global_step": 267426, "epoch": 3222} {"train_loss": -25.09346580505371, "global_step": 267427, "epoch": 3222} {"train_loss": -25.30811882019043, "global_step": 267428, "epoch": 3222} {"train_loss": -24.925006866455078, "global_step": 267429, "epoch": 3222} {"train_loss": -25.098527908325195, "global_step": 267430, "epoch": 3222} {"train_loss": -24.669511795043945, "global_step": 267431, "epoch": 3222} {"train_loss": -24.896087646484375, "global_step": 267432, "epoch": 3222} {"train_loss": -25.127607345581055, "global_step": 267433, "epoch": 3222} {"train_loss": -25.38319969177246, "global_step": 267434, "epoch": 3222} {"train_loss": -24.92508316040039, "global_step": 267435, "epoch": 3222} {"train_loss": -25.15985679626465, "global_step": 267436, "epoch": 3222} {"train_loss": -25.104175567626953, "global_step": 267437, "epoch": 3222} {"train_loss": -25.229244232177734, "global_step": 267438, "epoch": 3222} {"train_loss": -24.9655818939209, "global_step": 267439, "epoch": 3222} {"train_loss": -24.975547790527344, "global_step": 267440, "epoch": 3222} {"train_loss": -24.984724044799805, "global_step": 267441, "epoch": 3222} {"train_loss": -25.123159408569336, "global_step": 267442, "epoch": 3222} {"train_loss": -25.436721801757812, "global_step": 267443, "epoch": 3222} {"train_loss": -25.2110652923584, "global_step": 267444, "epoch": 3222} {"train_loss": -25.1527042388916, "global_step": 267445, "epoch": 3222} {"train_loss": -25.406227111816406, "global_step": 267446, "epoch": 3222} {"train_loss": -25.03249168395996, "global_step": 267447, "epoch": 3222} {"train_loss": -25.271146774291992, "global_step": 267448, "epoch": 3222} {"train_loss": -25.128080368041992, "global_step": 267449, "epoch": 3222} {"train_loss": -25.287906646728516, "global_step": 267450, "epoch": 3222} {"train_loss": -25.079233169555664, "global_step": 267451, "epoch": 3222} {"train_loss": -25.6491756439209, "global_step": 267452, "epoch": 3222} {"train_loss": -25.437896728515625, "global_step": 267453, "epoch": 3222} {"train_loss": -25.405332565307617, "global_step": 267454, "epoch": 3222} {"train_loss": -25.12954330444336, "global_step": 267455, "epoch": 3222} {"train_loss": -25.316482543945312, "global_step": 267456, "epoch": 3222} {"train_loss": -25.194095611572266, "global_step": 267457, "epoch": 3222} {"train_loss": -25.40167999267578, "global_step": 267458, "epoch": 3222} {"train_loss": -25.193557739257812, "global_step": 267459, "epoch": 3222} {"train_loss": -25.402446746826172, "global_step": 267460, "epoch": 3222} {"train_loss": -25.48310661315918, "global_step": 267461, "epoch": 3222} {"train_loss": -25.751880645751953, "global_step": 267462, "epoch": 3222} {"train_loss": -25.437824249267578, "global_step": 267463, "epoch": 3222} {"train_loss": -25.729095458984375, "global_step": 267464, "epoch": 3222} {"train_loss": -25.362279891967773, "global_step": 267465, "epoch": 3222} {"train_loss": -25.836538314819336, "global_step": 267466, "epoch": 3222} {"train_loss": -25.35551643371582, "global_step": 267467, "epoch": 3222} {"train_loss": -25.558462142944336, "global_step": 267468, "epoch": 3222} {"train_loss": -25.309114456176758, "global_step": 267469, "epoch": 3222} {"train_loss": -24.8569393157959, "global_step": 267470, "epoch": 3222} {"train_loss": -25.529943466186523, "global_step": 267471, "epoch": 3222} {"train_loss": -25.19684410095215, "global_step": 267472, "epoch": 3222} {"train_loss": -25.133726119995117, "global_step": 267473, "epoch": 3222} {"train_loss": -25.100492477416992, "global_step": 267474, "epoch": 3222} {"train_loss": -24.82537841796875, "global_step": 267475, "epoch": 3222} {"train_loss": -25.51286506652832, "global_step": 267476, "epoch": 3222} {"train_loss": -25.2186336517334, "global_step": 267477, "epoch": 3222} {"train_loss": -25.43454933166504, "global_step": 267478, "epoch": 3222} {"train_loss": -25.095075607299805, "global_step": 267479, "epoch": 3222} {"train_loss": -25.48128318786621, "global_step": 267480, "epoch": 3222} {"train_loss": -25.662433624267578, "global_step": 267481, "epoch": 3222} {"train_loss": -25.198698043823242, "global_step": 267482, "epoch": 3222} {"train_loss": -25.400938034057617, "global_step": 267483, "epoch": 3222} {"train_loss": -25.47138786315918, "global_step": 267484, "epoch": 3222} {"train_loss": -25.103120803833008, "global_step": 267485, "epoch": 3222} {"train_loss": -25.368398666381836, "global_step": 267486, "epoch": 3222} {"train_loss": -25.34078025817871, "global_step": 267487, "epoch": 3222} {"train_loss": -25.133935928344727, "global_step": 267488, "epoch": 3222} {"train_loss": -25.443925857543945, "global_step": 267489, "epoch": 3222} {"train_loss": -25.710153579711914, "global_step": 267490, "epoch": 3222} {"train_loss": -25.63619041442871, "global_step": 267491, "epoch": 3222} {"train_loss": -24.96961784362793, "global_step": 267492, "epoch": 3222} {"train_loss": -25.4202938079834, "global_step": 267493, "epoch": 3222} {"train_loss": -25.559125900268555, "global_step": 267494, "epoch": 3222} {"train_loss": -25.38509178161621, "global_step": 267495, "epoch": 3222} {"train_loss": -25.58257293701172, "global_step": 267496, "epoch": 3222} {"train_loss": -25.455276489257812, "global_step": 267497, "epoch": 3222} {"train_loss": -25.13786506652832, "global_step": 267498, "epoch": 3222} {"train_loss": -25.40371322631836, "global_step": 267499, "epoch": 3222} {"train_loss": -25.164485931396484, "global_step": 267500, "epoch": 3222} {"train_loss": -25.63396644592285, "global_step": 267501, "epoch": 3222} {"train_loss": -25.52188491821289, "global_step": 267502, "epoch": 3222} {"train_loss": -25.283349990844727, "global_step": 267503, "epoch": 3222} {"train_loss": -25.337594985961914, "global_step": 267504, "epoch": 3222} {"train_loss": -25.488489151000977, "global_step": 267505, "epoch": 3222} {"train_loss": -24.863447189331055, "global_step": 267506, "epoch": 3222} {"train_loss": -24.666461944580078, "global_step": 267507, "epoch": 3222} {"train_loss": -25.245108202279333, "global_step": 267508, "epoch": 3222, "val_loss": 6981259.0} {"train_loss": -23.017038345336914, "global_step": 267509, "epoch": 3223} {"train_loss": -23.307796478271484, "global_step": 267510, "epoch": 3223} {"train_loss": -23.8042049407959, "global_step": 267511, "epoch": 3223} {"train_loss": -23.996368408203125, "global_step": 267512, "epoch": 3223} {"train_loss": -23.7021484375, "global_step": 267513, "epoch": 3223} {"train_loss": -24.137577056884766, "global_step": 267514, "epoch": 3223} {"train_loss": -23.934371948242188, "global_step": 267515, "epoch": 3223} {"train_loss": -24.583295822143555, "global_step": 267516, "epoch": 3223} {"train_loss": -24.303211212158203, "global_step": 267517, "epoch": 3223} {"train_loss": -24.148590087890625, "global_step": 267518, "epoch": 3223} {"train_loss": -24.194181442260742, "global_step": 267519, "epoch": 3223} {"train_loss": -24.4942626953125, "global_step": 267520, "epoch": 3223} {"train_loss": -24.31227684020996, "global_step": 267521, "epoch": 3223} {"train_loss": -24.273679733276367, "global_step": 267522, "epoch": 3223} {"train_loss": -24.629364013671875, "global_step": 267523, "epoch": 3223} {"train_loss": -24.992733001708984, "global_step": 267524, "epoch": 3223} {"train_loss": -24.73583984375, "global_step": 267525, "epoch": 3223} {"train_loss": -24.864315032958984, "global_step": 267526, "epoch": 3223} {"train_loss": -24.86554527282715, "global_step": 267527, "epoch": 3223} {"train_loss": -24.59427833557129, "global_step": 267528, "epoch": 3223} {"train_loss": -24.709518432617188, "global_step": 267529, "epoch": 3223} {"train_loss": -24.595590591430664, "global_step": 267530, "epoch": 3223} {"train_loss": -24.779932022094727, "global_step": 267531, "epoch": 3223} {"train_loss": -24.978836059570312, "global_step": 267532, "epoch": 3223} {"train_loss": -25.191862106323242, "global_step": 267533, "epoch": 3223} {"train_loss": -24.9171142578125, "global_step": 267534, "epoch": 3223} {"train_loss": -25.036909103393555, "global_step": 267535, "epoch": 3223} {"train_loss": -24.4833927154541, "global_step": 267536, "epoch": 3223} {"train_loss": -24.909561157226562, "global_step": 267537, "epoch": 3223} {"train_loss": -24.969839096069336, "global_step": 267538, "epoch": 3223} {"train_loss": -25.280935287475586, "global_step": 267539, "epoch": 3223} {"train_loss": -24.95957374572754, "global_step": 267540, "epoch": 3223} {"train_loss": -24.812314987182617, "global_step": 267541, "epoch": 3223} {"train_loss": -24.65389060974121, "global_step": 267542, "epoch": 3223} {"train_loss": -25.093551635742188, "global_step": 267543, "epoch": 3223} {"train_loss": -25.2182559967041, "global_step": 267544, "epoch": 3223} {"train_loss": -25.185062408447266, "global_step": 267545, "epoch": 3223} {"train_loss": -24.85893440246582, "global_step": 267546, "epoch": 3223} {"train_loss": -25.246105194091797, "global_step": 267547, "epoch": 3223} {"train_loss": -25.403095245361328, "global_step": 267548, "epoch": 3223} {"train_loss": -25.508987426757812, "global_step": 267549, "epoch": 3223} {"train_loss": -25.399564743041992, "global_step": 267550, "epoch": 3223} {"train_loss": -25.514657974243164, "global_step": 267551, "epoch": 3223} {"train_loss": -25.139257431030273, "global_step": 267552, "epoch": 3223} {"train_loss": -24.779308319091797, "global_step": 267553, "epoch": 3223} {"train_loss": -25.13821792602539, "global_step": 267554, "epoch": 3223} {"train_loss": -25.364444732666016, "global_step": 267555, "epoch": 3223} {"train_loss": -24.942991256713867, "global_step": 267556, "epoch": 3223} {"train_loss": -24.718557357788086, "global_step": 267557, "epoch": 3223} {"train_loss": -25.073896408081055, "global_step": 267558, "epoch": 3223} {"train_loss": -25.279821395874023, "global_step": 267559, "epoch": 3223} {"train_loss": -24.99349021911621, "global_step": 267560, "epoch": 3223} {"train_loss": -25.31618309020996, "global_step": 267561, "epoch": 3223} {"train_loss": -25.256359100341797, "global_step": 267562, "epoch": 3223} {"train_loss": -25.315467834472656, "global_step": 267563, "epoch": 3223} {"train_loss": -24.79129981994629, "global_step": 267564, "epoch": 3223} {"train_loss": -25.151229858398438, "global_step": 267565, "epoch": 3223} {"train_loss": -25.211050033569336, "global_step": 267566, "epoch": 3223} {"train_loss": -24.74515724182129, "global_step": 267567, "epoch": 3223} {"train_loss": -25.311338424682617, "global_step": 267568, "epoch": 3223} {"train_loss": -25.485797882080078, "global_step": 267569, "epoch": 3223} {"train_loss": -25.113998413085938, "global_step": 267570, "epoch": 3223} {"train_loss": -25.311613082885742, "global_step": 267571, "epoch": 3223} {"train_loss": -25.266210556030273, "global_step": 267572, "epoch": 3223} {"train_loss": -25.44272232055664, "global_step": 267573, "epoch": 3223} {"train_loss": -24.801544189453125, "global_step": 267574, "epoch": 3223} {"train_loss": -25.086889266967773, "global_step": 267575, "epoch": 3223} {"train_loss": -25.004802703857422, "global_step": 267576, "epoch": 3223} {"train_loss": -25.17159080505371, "global_step": 267577, "epoch": 3223} {"train_loss": -25.202743530273438, "global_step": 267578, "epoch": 3223} {"train_loss": -25.216928482055664, "global_step": 267579, "epoch": 3223} {"train_loss": -25.332416534423828, "global_step": 267580, "epoch": 3223} {"train_loss": -25.23647689819336, "global_step": 267581, "epoch": 3223} {"train_loss": -25.277301788330078, "global_step": 267582, "epoch": 3223} {"train_loss": -24.995725631713867, "global_step": 267583, "epoch": 3223} {"train_loss": -25.502260208129883, "global_step": 267584, "epoch": 3223} {"train_loss": -25.19730567932129, "global_step": 267585, "epoch": 3223} {"train_loss": -25.79815673828125, "global_step": 267586, "epoch": 3223} {"train_loss": -25.182527542114258, "global_step": 267587, "epoch": 3223} {"train_loss": -25.108041763305664, "global_step": 267588, "epoch": 3223} {"train_loss": -25.213741302490234, "global_step": 267589, "epoch": 3223} {"train_loss": -25.52153968811035, "global_step": 267590, "epoch": 3223} {"train_loss": -24.891086256647686, "global_step": 267591, "epoch": 3223, "val_loss": 6940798.0} {"train_loss": -24.776418685913086, "global_step": 267592, "epoch": 3224} {"train_loss": -24.994176864624023, "global_step": 267593, "epoch": 3224} {"train_loss": -25.116323471069336, "global_step": 267594, "epoch": 3224} {"train_loss": -24.68263053894043, "global_step": 267595, "epoch": 3224} {"train_loss": -24.24062728881836, "global_step": 267596, "epoch": 3224} {"train_loss": -24.90386390686035, "global_step": 267597, "epoch": 3224} {"train_loss": -24.984838485717773, "global_step": 267598, "epoch": 3224} {"train_loss": -24.781902313232422, "global_step": 267599, "epoch": 3224} {"train_loss": -25.179651260375977, "global_step": 267600, "epoch": 3224} {"train_loss": -25.07015037536621, "global_step": 267601, "epoch": 3224} {"train_loss": -25.141071319580078, "global_step": 267602, "epoch": 3224} {"train_loss": -24.933542251586914, "global_step": 267603, "epoch": 3224} {"train_loss": -25.1114444732666, "global_step": 267604, "epoch": 3224} {"train_loss": -25.254608154296875, "global_step": 267605, "epoch": 3224} {"train_loss": -25.28456687927246, "global_step": 267606, "epoch": 3224} {"train_loss": -25.170730590820312, "global_step": 267607, "epoch": 3224} {"train_loss": -25.145334243774414, "global_step": 267608, "epoch": 3224} {"train_loss": -25.23396873474121, "global_step": 267609, "epoch": 3224} {"train_loss": -24.8992919921875, "global_step": 267610, "epoch": 3224} {"train_loss": -25.485227584838867, "global_step": 267611, "epoch": 3224} {"train_loss": -25.448026657104492, "global_step": 267612, "epoch": 3224} {"train_loss": -24.98333740234375, "global_step": 267613, "epoch": 3224} {"train_loss": -25.476816177368164, "global_step": 267614, "epoch": 3224} {"train_loss": -24.945507049560547, "global_step": 267615, "epoch": 3224} {"train_loss": -25.25465202331543, "global_step": 267616, "epoch": 3224} {"train_loss": -25.463106155395508, "global_step": 267617, "epoch": 3224} {"train_loss": -25.273839950561523, "global_step": 267618, "epoch": 3224} {"train_loss": -24.884164810180664, "global_step": 267619, "epoch": 3224} {"train_loss": -25.663000106811523, "global_step": 267620, "epoch": 3224} {"train_loss": -25.379934310913086, "global_step": 267621, "epoch": 3224} {"train_loss": -25.376693725585938, "global_step": 267622, "epoch": 3224} {"train_loss": -24.851213455200195, "global_step": 267623, "epoch": 3224} {"train_loss": -25.25482749938965, "global_step": 267624, "epoch": 3224} {"train_loss": -25.016002655029297, "global_step": 267625, "epoch": 3224} {"train_loss": -25.526954650878906, "global_step": 267626, "epoch": 3224} {"train_loss": -25.12204933166504, "global_step": 267627, "epoch": 3224} {"train_loss": -24.880495071411133, "global_step": 267628, "epoch": 3224} {"train_loss": -25.58357810974121, "global_step": 267629, "epoch": 3224} {"train_loss": -25.125431060791016, "global_step": 267630, "epoch": 3224} {"train_loss": -25.115537643432617, "global_step": 267631, "epoch": 3224} {"train_loss": -25.2132568359375, "global_step": 267632, "epoch": 3224} {"train_loss": -25.406038284301758, "global_step": 267633, "epoch": 3224} {"train_loss": -25.520240783691406, "global_step": 267634, "epoch": 3224} {"train_loss": -25.32501220703125, "global_step": 267635, "epoch": 3224} {"train_loss": -25.31485939025879, "global_step": 267636, "epoch": 3224} {"train_loss": -25.0338191986084, "global_step": 267637, "epoch": 3224} {"train_loss": -25.04912757873535, "global_step": 267638, "epoch": 3224} {"train_loss": -25.354995727539062, "global_step": 267639, "epoch": 3224} {"train_loss": -25.220449447631836, "global_step": 267640, "epoch": 3224} {"train_loss": -25.368410110473633, "global_step": 267641, "epoch": 3224} {"train_loss": -25.284788131713867, "global_step": 267642, "epoch": 3224} {"train_loss": -25.122495651245117, "global_step": 267643, "epoch": 3224} {"train_loss": -25.518047332763672, "global_step": 267644, "epoch": 3224} {"train_loss": -25.12257957458496, "global_step": 267645, "epoch": 3224} {"train_loss": -24.916311264038086, "global_step": 267646, "epoch": 3224} {"train_loss": -25.13665771484375, "global_step": 267647, "epoch": 3224} {"train_loss": -25.67133903503418, "global_step": 267648, "epoch": 3224} {"train_loss": -25.160444259643555, "global_step": 267649, "epoch": 3224} {"train_loss": -25.187231063842773, "global_step": 267650, "epoch": 3224} {"train_loss": -24.85880470275879, "global_step": 267651, "epoch": 3224} {"train_loss": -25.407583236694336, "global_step": 267652, "epoch": 3224} {"train_loss": -25.168542861938477, "global_step": 267653, "epoch": 3224} {"train_loss": -25.023029327392578, "global_step": 267654, "epoch": 3224} {"train_loss": -25.3453426361084, "global_step": 267655, "epoch": 3224} {"train_loss": -25.328868865966797, "global_step": 267656, "epoch": 3224} {"train_loss": -25.20368194580078, "global_step": 267657, "epoch": 3224} {"train_loss": -25.3514347076416, "global_step": 267658, "epoch": 3224} {"train_loss": -25.480606079101562, "global_step": 267659, "epoch": 3224} {"train_loss": -25.201847076416016, "global_step": 267660, "epoch": 3224} {"train_loss": -25.222686767578125, "global_step": 267661, "epoch": 3224} {"train_loss": -25.312692642211914, "global_step": 267662, "epoch": 3224} {"train_loss": -25.219945907592773, "global_step": 267663, "epoch": 3224} {"train_loss": -25.264089584350586, "global_step": 267664, "epoch": 3224} {"train_loss": -25.244665145874023, "global_step": 267665, "epoch": 3224} {"train_loss": -24.91487693786621, "global_step": 267666, "epoch": 3224} {"train_loss": -25.32320213317871, "global_step": 267667, "epoch": 3224} {"train_loss": -25.049253463745117, "global_step": 267668, "epoch": 3224} {"train_loss": -24.98164176940918, "global_step": 267669, "epoch": 3224} {"train_loss": -25.43577003479004, "global_step": 267670, "epoch": 3224} {"train_loss": -25.08083152770996, "global_step": 267671, "epoch": 3224} {"train_loss": -25.141843795776367, "global_step": 267672, "epoch": 3224} {"train_loss": -25.103086471557617, "global_step": 267673, "epoch": 3224} {"train_loss": -25.177050716905708, "global_step": 267674, "epoch": 3224, "val_loss": 7016662.5} {"train_loss": -24.301088333129883, "global_step": 267675, "epoch": 3225} {"train_loss": -24.254331588745117, "global_step": 267676, "epoch": 3225} {"train_loss": -24.081018447875977, "global_step": 267677, "epoch": 3225} {"train_loss": -24.876144409179688, "global_step": 267678, "epoch": 3225} {"train_loss": -24.493555068969727, "global_step": 267679, "epoch": 3225} {"train_loss": -24.812463760375977, "global_step": 267680, "epoch": 3225} {"train_loss": -24.96317481994629, "global_step": 267681, "epoch": 3225} {"train_loss": -24.7235107421875, "global_step": 267682, "epoch": 3225} {"train_loss": -24.98380470275879, "global_step": 267683, "epoch": 3225} {"train_loss": -24.751752853393555, "global_step": 267684, "epoch": 3225} {"train_loss": -24.759307861328125, "global_step": 267685, "epoch": 3225} {"train_loss": -24.833051681518555, "global_step": 267686, "epoch": 3225} {"train_loss": -25.145986557006836, "global_step": 267687, "epoch": 3225} {"train_loss": -25.269790649414062, "global_step": 267688, "epoch": 3225} {"train_loss": -25.168325424194336, "global_step": 267689, "epoch": 3225} {"train_loss": -24.9482421875, "global_step": 267690, "epoch": 3225} {"train_loss": -24.74472999572754, "global_step": 267691, "epoch": 3225} {"train_loss": -25.511520385742188, "global_step": 267692, "epoch": 3225} {"train_loss": -25.27935028076172, "global_step": 267693, "epoch": 3225} {"train_loss": -25.23534393310547, "global_step": 267694, "epoch": 3225} {"train_loss": -25.00629997253418, "global_step": 267695, "epoch": 3225} {"train_loss": -25.231863021850586, "global_step": 267696, "epoch": 3225} {"train_loss": -25.529949188232422, "global_step": 267697, "epoch": 3225} {"train_loss": -25.347440719604492, "global_step": 267698, "epoch": 3225} {"train_loss": -25.20194435119629, "global_step": 267699, "epoch": 3225} {"train_loss": -25.163190841674805, "global_step": 267700, "epoch": 3225} {"train_loss": -25.24311065673828, "global_step": 267701, "epoch": 3225} {"train_loss": -25.265167236328125, "global_step": 267702, "epoch": 3225} {"train_loss": -25.467100143432617, "global_step": 267703, "epoch": 3225} {"train_loss": -25.156265258789062, "global_step": 267704, "epoch": 3225} {"train_loss": -25.151498794555664, "global_step": 267705, "epoch": 3225} {"train_loss": -25.13840675354004, "global_step": 267706, "epoch": 3225} {"train_loss": -25.134902954101562, "global_step": 267707, "epoch": 3225} {"train_loss": -24.999801635742188, "global_step": 267708, "epoch": 3225} {"train_loss": -25.001495361328125, "global_step": 267709, "epoch": 3225} {"train_loss": -25.476587295532227, "global_step": 267710, "epoch": 3225} {"train_loss": -25.329166412353516, "global_step": 267711, "epoch": 3225} {"train_loss": -25.70350456237793, "global_step": 267712, "epoch": 3225} {"train_loss": -25.099393844604492, "global_step": 267713, "epoch": 3225} {"train_loss": -25.455381393432617, "global_step": 267714, "epoch": 3225} {"train_loss": -25.59693717956543, "global_step": 267715, "epoch": 3225} {"train_loss": -25.410104751586914, "global_step": 267716, "epoch": 3225} {"train_loss": -25.337909698486328, "global_step": 267717, "epoch": 3225} {"train_loss": -25.517887115478516, "global_step": 267718, "epoch": 3225} {"train_loss": -25.720605850219727, "global_step": 267719, "epoch": 3225} {"train_loss": -25.713031768798828, "global_step": 267720, "epoch": 3225} {"train_loss": -25.64877700805664, "global_step": 267721, "epoch": 3225} {"train_loss": -25.267562866210938, "global_step": 267722, "epoch": 3225} {"train_loss": -25.30073356628418, "global_step": 267723, "epoch": 3225} {"train_loss": -25.541568756103516, "global_step": 267724, "epoch": 3225} {"train_loss": -25.285064697265625, "global_step": 267725, "epoch": 3225} {"train_loss": -24.795087814331055, "global_step": 267726, "epoch": 3225} {"train_loss": -25.048620223999023, "global_step": 267727, "epoch": 3225} {"train_loss": -24.71310806274414, "global_step": 267728, "epoch": 3225} {"train_loss": -24.686742782592773, "global_step": 267729, "epoch": 3225} {"train_loss": -24.869266510009766, "global_step": 267730, "epoch": 3225} {"train_loss": -25.054935455322266, "global_step": 267731, "epoch": 3225} {"train_loss": -25.09588050842285, "global_step": 267732, "epoch": 3225} {"train_loss": -25.01128578186035, "global_step": 267733, "epoch": 3225} {"train_loss": -25.195192337036133, "global_step": 267734, "epoch": 3225} {"train_loss": -25.110410690307617, "global_step": 267735, "epoch": 3225} {"train_loss": -24.409910202026367, "global_step": 267736, "epoch": 3225} {"train_loss": -24.22450828552246, "global_step": 267737, "epoch": 3225} {"train_loss": -24.258699417114258, "global_step": 267738, "epoch": 3225} {"train_loss": -25.129133224487305, "global_step": 267739, "epoch": 3225} {"train_loss": -24.907062530517578, "global_step": 267740, "epoch": 3225} {"train_loss": -25.54011344909668, "global_step": 267741, "epoch": 3225} {"train_loss": -24.614118576049805, "global_step": 267742, "epoch": 3225} {"train_loss": -25.680221557617188, "global_step": 267743, "epoch": 3225} {"train_loss": -24.629547119140625, "global_step": 267744, "epoch": 3225} {"train_loss": -25.03960609436035, "global_step": 267745, "epoch": 3225} {"train_loss": -24.94296646118164, "global_step": 267746, "epoch": 3225} {"train_loss": -24.861127853393555, "global_step": 267747, "epoch": 3225} {"train_loss": -24.733474731445312, "global_step": 267748, "epoch": 3225} {"train_loss": -25.060035705566406, "global_step": 267749, "epoch": 3225} {"train_loss": -25.1796875, "global_step": 267750, "epoch": 3225} {"train_loss": -24.71297264099121, "global_step": 267751, "epoch": 3225} {"train_loss": -25.153738021850586, "global_step": 267752, "epoch": 3225} {"train_loss": -24.934114456176758, "global_step": 267753, "epoch": 3225} {"train_loss": -25.361797332763672, "global_step": 267754, "epoch": 3225} {"train_loss": -24.9799861907959, "global_step": 267755, "epoch": 3225} {"train_loss": -25.10580825805664, "global_step": 267756, "epoch": 3225} {"train_loss": -25.079556177897626, "global_step": 267757, "epoch": 3225, "val_loss": 7073639.0} {"train_loss": -25.01535987854004, "global_step": 267758, "epoch": 3226} {"train_loss": -25.128849029541016, "global_step": 267759, "epoch": 3226} {"train_loss": -24.99605369567871, "global_step": 267760, "epoch": 3226} {"train_loss": -24.90735626220703, "global_step": 267761, "epoch": 3226} {"train_loss": -24.961755752563477, "global_step": 267762, "epoch": 3226} {"train_loss": -25.063806533813477, "global_step": 267763, "epoch": 3226} {"train_loss": -25.010540008544922, "global_step": 267764, "epoch": 3226} {"train_loss": -25.711029052734375, "global_step": 267765, "epoch": 3226} {"train_loss": -25.251710891723633, "global_step": 267766, "epoch": 3226} {"train_loss": -24.920116424560547, "global_step": 267767, "epoch": 3226} {"train_loss": -25.35981559753418, "global_step": 267768, "epoch": 3226} {"train_loss": -24.986103057861328, "global_step": 267769, "epoch": 3226} {"train_loss": -25.154346466064453, "global_step": 267770, "epoch": 3226} {"train_loss": -25.49481773376465, "global_step": 267771, "epoch": 3226} {"train_loss": -25.340057373046875, "global_step": 267772, "epoch": 3226} {"train_loss": -25.311185836791992, "global_step": 267773, "epoch": 3226} {"train_loss": -25.261817932128906, "global_step": 267774, "epoch": 3226} {"train_loss": -25.510848999023438, "global_step": 267775, "epoch": 3226} {"train_loss": -25.318172454833984, "global_step": 267776, "epoch": 3226} {"train_loss": -24.881092071533203, "global_step": 267777, "epoch": 3226} {"train_loss": -25.473648071289062, "global_step": 267778, "epoch": 3226} {"train_loss": -25.22984504699707, "global_step": 267779, "epoch": 3226} {"train_loss": -24.780582427978516, "global_step": 267780, "epoch": 3226} {"train_loss": -25.639862060546875, "global_step": 267781, "epoch": 3226} {"train_loss": -25.35443115234375, "global_step": 267782, "epoch": 3226} {"train_loss": -25.623193740844727, "global_step": 267783, "epoch": 3226} {"train_loss": -25.32122802734375, "global_step": 267784, "epoch": 3226} {"train_loss": -25.06650161743164, "global_step": 267785, "epoch": 3226} {"train_loss": -25.31388282775879, "global_step": 267786, "epoch": 3226} {"train_loss": -25.086509704589844, "global_step": 267787, "epoch": 3226} {"train_loss": -25.348190307617188, "global_step": 267788, "epoch": 3226} {"train_loss": -25.172086715698242, "global_step": 267789, "epoch": 3226} {"train_loss": -25.116315841674805, "global_step": 267790, "epoch": 3226} {"train_loss": -24.910442352294922, "global_step": 267791, "epoch": 3226} {"train_loss": -25.325437545776367, "global_step": 267792, "epoch": 3226} {"train_loss": -25.4267578125, "global_step": 267793, "epoch": 3226} {"train_loss": -25.239913940429688, "global_step": 267794, "epoch": 3226} {"train_loss": -25.25581932067871, "global_step": 267795, "epoch": 3226} {"train_loss": -25.0172061920166, "global_step": 267796, "epoch": 3226} {"train_loss": -24.954002380371094, "global_step": 267797, "epoch": 3226} {"train_loss": -25.560001373291016, "global_step": 267798, "epoch": 3226} {"train_loss": -25.453596115112305, "global_step": 267799, "epoch": 3226} {"train_loss": -25.606412887573242, "global_step": 267800, "epoch": 3226} {"train_loss": -25.562145233154297, "global_step": 267801, "epoch": 3226} {"train_loss": -25.3861026763916, "global_step": 267802, "epoch": 3226} {"train_loss": -25.367475509643555, "global_step": 267803, "epoch": 3226} {"train_loss": -25.37457847595215, "global_step": 267804, "epoch": 3226} {"train_loss": -25.41402244567871, "global_step": 267805, "epoch": 3226} {"train_loss": -25.66493797302246, "global_step": 267806, "epoch": 3226} {"train_loss": -25.138202667236328, "global_step": 267807, "epoch": 3226} {"train_loss": -25.209335327148438, "global_step": 267808, "epoch": 3226} {"train_loss": -24.946115493774414, "global_step": 267809, "epoch": 3226} {"train_loss": -25.04864501953125, "global_step": 267810, "epoch": 3226} {"train_loss": -24.91059684753418, "global_step": 267811, "epoch": 3226} {"train_loss": -25.119600296020508, "global_step": 267812, "epoch": 3226} {"train_loss": -25.36409568786621, "global_step": 267813, "epoch": 3226} {"train_loss": -25.06427001953125, "global_step": 267814, "epoch": 3226} {"train_loss": -25.498563766479492, "global_step": 267815, "epoch": 3226} {"train_loss": -25.164457321166992, "global_step": 267816, "epoch": 3226} {"train_loss": -25.131423950195312, "global_step": 267817, "epoch": 3226} {"train_loss": -25.363779067993164, "global_step": 267818, "epoch": 3226} {"train_loss": -25.126869201660156, "global_step": 267819, "epoch": 3226} {"train_loss": -24.911741256713867, "global_step": 267820, "epoch": 3226} {"train_loss": -25.48795509338379, "global_step": 267821, "epoch": 3226} {"train_loss": -25.860761642456055, "global_step": 267822, "epoch": 3226} {"train_loss": -25.104026794433594, "global_step": 267823, "epoch": 3226} {"train_loss": -25.180002212524414, "global_step": 267824, "epoch": 3226} {"train_loss": -25.319229125976562, "global_step": 267825, "epoch": 3226} {"train_loss": -25.032941818237305, "global_step": 267826, "epoch": 3226} {"train_loss": -25.208669662475586, "global_step": 267827, "epoch": 3226} {"train_loss": -25.185623168945312, "global_step": 267828, "epoch": 3226} {"train_loss": -25.275930404663086, "global_step": 267829, "epoch": 3226} {"train_loss": -25.031478881835938, "global_step": 267830, "epoch": 3226} {"train_loss": -25.14618492126465, "global_step": 267831, "epoch": 3226} {"train_loss": -25.519943237304688, "global_step": 267832, "epoch": 3226} {"train_loss": -25.15525245666504, "global_step": 267833, "epoch": 3226} {"train_loss": -25.486663818359375, "global_step": 267834, "epoch": 3226} {"train_loss": -25.123071670532227, "global_step": 267835, "epoch": 3226} {"train_loss": -24.88414192199707, "global_step": 267836, "epoch": 3226} {"train_loss": -25.14447784423828, "global_step": 267837, "epoch": 3226} {"train_loss": -24.988292694091797, "global_step": 267838, "epoch": 3226} {"train_loss": -25.006010055541992, "global_step": 267839, "epoch": 3226} {"train_loss": -25.25469740902085, "global_step": 267840, "epoch": 3226, "val_loss": 7050674.5} {"train_loss": -23.906829833984375, "global_step": 267841, "epoch": 3227} {"train_loss": -24.40750503540039, "global_step": 267842, "epoch": 3227} {"train_loss": -24.396976470947266, "global_step": 267843, "epoch": 3227} {"train_loss": -24.763254165649414, "global_step": 267844, "epoch": 3227} {"train_loss": -24.592151641845703, "global_step": 267845, "epoch": 3227} {"train_loss": -24.523902893066406, "global_step": 267846, "epoch": 3227} {"train_loss": -25.01609230041504, "global_step": 267847, "epoch": 3227} {"train_loss": -24.859634399414062, "global_step": 267848, "epoch": 3227} {"train_loss": -24.939231872558594, "global_step": 267849, "epoch": 3227} {"train_loss": -24.7867374420166, "global_step": 267850, "epoch": 3227} {"train_loss": -24.70924949645996, "global_step": 267851, "epoch": 3227} {"train_loss": -24.774627685546875, "global_step": 267852, "epoch": 3227} {"train_loss": -24.57545280456543, "global_step": 267853, "epoch": 3227} {"train_loss": -24.53877830505371, "global_step": 267854, "epoch": 3227} {"train_loss": -25.135507583618164, "global_step": 267855, "epoch": 3227} {"train_loss": -24.80573081970215, "global_step": 267856, "epoch": 3227} {"train_loss": -25.080673217773438, "global_step": 267857, "epoch": 3227} {"train_loss": -24.848102569580078, "global_step": 267858, "epoch": 3227} {"train_loss": -24.662433624267578, "global_step": 267859, "epoch": 3227} {"train_loss": -25.258298873901367, "global_step": 267860, "epoch": 3227} {"train_loss": -24.93882942199707, "global_step": 267861, "epoch": 3227} {"train_loss": -24.886810302734375, "global_step": 267862, "epoch": 3227} {"train_loss": -25.1027889251709, "global_step": 267863, "epoch": 3227} {"train_loss": -25.07257652282715, "global_step": 267864, "epoch": 3227} {"train_loss": -25.249271392822266, "global_step": 267865, "epoch": 3227} {"train_loss": -24.990829467773438, "global_step": 267866, "epoch": 3227} {"train_loss": -24.849899291992188, "global_step": 267867, "epoch": 3227} {"train_loss": -25.444181442260742, "global_step": 267868, "epoch": 3227} {"train_loss": -25.03719711303711, "global_step": 267869, "epoch": 3227} {"train_loss": -25.14191436767578, "global_step": 267870, "epoch": 3227} {"train_loss": -25.42032241821289, "global_step": 267871, "epoch": 3227} {"train_loss": -25.09820556640625, "global_step": 267872, "epoch": 3227} {"train_loss": -25.174367904663086, "global_step": 267873, "epoch": 3227} {"train_loss": -25.087726593017578, "global_step": 267874, "epoch": 3227} {"train_loss": -25.24800682067871, "global_step": 267875, "epoch": 3227} {"train_loss": -25.29359245300293, "global_step": 267876, "epoch": 3227} {"train_loss": -25.093387603759766, "global_step": 267877, "epoch": 3227} {"train_loss": -25.188434600830078, "global_step": 267878, "epoch": 3227} {"train_loss": -24.740720748901367, "global_step": 267879, "epoch": 3227} {"train_loss": -25.599584579467773, "global_step": 267880, "epoch": 3227} {"train_loss": -24.976932525634766, "global_step": 267881, "epoch": 3227} {"train_loss": -25.44207763671875, "global_step": 267882, "epoch": 3227} {"train_loss": -25.540639877319336, "global_step": 267883, "epoch": 3227} {"train_loss": -25.56605339050293, "global_step": 267884, "epoch": 3227} {"train_loss": -25.76508903503418, "global_step": 267885, "epoch": 3227} {"train_loss": -25.071643829345703, "global_step": 267886, "epoch": 3227} {"train_loss": -25.494892120361328, "global_step": 267887, "epoch": 3227} {"train_loss": -25.608230590820312, "global_step": 267888, "epoch": 3227} {"train_loss": -25.123937606811523, "global_step": 267889, "epoch": 3227} {"train_loss": -24.94705581665039, "global_step": 267890, "epoch": 3227} {"train_loss": -25.57758331298828, "global_step": 267891, "epoch": 3227} {"train_loss": -25.489192962646484, "global_step": 267892, "epoch": 3227} {"train_loss": -25.614837646484375, "global_step": 267893, "epoch": 3227} {"train_loss": -25.342004776000977, "global_step": 267894, "epoch": 3227} {"train_loss": -24.967260360717773, "global_step": 267895, "epoch": 3227} {"train_loss": -25.412832260131836, "global_step": 267896, "epoch": 3227} {"train_loss": -25.285419464111328, "global_step": 267897, "epoch": 3227} {"train_loss": -25.353818893432617, "global_step": 267898, "epoch": 3227} {"train_loss": -25.12725067138672, "global_step": 267899, "epoch": 3227} {"train_loss": -25.23155975341797, "global_step": 267900, "epoch": 3227} {"train_loss": -25.238706588745117, "global_step": 267901, "epoch": 3227} {"train_loss": -25.27897071838379, "global_step": 267902, "epoch": 3227} {"train_loss": -25.077314376831055, "global_step": 267903, "epoch": 3227} {"train_loss": -25.573352813720703, "global_step": 267904, "epoch": 3227} {"train_loss": -25.191787719726562, "global_step": 267905, "epoch": 3227} {"train_loss": -25.278886795043945, "global_step": 267906, "epoch": 3227} {"train_loss": -25.015533447265625, "global_step": 267907, "epoch": 3227} {"train_loss": -25.27488136291504, "global_step": 267908, "epoch": 3227} {"train_loss": -25.515331268310547, "global_step": 267909, "epoch": 3227} {"train_loss": -25.259258270263672, "global_step": 267910, "epoch": 3227} {"train_loss": -25.096460342407227, "global_step": 267911, "epoch": 3227} {"train_loss": -25.15096092224121, "global_step": 267912, "epoch": 3227} {"train_loss": -25.28434181213379, "global_step": 267913, "epoch": 3227} {"train_loss": -25.505523681640625, "global_step": 267914, "epoch": 3227} {"train_loss": -25.26107406616211, "global_step": 267915, "epoch": 3227} {"train_loss": -24.819198608398438, "global_step": 267916, "epoch": 3227} {"train_loss": -25.23306655883789, "global_step": 267917, "epoch": 3227} {"train_loss": -25.111858367919922, "global_step": 267918, "epoch": 3227} {"train_loss": -25.645233154296875, "global_step": 267919, "epoch": 3227} {"train_loss": -25.439054489135742, "global_step": 267920, "epoch": 3227} {"train_loss": -25.976179122924805, "global_step": 267921, "epoch": 3227} {"train_loss": -25.4625244140625, "global_step": 267922, "epoch": 3227} {"train_loss": -25.12517761322389, "global_step": 267923, "epoch": 3227, "val_loss": 6967282.0} {"train_loss": -24.13556480407715, "global_step": 267924, "epoch": 3228} {"train_loss": -24.699405670166016, "global_step": 267925, "epoch": 3228} {"train_loss": -24.425878524780273, "global_step": 267926, "epoch": 3228} {"train_loss": -23.779590606689453, "global_step": 267927, "epoch": 3228} {"train_loss": -24.623727798461914, "global_step": 267928, "epoch": 3228} {"train_loss": -24.47230339050293, "global_step": 267929, "epoch": 3228} {"train_loss": -24.611757278442383, "global_step": 267930, "epoch": 3228} {"train_loss": -24.654142379760742, "global_step": 267931, "epoch": 3228} {"train_loss": -25.055112838745117, "global_step": 267932, "epoch": 3228} {"train_loss": -24.645519256591797, "global_step": 267933, "epoch": 3228} {"train_loss": -25.107540130615234, "global_step": 267934, "epoch": 3228} {"train_loss": -24.888059616088867, "global_step": 267935, "epoch": 3228} {"train_loss": -24.6143798828125, "global_step": 267936, "epoch": 3228} {"train_loss": -24.735706329345703, "global_step": 267937, "epoch": 3228} {"train_loss": -24.776559829711914, "global_step": 267938, "epoch": 3228} {"train_loss": -24.79060935974121, "global_step": 267939, "epoch": 3228} {"train_loss": -24.929500579833984, "global_step": 267940, "epoch": 3228} {"train_loss": -24.67597007751465, "global_step": 267941, "epoch": 3228} {"train_loss": -24.81878662109375, "global_step": 267942, "epoch": 3228} {"train_loss": -25.110151290893555, "global_step": 267943, "epoch": 3228} {"train_loss": -25.072134017944336, "global_step": 267944, "epoch": 3228} {"train_loss": -24.928442001342773, "global_step": 267945, "epoch": 3228} {"train_loss": -24.65943717956543, "global_step": 267946, "epoch": 3228} {"train_loss": -25.10219383239746, "global_step": 267947, "epoch": 3228} {"train_loss": -24.89130401611328, "global_step": 267948, "epoch": 3228} {"train_loss": -24.488718032836914, "global_step": 267949, "epoch": 3228} {"train_loss": -24.590389251708984, "global_step": 267950, "epoch": 3228} {"train_loss": -25.03835105895996, "global_step": 267951, "epoch": 3228} {"train_loss": -24.731943130493164, "global_step": 267952, "epoch": 3228} {"train_loss": -25.344053268432617, "global_step": 267953, "epoch": 3228} {"train_loss": -25.522581100463867, "global_step": 267954, "epoch": 3228} {"train_loss": -24.88739776611328, "global_step": 267955, "epoch": 3228} {"train_loss": -25.220062255859375, "global_step": 267956, "epoch": 3228} {"train_loss": -25.121702194213867, "global_step": 267957, "epoch": 3228} {"train_loss": -24.944019317626953, "global_step": 267958, "epoch": 3228} {"train_loss": -24.924314498901367, "global_step": 267959, "epoch": 3228} {"train_loss": -25.40169334411621, "global_step": 267960, "epoch": 3228} {"train_loss": -25.38860511779785, "global_step": 267961, "epoch": 3228} {"train_loss": -25.302907943725586, "global_step": 267962, "epoch": 3228} {"train_loss": -25.437637329101562, "global_step": 267963, "epoch": 3228} {"train_loss": -25.315786361694336, "global_step": 267964, "epoch": 3228} {"train_loss": -25.16872215270996, "global_step": 267965, "epoch": 3228} {"train_loss": -25.120746612548828, "global_step": 267966, "epoch": 3228} {"train_loss": -25.388338088989258, "global_step": 267967, "epoch": 3228} {"train_loss": -25.15838050842285, "global_step": 267968, "epoch": 3228} {"train_loss": -25.50604248046875, "global_step": 267969, "epoch": 3228} {"train_loss": -25.502777099609375, "global_step": 267970, "epoch": 3228} {"train_loss": -25.38558006286621, "global_step": 267971, "epoch": 3228} {"train_loss": -25.566741943359375, "global_step": 267972, "epoch": 3228} {"train_loss": -25.356542587280273, "global_step": 267973, "epoch": 3228} {"train_loss": -25.343652725219727, "global_step": 267974, "epoch": 3228} {"train_loss": -25.300384521484375, "global_step": 267975, "epoch": 3228} {"train_loss": -25.409772872924805, "global_step": 267976, "epoch": 3228} {"train_loss": -25.263568878173828, "global_step": 267977, "epoch": 3228} {"train_loss": -25.10835075378418, "global_step": 267978, "epoch": 3228} {"train_loss": -24.715391159057617, "global_step": 267979, "epoch": 3228} {"train_loss": -25.211406707763672, "global_step": 267980, "epoch": 3228} {"train_loss": -24.999204635620117, "global_step": 267981, "epoch": 3228} {"train_loss": -24.91731834411621, "global_step": 267982, "epoch": 3228} {"train_loss": -24.920791625976562, "global_step": 267983, "epoch": 3228} {"train_loss": -24.666898727416992, "global_step": 267984, "epoch": 3228} {"train_loss": -25.57393455505371, "global_step": 267985, "epoch": 3228} {"train_loss": -25.342859268188477, "global_step": 267986, "epoch": 3228} {"train_loss": -25.021305084228516, "global_step": 267987, "epoch": 3228} {"train_loss": -25.330583572387695, "global_step": 267988, "epoch": 3228} {"train_loss": -25.62604331970215, "global_step": 267989, "epoch": 3228} {"train_loss": -25.216506958007812, "global_step": 267990, "epoch": 3228} {"train_loss": -25.0736083984375, "global_step": 267991, "epoch": 3228} {"train_loss": -25.12001609802246, "global_step": 267992, "epoch": 3228} {"train_loss": -24.963024139404297, "global_step": 267993, "epoch": 3228} {"train_loss": -25.18069839477539, "global_step": 267994, "epoch": 3228} {"train_loss": -25.22920799255371, "global_step": 267995, "epoch": 3228} {"train_loss": -25.619359970092773, "global_step": 267996, "epoch": 3228} {"train_loss": -25.308996200561523, "global_step": 267997, "epoch": 3228} {"train_loss": -25.476842880249023, "global_step": 267998, "epoch": 3228} {"train_loss": -25.477975845336914, "global_step": 267999, "epoch": 3228} {"train_loss": -25.5819034576416, "global_step": 268000, "epoch": 3228} {"train_loss": -25.390213012695312, "global_step": 268001, "epoch": 3228} {"train_loss": -25.235328674316406, "global_step": 268002, "epoch": 3228} {"train_loss": -25.547466278076172, "global_step": 268003, "epoch": 3228} {"train_loss": -25.303054809570312, "global_step": 268004, "epoch": 3228} {"train_loss": -25.61801528930664, "global_step": 268005, "epoch": 3228} {"train_loss": -25.088621989790216, "global_step": 268006, "epoch": 3228, "val_loss": 7007444.5} {"train_loss": -25.09171485900879, "global_step": 268007, "epoch": 3229} {"train_loss": -25.202045440673828, "global_step": 268008, "epoch": 3229} {"train_loss": -24.950590133666992, "global_step": 268009, "epoch": 3229} {"train_loss": -24.93181610107422, "global_step": 268010, "epoch": 3229} {"train_loss": -25.317787170410156, "global_step": 268011, "epoch": 3229} {"train_loss": -25.21797752380371, "global_step": 268012, "epoch": 3229} {"train_loss": -24.811920166015625, "global_step": 268013, "epoch": 3229} {"train_loss": -25.107908248901367, "global_step": 268014, "epoch": 3229} {"train_loss": -25.301166534423828, "global_step": 268015, "epoch": 3229} {"train_loss": -24.799179077148438, "global_step": 268016, "epoch": 3229} {"train_loss": -25.194232940673828, "global_step": 268017, "epoch": 3229} {"train_loss": -24.994400024414062, "global_step": 268018, "epoch": 3229} {"train_loss": -25.312246322631836, "global_step": 268019, "epoch": 3229} {"train_loss": -25.231191635131836, "global_step": 268020, "epoch": 3229} {"train_loss": -24.803369522094727, "global_step": 268021, "epoch": 3229} {"train_loss": -24.83081817626953, "global_step": 268022, "epoch": 3229} {"train_loss": -25.228269577026367, "global_step": 268023, "epoch": 3229} {"train_loss": -25.075483322143555, "global_step": 268024, "epoch": 3229} {"train_loss": -25.171031951904297, "global_step": 268025, "epoch": 3229} {"train_loss": -25.151792526245117, "global_step": 268026, "epoch": 3229} {"train_loss": -25.079238891601562, "global_step": 268027, "epoch": 3229} {"train_loss": -24.69273567199707, "global_step": 268028, "epoch": 3229} {"train_loss": -24.90754508972168, "global_step": 268029, "epoch": 3229} {"train_loss": -25.362401962280273, "global_step": 268030, "epoch": 3229} {"train_loss": -25.15890884399414, "global_step": 268031, "epoch": 3229} {"train_loss": -25.47580337524414, "global_step": 268032, "epoch": 3229} {"train_loss": -25.127164840698242, "global_step": 268033, "epoch": 3229} {"train_loss": -25.383604049682617, "global_step": 268034, "epoch": 3229} {"train_loss": -25.14056396484375, "global_step": 268035, "epoch": 3229} {"train_loss": -25.23052406311035, "global_step": 268036, "epoch": 3229} {"train_loss": -25.544357299804688, "global_step": 268037, "epoch": 3229} {"train_loss": -25.349878311157227, "global_step": 268038, "epoch": 3229} {"train_loss": -25.47855567932129, "global_step": 268039, "epoch": 3229} {"train_loss": -25.11591148376465, "global_step": 268040, "epoch": 3229} {"train_loss": -25.228939056396484, "global_step": 268041, "epoch": 3229} {"train_loss": -25.230915069580078, "global_step": 268042, "epoch": 3229} {"train_loss": -25.15122413635254, "global_step": 268043, "epoch": 3229} {"train_loss": -25.23103904724121, "global_step": 268044, "epoch": 3229} {"train_loss": -25.363454818725586, "global_step": 268045, "epoch": 3229} {"train_loss": -25.03413200378418, "global_step": 268046, "epoch": 3229} {"train_loss": -25.32086753845215, "global_step": 268047, "epoch": 3229} {"train_loss": -25.2596435546875, "global_step": 268048, "epoch": 3229} {"train_loss": -25.2781982421875, "global_step": 268049, "epoch": 3229} {"train_loss": -25.30807876586914, "global_step": 268050, "epoch": 3229} {"train_loss": -25.115901947021484, "global_step": 268051, "epoch": 3229} {"train_loss": -25.550344467163086, "global_step": 268052, "epoch": 3229} {"train_loss": -25.286510467529297, "global_step": 268053, "epoch": 3229} {"train_loss": -25.087488174438477, "global_step": 268054, "epoch": 3229} {"train_loss": -25.802515029907227, "global_step": 268055, "epoch": 3229} {"train_loss": -24.965795516967773, "global_step": 268056, "epoch": 3229} {"train_loss": -25.211057662963867, "global_step": 268057, "epoch": 3229} {"train_loss": -25.48414421081543, "global_step": 268058, "epoch": 3229} {"train_loss": -24.745182037353516, "global_step": 268059, "epoch": 3229} {"train_loss": -25.310270309448242, "global_step": 268060, "epoch": 3229} {"train_loss": -25.259992599487305, "global_step": 268061, "epoch": 3229} {"train_loss": -25.719919204711914, "global_step": 268062, "epoch": 3229} {"train_loss": -25.68939208984375, "global_step": 268063, "epoch": 3229} {"train_loss": -25.22733497619629, "global_step": 268064, "epoch": 3229} {"train_loss": -25.044160842895508, "global_step": 268065, "epoch": 3229} {"train_loss": -25.1943359375, "global_step": 268066, "epoch": 3229} {"train_loss": -25.8339786529541, "global_step": 268067, "epoch": 3229} {"train_loss": -25.326704025268555, "global_step": 268068, "epoch": 3229} {"train_loss": -25.59347152709961, "global_step": 268069, "epoch": 3229} {"train_loss": -25.100223541259766, "global_step": 268070, "epoch": 3229} {"train_loss": -25.336868286132812, "global_step": 268071, "epoch": 3229} {"train_loss": -25.280664443969727, "global_step": 268072, "epoch": 3229} {"train_loss": -25.486835479736328, "global_step": 268073, "epoch": 3229} {"train_loss": -25.304983139038086, "global_step": 268074, "epoch": 3229} {"train_loss": -24.929019927978516, "global_step": 268075, "epoch": 3229} {"train_loss": -25.056705474853516, "global_step": 268076, "epoch": 3229} {"train_loss": -25.391267776489258, "global_step": 268077, "epoch": 3229} {"train_loss": -25.062118530273438, "global_step": 268078, "epoch": 3229} {"train_loss": -25.25334930419922, "global_step": 268079, "epoch": 3229} {"train_loss": -25.103717803955078, "global_step": 268080, "epoch": 3229} {"train_loss": -25.07312774658203, "global_step": 268081, "epoch": 3229} {"train_loss": -25.177139282226562, "global_step": 268082, "epoch": 3229} {"train_loss": -25.017841339111328, "global_step": 268083, "epoch": 3229} {"train_loss": -25.198822021484375, "global_step": 268084, "epoch": 3229} {"train_loss": -25.335725784301758, "global_step": 268085, "epoch": 3229} {"train_loss": -25.1412353515625, "global_step": 268086, "epoch": 3229} {"train_loss": -25.35137176513672, "global_step": 268087, "epoch": 3229} {"train_loss": -25.095794677734375, "global_step": 268088, "epoch": 3229} {"train_loss": -25.220530843160237, "global_step": 268089, "epoch": 3229, "val_loss": 6966783.0} {"train_loss": -24.987390518188477, "global_step": 268090, "epoch": 3230} {"train_loss": -24.595930099487305, "global_step": 268091, "epoch": 3230} {"train_loss": -24.950260162353516, "global_step": 268092, "epoch": 3230} {"train_loss": -25.231508255004883, "global_step": 268093, "epoch": 3230} {"train_loss": -24.780683517456055, "global_step": 268094, "epoch": 3230} {"train_loss": -25.3841609954834, "global_step": 268095, "epoch": 3230} {"train_loss": -25.02100372314453, "global_step": 268096, "epoch": 3230} {"train_loss": -25.050302505493164, "global_step": 268097, "epoch": 3230} {"train_loss": -25.25738525390625, "global_step": 268098, "epoch": 3230} {"train_loss": -24.7928409576416, "global_step": 268099, "epoch": 3230} {"train_loss": -24.666948318481445, "global_step": 268100, "epoch": 3230} {"train_loss": -25.32981300354004, "global_step": 268101, "epoch": 3230} {"train_loss": -24.973270416259766, "global_step": 268102, "epoch": 3230} {"train_loss": -25.08017921447754, "global_step": 268103, "epoch": 3230} {"train_loss": -24.93003273010254, "global_step": 268104, "epoch": 3230} {"train_loss": -24.880733489990234, "global_step": 268105, "epoch": 3230} {"train_loss": -25.044172286987305, "global_step": 268106, "epoch": 3230} {"train_loss": -25.28008270263672, "global_step": 268107, "epoch": 3230} {"train_loss": -25.098724365234375, "global_step": 268108, "epoch": 3230} {"train_loss": -25.243589401245117, "global_step": 268109, "epoch": 3230} {"train_loss": -25.295246124267578, "global_step": 268110, "epoch": 3230} {"train_loss": -24.855297088623047, "global_step": 268111, "epoch": 3230} {"train_loss": -25.09339141845703, "global_step": 268112, "epoch": 3230} {"train_loss": -25.12037467956543, "global_step": 268113, "epoch": 3230} {"train_loss": -25.083293914794922, "global_step": 268114, "epoch": 3230} {"train_loss": -25.33370018005371, "global_step": 268115, "epoch": 3230} {"train_loss": -25.271690368652344, "global_step": 268116, "epoch": 3230} {"train_loss": -25.36115837097168, "global_step": 268117, "epoch": 3230} {"train_loss": -25.42633056640625, "global_step": 268118, "epoch": 3230} {"train_loss": -25.407651901245117, "global_step": 268119, "epoch": 3230} {"train_loss": -25.341283798217773, "global_step": 268120, "epoch": 3230} {"train_loss": -25.296932220458984, "global_step": 268121, "epoch": 3230} {"train_loss": -25.44691276550293, "global_step": 268122, "epoch": 3230} {"train_loss": -25.28960609436035, "global_step": 268123, "epoch": 3230} {"train_loss": -24.582731246948242, "global_step": 268124, "epoch": 3230} {"train_loss": -25.227619171142578, "global_step": 268125, "epoch": 3230} {"train_loss": -25.397993087768555, "global_step": 268126, "epoch": 3230} {"train_loss": -25.026397705078125, "global_step": 268127, "epoch": 3230} {"train_loss": -25.311777114868164, "global_step": 268128, "epoch": 3230} {"train_loss": -25.288694381713867, "global_step": 268129, "epoch": 3230} {"train_loss": -25.401845932006836, "global_step": 268130, "epoch": 3230} {"train_loss": -25.249902725219727, "global_step": 268131, "epoch": 3230} {"train_loss": -25.360153198242188, "global_step": 268132, "epoch": 3230} {"train_loss": -25.129995346069336, "global_step": 268133, "epoch": 3230} {"train_loss": -25.24388313293457, "global_step": 268134, "epoch": 3230} {"train_loss": -25.494565963745117, "global_step": 268135, "epoch": 3230} {"train_loss": -25.53125, "global_step": 268136, "epoch": 3230} {"train_loss": -24.832080841064453, "global_step": 268137, "epoch": 3230} {"train_loss": -25.600019454956055, "global_step": 268138, "epoch": 3230} {"train_loss": -25.21482276916504, "global_step": 268139, "epoch": 3230} {"train_loss": -25.33477783203125, "global_step": 268140, "epoch": 3230} {"train_loss": -25.043701171875, "global_step": 268141, "epoch": 3230} {"train_loss": -25.244272232055664, "global_step": 268142, "epoch": 3230} {"train_loss": -25.243606567382812, "global_step": 268143, "epoch": 3230} {"train_loss": -24.959680557250977, "global_step": 268144, "epoch": 3230} {"train_loss": -25.46064567565918, "global_step": 268145, "epoch": 3230} {"train_loss": -25.30021095275879, "global_step": 268146, "epoch": 3230} {"train_loss": -24.922971725463867, "global_step": 268147, "epoch": 3230} {"train_loss": -25.371496200561523, "global_step": 268148, "epoch": 3230} {"train_loss": -25.007888793945312, "global_step": 268149, "epoch": 3230} {"train_loss": -25.342960357666016, "global_step": 268150, "epoch": 3230} {"train_loss": -25.580976486206055, "global_step": 268151, "epoch": 3230} {"train_loss": -25.74611473083496, "global_step": 268152, "epoch": 3230} {"train_loss": -25.28718376159668, "global_step": 268153, "epoch": 3230} {"train_loss": -25.03400230407715, "global_step": 268154, "epoch": 3230} {"train_loss": -25.087724685668945, "global_step": 268155, "epoch": 3230} {"train_loss": -24.89411163330078, "global_step": 268156, "epoch": 3230} {"train_loss": -25.088510513305664, "global_step": 268157, "epoch": 3230} {"train_loss": -25.34827995300293, "global_step": 268158, "epoch": 3230} {"train_loss": -25.251827239990234, "global_step": 268159, "epoch": 3230} {"train_loss": -25.295379638671875, "global_step": 268160, "epoch": 3230} {"train_loss": -25.27760124206543, "global_step": 268161, "epoch": 3230} {"train_loss": -25.43411636352539, "global_step": 268162, "epoch": 3230} {"train_loss": -25.293516159057617, "global_step": 268163, "epoch": 3230} {"train_loss": -25.101375579833984, "global_step": 268164, "epoch": 3230} {"train_loss": -25.216955184936523, "global_step": 268165, "epoch": 3230} {"train_loss": -25.128814697265625, "global_step": 268166, "epoch": 3230} {"train_loss": -25.81194496154785, "global_step": 268167, "epoch": 3230} {"train_loss": -25.280292510986328, "global_step": 268168, "epoch": 3230} {"train_loss": -25.462339401245117, "global_step": 268169, "epoch": 3230} {"train_loss": -25.478008270263672, "global_step": 268170, "epoch": 3230} {"train_loss": -25.440990447998047, "global_step": 268171, "epoch": 3230} {"train_loss": -25.22214756241764, "global_step": 268172, "epoch": 3230, "val_loss": 6923222.0} {"train_loss": -24.802261352539062, "global_step": 268173, "epoch": 3231} {"train_loss": -24.885345458984375, "global_step": 268174, "epoch": 3231} {"train_loss": -25.053861618041992, "global_step": 268175, "epoch": 3231} {"train_loss": -24.67915916442871, "global_step": 268176, "epoch": 3231} {"train_loss": -24.510290145874023, "global_step": 268177, "epoch": 3231} {"train_loss": -24.84441566467285, "global_step": 268178, "epoch": 3231} {"train_loss": -24.878116607666016, "global_step": 268179, "epoch": 3231} {"train_loss": -25.10963249206543, "global_step": 268180, "epoch": 3231} {"train_loss": -24.986862182617188, "global_step": 268181, "epoch": 3231} {"train_loss": -24.814788818359375, "global_step": 268182, "epoch": 3231} {"train_loss": -24.798521041870117, "global_step": 268183, "epoch": 3231} {"train_loss": -25.244659423828125, "global_step": 268184, "epoch": 3231} {"train_loss": -25.26131248474121, "global_step": 268185, "epoch": 3231} {"train_loss": -24.60123634338379, "global_step": 268186, "epoch": 3231} {"train_loss": -25.116119384765625, "global_step": 268187, "epoch": 3231} {"train_loss": -25.028474807739258, "global_step": 268188, "epoch": 3231} {"train_loss": -25.052587509155273, "global_step": 268189, "epoch": 3231} {"train_loss": -25.200275421142578, "global_step": 268190, "epoch": 3231} {"train_loss": -25.38661003112793, "global_step": 268191, "epoch": 3231} {"train_loss": -25.105751037597656, "global_step": 268192, "epoch": 3231} {"train_loss": -25.0023250579834, "global_step": 268193, "epoch": 3231} {"train_loss": -25.132125854492188, "global_step": 268194, "epoch": 3231} {"train_loss": -25.206729888916016, "global_step": 268195, "epoch": 3231} {"train_loss": -25.14377212524414, "global_step": 268196, "epoch": 3231} {"train_loss": -24.991174697875977, "global_step": 268197, "epoch": 3231} {"train_loss": -25.26857566833496, "global_step": 268198, "epoch": 3231} {"train_loss": -25.663562774658203, "global_step": 268199, "epoch": 3231} {"train_loss": -25.180509567260742, "global_step": 268200, "epoch": 3231} {"train_loss": -25.07618522644043, "global_step": 268201, "epoch": 3231} {"train_loss": -25.58427619934082, "global_step": 268202, "epoch": 3231} {"train_loss": -25.38869285583496, "global_step": 268203, "epoch": 3231} {"train_loss": -25.608972549438477, "global_step": 268204, "epoch": 3231} {"train_loss": -25.622995376586914, "global_step": 268205, "epoch": 3231} {"train_loss": -25.137556076049805, "global_step": 268206, "epoch": 3231} {"train_loss": -25.2984676361084, "global_step": 268207, "epoch": 3231} {"train_loss": -25.479267120361328, "global_step": 268208, "epoch": 3231} {"train_loss": -25.22152328491211, "global_step": 268209, "epoch": 3231} {"train_loss": -25.335477828979492, "global_step": 268210, "epoch": 3231} {"train_loss": -25.59002113342285, "global_step": 268211, "epoch": 3231} {"train_loss": -25.145471572875977, "global_step": 268212, "epoch": 3231} {"train_loss": -25.214197158813477, "global_step": 268213, "epoch": 3231} {"train_loss": -24.85389518737793, "global_step": 268214, "epoch": 3231} {"train_loss": -25.31123161315918, "global_step": 268215, "epoch": 3231} {"train_loss": -25.153799057006836, "global_step": 268216, "epoch": 3231} {"train_loss": -25.293737411499023, "global_step": 268217, "epoch": 3231} {"train_loss": -25.503902435302734, "global_step": 268218, "epoch": 3231} {"train_loss": -25.07308006286621, "global_step": 268219, "epoch": 3231} {"train_loss": -25.27931022644043, "global_step": 268220, "epoch": 3231} {"train_loss": -25.563594818115234, "global_step": 268221, "epoch": 3231} {"train_loss": -25.650693893432617, "global_step": 268222, "epoch": 3231} {"train_loss": -25.027502059936523, "global_step": 268223, "epoch": 3231} {"train_loss": -25.021453857421875, "global_step": 268224, "epoch": 3231} {"train_loss": -25.260778427124023, "global_step": 268225, "epoch": 3231} {"train_loss": -25.10994529724121, "global_step": 268226, "epoch": 3231} {"train_loss": -25.65947914123535, "global_step": 268227, "epoch": 3231} {"train_loss": -24.82591438293457, "global_step": 268228, "epoch": 3231} {"train_loss": -25.114744186401367, "global_step": 268229, "epoch": 3231} {"train_loss": -25.11054801940918, "global_step": 268230, "epoch": 3231} {"train_loss": -24.895627975463867, "global_step": 268231, "epoch": 3231} {"train_loss": -25.657812118530273, "global_step": 268232, "epoch": 3231} {"train_loss": -25.315670013427734, "global_step": 268233, "epoch": 3231} {"train_loss": -25.478179931640625, "global_step": 268234, "epoch": 3231} {"train_loss": -24.832883834838867, "global_step": 268235, "epoch": 3231} {"train_loss": -25.48016357421875, "global_step": 268236, "epoch": 3231} {"train_loss": -25.34929847717285, "global_step": 268237, "epoch": 3231} {"train_loss": -24.90528678894043, "global_step": 268238, "epoch": 3231} {"train_loss": -25.37382698059082, "global_step": 268239, "epoch": 3231} {"train_loss": -24.991825103759766, "global_step": 268240, "epoch": 3231} {"train_loss": -25.462736129760742, "global_step": 268241, "epoch": 3231} {"train_loss": -25.314668655395508, "global_step": 268242, "epoch": 3231} {"train_loss": -25.238386154174805, "global_step": 268243, "epoch": 3231} {"train_loss": -25.56349754333496, "global_step": 268244, "epoch": 3231} {"train_loss": -25.355470657348633, "global_step": 268245, "epoch": 3231} {"train_loss": -25.48845863342285, "global_step": 268246, "epoch": 3231} {"train_loss": -25.586790084838867, "global_step": 268247, "epoch": 3231} {"train_loss": -25.281513214111328, "global_step": 268248, "epoch": 3231} {"train_loss": -25.216489791870117, "global_step": 268249, "epoch": 3231} {"train_loss": -25.734054565429688, "global_step": 268250, "epoch": 3231} {"train_loss": -25.61993408203125, "global_step": 268251, "epoch": 3231} {"train_loss": -25.3519229888916, "global_step": 268252, "epoch": 3231} {"train_loss": -25.103376388549805, "global_step": 268253, "epoch": 3231} {"train_loss": -24.967077255249023, "global_step": 268254, "epoch": 3231} {"train_loss": -25.196969687220562, "global_step": 268255, "epoch": 3231, "val_loss": 7134741.0} {"train_loss": -24.901525497436523, "global_step": 268256, "epoch": 3232} {"train_loss": -22.90347671508789, "global_step": 268257, "epoch": 3232} {"train_loss": -23.995677947998047, "global_step": 268258, "epoch": 3232} {"train_loss": -24.48158836364746, "global_step": 268259, "epoch": 3232} {"train_loss": -24.1671142578125, "global_step": 268260, "epoch": 3232} {"train_loss": -24.40245246887207, "global_step": 268261, "epoch": 3232} {"train_loss": -24.834562301635742, "global_step": 268262, "epoch": 3232} {"train_loss": -24.326160430908203, "global_step": 268263, "epoch": 3232} {"train_loss": -24.64702796936035, "global_step": 268264, "epoch": 3232} {"train_loss": -24.416372299194336, "global_step": 268265, "epoch": 3232} {"train_loss": -24.610248565673828, "global_step": 268266, "epoch": 3232} {"train_loss": -24.674591064453125, "global_step": 268267, "epoch": 3232} {"train_loss": -24.875919342041016, "global_step": 268268, "epoch": 3232} {"train_loss": -24.754148483276367, "global_step": 268269, "epoch": 3232} {"train_loss": -24.856006622314453, "global_step": 268270, "epoch": 3232} {"train_loss": -24.98565101623535, "global_step": 268271, "epoch": 3232} {"train_loss": -24.5767879486084, "global_step": 268272, "epoch": 3232} {"train_loss": -25.295907974243164, "global_step": 268273, "epoch": 3232} {"train_loss": -25.091896057128906, "global_step": 268274, "epoch": 3232} {"train_loss": -25.040014266967773, "global_step": 268275, "epoch": 3232} {"train_loss": -25.185455322265625, "global_step": 268276, "epoch": 3232} {"train_loss": -25.037790298461914, "global_step": 268277, "epoch": 3232} {"train_loss": -25.479162216186523, "global_step": 268278, "epoch": 3232} {"train_loss": -24.91359519958496, "global_step": 268279, "epoch": 3232} {"train_loss": -24.95501136779785, "global_step": 268280, "epoch": 3232} {"train_loss": -25.26169776916504, "global_step": 268281, "epoch": 3232} {"train_loss": -25.1988582611084, "global_step": 268282, "epoch": 3232} {"train_loss": -25.125112533569336, "global_step": 268283, "epoch": 3232} {"train_loss": -25.171659469604492, "global_step": 268284, "epoch": 3232} {"train_loss": -25.405200958251953, "global_step": 268285, "epoch": 3232} {"train_loss": -25.507383346557617, "global_step": 268286, "epoch": 3232} {"train_loss": -25.590576171875, "global_step": 268287, "epoch": 3232} {"train_loss": -24.931663513183594, "global_step": 268288, "epoch": 3232} {"train_loss": -25.715103149414062, "global_step": 268289, "epoch": 3232} {"train_loss": -25.31614875793457, "global_step": 268290, "epoch": 3232} {"train_loss": -25.413166046142578, "global_step": 268291, "epoch": 3232} {"train_loss": -25.339658737182617, "global_step": 268292, "epoch": 3232} {"train_loss": -25.387914657592773, "global_step": 268293, "epoch": 3232} {"train_loss": -25.29471206665039, "global_step": 268294, "epoch": 3232} {"train_loss": -25.367416381835938, "global_step": 268295, "epoch": 3232} {"train_loss": -25.253475189208984, "global_step": 268296, "epoch": 3232} {"train_loss": -25.346689224243164, "global_step": 268297, "epoch": 3232} {"train_loss": -25.043020248413086, "global_step": 268298, "epoch": 3232} {"train_loss": -25.364002227783203, "global_step": 268299, "epoch": 3232} {"train_loss": -25.350698471069336, "global_step": 268300, "epoch": 3232} {"train_loss": -25.32733154296875, "global_step": 268301, "epoch": 3232} {"train_loss": -25.3313045501709, "global_step": 268302, "epoch": 3232} {"train_loss": -25.34659767150879, "global_step": 268303, "epoch": 3232} {"train_loss": -25.160858154296875, "global_step": 268304, "epoch": 3232} {"train_loss": -25.081876754760742, "global_step": 268305, "epoch": 3232} {"train_loss": -25.266855239868164, "global_step": 268306, "epoch": 3232} {"train_loss": -25.324636459350586, "global_step": 268307, "epoch": 3232} {"train_loss": -25.602136611938477, "global_step": 268308, "epoch": 3232} {"train_loss": -25.604995727539062, "global_step": 268309, "epoch": 3232} {"train_loss": -25.719335556030273, "global_step": 268310, "epoch": 3232} {"train_loss": -25.200708389282227, "global_step": 268311, "epoch": 3232} {"train_loss": -25.5910701751709, "global_step": 268312, "epoch": 3232} {"train_loss": -25.148881912231445, "global_step": 268313, "epoch": 3232} {"train_loss": -25.05067253112793, "global_step": 268314, "epoch": 3232} {"train_loss": -25.33609390258789, "global_step": 268315, "epoch": 3232} {"train_loss": -25.558134078979492, "global_step": 268316, "epoch": 3232} {"train_loss": -25.18330955505371, "global_step": 268317, "epoch": 3232} {"train_loss": -25.044225692749023, "global_step": 268318, "epoch": 3232} {"train_loss": -25.44015884399414, "global_step": 268319, "epoch": 3232} {"train_loss": -25.22616195678711, "global_step": 268320, "epoch": 3232} {"train_loss": -25.79267692565918, "global_step": 268321, "epoch": 3232} {"train_loss": -25.26734733581543, "global_step": 268322, "epoch": 3232} {"train_loss": -25.516620635986328, "global_step": 268323, "epoch": 3232} {"train_loss": -25.261198043823242, "global_step": 268324, "epoch": 3232} {"train_loss": -25.87668800354004, "global_step": 268325, "epoch": 3232} {"train_loss": -25.22480583190918, "global_step": 268326, "epoch": 3232} {"train_loss": -25.67205810546875, "global_step": 268327, "epoch": 3232} {"train_loss": -25.247766494750977, "global_step": 268328, "epoch": 3232} {"train_loss": -25.6894474029541, "global_step": 268329, "epoch": 3232} {"train_loss": -25.403532028198242, "global_step": 268330, "epoch": 3232} {"train_loss": -25.445096969604492, "global_step": 268331, "epoch": 3232} {"train_loss": -25.545133590698242, "global_step": 268332, "epoch": 3232} {"train_loss": -25.39569854736328, "global_step": 268333, "epoch": 3232} {"train_loss": -25.599454879760742, "global_step": 268334, "epoch": 3232} {"train_loss": -25.040283203125, "global_step": 268335, "epoch": 3232} {"train_loss": -25.206449508666992, "global_step": 268336, "epoch": 3232} {"train_loss": -24.5743465423584, "global_step": 268337, "epoch": 3232} {"train_loss": -25.139612014035144, "global_step": 268338, "epoch": 3232, "val_loss": 6868045.0} {"train_loss": -24.29953956604004, "global_step": 268339, "epoch": 3233} {"train_loss": -23.88698387145996, "global_step": 268340, "epoch": 3233} {"train_loss": -24.607431411743164, "global_step": 268341, "epoch": 3233} {"train_loss": -24.816360473632812, "global_step": 268342, "epoch": 3233} {"train_loss": -24.166305541992188, "global_step": 268343, "epoch": 3233} {"train_loss": -24.889667510986328, "global_step": 268344, "epoch": 3233} {"train_loss": -24.539709091186523, "global_step": 268345, "epoch": 3233} {"train_loss": -24.90096092224121, "global_step": 268346, "epoch": 3233} {"train_loss": -25.18447494506836, "global_step": 268347, "epoch": 3233} {"train_loss": -24.876312255859375, "global_step": 268348, "epoch": 3233} {"train_loss": -24.747007369995117, "global_step": 268349, "epoch": 3233} {"train_loss": -24.746990203857422, "global_step": 268350, "epoch": 3233} {"train_loss": -24.6726016998291, "global_step": 268351, "epoch": 3233} {"train_loss": -24.92085075378418, "global_step": 268352, "epoch": 3233} {"train_loss": -25.077138900756836, "global_step": 268353, "epoch": 3233} {"train_loss": -24.779813766479492, "global_step": 268354, "epoch": 3233} {"train_loss": -24.709415435791016, "global_step": 268355, "epoch": 3233} {"train_loss": -25.11794662475586, "global_step": 268356, "epoch": 3233} {"train_loss": -24.996366500854492, "global_step": 268357, "epoch": 3233} {"train_loss": -25.15321922302246, "global_step": 268358, "epoch": 3233} {"train_loss": -24.78936767578125, "global_step": 268359, "epoch": 3233} {"train_loss": -24.937658309936523, "global_step": 268360, "epoch": 3233} {"train_loss": -24.948165893554688, "global_step": 268361, "epoch": 3233} {"train_loss": -25.09269142150879, "global_step": 268362, "epoch": 3233} {"train_loss": -25.220788955688477, "global_step": 268363, "epoch": 3233} {"train_loss": -25.37860679626465, "global_step": 268364, "epoch": 3233} {"train_loss": -25.15352439880371, "global_step": 268365, "epoch": 3233} {"train_loss": -25.093076705932617, "global_step": 268366, "epoch": 3233} {"train_loss": -25.072702407836914, "global_step": 268367, "epoch": 3233} {"train_loss": -25.416465759277344, "global_step": 268368, "epoch": 3233} {"train_loss": -25.146764755249023, "global_step": 268369, "epoch": 3233} {"train_loss": -25.225547790527344, "global_step": 268370, "epoch": 3233} {"train_loss": -25.300813674926758, "global_step": 268371, "epoch": 3233} {"train_loss": -25.350677490234375, "global_step": 268372, "epoch": 3233} {"train_loss": -25.186193466186523, "global_step": 268373, "epoch": 3233} {"train_loss": -25.448841094970703, "global_step": 268374, "epoch": 3233} {"train_loss": -25.651580810546875, "global_step": 268375, "epoch": 3233} {"train_loss": -25.13936424255371, "global_step": 268376, "epoch": 3233} {"train_loss": -25.260040283203125, "global_step": 268377, "epoch": 3233} {"train_loss": -24.968643188476562, "global_step": 268378, "epoch": 3233} {"train_loss": -25.082551956176758, "global_step": 268379, "epoch": 3233} {"train_loss": -25.418832778930664, "global_step": 268380, "epoch": 3233} {"train_loss": -25.196929931640625, "global_step": 268381, "epoch": 3233} {"train_loss": -25.37393569946289, "global_step": 268382, "epoch": 3233} {"train_loss": -25.26287841796875, "global_step": 268383, "epoch": 3233} {"train_loss": -25.29218101501465, "global_step": 268384, "epoch": 3233} {"train_loss": -25.196325302124023, "global_step": 268385, "epoch": 3233} {"train_loss": -25.161300659179688, "global_step": 268386, "epoch": 3233} {"train_loss": -24.46438980102539, "global_step": 268387, "epoch": 3233} {"train_loss": -24.367328643798828, "global_step": 268388, "epoch": 3233} {"train_loss": -25.209157943725586, "global_step": 268389, "epoch": 3233} {"train_loss": -25.570926666259766, "global_step": 268390, "epoch": 3233} {"train_loss": -24.771652221679688, "global_step": 268391, "epoch": 3233} {"train_loss": -24.758914947509766, "global_step": 268392, "epoch": 3233} {"train_loss": -25.401071548461914, "global_step": 268393, "epoch": 3233} {"train_loss": -25.143341064453125, "global_step": 268394, "epoch": 3233} {"train_loss": -25.16558837890625, "global_step": 268395, "epoch": 3233} {"train_loss": -25.324068069458008, "global_step": 268396, "epoch": 3233} {"train_loss": -25.07927894592285, "global_step": 268397, "epoch": 3233} {"train_loss": -24.895723342895508, "global_step": 268398, "epoch": 3233} {"train_loss": -25.44106101989746, "global_step": 268399, "epoch": 3233} {"train_loss": -25.240623474121094, "global_step": 268400, "epoch": 3233} {"train_loss": -25.152265548706055, "global_step": 268401, "epoch": 3233} {"train_loss": -25.34311294555664, "global_step": 268402, "epoch": 3233} {"train_loss": -25.596792221069336, "global_step": 268403, "epoch": 3233} {"train_loss": -25.405126571655273, "global_step": 268404, "epoch": 3233} {"train_loss": -25.285905838012695, "global_step": 268405, "epoch": 3233} {"train_loss": -25.58737564086914, "global_step": 268406, "epoch": 3233} {"train_loss": -25.32773208618164, "global_step": 268407, "epoch": 3233} {"train_loss": -25.457122802734375, "global_step": 268408, "epoch": 3233} {"train_loss": -24.9178524017334, "global_step": 268409, "epoch": 3233} {"train_loss": -25.460529327392578, "global_step": 268410, "epoch": 3233} {"train_loss": -25.221603393554688, "global_step": 268411, "epoch": 3233} {"train_loss": -25.23908805847168, "global_step": 268412, "epoch": 3233} {"train_loss": -25.448537826538086, "global_step": 268413, "epoch": 3233} {"train_loss": -25.643335342407227, "global_step": 268414, "epoch": 3233} {"train_loss": -25.57239532470703, "global_step": 268415, "epoch": 3233} {"train_loss": -25.491186141967773, "global_step": 268416, "epoch": 3233} {"train_loss": -25.4875545501709, "global_step": 268417, "epoch": 3233} {"train_loss": -25.41925621032715, "global_step": 268418, "epoch": 3233} {"train_loss": -25.376644134521484, "global_step": 268419, "epoch": 3233} {"train_loss": -25.436704635620117, "global_step": 268420, "epoch": 3233} {"train_loss": -25.12154386129724, "global_step": 268421, "epoch": 3233, "val_loss": 6911948.0} {"train_loss": -24.536853790283203, "global_step": 268422, "epoch": 3234} {"train_loss": -24.838518142700195, "global_step": 268423, "epoch": 3234} {"train_loss": -24.66867446899414, "global_step": 268424, "epoch": 3234} {"train_loss": -23.886472702026367, "global_step": 268425, "epoch": 3234} {"train_loss": -24.76694679260254, "global_step": 268426, "epoch": 3234} {"train_loss": -24.791723251342773, "global_step": 268427, "epoch": 3234} {"train_loss": -24.62710189819336, "global_step": 268428, "epoch": 3234} {"train_loss": -25.08119010925293, "global_step": 268429, "epoch": 3234} {"train_loss": -24.64760971069336, "global_step": 268430, "epoch": 3234} {"train_loss": -24.558809280395508, "global_step": 268431, "epoch": 3234} {"train_loss": -24.80158042907715, "global_step": 268432, "epoch": 3234} {"train_loss": -24.65673828125, "global_step": 268433, "epoch": 3234} {"train_loss": -24.68586540222168, "global_step": 268434, "epoch": 3234} {"train_loss": -24.887346267700195, "global_step": 268435, "epoch": 3234} {"train_loss": -25.2637939453125, "global_step": 268436, "epoch": 3234} {"train_loss": -24.952117919921875, "global_step": 268437, "epoch": 3234} {"train_loss": -24.64194107055664, "global_step": 268438, "epoch": 3234} {"train_loss": -24.757741928100586, "global_step": 268439, "epoch": 3234} {"train_loss": -25.083356857299805, "global_step": 268440, "epoch": 3234} {"train_loss": -24.9718074798584, "global_step": 268441, "epoch": 3234} {"train_loss": -25.122156143188477, "global_step": 268442, "epoch": 3234} {"train_loss": -25.04017448425293, "global_step": 268443, "epoch": 3234} {"train_loss": -24.99387550354004, "global_step": 268444, "epoch": 3234} {"train_loss": -24.952455520629883, "global_step": 268445, "epoch": 3234} {"train_loss": -25.24013900756836, "global_step": 268446, "epoch": 3234} {"train_loss": -25.783349990844727, "global_step": 268447, "epoch": 3234} {"train_loss": -24.946474075317383, "global_step": 268448, "epoch": 3234} {"train_loss": -25.445926666259766, "global_step": 268449, "epoch": 3234} {"train_loss": -24.782543182373047, "global_step": 268450, "epoch": 3234} {"train_loss": -25.044113159179688, "global_step": 268451, "epoch": 3234} {"train_loss": -25.165267944335938, "global_step": 268452, "epoch": 3234} {"train_loss": -25.444881439208984, "global_step": 268453, "epoch": 3234} {"train_loss": -25.192312240600586, "global_step": 268454, "epoch": 3234} {"train_loss": -25.12331199645996, "global_step": 268455, "epoch": 3234} {"train_loss": -25.54097557067871, "global_step": 268456, "epoch": 3234} {"train_loss": -25.731647491455078, "global_step": 268457, "epoch": 3234} {"train_loss": -25.396299362182617, "global_step": 268458, "epoch": 3234} {"train_loss": -25.35442543029785, "global_step": 268459, "epoch": 3234} {"train_loss": -25.325393676757812, "global_step": 268460, "epoch": 3234} {"train_loss": -25.3688907623291, "global_step": 268461, "epoch": 3234} {"train_loss": -25.10553741455078, "global_step": 268462, "epoch": 3234} {"train_loss": -25.296903610229492, "global_step": 268463, "epoch": 3234} {"train_loss": -25.94960594177246, "global_step": 268464, "epoch": 3234} {"train_loss": -25.420896530151367, "global_step": 268465, "epoch": 3234} {"train_loss": -25.279794692993164, "global_step": 268466, "epoch": 3234} {"train_loss": -25.602014541625977, "global_step": 268467, "epoch": 3234} {"train_loss": -25.143678665161133, "global_step": 268468, "epoch": 3234} {"train_loss": -25.137426376342773, "global_step": 268469, "epoch": 3234} {"train_loss": -25.5164737701416, "global_step": 268470, "epoch": 3234} {"train_loss": -25.347204208374023, "global_step": 268471, "epoch": 3234} {"train_loss": -25.096790313720703, "global_step": 268472, "epoch": 3234} {"train_loss": -24.659500122070312, "global_step": 268473, "epoch": 3234} {"train_loss": -25.022676467895508, "global_step": 268474, "epoch": 3234} {"train_loss": -25.177072525024414, "global_step": 268475, "epoch": 3234} {"train_loss": -25.094669342041016, "global_step": 268476, "epoch": 3234} {"train_loss": -24.957229614257812, "global_step": 268477, "epoch": 3234} {"train_loss": -24.983325958251953, "global_step": 268478, "epoch": 3234} {"train_loss": -24.9260311126709, "global_step": 268479, "epoch": 3234} {"train_loss": -25.134721755981445, "global_step": 268480, "epoch": 3234} {"train_loss": -25.340917587280273, "global_step": 268481, "epoch": 3234} {"train_loss": -25.036476135253906, "global_step": 268482, "epoch": 3234} {"train_loss": -24.671911239624023, "global_step": 268483, "epoch": 3234} {"train_loss": -25.051748275756836, "global_step": 268484, "epoch": 3234} {"train_loss": -25.164915084838867, "global_step": 268485, "epoch": 3234} {"train_loss": -25.562307357788086, "global_step": 268486, "epoch": 3234} {"train_loss": -24.837926864624023, "global_step": 268487, "epoch": 3234} {"train_loss": -25.874109268188477, "global_step": 268488, "epoch": 3234} {"train_loss": -25.05899429321289, "global_step": 268489, "epoch": 3234} {"train_loss": -25.12221908569336, "global_step": 268490, "epoch": 3234} {"train_loss": -24.910179138183594, "global_step": 268491, "epoch": 3234} {"train_loss": -25.163244247436523, "global_step": 268492, "epoch": 3234} {"train_loss": -25.200910568237305, "global_step": 268493, "epoch": 3234} {"train_loss": -25.19021987915039, "global_step": 268494, "epoch": 3234} {"train_loss": -25.49273681640625, "global_step": 268495, "epoch": 3234} {"train_loss": -25.209951400756836, "global_step": 268496, "epoch": 3234} {"train_loss": -25.233543395996094, "global_step": 268497, "epoch": 3234} {"train_loss": -25.541942596435547, "global_step": 268498, "epoch": 3234} {"train_loss": -25.276330947875977, "global_step": 268499, "epoch": 3234} {"train_loss": -25.384763717651367, "global_step": 268500, "epoch": 3234} {"train_loss": -25.351404190063477, "global_step": 268501, "epoch": 3234} {"train_loss": -25.152070999145508, "global_step": 268502, "epoch": 3234} {"train_loss": -25.325307846069336, "global_step": 268503, "epoch": 3234} {"train_loss": -25.105393030557288, "global_step": 268504, "epoch": 3234, "val_loss": 7029236.0} {"train_loss": -25.400821685791016, "global_step": 268505, "epoch": 3235} {"train_loss": -24.478851318359375, "global_step": 268506, "epoch": 3235} {"train_loss": -25.39540672302246, "global_step": 268507, "epoch": 3235} {"train_loss": -24.65623664855957, "global_step": 268508, "epoch": 3235} {"train_loss": -25.390174865722656, "global_step": 268509, "epoch": 3235} {"train_loss": -25.060531616210938, "global_step": 268510, "epoch": 3235} {"train_loss": -24.885746002197266, "global_step": 268511, "epoch": 3235} {"train_loss": -24.94391441345215, "global_step": 268512, "epoch": 3235} {"train_loss": -25.21687889099121, "global_step": 268513, "epoch": 3235} {"train_loss": -25.035375595092773, "global_step": 268514, "epoch": 3235} {"train_loss": -25.289365768432617, "global_step": 268515, "epoch": 3235} {"train_loss": -25.38666343688965, "global_step": 268516, "epoch": 3235} {"train_loss": -25.08758544921875, "global_step": 268517, "epoch": 3235} {"train_loss": -25.519832611083984, "global_step": 268518, "epoch": 3235} {"train_loss": -25.1190242767334, "global_step": 268519, "epoch": 3235} {"train_loss": -25.189905166625977, "global_step": 268520, "epoch": 3235} {"train_loss": -25.27638816833496, "global_step": 268521, "epoch": 3235} {"train_loss": -25.27650260925293, "global_step": 268522, "epoch": 3235} {"train_loss": -25.660680770874023, "global_step": 268523, "epoch": 3235} {"train_loss": -25.51041603088379, "global_step": 268524, "epoch": 3235} {"train_loss": -25.196569442749023, "global_step": 268525, "epoch": 3235} {"train_loss": -25.28949546813965, "global_step": 268526, "epoch": 3235} {"train_loss": -25.53377342224121, "global_step": 268527, "epoch": 3235} {"train_loss": -25.279767990112305, "global_step": 268528, "epoch": 3235} {"train_loss": -25.624662399291992, "global_step": 268529, "epoch": 3235} {"train_loss": -25.360361099243164, "global_step": 268530, "epoch": 3235} {"train_loss": -25.420059204101562, "global_step": 268531, "epoch": 3235} {"train_loss": -25.30234146118164, "global_step": 268532, "epoch": 3235} {"train_loss": -25.360937118530273, "global_step": 268533, "epoch": 3235} {"train_loss": -25.241989135742188, "global_step": 268534, "epoch": 3235} {"train_loss": -25.138229370117188, "global_step": 268535, "epoch": 3235} {"train_loss": -25.007875442504883, "global_step": 268536, "epoch": 3235} {"train_loss": -25.216402053833008, "global_step": 268537, "epoch": 3235} {"train_loss": -25.091678619384766, "global_step": 268538, "epoch": 3235} {"train_loss": -24.90277671813965, "global_step": 268539, "epoch": 3235} {"train_loss": -25.23921775817871, "global_step": 268540, "epoch": 3235} {"train_loss": -25.245162963867188, "global_step": 268541, "epoch": 3235} {"train_loss": -25.322961807250977, "global_step": 268542, "epoch": 3235} {"train_loss": -24.902034759521484, "global_step": 268543, "epoch": 3235} {"train_loss": -24.949567794799805, "global_step": 268544, "epoch": 3235} {"train_loss": -25.391315460205078, "global_step": 268545, "epoch": 3235} {"train_loss": -25.194795608520508, "global_step": 268546, "epoch": 3235} {"train_loss": -25.36341667175293, "global_step": 268547, "epoch": 3235} {"train_loss": -25.586956024169922, "global_step": 268548, "epoch": 3235} {"train_loss": -25.250024795532227, "global_step": 268549, "epoch": 3235} {"train_loss": -25.61672019958496, "global_step": 268550, "epoch": 3235} {"train_loss": -25.457395553588867, "global_step": 268551, "epoch": 3235} {"train_loss": -25.0701847076416, "global_step": 268552, "epoch": 3235} {"train_loss": -25.191617965698242, "global_step": 268553, "epoch": 3235} {"train_loss": -25.399303436279297, "global_step": 268554, "epoch": 3235} {"train_loss": -25.30890464782715, "global_step": 268555, "epoch": 3235} {"train_loss": -25.109472274780273, "global_step": 268556, "epoch": 3235} {"train_loss": -25.306913375854492, "global_step": 268557, "epoch": 3235} {"train_loss": -25.689924240112305, "global_step": 268558, "epoch": 3235} {"train_loss": -25.59869956970215, "global_step": 268559, "epoch": 3235} {"train_loss": -25.6063175201416, "global_step": 268560, "epoch": 3235} {"train_loss": -25.26701545715332, "global_step": 268561, "epoch": 3235} {"train_loss": -25.077850341796875, "global_step": 268562, "epoch": 3235} {"train_loss": -25.485849380493164, "global_step": 268563, "epoch": 3235} {"train_loss": -25.172021865844727, "global_step": 268564, "epoch": 3235} {"train_loss": -24.981311798095703, "global_step": 268565, "epoch": 3235} {"train_loss": -25.30869483947754, "global_step": 268566, "epoch": 3235} {"train_loss": -25.431516647338867, "global_step": 268567, "epoch": 3235} {"train_loss": -25.460485458374023, "global_step": 268568, "epoch": 3235} {"train_loss": -25.317079544067383, "global_step": 268569, "epoch": 3235} {"train_loss": -25.37820816040039, "global_step": 268570, "epoch": 3235} {"train_loss": -25.132434844970703, "global_step": 268571, "epoch": 3235} {"train_loss": -25.23247718811035, "global_step": 268572, "epoch": 3235} {"train_loss": -25.459518432617188, "global_step": 268573, "epoch": 3235} {"train_loss": -25.758947372436523, "global_step": 268574, "epoch": 3235} {"train_loss": -25.162343978881836, "global_step": 268575, "epoch": 3235} {"train_loss": -25.620136260986328, "global_step": 268576, "epoch": 3235} {"train_loss": -25.42792320251465, "global_step": 268577, "epoch": 3235} {"train_loss": -25.61001968383789, "global_step": 268578, "epoch": 3235} {"train_loss": -25.21925926208496, "global_step": 268579, "epoch": 3235} {"train_loss": -25.1846923828125, "global_step": 268580, "epoch": 3235} {"train_loss": -24.94930076599121, "global_step": 268581, "epoch": 3235} {"train_loss": -24.68145179748535, "global_step": 268582, "epoch": 3235} {"train_loss": -24.47528648376465, "global_step": 268583, "epoch": 3235} {"train_loss": -24.635562896728516, "global_step": 268584, "epoch": 3235} {"train_loss": -24.888744354248047, "global_step": 268585, "epoch": 3235} {"train_loss": -24.860532760620117, "global_step": 268586, "epoch": 3235} {"train_loss": -25.237614482282154, "global_step": 268587, "epoch": 3235, "val_loss": 7000886.0} {"train_loss": -24.03783416748047, "global_step": 268588, "epoch": 3236} {"train_loss": -24.068418502807617, "global_step": 268589, "epoch": 3236} {"train_loss": -24.223758697509766, "global_step": 268590, "epoch": 3236} {"train_loss": -24.519691467285156, "global_step": 268591, "epoch": 3236} {"train_loss": -24.07749366760254, "global_step": 268592, "epoch": 3236} {"train_loss": -24.379444122314453, "global_step": 268593, "epoch": 3236} {"train_loss": -24.580488204956055, "global_step": 268594, "epoch": 3236} {"train_loss": -24.51153564453125, "global_step": 268595, "epoch": 3236} {"train_loss": -24.277786254882812, "global_step": 268596, "epoch": 3236} {"train_loss": -24.729326248168945, "global_step": 268597, "epoch": 3236} {"train_loss": -24.417478561401367, "global_step": 268598, "epoch": 3236} {"train_loss": -25.040903091430664, "global_step": 268599, "epoch": 3236} {"train_loss": -24.544876098632812, "global_step": 268600, "epoch": 3236} {"train_loss": -24.85422134399414, "global_step": 268601, "epoch": 3236} {"train_loss": -24.602025985717773, "global_step": 268602, "epoch": 3236} {"train_loss": -24.739315032958984, "global_step": 268603, "epoch": 3236} {"train_loss": -24.88661003112793, "global_step": 268604, "epoch": 3236} {"train_loss": -24.537939071655273, "global_step": 268605, "epoch": 3236} {"train_loss": -25.136627197265625, "global_step": 268606, "epoch": 3236} {"train_loss": -25.08293342590332, "global_step": 268607, "epoch": 3236} {"train_loss": -25.00493812561035, "global_step": 268608, "epoch": 3236} {"train_loss": -24.877605438232422, "global_step": 268609, "epoch": 3236} {"train_loss": -24.824087142944336, "global_step": 268610, "epoch": 3236} {"train_loss": -24.8769588470459, "global_step": 268611, "epoch": 3236} {"train_loss": -24.9534969329834, "global_step": 268612, "epoch": 3236} {"train_loss": -24.89431381225586, "global_step": 268613, "epoch": 3236} {"train_loss": -25.012468338012695, "global_step": 268614, "epoch": 3236} {"train_loss": -24.96803855895996, "global_step": 268615, "epoch": 3236} {"train_loss": -25.148048400878906, "global_step": 268616, "epoch": 3236} {"train_loss": -25.00678825378418, "global_step": 268617, "epoch": 3236} {"train_loss": -25.533029556274414, "global_step": 268618, "epoch": 3236} {"train_loss": -25.26532554626465, "global_step": 268619, "epoch": 3236} {"train_loss": -24.97415542602539, "global_step": 268620, "epoch": 3236} {"train_loss": -25.31576156616211, "global_step": 268621, "epoch": 3236} {"train_loss": -25.183454513549805, "global_step": 268622, "epoch": 3236} {"train_loss": -24.89305877685547, "global_step": 268623, "epoch": 3236} {"train_loss": -25.341764450073242, "global_step": 268624, "epoch": 3236} {"train_loss": -25.345169067382812, "global_step": 268625, "epoch": 3236} {"train_loss": -25.096134185791016, "global_step": 268626, "epoch": 3236} {"train_loss": -24.98109245300293, "global_step": 268627, "epoch": 3236} {"train_loss": -25.130842208862305, "global_step": 268628, "epoch": 3236} {"train_loss": -25.392276763916016, "global_step": 268629, "epoch": 3236} {"train_loss": -25.538297653198242, "global_step": 268630, "epoch": 3236} {"train_loss": -25.37390899658203, "global_step": 268631, "epoch": 3236} {"train_loss": -25.210506439208984, "global_step": 268632, "epoch": 3236} {"train_loss": -25.26607322692871, "global_step": 268633, "epoch": 3236} {"train_loss": -25.4543514251709, "global_step": 268634, "epoch": 3236} {"train_loss": -25.282758712768555, "global_step": 268635, "epoch": 3236} {"train_loss": -25.582670211791992, "global_step": 268636, "epoch": 3236} {"train_loss": -25.375511169433594, "global_step": 268637, "epoch": 3236} {"train_loss": -25.472667694091797, "global_step": 268638, "epoch": 3236} {"train_loss": -25.47176170349121, "global_step": 268639, "epoch": 3236} {"train_loss": -25.36556053161621, "global_step": 268640, "epoch": 3236} {"train_loss": -25.445627212524414, "global_step": 268641, "epoch": 3236} {"train_loss": -24.90097427368164, "global_step": 268642, "epoch": 3236} {"train_loss": -24.983911514282227, "global_step": 268643, "epoch": 3236} {"train_loss": -25.25124740600586, "global_step": 268644, "epoch": 3236} {"train_loss": -25.18697738647461, "global_step": 268645, "epoch": 3236} {"train_loss": -25.205957412719727, "global_step": 268646, "epoch": 3236} {"train_loss": -25.662546157836914, "global_step": 268647, "epoch": 3236} {"train_loss": -25.356475830078125, "global_step": 268648, "epoch": 3236} {"train_loss": -25.118261337280273, "global_step": 268649, "epoch": 3236} {"train_loss": -25.27071189880371, "global_step": 268650, "epoch": 3236} {"train_loss": -25.141653060913086, "global_step": 268651, "epoch": 3236} {"train_loss": -25.443496704101562, "global_step": 268652, "epoch": 3236} {"train_loss": -25.34139060974121, "global_step": 268653, "epoch": 3236} {"train_loss": -25.633773803710938, "global_step": 268654, "epoch": 3236} {"train_loss": -25.481657028198242, "global_step": 268655, "epoch": 3236} {"train_loss": -25.349313735961914, "global_step": 268656, "epoch": 3236} {"train_loss": -24.974262237548828, "global_step": 268657, "epoch": 3236} {"train_loss": -25.47431755065918, "global_step": 268658, "epoch": 3236} {"train_loss": -25.288183212280273, "global_step": 268659, "epoch": 3236} {"train_loss": -25.4117488861084, "global_step": 268660, "epoch": 3236} {"train_loss": -24.913602828979492, "global_step": 268661, "epoch": 3236} {"train_loss": -25.354379653930664, "global_step": 268662, "epoch": 3236} {"train_loss": -25.213682174682617, "global_step": 268663, "epoch": 3236} {"train_loss": -25.607772827148438, "global_step": 268664, "epoch": 3236} {"train_loss": -25.439491271972656, "global_step": 268665, "epoch": 3236} {"train_loss": -24.920658111572266, "global_step": 268666, "epoch": 3236} {"train_loss": -25.59486961364746, "global_step": 268667, "epoch": 3236} {"train_loss": -25.22028350830078, "global_step": 268668, "epoch": 3236} {"train_loss": -25.082971572875977, "global_step": 268669, "epoch": 3236} {"train_loss": -25.08541791984834, "global_step": 268670, "epoch": 3236, "val_loss": 6960460.0} {"train_loss": -24.30014991760254, "global_step": 268671, "epoch": 3237} {"train_loss": -24.35053825378418, "global_step": 268672, "epoch": 3237} {"train_loss": -24.859981536865234, "global_step": 268673, "epoch": 3237} {"train_loss": -24.25784683227539, "global_step": 268674, "epoch": 3237} {"train_loss": -24.766199111938477, "global_step": 268675, "epoch": 3237} {"train_loss": -24.391145706176758, "global_step": 268676, "epoch": 3237} {"train_loss": -24.656614303588867, "global_step": 268677, "epoch": 3237} {"train_loss": -24.7414608001709, "global_step": 268678, "epoch": 3237} {"train_loss": -24.620473861694336, "global_step": 268679, "epoch": 3237} {"train_loss": -24.428281784057617, "global_step": 268680, "epoch": 3237} {"train_loss": -24.49696159362793, "global_step": 268681, "epoch": 3237} {"train_loss": -24.153995513916016, "global_step": 268682, "epoch": 3237} {"train_loss": -24.428808212280273, "global_step": 268683, "epoch": 3237} {"train_loss": -24.837892532348633, "global_step": 268684, "epoch": 3237} {"train_loss": -24.734535217285156, "global_step": 268685, "epoch": 3237} {"train_loss": -24.538862228393555, "global_step": 268686, "epoch": 3237} {"train_loss": -24.48482322692871, "global_step": 268687, "epoch": 3237} {"train_loss": -24.90580177307129, "global_step": 268688, "epoch": 3237} {"train_loss": -24.64762306213379, "global_step": 268689, "epoch": 3237} {"train_loss": -24.687551498413086, "global_step": 268690, "epoch": 3237} {"train_loss": -24.6196346282959, "global_step": 268691, "epoch": 3237} {"train_loss": -24.964481353759766, "global_step": 268692, "epoch": 3237} {"train_loss": -24.944196701049805, "global_step": 268693, "epoch": 3237} {"train_loss": -24.74495506286621, "global_step": 268694, "epoch": 3237} {"train_loss": -25.065048217773438, "global_step": 268695, "epoch": 3237} {"train_loss": -25.411256790161133, "global_step": 268696, "epoch": 3237} {"train_loss": -24.91115379333496, "global_step": 268697, "epoch": 3237} {"train_loss": -25.414209365844727, "global_step": 268698, "epoch": 3237} {"train_loss": -24.884374618530273, "global_step": 268699, "epoch": 3237} {"train_loss": -25.55592155456543, "global_step": 268700, "epoch": 3237} {"train_loss": -24.9220027923584, "global_step": 268701, "epoch": 3237} {"train_loss": -25.314193725585938, "global_step": 268702, "epoch": 3237} {"train_loss": -25.306699752807617, "global_step": 268703, "epoch": 3237} {"train_loss": -24.98476219177246, "global_step": 268704, "epoch": 3237} {"train_loss": -25.10420036315918, "global_step": 268705, "epoch": 3237} {"train_loss": -25.239850997924805, "global_step": 268706, "epoch": 3237} {"train_loss": -25.147476196289062, "global_step": 268707, "epoch": 3237} {"train_loss": -25.48316764831543, "global_step": 268708, "epoch": 3237} {"train_loss": -25.429540634155273, "global_step": 268709, "epoch": 3237} {"train_loss": -25.045948028564453, "global_step": 268710, "epoch": 3237} {"train_loss": -25.072725296020508, "global_step": 268711, "epoch": 3237} {"train_loss": -24.72135353088379, "global_step": 268712, "epoch": 3237} {"train_loss": -25.081701278686523, "global_step": 268713, "epoch": 3237} {"train_loss": -25.482749938964844, "global_step": 268714, "epoch": 3237} {"train_loss": -25.37992286682129, "global_step": 268715, "epoch": 3237} {"train_loss": -25.241086959838867, "global_step": 268716, "epoch": 3237} {"train_loss": -25.309162139892578, "global_step": 268717, "epoch": 3237} {"train_loss": -24.8651180267334, "global_step": 268718, "epoch": 3237} {"train_loss": -25.17488670349121, "global_step": 268719, "epoch": 3237} {"train_loss": -24.812660217285156, "global_step": 268720, "epoch": 3237} {"train_loss": -25.5152645111084, "global_step": 268721, "epoch": 3237} {"train_loss": -25.19351577758789, "global_step": 268722, "epoch": 3237} {"train_loss": -25.30085563659668, "global_step": 268723, "epoch": 3237} {"train_loss": -25.534963607788086, "global_step": 268724, "epoch": 3237} {"train_loss": -25.212223052978516, "global_step": 268725, "epoch": 3237} {"train_loss": -25.277740478515625, "global_step": 268726, "epoch": 3237} {"train_loss": -25.373167037963867, "global_step": 268727, "epoch": 3237} {"train_loss": -25.402067184448242, "global_step": 268728, "epoch": 3237} {"train_loss": -25.55378532409668, "global_step": 268729, "epoch": 3237} {"train_loss": -25.570632934570312, "global_step": 268730, "epoch": 3237} {"train_loss": -25.52490234375, "global_step": 268731, "epoch": 3237} {"train_loss": -25.353139877319336, "global_step": 268732, "epoch": 3237} {"train_loss": -25.409276962280273, "global_step": 268733, "epoch": 3237} {"train_loss": -25.46087074279785, "global_step": 268734, "epoch": 3237} {"train_loss": -25.259435653686523, "global_step": 268735, "epoch": 3237} {"train_loss": -25.097074508666992, "global_step": 268736, "epoch": 3237} {"train_loss": -25.29337501525879, "global_step": 268737, "epoch": 3237} {"train_loss": -24.918109893798828, "global_step": 268738, "epoch": 3237} {"train_loss": -25.40943717956543, "global_step": 268739, "epoch": 3237} {"train_loss": -25.20524024963379, "global_step": 268740, "epoch": 3237} {"train_loss": -25.203466415405273, "global_step": 268741, "epoch": 3237} {"train_loss": -25.214475631713867, "global_step": 268742, "epoch": 3237} {"train_loss": -24.990026473999023, "global_step": 268743, "epoch": 3237} {"train_loss": -25.07986831665039, "global_step": 268744, "epoch": 3237} {"train_loss": -25.48061180114746, "global_step": 268745, "epoch": 3237} {"train_loss": -24.825302124023438, "global_step": 268746, "epoch": 3237} {"train_loss": -25.553321838378906, "global_step": 268747, "epoch": 3237} {"train_loss": -25.496646881103516, "global_step": 268748, "epoch": 3237} {"train_loss": -25.167097091674805, "global_step": 268749, "epoch": 3237} {"train_loss": -25.51308250427246, "global_step": 268750, "epoch": 3237} {"train_loss": -25.405771255493164, "global_step": 268751, "epoch": 3237} {"train_loss": -25.028593063354492, "global_step": 268752, "epoch": 3237} {"train_loss": -25.059405499194042, "global_step": 268753, "epoch": 3237, "val_loss": 6975327.0} {"train_loss": -24.634559631347656, "global_step": 268754, "epoch": 3238} {"train_loss": -24.698514938354492, "global_step": 268755, "epoch": 3238} {"train_loss": -24.912235260009766, "global_step": 268756, "epoch": 3238} {"train_loss": -24.678442001342773, "global_step": 268757, "epoch": 3238} {"train_loss": -25.064298629760742, "global_step": 268758, "epoch": 3238} {"train_loss": -25.155134201049805, "global_step": 268759, "epoch": 3238} {"train_loss": -25.052976608276367, "global_step": 268760, "epoch": 3238} {"train_loss": -24.89510154724121, "global_step": 268761, "epoch": 3238} {"train_loss": -24.74515151977539, "global_step": 268762, "epoch": 3238} {"train_loss": -24.72920036315918, "global_step": 268763, "epoch": 3238} {"train_loss": -24.804994583129883, "global_step": 268764, "epoch": 3238} {"train_loss": -25.213302612304688, "global_step": 268765, "epoch": 3238} {"train_loss": -24.81822395324707, "global_step": 268766, "epoch": 3238} {"train_loss": -25.104297637939453, "global_step": 268767, "epoch": 3238} {"train_loss": -25.20435905456543, "global_step": 268768, "epoch": 3238} {"train_loss": -24.796539306640625, "global_step": 268769, "epoch": 3238} {"train_loss": -25.2734317779541, "global_step": 268770, "epoch": 3238} {"train_loss": -25.31668472290039, "global_step": 268771, "epoch": 3238} {"train_loss": -25.10567283630371, "global_step": 268772, "epoch": 3238} {"train_loss": -25.227752685546875, "global_step": 268773, "epoch": 3238} {"train_loss": -25.08754539489746, "global_step": 268774, "epoch": 3238} {"train_loss": -25.21210289001465, "global_step": 268775, "epoch": 3238} {"train_loss": -25.429258346557617, "global_step": 268776, "epoch": 3238} {"train_loss": -25.388431549072266, "global_step": 268777, "epoch": 3238} {"train_loss": -25.25470542907715, "global_step": 268778, "epoch": 3238} {"train_loss": -25.011154174804688, "global_step": 268779, "epoch": 3238} {"train_loss": -25.272558212280273, "global_step": 268780, "epoch": 3238} {"train_loss": -25.401845932006836, "global_step": 268781, "epoch": 3238} {"train_loss": -24.985538482666016, "global_step": 268782, "epoch": 3238} {"train_loss": -25.343847274780273, "global_step": 268783, "epoch": 3238} {"train_loss": -25.37535285949707, "global_step": 268784, "epoch": 3238} {"train_loss": -25.38960838317871, "global_step": 268785, "epoch": 3238} {"train_loss": -25.133941650390625, "global_step": 268786, "epoch": 3238} {"train_loss": -25.259408950805664, "global_step": 268787, "epoch": 3238} {"train_loss": -25.367345809936523, "global_step": 268788, "epoch": 3238} {"train_loss": -25.043136596679688, "global_step": 268789, "epoch": 3238} {"train_loss": -25.31337547302246, "global_step": 268790, "epoch": 3238} {"train_loss": -24.70407485961914, "global_step": 268791, "epoch": 3238} {"train_loss": -25.178773880004883, "global_step": 268792, "epoch": 3238} {"train_loss": -25.294736862182617, "global_step": 268793, "epoch": 3238} {"train_loss": -25.016860961914062, "global_step": 268794, "epoch": 3238} {"train_loss": -25.458024978637695, "global_step": 268795, "epoch": 3238} {"train_loss": -24.938800811767578, "global_step": 268796, "epoch": 3238} {"train_loss": -25.61358642578125, "global_step": 268797, "epoch": 3238} {"train_loss": -24.921188354492188, "global_step": 268798, "epoch": 3238} {"train_loss": -25.738061904907227, "global_step": 268799, "epoch": 3238} {"train_loss": -25.08943748474121, "global_step": 268800, "epoch": 3238} {"train_loss": -25.28253746032715, "global_step": 268801, "epoch": 3238} {"train_loss": -25.299413681030273, "global_step": 268802, "epoch": 3238} {"train_loss": -25.122907638549805, "global_step": 268803, "epoch": 3238} {"train_loss": -25.396547317504883, "global_step": 268804, "epoch": 3238} {"train_loss": -25.279277801513672, "global_step": 268805, "epoch": 3238} {"train_loss": -25.241619110107422, "global_step": 268806, "epoch": 3238} {"train_loss": -25.158103942871094, "global_step": 268807, "epoch": 3238} {"train_loss": -24.955656051635742, "global_step": 268808, "epoch": 3238} {"train_loss": -25.28061294555664, "global_step": 268809, "epoch": 3238} {"train_loss": -25.559789657592773, "global_step": 268810, "epoch": 3238} {"train_loss": -25.09468650817871, "global_step": 268811, "epoch": 3238} {"train_loss": -25.5272159576416, "global_step": 268812, "epoch": 3238} {"train_loss": -25.005279541015625, "global_step": 268813, "epoch": 3238} {"train_loss": -25.388843536376953, "global_step": 268814, "epoch": 3238} {"train_loss": -25.701513290405273, "global_step": 268815, "epoch": 3238} {"train_loss": -25.418964385986328, "global_step": 268816, "epoch": 3238} {"train_loss": -25.367643356323242, "global_step": 268817, "epoch": 3238} {"train_loss": -24.90268898010254, "global_step": 268818, "epoch": 3238} {"train_loss": -25.404829025268555, "global_step": 268819, "epoch": 3238} {"train_loss": -25.44959831237793, "global_step": 268820, "epoch": 3238} {"train_loss": -25.28262710571289, "global_step": 268821, "epoch": 3238} {"train_loss": -25.32769775390625, "global_step": 268822, "epoch": 3238} {"train_loss": -25.332338333129883, "global_step": 268823, "epoch": 3238} {"train_loss": -25.439748764038086, "global_step": 268824, "epoch": 3238} {"train_loss": -25.040855407714844, "global_step": 268825, "epoch": 3238} {"train_loss": -24.941049575805664, "global_step": 268826, "epoch": 3238} {"train_loss": -24.860929489135742, "global_step": 268827, "epoch": 3238} {"train_loss": -25.192485809326172, "global_step": 268828, "epoch": 3238} {"train_loss": -24.96333122253418, "global_step": 268829, "epoch": 3238} {"train_loss": -25.10038185119629, "global_step": 268830, "epoch": 3238} {"train_loss": -25.158496856689453, "global_step": 268831, "epoch": 3238} {"train_loss": -25.199813842773438, "global_step": 268832, "epoch": 3238} {"train_loss": -24.72458267211914, "global_step": 268833, "epoch": 3238} {"train_loss": -25.047752380371094, "global_step": 268834, "epoch": 3238} {"train_loss": -24.946826934814453, "global_step": 268835, "epoch": 3238} {"train_loss": -25.16009383603751, "global_step": 268836, "epoch": 3238, "val_loss": 6997476.0} {"train_loss": -25.28420066833496, "global_step": 268837, "epoch": 3239} {"train_loss": -25.064855575561523, "global_step": 268838, "epoch": 3239} {"train_loss": -24.7972354888916, "global_step": 268839, "epoch": 3239} {"train_loss": -24.949848175048828, "global_step": 268840, "epoch": 3239} {"train_loss": -24.75052261352539, "global_step": 268841, "epoch": 3239} {"train_loss": -24.953737258911133, "global_step": 268842, "epoch": 3239} {"train_loss": -24.794361114501953, "global_step": 268843, "epoch": 3239} {"train_loss": -24.900136947631836, "global_step": 268844, "epoch": 3239} {"train_loss": -24.476987838745117, "global_step": 268845, "epoch": 3239} {"train_loss": -25.10812759399414, "global_step": 268846, "epoch": 3239} {"train_loss": -24.73098373413086, "global_step": 268847, "epoch": 3239} {"train_loss": -24.87618637084961, "global_step": 268848, "epoch": 3239} {"train_loss": -25.262454986572266, "global_step": 268849, "epoch": 3239} {"train_loss": -24.7667293548584, "global_step": 268850, "epoch": 3239} {"train_loss": -25.119842529296875, "global_step": 268851, "epoch": 3239} {"train_loss": -25.036212921142578, "global_step": 268852, "epoch": 3239} {"train_loss": -25.06558609008789, "global_step": 268853, "epoch": 3239} {"train_loss": -25.30352783203125, "global_step": 268854, "epoch": 3239} {"train_loss": -25.293554306030273, "global_step": 268855, "epoch": 3239} {"train_loss": -25.07539176940918, "global_step": 268856, "epoch": 3239} {"train_loss": -25.035175323486328, "global_step": 268857, "epoch": 3239} {"train_loss": -24.967031478881836, "global_step": 268858, "epoch": 3239} {"train_loss": -25.58089256286621, "global_step": 268859, "epoch": 3239} {"train_loss": -25.213911056518555, "global_step": 268860, "epoch": 3239} {"train_loss": -25.226255416870117, "global_step": 268861, "epoch": 3239} {"train_loss": -24.945404052734375, "global_step": 268862, "epoch": 3239} {"train_loss": -25.240869522094727, "global_step": 268863, "epoch": 3239} {"train_loss": -24.85959815979004, "global_step": 268864, "epoch": 3239} {"train_loss": -24.86106300354004, "global_step": 268865, "epoch": 3239} {"train_loss": -25.650800704956055, "global_step": 268866, "epoch": 3239} {"train_loss": -25.066923141479492, "global_step": 268867, "epoch": 3239} {"train_loss": -25.3075008392334, "global_step": 268868, "epoch": 3239} {"train_loss": -25.198793411254883, "global_step": 268869, "epoch": 3239} {"train_loss": -25.413068771362305, "global_step": 268870, "epoch": 3239} {"train_loss": -25.21238899230957, "global_step": 268871, "epoch": 3239} {"train_loss": -25.452451705932617, "global_step": 268872, "epoch": 3239} {"train_loss": -25.75702476501465, "global_step": 268873, "epoch": 3239} {"train_loss": -25.621301651000977, "global_step": 268874, "epoch": 3239} {"train_loss": -25.442960739135742, "global_step": 268875, "epoch": 3239} {"train_loss": -25.311063766479492, "global_step": 268876, "epoch": 3239} {"train_loss": -25.055267333984375, "global_step": 268877, "epoch": 3239} {"train_loss": -25.0400333404541, "global_step": 268878, "epoch": 3239} {"train_loss": -25.218740463256836, "global_step": 268879, "epoch": 3239} {"train_loss": -25.2052059173584, "global_step": 268880, "epoch": 3239} {"train_loss": -24.96478843688965, "global_step": 268881, "epoch": 3239} {"train_loss": -24.84372901916504, "global_step": 268882, "epoch": 3239} {"train_loss": -24.71623420715332, "global_step": 268883, "epoch": 3239} {"train_loss": -25.283203125, "global_step": 268884, "epoch": 3239} {"train_loss": -25.205869674682617, "global_step": 268885, "epoch": 3239} {"train_loss": -25.372037887573242, "global_step": 268886, "epoch": 3239} {"train_loss": -25.161489486694336, "global_step": 268887, "epoch": 3239} {"train_loss": -25.07387351989746, "global_step": 268888, "epoch": 3239} {"train_loss": -24.94496726989746, "global_step": 268889, "epoch": 3239} {"train_loss": -25.271520614624023, "global_step": 268890, "epoch": 3239} {"train_loss": -25.332731246948242, "global_step": 268891, "epoch": 3239} {"train_loss": -25.317481994628906, "global_step": 268892, "epoch": 3239} {"train_loss": -25.01876449584961, "global_step": 268893, "epoch": 3239} {"train_loss": -25.028339385986328, "global_step": 268894, "epoch": 3239} {"train_loss": -25.14488410949707, "global_step": 268895, "epoch": 3239} {"train_loss": -24.883962631225586, "global_step": 268896, "epoch": 3239} {"train_loss": -25.432907104492188, "global_step": 268897, "epoch": 3239} {"train_loss": -24.994739532470703, "global_step": 268898, "epoch": 3239} {"train_loss": -25.02088737487793, "global_step": 268899, "epoch": 3239} {"train_loss": -25.35076141357422, "global_step": 268900, "epoch": 3239} {"train_loss": -25.481353759765625, "global_step": 268901, "epoch": 3239} {"train_loss": -25.250144958496094, "global_step": 268902, "epoch": 3239} {"train_loss": -25.06926918029785, "global_step": 268903, "epoch": 3239} {"train_loss": -25.26093101501465, "global_step": 268904, "epoch": 3239} {"train_loss": -25.121389389038086, "global_step": 268905, "epoch": 3239} {"train_loss": -25.64839744567871, "global_step": 268906, "epoch": 3239} {"train_loss": -25.24056053161621, "global_step": 268907, "epoch": 3239} {"train_loss": -24.99178123474121, "global_step": 268908, "epoch": 3239} {"train_loss": -25.327468872070312, "global_step": 268909, "epoch": 3239} {"train_loss": -25.51666259765625, "global_step": 268910, "epoch": 3239} {"train_loss": -25.463590621948242, "global_step": 268911, "epoch": 3239} {"train_loss": -25.29241943359375, "global_step": 268912, "epoch": 3239} {"train_loss": -25.396703720092773, "global_step": 268913, "epoch": 3239} {"train_loss": -25.279891967773438, "global_step": 268914, "epoch": 3239} {"train_loss": -25.298450469970703, "global_step": 268915, "epoch": 3239} {"train_loss": -25.565187454223633, "global_step": 268916, "epoch": 3239} {"train_loss": -25.359882354736328, "global_step": 268917, "epoch": 3239} {"train_loss": -25.132959365844727, "global_step": 268918, "epoch": 3239} {"train_loss": -25.161037468048463, "global_step": 268919, "epoch": 3239, "val_loss": 6977365.0} {"train_loss": -24.180395126342773, "global_step": 268920, "epoch": 3240} {"train_loss": -23.696701049804688, "global_step": 268921, "epoch": 3240} {"train_loss": -23.954830169677734, "global_step": 268922, "epoch": 3240} {"train_loss": -24.190217971801758, "global_step": 268923, "epoch": 3240} {"train_loss": -24.9024715423584, "global_step": 268924, "epoch": 3240} {"train_loss": -24.585256576538086, "global_step": 268925, "epoch": 3240} {"train_loss": -24.74781608581543, "global_step": 268926, "epoch": 3240} {"train_loss": -24.96235466003418, "global_step": 268927, "epoch": 3240} {"train_loss": -24.517698287963867, "global_step": 268928, "epoch": 3240} {"train_loss": -24.782751083374023, "global_step": 268929, "epoch": 3240} {"train_loss": -25.081884384155273, "global_step": 268930, "epoch": 3240} {"train_loss": -24.68440818786621, "global_step": 268931, "epoch": 3240} {"train_loss": -24.99373435974121, "global_step": 268932, "epoch": 3240} {"train_loss": -25.323999404907227, "global_step": 268933, "epoch": 3240} {"train_loss": -25.214969635009766, "global_step": 268934, "epoch": 3240} {"train_loss": -24.84266471862793, "global_step": 268935, "epoch": 3240} {"train_loss": -24.928550720214844, "global_step": 268936, "epoch": 3240} {"train_loss": -25.250457763671875, "global_step": 268937, "epoch": 3240} {"train_loss": -25.25986671447754, "global_step": 268938, "epoch": 3240} {"train_loss": -25.01142692565918, "global_step": 268939, "epoch": 3240} {"train_loss": -25.03795623779297, "global_step": 268940, "epoch": 3240} {"train_loss": -25.303110122680664, "global_step": 268941, "epoch": 3240} {"train_loss": -24.97635269165039, "global_step": 268942, "epoch": 3240} {"train_loss": -24.92592430114746, "global_step": 268943, "epoch": 3240} {"train_loss": -25.01753044128418, "global_step": 268944, "epoch": 3240} {"train_loss": -25.53363609313965, "global_step": 268945, "epoch": 3240} {"train_loss": -25.582462310791016, "global_step": 268946, "epoch": 3240} {"train_loss": -25.15778923034668, "global_step": 268947, "epoch": 3240} {"train_loss": -25.032407760620117, "global_step": 268948, "epoch": 3240} {"train_loss": -25.521238327026367, "global_step": 268949, "epoch": 3240} {"train_loss": -25.26313591003418, "global_step": 268950, "epoch": 3240} {"train_loss": -25.18899917602539, "global_step": 268951, "epoch": 3240} {"train_loss": -25.20240592956543, "global_step": 268952, "epoch": 3240} {"train_loss": -25.271482467651367, "global_step": 268953, "epoch": 3240} {"train_loss": -25.21840476989746, "global_step": 268954, "epoch": 3240} {"train_loss": -25.089523315429688, "global_step": 268955, "epoch": 3240} {"train_loss": -25.375822067260742, "global_step": 268956, "epoch": 3240} {"train_loss": -25.15561866760254, "global_step": 268957, "epoch": 3240} {"train_loss": -25.553081512451172, "global_step": 268958, "epoch": 3240} {"train_loss": -25.199129104614258, "global_step": 268959, "epoch": 3240} {"train_loss": -25.279071807861328, "global_step": 268960, "epoch": 3240} {"train_loss": -25.292938232421875, "global_step": 268961, "epoch": 3240} {"train_loss": -25.59540367126465, "global_step": 268962, "epoch": 3240} {"train_loss": -25.46302604675293, "global_step": 268963, "epoch": 3240} {"train_loss": -25.187095642089844, "global_step": 268964, "epoch": 3240} {"train_loss": -25.16132164001465, "global_step": 268965, "epoch": 3240} {"train_loss": -25.541166305541992, "global_step": 268966, "epoch": 3240} {"train_loss": -25.608203887939453, "global_step": 268967, "epoch": 3240} {"train_loss": -25.544696807861328, "global_step": 268968, "epoch": 3240} {"train_loss": -25.221572875976562, "global_step": 268969, "epoch": 3240} {"train_loss": -25.049423217773438, "global_step": 268970, "epoch": 3240} {"train_loss": -25.768142700195312, "global_step": 268971, "epoch": 3240} {"train_loss": -25.321796417236328, "global_step": 268972, "epoch": 3240} {"train_loss": -25.49921226501465, "global_step": 268973, "epoch": 3240} {"train_loss": -25.362625122070312, "global_step": 268974, "epoch": 3240} {"train_loss": -24.919906616210938, "global_step": 268975, "epoch": 3240} {"train_loss": -25.283395767211914, "global_step": 268976, "epoch": 3240} {"train_loss": -25.105867385864258, "global_step": 268977, "epoch": 3240} {"train_loss": -25.197635650634766, "global_step": 268978, "epoch": 3240} {"train_loss": -25.20124626159668, "global_step": 268979, "epoch": 3240} {"train_loss": -25.36163330078125, "global_step": 268980, "epoch": 3240} {"train_loss": -25.447315216064453, "global_step": 268981, "epoch": 3240} {"train_loss": -25.28081703186035, "global_step": 268982, "epoch": 3240} {"train_loss": -25.102033615112305, "global_step": 268983, "epoch": 3240} {"train_loss": -25.4047908782959, "global_step": 268984, "epoch": 3240} {"train_loss": -25.653156280517578, "global_step": 268985, "epoch": 3240} {"train_loss": -25.468223571777344, "global_step": 268986, "epoch": 3240} {"train_loss": -25.492115020751953, "global_step": 268987, "epoch": 3240} {"train_loss": -25.589561462402344, "global_step": 268988, "epoch": 3240} {"train_loss": -25.486013412475586, "global_step": 268989, "epoch": 3240} {"train_loss": -25.562986373901367, "global_step": 268990, "epoch": 3240} {"train_loss": -25.269506454467773, "global_step": 268991, "epoch": 3240} {"train_loss": -25.43043327331543, "global_step": 268992, "epoch": 3240} {"train_loss": -25.36809730529785, "global_step": 268993, "epoch": 3240} {"train_loss": -25.324832916259766, "global_step": 268994, "epoch": 3240} {"train_loss": -25.364755630493164, "global_step": 268995, "epoch": 3240} {"train_loss": -25.244054794311523, "global_step": 268996, "epoch": 3240} {"train_loss": -25.451704025268555, "global_step": 268997, "epoch": 3240} {"train_loss": -25.44997215270996, "global_step": 268998, "epoch": 3240} {"train_loss": -25.628503799438477, "global_step": 268999, "epoch": 3240} {"train_loss": -25.2062931060791, "global_step": 269000, "epoch": 3240} {"train_loss": -25.42242431640625, "global_step": 269001, "epoch": 3240} {"train_loss": -25.191187916031804, "global_step": 269002, "epoch": 3240, "val_loss": 6928945.0} {"train_loss": -24.57583999633789, "global_step": 269003, "epoch": 3241} {"train_loss": -24.572492599487305, "global_step": 269004, "epoch": 3241} {"train_loss": -23.543840408325195, "global_step": 269005, "epoch": 3241} {"train_loss": -24.60637664794922, "global_step": 269006, "epoch": 3241} {"train_loss": -24.9899959564209, "global_step": 269007, "epoch": 3241} {"train_loss": -24.857969284057617, "global_step": 269008, "epoch": 3241} {"train_loss": -24.81003189086914, "global_step": 269009, "epoch": 3241} {"train_loss": -24.813230514526367, "global_step": 269010, "epoch": 3241} {"train_loss": -25.251922607421875, "global_step": 269011, "epoch": 3241} {"train_loss": -25.02860450744629, "global_step": 269012, "epoch": 3241} {"train_loss": -24.83262062072754, "global_step": 269013, "epoch": 3241} {"train_loss": -24.93784523010254, "global_step": 269014, "epoch": 3241} {"train_loss": -25.240854263305664, "global_step": 269015, "epoch": 3241} {"train_loss": -25.085617065429688, "global_step": 269016, "epoch": 3241} {"train_loss": -24.571863174438477, "global_step": 269017, "epoch": 3241} {"train_loss": -24.506818771362305, "global_step": 269018, "epoch": 3241} {"train_loss": -24.813419342041016, "global_step": 269019, "epoch": 3241} {"train_loss": -25.033445358276367, "global_step": 269020, "epoch": 3241} {"train_loss": -25.345443725585938, "global_step": 269021, "epoch": 3241} {"train_loss": -25.141197204589844, "global_step": 269022, "epoch": 3241} {"train_loss": -25.44521141052246, "global_step": 269023, "epoch": 3241} {"train_loss": -24.846755981445312, "global_step": 269024, "epoch": 3241} {"train_loss": -24.89801597595215, "global_step": 269025, "epoch": 3241} {"train_loss": -25.284879684448242, "global_step": 269026, "epoch": 3241} {"train_loss": -25.17378044128418, "global_step": 269027, "epoch": 3241} {"train_loss": -25.19978904724121, "global_step": 269028, "epoch": 3241} {"train_loss": -25.248624801635742, "global_step": 269029, "epoch": 3241} {"train_loss": -25.198089599609375, "global_step": 269030, "epoch": 3241} {"train_loss": -25.438207626342773, "global_step": 269031, "epoch": 3241} {"train_loss": -25.175424575805664, "global_step": 269032, "epoch": 3241} {"train_loss": -25.32758331298828, "global_step": 269033, "epoch": 3241} {"train_loss": -25.82935905456543, "global_step": 269034, "epoch": 3241} {"train_loss": -25.6668643951416, "global_step": 269035, "epoch": 3241} {"train_loss": -25.35833740234375, "global_step": 269036, "epoch": 3241} {"train_loss": -25.077884674072266, "global_step": 269037, "epoch": 3241} {"train_loss": -25.403751373291016, "global_step": 269038, "epoch": 3241} {"train_loss": -25.478168487548828, "global_step": 269039, "epoch": 3241} {"train_loss": -25.30391502380371, "global_step": 269040, "epoch": 3241} {"train_loss": -25.19149398803711, "global_step": 269041, "epoch": 3241} {"train_loss": -25.271947860717773, "global_step": 269042, "epoch": 3241} {"train_loss": -25.156185150146484, "global_step": 269043, "epoch": 3241} {"train_loss": -25.284290313720703, "global_step": 269044, "epoch": 3241} {"train_loss": -25.36669158935547, "global_step": 269045, "epoch": 3241} {"train_loss": -25.160818099975586, "global_step": 269046, "epoch": 3241} {"train_loss": -25.321195602416992, "global_step": 269047, "epoch": 3241} {"train_loss": -25.23405647277832, "global_step": 269048, "epoch": 3241} {"train_loss": -25.081871032714844, "global_step": 269049, "epoch": 3241} {"train_loss": -25.40598487854004, "global_step": 269050, "epoch": 3241} {"train_loss": -25.15214729309082, "global_step": 269051, "epoch": 3241} {"train_loss": -24.829158782958984, "global_step": 269052, "epoch": 3241} {"train_loss": -25.16294288635254, "global_step": 269053, "epoch": 3241} {"train_loss": -25.04638671875, "global_step": 269054, "epoch": 3241} {"train_loss": -25.195341110229492, "global_step": 269055, "epoch": 3241} {"train_loss": -25.116796493530273, "global_step": 269056, "epoch": 3241} {"train_loss": -25.102462768554688, "global_step": 269057, "epoch": 3241} {"train_loss": -25.25019645690918, "global_step": 269058, "epoch": 3241} {"train_loss": -25.212697982788086, "global_step": 269059, "epoch": 3241} {"train_loss": -25.2332763671875, "global_step": 269060, "epoch": 3241} {"train_loss": -25.319326400756836, "global_step": 269061, "epoch": 3241} {"train_loss": -25.47559928894043, "global_step": 269062, "epoch": 3241} {"train_loss": -24.922216415405273, "global_step": 269063, "epoch": 3241} {"train_loss": -25.269628524780273, "global_step": 269064, "epoch": 3241} {"train_loss": -25.33753776550293, "global_step": 269065, "epoch": 3241} {"train_loss": -25.40875816345215, "global_step": 269066, "epoch": 3241} {"train_loss": -25.18320655822754, "global_step": 269067, "epoch": 3241} {"train_loss": -25.27225685119629, "global_step": 269068, "epoch": 3241} {"train_loss": -25.34783935546875, "global_step": 269069, "epoch": 3241} {"train_loss": -25.386381149291992, "global_step": 269070, "epoch": 3241} {"train_loss": -25.381851196289062, "global_step": 269071, "epoch": 3241} {"train_loss": -25.68756675720215, "global_step": 269072, "epoch": 3241} {"train_loss": -25.402618408203125, "global_step": 269073, "epoch": 3241} {"train_loss": -25.2016658782959, "global_step": 269074, "epoch": 3241} {"train_loss": -25.413311004638672, "global_step": 269075, "epoch": 3241} {"train_loss": -25.542203903198242, "global_step": 269076, "epoch": 3241} {"train_loss": -25.403919219970703, "global_step": 269077, "epoch": 3241} {"train_loss": -25.38142967224121, "global_step": 269078, "epoch": 3241} {"train_loss": -25.461217880249023, "global_step": 269079, "epoch": 3241} {"train_loss": -25.711700439453125, "global_step": 269080, "epoch": 3241} {"train_loss": -25.314048767089844, "global_step": 269081, "epoch": 3241} {"train_loss": -25.229406356811523, "global_step": 269082, "epoch": 3241} {"train_loss": -24.824613571166992, "global_step": 269083, "epoch": 3241} {"train_loss": -25.397323608398438, "global_step": 269084, "epoch": 3241} {"train_loss": -25.16163977657456, "global_step": 269085, "epoch": 3241, "val_loss": 6904433.0} {"train_loss": -24.70222282409668, "global_step": 269086, "epoch": 3242} {"train_loss": -24.36088752746582, "global_step": 269087, "epoch": 3242} {"train_loss": -24.077041625976562, "global_step": 269088, "epoch": 3242} {"train_loss": -24.344106674194336, "global_step": 269089, "epoch": 3242} {"train_loss": -25.165481567382812, "global_step": 269090, "epoch": 3242} {"train_loss": -24.654144287109375, "global_step": 269091, "epoch": 3242} {"train_loss": -24.68390464782715, "global_step": 269092, "epoch": 3242} {"train_loss": -24.590301513671875, "global_step": 269093, "epoch": 3242} {"train_loss": -25.04034423828125, "global_step": 269094, "epoch": 3242} {"train_loss": -24.788516998291016, "global_step": 269095, "epoch": 3242} {"train_loss": -24.719745635986328, "global_step": 269096, "epoch": 3242} {"train_loss": -25.116939544677734, "global_step": 269097, "epoch": 3242} {"train_loss": -24.77066421508789, "global_step": 269098, "epoch": 3242} {"train_loss": -24.86293601989746, "global_step": 269099, "epoch": 3242} {"train_loss": -24.9393367767334, "global_step": 269100, "epoch": 3242} {"train_loss": -25.448511123657227, "global_step": 269101, "epoch": 3242} {"train_loss": -25.007640838623047, "global_step": 269102, "epoch": 3242} {"train_loss": -25.02424430847168, "global_step": 269103, "epoch": 3242} {"train_loss": -25.123226165771484, "global_step": 269104, "epoch": 3242} {"train_loss": -25.114500045776367, "global_step": 269105, "epoch": 3242} {"train_loss": -25.04317283630371, "global_step": 269106, "epoch": 3242} {"train_loss": -25.366838455200195, "global_step": 269107, "epoch": 3242} {"train_loss": -24.97235679626465, "global_step": 269108, "epoch": 3242} {"train_loss": -25.173337936401367, "global_step": 269109, "epoch": 3242} {"train_loss": -25.253250122070312, "global_step": 269110, "epoch": 3242} {"train_loss": -25.1666202545166, "global_step": 269111, "epoch": 3242} {"train_loss": -25.324430465698242, "global_step": 269112, "epoch": 3242} {"train_loss": -24.906991958618164, "global_step": 269113, "epoch": 3242} {"train_loss": -25.22014808654785, "global_step": 269114, "epoch": 3242} {"train_loss": -25.421337127685547, "global_step": 269115, "epoch": 3242} {"train_loss": -25.40032196044922, "global_step": 269116, "epoch": 3242} {"train_loss": -25.31352996826172, "global_step": 269117, "epoch": 3242} {"train_loss": -25.117067337036133, "global_step": 269118, "epoch": 3242} {"train_loss": -25.031700134277344, "global_step": 269119, "epoch": 3242} {"train_loss": -25.345947265625, "global_step": 269120, "epoch": 3242} {"train_loss": -25.0457763671875, "global_step": 269121, "epoch": 3242} {"train_loss": -25.77097511291504, "global_step": 269122, "epoch": 3242} {"train_loss": -25.36775779724121, "global_step": 269123, "epoch": 3242} {"train_loss": -25.14113426208496, "global_step": 269124, "epoch": 3242} {"train_loss": -25.33797264099121, "global_step": 269125, "epoch": 3242} {"train_loss": -25.303489685058594, "global_step": 269126, "epoch": 3242} {"train_loss": -24.629810333251953, "global_step": 269127, "epoch": 3242} {"train_loss": -25.307294845581055, "global_step": 269128, "epoch": 3242} {"train_loss": -25.33087730407715, "global_step": 269129, "epoch": 3242} {"train_loss": -25.2183895111084, "global_step": 269130, "epoch": 3242} {"train_loss": -25.374191284179688, "global_step": 269131, "epoch": 3242} {"train_loss": -25.39525604248047, "global_step": 269132, "epoch": 3242} {"train_loss": -25.436508178710938, "global_step": 269133, "epoch": 3242} {"train_loss": -25.345914840698242, "global_step": 269134, "epoch": 3242} {"train_loss": -25.526241302490234, "global_step": 269135, "epoch": 3242} {"train_loss": -25.377117156982422, "global_step": 269136, "epoch": 3242} {"train_loss": -25.349872589111328, "global_step": 269137, "epoch": 3242} {"train_loss": -25.380130767822266, "global_step": 269138, "epoch": 3242} {"train_loss": -25.332748413085938, "global_step": 269139, "epoch": 3242} {"train_loss": -25.338104248046875, "global_step": 269140, "epoch": 3242} {"train_loss": -25.31888771057129, "global_step": 269141, "epoch": 3242} {"train_loss": -25.216876983642578, "global_step": 269142, "epoch": 3242} {"train_loss": -25.588895797729492, "global_step": 269143, "epoch": 3242} {"train_loss": -25.128387451171875, "global_step": 269144, "epoch": 3242} {"train_loss": -25.831439971923828, "global_step": 269145, "epoch": 3242} {"train_loss": -25.306360244750977, "global_step": 269146, "epoch": 3242} {"train_loss": -24.942750930786133, "global_step": 269147, "epoch": 3242} {"train_loss": -25.226516723632812, "global_step": 269148, "epoch": 3242} {"train_loss": -25.199481964111328, "global_step": 269149, "epoch": 3242} {"train_loss": -24.95904541015625, "global_step": 269150, "epoch": 3242} {"train_loss": -25.410062789916992, "global_step": 269151, "epoch": 3242} {"train_loss": -25.326982498168945, "global_step": 269152, "epoch": 3242} {"train_loss": -25.474489212036133, "global_step": 269153, "epoch": 3242} {"train_loss": -25.13400650024414, "global_step": 269154, "epoch": 3242} {"train_loss": -25.011245727539062, "global_step": 269155, "epoch": 3242} {"train_loss": -25.194501876831055, "global_step": 269156, "epoch": 3242} {"train_loss": -25.495105743408203, "global_step": 269157, "epoch": 3242} {"train_loss": -25.425540924072266, "global_step": 269158, "epoch": 3242} {"train_loss": -25.452566146850586, "global_step": 269159, "epoch": 3242} {"train_loss": -25.440383911132812, "global_step": 269160, "epoch": 3242} {"train_loss": -25.257286071777344, "global_step": 269161, "epoch": 3242} {"train_loss": -25.3193416595459, "global_step": 269162, "epoch": 3242} {"train_loss": -25.78375244140625, "global_step": 269163, "epoch": 3242} {"train_loss": -25.7061824798584, "global_step": 269164, "epoch": 3242} {"train_loss": -25.189483642578125, "global_step": 269165, "epoch": 3242} {"train_loss": -25.332843780517578, "global_step": 269166, "epoch": 3242} {"train_loss": -25.034208297729492, "global_step": 269167, "epoch": 3242} {"train_loss": -25.183790390750012, "global_step": 269168, "epoch": 3242, "val_loss": 6915023.0} {"train_loss": -25.17831039428711, "global_step": 269169, "epoch": 3243} {"train_loss": -24.88796043395996, "global_step": 269170, "epoch": 3243} {"train_loss": -24.808435440063477, "global_step": 269171, "epoch": 3243} {"train_loss": -25.06691551208496, "global_step": 269172, "epoch": 3243} {"train_loss": -24.899145126342773, "global_step": 269173, "epoch": 3243} {"train_loss": -25.046924591064453, "global_step": 269174, "epoch": 3243} {"train_loss": -25.0662841796875, "global_step": 269175, "epoch": 3243} {"train_loss": -24.758344650268555, "global_step": 269176, "epoch": 3243} {"train_loss": -25.462427139282227, "global_step": 269177, "epoch": 3243} {"train_loss": -24.591093063354492, "global_step": 269178, "epoch": 3243} {"train_loss": -25.107181549072266, "global_step": 269179, "epoch": 3243} {"train_loss": -24.917831420898438, "global_step": 269180, "epoch": 3243} {"train_loss": -25.027618408203125, "global_step": 269181, "epoch": 3243} {"train_loss": -25.33375358581543, "global_step": 269182, "epoch": 3243} {"train_loss": -24.881132125854492, "global_step": 269183, "epoch": 3243} {"train_loss": -24.723337173461914, "global_step": 269184, "epoch": 3243} {"train_loss": -25.571247100830078, "global_step": 269185, "epoch": 3243} {"train_loss": -25.448484420776367, "global_step": 269186, "epoch": 3243} {"train_loss": -25.194128036499023, "global_step": 269187, "epoch": 3243} {"train_loss": -25.49297523498535, "global_step": 269188, "epoch": 3243} {"train_loss": -25.344022750854492, "global_step": 269189, "epoch": 3243} {"train_loss": -25.400604248046875, "global_step": 269190, "epoch": 3243} {"train_loss": -25.507299423217773, "global_step": 269191, "epoch": 3243} {"train_loss": -25.122669219970703, "global_step": 269192, "epoch": 3243} {"train_loss": -25.377866744995117, "global_step": 269193, "epoch": 3243} {"train_loss": -25.005050659179688, "global_step": 269194, "epoch": 3243} {"train_loss": -25.08107566833496, "global_step": 269195, "epoch": 3243} {"train_loss": -25.09686851501465, "global_step": 269196, "epoch": 3243} {"train_loss": -25.32338523864746, "global_step": 269197, "epoch": 3243} {"train_loss": -25.307165145874023, "global_step": 269198, "epoch": 3243} {"train_loss": -24.964908599853516, "global_step": 269199, "epoch": 3243} {"train_loss": -24.796911239624023, "global_step": 269200, "epoch": 3243} {"train_loss": -25.37574005126953, "global_step": 269201, "epoch": 3243} {"train_loss": -24.78400230407715, "global_step": 269202, "epoch": 3243} {"train_loss": -25.004682540893555, "global_step": 269203, "epoch": 3243} {"train_loss": -25.3574161529541, "global_step": 269204, "epoch": 3243} {"train_loss": -25.069629669189453, "global_step": 269205, "epoch": 3243} {"train_loss": -25.18938446044922, "global_step": 269206, "epoch": 3243} {"train_loss": -25.507190704345703, "global_step": 269207, "epoch": 3243} {"train_loss": -25.46272850036621, "global_step": 269208, "epoch": 3243} {"train_loss": -24.954288482666016, "global_step": 269209, "epoch": 3243} {"train_loss": -25.493343353271484, "global_step": 269210, "epoch": 3243} {"train_loss": -25.41977310180664, "global_step": 269211, "epoch": 3243} {"train_loss": -25.186298370361328, "global_step": 269212, "epoch": 3243} {"train_loss": -25.510482788085938, "global_step": 269213, "epoch": 3243} {"train_loss": -25.394506454467773, "global_step": 269214, "epoch": 3243} {"train_loss": -25.516324996948242, "global_step": 269215, "epoch": 3243} {"train_loss": -25.206064224243164, "global_step": 269216, "epoch": 3243} {"train_loss": -25.767175674438477, "global_step": 269217, "epoch": 3243} {"train_loss": -25.718069076538086, "global_step": 269218, "epoch": 3243} {"train_loss": -25.54652214050293, "global_step": 269219, "epoch": 3243} {"train_loss": -25.65046501159668, "global_step": 269220, "epoch": 3243} {"train_loss": -25.28131675720215, "global_step": 269221, "epoch": 3243} {"train_loss": -25.637100219726562, "global_step": 269222, "epoch": 3243} {"train_loss": -25.244319915771484, "global_step": 269223, "epoch": 3243} {"train_loss": -25.3387393951416, "global_step": 269224, "epoch": 3243} {"train_loss": -25.208097457885742, "global_step": 269225, "epoch": 3243} {"train_loss": -25.514785766601562, "global_step": 269226, "epoch": 3243} {"train_loss": -25.34453010559082, "global_step": 269227, "epoch": 3243} {"train_loss": -25.161846160888672, "global_step": 269228, "epoch": 3243} {"train_loss": -25.36164665222168, "global_step": 269229, "epoch": 3243} {"train_loss": -25.322402954101562, "global_step": 269230, "epoch": 3243} {"train_loss": -25.382301330566406, "global_step": 269231, "epoch": 3243} {"train_loss": -25.52151107788086, "global_step": 269232, "epoch": 3243} {"train_loss": -25.4066162109375, "global_step": 269233, "epoch": 3243} {"train_loss": -25.522401809692383, "global_step": 269234, "epoch": 3243} {"train_loss": -25.094663619995117, "global_step": 269235, "epoch": 3243} {"train_loss": -25.62532615661621, "global_step": 269236, "epoch": 3243} {"train_loss": -25.094831466674805, "global_step": 269237, "epoch": 3243} {"train_loss": -25.749109268188477, "global_step": 269238, "epoch": 3243} {"train_loss": -25.416980743408203, "global_step": 269239, "epoch": 3243} {"train_loss": -25.119098663330078, "global_step": 269240, "epoch": 3243} {"train_loss": -25.277616500854492, "global_step": 269241, "epoch": 3243} {"train_loss": -25.014545440673828, "global_step": 269242, "epoch": 3243} {"train_loss": -25.00392723083496, "global_step": 269243, "epoch": 3243} {"train_loss": -24.9963436126709, "global_step": 269244, "epoch": 3243} {"train_loss": -25.45856285095215, "global_step": 269245, "epoch": 3243} {"train_loss": -25.124187469482422, "global_step": 269246, "epoch": 3243} {"train_loss": -25.000242233276367, "global_step": 269247, "epoch": 3243} {"train_loss": -25.19379425048828, "global_step": 269248, "epoch": 3243} {"train_loss": -25.353702545166016, "global_step": 269249, "epoch": 3243} {"train_loss": -25.01983642578125, "global_step": 269250, "epoch": 3243} {"train_loss": -25.23034222154732, "global_step": 269251, "epoch": 3243, "val_loss": 7064673.0} {"train_loss": -24.828378677368164, "global_step": 269252, "epoch": 3244} {"train_loss": -24.162307739257812, "global_step": 269253, "epoch": 3244} {"train_loss": -24.724924087524414, "global_step": 269254, "epoch": 3244} {"train_loss": -24.509145736694336, "global_step": 269255, "epoch": 3244} {"train_loss": -24.23381233215332, "global_step": 269256, "epoch": 3244} {"train_loss": -24.91061782836914, "global_step": 269257, "epoch": 3244} {"train_loss": -24.46614646911621, "global_step": 269258, "epoch": 3244} {"train_loss": -24.82594871520996, "global_step": 269259, "epoch": 3244} {"train_loss": -24.415637969970703, "global_step": 269260, "epoch": 3244} {"train_loss": -24.808761596679688, "global_step": 269261, "epoch": 3244} {"train_loss": -25.026996612548828, "global_step": 269262, "epoch": 3244} {"train_loss": -24.932519912719727, "global_step": 269263, "epoch": 3244} {"train_loss": -25.072158813476562, "global_step": 269264, "epoch": 3244} {"train_loss": -24.941205978393555, "global_step": 269265, "epoch": 3244} {"train_loss": -24.903732299804688, "global_step": 269266, "epoch": 3244} {"train_loss": -25.375944137573242, "global_step": 269267, "epoch": 3244} {"train_loss": -24.896982192993164, "global_step": 269268, "epoch": 3244} {"train_loss": -24.882883071899414, "global_step": 269269, "epoch": 3244} {"train_loss": -24.89374351501465, "global_step": 269270, "epoch": 3244} {"train_loss": -25.07611846923828, "global_step": 269271, "epoch": 3244} {"train_loss": -25.105947494506836, "global_step": 269272, "epoch": 3244} {"train_loss": -25.073335647583008, "global_step": 269273, "epoch": 3244} {"train_loss": -25.095216751098633, "global_step": 269274, "epoch": 3244} {"train_loss": -25.372352600097656, "global_step": 269275, "epoch": 3244} {"train_loss": -24.96148681640625, "global_step": 269276, "epoch": 3244} {"train_loss": -25.335317611694336, "global_step": 269277, "epoch": 3244} {"train_loss": -25.19207191467285, "global_step": 269278, "epoch": 3244} {"train_loss": -25.137792587280273, "global_step": 269279, "epoch": 3244} {"train_loss": -24.983165740966797, "global_step": 269280, "epoch": 3244} {"train_loss": -25.151203155517578, "global_step": 269281, "epoch": 3244} {"train_loss": -25.463058471679688, "global_step": 269282, "epoch": 3244} {"train_loss": -24.886293411254883, "global_step": 269283, "epoch": 3244} {"train_loss": -25.442014694213867, "global_step": 269284, "epoch": 3244} {"train_loss": -25.3813419342041, "global_step": 269285, "epoch": 3244} {"train_loss": -25.20191764831543, "global_step": 269286, "epoch": 3244} {"train_loss": -25.58269691467285, "global_step": 269287, "epoch": 3244} {"train_loss": -25.39333724975586, "global_step": 269288, "epoch": 3244} {"train_loss": -25.428634643554688, "global_step": 269289, "epoch": 3244} {"train_loss": -25.169008255004883, "global_step": 269290, "epoch": 3244} {"train_loss": -25.594545364379883, "global_step": 269291, "epoch": 3244} {"train_loss": -25.279539108276367, "global_step": 269292, "epoch": 3244} {"train_loss": -25.052528381347656, "global_step": 269293, "epoch": 3244} {"train_loss": -25.338531494140625, "global_step": 269294, "epoch": 3244} {"train_loss": -25.107473373413086, "global_step": 269295, "epoch": 3244} {"train_loss": -25.32124900817871, "global_step": 269296, "epoch": 3244} {"train_loss": -25.56868553161621, "global_step": 269297, "epoch": 3244} {"train_loss": -24.983501434326172, "global_step": 269298, "epoch": 3244} {"train_loss": -25.161731719970703, "global_step": 269299, "epoch": 3244} {"train_loss": -25.1737117767334, "global_step": 269300, "epoch": 3244} {"train_loss": -24.9410457611084, "global_step": 269301, "epoch": 3244} {"train_loss": -25.282272338867188, "global_step": 269302, "epoch": 3244} {"train_loss": -24.74049949645996, "global_step": 269303, "epoch": 3244} {"train_loss": -25.170846939086914, "global_step": 269304, "epoch": 3244} {"train_loss": -25.077871322631836, "global_step": 269305, "epoch": 3244} {"train_loss": -24.56214714050293, "global_step": 269306, "epoch": 3244} {"train_loss": -24.88375473022461, "global_step": 269307, "epoch": 3244} {"train_loss": -24.883377075195312, "global_step": 269308, "epoch": 3244} {"train_loss": -25.2574520111084, "global_step": 269309, "epoch": 3244} {"train_loss": -24.98225212097168, "global_step": 269310, "epoch": 3244} {"train_loss": -25.21275520324707, "global_step": 269311, "epoch": 3244} {"train_loss": -25.469255447387695, "global_step": 269312, "epoch": 3244} {"train_loss": -24.77161979675293, "global_step": 269313, "epoch": 3244} {"train_loss": -25.032745361328125, "global_step": 269314, "epoch": 3244} {"train_loss": -24.902603149414062, "global_step": 269315, "epoch": 3244} {"train_loss": -25.081491470336914, "global_step": 269316, "epoch": 3244} {"train_loss": -25.219457626342773, "global_step": 269317, "epoch": 3244} {"train_loss": -25.321136474609375, "global_step": 269318, "epoch": 3244} {"train_loss": -25.211502075195312, "global_step": 269319, "epoch": 3244} {"train_loss": -25.12845802307129, "global_step": 269320, "epoch": 3244} {"train_loss": -25.1727237701416, "global_step": 269321, "epoch": 3244} {"train_loss": -25.400510787963867, "global_step": 269322, "epoch": 3244} {"train_loss": -25.2434139251709, "global_step": 269323, "epoch": 3244} {"train_loss": -25.61799430847168, "global_step": 269324, "epoch": 3244} {"train_loss": -25.367935180664062, "global_step": 269325, "epoch": 3244} {"train_loss": -25.268875122070312, "global_step": 269326, "epoch": 3244} {"train_loss": -25.244604110717773, "global_step": 269327, "epoch": 3244} {"train_loss": -25.390933990478516, "global_step": 269328, "epoch": 3244} {"train_loss": -25.4543399810791, "global_step": 269329, "epoch": 3244} {"train_loss": -25.4331111907959, "global_step": 269330, "epoch": 3244} {"train_loss": -25.431617736816406, "global_step": 269331, "epoch": 3244} {"train_loss": -25.789762496948242, "global_step": 269332, "epoch": 3244} {"train_loss": -25.675352096557617, "global_step": 269333, "epoch": 3244} {"train_loss": -25.09727197670075, "global_step": 269334, "epoch": 3244, "val_loss": 7019304.0} {"train_loss": -25.179418563842773, "global_step": 269335, "epoch": 3245} {"train_loss": -24.87175178527832, "global_step": 269336, "epoch": 3245} {"train_loss": -25.086278915405273, "global_step": 269337, "epoch": 3245} {"train_loss": -25.26120376586914, "global_step": 269338, "epoch": 3245} {"train_loss": -25.07335090637207, "global_step": 269339, "epoch": 3245} {"train_loss": -24.7083797454834, "global_step": 269340, "epoch": 3245} {"train_loss": -25.163818359375, "global_step": 269341, "epoch": 3245} {"train_loss": -24.959516525268555, "global_step": 269342, "epoch": 3245} {"train_loss": -25.196603775024414, "global_step": 269343, "epoch": 3245} {"train_loss": -25.026514053344727, "global_step": 269344, "epoch": 3245} {"train_loss": -25.547639846801758, "global_step": 269345, "epoch": 3245} {"train_loss": -25.094404220581055, "global_step": 269346, "epoch": 3245} {"train_loss": -25.01341438293457, "global_step": 269347, "epoch": 3245} {"train_loss": -24.990570068359375, "global_step": 269348, "epoch": 3245} {"train_loss": -25.3690185546875, "global_step": 269349, "epoch": 3245} {"train_loss": -25.459104537963867, "global_step": 269350, "epoch": 3245} {"train_loss": -25.14615821838379, "global_step": 269351, "epoch": 3245} {"train_loss": -25.333864212036133, "global_step": 269352, "epoch": 3245} {"train_loss": -25.26366424560547, "global_step": 269353, "epoch": 3245} {"train_loss": -25.392736434936523, "global_step": 269354, "epoch": 3245} {"train_loss": -24.693405151367188, "global_step": 269355, "epoch": 3245} {"train_loss": -25.09320640563965, "global_step": 269356, "epoch": 3245} {"train_loss": -25.17115592956543, "global_step": 269357, "epoch": 3245} {"train_loss": -25.456205368041992, "global_step": 269358, "epoch": 3245} {"train_loss": -25.401142120361328, "global_step": 269359, "epoch": 3245} {"train_loss": -25.179859161376953, "global_step": 269360, "epoch": 3245} {"train_loss": -25.189346313476562, "global_step": 269361, "epoch": 3245} {"train_loss": -25.261411666870117, "global_step": 269362, "epoch": 3245} {"train_loss": -25.390615463256836, "global_step": 269363, "epoch": 3245} {"train_loss": -25.21303367614746, "global_step": 269364, "epoch": 3245} {"train_loss": -25.114606857299805, "global_step": 269365, "epoch": 3245} {"train_loss": -25.36305809020996, "global_step": 269366, "epoch": 3245} {"train_loss": -25.097536087036133, "global_step": 269367, "epoch": 3245} {"train_loss": -25.465639114379883, "global_step": 269368, "epoch": 3245} {"train_loss": -24.989103317260742, "global_step": 269369, "epoch": 3245} {"train_loss": -24.98551368713379, "global_step": 269370, "epoch": 3245} {"train_loss": -25.032346725463867, "global_step": 269371, "epoch": 3245} {"train_loss": -25.38447380065918, "global_step": 269372, "epoch": 3245} {"train_loss": -25.57376480102539, "global_step": 269373, "epoch": 3245} {"train_loss": -25.59298324584961, "global_step": 269374, "epoch": 3245} {"train_loss": -25.207639694213867, "global_step": 269375, "epoch": 3245} {"train_loss": -25.183870315551758, "global_step": 269376, "epoch": 3245} {"train_loss": -25.183591842651367, "global_step": 269377, "epoch": 3245} {"train_loss": -25.185522079467773, "global_step": 269378, "epoch": 3245} {"train_loss": -25.316007614135742, "global_step": 269379, "epoch": 3245} {"train_loss": -25.34417724609375, "global_step": 269380, "epoch": 3245} {"train_loss": -25.393850326538086, "global_step": 269381, "epoch": 3245} {"train_loss": -25.083057403564453, "global_step": 269382, "epoch": 3245} {"train_loss": -25.290531158447266, "global_step": 269383, "epoch": 3245} {"train_loss": -25.131000518798828, "global_step": 269384, "epoch": 3245} {"train_loss": -25.24959373474121, "global_step": 269385, "epoch": 3245} {"train_loss": -25.3115291595459, "global_step": 269386, "epoch": 3245} {"train_loss": -25.11679458618164, "global_step": 269387, "epoch": 3245} {"train_loss": -25.285621643066406, "global_step": 269388, "epoch": 3245} {"train_loss": -25.310766220092773, "global_step": 269389, "epoch": 3245} {"train_loss": -25.170812606811523, "global_step": 269390, "epoch": 3245} {"train_loss": -25.392284393310547, "global_step": 269391, "epoch": 3245} {"train_loss": -24.94620132446289, "global_step": 269392, "epoch": 3245} {"train_loss": -25.11378288269043, "global_step": 269393, "epoch": 3245} {"train_loss": -25.29015350341797, "global_step": 269394, "epoch": 3245} {"train_loss": -25.321239471435547, "global_step": 269395, "epoch": 3245} {"train_loss": -25.603818893432617, "global_step": 269396, "epoch": 3245} {"train_loss": -25.04066276550293, "global_step": 269397, "epoch": 3245} {"train_loss": -25.340408325195312, "global_step": 269398, "epoch": 3245} {"train_loss": -25.051219940185547, "global_step": 269399, "epoch": 3245} {"train_loss": -25.222463607788086, "global_step": 269400, "epoch": 3245} {"train_loss": -25.495662689208984, "global_step": 269401, "epoch": 3245} {"train_loss": -25.6738338470459, "global_step": 269402, "epoch": 3245} {"train_loss": -25.263166427612305, "global_step": 269403, "epoch": 3245} {"train_loss": -25.21546745300293, "global_step": 269404, "epoch": 3245} {"train_loss": -25.704076766967773, "global_step": 269405, "epoch": 3245} {"train_loss": -25.771230697631836, "global_step": 269406, "epoch": 3245} {"train_loss": -25.642148971557617, "global_step": 269407, "epoch": 3245} {"train_loss": -25.403127670288086, "global_step": 269408, "epoch": 3245} {"train_loss": -25.44476890563965, "global_step": 269409, "epoch": 3245} {"train_loss": -25.55863380432129, "global_step": 269410, "epoch": 3245} {"train_loss": -25.395776748657227, "global_step": 269411, "epoch": 3245} {"train_loss": -25.39667510986328, "global_step": 269412, "epoch": 3245} {"train_loss": -25.442230224609375, "global_step": 269413, "epoch": 3245} {"train_loss": -25.41998863220215, "global_step": 269414, "epoch": 3245} {"train_loss": -24.981550216674805, "global_step": 269415, "epoch": 3245} {"train_loss": -25.51936149597168, "global_step": 269416, "epoch": 3245} {"train_loss": -25.264902390629413, "global_step": 269417, "epoch": 3245, "val_loss": 6986217.0} {"train_loss": -25.0555419921875, "global_step": 269418, "epoch": 3246} {"train_loss": -24.18483543395996, "global_step": 269419, "epoch": 3246} {"train_loss": -23.399892807006836, "global_step": 269420, "epoch": 3246} {"train_loss": -24.531169891357422, "global_step": 269421, "epoch": 3246} {"train_loss": -24.63364601135254, "global_step": 269422, "epoch": 3246} {"train_loss": -24.130590438842773, "global_step": 269423, "epoch": 3246} {"train_loss": -24.50835609436035, "global_step": 269424, "epoch": 3246} {"train_loss": -24.62521743774414, "global_step": 269425, "epoch": 3246} {"train_loss": -24.644168853759766, "global_step": 269426, "epoch": 3246} {"train_loss": -24.68446922302246, "global_step": 269427, "epoch": 3246} {"train_loss": -24.862041473388672, "global_step": 269428, "epoch": 3246} {"train_loss": -24.642404556274414, "global_step": 269429, "epoch": 3246} {"train_loss": -25.14451026916504, "global_step": 269430, "epoch": 3246} {"train_loss": -24.72418785095215, "global_step": 269431, "epoch": 3246} {"train_loss": -25.303495407104492, "global_step": 269432, "epoch": 3246} {"train_loss": -24.90232276916504, "global_step": 269433, "epoch": 3246} {"train_loss": -24.735809326171875, "global_step": 269434, "epoch": 3246} {"train_loss": -24.994400024414062, "global_step": 269435, "epoch": 3246} {"train_loss": -25.340755462646484, "global_step": 269436, "epoch": 3246} {"train_loss": -25.162761688232422, "global_step": 269437, "epoch": 3246} {"train_loss": -24.852079391479492, "global_step": 269438, "epoch": 3246} {"train_loss": -25.038423538208008, "global_step": 269439, "epoch": 3246} {"train_loss": -24.982906341552734, "global_step": 269440, "epoch": 3246} {"train_loss": -24.95342254638672, "global_step": 269441, "epoch": 3246} {"train_loss": -24.97278594970703, "global_step": 269442, "epoch": 3246} {"train_loss": -25.128890991210938, "global_step": 269443, "epoch": 3246} {"train_loss": -25.17963981628418, "global_step": 269444, "epoch": 3246} {"train_loss": -25.419462203979492, "global_step": 269445, "epoch": 3246} {"train_loss": -25.384864807128906, "global_step": 269446, "epoch": 3246} {"train_loss": -25.259199142456055, "global_step": 269447, "epoch": 3246} {"train_loss": -25.338497161865234, "global_step": 269448, "epoch": 3246} {"train_loss": -25.19171714782715, "global_step": 269449, "epoch": 3246} {"train_loss": -25.355119705200195, "global_step": 269450, "epoch": 3246} {"train_loss": -25.760013580322266, "global_step": 269451, "epoch": 3246} {"train_loss": -25.559003829956055, "global_step": 269452, "epoch": 3246} {"train_loss": -25.237918853759766, "global_step": 269453, "epoch": 3246} {"train_loss": -25.56234359741211, "global_step": 269454, "epoch": 3246} {"train_loss": -25.586938858032227, "global_step": 269455, "epoch": 3246} {"train_loss": -25.09095573425293, "global_step": 269456, "epoch": 3246} {"train_loss": -25.243200302124023, "global_step": 269457, "epoch": 3246} {"train_loss": -25.741607666015625, "global_step": 269458, "epoch": 3246} {"train_loss": -25.355573654174805, "global_step": 269459, "epoch": 3246} {"train_loss": -25.329505920410156, "global_step": 269460, "epoch": 3246} {"train_loss": -25.131895065307617, "global_step": 269461, "epoch": 3246} {"train_loss": -24.9987850189209, "global_step": 269462, "epoch": 3246} {"train_loss": -24.878650665283203, "global_step": 269463, "epoch": 3246} {"train_loss": -24.948514938354492, "global_step": 269464, "epoch": 3246} {"train_loss": -25.146656036376953, "global_step": 269465, "epoch": 3246} {"train_loss": -24.993087768554688, "global_step": 269466, "epoch": 3246} {"train_loss": -25.33833122253418, "global_step": 269467, "epoch": 3246} {"train_loss": -24.53753089904785, "global_step": 269468, "epoch": 3246} {"train_loss": -24.588117599487305, "global_step": 269469, "epoch": 3246} {"train_loss": -25.44244956970215, "global_step": 269470, "epoch": 3246} {"train_loss": -24.867420196533203, "global_step": 269471, "epoch": 3246} {"train_loss": -25.222585678100586, "global_step": 269472, "epoch": 3246} {"train_loss": -24.348112106323242, "global_step": 269473, "epoch": 3246} {"train_loss": -25.020326614379883, "global_step": 269474, "epoch": 3246} {"train_loss": -24.387235641479492, "global_step": 269475, "epoch": 3246} {"train_loss": -24.67216682434082, "global_step": 269476, "epoch": 3246} {"train_loss": -25.016830444335938, "global_step": 269477, "epoch": 3246} {"train_loss": -25.024213790893555, "global_step": 269478, "epoch": 3246} {"train_loss": -25.01492691040039, "global_step": 269479, "epoch": 3246} {"train_loss": -24.91518783569336, "global_step": 269480, "epoch": 3246} {"train_loss": -25.060216903686523, "global_step": 269481, "epoch": 3246} {"train_loss": -24.787925720214844, "global_step": 269482, "epoch": 3246} {"train_loss": -25.333576202392578, "global_step": 269483, "epoch": 3246} {"train_loss": -25.183490753173828, "global_step": 269484, "epoch": 3246} {"train_loss": -25.006872177124023, "global_step": 269485, "epoch": 3246} {"train_loss": -25.25071907043457, "global_step": 269486, "epoch": 3246} {"train_loss": -25.08833122253418, "global_step": 269487, "epoch": 3246} {"train_loss": -24.956790924072266, "global_step": 269488, "epoch": 3246} {"train_loss": -25.222930908203125, "global_step": 269489, "epoch": 3246} {"train_loss": -24.97842025756836, "global_step": 269490, "epoch": 3246} {"train_loss": -24.914609909057617, "global_step": 269491, "epoch": 3246} {"train_loss": -25.101776123046875, "global_step": 269492, "epoch": 3246} {"train_loss": -24.941205978393555, "global_step": 269493, "epoch": 3246} {"train_loss": -25.048688888549805, "global_step": 269494, "epoch": 3246} {"train_loss": -25.0349063873291, "global_step": 269495, "epoch": 3246} {"train_loss": -25.24322509765625, "global_step": 269496, "epoch": 3246} {"train_loss": -24.91261863708496, "global_step": 269497, "epoch": 3246} {"train_loss": -25.26484489440918, "global_step": 269498, "epoch": 3246} {"train_loss": -25.27507972717285, "global_step": 269499, "epoch": 3246} {"train_loss": -25.012053685015943, "global_step": 269500, "epoch": 3246, "val_loss": 6999795.0} {"train_loss": -24.85041046142578, "global_step": 269501, "epoch": 3247} {"train_loss": -25.143028259277344, "global_step": 269502, "epoch": 3247} {"train_loss": -25.028955459594727, "global_step": 269503, "epoch": 3247} {"train_loss": -24.811630249023438, "global_step": 269504, "epoch": 3247} {"train_loss": -25.122909545898438, "global_step": 269505, "epoch": 3247} {"train_loss": -25.353403091430664, "global_step": 269506, "epoch": 3247} {"train_loss": -25.08009147644043, "global_step": 269507, "epoch": 3247} {"train_loss": -25.055131912231445, "global_step": 269508, "epoch": 3247} {"train_loss": -25.51923942565918, "global_step": 269509, "epoch": 3247} {"train_loss": -25.098955154418945, "global_step": 269510, "epoch": 3247} {"train_loss": -24.847137451171875, "global_step": 269511, "epoch": 3247} {"train_loss": -25.2490177154541, "global_step": 269512, "epoch": 3247} {"train_loss": -24.725147247314453, "global_step": 269513, "epoch": 3247} {"train_loss": -25.166610717773438, "global_step": 269514, "epoch": 3247} {"train_loss": -25.216262817382812, "global_step": 269515, "epoch": 3247} {"train_loss": -24.580114364624023, "global_step": 269516, "epoch": 3247} {"train_loss": -24.9252986907959, "global_step": 269517, "epoch": 3247} {"train_loss": -24.59626579284668, "global_step": 269518, "epoch": 3247} {"train_loss": -25.268285751342773, "global_step": 269519, "epoch": 3247} {"train_loss": -24.62434196472168, "global_step": 269520, "epoch": 3247} {"train_loss": -24.94037437438965, "global_step": 269521, "epoch": 3247} {"train_loss": -24.808395385742188, "global_step": 269522, "epoch": 3247} {"train_loss": -25.091550827026367, "global_step": 269523, "epoch": 3247} {"train_loss": -24.88030242919922, "global_step": 269524, "epoch": 3247} {"train_loss": -24.7703914642334, "global_step": 269525, "epoch": 3247} {"train_loss": -25.388334274291992, "global_step": 269526, "epoch": 3247} {"train_loss": -25.0961971282959, "global_step": 269527, "epoch": 3247} {"train_loss": -25.255367279052734, "global_step": 269528, "epoch": 3247} {"train_loss": -24.890024185180664, "global_step": 269529, "epoch": 3247} {"train_loss": -25.03612518310547, "global_step": 269530, "epoch": 3247} {"train_loss": -25.19178581237793, "global_step": 269531, "epoch": 3247} {"train_loss": -24.91701889038086, "global_step": 269532, "epoch": 3247} {"train_loss": -25.098766326904297, "global_step": 269533, "epoch": 3247} {"train_loss": -25.213857650756836, "global_step": 269534, "epoch": 3247} {"train_loss": -25.529462814331055, "global_step": 269535, "epoch": 3247} {"train_loss": -25.252477645874023, "global_step": 269536, "epoch": 3247} {"train_loss": -25.55984115600586, "global_step": 269537, "epoch": 3247} {"train_loss": -25.3170108795166, "global_step": 269538, "epoch": 3247} {"train_loss": -25.406644821166992, "global_step": 269539, "epoch": 3247} {"train_loss": -25.281770706176758, "global_step": 269540, "epoch": 3247} {"train_loss": -25.29303741455078, "global_step": 269541, "epoch": 3247} {"train_loss": -25.047033309936523, "global_step": 269542, "epoch": 3247} {"train_loss": -25.296615600585938, "global_step": 269543, "epoch": 3247} {"train_loss": -25.486740112304688, "global_step": 269544, "epoch": 3247} {"train_loss": -25.482053756713867, "global_step": 269545, "epoch": 3247} {"train_loss": -25.450504302978516, "global_step": 269546, "epoch": 3247} {"train_loss": -25.303436279296875, "global_step": 269547, "epoch": 3247} {"train_loss": -25.28376579284668, "global_step": 269548, "epoch": 3247} {"train_loss": -25.547677993774414, "global_step": 269549, "epoch": 3247} {"train_loss": -25.17243766784668, "global_step": 269550, "epoch": 3247} {"train_loss": -24.986928939819336, "global_step": 269551, "epoch": 3247} {"train_loss": -25.18415069580078, "global_step": 269552, "epoch": 3247} {"train_loss": -25.880857467651367, "global_step": 269553, "epoch": 3247} {"train_loss": -25.182832717895508, "global_step": 269554, "epoch": 3247} {"train_loss": -25.414403915405273, "global_step": 269555, "epoch": 3247} {"train_loss": -25.299428939819336, "global_step": 269556, "epoch": 3247} {"train_loss": -25.425256729125977, "global_step": 269557, "epoch": 3247} {"train_loss": -25.528301239013672, "global_step": 269558, "epoch": 3247} {"train_loss": -25.110570907592773, "global_step": 269559, "epoch": 3247} {"train_loss": -25.514429092407227, "global_step": 269560, "epoch": 3247} {"train_loss": -25.602386474609375, "global_step": 269561, "epoch": 3247} {"train_loss": -25.4144287109375, "global_step": 269562, "epoch": 3247} {"train_loss": -25.360361099243164, "global_step": 269563, "epoch": 3247} {"train_loss": -25.301856994628906, "global_step": 269564, "epoch": 3247} {"train_loss": -25.054182052612305, "global_step": 269565, "epoch": 3247} {"train_loss": -24.99850082397461, "global_step": 269566, "epoch": 3247} {"train_loss": -25.19209098815918, "global_step": 269567, "epoch": 3247} {"train_loss": -25.488941192626953, "global_step": 269568, "epoch": 3247} {"train_loss": -25.400665283203125, "global_step": 269569, "epoch": 3247} {"train_loss": -25.417823791503906, "global_step": 269570, "epoch": 3247} {"train_loss": -25.299131393432617, "global_step": 269571, "epoch": 3247} {"train_loss": -25.260013580322266, "global_step": 269572, "epoch": 3247} {"train_loss": -25.499990463256836, "global_step": 269573, "epoch": 3247} {"train_loss": -25.360666275024414, "global_step": 269574, "epoch": 3247} {"train_loss": -25.090961456298828, "global_step": 269575, "epoch": 3247} {"train_loss": -25.533899307250977, "global_step": 269576, "epoch": 3247} {"train_loss": -25.598175048828125, "global_step": 269577, "epoch": 3247} {"train_loss": -25.267385482788086, "global_step": 269578, "epoch": 3247} {"train_loss": -25.56460952758789, "global_step": 269579, "epoch": 3247} {"train_loss": -25.46718978881836, "global_step": 269580, "epoch": 3247} {"train_loss": -25.6439151763916, "global_step": 269581, "epoch": 3247} {"train_loss": -25.072874069213867, "global_step": 269582, "epoch": 3247} {"train_loss": -25.217497745192194, "global_step": 269583, "epoch": 3247, "val_loss": 6912917.0} {"train_loss": -25.39961051940918, "global_step": 269584, "epoch": 3248} {"train_loss": -24.95315933227539, "global_step": 269585, "epoch": 3248} {"train_loss": -25.199697494506836, "global_step": 269586, "epoch": 3248} {"train_loss": -24.702411651611328, "global_step": 269587, "epoch": 3248} {"train_loss": -25.038654327392578, "global_step": 269588, "epoch": 3248} {"train_loss": -24.94561195373535, "global_step": 269589, "epoch": 3248} {"train_loss": -24.887836456298828, "global_step": 269590, "epoch": 3248} {"train_loss": -24.59860610961914, "global_step": 269591, "epoch": 3248} {"train_loss": -25.26222801208496, "global_step": 269592, "epoch": 3248} {"train_loss": -24.94900894165039, "global_step": 269593, "epoch": 3248} {"train_loss": -25.112823486328125, "global_step": 269594, "epoch": 3248} {"train_loss": -25.212432861328125, "global_step": 269595, "epoch": 3248} {"train_loss": -24.999958038330078, "global_step": 269596, "epoch": 3248} {"train_loss": -25.08226776123047, "global_step": 269597, "epoch": 3248} {"train_loss": -25.220449447631836, "global_step": 269598, "epoch": 3248} {"train_loss": -25.052818298339844, "global_step": 269599, "epoch": 3248} {"train_loss": -25.331228256225586, "global_step": 269600, "epoch": 3248} {"train_loss": -25.08856201171875, "global_step": 269601, "epoch": 3248} {"train_loss": -25.325681686401367, "global_step": 269602, "epoch": 3248} {"train_loss": -25.251344680786133, "global_step": 269603, "epoch": 3248} {"train_loss": -25.46624183654785, "global_step": 269604, "epoch": 3248} {"train_loss": -25.00050163269043, "global_step": 269605, "epoch": 3248} {"train_loss": -25.0673885345459, "global_step": 269606, "epoch": 3248} {"train_loss": -25.0919132232666, "global_step": 269607, "epoch": 3248} {"train_loss": -25.45140266418457, "global_step": 269608, "epoch": 3248} {"train_loss": -25.5421199798584, "global_step": 269609, "epoch": 3248} {"train_loss": -25.04343032836914, "global_step": 269610, "epoch": 3248} {"train_loss": -25.16822052001953, "global_step": 269611, "epoch": 3248} {"train_loss": -25.33300018310547, "global_step": 269612, "epoch": 3248} {"train_loss": -25.60955238342285, "global_step": 269613, "epoch": 3248} {"train_loss": -25.579862594604492, "global_step": 269614, "epoch": 3248} {"train_loss": -25.180944442749023, "global_step": 269615, "epoch": 3248} {"train_loss": -25.24271011352539, "global_step": 269616, "epoch": 3248} {"train_loss": -25.34296226501465, "global_step": 269617, "epoch": 3248} {"train_loss": -25.349821090698242, "global_step": 269618, "epoch": 3248} {"train_loss": -25.437646865844727, "global_step": 269619, "epoch": 3248} {"train_loss": -25.255542755126953, "global_step": 269620, "epoch": 3248} {"train_loss": -25.174726486206055, "global_step": 269621, "epoch": 3248} {"train_loss": -25.34639549255371, "global_step": 269622, "epoch": 3248} {"train_loss": -25.34354019165039, "global_step": 269623, "epoch": 3248} {"train_loss": -25.222061157226562, "global_step": 269624, "epoch": 3248} {"train_loss": -25.70096206665039, "global_step": 269625, "epoch": 3248} {"train_loss": -25.264131546020508, "global_step": 269626, "epoch": 3248} {"train_loss": -25.05860710144043, "global_step": 269627, "epoch": 3248} {"train_loss": -25.19179344177246, "global_step": 269628, "epoch": 3248} {"train_loss": -25.700794219970703, "global_step": 269629, "epoch": 3248} {"train_loss": -25.471969604492188, "global_step": 269630, "epoch": 3248} {"train_loss": -25.378740310668945, "global_step": 269631, "epoch": 3248} {"train_loss": -24.995630264282227, "global_step": 269632, "epoch": 3248} {"train_loss": -24.988468170166016, "global_step": 269633, "epoch": 3248} {"train_loss": -25.184614181518555, "global_step": 269634, "epoch": 3248} {"train_loss": -25.402963638305664, "global_step": 269635, "epoch": 3248} {"train_loss": -25.389301300048828, "global_step": 269636, "epoch": 3248} {"train_loss": -25.495281219482422, "global_step": 269637, "epoch": 3248} {"train_loss": -25.580448150634766, "global_step": 269638, "epoch": 3248} {"train_loss": -25.108739852905273, "global_step": 269639, "epoch": 3248} {"train_loss": -25.315176010131836, "global_step": 269640, "epoch": 3248} {"train_loss": -25.622283935546875, "global_step": 269641, "epoch": 3248} {"train_loss": -25.02817153930664, "global_step": 269642, "epoch": 3248} {"train_loss": -25.54438591003418, "global_step": 269643, "epoch": 3248} {"train_loss": -25.36079978942871, "global_step": 269644, "epoch": 3248} {"train_loss": -25.28996467590332, "global_step": 269645, "epoch": 3248} {"train_loss": -24.922964096069336, "global_step": 269646, "epoch": 3248} {"train_loss": -25.642902374267578, "global_step": 269647, "epoch": 3248} {"train_loss": -24.950698852539062, "global_step": 269648, "epoch": 3248} {"train_loss": -25.245380401611328, "global_step": 269649, "epoch": 3248} {"train_loss": -25.417573928833008, "global_step": 269650, "epoch": 3248} {"train_loss": -25.0445613861084, "global_step": 269651, "epoch": 3248} {"train_loss": -25.191320419311523, "global_step": 269652, "epoch": 3248} {"train_loss": -25.417545318603516, "global_step": 269653, "epoch": 3248} {"train_loss": -25.225156784057617, "global_step": 269654, "epoch": 3248} {"train_loss": -25.452869415283203, "global_step": 269655, "epoch": 3248} {"train_loss": -25.351608276367188, "global_step": 269656, "epoch": 3248} {"train_loss": -24.57370376586914, "global_step": 269657, "epoch": 3248} {"train_loss": -24.71473503112793, "global_step": 269658, "epoch": 3248} {"train_loss": -25.419952392578125, "global_step": 269659, "epoch": 3248} {"train_loss": -25.093347549438477, "global_step": 269660, "epoch": 3248} {"train_loss": -25.460922241210938, "global_step": 269661, "epoch": 3248} {"train_loss": -25.354528427124023, "global_step": 269662, "epoch": 3248} {"train_loss": -25.10773277282715, "global_step": 269663, "epoch": 3248} {"train_loss": -25.291072845458984, "global_step": 269664, "epoch": 3248} {"train_loss": -25.318052291870117, "global_step": 269665, "epoch": 3248} {"train_loss": -25.230597783284015, "global_step": 269666, "epoch": 3248, "val_loss": 6890405.5} {"train_loss": -24.525556564331055, "global_step": 269667, "epoch": 3249} {"train_loss": -24.981138229370117, "global_step": 269668, "epoch": 3249} {"train_loss": -24.98238182067871, "global_step": 269669, "epoch": 3249} {"train_loss": -24.66490936279297, "global_step": 269670, "epoch": 3249} {"train_loss": -25.30680274963379, "global_step": 269671, "epoch": 3249} {"train_loss": -25.0152530670166, "global_step": 269672, "epoch": 3249} {"train_loss": -25.087087631225586, "global_step": 269673, "epoch": 3249} {"train_loss": -25.213214874267578, "global_step": 269674, "epoch": 3249} {"train_loss": -24.55409812927246, "global_step": 269675, "epoch": 3249} {"train_loss": -25.232898712158203, "global_step": 269676, "epoch": 3249} {"train_loss": -25.10283851623535, "global_step": 269677, "epoch": 3249} {"train_loss": -24.886831283569336, "global_step": 269678, "epoch": 3249} {"train_loss": -25.35434913635254, "global_step": 269679, "epoch": 3249} {"train_loss": -24.99300193786621, "global_step": 269680, "epoch": 3249} {"train_loss": -24.407257080078125, "global_step": 269681, "epoch": 3249} {"train_loss": -24.90608787536621, "global_step": 269682, "epoch": 3249} {"train_loss": -25.23542022705078, "global_step": 269683, "epoch": 3249} {"train_loss": -24.85493278503418, "global_step": 269684, "epoch": 3249} {"train_loss": -24.908828735351562, "global_step": 269685, "epoch": 3249} {"train_loss": -25.39826011657715, "global_step": 269686, "epoch": 3249} {"train_loss": -25.002498626708984, "global_step": 269687, "epoch": 3249} {"train_loss": -25.430509567260742, "global_step": 269688, "epoch": 3249} {"train_loss": -25.156349182128906, "global_step": 269689, "epoch": 3249} {"train_loss": -25.066547393798828, "global_step": 269690, "epoch": 3249} {"train_loss": -25.37632179260254, "global_step": 269691, "epoch": 3249} {"train_loss": -25.037023544311523, "global_step": 269692, "epoch": 3249} {"train_loss": -25.195714950561523, "global_step": 269693, "epoch": 3249} {"train_loss": -25.304330825805664, "global_step": 269694, "epoch": 3249} {"train_loss": -24.879629135131836, "global_step": 269695, "epoch": 3249} {"train_loss": -24.927656173706055, "global_step": 269696, "epoch": 3249} {"train_loss": -24.95050048828125, "global_step": 269697, "epoch": 3249} {"train_loss": -24.942825317382812, "global_step": 269698, "epoch": 3249} {"train_loss": -25.070499420166016, "global_step": 269699, "epoch": 3249} {"train_loss": -24.695112228393555, "global_step": 269700, "epoch": 3249} {"train_loss": -25.09427261352539, "global_step": 269701, "epoch": 3249} {"train_loss": -25.247343063354492, "global_step": 269702, "epoch": 3249} {"train_loss": -25.323911666870117, "global_step": 269703, "epoch": 3249} {"train_loss": -24.960556030273438, "global_step": 269704, "epoch": 3249} {"train_loss": -25.17575454711914, "global_step": 269705, "epoch": 3249} {"train_loss": -25.40077781677246, "global_step": 269706, "epoch": 3249} {"train_loss": -25.435596466064453, "global_step": 269707, "epoch": 3249} {"train_loss": -25.31023597717285, "global_step": 269708, "epoch": 3249} {"train_loss": -25.286474227905273, "global_step": 269709, "epoch": 3249} {"train_loss": -25.12327766418457, "global_step": 269710, "epoch": 3249} {"train_loss": -25.26789665222168, "global_step": 269711, "epoch": 3249} {"train_loss": -25.265504837036133, "global_step": 269712, "epoch": 3249} {"train_loss": -25.646350860595703, "global_step": 269713, "epoch": 3249} {"train_loss": -25.387344360351562, "global_step": 269714, "epoch": 3249} {"train_loss": -25.367307662963867, "global_step": 269715, "epoch": 3249} {"train_loss": -25.204999923706055, "global_step": 269716, "epoch": 3249} {"train_loss": -25.579879760742188, "global_step": 269717, "epoch": 3249} {"train_loss": -25.184377670288086, "global_step": 269718, "epoch": 3249} {"train_loss": -24.987640380859375, "global_step": 269719, "epoch": 3249} {"train_loss": -25.23914909362793, "global_step": 269720, "epoch": 3249} {"train_loss": -25.253549575805664, "global_step": 269721, "epoch": 3249} {"train_loss": -25.408767700195312, "global_step": 269722, "epoch": 3249} {"train_loss": -25.703359603881836, "global_step": 269723, "epoch": 3249} {"train_loss": -25.23000144958496, "global_step": 269724, "epoch": 3249} {"train_loss": -25.543010711669922, "global_step": 269725, "epoch": 3249} {"train_loss": -25.364294052124023, "global_step": 269726, "epoch": 3249} {"train_loss": -25.35165786743164, "global_step": 269727, "epoch": 3249} {"train_loss": -25.243732452392578, "global_step": 269728, "epoch": 3249} {"train_loss": -25.375635147094727, "global_step": 269729, "epoch": 3249} {"train_loss": -25.425222396850586, "global_step": 269730, "epoch": 3249} {"train_loss": -24.98798942565918, "global_step": 269731, "epoch": 3249} {"train_loss": -24.356571197509766, "global_step": 269732, "epoch": 3249} {"train_loss": -23.319171905517578, "global_step": 269733, "epoch": 3249} {"train_loss": -23.124563217163086, "global_step": 269734, "epoch": 3249} {"train_loss": -24.31898307800293, "global_step": 269735, "epoch": 3249} {"train_loss": -25.30403709411621, "global_step": 269736, "epoch": 3249} {"train_loss": -24.064687728881836, "global_step": 269737, "epoch": 3249} {"train_loss": -24.61659049987793, "global_step": 269738, "epoch": 3249} {"train_loss": -24.70631217956543, "global_step": 269739, "epoch": 3249} {"train_loss": -24.656713485717773, "global_step": 269740, "epoch": 3249} {"train_loss": -24.561317443847656, "global_step": 269741, "epoch": 3249} {"train_loss": -25.026548385620117, "global_step": 269742, "epoch": 3249} {"train_loss": -24.74041175842285, "global_step": 269743, "epoch": 3249} {"train_loss": -25.23957633972168, "global_step": 269744, "epoch": 3249} {"train_loss": -25.244421005249023, "global_step": 269745, "epoch": 3249} {"train_loss": -24.852384567260742, "global_step": 269746, "epoch": 3249} {"train_loss": -25.390371322631836, "global_step": 269747, "epoch": 3249} {"train_loss": -24.971914291381836, "global_step": 269748, "epoch": 3249} {"train_loss": -25.034485070102185, "global_step": 269749, "epoch": 3249, "val_loss": 6975448.5} {"train_loss": -24.257917404174805, "global_step": 269750, "epoch": 3250} {"train_loss": -24.497900009155273, "global_step": 269751, "epoch": 3250} {"train_loss": -24.588111877441406, "global_step": 269752, "epoch": 3250} {"train_loss": -24.889917373657227, "global_step": 269753, "epoch": 3250} {"train_loss": -24.62741470336914, "global_step": 269754, "epoch": 3250} {"train_loss": -25.019624710083008, "global_step": 269755, "epoch": 3250} {"train_loss": -25.096105575561523, "global_step": 269756, "epoch": 3250} {"train_loss": -24.538606643676758, "global_step": 269757, "epoch": 3250} {"train_loss": -25.075584411621094, "global_step": 269758, "epoch": 3250} {"train_loss": -24.67527198791504, "global_step": 269759, "epoch": 3250} {"train_loss": -24.960002899169922, "global_step": 269760, "epoch": 3250} {"train_loss": -25.12734031677246, "global_step": 269761, "epoch": 3250} {"train_loss": -24.96883201599121, "global_step": 269762, "epoch": 3250} {"train_loss": -25.415109634399414, "global_step": 269763, "epoch": 3250} {"train_loss": -25.112966537475586, "global_step": 269764, "epoch": 3250} {"train_loss": -25.334518432617188, "global_step": 269765, "epoch": 3250} {"train_loss": -24.783599853515625, "global_step": 269766, "epoch": 3250} {"train_loss": -24.66507339477539, "global_step": 269767, "epoch": 3250} {"train_loss": -24.909992218017578, "global_step": 269768, "epoch": 3250} {"train_loss": -25.416452407836914, "global_step": 269769, "epoch": 3250} {"train_loss": -25.039091110229492, "global_step": 269770, "epoch": 3250} {"train_loss": -25.141887664794922, "global_step": 269771, "epoch": 3250} {"train_loss": -25.239179611206055, "global_step": 269772, "epoch": 3250} {"train_loss": -25.731414794921875, "global_step": 269773, "epoch": 3250} {"train_loss": -25.23996353149414, "global_step": 269774, "epoch": 3250} {"train_loss": -25.07228660583496, "global_step": 269775, "epoch": 3250} {"train_loss": -25.134702682495117, "global_step": 269776, "epoch": 3250} {"train_loss": -25.601898193359375, "global_step": 269777, "epoch": 3250} {"train_loss": -25.05609703063965, "global_step": 269778, "epoch": 3250} {"train_loss": -25.552316665649414, "global_step": 269779, "epoch": 3250} {"train_loss": -24.811609268188477, "global_step": 269780, "epoch": 3250} {"train_loss": -25.211307525634766, "global_step": 269781, "epoch": 3250} {"train_loss": -25.169300079345703, "global_step": 269782, "epoch": 3250} {"train_loss": -25.460203170776367, "global_step": 269783, "epoch": 3250} {"train_loss": -25.44121742248535, "global_step": 269784, "epoch": 3250} {"train_loss": -25.269155502319336, "global_step": 269785, "epoch": 3250} {"train_loss": -25.17885398864746, "global_step": 269786, "epoch": 3250} {"train_loss": -25.578393936157227, "global_step": 269787, "epoch": 3250} {"train_loss": -25.512182235717773, "global_step": 269788, "epoch": 3250} {"train_loss": -25.88925552368164, "global_step": 269789, "epoch": 3250} {"train_loss": -25.44989585876465, "global_step": 269790, "epoch": 3250} {"train_loss": -25.864770889282227, "global_step": 269791, "epoch": 3250} {"train_loss": -24.965713500976562, "global_step": 269792, "epoch": 3250} {"train_loss": -25.585111618041992, "global_step": 269793, "epoch": 3250} {"train_loss": -25.227336883544922, "global_step": 269794, "epoch": 3250} {"train_loss": -25.092248916625977, "global_step": 269795, "epoch": 3250} {"train_loss": -25.662261962890625, "global_step": 269796, "epoch": 3250} {"train_loss": -25.367780685424805, "global_step": 269797, "epoch": 3250} {"train_loss": -25.343191146850586, "global_step": 269798, "epoch": 3250} {"train_loss": -25.8033447265625, "global_step": 269799, "epoch": 3250} {"train_loss": -25.18146324157715, "global_step": 269800, "epoch": 3250} {"train_loss": -25.034574508666992, "global_step": 269801, "epoch": 3250} {"train_loss": -25.548494338989258, "global_step": 269802, "epoch": 3250} {"train_loss": -25.02589988708496, "global_step": 269803, "epoch": 3250} {"train_loss": -24.999723434448242, "global_step": 269804, "epoch": 3250} {"train_loss": -24.875652313232422, "global_step": 269805, "epoch": 3250} {"train_loss": -24.997802734375, "global_step": 269806, "epoch": 3250} {"train_loss": -24.899072647094727, "global_step": 269807, "epoch": 3250} {"train_loss": -24.852205276489258, "global_step": 269808, "epoch": 3250} {"train_loss": -25.148513793945312, "global_step": 269809, "epoch": 3250} {"train_loss": -25.145343780517578, "global_step": 269810, "epoch": 3250} {"train_loss": -25.09815788269043, "global_step": 269811, "epoch": 3250} {"train_loss": -25.103113174438477, "global_step": 269812, "epoch": 3250} {"train_loss": -25.402563095092773, "global_step": 269813, "epoch": 3250} {"train_loss": -25.259536743164062, "global_step": 269814, "epoch": 3250} {"train_loss": -25.672821044921875, "global_step": 269815, "epoch": 3250} {"train_loss": -25.306276321411133, "global_step": 269816, "epoch": 3250} {"train_loss": -25.071622848510742, "global_step": 269817, "epoch": 3250} {"train_loss": -25.188993453979492, "global_step": 269818, "epoch": 3250} {"train_loss": -25.215425491333008, "global_step": 269819, "epoch": 3250} {"train_loss": -25.11761474609375, "global_step": 269820, "epoch": 3250} {"train_loss": -25.153594970703125, "global_step": 269821, "epoch": 3250} {"train_loss": -25.18462562561035, "global_step": 269822, "epoch": 3250} {"train_loss": -25.02007484436035, "global_step": 269823, "epoch": 3250} {"train_loss": -24.83416748046875, "global_step": 269824, "epoch": 3250} {"train_loss": -25.467315673828125, "global_step": 269825, "epoch": 3250} {"train_loss": -25.1923885345459, "global_step": 269826, "epoch": 3250} {"train_loss": -25.33326530456543, "global_step": 269827, "epoch": 3250} {"train_loss": -25.21394920349121, "global_step": 269828, "epoch": 3250} {"train_loss": -25.510770797729492, "global_step": 269829, "epoch": 3250} {"train_loss": -25.237876892089844, "global_step": 269830, "epoch": 3250} {"train_loss": -25.300954818725586, "global_step": 269831, "epoch": 3250} {"train_loss": -25.172058151428956, "global_step": 269832, "epoch": 3250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 7192537.0} {"train_loss": -24.634883880615234, "global_step": 269833, "epoch": 3251} {"train_loss": -25.08591079711914, "global_step": 269834, "epoch": 3251} {"train_loss": -24.778329849243164, "global_step": 269835, "epoch": 3251} {"train_loss": -25.054262161254883, "global_step": 269836, "epoch": 3251} {"train_loss": -25.066686630249023, "global_step": 269837, "epoch": 3251} {"train_loss": -25.13301658630371, "global_step": 269838, "epoch": 3251} {"train_loss": -24.98044204711914, "global_step": 269839, "epoch": 3251} {"train_loss": -25.078845977783203, "global_step": 269840, "epoch": 3251} {"train_loss": -24.970802307128906, "global_step": 269841, "epoch": 3251} {"train_loss": -25.33246421813965, "global_step": 269842, "epoch": 3251} {"train_loss": -24.961109161376953, "global_step": 269843, "epoch": 3251} {"train_loss": -25.0778751373291, "global_step": 269844, "epoch": 3251} {"train_loss": -25.29578971862793, "global_step": 269845, "epoch": 3251} {"train_loss": -25.11798667907715, "global_step": 269846, "epoch": 3251} {"train_loss": -24.660297393798828, "global_step": 269847, "epoch": 3251} {"train_loss": -25.261030197143555, "global_step": 269848, "epoch": 3251} {"train_loss": -25.3808536529541, "global_step": 269849, "epoch": 3251} {"train_loss": -24.987165451049805, "global_step": 269850, "epoch": 3251} {"train_loss": -25.228626251220703, "global_step": 269851, "epoch": 3251} {"train_loss": -24.977975845336914, "global_step": 269852, "epoch": 3251} {"train_loss": -25.42561912536621, "global_step": 269853, "epoch": 3251} {"train_loss": -24.89320945739746, "global_step": 269854, "epoch": 3251} {"train_loss": -25.463472366333008, "global_step": 269855, "epoch": 3251} {"train_loss": -25.12456703186035, "global_step": 269856, "epoch": 3251} {"train_loss": -25.274080276489258, "global_step": 269857, "epoch": 3251} {"train_loss": -25.45132827758789, "global_step": 269858, "epoch": 3251} {"train_loss": -25.55962562561035, "global_step": 269859, "epoch": 3251} {"train_loss": -25.262035369873047, "global_step": 269860, "epoch": 3251} {"train_loss": -25.273666381835938, "global_step": 269861, "epoch": 3251} {"train_loss": -25.19310188293457, "global_step": 269862, "epoch": 3251} {"train_loss": -25.236032485961914, "global_step": 269863, "epoch": 3251} {"train_loss": -25.1279354095459, "global_step": 269864, "epoch": 3251} {"train_loss": -25.41957664489746, "global_step": 269865, "epoch": 3251} {"train_loss": -25.235523223876953, "global_step": 269866, "epoch": 3251} {"train_loss": -25.020980834960938, "global_step": 269867, "epoch": 3251} {"train_loss": -25.244709014892578, "global_step": 269868, "epoch": 3251} {"train_loss": -25.250770568847656, "global_step": 269869, "epoch": 3251} {"train_loss": -25.024856567382812, "global_step": 269870, "epoch": 3251} {"train_loss": -25.32840919494629, "global_step": 269871, "epoch": 3251} {"train_loss": -25.428428649902344, "global_step": 269872, "epoch": 3251} {"train_loss": -25.375314712524414, "global_step": 269873, "epoch": 3251} {"train_loss": -25.571645736694336, "global_step": 269874, "epoch": 3251} {"train_loss": -25.26466941833496, "global_step": 269875, "epoch": 3251} {"train_loss": -25.284181594848633, "global_step": 269876, "epoch": 3251} {"train_loss": -25.55550765991211, "global_step": 269877, "epoch": 3251} {"train_loss": -24.808048248291016, "global_step": 269878, "epoch": 3251} {"train_loss": -25.089521408081055, "global_step": 269879, "epoch": 3251} {"train_loss": -25.2939453125, "global_step": 269880, "epoch": 3251} {"train_loss": -25.301700592041016, "global_step": 269881, "epoch": 3251} {"train_loss": -24.985868453979492, "global_step": 269882, "epoch": 3251} {"train_loss": -25.068490982055664, "global_step": 269883, "epoch": 3251} {"train_loss": -25.19615364074707, "global_step": 269884, "epoch": 3251} {"train_loss": -24.878705978393555, "global_step": 269885, "epoch": 3251} {"train_loss": -24.743446350097656, "global_step": 269886, "epoch": 3251} {"train_loss": -25.262678146362305, "global_step": 269887, "epoch": 3251} {"train_loss": -24.977176666259766, "global_step": 269888, "epoch": 3251} {"train_loss": -24.85669708251953, "global_step": 269889, "epoch": 3251} {"train_loss": -24.92403221130371, "global_step": 269890, "epoch": 3251} {"train_loss": -25.38969612121582, "global_step": 269891, "epoch": 3251} {"train_loss": -25.036588668823242, "global_step": 269892, "epoch": 3251} {"train_loss": -25.23764419555664, "global_step": 269893, "epoch": 3251} {"train_loss": -24.856904983520508, "global_step": 269894, "epoch": 3251} {"train_loss": -24.814313888549805, "global_step": 269895, "epoch": 3251} {"train_loss": -25.3348445892334, "global_step": 269896, "epoch": 3251} {"train_loss": -25.38252830505371, "global_step": 269897, "epoch": 3251} {"train_loss": -25.547502517700195, "global_step": 269898, "epoch": 3251} {"train_loss": -25.07156753540039, "global_step": 269899, "epoch": 3251} {"train_loss": -25.13167953491211, "global_step": 269900, "epoch": 3251} {"train_loss": -25.258161544799805, "global_step": 269901, "epoch": 3251} {"train_loss": -25.420053482055664, "global_step": 269902, "epoch": 3251} {"train_loss": -25.059192657470703, "global_step": 269903, "epoch": 3251} {"train_loss": -25.406890869140625, "global_step": 269904, "epoch": 3251} {"train_loss": -25.537097930908203, "global_step": 269905, "epoch": 3251} {"train_loss": -25.40309715270996, "global_step": 269906, "epoch": 3251} {"train_loss": -25.162443161010742, "global_step": 269907, "epoch": 3251} {"train_loss": -25.28424072265625, "global_step": 269908, "epoch": 3251} {"train_loss": -25.511709213256836, "global_step": 269909, "epoch": 3251} {"train_loss": -24.979042053222656, "global_step": 269910, "epoch": 3251} {"train_loss": -25.18369483947754, "global_step": 269911, "epoch": 3251} {"train_loss": -25.028013229370117, "global_step": 269912, "epoch": 3251} {"train_loss": -25.219619750976562, "global_step": 269913, "epoch": 3251} {"train_loss": -25.3335018157959, "global_step": 269914, "epoch": 3251} {"train_loss": -25.18707406377218, "global_step": 269915, "epoch": 3251, "val_loss": 7010265.0} {"train_loss": -23.886436462402344, "global_step": 269916, "epoch": 3252} {"train_loss": -23.70977020263672, "global_step": 269917, "epoch": 3252} {"train_loss": -23.947006225585938, "global_step": 269918, "epoch": 3252} {"train_loss": -24.58642578125, "global_step": 269919, "epoch": 3252} {"train_loss": -23.985111236572266, "global_step": 269920, "epoch": 3252} {"train_loss": -24.19915199279785, "global_step": 269921, "epoch": 3252} {"train_loss": -24.635887145996094, "global_step": 269922, "epoch": 3252} {"train_loss": -24.303348541259766, "global_step": 269923, "epoch": 3252} {"train_loss": -24.501930236816406, "global_step": 269924, "epoch": 3252} {"train_loss": -24.44097900390625, "global_step": 269925, "epoch": 3252} {"train_loss": -24.808591842651367, "global_step": 269926, "epoch": 3252} {"train_loss": -24.276960372924805, "global_step": 269927, "epoch": 3252} {"train_loss": -24.691875457763672, "global_step": 269928, "epoch": 3252} {"train_loss": -24.65819549560547, "global_step": 269929, "epoch": 3252} {"train_loss": -24.88956642150879, "global_step": 269930, "epoch": 3252} {"train_loss": -25.01008415222168, "global_step": 269931, "epoch": 3252} {"train_loss": -24.307533264160156, "global_step": 269932, "epoch": 3252} {"train_loss": -24.706710815429688, "global_step": 269933, "epoch": 3252} {"train_loss": -24.937475204467773, "global_step": 269934, "epoch": 3252} {"train_loss": -24.703828811645508, "global_step": 269935, "epoch": 3252} {"train_loss": -25.227781295776367, "global_step": 269936, "epoch": 3252} {"train_loss": -24.991552352905273, "global_step": 269937, "epoch": 3252} {"train_loss": -24.93799591064453, "global_step": 269938, "epoch": 3252} {"train_loss": -25.027524948120117, "global_step": 269939, "epoch": 3252} {"train_loss": -25.056957244873047, "global_step": 269940, "epoch": 3252} {"train_loss": -24.55495262145996, "global_step": 269941, "epoch": 3252} {"train_loss": -25.242910385131836, "global_step": 269942, "epoch": 3252} {"train_loss": -25.007165908813477, "global_step": 269943, "epoch": 3252} {"train_loss": -24.91678237915039, "global_step": 269944, "epoch": 3252} {"train_loss": -24.741804122924805, "global_step": 269945, "epoch": 3252} {"train_loss": -24.8536319732666, "global_step": 269946, "epoch": 3252} {"train_loss": -25.036840438842773, "global_step": 269947, "epoch": 3252} {"train_loss": -25.212430953979492, "global_step": 269948, "epoch": 3252} {"train_loss": -25.048969268798828, "global_step": 269949, "epoch": 3252} {"train_loss": -25.339033126831055, "global_step": 269950, "epoch": 3252} {"train_loss": -24.537145614624023, "global_step": 269951, "epoch": 3252} {"train_loss": -25.234296798706055, "global_step": 269952, "epoch": 3252} {"train_loss": -25.049060821533203, "global_step": 269953, "epoch": 3252} {"train_loss": -25.23702621459961, "global_step": 269954, "epoch": 3252} {"train_loss": -25.179113388061523, "global_step": 269955, "epoch": 3252} {"train_loss": -25.110071182250977, "global_step": 269956, "epoch": 3252} {"train_loss": -25.05391502380371, "global_step": 269957, "epoch": 3252} {"train_loss": -25.043930053710938, "global_step": 269958, "epoch": 3252} {"train_loss": -25.112024307250977, "global_step": 269959, "epoch": 3252} {"train_loss": -25.452560424804688, "global_step": 269960, "epoch": 3252} {"train_loss": -25.01527214050293, "global_step": 269961, "epoch": 3252} {"train_loss": -25.443618774414062, "global_step": 269962, "epoch": 3252} {"train_loss": -25.414525985717773, "global_step": 269963, "epoch": 3252} {"train_loss": -25.289539337158203, "global_step": 269964, "epoch": 3252} {"train_loss": -25.393634796142578, "global_step": 269965, "epoch": 3252} {"train_loss": -25.335214614868164, "global_step": 269966, "epoch": 3252} {"train_loss": -25.629779815673828, "global_step": 269967, "epoch": 3252} {"train_loss": -25.34502410888672, "global_step": 269968, "epoch": 3252} {"train_loss": -25.352848052978516, "global_step": 269969, "epoch": 3252} {"train_loss": -25.273122787475586, "global_step": 269970, "epoch": 3252} {"train_loss": -25.380956649780273, "global_step": 269971, "epoch": 3252} {"train_loss": -25.397483825683594, "global_step": 269972, "epoch": 3252} {"train_loss": -25.353073120117188, "global_step": 269973, "epoch": 3252} {"train_loss": -25.21489143371582, "global_step": 269974, "epoch": 3252} {"train_loss": -25.50699234008789, "global_step": 269975, "epoch": 3252} {"train_loss": -25.553579330444336, "global_step": 269976, "epoch": 3252} {"train_loss": -25.799787521362305, "global_step": 269977, "epoch": 3252} {"train_loss": -25.068252563476562, "global_step": 269978, "epoch": 3252} {"train_loss": -25.381315231323242, "global_step": 269979, "epoch": 3252} {"train_loss": -25.373510360717773, "global_step": 269980, "epoch": 3252} {"train_loss": -25.182313919067383, "global_step": 269981, "epoch": 3252} {"train_loss": -25.22869300842285, "global_step": 269982, "epoch": 3252} {"train_loss": -25.176755905151367, "global_step": 269983, "epoch": 3252} {"train_loss": -25.412443161010742, "global_step": 269984, "epoch": 3252} {"train_loss": -25.234783172607422, "global_step": 269985, "epoch": 3252} {"train_loss": -25.516002655029297, "global_step": 269986, "epoch": 3252} {"train_loss": -25.21765899658203, "global_step": 269987, "epoch": 3252} {"train_loss": -25.3100643157959, "global_step": 269988, "epoch": 3252} {"train_loss": -25.225305557250977, "global_step": 269989, "epoch": 3252} {"train_loss": -25.145700454711914, "global_step": 269990, "epoch": 3252} {"train_loss": -25.224668502807617, "global_step": 269991, "epoch": 3252} {"train_loss": -25.197744369506836, "global_step": 269992, "epoch": 3252} {"train_loss": -25.37448501586914, "global_step": 269993, "epoch": 3252} {"train_loss": -24.981979370117188, "global_step": 269994, "epoch": 3252} {"train_loss": -25.32834815979004, "global_step": 269995, "epoch": 3252} {"train_loss": -25.64142417907715, "global_step": 269996, "epoch": 3252} {"train_loss": -25.085834503173828, "global_step": 269997, "epoch": 3252} {"train_loss": -25.02369648577219, "global_step": 269998, "epoch": 3252, "val_loss": 7021123.0} {"train_loss": -23.70692253112793, "global_step": 269999, "epoch": 3253} {"train_loss": -23.676025390625, "global_step": 270000, "epoch": 3253} {"train_loss": -23.883331298828125, "global_step": 270001, "epoch": 3253} {"train_loss": -24.270151138305664, "global_step": 270002, "epoch": 3253} {"train_loss": -24.507089614868164, "global_step": 270003, "epoch": 3253} {"train_loss": -24.457386016845703, "global_step": 270004, "epoch": 3253} {"train_loss": -24.606489181518555, "global_step": 270005, "epoch": 3253} {"train_loss": -24.824432373046875, "global_step": 270006, "epoch": 3253} {"train_loss": -24.204612731933594, "global_step": 270007, "epoch": 3253} {"train_loss": -24.847143173217773, "global_step": 270008, "epoch": 3253} {"train_loss": -24.56093406677246, "global_step": 270009, "epoch": 3253} {"train_loss": -24.424175262451172, "global_step": 270010, "epoch": 3253} {"train_loss": -24.414823532104492, "global_step": 270011, "epoch": 3253} {"train_loss": -25.32407569885254, "global_step": 270012, "epoch": 3253} {"train_loss": -24.654571533203125, "global_step": 270013, "epoch": 3253} {"train_loss": -24.928640365600586, "global_step": 270014, "epoch": 3253} {"train_loss": -24.536914825439453, "global_step": 270015, "epoch": 3253} {"train_loss": -24.944787979125977, "global_step": 270016, "epoch": 3253} {"train_loss": -24.86905288696289, "global_step": 270017, "epoch": 3253} {"train_loss": -25.1063175201416, "global_step": 270018, "epoch": 3253} {"train_loss": -25.278066635131836, "global_step": 270019, "epoch": 3253} {"train_loss": -25.34779167175293, "global_step": 270020, "epoch": 3253} {"train_loss": -25.240646362304688, "global_step": 270021, "epoch": 3253} {"train_loss": -25.00857162475586, "global_step": 270022, "epoch": 3253} {"train_loss": -25.21103858947754, "global_step": 270023, "epoch": 3253} {"train_loss": -24.705419540405273, "global_step": 270024, "epoch": 3253} {"train_loss": -25.46046257019043, "global_step": 270025, "epoch": 3253} {"train_loss": -24.886337280273438, "global_step": 270026, "epoch": 3253} {"train_loss": -25.1429500579834, "global_step": 270027, "epoch": 3253} {"train_loss": -25.3199405670166, "global_step": 270028, "epoch": 3253} {"train_loss": -25.25455093383789, "global_step": 270029, "epoch": 3253} {"train_loss": -25.305570602416992, "global_step": 270030, "epoch": 3253} {"train_loss": -25.20157241821289, "global_step": 270031, "epoch": 3253} {"train_loss": -25.223196029663086, "global_step": 270032, "epoch": 3253} {"train_loss": -25.134016036987305, "global_step": 270033, "epoch": 3253} {"train_loss": -25.416234970092773, "global_step": 270034, "epoch": 3253} {"train_loss": -24.988544464111328, "global_step": 270035, "epoch": 3253} {"train_loss": -25.379491806030273, "global_step": 270036, "epoch": 3253} {"train_loss": -25.42366600036621, "global_step": 270037, "epoch": 3253} {"train_loss": -25.19013786315918, "global_step": 270038, "epoch": 3253} {"train_loss": -25.35532569885254, "global_step": 270039, "epoch": 3253} {"train_loss": -25.150386810302734, "global_step": 270040, "epoch": 3253} {"train_loss": -25.298837661743164, "global_step": 270041, "epoch": 3253} {"train_loss": -24.960250854492188, "global_step": 270042, "epoch": 3253} {"train_loss": -25.156644821166992, "global_step": 270043, "epoch": 3253} {"train_loss": -25.404951095581055, "global_step": 270044, "epoch": 3253} {"train_loss": -25.479251861572266, "global_step": 270045, "epoch": 3253} {"train_loss": -25.420949935913086, "global_step": 270046, "epoch": 3253} {"train_loss": -25.32363510131836, "global_step": 270047, "epoch": 3253} {"train_loss": -25.336477279663086, "global_step": 270048, "epoch": 3253} {"train_loss": -25.64438819885254, "global_step": 270049, "epoch": 3253} {"train_loss": -25.105045318603516, "global_step": 270050, "epoch": 3253} {"train_loss": -25.503372192382812, "global_step": 270051, "epoch": 3253} {"train_loss": -25.56501579284668, "global_step": 270052, "epoch": 3253} {"train_loss": -25.241994857788086, "global_step": 270053, "epoch": 3253} {"train_loss": -25.553569793701172, "global_step": 270054, "epoch": 3253} {"train_loss": -25.593612670898438, "global_step": 270055, "epoch": 3253} {"train_loss": -25.281848907470703, "global_step": 270056, "epoch": 3253} {"train_loss": -25.048105239868164, "global_step": 270057, "epoch": 3253} {"train_loss": -25.291440963745117, "global_step": 270058, "epoch": 3253} {"train_loss": -25.20795249938965, "global_step": 270059, "epoch": 3253} {"train_loss": -25.294544219970703, "global_step": 270060, "epoch": 3253} {"train_loss": -25.537954330444336, "global_step": 270061, "epoch": 3253} {"train_loss": -24.87346649169922, "global_step": 270062, "epoch": 3253} {"train_loss": -24.63614273071289, "global_step": 270063, "epoch": 3253} {"train_loss": -25.558547973632812, "global_step": 270064, "epoch": 3253} {"train_loss": -25.317874908447266, "global_step": 270065, "epoch": 3253} {"train_loss": -25.068296432495117, "global_step": 270066, "epoch": 3253} {"train_loss": -25.690710067749023, "global_step": 270067, "epoch": 3253} {"train_loss": -25.073076248168945, "global_step": 270068, "epoch": 3253} {"train_loss": -24.965150833129883, "global_step": 270069, "epoch": 3253} {"train_loss": -25.330015182495117, "global_step": 270070, "epoch": 3253} {"train_loss": -25.18375015258789, "global_step": 270071, "epoch": 3253} {"train_loss": -25.118192672729492, "global_step": 270072, "epoch": 3253} {"train_loss": -25.321598052978516, "global_step": 270073, "epoch": 3253} {"train_loss": -25.72425651550293, "global_step": 270074, "epoch": 3253} {"train_loss": -25.4753475189209, "global_step": 270075, "epoch": 3253} {"train_loss": -25.40167999267578, "global_step": 270076, "epoch": 3253} {"train_loss": -25.474302291870117, "global_step": 270077, "epoch": 3253} {"train_loss": -25.249910354614258, "global_step": 270078, "epoch": 3253} {"train_loss": -25.539228439331055, "global_step": 270079, "epoch": 3253} {"train_loss": -25.721973419189453, "global_step": 270080, "epoch": 3253} {"train_loss": -25.10635658631842, "global_step": 270081, "epoch": 3253, "val_loss": 6930999.0} {"train_loss": -24.943038940429688, "global_step": 270082, "epoch": 3254} {"train_loss": -24.909414291381836, "global_step": 270083, "epoch": 3254} {"train_loss": -24.821399688720703, "global_step": 270084, "epoch": 3254} {"train_loss": -24.70746421813965, "global_step": 270085, "epoch": 3254} {"train_loss": -24.542890548706055, "global_step": 270086, "epoch": 3254} {"train_loss": -25.279987335205078, "global_step": 270087, "epoch": 3254} {"train_loss": -24.724212646484375, "global_step": 270088, "epoch": 3254} {"train_loss": -25.051223754882812, "global_step": 270089, "epoch": 3254} {"train_loss": -24.936044692993164, "global_step": 270090, "epoch": 3254} {"train_loss": -24.789926528930664, "global_step": 270091, "epoch": 3254} {"train_loss": -24.827495574951172, "global_step": 270092, "epoch": 3254} {"train_loss": -25.238004684448242, "global_step": 270093, "epoch": 3254} {"train_loss": -24.979337692260742, "global_step": 270094, "epoch": 3254} {"train_loss": -25.0236759185791, "global_step": 270095, "epoch": 3254} {"train_loss": -25.17463493347168, "global_step": 270096, "epoch": 3254} {"train_loss": -24.866313934326172, "global_step": 270097, "epoch": 3254} {"train_loss": -25.262903213500977, "global_step": 270098, "epoch": 3254} {"train_loss": -25.27147674560547, "global_step": 270099, "epoch": 3254} {"train_loss": -25.146940231323242, "global_step": 270100, "epoch": 3254} {"train_loss": -24.78248405456543, "global_step": 270101, "epoch": 3254} {"train_loss": -25.101953506469727, "global_step": 270102, "epoch": 3254} {"train_loss": -25.161636352539062, "global_step": 270103, "epoch": 3254} {"train_loss": -24.849136352539062, "global_step": 270104, "epoch": 3254} {"train_loss": -25.4841365814209, "global_step": 270105, "epoch": 3254} {"train_loss": -25.288801193237305, "global_step": 270106, "epoch": 3254} {"train_loss": -25.210142135620117, "global_step": 270107, "epoch": 3254} {"train_loss": -25.17024803161621, "global_step": 270108, "epoch": 3254} {"train_loss": -25.363008499145508, "global_step": 270109, "epoch": 3254} {"train_loss": -25.478593826293945, "global_step": 270110, "epoch": 3254} {"train_loss": -25.3157958984375, "global_step": 270111, "epoch": 3254} {"train_loss": -25.1980037689209, "global_step": 270112, "epoch": 3254} {"train_loss": -25.269546508789062, "global_step": 270113, "epoch": 3254} {"train_loss": -25.373563766479492, "global_step": 270114, "epoch": 3254} {"train_loss": -25.542648315429688, "global_step": 270115, "epoch": 3254} {"train_loss": -25.140670776367188, "global_step": 270116, "epoch": 3254} {"train_loss": -25.69205093383789, "global_step": 270117, "epoch": 3254} {"train_loss": -25.6107177734375, "global_step": 270118, "epoch": 3254} {"train_loss": -25.32045555114746, "global_step": 270119, "epoch": 3254} {"train_loss": -25.685382843017578, "global_step": 270120, "epoch": 3254} {"train_loss": -25.434812545776367, "global_step": 270121, "epoch": 3254} {"train_loss": -25.478689193725586, "global_step": 270122, "epoch": 3254} {"train_loss": -25.556961059570312, "global_step": 270123, "epoch": 3254} {"train_loss": -25.503538131713867, "global_step": 270124, "epoch": 3254} {"train_loss": -25.046255111694336, "global_step": 270125, "epoch": 3254} {"train_loss": -25.378503799438477, "global_step": 270126, "epoch": 3254} {"train_loss": -25.34588623046875, "global_step": 270127, "epoch": 3254} {"train_loss": -25.05942153930664, "global_step": 270128, "epoch": 3254} {"train_loss": -25.659515380859375, "global_step": 270129, "epoch": 3254} {"train_loss": -25.275497436523438, "global_step": 270130, "epoch": 3254} {"train_loss": -25.242088317871094, "global_step": 270131, "epoch": 3254} {"train_loss": -25.24163818359375, "global_step": 270132, "epoch": 3254} {"train_loss": -25.16754150390625, "global_step": 270133, "epoch": 3254} {"train_loss": -25.450231552124023, "global_step": 270134, "epoch": 3254} {"train_loss": -25.674880981445312, "global_step": 270135, "epoch": 3254} {"train_loss": -25.695722579956055, "global_step": 270136, "epoch": 3254} {"train_loss": -25.25485610961914, "global_step": 270137, "epoch": 3254} {"train_loss": -25.392032623291016, "global_step": 270138, "epoch": 3254} {"train_loss": -25.53152847290039, "global_step": 270139, "epoch": 3254} {"train_loss": -25.059701919555664, "global_step": 270140, "epoch": 3254} {"train_loss": -25.535411834716797, "global_step": 270141, "epoch": 3254} {"train_loss": -25.056264877319336, "global_step": 270142, "epoch": 3254} {"train_loss": -25.377004623413086, "global_step": 270143, "epoch": 3254} {"train_loss": -25.736967086791992, "global_step": 270144, "epoch": 3254} {"train_loss": -25.30261993408203, "global_step": 270145, "epoch": 3254} {"train_loss": -25.336698532104492, "global_step": 270146, "epoch": 3254} {"train_loss": -25.432357788085938, "global_step": 270147, "epoch": 3254} {"train_loss": -25.34032440185547, "global_step": 270148, "epoch": 3254} {"train_loss": -25.238554000854492, "global_step": 270149, "epoch": 3254} {"train_loss": -25.139892578125, "global_step": 270150, "epoch": 3254} {"train_loss": -25.613183975219727, "global_step": 270151, "epoch": 3254} {"train_loss": -25.199413299560547, "global_step": 270152, "epoch": 3254} {"train_loss": -25.264156341552734, "global_step": 270153, "epoch": 3254} {"train_loss": -25.598520278930664, "global_step": 270154, "epoch": 3254} {"train_loss": -25.471677780151367, "global_step": 270155, "epoch": 3254} {"train_loss": -25.175397872924805, "global_step": 270156, "epoch": 3254} {"train_loss": -25.390188217163086, "global_step": 270157, "epoch": 3254} {"train_loss": -25.35323143005371, "global_step": 270158, "epoch": 3254} {"train_loss": -25.547780990600586, "global_step": 270159, "epoch": 3254} {"train_loss": -25.324787139892578, "global_step": 270160, "epoch": 3254} {"train_loss": -25.500288009643555, "global_step": 270161, "epoch": 3254} {"train_loss": -25.183835983276367, "global_step": 270162, "epoch": 3254} {"train_loss": -25.445737838745117, "global_step": 270163, "epoch": 3254} {"train_loss": -25.253593100122657, "global_step": 270164, "epoch": 3254, "val_loss": 7123374.0} {"train_loss": -24.64365005493164, "global_step": 270165, "epoch": 3255} {"train_loss": -24.441537857055664, "global_step": 270166, "epoch": 3255} {"train_loss": -24.675012588500977, "global_step": 270167, "epoch": 3255} {"train_loss": -24.375051498413086, "global_step": 270168, "epoch": 3255} {"train_loss": -24.689828872680664, "global_step": 270169, "epoch": 3255} {"train_loss": -24.661279678344727, "global_step": 270170, "epoch": 3255} {"train_loss": -24.593664169311523, "global_step": 270171, "epoch": 3255} {"train_loss": -24.50054931640625, "global_step": 270172, "epoch": 3255} {"train_loss": -24.696317672729492, "global_step": 270173, "epoch": 3255} {"train_loss": -24.7309513092041, "global_step": 270174, "epoch": 3255} {"train_loss": -24.841651916503906, "global_step": 270175, "epoch": 3255} {"train_loss": -24.93348503112793, "global_step": 270176, "epoch": 3255} {"train_loss": -24.53995704650879, "global_step": 270177, "epoch": 3255} {"train_loss": -24.759328842163086, "global_step": 270178, "epoch": 3255} {"train_loss": -24.389530181884766, "global_step": 270179, "epoch": 3255} {"train_loss": -25.06964111328125, "global_step": 270180, "epoch": 3255} {"train_loss": -24.927444458007812, "global_step": 270181, "epoch": 3255} {"train_loss": -25.02350425720215, "global_step": 270182, "epoch": 3255} {"train_loss": -24.956357955932617, "global_step": 270183, "epoch": 3255} {"train_loss": -25.240453720092773, "global_step": 270184, "epoch": 3255} {"train_loss": -25.167142868041992, "global_step": 270185, "epoch": 3255} {"train_loss": -25.00424575805664, "global_step": 270186, "epoch": 3255} {"train_loss": -25.008787155151367, "global_step": 270187, "epoch": 3255} {"train_loss": -25.171504974365234, "global_step": 270188, "epoch": 3255} {"train_loss": -25.217756271362305, "global_step": 270189, "epoch": 3255} {"train_loss": -25.21539878845215, "global_step": 270190, "epoch": 3255} {"train_loss": -25.011945724487305, "global_step": 270191, "epoch": 3255} {"train_loss": -24.947324752807617, "global_step": 270192, "epoch": 3255} {"train_loss": -24.76609230041504, "global_step": 270193, "epoch": 3255} {"train_loss": -25.218420028686523, "global_step": 270194, "epoch": 3255} {"train_loss": -24.970060348510742, "global_step": 270195, "epoch": 3255} {"train_loss": -25.02252769470215, "global_step": 270196, "epoch": 3255} {"train_loss": -25.19866371154785, "global_step": 270197, "epoch": 3255} {"train_loss": -25.101842880249023, "global_step": 270198, "epoch": 3255} {"train_loss": -25.31271743774414, "global_step": 270199, "epoch": 3255} {"train_loss": -25.670217514038086, "global_step": 270200, "epoch": 3255} {"train_loss": -25.095853805541992, "global_step": 270201, "epoch": 3255} {"train_loss": -25.54253578186035, "global_step": 270202, "epoch": 3255} {"train_loss": -25.483823776245117, "global_step": 270203, "epoch": 3255} {"train_loss": -25.6591739654541, "global_step": 270204, "epoch": 3255} {"train_loss": -25.277761459350586, "global_step": 270205, "epoch": 3255} {"train_loss": -25.40706443786621, "global_step": 270206, "epoch": 3255} {"train_loss": -25.204898834228516, "global_step": 270207, "epoch": 3255} {"train_loss": -25.33930015563965, "global_step": 270208, "epoch": 3255} {"train_loss": -25.16233253479004, "global_step": 270209, "epoch": 3255} {"train_loss": -25.526979446411133, "global_step": 270210, "epoch": 3255} {"train_loss": -25.359832763671875, "global_step": 270211, "epoch": 3255} {"train_loss": -25.192840576171875, "global_step": 270212, "epoch": 3255} {"train_loss": -25.220815658569336, "global_step": 270213, "epoch": 3255} {"train_loss": -25.140378952026367, "global_step": 270214, "epoch": 3255} {"train_loss": -25.41751480102539, "global_step": 270215, "epoch": 3255} {"train_loss": -25.11913299560547, "global_step": 270216, "epoch": 3255} {"train_loss": -25.27663803100586, "global_step": 270217, "epoch": 3255} {"train_loss": -25.763147354125977, "global_step": 270218, "epoch": 3255} {"train_loss": -25.337730407714844, "global_step": 270219, "epoch": 3255} {"train_loss": -25.21135139465332, "global_step": 270220, "epoch": 3255} {"train_loss": -24.884000778198242, "global_step": 270221, "epoch": 3255} {"train_loss": -24.517587661743164, "global_step": 270222, "epoch": 3255} {"train_loss": -25.008020401000977, "global_step": 270223, "epoch": 3255} {"train_loss": -25.939563751220703, "global_step": 270224, "epoch": 3255} {"train_loss": -25.094457626342773, "global_step": 270225, "epoch": 3255} {"train_loss": -25.27560043334961, "global_step": 270226, "epoch": 3255} {"train_loss": -25.357410430908203, "global_step": 270227, "epoch": 3255} {"train_loss": -25.19819450378418, "global_step": 270228, "epoch": 3255} {"train_loss": -25.449506759643555, "global_step": 270229, "epoch": 3255} {"train_loss": -24.90296745300293, "global_step": 270230, "epoch": 3255} {"train_loss": -25.885852813720703, "global_step": 270231, "epoch": 3255} {"train_loss": -25.413333892822266, "global_step": 270232, "epoch": 3255} {"train_loss": -25.496713638305664, "global_step": 270233, "epoch": 3255} {"train_loss": -25.551259994506836, "global_step": 270234, "epoch": 3255} {"train_loss": -25.098787307739258, "global_step": 270235, "epoch": 3255} {"train_loss": -25.561559677124023, "global_step": 270236, "epoch": 3255} {"train_loss": -24.72102928161621, "global_step": 270237, "epoch": 3255} {"train_loss": -25.2195987701416, "global_step": 270238, "epoch": 3255} {"train_loss": -25.239614486694336, "global_step": 270239, "epoch": 3255} {"train_loss": -25.10350799560547, "global_step": 270240, "epoch": 3255} {"train_loss": -25.249698638916016, "global_step": 270241, "epoch": 3255} {"train_loss": -25.0208740234375, "global_step": 270242, "epoch": 3255} {"train_loss": -24.900676727294922, "global_step": 270243, "epoch": 3255} {"train_loss": -25.008703231811523, "global_step": 270244, "epoch": 3255} {"train_loss": -25.011009216308594, "global_step": 270245, "epoch": 3255} {"train_loss": -24.72498893737793, "global_step": 270246, "epoch": 3255} {"train_loss": -25.11109561230763, "global_step": 270247, "epoch": 3255, "val_loss": 7064497.5} {"train_loss": -24.35113525390625, "global_step": 270248, "epoch": 3256} {"train_loss": -24.99716567993164, "global_step": 270249, "epoch": 3256} {"train_loss": -24.466873168945312, "global_step": 270250, "epoch": 3256} {"train_loss": -24.480051040649414, "global_step": 270251, "epoch": 3256} {"train_loss": -24.497352600097656, "global_step": 270252, "epoch": 3256} {"train_loss": -24.87698745727539, "global_step": 270253, "epoch": 3256} {"train_loss": -24.726646423339844, "global_step": 270254, "epoch": 3256} {"train_loss": -24.746076583862305, "global_step": 270255, "epoch": 3256} {"train_loss": -24.974994659423828, "global_step": 270256, "epoch": 3256} {"train_loss": -24.91411590576172, "global_step": 270257, "epoch": 3256} {"train_loss": -24.648099899291992, "global_step": 270258, "epoch": 3256} {"train_loss": -25.033039093017578, "global_step": 270259, "epoch": 3256} {"train_loss": -24.961938858032227, "global_step": 270260, "epoch": 3256} {"train_loss": -25.02691650390625, "global_step": 270261, "epoch": 3256} {"train_loss": -25.361631393432617, "global_step": 270262, "epoch": 3256} {"train_loss": -25.1500186920166, "global_step": 270263, "epoch": 3256} {"train_loss": -25.046823501586914, "global_step": 270264, "epoch": 3256} {"train_loss": -25.085187911987305, "global_step": 270265, "epoch": 3256} {"train_loss": -25.018186569213867, "global_step": 270266, "epoch": 3256} {"train_loss": -24.91997528076172, "global_step": 270267, "epoch": 3256} {"train_loss": -25.095563888549805, "global_step": 270268, "epoch": 3256} {"train_loss": -24.95547866821289, "global_step": 270269, "epoch": 3256} {"train_loss": -24.874683380126953, "global_step": 270270, "epoch": 3256} {"train_loss": -25.491193771362305, "global_step": 270271, "epoch": 3256} {"train_loss": -25.183698654174805, "global_step": 270272, "epoch": 3256} {"train_loss": -24.729541778564453, "global_step": 270273, "epoch": 3256} {"train_loss": -25.16883659362793, "global_step": 270274, "epoch": 3256} {"train_loss": -25.57696533203125, "global_step": 270275, "epoch": 3256} {"train_loss": -25.339231491088867, "global_step": 270276, "epoch": 3256} {"train_loss": -25.12067985534668, "global_step": 270277, "epoch": 3256} {"train_loss": -25.444387435913086, "global_step": 270278, "epoch": 3256} {"train_loss": -25.380334854125977, "global_step": 270279, "epoch": 3256} {"train_loss": -25.244169235229492, "global_step": 270280, "epoch": 3256} {"train_loss": -25.27841567993164, "global_step": 270281, "epoch": 3256} {"train_loss": -25.585432052612305, "global_step": 270282, "epoch": 3256} {"train_loss": -25.453664779663086, "global_step": 270283, "epoch": 3256} {"train_loss": -25.41421127319336, "global_step": 270284, "epoch": 3256} {"train_loss": -25.174413681030273, "global_step": 270285, "epoch": 3256} {"train_loss": -25.419706344604492, "global_step": 270286, "epoch": 3256} {"train_loss": -25.17433738708496, "global_step": 270287, "epoch": 3256} {"train_loss": -24.971193313598633, "global_step": 270288, "epoch": 3256} {"train_loss": -25.463415145874023, "global_step": 270289, "epoch": 3256} {"train_loss": -25.451736450195312, "global_step": 270290, "epoch": 3256} {"train_loss": -25.380172729492188, "global_step": 270291, "epoch": 3256} {"train_loss": -25.200407028198242, "global_step": 270292, "epoch": 3256} {"train_loss": -25.61404800415039, "global_step": 270293, "epoch": 3256} {"train_loss": -24.863340377807617, "global_step": 270294, "epoch": 3256} {"train_loss": -25.07954216003418, "global_step": 270295, "epoch": 3256} {"train_loss": -25.158187866210938, "global_step": 270296, "epoch": 3256} {"train_loss": -25.225149154663086, "global_step": 270297, "epoch": 3256} {"train_loss": -25.76734733581543, "global_step": 270298, "epoch": 3256} {"train_loss": -25.27480125427246, "global_step": 270299, "epoch": 3256} {"train_loss": -25.37415885925293, "global_step": 270300, "epoch": 3256} {"train_loss": -25.565818786621094, "global_step": 270301, "epoch": 3256} {"train_loss": -25.106414794921875, "global_step": 270302, "epoch": 3256} {"train_loss": -25.110132217407227, "global_step": 270303, "epoch": 3256} {"train_loss": -25.539016723632812, "global_step": 270304, "epoch": 3256} {"train_loss": -25.38029670715332, "global_step": 270305, "epoch": 3256} {"train_loss": -25.2376766204834, "global_step": 270306, "epoch": 3256} {"train_loss": -25.377004623413086, "global_step": 270307, "epoch": 3256} {"train_loss": -25.825820922851562, "global_step": 270308, "epoch": 3256} {"train_loss": -25.229719161987305, "global_step": 270309, "epoch": 3256} {"train_loss": -25.481847763061523, "global_step": 270310, "epoch": 3256} {"train_loss": -25.55128288269043, "global_step": 270311, "epoch": 3256} {"train_loss": -25.5346622467041, "global_step": 270312, "epoch": 3256} {"train_loss": -25.600427627563477, "global_step": 270313, "epoch": 3256} {"train_loss": -25.643884658813477, "global_step": 270314, "epoch": 3256} {"train_loss": -25.573232650756836, "global_step": 270315, "epoch": 3256} {"train_loss": -25.5546932220459, "global_step": 270316, "epoch": 3256} {"train_loss": -25.024160385131836, "global_step": 270317, "epoch": 3256} {"train_loss": -25.51240348815918, "global_step": 270318, "epoch": 3256} {"train_loss": -25.469009399414062, "global_step": 270319, "epoch": 3256} {"train_loss": -25.02592658996582, "global_step": 270320, "epoch": 3256} {"train_loss": -25.223127365112305, "global_step": 270321, "epoch": 3256} {"train_loss": -25.530431747436523, "global_step": 270322, "epoch": 3256} {"train_loss": -25.29732322692871, "global_step": 270323, "epoch": 3256} {"train_loss": -25.52478790283203, "global_step": 270324, "epoch": 3256} {"train_loss": -25.398395538330078, "global_step": 270325, "epoch": 3256} {"train_loss": -25.082143783569336, "global_step": 270326, "epoch": 3256} {"train_loss": -25.445222854614258, "global_step": 270327, "epoch": 3256} {"train_loss": -25.185972213745117, "global_step": 270328, "epoch": 3256} {"train_loss": -24.817087173461914, "global_step": 270329, "epoch": 3256} {"train_loss": -25.186036810817487, "global_step": 270330, "epoch": 3256, "val_loss": 6976276.5} {"train_loss": -25.00766944885254, "global_step": 270331, "epoch": 3257} {"train_loss": -23.921804428100586, "global_step": 270332, "epoch": 3257} {"train_loss": -24.106552124023438, "global_step": 270333, "epoch": 3257} {"train_loss": -24.31574821472168, "global_step": 270334, "epoch": 3257} {"train_loss": -24.36927604675293, "global_step": 270335, "epoch": 3257} {"train_loss": -24.585987091064453, "global_step": 270336, "epoch": 3257} {"train_loss": -24.422122955322266, "global_step": 270337, "epoch": 3257} {"train_loss": -24.754150390625, "global_step": 270338, "epoch": 3257} {"train_loss": -24.919443130493164, "global_step": 270339, "epoch": 3257} {"train_loss": -24.8646297454834, "global_step": 270340, "epoch": 3257} {"train_loss": -25.13442039489746, "global_step": 270341, "epoch": 3257} {"train_loss": -24.643484115600586, "global_step": 270342, "epoch": 3257} {"train_loss": -24.735231399536133, "global_step": 270343, "epoch": 3257} {"train_loss": -24.55387306213379, "global_step": 270344, "epoch": 3257} {"train_loss": -24.89082145690918, "global_step": 270345, "epoch": 3257} {"train_loss": -24.55091667175293, "global_step": 270346, "epoch": 3257} {"train_loss": -25.216554641723633, "global_step": 270347, "epoch": 3257} {"train_loss": -24.68588638305664, "global_step": 270348, "epoch": 3257} {"train_loss": -24.774219512939453, "global_step": 270349, "epoch": 3257} {"train_loss": -24.75550079345703, "global_step": 270350, "epoch": 3257} {"train_loss": -24.956750869750977, "global_step": 270351, "epoch": 3257} {"train_loss": -24.4061222076416, "global_step": 270352, "epoch": 3257} {"train_loss": -24.867849349975586, "global_step": 270353, "epoch": 3257} {"train_loss": -24.952476501464844, "global_step": 270354, "epoch": 3257} {"train_loss": -24.954511642456055, "global_step": 270355, "epoch": 3257} {"train_loss": -24.89869499206543, "global_step": 270356, "epoch": 3257} {"train_loss": -24.907459259033203, "global_step": 270357, "epoch": 3257} {"train_loss": -25.05316925048828, "global_step": 270358, "epoch": 3257} {"train_loss": -24.947071075439453, "global_step": 270359, "epoch": 3257} {"train_loss": -24.97903823852539, "global_step": 270360, "epoch": 3257} {"train_loss": -25.086164474487305, "global_step": 270361, "epoch": 3257} {"train_loss": -25.32780647277832, "global_step": 270362, "epoch": 3257} {"train_loss": -24.926300048828125, "global_step": 270363, "epoch": 3257} {"train_loss": -25.157331466674805, "global_step": 270364, "epoch": 3257} {"train_loss": -25.032621383666992, "global_step": 270365, "epoch": 3257} {"train_loss": -25.139455795288086, "global_step": 270366, "epoch": 3257} {"train_loss": -25.44516372680664, "global_step": 270367, "epoch": 3257} {"train_loss": -25.237470626831055, "global_step": 270368, "epoch": 3257} {"train_loss": -25.094499588012695, "global_step": 270369, "epoch": 3257} {"train_loss": -25.093687057495117, "global_step": 270370, "epoch": 3257} {"train_loss": -25.243343353271484, "global_step": 270371, "epoch": 3257} {"train_loss": -25.225902557373047, "global_step": 270372, "epoch": 3257} {"train_loss": -25.387495040893555, "global_step": 270373, "epoch": 3257} {"train_loss": -25.165325164794922, "global_step": 270374, "epoch": 3257} {"train_loss": -25.698530197143555, "global_step": 270375, "epoch": 3257} {"train_loss": -24.999963760375977, "global_step": 270376, "epoch": 3257} {"train_loss": -25.307538986206055, "global_step": 270377, "epoch": 3257} {"train_loss": -25.3360538482666, "global_step": 270378, "epoch": 3257} {"train_loss": -25.055585861206055, "global_step": 270379, "epoch": 3257} {"train_loss": -25.4116268157959, "global_step": 270380, "epoch": 3257} {"train_loss": -25.315176010131836, "global_step": 270381, "epoch": 3257} {"train_loss": -25.105737686157227, "global_step": 270382, "epoch": 3257} {"train_loss": -25.686365127563477, "global_step": 270383, "epoch": 3257} {"train_loss": -25.27147102355957, "global_step": 270384, "epoch": 3257} {"train_loss": -25.155872344970703, "global_step": 270385, "epoch": 3257} {"train_loss": -25.4457950592041, "global_step": 270386, "epoch": 3257} {"train_loss": -25.44306182861328, "global_step": 270387, "epoch": 3257} {"train_loss": -25.544015884399414, "global_step": 270388, "epoch": 3257} {"train_loss": -25.36958122253418, "global_step": 270389, "epoch": 3257} {"train_loss": -25.137123107910156, "global_step": 270390, "epoch": 3257} {"train_loss": -25.265113830566406, "global_step": 270391, "epoch": 3257} {"train_loss": -25.601886749267578, "global_step": 270392, "epoch": 3257} {"train_loss": -25.507658004760742, "global_step": 270393, "epoch": 3257} {"train_loss": -25.682729721069336, "global_step": 270394, "epoch": 3257} {"train_loss": -25.34477424621582, "global_step": 270395, "epoch": 3257} {"train_loss": -25.342960357666016, "global_step": 270396, "epoch": 3257} {"train_loss": -25.387067794799805, "global_step": 270397, "epoch": 3257} {"train_loss": -25.32105255126953, "global_step": 270398, "epoch": 3257} {"train_loss": -25.244314193725586, "global_step": 270399, "epoch": 3257} {"train_loss": -24.939748764038086, "global_step": 270400, "epoch": 3257} {"train_loss": -25.23320770263672, "global_step": 270401, "epoch": 3257} {"train_loss": -25.442411422729492, "global_step": 270402, "epoch": 3257} {"train_loss": -25.14154624938965, "global_step": 270403, "epoch": 3257} {"train_loss": -25.484037399291992, "global_step": 270404, "epoch": 3257} {"train_loss": -25.406015396118164, "global_step": 270405, "epoch": 3257} {"train_loss": -25.851011276245117, "global_step": 270406, "epoch": 3257} {"train_loss": -25.545907974243164, "global_step": 270407, "epoch": 3257} {"train_loss": -25.392568588256836, "global_step": 270408, "epoch": 3257} {"train_loss": -25.534757614135742, "global_step": 270409, "epoch": 3257} {"train_loss": -25.44335174560547, "global_step": 270410, "epoch": 3257} {"train_loss": -25.46918296813965, "global_step": 270411, "epoch": 3257} {"train_loss": -25.545751571655273, "global_step": 270412, "epoch": 3257} {"train_loss": -25.086174516792756, "global_step": 270413, "epoch": 3257, "val_loss": 6928050.5} {"train_loss": -24.76569366455078, "global_step": 270414, "epoch": 3258} {"train_loss": -24.6857852935791, "global_step": 270415, "epoch": 3258} {"train_loss": -25.012252807617188, "global_step": 270416, "epoch": 3258} {"train_loss": -25.081157684326172, "global_step": 270417, "epoch": 3258} {"train_loss": -24.28549575805664, "global_step": 270418, "epoch": 3258} {"train_loss": -25.122812271118164, "global_step": 270419, "epoch": 3258} {"train_loss": -24.892902374267578, "global_step": 270420, "epoch": 3258} {"train_loss": -24.81498146057129, "global_step": 270421, "epoch": 3258} {"train_loss": -25.168699264526367, "global_step": 270422, "epoch": 3258} {"train_loss": -25.196552276611328, "global_step": 270423, "epoch": 3258} {"train_loss": -25.299367904663086, "global_step": 270424, "epoch": 3258} {"train_loss": -24.92399787902832, "global_step": 270425, "epoch": 3258} {"train_loss": -24.914533615112305, "global_step": 270426, "epoch": 3258} {"train_loss": -24.935270309448242, "global_step": 270427, "epoch": 3258} {"train_loss": -25.171932220458984, "global_step": 270428, "epoch": 3258} {"train_loss": -24.825777053833008, "global_step": 270429, "epoch": 3258} {"train_loss": -25.20297622680664, "global_step": 270430, "epoch": 3258} {"train_loss": -24.90334129333496, "global_step": 270431, "epoch": 3258} {"train_loss": -25.470401763916016, "global_step": 270432, "epoch": 3258} {"train_loss": -25.38204002380371, "global_step": 270433, "epoch": 3258} {"train_loss": -25.58003044128418, "global_step": 270434, "epoch": 3258} {"train_loss": -25.35371971130371, "global_step": 270435, "epoch": 3258} {"train_loss": -25.113882064819336, "global_step": 270436, "epoch": 3258} {"train_loss": -25.168228149414062, "global_step": 270437, "epoch": 3258} {"train_loss": -25.218671798706055, "global_step": 270438, "epoch": 3258} {"train_loss": -25.056615829467773, "global_step": 270439, "epoch": 3258} {"train_loss": -25.295705795288086, "global_step": 270440, "epoch": 3258} {"train_loss": -25.496919631958008, "global_step": 270441, "epoch": 3258} {"train_loss": -25.22333335876465, "global_step": 270442, "epoch": 3258} {"train_loss": -25.5672550201416, "global_step": 270443, "epoch": 3258} {"train_loss": -25.170591354370117, "global_step": 270444, "epoch": 3258} {"train_loss": -25.447975158691406, "global_step": 270445, "epoch": 3258} {"train_loss": -25.58186912536621, "global_step": 270446, "epoch": 3258} {"train_loss": -25.242979049682617, "global_step": 270447, "epoch": 3258} {"train_loss": -25.332523345947266, "global_step": 270448, "epoch": 3258} {"train_loss": -25.23204803466797, "global_step": 270449, "epoch": 3258} {"train_loss": -25.51157569885254, "global_step": 270450, "epoch": 3258} {"train_loss": -25.542646408081055, "global_step": 270451, "epoch": 3258} {"train_loss": -25.232492446899414, "global_step": 270452, "epoch": 3258} {"train_loss": -24.922605514526367, "global_step": 270453, "epoch": 3258} {"train_loss": -25.348182678222656, "global_step": 270454, "epoch": 3258} {"train_loss": -25.72730827331543, "global_step": 270455, "epoch": 3258} {"train_loss": -25.16655921936035, "global_step": 270456, "epoch": 3258} {"train_loss": -25.114761352539062, "global_step": 270457, "epoch": 3258} {"train_loss": -25.149648666381836, "global_step": 270458, "epoch": 3258} {"train_loss": -25.273008346557617, "global_step": 270459, "epoch": 3258} {"train_loss": -25.3825626373291, "global_step": 270460, "epoch": 3258} {"train_loss": -25.418590545654297, "global_step": 270461, "epoch": 3258} {"train_loss": -25.187108993530273, "global_step": 270462, "epoch": 3258} {"train_loss": -25.51503562927246, "global_step": 270463, "epoch": 3258} {"train_loss": -25.709064483642578, "global_step": 270464, "epoch": 3258} {"train_loss": -25.2844295501709, "global_step": 270465, "epoch": 3258} {"train_loss": -25.301145553588867, "global_step": 270466, "epoch": 3258} {"train_loss": -25.249168395996094, "global_step": 270467, "epoch": 3258} {"train_loss": -25.40987777709961, "global_step": 270468, "epoch": 3258} {"train_loss": -25.36475944519043, "global_step": 270469, "epoch": 3258} {"train_loss": -25.5765380859375, "global_step": 270470, "epoch": 3258} {"train_loss": -25.480756759643555, "global_step": 270471, "epoch": 3258} {"train_loss": -25.082740783691406, "global_step": 270472, "epoch": 3258} {"train_loss": -25.069721221923828, "global_step": 270473, "epoch": 3258} {"train_loss": -25.10638427734375, "global_step": 270474, "epoch": 3258} {"train_loss": -24.994199752807617, "global_step": 270475, "epoch": 3258} {"train_loss": -25.218679428100586, "global_step": 270476, "epoch": 3258} {"train_loss": -25.450132369995117, "global_step": 270477, "epoch": 3258} {"train_loss": -25.286792755126953, "global_step": 270478, "epoch": 3258} {"train_loss": -25.537004470825195, "global_step": 270479, "epoch": 3258} {"train_loss": -25.467084884643555, "global_step": 270480, "epoch": 3258} {"train_loss": -25.348920822143555, "global_step": 270481, "epoch": 3258} {"train_loss": -25.2913761138916, "global_step": 270482, "epoch": 3258} {"train_loss": -25.33405113220215, "global_step": 270483, "epoch": 3258} {"train_loss": -25.728256225585938, "global_step": 270484, "epoch": 3258} {"train_loss": -25.27530860900879, "global_step": 270485, "epoch": 3258} {"train_loss": -25.280139923095703, "global_step": 270486, "epoch": 3258} {"train_loss": -25.53713607788086, "global_step": 270487, "epoch": 3258} {"train_loss": -25.393030166625977, "global_step": 270488, "epoch": 3258} {"train_loss": -25.255298614501953, "global_step": 270489, "epoch": 3258} {"train_loss": -25.296062469482422, "global_step": 270490, "epoch": 3258} {"train_loss": -25.41615104675293, "global_step": 270491, "epoch": 3258} {"train_loss": -25.728498458862305, "global_step": 270492, "epoch": 3258} {"train_loss": -25.289358139038086, "global_step": 270493, "epoch": 3258} {"train_loss": -25.324365615844727, "global_step": 270494, "epoch": 3258} {"train_loss": -25.27181053161621, "global_step": 270495, "epoch": 3258} {"train_loss": -25.238386774637615, "global_step": 270496, "epoch": 3258, "val_loss": 6938667.0} {"train_loss": -25.115150451660156, "global_step": 270497, "epoch": 3259} {"train_loss": -25.144594192504883, "global_step": 270498, "epoch": 3259} {"train_loss": -25.209644317626953, "global_step": 270499, "epoch": 3259} {"train_loss": -24.781391143798828, "global_step": 270500, "epoch": 3259} {"train_loss": -24.62538719177246, "global_step": 270501, "epoch": 3259} {"train_loss": -25.34134292602539, "global_step": 270502, "epoch": 3259} {"train_loss": -24.802810668945312, "global_step": 270503, "epoch": 3259} {"train_loss": -24.87052345275879, "global_step": 270504, "epoch": 3259} {"train_loss": -24.8531494140625, "global_step": 270505, "epoch": 3259} {"train_loss": -24.9240665435791, "global_step": 270506, "epoch": 3259} {"train_loss": -24.970809936523438, "global_step": 270507, "epoch": 3259} {"train_loss": -25.066173553466797, "global_step": 270508, "epoch": 3259} {"train_loss": -24.633817672729492, "global_step": 270509, "epoch": 3259} {"train_loss": -24.83430290222168, "global_step": 270510, "epoch": 3259} {"train_loss": -25.02029800415039, "global_step": 270511, "epoch": 3259} {"train_loss": -24.95301055908203, "global_step": 270512, "epoch": 3259} {"train_loss": -25.073532104492188, "global_step": 270513, "epoch": 3259} {"train_loss": -24.99854850769043, "global_step": 270514, "epoch": 3259} {"train_loss": -25.14008903503418, "global_step": 270515, "epoch": 3259} {"train_loss": -25.07270050048828, "global_step": 270516, "epoch": 3259} {"train_loss": -25.180295944213867, "global_step": 270517, "epoch": 3259} {"train_loss": -25.23033905029297, "global_step": 270518, "epoch": 3259} {"train_loss": -25.36998176574707, "global_step": 270519, "epoch": 3259} {"train_loss": -24.855749130249023, "global_step": 270520, "epoch": 3259} {"train_loss": -25.351932525634766, "global_step": 270521, "epoch": 3259} {"train_loss": -25.440826416015625, "global_step": 270522, "epoch": 3259} {"train_loss": -25.393054962158203, "global_step": 270523, "epoch": 3259} {"train_loss": -25.383039474487305, "global_step": 270524, "epoch": 3259} {"train_loss": -25.495248794555664, "global_step": 270525, "epoch": 3259} {"train_loss": -25.360036849975586, "global_step": 270526, "epoch": 3259} {"train_loss": -25.335586547851562, "global_step": 270527, "epoch": 3259} {"train_loss": -25.92005729675293, "global_step": 270528, "epoch": 3259} {"train_loss": -25.441640853881836, "global_step": 270529, "epoch": 3259} {"train_loss": -25.43211555480957, "global_step": 270530, "epoch": 3259} {"train_loss": -25.44977378845215, "global_step": 270531, "epoch": 3259} {"train_loss": -25.36261749267578, "global_step": 270532, "epoch": 3259} {"train_loss": -25.447845458984375, "global_step": 270533, "epoch": 3259} {"train_loss": -25.33851432800293, "global_step": 270534, "epoch": 3259} {"train_loss": -25.174680709838867, "global_step": 270535, "epoch": 3259} {"train_loss": -25.165197372436523, "global_step": 270536, "epoch": 3259} {"train_loss": -25.386341094970703, "global_step": 270537, "epoch": 3259} {"train_loss": -25.28583335876465, "global_step": 270538, "epoch": 3259} {"train_loss": -25.484785079956055, "global_step": 270539, "epoch": 3259} {"train_loss": -25.525287628173828, "global_step": 270540, "epoch": 3259} {"train_loss": -25.439964294433594, "global_step": 270541, "epoch": 3259} {"train_loss": -25.189268112182617, "global_step": 270542, "epoch": 3259} {"train_loss": -25.605310440063477, "global_step": 270543, "epoch": 3259} {"train_loss": -25.517051696777344, "global_step": 270544, "epoch": 3259} {"train_loss": -25.209653854370117, "global_step": 270545, "epoch": 3259} {"train_loss": -25.496496200561523, "global_step": 270546, "epoch": 3259} {"train_loss": -25.227468490600586, "global_step": 270547, "epoch": 3259} {"train_loss": -25.5860538482666, "global_step": 270548, "epoch": 3259} {"train_loss": -25.2436580657959, "global_step": 270549, "epoch": 3259} {"train_loss": -25.787220001220703, "global_step": 270550, "epoch": 3259} {"train_loss": -25.487138748168945, "global_step": 270551, "epoch": 3259} {"train_loss": -25.553653717041016, "global_step": 270552, "epoch": 3259} {"train_loss": -25.9576358795166, "global_step": 270553, "epoch": 3259} {"train_loss": -25.631179809570312, "global_step": 270554, "epoch": 3259} {"train_loss": -25.26172637939453, "global_step": 270555, "epoch": 3259} {"train_loss": -25.162446975708008, "global_step": 270556, "epoch": 3259} {"train_loss": -25.047443389892578, "global_step": 270557, "epoch": 3259} {"train_loss": -25.06712532043457, "global_step": 270558, "epoch": 3259} {"train_loss": -25.332773208618164, "global_step": 270559, "epoch": 3259} {"train_loss": -25.229572296142578, "global_step": 270560, "epoch": 3259} {"train_loss": -25.406261444091797, "global_step": 270561, "epoch": 3259} {"train_loss": -25.29674530029297, "global_step": 270562, "epoch": 3259} {"train_loss": -25.333749771118164, "global_step": 270563, "epoch": 3259} {"train_loss": -25.29879379272461, "global_step": 270564, "epoch": 3259} {"train_loss": -25.17671775817871, "global_step": 270565, "epoch": 3259} {"train_loss": -25.02342414855957, "global_step": 270566, "epoch": 3259} {"train_loss": -25.189868927001953, "global_step": 270567, "epoch": 3259} {"train_loss": -25.515270233154297, "global_step": 270568, "epoch": 3259} {"train_loss": -24.904470443725586, "global_step": 270569, "epoch": 3259} {"train_loss": -25.15176773071289, "global_step": 270570, "epoch": 3259} {"train_loss": -25.00884437561035, "global_step": 270571, "epoch": 3259} {"train_loss": -25.350276947021484, "global_step": 270572, "epoch": 3259} {"train_loss": -25.22365951538086, "global_step": 270573, "epoch": 3259} {"train_loss": -25.152021408081055, "global_step": 270574, "epoch": 3259} {"train_loss": -25.64859962463379, "global_step": 270575, "epoch": 3259} {"train_loss": -25.159034729003906, "global_step": 270576, "epoch": 3259} {"train_loss": -25.381376266479492, "global_step": 270577, "epoch": 3259} {"train_loss": -25.137527465820312, "global_step": 270578, "epoch": 3259} {"train_loss": -25.245973426175404, "global_step": 270579, "epoch": 3259, "val_loss": 6919086.0} {"train_loss": -25.03306007385254, "global_step": 270580, "epoch": 3260} {"train_loss": -25.361989974975586, "global_step": 270581, "epoch": 3260} {"train_loss": -24.81939697265625, "global_step": 270582, "epoch": 3260} {"train_loss": -24.931325912475586, "global_step": 270583, "epoch": 3260} {"train_loss": -24.850677490234375, "global_step": 270584, "epoch": 3260} {"train_loss": -25.2130126953125, "global_step": 270585, "epoch": 3260} {"train_loss": -25.15340232849121, "global_step": 270586, "epoch": 3260} {"train_loss": -24.79327964782715, "global_step": 270587, "epoch": 3260} {"train_loss": -24.9852294921875, "global_step": 270588, "epoch": 3260} {"train_loss": -24.872243881225586, "global_step": 270589, "epoch": 3260} {"train_loss": -24.87928009033203, "global_step": 270590, "epoch": 3260} {"train_loss": -24.689695358276367, "global_step": 270591, "epoch": 3260} {"train_loss": -24.667673110961914, "global_step": 270592, "epoch": 3260} {"train_loss": -24.94098663330078, "global_step": 270593, "epoch": 3260} {"train_loss": -25.011701583862305, "global_step": 270594, "epoch": 3260} {"train_loss": -24.290433883666992, "global_step": 270595, "epoch": 3260} {"train_loss": -25.199636459350586, "global_step": 270596, "epoch": 3260} {"train_loss": -25.25064468383789, "global_step": 270597, "epoch": 3260} {"train_loss": -24.850645065307617, "global_step": 270598, "epoch": 3260} {"train_loss": -24.87856101989746, "global_step": 270599, "epoch": 3260} {"train_loss": -24.983327865600586, "global_step": 270600, "epoch": 3260} {"train_loss": -24.877399444580078, "global_step": 270601, "epoch": 3260} {"train_loss": -25.176816940307617, "global_step": 270602, "epoch": 3260} {"train_loss": -24.960195541381836, "global_step": 270603, "epoch": 3260} {"train_loss": -25.22684097290039, "global_step": 270604, "epoch": 3260} {"train_loss": -25.014188766479492, "global_step": 270605, "epoch": 3260} {"train_loss": -25.18889045715332, "global_step": 270606, "epoch": 3260} {"train_loss": -25.215618133544922, "global_step": 270607, "epoch": 3260} {"train_loss": -25.326120376586914, "global_step": 270608, "epoch": 3260} {"train_loss": -25.20015525817871, "global_step": 270609, "epoch": 3260} {"train_loss": -25.447681427001953, "global_step": 270610, "epoch": 3260} {"train_loss": -24.93170738220215, "global_step": 270611, "epoch": 3260} {"train_loss": -25.603851318359375, "global_step": 270612, "epoch": 3260} {"train_loss": -25.43707275390625, "global_step": 270613, "epoch": 3260} {"train_loss": -25.137083053588867, "global_step": 270614, "epoch": 3260} {"train_loss": -24.964635848999023, "global_step": 270615, "epoch": 3260} {"train_loss": -25.288101196289062, "global_step": 270616, "epoch": 3260} {"train_loss": -25.6019287109375, "global_step": 270617, "epoch": 3260} {"train_loss": -25.645002365112305, "global_step": 270618, "epoch": 3260} {"train_loss": -25.351613998413086, "global_step": 270619, "epoch": 3260} {"train_loss": -25.473094940185547, "global_step": 270620, "epoch": 3260} {"train_loss": -25.27073097229004, "global_step": 270621, "epoch": 3260} {"train_loss": -25.239948272705078, "global_step": 270622, "epoch": 3260} {"train_loss": -25.46402359008789, "global_step": 270623, "epoch": 3260} {"train_loss": -25.49713706970215, "global_step": 270624, "epoch": 3260} {"train_loss": -25.491811752319336, "global_step": 270625, "epoch": 3260} {"train_loss": -25.730432510375977, "global_step": 270626, "epoch": 3260} {"train_loss": -25.353782653808594, "global_step": 270627, "epoch": 3260} {"train_loss": -25.335844039916992, "global_step": 270628, "epoch": 3260} {"train_loss": -25.133275985717773, "global_step": 270629, "epoch": 3260} {"train_loss": -25.092205047607422, "global_step": 270630, "epoch": 3260} {"train_loss": -24.830732345581055, "global_step": 270631, "epoch": 3260} {"train_loss": -24.55840492248535, "global_step": 270632, "epoch": 3260} {"train_loss": -24.63995933532715, "global_step": 270633, "epoch": 3260} {"train_loss": -24.985578536987305, "global_step": 270634, "epoch": 3260} {"train_loss": -25.235755920410156, "global_step": 270635, "epoch": 3260} {"train_loss": -25.045814514160156, "global_step": 270636, "epoch": 3260} {"train_loss": -25.20380973815918, "global_step": 270637, "epoch": 3260} {"train_loss": -25.311134338378906, "global_step": 270638, "epoch": 3260} {"train_loss": -24.88215446472168, "global_step": 270639, "epoch": 3260} {"train_loss": -25.45881462097168, "global_step": 270640, "epoch": 3260} {"train_loss": -25.12099266052246, "global_step": 270641, "epoch": 3260} {"train_loss": -25.312429428100586, "global_step": 270642, "epoch": 3260} {"train_loss": -24.978086471557617, "global_step": 270643, "epoch": 3260} {"train_loss": -25.14073371887207, "global_step": 270644, "epoch": 3260} {"train_loss": -25.16610336303711, "global_step": 270645, "epoch": 3260} {"train_loss": -25.48997688293457, "global_step": 270646, "epoch": 3260} {"train_loss": -25.02274513244629, "global_step": 270647, "epoch": 3260} {"train_loss": -25.33489227294922, "global_step": 270648, "epoch": 3260} {"train_loss": -25.36930274963379, "global_step": 270649, "epoch": 3260} {"train_loss": -25.357091903686523, "global_step": 270650, "epoch": 3260} {"train_loss": -25.328969955444336, "global_step": 270651, "epoch": 3260} {"train_loss": -25.3248348236084, "global_step": 270652, "epoch": 3260} {"train_loss": -25.067331314086914, "global_step": 270653, "epoch": 3260} {"train_loss": -25.35127067565918, "global_step": 270654, "epoch": 3260} {"train_loss": -25.068599700927734, "global_step": 270655, "epoch": 3260} {"train_loss": -25.142417907714844, "global_step": 270656, "epoch": 3260} {"train_loss": -25.146657943725586, "global_step": 270657, "epoch": 3260} {"train_loss": -25.480697631835938, "global_step": 270658, "epoch": 3260} {"train_loss": -24.995683670043945, "global_step": 270659, "epoch": 3260} {"train_loss": -25.10504150390625, "global_step": 270660, "epoch": 3260} {"train_loss": -25.507495880126953, "global_step": 270661, "epoch": 3260} {"train_loss": -25.16092259050852, "global_step": 270662, "epoch": 3260, "val_loss": 7003898.0} {"train_loss": -25.116016387939453, "global_step": 270663, "epoch": 3261} {"train_loss": -24.762557983398438, "global_step": 270664, "epoch": 3261} {"train_loss": -25.001813888549805, "global_step": 270665, "epoch": 3261} {"train_loss": -25.034503936767578, "global_step": 270666, "epoch": 3261} {"train_loss": -24.930828094482422, "global_step": 270667, "epoch": 3261} {"train_loss": -25.229625701904297, "global_step": 270668, "epoch": 3261} {"train_loss": -24.674396514892578, "global_step": 270669, "epoch": 3261} {"train_loss": -25.052295684814453, "global_step": 270670, "epoch": 3261} {"train_loss": -25.32513999938965, "global_step": 270671, "epoch": 3261} {"train_loss": -25.153623580932617, "global_step": 270672, "epoch": 3261} {"train_loss": -24.85692596435547, "global_step": 270673, "epoch": 3261} {"train_loss": -25.233352661132812, "global_step": 270674, "epoch": 3261} {"train_loss": -25.135910034179688, "global_step": 270675, "epoch": 3261} {"train_loss": -25.53678321838379, "global_step": 270676, "epoch": 3261} {"train_loss": -25.05161476135254, "global_step": 270677, "epoch": 3261} {"train_loss": -25.03044891357422, "global_step": 270678, "epoch": 3261} {"train_loss": -25.107379913330078, "global_step": 270679, "epoch": 3261} {"train_loss": -25.61665916442871, "global_step": 270680, "epoch": 3261} {"train_loss": -25.22193717956543, "global_step": 270681, "epoch": 3261} {"train_loss": -25.326770782470703, "global_step": 270682, "epoch": 3261} {"train_loss": -25.465124130249023, "global_step": 270683, "epoch": 3261} {"train_loss": -25.27768325805664, "global_step": 270684, "epoch": 3261} {"train_loss": -25.568387985229492, "global_step": 270685, "epoch": 3261} {"train_loss": -25.325822830200195, "global_step": 270686, "epoch": 3261} {"train_loss": -25.357120513916016, "global_step": 270687, "epoch": 3261} {"train_loss": -25.080081939697266, "global_step": 270688, "epoch": 3261} {"train_loss": -25.11508560180664, "global_step": 270689, "epoch": 3261} {"train_loss": -25.74053382873535, "global_step": 270690, "epoch": 3261} {"train_loss": -24.9825382232666, "global_step": 270691, "epoch": 3261} {"train_loss": -25.672088623046875, "global_step": 270692, "epoch": 3261} {"train_loss": -25.31464958190918, "global_step": 270693, "epoch": 3261} {"train_loss": -25.495134353637695, "global_step": 270694, "epoch": 3261} {"train_loss": -25.110029220581055, "global_step": 270695, "epoch": 3261} {"train_loss": -25.497159957885742, "global_step": 270696, "epoch": 3261} {"train_loss": -25.19085693359375, "global_step": 270697, "epoch": 3261} {"train_loss": -25.31777000427246, "global_step": 270698, "epoch": 3261} {"train_loss": -25.132854461669922, "global_step": 270699, "epoch": 3261} {"train_loss": -25.24557876586914, "global_step": 270700, "epoch": 3261} {"train_loss": -25.478219985961914, "global_step": 270701, "epoch": 3261} {"train_loss": -24.97827911376953, "global_step": 270702, "epoch": 3261} {"train_loss": -25.6060791015625, "global_step": 270703, "epoch": 3261} {"train_loss": -25.407066345214844, "global_step": 270704, "epoch": 3261} {"train_loss": -25.418949127197266, "global_step": 270705, "epoch": 3261} {"train_loss": -25.511783599853516, "global_step": 270706, "epoch": 3261} {"train_loss": -25.637266159057617, "global_step": 270707, "epoch": 3261} {"train_loss": -25.690662384033203, "global_step": 270708, "epoch": 3261} {"train_loss": -25.262653350830078, "global_step": 270709, "epoch": 3261} {"train_loss": -25.374685287475586, "global_step": 270710, "epoch": 3261} {"train_loss": -25.405029296875, "global_step": 270711, "epoch": 3261} {"train_loss": -24.982229232788086, "global_step": 270712, "epoch": 3261} {"train_loss": -25.109786987304688, "global_step": 270713, "epoch": 3261} {"train_loss": -25.080900192260742, "global_step": 270714, "epoch": 3261} {"train_loss": -24.933496475219727, "global_step": 270715, "epoch": 3261} {"train_loss": -25.467838287353516, "global_step": 270716, "epoch": 3261} {"train_loss": -25.036714553833008, "global_step": 270717, "epoch": 3261} {"train_loss": -25.347469329833984, "global_step": 270718, "epoch": 3261} {"train_loss": -25.48395538330078, "global_step": 270719, "epoch": 3261} {"train_loss": -25.562246322631836, "global_step": 270720, "epoch": 3261} {"train_loss": -25.378009796142578, "global_step": 270721, "epoch": 3261} {"train_loss": -25.238037109375, "global_step": 270722, "epoch": 3261} {"train_loss": -25.478727340698242, "global_step": 270723, "epoch": 3261} {"train_loss": -25.335851669311523, "global_step": 270724, "epoch": 3261} {"train_loss": -25.302906036376953, "global_step": 270725, "epoch": 3261} {"train_loss": -24.993703842163086, "global_step": 270726, "epoch": 3261} {"train_loss": -24.913516998291016, "global_step": 270727, "epoch": 3261} {"train_loss": -25.4456729888916, "global_step": 270728, "epoch": 3261} {"train_loss": -25.541044235229492, "global_step": 270729, "epoch": 3261} {"train_loss": -25.47060775756836, "global_step": 270730, "epoch": 3261} {"train_loss": -25.209583282470703, "global_step": 270731, "epoch": 3261} {"train_loss": -25.354703903198242, "global_step": 270732, "epoch": 3261} {"train_loss": -25.373926162719727, "global_step": 270733, "epoch": 3261} {"train_loss": -25.262649536132812, "global_step": 270734, "epoch": 3261} {"train_loss": -25.189353942871094, "global_step": 270735, "epoch": 3261} {"train_loss": -25.185678482055664, "global_step": 270736, "epoch": 3261} {"train_loss": -25.024534225463867, "global_step": 270737, "epoch": 3261} {"train_loss": -25.52182388305664, "global_step": 270738, "epoch": 3261} {"train_loss": -25.622760772705078, "global_step": 270739, "epoch": 3261} {"train_loss": -24.925596237182617, "global_step": 270740, "epoch": 3261} {"train_loss": -25.56196403503418, "global_step": 270741, "epoch": 3261} {"train_loss": -25.15058708190918, "global_step": 270742, "epoch": 3261} {"train_loss": -25.194927215576172, "global_step": 270743, "epoch": 3261} {"train_loss": -25.030292510986328, "global_step": 270744, "epoch": 3261} {"train_loss": -25.249705647847737, "global_step": 270745, "epoch": 3261, "val_loss": 7117182.0} {"train_loss": -24.715656280517578, "global_step": 270746, "epoch": 3262} {"train_loss": -24.684926986694336, "global_step": 270747, "epoch": 3262} {"train_loss": -25.428516387939453, "global_step": 270748, "epoch": 3262} {"train_loss": -24.451749801635742, "global_step": 270749, "epoch": 3262} {"train_loss": -25.013431549072266, "global_step": 270750, "epoch": 3262} {"train_loss": -24.873079299926758, "global_step": 270751, "epoch": 3262} {"train_loss": -24.7624454498291, "global_step": 270752, "epoch": 3262} {"train_loss": -24.591325759887695, "global_step": 270753, "epoch": 3262} {"train_loss": -25.12308120727539, "global_step": 270754, "epoch": 3262} {"train_loss": -24.776508331298828, "global_step": 270755, "epoch": 3262} {"train_loss": -24.742162704467773, "global_step": 270756, "epoch": 3262} {"train_loss": -25.033727645874023, "global_step": 270757, "epoch": 3262} {"train_loss": -24.96346092224121, "global_step": 270758, "epoch": 3262} {"train_loss": -25.2496395111084, "global_step": 270759, "epoch": 3262} {"train_loss": -25.181350708007812, "global_step": 270760, "epoch": 3262} {"train_loss": -24.994882583618164, "global_step": 270761, "epoch": 3262} {"train_loss": -25.060224533081055, "global_step": 270762, "epoch": 3262} {"train_loss": -25.417322158813477, "global_step": 270763, "epoch": 3262} {"train_loss": -24.947599411010742, "global_step": 270764, "epoch": 3262} {"train_loss": -25.048852920532227, "global_step": 270765, "epoch": 3262} {"train_loss": -25.214900970458984, "global_step": 270766, "epoch": 3262} {"train_loss": -25.10491943359375, "global_step": 270767, "epoch": 3262} {"train_loss": -25.57924461364746, "global_step": 270768, "epoch": 3262} {"train_loss": -25.620962142944336, "global_step": 270769, "epoch": 3262} {"train_loss": -25.173730850219727, "global_step": 270770, "epoch": 3262} {"train_loss": -25.351972579956055, "global_step": 270771, "epoch": 3262} {"train_loss": -25.23284912109375, "global_step": 270772, "epoch": 3262} {"train_loss": -25.551488876342773, "global_step": 270773, "epoch": 3262} {"train_loss": -25.561084747314453, "global_step": 270774, "epoch": 3262} {"train_loss": -25.326047897338867, "global_step": 270775, "epoch": 3262} {"train_loss": -25.239856719970703, "global_step": 270776, "epoch": 3262} {"train_loss": -25.238054275512695, "global_step": 270777, "epoch": 3262} {"train_loss": -25.13722038269043, "global_step": 270778, "epoch": 3262} {"train_loss": -25.320486068725586, "global_step": 270779, "epoch": 3262} {"train_loss": -25.171010971069336, "global_step": 270780, "epoch": 3262} {"train_loss": -25.45608901977539, "global_step": 270781, "epoch": 3262} {"train_loss": -25.022747039794922, "global_step": 270782, "epoch": 3262} {"train_loss": -25.293603897094727, "global_step": 270783, "epoch": 3262} {"train_loss": -25.254383087158203, "global_step": 270784, "epoch": 3262} {"train_loss": -25.1472110748291, "global_step": 270785, "epoch": 3262} {"train_loss": -25.042585372924805, "global_step": 270786, "epoch": 3262} {"train_loss": -25.292129516601562, "global_step": 270787, "epoch": 3262} {"train_loss": -25.122392654418945, "global_step": 270788, "epoch": 3262} {"train_loss": -25.261415481567383, "global_step": 270789, "epoch": 3262} {"train_loss": -25.421297073364258, "global_step": 270790, "epoch": 3262} {"train_loss": -25.33379554748535, "global_step": 270791, "epoch": 3262} {"train_loss": -25.122760772705078, "global_step": 270792, "epoch": 3262} {"train_loss": -25.347116470336914, "global_step": 270793, "epoch": 3262} {"train_loss": -25.632614135742188, "global_step": 270794, "epoch": 3262} {"train_loss": -25.19904327392578, "global_step": 270795, "epoch": 3262} {"train_loss": -25.007511138916016, "global_step": 270796, "epoch": 3262} {"train_loss": -25.58115005493164, "global_step": 270797, "epoch": 3262} {"train_loss": -25.307506561279297, "global_step": 270798, "epoch": 3262} {"train_loss": -25.39609146118164, "global_step": 270799, "epoch": 3262} {"train_loss": -25.6859073638916, "global_step": 270800, "epoch": 3262} {"train_loss": -25.532163619995117, "global_step": 270801, "epoch": 3262} {"train_loss": -25.216632843017578, "global_step": 270802, "epoch": 3262} {"train_loss": -25.2716064453125, "global_step": 270803, "epoch": 3262} {"train_loss": -25.136465072631836, "global_step": 270804, "epoch": 3262} {"train_loss": -25.455677032470703, "global_step": 270805, "epoch": 3262} {"train_loss": -25.297103881835938, "global_step": 270806, "epoch": 3262} {"train_loss": -25.194114685058594, "global_step": 270807, "epoch": 3262} {"train_loss": -25.26297950744629, "global_step": 270808, "epoch": 3262} {"train_loss": -25.555612564086914, "global_step": 270809, "epoch": 3262} {"train_loss": -24.939800262451172, "global_step": 270810, "epoch": 3262} {"train_loss": -25.29568862915039, "global_step": 270811, "epoch": 3262} {"train_loss": -25.123695373535156, "global_step": 270812, "epoch": 3262} {"train_loss": -25.38289451599121, "global_step": 270813, "epoch": 3262} {"train_loss": -25.29678726196289, "global_step": 270814, "epoch": 3262} {"train_loss": -25.18077850341797, "global_step": 270815, "epoch": 3262} {"train_loss": -25.41534996032715, "global_step": 270816, "epoch": 3262} {"train_loss": -25.308841705322266, "global_step": 270817, "epoch": 3262} {"train_loss": -24.636655807495117, "global_step": 270818, "epoch": 3262} {"train_loss": -25.246047973632812, "global_step": 270819, "epoch": 3262} {"train_loss": -25.179290771484375, "global_step": 270820, "epoch": 3262} {"train_loss": -25.393735885620117, "global_step": 270821, "epoch": 3262} {"train_loss": -25.477094650268555, "global_step": 270822, "epoch": 3262} {"train_loss": -25.53133201599121, "global_step": 270823, "epoch": 3262} {"train_loss": -25.164640426635742, "global_step": 270824, "epoch": 3262} {"train_loss": -25.25128746032715, "global_step": 270825, "epoch": 3262} {"train_loss": -25.39552879333496, "global_step": 270826, "epoch": 3262} {"train_loss": -25.335834503173828, "global_step": 270827, "epoch": 3262} {"train_loss": -25.20806443547628, "global_step": 270828, "epoch": 3262, "val_loss": 6978460.0} {"train_loss": -23.877561569213867, "global_step": 270829, "epoch": 3263} {"train_loss": -23.7896728515625, "global_step": 270830, "epoch": 3263} {"train_loss": -25.31221580505371, "global_step": 270831, "epoch": 3263} {"train_loss": -24.163803100585938, "global_step": 270832, "epoch": 3263} {"train_loss": -24.86298179626465, "global_step": 270833, "epoch": 3263} {"train_loss": -24.431638717651367, "global_step": 270834, "epoch": 3263} {"train_loss": -24.485462188720703, "global_step": 270835, "epoch": 3263} {"train_loss": -24.70558738708496, "global_step": 270836, "epoch": 3263} {"train_loss": -24.526281356811523, "global_step": 270837, "epoch": 3263} {"train_loss": -24.542217254638672, "global_step": 270838, "epoch": 3263} {"train_loss": -24.5640869140625, "global_step": 270839, "epoch": 3263} {"train_loss": -24.757516860961914, "global_step": 270840, "epoch": 3263} {"train_loss": -24.55445671081543, "global_step": 270841, "epoch": 3263} {"train_loss": -24.96699333190918, "global_step": 270842, "epoch": 3263} {"train_loss": -24.810073852539062, "global_step": 270843, "epoch": 3263} {"train_loss": -24.790908813476562, "global_step": 270844, "epoch": 3263} {"train_loss": -24.700483322143555, "global_step": 270845, "epoch": 3263} {"train_loss": -24.501829147338867, "global_step": 270846, "epoch": 3263} {"train_loss": -25.22999382019043, "global_step": 270847, "epoch": 3263} {"train_loss": -25.057584762573242, "global_step": 270848, "epoch": 3263} {"train_loss": -25.236921310424805, "global_step": 270849, "epoch": 3263} {"train_loss": -25.341632843017578, "global_step": 270850, "epoch": 3263} {"train_loss": -25.302799224853516, "global_step": 270851, "epoch": 3263} {"train_loss": -25.262462615966797, "global_step": 270852, "epoch": 3263} {"train_loss": -25.43143653869629, "global_step": 270853, "epoch": 3263} {"train_loss": -25.147336959838867, "global_step": 270854, "epoch": 3263} {"train_loss": -25.389684677124023, "global_step": 270855, "epoch": 3263} {"train_loss": -25.05881690979004, "global_step": 270856, "epoch": 3263} {"train_loss": -25.432119369506836, "global_step": 270857, "epoch": 3263} {"train_loss": -25.484073638916016, "global_step": 270858, "epoch": 3263} {"train_loss": -25.205629348754883, "global_step": 270859, "epoch": 3263} {"train_loss": -24.92975616455078, "global_step": 270860, "epoch": 3263} {"train_loss": -25.684789657592773, "global_step": 270861, "epoch": 3263} {"train_loss": -25.593381881713867, "global_step": 270862, "epoch": 3263} {"train_loss": -24.832366943359375, "global_step": 270863, "epoch": 3263} {"train_loss": -25.43280601501465, "global_step": 270864, "epoch": 3263} {"train_loss": -25.406702041625977, "global_step": 270865, "epoch": 3263} {"train_loss": -25.030176162719727, "global_step": 270866, "epoch": 3263} {"train_loss": -25.26104736328125, "global_step": 270867, "epoch": 3263} {"train_loss": -24.93903923034668, "global_step": 270868, "epoch": 3263} {"train_loss": -25.357248306274414, "global_step": 270869, "epoch": 3263} {"train_loss": -25.43849754333496, "global_step": 270870, "epoch": 3263} {"train_loss": -25.58441734313965, "global_step": 270871, "epoch": 3263} {"train_loss": -25.286373138427734, "global_step": 270872, "epoch": 3263} {"train_loss": -25.409643173217773, "global_step": 270873, "epoch": 3263} {"train_loss": -25.32847785949707, "global_step": 270874, "epoch": 3263} {"train_loss": -25.566593170166016, "global_step": 270875, "epoch": 3263} {"train_loss": -25.21711540222168, "global_step": 270876, "epoch": 3263} {"train_loss": -25.142393112182617, "global_step": 270877, "epoch": 3263} {"train_loss": -25.409204483032227, "global_step": 270878, "epoch": 3263} {"train_loss": -25.423505783081055, "global_step": 270879, "epoch": 3263} {"train_loss": -25.490793228149414, "global_step": 270880, "epoch": 3263} {"train_loss": -25.318302154541016, "global_step": 270881, "epoch": 3263} {"train_loss": -25.484420776367188, "global_step": 270882, "epoch": 3263} {"train_loss": -25.599660873413086, "global_step": 270883, "epoch": 3263} {"train_loss": -25.520854949951172, "global_step": 270884, "epoch": 3263} {"train_loss": -25.723407745361328, "global_step": 270885, "epoch": 3263} {"train_loss": -25.350473403930664, "global_step": 270886, "epoch": 3263} {"train_loss": -25.367359161376953, "global_step": 270887, "epoch": 3263} {"train_loss": -25.5997314453125, "global_step": 270888, "epoch": 3263} {"train_loss": -25.76324462890625, "global_step": 270889, "epoch": 3263} {"train_loss": -25.422788619995117, "global_step": 270890, "epoch": 3263} {"train_loss": -25.815317153930664, "global_step": 270891, "epoch": 3263} {"train_loss": -25.533016204833984, "global_step": 270892, "epoch": 3263} {"train_loss": -24.854394912719727, "global_step": 270893, "epoch": 3263} {"train_loss": -23.612367630004883, "global_step": 270894, "epoch": 3263} {"train_loss": -22.900983810424805, "global_step": 270895, "epoch": 3263} {"train_loss": -22.779977798461914, "global_step": 270896, "epoch": 3263} {"train_loss": -24.669504165649414, "global_step": 270897, "epoch": 3263} {"train_loss": -24.35956382751465, "global_step": 270898, "epoch": 3263} {"train_loss": -24.836017608642578, "global_step": 270899, "epoch": 3263} {"train_loss": -24.411075592041016, "global_step": 270900, "epoch": 3263} {"train_loss": -24.9082088470459, "global_step": 270901, "epoch": 3263} {"train_loss": -24.895526885986328, "global_step": 270902, "epoch": 3263} {"train_loss": -24.89747428894043, "global_step": 270903, "epoch": 3263} {"train_loss": -24.818252563476562, "global_step": 270904, "epoch": 3263} {"train_loss": -24.720233917236328, "global_step": 270905, "epoch": 3263} {"train_loss": -24.63829803466797, "global_step": 270906, "epoch": 3263} {"train_loss": -24.865840911865234, "global_step": 270907, "epoch": 3263} {"train_loss": -24.868127822875977, "global_step": 270908, "epoch": 3263} {"train_loss": -24.90260887145996, "global_step": 270909, "epoch": 3263} {"train_loss": -24.91922950744629, "global_step": 270910, "epoch": 3263} {"train_loss": -24.989003215927674, "global_step": 270911, "epoch": 3263, "val_loss": 6979052.0} {"train_loss": -24.176610946655273, "global_step": 270912, "epoch": 3264} {"train_loss": -24.495595932006836, "global_step": 270913, "epoch": 3264} {"train_loss": -24.38321876525879, "global_step": 270914, "epoch": 3264} {"train_loss": -24.5549259185791, "global_step": 270915, "epoch": 3264} {"train_loss": -24.65217399597168, "global_step": 270916, "epoch": 3264} {"train_loss": -24.425500869750977, "global_step": 270917, "epoch": 3264} {"train_loss": -24.594589233398438, "global_step": 270918, "epoch": 3264} {"train_loss": -24.439594268798828, "global_step": 270919, "epoch": 3264} {"train_loss": -24.669431686401367, "global_step": 270920, "epoch": 3264} {"train_loss": -24.77202606201172, "global_step": 270921, "epoch": 3264} {"train_loss": -25.070314407348633, "global_step": 270922, "epoch": 3264} {"train_loss": -24.825971603393555, "global_step": 270923, "epoch": 3264} {"train_loss": -24.944631576538086, "global_step": 270924, "epoch": 3264} {"train_loss": -25.097562789916992, "global_step": 270925, "epoch": 3264} {"train_loss": -24.88022232055664, "global_step": 270926, "epoch": 3264} {"train_loss": -24.605924606323242, "global_step": 270927, "epoch": 3264} {"train_loss": -24.91423988342285, "global_step": 270928, "epoch": 3264} {"train_loss": -25.06668472290039, "global_step": 270929, "epoch": 3264} {"train_loss": -25.11164665222168, "global_step": 270930, "epoch": 3264} {"train_loss": -25.041034698486328, "global_step": 270931, "epoch": 3264} {"train_loss": -25.120920181274414, "global_step": 270932, "epoch": 3264} {"train_loss": -25.119556427001953, "global_step": 270933, "epoch": 3264} {"train_loss": -25.078439712524414, "global_step": 270934, "epoch": 3264} {"train_loss": -24.98934555053711, "global_step": 270935, "epoch": 3264} {"train_loss": -25.176725387573242, "global_step": 270936, "epoch": 3264} {"train_loss": -25.02294921875, "global_step": 270937, "epoch": 3264} {"train_loss": -25.174951553344727, "global_step": 270938, "epoch": 3264} {"train_loss": -25.503793716430664, "global_step": 270939, "epoch": 3264} {"train_loss": -24.887500762939453, "global_step": 270940, "epoch": 3264} {"train_loss": -25.266048431396484, "global_step": 270941, "epoch": 3264} {"train_loss": -25.18940544128418, "global_step": 270942, "epoch": 3264} {"train_loss": -24.945775985717773, "global_step": 270943, "epoch": 3264} {"train_loss": -25.026275634765625, "global_step": 270944, "epoch": 3264} {"train_loss": -25.837528228759766, "global_step": 270945, "epoch": 3264} {"train_loss": -25.673837661743164, "global_step": 270946, "epoch": 3264} {"train_loss": -25.695859909057617, "global_step": 270947, "epoch": 3264} {"train_loss": -25.21222686767578, "global_step": 270948, "epoch": 3264} {"train_loss": -25.08688735961914, "global_step": 270949, "epoch": 3264} {"train_loss": -24.936445236206055, "global_step": 270950, "epoch": 3264} {"train_loss": -25.605039596557617, "global_step": 270951, "epoch": 3264} {"train_loss": -25.22698211669922, "global_step": 270952, "epoch": 3264} {"train_loss": -25.167707443237305, "global_step": 270953, "epoch": 3264} {"train_loss": -25.298233032226562, "global_step": 270954, "epoch": 3264} {"train_loss": -25.072341918945312, "global_step": 270955, "epoch": 3264} {"train_loss": -25.331056594848633, "global_step": 270956, "epoch": 3264} {"train_loss": -25.507030487060547, "global_step": 270957, "epoch": 3264} {"train_loss": -25.377334594726562, "global_step": 270958, "epoch": 3264} {"train_loss": -25.598203659057617, "global_step": 270959, "epoch": 3264} {"train_loss": -25.205110549926758, "global_step": 270960, "epoch": 3264} {"train_loss": -25.465147018432617, "global_step": 270961, "epoch": 3264} {"train_loss": -25.28541374206543, "global_step": 270962, "epoch": 3264} {"train_loss": -25.36575698852539, "global_step": 270963, "epoch": 3264} {"train_loss": -25.244922637939453, "global_step": 270964, "epoch": 3264} {"train_loss": -25.440086364746094, "global_step": 270965, "epoch": 3264} {"train_loss": -25.725290298461914, "global_step": 270966, "epoch": 3264} {"train_loss": -25.405424118041992, "global_step": 270967, "epoch": 3264} {"train_loss": -25.425064086914062, "global_step": 270968, "epoch": 3264} {"train_loss": -25.604909896850586, "global_step": 270969, "epoch": 3264} {"train_loss": -25.558658599853516, "global_step": 270970, "epoch": 3264} {"train_loss": -25.533618927001953, "global_step": 270971, "epoch": 3264} {"train_loss": -25.351882934570312, "global_step": 270972, "epoch": 3264} {"train_loss": -25.129100799560547, "global_step": 270973, "epoch": 3264} {"train_loss": -25.090534210205078, "global_step": 270974, "epoch": 3264} {"train_loss": -25.20294761657715, "global_step": 270975, "epoch": 3264} {"train_loss": -25.482074737548828, "global_step": 270976, "epoch": 3264} {"train_loss": -25.347261428833008, "global_step": 270977, "epoch": 3264} {"train_loss": -25.34756088256836, "global_step": 270978, "epoch": 3264} {"train_loss": -25.163312911987305, "global_step": 270979, "epoch": 3264} {"train_loss": -25.44432258605957, "global_step": 270980, "epoch": 3264} {"train_loss": -25.43297576904297, "global_step": 270981, "epoch": 3264} {"train_loss": -25.377534866333008, "global_step": 270982, "epoch": 3264} {"train_loss": -25.25678825378418, "global_step": 270983, "epoch": 3264} {"train_loss": -25.332414627075195, "global_step": 270984, "epoch": 3264} {"train_loss": -25.2764949798584, "global_step": 270985, "epoch": 3264} {"train_loss": -24.956106185913086, "global_step": 270986, "epoch": 3264} {"train_loss": -25.36458396911621, "global_step": 270987, "epoch": 3264} {"train_loss": -24.871660232543945, "global_step": 270988, "epoch": 3264} {"train_loss": -25.448394775390625, "global_step": 270989, "epoch": 3264} {"train_loss": -25.686059951782227, "global_step": 270990, "epoch": 3264} {"train_loss": -25.25617027282715, "global_step": 270991, "epoch": 3264} {"train_loss": -25.451223373413086, "global_step": 270992, "epoch": 3264} {"train_loss": -25.64692497253418, "global_step": 270993, "epoch": 3264} {"train_loss": -25.159712228430323, "global_step": 270994, "epoch": 3264, "val_loss": 6993491.0} {"train_loss": -25.10282325744629, "global_step": 270995, "epoch": 3265} {"train_loss": -24.785123825073242, "global_step": 270996, "epoch": 3265} {"train_loss": -24.949729919433594, "global_step": 270997, "epoch": 3265} {"train_loss": -25.091049194335938, "global_step": 270998, "epoch": 3265} {"train_loss": -25.474876403808594, "global_step": 270999, "epoch": 3265} {"train_loss": -25.069616317749023, "global_step": 271000, "epoch": 3265} {"train_loss": -24.840818405151367, "global_step": 271001, "epoch": 3265} {"train_loss": -25.311979293823242, "global_step": 271002, "epoch": 3265} {"train_loss": -25.166728973388672, "global_step": 271003, "epoch": 3265} {"train_loss": -24.98814582824707, "global_step": 271004, "epoch": 3265} {"train_loss": -25.068403244018555, "global_step": 271005, "epoch": 3265} {"train_loss": -25.1673583984375, "global_step": 271006, "epoch": 3265} {"train_loss": -25.010025024414062, "global_step": 271007, "epoch": 3265} {"train_loss": -25.00764274597168, "global_step": 271008, "epoch": 3265} {"train_loss": -25.229108810424805, "global_step": 271009, "epoch": 3265} {"train_loss": -25.2165584564209, "global_step": 271010, "epoch": 3265} {"train_loss": -25.379745483398438, "global_step": 271011, "epoch": 3265} {"train_loss": -25.145549774169922, "global_step": 271012, "epoch": 3265} {"train_loss": -24.92070198059082, "global_step": 271013, "epoch": 3265} {"train_loss": -25.694595336914062, "global_step": 271014, "epoch": 3265} {"train_loss": -25.237808227539062, "global_step": 271015, "epoch": 3265} {"train_loss": -25.25971031188965, "global_step": 271016, "epoch": 3265} {"train_loss": -25.52918815612793, "global_step": 271017, "epoch": 3265} {"train_loss": -25.413278579711914, "global_step": 271018, "epoch": 3265} {"train_loss": -25.342945098876953, "global_step": 271019, "epoch": 3265} {"train_loss": -25.303171157836914, "global_step": 271020, "epoch": 3265} {"train_loss": -25.913721084594727, "global_step": 271021, "epoch": 3265} {"train_loss": -25.633914947509766, "global_step": 271022, "epoch": 3265} {"train_loss": -25.336050033569336, "global_step": 271023, "epoch": 3265} {"train_loss": -25.735034942626953, "global_step": 271024, "epoch": 3265} {"train_loss": -25.31099510192871, "global_step": 271025, "epoch": 3265} {"train_loss": -25.06699562072754, "global_step": 271026, "epoch": 3265} {"train_loss": -25.15494728088379, "global_step": 271027, "epoch": 3265} {"train_loss": -25.563888549804688, "global_step": 271028, "epoch": 3265} {"train_loss": -25.38230323791504, "global_step": 271029, "epoch": 3265} {"train_loss": -25.261882781982422, "global_step": 271030, "epoch": 3265} {"train_loss": -25.875091552734375, "global_step": 271031, "epoch": 3265} {"train_loss": -25.54280662536621, "global_step": 271032, "epoch": 3265} {"train_loss": -25.405202865600586, "global_step": 271033, "epoch": 3265} {"train_loss": -25.2819766998291, "global_step": 271034, "epoch": 3265} {"train_loss": -25.202266693115234, "global_step": 271035, "epoch": 3265} {"train_loss": -25.285505294799805, "global_step": 271036, "epoch": 3265} {"train_loss": -25.523502349853516, "global_step": 271037, "epoch": 3265} {"train_loss": -25.1267147064209, "global_step": 271038, "epoch": 3265} {"train_loss": -25.140905380249023, "global_step": 271039, "epoch": 3265} {"train_loss": -24.965620040893555, "global_step": 271040, "epoch": 3265} {"train_loss": -24.81715202331543, "global_step": 271041, "epoch": 3265} {"train_loss": -25.536413192749023, "global_step": 271042, "epoch": 3265} {"train_loss": -25.260242462158203, "global_step": 271043, "epoch": 3265} {"train_loss": -24.94459342956543, "global_step": 271044, "epoch": 3265} {"train_loss": -25.089399337768555, "global_step": 271045, "epoch": 3265} {"train_loss": -25.835559844970703, "global_step": 271046, "epoch": 3265} {"train_loss": -25.07807731628418, "global_step": 271047, "epoch": 3265} {"train_loss": -25.463367462158203, "global_step": 271048, "epoch": 3265} {"train_loss": -25.20814323425293, "global_step": 271049, "epoch": 3265} {"train_loss": -24.938194274902344, "global_step": 271050, "epoch": 3265} {"train_loss": -25.111684799194336, "global_step": 271051, "epoch": 3265} {"train_loss": -24.617456436157227, "global_step": 271052, "epoch": 3265} {"train_loss": -25.022260665893555, "global_step": 271053, "epoch": 3265} {"train_loss": -25.1812686920166, "global_step": 271054, "epoch": 3265} {"train_loss": -24.94746208190918, "global_step": 271055, "epoch": 3265} {"train_loss": -25.33088493347168, "global_step": 271056, "epoch": 3265} {"train_loss": -25.26312828063965, "global_step": 271057, "epoch": 3265} {"train_loss": -24.8861141204834, "global_step": 271058, "epoch": 3265} {"train_loss": -24.88677406311035, "global_step": 271059, "epoch": 3265} {"train_loss": -25.497377395629883, "global_step": 271060, "epoch": 3265} {"train_loss": -25.265932083129883, "global_step": 271061, "epoch": 3265} {"train_loss": -24.80914306640625, "global_step": 271062, "epoch": 3265} {"train_loss": -25.15644645690918, "global_step": 271063, "epoch": 3265} {"train_loss": -24.927228927612305, "global_step": 271064, "epoch": 3265} {"train_loss": -25.02351188659668, "global_step": 271065, "epoch": 3265} {"train_loss": -24.854936599731445, "global_step": 271066, "epoch": 3265} {"train_loss": -25.23163604736328, "global_step": 271067, "epoch": 3265} {"train_loss": -25.41212272644043, "global_step": 271068, "epoch": 3265} {"train_loss": -24.990812301635742, "global_step": 271069, "epoch": 3265} {"train_loss": -25.20863914489746, "global_step": 271070, "epoch": 3265} {"train_loss": -25.17854118347168, "global_step": 271071, "epoch": 3265} {"train_loss": -25.10430335998535, "global_step": 271072, "epoch": 3265} {"train_loss": -25.25357437133789, "global_step": 271073, "epoch": 3265} {"train_loss": -24.548988342285156, "global_step": 271074, "epoch": 3265} {"train_loss": -25.325439453125, "global_step": 271075, "epoch": 3265} {"train_loss": -25.515329360961914, "global_step": 271076, "epoch": 3265} {"train_loss": -25.204822907964868, "global_step": 271077, "epoch": 3265, "val_loss": 6962039.0} {"train_loss": -24.46006965637207, "global_step": 271078, "epoch": 3266} {"train_loss": -24.95314598083496, "global_step": 271079, "epoch": 3266} {"train_loss": -24.793655395507812, "global_step": 271080, "epoch": 3266} {"train_loss": -24.943218231201172, "global_step": 271081, "epoch": 3266} {"train_loss": -25.078189849853516, "global_step": 271082, "epoch": 3266} {"train_loss": -24.98652458190918, "global_step": 271083, "epoch": 3266} {"train_loss": -25.189287185668945, "global_step": 271084, "epoch": 3266} {"train_loss": -25.2216796875, "global_step": 271085, "epoch": 3266} {"train_loss": -25.023269653320312, "global_step": 271086, "epoch": 3266} {"train_loss": -25.04599380493164, "global_step": 271087, "epoch": 3266} {"train_loss": -24.787546157836914, "global_step": 271088, "epoch": 3266} {"train_loss": -25.310516357421875, "global_step": 271089, "epoch": 3266} {"train_loss": -25.336042404174805, "global_step": 271090, "epoch": 3266} {"train_loss": -24.918655395507812, "global_step": 271091, "epoch": 3266} {"train_loss": -24.775793075561523, "global_step": 271092, "epoch": 3266} {"train_loss": -25.363248825073242, "global_step": 271093, "epoch": 3266} {"train_loss": -25.341405868530273, "global_step": 271094, "epoch": 3266} {"train_loss": -25.23451042175293, "global_step": 271095, "epoch": 3266} {"train_loss": -25.23797607421875, "global_step": 271096, "epoch": 3266} {"train_loss": -25.32777214050293, "global_step": 271097, "epoch": 3266} {"train_loss": -25.321104049682617, "global_step": 271098, "epoch": 3266} {"train_loss": -25.010698318481445, "global_step": 271099, "epoch": 3266} {"train_loss": -25.21919822692871, "global_step": 271100, "epoch": 3266} {"train_loss": -25.39896011352539, "global_step": 271101, "epoch": 3266} {"train_loss": -25.175546646118164, "global_step": 271102, "epoch": 3266} {"train_loss": -25.458417892456055, "global_step": 271103, "epoch": 3266} {"train_loss": -25.29456901550293, "global_step": 271104, "epoch": 3266} {"train_loss": -25.398624420166016, "global_step": 271105, "epoch": 3266} {"train_loss": -25.130552291870117, "global_step": 271106, "epoch": 3266} {"train_loss": -25.28343963623047, "global_step": 271107, "epoch": 3266} {"train_loss": -25.374469757080078, "global_step": 271108, "epoch": 3266} {"train_loss": -25.161483764648438, "global_step": 271109, "epoch": 3266} {"train_loss": -25.278152465820312, "global_step": 271110, "epoch": 3266} {"train_loss": -25.722288131713867, "global_step": 271111, "epoch": 3266} {"train_loss": -25.34205436706543, "global_step": 271112, "epoch": 3266} {"train_loss": -25.114614486694336, "global_step": 271113, "epoch": 3266} {"train_loss": -25.071386337280273, "global_step": 271114, "epoch": 3266} {"train_loss": -25.468673706054688, "global_step": 271115, "epoch": 3266} {"train_loss": -25.19179344177246, "global_step": 271116, "epoch": 3266} {"train_loss": -24.916584014892578, "global_step": 271117, "epoch": 3266} {"train_loss": -25.203657150268555, "global_step": 271118, "epoch": 3266} {"train_loss": -25.18027687072754, "global_step": 271119, "epoch": 3266} {"train_loss": -25.24016761779785, "global_step": 271120, "epoch": 3266} {"train_loss": -25.539457321166992, "global_step": 271121, "epoch": 3266} {"train_loss": -25.252079010009766, "global_step": 271122, "epoch": 3266} {"train_loss": -24.92920684814453, "global_step": 271123, "epoch": 3266} {"train_loss": -25.127702713012695, "global_step": 271124, "epoch": 3266} {"train_loss": -25.173738479614258, "global_step": 271125, "epoch": 3266} {"train_loss": -25.13795280456543, "global_step": 271126, "epoch": 3266} {"train_loss": -25.416688919067383, "global_step": 271127, "epoch": 3266} {"train_loss": -25.411020278930664, "global_step": 271128, "epoch": 3266} {"train_loss": -25.327239990234375, "global_step": 271129, "epoch": 3266} {"train_loss": -25.520280838012695, "global_step": 271130, "epoch": 3266} {"train_loss": -25.41530990600586, "global_step": 271131, "epoch": 3266} {"train_loss": -25.2382869720459, "global_step": 271132, "epoch": 3266} {"train_loss": -25.333467483520508, "global_step": 271133, "epoch": 3266} {"train_loss": -25.477746963500977, "global_step": 271134, "epoch": 3266} {"train_loss": -25.42339515686035, "global_step": 271135, "epoch": 3266} {"train_loss": -25.372791290283203, "global_step": 271136, "epoch": 3266} {"train_loss": -25.721149444580078, "global_step": 271137, "epoch": 3266} {"train_loss": -25.38005256652832, "global_step": 271138, "epoch": 3266} {"train_loss": -25.12710952758789, "global_step": 271139, "epoch": 3266} {"train_loss": -25.462732315063477, "global_step": 271140, "epoch": 3266} {"train_loss": -25.080249786376953, "global_step": 271141, "epoch": 3266} {"train_loss": -25.464590072631836, "global_step": 271142, "epoch": 3266} {"train_loss": -25.48587989807129, "global_step": 271143, "epoch": 3266} {"train_loss": -25.313764572143555, "global_step": 271144, "epoch": 3266} {"train_loss": -25.436992645263672, "global_step": 271145, "epoch": 3266} {"train_loss": -25.418258666992188, "global_step": 271146, "epoch": 3266} {"train_loss": -25.475740432739258, "global_step": 271147, "epoch": 3266} {"train_loss": -25.09397315979004, "global_step": 271148, "epoch": 3266} {"train_loss": -24.926847457885742, "global_step": 271149, "epoch": 3266} {"train_loss": -24.891254425048828, "global_step": 271150, "epoch": 3266} {"train_loss": -24.93415641784668, "global_step": 271151, "epoch": 3266} {"train_loss": -24.92599105834961, "global_step": 271152, "epoch": 3266} {"train_loss": -24.804882049560547, "global_step": 271153, "epoch": 3266} {"train_loss": -25.389577865600586, "global_step": 271154, "epoch": 3266} {"train_loss": -25.521320343017578, "global_step": 271155, "epoch": 3266} {"train_loss": -24.982526779174805, "global_step": 271156, "epoch": 3266} {"train_loss": -25.114538192749023, "global_step": 271157, "epoch": 3266} {"train_loss": -25.228134155273438, "global_step": 271158, "epoch": 3266} {"train_loss": -25.06668472290039, "global_step": 271159, "epoch": 3266} {"train_loss": -25.22735005114452, "global_step": 271160, "epoch": 3266, "val_loss": 7175613.5} {"train_loss": -24.15254783630371, "global_step": 271161, "epoch": 3267} {"train_loss": -24.468618392944336, "global_step": 271162, "epoch": 3267} {"train_loss": -24.786855697631836, "global_step": 271163, "epoch": 3267} {"train_loss": -24.16341209411621, "global_step": 271164, "epoch": 3267} {"train_loss": -25.104955673217773, "global_step": 271165, "epoch": 3267} {"train_loss": -24.93914222717285, "global_step": 271166, "epoch": 3267} {"train_loss": -25.246891021728516, "global_step": 271167, "epoch": 3267} {"train_loss": -24.462142944335938, "global_step": 271168, "epoch": 3267} {"train_loss": -24.919153213500977, "global_step": 271169, "epoch": 3267} {"train_loss": -24.822912216186523, "global_step": 271170, "epoch": 3267} {"train_loss": -24.960336685180664, "global_step": 271171, "epoch": 3267} {"train_loss": -24.759443283081055, "global_step": 271172, "epoch": 3267} {"train_loss": -24.51807975769043, "global_step": 271173, "epoch": 3267} {"train_loss": -25.172266006469727, "global_step": 271174, "epoch": 3267} {"train_loss": -24.844865798950195, "global_step": 271175, "epoch": 3267} {"train_loss": -24.879840850830078, "global_step": 271176, "epoch": 3267} {"train_loss": -24.836790084838867, "global_step": 271177, "epoch": 3267} {"train_loss": -25.175954818725586, "global_step": 271178, "epoch": 3267} {"train_loss": -25.144336700439453, "global_step": 271179, "epoch": 3267} {"train_loss": -24.974170684814453, "global_step": 271180, "epoch": 3267} {"train_loss": -24.7343807220459, "global_step": 271181, "epoch": 3267} {"train_loss": -25.245182037353516, "global_step": 271182, "epoch": 3267} {"train_loss": -25.215301513671875, "global_step": 271183, "epoch": 3267} {"train_loss": -25.250778198242188, "global_step": 271184, "epoch": 3267} {"train_loss": -24.793472290039062, "global_step": 271185, "epoch": 3267} {"train_loss": -24.488845825195312, "global_step": 271186, "epoch": 3267} {"train_loss": -24.820560455322266, "global_step": 271187, "epoch": 3267} {"train_loss": -25.024045944213867, "global_step": 271188, "epoch": 3267} {"train_loss": -25.008649826049805, "global_step": 271189, "epoch": 3267} {"train_loss": -25.02479362487793, "global_step": 271190, "epoch": 3267} {"train_loss": -24.726789474487305, "global_step": 271191, "epoch": 3267} {"train_loss": -25.518354415893555, "global_step": 271192, "epoch": 3267} {"train_loss": -25.49995994567871, "global_step": 271193, "epoch": 3267} {"train_loss": -25.737455368041992, "global_step": 271194, "epoch": 3267} {"train_loss": -25.318161010742188, "global_step": 271195, "epoch": 3267} {"train_loss": -25.25310707092285, "global_step": 271196, "epoch": 3267} {"train_loss": -25.267629623413086, "global_step": 271197, "epoch": 3267} {"train_loss": -25.04010581970215, "global_step": 271198, "epoch": 3267} {"train_loss": -25.279991149902344, "global_step": 271199, "epoch": 3267} {"train_loss": -25.33607292175293, "global_step": 271200, "epoch": 3267} {"train_loss": -25.043394088745117, "global_step": 271201, "epoch": 3267} {"train_loss": -25.431413650512695, "global_step": 271202, "epoch": 3267} {"train_loss": -25.50766944885254, "global_step": 271203, "epoch": 3267} {"train_loss": -25.374601364135742, "global_step": 271204, "epoch": 3267} {"train_loss": -25.311227798461914, "global_step": 271205, "epoch": 3267} {"train_loss": -25.590835571289062, "global_step": 271206, "epoch": 3267} {"train_loss": -25.369585037231445, "global_step": 271207, "epoch": 3267} {"train_loss": -25.47423553466797, "global_step": 271208, "epoch": 3267} {"train_loss": -24.982776641845703, "global_step": 271209, "epoch": 3267} {"train_loss": -25.266794204711914, "global_step": 271210, "epoch": 3267} {"train_loss": -24.935590744018555, "global_step": 271211, "epoch": 3267} {"train_loss": -24.991186141967773, "global_step": 271212, "epoch": 3267} {"train_loss": -25.359981536865234, "global_step": 271213, "epoch": 3267} {"train_loss": -25.46697998046875, "global_step": 271214, "epoch": 3267} {"train_loss": -25.3668212890625, "global_step": 271215, "epoch": 3267} {"train_loss": -25.170635223388672, "global_step": 271216, "epoch": 3267} {"train_loss": -25.575138092041016, "global_step": 271217, "epoch": 3267} {"train_loss": -25.49538803100586, "global_step": 271218, "epoch": 3267} {"train_loss": -25.3765869140625, "global_step": 271219, "epoch": 3267} {"train_loss": -25.23958396911621, "global_step": 271220, "epoch": 3267} {"train_loss": -24.953702926635742, "global_step": 271221, "epoch": 3267} {"train_loss": -25.264511108398438, "global_step": 271222, "epoch": 3267} {"train_loss": -25.326322555541992, "global_step": 271223, "epoch": 3267} {"train_loss": -25.47661781311035, "global_step": 271224, "epoch": 3267} {"train_loss": -24.988866806030273, "global_step": 271225, "epoch": 3267} {"train_loss": -25.303903579711914, "global_step": 271226, "epoch": 3267} {"train_loss": -25.51806640625, "global_step": 271227, "epoch": 3267} {"train_loss": -25.492000579833984, "global_step": 271228, "epoch": 3267} {"train_loss": -25.709192276000977, "global_step": 271229, "epoch": 3267} {"train_loss": -25.206148147583008, "global_step": 271230, "epoch": 3267} {"train_loss": -25.504215240478516, "global_step": 271231, "epoch": 3267} {"train_loss": -25.368120193481445, "global_step": 271232, "epoch": 3267} {"train_loss": -25.595678329467773, "global_step": 271233, "epoch": 3267} {"train_loss": -25.343671798706055, "global_step": 271234, "epoch": 3267} {"train_loss": -24.822147369384766, "global_step": 271235, "epoch": 3267} {"train_loss": -25.704730987548828, "global_step": 271236, "epoch": 3267} {"train_loss": -25.185277938842773, "global_step": 271237, "epoch": 3267} {"train_loss": -25.18869972229004, "global_step": 271238, "epoch": 3267} {"train_loss": -25.746551513671875, "global_step": 271239, "epoch": 3267} {"train_loss": -25.3995361328125, "global_step": 271240, "epoch": 3267} {"train_loss": -25.300914764404297, "global_step": 271241, "epoch": 3267} {"train_loss": -25.570581436157227, "global_step": 271242, "epoch": 3267} {"train_loss": -25.151149887636482, "global_step": 271243, "epoch": 3267, "val_loss": 7012040.0} {"train_loss": -24.326929092407227, "global_step": 271244, "epoch": 3268} {"train_loss": -24.132856369018555, "global_step": 271245, "epoch": 3268} {"train_loss": -24.574487686157227, "global_step": 271246, "epoch": 3268} {"train_loss": -24.508237838745117, "global_step": 271247, "epoch": 3268} {"train_loss": -24.9262638092041, "global_step": 271248, "epoch": 3268} {"train_loss": -24.381546020507812, "global_step": 271249, "epoch": 3268} {"train_loss": -24.897695541381836, "global_step": 271250, "epoch": 3268} {"train_loss": -24.51447105407715, "global_step": 271251, "epoch": 3268} {"train_loss": -24.547910690307617, "global_step": 271252, "epoch": 3268} {"train_loss": -25.002166748046875, "global_step": 271253, "epoch": 3268} {"train_loss": -24.700162887573242, "global_step": 271254, "epoch": 3268} {"train_loss": -24.80843734741211, "global_step": 271255, "epoch": 3268} {"train_loss": -24.636219024658203, "global_step": 271256, "epoch": 3268} {"train_loss": -23.286691665649414, "global_step": 271257, "epoch": 3268} {"train_loss": -24.78822135925293, "global_step": 271258, "epoch": 3268} {"train_loss": -24.807262420654297, "global_step": 271259, "epoch": 3268} {"train_loss": -24.685117721557617, "global_step": 271260, "epoch": 3268} {"train_loss": -25.14686393737793, "global_step": 271261, "epoch": 3268} {"train_loss": -24.8941593170166, "global_step": 271262, "epoch": 3268} {"train_loss": -24.840316772460938, "global_step": 271263, "epoch": 3268} {"train_loss": -25.046154022216797, "global_step": 271264, "epoch": 3268} {"train_loss": -24.660491943359375, "global_step": 271265, "epoch": 3268} {"train_loss": -24.93739891052246, "global_step": 271266, "epoch": 3268} {"train_loss": -25.336633682250977, "global_step": 271267, "epoch": 3268} {"train_loss": -24.881988525390625, "global_step": 271268, "epoch": 3268} {"train_loss": -25.438026428222656, "global_step": 271269, "epoch": 3268} {"train_loss": -25.093975067138672, "global_step": 271270, "epoch": 3268} {"train_loss": -25.00238037109375, "global_step": 271271, "epoch": 3268} {"train_loss": -24.996137619018555, "global_step": 271272, "epoch": 3268} {"train_loss": -25.059263229370117, "global_step": 271273, "epoch": 3268} {"train_loss": -25.024078369140625, "global_step": 271274, "epoch": 3268} {"train_loss": -25.328908920288086, "global_step": 271275, "epoch": 3268} {"train_loss": -25.164831161499023, "global_step": 271276, "epoch": 3268} {"train_loss": -25.593915939331055, "global_step": 271277, "epoch": 3268} {"train_loss": -25.359159469604492, "global_step": 271278, "epoch": 3268} {"train_loss": -25.04833984375, "global_step": 271279, "epoch": 3268} {"train_loss": -25.392377853393555, "global_step": 271280, "epoch": 3268} {"train_loss": -25.18635368347168, "global_step": 271281, "epoch": 3268} {"train_loss": -24.940336227416992, "global_step": 271282, "epoch": 3268} {"train_loss": -25.34715461730957, "global_step": 271283, "epoch": 3268} {"train_loss": -25.46532440185547, "global_step": 271284, "epoch": 3268} {"train_loss": -25.515655517578125, "global_step": 271285, "epoch": 3268} {"train_loss": -25.40540885925293, "global_step": 271286, "epoch": 3268} {"train_loss": -25.03312873840332, "global_step": 271287, "epoch": 3268} {"train_loss": -25.41590690612793, "global_step": 271288, "epoch": 3268} {"train_loss": -25.430383682250977, "global_step": 271289, "epoch": 3268} {"train_loss": -25.655439376831055, "global_step": 271290, "epoch": 3268} {"train_loss": -25.167490005493164, "global_step": 271291, "epoch": 3268} {"train_loss": -25.394180297851562, "global_step": 271292, "epoch": 3268} {"train_loss": -25.533733367919922, "global_step": 271293, "epoch": 3268} {"train_loss": -25.435728073120117, "global_step": 271294, "epoch": 3268} {"train_loss": -25.3480224609375, "global_step": 271295, "epoch": 3268} {"train_loss": -25.15004539489746, "global_step": 271296, "epoch": 3268} {"train_loss": -25.351232528686523, "global_step": 271297, "epoch": 3268} {"train_loss": -25.24497413635254, "global_step": 271298, "epoch": 3268} {"train_loss": -24.99012565612793, "global_step": 271299, "epoch": 3268} {"train_loss": -24.878646850585938, "global_step": 271300, "epoch": 3268} {"train_loss": -25.19198989868164, "global_step": 271301, "epoch": 3268} {"train_loss": -25.087636947631836, "global_step": 271302, "epoch": 3268} {"train_loss": -25.278427124023438, "global_step": 271303, "epoch": 3268} {"train_loss": -25.53012466430664, "global_step": 271304, "epoch": 3268} {"train_loss": -25.288297653198242, "global_step": 271305, "epoch": 3268} {"train_loss": -25.325870513916016, "global_step": 271306, "epoch": 3268} {"train_loss": -25.102386474609375, "global_step": 271307, "epoch": 3268} {"train_loss": -25.10418128967285, "global_step": 271308, "epoch": 3268} {"train_loss": -25.427892684936523, "global_step": 271309, "epoch": 3268} {"train_loss": -25.373348236083984, "global_step": 271310, "epoch": 3268} {"train_loss": -25.265024185180664, "global_step": 271311, "epoch": 3268} {"train_loss": -25.134994506835938, "global_step": 271312, "epoch": 3268} {"train_loss": -24.880590438842773, "global_step": 271313, "epoch": 3268} {"train_loss": -25.444860458374023, "global_step": 271314, "epoch": 3268} {"train_loss": -25.389633178710938, "global_step": 271315, "epoch": 3268} {"train_loss": -25.150983810424805, "global_step": 271316, "epoch": 3268} {"train_loss": -25.489749908447266, "global_step": 271317, "epoch": 3268} {"train_loss": -25.012008666992188, "global_step": 271318, "epoch": 3268} {"train_loss": -25.277624130249023, "global_step": 271319, "epoch": 3268} {"train_loss": -24.9295654296875, "global_step": 271320, "epoch": 3268} {"train_loss": -25.384382247924805, "global_step": 271321, "epoch": 3268} {"train_loss": -25.447444915771484, "global_step": 271322, "epoch": 3268} {"train_loss": -25.01633644104004, "global_step": 271323, "epoch": 3268} {"train_loss": -25.6778564453125, "global_step": 271324, "epoch": 3268} {"train_loss": -25.468997955322266, "global_step": 271325, "epoch": 3268} {"train_loss": -25.096075103943605, "global_step": 271326, "epoch": 3268, "val_loss": 7039746.5} {"train_loss": -24.27312660217285, "global_step": 271327, "epoch": 3269} {"train_loss": -24.44248390197754, "global_step": 271328, "epoch": 3269} {"train_loss": -24.546890258789062, "global_step": 271329, "epoch": 3269} {"train_loss": -24.215627670288086, "global_step": 271330, "epoch": 3269} {"train_loss": -24.39625358581543, "global_step": 271331, "epoch": 3269} {"train_loss": -24.86140251159668, "global_step": 271332, "epoch": 3269} {"train_loss": -24.329076766967773, "global_step": 271333, "epoch": 3269} {"train_loss": -24.79038429260254, "global_step": 271334, "epoch": 3269} {"train_loss": -24.604700088500977, "global_step": 271335, "epoch": 3269} {"train_loss": -24.76248550415039, "global_step": 271336, "epoch": 3269} {"train_loss": -25.00331687927246, "global_step": 271337, "epoch": 3269} {"train_loss": -24.971250534057617, "global_step": 271338, "epoch": 3269} {"train_loss": -24.844968795776367, "global_step": 271339, "epoch": 3269} {"train_loss": -25.284244537353516, "global_step": 271340, "epoch": 3269} {"train_loss": -25.054920196533203, "global_step": 271341, "epoch": 3269} {"train_loss": -25.53066062927246, "global_step": 271342, "epoch": 3269} {"train_loss": -25.088747024536133, "global_step": 271343, "epoch": 3269} {"train_loss": -24.915250778198242, "global_step": 271344, "epoch": 3269} {"train_loss": -25.334762573242188, "global_step": 271345, "epoch": 3269} {"train_loss": -25.232633590698242, "global_step": 271346, "epoch": 3269} {"train_loss": -25.336021423339844, "global_step": 271347, "epoch": 3269} {"train_loss": -25.460683822631836, "global_step": 271348, "epoch": 3269} {"train_loss": -25.17235565185547, "global_step": 271349, "epoch": 3269} {"train_loss": -25.430395126342773, "global_step": 271350, "epoch": 3269} {"train_loss": -25.502836227416992, "global_step": 271351, "epoch": 3269} {"train_loss": -25.045473098754883, "global_step": 271352, "epoch": 3269} {"train_loss": -25.26875877380371, "global_step": 271353, "epoch": 3269} {"train_loss": -25.251670837402344, "global_step": 271354, "epoch": 3269} {"train_loss": -25.389760971069336, "global_step": 271355, "epoch": 3269} {"train_loss": -25.164579391479492, "global_step": 271356, "epoch": 3269} {"train_loss": -25.194339752197266, "global_step": 271357, "epoch": 3269} {"train_loss": -25.334495544433594, "global_step": 271358, "epoch": 3269} {"train_loss": -25.59499168395996, "global_step": 271359, "epoch": 3269} {"train_loss": -25.37873077392578, "global_step": 271360, "epoch": 3269} {"train_loss": -25.8061466217041, "global_step": 271361, "epoch": 3269} {"train_loss": -25.260894775390625, "global_step": 271362, "epoch": 3269} {"train_loss": -25.114572525024414, "global_step": 271363, "epoch": 3269} {"train_loss": -25.469263076782227, "global_step": 271364, "epoch": 3269} {"train_loss": -25.336881637573242, "global_step": 271365, "epoch": 3269} {"train_loss": -25.215116500854492, "global_step": 271366, "epoch": 3269} {"train_loss": -25.071979522705078, "global_step": 271367, "epoch": 3269} {"train_loss": -25.30002784729004, "global_step": 271368, "epoch": 3269} {"train_loss": -25.60662841796875, "global_step": 271369, "epoch": 3269} {"train_loss": -25.747800827026367, "global_step": 271370, "epoch": 3269} {"train_loss": -25.418033599853516, "global_step": 271371, "epoch": 3269} {"train_loss": -25.288684844970703, "global_step": 271372, "epoch": 3269} {"train_loss": -25.145099639892578, "global_step": 271373, "epoch": 3269} {"train_loss": -24.88260269165039, "global_step": 271374, "epoch": 3269} {"train_loss": -25.413894653320312, "global_step": 271375, "epoch": 3269} {"train_loss": -25.404325485229492, "global_step": 271376, "epoch": 3269} {"train_loss": -24.92572021484375, "global_step": 271377, "epoch": 3269} {"train_loss": -25.38032341003418, "global_step": 271378, "epoch": 3269} {"train_loss": -25.185314178466797, "global_step": 271379, "epoch": 3269} {"train_loss": -25.760772705078125, "global_step": 271380, "epoch": 3269} {"train_loss": -25.42951774597168, "global_step": 271381, "epoch": 3269} {"train_loss": -25.424219131469727, "global_step": 271382, "epoch": 3269} {"train_loss": -24.906997680664062, "global_step": 271383, "epoch": 3269} {"train_loss": -25.160856246948242, "global_step": 271384, "epoch": 3269} {"train_loss": -25.035924911499023, "global_step": 271385, "epoch": 3269} {"train_loss": -25.341970443725586, "global_step": 271386, "epoch": 3269} {"train_loss": -24.836219787597656, "global_step": 271387, "epoch": 3269} {"train_loss": -25.001789093017578, "global_step": 271388, "epoch": 3269} {"train_loss": -25.299972534179688, "global_step": 271389, "epoch": 3269} {"train_loss": -24.80019187927246, "global_step": 271390, "epoch": 3269} {"train_loss": -24.484994888305664, "global_step": 271391, "epoch": 3269} {"train_loss": -25.055917739868164, "global_step": 271392, "epoch": 3269} {"train_loss": -25.155004501342773, "global_step": 271393, "epoch": 3269} {"train_loss": -24.9277286529541, "global_step": 271394, "epoch": 3269} {"train_loss": -24.67115592956543, "global_step": 271395, "epoch": 3269} {"train_loss": -25.204198837280273, "global_step": 271396, "epoch": 3269} {"train_loss": -25.16824722290039, "global_step": 271397, "epoch": 3269} {"train_loss": -24.895803451538086, "global_step": 271398, "epoch": 3269} {"train_loss": -25.213701248168945, "global_step": 271399, "epoch": 3269} {"train_loss": -25.50555992126465, "global_step": 271400, "epoch": 3269} {"train_loss": -25.443342208862305, "global_step": 271401, "epoch": 3269} {"train_loss": -25.55177879333496, "global_step": 271402, "epoch": 3269} {"train_loss": -25.362356185913086, "global_step": 271403, "epoch": 3269} {"train_loss": -25.007368087768555, "global_step": 271404, "epoch": 3269} {"train_loss": -25.245895385742188, "global_step": 271405, "epoch": 3269} {"train_loss": -25.103321075439453, "global_step": 271406, "epoch": 3269} {"train_loss": -25.14987564086914, "global_step": 271407, "epoch": 3269} {"train_loss": -25.03177261352539, "global_step": 271408, "epoch": 3269} {"train_loss": -25.12760555313294, "global_step": 271409, "epoch": 3269, "val_loss": 6965627.0} {"train_loss": -24.768789291381836, "global_step": 271410, "epoch": 3270} {"train_loss": -25.387248992919922, "global_step": 271411, "epoch": 3270} {"train_loss": -25.235803604125977, "global_step": 271412, "epoch": 3270} {"train_loss": -24.88881492614746, "global_step": 271413, "epoch": 3270} {"train_loss": -25.457523345947266, "global_step": 271414, "epoch": 3270} {"train_loss": -24.997833251953125, "global_step": 271415, "epoch": 3270} {"train_loss": -24.991165161132812, "global_step": 271416, "epoch": 3270} {"train_loss": -24.824155807495117, "global_step": 271417, "epoch": 3270} {"train_loss": -25.069198608398438, "global_step": 271418, "epoch": 3270} {"train_loss": -25.12213706970215, "global_step": 271419, "epoch": 3270} {"train_loss": -25.134809494018555, "global_step": 271420, "epoch": 3270} {"train_loss": -25.18537712097168, "global_step": 271421, "epoch": 3270} {"train_loss": -25.304031372070312, "global_step": 271422, "epoch": 3270} {"train_loss": -25.171865463256836, "global_step": 271423, "epoch": 3270} {"train_loss": -25.32354736328125, "global_step": 271424, "epoch": 3270} {"train_loss": -25.084848403930664, "global_step": 271425, "epoch": 3270} {"train_loss": -25.77294921875, "global_step": 271426, "epoch": 3270} {"train_loss": -25.067676544189453, "global_step": 271427, "epoch": 3270} {"train_loss": -25.486038208007812, "global_step": 271428, "epoch": 3270} {"train_loss": -25.735660552978516, "global_step": 271429, "epoch": 3270} {"train_loss": -25.337467193603516, "global_step": 271430, "epoch": 3270} {"train_loss": -25.21491050720215, "global_step": 271431, "epoch": 3270} {"train_loss": -25.523757934570312, "global_step": 271432, "epoch": 3270} {"train_loss": -25.46889877319336, "global_step": 271433, "epoch": 3270} {"train_loss": -25.178871154785156, "global_step": 271434, "epoch": 3270} {"train_loss": -25.73838233947754, "global_step": 271435, "epoch": 3270} {"train_loss": -25.28531837463379, "global_step": 271436, "epoch": 3270} {"train_loss": -25.3435001373291, "global_step": 271437, "epoch": 3270} {"train_loss": -25.3718318939209, "global_step": 271438, "epoch": 3270} {"train_loss": -25.648502349853516, "global_step": 271439, "epoch": 3270} {"train_loss": -24.931350708007812, "global_step": 271440, "epoch": 3270} {"train_loss": -25.490339279174805, "global_step": 271441, "epoch": 3270} {"train_loss": -25.30133056640625, "global_step": 271442, "epoch": 3270} {"train_loss": -25.374509811401367, "global_step": 271443, "epoch": 3270} {"train_loss": -24.858633041381836, "global_step": 271444, "epoch": 3270} {"train_loss": -25.1031551361084, "global_step": 271445, "epoch": 3270} {"train_loss": -24.971776962280273, "global_step": 271446, "epoch": 3270} {"train_loss": -25.057785034179688, "global_step": 271447, "epoch": 3270} {"train_loss": -25.37257957458496, "global_step": 271448, "epoch": 3270} {"train_loss": -24.865137100219727, "global_step": 271449, "epoch": 3270} {"train_loss": -25.35433006286621, "global_step": 271450, "epoch": 3270} {"train_loss": -25.35860252380371, "global_step": 271451, "epoch": 3270} {"train_loss": -24.786100387573242, "global_step": 271452, "epoch": 3270} {"train_loss": -25.076337814331055, "global_step": 271453, "epoch": 3270} {"train_loss": -25.143508911132812, "global_step": 271454, "epoch": 3270} {"train_loss": -25.102354049682617, "global_step": 271455, "epoch": 3270} {"train_loss": -25.545061111450195, "global_step": 271456, "epoch": 3270} {"train_loss": -25.29441261291504, "global_step": 271457, "epoch": 3270} {"train_loss": -25.14803123474121, "global_step": 271458, "epoch": 3270} {"train_loss": -25.419025421142578, "global_step": 271459, "epoch": 3270} {"train_loss": -25.081384658813477, "global_step": 271460, "epoch": 3270} {"train_loss": -25.28129005432129, "global_step": 271461, "epoch": 3270} {"train_loss": -25.518451690673828, "global_step": 271462, "epoch": 3270} {"train_loss": -25.460498809814453, "global_step": 271463, "epoch": 3270} {"train_loss": -25.526838302612305, "global_step": 271464, "epoch": 3270} {"train_loss": -25.267736434936523, "global_step": 271465, "epoch": 3270} {"train_loss": -25.160213470458984, "global_step": 271466, "epoch": 3270} {"train_loss": -25.4527645111084, "global_step": 271467, "epoch": 3270} {"train_loss": -25.485515594482422, "global_step": 271468, "epoch": 3270} {"train_loss": -25.309844970703125, "global_step": 271469, "epoch": 3270} {"train_loss": -25.478254318237305, "global_step": 271470, "epoch": 3270} {"train_loss": -25.346923828125, "global_step": 271471, "epoch": 3270} {"train_loss": -24.978227615356445, "global_step": 271472, "epoch": 3270} {"train_loss": -25.433053970336914, "global_step": 271473, "epoch": 3270} {"train_loss": -25.38178825378418, "global_step": 271474, "epoch": 3270} {"train_loss": -25.325040817260742, "global_step": 271475, "epoch": 3270} {"train_loss": -25.275768280029297, "global_step": 271476, "epoch": 3270} {"train_loss": -25.113563537597656, "global_step": 271477, "epoch": 3270} {"train_loss": -25.3216609954834, "global_step": 271478, "epoch": 3270} {"train_loss": -25.75238609313965, "global_step": 271479, "epoch": 3270} {"train_loss": -25.739837646484375, "global_step": 271480, "epoch": 3270} {"train_loss": -25.494918823242188, "global_step": 271481, "epoch": 3270} {"train_loss": -25.130062103271484, "global_step": 271482, "epoch": 3270} {"train_loss": -25.369230270385742, "global_step": 271483, "epoch": 3270} {"train_loss": -25.51369857788086, "global_step": 271484, "epoch": 3270} {"train_loss": -25.119474411010742, "global_step": 271485, "epoch": 3270} {"train_loss": -25.030778884887695, "global_step": 271486, "epoch": 3270} {"train_loss": -25.203088760375977, "global_step": 271487, "epoch": 3270} {"train_loss": -25.185989379882812, "global_step": 271488, "epoch": 3270} {"train_loss": -25.169050216674805, "global_step": 271489, "epoch": 3270} {"train_loss": -25.295082092285156, "global_step": 271490, "epoch": 3270} {"train_loss": -25.14716148376465, "global_step": 271491, "epoch": 3270} {"train_loss": -25.272887861872295, "global_step": 271492, "epoch": 3270, "val_loss": 7050228.0} {"train_loss": -24.98813819885254, "global_step": 271493, "epoch": 3271} {"train_loss": -24.847780227661133, "global_step": 271494, "epoch": 3271} {"train_loss": -24.902639389038086, "global_step": 271495, "epoch": 3271} {"train_loss": -25.09562110900879, "global_step": 271496, "epoch": 3271} {"train_loss": -25.056119918823242, "global_step": 271497, "epoch": 3271} {"train_loss": -25.311769485473633, "global_step": 271498, "epoch": 3271} {"train_loss": -25.13959312438965, "global_step": 271499, "epoch": 3271} {"train_loss": -25.433324813842773, "global_step": 271500, "epoch": 3271} {"train_loss": -25.315637588500977, "global_step": 271501, "epoch": 3271} {"train_loss": -25.13818359375, "global_step": 271502, "epoch": 3271} {"train_loss": -25.20353126525879, "global_step": 271503, "epoch": 3271} {"train_loss": -25.350252151489258, "global_step": 271504, "epoch": 3271} {"train_loss": -25.027854919433594, "global_step": 271505, "epoch": 3271} {"train_loss": -24.885465621948242, "global_step": 271506, "epoch": 3271} {"train_loss": -25.2338924407959, "global_step": 271507, "epoch": 3271} {"train_loss": -24.839258193969727, "global_step": 271508, "epoch": 3271} {"train_loss": -24.857881546020508, "global_step": 271509, "epoch": 3271} {"train_loss": -25.269001007080078, "global_step": 271510, "epoch": 3271} {"train_loss": -25.148399353027344, "global_step": 271511, "epoch": 3271} {"train_loss": -25.317039489746094, "global_step": 271512, "epoch": 3271} {"train_loss": -25.075029373168945, "global_step": 271513, "epoch": 3271} {"train_loss": -25.338037490844727, "global_step": 271514, "epoch": 3271} {"train_loss": -25.59406852722168, "global_step": 271515, "epoch": 3271} {"train_loss": -24.921781539916992, "global_step": 271516, "epoch": 3271} {"train_loss": -25.285829544067383, "global_step": 271517, "epoch": 3271} {"train_loss": -25.265714645385742, "global_step": 271518, "epoch": 3271} {"train_loss": -25.12322425842285, "global_step": 271519, "epoch": 3271} {"train_loss": -25.435497283935547, "global_step": 271520, "epoch": 3271} {"train_loss": -25.359617233276367, "global_step": 271521, "epoch": 3271} {"train_loss": -25.248600006103516, "global_step": 271522, "epoch": 3271} {"train_loss": -25.090234756469727, "global_step": 271523, "epoch": 3271} {"train_loss": -25.49997329711914, "global_step": 271524, "epoch": 3271} {"train_loss": -25.22376823425293, "global_step": 271525, "epoch": 3271} {"train_loss": -25.52894401550293, "global_step": 271526, "epoch": 3271} {"train_loss": -25.02503776550293, "global_step": 271527, "epoch": 3271} {"train_loss": -25.30743408203125, "global_step": 271528, "epoch": 3271} {"train_loss": -25.529220581054688, "global_step": 271529, "epoch": 3271} {"train_loss": -25.0351619720459, "global_step": 271530, "epoch": 3271} {"train_loss": -25.246625900268555, "global_step": 271531, "epoch": 3271} {"train_loss": -25.165258407592773, "global_step": 271532, "epoch": 3271} {"train_loss": -25.271451950073242, "global_step": 271533, "epoch": 3271} {"train_loss": -25.678747177124023, "global_step": 271534, "epoch": 3271} {"train_loss": -25.05220603942871, "global_step": 271535, "epoch": 3271} {"train_loss": -25.04166603088379, "global_step": 271536, "epoch": 3271} {"train_loss": -25.00999641418457, "global_step": 271537, "epoch": 3271} {"train_loss": -25.726917266845703, "global_step": 271538, "epoch": 3271} {"train_loss": -25.71595573425293, "global_step": 271539, "epoch": 3271} {"train_loss": -25.1411075592041, "global_step": 271540, "epoch": 3271} {"train_loss": -24.941869735717773, "global_step": 271541, "epoch": 3271} {"train_loss": -25.156293869018555, "global_step": 271542, "epoch": 3271} {"train_loss": -25.145902633666992, "global_step": 271543, "epoch": 3271} {"train_loss": -24.936792373657227, "global_step": 271544, "epoch": 3271} {"train_loss": -25.220441818237305, "global_step": 271545, "epoch": 3271} {"train_loss": -25.18536376953125, "global_step": 271546, "epoch": 3271} {"train_loss": -25.368799209594727, "global_step": 271547, "epoch": 3271} {"train_loss": -25.14140510559082, "global_step": 271548, "epoch": 3271} {"train_loss": -25.3678035736084, "global_step": 271549, "epoch": 3271} {"train_loss": -25.158309936523438, "global_step": 271550, "epoch": 3271} {"train_loss": -25.28250503540039, "global_step": 271551, "epoch": 3271} {"train_loss": -25.467893600463867, "global_step": 271552, "epoch": 3271} {"train_loss": -25.232336044311523, "global_step": 271553, "epoch": 3271} {"train_loss": -25.22764015197754, "global_step": 271554, "epoch": 3271} {"train_loss": -25.045711517333984, "global_step": 271555, "epoch": 3271} {"train_loss": -24.999502182006836, "global_step": 271556, "epoch": 3271} {"train_loss": -25.5490665435791, "global_step": 271557, "epoch": 3271} {"train_loss": -25.46480369567871, "global_step": 271558, "epoch": 3271} {"train_loss": -25.185232162475586, "global_step": 271559, "epoch": 3271} {"train_loss": -25.149805068969727, "global_step": 271560, "epoch": 3271} {"train_loss": -25.2347354888916, "global_step": 271561, "epoch": 3271} {"train_loss": -24.898706436157227, "global_step": 271562, "epoch": 3271} {"train_loss": -25.2525691986084, "global_step": 271563, "epoch": 3271} {"train_loss": -25.164196014404297, "global_step": 271564, "epoch": 3271} {"train_loss": -25.26070213317871, "global_step": 271565, "epoch": 3271} {"train_loss": -25.40605926513672, "global_step": 271566, "epoch": 3271} {"train_loss": -25.0699520111084, "global_step": 271567, "epoch": 3271} {"train_loss": -24.919342041015625, "global_step": 271568, "epoch": 3271} {"train_loss": -25.72677993774414, "global_step": 271569, "epoch": 3271} {"train_loss": -25.076770782470703, "global_step": 271570, "epoch": 3271} {"train_loss": -24.9980525970459, "global_step": 271571, "epoch": 3271} {"train_loss": -24.96550750732422, "global_step": 271572, "epoch": 3271} {"train_loss": -25.59134292602539, "global_step": 271573, "epoch": 3271} {"train_loss": -25.558422088623047, "global_step": 271574, "epoch": 3271} {"train_loss": -25.211038405636707, "global_step": 271575, "epoch": 3271, "val_loss": 7009847.0} {"train_loss": -24.787504196166992, "global_step": 271576, "epoch": 3272} {"train_loss": -25.151540756225586, "global_step": 271577, "epoch": 3272} {"train_loss": -25.15595054626465, "global_step": 271578, "epoch": 3272} {"train_loss": -25.25421714782715, "global_step": 271579, "epoch": 3272} {"train_loss": -25.41556739807129, "global_step": 271580, "epoch": 3272} {"train_loss": -24.957677841186523, "global_step": 271581, "epoch": 3272} {"train_loss": -24.96585464477539, "global_step": 271582, "epoch": 3272} {"train_loss": -24.80671501159668, "global_step": 271583, "epoch": 3272} {"train_loss": -24.845937728881836, "global_step": 271584, "epoch": 3272} {"train_loss": -24.84071922302246, "global_step": 271585, "epoch": 3272} {"train_loss": -25.024396896362305, "global_step": 271586, "epoch": 3272} {"train_loss": -25.388641357421875, "global_step": 271587, "epoch": 3272} {"train_loss": -25.040428161621094, "global_step": 271588, "epoch": 3272} {"train_loss": -25.343765258789062, "global_step": 271589, "epoch": 3272} {"train_loss": -25.008831024169922, "global_step": 271590, "epoch": 3272} {"train_loss": -25.549678802490234, "global_step": 271591, "epoch": 3272} {"train_loss": -25.36958122253418, "global_step": 271592, "epoch": 3272} {"train_loss": -24.98797035217285, "global_step": 271593, "epoch": 3272} {"train_loss": -25.265060424804688, "global_step": 271594, "epoch": 3272} {"train_loss": -25.2935791015625, "global_step": 271595, "epoch": 3272} {"train_loss": -25.23428726196289, "global_step": 271596, "epoch": 3272} {"train_loss": -25.36799430847168, "global_step": 271597, "epoch": 3272} {"train_loss": -25.373483657836914, "global_step": 271598, "epoch": 3272} {"train_loss": -25.214679718017578, "global_step": 271599, "epoch": 3272} {"train_loss": -25.213157653808594, "global_step": 271600, "epoch": 3272} {"train_loss": -25.065961837768555, "global_step": 271601, "epoch": 3272} {"train_loss": -25.514759063720703, "global_step": 271602, "epoch": 3272} {"train_loss": -25.378694534301758, "global_step": 271603, "epoch": 3272} {"train_loss": -25.47194480895996, "global_step": 271604, "epoch": 3272} {"train_loss": -25.241008758544922, "global_step": 271605, "epoch": 3272} {"train_loss": -25.22128677368164, "global_step": 271606, "epoch": 3272} {"train_loss": -25.096378326416016, "global_step": 271607, "epoch": 3272} {"train_loss": -25.578353881835938, "global_step": 271608, "epoch": 3272} {"train_loss": -25.54376792907715, "global_step": 271609, "epoch": 3272} {"train_loss": -25.743122100830078, "global_step": 271610, "epoch": 3272} {"train_loss": -25.358884811401367, "global_step": 271611, "epoch": 3272} {"train_loss": -25.34767723083496, "global_step": 271612, "epoch": 3272} {"train_loss": -25.29165267944336, "global_step": 271613, "epoch": 3272} {"train_loss": -25.653034210205078, "global_step": 271614, "epoch": 3272} {"train_loss": -25.393056869506836, "global_step": 271615, "epoch": 3272} {"train_loss": -25.289094924926758, "global_step": 271616, "epoch": 3272} {"train_loss": -25.48580551147461, "global_step": 271617, "epoch": 3272} {"train_loss": -25.438352584838867, "global_step": 271618, "epoch": 3272} {"train_loss": -25.881750106811523, "global_step": 271619, "epoch": 3272} {"train_loss": -25.663122177124023, "global_step": 271620, "epoch": 3272} {"train_loss": -25.464086532592773, "global_step": 271621, "epoch": 3272} {"train_loss": -25.306798934936523, "global_step": 271622, "epoch": 3272} {"train_loss": -25.147216796875, "global_step": 271623, "epoch": 3272} {"train_loss": -25.328039169311523, "global_step": 271624, "epoch": 3272} {"train_loss": -25.573272705078125, "global_step": 271625, "epoch": 3272} {"train_loss": -25.352195739746094, "global_step": 271626, "epoch": 3272} {"train_loss": -25.1099910736084, "global_step": 271627, "epoch": 3272} {"train_loss": -25.34783363342285, "global_step": 271628, "epoch": 3272} {"train_loss": -25.081134796142578, "global_step": 271629, "epoch": 3272} {"train_loss": -25.203487396240234, "global_step": 271630, "epoch": 3272} {"train_loss": -25.25259780883789, "global_step": 271631, "epoch": 3272} {"train_loss": -25.264739990234375, "global_step": 271632, "epoch": 3272} {"train_loss": -25.34871482849121, "global_step": 271633, "epoch": 3272} {"train_loss": -25.077133178710938, "global_step": 271634, "epoch": 3272} {"train_loss": -25.043750762939453, "global_step": 271635, "epoch": 3272} {"train_loss": -25.112043380737305, "global_step": 271636, "epoch": 3272} {"train_loss": -24.77742576599121, "global_step": 271637, "epoch": 3272} {"train_loss": -25.332717895507812, "global_step": 271638, "epoch": 3272} {"train_loss": -24.86331558227539, "global_step": 271639, "epoch": 3272} {"train_loss": -24.868732452392578, "global_step": 271640, "epoch": 3272} {"train_loss": -24.79427146911621, "global_step": 271641, "epoch": 3272} {"train_loss": -24.625694274902344, "global_step": 271642, "epoch": 3272} {"train_loss": -25.307302474975586, "global_step": 271643, "epoch": 3272} {"train_loss": -25.35187530517578, "global_step": 271644, "epoch": 3272} {"train_loss": -24.89431381225586, "global_step": 271645, "epoch": 3272} {"train_loss": -25.420116424560547, "global_step": 271646, "epoch": 3272} {"train_loss": -25.36334800720215, "global_step": 271647, "epoch": 3272} {"train_loss": -25.501005172729492, "global_step": 271648, "epoch": 3272} {"train_loss": -25.31342124938965, "global_step": 271649, "epoch": 3272} {"train_loss": -25.45817756652832, "global_step": 271650, "epoch": 3272} {"train_loss": -25.463897705078125, "global_step": 271651, "epoch": 3272} {"train_loss": -25.293058395385742, "global_step": 271652, "epoch": 3272} {"train_loss": -25.532657623291016, "global_step": 271653, "epoch": 3272} {"train_loss": -25.204748153686523, "global_step": 271654, "epoch": 3272} {"train_loss": -25.36424446105957, "global_step": 271655, "epoch": 3272} {"train_loss": -25.59404945373535, "global_step": 271656, "epoch": 3272} {"train_loss": -25.287734985351562, "global_step": 271657, "epoch": 3272} {"train_loss": -25.26556458530656, "global_step": 271658, "epoch": 3272, "val_loss": 6912996.0} {"train_loss": -25.079221725463867, "global_step": 271659, "epoch": 3273} {"train_loss": -24.856874465942383, "global_step": 271660, "epoch": 3273} {"train_loss": -25.235876083374023, "global_step": 271661, "epoch": 3273} {"train_loss": -24.93940544128418, "global_step": 271662, "epoch": 3273} {"train_loss": -25.145849227905273, "global_step": 271663, "epoch": 3273} {"train_loss": -24.794288635253906, "global_step": 271664, "epoch": 3273} {"train_loss": -25.0478458404541, "global_step": 271665, "epoch": 3273} {"train_loss": -25.126060485839844, "global_step": 271666, "epoch": 3273} {"train_loss": -25.533355712890625, "global_step": 271667, "epoch": 3273} {"train_loss": -25.030696868896484, "global_step": 271668, "epoch": 3273} {"train_loss": -25.171262741088867, "global_step": 271669, "epoch": 3273} {"train_loss": -24.874256134033203, "global_step": 271670, "epoch": 3273} {"train_loss": -24.921737670898438, "global_step": 271671, "epoch": 3273} {"train_loss": -25.167646408081055, "global_step": 271672, "epoch": 3273} {"train_loss": -25.041440963745117, "global_step": 271673, "epoch": 3273} {"train_loss": -24.666933059692383, "global_step": 271674, "epoch": 3273} {"train_loss": -24.877277374267578, "global_step": 271675, "epoch": 3273} {"train_loss": -25.2886905670166, "global_step": 271676, "epoch": 3273} {"train_loss": -24.225467681884766, "global_step": 271677, "epoch": 3273} {"train_loss": -24.422941207885742, "global_step": 271678, "epoch": 3273} {"train_loss": -25.15546989440918, "global_step": 271679, "epoch": 3273} {"train_loss": -24.61357879638672, "global_step": 271680, "epoch": 3273} {"train_loss": -25.044294357299805, "global_step": 271681, "epoch": 3273} {"train_loss": -24.59669303894043, "global_step": 271682, "epoch": 3273} {"train_loss": -24.742450714111328, "global_step": 271683, "epoch": 3273} {"train_loss": -25.179651260375977, "global_step": 271684, "epoch": 3273} {"train_loss": -24.976499557495117, "global_step": 271685, "epoch": 3273} {"train_loss": -25.142759323120117, "global_step": 271686, "epoch": 3273} {"train_loss": -25.036542892456055, "global_step": 271687, "epoch": 3273} {"train_loss": -25.386903762817383, "global_step": 271688, "epoch": 3273} {"train_loss": -25.070968627929688, "global_step": 271689, "epoch": 3273} {"train_loss": -25.271175384521484, "global_step": 271690, "epoch": 3273} {"train_loss": -24.84219741821289, "global_step": 271691, "epoch": 3273} {"train_loss": -25.018877029418945, "global_step": 271692, "epoch": 3273} {"train_loss": -25.027746200561523, "global_step": 271693, "epoch": 3273} {"train_loss": -25.499950408935547, "global_step": 271694, "epoch": 3273} {"train_loss": -25.09015464782715, "global_step": 271695, "epoch": 3273} {"train_loss": -24.842151641845703, "global_step": 271696, "epoch": 3273} {"train_loss": -25.382627487182617, "global_step": 271697, "epoch": 3273} {"train_loss": -24.725330352783203, "global_step": 271698, "epoch": 3273} {"train_loss": -25.27569580078125, "global_step": 271699, "epoch": 3273} {"train_loss": -25.30515480041504, "global_step": 271700, "epoch": 3273} {"train_loss": -25.370080947875977, "global_step": 271701, "epoch": 3273} {"train_loss": -25.55709457397461, "global_step": 271702, "epoch": 3273} {"train_loss": -24.968088150024414, "global_step": 271703, "epoch": 3273} {"train_loss": -25.422271728515625, "global_step": 271704, "epoch": 3273} {"train_loss": -25.107318878173828, "global_step": 271705, "epoch": 3273} {"train_loss": -25.71327018737793, "global_step": 271706, "epoch": 3273} {"train_loss": -25.302993774414062, "global_step": 271707, "epoch": 3273} {"train_loss": -25.4748477935791, "global_step": 271708, "epoch": 3273} {"train_loss": -25.21428680419922, "global_step": 271709, "epoch": 3273} {"train_loss": -25.936193466186523, "global_step": 271710, "epoch": 3273} {"train_loss": -25.55462646484375, "global_step": 271711, "epoch": 3273} {"train_loss": -24.91494369506836, "global_step": 271712, "epoch": 3273} {"train_loss": -25.266273498535156, "global_step": 271713, "epoch": 3273} {"train_loss": -25.27098846435547, "global_step": 271714, "epoch": 3273} {"train_loss": -25.368804931640625, "global_step": 271715, "epoch": 3273} {"train_loss": -25.200180053710938, "global_step": 271716, "epoch": 3273} {"train_loss": -25.279436111450195, "global_step": 271717, "epoch": 3273} {"train_loss": -25.626806259155273, "global_step": 271718, "epoch": 3273} {"train_loss": -25.26645851135254, "global_step": 271719, "epoch": 3273} {"train_loss": -25.03095054626465, "global_step": 271720, "epoch": 3273} {"train_loss": -25.22520637512207, "global_step": 271721, "epoch": 3273} {"train_loss": -25.03419303894043, "global_step": 271722, "epoch": 3273} {"train_loss": -25.41806411743164, "global_step": 271723, "epoch": 3273} {"train_loss": -25.016605377197266, "global_step": 271724, "epoch": 3273} {"train_loss": -25.36945152282715, "global_step": 271725, "epoch": 3273} {"train_loss": -25.37050437927246, "global_step": 271726, "epoch": 3273} {"train_loss": -25.183216094970703, "global_step": 271727, "epoch": 3273} {"train_loss": -25.706256866455078, "global_step": 271728, "epoch": 3273} {"train_loss": -25.190662384033203, "global_step": 271729, "epoch": 3273} {"train_loss": -25.0327091217041, "global_step": 271730, "epoch": 3273} {"train_loss": -25.08217430114746, "global_step": 271731, "epoch": 3273} {"train_loss": -25.192102432250977, "global_step": 271732, "epoch": 3273} {"train_loss": -25.244932174682617, "global_step": 271733, "epoch": 3273} {"train_loss": -25.090682983398438, "global_step": 271734, "epoch": 3273} {"train_loss": -25.271148681640625, "global_step": 271735, "epoch": 3273} {"train_loss": -25.316009521484375, "global_step": 271736, "epoch": 3273} {"train_loss": -25.377653121948242, "global_step": 271737, "epoch": 3273} {"train_loss": -25.063159942626953, "global_step": 271738, "epoch": 3273} {"train_loss": -24.94313621520996, "global_step": 271739, "epoch": 3273} {"train_loss": -24.859128952026367, "global_step": 271740, "epoch": 3273} {"train_loss": -25.13680265035974, "global_step": 271741, "epoch": 3273, "val_loss": 7045048.5} {"train_loss": -24.378957748413086, "global_step": 271742, "epoch": 3274} {"train_loss": -25.071699142456055, "global_step": 271743, "epoch": 3274} {"train_loss": -24.53753662109375, "global_step": 271744, "epoch": 3274} {"train_loss": -24.863351821899414, "global_step": 271745, "epoch": 3274} {"train_loss": -25.016489028930664, "global_step": 271746, "epoch": 3274} {"train_loss": -24.902347564697266, "global_step": 271747, "epoch": 3274} {"train_loss": -24.40022087097168, "global_step": 271748, "epoch": 3274} {"train_loss": -24.99079704284668, "global_step": 271749, "epoch": 3274} {"train_loss": -24.724166870117188, "global_step": 271750, "epoch": 3274} {"train_loss": -24.913272857666016, "global_step": 271751, "epoch": 3274} {"train_loss": -24.928760528564453, "global_step": 271752, "epoch": 3274} {"train_loss": -24.938095092773438, "global_step": 271753, "epoch": 3274} {"train_loss": -24.839115142822266, "global_step": 271754, "epoch": 3274} {"train_loss": -25.29351234436035, "global_step": 271755, "epoch": 3274} {"train_loss": -25.222787857055664, "global_step": 271756, "epoch": 3274} {"train_loss": -25.010637283325195, "global_step": 271757, "epoch": 3274} {"train_loss": -25.181257247924805, "global_step": 271758, "epoch": 3274} {"train_loss": -25.533185958862305, "global_step": 271759, "epoch": 3274} {"train_loss": -24.95552635192871, "global_step": 271760, "epoch": 3274} {"train_loss": -24.897354125976562, "global_step": 271761, "epoch": 3274} {"train_loss": -25.235748291015625, "global_step": 271762, "epoch": 3274} {"train_loss": -25.34480857849121, "global_step": 271763, "epoch": 3274} {"train_loss": -25.2308349609375, "global_step": 271764, "epoch": 3274} {"train_loss": -25.371688842773438, "global_step": 271765, "epoch": 3274} {"train_loss": -25.217504501342773, "global_step": 271766, "epoch": 3274} {"train_loss": -25.424453735351562, "global_step": 271767, "epoch": 3274} {"train_loss": -25.329885482788086, "global_step": 271768, "epoch": 3274} {"train_loss": -25.276487350463867, "global_step": 271769, "epoch": 3274} {"train_loss": -25.10352897644043, "global_step": 271770, "epoch": 3274} {"train_loss": -24.743423461914062, "global_step": 271771, "epoch": 3274} {"train_loss": -25.08271026611328, "global_step": 271772, "epoch": 3274} {"train_loss": -25.08824348449707, "global_step": 271773, "epoch": 3274} {"train_loss": -25.47286033630371, "global_step": 271774, "epoch": 3274} {"train_loss": -25.55213737487793, "global_step": 271775, "epoch": 3274} {"train_loss": -25.652799606323242, "global_step": 271776, "epoch": 3274} {"train_loss": -25.698455810546875, "global_step": 271777, "epoch": 3274} {"train_loss": -25.346637725830078, "global_step": 271778, "epoch": 3274} {"train_loss": -25.203384399414062, "global_step": 271779, "epoch": 3274} {"train_loss": -25.650415420532227, "global_step": 271780, "epoch": 3274} {"train_loss": -25.62526512145996, "global_step": 271781, "epoch": 3274} {"train_loss": -25.447309494018555, "global_step": 271782, "epoch": 3274} {"train_loss": -25.417346954345703, "global_step": 271783, "epoch": 3274} {"train_loss": -25.44585418701172, "global_step": 271784, "epoch": 3274} {"train_loss": -25.29129409790039, "global_step": 271785, "epoch": 3274} {"train_loss": -25.485061645507812, "global_step": 271786, "epoch": 3274} {"train_loss": -25.770593643188477, "global_step": 271787, "epoch": 3274} {"train_loss": -25.14430809020996, "global_step": 271788, "epoch": 3274} {"train_loss": -25.4969425201416, "global_step": 271789, "epoch": 3274} {"train_loss": -25.095569610595703, "global_step": 271790, "epoch": 3274} {"train_loss": -25.26439666748047, "global_step": 271791, "epoch": 3274} {"train_loss": -25.4645938873291, "global_step": 271792, "epoch": 3274} {"train_loss": -25.49701499938965, "global_step": 271793, "epoch": 3274} {"train_loss": -25.438817977905273, "global_step": 271794, "epoch": 3274} {"train_loss": -25.51881217956543, "global_step": 271795, "epoch": 3274} {"train_loss": -25.147275924682617, "global_step": 271796, "epoch": 3274} {"train_loss": -25.008859634399414, "global_step": 271797, "epoch": 3274} {"train_loss": -25.260272979736328, "global_step": 271798, "epoch": 3274} {"train_loss": -25.111906051635742, "global_step": 271799, "epoch": 3274} {"train_loss": -24.967140197753906, "global_step": 271800, "epoch": 3274} {"train_loss": -24.777891159057617, "global_step": 271801, "epoch": 3274} {"train_loss": -25.31683921813965, "global_step": 271802, "epoch": 3274} {"train_loss": -25.224443435668945, "global_step": 271803, "epoch": 3274} {"train_loss": -25.021947860717773, "global_step": 271804, "epoch": 3274} {"train_loss": -24.92093276977539, "global_step": 271805, "epoch": 3274} {"train_loss": -25.434080123901367, "global_step": 271806, "epoch": 3274} {"train_loss": -25.203140258789062, "global_step": 271807, "epoch": 3274} {"train_loss": -25.173139572143555, "global_step": 271808, "epoch": 3274} {"train_loss": -25.10809326171875, "global_step": 271809, "epoch": 3274} {"train_loss": -25.344289779663086, "global_step": 271810, "epoch": 3274} {"train_loss": -24.974109649658203, "global_step": 271811, "epoch": 3274} {"train_loss": -25.19953727722168, "global_step": 271812, "epoch": 3274} {"train_loss": -25.474872589111328, "global_step": 271813, "epoch": 3274} {"train_loss": -25.380949020385742, "global_step": 271814, "epoch": 3274} {"train_loss": -25.417200088500977, "global_step": 271815, "epoch": 3274} {"train_loss": -25.193389892578125, "global_step": 271816, "epoch": 3274} {"train_loss": -25.28032875061035, "global_step": 271817, "epoch": 3274} {"train_loss": -25.13252830505371, "global_step": 271818, "epoch": 3274} {"train_loss": -25.328760147094727, "global_step": 271819, "epoch": 3274} {"train_loss": -25.15496826171875, "global_step": 271820, "epoch": 3274} {"train_loss": -25.155601501464844, "global_step": 271821, "epoch": 3274} {"train_loss": -25.52643394470215, "global_step": 271822, "epoch": 3274} {"train_loss": -25.544160842895508, "global_step": 271823, "epoch": 3274} {"train_loss": -25.209321493125824, "global_step": 271824, "epoch": 3274, "val_loss": 6988103.0} {"train_loss": -25.36355209350586, "global_step": 271825, "epoch": 3275} {"train_loss": -25.20351791381836, "global_step": 271826, "epoch": 3275} {"train_loss": -25.154478073120117, "global_step": 271827, "epoch": 3275} {"train_loss": -25.10321617126465, "global_step": 271828, "epoch": 3275} {"train_loss": -25.441665649414062, "global_step": 271829, "epoch": 3275} {"train_loss": -25.103294372558594, "global_step": 271830, "epoch": 3275} {"train_loss": -25.680322647094727, "global_step": 271831, "epoch": 3275} {"train_loss": -25.089506149291992, "global_step": 271832, "epoch": 3275} {"train_loss": -25.15810775756836, "global_step": 271833, "epoch": 3275} {"train_loss": -25.16242027282715, "global_step": 271834, "epoch": 3275} {"train_loss": -25.237018585205078, "global_step": 271835, "epoch": 3275} {"train_loss": -25.249494552612305, "global_step": 271836, "epoch": 3275} {"train_loss": -25.10848045349121, "global_step": 271837, "epoch": 3275} {"train_loss": -25.50144386291504, "global_step": 271838, "epoch": 3275} {"train_loss": -25.182048797607422, "global_step": 271839, "epoch": 3275} {"train_loss": -25.546571731567383, "global_step": 271840, "epoch": 3275} {"train_loss": -25.31428337097168, "global_step": 271841, "epoch": 3275} {"train_loss": -25.302644729614258, "global_step": 271842, "epoch": 3275} {"train_loss": -25.5058536529541, "global_step": 271843, "epoch": 3275} {"train_loss": -25.587528228759766, "global_step": 271844, "epoch": 3275} {"train_loss": -24.996768951416016, "global_step": 271845, "epoch": 3275} {"train_loss": -25.374265670776367, "global_step": 271846, "epoch": 3275} {"train_loss": -25.226850509643555, "global_step": 271847, "epoch": 3275} {"train_loss": -25.42401123046875, "global_step": 271848, "epoch": 3275} {"train_loss": -25.33790397644043, "global_step": 271849, "epoch": 3275} {"train_loss": -24.89485740661621, "global_step": 271850, "epoch": 3275} {"train_loss": -25.138769149780273, "global_step": 271851, "epoch": 3275} {"train_loss": -25.206287384033203, "global_step": 271852, "epoch": 3275} {"train_loss": -25.624982833862305, "global_step": 271853, "epoch": 3275} {"train_loss": -25.492040634155273, "global_step": 271854, "epoch": 3275} {"train_loss": -25.17148780822754, "global_step": 271855, "epoch": 3275} {"train_loss": -25.615278244018555, "global_step": 271856, "epoch": 3275} {"train_loss": -25.410985946655273, "global_step": 271857, "epoch": 3275} {"train_loss": -25.40764808654785, "global_step": 271858, "epoch": 3275} {"train_loss": -25.617725372314453, "global_step": 271859, "epoch": 3275} {"train_loss": -25.720458984375, "global_step": 271860, "epoch": 3275} {"train_loss": -25.29668617248535, "global_step": 271861, "epoch": 3275} {"train_loss": -25.420007705688477, "global_step": 271862, "epoch": 3275} {"train_loss": -25.506738662719727, "global_step": 271863, "epoch": 3275} {"train_loss": -25.40678596496582, "global_step": 271864, "epoch": 3275} {"train_loss": -25.187389373779297, "global_step": 271865, "epoch": 3275} {"train_loss": -25.186676025390625, "global_step": 271866, "epoch": 3275} {"train_loss": -25.368432998657227, "global_step": 271867, "epoch": 3275} {"train_loss": -25.444055557250977, "global_step": 271868, "epoch": 3275} {"train_loss": -25.57904052734375, "global_step": 271869, "epoch": 3275} {"train_loss": -25.411497116088867, "global_step": 271870, "epoch": 3275} {"train_loss": -25.379819869995117, "global_step": 271871, "epoch": 3275} {"train_loss": -25.490163803100586, "global_step": 271872, "epoch": 3275} {"train_loss": -25.3824462890625, "global_step": 271873, "epoch": 3275} {"train_loss": -25.56122398376465, "global_step": 271874, "epoch": 3275} {"train_loss": -25.267332077026367, "global_step": 271875, "epoch": 3275} {"train_loss": -24.994464874267578, "global_step": 271876, "epoch": 3275} {"train_loss": -25.419151306152344, "global_step": 271877, "epoch": 3275} {"train_loss": -25.107486724853516, "global_step": 271878, "epoch": 3275} {"train_loss": -25.55440330505371, "global_step": 271879, "epoch": 3275} {"train_loss": -24.871076583862305, "global_step": 271880, "epoch": 3275} {"train_loss": -24.978580474853516, "global_step": 271881, "epoch": 3275} {"train_loss": -25.533159255981445, "global_step": 271882, "epoch": 3275} {"train_loss": -24.76712989807129, "global_step": 271883, "epoch": 3275} {"train_loss": -25.095075607299805, "global_step": 271884, "epoch": 3275} {"train_loss": -25.41019058227539, "global_step": 271885, "epoch": 3275} {"train_loss": -24.991775512695312, "global_step": 271886, "epoch": 3275} {"train_loss": -25.30277442932129, "global_step": 271887, "epoch": 3275} {"train_loss": -25.37424087524414, "global_step": 271888, "epoch": 3275} {"train_loss": -25.2499942779541, "global_step": 271889, "epoch": 3275} {"train_loss": -25.213367462158203, "global_step": 271890, "epoch": 3275} {"train_loss": -25.129375457763672, "global_step": 271891, "epoch": 3275} {"train_loss": -25.19047737121582, "global_step": 271892, "epoch": 3275} {"train_loss": -25.215158462524414, "global_step": 271893, "epoch": 3275} {"train_loss": -25.052555084228516, "global_step": 271894, "epoch": 3275} {"train_loss": -25.57893943786621, "global_step": 271895, "epoch": 3275} {"train_loss": -25.195968627929688, "global_step": 271896, "epoch": 3275} {"train_loss": -25.572254180908203, "global_step": 271897, "epoch": 3275} {"train_loss": -25.015182495117188, "global_step": 271898, "epoch": 3275} {"train_loss": -24.81300163269043, "global_step": 271899, "epoch": 3275} {"train_loss": -25.70865821838379, "global_step": 271900, "epoch": 3275} {"train_loss": -24.72345542907715, "global_step": 271901, "epoch": 3275} {"train_loss": -25.146520614624023, "global_step": 271902, "epoch": 3275} {"train_loss": -25.097373962402344, "global_step": 271903, "epoch": 3275} {"train_loss": -25.252790451049805, "global_step": 271904, "epoch": 3275} {"train_loss": -25.383056640625, "global_step": 271905, "epoch": 3275} {"train_loss": -25.121503829956055, "global_step": 271906, "epoch": 3275} {"train_loss": -25.282844014914637, "global_step": 271907, "epoch": 3275, "val_loss": 6946167.0} {"train_loss": -24.624378204345703, "global_step": 271908, "epoch": 3276} {"train_loss": -24.59735870361328, "global_step": 271909, "epoch": 3276} {"train_loss": -24.85623550415039, "global_step": 271910, "epoch": 3276} {"train_loss": -25.06264305114746, "global_step": 271911, "epoch": 3276} {"train_loss": -24.58900260925293, "global_step": 271912, "epoch": 3276} {"train_loss": -25.060808181762695, "global_step": 271913, "epoch": 3276} {"train_loss": -24.729001998901367, "global_step": 271914, "epoch": 3276} {"train_loss": -24.599760055541992, "global_step": 271915, "epoch": 3276} {"train_loss": -25.013629913330078, "global_step": 271916, "epoch": 3276} {"train_loss": -25.009021759033203, "global_step": 271917, "epoch": 3276} {"train_loss": -25.00721549987793, "global_step": 271918, "epoch": 3276} {"train_loss": -24.784744262695312, "global_step": 271919, "epoch": 3276} {"train_loss": -25.35079002380371, "global_step": 271920, "epoch": 3276} {"train_loss": -25.004928588867188, "global_step": 271921, "epoch": 3276} {"train_loss": -25.174137115478516, "global_step": 271922, "epoch": 3276} {"train_loss": -24.80866241455078, "global_step": 271923, "epoch": 3276} {"train_loss": -24.718923568725586, "global_step": 271924, "epoch": 3276} {"train_loss": -25.181169509887695, "global_step": 271925, "epoch": 3276} {"train_loss": -25.413694381713867, "global_step": 271926, "epoch": 3276} {"train_loss": -25.147218704223633, "global_step": 271927, "epoch": 3276} {"train_loss": -25.25923728942871, "global_step": 271928, "epoch": 3276} {"train_loss": -24.84657859802246, "global_step": 271929, "epoch": 3276} {"train_loss": -25.0507755279541, "global_step": 271930, "epoch": 3276} {"train_loss": -25.022062301635742, "global_step": 271931, "epoch": 3276} {"train_loss": -25.746633529663086, "global_step": 271932, "epoch": 3276} {"train_loss": -25.465347290039062, "global_step": 271933, "epoch": 3276} {"train_loss": -24.826536178588867, "global_step": 271934, "epoch": 3276} {"train_loss": -25.26108169555664, "global_step": 271935, "epoch": 3276} {"train_loss": -24.935874938964844, "global_step": 271936, "epoch": 3276} {"train_loss": -25.331470489501953, "global_step": 271937, "epoch": 3276} {"train_loss": -25.027463912963867, "global_step": 271938, "epoch": 3276} {"train_loss": -25.382301330566406, "global_step": 271939, "epoch": 3276} {"train_loss": -25.098342895507812, "global_step": 271940, "epoch": 3276} {"train_loss": -25.4477481842041, "global_step": 271941, "epoch": 3276} {"train_loss": -25.32740592956543, "global_step": 271942, "epoch": 3276} {"train_loss": -25.502599716186523, "global_step": 271943, "epoch": 3276} {"train_loss": -25.38850212097168, "global_step": 271944, "epoch": 3276} {"train_loss": -25.78451919555664, "global_step": 271945, "epoch": 3276} {"train_loss": -25.734582901000977, "global_step": 271946, "epoch": 3276} {"train_loss": -25.467166900634766, "global_step": 271947, "epoch": 3276} {"train_loss": -25.497236251831055, "global_step": 271948, "epoch": 3276} {"train_loss": -25.136489868164062, "global_step": 271949, "epoch": 3276} {"train_loss": -25.269193649291992, "global_step": 271950, "epoch": 3276} {"train_loss": -25.384445190429688, "global_step": 271951, "epoch": 3276} {"train_loss": -25.253597259521484, "global_step": 271952, "epoch": 3276} {"train_loss": -25.531940460205078, "global_step": 271953, "epoch": 3276} {"train_loss": -25.164691925048828, "global_step": 271954, "epoch": 3276} {"train_loss": -25.560400009155273, "global_step": 271955, "epoch": 3276} {"train_loss": -25.588150024414062, "global_step": 271956, "epoch": 3276} {"train_loss": -25.553293228149414, "global_step": 271957, "epoch": 3276} {"train_loss": -25.199939727783203, "global_step": 271958, "epoch": 3276} {"train_loss": -25.495391845703125, "global_step": 271959, "epoch": 3276} {"train_loss": -25.370338439941406, "global_step": 271960, "epoch": 3276} {"train_loss": -25.05500602722168, "global_step": 271961, "epoch": 3276} {"train_loss": -25.48091697692871, "global_step": 271962, "epoch": 3276} {"train_loss": -24.985803604125977, "global_step": 271963, "epoch": 3276} {"train_loss": -24.69757652282715, "global_step": 271964, "epoch": 3276} {"train_loss": -25.175094604492188, "global_step": 271965, "epoch": 3276} {"train_loss": -25.101980209350586, "global_step": 271966, "epoch": 3276} {"train_loss": -25.193958282470703, "global_step": 271967, "epoch": 3276} {"train_loss": -25.321441650390625, "global_step": 271968, "epoch": 3276} {"train_loss": -24.85127830505371, "global_step": 271969, "epoch": 3276} {"train_loss": -25.37989616394043, "global_step": 271970, "epoch": 3276} {"train_loss": -25.011463165283203, "global_step": 271971, "epoch": 3276} {"train_loss": -25.206735610961914, "global_step": 271972, "epoch": 3276} {"train_loss": -24.66860008239746, "global_step": 271973, "epoch": 3276} {"train_loss": -25.2993106842041, "global_step": 271974, "epoch": 3276} {"train_loss": -25.168231964111328, "global_step": 271975, "epoch": 3276} {"train_loss": -25.598913192749023, "global_step": 271976, "epoch": 3276} {"train_loss": -25.13513946533203, "global_step": 271977, "epoch": 3276} {"train_loss": -25.509857177734375, "global_step": 271978, "epoch": 3276} {"train_loss": -25.574548721313477, "global_step": 271979, "epoch": 3276} {"train_loss": -25.154447555541992, "global_step": 271980, "epoch": 3276} {"train_loss": -24.846662521362305, "global_step": 271981, "epoch": 3276} {"train_loss": -25.4182186126709, "global_step": 271982, "epoch": 3276} {"train_loss": -25.488794326782227, "global_step": 271983, "epoch": 3276} {"train_loss": -25.20115089416504, "global_step": 271984, "epoch": 3276} {"train_loss": -25.475759506225586, "global_step": 271985, "epoch": 3276} {"train_loss": -25.403079986572266, "global_step": 271986, "epoch": 3276} {"train_loss": -25.72464370727539, "global_step": 271987, "epoch": 3276} {"train_loss": -25.364078521728516, "global_step": 271988, "epoch": 3276} {"train_loss": -25.27515983581543, "global_step": 271989, "epoch": 3276} {"train_loss": -25.19911747668163, "global_step": 271990, "epoch": 3276, "val_loss": 6970813.0} {"train_loss": -24.331228256225586, "global_step": 271991, "epoch": 3277} {"train_loss": -24.499332427978516, "global_step": 271992, "epoch": 3277} {"train_loss": -25.018049240112305, "global_step": 271993, "epoch": 3277} {"train_loss": -24.43550682067871, "global_step": 271994, "epoch": 3277} {"train_loss": -25.085580825805664, "global_step": 271995, "epoch": 3277} {"train_loss": -24.525304794311523, "global_step": 271996, "epoch": 3277} {"train_loss": -25.035932540893555, "global_step": 271997, "epoch": 3277} {"train_loss": -25.022058486938477, "global_step": 271998, "epoch": 3277} {"train_loss": -25.5760555267334, "global_step": 271999, "epoch": 3277} {"train_loss": -24.983530044555664, "global_step": 272000, "epoch": 3277} {"train_loss": -24.850629806518555, "global_step": 272001, "epoch": 3277} {"train_loss": -25.43721580505371, "global_step": 272002, "epoch": 3277} {"train_loss": -25.217161178588867, "global_step": 272003, "epoch": 3277} {"train_loss": -25.191518783569336, "global_step": 272004, "epoch": 3277} {"train_loss": -25.069311141967773, "global_step": 272005, "epoch": 3277} {"train_loss": -25.085336685180664, "global_step": 272006, "epoch": 3277} {"train_loss": -24.97608757019043, "global_step": 272007, "epoch": 3277} {"train_loss": -25.296539306640625, "global_step": 272008, "epoch": 3277} {"train_loss": -25.148578643798828, "global_step": 272009, "epoch": 3277} {"train_loss": -25.106475830078125, "global_step": 272010, "epoch": 3277} {"train_loss": -24.932565689086914, "global_step": 272011, "epoch": 3277} {"train_loss": -25.532089233398438, "global_step": 272012, "epoch": 3277} {"train_loss": -25.48568344116211, "global_step": 272013, "epoch": 3277} {"train_loss": -24.99324607849121, "global_step": 272014, "epoch": 3277} {"train_loss": -25.18800926208496, "global_step": 272015, "epoch": 3277} {"train_loss": -25.303436279296875, "global_step": 272016, "epoch": 3277} {"train_loss": -25.465978622436523, "global_step": 272017, "epoch": 3277} {"train_loss": -24.901432037353516, "global_step": 272018, "epoch": 3277} {"train_loss": -25.24238395690918, "global_step": 272019, "epoch": 3277} {"train_loss": -25.257413864135742, "global_step": 272020, "epoch": 3277} {"train_loss": -25.21450424194336, "global_step": 272021, "epoch": 3277} {"train_loss": -24.854860305786133, "global_step": 272022, "epoch": 3277} {"train_loss": -25.46993064880371, "global_step": 272023, "epoch": 3277} {"train_loss": -25.37872314453125, "global_step": 272024, "epoch": 3277} {"train_loss": -25.46320915222168, "global_step": 272025, "epoch": 3277} {"train_loss": -25.292646408081055, "global_step": 272026, "epoch": 3277} {"train_loss": -25.397647857666016, "global_step": 272027, "epoch": 3277} {"train_loss": -25.494115829467773, "global_step": 272028, "epoch": 3277} {"train_loss": -25.09918212890625, "global_step": 272029, "epoch": 3277} {"train_loss": -25.326078414916992, "global_step": 272030, "epoch": 3277} {"train_loss": -25.17193603515625, "global_step": 272031, "epoch": 3277} {"train_loss": -25.216909408569336, "global_step": 272032, "epoch": 3277} {"train_loss": -25.171396255493164, "global_step": 272033, "epoch": 3277} {"train_loss": -25.355581283569336, "global_step": 272034, "epoch": 3277} {"train_loss": -25.203052520751953, "global_step": 272035, "epoch": 3277} {"train_loss": -25.40972137451172, "global_step": 272036, "epoch": 3277} {"train_loss": -25.504011154174805, "global_step": 272037, "epoch": 3277} {"train_loss": -25.142684936523438, "global_step": 272038, "epoch": 3277} {"train_loss": -25.580591201782227, "global_step": 272039, "epoch": 3277} {"train_loss": -25.495826721191406, "global_step": 272040, "epoch": 3277} {"train_loss": -25.586191177368164, "global_step": 272041, "epoch": 3277} {"train_loss": -25.53974723815918, "global_step": 272042, "epoch": 3277} {"train_loss": -25.475008010864258, "global_step": 272043, "epoch": 3277} {"train_loss": -25.28083610534668, "global_step": 272044, "epoch": 3277} {"train_loss": -25.199594497680664, "global_step": 272045, "epoch": 3277} {"train_loss": -25.25356101989746, "global_step": 272046, "epoch": 3277} {"train_loss": -25.15176010131836, "global_step": 272047, "epoch": 3277} {"train_loss": -24.868682861328125, "global_step": 272048, "epoch": 3277} {"train_loss": -25.24393653869629, "global_step": 272049, "epoch": 3277} {"train_loss": -25.102338790893555, "global_step": 272050, "epoch": 3277} {"train_loss": -25.43532371520996, "global_step": 272051, "epoch": 3277} {"train_loss": -25.032535552978516, "global_step": 272052, "epoch": 3277} {"train_loss": -25.068660736083984, "global_step": 272053, "epoch": 3277} {"train_loss": -25.59998893737793, "global_step": 272054, "epoch": 3277} {"train_loss": -25.357391357421875, "global_step": 272055, "epoch": 3277} {"train_loss": -25.399824142456055, "global_step": 272056, "epoch": 3277} {"train_loss": -25.49662208557129, "global_step": 272057, "epoch": 3277} {"train_loss": -25.26146697998047, "global_step": 272058, "epoch": 3277} {"train_loss": -25.252714157104492, "global_step": 272059, "epoch": 3277} {"train_loss": -24.949979782104492, "global_step": 272060, "epoch": 3277} {"train_loss": -25.413837432861328, "global_step": 272061, "epoch": 3277} {"train_loss": -25.06178092956543, "global_step": 272062, "epoch": 3277} {"train_loss": -25.498430252075195, "global_step": 272063, "epoch": 3277} {"train_loss": -25.560407638549805, "global_step": 272064, "epoch": 3277} {"train_loss": -25.384492874145508, "global_step": 272065, "epoch": 3277} {"train_loss": -25.614103317260742, "global_step": 272066, "epoch": 3277} {"train_loss": -25.33279037475586, "global_step": 272067, "epoch": 3277} {"train_loss": -25.365938186645508, "global_step": 272068, "epoch": 3277} {"train_loss": -25.476093292236328, "global_step": 272069, "epoch": 3277} {"train_loss": -25.16936492919922, "global_step": 272070, "epoch": 3277} {"train_loss": -25.264150619506836, "global_step": 272071, "epoch": 3277} {"train_loss": -25.338125228881836, "global_step": 272072, "epoch": 3277} {"train_loss": -25.225430936698455, "global_step": 272073, "epoch": 3277, "val_loss": 6979651.5} {"train_loss": -25.140745162963867, "global_step": 272074, "epoch": 3278} {"train_loss": -25.084659576416016, "global_step": 272075, "epoch": 3278} {"train_loss": -24.808120727539062, "global_step": 272076, "epoch": 3278} {"train_loss": -25.00249671936035, "global_step": 272077, "epoch": 3278} {"train_loss": -25.376705169677734, "global_step": 272078, "epoch": 3278} {"train_loss": -24.84842872619629, "global_step": 272079, "epoch": 3278} {"train_loss": -24.774641036987305, "global_step": 272080, "epoch": 3278} {"train_loss": -25.249250411987305, "global_step": 272081, "epoch": 3278} {"train_loss": -25.652219772338867, "global_step": 272082, "epoch": 3278} {"train_loss": -25.084625244140625, "global_step": 272083, "epoch": 3278} {"train_loss": -25.10419464111328, "global_step": 272084, "epoch": 3278} {"train_loss": -24.954206466674805, "global_step": 272085, "epoch": 3278} {"train_loss": -24.888254165649414, "global_step": 272086, "epoch": 3278} {"train_loss": -25.233205795288086, "global_step": 272087, "epoch": 3278} {"train_loss": -25.210094451904297, "global_step": 272088, "epoch": 3278} {"train_loss": -25.079221725463867, "global_step": 272089, "epoch": 3278} {"train_loss": -25.088973999023438, "global_step": 272090, "epoch": 3278} {"train_loss": -25.184097290039062, "global_step": 272091, "epoch": 3278} {"train_loss": -25.20734214782715, "global_step": 272092, "epoch": 3278} {"train_loss": -25.39155387878418, "global_step": 272093, "epoch": 3278} {"train_loss": -25.302589416503906, "global_step": 272094, "epoch": 3278} {"train_loss": -25.11255645751953, "global_step": 272095, "epoch": 3278} {"train_loss": -25.494794845581055, "global_step": 272096, "epoch": 3278} {"train_loss": -24.897994995117188, "global_step": 272097, "epoch": 3278} {"train_loss": -25.470794677734375, "global_step": 272098, "epoch": 3278} {"train_loss": -25.411651611328125, "global_step": 272099, "epoch": 3278} {"train_loss": -25.677213668823242, "global_step": 272100, "epoch": 3278} {"train_loss": -25.4228515625, "global_step": 272101, "epoch": 3278} {"train_loss": -25.203413009643555, "global_step": 272102, "epoch": 3278} {"train_loss": -25.5267333984375, "global_step": 272103, "epoch": 3278} {"train_loss": -25.614728927612305, "global_step": 272104, "epoch": 3278} {"train_loss": -25.315786361694336, "global_step": 272105, "epoch": 3278} {"train_loss": -25.389602661132812, "global_step": 272106, "epoch": 3278} {"train_loss": -25.079923629760742, "global_step": 272107, "epoch": 3278} {"train_loss": -25.143402099609375, "global_step": 272108, "epoch": 3278} {"train_loss": -25.114171981811523, "global_step": 272109, "epoch": 3278} {"train_loss": -25.637914657592773, "global_step": 272110, "epoch": 3278} {"train_loss": -25.727582931518555, "global_step": 272111, "epoch": 3278} {"train_loss": -25.15309715270996, "global_step": 272112, "epoch": 3278} {"train_loss": -25.1809139251709, "global_step": 272113, "epoch": 3278} {"train_loss": -25.755756378173828, "global_step": 272114, "epoch": 3278} {"train_loss": -25.448577880859375, "global_step": 272115, "epoch": 3278} {"train_loss": -25.557397842407227, "global_step": 272116, "epoch": 3278} {"train_loss": -25.53523826599121, "global_step": 272117, "epoch": 3278} {"train_loss": -25.49224281311035, "global_step": 272118, "epoch": 3278} {"train_loss": -25.36774253845215, "global_step": 272119, "epoch": 3278} {"train_loss": -25.504730224609375, "global_step": 272120, "epoch": 3278} {"train_loss": -25.388168334960938, "global_step": 272121, "epoch": 3278} {"train_loss": -25.40139389038086, "global_step": 272122, "epoch": 3278} {"train_loss": -25.465028762817383, "global_step": 272123, "epoch": 3278} {"train_loss": -25.5373477935791, "global_step": 272124, "epoch": 3278} {"train_loss": -25.392988204956055, "global_step": 272125, "epoch": 3278} {"train_loss": -25.467985153198242, "global_step": 272126, "epoch": 3278} {"train_loss": -25.546438217163086, "global_step": 272127, "epoch": 3278} {"train_loss": -25.499338150024414, "global_step": 272128, "epoch": 3278} {"train_loss": -25.041471481323242, "global_step": 272129, "epoch": 3278} {"train_loss": -25.638463973999023, "global_step": 272130, "epoch": 3278} {"train_loss": -25.51154899597168, "global_step": 272131, "epoch": 3278} {"train_loss": -25.077878952026367, "global_step": 272132, "epoch": 3278} {"train_loss": -25.521190643310547, "global_step": 272133, "epoch": 3278} {"train_loss": -25.14564323425293, "global_step": 272134, "epoch": 3278} {"train_loss": -25.57344627380371, "global_step": 272135, "epoch": 3278} {"train_loss": -25.36148452758789, "global_step": 272136, "epoch": 3278} {"train_loss": -25.2913761138916, "global_step": 272137, "epoch": 3278} {"train_loss": -25.338430404663086, "global_step": 272138, "epoch": 3278} {"train_loss": -25.258642196655273, "global_step": 272139, "epoch": 3278} {"train_loss": -25.578502655029297, "global_step": 272140, "epoch": 3278} {"train_loss": -24.912778854370117, "global_step": 272141, "epoch": 3278} {"train_loss": -24.671701431274414, "global_step": 272142, "epoch": 3278} {"train_loss": -24.034732818603516, "global_step": 272143, "epoch": 3278} {"train_loss": -23.235340118408203, "global_step": 272144, "epoch": 3278} {"train_loss": -23.249940872192383, "global_step": 272145, "epoch": 3278} {"train_loss": -24.645748138427734, "global_step": 272146, "epoch": 3278} {"train_loss": -24.327573776245117, "global_step": 272147, "epoch": 3278} {"train_loss": -24.510807037353516, "global_step": 272148, "epoch": 3278} {"train_loss": -24.383207321166992, "global_step": 272149, "epoch": 3278} {"train_loss": -24.777362823486328, "global_step": 272150, "epoch": 3278} {"train_loss": -24.692155838012695, "global_step": 272151, "epoch": 3278} {"train_loss": -25.137434005737305, "global_step": 272152, "epoch": 3278} {"train_loss": -24.493833541870117, "global_step": 272153, "epoch": 3278} {"train_loss": -24.78012466430664, "global_step": 272154, "epoch": 3278} {"train_loss": -24.625167846679688, "global_step": 272155, "epoch": 3278} {"train_loss": -25.168450527880566, "global_step": 272156, "epoch": 3278, "val_loss": 6877821.0} {"train_loss": -23.649127960205078, "global_step": 272157, "epoch": 3279} {"train_loss": -23.784027099609375, "global_step": 272158, "epoch": 3279} {"train_loss": -25.029874801635742, "global_step": 272159, "epoch": 3279} {"train_loss": -23.9759464263916, "global_step": 272160, "epoch": 3279} {"train_loss": -24.425764083862305, "global_step": 272161, "epoch": 3279} {"train_loss": -24.61773681640625, "global_step": 272162, "epoch": 3279} {"train_loss": -24.484786987304688, "global_step": 272163, "epoch": 3279} {"train_loss": -24.431888580322266, "global_step": 272164, "epoch": 3279} {"train_loss": -24.33199691772461, "global_step": 272165, "epoch": 3279} {"train_loss": -24.754138946533203, "global_step": 272166, "epoch": 3279} {"train_loss": -24.675251007080078, "global_step": 272167, "epoch": 3279} {"train_loss": -24.713396072387695, "global_step": 272168, "epoch": 3279} {"train_loss": -24.515853881835938, "global_step": 272169, "epoch": 3279} {"train_loss": -25.216506958007812, "global_step": 272170, "epoch": 3279} {"train_loss": -24.967466354370117, "global_step": 272171, "epoch": 3279} {"train_loss": -25.043073654174805, "global_step": 272172, "epoch": 3279} {"train_loss": -24.989145278930664, "global_step": 272173, "epoch": 3279} {"train_loss": -24.893341064453125, "global_step": 272174, "epoch": 3279} {"train_loss": -25.135900497436523, "global_step": 272175, "epoch": 3279} {"train_loss": -25.121244430541992, "global_step": 272176, "epoch": 3279} {"train_loss": -24.71053123474121, "global_step": 272177, "epoch": 3279} {"train_loss": -24.91388511657715, "global_step": 272178, "epoch": 3279} {"train_loss": -25.202173233032227, "global_step": 272179, "epoch": 3279} {"train_loss": -25.266845703125, "global_step": 272180, "epoch": 3279} {"train_loss": -25.09101676940918, "global_step": 272181, "epoch": 3279} {"train_loss": -25.297868728637695, "global_step": 272182, "epoch": 3279} {"train_loss": -25.33216667175293, "global_step": 272183, "epoch": 3279} {"train_loss": -24.91644859313965, "global_step": 272184, "epoch": 3279} {"train_loss": -25.331323623657227, "global_step": 272185, "epoch": 3279} {"train_loss": -24.983760833740234, "global_step": 272186, "epoch": 3279} {"train_loss": -24.757999420166016, "global_step": 272187, "epoch": 3279} {"train_loss": -25.134336471557617, "global_step": 272188, "epoch": 3279} {"train_loss": -25.042251586914062, "global_step": 272189, "epoch": 3279} {"train_loss": -25.10112762451172, "global_step": 272190, "epoch": 3279} {"train_loss": -25.43775749206543, "global_step": 272191, "epoch": 3279} {"train_loss": -25.36709976196289, "global_step": 272192, "epoch": 3279} {"train_loss": -25.27280616760254, "global_step": 272193, "epoch": 3279} {"train_loss": -25.32989501953125, "global_step": 272194, "epoch": 3279} {"train_loss": -25.552188873291016, "global_step": 272195, "epoch": 3279} {"train_loss": -25.527984619140625, "global_step": 272196, "epoch": 3279} {"train_loss": -25.226064682006836, "global_step": 272197, "epoch": 3279} {"train_loss": -25.551982879638672, "global_step": 272198, "epoch": 3279} {"train_loss": -25.14085578918457, "global_step": 272199, "epoch": 3279} {"train_loss": -25.267303466796875, "global_step": 272200, "epoch": 3279} {"train_loss": -25.76630210876465, "global_step": 272201, "epoch": 3279} {"train_loss": -25.31861686706543, "global_step": 272202, "epoch": 3279} {"train_loss": -25.605854034423828, "global_step": 272203, "epoch": 3279} {"train_loss": -25.211095809936523, "global_step": 272204, "epoch": 3279} {"train_loss": -25.493810653686523, "global_step": 272205, "epoch": 3279} {"train_loss": -25.32625389099121, "global_step": 272206, "epoch": 3279} {"train_loss": -25.388593673706055, "global_step": 272207, "epoch": 3279} {"train_loss": -25.41994285583496, "global_step": 272208, "epoch": 3279} {"train_loss": -25.583372116088867, "global_step": 272209, "epoch": 3279} {"train_loss": -25.097673416137695, "global_step": 272210, "epoch": 3279} {"train_loss": -25.4954833984375, "global_step": 272211, "epoch": 3279} {"train_loss": -25.334043502807617, "global_step": 272212, "epoch": 3279} {"train_loss": -25.11586570739746, "global_step": 272213, "epoch": 3279} {"train_loss": -25.309865951538086, "global_step": 272214, "epoch": 3279} {"train_loss": -24.915403366088867, "global_step": 272215, "epoch": 3279} {"train_loss": -25.052459716796875, "global_step": 272216, "epoch": 3279} {"train_loss": -25.03370475769043, "global_step": 272217, "epoch": 3279} {"train_loss": -25.05536460876465, "global_step": 272218, "epoch": 3279} {"train_loss": -24.98795509338379, "global_step": 272219, "epoch": 3279} {"train_loss": -25.169187545776367, "global_step": 272220, "epoch": 3279} {"train_loss": -25.547121047973633, "global_step": 272221, "epoch": 3279} {"train_loss": -25.240299224853516, "global_step": 272222, "epoch": 3279} {"train_loss": -25.431926727294922, "global_step": 272223, "epoch": 3279} {"train_loss": -24.919723510742188, "global_step": 272224, "epoch": 3279} {"train_loss": -25.22957420349121, "global_step": 272225, "epoch": 3279} {"train_loss": -25.23279571533203, "global_step": 272226, "epoch": 3279} {"train_loss": -25.60040855407715, "global_step": 272227, "epoch": 3279} {"train_loss": -25.139101028442383, "global_step": 272228, "epoch": 3279} {"train_loss": -25.271635055541992, "global_step": 272229, "epoch": 3279} {"train_loss": -25.232379913330078, "global_step": 272230, "epoch": 3279} {"train_loss": -25.797582626342773, "global_step": 272231, "epoch": 3279} {"train_loss": -24.833377838134766, "global_step": 272232, "epoch": 3279} {"train_loss": -25.639318466186523, "global_step": 272233, "epoch": 3279} {"train_loss": -25.37110710144043, "global_step": 272234, "epoch": 3279} {"train_loss": -25.097314834594727, "global_step": 272235, "epoch": 3279} {"train_loss": -25.20157241821289, "global_step": 272236, "epoch": 3279} {"train_loss": -25.322555541992188, "global_step": 272237, "epoch": 3279} {"train_loss": -25.201078414916992, "global_step": 272238, "epoch": 3279} {"train_loss": -25.110400165419982, "global_step": 272239, "epoch": 3279, "val_loss": 7017889.0} {"train_loss": -25.13132667541504, "global_step": 272240, "epoch": 3280} {"train_loss": -24.271987915039062, "global_step": 272241, "epoch": 3280} {"train_loss": -25.061695098876953, "global_step": 272242, "epoch": 3280} {"train_loss": -25.327627182006836, "global_step": 272243, "epoch": 3280} {"train_loss": -24.856298446655273, "global_step": 272244, "epoch": 3280} {"train_loss": -25.05735206604004, "global_step": 272245, "epoch": 3280} {"train_loss": -24.806224822998047, "global_step": 272246, "epoch": 3280} {"train_loss": -25.093000411987305, "global_step": 272247, "epoch": 3280} {"train_loss": -24.910961151123047, "global_step": 272248, "epoch": 3280} {"train_loss": -24.993484497070312, "global_step": 272249, "epoch": 3280} {"train_loss": -24.668006896972656, "global_step": 272250, "epoch": 3280} {"train_loss": -25.08662986755371, "global_step": 272251, "epoch": 3280} {"train_loss": -25.2390193939209, "global_step": 272252, "epoch": 3280} {"train_loss": -24.984695434570312, "global_step": 272253, "epoch": 3280} {"train_loss": -25.227876663208008, "global_step": 272254, "epoch": 3280} {"train_loss": -25.080703735351562, "global_step": 272255, "epoch": 3280} {"train_loss": -25.001977920532227, "global_step": 272256, "epoch": 3280} {"train_loss": -25.4033203125, "global_step": 272257, "epoch": 3280} {"train_loss": -24.97285270690918, "global_step": 272258, "epoch": 3280} {"train_loss": -25.237058639526367, "global_step": 272259, "epoch": 3280} {"train_loss": -25.291431427001953, "global_step": 272260, "epoch": 3280} {"train_loss": -25.442262649536133, "global_step": 272261, "epoch": 3280} {"train_loss": -25.36573600769043, "global_step": 272262, "epoch": 3280} {"train_loss": -25.508941650390625, "global_step": 272263, "epoch": 3280} {"train_loss": -25.526443481445312, "global_step": 272264, "epoch": 3280} {"train_loss": -25.539306640625, "global_step": 272265, "epoch": 3280} {"train_loss": -25.359159469604492, "global_step": 272266, "epoch": 3280} {"train_loss": -25.584264755249023, "global_step": 272267, "epoch": 3280} {"train_loss": -25.22809410095215, "global_step": 272268, "epoch": 3280} {"train_loss": -25.275480270385742, "global_step": 272269, "epoch": 3280} {"train_loss": -25.63985252380371, "global_step": 272270, "epoch": 3280} {"train_loss": -25.453603744506836, "global_step": 272271, "epoch": 3280} {"train_loss": -25.402990341186523, "global_step": 272272, "epoch": 3280} {"train_loss": -25.401655197143555, "global_step": 272273, "epoch": 3280} {"train_loss": -25.441465377807617, "global_step": 272274, "epoch": 3280} {"train_loss": -25.55403709411621, "global_step": 272275, "epoch": 3280} {"train_loss": -25.675867080688477, "global_step": 272276, "epoch": 3280} {"train_loss": -25.79347038269043, "global_step": 272277, "epoch": 3280} {"train_loss": -25.371633529663086, "global_step": 272278, "epoch": 3280} {"train_loss": -25.58933448791504, "global_step": 272279, "epoch": 3280} {"train_loss": -25.077322006225586, "global_step": 272280, "epoch": 3280} {"train_loss": -25.478832244873047, "global_step": 272281, "epoch": 3280} {"train_loss": -25.25885581970215, "global_step": 272282, "epoch": 3280} {"train_loss": -25.136228561401367, "global_step": 272283, "epoch": 3280} {"train_loss": -25.169904708862305, "global_step": 272284, "epoch": 3280} {"train_loss": -25.522764205932617, "global_step": 272285, "epoch": 3280} {"train_loss": -25.740589141845703, "global_step": 272286, "epoch": 3280} {"train_loss": -25.250202178955078, "global_step": 272287, "epoch": 3280} {"train_loss": -25.657812118530273, "global_step": 272288, "epoch": 3280} {"train_loss": -25.187101364135742, "global_step": 272289, "epoch": 3280} {"train_loss": -25.737512588500977, "global_step": 272290, "epoch": 3280} {"train_loss": -25.315156936645508, "global_step": 272291, "epoch": 3280} {"train_loss": -25.61809730529785, "global_step": 272292, "epoch": 3280} {"train_loss": -25.283239364624023, "global_step": 272293, "epoch": 3280} {"train_loss": -25.468015670776367, "global_step": 272294, "epoch": 3280} {"train_loss": -25.28823471069336, "global_step": 272295, "epoch": 3280} {"train_loss": -25.639678955078125, "global_step": 272296, "epoch": 3280} {"train_loss": -25.451507568359375, "global_step": 272297, "epoch": 3280} {"train_loss": -25.446495056152344, "global_step": 272298, "epoch": 3280} {"train_loss": -25.24257469177246, "global_step": 272299, "epoch": 3280} {"train_loss": -24.99686622619629, "global_step": 272300, "epoch": 3280} {"train_loss": -24.75577735900879, "global_step": 272301, "epoch": 3280} {"train_loss": -25.009735107421875, "global_step": 272302, "epoch": 3280} {"train_loss": -25.122541427612305, "global_step": 272303, "epoch": 3280} {"train_loss": -25.234609603881836, "global_step": 272304, "epoch": 3280} {"train_loss": -25.57155418395996, "global_step": 272305, "epoch": 3280} {"train_loss": -25.199674606323242, "global_step": 272306, "epoch": 3280} {"train_loss": -25.525867462158203, "global_step": 272307, "epoch": 3280} {"train_loss": -25.030635833740234, "global_step": 272308, "epoch": 3280} {"train_loss": -25.439350128173828, "global_step": 272309, "epoch": 3280} {"train_loss": -25.020627975463867, "global_step": 272310, "epoch": 3280} {"train_loss": -24.936227798461914, "global_step": 272311, "epoch": 3280} {"train_loss": -25.24822998046875, "global_step": 272312, "epoch": 3280} {"train_loss": -25.180875778198242, "global_step": 272313, "epoch": 3280} {"train_loss": -24.840734481811523, "global_step": 272314, "epoch": 3280} {"train_loss": -24.764259338378906, "global_step": 272315, "epoch": 3280} {"train_loss": -25.319034576416016, "global_step": 272316, "epoch": 3280} {"train_loss": -25.230560302734375, "global_step": 272317, "epoch": 3280} {"train_loss": -25.24150276184082, "global_step": 272318, "epoch": 3280} {"train_loss": -25.139318466186523, "global_step": 272319, "epoch": 3280} {"train_loss": -25.26202964782715, "global_step": 272320, "epoch": 3280} {"train_loss": -25.05462074279785, "global_step": 272321, "epoch": 3280} {"train_loss": -25.256766491625683, "global_step": 272322, "epoch": 3280, "val_loss": 7044103.0} {"train_loss": -24.99855613708496, "global_step": 272323, "epoch": 3281} {"train_loss": -25.34625816345215, "global_step": 272324, "epoch": 3281} {"train_loss": -24.99620819091797, "global_step": 272325, "epoch": 3281} {"train_loss": -24.705387115478516, "global_step": 272326, "epoch": 3281} {"train_loss": -25.229158401489258, "global_step": 272327, "epoch": 3281} {"train_loss": -25.272043228149414, "global_step": 272328, "epoch": 3281} {"train_loss": -24.909019470214844, "global_step": 272329, "epoch": 3281} {"train_loss": -25.598979949951172, "global_step": 272330, "epoch": 3281} {"train_loss": -25.21003532409668, "global_step": 272331, "epoch": 3281} {"train_loss": -25.2655086517334, "global_step": 272332, "epoch": 3281} {"train_loss": -25.17731285095215, "global_step": 272333, "epoch": 3281} {"train_loss": -25.790861129760742, "global_step": 272334, "epoch": 3281} {"train_loss": -25.360219955444336, "global_step": 272335, "epoch": 3281} {"train_loss": -25.378103256225586, "global_step": 272336, "epoch": 3281} {"train_loss": -25.320152282714844, "global_step": 272337, "epoch": 3281} {"train_loss": -25.38783073425293, "global_step": 272338, "epoch": 3281} {"train_loss": -25.009103775024414, "global_step": 272339, "epoch": 3281} {"train_loss": -25.21480369567871, "global_step": 272340, "epoch": 3281} {"train_loss": -25.299650192260742, "global_step": 272341, "epoch": 3281} {"train_loss": -25.54250144958496, "global_step": 272342, "epoch": 3281} {"train_loss": -25.08392333984375, "global_step": 272343, "epoch": 3281} {"train_loss": -25.26549530029297, "global_step": 272344, "epoch": 3281} {"train_loss": -25.412057876586914, "global_step": 272345, "epoch": 3281} {"train_loss": -25.262523651123047, "global_step": 272346, "epoch": 3281} {"train_loss": -25.254322052001953, "global_step": 272347, "epoch": 3281} {"train_loss": -25.139753341674805, "global_step": 272348, "epoch": 3281} {"train_loss": -24.934926986694336, "global_step": 272349, "epoch": 3281} {"train_loss": -25.093536376953125, "global_step": 272350, "epoch": 3281} {"train_loss": -25.181509017944336, "global_step": 272351, "epoch": 3281} {"train_loss": -25.408292770385742, "global_step": 272352, "epoch": 3281} {"train_loss": -25.271991729736328, "global_step": 272353, "epoch": 3281} {"train_loss": -25.135848999023438, "global_step": 272354, "epoch": 3281} {"train_loss": -25.23543357849121, "global_step": 272355, "epoch": 3281} {"train_loss": -25.194873809814453, "global_step": 272356, "epoch": 3281} {"train_loss": -25.086318969726562, "global_step": 272357, "epoch": 3281} {"train_loss": -25.146442413330078, "global_step": 272358, "epoch": 3281} {"train_loss": -25.497526168823242, "global_step": 272359, "epoch": 3281} {"train_loss": -25.700180053710938, "global_step": 272360, "epoch": 3281} {"train_loss": -25.48297119140625, "global_step": 272361, "epoch": 3281} {"train_loss": -25.401670455932617, "global_step": 272362, "epoch": 3281} {"train_loss": -25.51569175720215, "global_step": 272363, "epoch": 3281} {"train_loss": -25.82745361328125, "global_step": 272364, "epoch": 3281} {"train_loss": -25.299911499023438, "global_step": 272365, "epoch": 3281} {"train_loss": -25.366674423217773, "global_step": 272366, "epoch": 3281} {"train_loss": -25.000654220581055, "global_step": 272367, "epoch": 3281} {"train_loss": -24.900848388671875, "global_step": 272368, "epoch": 3281} {"train_loss": -25.203786849975586, "global_step": 272369, "epoch": 3281} {"train_loss": -25.371877670288086, "global_step": 272370, "epoch": 3281} {"train_loss": -25.394834518432617, "global_step": 272371, "epoch": 3281} {"train_loss": -25.673871994018555, "global_step": 272372, "epoch": 3281} {"train_loss": -25.33797264099121, "global_step": 272373, "epoch": 3281} {"train_loss": -25.52296257019043, "global_step": 272374, "epoch": 3281} {"train_loss": -25.214139938354492, "global_step": 272375, "epoch": 3281} {"train_loss": -25.152433395385742, "global_step": 272376, "epoch": 3281} {"train_loss": -25.5545654296875, "global_step": 272377, "epoch": 3281} {"train_loss": -25.160289764404297, "global_step": 272378, "epoch": 3281} {"train_loss": -25.40789222717285, "global_step": 272379, "epoch": 3281} {"train_loss": -25.214523315429688, "global_step": 272380, "epoch": 3281} {"train_loss": -25.268476486206055, "global_step": 272381, "epoch": 3281} {"train_loss": -25.297624588012695, "global_step": 272382, "epoch": 3281} {"train_loss": -25.561880111694336, "global_step": 272383, "epoch": 3281} {"train_loss": -25.218896865844727, "global_step": 272384, "epoch": 3281} {"train_loss": -25.625242233276367, "global_step": 272385, "epoch": 3281} {"train_loss": -25.39118003845215, "global_step": 272386, "epoch": 3281} {"train_loss": -25.452224731445312, "global_step": 272387, "epoch": 3281} {"train_loss": -25.346235275268555, "global_step": 272388, "epoch": 3281} {"train_loss": -25.20145034790039, "global_step": 272389, "epoch": 3281} {"train_loss": -25.64166831970215, "global_step": 272390, "epoch": 3281} {"train_loss": -25.486066818237305, "global_step": 272391, "epoch": 3281} {"train_loss": -25.099149703979492, "global_step": 272392, "epoch": 3281} {"train_loss": -25.339982986450195, "global_step": 272393, "epoch": 3281} {"train_loss": -25.234928131103516, "global_step": 272394, "epoch": 3281} {"train_loss": -25.606184005737305, "global_step": 272395, "epoch": 3281} {"train_loss": -25.32655906677246, "global_step": 272396, "epoch": 3281} {"train_loss": -25.744312286376953, "global_step": 272397, "epoch": 3281} {"train_loss": -25.450437545776367, "global_step": 272398, "epoch": 3281} {"train_loss": -25.52470588684082, "global_step": 272399, "epoch": 3281} {"train_loss": -25.198951721191406, "global_step": 272400, "epoch": 3281} {"train_loss": -25.55503273010254, "global_step": 272401, "epoch": 3281} {"train_loss": -25.540241241455078, "global_step": 272402, "epoch": 3281} {"train_loss": -25.5045166015625, "global_step": 272403, "epoch": 3281} {"train_loss": -25.66607093811035, "global_step": 272404, "epoch": 3281} {"train_loss": -25.320077275655354, "global_step": 272405, "epoch": 3281, "val_loss": 7073620.0} {"train_loss": -24.710250854492188, "global_step": 272406, "epoch": 3282} {"train_loss": -25.190052032470703, "global_step": 272407, "epoch": 3282} {"train_loss": -24.86079978942871, "global_step": 272408, "epoch": 3282} {"train_loss": -25.43682861328125, "global_step": 272409, "epoch": 3282} {"train_loss": -25.115873336791992, "global_step": 272410, "epoch": 3282} {"train_loss": -25.073501586914062, "global_step": 272411, "epoch": 3282} {"train_loss": -25.70069694519043, "global_step": 272412, "epoch": 3282} {"train_loss": -25.183637619018555, "global_step": 272413, "epoch": 3282} {"train_loss": -25.033903121948242, "global_step": 272414, "epoch": 3282} {"train_loss": -24.787546157836914, "global_step": 272415, "epoch": 3282} {"train_loss": -24.668319702148438, "global_step": 272416, "epoch": 3282} {"train_loss": -24.918258666992188, "global_step": 272417, "epoch": 3282} {"train_loss": -25.129270553588867, "global_step": 272418, "epoch": 3282} {"train_loss": -24.892553329467773, "global_step": 272419, "epoch": 3282} {"train_loss": -24.972885131835938, "global_step": 272420, "epoch": 3282} {"train_loss": -24.95052719116211, "global_step": 272421, "epoch": 3282} {"train_loss": -25.17584991455078, "global_step": 272422, "epoch": 3282} {"train_loss": -24.78571319580078, "global_step": 272423, "epoch": 3282} {"train_loss": -24.956403732299805, "global_step": 272424, "epoch": 3282} {"train_loss": -25.148300170898438, "global_step": 272425, "epoch": 3282} {"train_loss": -25.213197708129883, "global_step": 272426, "epoch": 3282} {"train_loss": -25.139917373657227, "global_step": 272427, "epoch": 3282} {"train_loss": -25.4832763671875, "global_step": 272428, "epoch": 3282} {"train_loss": -24.904930114746094, "global_step": 272429, "epoch": 3282} {"train_loss": -25.544790267944336, "global_step": 272430, "epoch": 3282} {"train_loss": -25.543792724609375, "global_step": 272431, "epoch": 3282} {"train_loss": -25.41188621520996, "global_step": 272432, "epoch": 3282} {"train_loss": -25.337970733642578, "global_step": 272433, "epoch": 3282} {"train_loss": -25.457265853881836, "global_step": 272434, "epoch": 3282} {"train_loss": -25.19488525390625, "global_step": 272435, "epoch": 3282} {"train_loss": -25.23235511779785, "global_step": 272436, "epoch": 3282} {"train_loss": -25.136281967163086, "global_step": 272437, "epoch": 3282} {"train_loss": -25.118680953979492, "global_step": 272438, "epoch": 3282} {"train_loss": -25.59046173095703, "global_step": 272439, "epoch": 3282} {"train_loss": -25.4163818359375, "global_step": 272440, "epoch": 3282} {"train_loss": -25.226774215698242, "global_step": 272441, "epoch": 3282} {"train_loss": -25.039209365844727, "global_step": 272442, "epoch": 3282} {"train_loss": -24.999868392944336, "global_step": 272443, "epoch": 3282} {"train_loss": -25.67868423461914, "global_step": 272444, "epoch": 3282} {"train_loss": -25.589237213134766, "global_step": 272445, "epoch": 3282} {"train_loss": -25.67856788635254, "global_step": 272446, "epoch": 3282} {"train_loss": -25.3089656829834, "global_step": 272447, "epoch": 3282} {"train_loss": -25.553625106811523, "global_step": 272448, "epoch": 3282} {"train_loss": -25.388092041015625, "global_step": 272449, "epoch": 3282} {"train_loss": -25.49629020690918, "global_step": 272450, "epoch": 3282} {"train_loss": -25.476865768432617, "global_step": 272451, "epoch": 3282} {"train_loss": -25.494802474975586, "global_step": 272452, "epoch": 3282} {"train_loss": -25.32753562927246, "global_step": 272453, "epoch": 3282} {"train_loss": -25.780790328979492, "global_step": 272454, "epoch": 3282} {"train_loss": -25.44439697265625, "global_step": 272455, "epoch": 3282} {"train_loss": -25.832855224609375, "global_step": 272456, "epoch": 3282} {"train_loss": -25.760190963745117, "global_step": 272457, "epoch": 3282} {"train_loss": -25.362573623657227, "global_step": 272458, "epoch": 3282} {"train_loss": -25.512615203857422, "global_step": 272459, "epoch": 3282} {"train_loss": -25.4576473236084, "global_step": 272460, "epoch": 3282} {"train_loss": -25.551382064819336, "global_step": 272461, "epoch": 3282} {"train_loss": -25.67792320251465, "global_step": 272462, "epoch": 3282} {"train_loss": -25.264204025268555, "global_step": 272463, "epoch": 3282} {"train_loss": -24.99283790588379, "global_step": 272464, "epoch": 3282} {"train_loss": -25.383935928344727, "global_step": 272465, "epoch": 3282} {"train_loss": -25.573816299438477, "global_step": 272466, "epoch": 3282} {"train_loss": -25.235502243041992, "global_step": 272467, "epoch": 3282} {"train_loss": -25.071828842163086, "global_step": 272468, "epoch": 3282} {"train_loss": -24.986623764038086, "global_step": 272469, "epoch": 3282} {"train_loss": -25.351606369018555, "global_step": 272470, "epoch": 3282} {"train_loss": -25.3829402923584, "global_step": 272471, "epoch": 3282} {"train_loss": -25.051502227783203, "global_step": 272472, "epoch": 3282} {"train_loss": -25.47930335998535, "global_step": 272473, "epoch": 3282} {"train_loss": -25.057117462158203, "global_step": 272474, "epoch": 3282} {"train_loss": -25.6275634765625, "global_step": 272475, "epoch": 3282} {"train_loss": -25.249008178710938, "global_step": 272476, "epoch": 3282} {"train_loss": -25.005029678344727, "global_step": 272477, "epoch": 3282} {"train_loss": -25.281713485717773, "global_step": 272478, "epoch": 3282} {"train_loss": -25.179370880126953, "global_step": 272479, "epoch": 3282} {"train_loss": -25.16328239440918, "global_step": 272480, "epoch": 3282} {"train_loss": -25.201749801635742, "global_step": 272481, "epoch": 3282} {"train_loss": -25.352872848510742, "global_step": 272482, "epoch": 3282} {"train_loss": -24.919422149658203, "global_step": 272483, "epoch": 3282} {"train_loss": -24.95969581604004, "global_step": 272484, "epoch": 3282} {"train_loss": -25.188047409057617, "global_step": 272485, "epoch": 3282} {"train_loss": -24.431379318237305, "global_step": 272486, "epoch": 3282} {"train_loss": -25.02374839782715, "global_step": 272487, "epoch": 3282} {"train_loss": -25.245172569550665, "global_step": 272488, "epoch": 3282, "val_loss": 7148284.0} {"train_loss": -24.90355682373047, "global_step": 272489, "epoch": 3283} {"train_loss": -24.86185073852539, "global_step": 272490, "epoch": 3283} {"train_loss": -24.791624069213867, "global_step": 272491, "epoch": 3283} {"train_loss": -24.883163452148438, "global_step": 272492, "epoch": 3283} {"train_loss": -24.82849884033203, "global_step": 272493, "epoch": 3283} {"train_loss": -24.712512969970703, "global_step": 272494, "epoch": 3283} {"train_loss": -24.967641830444336, "global_step": 272495, "epoch": 3283} {"train_loss": -24.754667282104492, "global_step": 272496, "epoch": 3283} {"train_loss": -25.171842575073242, "global_step": 272497, "epoch": 3283} {"train_loss": -25.105981826782227, "global_step": 272498, "epoch": 3283} {"train_loss": -25.118507385253906, "global_step": 272499, "epoch": 3283} {"train_loss": -25.117734909057617, "global_step": 272500, "epoch": 3283} {"train_loss": -24.978139877319336, "global_step": 272501, "epoch": 3283} {"train_loss": -25.196136474609375, "global_step": 272502, "epoch": 3283} {"train_loss": -24.868009567260742, "global_step": 272503, "epoch": 3283} {"train_loss": -25.102609634399414, "global_step": 272504, "epoch": 3283} {"train_loss": -25.40446662902832, "global_step": 272505, "epoch": 3283} {"train_loss": -25.082889556884766, "global_step": 272506, "epoch": 3283} {"train_loss": -25.310508728027344, "global_step": 272507, "epoch": 3283} {"train_loss": -25.41740608215332, "global_step": 272508, "epoch": 3283} {"train_loss": -24.877395629882812, "global_step": 272509, "epoch": 3283} {"train_loss": -25.05867576599121, "global_step": 272510, "epoch": 3283} {"train_loss": -25.09814453125, "global_step": 272511, "epoch": 3283} {"train_loss": -25.321918487548828, "global_step": 272512, "epoch": 3283} {"train_loss": -25.37852668762207, "global_step": 272513, "epoch": 3283} {"train_loss": -25.677276611328125, "global_step": 272514, "epoch": 3283} {"train_loss": -25.20209312438965, "global_step": 272515, "epoch": 3283} {"train_loss": -25.264850616455078, "global_step": 272516, "epoch": 3283} {"train_loss": -25.135839462280273, "global_step": 272517, "epoch": 3283} {"train_loss": -25.371957778930664, "global_step": 272518, "epoch": 3283} {"train_loss": -25.241811752319336, "global_step": 272519, "epoch": 3283} {"train_loss": -25.32780647277832, "global_step": 272520, "epoch": 3283} {"train_loss": -25.479080200195312, "global_step": 272521, "epoch": 3283} {"train_loss": -25.41525650024414, "global_step": 272522, "epoch": 3283} {"train_loss": -25.720163345336914, "global_step": 272523, "epoch": 3283} {"train_loss": -25.48297691345215, "global_step": 272524, "epoch": 3283} {"train_loss": -25.139299392700195, "global_step": 272525, "epoch": 3283} {"train_loss": -25.16090965270996, "global_step": 272526, "epoch": 3283} {"train_loss": -25.338504791259766, "global_step": 272527, "epoch": 3283} {"train_loss": -25.459575653076172, "global_step": 272528, "epoch": 3283} {"train_loss": -25.47482681274414, "global_step": 272529, "epoch": 3283} {"train_loss": -25.34934425354004, "global_step": 272530, "epoch": 3283} {"train_loss": -25.21074867248535, "global_step": 272531, "epoch": 3283} {"train_loss": -25.140121459960938, "global_step": 272532, "epoch": 3283} {"train_loss": -25.4226131439209, "global_step": 272533, "epoch": 3283} {"train_loss": -25.187774658203125, "global_step": 272534, "epoch": 3283} {"train_loss": -25.33646011352539, "global_step": 272535, "epoch": 3283} {"train_loss": -25.32634925842285, "global_step": 272536, "epoch": 3283} {"train_loss": -25.092355728149414, "global_step": 272537, "epoch": 3283} {"train_loss": -25.301218032836914, "global_step": 272538, "epoch": 3283} {"train_loss": -25.44837188720703, "global_step": 272539, "epoch": 3283} {"train_loss": -25.709415435791016, "global_step": 272540, "epoch": 3283} {"train_loss": -25.651901245117188, "global_step": 272541, "epoch": 3283} {"train_loss": -25.607074737548828, "global_step": 272542, "epoch": 3283} {"train_loss": -24.84504508972168, "global_step": 272543, "epoch": 3283} {"train_loss": -25.41416358947754, "global_step": 272544, "epoch": 3283} {"train_loss": -24.959074020385742, "global_step": 272545, "epoch": 3283} {"train_loss": -25.702802658081055, "global_step": 272546, "epoch": 3283} {"train_loss": -25.374549865722656, "global_step": 272547, "epoch": 3283} {"train_loss": -25.445415496826172, "global_step": 272548, "epoch": 3283} {"train_loss": -25.497112274169922, "global_step": 272549, "epoch": 3283} {"train_loss": -25.3817195892334, "global_step": 272550, "epoch": 3283} {"train_loss": -25.450115203857422, "global_step": 272551, "epoch": 3283} {"train_loss": -25.183122634887695, "global_step": 272552, "epoch": 3283} {"train_loss": -25.47810935974121, "global_step": 272553, "epoch": 3283} {"train_loss": -25.27863883972168, "global_step": 272554, "epoch": 3283} {"train_loss": -25.505170822143555, "global_step": 272555, "epoch": 3283} {"train_loss": -25.521915435791016, "global_step": 272556, "epoch": 3283} {"train_loss": -25.277463912963867, "global_step": 272557, "epoch": 3283} {"train_loss": -25.115026473999023, "global_step": 272558, "epoch": 3283} {"train_loss": -24.997739791870117, "global_step": 272559, "epoch": 3283} {"train_loss": -25.09813690185547, "global_step": 272560, "epoch": 3283} {"train_loss": -24.894807815551758, "global_step": 272561, "epoch": 3283} {"train_loss": -25.504318237304688, "global_step": 272562, "epoch": 3283} {"train_loss": -24.875036239624023, "global_step": 272563, "epoch": 3283} {"train_loss": -25.19866180419922, "global_step": 272564, "epoch": 3283} {"train_loss": -25.148313522338867, "global_step": 272565, "epoch": 3283} {"train_loss": -25.249114990234375, "global_step": 272566, "epoch": 3283} {"train_loss": -24.90365982055664, "global_step": 272567, "epoch": 3283} {"train_loss": -25.30248260498047, "global_step": 272568, "epoch": 3283} {"train_loss": -25.458654403686523, "global_step": 272569, "epoch": 3283} {"train_loss": -25.274072647094727, "global_step": 272570, "epoch": 3283} {"train_loss": -25.235762079078032, "global_step": 272571, "epoch": 3283, "val_loss": 7016008.0} {"train_loss": -25.500608444213867, "global_step": 272572, "epoch": 3284} {"train_loss": -24.639257431030273, "global_step": 272573, "epoch": 3284} {"train_loss": -25.14131736755371, "global_step": 272574, "epoch": 3284} {"train_loss": -25.443729400634766, "global_step": 272575, "epoch": 3284} {"train_loss": -24.995702743530273, "global_step": 272576, "epoch": 3284} {"train_loss": -24.555906295776367, "global_step": 272577, "epoch": 3284} {"train_loss": -25.228628158569336, "global_step": 272578, "epoch": 3284} {"train_loss": -25.246854782104492, "global_step": 272579, "epoch": 3284} {"train_loss": -24.856693267822266, "global_step": 272580, "epoch": 3284} {"train_loss": -24.844642639160156, "global_step": 272581, "epoch": 3284} {"train_loss": -24.96282958984375, "global_step": 272582, "epoch": 3284} {"train_loss": -25.46143913269043, "global_step": 272583, "epoch": 3284} {"train_loss": -24.701719284057617, "global_step": 272584, "epoch": 3284} {"train_loss": -24.93356704711914, "global_step": 272585, "epoch": 3284} {"train_loss": -24.837331771850586, "global_step": 272586, "epoch": 3284} {"train_loss": -25.23731803894043, "global_step": 272587, "epoch": 3284} {"train_loss": -25.06477165222168, "global_step": 272588, "epoch": 3284} {"train_loss": -24.91219139099121, "global_step": 272589, "epoch": 3284} {"train_loss": -25.310148239135742, "global_step": 272590, "epoch": 3284} {"train_loss": -24.948410034179688, "global_step": 272591, "epoch": 3284} {"train_loss": -25.036359786987305, "global_step": 272592, "epoch": 3284} {"train_loss": -25.12363624572754, "global_step": 272593, "epoch": 3284} {"train_loss": -24.595111846923828, "global_step": 272594, "epoch": 3284} {"train_loss": -25.13136100769043, "global_step": 272595, "epoch": 3284} {"train_loss": -25.401275634765625, "global_step": 272596, "epoch": 3284} {"train_loss": -25.09030532836914, "global_step": 272597, "epoch": 3284} {"train_loss": -25.32292366027832, "global_step": 272598, "epoch": 3284} {"train_loss": -24.862754821777344, "global_step": 272599, "epoch": 3284} {"train_loss": -25.19298553466797, "global_step": 272600, "epoch": 3284} {"train_loss": -25.07743263244629, "global_step": 272601, "epoch": 3284} {"train_loss": -25.230548858642578, "global_step": 272602, "epoch": 3284} {"train_loss": -24.897470474243164, "global_step": 272603, "epoch": 3284} {"train_loss": -25.727075576782227, "global_step": 272604, "epoch": 3284} {"train_loss": -25.008323669433594, "global_step": 272605, "epoch": 3284} {"train_loss": -25.070789337158203, "global_step": 272606, "epoch": 3284} {"train_loss": -25.26228904724121, "global_step": 272607, "epoch": 3284} {"train_loss": -25.336652755737305, "global_step": 272608, "epoch": 3284} {"train_loss": -25.3421688079834, "global_step": 272609, "epoch": 3284} {"train_loss": -25.006330490112305, "global_step": 272610, "epoch": 3284} {"train_loss": -24.9357852935791, "global_step": 272611, "epoch": 3284} {"train_loss": -25.36812400817871, "global_step": 272612, "epoch": 3284} {"train_loss": -25.358901977539062, "global_step": 272613, "epoch": 3284} {"train_loss": -25.19245147705078, "global_step": 272614, "epoch": 3284} {"train_loss": -24.96005630493164, "global_step": 272615, "epoch": 3284} {"train_loss": -25.6153507232666, "global_step": 272616, "epoch": 3284} {"train_loss": -25.945587158203125, "global_step": 272617, "epoch": 3284} {"train_loss": -25.658185958862305, "global_step": 272618, "epoch": 3284} {"train_loss": -25.09786033630371, "global_step": 272619, "epoch": 3284} {"train_loss": -25.461631774902344, "global_step": 272620, "epoch": 3284} {"train_loss": -25.33177947998047, "global_step": 272621, "epoch": 3284} {"train_loss": -25.61982536315918, "global_step": 272622, "epoch": 3284} {"train_loss": -25.259994506835938, "global_step": 272623, "epoch": 3284} {"train_loss": -25.421051025390625, "global_step": 272624, "epoch": 3284} {"train_loss": -25.6176815032959, "global_step": 272625, "epoch": 3284} {"train_loss": -25.413633346557617, "global_step": 272626, "epoch": 3284} {"train_loss": -25.301504135131836, "global_step": 272627, "epoch": 3284} {"train_loss": -25.54931640625, "global_step": 272628, "epoch": 3284} {"train_loss": -25.560895919799805, "global_step": 272629, "epoch": 3284} {"train_loss": -25.409042358398438, "global_step": 272630, "epoch": 3284} {"train_loss": -25.268054962158203, "global_step": 272631, "epoch": 3284} {"train_loss": -25.727075576782227, "global_step": 272632, "epoch": 3284} {"train_loss": -25.531734466552734, "global_step": 272633, "epoch": 3284} {"train_loss": -25.08268928527832, "global_step": 272634, "epoch": 3284} {"train_loss": -25.387908935546875, "global_step": 272635, "epoch": 3284} {"train_loss": -25.355310440063477, "global_step": 272636, "epoch": 3284} {"train_loss": -25.3459415435791, "global_step": 272637, "epoch": 3284} {"train_loss": -25.510807037353516, "global_step": 272638, "epoch": 3284} {"train_loss": -25.338932037353516, "global_step": 272639, "epoch": 3284} {"train_loss": -25.23770523071289, "global_step": 272640, "epoch": 3284} {"train_loss": -25.2443904876709, "global_step": 272641, "epoch": 3284} {"train_loss": -25.446754455566406, "global_step": 272642, "epoch": 3284} {"train_loss": -25.3970947265625, "global_step": 272643, "epoch": 3284} {"train_loss": -25.553943634033203, "global_step": 272644, "epoch": 3284} {"train_loss": -25.11905860900879, "global_step": 272645, "epoch": 3284} {"train_loss": -25.138219833374023, "global_step": 272646, "epoch": 3284} {"train_loss": -24.687604904174805, "global_step": 272647, "epoch": 3284} {"train_loss": -24.74721336364746, "global_step": 272648, "epoch": 3284} {"train_loss": -25.39053726196289, "global_step": 272649, "epoch": 3284} {"train_loss": -25.227758407592773, "global_step": 272650, "epoch": 3284} {"train_loss": -25.056427001953125, "global_step": 272651, "epoch": 3284} {"train_loss": -25.41267967224121, "global_step": 272652, "epoch": 3284} {"train_loss": -24.945310592651367, "global_step": 272653, "epoch": 3284} {"train_loss": -25.222750192665192, "global_step": 272654, "epoch": 3284, "val_loss": 6992010.0} {"train_loss": -24.83370018005371, "global_step": 272655, "epoch": 3285} {"train_loss": -24.953954696655273, "global_step": 272656, "epoch": 3285} {"train_loss": -24.26422691345215, "global_step": 272657, "epoch": 3285} {"train_loss": -24.363971710205078, "global_step": 272658, "epoch": 3285} {"train_loss": -24.614011764526367, "global_step": 272659, "epoch": 3285} {"train_loss": -24.512683868408203, "global_step": 272660, "epoch": 3285} {"train_loss": -24.813405990600586, "global_step": 272661, "epoch": 3285} {"train_loss": -24.79202651977539, "global_step": 272662, "epoch": 3285} {"train_loss": -24.593679428100586, "global_step": 272663, "epoch": 3285} {"train_loss": -25.584400177001953, "global_step": 272664, "epoch": 3285} {"train_loss": -24.57526206970215, "global_step": 272665, "epoch": 3285} {"train_loss": -24.78999137878418, "global_step": 272666, "epoch": 3285} {"train_loss": -25.077505111694336, "global_step": 272667, "epoch": 3285} {"train_loss": -25.174829483032227, "global_step": 272668, "epoch": 3285} {"train_loss": -24.68581199645996, "global_step": 272669, "epoch": 3285} {"train_loss": -25.318418502807617, "global_step": 272670, "epoch": 3285} {"train_loss": -25.339677810668945, "global_step": 272671, "epoch": 3285} {"train_loss": -24.952939987182617, "global_step": 272672, "epoch": 3285} {"train_loss": -25.033096313476562, "global_step": 272673, "epoch": 3285} {"train_loss": -25.009511947631836, "global_step": 272674, "epoch": 3285} {"train_loss": -25.00167465209961, "global_step": 272675, "epoch": 3285} {"train_loss": -25.294431686401367, "global_step": 272676, "epoch": 3285} {"train_loss": -25.16567039489746, "global_step": 272677, "epoch": 3285} {"train_loss": -25.01459503173828, "global_step": 272678, "epoch": 3285} {"train_loss": -25.06014060974121, "global_step": 272679, "epoch": 3285} {"train_loss": -25.448936462402344, "global_step": 272680, "epoch": 3285} {"train_loss": -25.217897415161133, "global_step": 272681, "epoch": 3285} {"train_loss": -25.23636245727539, "global_step": 272682, "epoch": 3285} {"train_loss": -25.53142547607422, "global_step": 272683, "epoch": 3285} {"train_loss": -25.19999122619629, "global_step": 272684, "epoch": 3285} {"train_loss": -25.437549591064453, "global_step": 272685, "epoch": 3285} {"train_loss": -25.21376609802246, "global_step": 272686, "epoch": 3285} {"train_loss": -25.216049194335938, "global_step": 272687, "epoch": 3285} {"train_loss": -25.329349517822266, "global_step": 272688, "epoch": 3285} {"train_loss": -25.236169815063477, "global_step": 272689, "epoch": 3285} {"train_loss": -25.320409774780273, "global_step": 272690, "epoch": 3285} {"train_loss": -25.635883331298828, "global_step": 272691, "epoch": 3285} {"train_loss": -25.454137802124023, "global_step": 272692, "epoch": 3285} {"train_loss": -25.479389190673828, "global_step": 272693, "epoch": 3285} {"train_loss": -25.48836326599121, "global_step": 272694, "epoch": 3285} {"train_loss": -25.44776725769043, "global_step": 272695, "epoch": 3285} {"train_loss": -25.3798828125, "global_step": 272696, "epoch": 3285} {"train_loss": -25.471220016479492, "global_step": 272697, "epoch": 3285} {"train_loss": -25.3732852935791, "global_step": 272698, "epoch": 3285} {"train_loss": -25.380935668945312, "global_step": 272699, "epoch": 3285} {"train_loss": -25.4923152923584, "global_step": 272700, "epoch": 3285} {"train_loss": -25.457265853881836, "global_step": 272701, "epoch": 3285} {"train_loss": -25.368579864501953, "global_step": 272702, "epoch": 3285} {"train_loss": -25.198678970336914, "global_step": 272703, "epoch": 3285} {"train_loss": -25.3419246673584, "global_step": 272704, "epoch": 3285} {"train_loss": -25.663909912109375, "global_step": 272705, "epoch": 3285} {"train_loss": -25.586233139038086, "global_step": 272706, "epoch": 3285} {"train_loss": -25.60967445373535, "global_step": 272707, "epoch": 3285} {"train_loss": -25.61396598815918, "global_step": 272708, "epoch": 3285} {"train_loss": -25.554758071899414, "global_step": 272709, "epoch": 3285} {"train_loss": -25.503957748413086, "global_step": 272710, "epoch": 3285} {"train_loss": -25.597951889038086, "global_step": 272711, "epoch": 3285} {"train_loss": -25.56161880493164, "global_step": 272712, "epoch": 3285} {"train_loss": -25.748022079467773, "global_step": 272713, "epoch": 3285} {"train_loss": -25.5747127532959, "global_step": 272714, "epoch": 3285} {"train_loss": -25.441307067871094, "global_step": 272715, "epoch": 3285} {"train_loss": -25.292322158813477, "global_step": 272716, "epoch": 3285} {"train_loss": -25.091291427612305, "global_step": 272717, "epoch": 3285} {"train_loss": -25.65793228149414, "global_step": 272718, "epoch": 3285} {"train_loss": -25.278583526611328, "global_step": 272719, "epoch": 3285} {"train_loss": -25.26847267150879, "global_step": 272720, "epoch": 3285} {"train_loss": -25.26719856262207, "global_step": 272721, "epoch": 3285} {"train_loss": -25.48908042907715, "global_step": 272722, "epoch": 3285} {"train_loss": -25.28828239440918, "global_step": 272723, "epoch": 3285} {"train_loss": -25.442584991455078, "global_step": 272724, "epoch": 3285} {"train_loss": -25.29658317565918, "global_step": 272725, "epoch": 3285} {"train_loss": -25.63326072692871, "global_step": 272726, "epoch": 3285} {"train_loss": -24.834936141967773, "global_step": 272727, "epoch": 3285} {"train_loss": -25.346046447753906, "global_step": 272728, "epoch": 3285} {"train_loss": -25.401798248291016, "global_step": 272729, "epoch": 3285} {"train_loss": -25.48798942565918, "global_step": 272730, "epoch": 3285} {"train_loss": -24.951871871948242, "global_step": 272731, "epoch": 3285} {"train_loss": -25.23786735534668, "global_step": 272732, "epoch": 3285} {"train_loss": -25.41603660583496, "global_step": 272733, "epoch": 3285} {"train_loss": -25.095693588256836, "global_step": 272734, "epoch": 3285} {"train_loss": -25.286956787109375, "global_step": 272735, "epoch": 3285} {"train_loss": -25.322050094604492, "global_step": 272736, "epoch": 3285} {"train_loss": -25.243653975337384, "global_step": 272737, "epoch": 3285, "val_loss": 7075094.0} {"train_loss": -25.02730369567871, "global_step": 272738, "epoch": 3286} {"train_loss": -24.257604598999023, "global_step": 272739, "epoch": 3286} {"train_loss": -24.981008529663086, "global_step": 272740, "epoch": 3286} {"train_loss": -24.551443099975586, "global_step": 272741, "epoch": 3286} {"train_loss": -24.453153610229492, "global_step": 272742, "epoch": 3286} {"train_loss": -24.800609588623047, "global_step": 272743, "epoch": 3286} {"train_loss": -24.807165145874023, "global_step": 272744, "epoch": 3286} {"train_loss": -25.359426498413086, "global_step": 272745, "epoch": 3286} {"train_loss": -24.96392822265625, "global_step": 272746, "epoch": 3286} {"train_loss": -24.692541122436523, "global_step": 272747, "epoch": 3286} {"train_loss": -24.833417892456055, "global_step": 272748, "epoch": 3286} {"train_loss": -25.259624481201172, "global_step": 272749, "epoch": 3286} {"train_loss": -25.225360870361328, "global_step": 272750, "epoch": 3286} {"train_loss": -24.9201717376709, "global_step": 272751, "epoch": 3286} {"train_loss": -25.007749557495117, "global_step": 272752, "epoch": 3286} {"train_loss": -25.185758590698242, "global_step": 272753, "epoch": 3286} {"train_loss": -25.299386978149414, "global_step": 272754, "epoch": 3286} {"train_loss": -25.283218383789062, "global_step": 272755, "epoch": 3286} {"train_loss": -25.12212562561035, "global_step": 272756, "epoch": 3286} {"train_loss": -25.014028549194336, "global_step": 272757, "epoch": 3286} {"train_loss": -25.109210968017578, "global_step": 272758, "epoch": 3286} {"train_loss": -25.28683090209961, "global_step": 272759, "epoch": 3286} {"train_loss": -25.06964683532715, "global_step": 272760, "epoch": 3286} {"train_loss": -25.515464782714844, "global_step": 272761, "epoch": 3286} {"train_loss": -25.002260208129883, "global_step": 272762, "epoch": 3286} {"train_loss": -25.38535499572754, "global_step": 272763, "epoch": 3286} {"train_loss": -25.30610466003418, "global_step": 272764, "epoch": 3286} {"train_loss": -25.47970199584961, "global_step": 272765, "epoch": 3286} {"train_loss": -24.873334884643555, "global_step": 272766, "epoch": 3286} {"train_loss": -25.108407974243164, "global_step": 272767, "epoch": 3286} {"train_loss": -25.516014099121094, "global_step": 272768, "epoch": 3286} {"train_loss": -25.382369995117188, "global_step": 272769, "epoch": 3286} {"train_loss": -25.376314163208008, "global_step": 272770, "epoch": 3286} {"train_loss": -24.986345291137695, "global_step": 272771, "epoch": 3286} {"train_loss": -25.181623458862305, "global_step": 272772, "epoch": 3286} {"train_loss": -25.51919174194336, "global_step": 272773, "epoch": 3286} {"train_loss": -25.422239303588867, "global_step": 272774, "epoch": 3286} {"train_loss": -25.3901309967041, "global_step": 272775, "epoch": 3286} {"train_loss": -25.088407516479492, "global_step": 272776, "epoch": 3286} {"train_loss": -25.28659439086914, "global_step": 272777, "epoch": 3286} {"train_loss": -25.664539337158203, "global_step": 272778, "epoch": 3286} {"train_loss": -25.151697158813477, "global_step": 272779, "epoch": 3286} {"train_loss": -24.949304580688477, "global_step": 272780, "epoch": 3286} {"train_loss": -25.23088836669922, "global_step": 272781, "epoch": 3286} {"train_loss": -24.802490234375, "global_step": 272782, "epoch": 3286} {"train_loss": -25.06352424621582, "global_step": 272783, "epoch": 3286} {"train_loss": -25.106122970581055, "global_step": 272784, "epoch": 3286} {"train_loss": -25.408105850219727, "global_step": 272785, "epoch": 3286} {"train_loss": -25.257741928100586, "global_step": 272786, "epoch": 3286} {"train_loss": -24.974180221557617, "global_step": 272787, "epoch": 3286} {"train_loss": -25.119874954223633, "global_step": 272788, "epoch": 3286} {"train_loss": -24.89325714111328, "global_step": 272789, "epoch": 3286} {"train_loss": -25.42728614807129, "global_step": 272790, "epoch": 3286} {"train_loss": -25.475814819335938, "global_step": 272791, "epoch": 3286} {"train_loss": -25.387807846069336, "global_step": 272792, "epoch": 3286} {"train_loss": -25.300153732299805, "global_step": 272793, "epoch": 3286} {"train_loss": -25.200286865234375, "global_step": 272794, "epoch": 3286} {"train_loss": -25.541522979736328, "global_step": 272795, "epoch": 3286} {"train_loss": -25.822824478149414, "global_step": 272796, "epoch": 3286} {"train_loss": -25.70794677734375, "global_step": 272797, "epoch": 3286} {"train_loss": -25.570337295532227, "global_step": 272798, "epoch": 3286} {"train_loss": -25.486713409423828, "global_step": 272799, "epoch": 3286} {"train_loss": -25.47836685180664, "global_step": 272800, "epoch": 3286} {"train_loss": -25.4492130279541, "global_step": 272801, "epoch": 3286} {"train_loss": -25.744739532470703, "global_step": 272802, "epoch": 3286} {"train_loss": -25.509658813476562, "global_step": 272803, "epoch": 3286} {"train_loss": -25.31044578552246, "global_step": 272804, "epoch": 3286} {"train_loss": -25.89621925354004, "global_step": 272805, "epoch": 3286} {"train_loss": -25.52376365661621, "global_step": 272806, "epoch": 3286} {"train_loss": -25.454360961914062, "global_step": 272807, "epoch": 3286} {"train_loss": -25.552871704101562, "global_step": 272808, "epoch": 3286} {"train_loss": -25.363983154296875, "global_step": 272809, "epoch": 3286} {"train_loss": -25.57493019104004, "global_step": 272810, "epoch": 3286} {"train_loss": -25.274124145507812, "global_step": 272811, "epoch": 3286} {"train_loss": -25.54148292541504, "global_step": 272812, "epoch": 3286} {"train_loss": -25.394163131713867, "global_step": 272813, "epoch": 3286} {"train_loss": -25.469968795776367, "global_step": 272814, "epoch": 3286} {"train_loss": -25.872989654541016, "global_step": 272815, "epoch": 3286} {"train_loss": -25.387714385986328, "global_step": 272816, "epoch": 3286} {"train_loss": -25.723196029663086, "global_step": 272817, "epoch": 3286} {"train_loss": -25.321428298950195, "global_step": 272818, "epoch": 3286} {"train_loss": -25.109241485595703, "global_step": 272819, "epoch": 3286} {"train_loss": -25.273857162659425, "global_step": 272820, "epoch": 3286, "val_loss": 6993911.0} {"train_loss": -23.819326400756836, "global_step": 272821, "epoch": 3287} {"train_loss": -22.049840927124023, "global_step": 272822, "epoch": 3287} {"train_loss": -19.25587272644043, "global_step": 272823, "epoch": 3287} {"train_loss": -23.539554595947266, "global_step": 272824, "epoch": 3287} {"train_loss": -21.547977447509766, "global_step": 272825, "epoch": 3287} {"train_loss": -23.34317398071289, "global_step": 272826, "epoch": 3287} {"train_loss": -23.490276336669922, "global_step": 272827, "epoch": 3287} {"train_loss": -23.17116355895996, "global_step": 272828, "epoch": 3287} {"train_loss": -23.821491241455078, "global_step": 272829, "epoch": 3287} {"train_loss": -23.211111068725586, "global_step": 272830, "epoch": 3287} {"train_loss": -23.48059844970703, "global_step": 272831, "epoch": 3287} {"train_loss": -24.067707061767578, "global_step": 272832, "epoch": 3287} {"train_loss": -23.584674835205078, "global_step": 272833, "epoch": 3287} {"train_loss": -24.346872329711914, "global_step": 272834, "epoch": 3287} {"train_loss": -23.78349494934082, "global_step": 272835, "epoch": 3287} {"train_loss": -23.7379093170166, "global_step": 272836, "epoch": 3287} {"train_loss": -24.030750274658203, "global_step": 272837, "epoch": 3287} {"train_loss": -23.575794219970703, "global_step": 272838, "epoch": 3287} {"train_loss": -24.274911880493164, "global_step": 272839, "epoch": 3287} {"train_loss": -24.402801513671875, "global_step": 272840, "epoch": 3287} {"train_loss": -24.585983276367188, "global_step": 272841, "epoch": 3287} {"train_loss": -24.239879608154297, "global_step": 272842, "epoch": 3287} {"train_loss": -24.30922508239746, "global_step": 272843, "epoch": 3287} {"train_loss": -24.462553024291992, "global_step": 272844, "epoch": 3287} {"train_loss": -24.553327560424805, "global_step": 272845, "epoch": 3287} {"train_loss": -24.61615753173828, "global_step": 272846, "epoch": 3287} {"train_loss": -24.329593658447266, "global_step": 272847, "epoch": 3287} {"train_loss": -24.3568172454834, "global_step": 272848, "epoch": 3287} {"train_loss": -24.097736358642578, "global_step": 272849, "epoch": 3287} {"train_loss": -24.457645416259766, "global_step": 272850, "epoch": 3287} {"train_loss": -25.035669326782227, "global_step": 272851, "epoch": 3287} {"train_loss": -24.979236602783203, "global_step": 272852, "epoch": 3287} {"train_loss": -25.113832473754883, "global_step": 272853, "epoch": 3287} {"train_loss": -24.967960357666016, "global_step": 272854, "epoch": 3287} {"train_loss": -24.659833908081055, "global_step": 272855, "epoch": 3287} {"train_loss": -24.764076232910156, "global_step": 272856, "epoch": 3287} {"train_loss": -24.958255767822266, "global_step": 272857, "epoch": 3287} {"train_loss": -24.606969833374023, "global_step": 272858, "epoch": 3287} {"train_loss": -25.044967651367188, "global_step": 272859, "epoch": 3287} {"train_loss": -24.732620239257812, "global_step": 272860, "epoch": 3287} {"train_loss": -24.925878524780273, "global_step": 272861, "epoch": 3287} {"train_loss": -24.987361907958984, "global_step": 272862, "epoch": 3287} {"train_loss": -25.07570457458496, "global_step": 272863, "epoch": 3287} {"train_loss": -25.093931198120117, "global_step": 272864, "epoch": 3287} {"train_loss": -25.514118194580078, "global_step": 272865, "epoch": 3287} {"train_loss": -24.796785354614258, "global_step": 272866, "epoch": 3287} {"train_loss": -25.241987228393555, "global_step": 272867, "epoch": 3287} {"train_loss": -24.97077751159668, "global_step": 272868, "epoch": 3287} {"train_loss": -25.14529037475586, "global_step": 272869, "epoch": 3287} {"train_loss": -25.400808334350586, "global_step": 272870, "epoch": 3287} {"train_loss": -25.132078170776367, "global_step": 272871, "epoch": 3287} {"train_loss": -25.051551818847656, "global_step": 272872, "epoch": 3287} {"train_loss": -25.29463005065918, "global_step": 272873, "epoch": 3287} {"train_loss": -25.163578033447266, "global_step": 272874, "epoch": 3287} {"train_loss": -25.191564559936523, "global_step": 272875, "epoch": 3287} {"train_loss": -25.469818115234375, "global_step": 272876, "epoch": 3287} {"train_loss": -25.759796142578125, "global_step": 272877, "epoch": 3287} {"train_loss": -24.856151580810547, "global_step": 272878, "epoch": 3287} {"train_loss": -25.20737075805664, "global_step": 272879, "epoch": 3287} {"train_loss": -25.27614402770996, "global_step": 272880, "epoch": 3287} {"train_loss": -25.185474395751953, "global_step": 272881, "epoch": 3287} {"train_loss": -25.377187728881836, "global_step": 272882, "epoch": 3287} {"train_loss": -25.76958656311035, "global_step": 272883, "epoch": 3287} {"train_loss": -25.667322158813477, "global_step": 272884, "epoch": 3287} {"train_loss": -25.326147079467773, "global_step": 272885, "epoch": 3287} {"train_loss": -25.782194137573242, "global_step": 272886, "epoch": 3287} {"train_loss": -25.21491813659668, "global_step": 272887, "epoch": 3287} {"train_loss": -25.502578735351562, "global_step": 272888, "epoch": 3287} {"train_loss": -25.4063663482666, "global_step": 272889, "epoch": 3287} {"train_loss": -25.590242385864258, "global_step": 272890, "epoch": 3287} {"train_loss": -25.31833839416504, "global_step": 272891, "epoch": 3287} {"train_loss": -25.324234008789062, "global_step": 272892, "epoch": 3287} {"train_loss": -25.399709701538086, "global_step": 272893, "epoch": 3287} {"train_loss": -25.476276397705078, "global_step": 272894, "epoch": 3287} {"train_loss": -25.27179718017578, "global_step": 272895, "epoch": 3287} {"train_loss": -25.516605377197266, "global_step": 272896, "epoch": 3287} {"train_loss": -25.478866577148438, "global_step": 272897, "epoch": 3287} {"train_loss": -25.079374313354492, "global_step": 272898, "epoch": 3287} {"train_loss": -25.425992965698242, "global_step": 272899, "epoch": 3287} {"train_loss": -25.559995651245117, "global_step": 272900, "epoch": 3287} {"train_loss": -25.52739143371582, "global_step": 272901, "epoch": 3287} {"train_loss": -25.43619155883789, "global_step": 272902, "epoch": 3287} {"train_loss": -24.687818021659393, "global_step": 272903, "epoch": 3287, "val_loss": 6993201.0} {"train_loss": -25.32137107849121, "global_step": 272904, "epoch": 3288} {"train_loss": -24.57010269165039, "global_step": 272905, "epoch": 3288} {"train_loss": -25.580169677734375, "global_step": 272906, "epoch": 3288} {"train_loss": -25.37102699279785, "global_step": 272907, "epoch": 3288} {"train_loss": -25.075077056884766, "global_step": 272908, "epoch": 3288} {"train_loss": -25.02347183227539, "global_step": 272909, "epoch": 3288} {"train_loss": -25.017412185668945, "global_step": 272910, "epoch": 3288} {"train_loss": -25.223329544067383, "global_step": 272911, "epoch": 3288} {"train_loss": -25.139781951904297, "global_step": 272912, "epoch": 3288} {"train_loss": -25.154159545898438, "global_step": 272913, "epoch": 3288} {"train_loss": -25.137685775756836, "global_step": 272914, "epoch": 3288} {"train_loss": -25.051727294921875, "global_step": 272915, "epoch": 3288} {"train_loss": -25.452608108520508, "global_step": 272916, "epoch": 3288} {"train_loss": -25.399227142333984, "global_step": 272917, "epoch": 3288} {"train_loss": -25.220584869384766, "global_step": 272918, "epoch": 3288} {"train_loss": -25.358373641967773, "global_step": 272919, "epoch": 3288} {"train_loss": -25.2802734375, "global_step": 272920, "epoch": 3288} {"train_loss": -24.950538635253906, "global_step": 272921, "epoch": 3288} {"train_loss": -25.040372848510742, "global_step": 272922, "epoch": 3288} {"train_loss": -25.286596298217773, "global_step": 272923, "epoch": 3288} {"train_loss": -24.810569763183594, "global_step": 272924, "epoch": 3288} {"train_loss": -25.03432273864746, "global_step": 272925, "epoch": 3288} {"train_loss": -25.178152084350586, "global_step": 272926, "epoch": 3288} {"train_loss": -25.330881118774414, "global_step": 272927, "epoch": 3288} {"train_loss": -25.277952194213867, "global_step": 272928, "epoch": 3288} {"train_loss": -25.5987606048584, "global_step": 272929, "epoch": 3288} {"train_loss": -25.800647735595703, "global_step": 272930, "epoch": 3288} {"train_loss": -25.417760848999023, "global_step": 272931, "epoch": 3288} {"train_loss": -25.488712310791016, "global_step": 272932, "epoch": 3288} {"train_loss": -25.499120712280273, "global_step": 272933, "epoch": 3288} {"train_loss": -25.136795043945312, "global_step": 272934, "epoch": 3288} {"train_loss": -25.360036849975586, "global_step": 272935, "epoch": 3288} {"train_loss": -25.297361373901367, "global_step": 272936, "epoch": 3288} {"train_loss": -25.498661041259766, "global_step": 272937, "epoch": 3288} {"train_loss": -25.52712631225586, "global_step": 272938, "epoch": 3288} {"train_loss": -25.142057418823242, "global_step": 272939, "epoch": 3288} {"train_loss": -25.631860733032227, "global_step": 272940, "epoch": 3288} {"train_loss": -25.434309005737305, "global_step": 272941, "epoch": 3288} {"train_loss": -25.1981143951416, "global_step": 272942, "epoch": 3288} {"train_loss": -24.842666625976562, "global_step": 272943, "epoch": 3288} {"train_loss": -25.13858985900879, "global_step": 272944, "epoch": 3288} {"train_loss": -25.128862380981445, "global_step": 272945, "epoch": 3288} {"train_loss": -25.25604248046875, "global_step": 272946, "epoch": 3288} {"train_loss": -25.724679946899414, "global_step": 272947, "epoch": 3288} {"train_loss": -25.28372573852539, "global_step": 272948, "epoch": 3288} {"train_loss": -25.265766143798828, "global_step": 272949, "epoch": 3288} {"train_loss": -25.066068649291992, "global_step": 272950, "epoch": 3288} {"train_loss": -25.202423095703125, "global_step": 272951, "epoch": 3288} {"train_loss": -25.543073654174805, "global_step": 272952, "epoch": 3288} {"train_loss": -25.231048583984375, "global_step": 272953, "epoch": 3288} {"train_loss": -25.769506454467773, "global_step": 272954, "epoch": 3288} {"train_loss": -25.20185661315918, "global_step": 272955, "epoch": 3288} {"train_loss": -25.34351921081543, "global_step": 272956, "epoch": 3288} {"train_loss": -25.30238914489746, "global_step": 272957, "epoch": 3288} {"train_loss": -25.109649658203125, "global_step": 272958, "epoch": 3288} {"train_loss": -25.592138290405273, "global_step": 272959, "epoch": 3288} {"train_loss": -25.356149673461914, "global_step": 272960, "epoch": 3288} {"train_loss": -25.535253524780273, "global_step": 272961, "epoch": 3288} {"train_loss": -25.120929718017578, "global_step": 272962, "epoch": 3288} {"train_loss": -25.358837127685547, "global_step": 272963, "epoch": 3288} {"train_loss": -25.459381103515625, "global_step": 272964, "epoch": 3288} {"train_loss": -25.299489974975586, "global_step": 272965, "epoch": 3288} {"train_loss": -25.261449813842773, "global_step": 272966, "epoch": 3288} {"train_loss": -25.27670669555664, "global_step": 272967, "epoch": 3288} {"train_loss": -25.523365020751953, "global_step": 272968, "epoch": 3288} {"train_loss": -25.697784423828125, "global_step": 272969, "epoch": 3288} {"train_loss": -25.278701782226562, "global_step": 272970, "epoch": 3288} {"train_loss": -25.124216079711914, "global_step": 272971, "epoch": 3288} {"train_loss": -25.25815200805664, "global_step": 272972, "epoch": 3288} {"train_loss": -25.613327026367188, "global_step": 272973, "epoch": 3288} {"train_loss": -25.288284301757812, "global_step": 272974, "epoch": 3288} {"train_loss": -25.62563133239746, "global_step": 272975, "epoch": 3288} {"train_loss": -25.01224136352539, "global_step": 272976, "epoch": 3288} {"train_loss": -25.44118881225586, "global_step": 272977, "epoch": 3288} {"train_loss": -25.662778854370117, "global_step": 272978, "epoch": 3288} {"train_loss": -25.298389434814453, "global_step": 272979, "epoch": 3288} {"train_loss": -25.72185707092285, "global_step": 272980, "epoch": 3288} {"train_loss": -25.384309768676758, "global_step": 272981, "epoch": 3288} {"train_loss": -25.434438705444336, "global_step": 272982, "epoch": 3288} {"train_loss": -25.55622100830078, "global_step": 272983, "epoch": 3288} {"train_loss": -25.423391342163086, "global_step": 272984, "epoch": 3288} {"train_loss": -25.24486541748047, "global_step": 272985, "epoch": 3288} {"train_loss": -25.320195393389966, "global_step": 272986, "epoch": 3288, "val_loss": 7049885.0} {"train_loss": -25.186391830444336, "global_step": 272987, "epoch": 3289} {"train_loss": -24.550992965698242, "global_step": 272988, "epoch": 3289} {"train_loss": -23.869962692260742, "global_step": 272989, "epoch": 3289} {"train_loss": -23.510168075561523, "global_step": 272990, "epoch": 3289} {"train_loss": -25.23769187927246, "global_step": 272991, "epoch": 3289} {"train_loss": -24.591358184814453, "global_step": 272992, "epoch": 3289} {"train_loss": -24.61248207092285, "global_step": 272993, "epoch": 3289} {"train_loss": -24.73623275756836, "global_step": 272994, "epoch": 3289} {"train_loss": -24.941055297851562, "global_step": 272995, "epoch": 3289} {"train_loss": -24.410781860351562, "global_step": 272996, "epoch": 3289} {"train_loss": -24.937543869018555, "global_step": 272997, "epoch": 3289} {"train_loss": -24.49220085144043, "global_step": 272998, "epoch": 3289} {"train_loss": -25.20222282409668, "global_step": 272999, "epoch": 3289} {"train_loss": -24.91716194152832, "global_step": 273000, "epoch": 3289} {"train_loss": -24.930789947509766, "global_step": 273001, "epoch": 3289} {"train_loss": -24.92353630065918, "global_step": 273002, "epoch": 3289} {"train_loss": -25.073665618896484, "global_step": 273003, "epoch": 3289} {"train_loss": -24.892505645751953, "global_step": 273004, "epoch": 3289} {"train_loss": -25.27129554748535, "global_step": 273005, "epoch": 3289} {"train_loss": -24.794986724853516, "global_step": 273006, "epoch": 3289} {"train_loss": -24.982160568237305, "global_step": 273007, "epoch": 3289} {"train_loss": -25.219234466552734, "global_step": 273008, "epoch": 3289} {"train_loss": -25.290172576904297, "global_step": 273009, "epoch": 3289} {"train_loss": -25.055694580078125, "global_step": 273010, "epoch": 3289} {"train_loss": -25.24296760559082, "global_step": 273011, "epoch": 3289} {"train_loss": -24.82924461364746, "global_step": 273012, "epoch": 3289} {"train_loss": -25.152563095092773, "global_step": 273013, "epoch": 3289} {"train_loss": -25.103195190429688, "global_step": 273014, "epoch": 3289} {"train_loss": -25.27855682373047, "global_step": 273015, "epoch": 3289} {"train_loss": -24.897205352783203, "global_step": 273016, "epoch": 3289} {"train_loss": -25.118541717529297, "global_step": 273017, "epoch": 3289} {"train_loss": -25.303070068359375, "global_step": 273018, "epoch": 3289} {"train_loss": -25.495820999145508, "global_step": 273019, "epoch": 3289} {"train_loss": -25.269559860229492, "global_step": 273020, "epoch": 3289} {"train_loss": -25.3007869720459, "global_step": 273021, "epoch": 3289} {"train_loss": -25.428918838500977, "global_step": 273022, "epoch": 3289} {"train_loss": -25.39918327331543, "global_step": 273023, "epoch": 3289} {"train_loss": -25.103239059448242, "global_step": 273024, "epoch": 3289} {"train_loss": -25.0914363861084, "global_step": 273025, "epoch": 3289} {"train_loss": -25.611103057861328, "global_step": 273026, "epoch": 3289} {"train_loss": -25.229001998901367, "global_step": 273027, "epoch": 3289} {"train_loss": -25.386844635009766, "global_step": 273028, "epoch": 3289} {"train_loss": -25.33255958557129, "global_step": 273029, "epoch": 3289} {"train_loss": -25.720733642578125, "global_step": 273030, "epoch": 3289} {"train_loss": -25.256153106689453, "global_step": 273031, "epoch": 3289} {"train_loss": -24.960208892822266, "global_step": 273032, "epoch": 3289} {"train_loss": -25.211162567138672, "global_step": 273033, "epoch": 3289} {"train_loss": -25.343900680541992, "global_step": 273034, "epoch": 3289} {"train_loss": -25.66057777404785, "global_step": 273035, "epoch": 3289} {"train_loss": -25.28720474243164, "global_step": 273036, "epoch": 3289} {"train_loss": -25.307615280151367, "global_step": 273037, "epoch": 3289} {"train_loss": -25.18419647216797, "global_step": 273038, "epoch": 3289} {"train_loss": -25.509122848510742, "global_step": 273039, "epoch": 3289} {"train_loss": -25.305932998657227, "global_step": 273040, "epoch": 3289} {"train_loss": -25.660369873046875, "global_step": 273041, "epoch": 3289} {"train_loss": -25.12251091003418, "global_step": 273042, "epoch": 3289} {"train_loss": -25.4051456451416, "global_step": 273043, "epoch": 3289} {"train_loss": -25.800872802734375, "global_step": 273044, "epoch": 3289} {"train_loss": -25.40225601196289, "global_step": 273045, "epoch": 3289} {"train_loss": -25.662261962890625, "global_step": 273046, "epoch": 3289} {"train_loss": -25.645984649658203, "global_step": 273047, "epoch": 3289} {"train_loss": -25.565235137939453, "global_step": 273048, "epoch": 3289} {"train_loss": -25.173200607299805, "global_step": 273049, "epoch": 3289} {"train_loss": -25.667097091674805, "global_step": 273050, "epoch": 3289} {"train_loss": -25.21888542175293, "global_step": 273051, "epoch": 3289} {"train_loss": -25.505359649658203, "global_step": 273052, "epoch": 3289} {"train_loss": -25.19028091430664, "global_step": 273053, "epoch": 3289} {"train_loss": -24.971792221069336, "global_step": 273054, "epoch": 3289} {"train_loss": -24.78447914123535, "global_step": 273055, "epoch": 3289} {"train_loss": -25.209182739257812, "global_step": 273056, "epoch": 3289} {"train_loss": -25.170814514160156, "global_step": 273057, "epoch": 3289} {"train_loss": -25.348501205444336, "global_step": 273058, "epoch": 3289} {"train_loss": -25.55794334411621, "global_step": 273059, "epoch": 3289} {"train_loss": -24.961578369140625, "global_step": 273060, "epoch": 3289} {"train_loss": -25.527700424194336, "global_step": 273061, "epoch": 3289} {"train_loss": -25.310945510864258, "global_step": 273062, "epoch": 3289} {"train_loss": -24.8890438079834, "global_step": 273063, "epoch": 3289} {"train_loss": -25.451276779174805, "global_step": 273064, "epoch": 3289} {"train_loss": -25.346004486083984, "global_step": 273065, "epoch": 3289} {"train_loss": -25.596057891845703, "global_step": 273066, "epoch": 3289} {"train_loss": -25.51146697998047, "global_step": 273067, "epoch": 3289} {"train_loss": -25.21058464050293, "global_step": 273068, "epoch": 3289} {"train_loss": -25.180823567401934, "global_step": 273069, "epoch": 3289, "val_loss": 7043543.0} {"train_loss": -25.374887466430664, "global_step": 273070, "epoch": 3290} {"train_loss": -25.167753219604492, "global_step": 273071, "epoch": 3290} {"train_loss": -25.022153854370117, "global_step": 273072, "epoch": 3290} {"train_loss": -25.131254196166992, "global_step": 273073, "epoch": 3290} {"train_loss": -25.373132705688477, "global_step": 273074, "epoch": 3290} {"train_loss": -25.387624740600586, "global_step": 273075, "epoch": 3290} {"train_loss": -25.265533447265625, "global_step": 273076, "epoch": 3290} {"train_loss": -24.607473373413086, "global_step": 273077, "epoch": 3290} {"train_loss": -24.953201293945312, "global_step": 273078, "epoch": 3290} {"train_loss": -24.952579498291016, "global_step": 273079, "epoch": 3290} {"train_loss": -25.07910919189453, "global_step": 273080, "epoch": 3290} {"train_loss": -25.00922203063965, "global_step": 273081, "epoch": 3290} {"train_loss": -25.027048110961914, "global_step": 273082, "epoch": 3290} {"train_loss": -24.94674301147461, "global_step": 273083, "epoch": 3290} {"train_loss": -25.372194290161133, "global_step": 273084, "epoch": 3290} {"train_loss": -24.83204460144043, "global_step": 273085, "epoch": 3290} {"train_loss": -25.060503005981445, "global_step": 273086, "epoch": 3290} {"train_loss": -24.99347496032715, "global_step": 273087, "epoch": 3290} {"train_loss": -24.809185028076172, "global_step": 273088, "epoch": 3290} {"train_loss": -25.206172943115234, "global_step": 273089, "epoch": 3290} {"train_loss": -25.5214900970459, "global_step": 273090, "epoch": 3290} {"train_loss": -25.531843185424805, "global_step": 273091, "epoch": 3290} {"train_loss": -25.3052921295166, "global_step": 273092, "epoch": 3290} {"train_loss": -25.522489547729492, "global_step": 273093, "epoch": 3290} {"train_loss": -25.421770095825195, "global_step": 273094, "epoch": 3290} {"train_loss": -25.129430770874023, "global_step": 273095, "epoch": 3290} {"train_loss": -25.287841796875, "global_step": 273096, "epoch": 3290} {"train_loss": -25.244266510009766, "global_step": 273097, "epoch": 3290} {"train_loss": -25.399551391601562, "global_step": 273098, "epoch": 3290} {"train_loss": -25.3220272064209, "global_step": 273099, "epoch": 3290} {"train_loss": -25.813711166381836, "global_step": 273100, "epoch": 3290} {"train_loss": -25.276004791259766, "global_step": 273101, "epoch": 3290} {"train_loss": -25.440797805786133, "global_step": 273102, "epoch": 3290} {"train_loss": -25.541032791137695, "global_step": 273103, "epoch": 3290} {"train_loss": -25.312158584594727, "global_step": 273104, "epoch": 3290} {"train_loss": -25.404417037963867, "global_step": 273105, "epoch": 3290} {"train_loss": -25.488983154296875, "global_step": 273106, "epoch": 3290} {"train_loss": -25.728612899780273, "global_step": 273107, "epoch": 3290} {"train_loss": -25.323516845703125, "global_step": 273108, "epoch": 3290} {"train_loss": -25.272607803344727, "global_step": 273109, "epoch": 3290} {"train_loss": -25.62896728515625, "global_step": 273110, "epoch": 3290} {"train_loss": -25.40024757385254, "global_step": 273111, "epoch": 3290} {"train_loss": -25.564767837524414, "global_step": 273112, "epoch": 3290} {"train_loss": -25.467832565307617, "global_step": 273113, "epoch": 3290} {"train_loss": -25.503271102905273, "global_step": 273114, "epoch": 3290} {"train_loss": -25.187088012695312, "global_step": 273115, "epoch": 3290} {"train_loss": -25.20466423034668, "global_step": 273116, "epoch": 3290} {"train_loss": -25.368947982788086, "global_step": 273117, "epoch": 3290} {"train_loss": -25.26901626586914, "global_step": 273118, "epoch": 3290} {"train_loss": -25.405319213867188, "global_step": 273119, "epoch": 3290} {"train_loss": -25.638967514038086, "global_step": 273120, "epoch": 3290} {"train_loss": -25.43730354309082, "global_step": 273121, "epoch": 3290} {"train_loss": -25.602609634399414, "global_step": 273122, "epoch": 3290} {"train_loss": -25.187122344970703, "global_step": 273123, "epoch": 3290} {"train_loss": -25.668188095092773, "global_step": 273124, "epoch": 3290} {"train_loss": -25.60065269470215, "global_step": 273125, "epoch": 3290} {"train_loss": -25.5230655670166, "global_step": 273126, "epoch": 3290} {"train_loss": -25.65350341796875, "global_step": 273127, "epoch": 3290} {"train_loss": -25.66206169128418, "global_step": 273128, "epoch": 3290} {"train_loss": -24.939319610595703, "global_step": 273129, "epoch": 3290} {"train_loss": -25.681737899780273, "global_step": 273130, "epoch": 3290} {"train_loss": -25.1032772064209, "global_step": 273131, "epoch": 3290} {"train_loss": -25.532718658447266, "global_step": 273132, "epoch": 3290} {"train_loss": -25.75153923034668, "global_step": 273133, "epoch": 3290} {"train_loss": -24.821613311767578, "global_step": 273134, "epoch": 3290} {"train_loss": -24.99477195739746, "global_step": 273135, "epoch": 3290} {"train_loss": -25.024702072143555, "global_step": 273136, "epoch": 3290} {"train_loss": -25.31025505065918, "global_step": 273137, "epoch": 3290} {"train_loss": -25.38746452331543, "global_step": 273138, "epoch": 3290} {"train_loss": -25.370361328125, "global_step": 273139, "epoch": 3290} {"train_loss": -25.38423728942871, "global_step": 273140, "epoch": 3290} {"train_loss": -25.187442779541016, "global_step": 273141, "epoch": 3290} {"train_loss": -24.9459171295166, "global_step": 273142, "epoch": 3290} {"train_loss": -25.30302619934082, "global_step": 273143, "epoch": 3290} {"train_loss": -25.46830177307129, "global_step": 273144, "epoch": 3290} {"train_loss": -25.241348266601562, "global_step": 273145, "epoch": 3290} {"train_loss": -25.48821449279785, "global_step": 273146, "epoch": 3290} {"train_loss": -25.7995662689209, "global_step": 273147, "epoch": 3290} {"train_loss": -25.399200439453125, "global_step": 273148, "epoch": 3290} {"train_loss": -25.52638053894043, "global_step": 273149, "epoch": 3290} {"train_loss": -25.497516632080078, "global_step": 273150, "epoch": 3290} {"train_loss": -25.670209884643555, "global_step": 273151, "epoch": 3290} {"train_loss": -25.35503879225398, "global_step": 273152, "epoch": 3290, "val_loss": 6943240.5} {"train_loss": -24.683673858642578, "global_step": 273153, "epoch": 3291} {"train_loss": -24.42367172241211, "global_step": 273154, "epoch": 3291} {"train_loss": -24.67425537109375, "global_step": 273155, "epoch": 3291} {"train_loss": -24.65497398376465, "global_step": 273156, "epoch": 3291} {"train_loss": -24.958393096923828, "global_step": 273157, "epoch": 3291} {"train_loss": -24.951196670532227, "global_step": 273158, "epoch": 3291} {"train_loss": -24.112478256225586, "global_step": 273159, "epoch": 3291} {"train_loss": -24.575851440429688, "global_step": 273160, "epoch": 3291} {"train_loss": -24.772445678710938, "global_step": 273161, "epoch": 3291} {"train_loss": -24.46327781677246, "global_step": 273162, "epoch": 3291} {"train_loss": -25.15058708190918, "global_step": 273163, "epoch": 3291} {"train_loss": -24.827377319335938, "global_step": 273164, "epoch": 3291} {"train_loss": -24.935440063476562, "global_step": 273165, "epoch": 3291} {"train_loss": -24.625940322875977, "global_step": 273166, "epoch": 3291} {"train_loss": -24.744688034057617, "global_step": 273167, "epoch": 3291} {"train_loss": -24.7783260345459, "global_step": 273168, "epoch": 3291} {"train_loss": -25.139896392822266, "global_step": 273169, "epoch": 3291} {"train_loss": -25.17775535583496, "global_step": 273170, "epoch": 3291} {"train_loss": -25.085874557495117, "global_step": 273171, "epoch": 3291} {"train_loss": -25.128713607788086, "global_step": 273172, "epoch": 3291} {"train_loss": -25.052061080932617, "global_step": 273173, "epoch": 3291} {"train_loss": -24.881120681762695, "global_step": 273174, "epoch": 3291} {"train_loss": -25.379987716674805, "global_step": 273175, "epoch": 3291} {"train_loss": -24.885133743286133, "global_step": 273176, "epoch": 3291} {"train_loss": -24.904462814331055, "global_step": 273177, "epoch": 3291} {"train_loss": -25.352203369140625, "global_step": 273178, "epoch": 3291} {"train_loss": -25.14289665222168, "global_step": 273179, "epoch": 3291} {"train_loss": -25.24275016784668, "global_step": 273180, "epoch": 3291} {"train_loss": -25.044832229614258, "global_step": 273181, "epoch": 3291} {"train_loss": -24.922025680541992, "global_step": 273182, "epoch": 3291} {"train_loss": -24.84874725341797, "global_step": 273183, "epoch": 3291} {"train_loss": -24.92670249938965, "global_step": 273184, "epoch": 3291} {"train_loss": -25.330209732055664, "global_step": 273185, "epoch": 3291} {"train_loss": -25.053302764892578, "global_step": 273186, "epoch": 3291} {"train_loss": -25.087841033935547, "global_step": 273187, "epoch": 3291} {"train_loss": -24.989898681640625, "global_step": 273188, "epoch": 3291} {"train_loss": -25.55931282043457, "global_step": 273189, "epoch": 3291} {"train_loss": -24.985998153686523, "global_step": 273190, "epoch": 3291} {"train_loss": -25.073104858398438, "global_step": 273191, "epoch": 3291} {"train_loss": -25.368234634399414, "global_step": 273192, "epoch": 3291} {"train_loss": -25.27524757385254, "global_step": 273193, "epoch": 3291} {"train_loss": -25.19916343688965, "global_step": 273194, "epoch": 3291} {"train_loss": -25.304149627685547, "global_step": 273195, "epoch": 3291} {"train_loss": -25.100168228149414, "global_step": 273196, "epoch": 3291} {"train_loss": -24.9898681640625, "global_step": 273197, "epoch": 3291} {"train_loss": -25.048664093017578, "global_step": 273198, "epoch": 3291} {"train_loss": -25.33189582824707, "global_step": 273199, "epoch": 3291} {"train_loss": -25.42122459411621, "global_step": 273200, "epoch": 3291} {"train_loss": -25.292997360229492, "global_step": 273201, "epoch": 3291} {"train_loss": -25.56184196472168, "global_step": 273202, "epoch": 3291} {"train_loss": -25.05551528930664, "global_step": 273203, "epoch": 3291} {"train_loss": -25.456655502319336, "global_step": 273204, "epoch": 3291} {"train_loss": -25.365558624267578, "global_step": 273205, "epoch": 3291} {"train_loss": -25.264995574951172, "global_step": 273206, "epoch": 3291} {"train_loss": -25.427846908569336, "global_step": 273207, "epoch": 3291} {"train_loss": -25.433120727539062, "global_step": 273208, "epoch": 3291} {"train_loss": -25.13935661315918, "global_step": 273209, "epoch": 3291} {"train_loss": -25.24860382080078, "global_step": 273210, "epoch": 3291} {"train_loss": -25.578371047973633, "global_step": 273211, "epoch": 3291} {"train_loss": -25.258676528930664, "global_step": 273212, "epoch": 3291} {"train_loss": -25.404483795166016, "global_step": 273213, "epoch": 3291} {"train_loss": -25.328176498413086, "global_step": 273214, "epoch": 3291} {"train_loss": -25.174543380737305, "global_step": 273215, "epoch": 3291} {"train_loss": -24.919095993041992, "global_step": 273216, "epoch": 3291} {"train_loss": -25.350807189941406, "global_step": 273217, "epoch": 3291} {"train_loss": -25.584186553955078, "global_step": 273218, "epoch": 3291} {"train_loss": -25.512378692626953, "global_step": 273219, "epoch": 3291} {"train_loss": -25.18874168395996, "global_step": 273220, "epoch": 3291} {"train_loss": -25.228994369506836, "global_step": 273221, "epoch": 3291} {"train_loss": -25.044527053833008, "global_step": 273222, "epoch": 3291} {"train_loss": -25.31218910217285, "global_step": 273223, "epoch": 3291} {"train_loss": -25.03767967224121, "global_step": 273224, "epoch": 3291} {"train_loss": -25.823286056518555, "global_step": 273225, "epoch": 3291} {"train_loss": -24.920392990112305, "global_step": 273226, "epoch": 3291} {"train_loss": -25.30106544494629, "global_step": 273227, "epoch": 3291} {"train_loss": -25.291765213012695, "global_step": 273228, "epoch": 3291} {"train_loss": -24.958887100219727, "global_step": 273229, "epoch": 3291} {"train_loss": -25.37295913696289, "global_step": 273230, "epoch": 3291} {"train_loss": -24.948528289794922, "global_step": 273231, "epoch": 3291} {"train_loss": -25.556203842163086, "global_step": 273232, "epoch": 3291} {"train_loss": -25.232669830322266, "global_step": 273233, "epoch": 3291} {"train_loss": -25.069629669189453, "global_step": 273234, "epoch": 3291} {"train_loss": -25.125505378447382, "global_step": 273235, "epoch": 3291, "val_loss": 7051582.5} {"train_loss": -24.31671714782715, "global_step": 273236, "epoch": 3292} {"train_loss": -24.889402389526367, "global_step": 273237, "epoch": 3292} {"train_loss": -24.814529418945312, "global_step": 273238, "epoch": 3292} {"train_loss": -24.6351375579834, "global_step": 273239, "epoch": 3292} {"train_loss": -25.04865837097168, "global_step": 273240, "epoch": 3292} {"train_loss": -24.945240020751953, "global_step": 273241, "epoch": 3292} {"train_loss": -24.34572410583496, "global_step": 273242, "epoch": 3292} {"train_loss": -24.71864128112793, "global_step": 273243, "epoch": 3292} {"train_loss": -24.737234115600586, "global_step": 273244, "epoch": 3292} {"train_loss": -24.4124698638916, "global_step": 273245, "epoch": 3292} {"train_loss": -24.90907096862793, "global_step": 273246, "epoch": 3292} {"train_loss": -24.91646385192871, "global_step": 273247, "epoch": 3292} {"train_loss": -25.281831741333008, "global_step": 273248, "epoch": 3292} {"train_loss": -24.94136619567871, "global_step": 273249, "epoch": 3292} {"train_loss": -25.27231788635254, "global_step": 273250, "epoch": 3292} {"train_loss": -25.316638946533203, "global_step": 273251, "epoch": 3292} {"train_loss": -24.916866302490234, "global_step": 273252, "epoch": 3292} {"train_loss": -25.0212459564209, "global_step": 273253, "epoch": 3292} {"train_loss": -25.214872360229492, "global_step": 273254, "epoch": 3292} {"train_loss": -25.082754135131836, "global_step": 273255, "epoch": 3292} {"train_loss": -25.286420822143555, "global_step": 273256, "epoch": 3292} {"train_loss": -25.25464630126953, "global_step": 273257, "epoch": 3292} {"train_loss": -25.16938018798828, "global_step": 273258, "epoch": 3292} {"train_loss": -25.474136352539062, "global_step": 273259, "epoch": 3292} {"train_loss": -25.244430541992188, "global_step": 273260, "epoch": 3292} {"train_loss": -25.27705955505371, "global_step": 273261, "epoch": 3292} {"train_loss": -25.648527145385742, "global_step": 273262, "epoch": 3292} {"train_loss": -25.37604331970215, "global_step": 273263, "epoch": 3292} {"train_loss": -25.161296844482422, "global_step": 273264, "epoch": 3292} {"train_loss": -25.405532836914062, "global_step": 273265, "epoch": 3292} {"train_loss": -25.006235122680664, "global_step": 273266, "epoch": 3292} {"train_loss": -25.382658004760742, "global_step": 273267, "epoch": 3292} {"train_loss": -25.597898483276367, "global_step": 273268, "epoch": 3292} {"train_loss": -25.265390396118164, "global_step": 273269, "epoch": 3292} {"train_loss": -25.744298934936523, "global_step": 273270, "epoch": 3292} {"train_loss": -25.38941192626953, "global_step": 273271, "epoch": 3292} {"train_loss": -25.207725524902344, "global_step": 273272, "epoch": 3292} {"train_loss": -25.50834846496582, "global_step": 273273, "epoch": 3292} {"train_loss": -25.6492919921875, "global_step": 273274, "epoch": 3292} {"train_loss": -25.593917846679688, "global_step": 273275, "epoch": 3292} {"train_loss": -25.520051956176758, "global_step": 273276, "epoch": 3292} {"train_loss": -25.30962562561035, "global_step": 273277, "epoch": 3292} {"train_loss": -24.9975643157959, "global_step": 273278, "epoch": 3292} {"train_loss": -25.16607666015625, "global_step": 273279, "epoch": 3292} {"train_loss": -25.031492233276367, "global_step": 273280, "epoch": 3292} {"train_loss": -25.088804244995117, "global_step": 273281, "epoch": 3292} {"train_loss": -25.437376022338867, "global_step": 273282, "epoch": 3292} {"train_loss": -25.254995346069336, "global_step": 273283, "epoch": 3292} {"train_loss": -25.360000610351562, "global_step": 273284, "epoch": 3292} {"train_loss": -25.654129028320312, "global_step": 273285, "epoch": 3292} {"train_loss": -25.340293884277344, "global_step": 273286, "epoch": 3292} {"train_loss": -25.31174659729004, "global_step": 273287, "epoch": 3292} {"train_loss": -24.890485763549805, "global_step": 273288, "epoch": 3292} {"train_loss": -25.051166534423828, "global_step": 273289, "epoch": 3292} {"train_loss": -25.33529281616211, "global_step": 273290, "epoch": 3292} {"train_loss": -25.217557907104492, "global_step": 273291, "epoch": 3292} {"train_loss": -25.6944637298584, "global_step": 273292, "epoch": 3292} {"train_loss": -25.439838409423828, "global_step": 273293, "epoch": 3292} {"train_loss": -25.4528865814209, "global_step": 273294, "epoch": 3292} {"train_loss": -24.9581241607666, "global_step": 273295, "epoch": 3292} {"train_loss": -25.602773666381836, "global_step": 273296, "epoch": 3292} {"train_loss": -25.229843139648438, "global_step": 273297, "epoch": 3292} {"train_loss": -25.344465255737305, "global_step": 273298, "epoch": 3292} {"train_loss": -25.400297164916992, "global_step": 273299, "epoch": 3292} {"train_loss": -25.79107093811035, "global_step": 273300, "epoch": 3292} {"train_loss": -25.66583824157715, "global_step": 273301, "epoch": 3292} {"train_loss": -25.5732421875, "global_step": 273302, "epoch": 3292} {"train_loss": -25.2065372467041, "global_step": 273303, "epoch": 3292} {"train_loss": -25.641019821166992, "global_step": 273304, "epoch": 3292} {"train_loss": -25.20741844177246, "global_step": 273305, "epoch": 3292} {"train_loss": -25.19945526123047, "global_step": 273306, "epoch": 3292} {"train_loss": -25.834455490112305, "global_step": 273307, "epoch": 3292} {"train_loss": -25.325773239135742, "global_step": 273308, "epoch": 3292} {"train_loss": -25.301801681518555, "global_step": 273309, "epoch": 3292} {"train_loss": -25.207223892211914, "global_step": 273310, "epoch": 3292} {"train_loss": -25.015884399414062, "global_step": 273311, "epoch": 3292} {"train_loss": -25.266000747680664, "global_step": 273312, "epoch": 3292} {"train_loss": -25.097883224487305, "global_step": 273313, "epoch": 3292} {"train_loss": -24.993684768676758, "global_step": 273314, "epoch": 3292} {"train_loss": -25.484867095947266, "global_step": 273315, "epoch": 3292} {"train_loss": -25.343168258666992, "global_step": 273316, "epoch": 3292} {"train_loss": -25.100067138671875, "global_step": 273317, "epoch": 3292} {"train_loss": -25.232044380831432, "global_step": 273318, "epoch": 3292, "val_loss": 7016130.0} {"train_loss": -24.877979278564453, "global_step": 273319, "epoch": 3293} {"train_loss": -24.66971778869629, "global_step": 273320, "epoch": 3293} {"train_loss": -25.018272399902344, "global_step": 273321, "epoch": 3293} {"train_loss": -24.503528594970703, "global_step": 273322, "epoch": 3293} {"train_loss": -24.996610641479492, "global_step": 273323, "epoch": 3293} {"train_loss": -24.76198387145996, "global_step": 273324, "epoch": 3293} {"train_loss": -25.318632125854492, "global_step": 273325, "epoch": 3293} {"train_loss": -24.862485885620117, "global_step": 273326, "epoch": 3293} {"train_loss": -25.19209861755371, "global_step": 273327, "epoch": 3293} {"train_loss": -24.809059143066406, "global_step": 273328, "epoch": 3293} {"train_loss": -25.107101440429688, "global_step": 273329, "epoch": 3293} {"train_loss": -24.81386375427246, "global_step": 273330, "epoch": 3293} {"train_loss": -25.17549705505371, "global_step": 273331, "epoch": 3293} {"train_loss": -25.200881958007812, "global_step": 273332, "epoch": 3293} {"train_loss": -25.085813522338867, "global_step": 273333, "epoch": 3293} {"train_loss": -25.101486206054688, "global_step": 273334, "epoch": 3293} {"train_loss": -25.34142303466797, "global_step": 273335, "epoch": 3293} {"train_loss": -25.09303092956543, "global_step": 273336, "epoch": 3293} {"train_loss": -25.814931869506836, "global_step": 273337, "epoch": 3293} {"train_loss": -25.39063835144043, "global_step": 273338, "epoch": 3293} {"train_loss": -25.275955200195312, "global_step": 273339, "epoch": 3293} {"train_loss": -25.126052856445312, "global_step": 273340, "epoch": 3293} {"train_loss": -25.232938766479492, "global_step": 273341, "epoch": 3293} {"train_loss": -25.022174835205078, "global_step": 273342, "epoch": 3293} {"train_loss": -25.270723342895508, "global_step": 273343, "epoch": 3293} {"train_loss": -25.400007247924805, "global_step": 273344, "epoch": 3293} {"train_loss": -24.987462997436523, "global_step": 273345, "epoch": 3293} {"train_loss": -25.257665634155273, "global_step": 273346, "epoch": 3293} {"train_loss": -25.63172721862793, "global_step": 273347, "epoch": 3293} {"train_loss": -25.3388671875, "global_step": 273348, "epoch": 3293} {"train_loss": -25.363718032836914, "global_step": 273349, "epoch": 3293} {"train_loss": -25.497995376586914, "global_step": 273350, "epoch": 3293} {"train_loss": -25.33017921447754, "global_step": 273351, "epoch": 3293} {"train_loss": -25.31022834777832, "global_step": 273352, "epoch": 3293} {"train_loss": -25.438825607299805, "global_step": 273353, "epoch": 3293} {"train_loss": -25.350147247314453, "global_step": 273354, "epoch": 3293} {"train_loss": -25.493526458740234, "global_step": 273355, "epoch": 3293} {"train_loss": -25.49336814880371, "global_step": 273356, "epoch": 3293} {"train_loss": -25.418363571166992, "global_step": 273357, "epoch": 3293} {"train_loss": -25.50618553161621, "global_step": 273358, "epoch": 3293} {"train_loss": -25.264310836791992, "global_step": 273359, "epoch": 3293} {"train_loss": -25.557756423950195, "global_step": 273360, "epoch": 3293} {"train_loss": -25.501611709594727, "global_step": 273361, "epoch": 3293} {"train_loss": -25.292593002319336, "global_step": 273362, "epoch": 3293} {"train_loss": -25.55030632019043, "global_step": 273363, "epoch": 3293} {"train_loss": -25.675018310546875, "global_step": 273364, "epoch": 3293} {"train_loss": -25.350406646728516, "global_step": 273365, "epoch": 3293} {"train_loss": -25.34592056274414, "global_step": 273366, "epoch": 3293} {"train_loss": -24.921873092651367, "global_step": 273367, "epoch": 3293} {"train_loss": -25.47464370727539, "global_step": 273368, "epoch": 3293} {"train_loss": -25.25079345703125, "global_step": 273369, "epoch": 3293} {"train_loss": -25.35262680053711, "global_step": 273370, "epoch": 3293} {"train_loss": -25.247255325317383, "global_step": 273371, "epoch": 3293} {"train_loss": -25.645048141479492, "global_step": 273372, "epoch": 3293} {"train_loss": -25.400617599487305, "global_step": 273373, "epoch": 3293} {"train_loss": -25.52512550354004, "global_step": 273374, "epoch": 3293} {"train_loss": -25.94923210144043, "global_step": 273375, "epoch": 3293} {"train_loss": -25.303678512573242, "global_step": 273376, "epoch": 3293} {"train_loss": -25.407859802246094, "global_step": 273377, "epoch": 3293} {"train_loss": -25.58146858215332, "global_step": 273378, "epoch": 3293} {"train_loss": -25.3093318939209, "global_step": 273379, "epoch": 3293} {"train_loss": -25.651142120361328, "global_step": 273380, "epoch": 3293} {"train_loss": -25.392560958862305, "global_step": 273381, "epoch": 3293} {"train_loss": -25.598052978515625, "global_step": 273382, "epoch": 3293} {"train_loss": -25.165197372436523, "global_step": 273383, "epoch": 3293} {"train_loss": -24.70881462097168, "global_step": 273384, "epoch": 3293} {"train_loss": -24.74552345275879, "global_step": 273385, "epoch": 3293} {"train_loss": -24.814111709594727, "global_step": 273386, "epoch": 3293} {"train_loss": -24.9593563079834, "global_step": 273387, "epoch": 3293} {"train_loss": -25.7005615234375, "global_step": 273388, "epoch": 3293} {"train_loss": -25.1650447845459, "global_step": 273389, "epoch": 3293} {"train_loss": -25.485692977905273, "global_step": 273390, "epoch": 3293} {"train_loss": -25.042022705078125, "global_step": 273391, "epoch": 3293} {"train_loss": -25.473047256469727, "global_step": 273392, "epoch": 3293} {"train_loss": -25.18581199645996, "global_step": 273393, "epoch": 3293} {"train_loss": -25.527790069580078, "global_step": 273394, "epoch": 3293} {"train_loss": -25.211889266967773, "global_step": 273395, "epoch": 3293} {"train_loss": -25.57187843322754, "global_step": 273396, "epoch": 3293} {"train_loss": -25.44584083557129, "global_step": 273397, "epoch": 3293} {"train_loss": -25.338342666625977, "global_step": 273398, "epoch": 3293} {"train_loss": -24.96161460876465, "global_step": 273399, "epoch": 3293} {"train_loss": -25.4967098236084, "global_step": 273400, "epoch": 3293} {"train_loss": -25.267533221876764, "global_step": 273401, "epoch": 3293, "val_loss": 7093894.0} {"train_loss": -24.826358795166016, "global_step": 273402, "epoch": 3294} {"train_loss": -25.31742286682129, "global_step": 273403, "epoch": 3294} {"train_loss": -24.915555953979492, "global_step": 273404, "epoch": 3294} {"train_loss": -25.266611099243164, "global_step": 273405, "epoch": 3294} {"train_loss": -24.707698822021484, "global_step": 273406, "epoch": 3294} {"train_loss": -24.75687599182129, "global_step": 273407, "epoch": 3294} {"train_loss": -24.793195724487305, "global_step": 273408, "epoch": 3294} {"train_loss": -25.005613327026367, "global_step": 273409, "epoch": 3294} {"train_loss": -24.72993278503418, "global_step": 273410, "epoch": 3294} {"train_loss": -25.192747116088867, "global_step": 273411, "epoch": 3294} {"train_loss": -24.88063621520996, "global_step": 273412, "epoch": 3294} {"train_loss": -25.13309669494629, "global_step": 273413, "epoch": 3294} {"train_loss": -25.059444427490234, "global_step": 273414, "epoch": 3294} {"train_loss": -24.906888961791992, "global_step": 273415, "epoch": 3294} {"train_loss": -25.24006462097168, "global_step": 273416, "epoch": 3294} {"train_loss": -25.30948829650879, "global_step": 273417, "epoch": 3294} {"train_loss": -25.174442291259766, "global_step": 273418, "epoch": 3294} {"train_loss": -24.905309677124023, "global_step": 273419, "epoch": 3294} {"train_loss": -25.210155487060547, "global_step": 273420, "epoch": 3294} {"train_loss": -25.06852149963379, "global_step": 273421, "epoch": 3294} {"train_loss": -25.147994995117188, "global_step": 273422, "epoch": 3294} {"train_loss": -25.272991180419922, "global_step": 273423, "epoch": 3294} {"train_loss": -25.062292098999023, "global_step": 273424, "epoch": 3294} {"train_loss": -25.307573318481445, "global_step": 273425, "epoch": 3294} {"train_loss": -25.024860382080078, "global_step": 273426, "epoch": 3294} {"train_loss": -25.027963638305664, "global_step": 273427, "epoch": 3294} {"train_loss": -25.398975372314453, "global_step": 273428, "epoch": 3294} {"train_loss": -24.98936653137207, "global_step": 273429, "epoch": 3294} {"train_loss": -25.45258140563965, "global_step": 273430, "epoch": 3294} {"train_loss": -25.136716842651367, "global_step": 273431, "epoch": 3294} {"train_loss": -25.40455436706543, "global_step": 273432, "epoch": 3294} {"train_loss": -24.913671493530273, "global_step": 273433, "epoch": 3294} {"train_loss": -24.973613739013672, "global_step": 273434, "epoch": 3294} {"train_loss": -25.448774337768555, "global_step": 273435, "epoch": 3294} {"train_loss": -25.277952194213867, "global_step": 273436, "epoch": 3294} {"train_loss": -25.271411895751953, "global_step": 273437, "epoch": 3294} {"train_loss": -24.89401626586914, "global_step": 273438, "epoch": 3294} {"train_loss": -25.51419448852539, "global_step": 273439, "epoch": 3294} {"train_loss": -24.944976806640625, "global_step": 273440, "epoch": 3294} {"train_loss": -25.308439254760742, "global_step": 273441, "epoch": 3294} {"train_loss": -25.408849716186523, "global_step": 273442, "epoch": 3294} {"train_loss": -25.14688491821289, "global_step": 273443, "epoch": 3294} {"train_loss": -24.856950759887695, "global_step": 273444, "epoch": 3294} {"train_loss": -25.803998947143555, "global_step": 273445, "epoch": 3294} {"train_loss": -25.578733444213867, "global_step": 273446, "epoch": 3294} {"train_loss": -25.361568450927734, "global_step": 273447, "epoch": 3294} {"train_loss": -25.54359245300293, "global_step": 273448, "epoch": 3294} {"train_loss": -25.1063175201416, "global_step": 273449, "epoch": 3294} {"train_loss": -25.16718864440918, "global_step": 273450, "epoch": 3294} {"train_loss": -25.25482940673828, "global_step": 273451, "epoch": 3294} {"train_loss": -25.262826919555664, "global_step": 273452, "epoch": 3294} {"train_loss": -25.43565559387207, "global_step": 273453, "epoch": 3294} {"train_loss": -25.612979888916016, "global_step": 273454, "epoch": 3294} {"train_loss": -25.381046295166016, "global_step": 273455, "epoch": 3294} {"train_loss": -25.280487060546875, "global_step": 273456, "epoch": 3294} {"train_loss": -25.59320640563965, "global_step": 273457, "epoch": 3294} {"train_loss": -25.389150619506836, "global_step": 273458, "epoch": 3294} {"train_loss": -25.568267822265625, "global_step": 273459, "epoch": 3294} {"train_loss": -25.330778121948242, "global_step": 273460, "epoch": 3294} {"train_loss": -25.331491470336914, "global_step": 273461, "epoch": 3294} {"train_loss": -25.165807723999023, "global_step": 273462, "epoch": 3294} {"train_loss": -25.6246280670166, "global_step": 273463, "epoch": 3294} {"train_loss": -25.393539428710938, "global_step": 273464, "epoch": 3294} {"train_loss": -25.752771377563477, "global_step": 273465, "epoch": 3294} {"train_loss": -25.455862045288086, "global_step": 273466, "epoch": 3294} {"train_loss": -25.175159454345703, "global_step": 273467, "epoch": 3294} {"train_loss": -25.50136375427246, "global_step": 273468, "epoch": 3294} {"train_loss": -25.712400436401367, "global_step": 273469, "epoch": 3294} {"train_loss": -25.62327003479004, "global_step": 273470, "epoch": 3294} {"train_loss": -25.13921356201172, "global_step": 273471, "epoch": 3294} {"train_loss": -25.27651596069336, "global_step": 273472, "epoch": 3294} {"train_loss": -25.900409698486328, "global_step": 273473, "epoch": 3294} {"train_loss": -25.526941299438477, "global_step": 273474, "epoch": 3294} {"train_loss": -25.420507431030273, "global_step": 273475, "epoch": 3294} {"train_loss": -25.37355613708496, "global_step": 273476, "epoch": 3294} {"train_loss": -25.432558059692383, "global_step": 273477, "epoch": 3294} {"train_loss": -25.690475463867188, "global_step": 273478, "epoch": 3294} {"train_loss": -25.334928512573242, "global_step": 273479, "epoch": 3294} {"train_loss": -25.369565963745117, "global_step": 273480, "epoch": 3294} {"train_loss": -25.30366325378418, "global_step": 273481, "epoch": 3294} {"train_loss": -25.306243896484375, "global_step": 273482, "epoch": 3294} {"train_loss": -25.500558853149414, "global_step": 273483, "epoch": 3294} {"train_loss": -25.250971621777637, "global_step": 273484, "epoch": 3294, "val_loss": 7058397.0} {"train_loss": -24.790952682495117, "global_step": 273485, "epoch": 3295} {"train_loss": -24.202518463134766, "global_step": 273486, "epoch": 3295} {"train_loss": -23.517742156982422, "global_step": 273487, "epoch": 3295} {"train_loss": -24.48023796081543, "global_step": 273488, "epoch": 3295} {"train_loss": -24.29829978942871, "global_step": 273489, "epoch": 3295} {"train_loss": -24.75531768798828, "global_step": 273490, "epoch": 3295} {"train_loss": -24.663732528686523, "global_step": 273491, "epoch": 3295} {"train_loss": -24.65724754333496, "global_step": 273492, "epoch": 3295} {"train_loss": -24.703638076782227, "global_step": 273493, "epoch": 3295} {"train_loss": -25.06594467163086, "global_step": 273494, "epoch": 3295} {"train_loss": -24.807889938354492, "global_step": 273495, "epoch": 3295} {"train_loss": -24.773406982421875, "global_step": 273496, "epoch": 3295} {"train_loss": -24.965068817138672, "global_step": 273497, "epoch": 3295} {"train_loss": -24.439416885375977, "global_step": 273498, "epoch": 3295} {"train_loss": -24.720399856567383, "global_step": 273499, "epoch": 3295} {"train_loss": -24.737577438354492, "global_step": 273500, "epoch": 3295} {"train_loss": -24.499492645263672, "global_step": 273501, "epoch": 3295} {"train_loss": -24.81556510925293, "global_step": 273502, "epoch": 3295} {"train_loss": -24.735641479492188, "global_step": 273503, "epoch": 3295} {"train_loss": -25.17323112487793, "global_step": 273504, "epoch": 3295} {"train_loss": -24.948667526245117, "global_step": 273505, "epoch": 3295} {"train_loss": -24.721527099609375, "global_step": 273506, "epoch": 3295} {"train_loss": -24.706335067749023, "global_step": 273507, "epoch": 3295} {"train_loss": -24.89395523071289, "global_step": 273508, "epoch": 3295} {"train_loss": -24.91316795349121, "global_step": 273509, "epoch": 3295} {"train_loss": -25.101696014404297, "global_step": 273510, "epoch": 3295} {"train_loss": -24.813669204711914, "global_step": 273511, "epoch": 3295} {"train_loss": -25.245622634887695, "global_step": 273512, "epoch": 3295} {"train_loss": -25.24178123474121, "global_step": 273513, "epoch": 3295} {"train_loss": -25.491125106811523, "global_step": 273514, "epoch": 3295} {"train_loss": -25.197431564331055, "global_step": 273515, "epoch": 3295} {"train_loss": -25.44972038269043, "global_step": 273516, "epoch": 3295} {"train_loss": -25.22347068786621, "global_step": 273517, "epoch": 3295} {"train_loss": -25.772619247436523, "global_step": 273518, "epoch": 3295} {"train_loss": -25.2380428314209, "global_step": 273519, "epoch": 3295} {"train_loss": -25.581710815429688, "global_step": 273520, "epoch": 3295} {"train_loss": -25.61252784729004, "global_step": 273521, "epoch": 3295} {"train_loss": -25.627857208251953, "global_step": 273522, "epoch": 3295} {"train_loss": -25.425901412963867, "global_step": 273523, "epoch": 3295} {"train_loss": -25.417877197265625, "global_step": 273524, "epoch": 3295} {"train_loss": -25.141372680664062, "global_step": 273525, "epoch": 3295} {"train_loss": -25.415708541870117, "global_step": 273526, "epoch": 3295} {"train_loss": -25.636220932006836, "global_step": 273527, "epoch": 3295} {"train_loss": -24.912771224975586, "global_step": 273528, "epoch": 3295} {"train_loss": -24.92232322692871, "global_step": 273529, "epoch": 3295} {"train_loss": -25.20078468322754, "global_step": 273530, "epoch": 3295} {"train_loss": -25.37993812561035, "global_step": 273531, "epoch": 3295} {"train_loss": -25.492341995239258, "global_step": 273532, "epoch": 3295} {"train_loss": -25.709552764892578, "global_step": 273533, "epoch": 3295} {"train_loss": -25.4276123046875, "global_step": 273534, "epoch": 3295} {"train_loss": -25.1575927734375, "global_step": 273535, "epoch": 3295} {"train_loss": -25.209699630737305, "global_step": 273536, "epoch": 3295} {"train_loss": -25.386133193969727, "global_step": 273537, "epoch": 3295} {"train_loss": -25.25327491760254, "global_step": 273538, "epoch": 3295} {"train_loss": -25.576688766479492, "global_step": 273539, "epoch": 3295} {"train_loss": -25.56344985961914, "global_step": 273540, "epoch": 3295} {"train_loss": -25.294361114501953, "global_step": 273541, "epoch": 3295} {"train_loss": -25.395832061767578, "global_step": 273542, "epoch": 3295} {"train_loss": -25.238988876342773, "global_step": 273543, "epoch": 3295} {"train_loss": -25.558670043945312, "global_step": 273544, "epoch": 3295} {"train_loss": -25.480436325073242, "global_step": 273545, "epoch": 3295} {"train_loss": -25.517616271972656, "global_step": 273546, "epoch": 3295} {"train_loss": -25.796411514282227, "global_step": 273547, "epoch": 3295} {"train_loss": -25.41376495361328, "global_step": 273548, "epoch": 3295} {"train_loss": -25.36110496520996, "global_step": 273549, "epoch": 3295} {"train_loss": -25.525346755981445, "global_step": 273550, "epoch": 3295} {"train_loss": -25.41480827331543, "global_step": 273551, "epoch": 3295} {"train_loss": -25.036705017089844, "global_step": 273552, "epoch": 3295} {"train_loss": -25.306121826171875, "global_step": 273553, "epoch": 3295} {"train_loss": -25.30451011657715, "global_step": 273554, "epoch": 3295} {"train_loss": -25.498416900634766, "global_step": 273555, "epoch": 3295} {"train_loss": -25.293006896972656, "global_step": 273556, "epoch": 3295} {"train_loss": -25.11659812927246, "global_step": 273557, "epoch": 3295} {"train_loss": -25.404632568359375, "global_step": 273558, "epoch": 3295} {"train_loss": -25.617319107055664, "global_step": 273559, "epoch": 3295} {"train_loss": -25.35207176208496, "global_step": 273560, "epoch": 3295} {"train_loss": -25.28192710876465, "global_step": 273561, "epoch": 3295} {"train_loss": -25.54620361328125, "global_step": 273562, "epoch": 3295} {"train_loss": -25.153600692749023, "global_step": 273563, "epoch": 3295} {"train_loss": -25.45790672302246, "global_step": 273564, "epoch": 3295} {"train_loss": -25.49497413635254, "global_step": 273565, "epoch": 3295} {"train_loss": -25.236520767211914, "global_step": 273566, "epoch": 3295} {"train_loss": -25.17501994213426, "global_step": 273567, "epoch": 3295, "val_loss": 7042909.0} {"train_loss": -24.123010635375977, "global_step": 273568, "epoch": 3296} {"train_loss": -24.44462013244629, "global_step": 273569, "epoch": 3296} {"train_loss": -24.865652084350586, "global_step": 273570, "epoch": 3296} {"train_loss": -24.557666778564453, "global_step": 273571, "epoch": 3296} {"train_loss": -24.21729850769043, "global_step": 273572, "epoch": 3296} {"train_loss": -24.302961349487305, "global_step": 273573, "epoch": 3296} {"train_loss": -24.257612228393555, "global_step": 273574, "epoch": 3296} {"train_loss": -24.40892219543457, "global_step": 273575, "epoch": 3296} {"train_loss": -24.431180953979492, "global_step": 273576, "epoch": 3296} {"train_loss": -24.522857666015625, "global_step": 273577, "epoch": 3296} {"train_loss": -24.383710861206055, "global_step": 273578, "epoch": 3296} {"train_loss": -24.871179580688477, "global_step": 273579, "epoch": 3296} {"train_loss": -24.177326202392578, "global_step": 273580, "epoch": 3296} {"train_loss": -24.961639404296875, "global_step": 273581, "epoch": 3296} {"train_loss": -24.868444442749023, "global_step": 273582, "epoch": 3296} {"train_loss": -24.676597595214844, "global_step": 273583, "epoch": 3296} {"train_loss": -24.620590209960938, "global_step": 273584, "epoch": 3296} {"train_loss": -24.636178970336914, "global_step": 273585, "epoch": 3296} {"train_loss": -24.938949584960938, "global_step": 273586, "epoch": 3296} {"train_loss": -24.912410736083984, "global_step": 273587, "epoch": 3296} {"train_loss": -24.803966522216797, "global_step": 273588, "epoch": 3296} {"train_loss": -25.140321731567383, "global_step": 273589, "epoch": 3296} {"train_loss": -24.86610221862793, "global_step": 273590, "epoch": 3296} {"train_loss": -24.974178314208984, "global_step": 273591, "epoch": 3296} {"train_loss": -25.138940811157227, "global_step": 273592, "epoch": 3296} {"train_loss": -24.881072998046875, "global_step": 273593, "epoch": 3296} {"train_loss": -25.223630905151367, "global_step": 273594, "epoch": 3296} {"train_loss": -25.151233673095703, "global_step": 273595, "epoch": 3296} {"train_loss": -24.88315773010254, "global_step": 273596, "epoch": 3296} {"train_loss": -24.86948585510254, "global_step": 273597, "epoch": 3296} {"train_loss": -25.214933395385742, "global_step": 273598, "epoch": 3296} {"train_loss": -25.279319763183594, "global_step": 273599, "epoch": 3296} {"train_loss": -25.36006736755371, "global_step": 273600, "epoch": 3296} {"train_loss": -25.3350772857666, "global_step": 273601, "epoch": 3296} {"train_loss": -25.196035385131836, "global_step": 273602, "epoch": 3296} {"train_loss": -25.2227725982666, "global_step": 273603, "epoch": 3296} {"train_loss": -25.136728286743164, "global_step": 273604, "epoch": 3296} {"train_loss": -25.282808303833008, "global_step": 273605, "epoch": 3296} {"train_loss": -25.265897750854492, "global_step": 273606, "epoch": 3296} {"train_loss": -25.397972106933594, "global_step": 273607, "epoch": 3296} {"train_loss": -24.951379776000977, "global_step": 273608, "epoch": 3296} {"train_loss": -25.337717056274414, "global_step": 273609, "epoch": 3296} {"train_loss": -25.419958114624023, "global_step": 273610, "epoch": 3296} {"train_loss": -25.16092872619629, "global_step": 273611, "epoch": 3296} {"train_loss": -25.473344802856445, "global_step": 273612, "epoch": 3296} {"train_loss": -25.373977661132812, "global_step": 273613, "epoch": 3296} {"train_loss": -25.536426544189453, "global_step": 273614, "epoch": 3296} {"train_loss": -25.542835235595703, "global_step": 273615, "epoch": 3296} {"train_loss": -25.429731369018555, "global_step": 273616, "epoch": 3296} {"train_loss": -25.10271644592285, "global_step": 273617, "epoch": 3296} {"train_loss": -25.575855255126953, "global_step": 273618, "epoch": 3296} {"train_loss": -25.626190185546875, "global_step": 273619, "epoch": 3296} {"train_loss": -25.29070281982422, "global_step": 273620, "epoch": 3296} {"train_loss": -24.953275680541992, "global_step": 273621, "epoch": 3296} {"train_loss": -25.50701904296875, "global_step": 273622, "epoch": 3296} {"train_loss": -25.443506240844727, "global_step": 273623, "epoch": 3296} {"train_loss": -25.487619400024414, "global_step": 273624, "epoch": 3296} {"train_loss": -25.215862274169922, "global_step": 273625, "epoch": 3296} {"train_loss": -25.103967666625977, "global_step": 273626, "epoch": 3296} {"train_loss": -25.226783752441406, "global_step": 273627, "epoch": 3296} {"train_loss": -25.297351837158203, "global_step": 273628, "epoch": 3296} {"train_loss": -25.087726593017578, "global_step": 273629, "epoch": 3296} {"train_loss": -25.588043212890625, "global_step": 273630, "epoch": 3296} {"train_loss": -25.546422958374023, "global_step": 273631, "epoch": 3296} {"train_loss": -25.1632080078125, "global_step": 273632, "epoch": 3296} {"train_loss": -25.26704978942871, "global_step": 273633, "epoch": 3296} {"train_loss": -25.9902400970459, "global_step": 273634, "epoch": 3296} {"train_loss": -25.3242244720459, "global_step": 273635, "epoch": 3296} {"train_loss": -25.389448165893555, "global_step": 273636, "epoch": 3296} {"train_loss": -24.961910247802734, "global_step": 273637, "epoch": 3296} {"train_loss": -25.324583053588867, "global_step": 273638, "epoch": 3296} {"train_loss": -25.519079208374023, "global_step": 273639, "epoch": 3296} {"train_loss": -25.305322647094727, "global_step": 273640, "epoch": 3296} {"train_loss": -25.594680786132812, "global_step": 273641, "epoch": 3296} {"train_loss": -25.421207427978516, "global_step": 273642, "epoch": 3296} {"train_loss": -25.351116180419922, "global_step": 273643, "epoch": 3296} {"train_loss": -25.276168823242188, "global_step": 273644, "epoch": 3296} {"train_loss": -25.363866806030273, "global_step": 273645, "epoch": 3296} {"train_loss": -25.194669723510742, "global_step": 273646, "epoch": 3296} {"train_loss": -25.868528366088867, "global_step": 273647, "epoch": 3296} {"train_loss": -25.16654396057129, "global_step": 273648, "epoch": 3296} {"train_loss": -25.44601058959961, "global_step": 273649, "epoch": 3296} {"train_loss": -25.113236369856867, "global_step": 273650, "epoch": 3296, "val_loss": 6983117.0} {"train_loss": -25.27803611755371, "global_step": 273651, "epoch": 3297} {"train_loss": -24.373416900634766, "global_step": 273652, "epoch": 3297} {"train_loss": -24.344802856445312, "global_step": 273653, "epoch": 3297} {"train_loss": -24.92896842956543, "global_step": 273654, "epoch": 3297} {"train_loss": -25.07558250427246, "global_step": 273655, "epoch": 3297} {"train_loss": -24.68665885925293, "global_step": 273656, "epoch": 3297} {"train_loss": -25.0568790435791, "global_step": 273657, "epoch": 3297} {"train_loss": -25.039587020874023, "global_step": 273658, "epoch": 3297} {"train_loss": -24.359722137451172, "global_step": 273659, "epoch": 3297} {"train_loss": -24.919586181640625, "global_step": 273660, "epoch": 3297} {"train_loss": -25.16883087158203, "global_step": 273661, "epoch": 3297} {"train_loss": -24.899808883666992, "global_step": 273662, "epoch": 3297} {"train_loss": -24.578643798828125, "global_step": 273663, "epoch": 3297} {"train_loss": -25.52669334411621, "global_step": 273664, "epoch": 3297} {"train_loss": -24.788171768188477, "global_step": 273665, "epoch": 3297} {"train_loss": -25.04665184020996, "global_step": 273666, "epoch": 3297} {"train_loss": -25.019271850585938, "global_step": 273667, "epoch": 3297} {"train_loss": -25.128259658813477, "global_step": 273668, "epoch": 3297} {"train_loss": -25.159902572631836, "global_step": 273669, "epoch": 3297} {"train_loss": -24.89386558532715, "global_step": 273670, "epoch": 3297} {"train_loss": -24.93914794921875, "global_step": 273671, "epoch": 3297} {"train_loss": -24.446203231811523, "global_step": 273672, "epoch": 3297} {"train_loss": -25.054174423217773, "global_step": 273673, "epoch": 3297} {"train_loss": -24.8677921295166, "global_step": 273674, "epoch": 3297} {"train_loss": -25.225549697875977, "global_step": 273675, "epoch": 3297} {"train_loss": -24.90904998779297, "global_step": 273676, "epoch": 3297} {"train_loss": -25.142454147338867, "global_step": 273677, "epoch": 3297} {"train_loss": -25.30738067626953, "global_step": 273678, "epoch": 3297} {"train_loss": -25.20447540283203, "global_step": 273679, "epoch": 3297} {"train_loss": -25.006261825561523, "global_step": 273680, "epoch": 3297} {"train_loss": -24.991025924682617, "global_step": 273681, "epoch": 3297} {"train_loss": -25.042882919311523, "global_step": 273682, "epoch": 3297} {"train_loss": -25.231651306152344, "global_step": 273683, "epoch": 3297} {"train_loss": -25.10505485534668, "global_step": 273684, "epoch": 3297} {"train_loss": -25.575719833374023, "global_step": 273685, "epoch": 3297} {"train_loss": -25.350757598876953, "global_step": 273686, "epoch": 3297} {"train_loss": -25.47804069519043, "global_step": 273687, "epoch": 3297} {"train_loss": -25.460460662841797, "global_step": 273688, "epoch": 3297} {"train_loss": -24.91867446899414, "global_step": 273689, "epoch": 3297} {"train_loss": -24.97372817993164, "global_step": 273690, "epoch": 3297} {"train_loss": -25.154590606689453, "global_step": 273691, "epoch": 3297} {"train_loss": -25.202829360961914, "global_step": 273692, "epoch": 3297} {"train_loss": -25.31817626953125, "global_step": 273693, "epoch": 3297} {"train_loss": -25.37205696105957, "global_step": 273694, "epoch": 3297} {"train_loss": -25.34496307373047, "global_step": 273695, "epoch": 3297} {"train_loss": -25.569049835205078, "global_step": 273696, "epoch": 3297} {"train_loss": -25.406736373901367, "global_step": 273697, "epoch": 3297} {"train_loss": -25.2990665435791, "global_step": 273698, "epoch": 3297} {"train_loss": -25.411544799804688, "global_step": 273699, "epoch": 3297} {"train_loss": -25.380868911743164, "global_step": 273700, "epoch": 3297} {"train_loss": -25.59018325805664, "global_step": 273701, "epoch": 3297} {"train_loss": -24.99026107788086, "global_step": 273702, "epoch": 3297} {"train_loss": -25.097396850585938, "global_step": 273703, "epoch": 3297} {"train_loss": -25.44679832458496, "global_step": 273704, "epoch": 3297} {"train_loss": -25.25374984741211, "global_step": 273705, "epoch": 3297} {"train_loss": -25.521997451782227, "global_step": 273706, "epoch": 3297} {"train_loss": -25.19424819946289, "global_step": 273707, "epoch": 3297} {"train_loss": -25.76482582092285, "global_step": 273708, "epoch": 3297} {"train_loss": -25.37028694152832, "global_step": 273709, "epoch": 3297} {"train_loss": -25.382553100585938, "global_step": 273710, "epoch": 3297} {"train_loss": -25.459842681884766, "global_step": 273711, "epoch": 3297} {"train_loss": -25.62264060974121, "global_step": 273712, "epoch": 3297} {"train_loss": -24.922250747680664, "global_step": 273713, "epoch": 3297} {"train_loss": -25.40645408630371, "global_step": 273714, "epoch": 3297} {"train_loss": -25.190025329589844, "global_step": 273715, "epoch": 3297} {"train_loss": -25.432554244995117, "global_step": 273716, "epoch": 3297} {"train_loss": -24.78182029724121, "global_step": 273717, "epoch": 3297} {"train_loss": -24.89470863342285, "global_step": 273718, "epoch": 3297} {"train_loss": -24.820064544677734, "global_step": 273719, "epoch": 3297} {"train_loss": -24.98348617553711, "global_step": 273720, "epoch": 3297} {"train_loss": -24.642486572265625, "global_step": 273721, "epoch": 3297} {"train_loss": -24.6679744720459, "global_step": 273722, "epoch": 3297} {"train_loss": -25.30120086669922, "global_step": 273723, "epoch": 3297} {"train_loss": -25.19455909729004, "global_step": 273724, "epoch": 3297} {"train_loss": -25.279010772705078, "global_step": 273725, "epoch": 3297} {"train_loss": -25.228931427001953, "global_step": 273726, "epoch": 3297} {"train_loss": -25.365238189697266, "global_step": 273727, "epoch": 3297} {"train_loss": -25.206087112426758, "global_step": 273728, "epoch": 3297} {"train_loss": -25.45182228088379, "global_step": 273729, "epoch": 3297} {"train_loss": -25.40641975402832, "global_step": 273730, "epoch": 3297} {"train_loss": -24.961408615112305, "global_step": 273731, "epoch": 3297} {"train_loss": -25.51496124267578, "global_step": 273732, "epoch": 3297} {"train_loss": -25.13728560022561, "global_step": 273733, "epoch": 3297, "val_loss": 6865960.5} {"train_loss": -24.24774742126465, "global_step": 273734, "epoch": 3298} {"train_loss": -24.881637573242188, "global_step": 273735, "epoch": 3298} {"train_loss": -24.19439697265625, "global_step": 273736, "epoch": 3298} {"train_loss": -24.574268341064453, "global_step": 273737, "epoch": 3298} {"train_loss": -24.351886749267578, "global_step": 273738, "epoch": 3298} {"train_loss": -24.24405288696289, "global_step": 273739, "epoch": 3298} {"train_loss": -24.249469757080078, "global_step": 273740, "epoch": 3298} {"train_loss": -24.759889602661133, "global_step": 273741, "epoch": 3298} {"train_loss": -24.37381362915039, "global_step": 273742, "epoch": 3298} {"train_loss": -24.290515899658203, "global_step": 273743, "epoch": 3298} {"train_loss": -24.366168975830078, "global_step": 273744, "epoch": 3298} {"train_loss": -24.6184024810791, "global_step": 273745, "epoch": 3298} {"train_loss": -24.72177505493164, "global_step": 273746, "epoch": 3298} {"train_loss": -24.65791130065918, "global_step": 273747, "epoch": 3298} {"train_loss": -24.91355323791504, "global_step": 273748, "epoch": 3298} {"train_loss": -24.878435134887695, "global_step": 273749, "epoch": 3298} {"train_loss": -24.97364616394043, "global_step": 273750, "epoch": 3298} {"train_loss": -24.850919723510742, "global_step": 273751, "epoch": 3298} {"train_loss": -24.864173889160156, "global_step": 273752, "epoch": 3298} {"train_loss": -24.941858291625977, "global_step": 273753, "epoch": 3298} {"train_loss": -24.833192825317383, "global_step": 273754, "epoch": 3298} {"train_loss": -24.860612869262695, "global_step": 273755, "epoch": 3298} {"train_loss": -25.317981719970703, "global_step": 273756, "epoch": 3298} {"train_loss": -25.15822410583496, "global_step": 273757, "epoch": 3298} {"train_loss": -25.112783432006836, "global_step": 273758, "epoch": 3298} {"train_loss": -25.176111221313477, "global_step": 273759, "epoch": 3298} {"train_loss": -25.160329818725586, "global_step": 273760, "epoch": 3298} {"train_loss": -24.94552993774414, "global_step": 273761, "epoch": 3298} {"train_loss": -25.185304641723633, "global_step": 273762, "epoch": 3298} {"train_loss": -25.13125991821289, "global_step": 273763, "epoch": 3298} {"train_loss": -25.311080932617188, "global_step": 273764, "epoch": 3298} {"train_loss": -25.32525062561035, "global_step": 273765, "epoch": 3298} {"train_loss": -24.734012603759766, "global_step": 273766, "epoch": 3298} {"train_loss": -25.19038200378418, "global_step": 273767, "epoch": 3298} {"train_loss": -25.188446044921875, "global_step": 273768, "epoch": 3298} {"train_loss": -25.16147804260254, "global_step": 273769, "epoch": 3298} {"train_loss": -25.26775550842285, "global_step": 273770, "epoch": 3298} {"train_loss": -25.239370346069336, "global_step": 273771, "epoch": 3298} {"train_loss": -25.259199142456055, "global_step": 273772, "epoch": 3298} {"train_loss": -25.42011070251465, "global_step": 273773, "epoch": 3298} {"train_loss": -25.66629409790039, "global_step": 273774, "epoch": 3298} {"train_loss": -25.346363067626953, "global_step": 273775, "epoch": 3298} {"train_loss": -25.39585304260254, "global_step": 273776, "epoch": 3298} {"train_loss": -25.34804344177246, "global_step": 273777, "epoch": 3298} {"train_loss": -25.320459365844727, "global_step": 273778, "epoch": 3298} {"train_loss": -25.6228084564209, "global_step": 273779, "epoch": 3298} {"train_loss": -25.320663452148438, "global_step": 273780, "epoch": 3298} {"train_loss": -25.7320613861084, "global_step": 273781, "epoch": 3298} {"train_loss": -25.521739959716797, "global_step": 273782, "epoch": 3298} {"train_loss": -25.359661102294922, "global_step": 273783, "epoch": 3298} {"train_loss": -25.473447799682617, "global_step": 273784, "epoch": 3298} {"train_loss": -25.594833374023438, "global_step": 273785, "epoch": 3298} {"train_loss": -25.726062774658203, "global_step": 273786, "epoch": 3298} {"train_loss": -25.198083877563477, "global_step": 273787, "epoch": 3298} {"train_loss": -25.50566291809082, "global_step": 273788, "epoch": 3298} {"train_loss": -25.594058990478516, "global_step": 273789, "epoch": 3298} {"train_loss": -25.656457901000977, "global_step": 273790, "epoch": 3298} {"train_loss": -25.6766300201416, "global_step": 273791, "epoch": 3298} {"train_loss": -25.64857292175293, "global_step": 273792, "epoch": 3298} {"train_loss": -25.335575103759766, "global_step": 273793, "epoch": 3298} {"train_loss": -25.791259765625, "global_step": 273794, "epoch": 3298} {"train_loss": -25.95191764831543, "global_step": 273795, "epoch": 3298} {"train_loss": -25.463287353515625, "global_step": 273796, "epoch": 3298} {"train_loss": -25.10004997253418, "global_step": 273797, "epoch": 3298} {"train_loss": -25.42486000061035, "global_step": 273798, "epoch": 3298} {"train_loss": -25.526334762573242, "global_step": 273799, "epoch": 3298} {"train_loss": -25.260644912719727, "global_step": 273800, "epoch": 3298} {"train_loss": -25.651891708374023, "global_step": 273801, "epoch": 3298} {"train_loss": -25.440481185913086, "global_step": 273802, "epoch": 3298} {"train_loss": -25.30183219909668, "global_step": 273803, "epoch": 3298} {"train_loss": -25.481163024902344, "global_step": 273804, "epoch": 3298} {"train_loss": -25.75945472717285, "global_step": 273805, "epoch": 3298} {"train_loss": -25.305986404418945, "global_step": 273806, "epoch": 3298} {"train_loss": -25.259180068969727, "global_step": 273807, "epoch": 3298} {"train_loss": -25.093379974365234, "global_step": 273808, "epoch": 3298} {"train_loss": -25.289968490600586, "global_step": 273809, "epoch": 3298} {"train_loss": -25.649642944335938, "global_step": 273810, "epoch": 3298} {"train_loss": -25.773340225219727, "global_step": 273811, "epoch": 3298} {"train_loss": -25.451345443725586, "global_step": 273812, "epoch": 3298} {"train_loss": -25.357511520385742, "global_step": 273813, "epoch": 3298} {"train_loss": -25.37008285522461, "global_step": 273814, "epoch": 3298} {"train_loss": -25.5496768951416, "global_step": 273815, "epoch": 3298} {"train_loss": -25.18254714414298, "global_step": 273816, "epoch": 3298, "val_loss": 7006520.5} {"train_loss": -24.634048461914062, "global_step": 273817, "epoch": 3299} {"train_loss": -24.42683219909668, "global_step": 273818, "epoch": 3299} {"train_loss": -24.508243560791016, "global_step": 273819, "epoch": 3299} {"train_loss": -24.207395553588867, "global_step": 273820, "epoch": 3299} {"train_loss": -24.82326316833496, "global_step": 273821, "epoch": 3299} {"train_loss": -24.486587524414062, "global_step": 273822, "epoch": 3299} {"train_loss": -24.85829734802246, "global_step": 273823, "epoch": 3299} {"train_loss": -24.323232650756836, "global_step": 273824, "epoch": 3299} {"train_loss": -24.382841110229492, "global_step": 273825, "epoch": 3299} {"train_loss": -24.748435974121094, "global_step": 273826, "epoch": 3299} {"train_loss": -25.08383560180664, "global_step": 273827, "epoch": 3299} {"train_loss": -24.78806495666504, "global_step": 273828, "epoch": 3299} {"train_loss": -24.637958526611328, "global_step": 273829, "epoch": 3299} {"train_loss": -24.70762062072754, "global_step": 273830, "epoch": 3299} {"train_loss": -24.577869415283203, "global_step": 273831, "epoch": 3299} {"train_loss": -24.861663818359375, "global_step": 273832, "epoch": 3299} {"train_loss": -24.424304962158203, "global_step": 273833, "epoch": 3299} {"train_loss": -25.33368492126465, "global_step": 273834, "epoch": 3299} {"train_loss": -25.224185943603516, "global_step": 273835, "epoch": 3299} {"train_loss": -25.194040298461914, "global_step": 273836, "epoch": 3299} {"train_loss": -25.064716339111328, "global_step": 273837, "epoch": 3299} {"train_loss": -24.866628646850586, "global_step": 273838, "epoch": 3299} {"train_loss": -24.98978614807129, "global_step": 273839, "epoch": 3299} {"train_loss": -25.14096450805664, "global_step": 273840, "epoch": 3299} {"train_loss": -24.803016662597656, "global_step": 273841, "epoch": 3299} {"train_loss": -25.33418083190918, "global_step": 273842, "epoch": 3299} {"train_loss": -25.5913143157959, "global_step": 273843, "epoch": 3299} {"train_loss": -25.184982299804688, "global_step": 273844, "epoch": 3299} {"train_loss": -25.15199851989746, "global_step": 273845, "epoch": 3299} {"train_loss": -25.452238082885742, "global_step": 273846, "epoch": 3299} {"train_loss": -25.16141128540039, "global_step": 273847, "epoch": 3299} {"train_loss": -25.212705612182617, "global_step": 273848, "epoch": 3299} {"train_loss": -25.464689254760742, "global_step": 273849, "epoch": 3299} {"train_loss": -25.691381454467773, "global_step": 273850, "epoch": 3299} {"train_loss": -25.40645408630371, "global_step": 273851, "epoch": 3299} {"train_loss": -25.436614990234375, "global_step": 273852, "epoch": 3299} {"train_loss": -25.50655174255371, "global_step": 273853, "epoch": 3299} {"train_loss": -25.828170776367188, "global_step": 273854, "epoch": 3299} {"train_loss": -25.16329002380371, "global_step": 273855, "epoch": 3299} {"train_loss": -25.737974166870117, "global_step": 273856, "epoch": 3299} {"train_loss": -25.490615844726562, "global_step": 273857, "epoch": 3299} {"train_loss": -25.2353515625, "global_step": 273858, "epoch": 3299} {"train_loss": -25.706693649291992, "global_step": 273859, "epoch": 3299} {"train_loss": -25.208505630493164, "global_step": 273860, "epoch": 3299} {"train_loss": -25.391340255737305, "global_step": 273861, "epoch": 3299} {"train_loss": -25.15403175354004, "global_step": 273862, "epoch": 3299} {"train_loss": -25.385601043701172, "global_step": 273863, "epoch": 3299} {"train_loss": -25.597959518432617, "global_step": 273864, "epoch": 3299} {"train_loss": -25.446226119995117, "global_step": 273865, "epoch": 3299} {"train_loss": -25.230466842651367, "global_step": 273866, "epoch": 3299} {"train_loss": -25.69437599182129, "global_step": 273867, "epoch": 3299} {"train_loss": -25.170154571533203, "global_step": 273868, "epoch": 3299} {"train_loss": -25.202123641967773, "global_step": 273869, "epoch": 3299} {"train_loss": -25.129934310913086, "global_step": 273870, "epoch": 3299} {"train_loss": -25.500762939453125, "global_step": 273871, "epoch": 3299} {"train_loss": -25.061445236206055, "global_step": 273872, "epoch": 3299} {"train_loss": -25.58208656311035, "global_step": 273873, "epoch": 3299} {"train_loss": -25.549715042114258, "global_step": 273874, "epoch": 3299} {"train_loss": -25.565845489501953, "global_step": 273875, "epoch": 3299} {"train_loss": -25.44622230529785, "global_step": 273876, "epoch": 3299} {"train_loss": -25.501331329345703, "global_step": 273877, "epoch": 3299} {"train_loss": -25.275470733642578, "global_step": 273878, "epoch": 3299} {"train_loss": -25.36163902282715, "global_step": 273879, "epoch": 3299} {"train_loss": -25.311750411987305, "global_step": 273880, "epoch": 3299} {"train_loss": -25.728857040405273, "global_step": 273881, "epoch": 3299} {"train_loss": -25.345462799072266, "global_step": 273882, "epoch": 3299} {"train_loss": -25.53639793395996, "global_step": 273883, "epoch": 3299} {"train_loss": -25.216712951660156, "global_step": 273884, "epoch": 3299} {"train_loss": -25.451915740966797, "global_step": 273885, "epoch": 3299} {"train_loss": -25.515043258666992, "global_step": 273886, "epoch": 3299} {"train_loss": -25.37411880493164, "global_step": 273887, "epoch": 3299} {"train_loss": -25.236665725708008, "global_step": 273888, "epoch": 3299} {"train_loss": -25.22780418395996, "global_step": 273889, "epoch": 3299} {"train_loss": -25.258024215698242, "global_step": 273890, "epoch": 3299} {"train_loss": -25.31608772277832, "global_step": 273891, "epoch": 3299} {"train_loss": -25.029157638549805, "global_step": 273892, "epoch": 3299} {"train_loss": -25.34798812866211, "global_step": 273893, "epoch": 3299} {"train_loss": -25.826648712158203, "global_step": 273894, "epoch": 3299} {"train_loss": -25.668912887573242, "global_step": 273895, "epoch": 3299} {"train_loss": -25.581186294555664, "global_step": 273896, "epoch": 3299} {"train_loss": -25.787084579467773, "global_step": 273897, "epoch": 3299} {"train_loss": -25.044654846191406, "global_step": 273898, "epoch": 3299} {"train_loss": -25.20412183095174, "global_step": 273899, "epoch": 3299, "val_loss": 7156637.0} {"train_loss": -22.709796905517578, "global_step": 273900, "epoch": 3300} {"train_loss": -24.131505966186523, "global_step": 273901, "epoch": 3300} {"train_loss": -24.212318420410156, "global_step": 273902, "epoch": 3300} {"train_loss": -22.708166122436523, "global_step": 273903, "epoch": 3300} {"train_loss": -24.566038131713867, "global_step": 273904, "epoch": 3300} {"train_loss": -23.42555046081543, "global_step": 273905, "epoch": 3300} {"train_loss": -24.41958236694336, "global_step": 273906, "epoch": 3300} {"train_loss": -24.66303062438965, "global_step": 273907, "epoch": 3300} {"train_loss": -24.253997802734375, "global_step": 273908, "epoch": 3300} {"train_loss": -24.930814743041992, "global_step": 273909, "epoch": 3300} {"train_loss": -24.58808708190918, "global_step": 273910, "epoch": 3300} {"train_loss": -24.11774253845215, "global_step": 273911, "epoch": 3300} {"train_loss": -24.46891975402832, "global_step": 273912, "epoch": 3300} {"train_loss": -24.189517974853516, "global_step": 273913, "epoch": 3300} {"train_loss": -24.51420021057129, "global_step": 273914, "epoch": 3300} {"train_loss": -24.441497802734375, "global_step": 273915, "epoch": 3300} {"train_loss": -24.34039878845215, "global_step": 273916, "epoch": 3300} {"train_loss": -24.204648971557617, "global_step": 273917, "epoch": 3300} {"train_loss": -24.890457153320312, "global_step": 273918, "epoch": 3300} {"train_loss": -24.773359298706055, "global_step": 273919, "epoch": 3300} {"train_loss": -24.1190185546875, "global_step": 273920, "epoch": 3300} {"train_loss": -24.616003036499023, "global_step": 273921, "epoch": 3300} {"train_loss": -24.927921295166016, "global_step": 273922, "epoch": 3300} {"train_loss": -24.672407150268555, "global_step": 273923, "epoch": 3300} {"train_loss": -25.161327362060547, "global_step": 273924, "epoch": 3300} {"train_loss": -24.703035354614258, "global_step": 273925, "epoch": 3300} {"train_loss": -25.06884765625, "global_step": 273926, "epoch": 3300} {"train_loss": -25.172760009765625, "global_step": 273927, "epoch": 3300} {"train_loss": -24.84100341796875, "global_step": 273928, "epoch": 3300} {"train_loss": -25.31148338317871, "global_step": 273929, "epoch": 3300} {"train_loss": -24.841413497924805, "global_step": 273930, "epoch": 3300} {"train_loss": -24.842105865478516, "global_step": 273931, "epoch": 3300} {"train_loss": -25.044448852539062, "global_step": 273932, "epoch": 3300} {"train_loss": -24.684045791625977, "global_step": 273933, "epoch": 3300} {"train_loss": -25.163076400756836, "global_step": 273934, "epoch": 3300} {"train_loss": -24.881452560424805, "global_step": 273935, "epoch": 3300} {"train_loss": -25.090499877929688, "global_step": 273936, "epoch": 3300} {"train_loss": -24.78766441345215, "global_step": 273937, "epoch": 3300} {"train_loss": -25.48475456237793, "global_step": 273938, "epoch": 3300} {"train_loss": -25.129026412963867, "global_step": 273939, "epoch": 3300} {"train_loss": -25.218236923217773, "global_step": 273940, "epoch": 3300} {"train_loss": -24.947895050048828, "global_step": 273941, "epoch": 3300} {"train_loss": -25.49637794494629, "global_step": 273942, "epoch": 3300} {"train_loss": -25.30451202392578, "global_step": 273943, "epoch": 3300} {"train_loss": -25.23369789123535, "global_step": 273944, "epoch": 3300} {"train_loss": -25.424985885620117, "global_step": 273945, "epoch": 3300} {"train_loss": -25.19774055480957, "global_step": 273946, "epoch": 3300} {"train_loss": -25.177968978881836, "global_step": 273947, "epoch": 3300} {"train_loss": -25.417192459106445, "global_step": 273948, "epoch": 3300} {"train_loss": -25.572921752929688, "global_step": 273949, "epoch": 3300} {"train_loss": -25.746164321899414, "global_step": 273950, "epoch": 3300} {"train_loss": -25.321470260620117, "global_step": 273951, "epoch": 3300} {"train_loss": -25.02298355102539, "global_step": 273952, "epoch": 3300} {"train_loss": -25.507747650146484, "global_step": 273953, "epoch": 3300} {"train_loss": -25.75995445251465, "global_step": 273954, "epoch": 3300} {"train_loss": -25.490612030029297, "global_step": 273955, "epoch": 3300} {"train_loss": -25.294116973876953, "global_step": 273956, "epoch": 3300} {"train_loss": -25.13468360900879, "global_step": 273957, "epoch": 3300} {"train_loss": -25.522785186767578, "global_step": 273958, "epoch": 3300} {"train_loss": -25.740278244018555, "global_step": 273959, "epoch": 3300} {"train_loss": -25.40995216369629, "global_step": 273960, "epoch": 3300} {"train_loss": -25.30179214477539, "global_step": 273961, "epoch": 3300} {"train_loss": -25.480304718017578, "global_step": 273962, "epoch": 3300} {"train_loss": -25.44440460205078, "global_step": 273963, "epoch": 3300} {"train_loss": -25.311052322387695, "global_step": 273964, "epoch": 3300} {"train_loss": -25.084247589111328, "global_step": 273965, "epoch": 3300} {"train_loss": -24.992429733276367, "global_step": 273966, "epoch": 3300} {"train_loss": -25.928327560424805, "global_step": 273967, "epoch": 3300} {"train_loss": -25.594831466674805, "global_step": 273968, "epoch": 3300} {"train_loss": -25.200172424316406, "global_step": 273969, "epoch": 3300} {"train_loss": -25.636194229125977, "global_step": 273970, "epoch": 3300} {"train_loss": -25.459135055541992, "global_step": 273971, "epoch": 3300} {"train_loss": -25.174381256103516, "global_step": 273972, "epoch": 3300} {"train_loss": -25.285978317260742, "global_step": 273973, "epoch": 3300} {"train_loss": -25.300573348999023, "global_step": 273974, "epoch": 3300} {"train_loss": -25.56337547302246, "global_step": 273975, "epoch": 3300} {"train_loss": -25.228986740112305, "global_step": 273976, "epoch": 3300} {"train_loss": -25.416839599609375, "global_step": 273977, "epoch": 3300} {"train_loss": -25.718061447143555, "global_step": 273978, "epoch": 3300} {"train_loss": -25.63679313659668, "global_step": 273979, "epoch": 3300} {"train_loss": -25.359481811523438, "global_step": 273980, "epoch": 3300} {"train_loss": -25.758127212524414, "global_step": 273981, "epoch": 3300} {"train_loss": -24.999653483011638, "global_step": 273982, "epoch": 3300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6960964.0} {"train_loss": -25.08904266357422, "global_step": 273983, "epoch": 3301} {"train_loss": -25.204071044921875, "global_step": 273984, "epoch": 3301} {"train_loss": -25.160768508911133, "global_step": 273985, "epoch": 3301} {"train_loss": -24.935911178588867, "global_step": 273986, "epoch": 3301} {"train_loss": -24.43330192565918, "global_step": 273987, "epoch": 3301} {"train_loss": -24.636180877685547, "global_step": 273988, "epoch": 3301} {"train_loss": -25.231830596923828, "global_step": 273989, "epoch": 3301} {"train_loss": -24.94917106628418, "global_step": 273990, "epoch": 3301} {"train_loss": -25.368192672729492, "global_step": 273991, "epoch": 3301} {"train_loss": -25.09267234802246, "global_step": 273992, "epoch": 3301} {"train_loss": -24.92682647705078, "global_step": 273993, "epoch": 3301} {"train_loss": -25.140453338623047, "global_step": 273994, "epoch": 3301} {"train_loss": -25.07193946838379, "global_step": 273995, "epoch": 3301} {"train_loss": -25.638885498046875, "global_step": 273996, "epoch": 3301} {"train_loss": -24.971115112304688, "global_step": 273997, "epoch": 3301} {"train_loss": -25.290021896362305, "global_step": 273998, "epoch": 3301} {"train_loss": -24.847562789916992, "global_step": 273999, "epoch": 3301} {"train_loss": -25.049428939819336, "global_step": 274000, "epoch": 3301} {"train_loss": -25.306318283081055, "global_step": 274001, "epoch": 3301} {"train_loss": -25.126523971557617, "global_step": 274002, "epoch": 3301} {"train_loss": -25.012130737304688, "global_step": 274003, "epoch": 3301} {"train_loss": -25.35868263244629, "global_step": 274004, "epoch": 3301} {"train_loss": -24.543190002441406, "global_step": 274005, "epoch": 3301} {"train_loss": -25.471498489379883, "global_step": 274006, "epoch": 3301} {"train_loss": -24.919198989868164, "global_step": 274007, "epoch": 3301} {"train_loss": -24.99047088623047, "global_step": 274008, "epoch": 3301} {"train_loss": -25.21352195739746, "global_step": 274009, "epoch": 3301} {"train_loss": -25.020341873168945, "global_step": 274010, "epoch": 3301} {"train_loss": -25.2232723236084, "global_step": 274011, "epoch": 3301} {"train_loss": -25.229238510131836, "global_step": 274012, "epoch": 3301} {"train_loss": -25.1735782623291, "global_step": 274013, "epoch": 3301} {"train_loss": -25.394302368164062, "global_step": 274014, "epoch": 3301} {"train_loss": -25.115549087524414, "global_step": 274015, "epoch": 3301} {"train_loss": -25.752288818359375, "global_step": 274016, "epoch": 3301} {"train_loss": -25.422147750854492, "global_step": 274017, "epoch": 3301} {"train_loss": -25.151830673217773, "global_step": 274018, "epoch": 3301} {"train_loss": -25.371978759765625, "global_step": 274019, "epoch": 3301} {"train_loss": -25.212953567504883, "global_step": 274020, "epoch": 3301} {"train_loss": -25.24100112915039, "global_step": 274021, "epoch": 3301} {"train_loss": -24.922550201416016, "global_step": 274022, "epoch": 3301} {"train_loss": -25.104068756103516, "global_step": 274023, "epoch": 3301} {"train_loss": -25.446481704711914, "global_step": 274024, "epoch": 3301} {"train_loss": -25.462787628173828, "global_step": 274025, "epoch": 3301} {"train_loss": -25.337053298950195, "global_step": 274026, "epoch": 3301} {"train_loss": -25.40156364440918, "global_step": 274027, "epoch": 3301} {"train_loss": -25.34222984313965, "global_step": 274028, "epoch": 3301} {"train_loss": -25.17719078063965, "global_step": 274029, "epoch": 3301} {"train_loss": -25.652402877807617, "global_step": 274030, "epoch": 3301} {"train_loss": -25.615522384643555, "global_step": 274031, "epoch": 3301} {"train_loss": -25.573463439941406, "global_step": 274032, "epoch": 3301} {"train_loss": -25.748579025268555, "global_step": 274033, "epoch": 3301} {"train_loss": -25.623319625854492, "global_step": 274034, "epoch": 3301} {"train_loss": -25.534839630126953, "global_step": 274035, "epoch": 3301} {"train_loss": -25.600753784179688, "global_step": 274036, "epoch": 3301} {"train_loss": -25.729108810424805, "global_step": 274037, "epoch": 3301} {"train_loss": -25.181915283203125, "global_step": 274038, "epoch": 3301} {"train_loss": -25.421157836914062, "global_step": 274039, "epoch": 3301} {"train_loss": -25.25520896911621, "global_step": 274040, "epoch": 3301} {"train_loss": -25.53632926940918, "global_step": 274041, "epoch": 3301} {"train_loss": -25.17005729675293, "global_step": 274042, "epoch": 3301} {"train_loss": -25.377790451049805, "global_step": 274043, "epoch": 3301} {"train_loss": -25.610523223876953, "global_step": 274044, "epoch": 3301} {"train_loss": -25.4166202545166, "global_step": 274045, "epoch": 3301} {"train_loss": -25.53951072692871, "global_step": 274046, "epoch": 3301} {"train_loss": -25.515413284301758, "global_step": 274047, "epoch": 3301} {"train_loss": -25.362192153930664, "global_step": 274048, "epoch": 3301} {"train_loss": -25.15921401977539, "global_step": 274049, "epoch": 3301} {"train_loss": -25.616809844970703, "global_step": 274050, "epoch": 3301} {"train_loss": -25.078277587890625, "global_step": 274051, "epoch": 3301} {"train_loss": -24.947376251220703, "global_step": 274052, "epoch": 3301} {"train_loss": -24.819433212280273, "global_step": 274053, "epoch": 3301} {"train_loss": -25.38905906677246, "global_step": 274054, "epoch": 3301} {"train_loss": -25.031478881835938, "global_step": 274055, "epoch": 3301} {"train_loss": -25.121429443359375, "global_step": 274056, "epoch": 3301} {"train_loss": -25.25630760192871, "global_step": 274057, "epoch": 3301} {"train_loss": -24.91933250427246, "global_step": 274058, "epoch": 3301} {"train_loss": -25.180906295776367, "global_step": 274059, "epoch": 3301} {"train_loss": -25.120105743408203, "global_step": 274060, "epoch": 3301} {"train_loss": -25.265625, "global_step": 274061, "epoch": 3301} {"train_loss": -25.4561824798584, "global_step": 274062, "epoch": 3301} {"train_loss": -25.409332275390625, "global_step": 274063, "epoch": 3301} {"train_loss": -25.29302406311035, "global_step": 274064, "epoch": 3301} {"train_loss": -25.237701301115106, "global_step": 274065, "epoch": 3301, "val_loss": 6902192.0} {"train_loss": -24.16983413696289, "global_step": 274066, "epoch": 3302} {"train_loss": -24.914011001586914, "global_step": 274067, "epoch": 3302} {"train_loss": -24.599897384643555, "global_step": 274068, "epoch": 3302} {"train_loss": -25.130197525024414, "global_step": 274069, "epoch": 3302} {"train_loss": -24.33438491821289, "global_step": 274070, "epoch": 3302} {"train_loss": -24.69851303100586, "global_step": 274071, "epoch": 3302} {"train_loss": -24.86942481994629, "global_step": 274072, "epoch": 3302} {"train_loss": -24.56829833984375, "global_step": 274073, "epoch": 3302} {"train_loss": -24.787710189819336, "global_step": 274074, "epoch": 3302} {"train_loss": -24.812122344970703, "global_step": 274075, "epoch": 3302} {"train_loss": -24.807233810424805, "global_step": 274076, "epoch": 3302} {"train_loss": -24.8609619140625, "global_step": 274077, "epoch": 3302} {"train_loss": -24.68008041381836, "global_step": 274078, "epoch": 3302} {"train_loss": -25.37731170654297, "global_step": 274079, "epoch": 3302} {"train_loss": -24.89382553100586, "global_step": 274080, "epoch": 3302} {"train_loss": -25.399572372436523, "global_step": 274081, "epoch": 3302} {"train_loss": -24.8758602142334, "global_step": 274082, "epoch": 3302} {"train_loss": -25.118223190307617, "global_step": 274083, "epoch": 3302} {"train_loss": -25.181501388549805, "global_step": 274084, "epoch": 3302} {"train_loss": -25.04530906677246, "global_step": 274085, "epoch": 3302} {"train_loss": -24.917585372924805, "global_step": 274086, "epoch": 3302} {"train_loss": -25.60208511352539, "global_step": 274087, "epoch": 3302} {"train_loss": -25.263792037963867, "global_step": 274088, "epoch": 3302} {"train_loss": -25.377124786376953, "global_step": 274089, "epoch": 3302} {"train_loss": -25.332761764526367, "global_step": 274090, "epoch": 3302} {"train_loss": -25.218616485595703, "global_step": 274091, "epoch": 3302} {"train_loss": -24.935361862182617, "global_step": 274092, "epoch": 3302} {"train_loss": -25.52707290649414, "global_step": 274093, "epoch": 3302} {"train_loss": -25.6081485748291, "global_step": 274094, "epoch": 3302} {"train_loss": -25.141637802124023, "global_step": 274095, "epoch": 3302} {"train_loss": -25.139257431030273, "global_step": 274096, "epoch": 3302} {"train_loss": -25.757476806640625, "global_step": 274097, "epoch": 3302} {"train_loss": -25.272663116455078, "global_step": 274098, "epoch": 3302} {"train_loss": -25.447010040283203, "global_step": 274099, "epoch": 3302} {"train_loss": -25.09771728515625, "global_step": 274100, "epoch": 3302} {"train_loss": -25.506059646606445, "global_step": 274101, "epoch": 3302} {"train_loss": -25.305288314819336, "global_step": 274102, "epoch": 3302} {"train_loss": -25.39423942565918, "global_step": 274103, "epoch": 3302} {"train_loss": -25.49948501586914, "global_step": 274104, "epoch": 3302} {"train_loss": -25.422597885131836, "global_step": 274105, "epoch": 3302} {"train_loss": -25.888940811157227, "global_step": 274106, "epoch": 3302} {"train_loss": -25.946014404296875, "global_step": 274107, "epoch": 3302} {"train_loss": -25.361438751220703, "global_step": 274108, "epoch": 3302} {"train_loss": -25.278188705444336, "global_step": 274109, "epoch": 3302} {"train_loss": -25.20539665222168, "global_step": 274110, "epoch": 3302} {"train_loss": -25.285940170288086, "global_step": 274111, "epoch": 3302} {"train_loss": -25.20360565185547, "global_step": 274112, "epoch": 3302} {"train_loss": -25.67083168029785, "global_step": 274113, "epoch": 3302} {"train_loss": -25.683490753173828, "global_step": 274114, "epoch": 3302} {"train_loss": -25.57140350341797, "global_step": 274115, "epoch": 3302} {"train_loss": -25.45313835144043, "global_step": 274116, "epoch": 3302} {"train_loss": -25.466266632080078, "global_step": 274117, "epoch": 3302} {"train_loss": -25.50333023071289, "global_step": 274118, "epoch": 3302} {"train_loss": -25.318286895751953, "global_step": 274119, "epoch": 3302} {"train_loss": -25.093793869018555, "global_step": 274120, "epoch": 3302} {"train_loss": -25.6114444732666, "global_step": 274121, "epoch": 3302} {"train_loss": -25.448078155517578, "global_step": 274122, "epoch": 3302} {"train_loss": -25.17704200744629, "global_step": 274123, "epoch": 3302} {"train_loss": -25.425411224365234, "global_step": 274124, "epoch": 3302} {"train_loss": -25.16046905517578, "global_step": 274125, "epoch": 3302} {"train_loss": -25.028766632080078, "global_step": 274126, "epoch": 3302} {"train_loss": -25.428756713867188, "global_step": 274127, "epoch": 3302} {"train_loss": -25.05952262878418, "global_step": 274128, "epoch": 3302} {"train_loss": -25.089895248413086, "global_step": 274129, "epoch": 3302} {"train_loss": -25.011442184448242, "global_step": 274130, "epoch": 3302} {"train_loss": -25.041915893554688, "global_step": 274131, "epoch": 3302} {"train_loss": -25.301029205322266, "global_step": 274132, "epoch": 3302} {"train_loss": -25.06333351135254, "global_step": 274133, "epoch": 3302} {"train_loss": -25.412221908569336, "global_step": 274134, "epoch": 3302} {"train_loss": -25.139570236206055, "global_step": 274135, "epoch": 3302} {"train_loss": -25.287755966186523, "global_step": 274136, "epoch": 3302} {"train_loss": -25.001089096069336, "global_step": 274137, "epoch": 3302} {"train_loss": -25.399518966674805, "global_step": 274138, "epoch": 3302} {"train_loss": -25.16475486755371, "global_step": 274139, "epoch": 3302} {"train_loss": -25.311492919921875, "global_step": 274140, "epoch": 3302} {"train_loss": -25.52025032043457, "global_step": 274141, "epoch": 3302} {"train_loss": -25.328420639038086, "global_step": 274142, "epoch": 3302} {"train_loss": -25.347583770751953, "global_step": 274143, "epoch": 3302} {"train_loss": -25.710859298706055, "global_step": 274144, "epoch": 3302} {"train_loss": -25.576757431030273, "global_step": 274145, "epoch": 3302} {"train_loss": -25.260679244995117, "global_step": 274146, "epoch": 3302} {"train_loss": -25.13516616821289, "global_step": 274147, "epoch": 3302} {"train_loss": -25.22704172708902, "global_step": 274148, "epoch": 3302, "val_loss": 7117239.0} {"train_loss": -24.316091537475586, "global_step": 274149, "epoch": 3303} {"train_loss": -24.672651290893555, "global_step": 274150, "epoch": 3303} {"train_loss": -24.666990280151367, "global_step": 274151, "epoch": 3303} {"train_loss": -24.488859176635742, "global_step": 274152, "epoch": 3303} {"train_loss": -24.335615158081055, "global_step": 274153, "epoch": 3303} {"train_loss": -24.83518409729004, "global_step": 274154, "epoch": 3303} {"train_loss": -24.569782257080078, "global_step": 274155, "epoch": 3303} {"train_loss": -24.66200828552246, "global_step": 274156, "epoch": 3303} {"train_loss": -25.011274337768555, "global_step": 274157, "epoch": 3303} {"train_loss": -24.361085891723633, "global_step": 274158, "epoch": 3303} {"train_loss": -24.92930793762207, "global_step": 274159, "epoch": 3303} {"train_loss": -24.829797744750977, "global_step": 274160, "epoch": 3303} {"train_loss": -24.572877883911133, "global_step": 274161, "epoch": 3303} {"train_loss": -24.656064987182617, "global_step": 274162, "epoch": 3303} {"train_loss": -25.086719512939453, "global_step": 274163, "epoch": 3303} {"train_loss": -25.153766632080078, "global_step": 274164, "epoch": 3303} {"train_loss": -24.739595413208008, "global_step": 274165, "epoch": 3303} {"train_loss": -25.008329391479492, "global_step": 274166, "epoch": 3303} {"train_loss": -24.66562843322754, "global_step": 274167, "epoch": 3303} {"train_loss": -24.91221046447754, "global_step": 274168, "epoch": 3303} {"train_loss": -25.199724197387695, "global_step": 274169, "epoch": 3303} {"train_loss": -25.05455207824707, "global_step": 274170, "epoch": 3303} {"train_loss": -25.318891525268555, "global_step": 274171, "epoch": 3303} {"train_loss": -25.486881256103516, "global_step": 274172, "epoch": 3303} {"train_loss": -24.911699295043945, "global_step": 274173, "epoch": 3303} {"train_loss": -25.41860008239746, "global_step": 274174, "epoch": 3303} {"train_loss": -25.123401641845703, "global_step": 274175, "epoch": 3303} {"train_loss": -24.88103485107422, "global_step": 274176, "epoch": 3303} {"train_loss": -25.26812744140625, "global_step": 274177, "epoch": 3303} {"train_loss": -25.201141357421875, "global_step": 274178, "epoch": 3303} {"train_loss": -25.036924362182617, "global_step": 274179, "epoch": 3303} {"train_loss": -25.25904083251953, "global_step": 274180, "epoch": 3303} {"train_loss": -25.50544548034668, "global_step": 274181, "epoch": 3303} {"train_loss": -25.821125030517578, "global_step": 274182, "epoch": 3303} {"train_loss": -25.635913848876953, "global_step": 274183, "epoch": 3303} {"train_loss": -25.53257942199707, "global_step": 274184, "epoch": 3303} {"train_loss": -25.41097068786621, "global_step": 274185, "epoch": 3303} {"train_loss": -25.480676651000977, "global_step": 274186, "epoch": 3303} {"train_loss": -25.288328170776367, "global_step": 274187, "epoch": 3303} {"train_loss": -25.67914390563965, "global_step": 274188, "epoch": 3303} {"train_loss": -24.9277400970459, "global_step": 274189, "epoch": 3303} {"train_loss": -25.865137100219727, "global_step": 274190, "epoch": 3303} {"train_loss": -25.49006462097168, "global_step": 274191, "epoch": 3303} {"train_loss": -25.33095359802246, "global_step": 274192, "epoch": 3303} {"train_loss": -25.719724655151367, "global_step": 274193, "epoch": 3303} {"train_loss": -25.781280517578125, "global_step": 274194, "epoch": 3303} {"train_loss": -25.501251220703125, "global_step": 274195, "epoch": 3303} {"train_loss": -25.16121482849121, "global_step": 274196, "epoch": 3303} {"train_loss": -25.45755386352539, "global_step": 274197, "epoch": 3303} {"train_loss": -25.43792724609375, "global_step": 274198, "epoch": 3303} {"train_loss": -25.74020767211914, "global_step": 274199, "epoch": 3303} {"train_loss": -25.311120986938477, "global_step": 274200, "epoch": 3303} {"train_loss": -25.5009822845459, "global_step": 274201, "epoch": 3303} {"train_loss": -25.74513053894043, "global_step": 274202, "epoch": 3303} {"train_loss": -25.433515548706055, "global_step": 274203, "epoch": 3303} {"train_loss": -25.32369041442871, "global_step": 274204, "epoch": 3303} {"train_loss": -25.37024688720703, "global_step": 274205, "epoch": 3303} {"train_loss": -25.439571380615234, "global_step": 274206, "epoch": 3303} {"train_loss": -25.258407592773438, "global_step": 274207, "epoch": 3303} {"train_loss": -25.283628463745117, "global_step": 274208, "epoch": 3303} {"train_loss": -25.2435359954834, "global_step": 274209, "epoch": 3303} {"train_loss": -24.899375915527344, "global_step": 274210, "epoch": 3303} {"train_loss": -25.699722290039062, "global_step": 274211, "epoch": 3303} {"train_loss": -25.351850509643555, "global_step": 274212, "epoch": 3303} {"train_loss": -25.040319442749023, "global_step": 274213, "epoch": 3303} {"train_loss": -25.351892471313477, "global_step": 274214, "epoch": 3303} {"train_loss": -25.41884422302246, "global_step": 274215, "epoch": 3303} {"train_loss": -25.23607063293457, "global_step": 274216, "epoch": 3303} {"train_loss": -25.259052276611328, "global_step": 274217, "epoch": 3303} {"train_loss": -25.366090774536133, "global_step": 274218, "epoch": 3303} {"train_loss": -25.355255126953125, "global_step": 274219, "epoch": 3303} {"train_loss": -25.08428382873535, "global_step": 274220, "epoch": 3303} {"train_loss": -25.265949249267578, "global_step": 274221, "epoch": 3303} {"train_loss": -25.289569854736328, "global_step": 274222, "epoch": 3303} {"train_loss": -25.431406021118164, "global_step": 274223, "epoch": 3303} {"train_loss": -25.03643035888672, "global_step": 274224, "epoch": 3303} {"train_loss": -25.124126434326172, "global_step": 274225, "epoch": 3303} {"train_loss": -25.240524291992188, "global_step": 274226, "epoch": 3303} {"train_loss": -25.485321044921875, "global_step": 274227, "epoch": 3303} {"train_loss": -25.510499954223633, "global_step": 274228, "epoch": 3303} {"train_loss": -25.475074768066406, "global_step": 274229, "epoch": 3303} {"train_loss": -25.16498374938965, "global_step": 274230, "epoch": 3303} {"train_loss": -25.194081157086842, "global_step": 274231, "epoch": 3303, "val_loss": 6992833.5} {"train_loss": -24.542560577392578, "global_step": 274232, "epoch": 3304} {"train_loss": -24.043109893798828, "global_step": 274233, "epoch": 3304} {"train_loss": -24.457962036132812, "global_step": 274234, "epoch": 3304} {"train_loss": -24.64765739440918, "global_step": 274235, "epoch": 3304} {"train_loss": -24.770721435546875, "global_step": 274236, "epoch": 3304} {"train_loss": -24.620075225830078, "global_step": 274237, "epoch": 3304} {"train_loss": -25.0988712310791, "global_step": 274238, "epoch": 3304} {"train_loss": -24.676359176635742, "global_step": 274239, "epoch": 3304} {"train_loss": -24.7434139251709, "global_step": 274240, "epoch": 3304} {"train_loss": -24.96497917175293, "global_step": 274241, "epoch": 3304} {"train_loss": -24.702661514282227, "global_step": 274242, "epoch": 3304} {"train_loss": -24.970252990722656, "global_step": 274243, "epoch": 3304} {"train_loss": -24.669025421142578, "global_step": 274244, "epoch": 3304} {"train_loss": -25.279767990112305, "global_step": 274245, "epoch": 3304} {"train_loss": -25.697668075561523, "global_step": 274246, "epoch": 3304} {"train_loss": -24.980018615722656, "global_step": 274247, "epoch": 3304} {"train_loss": -25.081205368041992, "global_step": 274248, "epoch": 3304} {"train_loss": -25.204120635986328, "global_step": 274249, "epoch": 3304} {"train_loss": -24.94267463684082, "global_step": 274250, "epoch": 3304} {"train_loss": -25.287527084350586, "global_step": 274251, "epoch": 3304} {"train_loss": -25.59528923034668, "global_step": 274252, "epoch": 3304} {"train_loss": -25.386463165283203, "global_step": 274253, "epoch": 3304} {"train_loss": -25.385303497314453, "global_step": 274254, "epoch": 3304} {"train_loss": -25.218494415283203, "global_step": 274255, "epoch": 3304} {"train_loss": -25.252710342407227, "global_step": 274256, "epoch": 3304} {"train_loss": -25.539020538330078, "global_step": 274257, "epoch": 3304} {"train_loss": -25.149831771850586, "global_step": 274258, "epoch": 3304} {"train_loss": -25.218807220458984, "global_step": 274259, "epoch": 3304} {"train_loss": -25.157411575317383, "global_step": 274260, "epoch": 3304} {"train_loss": -25.246423721313477, "global_step": 274261, "epoch": 3304} {"train_loss": -25.29950714111328, "global_step": 274262, "epoch": 3304} {"train_loss": -25.247058868408203, "global_step": 274263, "epoch": 3304} {"train_loss": -25.306547164916992, "global_step": 274264, "epoch": 3304} {"train_loss": -25.383398056030273, "global_step": 274265, "epoch": 3304} {"train_loss": -25.304574966430664, "global_step": 274266, "epoch": 3304} {"train_loss": -25.162107467651367, "global_step": 274267, "epoch": 3304} {"train_loss": -25.547569274902344, "global_step": 274268, "epoch": 3304} {"train_loss": -25.342708587646484, "global_step": 274269, "epoch": 3304} {"train_loss": -25.4793758392334, "global_step": 274270, "epoch": 3304} {"train_loss": -25.469661712646484, "global_step": 274271, "epoch": 3304} {"train_loss": -25.370311737060547, "global_step": 274272, "epoch": 3304} {"train_loss": -25.51191520690918, "global_step": 274273, "epoch": 3304} {"train_loss": -25.49786949157715, "global_step": 274274, "epoch": 3304} {"train_loss": -25.28122901916504, "global_step": 274275, "epoch": 3304} {"train_loss": -25.57028579711914, "global_step": 274276, "epoch": 3304} {"train_loss": -25.488183975219727, "global_step": 274277, "epoch": 3304} {"train_loss": -25.152143478393555, "global_step": 274278, "epoch": 3304} {"train_loss": -25.339065551757812, "global_step": 274279, "epoch": 3304} {"train_loss": -25.39188003540039, "global_step": 274280, "epoch": 3304} {"train_loss": -25.47939109802246, "global_step": 274281, "epoch": 3304} {"train_loss": -25.360218048095703, "global_step": 274282, "epoch": 3304} {"train_loss": -25.4617862701416, "global_step": 274283, "epoch": 3304} {"train_loss": -25.36988067626953, "global_step": 274284, "epoch": 3304} {"train_loss": -25.45886993408203, "global_step": 274285, "epoch": 3304} {"train_loss": -25.37259864807129, "global_step": 274286, "epoch": 3304} {"train_loss": -25.364500045776367, "global_step": 274287, "epoch": 3304} {"train_loss": -25.31294822692871, "global_step": 274288, "epoch": 3304} {"train_loss": -25.252668380737305, "global_step": 274289, "epoch": 3304} {"train_loss": -25.76934814453125, "global_step": 274290, "epoch": 3304} {"train_loss": -25.287811279296875, "global_step": 274291, "epoch": 3304} {"train_loss": -25.306737899780273, "global_step": 274292, "epoch": 3304} {"train_loss": -25.118799209594727, "global_step": 274293, "epoch": 3304} {"train_loss": -25.151493072509766, "global_step": 274294, "epoch": 3304} {"train_loss": -25.7977237701416, "global_step": 274295, "epoch": 3304} {"train_loss": -25.309574127197266, "global_step": 274296, "epoch": 3304} {"train_loss": -25.47088050842285, "global_step": 274297, "epoch": 3304} {"train_loss": -25.057926177978516, "global_step": 274298, "epoch": 3304} {"train_loss": -25.459753036499023, "global_step": 274299, "epoch": 3304} {"train_loss": -24.977237701416016, "global_step": 274300, "epoch": 3304} {"train_loss": -25.63754653930664, "global_step": 274301, "epoch": 3304} {"train_loss": -25.2620792388916, "global_step": 274302, "epoch": 3304} {"train_loss": -25.46990966796875, "global_step": 274303, "epoch": 3304} {"train_loss": -25.325132369995117, "global_step": 274304, "epoch": 3304} {"train_loss": -25.675939559936523, "global_step": 274305, "epoch": 3304} {"train_loss": -25.093952178955078, "global_step": 274306, "epoch": 3304} {"train_loss": -25.54573631286621, "global_step": 274307, "epoch": 3304} {"train_loss": -25.489225387573242, "global_step": 274308, "epoch": 3304} {"train_loss": -25.431488037109375, "global_step": 274309, "epoch": 3304} {"train_loss": -25.599773406982422, "global_step": 274310, "epoch": 3304} {"train_loss": -25.24473762512207, "global_step": 274311, "epoch": 3304} {"train_loss": -25.041547775268555, "global_step": 274312, "epoch": 3304} {"train_loss": -25.25714683532715, "global_step": 274313, "epoch": 3304} {"train_loss": -25.239334175385626, "global_step": 274314, "epoch": 3304, "val_loss": 7004948.0} {"train_loss": -24.91781997680664, "global_step": 274315, "epoch": 3305} {"train_loss": -24.875980377197266, "global_step": 274316, "epoch": 3305} {"train_loss": -25.073476791381836, "global_step": 274317, "epoch": 3305} {"train_loss": -24.9863224029541, "global_step": 274318, "epoch": 3305} {"train_loss": -24.79035758972168, "global_step": 274319, "epoch": 3305} {"train_loss": -25.134708404541016, "global_step": 274320, "epoch": 3305} {"train_loss": -24.704023361206055, "global_step": 274321, "epoch": 3305} {"train_loss": -24.90443229675293, "global_step": 274322, "epoch": 3305} {"train_loss": -24.954580307006836, "global_step": 274323, "epoch": 3305} {"train_loss": -25.05573844909668, "global_step": 274324, "epoch": 3305} {"train_loss": -25.082799911499023, "global_step": 274325, "epoch": 3305} {"train_loss": -25.187368392944336, "global_step": 274326, "epoch": 3305} {"train_loss": -25.0802059173584, "global_step": 274327, "epoch": 3305} {"train_loss": -25.399866104125977, "global_step": 274328, "epoch": 3305} {"train_loss": -25.070363998413086, "global_step": 274329, "epoch": 3305} {"train_loss": -25.33656883239746, "global_step": 274330, "epoch": 3305} {"train_loss": -25.12033462524414, "global_step": 274331, "epoch": 3305} {"train_loss": -25.222803115844727, "global_step": 274332, "epoch": 3305} {"train_loss": -25.078495025634766, "global_step": 274333, "epoch": 3305} {"train_loss": -25.164915084838867, "global_step": 274334, "epoch": 3305} {"train_loss": -25.364355087280273, "global_step": 274335, "epoch": 3305} {"train_loss": -25.41689109802246, "global_step": 274336, "epoch": 3305} {"train_loss": -25.079051971435547, "global_step": 274337, "epoch": 3305} {"train_loss": -25.157024383544922, "global_step": 274338, "epoch": 3305} {"train_loss": -25.003299713134766, "global_step": 274339, "epoch": 3305} {"train_loss": -25.156747817993164, "global_step": 274340, "epoch": 3305} {"train_loss": -25.3800048828125, "global_step": 274341, "epoch": 3305} {"train_loss": -25.173385620117188, "global_step": 274342, "epoch": 3305} {"train_loss": -25.568769454956055, "global_step": 274343, "epoch": 3305} {"train_loss": -25.496803283691406, "global_step": 274344, "epoch": 3305} {"train_loss": -25.61215591430664, "global_step": 274345, "epoch": 3305} {"train_loss": -25.48094940185547, "global_step": 274346, "epoch": 3305} {"train_loss": -25.4620418548584, "global_step": 274347, "epoch": 3305} {"train_loss": -25.15987205505371, "global_step": 274348, "epoch": 3305} {"train_loss": -25.395959854125977, "global_step": 274349, "epoch": 3305} {"train_loss": -25.364404678344727, "global_step": 274350, "epoch": 3305} {"train_loss": -25.283218383789062, "global_step": 274351, "epoch": 3305} {"train_loss": -25.570302963256836, "global_step": 274352, "epoch": 3305} {"train_loss": -25.209976196289062, "global_step": 274353, "epoch": 3305} {"train_loss": -25.079885482788086, "global_step": 274354, "epoch": 3305} {"train_loss": -25.151473999023438, "global_step": 274355, "epoch": 3305} {"train_loss": -25.38533592224121, "global_step": 274356, "epoch": 3305} {"train_loss": -25.74344825744629, "global_step": 274357, "epoch": 3305} {"train_loss": -25.555099487304688, "global_step": 274358, "epoch": 3305} {"train_loss": -25.968017578125, "global_step": 274359, "epoch": 3305} {"train_loss": -25.0625057220459, "global_step": 274360, "epoch": 3305} {"train_loss": -25.53536033630371, "global_step": 274361, "epoch": 3305} {"train_loss": -25.341827392578125, "global_step": 274362, "epoch": 3305} {"train_loss": -25.657058715820312, "global_step": 274363, "epoch": 3305} {"train_loss": -25.43224334716797, "global_step": 274364, "epoch": 3305} {"train_loss": -25.491641998291016, "global_step": 274365, "epoch": 3305} {"train_loss": -26.161718368530273, "global_step": 274366, "epoch": 3305} {"train_loss": -25.234888076782227, "global_step": 274367, "epoch": 3305} {"train_loss": -25.29316520690918, "global_step": 274368, "epoch": 3305} {"train_loss": -24.67877769470215, "global_step": 274369, "epoch": 3305} {"train_loss": -24.8889217376709, "global_step": 274370, "epoch": 3305} {"train_loss": -24.534793853759766, "global_step": 274371, "epoch": 3305} {"train_loss": -24.447965621948242, "global_step": 274372, "epoch": 3305} {"train_loss": -24.734413146972656, "global_step": 274373, "epoch": 3305} {"train_loss": -25.1558895111084, "global_step": 274374, "epoch": 3305} {"train_loss": -25.380022048950195, "global_step": 274375, "epoch": 3305} {"train_loss": -24.477415084838867, "global_step": 274376, "epoch": 3305} {"train_loss": -24.742780685424805, "global_step": 274377, "epoch": 3305} {"train_loss": -25.113000869750977, "global_step": 274378, "epoch": 3305} {"train_loss": -25.359888076782227, "global_step": 274379, "epoch": 3305} {"train_loss": -25.35993194580078, "global_step": 274380, "epoch": 3305} {"train_loss": -25.21488380432129, "global_step": 274381, "epoch": 3305} {"train_loss": -25.02081871032715, "global_step": 274382, "epoch": 3305} {"train_loss": -24.943166732788086, "global_step": 274383, "epoch": 3305} {"train_loss": -24.986967086791992, "global_step": 274384, "epoch": 3305} {"train_loss": -24.797119140625, "global_step": 274385, "epoch": 3305} {"train_loss": -25.07796859741211, "global_step": 274386, "epoch": 3305} {"train_loss": -25.031038284301758, "global_step": 274387, "epoch": 3305} {"train_loss": -24.91506576538086, "global_step": 274388, "epoch": 3305} {"train_loss": -25.756454467773438, "global_step": 274389, "epoch": 3305} {"train_loss": -25.262371063232422, "global_step": 274390, "epoch": 3305} {"train_loss": -25.05385398864746, "global_step": 274391, "epoch": 3305} {"train_loss": -25.43717384338379, "global_step": 274392, "epoch": 3305} {"train_loss": -25.37931251525879, "global_step": 274393, "epoch": 3305} {"train_loss": -25.616809844970703, "global_step": 274394, "epoch": 3305} {"train_loss": -25.25411605834961, "global_step": 274395, "epoch": 3305} {"train_loss": -25.324127197265625, "global_step": 274396, "epoch": 3305} {"train_loss": -25.228436136820232, "global_step": 274397, "epoch": 3305, "val_loss": 7013853.0} {"train_loss": -24.492128372192383, "global_step": 274398, "epoch": 3306} {"train_loss": -25.060302734375, "global_step": 274399, "epoch": 3306} {"train_loss": -25.00770378112793, "global_step": 274400, "epoch": 3306} {"train_loss": -24.553354263305664, "global_step": 274401, "epoch": 3306} {"train_loss": -24.7169132232666, "global_step": 274402, "epoch": 3306} {"train_loss": -24.968017578125, "global_step": 274403, "epoch": 3306} {"train_loss": -24.832487106323242, "global_step": 274404, "epoch": 3306} {"train_loss": -24.943622589111328, "global_step": 274405, "epoch": 3306} {"train_loss": -25.192289352416992, "global_step": 274406, "epoch": 3306} {"train_loss": -24.672382354736328, "global_step": 274407, "epoch": 3306} {"train_loss": -25.004146575927734, "global_step": 274408, "epoch": 3306} {"train_loss": -25.19345474243164, "global_step": 274409, "epoch": 3306} {"train_loss": -24.835073471069336, "global_step": 274410, "epoch": 3306} {"train_loss": -25.3242244720459, "global_step": 274411, "epoch": 3306} {"train_loss": -24.90308380126953, "global_step": 274412, "epoch": 3306} {"train_loss": -24.86176872253418, "global_step": 274413, "epoch": 3306} {"train_loss": -25.4321231842041, "global_step": 274414, "epoch": 3306} {"train_loss": -25.195905685424805, "global_step": 274415, "epoch": 3306} {"train_loss": -25.061304092407227, "global_step": 274416, "epoch": 3306} {"train_loss": -25.284650802612305, "global_step": 274417, "epoch": 3306} {"train_loss": -25.23501968383789, "global_step": 274418, "epoch": 3306} {"train_loss": -24.7852840423584, "global_step": 274419, "epoch": 3306} {"train_loss": -25.198232650756836, "global_step": 274420, "epoch": 3306} {"train_loss": -25.249723434448242, "global_step": 274421, "epoch": 3306} {"train_loss": -24.591754913330078, "global_step": 274422, "epoch": 3306} {"train_loss": -24.717870712280273, "global_step": 274423, "epoch": 3306} {"train_loss": -25.1505184173584, "global_step": 274424, "epoch": 3306} {"train_loss": -25.298690795898438, "global_step": 274425, "epoch": 3306} {"train_loss": -25.00593376159668, "global_step": 274426, "epoch": 3306} {"train_loss": -25.094223022460938, "global_step": 274427, "epoch": 3306} {"train_loss": -25.0528564453125, "global_step": 274428, "epoch": 3306} {"train_loss": -25.193456649780273, "global_step": 274429, "epoch": 3306} {"train_loss": -24.992979049682617, "global_step": 274430, "epoch": 3306} {"train_loss": -25.339963912963867, "global_step": 274431, "epoch": 3306} {"train_loss": -25.240345001220703, "global_step": 274432, "epoch": 3306} {"train_loss": -25.08914566040039, "global_step": 274433, "epoch": 3306} {"train_loss": -25.5302791595459, "global_step": 274434, "epoch": 3306} {"train_loss": -25.403179168701172, "global_step": 274435, "epoch": 3306} {"train_loss": -25.222270965576172, "global_step": 274436, "epoch": 3306} {"train_loss": -25.153671264648438, "global_step": 274437, "epoch": 3306} {"train_loss": -25.56900978088379, "global_step": 274438, "epoch": 3306} {"train_loss": -25.194990158081055, "global_step": 274439, "epoch": 3306} {"train_loss": -25.737457275390625, "global_step": 274440, "epoch": 3306} {"train_loss": -25.431142807006836, "global_step": 274441, "epoch": 3306} {"train_loss": -25.68645668029785, "global_step": 274442, "epoch": 3306} {"train_loss": -25.534423828125, "global_step": 274443, "epoch": 3306} {"train_loss": -25.465314865112305, "global_step": 274444, "epoch": 3306} {"train_loss": -25.758148193359375, "global_step": 274445, "epoch": 3306} {"train_loss": -25.383895874023438, "global_step": 274446, "epoch": 3306} {"train_loss": -25.509023666381836, "global_step": 274447, "epoch": 3306} {"train_loss": -25.58342742919922, "global_step": 274448, "epoch": 3306} {"train_loss": -25.48707389831543, "global_step": 274449, "epoch": 3306} {"train_loss": -25.447750091552734, "global_step": 274450, "epoch": 3306} {"train_loss": -25.504371643066406, "global_step": 274451, "epoch": 3306} {"train_loss": -25.207353591918945, "global_step": 274452, "epoch": 3306} {"train_loss": -25.3941593170166, "global_step": 274453, "epoch": 3306} {"train_loss": -25.32996940612793, "global_step": 274454, "epoch": 3306} {"train_loss": -25.358030319213867, "global_step": 274455, "epoch": 3306} {"train_loss": -25.112918853759766, "global_step": 274456, "epoch": 3306} {"train_loss": -25.21941566467285, "global_step": 274457, "epoch": 3306} {"train_loss": -25.24786949157715, "global_step": 274458, "epoch": 3306} {"train_loss": -25.38570213317871, "global_step": 274459, "epoch": 3306} {"train_loss": -25.12835693359375, "global_step": 274460, "epoch": 3306} {"train_loss": -25.566221237182617, "global_step": 274461, "epoch": 3306} {"train_loss": -25.67841911315918, "global_step": 274462, "epoch": 3306} {"train_loss": -25.599924087524414, "global_step": 274463, "epoch": 3306} {"train_loss": -25.139610290527344, "global_step": 274464, "epoch": 3306} {"train_loss": -25.726505279541016, "global_step": 274465, "epoch": 3306} {"train_loss": -25.208988189697266, "global_step": 274466, "epoch": 3306} {"train_loss": -25.09792137145996, "global_step": 274467, "epoch": 3306} {"train_loss": -25.07736587524414, "global_step": 274468, "epoch": 3306} {"train_loss": -25.375411987304688, "global_step": 274469, "epoch": 3306} {"train_loss": -25.09619140625, "global_step": 274470, "epoch": 3306} {"train_loss": -25.530731201171875, "global_step": 274471, "epoch": 3306} {"train_loss": -24.982269287109375, "global_step": 274472, "epoch": 3306} {"train_loss": -25.132604598999023, "global_step": 274473, "epoch": 3306} {"train_loss": -25.307178497314453, "global_step": 274474, "epoch": 3306} {"train_loss": -25.3255615234375, "global_step": 274475, "epoch": 3306} {"train_loss": -24.965200424194336, "global_step": 274476, "epoch": 3306} {"train_loss": -25.0524845123291, "global_step": 274477, "epoch": 3306} {"train_loss": -24.75362205505371, "global_step": 274478, "epoch": 3306} {"train_loss": -25.006433486938477, "global_step": 274479, "epoch": 3306} {"train_loss": -25.190600222851856, "global_step": 274480, "epoch": 3306, "val_loss": 7056616.5} {"train_loss": -24.748228073120117, "global_step": 274481, "epoch": 3307} {"train_loss": -24.82988739013672, "global_step": 274482, "epoch": 3307} {"train_loss": -24.910484313964844, "global_step": 274483, "epoch": 3307} {"train_loss": -24.849380493164062, "global_step": 274484, "epoch": 3307} {"train_loss": -24.713321685791016, "global_step": 274485, "epoch": 3307} {"train_loss": -24.661733627319336, "global_step": 274486, "epoch": 3307} {"train_loss": -25.114938735961914, "global_step": 274487, "epoch": 3307} {"train_loss": -24.88510513305664, "global_step": 274488, "epoch": 3307} {"train_loss": -25.25922393798828, "global_step": 274489, "epoch": 3307} {"train_loss": -24.95176124572754, "global_step": 274490, "epoch": 3307} {"train_loss": -25.15205955505371, "global_step": 274491, "epoch": 3307} {"train_loss": -24.92015266418457, "global_step": 274492, "epoch": 3307} {"train_loss": -24.89472007751465, "global_step": 274493, "epoch": 3307} {"train_loss": -25.104398727416992, "global_step": 274494, "epoch": 3307} {"train_loss": -24.90304183959961, "global_step": 274495, "epoch": 3307} {"train_loss": -25.383657455444336, "global_step": 274496, "epoch": 3307} {"train_loss": -25.19342803955078, "global_step": 274497, "epoch": 3307} {"train_loss": -25.325408935546875, "global_step": 274498, "epoch": 3307} {"train_loss": -25.131513595581055, "global_step": 274499, "epoch": 3307} {"train_loss": -25.248918533325195, "global_step": 274500, "epoch": 3307} {"train_loss": -25.193096160888672, "global_step": 274501, "epoch": 3307} {"train_loss": -25.04514503479004, "global_step": 274502, "epoch": 3307} {"train_loss": -25.431659698486328, "global_step": 274503, "epoch": 3307} {"train_loss": -25.659271240234375, "global_step": 274504, "epoch": 3307} {"train_loss": -25.363813400268555, "global_step": 274505, "epoch": 3307} {"train_loss": -25.315214157104492, "global_step": 274506, "epoch": 3307} {"train_loss": -25.24700927734375, "global_step": 274507, "epoch": 3307} {"train_loss": -25.114179611206055, "global_step": 274508, "epoch": 3307} {"train_loss": -25.07138442993164, "global_step": 274509, "epoch": 3307} {"train_loss": -25.430387496948242, "global_step": 274510, "epoch": 3307} {"train_loss": -25.335309982299805, "global_step": 274511, "epoch": 3307} {"train_loss": -25.673803329467773, "global_step": 274512, "epoch": 3307} {"train_loss": -25.17217445373535, "global_step": 274513, "epoch": 3307} {"train_loss": -25.12094497680664, "global_step": 274514, "epoch": 3307} {"train_loss": -25.51747703552246, "global_step": 274515, "epoch": 3307} {"train_loss": -25.09108543395996, "global_step": 274516, "epoch": 3307} {"train_loss": -25.327377319335938, "global_step": 274517, "epoch": 3307} {"train_loss": -25.38658332824707, "global_step": 274518, "epoch": 3307} {"train_loss": -25.512693405151367, "global_step": 274519, "epoch": 3307} {"train_loss": -25.402860641479492, "global_step": 274520, "epoch": 3307} {"train_loss": -25.118770599365234, "global_step": 274521, "epoch": 3307} {"train_loss": -25.515928268432617, "global_step": 274522, "epoch": 3307} {"train_loss": -25.400020599365234, "global_step": 274523, "epoch": 3307} {"train_loss": -25.382854461669922, "global_step": 274524, "epoch": 3307} {"train_loss": -25.818592071533203, "global_step": 274525, "epoch": 3307} {"train_loss": -25.78778076171875, "global_step": 274526, "epoch": 3307} {"train_loss": -25.644393920898438, "global_step": 274527, "epoch": 3307} {"train_loss": -25.5040340423584, "global_step": 274528, "epoch": 3307} {"train_loss": -25.2943172454834, "global_step": 274529, "epoch": 3307} {"train_loss": -25.063129425048828, "global_step": 274530, "epoch": 3307} {"train_loss": -25.404645919799805, "global_step": 274531, "epoch": 3307} {"train_loss": -25.65171241760254, "global_step": 274532, "epoch": 3307} {"train_loss": -25.47127914428711, "global_step": 274533, "epoch": 3307} {"train_loss": -25.501110076904297, "global_step": 274534, "epoch": 3307} {"train_loss": -25.290205001831055, "global_step": 274535, "epoch": 3307} {"train_loss": -25.18116569519043, "global_step": 274536, "epoch": 3307} {"train_loss": -25.287826538085938, "global_step": 274537, "epoch": 3307} {"train_loss": -24.898569107055664, "global_step": 274538, "epoch": 3307} {"train_loss": -25.144941329956055, "global_step": 274539, "epoch": 3307} {"train_loss": -25.415739059448242, "global_step": 274540, "epoch": 3307} {"train_loss": -25.640857696533203, "global_step": 274541, "epoch": 3307} {"train_loss": -25.349750518798828, "global_step": 274542, "epoch": 3307} {"train_loss": -25.2655086517334, "global_step": 274543, "epoch": 3307} {"train_loss": -25.504819869995117, "global_step": 274544, "epoch": 3307} {"train_loss": -25.604251861572266, "global_step": 274545, "epoch": 3307} {"train_loss": -25.602025985717773, "global_step": 274546, "epoch": 3307} {"train_loss": -25.459287643432617, "global_step": 274547, "epoch": 3307} {"train_loss": -24.97503662109375, "global_step": 274548, "epoch": 3307} {"train_loss": -25.21407699584961, "global_step": 274549, "epoch": 3307} {"train_loss": -25.246185302734375, "global_step": 274550, "epoch": 3307} {"train_loss": -25.66574478149414, "global_step": 274551, "epoch": 3307} {"train_loss": -25.289932250976562, "global_step": 274552, "epoch": 3307} {"train_loss": -25.27912712097168, "global_step": 274553, "epoch": 3307} {"train_loss": -25.373062133789062, "global_step": 274554, "epoch": 3307} {"train_loss": -25.476806640625, "global_step": 274555, "epoch": 3307} {"train_loss": -25.39764404296875, "global_step": 274556, "epoch": 3307} {"train_loss": -25.008394241333008, "global_step": 274557, "epoch": 3307} {"train_loss": -24.307077407836914, "global_step": 274558, "epoch": 3307} {"train_loss": -24.23529624938965, "global_step": 274559, "epoch": 3307} {"train_loss": -25.215545654296875, "global_step": 274560, "epoch": 3307} {"train_loss": -24.664533615112305, "global_step": 274561, "epoch": 3307} {"train_loss": -24.64886474609375, "global_step": 274562, "epoch": 3307} {"train_loss": -25.23414552068136, "global_step": 274563, "epoch": 3307, "val_loss": 7206206.5} {"train_loss": -24.447406768798828, "global_step": 274564, "epoch": 3308} {"train_loss": -24.400634765625, "global_step": 274565, "epoch": 3308} {"train_loss": -24.14579200744629, "global_step": 274566, "epoch": 3308} {"train_loss": -24.5380916595459, "global_step": 274567, "epoch": 3308} {"train_loss": -24.137704849243164, "global_step": 274568, "epoch": 3308} {"train_loss": -24.383041381835938, "global_step": 274569, "epoch": 3308} {"train_loss": -24.76633644104004, "global_step": 274570, "epoch": 3308} {"train_loss": -24.678592681884766, "global_step": 274571, "epoch": 3308} {"train_loss": -24.869115829467773, "global_step": 274572, "epoch": 3308} {"train_loss": -24.651281356811523, "global_step": 274573, "epoch": 3308} {"train_loss": -24.554563522338867, "global_step": 274574, "epoch": 3308} {"train_loss": -24.425992965698242, "global_step": 274575, "epoch": 3308} {"train_loss": -24.60967445373535, "global_step": 274576, "epoch": 3308} {"train_loss": -24.674787521362305, "global_step": 274577, "epoch": 3308} {"train_loss": -24.869953155517578, "global_step": 274578, "epoch": 3308} {"train_loss": -24.95123291015625, "global_step": 274579, "epoch": 3308} {"train_loss": -24.528684616088867, "global_step": 274580, "epoch": 3308} {"train_loss": -24.98470115661621, "global_step": 274581, "epoch": 3308} {"train_loss": -24.79722023010254, "global_step": 274582, "epoch": 3308} {"train_loss": -25.0700740814209, "global_step": 274583, "epoch": 3308} {"train_loss": -24.94841766357422, "global_step": 274584, "epoch": 3308} {"train_loss": -24.868162155151367, "global_step": 274585, "epoch": 3308} {"train_loss": -25.158796310424805, "global_step": 274586, "epoch": 3308} {"train_loss": -25.13140869140625, "global_step": 274587, "epoch": 3308} {"train_loss": -24.767427444458008, "global_step": 274588, "epoch": 3308} {"train_loss": -24.972288131713867, "global_step": 274589, "epoch": 3308} {"train_loss": -25.442039489746094, "global_step": 274590, "epoch": 3308} {"train_loss": -25.180532455444336, "global_step": 274591, "epoch": 3308} {"train_loss": -25.265491485595703, "global_step": 274592, "epoch": 3308} {"train_loss": -25.000717163085938, "global_step": 274593, "epoch": 3308} {"train_loss": -24.90131187438965, "global_step": 274594, "epoch": 3308} {"train_loss": -25.1812744140625, "global_step": 274595, "epoch": 3308} {"train_loss": -25.411819458007812, "global_step": 274596, "epoch": 3308} {"train_loss": -25.0762882232666, "global_step": 274597, "epoch": 3308} {"train_loss": -25.339506149291992, "global_step": 274598, "epoch": 3308} {"train_loss": -25.494415283203125, "global_step": 274599, "epoch": 3308} {"train_loss": -25.25121307373047, "global_step": 274600, "epoch": 3308} {"train_loss": -25.195735931396484, "global_step": 274601, "epoch": 3308} {"train_loss": -25.47499656677246, "global_step": 274602, "epoch": 3308} {"train_loss": -25.717212677001953, "global_step": 274603, "epoch": 3308} {"train_loss": -25.7943058013916, "global_step": 274604, "epoch": 3308} {"train_loss": -25.301660537719727, "global_step": 274605, "epoch": 3308} {"train_loss": -25.5353946685791, "global_step": 274606, "epoch": 3308} {"train_loss": -25.51424217224121, "global_step": 274607, "epoch": 3308} {"train_loss": -25.20357322692871, "global_step": 274608, "epoch": 3308} {"train_loss": -25.48225975036621, "global_step": 274609, "epoch": 3308} {"train_loss": -25.608728408813477, "global_step": 274610, "epoch": 3308} {"train_loss": -25.082304000854492, "global_step": 274611, "epoch": 3308} {"train_loss": -25.424428939819336, "global_step": 274612, "epoch": 3308} {"train_loss": -25.651172637939453, "global_step": 274613, "epoch": 3308} {"train_loss": -25.596309661865234, "global_step": 274614, "epoch": 3308} {"train_loss": -25.344404220581055, "global_step": 274615, "epoch": 3308} {"train_loss": -24.8135929107666, "global_step": 274616, "epoch": 3308} {"train_loss": -25.317123413085938, "global_step": 274617, "epoch": 3308} {"train_loss": -25.280094146728516, "global_step": 274618, "epoch": 3308} {"train_loss": -24.96685218811035, "global_step": 274619, "epoch": 3308} {"train_loss": -25.46721649169922, "global_step": 274620, "epoch": 3308} {"train_loss": -25.34918785095215, "global_step": 274621, "epoch": 3308} {"train_loss": -25.18906593322754, "global_step": 274622, "epoch": 3308} {"train_loss": -25.215871810913086, "global_step": 274623, "epoch": 3308} {"train_loss": -24.52435302734375, "global_step": 274624, "epoch": 3308} {"train_loss": -25.120344161987305, "global_step": 274625, "epoch": 3308} {"train_loss": -25.056577682495117, "global_step": 274626, "epoch": 3308} {"train_loss": -25.14515495300293, "global_step": 274627, "epoch": 3308} {"train_loss": -25.42079734802246, "global_step": 274628, "epoch": 3308} {"train_loss": -25.147205352783203, "global_step": 274629, "epoch": 3308} {"train_loss": -25.33803939819336, "global_step": 274630, "epoch": 3308} {"train_loss": -25.526357650756836, "global_step": 274631, "epoch": 3308} {"train_loss": -25.304519653320312, "global_step": 274632, "epoch": 3308} {"train_loss": -25.216602325439453, "global_step": 274633, "epoch": 3308} {"train_loss": -25.615436553955078, "global_step": 274634, "epoch": 3308} {"train_loss": -25.477399826049805, "global_step": 274635, "epoch": 3308} {"train_loss": -25.29209327697754, "global_step": 274636, "epoch": 3308} {"train_loss": -25.274993896484375, "global_step": 274637, "epoch": 3308} {"train_loss": -25.505868911743164, "global_step": 274638, "epoch": 3308} {"train_loss": -25.140356063842773, "global_step": 274639, "epoch": 3308} {"train_loss": -25.405170440673828, "global_step": 274640, "epoch": 3308} {"train_loss": -25.378753662109375, "global_step": 274641, "epoch": 3308} {"train_loss": -25.675085067749023, "global_step": 274642, "epoch": 3308} {"train_loss": -25.464195251464844, "global_step": 274643, "epoch": 3308} {"train_loss": -25.280506134033203, "global_step": 274644, "epoch": 3308} {"train_loss": -25.207895278930664, "global_step": 274645, "epoch": 3308} {"train_loss": -25.126582019300347, "global_step": 274646, "epoch": 3308, "val_loss": 6932140.5} {"train_loss": -25.31034278869629, "global_step": 274647, "epoch": 3309} {"train_loss": -24.87084197998047, "global_step": 274648, "epoch": 3309} {"train_loss": -25.489116668701172, "global_step": 274649, "epoch": 3309} {"train_loss": -24.93745994567871, "global_step": 274650, "epoch": 3309} {"train_loss": -25.16834259033203, "global_step": 274651, "epoch": 3309} {"train_loss": -24.94659996032715, "global_step": 274652, "epoch": 3309} {"train_loss": -24.853473663330078, "global_step": 274653, "epoch": 3309} {"train_loss": -25.178308486938477, "global_step": 274654, "epoch": 3309} {"train_loss": -25.13358497619629, "global_step": 274655, "epoch": 3309} {"train_loss": -25.130390167236328, "global_step": 274656, "epoch": 3309} {"train_loss": -24.955883026123047, "global_step": 274657, "epoch": 3309} {"train_loss": -25.500829696655273, "global_step": 274658, "epoch": 3309} {"train_loss": -25.055280685424805, "global_step": 274659, "epoch": 3309} {"train_loss": -25.51791763305664, "global_step": 274660, "epoch": 3309} {"train_loss": -25.092164993286133, "global_step": 274661, "epoch": 3309} {"train_loss": -25.410829544067383, "global_step": 274662, "epoch": 3309} {"train_loss": -25.111103057861328, "global_step": 274663, "epoch": 3309} {"train_loss": -25.016712188720703, "global_step": 274664, "epoch": 3309} {"train_loss": -25.631183624267578, "global_step": 274665, "epoch": 3309} {"train_loss": -25.08974266052246, "global_step": 274666, "epoch": 3309} {"train_loss": -25.31211280822754, "global_step": 274667, "epoch": 3309} {"train_loss": -25.539525985717773, "global_step": 274668, "epoch": 3309} {"train_loss": -25.185483932495117, "global_step": 274669, "epoch": 3309} {"train_loss": -25.331945419311523, "global_step": 274670, "epoch": 3309} {"train_loss": -25.201879501342773, "global_step": 274671, "epoch": 3309} {"train_loss": -25.64863395690918, "global_step": 274672, "epoch": 3309} {"train_loss": -25.25703239440918, "global_step": 274673, "epoch": 3309} {"train_loss": -25.638914108276367, "global_step": 274674, "epoch": 3309} {"train_loss": -25.377460479736328, "global_step": 274675, "epoch": 3309} {"train_loss": -25.394664764404297, "global_step": 274676, "epoch": 3309} {"train_loss": -25.40199851989746, "global_step": 274677, "epoch": 3309} {"train_loss": -24.93439292907715, "global_step": 274678, "epoch": 3309} {"train_loss": -25.45858383178711, "global_step": 274679, "epoch": 3309} {"train_loss": -25.31587791442871, "global_step": 274680, "epoch": 3309} {"train_loss": -25.237964630126953, "global_step": 274681, "epoch": 3309} {"train_loss": -25.604589462280273, "global_step": 274682, "epoch": 3309} {"train_loss": -25.26244354248047, "global_step": 274683, "epoch": 3309} {"train_loss": -25.933874130249023, "global_step": 274684, "epoch": 3309} {"train_loss": -25.52133560180664, "global_step": 274685, "epoch": 3309} {"train_loss": -25.361875534057617, "global_step": 274686, "epoch": 3309} {"train_loss": -26.00942039489746, "global_step": 274687, "epoch": 3309} {"train_loss": -25.37251853942871, "global_step": 274688, "epoch": 3309} {"train_loss": -25.475261688232422, "global_step": 274689, "epoch": 3309} {"train_loss": -25.46002769470215, "global_step": 274690, "epoch": 3309} {"train_loss": -25.30439567565918, "global_step": 274691, "epoch": 3309} {"train_loss": -25.263837814331055, "global_step": 274692, "epoch": 3309} {"train_loss": -25.553939819335938, "global_step": 274693, "epoch": 3309} {"train_loss": -25.658588409423828, "global_step": 274694, "epoch": 3309} {"train_loss": -25.287290573120117, "global_step": 274695, "epoch": 3309} {"train_loss": -25.28461265563965, "global_step": 274696, "epoch": 3309} {"train_loss": -24.868478775024414, "global_step": 274697, "epoch": 3309} {"train_loss": -25.031585693359375, "global_step": 274698, "epoch": 3309} {"train_loss": -24.935720443725586, "global_step": 274699, "epoch": 3309} {"train_loss": -24.891756057739258, "global_step": 274700, "epoch": 3309} {"train_loss": -25.47148323059082, "global_step": 274701, "epoch": 3309} {"train_loss": -25.067129135131836, "global_step": 274702, "epoch": 3309} {"train_loss": -25.12223243713379, "global_step": 274703, "epoch": 3309} {"train_loss": -25.104774475097656, "global_step": 274704, "epoch": 3309} {"train_loss": -25.029850006103516, "global_step": 274705, "epoch": 3309} {"train_loss": -25.249853134155273, "global_step": 274706, "epoch": 3309} {"train_loss": -25.23696517944336, "global_step": 274707, "epoch": 3309} {"train_loss": -25.062467575073242, "global_step": 274708, "epoch": 3309} {"train_loss": -25.582901000976562, "global_step": 274709, "epoch": 3309} {"train_loss": -25.459964752197266, "global_step": 274710, "epoch": 3309} {"train_loss": -25.409503936767578, "global_step": 274711, "epoch": 3309} {"train_loss": -25.100637435913086, "global_step": 274712, "epoch": 3309} {"train_loss": -25.45842170715332, "global_step": 274713, "epoch": 3309} {"train_loss": -25.33138084411621, "global_step": 274714, "epoch": 3309} {"train_loss": -25.60407066345215, "global_step": 274715, "epoch": 3309} {"train_loss": -25.267227172851562, "global_step": 274716, "epoch": 3309} {"train_loss": -25.131540298461914, "global_step": 274717, "epoch": 3309} {"train_loss": -25.348350524902344, "global_step": 274718, "epoch": 3309} {"train_loss": -25.42395782470703, "global_step": 274719, "epoch": 3309} {"train_loss": -25.978681564331055, "global_step": 274720, "epoch": 3309} {"train_loss": -25.282875061035156, "global_step": 274721, "epoch": 3309} {"train_loss": -25.26128578186035, "global_step": 274722, "epoch": 3309} {"train_loss": -25.6165714263916, "global_step": 274723, "epoch": 3309} {"train_loss": -25.511877059936523, "global_step": 274724, "epoch": 3309} {"train_loss": -25.30278205871582, "global_step": 274725, "epoch": 3309} {"train_loss": -25.399826049804688, "global_step": 274726, "epoch": 3309} {"train_loss": -25.361936569213867, "global_step": 274727, "epoch": 3309} {"train_loss": -25.19069480895996, "global_step": 274728, "epoch": 3309} {"train_loss": -25.311055309801215, "global_step": 274729, "epoch": 3309, "val_loss": 7023240.0} {"train_loss": -25.20688247680664, "global_step": 274730, "epoch": 3310} {"train_loss": -25.277780532836914, "global_step": 274731, "epoch": 3310} {"train_loss": -25.12944793701172, "global_step": 274732, "epoch": 3310} {"train_loss": -24.546091079711914, "global_step": 274733, "epoch": 3310} {"train_loss": -25.16582679748535, "global_step": 274734, "epoch": 3310} {"train_loss": -25.01219940185547, "global_step": 274735, "epoch": 3310} {"train_loss": -24.640838623046875, "global_step": 274736, "epoch": 3310} {"train_loss": -25.064701080322266, "global_step": 274737, "epoch": 3310} {"train_loss": -24.788267135620117, "global_step": 274738, "epoch": 3310} {"train_loss": -25.01973533630371, "global_step": 274739, "epoch": 3310} {"train_loss": -24.67803955078125, "global_step": 274740, "epoch": 3310} {"train_loss": -25.31486701965332, "global_step": 274741, "epoch": 3310} {"train_loss": -25.190204620361328, "global_step": 274742, "epoch": 3310} {"train_loss": -25.089385986328125, "global_step": 274743, "epoch": 3310} {"train_loss": -24.98880386352539, "global_step": 274744, "epoch": 3310} {"train_loss": -25.080942153930664, "global_step": 274745, "epoch": 3310} {"train_loss": -25.506582260131836, "global_step": 274746, "epoch": 3310} {"train_loss": -24.985811233520508, "global_step": 274747, "epoch": 3310} {"train_loss": -25.219148635864258, "global_step": 274748, "epoch": 3310} {"train_loss": -24.82708168029785, "global_step": 274749, "epoch": 3310} {"train_loss": -25.220075607299805, "global_step": 274750, "epoch": 3310} {"train_loss": -24.978029251098633, "global_step": 274751, "epoch": 3310} {"train_loss": -25.390817642211914, "global_step": 274752, "epoch": 3310} {"train_loss": -25.07515525817871, "global_step": 274753, "epoch": 3310} {"train_loss": -25.453006744384766, "global_step": 274754, "epoch": 3310} {"train_loss": -25.150297164916992, "global_step": 274755, "epoch": 3310} {"train_loss": -25.319950103759766, "global_step": 274756, "epoch": 3310} {"train_loss": -25.27044677734375, "global_step": 274757, "epoch": 3310} {"train_loss": -25.214628219604492, "global_step": 274758, "epoch": 3310} {"train_loss": -25.347326278686523, "global_step": 274759, "epoch": 3310} {"train_loss": -25.46491050720215, "global_step": 274760, "epoch": 3310} {"train_loss": -25.42240333557129, "global_step": 274761, "epoch": 3310} {"train_loss": -25.093238830566406, "global_step": 274762, "epoch": 3310} {"train_loss": -25.57745361328125, "global_step": 274763, "epoch": 3310} {"train_loss": -25.124509811401367, "global_step": 274764, "epoch": 3310} {"train_loss": -25.584409713745117, "global_step": 274765, "epoch": 3310} {"train_loss": -25.54134178161621, "global_step": 274766, "epoch": 3310} {"train_loss": -25.596054077148438, "global_step": 274767, "epoch": 3310} {"train_loss": -25.61757469177246, "global_step": 274768, "epoch": 3310} {"train_loss": -25.75421714782715, "global_step": 274769, "epoch": 3310} {"train_loss": -25.434497833251953, "global_step": 274770, "epoch": 3310} {"train_loss": -25.748929977416992, "global_step": 274771, "epoch": 3310} {"train_loss": -25.47567367553711, "global_step": 274772, "epoch": 3310} {"train_loss": -25.52607536315918, "global_step": 274773, "epoch": 3310} {"train_loss": -25.59760284423828, "global_step": 274774, "epoch": 3310} {"train_loss": -25.71405029296875, "global_step": 274775, "epoch": 3310} {"train_loss": -25.57010841369629, "global_step": 274776, "epoch": 3310} {"train_loss": -25.408023834228516, "global_step": 274777, "epoch": 3310} {"train_loss": -24.937536239624023, "global_step": 274778, "epoch": 3310} {"train_loss": -25.774398803710938, "global_step": 274779, "epoch": 3310} {"train_loss": -25.488201141357422, "global_step": 274780, "epoch": 3310} {"train_loss": -25.34947395324707, "global_step": 274781, "epoch": 3310} {"train_loss": -25.48480796813965, "global_step": 274782, "epoch": 3310} {"train_loss": -25.1030216217041, "global_step": 274783, "epoch": 3310} {"train_loss": -25.01789093017578, "global_step": 274784, "epoch": 3310} {"train_loss": -24.865188598632812, "global_step": 274785, "epoch": 3310} {"train_loss": -24.914871215820312, "global_step": 274786, "epoch": 3310} {"train_loss": -25.310361862182617, "global_step": 274787, "epoch": 3310} {"train_loss": -25.188322067260742, "global_step": 274788, "epoch": 3310} {"train_loss": -25.46650505065918, "global_step": 274789, "epoch": 3310} {"train_loss": -25.28224754333496, "global_step": 274790, "epoch": 3310} {"train_loss": -25.299789428710938, "global_step": 274791, "epoch": 3310} {"train_loss": -25.252342224121094, "global_step": 274792, "epoch": 3310} {"train_loss": -25.2252254486084, "global_step": 274793, "epoch": 3310} {"train_loss": -25.695581436157227, "global_step": 274794, "epoch": 3310} {"train_loss": -25.50574493408203, "global_step": 274795, "epoch": 3310} {"train_loss": -25.18980598449707, "global_step": 274796, "epoch": 3310} {"train_loss": -25.796552658081055, "global_step": 274797, "epoch": 3310} {"train_loss": -25.64505386352539, "global_step": 274798, "epoch": 3310} {"train_loss": -25.379594802856445, "global_step": 274799, "epoch": 3310} {"train_loss": -25.136991500854492, "global_step": 274800, "epoch": 3310} {"train_loss": -25.29608726501465, "global_step": 274801, "epoch": 3310} {"train_loss": -25.334009170532227, "global_step": 274802, "epoch": 3310} {"train_loss": -24.9819393157959, "global_step": 274803, "epoch": 3310} {"train_loss": -25.332157135009766, "global_step": 274804, "epoch": 3310} {"train_loss": -25.130313873291016, "global_step": 274805, "epoch": 3310} {"train_loss": -25.67459487915039, "global_step": 274806, "epoch": 3310} {"train_loss": -25.47853660583496, "global_step": 274807, "epoch": 3310} {"train_loss": -25.112762451171875, "global_step": 274808, "epoch": 3310} {"train_loss": -25.086750030517578, "global_step": 274809, "epoch": 3310} {"train_loss": -25.331541061401367, "global_step": 274810, "epoch": 3310} {"train_loss": -25.440784454345703, "global_step": 274811, "epoch": 3310} {"train_loss": -25.287621141916297, "global_step": 274812, "epoch": 3310, "val_loss": 7016671.0} {"train_loss": -24.01409149169922, "global_step": 274813, "epoch": 3311} {"train_loss": -24.822851181030273, "global_step": 274814, "epoch": 3311} {"train_loss": -23.784143447875977, "global_step": 274815, "epoch": 3311} {"train_loss": -24.72174072265625, "global_step": 274816, "epoch": 3311} {"train_loss": -24.410694122314453, "global_step": 274817, "epoch": 3311} {"train_loss": -25.0898380279541, "global_step": 274818, "epoch": 3311} {"train_loss": -24.583078384399414, "global_step": 274819, "epoch": 3311} {"train_loss": -24.27918243408203, "global_step": 274820, "epoch": 3311} {"train_loss": -24.534778594970703, "global_step": 274821, "epoch": 3311} {"train_loss": -24.066038131713867, "global_step": 274822, "epoch": 3311} {"train_loss": -24.47828483581543, "global_step": 274823, "epoch": 3311} {"train_loss": -24.55909538269043, "global_step": 274824, "epoch": 3311} {"train_loss": -24.832895278930664, "global_step": 274825, "epoch": 3311} {"train_loss": -24.730993270874023, "global_step": 274826, "epoch": 3311} {"train_loss": -25.07021141052246, "global_step": 274827, "epoch": 3311} {"train_loss": -24.606067657470703, "global_step": 274828, "epoch": 3311} {"train_loss": -24.895231246948242, "global_step": 274829, "epoch": 3311} {"train_loss": -24.856674194335938, "global_step": 274830, "epoch": 3311} {"train_loss": -25.118440628051758, "global_step": 274831, "epoch": 3311} {"train_loss": -24.774656295776367, "global_step": 274832, "epoch": 3311} {"train_loss": -24.9241886138916, "global_step": 274833, "epoch": 3311} {"train_loss": -25.227680206298828, "global_step": 274834, "epoch": 3311} {"train_loss": -24.625749588012695, "global_step": 274835, "epoch": 3311} {"train_loss": -24.88604164123535, "global_step": 274836, "epoch": 3311} {"train_loss": -25.062070846557617, "global_step": 274837, "epoch": 3311} {"train_loss": -25.340242385864258, "global_step": 274838, "epoch": 3311} {"train_loss": -25.257158279418945, "global_step": 274839, "epoch": 3311} {"train_loss": -25.318878173828125, "global_step": 274840, "epoch": 3311} {"train_loss": -25.22913932800293, "global_step": 274841, "epoch": 3311} {"train_loss": -25.059457778930664, "global_step": 274842, "epoch": 3311} {"train_loss": -24.994659423828125, "global_step": 274843, "epoch": 3311} {"train_loss": -24.681747436523438, "global_step": 274844, "epoch": 3311} {"train_loss": -24.82184410095215, "global_step": 274845, "epoch": 3311} {"train_loss": -25.211339950561523, "global_step": 274846, "epoch": 3311} {"train_loss": -25.324308395385742, "global_step": 274847, "epoch": 3311} {"train_loss": -24.735000610351562, "global_step": 274848, "epoch": 3311} {"train_loss": -25.507465362548828, "global_step": 274849, "epoch": 3311} {"train_loss": -25.280080795288086, "global_step": 274850, "epoch": 3311} {"train_loss": -25.106313705444336, "global_step": 274851, "epoch": 3311} {"train_loss": -25.308786392211914, "global_step": 274852, "epoch": 3311} {"train_loss": -25.10516357421875, "global_step": 274853, "epoch": 3311} {"train_loss": -24.984586715698242, "global_step": 274854, "epoch": 3311} {"train_loss": -24.632287979125977, "global_step": 274855, "epoch": 3311} {"train_loss": -25.229448318481445, "global_step": 274856, "epoch": 3311} {"train_loss": -25.26784324645996, "global_step": 274857, "epoch": 3311} {"train_loss": -24.850793838500977, "global_step": 274858, "epoch": 3311} {"train_loss": -24.657072067260742, "global_step": 274859, "epoch": 3311} {"train_loss": -25.194368362426758, "global_step": 274860, "epoch": 3311} {"train_loss": -25.080366134643555, "global_step": 274861, "epoch": 3311} {"train_loss": -24.94329833984375, "global_step": 274862, "epoch": 3311} {"train_loss": -25.202011108398438, "global_step": 274863, "epoch": 3311} {"train_loss": -24.866104125976562, "global_step": 274864, "epoch": 3311} {"train_loss": -25.488611221313477, "global_step": 274865, "epoch": 3311} {"train_loss": -24.813047409057617, "global_step": 274866, "epoch": 3311} {"train_loss": -25.365427017211914, "global_step": 274867, "epoch": 3311} {"train_loss": -25.070329666137695, "global_step": 274868, "epoch": 3311} {"train_loss": -25.340194702148438, "global_step": 274869, "epoch": 3311} {"train_loss": -25.431854248046875, "global_step": 274870, "epoch": 3311} {"train_loss": -24.946847915649414, "global_step": 274871, "epoch": 3311} {"train_loss": -25.380563735961914, "global_step": 274872, "epoch": 3311} {"train_loss": -25.3740177154541, "global_step": 274873, "epoch": 3311} {"train_loss": -25.1441707611084, "global_step": 274874, "epoch": 3311} {"train_loss": -25.29044532775879, "global_step": 274875, "epoch": 3311} {"train_loss": -25.335102081298828, "global_step": 274876, "epoch": 3311} {"train_loss": -25.354129791259766, "global_step": 274877, "epoch": 3311} {"train_loss": -25.1392879486084, "global_step": 274878, "epoch": 3311} {"train_loss": -25.27766990661621, "global_step": 274879, "epoch": 3311} {"train_loss": -25.535303115844727, "global_step": 274880, "epoch": 3311} {"train_loss": -25.375146865844727, "global_step": 274881, "epoch": 3311} {"train_loss": -25.142654418945312, "global_step": 274882, "epoch": 3311} {"train_loss": -25.34767723083496, "global_step": 274883, "epoch": 3311} {"train_loss": -25.772903442382812, "global_step": 274884, "epoch": 3311} {"train_loss": -25.288440704345703, "global_step": 274885, "epoch": 3311} {"train_loss": -25.442821502685547, "global_step": 274886, "epoch": 3311} {"train_loss": -25.38868522644043, "global_step": 274887, "epoch": 3311} {"train_loss": -25.119873046875, "global_step": 274888, "epoch": 3311} {"train_loss": -25.090417861938477, "global_step": 274889, "epoch": 3311} {"train_loss": -24.729249954223633, "global_step": 274890, "epoch": 3311} {"train_loss": -25.00208854675293, "global_step": 274891, "epoch": 3311} {"train_loss": -25.289777755737305, "global_step": 274892, "epoch": 3311} {"train_loss": -24.94483757019043, "global_step": 274893, "epoch": 3311} {"train_loss": -24.947824478149414, "global_step": 274894, "epoch": 3311} {"train_loss": -25.025407791137695, "global_step": 274895, "epoch": 3311, "val_loss": 7110094.5} {"train_loss": -24.18622398376465, "global_step": 274896, "epoch": 3312} {"train_loss": -24.098716735839844, "global_step": 274897, "epoch": 3312} {"train_loss": -24.360782623291016, "global_step": 274898, "epoch": 3312} {"train_loss": -24.362485885620117, "global_step": 274899, "epoch": 3312} {"train_loss": -24.337629318237305, "global_step": 274900, "epoch": 3312} {"train_loss": -24.248075485229492, "global_step": 274901, "epoch": 3312} {"train_loss": -25.05398941040039, "global_step": 274902, "epoch": 3312} {"train_loss": -24.83622169494629, "global_step": 274903, "epoch": 3312} {"train_loss": -24.570453643798828, "global_step": 274904, "epoch": 3312} {"train_loss": -24.882801055908203, "global_step": 274905, "epoch": 3312} {"train_loss": -24.60293960571289, "global_step": 274906, "epoch": 3312} {"train_loss": -24.96525001525879, "global_step": 274907, "epoch": 3312} {"train_loss": -24.774030685424805, "global_step": 274908, "epoch": 3312} {"train_loss": -24.88411521911621, "global_step": 274909, "epoch": 3312} {"train_loss": -24.739395141601562, "global_step": 274910, "epoch": 3312} {"train_loss": -24.869155883789062, "global_step": 274911, "epoch": 3312} {"train_loss": -24.80360221862793, "global_step": 274912, "epoch": 3312} {"train_loss": -25.217361450195312, "global_step": 274913, "epoch": 3312} {"train_loss": -25.277816772460938, "global_step": 274914, "epoch": 3312} {"train_loss": -25.08709716796875, "global_step": 274915, "epoch": 3312} {"train_loss": -24.859642028808594, "global_step": 274916, "epoch": 3312} {"train_loss": -24.868051528930664, "global_step": 274917, "epoch": 3312} {"train_loss": -25.155235290527344, "global_step": 274918, "epoch": 3312} {"train_loss": -25.38541030883789, "global_step": 274919, "epoch": 3312} {"train_loss": -24.949413299560547, "global_step": 274920, "epoch": 3312} {"train_loss": -25.25273895263672, "global_step": 274921, "epoch": 3312} {"train_loss": -25.207508087158203, "global_step": 274922, "epoch": 3312} {"train_loss": -25.230297088623047, "global_step": 274923, "epoch": 3312} {"train_loss": -25.130155563354492, "global_step": 274924, "epoch": 3312} {"train_loss": -25.32505226135254, "global_step": 274925, "epoch": 3312} {"train_loss": -25.129608154296875, "global_step": 274926, "epoch": 3312} {"train_loss": -25.451343536376953, "global_step": 274927, "epoch": 3312} {"train_loss": -25.434879302978516, "global_step": 274928, "epoch": 3312} {"train_loss": -25.577041625976562, "global_step": 274929, "epoch": 3312} {"train_loss": -25.21733283996582, "global_step": 274930, "epoch": 3312} {"train_loss": -25.421398162841797, "global_step": 274931, "epoch": 3312} {"train_loss": -25.384206771850586, "global_step": 274932, "epoch": 3312} {"train_loss": -25.35297966003418, "global_step": 274933, "epoch": 3312} {"train_loss": -25.469783782958984, "global_step": 274934, "epoch": 3312} {"train_loss": -25.556564331054688, "global_step": 274935, "epoch": 3312} {"train_loss": -25.60031509399414, "global_step": 274936, "epoch": 3312} {"train_loss": -25.38773536682129, "global_step": 274937, "epoch": 3312} {"train_loss": -25.567197799682617, "global_step": 274938, "epoch": 3312} {"train_loss": -25.304309844970703, "global_step": 274939, "epoch": 3312} {"train_loss": -25.161962509155273, "global_step": 274940, "epoch": 3312} {"train_loss": -25.28784942626953, "global_step": 274941, "epoch": 3312} {"train_loss": -25.45615577697754, "global_step": 274942, "epoch": 3312} {"train_loss": -25.52926254272461, "global_step": 274943, "epoch": 3312} {"train_loss": -25.66621208190918, "global_step": 274944, "epoch": 3312} {"train_loss": -25.463199615478516, "global_step": 274945, "epoch": 3312} {"train_loss": -25.75929832458496, "global_step": 274946, "epoch": 3312} {"train_loss": -25.711225509643555, "global_step": 274947, "epoch": 3312} {"train_loss": -25.127866744995117, "global_step": 274948, "epoch": 3312} {"train_loss": -25.328798294067383, "global_step": 274949, "epoch": 3312} {"train_loss": -25.232759475708008, "global_step": 274950, "epoch": 3312} {"train_loss": -25.467639923095703, "global_step": 274951, "epoch": 3312} {"train_loss": -25.289396286010742, "global_step": 274952, "epoch": 3312} {"train_loss": -25.477724075317383, "global_step": 274953, "epoch": 3312} {"train_loss": -25.25747299194336, "global_step": 274954, "epoch": 3312} {"train_loss": -25.481298446655273, "global_step": 274955, "epoch": 3312} {"train_loss": -25.30586814880371, "global_step": 274956, "epoch": 3312} {"train_loss": -25.242372512817383, "global_step": 274957, "epoch": 3312} {"train_loss": -25.1168270111084, "global_step": 274958, "epoch": 3312} {"train_loss": -25.331512451171875, "global_step": 274959, "epoch": 3312} {"train_loss": -25.124887466430664, "global_step": 274960, "epoch": 3312} {"train_loss": -25.521039962768555, "global_step": 274961, "epoch": 3312} {"train_loss": -25.42133331298828, "global_step": 274962, "epoch": 3312} {"train_loss": -25.564729690551758, "global_step": 274963, "epoch": 3312} {"train_loss": -25.221078872680664, "global_step": 274964, "epoch": 3312} {"train_loss": -25.498769760131836, "global_step": 274965, "epoch": 3312} {"train_loss": -25.491369247436523, "global_step": 274966, "epoch": 3312} {"train_loss": -25.53471565246582, "global_step": 274967, "epoch": 3312} {"train_loss": -25.511474609375, "global_step": 274968, "epoch": 3312} {"train_loss": -25.183691024780273, "global_step": 274969, "epoch": 3312} {"train_loss": -25.26058578491211, "global_step": 274970, "epoch": 3312} {"train_loss": -25.4504337310791, "global_step": 274971, "epoch": 3312} {"train_loss": -24.95513916015625, "global_step": 274972, "epoch": 3312} {"train_loss": -25.537809371948242, "global_step": 274973, "epoch": 3312} {"train_loss": -25.44607925415039, "global_step": 274974, "epoch": 3312} {"train_loss": -25.321348190307617, "global_step": 274975, "epoch": 3312} {"train_loss": -25.454620361328125, "global_step": 274976, "epoch": 3312} {"train_loss": -25.4591064453125, "global_step": 274977, "epoch": 3312} {"train_loss": -25.203600642192793, "global_step": 274978, "epoch": 3312, "val_loss": 7027018.0} {"train_loss": -25.201889038085938, "global_step": 274979, "epoch": 3313} {"train_loss": -24.594078063964844, "global_step": 274980, "epoch": 3313} {"train_loss": -25.168142318725586, "global_step": 274981, "epoch": 3313} {"train_loss": -24.99290657043457, "global_step": 274982, "epoch": 3313} {"train_loss": -25.739118576049805, "global_step": 274983, "epoch": 3313} {"train_loss": -25.208454132080078, "global_step": 274984, "epoch": 3313} {"train_loss": -25.111791610717773, "global_step": 274985, "epoch": 3313} {"train_loss": -25.54294776916504, "global_step": 274986, "epoch": 3313} {"train_loss": -24.99683952331543, "global_step": 274987, "epoch": 3313} {"train_loss": -25.2487850189209, "global_step": 274988, "epoch": 3313} {"train_loss": -25.192882537841797, "global_step": 274989, "epoch": 3313} {"train_loss": -25.40129852294922, "global_step": 274990, "epoch": 3313} {"train_loss": -25.26563835144043, "global_step": 274991, "epoch": 3313} {"train_loss": -25.370677947998047, "global_step": 274992, "epoch": 3313} {"train_loss": -25.713123321533203, "global_step": 274993, "epoch": 3313} {"train_loss": -24.974430084228516, "global_step": 274994, "epoch": 3313} {"train_loss": -25.549936294555664, "global_step": 274995, "epoch": 3313} {"train_loss": -25.346492767333984, "global_step": 274996, "epoch": 3313} {"train_loss": -25.550275802612305, "global_step": 274997, "epoch": 3313} {"train_loss": -25.172191619873047, "global_step": 274998, "epoch": 3313} {"train_loss": -25.218223571777344, "global_step": 274999, "epoch": 3313} {"train_loss": -25.067153930664062, "global_step": 275000, "epoch": 3313} {"train_loss": -25.50212860107422, "global_step": 275001, "epoch": 3313} {"train_loss": -25.499181747436523, "global_step": 275002, "epoch": 3313} {"train_loss": -25.79249382019043, "global_step": 275003, "epoch": 3313} {"train_loss": -25.567655563354492, "global_step": 275004, "epoch": 3313} {"train_loss": -25.62177085876465, "global_step": 275005, "epoch": 3313} {"train_loss": -25.584028244018555, "global_step": 275006, "epoch": 3313} {"train_loss": -25.39325714111328, "global_step": 275007, "epoch": 3313} {"train_loss": -25.201223373413086, "global_step": 275008, "epoch": 3313} {"train_loss": -25.694669723510742, "global_step": 275009, "epoch": 3313} {"train_loss": -25.467098236083984, "global_step": 275010, "epoch": 3313} {"train_loss": -25.509767532348633, "global_step": 275011, "epoch": 3313} {"train_loss": -25.18448257446289, "global_step": 275012, "epoch": 3313} {"train_loss": -25.213104248046875, "global_step": 275013, "epoch": 3313} {"train_loss": -25.088117599487305, "global_step": 275014, "epoch": 3313} {"train_loss": -25.419158935546875, "global_step": 275015, "epoch": 3313} {"train_loss": -25.501670837402344, "global_step": 275016, "epoch": 3313} {"train_loss": -25.143875122070312, "global_step": 275017, "epoch": 3313} {"train_loss": -25.299015045166016, "global_step": 275018, "epoch": 3313} {"train_loss": -24.88991355895996, "global_step": 275019, "epoch": 3313} {"train_loss": -24.71914291381836, "global_step": 275020, "epoch": 3313} {"train_loss": -24.862873077392578, "global_step": 275021, "epoch": 3313} {"train_loss": -25.23728370666504, "global_step": 275022, "epoch": 3313} {"train_loss": -25.074188232421875, "global_step": 275023, "epoch": 3313} {"train_loss": -25.45013427734375, "global_step": 275024, "epoch": 3313} {"train_loss": -25.520090103149414, "global_step": 275025, "epoch": 3313} {"train_loss": -25.57535171508789, "global_step": 275026, "epoch": 3313} {"train_loss": -25.16135025024414, "global_step": 275027, "epoch": 3313} {"train_loss": -25.158370971679688, "global_step": 275028, "epoch": 3313} {"train_loss": -25.324567794799805, "global_step": 275029, "epoch": 3313} {"train_loss": -25.04560661315918, "global_step": 275030, "epoch": 3313} {"train_loss": -24.942245483398438, "global_step": 275031, "epoch": 3313} {"train_loss": -24.760160446166992, "global_step": 275032, "epoch": 3313} {"train_loss": -25.200977325439453, "global_step": 275033, "epoch": 3313} {"train_loss": -25.653898239135742, "global_step": 275034, "epoch": 3313} {"train_loss": -25.667661666870117, "global_step": 275035, "epoch": 3313} {"train_loss": -25.189767837524414, "global_step": 275036, "epoch": 3313} {"train_loss": -25.42891502380371, "global_step": 275037, "epoch": 3313} {"train_loss": -25.197965621948242, "global_step": 275038, "epoch": 3313} {"train_loss": -25.50800895690918, "global_step": 275039, "epoch": 3313} {"train_loss": -25.26076889038086, "global_step": 275040, "epoch": 3313} {"train_loss": -25.659555435180664, "global_step": 275041, "epoch": 3313} {"train_loss": -25.34423065185547, "global_step": 275042, "epoch": 3313} {"train_loss": -25.84730339050293, "global_step": 275043, "epoch": 3313} {"train_loss": -25.235525131225586, "global_step": 275044, "epoch": 3313} {"train_loss": -25.528112411499023, "global_step": 275045, "epoch": 3313} {"train_loss": -25.624710083007812, "global_step": 275046, "epoch": 3313} {"train_loss": -25.33885383605957, "global_step": 275047, "epoch": 3313} {"train_loss": -25.904447555541992, "global_step": 275048, "epoch": 3313} {"train_loss": -25.4271183013916, "global_step": 275049, "epoch": 3313} {"train_loss": -25.349056243896484, "global_step": 275050, "epoch": 3313} {"train_loss": -25.66419792175293, "global_step": 275051, "epoch": 3313} {"train_loss": -25.388830184936523, "global_step": 275052, "epoch": 3313} {"train_loss": -25.52033042907715, "global_step": 275053, "epoch": 3313} {"train_loss": -25.1822452545166, "global_step": 275054, "epoch": 3313} {"train_loss": -25.26485252380371, "global_step": 275055, "epoch": 3313} {"train_loss": -25.228933334350586, "global_step": 275056, "epoch": 3313} {"train_loss": -25.41717529296875, "global_step": 275057, "epoch": 3313} {"train_loss": -25.14904022216797, "global_step": 275058, "epoch": 3313} {"train_loss": -25.365964889526367, "global_step": 275059, "epoch": 3313} {"train_loss": -25.22163200378418, "global_step": 275060, "epoch": 3313} {"train_loss": -25.333314114306347, "global_step": 275061, "epoch": 3313, "val_loss": 7120384.0} {"train_loss": -24.615514755249023, "global_step": 275062, "epoch": 3314} {"train_loss": -24.555578231811523, "global_step": 275063, "epoch": 3314} {"train_loss": -24.01373291015625, "global_step": 275064, "epoch": 3314} {"train_loss": -24.498512268066406, "global_step": 275065, "epoch": 3314} {"train_loss": -24.569374084472656, "global_step": 275066, "epoch": 3314} {"train_loss": -24.689359664916992, "global_step": 275067, "epoch": 3314} {"train_loss": -24.35282325744629, "global_step": 275068, "epoch": 3314} {"train_loss": -24.51348876953125, "global_step": 275069, "epoch": 3314} {"train_loss": -24.64518928527832, "global_step": 275070, "epoch": 3314} {"train_loss": -24.592435836791992, "global_step": 275071, "epoch": 3314} {"train_loss": -24.75943946838379, "global_step": 275072, "epoch": 3314} {"train_loss": -25.048439025878906, "global_step": 275073, "epoch": 3314} {"train_loss": -24.893423080444336, "global_step": 275074, "epoch": 3314} {"train_loss": -24.56216812133789, "global_step": 275075, "epoch": 3314} {"train_loss": -24.758638381958008, "global_step": 275076, "epoch": 3314} {"train_loss": -24.674114227294922, "global_step": 275077, "epoch": 3314} {"train_loss": -24.984704971313477, "global_step": 275078, "epoch": 3314} {"train_loss": -25.286884307861328, "global_step": 275079, "epoch": 3314} {"train_loss": -24.811594009399414, "global_step": 275080, "epoch": 3314} {"train_loss": -24.97382354736328, "global_step": 275081, "epoch": 3314} {"train_loss": -24.774099349975586, "global_step": 275082, "epoch": 3314} {"train_loss": -24.953916549682617, "global_step": 275083, "epoch": 3314} {"train_loss": -25.273073196411133, "global_step": 275084, "epoch": 3314} {"train_loss": -25.399499893188477, "global_step": 275085, "epoch": 3314} {"train_loss": -25.0587215423584, "global_step": 275086, "epoch": 3314} {"train_loss": -25.298080444335938, "global_step": 275087, "epoch": 3314} {"train_loss": -25.139299392700195, "global_step": 275088, "epoch": 3314} {"train_loss": -25.508800506591797, "global_step": 275089, "epoch": 3314} {"train_loss": -25.552766799926758, "global_step": 275090, "epoch": 3314} {"train_loss": -25.56299591064453, "global_step": 275091, "epoch": 3314} {"train_loss": -25.25775146484375, "global_step": 275092, "epoch": 3314} {"train_loss": -25.486709594726562, "global_step": 275093, "epoch": 3314} {"train_loss": -25.038490295410156, "global_step": 275094, "epoch": 3314} {"train_loss": -25.34499168395996, "global_step": 275095, "epoch": 3314} {"train_loss": -25.026304244995117, "global_step": 275096, "epoch": 3314} {"train_loss": -24.90529441833496, "global_step": 275097, "epoch": 3314} {"train_loss": -25.352596282958984, "global_step": 275098, "epoch": 3314} {"train_loss": -25.78400993347168, "global_step": 275099, "epoch": 3314} {"train_loss": -25.368619918823242, "global_step": 275100, "epoch": 3314} {"train_loss": -25.261510848999023, "global_step": 275101, "epoch": 3314} {"train_loss": -25.535375595092773, "global_step": 275102, "epoch": 3314} {"train_loss": -25.329845428466797, "global_step": 275103, "epoch": 3314} {"train_loss": -25.457021713256836, "global_step": 275104, "epoch": 3314} {"train_loss": -25.472152709960938, "global_step": 275105, "epoch": 3314} {"train_loss": -25.46730613708496, "global_step": 275106, "epoch": 3314} {"train_loss": -25.37613868713379, "global_step": 275107, "epoch": 3314} {"train_loss": -25.402381896972656, "global_step": 275108, "epoch": 3314} {"train_loss": -25.7476749420166, "global_step": 275109, "epoch": 3314} {"train_loss": -25.62384033203125, "global_step": 275110, "epoch": 3314} {"train_loss": -25.748998641967773, "global_step": 275111, "epoch": 3314} {"train_loss": -25.53304100036621, "global_step": 275112, "epoch": 3314} {"train_loss": -25.587764739990234, "global_step": 275113, "epoch": 3314} {"train_loss": -25.463834762573242, "global_step": 275114, "epoch": 3314} {"train_loss": -25.440038681030273, "global_step": 275115, "epoch": 3314} {"train_loss": -25.37578582763672, "global_step": 275116, "epoch": 3314} {"train_loss": -25.54034996032715, "global_step": 275117, "epoch": 3314} {"train_loss": -25.796934127807617, "global_step": 275118, "epoch": 3314} {"train_loss": -25.485553741455078, "global_step": 275119, "epoch": 3314} {"train_loss": -25.523666381835938, "global_step": 275120, "epoch": 3314} {"train_loss": -25.826562881469727, "global_step": 275121, "epoch": 3314} {"train_loss": -25.521451950073242, "global_step": 275122, "epoch": 3314} {"train_loss": -25.528594970703125, "global_step": 275123, "epoch": 3314} {"train_loss": -25.789112091064453, "global_step": 275124, "epoch": 3314} {"train_loss": -25.693838119506836, "global_step": 275125, "epoch": 3314} {"train_loss": -25.249797821044922, "global_step": 275126, "epoch": 3314} {"train_loss": -25.743600845336914, "global_step": 275127, "epoch": 3314} {"train_loss": -25.508453369140625, "global_step": 275128, "epoch": 3314} {"train_loss": -25.3750057220459, "global_step": 275129, "epoch": 3314} {"train_loss": -25.109577178955078, "global_step": 275130, "epoch": 3314} {"train_loss": -25.198780059814453, "global_step": 275131, "epoch": 3314} {"train_loss": -25.45184898376465, "global_step": 275132, "epoch": 3314} {"train_loss": -25.35057830810547, "global_step": 275133, "epoch": 3314} {"train_loss": -25.598142623901367, "global_step": 275134, "epoch": 3314} {"train_loss": -25.388538360595703, "global_step": 275135, "epoch": 3314} {"train_loss": -25.463254928588867, "global_step": 275136, "epoch": 3314} {"train_loss": -24.946826934814453, "global_step": 275137, "epoch": 3314} {"train_loss": -25.50210952758789, "global_step": 275138, "epoch": 3314} {"train_loss": -24.93729019165039, "global_step": 275139, "epoch": 3314} {"train_loss": -24.887434005737305, "global_step": 275140, "epoch": 3314} {"train_loss": -25.058317184448242, "global_step": 275141, "epoch": 3314} {"train_loss": -25.59236717224121, "global_step": 275142, "epoch": 3314} {"train_loss": -24.962594985961914, "global_step": 275143, "epoch": 3314} {"train_loss": -25.23182664434594, "global_step": 275144, "epoch": 3314, "val_loss": 6947643.0} {"train_loss": -24.503236770629883, "global_step": 275145, "epoch": 3315} {"train_loss": -23.295475006103516, "global_step": 275146, "epoch": 3315} {"train_loss": -23.470918655395508, "global_step": 275147, "epoch": 3315} {"train_loss": -24.4349365234375, "global_step": 275148, "epoch": 3315} {"train_loss": -24.21186637878418, "global_step": 275149, "epoch": 3315} {"train_loss": -24.1047420501709, "global_step": 275150, "epoch": 3315} {"train_loss": -24.431703567504883, "global_step": 275151, "epoch": 3315} {"train_loss": -24.02516746520996, "global_step": 275152, "epoch": 3315} {"train_loss": -24.809926986694336, "global_step": 275153, "epoch": 3315} {"train_loss": -24.21558952331543, "global_step": 275154, "epoch": 3315} {"train_loss": -24.4412841796875, "global_step": 275155, "epoch": 3315} {"train_loss": -24.80568504333496, "global_step": 275156, "epoch": 3315} {"train_loss": -24.46728515625, "global_step": 275157, "epoch": 3315} {"train_loss": -24.724349975585938, "global_step": 275158, "epoch": 3315} {"train_loss": -24.852951049804688, "global_step": 275159, "epoch": 3315} {"train_loss": -24.560060501098633, "global_step": 275160, "epoch": 3315} {"train_loss": -25.114463806152344, "global_step": 275161, "epoch": 3315} {"train_loss": -25.22772789001465, "global_step": 275162, "epoch": 3315} {"train_loss": -24.841901779174805, "global_step": 275163, "epoch": 3315} {"train_loss": -24.980682373046875, "global_step": 275164, "epoch": 3315} {"train_loss": -25.27984619140625, "global_step": 275165, "epoch": 3315} {"train_loss": -25.15620994567871, "global_step": 275166, "epoch": 3315} {"train_loss": -24.995351791381836, "global_step": 275167, "epoch": 3315} {"train_loss": -24.7669677734375, "global_step": 275168, "epoch": 3315} {"train_loss": -25.085172653198242, "global_step": 275169, "epoch": 3315} {"train_loss": -25.172880172729492, "global_step": 275170, "epoch": 3315} {"train_loss": -25.154369354248047, "global_step": 275171, "epoch": 3315} {"train_loss": -25.196582794189453, "global_step": 275172, "epoch": 3315} {"train_loss": -25.08186912536621, "global_step": 275173, "epoch": 3315} {"train_loss": -25.159515380859375, "global_step": 275174, "epoch": 3315} {"train_loss": -24.989500045776367, "global_step": 275175, "epoch": 3315} {"train_loss": -25.75249671936035, "global_step": 275176, "epoch": 3315} {"train_loss": -25.293628692626953, "global_step": 275177, "epoch": 3315} {"train_loss": -25.0421199798584, "global_step": 275178, "epoch": 3315} {"train_loss": -25.39143180847168, "global_step": 275179, "epoch": 3315} {"train_loss": -25.147327423095703, "global_step": 275180, "epoch": 3315} {"train_loss": -25.39369010925293, "global_step": 275181, "epoch": 3315} {"train_loss": -25.017921447753906, "global_step": 275182, "epoch": 3315} {"train_loss": -25.335155487060547, "global_step": 275183, "epoch": 3315} {"train_loss": -25.753625869750977, "global_step": 275184, "epoch": 3315} {"train_loss": -25.55677032470703, "global_step": 275185, "epoch": 3315} {"train_loss": -25.177709579467773, "global_step": 275186, "epoch": 3315} {"train_loss": -25.334850311279297, "global_step": 275187, "epoch": 3315} {"train_loss": -25.532806396484375, "global_step": 275188, "epoch": 3315} {"train_loss": -25.17554473876953, "global_step": 275189, "epoch": 3315} {"train_loss": -25.582550048828125, "global_step": 275190, "epoch": 3315} {"train_loss": -25.255115509033203, "global_step": 275191, "epoch": 3315} {"train_loss": -25.46028709411621, "global_step": 275192, "epoch": 3315} {"train_loss": -25.67575454711914, "global_step": 275193, "epoch": 3315} {"train_loss": -25.560468673706055, "global_step": 275194, "epoch": 3315} {"train_loss": -25.55820083618164, "global_step": 275195, "epoch": 3315} {"train_loss": -25.182144165039062, "global_step": 275196, "epoch": 3315} {"train_loss": -25.259342193603516, "global_step": 275197, "epoch": 3315} {"train_loss": -25.263296127319336, "global_step": 275198, "epoch": 3315} {"train_loss": -24.66558265686035, "global_step": 275199, "epoch": 3315} {"train_loss": -25.352575302124023, "global_step": 275200, "epoch": 3315} {"train_loss": -25.305713653564453, "global_step": 275201, "epoch": 3315} {"train_loss": -25.247690200805664, "global_step": 275202, "epoch": 3315} {"train_loss": -25.046226501464844, "global_step": 275203, "epoch": 3315} {"train_loss": -25.00864601135254, "global_step": 275204, "epoch": 3315} {"train_loss": -25.382843017578125, "global_step": 275205, "epoch": 3315} {"train_loss": -25.41872215270996, "global_step": 275206, "epoch": 3315} {"train_loss": -25.449064254760742, "global_step": 275207, "epoch": 3315} {"train_loss": -25.482580184936523, "global_step": 275208, "epoch": 3315} {"train_loss": -25.568994522094727, "global_step": 275209, "epoch": 3315} {"train_loss": -25.324615478515625, "global_step": 275210, "epoch": 3315} {"train_loss": -25.630054473876953, "global_step": 275211, "epoch": 3315} {"train_loss": -25.4863338470459, "global_step": 275212, "epoch": 3315} {"train_loss": -25.358713150024414, "global_step": 275213, "epoch": 3315} {"train_loss": -25.239595413208008, "global_step": 275214, "epoch": 3315} {"train_loss": -25.6093692779541, "global_step": 275215, "epoch": 3315} {"train_loss": -25.541519165039062, "global_step": 275216, "epoch": 3315} {"train_loss": -25.373369216918945, "global_step": 275217, "epoch": 3315} {"train_loss": -25.391294479370117, "global_step": 275218, "epoch": 3315} {"train_loss": -25.57486343383789, "global_step": 275219, "epoch": 3315} {"train_loss": -25.749237060546875, "global_step": 275220, "epoch": 3315} {"train_loss": -25.217803955078125, "global_step": 275221, "epoch": 3315} {"train_loss": -25.425222396850586, "global_step": 275222, "epoch": 3315} {"train_loss": -25.52806854248047, "global_step": 275223, "epoch": 3315} {"train_loss": -25.717161178588867, "global_step": 275224, "epoch": 3315} {"train_loss": -25.222837448120117, "global_step": 275225, "epoch": 3315} {"train_loss": -25.728107452392578, "global_step": 275226, "epoch": 3315} {"train_loss": -25.146789458860834, "global_step": 275227, "epoch": 3315, "val_loss": 7006001.0} {"train_loss": -25.134016036987305, "global_step": 275228, "epoch": 3316} {"train_loss": -25.085920333862305, "global_step": 275229, "epoch": 3316} {"train_loss": -25.45730972290039, "global_step": 275230, "epoch": 3316} {"train_loss": -25.114675521850586, "global_step": 275231, "epoch": 3316} {"train_loss": -25.101892471313477, "global_step": 275232, "epoch": 3316} {"train_loss": -25.33695411682129, "global_step": 275233, "epoch": 3316} {"train_loss": -25.52731704711914, "global_step": 275234, "epoch": 3316} {"train_loss": -25.437833786010742, "global_step": 275235, "epoch": 3316} {"train_loss": -24.997398376464844, "global_step": 275236, "epoch": 3316} {"train_loss": -25.382104873657227, "global_step": 275237, "epoch": 3316} {"train_loss": -24.831220626831055, "global_step": 275238, "epoch": 3316} {"train_loss": -25.29619598388672, "global_step": 275239, "epoch": 3316} {"train_loss": -25.171710968017578, "global_step": 275240, "epoch": 3316} {"train_loss": -24.95204734802246, "global_step": 275241, "epoch": 3316} {"train_loss": -25.5964412689209, "global_step": 275242, "epoch": 3316} {"train_loss": -25.212953567504883, "global_step": 275243, "epoch": 3316} {"train_loss": -25.08925437927246, "global_step": 275244, "epoch": 3316} {"train_loss": -25.116455078125, "global_step": 275245, "epoch": 3316} {"train_loss": -25.053064346313477, "global_step": 275246, "epoch": 3316} {"train_loss": -25.18545150756836, "global_step": 275247, "epoch": 3316} {"train_loss": -25.144363403320312, "global_step": 275248, "epoch": 3316} {"train_loss": -25.47373390197754, "global_step": 275249, "epoch": 3316} {"train_loss": -25.667484283447266, "global_step": 275250, "epoch": 3316} {"train_loss": -25.322507858276367, "global_step": 275251, "epoch": 3316} {"train_loss": -25.0230655670166, "global_step": 275252, "epoch": 3316} {"train_loss": -25.20099449157715, "global_step": 275253, "epoch": 3316} {"train_loss": -25.199853897094727, "global_step": 275254, "epoch": 3316} {"train_loss": -25.834381103515625, "global_step": 275255, "epoch": 3316} {"train_loss": -25.062589645385742, "global_step": 275256, "epoch": 3316} {"train_loss": -25.44312286376953, "global_step": 275257, "epoch": 3316} {"train_loss": -25.270559310913086, "global_step": 275258, "epoch": 3316} {"train_loss": -25.213674545288086, "global_step": 275259, "epoch": 3316} {"train_loss": -25.287193298339844, "global_step": 275260, "epoch": 3316} {"train_loss": -25.300992965698242, "global_step": 275261, "epoch": 3316} {"train_loss": -25.534360885620117, "global_step": 275262, "epoch": 3316} {"train_loss": -25.507801055908203, "global_step": 275263, "epoch": 3316} {"train_loss": -25.34945297241211, "global_step": 275264, "epoch": 3316} {"train_loss": -25.785993576049805, "global_step": 275265, "epoch": 3316} {"train_loss": -25.204803466796875, "global_step": 275266, "epoch": 3316} {"train_loss": -25.556812286376953, "global_step": 275267, "epoch": 3316} {"train_loss": -25.669326782226562, "global_step": 275268, "epoch": 3316} {"train_loss": -25.634185791015625, "global_step": 275269, "epoch": 3316} {"train_loss": -25.524169921875, "global_step": 275270, "epoch": 3316} {"train_loss": -25.240890502929688, "global_step": 275271, "epoch": 3316} {"train_loss": -25.513452529907227, "global_step": 275272, "epoch": 3316} {"train_loss": -25.27626609802246, "global_step": 275273, "epoch": 3316} {"train_loss": -25.698835372924805, "global_step": 275274, "epoch": 3316} {"train_loss": -25.334823608398438, "global_step": 275275, "epoch": 3316} {"train_loss": -25.46027946472168, "global_step": 275276, "epoch": 3316} {"train_loss": -25.71346092224121, "global_step": 275277, "epoch": 3316} {"train_loss": -25.1593017578125, "global_step": 275278, "epoch": 3316} {"train_loss": -25.61252784729004, "global_step": 275279, "epoch": 3316} {"train_loss": -25.293447494506836, "global_step": 275280, "epoch": 3316} {"train_loss": -25.377286911010742, "global_step": 275281, "epoch": 3316} {"train_loss": -25.55268669128418, "global_step": 275282, "epoch": 3316} {"train_loss": -25.8388671875, "global_step": 275283, "epoch": 3316} {"train_loss": -25.464405059814453, "global_step": 275284, "epoch": 3316} {"train_loss": -25.724084854125977, "global_step": 275285, "epoch": 3316} {"train_loss": -25.607458114624023, "global_step": 275286, "epoch": 3316} {"train_loss": -25.433307647705078, "global_step": 275287, "epoch": 3316} {"train_loss": -25.522083282470703, "global_step": 275288, "epoch": 3316} {"train_loss": -24.74614906311035, "global_step": 275289, "epoch": 3316} {"train_loss": -24.72784996032715, "global_step": 275290, "epoch": 3316} {"train_loss": -24.602201461791992, "global_step": 275291, "epoch": 3316} {"train_loss": -23.88886070251465, "global_step": 275292, "epoch": 3316} {"train_loss": -24.89657974243164, "global_step": 275293, "epoch": 3316} {"train_loss": -24.533048629760742, "global_step": 275294, "epoch": 3316} {"train_loss": -25.010297775268555, "global_step": 275295, "epoch": 3316} {"train_loss": -24.93900489807129, "global_step": 275296, "epoch": 3316} {"train_loss": -24.956125259399414, "global_step": 275297, "epoch": 3316} {"train_loss": -25.125211715698242, "global_step": 275298, "epoch": 3316} {"train_loss": -24.961999893188477, "global_step": 275299, "epoch": 3316} {"train_loss": -25.134428024291992, "global_step": 275300, "epoch": 3316} {"train_loss": -25.320804595947266, "global_step": 275301, "epoch": 3316} {"train_loss": -25.256555557250977, "global_step": 275302, "epoch": 3316} {"train_loss": -25.040788650512695, "global_step": 275303, "epoch": 3316} {"train_loss": -25.276628494262695, "global_step": 275304, "epoch": 3316} {"train_loss": -25.202314376831055, "global_step": 275305, "epoch": 3316} {"train_loss": -25.33086585998535, "global_step": 275306, "epoch": 3316} {"train_loss": -25.195886611938477, "global_step": 275307, "epoch": 3316} {"train_loss": -25.255937576293945, "global_step": 275308, "epoch": 3316} {"train_loss": -25.245330810546875, "global_step": 275309, "epoch": 3316} {"train_loss": -25.277029313236834, "global_step": 275310, "epoch": 3316, "val_loss": 7071137.5} {"train_loss": -24.963394165039062, "global_step": 275311, "epoch": 3317} {"train_loss": -24.9422550201416, "global_step": 275312, "epoch": 3317} {"train_loss": -25.07577896118164, "global_step": 275313, "epoch": 3317} {"train_loss": -25.055723190307617, "global_step": 275314, "epoch": 3317} {"train_loss": -24.846403121948242, "global_step": 275315, "epoch": 3317} {"train_loss": -25.251941680908203, "global_step": 275316, "epoch": 3317} {"train_loss": -25.16070556640625, "global_step": 275317, "epoch": 3317} {"train_loss": -25.044519424438477, "global_step": 275318, "epoch": 3317} {"train_loss": -25.448965072631836, "global_step": 275319, "epoch": 3317} {"train_loss": -24.9810733795166, "global_step": 275320, "epoch": 3317} {"train_loss": -25.314939498901367, "global_step": 275321, "epoch": 3317} {"train_loss": -25.4378604888916, "global_step": 275322, "epoch": 3317} {"train_loss": -25.05632972717285, "global_step": 275323, "epoch": 3317} {"train_loss": -25.1829891204834, "global_step": 275324, "epoch": 3317} {"train_loss": -24.93339729309082, "global_step": 275325, "epoch": 3317} {"train_loss": -25.05009651184082, "global_step": 275326, "epoch": 3317} {"train_loss": -25.155696868896484, "global_step": 275327, "epoch": 3317} {"train_loss": -25.28578758239746, "global_step": 275328, "epoch": 3317} {"train_loss": -24.885147094726562, "global_step": 275329, "epoch": 3317} {"train_loss": -25.03627586364746, "global_step": 275330, "epoch": 3317} {"train_loss": -25.516372680664062, "global_step": 275331, "epoch": 3317} {"train_loss": -24.894489288330078, "global_step": 275332, "epoch": 3317} {"train_loss": -25.272689819335938, "global_step": 275333, "epoch": 3317} {"train_loss": -24.94123649597168, "global_step": 275334, "epoch": 3317} {"train_loss": -25.619043350219727, "global_step": 275335, "epoch": 3317} {"train_loss": -25.160818099975586, "global_step": 275336, "epoch": 3317} {"train_loss": -25.629907608032227, "global_step": 275337, "epoch": 3317} {"train_loss": -25.411413192749023, "global_step": 275338, "epoch": 3317} {"train_loss": -25.221467971801758, "global_step": 275339, "epoch": 3317} {"train_loss": -25.3486270904541, "global_step": 275340, "epoch": 3317} {"train_loss": -25.125436782836914, "global_step": 275341, "epoch": 3317} {"train_loss": -25.46310043334961, "global_step": 275342, "epoch": 3317} {"train_loss": -25.317590713500977, "global_step": 275343, "epoch": 3317} {"train_loss": -25.460052490234375, "global_step": 275344, "epoch": 3317} {"train_loss": -25.457416534423828, "global_step": 275345, "epoch": 3317} {"train_loss": -25.05243492126465, "global_step": 275346, "epoch": 3317} {"train_loss": -25.531875610351562, "global_step": 275347, "epoch": 3317} {"train_loss": -25.381071090698242, "global_step": 275348, "epoch": 3317} {"train_loss": -25.460777282714844, "global_step": 275349, "epoch": 3317} {"train_loss": -25.6711483001709, "global_step": 275350, "epoch": 3317} {"train_loss": -25.747343063354492, "global_step": 275351, "epoch": 3317} {"train_loss": -25.44193458557129, "global_step": 275352, "epoch": 3317} {"train_loss": -25.598054885864258, "global_step": 275353, "epoch": 3317} {"train_loss": -25.265596389770508, "global_step": 275354, "epoch": 3317} {"train_loss": -25.4968204498291, "global_step": 275355, "epoch": 3317} {"train_loss": -25.32086944580078, "global_step": 275356, "epoch": 3317} {"train_loss": -25.733610153198242, "global_step": 275357, "epoch": 3317} {"train_loss": -25.731958389282227, "global_step": 275358, "epoch": 3317} {"train_loss": -25.309934616088867, "global_step": 275359, "epoch": 3317} {"train_loss": -25.603315353393555, "global_step": 275360, "epoch": 3317} {"train_loss": -25.122581481933594, "global_step": 275361, "epoch": 3317} {"train_loss": -25.587602615356445, "global_step": 275362, "epoch": 3317} {"train_loss": -25.406408309936523, "global_step": 275363, "epoch": 3317} {"train_loss": -25.46921730041504, "global_step": 275364, "epoch": 3317} {"train_loss": -25.238264083862305, "global_step": 275365, "epoch": 3317} {"train_loss": -25.26166343688965, "global_step": 275366, "epoch": 3317} {"train_loss": -25.632474899291992, "global_step": 275367, "epoch": 3317} {"train_loss": -25.31648063659668, "global_step": 275368, "epoch": 3317} {"train_loss": -25.210508346557617, "global_step": 275369, "epoch": 3317} {"train_loss": -24.938791275024414, "global_step": 275370, "epoch": 3317} {"train_loss": -24.99293327331543, "global_step": 275371, "epoch": 3317} {"train_loss": -25.4664363861084, "global_step": 275372, "epoch": 3317} {"train_loss": -25.005516052246094, "global_step": 275373, "epoch": 3317} {"train_loss": -25.222692489624023, "global_step": 275374, "epoch": 3317} {"train_loss": -25.36518669128418, "global_step": 275375, "epoch": 3317} {"train_loss": -25.386198043823242, "global_step": 275376, "epoch": 3317} {"train_loss": -24.83144187927246, "global_step": 275377, "epoch": 3317} {"train_loss": -25.15338134765625, "global_step": 275378, "epoch": 3317} {"train_loss": -25.620779037475586, "global_step": 275379, "epoch": 3317} {"train_loss": -25.39600372314453, "global_step": 275380, "epoch": 3317} {"train_loss": -25.666290283203125, "global_step": 275381, "epoch": 3317} {"train_loss": -25.13302993774414, "global_step": 275382, "epoch": 3317} {"train_loss": -25.192312240600586, "global_step": 275383, "epoch": 3317} {"train_loss": -25.3395938873291, "global_step": 275384, "epoch": 3317} {"train_loss": -25.039653778076172, "global_step": 275385, "epoch": 3317} {"train_loss": -25.54728126525879, "global_step": 275386, "epoch": 3317} {"train_loss": -25.224842071533203, "global_step": 275387, "epoch": 3317} {"train_loss": -25.138790130615234, "global_step": 275388, "epoch": 3317} {"train_loss": -24.983083724975586, "global_step": 275389, "epoch": 3317} {"train_loss": -25.330249786376953, "global_step": 275390, "epoch": 3317} {"train_loss": -25.20383644104004, "global_step": 275391, "epoch": 3317} {"train_loss": -25.625152587890625, "global_step": 275392, "epoch": 3317} {"train_loss": -25.290871241006506, "global_step": 275393, "epoch": 3317, "val_loss": 6986225.0} {"train_loss": -25.24448585510254, "global_step": 275394, "epoch": 3318} {"train_loss": -25.01412582397461, "global_step": 275395, "epoch": 3318} {"train_loss": -25.01484489440918, "global_step": 275396, "epoch": 3318} {"train_loss": -25.073471069335938, "global_step": 275397, "epoch": 3318} {"train_loss": -24.83075714111328, "global_step": 275398, "epoch": 3318} {"train_loss": -24.68082046508789, "global_step": 275399, "epoch": 3318} {"train_loss": -24.925079345703125, "global_step": 275400, "epoch": 3318} {"train_loss": -24.802959442138672, "global_step": 275401, "epoch": 3318} {"train_loss": -25.208072662353516, "global_step": 275402, "epoch": 3318} {"train_loss": -25.12986946105957, "global_step": 275403, "epoch": 3318} {"train_loss": -25.60906410217285, "global_step": 275404, "epoch": 3318} {"train_loss": -25.272802352905273, "global_step": 275405, "epoch": 3318} {"train_loss": -25.187353134155273, "global_step": 275406, "epoch": 3318} {"train_loss": -25.110204696655273, "global_step": 275407, "epoch": 3318} {"train_loss": -25.43528938293457, "global_step": 275408, "epoch": 3318} {"train_loss": -25.252866744995117, "global_step": 275409, "epoch": 3318} {"train_loss": -25.170446395874023, "global_step": 275410, "epoch": 3318} {"train_loss": -25.217172622680664, "global_step": 275411, "epoch": 3318} {"train_loss": -25.433685302734375, "global_step": 275412, "epoch": 3318} {"train_loss": -25.5231990814209, "global_step": 275413, "epoch": 3318} {"train_loss": -25.14432716369629, "global_step": 275414, "epoch": 3318} {"train_loss": -25.29899024963379, "global_step": 275415, "epoch": 3318} {"train_loss": -25.671493530273438, "global_step": 275416, "epoch": 3318} {"train_loss": -25.231040954589844, "global_step": 275417, "epoch": 3318} {"train_loss": -25.6292724609375, "global_step": 275418, "epoch": 3318} {"train_loss": -25.314212799072266, "global_step": 275419, "epoch": 3318} {"train_loss": -25.255443572998047, "global_step": 275420, "epoch": 3318} {"train_loss": -25.702085494995117, "global_step": 275421, "epoch": 3318} {"train_loss": -25.628692626953125, "global_step": 275422, "epoch": 3318} {"train_loss": -25.490488052368164, "global_step": 275423, "epoch": 3318} {"train_loss": -25.505170822143555, "global_step": 275424, "epoch": 3318} {"train_loss": -25.51359748840332, "global_step": 275425, "epoch": 3318} {"train_loss": -25.626434326171875, "global_step": 275426, "epoch": 3318} {"train_loss": -25.454315185546875, "global_step": 275427, "epoch": 3318} {"train_loss": -25.175825119018555, "global_step": 275428, "epoch": 3318} {"train_loss": -25.418832778930664, "global_step": 275429, "epoch": 3318} {"train_loss": -25.57079315185547, "global_step": 275430, "epoch": 3318} {"train_loss": -25.542253494262695, "global_step": 275431, "epoch": 3318} {"train_loss": -25.256080627441406, "global_step": 275432, "epoch": 3318} {"train_loss": -25.27131462097168, "global_step": 275433, "epoch": 3318} {"train_loss": -25.562641143798828, "global_step": 275434, "epoch": 3318} {"train_loss": -25.35293960571289, "global_step": 275435, "epoch": 3318} {"train_loss": -25.5625057220459, "global_step": 275436, "epoch": 3318} {"train_loss": -25.503482818603516, "global_step": 275437, "epoch": 3318} {"train_loss": -25.568227767944336, "global_step": 275438, "epoch": 3318} {"train_loss": -25.049232482910156, "global_step": 275439, "epoch": 3318} {"train_loss": -24.908004760742188, "global_step": 275440, "epoch": 3318} {"train_loss": -25.226337432861328, "global_step": 275441, "epoch": 3318} {"train_loss": -25.561946868896484, "global_step": 275442, "epoch": 3318} {"train_loss": -25.41845703125, "global_step": 275443, "epoch": 3318} {"train_loss": -25.25237274169922, "global_step": 275444, "epoch": 3318} {"train_loss": -25.45855140686035, "global_step": 275445, "epoch": 3318} {"train_loss": -25.2694149017334, "global_step": 275446, "epoch": 3318} {"train_loss": -25.541860580444336, "global_step": 275447, "epoch": 3318} {"train_loss": -25.06233787536621, "global_step": 275448, "epoch": 3318} {"train_loss": -25.426603317260742, "global_step": 275449, "epoch": 3318} {"train_loss": -25.437910079956055, "global_step": 275450, "epoch": 3318} {"train_loss": -25.308313369750977, "global_step": 275451, "epoch": 3318} {"train_loss": -25.492219924926758, "global_step": 275452, "epoch": 3318} {"train_loss": -25.60721778869629, "global_step": 275453, "epoch": 3318} {"train_loss": -25.69248390197754, "global_step": 275454, "epoch": 3318} {"train_loss": -25.06696128845215, "global_step": 275455, "epoch": 3318} {"train_loss": -25.81624412536621, "global_step": 275456, "epoch": 3318} {"train_loss": -25.25640296936035, "global_step": 275457, "epoch": 3318} {"train_loss": -25.137603759765625, "global_step": 275458, "epoch": 3318} {"train_loss": -25.478002548217773, "global_step": 275459, "epoch": 3318} {"train_loss": -25.465900421142578, "global_step": 275460, "epoch": 3318} {"train_loss": -25.199459075927734, "global_step": 275461, "epoch": 3318} {"train_loss": -25.577924728393555, "global_step": 275462, "epoch": 3318} {"train_loss": -25.220352172851562, "global_step": 275463, "epoch": 3318} {"train_loss": -25.482717514038086, "global_step": 275464, "epoch": 3318} {"train_loss": -25.501605987548828, "global_step": 275465, "epoch": 3318} {"train_loss": -25.47187042236328, "global_step": 275466, "epoch": 3318} {"train_loss": -25.188940048217773, "global_step": 275467, "epoch": 3318} {"train_loss": -25.602575302124023, "global_step": 275468, "epoch": 3318} {"train_loss": -25.14057731628418, "global_step": 275469, "epoch": 3318} {"train_loss": -25.381620407104492, "global_step": 275470, "epoch": 3318} {"train_loss": -25.27908706665039, "global_step": 275471, "epoch": 3318} {"train_loss": -25.596891403198242, "global_step": 275472, "epoch": 3318} {"train_loss": -25.274351119995117, "global_step": 275473, "epoch": 3318} {"train_loss": -25.417707443237305, "global_step": 275474, "epoch": 3318} {"train_loss": -25.034015655517578, "global_step": 275475, "epoch": 3318} {"train_loss": -25.331875858536687, "global_step": 275476, "epoch": 3318, "val_loss": 7145979.0} {"train_loss": -24.992645263671875, "global_step": 275477, "epoch": 3319} {"train_loss": -24.66212272644043, "global_step": 275478, "epoch": 3319} {"train_loss": -24.5845947265625, "global_step": 275479, "epoch": 3319} {"train_loss": -24.923086166381836, "global_step": 275480, "epoch": 3319} {"train_loss": -25.055700302124023, "global_step": 275481, "epoch": 3319} {"train_loss": -25.16997528076172, "global_step": 275482, "epoch": 3319} {"train_loss": -24.66998291015625, "global_step": 275483, "epoch": 3319} {"train_loss": -24.86566925048828, "global_step": 275484, "epoch": 3319} {"train_loss": -25.031803131103516, "global_step": 275485, "epoch": 3319} {"train_loss": -24.761999130249023, "global_step": 275486, "epoch": 3319} {"train_loss": -24.7385311126709, "global_step": 275487, "epoch": 3319} {"train_loss": -25.28916358947754, "global_step": 275488, "epoch": 3319} {"train_loss": -25.43426513671875, "global_step": 275489, "epoch": 3319} {"train_loss": -24.87916374206543, "global_step": 275490, "epoch": 3319} {"train_loss": -25.053171157836914, "global_step": 275491, "epoch": 3319} {"train_loss": -25.401050567626953, "global_step": 275492, "epoch": 3319} {"train_loss": -24.71054458618164, "global_step": 275493, "epoch": 3319} {"train_loss": -24.949466705322266, "global_step": 275494, "epoch": 3319} {"train_loss": -25.12406349182129, "global_step": 275495, "epoch": 3319} {"train_loss": -25.0638484954834, "global_step": 275496, "epoch": 3319} {"train_loss": -24.876867294311523, "global_step": 275497, "epoch": 3319} {"train_loss": -25.667285919189453, "global_step": 275498, "epoch": 3319} {"train_loss": -25.161392211914062, "global_step": 275499, "epoch": 3319} {"train_loss": -24.782957077026367, "global_step": 275500, "epoch": 3319} {"train_loss": -25.603124618530273, "global_step": 275501, "epoch": 3319} {"train_loss": -25.018766403198242, "global_step": 275502, "epoch": 3319} {"train_loss": -25.39644432067871, "global_step": 275503, "epoch": 3319} {"train_loss": -25.22052764892578, "global_step": 275504, "epoch": 3319} {"train_loss": -25.583209991455078, "global_step": 275505, "epoch": 3319} {"train_loss": -25.379011154174805, "global_step": 275506, "epoch": 3319} {"train_loss": -25.727066040039062, "global_step": 275507, "epoch": 3319} {"train_loss": -25.539819717407227, "global_step": 275508, "epoch": 3319} {"train_loss": -25.689544677734375, "global_step": 275509, "epoch": 3319} {"train_loss": -25.451353073120117, "global_step": 275510, "epoch": 3319} {"train_loss": -25.450990676879883, "global_step": 275511, "epoch": 3319} {"train_loss": -25.507389068603516, "global_step": 275512, "epoch": 3319} {"train_loss": -25.409406661987305, "global_step": 275513, "epoch": 3319} {"train_loss": -25.536731719970703, "global_step": 275514, "epoch": 3319} {"train_loss": -25.273183822631836, "global_step": 275515, "epoch": 3319} {"train_loss": -25.584714889526367, "global_step": 275516, "epoch": 3319} {"train_loss": -25.39995765686035, "global_step": 275517, "epoch": 3319} {"train_loss": -25.82402992248535, "global_step": 275518, "epoch": 3319} {"train_loss": -25.426403045654297, "global_step": 275519, "epoch": 3319} {"train_loss": -25.29242515563965, "global_step": 275520, "epoch": 3319} {"train_loss": -25.324731826782227, "global_step": 275521, "epoch": 3319} {"train_loss": -25.11255645751953, "global_step": 275522, "epoch": 3319} {"train_loss": -25.3569278717041, "global_step": 275523, "epoch": 3319} {"train_loss": -25.642322540283203, "global_step": 275524, "epoch": 3319} {"train_loss": -25.53520965576172, "global_step": 275525, "epoch": 3319} {"train_loss": -25.576419830322266, "global_step": 275526, "epoch": 3319} {"train_loss": -25.358875274658203, "global_step": 275527, "epoch": 3319} {"train_loss": -25.44460105895996, "global_step": 275528, "epoch": 3319} {"train_loss": -25.7357234954834, "global_step": 275529, "epoch": 3319} {"train_loss": -25.165143966674805, "global_step": 275530, "epoch": 3319} {"train_loss": -25.57010841369629, "global_step": 275531, "epoch": 3319} {"train_loss": -25.45534324645996, "global_step": 275532, "epoch": 3319} {"train_loss": -25.369749069213867, "global_step": 275533, "epoch": 3319} {"train_loss": -25.478384017944336, "global_step": 275534, "epoch": 3319} {"train_loss": -25.555450439453125, "global_step": 275535, "epoch": 3319} {"train_loss": -25.099271774291992, "global_step": 275536, "epoch": 3319} {"train_loss": -25.15317153930664, "global_step": 275537, "epoch": 3319} {"train_loss": -25.35382652282715, "global_step": 275538, "epoch": 3319} {"train_loss": -25.41122817993164, "global_step": 275539, "epoch": 3319} {"train_loss": -25.606830596923828, "global_step": 275540, "epoch": 3319} {"train_loss": -25.269723892211914, "global_step": 275541, "epoch": 3319} {"train_loss": -25.265125274658203, "global_step": 275542, "epoch": 3319} {"train_loss": -25.282861709594727, "global_step": 275543, "epoch": 3319} {"train_loss": -25.30122184753418, "global_step": 275544, "epoch": 3319} {"train_loss": -24.88663101196289, "global_step": 275545, "epoch": 3319} {"train_loss": -25.23440933227539, "global_step": 275546, "epoch": 3319} {"train_loss": -25.21370506286621, "global_step": 275547, "epoch": 3319} {"train_loss": -25.271942138671875, "global_step": 275548, "epoch": 3319} {"train_loss": -25.204336166381836, "global_step": 275549, "epoch": 3319} {"train_loss": -25.28447723388672, "global_step": 275550, "epoch": 3319} {"train_loss": -25.11511993408203, "global_step": 275551, "epoch": 3319} {"train_loss": -25.150489807128906, "global_step": 275552, "epoch": 3319} {"train_loss": -25.508779525756836, "global_step": 275553, "epoch": 3319} {"train_loss": -25.434587478637695, "global_step": 275554, "epoch": 3319} {"train_loss": -25.42076873779297, "global_step": 275555, "epoch": 3319} {"train_loss": -25.305395126342773, "global_step": 275556, "epoch": 3319} {"train_loss": -25.412307739257812, "global_step": 275557, "epoch": 3319} {"train_loss": -25.142614364624023, "global_step": 275558, "epoch": 3319} {"train_loss": -25.272957330726715, "global_step": 275559, "epoch": 3319, "val_loss": 7074760.0} {"train_loss": -24.439186096191406, "global_step": 275560, "epoch": 3320} {"train_loss": -24.322792053222656, "global_step": 275561, "epoch": 3320} {"train_loss": -24.878238677978516, "global_step": 275562, "epoch": 3320} {"train_loss": -25.231983184814453, "global_step": 275563, "epoch": 3320} {"train_loss": -24.8044376373291, "global_step": 275564, "epoch": 3320} {"train_loss": -25.08796501159668, "global_step": 275565, "epoch": 3320} {"train_loss": -24.957950592041016, "global_step": 275566, "epoch": 3320} {"train_loss": -25.379337310791016, "global_step": 275567, "epoch": 3320} {"train_loss": -24.8585205078125, "global_step": 275568, "epoch": 3320} {"train_loss": -25.299367904663086, "global_step": 275569, "epoch": 3320} {"train_loss": -25.003225326538086, "global_step": 275570, "epoch": 3320} {"train_loss": -25.204381942749023, "global_step": 275571, "epoch": 3320} {"train_loss": -24.883512496948242, "global_step": 275572, "epoch": 3320} {"train_loss": -24.916799545288086, "global_step": 275573, "epoch": 3320} {"train_loss": -25.361677169799805, "global_step": 275574, "epoch": 3320} {"train_loss": -24.820314407348633, "global_step": 275575, "epoch": 3320} {"train_loss": -25.12203025817871, "global_step": 275576, "epoch": 3320} {"train_loss": -25.399988174438477, "global_step": 275577, "epoch": 3320} {"train_loss": -24.767553329467773, "global_step": 275578, "epoch": 3320} {"train_loss": -25.564653396606445, "global_step": 275579, "epoch": 3320} {"train_loss": -25.04079246520996, "global_step": 275580, "epoch": 3320} {"train_loss": -25.721588134765625, "global_step": 275581, "epoch": 3320} {"train_loss": -25.350751876831055, "global_step": 275582, "epoch": 3320} {"train_loss": -25.29845428466797, "global_step": 275583, "epoch": 3320} {"train_loss": -25.775470733642578, "global_step": 275584, "epoch": 3320} {"train_loss": -25.523761749267578, "global_step": 275585, "epoch": 3320} {"train_loss": -25.33333396911621, "global_step": 275586, "epoch": 3320} {"train_loss": -25.183561325073242, "global_step": 275587, "epoch": 3320} {"train_loss": -25.43904685974121, "global_step": 275588, "epoch": 3320} {"train_loss": -25.37849998474121, "global_step": 275589, "epoch": 3320} {"train_loss": -25.15864372253418, "global_step": 275590, "epoch": 3320} {"train_loss": -25.54313087463379, "global_step": 275591, "epoch": 3320} {"train_loss": -25.43854331970215, "global_step": 275592, "epoch": 3320} {"train_loss": -25.369279861450195, "global_step": 275593, "epoch": 3320} {"train_loss": -25.56659698486328, "global_step": 275594, "epoch": 3320} {"train_loss": -25.38637351989746, "global_step": 275595, "epoch": 3320} {"train_loss": -25.472076416015625, "global_step": 275596, "epoch": 3320} {"train_loss": -25.291492462158203, "global_step": 275597, "epoch": 3320} {"train_loss": -25.708417892456055, "global_step": 275598, "epoch": 3320} {"train_loss": -25.395536422729492, "global_step": 275599, "epoch": 3320} {"train_loss": -25.760955810546875, "global_step": 275600, "epoch": 3320} {"train_loss": -25.251493453979492, "global_step": 275601, "epoch": 3320} {"train_loss": -25.6506404876709, "global_step": 275602, "epoch": 3320} {"train_loss": -25.0611572265625, "global_step": 275603, "epoch": 3320} {"train_loss": -25.54654884338379, "global_step": 275604, "epoch": 3320} {"train_loss": -25.02753257751465, "global_step": 275605, "epoch": 3320} {"train_loss": -25.777118682861328, "global_step": 275606, "epoch": 3320} {"train_loss": -25.26336097717285, "global_step": 275607, "epoch": 3320} {"train_loss": -25.5978946685791, "global_step": 275608, "epoch": 3320} {"train_loss": -25.142345428466797, "global_step": 275609, "epoch": 3320} {"train_loss": -25.562305450439453, "global_step": 275610, "epoch": 3320} {"train_loss": -25.20857048034668, "global_step": 275611, "epoch": 3320} {"train_loss": -25.621923446655273, "global_step": 275612, "epoch": 3320} {"train_loss": -25.242334365844727, "global_step": 275613, "epoch": 3320} {"train_loss": -25.42774772644043, "global_step": 275614, "epoch": 3320} {"train_loss": -25.465412139892578, "global_step": 275615, "epoch": 3320} {"train_loss": -25.6903076171875, "global_step": 275616, "epoch": 3320} {"train_loss": -25.46879005432129, "global_step": 275617, "epoch": 3320} {"train_loss": -25.38899803161621, "global_step": 275618, "epoch": 3320} {"train_loss": -25.783422470092773, "global_step": 275619, "epoch": 3320} {"train_loss": -25.567474365234375, "global_step": 275620, "epoch": 3320} {"train_loss": -25.139646530151367, "global_step": 275621, "epoch": 3320} {"train_loss": -24.9095401763916, "global_step": 275622, "epoch": 3320} {"train_loss": -25.527334213256836, "global_step": 275623, "epoch": 3320} {"train_loss": -25.307950973510742, "global_step": 275624, "epoch": 3320} {"train_loss": -25.449615478515625, "global_step": 275625, "epoch": 3320} {"train_loss": -25.35684585571289, "global_step": 275626, "epoch": 3320} {"train_loss": -25.1821346282959, "global_step": 275627, "epoch": 3320} {"train_loss": -25.218652725219727, "global_step": 275628, "epoch": 3320} {"train_loss": -25.446928024291992, "global_step": 275629, "epoch": 3320} {"train_loss": -25.474468231201172, "global_step": 275630, "epoch": 3320} {"train_loss": -25.001663208007812, "global_step": 275631, "epoch": 3320} {"train_loss": -25.66977310180664, "global_step": 275632, "epoch": 3320} {"train_loss": -25.465229034423828, "global_step": 275633, "epoch": 3320} {"train_loss": -25.703948974609375, "global_step": 275634, "epoch": 3320} {"train_loss": -25.322416305541992, "global_step": 275635, "epoch": 3320} {"train_loss": -24.98563003540039, "global_step": 275636, "epoch": 3320} {"train_loss": -25.499927520751953, "global_step": 275637, "epoch": 3320} {"train_loss": -25.45652198791504, "global_step": 275638, "epoch": 3320} {"train_loss": -25.643341064453125, "global_step": 275639, "epoch": 3320} {"train_loss": -25.51158905029297, "global_step": 275640, "epoch": 3320} {"train_loss": -25.325101852416992, "global_step": 275641, "epoch": 3320} {"train_loss": -25.327973331313537, "global_step": 275642, "epoch": 3320, "val_loss": 7099590.0} {"train_loss": -25.413700103759766, "global_step": 275643, "epoch": 3321} {"train_loss": -24.779808044433594, "global_step": 275644, "epoch": 3321} {"train_loss": -25.330127716064453, "global_step": 275645, "epoch": 3321} {"train_loss": -25.036108016967773, "global_step": 275646, "epoch": 3321} {"train_loss": -24.87631607055664, "global_step": 275647, "epoch": 3321} {"train_loss": -24.70738983154297, "global_step": 275648, "epoch": 3321} {"train_loss": -25.069868087768555, "global_step": 275649, "epoch": 3321} {"train_loss": -25.409420013427734, "global_step": 275650, "epoch": 3321} {"train_loss": -24.897138595581055, "global_step": 275651, "epoch": 3321} {"train_loss": -25.553205490112305, "global_step": 275652, "epoch": 3321} {"train_loss": -25.109529495239258, "global_step": 275653, "epoch": 3321} {"train_loss": -25.068857192993164, "global_step": 275654, "epoch": 3321} {"train_loss": -24.99518585205078, "global_step": 275655, "epoch": 3321} {"train_loss": -25.053516387939453, "global_step": 275656, "epoch": 3321} {"train_loss": -25.62776756286621, "global_step": 275657, "epoch": 3321} {"train_loss": -25.343618392944336, "global_step": 275658, "epoch": 3321} {"train_loss": -25.41023826599121, "global_step": 275659, "epoch": 3321} {"train_loss": -25.333663940429688, "global_step": 275660, "epoch": 3321} {"train_loss": -25.486982345581055, "global_step": 275661, "epoch": 3321} {"train_loss": -25.439138412475586, "global_step": 275662, "epoch": 3321} {"train_loss": -25.275726318359375, "global_step": 275663, "epoch": 3321} {"train_loss": -25.419910430908203, "global_step": 275664, "epoch": 3321} {"train_loss": -25.65484046936035, "global_step": 275665, "epoch": 3321} {"train_loss": -25.40781593322754, "global_step": 275666, "epoch": 3321} {"train_loss": -25.3912410736084, "global_step": 275667, "epoch": 3321} {"train_loss": -25.20269203186035, "global_step": 275668, "epoch": 3321} {"train_loss": -25.400197982788086, "global_step": 275669, "epoch": 3321} {"train_loss": -24.908838272094727, "global_step": 275670, "epoch": 3321} {"train_loss": -25.5560302734375, "global_step": 275671, "epoch": 3321} {"train_loss": -25.376123428344727, "global_step": 275672, "epoch": 3321} {"train_loss": -25.365110397338867, "global_step": 275673, "epoch": 3321} {"train_loss": -25.825159072875977, "global_step": 275674, "epoch": 3321} {"train_loss": -25.672805786132812, "global_step": 275675, "epoch": 3321} {"train_loss": -25.1679744720459, "global_step": 275676, "epoch": 3321} {"train_loss": -25.59267234802246, "global_step": 275677, "epoch": 3321} {"train_loss": -25.696176528930664, "global_step": 275678, "epoch": 3321} {"train_loss": -25.57044792175293, "global_step": 275679, "epoch": 3321} {"train_loss": -25.41179656982422, "global_step": 275680, "epoch": 3321} {"train_loss": -25.666885375976562, "global_step": 275681, "epoch": 3321} {"train_loss": -25.433469772338867, "global_step": 275682, "epoch": 3321} {"train_loss": -25.320722579956055, "global_step": 275683, "epoch": 3321} {"train_loss": -25.384899139404297, "global_step": 275684, "epoch": 3321} {"train_loss": -25.29865264892578, "global_step": 275685, "epoch": 3321} {"train_loss": -24.95643424987793, "global_step": 275686, "epoch": 3321} {"train_loss": -24.997644424438477, "global_step": 275687, "epoch": 3321} {"train_loss": -25.025259017944336, "global_step": 275688, "epoch": 3321} {"train_loss": -24.831684112548828, "global_step": 275689, "epoch": 3321} {"train_loss": -25.163206100463867, "global_step": 275690, "epoch": 3321} {"train_loss": -25.00503158569336, "global_step": 275691, "epoch": 3321} {"train_loss": -25.45290184020996, "global_step": 275692, "epoch": 3321} {"train_loss": -25.411542892456055, "global_step": 275693, "epoch": 3321} {"train_loss": -24.583799362182617, "global_step": 275694, "epoch": 3321} {"train_loss": -25.177160263061523, "global_step": 275695, "epoch": 3321} {"train_loss": -24.936429977416992, "global_step": 275696, "epoch": 3321} {"train_loss": -25.45948600769043, "global_step": 275697, "epoch": 3321} {"train_loss": -25.14668846130371, "global_step": 275698, "epoch": 3321} {"train_loss": -25.61663246154785, "global_step": 275699, "epoch": 3321} {"train_loss": -25.475017547607422, "global_step": 275700, "epoch": 3321} {"train_loss": -25.089035034179688, "global_step": 275701, "epoch": 3321} {"train_loss": -24.91594886779785, "global_step": 275702, "epoch": 3321} {"train_loss": -25.41896629333496, "global_step": 275703, "epoch": 3321} {"train_loss": -25.234769821166992, "global_step": 275704, "epoch": 3321} {"train_loss": -25.54401206970215, "global_step": 275705, "epoch": 3321} {"train_loss": -25.325796127319336, "global_step": 275706, "epoch": 3321} {"train_loss": -25.517126083374023, "global_step": 275707, "epoch": 3321} {"train_loss": -25.26471519470215, "global_step": 275708, "epoch": 3321} {"train_loss": -25.65852928161621, "global_step": 275709, "epoch": 3321} {"train_loss": -25.41200065612793, "global_step": 275710, "epoch": 3321} {"train_loss": -25.785009384155273, "global_step": 275711, "epoch": 3321} {"train_loss": -25.690702438354492, "global_step": 275712, "epoch": 3321} {"train_loss": -25.452392578125, "global_step": 275713, "epoch": 3321} {"train_loss": -25.19411277770996, "global_step": 275714, "epoch": 3321} {"train_loss": -25.06235694885254, "global_step": 275715, "epoch": 3321} {"train_loss": -25.88106346130371, "global_step": 275716, "epoch": 3321} {"train_loss": -25.50149154663086, "global_step": 275717, "epoch": 3321} {"train_loss": -25.254623413085938, "global_step": 275718, "epoch": 3321} {"train_loss": -25.351388931274414, "global_step": 275719, "epoch": 3321} {"train_loss": -25.438615798950195, "global_step": 275720, "epoch": 3321} {"train_loss": -25.46764373779297, "global_step": 275721, "epoch": 3321} {"train_loss": -25.19017219543457, "global_step": 275722, "epoch": 3321} {"train_loss": -24.85631561279297, "global_step": 275723, "epoch": 3321} {"train_loss": -25.416574478149414, "global_step": 275724, "epoch": 3321} {"train_loss": -25.319052454936934, "global_step": 275725, "epoch": 3321, "val_loss": 7012605.5} {"train_loss": -23.057514190673828, "global_step": 275726, "epoch": 3322} {"train_loss": -22.5289249420166, "global_step": 275727, "epoch": 3322} {"train_loss": -25.13759422302246, "global_step": 275728, "epoch": 3322} {"train_loss": -23.760290145874023, "global_step": 275729, "epoch": 3322} {"train_loss": -24.800865173339844, "global_step": 275730, "epoch": 3322} {"train_loss": -23.876144409179688, "global_step": 275731, "epoch": 3322} {"train_loss": -24.601301193237305, "global_step": 275732, "epoch": 3322} {"train_loss": -24.915302276611328, "global_step": 275733, "epoch": 3322} {"train_loss": -24.697940826416016, "global_step": 275734, "epoch": 3322} {"train_loss": -24.751800537109375, "global_step": 275735, "epoch": 3322} {"train_loss": -24.821096420288086, "global_step": 275736, "epoch": 3322} {"train_loss": -24.728328704833984, "global_step": 275737, "epoch": 3322} {"train_loss": -24.828842163085938, "global_step": 275738, "epoch": 3322} {"train_loss": -24.924320220947266, "global_step": 275739, "epoch": 3322} {"train_loss": -25.008237838745117, "global_step": 275740, "epoch": 3322} {"train_loss": -24.53900718688965, "global_step": 275741, "epoch": 3322} {"train_loss": -25.2454891204834, "global_step": 275742, "epoch": 3322} {"train_loss": -24.740131378173828, "global_step": 275743, "epoch": 3322} {"train_loss": -25.28867530822754, "global_step": 275744, "epoch": 3322} {"train_loss": -25.02226448059082, "global_step": 275745, "epoch": 3322} {"train_loss": -24.877273559570312, "global_step": 275746, "epoch": 3322} {"train_loss": -24.737110137939453, "global_step": 275747, "epoch": 3322} {"train_loss": -25.190032958984375, "global_step": 275748, "epoch": 3322} {"train_loss": -25.125019073486328, "global_step": 275749, "epoch": 3322} {"train_loss": -24.913515090942383, "global_step": 275750, "epoch": 3322} {"train_loss": -24.997692108154297, "global_step": 275751, "epoch": 3322} {"train_loss": -24.57468605041504, "global_step": 275752, "epoch": 3322} {"train_loss": -24.783111572265625, "global_step": 275753, "epoch": 3322} {"train_loss": -25.03777503967285, "global_step": 275754, "epoch": 3322} {"train_loss": -25.06966209411621, "global_step": 275755, "epoch": 3322} {"train_loss": -25.228511810302734, "global_step": 275756, "epoch": 3322} {"train_loss": -25.0286922454834, "global_step": 275757, "epoch": 3322} {"train_loss": -25.081804275512695, "global_step": 275758, "epoch": 3322} {"train_loss": -25.840274810791016, "global_step": 275759, "epoch": 3322} {"train_loss": -25.08158302307129, "global_step": 275760, "epoch": 3322} {"train_loss": -24.89129638671875, "global_step": 275761, "epoch": 3322} {"train_loss": -25.132001876831055, "global_step": 275762, "epoch": 3322} {"train_loss": -24.887632369995117, "global_step": 275763, "epoch": 3322} {"train_loss": -25.122112274169922, "global_step": 275764, "epoch": 3322} {"train_loss": -25.114606857299805, "global_step": 275765, "epoch": 3322} {"train_loss": -25.371112823486328, "global_step": 275766, "epoch": 3322} {"train_loss": -24.988075256347656, "global_step": 275767, "epoch": 3322} {"train_loss": -25.704147338867188, "global_step": 275768, "epoch": 3322} {"train_loss": -25.307188034057617, "global_step": 275769, "epoch": 3322} {"train_loss": -25.387075424194336, "global_step": 275770, "epoch": 3322} {"train_loss": -25.44458770751953, "global_step": 275771, "epoch": 3322} {"train_loss": -25.4864501953125, "global_step": 275772, "epoch": 3322} {"train_loss": -25.64887809753418, "global_step": 275773, "epoch": 3322} {"train_loss": -25.43848991394043, "global_step": 275774, "epoch": 3322} {"train_loss": -25.170366287231445, "global_step": 275775, "epoch": 3322} {"train_loss": -25.385326385498047, "global_step": 275776, "epoch": 3322} {"train_loss": -25.467527389526367, "global_step": 275777, "epoch": 3322} {"train_loss": -25.250652313232422, "global_step": 275778, "epoch": 3322} {"train_loss": -25.203201293945312, "global_step": 275779, "epoch": 3322} {"train_loss": -25.84901237487793, "global_step": 275780, "epoch": 3322} {"train_loss": -25.40230369567871, "global_step": 275781, "epoch": 3322} {"train_loss": -25.61588478088379, "global_step": 275782, "epoch": 3322} {"train_loss": -25.55155372619629, "global_step": 275783, "epoch": 3322} {"train_loss": -25.5853214263916, "global_step": 275784, "epoch": 3322} {"train_loss": -25.45340347290039, "global_step": 275785, "epoch": 3322} {"train_loss": -25.348360061645508, "global_step": 275786, "epoch": 3322} {"train_loss": -25.348217010498047, "global_step": 275787, "epoch": 3322} {"train_loss": -25.023405075073242, "global_step": 275788, "epoch": 3322} {"train_loss": -25.678659439086914, "global_step": 275789, "epoch": 3322} {"train_loss": -25.429819107055664, "global_step": 275790, "epoch": 3322} {"train_loss": -25.683218002319336, "global_step": 275791, "epoch": 3322} {"train_loss": -25.043136596679688, "global_step": 275792, "epoch": 3322} {"train_loss": -25.58422088623047, "global_step": 275793, "epoch": 3322} {"train_loss": -25.244897842407227, "global_step": 275794, "epoch": 3322} {"train_loss": -25.002241134643555, "global_step": 275795, "epoch": 3322} {"train_loss": -24.925582885742188, "global_step": 275796, "epoch": 3322} {"train_loss": -25.163938522338867, "global_step": 275797, "epoch": 3322} {"train_loss": -25.05299186706543, "global_step": 275798, "epoch": 3322} {"train_loss": -25.735889434814453, "global_step": 275799, "epoch": 3322} {"train_loss": -25.383350372314453, "global_step": 275800, "epoch": 3322} {"train_loss": -25.07281494140625, "global_step": 275801, "epoch": 3322} {"train_loss": -25.03834342956543, "global_step": 275802, "epoch": 3322} {"train_loss": -25.417282104492188, "global_step": 275803, "epoch": 3322} {"train_loss": -25.15995979309082, "global_step": 275804, "epoch": 3322} {"train_loss": -25.329486846923828, "global_step": 275805, "epoch": 3322} {"train_loss": -25.062170028686523, "global_step": 275806, "epoch": 3322} {"train_loss": -25.619476318359375, "global_step": 275807, "epoch": 3322} {"train_loss": -25.080073620899615, "global_step": 275808, "epoch": 3322, "val_loss": 7173318.0} {"train_loss": -25.02983856201172, "global_step": 275809, "epoch": 3323} {"train_loss": -25.14487648010254, "global_step": 275810, "epoch": 3323} {"train_loss": -24.826770782470703, "global_step": 275811, "epoch": 3323} {"train_loss": -24.902141571044922, "global_step": 275812, "epoch": 3323} {"train_loss": -25.259780883789062, "global_step": 275813, "epoch": 3323} {"train_loss": -24.913543701171875, "global_step": 275814, "epoch": 3323} {"train_loss": -24.76834487915039, "global_step": 275815, "epoch": 3323} {"train_loss": -24.971311569213867, "global_step": 275816, "epoch": 3323} {"train_loss": -24.84258460998535, "global_step": 275817, "epoch": 3323} {"train_loss": -24.968618392944336, "global_step": 275818, "epoch": 3323} {"train_loss": -25.044843673706055, "global_step": 275819, "epoch": 3323} {"train_loss": -25.379714965820312, "global_step": 275820, "epoch": 3323} {"train_loss": -25.442861557006836, "global_step": 275821, "epoch": 3323} {"train_loss": -25.047000885009766, "global_step": 275822, "epoch": 3323} {"train_loss": -25.083463668823242, "global_step": 275823, "epoch": 3323} {"train_loss": -25.633935928344727, "global_step": 275824, "epoch": 3323} {"train_loss": -25.339712142944336, "global_step": 275825, "epoch": 3323} {"train_loss": -24.95708656311035, "global_step": 275826, "epoch": 3323} {"train_loss": -25.137611389160156, "global_step": 275827, "epoch": 3323} {"train_loss": -25.021053314208984, "global_step": 275828, "epoch": 3323} {"train_loss": -25.03334617614746, "global_step": 275829, "epoch": 3323} {"train_loss": -25.119497299194336, "global_step": 275830, "epoch": 3323} {"train_loss": -25.371036529541016, "global_step": 275831, "epoch": 3323} {"train_loss": -25.306934356689453, "global_step": 275832, "epoch": 3323} {"train_loss": -25.201007843017578, "global_step": 275833, "epoch": 3323} {"train_loss": -25.153850555419922, "global_step": 275834, "epoch": 3323} {"train_loss": -24.9620418548584, "global_step": 275835, "epoch": 3323} {"train_loss": -25.104873657226562, "global_step": 275836, "epoch": 3323} {"train_loss": -25.479780197143555, "global_step": 275837, "epoch": 3323} {"train_loss": -25.034231185913086, "global_step": 275838, "epoch": 3323} {"train_loss": -25.107107162475586, "global_step": 275839, "epoch": 3323} {"train_loss": -25.6884708404541, "global_step": 275840, "epoch": 3323} {"train_loss": -25.002029418945312, "global_step": 275841, "epoch": 3323} {"train_loss": -25.70090675354004, "global_step": 275842, "epoch": 3323} {"train_loss": -25.232364654541016, "global_step": 275843, "epoch": 3323} {"train_loss": -25.63466453552246, "global_step": 275844, "epoch": 3323} {"train_loss": -25.24915885925293, "global_step": 275845, "epoch": 3323} {"train_loss": -25.418087005615234, "global_step": 275846, "epoch": 3323} {"train_loss": -25.155576705932617, "global_step": 275847, "epoch": 3323} {"train_loss": -25.41816520690918, "global_step": 275848, "epoch": 3323} {"train_loss": -25.521974563598633, "global_step": 275849, "epoch": 3323} {"train_loss": -25.205951690673828, "global_step": 275850, "epoch": 3323} {"train_loss": -25.11414909362793, "global_step": 275851, "epoch": 3323} {"train_loss": -25.73700523376465, "global_step": 275852, "epoch": 3323} {"train_loss": -25.02470588684082, "global_step": 275853, "epoch": 3323} {"train_loss": -24.779388427734375, "global_step": 275854, "epoch": 3323} {"train_loss": -25.522417068481445, "global_step": 275855, "epoch": 3323} {"train_loss": -25.501962661743164, "global_step": 275856, "epoch": 3323} {"train_loss": -25.129606246948242, "global_step": 275857, "epoch": 3323} {"train_loss": -25.235828399658203, "global_step": 275858, "epoch": 3323} {"train_loss": -24.956539154052734, "global_step": 275859, "epoch": 3323} {"train_loss": -25.565500259399414, "global_step": 275860, "epoch": 3323} {"train_loss": -25.161020278930664, "global_step": 275861, "epoch": 3323} {"train_loss": -25.157899856567383, "global_step": 275862, "epoch": 3323} {"train_loss": -25.28485107421875, "global_step": 275863, "epoch": 3323} {"train_loss": -25.083255767822266, "global_step": 275864, "epoch": 3323} {"train_loss": -25.163589477539062, "global_step": 275865, "epoch": 3323} {"train_loss": -25.51673698425293, "global_step": 275866, "epoch": 3323} {"train_loss": -25.16720199584961, "global_step": 275867, "epoch": 3323} {"train_loss": -25.56655502319336, "global_step": 275868, "epoch": 3323} {"train_loss": -25.416677474975586, "global_step": 275869, "epoch": 3323} {"train_loss": -25.330434799194336, "global_step": 275870, "epoch": 3323} {"train_loss": -24.95771598815918, "global_step": 275871, "epoch": 3323} {"train_loss": -25.567888259887695, "global_step": 275872, "epoch": 3323} {"train_loss": -25.167142868041992, "global_step": 275873, "epoch": 3323} {"train_loss": -25.628854751586914, "global_step": 275874, "epoch": 3323} {"train_loss": -25.278099060058594, "global_step": 275875, "epoch": 3323} {"train_loss": -25.232938766479492, "global_step": 275876, "epoch": 3323} {"train_loss": -25.464208602905273, "global_step": 275877, "epoch": 3323} {"train_loss": -25.607717514038086, "global_step": 275878, "epoch": 3323} {"train_loss": -25.42861557006836, "global_step": 275879, "epoch": 3323} {"train_loss": -25.723432540893555, "global_step": 275880, "epoch": 3323} {"train_loss": -25.581274032592773, "global_step": 275881, "epoch": 3323} {"train_loss": -25.411006927490234, "global_step": 275882, "epoch": 3323} {"train_loss": -25.264921188354492, "global_step": 275883, "epoch": 3323} {"train_loss": -25.497190475463867, "global_step": 275884, "epoch": 3323} {"train_loss": -25.473201751708984, "global_step": 275885, "epoch": 3323} {"train_loss": -25.505247116088867, "global_step": 275886, "epoch": 3323} {"train_loss": -25.673826217651367, "global_step": 275887, "epoch": 3323} {"train_loss": -25.162073135375977, "global_step": 275888, "epoch": 3323} {"train_loss": -25.27067756652832, "global_step": 275889, "epoch": 3323} {"train_loss": -25.447999954223633, "global_step": 275890, "epoch": 3323} {"train_loss": -25.26573475297675, "global_step": 275891, "epoch": 3323, "val_loss": 7045746.0} {"train_loss": -24.138790130615234, "global_step": 275892, "epoch": 3324} {"train_loss": -23.347076416015625, "global_step": 275893, "epoch": 3324} {"train_loss": -24.802093505859375, "global_step": 275894, "epoch": 3324} {"train_loss": -23.459997177124023, "global_step": 275895, "epoch": 3324} {"train_loss": -24.64149284362793, "global_step": 275896, "epoch": 3324} {"train_loss": -24.1185302734375, "global_step": 275897, "epoch": 3324} {"train_loss": -24.87140655517578, "global_step": 275898, "epoch": 3324} {"train_loss": -24.33717155456543, "global_step": 275899, "epoch": 3324} {"train_loss": -25.208250045776367, "global_step": 275900, "epoch": 3324} {"train_loss": -24.284130096435547, "global_step": 275901, "epoch": 3324} {"train_loss": -25.12565040588379, "global_step": 275902, "epoch": 3324} {"train_loss": -24.627994537353516, "global_step": 275903, "epoch": 3324} {"train_loss": -24.37056541442871, "global_step": 275904, "epoch": 3324} {"train_loss": -24.823354721069336, "global_step": 275905, "epoch": 3324} {"train_loss": -25.051313400268555, "global_step": 275906, "epoch": 3324} {"train_loss": -24.45551872253418, "global_step": 275907, "epoch": 3324} {"train_loss": -24.67184066772461, "global_step": 275908, "epoch": 3324} {"train_loss": -24.286819458007812, "global_step": 275909, "epoch": 3324} {"train_loss": -24.775367736816406, "global_step": 275910, "epoch": 3324} {"train_loss": -24.532079696655273, "global_step": 275911, "epoch": 3324} {"train_loss": -25.192304611206055, "global_step": 275912, "epoch": 3324} {"train_loss": -24.900556564331055, "global_step": 275913, "epoch": 3324} {"train_loss": -25.082767486572266, "global_step": 275914, "epoch": 3324} {"train_loss": -24.86607551574707, "global_step": 275915, "epoch": 3324} {"train_loss": -25.362003326416016, "global_step": 275916, "epoch": 3324} {"train_loss": -24.669437408447266, "global_step": 275917, "epoch": 3324} {"train_loss": -25.07333755493164, "global_step": 275918, "epoch": 3324} {"train_loss": -24.950956344604492, "global_step": 275919, "epoch": 3324} {"train_loss": -25.245101928710938, "global_step": 275920, "epoch": 3324} {"train_loss": -25.299072265625, "global_step": 275921, "epoch": 3324} {"train_loss": -25.010908126831055, "global_step": 275922, "epoch": 3324} {"train_loss": -25.277585983276367, "global_step": 275923, "epoch": 3324} {"train_loss": -25.179561614990234, "global_step": 275924, "epoch": 3324} {"train_loss": -25.23067283630371, "global_step": 275925, "epoch": 3324} {"train_loss": -25.32986831665039, "global_step": 275926, "epoch": 3324} {"train_loss": -25.482954025268555, "global_step": 275927, "epoch": 3324} {"train_loss": -25.620874404907227, "global_step": 275928, "epoch": 3324} {"train_loss": -25.43793296813965, "global_step": 275929, "epoch": 3324} {"train_loss": -25.15660858154297, "global_step": 275930, "epoch": 3324} {"train_loss": -25.523700714111328, "global_step": 275931, "epoch": 3324} {"train_loss": -25.576128005981445, "global_step": 275932, "epoch": 3324} {"train_loss": -25.258825302124023, "global_step": 275933, "epoch": 3324} {"train_loss": -25.47496795654297, "global_step": 275934, "epoch": 3324} {"train_loss": -25.184934616088867, "global_step": 275935, "epoch": 3324} {"train_loss": -25.407241821289062, "global_step": 275936, "epoch": 3324} {"train_loss": -25.44126319885254, "global_step": 275937, "epoch": 3324} {"train_loss": -25.3120174407959, "global_step": 275938, "epoch": 3324} {"train_loss": -25.177688598632812, "global_step": 275939, "epoch": 3324} {"train_loss": -25.216846466064453, "global_step": 275940, "epoch": 3324} {"train_loss": -25.432281494140625, "global_step": 275941, "epoch": 3324} {"train_loss": -25.378843307495117, "global_step": 275942, "epoch": 3324} {"train_loss": -25.23575782775879, "global_step": 275943, "epoch": 3324} {"train_loss": -25.410036087036133, "global_step": 275944, "epoch": 3324} {"train_loss": -25.350292205810547, "global_step": 275945, "epoch": 3324} {"train_loss": -25.064868927001953, "global_step": 275946, "epoch": 3324} {"train_loss": -24.984846115112305, "global_step": 275947, "epoch": 3324} {"train_loss": -25.130674362182617, "global_step": 275948, "epoch": 3324} {"train_loss": -25.643415451049805, "global_step": 275949, "epoch": 3324} {"train_loss": -25.504323959350586, "global_step": 275950, "epoch": 3324} {"train_loss": -25.533607482910156, "global_step": 275951, "epoch": 3324} {"train_loss": -25.537683486938477, "global_step": 275952, "epoch": 3324} {"train_loss": -25.471696853637695, "global_step": 275953, "epoch": 3324} {"train_loss": -25.313720703125, "global_step": 275954, "epoch": 3324} {"train_loss": -25.617847442626953, "global_step": 275955, "epoch": 3324} {"train_loss": -25.198225021362305, "global_step": 275956, "epoch": 3324} {"train_loss": -25.026294708251953, "global_step": 275957, "epoch": 3324} {"train_loss": -25.46642303466797, "global_step": 275958, "epoch": 3324} {"train_loss": -25.48613929748535, "global_step": 275959, "epoch": 3324} {"train_loss": -25.23224449157715, "global_step": 275960, "epoch": 3324} {"train_loss": -25.639694213867188, "global_step": 275961, "epoch": 3324} {"train_loss": -25.380949020385742, "global_step": 275962, "epoch": 3324} {"train_loss": -25.57667350769043, "global_step": 275963, "epoch": 3324} {"train_loss": -25.18891716003418, "global_step": 275964, "epoch": 3324} {"train_loss": -25.45912742614746, "global_step": 275965, "epoch": 3324} {"train_loss": -25.424123764038086, "global_step": 275966, "epoch": 3324} {"train_loss": -25.395627975463867, "global_step": 275967, "epoch": 3324} {"train_loss": -25.23080062866211, "global_step": 275968, "epoch": 3324} {"train_loss": -25.503528594970703, "global_step": 275969, "epoch": 3324} {"train_loss": -25.466711044311523, "global_step": 275970, "epoch": 3324} {"train_loss": -25.77130699157715, "global_step": 275971, "epoch": 3324} {"train_loss": -25.215261459350586, "global_step": 275972, "epoch": 3324} {"train_loss": -25.77389907836914, "global_step": 275973, "epoch": 3324} {"train_loss": -25.145787618246423, "global_step": 275974, "epoch": 3324, "val_loss": 7168650.0} {"train_loss": -24.62660026550293, "global_step": 275975, "epoch": 3325} {"train_loss": -23.130334854125977, "global_step": 275976, "epoch": 3325} {"train_loss": -23.663795471191406, "global_step": 275977, "epoch": 3325} {"train_loss": -24.565702438354492, "global_step": 275978, "epoch": 3325} {"train_loss": -24.449670791625977, "global_step": 275979, "epoch": 3325} {"train_loss": -24.414295196533203, "global_step": 275980, "epoch": 3325} {"train_loss": -24.409345626831055, "global_step": 275981, "epoch": 3325} {"train_loss": -24.68094253540039, "global_step": 275982, "epoch": 3325} {"train_loss": -24.233474731445312, "global_step": 275983, "epoch": 3325} {"train_loss": -24.700416564941406, "global_step": 275984, "epoch": 3325} {"train_loss": -24.194238662719727, "global_step": 275985, "epoch": 3325} {"train_loss": -25.02557373046875, "global_step": 275986, "epoch": 3325} {"train_loss": -24.6738338470459, "global_step": 275987, "epoch": 3325} {"train_loss": -24.48824691772461, "global_step": 275988, "epoch": 3325} {"train_loss": -25.09173011779785, "global_step": 275989, "epoch": 3325} {"train_loss": -25.465456008911133, "global_step": 275990, "epoch": 3325} {"train_loss": -24.76944351196289, "global_step": 275991, "epoch": 3325} {"train_loss": -24.792743682861328, "global_step": 275992, "epoch": 3325} {"train_loss": -24.773874282836914, "global_step": 275993, "epoch": 3325} {"train_loss": -25.02322006225586, "global_step": 275994, "epoch": 3325} {"train_loss": -25.064271926879883, "global_step": 275995, "epoch": 3325} {"train_loss": -25.060562133789062, "global_step": 275996, "epoch": 3325} {"train_loss": -24.993494033813477, "global_step": 275997, "epoch": 3325} {"train_loss": -25.11834716796875, "global_step": 275998, "epoch": 3325} {"train_loss": -24.796737670898438, "global_step": 275999, "epoch": 3325} {"train_loss": -24.886215209960938, "global_step": 276000, "epoch": 3325} {"train_loss": -25.3295955657959, "global_step": 276001, "epoch": 3325} {"train_loss": -25.442533493041992, "global_step": 276002, "epoch": 3325} {"train_loss": -25.642688751220703, "global_step": 276003, "epoch": 3325} {"train_loss": -25.234912872314453, "global_step": 276004, "epoch": 3325} {"train_loss": -25.228790283203125, "global_step": 276005, "epoch": 3325} {"train_loss": -25.44061851501465, "global_step": 276006, "epoch": 3325} {"train_loss": -25.125869750976562, "global_step": 276007, "epoch": 3325} {"train_loss": -25.368610382080078, "global_step": 276008, "epoch": 3325} {"train_loss": -25.02419090270996, "global_step": 276009, "epoch": 3325} {"train_loss": -25.026784896850586, "global_step": 276010, "epoch": 3325} {"train_loss": -25.325056076049805, "global_step": 276011, "epoch": 3325} {"train_loss": -25.26068115234375, "global_step": 276012, "epoch": 3325} {"train_loss": -25.23441505432129, "global_step": 276013, "epoch": 3325} {"train_loss": -25.70633888244629, "global_step": 276014, "epoch": 3325} {"train_loss": -25.142005920410156, "global_step": 276015, "epoch": 3325} {"train_loss": -25.392362594604492, "global_step": 276016, "epoch": 3325} {"train_loss": -25.596769332885742, "global_step": 276017, "epoch": 3325} {"train_loss": -25.392332077026367, "global_step": 276018, "epoch": 3325} {"train_loss": -25.509689331054688, "global_step": 276019, "epoch": 3325} {"train_loss": -25.663305282592773, "global_step": 276020, "epoch": 3325} {"train_loss": -25.811542510986328, "global_step": 276021, "epoch": 3325} {"train_loss": -25.373403549194336, "global_step": 276022, "epoch": 3325} {"train_loss": -25.9505615234375, "global_step": 276023, "epoch": 3325} {"train_loss": -25.725439071655273, "global_step": 276024, "epoch": 3325} {"train_loss": -25.533809661865234, "global_step": 276025, "epoch": 3325} {"train_loss": -25.630233764648438, "global_step": 276026, "epoch": 3325} {"train_loss": -25.39851188659668, "global_step": 276027, "epoch": 3325} {"train_loss": -26.009958267211914, "global_step": 276028, "epoch": 3325} {"train_loss": -25.487545013427734, "global_step": 276029, "epoch": 3325} {"train_loss": -25.540945053100586, "global_step": 276030, "epoch": 3325} {"train_loss": -25.333494186401367, "global_step": 276031, "epoch": 3325} {"train_loss": -24.4062557220459, "global_step": 276032, "epoch": 3325} {"train_loss": -24.368711471557617, "global_step": 276033, "epoch": 3325} {"train_loss": -24.643756866455078, "global_step": 276034, "epoch": 3325} {"train_loss": -25.51771354675293, "global_step": 276035, "epoch": 3325} {"train_loss": -25.057527542114258, "global_step": 276036, "epoch": 3325} {"train_loss": -24.80982780456543, "global_step": 276037, "epoch": 3325} {"train_loss": -25.10978889465332, "global_step": 276038, "epoch": 3325} {"train_loss": -25.12970542907715, "global_step": 276039, "epoch": 3325} {"train_loss": -24.974557876586914, "global_step": 276040, "epoch": 3325} {"train_loss": -25.18181800842285, "global_step": 276041, "epoch": 3325} {"train_loss": -25.271833419799805, "global_step": 276042, "epoch": 3325} {"train_loss": -25.514984130859375, "global_step": 276043, "epoch": 3325} {"train_loss": -25.20503807067871, "global_step": 276044, "epoch": 3325} {"train_loss": -25.081098556518555, "global_step": 276045, "epoch": 3325} {"train_loss": -25.271648406982422, "global_step": 276046, "epoch": 3325} {"train_loss": -25.059864044189453, "global_step": 276047, "epoch": 3325} {"train_loss": -25.763263702392578, "global_step": 276048, "epoch": 3325} {"train_loss": -25.64520263671875, "global_step": 276049, "epoch": 3325} {"train_loss": -25.31027603149414, "global_step": 276050, "epoch": 3325} {"train_loss": -25.65545082092285, "global_step": 276051, "epoch": 3325} {"train_loss": -25.75982666015625, "global_step": 276052, "epoch": 3325} {"train_loss": -25.130157470703125, "global_step": 276053, "epoch": 3325} {"train_loss": -25.46685791015625, "global_step": 276054, "epoch": 3325} {"train_loss": -25.645801544189453, "global_step": 276055, "epoch": 3325} {"train_loss": -25.20273780822754, "global_step": 276056, "epoch": 3325} {"train_loss": -25.123052344264753, "global_step": 276057, "epoch": 3325, "val_loss": 6993903.5} {"train_loss": -24.70284080505371, "global_step": 276058, "epoch": 3326} {"train_loss": -23.762958526611328, "global_step": 276059, "epoch": 3326} {"train_loss": -24.21016502380371, "global_step": 276060, "epoch": 3326} {"train_loss": -25.2587947845459, "global_step": 276061, "epoch": 3326} {"train_loss": -23.79115867614746, "global_step": 276062, "epoch": 3326} {"train_loss": -25.05865478515625, "global_step": 276063, "epoch": 3326} {"train_loss": -24.983469009399414, "global_step": 276064, "epoch": 3326} {"train_loss": -24.725812911987305, "global_step": 276065, "epoch": 3326} {"train_loss": -24.734724044799805, "global_step": 276066, "epoch": 3326} {"train_loss": -24.84695816040039, "global_step": 276067, "epoch": 3326} {"train_loss": -25.09878921508789, "global_step": 276068, "epoch": 3326} {"train_loss": -25.358722686767578, "global_step": 276069, "epoch": 3326} {"train_loss": -25.182592391967773, "global_step": 276070, "epoch": 3326} {"train_loss": -24.810468673706055, "global_step": 276071, "epoch": 3326} {"train_loss": -25.48879051208496, "global_step": 276072, "epoch": 3326} {"train_loss": -24.980880737304688, "global_step": 276073, "epoch": 3326} {"train_loss": -24.955223083496094, "global_step": 276074, "epoch": 3326} {"train_loss": -25.015554428100586, "global_step": 276075, "epoch": 3326} {"train_loss": -25.190868377685547, "global_step": 276076, "epoch": 3326} {"train_loss": -25.37127685546875, "global_step": 276077, "epoch": 3326} {"train_loss": -25.240747451782227, "global_step": 276078, "epoch": 3326} {"train_loss": -24.905235290527344, "global_step": 276079, "epoch": 3326} {"train_loss": -24.767911911010742, "global_step": 276080, "epoch": 3326} {"train_loss": -25.131772994995117, "global_step": 276081, "epoch": 3326} {"train_loss": -25.25359535217285, "global_step": 276082, "epoch": 3326} {"train_loss": -25.260446548461914, "global_step": 276083, "epoch": 3326} {"train_loss": -24.861581802368164, "global_step": 276084, "epoch": 3326} {"train_loss": -25.161361694335938, "global_step": 276085, "epoch": 3326} {"train_loss": -25.142086029052734, "global_step": 276086, "epoch": 3326} {"train_loss": -25.494321823120117, "global_step": 276087, "epoch": 3326} {"train_loss": -24.864990234375, "global_step": 276088, "epoch": 3326} {"train_loss": -25.082372665405273, "global_step": 276089, "epoch": 3326} {"train_loss": -25.186254501342773, "global_step": 276090, "epoch": 3326} {"train_loss": -25.363800048828125, "global_step": 276091, "epoch": 3326} {"train_loss": -25.35359001159668, "global_step": 276092, "epoch": 3326} {"train_loss": -25.29290199279785, "global_step": 276093, "epoch": 3326} {"train_loss": -25.33890724182129, "global_step": 276094, "epoch": 3326} {"train_loss": -25.559751510620117, "global_step": 276095, "epoch": 3326} {"train_loss": -25.729496002197266, "global_step": 276096, "epoch": 3326} {"train_loss": -25.32236671447754, "global_step": 276097, "epoch": 3326} {"train_loss": -24.945419311523438, "global_step": 276098, "epoch": 3326} {"train_loss": -25.428632736206055, "global_step": 276099, "epoch": 3326} {"train_loss": -25.68082046508789, "global_step": 276100, "epoch": 3326} {"train_loss": -25.531238555908203, "global_step": 276101, "epoch": 3326} {"train_loss": -25.412036895751953, "global_step": 276102, "epoch": 3326} {"train_loss": -25.31574821472168, "global_step": 276103, "epoch": 3326} {"train_loss": -25.254087448120117, "global_step": 276104, "epoch": 3326} {"train_loss": -25.29185676574707, "global_step": 276105, "epoch": 3326} {"train_loss": -25.756128311157227, "global_step": 276106, "epoch": 3326} {"train_loss": -25.10975456237793, "global_step": 276107, "epoch": 3326} {"train_loss": -25.616455078125, "global_step": 276108, "epoch": 3326} {"train_loss": -25.13572120666504, "global_step": 276109, "epoch": 3326} {"train_loss": -25.7539119720459, "global_step": 276110, "epoch": 3326} {"train_loss": -25.72992515563965, "global_step": 276111, "epoch": 3326} {"train_loss": -25.849714279174805, "global_step": 276112, "epoch": 3326} {"train_loss": -25.458541870117188, "global_step": 276113, "epoch": 3326} {"train_loss": -25.384855270385742, "global_step": 276114, "epoch": 3326} {"train_loss": -25.451377868652344, "global_step": 276115, "epoch": 3326} {"train_loss": -25.5391902923584, "global_step": 276116, "epoch": 3326} {"train_loss": -25.703821182250977, "global_step": 276117, "epoch": 3326} {"train_loss": -25.649946212768555, "global_step": 276118, "epoch": 3326} {"train_loss": -25.55352210998535, "global_step": 276119, "epoch": 3326} {"train_loss": -25.685684204101562, "global_step": 276120, "epoch": 3326} {"train_loss": -25.315200805664062, "global_step": 276121, "epoch": 3326} {"train_loss": -25.328886032104492, "global_step": 276122, "epoch": 3326} {"train_loss": -25.554580688476562, "global_step": 276123, "epoch": 3326} {"train_loss": -25.266550064086914, "global_step": 276124, "epoch": 3326} {"train_loss": -25.012237548828125, "global_step": 276125, "epoch": 3326} {"train_loss": -25.44878578186035, "global_step": 276126, "epoch": 3326} {"train_loss": -25.288976669311523, "global_step": 276127, "epoch": 3326} {"train_loss": -25.308828353881836, "global_step": 276128, "epoch": 3326} {"train_loss": -25.032312393188477, "global_step": 276129, "epoch": 3326} {"train_loss": -25.12713050842285, "global_step": 276130, "epoch": 3326} {"train_loss": -25.267370223999023, "global_step": 276131, "epoch": 3326} {"train_loss": -25.7301025390625, "global_step": 276132, "epoch": 3326} {"train_loss": -25.271209716796875, "global_step": 276133, "epoch": 3326} {"train_loss": -25.283395767211914, "global_step": 276134, "epoch": 3326} {"train_loss": -25.109500885009766, "global_step": 276135, "epoch": 3326} {"train_loss": -25.400388717651367, "global_step": 276136, "epoch": 3326} {"train_loss": -25.563024520874023, "global_step": 276137, "epoch": 3326} {"train_loss": -25.372455596923828, "global_step": 276138, "epoch": 3326} {"train_loss": -25.2142333984375, "global_step": 276139, "epoch": 3326} {"train_loss": -25.227153548275133, "global_step": 276140, "epoch": 3326, "val_loss": 7076150.0} {"train_loss": -24.472732543945312, "global_step": 276141, "epoch": 3327} {"train_loss": -25.254409790039062, "global_step": 276142, "epoch": 3327} {"train_loss": -24.84739112854004, "global_step": 276143, "epoch": 3327} {"train_loss": -24.6412353515625, "global_step": 276144, "epoch": 3327} {"train_loss": -25.20147705078125, "global_step": 276145, "epoch": 3327} {"train_loss": -24.572147369384766, "global_step": 276146, "epoch": 3327} {"train_loss": -24.843801498413086, "global_step": 276147, "epoch": 3327} {"train_loss": -25.326934814453125, "global_step": 276148, "epoch": 3327} {"train_loss": -24.879972457885742, "global_step": 276149, "epoch": 3327} {"train_loss": -24.869062423706055, "global_step": 276150, "epoch": 3327} {"train_loss": -24.92659568786621, "global_step": 276151, "epoch": 3327} {"train_loss": -25.14274787902832, "global_step": 276152, "epoch": 3327} {"train_loss": -24.896076202392578, "global_step": 276153, "epoch": 3327} {"train_loss": -25.09987449645996, "global_step": 276154, "epoch": 3327} {"train_loss": -25.007484436035156, "global_step": 276155, "epoch": 3327} {"train_loss": -25.211807250976562, "global_step": 276156, "epoch": 3327} {"train_loss": -24.724567413330078, "global_step": 276157, "epoch": 3327} {"train_loss": -25.150161743164062, "global_step": 276158, "epoch": 3327} {"train_loss": -24.984891891479492, "global_step": 276159, "epoch": 3327} {"train_loss": -25.047374725341797, "global_step": 276160, "epoch": 3327} {"train_loss": -25.117507934570312, "global_step": 276161, "epoch": 3327} {"train_loss": -25.22059440612793, "global_step": 276162, "epoch": 3327} {"train_loss": -25.43540382385254, "global_step": 276163, "epoch": 3327} {"train_loss": -24.975942611694336, "global_step": 276164, "epoch": 3327} {"train_loss": -24.265256881713867, "global_step": 276165, "epoch": 3327} {"train_loss": -24.76121711730957, "global_step": 276166, "epoch": 3327} {"train_loss": -24.75942611694336, "global_step": 276167, "epoch": 3327} {"train_loss": -24.892744064331055, "global_step": 276168, "epoch": 3327} {"train_loss": -24.58357810974121, "global_step": 276169, "epoch": 3327} {"train_loss": -25.09689712524414, "global_step": 276170, "epoch": 3327} {"train_loss": -25.2711124420166, "global_step": 276171, "epoch": 3327} {"train_loss": -24.764169692993164, "global_step": 276172, "epoch": 3327} {"train_loss": -25.319337844848633, "global_step": 276173, "epoch": 3327} {"train_loss": -25.213953018188477, "global_step": 276174, "epoch": 3327} {"train_loss": -24.993066787719727, "global_step": 276175, "epoch": 3327} {"train_loss": -25.256481170654297, "global_step": 276176, "epoch": 3327} {"train_loss": -25.43818473815918, "global_step": 276177, "epoch": 3327} {"train_loss": -25.268178939819336, "global_step": 276178, "epoch": 3327} {"train_loss": -25.338109970092773, "global_step": 276179, "epoch": 3327} {"train_loss": -25.337467193603516, "global_step": 276180, "epoch": 3327} {"train_loss": -25.24708366394043, "global_step": 276181, "epoch": 3327} {"train_loss": -25.212080001831055, "global_step": 276182, "epoch": 3327} {"train_loss": -25.33210563659668, "global_step": 276183, "epoch": 3327} {"train_loss": -25.12003517150879, "global_step": 276184, "epoch": 3327} {"train_loss": -25.17849349975586, "global_step": 276185, "epoch": 3327} {"train_loss": -25.000829696655273, "global_step": 276186, "epoch": 3327} {"train_loss": -25.073837280273438, "global_step": 276187, "epoch": 3327} {"train_loss": -25.651670455932617, "global_step": 276188, "epoch": 3327} {"train_loss": -25.560441970825195, "global_step": 276189, "epoch": 3327} {"train_loss": -25.5283260345459, "global_step": 276190, "epoch": 3327} {"train_loss": -25.438447952270508, "global_step": 276191, "epoch": 3327} {"train_loss": -25.40594482421875, "global_step": 276192, "epoch": 3327} {"train_loss": -25.325002670288086, "global_step": 276193, "epoch": 3327} {"train_loss": -25.412626266479492, "global_step": 276194, "epoch": 3327} {"train_loss": -25.806421279907227, "global_step": 276195, "epoch": 3327} {"train_loss": -24.943023681640625, "global_step": 276196, "epoch": 3327} {"train_loss": -25.389944076538086, "global_step": 276197, "epoch": 3327} {"train_loss": -25.501907348632812, "global_step": 276198, "epoch": 3327} {"train_loss": -25.534147262573242, "global_step": 276199, "epoch": 3327} {"train_loss": -25.2314510345459, "global_step": 276200, "epoch": 3327} {"train_loss": -24.926015853881836, "global_step": 276201, "epoch": 3327} {"train_loss": -24.777381896972656, "global_step": 276202, "epoch": 3327} {"train_loss": -24.78249168395996, "global_step": 276203, "epoch": 3327} {"train_loss": -24.682302474975586, "global_step": 276204, "epoch": 3327} {"train_loss": -25.055801391601562, "global_step": 276205, "epoch": 3327} {"train_loss": -24.98442268371582, "global_step": 276206, "epoch": 3327} {"train_loss": -24.95197868347168, "global_step": 276207, "epoch": 3327} {"train_loss": -24.866052627563477, "global_step": 276208, "epoch": 3327} {"train_loss": -24.808815002441406, "global_step": 276209, "epoch": 3327} {"train_loss": -25.07709312438965, "global_step": 276210, "epoch": 3327} {"train_loss": -25.147537231445312, "global_step": 276211, "epoch": 3327} {"train_loss": -25.21897315979004, "global_step": 276212, "epoch": 3327} {"train_loss": -25.577375411987305, "global_step": 276213, "epoch": 3327} {"train_loss": -25.41360855102539, "global_step": 276214, "epoch": 3327} {"train_loss": -25.529882431030273, "global_step": 276215, "epoch": 3327} {"train_loss": -25.05377197265625, "global_step": 276216, "epoch": 3327} {"train_loss": -25.12051773071289, "global_step": 276217, "epoch": 3327} {"train_loss": -25.43286895751953, "global_step": 276218, "epoch": 3327} {"train_loss": -25.572431564331055, "global_step": 276219, "epoch": 3327} {"train_loss": -25.544830322265625, "global_step": 276220, "epoch": 3327} {"train_loss": -25.57941436767578, "global_step": 276221, "epoch": 3327} {"train_loss": -25.377840042114258, "global_step": 276222, "epoch": 3327} {"train_loss": -25.13728525552405, "global_step": 276223, "epoch": 3327, "val_loss": 6925138.0} {"train_loss": -25.30363655090332, "global_step": 276224, "epoch": 3328} {"train_loss": -25.496570587158203, "global_step": 276225, "epoch": 3328} {"train_loss": -25.489315032958984, "global_step": 276226, "epoch": 3328} {"train_loss": -25.303693771362305, "global_step": 276227, "epoch": 3328} {"train_loss": -25.507905960083008, "global_step": 276228, "epoch": 3328} {"train_loss": -25.14540672302246, "global_step": 276229, "epoch": 3328} {"train_loss": -25.751867294311523, "global_step": 276230, "epoch": 3328} {"train_loss": -25.147626876831055, "global_step": 276231, "epoch": 3328} {"train_loss": -25.12447166442871, "global_step": 276232, "epoch": 3328} {"train_loss": -25.596765518188477, "global_step": 276233, "epoch": 3328} {"train_loss": -25.602231979370117, "global_step": 276234, "epoch": 3328} {"train_loss": -25.26360321044922, "global_step": 276235, "epoch": 3328} {"train_loss": -25.08988380432129, "global_step": 276236, "epoch": 3328} {"train_loss": -25.269954681396484, "global_step": 276237, "epoch": 3328} {"train_loss": -25.2263240814209, "global_step": 276238, "epoch": 3328} {"train_loss": -25.101322174072266, "global_step": 276239, "epoch": 3328} {"train_loss": -25.25301170349121, "global_step": 276240, "epoch": 3328} {"train_loss": -25.49802589416504, "global_step": 276241, "epoch": 3328} {"train_loss": -25.50958824157715, "global_step": 276242, "epoch": 3328} {"train_loss": -25.57990837097168, "global_step": 276243, "epoch": 3328} {"train_loss": -25.535245895385742, "global_step": 276244, "epoch": 3328} {"train_loss": -25.56662368774414, "global_step": 276245, "epoch": 3328} {"train_loss": -25.520313262939453, "global_step": 276246, "epoch": 3328} {"train_loss": -25.18617820739746, "global_step": 276247, "epoch": 3328} {"train_loss": -25.240726470947266, "global_step": 276248, "epoch": 3328} {"train_loss": -24.992338180541992, "global_step": 276249, "epoch": 3328} {"train_loss": -25.5655574798584, "global_step": 276250, "epoch": 3328} {"train_loss": -25.147552490234375, "global_step": 276251, "epoch": 3328} {"train_loss": -25.167844772338867, "global_step": 276252, "epoch": 3328} {"train_loss": -24.64451026916504, "global_step": 276253, "epoch": 3328} {"train_loss": -24.794790267944336, "global_step": 276254, "epoch": 3328} {"train_loss": -25.39349937438965, "global_step": 276255, "epoch": 3328} {"train_loss": -25.4808349609375, "global_step": 276256, "epoch": 3328} {"train_loss": -25.603321075439453, "global_step": 276257, "epoch": 3328} {"train_loss": -25.4564266204834, "global_step": 276258, "epoch": 3328} {"train_loss": -25.335813522338867, "global_step": 276259, "epoch": 3328} {"train_loss": -25.098051071166992, "global_step": 276260, "epoch": 3328} {"train_loss": -25.241727828979492, "global_step": 276261, "epoch": 3328} {"train_loss": -25.154592514038086, "global_step": 276262, "epoch": 3328} {"train_loss": -25.288776397705078, "global_step": 276263, "epoch": 3328} {"train_loss": -25.1893253326416, "global_step": 276264, "epoch": 3328} {"train_loss": -25.195877075195312, "global_step": 276265, "epoch": 3328} {"train_loss": -25.35199737548828, "global_step": 276266, "epoch": 3328} {"train_loss": -25.23630714416504, "global_step": 276267, "epoch": 3328} {"train_loss": -25.096206665039062, "global_step": 276268, "epoch": 3328} {"train_loss": -24.99823570251465, "global_step": 276269, "epoch": 3328} {"train_loss": -25.395862579345703, "global_step": 276270, "epoch": 3328} {"train_loss": -25.179174423217773, "global_step": 276271, "epoch": 3328} {"train_loss": -25.26462173461914, "global_step": 276272, "epoch": 3328} {"train_loss": -25.247282028198242, "global_step": 276273, "epoch": 3328} {"train_loss": -25.071044921875, "global_step": 276274, "epoch": 3328} {"train_loss": -25.42097282409668, "global_step": 276275, "epoch": 3328} {"train_loss": -25.115259170532227, "global_step": 276276, "epoch": 3328} {"train_loss": -25.450637817382812, "global_step": 276277, "epoch": 3328} {"train_loss": -25.206146240234375, "global_step": 276278, "epoch": 3328} {"train_loss": -25.622028350830078, "global_step": 276279, "epoch": 3328} {"train_loss": -25.384052276611328, "global_step": 276280, "epoch": 3328} {"train_loss": -25.383760452270508, "global_step": 276281, "epoch": 3328} {"train_loss": -25.15852165222168, "global_step": 276282, "epoch": 3328} {"train_loss": -25.55706024169922, "global_step": 276283, "epoch": 3328} {"train_loss": -25.423480987548828, "global_step": 276284, "epoch": 3328} {"train_loss": -25.579565048217773, "global_step": 276285, "epoch": 3328} {"train_loss": -25.20966339111328, "global_step": 276286, "epoch": 3328} {"train_loss": -25.592771530151367, "global_step": 276287, "epoch": 3328} {"train_loss": -25.45366859436035, "global_step": 276288, "epoch": 3328} {"train_loss": -25.587753295898438, "global_step": 276289, "epoch": 3328} {"train_loss": -25.210681915283203, "global_step": 276290, "epoch": 3328} {"train_loss": -25.598556518554688, "global_step": 276291, "epoch": 3328} {"train_loss": -25.703662872314453, "global_step": 276292, "epoch": 3328} {"train_loss": -25.494489669799805, "global_step": 276293, "epoch": 3328} {"train_loss": -25.405553817749023, "global_step": 276294, "epoch": 3328} {"train_loss": -25.033763885498047, "global_step": 276295, "epoch": 3328} {"train_loss": -25.328271865844727, "global_step": 276296, "epoch": 3328} {"train_loss": -25.39531135559082, "global_step": 276297, "epoch": 3328} {"train_loss": -25.77681541442871, "global_step": 276298, "epoch": 3328} {"train_loss": -25.230894088745117, "global_step": 276299, "epoch": 3328} {"train_loss": -25.414499282836914, "global_step": 276300, "epoch": 3328} {"train_loss": -25.489566802978516, "global_step": 276301, "epoch": 3328} {"train_loss": -25.2921142578125, "global_step": 276302, "epoch": 3328} {"train_loss": -25.579654693603516, "global_step": 276303, "epoch": 3328} {"train_loss": -25.533483505249023, "global_step": 276304, "epoch": 3328} {"train_loss": -25.731969833374023, "global_step": 276305, "epoch": 3328} {"train_loss": -25.34943258905985, "global_step": 276306, "epoch": 3328, "val_loss": 7158149.0} {"train_loss": -25.56314468383789, "global_step": 276307, "epoch": 3329} {"train_loss": -25.06850242614746, "global_step": 276308, "epoch": 3329} {"train_loss": -24.96034049987793, "global_step": 276309, "epoch": 3329} {"train_loss": -25.072080612182617, "global_step": 276310, "epoch": 3329} {"train_loss": -25.177854537963867, "global_step": 276311, "epoch": 3329} {"train_loss": -25.486597061157227, "global_step": 276312, "epoch": 3329} {"train_loss": -25.25882911682129, "global_step": 276313, "epoch": 3329} {"train_loss": -25.64393424987793, "global_step": 276314, "epoch": 3329} {"train_loss": -25.281587600708008, "global_step": 276315, "epoch": 3329} {"train_loss": -25.31954574584961, "global_step": 276316, "epoch": 3329} {"train_loss": -25.049158096313477, "global_step": 276317, "epoch": 3329} {"train_loss": -25.181869506835938, "global_step": 276318, "epoch": 3329} {"train_loss": -25.145538330078125, "global_step": 276319, "epoch": 3329} {"train_loss": -24.747207641601562, "global_step": 276320, "epoch": 3329} {"train_loss": -25.200790405273438, "global_step": 276321, "epoch": 3329} {"train_loss": -25.464031219482422, "global_step": 276322, "epoch": 3329} {"train_loss": -25.226694107055664, "global_step": 276323, "epoch": 3329} {"train_loss": -25.267812728881836, "global_step": 276324, "epoch": 3329} {"train_loss": -24.86318016052246, "global_step": 276325, "epoch": 3329} {"train_loss": -24.700714111328125, "global_step": 276326, "epoch": 3329} {"train_loss": -24.45290184020996, "global_step": 276327, "epoch": 3329} {"train_loss": -25.083375930786133, "global_step": 276328, "epoch": 3329} {"train_loss": -24.83369255065918, "global_step": 276329, "epoch": 3329} {"train_loss": -24.84732437133789, "global_step": 276330, "epoch": 3329} {"train_loss": -25.072479248046875, "global_step": 276331, "epoch": 3329} {"train_loss": -24.766040802001953, "global_step": 276332, "epoch": 3329} {"train_loss": -25.215173721313477, "global_step": 276333, "epoch": 3329} {"train_loss": -24.99393653869629, "global_step": 276334, "epoch": 3329} {"train_loss": -25.215694427490234, "global_step": 276335, "epoch": 3329} {"train_loss": -25.110816955566406, "global_step": 276336, "epoch": 3329} {"train_loss": -25.05989646911621, "global_step": 276337, "epoch": 3329} {"train_loss": -25.29681396484375, "global_step": 276338, "epoch": 3329} {"train_loss": -25.141908645629883, "global_step": 276339, "epoch": 3329} {"train_loss": -25.094825744628906, "global_step": 276340, "epoch": 3329} {"train_loss": -25.067102432250977, "global_step": 276341, "epoch": 3329} {"train_loss": -25.400442123413086, "global_step": 276342, "epoch": 3329} {"train_loss": -25.237272262573242, "global_step": 276343, "epoch": 3329} {"train_loss": -25.242107391357422, "global_step": 276344, "epoch": 3329} {"train_loss": -25.66475486755371, "global_step": 276345, "epoch": 3329} {"train_loss": -25.43011474609375, "global_step": 276346, "epoch": 3329} {"train_loss": -25.625263214111328, "global_step": 276347, "epoch": 3329} {"train_loss": -25.109214782714844, "global_step": 276348, "epoch": 3329} {"train_loss": -25.509246826171875, "global_step": 276349, "epoch": 3329} {"train_loss": -25.3825740814209, "global_step": 276350, "epoch": 3329} {"train_loss": -25.508901596069336, "global_step": 276351, "epoch": 3329} {"train_loss": -24.987329483032227, "global_step": 276352, "epoch": 3329} {"train_loss": -25.336362838745117, "global_step": 276353, "epoch": 3329} {"train_loss": -25.6968936920166, "global_step": 276354, "epoch": 3329} {"train_loss": -25.400684356689453, "global_step": 276355, "epoch": 3329} {"train_loss": -25.24676513671875, "global_step": 276356, "epoch": 3329} {"train_loss": -25.24149513244629, "global_step": 276357, "epoch": 3329} {"train_loss": -25.80185890197754, "global_step": 276358, "epoch": 3329} {"train_loss": -25.52097511291504, "global_step": 276359, "epoch": 3329} {"train_loss": -25.630313873291016, "global_step": 276360, "epoch": 3329} {"train_loss": -25.884708404541016, "global_step": 276361, "epoch": 3329} {"train_loss": -25.093626022338867, "global_step": 276362, "epoch": 3329} {"train_loss": -25.386289596557617, "global_step": 276363, "epoch": 3329} {"train_loss": -25.58856773376465, "global_step": 276364, "epoch": 3329} {"train_loss": -25.61260986328125, "global_step": 276365, "epoch": 3329} {"train_loss": -25.67752456665039, "global_step": 276366, "epoch": 3329} {"train_loss": -25.459369659423828, "global_step": 276367, "epoch": 3329} {"train_loss": -25.26262855529785, "global_step": 276368, "epoch": 3329} {"train_loss": -25.378522872924805, "global_step": 276369, "epoch": 3329} {"train_loss": -25.837121963500977, "global_step": 276370, "epoch": 3329} {"train_loss": -25.38052749633789, "global_step": 276371, "epoch": 3329} {"train_loss": -25.485132217407227, "global_step": 276372, "epoch": 3329} {"train_loss": -25.170469284057617, "global_step": 276373, "epoch": 3329} {"train_loss": -25.674875259399414, "global_step": 276374, "epoch": 3329} {"train_loss": -25.228588104248047, "global_step": 276375, "epoch": 3329} {"train_loss": -25.62967872619629, "global_step": 276376, "epoch": 3329} {"train_loss": -25.379945755004883, "global_step": 276377, "epoch": 3329} {"train_loss": -25.448720932006836, "global_step": 276378, "epoch": 3329} {"train_loss": -25.613508224487305, "global_step": 276379, "epoch": 3329} {"train_loss": -25.591583251953125, "global_step": 276380, "epoch": 3329} {"train_loss": -25.390003204345703, "global_step": 276381, "epoch": 3329} {"train_loss": -25.666501998901367, "global_step": 276382, "epoch": 3329} {"train_loss": -25.394975662231445, "global_step": 276383, "epoch": 3329} {"train_loss": -25.641632080078125, "global_step": 276384, "epoch": 3329} {"train_loss": -25.255512237548828, "global_step": 276385, "epoch": 3329} {"train_loss": -25.49892234802246, "global_step": 276386, "epoch": 3329} {"train_loss": -25.328598022460938, "global_step": 276387, "epoch": 3329} {"train_loss": -25.8055419921875, "global_step": 276388, "epoch": 3329} {"train_loss": -25.320318727608186, "global_step": 276389, "epoch": 3329, "val_loss": 7065912.0} {"train_loss": -25.239301681518555, "global_step": 276390, "epoch": 3330} {"train_loss": -25.100391387939453, "global_step": 276391, "epoch": 3330} {"train_loss": -25.205198287963867, "global_step": 276392, "epoch": 3330} {"train_loss": -24.885604858398438, "global_step": 276393, "epoch": 3330} {"train_loss": -23.90485954284668, "global_step": 276394, "epoch": 3330} {"train_loss": -24.337249755859375, "global_step": 276395, "epoch": 3330} {"train_loss": -24.676456451416016, "global_step": 276396, "epoch": 3330} {"train_loss": -25.149057388305664, "global_step": 276397, "epoch": 3330} {"train_loss": -24.814836502075195, "global_step": 276398, "epoch": 3330} {"train_loss": -24.615915298461914, "global_step": 276399, "epoch": 3330} {"train_loss": -25.052433013916016, "global_step": 276400, "epoch": 3330} {"train_loss": -24.85935401916504, "global_step": 276401, "epoch": 3330} {"train_loss": -25.3433837890625, "global_step": 276402, "epoch": 3330} {"train_loss": -25.15192222595215, "global_step": 276403, "epoch": 3330} {"train_loss": -25.20099449157715, "global_step": 276404, "epoch": 3330} {"train_loss": -25.160442352294922, "global_step": 276405, "epoch": 3330} {"train_loss": -25.21565055847168, "global_step": 276406, "epoch": 3330} {"train_loss": -25.261205673217773, "global_step": 276407, "epoch": 3330} {"train_loss": -25.19182586669922, "global_step": 276408, "epoch": 3330} {"train_loss": -25.18406867980957, "global_step": 276409, "epoch": 3330} {"train_loss": -25.439451217651367, "global_step": 276410, "epoch": 3330} {"train_loss": -25.169832229614258, "global_step": 276411, "epoch": 3330} {"train_loss": -25.402488708496094, "global_step": 276412, "epoch": 3330} {"train_loss": -24.96882438659668, "global_step": 276413, "epoch": 3330} {"train_loss": -25.15599822998047, "global_step": 276414, "epoch": 3330} {"train_loss": -25.399728775024414, "global_step": 276415, "epoch": 3330} {"train_loss": -25.438459396362305, "global_step": 276416, "epoch": 3330} {"train_loss": -25.06561279296875, "global_step": 276417, "epoch": 3330} {"train_loss": -25.52115249633789, "global_step": 276418, "epoch": 3330} {"train_loss": -25.402524948120117, "global_step": 276419, "epoch": 3330} {"train_loss": -25.414575576782227, "global_step": 276420, "epoch": 3330} {"train_loss": -25.318334579467773, "global_step": 276421, "epoch": 3330} {"train_loss": -25.42862892150879, "global_step": 276422, "epoch": 3330} {"train_loss": -25.274124145507812, "global_step": 276423, "epoch": 3330} {"train_loss": -25.403366088867188, "global_step": 276424, "epoch": 3330} {"train_loss": -25.238733291625977, "global_step": 276425, "epoch": 3330} {"train_loss": -25.48649024963379, "global_step": 276426, "epoch": 3330} {"train_loss": -25.507144927978516, "global_step": 276427, "epoch": 3330} {"train_loss": -25.522686004638672, "global_step": 276428, "epoch": 3330} {"train_loss": -25.496219635009766, "global_step": 276429, "epoch": 3330} {"train_loss": -25.754064559936523, "global_step": 276430, "epoch": 3330} {"train_loss": -25.386016845703125, "global_step": 276431, "epoch": 3330} {"train_loss": -25.183006286621094, "global_step": 276432, "epoch": 3330} {"train_loss": -25.213138580322266, "global_step": 276433, "epoch": 3330} {"train_loss": -25.35232162475586, "global_step": 276434, "epoch": 3330} {"train_loss": -25.439281463623047, "global_step": 276435, "epoch": 3330} {"train_loss": -25.67854881286621, "global_step": 276436, "epoch": 3330} {"train_loss": -25.462629318237305, "global_step": 276437, "epoch": 3330} {"train_loss": -25.256515502929688, "global_step": 276438, "epoch": 3330} {"train_loss": -25.694067001342773, "global_step": 276439, "epoch": 3330} {"train_loss": -25.51143455505371, "global_step": 276440, "epoch": 3330} {"train_loss": -25.170047760009766, "global_step": 276441, "epoch": 3330} {"train_loss": -25.225736618041992, "global_step": 276442, "epoch": 3330} {"train_loss": -25.588857650756836, "global_step": 276443, "epoch": 3330} {"train_loss": -25.403894424438477, "global_step": 276444, "epoch": 3330} {"train_loss": -25.46675682067871, "global_step": 276445, "epoch": 3330} {"train_loss": -25.35178565979004, "global_step": 276446, "epoch": 3330} {"train_loss": -25.12250328063965, "global_step": 276447, "epoch": 3330} {"train_loss": -25.58431625366211, "global_step": 276448, "epoch": 3330} {"train_loss": -25.655384063720703, "global_step": 276449, "epoch": 3330} {"train_loss": -25.661956787109375, "global_step": 276450, "epoch": 3330} {"train_loss": -25.256221771240234, "global_step": 276451, "epoch": 3330} {"train_loss": -25.33588981628418, "global_step": 276452, "epoch": 3330} {"train_loss": -25.42158317565918, "global_step": 276453, "epoch": 3330} {"train_loss": -25.407093048095703, "global_step": 276454, "epoch": 3330} {"train_loss": -25.386716842651367, "global_step": 276455, "epoch": 3330} {"train_loss": -25.055152893066406, "global_step": 276456, "epoch": 3330} {"train_loss": -25.379926681518555, "global_step": 276457, "epoch": 3330} {"train_loss": -25.34535789489746, "global_step": 276458, "epoch": 3330} {"train_loss": -25.24672508239746, "global_step": 276459, "epoch": 3330} {"train_loss": -25.100862503051758, "global_step": 276460, "epoch": 3330} {"train_loss": -25.215206146240234, "global_step": 276461, "epoch": 3330} {"train_loss": -25.06904411315918, "global_step": 276462, "epoch": 3330} {"train_loss": -25.452274322509766, "global_step": 276463, "epoch": 3330} {"train_loss": -25.38709259033203, "global_step": 276464, "epoch": 3330} {"train_loss": -25.57863998413086, "global_step": 276465, "epoch": 3330} {"train_loss": -25.102733612060547, "global_step": 276466, "epoch": 3330} {"train_loss": -25.19880485534668, "global_step": 276467, "epoch": 3330} {"train_loss": -25.64362907409668, "global_step": 276468, "epoch": 3330} {"train_loss": -25.28601837158203, "global_step": 276469, "epoch": 3330} {"train_loss": -25.477252960205078, "global_step": 276470, "epoch": 3330} {"train_loss": -25.678613662719727, "global_step": 276471, "epoch": 3330} {"train_loss": -25.275093377354633, "global_step": 276472, "epoch": 3330, "val_loss": 6951730.5} {"train_loss": -25.113113403320312, "global_step": 276473, "epoch": 3331} {"train_loss": -24.92348289489746, "global_step": 276474, "epoch": 3331} {"train_loss": -25.220645904541016, "global_step": 276475, "epoch": 3331} {"train_loss": -24.950918197631836, "global_step": 276476, "epoch": 3331} {"train_loss": -24.89409637451172, "global_step": 276477, "epoch": 3331} {"train_loss": -24.927539825439453, "global_step": 276478, "epoch": 3331} {"train_loss": -25.506195068359375, "global_step": 276479, "epoch": 3331} {"train_loss": -25.059415817260742, "global_step": 276480, "epoch": 3331} {"train_loss": -25.20753288269043, "global_step": 276481, "epoch": 3331} {"train_loss": -25.442941665649414, "global_step": 276482, "epoch": 3331} {"train_loss": -25.42461585998535, "global_step": 276483, "epoch": 3331} {"train_loss": -25.25331687927246, "global_step": 276484, "epoch": 3331} {"train_loss": -25.370529174804688, "global_step": 276485, "epoch": 3331} {"train_loss": -25.29047203063965, "global_step": 276486, "epoch": 3331} {"train_loss": -25.09541130065918, "global_step": 276487, "epoch": 3331} {"train_loss": -25.12507438659668, "global_step": 276488, "epoch": 3331} {"train_loss": -25.012331008911133, "global_step": 276489, "epoch": 3331} {"train_loss": -25.44898796081543, "global_step": 276490, "epoch": 3331} {"train_loss": -24.771162033081055, "global_step": 276491, "epoch": 3331} {"train_loss": -25.376806259155273, "global_step": 276492, "epoch": 3331} {"train_loss": -25.135908126831055, "global_step": 276493, "epoch": 3331} {"train_loss": -25.410348892211914, "global_step": 276494, "epoch": 3331} {"train_loss": -25.12534523010254, "global_step": 276495, "epoch": 3331} {"train_loss": -25.702716827392578, "global_step": 276496, "epoch": 3331} {"train_loss": -25.1980037689209, "global_step": 276497, "epoch": 3331} {"train_loss": -25.535310745239258, "global_step": 276498, "epoch": 3331} {"train_loss": -24.944381713867188, "global_step": 276499, "epoch": 3331} {"train_loss": -25.315780639648438, "global_step": 276500, "epoch": 3331} {"train_loss": -25.66277503967285, "global_step": 276501, "epoch": 3331} {"train_loss": -24.96111488342285, "global_step": 276502, "epoch": 3331} {"train_loss": -25.1492919921875, "global_step": 276503, "epoch": 3331} {"train_loss": -25.084135055541992, "global_step": 276504, "epoch": 3331} {"train_loss": -25.31493377685547, "global_step": 276505, "epoch": 3331} {"train_loss": -25.412870407104492, "global_step": 276506, "epoch": 3331} {"train_loss": -25.42921257019043, "global_step": 276507, "epoch": 3331} {"train_loss": -25.29026222229004, "global_step": 276508, "epoch": 3331} {"train_loss": -25.40980339050293, "global_step": 276509, "epoch": 3331} {"train_loss": -25.844146728515625, "global_step": 276510, "epoch": 3331} {"train_loss": -25.697193145751953, "global_step": 276511, "epoch": 3331} {"train_loss": -25.393022537231445, "global_step": 276512, "epoch": 3331} {"train_loss": -25.599939346313477, "global_step": 276513, "epoch": 3331} {"train_loss": -25.635757446289062, "global_step": 276514, "epoch": 3331} {"train_loss": -25.653013229370117, "global_step": 276515, "epoch": 3331} {"train_loss": -25.477371215820312, "global_step": 276516, "epoch": 3331} {"train_loss": -25.680509567260742, "global_step": 276517, "epoch": 3331} {"train_loss": -25.119903564453125, "global_step": 276518, "epoch": 3331} {"train_loss": -25.193655014038086, "global_step": 276519, "epoch": 3331} {"train_loss": -25.1518611907959, "global_step": 276520, "epoch": 3331} {"train_loss": -25.142587661743164, "global_step": 276521, "epoch": 3331} {"train_loss": -25.199447631835938, "global_step": 276522, "epoch": 3331} {"train_loss": -25.51728057861328, "global_step": 276523, "epoch": 3331} {"train_loss": -25.259611129760742, "global_step": 276524, "epoch": 3331} {"train_loss": -25.474689483642578, "global_step": 276525, "epoch": 3331} {"train_loss": -25.619855880737305, "global_step": 276526, "epoch": 3331} {"train_loss": -25.563732147216797, "global_step": 276527, "epoch": 3331} {"train_loss": -24.86937713623047, "global_step": 276528, "epoch": 3331} {"train_loss": -25.107885360717773, "global_step": 276529, "epoch": 3331} {"train_loss": -25.125228881835938, "global_step": 276530, "epoch": 3331} {"train_loss": -25.511564254760742, "global_step": 276531, "epoch": 3331} {"train_loss": -25.275257110595703, "global_step": 276532, "epoch": 3331} {"train_loss": -25.212810516357422, "global_step": 276533, "epoch": 3331} {"train_loss": -25.37289810180664, "global_step": 276534, "epoch": 3331} {"train_loss": -25.35724449157715, "global_step": 276535, "epoch": 3331} {"train_loss": -25.2595272064209, "global_step": 276536, "epoch": 3331} {"train_loss": -25.509075164794922, "global_step": 276537, "epoch": 3331} {"train_loss": -25.63922119140625, "global_step": 276538, "epoch": 3331} {"train_loss": -25.1612606048584, "global_step": 276539, "epoch": 3331} {"train_loss": -25.251501083374023, "global_step": 276540, "epoch": 3331} {"train_loss": -25.053068161010742, "global_step": 276541, "epoch": 3331} {"train_loss": -25.378293991088867, "global_step": 276542, "epoch": 3331} {"train_loss": -25.390125274658203, "global_step": 276543, "epoch": 3331} {"train_loss": -25.224035263061523, "global_step": 276544, "epoch": 3331} {"train_loss": -25.097740173339844, "global_step": 276545, "epoch": 3331} {"train_loss": -25.086820602416992, "global_step": 276546, "epoch": 3331} {"train_loss": -25.255271911621094, "global_step": 276547, "epoch": 3331} {"train_loss": -25.216806411743164, "global_step": 276548, "epoch": 3331} {"train_loss": -25.470609664916992, "global_step": 276549, "epoch": 3331} {"train_loss": -25.304311752319336, "global_step": 276550, "epoch": 3331} {"train_loss": -25.01167106628418, "global_step": 276551, "epoch": 3331} {"train_loss": -25.46877098083496, "global_step": 276552, "epoch": 3331} {"train_loss": -25.39385986328125, "global_step": 276553, "epoch": 3331} {"train_loss": -25.267864227294922, "global_step": 276554, "epoch": 3331} {"train_loss": -25.28804631980069, "global_step": 276555, "epoch": 3331, "val_loss": 6942556.0} {"train_loss": -24.812559127807617, "global_step": 276556, "epoch": 3332} {"train_loss": -24.66587257385254, "global_step": 276557, "epoch": 3332} {"train_loss": -25.05677604675293, "global_step": 276558, "epoch": 3332} {"train_loss": -24.73175621032715, "global_step": 276559, "epoch": 3332} {"train_loss": -24.795766830444336, "global_step": 276560, "epoch": 3332} {"train_loss": -24.458663940429688, "global_step": 276561, "epoch": 3332} {"train_loss": -24.581222534179688, "global_step": 276562, "epoch": 3332} {"train_loss": -24.677881240844727, "global_step": 276563, "epoch": 3332} {"train_loss": -24.673601150512695, "global_step": 276564, "epoch": 3332} {"train_loss": -24.525836944580078, "global_step": 276565, "epoch": 3332} {"train_loss": -24.942951202392578, "global_step": 276566, "epoch": 3332} {"train_loss": -25.48940086364746, "global_step": 276567, "epoch": 3332} {"train_loss": -24.789682388305664, "global_step": 276568, "epoch": 3332} {"train_loss": -24.920503616333008, "global_step": 276569, "epoch": 3332} {"train_loss": -24.551218032836914, "global_step": 276570, "epoch": 3332} {"train_loss": -25.003400802612305, "global_step": 276571, "epoch": 3332} {"train_loss": -24.799190521240234, "global_step": 276572, "epoch": 3332} {"train_loss": -25.089054107666016, "global_step": 276573, "epoch": 3332} {"train_loss": -25.353830337524414, "global_step": 276574, "epoch": 3332} {"train_loss": -24.356369018554688, "global_step": 276575, "epoch": 3332} {"train_loss": -25.147581100463867, "global_step": 276576, "epoch": 3332} {"train_loss": -25.457609176635742, "global_step": 276577, "epoch": 3332} {"train_loss": -24.82286262512207, "global_step": 276578, "epoch": 3332} {"train_loss": -24.999181747436523, "global_step": 276579, "epoch": 3332} {"train_loss": -25.19870376586914, "global_step": 276580, "epoch": 3332} {"train_loss": -25.385181427001953, "global_step": 276581, "epoch": 3332} {"train_loss": -25.065298080444336, "global_step": 276582, "epoch": 3332} {"train_loss": -25.48193359375, "global_step": 276583, "epoch": 3332} {"train_loss": -25.191335678100586, "global_step": 276584, "epoch": 3332} {"train_loss": -25.154356002807617, "global_step": 276585, "epoch": 3332} {"train_loss": -25.072628021240234, "global_step": 276586, "epoch": 3332} {"train_loss": -25.3143367767334, "global_step": 276587, "epoch": 3332} {"train_loss": -25.229833602905273, "global_step": 276588, "epoch": 3332} {"train_loss": -25.50214958190918, "global_step": 276589, "epoch": 3332} {"train_loss": -25.152952194213867, "global_step": 276590, "epoch": 3332} {"train_loss": -25.671430587768555, "global_step": 276591, "epoch": 3332} {"train_loss": -25.112972259521484, "global_step": 276592, "epoch": 3332} {"train_loss": -25.623266220092773, "global_step": 276593, "epoch": 3332} {"train_loss": -25.452651977539062, "global_step": 276594, "epoch": 3332} {"train_loss": -25.513715744018555, "global_step": 276595, "epoch": 3332} {"train_loss": -25.238204956054688, "global_step": 276596, "epoch": 3332} {"train_loss": -25.224327087402344, "global_step": 276597, "epoch": 3332} {"train_loss": -25.354549407958984, "global_step": 276598, "epoch": 3332} {"train_loss": -25.34498405456543, "global_step": 276599, "epoch": 3332} {"train_loss": -25.332426071166992, "global_step": 276600, "epoch": 3332} {"train_loss": -25.481657028198242, "global_step": 276601, "epoch": 3332} {"train_loss": -25.203481674194336, "global_step": 276602, "epoch": 3332} {"train_loss": -25.442523956298828, "global_step": 276603, "epoch": 3332} {"train_loss": -25.30670928955078, "global_step": 276604, "epoch": 3332} {"train_loss": -25.42221450805664, "global_step": 276605, "epoch": 3332} {"train_loss": -25.142227172851562, "global_step": 276606, "epoch": 3332} {"train_loss": -25.223623275756836, "global_step": 276607, "epoch": 3332} {"train_loss": -25.4714412689209, "global_step": 276608, "epoch": 3332} {"train_loss": -25.274642944335938, "global_step": 276609, "epoch": 3332} {"train_loss": -25.3411865234375, "global_step": 276610, "epoch": 3332} {"train_loss": -25.461198806762695, "global_step": 276611, "epoch": 3332} {"train_loss": -25.384000778198242, "global_step": 276612, "epoch": 3332} {"train_loss": -25.430856704711914, "global_step": 276613, "epoch": 3332} {"train_loss": -25.48145866394043, "global_step": 276614, "epoch": 3332} {"train_loss": -25.36931610107422, "global_step": 276615, "epoch": 3332} {"train_loss": -25.366973876953125, "global_step": 276616, "epoch": 3332} {"train_loss": -25.171056747436523, "global_step": 276617, "epoch": 3332} {"train_loss": -25.444650650024414, "global_step": 276618, "epoch": 3332} {"train_loss": -25.230892181396484, "global_step": 276619, "epoch": 3332} {"train_loss": -24.3955135345459, "global_step": 276620, "epoch": 3332} {"train_loss": -23.52825927734375, "global_step": 276621, "epoch": 3332} {"train_loss": -22.64388084411621, "global_step": 276622, "epoch": 3332} {"train_loss": -24.40291976928711, "global_step": 276623, "epoch": 3332} {"train_loss": -24.935840606689453, "global_step": 276624, "epoch": 3332} {"train_loss": -24.594707489013672, "global_step": 276625, "epoch": 3332} {"train_loss": -25.050525665283203, "global_step": 276626, "epoch": 3332} {"train_loss": -24.754785537719727, "global_step": 276627, "epoch": 3332} {"train_loss": -24.439701080322266, "global_step": 276628, "epoch": 3332} {"train_loss": -24.852712631225586, "global_step": 276629, "epoch": 3332} {"train_loss": -24.751264572143555, "global_step": 276630, "epoch": 3332} {"train_loss": -24.624267578125, "global_step": 276631, "epoch": 3332} {"train_loss": -24.763370513916016, "global_step": 276632, "epoch": 3332} {"train_loss": -24.9891300201416, "global_step": 276633, "epoch": 3332} {"train_loss": -24.743558883666992, "global_step": 276634, "epoch": 3332} {"train_loss": -24.678945541381836, "global_step": 276635, "epoch": 3332} {"train_loss": -25.166526794433594, "global_step": 276636, "epoch": 3332} {"train_loss": -24.944488525390625, "global_step": 276637, "epoch": 3332} {"train_loss": -25.0260875196342, "global_step": 276638, "epoch": 3332, "val_loss": 6930484.0} {"train_loss": -24.17664909362793, "global_step": 276639, "epoch": 3333} {"train_loss": -24.753705978393555, "global_step": 276640, "epoch": 3333} {"train_loss": -24.511377334594727, "global_step": 276641, "epoch": 3333} {"train_loss": -24.73323631286621, "global_step": 276642, "epoch": 3333} {"train_loss": -25.025104522705078, "global_step": 276643, "epoch": 3333} {"train_loss": -24.682191848754883, "global_step": 276644, "epoch": 3333} {"train_loss": -24.852798461914062, "global_step": 276645, "epoch": 3333} {"train_loss": -25.077045440673828, "global_step": 276646, "epoch": 3333} {"train_loss": -25.102270126342773, "global_step": 276647, "epoch": 3333} {"train_loss": -24.890653610229492, "global_step": 276648, "epoch": 3333} {"train_loss": -24.51338768005371, "global_step": 276649, "epoch": 3333} {"train_loss": -24.94612693786621, "global_step": 276650, "epoch": 3333} {"train_loss": -24.97405433654785, "global_step": 276651, "epoch": 3333} {"train_loss": -25.199071884155273, "global_step": 276652, "epoch": 3333} {"train_loss": -25.05837059020996, "global_step": 276653, "epoch": 3333} {"train_loss": -25.402847290039062, "global_step": 276654, "epoch": 3333} {"train_loss": -25.032129287719727, "global_step": 276655, "epoch": 3333} {"train_loss": -25.36102294921875, "global_step": 276656, "epoch": 3333} {"train_loss": -25.494802474975586, "global_step": 276657, "epoch": 3333} {"train_loss": -25.30646324157715, "global_step": 276658, "epoch": 3333} {"train_loss": -25.121702194213867, "global_step": 276659, "epoch": 3333} {"train_loss": -25.180707931518555, "global_step": 276660, "epoch": 3333} {"train_loss": -25.701343536376953, "global_step": 276661, "epoch": 3333} {"train_loss": -25.150318145751953, "global_step": 276662, "epoch": 3333} {"train_loss": -25.36724281311035, "global_step": 276663, "epoch": 3333} {"train_loss": -25.236454010009766, "global_step": 276664, "epoch": 3333} {"train_loss": -25.34840965270996, "global_step": 276665, "epoch": 3333} {"train_loss": -25.386980056762695, "global_step": 276666, "epoch": 3333} {"train_loss": -25.393301010131836, "global_step": 276667, "epoch": 3333} {"train_loss": -25.67014503479004, "global_step": 276668, "epoch": 3333} {"train_loss": -25.783828735351562, "global_step": 276669, "epoch": 3333} {"train_loss": -25.251657485961914, "global_step": 276670, "epoch": 3333} {"train_loss": -25.215505599975586, "global_step": 276671, "epoch": 3333} {"train_loss": -25.45564842224121, "global_step": 276672, "epoch": 3333} {"train_loss": -25.43501091003418, "global_step": 276673, "epoch": 3333} {"train_loss": -25.539846420288086, "global_step": 276674, "epoch": 3333} {"train_loss": -25.40583610534668, "global_step": 276675, "epoch": 3333} {"train_loss": -25.382234573364258, "global_step": 276676, "epoch": 3333} {"train_loss": -25.423954010009766, "global_step": 276677, "epoch": 3333} {"train_loss": -25.085161209106445, "global_step": 276678, "epoch": 3333} {"train_loss": -25.306852340698242, "global_step": 276679, "epoch": 3333} {"train_loss": -24.684532165527344, "global_step": 276680, "epoch": 3333} {"train_loss": -25.23624038696289, "global_step": 276681, "epoch": 3333} {"train_loss": -25.281352996826172, "global_step": 276682, "epoch": 3333} {"train_loss": -25.56692886352539, "global_step": 276683, "epoch": 3333} {"train_loss": -25.13956069946289, "global_step": 276684, "epoch": 3333} {"train_loss": -25.287189483642578, "global_step": 276685, "epoch": 3333} {"train_loss": -25.615264892578125, "global_step": 276686, "epoch": 3333} {"train_loss": -25.616943359375, "global_step": 276687, "epoch": 3333} {"train_loss": -25.411182403564453, "global_step": 276688, "epoch": 3333} {"train_loss": -25.582983016967773, "global_step": 276689, "epoch": 3333} {"train_loss": -25.831073760986328, "global_step": 276690, "epoch": 3333} {"train_loss": -25.47988510131836, "global_step": 276691, "epoch": 3333} {"train_loss": -25.244510650634766, "global_step": 276692, "epoch": 3333} {"train_loss": -25.2829647064209, "global_step": 276693, "epoch": 3333} {"train_loss": -25.747785568237305, "global_step": 276694, "epoch": 3333} {"train_loss": -25.45184898376465, "global_step": 276695, "epoch": 3333} {"train_loss": -24.833232879638672, "global_step": 276696, "epoch": 3333} {"train_loss": -25.285274505615234, "global_step": 276697, "epoch": 3333} {"train_loss": -25.391101837158203, "global_step": 276698, "epoch": 3333} {"train_loss": -25.069623947143555, "global_step": 276699, "epoch": 3333} {"train_loss": -25.558456420898438, "global_step": 276700, "epoch": 3333} {"train_loss": -25.413360595703125, "global_step": 276701, "epoch": 3333} {"train_loss": -25.201663970947266, "global_step": 276702, "epoch": 3333} {"train_loss": -25.525522232055664, "global_step": 276703, "epoch": 3333} {"train_loss": -25.48177146911621, "global_step": 276704, "epoch": 3333} {"train_loss": -25.223379135131836, "global_step": 276705, "epoch": 3333} {"train_loss": -25.757566452026367, "global_step": 276706, "epoch": 3333} {"train_loss": -25.489870071411133, "global_step": 276707, "epoch": 3333} {"train_loss": -25.386877059936523, "global_step": 276708, "epoch": 3333} {"train_loss": -25.28376579284668, "global_step": 276709, "epoch": 3333} {"train_loss": -25.118709564208984, "global_step": 276710, "epoch": 3333} {"train_loss": -25.30565071105957, "global_step": 276711, "epoch": 3333} {"train_loss": -25.663543701171875, "global_step": 276712, "epoch": 3333} {"train_loss": -25.496103286743164, "global_step": 276713, "epoch": 3333} {"train_loss": -25.375999450683594, "global_step": 276714, "epoch": 3333} {"train_loss": -25.684762954711914, "global_step": 276715, "epoch": 3333} {"train_loss": -25.448469161987305, "global_step": 276716, "epoch": 3333} {"train_loss": -25.530410766601562, "global_step": 276717, "epoch": 3333} {"train_loss": -25.643051147460938, "global_step": 276718, "epoch": 3333} {"train_loss": -25.50370216369629, "global_step": 276719, "epoch": 3333} {"train_loss": -25.002416610717773, "global_step": 276720, "epoch": 3333} {"train_loss": -25.283050835850727, "global_step": 276721, "epoch": 3333, "val_loss": 7036234.0} {"train_loss": -24.492141723632812, "global_step": 276722, "epoch": 3334} {"train_loss": -24.729639053344727, "global_step": 276723, "epoch": 3334} {"train_loss": -24.040315628051758, "global_step": 276724, "epoch": 3334} {"train_loss": -24.486684799194336, "global_step": 276725, "epoch": 3334} {"train_loss": -24.911563873291016, "global_step": 276726, "epoch": 3334} {"train_loss": -24.449676513671875, "global_step": 276727, "epoch": 3334} {"train_loss": -24.46204948425293, "global_step": 276728, "epoch": 3334} {"train_loss": -24.578475952148438, "global_step": 276729, "epoch": 3334} {"train_loss": -24.671537399291992, "global_step": 276730, "epoch": 3334} {"train_loss": -24.781641006469727, "global_step": 276731, "epoch": 3334} {"train_loss": -24.79395866394043, "global_step": 276732, "epoch": 3334} {"train_loss": -24.48868751525879, "global_step": 276733, "epoch": 3334} {"train_loss": -24.838254928588867, "global_step": 276734, "epoch": 3334} {"train_loss": -24.897432327270508, "global_step": 276735, "epoch": 3334} {"train_loss": -24.650697708129883, "global_step": 276736, "epoch": 3334} {"train_loss": -24.961423873901367, "global_step": 276737, "epoch": 3334} {"train_loss": -25.08452796936035, "global_step": 276738, "epoch": 3334} {"train_loss": -24.897022247314453, "global_step": 276739, "epoch": 3334} {"train_loss": -24.823991775512695, "global_step": 276740, "epoch": 3334} {"train_loss": -25.022573471069336, "global_step": 276741, "epoch": 3334} {"train_loss": -25.100893020629883, "global_step": 276742, "epoch": 3334} {"train_loss": -25.1540470123291, "global_step": 276743, "epoch": 3334} {"train_loss": -24.849035263061523, "global_step": 276744, "epoch": 3334} {"train_loss": -24.912277221679688, "global_step": 276745, "epoch": 3334} {"train_loss": -24.830806732177734, "global_step": 276746, "epoch": 3334} {"train_loss": -24.782291412353516, "global_step": 276747, "epoch": 3334} {"train_loss": -25.031085968017578, "global_step": 276748, "epoch": 3334} {"train_loss": -24.986928939819336, "global_step": 276749, "epoch": 3334} {"train_loss": -24.751455307006836, "global_step": 276750, "epoch": 3334} {"train_loss": -25.013416290283203, "global_step": 276751, "epoch": 3334} {"train_loss": -25.3763427734375, "global_step": 276752, "epoch": 3334} {"train_loss": -25.090185165405273, "global_step": 276753, "epoch": 3334} {"train_loss": -25.02941131591797, "global_step": 276754, "epoch": 3334} {"train_loss": -25.474733352661133, "global_step": 276755, "epoch": 3334} {"train_loss": -24.982370376586914, "global_step": 276756, "epoch": 3334} {"train_loss": -25.303329467773438, "global_step": 276757, "epoch": 3334} {"train_loss": -25.213424682617188, "global_step": 276758, "epoch": 3334} {"train_loss": -25.277183532714844, "global_step": 276759, "epoch": 3334} {"train_loss": -25.43134880065918, "global_step": 276760, "epoch": 3334} {"train_loss": -25.788854598999023, "global_step": 276761, "epoch": 3334} {"train_loss": -25.32036590576172, "global_step": 276762, "epoch": 3334} {"train_loss": -25.288793563842773, "global_step": 276763, "epoch": 3334} {"train_loss": -25.514394760131836, "global_step": 276764, "epoch": 3334} {"train_loss": -25.34641456604004, "global_step": 276765, "epoch": 3334} {"train_loss": -25.19911003112793, "global_step": 276766, "epoch": 3334} {"train_loss": -25.630401611328125, "global_step": 276767, "epoch": 3334} {"train_loss": -25.110965728759766, "global_step": 276768, "epoch": 3334} {"train_loss": -25.567218780517578, "global_step": 276769, "epoch": 3334} {"train_loss": -25.379663467407227, "global_step": 276770, "epoch": 3334} {"train_loss": -25.265676498413086, "global_step": 276771, "epoch": 3334} {"train_loss": -25.179780960083008, "global_step": 276772, "epoch": 3334} {"train_loss": -25.59437370300293, "global_step": 276773, "epoch": 3334} {"train_loss": -25.695642471313477, "global_step": 276774, "epoch": 3334} {"train_loss": -25.70302391052246, "global_step": 276775, "epoch": 3334} {"train_loss": -25.87163734436035, "global_step": 276776, "epoch": 3334} {"train_loss": -25.440832138061523, "global_step": 276777, "epoch": 3334} {"train_loss": -25.506271362304688, "global_step": 276778, "epoch": 3334} {"train_loss": -25.598936080932617, "global_step": 276779, "epoch": 3334} {"train_loss": -25.215824127197266, "global_step": 276780, "epoch": 3334} {"train_loss": -25.65907096862793, "global_step": 276781, "epoch": 3334} {"train_loss": -25.762409210205078, "global_step": 276782, "epoch": 3334} {"train_loss": -25.391422271728516, "global_step": 276783, "epoch": 3334} {"train_loss": -25.51983070373535, "global_step": 276784, "epoch": 3334} {"train_loss": -25.234188079833984, "global_step": 276785, "epoch": 3334} {"train_loss": -25.611175537109375, "global_step": 276786, "epoch": 3334} {"train_loss": -25.18580436706543, "global_step": 276787, "epoch": 3334} {"train_loss": -25.500259399414062, "global_step": 276788, "epoch": 3334} {"train_loss": -25.936542510986328, "global_step": 276789, "epoch": 3334} {"train_loss": -25.26130485534668, "global_step": 276790, "epoch": 3334} {"train_loss": -25.319433212280273, "global_step": 276791, "epoch": 3334} {"train_loss": -25.568540573120117, "global_step": 276792, "epoch": 3334} {"train_loss": -25.412092208862305, "global_step": 276793, "epoch": 3334} {"train_loss": -25.398086547851562, "global_step": 276794, "epoch": 3334} {"train_loss": -25.069990158081055, "global_step": 276795, "epoch": 3334} {"train_loss": -24.97715187072754, "global_step": 276796, "epoch": 3334} {"train_loss": -25.13043785095215, "global_step": 276797, "epoch": 3334} {"train_loss": -24.74846649169922, "global_step": 276798, "epoch": 3334} {"train_loss": -25.349645614624023, "global_step": 276799, "epoch": 3334} {"train_loss": -24.81233787536621, "global_step": 276800, "epoch": 3334} {"train_loss": -25.296979904174805, "global_step": 276801, "epoch": 3334} {"train_loss": -24.981473922729492, "global_step": 276802, "epoch": 3334} {"train_loss": -24.87142562866211, "global_step": 276803, "epoch": 3334} {"train_loss": -25.153307742383106, "global_step": 276804, "epoch": 3334, "val_loss": 7142415.5} {"train_loss": -22.21836280822754, "global_step": 276805, "epoch": 3335} {"train_loss": -23.810016632080078, "global_step": 276806, "epoch": 3335} {"train_loss": -23.234853744506836, "global_step": 276807, "epoch": 3335} {"train_loss": -23.262685775756836, "global_step": 276808, "epoch": 3335} {"train_loss": -23.71809959411621, "global_step": 276809, "epoch": 3335} {"train_loss": -23.229490280151367, "global_step": 276810, "epoch": 3335} {"train_loss": -23.744789123535156, "global_step": 276811, "epoch": 3335} {"train_loss": -24.499082565307617, "global_step": 276812, "epoch": 3335} {"train_loss": -23.856534957885742, "global_step": 276813, "epoch": 3335} {"train_loss": -24.092321395874023, "global_step": 276814, "epoch": 3335} {"train_loss": -23.571365356445312, "global_step": 276815, "epoch": 3335} {"train_loss": -24.027496337890625, "global_step": 276816, "epoch": 3335} {"train_loss": -23.889795303344727, "global_step": 276817, "epoch": 3335} {"train_loss": -24.252445220947266, "global_step": 276818, "epoch": 3335} {"train_loss": -23.974716186523438, "global_step": 276819, "epoch": 3335} {"train_loss": -24.265254974365234, "global_step": 276820, "epoch": 3335} {"train_loss": -24.289487838745117, "global_step": 276821, "epoch": 3335} {"train_loss": -24.452560424804688, "global_step": 276822, "epoch": 3335} {"train_loss": -23.87091064453125, "global_step": 276823, "epoch": 3335} {"train_loss": -24.63825798034668, "global_step": 276824, "epoch": 3335} {"train_loss": -24.496183395385742, "global_step": 276825, "epoch": 3335} {"train_loss": -24.21988868713379, "global_step": 276826, "epoch": 3335} {"train_loss": -24.665470123291016, "global_step": 276827, "epoch": 3335} {"train_loss": -24.765857696533203, "global_step": 276828, "epoch": 3335} {"train_loss": -24.748809814453125, "global_step": 276829, "epoch": 3335} {"train_loss": -24.69740867614746, "global_step": 276830, "epoch": 3335} {"train_loss": -24.671422958374023, "global_step": 276831, "epoch": 3335} {"train_loss": -24.573875427246094, "global_step": 276832, "epoch": 3335} {"train_loss": -24.938352584838867, "global_step": 276833, "epoch": 3335} {"train_loss": -24.72736930847168, "global_step": 276834, "epoch": 3335} {"train_loss": -24.78232192993164, "global_step": 276835, "epoch": 3335} {"train_loss": -24.810949325561523, "global_step": 276836, "epoch": 3335} {"train_loss": -24.868778228759766, "global_step": 276837, "epoch": 3335} {"train_loss": -24.759506225585938, "global_step": 276838, "epoch": 3335} {"train_loss": -24.852426528930664, "global_step": 276839, "epoch": 3335} {"train_loss": -24.84450912475586, "global_step": 276840, "epoch": 3335} {"train_loss": -25.08241081237793, "global_step": 276841, "epoch": 3335} {"train_loss": -25.258779525756836, "global_step": 276842, "epoch": 3335} {"train_loss": -25.67119789123535, "global_step": 276843, "epoch": 3335} {"train_loss": -25.170230865478516, "global_step": 276844, "epoch": 3335} {"train_loss": -25.016006469726562, "global_step": 276845, "epoch": 3335} {"train_loss": -24.976293563842773, "global_step": 276846, "epoch": 3335} {"train_loss": -25.40164566040039, "global_step": 276847, "epoch": 3335} {"train_loss": -25.4282169342041, "global_step": 276848, "epoch": 3335} {"train_loss": -25.117799758911133, "global_step": 276849, "epoch": 3335} {"train_loss": -25.115598678588867, "global_step": 276850, "epoch": 3335} {"train_loss": -24.97858238220215, "global_step": 276851, "epoch": 3335} {"train_loss": -25.551382064819336, "global_step": 276852, "epoch": 3335} {"train_loss": -25.171157836914062, "global_step": 276853, "epoch": 3335} {"train_loss": -25.304868698120117, "global_step": 276854, "epoch": 3335} {"train_loss": -25.49891471862793, "global_step": 276855, "epoch": 3335} {"train_loss": -25.35986328125, "global_step": 276856, "epoch": 3335} {"train_loss": -25.211246490478516, "global_step": 276857, "epoch": 3335} {"train_loss": -25.30755043029785, "global_step": 276858, "epoch": 3335} {"train_loss": -25.221731185913086, "global_step": 276859, "epoch": 3335} {"train_loss": -25.01668357849121, "global_step": 276860, "epoch": 3335} {"train_loss": -25.08082389831543, "global_step": 276861, "epoch": 3335} {"train_loss": -24.86029624938965, "global_step": 276862, "epoch": 3335} {"train_loss": -25.4733943939209, "global_step": 276863, "epoch": 3335} {"train_loss": -25.3309383392334, "global_step": 276864, "epoch": 3335} {"train_loss": -25.248472213745117, "global_step": 276865, "epoch": 3335} {"train_loss": -25.649961471557617, "global_step": 276866, "epoch": 3335} {"train_loss": -25.337677001953125, "global_step": 276867, "epoch": 3335} {"train_loss": -25.53834342956543, "global_step": 276868, "epoch": 3335} {"train_loss": -25.365039825439453, "global_step": 276869, "epoch": 3335} {"train_loss": -25.549640655517578, "global_step": 276870, "epoch": 3335} {"train_loss": -25.297801971435547, "global_step": 276871, "epoch": 3335} {"train_loss": -25.508365631103516, "global_step": 276872, "epoch": 3335} {"train_loss": -25.446500778198242, "global_step": 276873, "epoch": 3335} {"train_loss": -25.193634033203125, "global_step": 276874, "epoch": 3335} {"train_loss": -25.52181625366211, "global_step": 276875, "epoch": 3335} {"train_loss": -25.476301193237305, "global_step": 276876, "epoch": 3335} {"train_loss": -25.455121994018555, "global_step": 276877, "epoch": 3335} {"train_loss": -25.281661987304688, "global_step": 276878, "epoch": 3335} {"train_loss": -25.187213897705078, "global_step": 276879, "epoch": 3335} {"train_loss": -25.56382942199707, "global_step": 276880, "epoch": 3335} {"train_loss": -25.20694351196289, "global_step": 276881, "epoch": 3335} {"train_loss": -25.269277572631836, "global_step": 276882, "epoch": 3335} {"train_loss": -25.6336669921875, "global_step": 276883, "epoch": 3335} {"train_loss": -25.367103576660156, "global_step": 276884, "epoch": 3335} {"train_loss": -25.119678497314453, "global_step": 276885, "epoch": 3335} {"train_loss": -24.986448287963867, "global_step": 276886, "epoch": 3335} {"train_loss": -24.838952949248164, "global_step": 276887, "epoch": 3335, "val_loss": 7081241.0} {"train_loss": -25.178983688354492, "global_step": 276888, "epoch": 3336} {"train_loss": -24.413015365600586, "global_step": 276889, "epoch": 3336} {"train_loss": -24.73172950744629, "global_step": 276890, "epoch": 3336} {"train_loss": -24.524154663085938, "global_step": 276891, "epoch": 3336} {"train_loss": -25.061853408813477, "global_step": 276892, "epoch": 3336} {"train_loss": -24.654708862304688, "global_step": 276893, "epoch": 3336} {"train_loss": -25.08567237854004, "global_step": 276894, "epoch": 3336} {"train_loss": -25.076719284057617, "global_step": 276895, "epoch": 3336} {"train_loss": -24.866744995117188, "global_step": 276896, "epoch": 3336} {"train_loss": -25.238780975341797, "global_step": 276897, "epoch": 3336} {"train_loss": -24.78899574279785, "global_step": 276898, "epoch": 3336} {"train_loss": -25.322174072265625, "global_step": 276899, "epoch": 3336} {"train_loss": -25.16775894165039, "global_step": 276900, "epoch": 3336} {"train_loss": -24.726646423339844, "global_step": 276901, "epoch": 3336} {"train_loss": -25.23122215270996, "global_step": 276902, "epoch": 3336} {"train_loss": -25.512601852416992, "global_step": 276903, "epoch": 3336} {"train_loss": -25.115245819091797, "global_step": 276904, "epoch": 3336} {"train_loss": -25.046527862548828, "global_step": 276905, "epoch": 3336} {"train_loss": -25.081846237182617, "global_step": 276906, "epoch": 3336} {"train_loss": -24.980985641479492, "global_step": 276907, "epoch": 3336} {"train_loss": -25.216350555419922, "global_step": 276908, "epoch": 3336} {"train_loss": -25.040218353271484, "global_step": 276909, "epoch": 3336} {"train_loss": -25.470579147338867, "global_step": 276910, "epoch": 3336} {"train_loss": -25.36281394958496, "global_step": 276911, "epoch": 3336} {"train_loss": -24.99675178527832, "global_step": 276912, "epoch": 3336} {"train_loss": -25.1185359954834, "global_step": 276913, "epoch": 3336} {"train_loss": -25.561399459838867, "global_step": 276914, "epoch": 3336} {"train_loss": -25.66172218322754, "global_step": 276915, "epoch": 3336} {"train_loss": -25.57491683959961, "global_step": 276916, "epoch": 3336} {"train_loss": -25.594764709472656, "global_step": 276917, "epoch": 3336} {"train_loss": -25.11554527282715, "global_step": 276918, "epoch": 3336} {"train_loss": -25.631946563720703, "global_step": 276919, "epoch": 3336} {"train_loss": -24.96054458618164, "global_step": 276920, "epoch": 3336} {"train_loss": -25.468595504760742, "global_step": 276921, "epoch": 3336} {"train_loss": -25.49802017211914, "global_step": 276922, "epoch": 3336} {"train_loss": -25.04807472229004, "global_step": 276923, "epoch": 3336} {"train_loss": -25.045379638671875, "global_step": 276924, "epoch": 3336} {"train_loss": -25.479764938354492, "global_step": 276925, "epoch": 3336} {"train_loss": -25.283794403076172, "global_step": 276926, "epoch": 3336} {"train_loss": -25.405920028686523, "global_step": 276927, "epoch": 3336} {"train_loss": -25.291837692260742, "global_step": 276928, "epoch": 3336} {"train_loss": -25.444013595581055, "global_step": 276929, "epoch": 3336} {"train_loss": -25.3989200592041, "global_step": 276930, "epoch": 3336} {"train_loss": -25.619359970092773, "global_step": 276931, "epoch": 3336} {"train_loss": -25.234304428100586, "global_step": 276932, "epoch": 3336} {"train_loss": -25.461462020874023, "global_step": 276933, "epoch": 3336} {"train_loss": -25.35824966430664, "global_step": 276934, "epoch": 3336} {"train_loss": -25.338972091674805, "global_step": 276935, "epoch": 3336} {"train_loss": -25.373472213745117, "global_step": 276936, "epoch": 3336} {"train_loss": -25.35399627685547, "global_step": 276937, "epoch": 3336} {"train_loss": -25.473548889160156, "global_step": 276938, "epoch": 3336} {"train_loss": -25.548187255859375, "global_step": 276939, "epoch": 3336} {"train_loss": -25.775236129760742, "global_step": 276940, "epoch": 3336} {"train_loss": -25.430307388305664, "global_step": 276941, "epoch": 3336} {"train_loss": -25.403432846069336, "global_step": 276942, "epoch": 3336} {"train_loss": -25.448963165283203, "global_step": 276943, "epoch": 3336} {"train_loss": -25.246417999267578, "global_step": 276944, "epoch": 3336} {"train_loss": -25.424421310424805, "global_step": 276945, "epoch": 3336} {"train_loss": -25.449438095092773, "global_step": 276946, "epoch": 3336} {"train_loss": -25.284975051879883, "global_step": 276947, "epoch": 3336} {"train_loss": -25.652088165283203, "global_step": 276948, "epoch": 3336} {"train_loss": -25.54755401611328, "global_step": 276949, "epoch": 3336} {"train_loss": -25.38246726989746, "global_step": 276950, "epoch": 3336} {"train_loss": -25.331052780151367, "global_step": 276951, "epoch": 3336} {"train_loss": -25.47809410095215, "global_step": 276952, "epoch": 3336} {"train_loss": -25.390356063842773, "global_step": 276953, "epoch": 3336} {"train_loss": -25.340591430664062, "global_step": 276954, "epoch": 3336} {"train_loss": -25.423921585083008, "global_step": 276955, "epoch": 3336} {"train_loss": -25.18893814086914, "global_step": 276956, "epoch": 3336} {"train_loss": -25.36250877380371, "global_step": 276957, "epoch": 3336} {"train_loss": -25.020200729370117, "global_step": 276958, "epoch": 3336} {"train_loss": -25.339120864868164, "global_step": 276959, "epoch": 3336} {"train_loss": -25.479381561279297, "global_step": 276960, "epoch": 3336} {"train_loss": -25.425012588500977, "global_step": 276961, "epoch": 3336} {"train_loss": -25.354995727539062, "global_step": 276962, "epoch": 3336} {"train_loss": -25.4863338470459, "global_step": 276963, "epoch": 3336} {"train_loss": -25.555099487304688, "global_step": 276964, "epoch": 3336} {"train_loss": -25.755462646484375, "global_step": 276965, "epoch": 3336} {"train_loss": -25.295515060424805, "global_step": 276966, "epoch": 3336} {"train_loss": -25.63117790222168, "global_step": 276967, "epoch": 3336} {"train_loss": -25.873661041259766, "global_step": 276968, "epoch": 3336} {"train_loss": -25.66498374938965, "global_step": 276969, "epoch": 3336} {"train_loss": -25.29677632343338, "global_step": 276970, "epoch": 3336, "val_loss": 7089161.5} {"train_loss": -24.928821563720703, "global_step": 276971, "epoch": 3337} {"train_loss": -25.30276870727539, "global_step": 276972, "epoch": 3337} {"train_loss": -25.12835693359375, "global_step": 276973, "epoch": 3337} {"train_loss": -24.37238121032715, "global_step": 276974, "epoch": 3337} {"train_loss": -25.090438842773438, "global_step": 276975, "epoch": 3337} {"train_loss": -24.91567611694336, "global_step": 276976, "epoch": 3337} {"train_loss": -24.459901809692383, "global_step": 276977, "epoch": 3337} {"train_loss": -25.32097625732422, "global_step": 276978, "epoch": 3337} {"train_loss": -24.711528778076172, "global_step": 276979, "epoch": 3337} {"train_loss": -24.950510025024414, "global_step": 276980, "epoch": 3337} {"train_loss": -25.38568878173828, "global_step": 276981, "epoch": 3337} {"train_loss": -24.904600143432617, "global_step": 276982, "epoch": 3337} {"train_loss": -25.226743698120117, "global_step": 276983, "epoch": 3337} {"train_loss": -25.12251853942871, "global_step": 276984, "epoch": 3337} {"train_loss": -25.314523696899414, "global_step": 276985, "epoch": 3337} {"train_loss": -24.885705947875977, "global_step": 276986, "epoch": 3337} {"train_loss": -25.545059204101562, "global_step": 276987, "epoch": 3337} {"train_loss": -25.014848709106445, "global_step": 276988, "epoch": 3337} {"train_loss": -25.10856056213379, "global_step": 276989, "epoch": 3337} {"train_loss": -25.372814178466797, "global_step": 276990, "epoch": 3337} {"train_loss": -24.970109939575195, "global_step": 276991, "epoch": 3337} {"train_loss": -25.120647430419922, "global_step": 276992, "epoch": 3337} {"train_loss": -25.34905433654785, "global_step": 276993, "epoch": 3337} {"train_loss": -24.99544334411621, "global_step": 276994, "epoch": 3337} {"train_loss": -24.824480056762695, "global_step": 276995, "epoch": 3337} {"train_loss": -25.29265594482422, "global_step": 276996, "epoch": 3337} {"train_loss": -25.11907196044922, "global_step": 276997, "epoch": 3337} {"train_loss": -24.999435424804688, "global_step": 276998, "epoch": 3337} {"train_loss": -25.39155387878418, "global_step": 276999, "epoch": 3337} {"train_loss": -25.058446884155273, "global_step": 277000, "epoch": 3337} {"train_loss": -25.130477905273438, "global_step": 277001, "epoch": 3337} {"train_loss": -25.49460792541504, "global_step": 277002, "epoch": 3337} {"train_loss": -25.124963760375977, "global_step": 277003, "epoch": 3337} {"train_loss": -25.31747817993164, "global_step": 277004, "epoch": 3337} {"train_loss": -25.40877914428711, "global_step": 277005, "epoch": 3337} {"train_loss": -25.316511154174805, "global_step": 277006, "epoch": 3337} {"train_loss": -25.554183959960938, "global_step": 277007, "epoch": 3337} {"train_loss": -25.346878051757812, "global_step": 277008, "epoch": 3337} {"train_loss": -25.646427154541016, "global_step": 277009, "epoch": 3337} {"train_loss": -25.65450096130371, "global_step": 277010, "epoch": 3337} {"train_loss": -25.057823181152344, "global_step": 277011, "epoch": 3337} {"train_loss": -25.251619338989258, "global_step": 277012, "epoch": 3337} {"train_loss": -25.568811416625977, "global_step": 277013, "epoch": 3337} {"train_loss": -25.223928451538086, "global_step": 277014, "epoch": 3337} {"train_loss": -25.267057418823242, "global_step": 277015, "epoch": 3337} {"train_loss": -25.505292892456055, "global_step": 277016, "epoch": 3337} {"train_loss": -25.410907745361328, "global_step": 277017, "epoch": 3337} {"train_loss": -25.00203514099121, "global_step": 277018, "epoch": 3337} {"train_loss": -25.43121337890625, "global_step": 277019, "epoch": 3337} {"train_loss": -25.325300216674805, "global_step": 277020, "epoch": 3337} {"train_loss": -25.766815185546875, "global_step": 277021, "epoch": 3337} {"train_loss": -25.5311336517334, "global_step": 277022, "epoch": 3337} {"train_loss": -25.442882537841797, "global_step": 277023, "epoch": 3337} {"train_loss": -25.49037742614746, "global_step": 277024, "epoch": 3337} {"train_loss": -25.285795211791992, "global_step": 277025, "epoch": 3337} {"train_loss": -25.677148818969727, "global_step": 277026, "epoch": 3337} {"train_loss": -25.03236198425293, "global_step": 277027, "epoch": 3337} {"train_loss": -25.31694221496582, "global_step": 277028, "epoch": 3337} {"train_loss": -25.877042770385742, "global_step": 277029, "epoch": 3337} {"train_loss": -25.601226806640625, "global_step": 277030, "epoch": 3337} {"train_loss": -25.152936935424805, "global_step": 277031, "epoch": 3337} {"train_loss": -25.3194522857666, "global_step": 277032, "epoch": 3337} {"train_loss": -25.11442756652832, "global_step": 277033, "epoch": 3337} {"train_loss": -25.450916290283203, "global_step": 277034, "epoch": 3337} {"train_loss": -25.400053024291992, "global_step": 277035, "epoch": 3337} {"train_loss": -25.596420288085938, "global_step": 277036, "epoch": 3337} {"train_loss": -25.5526180267334, "global_step": 277037, "epoch": 3337} {"train_loss": -25.589670181274414, "global_step": 277038, "epoch": 3337} {"train_loss": -25.26878547668457, "global_step": 277039, "epoch": 3337} {"train_loss": -25.8029727935791, "global_step": 277040, "epoch": 3337} {"train_loss": -25.676542282104492, "global_step": 277041, "epoch": 3337} {"train_loss": -25.59152603149414, "global_step": 277042, "epoch": 3337} {"train_loss": -25.446317672729492, "global_step": 277043, "epoch": 3337} {"train_loss": -25.48196792602539, "global_step": 277044, "epoch": 3337} {"train_loss": -25.375152587890625, "global_step": 277045, "epoch": 3337} {"train_loss": -25.131103515625, "global_step": 277046, "epoch": 3337} {"train_loss": -25.4617919921875, "global_step": 277047, "epoch": 3337} {"train_loss": -25.099401473999023, "global_step": 277048, "epoch": 3337} {"train_loss": -25.397602081298828, "global_step": 277049, "epoch": 3337} {"train_loss": -25.335424423217773, "global_step": 277050, "epoch": 3337} {"train_loss": -25.26242446899414, "global_step": 277051, "epoch": 3337} {"train_loss": -25.582693099975586, "global_step": 277052, "epoch": 3337} {"train_loss": -25.268932181668568, "global_step": 277053, "epoch": 3337, "val_loss": 7113690.0} {"train_loss": -23.49897575378418, "global_step": 277054, "epoch": 3338} {"train_loss": -23.24126625061035, "global_step": 277055, "epoch": 3338} {"train_loss": -24.749183654785156, "global_step": 277056, "epoch": 3338} {"train_loss": -23.483844757080078, "global_step": 277057, "epoch": 3338} {"train_loss": -24.714338302612305, "global_step": 277058, "epoch": 3338} {"train_loss": -24.36995506286621, "global_step": 277059, "epoch": 3338} {"train_loss": -24.3984317779541, "global_step": 277060, "epoch": 3338} {"train_loss": -24.064605712890625, "global_step": 277061, "epoch": 3338} {"train_loss": -24.41005516052246, "global_step": 277062, "epoch": 3338} {"train_loss": -24.58205223083496, "global_step": 277063, "epoch": 3338} {"train_loss": -24.45505714416504, "global_step": 277064, "epoch": 3338} {"train_loss": -24.502429962158203, "global_step": 277065, "epoch": 3338} {"train_loss": -25.0689697265625, "global_step": 277066, "epoch": 3338} {"train_loss": -24.5687255859375, "global_step": 277067, "epoch": 3338} {"train_loss": -24.676855087280273, "global_step": 277068, "epoch": 3338} {"train_loss": -25.08774185180664, "global_step": 277069, "epoch": 3338} {"train_loss": -25.02783203125, "global_step": 277070, "epoch": 3338} {"train_loss": -24.738994598388672, "global_step": 277071, "epoch": 3338} {"train_loss": -24.979902267456055, "global_step": 277072, "epoch": 3338} {"train_loss": -24.776700973510742, "global_step": 277073, "epoch": 3338} {"train_loss": -24.64806365966797, "global_step": 277074, "epoch": 3338} {"train_loss": -24.949264526367188, "global_step": 277075, "epoch": 3338} {"train_loss": -25.032861709594727, "global_step": 277076, "epoch": 3338} {"train_loss": -24.968637466430664, "global_step": 277077, "epoch": 3338} {"train_loss": -25.010915756225586, "global_step": 277078, "epoch": 3338} {"train_loss": -24.882116317749023, "global_step": 277079, "epoch": 3338} {"train_loss": -24.985200881958008, "global_step": 277080, "epoch": 3338} {"train_loss": -24.97858238220215, "global_step": 277081, "epoch": 3338} {"train_loss": -24.983261108398438, "global_step": 277082, "epoch": 3338} {"train_loss": -25.255041122436523, "global_step": 277083, "epoch": 3338} {"train_loss": -25.093732833862305, "global_step": 277084, "epoch": 3338} {"train_loss": -25.098220825195312, "global_step": 277085, "epoch": 3338} {"train_loss": -25.836538314819336, "global_step": 277086, "epoch": 3338} {"train_loss": -25.24793815612793, "global_step": 277087, "epoch": 3338} {"train_loss": -25.275327682495117, "global_step": 277088, "epoch": 3338} {"train_loss": -24.994909286499023, "global_step": 277089, "epoch": 3338} {"train_loss": -25.171903610229492, "global_step": 277090, "epoch": 3338} {"train_loss": -25.074459075927734, "global_step": 277091, "epoch": 3338} {"train_loss": -25.41516876220703, "global_step": 277092, "epoch": 3338} {"train_loss": -25.04582405090332, "global_step": 277093, "epoch": 3338} {"train_loss": -25.543325424194336, "global_step": 277094, "epoch": 3338} {"train_loss": -25.614648818969727, "global_step": 277095, "epoch": 3338} {"train_loss": -25.398038864135742, "global_step": 277096, "epoch": 3338} {"train_loss": -25.586225509643555, "global_step": 277097, "epoch": 3338} {"train_loss": -25.31610679626465, "global_step": 277098, "epoch": 3338} {"train_loss": -25.430377960205078, "global_step": 277099, "epoch": 3338} {"train_loss": -25.03297233581543, "global_step": 277100, "epoch": 3338} {"train_loss": -25.741445541381836, "global_step": 277101, "epoch": 3338} {"train_loss": -25.664188385009766, "global_step": 277102, "epoch": 3338} {"train_loss": -25.400575637817383, "global_step": 277103, "epoch": 3338} {"train_loss": -25.8049259185791, "global_step": 277104, "epoch": 3338} {"train_loss": -25.580121994018555, "global_step": 277105, "epoch": 3338} {"train_loss": -25.396076202392578, "global_step": 277106, "epoch": 3338} {"train_loss": -25.297157287597656, "global_step": 277107, "epoch": 3338} {"train_loss": -25.628690719604492, "global_step": 277108, "epoch": 3338} {"train_loss": -25.362653732299805, "global_step": 277109, "epoch": 3338} {"train_loss": -25.662174224853516, "global_step": 277110, "epoch": 3338} {"train_loss": -25.534076690673828, "global_step": 277111, "epoch": 3338} {"train_loss": -25.491254806518555, "global_step": 277112, "epoch": 3338} {"train_loss": -25.44562339782715, "global_step": 277113, "epoch": 3338} {"train_loss": -25.29648780822754, "global_step": 277114, "epoch": 3338} {"train_loss": -25.386137008666992, "global_step": 277115, "epoch": 3338} {"train_loss": -25.498292922973633, "global_step": 277116, "epoch": 3338} {"train_loss": -25.376272201538086, "global_step": 277117, "epoch": 3338} {"train_loss": -25.449207305908203, "global_step": 277118, "epoch": 3338} {"train_loss": -25.45115089416504, "global_step": 277119, "epoch": 3338} {"train_loss": -25.261524200439453, "global_step": 277120, "epoch": 3338} {"train_loss": -25.23171043395996, "global_step": 277121, "epoch": 3338} {"train_loss": -25.267736434936523, "global_step": 277122, "epoch": 3338} {"train_loss": -25.67919921875, "global_step": 277123, "epoch": 3338} {"train_loss": -25.67136001586914, "global_step": 277124, "epoch": 3338} {"train_loss": -25.272390365600586, "global_step": 277125, "epoch": 3338} {"train_loss": -25.794172286987305, "global_step": 277126, "epoch": 3338} {"train_loss": -25.637226104736328, "global_step": 277127, "epoch": 3338} {"train_loss": -25.285625457763672, "global_step": 277128, "epoch": 3338} {"train_loss": -25.666858673095703, "global_step": 277129, "epoch": 3338} {"train_loss": -25.77888298034668, "global_step": 277130, "epoch": 3338} {"train_loss": -25.096506118774414, "global_step": 277131, "epoch": 3338} {"train_loss": -24.926532745361328, "global_step": 277132, "epoch": 3338} {"train_loss": -25.604795455932617, "global_step": 277133, "epoch": 3338} {"train_loss": -25.499156951904297, "global_step": 277134, "epoch": 3338} {"train_loss": -25.346267700195312, "global_step": 277135, "epoch": 3338} {"train_loss": -25.132583526243646, "global_step": 277136, "epoch": 3338, "val_loss": 7184020.5} {"train_loss": -24.820852279663086, "global_step": 277137, "epoch": 3339} {"train_loss": -24.831138610839844, "global_step": 277138, "epoch": 3339} {"train_loss": -24.563234329223633, "global_step": 277139, "epoch": 3339} {"train_loss": -24.08477210998535, "global_step": 277140, "epoch": 3339} {"train_loss": -24.627307891845703, "global_step": 277141, "epoch": 3339} {"train_loss": -24.52389907836914, "global_step": 277142, "epoch": 3339} {"train_loss": -24.932559967041016, "global_step": 277143, "epoch": 3339} {"train_loss": -24.93299674987793, "global_step": 277144, "epoch": 3339} {"train_loss": -25.130220413208008, "global_step": 277145, "epoch": 3339} {"train_loss": -24.755056381225586, "global_step": 277146, "epoch": 3339} {"train_loss": -25.10382080078125, "global_step": 277147, "epoch": 3339} {"train_loss": -24.97968101501465, "global_step": 277148, "epoch": 3339} {"train_loss": -25.397573471069336, "global_step": 277149, "epoch": 3339} {"train_loss": -25.152021408081055, "global_step": 277150, "epoch": 3339} {"train_loss": -24.90130615234375, "global_step": 277151, "epoch": 3339} {"train_loss": -25.066431045532227, "global_step": 277152, "epoch": 3339} {"train_loss": -25.289987564086914, "global_step": 277153, "epoch": 3339} {"train_loss": -24.93484878540039, "global_step": 277154, "epoch": 3339} {"train_loss": -25.232208251953125, "global_step": 277155, "epoch": 3339} {"train_loss": -24.86052894592285, "global_step": 277156, "epoch": 3339} {"train_loss": -24.89647674560547, "global_step": 277157, "epoch": 3339} {"train_loss": -25.043888092041016, "global_step": 277158, "epoch": 3339} {"train_loss": -25.322057723999023, "global_step": 277159, "epoch": 3339} {"train_loss": -24.9993896484375, "global_step": 277160, "epoch": 3339} {"train_loss": -25.2155704498291, "global_step": 277161, "epoch": 3339} {"train_loss": -25.228656768798828, "global_step": 277162, "epoch": 3339} {"train_loss": -24.5642032623291, "global_step": 277163, "epoch": 3339} {"train_loss": -25.119827270507812, "global_step": 277164, "epoch": 3339} {"train_loss": -25.059585571289062, "global_step": 277165, "epoch": 3339} {"train_loss": -24.859853744506836, "global_step": 277166, "epoch": 3339} {"train_loss": -25.731496810913086, "global_step": 277167, "epoch": 3339} {"train_loss": -25.471885681152344, "global_step": 277168, "epoch": 3339} {"train_loss": -25.43782615661621, "global_step": 277169, "epoch": 3339} {"train_loss": -25.3019962310791, "global_step": 277170, "epoch": 3339} {"train_loss": -25.482622146606445, "global_step": 277171, "epoch": 3339} {"train_loss": -24.99149513244629, "global_step": 277172, "epoch": 3339} {"train_loss": -25.26852035522461, "global_step": 277173, "epoch": 3339} {"train_loss": -25.207096099853516, "global_step": 277174, "epoch": 3339} {"train_loss": -25.347808837890625, "global_step": 277175, "epoch": 3339} {"train_loss": -25.553979873657227, "global_step": 277176, "epoch": 3339} {"train_loss": -25.392026901245117, "global_step": 277177, "epoch": 3339} {"train_loss": -25.395797729492188, "global_step": 277178, "epoch": 3339} {"train_loss": -25.78799819946289, "global_step": 277179, "epoch": 3339} {"train_loss": -25.638105392456055, "global_step": 277180, "epoch": 3339} {"train_loss": -25.564699172973633, "global_step": 277181, "epoch": 3339} {"train_loss": -25.265836715698242, "global_step": 277182, "epoch": 3339} {"train_loss": -25.454965591430664, "global_step": 277183, "epoch": 3339} {"train_loss": -25.515485763549805, "global_step": 277184, "epoch": 3339} {"train_loss": -25.279722213745117, "global_step": 277185, "epoch": 3339} {"train_loss": -25.290597915649414, "global_step": 277186, "epoch": 3339} {"train_loss": -25.112207412719727, "global_step": 277187, "epoch": 3339} {"train_loss": -25.340534210205078, "global_step": 277188, "epoch": 3339} {"train_loss": -25.355764389038086, "global_step": 277189, "epoch": 3339} {"train_loss": -25.469144821166992, "global_step": 277190, "epoch": 3339} {"train_loss": -25.467514038085938, "global_step": 277191, "epoch": 3339} {"train_loss": -25.040525436401367, "global_step": 277192, "epoch": 3339} {"train_loss": -25.296003341674805, "global_step": 277193, "epoch": 3339} {"train_loss": -25.324926376342773, "global_step": 277194, "epoch": 3339} {"train_loss": -25.665374755859375, "global_step": 277195, "epoch": 3339} {"train_loss": -25.80926513671875, "global_step": 277196, "epoch": 3339} {"train_loss": -25.08009910583496, "global_step": 277197, "epoch": 3339} {"train_loss": -25.48322105407715, "global_step": 277198, "epoch": 3339} {"train_loss": -25.176237106323242, "global_step": 277199, "epoch": 3339} {"train_loss": -25.1412353515625, "global_step": 277200, "epoch": 3339} {"train_loss": -24.794998168945312, "global_step": 277201, "epoch": 3339} {"train_loss": -25.08095932006836, "global_step": 277202, "epoch": 3339} {"train_loss": -25.409412384033203, "global_step": 277203, "epoch": 3339} {"train_loss": -25.49934959411621, "global_step": 277204, "epoch": 3339} {"train_loss": -25.574562072753906, "global_step": 277205, "epoch": 3339} {"train_loss": -25.293230056762695, "global_step": 277206, "epoch": 3339} {"train_loss": -25.13068199157715, "global_step": 277207, "epoch": 3339} {"train_loss": -25.15524673461914, "global_step": 277208, "epoch": 3339} {"train_loss": -25.20563316345215, "global_step": 277209, "epoch": 3339} {"train_loss": -25.728788375854492, "global_step": 277210, "epoch": 3339} {"train_loss": -25.406347274780273, "global_step": 277211, "epoch": 3339} {"train_loss": -24.944808959960938, "global_step": 277212, "epoch": 3339} {"train_loss": -25.669391632080078, "global_step": 277213, "epoch": 3339} {"train_loss": -25.25977897644043, "global_step": 277214, "epoch": 3339} {"train_loss": -25.44786262512207, "global_step": 277215, "epoch": 3339} {"train_loss": -25.64594078063965, "global_step": 277216, "epoch": 3339} {"train_loss": -25.37765121459961, "global_step": 277217, "epoch": 3339} {"train_loss": -25.379804611206055, "global_step": 277218, "epoch": 3339} {"train_loss": -25.22225586764784, "global_step": 277219, "epoch": 3339, "val_loss": 6926416.0} {"train_loss": -24.893138885498047, "global_step": 277220, "epoch": 3340} {"train_loss": -25.168027877807617, "global_step": 277221, "epoch": 3340} {"train_loss": -24.971654891967773, "global_step": 277222, "epoch": 3340} {"train_loss": -25.267919540405273, "global_step": 277223, "epoch": 3340} {"train_loss": -25.29090690612793, "global_step": 277224, "epoch": 3340} {"train_loss": -24.827367782592773, "global_step": 277225, "epoch": 3340} {"train_loss": -25.207338333129883, "global_step": 277226, "epoch": 3340} {"train_loss": -24.648950576782227, "global_step": 277227, "epoch": 3340} {"train_loss": -25.411714553833008, "global_step": 277228, "epoch": 3340} {"train_loss": -25.60822105407715, "global_step": 277229, "epoch": 3340} {"train_loss": -24.85145378112793, "global_step": 277230, "epoch": 3340} {"train_loss": -24.8957576751709, "global_step": 277231, "epoch": 3340} {"train_loss": -24.878971099853516, "global_step": 277232, "epoch": 3340} {"train_loss": -25.087207794189453, "global_step": 277233, "epoch": 3340} {"train_loss": -25.360288619995117, "global_step": 277234, "epoch": 3340} {"train_loss": -25.15924835205078, "global_step": 277235, "epoch": 3340} {"train_loss": -25.17074966430664, "global_step": 277236, "epoch": 3340} {"train_loss": -25.416906356811523, "global_step": 277237, "epoch": 3340} {"train_loss": -25.215044021606445, "global_step": 277238, "epoch": 3340} {"train_loss": -25.508865356445312, "global_step": 277239, "epoch": 3340} {"train_loss": -25.40365982055664, "global_step": 277240, "epoch": 3340} {"train_loss": -25.164846420288086, "global_step": 277241, "epoch": 3340} {"train_loss": -25.261035919189453, "global_step": 277242, "epoch": 3340} {"train_loss": -25.183868408203125, "global_step": 277243, "epoch": 3340} {"train_loss": -25.463647842407227, "global_step": 277244, "epoch": 3340} {"train_loss": -25.365079879760742, "global_step": 277245, "epoch": 3340} {"train_loss": -25.394134521484375, "global_step": 277246, "epoch": 3340} {"train_loss": -25.67872428894043, "global_step": 277247, "epoch": 3340} {"train_loss": -25.634235382080078, "global_step": 277248, "epoch": 3340} {"train_loss": -25.444950103759766, "global_step": 277249, "epoch": 3340} {"train_loss": -25.352149963378906, "global_step": 277250, "epoch": 3340} {"train_loss": -25.43897247314453, "global_step": 277251, "epoch": 3340} {"train_loss": -25.17300796508789, "global_step": 277252, "epoch": 3340} {"train_loss": -25.383764266967773, "global_step": 277253, "epoch": 3340} {"train_loss": -25.333566665649414, "global_step": 277254, "epoch": 3340} {"train_loss": -25.697126388549805, "global_step": 277255, "epoch": 3340} {"train_loss": -25.679182052612305, "global_step": 277256, "epoch": 3340} {"train_loss": -25.388294219970703, "global_step": 277257, "epoch": 3340} {"train_loss": -25.30348777770996, "global_step": 277258, "epoch": 3340} {"train_loss": -25.0599308013916, "global_step": 277259, "epoch": 3340} {"train_loss": -25.738021850585938, "global_step": 277260, "epoch": 3340} {"train_loss": -25.468008041381836, "global_step": 277261, "epoch": 3340} {"train_loss": -25.668975830078125, "global_step": 277262, "epoch": 3340} {"train_loss": -25.801172256469727, "global_step": 277263, "epoch": 3340} {"train_loss": -25.463197708129883, "global_step": 277264, "epoch": 3340} {"train_loss": -25.072834014892578, "global_step": 277265, "epoch": 3340} {"train_loss": -25.348180770874023, "global_step": 277266, "epoch": 3340} {"train_loss": -25.445266723632812, "global_step": 277267, "epoch": 3340} {"train_loss": -25.67557716369629, "global_step": 277268, "epoch": 3340} {"train_loss": -25.526941299438477, "global_step": 277269, "epoch": 3340} {"train_loss": -25.841588973999023, "global_step": 277270, "epoch": 3340} {"train_loss": -25.195966720581055, "global_step": 277271, "epoch": 3340} {"train_loss": -25.61875343322754, "global_step": 277272, "epoch": 3340} {"train_loss": -25.041471481323242, "global_step": 277273, "epoch": 3340} {"train_loss": -25.28099822998047, "global_step": 277274, "epoch": 3340} {"train_loss": -25.402189254760742, "global_step": 277275, "epoch": 3340} {"train_loss": -25.280471801757812, "global_step": 277276, "epoch": 3340} {"train_loss": -25.442432403564453, "global_step": 277277, "epoch": 3340} {"train_loss": -25.58742904663086, "global_step": 277278, "epoch": 3340} {"train_loss": -25.441675186157227, "global_step": 277279, "epoch": 3340} {"train_loss": -25.475032806396484, "global_step": 277280, "epoch": 3340} {"train_loss": -25.76091957092285, "global_step": 277281, "epoch": 3340} {"train_loss": -24.931297302246094, "global_step": 277282, "epoch": 3340} {"train_loss": -25.292552947998047, "global_step": 277283, "epoch": 3340} {"train_loss": -25.37604331970215, "global_step": 277284, "epoch": 3340} {"train_loss": -25.554588317871094, "global_step": 277285, "epoch": 3340} {"train_loss": -25.4400634765625, "global_step": 277286, "epoch": 3340} {"train_loss": -25.189342498779297, "global_step": 277287, "epoch": 3340} {"train_loss": -25.427371978759766, "global_step": 277288, "epoch": 3340} {"train_loss": -25.663959503173828, "global_step": 277289, "epoch": 3340} {"train_loss": -25.52397918701172, "global_step": 277290, "epoch": 3340} {"train_loss": -25.482378005981445, "global_step": 277291, "epoch": 3340} {"train_loss": -25.69672966003418, "global_step": 277292, "epoch": 3340} {"train_loss": -25.57292366027832, "global_step": 277293, "epoch": 3340} {"train_loss": -25.658706665039062, "global_step": 277294, "epoch": 3340} {"train_loss": -25.479156494140625, "global_step": 277295, "epoch": 3340} {"train_loss": -25.62445068359375, "global_step": 277296, "epoch": 3340} {"train_loss": -26.04011344909668, "global_step": 277297, "epoch": 3340} {"train_loss": -25.536365509033203, "global_step": 277298, "epoch": 3340} {"train_loss": -25.579574584960938, "global_step": 277299, "epoch": 3340} {"train_loss": -25.23955726623535, "global_step": 277300, "epoch": 3340} {"train_loss": -25.593975067138672, "global_step": 277301, "epoch": 3340} {"train_loss": -25.387084777096668, "global_step": 277302, "epoch": 3340, "val_loss": 7260202.0} {"train_loss": -24.97364044189453, "global_step": 277303, "epoch": 3341} {"train_loss": -24.727144241333008, "global_step": 277304, "epoch": 3341} {"train_loss": -25.410612106323242, "global_step": 277305, "epoch": 3341} {"train_loss": -24.857709884643555, "global_step": 277306, "epoch": 3341} {"train_loss": -25.02689552307129, "global_step": 277307, "epoch": 3341} {"train_loss": -24.90163230895996, "global_step": 277308, "epoch": 3341} {"train_loss": -24.968412399291992, "global_step": 277309, "epoch": 3341} {"train_loss": -25.432538986206055, "global_step": 277310, "epoch": 3341} {"train_loss": -25.006982803344727, "global_step": 277311, "epoch": 3341} {"train_loss": -25.03290557861328, "global_step": 277312, "epoch": 3341} {"train_loss": -25.2202091217041, "global_step": 277313, "epoch": 3341} {"train_loss": -24.829971313476562, "global_step": 277314, "epoch": 3341} {"train_loss": -25.576047897338867, "global_step": 277315, "epoch": 3341} {"train_loss": -24.821134567260742, "global_step": 277316, "epoch": 3341} {"train_loss": -24.65961456298828, "global_step": 277317, "epoch": 3341} {"train_loss": -24.865156173706055, "global_step": 277318, "epoch": 3341} {"train_loss": -24.55374526977539, "global_step": 277319, "epoch": 3341} {"train_loss": -24.616819381713867, "global_step": 277320, "epoch": 3341} {"train_loss": -24.86395263671875, "global_step": 277321, "epoch": 3341} {"train_loss": -24.83111000061035, "global_step": 277322, "epoch": 3341} {"train_loss": -24.893613815307617, "global_step": 277323, "epoch": 3341} {"train_loss": -25.40774917602539, "global_step": 277324, "epoch": 3341} {"train_loss": -24.913288116455078, "global_step": 277325, "epoch": 3341} {"train_loss": -25.40445899963379, "global_step": 277326, "epoch": 3341} {"train_loss": -25.174131393432617, "global_step": 277327, "epoch": 3341} {"train_loss": -25.32220458984375, "global_step": 277328, "epoch": 3341} {"train_loss": -25.258560180664062, "global_step": 277329, "epoch": 3341} {"train_loss": -25.24812126159668, "global_step": 277330, "epoch": 3341} {"train_loss": -25.263765335083008, "global_step": 277331, "epoch": 3341} {"train_loss": -25.42502212524414, "global_step": 277332, "epoch": 3341} {"train_loss": -25.02956199645996, "global_step": 277333, "epoch": 3341} {"train_loss": -24.701128005981445, "global_step": 277334, "epoch": 3341} {"train_loss": -25.69353675842285, "global_step": 277335, "epoch": 3341} {"train_loss": -25.149755477905273, "global_step": 277336, "epoch": 3341} {"train_loss": -25.38047981262207, "global_step": 277337, "epoch": 3341} {"train_loss": -25.108346939086914, "global_step": 277338, "epoch": 3341} {"train_loss": -25.13050651550293, "global_step": 277339, "epoch": 3341} {"train_loss": -25.36256217956543, "global_step": 277340, "epoch": 3341} {"train_loss": -24.989736557006836, "global_step": 277341, "epoch": 3341} {"train_loss": -25.55776596069336, "global_step": 277342, "epoch": 3341} {"train_loss": -25.274015426635742, "global_step": 277343, "epoch": 3341} {"train_loss": -25.299659729003906, "global_step": 277344, "epoch": 3341} {"train_loss": -25.830780029296875, "global_step": 277345, "epoch": 3341} {"train_loss": -25.12523651123047, "global_step": 277346, "epoch": 3341} {"train_loss": -25.155258178710938, "global_step": 277347, "epoch": 3341} {"train_loss": -25.3134822845459, "global_step": 277348, "epoch": 3341} {"train_loss": -25.47600555419922, "global_step": 277349, "epoch": 3341} {"train_loss": -25.22480583190918, "global_step": 277350, "epoch": 3341} {"train_loss": -25.390602111816406, "global_step": 277351, "epoch": 3341} {"train_loss": -25.571340560913086, "global_step": 277352, "epoch": 3341} {"train_loss": -25.634735107421875, "global_step": 277353, "epoch": 3341} {"train_loss": -25.324031829833984, "global_step": 277354, "epoch": 3341} {"train_loss": -25.83173942565918, "global_step": 277355, "epoch": 3341} {"train_loss": -25.495134353637695, "global_step": 277356, "epoch": 3341} {"train_loss": -25.770191192626953, "global_step": 277357, "epoch": 3341} {"train_loss": -25.47047233581543, "global_step": 277358, "epoch": 3341} {"train_loss": -25.699325561523438, "global_step": 277359, "epoch": 3341} {"train_loss": -25.393949508666992, "global_step": 277360, "epoch": 3341} {"train_loss": -25.638416290283203, "global_step": 277361, "epoch": 3341} {"train_loss": -25.76069450378418, "global_step": 277362, "epoch": 3341} {"train_loss": -25.45833969116211, "global_step": 277363, "epoch": 3341} {"train_loss": -25.46285057067871, "global_step": 277364, "epoch": 3341} {"train_loss": -25.50733757019043, "global_step": 277365, "epoch": 3341} {"train_loss": -25.56564712524414, "global_step": 277366, "epoch": 3341} {"train_loss": -24.76712989807129, "global_step": 277367, "epoch": 3341} {"train_loss": -25.56011390686035, "global_step": 277368, "epoch": 3341} {"train_loss": -25.44035530090332, "global_step": 277369, "epoch": 3341} {"train_loss": -25.952804565429688, "global_step": 277370, "epoch": 3341} {"train_loss": -25.564762115478516, "global_step": 277371, "epoch": 3341} {"train_loss": -25.425018310546875, "global_step": 277372, "epoch": 3341} {"train_loss": -25.674976348876953, "global_step": 277373, "epoch": 3341} {"train_loss": -25.419179916381836, "global_step": 277374, "epoch": 3341} {"train_loss": -25.115495681762695, "global_step": 277375, "epoch": 3341} {"train_loss": -25.24024772644043, "global_step": 277376, "epoch": 3341} {"train_loss": -25.31190299987793, "global_step": 277377, "epoch": 3341} {"train_loss": -25.27924156188965, "global_step": 277378, "epoch": 3341} {"train_loss": -25.223907470703125, "global_step": 277379, "epoch": 3341} {"train_loss": -25.25680160522461, "global_step": 277380, "epoch": 3341} {"train_loss": -25.584291458129883, "global_step": 277381, "epoch": 3341} {"train_loss": -24.9599609375, "global_step": 277382, "epoch": 3341} {"train_loss": -25.370136260986328, "global_step": 277383, "epoch": 3341} {"train_loss": -25.570886611938477, "global_step": 277384, "epoch": 3341} {"train_loss": -25.25787158184741, "global_step": 277385, "epoch": 3341, "val_loss": 7027668.0} {"train_loss": -25.085113525390625, "global_step": 277386, "epoch": 3342} {"train_loss": -25.06180763244629, "global_step": 277387, "epoch": 3342} {"train_loss": -25.033824920654297, "global_step": 277388, "epoch": 3342} {"train_loss": -25.149744033813477, "global_step": 277389, "epoch": 3342} {"train_loss": -25.06332778930664, "global_step": 277390, "epoch": 3342} {"train_loss": -25.2034969329834, "global_step": 277391, "epoch": 3342} {"train_loss": -25.149499893188477, "global_step": 277392, "epoch": 3342} {"train_loss": -25.56893539428711, "global_step": 277393, "epoch": 3342} {"train_loss": -25.55324935913086, "global_step": 277394, "epoch": 3342} {"train_loss": -25.313282012939453, "global_step": 277395, "epoch": 3342} {"train_loss": -25.426380157470703, "global_step": 277396, "epoch": 3342} {"train_loss": -25.269229888916016, "global_step": 277397, "epoch": 3342} {"train_loss": -25.427501678466797, "global_step": 277398, "epoch": 3342} {"train_loss": -25.516504287719727, "global_step": 277399, "epoch": 3342} {"train_loss": -25.399900436401367, "global_step": 277400, "epoch": 3342} {"train_loss": -25.160261154174805, "global_step": 277401, "epoch": 3342} {"train_loss": -25.29720115661621, "global_step": 277402, "epoch": 3342} {"train_loss": -25.058490753173828, "global_step": 277403, "epoch": 3342} {"train_loss": -25.138357162475586, "global_step": 277404, "epoch": 3342} {"train_loss": -25.11666488647461, "global_step": 277405, "epoch": 3342} {"train_loss": -25.320035934448242, "global_step": 277406, "epoch": 3342} {"train_loss": -25.5360164642334, "global_step": 277407, "epoch": 3342} {"train_loss": -25.52890396118164, "global_step": 277408, "epoch": 3342} {"train_loss": -25.3200626373291, "global_step": 277409, "epoch": 3342} {"train_loss": -25.28194236755371, "global_step": 277410, "epoch": 3342} {"train_loss": -25.41350746154785, "global_step": 277411, "epoch": 3342} {"train_loss": -25.501562118530273, "global_step": 277412, "epoch": 3342} {"train_loss": -25.453968048095703, "global_step": 277413, "epoch": 3342} {"train_loss": -25.473752975463867, "global_step": 277414, "epoch": 3342} {"train_loss": -25.77471351623535, "global_step": 277415, "epoch": 3342} {"train_loss": -24.813915252685547, "global_step": 277416, "epoch": 3342} {"train_loss": -25.66615104675293, "global_step": 277417, "epoch": 3342} {"train_loss": -25.552717208862305, "global_step": 277418, "epoch": 3342} {"train_loss": -25.440677642822266, "global_step": 277419, "epoch": 3342} {"train_loss": -25.507659912109375, "global_step": 277420, "epoch": 3342} {"train_loss": -25.439321517944336, "global_step": 277421, "epoch": 3342} {"train_loss": -25.072830200195312, "global_step": 277422, "epoch": 3342} {"train_loss": -25.58319664001465, "global_step": 277423, "epoch": 3342} {"train_loss": -25.22278594970703, "global_step": 277424, "epoch": 3342} {"train_loss": -24.992156982421875, "global_step": 277425, "epoch": 3342} {"train_loss": -25.03034019470215, "global_step": 277426, "epoch": 3342} {"train_loss": -25.493810653686523, "global_step": 277427, "epoch": 3342} {"train_loss": -25.358423233032227, "global_step": 277428, "epoch": 3342} {"train_loss": -25.335330963134766, "global_step": 277429, "epoch": 3342} {"train_loss": -25.33469009399414, "global_step": 277430, "epoch": 3342} {"train_loss": -25.278182983398438, "global_step": 277431, "epoch": 3342} {"train_loss": -25.461334228515625, "global_step": 277432, "epoch": 3342} {"train_loss": -25.273832321166992, "global_step": 277433, "epoch": 3342} {"train_loss": -25.470619201660156, "global_step": 277434, "epoch": 3342} {"train_loss": -25.291589736938477, "global_step": 277435, "epoch": 3342} {"train_loss": -25.47256088256836, "global_step": 277436, "epoch": 3342} {"train_loss": -25.480247497558594, "global_step": 277437, "epoch": 3342} {"train_loss": -25.237125396728516, "global_step": 277438, "epoch": 3342} {"train_loss": -24.934185028076172, "global_step": 277439, "epoch": 3342} {"train_loss": -25.586027145385742, "global_step": 277440, "epoch": 3342} {"train_loss": -25.321582794189453, "global_step": 277441, "epoch": 3342} {"train_loss": -25.310766220092773, "global_step": 277442, "epoch": 3342} {"train_loss": -25.41943359375, "global_step": 277443, "epoch": 3342} {"train_loss": -25.325159072875977, "global_step": 277444, "epoch": 3342} {"train_loss": -25.613849639892578, "global_step": 277445, "epoch": 3342} {"train_loss": -25.296070098876953, "global_step": 277446, "epoch": 3342} {"train_loss": -25.60529899597168, "global_step": 277447, "epoch": 3342} {"train_loss": -25.617919921875, "global_step": 277448, "epoch": 3342} {"train_loss": -25.511091232299805, "global_step": 277449, "epoch": 3342} {"train_loss": -25.497333526611328, "global_step": 277450, "epoch": 3342} {"train_loss": -25.472564697265625, "global_step": 277451, "epoch": 3342} {"train_loss": -25.713226318359375, "global_step": 277452, "epoch": 3342} {"train_loss": -25.791473388671875, "global_step": 277453, "epoch": 3342} {"train_loss": -25.54660415649414, "global_step": 277454, "epoch": 3342} {"train_loss": -25.53974723815918, "global_step": 277455, "epoch": 3342} {"train_loss": -25.421152114868164, "global_step": 277456, "epoch": 3342} {"train_loss": -25.51593589782715, "global_step": 277457, "epoch": 3342} {"train_loss": -25.450307846069336, "global_step": 277458, "epoch": 3342} {"train_loss": -25.346399307250977, "global_step": 277459, "epoch": 3342} {"train_loss": -25.243310928344727, "global_step": 277460, "epoch": 3342} {"train_loss": -25.71930503845215, "global_step": 277461, "epoch": 3342} {"train_loss": -25.244884490966797, "global_step": 277462, "epoch": 3342} {"train_loss": -25.728775024414062, "global_step": 277463, "epoch": 3342} {"train_loss": -25.569162368774414, "global_step": 277464, "epoch": 3342} {"train_loss": -24.950199127197266, "global_step": 277465, "epoch": 3342} {"train_loss": -24.957569122314453, "global_step": 277466, "epoch": 3342} {"train_loss": -25.38897705078125, "global_step": 277467, "epoch": 3342} {"train_loss": -25.3713986270399, "global_step": 277468, "epoch": 3342, "val_loss": 6972346.0} {"train_loss": -24.784015655517578, "global_step": 277469, "epoch": 3343} {"train_loss": -25.119125366210938, "global_step": 277470, "epoch": 3343} {"train_loss": -24.9355411529541, "global_step": 277471, "epoch": 3343} {"train_loss": -25.28469467163086, "global_step": 277472, "epoch": 3343} {"train_loss": -25.414066314697266, "global_step": 277473, "epoch": 3343} {"train_loss": -25.49957275390625, "global_step": 277474, "epoch": 3343} {"train_loss": -25.690601348876953, "global_step": 277475, "epoch": 3343} {"train_loss": -25.707040786743164, "global_step": 277476, "epoch": 3343} {"train_loss": -25.194856643676758, "global_step": 277477, "epoch": 3343} {"train_loss": -25.37631607055664, "global_step": 277478, "epoch": 3343} {"train_loss": -25.04982566833496, "global_step": 277479, "epoch": 3343} {"train_loss": -25.627805709838867, "global_step": 277480, "epoch": 3343} {"train_loss": -25.420108795166016, "global_step": 277481, "epoch": 3343} {"train_loss": -25.176755905151367, "global_step": 277482, "epoch": 3343} {"train_loss": -25.40394401550293, "global_step": 277483, "epoch": 3343} {"train_loss": -25.17922019958496, "global_step": 277484, "epoch": 3343} {"train_loss": -24.896080017089844, "global_step": 277485, "epoch": 3343} {"train_loss": -25.445981979370117, "global_step": 277486, "epoch": 3343} {"train_loss": -25.097063064575195, "global_step": 277487, "epoch": 3343} {"train_loss": -25.4206485748291, "global_step": 277488, "epoch": 3343} {"train_loss": -25.570072174072266, "global_step": 277489, "epoch": 3343} {"train_loss": -25.13506507873535, "global_step": 277490, "epoch": 3343} {"train_loss": -25.119802474975586, "global_step": 277491, "epoch": 3343} {"train_loss": -25.55755615234375, "global_step": 277492, "epoch": 3343} {"train_loss": -25.461669921875, "global_step": 277493, "epoch": 3343} {"train_loss": -25.2196102142334, "global_step": 277494, "epoch": 3343} {"train_loss": -25.338102340698242, "global_step": 277495, "epoch": 3343} {"train_loss": -25.023481369018555, "global_step": 277496, "epoch": 3343} {"train_loss": -25.497756958007812, "global_step": 277497, "epoch": 3343} {"train_loss": -25.40675163269043, "global_step": 277498, "epoch": 3343} {"train_loss": -25.050687789916992, "global_step": 277499, "epoch": 3343} {"train_loss": -25.37287712097168, "global_step": 277500, "epoch": 3343} {"train_loss": -25.517414093017578, "global_step": 277501, "epoch": 3343} {"train_loss": -25.418127059936523, "global_step": 277502, "epoch": 3343} {"train_loss": -25.434614181518555, "global_step": 277503, "epoch": 3343} {"train_loss": -25.629011154174805, "global_step": 277504, "epoch": 3343} {"train_loss": -25.293821334838867, "global_step": 277505, "epoch": 3343} {"train_loss": -25.514179229736328, "global_step": 277506, "epoch": 3343} {"train_loss": -25.183887481689453, "global_step": 277507, "epoch": 3343} {"train_loss": -25.770727157592773, "global_step": 277508, "epoch": 3343} {"train_loss": -25.67380142211914, "global_step": 277509, "epoch": 3343} {"train_loss": -25.527368545532227, "global_step": 277510, "epoch": 3343} {"train_loss": -25.61564064025879, "global_step": 277511, "epoch": 3343} {"train_loss": -25.41359519958496, "global_step": 277512, "epoch": 3343} {"train_loss": -25.08658790588379, "global_step": 277513, "epoch": 3343} {"train_loss": -25.26820945739746, "global_step": 277514, "epoch": 3343} {"train_loss": -25.439207077026367, "global_step": 277515, "epoch": 3343} {"train_loss": -25.544897079467773, "global_step": 277516, "epoch": 3343} {"train_loss": -25.415586471557617, "global_step": 277517, "epoch": 3343} {"train_loss": -25.809528350830078, "global_step": 277518, "epoch": 3343} {"train_loss": -25.116971969604492, "global_step": 277519, "epoch": 3343} {"train_loss": -25.642126083374023, "global_step": 277520, "epoch": 3343} {"train_loss": -25.30777931213379, "global_step": 277521, "epoch": 3343} {"train_loss": -25.362836837768555, "global_step": 277522, "epoch": 3343} {"train_loss": -25.55533218383789, "global_step": 277523, "epoch": 3343} {"train_loss": -25.462491989135742, "global_step": 277524, "epoch": 3343} {"train_loss": -25.226659774780273, "global_step": 277525, "epoch": 3343} {"train_loss": -25.131364822387695, "global_step": 277526, "epoch": 3343} {"train_loss": -25.243589401245117, "global_step": 277527, "epoch": 3343} {"train_loss": -25.678503036499023, "global_step": 277528, "epoch": 3343} {"train_loss": -25.556623458862305, "global_step": 277529, "epoch": 3343} {"train_loss": -25.53034210205078, "global_step": 277530, "epoch": 3343} {"train_loss": -25.246450424194336, "global_step": 277531, "epoch": 3343} {"train_loss": -25.543590545654297, "global_step": 277532, "epoch": 3343} {"train_loss": -25.00136947631836, "global_step": 277533, "epoch": 3343} {"train_loss": -25.239896774291992, "global_step": 277534, "epoch": 3343} {"train_loss": -25.203643798828125, "global_step": 277535, "epoch": 3343} {"train_loss": -25.748992919921875, "global_step": 277536, "epoch": 3343} {"train_loss": -25.334674835205078, "global_step": 277537, "epoch": 3343} {"train_loss": -25.410818099975586, "global_step": 277538, "epoch": 3343} {"train_loss": -25.20998191833496, "global_step": 277539, "epoch": 3343} {"train_loss": -25.350080490112305, "global_step": 277540, "epoch": 3343} {"train_loss": -25.619470596313477, "global_step": 277541, "epoch": 3343} {"train_loss": -25.369348526000977, "global_step": 277542, "epoch": 3343} {"train_loss": -24.927663803100586, "global_step": 277543, "epoch": 3343} {"train_loss": -25.438907623291016, "global_step": 277544, "epoch": 3343} {"train_loss": -25.82684898376465, "global_step": 277545, "epoch": 3343} {"train_loss": -25.293277740478516, "global_step": 277546, "epoch": 3343} {"train_loss": -24.812286376953125, "global_step": 277547, "epoch": 3343} {"train_loss": -24.79309844970703, "global_step": 277548, "epoch": 3343} {"train_loss": -25.65474510192871, "global_step": 277549, "epoch": 3343} {"train_loss": -25.159679412841797, "global_step": 277550, "epoch": 3343} {"train_loss": -25.34779858876424, "global_step": 277551, "epoch": 3343, "val_loss": 7091701.0} {"train_loss": -22.357561111450195, "global_step": 277552, "epoch": 3344} {"train_loss": -24.021581649780273, "global_step": 277553, "epoch": 3344} {"train_loss": -23.72757339477539, "global_step": 277554, "epoch": 3344} {"train_loss": -23.131107330322266, "global_step": 277555, "epoch": 3344} {"train_loss": -23.826894760131836, "global_step": 277556, "epoch": 3344} {"train_loss": -23.734607696533203, "global_step": 277557, "epoch": 3344} {"train_loss": -24.059823989868164, "global_step": 277558, "epoch": 3344} {"train_loss": -23.88887596130371, "global_step": 277559, "epoch": 3344} {"train_loss": -24.313112258911133, "global_step": 277560, "epoch": 3344} {"train_loss": -23.9281063079834, "global_step": 277561, "epoch": 3344} {"train_loss": -24.37714385986328, "global_step": 277562, "epoch": 3344} {"train_loss": -24.5976619720459, "global_step": 277563, "epoch": 3344} {"train_loss": -24.52092742919922, "global_step": 277564, "epoch": 3344} {"train_loss": -24.141324996948242, "global_step": 277565, "epoch": 3344} {"train_loss": -24.355680465698242, "global_step": 277566, "epoch": 3344} {"train_loss": -24.42816162109375, "global_step": 277567, "epoch": 3344} {"train_loss": -24.74703025817871, "global_step": 277568, "epoch": 3344} {"train_loss": -24.249284744262695, "global_step": 277569, "epoch": 3344} {"train_loss": -25.133928298950195, "global_step": 277570, "epoch": 3344} {"train_loss": -24.883731842041016, "global_step": 277571, "epoch": 3344} {"train_loss": -24.820384979248047, "global_step": 277572, "epoch": 3344} {"train_loss": -24.67365074157715, "global_step": 277573, "epoch": 3344} {"train_loss": -24.606863021850586, "global_step": 277574, "epoch": 3344} {"train_loss": -24.79815673828125, "global_step": 277575, "epoch": 3344} {"train_loss": -24.884130477905273, "global_step": 277576, "epoch": 3344} {"train_loss": -24.897512435913086, "global_step": 277577, "epoch": 3344} {"train_loss": -24.81028938293457, "global_step": 277578, "epoch": 3344} {"train_loss": -25.315296173095703, "global_step": 277579, "epoch": 3344} {"train_loss": -24.814022064208984, "global_step": 277580, "epoch": 3344} {"train_loss": -25.314895629882812, "global_step": 277581, "epoch": 3344} {"train_loss": -24.667648315429688, "global_step": 277582, "epoch": 3344} {"train_loss": -25.255451202392578, "global_step": 277583, "epoch": 3344} {"train_loss": -25.2299861907959, "global_step": 277584, "epoch": 3344} {"train_loss": -25.410276412963867, "global_step": 277585, "epoch": 3344} {"train_loss": -25.536218643188477, "global_step": 277586, "epoch": 3344} {"train_loss": -25.444202423095703, "global_step": 277587, "epoch": 3344} {"train_loss": -25.402454376220703, "global_step": 277588, "epoch": 3344} {"train_loss": -25.175878524780273, "global_step": 277589, "epoch": 3344} {"train_loss": -25.24568748474121, "global_step": 277590, "epoch": 3344} {"train_loss": -25.12957191467285, "global_step": 277591, "epoch": 3344} {"train_loss": -25.12288475036621, "global_step": 277592, "epoch": 3344} {"train_loss": -25.44685935974121, "global_step": 277593, "epoch": 3344} {"train_loss": -25.330053329467773, "global_step": 277594, "epoch": 3344} {"train_loss": -25.790876388549805, "global_step": 277595, "epoch": 3344} {"train_loss": -25.560470581054688, "global_step": 277596, "epoch": 3344} {"train_loss": -25.691747665405273, "global_step": 277597, "epoch": 3344} {"train_loss": -25.377920150756836, "global_step": 277598, "epoch": 3344} {"train_loss": -25.43394660949707, "global_step": 277599, "epoch": 3344} {"train_loss": -25.312753677368164, "global_step": 277600, "epoch": 3344} {"train_loss": -25.172937393188477, "global_step": 277601, "epoch": 3344} {"train_loss": -25.492294311523438, "global_step": 277602, "epoch": 3344} {"train_loss": -25.496536254882812, "global_step": 277603, "epoch": 3344} {"train_loss": -25.37919044494629, "global_step": 277604, "epoch": 3344} {"train_loss": -25.440425872802734, "global_step": 277605, "epoch": 3344} {"train_loss": -25.683496475219727, "global_step": 277606, "epoch": 3344} {"train_loss": -25.85577392578125, "global_step": 277607, "epoch": 3344} {"train_loss": -25.334030151367188, "global_step": 277608, "epoch": 3344} {"train_loss": -25.529756546020508, "global_step": 277609, "epoch": 3344} {"train_loss": -25.4107666015625, "global_step": 277610, "epoch": 3344} {"train_loss": -25.468618392944336, "global_step": 277611, "epoch": 3344} {"train_loss": -25.93263816833496, "global_step": 277612, "epoch": 3344} {"train_loss": -25.212783813476562, "global_step": 277613, "epoch": 3344} {"train_loss": -25.148662567138672, "global_step": 277614, "epoch": 3344} {"train_loss": -25.210298538208008, "global_step": 277615, "epoch": 3344} {"train_loss": -25.111461639404297, "global_step": 277616, "epoch": 3344} {"train_loss": -25.2553768157959, "global_step": 277617, "epoch": 3344} {"train_loss": -25.630041122436523, "global_step": 277618, "epoch": 3344} {"train_loss": -25.464223861694336, "global_step": 277619, "epoch": 3344} {"train_loss": -25.23090362548828, "global_step": 277620, "epoch": 3344} {"train_loss": -25.08506202697754, "global_step": 277621, "epoch": 3344} {"train_loss": -25.47415542602539, "global_step": 277622, "epoch": 3344} {"train_loss": -25.5772762298584, "global_step": 277623, "epoch": 3344} {"train_loss": -25.444995880126953, "global_step": 277624, "epoch": 3344} {"train_loss": -25.23602867126465, "global_step": 277625, "epoch": 3344} {"train_loss": -25.283788681030273, "global_step": 277626, "epoch": 3344} {"train_loss": -25.407888412475586, "global_step": 277627, "epoch": 3344} {"train_loss": -25.191068649291992, "global_step": 277628, "epoch": 3344} {"train_loss": -25.492216110229492, "global_step": 277629, "epoch": 3344} {"train_loss": -25.018539428710938, "global_step": 277630, "epoch": 3344} {"train_loss": -24.812875747680664, "global_step": 277631, "epoch": 3344} {"train_loss": -25.3819637298584, "global_step": 277632, "epoch": 3344} {"train_loss": -25.062423706054688, "global_step": 277633, "epoch": 3344} {"train_loss": -25.01215424595109, "global_step": 277634, "epoch": 3344, "val_loss": 7009327.0} {"train_loss": -24.69085121154785, "global_step": 277635, "epoch": 3345} {"train_loss": -24.654111862182617, "global_step": 277636, "epoch": 3345} {"train_loss": -24.900999069213867, "global_step": 277637, "epoch": 3345} {"train_loss": -25.058778762817383, "global_step": 277638, "epoch": 3345} {"train_loss": -25.22174644470215, "global_step": 277639, "epoch": 3345} {"train_loss": -24.55183982849121, "global_step": 277640, "epoch": 3345} {"train_loss": -25.065919876098633, "global_step": 277641, "epoch": 3345} {"train_loss": -25.090768814086914, "global_step": 277642, "epoch": 3345} {"train_loss": -24.78407859802246, "global_step": 277643, "epoch": 3345} {"train_loss": -25.160490036010742, "global_step": 277644, "epoch": 3345} {"train_loss": -25.102142333984375, "global_step": 277645, "epoch": 3345} {"train_loss": -25.257171630859375, "global_step": 277646, "epoch": 3345} {"train_loss": -24.861133575439453, "global_step": 277647, "epoch": 3345} {"train_loss": -24.7959041595459, "global_step": 277648, "epoch": 3345} {"train_loss": -25.329788208007812, "global_step": 277649, "epoch": 3345} {"train_loss": -24.810237884521484, "global_step": 277650, "epoch": 3345} {"train_loss": -25.13456153869629, "global_step": 277651, "epoch": 3345} {"train_loss": -25.25922966003418, "global_step": 277652, "epoch": 3345} {"train_loss": -24.907297134399414, "global_step": 277653, "epoch": 3345} {"train_loss": -25.158676147460938, "global_step": 277654, "epoch": 3345} {"train_loss": -25.321826934814453, "global_step": 277655, "epoch": 3345} {"train_loss": -25.098438262939453, "global_step": 277656, "epoch": 3345} {"train_loss": -25.0025634765625, "global_step": 277657, "epoch": 3345} {"train_loss": -25.09999656677246, "global_step": 277658, "epoch": 3345} {"train_loss": -24.941429138183594, "global_step": 277659, "epoch": 3345} {"train_loss": -25.679412841796875, "global_step": 277660, "epoch": 3345} {"train_loss": -25.300445556640625, "global_step": 277661, "epoch": 3345} {"train_loss": -25.013273239135742, "global_step": 277662, "epoch": 3345} {"train_loss": -25.614892959594727, "global_step": 277663, "epoch": 3345} {"train_loss": -25.55206298828125, "global_step": 277664, "epoch": 3345} {"train_loss": -24.86690902709961, "global_step": 277665, "epoch": 3345} {"train_loss": -25.21217918395996, "global_step": 277666, "epoch": 3345} {"train_loss": -25.020097732543945, "global_step": 277667, "epoch": 3345} {"train_loss": -25.453794479370117, "global_step": 277668, "epoch": 3345} {"train_loss": -25.38185691833496, "global_step": 277669, "epoch": 3345} {"train_loss": -25.232179641723633, "global_step": 277670, "epoch": 3345} {"train_loss": -25.252685546875, "global_step": 277671, "epoch": 3345} {"train_loss": -25.483440399169922, "global_step": 277672, "epoch": 3345} {"train_loss": -25.764692306518555, "global_step": 277673, "epoch": 3345} {"train_loss": -25.785400390625, "global_step": 277674, "epoch": 3345} {"train_loss": -25.62772560119629, "global_step": 277675, "epoch": 3345} {"train_loss": -25.12550926208496, "global_step": 277676, "epoch": 3345} {"train_loss": -25.400707244873047, "global_step": 277677, "epoch": 3345} {"train_loss": -25.152606964111328, "global_step": 277678, "epoch": 3345} {"train_loss": -25.608428955078125, "global_step": 277679, "epoch": 3345} {"train_loss": -25.64912223815918, "global_step": 277680, "epoch": 3345} {"train_loss": -25.55143165588379, "global_step": 277681, "epoch": 3345} {"train_loss": -25.841232299804688, "global_step": 277682, "epoch": 3345} {"train_loss": -25.234567642211914, "global_step": 277683, "epoch": 3345} {"train_loss": -25.351654052734375, "global_step": 277684, "epoch": 3345} {"train_loss": -25.351980209350586, "global_step": 277685, "epoch": 3345} {"train_loss": -25.53799057006836, "global_step": 277686, "epoch": 3345} {"train_loss": -25.480985641479492, "global_step": 277687, "epoch": 3345} {"train_loss": -25.36256217956543, "global_step": 277688, "epoch": 3345} {"train_loss": -25.411977767944336, "global_step": 277689, "epoch": 3345} {"train_loss": -25.590423583984375, "global_step": 277690, "epoch": 3345} {"train_loss": -25.203046798706055, "global_step": 277691, "epoch": 3345} {"train_loss": -25.281740188598633, "global_step": 277692, "epoch": 3345} {"train_loss": -25.843637466430664, "global_step": 277693, "epoch": 3345} {"train_loss": -25.57504653930664, "global_step": 277694, "epoch": 3345} {"train_loss": -25.5076904296875, "global_step": 277695, "epoch": 3345} {"train_loss": -25.20038604736328, "global_step": 277696, "epoch": 3345} {"train_loss": -25.400100708007812, "global_step": 277697, "epoch": 3345} {"train_loss": -25.175283432006836, "global_step": 277698, "epoch": 3345} {"train_loss": -25.40614891052246, "global_step": 277699, "epoch": 3345} {"train_loss": -24.900476455688477, "global_step": 277700, "epoch": 3345} {"train_loss": -24.09474754333496, "global_step": 277701, "epoch": 3345} {"train_loss": -23.279239654541016, "global_step": 277702, "epoch": 3345} {"train_loss": -24.54902458190918, "global_step": 277703, "epoch": 3345} {"train_loss": -25.493732452392578, "global_step": 277704, "epoch": 3345} {"train_loss": -24.722728729248047, "global_step": 277705, "epoch": 3345} {"train_loss": -25.113676071166992, "global_step": 277706, "epoch": 3345} {"train_loss": -24.819211959838867, "global_step": 277707, "epoch": 3345} {"train_loss": -25.088380813598633, "global_step": 277708, "epoch": 3345} {"train_loss": -25.47101402282715, "global_step": 277709, "epoch": 3345} {"train_loss": -24.978979110717773, "global_step": 277710, "epoch": 3345} {"train_loss": -24.9810848236084, "global_step": 277711, "epoch": 3345} {"train_loss": -25.2434139251709, "global_step": 277712, "epoch": 3345} {"train_loss": -25.297100067138672, "global_step": 277713, "epoch": 3345} {"train_loss": -24.9847469329834, "global_step": 277714, "epoch": 3345} {"train_loss": -25.274707794189453, "global_step": 277715, "epoch": 3345} {"train_loss": -25.05161476135254, "global_step": 277716, "epoch": 3345} {"train_loss": -25.185755764145448, "global_step": 277717, "epoch": 3345, "val_loss": 7045983.0} {"train_loss": -24.970500946044922, "global_step": 277718, "epoch": 3346} {"train_loss": -25.108366012573242, "global_step": 277719, "epoch": 3346} {"train_loss": -24.873014450073242, "global_step": 277720, "epoch": 3346} {"train_loss": -25.10003662109375, "global_step": 277721, "epoch": 3346} {"train_loss": -25.118993759155273, "global_step": 277722, "epoch": 3346} {"train_loss": -25.44637107849121, "global_step": 277723, "epoch": 3346} {"train_loss": -25.0684871673584, "global_step": 277724, "epoch": 3346} {"train_loss": -25.25821876525879, "global_step": 277725, "epoch": 3346} {"train_loss": -25.165647506713867, "global_step": 277726, "epoch": 3346} {"train_loss": -25.279037475585938, "global_step": 277727, "epoch": 3346} {"train_loss": -25.481565475463867, "global_step": 277728, "epoch": 3346} {"train_loss": -24.75225830078125, "global_step": 277729, "epoch": 3346} {"train_loss": -25.38299560546875, "global_step": 277730, "epoch": 3346} {"train_loss": -25.20438575744629, "global_step": 277731, "epoch": 3346} {"train_loss": -25.157968521118164, "global_step": 277732, "epoch": 3346} {"train_loss": -25.563833236694336, "global_step": 277733, "epoch": 3346} {"train_loss": -25.38752555847168, "global_step": 277734, "epoch": 3346} {"train_loss": -25.208280563354492, "global_step": 277735, "epoch": 3346} {"train_loss": -25.232139587402344, "global_step": 277736, "epoch": 3346} {"train_loss": -25.47028160095215, "global_step": 277737, "epoch": 3346} {"train_loss": -25.642364501953125, "global_step": 277738, "epoch": 3346} {"train_loss": -25.380142211914062, "global_step": 277739, "epoch": 3346} {"train_loss": -25.410634994506836, "global_step": 277740, "epoch": 3346} {"train_loss": -25.352092742919922, "global_step": 277741, "epoch": 3346} {"train_loss": -25.42023277282715, "global_step": 277742, "epoch": 3346} {"train_loss": -25.25096321105957, "global_step": 277743, "epoch": 3346} {"train_loss": -25.62983512878418, "global_step": 277744, "epoch": 3346} {"train_loss": -25.70818519592285, "global_step": 277745, "epoch": 3346} {"train_loss": -25.384387969970703, "global_step": 277746, "epoch": 3346} {"train_loss": -25.613489151000977, "global_step": 277747, "epoch": 3346} {"train_loss": -25.551313400268555, "global_step": 277748, "epoch": 3346} {"train_loss": -25.528125762939453, "global_step": 277749, "epoch": 3346} {"train_loss": -25.460403442382812, "global_step": 277750, "epoch": 3346} {"train_loss": -25.52579689025879, "global_step": 277751, "epoch": 3346} {"train_loss": -25.397035598754883, "global_step": 277752, "epoch": 3346} {"train_loss": -25.381153106689453, "global_step": 277753, "epoch": 3346} {"train_loss": -25.307432174682617, "global_step": 277754, "epoch": 3346} {"train_loss": -25.703033447265625, "global_step": 277755, "epoch": 3346} {"train_loss": -25.53755760192871, "global_step": 277756, "epoch": 3346} {"train_loss": -25.339223861694336, "global_step": 277757, "epoch": 3346} {"train_loss": -25.489286422729492, "global_step": 277758, "epoch": 3346} {"train_loss": -25.634241104125977, "global_step": 277759, "epoch": 3346} {"train_loss": -25.593908309936523, "global_step": 277760, "epoch": 3346} {"train_loss": -25.43056297302246, "global_step": 277761, "epoch": 3346} {"train_loss": -25.280895233154297, "global_step": 277762, "epoch": 3346} {"train_loss": -25.38280487060547, "global_step": 277763, "epoch": 3346} {"train_loss": -25.462087631225586, "global_step": 277764, "epoch": 3346} {"train_loss": -25.246381759643555, "global_step": 277765, "epoch": 3346} {"train_loss": -25.561174392700195, "global_step": 277766, "epoch": 3346} {"train_loss": -25.40854263305664, "global_step": 277767, "epoch": 3346} {"train_loss": -25.05312156677246, "global_step": 277768, "epoch": 3346} {"train_loss": -25.18086051940918, "global_step": 277769, "epoch": 3346} {"train_loss": -25.53412437438965, "global_step": 277770, "epoch": 3346} {"train_loss": -25.29210090637207, "global_step": 277771, "epoch": 3346} {"train_loss": -25.3739013671875, "global_step": 277772, "epoch": 3346} {"train_loss": -25.75408363342285, "global_step": 277773, "epoch": 3346} {"train_loss": -25.27872085571289, "global_step": 277774, "epoch": 3346} {"train_loss": -25.31849479675293, "global_step": 277775, "epoch": 3346} {"train_loss": -25.34254264831543, "global_step": 277776, "epoch": 3346} {"train_loss": -24.938833236694336, "global_step": 277777, "epoch": 3346} {"train_loss": -25.10578155517578, "global_step": 277778, "epoch": 3346} {"train_loss": -25.41615104675293, "global_step": 277779, "epoch": 3346} {"train_loss": -25.33954429626465, "global_step": 277780, "epoch": 3346} {"train_loss": -25.04026985168457, "global_step": 277781, "epoch": 3346} {"train_loss": -25.35710334777832, "global_step": 277782, "epoch": 3346} {"train_loss": -25.03013038635254, "global_step": 277783, "epoch": 3346} {"train_loss": -24.909635543823242, "global_step": 277784, "epoch": 3346} {"train_loss": -25.493633270263672, "global_step": 277785, "epoch": 3346} {"train_loss": -25.672178268432617, "global_step": 277786, "epoch": 3346} {"train_loss": -24.738698959350586, "global_step": 277787, "epoch": 3346} {"train_loss": -25.0390567779541, "global_step": 277788, "epoch": 3346} {"train_loss": -25.008535385131836, "global_step": 277789, "epoch": 3346} {"train_loss": -24.959434509277344, "global_step": 277790, "epoch": 3346} {"train_loss": -25.21403694152832, "global_step": 277791, "epoch": 3346} {"train_loss": -24.963895797729492, "global_step": 277792, "epoch": 3346} {"train_loss": -25.26698875427246, "global_step": 277793, "epoch": 3346} {"train_loss": -24.75618553161621, "global_step": 277794, "epoch": 3346} {"train_loss": -25.40186882019043, "global_step": 277795, "epoch": 3346} {"train_loss": -25.50325584411621, "global_step": 277796, "epoch": 3346} {"train_loss": -25.127614974975586, "global_step": 277797, "epoch": 3346} {"train_loss": -25.208768844604492, "global_step": 277798, "epoch": 3346} {"train_loss": -25.324573516845703, "global_step": 277799, "epoch": 3346} {"train_loss": -25.317615646913826, "global_step": 277800, "epoch": 3346, "val_loss": 6911021.5} {"train_loss": -24.964216232299805, "global_step": 277801, "epoch": 3347} {"train_loss": -25.023693084716797, "global_step": 277802, "epoch": 3347} {"train_loss": -25.16839027404785, "global_step": 277803, "epoch": 3347} {"train_loss": -24.861679077148438, "global_step": 277804, "epoch": 3347} {"train_loss": -25.043907165527344, "global_step": 277805, "epoch": 3347} {"train_loss": -24.914321899414062, "global_step": 277806, "epoch": 3347} {"train_loss": -25.352197647094727, "global_step": 277807, "epoch": 3347} {"train_loss": -25.07822608947754, "global_step": 277808, "epoch": 3347} {"train_loss": -25.108564376831055, "global_step": 277809, "epoch": 3347} {"train_loss": -25.178842544555664, "global_step": 277810, "epoch": 3347} {"train_loss": -25.285154342651367, "global_step": 277811, "epoch": 3347} {"train_loss": -24.982707977294922, "global_step": 277812, "epoch": 3347} {"train_loss": -25.22042465209961, "global_step": 277813, "epoch": 3347} {"train_loss": -25.52216911315918, "global_step": 277814, "epoch": 3347} {"train_loss": -25.261154174804688, "global_step": 277815, "epoch": 3347} {"train_loss": -25.2252140045166, "global_step": 277816, "epoch": 3347} {"train_loss": -24.96872901916504, "global_step": 277817, "epoch": 3347} {"train_loss": -25.232074737548828, "global_step": 277818, "epoch": 3347} {"train_loss": -24.932554244995117, "global_step": 277819, "epoch": 3347} {"train_loss": -25.134769439697266, "global_step": 277820, "epoch": 3347} {"train_loss": -25.467422485351562, "global_step": 277821, "epoch": 3347} {"train_loss": -25.220815658569336, "global_step": 277822, "epoch": 3347} {"train_loss": -25.345884323120117, "global_step": 277823, "epoch": 3347} {"train_loss": -25.25982093811035, "global_step": 277824, "epoch": 3347} {"train_loss": -25.394723892211914, "global_step": 277825, "epoch": 3347} {"train_loss": -25.384748458862305, "global_step": 277826, "epoch": 3347} {"train_loss": -25.6170654296875, "global_step": 277827, "epoch": 3347} {"train_loss": -25.474454879760742, "global_step": 277828, "epoch": 3347} {"train_loss": -25.140600204467773, "global_step": 277829, "epoch": 3347} {"train_loss": -25.0618839263916, "global_step": 277830, "epoch": 3347} {"train_loss": -25.487043380737305, "global_step": 277831, "epoch": 3347} {"train_loss": -25.608036041259766, "global_step": 277832, "epoch": 3347} {"train_loss": -25.510944366455078, "global_step": 277833, "epoch": 3347} {"train_loss": -25.861499786376953, "global_step": 277834, "epoch": 3347} {"train_loss": -25.763227462768555, "global_step": 277835, "epoch": 3347} {"train_loss": -25.333240509033203, "global_step": 277836, "epoch": 3347} {"train_loss": -25.66754150390625, "global_step": 277837, "epoch": 3347} {"train_loss": -25.486486434936523, "global_step": 277838, "epoch": 3347} {"train_loss": -25.258420944213867, "global_step": 277839, "epoch": 3347} {"train_loss": -25.502683639526367, "global_step": 277840, "epoch": 3347} {"train_loss": -25.406314849853516, "global_step": 277841, "epoch": 3347} {"train_loss": -25.150711059570312, "global_step": 277842, "epoch": 3347} {"train_loss": -25.316280364990234, "global_step": 277843, "epoch": 3347} {"train_loss": -25.806293487548828, "global_step": 277844, "epoch": 3347} {"train_loss": -25.848474502563477, "global_step": 277845, "epoch": 3347} {"train_loss": -25.5393009185791, "global_step": 277846, "epoch": 3347} {"train_loss": -25.509021759033203, "global_step": 277847, "epoch": 3347} {"train_loss": -25.886327743530273, "global_step": 277848, "epoch": 3347} {"train_loss": -25.258604049682617, "global_step": 277849, "epoch": 3347} {"train_loss": -25.665128707885742, "global_step": 277850, "epoch": 3347} {"train_loss": -25.478092193603516, "global_step": 277851, "epoch": 3347} {"train_loss": -25.50395393371582, "global_step": 277852, "epoch": 3347} {"train_loss": -25.256370544433594, "global_step": 277853, "epoch": 3347} {"train_loss": -25.221954345703125, "global_step": 277854, "epoch": 3347} {"train_loss": -25.4398136138916, "global_step": 277855, "epoch": 3347} {"train_loss": -25.739805221557617, "global_step": 277856, "epoch": 3347} {"train_loss": -25.10455322265625, "global_step": 277857, "epoch": 3347} {"train_loss": -25.515865325927734, "global_step": 277858, "epoch": 3347} {"train_loss": -25.268896102905273, "global_step": 277859, "epoch": 3347} {"train_loss": -25.113815307617188, "global_step": 277860, "epoch": 3347} {"train_loss": -25.402746200561523, "global_step": 277861, "epoch": 3347} {"train_loss": -25.59662628173828, "global_step": 277862, "epoch": 3347} {"train_loss": -25.334857940673828, "global_step": 277863, "epoch": 3347} {"train_loss": -25.693588256835938, "global_step": 277864, "epoch": 3347} {"train_loss": -25.5423641204834, "global_step": 277865, "epoch": 3347} {"train_loss": -25.685781478881836, "global_step": 277866, "epoch": 3347} {"train_loss": -25.421585083007812, "global_step": 277867, "epoch": 3347} {"train_loss": -25.2257022857666, "global_step": 277868, "epoch": 3347} {"train_loss": -25.673898696899414, "global_step": 277869, "epoch": 3347} {"train_loss": -25.26460838317871, "global_step": 277870, "epoch": 3347} {"train_loss": -25.5041446685791, "global_step": 277871, "epoch": 3347} {"train_loss": -25.93644142150879, "global_step": 277872, "epoch": 3347} {"train_loss": -25.633935928344727, "global_step": 277873, "epoch": 3347} {"train_loss": -25.503747940063477, "global_step": 277874, "epoch": 3347} {"train_loss": -25.940893173217773, "global_step": 277875, "epoch": 3347} {"train_loss": -25.33087730407715, "global_step": 277876, "epoch": 3347} {"train_loss": -25.551055908203125, "global_step": 277877, "epoch": 3347} {"train_loss": -25.435413360595703, "global_step": 277878, "epoch": 3347} {"train_loss": -25.438135147094727, "global_step": 277879, "epoch": 3347} {"train_loss": -25.510587692260742, "global_step": 277880, "epoch": 3347} {"train_loss": -25.103151321411133, "global_step": 277881, "epoch": 3347} {"train_loss": -25.215116500854492, "global_step": 277882, "epoch": 3347} {"train_loss": -25.383640220366328, "global_step": 277883, "epoch": 3347, "val_loss": 6979326.0} {"train_loss": -24.728879928588867, "global_step": 277884, "epoch": 3348} {"train_loss": -24.89208221435547, "global_step": 277885, "epoch": 3348} {"train_loss": -25.033905029296875, "global_step": 277886, "epoch": 3348} {"train_loss": -24.891599655151367, "global_step": 277887, "epoch": 3348} {"train_loss": -25.121191024780273, "global_step": 277888, "epoch": 3348} {"train_loss": -25.1323299407959, "global_step": 277889, "epoch": 3348} {"train_loss": -24.9881591796875, "global_step": 277890, "epoch": 3348} {"train_loss": -25.133934020996094, "global_step": 277891, "epoch": 3348} {"train_loss": -25.180957794189453, "global_step": 277892, "epoch": 3348} {"train_loss": -25.46765899658203, "global_step": 277893, "epoch": 3348} {"train_loss": -25.017356872558594, "global_step": 277894, "epoch": 3348} {"train_loss": -24.62396240234375, "global_step": 277895, "epoch": 3348} {"train_loss": -25.267263412475586, "global_step": 277896, "epoch": 3348} {"train_loss": -25.081581115722656, "global_step": 277897, "epoch": 3348} {"train_loss": -25.400270462036133, "global_step": 277898, "epoch": 3348} {"train_loss": -24.862180709838867, "global_step": 277899, "epoch": 3348} {"train_loss": -25.158496856689453, "global_step": 277900, "epoch": 3348} {"train_loss": -25.041736602783203, "global_step": 277901, "epoch": 3348} {"train_loss": -25.4808292388916, "global_step": 277902, "epoch": 3348} {"train_loss": -25.6489315032959, "global_step": 277903, "epoch": 3348} {"train_loss": -25.121475219726562, "global_step": 277904, "epoch": 3348} {"train_loss": -25.14522361755371, "global_step": 277905, "epoch": 3348} {"train_loss": -25.15227508544922, "global_step": 277906, "epoch": 3348} {"train_loss": -25.132915496826172, "global_step": 277907, "epoch": 3348} {"train_loss": -25.08186912536621, "global_step": 277908, "epoch": 3348} {"train_loss": -25.5297794342041, "global_step": 277909, "epoch": 3348} {"train_loss": -25.28365135192871, "global_step": 277910, "epoch": 3348} {"train_loss": -25.154356002807617, "global_step": 277911, "epoch": 3348} {"train_loss": -25.631200790405273, "global_step": 277912, "epoch": 3348} {"train_loss": -25.47987174987793, "global_step": 277913, "epoch": 3348} {"train_loss": -25.553720474243164, "global_step": 277914, "epoch": 3348} {"train_loss": -25.144079208374023, "global_step": 277915, "epoch": 3348} {"train_loss": -25.682153701782227, "global_step": 277916, "epoch": 3348} {"train_loss": -25.630651473999023, "global_step": 277917, "epoch": 3348} {"train_loss": -25.3350830078125, "global_step": 277918, "epoch": 3348} {"train_loss": -25.527509689331055, "global_step": 277919, "epoch": 3348} {"train_loss": -25.370046615600586, "global_step": 277920, "epoch": 3348} {"train_loss": -25.46971893310547, "global_step": 277921, "epoch": 3348} {"train_loss": -25.158063888549805, "global_step": 277922, "epoch": 3348} {"train_loss": -25.499282836914062, "global_step": 277923, "epoch": 3348} {"train_loss": -25.63037109375, "global_step": 277924, "epoch": 3348} {"train_loss": -25.453296661376953, "global_step": 277925, "epoch": 3348} {"train_loss": -25.38558006286621, "global_step": 277926, "epoch": 3348} {"train_loss": -25.42641258239746, "global_step": 277927, "epoch": 3348} {"train_loss": -25.47308921813965, "global_step": 277928, "epoch": 3348} {"train_loss": -25.713842391967773, "global_step": 277929, "epoch": 3348} {"train_loss": -25.4721736907959, "global_step": 277930, "epoch": 3348} {"train_loss": -25.279376983642578, "global_step": 277931, "epoch": 3348} {"train_loss": -25.3482723236084, "global_step": 277932, "epoch": 3348} {"train_loss": -25.455581665039062, "global_step": 277933, "epoch": 3348} {"train_loss": -25.619470596313477, "global_step": 277934, "epoch": 3348} {"train_loss": -25.251951217651367, "global_step": 277935, "epoch": 3348} {"train_loss": -25.35685157775879, "global_step": 277936, "epoch": 3348} {"train_loss": -25.279836654663086, "global_step": 277937, "epoch": 3348} {"train_loss": -25.366180419921875, "global_step": 277938, "epoch": 3348} {"train_loss": -25.512815475463867, "global_step": 277939, "epoch": 3348} {"train_loss": -25.1304874420166, "global_step": 277940, "epoch": 3348} {"train_loss": -25.1643009185791, "global_step": 277941, "epoch": 3348} {"train_loss": -25.368183135986328, "global_step": 277942, "epoch": 3348} {"train_loss": -25.478483200073242, "global_step": 277943, "epoch": 3348} {"train_loss": -25.10605812072754, "global_step": 277944, "epoch": 3348} {"train_loss": -25.359413146972656, "global_step": 277945, "epoch": 3348} {"train_loss": -25.770009994506836, "global_step": 277946, "epoch": 3348} {"train_loss": -25.747314453125, "global_step": 277947, "epoch": 3348} {"train_loss": -25.474647521972656, "global_step": 277948, "epoch": 3348} {"train_loss": -25.40816307067871, "global_step": 277949, "epoch": 3348} {"train_loss": -25.357868194580078, "global_step": 277950, "epoch": 3348} {"train_loss": -25.578428268432617, "global_step": 277951, "epoch": 3348} {"train_loss": -25.51283836364746, "global_step": 277952, "epoch": 3348} {"train_loss": -25.474355697631836, "global_step": 277953, "epoch": 3348} {"train_loss": -25.61053466796875, "global_step": 277954, "epoch": 3348} {"train_loss": -25.1662654876709, "global_step": 277955, "epoch": 3348} {"train_loss": -25.214330673217773, "global_step": 277956, "epoch": 3348} {"train_loss": -25.592580795288086, "global_step": 277957, "epoch": 3348} {"train_loss": -25.242429733276367, "global_step": 277958, "epoch": 3348} {"train_loss": -25.192113876342773, "global_step": 277959, "epoch": 3348} {"train_loss": -25.664682388305664, "global_step": 277960, "epoch": 3348} {"train_loss": -25.27202033996582, "global_step": 277961, "epoch": 3348} {"train_loss": -25.472496032714844, "global_step": 277962, "epoch": 3348} {"train_loss": -25.299610137939453, "global_step": 277963, "epoch": 3348} {"train_loss": -25.455352783203125, "global_step": 277964, "epoch": 3348} {"train_loss": -25.29802131652832, "global_step": 277965, "epoch": 3348} {"train_loss": -25.34703757963985, "global_step": 277966, "epoch": 3348, "val_loss": 6890705.0} {"train_loss": -24.453712463378906, "global_step": 277967, "epoch": 3349} {"train_loss": -23.425861358642578, "global_step": 277968, "epoch": 3349} {"train_loss": -23.230045318603516, "global_step": 277969, "epoch": 3349} {"train_loss": -24.268041610717773, "global_step": 277970, "epoch": 3349} {"train_loss": -23.827327728271484, "global_step": 277971, "epoch": 3349} {"train_loss": -24.68529510498047, "global_step": 277972, "epoch": 3349} {"train_loss": -23.830717086791992, "global_step": 277973, "epoch": 3349} {"train_loss": -24.69649314880371, "global_step": 277974, "epoch": 3349} {"train_loss": -23.76987648010254, "global_step": 277975, "epoch": 3349} {"train_loss": -25.059326171875, "global_step": 277976, "epoch": 3349} {"train_loss": -24.401721954345703, "global_step": 277977, "epoch": 3349} {"train_loss": -24.751779556274414, "global_step": 277978, "epoch": 3349} {"train_loss": -24.60312843322754, "global_step": 277979, "epoch": 3349} {"train_loss": -24.671096801757812, "global_step": 277980, "epoch": 3349} {"train_loss": -24.641864776611328, "global_step": 277981, "epoch": 3349} {"train_loss": -25.006195068359375, "global_step": 277982, "epoch": 3349} {"train_loss": -24.478300094604492, "global_step": 277983, "epoch": 3349} {"train_loss": -24.940610885620117, "global_step": 277984, "epoch": 3349} {"train_loss": -24.750598907470703, "global_step": 277985, "epoch": 3349} {"train_loss": -24.69135093688965, "global_step": 277986, "epoch": 3349} {"train_loss": -24.688613891601562, "global_step": 277987, "epoch": 3349} {"train_loss": -25.115467071533203, "global_step": 277988, "epoch": 3349} {"train_loss": -25.31524658203125, "global_step": 277989, "epoch": 3349} {"train_loss": -24.776832580566406, "global_step": 277990, "epoch": 3349} {"train_loss": -25.00603675842285, "global_step": 277991, "epoch": 3349} {"train_loss": -25.213830947875977, "global_step": 277992, "epoch": 3349} {"train_loss": -25.281644821166992, "global_step": 277993, "epoch": 3349} {"train_loss": -24.71842384338379, "global_step": 277994, "epoch": 3349} {"train_loss": -25.1927433013916, "global_step": 277995, "epoch": 3349} {"train_loss": -25.102123260498047, "global_step": 277996, "epoch": 3349} {"train_loss": -25.404043197631836, "global_step": 277997, "epoch": 3349} {"train_loss": -25.09149742126465, "global_step": 277998, "epoch": 3349} {"train_loss": -25.13067626953125, "global_step": 277999, "epoch": 3349} {"train_loss": -25.295209884643555, "global_step": 278000, "epoch": 3349} {"train_loss": -24.834186553955078, "global_step": 278001, "epoch": 3349} {"train_loss": -25.380945205688477, "global_step": 278002, "epoch": 3349} {"train_loss": -25.221220016479492, "global_step": 278003, "epoch": 3349} {"train_loss": -25.373981475830078, "global_step": 278004, "epoch": 3349} {"train_loss": -24.99559211730957, "global_step": 278005, "epoch": 3349} {"train_loss": -25.315780639648438, "global_step": 278006, "epoch": 3349} {"train_loss": -24.997604370117188, "global_step": 278007, "epoch": 3349} {"train_loss": -25.268720626831055, "global_step": 278008, "epoch": 3349} {"train_loss": -25.52549934387207, "global_step": 278009, "epoch": 3349} {"train_loss": -25.411653518676758, "global_step": 278010, "epoch": 3349} {"train_loss": -25.3463191986084, "global_step": 278011, "epoch": 3349} {"train_loss": -25.62739372253418, "global_step": 278012, "epoch": 3349} {"train_loss": -25.530012130737305, "global_step": 278013, "epoch": 3349} {"train_loss": -25.475610733032227, "global_step": 278014, "epoch": 3349} {"train_loss": -25.021459579467773, "global_step": 278015, "epoch": 3349} {"train_loss": -25.448102951049805, "global_step": 278016, "epoch": 3349} {"train_loss": -25.996973037719727, "global_step": 278017, "epoch": 3349} {"train_loss": -25.448392868041992, "global_step": 278018, "epoch": 3349} {"train_loss": -25.343250274658203, "global_step": 278019, "epoch": 3349} {"train_loss": -25.31939697265625, "global_step": 278020, "epoch": 3349} {"train_loss": -25.426725387573242, "global_step": 278021, "epoch": 3349} {"train_loss": -25.31336784362793, "global_step": 278022, "epoch": 3349} {"train_loss": -25.22535514831543, "global_step": 278023, "epoch": 3349} {"train_loss": -25.36125373840332, "global_step": 278024, "epoch": 3349} {"train_loss": -25.14003562927246, "global_step": 278025, "epoch": 3349} {"train_loss": -25.478225708007812, "global_step": 278026, "epoch": 3349} {"train_loss": -25.29885482788086, "global_step": 278027, "epoch": 3349} {"train_loss": -25.66328239440918, "global_step": 278028, "epoch": 3349} {"train_loss": -25.50340461730957, "global_step": 278029, "epoch": 3349} {"train_loss": -25.170164108276367, "global_step": 278030, "epoch": 3349} {"train_loss": -25.64023780822754, "global_step": 278031, "epoch": 3349} {"train_loss": -25.331480026245117, "global_step": 278032, "epoch": 3349} {"train_loss": -25.197525024414062, "global_step": 278033, "epoch": 3349} {"train_loss": -25.30592918395996, "global_step": 278034, "epoch": 3349} {"train_loss": -25.271854400634766, "global_step": 278035, "epoch": 3349} {"train_loss": -25.739078521728516, "global_step": 278036, "epoch": 3349} {"train_loss": -25.44647789001465, "global_step": 278037, "epoch": 3349} {"train_loss": -25.437646865844727, "global_step": 278038, "epoch": 3349} {"train_loss": -25.47657585144043, "global_step": 278039, "epoch": 3349} {"train_loss": -25.441537857055664, "global_step": 278040, "epoch": 3349} {"train_loss": -25.3598575592041, "global_step": 278041, "epoch": 3349} {"train_loss": -25.8192081451416, "global_step": 278042, "epoch": 3349} {"train_loss": -25.25447654724121, "global_step": 278043, "epoch": 3349} {"train_loss": -25.637495040893555, "global_step": 278044, "epoch": 3349} {"train_loss": -25.083324432373047, "global_step": 278045, "epoch": 3349} {"train_loss": -25.558462142944336, "global_step": 278046, "epoch": 3349} {"train_loss": -25.150300979614258, "global_step": 278047, "epoch": 3349} {"train_loss": -25.470813751220703, "global_step": 278048, "epoch": 3349} {"train_loss": -25.095910497458583, "global_step": 278049, "epoch": 3349, "val_loss": 7009609.5} {"train_loss": -24.9942684173584, "global_step": 278050, "epoch": 3350} {"train_loss": -24.812271118164062, "global_step": 278051, "epoch": 3350} {"train_loss": -24.39923095703125, "global_step": 278052, "epoch": 3350} {"train_loss": -24.93345069885254, "global_step": 278053, "epoch": 3350} {"train_loss": -24.945791244506836, "global_step": 278054, "epoch": 3350} {"train_loss": -24.787389755249023, "global_step": 278055, "epoch": 3350} {"train_loss": -25.12270164489746, "global_step": 278056, "epoch": 3350} {"train_loss": -25.004863739013672, "global_step": 278057, "epoch": 3350} {"train_loss": -25.008893966674805, "global_step": 278058, "epoch": 3350} {"train_loss": -24.917287826538086, "global_step": 278059, "epoch": 3350} {"train_loss": -25.17764663696289, "global_step": 278060, "epoch": 3350} {"train_loss": -24.720508575439453, "global_step": 278061, "epoch": 3350} {"train_loss": -25.009048461914062, "global_step": 278062, "epoch": 3350} {"train_loss": -25.0086727142334, "global_step": 278063, "epoch": 3350} {"train_loss": -25.050960540771484, "global_step": 278064, "epoch": 3350} {"train_loss": -24.774526596069336, "global_step": 278065, "epoch": 3350} {"train_loss": -25.051555633544922, "global_step": 278066, "epoch": 3350} {"train_loss": -25.636884689331055, "global_step": 278067, "epoch": 3350} {"train_loss": -25.001827239990234, "global_step": 278068, "epoch": 3350} {"train_loss": -24.92768669128418, "global_step": 278069, "epoch": 3350} {"train_loss": -24.849843978881836, "global_step": 278070, "epoch": 3350} {"train_loss": -25.201871871948242, "global_step": 278071, "epoch": 3350} {"train_loss": -25.611886978149414, "global_step": 278072, "epoch": 3350} {"train_loss": -25.378416061401367, "global_step": 278073, "epoch": 3350} {"train_loss": -25.2843074798584, "global_step": 278074, "epoch": 3350} {"train_loss": -25.20857810974121, "global_step": 278075, "epoch": 3350} {"train_loss": -25.357624053955078, "global_step": 278076, "epoch": 3350} {"train_loss": -25.330434799194336, "global_step": 278077, "epoch": 3350} {"train_loss": -25.110496520996094, "global_step": 278078, "epoch": 3350} {"train_loss": -25.394241333007812, "global_step": 278079, "epoch": 3350} {"train_loss": -25.242528915405273, "global_step": 278080, "epoch": 3350} {"train_loss": -24.910602569580078, "global_step": 278081, "epoch": 3350} {"train_loss": -25.61202049255371, "global_step": 278082, "epoch": 3350} {"train_loss": -25.23525047302246, "global_step": 278083, "epoch": 3350} {"train_loss": -25.469724655151367, "global_step": 278084, "epoch": 3350} {"train_loss": -25.5865478515625, "global_step": 278085, "epoch": 3350} {"train_loss": -25.31521987915039, "global_step": 278086, "epoch": 3350} {"train_loss": -25.723230361938477, "global_step": 278087, "epoch": 3350} {"train_loss": -25.455270767211914, "global_step": 278088, "epoch": 3350} {"train_loss": -25.252090454101562, "global_step": 278089, "epoch": 3350} {"train_loss": -25.2493953704834, "global_step": 278090, "epoch": 3350} {"train_loss": -25.384506225585938, "global_step": 278091, "epoch": 3350} {"train_loss": -24.95350456237793, "global_step": 278092, "epoch": 3350} {"train_loss": -25.259159088134766, "global_step": 278093, "epoch": 3350} {"train_loss": -25.52503204345703, "global_step": 278094, "epoch": 3350} {"train_loss": -25.826887130737305, "global_step": 278095, "epoch": 3350} {"train_loss": -25.5655574798584, "global_step": 278096, "epoch": 3350} {"train_loss": -25.43467903137207, "global_step": 278097, "epoch": 3350} {"train_loss": -25.276914596557617, "global_step": 278098, "epoch": 3350} {"train_loss": -25.1729679107666, "global_step": 278099, "epoch": 3350} {"train_loss": -25.357091903686523, "global_step": 278100, "epoch": 3350} {"train_loss": -25.721776962280273, "global_step": 278101, "epoch": 3350} {"train_loss": -25.556982040405273, "global_step": 278102, "epoch": 3350} {"train_loss": -25.03206443786621, "global_step": 278103, "epoch": 3350} {"train_loss": -25.319438934326172, "global_step": 278104, "epoch": 3350} {"train_loss": -25.411039352416992, "global_step": 278105, "epoch": 3350} {"train_loss": -25.29593276977539, "global_step": 278106, "epoch": 3350} {"train_loss": -25.57777976989746, "global_step": 278107, "epoch": 3350} {"train_loss": -25.400915145874023, "global_step": 278108, "epoch": 3350} {"train_loss": -25.157163619995117, "global_step": 278109, "epoch": 3350} {"train_loss": -25.50348472595215, "global_step": 278110, "epoch": 3350} {"train_loss": -25.303037643432617, "global_step": 278111, "epoch": 3350} {"train_loss": -25.33780288696289, "global_step": 278112, "epoch": 3350} {"train_loss": -25.471336364746094, "global_step": 278113, "epoch": 3350} {"train_loss": -25.246747970581055, "global_step": 278114, "epoch": 3350} {"train_loss": -25.255508422851562, "global_step": 278115, "epoch": 3350} {"train_loss": -25.1098575592041, "global_step": 278116, "epoch": 3350} {"train_loss": -25.33046531677246, "global_step": 278117, "epoch": 3350} {"train_loss": -25.28693199157715, "global_step": 278118, "epoch": 3350} {"train_loss": -25.053529739379883, "global_step": 278119, "epoch": 3350} {"train_loss": -25.281972885131836, "global_step": 278120, "epoch": 3350} {"train_loss": -25.361963272094727, "global_step": 278121, "epoch": 3350} {"train_loss": -24.55579948425293, "global_step": 278122, "epoch": 3350} {"train_loss": -24.375858306884766, "global_step": 278123, "epoch": 3350} {"train_loss": -24.812652587890625, "global_step": 278124, "epoch": 3350} {"train_loss": -24.9742488861084, "global_step": 278125, "epoch": 3350} {"train_loss": -24.698299407958984, "global_step": 278126, "epoch": 3350} {"train_loss": -24.744251251220703, "global_step": 278127, "epoch": 3350} {"train_loss": -24.488033294677734, "global_step": 278128, "epoch": 3350} {"train_loss": -25.069862365722656, "global_step": 278129, "epoch": 3350} {"train_loss": -24.46625518798828, "global_step": 278130, "epoch": 3350} {"train_loss": -24.610599517822266, "global_step": 278131, "epoch": 3350} {"train_loss": -25.17621782601598, "global_step": 278132, "epoch": 3350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 7103977.0} {"train_loss": -24.862010955810547, "global_step": 278133, "epoch": 3351} {"train_loss": -24.657163619995117, "global_step": 278134, "epoch": 3351} {"train_loss": -25.201635360717773, "global_step": 278135, "epoch": 3351} {"train_loss": -24.919782638549805, "global_step": 278136, "epoch": 3351} {"train_loss": -24.50539207458496, "global_step": 278137, "epoch": 3351} {"train_loss": -25.10569190979004, "global_step": 278138, "epoch": 3351} {"train_loss": -24.931289672851562, "global_step": 278139, "epoch": 3351} {"train_loss": -25.255613327026367, "global_step": 278140, "epoch": 3351} {"train_loss": -24.84883689880371, "global_step": 278141, "epoch": 3351} {"train_loss": -24.673236846923828, "global_step": 278142, "epoch": 3351} {"train_loss": -25.132421493530273, "global_step": 278143, "epoch": 3351} {"train_loss": -25.15885353088379, "global_step": 278144, "epoch": 3351} {"train_loss": -24.741865158081055, "global_step": 278145, "epoch": 3351} {"train_loss": -25.281400680541992, "global_step": 278146, "epoch": 3351} {"train_loss": -25.420114517211914, "global_step": 278147, "epoch": 3351} {"train_loss": -24.965513229370117, "global_step": 278148, "epoch": 3351} {"train_loss": -24.792802810668945, "global_step": 278149, "epoch": 3351} {"train_loss": -24.75850486755371, "global_step": 278150, "epoch": 3351} {"train_loss": -25.15387535095215, "global_step": 278151, "epoch": 3351} {"train_loss": -25.24237060546875, "global_step": 278152, "epoch": 3351} {"train_loss": -25.061246871948242, "global_step": 278153, "epoch": 3351} {"train_loss": -25.41669273376465, "global_step": 278154, "epoch": 3351} {"train_loss": -25.464763641357422, "global_step": 278155, "epoch": 3351} {"train_loss": -24.789621353149414, "global_step": 278156, "epoch": 3351} {"train_loss": -25.133275985717773, "global_step": 278157, "epoch": 3351} {"train_loss": -25.198596954345703, "global_step": 278158, "epoch": 3351} {"train_loss": -25.348129272460938, "global_step": 278159, "epoch": 3351} {"train_loss": -25.2141170501709, "global_step": 278160, "epoch": 3351} {"train_loss": -25.552122116088867, "global_step": 278161, "epoch": 3351} {"train_loss": -25.4013614654541, "global_step": 278162, "epoch": 3351} {"train_loss": -25.362287521362305, "global_step": 278163, "epoch": 3351} {"train_loss": -25.419111251831055, "global_step": 278164, "epoch": 3351} {"train_loss": -25.413293838500977, "global_step": 278165, "epoch": 3351} {"train_loss": -25.324655532836914, "global_step": 278166, "epoch": 3351} {"train_loss": -25.332191467285156, "global_step": 278167, "epoch": 3351} {"train_loss": -25.228788375854492, "global_step": 278168, "epoch": 3351} {"train_loss": -25.42632484436035, "global_step": 278169, "epoch": 3351} {"train_loss": -25.67616081237793, "global_step": 278170, "epoch": 3351} {"train_loss": -25.310382843017578, "global_step": 278171, "epoch": 3351} {"train_loss": -25.23000144958496, "global_step": 278172, "epoch": 3351} {"train_loss": -25.235055923461914, "global_step": 278173, "epoch": 3351} {"train_loss": -24.944644927978516, "global_step": 278174, "epoch": 3351} {"train_loss": -25.325836181640625, "global_step": 278175, "epoch": 3351} {"train_loss": -25.337039947509766, "global_step": 278176, "epoch": 3351} {"train_loss": -25.191553115844727, "global_step": 278177, "epoch": 3351} {"train_loss": -25.49379539489746, "global_step": 278178, "epoch": 3351} {"train_loss": -25.397403717041016, "global_step": 278179, "epoch": 3351} {"train_loss": -25.090843200683594, "global_step": 278180, "epoch": 3351} {"train_loss": -25.913619995117188, "global_step": 278181, "epoch": 3351} {"train_loss": -25.310651779174805, "global_step": 278182, "epoch": 3351} {"train_loss": -25.834980010986328, "global_step": 278183, "epoch": 3351} {"train_loss": -25.290624618530273, "global_step": 278184, "epoch": 3351} {"train_loss": -25.247533798217773, "global_step": 278185, "epoch": 3351} {"train_loss": -25.448156356811523, "global_step": 278186, "epoch": 3351} {"train_loss": -25.215576171875, "global_step": 278187, "epoch": 3351} {"train_loss": -25.240991592407227, "global_step": 278188, "epoch": 3351} {"train_loss": -24.736730575561523, "global_step": 278189, "epoch": 3351} {"train_loss": -25.483495712280273, "global_step": 278190, "epoch": 3351} {"train_loss": -25.201297760009766, "global_step": 278191, "epoch": 3351} {"train_loss": -25.258283615112305, "global_step": 278192, "epoch": 3351} {"train_loss": -25.30560874938965, "global_step": 278193, "epoch": 3351} {"train_loss": -25.087400436401367, "global_step": 278194, "epoch": 3351} {"train_loss": -25.019420623779297, "global_step": 278195, "epoch": 3351} {"train_loss": -25.188467025756836, "global_step": 278196, "epoch": 3351} {"train_loss": -25.24603271484375, "global_step": 278197, "epoch": 3351} {"train_loss": -25.444047927856445, "global_step": 278198, "epoch": 3351} {"train_loss": -25.154743194580078, "global_step": 278199, "epoch": 3351} {"train_loss": -25.354337692260742, "global_step": 278200, "epoch": 3351} {"train_loss": -24.77095603942871, "global_step": 278201, "epoch": 3351} {"train_loss": -25.324234008789062, "global_step": 278202, "epoch": 3351} {"train_loss": -25.7159423828125, "global_step": 278203, "epoch": 3351} {"train_loss": -25.423994064331055, "global_step": 278204, "epoch": 3351} {"train_loss": -25.590192794799805, "global_step": 278205, "epoch": 3351} {"train_loss": -25.2961368560791, "global_step": 278206, "epoch": 3351} {"train_loss": -25.461837768554688, "global_step": 278207, "epoch": 3351} {"train_loss": -25.284645080566406, "global_step": 278208, "epoch": 3351} {"train_loss": -25.268798828125, "global_step": 278209, "epoch": 3351} {"train_loss": -25.140764236450195, "global_step": 278210, "epoch": 3351} {"train_loss": -25.44562339782715, "global_step": 278211, "epoch": 3351} {"train_loss": -24.979093551635742, "global_step": 278212, "epoch": 3351} {"train_loss": -25.197446823120117, "global_step": 278213, "epoch": 3351} {"train_loss": -25.335569381713867, "global_step": 278214, "epoch": 3351} {"train_loss": -25.228065375822137, "global_step": 278215, "epoch": 3351, "val_loss": 6961786.0} {"train_loss": -25.176198959350586, "global_step": 278216, "epoch": 3352} {"train_loss": -25.12741470336914, "global_step": 278217, "epoch": 3352} {"train_loss": -25.154924392700195, "global_step": 278218, "epoch": 3352} {"train_loss": -25.4086971282959, "global_step": 278219, "epoch": 3352} {"train_loss": -25.50618553161621, "global_step": 278220, "epoch": 3352} {"train_loss": -25.307178497314453, "global_step": 278221, "epoch": 3352} {"train_loss": -24.773033142089844, "global_step": 278222, "epoch": 3352} {"train_loss": -25.156301498413086, "global_step": 278223, "epoch": 3352} {"train_loss": -25.284547805786133, "global_step": 278224, "epoch": 3352} {"train_loss": -25.20224952697754, "global_step": 278225, "epoch": 3352} {"train_loss": -25.4123592376709, "global_step": 278226, "epoch": 3352} {"train_loss": -25.47665786743164, "global_step": 278227, "epoch": 3352} {"train_loss": -25.219472885131836, "global_step": 278228, "epoch": 3352} {"train_loss": -25.777673721313477, "global_step": 278229, "epoch": 3352} {"train_loss": -25.650793075561523, "global_step": 278230, "epoch": 3352} {"train_loss": -25.419818878173828, "global_step": 278231, "epoch": 3352} {"train_loss": -25.523147583007812, "global_step": 278232, "epoch": 3352} {"train_loss": -25.519445419311523, "global_step": 278233, "epoch": 3352} {"train_loss": -25.461759567260742, "global_step": 278234, "epoch": 3352} {"train_loss": -25.661474227905273, "global_step": 278235, "epoch": 3352} {"train_loss": -25.385923385620117, "global_step": 278236, "epoch": 3352} {"train_loss": -25.345600128173828, "global_step": 278237, "epoch": 3352} {"train_loss": -25.306550979614258, "global_step": 278238, "epoch": 3352} {"train_loss": -25.47663688659668, "global_step": 278239, "epoch": 3352} {"train_loss": -25.529932022094727, "global_step": 278240, "epoch": 3352} {"train_loss": -25.6351318359375, "global_step": 278241, "epoch": 3352} {"train_loss": -25.4169921875, "global_step": 278242, "epoch": 3352} {"train_loss": -25.533214569091797, "global_step": 278243, "epoch": 3352} {"train_loss": -25.48306655883789, "global_step": 278244, "epoch": 3352} {"train_loss": -25.575000762939453, "global_step": 278245, "epoch": 3352} {"train_loss": -25.835403442382812, "global_step": 278246, "epoch": 3352} {"train_loss": -25.223621368408203, "global_step": 278247, "epoch": 3352} {"train_loss": -25.367753982543945, "global_step": 278248, "epoch": 3352} {"train_loss": -25.501073837280273, "global_step": 278249, "epoch": 3352} {"train_loss": -25.366254806518555, "global_step": 278250, "epoch": 3352} {"train_loss": -25.120594024658203, "global_step": 278251, "epoch": 3352} {"train_loss": -25.766284942626953, "global_step": 278252, "epoch": 3352} {"train_loss": -25.494810104370117, "global_step": 278253, "epoch": 3352} {"train_loss": -25.10160255432129, "global_step": 278254, "epoch": 3352} {"train_loss": -25.563215255737305, "global_step": 278255, "epoch": 3352} {"train_loss": -25.28704071044922, "global_step": 278256, "epoch": 3352} {"train_loss": -25.45745849609375, "global_step": 278257, "epoch": 3352} {"train_loss": -25.699384689331055, "global_step": 278258, "epoch": 3352} {"train_loss": -25.39335060119629, "global_step": 278259, "epoch": 3352} {"train_loss": -25.472999572753906, "global_step": 278260, "epoch": 3352} {"train_loss": -25.08006477355957, "global_step": 278261, "epoch": 3352} {"train_loss": -25.641010284423828, "global_step": 278262, "epoch": 3352} {"train_loss": -25.825912475585938, "global_step": 278263, "epoch": 3352} {"train_loss": -25.652204513549805, "global_step": 278264, "epoch": 3352} {"train_loss": -25.43703269958496, "global_step": 278265, "epoch": 3352} {"train_loss": -25.335927963256836, "global_step": 278266, "epoch": 3352} {"train_loss": -25.478490829467773, "global_step": 278267, "epoch": 3352} {"train_loss": -25.171138763427734, "global_step": 278268, "epoch": 3352} {"train_loss": -25.394062042236328, "global_step": 278269, "epoch": 3352} {"train_loss": -25.561689376831055, "global_step": 278270, "epoch": 3352} {"train_loss": -25.759220123291016, "global_step": 278271, "epoch": 3352} {"train_loss": -25.110631942749023, "global_step": 278272, "epoch": 3352} {"train_loss": -25.317337036132812, "global_step": 278273, "epoch": 3352} {"train_loss": -25.771955490112305, "global_step": 278274, "epoch": 3352} {"train_loss": -25.100948333740234, "global_step": 278275, "epoch": 3352} {"train_loss": -25.53620719909668, "global_step": 278276, "epoch": 3352} {"train_loss": -25.6107234954834, "global_step": 278277, "epoch": 3352} {"train_loss": -25.28815269470215, "global_step": 278278, "epoch": 3352} {"train_loss": -25.10968017578125, "global_step": 278279, "epoch": 3352} {"train_loss": -25.301015853881836, "global_step": 278280, "epoch": 3352} {"train_loss": -25.290760040283203, "global_step": 278281, "epoch": 3352} {"train_loss": -25.338525772094727, "global_step": 278282, "epoch": 3352} {"train_loss": -25.404565811157227, "global_step": 278283, "epoch": 3352} {"train_loss": -25.582656860351562, "global_step": 278284, "epoch": 3352} {"train_loss": -25.286691665649414, "global_step": 278285, "epoch": 3352} {"train_loss": -25.08586311340332, "global_step": 278286, "epoch": 3352} {"train_loss": -25.05422019958496, "global_step": 278287, "epoch": 3352} {"train_loss": -25.330442428588867, "global_step": 278288, "epoch": 3352} {"train_loss": -25.27252769470215, "global_step": 278289, "epoch": 3352} {"train_loss": -25.059234619140625, "global_step": 278290, "epoch": 3352} {"train_loss": -25.36404800415039, "global_step": 278291, "epoch": 3352} {"train_loss": -25.791858673095703, "global_step": 278292, "epoch": 3352} {"train_loss": -25.267868041992188, "global_step": 278293, "epoch": 3352} {"train_loss": -25.6584529876709, "global_step": 278294, "epoch": 3352} {"train_loss": -25.580690383911133, "global_step": 278295, "epoch": 3352} {"train_loss": -25.32051658630371, "global_step": 278296, "epoch": 3352} {"train_loss": -25.499555587768555, "global_step": 278297, "epoch": 3352} {"train_loss": -25.414541244506836, "global_step": 278298, "epoch": 3352, "val_loss": 6970366.0} {"train_loss": -25.07706642150879, "global_step": 278299, "epoch": 3353} {"train_loss": -25.098134994506836, "global_step": 278300, "epoch": 3353} {"train_loss": -25.2294864654541, "global_step": 278301, "epoch": 3353} {"train_loss": -25.35212516784668, "global_step": 278302, "epoch": 3353} {"train_loss": -25.330093383789062, "global_step": 278303, "epoch": 3353} {"train_loss": -25.095388412475586, "global_step": 278304, "epoch": 3353} {"train_loss": -25.36097526550293, "global_step": 278305, "epoch": 3353} {"train_loss": -25.42603874206543, "global_step": 278306, "epoch": 3353} {"train_loss": -24.952972412109375, "global_step": 278307, "epoch": 3353} {"train_loss": -25.117752075195312, "global_step": 278308, "epoch": 3353} {"train_loss": -25.017963409423828, "global_step": 278309, "epoch": 3353} {"train_loss": -24.878097534179688, "global_step": 278310, "epoch": 3353} {"train_loss": -25.12668800354004, "global_step": 278311, "epoch": 3353} {"train_loss": -24.738117218017578, "global_step": 278312, "epoch": 3353} {"train_loss": -25.39369010925293, "global_step": 278313, "epoch": 3353} {"train_loss": -25.16737937927246, "global_step": 278314, "epoch": 3353} {"train_loss": -24.828195571899414, "global_step": 278315, "epoch": 3353} {"train_loss": -24.77113914489746, "global_step": 278316, "epoch": 3353} {"train_loss": -25.13685417175293, "global_step": 278317, "epoch": 3353} {"train_loss": -25.308042526245117, "global_step": 278318, "epoch": 3353} {"train_loss": -25.246118545532227, "global_step": 278319, "epoch": 3353} {"train_loss": -24.969465255737305, "global_step": 278320, "epoch": 3353} {"train_loss": -25.464303970336914, "global_step": 278321, "epoch": 3353} {"train_loss": -25.540523529052734, "global_step": 278322, "epoch": 3353} {"train_loss": -25.262468338012695, "global_step": 278323, "epoch": 3353} {"train_loss": -25.315298080444336, "global_step": 278324, "epoch": 3353} {"train_loss": -25.145065307617188, "global_step": 278325, "epoch": 3353} {"train_loss": -25.50140953063965, "global_step": 278326, "epoch": 3353} {"train_loss": -25.32362937927246, "global_step": 278327, "epoch": 3353} {"train_loss": -25.43708610534668, "global_step": 278328, "epoch": 3353} {"train_loss": -25.467405319213867, "global_step": 278329, "epoch": 3353} {"train_loss": -25.751935958862305, "global_step": 278330, "epoch": 3353} {"train_loss": -25.465423583984375, "global_step": 278331, "epoch": 3353} {"train_loss": -25.48456573486328, "global_step": 278332, "epoch": 3353} {"train_loss": -25.919336318969727, "global_step": 278333, "epoch": 3353} {"train_loss": -25.467058181762695, "global_step": 278334, "epoch": 3353} {"train_loss": -25.43865966796875, "global_step": 278335, "epoch": 3353} {"train_loss": -25.31076431274414, "global_step": 278336, "epoch": 3353} {"train_loss": -25.039676666259766, "global_step": 278337, "epoch": 3353} {"train_loss": -25.07895851135254, "global_step": 278338, "epoch": 3353} {"train_loss": -25.453962326049805, "global_step": 278339, "epoch": 3353} {"train_loss": -25.403303146362305, "global_step": 278340, "epoch": 3353} {"train_loss": -25.330476760864258, "global_step": 278341, "epoch": 3353} {"train_loss": -25.70503044128418, "global_step": 278342, "epoch": 3353} {"train_loss": -25.306842803955078, "global_step": 278343, "epoch": 3353} {"train_loss": -25.3808536529541, "global_step": 278344, "epoch": 3353} {"train_loss": -25.449970245361328, "global_step": 278345, "epoch": 3353} {"train_loss": -25.55426025390625, "global_step": 278346, "epoch": 3353} {"train_loss": -25.60699462890625, "global_step": 278347, "epoch": 3353} {"train_loss": -25.75815773010254, "global_step": 278348, "epoch": 3353} {"train_loss": -25.29846954345703, "global_step": 278349, "epoch": 3353} {"train_loss": -25.17228126525879, "global_step": 278350, "epoch": 3353} {"train_loss": -25.540170669555664, "global_step": 278351, "epoch": 3353} {"train_loss": -25.30607032775879, "global_step": 278352, "epoch": 3353} {"train_loss": -25.31476402282715, "global_step": 278353, "epoch": 3353} {"train_loss": -25.224782943725586, "global_step": 278354, "epoch": 3353} {"train_loss": -25.572744369506836, "global_step": 278355, "epoch": 3353} {"train_loss": -25.430984497070312, "global_step": 278356, "epoch": 3353} {"train_loss": -25.309391021728516, "global_step": 278357, "epoch": 3353} {"train_loss": -25.520231246948242, "global_step": 278358, "epoch": 3353} {"train_loss": -25.42961311340332, "global_step": 278359, "epoch": 3353} {"train_loss": -24.6731014251709, "global_step": 278360, "epoch": 3353} {"train_loss": -25.449819564819336, "global_step": 278361, "epoch": 3353} {"train_loss": -25.393461227416992, "global_step": 278362, "epoch": 3353} {"train_loss": -25.14478302001953, "global_step": 278363, "epoch": 3353} {"train_loss": -25.340497970581055, "global_step": 278364, "epoch": 3353} {"train_loss": -25.411474227905273, "global_step": 278365, "epoch": 3353} {"train_loss": -25.181678771972656, "global_step": 278366, "epoch": 3353} {"train_loss": -25.439313888549805, "global_step": 278367, "epoch": 3353} {"train_loss": -25.32681655883789, "global_step": 278368, "epoch": 3353} {"train_loss": -25.365385055541992, "global_step": 278369, "epoch": 3353} {"train_loss": -25.14277458190918, "global_step": 278370, "epoch": 3353} {"train_loss": -25.02841567993164, "global_step": 278371, "epoch": 3353} {"train_loss": -24.891864776611328, "global_step": 278372, "epoch": 3353} {"train_loss": -25.324848175048828, "global_step": 278373, "epoch": 3353} {"train_loss": -25.266048431396484, "global_step": 278374, "epoch": 3353} {"train_loss": -25.2393741607666, "global_step": 278375, "epoch": 3353} {"train_loss": -25.642486572265625, "global_step": 278376, "epoch": 3353} {"train_loss": -25.308271408081055, "global_step": 278377, "epoch": 3353} {"train_loss": -25.417802810668945, "global_step": 278378, "epoch": 3353} {"train_loss": -25.271390914916992, "global_step": 278379, "epoch": 3353} {"train_loss": -25.275863647460938, "global_step": 278380, "epoch": 3353} {"train_loss": -25.291273254946052, "global_step": 278381, "epoch": 3353, "val_loss": 7066642.0} {"train_loss": -25.000547409057617, "global_step": 278382, "epoch": 3354} {"train_loss": -25.20084571838379, "global_step": 278383, "epoch": 3354} {"train_loss": -24.994583129882812, "global_step": 278384, "epoch": 3354} {"train_loss": -25.097278594970703, "global_step": 278385, "epoch": 3354} {"train_loss": -25.154193878173828, "global_step": 278386, "epoch": 3354} {"train_loss": -25.057788848876953, "global_step": 278387, "epoch": 3354} {"train_loss": -25.13515853881836, "global_step": 278388, "epoch": 3354} {"train_loss": -25.088699340820312, "global_step": 278389, "epoch": 3354} {"train_loss": -25.474681854248047, "global_step": 278390, "epoch": 3354} {"train_loss": -25.06219482421875, "global_step": 278391, "epoch": 3354} {"train_loss": -25.38919448852539, "global_step": 278392, "epoch": 3354} {"train_loss": -25.27658462524414, "global_step": 278393, "epoch": 3354} {"train_loss": -25.499418258666992, "global_step": 278394, "epoch": 3354} {"train_loss": -25.499364852905273, "global_step": 278395, "epoch": 3354} {"train_loss": -25.373483657836914, "global_step": 278396, "epoch": 3354} {"train_loss": -25.393583297729492, "global_step": 278397, "epoch": 3354} {"train_loss": -25.004560470581055, "global_step": 278398, "epoch": 3354} {"train_loss": -25.092336654663086, "global_step": 278399, "epoch": 3354} {"train_loss": -25.347211837768555, "global_step": 278400, "epoch": 3354} {"train_loss": -25.257537841796875, "global_step": 278401, "epoch": 3354} {"train_loss": -25.299551010131836, "global_step": 278402, "epoch": 3354} {"train_loss": -25.011611938476562, "global_step": 278403, "epoch": 3354} {"train_loss": -25.57027816772461, "global_step": 278404, "epoch": 3354} {"train_loss": -25.265445709228516, "global_step": 278405, "epoch": 3354} {"train_loss": -25.6468505859375, "global_step": 278406, "epoch": 3354} {"train_loss": -25.051280975341797, "global_step": 278407, "epoch": 3354} {"train_loss": -25.20956802368164, "global_step": 278408, "epoch": 3354} {"train_loss": -25.347644805908203, "global_step": 278409, "epoch": 3354} {"train_loss": -25.57041358947754, "global_step": 278410, "epoch": 3354} {"train_loss": -25.483354568481445, "global_step": 278411, "epoch": 3354} {"train_loss": -25.244115829467773, "global_step": 278412, "epoch": 3354} {"train_loss": -25.405580520629883, "global_step": 278413, "epoch": 3354} {"train_loss": -25.125675201416016, "global_step": 278414, "epoch": 3354} {"train_loss": -25.24037742614746, "global_step": 278415, "epoch": 3354} {"train_loss": -25.2224178314209, "global_step": 278416, "epoch": 3354} {"train_loss": -25.62052345275879, "global_step": 278417, "epoch": 3354} {"train_loss": -25.171667098999023, "global_step": 278418, "epoch": 3354} {"train_loss": -25.384973526000977, "global_step": 278419, "epoch": 3354} {"train_loss": -25.190418243408203, "global_step": 278420, "epoch": 3354} {"train_loss": -25.311767578125, "global_step": 278421, "epoch": 3354} {"train_loss": -25.38773536682129, "global_step": 278422, "epoch": 3354} {"train_loss": -25.307575225830078, "global_step": 278423, "epoch": 3354} {"train_loss": -25.510507583618164, "global_step": 278424, "epoch": 3354} {"train_loss": -25.304861068725586, "global_step": 278425, "epoch": 3354} {"train_loss": -25.59733009338379, "global_step": 278426, "epoch": 3354} {"train_loss": -25.6341552734375, "global_step": 278427, "epoch": 3354} {"train_loss": -25.58315086364746, "global_step": 278428, "epoch": 3354} {"train_loss": -25.432863235473633, "global_step": 278429, "epoch": 3354} {"train_loss": -25.636280059814453, "global_step": 278430, "epoch": 3354} {"train_loss": -25.632598876953125, "global_step": 278431, "epoch": 3354} {"train_loss": -25.522241592407227, "global_step": 278432, "epoch": 3354} {"train_loss": -25.691364288330078, "global_step": 278433, "epoch": 3354} {"train_loss": -25.602338790893555, "global_step": 278434, "epoch": 3354} {"train_loss": -25.389488220214844, "global_step": 278435, "epoch": 3354} {"train_loss": -25.310422897338867, "global_step": 278436, "epoch": 3354} {"train_loss": -25.737707138061523, "global_step": 278437, "epoch": 3354} {"train_loss": -25.5226993560791, "global_step": 278438, "epoch": 3354} {"train_loss": -25.823942184448242, "global_step": 278439, "epoch": 3354} {"train_loss": -25.128713607788086, "global_step": 278440, "epoch": 3354} {"train_loss": -25.504253387451172, "global_step": 278441, "epoch": 3354} {"train_loss": -25.598623275756836, "global_step": 278442, "epoch": 3354} {"train_loss": -25.36414337158203, "global_step": 278443, "epoch": 3354} {"train_loss": -25.28360939025879, "global_step": 278444, "epoch": 3354} {"train_loss": -25.691852569580078, "global_step": 278445, "epoch": 3354} {"train_loss": -25.13211441040039, "global_step": 278446, "epoch": 3354} {"train_loss": -25.36423110961914, "global_step": 278447, "epoch": 3354} {"train_loss": -25.15765380859375, "global_step": 278448, "epoch": 3354} {"train_loss": -25.351118087768555, "global_step": 278449, "epoch": 3354} {"train_loss": -25.758642196655273, "global_step": 278450, "epoch": 3354} {"train_loss": -25.498960494995117, "global_step": 278451, "epoch": 3354} {"train_loss": -25.111417770385742, "global_step": 278452, "epoch": 3354} {"train_loss": -25.2482967376709, "global_step": 278453, "epoch": 3354} {"train_loss": -25.556455612182617, "global_step": 278454, "epoch": 3354} {"train_loss": -25.781381607055664, "global_step": 278455, "epoch": 3354} {"train_loss": -24.92580223083496, "global_step": 278456, "epoch": 3354} {"train_loss": -25.56610870361328, "global_step": 278457, "epoch": 3354} {"train_loss": -25.14479637145996, "global_step": 278458, "epoch": 3354} {"train_loss": -25.447240829467773, "global_step": 278459, "epoch": 3354} {"train_loss": -25.12874412536621, "global_step": 278460, "epoch": 3354} {"train_loss": -25.211898803710938, "global_step": 278461, "epoch": 3354} {"train_loss": -25.219078063964844, "global_step": 278462, "epoch": 3354} {"train_loss": -25.509809494018555, "global_step": 278463, "epoch": 3354} {"train_loss": -25.353967207023896, "global_step": 278464, "epoch": 3354, "val_loss": 6984289.5} {"train_loss": -24.953250885009766, "global_step": 278465, "epoch": 3355} {"train_loss": -24.670913696289062, "global_step": 278466, "epoch": 3355} {"train_loss": -24.879535675048828, "global_step": 278467, "epoch": 3355} {"train_loss": -24.400379180908203, "global_step": 278468, "epoch": 3355} {"train_loss": -24.91780662536621, "global_step": 278469, "epoch": 3355} {"train_loss": -24.566377639770508, "global_step": 278470, "epoch": 3355} {"train_loss": -24.45922088623047, "global_step": 278471, "epoch": 3355} {"train_loss": -25.08807373046875, "global_step": 278472, "epoch": 3355} {"train_loss": -24.707666397094727, "global_step": 278473, "epoch": 3355} {"train_loss": -24.60189437866211, "global_step": 278474, "epoch": 3355} {"train_loss": -25.079824447631836, "global_step": 278475, "epoch": 3355} {"train_loss": -25.17276382446289, "global_step": 278476, "epoch": 3355} {"train_loss": -24.6657772064209, "global_step": 278477, "epoch": 3355} {"train_loss": -24.876394271850586, "global_step": 278478, "epoch": 3355} {"train_loss": -25.072818756103516, "global_step": 278479, "epoch": 3355} {"train_loss": -25.215604782104492, "global_step": 278480, "epoch": 3355} {"train_loss": -25.105688095092773, "global_step": 278481, "epoch": 3355} {"train_loss": -25.32181739807129, "global_step": 278482, "epoch": 3355} {"train_loss": -25.112016677856445, "global_step": 278483, "epoch": 3355} {"train_loss": -24.927459716796875, "global_step": 278484, "epoch": 3355} {"train_loss": -25.297508239746094, "global_step": 278485, "epoch": 3355} {"train_loss": -24.881513595581055, "global_step": 278486, "epoch": 3355} {"train_loss": -25.200244903564453, "global_step": 278487, "epoch": 3355} {"train_loss": -25.156753540039062, "global_step": 278488, "epoch": 3355} {"train_loss": -25.29149055480957, "global_step": 278489, "epoch": 3355} {"train_loss": -25.09747314453125, "global_step": 278490, "epoch": 3355} {"train_loss": -25.122385025024414, "global_step": 278491, "epoch": 3355} {"train_loss": -24.93202018737793, "global_step": 278492, "epoch": 3355} {"train_loss": -25.454593658447266, "global_step": 278493, "epoch": 3355} {"train_loss": -25.240629196166992, "global_step": 278494, "epoch": 3355} {"train_loss": -25.496856689453125, "global_step": 278495, "epoch": 3355} {"train_loss": -25.057315826416016, "global_step": 278496, "epoch": 3355} {"train_loss": -25.56743049621582, "global_step": 278497, "epoch": 3355} {"train_loss": -25.296876907348633, "global_step": 278498, "epoch": 3355} {"train_loss": -25.252431869506836, "global_step": 278499, "epoch": 3355} {"train_loss": -25.08780288696289, "global_step": 278500, "epoch": 3355} {"train_loss": -25.47245979309082, "global_step": 278501, "epoch": 3355} {"train_loss": -25.698352813720703, "global_step": 278502, "epoch": 3355} {"train_loss": -25.3417911529541, "global_step": 278503, "epoch": 3355} {"train_loss": -25.6618595123291, "global_step": 278504, "epoch": 3355} {"train_loss": -25.62653923034668, "global_step": 278505, "epoch": 3355} {"train_loss": -25.132816314697266, "global_step": 278506, "epoch": 3355} {"train_loss": -25.202932357788086, "global_step": 278507, "epoch": 3355} {"train_loss": -25.403078079223633, "global_step": 278508, "epoch": 3355} {"train_loss": -25.174367904663086, "global_step": 278509, "epoch": 3355} {"train_loss": -25.17412757873535, "global_step": 278510, "epoch": 3355} {"train_loss": -24.637338638305664, "global_step": 278511, "epoch": 3355} {"train_loss": -25.263042449951172, "global_step": 278512, "epoch": 3355} {"train_loss": -25.64170265197754, "global_step": 278513, "epoch": 3355} {"train_loss": -25.284128189086914, "global_step": 278514, "epoch": 3355} {"train_loss": -25.576290130615234, "global_step": 278515, "epoch": 3355} {"train_loss": -25.191497802734375, "global_step": 278516, "epoch": 3355} {"train_loss": -25.825763702392578, "global_step": 278517, "epoch": 3355} {"train_loss": -25.240232467651367, "global_step": 278518, "epoch": 3355} {"train_loss": -25.116395950317383, "global_step": 278519, "epoch": 3355} {"train_loss": -25.642154693603516, "global_step": 278520, "epoch": 3355} {"train_loss": -25.431058883666992, "global_step": 278521, "epoch": 3355} {"train_loss": -25.08734703063965, "global_step": 278522, "epoch": 3355} {"train_loss": -25.4624080657959, "global_step": 278523, "epoch": 3355} {"train_loss": -25.48448944091797, "global_step": 278524, "epoch": 3355} {"train_loss": -25.339550018310547, "global_step": 278525, "epoch": 3355} {"train_loss": -25.817401885986328, "global_step": 278526, "epoch": 3355} {"train_loss": -25.79385757446289, "global_step": 278527, "epoch": 3355} {"train_loss": -25.49004554748535, "global_step": 278528, "epoch": 3355} {"train_loss": -25.943531036376953, "global_step": 278529, "epoch": 3355} {"train_loss": -25.21297264099121, "global_step": 278530, "epoch": 3355} {"train_loss": -25.055709838867188, "global_step": 278531, "epoch": 3355} {"train_loss": -25.27581787109375, "global_step": 278532, "epoch": 3355} {"train_loss": -25.480371475219727, "global_step": 278533, "epoch": 3355} {"train_loss": -25.680891036987305, "global_step": 278534, "epoch": 3355} {"train_loss": -25.393030166625977, "global_step": 278535, "epoch": 3355} {"train_loss": -25.278966903686523, "global_step": 278536, "epoch": 3355} {"train_loss": -25.38101577758789, "global_step": 278537, "epoch": 3355} {"train_loss": -25.57735252380371, "global_step": 278538, "epoch": 3355} {"train_loss": -25.08997917175293, "global_step": 278539, "epoch": 3355} {"train_loss": -25.201343536376953, "global_step": 278540, "epoch": 3355} {"train_loss": -25.592084884643555, "global_step": 278541, "epoch": 3355} {"train_loss": -25.64936637878418, "global_step": 278542, "epoch": 3355} {"train_loss": -25.910512924194336, "global_step": 278543, "epoch": 3355} {"train_loss": -25.051057815551758, "global_step": 278544, "epoch": 3355} {"train_loss": -25.1839542388916, "global_step": 278545, "epoch": 3355} {"train_loss": -25.778400421142578, "global_step": 278546, "epoch": 3355} {"train_loss": -25.236017479953997, "global_step": 278547, "epoch": 3355, "val_loss": 7008279.0} {"train_loss": -25.30171012878418, "global_step": 278548, "epoch": 3356} {"train_loss": -24.820545196533203, "global_step": 278549, "epoch": 3356} {"train_loss": -25.0936336517334, "global_step": 278550, "epoch": 3356} {"train_loss": -24.86588478088379, "global_step": 278551, "epoch": 3356} {"train_loss": -24.848758697509766, "global_step": 278552, "epoch": 3356} {"train_loss": -24.965591430664062, "global_step": 278553, "epoch": 3356} {"train_loss": -24.823814392089844, "global_step": 278554, "epoch": 3356} {"train_loss": -24.70853042602539, "global_step": 278555, "epoch": 3356} {"train_loss": -24.968692779541016, "global_step": 278556, "epoch": 3356} {"train_loss": -25.315292358398438, "global_step": 278557, "epoch": 3356} {"train_loss": -24.65386390686035, "global_step": 278558, "epoch": 3356} {"train_loss": -25.213497161865234, "global_step": 278559, "epoch": 3356} {"train_loss": -25.061635971069336, "global_step": 278560, "epoch": 3356} {"train_loss": -25.116376876831055, "global_step": 278561, "epoch": 3356} {"train_loss": -24.864347457885742, "global_step": 278562, "epoch": 3356} {"train_loss": -24.99698829650879, "global_step": 278563, "epoch": 3356} {"train_loss": -25.279296875, "global_step": 278564, "epoch": 3356} {"train_loss": -25.2094783782959, "global_step": 278565, "epoch": 3356} {"train_loss": -24.829416275024414, "global_step": 278566, "epoch": 3356} {"train_loss": -24.813220977783203, "global_step": 278567, "epoch": 3356} {"train_loss": -25.469449996948242, "global_step": 278568, "epoch": 3356} {"train_loss": -24.85077476501465, "global_step": 278569, "epoch": 3356} {"train_loss": -25.2656192779541, "global_step": 278570, "epoch": 3356} {"train_loss": -25.566532135009766, "global_step": 278571, "epoch": 3356} {"train_loss": -25.398361206054688, "global_step": 278572, "epoch": 3356} {"train_loss": -25.2952938079834, "global_step": 278573, "epoch": 3356} {"train_loss": -25.449655532836914, "global_step": 278574, "epoch": 3356} {"train_loss": -25.411865234375, "global_step": 278575, "epoch": 3356} {"train_loss": -25.404869079589844, "global_step": 278576, "epoch": 3356} {"train_loss": -25.158727645874023, "global_step": 278577, "epoch": 3356} {"train_loss": -25.64023208618164, "global_step": 278578, "epoch": 3356} {"train_loss": -25.100406646728516, "global_step": 278579, "epoch": 3356} {"train_loss": -25.487125396728516, "global_step": 278580, "epoch": 3356} {"train_loss": -25.291967391967773, "global_step": 278581, "epoch": 3356} {"train_loss": -25.46271324157715, "global_step": 278582, "epoch": 3356} {"train_loss": -25.465103149414062, "global_step": 278583, "epoch": 3356} {"train_loss": -25.434432983398438, "global_step": 278584, "epoch": 3356} {"train_loss": -25.224355697631836, "global_step": 278585, "epoch": 3356} {"train_loss": -25.233728408813477, "global_step": 278586, "epoch": 3356} {"train_loss": -25.538801193237305, "global_step": 278587, "epoch": 3356} {"train_loss": -25.482315063476562, "global_step": 278588, "epoch": 3356} {"train_loss": -25.502031326293945, "global_step": 278589, "epoch": 3356} {"train_loss": -25.45710563659668, "global_step": 278590, "epoch": 3356} {"train_loss": -25.407846450805664, "global_step": 278591, "epoch": 3356} {"train_loss": -25.463647842407227, "global_step": 278592, "epoch": 3356} {"train_loss": -25.22140884399414, "global_step": 278593, "epoch": 3356} {"train_loss": -25.517484664916992, "global_step": 278594, "epoch": 3356} {"train_loss": -25.4036808013916, "global_step": 278595, "epoch": 3356} {"train_loss": -25.702199935913086, "global_step": 278596, "epoch": 3356} {"train_loss": -25.563934326171875, "global_step": 278597, "epoch": 3356} {"train_loss": -25.425275802612305, "global_step": 278598, "epoch": 3356} {"train_loss": -25.413732528686523, "global_step": 278599, "epoch": 3356} {"train_loss": -25.475139617919922, "global_step": 278600, "epoch": 3356} {"train_loss": -25.6501522064209, "global_step": 278601, "epoch": 3356} {"train_loss": -25.18767547607422, "global_step": 278602, "epoch": 3356} {"train_loss": -25.476171493530273, "global_step": 278603, "epoch": 3356} {"train_loss": -25.355682373046875, "global_step": 278604, "epoch": 3356} {"train_loss": -25.320941925048828, "global_step": 278605, "epoch": 3356} {"train_loss": -25.601675033569336, "global_step": 278606, "epoch": 3356} {"train_loss": -25.56804847717285, "global_step": 278607, "epoch": 3356} {"train_loss": -25.75368309020996, "global_step": 278608, "epoch": 3356} {"train_loss": -25.59136390686035, "global_step": 278609, "epoch": 3356} {"train_loss": -25.254623413085938, "global_step": 278610, "epoch": 3356} {"train_loss": -25.270158767700195, "global_step": 278611, "epoch": 3356} {"train_loss": -25.04035758972168, "global_step": 278612, "epoch": 3356} {"train_loss": -25.212324142456055, "global_step": 278613, "epoch": 3356} {"train_loss": -25.481382369995117, "global_step": 278614, "epoch": 3356} {"train_loss": -25.844507217407227, "global_step": 278615, "epoch": 3356} {"train_loss": -25.11808204650879, "global_step": 278616, "epoch": 3356} {"train_loss": -25.320846557617188, "global_step": 278617, "epoch": 3356} {"train_loss": -25.302217483520508, "global_step": 278618, "epoch": 3356} {"train_loss": -25.6112060546875, "global_step": 278619, "epoch": 3356} {"train_loss": -25.202857971191406, "global_step": 278620, "epoch": 3356} {"train_loss": -25.391006469726562, "global_step": 278621, "epoch": 3356} {"train_loss": -25.58219337463379, "global_step": 278622, "epoch": 3356} {"train_loss": -25.57859230041504, "global_step": 278623, "epoch": 3356} {"train_loss": -25.385835647583008, "global_step": 278624, "epoch": 3356} {"train_loss": -25.484277725219727, "global_step": 278625, "epoch": 3356} {"train_loss": -25.284168243408203, "global_step": 278626, "epoch": 3356} {"train_loss": -25.6599178314209, "global_step": 278627, "epoch": 3356} {"train_loss": -25.63849449157715, "global_step": 278628, "epoch": 3356} {"train_loss": -25.422224044799805, "global_step": 278629, "epoch": 3356} {"train_loss": -25.312168833721113, "global_step": 278630, "epoch": 3356, "val_loss": 7105940.0} {"train_loss": -25.090890884399414, "global_step": 278631, "epoch": 3357} {"train_loss": -25.087268829345703, "global_step": 278632, "epoch": 3357} {"train_loss": -25.568012237548828, "global_step": 278633, "epoch": 3357} {"train_loss": -24.96486473083496, "global_step": 278634, "epoch": 3357} {"train_loss": -24.606061935424805, "global_step": 278635, "epoch": 3357} {"train_loss": -25.196271896362305, "global_step": 278636, "epoch": 3357} {"train_loss": -25.14859390258789, "global_step": 278637, "epoch": 3357} {"train_loss": -24.755718231201172, "global_step": 278638, "epoch": 3357} {"train_loss": -25.155757904052734, "global_step": 278639, "epoch": 3357} {"train_loss": -24.364805221557617, "global_step": 278640, "epoch": 3357} {"train_loss": -24.94807243347168, "global_step": 278641, "epoch": 3357} {"train_loss": -24.880151748657227, "global_step": 278642, "epoch": 3357} {"train_loss": -24.890846252441406, "global_step": 278643, "epoch": 3357} {"train_loss": -25.173538208007812, "global_step": 278644, "epoch": 3357} {"train_loss": -24.95192527770996, "global_step": 278645, "epoch": 3357} {"train_loss": -25.091720581054688, "global_step": 278646, "epoch": 3357} {"train_loss": -24.775373458862305, "global_step": 278647, "epoch": 3357} {"train_loss": -24.859220504760742, "global_step": 278648, "epoch": 3357} {"train_loss": -25.52979850769043, "global_step": 278649, "epoch": 3357} {"train_loss": -25.46320915222168, "global_step": 278650, "epoch": 3357} {"train_loss": -25.09308624267578, "global_step": 278651, "epoch": 3357} {"train_loss": -24.84458351135254, "global_step": 278652, "epoch": 3357} {"train_loss": -25.174453735351562, "global_step": 278653, "epoch": 3357} {"train_loss": -25.544815063476562, "global_step": 278654, "epoch": 3357} {"train_loss": -25.36853790283203, "global_step": 278655, "epoch": 3357} {"train_loss": -25.123031616210938, "global_step": 278656, "epoch": 3357} {"train_loss": -25.00535011291504, "global_step": 278657, "epoch": 3357} {"train_loss": -25.54880142211914, "global_step": 278658, "epoch": 3357} {"train_loss": -25.259353637695312, "global_step": 278659, "epoch": 3357} {"train_loss": -25.0838623046875, "global_step": 278660, "epoch": 3357} {"train_loss": -25.248859405517578, "global_step": 278661, "epoch": 3357} {"train_loss": -25.2018985748291, "global_step": 278662, "epoch": 3357} {"train_loss": -25.64338493347168, "global_step": 278663, "epoch": 3357} {"train_loss": -25.212251663208008, "global_step": 278664, "epoch": 3357} {"train_loss": -25.52996063232422, "global_step": 278665, "epoch": 3357} {"train_loss": -25.128345489501953, "global_step": 278666, "epoch": 3357} {"train_loss": -25.23025131225586, "global_step": 278667, "epoch": 3357} {"train_loss": -25.408451080322266, "global_step": 278668, "epoch": 3357} {"train_loss": -25.23335838317871, "global_step": 278669, "epoch": 3357} {"train_loss": -25.266489028930664, "global_step": 278670, "epoch": 3357} {"train_loss": -25.1956844329834, "global_step": 278671, "epoch": 3357} {"train_loss": -25.6623592376709, "global_step": 278672, "epoch": 3357} {"train_loss": -25.55744171142578, "global_step": 278673, "epoch": 3357} {"train_loss": -25.24889373779297, "global_step": 278674, "epoch": 3357} {"train_loss": -25.17901039123535, "global_step": 278675, "epoch": 3357} {"train_loss": -25.47632598876953, "global_step": 278676, "epoch": 3357} {"train_loss": -25.51802635192871, "global_step": 278677, "epoch": 3357} {"train_loss": -25.5982666015625, "global_step": 278678, "epoch": 3357} {"train_loss": -25.842060089111328, "global_step": 278679, "epoch": 3357} {"train_loss": -25.662952423095703, "global_step": 278680, "epoch": 3357} {"train_loss": -25.42220115661621, "global_step": 278681, "epoch": 3357} {"train_loss": -25.611820220947266, "global_step": 278682, "epoch": 3357} {"train_loss": -25.56410789489746, "global_step": 278683, "epoch": 3357} {"train_loss": -25.785058975219727, "global_step": 278684, "epoch": 3357} {"train_loss": -25.67120933532715, "global_step": 278685, "epoch": 3357} {"train_loss": -25.44842529296875, "global_step": 278686, "epoch": 3357} {"train_loss": -25.589496612548828, "global_step": 278687, "epoch": 3357} {"train_loss": -25.30853843688965, "global_step": 278688, "epoch": 3357} {"train_loss": -25.58281898498535, "global_step": 278689, "epoch": 3357} {"train_loss": -25.50945472717285, "global_step": 278690, "epoch": 3357} {"train_loss": -25.262527465820312, "global_step": 278691, "epoch": 3357} {"train_loss": -25.081937789916992, "global_step": 278692, "epoch": 3357} {"train_loss": -25.432762145996094, "global_step": 278693, "epoch": 3357} {"train_loss": -25.173973083496094, "global_step": 278694, "epoch": 3357} {"train_loss": -25.431638717651367, "global_step": 278695, "epoch": 3357} {"train_loss": -25.408727645874023, "global_step": 278696, "epoch": 3357} {"train_loss": -25.5694637298584, "global_step": 278697, "epoch": 3357} {"train_loss": -25.537939071655273, "global_step": 278698, "epoch": 3357} {"train_loss": -25.5804386138916, "global_step": 278699, "epoch": 3357} {"train_loss": -25.908939361572266, "global_step": 278700, "epoch": 3357} {"train_loss": -25.351341247558594, "global_step": 278701, "epoch": 3357} {"train_loss": -25.54437828063965, "global_step": 278702, "epoch": 3357} {"train_loss": -25.394073486328125, "global_step": 278703, "epoch": 3357} {"train_loss": -25.36528205871582, "global_step": 278704, "epoch": 3357} {"train_loss": -25.509252548217773, "global_step": 278705, "epoch": 3357} {"train_loss": -25.39739227294922, "global_step": 278706, "epoch": 3357} {"train_loss": -25.182430267333984, "global_step": 278707, "epoch": 3357} {"train_loss": -25.391271591186523, "global_step": 278708, "epoch": 3357} {"train_loss": -24.97130012512207, "global_step": 278709, "epoch": 3357} {"train_loss": -24.437997817993164, "global_step": 278710, "epoch": 3357} {"train_loss": -24.207307815551758, "global_step": 278711, "epoch": 3357} {"train_loss": -24.970489501953125, "global_step": 278712, "epoch": 3357} {"train_loss": -25.29052247196795, "global_step": 278713, "epoch": 3357, "val_loss": 6969435.0} {"train_loss": -23.771692276000977, "global_step": 278714, "epoch": 3358} {"train_loss": -24.02898406982422, "global_step": 278715, "epoch": 3358} {"train_loss": -24.981369018554688, "global_step": 278716, "epoch": 3358} {"train_loss": -24.504762649536133, "global_step": 278717, "epoch": 3358} {"train_loss": -24.717267990112305, "global_step": 278718, "epoch": 3358} {"train_loss": -24.810958862304688, "global_step": 278719, "epoch": 3358} {"train_loss": -24.899274826049805, "global_step": 278720, "epoch": 3358} {"train_loss": -24.847490310668945, "global_step": 278721, "epoch": 3358} {"train_loss": -24.98131561279297, "global_step": 278722, "epoch": 3358} {"train_loss": -25.10270118713379, "global_step": 278723, "epoch": 3358} {"train_loss": -24.597990036010742, "global_step": 278724, "epoch": 3358} {"train_loss": -24.845932006835938, "global_step": 278725, "epoch": 3358} {"train_loss": -24.757217407226562, "global_step": 278726, "epoch": 3358} {"train_loss": -24.56914710998535, "global_step": 278727, "epoch": 3358} {"train_loss": -24.98261833190918, "global_step": 278728, "epoch": 3358} {"train_loss": -24.7799015045166, "global_step": 278729, "epoch": 3358} {"train_loss": -25.21371078491211, "global_step": 278730, "epoch": 3358} {"train_loss": -24.96526527404785, "global_step": 278731, "epoch": 3358} {"train_loss": -25.080745697021484, "global_step": 278732, "epoch": 3358} {"train_loss": -25.321165084838867, "global_step": 278733, "epoch": 3358} {"train_loss": -25.16901206970215, "global_step": 278734, "epoch": 3358} {"train_loss": -24.992441177368164, "global_step": 278735, "epoch": 3358} {"train_loss": -25.257898330688477, "global_step": 278736, "epoch": 3358} {"train_loss": -25.246999740600586, "global_step": 278737, "epoch": 3358} {"train_loss": -25.7039737701416, "global_step": 278738, "epoch": 3358} {"train_loss": -25.226219177246094, "global_step": 278739, "epoch": 3358} {"train_loss": -25.238662719726562, "global_step": 278740, "epoch": 3358} {"train_loss": -25.33271598815918, "global_step": 278741, "epoch": 3358} {"train_loss": -25.19947624206543, "global_step": 278742, "epoch": 3358} {"train_loss": -25.209035873413086, "global_step": 278743, "epoch": 3358} {"train_loss": -25.228971481323242, "global_step": 278744, "epoch": 3358} {"train_loss": -25.45218276977539, "global_step": 278745, "epoch": 3358} {"train_loss": -25.427555084228516, "global_step": 278746, "epoch": 3358} {"train_loss": -25.393508911132812, "global_step": 278747, "epoch": 3358} {"train_loss": -25.432519912719727, "global_step": 278748, "epoch": 3358} {"train_loss": -25.301212310791016, "global_step": 278749, "epoch": 3358} {"train_loss": -25.471891403198242, "global_step": 278750, "epoch": 3358} {"train_loss": -24.907251358032227, "global_step": 278751, "epoch": 3358} {"train_loss": -25.30936622619629, "global_step": 278752, "epoch": 3358} {"train_loss": -25.35951042175293, "global_step": 278753, "epoch": 3358} {"train_loss": -25.2257080078125, "global_step": 278754, "epoch": 3358} {"train_loss": -25.16400909423828, "global_step": 278755, "epoch": 3358} {"train_loss": -25.606313705444336, "global_step": 278756, "epoch": 3358} {"train_loss": -25.687265396118164, "global_step": 278757, "epoch": 3358} {"train_loss": -25.13336753845215, "global_step": 278758, "epoch": 3358} {"train_loss": -24.959501266479492, "global_step": 278759, "epoch": 3358} {"train_loss": -25.353254318237305, "global_step": 278760, "epoch": 3358} {"train_loss": -25.591552734375, "global_step": 278761, "epoch": 3358} {"train_loss": -25.47762107849121, "global_step": 278762, "epoch": 3358} {"train_loss": -25.48261833190918, "global_step": 278763, "epoch": 3358} {"train_loss": -25.32337760925293, "global_step": 278764, "epoch": 3358} {"train_loss": -25.434309005737305, "global_step": 278765, "epoch": 3358} {"train_loss": -25.464447021484375, "global_step": 278766, "epoch": 3358} {"train_loss": -25.656864166259766, "global_step": 278767, "epoch": 3358} {"train_loss": -25.282194137573242, "global_step": 278768, "epoch": 3358} {"train_loss": -25.827545166015625, "global_step": 278769, "epoch": 3358} {"train_loss": -25.62140464782715, "global_step": 278770, "epoch": 3358} {"train_loss": -25.624530792236328, "global_step": 278771, "epoch": 3358} {"train_loss": -25.472396850585938, "global_step": 278772, "epoch": 3358} {"train_loss": -25.30801773071289, "global_step": 278773, "epoch": 3358} {"train_loss": -25.59816551208496, "global_step": 278774, "epoch": 3358} {"train_loss": -25.397323608398438, "global_step": 278775, "epoch": 3358} {"train_loss": -25.3243350982666, "global_step": 278776, "epoch": 3358} {"train_loss": -25.21651268005371, "global_step": 278777, "epoch": 3358} {"train_loss": -25.485219955444336, "global_step": 278778, "epoch": 3358} {"train_loss": -25.539464950561523, "global_step": 278779, "epoch": 3358} {"train_loss": -25.164640426635742, "global_step": 278780, "epoch": 3358} {"train_loss": -25.38459587097168, "global_step": 278781, "epoch": 3358} {"train_loss": -25.11091423034668, "global_step": 278782, "epoch": 3358} {"train_loss": -25.245338439941406, "global_step": 278783, "epoch": 3358} {"train_loss": -25.184524536132812, "global_step": 278784, "epoch": 3358} {"train_loss": -25.349409103393555, "global_step": 278785, "epoch": 3358} {"train_loss": -25.304336547851562, "global_step": 278786, "epoch": 3358} {"train_loss": -25.481586456298828, "global_step": 278787, "epoch": 3358} {"train_loss": -25.215545654296875, "global_step": 278788, "epoch": 3358} {"train_loss": -25.55387306213379, "global_step": 278789, "epoch": 3358} {"train_loss": -25.46787452697754, "global_step": 278790, "epoch": 3358} {"train_loss": -25.304784774780273, "global_step": 278791, "epoch": 3358} {"train_loss": -25.787378311157227, "global_step": 278792, "epoch": 3358} {"train_loss": -25.575328826904297, "global_step": 278793, "epoch": 3358} {"train_loss": -25.578323364257812, "global_step": 278794, "epoch": 3358} {"train_loss": -25.63654136657715, "global_step": 278795, "epoch": 3358} {"train_loss": -25.219950848315136, "global_step": 278796, "epoch": 3358, "val_loss": 7083355.0} {"train_loss": -24.722415924072266, "global_step": 278797, "epoch": 3359} {"train_loss": -24.587465286254883, "global_step": 278798, "epoch": 3359} {"train_loss": -25.0042781829834, "global_step": 278799, "epoch": 3359} {"train_loss": -25.129560470581055, "global_step": 278800, "epoch": 3359} {"train_loss": -24.882780075073242, "global_step": 278801, "epoch": 3359} {"train_loss": -24.326330184936523, "global_step": 278802, "epoch": 3359} {"train_loss": -24.764976501464844, "global_step": 278803, "epoch": 3359} {"train_loss": -24.801742553710938, "global_step": 278804, "epoch": 3359} {"train_loss": -24.916112899780273, "global_step": 278805, "epoch": 3359} {"train_loss": -24.888891220092773, "global_step": 278806, "epoch": 3359} {"train_loss": -24.953908920288086, "global_step": 278807, "epoch": 3359} {"train_loss": -24.850248336791992, "global_step": 278808, "epoch": 3359} {"train_loss": -25.12227439880371, "global_step": 278809, "epoch": 3359} {"train_loss": -25.213621139526367, "global_step": 278810, "epoch": 3359} {"train_loss": -25.279172897338867, "global_step": 278811, "epoch": 3359} {"train_loss": -25.03412437438965, "global_step": 278812, "epoch": 3359} {"train_loss": -25.582273483276367, "global_step": 278813, "epoch": 3359} {"train_loss": -24.955120086669922, "global_step": 278814, "epoch": 3359} {"train_loss": -24.732799530029297, "global_step": 278815, "epoch": 3359} {"train_loss": -24.93939208984375, "global_step": 278816, "epoch": 3359} {"train_loss": -25.16966438293457, "global_step": 278817, "epoch": 3359} {"train_loss": -24.774198532104492, "global_step": 278818, "epoch": 3359} {"train_loss": -25.1603946685791, "global_step": 278819, "epoch": 3359} {"train_loss": -25.107507705688477, "global_step": 278820, "epoch": 3359} {"train_loss": -25.668903350830078, "global_step": 278821, "epoch": 3359} {"train_loss": -25.05779457092285, "global_step": 278822, "epoch": 3359} {"train_loss": -25.342655181884766, "global_step": 278823, "epoch": 3359} {"train_loss": -25.330244064331055, "global_step": 278824, "epoch": 3359} {"train_loss": -25.4021053314209, "global_step": 278825, "epoch": 3359} {"train_loss": -25.722326278686523, "global_step": 278826, "epoch": 3359} {"train_loss": -25.342374801635742, "global_step": 278827, "epoch": 3359} {"train_loss": -25.633508682250977, "global_step": 278828, "epoch": 3359} {"train_loss": -25.162282943725586, "global_step": 278829, "epoch": 3359} {"train_loss": -25.590309143066406, "global_step": 278830, "epoch": 3359} {"train_loss": -24.977651596069336, "global_step": 278831, "epoch": 3359} {"train_loss": -25.450483322143555, "global_step": 278832, "epoch": 3359} {"train_loss": -25.16254997253418, "global_step": 278833, "epoch": 3359} {"train_loss": -25.32771110534668, "global_step": 278834, "epoch": 3359} {"train_loss": -25.10702896118164, "global_step": 278835, "epoch": 3359} {"train_loss": -25.299701690673828, "global_step": 278836, "epoch": 3359} {"train_loss": -25.020559310913086, "global_step": 278837, "epoch": 3359} {"train_loss": -25.60171890258789, "global_step": 278838, "epoch": 3359} {"train_loss": -25.2890625, "global_step": 278839, "epoch": 3359} {"train_loss": -25.16103172302246, "global_step": 278840, "epoch": 3359} {"train_loss": -25.439199447631836, "global_step": 278841, "epoch": 3359} {"train_loss": -25.463394165039062, "global_step": 278842, "epoch": 3359} {"train_loss": -25.3277645111084, "global_step": 278843, "epoch": 3359} {"train_loss": -25.375226974487305, "global_step": 278844, "epoch": 3359} {"train_loss": -25.11566734313965, "global_step": 278845, "epoch": 3359} {"train_loss": -25.67217445373535, "global_step": 278846, "epoch": 3359} {"train_loss": -25.37080192565918, "global_step": 278847, "epoch": 3359} {"train_loss": -25.687347412109375, "global_step": 278848, "epoch": 3359} {"train_loss": -25.5580997467041, "global_step": 278849, "epoch": 3359} {"train_loss": -25.392963409423828, "global_step": 278850, "epoch": 3359} {"train_loss": -25.274084091186523, "global_step": 278851, "epoch": 3359} {"train_loss": -25.34445571899414, "global_step": 278852, "epoch": 3359} {"train_loss": -25.416946411132812, "global_step": 278853, "epoch": 3359} {"train_loss": -25.270618438720703, "global_step": 278854, "epoch": 3359} {"train_loss": -25.096569061279297, "global_step": 278855, "epoch": 3359} {"train_loss": -25.374359130859375, "global_step": 278856, "epoch": 3359} {"train_loss": -25.639387130737305, "global_step": 278857, "epoch": 3359} {"train_loss": -25.6402587890625, "global_step": 278858, "epoch": 3359} {"train_loss": -25.45206069946289, "global_step": 278859, "epoch": 3359} {"train_loss": -25.50520896911621, "global_step": 278860, "epoch": 3359} {"train_loss": -25.843000411987305, "global_step": 278861, "epoch": 3359} {"train_loss": -25.58047866821289, "global_step": 278862, "epoch": 3359} {"train_loss": -25.656646728515625, "global_step": 278863, "epoch": 3359} {"train_loss": -25.515981674194336, "global_step": 278864, "epoch": 3359} {"train_loss": -25.136112213134766, "global_step": 278865, "epoch": 3359} {"train_loss": -25.571496963500977, "global_step": 278866, "epoch": 3359} {"train_loss": -25.457345962524414, "global_step": 278867, "epoch": 3359} {"train_loss": -25.363115310668945, "global_step": 278868, "epoch": 3359} {"train_loss": -25.471240997314453, "global_step": 278869, "epoch": 3359} {"train_loss": -25.7657470703125, "global_step": 278870, "epoch": 3359} {"train_loss": -25.152368545532227, "global_step": 278871, "epoch": 3359} {"train_loss": -25.656421661376953, "global_step": 278872, "epoch": 3359} {"train_loss": -25.766834259033203, "global_step": 278873, "epoch": 3359} {"train_loss": -25.525121688842773, "global_step": 278874, "epoch": 3359} {"train_loss": -25.704267501831055, "global_step": 278875, "epoch": 3359} {"train_loss": -25.474544525146484, "global_step": 278876, "epoch": 3359} {"train_loss": -25.478734970092773, "global_step": 278877, "epoch": 3359} {"train_loss": -25.62662696838379, "global_step": 278878, "epoch": 3359} {"train_loss": -25.29905987934894, "global_step": 278879, "epoch": 3359, "val_loss": 7058232.0} {"train_loss": -25.10801124572754, "global_step": 278880, "epoch": 3360} {"train_loss": -24.968875885009766, "global_step": 278881, "epoch": 3360} {"train_loss": -24.729568481445312, "global_step": 278882, "epoch": 3360} {"train_loss": -24.97138786315918, "global_step": 278883, "epoch": 3360} {"train_loss": -24.622968673706055, "global_step": 278884, "epoch": 3360} {"train_loss": -25.40565299987793, "global_step": 278885, "epoch": 3360} {"train_loss": -25.170684814453125, "global_step": 278886, "epoch": 3360} {"train_loss": -24.454267501831055, "global_step": 278887, "epoch": 3360} {"train_loss": -24.9672908782959, "global_step": 278888, "epoch": 3360} {"train_loss": -25.05580711364746, "global_step": 278889, "epoch": 3360} {"train_loss": -24.926788330078125, "global_step": 278890, "epoch": 3360} {"train_loss": -25.065340042114258, "global_step": 278891, "epoch": 3360} {"train_loss": -25.122209548950195, "global_step": 278892, "epoch": 3360} {"train_loss": -25.241819381713867, "global_step": 278893, "epoch": 3360} {"train_loss": -25.44982147216797, "global_step": 278894, "epoch": 3360} {"train_loss": -25.274261474609375, "global_step": 278895, "epoch": 3360} {"train_loss": -25.16469383239746, "global_step": 278896, "epoch": 3360} {"train_loss": -25.223426818847656, "global_step": 278897, "epoch": 3360} {"train_loss": -24.95572853088379, "global_step": 278898, "epoch": 3360} {"train_loss": -25.09437370300293, "global_step": 278899, "epoch": 3360} {"train_loss": -25.12630844116211, "global_step": 278900, "epoch": 3360} {"train_loss": -24.870508193969727, "global_step": 278901, "epoch": 3360} {"train_loss": -25.008026123046875, "global_step": 278902, "epoch": 3360} {"train_loss": -25.56624412536621, "global_step": 278903, "epoch": 3360} {"train_loss": -25.086233139038086, "global_step": 278904, "epoch": 3360} {"train_loss": -25.590763092041016, "global_step": 278905, "epoch": 3360} {"train_loss": -25.200702667236328, "global_step": 278906, "epoch": 3360} {"train_loss": -25.353042602539062, "global_step": 278907, "epoch": 3360} {"train_loss": -25.448780059814453, "global_step": 278908, "epoch": 3360} {"train_loss": -25.518491744995117, "global_step": 278909, "epoch": 3360} {"train_loss": -25.39320945739746, "global_step": 278910, "epoch": 3360} {"train_loss": -25.235750198364258, "global_step": 278911, "epoch": 3360} {"train_loss": -25.503171920776367, "global_step": 278912, "epoch": 3360} {"train_loss": -25.176977157592773, "global_step": 278913, "epoch": 3360} {"train_loss": -25.243093490600586, "global_step": 278914, "epoch": 3360} {"train_loss": -25.31894874572754, "global_step": 278915, "epoch": 3360} {"train_loss": -25.6987247467041, "global_step": 278916, "epoch": 3360} {"train_loss": -25.413082122802734, "global_step": 278917, "epoch": 3360} {"train_loss": -25.209022521972656, "global_step": 278918, "epoch": 3360} {"train_loss": -25.445283889770508, "global_step": 278919, "epoch": 3360} {"train_loss": -25.475284576416016, "global_step": 278920, "epoch": 3360} {"train_loss": -25.645238876342773, "global_step": 278921, "epoch": 3360} {"train_loss": -25.332916259765625, "global_step": 278922, "epoch": 3360} {"train_loss": -25.446273803710938, "global_step": 278923, "epoch": 3360} {"train_loss": -25.26192283630371, "global_step": 278924, "epoch": 3360} {"train_loss": -25.069135665893555, "global_step": 278925, "epoch": 3360} {"train_loss": -25.555389404296875, "global_step": 278926, "epoch": 3360} {"train_loss": -25.473350524902344, "global_step": 278927, "epoch": 3360} {"train_loss": -25.45111656188965, "global_step": 278928, "epoch": 3360} {"train_loss": -25.489215850830078, "global_step": 278929, "epoch": 3360} {"train_loss": -25.448951721191406, "global_step": 278930, "epoch": 3360} {"train_loss": -25.723251342773438, "global_step": 278931, "epoch": 3360} {"train_loss": -25.511110305786133, "global_step": 278932, "epoch": 3360} {"train_loss": -25.48651695251465, "global_step": 278933, "epoch": 3360} {"train_loss": -25.120807647705078, "global_step": 278934, "epoch": 3360} {"train_loss": -25.716571807861328, "global_step": 278935, "epoch": 3360} {"train_loss": -25.109893798828125, "global_step": 278936, "epoch": 3360} {"train_loss": -25.572193145751953, "global_step": 278937, "epoch": 3360} {"train_loss": -25.534103393554688, "global_step": 278938, "epoch": 3360} {"train_loss": -25.10934066772461, "global_step": 278939, "epoch": 3360} {"train_loss": -25.216989517211914, "global_step": 278940, "epoch": 3360} {"train_loss": -25.435121536254883, "global_step": 278941, "epoch": 3360} {"train_loss": -25.65576171875, "global_step": 278942, "epoch": 3360} {"train_loss": -25.543752670288086, "global_step": 278943, "epoch": 3360} {"train_loss": -25.43304443359375, "global_step": 278944, "epoch": 3360} {"train_loss": -25.245670318603516, "global_step": 278945, "epoch": 3360} {"train_loss": -25.42720603942871, "global_step": 278946, "epoch": 3360} {"train_loss": -25.650659561157227, "global_step": 278947, "epoch": 3360} {"train_loss": -24.869171142578125, "global_step": 278948, "epoch": 3360} {"train_loss": -25.25460433959961, "global_step": 278949, "epoch": 3360} {"train_loss": -25.3011417388916, "global_step": 278950, "epoch": 3360} {"train_loss": -25.57035255432129, "global_step": 278951, "epoch": 3360} {"train_loss": -25.70635414123535, "global_step": 278952, "epoch": 3360} {"train_loss": -25.316211700439453, "global_step": 278953, "epoch": 3360} {"train_loss": -25.70122718811035, "global_step": 278954, "epoch": 3360} {"train_loss": -25.517072677612305, "global_step": 278955, "epoch": 3360} {"train_loss": -25.285127639770508, "global_step": 278956, "epoch": 3360} {"train_loss": -25.659284591674805, "global_step": 278957, "epoch": 3360} {"train_loss": -25.360132217407227, "global_step": 278958, "epoch": 3360} {"train_loss": -25.147262573242188, "global_step": 278959, "epoch": 3360} {"train_loss": -25.47694969177246, "global_step": 278960, "epoch": 3360} {"train_loss": -25.687788009643555, "global_step": 278961, "epoch": 3360} {"train_loss": -25.31151105122394, "global_step": 278962, "epoch": 3360, "val_loss": 7117316.0} {"train_loss": -24.69523048400879, "global_step": 278963, "epoch": 3361} {"train_loss": -24.024887084960938, "global_step": 278964, "epoch": 3361} {"train_loss": -23.089935302734375, "global_step": 278965, "epoch": 3361} {"train_loss": -24.59042739868164, "global_step": 278966, "epoch": 3361} {"train_loss": -25.174108505249023, "global_step": 278967, "epoch": 3361} {"train_loss": -24.648880004882812, "global_step": 278968, "epoch": 3361} {"train_loss": -24.400001525878906, "global_step": 278969, "epoch": 3361} {"train_loss": -25.200159072875977, "global_step": 278970, "epoch": 3361} {"train_loss": -25.01752281188965, "global_step": 278971, "epoch": 3361} {"train_loss": -24.919279098510742, "global_step": 278972, "epoch": 3361} {"train_loss": -25.100759506225586, "global_step": 278973, "epoch": 3361} {"train_loss": -24.77217674255371, "global_step": 278974, "epoch": 3361} {"train_loss": -24.760141372680664, "global_step": 278975, "epoch": 3361} {"train_loss": -24.740249633789062, "global_step": 278976, "epoch": 3361} {"train_loss": -25.21827507019043, "global_step": 278977, "epoch": 3361} {"train_loss": -24.775897979736328, "global_step": 278978, "epoch": 3361} {"train_loss": -25.063276290893555, "global_step": 278979, "epoch": 3361} {"train_loss": -25.086999893188477, "global_step": 278980, "epoch": 3361} {"train_loss": -25.03596305847168, "global_step": 278981, "epoch": 3361} {"train_loss": -25.11042022705078, "global_step": 278982, "epoch": 3361} {"train_loss": -25.174514770507812, "global_step": 278983, "epoch": 3361} {"train_loss": -24.59523582458496, "global_step": 278984, "epoch": 3361} {"train_loss": -25.389616012573242, "global_step": 278985, "epoch": 3361} {"train_loss": -25.14932632446289, "global_step": 278986, "epoch": 3361} {"train_loss": -25.126895904541016, "global_step": 278987, "epoch": 3361} {"train_loss": -25.28299903869629, "global_step": 278988, "epoch": 3361} {"train_loss": -25.348901748657227, "global_step": 278989, "epoch": 3361} {"train_loss": -25.623044967651367, "global_step": 278990, "epoch": 3361} {"train_loss": -25.287656784057617, "global_step": 278991, "epoch": 3361} {"train_loss": -25.30754280090332, "global_step": 278992, "epoch": 3361} {"train_loss": -25.43035888671875, "global_step": 278993, "epoch": 3361} {"train_loss": -25.36896324157715, "global_step": 278994, "epoch": 3361} {"train_loss": -25.173934936523438, "global_step": 278995, "epoch": 3361} {"train_loss": -25.275907516479492, "global_step": 278996, "epoch": 3361} {"train_loss": -25.42020034790039, "global_step": 278997, "epoch": 3361} {"train_loss": -25.404565811157227, "global_step": 278998, "epoch": 3361} {"train_loss": -25.336599349975586, "global_step": 278999, "epoch": 3361} {"train_loss": -25.371871948242188, "global_step": 279000, "epoch": 3361} {"train_loss": -25.547239303588867, "global_step": 279001, "epoch": 3361} {"train_loss": -25.42707633972168, "global_step": 279002, "epoch": 3361} {"train_loss": -24.772422790527344, "global_step": 279003, "epoch": 3361} {"train_loss": -25.52859878540039, "global_step": 279004, "epoch": 3361} {"train_loss": -25.689542770385742, "global_step": 279005, "epoch": 3361} {"train_loss": -25.074527740478516, "global_step": 279006, "epoch": 3361} {"train_loss": -25.13446044921875, "global_step": 279007, "epoch": 3361} {"train_loss": -25.314510345458984, "global_step": 279008, "epoch": 3361} {"train_loss": -25.284255981445312, "global_step": 279009, "epoch": 3361} {"train_loss": -25.633047103881836, "global_step": 279010, "epoch": 3361} {"train_loss": -25.6267032623291, "global_step": 279011, "epoch": 3361} {"train_loss": -25.5223445892334, "global_step": 279012, "epoch": 3361} {"train_loss": -25.56251335144043, "global_step": 279013, "epoch": 3361} {"train_loss": -25.50381851196289, "global_step": 279014, "epoch": 3361} {"train_loss": -25.653345108032227, "global_step": 279015, "epoch": 3361} {"train_loss": -25.845417022705078, "global_step": 279016, "epoch": 3361} {"train_loss": -25.585834503173828, "global_step": 279017, "epoch": 3361} {"train_loss": -25.360876083374023, "global_step": 279018, "epoch": 3361} {"train_loss": -25.476285934448242, "global_step": 279019, "epoch": 3361} {"train_loss": -25.589147567749023, "global_step": 279020, "epoch": 3361} {"train_loss": -25.231630325317383, "global_step": 279021, "epoch": 3361} {"train_loss": -25.442907333374023, "global_step": 279022, "epoch": 3361} {"train_loss": -25.276968002319336, "global_step": 279023, "epoch": 3361} {"train_loss": -25.489160537719727, "global_step": 279024, "epoch": 3361} {"train_loss": -25.569028854370117, "global_step": 279025, "epoch": 3361} {"train_loss": -25.51632308959961, "global_step": 279026, "epoch": 3361} {"train_loss": -25.36246681213379, "global_step": 279027, "epoch": 3361} {"train_loss": -25.39906883239746, "global_step": 279028, "epoch": 3361} {"train_loss": -25.350128173828125, "global_step": 279029, "epoch": 3361} {"train_loss": -25.26742935180664, "global_step": 279030, "epoch": 3361} {"train_loss": -25.181833267211914, "global_step": 279031, "epoch": 3361} {"train_loss": -24.78464126586914, "global_step": 279032, "epoch": 3361} {"train_loss": -25.479658126831055, "global_step": 279033, "epoch": 3361} {"train_loss": -25.129371643066406, "global_step": 279034, "epoch": 3361} {"train_loss": -25.014606475830078, "global_step": 279035, "epoch": 3361} {"train_loss": -25.08330726623535, "global_step": 279036, "epoch": 3361} {"train_loss": -25.21642303466797, "global_step": 279037, "epoch": 3361} {"train_loss": -25.34882926940918, "global_step": 279038, "epoch": 3361} {"train_loss": -25.172073364257812, "global_step": 279039, "epoch": 3361} {"train_loss": -25.280303955078125, "global_step": 279040, "epoch": 3361} {"train_loss": -25.200361251831055, "global_step": 279041, "epoch": 3361} {"train_loss": -25.15874481201172, "global_step": 279042, "epoch": 3361} {"train_loss": -25.132497787475586, "global_step": 279043, "epoch": 3361} {"train_loss": -25.321104049682617, "global_step": 279044, "epoch": 3361} {"train_loss": -25.20736616203584, "global_step": 279045, "epoch": 3361, "val_loss": 7092340.0} {"train_loss": -24.687549591064453, "global_step": 279046, "epoch": 3362} {"train_loss": -24.60393714904785, "global_step": 279047, "epoch": 3362} {"train_loss": -24.917978286743164, "global_step": 279048, "epoch": 3362} {"train_loss": -24.655044555664062, "global_step": 279049, "epoch": 3362} {"train_loss": -24.730335235595703, "global_step": 279050, "epoch": 3362} {"train_loss": -24.820480346679688, "global_step": 279051, "epoch": 3362} {"train_loss": -25.107275009155273, "global_step": 279052, "epoch": 3362} {"train_loss": -25.116350173950195, "global_step": 279053, "epoch": 3362} {"train_loss": -25.102102279663086, "global_step": 279054, "epoch": 3362} {"train_loss": -25.063657760620117, "global_step": 279055, "epoch": 3362} {"train_loss": -25.074914932250977, "global_step": 279056, "epoch": 3362} {"train_loss": -25.07328224182129, "global_step": 279057, "epoch": 3362} {"train_loss": -25.012414932250977, "global_step": 279058, "epoch": 3362} {"train_loss": -25.288700103759766, "global_step": 279059, "epoch": 3362} {"train_loss": -25.282882690429688, "global_step": 279060, "epoch": 3362} {"train_loss": -25.192907333374023, "global_step": 279061, "epoch": 3362} {"train_loss": -25.48317527770996, "global_step": 279062, "epoch": 3362} {"train_loss": -25.51053237915039, "global_step": 279063, "epoch": 3362} {"train_loss": -25.15542984008789, "global_step": 279064, "epoch": 3362} {"train_loss": -25.25457191467285, "global_step": 279065, "epoch": 3362} {"train_loss": -25.26041030883789, "global_step": 279066, "epoch": 3362} {"train_loss": -25.06278419494629, "global_step": 279067, "epoch": 3362} {"train_loss": -25.8724422454834, "global_step": 279068, "epoch": 3362} {"train_loss": -25.526811599731445, "global_step": 279069, "epoch": 3362} {"train_loss": -25.118776321411133, "global_step": 279070, "epoch": 3362} {"train_loss": -25.373294830322266, "global_step": 279071, "epoch": 3362} {"train_loss": -25.652551651000977, "global_step": 279072, "epoch": 3362} {"train_loss": -25.36616325378418, "global_step": 279073, "epoch": 3362} {"train_loss": -25.71339225769043, "global_step": 279074, "epoch": 3362} {"train_loss": -25.80025291442871, "global_step": 279075, "epoch": 3362} {"train_loss": -25.581857681274414, "global_step": 279076, "epoch": 3362} {"train_loss": -25.2718448638916, "global_step": 279077, "epoch": 3362} {"train_loss": -25.47477149963379, "global_step": 279078, "epoch": 3362} {"train_loss": -25.320905685424805, "global_step": 279079, "epoch": 3362} {"train_loss": -25.447446823120117, "global_step": 279080, "epoch": 3362} {"train_loss": -25.748647689819336, "global_step": 279081, "epoch": 3362} {"train_loss": -25.574237823486328, "global_step": 279082, "epoch": 3362} {"train_loss": -25.275310516357422, "global_step": 279083, "epoch": 3362} {"train_loss": -25.514432907104492, "global_step": 279084, "epoch": 3362} {"train_loss": -25.438453674316406, "global_step": 279085, "epoch": 3362} {"train_loss": -25.687158584594727, "global_step": 279086, "epoch": 3362} {"train_loss": -25.518518447875977, "global_step": 279087, "epoch": 3362} {"train_loss": -25.28876304626465, "global_step": 279088, "epoch": 3362} {"train_loss": -25.340909957885742, "global_step": 279089, "epoch": 3362} {"train_loss": -25.52071189880371, "global_step": 279090, "epoch": 3362} {"train_loss": -25.397563934326172, "global_step": 279091, "epoch": 3362} {"train_loss": -24.710851669311523, "global_step": 279092, "epoch": 3362} {"train_loss": -24.52202033996582, "global_step": 279093, "epoch": 3362} {"train_loss": -24.403303146362305, "global_step": 279094, "epoch": 3362} {"train_loss": -25.037199020385742, "global_step": 279095, "epoch": 3362} {"train_loss": -25.6729793548584, "global_step": 279096, "epoch": 3362} {"train_loss": -25.191192626953125, "global_step": 279097, "epoch": 3362} {"train_loss": -25.669336318969727, "global_step": 279098, "epoch": 3362} {"train_loss": -25.077518463134766, "global_step": 279099, "epoch": 3362} {"train_loss": -25.118619918823242, "global_step": 279100, "epoch": 3362} {"train_loss": -25.249427795410156, "global_step": 279101, "epoch": 3362} {"train_loss": -25.4935245513916, "global_step": 279102, "epoch": 3362} {"train_loss": -25.222593307495117, "global_step": 279103, "epoch": 3362} {"train_loss": -25.101232528686523, "global_step": 279104, "epoch": 3362} {"train_loss": -25.226816177368164, "global_step": 279105, "epoch": 3362} {"train_loss": -25.495670318603516, "global_step": 279106, "epoch": 3362} {"train_loss": -25.492612838745117, "global_step": 279107, "epoch": 3362} {"train_loss": -25.383071899414062, "global_step": 279108, "epoch": 3362} {"train_loss": -25.780038833618164, "global_step": 279109, "epoch": 3362} {"train_loss": -25.662506103515625, "global_step": 279110, "epoch": 3362} {"train_loss": -25.548429489135742, "global_step": 279111, "epoch": 3362} {"train_loss": -25.617694854736328, "global_step": 279112, "epoch": 3362} {"train_loss": -25.59438705444336, "global_step": 279113, "epoch": 3362} {"train_loss": -25.276044845581055, "global_step": 279114, "epoch": 3362} {"train_loss": -25.324979782104492, "global_step": 279115, "epoch": 3362} {"train_loss": -25.557641983032227, "global_step": 279116, "epoch": 3362} {"train_loss": -25.511066436767578, "global_step": 279117, "epoch": 3362} {"train_loss": -25.788724899291992, "global_step": 279118, "epoch": 3362} {"train_loss": -25.58675193786621, "global_step": 279119, "epoch": 3362} {"train_loss": -25.489803314208984, "global_step": 279120, "epoch": 3362} {"train_loss": -25.83271598815918, "global_step": 279121, "epoch": 3362} {"train_loss": -25.41708755493164, "global_step": 279122, "epoch": 3362} {"train_loss": -24.878204345703125, "global_step": 279123, "epoch": 3362} {"train_loss": -25.596927642822266, "global_step": 279124, "epoch": 3362} {"train_loss": -25.321435928344727, "global_step": 279125, "epoch": 3362} {"train_loss": -25.335552215576172, "global_step": 279126, "epoch": 3362} {"train_loss": -25.079809188842773, "global_step": 279127, "epoch": 3362} {"train_loss": -25.28638159510601, "global_step": 279128, "epoch": 3362, "val_loss": 7120558.0} {"train_loss": -25.10553741455078, "global_step": 279129, "epoch": 3363} {"train_loss": -24.70722007751465, "global_step": 279130, "epoch": 3363} {"train_loss": -24.756309509277344, "global_step": 279131, "epoch": 3363} {"train_loss": -24.840206146240234, "global_step": 279132, "epoch": 3363} {"train_loss": -24.784080505371094, "global_step": 279133, "epoch": 3363} {"train_loss": -24.619314193725586, "global_step": 279134, "epoch": 3363} {"train_loss": -24.764362335205078, "global_step": 279135, "epoch": 3363} {"train_loss": -25.162582397460938, "global_step": 279136, "epoch": 3363} {"train_loss": -24.560083389282227, "global_step": 279137, "epoch": 3363} {"train_loss": -24.624958038330078, "global_step": 279138, "epoch": 3363} {"train_loss": -24.713130950927734, "global_step": 279139, "epoch": 3363} {"train_loss": -24.953048706054688, "global_step": 279140, "epoch": 3363} {"train_loss": -25.315977096557617, "global_step": 279141, "epoch": 3363} {"train_loss": -25.153181076049805, "global_step": 279142, "epoch": 3363} {"train_loss": -24.815885543823242, "global_step": 279143, "epoch": 3363} {"train_loss": -25.13986587524414, "global_step": 279144, "epoch": 3363} {"train_loss": -24.928674697875977, "global_step": 279145, "epoch": 3363} {"train_loss": -24.96529197692871, "global_step": 279146, "epoch": 3363} {"train_loss": -25.210927963256836, "global_step": 279147, "epoch": 3363} {"train_loss": -25.659997940063477, "global_step": 279148, "epoch": 3363} {"train_loss": -25.350675582885742, "global_step": 279149, "epoch": 3363} {"train_loss": -24.930875778198242, "global_step": 279150, "epoch": 3363} {"train_loss": -25.1193790435791, "global_step": 279151, "epoch": 3363} {"train_loss": -25.129962921142578, "global_step": 279152, "epoch": 3363} {"train_loss": -25.49283790588379, "global_step": 279153, "epoch": 3363} {"train_loss": -25.383092880249023, "global_step": 279154, "epoch": 3363} {"train_loss": -25.37972068786621, "global_step": 279155, "epoch": 3363} {"train_loss": -25.169292449951172, "global_step": 279156, "epoch": 3363} {"train_loss": -25.512479782104492, "global_step": 279157, "epoch": 3363} {"train_loss": -25.336912155151367, "global_step": 279158, "epoch": 3363} {"train_loss": -25.425378799438477, "global_step": 279159, "epoch": 3363} {"train_loss": -25.464611053466797, "global_step": 279160, "epoch": 3363} {"train_loss": -25.391820907592773, "global_step": 279161, "epoch": 3363} {"train_loss": -25.609479904174805, "global_step": 279162, "epoch": 3363} {"train_loss": -25.345426559448242, "global_step": 279163, "epoch": 3363} {"train_loss": -25.29897117614746, "global_step": 279164, "epoch": 3363} {"train_loss": -25.47674560546875, "global_step": 279165, "epoch": 3363} {"train_loss": -25.35677719116211, "global_step": 279166, "epoch": 3363} {"train_loss": -25.419031143188477, "global_step": 279167, "epoch": 3363} {"train_loss": -25.084747314453125, "global_step": 279168, "epoch": 3363} {"train_loss": -25.416948318481445, "global_step": 279169, "epoch": 3363} {"train_loss": -25.294466018676758, "global_step": 279170, "epoch": 3363} {"train_loss": -25.434743881225586, "global_step": 279171, "epoch": 3363} {"train_loss": -25.05879783630371, "global_step": 279172, "epoch": 3363} {"train_loss": -25.528564453125, "global_step": 279173, "epoch": 3363} {"train_loss": -25.380491256713867, "global_step": 279174, "epoch": 3363} {"train_loss": -25.634057998657227, "global_step": 279175, "epoch": 3363} {"train_loss": -25.308494567871094, "global_step": 279176, "epoch": 3363} {"train_loss": -25.20629119873047, "global_step": 279177, "epoch": 3363} {"train_loss": -25.425199508666992, "global_step": 279178, "epoch": 3363} {"train_loss": -25.47342300415039, "global_step": 279179, "epoch": 3363} {"train_loss": -25.213491439819336, "global_step": 279180, "epoch": 3363} {"train_loss": -25.42942237854004, "global_step": 279181, "epoch": 3363} {"train_loss": -25.453458786010742, "global_step": 279182, "epoch": 3363} {"train_loss": -24.99155616760254, "global_step": 279183, "epoch": 3363} {"train_loss": -25.30632972717285, "global_step": 279184, "epoch": 3363} {"train_loss": -25.483198165893555, "global_step": 279185, "epoch": 3363} {"train_loss": -25.49698257446289, "global_step": 279186, "epoch": 3363} {"train_loss": -25.19317054748535, "global_step": 279187, "epoch": 3363} {"train_loss": -25.23383903503418, "global_step": 279188, "epoch": 3363} {"train_loss": -25.36885643005371, "global_step": 279189, "epoch": 3363} {"train_loss": -25.510028839111328, "global_step": 279190, "epoch": 3363} {"train_loss": -25.0844783782959, "global_step": 279191, "epoch": 3363} {"train_loss": -25.1331729888916, "global_step": 279192, "epoch": 3363} {"train_loss": -25.259061813354492, "global_step": 279193, "epoch": 3363} {"train_loss": -24.814605712890625, "global_step": 279194, "epoch": 3363} {"train_loss": -25.680042266845703, "global_step": 279195, "epoch": 3363} {"train_loss": -25.44329833984375, "global_step": 279196, "epoch": 3363} {"train_loss": -25.653793334960938, "global_step": 279197, "epoch": 3363} {"train_loss": -25.179248809814453, "global_step": 279198, "epoch": 3363} {"train_loss": -25.670461654663086, "global_step": 279199, "epoch": 3363} {"train_loss": -25.303945541381836, "global_step": 279200, "epoch": 3363} {"train_loss": -25.421300888061523, "global_step": 279201, "epoch": 3363} {"train_loss": -25.11642837524414, "global_step": 279202, "epoch": 3363} {"train_loss": -25.635761260986328, "global_step": 279203, "epoch": 3363} {"train_loss": -25.3466854095459, "global_step": 279204, "epoch": 3363} {"train_loss": -25.43260955810547, "global_step": 279205, "epoch": 3363} {"train_loss": -25.578624725341797, "global_step": 279206, "epoch": 3363} {"train_loss": -25.688980102539062, "global_step": 279207, "epoch": 3363} {"train_loss": -25.681745529174805, "global_step": 279208, "epoch": 3363} {"train_loss": -25.25807762145996, "global_step": 279209, "epoch": 3363} {"train_loss": -25.35219383239746, "global_step": 279210, "epoch": 3363} {"train_loss": -25.257144973938722, "global_step": 279211, "epoch": 3363, "val_loss": 6960151.0} {"train_loss": -24.79936981201172, "global_step": 279212, "epoch": 3364} {"train_loss": -24.44130516052246, "global_step": 279213, "epoch": 3364} {"train_loss": -24.4676570892334, "global_step": 279214, "epoch": 3364} {"train_loss": -24.67325782775879, "global_step": 279215, "epoch": 3364} {"train_loss": -24.740449905395508, "global_step": 279216, "epoch": 3364} {"train_loss": -24.60531997680664, "global_step": 279217, "epoch": 3364} {"train_loss": -24.886442184448242, "global_step": 279218, "epoch": 3364} {"train_loss": -24.522653579711914, "global_step": 279219, "epoch": 3364} {"train_loss": -24.67299461364746, "global_step": 279220, "epoch": 3364} {"train_loss": -24.969823837280273, "global_step": 279221, "epoch": 3364} {"train_loss": -25.496057510375977, "global_step": 279222, "epoch": 3364} {"train_loss": -24.898740768432617, "global_step": 279223, "epoch": 3364} {"train_loss": -24.925739288330078, "global_step": 279224, "epoch": 3364} {"train_loss": -24.93989372253418, "global_step": 279225, "epoch": 3364} {"train_loss": -24.974149703979492, "global_step": 279226, "epoch": 3364} {"train_loss": -24.994237899780273, "global_step": 279227, "epoch": 3364} {"train_loss": -25.09556770324707, "global_step": 279228, "epoch": 3364} {"train_loss": -25.11691665649414, "global_step": 279229, "epoch": 3364} {"train_loss": -24.805410385131836, "global_step": 279230, "epoch": 3364} {"train_loss": -25.041208267211914, "global_step": 279231, "epoch": 3364} {"train_loss": -25.498735427856445, "global_step": 279232, "epoch": 3364} {"train_loss": -24.843477249145508, "global_step": 279233, "epoch": 3364} {"train_loss": -25.227554321289062, "global_step": 279234, "epoch": 3364} {"train_loss": -25.189453125, "global_step": 279235, "epoch": 3364} {"train_loss": -25.080524444580078, "global_step": 279236, "epoch": 3364} {"train_loss": -25.6666202545166, "global_step": 279237, "epoch": 3364} {"train_loss": -25.427289962768555, "global_step": 279238, "epoch": 3364} {"train_loss": -25.250499725341797, "global_step": 279239, "epoch": 3364} {"train_loss": -25.44854736328125, "global_step": 279240, "epoch": 3364} {"train_loss": -25.367643356323242, "global_step": 279241, "epoch": 3364} {"train_loss": -25.48004150390625, "global_step": 279242, "epoch": 3364} {"train_loss": -25.268136978149414, "global_step": 279243, "epoch": 3364} {"train_loss": -25.13727378845215, "global_step": 279244, "epoch": 3364} {"train_loss": -25.014392852783203, "global_step": 279245, "epoch": 3364} {"train_loss": -25.398326873779297, "global_step": 279246, "epoch": 3364} {"train_loss": -25.24120330810547, "global_step": 279247, "epoch": 3364} {"train_loss": -25.224157333374023, "global_step": 279248, "epoch": 3364} {"train_loss": -25.296998977661133, "global_step": 279249, "epoch": 3364} {"train_loss": -25.100614547729492, "global_step": 279250, "epoch": 3364} {"train_loss": -25.27591896057129, "global_step": 279251, "epoch": 3364} {"train_loss": -25.505842208862305, "global_step": 279252, "epoch": 3364} {"train_loss": -25.595233917236328, "global_step": 279253, "epoch": 3364} {"train_loss": -25.8126163482666, "global_step": 279254, "epoch": 3364} {"train_loss": -25.3033447265625, "global_step": 279255, "epoch": 3364} {"train_loss": -25.36106300354004, "global_step": 279256, "epoch": 3364} {"train_loss": -25.115598678588867, "global_step": 279257, "epoch": 3364} {"train_loss": -25.455320358276367, "global_step": 279258, "epoch": 3364} {"train_loss": -25.785079956054688, "global_step": 279259, "epoch": 3364} {"train_loss": -25.500144958496094, "global_step": 279260, "epoch": 3364} {"train_loss": -25.47844886779785, "global_step": 279261, "epoch": 3364} {"train_loss": -25.64404296875, "global_step": 279262, "epoch": 3364} {"train_loss": -25.566177368164062, "global_step": 279263, "epoch": 3364} {"train_loss": -24.977609634399414, "global_step": 279264, "epoch": 3364} {"train_loss": -24.989986419677734, "global_step": 279265, "epoch": 3364} {"train_loss": -25.283329010009766, "global_step": 279266, "epoch": 3364} {"train_loss": -25.49905776977539, "global_step": 279267, "epoch": 3364} {"train_loss": -25.0716495513916, "global_step": 279268, "epoch": 3364} {"train_loss": -25.53197479248047, "global_step": 279269, "epoch": 3364} {"train_loss": -25.3454647064209, "global_step": 279270, "epoch": 3364} {"train_loss": -25.714832305908203, "global_step": 279271, "epoch": 3364} {"train_loss": -25.01244354248047, "global_step": 279272, "epoch": 3364} {"train_loss": -25.156970977783203, "global_step": 279273, "epoch": 3364} {"train_loss": -25.25218963623047, "global_step": 279274, "epoch": 3364} {"train_loss": -25.05629539489746, "global_step": 279275, "epoch": 3364} {"train_loss": -25.531845092773438, "global_step": 279276, "epoch": 3364} {"train_loss": -24.833242416381836, "global_step": 279277, "epoch": 3364} {"train_loss": -25.433256149291992, "global_step": 279278, "epoch": 3364} {"train_loss": -25.266708374023438, "global_step": 279279, "epoch": 3364} {"train_loss": -25.63624382019043, "global_step": 279280, "epoch": 3364} {"train_loss": -25.49432373046875, "global_step": 279281, "epoch": 3364} {"train_loss": -25.158283233642578, "global_step": 279282, "epoch": 3364} {"train_loss": -25.261497497558594, "global_step": 279283, "epoch": 3364} {"train_loss": -25.23953628540039, "global_step": 279284, "epoch": 3364} {"train_loss": -25.601621627807617, "global_step": 279285, "epoch": 3364} {"train_loss": -25.599849700927734, "global_step": 279286, "epoch": 3364} {"train_loss": -25.12151527404785, "global_step": 279287, "epoch": 3364} {"train_loss": -25.457523345947266, "global_step": 279288, "epoch": 3364} {"train_loss": -24.941205978393555, "global_step": 279289, "epoch": 3364} {"train_loss": -25.439130783081055, "global_step": 279290, "epoch": 3364} {"train_loss": -25.171432495117188, "global_step": 279291, "epoch": 3364} {"train_loss": -25.46100425720215, "global_step": 279292, "epoch": 3364} {"train_loss": -25.6123104095459, "global_step": 279293, "epoch": 3364} {"train_loss": -25.22074083535068, "global_step": 279294, "epoch": 3364, "val_loss": 7002548.0} {"train_loss": -25.442764282226562, "global_step": 279295, "epoch": 3365} {"train_loss": -25.670217514038086, "global_step": 279296, "epoch": 3365} {"train_loss": -25.18892478942871, "global_step": 279297, "epoch": 3365} {"train_loss": -24.827207565307617, "global_step": 279298, "epoch": 3365} {"train_loss": -25.426176071166992, "global_step": 279299, "epoch": 3365} {"train_loss": -25.400739669799805, "global_step": 279300, "epoch": 3365} {"train_loss": -25.45912742614746, "global_step": 279301, "epoch": 3365} {"train_loss": -24.975238800048828, "global_step": 279302, "epoch": 3365} {"train_loss": -25.270030975341797, "global_step": 279303, "epoch": 3365} {"train_loss": -25.39512062072754, "global_step": 279304, "epoch": 3365} {"train_loss": -25.03329849243164, "global_step": 279305, "epoch": 3365} {"train_loss": -24.9917049407959, "global_step": 279306, "epoch": 3365} {"train_loss": -25.57459259033203, "global_step": 279307, "epoch": 3365} {"train_loss": -25.4580078125, "global_step": 279308, "epoch": 3365} {"train_loss": -25.158771514892578, "global_step": 279309, "epoch": 3365} {"train_loss": -25.551259994506836, "global_step": 279310, "epoch": 3365} {"train_loss": -25.34227752685547, "global_step": 279311, "epoch": 3365} {"train_loss": -25.030292510986328, "global_step": 279312, "epoch": 3365} {"train_loss": -25.289968490600586, "global_step": 279313, "epoch": 3365} {"train_loss": -25.360321044921875, "global_step": 279314, "epoch": 3365} {"train_loss": -25.620080947875977, "global_step": 279315, "epoch": 3365} {"train_loss": -24.985984802246094, "global_step": 279316, "epoch": 3365} {"train_loss": -25.591400146484375, "global_step": 279317, "epoch": 3365} {"train_loss": -25.174863815307617, "global_step": 279318, "epoch": 3365} {"train_loss": -25.00731086730957, "global_step": 279319, "epoch": 3365} {"train_loss": -25.703760147094727, "global_step": 279320, "epoch": 3365} {"train_loss": -25.662891387939453, "global_step": 279321, "epoch": 3365} {"train_loss": -25.32670783996582, "global_step": 279322, "epoch": 3365} {"train_loss": -25.489408493041992, "global_step": 279323, "epoch": 3365} {"train_loss": -25.567441940307617, "global_step": 279324, "epoch": 3365} {"train_loss": -25.54737663269043, "global_step": 279325, "epoch": 3365} {"train_loss": -25.69916343688965, "global_step": 279326, "epoch": 3365} {"train_loss": -25.429372787475586, "global_step": 279327, "epoch": 3365} {"train_loss": -25.466552734375, "global_step": 279328, "epoch": 3365} {"train_loss": -25.577289581298828, "global_step": 279329, "epoch": 3365} {"train_loss": -25.468900680541992, "global_step": 279330, "epoch": 3365} {"train_loss": -25.301651000976562, "global_step": 279331, "epoch": 3365} {"train_loss": -25.39086151123047, "global_step": 279332, "epoch": 3365} {"train_loss": -25.529691696166992, "global_step": 279333, "epoch": 3365} {"train_loss": -25.130325317382812, "global_step": 279334, "epoch": 3365} {"train_loss": -25.633310317993164, "global_step": 279335, "epoch": 3365} {"train_loss": -25.145092010498047, "global_step": 279336, "epoch": 3365} {"train_loss": -25.447996139526367, "global_step": 279337, "epoch": 3365} {"train_loss": -25.420923233032227, "global_step": 279338, "epoch": 3365} {"train_loss": -25.377029418945312, "global_step": 279339, "epoch": 3365} {"train_loss": -25.2823543548584, "global_step": 279340, "epoch": 3365} {"train_loss": -25.0598201751709, "global_step": 279341, "epoch": 3365} {"train_loss": -25.135923385620117, "global_step": 279342, "epoch": 3365} {"train_loss": -25.666152954101562, "global_step": 279343, "epoch": 3365} {"train_loss": -25.605661392211914, "global_step": 279344, "epoch": 3365} {"train_loss": -25.380430221557617, "global_step": 279345, "epoch": 3365} {"train_loss": -25.399343490600586, "global_step": 279346, "epoch": 3365} {"train_loss": -25.34479331970215, "global_step": 279347, "epoch": 3365} {"train_loss": -25.689496994018555, "global_step": 279348, "epoch": 3365} {"train_loss": -24.896244049072266, "global_step": 279349, "epoch": 3365} {"train_loss": -25.071060180664062, "global_step": 279350, "epoch": 3365} {"train_loss": -25.641143798828125, "global_step": 279351, "epoch": 3365} {"train_loss": -25.273948669433594, "global_step": 279352, "epoch": 3365} {"train_loss": -25.153432846069336, "global_step": 279353, "epoch": 3365} {"train_loss": -25.213912963867188, "global_step": 279354, "epoch": 3365} {"train_loss": -24.76340103149414, "global_step": 279355, "epoch": 3365} {"train_loss": -25.011178970336914, "global_step": 279356, "epoch": 3365} {"train_loss": -25.303983688354492, "global_step": 279357, "epoch": 3365} {"train_loss": -24.98089599609375, "global_step": 279358, "epoch": 3365} {"train_loss": -25.15500259399414, "global_step": 279359, "epoch": 3365} {"train_loss": -25.217802047729492, "global_step": 279360, "epoch": 3365} {"train_loss": -25.470932006835938, "global_step": 279361, "epoch": 3365} {"train_loss": -25.583332061767578, "global_step": 279362, "epoch": 3365} {"train_loss": -25.57386589050293, "global_step": 279363, "epoch": 3365} {"train_loss": -25.0694522857666, "global_step": 279364, "epoch": 3365} {"train_loss": -25.490264892578125, "global_step": 279365, "epoch": 3365} {"train_loss": -25.290172576904297, "global_step": 279366, "epoch": 3365} {"train_loss": -25.63960075378418, "global_step": 279367, "epoch": 3365} {"train_loss": -25.310691833496094, "global_step": 279368, "epoch": 3365} {"train_loss": -25.471548080444336, "global_step": 279369, "epoch": 3365} {"train_loss": -25.65386390686035, "global_step": 279370, "epoch": 3365} {"train_loss": -25.325407028198242, "global_step": 279371, "epoch": 3365} {"train_loss": -25.716156005859375, "global_step": 279372, "epoch": 3365} {"train_loss": -25.528749465942383, "global_step": 279373, "epoch": 3365} {"train_loss": -25.539567947387695, "global_step": 279374, "epoch": 3365} {"train_loss": -25.217361450195312, "global_step": 279375, "epoch": 3365} {"train_loss": -25.662372589111328, "global_step": 279376, "epoch": 3365} {"train_loss": -25.355765836784638, "global_step": 279377, "epoch": 3365, "val_loss": 7123291.0} {"train_loss": -25.34322166442871, "global_step": 279378, "epoch": 3366} {"train_loss": -24.924591064453125, "global_step": 279379, "epoch": 3366} {"train_loss": -25.211700439453125, "global_step": 279380, "epoch": 3366} {"train_loss": -25.458324432373047, "global_step": 279381, "epoch": 3366} {"train_loss": -24.717084884643555, "global_step": 279382, "epoch": 3366} {"train_loss": -24.661834716796875, "global_step": 279383, "epoch": 3366} {"train_loss": -25.34271812438965, "global_step": 279384, "epoch": 3366} {"train_loss": -25.228900909423828, "global_step": 279385, "epoch": 3366} {"train_loss": -25.05036163330078, "global_step": 279386, "epoch": 3366} {"train_loss": -25.38947296142578, "global_step": 279387, "epoch": 3366} {"train_loss": -25.411865234375, "global_step": 279388, "epoch": 3366} {"train_loss": -25.060142517089844, "global_step": 279389, "epoch": 3366} {"train_loss": -24.967594146728516, "global_step": 279390, "epoch": 3366} {"train_loss": -25.35727310180664, "global_step": 279391, "epoch": 3366} {"train_loss": -25.3642635345459, "global_step": 279392, "epoch": 3366} {"train_loss": -25.236928939819336, "global_step": 279393, "epoch": 3366} {"train_loss": -25.44800567626953, "global_step": 279394, "epoch": 3366} {"train_loss": -25.139057159423828, "global_step": 279395, "epoch": 3366} {"train_loss": -25.508922576904297, "global_step": 279396, "epoch": 3366} {"train_loss": -25.351402282714844, "global_step": 279397, "epoch": 3366} {"train_loss": -25.362104415893555, "global_step": 279398, "epoch": 3366} {"train_loss": -25.46942710876465, "global_step": 279399, "epoch": 3366} {"train_loss": -25.26308250427246, "global_step": 279400, "epoch": 3366} {"train_loss": -25.322040557861328, "global_step": 279401, "epoch": 3366} {"train_loss": -24.955251693725586, "global_step": 279402, "epoch": 3366} {"train_loss": -25.412525177001953, "global_step": 279403, "epoch": 3366} {"train_loss": -25.35597801208496, "global_step": 279404, "epoch": 3366} {"train_loss": -25.799772262573242, "global_step": 279405, "epoch": 3366} {"train_loss": -25.295482635498047, "global_step": 279406, "epoch": 3366} {"train_loss": -25.33190155029297, "global_step": 279407, "epoch": 3366} {"train_loss": -25.46345329284668, "global_step": 279408, "epoch": 3366} {"train_loss": -25.324766159057617, "global_step": 279409, "epoch": 3366} {"train_loss": -25.37701416015625, "global_step": 279410, "epoch": 3366} {"train_loss": -25.5488338470459, "global_step": 279411, "epoch": 3366} {"train_loss": -25.31653594970703, "global_step": 279412, "epoch": 3366} {"train_loss": -25.237207412719727, "global_step": 279413, "epoch": 3366} {"train_loss": -25.29268455505371, "global_step": 279414, "epoch": 3366} {"train_loss": -25.283660888671875, "global_step": 279415, "epoch": 3366} {"train_loss": -25.618743896484375, "global_step": 279416, "epoch": 3366} {"train_loss": -25.2564697265625, "global_step": 279417, "epoch": 3366} {"train_loss": -25.444746017456055, "global_step": 279418, "epoch": 3366} {"train_loss": -24.873035430908203, "global_step": 279419, "epoch": 3366} {"train_loss": -25.486526489257812, "global_step": 279420, "epoch": 3366} {"train_loss": -25.405597686767578, "global_step": 279421, "epoch": 3366} {"train_loss": -25.411088943481445, "global_step": 279422, "epoch": 3366} {"train_loss": -25.22669792175293, "global_step": 279423, "epoch": 3366} {"train_loss": -25.44867515563965, "global_step": 279424, "epoch": 3366} {"train_loss": -25.25092124938965, "global_step": 279425, "epoch": 3366} {"train_loss": -25.286108016967773, "global_step": 279426, "epoch": 3366} {"train_loss": -25.55967140197754, "global_step": 279427, "epoch": 3366} {"train_loss": -25.512725830078125, "global_step": 279428, "epoch": 3366} {"train_loss": -25.583097457885742, "global_step": 279429, "epoch": 3366} {"train_loss": -25.49781608581543, "global_step": 279430, "epoch": 3366} {"train_loss": -25.134172439575195, "global_step": 279431, "epoch": 3366} {"train_loss": -25.48628807067871, "global_step": 279432, "epoch": 3366} {"train_loss": -25.304412841796875, "global_step": 279433, "epoch": 3366} {"train_loss": -25.576833724975586, "global_step": 279434, "epoch": 3366} {"train_loss": -25.44378662109375, "global_step": 279435, "epoch": 3366} {"train_loss": -25.540267944335938, "global_step": 279436, "epoch": 3366} {"train_loss": -25.439239501953125, "global_step": 279437, "epoch": 3366} {"train_loss": -25.514841079711914, "global_step": 279438, "epoch": 3366} {"train_loss": -25.469730377197266, "global_step": 279439, "epoch": 3366} {"train_loss": -25.550853729248047, "global_step": 279440, "epoch": 3366} {"train_loss": -25.481708526611328, "global_step": 279441, "epoch": 3366} {"train_loss": -25.2863826751709, "global_step": 279442, "epoch": 3366} {"train_loss": -25.658802032470703, "global_step": 279443, "epoch": 3366} {"train_loss": -25.486621856689453, "global_step": 279444, "epoch": 3366} {"train_loss": -25.46735954284668, "global_step": 279445, "epoch": 3366} {"train_loss": -25.98322105407715, "global_step": 279446, "epoch": 3366} {"train_loss": -25.811471939086914, "global_step": 279447, "epoch": 3366} {"train_loss": -25.470844268798828, "global_step": 279448, "epoch": 3366} {"train_loss": -25.61078453063965, "global_step": 279449, "epoch": 3366} {"train_loss": -25.269962310791016, "global_step": 279450, "epoch": 3366} {"train_loss": -25.535558700561523, "global_step": 279451, "epoch": 3366} {"train_loss": -25.245019912719727, "global_step": 279452, "epoch": 3366} {"train_loss": -25.27747917175293, "global_step": 279453, "epoch": 3366} {"train_loss": -25.3105525970459, "global_step": 279454, "epoch": 3366} {"train_loss": -25.77495765686035, "global_step": 279455, "epoch": 3366} {"train_loss": -25.022830963134766, "global_step": 279456, "epoch": 3366} {"train_loss": -25.51097869873047, "global_step": 279457, "epoch": 3366} {"train_loss": -25.749303817749023, "global_step": 279458, "epoch": 3366} {"train_loss": -25.471006393432617, "global_step": 279459, "epoch": 3366} {"train_loss": -25.377369800245905, "global_step": 279460, "epoch": 3366, "val_loss": 7009070.0} {"train_loss": -25.371198654174805, "global_step": 279461, "epoch": 3367} {"train_loss": -25.299827575683594, "global_step": 279462, "epoch": 3367} {"train_loss": -25.3142147064209, "global_step": 279463, "epoch": 3367} {"train_loss": -25.224828720092773, "global_step": 279464, "epoch": 3367} {"train_loss": -25.205411911010742, "global_step": 279465, "epoch": 3367} {"train_loss": -25.50990104675293, "global_step": 279466, "epoch": 3367} {"train_loss": -25.295866012573242, "global_step": 279467, "epoch": 3367} {"train_loss": -25.06588363647461, "global_step": 279468, "epoch": 3367} {"train_loss": -24.987110137939453, "global_step": 279469, "epoch": 3367} {"train_loss": -25.34333610534668, "global_step": 279470, "epoch": 3367} {"train_loss": -24.919849395751953, "global_step": 279471, "epoch": 3367} {"train_loss": -25.129301071166992, "global_step": 279472, "epoch": 3367} {"train_loss": -25.55253028869629, "global_step": 279473, "epoch": 3367} {"train_loss": -25.264179229736328, "global_step": 279474, "epoch": 3367} {"train_loss": -25.483362197875977, "global_step": 279475, "epoch": 3367} {"train_loss": -25.5905704498291, "global_step": 279476, "epoch": 3367} {"train_loss": -25.34933853149414, "global_step": 279477, "epoch": 3367} {"train_loss": -25.37393569946289, "global_step": 279478, "epoch": 3367} {"train_loss": -25.184383392333984, "global_step": 279479, "epoch": 3367} {"train_loss": -25.281782150268555, "global_step": 279480, "epoch": 3367} {"train_loss": -25.282041549682617, "global_step": 279481, "epoch": 3367} {"train_loss": -25.57999038696289, "global_step": 279482, "epoch": 3367} {"train_loss": -25.480426788330078, "global_step": 279483, "epoch": 3367} {"train_loss": -25.53813934326172, "global_step": 279484, "epoch": 3367} {"train_loss": -25.41626739501953, "global_step": 279485, "epoch": 3367} {"train_loss": -25.189420700073242, "global_step": 279486, "epoch": 3367} {"train_loss": -25.7783145904541, "global_step": 279487, "epoch": 3367} {"train_loss": -25.178342819213867, "global_step": 279488, "epoch": 3367} {"train_loss": -25.451377868652344, "global_step": 279489, "epoch": 3367} {"train_loss": -25.24500846862793, "global_step": 279490, "epoch": 3367} {"train_loss": -25.440210342407227, "global_step": 279491, "epoch": 3367} {"train_loss": -25.290058135986328, "global_step": 279492, "epoch": 3367} {"train_loss": -25.45857810974121, "global_step": 279493, "epoch": 3367} {"train_loss": -25.54900360107422, "global_step": 279494, "epoch": 3367} {"train_loss": -25.176130294799805, "global_step": 279495, "epoch": 3367} {"train_loss": -25.49444007873535, "global_step": 279496, "epoch": 3367} {"train_loss": -25.37131118774414, "global_step": 279497, "epoch": 3367} {"train_loss": -25.239322662353516, "global_step": 279498, "epoch": 3367} {"train_loss": -25.64029312133789, "global_step": 279499, "epoch": 3367} {"train_loss": -25.268400192260742, "global_step": 279500, "epoch": 3367} {"train_loss": -25.459909439086914, "global_step": 279501, "epoch": 3367} {"train_loss": -25.582523345947266, "global_step": 279502, "epoch": 3367} {"train_loss": -25.72564697265625, "global_step": 279503, "epoch": 3367} {"train_loss": -25.64548683166504, "global_step": 279504, "epoch": 3367} {"train_loss": -25.555557250976562, "global_step": 279505, "epoch": 3367} {"train_loss": -25.7873477935791, "global_step": 279506, "epoch": 3367} {"train_loss": -25.631778717041016, "global_step": 279507, "epoch": 3367} {"train_loss": -25.8354434967041, "global_step": 279508, "epoch": 3367} {"train_loss": -25.494821548461914, "global_step": 279509, "epoch": 3367} {"train_loss": -25.654035568237305, "global_step": 279510, "epoch": 3367} {"train_loss": -25.63802146911621, "global_step": 279511, "epoch": 3367} {"train_loss": -25.48370361328125, "global_step": 279512, "epoch": 3367} {"train_loss": -25.56682777404785, "global_step": 279513, "epoch": 3367} {"train_loss": -25.4844970703125, "global_step": 279514, "epoch": 3367} {"train_loss": -25.20884132385254, "global_step": 279515, "epoch": 3367} {"train_loss": -25.561002731323242, "global_step": 279516, "epoch": 3367} {"train_loss": -25.401103973388672, "global_step": 279517, "epoch": 3367} {"train_loss": -25.337230682373047, "global_step": 279518, "epoch": 3367} {"train_loss": -25.47669219970703, "global_step": 279519, "epoch": 3367} {"train_loss": -25.118690490722656, "global_step": 279520, "epoch": 3367} {"train_loss": -24.893539428710938, "global_step": 279521, "epoch": 3367} {"train_loss": -25.417016983032227, "global_step": 279522, "epoch": 3367} {"train_loss": -25.494728088378906, "global_step": 279523, "epoch": 3367} {"train_loss": -25.026958465576172, "global_step": 279524, "epoch": 3367} {"train_loss": -25.16707420349121, "global_step": 279525, "epoch": 3367} {"train_loss": -25.007835388183594, "global_step": 279526, "epoch": 3367} {"train_loss": -25.201736450195312, "global_step": 279527, "epoch": 3367} {"train_loss": -24.55927848815918, "global_step": 279528, "epoch": 3367} {"train_loss": -25.17203712463379, "global_step": 279529, "epoch": 3367} {"train_loss": -25.074209213256836, "global_step": 279530, "epoch": 3367} {"train_loss": -24.875431060791016, "global_step": 279531, "epoch": 3367} {"train_loss": -24.984119415283203, "global_step": 279532, "epoch": 3367} {"train_loss": -25.345172882080078, "global_step": 279533, "epoch": 3367} {"train_loss": -24.617294311523438, "global_step": 279534, "epoch": 3367} {"train_loss": -24.98385238647461, "global_step": 279535, "epoch": 3367} {"train_loss": -25.446863174438477, "global_step": 279536, "epoch": 3367} {"train_loss": -25.218351364135742, "global_step": 279537, "epoch": 3367} {"train_loss": -25.061885833740234, "global_step": 279538, "epoch": 3367} {"train_loss": -25.207141876220703, "global_step": 279539, "epoch": 3367} {"train_loss": -25.189149856567383, "global_step": 279540, "epoch": 3367} {"train_loss": -25.30531883239746, "global_step": 279541, "epoch": 3367} {"train_loss": -25.188121795654297, "global_step": 279542, "epoch": 3367} {"train_loss": -25.32753659443683, "global_step": 279543, "epoch": 3367, "val_loss": 7044536.0} {"train_loss": -24.898542404174805, "global_step": 279544, "epoch": 3368} {"train_loss": -25.150949478149414, "global_step": 279545, "epoch": 3368} {"train_loss": -24.99867820739746, "global_step": 279546, "epoch": 3368} {"train_loss": -25.10434341430664, "global_step": 279547, "epoch": 3368} {"train_loss": -24.677032470703125, "global_step": 279548, "epoch": 3368} {"train_loss": -25.03160858154297, "global_step": 279549, "epoch": 3368} {"train_loss": -25.040485382080078, "global_step": 279550, "epoch": 3368} {"train_loss": -25.378812789916992, "global_step": 279551, "epoch": 3368} {"train_loss": -24.835098266601562, "global_step": 279552, "epoch": 3368} {"train_loss": -25.492578506469727, "global_step": 279553, "epoch": 3368} {"train_loss": -25.222959518432617, "global_step": 279554, "epoch": 3368} {"train_loss": -24.911787033081055, "global_step": 279555, "epoch": 3368} {"train_loss": -25.244224548339844, "global_step": 279556, "epoch": 3368} {"train_loss": -25.261899948120117, "global_step": 279557, "epoch": 3368} {"train_loss": -25.316429138183594, "global_step": 279558, "epoch": 3368} {"train_loss": -25.656909942626953, "global_step": 279559, "epoch": 3368} {"train_loss": -25.264270782470703, "global_step": 279560, "epoch": 3368} {"train_loss": -25.360898971557617, "global_step": 279561, "epoch": 3368} {"train_loss": -25.771772384643555, "global_step": 279562, "epoch": 3368} {"train_loss": -25.310958862304688, "global_step": 279563, "epoch": 3368} {"train_loss": -25.37683868408203, "global_step": 279564, "epoch": 3368} {"train_loss": -25.244037628173828, "global_step": 279565, "epoch": 3368} {"train_loss": -25.166547775268555, "global_step": 279566, "epoch": 3368} {"train_loss": -25.467670440673828, "global_step": 279567, "epoch": 3368} {"train_loss": -25.292001724243164, "global_step": 279568, "epoch": 3368} {"train_loss": -25.64957618713379, "global_step": 279569, "epoch": 3368} {"train_loss": -25.455289840698242, "global_step": 279570, "epoch": 3368} {"train_loss": -25.488859176635742, "global_step": 279571, "epoch": 3368} {"train_loss": -25.49622917175293, "global_step": 279572, "epoch": 3368} {"train_loss": -25.430814743041992, "global_step": 279573, "epoch": 3368} {"train_loss": -25.24153709411621, "global_step": 279574, "epoch": 3368} {"train_loss": -25.036447525024414, "global_step": 279575, "epoch": 3368} {"train_loss": -25.330158233642578, "global_step": 279576, "epoch": 3368} {"train_loss": -25.358169555664062, "global_step": 279577, "epoch": 3368} {"train_loss": -25.571012496948242, "global_step": 279578, "epoch": 3368} {"train_loss": -25.6588191986084, "global_step": 279579, "epoch": 3368} {"train_loss": -25.794422149658203, "global_step": 279580, "epoch": 3368} {"train_loss": -25.6780948638916, "global_step": 279581, "epoch": 3368} {"train_loss": -25.321083068847656, "global_step": 279582, "epoch": 3368} {"train_loss": -25.231399536132812, "global_step": 279583, "epoch": 3368} {"train_loss": -25.307615280151367, "global_step": 279584, "epoch": 3368} {"train_loss": -25.530893325805664, "global_step": 279585, "epoch": 3368} {"train_loss": -25.325387954711914, "global_step": 279586, "epoch": 3368} {"train_loss": -25.314970016479492, "global_step": 279587, "epoch": 3368} {"train_loss": -25.36634635925293, "global_step": 279588, "epoch": 3368} {"train_loss": -25.34455680847168, "global_step": 279589, "epoch": 3368} {"train_loss": -25.688190460205078, "global_step": 279590, "epoch": 3368} {"train_loss": -25.392982482910156, "global_step": 279591, "epoch": 3368} {"train_loss": -25.73076820373535, "global_step": 279592, "epoch": 3368} {"train_loss": -25.012136459350586, "global_step": 279593, "epoch": 3368} {"train_loss": -25.734106063842773, "global_step": 279594, "epoch": 3368} {"train_loss": -25.286178588867188, "global_step": 279595, "epoch": 3368} {"train_loss": -25.06032371520996, "global_step": 279596, "epoch": 3368} {"train_loss": -25.296430587768555, "global_step": 279597, "epoch": 3368} {"train_loss": -25.60468864440918, "global_step": 279598, "epoch": 3368} {"train_loss": -25.2263240814209, "global_step": 279599, "epoch": 3368} {"train_loss": -25.43899917602539, "global_step": 279600, "epoch": 3368} {"train_loss": -25.23973846435547, "global_step": 279601, "epoch": 3368} {"train_loss": -25.52565574645996, "global_step": 279602, "epoch": 3368} {"train_loss": -25.1900634765625, "global_step": 279603, "epoch": 3368} {"train_loss": -25.645238876342773, "global_step": 279604, "epoch": 3368} {"train_loss": -25.49182891845703, "global_step": 279605, "epoch": 3368} {"train_loss": -25.350481033325195, "global_step": 279606, "epoch": 3368} {"train_loss": -25.640256881713867, "global_step": 279607, "epoch": 3368} {"train_loss": -25.352344512939453, "global_step": 279608, "epoch": 3368} {"train_loss": -25.28883934020996, "global_step": 279609, "epoch": 3368} {"train_loss": -25.357404708862305, "global_step": 279610, "epoch": 3368} {"train_loss": -25.09758186340332, "global_step": 279611, "epoch": 3368} {"train_loss": -25.621917724609375, "global_step": 279612, "epoch": 3368} {"train_loss": -25.647024154663086, "global_step": 279613, "epoch": 3368} {"train_loss": -25.396013259887695, "global_step": 279614, "epoch": 3368} {"train_loss": -25.293485641479492, "global_step": 279615, "epoch": 3368} {"train_loss": -24.789358139038086, "global_step": 279616, "epoch": 3368} {"train_loss": -25.04694175720215, "global_step": 279617, "epoch": 3368} {"train_loss": -25.319257736206055, "global_step": 279618, "epoch": 3368} {"train_loss": -24.819467544555664, "global_step": 279619, "epoch": 3368} {"train_loss": -25.810043334960938, "global_step": 279620, "epoch": 3368} {"train_loss": -25.36652374267578, "global_step": 279621, "epoch": 3368} {"train_loss": -25.37397575378418, "global_step": 279622, "epoch": 3368} {"train_loss": -25.67066764831543, "global_step": 279623, "epoch": 3368} {"train_loss": -25.478809356689453, "global_step": 279624, "epoch": 3368} {"train_loss": -25.314496994018555, "global_step": 279625, "epoch": 3368} {"train_loss": -25.3456194544413, "global_step": 279626, "epoch": 3368, "val_loss": 7097557.0} {"train_loss": -25.500858306884766, "global_step": 279627, "epoch": 3369} {"train_loss": -25.40449333190918, "global_step": 279628, "epoch": 3369} {"train_loss": -25.298532485961914, "global_step": 279629, "epoch": 3369} {"train_loss": -25.31943130493164, "global_step": 279630, "epoch": 3369} {"train_loss": -25.636138916015625, "global_step": 279631, "epoch": 3369} {"train_loss": -25.172773361206055, "global_step": 279632, "epoch": 3369} {"train_loss": -25.479705810546875, "global_step": 279633, "epoch": 3369} {"train_loss": -25.157718658447266, "global_step": 279634, "epoch": 3369} {"train_loss": -25.0771541595459, "global_step": 279635, "epoch": 3369} {"train_loss": -25.395938873291016, "global_step": 279636, "epoch": 3369} {"train_loss": -25.474321365356445, "global_step": 279637, "epoch": 3369} {"train_loss": -25.087963104248047, "global_step": 279638, "epoch": 3369} {"train_loss": -25.38453483581543, "global_step": 279639, "epoch": 3369} {"train_loss": -25.219318389892578, "global_step": 279640, "epoch": 3369} {"train_loss": -24.79338836669922, "global_step": 279641, "epoch": 3369} {"train_loss": -25.3165283203125, "global_step": 279642, "epoch": 3369} {"train_loss": -24.99934196472168, "global_step": 279643, "epoch": 3369} {"train_loss": -25.35548973083496, "global_step": 279644, "epoch": 3369} {"train_loss": -25.202680587768555, "global_step": 279645, "epoch": 3369} {"train_loss": -25.636152267456055, "global_step": 279646, "epoch": 3369} {"train_loss": -25.385318756103516, "global_step": 279647, "epoch": 3369} {"train_loss": -25.116422653198242, "global_step": 279648, "epoch": 3369} {"train_loss": -25.477338790893555, "global_step": 279649, "epoch": 3369} {"train_loss": -24.928014755249023, "global_step": 279650, "epoch": 3369} {"train_loss": -25.269254684448242, "global_step": 279651, "epoch": 3369} {"train_loss": -25.236093521118164, "global_step": 279652, "epoch": 3369} {"train_loss": -25.229116439819336, "global_step": 279653, "epoch": 3369} {"train_loss": -25.25330924987793, "global_step": 279654, "epoch": 3369} {"train_loss": -25.504987716674805, "global_step": 279655, "epoch": 3369} {"train_loss": -25.72463035583496, "global_step": 279656, "epoch": 3369} {"train_loss": -25.25821876525879, "global_step": 279657, "epoch": 3369} {"train_loss": -25.2880802154541, "global_step": 279658, "epoch": 3369} {"train_loss": -25.380647659301758, "global_step": 279659, "epoch": 3369} {"train_loss": -25.63960075378418, "global_step": 279660, "epoch": 3369} {"train_loss": -25.865116119384766, "global_step": 279661, "epoch": 3369} {"train_loss": -25.244665145874023, "global_step": 279662, "epoch": 3369} {"train_loss": -25.620849609375, "global_step": 279663, "epoch": 3369} {"train_loss": -25.442556381225586, "global_step": 279664, "epoch": 3369} {"train_loss": -25.192594528198242, "global_step": 279665, "epoch": 3369} {"train_loss": -25.5051212310791, "global_step": 279666, "epoch": 3369} {"train_loss": -25.096572875976562, "global_step": 279667, "epoch": 3369} {"train_loss": -25.5063419342041, "global_step": 279668, "epoch": 3369} {"train_loss": -25.68775749206543, "global_step": 279669, "epoch": 3369} {"train_loss": -25.8240909576416, "global_step": 279670, "epoch": 3369} {"train_loss": -25.34221649169922, "global_step": 279671, "epoch": 3369} {"train_loss": -25.572830200195312, "global_step": 279672, "epoch": 3369} {"train_loss": -25.746112823486328, "global_step": 279673, "epoch": 3369} {"train_loss": -25.350400924682617, "global_step": 279674, "epoch": 3369} {"train_loss": -25.6975040435791, "global_step": 279675, "epoch": 3369} {"train_loss": -25.531957626342773, "global_step": 279676, "epoch": 3369} {"train_loss": -25.309452056884766, "global_step": 279677, "epoch": 3369} {"train_loss": -25.68361473083496, "global_step": 279678, "epoch": 3369} {"train_loss": -25.870452880859375, "global_step": 279679, "epoch": 3369} {"train_loss": -25.40269660949707, "global_step": 279680, "epoch": 3369} {"train_loss": -25.459325790405273, "global_step": 279681, "epoch": 3369} {"train_loss": -24.98569107055664, "global_step": 279682, "epoch": 3369} {"train_loss": -25.48590087890625, "global_step": 279683, "epoch": 3369} {"train_loss": -25.3753719329834, "global_step": 279684, "epoch": 3369} {"train_loss": -25.292993545532227, "global_step": 279685, "epoch": 3369} {"train_loss": -25.049951553344727, "global_step": 279686, "epoch": 3369} {"train_loss": -25.60910987854004, "global_step": 279687, "epoch": 3369} {"train_loss": -25.156667709350586, "global_step": 279688, "epoch": 3369} {"train_loss": -25.285886764526367, "global_step": 279689, "epoch": 3369} {"train_loss": -25.461332321166992, "global_step": 279690, "epoch": 3369} {"train_loss": -25.2735652923584, "global_step": 279691, "epoch": 3369} {"train_loss": -25.440900802612305, "global_step": 279692, "epoch": 3369} {"train_loss": -25.63612174987793, "global_step": 279693, "epoch": 3369} {"train_loss": -25.746356964111328, "global_step": 279694, "epoch": 3369} {"train_loss": -25.602970123291016, "global_step": 279695, "epoch": 3369} {"train_loss": -25.549274444580078, "global_step": 279696, "epoch": 3369} {"train_loss": -25.85528564453125, "global_step": 279697, "epoch": 3369} {"train_loss": -25.413122177124023, "global_step": 279698, "epoch": 3369} {"train_loss": -25.34067726135254, "global_step": 279699, "epoch": 3369} {"train_loss": -25.317564010620117, "global_step": 279700, "epoch": 3369} {"train_loss": -25.871234893798828, "global_step": 279701, "epoch": 3369} {"train_loss": -25.85114097595215, "global_step": 279702, "epoch": 3369} {"train_loss": -25.267614364624023, "global_step": 279703, "epoch": 3369} {"train_loss": -25.524208068847656, "global_step": 279704, "epoch": 3369} {"train_loss": -25.380844116210938, "global_step": 279705, "epoch": 3369} {"train_loss": -25.36343765258789, "global_step": 279706, "epoch": 3369} {"train_loss": -25.025131225585938, "global_step": 279707, "epoch": 3369} {"train_loss": -25.436405181884766, "global_step": 279708, "epoch": 3369} {"train_loss": -25.398345602564063, "global_step": 279709, "epoch": 3369, "val_loss": 7015810.0} {"train_loss": -24.569692611694336, "global_step": 279710, "epoch": 3370} {"train_loss": -24.64653968811035, "global_step": 279711, "epoch": 3370} {"train_loss": -24.830224990844727, "global_step": 279712, "epoch": 3370} {"train_loss": -25.126020431518555, "global_step": 279713, "epoch": 3370} {"train_loss": -25.185293197631836, "global_step": 279714, "epoch": 3370} {"train_loss": -25.20917320251465, "global_step": 279715, "epoch": 3370} {"train_loss": -24.980051040649414, "global_step": 279716, "epoch": 3370} {"train_loss": -24.696781158447266, "global_step": 279717, "epoch": 3370} {"train_loss": -25.3905086517334, "global_step": 279718, "epoch": 3370} {"train_loss": -24.9029483795166, "global_step": 279719, "epoch": 3370} {"train_loss": -25.28519630432129, "global_step": 279720, "epoch": 3370} {"train_loss": -24.976110458374023, "global_step": 279721, "epoch": 3370} {"train_loss": -25.354482650756836, "global_step": 279722, "epoch": 3370} {"train_loss": -24.932132720947266, "global_step": 279723, "epoch": 3370} {"train_loss": -24.924936294555664, "global_step": 279724, "epoch": 3370} {"train_loss": -25.0306453704834, "global_step": 279725, "epoch": 3370} {"train_loss": -25.21284294128418, "global_step": 279726, "epoch": 3370} {"train_loss": -25.20058250427246, "global_step": 279727, "epoch": 3370} {"train_loss": -25.282760620117188, "global_step": 279728, "epoch": 3370} {"train_loss": -25.305831909179688, "global_step": 279729, "epoch": 3370} {"train_loss": -25.025436401367188, "global_step": 279730, "epoch": 3370} {"train_loss": -25.02203369140625, "global_step": 279731, "epoch": 3370} {"train_loss": -25.036670684814453, "global_step": 279732, "epoch": 3370} {"train_loss": -25.535795211791992, "global_step": 279733, "epoch": 3370} {"train_loss": -25.503747940063477, "global_step": 279734, "epoch": 3370} {"train_loss": -25.57693862915039, "global_step": 279735, "epoch": 3370} {"train_loss": -25.4348201751709, "global_step": 279736, "epoch": 3370} {"train_loss": -25.14838218688965, "global_step": 279737, "epoch": 3370} {"train_loss": -25.277708053588867, "global_step": 279738, "epoch": 3370} {"train_loss": -25.295698165893555, "global_step": 279739, "epoch": 3370} {"train_loss": -25.442005157470703, "global_step": 279740, "epoch": 3370} {"train_loss": -25.3211612701416, "global_step": 279741, "epoch": 3370} {"train_loss": -25.112306594848633, "global_step": 279742, "epoch": 3370} {"train_loss": -25.610700607299805, "global_step": 279743, "epoch": 3370} {"train_loss": -25.34429359436035, "global_step": 279744, "epoch": 3370} {"train_loss": -25.60576820373535, "global_step": 279745, "epoch": 3370} {"train_loss": -25.352827072143555, "global_step": 279746, "epoch": 3370} {"train_loss": -25.29522132873535, "global_step": 279747, "epoch": 3370} {"train_loss": -25.516088485717773, "global_step": 279748, "epoch": 3370} {"train_loss": -25.53101921081543, "global_step": 279749, "epoch": 3370} {"train_loss": -25.48784828186035, "global_step": 279750, "epoch": 3370} {"train_loss": -25.013090133666992, "global_step": 279751, "epoch": 3370} {"train_loss": -25.268335342407227, "global_step": 279752, "epoch": 3370} {"train_loss": -25.443315505981445, "global_step": 279753, "epoch": 3370} {"train_loss": -25.062959671020508, "global_step": 279754, "epoch": 3370} {"train_loss": -24.922956466674805, "global_step": 279755, "epoch": 3370} {"train_loss": -25.568708419799805, "global_step": 279756, "epoch": 3370} {"train_loss": -25.15924644470215, "global_step": 279757, "epoch": 3370} {"train_loss": -25.239011764526367, "global_step": 279758, "epoch": 3370} {"train_loss": -25.4355411529541, "global_step": 279759, "epoch": 3370} {"train_loss": -25.134273529052734, "global_step": 279760, "epoch": 3370} {"train_loss": -25.4939022064209, "global_step": 279761, "epoch": 3370} {"train_loss": -25.15920066833496, "global_step": 279762, "epoch": 3370} {"train_loss": -25.441675186157227, "global_step": 279763, "epoch": 3370} {"train_loss": -25.351709365844727, "global_step": 279764, "epoch": 3370} {"train_loss": -25.517507553100586, "global_step": 279765, "epoch": 3370} {"train_loss": -24.836515426635742, "global_step": 279766, "epoch": 3370} {"train_loss": -25.570890426635742, "global_step": 279767, "epoch": 3370} {"train_loss": -25.229496002197266, "global_step": 279768, "epoch": 3370} {"train_loss": -25.50639533996582, "global_step": 279769, "epoch": 3370} {"train_loss": -25.838769912719727, "global_step": 279770, "epoch": 3370} {"train_loss": -25.469541549682617, "global_step": 279771, "epoch": 3370} {"train_loss": -25.47093391418457, "global_step": 279772, "epoch": 3370} {"train_loss": -25.615406036376953, "global_step": 279773, "epoch": 3370} {"train_loss": -25.25142478942871, "global_step": 279774, "epoch": 3370} {"train_loss": -25.459470748901367, "global_step": 279775, "epoch": 3370} {"train_loss": -25.408666610717773, "global_step": 279776, "epoch": 3370} {"train_loss": -25.228769302368164, "global_step": 279777, "epoch": 3370} {"train_loss": -25.546630859375, "global_step": 279778, "epoch": 3370} {"train_loss": -25.216054916381836, "global_step": 279779, "epoch": 3370} {"train_loss": -25.320804595947266, "global_step": 279780, "epoch": 3370} {"train_loss": -25.365934371948242, "global_step": 279781, "epoch": 3370} {"train_loss": -25.600950241088867, "global_step": 279782, "epoch": 3370} {"train_loss": -25.18238639831543, "global_step": 279783, "epoch": 3370} {"train_loss": -25.317852020263672, "global_step": 279784, "epoch": 3370} {"train_loss": -25.583547592163086, "global_step": 279785, "epoch": 3370} {"train_loss": -25.494903564453125, "global_step": 279786, "epoch": 3370} {"train_loss": -25.793848037719727, "global_step": 279787, "epoch": 3370} {"train_loss": -25.341426849365234, "global_step": 279788, "epoch": 3370} {"train_loss": -25.931676864624023, "global_step": 279789, "epoch": 3370} {"train_loss": -25.726591110229492, "global_step": 279790, "epoch": 3370} {"train_loss": -25.794300079345703, "global_step": 279791, "epoch": 3370} {"train_loss": -25.293225024119916, "global_step": 279792, "epoch": 3370, "val_loss": 7008138.0} {"train_loss": -24.78010368347168, "global_step": 279793, "epoch": 3371} {"train_loss": -25.086496353149414, "global_step": 279794, "epoch": 3371} {"train_loss": -25.08329200744629, "global_step": 279795, "epoch": 3371} {"train_loss": -25.316404342651367, "global_step": 279796, "epoch": 3371} {"train_loss": -25.322370529174805, "global_step": 279797, "epoch": 3371} {"train_loss": -24.859285354614258, "global_step": 279798, "epoch": 3371} {"train_loss": -24.956466674804688, "global_step": 279799, "epoch": 3371} {"train_loss": -24.895729064941406, "global_step": 279800, "epoch": 3371} {"train_loss": -24.666641235351562, "global_step": 279801, "epoch": 3371} {"train_loss": -24.918628692626953, "global_step": 279802, "epoch": 3371} {"train_loss": -25.592411041259766, "global_step": 279803, "epoch": 3371} {"train_loss": -25.243188858032227, "global_step": 279804, "epoch": 3371} {"train_loss": -25.307815551757812, "global_step": 279805, "epoch": 3371} {"train_loss": -25.297754287719727, "global_step": 279806, "epoch": 3371} {"train_loss": -24.937278747558594, "global_step": 279807, "epoch": 3371} {"train_loss": -25.079370498657227, "global_step": 279808, "epoch": 3371} {"train_loss": -25.393796920776367, "global_step": 279809, "epoch": 3371} {"train_loss": -25.216678619384766, "global_step": 279810, "epoch": 3371} {"train_loss": -25.489965438842773, "global_step": 279811, "epoch": 3371} {"train_loss": -24.992450714111328, "global_step": 279812, "epoch": 3371} {"train_loss": -25.29017448425293, "global_step": 279813, "epoch": 3371} {"train_loss": -25.318044662475586, "global_step": 279814, "epoch": 3371} {"train_loss": -25.779987335205078, "global_step": 279815, "epoch": 3371} {"train_loss": -25.011783599853516, "global_step": 279816, "epoch": 3371} {"train_loss": -25.32039451599121, "global_step": 279817, "epoch": 3371} {"train_loss": -24.923139572143555, "global_step": 279818, "epoch": 3371} {"train_loss": -25.41565704345703, "global_step": 279819, "epoch": 3371} {"train_loss": -25.3093318939209, "global_step": 279820, "epoch": 3371} {"train_loss": -25.411239624023438, "global_step": 279821, "epoch": 3371} {"train_loss": -25.8542537689209, "global_step": 279822, "epoch": 3371} {"train_loss": -25.39749526977539, "global_step": 279823, "epoch": 3371} {"train_loss": -25.3465518951416, "global_step": 279824, "epoch": 3371} {"train_loss": -25.15574073791504, "global_step": 279825, "epoch": 3371} {"train_loss": -25.742666244506836, "global_step": 279826, "epoch": 3371} {"train_loss": -25.519620895385742, "global_step": 279827, "epoch": 3371} {"train_loss": -25.3859920501709, "global_step": 279828, "epoch": 3371} {"train_loss": -25.57936668395996, "global_step": 279829, "epoch": 3371} {"train_loss": -25.399274826049805, "global_step": 279830, "epoch": 3371} {"train_loss": -25.2137508392334, "global_step": 279831, "epoch": 3371} {"train_loss": -25.337757110595703, "global_step": 279832, "epoch": 3371} {"train_loss": -25.696701049804688, "global_step": 279833, "epoch": 3371} {"train_loss": -25.315977096557617, "global_step": 279834, "epoch": 3371} {"train_loss": -25.002843856811523, "global_step": 279835, "epoch": 3371} {"train_loss": -25.09109878540039, "global_step": 279836, "epoch": 3371} {"train_loss": -25.30766487121582, "global_step": 279837, "epoch": 3371} {"train_loss": -25.046045303344727, "global_step": 279838, "epoch": 3371} {"train_loss": -25.163618087768555, "global_step": 279839, "epoch": 3371} {"train_loss": -25.52919578552246, "global_step": 279840, "epoch": 3371} {"train_loss": -25.13287353515625, "global_step": 279841, "epoch": 3371} {"train_loss": -25.49481773376465, "global_step": 279842, "epoch": 3371} {"train_loss": -25.033010482788086, "global_step": 279843, "epoch": 3371} {"train_loss": -25.291269302368164, "global_step": 279844, "epoch": 3371} {"train_loss": -25.40924644470215, "global_step": 279845, "epoch": 3371} {"train_loss": -25.471256256103516, "global_step": 279846, "epoch": 3371} {"train_loss": -25.489307403564453, "global_step": 279847, "epoch": 3371} {"train_loss": -25.58683204650879, "global_step": 279848, "epoch": 3371} {"train_loss": -25.495548248291016, "global_step": 279849, "epoch": 3371} {"train_loss": -25.563989639282227, "global_step": 279850, "epoch": 3371} {"train_loss": -25.735931396484375, "global_step": 279851, "epoch": 3371} {"train_loss": -25.14667510986328, "global_step": 279852, "epoch": 3371} {"train_loss": -25.79286003112793, "global_step": 279853, "epoch": 3371} {"train_loss": -25.406248092651367, "global_step": 279854, "epoch": 3371} {"train_loss": -25.475378036499023, "global_step": 279855, "epoch": 3371} {"train_loss": -25.52056312561035, "global_step": 279856, "epoch": 3371} {"train_loss": -25.40424156188965, "global_step": 279857, "epoch": 3371} {"train_loss": -25.46310806274414, "global_step": 279858, "epoch": 3371} {"train_loss": -25.703094482421875, "global_step": 279859, "epoch": 3371} {"train_loss": -25.55984878540039, "global_step": 279860, "epoch": 3371} {"train_loss": -25.186458587646484, "global_step": 279861, "epoch": 3371} {"train_loss": -25.600479125976562, "global_step": 279862, "epoch": 3371} {"train_loss": -25.346555709838867, "global_step": 279863, "epoch": 3371} {"train_loss": -25.898767471313477, "global_step": 279864, "epoch": 3371} {"train_loss": -25.14070701599121, "global_step": 279865, "epoch": 3371} {"train_loss": -25.492511749267578, "global_step": 279866, "epoch": 3371} {"train_loss": -25.658536911010742, "global_step": 279867, "epoch": 3371} {"train_loss": -25.610183715820312, "global_step": 279868, "epoch": 3371} {"train_loss": -25.44757080078125, "global_step": 279869, "epoch": 3371} {"train_loss": -25.593393325805664, "global_step": 279870, "epoch": 3371} {"train_loss": -25.539953231811523, "global_step": 279871, "epoch": 3371} {"train_loss": -25.8425235748291, "global_step": 279872, "epoch": 3371} {"train_loss": -25.414514541625977, "global_step": 279873, "epoch": 3371} {"train_loss": -25.27910804748535, "global_step": 279874, "epoch": 3371} {"train_loss": -25.351483563342725, "global_step": 279875, "epoch": 3371, "val_loss": 7011794.0} {"train_loss": -24.195728302001953, "global_step": 279876, "epoch": 3372} {"train_loss": -22.493202209472656, "global_step": 279877, "epoch": 3372} {"train_loss": -22.442283630371094, "global_step": 279878, "epoch": 3372} {"train_loss": -23.202526092529297, "global_step": 279879, "epoch": 3372} {"train_loss": -24.89594841003418, "global_step": 279880, "epoch": 3372} {"train_loss": -23.93100929260254, "global_step": 279881, "epoch": 3372} {"train_loss": -23.835866928100586, "global_step": 279882, "epoch": 3372} {"train_loss": -24.265178680419922, "global_step": 279883, "epoch": 3372} {"train_loss": -24.174650192260742, "global_step": 279884, "epoch": 3372} {"train_loss": -24.11099624633789, "global_step": 279885, "epoch": 3372} {"train_loss": -24.99761962890625, "global_step": 279886, "epoch": 3372} {"train_loss": -24.43937110900879, "global_step": 279887, "epoch": 3372} {"train_loss": -24.37969970703125, "global_step": 279888, "epoch": 3372} {"train_loss": -24.404178619384766, "global_step": 279889, "epoch": 3372} {"train_loss": -24.312686920166016, "global_step": 279890, "epoch": 3372} {"train_loss": -24.530109405517578, "global_step": 279891, "epoch": 3372} {"train_loss": -24.699146270751953, "global_step": 279892, "epoch": 3372} {"train_loss": -24.78533363342285, "global_step": 279893, "epoch": 3372} {"train_loss": -25.2040958404541, "global_step": 279894, "epoch": 3372} {"train_loss": -24.79483985900879, "global_step": 279895, "epoch": 3372} {"train_loss": -24.440492630004883, "global_step": 279896, "epoch": 3372} {"train_loss": -24.85097885131836, "global_step": 279897, "epoch": 3372} {"train_loss": -24.91843605041504, "global_step": 279898, "epoch": 3372} {"train_loss": -25.011337280273438, "global_step": 279899, "epoch": 3372} {"train_loss": -24.880456924438477, "global_step": 279900, "epoch": 3372} {"train_loss": -25.46805763244629, "global_step": 279901, "epoch": 3372} {"train_loss": -25.13545036315918, "global_step": 279902, "epoch": 3372} {"train_loss": -25.0885066986084, "global_step": 279903, "epoch": 3372} {"train_loss": -25.499210357666016, "global_step": 279904, "epoch": 3372} {"train_loss": -25.1549015045166, "global_step": 279905, "epoch": 3372} {"train_loss": -25.231538772583008, "global_step": 279906, "epoch": 3372} {"train_loss": -24.99936294555664, "global_step": 279907, "epoch": 3372} {"train_loss": -25.418203353881836, "global_step": 279908, "epoch": 3372} {"train_loss": -25.281644821166992, "global_step": 279909, "epoch": 3372} {"train_loss": -25.490476608276367, "global_step": 279910, "epoch": 3372} {"train_loss": -25.815174102783203, "global_step": 279911, "epoch": 3372} {"train_loss": -25.5725154876709, "global_step": 279912, "epoch": 3372} {"train_loss": -25.38210678100586, "global_step": 279913, "epoch": 3372} {"train_loss": -25.273807525634766, "global_step": 279914, "epoch": 3372} {"train_loss": -25.12421989440918, "global_step": 279915, "epoch": 3372} {"train_loss": -24.822086334228516, "global_step": 279916, "epoch": 3372} {"train_loss": -24.98614501953125, "global_step": 279917, "epoch": 3372} {"train_loss": -25.17268180847168, "global_step": 279918, "epoch": 3372} {"train_loss": -25.677078247070312, "global_step": 279919, "epoch": 3372} {"train_loss": -25.52687644958496, "global_step": 279920, "epoch": 3372} {"train_loss": -25.425386428833008, "global_step": 279921, "epoch": 3372} {"train_loss": -25.7443790435791, "global_step": 279922, "epoch": 3372} {"train_loss": -25.129384994506836, "global_step": 279923, "epoch": 3372} {"train_loss": -25.302335739135742, "global_step": 279924, "epoch": 3372} {"train_loss": -25.487957000732422, "global_step": 279925, "epoch": 3372} {"train_loss": -25.31178855895996, "global_step": 279926, "epoch": 3372} {"train_loss": -25.415586471557617, "global_step": 279927, "epoch": 3372} {"train_loss": -25.24140739440918, "global_step": 279928, "epoch": 3372} {"train_loss": -25.0056095123291, "global_step": 279929, "epoch": 3372} {"train_loss": -24.982208251953125, "global_step": 279930, "epoch": 3372} {"train_loss": -25.339208602905273, "global_step": 279931, "epoch": 3372} {"train_loss": -25.21729850769043, "global_step": 279932, "epoch": 3372} {"train_loss": -25.18794822692871, "global_step": 279933, "epoch": 3372} {"train_loss": -25.451278686523438, "global_step": 279934, "epoch": 3372} {"train_loss": -24.999298095703125, "global_step": 279935, "epoch": 3372} {"train_loss": -25.27103042602539, "global_step": 279936, "epoch": 3372} {"train_loss": -25.537900924682617, "global_step": 279937, "epoch": 3372} {"train_loss": -25.610843658447266, "global_step": 279938, "epoch": 3372} {"train_loss": -25.40321159362793, "global_step": 279939, "epoch": 3372} {"train_loss": -25.2719783782959, "global_step": 279940, "epoch": 3372} {"train_loss": -25.02674674987793, "global_step": 279941, "epoch": 3372} {"train_loss": -25.259082794189453, "global_step": 279942, "epoch": 3372} {"train_loss": -25.221492767333984, "global_step": 279943, "epoch": 3372} {"train_loss": -25.32956886291504, "global_step": 279944, "epoch": 3372} {"train_loss": -25.59108543395996, "global_step": 279945, "epoch": 3372} {"train_loss": -24.759252548217773, "global_step": 279946, "epoch": 3372} {"train_loss": -25.36125373840332, "global_step": 279947, "epoch": 3372} {"train_loss": -25.55512046813965, "global_step": 279948, "epoch": 3372} {"train_loss": -24.77462387084961, "global_step": 279949, "epoch": 3372} {"train_loss": -25.231657028198242, "global_step": 279950, "epoch": 3372} {"train_loss": -25.31392478942871, "global_step": 279951, "epoch": 3372} {"train_loss": -25.21242332458496, "global_step": 279952, "epoch": 3372} {"train_loss": -25.51920509338379, "global_step": 279953, "epoch": 3372} {"train_loss": -25.466840744018555, "global_step": 279954, "epoch": 3372} {"train_loss": -25.470577239990234, "global_step": 279955, "epoch": 3372} {"train_loss": -25.480676651000977, "global_step": 279956, "epoch": 3372} {"train_loss": -25.49014663696289, "global_step": 279957, "epoch": 3372} {"train_loss": -25.00577804841191, "global_step": 279958, "epoch": 3372, "val_loss": 6986246.0} {"train_loss": -24.925439834594727, "global_step": 279959, "epoch": 3373} {"train_loss": -25.438779830932617, "global_step": 279960, "epoch": 3373} {"train_loss": -25.11282730102539, "global_step": 279961, "epoch": 3373} {"train_loss": -25.092859268188477, "global_step": 279962, "epoch": 3373} {"train_loss": -25.095163345336914, "global_step": 279963, "epoch": 3373} {"train_loss": -24.923547744750977, "global_step": 279964, "epoch": 3373} {"train_loss": -25.154163360595703, "global_step": 279965, "epoch": 3373} {"train_loss": -25.63362693786621, "global_step": 279966, "epoch": 3373} {"train_loss": -24.89674949645996, "global_step": 279967, "epoch": 3373} {"train_loss": -25.033767700195312, "global_step": 279968, "epoch": 3373} {"train_loss": -25.095836639404297, "global_step": 279969, "epoch": 3373} {"train_loss": -25.392995834350586, "global_step": 279970, "epoch": 3373} {"train_loss": -25.454736709594727, "global_step": 279971, "epoch": 3373} {"train_loss": -25.479381561279297, "global_step": 279972, "epoch": 3373} {"train_loss": -25.495777130126953, "global_step": 279973, "epoch": 3373} {"train_loss": -25.18409538269043, "global_step": 279974, "epoch": 3373} {"train_loss": -25.092329025268555, "global_step": 279975, "epoch": 3373} {"train_loss": -25.229028701782227, "global_step": 279976, "epoch": 3373} {"train_loss": -25.184778213500977, "global_step": 279977, "epoch": 3373} {"train_loss": -25.016708374023438, "global_step": 279978, "epoch": 3373} {"train_loss": -25.291709899902344, "global_step": 279979, "epoch": 3373} {"train_loss": -25.29833984375, "global_step": 279980, "epoch": 3373} {"train_loss": -25.376197814941406, "global_step": 279981, "epoch": 3373} {"train_loss": -25.308637619018555, "global_step": 279982, "epoch": 3373} {"train_loss": -25.672510147094727, "global_step": 279983, "epoch": 3373} {"train_loss": -25.38538932800293, "global_step": 279984, "epoch": 3373} {"train_loss": -25.148935317993164, "global_step": 279985, "epoch": 3373} {"train_loss": -25.257448196411133, "global_step": 279986, "epoch": 3373} {"train_loss": -25.4730281829834, "global_step": 279987, "epoch": 3373} {"train_loss": -25.51249122619629, "global_step": 279988, "epoch": 3373} {"train_loss": -25.498159408569336, "global_step": 279989, "epoch": 3373} {"train_loss": -25.082202911376953, "global_step": 279990, "epoch": 3373} {"train_loss": -25.429140090942383, "global_step": 279991, "epoch": 3373} {"train_loss": -25.509984970092773, "global_step": 279992, "epoch": 3373} {"train_loss": -25.17371940612793, "global_step": 279993, "epoch": 3373} {"train_loss": -25.508527755737305, "global_step": 279994, "epoch": 3373} {"train_loss": -25.378854751586914, "global_step": 279995, "epoch": 3373} {"train_loss": -25.306411743164062, "global_step": 279996, "epoch": 3373} {"train_loss": -25.724592208862305, "global_step": 279997, "epoch": 3373} {"train_loss": -25.750595092773438, "global_step": 279998, "epoch": 3373} {"train_loss": -25.62662696838379, "global_step": 279999, "epoch": 3373} {"train_loss": -25.591955184936523, "global_step": 280000, "epoch": 3373} {"train_loss": -25.43318748474121, "global_step": 280001, "epoch": 3373} {"train_loss": -25.373186111450195, "global_step": 280002, "epoch": 3373} {"train_loss": -25.792749404907227, "global_step": 280003, "epoch": 3373} {"train_loss": -25.44363021850586, "global_step": 280004, "epoch": 3373} {"train_loss": -25.497039794921875, "global_step": 280005, "epoch": 3373} {"train_loss": -25.80430030822754, "global_step": 280006, "epoch": 3373} {"train_loss": -25.56441307067871, "global_step": 280007, "epoch": 3373} {"train_loss": -25.478622436523438, "global_step": 280008, "epoch": 3373} {"train_loss": -25.363691329956055, "global_step": 280009, "epoch": 3373} {"train_loss": -25.062448501586914, "global_step": 280010, "epoch": 3373} {"train_loss": -25.20871925354004, "global_step": 280011, "epoch": 3373} {"train_loss": -25.512853622436523, "global_step": 280012, "epoch": 3373} {"train_loss": -25.505529403686523, "global_step": 280013, "epoch": 3373} {"train_loss": -25.665546417236328, "global_step": 280014, "epoch": 3373} {"train_loss": -25.40789794921875, "global_step": 280015, "epoch": 3373} {"train_loss": -25.547834396362305, "global_step": 280016, "epoch": 3373} {"train_loss": -25.679784774780273, "global_step": 280017, "epoch": 3373} {"train_loss": -25.48612403869629, "global_step": 280018, "epoch": 3373} {"train_loss": -25.329504013061523, "global_step": 280019, "epoch": 3373} {"train_loss": -25.581266403198242, "global_step": 280020, "epoch": 3373} {"train_loss": -25.423086166381836, "global_step": 280021, "epoch": 3373} {"train_loss": -25.542591094970703, "global_step": 280022, "epoch": 3373} {"train_loss": -25.64357566833496, "global_step": 280023, "epoch": 3373} {"train_loss": -25.5014591217041, "global_step": 280024, "epoch": 3373} {"train_loss": -25.446033477783203, "global_step": 280025, "epoch": 3373} {"train_loss": -25.475631713867188, "global_step": 280026, "epoch": 3373} {"train_loss": -25.390565872192383, "global_step": 280027, "epoch": 3373} {"train_loss": -25.331838607788086, "global_step": 280028, "epoch": 3373} {"train_loss": -25.419111251831055, "global_step": 280029, "epoch": 3373} {"train_loss": -25.399715423583984, "global_step": 280030, "epoch": 3373} {"train_loss": -25.213687896728516, "global_step": 280031, "epoch": 3373} {"train_loss": -25.342321395874023, "global_step": 280032, "epoch": 3373} {"train_loss": -25.26250648498535, "global_step": 280033, "epoch": 3373} {"train_loss": -25.669626235961914, "global_step": 280034, "epoch": 3373} {"train_loss": -25.339082717895508, "global_step": 280035, "epoch": 3373} {"train_loss": -25.141572952270508, "global_step": 280036, "epoch": 3373} {"train_loss": -24.6169376373291, "global_step": 280037, "epoch": 3373} {"train_loss": -24.554471969604492, "global_step": 280038, "epoch": 3373} {"train_loss": -24.97511100769043, "global_step": 280039, "epoch": 3373} {"train_loss": -25.22903060913086, "global_step": 280040, "epoch": 3373} {"train_loss": -25.34778652420963, "global_step": 280041, "epoch": 3373, "val_loss": 7037611.0} {"train_loss": -24.0997257232666, "global_step": 280042, "epoch": 3374} {"train_loss": -24.380094528198242, "global_step": 280043, "epoch": 3374} {"train_loss": -23.76048469543457, "global_step": 280044, "epoch": 3374} {"train_loss": -23.89493751525879, "global_step": 280045, "epoch": 3374} {"train_loss": -24.593229293823242, "global_step": 280046, "epoch": 3374} {"train_loss": -23.792814254760742, "global_step": 280047, "epoch": 3374} {"train_loss": -24.501718521118164, "global_step": 280048, "epoch": 3374} {"train_loss": -23.919021606445312, "global_step": 280049, "epoch": 3374} {"train_loss": -24.716541290283203, "global_step": 280050, "epoch": 3374} {"train_loss": -24.96973991394043, "global_step": 280051, "epoch": 3374} {"train_loss": -24.320629119873047, "global_step": 280052, "epoch": 3374} {"train_loss": -24.65232276916504, "global_step": 280053, "epoch": 3374} {"train_loss": -24.684799194335938, "global_step": 280054, "epoch": 3374} {"train_loss": -24.475065231323242, "global_step": 280055, "epoch": 3374} {"train_loss": -24.652969360351562, "global_step": 280056, "epoch": 3374} {"train_loss": -24.660436630249023, "global_step": 280057, "epoch": 3374} {"train_loss": -24.93595314025879, "global_step": 280058, "epoch": 3374} {"train_loss": -25.0628719329834, "global_step": 280059, "epoch": 3374} {"train_loss": -24.661813735961914, "global_step": 280060, "epoch": 3374} {"train_loss": -24.707517623901367, "global_step": 280061, "epoch": 3374} {"train_loss": -25.162837982177734, "global_step": 280062, "epoch": 3374} {"train_loss": -24.952869415283203, "global_step": 280063, "epoch": 3374} {"train_loss": -25.06671714782715, "global_step": 280064, "epoch": 3374} {"train_loss": -25.48095703125, "global_step": 280065, "epoch": 3374} {"train_loss": -25.284494400024414, "global_step": 280066, "epoch": 3374} {"train_loss": -25.462732315063477, "global_step": 280067, "epoch": 3374} {"train_loss": -25.138402938842773, "global_step": 280068, "epoch": 3374} {"train_loss": -25.224328994750977, "global_step": 280069, "epoch": 3374} {"train_loss": -25.334901809692383, "global_step": 280070, "epoch": 3374} {"train_loss": -25.31467056274414, "global_step": 280071, "epoch": 3374} {"train_loss": -25.136980056762695, "global_step": 280072, "epoch": 3374} {"train_loss": -24.982019424438477, "global_step": 280073, "epoch": 3374} {"train_loss": -25.37757682800293, "global_step": 280074, "epoch": 3374} {"train_loss": -25.44024658203125, "global_step": 280075, "epoch": 3374} {"train_loss": -25.204883575439453, "global_step": 280076, "epoch": 3374} {"train_loss": -25.533109664916992, "global_step": 280077, "epoch": 3374} {"train_loss": -25.003347396850586, "global_step": 280078, "epoch": 3374} {"train_loss": -25.440898895263672, "global_step": 280079, "epoch": 3374} {"train_loss": -25.58615493774414, "global_step": 280080, "epoch": 3374} {"train_loss": -25.232553482055664, "global_step": 280081, "epoch": 3374} {"train_loss": -25.198511123657227, "global_step": 280082, "epoch": 3374} {"train_loss": -25.225318908691406, "global_step": 280083, "epoch": 3374} {"train_loss": -25.656469345092773, "global_step": 280084, "epoch": 3374} {"train_loss": -25.291791915893555, "global_step": 280085, "epoch": 3374} {"train_loss": -25.326387405395508, "global_step": 280086, "epoch": 3374} {"train_loss": -25.32845115661621, "global_step": 280087, "epoch": 3374} {"train_loss": -25.54690933227539, "global_step": 280088, "epoch": 3374} {"train_loss": -25.408933639526367, "global_step": 280089, "epoch": 3374} {"train_loss": -25.56355857849121, "global_step": 280090, "epoch": 3374} {"train_loss": -25.52335548400879, "global_step": 280091, "epoch": 3374} {"train_loss": -25.6535587310791, "global_step": 280092, "epoch": 3374} {"train_loss": -25.270458221435547, "global_step": 280093, "epoch": 3374} {"train_loss": -25.64320945739746, "global_step": 280094, "epoch": 3374} {"train_loss": -25.42990493774414, "global_step": 280095, "epoch": 3374} {"train_loss": -25.029218673706055, "global_step": 280096, "epoch": 3374} {"train_loss": -25.069311141967773, "global_step": 280097, "epoch": 3374} {"train_loss": -25.447053909301758, "global_step": 280098, "epoch": 3374} {"train_loss": -25.4453125, "global_step": 280099, "epoch": 3374} {"train_loss": -24.93387222290039, "global_step": 280100, "epoch": 3374} {"train_loss": -25.272750854492188, "global_step": 280101, "epoch": 3374} {"train_loss": -25.177350997924805, "global_step": 280102, "epoch": 3374} {"train_loss": -24.501686096191406, "global_step": 280103, "epoch": 3374} {"train_loss": -24.879404067993164, "global_step": 280104, "epoch": 3374} {"train_loss": -25.31641960144043, "global_step": 280105, "epoch": 3374} {"train_loss": -25.210020065307617, "global_step": 280106, "epoch": 3374} {"train_loss": -25.53253746032715, "global_step": 280107, "epoch": 3374} {"train_loss": -25.297426223754883, "global_step": 280108, "epoch": 3374} {"train_loss": -25.203323364257812, "global_step": 280109, "epoch": 3374} {"train_loss": -25.7300968170166, "global_step": 280110, "epoch": 3374} {"train_loss": -25.40266990661621, "global_step": 280111, "epoch": 3374} {"train_loss": -25.62361717224121, "global_step": 280112, "epoch": 3374} {"train_loss": -25.125022888183594, "global_step": 280113, "epoch": 3374} {"train_loss": -25.767255783081055, "global_step": 280114, "epoch": 3374} {"train_loss": -25.236417770385742, "global_step": 280115, "epoch": 3374} {"train_loss": -25.23969841003418, "global_step": 280116, "epoch": 3374} {"train_loss": -25.384275436401367, "global_step": 280117, "epoch": 3374} {"train_loss": -25.113080978393555, "global_step": 280118, "epoch": 3374} {"train_loss": -24.995059967041016, "global_step": 280119, "epoch": 3374} {"train_loss": -25.436588287353516, "global_step": 280120, "epoch": 3374} {"train_loss": -25.03279685974121, "global_step": 280121, "epoch": 3374} {"train_loss": -24.959096908569336, "global_step": 280122, "epoch": 3374} {"train_loss": -25.550792694091797, "global_step": 280123, "epoch": 3374} {"train_loss": -25.08703344414033, "global_step": 280124, "epoch": 3374, "val_loss": 6920467.0} {"train_loss": -24.586305618286133, "global_step": 280125, "epoch": 3375} {"train_loss": -24.820051193237305, "global_step": 280126, "epoch": 3375} {"train_loss": -24.632843017578125, "global_step": 280127, "epoch": 3375} {"train_loss": -24.6185302734375, "global_step": 280128, "epoch": 3375} {"train_loss": -24.59214210510254, "global_step": 280129, "epoch": 3375} {"train_loss": -25.037906646728516, "global_step": 280130, "epoch": 3375} {"train_loss": -25.188644409179688, "global_step": 280131, "epoch": 3375} {"train_loss": -24.994800567626953, "global_step": 280132, "epoch": 3375} {"train_loss": -25.01959800720215, "global_step": 280133, "epoch": 3375} {"train_loss": -25.305553436279297, "global_step": 280134, "epoch": 3375} {"train_loss": -25.333511352539062, "global_step": 280135, "epoch": 3375} {"train_loss": -25.481063842773438, "global_step": 280136, "epoch": 3375} {"train_loss": -25.04388427734375, "global_step": 280137, "epoch": 3375} {"train_loss": -25.252483367919922, "global_step": 280138, "epoch": 3375} {"train_loss": -25.119979858398438, "global_step": 280139, "epoch": 3375} {"train_loss": -25.197284698486328, "global_step": 280140, "epoch": 3375} {"train_loss": -25.134023666381836, "global_step": 280141, "epoch": 3375} {"train_loss": -25.111906051635742, "global_step": 280142, "epoch": 3375} {"train_loss": -25.276962280273438, "global_step": 280143, "epoch": 3375} {"train_loss": -25.291057586669922, "global_step": 280144, "epoch": 3375} {"train_loss": -25.19706916809082, "global_step": 280145, "epoch": 3375} {"train_loss": -25.43960952758789, "global_step": 280146, "epoch": 3375} {"train_loss": -25.464298248291016, "global_step": 280147, "epoch": 3375} {"train_loss": -25.240385055541992, "global_step": 280148, "epoch": 3375} {"train_loss": -25.50022315979004, "global_step": 280149, "epoch": 3375} {"train_loss": -25.034774780273438, "global_step": 280150, "epoch": 3375} {"train_loss": -25.38301658630371, "global_step": 280151, "epoch": 3375} {"train_loss": -25.461164474487305, "global_step": 280152, "epoch": 3375} {"train_loss": -25.796894073486328, "global_step": 280153, "epoch": 3375} {"train_loss": -25.36466407775879, "global_step": 280154, "epoch": 3375} {"train_loss": -25.60224723815918, "global_step": 280155, "epoch": 3375} {"train_loss": -25.68776512145996, "global_step": 280156, "epoch": 3375} {"train_loss": -25.326913833618164, "global_step": 280157, "epoch": 3375} {"train_loss": -25.1147403717041, "global_step": 280158, "epoch": 3375} {"train_loss": -25.579954147338867, "global_step": 280159, "epoch": 3375} {"train_loss": -25.43868064880371, "global_step": 280160, "epoch": 3375} {"train_loss": -25.314855575561523, "global_step": 280161, "epoch": 3375} {"train_loss": -25.232885360717773, "global_step": 280162, "epoch": 3375} {"train_loss": -25.809467315673828, "global_step": 280163, "epoch": 3375} {"train_loss": -25.56867027282715, "global_step": 280164, "epoch": 3375} {"train_loss": -25.168655395507812, "global_step": 280165, "epoch": 3375} {"train_loss": -25.588743209838867, "global_step": 280166, "epoch": 3375} {"train_loss": -25.312788009643555, "global_step": 280167, "epoch": 3375} {"train_loss": -25.575119018554688, "global_step": 280168, "epoch": 3375} {"train_loss": -25.453563690185547, "global_step": 280169, "epoch": 3375} {"train_loss": -25.669025421142578, "global_step": 280170, "epoch": 3375} {"train_loss": -26.088367462158203, "global_step": 280171, "epoch": 3375} {"train_loss": -25.662555694580078, "global_step": 280172, "epoch": 3375} {"train_loss": -25.6126766204834, "global_step": 280173, "epoch": 3375} {"train_loss": -25.2396240234375, "global_step": 280174, "epoch": 3375} {"train_loss": -25.513273239135742, "global_step": 280175, "epoch": 3375} {"train_loss": -25.22676658630371, "global_step": 280176, "epoch": 3375} {"train_loss": -25.39518928527832, "global_step": 280177, "epoch": 3375} {"train_loss": -25.355825424194336, "global_step": 280178, "epoch": 3375} {"train_loss": -26.027603149414062, "global_step": 280179, "epoch": 3375} {"train_loss": -25.10020637512207, "global_step": 280180, "epoch": 3375} {"train_loss": -25.42698097229004, "global_step": 280181, "epoch": 3375} {"train_loss": -25.42816734313965, "global_step": 280182, "epoch": 3375} {"train_loss": -25.887094497680664, "global_step": 280183, "epoch": 3375} {"train_loss": -25.73430824279785, "global_step": 280184, "epoch": 3375} {"train_loss": -25.053003311157227, "global_step": 280185, "epoch": 3375} {"train_loss": -25.041532516479492, "global_step": 280186, "epoch": 3375} {"train_loss": -25.508106231689453, "global_step": 280187, "epoch": 3375} {"train_loss": -25.29225730895996, "global_step": 280188, "epoch": 3375} {"train_loss": -25.051345825195312, "global_step": 280189, "epoch": 3375} {"train_loss": -24.952341079711914, "global_step": 280190, "epoch": 3375} {"train_loss": -25.62592887878418, "global_step": 280191, "epoch": 3375} {"train_loss": -25.6826229095459, "global_step": 280192, "epoch": 3375} {"train_loss": -24.884462356567383, "global_step": 280193, "epoch": 3375} {"train_loss": -25.523134231567383, "global_step": 280194, "epoch": 3375} {"train_loss": -25.665878295898438, "global_step": 280195, "epoch": 3375} {"train_loss": -25.38252067565918, "global_step": 280196, "epoch": 3375} {"train_loss": -25.4456844329834, "global_step": 280197, "epoch": 3375} {"train_loss": -25.272293090820312, "global_step": 280198, "epoch": 3375} {"train_loss": -25.295812606811523, "global_step": 280199, "epoch": 3375} {"train_loss": -25.26576805114746, "global_step": 280200, "epoch": 3375} {"train_loss": -25.424406051635742, "global_step": 280201, "epoch": 3375} {"train_loss": -25.46271324157715, "global_step": 280202, "epoch": 3375} {"train_loss": -25.517881393432617, "global_step": 280203, "epoch": 3375} {"train_loss": -25.32270622253418, "global_step": 280204, "epoch": 3375} {"train_loss": -25.58192253112793, "global_step": 280205, "epoch": 3375} {"train_loss": -25.41834831237793, "global_step": 280206, "epoch": 3375} {"train_loss": -25.344459188989845, "global_step": 280207, "epoch": 3375, "val_loss": 7118872.0} {"train_loss": -25.10310935974121, "global_step": 280208, "epoch": 3376} {"train_loss": -25.413097381591797, "global_step": 280209, "epoch": 3376} {"train_loss": -24.95829963684082, "global_step": 280210, "epoch": 3376} {"train_loss": -25.250850677490234, "global_step": 280211, "epoch": 3376} {"train_loss": -25.24374008178711, "global_step": 280212, "epoch": 3376} {"train_loss": -25.309675216674805, "global_step": 280213, "epoch": 3376} {"train_loss": -24.920896530151367, "global_step": 280214, "epoch": 3376} {"train_loss": -25.305133819580078, "global_step": 280215, "epoch": 3376} {"train_loss": -25.492700576782227, "global_step": 280216, "epoch": 3376} {"train_loss": -25.51782989501953, "global_step": 280217, "epoch": 3376} {"train_loss": -25.4049072265625, "global_step": 280218, "epoch": 3376} {"train_loss": -25.487857818603516, "global_step": 280219, "epoch": 3376} {"train_loss": -25.448801040649414, "global_step": 280220, "epoch": 3376} {"train_loss": -25.14444351196289, "global_step": 280221, "epoch": 3376} {"train_loss": -24.89012336730957, "global_step": 280222, "epoch": 3376} {"train_loss": -25.46755599975586, "global_step": 280223, "epoch": 3376} {"train_loss": -25.572006225585938, "global_step": 280224, "epoch": 3376} {"train_loss": -25.145736694335938, "global_step": 280225, "epoch": 3376} {"train_loss": -25.491764068603516, "global_step": 280226, "epoch": 3376} {"train_loss": -25.054441452026367, "global_step": 280227, "epoch": 3376} {"train_loss": -25.53025245666504, "global_step": 280228, "epoch": 3376} {"train_loss": -25.57540512084961, "global_step": 280229, "epoch": 3376} {"train_loss": -25.313169479370117, "global_step": 280230, "epoch": 3376} {"train_loss": -25.27009391784668, "global_step": 280231, "epoch": 3376} {"train_loss": -25.2811279296875, "global_step": 280232, "epoch": 3376} {"train_loss": -25.648578643798828, "global_step": 280233, "epoch": 3376} {"train_loss": -25.54878044128418, "global_step": 280234, "epoch": 3376} {"train_loss": -25.2387638092041, "global_step": 280235, "epoch": 3376} {"train_loss": -25.294986724853516, "global_step": 280236, "epoch": 3376} {"train_loss": -25.278587341308594, "global_step": 280237, "epoch": 3376} {"train_loss": -25.3083438873291, "global_step": 280238, "epoch": 3376} {"train_loss": -25.297456741333008, "global_step": 280239, "epoch": 3376} {"train_loss": -25.23333740234375, "global_step": 280240, "epoch": 3376} {"train_loss": -25.148691177368164, "global_step": 280241, "epoch": 3376} {"train_loss": -25.420312881469727, "global_step": 280242, "epoch": 3376} {"train_loss": -25.389150619506836, "global_step": 280243, "epoch": 3376} {"train_loss": -25.47739601135254, "global_step": 280244, "epoch": 3376} {"train_loss": -25.33154296875, "global_step": 280245, "epoch": 3376} {"train_loss": -25.293516159057617, "global_step": 280246, "epoch": 3376} {"train_loss": -24.960744857788086, "global_step": 280247, "epoch": 3376} {"train_loss": -25.493057250976562, "global_step": 280248, "epoch": 3376} {"train_loss": -25.652008056640625, "global_step": 280249, "epoch": 3376} {"train_loss": -25.29355239868164, "global_step": 280250, "epoch": 3376} {"train_loss": -25.5611629486084, "global_step": 280251, "epoch": 3376} {"train_loss": -25.27174186706543, "global_step": 280252, "epoch": 3376} {"train_loss": -25.084903717041016, "global_step": 280253, "epoch": 3376} {"train_loss": -25.706195831298828, "global_step": 280254, "epoch": 3376} {"train_loss": -25.36989402770996, "global_step": 280255, "epoch": 3376} {"train_loss": -25.76936912536621, "global_step": 280256, "epoch": 3376} {"train_loss": -25.281320571899414, "global_step": 280257, "epoch": 3376} {"train_loss": -25.408527374267578, "global_step": 280258, "epoch": 3376} {"train_loss": -25.454248428344727, "global_step": 280259, "epoch": 3376} {"train_loss": -25.75349235534668, "global_step": 280260, "epoch": 3376} {"train_loss": -25.540109634399414, "global_step": 280261, "epoch": 3376} {"train_loss": -25.25167465209961, "global_step": 280262, "epoch": 3376} {"train_loss": -25.379947662353516, "global_step": 280263, "epoch": 3376} {"train_loss": -25.701892852783203, "global_step": 280264, "epoch": 3376} {"train_loss": -25.51192283630371, "global_step": 280265, "epoch": 3376} {"train_loss": -25.218215942382812, "global_step": 280266, "epoch": 3376} {"train_loss": -25.09341812133789, "global_step": 280267, "epoch": 3376} {"train_loss": -25.637327194213867, "global_step": 280268, "epoch": 3376} {"train_loss": -25.272342681884766, "global_step": 280269, "epoch": 3376} {"train_loss": -25.36504364013672, "global_step": 280270, "epoch": 3376} {"train_loss": -25.558746337890625, "global_step": 280271, "epoch": 3376} {"train_loss": -25.677799224853516, "global_step": 280272, "epoch": 3376} {"train_loss": -25.577661514282227, "global_step": 280273, "epoch": 3376} {"train_loss": -25.264013290405273, "global_step": 280274, "epoch": 3376} {"train_loss": -25.44772720336914, "global_step": 280275, "epoch": 3376} {"train_loss": -25.20465660095215, "global_step": 280276, "epoch": 3376} {"train_loss": -25.74712562561035, "global_step": 280277, "epoch": 3376} {"train_loss": -25.79408073425293, "global_step": 280278, "epoch": 3376} {"train_loss": -25.43624496459961, "global_step": 280279, "epoch": 3376} {"train_loss": -24.7523250579834, "global_step": 280280, "epoch": 3376} {"train_loss": -23.9483585357666, "global_step": 280281, "epoch": 3376} {"train_loss": -23.17042350769043, "global_step": 280282, "epoch": 3376} {"train_loss": -24.28397560119629, "global_step": 280283, "epoch": 3376} {"train_loss": -24.326858520507812, "global_step": 280284, "epoch": 3376} {"train_loss": -24.948328018188477, "global_step": 280285, "epoch": 3376} {"train_loss": -24.62504768371582, "global_step": 280286, "epoch": 3376} {"train_loss": -24.715734481811523, "global_step": 280287, "epoch": 3376} {"train_loss": -24.874561309814453, "global_step": 280288, "epoch": 3376} {"train_loss": -25.170211791992188, "global_step": 280289, "epoch": 3376} {"train_loss": -25.255479215139367, "global_step": 280290, "epoch": 3376, "val_loss": 7045433.0} {"train_loss": -24.438140869140625, "global_step": 280291, "epoch": 3377} {"train_loss": -24.707929611206055, "global_step": 280292, "epoch": 3377} {"train_loss": -24.573158264160156, "global_step": 280293, "epoch": 3377} {"train_loss": -24.55042839050293, "global_step": 280294, "epoch": 3377} {"train_loss": -24.5446720123291, "global_step": 280295, "epoch": 3377} {"train_loss": -24.836292266845703, "global_step": 280296, "epoch": 3377} {"train_loss": -24.7296142578125, "global_step": 280297, "epoch": 3377} {"train_loss": -24.665388107299805, "global_step": 280298, "epoch": 3377} {"train_loss": -24.617589950561523, "global_step": 280299, "epoch": 3377} {"train_loss": -24.647109985351562, "global_step": 280300, "epoch": 3377} {"train_loss": -24.618406295776367, "global_step": 280301, "epoch": 3377} {"train_loss": -24.62373924255371, "global_step": 280302, "epoch": 3377} {"train_loss": -24.93071746826172, "global_step": 280303, "epoch": 3377} {"train_loss": -24.812732696533203, "global_step": 280304, "epoch": 3377} {"train_loss": -25.011442184448242, "global_step": 280305, "epoch": 3377} {"train_loss": -25.301149368286133, "global_step": 280306, "epoch": 3377} {"train_loss": -24.826339721679688, "global_step": 280307, "epoch": 3377} {"train_loss": -25.079458236694336, "global_step": 280308, "epoch": 3377} {"train_loss": -25.153396606445312, "global_step": 280309, "epoch": 3377} {"train_loss": -24.88519859313965, "global_step": 280310, "epoch": 3377} {"train_loss": -24.809492111206055, "global_step": 280311, "epoch": 3377} {"train_loss": -24.975675582885742, "global_step": 280312, "epoch": 3377} {"train_loss": -25.190122604370117, "global_step": 280313, "epoch": 3377} {"train_loss": -25.20902442932129, "global_step": 280314, "epoch": 3377} {"train_loss": -25.176074981689453, "global_step": 280315, "epoch": 3377} {"train_loss": -25.12057876586914, "global_step": 280316, "epoch": 3377} {"train_loss": -25.36051368713379, "global_step": 280317, "epoch": 3377} {"train_loss": -25.5050048828125, "global_step": 280318, "epoch": 3377} {"train_loss": -25.187362670898438, "global_step": 280319, "epoch": 3377} {"train_loss": -25.52443504333496, "global_step": 280320, "epoch": 3377} {"train_loss": -25.440231323242188, "global_step": 280321, "epoch": 3377} {"train_loss": -25.8509464263916, "global_step": 280322, "epoch": 3377} {"train_loss": -25.4757080078125, "global_step": 280323, "epoch": 3377} {"train_loss": -25.201644897460938, "global_step": 280324, "epoch": 3377} {"train_loss": -25.6563777923584, "global_step": 280325, "epoch": 3377} {"train_loss": -25.605863571166992, "global_step": 280326, "epoch": 3377} {"train_loss": -25.458189010620117, "global_step": 280327, "epoch": 3377} {"train_loss": -25.64039421081543, "global_step": 280328, "epoch": 3377} {"train_loss": -25.53187370300293, "global_step": 280329, "epoch": 3377} {"train_loss": -25.235403060913086, "global_step": 280330, "epoch": 3377} {"train_loss": -25.437599182128906, "global_step": 280331, "epoch": 3377} {"train_loss": -25.535991668701172, "global_step": 280332, "epoch": 3377} {"train_loss": -25.6824951171875, "global_step": 280333, "epoch": 3377} {"train_loss": -25.4050350189209, "global_step": 280334, "epoch": 3377} {"train_loss": -25.66814613342285, "global_step": 280335, "epoch": 3377} {"train_loss": -25.45790672302246, "global_step": 280336, "epoch": 3377} {"train_loss": -25.52937126159668, "global_step": 280337, "epoch": 3377} {"train_loss": -25.796356201171875, "global_step": 280338, "epoch": 3377} {"train_loss": -25.898725509643555, "global_step": 280339, "epoch": 3377} {"train_loss": -26.08098793029785, "global_step": 280340, "epoch": 3377} {"train_loss": -25.206024169921875, "global_step": 280341, "epoch": 3377} {"train_loss": -25.412546157836914, "global_step": 280342, "epoch": 3377} {"train_loss": -24.947845458984375, "global_step": 280343, "epoch": 3377} {"train_loss": -24.884695053100586, "global_step": 280344, "epoch": 3377} {"train_loss": -25.245023727416992, "global_step": 280345, "epoch": 3377} {"train_loss": -25.359708786010742, "global_step": 280346, "epoch": 3377} {"train_loss": -25.184125900268555, "global_step": 280347, "epoch": 3377} {"train_loss": -25.607343673706055, "global_step": 280348, "epoch": 3377} {"train_loss": -25.228424072265625, "global_step": 280349, "epoch": 3377} {"train_loss": -25.519325256347656, "global_step": 280350, "epoch": 3377} {"train_loss": -25.551416397094727, "global_step": 280351, "epoch": 3377} {"train_loss": -25.308349609375, "global_step": 280352, "epoch": 3377} {"train_loss": -25.630605697631836, "global_step": 280353, "epoch": 3377} {"train_loss": -25.506223678588867, "global_step": 280354, "epoch": 3377} {"train_loss": -25.38726234436035, "global_step": 280355, "epoch": 3377} {"train_loss": -25.318281173706055, "global_step": 280356, "epoch": 3377} {"train_loss": -25.817646026611328, "global_step": 280357, "epoch": 3377} {"train_loss": -25.0587100982666, "global_step": 280358, "epoch": 3377} {"train_loss": -25.590673446655273, "global_step": 280359, "epoch": 3377} {"train_loss": -25.22051429748535, "global_step": 280360, "epoch": 3377} {"train_loss": -25.516620635986328, "global_step": 280361, "epoch": 3377} {"train_loss": -25.441707611083984, "global_step": 280362, "epoch": 3377} {"train_loss": -25.522031784057617, "global_step": 280363, "epoch": 3377} {"train_loss": -25.61226463317871, "global_step": 280364, "epoch": 3377} {"train_loss": -25.466764450073242, "global_step": 280365, "epoch": 3377} {"train_loss": -25.498525619506836, "global_step": 280366, "epoch": 3377} {"train_loss": -25.585981369018555, "global_step": 280367, "epoch": 3377} {"train_loss": -25.293088912963867, "global_step": 280368, "epoch": 3377} {"train_loss": -25.37856101989746, "global_step": 280369, "epoch": 3377} {"train_loss": -25.36615562438965, "global_step": 280370, "epoch": 3377} {"train_loss": -25.441329956054688, "global_step": 280371, "epoch": 3377} {"train_loss": -25.382551193237305, "global_step": 280372, "epoch": 3377} {"train_loss": -25.261338590139367, "global_step": 280373, "epoch": 3377, "val_loss": 7073928.0} {"train_loss": -25.24601173400879, "global_step": 280374, "epoch": 3378} {"train_loss": -25.11819839477539, "global_step": 280375, "epoch": 3378} {"train_loss": -25.313037872314453, "global_step": 280376, "epoch": 3378} {"train_loss": -25.05768394470215, "global_step": 280377, "epoch": 3378} {"train_loss": -25.072847366333008, "global_step": 280378, "epoch": 3378} {"train_loss": -25.142194747924805, "global_step": 280379, "epoch": 3378} {"train_loss": -25.334617614746094, "global_step": 280380, "epoch": 3378} {"train_loss": -25.013399124145508, "global_step": 280381, "epoch": 3378} {"train_loss": -25.1272029876709, "global_step": 280382, "epoch": 3378} {"train_loss": -24.816028594970703, "global_step": 280383, "epoch": 3378} {"train_loss": -24.94352149963379, "global_step": 280384, "epoch": 3378} {"train_loss": -25.24293327331543, "global_step": 280385, "epoch": 3378} {"train_loss": -24.777475357055664, "global_step": 280386, "epoch": 3378} {"train_loss": -25.207792282104492, "global_step": 280387, "epoch": 3378} {"train_loss": -25.361038208007812, "global_step": 280388, "epoch": 3378} {"train_loss": -25.29328727722168, "global_step": 280389, "epoch": 3378} {"train_loss": -25.138233184814453, "global_step": 280390, "epoch": 3378} {"train_loss": -25.318161010742188, "global_step": 280391, "epoch": 3378} {"train_loss": -24.98737907409668, "global_step": 280392, "epoch": 3378} {"train_loss": -25.26336669921875, "global_step": 280393, "epoch": 3378} {"train_loss": -25.074506759643555, "global_step": 280394, "epoch": 3378} {"train_loss": -25.32547378540039, "global_step": 280395, "epoch": 3378} {"train_loss": -25.05693244934082, "global_step": 280396, "epoch": 3378} {"train_loss": -25.270343780517578, "global_step": 280397, "epoch": 3378} {"train_loss": -25.482954025268555, "global_step": 280398, "epoch": 3378} {"train_loss": -25.683496475219727, "global_step": 280399, "epoch": 3378} {"train_loss": -25.178617477416992, "global_step": 280400, "epoch": 3378} {"train_loss": -25.32645034790039, "global_step": 280401, "epoch": 3378} {"train_loss": -25.254730224609375, "global_step": 280402, "epoch": 3378} {"train_loss": -25.35495948791504, "global_step": 280403, "epoch": 3378} {"train_loss": -25.182117462158203, "global_step": 280404, "epoch": 3378} {"train_loss": -25.33056640625, "global_step": 280405, "epoch": 3378} {"train_loss": -25.36298179626465, "global_step": 280406, "epoch": 3378} {"train_loss": -25.248449325561523, "global_step": 280407, "epoch": 3378} {"train_loss": -25.347145080566406, "global_step": 280408, "epoch": 3378} {"train_loss": -25.38080406188965, "global_step": 280409, "epoch": 3378} {"train_loss": -25.7417049407959, "global_step": 280410, "epoch": 3378} {"train_loss": -25.46402359008789, "global_step": 280411, "epoch": 3378} {"train_loss": -25.50572395324707, "global_step": 280412, "epoch": 3378} {"train_loss": -25.376224517822266, "global_step": 280413, "epoch": 3378} {"train_loss": -25.145523071289062, "global_step": 280414, "epoch": 3378} {"train_loss": -25.646961212158203, "global_step": 280415, "epoch": 3378} {"train_loss": -25.497142791748047, "global_step": 280416, "epoch": 3378} {"train_loss": -25.5264892578125, "global_step": 280417, "epoch": 3378} {"train_loss": -25.69170570373535, "global_step": 280418, "epoch": 3378} {"train_loss": -25.192243576049805, "global_step": 280419, "epoch": 3378} {"train_loss": -25.622167587280273, "global_step": 280420, "epoch": 3378} {"train_loss": -25.114059448242188, "global_step": 280421, "epoch": 3378} {"train_loss": -25.117124557495117, "global_step": 280422, "epoch": 3378} {"train_loss": -24.74286460876465, "global_step": 280423, "epoch": 3378} {"train_loss": -25.613147735595703, "global_step": 280424, "epoch": 3378} {"train_loss": -25.28470230102539, "global_step": 280425, "epoch": 3378} {"train_loss": -25.487398147583008, "global_step": 280426, "epoch": 3378} {"train_loss": -25.783979415893555, "global_step": 280427, "epoch": 3378} {"train_loss": -25.695392608642578, "global_step": 280428, "epoch": 3378} {"train_loss": -25.485986709594727, "global_step": 280429, "epoch": 3378} {"train_loss": -25.73768424987793, "global_step": 280430, "epoch": 3378} {"train_loss": -25.414072036743164, "global_step": 280431, "epoch": 3378} {"train_loss": -25.317663192749023, "global_step": 280432, "epoch": 3378} {"train_loss": -25.29758644104004, "global_step": 280433, "epoch": 3378} {"train_loss": -25.408967971801758, "global_step": 280434, "epoch": 3378} {"train_loss": -25.66348648071289, "global_step": 280435, "epoch": 3378} {"train_loss": -25.159666061401367, "global_step": 280436, "epoch": 3378} {"train_loss": -25.572805404663086, "global_step": 280437, "epoch": 3378} {"train_loss": -25.6899471282959, "global_step": 280438, "epoch": 3378} {"train_loss": -25.41182518005371, "global_step": 280439, "epoch": 3378} {"train_loss": -25.285886764526367, "global_step": 280440, "epoch": 3378} {"train_loss": -25.166135787963867, "global_step": 280441, "epoch": 3378} {"train_loss": -25.721195220947266, "global_step": 280442, "epoch": 3378} {"train_loss": -25.72212028503418, "global_step": 280443, "epoch": 3378} {"train_loss": -25.52705192565918, "global_step": 280444, "epoch": 3378} {"train_loss": -25.432172775268555, "global_step": 280445, "epoch": 3378} {"train_loss": -25.389299392700195, "global_step": 280446, "epoch": 3378} {"train_loss": -25.4691219329834, "global_step": 280447, "epoch": 3378} {"train_loss": -25.50168800354004, "global_step": 280448, "epoch": 3378} {"train_loss": -25.087827682495117, "global_step": 280449, "epoch": 3378} {"train_loss": -25.344091415405273, "global_step": 280450, "epoch": 3378} {"train_loss": -25.442798614501953, "global_step": 280451, "epoch": 3378} {"train_loss": -25.441762924194336, "global_step": 280452, "epoch": 3378} {"train_loss": -25.301748275756836, "global_step": 280453, "epoch": 3378} {"train_loss": -25.30790138244629, "global_step": 280454, "epoch": 3378} {"train_loss": -25.40128517150879, "global_step": 280455, "epoch": 3378} {"train_loss": -25.34647031577237, "global_step": 280456, "epoch": 3378, "val_loss": 7028801.0} {"train_loss": -24.97359848022461, "global_step": 280457, "epoch": 3379} {"train_loss": -24.85129737854004, "global_step": 280458, "epoch": 3379} {"train_loss": -24.96013832092285, "global_step": 280459, "epoch": 3379} {"train_loss": -25.006418228149414, "global_step": 280460, "epoch": 3379} {"train_loss": -24.902109146118164, "global_step": 280461, "epoch": 3379} {"train_loss": -24.518516540527344, "global_step": 280462, "epoch": 3379} {"train_loss": -24.953601837158203, "global_step": 280463, "epoch": 3379} {"train_loss": -25.314105987548828, "global_step": 280464, "epoch": 3379} {"train_loss": -24.527729034423828, "global_step": 280465, "epoch": 3379} {"train_loss": -24.767011642456055, "global_step": 280466, "epoch": 3379} {"train_loss": -25.359773635864258, "global_step": 280467, "epoch": 3379} {"train_loss": -24.815439224243164, "global_step": 280468, "epoch": 3379} {"train_loss": -25.522558212280273, "global_step": 280469, "epoch": 3379} {"train_loss": -24.581932067871094, "global_step": 280470, "epoch": 3379} {"train_loss": -25.152633666992188, "global_step": 280471, "epoch": 3379} {"train_loss": -24.686941146850586, "global_step": 280472, "epoch": 3379} {"train_loss": -25.05134391784668, "global_step": 280473, "epoch": 3379} {"train_loss": -25.073440551757812, "global_step": 280474, "epoch": 3379} {"train_loss": -24.852237701416016, "global_step": 280475, "epoch": 3379} {"train_loss": -25.303512573242188, "global_step": 280476, "epoch": 3379} {"train_loss": -24.695295333862305, "global_step": 280477, "epoch": 3379} {"train_loss": -25.304737091064453, "global_step": 280478, "epoch": 3379} {"train_loss": -24.93874740600586, "global_step": 280479, "epoch": 3379} {"train_loss": -25.409494400024414, "global_step": 280480, "epoch": 3379} {"train_loss": -25.168119430541992, "global_step": 280481, "epoch": 3379} {"train_loss": -25.02203369140625, "global_step": 280482, "epoch": 3379} {"train_loss": -25.552270889282227, "global_step": 280483, "epoch": 3379} {"train_loss": -24.95045280456543, "global_step": 280484, "epoch": 3379} {"train_loss": -25.219228744506836, "global_step": 280485, "epoch": 3379} {"train_loss": -25.607690811157227, "global_step": 280486, "epoch": 3379} {"train_loss": -25.33024024963379, "global_step": 280487, "epoch": 3379} {"train_loss": -25.299312591552734, "global_step": 280488, "epoch": 3379} {"train_loss": -25.323816299438477, "global_step": 280489, "epoch": 3379} {"train_loss": -24.884389877319336, "global_step": 280490, "epoch": 3379} {"train_loss": -24.914398193359375, "global_step": 280491, "epoch": 3379} {"train_loss": -25.056013107299805, "global_step": 280492, "epoch": 3379} {"train_loss": -24.985288619995117, "global_step": 280493, "epoch": 3379} {"train_loss": -25.185426712036133, "global_step": 280494, "epoch": 3379} {"train_loss": -25.34308433532715, "global_step": 280495, "epoch": 3379} {"train_loss": -25.267841339111328, "global_step": 280496, "epoch": 3379} {"train_loss": -25.065217971801758, "global_step": 280497, "epoch": 3379} {"train_loss": -25.174518585205078, "global_step": 280498, "epoch": 3379} {"train_loss": -25.16069793701172, "global_step": 280499, "epoch": 3379} {"train_loss": -24.983728408813477, "global_step": 280500, "epoch": 3379} {"train_loss": -25.424652099609375, "global_step": 280501, "epoch": 3379} {"train_loss": -25.205251693725586, "global_step": 280502, "epoch": 3379} {"train_loss": -25.385229110717773, "global_step": 280503, "epoch": 3379} {"train_loss": -25.38441276550293, "global_step": 280504, "epoch": 3379} {"train_loss": -25.293964385986328, "global_step": 280505, "epoch": 3379} {"train_loss": -25.64031982421875, "global_step": 280506, "epoch": 3379} {"train_loss": -25.74518394470215, "global_step": 280507, "epoch": 3379} {"train_loss": -25.381893157958984, "global_step": 280508, "epoch": 3379} {"train_loss": -25.569541931152344, "global_step": 280509, "epoch": 3379} {"train_loss": -25.570093154907227, "global_step": 280510, "epoch": 3379} {"train_loss": -25.329992294311523, "global_step": 280511, "epoch": 3379} {"train_loss": -25.71254539489746, "global_step": 280512, "epoch": 3379} {"train_loss": -25.320863723754883, "global_step": 280513, "epoch": 3379} {"train_loss": -25.41284942626953, "global_step": 280514, "epoch": 3379} {"train_loss": -25.874923706054688, "global_step": 280515, "epoch": 3379} {"train_loss": -25.433229446411133, "global_step": 280516, "epoch": 3379} {"train_loss": -25.621824264526367, "global_step": 280517, "epoch": 3379} {"train_loss": -25.187108993530273, "global_step": 280518, "epoch": 3379} {"train_loss": -25.711048126220703, "global_step": 280519, "epoch": 3379} {"train_loss": -25.463645935058594, "global_step": 280520, "epoch": 3379} {"train_loss": -25.4314022064209, "global_step": 280521, "epoch": 3379} {"train_loss": -25.19287109375, "global_step": 280522, "epoch": 3379} {"train_loss": -25.331235885620117, "global_step": 280523, "epoch": 3379} {"train_loss": -25.638639450073242, "global_step": 280524, "epoch": 3379} {"train_loss": -25.111572265625, "global_step": 280525, "epoch": 3379} {"train_loss": -25.173675537109375, "global_step": 280526, "epoch": 3379} {"train_loss": -25.47300148010254, "global_step": 280527, "epoch": 3379} {"train_loss": -25.347469329833984, "global_step": 280528, "epoch": 3379} {"train_loss": -25.110692977905273, "global_step": 280529, "epoch": 3379} {"train_loss": -24.86908721923828, "global_step": 280530, "epoch": 3379} {"train_loss": -25.485801696777344, "global_step": 280531, "epoch": 3379} {"train_loss": -25.793676376342773, "global_step": 280532, "epoch": 3379} {"train_loss": -25.54629898071289, "global_step": 280533, "epoch": 3379} {"train_loss": -25.262948989868164, "global_step": 280534, "epoch": 3379} {"train_loss": -25.14686393737793, "global_step": 280535, "epoch": 3379} {"train_loss": -25.18044662475586, "global_step": 280536, "epoch": 3379} {"train_loss": -24.998151779174805, "global_step": 280537, "epoch": 3379} {"train_loss": -25.405683517456055, "global_step": 280538, "epoch": 3379} {"train_loss": -25.207645600100598, "global_step": 280539, "epoch": 3379, "val_loss": 7130300.0} {"train_loss": -24.428049087524414, "global_step": 280540, "epoch": 3380} {"train_loss": -25.231382369995117, "global_step": 280541, "epoch": 3380} {"train_loss": -24.365903854370117, "global_step": 280542, "epoch": 3380} {"train_loss": -24.92127799987793, "global_step": 280543, "epoch": 3380} {"train_loss": -24.787763595581055, "global_step": 280544, "epoch": 3380} {"train_loss": -25.05510711669922, "global_step": 280545, "epoch": 3380} {"train_loss": -24.746295928955078, "global_step": 280546, "epoch": 3380} {"train_loss": -25.092145919799805, "global_step": 280547, "epoch": 3380} {"train_loss": -24.996366500854492, "global_step": 280548, "epoch": 3380} {"train_loss": -25.509092330932617, "global_step": 280549, "epoch": 3380} {"train_loss": -25.458932876586914, "global_step": 280550, "epoch": 3380} {"train_loss": -25.315258026123047, "global_step": 280551, "epoch": 3380} {"train_loss": -24.829620361328125, "global_step": 280552, "epoch": 3380} {"train_loss": -25.178125381469727, "global_step": 280553, "epoch": 3380} {"train_loss": -25.454662322998047, "global_step": 280554, "epoch": 3380} {"train_loss": -25.004940032958984, "global_step": 280555, "epoch": 3380} {"train_loss": -25.00244903564453, "global_step": 280556, "epoch": 3380} {"train_loss": -25.07870101928711, "global_step": 280557, "epoch": 3380} {"train_loss": -25.55179214477539, "global_step": 280558, "epoch": 3380} {"train_loss": -25.486814498901367, "global_step": 280559, "epoch": 3380} {"train_loss": -25.444808959960938, "global_step": 280560, "epoch": 3380} {"train_loss": -25.36360740661621, "global_step": 280561, "epoch": 3380} {"train_loss": -25.58723258972168, "global_step": 280562, "epoch": 3380} {"train_loss": -24.973804473876953, "global_step": 280563, "epoch": 3380} {"train_loss": -24.876789093017578, "global_step": 280564, "epoch": 3380} {"train_loss": -25.219682693481445, "global_step": 280565, "epoch": 3380} {"train_loss": -25.688247680664062, "global_step": 280566, "epoch": 3380} {"train_loss": -25.344633102416992, "global_step": 280567, "epoch": 3380} {"train_loss": -25.329626083374023, "global_step": 280568, "epoch": 3380} {"train_loss": -25.41497802734375, "global_step": 280569, "epoch": 3380} {"train_loss": -25.56610679626465, "global_step": 280570, "epoch": 3380} {"train_loss": -25.471546173095703, "global_step": 280571, "epoch": 3380} {"train_loss": -25.584104537963867, "global_step": 280572, "epoch": 3380} {"train_loss": -25.76118278503418, "global_step": 280573, "epoch": 3380} {"train_loss": -25.60721778869629, "global_step": 280574, "epoch": 3380} {"train_loss": -25.451194763183594, "global_step": 280575, "epoch": 3380} {"train_loss": -25.391704559326172, "global_step": 280576, "epoch": 3380} {"train_loss": -25.79522705078125, "global_step": 280577, "epoch": 3380} {"train_loss": -25.542898178100586, "global_step": 280578, "epoch": 3380} {"train_loss": -25.67995262145996, "global_step": 280579, "epoch": 3380} {"train_loss": -25.486804962158203, "global_step": 280580, "epoch": 3380} {"train_loss": -25.49566650390625, "global_step": 280581, "epoch": 3380} {"train_loss": -25.638757705688477, "global_step": 280582, "epoch": 3380} {"train_loss": -25.347341537475586, "global_step": 280583, "epoch": 3380} {"train_loss": -25.52999496459961, "global_step": 280584, "epoch": 3380} {"train_loss": -25.566072463989258, "global_step": 280585, "epoch": 3380} {"train_loss": -25.590892791748047, "global_step": 280586, "epoch": 3380} {"train_loss": -25.408849716186523, "global_step": 280587, "epoch": 3380} {"train_loss": -25.8978271484375, "global_step": 280588, "epoch": 3380} {"train_loss": -25.537452697753906, "global_step": 280589, "epoch": 3380} {"train_loss": -25.358829498291016, "global_step": 280590, "epoch": 3380} {"train_loss": -24.880773544311523, "global_step": 280591, "epoch": 3380} {"train_loss": -25.130752563476562, "global_step": 280592, "epoch": 3380} {"train_loss": -25.29360580444336, "global_step": 280593, "epoch": 3380} {"train_loss": -25.45509147644043, "global_step": 280594, "epoch": 3380} {"train_loss": -25.3665771484375, "global_step": 280595, "epoch": 3380} {"train_loss": -25.42596435546875, "global_step": 280596, "epoch": 3380} {"train_loss": -25.315532684326172, "global_step": 280597, "epoch": 3380} {"train_loss": -25.36087989807129, "global_step": 280598, "epoch": 3380} {"train_loss": -25.36739158630371, "global_step": 280599, "epoch": 3380} {"train_loss": -25.46224021911621, "global_step": 280600, "epoch": 3380} {"train_loss": -25.351774215698242, "global_step": 280601, "epoch": 3380} {"train_loss": -25.695402145385742, "global_step": 280602, "epoch": 3380} {"train_loss": -25.604333877563477, "global_step": 280603, "epoch": 3380} {"train_loss": -25.362979888916016, "global_step": 280604, "epoch": 3380} {"train_loss": -25.547292709350586, "global_step": 280605, "epoch": 3380} {"train_loss": -25.11893653869629, "global_step": 280606, "epoch": 3380} {"train_loss": -25.535167694091797, "global_step": 280607, "epoch": 3380} {"train_loss": -25.730451583862305, "global_step": 280608, "epoch": 3380} {"train_loss": -25.26137351989746, "global_step": 280609, "epoch": 3380} {"train_loss": -25.438642501831055, "global_step": 280610, "epoch": 3380} {"train_loss": -25.237974166870117, "global_step": 280611, "epoch": 3380} {"train_loss": -25.144819259643555, "global_step": 280612, "epoch": 3380} {"train_loss": -25.289142608642578, "global_step": 280613, "epoch": 3380} {"train_loss": -25.751989364624023, "global_step": 280614, "epoch": 3380} {"train_loss": -25.163524627685547, "global_step": 280615, "epoch": 3380} {"train_loss": -25.24330711364746, "global_step": 280616, "epoch": 3380} {"train_loss": -25.610692977905273, "global_step": 280617, "epoch": 3380} {"train_loss": -25.300962448120117, "global_step": 280618, "epoch": 3380} {"train_loss": -25.400619506835938, "global_step": 280619, "epoch": 3380} {"train_loss": -25.368518829345703, "global_step": 280620, "epoch": 3380} {"train_loss": -25.6331787109375, "global_step": 280621, "epoch": 3380} {"train_loss": -25.34791466126959, "global_step": 280622, "epoch": 3380, "val_loss": 7112679.0} {"train_loss": -24.203866958618164, "global_step": 280623, "epoch": 3381} {"train_loss": -25.048446655273438, "global_step": 280624, "epoch": 3381} {"train_loss": -24.302358627319336, "global_step": 280625, "epoch": 3381} {"train_loss": -24.988828659057617, "global_step": 280626, "epoch": 3381} {"train_loss": -24.333789825439453, "global_step": 280627, "epoch": 3381} {"train_loss": -24.493087768554688, "global_step": 280628, "epoch": 3381} {"train_loss": -24.745620727539062, "global_step": 280629, "epoch": 3381} {"train_loss": -24.744604110717773, "global_step": 280630, "epoch": 3381} {"train_loss": -24.771198272705078, "global_step": 280631, "epoch": 3381} {"train_loss": -24.800342559814453, "global_step": 280632, "epoch": 3381} {"train_loss": -24.867111206054688, "global_step": 280633, "epoch": 3381} {"train_loss": -24.785930633544922, "global_step": 280634, "epoch": 3381} {"train_loss": -24.691247940063477, "global_step": 280635, "epoch": 3381} {"train_loss": -25.006183624267578, "global_step": 280636, "epoch": 3381} {"train_loss": -24.84299087524414, "global_step": 280637, "epoch": 3381} {"train_loss": -25.17823600769043, "global_step": 280638, "epoch": 3381} {"train_loss": -25.139455795288086, "global_step": 280639, "epoch": 3381} {"train_loss": -25.270584106445312, "global_step": 280640, "epoch": 3381} {"train_loss": -25.299739837646484, "global_step": 280641, "epoch": 3381} {"train_loss": -25.11671257019043, "global_step": 280642, "epoch": 3381} {"train_loss": -25.32635498046875, "global_step": 280643, "epoch": 3381} {"train_loss": -25.148950576782227, "global_step": 280644, "epoch": 3381} {"train_loss": -25.164331436157227, "global_step": 280645, "epoch": 3381} {"train_loss": -25.096027374267578, "global_step": 280646, "epoch": 3381} {"train_loss": -25.391921997070312, "global_step": 280647, "epoch": 3381} {"train_loss": -25.0191593170166, "global_step": 280648, "epoch": 3381} {"train_loss": -25.42380714416504, "global_step": 280649, "epoch": 3381} {"train_loss": -25.46024513244629, "global_step": 280650, "epoch": 3381} {"train_loss": -25.133371353149414, "global_step": 280651, "epoch": 3381} {"train_loss": -25.3199405670166, "global_step": 280652, "epoch": 3381} {"train_loss": -25.187482833862305, "global_step": 280653, "epoch": 3381} {"train_loss": -25.04450798034668, "global_step": 280654, "epoch": 3381} {"train_loss": -25.5262393951416, "global_step": 280655, "epoch": 3381} {"train_loss": -25.326749801635742, "global_step": 280656, "epoch": 3381} {"train_loss": -25.560823440551758, "global_step": 280657, "epoch": 3381} {"train_loss": -24.889944076538086, "global_step": 280658, "epoch": 3381} {"train_loss": -25.469823837280273, "global_step": 280659, "epoch": 3381} {"train_loss": -25.44338607788086, "global_step": 280660, "epoch": 3381} {"train_loss": -25.13155746459961, "global_step": 280661, "epoch": 3381} {"train_loss": -25.65540885925293, "global_step": 280662, "epoch": 3381} {"train_loss": -25.17171859741211, "global_step": 280663, "epoch": 3381} {"train_loss": -25.481948852539062, "global_step": 280664, "epoch": 3381} {"train_loss": -25.457828521728516, "global_step": 280665, "epoch": 3381} {"train_loss": -25.0093936920166, "global_step": 280666, "epoch": 3381} {"train_loss": -25.364103317260742, "global_step": 280667, "epoch": 3381} {"train_loss": -25.180953979492188, "global_step": 280668, "epoch": 3381} {"train_loss": -25.759017944335938, "global_step": 280669, "epoch": 3381} {"train_loss": -25.566974639892578, "global_step": 280670, "epoch": 3381} {"train_loss": -25.39907455444336, "global_step": 280671, "epoch": 3381} {"train_loss": -25.354394912719727, "global_step": 280672, "epoch": 3381} {"train_loss": -25.031997680664062, "global_step": 280673, "epoch": 3381} {"train_loss": -25.406036376953125, "global_step": 280674, "epoch": 3381} {"train_loss": -25.494657516479492, "global_step": 280675, "epoch": 3381} {"train_loss": -25.454465866088867, "global_step": 280676, "epoch": 3381} {"train_loss": -25.403915405273438, "global_step": 280677, "epoch": 3381} {"train_loss": -25.688425064086914, "global_step": 280678, "epoch": 3381} {"train_loss": -25.47981834411621, "global_step": 280679, "epoch": 3381} {"train_loss": -26.177722930908203, "global_step": 280680, "epoch": 3381} {"train_loss": -25.392913818359375, "global_step": 280681, "epoch": 3381} {"train_loss": -25.542959213256836, "global_step": 280682, "epoch": 3381} {"train_loss": -25.099905014038086, "global_step": 280683, "epoch": 3381} {"train_loss": -25.725189208984375, "global_step": 280684, "epoch": 3381} {"train_loss": -25.407148361206055, "global_step": 280685, "epoch": 3381} {"train_loss": -25.635395050048828, "global_step": 280686, "epoch": 3381} {"train_loss": -25.199251174926758, "global_step": 280687, "epoch": 3381} {"train_loss": -25.586572647094727, "global_step": 280688, "epoch": 3381} {"train_loss": -25.32193946838379, "global_step": 280689, "epoch": 3381} {"train_loss": -25.26099967956543, "global_step": 280690, "epoch": 3381} {"train_loss": -25.32389259338379, "global_step": 280691, "epoch": 3381} {"train_loss": -25.377058029174805, "global_step": 280692, "epoch": 3381} {"train_loss": -24.787918090820312, "global_step": 280693, "epoch": 3381} {"train_loss": -25.289682388305664, "global_step": 280694, "epoch": 3381} {"train_loss": -25.285533905029297, "global_step": 280695, "epoch": 3381} {"train_loss": -25.01637840270996, "global_step": 280696, "epoch": 3381} {"train_loss": -25.090774536132812, "global_step": 280697, "epoch": 3381} {"train_loss": -25.169267654418945, "global_step": 280698, "epoch": 3381} {"train_loss": -25.090147018432617, "global_step": 280699, "epoch": 3381} {"train_loss": -25.16382598876953, "global_step": 280700, "epoch": 3381} {"train_loss": -25.324462890625, "global_step": 280701, "epoch": 3381} {"train_loss": -25.24086570739746, "global_step": 280702, "epoch": 3381} {"train_loss": -24.839529037475586, "global_step": 280703, "epoch": 3381} {"train_loss": -25.191762924194336, "global_step": 280704, "epoch": 3381} {"train_loss": -25.189615203673583, "global_step": 280705, "epoch": 3381, "val_loss": 6997586.0} {"train_loss": -24.531034469604492, "global_step": 280706, "epoch": 3382} {"train_loss": -24.334033966064453, "global_step": 280707, "epoch": 3382} {"train_loss": -24.2185115814209, "global_step": 280708, "epoch": 3382} {"train_loss": -23.959203720092773, "global_step": 280709, "epoch": 3382} {"train_loss": -24.313369750976562, "global_step": 280710, "epoch": 3382} {"train_loss": -24.841432571411133, "global_step": 280711, "epoch": 3382} {"train_loss": -25.061847686767578, "global_step": 280712, "epoch": 3382} {"train_loss": -24.506853103637695, "global_step": 280713, "epoch": 3382} {"train_loss": -24.53584098815918, "global_step": 280714, "epoch": 3382} {"train_loss": -25.14826011657715, "global_step": 280715, "epoch": 3382} {"train_loss": -24.579776763916016, "global_step": 280716, "epoch": 3382} {"train_loss": -25.098800659179688, "global_step": 280717, "epoch": 3382} {"train_loss": -24.998044967651367, "global_step": 280718, "epoch": 3382} {"train_loss": -24.540117263793945, "global_step": 280719, "epoch": 3382} {"train_loss": -25.128225326538086, "global_step": 280720, "epoch": 3382} {"train_loss": -25.44078826904297, "global_step": 280721, "epoch": 3382} {"train_loss": -24.863815307617188, "global_step": 280722, "epoch": 3382} {"train_loss": -25.204797744750977, "global_step": 280723, "epoch": 3382} {"train_loss": -25.322572708129883, "global_step": 280724, "epoch": 3382} {"train_loss": -25.186344146728516, "global_step": 280725, "epoch": 3382} {"train_loss": -25.08571434020996, "global_step": 280726, "epoch": 3382} {"train_loss": -25.16097068786621, "global_step": 280727, "epoch": 3382} {"train_loss": -25.3652400970459, "global_step": 280728, "epoch": 3382} {"train_loss": -25.268033981323242, "global_step": 280729, "epoch": 3382} {"train_loss": -25.272598266601562, "global_step": 280730, "epoch": 3382} {"train_loss": -25.5096378326416, "global_step": 280731, "epoch": 3382} {"train_loss": -25.1723575592041, "global_step": 280732, "epoch": 3382} {"train_loss": -25.204662322998047, "global_step": 280733, "epoch": 3382} {"train_loss": -24.97882080078125, "global_step": 280734, "epoch": 3382} {"train_loss": -25.104278564453125, "global_step": 280735, "epoch": 3382} {"train_loss": -25.422870635986328, "global_step": 280736, "epoch": 3382} {"train_loss": -25.162900924682617, "global_step": 280737, "epoch": 3382} {"train_loss": -25.463415145874023, "global_step": 280738, "epoch": 3382} {"train_loss": -24.967321395874023, "global_step": 280739, "epoch": 3382} {"train_loss": -25.3659610748291, "global_step": 280740, "epoch": 3382} {"train_loss": -25.22206687927246, "global_step": 280741, "epoch": 3382} {"train_loss": -25.181884765625, "global_step": 280742, "epoch": 3382} {"train_loss": -25.3701114654541, "global_step": 280743, "epoch": 3382} {"train_loss": -25.516067504882812, "global_step": 280744, "epoch": 3382} {"train_loss": -25.485828399658203, "global_step": 280745, "epoch": 3382} {"train_loss": -25.347309112548828, "global_step": 280746, "epoch": 3382} {"train_loss": -25.78473472595215, "global_step": 280747, "epoch": 3382} {"train_loss": -25.293493270874023, "global_step": 280748, "epoch": 3382} {"train_loss": -25.628080368041992, "global_step": 280749, "epoch": 3382} {"train_loss": -25.382925033569336, "global_step": 280750, "epoch": 3382} {"train_loss": -25.859174728393555, "global_step": 280751, "epoch": 3382} {"train_loss": -25.467885971069336, "global_step": 280752, "epoch": 3382} {"train_loss": -25.922876358032227, "global_step": 280753, "epoch": 3382} {"train_loss": -25.570959091186523, "global_step": 280754, "epoch": 3382} {"train_loss": -25.525693893432617, "global_step": 280755, "epoch": 3382} {"train_loss": -25.426122665405273, "global_step": 280756, "epoch": 3382} {"train_loss": -25.449954986572266, "global_step": 280757, "epoch": 3382} {"train_loss": -25.49469566345215, "global_step": 280758, "epoch": 3382} {"train_loss": -25.735538482666016, "global_step": 280759, "epoch": 3382} {"train_loss": -25.591032028198242, "global_step": 280760, "epoch": 3382} {"train_loss": -25.6713809967041, "global_step": 280761, "epoch": 3382} {"train_loss": -25.84528160095215, "global_step": 280762, "epoch": 3382} {"train_loss": -25.38365364074707, "global_step": 280763, "epoch": 3382} {"train_loss": -25.129592895507812, "global_step": 280764, "epoch": 3382} {"train_loss": -25.654220581054688, "global_step": 280765, "epoch": 3382} {"train_loss": -25.6779727935791, "global_step": 280766, "epoch": 3382} {"train_loss": -25.502243041992188, "global_step": 280767, "epoch": 3382} {"train_loss": -25.4821834564209, "global_step": 280768, "epoch": 3382} {"train_loss": -25.194055557250977, "global_step": 280769, "epoch": 3382} {"train_loss": -25.85491943359375, "global_step": 280770, "epoch": 3382} {"train_loss": -25.13654327392578, "global_step": 280771, "epoch": 3382} {"train_loss": -25.40427017211914, "global_step": 280772, "epoch": 3382} {"train_loss": -25.28061866760254, "global_step": 280773, "epoch": 3382} {"train_loss": -25.65118980407715, "global_step": 280774, "epoch": 3382} {"train_loss": -25.392425537109375, "global_step": 280775, "epoch": 3382} {"train_loss": -25.240140914916992, "global_step": 280776, "epoch": 3382} {"train_loss": -25.674161911010742, "global_step": 280777, "epoch": 3382} {"train_loss": -25.269258499145508, "global_step": 280778, "epoch": 3382} {"train_loss": -25.273900985717773, "global_step": 280779, "epoch": 3382} {"train_loss": -25.19189453125, "global_step": 280780, "epoch": 3382} {"train_loss": -24.858884811401367, "global_step": 280781, "epoch": 3382} {"train_loss": -24.396039962768555, "global_step": 280782, "epoch": 3382} {"train_loss": -24.57295036315918, "global_step": 280783, "epoch": 3382} {"train_loss": -24.62696075439453, "global_step": 280784, "epoch": 3382} {"train_loss": -25.459354400634766, "global_step": 280785, "epoch": 3382} {"train_loss": -24.59003257751465, "global_step": 280786, "epoch": 3382} {"train_loss": -25.129735946655273, "global_step": 280787, "epoch": 3382} {"train_loss": -25.201584827469055, "global_step": 280788, "epoch": 3382, "val_loss": 7052472.0} {"train_loss": -22.300886154174805, "global_step": 280789, "epoch": 3383} {"train_loss": -23.803495407104492, "global_step": 280790, "epoch": 3383} {"train_loss": -24.657367706298828, "global_step": 280791, "epoch": 3383} {"train_loss": -23.233856201171875, "global_step": 280792, "epoch": 3383} {"train_loss": -24.41455841064453, "global_step": 280793, "epoch": 3383} {"train_loss": -23.979856491088867, "global_step": 280794, "epoch": 3383} {"train_loss": -24.519046783447266, "global_step": 280795, "epoch": 3383} {"train_loss": -24.0175724029541, "global_step": 280796, "epoch": 3383} {"train_loss": -24.424123764038086, "global_step": 280797, "epoch": 3383} {"train_loss": -24.565305709838867, "global_step": 280798, "epoch": 3383} {"train_loss": -24.505708694458008, "global_step": 280799, "epoch": 3383} {"train_loss": -24.68720054626465, "global_step": 280800, "epoch": 3383} {"train_loss": -24.853178024291992, "global_step": 280801, "epoch": 3383} {"train_loss": -24.894336700439453, "global_step": 280802, "epoch": 3383} {"train_loss": -24.681989669799805, "global_step": 280803, "epoch": 3383} {"train_loss": -24.698917388916016, "global_step": 280804, "epoch": 3383} {"train_loss": -24.828998565673828, "global_step": 280805, "epoch": 3383} {"train_loss": -24.95783805847168, "global_step": 280806, "epoch": 3383} {"train_loss": -24.718381881713867, "global_step": 280807, "epoch": 3383} {"train_loss": -24.68854522705078, "global_step": 280808, "epoch": 3383} {"train_loss": -24.744441986083984, "global_step": 280809, "epoch": 3383} {"train_loss": -24.741565704345703, "global_step": 280810, "epoch": 3383} {"train_loss": -25.09149169921875, "global_step": 280811, "epoch": 3383} {"train_loss": -24.8280086517334, "global_step": 280812, "epoch": 3383} {"train_loss": -24.759855270385742, "global_step": 280813, "epoch": 3383} {"train_loss": -24.727657318115234, "global_step": 280814, "epoch": 3383} {"train_loss": -24.89577293395996, "global_step": 280815, "epoch": 3383} {"train_loss": -24.923919677734375, "global_step": 280816, "epoch": 3383} {"train_loss": -25.35927963256836, "global_step": 280817, "epoch": 3383} {"train_loss": -24.942737579345703, "global_step": 280818, "epoch": 3383} {"train_loss": -24.919729232788086, "global_step": 280819, "epoch": 3383} {"train_loss": -25.083662033081055, "global_step": 280820, "epoch": 3383} {"train_loss": -24.761655807495117, "global_step": 280821, "epoch": 3383} {"train_loss": -25.353609085083008, "global_step": 280822, "epoch": 3383} {"train_loss": -25.206655502319336, "global_step": 280823, "epoch": 3383} {"train_loss": -25.5245361328125, "global_step": 280824, "epoch": 3383} {"train_loss": -25.28814125061035, "global_step": 280825, "epoch": 3383} {"train_loss": -24.988067626953125, "global_step": 280826, "epoch": 3383} {"train_loss": -25.740766525268555, "global_step": 280827, "epoch": 3383} {"train_loss": -25.09218406677246, "global_step": 280828, "epoch": 3383} {"train_loss": -25.02509880065918, "global_step": 280829, "epoch": 3383} {"train_loss": -25.162059783935547, "global_step": 280830, "epoch": 3383} {"train_loss": -25.638675689697266, "global_step": 280831, "epoch": 3383} {"train_loss": -25.3394775390625, "global_step": 280832, "epoch": 3383} {"train_loss": -25.505605697631836, "global_step": 280833, "epoch": 3383} {"train_loss": -25.641468048095703, "global_step": 280834, "epoch": 3383} {"train_loss": -25.488256454467773, "global_step": 280835, "epoch": 3383} {"train_loss": -25.675113677978516, "global_step": 280836, "epoch": 3383} {"train_loss": -25.235952377319336, "global_step": 280837, "epoch": 3383} {"train_loss": -25.47083854675293, "global_step": 280838, "epoch": 3383} {"train_loss": -25.64803123474121, "global_step": 280839, "epoch": 3383} {"train_loss": -25.23631477355957, "global_step": 280840, "epoch": 3383} {"train_loss": -25.074331283569336, "global_step": 280841, "epoch": 3383} {"train_loss": -25.582149505615234, "global_step": 280842, "epoch": 3383} {"train_loss": -25.48664665222168, "global_step": 280843, "epoch": 3383} {"train_loss": -25.396841049194336, "global_step": 280844, "epoch": 3383} {"train_loss": -25.198671340942383, "global_step": 280845, "epoch": 3383} {"train_loss": -25.669036865234375, "global_step": 280846, "epoch": 3383} {"train_loss": -25.2557373046875, "global_step": 280847, "epoch": 3383} {"train_loss": -25.960147857666016, "global_step": 280848, "epoch": 3383} {"train_loss": -25.354236602783203, "global_step": 280849, "epoch": 3383} {"train_loss": -25.55550193786621, "global_step": 280850, "epoch": 3383} {"train_loss": -24.8924617767334, "global_step": 280851, "epoch": 3383} {"train_loss": -24.430519104003906, "global_step": 280852, "epoch": 3383} {"train_loss": -25.06075096130371, "global_step": 280853, "epoch": 3383} {"train_loss": -25.7651309967041, "global_step": 280854, "epoch": 3383} {"train_loss": -25.21678352355957, "global_step": 280855, "epoch": 3383} {"train_loss": -25.132871627807617, "global_step": 280856, "epoch": 3383} {"train_loss": -25.400924682617188, "global_step": 280857, "epoch": 3383} {"train_loss": -25.34464454650879, "global_step": 280858, "epoch": 3383} {"train_loss": -25.77028465270996, "global_step": 280859, "epoch": 3383} {"train_loss": -25.019149780273438, "global_step": 280860, "epoch": 3383} {"train_loss": -25.482677459716797, "global_step": 280861, "epoch": 3383} {"train_loss": -24.99302101135254, "global_step": 280862, "epoch": 3383} {"train_loss": -25.49921226501465, "global_step": 280863, "epoch": 3383} {"train_loss": -25.556711196899414, "global_step": 280864, "epoch": 3383} {"train_loss": -25.36155128479004, "global_step": 280865, "epoch": 3383} {"train_loss": -25.596839904785156, "global_step": 280866, "epoch": 3383} {"train_loss": -25.29551124572754, "global_step": 280867, "epoch": 3383} {"train_loss": -25.16103172302246, "global_step": 280868, "epoch": 3383} {"train_loss": -25.488697052001953, "global_step": 280869, "epoch": 3383} {"train_loss": -25.310470581054688, "global_step": 280870, "epoch": 3383} {"train_loss": -25.04675081551793, "global_step": 280871, "epoch": 3383, "val_loss": 6933613.0} {"train_loss": -25.352563858032227, "global_step": 280872, "epoch": 3384} {"train_loss": -25.255233764648438, "global_step": 280873, "epoch": 3384} {"train_loss": -25.481382369995117, "global_step": 280874, "epoch": 3384} {"train_loss": -25.58918571472168, "global_step": 280875, "epoch": 3384} {"train_loss": -25.136093139648438, "global_step": 280876, "epoch": 3384} {"train_loss": -25.232471466064453, "global_step": 280877, "epoch": 3384} {"train_loss": -25.417200088500977, "global_step": 280878, "epoch": 3384} {"train_loss": -25.21479606628418, "global_step": 280879, "epoch": 3384} {"train_loss": -25.682025909423828, "global_step": 280880, "epoch": 3384} {"train_loss": -25.089231491088867, "global_step": 280881, "epoch": 3384} {"train_loss": -25.118927001953125, "global_step": 280882, "epoch": 3384} {"train_loss": -25.187652587890625, "global_step": 280883, "epoch": 3384} {"train_loss": -25.290504455566406, "global_step": 280884, "epoch": 3384} {"train_loss": -25.1331844329834, "global_step": 280885, "epoch": 3384} {"train_loss": -25.265241622924805, "global_step": 280886, "epoch": 3384} {"train_loss": -25.381214141845703, "global_step": 280887, "epoch": 3384} {"train_loss": -25.062097549438477, "global_step": 280888, "epoch": 3384} {"train_loss": -25.340595245361328, "global_step": 280889, "epoch": 3384} {"train_loss": -25.512882232666016, "global_step": 280890, "epoch": 3384} {"train_loss": -25.33809471130371, "global_step": 280891, "epoch": 3384} {"train_loss": -25.285585403442383, "global_step": 280892, "epoch": 3384} {"train_loss": -25.50095558166504, "global_step": 280893, "epoch": 3384} {"train_loss": -25.334775924682617, "global_step": 280894, "epoch": 3384} {"train_loss": -25.396055221557617, "global_step": 280895, "epoch": 3384} {"train_loss": -25.268943786621094, "global_step": 280896, "epoch": 3384} {"train_loss": -25.591487884521484, "global_step": 280897, "epoch": 3384} {"train_loss": -25.590530395507812, "global_step": 280898, "epoch": 3384} {"train_loss": -25.219528198242188, "global_step": 280899, "epoch": 3384} {"train_loss": -25.279949188232422, "global_step": 280900, "epoch": 3384} {"train_loss": -25.482641220092773, "global_step": 280901, "epoch": 3384} {"train_loss": -25.165328979492188, "global_step": 280902, "epoch": 3384} {"train_loss": -25.75178337097168, "global_step": 280903, "epoch": 3384} {"train_loss": -25.3092041015625, "global_step": 280904, "epoch": 3384} {"train_loss": -25.351282119750977, "global_step": 280905, "epoch": 3384} {"train_loss": -25.58452033996582, "global_step": 280906, "epoch": 3384} {"train_loss": -25.679004669189453, "global_step": 280907, "epoch": 3384} {"train_loss": -25.292280197143555, "global_step": 280908, "epoch": 3384} {"train_loss": -25.803237915039062, "global_step": 280909, "epoch": 3384} {"train_loss": -25.527751922607422, "global_step": 280910, "epoch": 3384} {"train_loss": -25.841577529907227, "global_step": 280911, "epoch": 3384} {"train_loss": -25.20088005065918, "global_step": 280912, "epoch": 3384} {"train_loss": -25.498830795288086, "global_step": 280913, "epoch": 3384} {"train_loss": -25.521095275878906, "global_step": 280914, "epoch": 3384} {"train_loss": -25.636327743530273, "global_step": 280915, "epoch": 3384} {"train_loss": -25.453933715820312, "global_step": 280916, "epoch": 3384} {"train_loss": -26.027576446533203, "global_step": 280917, "epoch": 3384} {"train_loss": -25.536680221557617, "global_step": 280918, "epoch": 3384} {"train_loss": -25.63433837890625, "global_step": 280919, "epoch": 3384} {"train_loss": -25.15521240234375, "global_step": 280920, "epoch": 3384} {"train_loss": -25.194765090942383, "global_step": 280921, "epoch": 3384} {"train_loss": -25.249467849731445, "global_step": 280922, "epoch": 3384} {"train_loss": -25.55421257019043, "global_step": 280923, "epoch": 3384} {"train_loss": -25.400907516479492, "global_step": 280924, "epoch": 3384} {"train_loss": -25.23825454711914, "global_step": 280925, "epoch": 3384} {"train_loss": -24.470335006713867, "global_step": 280926, "epoch": 3384} {"train_loss": -25.315366744995117, "global_step": 280927, "epoch": 3384} {"train_loss": -25.023250579833984, "global_step": 280928, "epoch": 3384} {"train_loss": -25.10005760192871, "global_step": 280929, "epoch": 3384} {"train_loss": -25.337316513061523, "global_step": 280930, "epoch": 3384} {"train_loss": -25.398183822631836, "global_step": 280931, "epoch": 3384} {"train_loss": -25.242700576782227, "global_step": 280932, "epoch": 3384} {"train_loss": -25.61642837524414, "global_step": 280933, "epoch": 3384} {"train_loss": -25.41219139099121, "global_step": 280934, "epoch": 3384} {"train_loss": -25.608991622924805, "global_step": 280935, "epoch": 3384} {"train_loss": -25.150190353393555, "global_step": 280936, "epoch": 3384} {"train_loss": -25.35867691040039, "global_step": 280937, "epoch": 3384} {"train_loss": -25.688138961791992, "global_step": 280938, "epoch": 3384} {"train_loss": -25.279277801513672, "global_step": 280939, "epoch": 3384} {"train_loss": -25.253782272338867, "global_step": 280940, "epoch": 3384} {"train_loss": -25.121902465820312, "global_step": 280941, "epoch": 3384} {"train_loss": -25.527807235717773, "global_step": 280942, "epoch": 3384} {"train_loss": -25.100976943969727, "global_step": 280943, "epoch": 3384} {"train_loss": -25.280447006225586, "global_step": 280944, "epoch": 3384} {"train_loss": -25.422836303710938, "global_step": 280945, "epoch": 3384} {"train_loss": -25.153181076049805, "global_step": 280946, "epoch": 3384} {"train_loss": -25.71323585510254, "global_step": 280947, "epoch": 3384} {"train_loss": -25.51481819152832, "global_step": 280948, "epoch": 3384} {"train_loss": -25.756744384765625, "global_step": 280949, "epoch": 3384} {"train_loss": -25.248287200927734, "global_step": 280950, "epoch": 3384} {"train_loss": -25.217269897460938, "global_step": 280951, "epoch": 3384} {"train_loss": -25.558778762817383, "global_step": 280952, "epoch": 3384} {"train_loss": -25.48357582092285, "global_step": 280953, "epoch": 3384} {"train_loss": -25.37659677252712, "global_step": 280954, "epoch": 3384, "val_loss": 7045963.5} {"train_loss": -25.134319305419922, "global_step": 280955, "epoch": 3385} {"train_loss": -23.350387573242188, "global_step": 280956, "epoch": 3385} {"train_loss": -22.72015380859375, "global_step": 280957, "epoch": 3385} {"train_loss": -24.506500244140625, "global_step": 280958, "epoch": 3385} {"train_loss": -24.625537872314453, "global_step": 280959, "epoch": 3385} {"train_loss": -24.689346313476562, "global_step": 280960, "epoch": 3385} {"train_loss": -24.816553115844727, "global_step": 280961, "epoch": 3385} {"train_loss": -23.776172637939453, "global_step": 280962, "epoch": 3385} {"train_loss": -24.55961799621582, "global_step": 280963, "epoch": 3385} {"train_loss": -24.705724716186523, "global_step": 280964, "epoch": 3385} {"train_loss": -24.00676918029785, "global_step": 280965, "epoch": 3385} {"train_loss": -25.059043884277344, "global_step": 280966, "epoch": 3385} {"train_loss": -24.458972930908203, "global_step": 280967, "epoch": 3385} {"train_loss": -24.54745864868164, "global_step": 280968, "epoch": 3385} {"train_loss": -24.586082458496094, "global_step": 280969, "epoch": 3385} {"train_loss": -24.850730895996094, "global_step": 280970, "epoch": 3385} {"train_loss": -24.860239028930664, "global_step": 280971, "epoch": 3385} {"train_loss": -24.723661422729492, "global_step": 280972, "epoch": 3385} {"train_loss": -24.881505966186523, "global_step": 280973, "epoch": 3385} {"train_loss": -24.967754364013672, "global_step": 280974, "epoch": 3385} {"train_loss": -24.981313705444336, "global_step": 280975, "epoch": 3385} {"train_loss": -25.22006607055664, "global_step": 280976, "epoch": 3385} {"train_loss": -25.06789779663086, "global_step": 280977, "epoch": 3385} {"train_loss": -25.198104858398438, "global_step": 280978, "epoch": 3385} {"train_loss": -25.006502151489258, "global_step": 280979, "epoch": 3385} {"train_loss": -25.352432250976562, "global_step": 280980, "epoch": 3385} {"train_loss": -25.167837142944336, "global_step": 280981, "epoch": 3385} {"train_loss": -24.85724449157715, "global_step": 280982, "epoch": 3385} {"train_loss": -25.005691528320312, "global_step": 280983, "epoch": 3385} {"train_loss": -25.060693740844727, "global_step": 280984, "epoch": 3385} {"train_loss": -25.189945220947266, "global_step": 280985, "epoch": 3385} {"train_loss": -25.206708908081055, "global_step": 280986, "epoch": 3385} {"train_loss": -25.223363876342773, "global_step": 280987, "epoch": 3385} {"train_loss": -25.13839340209961, "global_step": 280988, "epoch": 3385} {"train_loss": -25.151113510131836, "global_step": 280989, "epoch": 3385} {"train_loss": -25.54191017150879, "global_step": 280990, "epoch": 3385} {"train_loss": -25.607702255249023, "global_step": 280991, "epoch": 3385} {"train_loss": -25.470792770385742, "global_step": 280992, "epoch": 3385} {"train_loss": -25.395938873291016, "global_step": 280993, "epoch": 3385} {"train_loss": -25.365259170532227, "global_step": 280994, "epoch": 3385} {"train_loss": -25.301870346069336, "global_step": 280995, "epoch": 3385} {"train_loss": -25.43607521057129, "global_step": 280996, "epoch": 3385} {"train_loss": -25.65516471862793, "global_step": 280997, "epoch": 3385} {"train_loss": -25.189926147460938, "global_step": 280998, "epoch": 3385} {"train_loss": -25.415943145751953, "global_step": 280999, "epoch": 3385} {"train_loss": -25.351938247680664, "global_step": 281000, "epoch": 3385} {"train_loss": -25.680103302001953, "global_step": 281001, "epoch": 3385} {"train_loss": -25.57093620300293, "global_step": 281002, "epoch": 3385} {"train_loss": -25.097354888916016, "global_step": 281003, "epoch": 3385} {"train_loss": -25.683979034423828, "global_step": 281004, "epoch": 3385} {"train_loss": -25.68253517150879, "global_step": 281005, "epoch": 3385} {"train_loss": -26.055866241455078, "global_step": 281006, "epoch": 3385} {"train_loss": -25.556882858276367, "global_step": 281007, "epoch": 3385} {"train_loss": -25.452655792236328, "global_step": 281008, "epoch": 3385} {"train_loss": -25.69952964782715, "global_step": 281009, "epoch": 3385} {"train_loss": -25.578826904296875, "global_step": 281010, "epoch": 3385} {"train_loss": -25.664566040039062, "global_step": 281011, "epoch": 3385} {"train_loss": -25.52474594116211, "global_step": 281012, "epoch": 3385} {"train_loss": -25.42021942138672, "global_step": 281013, "epoch": 3385} {"train_loss": -25.384830474853516, "global_step": 281014, "epoch": 3385} {"train_loss": -26.060094833374023, "global_step": 281015, "epoch": 3385} {"train_loss": -25.377042770385742, "global_step": 281016, "epoch": 3385} {"train_loss": -25.487707138061523, "global_step": 281017, "epoch": 3385} {"train_loss": -25.333982467651367, "global_step": 281018, "epoch": 3385} {"train_loss": -25.046873092651367, "global_step": 281019, "epoch": 3385} {"train_loss": -25.66741371154785, "global_step": 281020, "epoch": 3385} {"train_loss": -25.43439483642578, "global_step": 281021, "epoch": 3385} {"train_loss": -25.083280563354492, "global_step": 281022, "epoch": 3385} {"train_loss": -25.245880126953125, "global_step": 281023, "epoch": 3385} {"train_loss": -24.836742401123047, "global_step": 281024, "epoch": 3385} {"train_loss": -25.474702835083008, "global_step": 281025, "epoch": 3385} {"train_loss": -25.138967514038086, "global_step": 281026, "epoch": 3385} {"train_loss": -25.715930938720703, "global_step": 281027, "epoch": 3385} {"train_loss": -25.488344192504883, "global_step": 281028, "epoch": 3385} {"train_loss": -25.244892120361328, "global_step": 281029, "epoch": 3385} {"train_loss": -25.610706329345703, "global_step": 281030, "epoch": 3385} {"train_loss": -25.376272201538086, "global_step": 281031, "epoch": 3385} {"train_loss": -25.345746994018555, "global_step": 281032, "epoch": 3385} {"train_loss": -25.576934814453125, "global_step": 281033, "epoch": 3385} {"train_loss": -25.533334732055664, "global_step": 281034, "epoch": 3385} {"train_loss": -25.288061141967773, "global_step": 281035, "epoch": 3385} {"train_loss": -25.723316192626953, "global_step": 281036, "epoch": 3385} {"train_loss": -25.164627098175416, "global_step": 281037, "epoch": 3385, "val_loss": 6969333.0} {"train_loss": -23.429044723510742, "global_step": 281038, "epoch": 3386} {"train_loss": -23.398540496826172, "global_step": 281039, "epoch": 3386} {"train_loss": -24.05056381225586, "global_step": 281040, "epoch": 3386} {"train_loss": -24.98111343383789, "global_step": 281041, "epoch": 3386} {"train_loss": -23.656997680664062, "global_step": 281042, "epoch": 3386} {"train_loss": -24.81644630432129, "global_step": 281043, "epoch": 3386} {"train_loss": -24.41657829284668, "global_step": 281044, "epoch": 3386} {"train_loss": -24.627683639526367, "global_step": 281045, "epoch": 3386} {"train_loss": -24.721921920776367, "global_step": 281046, "epoch": 3386} {"train_loss": -24.446439743041992, "global_step": 281047, "epoch": 3386} {"train_loss": -25.326879501342773, "global_step": 281048, "epoch": 3386} {"train_loss": -25.058792114257812, "global_step": 281049, "epoch": 3386} {"train_loss": -24.689876556396484, "global_step": 281050, "epoch": 3386} {"train_loss": -24.752779006958008, "global_step": 281051, "epoch": 3386} {"train_loss": -25.250280380249023, "global_step": 281052, "epoch": 3386} {"train_loss": -24.813337326049805, "global_step": 281053, "epoch": 3386} {"train_loss": -24.79715919494629, "global_step": 281054, "epoch": 3386} {"train_loss": -25.041879653930664, "global_step": 281055, "epoch": 3386} {"train_loss": -24.98663330078125, "global_step": 281056, "epoch": 3386} {"train_loss": -24.83747673034668, "global_step": 281057, "epoch": 3386} {"train_loss": -25.035125732421875, "global_step": 281058, "epoch": 3386} {"train_loss": -24.92603874206543, "global_step": 281059, "epoch": 3386} {"train_loss": -25.048019409179688, "global_step": 281060, "epoch": 3386} {"train_loss": -25.023147583007812, "global_step": 281061, "epoch": 3386} {"train_loss": -24.96065330505371, "global_step": 281062, "epoch": 3386} {"train_loss": -24.95407485961914, "global_step": 281063, "epoch": 3386} {"train_loss": -25.06346321105957, "global_step": 281064, "epoch": 3386} {"train_loss": -24.847091674804688, "global_step": 281065, "epoch": 3386} {"train_loss": -25.557449340820312, "global_step": 281066, "epoch": 3386} {"train_loss": -25.095670700073242, "global_step": 281067, "epoch": 3386} {"train_loss": -25.231000900268555, "global_step": 281068, "epoch": 3386} {"train_loss": -25.426158905029297, "global_step": 281069, "epoch": 3386} {"train_loss": -25.316282272338867, "global_step": 281070, "epoch": 3386} {"train_loss": -25.49045181274414, "global_step": 281071, "epoch": 3386} {"train_loss": -25.62420082092285, "global_step": 281072, "epoch": 3386} {"train_loss": -25.34183692932129, "global_step": 281073, "epoch": 3386} {"train_loss": -25.452096939086914, "global_step": 281074, "epoch": 3386} {"train_loss": -25.813817977905273, "global_step": 281075, "epoch": 3386} {"train_loss": -25.88189125061035, "global_step": 281076, "epoch": 3386} {"train_loss": -25.549219131469727, "global_step": 281077, "epoch": 3386} {"train_loss": -25.500463485717773, "global_step": 281078, "epoch": 3386} {"train_loss": -25.629148483276367, "global_step": 281079, "epoch": 3386} {"train_loss": -25.803348541259766, "global_step": 281080, "epoch": 3386} {"train_loss": -25.333139419555664, "global_step": 281081, "epoch": 3386} {"train_loss": -25.355382919311523, "global_step": 281082, "epoch": 3386} {"train_loss": -25.669696807861328, "global_step": 281083, "epoch": 3386} {"train_loss": -25.252527236938477, "global_step": 281084, "epoch": 3386} {"train_loss": -25.592390060424805, "global_step": 281085, "epoch": 3386} {"train_loss": -25.501331329345703, "global_step": 281086, "epoch": 3386} {"train_loss": -25.20034408569336, "global_step": 281087, "epoch": 3386} {"train_loss": -25.0318603515625, "global_step": 281088, "epoch": 3386} {"train_loss": -25.400102615356445, "global_step": 281089, "epoch": 3386} {"train_loss": -25.241910934448242, "global_step": 281090, "epoch": 3386} {"train_loss": -25.38816261291504, "global_step": 281091, "epoch": 3386} {"train_loss": -25.525930404663086, "global_step": 281092, "epoch": 3386} {"train_loss": -25.15701675415039, "global_step": 281093, "epoch": 3386} {"train_loss": -25.801212310791016, "global_step": 281094, "epoch": 3386} {"train_loss": -25.489723205566406, "global_step": 281095, "epoch": 3386} {"train_loss": -25.541685104370117, "global_step": 281096, "epoch": 3386} {"train_loss": -25.719470977783203, "global_step": 281097, "epoch": 3386} {"train_loss": -25.378660202026367, "global_step": 281098, "epoch": 3386} {"train_loss": -25.821533203125, "global_step": 281099, "epoch": 3386} {"train_loss": -25.63164710998535, "global_step": 281100, "epoch": 3386} {"train_loss": -25.636642456054688, "global_step": 281101, "epoch": 3386} {"train_loss": -25.504962921142578, "global_step": 281102, "epoch": 3386} {"train_loss": -25.168832778930664, "global_step": 281103, "epoch": 3386} {"train_loss": -25.016077041625977, "global_step": 281104, "epoch": 3386} {"train_loss": -25.125776290893555, "global_step": 281105, "epoch": 3386} {"train_loss": -25.051788330078125, "global_step": 281106, "epoch": 3386} {"train_loss": -24.57640838623047, "global_step": 281107, "epoch": 3386} {"train_loss": -24.997129440307617, "global_step": 281108, "epoch": 3386} {"train_loss": -25.38132095336914, "global_step": 281109, "epoch": 3386} {"train_loss": -25.088119506835938, "global_step": 281110, "epoch": 3386} {"train_loss": -25.24318504333496, "global_step": 281111, "epoch": 3386} {"train_loss": -25.324438095092773, "global_step": 281112, "epoch": 3386} {"train_loss": -25.444196701049805, "global_step": 281113, "epoch": 3386} {"train_loss": -25.375455856323242, "global_step": 281114, "epoch": 3386} {"train_loss": -25.10109519958496, "global_step": 281115, "epoch": 3386} {"train_loss": -25.056732177734375, "global_step": 281116, "epoch": 3386} {"train_loss": -25.66745376586914, "global_step": 281117, "epoch": 3386} {"train_loss": -25.47287940979004, "global_step": 281118, "epoch": 3386} {"train_loss": -25.065433502197266, "global_step": 281119, "epoch": 3386} {"train_loss": -25.17680407144937, "global_step": 281120, "epoch": 3386, "val_loss": 7072989.0} {"train_loss": -25.113887786865234, "global_step": 281121, "epoch": 3387} {"train_loss": -25.0206356048584, "global_step": 281122, "epoch": 3387} {"train_loss": -24.738149642944336, "global_step": 281123, "epoch": 3387} {"train_loss": -24.754173278808594, "global_step": 281124, "epoch": 3387} {"train_loss": -24.867538452148438, "global_step": 281125, "epoch": 3387} {"train_loss": -24.99949073791504, "global_step": 281126, "epoch": 3387} {"train_loss": -25.262399673461914, "global_step": 281127, "epoch": 3387} {"train_loss": -24.82103729248047, "global_step": 281128, "epoch": 3387} {"train_loss": -24.83320426940918, "global_step": 281129, "epoch": 3387} {"train_loss": -25.42569923400879, "global_step": 281130, "epoch": 3387} {"train_loss": -24.76243019104004, "global_step": 281131, "epoch": 3387} {"train_loss": -25.237348556518555, "global_step": 281132, "epoch": 3387} {"train_loss": -25.294322967529297, "global_step": 281133, "epoch": 3387} {"train_loss": -25.232114791870117, "global_step": 281134, "epoch": 3387} {"train_loss": -25.471206665039062, "global_step": 281135, "epoch": 3387} {"train_loss": -25.410411834716797, "global_step": 281136, "epoch": 3387} {"train_loss": -25.629119873046875, "global_step": 281137, "epoch": 3387} {"train_loss": -25.177213668823242, "global_step": 281138, "epoch": 3387} {"train_loss": -25.36391258239746, "global_step": 281139, "epoch": 3387} {"train_loss": -25.529882431030273, "global_step": 281140, "epoch": 3387} {"train_loss": -25.332433700561523, "global_step": 281141, "epoch": 3387} {"train_loss": -25.111223220825195, "global_step": 281142, "epoch": 3387} {"train_loss": -25.356464385986328, "global_step": 281143, "epoch": 3387} {"train_loss": -25.14583396911621, "global_step": 281144, "epoch": 3387} {"train_loss": -25.074893951416016, "global_step": 281145, "epoch": 3387} {"train_loss": -25.36448860168457, "global_step": 281146, "epoch": 3387} {"train_loss": -25.464353561401367, "global_step": 281147, "epoch": 3387} {"train_loss": -25.75250244140625, "global_step": 281148, "epoch": 3387} {"train_loss": -25.55718231201172, "global_step": 281149, "epoch": 3387} {"train_loss": -25.441213607788086, "global_step": 281150, "epoch": 3387} {"train_loss": -25.388702392578125, "global_step": 281151, "epoch": 3387} {"train_loss": -25.597911834716797, "global_step": 281152, "epoch": 3387} {"train_loss": -25.254837036132812, "global_step": 281153, "epoch": 3387} {"train_loss": -25.39424705505371, "global_step": 281154, "epoch": 3387} {"train_loss": -25.430082321166992, "global_step": 281155, "epoch": 3387} {"train_loss": -25.060428619384766, "global_step": 281156, "epoch": 3387} {"train_loss": -25.528553009033203, "global_step": 281157, "epoch": 3387} {"train_loss": -25.42955207824707, "global_step": 281158, "epoch": 3387} {"train_loss": -25.4008731842041, "global_step": 281159, "epoch": 3387} {"train_loss": -25.894031524658203, "global_step": 281160, "epoch": 3387} {"train_loss": -25.3376407623291, "global_step": 281161, "epoch": 3387} {"train_loss": -25.364896774291992, "global_step": 281162, "epoch": 3387} {"train_loss": -25.698652267456055, "global_step": 281163, "epoch": 3387} {"train_loss": -25.240827560424805, "global_step": 281164, "epoch": 3387} {"train_loss": -25.472200393676758, "global_step": 281165, "epoch": 3387} {"train_loss": -25.06784439086914, "global_step": 281166, "epoch": 3387} {"train_loss": -25.523481369018555, "global_step": 281167, "epoch": 3387} {"train_loss": -25.437265396118164, "global_step": 281168, "epoch": 3387} {"train_loss": -25.136747360229492, "global_step": 281169, "epoch": 3387} {"train_loss": -25.234098434448242, "global_step": 281170, "epoch": 3387} {"train_loss": -25.21770668029785, "global_step": 281171, "epoch": 3387} {"train_loss": -25.212331771850586, "global_step": 281172, "epoch": 3387} {"train_loss": -24.925331115722656, "global_step": 281173, "epoch": 3387} {"train_loss": -25.470361709594727, "global_step": 281174, "epoch": 3387} {"train_loss": -24.98296356201172, "global_step": 281175, "epoch": 3387} {"train_loss": -24.893430709838867, "global_step": 281176, "epoch": 3387} {"train_loss": -25.26910972595215, "global_step": 281177, "epoch": 3387} {"train_loss": -25.242231369018555, "global_step": 281178, "epoch": 3387} {"train_loss": -25.347219467163086, "global_step": 281179, "epoch": 3387} {"train_loss": -25.69257164001465, "global_step": 281180, "epoch": 3387} {"train_loss": -25.43329429626465, "global_step": 281181, "epoch": 3387} {"train_loss": -25.639057159423828, "global_step": 281182, "epoch": 3387} {"train_loss": -25.44641876220703, "global_step": 281183, "epoch": 3387} {"train_loss": -25.428598403930664, "global_step": 281184, "epoch": 3387} {"train_loss": -25.090978622436523, "global_step": 281185, "epoch": 3387} {"train_loss": -25.925012588500977, "global_step": 281186, "epoch": 3387} {"train_loss": -25.61865234375, "global_step": 281187, "epoch": 3387} {"train_loss": -25.736875534057617, "global_step": 281188, "epoch": 3387} {"train_loss": -25.01788902282715, "global_step": 281189, "epoch": 3387} {"train_loss": -25.662256240844727, "global_step": 281190, "epoch": 3387} {"train_loss": -25.716205596923828, "global_step": 281191, "epoch": 3387} {"train_loss": -25.43448829650879, "global_step": 281192, "epoch": 3387} {"train_loss": -25.4451847076416, "global_step": 281193, "epoch": 3387} {"train_loss": -25.62714195251465, "global_step": 281194, "epoch": 3387} {"train_loss": -25.46087646484375, "global_step": 281195, "epoch": 3387} {"train_loss": -25.7205810546875, "global_step": 281196, "epoch": 3387} {"train_loss": -25.605451583862305, "global_step": 281197, "epoch": 3387} {"train_loss": -25.506473541259766, "global_step": 281198, "epoch": 3387} {"train_loss": -25.46501350402832, "global_step": 281199, "epoch": 3387} {"train_loss": -25.79656982421875, "global_step": 281200, "epoch": 3387} {"train_loss": -25.68598747253418, "global_step": 281201, "epoch": 3387} {"train_loss": -25.39463233947754, "global_step": 281202, "epoch": 3387} {"train_loss": -25.343716724809394, "global_step": 281203, "epoch": 3387, "val_loss": 6969203.0} {"train_loss": -25.023469924926758, "global_step": 281204, "epoch": 3388} {"train_loss": -24.898212432861328, "global_step": 281205, "epoch": 3388} {"train_loss": -25.636356353759766, "global_step": 281206, "epoch": 3388} {"train_loss": -24.97352409362793, "global_step": 281207, "epoch": 3388} {"train_loss": -24.87445640563965, "global_step": 281208, "epoch": 3388} {"train_loss": -25.137405395507812, "global_step": 281209, "epoch": 3388} {"train_loss": -25.17644691467285, "global_step": 281210, "epoch": 3388} {"train_loss": -25.254013061523438, "global_step": 281211, "epoch": 3388} {"train_loss": -25.07330894470215, "global_step": 281212, "epoch": 3388} {"train_loss": -25.39497184753418, "global_step": 281213, "epoch": 3388} {"train_loss": -25.46137809753418, "global_step": 281214, "epoch": 3388} {"train_loss": -25.18107795715332, "global_step": 281215, "epoch": 3388} {"train_loss": -25.44435691833496, "global_step": 281216, "epoch": 3388} {"train_loss": -25.232868194580078, "global_step": 281217, "epoch": 3388} {"train_loss": -25.665613174438477, "global_step": 281218, "epoch": 3388} {"train_loss": -25.205596923828125, "global_step": 281219, "epoch": 3388} {"train_loss": -25.49067497253418, "global_step": 281220, "epoch": 3388} {"train_loss": -25.22906494140625, "global_step": 281221, "epoch": 3388} {"train_loss": -25.539175033569336, "global_step": 281222, "epoch": 3388} {"train_loss": -25.877634048461914, "global_step": 281223, "epoch": 3388} {"train_loss": -25.35828971862793, "global_step": 281224, "epoch": 3388} {"train_loss": -25.52304458618164, "global_step": 281225, "epoch": 3388} {"train_loss": -25.55501365661621, "global_step": 281226, "epoch": 3388} {"train_loss": -25.275659561157227, "global_step": 281227, "epoch": 3388} {"train_loss": -25.495275497436523, "global_step": 281228, "epoch": 3388} {"train_loss": -25.666162490844727, "global_step": 281229, "epoch": 3388} {"train_loss": -25.592260360717773, "global_step": 281230, "epoch": 3388} {"train_loss": -25.844045639038086, "global_step": 281231, "epoch": 3388} {"train_loss": -25.64306640625, "global_step": 281232, "epoch": 3388} {"train_loss": -25.563243865966797, "global_step": 281233, "epoch": 3388} {"train_loss": -25.55755043029785, "global_step": 281234, "epoch": 3388} {"train_loss": -25.488630294799805, "global_step": 281235, "epoch": 3388} {"train_loss": -25.338117599487305, "global_step": 281236, "epoch": 3388} {"train_loss": -25.37735939025879, "global_step": 281237, "epoch": 3388} {"train_loss": -25.675586700439453, "global_step": 281238, "epoch": 3388} {"train_loss": -25.687824249267578, "global_step": 281239, "epoch": 3388} {"train_loss": -25.38463592529297, "global_step": 281240, "epoch": 3388} {"train_loss": -24.944059371948242, "global_step": 281241, "epoch": 3388} {"train_loss": -24.979415893554688, "global_step": 281242, "epoch": 3388} {"train_loss": -25.7564697265625, "global_step": 281243, "epoch": 3388} {"train_loss": -25.463056564331055, "global_step": 281244, "epoch": 3388} {"train_loss": -24.896299362182617, "global_step": 281245, "epoch": 3388} {"train_loss": -25.438566207885742, "global_step": 281246, "epoch": 3388} {"train_loss": -25.376718521118164, "global_step": 281247, "epoch": 3388} {"train_loss": -25.719263076782227, "global_step": 281248, "epoch": 3388} {"train_loss": -25.51656150817871, "global_step": 281249, "epoch": 3388} {"train_loss": -25.689620971679688, "global_step": 281250, "epoch": 3388} {"train_loss": -25.9320011138916, "global_step": 281251, "epoch": 3388} {"train_loss": -25.470922470092773, "global_step": 281252, "epoch": 3388} {"train_loss": -25.523637771606445, "global_step": 281253, "epoch": 3388} {"train_loss": -25.81599235534668, "global_step": 281254, "epoch": 3388} {"train_loss": -25.6140193939209, "global_step": 281255, "epoch": 3388} {"train_loss": -25.41436767578125, "global_step": 281256, "epoch": 3388} {"train_loss": -25.75278091430664, "global_step": 281257, "epoch": 3388} {"train_loss": -25.486543655395508, "global_step": 281258, "epoch": 3388} {"train_loss": -25.527196884155273, "global_step": 281259, "epoch": 3388} {"train_loss": -25.756174087524414, "global_step": 281260, "epoch": 3388} {"train_loss": -25.668319702148438, "global_step": 281261, "epoch": 3388} {"train_loss": -25.540136337280273, "global_step": 281262, "epoch": 3388} {"train_loss": -25.465993881225586, "global_step": 281263, "epoch": 3388} {"train_loss": -25.242473602294922, "global_step": 281264, "epoch": 3388} {"train_loss": -25.560789108276367, "global_step": 281265, "epoch": 3388} {"train_loss": -25.595245361328125, "global_step": 281266, "epoch": 3388} {"train_loss": -25.317609786987305, "global_step": 281267, "epoch": 3388} {"train_loss": -25.35833740234375, "global_step": 281268, "epoch": 3388} {"train_loss": -25.45420265197754, "global_step": 281269, "epoch": 3388} {"train_loss": -25.228336334228516, "global_step": 281270, "epoch": 3388} {"train_loss": -25.241926193237305, "global_step": 281271, "epoch": 3388} {"train_loss": -24.995718002319336, "global_step": 281272, "epoch": 3388} {"train_loss": -25.378061294555664, "global_step": 281273, "epoch": 3388} {"train_loss": -25.385061264038086, "global_step": 281274, "epoch": 3388} {"train_loss": -25.110889434814453, "global_step": 281275, "epoch": 3388} {"train_loss": -25.502267837524414, "global_step": 281276, "epoch": 3388} {"train_loss": -25.243860244750977, "global_step": 281277, "epoch": 3388} {"train_loss": -25.04340171813965, "global_step": 281278, "epoch": 3388} {"train_loss": -25.169612884521484, "global_step": 281279, "epoch": 3388} {"train_loss": -25.34669303894043, "global_step": 281280, "epoch": 3388} {"train_loss": -25.124387741088867, "global_step": 281281, "epoch": 3388} {"train_loss": -25.364383697509766, "global_step": 281282, "epoch": 3388} {"train_loss": -25.136266708374023, "global_step": 281283, "epoch": 3388} {"train_loss": -25.359256744384766, "global_step": 281284, "epoch": 3388} {"train_loss": -25.257822036743164, "global_step": 281285, "epoch": 3388} {"train_loss": -25.416290673864893, "global_step": 281286, "epoch": 3388, "val_loss": 6907463.0} {"train_loss": -24.871475219726562, "global_step": 281287, "epoch": 3389} {"train_loss": -24.857929229736328, "global_step": 281288, "epoch": 3389} {"train_loss": -25.346813201904297, "global_step": 281289, "epoch": 3389} {"train_loss": -24.87446403503418, "global_step": 281290, "epoch": 3389} {"train_loss": -24.8951416015625, "global_step": 281291, "epoch": 3389} {"train_loss": -24.78772735595703, "global_step": 281292, "epoch": 3389} {"train_loss": -24.95916748046875, "global_step": 281293, "epoch": 3389} {"train_loss": -25.338132858276367, "global_step": 281294, "epoch": 3389} {"train_loss": -24.872236251831055, "global_step": 281295, "epoch": 3389} {"train_loss": -25.073627471923828, "global_step": 281296, "epoch": 3389} {"train_loss": -25.079648971557617, "global_step": 281297, "epoch": 3389} {"train_loss": -25.122129440307617, "global_step": 281298, "epoch": 3389} {"train_loss": -25.168594360351562, "global_step": 281299, "epoch": 3389} {"train_loss": -25.229671478271484, "global_step": 281300, "epoch": 3389} {"train_loss": -25.419979095458984, "global_step": 281301, "epoch": 3389} {"train_loss": -25.018842697143555, "global_step": 281302, "epoch": 3389} {"train_loss": -25.424381256103516, "global_step": 281303, "epoch": 3389} {"train_loss": -25.34613037109375, "global_step": 281304, "epoch": 3389} {"train_loss": -25.407581329345703, "global_step": 281305, "epoch": 3389} {"train_loss": -25.296154022216797, "global_step": 281306, "epoch": 3389} {"train_loss": -25.262685775756836, "global_step": 281307, "epoch": 3389} {"train_loss": -25.236570358276367, "global_step": 281308, "epoch": 3389} {"train_loss": -25.714630126953125, "global_step": 281309, "epoch": 3389} {"train_loss": -25.9031982421875, "global_step": 281310, "epoch": 3389} {"train_loss": -25.50893211364746, "global_step": 281311, "epoch": 3389} {"train_loss": -25.465574264526367, "global_step": 281312, "epoch": 3389} {"train_loss": -25.8054141998291, "global_step": 281313, "epoch": 3389} {"train_loss": -25.448293685913086, "global_step": 281314, "epoch": 3389} {"train_loss": -25.335834503173828, "global_step": 281315, "epoch": 3389} {"train_loss": -25.456342697143555, "global_step": 281316, "epoch": 3389} {"train_loss": -25.39564323425293, "global_step": 281317, "epoch": 3389} {"train_loss": -25.500825881958008, "global_step": 281318, "epoch": 3389} {"train_loss": -25.5122127532959, "global_step": 281319, "epoch": 3389} {"train_loss": -25.66534423828125, "global_step": 281320, "epoch": 3389} {"train_loss": -25.29182243347168, "global_step": 281321, "epoch": 3389} {"train_loss": -25.561431884765625, "global_step": 281322, "epoch": 3389} {"train_loss": -25.658466339111328, "global_step": 281323, "epoch": 3389} {"train_loss": -25.467723846435547, "global_step": 281324, "epoch": 3389} {"train_loss": -25.444454193115234, "global_step": 281325, "epoch": 3389} {"train_loss": -25.343427658081055, "global_step": 281326, "epoch": 3389} {"train_loss": -25.58649444580078, "global_step": 281327, "epoch": 3389} {"train_loss": -25.60100746154785, "global_step": 281328, "epoch": 3389} {"train_loss": -25.9643497467041, "global_step": 281329, "epoch": 3389} {"train_loss": -25.417043685913086, "global_step": 281330, "epoch": 3389} {"train_loss": -25.62455177307129, "global_step": 281331, "epoch": 3389} {"train_loss": -25.903247833251953, "global_step": 281332, "epoch": 3389} {"train_loss": -25.606998443603516, "global_step": 281333, "epoch": 3389} {"train_loss": -25.83090591430664, "global_step": 281334, "epoch": 3389} {"train_loss": -25.86423110961914, "global_step": 281335, "epoch": 3389} {"train_loss": -25.701492309570312, "global_step": 281336, "epoch": 3389} {"train_loss": -25.11928367614746, "global_step": 281337, "epoch": 3389} {"train_loss": -25.19315528869629, "global_step": 281338, "epoch": 3389} {"train_loss": -25.248456954956055, "global_step": 281339, "epoch": 3389} {"train_loss": -25.162681579589844, "global_step": 281340, "epoch": 3389} {"train_loss": -25.112154006958008, "global_step": 281341, "epoch": 3389} {"train_loss": -25.419919967651367, "global_step": 281342, "epoch": 3389} {"train_loss": -25.12861442565918, "global_step": 281343, "epoch": 3389} {"train_loss": -25.28499412536621, "global_step": 281344, "epoch": 3389} {"train_loss": -25.365583419799805, "global_step": 281345, "epoch": 3389} {"train_loss": -25.456527709960938, "global_step": 281346, "epoch": 3389} {"train_loss": -25.322118759155273, "global_step": 281347, "epoch": 3389} {"train_loss": -25.431659698486328, "global_step": 281348, "epoch": 3389} {"train_loss": -25.346372604370117, "global_step": 281349, "epoch": 3389} {"train_loss": -25.356796264648438, "global_step": 281350, "epoch": 3389} {"train_loss": -25.637067794799805, "global_step": 281351, "epoch": 3389} {"train_loss": -25.36488151550293, "global_step": 281352, "epoch": 3389} {"train_loss": -25.33038902282715, "global_step": 281353, "epoch": 3389} {"train_loss": -25.897008895874023, "global_step": 281354, "epoch": 3389} {"train_loss": -25.60202407836914, "global_step": 281355, "epoch": 3389} {"train_loss": -25.247323989868164, "global_step": 281356, "epoch": 3389} {"train_loss": -25.51915168762207, "global_step": 281357, "epoch": 3389} {"train_loss": -25.308979034423828, "global_step": 281358, "epoch": 3389} {"train_loss": -25.5145263671875, "global_step": 281359, "epoch": 3389} {"train_loss": -25.748666763305664, "global_step": 281360, "epoch": 3389} {"train_loss": -25.684921264648438, "global_step": 281361, "epoch": 3389} {"train_loss": -25.45473289489746, "global_step": 281362, "epoch": 3389} {"train_loss": -25.357574462890625, "global_step": 281363, "epoch": 3389} {"train_loss": -25.798492431640625, "global_step": 281364, "epoch": 3389} {"train_loss": -25.882339477539062, "global_step": 281365, "epoch": 3389} {"train_loss": -25.41435432434082, "global_step": 281366, "epoch": 3389} {"train_loss": -25.48348045349121, "global_step": 281367, "epoch": 3389} {"train_loss": -25.731220245361328, "global_step": 281368, "epoch": 3389} {"train_loss": -25.41080362251006, "global_step": 281369, "epoch": 3389, "val_loss": 6977821.0} {"train_loss": -25.12967300415039, "global_step": 281370, "epoch": 3390} {"train_loss": -24.586715698242188, "global_step": 281371, "epoch": 3390} {"train_loss": -24.56658363342285, "global_step": 281372, "epoch": 3390} {"train_loss": -24.52181625366211, "global_step": 281373, "epoch": 3390} {"train_loss": -25.07724952697754, "global_step": 281374, "epoch": 3390} {"train_loss": -24.20160484313965, "global_step": 281375, "epoch": 3390} {"train_loss": -23.8299560546875, "global_step": 281376, "epoch": 3390} {"train_loss": -24.940147399902344, "global_step": 281377, "epoch": 3390} {"train_loss": -25.203596115112305, "global_step": 281378, "epoch": 3390} {"train_loss": -24.51715660095215, "global_step": 281379, "epoch": 3390} {"train_loss": -24.7563533782959, "global_step": 281380, "epoch": 3390} {"train_loss": -25.05057716369629, "global_step": 281381, "epoch": 3390} {"train_loss": -24.334524154663086, "global_step": 281382, "epoch": 3390} {"train_loss": -24.888778686523438, "global_step": 281383, "epoch": 3390} {"train_loss": -24.98672866821289, "global_step": 281384, "epoch": 3390} {"train_loss": -24.734689712524414, "global_step": 281385, "epoch": 3390} {"train_loss": -25.001449584960938, "global_step": 281386, "epoch": 3390} {"train_loss": -24.658241271972656, "global_step": 281387, "epoch": 3390} {"train_loss": -25.226097106933594, "global_step": 281388, "epoch": 3390} {"train_loss": -25.10390281677246, "global_step": 281389, "epoch": 3390} {"train_loss": -24.881072998046875, "global_step": 281390, "epoch": 3390} {"train_loss": -25.126291275024414, "global_step": 281391, "epoch": 3390} {"train_loss": -25.31569480895996, "global_step": 281392, "epoch": 3390} {"train_loss": -25.063613891601562, "global_step": 281393, "epoch": 3390} {"train_loss": -25.24972915649414, "global_step": 281394, "epoch": 3390} {"train_loss": -25.54227638244629, "global_step": 281395, "epoch": 3390} {"train_loss": -25.151403427124023, "global_step": 281396, "epoch": 3390} {"train_loss": -24.93202781677246, "global_step": 281397, "epoch": 3390} {"train_loss": -25.279672622680664, "global_step": 281398, "epoch": 3390} {"train_loss": -25.266788482666016, "global_step": 281399, "epoch": 3390} {"train_loss": -25.772321701049805, "global_step": 281400, "epoch": 3390} {"train_loss": -25.04844093322754, "global_step": 281401, "epoch": 3390} {"train_loss": -25.329029083251953, "global_step": 281402, "epoch": 3390} {"train_loss": -25.337656021118164, "global_step": 281403, "epoch": 3390} {"train_loss": -25.622730255126953, "global_step": 281404, "epoch": 3390} {"train_loss": -25.363492965698242, "global_step": 281405, "epoch": 3390} {"train_loss": -25.30377769470215, "global_step": 281406, "epoch": 3390} {"train_loss": -25.153440475463867, "global_step": 281407, "epoch": 3390} {"train_loss": -25.443912506103516, "global_step": 281408, "epoch": 3390} {"train_loss": -25.04775619506836, "global_step": 281409, "epoch": 3390} {"train_loss": -25.355775833129883, "global_step": 281410, "epoch": 3390} {"train_loss": -25.465879440307617, "global_step": 281411, "epoch": 3390} {"train_loss": -25.127531051635742, "global_step": 281412, "epoch": 3390} {"train_loss": -25.25098991394043, "global_step": 281413, "epoch": 3390} {"train_loss": -25.6019229888916, "global_step": 281414, "epoch": 3390} {"train_loss": -25.179798126220703, "global_step": 281415, "epoch": 3390} {"train_loss": -25.16703224182129, "global_step": 281416, "epoch": 3390} {"train_loss": -25.040693283081055, "global_step": 281417, "epoch": 3390} {"train_loss": -25.450029373168945, "global_step": 281418, "epoch": 3390} {"train_loss": -25.309791564941406, "global_step": 281419, "epoch": 3390} {"train_loss": -25.72100830078125, "global_step": 281420, "epoch": 3390} {"train_loss": -25.66676139831543, "global_step": 281421, "epoch": 3390} {"train_loss": -25.43926429748535, "global_step": 281422, "epoch": 3390} {"train_loss": -25.46060562133789, "global_step": 281423, "epoch": 3390} {"train_loss": -25.188642501831055, "global_step": 281424, "epoch": 3390} {"train_loss": -25.393468856811523, "global_step": 281425, "epoch": 3390} {"train_loss": -25.617212295532227, "global_step": 281426, "epoch": 3390} {"train_loss": -25.180749893188477, "global_step": 281427, "epoch": 3390} {"train_loss": -25.308134078979492, "global_step": 281428, "epoch": 3390} {"train_loss": -25.105905532836914, "global_step": 281429, "epoch": 3390} {"train_loss": -25.3481502532959, "global_step": 281430, "epoch": 3390} {"train_loss": -25.121274948120117, "global_step": 281431, "epoch": 3390} {"train_loss": -25.47736167907715, "global_step": 281432, "epoch": 3390} {"train_loss": -25.210987091064453, "global_step": 281433, "epoch": 3390} {"train_loss": -25.46450424194336, "global_step": 281434, "epoch": 3390} {"train_loss": -25.28090476989746, "global_step": 281435, "epoch": 3390} {"train_loss": -25.18817138671875, "global_step": 281436, "epoch": 3390} {"train_loss": -25.160757064819336, "global_step": 281437, "epoch": 3390} {"train_loss": -25.4914608001709, "global_step": 281438, "epoch": 3390} {"train_loss": -25.120237350463867, "global_step": 281439, "epoch": 3390} {"train_loss": -25.627466201782227, "global_step": 281440, "epoch": 3390} {"train_loss": -25.089319229125977, "global_step": 281441, "epoch": 3390} {"train_loss": -25.582462310791016, "global_step": 281442, "epoch": 3390} {"train_loss": -25.19525718688965, "global_step": 281443, "epoch": 3390} {"train_loss": -25.34274673461914, "global_step": 281444, "epoch": 3390} {"train_loss": -25.357309341430664, "global_step": 281445, "epoch": 3390} {"train_loss": -25.496129989624023, "global_step": 281446, "epoch": 3390} {"train_loss": -25.151687622070312, "global_step": 281447, "epoch": 3390} {"train_loss": -24.936861038208008, "global_step": 281448, "epoch": 3390} {"train_loss": -25.236568450927734, "global_step": 281449, "epoch": 3390} {"train_loss": -25.50461196899414, "global_step": 281450, "epoch": 3390} {"train_loss": -25.124252319335938, "global_step": 281451, "epoch": 3390} {"train_loss": -25.165947052369635, "global_step": 281452, "epoch": 3390, "val_loss": 7181709.0} {"train_loss": -24.851909637451172, "global_step": 281453, "epoch": 3391} {"train_loss": -25.26818084716797, "global_step": 281454, "epoch": 3391} {"train_loss": -24.94595718383789, "global_step": 281455, "epoch": 3391} {"train_loss": -25.041868209838867, "global_step": 281456, "epoch": 3391} {"train_loss": -24.763113021850586, "global_step": 281457, "epoch": 3391} {"train_loss": -25.39874267578125, "global_step": 281458, "epoch": 3391} {"train_loss": -25.11263084411621, "global_step": 281459, "epoch": 3391} {"train_loss": -24.703174591064453, "global_step": 281460, "epoch": 3391} {"train_loss": -24.908323287963867, "global_step": 281461, "epoch": 3391} {"train_loss": -24.855195999145508, "global_step": 281462, "epoch": 3391} {"train_loss": -24.913436889648438, "global_step": 281463, "epoch": 3391} {"train_loss": -25.13178062438965, "global_step": 281464, "epoch": 3391} {"train_loss": -25.081146240234375, "global_step": 281465, "epoch": 3391} {"train_loss": -24.98423194885254, "global_step": 281466, "epoch": 3391} {"train_loss": -25.218448638916016, "global_step": 281467, "epoch": 3391} {"train_loss": -25.595090866088867, "global_step": 281468, "epoch": 3391} {"train_loss": -25.390657424926758, "global_step": 281469, "epoch": 3391} {"train_loss": -25.4376277923584, "global_step": 281470, "epoch": 3391} {"train_loss": -25.571964263916016, "global_step": 281471, "epoch": 3391} {"train_loss": -24.89881706237793, "global_step": 281472, "epoch": 3391} {"train_loss": -25.517288208007812, "global_step": 281473, "epoch": 3391} {"train_loss": -25.46955108642578, "global_step": 281474, "epoch": 3391} {"train_loss": -25.600194931030273, "global_step": 281475, "epoch": 3391} {"train_loss": -25.202167510986328, "global_step": 281476, "epoch": 3391} {"train_loss": -25.540193557739258, "global_step": 281477, "epoch": 3391} {"train_loss": -25.294631958007812, "global_step": 281478, "epoch": 3391} {"train_loss": -25.567651748657227, "global_step": 281479, "epoch": 3391} {"train_loss": -25.176816940307617, "global_step": 281480, "epoch": 3391} {"train_loss": -25.684955596923828, "global_step": 281481, "epoch": 3391} {"train_loss": -25.456212997436523, "global_step": 281482, "epoch": 3391} {"train_loss": -25.654937744140625, "global_step": 281483, "epoch": 3391} {"train_loss": -25.517505645751953, "global_step": 281484, "epoch": 3391} {"train_loss": -25.671369552612305, "global_step": 281485, "epoch": 3391} {"train_loss": -24.95462989807129, "global_step": 281486, "epoch": 3391} {"train_loss": -25.402143478393555, "global_step": 281487, "epoch": 3391} {"train_loss": -25.22161865234375, "global_step": 281488, "epoch": 3391} {"train_loss": -25.7913875579834, "global_step": 281489, "epoch": 3391} {"train_loss": -25.28670310974121, "global_step": 281490, "epoch": 3391} {"train_loss": -25.380788803100586, "global_step": 281491, "epoch": 3391} {"train_loss": -25.31258201599121, "global_step": 281492, "epoch": 3391} {"train_loss": -25.17738151550293, "global_step": 281493, "epoch": 3391} {"train_loss": -25.06950569152832, "global_step": 281494, "epoch": 3391} {"train_loss": -25.54083824157715, "global_step": 281495, "epoch": 3391} {"train_loss": -25.34358787536621, "global_step": 281496, "epoch": 3391} {"train_loss": -25.474716186523438, "global_step": 281497, "epoch": 3391} {"train_loss": -25.25628662109375, "global_step": 281498, "epoch": 3391} {"train_loss": -25.620756149291992, "global_step": 281499, "epoch": 3391} {"train_loss": -25.306215286254883, "global_step": 281500, "epoch": 3391} {"train_loss": -25.335844039916992, "global_step": 281501, "epoch": 3391} {"train_loss": -24.762414932250977, "global_step": 281502, "epoch": 3391} {"train_loss": -25.058683395385742, "global_step": 281503, "epoch": 3391} {"train_loss": -25.7100887298584, "global_step": 281504, "epoch": 3391} {"train_loss": -24.94394874572754, "global_step": 281505, "epoch": 3391} {"train_loss": -24.881643295288086, "global_step": 281506, "epoch": 3391} {"train_loss": -25.363727569580078, "global_step": 281507, "epoch": 3391} {"train_loss": -24.438661575317383, "global_step": 281508, "epoch": 3391} {"train_loss": -24.62397003173828, "global_step": 281509, "epoch": 3391} {"train_loss": -25.260421752929688, "global_step": 281510, "epoch": 3391} {"train_loss": -24.99582290649414, "global_step": 281511, "epoch": 3391} {"train_loss": -25.16143798828125, "global_step": 281512, "epoch": 3391} {"train_loss": -24.93489646911621, "global_step": 281513, "epoch": 3391} {"train_loss": -25.519739151000977, "global_step": 281514, "epoch": 3391} {"train_loss": -25.15303611755371, "global_step": 281515, "epoch": 3391} {"train_loss": -25.506521224975586, "global_step": 281516, "epoch": 3391} {"train_loss": -25.33109474182129, "global_step": 281517, "epoch": 3391} {"train_loss": -25.094684600830078, "global_step": 281518, "epoch": 3391} {"train_loss": -25.172359466552734, "global_step": 281519, "epoch": 3391} {"train_loss": -25.669260025024414, "global_step": 281520, "epoch": 3391} {"train_loss": -25.561748504638672, "global_step": 281521, "epoch": 3391} {"train_loss": -25.636356353759766, "global_step": 281522, "epoch": 3391} {"train_loss": -25.39232635498047, "global_step": 281523, "epoch": 3391} {"train_loss": -25.573545455932617, "global_step": 281524, "epoch": 3391} {"train_loss": -25.24066734313965, "global_step": 281525, "epoch": 3391} {"train_loss": -24.7695255279541, "global_step": 281526, "epoch": 3391} {"train_loss": -25.07954216003418, "global_step": 281527, "epoch": 3391} {"train_loss": -25.2106876373291, "global_step": 281528, "epoch": 3391} {"train_loss": -25.231735229492188, "global_step": 281529, "epoch": 3391} {"train_loss": -25.45805549621582, "global_step": 281530, "epoch": 3391} {"train_loss": -25.33270263671875, "global_step": 281531, "epoch": 3391} {"train_loss": -25.257965087890625, "global_step": 281532, "epoch": 3391} {"train_loss": -25.4418888092041, "global_step": 281533, "epoch": 3391} {"train_loss": -25.467037200927734, "global_step": 281534, "epoch": 3391} {"train_loss": -25.2455447323351, "global_step": 281535, "epoch": 3391, "val_loss": 7146085.0} {"train_loss": -24.47974967956543, "global_step": 281536, "epoch": 3392} {"train_loss": -24.242815017700195, "global_step": 281537, "epoch": 3392} {"train_loss": -24.949039459228516, "global_step": 281538, "epoch": 3392} {"train_loss": -24.69205665588379, "global_step": 281539, "epoch": 3392} {"train_loss": -25.425004959106445, "global_step": 281540, "epoch": 3392} {"train_loss": -24.642789840698242, "global_step": 281541, "epoch": 3392} {"train_loss": -25.62226676940918, "global_step": 281542, "epoch": 3392} {"train_loss": -24.94674301147461, "global_step": 281543, "epoch": 3392} {"train_loss": -25.33466148376465, "global_step": 281544, "epoch": 3392} {"train_loss": -25.361169815063477, "global_step": 281545, "epoch": 3392} {"train_loss": -25.188739776611328, "global_step": 281546, "epoch": 3392} {"train_loss": -25.128395080566406, "global_step": 281547, "epoch": 3392} {"train_loss": -24.907957077026367, "global_step": 281548, "epoch": 3392} {"train_loss": -25.300321578979492, "global_step": 281549, "epoch": 3392} {"train_loss": -25.275754928588867, "global_step": 281550, "epoch": 3392} {"train_loss": -25.023052215576172, "global_step": 281551, "epoch": 3392} {"train_loss": -25.134540557861328, "global_step": 281552, "epoch": 3392} {"train_loss": -25.378705978393555, "global_step": 281553, "epoch": 3392} {"train_loss": -25.35215187072754, "global_step": 281554, "epoch": 3392} {"train_loss": -25.483997344970703, "global_step": 281555, "epoch": 3392} {"train_loss": -25.0965633392334, "global_step": 281556, "epoch": 3392} {"train_loss": -24.875335693359375, "global_step": 281557, "epoch": 3392} {"train_loss": -25.232534408569336, "global_step": 281558, "epoch": 3392} {"train_loss": -25.6850643157959, "global_step": 281559, "epoch": 3392} {"train_loss": -25.3214054107666, "global_step": 281560, "epoch": 3392} {"train_loss": -25.53354835510254, "global_step": 281561, "epoch": 3392} {"train_loss": -25.384981155395508, "global_step": 281562, "epoch": 3392} {"train_loss": -25.54485321044922, "global_step": 281563, "epoch": 3392} {"train_loss": -25.45162010192871, "global_step": 281564, "epoch": 3392} {"train_loss": -25.661712646484375, "global_step": 281565, "epoch": 3392} {"train_loss": -25.235355377197266, "global_step": 281566, "epoch": 3392} {"train_loss": -25.509803771972656, "global_step": 281567, "epoch": 3392} {"train_loss": -25.159263610839844, "global_step": 281568, "epoch": 3392} {"train_loss": -25.58701515197754, "global_step": 281569, "epoch": 3392} {"train_loss": -25.830463409423828, "global_step": 281570, "epoch": 3392} {"train_loss": -25.491270065307617, "global_step": 281571, "epoch": 3392} {"train_loss": -25.528715133666992, "global_step": 281572, "epoch": 3392} {"train_loss": -25.478771209716797, "global_step": 281573, "epoch": 3392} {"train_loss": -25.43130874633789, "global_step": 281574, "epoch": 3392} {"train_loss": -25.127914428710938, "global_step": 281575, "epoch": 3392} {"train_loss": -25.50909996032715, "global_step": 281576, "epoch": 3392} {"train_loss": -25.605600357055664, "global_step": 281577, "epoch": 3392} {"train_loss": -25.806079864501953, "global_step": 281578, "epoch": 3392} {"train_loss": -25.3323917388916, "global_step": 281579, "epoch": 3392} {"train_loss": -25.441118240356445, "global_step": 281580, "epoch": 3392} {"train_loss": -25.49384880065918, "global_step": 281581, "epoch": 3392} {"train_loss": -25.59187126159668, "global_step": 281582, "epoch": 3392} {"train_loss": -25.265213012695312, "global_step": 281583, "epoch": 3392} {"train_loss": -25.636199951171875, "global_step": 281584, "epoch": 3392} {"train_loss": -25.515363693237305, "global_step": 281585, "epoch": 3392} {"train_loss": -25.09229850769043, "global_step": 281586, "epoch": 3392} {"train_loss": -24.963220596313477, "global_step": 281587, "epoch": 3392} {"train_loss": -25.56391716003418, "global_step": 281588, "epoch": 3392} {"train_loss": -25.42561149597168, "global_step": 281589, "epoch": 3392} {"train_loss": -25.426069259643555, "global_step": 281590, "epoch": 3392} {"train_loss": -25.718542098999023, "global_step": 281591, "epoch": 3392} {"train_loss": -25.54135513305664, "global_step": 281592, "epoch": 3392} {"train_loss": -25.531024932861328, "global_step": 281593, "epoch": 3392} {"train_loss": -25.666128158569336, "global_step": 281594, "epoch": 3392} {"train_loss": -25.27012825012207, "global_step": 281595, "epoch": 3392} {"train_loss": -25.28541374206543, "global_step": 281596, "epoch": 3392} {"train_loss": -25.362192153930664, "global_step": 281597, "epoch": 3392} {"train_loss": -25.564313888549805, "global_step": 281598, "epoch": 3392} {"train_loss": -25.357778549194336, "global_step": 281599, "epoch": 3392} {"train_loss": -25.49301528930664, "global_step": 281600, "epoch": 3392} {"train_loss": -25.678241729736328, "global_step": 281601, "epoch": 3392} {"train_loss": -25.369508743286133, "global_step": 281602, "epoch": 3392} {"train_loss": -25.27902603149414, "global_step": 281603, "epoch": 3392} {"train_loss": -25.744001388549805, "global_step": 281604, "epoch": 3392} {"train_loss": -25.555614471435547, "global_step": 281605, "epoch": 3392} {"train_loss": -25.50373649597168, "global_step": 281606, "epoch": 3392} {"train_loss": -25.655475616455078, "global_step": 281607, "epoch": 3392} {"train_loss": -25.104759216308594, "global_step": 281608, "epoch": 3392} {"train_loss": -25.617826461791992, "global_step": 281609, "epoch": 3392} {"train_loss": -25.2950496673584, "global_step": 281610, "epoch": 3392} {"train_loss": -25.042449951171875, "global_step": 281611, "epoch": 3392} {"train_loss": -25.634979248046875, "global_step": 281612, "epoch": 3392} {"train_loss": -25.168699264526367, "global_step": 281613, "epoch": 3392} {"train_loss": -25.14019012451172, "global_step": 281614, "epoch": 3392} {"train_loss": -25.14392852783203, "global_step": 281615, "epoch": 3392} {"train_loss": -25.820348739624023, "global_step": 281616, "epoch": 3392} {"train_loss": -25.652252197265625, "global_step": 281617, "epoch": 3392} {"train_loss": -25.35562584199101, "global_step": 281618, "epoch": 3392, "val_loss": 7204400.0} {"train_loss": -24.274267196655273, "global_step": 281619, "epoch": 3393} {"train_loss": -24.255170822143555, "global_step": 281620, "epoch": 3393} {"train_loss": -23.862363815307617, "global_step": 281621, "epoch": 3393} {"train_loss": -24.650243759155273, "global_step": 281622, "epoch": 3393} {"train_loss": -24.596548080444336, "global_step": 281623, "epoch": 3393} {"train_loss": -24.40224266052246, "global_step": 281624, "epoch": 3393} {"train_loss": -24.58673095703125, "global_step": 281625, "epoch": 3393} {"train_loss": -24.734846115112305, "global_step": 281626, "epoch": 3393} {"train_loss": -24.67341423034668, "global_step": 281627, "epoch": 3393} {"train_loss": -24.022153854370117, "global_step": 281628, "epoch": 3393} {"train_loss": -24.70456886291504, "global_step": 281629, "epoch": 3393} {"train_loss": -24.745542526245117, "global_step": 281630, "epoch": 3393} {"train_loss": -24.494863510131836, "global_step": 281631, "epoch": 3393} {"train_loss": -24.873374938964844, "global_step": 281632, "epoch": 3393} {"train_loss": -24.880268096923828, "global_step": 281633, "epoch": 3393} {"train_loss": -24.574508666992188, "global_step": 281634, "epoch": 3393} {"train_loss": -25.000364303588867, "global_step": 281635, "epoch": 3393} {"train_loss": -25.206388473510742, "global_step": 281636, "epoch": 3393} {"train_loss": -24.953420639038086, "global_step": 281637, "epoch": 3393} {"train_loss": -25.335336685180664, "global_step": 281638, "epoch": 3393} {"train_loss": -24.976064682006836, "global_step": 281639, "epoch": 3393} {"train_loss": -25.08209228515625, "global_step": 281640, "epoch": 3393} {"train_loss": -24.812612533569336, "global_step": 281641, "epoch": 3393} {"train_loss": -25.07007598876953, "global_step": 281642, "epoch": 3393} {"train_loss": -25.072385787963867, "global_step": 281643, "epoch": 3393} {"train_loss": -25.03308868408203, "global_step": 281644, "epoch": 3393} {"train_loss": -24.952817916870117, "global_step": 281645, "epoch": 3393} {"train_loss": -24.959136962890625, "global_step": 281646, "epoch": 3393} {"train_loss": -25.588769912719727, "global_step": 281647, "epoch": 3393} {"train_loss": -24.968936920166016, "global_step": 281648, "epoch": 3393} {"train_loss": -25.35159683227539, "global_step": 281649, "epoch": 3393} {"train_loss": -25.2479248046875, "global_step": 281650, "epoch": 3393} {"train_loss": -25.352554321289062, "global_step": 281651, "epoch": 3393} {"train_loss": -25.556516647338867, "global_step": 281652, "epoch": 3393} {"train_loss": -25.30185890197754, "global_step": 281653, "epoch": 3393} {"train_loss": -25.257278442382812, "global_step": 281654, "epoch": 3393} {"train_loss": -25.602832794189453, "global_step": 281655, "epoch": 3393} {"train_loss": -25.5725040435791, "global_step": 281656, "epoch": 3393} {"train_loss": -25.719141006469727, "global_step": 281657, "epoch": 3393} {"train_loss": -25.500986099243164, "global_step": 281658, "epoch": 3393} {"train_loss": -25.355844497680664, "global_step": 281659, "epoch": 3393} {"train_loss": -25.650339126586914, "global_step": 281660, "epoch": 3393} {"train_loss": -25.302297592163086, "global_step": 281661, "epoch": 3393} {"train_loss": -25.28835105895996, "global_step": 281662, "epoch": 3393} {"train_loss": -25.650257110595703, "global_step": 281663, "epoch": 3393} {"train_loss": -25.339921951293945, "global_step": 281664, "epoch": 3393} {"train_loss": -25.75880241394043, "global_step": 281665, "epoch": 3393} {"train_loss": -25.547901153564453, "global_step": 281666, "epoch": 3393} {"train_loss": -25.97920799255371, "global_step": 281667, "epoch": 3393} {"train_loss": -25.25254249572754, "global_step": 281668, "epoch": 3393} {"train_loss": -25.35264778137207, "global_step": 281669, "epoch": 3393} {"train_loss": -25.101306915283203, "global_step": 281670, "epoch": 3393} {"train_loss": -25.59413719177246, "global_step": 281671, "epoch": 3393} {"train_loss": -25.602697372436523, "global_step": 281672, "epoch": 3393} {"train_loss": -25.590641021728516, "global_step": 281673, "epoch": 3393} {"train_loss": -25.471738815307617, "global_step": 281674, "epoch": 3393} {"train_loss": -25.804792404174805, "global_step": 281675, "epoch": 3393} {"train_loss": -25.62845802307129, "global_step": 281676, "epoch": 3393} {"train_loss": -25.36390495300293, "global_step": 281677, "epoch": 3393} {"train_loss": -24.988372802734375, "global_step": 281678, "epoch": 3393} {"train_loss": -25.401676177978516, "global_step": 281679, "epoch": 3393} {"train_loss": -25.576562881469727, "global_step": 281680, "epoch": 3393} {"train_loss": -25.445571899414062, "global_step": 281681, "epoch": 3393} {"train_loss": -25.476566314697266, "global_step": 281682, "epoch": 3393} {"train_loss": -25.594106674194336, "global_step": 281683, "epoch": 3393} {"train_loss": -25.727249145507812, "global_step": 281684, "epoch": 3393} {"train_loss": -25.555686950683594, "global_step": 281685, "epoch": 3393} {"train_loss": -25.016651153564453, "global_step": 281686, "epoch": 3393} {"train_loss": -25.080671310424805, "global_step": 281687, "epoch": 3393} {"train_loss": -25.61371421813965, "global_step": 281688, "epoch": 3393} {"train_loss": -25.905475616455078, "global_step": 281689, "epoch": 3393} {"train_loss": -25.20183753967285, "global_step": 281690, "epoch": 3393} {"train_loss": -25.108083724975586, "global_step": 281691, "epoch": 3393} {"train_loss": -25.413394927978516, "global_step": 281692, "epoch": 3393} {"train_loss": -25.602115631103516, "global_step": 281693, "epoch": 3393} {"train_loss": -25.29796028137207, "global_step": 281694, "epoch": 3393} {"train_loss": -25.805402755737305, "global_step": 281695, "epoch": 3393} {"train_loss": -25.531482696533203, "global_step": 281696, "epoch": 3393} {"train_loss": -25.401065826416016, "global_step": 281697, "epoch": 3393} {"train_loss": -25.822525024414062, "global_step": 281698, "epoch": 3393} {"train_loss": -25.737112045288086, "global_step": 281699, "epoch": 3393} {"train_loss": -25.3291072845459, "global_step": 281700, "epoch": 3393} {"train_loss": -25.218747908810535, "global_step": 281701, "epoch": 3393, "val_loss": 7272329.0} {"train_loss": -24.0978946685791, "global_step": 281702, "epoch": 3394} {"train_loss": -23.71244239807129, "global_step": 281703, "epoch": 3394} {"train_loss": -23.167871475219727, "global_step": 281704, "epoch": 3394} {"train_loss": -24.145221710205078, "global_step": 281705, "epoch": 3394} {"train_loss": -24.23397445678711, "global_step": 281706, "epoch": 3394} {"train_loss": -24.593746185302734, "global_step": 281707, "epoch": 3394} {"train_loss": -24.702903747558594, "global_step": 281708, "epoch": 3394} {"train_loss": -24.77054786682129, "global_step": 281709, "epoch": 3394} {"train_loss": -24.644548416137695, "global_step": 281710, "epoch": 3394} {"train_loss": -24.291072845458984, "global_step": 281711, "epoch": 3394} {"train_loss": -24.81560707092285, "global_step": 281712, "epoch": 3394} {"train_loss": -24.501888275146484, "global_step": 281713, "epoch": 3394} {"train_loss": -24.955249786376953, "global_step": 281714, "epoch": 3394} {"train_loss": -24.88886260986328, "global_step": 281715, "epoch": 3394} {"train_loss": -25.110509872436523, "global_step": 281716, "epoch": 3394} {"train_loss": -24.842382431030273, "global_step": 281717, "epoch": 3394} {"train_loss": -24.94667625427246, "global_step": 281718, "epoch": 3394} {"train_loss": -25.069028854370117, "global_step": 281719, "epoch": 3394} {"train_loss": -25.086606979370117, "global_step": 281720, "epoch": 3394} {"train_loss": -24.77644157409668, "global_step": 281721, "epoch": 3394} {"train_loss": -25.329076766967773, "global_step": 281722, "epoch": 3394} {"train_loss": -25.194425582885742, "global_step": 281723, "epoch": 3394} {"train_loss": -25.340612411499023, "global_step": 281724, "epoch": 3394} {"train_loss": -24.970937728881836, "global_step": 281725, "epoch": 3394} {"train_loss": -25.388137817382812, "global_step": 281726, "epoch": 3394} {"train_loss": -25.20161247253418, "global_step": 281727, "epoch": 3394} {"train_loss": -25.37300682067871, "global_step": 281728, "epoch": 3394} {"train_loss": -25.408235549926758, "global_step": 281729, "epoch": 3394} {"train_loss": -25.41862678527832, "global_step": 281730, "epoch": 3394} {"train_loss": -24.980724334716797, "global_step": 281731, "epoch": 3394} {"train_loss": -25.34473991394043, "global_step": 281732, "epoch": 3394} {"train_loss": -25.053815841674805, "global_step": 281733, "epoch": 3394} {"train_loss": -25.19111442565918, "global_step": 281734, "epoch": 3394} {"train_loss": -25.451749801635742, "global_step": 281735, "epoch": 3394} {"train_loss": -25.5458927154541, "global_step": 281736, "epoch": 3394} {"train_loss": -25.463346481323242, "global_step": 281737, "epoch": 3394} {"train_loss": -25.343732833862305, "global_step": 281738, "epoch": 3394} {"train_loss": -25.543638229370117, "global_step": 281739, "epoch": 3394} {"train_loss": -25.1224365234375, "global_step": 281740, "epoch": 3394} {"train_loss": -25.762739181518555, "global_step": 281741, "epoch": 3394} {"train_loss": -25.37453269958496, "global_step": 281742, "epoch": 3394} {"train_loss": -25.096033096313477, "global_step": 281743, "epoch": 3394} {"train_loss": -25.67718505859375, "global_step": 281744, "epoch": 3394} {"train_loss": -25.63503074645996, "global_step": 281745, "epoch": 3394} {"train_loss": -25.673099517822266, "global_step": 281746, "epoch": 3394} {"train_loss": -25.62102699279785, "global_step": 281747, "epoch": 3394} {"train_loss": -25.442676544189453, "global_step": 281748, "epoch": 3394} {"train_loss": -25.605682373046875, "global_step": 281749, "epoch": 3394} {"train_loss": -25.674671173095703, "global_step": 281750, "epoch": 3394} {"train_loss": -25.631534576416016, "global_step": 281751, "epoch": 3394} {"train_loss": -25.781164169311523, "global_step": 281752, "epoch": 3394} {"train_loss": -25.707523345947266, "global_step": 281753, "epoch": 3394} {"train_loss": -25.822111129760742, "global_step": 281754, "epoch": 3394} {"train_loss": -25.799789428710938, "global_step": 281755, "epoch": 3394} {"train_loss": -25.59930992126465, "global_step": 281756, "epoch": 3394} {"train_loss": -25.58085823059082, "global_step": 281757, "epoch": 3394} {"train_loss": -25.494129180908203, "global_step": 281758, "epoch": 3394} {"train_loss": -24.99098014831543, "global_step": 281759, "epoch": 3394} {"train_loss": -25.65260124206543, "global_step": 281760, "epoch": 3394} {"train_loss": -25.42776870727539, "global_step": 281761, "epoch": 3394} {"train_loss": -25.19904899597168, "global_step": 281762, "epoch": 3394} {"train_loss": -25.157224655151367, "global_step": 281763, "epoch": 3394} {"train_loss": -25.4574031829834, "global_step": 281764, "epoch": 3394} {"train_loss": -25.406660079956055, "global_step": 281765, "epoch": 3394} {"train_loss": -25.603734970092773, "global_step": 281766, "epoch": 3394} {"train_loss": -25.248762130737305, "global_step": 281767, "epoch": 3394} {"train_loss": -24.988178253173828, "global_step": 281768, "epoch": 3394} {"train_loss": -25.687591552734375, "global_step": 281769, "epoch": 3394} {"train_loss": -25.08786392211914, "global_step": 281770, "epoch": 3394} {"train_loss": -25.745466232299805, "global_step": 281771, "epoch": 3394} {"train_loss": -25.42792510986328, "global_step": 281772, "epoch": 3394} {"train_loss": -25.238269805908203, "global_step": 281773, "epoch": 3394} {"train_loss": -25.249834060668945, "global_step": 281774, "epoch": 3394} {"train_loss": -25.07887840270996, "global_step": 281775, "epoch": 3394} {"train_loss": -25.599185943603516, "global_step": 281776, "epoch": 3394} {"train_loss": -25.526758193969727, "global_step": 281777, "epoch": 3394} {"train_loss": -25.913297653198242, "global_step": 281778, "epoch": 3394} {"train_loss": -26.069761276245117, "global_step": 281779, "epoch": 3394} {"train_loss": -25.50553321838379, "global_step": 281780, "epoch": 3394} {"train_loss": -25.7308406829834, "global_step": 281781, "epoch": 3394} {"train_loss": -25.480457305908203, "global_step": 281782, "epoch": 3394} {"train_loss": -25.579360961914062, "global_step": 281783, "epoch": 3394} {"train_loss": -25.226516470851667, "global_step": 281784, "epoch": 3394, "val_loss": 7109811.0} {"train_loss": -24.688657760620117, "global_step": 281785, "epoch": 3395} {"train_loss": -24.7416934967041, "global_step": 281786, "epoch": 3395} {"train_loss": -24.645679473876953, "global_step": 281787, "epoch": 3395} {"train_loss": -24.579870223999023, "global_step": 281788, "epoch": 3395} {"train_loss": -24.437164306640625, "global_step": 281789, "epoch": 3395} {"train_loss": -24.984525680541992, "global_step": 281790, "epoch": 3395} {"train_loss": -24.89067840576172, "global_step": 281791, "epoch": 3395} {"train_loss": -24.900074005126953, "global_step": 281792, "epoch": 3395} {"train_loss": -24.900962829589844, "global_step": 281793, "epoch": 3395} {"train_loss": -24.5546817779541, "global_step": 281794, "epoch": 3395} {"train_loss": -25.466033935546875, "global_step": 281795, "epoch": 3395} {"train_loss": -25.24700927734375, "global_step": 281796, "epoch": 3395} {"train_loss": -24.885433197021484, "global_step": 281797, "epoch": 3395} {"train_loss": -25.1319522857666, "global_step": 281798, "epoch": 3395} {"train_loss": -25.136449813842773, "global_step": 281799, "epoch": 3395} {"train_loss": -24.97211265563965, "global_step": 281800, "epoch": 3395} {"train_loss": -25.259357452392578, "global_step": 281801, "epoch": 3395} {"train_loss": -25.360822677612305, "global_step": 281802, "epoch": 3395} {"train_loss": -24.793500900268555, "global_step": 281803, "epoch": 3395} {"train_loss": -25.491302490234375, "global_step": 281804, "epoch": 3395} {"train_loss": -25.424577713012695, "global_step": 281805, "epoch": 3395} {"train_loss": -25.501171112060547, "global_step": 281806, "epoch": 3395} {"train_loss": -25.31025505065918, "global_step": 281807, "epoch": 3395} {"train_loss": -25.50436782836914, "global_step": 281808, "epoch": 3395} {"train_loss": -25.2197208404541, "global_step": 281809, "epoch": 3395} {"train_loss": -25.57145118713379, "global_step": 281810, "epoch": 3395} {"train_loss": -25.715351104736328, "global_step": 281811, "epoch": 3395} {"train_loss": -25.005483627319336, "global_step": 281812, "epoch": 3395} {"train_loss": -25.46158790588379, "global_step": 281813, "epoch": 3395} {"train_loss": -25.356870651245117, "global_step": 281814, "epoch": 3395} {"train_loss": -25.325284957885742, "global_step": 281815, "epoch": 3395} {"train_loss": -25.079870223999023, "global_step": 281816, "epoch": 3395} {"train_loss": -25.584331512451172, "global_step": 281817, "epoch": 3395} {"train_loss": -25.491607666015625, "global_step": 281818, "epoch": 3395} {"train_loss": -25.428823471069336, "global_step": 281819, "epoch": 3395} {"train_loss": -25.340091705322266, "global_step": 281820, "epoch": 3395} {"train_loss": -25.6427059173584, "global_step": 281821, "epoch": 3395} {"train_loss": -25.313230514526367, "global_step": 281822, "epoch": 3395} {"train_loss": -25.687158584594727, "global_step": 281823, "epoch": 3395} {"train_loss": -25.360300064086914, "global_step": 281824, "epoch": 3395} {"train_loss": -25.430469512939453, "global_step": 281825, "epoch": 3395} {"train_loss": -25.62794303894043, "global_step": 281826, "epoch": 3395} {"train_loss": -25.635114669799805, "global_step": 281827, "epoch": 3395} {"train_loss": -25.722625732421875, "global_step": 281828, "epoch": 3395} {"train_loss": -25.458250045776367, "global_step": 281829, "epoch": 3395} {"train_loss": -25.495630264282227, "global_step": 281830, "epoch": 3395} {"train_loss": -25.502700805664062, "global_step": 281831, "epoch": 3395} {"train_loss": -25.636327743530273, "global_step": 281832, "epoch": 3395} {"train_loss": -25.514780044555664, "global_step": 281833, "epoch": 3395} {"train_loss": -25.26627540588379, "global_step": 281834, "epoch": 3395} {"train_loss": -25.595144271850586, "global_step": 281835, "epoch": 3395} {"train_loss": -25.846988677978516, "global_step": 281836, "epoch": 3395} {"train_loss": -25.567781448364258, "global_step": 281837, "epoch": 3395} {"train_loss": -25.528066635131836, "global_step": 281838, "epoch": 3395} {"train_loss": -25.429698944091797, "global_step": 281839, "epoch": 3395} {"train_loss": -25.623884201049805, "global_step": 281840, "epoch": 3395} {"train_loss": -25.464298248291016, "global_step": 281841, "epoch": 3395} {"train_loss": -25.529647827148438, "global_step": 281842, "epoch": 3395} {"train_loss": -25.685171127319336, "global_step": 281843, "epoch": 3395} {"train_loss": -25.534046173095703, "global_step": 281844, "epoch": 3395} {"train_loss": -25.61018943786621, "global_step": 281845, "epoch": 3395} {"train_loss": -25.9626407623291, "global_step": 281846, "epoch": 3395} {"train_loss": -25.483898162841797, "global_step": 281847, "epoch": 3395} {"train_loss": -25.509323120117188, "global_step": 281848, "epoch": 3395} {"train_loss": -25.473981857299805, "global_step": 281849, "epoch": 3395} {"train_loss": -25.248014450073242, "global_step": 281850, "epoch": 3395} {"train_loss": -25.492891311645508, "global_step": 281851, "epoch": 3395} {"train_loss": -25.195524215698242, "global_step": 281852, "epoch": 3395} {"train_loss": -25.3204402923584, "global_step": 281853, "epoch": 3395} {"train_loss": -25.60340690612793, "global_step": 281854, "epoch": 3395} {"train_loss": -25.21494483947754, "global_step": 281855, "epoch": 3395} {"train_loss": -25.419158935546875, "global_step": 281856, "epoch": 3395} {"train_loss": -25.345111846923828, "global_step": 281857, "epoch": 3395} {"train_loss": -25.822675704956055, "global_step": 281858, "epoch": 3395} {"train_loss": -25.333860397338867, "global_step": 281859, "epoch": 3395} {"train_loss": -25.7990665435791, "global_step": 281860, "epoch": 3395} {"train_loss": -25.505216598510742, "global_step": 281861, "epoch": 3395} {"train_loss": -25.411149978637695, "global_step": 281862, "epoch": 3395} {"train_loss": -25.2366943359375, "global_step": 281863, "epoch": 3395} {"train_loss": -25.8501033782959, "global_step": 281864, "epoch": 3395} {"train_loss": -25.394750595092773, "global_step": 281865, "epoch": 3395} {"train_loss": -25.34902572631836, "global_step": 281866, "epoch": 3395} {"train_loss": -25.36122400214873, "global_step": 281867, "epoch": 3395, "val_loss": 7068652.0} {"train_loss": -25.15118980407715, "global_step": 281868, "epoch": 3396} {"train_loss": -25.123485565185547, "global_step": 281869, "epoch": 3396} {"train_loss": -25.05061912536621, "global_step": 281870, "epoch": 3396} {"train_loss": -25.943273544311523, "global_step": 281871, "epoch": 3396} {"train_loss": -25.0654296875, "global_step": 281872, "epoch": 3396} {"train_loss": -24.9011287689209, "global_step": 281873, "epoch": 3396} {"train_loss": -25.391077041625977, "global_step": 281874, "epoch": 3396} {"train_loss": -25.314010620117188, "global_step": 281875, "epoch": 3396} {"train_loss": -25.145145416259766, "global_step": 281876, "epoch": 3396} {"train_loss": -25.18160057067871, "global_step": 281877, "epoch": 3396} {"train_loss": -24.97381019592285, "global_step": 281878, "epoch": 3396} {"train_loss": -25.315418243408203, "global_step": 281879, "epoch": 3396} {"train_loss": -25.400531768798828, "global_step": 281880, "epoch": 3396} {"train_loss": -25.260818481445312, "global_step": 281881, "epoch": 3396} {"train_loss": -25.725666046142578, "global_step": 281882, "epoch": 3396} {"train_loss": -25.39444923400879, "global_step": 281883, "epoch": 3396} {"train_loss": -25.47446060180664, "global_step": 281884, "epoch": 3396} {"train_loss": -25.43402099609375, "global_step": 281885, "epoch": 3396} {"train_loss": -25.607038497924805, "global_step": 281886, "epoch": 3396} {"train_loss": -25.400320053100586, "global_step": 281887, "epoch": 3396} {"train_loss": -25.558063507080078, "global_step": 281888, "epoch": 3396} {"train_loss": -25.604480743408203, "global_step": 281889, "epoch": 3396} {"train_loss": -24.990385055541992, "global_step": 281890, "epoch": 3396} {"train_loss": -25.304784774780273, "global_step": 281891, "epoch": 3396} {"train_loss": -24.963598251342773, "global_step": 281892, "epoch": 3396} {"train_loss": -25.368896484375, "global_step": 281893, "epoch": 3396} {"train_loss": -25.365402221679688, "global_step": 281894, "epoch": 3396} {"train_loss": -25.495529174804688, "global_step": 281895, "epoch": 3396} {"train_loss": -25.053375244140625, "global_step": 281896, "epoch": 3396} {"train_loss": -24.717802047729492, "global_step": 281897, "epoch": 3396} {"train_loss": -25.23193359375, "global_step": 281898, "epoch": 3396} {"train_loss": -25.606769561767578, "global_step": 281899, "epoch": 3396} {"train_loss": -25.152088165283203, "global_step": 281900, "epoch": 3396} {"train_loss": -25.055150985717773, "global_step": 281901, "epoch": 3396} {"train_loss": -25.636459350585938, "global_step": 281902, "epoch": 3396} {"train_loss": -25.223079681396484, "global_step": 281903, "epoch": 3396} {"train_loss": -25.33473777770996, "global_step": 281904, "epoch": 3396} {"train_loss": -25.489349365234375, "global_step": 281905, "epoch": 3396} {"train_loss": -25.160362243652344, "global_step": 281906, "epoch": 3396} {"train_loss": -25.306594848632812, "global_step": 281907, "epoch": 3396} {"train_loss": -25.574356079101562, "global_step": 281908, "epoch": 3396} {"train_loss": -25.145727157592773, "global_step": 281909, "epoch": 3396} {"train_loss": -25.632068634033203, "global_step": 281910, "epoch": 3396} {"train_loss": -25.491117477416992, "global_step": 281911, "epoch": 3396} {"train_loss": -25.727737426757812, "global_step": 281912, "epoch": 3396} {"train_loss": -25.866201400756836, "global_step": 281913, "epoch": 3396} {"train_loss": -25.499340057373047, "global_step": 281914, "epoch": 3396} {"train_loss": -25.709653854370117, "global_step": 281915, "epoch": 3396} {"train_loss": -25.358478546142578, "global_step": 281916, "epoch": 3396} {"train_loss": -25.454126358032227, "global_step": 281917, "epoch": 3396} {"train_loss": -25.685007095336914, "global_step": 281918, "epoch": 3396} {"train_loss": -25.781518936157227, "global_step": 281919, "epoch": 3396} {"train_loss": -25.380996704101562, "global_step": 281920, "epoch": 3396} {"train_loss": -25.61018180847168, "global_step": 281921, "epoch": 3396} {"train_loss": -25.481950759887695, "global_step": 281922, "epoch": 3396} {"train_loss": -25.88408851623535, "global_step": 281923, "epoch": 3396} {"train_loss": -25.496444702148438, "global_step": 281924, "epoch": 3396} {"train_loss": -25.330467224121094, "global_step": 281925, "epoch": 3396} {"train_loss": -25.48615264892578, "global_step": 281926, "epoch": 3396} {"train_loss": -25.69563102722168, "global_step": 281927, "epoch": 3396} {"train_loss": -25.34234619140625, "global_step": 281928, "epoch": 3396} {"train_loss": -25.79694175720215, "global_step": 281929, "epoch": 3396} {"train_loss": -25.683149337768555, "global_step": 281930, "epoch": 3396} {"train_loss": -25.4957218170166, "global_step": 281931, "epoch": 3396} {"train_loss": -25.249204635620117, "global_step": 281932, "epoch": 3396} {"train_loss": -25.959314346313477, "global_step": 281933, "epoch": 3396} {"train_loss": -25.11536407470703, "global_step": 281934, "epoch": 3396} {"train_loss": -25.46949577331543, "global_step": 281935, "epoch": 3396} {"train_loss": -25.127653121948242, "global_step": 281936, "epoch": 3396} {"train_loss": -25.700475692749023, "global_step": 281937, "epoch": 3396} {"train_loss": -25.300642013549805, "global_step": 281938, "epoch": 3396} {"train_loss": -25.747243881225586, "global_step": 281939, "epoch": 3396} {"train_loss": -25.584592819213867, "global_step": 281940, "epoch": 3396} {"train_loss": -24.925682067871094, "global_step": 281941, "epoch": 3396} {"train_loss": -25.485610961914062, "global_step": 281942, "epoch": 3396} {"train_loss": -25.88034439086914, "global_step": 281943, "epoch": 3396} {"train_loss": -25.15903091430664, "global_step": 281944, "epoch": 3396} {"train_loss": -25.061328887939453, "global_step": 281945, "epoch": 3396} {"train_loss": -24.70429801940918, "global_step": 281946, "epoch": 3396} {"train_loss": -25.520130157470703, "global_step": 281947, "epoch": 3396} {"train_loss": -25.402755737304688, "global_step": 281948, "epoch": 3396} {"train_loss": -25.347463607788086, "global_step": 281949, "epoch": 3396} {"train_loss": -25.397689635495105, "global_step": 281950, "epoch": 3396, "val_loss": 7119072.5} {"train_loss": -25.07803726196289, "global_step": 281951, "epoch": 3397} {"train_loss": -24.86210060119629, "global_step": 281952, "epoch": 3397} {"train_loss": -25.174758911132812, "global_step": 281953, "epoch": 3397} {"train_loss": -25.250747680664062, "global_step": 281954, "epoch": 3397} {"train_loss": -25.021493911743164, "global_step": 281955, "epoch": 3397} {"train_loss": -24.86442756652832, "global_step": 281956, "epoch": 3397} {"train_loss": -25.062978744506836, "global_step": 281957, "epoch": 3397} {"train_loss": -25.351152420043945, "global_step": 281958, "epoch": 3397} {"train_loss": -25.37353515625, "global_step": 281959, "epoch": 3397} {"train_loss": -25.185712814331055, "global_step": 281960, "epoch": 3397} {"train_loss": -24.937490463256836, "global_step": 281961, "epoch": 3397} {"train_loss": -25.30726432800293, "global_step": 281962, "epoch": 3397} {"train_loss": -25.272823333740234, "global_step": 281963, "epoch": 3397} {"train_loss": -25.402799606323242, "global_step": 281964, "epoch": 3397} {"train_loss": -25.605960845947266, "global_step": 281965, "epoch": 3397} {"train_loss": -25.47527503967285, "global_step": 281966, "epoch": 3397} {"train_loss": -25.326868057250977, "global_step": 281967, "epoch": 3397} {"train_loss": -25.07647705078125, "global_step": 281968, "epoch": 3397} {"train_loss": -25.48929786682129, "global_step": 281969, "epoch": 3397} {"train_loss": -25.690759658813477, "global_step": 281970, "epoch": 3397} {"train_loss": -25.43750762939453, "global_step": 281971, "epoch": 3397} {"train_loss": -25.459020614624023, "global_step": 281972, "epoch": 3397} {"train_loss": -25.17789649963379, "global_step": 281973, "epoch": 3397} {"train_loss": -25.590192794799805, "global_step": 281974, "epoch": 3397} {"train_loss": -24.978498458862305, "global_step": 281975, "epoch": 3397} {"train_loss": -25.259830474853516, "global_step": 281976, "epoch": 3397} {"train_loss": -24.996450424194336, "global_step": 281977, "epoch": 3397} {"train_loss": -25.279699325561523, "global_step": 281978, "epoch": 3397} {"train_loss": -25.749042510986328, "global_step": 281979, "epoch": 3397} {"train_loss": -25.01572608947754, "global_step": 281980, "epoch": 3397} {"train_loss": -25.6162052154541, "global_step": 281981, "epoch": 3397} {"train_loss": -25.7849063873291, "global_step": 281982, "epoch": 3397} {"train_loss": -25.426862716674805, "global_step": 281983, "epoch": 3397} {"train_loss": -25.206167221069336, "global_step": 281984, "epoch": 3397} {"train_loss": -25.605390548706055, "global_step": 281985, "epoch": 3397} {"train_loss": -25.600711822509766, "global_step": 281986, "epoch": 3397} {"train_loss": -25.638341903686523, "global_step": 281987, "epoch": 3397} {"train_loss": -25.59516716003418, "global_step": 281988, "epoch": 3397} {"train_loss": -25.461950302124023, "global_step": 281989, "epoch": 3397} {"train_loss": -25.376813888549805, "global_step": 281990, "epoch": 3397} {"train_loss": -25.890766143798828, "global_step": 281991, "epoch": 3397} {"train_loss": -25.24924087524414, "global_step": 281992, "epoch": 3397} {"train_loss": -25.73554039001465, "global_step": 281993, "epoch": 3397} {"train_loss": -25.280420303344727, "global_step": 281994, "epoch": 3397} {"train_loss": -25.366018295288086, "global_step": 281995, "epoch": 3397} {"train_loss": -26.001501083374023, "global_step": 281996, "epoch": 3397} {"train_loss": -25.462060928344727, "global_step": 281997, "epoch": 3397} {"train_loss": -25.34769630432129, "global_step": 281998, "epoch": 3397} {"train_loss": -25.400928497314453, "global_step": 281999, "epoch": 3397} {"train_loss": -25.62054443359375, "global_step": 282000, "epoch": 3397} {"train_loss": -25.424264907836914, "global_step": 282001, "epoch": 3397} {"train_loss": -25.424972534179688, "global_step": 282002, "epoch": 3397} {"train_loss": -25.414323806762695, "global_step": 282003, "epoch": 3397} {"train_loss": -25.301204681396484, "global_step": 282004, "epoch": 3397} {"train_loss": -25.682050704956055, "global_step": 282005, "epoch": 3397} {"train_loss": -25.18601417541504, "global_step": 282006, "epoch": 3397} {"train_loss": -25.040618896484375, "global_step": 282007, "epoch": 3397} {"train_loss": -25.244470596313477, "global_step": 282008, "epoch": 3397} {"train_loss": -25.684823989868164, "global_step": 282009, "epoch": 3397} {"train_loss": -25.819293975830078, "global_step": 282010, "epoch": 3397} {"train_loss": -25.607709884643555, "global_step": 282011, "epoch": 3397} {"train_loss": -25.552940368652344, "global_step": 282012, "epoch": 3397} {"train_loss": -25.492618560791016, "global_step": 282013, "epoch": 3397} {"train_loss": -25.551328659057617, "global_step": 282014, "epoch": 3397} {"train_loss": -25.59956932067871, "global_step": 282015, "epoch": 3397} {"train_loss": -25.49054718017578, "global_step": 282016, "epoch": 3397} {"train_loss": -25.457687377929688, "global_step": 282017, "epoch": 3397} {"train_loss": -25.605289459228516, "global_step": 282018, "epoch": 3397} {"train_loss": -25.466032028198242, "global_step": 282019, "epoch": 3397} {"train_loss": -25.527799606323242, "global_step": 282020, "epoch": 3397} {"train_loss": -25.403501510620117, "global_step": 282021, "epoch": 3397} {"train_loss": -25.084569931030273, "global_step": 282022, "epoch": 3397} {"train_loss": -24.914352416992188, "global_step": 282023, "epoch": 3397} {"train_loss": -24.796716690063477, "global_step": 282024, "epoch": 3397} {"train_loss": -24.99716567993164, "global_step": 282025, "epoch": 3397} {"train_loss": -24.914819717407227, "global_step": 282026, "epoch": 3397} {"train_loss": -25.12797737121582, "global_step": 282027, "epoch": 3397} {"train_loss": -24.98225212097168, "global_step": 282028, "epoch": 3397} {"train_loss": -25.6126651763916, "global_step": 282029, "epoch": 3397} {"train_loss": -25.04973793029785, "global_step": 282030, "epoch": 3397} {"train_loss": -25.319110870361328, "global_step": 282031, "epoch": 3397} {"train_loss": -25.526472091674805, "global_step": 282032, "epoch": 3397} {"train_loss": -25.346301366047687, "global_step": 282033, "epoch": 3397, "val_loss": 6995781.5} {"train_loss": -23.888912200927734, "global_step": 282034, "epoch": 3398} {"train_loss": -24.330495834350586, "global_step": 282035, "epoch": 3398} {"train_loss": -24.42279624938965, "global_step": 282036, "epoch": 3398} {"train_loss": -24.2981014251709, "global_step": 282037, "epoch": 3398} {"train_loss": -24.89790153503418, "global_step": 282038, "epoch": 3398} {"train_loss": -24.70476722717285, "global_step": 282039, "epoch": 3398} {"train_loss": -24.83837890625, "global_step": 282040, "epoch": 3398} {"train_loss": -24.764278411865234, "global_step": 282041, "epoch": 3398} {"train_loss": -25.00937843322754, "global_step": 282042, "epoch": 3398} {"train_loss": -24.90773582458496, "global_step": 282043, "epoch": 3398} {"train_loss": -25.010772705078125, "global_step": 282044, "epoch": 3398} {"train_loss": -24.730026245117188, "global_step": 282045, "epoch": 3398} {"train_loss": -24.577268600463867, "global_step": 282046, "epoch": 3398} {"train_loss": -25.21636199951172, "global_step": 282047, "epoch": 3398} {"train_loss": -25.072586059570312, "global_step": 282048, "epoch": 3398} {"train_loss": -24.92870330810547, "global_step": 282049, "epoch": 3398} {"train_loss": -25.2681941986084, "global_step": 282050, "epoch": 3398} {"train_loss": -24.985937118530273, "global_step": 282051, "epoch": 3398} {"train_loss": -25.142704010009766, "global_step": 282052, "epoch": 3398} {"train_loss": -25.105417251586914, "global_step": 282053, "epoch": 3398} {"train_loss": -25.421335220336914, "global_step": 282054, "epoch": 3398} {"train_loss": -24.979755401611328, "global_step": 282055, "epoch": 3398} {"train_loss": -25.180694580078125, "global_step": 282056, "epoch": 3398} {"train_loss": -25.364105224609375, "global_step": 282057, "epoch": 3398} {"train_loss": -25.54060935974121, "global_step": 282058, "epoch": 3398} {"train_loss": -24.959497451782227, "global_step": 282059, "epoch": 3398} {"train_loss": -24.999799728393555, "global_step": 282060, "epoch": 3398} {"train_loss": -25.176334381103516, "global_step": 282061, "epoch": 3398} {"train_loss": -25.256052017211914, "global_step": 282062, "epoch": 3398} {"train_loss": -25.555883407592773, "global_step": 282063, "epoch": 3398} {"train_loss": -25.2047119140625, "global_step": 282064, "epoch": 3398} {"train_loss": -25.586572647094727, "global_step": 282065, "epoch": 3398} {"train_loss": -25.307592391967773, "global_step": 282066, "epoch": 3398} {"train_loss": -25.43735122680664, "global_step": 282067, "epoch": 3398} {"train_loss": -25.476789474487305, "global_step": 282068, "epoch": 3398} {"train_loss": -25.625436782836914, "global_step": 282069, "epoch": 3398} {"train_loss": -25.45039176940918, "global_step": 282070, "epoch": 3398} {"train_loss": -25.70796012878418, "global_step": 282071, "epoch": 3398} {"train_loss": -25.547399520874023, "global_step": 282072, "epoch": 3398} {"train_loss": -25.431272506713867, "global_step": 282073, "epoch": 3398} {"train_loss": -25.667499542236328, "global_step": 282074, "epoch": 3398} {"train_loss": -25.075952529907227, "global_step": 282075, "epoch": 3398} {"train_loss": -25.367597579956055, "global_step": 282076, "epoch": 3398} {"train_loss": -25.576095581054688, "global_step": 282077, "epoch": 3398} {"train_loss": -25.497400283813477, "global_step": 282078, "epoch": 3398} {"train_loss": -25.234704971313477, "global_step": 282079, "epoch": 3398} {"train_loss": -24.900388717651367, "global_step": 282080, "epoch": 3398} {"train_loss": -25.92970085144043, "global_step": 282081, "epoch": 3398} {"train_loss": -25.227054595947266, "global_step": 282082, "epoch": 3398} {"train_loss": -25.509031295776367, "global_step": 282083, "epoch": 3398} {"train_loss": -25.52149772644043, "global_step": 282084, "epoch": 3398} {"train_loss": -24.884252548217773, "global_step": 282085, "epoch": 3398} {"train_loss": -25.445072174072266, "global_step": 282086, "epoch": 3398} {"train_loss": -25.309751510620117, "global_step": 282087, "epoch": 3398} {"train_loss": -25.7712345123291, "global_step": 282088, "epoch": 3398} {"train_loss": -25.48781394958496, "global_step": 282089, "epoch": 3398} {"train_loss": -25.373411178588867, "global_step": 282090, "epoch": 3398} {"train_loss": -25.50508689880371, "global_step": 282091, "epoch": 3398} {"train_loss": -25.399412155151367, "global_step": 282092, "epoch": 3398} {"train_loss": -25.7293701171875, "global_step": 282093, "epoch": 3398} {"train_loss": -25.49416160583496, "global_step": 282094, "epoch": 3398} {"train_loss": -25.457975387573242, "global_step": 282095, "epoch": 3398} {"train_loss": -25.117000579833984, "global_step": 282096, "epoch": 3398} {"train_loss": -25.72132682800293, "global_step": 282097, "epoch": 3398} {"train_loss": -25.327600479125977, "global_step": 282098, "epoch": 3398} {"train_loss": -25.108478546142578, "global_step": 282099, "epoch": 3398} {"train_loss": -25.337207794189453, "global_step": 282100, "epoch": 3398} {"train_loss": -25.573440551757812, "global_step": 282101, "epoch": 3398} {"train_loss": -25.395912170410156, "global_step": 282102, "epoch": 3398} {"train_loss": -25.609928131103516, "global_step": 282103, "epoch": 3398} {"train_loss": -25.293838500976562, "global_step": 282104, "epoch": 3398} {"train_loss": -24.98593521118164, "global_step": 282105, "epoch": 3398} {"train_loss": -25.317651748657227, "global_step": 282106, "epoch": 3398} {"train_loss": -25.369853973388672, "global_step": 282107, "epoch": 3398} {"train_loss": -25.706974029541016, "global_step": 282108, "epoch": 3398} {"train_loss": -25.621326446533203, "global_step": 282109, "epoch": 3398} {"train_loss": -25.192108154296875, "global_step": 282110, "epoch": 3398} {"train_loss": -25.465993881225586, "global_step": 282111, "epoch": 3398} {"train_loss": -25.363615036010742, "global_step": 282112, "epoch": 3398} {"train_loss": -25.56482696533203, "global_step": 282113, "epoch": 3398} {"train_loss": -25.45863914489746, "global_step": 282114, "epoch": 3398} {"train_loss": -25.46202850341797, "global_step": 282115, "epoch": 3398} {"train_loss": -25.243719032011835, "global_step": 282116, "epoch": 3398, "val_loss": 7082124.0} {"train_loss": -25.150270462036133, "global_step": 282117, "epoch": 3399} {"train_loss": -25.47871208190918, "global_step": 282118, "epoch": 3399} {"train_loss": -25.11172866821289, "global_step": 282119, "epoch": 3399} {"train_loss": -25.331960678100586, "global_step": 282120, "epoch": 3399} {"train_loss": -25.49894142150879, "global_step": 282121, "epoch": 3399} {"train_loss": -24.875289916992188, "global_step": 282122, "epoch": 3399} {"train_loss": -25.13666343688965, "global_step": 282123, "epoch": 3399} {"train_loss": -25.06898307800293, "global_step": 282124, "epoch": 3399} {"train_loss": -24.90422248840332, "global_step": 282125, "epoch": 3399} {"train_loss": -25.29109764099121, "global_step": 282126, "epoch": 3399} {"train_loss": -25.509145736694336, "global_step": 282127, "epoch": 3399} {"train_loss": -25.13304901123047, "global_step": 282128, "epoch": 3399} {"train_loss": -25.76972007751465, "global_step": 282129, "epoch": 3399} {"train_loss": -24.994489669799805, "global_step": 282130, "epoch": 3399} {"train_loss": -25.26588249206543, "global_step": 282131, "epoch": 3399} {"train_loss": -25.379314422607422, "global_step": 282132, "epoch": 3399} {"train_loss": -25.113758087158203, "global_step": 282133, "epoch": 3399} {"train_loss": -25.26466178894043, "global_step": 282134, "epoch": 3399} {"train_loss": -25.198972702026367, "global_step": 282135, "epoch": 3399} {"train_loss": -25.19842529296875, "global_step": 282136, "epoch": 3399} {"train_loss": -26.056848526000977, "global_step": 282137, "epoch": 3399} {"train_loss": -25.410154342651367, "global_step": 282138, "epoch": 3399} {"train_loss": -25.516626358032227, "global_step": 282139, "epoch": 3399} {"train_loss": -25.486562728881836, "global_step": 282140, "epoch": 3399} {"train_loss": -25.299741744995117, "global_step": 282141, "epoch": 3399} {"train_loss": -25.26970863342285, "global_step": 282142, "epoch": 3399} {"train_loss": -24.906457901000977, "global_step": 282143, "epoch": 3399} {"train_loss": -25.4360294342041, "global_step": 282144, "epoch": 3399} {"train_loss": -25.761754989624023, "global_step": 282145, "epoch": 3399} {"train_loss": -25.130329132080078, "global_step": 282146, "epoch": 3399} {"train_loss": -25.339521408081055, "global_step": 282147, "epoch": 3399} {"train_loss": -25.09988784790039, "global_step": 282148, "epoch": 3399} {"train_loss": -25.453580856323242, "global_step": 282149, "epoch": 3399} {"train_loss": -25.134824752807617, "global_step": 282150, "epoch": 3399} {"train_loss": -25.41009521484375, "global_step": 282151, "epoch": 3399} {"train_loss": -25.49590492248535, "global_step": 282152, "epoch": 3399} {"train_loss": -25.45272445678711, "global_step": 282153, "epoch": 3399} {"train_loss": -25.352554321289062, "global_step": 282154, "epoch": 3399} {"train_loss": -25.774694442749023, "global_step": 282155, "epoch": 3399} {"train_loss": -25.34395408630371, "global_step": 282156, "epoch": 3399} {"train_loss": -25.39711570739746, "global_step": 282157, "epoch": 3399} {"train_loss": -25.68003273010254, "global_step": 282158, "epoch": 3399} {"train_loss": -25.453968048095703, "global_step": 282159, "epoch": 3399} {"train_loss": -25.353391647338867, "global_step": 282160, "epoch": 3399} {"train_loss": -25.789072036743164, "global_step": 282161, "epoch": 3399} {"train_loss": -25.4583797454834, "global_step": 282162, "epoch": 3399} {"train_loss": -25.537559509277344, "global_step": 282163, "epoch": 3399} {"train_loss": -25.35529136657715, "global_step": 282164, "epoch": 3399} {"train_loss": -25.347131729125977, "global_step": 282165, "epoch": 3399} {"train_loss": -25.430051803588867, "global_step": 282166, "epoch": 3399} {"train_loss": -25.377471923828125, "global_step": 282167, "epoch": 3399} {"train_loss": -25.09710693359375, "global_step": 282168, "epoch": 3399} {"train_loss": -25.49092674255371, "global_step": 282169, "epoch": 3399} {"train_loss": -25.44866180419922, "global_step": 282170, "epoch": 3399} {"train_loss": -24.950756072998047, "global_step": 282171, "epoch": 3399} {"train_loss": -25.547622680664062, "global_step": 282172, "epoch": 3399} {"train_loss": -25.2100772857666, "global_step": 282173, "epoch": 3399} {"train_loss": -25.0762939453125, "global_step": 282174, "epoch": 3399} {"train_loss": -25.37650489807129, "global_step": 282175, "epoch": 3399} {"train_loss": -25.412084579467773, "global_step": 282176, "epoch": 3399} {"train_loss": -25.428667068481445, "global_step": 282177, "epoch": 3399} {"train_loss": -25.6373233795166, "global_step": 282178, "epoch": 3399} {"train_loss": -25.561655044555664, "global_step": 282179, "epoch": 3399} {"train_loss": -25.64192008972168, "global_step": 282180, "epoch": 3399} {"train_loss": -25.307126998901367, "global_step": 282181, "epoch": 3399} {"train_loss": -25.647802352905273, "global_step": 282182, "epoch": 3399} {"train_loss": -25.277587890625, "global_step": 282183, "epoch": 3399} {"train_loss": -25.44855308532715, "global_step": 282184, "epoch": 3399} {"train_loss": -25.458932876586914, "global_step": 282185, "epoch": 3399} {"train_loss": -25.63580894470215, "global_step": 282186, "epoch": 3399} {"train_loss": -25.45926856994629, "global_step": 282187, "epoch": 3399} {"train_loss": -25.6245174407959, "global_step": 282188, "epoch": 3399} {"train_loss": -25.774250030517578, "global_step": 282189, "epoch": 3399} {"train_loss": -25.748111724853516, "global_step": 282190, "epoch": 3399} {"train_loss": -25.552810668945312, "global_step": 282191, "epoch": 3399} {"train_loss": -25.2759952545166, "global_step": 282192, "epoch": 3399} {"train_loss": -25.805185317993164, "global_step": 282193, "epoch": 3399} {"train_loss": -25.212717056274414, "global_step": 282194, "epoch": 3399} {"train_loss": -25.407155990600586, "global_step": 282195, "epoch": 3399} {"train_loss": -25.59928321838379, "global_step": 282196, "epoch": 3399} {"train_loss": -25.6232967376709, "global_step": 282197, "epoch": 3399} {"train_loss": -25.202320098876953, "global_step": 282198, "epoch": 3399} {"train_loss": -25.370838188263306, "global_step": 282199, "epoch": 3399, "val_loss": 7093043.0} {"train_loss": -25.43115234375, "global_step": 282200, "epoch": 3400} {"train_loss": -25.41131591796875, "global_step": 282201, "epoch": 3400} {"train_loss": -25.353666305541992, "global_step": 282202, "epoch": 3400} {"train_loss": -25.323575973510742, "global_step": 282203, "epoch": 3400} {"train_loss": -25.196834564208984, "global_step": 282204, "epoch": 3400} {"train_loss": -25.046993255615234, "global_step": 282205, "epoch": 3400} {"train_loss": -25.03518295288086, "global_step": 282206, "epoch": 3400} {"train_loss": -25.178014755249023, "global_step": 282207, "epoch": 3400} {"train_loss": -25.24018669128418, "global_step": 282208, "epoch": 3400} {"train_loss": -24.658767700195312, "global_step": 282209, "epoch": 3400} {"train_loss": -25.190723419189453, "global_step": 282210, "epoch": 3400} {"train_loss": -25.080930709838867, "global_step": 282211, "epoch": 3400} {"train_loss": -25.04487419128418, "global_step": 282212, "epoch": 3400} {"train_loss": -24.879289627075195, "global_step": 282213, "epoch": 3400} {"train_loss": -24.985244750976562, "global_step": 282214, "epoch": 3400} {"train_loss": -25.12391471862793, "global_step": 282215, "epoch": 3400} {"train_loss": -25.11220932006836, "global_step": 282216, "epoch": 3400} {"train_loss": -25.092435836791992, "global_step": 282217, "epoch": 3400} {"train_loss": -25.05732536315918, "global_step": 282218, "epoch": 3400} {"train_loss": -25.42950439453125, "global_step": 282219, "epoch": 3400} {"train_loss": -24.94622230529785, "global_step": 282220, "epoch": 3400} {"train_loss": -25.538984298706055, "global_step": 282221, "epoch": 3400} {"train_loss": -25.37973976135254, "global_step": 282222, "epoch": 3400} {"train_loss": -25.713491439819336, "global_step": 282223, "epoch": 3400} {"train_loss": -25.605688095092773, "global_step": 282224, "epoch": 3400} {"train_loss": -25.318622589111328, "global_step": 282225, "epoch": 3400} {"train_loss": -25.246366500854492, "global_step": 282226, "epoch": 3400} {"train_loss": -25.532751083374023, "global_step": 282227, "epoch": 3400} {"train_loss": -25.15765953063965, "global_step": 282228, "epoch": 3400} {"train_loss": -25.73797035217285, "global_step": 282229, "epoch": 3400} {"train_loss": -25.722925186157227, "global_step": 282230, "epoch": 3400} {"train_loss": -25.51003074645996, "global_step": 282231, "epoch": 3400} {"train_loss": -25.289716720581055, "global_step": 282232, "epoch": 3400} {"train_loss": -25.38129997253418, "global_step": 282233, "epoch": 3400} {"train_loss": -25.762006759643555, "global_step": 282234, "epoch": 3400} {"train_loss": -25.54811668395996, "global_step": 282235, "epoch": 3400} {"train_loss": -25.493793487548828, "global_step": 282236, "epoch": 3400} {"train_loss": -25.148571014404297, "global_step": 282237, "epoch": 3400} {"train_loss": -25.601730346679688, "global_step": 282238, "epoch": 3400} {"train_loss": -25.552234649658203, "global_step": 282239, "epoch": 3400} {"train_loss": -25.57671546936035, "global_step": 282240, "epoch": 3400} {"train_loss": -25.6924991607666, "global_step": 282241, "epoch": 3400} {"train_loss": -25.721052169799805, "global_step": 282242, "epoch": 3400} {"train_loss": -25.459943771362305, "global_step": 282243, "epoch": 3400} {"train_loss": -25.627450942993164, "global_step": 282244, "epoch": 3400} {"train_loss": -25.678943634033203, "global_step": 282245, "epoch": 3400} {"train_loss": -25.62940788269043, "global_step": 282246, "epoch": 3400} {"train_loss": -25.354700088500977, "global_step": 282247, "epoch": 3400} {"train_loss": -25.67316246032715, "global_step": 282248, "epoch": 3400} {"train_loss": -25.30263328552246, "global_step": 282249, "epoch": 3400} {"train_loss": -25.544530868530273, "global_step": 282250, "epoch": 3400} {"train_loss": -25.195613861083984, "global_step": 282251, "epoch": 3400} {"train_loss": -25.29107093811035, "global_step": 282252, "epoch": 3400} {"train_loss": -25.25783348083496, "global_step": 282253, "epoch": 3400} {"train_loss": -25.45680046081543, "global_step": 282254, "epoch": 3400} {"train_loss": -25.12761878967285, "global_step": 282255, "epoch": 3400} {"train_loss": -25.20172882080078, "global_step": 282256, "epoch": 3400} {"train_loss": -25.490467071533203, "global_step": 282257, "epoch": 3400} {"train_loss": -25.45391273498535, "global_step": 282258, "epoch": 3400} {"train_loss": -25.309186935424805, "global_step": 282259, "epoch": 3400} {"train_loss": -25.466581344604492, "global_step": 282260, "epoch": 3400} {"train_loss": -25.057336807250977, "global_step": 282261, "epoch": 3400} {"train_loss": -25.707904815673828, "global_step": 282262, "epoch": 3400} {"train_loss": -25.13055419921875, "global_step": 282263, "epoch": 3400} {"train_loss": -25.486942291259766, "global_step": 282264, "epoch": 3400} {"train_loss": -25.48915672302246, "global_step": 282265, "epoch": 3400} {"train_loss": -25.531173706054688, "global_step": 282266, "epoch": 3400} {"train_loss": -25.34621238708496, "global_step": 282267, "epoch": 3400} {"train_loss": -25.690637588500977, "global_step": 282268, "epoch": 3400} {"train_loss": -25.35236358642578, "global_step": 282269, "epoch": 3400} {"train_loss": -25.5284423828125, "global_step": 282270, "epoch": 3400} {"train_loss": -25.362768173217773, "global_step": 282271, "epoch": 3400} {"train_loss": -25.858190536499023, "global_step": 282272, "epoch": 3400} {"train_loss": -24.994382858276367, "global_step": 282273, "epoch": 3400} {"train_loss": -25.5771484375, "global_step": 282274, "epoch": 3400} {"train_loss": -25.535240173339844, "global_step": 282275, "epoch": 3400} {"train_loss": -25.78278923034668, "global_step": 282276, "epoch": 3400} {"train_loss": -25.285797119140625, "global_step": 282277, "epoch": 3400} {"train_loss": -25.144508361816406, "global_step": 282278, "epoch": 3400} {"train_loss": -25.545583724975586, "global_step": 282279, "epoch": 3400} {"train_loss": -25.628332138061523, "global_step": 282280, "epoch": 3400} {"train_loss": -25.926025390625, "global_step": 282281, "epoch": 3400} {"train_loss": -25.379348892763435, "global_step": 282282, "epoch": 3400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 7052055.0} {"train_loss": -24.95514488220215, "global_step": 282283, "epoch": 3401} {"train_loss": -24.502403259277344, "global_step": 282284, "epoch": 3401} {"train_loss": -25.211225509643555, "global_step": 282285, "epoch": 3401} {"train_loss": -25.092920303344727, "global_step": 282286, "epoch": 3401} {"train_loss": -25.030790328979492, "global_step": 282287, "epoch": 3401} {"train_loss": -25.3188533782959, "global_step": 282288, "epoch": 3401} {"train_loss": -24.77655792236328, "global_step": 282289, "epoch": 3401} {"train_loss": -25.60312271118164, "global_step": 282290, "epoch": 3401} {"train_loss": -25.600677490234375, "global_step": 282291, "epoch": 3401} {"train_loss": -24.693105697631836, "global_step": 282292, "epoch": 3401} {"train_loss": -25.448394775390625, "global_step": 282293, "epoch": 3401} {"train_loss": -25.224599838256836, "global_step": 282294, "epoch": 3401} {"train_loss": -24.997156143188477, "global_step": 282295, "epoch": 3401} {"train_loss": -25.36819839477539, "global_step": 282296, "epoch": 3401} {"train_loss": -25.07952308654785, "global_step": 282297, "epoch": 3401} {"train_loss": -25.08367919921875, "global_step": 282298, "epoch": 3401} {"train_loss": -25.522783279418945, "global_step": 282299, "epoch": 3401} {"train_loss": -25.69009780883789, "global_step": 282300, "epoch": 3401} {"train_loss": -25.454957962036133, "global_step": 282301, "epoch": 3401} {"train_loss": -25.557659149169922, "global_step": 282302, "epoch": 3401} {"train_loss": -25.406513214111328, "global_step": 282303, "epoch": 3401} {"train_loss": -25.41730308532715, "global_step": 282304, "epoch": 3401} {"train_loss": -25.35514259338379, "global_step": 282305, "epoch": 3401} {"train_loss": -25.281009674072266, "global_step": 282306, "epoch": 3401} {"train_loss": -25.64143180847168, "global_step": 282307, "epoch": 3401} {"train_loss": -25.572412490844727, "global_step": 282308, "epoch": 3401} {"train_loss": -25.39598846435547, "global_step": 282309, "epoch": 3401} {"train_loss": -25.780866622924805, "global_step": 282310, "epoch": 3401} {"train_loss": -25.441608428955078, "global_step": 282311, "epoch": 3401} {"train_loss": -25.4293270111084, "global_step": 282312, "epoch": 3401} {"train_loss": -25.522369384765625, "global_step": 282313, "epoch": 3401} {"train_loss": -25.570358276367188, "global_step": 282314, "epoch": 3401} {"train_loss": -25.58570098876953, "global_step": 282315, "epoch": 3401} {"train_loss": -25.282278060913086, "global_step": 282316, "epoch": 3401} {"train_loss": -25.353830337524414, "global_step": 282317, "epoch": 3401} {"train_loss": -25.554349899291992, "global_step": 282318, "epoch": 3401} {"train_loss": -25.21390151977539, "global_step": 282319, "epoch": 3401} {"train_loss": -25.788314819335938, "global_step": 282320, "epoch": 3401} {"train_loss": -25.27709197998047, "global_step": 282321, "epoch": 3401} {"train_loss": -25.523290634155273, "global_step": 282322, "epoch": 3401} {"train_loss": -25.769529342651367, "global_step": 282323, "epoch": 3401} {"train_loss": -25.13154411315918, "global_step": 282324, "epoch": 3401} {"train_loss": -25.65915870666504, "global_step": 282325, "epoch": 3401} {"train_loss": -25.626550674438477, "global_step": 282326, "epoch": 3401} {"train_loss": -25.16698455810547, "global_step": 282327, "epoch": 3401} {"train_loss": -25.38260841369629, "global_step": 282328, "epoch": 3401} {"train_loss": -25.17211151123047, "global_step": 282329, "epoch": 3401} {"train_loss": -25.367591857910156, "global_step": 282330, "epoch": 3401} {"train_loss": -25.24297523498535, "global_step": 282331, "epoch": 3401} {"train_loss": -25.093217849731445, "global_step": 282332, "epoch": 3401} {"train_loss": -25.495786666870117, "global_step": 282333, "epoch": 3401} {"train_loss": -25.097780227661133, "global_step": 282334, "epoch": 3401} {"train_loss": -25.541433334350586, "global_step": 282335, "epoch": 3401} {"train_loss": -25.09908103942871, "global_step": 282336, "epoch": 3401} {"train_loss": -25.688446044921875, "global_step": 282337, "epoch": 3401} {"train_loss": -25.66814613342285, "global_step": 282338, "epoch": 3401} {"train_loss": -25.2821102142334, "global_step": 282339, "epoch": 3401} {"train_loss": -25.429590225219727, "global_step": 282340, "epoch": 3401} {"train_loss": -25.29221534729004, "global_step": 282341, "epoch": 3401} {"train_loss": -25.4777774810791, "global_step": 282342, "epoch": 3401} {"train_loss": -25.35991096496582, "global_step": 282343, "epoch": 3401} {"train_loss": -25.640613555908203, "global_step": 282344, "epoch": 3401} {"train_loss": -25.45419692993164, "global_step": 282345, "epoch": 3401} {"train_loss": -25.65399742126465, "global_step": 282346, "epoch": 3401} {"train_loss": -25.207258224487305, "global_step": 282347, "epoch": 3401} {"train_loss": -25.273653030395508, "global_step": 282348, "epoch": 3401} {"train_loss": -25.323007583618164, "global_step": 282349, "epoch": 3401} {"train_loss": -24.700246810913086, "global_step": 282350, "epoch": 3401} {"train_loss": -25.10890007019043, "global_step": 282351, "epoch": 3401} {"train_loss": -25.089296340942383, "global_step": 282352, "epoch": 3401} {"train_loss": -25.29148292541504, "global_step": 282353, "epoch": 3401} {"train_loss": -25.73396110534668, "global_step": 282354, "epoch": 3401} {"train_loss": -25.603742599487305, "global_step": 282355, "epoch": 3401} {"train_loss": -25.108251571655273, "global_step": 282356, "epoch": 3401} {"train_loss": -25.13045310974121, "global_step": 282357, "epoch": 3401} {"train_loss": -25.57000732421875, "global_step": 282358, "epoch": 3401} {"train_loss": -25.27620506286621, "global_step": 282359, "epoch": 3401} {"train_loss": -25.24073028564453, "global_step": 282360, "epoch": 3401} {"train_loss": -25.03982162475586, "global_step": 282361, "epoch": 3401} {"train_loss": -25.40157127380371, "global_step": 282362, "epoch": 3401} {"train_loss": -25.18487548828125, "global_step": 282363, "epoch": 3401} {"train_loss": -25.269384384155273, "global_step": 282364, "epoch": 3401} {"train_loss": -25.36756851012448, "global_step": 282365, "epoch": 3401, "val_loss": 7021261.0} {"train_loss": -25.492475509643555, "global_step": 282366, "epoch": 3402} {"train_loss": -25.377710342407227, "global_step": 282367, "epoch": 3402} {"train_loss": -25.319068908691406, "global_step": 282368, "epoch": 3402} {"train_loss": -25.117450714111328, "global_step": 282369, "epoch": 3402} {"train_loss": -24.979434967041016, "global_step": 282370, "epoch": 3402} {"train_loss": -25.09149169921875, "global_step": 282371, "epoch": 3402} {"train_loss": -25.471725463867188, "global_step": 282372, "epoch": 3402} {"train_loss": -25.290742874145508, "global_step": 282373, "epoch": 3402} {"train_loss": -25.349279403686523, "global_step": 282374, "epoch": 3402} {"train_loss": -25.351293563842773, "global_step": 282375, "epoch": 3402} {"train_loss": -25.418092727661133, "global_step": 282376, "epoch": 3402} {"train_loss": -25.331207275390625, "global_step": 282377, "epoch": 3402} {"train_loss": -25.309337615966797, "global_step": 282378, "epoch": 3402} {"train_loss": -25.488739013671875, "global_step": 282379, "epoch": 3402} {"train_loss": -25.48602294921875, "global_step": 282380, "epoch": 3402} {"train_loss": -25.50135612487793, "global_step": 282381, "epoch": 3402} {"train_loss": -25.731922149658203, "global_step": 282382, "epoch": 3402} {"train_loss": -25.236156463623047, "global_step": 282383, "epoch": 3402} {"train_loss": -25.726459503173828, "global_step": 282384, "epoch": 3402} {"train_loss": -25.661579132080078, "global_step": 282385, "epoch": 3402} {"train_loss": -25.211734771728516, "global_step": 282386, "epoch": 3402} {"train_loss": -25.627079010009766, "global_step": 282387, "epoch": 3402} {"train_loss": -25.375436782836914, "global_step": 282388, "epoch": 3402} {"train_loss": -25.469566345214844, "global_step": 282389, "epoch": 3402} {"train_loss": -25.815107345581055, "global_step": 282390, "epoch": 3402} {"train_loss": -25.26349449157715, "global_step": 282391, "epoch": 3402} {"train_loss": -25.538179397583008, "global_step": 282392, "epoch": 3402} {"train_loss": -25.63031578063965, "global_step": 282393, "epoch": 3402} {"train_loss": -25.74091911315918, "global_step": 282394, "epoch": 3402} {"train_loss": -25.264535903930664, "global_step": 282395, "epoch": 3402} {"train_loss": -25.695844650268555, "global_step": 282396, "epoch": 3402} {"train_loss": -25.384557723999023, "global_step": 282397, "epoch": 3402} {"train_loss": -25.274770736694336, "global_step": 282398, "epoch": 3402} {"train_loss": -25.246366500854492, "global_step": 282399, "epoch": 3402} {"train_loss": -25.135608673095703, "global_step": 282400, "epoch": 3402} {"train_loss": -25.504640579223633, "global_step": 282401, "epoch": 3402} {"train_loss": -25.7696590423584, "global_step": 282402, "epoch": 3402} {"train_loss": -25.805831909179688, "global_step": 282403, "epoch": 3402} {"train_loss": -25.441450119018555, "global_step": 282404, "epoch": 3402} {"train_loss": -25.183856964111328, "global_step": 282405, "epoch": 3402} {"train_loss": -24.879913330078125, "global_step": 282406, "epoch": 3402} {"train_loss": -25.04703140258789, "global_step": 282407, "epoch": 3402} {"train_loss": -25.63636589050293, "global_step": 282408, "epoch": 3402} {"train_loss": -25.417659759521484, "global_step": 282409, "epoch": 3402} {"train_loss": -24.992839813232422, "global_step": 282410, "epoch": 3402} {"train_loss": -25.53675651550293, "global_step": 282411, "epoch": 3402} {"train_loss": -25.505643844604492, "global_step": 282412, "epoch": 3402} {"train_loss": -25.56108283996582, "global_step": 282413, "epoch": 3402} {"train_loss": -25.662343978881836, "global_step": 282414, "epoch": 3402} {"train_loss": -25.364994049072266, "global_step": 282415, "epoch": 3402} {"train_loss": -25.40230941772461, "global_step": 282416, "epoch": 3402} {"train_loss": -25.824338912963867, "global_step": 282417, "epoch": 3402} {"train_loss": -25.422842025756836, "global_step": 282418, "epoch": 3402} {"train_loss": -25.66619873046875, "global_step": 282419, "epoch": 3402} {"train_loss": -25.207029342651367, "global_step": 282420, "epoch": 3402} {"train_loss": -25.274581909179688, "global_step": 282421, "epoch": 3402} {"train_loss": -25.306177139282227, "global_step": 282422, "epoch": 3402} {"train_loss": -25.47468376159668, "global_step": 282423, "epoch": 3402} {"train_loss": -25.57186508178711, "global_step": 282424, "epoch": 3402} {"train_loss": -25.425365447998047, "global_step": 282425, "epoch": 3402} {"train_loss": -25.380428314208984, "global_step": 282426, "epoch": 3402} {"train_loss": -25.546537399291992, "global_step": 282427, "epoch": 3402} {"train_loss": -25.335529327392578, "global_step": 282428, "epoch": 3402} {"train_loss": -25.783233642578125, "global_step": 282429, "epoch": 3402} {"train_loss": -25.7520809173584, "global_step": 282430, "epoch": 3402} {"train_loss": -25.437780380249023, "global_step": 282431, "epoch": 3402} {"train_loss": -25.28045082092285, "global_step": 282432, "epoch": 3402} {"train_loss": -25.313383102416992, "global_step": 282433, "epoch": 3402} {"train_loss": -25.288732528686523, "global_step": 282434, "epoch": 3402} {"train_loss": -25.630661010742188, "global_step": 282435, "epoch": 3402} {"train_loss": -25.218769073486328, "global_step": 282436, "epoch": 3402} {"train_loss": -25.39047622680664, "global_step": 282437, "epoch": 3402} {"train_loss": -25.401031494140625, "global_step": 282438, "epoch": 3402} {"train_loss": -24.946027755737305, "global_step": 282439, "epoch": 3402} {"train_loss": -25.286405563354492, "global_step": 282440, "epoch": 3402} {"train_loss": -24.986051559448242, "global_step": 282441, "epoch": 3402} {"train_loss": -25.5267333984375, "global_step": 282442, "epoch": 3402} {"train_loss": -25.56752586364746, "global_step": 282443, "epoch": 3402} {"train_loss": -25.86005973815918, "global_step": 282444, "epoch": 3402} {"train_loss": -24.901647567749023, "global_step": 282445, "epoch": 3402} {"train_loss": -25.166034698486328, "global_step": 282446, "epoch": 3402} {"train_loss": -25.3780460357666, "global_step": 282447, "epoch": 3402} {"train_loss": -25.419195404971937, "global_step": 282448, "epoch": 3402, "val_loss": 7126161.0} {"train_loss": -25.10797119140625, "global_step": 282449, "epoch": 3403} {"train_loss": -24.682035446166992, "global_step": 282450, "epoch": 3403} {"train_loss": -24.931413650512695, "global_step": 282451, "epoch": 3403} {"train_loss": -25.505422592163086, "global_step": 282452, "epoch": 3403} {"train_loss": -25.316848754882812, "global_step": 282453, "epoch": 3403} {"train_loss": -24.841493606567383, "global_step": 282454, "epoch": 3403} {"train_loss": -25.352554321289062, "global_step": 282455, "epoch": 3403} {"train_loss": -25.195594787597656, "global_step": 282456, "epoch": 3403} {"train_loss": -25.31538963317871, "global_step": 282457, "epoch": 3403} {"train_loss": -24.900068283081055, "global_step": 282458, "epoch": 3403} {"train_loss": -24.851905822753906, "global_step": 282459, "epoch": 3403} {"train_loss": -25.206884384155273, "global_step": 282460, "epoch": 3403} {"train_loss": -25.279577255249023, "global_step": 282461, "epoch": 3403} {"train_loss": -25.31879997253418, "global_step": 282462, "epoch": 3403} {"train_loss": -24.96343421936035, "global_step": 282463, "epoch": 3403} {"train_loss": -25.47127342224121, "global_step": 282464, "epoch": 3403} {"train_loss": -25.078908920288086, "global_step": 282465, "epoch": 3403} {"train_loss": -25.22367286682129, "global_step": 282466, "epoch": 3403} {"train_loss": -25.324665069580078, "global_step": 282467, "epoch": 3403} {"train_loss": -25.455562591552734, "global_step": 282468, "epoch": 3403} {"train_loss": -25.392322540283203, "global_step": 282469, "epoch": 3403} {"train_loss": -25.59850311279297, "global_step": 282470, "epoch": 3403} {"train_loss": -25.07453727722168, "global_step": 282471, "epoch": 3403} {"train_loss": -25.486698150634766, "global_step": 282472, "epoch": 3403} {"train_loss": -25.57118797302246, "global_step": 282473, "epoch": 3403} {"train_loss": -25.750782012939453, "global_step": 282474, "epoch": 3403} {"train_loss": -25.280044555664062, "global_step": 282475, "epoch": 3403} {"train_loss": -25.58245849609375, "global_step": 282476, "epoch": 3403} {"train_loss": -25.3951473236084, "global_step": 282477, "epoch": 3403} {"train_loss": -25.384870529174805, "global_step": 282478, "epoch": 3403} {"train_loss": -25.462820053100586, "global_step": 282479, "epoch": 3403} {"train_loss": -25.546833038330078, "global_step": 282480, "epoch": 3403} {"train_loss": -25.392488479614258, "global_step": 282481, "epoch": 3403} {"train_loss": -25.169845581054688, "global_step": 282482, "epoch": 3403} {"train_loss": -25.677082061767578, "global_step": 282483, "epoch": 3403} {"train_loss": -25.208608627319336, "global_step": 282484, "epoch": 3403} {"train_loss": -25.08302879333496, "global_step": 282485, "epoch": 3403} {"train_loss": -25.318279266357422, "global_step": 282486, "epoch": 3403} {"train_loss": -25.420761108398438, "global_step": 282487, "epoch": 3403} {"train_loss": -25.568180084228516, "global_step": 282488, "epoch": 3403} {"train_loss": -25.79037857055664, "global_step": 282489, "epoch": 3403} {"train_loss": -25.38374137878418, "global_step": 282490, "epoch": 3403} {"train_loss": -25.327878952026367, "global_step": 282491, "epoch": 3403} {"train_loss": -25.432098388671875, "global_step": 282492, "epoch": 3403} {"train_loss": -25.330982208251953, "global_step": 282493, "epoch": 3403} {"train_loss": -25.48105812072754, "global_step": 282494, "epoch": 3403} {"train_loss": -25.555631637573242, "global_step": 282495, "epoch": 3403} {"train_loss": -25.31884002685547, "global_step": 282496, "epoch": 3403} {"train_loss": -25.17364501953125, "global_step": 282497, "epoch": 3403} {"train_loss": -24.727752685546875, "global_step": 282498, "epoch": 3403} {"train_loss": -25.47175407409668, "global_step": 282499, "epoch": 3403} {"train_loss": -25.459457397460938, "global_step": 282500, "epoch": 3403} {"train_loss": -25.02581787109375, "global_step": 282501, "epoch": 3403} {"train_loss": -25.126283645629883, "global_step": 282502, "epoch": 3403} {"train_loss": -24.990633010864258, "global_step": 282503, "epoch": 3403} {"train_loss": -25.774045944213867, "global_step": 282504, "epoch": 3403} {"train_loss": -25.560575485229492, "global_step": 282505, "epoch": 3403} {"train_loss": -24.99161148071289, "global_step": 282506, "epoch": 3403} {"train_loss": -25.05687141418457, "global_step": 282507, "epoch": 3403} {"train_loss": -25.184431076049805, "global_step": 282508, "epoch": 3403} {"train_loss": -25.601383209228516, "global_step": 282509, "epoch": 3403} {"train_loss": -25.521982192993164, "global_step": 282510, "epoch": 3403} {"train_loss": -25.337270736694336, "global_step": 282511, "epoch": 3403} {"train_loss": -25.293556213378906, "global_step": 282512, "epoch": 3403} {"train_loss": -25.21083641052246, "global_step": 282513, "epoch": 3403} {"train_loss": -25.23869514465332, "global_step": 282514, "epoch": 3403} {"train_loss": -25.054794311523438, "global_step": 282515, "epoch": 3403} {"train_loss": -25.059080123901367, "global_step": 282516, "epoch": 3403} {"train_loss": -25.8239803314209, "global_step": 282517, "epoch": 3403} {"train_loss": -25.442678451538086, "global_step": 282518, "epoch": 3403} {"train_loss": -25.547719955444336, "global_step": 282519, "epoch": 3403} {"train_loss": -25.35891342163086, "global_step": 282520, "epoch": 3403} {"train_loss": -25.369861602783203, "global_step": 282521, "epoch": 3403} {"train_loss": -25.44742774963379, "global_step": 282522, "epoch": 3403} {"train_loss": -24.984092712402344, "global_step": 282523, "epoch": 3403} {"train_loss": -25.6942081451416, "global_step": 282524, "epoch": 3403} {"train_loss": -25.527009963989258, "global_step": 282525, "epoch": 3403} {"train_loss": -25.458820343017578, "global_step": 282526, "epoch": 3403} {"train_loss": -25.248580932617188, "global_step": 282527, "epoch": 3403} {"train_loss": -25.516023635864258, "global_step": 282528, "epoch": 3403} {"train_loss": -25.010751724243164, "global_step": 282529, "epoch": 3403} {"train_loss": -25.371105194091797, "global_step": 282530, "epoch": 3403} {"train_loss": -25.31811707278332, "global_step": 282531, "epoch": 3403, "val_loss": 7142203.0} {"train_loss": -25.380678176879883, "global_step": 282532, "epoch": 3404} {"train_loss": -25.08456802368164, "global_step": 282533, "epoch": 3404} {"train_loss": -25.159292221069336, "global_step": 282534, "epoch": 3404} {"train_loss": -25.184011459350586, "global_step": 282535, "epoch": 3404} {"train_loss": -25.137420654296875, "global_step": 282536, "epoch": 3404} {"train_loss": -25.364910125732422, "global_step": 282537, "epoch": 3404} {"train_loss": -24.69571876525879, "global_step": 282538, "epoch": 3404} {"train_loss": -25.30904197692871, "global_step": 282539, "epoch": 3404} {"train_loss": -25.442794799804688, "global_step": 282540, "epoch": 3404} {"train_loss": -25.330188751220703, "global_step": 282541, "epoch": 3404} {"train_loss": -25.40915870666504, "global_step": 282542, "epoch": 3404} {"train_loss": -25.32611656188965, "global_step": 282543, "epoch": 3404} {"train_loss": -25.81001091003418, "global_step": 282544, "epoch": 3404} {"train_loss": -25.418493270874023, "global_step": 282545, "epoch": 3404} {"train_loss": -25.64801597595215, "global_step": 282546, "epoch": 3404} {"train_loss": -24.922941207885742, "global_step": 282547, "epoch": 3404} {"train_loss": -25.22423553466797, "global_step": 282548, "epoch": 3404} {"train_loss": -25.298009872436523, "global_step": 282549, "epoch": 3404} {"train_loss": -25.42915153503418, "global_step": 282550, "epoch": 3404} {"train_loss": -25.449384689331055, "global_step": 282551, "epoch": 3404} {"train_loss": -25.656286239624023, "global_step": 282552, "epoch": 3404} {"train_loss": -25.449716567993164, "global_step": 282553, "epoch": 3404} {"train_loss": -25.365507125854492, "global_step": 282554, "epoch": 3404} {"train_loss": -25.322250366210938, "global_step": 282555, "epoch": 3404} {"train_loss": -25.29886817932129, "global_step": 282556, "epoch": 3404} {"train_loss": -25.544492721557617, "global_step": 282557, "epoch": 3404} {"train_loss": -25.072843551635742, "global_step": 282558, "epoch": 3404} {"train_loss": -25.588132858276367, "global_step": 282559, "epoch": 3404} {"train_loss": -25.39065933227539, "global_step": 282560, "epoch": 3404} {"train_loss": -25.41826629638672, "global_step": 282561, "epoch": 3404} {"train_loss": -25.58418083190918, "global_step": 282562, "epoch": 3404} {"train_loss": -25.49901580810547, "global_step": 282563, "epoch": 3404} {"train_loss": -24.83367347717285, "global_step": 282564, "epoch": 3404} {"train_loss": -25.09014892578125, "global_step": 282565, "epoch": 3404} {"train_loss": -25.52243995666504, "global_step": 282566, "epoch": 3404} {"train_loss": -25.32069969177246, "global_step": 282567, "epoch": 3404} {"train_loss": -25.408727645874023, "global_step": 282568, "epoch": 3404} {"train_loss": -25.564733505249023, "global_step": 282569, "epoch": 3404} {"train_loss": -25.43898582458496, "global_step": 282570, "epoch": 3404} {"train_loss": -25.159528732299805, "global_step": 282571, "epoch": 3404} {"train_loss": -25.4615478515625, "global_step": 282572, "epoch": 3404} {"train_loss": -25.36739158630371, "global_step": 282573, "epoch": 3404} {"train_loss": -25.610645294189453, "global_step": 282574, "epoch": 3404} {"train_loss": -25.480106353759766, "global_step": 282575, "epoch": 3404} {"train_loss": -25.469728469848633, "global_step": 282576, "epoch": 3404} {"train_loss": -25.272789001464844, "global_step": 282577, "epoch": 3404} {"train_loss": -25.16078758239746, "global_step": 282578, "epoch": 3404} {"train_loss": -25.63885498046875, "global_step": 282579, "epoch": 3404} {"train_loss": -25.4165096282959, "global_step": 282580, "epoch": 3404} {"train_loss": -25.44668197631836, "global_step": 282581, "epoch": 3404} {"train_loss": -25.029539108276367, "global_step": 282582, "epoch": 3404} {"train_loss": -25.21181297302246, "global_step": 282583, "epoch": 3404} {"train_loss": -25.558530807495117, "global_step": 282584, "epoch": 3404} {"train_loss": -25.37763023376465, "global_step": 282585, "epoch": 3404} {"train_loss": -25.047412872314453, "global_step": 282586, "epoch": 3404} {"train_loss": -25.136693954467773, "global_step": 282587, "epoch": 3404} {"train_loss": -25.530731201171875, "global_step": 282588, "epoch": 3404} {"train_loss": -25.037967681884766, "global_step": 282589, "epoch": 3404} {"train_loss": -25.289539337158203, "global_step": 282590, "epoch": 3404} {"train_loss": -25.5120849609375, "global_step": 282591, "epoch": 3404} {"train_loss": -24.949525833129883, "global_step": 282592, "epoch": 3404} {"train_loss": -25.37627601623535, "global_step": 282593, "epoch": 3404} {"train_loss": -25.27381134033203, "global_step": 282594, "epoch": 3404} {"train_loss": -25.027936935424805, "global_step": 282595, "epoch": 3404} {"train_loss": -25.614288330078125, "global_step": 282596, "epoch": 3404} {"train_loss": -25.56283187866211, "global_step": 282597, "epoch": 3404} {"train_loss": -25.669370651245117, "global_step": 282598, "epoch": 3404} {"train_loss": -25.536020278930664, "global_step": 282599, "epoch": 3404} {"train_loss": -25.543018341064453, "global_step": 282600, "epoch": 3404} {"train_loss": -24.937564849853516, "global_step": 282601, "epoch": 3404} {"train_loss": -25.395782470703125, "global_step": 282602, "epoch": 3404} {"train_loss": -25.447315216064453, "global_step": 282603, "epoch": 3404} {"train_loss": -25.27393913269043, "global_step": 282604, "epoch": 3404} {"train_loss": -25.46588706970215, "global_step": 282605, "epoch": 3404} {"train_loss": -25.55177116394043, "global_step": 282606, "epoch": 3404} {"train_loss": -25.713041305541992, "global_step": 282607, "epoch": 3404} {"train_loss": -25.763174057006836, "global_step": 282608, "epoch": 3404} {"train_loss": -25.490833282470703, "global_step": 282609, "epoch": 3404} {"train_loss": -25.253604888916016, "global_step": 282610, "epoch": 3404} {"train_loss": -25.734546661376953, "global_step": 282611, "epoch": 3404} {"train_loss": -25.47539520263672, "global_step": 282612, "epoch": 3404} {"train_loss": -25.203571319580078, "global_step": 282613, "epoch": 3404} {"train_loss": -25.335627061774932, "global_step": 282614, "epoch": 3404, "val_loss": 7045386.0} {"train_loss": -24.168977737426758, "global_step": 282615, "epoch": 3405} {"train_loss": -24.986534118652344, "global_step": 282616, "epoch": 3405} {"train_loss": -25.07419776916504, "global_step": 282617, "epoch": 3405} {"train_loss": -24.8159122467041, "global_step": 282618, "epoch": 3405} {"train_loss": -25.21380043029785, "global_step": 282619, "epoch": 3405} {"train_loss": -24.7973575592041, "global_step": 282620, "epoch": 3405} {"train_loss": -25.071945190429688, "global_step": 282621, "epoch": 3405} {"train_loss": -24.617101669311523, "global_step": 282622, "epoch": 3405} {"train_loss": -25.493440628051758, "global_step": 282623, "epoch": 3405} {"train_loss": -25.111576080322266, "global_step": 282624, "epoch": 3405} {"train_loss": -25.439756393432617, "global_step": 282625, "epoch": 3405} {"train_loss": -25.085416793823242, "global_step": 282626, "epoch": 3405} {"train_loss": -25.453617095947266, "global_step": 282627, "epoch": 3405} {"train_loss": -25.224544525146484, "global_step": 282628, "epoch": 3405} {"train_loss": -25.023494720458984, "global_step": 282629, "epoch": 3405} {"train_loss": -24.74944496154785, "global_step": 282630, "epoch": 3405} {"train_loss": -25.307416915893555, "global_step": 282631, "epoch": 3405} {"train_loss": -24.54988670349121, "global_step": 282632, "epoch": 3405} {"train_loss": -25.168657302856445, "global_step": 282633, "epoch": 3405} {"train_loss": -24.997751235961914, "global_step": 282634, "epoch": 3405} {"train_loss": -25.171327590942383, "global_step": 282635, "epoch": 3405} {"train_loss": -25.23001480102539, "global_step": 282636, "epoch": 3405} {"train_loss": -25.282291412353516, "global_step": 282637, "epoch": 3405} {"train_loss": -25.450498580932617, "global_step": 282638, "epoch": 3405} {"train_loss": -25.53702735900879, "global_step": 282639, "epoch": 3405} {"train_loss": -25.46321678161621, "global_step": 282640, "epoch": 3405} {"train_loss": -25.370166778564453, "global_step": 282641, "epoch": 3405} {"train_loss": -25.36734390258789, "global_step": 282642, "epoch": 3405} {"train_loss": -25.164663314819336, "global_step": 282643, "epoch": 3405} {"train_loss": -25.347843170166016, "global_step": 282644, "epoch": 3405} {"train_loss": -25.199275970458984, "global_step": 282645, "epoch": 3405} {"train_loss": -25.50172233581543, "global_step": 282646, "epoch": 3405} {"train_loss": -25.080062866210938, "global_step": 282647, "epoch": 3405} {"train_loss": -25.410995483398438, "global_step": 282648, "epoch": 3405} {"train_loss": -25.69856071472168, "global_step": 282649, "epoch": 3405} {"train_loss": -25.5870418548584, "global_step": 282650, "epoch": 3405} {"train_loss": -25.336994171142578, "global_step": 282651, "epoch": 3405} {"train_loss": -25.268369674682617, "global_step": 282652, "epoch": 3405} {"train_loss": -25.450307846069336, "global_step": 282653, "epoch": 3405} {"train_loss": -25.357555389404297, "global_step": 282654, "epoch": 3405} {"train_loss": -25.344228744506836, "global_step": 282655, "epoch": 3405} {"train_loss": -25.475664138793945, "global_step": 282656, "epoch": 3405} {"train_loss": -25.318828582763672, "global_step": 282657, "epoch": 3405} {"train_loss": -25.757476806640625, "global_step": 282658, "epoch": 3405} {"train_loss": -25.645904541015625, "global_step": 282659, "epoch": 3405} {"train_loss": -25.511457443237305, "global_step": 282660, "epoch": 3405} {"train_loss": -25.250070571899414, "global_step": 282661, "epoch": 3405} {"train_loss": -25.352285385131836, "global_step": 282662, "epoch": 3405} {"train_loss": -25.377544403076172, "global_step": 282663, "epoch": 3405} {"train_loss": -25.65254783630371, "global_step": 282664, "epoch": 3405} {"train_loss": -25.418087005615234, "global_step": 282665, "epoch": 3405} {"train_loss": -25.271549224853516, "global_step": 282666, "epoch": 3405} {"train_loss": -25.782468795776367, "global_step": 282667, "epoch": 3405} {"train_loss": -25.256452560424805, "global_step": 282668, "epoch": 3405} {"train_loss": -25.74566650390625, "global_step": 282669, "epoch": 3405} {"train_loss": -25.401792526245117, "global_step": 282670, "epoch": 3405} {"train_loss": -25.327178955078125, "global_step": 282671, "epoch": 3405} {"train_loss": -25.6546688079834, "global_step": 282672, "epoch": 3405} {"train_loss": -25.44023323059082, "global_step": 282673, "epoch": 3405} {"train_loss": -25.474863052368164, "global_step": 282674, "epoch": 3405} {"train_loss": -25.636838912963867, "global_step": 282675, "epoch": 3405} {"train_loss": -25.422775268554688, "global_step": 282676, "epoch": 3405} {"train_loss": -25.60467529296875, "global_step": 282677, "epoch": 3405} {"train_loss": -25.705886840820312, "global_step": 282678, "epoch": 3405} {"train_loss": -25.433231353759766, "global_step": 282679, "epoch": 3405} {"train_loss": -25.48755645751953, "global_step": 282680, "epoch": 3405} {"train_loss": -25.47378921508789, "global_step": 282681, "epoch": 3405} {"train_loss": -25.454933166503906, "global_step": 282682, "epoch": 3405} {"train_loss": -25.642850875854492, "global_step": 282683, "epoch": 3405} {"train_loss": -25.67954444885254, "global_step": 282684, "epoch": 3405} {"train_loss": -25.346385955810547, "global_step": 282685, "epoch": 3405} {"train_loss": -25.169984817504883, "global_step": 282686, "epoch": 3405} {"train_loss": -24.49054718017578, "global_step": 282687, "epoch": 3405} {"train_loss": -23.70355224609375, "global_step": 282688, "epoch": 3405} {"train_loss": -24.94450569152832, "global_step": 282689, "epoch": 3405} {"train_loss": -24.90595054626465, "global_step": 282690, "epoch": 3405} {"train_loss": -25.093856811523438, "global_step": 282691, "epoch": 3405} {"train_loss": -24.750885009765625, "global_step": 282692, "epoch": 3405} {"train_loss": -25.047569274902344, "global_step": 282693, "epoch": 3405} {"train_loss": -25.049335479736328, "global_step": 282694, "epoch": 3405} {"train_loss": -25.49667739868164, "global_step": 282695, "epoch": 3405} {"train_loss": -25.07697868347168, "global_step": 282696, "epoch": 3405} {"train_loss": -25.2611026534115, "global_step": 282697, "epoch": 3405, "val_loss": 7056659.5} {"train_loss": -24.787212371826172, "global_step": 282698, "epoch": 3406} {"train_loss": -24.5313777923584, "global_step": 282699, "epoch": 3406} {"train_loss": -24.468502044677734, "global_step": 282700, "epoch": 3406} {"train_loss": -24.381881713867188, "global_step": 282701, "epoch": 3406} {"train_loss": -24.517133712768555, "global_step": 282702, "epoch": 3406} {"train_loss": -25.02129554748535, "global_step": 282703, "epoch": 3406} {"train_loss": -24.718271255493164, "global_step": 282704, "epoch": 3406} {"train_loss": -24.70794105529785, "global_step": 282705, "epoch": 3406} {"train_loss": -24.616865158081055, "global_step": 282706, "epoch": 3406} {"train_loss": -25.249753952026367, "global_step": 282707, "epoch": 3406} {"train_loss": -24.35887336730957, "global_step": 282708, "epoch": 3406} {"train_loss": -24.55033302307129, "global_step": 282709, "epoch": 3406} {"train_loss": -25.00516700744629, "global_step": 282710, "epoch": 3406} {"train_loss": -25.504362106323242, "global_step": 282711, "epoch": 3406} {"train_loss": -24.811803817749023, "global_step": 282712, "epoch": 3406} {"train_loss": -25.00202751159668, "global_step": 282713, "epoch": 3406} {"train_loss": -24.951047897338867, "global_step": 282714, "epoch": 3406} {"train_loss": -25.221586227416992, "global_step": 282715, "epoch": 3406} {"train_loss": -25.218067169189453, "global_step": 282716, "epoch": 3406} {"train_loss": -25.139699935913086, "global_step": 282717, "epoch": 3406} {"train_loss": -25.234128952026367, "global_step": 282718, "epoch": 3406} {"train_loss": -25.080331802368164, "global_step": 282719, "epoch": 3406} {"train_loss": -25.204248428344727, "global_step": 282720, "epoch": 3406} {"train_loss": -25.044553756713867, "global_step": 282721, "epoch": 3406} {"train_loss": -25.158405303955078, "global_step": 282722, "epoch": 3406} {"train_loss": -25.382333755493164, "global_step": 282723, "epoch": 3406} {"train_loss": -25.219812393188477, "global_step": 282724, "epoch": 3406} {"train_loss": -25.359689712524414, "global_step": 282725, "epoch": 3406} {"train_loss": -25.125228881835938, "global_step": 282726, "epoch": 3406} {"train_loss": -25.310232162475586, "global_step": 282727, "epoch": 3406} {"train_loss": -25.121826171875, "global_step": 282728, "epoch": 3406} {"train_loss": -25.644458770751953, "global_step": 282729, "epoch": 3406} {"train_loss": -25.47822380065918, "global_step": 282730, "epoch": 3406} {"train_loss": -25.11557960510254, "global_step": 282731, "epoch": 3406} {"train_loss": -25.560056686401367, "global_step": 282732, "epoch": 3406} {"train_loss": -25.15715980529785, "global_step": 282733, "epoch": 3406} {"train_loss": -25.424644470214844, "global_step": 282734, "epoch": 3406} {"train_loss": -25.45844078063965, "global_step": 282735, "epoch": 3406} {"train_loss": -25.260847091674805, "global_step": 282736, "epoch": 3406} {"train_loss": -25.42191505432129, "global_step": 282737, "epoch": 3406} {"train_loss": -25.301448822021484, "global_step": 282738, "epoch": 3406} {"train_loss": -25.90485191345215, "global_step": 282739, "epoch": 3406} {"train_loss": -25.192398071289062, "global_step": 282740, "epoch": 3406} {"train_loss": -25.515460968017578, "global_step": 282741, "epoch": 3406} {"train_loss": -25.23146629333496, "global_step": 282742, "epoch": 3406} {"train_loss": -25.502277374267578, "global_step": 282743, "epoch": 3406} {"train_loss": -25.487281799316406, "global_step": 282744, "epoch": 3406} {"train_loss": -25.13804817199707, "global_step": 282745, "epoch": 3406} {"train_loss": -25.55496597290039, "global_step": 282746, "epoch": 3406} {"train_loss": -25.629413604736328, "global_step": 282747, "epoch": 3406} {"train_loss": -25.262487411499023, "global_step": 282748, "epoch": 3406} {"train_loss": -25.897802352905273, "global_step": 282749, "epoch": 3406} {"train_loss": -25.03196907043457, "global_step": 282750, "epoch": 3406} {"train_loss": -25.484272003173828, "global_step": 282751, "epoch": 3406} {"train_loss": -25.504362106323242, "global_step": 282752, "epoch": 3406} {"train_loss": -25.386274337768555, "global_step": 282753, "epoch": 3406} {"train_loss": -25.079483032226562, "global_step": 282754, "epoch": 3406} {"train_loss": -25.30543327331543, "global_step": 282755, "epoch": 3406} {"train_loss": -25.033727645874023, "global_step": 282756, "epoch": 3406} {"train_loss": -25.0638370513916, "global_step": 282757, "epoch": 3406} {"train_loss": -25.420448303222656, "global_step": 282758, "epoch": 3406} {"train_loss": -25.220247268676758, "global_step": 282759, "epoch": 3406} {"train_loss": -25.29644203186035, "global_step": 282760, "epoch": 3406} {"train_loss": -25.420087814331055, "global_step": 282761, "epoch": 3406} {"train_loss": -25.439111709594727, "global_step": 282762, "epoch": 3406} {"train_loss": -25.58841323852539, "global_step": 282763, "epoch": 3406} {"train_loss": -25.652069091796875, "global_step": 282764, "epoch": 3406} {"train_loss": -25.254331588745117, "global_step": 282765, "epoch": 3406} {"train_loss": -25.41676139831543, "global_step": 282766, "epoch": 3406} {"train_loss": -25.5165958404541, "global_step": 282767, "epoch": 3406} {"train_loss": -25.345001220703125, "global_step": 282768, "epoch": 3406} {"train_loss": -25.9427433013916, "global_step": 282769, "epoch": 3406} {"train_loss": -25.615182876586914, "global_step": 282770, "epoch": 3406} {"train_loss": -25.584524154663086, "global_step": 282771, "epoch": 3406} {"train_loss": -25.778793334960938, "global_step": 282772, "epoch": 3406} {"train_loss": -25.84429931640625, "global_step": 282773, "epoch": 3406} {"train_loss": -25.339160919189453, "global_step": 282774, "epoch": 3406} {"train_loss": -25.51535987854004, "global_step": 282775, "epoch": 3406} {"train_loss": -25.58150291442871, "global_step": 282776, "epoch": 3406} {"train_loss": -25.768936157226562, "global_step": 282777, "epoch": 3406} {"train_loss": -25.477989196777344, "global_step": 282778, "epoch": 3406} {"train_loss": -25.52130699157715, "global_step": 282779, "epoch": 3406} {"train_loss": -25.26410645174693, "global_step": 282780, "epoch": 3406, "val_loss": 7079573.0} {"train_loss": -25.50187110900879, "global_step": 282781, "epoch": 3407} {"train_loss": -25.30510711669922, "global_step": 282782, "epoch": 3407} {"train_loss": -25.41396141052246, "global_step": 282783, "epoch": 3407} {"train_loss": -25.366031646728516, "global_step": 282784, "epoch": 3407} {"train_loss": -25.717365264892578, "global_step": 282785, "epoch": 3407} {"train_loss": -25.18379020690918, "global_step": 282786, "epoch": 3407} {"train_loss": -25.189712524414062, "global_step": 282787, "epoch": 3407} {"train_loss": -25.4732608795166, "global_step": 282788, "epoch": 3407} {"train_loss": -25.524885177612305, "global_step": 282789, "epoch": 3407} {"train_loss": -25.56866455078125, "global_step": 282790, "epoch": 3407} {"train_loss": -25.1542911529541, "global_step": 282791, "epoch": 3407} {"train_loss": -25.104074478149414, "global_step": 282792, "epoch": 3407} {"train_loss": -25.034215927124023, "global_step": 282793, "epoch": 3407} {"train_loss": -25.35249137878418, "global_step": 282794, "epoch": 3407} {"train_loss": -25.40203857421875, "global_step": 282795, "epoch": 3407} {"train_loss": -25.303556442260742, "global_step": 282796, "epoch": 3407} {"train_loss": -25.34990882873535, "global_step": 282797, "epoch": 3407} {"train_loss": -25.408111572265625, "global_step": 282798, "epoch": 3407} {"train_loss": -25.238584518432617, "global_step": 282799, "epoch": 3407} {"train_loss": -25.484893798828125, "global_step": 282800, "epoch": 3407} {"train_loss": -25.393985748291016, "global_step": 282801, "epoch": 3407} {"train_loss": -26.08034324645996, "global_step": 282802, "epoch": 3407} {"train_loss": -25.517227172851562, "global_step": 282803, "epoch": 3407} {"train_loss": -25.722227096557617, "global_step": 282804, "epoch": 3407} {"train_loss": -25.426721572875977, "global_step": 282805, "epoch": 3407} {"train_loss": -25.798858642578125, "global_step": 282806, "epoch": 3407} {"train_loss": -25.882917404174805, "global_step": 282807, "epoch": 3407} {"train_loss": -25.413114547729492, "global_step": 282808, "epoch": 3407} {"train_loss": -25.391632080078125, "global_step": 282809, "epoch": 3407} {"train_loss": -25.65283203125, "global_step": 282810, "epoch": 3407} {"train_loss": -25.728261947631836, "global_step": 282811, "epoch": 3407} {"train_loss": -25.624753952026367, "global_step": 282812, "epoch": 3407} {"train_loss": -25.572153091430664, "global_step": 282813, "epoch": 3407} {"train_loss": -25.153837203979492, "global_step": 282814, "epoch": 3407} {"train_loss": -25.196332931518555, "global_step": 282815, "epoch": 3407} {"train_loss": -25.2779541015625, "global_step": 282816, "epoch": 3407} {"train_loss": -25.2279109954834, "global_step": 282817, "epoch": 3407} {"train_loss": -25.587034225463867, "global_step": 282818, "epoch": 3407} {"train_loss": -25.529653549194336, "global_step": 282819, "epoch": 3407} {"train_loss": -25.233993530273438, "global_step": 282820, "epoch": 3407} {"train_loss": -25.425809860229492, "global_step": 282821, "epoch": 3407} {"train_loss": -25.520278930664062, "global_step": 282822, "epoch": 3407} {"train_loss": -25.396381378173828, "global_step": 282823, "epoch": 3407} {"train_loss": -25.780536651611328, "global_step": 282824, "epoch": 3407} {"train_loss": -25.37264633178711, "global_step": 282825, "epoch": 3407} {"train_loss": -25.645654678344727, "global_step": 282826, "epoch": 3407} {"train_loss": -25.76816177368164, "global_step": 282827, "epoch": 3407} {"train_loss": -25.613616943359375, "global_step": 282828, "epoch": 3407} {"train_loss": -25.655227661132812, "global_step": 282829, "epoch": 3407} {"train_loss": -25.463979721069336, "global_step": 282830, "epoch": 3407} {"train_loss": -25.54102325439453, "global_step": 282831, "epoch": 3407} {"train_loss": -25.613264083862305, "global_step": 282832, "epoch": 3407} {"train_loss": -25.107891082763672, "global_step": 282833, "epoch": 3407} {"train_loss": -25.198266983032227, "global_step": 282834, "epoch": 3407} {"train_loss": -25.434555053710938, "global_step": 282835, "epoch": 3407} {"train_loss": -25.33950424194336, "global_step": 282836, "epoch": 3407} {"train_loss": -25.14324378967285, "global_step": 282837, "epoch": 3407} {"train_loss": -25.4622859954834, "global_step": 282838, "epoch": 3407} {"train_loss": -25.41842269897461, "global_step": 282839, "epoch": 3407} {"train_loss": -25.439191818237305, "global_step": 282840, "epoch": 3407} {"train_loss": -25.308143615722656, "global_step": 282841, "epoch": 3407} {"train_loss": -25.35004234313965, "global_step": 282842, "epoch": 3407} {"train_loss": -25.368438720703125, "global_step": 282843, "epoch": 3407} {"train_loss": -25.520206451416016, "global_step": 282844, "epoch": 3407} {"train_loss": -25.3024959564209, "global_step": 282845, "epoch": 3407} {"train_loss": -25.50050163269043, "global_step": 282846, "epoch": 3407} {"train_loss": -25.733362197875977, "global_step": 282847, "epoch": 3407} {"train_loss": -25.254545211791992, "global_step": 282848, "epoch": 3407} {"train_loss": -25.839710235595703, "global_step": 282849, "epoch": 3407} {"train_loss": -24.985239028930664, "global_step": 282850, "epoch": 3407} {"train_loss": -25.639535903930664, "global_step": 282851, "epoch": 3407} {"train_loss": -25.265634536743164, "global_step": 282852, "epoch": 3407} {"train_loss": -25.64150047302246, "global_step": 282853, "epoch": 3407} {"train_loss": -25.07257843017578, "global_step": 282854, "epoch": 3407} {"train_loss": -25.32142448425293, "global_step": 282855, "epoch": 3407} {"train_loss": -25.22039031982422, "global_step": 282856, "epoch": 3407} {"train_loss": -25.588727951049805, "global_step": 282857, "epoch": 3407} {"train_loss": -25.40180015563965, "global_step": 282858, "epoch": 3407} {"train_loss": -25.405014038085938, "global_step": 282859, "epoch": 3407} {"train_loss": -26.007349014282227, "global_step": 282860, "epoch": 3407} {"train_loss": -25.19171142578125, "global_step": 282861, "epoch": 3407} {"train_loss": -25.19283103942871, "global_step": 282862, "epoch": 3407} {"train_loss": -25.425064684396766, "global_step": 282863, "epoch": 3407, "val_loss": 7081148.0} {"train_loss": -25.1569766998291, "global_step": 282864, "epoch": 3408} {"train_loss": -24.622900009155273, "global_step": 282865, "epoch": 3408} {"train_loss": -25.067142486572266, "global_step": 282866, "epoch": 3408} {"train_loss": -25.375566482543945, "global_step": 282867, "epoch": 3408} {"train_loss": -25.094213485717773, "global_step": 282868, "epoch": 3408} {"train_loss": -24.891529083251953, "global_step": 282869, "epoch": 3408} {"train_loss": -24.960575103759766, "global_step": 282870, "epoch": 3408} {"train_loss": -24.684911727905273, "global_step": 282871, "epoch": 3408} {"train_loss": -25.369937896728516, "global_step": 282872, "epoch": 3408} {"train_loss": -25.302648544311523, "global_step": 282873, "epoch": 3408} {"train_loss": -24.91977310180664, "global_step": 282874, "epoch": 3408} {"train_loss": -25.06752586364746, "global_step": 282875, "epoch": 3408} {"train_loss": -25.14192771911621, "global_step": 282876, "epoch": 3408} {"train_loss": -25.416242599487305, "global_step": 282877, "epoch": 3408} {"train_loss": -24.99745750427246, "global_step": 282878, "epoch": 3408} {"train_loss": -25.493791580200195, "global_step": 282879, "epoch": 3408} {"train_loss": -25.402158737182617, "global_step": 282880, "epoch": 3408} {"train_loss": -25.325681686401367, "global_step": 282881, "epoch": 3408} {"train_loss": -25.230792999267578, "global_step": 282882, "epoch": 3408} {"train_loss": -25.16343116760254, "global_step": 282883, "epoch": 3408} {"train_loss": -25.186382293701172, "global_step": 282884, "epoch": 3408} {"train_loss": -25.345182418823242, "global_step": 282885, "epoch": 3408} {"train_loss": -25.332916259765625, "global_step": 282886, "epoch": 3408} {"train_loss": -25.673200607299805, "global_step": 282887, "epoch": 3408} {"train_loss": -25.4387149810791, "global_step": 282888, "epoch": 3408} {"train_loss": -25.2060604095459, "global_step": 282889, "epoch": 3408} {"train_loss": -25.623584747314453, "global_step": 282890, "epoch": 3408} {"train_loss": -25.391887664794922, "global_step": 282891, "epoch": 3408} {"train_loss": -25.100555419921875, "global_step": 282892, "epoch": 3408} {"train_loss": -25.57858657836914, "global_step": 282893, "epoch": 3408} {"train_loss": -25.346601486206055, "global_step": 282894, "epoch": 3408} {"train_loss": -25.18576431274414, "global_step": 282895, "epoch": 3408} {"train_loss": -25.22652244567871, "global_step": 282896, "epoch": 3408} {"train_loss": -25.31764030456543, "global_step": 282897, "epoch": 3408} {"train_loss": -25.029924392700195, "global_step": 282898, "epoch": 3408} {"train_loss": -25.202068328857422, "global_step": 282899, "epoch": 3408} {"train_loss": -25.683582305908203, "global_step": 282900, "epoch": 3408} {"train_loss": -25.294809341430664, "global_step": 282901, "epoch": 3408} {"train_loss": -25.71563720703125, "global_step": 282902, "epoch": 3408} {"train_loss": -25.498796463012695, "global_step": 282903, "epoch": 3408} {"train_loss": -25.39350128173828, "global_step": 282904, "epoch": 3408} {"train_loss": -25.553035736083984, "global_step": 282905, "epoch": 3408} {"train_loss": -25.749088287353516, "global_step": 282906, "epoch": 3408} {"train_loss": -25.75006103515625, "global_step": 282907, "epoch": 3408} {"train_loss": -25.832275390625, "global_step": 282908, "epoch": 3408} {"train_loss": -25.745868682861328, "global_step": 282909, "epoch": 3408} {"train_loss": -25.623931884765625, "global_step": 282910, "epoch": 3408} {"train_loss": -25.560543060302734, "global_step": 282911, "epoch": 3408} {"train_loss": -25.631872177124023, "global_step": 282912, "epoch": 3408} {"train_loss": -25.446882247924805, "global_step": 282913, "epoch": 3408} {"train_loss": -25.76957130432129, "global_step": 282914, "epoch": 3408} {"train_loss": -25.712125778198242, "global_step": 282915, "epoch": 3408} {"train_loss": -25.438814163208008, "global_step": 282916, "epoch": 3408} {"train_loss": -25.680566787719727, "global_step": 282917, "epoch": 3408} {"train_loss": -25.11183738708496, "global_step": 282918, "epoch": 3408} {"train_loss": -25.412885665893555, "global_step": 282919, "epoch": 3408} {"train_loss": -24.875625610351562, "global_step": 282920, "epoch": 3408} {"train_loss": -24.78903579711914, "global_step": 282921, "epoch": 3408} {"train_loss": -24.704078674316406, "global_step": 282922, "epoch": 3408} {"train_loss": -24.674850463867188, "global_step": 282923, "epoch": 3408} {"train_loss": -25.502790451049805, "global_step": 282924, "epoch": 3408} {"train_loss": -25.395551681518555, "global_step": 282925, "epoch": 3408} {"train_loss": -25.090396881103516, "global_step": 282926, "epoch": 3408} {"train_loss": -25.38996696472168, "global_step": 282927, "epoch": 3408} {"train_loss": -25.79828453063965, "global_step": 282928, "epoch": 3408} {"train_loss": -25.49859046936035, "global_step": 282929, "epoch": 3408} {"train_loss": -25.33027458190918, "global_step": 282930, "epoch": 3408} {"train_loss": -24.850711822509766, "global_step": 282931, "epoch": 3408} {"train_loss": -25.152557373046875, "global_step": 282932, "epoch": 3408} {"train_loss": -25.307212829589844, "global_step": 282933, "epoch": 3408} {"train_loss": -25.171527862548828, "global_step": 282934, "epoch": 3408} {"train_loss": -25.624616622924805, "global_step": 282935, "epoch": 3408} {"train_loss": -25.15540313720703, "global_step": 282936, "epoch": 3408} {"train_loss": -25.307592391967773, "global_step": 282937, "epoch": 3408} {"train_loss": -25.34476089477539, "global_step": 282938, "epoch": 3408} {"train_loss": -25.255855560302734, "global_step": 282939, "epoch": 3408} {"train_loss": -25.58745765686035, "global_step": 282940, "epoch": 3408} {"train_loss": -25.356521606445312, "global_step": 282941, "epoch": 3408} {"train_loss": -25.184106826782227, "global_step": 282942, "epoch": 3408} {"train_loss": -25.574222564697266, "global_step": 282943, "epoch": 3408} {"train_loss": -25.21726417541504, "global_step": 282944, "epoch": 3408} {"train_loss": -25.474485397338867, "global_step": 282945, "epoch": 3408} {"train_loss": -25.314120396074042, "global_step": 282946, "epoch": 3408, "val_loss": 7015973.0} {"train_loss": -25.21502685546875, "global_step": 282947, "epoch": 3409} {"train_loss": -24.830839157104492, "global_step": 282948, "epoch": 3409} {"train_loss": -24.837505340576172, "global_step": 282949, "epoch": 3409} {"train_loss": -25.27373504638672, "global_step": 282950, "epoch": 3409} {"train_loss": -24.572628021240234, "global_step": 282951, "epoch": 3409} {"train_loss": -25.418630599975586, "global_step": 282952, "epoch": 3409} {"train_loss": -24.900758743286133, "global_step": 282953, "epoch": 3409} {"train_loss": -25.437429428100586, "global_step": 282954, "epoch": 3409} {"train_loss": -25.13314437866211, "global_step": 282955, "epoch": 3409} {"train_loss": -25.173608779907227, "global_step": 282956, "epoch": 3409} {"train_loss": -24.725799560546875, "global_step": 282957, "epoch": 3409} {"train_loss": -25.193832397460938, "global_step": 282958, "epoch": 3409} {"train_loss": -25.197477340698242, "global_step": 282959, "epoch": 3409} {"train_loss": -25.10348129272461, "global_step": 282960, "epoch": 3409} {"train_loss": -25.517942428588867, "global_step": 282961, "epoch": 3409} {"train_loss": -25.15717887878418, "global_step": 282962, "epoch": 3409} {"train_loss": -25.149389266967773, "global_step": 282963, "epoch": 3409} {"train_loss": -25.23048210144043, "global_step": 282964, "epoch": 3409} {"train_loss": -25.100906372070312, "global_step": 282965, "epoch": 3409} {"train_loss": -25.32961082458496, "global_step": 282966, "epoch": 3409} {"train_loss": -25.2326717376709, "global_step": 282967, "epoch": 3409} {"train_loss": -24.69513511657715, "global_step": 282968, "epoch": 3409} {"train_loss": -25.593168258666992, "global_step": 282969, "epoch": 3409} {"train_loss": -25.210290908813477, "global_step": 282970, "epoch": 3409} {"train_loss": -25.223169326782227, "global_step": 282971, "epoch": 3409} {"train_loss": -25.18501853942871, "global_step": 282972, "epoch": 3409} {"train_loss": -25.398029327392578, "global_step": 282973, "epoch": 3409} {"train_loss": -25.355581283569336, "global_step": 282974, "epoch": 3409} {"train_loss": -25.263731002807617, "global_step": 282975, "epoch": 3409} {"train_loss": -25.407743453979492, "global_step": 282976, "epoch": 3409} {"train_loss": -25.64236831665039, "global_step": 282977, "epoch": 3409} {"train_loss": -25.524227142333984, "global_step": 282978, "epoch": 3409} {"train_loss": -25.27934455871582, "global_step": 282979, "epoch": 3409} {"train_loss": -25.459035873413086, "global_step": 282980, "epoch": 3409} {"train_loss": -25.319007873535156, "global_step": 282981, "epoch": 3409} {"train_loss": -25.653675079345703, "global_step": 282982, "epoch": 3409} {"train_loss": -25.572227478027344, "global_step": 282983, "epoch": 3409} {"train_loss": -25.655057907104492, "global_step": 282984, "epoch": 3409} {"train_loss": -25.386932373046875, "global_step": 282985, "epoch": 3409} {"train_loss": -25.798559188842773, "global_step": 282986, "epoch": 3409} {"train_loss": -25.83316421508789, "global_step": 282987, "epoch": 3409} {"train_loss": -25.448604583740234, "global_step": 282988, "epoch": 3409} {"train_loss": -25.648603439331055, "global_step": 282989, "epoch": 3409} {"train_loss": -25.824268341064453, "global_step": 282990, "epoch": 3409} {"train_loss": -26.0202693939209, "global_step": 282991, "epoch": 3409} {"train_loss": -25.826801300048828, "global_step": 282992, "epoch": 3409} {"train_loss": -25.453306198120117, "global_step": 282993, "epoch": 3409} {"train_loss": -25.368606567382812, "global_step": 282994, "epoch": 3409} {"train_loss": -25.47061538696289, "global_step": 282995, "epoch": 3409} {"train_loss": -25.066265106201172, "global_step": 282996, "epoch": 3409} {"train_loss": -25.484298706054688, "global_step": 282997, "epoch": 3409} {"train_loss": -25.547348022460938, "global_step": 282998, "epoch": 3409} {"train_loss": -25.591554641723633, "global_step": 282999, "epoch": 3409} {"train_loss": -25.337745666503906, "global_step": 283000, "epoch": 3409} {"train_loss": -25.43585777282715, "global_step": 283001, "epoch": 3409} {"train_loss": -25.17890739440918, "global_step": 283002, "epoch": 3409} {"train_loss": -25.455759048461914, "global_step": 283003, "epoch": 3409} {"train_loss": -24.9537353515625, "global_step": 283004, "epoch": 3409} {"train_loss": -25.226024627685547, "global_step": 283005, "epoch": 3409} {"train_loss": -25.672775268554688, "global_step": 283006, "epoch": 3409} {"train_loss": -25.195844650268555, "global_step": 283007, "epoch": 3409} {"train_loss": -25.135395050048828, "global_step": 283008, "epoch": 3409} {"train_loss": -25.380727767944336, "global_step": 283009, "epoch": 3409} {"train_loss": -25.410511016845703, "global_step": 283010, "epoch": 3409} {"train_loss": -25.3056697845459, "global_step": 283011, "epoch": 3409} {"train_loss": -25.471088409423828, "global_step": 283012, "epoch": 3409} {"train_loss": -25.149036407470703, "global_step": 283013, "epoch": 3409} {"train_loss": -25.144121170043945, "global_step": 283014, "epoch": 3409} {"train_loss": -25.078033447265625, "global_step": 283015, "epoch": 3409} {"train_loss": -25.822345733642578, "global_step": 283016, "epoch": 3409} {"train_loss": -25.510093688964844, "global_step": 283017, "epoch": 3409} {"train_loss": -25.557397842407227, "global_step": 283018, "epoch": 3409} {"train_loss": -25.309778213500977, "global_step": 283019, "epoch": 3409} {"train_loss": -25.313522338867188, "global_step": 283020, "epoch": 3409} {"train_loss": -25.577373504638672, "global_step": 283021, "epoch": 3409} {"train_loss": -24.97994041442871, "global_step": 283022, "epoch": 3409} {"train_loss": -24.964054107666016, "global_step": 283023, "epoch": 3409} {"train_loss": -25.62770652770996, "global_step": 283024, "epoch": 3409} {"train_loss": -25.228382110595703, "global_step": 283025, "epoch": 3409} {"train_loss": -25.445280075073242, "global_step": 283026, "epoch": 3409} {"train_loss": -25.72771644592285, "global_step": 283027, "epoch": 3409} {"train_loss": -25.277179718017578, "global_step": 283028, "epoch": 3409} {"train_loss": -25.3349958902382, "global_step": 283029, "epoch": 3409, "val_loss": 7157398.0} {"train_loss": -24.365320205688477, "global_step": 283030, "epoch": 3410} {"train_loss": -24.25033950805664, "global_step": 283031, "epoch": 3410} {"train_loss": -23.818634033203125, "global_step": 283032, "epoch": 3410} {"train_loss": -24.850709915161133, "global_step": 283033, "epoch": 3410} {"train_loss": -24.095184326171875, "global_step": 283034, "epoch": 3410} {"train_loss": -24.66937828063965, "global_step": 283035, "epoch": 3410} {"train_loss": -24.197256088256836, "global_step": 283036, "epoch": 3410} {"train_loss": -23.871479034423828, "global_step": 283037, "epoch": 3410} {"train_loss": -24.705284118652344, "global_step": 283038, "epoch": 3410} {"train_loss": -23.84384536743164, "global_step": 283039, "epoch": 3410} {"train_loss": -24.830718994140625, "global_step": 283040, "epoch": 3410} {"train_loss": -24.467153549194336, "global_step": 283041, "epoch": 3410} {"train_loss": -24.591487884521484, "global_step": 283042, "epoch": 3410} {"train_loss": -24.78652000427246, "global_step": 283043, "epoch": 3410} {"train_loss": -24.795461654663086, "global_step": 283044, "epoch": 3410} {"train_loss": -24.67276382446289, "global_step": 283045, "epoch": 3410} {"train_loss": -24.714035034179688, "global_step": 283046, "epoch": 3410} {"train_loss": -24.83363914489746, "global_step": 283047, "epoch": 3410} {"train_loss": -25.144559860229492, "global_step": 283048, "epoch": 3410} {"train_loss": -25.001262664794922, "global_step": 283049, "epoch": 3410} {"train_loss": -25.21784782409668, "global_step": 283050, "epoch": 3410} {"train_loss": -24.8403377532959, "global_step": 283051, "epoch": 3410} {"train_loss": -24.974241256713867, "global_step": 283052, "epoch": 3410} {"train_loss": -24.89777183532715, "global_step": 283053, "epoch": 3410} {"train_loss": -25.28476905822754, "global_step": 283054, "epoch": 3410} {"train_loss": -25.142011642456055, "global_step": 283055, "epoch": 3410} {"train_loss": -25.278440475463867, "global_step": 283056, "epoch": 3410} {"train_loss": -25.345922470092773, "global_step": 283057, "epoch": 3410} {"train_loss": -25.339054107666016, "global_step": 283058, "epoch": 3410} {"train_loss": -24.959924697875977, "global_step": 283059, "epoch": 3410} {"train_loss": -25.493566513061523, "global_step": 283060, "epoch": 3410} {"train_loss": -25.41874885559082, "global_step": 283061, "epoch": 3410} {"train_loss": -25.3598690032959, "global_step": 283062, "epoch": 3410} {"train_loss": -25.19449234008789, "global_step": 283063, "epoch": 3410} {"train_loss": -25.280765533447266, "global_step": 283064, "epoch": 3410} {"train_loss": -25.102252960205078, "global_step": 283065, "epoch": 3410} {"train_loss": -25.506031036376953, "global_step": 283066, "epoch": 3410} {"train_loss": -25.216943740844727, "global_step": 283067, "epoch": 3410} {"train_loss": -25.44175148010254, "global_step": 283068, "epoch": 3410} {"train_loss": -25.404462814331055, "global_step": 283069, "epoch": 3410} {"train_loss": -25.41261100769043, "global_step": 283070, "epoch": 3410} {"train_loss": -25.290151596069336, "global_step": 283071, "epoch": 3410} {"train_loss": -25.729969024658203, "global_step": 283072, "epoch": 3410} {"train_loss": -25.383474349975586, "global_step": 283073, "epoch": 3410} {"train_loss": -25.2563533782959, "global_step": 283074, "epoch": 3410} {"train_loss": -25.352991104125977, "global_step": 283075, "epoch": 3410} {"train_loss": -25.142248153686523, "global_step": 283076, "epoch": 3410} {"train_loss": -25.33057975769043, "global_step": 283077, "epoch": 3410} {"train_loss": -25.25493812561035, "global_step": 283078, "epoch": 3410} {"train_loss": -25.293333053588867, "global_step": 283079, "epoch": 3410} {"train_loss": -25.573936462402344, "global_step": 283080, "epoch": 3410} {"train_loss": -25.27190589904785, "global_step": 283081, "epoch": 3410} {"train_loss": -25.431121826171875, "global_step": 283082, "epoch": 3410} {"train_loss": -25.526912689208984, "global_step": 283083, "epoch": 3410} {"train_loss": -25.754444122314453, "global_step": 283084, "epoch": 3410} {"train_loss": -25.447919845581055, "global_step": 283085, "epoch": 3410} {"train_loss": -25.757282257080078, "global_step": 283086, "epoch": 3410} {"train_loss": -25.319244384765625, "global_step": 283087, "epoch": 3410} {"train_loss": -25.660879135131836, "global_step": 283088, "epoch": 3410} {"train_loss": -25.46930503845215, "global_step": 283089, "epoch": 3410} {"train_loss": -25.60100746154785, "global_step": 283090, "epoch": 3410} {"train_loss": -25.62251091003418, "global_step": 283091, "epoch": 3410} {"train_loss": -25.55409812927246, "global_step": 283092, "epoch": 3410} {"train_loss": -25.306650161743164, "global_step": 283093, "epoch": 3410} {"train_loss": -25.319717407226562, "global_step": 283094, "epoch": 3410} {"train_loss": -25.462678909301758, "global_step": 283095, "epoch": 3410} {"train_loss": -25.697324752807617, "global_step": 283096, "epoch": 3410} {"train_loss": -25.430694580078125, "global_step": 283097, "epoch": 3410} {"train_loss": -25.666166305541992, "global_step": 283098, "epoch": 3410} {"train_loss": -25.84736442565918, "global_step": 283099, "epoch": 3410} {"train_loss": -25.624042510986328, "global_step": 283100, "epoch": 3410} {"train_loss": -25.506145477294922, "global_step": 283101, "epoch": 3410} {"train_loss": -25.572614669799805, "global_step": 283102, "epoch": 3410} {"train_loss": -25.563379287719727, "global_step": 283103, "epoch": 3410} {"train_loss": -25.59394645690918, "global_step": 283104, "epoch": 3410} {"train_loss": -25.29066276550293, "global_step": 283105, "epoch": 3410} {"train_loss": -25.34697914123535, "global_step": 283106, "epoch": 3410} {"train_loss": -25.825408935546875, "global_step": 283107, "epoch": 3410} {"train_loss": -25.271554946899414, "global_step": 283108, "epoch": 3410} {"train_loss": -25.54458236694336, "global_step": 283109, "epoch": 3410} {"train_loss": -25.272756576538086, "global_step": 283110, "epoch": 3410} {"train_loss": -25.348772048950195, "global_step": 283111, "epoch": 3410} {"train_loss": -25.176049657614833, "global_step": 283112, "epoch": 3410, "val_loss": 7105230.0} {"train_loss": -25.364042282104492, "global_step": 283113, "epoch": 3411} {"train_loss": -24.65892791748047, "global_step": 283114, "epoch": 3411} {"train_loss": -24.945417404174805, "global_step": 283115, "epoch": 3411} {"train_loss": -25.15220069885254, "global_step": 283116, "epoch": 3411} {"train_loss": -24.962528228759766, "global_step": 283117, "epoch": 3411} {"train_loss": -24.99078941345215, "global_step": 283118, "epoch": 3411} {"train_loss": -25.180755615234375, "global_step": 283119, "epoch": 3411} {"train_loss": -25.072357177734375, "global_step": 283120, "epoch": 3411} {"train_loss": -25.434873580932617, "global_step": 283121, "epoch": 3411} {"train_loss": -25.452566146850586, "global_step": 283122, "epoch": 3411} {"train_loss": -25.153738021850586, "global_step": 283123, "epoch": 3411} {"train_loss": -25.67706298828125, "global_step": 283124, "epoch": 3411} {"train_loss": -25.021472930908203, "global_step": 283125, "epoch": 3411} {"train_loss": -25.369190216064453, "global_step": 283126, "epoch": 3411} {"train_loss": -25.55708122253418, "global_step": 283127, "epoch": 3411} {"train_loss": -25.514366149902344, "global_step": 283128, "epoch": 3411} {"train_loss": -24.982213973999023, "global_step": 283129, "epoch": 3411} {"train_loss": -25.384428024291992, "global_step": 283130, "epoch": 3411} {"train_loss": -25.076749801635742, "global_step": 283131, "epoch": 3411} {"train_loss": -25.625747680664062, "global_step": 283132, "epoch": 3411} {"train_loss": -25.426477432250977, "global_step": 283133, "epoch": 3411} {"train_loss": -25.27798080444336, "global_step": 283134, "epoch": 3411} {"train_loss": -25.442068099975586, "global_step": 283135, "epoch": 3411} {"train_loss": -25.66343116760254, "global_step": 283136, "epoch": 3411} {"train_loss": -25.21295738220215, "global_step": 283137, "epoch": 3411} {"train_loss": -25.595666885375977, "global_step": 283138, "epoch": 3411} {"train_loss": -25.76626968383789, "global_step": 283139, "epoch": 3411} {"train_loss": -25.185361862182617, "global_step": 283140, "epoch": 3411} {"train_loss": -25.116865158081055, "global_step": 283141, "epoch": 3411} {"train_loss": -25.2159481048584, "global_step": 283142, "epoch": 3411} {"train_loss": -25.1506290435791, "global_step": 283143, "epoch": 3411} {"train_loss": -25.524534225463867, "global_step": 283144, "epoch": 3411} {"train_loss": -25.389408111572266, "global_step": 283145, "epoch": 3411} {"train_loss": -25.261154174804688, "global_step": 283146, "epoch": 3411} {"train_loss": -25.357330322265625, "global_step": 283147, "epoch": 3411} {"train_loss": -25.301504135131836, "global_step": 283148, "epoch": 3411} {"train_loss": -25.51952362060547, "global_step": 283149, "epoch": 3411} {"train_loss": -25.7523250579834, "global_step": 283150, "epoch": 3411} {"train_loss": -25.549274444580078, "global_step": 283151, "epoch": 3411} {"train_loss": -25.23699951171875, "global_step": 283152, "epoch": 3411} {"train_loss": -25.158231735229492, "global_step": 283153, "epoch": 3411} {"train_loss": -25.549480438232422, "global_step": 283154, "epoch": 3411} {"train_loss": -25.22746467590332, "global_step": 283155, "epoch": 3411} {"train_loss": -25.27565574645996, "global_step": 283156, "epoch": 3411} {"train_loss": -25.617597579956055, "global_step": 283157, "epoch": 3411} {"train_loss": -25.44219207763672, "global_step": 283158, "epoch": 3411} {"train_loss": -25.22565460205078, "global_step": 283159, "epoch": 3411} {"train_loss": -25.728445053100586, "global_step": 283160, "epoch": 3411} {"train_loss": -25.744653701782227, "global_step": 283161, "epoch": 3411} {"train_loss": -25.30317497253418, "global_step": 283162, "epoch": 3411} {"train_loss": -25.450407028198242, "global_step": 283163, "epoch": 3411} {"train_loss": -25.437665939331055, "global_step": 283164, "epoch": 3411} {"train_loss": -25.571664810180664, "global_step": 283165, "epoch": 3411} {"train_loss": -25.57999038696289, "global_step": 283166, "epoch": 3411} {"train_loss": -25.687335968017578, "global_step": 283167, "epoch": 3411} {"train_loss": -25.753137588500977, "global_step": 283168, "epoch": 3411} {"train_loss": -25.47151756286621, "global_step": 283169, "epoch": 3411} {"train_loss": -25.411090850830078, "global_step": 283170, "epoch": 3411} {"train_loss": -25.523685455322266, "global_step": 283171, "epoch": 3411} {"train_loss": -25.32912254333496, "global_step": 283172, "epoch": 3411} {"train_loss": -25.174917221069336, "global_step": 283173, "epoch": 3411} {"train_loss": -25.683441162109375, "global_step": 283174, "epoch": 3411} {"train_loss": -25.463272094726562, "global_step": 283175, "epoch": 3411} {"train_loss": -25.80463981628418, "global_step": 283176, "epoch": 3411} {"train_loss": -25.59522819519043, "global_step": 283177, "epoch": 3411} {"train_loss": -25.286258697509766, "global_step": 283178, "epoch": 3411} {"train_loss": -25.2382869720459, "global_step": 283179, "epoch": 3411} {"train_loss": -25.150394439697266, "global_step": 283180, "epoch": 3411} {"train_loss": -25.752735137939453, "global_step": 283181, "epoch": 3411} {"train_loss": -25.63010597229004, "global_step": 283182, "epoch": 3411} {"train_loss": -25.341018676757812, "global_step": 283183, "epoch": 3411} {"train_loss": -25.47809410095215, "global_step": 283184, "epoch": 3411} {"train_loss": -25.006881713867188, "global_step": 283185, "epoch": 3411} {"train_loss": -25.391876220703125, "global_step": 283186, "epoch": 3411} {"train_loss": -25.616870880126953, "global_step": 283187, "epoch": 3411} {"train_loss": -25.5117244720459, "global_step": 283188, "epoch": 3411} {"train_loss": -25.406890869140625, "global_step": 283189, "epoch": 3411} {"train_loss": -25.325836181640625, "global_step": 283190, "epoch": 3411} {"train_loss": -25.69952392578125, "global_step": 283191, "epoch": 3411} {"train_loss": -25.748498916625977, "global_step": 283192, "epoch": 3411} {"train_loss": -25.38241958618164, "global_step": 283193, "epoch": 3411} {"train_loss": -25.680200576782227, "global_step": 283194, "epoch": 3411} {"train_loss": -25.402026302843208, "global_step": 283195, "epoch": 3411, "val_loss": 7109232.0} {"train_loss": -24.633832931518555, "global_step": 283196, "epoch": 3412} {"train_loss": -25.244531631469727, "global_step": 283197, "epoch": 3412} {"train_loss": -25.280752182006836, "global_step": 283198, "epoch": 3412} {"train_loss": -25.03297996520996, "global_step": 283199, "epoch": 3412} {"train_loss": -25.295089721679688, "global_step": 283200, "epoch": 3412} {"train_loss": -24.77678871154785, "global_step": 283201, "epoch": 3412} {"train_loss": -25.057445526123047, "global_step": 283202, "epoch": 3412} {"train_loss": -25.041181564331055, "global_step": 283203, "epoch": 3412} {"train_loss": -25.046951293945312, "global_step": 283204, "epoch": 3412} {"train_loss": -25.351608276367188, "global_step": 283205, "epoch": 3412} {"train_loss": -25.065038681030273, "global_step": 283206, "epoch": 3412} {"train_loss": -24.64580535888672, "global_step": 283207, "epoch": 3412} {"train_loss": -25.19744110107422, "global_step": 283208, "epoch": 3412} {"train_loss": -25.242691040039062, "global_step": 283209, "epoch": 3412} {"train_loss": -25.43776512145996, "global_step": 283210, "epoch": 3412} {"train_loss": -25.096363067626953, "global_step": 283211, "epoch": 3412} {"train_loss": -25.39908218383789, "global_step": 283212, "epoch": 3412} {"train_loss": -25.143064498901367, "global_step": 283213, "epoch": 3412} {"train_loss": -25.3538875579834, "global_step": 283214, "epoch": 3412} {"train_loss": -25.26633644104004, "global_step": 283215, "epoch": 3412} {"train_loss": -25.19736099243164, "global_step": 283216, "epoch": 3412} {"train_loss": -25.207937240600586, "global_step": 283217, "epoch": 3412} {"train_loss": -25.30804443359375, "global_step": 283218, "epoch": 3412} {"train_loss": -25.373315811157227, "global_step": 283219, "epoch": 3412} {"train_loss": -25.5922908782959, "global_step": 283220, "epoch": 3412} {"train_loss": -25.1580810546875, "global_step": 283221, "epoch": 3412} {"train_loss": -25.512706756591797, "global_step": 283222, "epoch": 3412} {"train_loss": -25.7139949798584, "global_step": 283223, "epoch": 3412} {"train_loss": -25.344093322753906, "global_step": 283224, "epoch": 3412} {"train_loss": -25.675586700439453, "global_step": 283225, "epoch": 3412} {"train_loss": -25.39011573791504, "global_step": 283226, "epoch": 3412} {"train_loss": -25.46021842956543, "global_step": 283227, "epoch": 3412} {"train_loss": -25.716754913330078, "global_step": 283228, "epoch": 3412} {"train_loss": -25.38497543334961, "global_step": 283229, "epoch": 3412} {"train_loss": -25.37647819519043, "global_step": 283230, "epoch": 3412} {"train_loss": -25.151601791381836, "global_step": 283231, "epoch": 3412} {"train_loss": -24.99823570251465, "global_step": 283232, "epoch": 3412} {"train_loss": -25.435565948486328, "global_step": 283233, "epoch": 3412} {"train_loss": -25.309673309326172, "global_step": 283234, "epoch": 3412} {"train_loss": -25.308115005493164, "global_step": 283235, "epoch": 3412} {"train_loss": -25.480693817138672, "global_step": 283236, "epoch": 3412} {"train_loss": -25.386594772338867, "global_step": 283237, "epoch": 3412} {"train_loss": -25.759973526000977, "global_step": 283238, "epoch": 3412} {"train_loss": -25.5159969329834, "global_step": 283239, "epoch": 3412} {"train_loss": -25.37860679626465, "global_step": 283240, "epoch": 3412} {"train_loss": -25.585464477539062, "global_step": 283241, "epoch": 3412} {"train_loss": -25.61040687561035, "global_step": 283242, "epoch": 3412} {"train_loss": -25.39777183532715, "global_step": 283243, "epoch": 3412} {"train_loss": -25.345396041870117, "global_step": 283244, "epoch": 3412} {"train_loss": -25.571552276611328, "global_step": 283245, "epoch": 3412} {"train_loss": -25.622278213500977, "global_step": 283246, "epoch": 3412} {"train_loss": -25.412425994873047, "global_step": 283247, "epoch": 3412} {"train_loss": -25.210006713867188, "global_step": 283248, "epoch": 3412} {"train_loss": -25.216527938842773, "global_step": 283249, "epoch": 3412} {"train_loss": -25.482145309448242, "global_step": 283250, "epoch": 3412} {"train_loss": -25.536785125732422, "global_step": 283251, "epoch": 3412} {"train_loss": -25.585729598999023, "global_step": 283252, "epoch": 3412} {"train_loss": -25.514833450317383, "global_step": 283253, "epoch": 3412} {"train_loss": -25.616241455078125, "global_step": 283254, "epoch": 3412} {"train_loss": -25.797409057617188, "global_step": 283255, "epoch": 3412} {"train_loss": -25.603851318359375, "global_step": 283256, "epoch": 3412} {"train_loss": -25.732364654541016, "global_step": 283257, "epoch": 3412} {"train_loss": -25.284040451049805, "global_step": 283258, "epoch": 3412} {"train_loss": -25.036184310913086, "global_step": 283259, "epoch": 3412} {"train_loss": -25.490957260131836, "global_step": 283260, "epoch": 3412} {"train_loss": -25.54018211364746, "global_step": 283261, "epoch": 3412} {"train_loss": -25.11284828186035, "global_step": 283262, "epoch": 3412} {"train_loss": -25.515182495117188, "global_step": 283263, "epoch": 3412} {"train_loss": -25.0649471282959, "global_step": 283264, "epoch": 3412} {"train_loss": -25.327762603759766, "global_step": 283265, "epoch": 3412} {"train_loss": -25.75132179260254, "global_step": 283266, "epoch": 3412} {"train_loss": -25.129846572875977, "global_step": 283267, "epoch": 3412} {"train_loss": -25.362133026123047, "global_step": 283268, "epoch": 3412} {"train_loss": -25.283166885375977, "global_step": 283269, "epoch": 3412} {"train_loss": -25.642377853393555, "global_step": 283270, "epoch": 3412} {"train_loss": -25.15652847290039, "global_step": 283271, "epoch": 3412} {"train_loss": -25.434843063354492, "global_step": 283272, "epoch": 3412} {"train_loss": -25.31836700439453, "global_step": 283273, "epoch": 3412} {"train_loss": -25.869232177734375, "global_step": 283274, "epoch": 3412} {"train_loss": -25.784086227416992, "global_step": 283275, "epoch": 3412} {"train_loss": -25.568260192871094, "global_step": 283276, "epoch": 3412} {"train_loss": -25.704517364501953, "global_step": 283277, "epoch": 3412} {"train_loss": -25.369021679981646, "global_step": 283278, "epoch": 3412, "val_loss": 7150006.0} {"train_loss": -24.49823760986328, "global_step": 283279, "epoch": 3413} {"train_loss": -23.718730926513672, "global_step": 283280, "epoch": 3413} {"train_loss": -24.45370101928711, "global_step": 283281, "epoch": 3413} {"train_loss": -25.201108932495117, "global_step": 283282, "epoch": 3413} {"train_loss": -24.61527442932129, "global_step": 283283, "epoch": 3413} {"train_loss": -24.89289665222168, "global_step": 283284, "epoch": 3413} {"train_loss": -24.55156707763672, "global_step": 283285, "epoch": 3413} {"train_loss": -24.80214500427246, "global_step": 283286, "epoch": 3413} {"train_loss": -24.743667602539062, "global_step": 283287, "epoch": 3413} {"train_loss": -24.3116397857666, "global_step": 283288, "epoch": 3413} {"train_loss": -24.76420783996582, "global_step": 283289, "epoch": 3413} {"train_loss": -25.42706298828125, "global_step": 283290, "epoch": 3413} {"train_loss": -25.13772201538086, "global_step": 283291, "epoch": 3413} {"train_loss": -24.991857528686523, "global_step": 283292, "epoch": 3413} {"train_loss": -24.84861183166504, "global_step": 283293, "epoch": 3413} {"train_loss": -25.292570114135742, "global_step": 283294, "epoch": 3413} {"train_loss": -24.7866268157959, "global_step": 283295, "epoch": 3413} {"train_loss": -25.04648208618164, "global_step": 283296, "epoch": 3413} {"train_loss": -25.321441650390625, "global_step": 283297, "epoch": 3413} {"train_loss": -25.030179977416992, "global_step": 283298, "epoch": 3413} {"train_loss": -24.86159324645996, "global_step": 283299, "epoch": 3413} {"train_loss": -25.285167694091797, "global_step": 283300, "epoch": 3413} {"train_loss": -24.913740158081055, "global_step": 283301, "epoch": 3413} {"train_loss": -24.90651512145996, "global_step": 283302, "epoch": 3413} {"train_loss": -25.301227569580078, "global_step": 283303, "epoch": 3413} {"train_loss": -25.27402687072754, "global_step": 283304, "epoch": 3413} {"train_loss": -25.333030700683594, "global_step": 283305, "epoch": 3413} {"train_loss": -25.164228439331055, "global_step": 283306, "epoch": 3413} {"train_loss": -25.302480697631836, "global_step": 283307, "epoch": 3413} {"train_loss": -25.56489372253418, "global_step": 283308, "epoch": 3413} {"train_loss": -25.760162353515625, "global_step": 283309, "epoch": 3413} {"train_loss": -25.247398376464844, "global_step": 283310, "epoch": 3413} {"train_loss": -25.17640495300293, "global_step": 283311, "epoch": 3413} {"train_loss": -25.445119857788086, "global_step": 283312, "epoch": 3413} {"train_loss": -25.991107940673828, "global_step": 283313, "epoch": 3413} {"train_loss": -25.195287704467773, "global_step": 283314, "epoch": 3413} {"train_loss": -25.829252243041992, "global_step": 283315, "epoch": 3413} {"train_loss": -25.51784324645996, "global_step": 283316, "epoch": 3413} {"train_loss": -25.180206298828125, "global_step": 283317, "epoch": 3413} {"train_loss": -25.418701171875, "global_step": 283318, "epoch": 3413} {"train_loss": -25.68994140625, "global_step": 283319, "epoch": 3413} {"train_loss": -25.831668853759766, "global_step": 283320, "epoch": 3413} {"train_loss": -25.616235733032227, "global_step": 283321, "epoch": 3413} {"train_loss": -25.62396240234375, "global_step": 283322, "epoch": 3413} {"train_loss": -25.220510482788086, "global_step": 283323, "epoch": 3413} {"train_loss": -25.65201759338379, "global_step": 283324, "epoch": 3413} {"train_loss": -25.294876098632812, "global_step": 283325, "epoch": 3413} {"train_loss": -25.284332275390625, "global_step": 283326, "epoch": 3413} {"train_loss": -25.16547203063965, "global_step": 283327, "epoch": 3413} {"train_loss": -25.30472183227539, "global_step": 283328, "epoch": 3413} {"train_loss": -25.28089714050293, "global_step": 283329, "epoch": 3413} {"train_loss": -25.597293853759766, "global_step": 283330, "epoch": 3413} {"train_loss": -25.203794479370117, "global_step": 283331, "epoch": 3413} {"train_loss": -25.4564266204834, "global_step": 283332, "epoch": 3413} {"train_loss": -25.631732940673828, "global_step": 283333, "epoch": 3413} {"train_loss": -25.267370223999023, "global_step": 283334, "epoch": 3413} {"train_loss": -25.987384796142578, "global_step": 283335, "epoch": 3413} {"train_loss": -25.23095703125, "global_step": 283336, "epoch": 3413} {"train_loss": -25.280548095703125, "global_step": 283337, "epoch": 3413} {"train_loss": -25.84779930114746, "global_step": 283338, "epoch": 3413} {"train_loss": -25.05304527282715, "global_step": 283339, "epoch": 3413} {"train_loss": -25.16383934020996, "global_step": 283340, "epoch": 3413} {"train_loss": -25.514297485351562, "global_step": 283341, "epoch": 3413} {"train_loss": -25.443340301513672, "global_step": 283342, "epoch": 3413} {"train_loss": -25.208023071289062, "global_step": 283343, "epoch": 3413} {"train_loss": -25.986433029174805, "global_step": 283344, "epoch": 3413} {"train_loss": -25.370420455932617, "global_step": 283345, "epoch": 3413} {"train_loss": -25.519405364990234, "global_step": 283346, "epoch": 3413} {"train_loss": -24.86507225036621, "global_step": 283347, "epoch": 3413} {"train_loss": -25.387937545776367, "global_step": 283348, "epoch": 3413} {"train_loss": -25.803466796875, "global_step": 283349, "epoch": 3413} {"train_loss": -24.90675163269043, "global_step": 283350, "epoch": 3413} {"train_loss": -25.601898193359375, "global_step": 283351, "epoch": 3413} {"train_loss": -25.443151473999023, "global_step": 283352, "epoch": 3413} {"train_loss": -25.47153663635254, "global_step": 283353, "epoch": 3413} {"train_loss": -25.872949600219727, "global_step": 283354, "epoch": 3413} {"train_loss": -25.466760635375977, "global_step": 283355, "epoch": 3413} {"train_loss": -25.90797233581543, "global_step": 283356, "epoch": 3413} {"train_loss": -25.11408233642578, "global_step": 283357, "epoch": 3413} {"train_loss": -25.444080352783203, "global_step": 283358, "epoch": 3413} {"train_loss": -24.981403350830078, "global_step": 283359, "epoch": 3413} {"train_loss": -25.348752975463867, "global_step": 283360, "epoch": 3413} {"train_loss": -25.2470703125, "global_step": 283361, "epoch": 3413, "val_loss": 7201202.0} {"train_loss": -24.471820831298828, "global_step": 283362, "epoch": 3414} {"train_loss": -24.545740127563477, "global_step": 283363, "epoch": 3414} {"train_loss": -25.046096801757812, "global_step": 283364, "epoch": 3414} {"train_loss": -25.814807891845703, "global_step": 283365, "epoch": 3414} {"train_loss": -25.117666244506836, "global_step": 283366, "epoch": 3414} {"train_loss": -25.16644859313965, "global_step": 283367, "epoch": 3414} {"train_loss": -25.327842712402344, "global_step": 283368, "epoch": 3414} {"train_loss": -25.092802047729492, "global_step": 283369, "epoch": 3414} {"train_loss": -25.528356552124023, "global_step": 283370, "epoch": 3414} {"train_loss": -25.33774185180664, "global_step": 283371, "epoch": 3414} {"train_loss": -25.706897735595703, "global_step": 283372, "epoch": 3414} {"train_loss": -25.204023361206055, "global_step": 283373, "epoch": 3414} {"train_loss": -25.315256118774414, "global_step": 283374, "epoch": 3414} {"train_loss": -25.427526473999023, "global_step": 283375, "epoch": 3414} {"train_loss": -25.634506225585938, "global_step": 283376, "epoch": 3414} {"train_loss": -25.250438690185547, "global_step": 283377, "epoch": 3414} {"train_loss": -25.56593132019043, "global_step": 283378, "epoch": 3414} {"train_loss": -25.118553161621094, "global_step": 283379, "epoch": 3414} {"train_loss": -25.471866607666016, "global_step": 283380, "epoch": 3414} {"train_loss": -25.531002044677734, "global_step": 283381, "epoch": 3414} {"train_loss": -25.71306800842285, "global_step": 283382, "epoch": 3414} {"train_loss": -25.305347442626953, "global_step": 283383, "epoch": 3414} {"train_loss": -25.51529312133789, "global_step": 283384, "epoch": 3414} {"train_loss": -25.52606773376465, "global_step": 283385, "epoch": 3414} {"train_loss": -24.847097396850586, "global_step": 283386, "epoch": 3414} {"train_loss": -25.322561264038086, "global_step": 283387, "epoch": 3414} {"train_loss": -25.172595977783203, "global_step": 283388, "epoch": 3414} {"train_loss": -25.605772018432617, "global_step": 283389, "epoch": 3414} {"train_loss": -25.448993682861328, "global_step": 283390, "epoch": 3414} {"train_loss": -25.78522300720215, "global_step": 283391, "epoch": 3414} {"train_loss": -25.58918571472168, "global_step": 283392, "epoch": 3414} {"train_loss": -25.6225643157959, "global_step": 283393, "epoch": 3414} {"train_loss": -25.4708309173584, "global_step": 283394, "epoch": 3414} {"train_loss": -25.22503089904785, "global_step": 283395, "epoch": 3414} {"train_loss": -25.50649642944336, "global_step": 283396, "epoch": 3414} {"train_loss": -25.32888412475586, "global_step": 283397, "epoch": 3414} {"train_loss": -25.139989852905273, "global_step": 283398, "epoch": 3414} {"train_loss": -25.43015480041504, "global_step": 283399, "epoch": 3414} {"train_loss": -25.334579467773438, "global_step": 283400, "epoch": 3414} {"train_loss": -25.418933868408203, "global_step": 283401, "epoch": 3414} {"train_loss": -25.501188278198242, "global_step": 283402, "epoch": 3414} {"train_loss": -25.407732009887695, "global_step": 283403, "epoch": 3414} {"train_loss": -25.468307495117188, "global_step": 283404, "epoch": 3414} {"train_loss": -25.01750946044922, "global_step": 283405, "epoch": 3414} {"train_loss": -25.5958309173584, "global_step": 283406, "epoch": 3414} {"train_loss": -25.420841217041016, "global_step": 283407, "epoch": 3414} {"train_loss": -25.647912979125977, "global_step": 283408, "epoch": 3414} {"train_loss": -25.364871978759766, "global_step": 283409, "epoch": 3414} {"train_loss": -25.28590965270996, "global_step": 283410, "epoch": 3414} {"train_loss": -25.61971092224121, "global_step": 283411, "epoch": 3414} {"train_loss": -25.662744522094727, "global_step": 283412, "epoch": 3414} {"train_loss": -25.4964656829834, "global_step": 283413, "epoch": 3414} {"train_loss": -25.83949851989746, "global_step": 283414, "epoch": 3414} {"train_loss": -25.342132568359375, "global_step": 283415, "epoch": 3414} {"train_loss": -25.510799407958984, "global_step": 283416, "epoch": 3414} {"train_loss": -25.684650421142578, "global_step": 283417, "epoch": 3414} {"train_loss": -25.3332576751709, "global_step": 283418, "epoch": 3414} {"train_loss": -25.712671279907227, "global_step": 283419, "epoch": 3414} {"train_loss": -25.210826873779297, "global_step": 283420, "epoch": 3414} {"train_loss": -25.451696395874023, "global_step": 283421, "epoch": 3414} {"train_loss": -25.607519149780273, "global_step": 283422, "epoch": 3414} {"train_loss": -25.550790786743164, "global_step": 283423, "epoch": 3414} {"train_loss": -25.297475814819336, "global_step": 283424, "epoch": 3414} {"train_loss": -25.614856719970703, "global_step": 283425, "epoch": 3414} {"train_loss": -25.626358032226562, "global_step": 283426, "epoch": 3414} {"train_loss": -26.038904190063477, "global_step": 283427, "epoch": 3414} {"train_loss": -25.34535789489746, "global_step": 283428, "epoch": 3414} {"train_loss": -25.37674331665039, "global_step": 283429, "epoch": 3414} {"train_loss": -25.56061363220215, "global_step": 283430, "epoch": 3414} {"train_loss": -25.75933265686035, "global_step": 283431, "epoch": 3414} {"train_loss": -25.16377067565918, "global_step": 283432, "epoch": 3414} {"train_loss": -24.7069034576416, "global_step": 283433, "epoch": 3414} {"train_loss": -23.9146728515625, "global_step": 283434, "epoch": 3414} {"train_loss": -23.888059616088867, "global_step": 283435, "epoch": 3414} {"train_loss": -25.323976516723633, "global_step": 283436, "epoch": 3414} {"train_loss": -24.657052993774414, "global_step": 283437, "epoch": 3414} {"train_loss": -24.573518753051758, "global_step": 283438, "epoch": 3414} {"train_loss": -24.375015258789062, "global_step": 283439, "epoch": 3414} {"train_loss": -24.960708618164062, "global_step": 283440, "epoch": 3414} {"train_loss": -24.63448715209961, "global_step": 283441, "epoch": 3414} {"train_loss": -24.55946922302246, "global_step": 283442, "epoch": 3414} {"train_loss": -24.82561683654785, "global_step": 283443, "epoch": 3414} {"train_loss": -25.299268469753034, "global_step": 283444, "epoch": 3414, "val_loss": 7239912.0} {"train_loss": -24.915023803710938, "global_step": 283445, "epoch": 3415} {"train_loss": -24.183561325073242, "global_step": 283446, "epoch": 3415} {"train_loss": -24.288633346557617, "global_step": 283447, "epoch": 3415} {"train_loss": -24.361799240112305, "global_step": 283448, "epoch": 3415} {"train_loss": -24.45517921447754, "global_step": 283449, "epoch": 3415} {"train_loss": -24.52350616455078, "global_step": 283450, "epoch": 3415} {"train_loss": -24.55144691467285, "global_step": 283451, "epoch": 3415} {"train_loss": -24.5660343170166, "global_step": 283452, "epoch": 3415} {"train_loss": -24.533308029174805, "global_step": 283453, "epoch": 3415} {"train_loss": -25.257801055908203, "global_step": 283454, "epoch": 3415} {"train_loss": -24.573989868164062, "global_step": 283455, "epoch": 3415} {"train_loss": -24.805395126342773, "global_step": 283456, "epoch": 3415} {"train_loss": -24.231767654418945, "global_step": 283457, "epoch": 3415} {"train_loss": -24.654987335205078, "global_step": 283458, "epoch": 3415} {"train_loss": -24.878538131713867, "global_step": 283459, "epoch": 3415} {"train_loss": -24.987462997436523, "global_step": 283460, "epoch": 3415} {"train_loss": -24.75436019897461, "global_step": 283461, "epoch": 3415} {"train_loss": -24.668521881103516, "global_step": 283462, "epoch": 3415} {"train_loss": -25.120914459228516, "global_step": 283463, "epoch": 3415} {"train_loss": -25.188879013061523, "global_step": 283464, "epoch": 3415} {"train_loss": -25.53078842163086, "global_step": 283465, "epoch": 3415} {"train_loss": -25.30210304260254, "global_step": 283466, "epoch": 3415} {"train_loss": -25.128122329711914, "global_step": 283467, "epoch": 3415} {"train_loss": -25.501794815063477, "global_step": 283468, "epoch": 3415} {"train_loss": -25.371728897094727, "global_step": 283469, "epoch": 3415} {"train_loss": -25.406553268432617, "global_step": 283470, "epoch": 3415} {"train_loss": -25.319580078125, "global_step": 283471, "epoch": 3415} {"train_loss": -25.47408103942871, "global_step": 283472, "epoch": 3415} {"train_loss": -25.472076416015625, "global_step": 283473, "epoch": 3415} {"train_loss": -25.09419059753418, "global_step": 283474, "epoch": 3415} {"train_loss": -25.215778350830078, "global_step": 283475, "epoch": 3415} {"train_loss": -25.81500816345215, "global_step": 283476, "epoch": 3415} {"train_loss": -25.318044662475586, "global_step": 283477, "epoch": 3415} {"train_loss": -25.610076904296875, "global_step": 283478, "epoch": 3415} {"train_loss": -25.341827392578125, "global_step": 283479, "epoch": 3415} {"train_loss": -25.76266860961914, "global_step": 283480, "epoch": 3415} {"train_loss": -25.349628448486328, "global_step": 283481, "epoch": 3415} {"train_loss": -25.837446212768555, "global_step": 283482, "epoch": 3415} {"train_loss": -25.574392318725586, "global_step": 283483, "epoch": 3415} {"train_loss": -26.22056007385254, "global_step": 283484, "epoch": 3415} {"train_loss": -25.590381622314453, "global_step": 283485, "epoch": 3415} {"train_loss": -25.557083129882812, "global_step": 283486, "epoch": 3415} {"train_loss": -25.425495147705078, "global_step": 283487, "epoch": 3415} {"train_loss": -25.342411041259766, "global_step": 283488, "epoch": 3415} {"train_loss": -25.428068161010742, "global_step": 283489, "epoch": 3415} {"train_loss": -25.297697067260742, "global_step": 283490, "epoch": 3415} {"train_loss": -25.463897705078125, "global_step": 283491, "epoch": 3415} {"train_loss": -25.645404815673828, "global_step": 283492, "epoch": 3415} {"train_loss": -25.446001052856445, "global_step": 283493, "epoch": 3415} {"train_loss": -25.263349533081055, "global_step": 283494, "epoch": 3415} {"train_loss": -25.427724838256836, "global_step": 283495, "epoch": 3415} {"train_loss": -25.61777114868164, "global_step": 283496, "epoch": 3415} {"train_loss": -25.80695152282715, "global_step": 283497, "epoch": 3415} {"train_loss": -25.56941032409668, "global_step": 283498, "epoch": 3415} {"train_loss": -25.6908016204834, "global_step": 283499, "epoch": 3415} {"train_loss": -25.651315689086914, "global_step": 283500, "epoch": 3415} {"train_loss": -25.76544761657715, "global_step": 283501, "epoch": 3415} {"train_loss": -25.763776779174805, "global_step": 283502, "epoch": 3415} {"train_loss": -25.8748779296875, "global_step": 283503, "epoch": 3415} {"train_loss": -25.613889694213867, "global_step": 283504, "epoch": 3415} {"train_loss": -25.5255184173584, "global_step": 283505, "epoch": 3415} {"train_loss": -25.721607208251953, "global_step": 283506, "epoch": 3415} {"train_loss": -25.479631423950195, "global_step": 283507, "epoch": 3415} {"train_loss": -25.65212059020996, "global_step": 283508, "epoch": 3415} {"train_loss": -25.414873123168945, "global_step": 283509, "epoch": 3415} {"train_loss": -25.31656837463379, "global_step": 283510, "epoch": 3415} {"train_loss": -25.250228881835938, "global_step": 283511, "epoch": 3415} {"train_loss": -25.16135597229004, "global_step": 283512, "epoch": 3415} {"train_loss": -25.532804489135742, "global_step": 283513, "epoch": 3415} {"train_loss": -25.53396987915039, "global_step": 283514, "epoch": 3415} {"train_loss": -25.43792724609375, "global_step": 283515, "epoch": 3415} {"train_loss": -25.599512100219727, "global_step": 283516, "epoch": 3415} {"train_loss": -25.721471786499023, "global_step": 283517, "epoch": 3415} {"train_loss": -25.581607818603516, "global_step": 283518, "epoch": 3415} {"train_loss": -25.737903594970703, "global_step": 283519, "epoch": 3415} {"train_loss": -25.6651554107666, "global_step": 283520, "epoch": 3415} {"train_loss": -25.7445125579834, "global_step": 283521, "epoch": 3415} {"train_loss": -25.26870346069336, "global_step": 283522, "epoch": 3415} {"train_loss": -25.464797973632812, "global_step": 283523, "epoch": 3415} {"train_loss": -25.73237419128418, "global_step": 283524, "epoch": 3415} {"train_loss": -25.57343101501465, "global_step": 283525, "epoch": 3415} {"train_loss": -25.259586334228516, "global_step": 283526, "epoch": 3415} {"train_loss": -25.321495630654944, "global_step": 283527, "epoch": 3415, "val_loss": 7085955.0} {"train_loss": -23.97090721130371, "global_step": 283528, "epoch": 3416} {"train_loss": -23.865585327148438, "global_step": 283529, "epoch": 3416} {"train_loss": -24.79562759399414, "global_step": 283530, "epoch": 3416} {"train_loss": -24.560483932495117, "global_step": 283531, "epoch": 3416} {"train_loss": -24.350915908813477, "global_step": 283532, "epoch": 3416} {"train_loss": -25.31867027282715, "global_step": 283533, "epoch": 3416} {"train_loss": -24.937467575073242, "global_step": 283534, "epoch": 3416} {"train_loss": -24.640233993530273, "global_step": 283535, "epoch": 3416} {"train_loss": -25.001028060913086, "global_step": 283536, "epoch": 3416} {"train_loss": -24.855243682861328, "global_step": 283537, "epoch": 3416} {"train_loss": -25.437591552734375, "global_step": 283538, "epoch": 3416} {"train_loss": -25.157062530517578, "global_step": 283539, "epoch": 3416} {"train_loss": -25.364328384399414, "global_step": 283540, "epoch": 3416} {"train_loss": -25.379905700683594, "global_step": 283541, "epoch": 3416} {"train_loss": -25.115013122558594, "global_step": 283542, "epoch": 3416} {"train_loss": -24.787256240844727, "global_step": 283543, "epoch": 3416} {"train_loss": -25.171409606933594, "global_step": 283544, "epoch": 3416} {"train_loss": -24.99323844909668, "global_step": 283545, "epoch": 3416} {"train_loss": -25.108306884765625, "global_step": 283546, "epoch": 3416} {"train_loss": -24.988332748413086, "global_step": 283547, "epoch": 3416} {"train_loss": -25.5205135345459, "global_step": 283548, "epoch": 3416} {"train_loss": -25.31434440612793, "global_step": 283549, "epoch": 3416} {"train_loss": -25.58392906188965, "global_step": 283550, "epoch": 3416} {"train_loss": -25.19285011291504, "global_step": 283551, "epoch": 3416} {"train_loss": -25.34733772277832, "global_step": 283552, "epoch": 3416} {"train_loss": -25.007171630859375, "global_step": 283553, "epoch": 3416} {"train_loss": -25.3810977935791, "global_step": 283554, "epoch": 3416} {"train_loss": -25.604028701782227, "global_step": 283555, "epoch": 3416} {"train_loss": -25.506006240844727, "global_step": 283556, "epoch": 3416} {"train_loss": -25.349706649780273, "global_step": 283557, "epoch": 3416} {"train_loss": -25.179025650024414, "global_step": 283558, "epoch": 3416} {"train_loss": -25.634754180908203, "global_step": 283559, "epoch": 3416} {"train_loss": -25.535131454467773, "global_step": 283560, "epoch": 3416} {"train_loss": -25.42011070251465, "global_step": 283561, "epoch": 3416} {"train_loss": -25.056455612182617, "global_step": 283562, "epoch": 3416} {"train_loss": -25.642179489135742, "global_step": 283563, "epoch": 3416} {"train_loss": -25.62666130065918, "global_step": 283564, "epoch": 3416} {"train_loss": -25.522743225097656, "global_step": 283565, "epoch": 3416} {"train_loss": -25.512929916381836, "global_step": 283566, "epoch": 3416} {"train_loss": -25.745153427124023, "global_step": 283567, "epoch": 3416} {"train_loss": -25.90833854675293, "global_step": 283568, "epoch": 3416} {"train_loss": -25.38032341003418, "global_step": 283569, "epoch": 3416} {"train_loss": -25.594533920288086, "global_step": 283570, "epoch": 3416} {"train_loss": -25.7228946685791, "global_step": 283571, "epoch": 3416} {"train_loss": -25.59754753112793, "global_step": 283572, "epoch": 3416} {"train_loss": -25.567777633666992, "global_step": 283573, "epoch": 3416} {"train_loss": -25.7747802734375, "global_step": 283574, "epoch": 3416} {"train_loss": -25.547861099243164, "global_step": 283575, "epoch": 3416} {"train_loss": -25.666107177734375, "global_step": 283576, "epoch": 3416} {"train_loss": -25.87129020690918, "global_step": 283577, "epoch": 3416} {"train_loss": -25.882171630859375, "global_step": 283578, "epoch": 3416} {"train_loss": -25.77149772644043, "global_step": 283579, "epoch": 3416} {"train_loss": -25.732227325439453, "global_step": 283580, "epoch": 3416} {"train_loss": -25.63068199157715, "global_step": 283581, "epoch": 3416} {"train_loss": -25.7435302734375, "global_step": 283582, "epoch": 3416} {"train_loss": -25.177656173706055, "global_step": 283583, "epoch": 3416} {"train_loss": -25.15087127685547, "global_step": 283584, "epoch": 3416} {"train_loss": -24.9956111907959, "global_step": 283585, "epoch": 3416} {"train_loss": -25.398107528686523, "global_step": 283586, "epoch": 3416} {"train_loss": -25.505416870117188, "global_step": 283587, "epoch": 3416} {"train_loss": -25.207111358642578, "global_step": 283588, "epoch": 3416} {"train_loss": -25.16066551208496, "global_step": 283589, "epoch": 3416} {"train_loss": -25.750532150268555, "global_step": 283590, "epoch": 3416} {"train_loss": -25.096878051757812, "global_step": 283591, "epoch": 3416} {"train_loss": -25.65863037109375, "global_step": 283592, "epoch": 3416} {"train_loss": -25.30073356628418, "global_step": 283593, "epoch": 3416} {"train_loss": -25.79292106628418, "global_step": 283594, "epoch": 3416} {"train_loss": -25.54435157775879, "global_step": 283595, "epoch": 3416} {"train_loss": -25.698083877563477, "global_step": 283596, "epoch": 3416} {"train_loss": -25.563243865966797, "global_step": 283597, "epoch": 3416} {"train_loss": -25.604177474975586, "global_step": 283598, "epoch": 3416} {"train_loss": -25.279361724853516, "global_step": 283599, "epoch": 3416} {"train_loss": -25.76506996154785, "global_step": 283600, "epoch": 3416} {"train_loss": -25.69365882873535, "global_step": 283601, "epoch": 3416} {"train_loss": -25.188392639160156, "global_step": 283602, "epoch": 3416} {"train_loss": -25.558456420898438, "global_step": 283603, "epoch": 3416} {"train_loss": -25.712926864624023, "global_step": 283604, "epoch": 3416} {"train_loss": -25.3216609954834, "global_step": 283605, "epoch": 3416} {"train_loss": -25.774810791015625, "global_step": 283606, "epoch": 3416} {"train_loss": -25.295976638793945, "global_step": 283607, "epoch": 3416} {"train_loss": -25.56545639038086, "global_step": 283608, "epoch": 3416} {"train_loss": -25.930374145507812, "global_step": 283609, "epoch": 3416} {"train_loss": -25.34632728760501, "global_step": 283610, "epoch": 3416, "val_loss": 7075882.0} {"train_loss": -24.44417381286621, "global_step": 283611, "epoch": 3417} {"train_loss": -24.250452041625977, "global_step": 283612, "epoch": 3417} {"train_loss": -23.97943687438965, "global_step": 283613, "epoch": 3417} {"train_loss": -24.85381317138672, "global_step": 283614, "epoch": 3417} {"train_loss": -23.469085693359375, "global_step": 283615, "epoch": 3417} {"train_loss": -24.64920425415039, "global_step": 283616, "epoch": 3417} {"train_loss": -24.392282485961914, "global_step": 283617, "epoch": 3417} {"train_loss": -23.576753616333008, "global_step": 283618, "epoch": 3417} {"train_loss": -23.801435470581055, "global_step": 283619, "epoch": 3417} {"train_loss": -24.939830780029297, "global_step": 283620, "epoch": 3417} {"train_loss": -24.195499420166016, "global_step": 283621, "epoch": 3417} {"train_loss": -24.479490280151367, "global_step": 283622, "epoch": 3417} {"train_loss": -24.485300064086914, "global_step": 283623, "epoch": 3417} {"train_loss": -24.87051010131836, "global_step": 283624, "epoch": 3417} {"train_loss": -24.636310577392578, "global_step": 283625, "epoch": 3417} {"train_loss": -24.71673583984375, "global_step": 283626, "epoch": 3417} {"train_loss": -24.95722770690918, "global_step": 283627, "epoch": 3417} {"train_loss": -24.838651657104492, "global_step": 283628, "epoch": 3417} {"train_loss": -24.459735870361328, "global_step": 283629, "epoch": 3417} {"train_loss": -24.510284423828125, "global_step": 283630, "epoch": 3417} {"train_loss": -24.723508834838867, "global_step": 283631, "epoch": 3417} {"train_loss": -24.899227142333984, "global_step": 283632, "epoch": 3417} {"train_loss": -25.166940689086914, "global_step": 283633, "epoch": 3417} {"train_loss": -24.61116600036621, "global_step": 283634, "epoch": 3417} {"train_loss": -24.99172019958496, "global_step": 283635, "epoch": 3417} {"train_loss": -25.23064613342285, "global_step": 283636, "epoch": 3417} {"train_loss": -25.018951416015625, "global_step": 283637, "epoch": 3417} {"train_loss": -24.831167221069336, "global_step": 283638, "epoch": 3417} {"train_loss": -25.09973907470703, "global_step": 283639, "epoch": 3417} {"train_loss": -25.04888916015625, "global_step": 283640, "epoch": 3417} {"train_loss": -25.222646713256836, "global_step": 283641, "epoch": 3417} {"train_loss": -25.231212615966797, "global_step": 283642, "epoch": 3417} {"train_loss": -24.846498489379883, "global_step": 283643, "epoch": 3417} {"train_loss": -25.367279052734375, "global_step": 283644, "epoch": 3417} {"train_loss": -25.542516708374023, "global_step": 283645, "epoch": 3417} {"train_loss": -25.335285186767578, "global_step": 283646, "epoch": 3417} {"train_loss": -25.37335777282715, "global_step": 283647, "epoch": 3417} {"train_loss": -25.44856071472168, "global_step": 283648, "epoch": 3417} {"train_loss": -25.827564239501953, "global_step": 283649, "epoch": 3417} {"train_loss": -25.24909782409668, "global_step": 283650, "epoch": 3417} {"train_loss": -25.621936798095703, "global_step": 283651, "epoch": 3417} {"train_loss": -25.577306747436523, "global_step": 283652, "epoch": 3417} {"train_loss": -25.29609489440918, "global_step": 283653, "epoch": 3417} {"train_loss": -25.612274169921875, "global_step": 283654, "epoch": 3417} {"train_loss": -25.27065086364746, "global_step": 283655, "epoch": 3417} {"train_loss": -25.187458038330078, "global_step": 283656, "epoch": 3417} {"train_loss": -25.05828094482422, "global_step": 283657, "epoch": 3417} {"train_loss": -25.206735610961914, "global_step": 283658, "epoch": 3417} {"train_loss": -25.11290740966797, "global_step": 283659, "epoch": 3417} {"train_loss": -25.11036491394043, "global_step": 283660, "epoch": 3417} {"train_loss": -25.7828426361084, "global_step": 283661, "epoch": 3417} {"train_loss": -25.041873931884766, "global_step": 283662, "epoch": 3417} {"train_loss": -25.480987548828125, "global_step": 283663, "epoch": 3417} {"train_loss": -25.420072555541992, "global_step": 283664, "epoch": 3417} {"train_loss": -25.700286865234375, "global_step": 283665, "epoch": 3417} {"train_loss": -25.422094345092773, "global_step": 283666, "epoch": 3417} {"train_loss": -25.08078384399414, "global_step": 283667, "epoch": 3417} {"train_loss": -25.281753540039062, "global_step": 283668, "epoch": 3417} {"train_loss": -25.630512237548828, "global_step": 283669, "epoch": 3417} {"train_loss": -25.722394943237305, "global_step": 283670, "epoch": 3417} {"train_loss": -25.235702514648438, "global_step": 283671, "epoch": 3417} {"train_loss": -25.127073287963867, "global_step": 283672, "epoch": 3417} {"train_loss": -25.4388370513916, "global_step": 283673, "epoch": 3417} {"train_loss": -25.085824966430664, "global_step": 283674, "epoch": 3417} {"train_loss": -25.183944702148438, "global_step": 283675, "epoch": 3417} {"train_loss": -24.846914291381836, "global_step": 283676, "epoch": 3417} {"train_loss": -24.825082778930664, "global_step": 283677, "epoch": 3417} {"train_loss": -25.141767501831055, "global_step": 283678, "epoch": 3417} {"train_loss": -25.01881980895996, "global_step": 283679, "epoch": 3417} {"train_loss": -24.875457763671875, "global_step": 283680, "epoch": 3417} {"train_loss": -25.338171005249023, "global_step": 283681, "epoch": 3417} {"train_loss": -25.439016342163086, "global_step": 283682, "epoch": 3417} {"train_loss": -25.032773971557617, "global_step": 283683, "epoch": 3417} {"train_loss": -25.466190338134766, "global_step": 283684, "epoch": 3417} {"train_loss": -25.45655059814453, "global_step": 283685, "epoch": 3417} {"train_loss": -25.570547103881836, "global_step": 283686, "epoch": 3417} {"train_loss": -25.11795997619629, "global_step": 283687, "epoch": 3417} {"train_loss": -25.47783851623535, "global_step": 283688, "epoch": 3417} {"train_loss": -25.049535751342773, "global_step": 283689, "epoch": 3417} {"train_loss": -25.085540771484375, "global_step": 283690, "epoch": 3417} {"train_loss": -25.758630752563477, "global_step": 283691, "epoch": 3417} {"train_loss": -25.94233512878418, "global_step": 283692, "epoch": 3417} {"train_loss": -25.078611649662616, "global_step": 283693, "epoch": 3417, "val_loss": 7086280.0} {"train_loss": -23.36262321472168, "global_step": 283694, "epoch": 3418} {"train_loss": -23.537050247192383, "global_step": 283695, "epoch": 3418} {"train_loss": -25.06325340270996, "global_step": 283696, "epoch": 3418} {"train_loss": -23.743408203125, "global_step": 283697, "epoch": 3418} {"train_loss": -24.261188507080078, "global_step": 283698, "epoch": 3418} {"train_loss": -24.580846786499023, "global_step": 283699, "epoch": 3418} {"train_loss": -24.529468536376953, "global_step": 283700, "epoch": 3418} {"train_loss": -24.921724319458008, "global_step": 283701, "epoch": 3418} {"train_loss": -24.47015953063965, "global_step": 283702, "epoch": 3418} {"train_loss": -24.6123046875, "global_step": 283703, "epoch": 3418} {"train_loss": -25.006591796875, "global_step": 283704, "epoch": 3418} {"train_loss": -24.8142147064209, "global_step": 283705, "epoch": 3418} {"train_loss": -24.983837127685547, "global_step": 283706, "epoch": 3418} {"train_loss": -25.178686141967773, "global_step": 283707, "epoch": 3418} {"train_loss": -24.866552352905273, "global_step": 283708, "epoch": 3418} {"train_loss": -25.203834533691406, "global_step": 283709, "epoch": 3418} {"train_loss": -24.88532066345215, "global_step": 283710, "epoch": 3418} {"train_loss": -25.07097816467285, "global_step": 283711, "epoch": 3418} {"train_loss": -24.68306541442871, "global_step": 283712, "epoch": 3418} {"train_loss": -24.923715591430664, "global_step": 283713, "epoch": 3418} {"train_loss": -24.85200309753418, "global_step": 283714, "epoch": 3418} {"train_loss": -25.158580780029297, "global_step": 283715, "epoch": 3418} {"train_loss": -25.289539337158203, "global_step": 283716, "epoch": 3418} {"train_loss": -25.10731315612793, "global_step": 283717, "epoch": 3418} {"train_loss": -25.159961700439453, "global_step": 283718, "epoch": 3418} {"train_loss": -25.28883934020996, "global_step": 283719, "epoch": 3418} {"train_loss": -25.16668128967285, "global_step": 283720, "epoch": 3418} {"train_loss": -25.28481101989746, "global_step": 283721, "epoch": 3418} {"train_loss": -25.38959312438965, "global_step": 283722, "epoch": 3418} {"train_loss": -25.131994247436523, "global_step": 283723, "epoch": 3418} {"train_loss": -25.324356079101562, "global_step": 283724, "epoch": 3418} {"train_loss": -25.442888259887695, "global_step": 283725, "epoch": 3418} {"train_loss": -25.646224975585938, "global_step": 283726, "epoch": 3418} {"train_loss": -25.62261962890625, "global_step": 283727, "epoch": 3418} {"train_loss": -25.58046531677246, "global_step": 283728, "epoch": 3418} {"train_loss": -25.527145385742188, "global_step": 283729, "epoch": 3418} {"train_loss": -25.658105850219727, "global_step": 283730, "epoch": 3418} {"train_loss": -25.60218620300293, "global_step": 283731, "epoch": 3418} {"train_loss": -25.919635772705078, "global_step": 283732, "epoch": 3418} {"train_loss": -25.689502716064453, "global_step": 283733, "epoch": 3418} {"train_loss": -25.60518455505371, "global_step": 283734, "epoch": 3418} {"train_loss": -25.49612808227539, "global_step": 283735, "epoch": 3418} {"train_loss": -25.652053833007812, "global_step": 283736, "epoch": 3418} {"train_loss": -25.57526969909668, "global_step": 283737, "epoch": 3418} {"train_loss": -25.52370834350586, "global_step": 283738, "epoch": 3418} {"train_loss": -25.478164672851562, "global_step": 283739, "epoch": 3418} {"train_loss": -25.60736083984375, "global_step": 283740, "epoch": 3418} {"train_loss": -25.396814346313477, "global_step": 283741, "epoch": 3418} {"train_loss": -25.665063858032227, "global_step": 283742, "epoch": 3418} {"train_loss": -25.650365829467773, "global_step": 283743, "epoch": 3418} {"train_loss": -25.682666778564453, "global_step": 283744, "epoch": 3418} {"train_loss": -25.601072311401367, "global_step": 283745, "epoch": 3418} {"train_loss": -25.449987411499023, "global_step": 283746, "epoch": 3418} {"train_loss": -25.5087890625, "global_step": 283747, "epoch": 3418} {"train_loss": -25.858423233032227, "global_step": 283748, "epoch": 3418} {"train_loss": -25.868213653564453, "global_step": 283749, "epoch": 3418} {"train_loss": -25.491912841796875, "global_step": 283750, "epoch": 3418} {"train_loss": -25.443506240844727, "global_step": 283751, "epoch": 3418} {"train_loss": -25.48652458190918, "global_step": 283752, "epoch": 3418} {"train_loss": -25.056787490844727, "global_step": 283753, "epoch": 3418} {"train_loss": -25.30063819885254, "global_step": 283754, "epoch": 3418} {"train_loss": -25.311569213867188, "global_step": 283755, "epoch": 3418} {"train_loss": -25.371410369873047, "global_step": 283756, "epoch": 3418} {"train_loss": -25.384828567504883, "global_step": 283757, "epoch": 3418} {"train_loss": -25.11802101135254, "global_step": 283758, "epoch": 3418} {"train_loss": -24.620426177978516, "global_step": 283759, "epoch": 3418} {"train_loss": -24.512388229370117, "global_step": 283760, "epoch": 3418} {"train_loss": -25.441648483276367, "global_step": 283761, "epoch": 3418} {"train_loss": -24.61547088623047, "global_step": 283762, "epoch": 3418} {"train_loss": -25.05286979675293, "global_step": 283763, "epoch": 3418} {"train_loss": -25.335031509399414, "global_step": 283764, "epoch": 3418} {"train_loss": -25.3599853515625, "global_step": 283765, "epoch": 3418} {"train_loss": -25.06637954711914, "global_step": 283766, "epoch": 3418} {"train_loss": -25.570547103881836, "global_step": 283767, "epoch": 3418} {"train_loss": -25.317520141601562, "global_step": 283768, "epoch": 3418} {"train_loss": -25.28787612915039, "global_step": 283769, "epoch": 3418} {"train_loss": -25.240467071533203, "global_step": 283770, "epoch": 3418} {"train_loss": -25.118892669677734, "global_step": 283771, "epoch": 3418} {"train_loss": -25.499242782592773, "global_step": 283772, "epoch": 3418} {"train_loss": -25.462902069091797, "global_step": 283773, "epoch": 3418} {"train_loss": -25.089868545532227, "global_step": 283774, "epoch": 3418} {"train_loss": -25.685033798217773, "global_step": 283775, "epoch": 3418} {"train_loss": -25.183529704450123, "global_step": 283776, "epoch": 3418, "val_loss": 7229617.0} {"train_loss": -24.726877212524414, "global_step": 283777, "epoch": 3419} {"train_loss": -24.5968017578125, "global_step": 283778, "epoch": 3419} {"train_loss": -25.607152938842773, "global_step": 283779, "epoch": 3419} {"train_loss": -25.012460708618164, "global_step": 283780, "epoch": 3419} {"train_loss": -25.142534255981445, "global_step": 283781, "epoch": 3419} {"train_loss": -25.110288619995117, "global_step": 283782, "epoch": 3419} {"train_loss": -25.436019897460938, "global_step": 283783, "epoch": 3419} {"train_loss": -24.91976547241211, "global_step": 283784, "epoch": 3419} {"train_loss": -25.653669357299805, "global_step": 283785, "epoch": 3419} {"train_loss": -24.820343017578125, "global_step": 283786, "epoch": 3419} {"train_loss": -24.996002197265625, "global_step": 283787, "epoch": 3419} {"train_loss": -24.99301528930664, "global_step": 283788, "epoch": 3419} {"train_loss": -25.23674774169922, "global_step": 283789, "epoch": 3419} {"train_loss": -25.332143783569336, "global_step": 283790, "epoch": 3419} {"train_loss": -25.495975494384766, "global_step": 283791, "epoch": 3419} {"train_loss": -25.16219139099121, "global_step": 283792, "epoch": 3419} {"train_loss": -25.644872665405273, "global_step": 283793, "epoch": 3419} {"train_loss": -25.0780086517334, "global_step": 283794, "epoch": 3419} {"train_loss": -25.47072410583496, "global_step": 283795, "epoch": 3419} {"train_loss": -25.177433013916016, "global_step": 283796, "epoch": 3419} {"train_loss": -25.14217185974121, "global_step": 283797, "epoch": 3419} {"train_loss": -25.4721622467041, "global_step": 283798, "epoch": 3419} {"train_loss": -25.144399642944336, "global_step": 283799, "epoch": 3419} {"train_loss": -25.61025047302246, "global_step": 283800, "epoch": 3419} {"train_loss": -25.571714401245117, "global_step": 283801, "epoch": 3419} {"train_loss": -25.387714385986328, "global_step": 283802, "epoch": 3419} {"train_loss": -25.65457534790039, "global_step": 283803, "epoch": 3419} {"train_loss": -25.3603572845459, "global_step": 283804, "epoch": 3419} {"train_loss": -25.370542526245117, "global_step": 283805, "epoch": 3419} {"train_loss": -25.194684982299805, "global_step": 283806, "epoch": 3419} {"train_loss": -25.271005630493164, "global_step": 283807, "epoch": 3419} {"train_loss": -25.387197494506836, "global_step": 283808, "epoch": 3419} {"train_loss": -25.24810218811035, "global_step": 283809, "epoch": 3419} {"train_loss": -25.53803062438965, "global_step": 283810, "epoch": 3419} {"train_loss": -24.96933364868164, "global_step": 283811, "epoch": 3419} {"train_loss": -25.69504737854004, "global_step": 283812, "epoch": 3419} {"train_loss": -25.71003532409668, "global_step": 283813, "epoch": 3419} {"train_loss": -25.500198364257812, "global_step": 283814, "epoch": 3419} {"train_loss": -25.472763061523438, "global_step": 283815, "epoch": 3419} {"train_loss": -25.303407669067383, "global_step": 283816, "epoch": 3419} {"train_loss": -25.39630699157715, "global_step": 283817, "epoch": 3419} {"train_loss": -25.454763412475586, "global_step": 283818, "epoch": 3419} {"train_loss": -25.696292877197266, "global_step": 283819, "epoch": 3419} {"train_loss": -25.878559112548828, "global_step": 283820, "epoch": 3419} {"train_loss": -25.476295471191406, "global_step": 283821, "epoch": 3419} {"train_loss": -25.940763473510742, "global_step": 283822, "epoch": 3419} {"train_loss": -25.200603485107422, "global_step": 283823, "epoch": 3419} {"train_loss": -25.652830123901367, "global_step": 283824, "epoch": 3419} {"train_loss": -25.924840927124023, "global_step": 283825, "epoch": 3419} {"train_loss": -25.467180252075195, "global_step": 283826, "epoch": 3419} {"train_loss": -25.40079116821289, "global_step": 283827, "epoch": 3419} {"train_loss": -25.150785446166992, "global_step": 283828, "epoch": 3419} {"train_loss": -25.13347816467285, "global_step": 283829, "epoch": 3419} {"train_loss": -25.260616302490234, "global_step": 283830, "epoch": 3419} {"train_loss": -25.206361770629883, "global_step": 283831, "epoch": 3419} {"train_loss": -25.19114112854004, "global_step": 283832, "epoch": 3419} {"train_loss": -25.430021286010742, "global_step": 283833, "epoch": 3419} {"train_loss": -25.30191993713379, "global_step": 283834, "epoch": 3419} {"train_loss": -25.216487884521484, "global_step": 283835, "epoch": 3419} {"train_loss": -25.173263549804688, "global_step": 283836, "epoch": 3419} {"train_loss": -25.467350006103516, "global_step": 283837, "epoch": 3419} {"train_loss": -25.14479637145996, "global_step": 283838, "epoch": 3419} {"train_loss": -25.421186447143555, "global_step": 283839, "epoch": 3419} {"train_loss": -25.111236572265625, "global_step": 283840, "epoch": 3419} {"train_loss": -25.471298217773438, "global_step": 283841, "epoch": 3419} {"train_loss": -25.032567977905273, "global_step": 283842, "epoch": 3419} {"train_loss": -25.313329696655273, "global_step": 283843, "epoch": 3419} {"train_loss": -25.38361167907715, "global_step": 283844, "epoch": 3419} {"train_loss": -25.335508346557617, "global_step": 283845, "epoch": 3419} {"train_loss": -25.42793846130371, "global_step": 283846, "epoch": 3419} {"train_loss": -25.48778533935547, "global_step": 283847, "epoch": 3419} {"train_loss": -25.328454971313477, "global_step": 283848, "epoch": 3419} {"train_loss": -25.43050193786621, "global_step": 283849, "epoch": 3419} {"train_loss": -25.606510162353516, "global_step": 283850, "epoch": 3419} {"train_loss": -25.747541427612305, "global_step": 283851, "epoch": 3419} {"train_loss": -25.337865829467773, "global_step": 283852, "epoch": 3419} {"train_loss": -25.74725341796875, "global_step": 283853, "epoch": 3419} {"train_loss": -25.475141525268555, "global_step": 283854, "epoch": 3419} {"train_loss": -25.673124313354492, "global_step": 283855, "epoch": 3419} {"train_loss": -25.63858413696289, "global_step": 283856, "epoch": 3419} {"train_loss": -25.6536922454834, "global_step": 283857, "epoch": 3419} {"train_loss": -25.712814331054688, "global_step": 283858, "epoch": 3419} {"train_loss": -25.36816107508648, "global_step": 283859, "epoch": 3419, "val_loss": 6988443.5} {"train_loss": -24.96393394470215, "global_step": 283860, "epoch": 3420} {"train_loss": -25.349245071411133, "global_step": 283861, "epoch": 3420} {"train_loss": -25.451013565063477, "global_step": 283862, "epoch": 3420} {"train_loss": -25.33962059020996, "global_step": 283863, "epoch": 3420} {"train_loss": -24.949941635131836, "global_step": 283864, "epoch": 3420} {"train_loss": -24.961872100830078, "global_step": 283865, "epoch": 3420} {"train_loss": -25.578489303588867, "global_step": 283866, "epoch": 3420} {"train_loss": -25.277557373046875, "global_step": 283867, "epoch": 3420} {"train_loss": -25.37142562866211, "global_step": 283868, "epoch": 3420} {"train_loss": -25.032569885253906, "global_step": 283869, "epoch": 3420} {"train_loss": -25.439056396484375, "global_step": 283870, "epoch": 3420} {"train_loss": -25.296472549438477, "global_step": 283871, "epoch": 3420} {"train_loss": -25.428836822509766, "global_step": 283872, "epoch": 3420} {"train_loss": -25.681005477905273, "global_step": 283873, "epoch": 3420} {"train_loss": -25.501266479492188, "global_step": 283874, "epoch": 3420} {"train_loss": -25.28340721130371, "global_step": 283875, "epoch": 3420} {"train_loss": -25.256500244140625, "global_step": 283876, "epoch": 3420} {"train_loss": -25.350399017333984, "global_step": 283877, "epoch": 3420} {"train_loss": -25.444021224975586, "global_step": 283878, "epoch": 3420} {"train_loss": -25.642719268798828, "global_step": 283879, "epoch": 3420} {"train_loss": -25.577423095703125, "global_step": 283880, "epoch": 3420} {"train_loss": -25.791818618774414, "global_step": 283881, "epoch": 3420} {"train_loss": -25.085676193237305, "global_step": 283882, "epoch": 3420} {"train_loss": -25.225683212280273, "global_step": 283883, "epoch": 3420} {"train_loss": -25.557340621948242, "global_step": 283884, "epoch": 3420} {"train_loss": -25.397504806518555, "global_step": 283885, "epoch": 3420} {"train_loss": -25.3037166595459, "global_step": 283886, "epoch": 3420} {"train_loss": -25.366031646728516, "global_step": 283887, "epoch": 3420} {"train_loss": -25.315113067626953, "global_step": 283888, "epoch": 3420} {"train_loss": -25.663516998291016, "global_step": 283889, "epoch": 3420} {"train_loss": -25.8181095123291, "global_step": 283890, "epoch": 3420} {"train_loss": -25.67453384399414, "global_step": 283891, "epoch": 3420} {"train_loss": -25.812421798706055, "global_step": 283892, "epoch": 3420} {"train_loss": -25.637243270874023, "global_step": 283893, "epoch": 3420} {"train_loss": -25.633264541625977, "global_step": 283894, "epoch": 3420} {"train_loss": -25.223615646362305, "global_step": 283895, "epoch": 3420} {"train_loss": -25.463436126708984, "global_step": 283896, "epoch": 3420} {"train_loss": -25.593734741210938, "global_step": 283897, "epoch": 3420} {"train_loss": -25.425851821899414, "global_step": 283898, "epoch": 3420} {"train_loss": -26.014211654663086, "global_step": 283899, "epoch": 3420} {"train_loss": -25.65940284729004, "global_step": 283900, "epoch": 3420} {"train_loss": -25.59454345703125, "global_step": 283901, "epoch": 3420} {"train_loss": -25.66981315612793, "global_step": 283902, "epoch": 3420} {"train_loss": -25.53339385986328, "global_step": 283903, "epoch": 3420} {"train_loss": -25.664127349853516, "global_step": 283904, "epoch": 3420} {"train_loss": -25.48322868347168, "global_step": 283905, "epoch": 3420} {"train_loss": -25.23828125, "global_step": 283906, "epoch": 3420} {"train_loss": -25.455827713012695, "global_step": 283907, "epoch": 3420} {"train_loss": -25.588943481445312, "global_step": 283908, "epoch": 3420} {"train_loss": -25.612354278564453, "global_step": 283909, "epoch": 3420} {"train_loss": -25.345090866088867, "global_step": 283910, "epoch": 3420} {"train_loss": -25.366233825683594, "global_step": 283911, "epoch": 3420} {"train_loss": -25.643457412719727, "global_step": 283912, "epoch": 3420} {"train_loss": -25.051477432250977, "global_step": 283913, "epoch": 3420} {"train_loss": -24.919157028198242, "global_step": 283914, "epoch": 3420} {"train_loss": -24.452695846557617, "global_step": 283915, "epoch": 3420} {"train_loss": -25.271934509277344, "global_step": 283916, "epoch": 3420} {"train_loss": -25.43059730529785, "global_step": 283917, "epoch": 3420} {"train_loss": -25.557947158813477, "global_step": 283918, "epoch": 3420} {"train_loss": -24.940048217773438, "global_step": 283919, "epoch": 3420} {"train_loss": -25.20193862915039, "global_step": 283920, "epoch": 3420} {"train_loss": -25.12537956237793, "global_step": 283921, "epoch": 3420} {"train_loss": -25.14801788330078, "global_step": 283922, "epoch": 3420} {"train_loss": -25.386032104492188, "global_step": 283923, "epoch": 3420} {"train_loss": -25.28590965270996, "global_step": 283924, "epoch": 3420} {"train_loss": -25.171192169189453, "global_step": 283925, "epoch": 3420} {"train_loss": -25.342199325561523, "global_step": 283926, "epoch": 3420} {"train_loss": -25.488590240478516, "global_step": 283927, "epoch": 3420} {"train_loss": -25.496728897094727, "global_step": 283928, "epoch": 3420} {"train_loss": -25.457611083984375, "global_step": 283929, "epoch": 3420} {"train_loss": -25.596921920776367, "global_step": 283930, "epoch": 3420} {"train_loss": -25.515005111694336, "global_step": 283931, "epoch": 3420} {"train_loss": -25.19052505493164, "global_step": 283932, "epoch": 3420} {"train_loss": -25.302717208862305, "global_step": 283933, "epoch": 3420} {"train_loss": -25.28243064880371, "global_step": 283934, "epoch": 3420} {"train_loss": -25.405149459838867, "global_step": 283935, "epoch": 3420} {"train_loss": -25.344493865966797, "global_step": 283936, "epoch": 3420} {"train_loss": -25.7109317779541, "global_step": 283937, "epoch": 3420} {"train_loss": -25.680891036987305, "global_step": 283938, "epoch": 3420} {"train_loss": -26.112701416015625, "global_step": 283939, "epoch": 3420} {"train_loss": -25.49688720703125, "global_step": 283940, "epoch": 3420} {"train_loss": -25.312606811523438, "global_step": 283941, "epoch": 3420} {"train_loss": -25.410701131246174, "global_step": 283942, "epoch": 3420, "val_loss": 7077829.5} {"train_loss": -25.527915954589844, "global_step": 283943, "epoch": 3421} {"train_loss": -25.02193260192871, "global_step": 283944, "epoch": 3421} {"train_loss": -25.212759017944336, "global_step": 283945, "epoch": 3421} {"train_loss": -25.097742080688477, "global_step": 283946, "epoch": 3421} {"train_loss": -25.37525749206543, "global_step": 283947, "epoch": 3421} {"train_loss": -25.331130981445312, "global_step": 283948, "epoch": 3421} {"train_loss": -25.243213653564453, "global_step": 283949, "epoch": 3421} {"train_loss": -25.216279983520508, "global_step": 283950, "epoch": 3421} {"train_loss": -25.258625030517578, "global_step": 283951, "epoch": 3421} {"train_loss": -25.56879997253418, "global_step": 283952, "epoch": 3421} {"train_loss": -25.393295288085938, "global_step": 283953, "epoch": 3421} {"train_loss": -25.503171920776367, "global_step": 283954, "epoch": 3421} {"train_loss": -25.13129997253418, "global_step": 283955, "epoch": 3421} {"train_loss": -25.457685470581055, "global_step": 283956, "epoch": 3421} {"train_loss": -25.53538703918457, "global_step": 283957, "epoch": 3421} {"train_loss": -24.990802764892578, "global_step": 283958, "epoch": 3421} {"train_loss": -25.1713924407959, "global_step": 283959, "epoch": 3421} {"train_loss": -25.442777633666992, "global_step": 283960, "epoch": 3421} {"train_loss": -25.219175338745117, "global_step": 283961, "epoch": 3421} {"train_loss": -25.338871002197266, "global_step": 283962, "epoch": 3421} {"train_loss": -25.4576358795166, "global_step": 283963, "epoch": 3421} {"train_loss": -25.623533248901367, "global_step": 283964, "epoch": 3421} {"train_loss": -25.08257293701172, "global_step": 283965, "epoch": 3421} {"train_loss": -25.137191772460938, "global_step": 283966, "epoch": 3421} {"train_loss": -25.656009674072266, "global_step": 283967, "epoch": 3421} {"train_loss": -25.39944839477539, "global_step": 283968, "epoch": 3421} {"train_loss": -25.4083309173584, "global_step": 283969, "epoch": 3421} {"train_loss": -25.637298583984375, "global_step": 283970, "epoch": 3421} {"train_loss": -25.530792236328125, "global_step": 283971, "epoch": 3421} {"train_loss": -24.824201583862305, "global_step": 283972, "epoch": 3421} {"train_loss": -25.31777000427246, "global_step": 283973, "epoch": 3421} {"train_loss": -25.53350257873535, "global_step": 283974, "epoch": 3421} {"train_loss": -25.265411376953125, "global_step": 283975, "epoch": 3421} {"train_loss": -25.08997917175293, "global_step": 283976, "epoch": 3421} {"train_loss": -25.666589736938477, "global_step": 283977, "epoch": 3421} {"train_loss": -25.654897689819336, "global_step": 283978, "epoch": 3421} {"train_loss": -25.80720329284668, "global_step": 283979, "epoch": 3421} {"train_loss": -25.324851989746094, "global_step": 283980, "epoch": 3421} {"train_loss": -25.254907608032227, "global_step": 283981, "epoch": 3421} {"train_loss": -25.47763442993164, "global_step": 283982, "epoch": 3421} {"train_loss": -25.367206573486328, "global_step": 283983, "epoch": 3421} {"train_loss": -25.86663818359375, "global_step": 283984, "epoch": 3421} {"train_loss": -25.455854415893555, "global_step": 283985, "epoch": 3421} {"train_loss": -25.163179397583008, "global_step": 283986, "epoch": 3421} {"train_loss": -25.57570457458496, "global_step": 283987, "epoch": 3421} {"train_loss": -25.473268508911133, "global_step": 283988, "epoch": 3421} {"train_loss": -25.416242599487305, "global_step": 283989, "epoch": 3421} {"train_loss": -25.702747344970703, "global_step": 283990, "epoch": 3421} {"train_loss": -25.350391387939453, "global_step": 283991, "epoch": 3421} {"train_loss": -25.644886016845703, "global_step": 283992, "epoch": 3421} {"train_loss": -25.531728744506836, "global_step": 283993, "epoch": 3421} {"train_loss": -25.631301879882812, "global_step": 283994, "epoch": 3421} {"train_loss": -25.068342208862305, "global_step": 283995, "epoch": 3421} {"train_loss": -25.176435470581055, "global_step": 283996, "epoch": 3421} {"train_loss": -25.474735260009766, "global_step": 283997, "epoch": 3421} {"train_loss": -25.3382511138916, "global_step": 283998, "epoch": 3421} {"train_loss": -24.773597717285156, "global_step": 283999, "epoch": 3421} {"train_loss": -25.442520141601562, "global_step": 284000, "epoch": 3421} {"train_loss": -25.69093132019043, "global_step": 284001, "epoch": 3421} {"train_loss": -25.3494815826416, "global_step": 284002, "epoch": 3421} {"train_loss": -25.249217987060547, "global_step": 284003, "epoch": 3421} {"train_loss": -25.593923568725586, "global_step": 284004, "epoch": 3421} {"train_loss": -25.16566276550293, "global_step": 284005, "epoch": 3421} {"train_loss": -24.96771812438965, "global_step": 284006, "epoch": 3421} {"train_loss": -24.59067153930664, "global_step": 284007, "epoch": 3421} {"train_loss": -25.508010864257812, "global_step": 284008, "epoch": 3421} {"train_loss": -25.141752243041992, "global_step": 284009, "epoch": 3421} {"train_loss": -25.30135154724121, "global_step": 284010, "epoch": 3421} {"train_loss": -25.5051326751709, "global_step": 284011, "epoch": 3421} {"train_loss": -25.2095947265625, "global_step": 284012, "epoch": 3421} {"train_loss": -25.409709930419922, "global_step": 284013, "epoch": 3421} {"train_loss": -24.96836280822754, "global_step": 284014, "epoch": 3421} {"train_loss": -25.692724227905273, "global_step": 284015, "epoch": 3421} {"train_loss": -25.11920166015625, "global_step": 284016, "epoch": 3421} {"train_loss": -25.453702926635742, "global_step": 284017, "epoch": 3421} {"train_loss": -25.46455955505371, "global_step": 284018, "epoch": 3421} {"train_loss": -25.387861251831055, "global_step": 284019, "epoch": 3421} {"train_loss": -25.363983154296875, "global_step": 284020, "epoch": 3421} {"train_loss": -25.684890747070312, "global_step": 284021, "epoch": 3421} {"train_loss": -25.468040466308594, "global_step": 284022, "epoch": 3421} {"train_loss": -25.543045043945312, "global_step": 284023, "epoch": 3421} {"train_loss": -25.30970573425293, "global_step": 284024, "epoch": 3421} {"train_loss": -25.364891534828278, "global_step": 284025, "epoch": 3421, "val_loss": 6989852.0} {"train_loss": -25.39609718322754, "global_step": 284026, "epoch": 3422} {"train_loss": -25.164466857910156, "global_step": 284027, "epoch": 3422} {"train_loss": -25.22926902770996, "global_step": 284028, "epoch": 3422} {"train_loss": -25.034442901611328, "global_step": 284029, "epoch": 3422} {"train_loss": -24.522897720336914, "global_step": 284030, "epoch": 3422} {"train_loss": -25.329870223999023, "global_step": 284031, "epoch": 3422} {"train_loss": -25.410865783691406, "global_step": 284032, "epoch": 3422} {"train_loss": -25.22203254699707, "global_step": 284033, "epoch": 3422} {"train_loss": -25.490880966186523, "global_step": 284034, "epoch": 3422} {"train_loss": -25.37601661682129, "global_step": 284035, "epoch": 3422} {"train_loss": -25.45448112487793, "global_step": 284036, "epoch": 3422} {"train_loss": -25.41028594970703, "global_step": 284037, "epoch": 3422} {"train_loss": -25.454113006591797, "global_step": 284038, "epoch": 3422} {"train_loss": -25.74078369140625, "global_step": 284039, "epoch": 3422} {"train_loss": -25.290891647338867, "global_step": 284040, "epoch": 3422} {"train_loss": -25.183122634887695, "global_step": 284041, "epoch": 3422} {"train_loss": -25.98224449157715, "global_step": 284042, "epoch": 3422} {"train_loss": -25.719079971313477, "global_step": 284043, "epoch": 3422} {"train_loss": -25.58726692199707, "global_step": 284044, "epoch": 3422} {"train_loss": -25.22193717956543, "global_step": 284045, "epoch": 3422} {"train_loss": -25.468122482299805, "global_step": 284046, "epoch": 3422} {"train_loss": -25.286630630493164, "global_step": 284047, "epoch": 3422} {"train_loss": -25.320886611938477, "global_step": 284048, "epoch": 3422} {"train_loss": -25.66391372680664, "global_step": 284049, "epoch": 3422} {"train_loss": -25.482053756713867, "global_step": 284050, "epoch": 3422} {"train_loss": -25.40821647644043, "global_step": 284051, "epoch": 3422} {"train_loss": -25.678512573242188, "global_step": 284052, "epoch": 3422} {"train_loss": -25.498746871948242, "global_step": 284053, "epoch": 3422} {"train_loss": -25.3876953125, "global_step": 284054, "epoch": 3422} {"train_loss": -25.464675903320312, "global_step": 284055, "epoch": 3422} {"train_loss": -25.527870178222656, "global_step": 284056, "epoch": 3422} {"train_loss": -25.1980037689209, "global_step": 284057, "epoch": 3422} {"train_loss": -25.43892478942871, "global_step": 284058, "epoch": 3422} {"train_loss": -25.435626983642578, "global_step": 284059, "epoch": 3422} {"train_loss": -25.465673446655273, "global_step": 284060, "epoch": 3422} {"train_loss": -25.1529483795166, "global_step": 284061, "epoch": 3422} {"train_loss": -25.6352596282959, "global_step": 284062, "epoch": 3422} {"train_loss": -25.52522850036621, "global_step": 284063, "epoch": 3422} {"train_loss": -25.261964797973633, "global_step": 284064, "epoch": 3422} {"train_loss": -25.49382972717285, "global_step": 284065, "epoch": 3422} {"train_loss": -25.517580032348633, "global_step": 284066, "epoch": 3422} {"train_loss": -25.507251739501953, "global_step": 284067, "epoch": 3422} {"train_loss": -25.429439544677734, "global_step": 284068, "epoch": 3422} {"train_loss": -25.61665153503418, "global_step": 284069, "epoch": 3422} {"train_loss": -25.8297061920166, "global_step": 284070, "epoch": 3422} {"train_loss": -25.501537322998047, "global_step": 284071, "epoch": 3422} {"train_loss": -25.51752281188965, "global_step": 284072, "epoch": 3422} {"train_loss": -25.51932716369629, "global_step": 284073, "epoch": 3422} {"train_loss": -25.182416915893555, "global_step": 284074, "epoch": 3422} {"train_loss": -25.579660415649414, "global_step": 284075, "epoch": 3422} {"train_loss": -25.20429039001465, "global_step": 284076, "epoch": 3422} {"train_loss": -25.550363540649414, "global_step": 284077, "epoch": 3422} {"train_loss": -25.50971794128418, "global_step": 284078, "epoch": 3422} {"train_loss": -25.76873779296875, "global_step": 284079, "epoch": 3422} {"train_loss": -25.352970123291016, "global_step": 284080, "epoch": 3422} {"train_loss": -25.711698532104492, "global_step": 284081, "epoch": 3422} {"train_loss": -25.5151309967041, "global_step": 284082, "epoch": 3422} {"train_loss": -25.492677688598633, "global_step": 284083, "epoch": 3422} {"train_loss": -25.3197078704834, "global_step": 284084, "epoch": 3422} {"train_loss": -25.635290145874023, "global_step": 284085, "epoch": 3422} {"train_loss": -25.502216339111328, "global_step": 284086, "epoch": 3422} {"train_loss": -25.75247573852539, "global_step": 284087, "epoch": 3422} {"train_loss": -25.4526424407959, "global_step": 284088, "epoch": 3422} {"train_loss": -25.481149673461914, "global_step": 284089, "epoch": 3422} {"train_loss": -25.58995819091797, "global_step": 284090, "epoch": 3422} {"train_loss": -25.70606803894043, "global_step": 284091, "epoch": 3422} {"train_loss": -25.638980865478516, "global_step": 284092, "epoch": 3422} {"train_loss": -25.575807571411133, "global_step": 284093, "epoch": 3422} {"train_loss": -25.275381088256836, "global_step": 284094, "epoch": 3422} {"train_loss": -25.42384910583496, "global_step": 284095, "epoch": 3422} {"train_loss": -25.73520278930664, "global_step": 284096, "epoch": 3422} {"train_loss": -25.51313591003418, "global_step": 284097, "epoch": 3422} {"train_loss": -25.389204025268555, "global_step": 284098, "epoch": 3422} {"train_loss": -25.48006248474121, "global_step": 284099, "epoch": 3422} {"train_loss": -25.045310974121094, "global_step": 284100, "epoch": 3422} {"train_loss": -25.43914794921875, "global_step": 284101, "epoch": 3422} {"train_loss": -25.65802574157715, "global_step": 284102, "epoch": 3422} {"train_loss": -25.789764404296875, "global_step": 284103, "epoch": 3422} {"train_loss": -25.575815200805664, "global_step": 284104, "epoch": 3422} {"train_loss": -25.50790786743164, "global_step": 284105, "epoch": 3422} {"train_loss": -25.59572410583496, "global_step": 284106, "epoch": 3422} {"train_loss": -25.415477752685547, "global_step": 284107, "epoch": 3422} {"train_loss": -25.460851393550275, "global_step": 284108, "epoch": 3422, "val_loss": 7122821.0} {"train_loss": -24.746183395385742, "global_step": 284109, "epoch": 3423} {"train_loss": -24.458906173706055, "global_step": 284110, "epoch": 3423} {"train_loss": -24.863922119140625, "global_step": 284111, "epoch": 3423} {"train_loss": -25.319313049316406, "global_step": 284112, "epoch": 3423} {"train_loss": -25.1922664642334, "global_step": 284113, "epoch": 3423} {"train_loss": -25.2147159576416, "global_step": 284114, "epoch": 3423} {"train_loss": -25.0452880859375, "global_step": 284115, "epoch": 3423} {"train_loss": -25.320409774780273, "global_step": 284116, "epoch": 3423} {"train_loss": -24.71949577331543, "global_step": 284117, "epoch": 3423} {"train_loss": -24.975515365600586, "global_step": 284118, "epoch": 3423} {"train_loss": -24.858449935913086, "global_step": 284119, "epoch": 3423} {"train_loss": -25.034896850585938, "global_step": 284120, "epoch": 3423} {"train_loss": -25.339269638061523, "global_step": 284121, "epoch": 3423} {"train_loss": -25.044294357299805, "global_step": 284122, "epoch": 3423} {"train_loss": -25.392166137695312, "global_step": 284123, "epoch": 3423} {"train_loss": -25.43181037902832, "global_step": 284124, "epoch": 3423} {"train_loss": -25.31156349182129, "global_step": 284125, "epoch": 3423} {"train_loss": -25.342742919921875, "global_step": 284126, "epoch": 3423} {"train_loss": -25.46317481994629, "global_step": 284127, "epoch": 3423} {"train_loss": -25.424392700195312, "global_step": 284128, "epoch": 3423} {"train_loss": -25.452543258666992, "global_step": 284129, "epoch": 3423} {"train_loss": -25.484729766845703, "global_step": 284130, "epoch": 3423} {"train_loss": -25.261381149291992, "global_step": 284131, "epoch": 3423} {"train_loss": -25.36781883239746, "global_step": 284132, "epoch": 3423} {"train_loss": -25.621301651000977, "global_step": 284133, "epoch": 3423} {"train_loss": -25.486326217651367, "global_step": 284134, "epoch": 3423} {"train_loss": -25.201292037963867, "global_step": 284135, "epoch": 3423} {"train_loss": -25.668731689453125, "global_step": 284136, "epoch": 3423} {"train_loss": -25.55274772644043, "global_step": 284137, "epoch": 3423} {"train_loss": -25.738134384155273, "global_step": 284138, "epoch": 3423} {"train_loss": -25.2991886138916, "global_step": 284139, "epoch": 3423} {"train_loss": -25.300006866455078, "global_step": 284140, "epoch": 3423} {"train_loss": -25.474111557006836, "global_step": 284141, "epoch": 3423} {"train_loss": -25.190832138061523, "global_step": 284142, "epoch": 3423} {"train_loss": -25.430511474609375, "global_step": 284143, "epoch": 3423} {"train_loss": -25.608922958374023, "global_step": 284144, "epoch": 3423} {"train_loss": -25.346731185913086, "global_step": 284145, "epoch": 3423} {"train_loss": -25.27353858947754, "global_step": 284146, "epoch": 3423} {"train_loss": -25.477514266967773, "global_step": 284147, "epoch": 3423} {"train_loss": -25.796798706054688, "global_step": 284148, "epoch": 3423} {"train_loss": -25.496458053588867, "global_step": 284149, "epoch": 3423} {"train_loss": -25.6992244720459, "global_step": 284150, "epoch": 3423} {"train_loss": -25.510290145874023, "global_step": 284151, "epoch": 3423} {"train_loss": -25.67398452758789, "global_step": 284152, "epoch": 3423} {"train_loss": -25.73828125, "global_step": 284153, "epoch": 3423} {"train_loss": -25.33988380432129, "global_step": 284154, "epoch": 3423} {"train_loss": -25.611968994140625, "global_step": 284155, "epoch": 3423} {"train_loss": -25.698352813720703, "global_step": 284156, "epoch": 3423} {"train_loss": -25.394134521484375, "global_step": 284157, "epoch": 3423} {"train_loss": -25.356882095336914, "global_step": 284158, "epoch": 3423} {"train_loss": -25.192121505737305, "global_step": 284159, "epoch": 3423} {"train_loss": -25.34052848815918, "global_step": 284160, "epoch": 3423} {"train_loss": -25.374149322509766, "global_step": 284161, "epoch": 3423} {"train_loss": -25.61380386352539, "global_step": 284162, "epoch": 3423} {"train_loss": -25.741626739501953, "global_step": 284163, "epoch": 3423} {"train_loss": -25.535799026489258, "global_step": 284164, "epoch": 3423} {"train_loss": -25.063047409057617, "global_step": 284165, "epoch": 3423} {"train_loss": -25.543842315673828, "global_step": 284166, "epoch": 3423} {"train_loss": -25.464977264404297, "global_step": 284167, "epoch": 3423} {"train_loss": -25.66997718811035, "global_step": 284168, "epoch": 3423} {"train_loss": -25.463085174560547, "global_step": 284169, "epoch": 3423} {"train_loss": -25.35106658935547, "global_step": 284170, "epoch": 3423} {"train_loss": -25.24016761779785, "global_step": 284171, "epoch": 3423} {"train_loss": -25.781585693359375, "global_step": 284172, "epoch": 3423} {"train_loss": -25.790058135986328, "global_step": 284173, "epoch": 3423} {"train_loss": -25.42268180847168, "global_step": 284174, "epoch": 3423} {"train_loss": -25.433717727661133, "global_step": 284175, "epoch": 3423} {"train_loss": -25.689748764038086, "global_step": 284176, "epoch": 3423} {"train_loss": -25.211828231811523, "global_step": 284177, "epoch": 3423} {"train_loss": -25.288354873657227, "global_step": 284178, "epoch": 3423} {"train_loss": -25.387266159057617, "global_step": 284179, "epoch": 3423} {"train_loss": -25.577312469482422, "global_step": 284180, "epoch": 3423} {"train_loss": -25.805892944335938, "global_step": 284181, "epoch": 3423} {"train_loss": -25.12307357788086, "global_step": 284182, "epoch": 3423} {"train_loss": -25.5981388092041, "global_step": 284183, "epoch": 3423} {"train_loss": -25.804906845092773, "global_step": 284184, "epoch": 3423} {"train_loss": -25.412628173828125, "global_step": 284185, "epoch": 3423} {"train_loss": -25.571319580078125, "global_step": 284186, "epoch": 3423} {"train_loss": -25.19610023498535, "global_step": 284187, "epoch": 3423} {"train_loss": -24.748117446899414, "global_step": 284188, "epoch": 3423} {"train_loss": -24.467737197875977, "global_step": 284189, "epoch": 3423} {"train_loss": -25.0360050201416, "global_step": 284190, "epoch": 3423} {"train_loss": -25.365181428840362, "global_step": 284191, "epoch": 3423, "val_loss": 7275537.0} {"train_loss": -24.506799697875977, "global_step": 284192, "epoch": 3424} {"train_loss": -24.611377716064453, "global_step": 284193, "epoch": 3424} {"train_loss": -24.860143661499023, "global_step": 284194, "epoch": 3424} {"train_loss": -24.89497947692871, "global_step": 284195, "epoch": 3424} {"train_loss": -24.517087936401367, "global_step": 284196, "epoch": 3424} {"train_loss": -24.653486251831055, "global_step": 284197, "epoch": 3424} {"train_loss": -24.963970184326172, "global_step": 284198, "epoch": 3424} {"train_loss": -24.80682945251465, "global_step": 284199, "epoch": 3424} {"train_loss": -24.988309860229492, "global_step": 284200, "epoch": 3424} {"train_loss": -24.787378311157227, "global_step": 284201, "epoch": 3424} {"train_loss": -24.615894317626953, "global_step": 284202, "epoch": 3424} {"train_loss": -24.91149139404297, "global_step": 284203, "epoch": 3424} {"train_loss": -25.3360538482666, "global_step": 284204, "epoch": 3424} {"train_loss": -24.664152145385742, "global_step": 284205, "epoch": 3424} {"train_loss": -24.8292236328125, "global_step": 284206, "epoch": 3424} {"train_loss": -25.310815811157227, "global_step": 284207, "epoch": 3424} {"train_loss": -25.26622772216797, "global_step": 284208, "epoch": 3424} {"train_loss": -25.149539947509766, "global_step": 284209, "epoch": 3424} {"train_loss": -25.832462310791016, "global_step": 284210, "epoch": 3424} {"train_loss": -25.50459861755371, "global_step": 284211, "epoch": 3424} {"train_loss": -25.07673454284668, "global_step": 284212, "epoch": 3424} {"train_loss": -24.99961280822754, "global_step": 284213, "epoch": 3424} {"train_loss": -25.56207847595215, "global_step": 284214, "epoch": 3424} {"train_loss": -25.232267379760742, "global_step": 284215, "epoch": 3424} {"train_loss": -25.61854362487793, "global_step": 284216, "epoch": 3424} {"train_loss": -25.41736602783203, "global_step": 284217, "epoch": 3424} {"train_loss": -25.261627197265625, "global_step": 284218, "epoch": 3424} {"train_loss": -25.21209144592285, "global_step": 284219, "epoch": 3424} {"train_loss": -25.1864070892334, "global_step": 284220, "epoch": 3424} {"train_loss": -25.499074935913086, "global_step": 284221, "epoch": 3424} {"train_loss": -25.498647689819336, "global_step": 284222, "epoch": 3424} {"train_loss": -25.4825439453125, "global_step": 284223, "epoch": 3424} {"train_loss": -25.532732009887695, "global_step": 284224, "epoch": 3424} {"train_loss": -25.302051544189453, "global_step": 284225, "epoch": 3424} {"train_loss": -25.70794677734375, "global_step": 284226, "epoch": 3424} {"train_loss": -25.56888771057129, "global_step": 284227, "epoch": 3424} {"train_loss": -25.37666130065918, "global_step": 284228, "epoch": 3424} {"train_loss": -25.540000915527344, "global_step": 284229, "epoch": 3424} {"train_loss": -25.554916381835938, "global_step": 284230, "epoch": 3424} {"train_loss": -25.478532791137695, "global_step": 284231, "epoch": 3424} {"train_loss": -25.619848251342773, "global_step": 284232, "epoch": 3424} {"train_loss": -25.57282829284668, "global_step": 284233, "epoch": 3424} {"train_loss": -25.858428955078125, "global_step": 284234, "epoch": 3424} {"train_loss": -25.51329803466797, "global_step": 284235, "epoch": 3424} {"train_loss": -25.46193504333496, "global_step": 284236, "epoch": 3424} {"train_loss": -25.53672218322754, "global_step": 284237, "epoch": 3424} {"train_loss": -25.84027671813965, "global_step": 284238, "epoch": 3424} {"train_loss": -25.698638916015625, "global_step": 284239, "epoch": 3424} {"train_loss": -25.734039306640625, "global_step": 284240, "epoch": 3424} {"train_loss": -25.77884292602539, "global_step": 284241, "epoch": 3424} {"train_loss": -25.3795166015625, "global_step": 284242, "epoch": 3424} {"train_loss": -25.0892333984375, "global_step": 284243, "epoch": 3424} {"train_loss": -25.662683486938477, "global_step": 284244, "epoch": 3424} {"train_loss": -25.291202545166016, "global_step": 284245, "epoch": 3424} {"train_loss": -25.813953399658203, "global_step": 284246, "epoch": 3424} {"train_loss": -25.310758590698242, "global_step": 284247, "epoch": 3424} {"train_loss": -25.456357955932617, "global_step": 284248, "epoch": 3424} {"train_loss": -25.7272891998291, "global_step": 284249, "epoch": 3424} {"train_loss": -25.0775146484375, "global_step": 284250, "epoch": 3424} {"train_loss": -25.791584014892578, "global_step": 284251, "epoch": 3424} {"train_loss": -25.542688369750977, "global_step": 284252, "epoch": 3424} {"train_loss": -25.418582916259766, "global_step": 284253, "epoch": 3424} {"train_loss": -25.860742568969727, "global_step": 284254, "epoch": 3424} {"train_loss": -25.497472763061523, "global_step": 284255, "epoch": 3424} {"train_loss": -25.74268913269043, "global_step": 284256, "epoch": 3424} {"train_loss": -25.833709716796875, "global_step": 284257, "epoch": 3424} {"train_loss": -25.293212890625, "global_step": 284258, "epoch": 3424} {"train_loss": -25.36579132080078, "global_step": 284259, "epoch": 3424} {"train_loss": -25.6036434173584, "global_step": 284260, "epoch": 3424} {"train_loss": -25.47879409790039, "global_step": 284261, "epoch": 3424} {"train_loss": -25.447656631469727, "global_step": 284262, "epoch": 3424} {"train_loss": -25.23396110534668, "global_step": 284263, "epoch": 3424} {"train_loss": -25.418689727783203, "global_step": 284264, "epoch": 3424} {"train_loss": -25.55864715576172, "global_step": 284265, "epoch": 3424} {"train_loss": -25.38994789123535, "global_step": 284266, "epoch": 3424} {"train_loss": -25.325040817260742, "global_step": 284267, "epoch": 3424} {"train_loss": -25.06461524963379, "global_step": 284268, "epoch": 3424} {"train_loss": -25.346839904785156, "global_step": 284269, "epoch": 3424} {"train_loss": -25.904499053955078, "global_step": 284270, "epoch": 3424} {"train_loss": -25.562047958374023, "global_step": 284271, "epoch": 3424} {"train_loss": -25.673282623291016, "global_step": 284272, "epoch": 3424} {"train_loss": -25.593244552612305, "global_step": 284273, "epoch": 3424} {"train_loss": -25.359812702041076, "global_step": 284274, "epoch": 3424, "val_loss": 7389729.5} {"train_loss": -20.95392417907715, "global_step": 284275, "epoch": 3425} {"train_loss": -24.701406478881836, "global_step": 284276, "epoch": 3425} {"train_loss": -21.266355514526367, "global_step": 284277, "epoch": 3425} {"train_loss": -24.153162002563477, "global_step": 284278, "epoch": 3425} {"train_loss": -23.007177352905273, "global_step": 284279, "epoch": 3425} {"train_loss": -23.555889129638672, "global_step": 284280, "epoch": 3425} {"train_loss": -23.879819869995117, "global_step": 284281, "epoch": 3425} {"train_loss": -23.470561981201172, "global_step": 284282, "epoch": 3425} {"train_loss": -23.779233932495117, "global_step": 284283, "epoch": 3425} {"train_loss": -24.0251407623291, "global_step": 284284, "epoch": 3425} {"train_loss": -23.778797149658203, "global_step": 284285, "epoch": 3425} {"train_loss": -24.19168472290039, "global_step": 284286, "epoch": 3425} {"train_loss": -24.50107192993164, "global_step": 284287, "epoch": 3425} {"train_loss": -24.117244720458984, "global_step": 284288, "epoch": 3425} {"train_loss": -24.071937561035156, "global_step": 284289, "epoch": 3425} {"train_loss": -23.84657859802246, "global_step": 284290, "epoch": 3425} {"train_loss": -24.237934112548828, "global_step": 284291, "epoch": 3425} {"train_loss": -23.908018112182617, "global_step": 284292, "epoch": 3425} {"train_loss": -24.57520294189453, "global_step": 284293, "epoch": 3425} {"train_loss": -24.001127243041992, "global_step": 284294, "epoch": 3425} {"train_loss": -24.654014587402344, "global_step": 284295, "epoch": 3425} {"train_loss": -24.64814567565918, "global_step": 284296, "epoch": 3425} {"train_loss": -24.830669403076172, "global_step": 284297, "epoch": 3425} {"train_loss": -24.566818237304688, "global_step": 284298, "epoch": 3425} {"train_loss": -24.610212326049805, "global_step": 284299, "epoch": 3425} {"train_loss": -24.83537483215332, "global_step": 284300, "epoch": 3425} {"train_loss": -24.632978439331055, "global_step": 284301, "epoch": 3425} {"train_loss": -24.682788848876953, "global_step": 284302, "epoch": 3425} {"train_loss": -24.803802490234375, "global_step": 284303, "epoch": 3425} {"train_loss": -24.747175216674805, "global_step": 284304, "epoch": 3425} {"train_loss": -25.23544692993164, "global_step": 284305, "epoch": 3425} {"train_loss": -24.796955108642578, "global_step": 284306, "epoch": 3425} {"train_loss": -24.761693954467773, "global_step": 284307, "epoch": 3425} {"train_loss": -25.103551864624023, "global_step": 284308, "epoch": 3425} {"train_loss": -24.9940128326416, "global_step": 284309, "epoch": 3425} {"train_loss": -25.166757583618164, "global_step": 284310, "epoch": 3425} {"train_loss": -25.258956909179688, "global_step": 284311, "epoch": 3425} {"train_loss": -24.961050033569336, "global_step": 284312, "epoch": 3425} {"train_loss": -24.690473556518555, "global_step": 284313, "epoch": 3425} {"train_loss": -25.28989601135254, "global_step": 284314, "epoch": 3425} {"train_loss": -24.847240447998047, "global_step": 284315, "epoch": 3425} {"train_loss": -25.159948348999023, "global_step": 284316, "epoch": 3425} {"train_loss": -25.133657455444336, "global_step": 284317, "epoch": 3425} {"train_loss": -25.29853057861328, "global_step": 284318, "epoch": 3425} {"train_loss": -25.193387985229492, "global_step": 284319, "epoch": 3425} {"train_loss": -25.395349502563477, "global_step": 284320, "epoch": 3425} {"train_loss": -25.518634796142578, "global_step": 284321, "epoch": 3425} {"train_loss": -25.44791603088379, "global_step": 284322, "epoch": 3425} {"train_loss": -25.26801109313965, "global_step": 284323, "epoch": 3425} {"train_loss": -25.307226181030273, "global_step": 284324, "epoch": 3425} {"train_loss": -25.232444763183594, "global_step": 284325, "epoch": 3425} {"train_loss": -25.212934494018555, "global_step": 284326, "epoch": 3425} {"train_loss": -25.302616119384766, "global_step": 284327, "epoch": 3425} {"train_loss": -25.585453033447266, "global_step": 284328, "epoch": 3425} {"train_loss": -25.485517501831055, "global_step": 284329, "epoch": 3425} {"train_loss": -25.763330459594727, "global_step": 284330, "epoch": 3425} {"train_loss": -25.526813507080078, "global_step": 284331, "epoch": 3425} {"train_loss": -25.512502670288086, "global_step": 284332, "epoch": 3425} {"train_loss": -25.69826316833496, "global_step": 284333, "epoch": 3425} {"train_loss": -25.33582305908203, "global_step": 284334, "epoch": 3425} {"train_loss": -25.586816787719727, "global_step": 284335, "epoch": 3425} {"train_loss": -25.466739654541016, "global_step": 284336, "epoch": 3425} {"train_loss": -25.44940185546875, "global_step": 284337, "epoch": 3425} {"train_loss": -25.602094650268555, "global_step": 284338, "epoch": 3425} {"train_loss": -25.590900421142578, "global_step": 284339, "epoch": 3425} {"train_loss": -25.711408615112305, "global_step": 284340, "epoch": 3425} {"train_loss": -25.5454044342041, "global_step": 284341, "epoch": 3425} {"train_loss": -25.5646915435791, "global_step": 284342, "epoch": 3425} {"train_loss": -25.48358917236328, "global_step": 284343, "epoch": 3425} {"train_loss": -25.366657257080078, "global_step": 284344, "epoch": 3425} {"train_loss": -25.005826950073242, "global_step": 284345, "epoch": 3425} {"train_loss": -25.180662155151367, "global_step": 284346, "epoch": 3425} {"train_loss": -25.61958122253418, "global_step": 284347, "epoch": 3425} {"train_loss": -25.34583854675293, "global_step": 284348, "epoch": 3425} {"train_loss": -25.565000534057617, "global_step": 284349, "epoch": 3425} {"train_loss": -25.33310317993164, "global_step": 284350, "epoch": 3425} {"train_loss": -25.498641967773438, "global_step": 284351, "epoch": 3425} {"train_loss": -25.522939682006836, "global_step": 284352, "epoch": 3425} {"train_loss": -24.981834411621094, "global_step": 284353, "epoch": 3425} {"train_loss": -25.442251205444336, "global_step": 284354, "epoch": 3425} {"train_loss": -25.109699249267578, "global_step": 284355, "epoch": 3425} {"train_loss": -25.462371826171875, "global_step": 284356, "epoch": 3425} {"train_loss": -24.834904222603303, "global_step": 284357, "epoch": 3425, "val_loss": 7002995.5} {"train_loss": -24.269088745117188, "global_step": 284358, "epoch": 3426} {"train_loss": -24.4462890625, "global_step": 284359, "epoch": 3426} {"train_loss": -24.847883224487305, "global_step": 284360, "epoch": 3426} {"train_loss": -24.773176193237305, "global_step": 284361, "epoch": 3426} {"train_loss": -24.727720260620117, "global_step": 284362, "epoch": 3426} {"train_loss": -24.618661880493164, "global_step": 284363, "epoch": 3426} {"train_loss": -25.105321884155273, "global_step": 284364, "epoch": 3426} {"train_loss": -25.18343162536621, "global_step": 284365, "epoch": 3426} {"train_loss": -24.835737228393555, "global_step": 284366, "epoch": 3426} {"train_loss": -24.708919525146484, "global_step": 284367, "epoch": 3426} {"train_loss": -24.888341903686523, "global_step": 284368, "epoch": 3426} {"train_loss": -24.902591705322266, "global_step": 284369, "epoch": 3426} {"train_loss": -25.078474044799805, "global_step": 284370, "epoch": 3426} {"train_loss": -24.655139923095703, "global_step": 284371, "epoch": 3426} {"train_loss": -25.07048797607422, "global_step": 284372, "epoch": 3426} {"train_loss": -25.066064834594727, "global_step": 284373, "epoch": 3426} {"train_loss": -25.09054183959961, "global_step": 284374, "epoch": 3426} {"train_loss": -25.238861083984375, "global_step": 284375, "epoch": 3426} {"train_loss": -24.947294235229492, "global_step": 284376, "epoch": 3426} {"train_loss": -25.22292709350586, "global_step": 284377, "epoch": 3426} {"train_loss": -25.16147804260254, "global_step": 284378, "epoch": 3426} {"train_loss": -25.018756866455078, "global_step": 284379, "epoch": 3426} {"train_loss": -25.258426666259766, "global_step": 284380, "epoch": 3426} {"train_loss": -24.676977157592773, "global_step": 284381, "epoch": 3426} {"train_loss": -25.142053604125977, "global_step": 284382, "epoch": 3426} {"train_loss": -25.384471893310547, "global_step": 284383, "epoch": 3426} {"train_loss": -25.245988845825195, "global_step": 284384, "epoch": 3426} {"train_loss": -25.251262664794922, "global_step": 284385, "epoch": 3426} {"train_loss": -25.24810218811035, "global_step": 284386, "epoch": 3426} {"train_loss": -25.44045066833496, "global_step": 284387, "epoch": 3426} {"train_loss": -25.332914352416992, "global_step": 284388, "epoch": 3426} {"train_loss": -25.123310089111328, "global_step": 284389, "epoch": 3426} {"train_loss": -25.437070846557617, "global_step": 284390, "epoch": 3426} {"train_loss": -25.591716766357422, "global_step": 284391, "epoch": 3426} {"train_loss": -25.3243408203125, "global_step": 284392, "epoch": 3426} {"train_loss": -25.172733306884766, "global_step": 284393, "epoch": 3426} {"train_loss": -25.167423248291016, "global_step": 284394, "epoch": 3426} {"train_loss": -25.149295806884766, "global_step": 284395, "epoch": 3426} {"train_loss": -25.435331344604492, "global_step": 284396, "epoch": 3426} {"train_loss": -25.28038787841797, "global_step": 284397, "epoch": 3426} {"train_loss": -25.384328842163086, "global_step": 284398, "epoch": 3426} {"train_loss": -25.490625381469727, "global_step": 284399, "epoch": 3426} {"train_loss": -25.333356857299805, "global_step": 284400, "epoch": 3426} {"train_loss": -25.081926345825195, "global_step": 284401, "epoch": 3426} {"train_loss": -25.27431297302246, "global_step": 284402, "epoch": 3426} {"train_loss": -25.624738693237305, "global_step": 284403, "epoch": 3426} {"train_loss": -25.674732208251953, "global_step": 284404, "epoch": 3426} {"train_loss": -25.580242156982422, "global_step": 284405, "epoch": 3426} {"train_loss": -25.575550079345703, "global_step": 284406, "epoch": 3426} {"train_loss": -25.480764389038086, "global_step": 284407, "epoch": 3426} {"train_loss": -25.268075942993164, "global_step": 284408, "epoch": 3426} {"train_loss": -26.165510177612305, "global_step": 284409, "epoch": 3426} {"train_loss": -25.30445671081543, "global_step": 284410, "epoch": 3426} {"train_loss": -25.543487548828125, "global_step": 284411, "epoch": 3426} {"train_loss": -25.649810791015625, "global_step": 284412, "epoch": 3426} {"train_loss": -25.86918067932129, "global_step": 284413, "epoch": 3426} {"train_loss": -25.40871238708496, "global_step": 284414, "epoch": 3426} {"train_loss": -25.899341583251953, "global_step": 284415, "epoch": 3426} {"train_loss": -25.67305564880371, "global_step": 284416, "epoch": 3426} {"train_loss": -25.773944854736328, "global_step": 284417, "epoch": 3426} {"train_loss": -25.84274673461914, "global_step": 284418, "epoch": 3426} {"train_loss": -25.87677574157715, "global_step": 284419, "epoch": 3426} {"train_loss": -25.66830825805664, "global_step": 284420, "epoch": 3426} {"train_loss": -25.79383659362793, "global_step": 284421, "epoch": 3426} {"train_loss": -25.4980525970459, "global_step": 284422, "epoch": 3426} {"train_loss": -25.668506622314453, "global_step": 284423, "epoch": 3426} {"train_loss": -25.74725914001465, "global_step": 284424, "epoch": 3426} {"train_loss": -25.485809326171875, "global_step": 284425, "epoch": 3426} {"train_loss": -25.617664337158203, "global_step": 284426, "epoch": 3426} {"train_loss": -25.043338775634766, "global_step": 284427, "epoch": 3426} {"train_loss": -25.456823348999023, "global_step": 284428, "epoch": 3426} {"train_loss": -25.341297149658203, "global_step": 284429, "epoch": 3426} {"train_loss": -25.00931167602539, "global_step": 284430, "epoch": 3426} {"train_loss": -24.680513381958008, "global_step": 284431, "epoch": 3426} {"train_loss": -24.29769515991211, "global_step": 284432, "epoch": 3426} {"train_loss": -24.801605224609375, "global_step": 284433, "epoch": 3426} {"train_loss": -25.332996368408203, "global_step": 284434, "epoch": 3426} {"train_loss": -25.148340225219727, "global_step": 284435, "epoch": 3426} {"train_loss": -24.650890350341797, "global_step": 284436, "epoch": 3426} {"train_loss": -25.5772762298584, "global_step": 284437, "epoch": 3426} {"train_loss": -25.335020065307617, "global_step": 284438, "epoch": 3426} {"train_loss": -24.966663360595703, "global_step": 284439, "epoch": 3426} {"train_loss": -25.25342617264713, "global_step": 284440, "epoch": 3426, "val_loss": 7134538.0} {"train_loss": -24.142894744873047, "global_step": 284441, "epoch": 3427} {"train_loss": -24.293607711791992, "global_step": 284442, "epoch": 3427} {"train_loss": -25.212392807006836, "global_step": 284443, "epoch": 3427} {"train_loss": -24.550094604492188, "global_step": 284444, "epoch": 3427} {"train_loss": -25.142004013061523, "global_step": 284445, "epoch": 3427} {"train_loss": -24.48897361755371, "global_step": 284446, "epoch": 3427} {"train_loss": -24.81123161315918, "global_step": 284447, "epoch": 3427} {"train_loss": -24.54478645324707, "global_step": 284448, "epoch": 3427} {"train_loss": -24.840551376342773, "global_step": 284449, "epoch": 3427} {"train_loss": -24.81801986694336, "global_step": 284450, "epoch": 3427} {"train_loss": -25.012697219848633, "global_step": 284451, "epoch": 3427} {"train_loss": -24.94278907775879, "global_step": 284452, "epoch": 3427} {"train_loss": -24.818435668945312, "global_step": 284453, "epoch": 3427} {"train_loss": -25.122943878173828, "global_step": 284454, "epoch": 3427} {"train_loss": -25.103797912597656, "global_step": 284455, "epoch": 3427} {"train_loss": -24.972137451171875, "global_step": 284456, "epoch": 3427} {"train_loss": -25.077457427978516, "global_step": 284457, "epoch": 3427} {"train_loss": -24.865726470947266, "global_step": 284458, "epoch": 3427} {"train_loss": -25.487653732299805, "global_step": 284459, "epoch": 3427} {"train_loss": -25.174823760986328, "global_step": 284460, "epoch": 3427} {"train_loss": -25.342315673828125, "global_step": 284461, "epoch": 3427} {"train_loss": -25.467199325561523, "global_step": 284462, "epoch": 3427} {"train_loss": -24.91910743713379, "global_step": 284463, "epoch": 3427} {"train_loss": -25.35854148864746, "global_step": 284464, "epoch": 3427} {"train_loss": -25.306724548339844, "global_step": 284465, "epoch": 3427} {"train_loss": -25.215829849243164, "global_step": 284466, "epoch": 3427} {"train_loss": -25.08455467224121, "global_step": 284467, "epoch": 3427} {"train_loss": -25.48635482788086, "global_step": 284468, "epoch": 3427} {"train_loss": -25.30630874633789, "global_step": 284469, "epoch": 3427} {"train_loss": -25.521284103393555, "global_step": 284470, "epoch": 3427} {"train_loss": -25.763280868530273, "global_step": 284471, "epoch": 3427} {"train_loss": -25.591766357421875, "global_step": 284472, "epoch": 3427} {"train_loss": -25.250532150268555, "global_step": 284473, "epoch": 3427} {"train_loss": -25.790857315063477, "global_step": 284474, "epoch": 3427} {"train_loss": -25.657377243041992, "global_step": 284475, "epoch": 3427} {"train_loss": -25.57956886291504, "global_step": 284476, "epoch": 3427} {"train_loss": -25.548118591308594, "global_step": 284477, "epoch": 3427} {"train_loss": -25.725522994995117, "global_step": 284478, "epoch": 3427} {"train_loss": -25.767154693603516, "global_step": 284479, "epoch": 3427} {"train_loss": -25.857511520385742, "global_step": 284480, "epoch": 3427} {"train_loss": -25.7005672454834, "global_step": 284481, "epoch": 3427} {"train_loss": -25.678186416625977, "global_step": 284482, "epoch": 3427} {"train_loss": -25.665552139282227, "global_step": 284483, "epoch": 3427} {"train_loss": -25.54652214050293, "global_step": 284484, "epoch": 3427} {"train_loss": -25.7110652923584, "global_step": 284485, "epoch": 3427} {"train_loss": -25.846546173095703, "global_step": 284486, "epoch": 3427} {"train_loss": -25.762516021728516, "global_step": 284487, "epoch": 3427} {"train_loss": -25.80837059020996, "global_step": 284488, "epoch": 3427} {"train_loss": -25.835336685180664, "global_step": 284489, "epoch": 3427} {"train_loss": -25.6315860748291, "global_step": 284490, "epoch": 3427} {"train_loss": -25.64577293395996, "global_step": 284491, "epoch": 3427} {"train_loss": -25.551910400390625, "global_step": 284492, "epoch": 3427} {"train_loss": -25.9100399017334, "global_step": 284493, "epoch": 3427} {"train_loss": -25.760009765625, "global_step": 284494, "epoch": 3427} {"train_loss": -25.622177124023438, "global_step": 284495, "epoch": 3427} {"train_loss": -25.698429107666016, "global_step": 284496, "epoch": 3427} {"train_loss": -25.789670944213867, "global_step": 284497, "epoch": 3427} {"train_loss": -25.712905883789062, "global_step": 284498, "epoch": 3427} {"train_loss": -25.40684700012207, "global_step": 284499, "epoch": 3427} {"train_loss": -25.540706634521484, "global_step": 284500, "epoch": 3427} {"train_loss": -25.90705680847168, "global_step": 284501, "epoch": 3427} {"train_loss": -25.426607131958008, "global_step": 284502, "epoch": 3427} {"train_loss": -25.348569869995117, "global_step": 284503, "epoch": 3427} {"train_loss": -25.549514770507812, "global_step": 284504, "epoch": 3427} {"train_loss": -25.48322296142578, "global_step": 284505, "epoch": 3427} {"train_loss": -25.331268310546875, "global_step": 284506, "epoch": 3427} {"train_loss": -25.089784622192383, "global_step": 284507, "epoch": 3427} {"train_loss": -25.31062889099121, "global_step": 284508, "epoch": 3427} {"train_loss": -25.7304630279541, "global_step": 284509, "epoch": 3427} {"train_loss": -25.585189819335938, "global_step": 284510, "epoch": 3427} {"train_loss": -25.43304443359375, "global_step": 284511, "epoch": 3427} {"train_loss": -25.450849533081055, "global_step": 284512, "epoch": 3427} {"train_loss": -25.126876831054688, "global_step": 284513, "epoch": 3427} {"train_loss": -25.916223526000977, "global_step": 284514, "epoch": 3427} {"train_loss": -25.5369930267334, "global_step": 284515, "epoch": 3427} {"train_loss": -25.227787017822266, "global_step": 284516, "epoch": 3427} {"train_loss": -25.394086837768555, "global_step": 284517, "epoch": 3427} {"train_loss": -25.603748321533203, "global_step": 284518, "epoch": 3427} {"train_loss": -25.498350143432617, "global_step": 284519, "epoch": 3427} {"train_loss": -25.43446159362793, "global_step": 284520, "epoch": 3427} {"train_loss": -25.867523193359375, "global_step": 284521, "epoch": 3427} {"train_loss": -25.35211181640625, "global_step": 284522, "epoch": 3427} {"train_loss": -25.391786942999047, "global_step": 284523, "epoch": 3427, "val_loss": 7064233.0} {"train_loss": -23.815542221069336, "global_step": 284524, "epoch": 3428} {"train_loss": -24.10263442993164, "global_step": 284525, "epoch": 3428} {"train_loss": -24.830366134643555, "global_step": 284526, "epoch": 3428} {"train_loss": -24.766403198242188, "global_step": 284527, "epoch": 3428} {"train_loss": -24.80194091796875, "global_step": 284528, "epoch": 3428} {"train_loss": -24.711881637573242, "global_step": 284529, "epoch": 3428} {"train_loss": -24.810239791870117, "global_step": 284530, "epoch": 3428} {"train_loss": -24.51885986328125, "global_step": 284531, "epoch": 3428} {"train_loss": -25.016931533813477, "global_step": 284532, "epoch": 3428} {"train_loss": -24.65313148498535, "global_step": 284533, "epoch": 3428} {"train_loss": -24.458698272705078, "global_step": 284534, "epoch": 3428} {"train_loss": -24.925479888916016, "global_step": 284535, "epoch": 3428} {"train_loss": -24.795848846435547, "global_step": 284536, "epoch": 3428} {"train_loss": -25.008329391479492, "global_step": 284537, "epoch": 3428} {"train_loss": -25.104183197021484, "global_step": 284538, "epoch": 3428} {"train_loss": -25.070871353149414, "global_step": 284539, "epoch": 3428} {"train_loss": -24.989049911499023, "global_step": 284540, "epoch": 3428} {"train_loss": -24.65617561340332, "global_step": 284541, "epoch": 3428} {"train_loss": -25.212400436401367, "global_step": 284542, "epoch": 3428} {"train_loss": -25.263376235961914, "global_step": 284543, "epoch": 3428} {"train_loss": -25.170774459838867, "global_step": 284544, "epoch": 3428} {"train_loss": -25.116966247558594, "global_step": 284545, "epoch": 3428} {"train_loss": -25.394250869750977, "global_step": 284546, "epoch": 3428} {"train_loss": -25.20438575744629, "global_step": 284547, "epoch": 3428} {"train_loss": -24.88092041015625, "global_step": 284548, "epoch": 3428} {"train_loss": -25.064939498901367, "global_step": 284549, "epoch": 3428} {"train_loss": -25.29231834411621, "global_step": 284550, "epoch": 3428} {"train_loss": -25.160417556762695, "global_step": 284551, "epoch": 3428} {"train_loss": -25.458995819091797, "global_step": 284552, "epoch": 3428} {"train_loss": -25.37360954284668, "global_step": 284553, "epoch": 3428} {"train_loss": -25.536792755126953, "global_step": 284554, "epoch": 3428} {"train_loss": -25.45488929748535, "global_step": 284555, "epoch": 3428} {"train_loss": -25.138193130493164, "global_step": 284556, "epoch": 3428} {"train_loss": -25.44476890563965, "global_step": 284557, "epoch": 3428} {"train_loss": -25.290590286254883, "global_step": 284558, "epoch": 3428} {"train_loss": -25.272321701049805, "global_step": 284559, "epoch": 3428} {"train_loss": -25.4045467376709, "global_step": 284560, "epoch": 3428} {"train_loss": -25.453100204467773, "global_step": 284561, "epoch": 3428} {"train_loss": -25.869049072265625, "global_step": 284562, "epoch": 3428} {"train_loss": -25.64447593688965, "global_step": 284563, "epoch": 3428} {"train_loss": -25.20392417907715, "global_step": 284564, "epoch": 3428} {"train_loss": -25.21272087097168, "global_step": 284565, "epoch": 3428} {"train_loss": -25.797693252563477, "global_step": 284566, "epoch": 3428} {"train_loss": -25.62568473815918, "global_step": 284567, "epoch": 3428} {"train_loss": -25.513357162475586, "global_step": 284568, "epoch": 3428} {"train_loss": -25.77503776550293, "global_step": 284569, "epoch": 3428} {"train_loss": -25.29810905456543, "global_step": 284570, "epoch": 3428} {"train_loss": -25.6788387298584, "global_step": 284571, "epoch": 3428} {"train_loss": -25.129337310791016, "global_step": 284572, "epoch": 3428} {"train_loss": -25.620325088500977, "global_step": 284573, "epoch": 3428} {"train_loss": -25.543258666992188, "global_step": 284574, "epoch": 3428} {"train_loss": -25.36612892150879, "global_step": 284575, "epoch": 3428} {"train_loss": -25.668777465820312, "global_step": 284576, "epoch": 3428} {"train_loss": -25.494184494018555, "global_step": 284577, "epoch": 3428} {"train_loss": -25.568313598632812, "global_step": 284578, "epoch": 3428} {"train_loss": -25.46017837524414, "global_step": 284579, "epoch": 3428} {"train_loss": -25.52818489074707, "global_step": 284580, "epoch": 3428} {"train_loss": -25.144634246826172, "global_step": 284581, "epoch": 3428} {"train_loss": -25.681781768798828, "global_step": 284582, "epoch": 3428} {"train_loss": -25.833044052124023, "global_step": 284583, "epoch": 3428} {"train_loss": -25.205198287963867, "global_step": 284584, "epoch": 3428} {"train_loss": -25.359792709350586, "global_step": 284585, "epoch": 3428} {"train_loss": -25.07978630065918, "global_step": 284586, "epoch": 3428} {"train_loss": -25.668615341186523, "global_step": 284587, "epoch": 3428} {"train_loss": -25.761463165283203, "global_step": 284588, "epoch": 3428} {"train_loss": -24.59261131286621, "global_step": 284589, "epoch": 3428} {"train_loss": -23.9846248626709, "global_step": 284590, "epoch": 3428} {"train_loss": -23.91762351989746, "global_step": 284591, "epoch": 3428} {"train_loss": -24.960845947265625, "global_step": 284592, "epoch": 3428} {"train_loss": -25.05674171447754, "global_step": 284593, "epoch": 3428} {"train_loss": -24.975738525390625, "global_step": 284594, "epoch": 3428} {"train_loss": -25.13565444946289, "global_step": 284595, "epoch": 3428} {"train_loss": -25.571887969970703, "global_step": 284596, "epoch": 3428} {"train_loss": -24.700637817382812, "global_step": 284597, "epoch": 3428} {"train_loss": -25.369998931884766, "global_step": 284598, "epoch": 3428} {"train_loss": -25.064115524291992, "global_step": 284599, "epoch": 3428} {"train_loss": -25.58856773376465, "global_step": 284600, "epoch": 3428} {"train_loss": -25.280231475830078, "global_step": 284601, "epoch": 3428} {"train_loss": -25.63541030883789, "global_step": 284602, "epoch": 3428} {"train_loss": -25.468547821044922, "global_step": 284603, "epoch": 3428} {"train_loss": -25.18354606628418, "global_step": 284604, "epoch": 3428} {"train_loss": -25.65614128112793, "global_step": 284605, "epoch": 3428} {"train_loss": -25.17115650406803, "global_step": 284606, "epoch": 3428, "val_loss": 7083726.5} {"train_loss": -24.842567443847656, "global_step": 284607, "epoch": 3429} {"train_loss": -24.865707397460938, "global_step": 284608, "epoch": 3429} {"train_loss": -25.149843215942383, "global_step": 284609, "epoch": 3429} {"train_loss": -25.196300506591797, "global_step": 284610, "epoch": 3429} {"train_loss": -24.397729873657227, "global_step": 284611, "epoch": 3429} {"train_loss": -25.161468505859375, "global_step": 284612, "epoch": 3429} {"train_loss": -24.953550338745117, "global_step": 284613, "epoch": 3429} {"train_loss": -25.056427001953125, "global_step": 284614, "epoch": 3429} {"train_loss": -25.37468910217285, "global_step": 284615, "epoch": 3429} {"train_loss": -25.09682273864746, "global_step": 284616, "epoch": 3429} {"train_loss": -25.192750930786133, "global_step": 284617, "epoch": 3429} {"train_loss": -25.244537353515625, "global_step": 284618, "epoch": 3429} {"train_loss": -25.064664840698242, "global_step": 284619, "epoch": 3429} {"train_loss": -25.336578369140625, "global_step": 284620, "epoch": 3429} {"train_loss": -25.37713623046875, "global_step": 284621, "epoch": 3429} {"train_loss": -25.30104637145996, "global_step": 284622, "epoch": 3429} {"train_loss": -25.411508560180664, "global_step": 284623, "epoch": 3429} {"train_loss": -25.139795303344727, "global_step": 284624, "epoch": 3429} {"train_loss": -25.432804107666016, "global_step": 284625, "epoch": 3429} {"train_loss": -25.284025192260742, "global_step": 284626, "epoch": 3429} {"train_loss": -25.55565643310547, "global_step": 284627, "epoch": 3429} {"train_loss": -25.513463973999023, "global_step": 284628, "epoch": 3429} {"train_loss": -25.458009719848633, "global_step": 284629, "epoch": 3429} {"train_loss": -25.72587013244629, "global_step": 284630, "epoch": 3429} {"train_loss": -25.611616134643555, "global_step": 284631, "epoch": 3429} {"train_loss": -25.402524948120117, "global_step": 284632, "epoch": 3429} {"train_loss": -25.361492156982422, "global_step": 284633, "epoch": 3429} {"train_loss": -25.306955337524414, "global_step": 284634, "epoch": 3429} {"train_loss": -25.716272354125977, "global_step": 284635, "epoch": 3429} {"train_loss": -25.54099464416504, "global_step": 284636, "epoch": 3429} {"train_loss": -25.664770126342773, "global_step": 284637, "epoch": 3429} {"train_loss": -25.37626075744629, "global_step": 284638, "epoch": 3429} {"train_loss": -25.828765869140625, "global_step": 284639, "epoch": 3429} {"train_loss": -25.922046661376953, "global_step": 284640, "epoch": 3429} {"train_loss": -25.4417667388916, "global_step": 284641, "epoch": 3429} {"train_loss": -25.719221115112305, "global_step": 284642, "epoch": 3429} {"train_loss": -25.7061767578125, "global_step": 284643, "epoch": 3429} {"train_loss": -25.657608032226562, "global_step": 284644, "epoch": 3429} {"train_loss": -25.3728084564209, "global_step": 284645, "epoch": 3429} {"train_loss": -25.504417419433594, "global_step": 284646, "epoch": 3429} {"train_loss": -25.42402458190918, "global_step": 284647, "epoch": 3429} {"train_loss": -26.018299102783203, "global_step": 284648, "epoch": 3429} {"train_loss": -25.1759090423584, "global_step": 284649, "epoch": 3429} {"train_loss": -24.94986915588379, "global_step": 284650, "epoch": 3429} {"train_loss": -25.222143173217773, "global_step": 284651, "epoch": 3429} {"train_loss": -24.972518920898438, "global_step": 284652, "epoch": 3429} {"train_loss": -25.503175735473633, "global_step": 284653, "epoch": 3429} {"train_loss": -25.343332290649414, "global_step": 284654, "epoch": 3429} {"train_loss": -25.416852951049805, "global_step": 284655, "epoch": 3429} {"train_loss": -25.6370906829834, "global_step": 284656, "epoch": 3429} {"train_loss": -25.58452606201172, "global_step": 284657, "epoch": 3429} {"train_loss": -25.577987670898438, "global_step": 284658, "epoch": 3429} {"train_loss": -25.464248657226562, "global_step": 284659, "epoch": 3429} {"train_loss": -25.59097671508789, "global_step": 284660, "epoch": 3429} {"train_loss": -25.57929229736328, "global_step": 284661, "epoch": 3429} {"train_loss": -25.80132484436035, "global_step": 284662, "epoch": 3429} {"train_loss": -25.452436447143555, "global_step": 284663, "epoch": 3429} {"train_loss": -25.457563400268555, "global_step": 284664, "epoch": 3429} {"train_loss": -25.34649085998535, "global_step": 284665, "epoch": 3429} {"train_loss": -25.47796630859375, "global_step": 284666, "epoch": 3429} {"train_loss": -25.740299224853516, "global_step": 284667, "epoch": 3429} {"train_loss": -25.615869522094727, "global_step": 284668, "epoch": 3429} {"train_loss": -25.451261520385742, "global_step": 284669, "epoch": 3429} {"train_loss": -25.41514778137207, "global_step": 284670, "epoch": 3429} {"train_loss": -25.638410568237305, "global_step": 284671, "epoch": 3429} {"train_loss": -25.245084762573242, "global_step": 284672, "epoch": 3429} {"train_loss": -25.484853744506836, "global_step": 284673, "epoch": 3429} {"train_loss": -25.983062744140625, "global_step": 284674, "epoch": 3429} {"train_loss": -25.71771812438965, "global_step": 284675, "epoch": 3429} {"train_loss": -25.458316802978516, "global_step": 284676, "epoch": 3429} {"train_loss": -25.6143741607666, "global_step": 284677, "epoch": 3429} {"train_loss": -25.335796356201172, "global_step": 284678, "epoch": 3429} {"train_loss": -25.634368896484375, "global_step": 284679, "epoch": 3429} {"train_loss": -25.745895385742188, "global_step": 284680, "epoch": 3429} {"train_loss": -25.34823989868164, "global_step": 284681, "epoch": 3429} {"train_loss": -25.5360107421875, "global_step": 284682, "epoch": 3429} {"train_loss": -25.608173370361328, "global_step": 284683, "epoch": 3429} {"train_loss": -25.82358741760254, "global_step": 284684, "epoch": 3429} {"train_loss": -25.592975616455078, "global_step": 284685, "epoch": 3429} {"train_loss": -25.56454849243164, "global_step": 284686, "epoch": 3429} {"train_loss": -25.48859214782715, "global_step": 284687, "epoch": 3429} {"train_loss": -25.343412399291992, "global_step": 284688, "epoch": 3429} {"train_loss": -25.425454036299005, "global_step": 284689, "epoch": 3429, "val_loss": 7234974.0} {"train_loss": -24.04861068725586, "global_step": 284690, "epoch": 3430} {"train_loss": -23.105255126953125, "global_step": 284691, "epoch": 3430} {"train_loss": -24.77430534362793, "global_step": 284692, "epoch": 3430} {"train_loss": -24.884218215942383, "global_step": 284693, "epoch": 3430} {"train_loss": -24.66815185546875, "global_step": 284694, "epoch": 3430} {"train_loss": -24.974355697631836, "global_step": 284695, "epoch": 3430} {"train_loss": -24.52964210510254, "global_step": 284696, "epoch": 3430} {"train_loss": -25.059602737426758, "global_step": 284697, "epoch": 3430} {"train_loss": -24.79316520690918, "global_step": 284698, "epoch": 3430} {"train_loss": -24.71298599243164, "global_step": 284699, "epoch": 3430} {"train_loss": -25.06436538696289, "global_step": 284700, "epoch": 3430} {"train_loss": -25.053869247436523, "global_step": 284701, "epoch": 3430} {"train_loss": -24.999189376831055, "global_step": 284702, "epoch": 3430} {"train_loss": -25.288955688476562, "global_step": 284703, "epoch": 3430} {"train_loss": -25.58743667602539, "global_step": 284704, "epoch": 3430} {"train_loss": -25.119091033935547, "global_step": 284705, "epoch": 3430} {"train_loss": -25.423559188842773, "global_step": 284706, "epoch": 3430} {"train_loss": -25.38685417175293, "global_step": 284707, "epoch": 3430} {"train_loss": -25.441709518432617, "global_step": 284708, "epoch": 3430} {"train_loss": -25.44036865234375, "global_step": 284709, "epoch": 3430} {"train_loss": -24.903026580810547, "global_step": 284710, "epoch": 3430} {"train_loss": -25.27042007446289, "global_step": 284711, "epoch": 3430} {"train_loss": -25.255441665649414, "global_step": 284712, "epoch": 3430} {"train_loss": -25.21875, "global_step": 284713, "epoch": 3430} {"train_loss": -25.14274787902832, "global_step": 284714, "epoch": 3430} {"train_loss": -25.515687942504883, "global_step": 284715, "epoch": 3430} {"train_loss": -25.37668228149414, "global_step": 284716, "epoch": 3430} {"train_loss": -25.485279083251953, "global_step": 284717, "epoch": 3430} {"train_loss": -25.624181747436523, "global_step": 284718, "epoch": 3430} {"train_loss": -25.51070213317871, "global_step": 284719, "epoch": 3430} {"train_loss": -25.732324600219727, "global_step": 284720, "epoch": 3430} {"train_loss": -25.424352645874023, "global_step": 284721, "epoch": 3430} {"train_loss": -25.696096420288086, "global_step": 284722, "epoch": 3430} {"train_loss": -25.791650772094727, "global_step": 284723, "epoch": 3430} {"train_loss": -25.383045196533203, "global_step": 284724, "epoch": 3430} {"train_loss": -25.451704025268555, "global_step": 284725, "epoch": 3430} {"train_loss": -25.82285499572754, "global_step": 284726, "epoch": 3430} {"train_loss": -25.9547119140625, "global_step": 284727, "epoch": 3430} {"train_loss": -25.653839111328125, "global_step": 284728, "epoch": 3430} {"train_loss": -25.448719024658203, "global_step": 284729, "epoch": 3430} {"train_loss": -25.62415885925293, "global_step": 284730, "epoch": 3430} {"train_loss": -25.676685333251953, "global_step": 284731, "epoch": 3430} {"train_loss": -25.334369659423828, "global_step": 284732, "epoch": 3430} {"train_loss": -25.373519897460938, "global_step": 284733, "epoch": 3430} {"train_loss": -25.566776275634766, "global_step": 284734, "epoch": 3430} {"train_loss": -25.6174259185791, "global_step": 284735, "epoch": 3430} {"train_loss": -25.5562744140625, "global_step": 284736, "epoch": 3430} {"train_loss": -25.340333938598633, "global_step": 284737, "epoch": 3430} {"train_loss": -25.304336547851562, "global_step": 284738, "epoch": 3430} {"train_loss": -25.698917388916016, "global_step": 284739, "epoch": 3430} {"train_loss": -25.613224029541016, "global_step": 284740, "epoch": 3430} {"train_loss": -25.48596954345703, "global_step": 284741, "epoch": 3430} {"train_loss": -25.203500747680664, "global_step": 284742, "epoch": 3430} {"train_loss": -25.27321434020996, "global_step": 284743, "epoch": 3430} {"train_loss": -25.55353355407715, "global_step": 284744, "epoch": 3430} {"train_loss": -25.559595108032227, "global_step": 284745, "epoch": 3430} {"train_loss": -25.722610473632812, "global_step": 284746, "epoch": 3430} {"train_loss": -26.033369064331055, "global_step": 284747, "epoch": 3430} {"train_loss": -25.834884643554688, "global_step": 284748, "epoch": 3430} {"train_loss": -25.67746925354004, "global_step": 284749, "epoch": 3430} {"train_loss": -25.464078903198242, "global_step": 284750, "epoch": 3430} {"train_loss": -25.360946655273438, "global_step": 284751, "epoch": 3430} {"train_loss": -25.30396842956543, "global_step": 284752, "epoch": 3430} {"train_loss": -25.324539184570312, "global_step": 284753, "epoch": 3430} {"train_loss": -25.476333618164062, "global_step": 284754, "epoch": 3430} {"train_loss": -25.6041202545166, "global_step": 284755, "epoch": 3430} {"train_loss": -25.914045333862305, "global_step": 284756, "epoch": 3430} {"train_loss": -25.76275062561035, "global_step": 284757, "epoch": 3430} {"train_loss": -25.07929229736328, "global_step": 284758, "epoch": 3430} {"train_loss": -25.599454879760742, "global_step": 284759, "epoch": 3430} {"train_loss": -25.52179527282715, "global_step": 284760, "epoch": 3430} {"train_loss": -25.266618728637695, "global_step": 284761, "epoch": 3430} {"train_loss": -25.286468505859375, "global_step": 284762, "epoch": 3430} {"train_loss": -25.617048263549805, "global_step": 284763, "epoch": 3430} {"train_loss": -25.770587921142578, "global_step": 284764, "epoch": 3430} {"train_loss": -25.50787925720215, "global_step": 284765, "epoch": 3430} {"train_loss": -25.788604736328125, "global_step": 284766, "epoch": 3430} {"train_loss": -25.694570541381836, "global_step": 284767, "epoch": 3430} {"train_loss": -25.421279907226562, "global_step": 284768, "epoch": 3430} {"train_loss": -25.378076553344727, "global_step": 284769, "epoch": 3430} {"train_loss": -25.52150535583496, "global_step": 284770, "epoch": 3430} {"train_loss": -25.836374282836914, "global_step": 284771, "epoch": 3430} {"train_loss": -25.363555172839796, "global_step": 284772, "epoch": 3430, "val_loss": 7144342.0} {"train_loss": -25.03835105895996, "global_step": 284773, "epoch": 3431} {"train_loss": -24.773500442504883, "global_step": 284774, "epoch": 3431} {"train_loss": -25.260847091674805, "global_step": 284775, "epoch": 3431} {"train_loss": -24.65810203552246, "global_step": 284776, "epoch": 3431} {"train_loss": -24.46402931213379, "global_step": 284777, "epoch": 3431} {"train_loss": -25.091720581054688, "global_step": 284778, "epoch": 3431} {"train_loss": -24.771024703979492, "global_step": 284779, "epoch": 3431} {"train_loss": -25.260560989379883, "global_step": 284780, "epoch": 3431} {"train_loss": -24.84307289123535, "global_step": 284781, "epoch": 3431} {"train_loss": -24.97796058654785, "global_step": 284782, "epoch": 3431} {"train_loss": -24.651124954223633, "global_step": 284783, "epoch": 3431} {"train_loss": -25.339609146118164, "global_step": 284784, "epoch": 3431} {"train_loss": -25.020713806152344, "global_step": 284785, "epoch": 3431} {"train_loss": -24.901155471801758, "global_step": 284786, "epoch": 3431} {"train_loss": -25.026844024658203, "global_step": 284787, "epoch": 3431} {"train_loss": -25.38180923461914, "global_step": 284788, "epoch": 3431} {"train_loss": -25.565500259399414, "global_step": 284789, "epoch": 3431} {"train_loss": -25.46511459350586, "global_step": 284790, "epoch": 3431} {"train_loss": -25.150259017944336, "global_step": 284791, "epoch": 3431} {"train_loss": -25.22280502319336, "global_step": 284792, "epoch": 3431} {"train_loss": -25.25843620300293, "global_step": 284793, "epoch": 3431} {"train_loss": -25.50556182861328, "global_step": 284794, "epoch": 3431} {"train_loss": -25.306442260742188, "global_step": 284795, "epoch": 3431} {"train_loss": -25.46222496032715, "global_step": 284796, "epoch": 3431} {"train_loss": -25.7104434967041, "global_step": 284797, "epoch": 3431} {"train_loss": -25.514738082885742, "global_step": 284798, "epoch": 3431} {"train_loss": -25.042089462280273, "global_step": 284799, "epoch": 3431} {"train_loss": -25.579938888549805, "global_step": 284800, "epoch": 3431} {"train_loss": -25.12079429626465, "global_step": 284801, "epoch": 3431} {"train_loss": -25.333410263061523, "global_step": 284802, "epoch": 3431} {"train_loss": -25.6019287109375, "global_step": 284803, "epoch": 3431} {"train_loss": -24.980993270874023, "global_step": 284804, "epoch": 3431} {"train_loss": -25.397462844848633, "global_step": 284805, "epoch": 3431} {"train_loss": -25.402610778808594, "global_step": 284806, "epoch": 3431} {"train_loss": -25.58180809020996, "global_step": 284807, "epoch": 3431} {"train_loss": -25.211755752563477, "global_step": 284808, "epoch": 3431} {"train_loss": -25.956106185913086, "global_step": 284809, "epoch": 3431} {"train_loss": -25.53782844543457, "global_step": 284810, "epoch": 3431} {"train_loss": -25.431852340698242, "global_step": 284811, "epoch": 3431} {"train_loss": -25.074371337890625, "global_step": 284812, "epoch": 3431} {"train_loss": -25.478076934814453, "global_step": 284813, "epoch": 3431} {"train_loss": -25.7415828704834, "global_step": 284814, "epoch": 3431} {"train_loss": -25.72812271118164, "global_step": 284815, "epoch": 3431} {"train_loss": -25.812891006469727, "global_step": 284816, "epoch": 3431} {"train_loss": -25.615827560424805, "global_step": 284817, "epoch": 3431} {"train_loss": -25.324691772460938, "global_step": 284818, "epoch": 3431} {"train_loss": -25.009502410888672, "global_step": 284819, "epoch": 3431} {"train_loss": -25.346166610717773, "global_step": 284820, "epoch": 3431} {"train_loss": -25.497671127319336, "global_step": 284821, "epoch": 3431} {"train_loss": -25.684223175048828, "global_step": 284822, "epoch": 3431} {"train_loss": -26.196624755859375, "global_step": 284823, "epoch": 3431} {"train_loss": -25.044729232788086, "global_step": 284824, "epoch": 3431} {"train_loss": -25.189790725708008, "global_step": 284825, "epoch": 3431} {"train_loss": -25.55088233947754, "global_step": 284826, "epoch": 3431} {"train_loss": -25.28102684020996, "global_step": 284827, "epoch": 3431} {"train_loss": -25.518049240112305, "global_step": 284828, "epoch": 3431} {"train_loss": -25.7631893157959, "global_step": 284829, "epoch": 3431} {"train_loss": -25.40911865234375, "global_step": 284830, "epoch": 3431} {"train_loss": -25.614471435546875, "global_step": 284831, "epoch": 3431} {"train_loss": -25.841236114501953, "global_step": 284832, "epoch": 3431} {"train_loss": -25.633838653564453, "global_step": 284833, "epoch": 3431} {"train_loss": -25.414831161499023, "global_step": 284834, "epoch": 3431} {"train_loss": -25.769311904907227, "global_step": 284835, "epoch": 3431} {"train_loss": -25.5427188873291, "global_step": 284836, "epoch": 3431} {"train_loss": -26.05023193359375, "global_step": 284837, "epoch": 3431} {"train_loss": -25.551422119140625, "global_step": 284838, "epoch": 3431} {"train_loss": -25.58887481689453, "global_step": 284839, "epoch": 3431} {"train_loss": -25.868045806884766, "global_step": 284840, "epoch": 3431} {"train_loss": -25.558101654052734, "global_step": 284841, "epoch": 3431} {"train_loss": -25.559757232666016, "global_step": 284842, "epoch": 3431} {"train_loss": -25.805200576782227, "global_step": 284843, "epoch": 3431} {"train_loss": -25.51642608642578, "global_step": 284844, "epoch": 3431} {"train_loss": -25.537918090820312, "global_step": 284845, "epoch": 3431} {"train_loss": -25.275957107543945, "global_step": 284846, "epoch": 3431} {"train_loss": -25.871612548828125, "global_step": 284847, "epoch": 3431} {"train_loss": -25.291200637817383, "global_step": 284848, "epoch": 3431} {"train_loss": -25.62607765197754, "global_step": 284849, "epoch": 3431} {"train_loss": -25.020124435424805, "global_step": 284850, "epoch": 3431} {"train_loss": -25.201684951782227, "global_step": 284851, "epoch": 3431} {"train_loss": -25.60498046875, "global_step": 284852, "epoch": 3431} {"train_loss": -25.47442626953125, "global_step": 284853, "epoch": 3431} {"train_loss": -25.83243179321289, "global_step": 284854, "epoch": 3431} {"train_loss": -25.389045669371825, "global_step": 284855, "epoch": 3431, "val_loss": 7155099.5} {"train_loss": -25.585391998291016, "global_step": 284856, "epoch": 3432} {"train_loss": -25.079389572143555, "global_step": 284857, "epoch": 3432} {"train_loss": -25.350278854370117, "global_step": 284858, "epoch": 3432} {"train_loss": -25.261526107788086, "global_step": 284859, "epoch": 3432} {"train_loss": -24.933874130249023, "global_step": 284860, "epoch": 3432} {"train_loss": -25.57364273071289, "global_step": 284861, "epoch": 3432} {"train_loss": -24.647497177124023, "global_step": 284862, "epoch": 3432} {"train_loss": -25.151151657104492, "global_step": 284863, "epoch": 3432} {"train_loss": -24.711198806762695, "global_step": 284864, "epoch": 3432} {"train_loss": -25.171344757080078, "global_step": 284865, "epoch": 3432} {"train_loss": -25.072797775268555, "global_step": 284866, "epoch": 3432} {"train_loss": -25.09837532043457, "global_step": 284867, "epoch": 3432} {"train_loss": -25.33522605895996, "global_step": 284868, "epoch": 3432} {"train_loss": -25.08330726623535, "global_step": 284869, "epoch": 3432} {"train_loss": -25.866819381713867, "global_step": 284870, "epoch": 3432} {"train_loss": -25.258955001831055, "global_step": 284871, "epoch": 3432} {"train_loss": -25.421310424804688, "global_step": 284872, "epoch": 3432} {"train_loss": -24.97100257873535, "global_step": 284873, "epoch": 3432} {"train_loss": -25.415945053100586, "global_step": 284874, "epoch": 3432} {"train_loss": -25.944232940673828, "global_step": 284875, "epoch": 3432} {"train_loss": -25.582056045532227, "global_step": 284876, "epoch": 3432} {"train_loss": -25.425756454467773, "global_step": 284877, "epoch": 3432} {"train_loss": -25.387475967407227, "global_step": 284878, "epoch": 3432} {"train_loss": -25.443408966064453, "global_step": 284879, "epoch": 3432} {"train_loss": -25.523244857788086, "global_step": 284880, "epoch": 3432} {"train_loss": -25.07844352722168, "global_step": 284881, "epoch": 3432} {"train_loss": -25.372329711914062, "global_step": 284882, "epoch": 3432} {"train_loss": -25.386980056762695, "global_step": 284883, "epoch": 3432} {"train_loss": -25.50265121459961, "global_step": 284884, "epoch": 3432} {"train_loss": -25.63788414001465, "global_step": 284885, "epoch": 3432} {"train_loss": -25.53297996520996, "global_step": 284886, "epoch": 3432} {"train_loss": -25.39280891418457, "global_step": 284887, "epoch": 3432} {"train_loss": -25.29486656188965, "global_step": 284888, "epoch": 3432} {"train_loss": -26.096662521362305, "global_step": 284889, "epoch": 3432} {"train_loss": -25.312183380126953, "global_step": 284890, "epoch": 3432} {"train_loss": -25.096914291381836, "global_step": 284891, "epoch": 3432} {"train_loss": -25.536962509155273, "global_step": 284892, "epoch": 3432} {"train_loss": -25.543664932250977, "global_step": 284893, "epoch": 3432} {"train_loss": -25.75864601135254, "global_step": 284894, "epoch": 3432} {"train_loss": -25.44685173034668, "global_step": 284895, "epoch": 3432} {"train_loss": -25.517126083374023, "global_step": 284896, "epoch": 3432} {"train_loss": -25.42951011657715, "global_step": 284897, "epoch": 3432} {"train_loss": -24.909236907958984, "global_step": 284898, "epoch": 3432} {"train_loss": -25.16562271118164, "global_step": 284899, "epoch": 3432} {"train_loss": -25.050161361694336, "global_step": 284900, "epoch": 3432} {"train_loss": -24.70197868347168, "global_step": 284901, "epoch": 3432} {"train_loss": -24.988576889038086, "global_step": 284902, "epoch": 3432} {"train_loss": -25.244247436523438, "global_step": 284903, "epoch": 3432} {"train_loss": -25.575632095336914, "global_step": 284904, "epoch": 3432} {"train_loss": -25.67547035217285, "global_step": 284905, "epoch": 3432} {"train_loss": -25.1446590423584, "global_step": 284906, "epoch": 3432} {"train_loss": -25.6539306640625, "global_step": 284907, "epoch": 3432} {"train_loss": -25.045101165771484, "global_step": 284908, "epoch": 3432} {"train_loss": -25.105905532836914, "global_step": 284909, "epoch": 3432} {"train_loss": -25.215360641479492, "global_step": 284910, "epoch": 3432} {"train_loss": -25.06597900390625, "global_step": 284911, "epoch": 3432} {"train_loss": -25.574071884155273, "global_step": 284912, "epoch": 3432} {"train_loss": -25.31206703186035, "global_step": 284913, "epoch": 3432} {"train_loss": -25.34640121459961, "global_step": 284914, "epoch": 3432} {"train_loss": -25.46110725402832, "global_step": 284915, "epoch": 3432} {"train_loss": -25.5596923828125, "global_step": 284916, "epoch": 3432} {"train_loss": -25.786636352539062, "global_step": 284917, "epoch": 3432} {"train_loss": -25.6618709564209, "global_step": 284918, "epoch": 3432} {"train_loss": -25.1959285736084, "global_step": 284919, "epoch": 3432} {"train_loss": -25.430784225463867, "global_step": 284920, "epoch": 3432} {"train_loss": -25.42659568786621, "global_step": 284921, "epoch": 3432} {"train_loss": -25.710474014282227, "global_step": 284922, "epoch": 3432} {"train_loss": -25.448850631713867, "global_step": 284923, "epoch": 3432} {"train_loss": -25.52195167541504, "global_step": 284924, "epoch": 3432} {"train_loss": -25.58743667602539, "global_step": 284925, "epoch": 3432} {"train_loss": -25.44411849975586, "global_step": 284926, "epoch": 3432} {"train_loss": -25.569684982299805, "global_step": 284927, "epoch": 3432} {"train_loss": -25.696813583374023, "global_step": 284928, "epoch": 3432} {"train_loss": -25.905200958251953, "global_step": 284929, "epoch": 3432} {"train_loss": -25.375974655151367, "global_step": 284930, "epoch": 3432} {"train_loss": -25.41983985900879, "global_step": 284931, "epoch": 3432} {"train_loss": -25.426403045654297, "global_step": 284932, "epoch": 3432} {"train_loss": -25.737213134765625, "global_step": 284933, "epoch": 3432} {"train_loss": -25.725982666015625, "global_step": 284934, "epoch": 3432} {"train_loss": -24.80143928527832, "global_step": 284935, "epoch": 3432} {"train_loss": -25.311857223510742, "global_step": 284936, "epoch": 3432} {"train_loss": -25.15126609802246, "global_step": 284937, "epoch": 3432} {"train_loss": -25.35393581620182, "global_step": 284938, "epoch": 3432, "val_loss": 7225971.5} {"train_loss": -24.83300018310547, "global_step": 284939, "epoch": 3433} {"train_loss": -24.09236717224121, "global_step": 284940, "epoch": 3433} {"train_loss": -24.679040908813477, "global_step": 284941, "epoch": 3433} {"train_loss": -24.479751586914062, "global_step": 284942, "epoch": 3433} {"train_loss": -25.15632438659668, "global_step": 284943, "epoch": 3433} {"train_loss": -24.520475387573242, "global_step": 284944, "epoch": 3433} {"train_loss": -25.271438598632812, "global_step": 284945, "epoch": 3433} {"train_loss": -24.539310455322266, "global_step": 284946, "epoch": 3433} {"train_loss": -25.201061248779297, "global_step": 284947, "epoch": 3433} {"train_loss": -24.861934661865234, "global_step": 284948, "epoch": 3433} {"train_loss": -24.843992233276367, "global_step": 284949, "epoch": 3433} {"train_loss": -25.39250946044922, "global_step": 284950, "epoch": 3433} {"train_loss": -25.349151611328125, "global_step": 284951, "epoch": 3433} {"train_loss": -24.740806579589844, "global_step": 284952, "epoch": 3433} {"train_loss": -25.14472198486328, "global_step": 284953, "epoch": 3433} {"train_loss": -25.109561920166016, "global_step": 284954, "epoch": 3433} {"train_loss": -25.007843017578125, "global_step": 284955, "epoch": 3433} {"train_loss": -25.30653190612793, "global_step": 284956, "epoch": 3433} {"train_loss": -24.95010757446289, "global_step": 284957, "epoch": 3433} {"train_loss": -25.135604858398438, "global_step": 284958, "epoch": 3433} {"train_loss": -25.428205490112305, "global_step": 284959, "epoch": 3433} {"train_loss": -25.275617599487305, "global_step": 284960, "epoch": 3433} {"train_loss": -25.280597686767578, "global_step": 284961, "epoch": 3433} {"train_loss": -25.394269943237305, "global_step": 284962, "epoch": 3433} {"train_loss": -25.61199951171875, "global_step": 284963, "epoch": 3433} {"train_loss": -25.286409378051758, "global_step": 284964, "epoch": 3433} {"train_loss": -25.62892723083496, "global_step": 284965, "epoch": 3433} {"train_loss": -25.453357696533203, "global_step": 284966, "epoch": 3433} {"train_loss": -25.246768951416016, "global_step": 284967, "epoch": 3433} {"train_loss": -25.271190643310547, "global_step": 284968, "epoch": 3433} {"train_loss": -25.82781982421875, "global_step": 284969, "epoch": 3433} {"train_loss": -25.919355392456055, "global_step": 284970, "epoch": 3433} {"train_loss": -25.46082878112793, "global_step": 284971, "epoch": 3433} {"train_loss": -25.47102165222168, "global_step": 284972, "epoch": 3433} {"train_loss": -25.5105037689209, "global_step": 284973, "epoch": 3433} {"train_loss": -25.687429428100586, "global_step": 284974, "epoch": 3433} {"train_loss": -25.869848251342773, "global_step": 284975, "epoch": 3433} {"train_loss": -25.463031768798828, "global_step": 284976, "epoch": 3433} {"train_loss": -25.4235897064209, "global_step": 284977, "epoch": 3433} {"train_loss": -25.496692657470703, "global_step": 284978, "epoch": 3433} {"train_loss": -25.438358306884766, "global_step": 284979, "epoch": 3433} {"train_loss": -25.585426330566406, "global_step": 284980, "epoch": 3433} {"train_loss": -25.820789337158203, "global_step": 284981, "epoch": 3433} {"train_loss": -25.798227310180664, "global_step": 284982, "epoch": 3433} {"train_loss": -26.028772354125977, "global_step": 284983, "epoch": 3433} {"train_loss": -25.475461959838867, "global_step": 284984, "epoch": 3433} {"train_loss": -25.886764526367188, "global_step": 284985, "epoch": 3433} {"train_loss": -25.502546310424805, "global_step": 284986, "epoch": 3433} {"train_loss": -25.870792388916016, "global_step": 284987, "epoch": 3433} {"train_loss": -25.626819610595703, "global_step": 284988, "epoch": 3433} {"train_loss": -25.764423370361328, "global_step": 284989, "epoch": 3433} {"train_loss": -25.403995513916016, "global_step": 284990, "epoch": 3433} {"train_loss": -25.53425407409668, "global_step": 284991, "epoch": 3433} {"train_loss": -25.631521224975586, "global_step": 284992, "epoch": 3433} {"train_loss": -25.180585861206055, "global_step": 284993, "epoch": 3433} {"train_loss": -25.43427085876465, "global_step": 284994, "epoch": 3433} {"train_loss": -24.696338653564453, "global_step": 284995, "epoch": 3433} {"train_loss": -24.208982467651367, "global_step": 284996, "epoch": 3433} {"train_loss": -24.677289962768555, "global_step": 284997, "epoch": 3433} {"train_loss": -25.189144134521484, "global_step": 284998, "epoch": 3433} {"train_loss": -24.639333724975586, "global_step": 284999, "epoch": 3433} {"train_loss": -24.891382217407227, "global_step": 285000, "epoch": 3433} {"train_loss": -25.567419052124023, "global_step": 285001, "epoch": 3433} {"train_loss": -25.059167861938477, "global_step": 285002, "epoch": 3433} {"train_loss": -24.826807022094727, "global_step": 285003, "epoch": 3433} {"train_loss": -24.94891929626465, "global_step": 285004, "epoch": 3433} {"train_loss": -25.30342674255371, "global_step": 285005, "epoch": 3433} {"train_loss": -24.940214157104492, "global_step": 285006, "epoch": 3433} {"train_loss": -25.14032745361328, "global_step": 285007, "epoch": 3433} {"train_loss": -25.202259063720703, "global_step": 285008, "epoch": 3433} {"train_loss": -25.16139793395996, "global_step": 285009, "epoch": 3433} {"train_loss": -25.114761352539062, "global_step": 285010, "epoch": 3433} {"train_loss": -24.789587020874023, "global_step": 285011, "epoch": 3433} {"train_loss": -24.68794059753418, "global_step": 285012, "epoch": 3433} {"train_loss": -25.145156860351562, "global_step": 285013, "epoch": 3433} {"train_loss": -25.025251388549805, "global_step": 285014, "epoch": 3433} {"train_loss": -25.412887573242188, "global_step": 285015, "epoch": 3433} {"train_loss": -25.39901351928711, "global_step": 285016, "epoch": 3433} {"train_loss": -25.243850708007812, "global_step": 285017, "epoch": 3433} {"train_loss": -25.49032211303711, "global_step": 285018, "epoch": 3433} {"train_loss": -25.70111656188965, "global_step": 285019, "epoch": 3433} {"train_loss": -25.64719009399414, "global_step": 285020, "epoch": 3433} {"train_loss": -25.25887657073607, "global_step": 285021, "epoch": 3433, "val_loss": 7012803.0} {"train_loss": -25.544200897216797, "global_step": 285022, "epoch": 3434} {"train_loss": -25.556550979614258, "global_step": 285023, "epoch": 3434} {"train_loss": -25.176013946533203, "global_step": 285024, "epoch": 3434} {"train_loss": -25.732303619384766, "global_step": 285025, "epoch": 3434} {"train_loss": -25.119720458984375, "global_step": 285026, "epoch": 3434} {"train_loss": -25.491466522216797, "global_step": 285027, "epoch": 3434} {"train_loss": -25.686193466186523, "global_step": 285028, "epoch": 3434} {"train_loss": -25.321622848510742, "global_step": 285029, "epoch": 3434} {"train_loss": -25.74993896484375, "global_step": 285030, "epoch": 3434} {"train_loss": -25.001991271972656, "global_step": 285031, "epoch": 3434} {"train_loss": -25.559492111206055, "global_step": 285032, "epoch": 3434} {"train_loss": -25.444658279418945, "global_step": 285033, "epoch": 3434} {"train_loss": -25.37828254699707, "global_step": 285034, "epoch": 3434} {"train_loss": -25.41095733642578, "global_step": 285035, "epoch": 3434} {"train_loss": -25.350820541381836, "global_step": 285036, "epoch": 3434} {"train_loss": -25.32019805908203, "global_step": 285037, "epoch": 3434} {"train_loss": -25.275054931640625, "global_step": 285038, "epoch": 3434} {"train_loss": -25.26869010925293, "global_step": 285039, "epoch": 3434} {"train_loss": -25.8701229095459, "global_step": 285040, "epoch": 3434} {"train_loss": -25.50826072692871, "global_step": 285041, "epoch": 3434} {"train_loss": -25.336179733276367, "global_step": 285042, "epoch": 3434} {"train_loss": -25.629074096679688, "global_step": 285043, "epoch": 3434} {"train_loss": -25.226490020751953, "global_step": 285044, "epoch": 3434} {"train_loss": -25.333255767822266, "global_step": 285045, "epoch": 3434} {"train_loss": -25.242467880249023, "global_step": 285046, "epoch": 3434} {"train_loss": -25.842016220092773, "global_step": 285047, "epoch": 3434} {"train_loss": -25.666675567626953, "global_step": 285048, "epoch": 3434} {"train_loss": -25.678674697875977, "global_step": 285049, "epoch": 3434} {"train_loss": -25.6780948638916, "global_step": 285050, "epoch": 3434} {"train_loss": -25.583829879760742, "global_step": 285051, "epoch": 3434} {"train_loss": -25.604536056518555, "global_step": 285052, "epoch": 3434} {"train_loss": -25.1485652923584, "global_step": 285053, "epoch": 3434} {"train_loss": -25.53902244567871, "global_step": 285054, "epoch": 3434} {"train_loss": -25.44419288635254, "global_step": 285055, "epoch": 3434} {"train_loss": -25.295988082885742, "global_step": 285056, "epoch": 3434} {"train_loss": -25.049270629882812, "global_step": 285057, "epoch": 3434} {"train_loss": -25.310163497924805, "global_step": 285058, "epoch": 3434} {"train_loss": -25.431533813476562, "global_step": 285059, "epoch": 3434} {"train_loss": -25.509906768798828, "global_step": 285060, "epoch": 3434} {"train_loss": -25.90272331237793, "global_step": 285061, "epoch": 3434} {"train_loss": -25.465957641601562, "global_step": 285062, "epoch": 3434} {"train_loss": -25.524099349975586, "global_step": 285063, "epoch": 3434} {"train_loss": -25.57105827331543, "global_step": 285064, "epoch": 3434} {"train_loss": -25.443470001220703, "global_step": 285065, "epoch": 3434} {"train_loss": -25.563825607299805, "global_step": 285066, "epoch": 3434} {"train_loss": -25.116056442260742, "global_step": 285067, "epoch": 3434} {"train_loss": -25.8242244720459, "global_step": 285068, "epoch": 3434} {"train_loss": -25.44540786743164, "global_step": 285069, "epoch": 3434} {"train_loss": -25.72804069519043, "global_step": 285070, "epoch": 3434} {"train_loss": -25.4724178314209, "global_step": 285071, "epoch": 3434} {"train_loss": -25.68216896057129, "global_step": 285072, "epoch": 3434} {"train_loss": -25.372846603393555, "global_step": 285073, "epoch": 3434} {"train_loss": -25.789941787719727, "global_step": 285074, "epoch": 3434} {"train_loss": -25.51637077331543, "global_step": 285075, "epoch": 3434} {"train_loss": -25.509450912475586, "global_step": 285076, "epoch": 3434} {"train_loss": -25.6435546875, "global_step": 285077, "epoch": 3434} {"train_loss": -25.31568717956543, "global_step": 285078, "epoch": 3434} {"train_loss": -25.428266525268555, "global_step": 285079, "epoch": 3434} {"train_loss": -25.51166343688965, "global_step": 285080, "epoch": 3434} {"train_loss": -25.152929306030273, "global_step": 285081, "epoch": 3434} {"train_loss": -24.861083984375, "global_step": 285082, "epoch": 3434} {"train_loss": -25.34046745300293, "global_step": 285083, "epoch": 3434} {"train_loss": -25.539113998413086, "global_step": 285084, "epoch": 3434} {"train_loss": -25.122461318969727, "global_step": 285085, "epoch": 3434} {"train_loss": -25.65842628479004, "global_step": 285086, "epoch": 3434} {"train_loss": -25.598207473754883, "global_step": 285087, "epoch": 3434} {"train_loss": -25.316801071166992, "global_step": 285088, "epoch": 3434} {"train_loss": -25.492841720581055, "global_step": 285089, "epoch": 3434} {"train_loss": -25.651325225830078, "global_step": 285090, "epoch": 3434} {"train_loss": -25.661304473876953, "global_step": 285091, "epoch": 3434} {"train_loss": -25.56637191772461, "global_step": 285092, "epoch": 3434} {"train_loss": -25.2462215423584, "global_step": 285093, "epoch": 3434} {"train_loss": -25.334369659423828, "global_step": 285094, "epoch": 3434} {"train_loss": -25.36543846130371, "global_step": 285095, "epoch": 3434} {"train_loss": -25.385435104370117, "global_step": 285096, "epoch": 3434} {"train_loss": -25.11798667907715, "global_step": 285097, "epoch": 3434} {"train_loss": -25.41678237915039, "global_step": 285098, "epoch": 3434} {"train_loss": -25.212886810302734, "global_step": 285099, "epoch": 3434} {"train_loss": -25.335693359375, "global_step": 285100, "epoch": 3434} {"train_loss": -25.664052963256836, "global_step": 285101, "epoch": 3434} {"train_loss": -25.50140953063965, "global_step": 285102, "epoch": 3434} {"train_loss": -25.429174423217773, "global_step": 285103, "epoch": 3434} {"train_loss": -25.46469840084214, "global_step": 285104, "epoch": 3434, "val_loss": 7101668.0} {"train_loss": -23.71906852722168, "global_step": 285105, "epoch": 3435} {"train_loss": -24.01068115234375, "global_step": 285106, "epoch": 3435} {"train_loss": -23.99100685119629, "global_step": 285107, "epoch": 3435} {"train_loss": -24.47471046447754, "global_step": 285108, "epoch": 3435} {"train_loss": -24.525402069091797, "global_step": 285109, "epoch": 3435} {"train_loss": -24.07831573486328, "global_step": 285110, "epoch": 3435} {"train_loss": -24.508886337280273, "global_step": 285111, "epoch": 3435} {"train_loss": -24.345430374145508, "global_step": 285112, "epoch": 3435} {"train_loss": -24.5245418548584, "global_step": 285113, "epoch": 3435} {"train_loss": -24.793720245361328, "global_step": 285114, "epoch": 3435} {"train_loss": -24.829687118530273, "global_step": 285115, "epoch": 3435} {"train_loss": -24.659841537475586, "global_step": 285116, "epoch": 3435} {"train_loss": -24.91598892211914, "global_step": 285117, "epoch": 3435} {"train_loss": -24.8377742767334, "global_step": 285118, "epoch": 3435} {"train_loss": -24.81510353088379, "global_step": 285119, "epoch": 3435} {"train_loss": -25.0733642578125, "global_step": 285120, "epoch": 3435} {"train_loss": -24.825040817260742, "global_step": 285121, "epoch": 3435} {"train_loss": -24.924402236938477, "global_step": 285122, "epoch": 3435} {"train_loss": -24.605737686157227, "global_step": 285123, "epoch": 3435} {"train_loss": -24.923749923706055, "global_step": 285124, "epoch": 3435} {"train_loss": -25.0563907623291, "global_step": 285125, "epoch": 3435} {"train_loss": -25.035154342651367, "global_step": 285126, "epoch": 3435} {"train_loss": -25.35159683227539, "global_step": 285127, "epoch": 3435} {"train_loss": -25.559574127197266, "global_step": 285128, "epoch": 3435} {"train_loss": -25.208890914916992, "global_step": 285129, "epoch": 3435} {"train_loss": -25.088232040405273, "global_step": 285130, "epoch": 3435} {"train_loss": -25.12837028503418, "global_step": 285131, "epoch": 3435} {"train_loss": -25.189117431640625, "global_step": 285132, "epoch": 3435} {"train_loss": -25.408695220947266, "global_step": 285133, "epoch": 3435} {"train_loss": -25.291322708129883, "global_step": 285134, "epoch": 3435} {"train_loss": -25.71131706237793, "global_step": 285135, "epoch": 3435} {"train_loss": -25.394874572753906, "global_step": 285136, "epoch": 3435} {"train_loss": -25.437942504882812, "global_step": 285137, "epoch": 3435} {"train_loss": -25.557064056396484, "global_step": 285138, "epoch": 3435} {"train_loss": -25.238819122314453, "global_step": 285139, "epoch": 3435} {"train_loss": -25.651620864868164, "global_step": 285140, "epoch": 3435} {"train_loss": -25.490341186523438, "global_step": 285141, "epoch": 3435} {"train_loss": -25.419084548950195, "global_step": 285142, "epoch": 3435} {"train_loss": -25.639923095703125, "global_step": 285143, "epoch": 3435} {"train_loss": -25.22768783569336, "global_step": 285144, "epoch": 3435} {"train_loss": -25.076465606689453, "global_step": 285145, "epoch": 3435} {"train_loss": -25.358734130859375, "global_step": 285146, "epoch": 3435} {"train_loss": -25.206342697143555, "global_step": 285147, "epoch": 3435} {"train_loss": -25.679553985595703, "global_step": 285148, "epoch": 3435} {"train_loss": -25.379194259643555, "global_step": 285149, "epoch": 3435} {"train_loss": -25.440597534179688, "global_step": 285150, "epoch": 3435} {"train_loss": -25.6335506439209, "global_step": 285151, "epoch": 3435} {"train_loss": -25.5432186126709, "global_step": 285152, "epoch": 3435} {"train_loss": -25.18787384033203, "global_step": 285153, "epoch": 3435} {"train_loss": -25.392181396484375, "global_step": 285154, "epoch": 3435} {"train_loss": -25.411666870117188, "global_step": 285155, "epoch": 3435} {"train_loss": -25.497224807739258, "global_step": 285156, "epoch": 3435} {"train_loss": -25.57562828063965, "global_step": 285157, "epoch": 3435} {"train_loss": -25.481735229492188, "global_step": 285158, "epoch": 3435} {"train_loss": -25.395893096923828, "global_step": 285159, "epoch": 3435} {"train_loss": -25.497079849243164, "global_step": 285160, "epoch": 3435} {"train_loss": -25.147756576538086, "global_step": 285161, "epoch": 3435} {"train_loss": -25.899518966674805, "global_step": 285162, "epoch": 3435} {"train_loss": -25.689117431640625, "global_step": 285163, "epoch": 3435} {"train_loss": -25.506328582763672, "global_step": 285164, "epoch": 3435} {"train_loss": -25.0454044342041, "global_step": 285165, "epoch": 3435} {"train_loss": -25.407163619995117, "global_step": 285166, "epoch": 3435} {"train_loss": -25.607934951782227, "global_step": 285167, "epoch": 3435} {"train_loss": -25.377365112304688, "global_step": 285168, "epoch": 3435} {"train_loss": -25.25630760192871, "global_step": 285169, "epoch": 3435} {"train_loss": -25.444730758666992, "global_step": 285170, "epoch": 3435} {"train_loss": -25.677656173706055, "global_step": 285171, "epoch": 3435} {"train_loss": -25.230955123901367, "global_step": 285172, "epoch": 3435} {"train_loss": -25.693252563476562, "global_step": 285173, "epoch": 3435} {"train_loss": -25.321701049804688, "global_step": 285174, "epoch": 3435} {"train_loss": -25.271574020385742, "global_step": 285175, "epoch": 3435} {"train_loss": -25.54010581970215, "global_step": 285176, "epoch": 3435} {"train_loss": -25.594701766967773, "global_step": 285177, "epoch": 3435} {"train_loss": -25.23023796081543, "global_step": 285178, "epoch": 3435} {"train_loss": -25.26441192626953, "global_step": 285179, "epoch": 3435} {"train_loss": -25.58182144165039, "global_step": 285180, "epoch": 3435} {"train_loss": -25.7403507232666, "global_step": 285181, "epoch": 3435} {"train_loss": -25.826414108276367, "global_step": 285182, "epoch": 3435} {"train_loss": -25.685062408447266, "global_step": 285183, "epoch": 3435} {"train_loss": -25.579513549804688, "global_step": 285184, "epoch": 3435} {"train_loss": -25.31529426574707, "global_step": 285185, "epoch": 3435} {"train_loss": -25.390628814697266, "global_step": 285186, "epoch": 3435} {"train_loss": -25.219031759055262, "global_step": 285187, "epoch": 3435, "val_loss": 7012688.0} {"train_loss": -24.96300506591797, "global_step": 285188, "epoch": 3436} {"train_loss": -24.276187896728516, "global_step": 285189, "epoch": 3436} {"train_loss": -24.012603759765625, "global_step": 285190, "epoch": 3436} {"train_loss": -24.968229293823242, "global_step": 285191, "epoch": 3436} {"train_loss": -25.18756866455078, "global_step": 285192, "epoch": 3436} {"train_loss": -24.880064010620117, "global_step": 285193, "epoch": 3436} {"train_loss": -24.97223663330078, "global_step": 285194, "epoch": 3436} {"train_loss": -24.6915225982666, "global_step": 285195, "epoch": 3436} {"train_loss": -25.424163818359375, "global_step": 285196, "epoch": 3436} {"train_loss": -24.951934814453125, "global_step": 285197, "epoch": 3436} {"train_loss": -25.739973068237305, "global_step": 285198, "epoch": 3436} {"train_loss": -24.993879318237305, "global_step": 285199, "epoch": 3436} {"train_loss": -25.343412399291992, "global_step": 285200, "epoch": 3436} {"train_loss": -24.85279655456543, "global_step": 285201, "epoch": 3436} {"train_loss": -25.05369758605957, "global_step": 285202, "epoch": 3436} {"train_loss": -25.389860153198242, "global_step": 285203, "epoch": 3436} {"train_loss": -25.19647789001465, "global_step": 285204, "epoch": 3436} {"train_loss": -25.154403686523438, "global_step": 285205, "epoch": 3436} {"train_loss": -25.55043601989746, "global_step": 285206, "epoch": 3436} {"train_loss": -25.20289421081543, "global_step": 285207, "epoch": 3436} {"train_loss": -25.424924850463867, "global_step": 285208, "epoch": 3436} {"train_loss": -25.35327911376953, "global_step": 285209, "epoch": 3436} {"train_loss": -25.224945068359375, "global_step": 285210, "epoch": 3436} {"train_loss": -25.272123336791992, "global_step": 285211, "epoch": 3436} {"train_loss": -25.291719436645508, "global_step": 285212, "epoch": 3436} {"train_loss": -25.22532081604004, "global_step": 285213, "epoch": 3436} {"train_loss": -25.58197593688965, "global_step": 285214, "epoch": 3436} {"train_loss": -25.289920806884766, "global_step": 285215, "epoch": 3436} {"train_loss": -25.311464309692383, "global_step": 285216, "epoch": 3436} {"train_loss": -25.55824851989746, "global_step": 285217, "epoch": 3436} {"train_loss": -25.420255661010742, "global_step": 285218, "epoch": 3436} {"train_loss": -25.64759635925293, "global_step": 285219, "epoch": 3436} {"train_loss": -25.58669090270996, "global_step": 285220, "epoch": 3436} {"train_loss": -25.9081974029541, "global_step": 285221, "epoch": 3436} {"train_loss": -25.448163986206055, "global_step": 285222, "epoch": 3436} {"train_loss": -25.429302215576172, "global_step": 285223, "epoch": 3436} {"train_loss": -25.681995391845703, "global_step": 285224, "epoch": 3436} {"train_loss": -25.181676864624023, "global_step": 285225, "epoch": 3436} {"train_loss": -25.326156616210938, "global_step": 285226, "epoch": 3436} {"train_loss": -25.733434677124023, "global_step": 285227, "epoch": 3436} {"train_loss": -25.664813995361328, "global_step": 285228, "epoch": 3436} {"train_loss": -25.60349464416504, "global_step": 285229, "epoch": 3436} {"train_loss": -25.397581100463867, "global_step": 285230, "epoch": 3436} {"train_loss": -25.564388275146484, "global_step": 285231, "epoch": 3436} {"train_loss": -25.37545394897461, "global_step": 285232, "epoch": 3436} {"train_loss": -25.623950958251953, "global_step": 285233, "epoch": 3436} {"train_loss": -25.699909210205078, "global_step": 285234, "epoch": 3436} {"train_loss": -25.577335357666016, "global_step": 285235, "epoch": 3436} {"train_loss": -25.457387924194336, "global_step": 285236, "epoch": 3436} {"train_loss": -25.63543701171875, "global_step": 285237, "epoch": 3436} {"train_loss": -25.539281845092773, "global_step": 285238, "epoch": 3436} {"train_loss": -25.036834716796875, "global_step": 285239, "epoch": 3436} {"train_loss": -25.52200698852539, "global_step": 285240, "epoch": 3436} {"train_loss": -25.59992790222168, "global_step": 285241, "epoch": 3436} {"train_loss": -25.608020782470703, "global_step": 285242, "epoch": 3436} {"train_loss": -25.241580963134766, "global_step": 285243, "epoch": 3436} {"train_loss": -25.040210723876953, "global_step": 285244, "epoch": 3436} {"train_loss": -25.635522842407227, "global_step": 285245, "epoch": 3436} {"train_loss": -25.2281494140625, "global_step": 285246, "epoch": 3436} {"train_loss": -24.730764389038086, "global_step": 285247, "epoch": 3436} {"train_loss": -25.866413116455078, "global_step": 285248, "epoch": 3436} {"train_loss": -25.66212272644043, "global_step": 285249, "epoch": 3436} {"train_loss": -25.166597366333008, "global_step": 285250, "epoch": 3436} {"train_loss": -25.52720069885254, "global_step": 285251, "epoch": 3436} {"train_loss": -25.577510833740234, "global_step": 285252, "epoch": 3436} {"train_loss": -25.5738468170166, "global_step": 285253, "epoch": 3436} {"train_loss": -25.794111251831055, "global_step": 285254, "epoch": 3436} {"train_loss": -25.413171768188477, "global_step": 285255, "epoch": 3436} {"train_loss": -25.704259872436523, "global_step": 285256, "epoch": 3436} {"train_loss": -25.681737899780273, "global_step": 285257, "epoch": 3436} {"train_loss": -25.515600204467773, "global_step": 285258, "epoch": 3436} {"train_loss": -25.682937622070312, "global_step": 285259, "epoch": 3436} {"train_loss": -25.562030792236328, "global_step": 285260, "epoch": 3436} {"train_loss": -25.309492111206055, "global_step": 285261, "epoch": 3436} {"train_loss": -25.51897621154785, "global_step": 285262, "epoch": 3436} {"train_loss": -25.879526138305664, "global_step": 285263, "epoch": 3436} {"train_loss": -25.429433822631836, "global_step": 285264, "epoch": 3436} {"train_loss": -25.45765495300293, "global_step": 285265, "epoch": 3436} {"train_loss": -25.220722198486328, "global_step": 285266, "epoch": 3436} {"train_loss": -26.0615291595459, "global_step": 285267, "epoch": 3436} {"train_loss": -25.45944595336914, "global_step": 285268, "epoch": 3436} {"train_loss": -25.54324722290039, "global_step": 285269, "epoch": 3436} {"train_loss": -25.37328959085855, "global_step": 285270, "epoch": 3436, "val_loss": 7072575.0} {"train_loss": -25.53526496887207, "global_step": 285271, "epoch": 3437} {"train_loss": -24.604665756225586, "global_step": 285272, "epoch": 3437} {"train_loss": -24.228904724121094, "global_step": 285273, "epoch": 3437} {"train_loss": -24.52971649169922, "global_step": 285274, "epoch": 3437} {"train_loss": -25.130943298339844, "global_step": 285275, "epoch": 3437} {"train_loss": -24.589115142822266, "global_step": 285276, "epoch": 3437} {"train_loss": -24.96315574645996, "global_step": 285277, "epoch": 3437} {"train_loss": -25.340688705444336, "global_step": 285278, "epoch": 3437} {"train_loss": -25.237138748168945, "global_step": 285279, "epoch": 3437} {"train_loss": -25.27187156677246, "global_step": 285280, "epoch": 3437} {"train_loss": -25.115787506103516, "global_step": 285281, "epoch": 3437} {"train_loss": -25.394681930541992, "global_step": 285282, "epoch": 3437} {"train_loss": -25.55316734313965, "global_step": 285283, "epoch": 3437} {"train_loss": -25.28974723815918, "global_step": 285284, "epoch": 3437} {"train_loss": -25.415512084960938, "global_step": 285285, "epoch": 3437} {"train_loss": -25.102558135986328, "global_step": 285286, "epoch": 3437} {"train_loss": -25.148733139038086, "global_step": 285287, "epoch": 3437} {"train_loss": -25.46268653869629, "global_step": 285288, "epoch": 3437} {"train_loss": -25.066059112548828, "global_step": 285289, "epoch": 3437} {"train_loss": -25.271106719970703, "global_step": 285290, "epoch": 3437} {"train_loss": -25.39202308654785, "global_step": 285291, "epoch": 3437} {"train_loss": -25.490671157836914, "global_step": 285292, "epoch": 3437} {"train_loss": -25.346853256225586, "global_step": 285293, "epoch": 3437} {"train_loss": -25.067371368408203, "global_step": 285294, "epoch": 3437} {"train_loss": -25.459379196166992, "global_step": 285295, "epoch": 3437} {"train_loss": -25.4447021484375, "global_step": 285296, "epoch": 3437} {"train_loss": -25.387571334838867, "global_step": 285297, "epoch": 3437} {"train_loss": -25.52438735961914, "global_step": 285298, "epoch": 3437} {"train_loss": -25.59114646911621, "global_step": 285299, "epoch": 3437} {"train_loss": -25.359846115112305, "global_step": 285300, "epoch": 3437} {"train_loss": -25.277658462524414, "global_step": 285301, "epoch": 3437} {"train_loss": -25.28020668029785, "global_step": 285302, "epoch": 3437} {"train_loss": -25.60177993774414, "global_step": 285303, "epoch": 3437} {"train_loss": -25.716772079467773, "global_step": 285304, "epoch": 3437} {"train_loss": -25.595611572265625, "global_step": 285305, "epoch": 3437} {"train_loss": -25.622028350830078, "global_step": 285306, "epoch": 3437} {"train_loss": -25.495508193969727, "global_step": 285307, "epoch": 3437} {"train_loss": -26.154956817626953, "global_step": 285308, "epoch": 3437} {"train_loss": -25.678577423095703, "global_step": 285309, "epoch": 3437} {"train_loss": -25.45759391784668, "global_step": 285310, "epoch": 3437} {"train_loss": -25.292348861694336, "global_step": 285311, "epoch": 3437} {"train_loss": -25.653369903564453, "global_step": 285312, "epoch": 3437} {"train_loss": -25.8485050201416, "global_step": 285313, "epoch": 3437} {"train_loss": -25.355329513549805, "global_step": 285314, "epoch": 3437} {"train_loss": -25.2215633392334, "global_step": 285315, "epoch": 3437} {"train_loss": -25.743213653564453, "global_step": 285316, "epoch": 3437} {"train_loss": -25.440149307250977, "global_step": 285317, "epoch": 3437} {"train_loss": -25.33185386657715, "global_step": 285318, "epoch": 3437} {"train_loss": -25.729633331298828, "global_step": 285319, "epoch": 3437} {"train_loss": -25.607160568237305, "global_step": 285320, "epoch": 3437} {"train_loss": -25.796873092651367, "global_step": 285321, "epoch": 3437} {"train_loss": -25.67740249633789, "global_step": 285322, "epoch": 3437} {"train_loss": -25.685211181640625, "global_step": 285323, "epoch": 3437} {"train_loss": -25.579870223999023, "global_step": 285324, "epoch": 3437} {"train_loss": -25.534521102905273, "global_step": 285325, "epoch": 3437} {"train_loss": -25.97511100769043, "global_step": 285326, "epoch": 3437} {"train_loss": -25.476057052612305, "global_step": 285327, "epoch": 3437} {"train_loss": -25.647153854370117, "global_step": 285328, "epoch": 3437} {"train_loss": -25.40776824951172, "global_step": 285329, "epoch": 3437} {"train_loss": -25.752674102783203, "global_step": 285330, "epoch": 3437} {"train_loss": -25.5754451751709, "global_step": 285331, "epoch": 3437} {"train_loss": -25.45037841796875, "global_step": 285332, "epoch": 3437} {"train_loss": -25.223445892333984, "global_step": 285333, "epoch": 3437} {"train_loss": -24.765005111694336, "global_step": 285334, "epoch": 3437} {"train_loss": -25.14143943786621, "global_step": 285335, "epoch": 3437} {"train_loss": -24.870403289794922, "global_step": 285336, "epoch": 3437} {"train_loss": -25.147857666015625, "global_step": 285337, "epoch": 3437} {"train_loss": -25.49899673461914, "global_step": 285338, "epoch": 3437} {"train_loss": -25.039358139038086, "global_step": 285339, "epoch": 3437} {"train_loss": -25.20757293701172, "global_step": 285340, "epoch": 3437} {"train_loss": -25.13797378540039, "global_step": 285341, "epoch": 3437} {"train_loss": -25.391040802001953, "global_step": 285342, "epoch": 3437} {"train_loss": -25.21836280822754, "global_step": 285343, "epoch": 3437} {"train_loss": -25.490392684936523, "global_step": 285344, "epoch": 3437} {"train_loss": -25.333255767822266, "global_step": 285345, "epoch": 3437} {"train_loss": -25.402019500732422, "global_step": 285346, "epoch": 3437} {"train_loss": -25.215280532836914, "global_step": 285347, "epoch": 3437} {"train_loss": -25.328142166137695, "global_step": 285348, "epoch": 3437} {"train_loss": -25.32396125793457, "global_step": 285349, "epoch": 3437} {"train_loss": -25.205320358276367, "global_step": 285350, "epoch": 3437} {"train_loss": -25.107465744018555, "global_step": 285351, "epoch": 3437} {"train_loss": -25.68552017211914, "global_step": 285352, "epoch": 3437} {"train_loss": -25.36655720170722, "global_step": 285353, "epoch": 3437, "val_loss": 7035081.0} {"train_loss": -24.786239624023438, "global_step": 285354, "epoch": 3438} {"train_loss": -24.232465744018555, "global_step": 285355, "epoch": 3438} {"train_loss": -24.353988647460938, "global_step": 285356, "epoch": 3438} {"train_loss": -25.284292221069336, "global_step": 285357, "epoch": 3438} {"train_loss": -25.186920166015625, "global_step": 285358, "epoch": 3438} {"train_loss": -24.491788864135742, "global_step": 285359, "epoch": 3438} {"train_loss": -24.87663459777832, "global_step": 285360, "epoch": 3438} {"train_loss": -25.037765502929688, "global_step": 285361, "epoch": 3438} {"train_loss": -24.50925064086914, "global_step": 285362, "epoch": 3438} {"train_loss": -24.992700576782227, "global_step": 285363, "epoch": 3438} {"train_loss": -24.89939308166504, "global_step": 285364, "epoch": 3438} {"train_loss": -25.290634155273438, "global_step": 285365, "epoch": 3438} {"train_loss": -24.481801986694336, "global_step": 285366, "epoch": 3438} {"train_loss": -25.067041397094727, "global_step": 285367, "epoch": 3438} {"train_loss": -25.07611656188965, "global_step": 285368, "epoch": 3438} {"train_loss": -25.250516891479492, "global_step": 285369, "epoch": 3438} {"train_loss": -25.102432250976562, "global_step": 285370, "epoch": 3438} {"train_loss": -25.142210006713867, "global_step": 285371, "epoch": 3438} {"train_loss": -25.489856719970703, "global_step": 285372, "epoch": 3438} {"train_loss": -25.171491622924805, "global_step": 285373, "epoch": 3438} {"train_loss": -25.249143600463867, "global_step": 285374, "epoch": 3438} {"train_loss": -25.32404136657715, "global_step": 285375, "epoch": 3438} {"train_loss": -25.275968551635742, "global_step": 285376, "epoch": 3438} {"train_loss": -25.08765983581543, "global_step": 285377, "epoch": 3438} {"train_loss": -24.873924255371094, "global_step": 285378, "epoch": 3438} {"train_loss": -25.1741943359375, "global_step": 285379, "epoch": 3438} {"train_loss": -25.46101188659668, "global_step": 285380, "epoch": 3438} {"train_loss": -24.899612426757812, "global_step": 285381, "epoch": 3438} {"train_loss": -25.82122802734375, "global_step": 285382, "epoch": 3438} {"train_loss": -25.46843147277832, "global_step": 285383, "epoch": 3438} {"train_loss": -25.831769943237305, "global_step": 285384, "epoch": 3438} {"train_loss": -25.500783920288086, "global_step": 285385, "epoch": 3438} {"train_loss": -25.690021514892578, "global_step": 285386, "epoch": 3438} {"train_loss": -25.7293643951416, "global_step": 285387, "epoch": 3438} {"train_loss": -25.27046012878418, "global_step": 285388, "epoch": 3438} {"train_loss": -25.285846710205078, "global_step": 285389, "epoch": 3438} {"train_loss": -25.690439224243164, "global_step": 285390, "epoch": 3438} {"train_loss": -25.19968605041504, "global_step": 285391, "epoch": 3438} {"train_loss": -25.184499740600586, "global_step": 285392, "epoch": 3438} {"train_loss": -25.527246475219727, "global_step": 285393, "epoch": 3438} {"train_loss": -25.89139175415039, "global_step": 285394, "epoch": 3438} {"train_loss": -25.25057029724121, "global_step": 285395, "epoch": 3438} {"train_loss": -25.452102661132812, "global_step": 285396, "epoch": 3438} {"train_loss": -25.338834762573242, "global_step": 285397, "epoch": 3438} {"train_loss": -25.337133407592773, "global_step": 285398, "epoch": 3438} {"train_loss": -25.548795700073242, "global_step": 285399, "epoch": 3438} {"train_loss": -25.544883728027344, "global_step": 285400, "epoch": 3438} {"train_loss": -25.540761947631836, "global_step": 285401, "epoch": 3438} {"train_loss": -25.506391525268555, "global_step": 285402, "epoch": 3438} {"train_loss": -25.6286678314209, "global_step": 285403, "epoch": 3438} {"train_loss": -25.438879013061523, "global_step": 285404, "epoch": 3438} {"train_loss": -25.45708656311035, "global_step": 285405, "epoch": 3438} {"train_loss": -25.730270385742188, "global_step": 285406, "epoch": 3438} {"train_loss": -25.551912307739258, "global_step": 285407, "epoch": 3438} {"train_loss": -25.647260665893555, "global_step": 285408, "epoch": 3438} {"train_loss": -25.415563583374023, "global_step": 285409, "epoch": 3438} {"train_loss": -25.441530227661133, "global_step": 285410, "epoch": 3438} {"train_loss": -25.59429359436035, "global_step": 285411, "epoch": 3438} {"train_loss": -25.662982940673828, "global_step": 285412, "epoch": 3438} {"train_loss": -25.956647872924805, "global_step": 285413, "epoch": 3438} {"train_loss": -25.069313049316406, "global_step": 285414, "epoch": 3438} {"train_loss": -25.53679847717285, "global_step": 285415, "epoch": 3438} {"train_loss": -25.244535446166992, "global_step": 285416, "epoch": 3438} {"train_loss": -25.758630752563477, "global_step": 285417, "epoch": 3438} {"train_loss": -25.396337509155273, "global_step": 285418, "epoch": 3438} {"train_loss": -25.626026153564453, "global_step": 285419, "epoch": 3438} {"train_loss": -25.454103469848633, "global_step": 285420, "epoch": 3438} {"train_loss": -25.76178550720215, "global_step": 285421, "epoch": 3438} {"train_loss": -25.343460083007812, "global_step": 285422, "epoch": 3438} {"train_loss": -25.48369598388672, "global_step": 285423, "epoch": 3438} {"train_loss": -25.53828239440918, "global_step": 285424, "epoch": 3438} {"train_loss": -25.794111251831055, "global_step": 285425, "epoch": 3438} {"train_loss": -25.91047477722168, "global_step": 285426, "epoch": 3438} {"train_loss": -25.480695724487305, "global_step": 285427, "epoch": 3438} {"train_loss": -25.596342086791992, "global_step": 285428, "epoch": 3438} {"train_loss": -25.579299926757812, "global_step": 285429, "epoch": 3438} {"train_loss": -25.75070571899414, "global_step": 285430, "epoch": 3438} {"train_loss": -25.439821243286133, "global_step": 285431, "epoch": 3438} {"train_loss": -25.815235137939453, "global_step": 285432, "epoch": 3438} {"train_loss": -25.333656311035156, "global_step": 285433, "epoch": 3438} {"train_loss": -25.62458610534668, "global_step": 285434, "epoch": 3438} {"train_loss": -26.117202758789062, "global_step": 285435, "epoch": 3438} {"train_loss": -25.377160658319312, "global_step": 285436, "epoch": 3438, "val_loss": 7096368.0} {"train_loss": -24.788015365600586, "global_step": 285437, "epoch": 3439} {"train_loss": -24.384153366088867, "global_step": 285438, "epoch": 3439} {"train_loss": -24.513774871826172, "global_step": 285439, "epoch": 3439} {"train_loss": -24.87322998046875, "global_step": 285440, "epoch": 3439} {"train_loss": -25.326080322265625, "global_step": 285441, "epoch": 3439} {"train_loss": -24.727506637573242, "global_step": 285442, "epoch": 3439} {"train_loss": -25.166135787963867, "global_step": 285443, "epoch": 3439} {"train_loss": -24.81845474243164, "global_step": 285444, "epoch": 3439} {"train_loss": -25.182218551635742, "global_step": 285445, "epoch": 3439} {"train_loss": -25.239301681518555, "global_step": 285446, "epoch": 3439} {"train_loss": -25.004209518432617, "global_step": 285447, "epoch": 3439} {"train_loss": -25.313180923461914, "global_step": 285448, "epoch": 3439} {"train_loss": -25.331735610961914, "global_step": 285449, "epoch": 3439} {"train_loss": -25.283811569213867, "global_step": 285450, "epoch": 3439} {"train_loss": -24.993515014648438, "global_step": 285451, "epoch": 3439} {"train_loss": -25.390844345092773, "global_step": 285452, "epoch": 3439} {"train_loss": -25.19020652770996, "global_step": 285453, "epoch": 3439} {"train_loss": -25.25392723083496, "global_step": 285454, "epoch": 3439} {"train_loss": -25.352115631103516, "global_step": 285455, "epoch": 3439} {"train_loss": -25.435632705688477, "global_step": 285456, "epoch": 3439} {"train_loss": -25.248136520385742, "global_step": 285457, "epoch": 3439} {"train_loss": -25.792577743530273, "global_step": 285458, "epoch": 3439} {"train_loss": -25.303464889526367, "global_step": 285459, "epoch": 3439} {"train_loss": -25.176177978515625, "global_step": 285460, "epoch": 3439} {"train_loss": -25.035505294799805, "global_step": 285461, "epoch": 3439} {"train_loss": -25.275318145751953, "global_step": 285462, "epoch": 3439} {"train_loss": -25.64240074157715, "global_step": 285463, "epoch": 3439} {"train_loss": -25.311447143554688, "global_step": 285464, "epoch": 3439} {"train_loss": -25.415782928466797, "global_step": 285465, "epoch": 3439} {"train_loss": -25.6973819732666, "global_step": 285466, "epoch": 3439} {"train_loss": -25.239418029785156, "global_step": 285467, "epoch": 3439} {"train_loss": -25.775726318359375, "global_step": 285468, "epoch": 3439} {"train_loss": -25.34869956970215, "global_step": 285469, "epoch": 3439} {"train_loss": -25.391904830932617, "global_step": 285470, "epoch": 3439} {"train_loss": -25.546039581298828, "global_step": 285471, "epoch": 3439} {"train_loss": -25.55305290222168, "global_step": 285472, "epoch": 3439} {"train_loss": -25.692575454711914, "global_step": 285473, "epoch": 3439} {"train_loss": -25.64252281188965, "global_step": 285474, "epoch": 3439} {"train_loss": -25.651334762573242, "global_step": 285475, "epoch": 3439} {"train_loss": -25.802204132080078, "global_step": 285476, "epoch": 3439} {"train_loss": -25.656753540039062, "global_step": 285477, "epoch": 3439} {"train_loss": -25.563175201416016, "global_step": 285478, "epoch": 3439} {"train_loss": -25.356664657592773, "global_step": 285479, "epoch": 3439} {"train_loss": -26.012365341186523, "global_step": 285480, "epoch": 3439} {"train_loss": -25.551223754882812, "global_step": 285481, "epoch": 3439} {"train_loss": -25.154163360595703, "global_step": 285482, "epoch": 3439} {"train_loss": -25.60468864440918, "global_step": 285483, "epoch": 3439} {"train_loss": -25.55000877380371, "global_step": 285484, "epoch": 3439} {"train_loss": -25.737415313720703, "global_step": 285485, "epoch": 3439} {"train_loss": -25.386938095092773, "global_step": 285486, "epoch": 3439} {"train_loss": -25.269872665405273, "global_step": 285487, "epoch": 3439} {"train_loss": -25.198333740234375, "global_step": 285488, "epoch": 3439} {"train_loss": -25.268936157226562, "global_step": 285489, "epoch": 3439} {"train_loss": -25.345338821411133, "global_step": 285490, "epoch": 3439} {"train_loss": -25.61726951599121, "global_step": 285491, "epoch": 3439} {"train_loss": -24.675952911376953, "global_step": 285492, "epoch": 3439} {"train_loss": -25.153026580810547, "global_step": 285493, "epoch": 3439} {"train_loss": -25.18531608581543, "global_step": 285494, "epoch": 3439} {"train_loss": -24.988033294677734, "global_step": 285495, "epoch": 3439} {"train_loss": -25.178152084350586, "global_step": 285496, "epoch": 3439} {"train_loss": -25.390506744384766, "global_step": 285497, "epoch": 3439} {"train_loss": -25.08522605895996, "global_step": 285498, "epoch": 3439} {"train_loss": -25.23277473449707, "global_step": 285499, "epoch": 3439} {"train_loss": -25.37253189086914, "global_step": 285500, "epoch": 3439} {"train_loss": -25.34333610534668, "global_step": 285501, "epoch": 3439} {"train_loss": -25.203176498413086, "global_step": 285502, "epoch": 3439} {"train_loss": -25.138071060180664, "global_step": 285503, "epoch": 3439} {"train_loss": -25.364151000976562, "global_step": 285504, "epoch": 3439} {"train_loss": -25.325481414794922, "global_step": 285505, "epoch": 3439} {"train_loss": -25.371437072753906, "global_step": 285506, "epoch": 3439} {"train_loss": -25.1834659576416, "global_step": 285507, "epoch": 3439} {"train_loss": -25.330717086791992, "global_step": 285508, "epoch": 3439} {"train_loss": -25.45258140563965, "global_step": 285509, "epoch": 3439} {"train_loss": -25.24885368347168, "global_step": 285510, "epoch": 3439} {"train_loss": -25.208009719848633, "global_step": 285511, "epoch": 3439} {"train_loss": -25.90484046936035, "global_step": 285512, "epoch": 3439} {"train_loss": -25.455005645751953, "global_step": 285513, "epoch": 3439} {"train_loss": -25.264402389526367, "global_step": 285514, "epoch": 3439} {"train_loss": -25.602705001831055, "global_step": 285515, "epoch": 3439} {"train_loss": -25.29237174987793, "global_step": 285516, "epoch": 3439} {"train_loss": -25.150917053222656, "global_step": 285517, "epoch": 3439} {"train_loss": -25.583311080932617, "global_step": 285518, "epoch": 3439} {"train_loss": -25.32361338512007, "global_step": 285519, "epoch": 3439, "val_loss": 7071968.0} {"train_loss": -24.824800491333008, "global_step": 285520, "epoch": 3440} {"train_loss": -25.249990463256836, "global_step": 285521, "epoch": 3440} {"train_loss": -25.009857177734375, "global_step": 285522, "epoch": 3440} {"train_loss": -25.732025146484375, "global_step": 285523, "epoch": 3440} {"train_loss": -24.77833366394043, "global_step": 285524, "epoch": 3440} {"train_loss": -24.8272647857666, "global_step": 285525, "epoch": 3440} {"train_loss": -25.093158721923828, "global_step": 285526, "epoch": 3440} {"train_loss": -24.642440795898438, "global_step": 285527, "epoch": 3440} {"train_loss": -25.393619537353516, "global_step": 285528, "epoch": 3440} {"train_loss": -24.81000328063965, "global_step": 285529, "epoch": 3440} {"train_loss": -25.472274780273438, "global_step": 285530, "epoch": 3440} {"train_loss": -25.04589080810547, "global_step": 285531, "epoch": 3440} {"train_loss": -25.508947372436523, "global_step": 285532, "epoch": 3440} {"train_loss": -25.147512435913086, "global_step": 285533, "epoch": 3440} {"train_loss": -24.852216720581055, "global_step": 285534, "epoch": 3440} {"train_loss": -25.187103271484375, "global_step": 285535, "epoch": 3440} {"train_loss": -25.180212020874023, "global_step": 285536, "epoch": 3440} {"train_loss": -25.327533721923828, "global_step": 285537, "epoch": 3440} {"train_loss": -25.32645034790039, "global_step": 285538, "epoch": 3440} {"train_loss": -25.185134887695312, "global_step": 285539, "epoch": 3440} {"train_loss": -25.352298736572266, "global_step": 285540, "epoch": 3440} {"train_loss": -25.444549560546875, "global_step": 285541, "epoch": 3440} {"train_loss": -25.34756088256836, "global_step": 285542, "epoch": 3440} {"train_loss": -25.33067512512207, "global_step": 285543, "epoch": 3440} {"train_loss": -25.38670539855957, "global_step": 285544, "epoch": 3440} {"train_loss": -25.47452735900879, "global_step": 285545, "epoch": 3440} {"train_loss": -25.66790771484375, "global_step": 285546, "epoch": 3440} {"train_loss": -25.542747497558594, "global_step": 285547, "epoch": 3440} {"train_loss": -25.419958114624023, "global_step": 285548, "epoch": 3440} {"train_loss": -25.514474868774414, "global_step": 285549, "epoch": 3440} {"train_loss": -25.54616355895996, "global_step": 285550, "epoch": 3440} {"train_loss": -25.58061981201172, "global_step": 285551, "epoch": 3440} {"train_loss": -25.27784538269043, "global_step": 285552, "epoch": 3440} {"train_loss": -25.707061767578125, "global_step": 285553, "epoch": 3440} {"train_loss": -25.401830673217773, "global_step": 285554, "epoch": 3440} {"train_loss": -25.491239547729492, "global_step": 285555, "epoch": 3440} {"train_loss": -25.57574462890625, "global_step": 285556, "epoch": 3440} {"train_loss": -25.790369033813477, "global_step": 285557, "epoch": 3440} {"train_loss": -25.484970092773438, "global_step": 285558, "epoch": 3440} {"train_loss": -25.740161895751953, "global_step": 285559, "epoch": 3440} {"train_loss": -25.46586036682129, "global_step": 285560, "epoch": 3440} {"train_loss": -25.22931480407715, "global_step": 285561, "epoch": 3440} {"train_loss": -25.53450584411621, "global_step": 285562, "epoch": 3440} {"train_loss": -25.41224479675293, "global_step": 285563, "epoch": 3440} {"train_loss": -25.492048263549805, "global_step": 285564, "epoch": 3440} {"train_loss": -25.598257064819336, "global_step": 285565, "epoch": 3440} {"train_loss": -25.687952041625977, "global_step": 285566, "epoch": 3440} {"train_loss": -25.29448890686035, "global_step": 285567, "epoch": 3440} {"train_loss": -25.20178985595703, "global_step": 285568, "epoch": 3440} {"train_loss": -25.31199073791504, "global_step": 285569, "epoch": 3440} {"train_loss": -25.87131690979004, "global_step": 285570, "epoch": 3440} {"train_loss": -25.55286979675293, "global_step": 285571, "epoch": 3440} {"train_loss": -25.42937660217285, "global_step": 285572, "epoch": 3440} {"train_loss": -25.585948944091797, "global_step": 285573, "epoch": 3440} {"train_loss": -25.322101593017578, "global_step": 285574, "epoch": 3440} {"train_loss": -25.494131088256836, "global_step": 285575, "epoch": 3440} {"train_loss": -25.580623626708984, "global_step": 285576, "epoch": 3440} {"train_loss": -25.792890548706055, "global_step": 285577, "epoch": 3440} {"train_loss": -25.394681930541992, "global_step": 285578, "epoch": 3440} {"train_loss": -25.79510498046875, "global_step": 285579, "epoch": 3440} {"train_loss": -25.697376251220703, "global_step": 285580, "epoch": 3440} {"train_loss": -26.01833152770996, "global_step": 285581, "epoch": 3440} {"train_loss": -25.567951202392578, "global_step": 285582, "epoch": 3440} {"train_loss": -25.49138832092285, "global_step": 285583, "epoch": 3440} {"train_loss": -25.577354431152344, "global_step": 285584, "epoch": 3440} {"train_loss": -25.404775619506836, "global_step": 285585, "epoch": 3440} {"train_loss": -25.705398559570312, "global_step": 285586, "epoch": 3440} {"train_loss": -25.67598533630371, "global_step": 285587, "epoch": 3440} {"train_loss": -25.448579788208008, "global_step": 285588, "epoch": 3440} {"train_loss": -25.39729118347168, "global_step": 285589, "epoch": 3440} {"train_loss": -25.36542320251465, "global_step": 285590, "epoch": 3440} {"train_loss": -25.736713409423828, "global_step": 285591, "epoch": 3440} {"train_loss": -25.84897232055664, "global_step": 285592, "epoch": 3440} {"train_loss": -25.50606346130371, "global_step": 285593, "epoch": 3440} {"train_loss": -25.210630416870117, "global_step": 285594, "epoch": 3440} {"train_loss": -25.35051918029785, "global_step": 285595, "epoch": 3440} {"train_loss": -25.40737533569336, "global_step": 285596, "epoch": 3440} {"train_loss": -25.417470932006836, "global_step": 285597, "epoch": 3440} {"train_loss": -25.40431022644043, "global_step": 285598, "epoch": 3440} {"train_loss": -25.590314865112305, "global_step": 285599, "epoch": 3440} {"train_loss": -25.608469009399414, "global_step": 285600, "epoch": 3440} {"train_loss": -25.589475631713867, "global_step": 285601, "epoch": 3440} {"train_loss": -25.402208879769567, "global_step": 285602, "epoch": 3440, "val_loss": 7052491.0} {"train_loss": -25.25629997253418, "global_step": 285603, "epoch": 3441} {"train_loss": -24.82279396057129, "global_step": 285604, "epoch": 3441} {"train_loss": -24.342227935791016, "global_step": 285605, "epoch": 3441} {"train_loss": -23.774127960205078, "global_step": 285606, "epoch": 3441} {"train_loss": -24.954364776611328, "global_step": 285607, "epoch": 3441} {"train_loss": -25.257465362548828, "global_step": 285608, "epoch": 3441} {"train_loss": -24.53609275817871, "global_step": 285609, "epoch": 3441} {"train_loss": -25.05671501159668, "global_step": 285610, "epoch": 3441} {"train_loss": -24.832666397094727, "global_step": 285611, "epoch": 3441} {"train_loss": -24.87006187438965, "global_step": 285612, "epoch": 3441} {"train_loss": -25.328296661376953, "global_step": 285613, "epoch": 3441} {"train_loss": -25.094350814819336, "global_step": 285614, "epoch": 3441} {"train_loss": -25.544443130493164, "global_step": 285615, "epoch": 3441} {"train_loss": -25.36801528930664, "global_step": 285616, "epoch": 3441} {"train_loss": -25.484149932861328, "global_step": 285617, "epoch": 3441} {"train_loss": -25.388277053833008, "global_step": 285618, "epoch": 3441} {"train_loss": -25.545833587646484, "global_step": 285619, "epoch": 3441} {"train_loss": -25.2585506439209, "global_step": 285620, "epoch": 3441} {"train_loss": -25.30719566345215, "global_step": 285621, "epoch": 3441} {"train_loss": -25.23849105834961, "global_step": 285622, "epoch": 3441} {"train_loss": -24.976783752441406, "global_step": 285623, "epoch": 3441} {"train_loss": -25.471464157104492, "global_step": 285624, "epoch": 3441} {"train_loss": -25.62904167175293, "global_step": 285625, "epoch": 3441} {"train_loss": -25.696813583374023, "global_step": 285626, "epoch": 3441} {"train_loss": -25.659210205078125, "global_step": 285627, "epoch": 3441} {"train_loss": -25.401498794555664, "global_step": 285628, "epoch": 3441} {"train_loss": -25.541168212890625, "global_step": 285629, "epoch": 3441} {"train_loss": -25.295692443847656, "global_step": 285630, "epoch": 3441} {"train_loss": -25.373783111572266, "global_step": 285631, "epoch": 3441} {"train_loss": -25.44074821472168, "global_step": 285632, "epoch": 3441} {"train_loss": -25.14501953125, "global_step": 285633, "epoch": 3441} {"train_loss": -25.17180824279785, "global_step": 285634, "epoch": 3441} {"train_loss": -25.249393463134766, "global_step": 285635, "epoch": 3441} {"train_loss": -25.498760223388672, "global_step": 285636, "epoch": 3441} {"train_loss": -25.227249145507812, "global_step": 285637, "epoch": 3441} {"train_loss": -25.51256561279297, "global_step": 285638, "epoch": 3441} {"train_loss": -25.517314910888672, "global_step": 285639, "epoch": 3441} {"train_loss": -25.382976531982422, "global_step": 285640, "epoch": 3441} {"train_loss": -25.285444259643555, "global_step": 285641, "epoch": 3441} {"train_loss": -25.857954025268555, "global_step": 285642, "epoch": 3441} {"train_loss": -25.46138572692871, "global_step": 285643, "epoch": 3441} {"train_loss": -25.513723373413086, "global_step": 285644, "epoch": 3441} {"train_loss": -25.371366500854492, "global_step": 285645, "epoch": 3441} {"train_loss": -25.591079711914062, "global_step": 285646, "epoch": 3441} {"train_loss": -25.58693504333496, "global_step": 285647, "epoch": 3441} {"train_loss": -25.387609481811523, "global_step": 285648, "epoch": 3441} {"train_loss": -25.751379013061523, "global_step": 285649, "epoch": 3441} {"train_loss": -25.529848098754883, "global_step": 285650, "epoch": 3441} {"train_loss": -25.704242706298828, "global_step": 285651, "epoch": 3441} {"train_loss": -25.821455001831055, "global_step": 285652, "epoch": 3441} {"train_loss": -26.04066276550293, "global_step": 285653, "epoch": 3441} {"train_loss": -25.40279769897461, "global_step": 285654, "epoch": 3441} {"train_loss": -25.08163833618164, "global_step": 285655, "epoch": 3441} {"train_loss": -24.874958038330078, "global_step": 285656, "epoch": 3441} {"train_loss": -24.892841339111328, "global_step": 285657, "epoch": 3441} {"train_loss": -25.008045196533203, "global_step": 285658, "epoch": 3441} {"train_loss": -25.461652755737305, "global_step": 285659, "epoch": 3441} {"train_loss": -25.274749755859375, "global_step": 285660, "epoch": 3441} {"train_loss": -25.317626953125, "global_step": 285661, "epoch": 3441} {"train_loss": -25.1127986907959, "global_step": 285662, "epoch": 3441} {"train_loss": -25.38911247253418, "global_step": 285663, "epoch": 3441} {"train_loss": -25.12038230895996, "global_step": 285664, "epoch": 3441} {"train_loss": -25.070343017578125, "global_step": 285665, "epoch": 3441} {"train_loss": -25.44089698791504, "global_step": 285666, "epoch": 3441} {"train_loss": -24.632734298706055, "global_step": 285667, "epoch": 3441} {"train_loss": -25.178680419921875, "global_step": 285668, "epoch": 3441} {"train_loss": -25.575550079345703, "global_step": 285669, "epoch": 3441} {"train_loss": -25.474950790405273, "global_step": 285670, "epoch": 3441} {"train_loss": -25.111324310302734, "global_step": 285671, "epoch": 3441} {"train_loss": -25.152690887451172, "global_step": 285672, "epoch": 3441} {"train_loss": -25.451990127563477, "global_step": 285673, "epoch": 3441} {"train_loss": -25.276329040527344, "global_step": 285674, "epoch": 3441} {"train_loss": -25.538103103637695, "global_step": 285675, "epoch": 3441} {"train_loss": -25.197980880737305, "global_step": 285676, "epoch": 3441} {"train_loss": -25.4705867767334, "global_step": 285677, "epoch": 3441} {"train_loss": -25.356721878051758, "global_step": 285678, "epoch": 3441} {"train_loss": -25.39043426513672, "global_step": 285679, "epoch": 3441} {"train_loss": -25.324195861816406, "global_step": 285680, "epoch": 3441} {"train_loss": -25.238513946533203, "global_step": 285681, "epoch": 3441} {"train_loss": -25.44696044921875, "global_step": 285682, "epoch": 3441} {"train_loss": -25.714126586914062, "global_step": 285683, "epoch": 3441} {"train_loss": -25.502805709838867, "global_step": 285684, "epoch": 3441} {"train_loss": -25.302850286644624, "global_step": 285685, "epoch": 3441, "val_loss": 7084154.5} {"train_loss": -25.188146591186523, "global_step": 285686, "epoch": 3442} {"train_loss": -25.02197265625, "global_step": 285687, "epoch": 3442} {"train_loss": -25.331939697265625, "global_step": 285688, "epoch": 3442} {"train_loss": -25.214597702026367, "global_step": 285689, "epoch": 3442} {"train_loss": -25.27699089050293, "global_step": 285690, "epoch": 3442} {"train_loss": -25.47460174560547, "global_step": 285691, "epoch": 3442} {"train_loss": -24.59235191345215, "global_step": 285692, "epoch": 3442} {"train_loss": -25.0788516998291, "global_step": 285693, "epoch": 3442} {"train_loss": -24.987964630126953, "global_step": 285694, "epoch": 3442} {"train_loss": -25.052785873413086, "global_step": 285695, "epoch": 3442} {"train_loss": -25.545169830322266, "global_step": 285696, "epoch": 3442} {"train_loss": -25.418664932250977, "global_step": 285697, "epoch": 3442} {"train_loss": -25.56117057800293, "global_step": 285698, "epoch": 3442} {"train_loss": -25.359344482421875, "global_step": 285699, "epoch": 3442} {"train_loss": -25.352888107299805, "global_step": 285700, "epoch": 3442} {"train_loss": -24.968042373657227, "global_step": 285701, "epoch": 3442} {"train_loss": -25.242740631103516, "global_step": 285702, "epoch": 3442} {"train_loss": -25.41809844970703, "global_step": 285703, "epoch": 3442} {"train_loss": -24.79167366027832, "global_step": 285704, "epoch": 3442} {"train_loss": -25.586023330688477, "global_step": 285705, "epoch": 3442} {"train_loss": -25.296146392822266, "global_step": 285706, "epoch": 3442} {"train_loss": -25.000150680541992, "global_step": 285707, "epoch": 3442} {"train_loss": -25.000551223754883, "global_step": 285708, "epoch": 3442} {"train_loss": -25.0849666595459, "global_step": 285709, "epoch": 3442} {"train_loss": -25.395193099975586, "global_step": 285710, "epoch": 3442} {"train_loss": -25.478391647338867, "global_step": 285711, "epoch": 3442} {"train_loss": -25.288101196289062, "global_step": 285712, "epoch": 3442} {"train_loss": -25.811614990234375, "global_step": 285713, "epoch": 3442} {"train_loss": -25.766284942626953, "global_step": 285714, "epoch": 3442} {"train_loss": -25.411603927612305, "global_step": 285715, "epoch": 3442} {"train_loss": -25.118131637573242, "global_step": 285716, "epoch": 3442} {"train_loss": -25.038496017456055, "global_step": 285717, "epoch": 3442} {"train_loss": -25.607791900634766, "global_step": 285718, "epoch": 3442} {"train_loss": -25.40038299560547, "global_step": 285719, "epoch": 3442} {"train_loss": -25.30735969543457, "global_step": 285720, "epoch": 3442} {"train_loss": -25.48798942565918, "global_step": 285721, "epoch": 3442} {"train_loss": -25.857481002807617, "global_step": 285722, "epoch": 3442} {"train_loss": -25.088470458984375, "global_step": 285723, "epoch": 3442} {"train_loss": -25.451780319213867, "global_step": 285724, "epoch": 3442} {"train_loss": -25.653799057006836, "global_step": 285725, "epoch": 3442} {"train_loss": -25.84280776977539, "global_step": 285726, "epoch": 3442} {"train_loss": -25.559938430786133, "global_step": 285727, "epoch": 3442} {"train_loss": -25.494115829467773, "global_step": 285728, "epoch": 3442} {"train_loss": -25.277755737304688, "global_step": 285729, "epoch": 3442} {"train_loss": -25.6038761138916, "global_step": 285730, "epoch": 3442} {"train_loss": -25.78274917602539, "global_step": 285731, "epoch": 3442} {"train_loss": -25.67958641052246, "global_step": 285732, "epoch": 3442} {"train_loss": -25.985803604125977, "global_step": 285733, "epoch": 3442} {"train_loss": -25.043378829956055, "global_step": 285734, "epoch": 3442} {"train_loss": -25.88236427307129, "global_step": 285735, "epoch": 3442} {"train_loss": -25.751422882080078, "global_step": 285736, "epoch": 3442} {"train_loss": -25.343725204467773, "global_step": 285737, "epoch": 3442} {"train_loss": -25.392337799072266, "global_step": 285738, "epoch": 3442} {"train_loss": -25.209497451782227, "global_step": 285739, "epoch": 3442} {"train_loss": -25.23923110961914, "global_step": 285740, "epoch": 3442} {"train_loss": -25.55219078063965, "global_step": 285741, "epoch": 3442} {"train_loss": -25.514846801757812, "global_step": 285742, "epoch": 3442} {"train_loss": -25.32686424255371, "global_step": 285743, "epoch": 3442} {"train_loss": -25.3675537109375, "global_step": 285744, "epoch": 3442} {"train_loss": -25.492216110229492, "global_step": 285745, "epoch": 3442} {"train_loss": -25.291973114013672, "global_step": 285746, "epoch": 3442} {"train_loss": -25.67998695373535, "global_step": 285747, "epoch": 3442} {"train_loss": -25.548826217651367, "global_step": 285748, "epoch": 3442} {"train_loss": -25.69113540649414, "global_step": 285749, "epoch": 3442} {"train_loss": -25.643768310546875, "global_step": 285750, "epoch": 3442} {"train_loss": -25.164716720581055, "global_step": 285751, "epoch": 3442} {"train_loss": -25.553016662597656, "global_step": 285752, "epoch": 3442} {"train_loss": -25.626300811767578, "global_step": 285753, "epoch": 3442} {"train_loss": -25.236631393432617, "global_step": 285754, "epoch": 3442} {"train_loss": -25.57788848876953, "global_step": 285755, "epoch": 3442} {"train_loss": -25.60047721862793, "global_step": 285756, "epoch": 3442} {"train_loss": -25.357669830322266, "global_step": 285757, "epoch": 3442} {"train_loss": -25.402002334594727, "global_step": 285758, "epoch": 3442} {"train_loss": -25.445741653442383, "global_step": 285759, "epoch": 3442} {"train_loss": -25.063026428222656, "global_step": 285760, "epoch": 3442} {"train_loss": -25.43226432800293, "global_step": 285761, "epoch": 3442} {"train_loss": -25.81245994567871, "global_step": 285762, "epoch": 3442} {"train_loss": -25.47043228149414, "global_step": 285763, "epoch": 3442} {"train_loss": -25.438596725463867, "global_step": 285764, "epoch": 3442} {"train_loss": -25.123348236083984, "global_step": 285765, "epoch": 3442} {"train_loss": -24.946792602539062, "global_step": 285766, "epoch": 3442} {"train_loss": -25.278125762939453, "global_step": 285767, "epoch": 3442} {"train_loss": -25.38302299775273, "global_step": 285768, "epoch": 3442, "val_loss": 7173720.0} {"train_loss": -22.88435935974121, "global_step": 285769, "epoch": 3443} {"train_loss": -23.4121036529541, "global_step": 285770, "epoch": 3443} {"train_loss": -24.850421905517578, "global_step": 285771, "epoch": 3443} {"train_loss": -23.74812889099121, "global_step": 285772, "epoch": 3443} {"train_loss": -24.65009880065918, "global_step": 285773, "epoch": 3443} {"train_loss": -24.565515518188477, "global_step": 285774, "epoch": 3443} {"train_loss": -24.54511070251465, "global_step": 285775, "epoch": 3443} {"train_loss": -25.04277229309082, "global_step": 285776, "epoch": 3443} {"train_loss": -24.329299926757812, "global_step": 285777, "epoch": 3443} {"train_loss": -24.935871124267578, "global_step": 285778, "epoch": 3443} {"train_loss": -24.690383911132812, "global_step": 285779, "epoch": 3443} {"train_loss": -24.650455474853516, "global_step": 285780, "epoch": 3443} {"train_loss": -24.728548049926758, "global_step": 285781, "epoch": 3443} {"train_loss": -24.89685821533203, "global_step": 285782, "epoch": 3443} {"train_loss": -24.86318588256836, "global_step": 285783, "epoch": 3443} {"train_loss": -24.62165641784668, "global_step": 285784, "epoch": 3443} {"train_loss": -25.307819366455078, "global_step": 285785, "epoch": 3443} {"train_loss": -24.9033203125, "global_step": 285786, "epoch": 3443} {"train_loss": -25.030698776245117, "global_step": 285787, "epoch": 3443} {"train_loss": -25.192045211791992, "global_step": 285788, "epoch": 3443} {"train_loss": -25.01650047302246, "global_step": 285789, "epoch": 3443} {"train_loss": -25.08616065979004, "global_step": 285790, "epoch": 3443} {"train_loss": -25.13042640686035, "global_step": 285791, "epoch": 3443} {"train_loss": -24.99000358581543, "global_step": 285792, "epoch": 3443} {"train_loss": -25.6105899810791, "global_step": 285793, "epoch": 3443} {"train_loss": -25.46497344970703, "global_step": 285794, "epoch": 3443} {"train_loss": -25.3635196685791, "global_step": 285795, "epoch": 3443} {"train_loss": -25.10390281677246, "global_step": 285796, "epoch": 3443} {"train_loss": -25.509775161743164, "global_step": 285797, "epoch": 3443} {"train_loss": -25.573516845703125, "global_step": 285798, "epoch": 3443} {"train_loss": -25.264127731323242, "global_step": 285799, "epoch": 3443} {"train_loss": -25.132205963134766, "global_step": 285800, "epoch": 3443} {"train_loss": -25.60260581970215, "global_step": 285801, "epoch": 3443} {"train_loss": -25.183279037475586, "global_step": 285802, "epoch": 3443} {"train_loss": -25.42630386352539, "global_step": 285803, "epoch": 3443} {"train_loss": -25.365631103515625, "global_step": 285804, "epoch": 3443} {"train_loss": -25.280271530151367, "global_step": 285805, "epoch": 3443} {"train_loss": -25.117050170898438, "global_step": 285806, "epoch": 3443} {"train_loss": -25.613372802734375, "global_step": 285807, "epoch": 3443} {"train_loss": -25.559186935424805, "global_step": 285808, "epoch": 3443} {"train_loss": -25.575233459472656, "global_step": 285809, "epoch": 3443} {"train_loss": -25.58347511291504, "global_step": 285810, "epoch": 3443} {"train_loss": -25.148223876953125, "global_step": 285811, "epoch": 3443} {"train_loss": -25.523300170898438, "global_step": 285812, "epoch": 3443} {"train_loss": -25.62616539001465, "global_step": 285813, "epoch": 3443} {"train_loss": -25.462812423706055, "global_step": 285814, "epoch": 3443} {"train_loss": -25.5968017578125, "global_step": 285815, "epoch": 3443} {"train_loss": -25.589086532592773, "global_step": 285816, "epoch": 3443} {"train_loss": -25.62786865234375, "global_step": 285817, "epoch": 3443} {"train_loss": -25.483579635620117, "global_step": 285818, "epoch": 3443} {"train_loss": -25.595458984375, "global_step": 285819, "epoch": 3443} {"train_loss": -25.677515029907227, "global_step": 285820, "epoch": 3443} {"train_loss": -25.595983505249023, "global_step": 285821, "epoch": 3443} {"train_loss": -25.587255477905273, "global_step": 285822, "epoch": 3443} {"train_loss": -25.883438110351562, "global_step": 285823, "epoch": 3443} {"train_loss": -25.428119659423828, "global_step": 285824, "epoch": 3443} {"train_loss": -25.870227813720703, "global_step": 285825, "epoch": 3443} {"train_loss": -25.619110107421875, "global_step": 285826, "epoch": 3443} {"train_loss": -25.15814781188965, "global_step": 285827, "epoch": 3443} {"train_loss": -24.904211044311523, "global_step": 285828, "epoch": 3443} {"train_loss": -24.76095962524414, "global_step": 285829, "epoch": 3443} {"train_loss": -25.70940589904785, "global_step": 285830, "epoch": 3443} {"train_loss": -25.03242301940918, "global_step": 285831, "epoch": 3443} {"train_loss": -24.929340362548828, "global_step": 285832, "epoch": 3443} {"train_loss": -24.91273307800293, "global_step": 285833, "epoch": 3443} {"train_loss": -25.466115951538086, "global_step": 285834, "epoch": 3443} {"train_loss": -25.380523681640625, "global_step": 285835, "epoch": 3443} {"train_loss": -25.567005157470703, "global_step": 285836, "epoch": 3443} {"train_loss": -25.378555297851562, "global_step": 285837, "epoch": 3443} {"train_loss": -25.550636291503906, "global_step": 285838, "epoch": 3443} {"train_loss": -25.618118286132812, "global_step": 285839, "epoch": 3443} {"train_loss": -25.10587501525879, "global_step": 285840, "epoch": 3443} {"train_loss": -25.46084976196289, "global_step": 285841, "epoch": 3443} {"train_loss": -25.093618392944336, "global_step": 285842, "epoch": 3443} {"train_loss": -25.467973709106445, "global_step": 285843, "epoch": 3443} {"train_loss": -25.240009307861328, "global_step": 285844, "epoch": 3443} {"train_loss": -25.278532028198242, "global_step": 285845, "epoch": 3443} {"train_loss": -25.524810791015625, "global_step": 285846, "epoch": 3443} {"train_loss": -25.18438148498535, "global_step": 285847, "epoch": 3443} {"train_loss": -25.418954849243164, "global_step": 285848, "epoch": 3443} {"train_loss": -25.081594467163086, "global_step": 285849, "epoch": 3443} {"train_loss": -25.426237106323242, "global_step": 285850, "epoch": 3443} {"train_loss": -25.191453152392285, "global_step": 285851, "epoch": 3443, "val_loss": 7201587.0} {"train_loss": -24.743207931518555, "global_step": 285852, "epoch": 3444} {"train_loss": -25.459802627563477, "global_step": 285853, "epoch": 3444} {"train_loss": -24.927587509155273, "global_step": 285854, "epoch": 3444} {"train_loss": -24.845483779907227, "global_step": 285855, "epoch": 3444} {"train_loss": -24.59394073486328, "global_step": 285856, "epoch": 3444} {"train_loss": -25.366531372070312, "global_step": 285857, "epoch": 3444} {"train_loss": -25.165205001831055, "global_step": 285858, "epoch": 3444} {"train_loss": -25.139551162719727, "global_step": 285859, "epoch": 3444} {"train_loss": -25.42450523376465, "global_step": 285860, "epoch": 3444} {"train_loss": -25.076799392700195, "global_step": 285861, "epoch": 3444} {"train_loss": -25.420866012573242, "global_step": 285862, "epoch": 3444} {"train_loss": -25.13857650756836, "global_step": 285863, "epoch": 3444} {"train_loss": -25.018306732177734, "global_step": 285864, "epoch": 3444} {"train_loss": -25.681589126586914, "global_step": 285865, "epoch": 3444} {"train_loss": -25.262407302856445, "global_step": 285866, "epoch": 3444} {"train_loss": -25.076047897338867, "global_step": 285867, "epoch": 3444} {"train_loss": -25.2901554107666, "global_step": 285868, "epoch": 3444} {"train_loss": -25.386356353759766, "global_step": 285869, "epoch": 3444} {"train_loss": -25.3396053314209, "global_step": 285870, "epoch": 3444} {"train_loss": -25.783720016479492, "global_step": 285871, "epoch": 3444} {"train_loss": -25.37818145751953, "global_step": 285872, "epoch": 3444} {"train_loss": -25.60597038269043, "global_step": 285873, "epoch": 3444} {"train_loss": -25.475582122802734, "global_step": 285874, "epoch": 3444} {"train_loss": -25.342914581298828, "global_step": 285875, "epoch": 3444} {"train_loss": -25.65408706665039, "global_step": 285876, "epoch": 3444} {"train_loss": -25.849700927734375, "global_step": 285877, "epoch": 3444} {"train_loss": -25.765844345092773, "global_step": 285878, "epoch": 3444} {"train_loss": -25.9239559173584, "global_step": 285879, "epoch": 3444} {"train_loss": -25.649219512939453, "global_step": 285880, "epoch": 3444} {"train_loss": -25.838693618774414, "global_step": 285881, "epoch": 3444} {"train_loss": -25.498708724975586, "global_step": 285882, "epoch": 3444} {"train_loss": -25.45699119567871, "global_step": 285883, "epoch": 3444} {"train_loss": -25.278858184814453, "global_step": 285884, "epoch": 3444} {"train_loss": -25.603689193725586, "global_step": 285885, "epoch": 3444} {"train_loss": -25.569326400756836, "global_step": 285886, "epoch": 3444} {"train_loss": -25.574106216430664, "global_step": 285887, "epoch": 3444} {"train_loss": -24.92901039123535, "global_step": 285888, "epoch": 3444} {"train_loss": -25.539487838745117, "global_step": 285889, "epoch": 3444} {"train_loss": -25.26677703857422, "global_step": 285890, "epoch": 3444} {"train_loss": -25.676584243774414, "global_step": 285891, "epoch": 3444} {"train_loss": -25.329910278320312, "global_step": 285892, "epoch": 3444} {"train_loss": -25.373443603515625, "global_step": 285893, "epoch": 3444} {"train_loss": -25.651111602783203, "global_step": 285894, "epoch": 3444} {"train_loss": -25.48012351989746, "global_step": 285895, "epoch": 3444} {"train_loss": -25.67695426940918, "global_step": 285896, "epoch": 3444} {"train_loss": -25.207706451416016, "global_step": 285897, "epoch": 3444} {"train_loss": -25.42500877380371, "global_step": 285898, "epoch": 3444} {"train_loss": -25.274991989135742, "global_step": 285899, "epoch": 3444} {"train_loss": -25.384004592895508, "global_step": 285900, "epoch": 3444} {"train_loss": -25.21221351623535, "global_step": 285901, "epoch": 3444} {"train_loss": -25.368783950805664, "global_step": 285902, "epoch": 3444} {"train_loss": -25.414546966552734, "global_step": 285903, "epoch": 3444} {"train_loss": -25.319232940673828, "global_step": 285904, "epoch": 3444} {"train_loss": -25.6921443939209, "global_step": 285905, "epoch": 3444} {"train_loss": -25.677331924438477, "global_step": 285906, "epoch": 3444} {"train_loss": -25.767303466796875, "global_step": 285907, "epoch": 3444} {"train_loss": -25.285417556762695, "global_step": 285908, "epoch": 3444} {"train_loss": -25.71461296081543, "global_step": 285909, "epoch": 3444} {"train_loss": -25.4051570892334, "global_step": 285910, "epoch": 3444} {"train_loss": -25.512174606323242, "global_step": 285911, "epoch": 3444} {"train_loss": -25.860681533813477, "global_step": 285912, "epoch": 3444} {"train_loss": -25.59761619567871, "global_step": 285913, "epoch": 3444} {"train_loss": -25.517942428588867, "global_step": 285914, "epoch": 3444} {"train_loss": -25.763935089111328, "global_step": 285915, "epoch": 3444} {"train_loss": -25.5054931640625, "global_step": 285916, "epoch": 3444} {"train_loss": -25.514890670776367, "global_step": 285917, "epoch": 3444} {"train_loss": -25.68471336364746, "global_step": 285918, "epoch": 3444} {"train_loss": -25.25714111328125, "global_step": 285919, "epoch": 3444} {"train_loss": -25.705923080444336, "global_step": 285920, "epoch": 3444} {"train_loss": -25.91327476501465, "global_step": 285921, "epoch": 3444} {"train_loss": -25.915334701538086, "global_step": 285922, "epoch": 3444} {"train_loss": -25.667890548706055, "global_step": 285923, "epoch": 3444} {"train_loss": -25.672107696533203, "global_step": 285924, "epoch": 3444} {"train_loss": -25.45094108581543, "global_step": 285925, "epoch": 3444} {"train_loss": -25.365299224853516, "global_step": 285926, "epoch": 3444} {"train_loss": -25.391613006591797, "global_step": 285927, "epoch": 3444} {"train_loss": -25.636112213134766, "global_step": 285928, "epoch": 3444} {"train_loss": -26.11246109008789, "global_step": 285929, "epoch": 3444} {"train_loss": -25.318632125854492, "global_step": 285930, "epoch": 3444} {"train_loss": -25.5311336517334, "global_step": 285931, "epoch": 3444} {"train_loss": -25.563732147216797, "global_step": 285932, "epoch": 3444} {"train_loss": -25.330774307250977, "global_step": 285933, "epoch": 3444} {"train_loss": -25.457489289433124, "global_step": 285934, "epoch": 3444, "val_loss": 7068423.0} {"train_loss": -25.036285400390625, "global_step": 285935, "epoch": 3445} {"train_loss": -24.482032775878906, "global_step": 285936, "epoch": 3445} {"train_loss": -24.39399528503418, "global_step": 285937, "epoch": 3445} {"train_loss": -24.742084503173828, "global_step": 285938, "epoch": 3445} {"train_loss": -24.768110275268555, "global_step": 285939, "epoch": 3445} {"train_loss": -24.464794158935547, "global_step": 285940, "epoch": 3445} {"train_loss": -25.17655372619629, "global_step": 285941, "epoch": 3445} {"train_loss": -25.081533432006836, "global_step": 285942, "epoch": 3445} {"train_loss": -25.13431167602539, "global_step": 285943, "epoch": 3445} {"train_loss": -24.668869018554688, "global_step": 285944, "epoch": 3445} {"train_loss": -25.470447540283203, "global_step": 285945, "epoch": 3445} {"train_loss": -24.974912643432617, "global_step": 285946, "epoch": 3445} {"train_loss": -25.209903717041016, "global_step": 285947, "epoch": 3445} {"train_loss": -25.24440574645996, "global_step": 285948, "epoch": 3445} {"train_loss": -25.33369255065918, "global_step": 285949, "epoch": 3445} {"train_loss": -25.34491539001465, "global_step": 285950, "epoch": 3445} {"train_loss": -25.113004684448242, "global_step": 285951, "epoch": 3445} {"train_loss": -25.062097549438477, "global_step": 285952, "epoch": 3445} {"train_loss": -24.97133445739746, "global_step": 285953, "epoch": 3445} {"train_loss": -25.27989387512207, "global_step": 285954, "epoch": 3445} {"train_loss": -25.341135025024414, "global_step": 285955, "epoch": 3445} {"train_loss": -25.36897087097168, "global_step": 285956, "epoch": 3445} {"train_loss": -25.30064582824707, "global_step": 285957, "epoch": 3445} {"train_loss": -25.272430419921875, "global_step": 285958, "epoch": 3445} {"train_loss": -25.369871139526367, "global_step": 285959, "epoch": 3445} {"train_loss": -25.361051559448242, "global_step": 285960, "epoch": 3445} {"train_loss": -25.353530883789062, "global_step": 285961, "epoch": 3445} {"train_loss": -25.474905014038086, "global_step": 285962, "epoch": 3445} {"train_loss": -25.333349227905273, "global_step": 285963, "epoch": 3445} {"train_loss": -25.763595581054688, "global_step": 285964, "epoch": 3445} {"train_loss": -25.603139877319336, "global_step": 285965, "epoch": 3445} {"train_loss": -25.417390823364258, "global_step": 285966, "epoch": 3445} {"train_loss": -25.608381271362305, "global_step": 285967, "epoch": 3445} {"train_loss": -25.411348342895508, "global_step": 285968, "epoch": 3445} {"train_loss": -25.57390785217285, "global_step": 285969, "epoch": 3445} {"train_loss": -25.7884578704834, "global_step": 285970, "epoch": 3445} {"train_loss": -25.730871200561523, "global_step": 285971, "epoch": 3445} {"train_loss": -25.47256088256836, "global_step": 285972, "epoch": 3445} {"train_loss": -25.329158782958984, "global_step": 285973, "epoch": 3445} {"train_loss": -25.637561798095703, "global_step": 285974, "epoch": 3445} {"train_loss": -25.6982421875, "global_step": 285975, "epoch": 3445} {"train_loss": -25.44811248779297, "global_step": 285976, "epoch": 3445} {"train_loss": -25.589792251586914, "global_step": 285977, "epoch": 3445} {"train_loss": -25.666406631469727, "global_step": 285978, "epoch": 3445} {"train_loss": -25.792118072509766, "global_step": 285979, "epoch": 3445} {"train_loss": -25.99098014831543, "global_step": 285980, "epoch": 3445} {"train_loss": -25.674097061157227, "global_step": 285981, "epoch": 3445} {"train_loss": -25.537277221679688, "global_step": 285982, "epoch": 3445} {"train_loss": -25.77072525024414, "global_step": 285983, "epoch": 3445} {"train_loss": -25.478368759155273, "global_step": 285984, "epoch": 3445} {"train_loss": -25.777196884155273, "global_step": 285985, "epoch": 3445} {"train_loss": -25.303640365600586, "global_step": 285986, "epoch": 3445} {"train_loss": -25.6772518157959, "global_step": 285987, "epoch": 3445} {"train_loss": -25.75186538696289, "global_step": 285988, "epoch": 3445} {"train_loss": -25.61195182800293, "global_step": 285989, "epoch": 3445} {"train_loss": -25.268590927124023, "global_step": 285990, "epoch": 3445} {"train_loss": -25.13003158569336, "global_step": 285991, "epoch": 3445} {"train_loss": -25.42122459411621, "global_step": 285992, "epoch": 3445} {"train_loss": -25.527822494506836, "global_step": 285993, "epoch": 3445} {"train_loss": -25.923070907592773, "global_step": 285994, "epoch": 3445} {"train_loss": -25.297285079956055, "global_step": 285995, "epoch": 3445} {"train_loss": -25.53020668029785, "global_step": 285996, "epoch": 3445} {"train_loss": -25.650182723999023, "global_step": 285997, "epoch": 3445} {"train_loss": -25.802886962890625, "global_step": 285998, "epoch": 3445} {"train_loss": -25.739566802978516, "global_step": 285999, "epoch": 3445} {"train_loss": -25.670379638671875, "global_step": 286000, "epoch": 3445} {"train_loss": -25.832489013671875, "global_step": 286001, "epoch": 3445} {"train_loss": -25.57929801940918, "global_step": 286002, "epoch": 3445} {"train_loss": -25.49602699279785, "global_step": 286003, "epoch": 3445} {"train_loss": -25.53708267211914, "global_step": 286004, "epoch": 3445} {"train_loss": -25.72071647644043, "global_step": 286005, "epoch": 3445} {"train_loss": -25.635435104370117, "global_step": 286006, "epoch": 3445} {"train_loss": -25.57098388671875, "global_step": 286007, "epoch": 3445} {"train_loss": -25.583784103393555, "global_step": 286008, "epoch": 3445} {"train_loss": -25.56540298461914, "global_step": 286009, "epoch": 3445} {"train_loss": -25.315793991088867, "global_step": 286010, "epoch": 3445} {"train_loss": -25.648740768432617, "global_step": 286011, "epoch": 3445} {"train_loss": -25.537668228149414, "global_step": 286012, "epoch": 3445} {"train_loss": -25.79970359802246, "global_step": 286013, "epoch": 3445} {"train_loss": -25.92205810546875, "global_step": 286014, "epoch": 3445} {"train_loss": -25.578048706054688, "global_step": 286015, "epoch": 3445} {"train_loss": -25.33721923828125, "global_step": 286016, "epoch": 3445} {"train_loss": -25.42319750498576, "global_step": 286017, "epoch": 3445, "val_loss": 7168305.0} {"train_loss": -25.4623966217041, "global_step": 286018, "epoch": 3446} {"train_loss": -24.8369197845459, "global_step": 286019, "epoch": 3446} {"train_loss": -25.183231353759766, "global_step": 286020, "epoch": 3446} {"train_loss": -25.380014419555664, "global_step": 286021, "epoch": 3446} {"train_loss": -25.3536319732666, "global_step": 286022, "epoch": 3446} {"train_loss": -25.215686798095703, "global_step": 286023, "epoch": 3446} {"train_loss": -25.07565689086914, "global_step": 286024, "epoch": 3446} {"train_loss": -24.62703514099121, "global_step": 286025, "epoch": 3446} {"train_loss": -25.42079734802246, "global_step": 286026, "epoch": 3446} {"train_loss": -24.8040771484375, "global_step": 286027, "epoch": 3446} {"train_loss": -25.312021255493164, "global_step": 286028, "epoch": 3446} {"train_loss": -25.117916107177734, "global_step": 286029, "epoch": 3446} {"train_loss": -25.382421493530273, "global_step": 286030, "epoch": 3446} {"train_loss": -25.106712341308594, "global_step": 286031, "epoch": 3446} {"train_loss": -25.575437545776367, "global_step": 286032, "epoch": 3446} {"train_loss": -25.055477142333984, "global_step": 286033, "epoch": 3446} {"train_loss": -25.19847297668457, "global_step": 286034, "epoch": 3446} {"train_loss": -25.30594825744629, "global_step": 286035, "epoch": 3446} {"train_loss": -25.24464988708496, "global_step": 286036, "epoch": 3446} {"train_loss": -25.229215621948242, "global_step": 286037, "epoch": 3446} {"train_loss": -25.0929012298584, "global_step": 286038, "epoch": 3446} {"train_loss": -25.293981552124023, "global_step": 286039, "epoch": 3446} {"train_loss": -25.353038787841797, "global_step": 286040, "epoch": 3446} {"train_loss": -25.29021644592285, "global_step": 286041, "epoch": 3446} {"train_loss": -25.11197280883789, "global_step": 286042, "epoch": 3446} {"train_loss": -25.57497215270996, "global_step": 286043, "epoch": 3446} {"train_loss": -24.978662490844727, "global_step": 286044, "epoch": 3446} {"train_loss": -25.424238204956055, "global_step": 286045, "epoch": 3446} {"train_loss": -25.698827743530273, "global_step": 286046, "epoch": 3446} {"train_loss": -25.333696365356445, "global_step": 286047, "epoch": 3446} {"train_loss": -25.52161979675293, "global_step": 286048, "epoch": 3446} {"train_loss": -25.58962059020996, "global_step": 286049, "epoch": 3446} {"train_loss": -25.2966365814209, "global_step": 286050, "epoch": 3446} {"train_loss": -25.60431480407715, "global_step": 286051, "epoch": 3446} {"train_loss": -25.70781898498535, "global_step": 286052, "epoch": 3446} {"train_loss": -25.551313400268555, "global_step": 286053, "epoch": 3446} {"train_loss": -25.222742080688477, "global_step": 286054, "epoch": 3446} {"train_loss": -25.601789474487305, "global_step": 286055, "epoch": 3446} {"train_loss": -25.209423065185547, "global_step": 286056, "epoch": 3446} {"train_loss": -25.538724899291992, "global_step": 286057, "epoch": 3446} {"train_loss": -25.575057983398438, "global_step": 286058, "epoch": 3446} {"train_loss": -25.818288803100586, "global_step": 286059, "epoch": 3446} {"train_loss": -25.745359420776367, "global_step": 286060, "epoch": 3446} {"train_loss": -25.57979965209961, "global_step": 286061, "epoch": 3446} {"train_loss": -25.222015380859375, "global_step": 286062, "epoch": 3446} {"train_loss": -25.572450637817383, "global_step": 286063, "epoch": 3446} {"train_loss": -25.537067413330078, "global_step": 286064, "epoch": 3446} {"train_loss": -25.387033462524414, "global_step": 286065, "epoch": 3446} {"train_loss": -25.245649337768555, "global_step": 286066, "epoch": 3446} {"train_loss": -25.396793365478516, "global_step": 286067, "epoch": 3446} {"train_loss": -24.65321922302246, "global_step": 286068, "epoch": 3446} {"train_loss": -24.743738174438477, "global_step": 286069, "epoch": 3446} {"train_loss": -25.045814514160156, "global_step": 286070, "epoch": 3446} {"train_loss": -25.183124542236328, "global_step": 286071, "epoch": 3446} {"train_loss": -25.20110321044922, "global_step": 286072, "epoch": 3446} {"train_loss": -25.65388298034668, "global_step": 286073, "epoch": 3446} {"train_loss": -24.89753532409668, "global_step": 286074, "epoch": 3446} {"train_loss": -25.419273376464844, "global_step": 286075, "epoch": 3446} {"train_loss": -24.847179412841797, "global_step": 286076, "epoch": 3446} {"train_loss": -25.271642684936523, "global_step": 286077, "epoch": 3446} {"train_loss": -25.453826904296875, "global_step": 286078, "epoch": 3446} {"train_loss": -25.46735954284668, "global_step": 286079, "epoch": 3446} {"train_loss": -25.158519744873047, "global_step": 286080, "epoch": 3446} {"train_loss": -25.21410369873047, "global_step": 286081, "epoch": 3446} {"train_loss": -25.69211196899414, "global_step": 286082, "epoch": 3446} {"train_loss": -25.8261661529541, "global_step": 286083, "epoch": 3446} {"train_loss": -25.746225357055664, "global_step": 286084, "epoch": 3446} {"train_loss": -24.976760864257812, "global_step": 286085, "epoch": 3446} {"train_loss": -24.91938018798828, "global_step": 286086, "epoch": 3446} {"train_loss": -25.462440490722656, "global_step": 286087, "epoch": 3446} {"train_loss": -25.483524322509766, "global_step": 286088, "epoch": 3446} {"train_loss": -25.312387466430664, "global_step": 286089, "epoch": 3446} {"train_loss": -25.474565505981445, "global_step": 286090, "epoch": 3446} {"train_loss": -25.29075050354004, "global_step": 286091, "epoch": 3446} {"train_loss": -25.820154190063477, "global_step": 286092, "epoch": 3446} {"train_loss": -25.24209976196289, "global_step": 286093, "epoch": 3446} {"train_loss": -25.635828018188477, "global_step": 286094, "epoch": 3446} {"train_loss": -25.5596923828125, "global_step": 286095, "epoch": 3446} {"train_loss": -25.3369140625, "global_step": 286096, "epoch": 3446} {"train_loss": -25.598182678222656, "global_step": 286097, "epoch": 3446} {"train_loss": -25.984073638916016, "global_step": 286098, "epoch": 3446} {"train_loss": -25.739059448242188, "global_step": 286099, "epoch": 3446} {"train_loss": -25.347339538206537, "global_step": 286100, "epoch": 3446, "val_loss": 7130711.5} {"train_loss": -25.501827239990234, "global_step": 286101, "epoch": 3447} {"train_loss": -25.014753341674805, "global_step": 286102, "epoch": 3447} {"train_loss": -25.362186431884766, "global_step": 286103, "epoch": 3447} {"train_loss": -25.18213653564453, "global_step": 286104, "epoch": 3447} {"train_loss": -25.60614585876465, "global_step": 286105, "epoch": 3447} {"train_loss": -25.55245018005371, "global_step": 286106, "epoch": 3447} {"train_loss": -25.341190338134766, "global_step": 286107, "epoch": 3447} {"train_loss": -25.63858985900879, "global_step": 286108, "epoch": 3447} {"train_loss": -24.832677841186523, "global_step": 286109, "epoch": 3447} {"train_loss": -25.40834617614746, "global_step": 286110, "epoch": 3447} {"train_loss": -25.530324935913086, "global_step": 286111, "epoch": 3447} {"train_loss": -25.481826782226562, "global_step": 286112, "epoch": 3447} {"train_loss": -25.432849884033203, "global_step": 286113, "epoch": 3447} {"train_loss": -25.434001922607422, "global_step": 286114, "epoch": 3447} {"train_loss": -25.093555450439453, "global_step": 286115, "epoch": 3447} {"train_loss": -25.751087188720703, "global_step": 286116, "epoch": 3447} {"train_loss": -25.447736740112305, "global_step": 286117, "epoch": 3447} {"train_loss": -25.764135360717773, "global_step": 286118, "epoch": 3447} {"train_loss": -25.63071632385254, "global_step": 286119, "epoch": 3447} {"train_loss": -25.827245712280273, "global_step": 286120, "epoch": 3447} {"train_loss": -25.493942260742188, "global_step": 286121, "epoch": 3447} {"train_loss": -25.66373634338379, "global_step": 286122, "epoch": 3447} {"train_loss": -25.48188018798828, "global_step": 286123, "epoch": 3447} {"train_loss": -25.5072078704834, "global_step": 286124, "epoch": 3447} {"train_loss": -25.35679054260254, "global_step": 286125, "epoch": 3447} {"train_loss": -25.386457443237305, "global_step": 286126, "epoch": 3447} {"train_loss": -25.396512985229492, "global_step": 286127, "epoch": 3447} {"train_loss": -25.681650161743164, "global_step": 286128, "epoch": 3447} {"train_loss": -25.418193817138672, "global_step": 286129, "epoch": 3447} {"train_loss": -25.199533462524414, "global_step": 286130, "epoch": 3447} {"train_loss": -25.406801223754883, "global_step": 286131, "epoch": 3447} {"train_loss": -25.472543716430664, "global_step": 286132, "epoch": 3447} {"train_loss": -25.42827796936035, "global_step": 286133, "epoch": 3447} {"train_loss": -25.701040267944336, "global_step": 286134, "epoch": 3447} {"train_loss": -26.18170166015625, "global_step": 286135, "epoch": 3447} {"train_loss": -25.69931411743164, "global_step": 286136, "epoch": 3447} {"train_loss": -25.664093017578125, "global_step": 286137, "epoch": 3447} {"train_loss": -25.642108917236328, "global_step": 286138, "epoch": 3447} {"train_loss": -25.512744903564453, "global_step": 286139, "epoch": 3447} {"train_loss": -25.4576473236084, "global_step": 286140, "epoch": 3447} {"train_loss": -25.253299713134766, "global_step": 286141, "epoch": 3447} {"train_loss": -25.491636276245117, "global_step": 286142, "epoch": 3447} {"train_loss": -25.430971145629883, "global_step": 286143, "epoch": 3447} {"train_loss": -25.60297203063965, "global_step": 286144, "epoch": 3447} {"train_loss": -25.313337326049805, "global_step": 286145, "epoch": 3447} {"train_loss": -25.31691551208496, "global_step": 286146, "epoch": 3447} {"train_loss": -25.654356002807617, "global_step": 286147, "epoch": 3447} {"train_loss": -24.769136428833008, "global_step": 286148, "epoch": 3447} {"train_loss": -25.35181999206543, "global_step": 286149, "epoch": 3447} {"train_loss": -25.41994857788086, "global_step": 286150, "epoch": 3447} {"train_loss": -24.551984786987305, "global_step": 286151, "epoch": 3447} {"train_loss": -25.762006759643555, "global_step": 286152, "epoch": 3447} {"train_loss": -25.035856246948242, "global_step": 286153, "epoch": 3447} {"train_loss": -25.10455894470215, "global_step": 286154, "epoch": 3447} {"train_loss": -25.2528076171875, "global_step": 286155, "epoch": 3447} {"train_loss": -24.63180923461914, "global_step": 286156, "epoch": 3447} {"train_loss": -25.096967697143555, "global_step": 286157, "epoch": 3447} {"train_loss": -25.11751937866211, "global_step": 286158, "epoch": 3447} {"train_loss": -25.333877563476562, "global_step": 286159, "epoch": 3447} {"train_loss": -25.216999053955078, "global_step": 286160, "epoch": 3447} {"train_loss": -25.46807861328125, "global_step": 286161, "epoch": 3447} {"train_loss": -25.42413330078125, "global_step": 286162, "epoch": 3447} {"train_loss": -25.539325714111328, "global_step": 286163, "epoch": 3447} {"train_loss": -25.53096580505371, "global_step": 286164, "epoch": 3447} {"train_loss": -25.3560733795166, "global_step": 286165, "epoch": 3447} {"train_loss": -25.428939819335938, "global_step": 286166, "epoch": 3447} {"train_loss": -25.55782127380371, "global_step": 286167, "epoch": 3447} {"train_loss": -25.324167251586914, "global_step": 286168, "epoch": 3447} {"train_loss": -25.414487838745117, "global_step": 286169, "epoch": 3447} {"train_loss": -25.167728424072266, "global_step": 286170, "epoch": 3447} {"train_loss": -24.880983352661133, "global_step": 286171, "epoch": 3447} {"train_loss": -25.435483932495117, "global_step": 286172, "epoch": 3447} {"train_loss": -25.5892333984375, "global_step": 286173, "epoch": 3447} {"train_loss": -25.252370834350586, "global_step": 286174, "epoch": 3447} {"train_loss": -25.54057502746582, "global_step": 286175, "epoch": 3447} {"train_loss": -25.594453811645508, "global_step": 286176, "epoch": 3447} {"train_loss": -25.635766983032227, "global_step": 286177, "epoch": 3447} {"train_loss": -25.804296493530273, "global_step": 286178, "epoch": 3447} {"train_loss": -25.547780990600586, "global_step": 286179, "epoch": 3447} {"train_loss": -25.3761043548584, "global_step": 286180, "epoch": 3447} {"train_loss": -25.53114128112793, "global_step": 286181, "epoch": 3447} {"train_loss": -25.64858055114746, "global_step": 286182, "epoch": 3447} {"train_loss": -25.420889015657355, "global_step": 286183, "epoch": 3447, "val_loss": 7070415.0} {"train_loss": -24.63759422302246, "global_step": 286184, "epoch": 3448} {"train_loss": -24.72867774963379, "global_step": 286185, "epoch": 3448} {"train_loss": -24.812442779541016, "global_step": 286186, "epoch": 3448} {"train_loss": -24.687368392944336, "global_step": 286187, "epoch": 3448} {"train_loss": -24.453296661376953, "global_step": 286188, "epoch": 3448} {"train_loss": -24.879274368286133, "global_step": 286189, "epoch": 3448} {"train_loss": -25.04416275024414, "global_step": 286190, "epoch": 3448} {"train_loss": -25.309728622436523, "global_step": 286191, "epoch": 3448} {"train_loss": -24.62890625, "global_step": 286192, "epoch": 3448} {"train_loss": -25.120960235595703, "global_step": 286193, "epoch": 3448} {"train_loss": -25.434064865112305, "global_step": 286194, "epoch": 3448} {"train_loss": -24.821279525756836, "global_step": 286195, "epoch": 3448} {"train_loss": -25.276386260986328, "global_step": 286196, "epoch": 3448} {"train_loss": -25.438268661499023, "global_step": 286197, "epoch": 3448} {"train_loss": -25.440351486206055, "global_step": 286198, "epoch": 3448} {"train_loss": -25.383623123168945, "global_step": 286199, "epoch": 3448} {"train_loss": -25.18332862854004, "global_step": 286200, "epoch": 3448} {"train_loss": -25.093774795532227, "global_step": 286201, "epoch": 3448} {"train_loss": -25.320173263549805, "global_step": 286202, "epoch": 3448} {"train_loss": -25.379945755004883, "global_step": 286203, "epoch": 3448} {"train_loss": -25.455345153808594, "global_step": 286204, "epoch": 3448} {"train_loss": -25.47356605529785, "global_step": 286205, "epoch": 3448} {"train_loss": -25.32736587524414, "global_step": 286206, "epoch": 3448} {"train_loss": -25.424463272094727, "global_step": 286207, "epoch": 3448} {"train_loss": -25.286344528198242, "global_step": 286208, "epoch": 3448} {"train_loss": -25.643301010131836, "global_step": 286209, "epoch": 3448} {"train_loss": -25.43483543395996, "global_step": 286210, "epoch": 3448} {"train_loss": -25.3073673248291, "global_step": 286211, "epoch": 3448} {"train_loss": -25.806121826171875, "global_step": 286212, "epoch": 3448} {"train_loss": -25.55915069580078, "global_step": 286213, "epoch": 3448} {"train_loss": -25.1964054107666, "global_step": 286214, "epoch": 3448} {"train_loss": -25.221336364746094, "global_step": 286215, "epoch": 3448} {"train_loss": -25.13551139831543, "global_step": 286216, "epoch": 3448} {"train_loss": -25.284671783447266, "global_step": 286217, "epoch": 3448} {"train_loss": -25.429224014282227, "global_step": 286218, "epoch": 3448} {"train_loss": -25.38831901550293, "global_step": 286219, "epoch": 3448} {"train_loss": -24.784467697143555, "global_step": 286220, "epoch": 3448} {"train_loss": -25.3583927154541, "global_step": 286221, "epoch": 3448} {"train_loss": -25.922582626342773, "global_step": 286222, "epoch": 3448} {"train_loss": -25.09626579284668, "global_step": 286223, "epoch": 3448} {"train_loss": -25.641040802001953, "global_step": 286224, "epoch": 3448} {"train_loss": -25.63702392578125, "global_step": 286225, "epoch": 3448} {"train_loss": -25.5044002532959, "global_step": 286226, "epoch": 3448} {"train_loss": -25.571741104125977, "global_step": 286227, "epoch": 3448} {"train_loss": -25.932159423828125, "global_step": 286228, "epoch": 3448} {"train_loss": -25.37188148498535, "global_step": 286229, "epoch": 3448} {"train_loss": -25.893817901611328, "global_step": 286230, "epoch": 3448} {"train_loss": -25.870779037475586, "global_step": 286231, "epoch": 3448} {"train_loss": -25.5089054107666, "global_step": 286232, "epoch": 3448} {"train_loss": -25.094594955444336, "global_step": 286233, "epoch": 3448} {"train_loss": -25.553836822509766, "global_step": 286234, "epoch": 3448} {"train_loss": -25.18926239013672, "global_step": 286235, "epoch": 3448} {"train_loss": -25.4311580657959, "global_step": 286236, "epoch": 3448} {"train_loss": -25.693618774414062, "global_step": 286237, "epoch": 3448} {"train_loss": -25.485774993896484, "global_step": 286238, "epoch": 3448} {"train_loss": -25.66689109802246, "global_step": 286239, "epoch": 3448} {"train_loss": -25.449270248413086, "global_step": 286240, "epoch": 3448} {"train_loss": -25.543642044067383, "global_step": 286241, "epoch": 3448} {"train_loss": -25.521419525146484, "global_step": 286242, "epoch": 3448} {"train_loss": -25.50221824645996, "global_step": 286243, "epoch": 3448} {"train_loss": -25.02676010131836, "global_step": 286244, "epoch": 3448} {"train_loss": -25.363000869750977, "global_step": 286245, "epoch": 3448} {"train_loss": -25.82526969909668, "global_step": 286246, "epoch": 3448} {"train_loss": -25.26822280883789, "global_step": 286247, "epoch": 3448} {"train_loss": -25.529296875, "global_step": 286248, "epoch": 3448} {"train_loss": -25.734466552734375, "global_step": 286249, "epoch": 3448} {"train_loss": -25.588064193725586, "global_step": 286250, "epoch": 3448} {"train_loss": -25.22952651977539, "global_step": 286251, "epoch": 3448} {"train_loss": -25.76401710510254, "global_step": 286252, "epoch": 3448} {"train_loss": -25.695331573486328, "global_step": 286253, "epoch": 3448} {"train_loss": -25.54969596862793, "global_step": 286254, "epoch": 3448} {"train_loss": -25.392704010009766, "global_step": 286255, "epoch": 3448} {"train_loss": -25.69831657409668, "global_step": 286256, "epoch": 3448} {"train_loss": -25.503292083740234, "global_step": 286257, "epoch": 3448} {"train_loss": -25.36311912536621, "global_step": 286258, "epoch": 3448} {"train_loss": -25.494924545288086, "global_step": 286259, "epoch": 3448} {"train_loss": -25.303346633911133, "global_step": 286260, "epoch": 3448} {"train_loss": -25.534311294555664, "global_step": 286261, "epoch": 3448} {"train_loss": -25.347476959228516, "global_step": 286262, "epoch": 3448} {"train_loss": -25.351734161376953, "global_step": 286263, "epoch": 3448} {"train_loss": -25.73850440979004, "global_step": 286264, "epoch": 3448} {"train_loss": -25.702747344970703, "global_step": 286265, "epoch": 3448} {"train_loss": -25.376359594873634, "global_step": 286266, "epoch": 3448, "val_loss": 7138746.0} {"train_loss": -24.921262741088867, "global_step": 286267, "epoch": 3449} {"train_loss": -24.437952041625977, "global_step": 286268, "epoch": 3449} {"train_loss": -24.551786422729492, "global_step": 286269, "epoch": 3449} {"train_loss": -24.581342697143555, "global_step": 286270, "epoch": 3449} {"train_loss": -24.892248153686523, "global_step": 286271, "epoch": 3449} {"train_loss": -24.45746612548828, "global_step": 286272, "epoch": 3449} {"train_loss": -24.978322982788086, "global_step": 286273, "epoch": 3449} {"train_loss": -24.599872589111328, "global_step": 286274, "epoch": 3449} {"train_loss": -24.946382522583008, "global_step": 286275, "epoch": 3449} {"train_loss": -24.82870864868164, "global_step": 286276, "epoch": 3449} {"train_loss": -24.61710548400879, "global_step": 286277, "epoch": 3449} {"train_loss": -25.089250564575195, "global_step": 286278, "epoch": 3449} {"train_loss": -24.736799240112305, "global_step": 286279, "epoch": 3449} {"train_loss": -24.665241241455078, "global_step": 286280, "epoch": 3449} {"train_loss": -25.001834869384766, "global_step": 286281, "epoch": 3449} {"train_loss": -24.931577682495117, "global_step": 286282, "epoch": 3449} {"train_loss": -24.82148551940918, "global_step": 286283, "epoch": 3449} {"train_loss": -25.14946937561035, "global_step": 286284, "epoch": 3449} {"train_loss": -25.289392471313477, "global_step": 286285, "epoch": 3449} {"train_loss": -25.20977210998535, "global_step": 286286, "epoch": 3449} {"train_loss": -25.09650993347168, "global_step": 286287, "epoch": 3449} {"train_loss": -25.050613403320312, "global_step": 286288, "epoch": 3449} {"train_loss": -25.021896362304688, "global_step": 286289, "epoch": 3449} {"train_loss": -25.56262969970703, "global_step": 286290, "epoch": 3449} {"train_loss": -25.33027458190918, "global_step": 286291, "epoch": 3449} {"train_loss": -25.35529136657715, "global_step": 286292, "epoch": 3449} {"train_loss": -25.143009185791016, "global_step": 286293, "epoch": 3449} {"train_loss": -25.356645584106445, "global_step": 286294, "epoch": 3449} {"train_loss": -25.268735885620117, "global_step": 286295, "epoch": 3449} {"train_loss": -25.376432418823242, "global_step": 286296, "epoch": 3449} {"train_loss": -25.6274356842041, "global_step": 286297, "epoch": 3449} {"train_loss": -25.66162109375, "global_step": 286298, "epoch": 3449} {"train_loss": -25.2724609375, "global_step": 286299, "epoch": 3449} {"train_loss": -25.59772300720215, "global_step": 286300, "epoch": 3449} {"train_loss": -25.551063537597656, "global_step": 286301, "epoch": 3449} {"train_loss": -25.18617057800293, "global_step": 286302, "epoch": 3449} {"train_loss": -25.677936553955078, "global_step": 286303, "epoch": 3449} {"train_loss": -25.574073791503906, "global_step": 286304, "epoch": 3449} {"train_loss": -25.372730255126953, "global_step": 286305, "epoch": 3449} {"train_loss": -25.741064071655273, "global_step": 286306, "epoch": 3449} {"train_loss": -25.49798583984375, "global_step": 286307, "epoch": 3449} {"train_loss": -25.40932273864746, "global_step": 286308, "epoch": 3449} {"train_loss": -25.356840133666992, "global_step": 286309, "epoch": 3449} {"train_loss": -25.505298614501953, "global_step": 286310, "epoch": 3449} {"train_loss": -25.424713134765625, "global_step": 286311, "epoch": 3449} {"train_loss": -25.387468338012695, "global_step": 286312, "epoch": 3449} {"train_loss": -25.6660099029541, "global_step": 286313, "epoch": 3449} {"train_loss": -25.28728485107422, "global_step": 286314, "epoch": 3449} {"train_loss": -25.579845428466797, "global_step": 286315, "epoch": 3449} {"train_loss": -25.62784767150879, "global_step": 286316, "epoch": 3449} {"train_loss": -25.50035285949707, "global_step": 286317, "epoch": 3449} {"train_loss": -26.0220890045166, "global_step": 286318, "epoch": 3449} {"train_loss": -25.898914337158203, "global_step": 286319, "epoch": 3449} {"train_loss": -25.63326072692871, "global_step": 286320, "epoch": 3449} {"train_loss": -25.727075576782227, "global_step": 286321, "epoch": 3449} {"train_loss": -25.562835693359375, "global_step": 286322, "epoch": 3449} {"train_loss": -25.580726623535156, "global_step": 286323, "epoch": 3449} {"train_loss": -25.42203712463379, "global_step": 286324, "epoch": 3449} {"train_loss": -25.85432243347168, "global_step": 286325, "epoch": 3449} {"train_loss": -25.76875877380371, "global_step": 286326, "epoch": 3449} {"train_loss": -25.559860229492188, "global_step": 286327, "epoch": 3449} {"train_loss": -25.966089248657227, "global_step": 286328, "epoch": 3449} {"train_loss": -25.386083602905273, "global_step": 286329, "epoch": 3449} {"train_loss": -25.455923080444336, "global_step": 286330, "epoch": 3449} {"train_loss": -25.633193969726562, "global_step": 286331, "epoch": 3449} {"train_loss": -25.228580474853516, "global_step": 286332, "epoch": 3449} {"train_loss": -25.169057846069336, "global_step": 286333, "epoch": 3449} {"train_loss": -25.166919708251953, "global_step": 286334, "epoch": 3449} {"train_loss": -25.353662490844727, "global_step": 286335, "epoch": 3449} {"train_loss": -25.40015983581543, "global_step": 286336, "epoch": 3449} {"train_loss": -25.290699005126953, "global_step": 286337, "epoch": 3449} {"train_loss": -25.645526885986328, "global_step": 286338, "epoch": 3449} {"train_loss": -25.484363555908203, "global_step": 286339, "epoch": 3449} {"train_loss": -25.595117568969727, "global_step": 286340, "epoch": 3449} {"train_loss": -25.589494705200195, "global_step": 286341, "epoch": 3449} {"train_loss": -25.110883712768555, "global_step": 286342, "epoch": 3449} {"train_loss": -25.6552791595459, "global_step": 286343, "epoch": 3449} {"train_loss": -25.041446685791016, "global_step": 286344, "epoch": 3449} {"train_loss": -25.3283634185791, "global_step": 286345, "epoch": 3449} {"train_loss": -25.12082862854004, "global_step": 286346, "epoch": 3449} {"train_loss": -25.4354305267334, "global_step": 286347, "epoch": 3449} {"train_loss": -25.405805587768555, "global_step": 286348, "epoch": 3449} {"train_loss": -25.295949935913086, "global_step": 286349, "epoch": 3449, "val_loss": 7222193.0} {"train_loss": -24.620506286621094, "global_step": 286350, "epoch": 3450} {"train_loss": -24.83321762084961, "global_step": 286351, "epoch": 3450} {"train_loss": -25.11199951171875, "global_step": 286352, "epoch": 3450} {"train_loss": -24.89051055908203, "global_step": 286353, "epoch": 3450} {"train_loss": -24.757381439208984, "global_step": 286354, "epoch": 3450} {"train_loss": -24.781856536865234, "global_step": 286355, "epoch": 3450} {"train_loss": -25.113874435424805, "global_step": 286356, "epoch": 3450} {"train_loss": -25.27772331237793, "global_step": 286357, "epoch": 3450} {"train_loss": -25.378437042236328, "global_step": 286358, "epoch": 3450} {"train_loss": -25.01374626159668, "global_step": 286359, "epoch": 3450} {"train_loss": -25.05099868774414, "global_step": 286360, "epoch": 3450} {"train_loss": -24.83051872253418, "global_step": 286361, "epoch": 3450} {"train_loss": -25.412742614746094, "global_step": 286362, "epoch": 3450} {"train_loss": -25.342159271240234, "global_step": 286363, "epoch": 3450} {"train_loss": -25.52707862854004, "global_step": 286364, "epoch": 3450} {"train_loss": -25.658588409423828, "global_step": 286365, "epoch": 3450} {"train_loss": -25.420047760009766, "global_step": 286366, "epoch": 3450} {"train_loss": -25.374576568603516, "global_step": 286367, "epoch": 3450} {"train_loss": -25.33340835571289, "global_step": 286368, "epoch": 3450} {"train_loss": -25.55748748779297, "global_step": 286369, "epoch": 3450} {"train_loss": -25.883459091186523, "global_step": 286370, "epoch": 3450} {"train_loss": -25.712324142456055, "global_step": 286371, "epoch": 3450} {"train_loss": -25.667343139648438, "global_step": 286372, "epoch": 3450} {"train_loss": -25.50565528869629, "global_step": 286373, "epoch": 3450} {"train_loss": -25.667463302612305, "global_step": 286374, "epoch": 3450} {"train_loss": -25.627532958984375, "global_step": 286375, "epoch": 3450} {"train_loss": -25.433744430541992, "global_step": 286376, "epoch": 3450} {"train_loss": -25.4665584564209, "global_step": 286377, "epoch": 3450} {"train_loss": -25.488981246948242, "global_step": 286378, "epoch": 3450} {"train_loss": -25.429929733276367, "global_step": 286379, "epoch": 3450} {"train_loss": -25.775226593017578, "global_step": 286380, "epoch": 3450} {"train_loss": -25.319339752197266, "global_step": 286381, "epoch": 3450} {"train_loss": -25.520505905151367, "global_step": 286382, "epoch": 3450} {"train_loss": -25.602025985717773, "global_step": 286383, "epoch": 3450} {"train_loss": -25.753189086914062, "global_step": 286384, "epoch": 3450} {"train_loss": -25.642423629760742, "global_step": 286385, "epoch": 3450} {"train_loss": -25.80694007873535, "global_step": 286386, "epoch": 3450} {"train_loss": -25.21877098083496, "global_step": 286387, "epoch": 3450} {"train_loss": -25.410688400268555, "global_step": 286388, "epoch": 3450} {"train_loss": -25.2011661529541, "global_step": 286389, "epoch": 3450} {"train_loss": -25.830785751342773, "global_step": 286390, "epoch": 3450} {"train_loss": -25.58856201171875, "global_step": 286391, "epoch": 3450} {"train_loss": -25.392282485961914, "global_step": 286392, "epoch": 3450} {"train_loss": -25.749868392944336, "global_step": 286393, "epoch": 3450} {"train_loss": -25.333507537841797, "global_step": 286394, "epoch": 3450} {"train_loss": -25.9783935546875, "global_step": 286395, "epoch": 3450} {"train_loss": -25.568044662475586, "global_step": 286396, "epoch": 3450} {"train_loss": -25.340547561645508, "global_step": 286397, "epoch": 3450} {"train_loss": -25.634967803955078, "global_step": 286398, "epoch": 3450} {"train_loss": -25.244230270385742, "global_step": 286399, "epoch": 3450} {"train_loss": -25.35565757751465, "global_step": 286400, "epoch": 3450} {"train_loss": -25.120542526245117, "global_step": 286401, "epoch": 3450} {"train_loss": -25.25654411315918, "global_step": 286402, "epoch": 3450} {"train_loss": -25.46470832824707, "global_step": 286403, "epoch": 3450} {"train_loss": -25.503660202026367, "global_step": 286404, "epoch": 3450} {"train_loss": -25.86669921875, "global_step": 286405, "epoch": 3450} {"train_loss": -25.53801918029785, "global_step": 286406, "epoch": 3450} {"train_loss": -25.340906143188477, "global_step": 286407, "epoch": 3450} {"train_loss": -25.32441520690918, "global_step": 286408, "epoch": 3450} {"train_loss": -25.57956886291504, "global_step": 286409, "epoch": 3450} {"train_loss": -25.282760620117188, "global_step": 286410, "epoch": 3450} {"train_loss": -25.67914390563965, "global_step": 286411, "epoch": 3450} {"train_loss": -25.485307693481445, "global_step": 286412, "epoch": 3450} {"train_loss": -25.77627944946289, "global_step": 286413, "epoch": 3450} {"train_loss": -25.875812530517578, "global_step": 286414, "epoch": 3450} {"train_loss": -25.453771591186523, "global_step": 286415, "epoch": 3450} {"train_loss": -25.447952270507812, "global_step": 286416, "epoch": 3450} {"train_loss": -25.960800170898438, "global_step": 286417, "epoch": 3450} {"train_loss": -25.355283737182617, "global_step": 286418, "epoch": 3450} {"train_loss": -25.5847225189209, "global_step": 286419, "epoch": 3450} {"train_loss": -25.548538208007812, "global_step": 286420, "epoch": 3450} {"train_loss": -25.339597702026367, "global_step": 286421, "epoch": 3450} {"train_loss": -25.53958511352539, "global_step": 286422, "epoch": 3450} {"train_loss": -25.358657836914062, "global_step": 286423, "epoch": 3450} {"train_loss": -26.07062339782715, "global_step": 286424, "epoch": 3450} {"train_loss": -25.27619743347168, "global_step": 286425, "epoch": 3450} {"train_loss": -25.23869514465332, "global_step": 286426, "epoch": 3450} {"train_loss": -25.05388641357422, "global_step": 286427, "epoch": 3450} {"train_loss": -24.841279983520508, "global_step": 286428, "epoch": 3450} {"train_loss": -25.328577041625977, "global_step": 286429, "epoch": 3450} {"train_loss": -25.352497100830078, "global_step": 286430, "epoch": 3450} {"train_loss": -24.94893455505371, "global_step": 286431, "epoch": 3450} {"train_loss": -25.403926274862634, "global_step": 286432, "epoch": 3450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 7136365.5} {"train_loss": -24.404190063476562, "global_step": 286433, "epoch": 3451} {"train_loss": -24.65435218811035, "global_step": 286434, "epoch": 3451} {"train_loss": -24.45876693725586, "global_step": 286435, "epoch": 3451} {"train_loss": -24.3308048248291, "global_step": 286436, "epoch": 3451} {"train_loss": -24.56610107421875, "global_step": 286437, "epoch": 3451} {"train_loss": -24.871816635131836, "global_step": 286438, "epoch": 3451} {"train_loss": -24.801496505737305, "global_step": 286439, "epoch": 3451} {"train_loss": -25.059843063354492, "global_step": 286440, "epoch": 3451} {"train_loss": -25.34000587463379, "global_step": 286441, "epoch": 3451} {"train_loss": -24.826862335205078, "global_step": 286442, "epoch": 3451} {"train_loss": -25.000146865844727, "global_step": 286443, "epoch": 3451} {"train_loss": -25.120792388916016, "global_step": 286444, "epoch": 3451} {"train_loss": -25.40778923034668, "global_step": 286445, "epoch": 3451} {"train_loss": -24.780183792114258, "global_step": 286446, "epoch": 3451} {"train_loss": -25.4570369720459, "global_step": 286447, "epoch": 3451} {"train_loss": -25.071292877197266, "global_step": 286448, "epoch": 3451} {"train_loss": -25.300968170166016, "global_step": 286449, "epoch": 3451} {"train_loss": -25.009695053100586, "global_step": 286450, "epoch": 3451} {"train_loss": -25.045169830322266, "global_step": 286451, "epoch": 3451} {"train_loss": -25.40806007385254, "global_step": 286452, "epoch": 3451} {"train_loss": -25.046873092651367, "global_step": 286453, "epoch": 3451} {"train_loss": -25.43117332458496, "global_step": 286454, "epoch": 3451} {"train_loss": -25.657001495361328, "global_step": 286455, "epoch": 3451} {"train_loss": -25.04526710510254, "global_step": 286456, "epoch": 3451} {"train_loss": -25.058637619018555, "global_step": 286457, "epoch": 3451} {"train_loss": -25.28892707824707, "global_step": 286458, "epoch": 3451} {"train_loss": -25.182043075561523, "global_step": 286459, "epoch": 3451} {"train_loss": -25.420822143554688, "global_step": 286460, "epoch": 3451} {"train_loss": -25.013822555541992, "global_step": 286461, "epoch": 3451} {"train_loss": -25.176742553710938, "global_step": 286462, "epoch": 3451} {"train_loss": -25.064151763916016, "global_step": 286463, "epoch": 3451} {"train_loss": -24.95313262939453, "global_step": 286464, "epoch": 3451} {"train_loss": -25.47917366027832, "global_step": 286465, "epoch": 3451} {"train_loss": -25.191455841064453, "global_step": 286466, "epoch": 3451} {"train_loss": -25.433332443237305, "global_step": 286467, "epoch": 3451} {"train_loss": -25.45090103149414, "global_step": 286468, "epoch": 3451} {"train_loss": -25.719457626342773, "global_step": 286469, "epoch": 3451} {"train_loss": -25.47208023071289, "global_step": 286470, "epoch": 3451} {"train_loss": -25.527578353881836, "global_step": 286471, "epoch": 3451} {"train_loss": -25.34574317932129, "global_step": 286472, "epoch": 3451} {"train_loss": -25.96082878112793, "global_step": 286473, "epoch": 3451} {"train_loss": -25.385446548461914, "global_step": 286474, "epoch": 3451} {"train_loss": -25.51039695739746, "global_step": 286475, "epoch": 3451} {"train_loss": -25.741865158081055, "global_step": 286476, "epoch": 3451} {"train_loss": -25.62532615661621, "global_step": 286477, "epoch": 3451} {"train_loss": -26.09588623046875, "global_step": 286478, "epoch": 3451} {"train_loss": -25.461456298828125, "global_step": 286479, "epoch": 3451} {"train_loss": -25.6434383392334, "global_step": 286480, "epoch": 3451} {"train_loss": -25.47917366027832, "global_step": 286481, "epoch": 3451} {"train_loss": -25.645893096923828, "global_step": 286482, "epoch": 3451} {"train_loss": -25.285785675048828, "global_step": 286483, "epoch": 3451} {"train_loss": -25.204906463623047, "global_step": 286484, "epoch": 3451} {"train_loss": -25.75217628479004, "global_step": 286485, "epoch": 3451} {"train_loss": -25.337087631225586, "global_step": 286486, "epoch": 3451} {"train_loss": -25.435468673706055, "global_step": 286487, "epoch": 3451} {"train_loss": -25.820886611938477, "global_step": 286488, "epoch": 3451} {"train_loss": -25.248023986816406, "global_step": 286489, "epoch": 3451} {"train_loss": -25.805810928344727, "global_step": 286490, "epoch": 3451} {"train_loss": -25.68584632873535, "global_step": 286491, "epoch": 3451} {"train_loss": -25.482501983642578, "global_step": 286492, "epoch": 3451} {"train_loss": -25.69867515563965, "global_step": 286493, "epoch": 3451} {"train_loss": -25.831079483032227, "global_step": 286494, "epoch": 3451} {"train_loss": -25.563451766967773, "global_step": 286495, "epoch": 3451} {"train_loss": -25.688180923461914, "global_step": 286496, "epoch": 3451} {"train_loss": -25.32701873779297, "global_step": 286497, "epoch": 3451} {"train_loss": -24.985593795776367, "global_step": 286498, "epoch": 3451} {"train_loss": -25.399991989135742, "global_step": 286499, "epoch": 3451} {"train_loss": -25.0393123626709, "global_step": 286500, "epoch": 3451} {"train_loss": -25.433862686157227, "global_step": 286501, "epoch": 3451} {"train_loss": -25.64385986328125, "global_step": 286502, "epoch": 3451} {"train_loss": -24.99349021911621, "global_step": 286503, "epoch": 3451} {"train_loss": -25.596616744995117, "global_step": 286504, "epoch": 3451} {"train_loss": -25.38875389099121, "global_step": 286505, "epoch": 3451} {"train_loss": -25.34808349609375, "global_step": 286506, "epoch": 3451} {"train_loss": -25.62969398498535, "global_step": 286507, "epoch": 3451} {"train_loss": -25.179494857788086, "global_step": 286508, "epoch": 3451} {"train_loss": -25.259374618530273, "global_step": 286509, "epoch": 3451} {"train_loss": -25.368757247924805, "global_step": 286510, "epoch": 3451} {"train_loss": -25.35918617248535, "global_step": 286511, "epoch": 3451} {"train_loss": -24.68830680847168, "global_step": 286512, "epoch": 3451} {"train_loss": -24.6588134765625, "global_step": 286513, "epoch": 3451} {"train_loss": -24.28196144104004, "global_step": 286514, "epoch": 3451} {"train_loss": -25.26392506978598, "global_step": 286515, "epoch": 3451, "val_loss": 7211412.0} {"train_loss": -24.145648956298828, "global_step": 286516, "epoch": 3452} {"train_loss": -24.587158203125, "global_step": 286517, "epoch": 3452} {"train_loss": -24.640230178833008, "global_step": 286518, "epoch": 3452} {"train_loss": -24.28778076171875, "global_step": 286519, "epoch": 3452} {"train_loss": -24.98111915588379, "global_step": 286520, "epoch": 3452} {"train_loss": -24.77414894104004, "global_step": 286521, "epoch": 3452} {"train_loss": -24.896020889282227, "global_step": 286522, "epoch": 3452} {"train_loss": -25.164587020874023, "global_step": 286523, "epoch": 3452} {"train_loss": -24.55182456970215, "global_step": 286524, "epoch": 3452} {"train_loss": -24.98848533630371, "global_step": 286525, "epoch": 3452} {"train_loss": -25.299467086791992, "global_step": 286526, "epoch": 3452} {"train_loss": -24.79767417907715, "global_step": 286527, "epoch": 3452} {"train_loss": -24.907581329345703, "global_step": 286528, "epoch": 3452} {"train_loss": -24.915897369384766, "global_step": 286529, "epoch": 3452} {"train_loss": -25.08265495300293, "global_step": 286530, "epoch": 3452} {"train_loss": -25.058156967163086, "global_step": 286531, "epoch": 3452} {"train_loss": -25.044010162353516, "global_step": 286532, "epoch": 3452} {"train_loss": -25.11760902404785, "global_step": 286533, "epoch": 3452} {"train_loss": -24.84604835510254, "global_step": 286534, "epoch": 3452} {"train_loss": -25.152204513549805, "global_step": 286535, "epoch": 3452} {"train_loss": -24.994260787963867, "global_step": 286536, "epoch": 3452} {"train_loss": -25.3767147064209, "global_step": 286537, "epoch": 3452} {"train_loss": -25.174203872680664, "global_step": 286538, "epoch": 3452} {"train_loss": -25.250375747680664, "global_step": 286539, "epoch": 3452} {"train_loss": -25.099960327148438, "global_step": 286540, "epoch": 3452} {"train_loss": -25.48540496826172, "global_step": 286541, "epoch": 3452} {"train_loss": -25.433435440063477, "global_step": 286542, "epoch": 3452} {"train_loss": -25.549245834350586, "global_step": 286543, "epoch": 3452} {"train_loss": -25.273794174194336, "global_step": 286544, "epoch": 3452} {"train_loss": -25.135467529296875, "global_step": 286545, "epoch": 3452} {"train_loss": -25.28260612487793, "global_step": 286546, "epoch": 3452} {"train_loss": -25.495420455932617, "global_step": 286547, "epoch": 3452} {"train_loss": -25.41006088256836, "global_step": 286548, "epoch": 3452} {"train_loss": -25.478374481201172, "global_step": 286549, "epoch": 3452} {"train_loss": -25.280624389648438, "global_step": 286550, "epoch": 3452} {"train_loss": -25.797483444213867, "global_step": 286551, "epoch": 3452} {"train_loss": -25.502445220947266, "global_step": 286552, "epoch": 3452} {"train_loss": -25.470348358154297, "global_step": 286553, "epoch": 3452} {"train_loss": -25.703418731689453, "global_step": 286554, "epoch": 3452} {"train_loss": -25.305166244506836, "global_step": 286555, "epoch": 3452} {"train_loss": -25.725229263305664, "global_step": 286556, "epoch": 3452} {"train_loss": -25.833724975585938, "global_step": 286557, "epoch": 3452} {"train_loss": -25.73160171508789, "global_step": 286558, "epoch": 3452} {"train_loss": -25.8301944732666, "global_step": 286559, "epoch": 3452} {"train_loss": -25.33730697631836, "global_step": 286560, "epoch": 3452} {"train_loss": -25.849706649780273, "global_step": 286561, "epoch": 3452} {"train_loss": -25.22280502319336, "global_step": 286562, "epoch": 3452} {"train_loss": -25.679489135742188, "global_step": 286563, "epoch": 3452} {"train_loss": -25.964155197143555, "global_step": 286564, "epoch": 3452} {"train_loss": -25.7957706451416, "global_step": 286565, "epoch": 3452} {"train_loss": -25.592575073242188, "global_step": 286566, "epoch": 3452} {"train_loss": -25.303306579589844, "global_step": 286567, "epoch": 3452} {"train_loss": -25.96270751953125, "global_step": 286568, "epoch": 3452} {"train_loss": -25.38760757446289, "global_step": 286569, "epoch": 3452} {"train_loss": -25.473602294921875, "global_step": 286570, "epoch": 3452} {"train_loss": -25.870529174804688, "global_step": 286571, "epoch": 3452} {"train_loss": -25.453554153442383, "global_step": 286572, "epoch": 3452} {"train_loss": -25.496397018432617, "global_step": 286573, "epoch": 3452} {"train_loss": -25.42323875427246, "global_step": 286574, "epoch": 3452} {"train_loss": -24.53192710876465, "global_step": 286575, "epoch": 3452} {"train_loss": -24.77438735961914, "global_step": 286576, "epoch": 3452} {"train_loss": -25.62154197692871, "global_step": 286577, "epoch": 3452} {"train_loss": -25.490116119384766, "global_step": 286578, "epoch": 3452} {"train_loss": -25.396636962890625, "global_step": 286579, "epoch": 3452} {"train_loss": -25.57831382751465, "global_step": 286580, "epoch": 3452} {"train_loss": -25.239721298217773, "global_step": 286581, "epoch": 3452} {"train_loss": -25.71213722229004, "global_step": 286582, "epoch": 3452} {"train_loss": -25.732177734375, "global_step": 286583, "epoch": 3452} {"train_loss": -25.36951446533203, "global_step": 286584, "epoch": 3452} {"train_loss": -25.306615829467773, "global_step": 286585, "epoch": 3452} {"train_loss": -25.58035659790039, "global_step": 286586, "epoch": 3452} {"train_loss": -25.644088745117188, "global_step": 286587, "epoch": 3452} {"train_loss": -25.072891235351562, "global_step": 286588, "epoch": 3452} {"train_loss": -25.627408981323242, "global_step": 286589, "epoch": 3452} {"train_loss": -25.701126098632812, "global_step": 286590, "epoch": 3452} {"train_loss": -25.4630069732666, "global_step": 286591, "epoch": 3452} {"train_loss": -25.161273956298828, "global_step": 286592, "epoch": 3452} {"train_loss": -25.22072982788086, "global_step": 286593, "epoch": 3452} {"train_loss": -25.513219833374023, "global_step": 286594, "epoch": 3452} {"train_loss": -25.27406120300293, "global_step": 286595, "epoch": 3452} {"train_loss": -24.91393280029297, "global_step": 286596, "epoch": 3452} {"train_loss": -25.690372467041016, "global_step": 286597, "epoch": 3452} {"train_loss": -25.31946683217244, "global_step": 286598, "epoch": 3452, "val_loss": 7174937.0} {"train_loss": -24.42280387878418, "global_step": 286599, "epoch": 3453} {"train_loss": -23.9390811920166, "global_step": 286600, "epoch": 3453} {"train_loss": -24.337875366210938, "global_step": 286601, "epoch": 3453} {"train_loss": -25.07741928100586, "global_step": 286602, "epoch": 3453} {"train_loss": -24.128129959106445, "global_step": 286603, "epoch": 3453} {"train_loss": -24.768268585205078, "global_step": 286604, "epoch": 3453} {"train_loss": -24.797285079956055, "global_step": 286605, "epoch": 3453} {"train_loss": -24.502399444580078, "global_step": 286606, "epoch": 3453} {"train_loss": -24.983144760131836, "global_step": 286607, "epoch": 3453} {"train_loss": -25.118457794189453, "global_step": 286608, "epoch": 3453} {"train_loss": -25.345457077026367, "global_step": 286609, "epoch": 3453} {"train_loss": -24.898910522460938, "global_step": 286610, "epoch": 3453} {"train_loss": -25.14887809753418, "global_step": 286611, "epoch": 3453} {"train_loss": -25.1608943939209, "global_step": 286612, "epoch": 3453} {"train_loss": -25.32560157775879, "global_step": 286613, "epoch": 3453} {"train_loss": -24.9874324798584, "global_step": 286614, "epoch": 3453} {"train_loss": -25.36858558654785, "global_step": 286615, "epoch": 3453} {"train_loss": -24.914587020874023, "global_step": 286616, "epoch": 3453} {"train_loss": -25.256147384643555, "global_step": 286617, "epoch": 3453} {"train_loss": -25.320249557495117, "global_step": 286618, "epoch": 3453} {"train_loss": -25.43903923034668, "global_step": 286619, "epoch": 3453} {"train_loss": -25.45894432067871, "global_step": 286620, "epoch": 3453} {"train_loss": -25.220867156982422, "global_step": 286621, "epoch": 3453} {"train_loss": -25.468795776367188, "global_step": 286622, "epoch": 3453} {"train_loss": -25.782251358032227, "global_step": 286623, "epoch": 3453} {"train_loss": -25.319379806518555, "global_step": 286624, "epoch": 3453} {"train_loss": -25.39435386657715, "global_step": 286625, "epoch": 3453} {"train_loss": -25.345081329345703, "global_step": 286626, "epoch": 3453} {"train_loss": -25.436071395874023, "global_step": 286627, "epoch": 3453} {"train_loss": -25.360563278198242, "global_step": 286628, "epoch": 3453} {"train_loss": -25.37750244140625, "global_step": 286629, "epoch": 3453} {"train_loss": -25.681283950805664, "global_step": 286630, "epoch": 3453} {"train_loss": -25.0532283782959, "global_step": 286631, "epoch": 3453} {"train_loss": -25.30084228515625, "global_step": 286632, "epoch": 3453} {"train_loss": -25.777969360351562, "global_step": 286633, "epoch": 3453} {"train_loss": -25.6944522857666, "global_step": 286634, "epoch": 3453} {"train_loss": -25.861377716064453, "global_step": 286635, "epoch": 3453} {"train_loss": -25.42154312133789, "global_step": 286636, "epoch": 3453} {"train_loss": -25.515323638916016, "global_step": 286637, "epoch": 3453} {"train_loss": -25.767480850219727, "global_step": 286638, "epoch": 3453} {"train_loss": -25.541894912719727, "global_step": 286639, "epoch": 3453} {"train_loss": -25.466049194335938, "global_step": 286640, "epoch": 3453} {"train_loss": -25.90839958190918, "global_step": 286641, "epoch": 3453} {"train_loss": -25.164915084838867, "global_step": 286642, "epoch": 3453} {"train_loss": -25.480783462524414, "global_step": 286643, "epoch": 3453} {"train_loss": -25.443206787109375, "global_step": 286644, "epoch": 3453} {"train_loss": -25.207014083862305, "global_step": 286645, "epoch": 3453} {"train_loss": -25.6905460357666, "global_step": 286646, "epoch": 3453} {"train_loss": -25.45197105407715, "global_step": 286647, "epoch": 3453} {"train_loss": -25.345468521118164, "global_step": 286648, "epoch": 3453} {"train_loss": -25.62177848815918, "global_step": 286649, "epoch": 3453} {"train_loss": -25.679309844970703, "global_step": 286650, "epoch": 3453} {"train_loss": -25.31865882873535, "global_step": 286651, "epoch": 3453} {"train_loss": -25.75520896911621, "global_step": 286652, "epoch": 3453} {"train_loss": -25.63496208190918, "global_step": 286653, "epoch": 3453} {"train_loss": -25.386144638061523, "global_step": 286654, "epoch": 3453} {"train_loss": -25.42398452758789, "global_step": 286655, "epoch": 3453} {"train_loss": -25.51410675048828, "global_step": 286656, "epoch": 3453} {"train_loss": -25.6611385345459, "global_step": 286657, "epoch": 3453} {"train_loss": -25.53547477722168, "global_step": 286658, "epoch": 3453} {"train_loss": -25.41440200805664, "global_step": 286659, "epoch": 3453} {"train_loss": -25.792936325073242, "global_step": 286660, "epoch": 3453} {"train_loss": -25.297386169433594, "global_step": 286661, "epoch": 3453} {"train_loss": -25.555578231811523, "global_step": 286662, "epoch": 3453} {"train_loss": -25.221500396728516, "global_step": 286663, "epoch": 3453} {"train_loss": -25.054107666015625, "global_step": 286664, "epoch": 3453} {"train_loss": -25.53757095336914, "global_step": 286665, "epoch": 3453} {"train_loss": -25.436113357543945, "global_step": 286666, "epoch": 3453} {"train_loss": -25.352380752563477, "global_step": 286667, "epoch": 3453} {"train_loss": -25.26320457458496, "global_step": 286668, "epoch": 3453} {"train_loss": -25.264820098876953, "global_step": 286669, "epoch": 3453} {"train_loss": -25.249862670898438, "global_step": 286670, "epoch": 3453} {"train_loss": -25.182809829711914, "global_step": 286671, "epoch": 3453} {"train_loss": -25.704320907592773, "global_step": 286672, "epoch": 3453} {"train_loss": -25.495004653930664, "global_step": 286673, "epoch": 3453} {"train_loss": -25.281911849975586, "global_step": 286674, "epoch": 3453} {"train_loss": -25.53540802001953, "global_step": 286675, "epoch": 3453} {"train_loss": -25.492876052856445, "global_step": 286676, "epoch": 3453} {"train_loss": -25.259939193725586, "global_step": 286677, "epoch": 3453} {"train_loss": -25.47161865234375, "global_step": 286678, "epoch": 3453} {"train_loss": -25.65888023376465, "global_step": 286679, "epoch": 3453} {"train_loss": -25.56331443786621, "global_step": 286680, "epoch": 3453} {"train_loss": -25.33391800845962, "global_step": 286681, "epoch": 3453, "val_loss": 7041562.0} {"train_loss": -24.710880279541016, "global_step": 286682, "epoch": 3454} {"train_loss": -25.276357650756836, "global_step": 286683, "epoch": 3454} {"train_loss": -24.60811424255371, "global_step": 286684, "epoch": 3454} {"train_loss": -25.43804931640625, "global_step": 286685, "epoch": 3454} {"train_loss": -24.951496124267578, "global_step": 286686, "epoch": 3454} {"train_loss": -25.04981231689453, "global_step": 286687, "epoch": 3454} {"train_loss": -25.21988868713379, "global_step": 286688, "epoch": 3454} {"train_loss": -25.059707641601562, "global_step": 286689, "epoch": 3454} {"train_loss": -24.918975830078125, "global_step": 286690, "epoch": 3454} {"train_loss": -25.037351608276367, "global_step": 286691, "epoch": 3454} {"train_loss": -24.95548439025879, "global_step": 286692, "epoch": 3454} {"train_loss": -25.096303939819336, "global_step": 286693, "epoch": 3454} {"train_loss": -25.097997665405273, "global_step": 286694, "epoch": 3454} {"train_loss": -25.21882438659668, "global_step": 286695, "epoch": 3454} {"train_loss": -25.560178756713867, "global_step": 286696, "epoch": 3454} {"train_loss": -25.272998809814453, "global_step": 286697, "epoch": 3454} {"train_loss": -25.783750534057617, "global_step": 286698, "epoch": 3454} {"train_loss": -25.52459144592285, "global_step": 286699, "epoch": 3454} {"train_loss": -25.186973571777344, "global_step": 286700, "epoch": 3454} {"train_loss": -25.539600372314453, "global_step": 286701, "epoch": 3454} {"train_loss": -25.2160587310791, "global_step": 286702, "epoch": 3454} {"train_loss": -25.21943473815918, "global_step": 286703, "epoch": 3454} {"train_loss": -25.591796875, "global_step": 286704, "epoch": 3454} {"train_loss": -25.220693588256836, "global_step": 286705, "epoch": 3454} {"train_loss": -24.882383346557617, "global_step": 286706, "epoch": 3454} {"train_loss": -25.316635131835938, "global_step": 286707, "epoch": 3454} {"train_loss": -25.114038467407227, "global_step": 286708, "epoch": 3454} {"train_loss": -25.38206672668457, "global_step": 286709, "epoch": 3454} {"train_loss": -25.560945510864258, "global_step": 286710, "epoch": 3454} {"train_loss": -25.415496826171875, "global_step": 286711, "epoch": 3454} {"train_loss": -25.043109893798828, "global_step": 286712, "epoch": 3454} {"train_loss": -25.551599502563477, "global_step": 286713, "epoch": 3454} {"train_loss": -25.484830856323242, "global_step": 286714, "epoch": 3454} {"train_loss": -25.60752296447754, "global_step": 286715, "epoch": 3454} {"train_loss": -25.73493003845215, "global_step": 286716, "epoch": 3454} {"train_loss": -25.694196701049805, "global_step": 286717, "epoch": 3454} {"train_loss": -25.314504623413086, "global_step": 286718, "epoch": 3454} {"train_loss": -25.6685848236084, "global_step": 286719, "epoch": 3454} {"train_loss": -25.560400009155273, "global_step": 286720, "epoch": 3454} {"train_loss": -25.514875411987305, "global_step": 286721, "epoch": 3454} {"train_loss": -25.057706832885742, "global_step": 286722, "epoch": 3454} {"train_loss": -26.084333419799805, "global_step": 286723, "epoch": 3454} {"train_loss": -25.49146270751953, "global_step": 286724, "epoch": 3454} {"train_loss": -25.471647262573242, "global_step": 286725, "epoch": 3454} {"train_loss": -25.45794677734375, "global_step": 286726, "epoch": 3454} {"train_loss": -26.152631759643555, "global_step": 286727, "epoch": 3454} {"train_loss": -25.151334762573242, "global_step": 286728, "epoch": 3454} {"train_loss": -25.380056381225586, "global_step": 286729, "epoch": 3454} {"train_loss": -25.385089874267578, "global_step": 286730, "epoch": 3454} {"train_loss": -25.38329315185547, "global_step": 286731, "epoch": 3454} {"train_loss": -25.293596267700195, "global_step": 286732, "epoch": 3454} {"train_loss": -25.14344596862793, "global_step": 286733, "epoch": 3454} {"train_loss": -24.994443893432617, "global_step": 286734, "epoch": 3454} {"train_loss": -25.678083419799805, "global_step": 286735, "epoch": 3454} {"train_loss": -25.077871322631836, "global_step": 286736, "epoch": 3454} {"train_loss": -25.0654239654541, "global_step": 286737, "epoch": 3454} {"train_loss": -25.440610885620117, "global_step": 286738, "epoch": 3454} {"train_loss": -25.366342544555664, "global_step": 286739, "epoch": 3454} {"train_loss": -25.28951072692871, "global_step": 286740, "epoch": 3454} {"train_loss": -25.312580108642578, "global_step": 286741, "epoch": 3454} {"train_loss": -25.74393081665039, "global_step": 286742, "epoch": 3454} {"train_loss": -25.50881004333496, "global_step": 286743, "epoch": 3454} {"train_loss": -25.40189552307129, "global_step": 286744, "epoch": 3454} {"train_loss": -25.381460189819336, "global_step": 286745, "epoch": 3454} {"train_loss": -25.56390953063965, "global_step": 286746, "epoch": 3454} {"train_loss": -25.792266845703125, "global_step": 286747, "epoch": 3454} {"train_loss": -25.341819763183594, "global_step": 286748, "epoch": 3454} {"train_loss": -25.684040069580078, "global_step": 286749, "epoch": 3454} {"train_loss": -25.592390060424805, "global_step": 286750, "epoch": 3454} {"train_loss": -25.594097137451172, "global_step": 286751, "epoch": 3454} {"train_loss": -25.59103775024414, "global_step": 286752, "epoch": 3454} {"train_loss": -25.71689224243164, "global_step": 286753, "epoch": 3454} {"train_loss": -25.397619247436523, "global_step": 286754, "epoch": 3454} {"train_loss": -24.756484985351562, "global_step": 286755, "epoch": 3454} {"train_loss": -24.87879753112793, "global_step": 286756, "epoch": 3454} {"train_loss": -25.419570922851562, "global_step": 286757, "epoch": 3454} {"train_loss": -25.90478515625, "global_step": 286758, "epoch": 3454} {"train_loss": -25.36292839050293, "global_step": 286759, "epoch": 3454} {"train_loss": -25.253353118896484, "global_step": 286760, "epoch": 3454} {"train_loss": -25.330347061157227, "global_step": 286761, "epoch": 3454} {"train_loss": -25.215328216552734, "global_step": 286762, "epoch": 3454} {"train_loss": -25.14650535583496, "global_step": 286763, "epoch": 3454} {"train_loss": -25.344538493328784, "global_step": 286764, "epoch": 3454, "val_loss": 7152026.0} {"train_loss": -24.41828155517578, "global_step": 286765, "epoch": 3455} {"train_loss": -25.060293197631836, "global_step": 286766, "epoch": 3455} {"train_loss": -23.977252960205078, "global_step": 286767, "epoch": 3455} {"train_loss": -24.215702056884766, "global_step": 286768, "epoch": 3455} {"train_loss": -24.34964942932129, "global_step": 286769, "epoch": 3455} {"train_loss": -24.54926872253418, "global_step": 286770, "epoch": 3455} {"train_loss": -24.696842193603516, "global_step": 286771, "epoch": 3455} {"train_loss": -24.5831298828125, "global_step": 286772, "epoch": 3455} {"train_loss": -24.877300262451172, "global_step": 286773, "epoch": 3455} {"train_loss": -24.42279624938965, "global_step": 286774, "epoch": 3455} {"train_loss": -25.110300064086914, "global_step": 286775, "epoch": 3455} {"train_loss": -24.438495635986328, "global_step": 286776, "epoch": 3455} {"train_loss": -24.656518936157227, "global_step": 286777, "epoch": 3455} {"train_loss": -25.120075225830078, "global_step": 286778, "epoch": 3455} {"train_loss": -24.451396942138672, "global_step": 286779, "epoch": 3455} {"train_loss": -24.548171997070312, "global_step": 286780, "epoch": 3455} {"train_loss": -25.12942886352539, "global_step": 286781, "epoch": 3455} {"train_loss": -24.63218879699707, "global_step": 286782, "epoch": 3455} {"train_loss": -24.485868453979492, "global_step": 286783, "epoch": 3455} {"train_loss": -25.15910530090332, "global_step": 286784, "epoch": 3455} {"train_loss": -24.77128028869629, "global_step": 286785, "epoch": 3455} {"train_loss": -25.134069442749023, "global_step": 286786, "epoch": 3455} {"train_loss": -25.153894424438477, "global_step": 286787, "epoch": 3455} {"train_loss": -25.01646614074707, "global_step": 286788, "epoch": 3455} {"train_loss": -25.339582443237305, "global_step": 286789, "epoch": 3455} {"train_loss": -25.32637596130371, "global_step": 286790, "epoch": 3455} {"train_loss": -25.529361724853516, "global_step": 286791, "epoch": 3455} {"train_loss": -25.052946090698242, "global_step": 286792, "epoch": 3455} {"train_loss": -25.2413330078125, "global_step": 286793, "epoch": 3455} {"train_loss": -25.574853897094727, "global_step": 286794, "epoch": 3455} {"train_loss": -25.17256736755371, "global_step": 286795, "epoch": 3455} {"train_loss": -25.147384643554688, "global_step": 286796, "epoch": 3455} {"train_loss": -25.335147857666016, "global_step": 286797, "epoch": 3455} {"train_loss": -25.352598190307617, "global_step": 286798, "epoch": 3455} {"train_loss": -25.380252838134766, "global_step": 286799, "epoch": 3455} {"train_loss": -25.663055419921875, "global_step": 286800, "epoch": 3455} {"train_loss": -25.46346664428711, "global_step": 286801, "epoch": 3455} {"train_loss": -25.384939193725586, "global_step": 286802, "epoch": 3455} {"train_loss": -25.593780517578125, "global_step": 286803, "epoch": 3455} {"train_loss": -25.666839599609375, "global_step": 286804, "epoch": 3455} {"train_loss": -25.665945053100586, "global_step": 286805, "epoch": 3455} {"train_loss": -25.621240615844727, "global_step": 286806, "epoch": 3455} {"train_loss": -25.597763061523438, "global_step": 286807, "epoch": 3455} {"train_loss": -25.452035903930664, "global_step": 286808, "epoch": 3455} {"train_loss": -25.41035270690918, "global_step": 286809, "epoch": 3455} {"train_loss": -25.485692977905273, "global_step": 286810, "epoch": 3455} {"train_loss": -25.80855369567871, "global_step": 286811, "epoch": 3455} {"train_loss": -25.270679473876953, "global_step": 286812, "epoch": 3455} {"train_loss": -25.775623321533203, "global_step": 286813, "epoch": 3455} {"train_loss": -25.742618560791016, "global_step": 286814, "epoch": 3455} {"train_loss": -26.06768226623535, "global_step": 286815, "epoch": 3455} {"train_loss": -25.42449378967285, "global_step": 286816, "epoch": 3455} {"train_loss": -25.65352439880371, "global_step": 286817, "epoch": 3455} {"train_loss": -25.693002700805664, "global_step": 286818, "epoch": 3455} {"train_loss": -25.856903076171875, "global_step": 286819, "epoch": 3455} {"train_loss": -25.52235221862793, "global_step": 286820, "epoch": 3455} {"train_loss": -25.695966720581055, "global_step": 286821, "epoch": 3455} {"train_loss": -25.622989654541016, "global_step": 286822, "epoch": 3455} {"train_loss": -25.741979598999023, "global_step": 286823, "epoch": 3455} {"train_loss": -25.57468605041504, "global_step": 286824, "epoch": 3455} {"train_loss": -25.8239688873291, "global_step": 286825, "epoch": 3455} {"train_loss": -25.528194427490234, "global_step": 286826, "epoch": 3455} {"train_loss": -25.44953727722168, "global_step": 286827, "epoch": 3455} {"train_loss": -25.65286636352539, "global_step": 286828, "epoch": 3455} {"train_loss": -25.28993034362793, "global_step": 286829, "epoch": 3455} {"train_loss": -25.522706985473633, "global_step": 286830, "epoch": 3455} {"train_loss": -25.63677978515625, "global_step": 286831, "epoch": 3455} {"train_loss": -25.421018600463867, "global_step": 286832, "epoch": 3455} {"train_loss": -25.641462326049805, "global_step": 286833, "epoch": 3455} {"train_loss": -25.408294677734375, "global_step": 286834, "epoch": 3455} {"train_loss": -25.16701316833496, "global_step": 286835, "epoch": 3455} {"train_loss": -25.62607765197754, "global_step": 286836, "epoch": 3455} {"train_loss": -25.170347213745117, "global_step": 286837, "epoch": 3455} {"train_loss": -25.183012008666992, "global_step": 286838, "epoch": 3455} {"train_loss": -25.253986358642578, "global_step": 286839, "epoch": 3455} {"train_loss": -25.57725715637207, "global_step": 286840, "epoch": 3455} {"train_loss": -25.583765029907227, "global_step": 286841, "epoch": 3455} {"train_loss": -25.265979766845703, "global_step": 286842, "epoch": 3455} {"train_loss": -25.519678115844727, "global_step": 286843, "epoch": 3455} {"train_loss": -25.354597091674805, "global_step": 286844, "epoch": 3455} {"train_loss": -25.2490234375, "global_step": 286845, "epoch": 3455} {"train_loss": -25.48784828186035, "global_step": 286846, "epoch": 3455} {"train_loss": -25.248267277177558, "global_step": 286847, "epoch": 3455, "val_loss": 6994937.0} {"train_loss": -25.510610580444336, "global_step": 286848, "epoch": 3456} {"train_loss": -25.053829193115234, "global_step": 286849, "epoch": 3456} {"train_loss": -25.11496353149414, "global_step": 286850, "epoch": 3456} {"train_loss": -24.907855987548828, "global_step": 286851, "epoch": 3456} {"train_loss": -25.65447998046875, "global_step": 286852, "epoch": 3456} {"train_loss": -25.248703002929688, "global_step": 286853, "epoch": 3456} {"train_loss": -25.296823501586914, "global_step": 286854, "epoch": 3456} {"train_loss": -25.379621505737305, "global_step": 286855, "epoch": 3456} {"train_loss": -25.029638290405273, "global_step": 286856, "epoch": 3456} {"train_loss": -25.383092880249023, "global_step": 286857, "epoch": 3456} {"train_loss": -25.234865188598633, "global_step": 286858, "epoch": 3456} {"train_loss": -24.975679397583008, "global_step": 286859, "epoch": 3456} {"train_loss": -25.157997131347656, "global_step": 286860, "epoch": 3456} {"train_loss": -25.895776748657227, "global_step": 286861, "epoch": 3456} {"train_loss": -25.246883392333984, "global_step": 286862, "epoch": 3456} {"train_loss": -25.343111038208008, "global_step": 286863, "epoch": 3456} {"train_loss": -25.183786392211914, "global_step": 286864, "epoch": 3456} {"train_loss": -25.60479736328125, "global_step": 286865, "epoch": 3456} {"train_loss": -25.393125534057617, "global_step": 286866, "epoch": 3456} {"train_loss": -25.526729583740234, "global_step": 286867, "epoch": 3456} {"train_loss": -25.458099365234375, "global_step": 286868, "epoch": 3456} {"train_loss": -25.405227661132812, "global_step": 286869, "epoch": 3456} {"train_loss": -25.392995834350586, "global_step": 286870, "epoch": 3456} {"train_loss": -24.937965393066406, "global_step": 286871, "epoch": 3456} {"train_loss": -25.31977653503418, "global_step": 286872, "epoch": 3456} {"train_loss": -25.5990047454834, "global_step": 286873, "epoch": 3456} {"train_loss": -25.935827255249023, "global_step": 286874, "epoch": 3456} {"train_loss": -25.22754669189453, "global_step": 286875, "epoch": 3456} {"train_loss": -25.652286529541016, "global_step": 286876, "epoch": 3456} {"train_loss": -25.570035934448242, "global_step": 286877, "epoch": 3456} {"train_loss": -25.73285484313965, "global_step": 286878, "epoch": 3456} {"train_loss": -25.380756378173828, "global_step": 286879, "epoch": 3456} {"train_loss": -25.526287078857422, "global_step": 286880, "epoch": 3456} {"train_loss": -25.3083438873291, "global_step": 286881, "epoch": 3456} {"train_loss": -25.628036499023438, "global_step": 286882, "epoch": 3456} {"train_loss": -25.515592575073242, "global_step": 286883, "epoch": 3456} {"train_loss": -25.50359535217285, "global_step": 286884, "epoch": 3456} {"train_loss": -25.40630531311035, "global_step": 286885, "epoch": 3456} {"train_loss": -25.940387725830078, "global_step": 286886, "epoch": 3456} {"train_loss": -25.45204734802246, "global_step": 286887, "epoch": 3456} {"train_loss": -25.30610466003418, "global_step": 286888, "epoch": 3456} {"train_loss": -25.487035751342773, "global_step": 286889, "epoch": 3456} {"train_loss": -25.382736206054688, "global_step": 286890, "epoch": 3456} {"train_loss": -25.74452018737793, "global_step": 286891, "epoch": 3456} {"train_loss": -25.32692527770996, "global_step": 286892, "epoch": 3456} {"train_loss": -25.412729263305664, "global_step": 286893, "epoch": 3456} {"train_loss": -25.475168228149414, "global_step": 286894, "epoch": 3456} {"train_loss": -25.47023582458496, "global_step": 286895, "epoch": 3456} {"train_loss": -25.731536865234375, "global_step": 286896, "epoch": 3456} {"train_loss": -25.684553146362305, "global_step": 286897, "epoch": 3456} {"train_loss": -25.824569702148438, "global_step": 286898, "epoch": 3456} {"train_loss": -25.792449951171875, "global_step": 286899, "epoch": 3456} {"train_loss": -25.631549835205078, "global_step": 286900, "epoch": 3456} {"train_loss": -25.855239868164062, "global_step": 286901, "epoch": 3456} {"train_loss": -25.266437530517578, "global_step": 286902, "epoch": 3456} {"train_loss": -25.710752487182617, "global_step": 286903, "epoch": 3456} {"train_loss": -25.46736717224121, "global_step": 286904, "epoch": 3456} {"train_loss": -25.653095245361328, "global_step": 286905, "epoch": 3456} {"train_loss": -25.481210708618164, "global_step": 286906, "epoch": 3456} {"train_loss": -25.522851943969727, "global_step": 286907, "epoch": 3456} {"train_loss": -25.593189239501953, "global_step": 286908, "epoch": 3456} {"train_loss": -25.6153621673584, "global_step": 286909, "epoch": 3456} {"train_loss": -25.222848892211914, "global_step": 286910, "epoch": 3456} {"train_loss": -25.783172607421875, "global_step": 286911, "epoch": 3456} {"train_loss": -25.773117065429688, "global_step": 286912, "epoch": 3456} {"train_loss": -25.811100006103516, "global_step": 286913, "epoch": 3456} {"train_loss": -25.738422393798828, "global_step": 286914, "epoch": 3456} {"train_loss": -25.1005916595459, "global_step": 286915, "epoch": 3456} {"train_loss": -25.307193756103516, "global_step": 286916, "epoch": 3456} {"train_loss": -25.04609489440918, "global_step": 286917, "epoch": 3456} {"train_loss": -25.138086318969727, "global_step": 286918, "epoch": 3456} {"train_loss": -25.642179489135742, "global_step": 286919, "epoch": 3456} {"train_loss": -25.601959228515625, "global_step": 286920, "epoch": 3456} {"train_loss": -25.620651245117188, "global_step": 286921, "epoch": 3456} {"train_loss": -25.72466468811035, "global_step": 286922, "epoch": 3456} {"train_loss": -25.24361228942871, "global_step": 286923, "epoch": 3456} {"train_loss": -25.32836151123047, "global_step": 286924, "epoch": 3456} {"train_loss": -25.709226608276367, "global_step": 286925, "epoch": 3456} {"train_loss": -25.609100341796875, "global_step": 286926, "epoch": 3456} {"train_loss": -25.400541305541992, "global_step": 286927, "epoch": 3456} {"train_loss": -25.579763412475586, "global_step": 286928, "epoch": 3456} {"train_loss": -25.36798095703125, "global_step": 286929, "epoch": 3456} {"train_loss": -25.48890037996223, "global_step": 286930, "epoch": 3456, "val_loss": 7029444.0} {"train_loss": -25.248056411743164, "global_step": 286931, "epoch": 3457} {"train_loss": -25.1815242767334, "global_step": 286932, "epoch": 3457} {"train_loss": -24.583438873291016, "global_step": 286933, "epoch": 3457} {"train_loss": -25.18146324157715, "global_step": 286934, "epoch": 3457} {"train_loss": -25.352819442749023, "global_step": 286935, "epoch": 3457} {"train_loss": -25.05976676940918, "global_step": 286936, "epoch": 3457} {"train_loss": -25.31540870666504, "global_step": 286937, "epoch": 3457} {"train_loss": -24.884113311767578, "global_step": 286938, "epoch": 3457} {"train_loss": -25.1143856048584, "global_step": 286939, "epoch": 3457} {"train_loss": -25.36639976501465, "global_step": 286940, "epoch": 3457} {"train_loss": -25.32962417602539, "global_step": 286941, "epoch": 3457} {"train_loss": -25.07423210144043, "global_step": 286942, "epoch": 3457} {"train_loss": -25.1854190826416, "global_step": 286943, "epoch": 3457} {"train_loss": -25.040781021118164, "global_step": 286944, "epoch": 3457} {"train_loss": -25.3444881439209, "global_step": 286945, "epoch": 3457} {"train_loss": -25.622543334960938, "global_step": 286946, "epoch": 3457} {"train_loss": -25.29068946838379, "global_step": 286947, "epoch": 3457} {"train_loss": -25.284366607666016, "global_step": 286948, "epoch": 3457} {"train_loss": -25.457487106323242, "global_step": 286949, "epoch": 3457} {"train_loss": -25.503049850463867, "global_step": 286950, "epoch": 3457} {"train_loss": -25.458642959594727, "global_step": 286951, "epoch": 3457} {"train_loss": -25.22394561767578, "global_step": 286952, "epoch": 3457} {"train_loss": -25.68519401550293, "global_step": 286953, "epoch": 3457} {"train_loss": -25.531999588012695, "global_step": 286954, "epoch": 3457} {"train_loss": -25.735754013061523, "global_step": 286955, "epoch": 3457} {"train_loss": -24.9702091217041, "global_step": 286956, "epoch": 3457} {"train_loss": -25.772932052612305, "global_step": 286957, "epoch": 3457} {"train_loss": -25.552831649780273, "global_step": 286958, "epoch": 3457} {"train_loss": -25.484952926635742, "global_step": 286959, "epoch": 3457} {"train_loss": -25.7365779876709, "global_step": 286960, "epoch": 3457} {"train_loss": -25.946561813354492, "global_step": 286961, "epoch": 3457} {"train_loss": -25.323598861694336, "global_step": 286962, "epoch": 3457} {"train_loss": -26.115447998046875, "global_step": 286963, "epoch": 3457} {"train_loss": -25.445405960083008, "global_step": 286964, "epoch": 3457} {"train_loss": -25.482755661010742, "global_step": 286965, "epoch": 3457} {"train_loss": -25.81463623046875, "global_step": 286966, "epoch": 3457} {"train_loss": -25.650846481323242, "global_step": 286967, "epoch": 3457} {"train_loss": -25.3140869140625, "global_step": 286968, "epoch": 3457} {"train_loss": -25.297897338867188, "global_step": 286969, "epoch": 3457} {"train_loss": -25.678882598876953, "global_step": 286970, "epoch": 3457} {"train_loss": -25.608478546142578, "global_step": 286971, "epoch": 3457} {"train_loss": -25.68821144104004, "global_step": 286972, "epoch": 3457} {"train_loss": -25.371618270874023, "global_step": 286973, "epoch": 3457} {"train_loss": -25.13490867614746, "global_step": 286974, "epoch": 3457} {"train_loss": -24.76177406311035, "global_step": 286975, "epoch": 3457} {"train_loss": -25.392000198364258, "global_step": 286976, "epoch": 3457} {"train_loss": -25.04366683959961, "global_step": 286977, "epoch": 3457} {"train_loss": -25.3901309967041, "global_step": 286978, "epoch": 3457} {"train_loss": -25.020614624023438, "global_step": 286979, "epoch": 3457} {"train_loss": -25.517480850219727, "global_step": 286980, "epoch": 3457} {"train_loss": -25.380023956298828, "global_step": 286981, "epoch": 3457} {"train_loss": -25.463476181030273, "global_step": 286982, "epoch": 3457} {"train_loss": -25.1787166595459, "global_step": 286983, "epoch": 3457} {"train_loss": -25.186649322509766, "global_step": 286984, "epoch": 3457} {"train_loss": -25.4814510345459, "global_step": 286985, "epoch": 3457} {"train_loss": -25.23130226135254, "global_step": 286986, "epoch": 3457} {"train_loss": -25.469511032104492, "global_step": 286987, "epoch": 3457} {"train_loss": -25.405956268310547, "global_step": 286988, "epoch": 3457} {"train_loss": -25.200407028198242, "global_step": 286989, "epoch": 3457} {"train_loss": -25.2081241607666, "global_step": 286990, "epoch": 3457} {"train_loss": -25.762866973876953, "global_step": 286991, "epoch": 3457} {"train_loss": -25.023950576782227, "global_step": 286992, "epoch": 3457} {"train_loss": -24.803312301635742, "global_step": 286993, "epoch": 3457} {"train_loss": -24.9688663482666, "global_step": 286994, "epoch": 3457} {"train_loss": -24.94333267211914, "global_step": 286995, "epoch": 3457} {"train_loss": -25.84661293029785, "global_step": 286996, "epoch": 3457} {"train_loss": -25.242738723754883, "global_step": 286997, "epoch": 3457} {"train_loss": -25.421632766723633, "global_step": 286998, "epoch": 3457} {"train_loss": -25.640371322631836, "global_step": 286999, "epoch": 3457} {"train_loss": -25.586563110351562, "global_step": 287000, "epoch": 3457} {"train_loss": -25.136777877807617, "global_step": 287001, "epoch": 3457} {"train_loss": -25.742156982421875, "global_step": 287002, "epoch": 3457} {"train_loss": -25.49263572692871, "global_step": 287003, "epoch": 3457} {"train_loss": -25.330312728881836, "global_step": 287004, "epoch": 3457} {"train_loss": -25.60934829711914, "global_step": 287005, "epoch": 3457} {"train_loss": -25.31576919555664, "global_step": 287006, "epoch": 3457} {"train_loss": -25.241575241088867, "global_step": 287007, "epoch": 3457} {"train_loss": -25.614282608032227, "global_step": 287008, "epoch": 3457} {"train_loss": -25.288833618164062, "global_step": 287009, "epoch": 3457} {"train_loss": -25.528121948242188, "global_step": 287010, "epoch": 3457} {"train_loss": -25.900190353393555, "global_step": 287011, "epoch": 3457} {"train_loss": -25.14175796508789, "global_step": 287012, "epoch": 3457} {"train_loss": -25.39319564635495, "global_step": 287013, "epoch": 3457, "val_loss": 7051692.0} {"train_loss": -25.158288955688477, "global_step": 287014, "epoch": 3458} {"train_loss": -25.406511306762695, "global_step": 287015, "epoch": 3458} {"train_loss": -25.687360763549805, "global_step": 287016, "epoch": 3458} {"train_loss": -25.350793838500977, "global_step": 287017, "epoch": 3458} {"train_loss": -25.51252555847168, "global_step": 287018, "epoch": 3458} {"train_loss": -25.77768898010254, "global_step": 287019, "epoch": 3458} {"train_loss": -25.637409210205078, "global_step": 287020, "epoch": 3458} {"train_loss": -25.532745361328125, "global_step": 287021, "epoch": 3458} {"train_loss": -25.10162925720215, "global_step": 287022, "epoch": 3458} {"train_loss": -25.31589698791504, "global_step": 287023, "epoch": 3458} {"train_loss": -25.49115562438965, "global_step": 287024, "epoch": 3458} {"train_loss": -25.49349021911621, "global_step": 287025, "epoch": 3458} {"train_loss": -25.544918060302734, "global_step": 287026, "epoch": 3458} {"train_loss": -25.402450561523438, "global_step": 287027, "epoch": 3458} {"train_loss": -25.464523315429688, "global_step": 287028, "epoch": 3458} {"train_loss": -25.7851505279541, "global_step": 287029, "epoch": 3458} {"train_loss": -25.584875106811523, "global_step": 287030, "epoch": 3458} {"train_loss": -25.370487213134766, "global_step": 287031, "epoch": 3458} {"train_loss": -25.799640655517578, "global_step": 287032, "epoch": 3458} {"train_loss": -25.360219955444336, "global_step": 287033, "epoch": 3458} {"train_loss": -25.291717529296875, "global_step": 287034, "epoch": 3458} {"train_loss": -25.35289192199707, "global_step": 287035, "epoch": 3458} {"train_loss": -25.683881759643555, "global_step": 287036, "epoch": 3458} {"train_loss": -25.778156280517578, "global_step": 287037, "epoch": 3458} {"train_loss": -25.5101261138916, "global_step": 287038, "epoch": 3458} {"train_loss": -25.561885833740234, "global_step": 287039, "epoch": 3458} {"train_loss": -25.533918380737305, "global_step": 287040, "epoch": 3458} {"train_loss": -25.699295043945312, "global_step": 287041, "epoch": 3458} {"train_loss": -25.230300903320312, "global_step": 287042, "epoch": 3458} {"train_loss": -25.79336929321289, "global_step": 287043, "epoch": 3458} {"train_loss": -25.55671501159668, "global_step": 287044, "epoch": 3458} {"train_loss": -25.503040313720703, "global_step": 287045, "epoch": 3458} {"train_loss": -25.61052894592285, "global_step": 287046, "epoch": 3458} {"train_loss": -25.768848419189453, "global_step": 287047, "epoch": 3458} {"train_loss": -25.821338653564453, "global_step": 287048, "epoch": 3458} {"train_loss": -25.683927536010742, "global_step": 287049, "epoch": 3458} {"train_loss": -25.571569442749023, "global_step": 287050, "epoch": 3458} {"train_loss": -25.513565063476562, "global_step": 287051, "epoch": 3458} {"train_loss": -25.82282829284668, "global_step": 287052, "epoch": 3458} {"train_loss": -25.626972198486328, "global_step": 287053, "epoch": 3458} {"train_loss": -25.248807907104492, "global_step": 287054, "epoch": 3458} {"train_loss": -25.56098747253418, "global_step": 287055, "epoch": 3458} {"train_loss": -25.641071319580078, "global_step": 287056, "epoch": 3458} {"train_loss": -25.872943878173828, "global_step": 287057, "epoch": 3458} {"train_loss": -25.707839965820312, "global_step": 287058, "epoch": 3458} {"train_loss": -25.636463165283203, "global_step": 287059, "epoch": 3458} {"train_loss": -25.665302276611328, "global_step": 287060, "epoch": 3458} {"train_loss": -25.80525016784668, "global_step": 287061, "epoch": 3458} {"train_loss": -25.540822982788086, "global_step": 287062, "epoch": 3458} {"train_loss": -25.658527374267578, "global_step": 287063, "epoch": 3458} {"train_loss": -25.325796127319336, "global_step": 287064, "epoch": 3458} {"train_loss": -25.561452865600586, "global_step": 287065, "epoch": 3458} {"train_loss": -25.6997013092041, "global_step": 287066, "epoch": 3458} {"train_loss": -25.92066764831543, "global_step": 287067, "epoch": 3458} {"train_loss": -25.189159393310547, "global_step": 287068, "epoch": 3458} {"train_loss": -24.700546264648438, "global_step": 287069, "epoch": 3458} {"train_loss": -24.972864151000977, "global_step": 287070, "epoch": 3458} {"train_loss": -24.56406593322754, "global_step": 287071, "epoch": 3458} {"train_loss": -24.90536880493164, "global_step": 287072, "epoch": 3458} {"train_loss": -25.42201805114746, "global_step": 287073, "epoch": 3458} {"train_loss": -25.184247970581055, "global_step": 287074, "epoch": 3458} {"train_loss": -25.051101684570312, "global_step": 287075, "epoch": 3458} {"train_loss": -25.104156494140625, "global_step": 287076, "epoch": 3458} {"train_loss": -25.306156158447266, "global_step": 287077, "epoch": 3458} {"train_loss": -25.42852783203125, "global_step": 287078, "epoch": 3458} {"train_loss": -24.993757247924805, "global_step": 287079, "epoch": 3458} {"train_loss": -25.583555221557617, "global_step": 287080, "epoch": 3458} {"train_loss": -25.4129638671875, "global_step": 287081, "epoch": 3458} {"train_loss": -25.7705135345459, "global_step": 287082, "epoch": 3458} {"train_loss": -25.663360595703125, "global_step": 287083, "epoch": 3458} {"train_loss": -25.70448112487793, "global_step": 287084, "epoch": 3458} {"train_loss": -25.034564971923828, "global_step": 287085, "epoch": 3458} {"train_loss": -25.49857521057129, "global_step": 287086, "epoch": 3458} {"train_loss": -25.902008056640625, "global_step": 287087, "epoch": 3458} {"train_loss": -25.658788681030273, "global_step": 287088, "epoch": 3458} {"train_loss": -25.37399673461914, "global_step": 287089, "epoch": 3458} {"train_loss": -25.643518447875977, "global_step": 287090, "epoch": 3458} {"train_loss": -25.26397132873535, "global_step": 287091, "epoch": 3458} {"train_loss": -25.716840744018555, "global_step": 287092, "epoch": 3458} {"train_loss": -25.432682037353516, "global_step": 287093, "epoch": 3458} {"train_loss": -25.299177169799805, "global_step": 287094, "epoch": 3458} {"train_loss": -25.399765014648438, "global_step": 287095, "epoch": 3458} {"train_loss": -25.48772414333849, "global_step": 287096, "epoch": 3458, "val_loss": 7016703.5} {"train_loss": -25.468765258789062, "global_step": 287097, "epoch": 3459} {"train_loss": -25.0310001373291, "global_step": 287098, "epoch": 3459} {"train_loss": -24.739736557006836, "global_step": 287099, "epoch": 3459} {"train_loss": -25.404630661010742, "global_step": 287100, "epoch": 3459} {"train_loss": -25.104196548461914, "global_step": 287101, "epoch": 3459} {"train_loss": -24.789609909057617, "global_step": 287102, "epoch": 3459} {"train_loss": -24.629690170288086, "global_step": 287103, "epoch": 3459} {"train_loss": -25.32354736328125, "global_step": 287104, "epoch": 3459} {"train_loss": -25.240591049194336, "global_step": 287105, "epoch": 3459} {"train_loss": -25.121850967407227, "global_step": 287106, "epoch": 3459} {"train_loss": -25.101789474487305, "global_step": 287107, "epoch": 3459} {"train_loss": -25.199188232421875, "global_step": 287108, "epoch": 3459} {"train_loss": -25.150348663330078, "global_step": 287109, "epoch": 3459} {"train_loss": -25.20906639099121, "global_step": 287110, "epoch": 3459} {"train_loss": -25.59773063659668, "global_step": 287111, "epoch": 3459} {"train_loss": -25.155214309692383, "global_step": 287112, "epoch": 3459} {"train_loss": -25.167455673217773, "global_step": 287113, "epoch": 3459} {"train_loss": -25.217626571655273, "global_step": 287114, "epoch": 3459} {"train_loss": -25.269535064697266, "global_step": 287115, "epoch": 3459} {"train_loss": -25.143213272094727, "global_step": 287116, "epoch": 3459} {"train_loss": -25.24651527404785, "global_step": 287117, "epoch": 3459} {"train_loss": -25.344083786010742, "global_step": 287118, "epoch": 3459} {"train_loss": -25.116241455078125, "global_step": 287119, "epoch": 3459} {"train_loss": -25.3980655670166, "global_step": 287120, "epoch": 3459} {"train_loss": -25.46919059753418, "global_step": 287121, "epoch": 3459} {"train_loss": -25.204790115356445, "global_step": 287122, "epoch": 3459} {"train_loss": -25.480960845947266, "global_step": 287123, "epoch": 3459} {"train_loss": -25.492666244506836, "global_step": 287124, "epoch": 3459} {"train_loss": -25.549726486206055, "global_step": 287125, "epoch": 3459} {"train_loss": -25.21730613708496, "global_step": 287126, "epoch": 3459} {"train_loss": -25.614398956298828, "global_step": 287127, "epoch": 3459} {"train_loss": -25.6592960357666, "global_step": 287128, "epoch": 3459} {"train_loss": -25.7158260345459, "global_step": 287129, "epoch": 3459} {"train_loss": -25.600873947143555, "global_step": 287130, "epoch": 3459} {"train_loss": -25.590383529663086, "global_step": 287131, "epoch": 3459} {"train_loss": -25.574735641479492, "global_step": 287132, "epoch": 3459} {"train_loss": -25.460145950317383, "global_step": 287133, "epoch": 3459} {"train_loss": -25.763324737548828, "global_step": 287134, "epoch": 3459} {"train_loss": -25.56671714782715, "global_step": 287135, "epoch": 3459} {"train_loss": -25.52982521057129, "global_step": 287136, "epoch": 3459} {"train_loss": -25.263980865478516, "global_step": 287137, "epoch": 3459} {"train_loss": -25.447914123535156, "global_step": 287138, "epoch": 3459} {"train_loss": -25.87613868713379, "global_step": 287139, "epoch": 3459} {"train_loss": -25.60711097717285, "global_step": 287140, "epoch": 3459} {"train_loss": -25.578916549682617, "global_step": 287141, "epoch": 3459} {"train_loss": -25.480459213256836, "global_step": 287142, "epoch": 3459} {"train_loss": -25.943693161010742, "global_step": 287143, "epoch": 3459} {"train_loss": -25.493200302124023, "global_step": 287144, "epoch": 3459} {"train_loss": -25.832509994506836, "global_step": 287145, "epoch": 3459} {"train_loss": -25.492721557617188, "global_step": 287146, "epoch": 3459} {"train_loss": -25.730484008789062, "global_step": 287147, "epoch": 3459} {"train_loss": -25.217357635498047, "global_step": 287148, "epoch": 3459} {"train_loss": -25.350799560546875, "global_step": 287149, "epoch": 3459} {"train_loss": -25.34661865234375, "global_step": 287150, "epoch": 3459} {"train_loss": -24.71047019958496, "global_step": 287151, "epoch": 3459} {"train_loss": -24.998016357421875, "global_step": 287152, "epoch": 3459} {"train_loss": -24.96338653564453, "global_step": 287153, "epoch": 3459} {"train_loss": -25.359220504760742, "global_step": 287154, "epoch": 3459} {"train_loss": -24.84307861328125, "global_step": 287155, "epoch": 3459} {"train_loss": -24.487205505371094, "global_step": 287156, "epoch": 3459} {"train_loss": -25.381284713745117, "global_step": 287157, "epoch": 3459} {"train_loss": -24.598094940185547, "global_step": 287158, "epoch": 3459} {"train_loss": -25.026594161987305, "global_step": 287159, "epoch": 3459} {"train_loss": -25.373003005981445, "global_step": 287160, "epoch": 3459} {"train_loss": -25.3293514251709, "global_step": 287161, "epoch": 3459} {"train_loss": -25.443073272705078, "global_step": 287162, "epoch": 3459} {"train_loss": -24.98749542236328, "global_step": 287163, "epoch": 3459} {"train_loss": -25.088003158569336, "global_step": 287164, "epoch": 3459} {"train_loss": -25.43647575378418, "global_step": 287165, "epoch": 3459} {"train_loss": -25.153417587280273, "global_step": 287166, "epoch": 3459} {"train_loss": -25.141159057617188, "global_step": 287167, "epoch": 3459} {"train_loss": -25.603824615478516, "global_step": 287168, "epoch": 3459} {"train_loss": -25.57221031188965, "global_step": 287169, "epoch": 3459} {"train_loss": -24.997243881225586, "global_step": 287170, "epoch": 3459} {"train_loss": -25.29071044921875, "global_step": 287171, "epoch": 3459} {"train_loss": -25.215166091918945, "global_step": 287172, "epoch": 3459} {"train_loss": -25.642492294311523, "global_step": 287173, "epoch": 3459} {"train_loss": -25.45489501953125, "global_step": 287174, "epoch": 3459} {"train_loss": -25.466272354125977, "global_step": 287175, "epoch": 3459} {"train_loss": -25.086702346801758, "global_step": 287176, "epoch": 3459} {"train_loss": -25.691198348999023, "global_step": 287177, "epoch": 3459} {"train_loss": -25.58077049255371, "global_step": 287178, "epoch": 3459} {"train_loss": -25.316141726022742, "global_step": 287179, "epoch": 3459, "val_loss": 7123519.0} {"train_loss": -25.397083282470703, "global_step": 287180, "epoch": 3460} {"train_loss": -24.81056785583496, "global_step": 287181, "epoch": 3460} {"train_loss": -25.236459732055664, "global_step": 287182, "epoch": 3460} {"train_loss": -25.07073402404785, "global_step": 287183, "epoch": 3460} {"train_loss": -25.172256469726562, "global_step": 287184, "epoch": 3460} {"train_loss": -24.70163917541504, "global_step": 287185, "epoch": 3460} {"train_loss": -25.526884078979492, "global_step": 287186, "epoch": 3460} {"train_loss": -25.21027183532715, "global_step": 287187, "epoch": 3460} {"train_loss": -25.042543411254883, "global_step": 287188, "epoch": 3460} {"train_loss": -25.341114044189453, "global_step": 287189, "epoch": 3460} {"train_loss": -25.57419776916504, "global_step": 287190, "epoch": 3460} {"train_loss": -25.188146591186523, "global_step": 287191, "epoch": 3460} {"train_loss": -25.235624313354492, "global_step": 287192, "epoch": 3460} {"train_loss": -25.30843162536621, "global_step": 287193, "epoch": 3460} {"train_loss": -25.365766525268555, "global_step": 287194, "epoch": 3460} {"train_loss": -25.211681365966797, "global_step": 287195, "epoch": 3460} {"train_loss": -25.539819717407227, "global_step": 287196, "epoch": 3460} {"train_loss": -25.098276138305664, "global_step": 287197, "epoch": 3460} {"train_loss": -25.494539260864258, "global_step": 287198, "epoch": 3460} {"train_loss": -25.435400009155273, "global_step": 287199, "epoch": 3460} {"train_loss": -25.475160598754883, "global_step": 287200, "epoch": 3460} {"train_loss": -25.683502197265625, "global_step": 287201, "epoch": 3460} {"train_loss": -25.369029998779297, "global_step": 287202, "epoch": 3460} {"train_loss": -25.42786979675293, "global_step": 287203, "epoch": 3460} {"train_loss": -25.7174015045166, "global_step": 287204, "epoch": 3460} {"train_loss": -25.35953712463379, "global_step": 287205, "epoch": 3460} {"train_loss": -25.650440216064453, "global_step": 287206, "epoch": 3460} {"train_loss": -25.3812198638916, "global_step": 287207, "epoch": 3460} {"train_loss": -25.48166275024414, "global_step": 287208, "epoch": 3460} {"train_loss": -25.70722007751465, "global_step": 287209, "epoch": 3460} {"train_loss": -25.351722717285156, "global_step": 287210, "epoch": 3460} {"train_loss": -25.6488094329834, "global_step": 287211, "epoch": 3460} {"train_loss": -25.442453384399414, "global_step": 287212, "epoch": 3460} {"train_loss": -25.7373104095459, "global_step": 287213, "epoch": 3460} {"train_loss": -25.686498641967773, "global_step": 287214, "epoch": 3460} {"train_loss": -25.620763778686523, "global_step": 287215, "epoch": 3460} {"train_loss": -25.55849266052246, "global_step": 287216, "epoch": 3460} {"train_loss": -25.697965621948242, "global_step": 287217, "epoch": 3460} {"train_loss": -25.277088165283203, "global_step": 287218, "epoch": 3460} {"train_loss": -25.920764923095703, "global_step": 287219, "epoch": 3460} {"train_loss": -25.38349723815918, "global_step": 287220, "epoch": 3460} {"train_loss": -25.436115264892578, "global_step": 287221, "epoch": 3460} {"train_loss": -25.509933471679688, "global_step": 287222, "epoch": 3460} {"train_loss": -25.45723533630371, "global_step": 287223, "epoch": 3460} {"train_loss": -25.46701431274414, "global_step": 287224, "epoch": 3460} {"train_loss": -25.811513900756836, "global_step": 287225, "epoch": 3460} {"train_loss": -25.167203903198242, "global_step": 287226, "epoch": 3460} {"train_loss": -25.098342895507812, "global_step": 287227, "epoch": 3460} {"train_loss": -25.06377601623535, "global_step": 287228, "epoch": 3460} {"train_loss": -25.389074325561523, "global_step": 287229, "epoch": 3460} {"train_loss": -25.49187660217285, "global_step": 287230, "epoch": 3460} {"train_loss": -25.08064079284668, "global_step": 287231, "epoch": 3460} {"train_loss": -24.98362922668457, "global_step": 287232, "epoch": 3460} {"train_loss": -25.6125431060791, "global_step": 287233, "epoch": 3460} {"train_loss": -25.776060104370117, "global_step": 287234, "epoch": 3460} {"train_loss": -25.388586044311523, "global_step": 287235, "epoch": 3460} {"train_loss": -25.31812286376953, "global_step": 287236, "epoch": 3460} {"train_loss": -25.262304306030273, "global_step": 287237, "epoch": 3460} {"train_loss": -25.438608169555664, "global_step": 287238, "epoch": 3460} {"train_loss": -25.380849838256836, "global_step": 287239, "epoch": 3460} {"train_loss": -25.18718719482422, "global_step": 287240, "epoch": 3460} {"train_loss": -25.603927612304688, "global_step": 287241, "epoch": 3460} {"train_loss": -25.19405746459961, "global_step": 287242, "epoch": 3460} {"train_loss": -25.352773666381836, "global_step": 287243, "epoch": 3460} {"train_loss": -25.73724937438965, "global_step": 287244, "epoch": 3460} {"train_loss": -25.53327751159668, "global_step": 287245, "epoch": 3460} {"train_loss": -25.886682510375977, "global_step": 287246, "epoch": 3460} {"train_loss": -25.506689071655273, "global_step": 287247, "epoch": 3460} {"train_loss": -25.472734451293945, "global_step": 287248, "epoch": 3460} {"train_loss": -25.7568359375, "global_step": 287249, "epoch": 3460} {"train_loss": -25.523630142211914, "global_step": 287250, "epoch": 3460} {"train_loss": -25.683088302612305, "global_step": 287251, "epoch": 3460} {"train_loss": -25.563833236694336, "global_step": 287252, "epoch": 3460} {"train_loss": -25.5258846282959, "global_step": 287253, "epoch": 3460} {"train_loss": -25.499601364135742, "global_step": 287254, "epoch": 3460} {"train_loss": -25.365081787109375, "global_step": 287255, "epoch": 3460} {"train_loss": -25.546701431274414, "global_step": 287256, "epoch": 3460} {"train_loss": -25.700244903564453, "global_step": 287257, "epoch": 3460} {"train_loss": -26.093969345092773, "global_step": 287258, "epoch": 3460} {"train_loss": -25.908170700073242, "global_step": 287259, "epoch": 3460} {"train_loss": -25.240097045898438, "global_step": 287260, "epoch": 3460} {"train_loss": -25.522096633911133, "global_step": 287261, "epoch": 3460} {"train_loss": -25.434162070952265, "global_step": 287262, "epoch": 3460, "val_loss": 7024974.0} {"train_loss": -25.407682418823242, "global_step": 287263, "epoch": 3461} {"train_loss": -24.813539505004883, "global_step": 287264, "epoch": 3461} {"train_loss": -25.278690338134766, "global_step": 287265, "epoch": 3461} {"train_loss": -25.202775955200195, "global_step": 287266, "epoch": 3461} {"train_loss": -25.32533836364746, "global_step": 287267, "epoch": 3461} {"train_loss": -25.294279098510742, "global_step": 287268, "epoch": 3461} {"train_loss": -24.998130798339844, "global_step": 287269, "epoch": 3461} {"train_loss": -25.088857650756836, "global_step": 287270, "epoch": 3461} {"train_loss": -25.194171905517578, "global_step": 287271, "epoch": 3461} {"train_loss": -24.889150619506836, "global_step": 287272, "epoch": 3461} {"train_loss": -25.073657989501953, "global_step": 287273, "epoch": 3461} {"train_loss": -25.503787994384766, "global_step": 287274, "epoch": 3461} {"train_loss": -25.27947998046875, "global_step": 287275, "epoch": 3461} {"train_loss": -25.3787841796875, "global_step": 287276, "epoch": 3461} {"train_loss": -25.367841720581055, "global_step": 287277, "epoch": 3461} {"train_loss": -25.53814125061035, "global_step": 287278, "epoch": 3461} {"train_loss": -24.967426300048828, "global_step": 287279, "epoch": 3461} {"train_loss": -25.406848907470703, "global_step": 287280, "epoch": 3461} {"train_loss": -25.39790916442871, "global_step": 287281, "epoch": 3461} {"train_loss": -25.411285400390625, "global_step": 287282, "epoch": 3461} {"train_loss": -25.480396270751953, "global_step": 287283, "epoch": 3461} {"train_loss": -25.57021141052246, "global_step": 287284, "epoch": 3461} {"train_loss": -25.199207305908203, "global_step": 287285, "epoch": 3461} {"train_loss": -24.887054443359375, "global_step": 287286, "epoch": 3461} {"train_loss": -25.412845611572266, "global_step": 287287, "epoch": 3461} {"train_loss": -25.31969451904297, "global_step": 287288, "epoch": 3461} {"train_loss": -25.09444808959961, "global_step": 287289, "epoch": 3461} {"train_loss": -25.76849365234375, "global_step": 287290, "epoch": 3461} {"train_loss": -25.345827102661133, "global_step": 287291, "epoch": 3461} {"train_loss": -25.505239486694336, "global_step": 287292, "epoch": 3461} {"train_loss": -25.321331024169922, "global_step": 287293, "epoch": 3461} {"train_loss": -25.778039932250977, "global_step": 287294, "epoch": 3461} {"train_loss": -25.499324798583984, "global_step": 287295, "epoch": 3461} {"train_loss": -25.6320743560791, "global_step": 287296, "epoch": 3461} {"train_loss": -25.414396286010742, "global_step": 287297, "epoch": 3461} {"train_loss": -25.414161682128906, "global_step": 287298, "epoch": 3461} {"train_loss": -25.621631622314453, "global_step": 287299, "epoch": 3461} {"train_loss": -25.578659057617188, "global_step": 287300, "epoch": 3461} {"train_loss": -25.9871768951416, "global_step": 287301, "epoch": 3461} {"train_loss": -25.454538345336914, "global_step": 287302, "epoch": 3461} {"train_loss": -25.811660766601562, "global_step": 287303, "epoch": 3461} {"train_loss": -25.32755470275879, "global_step": 287304, "epoch": 3461} {"train_loss": -25.254606246948242, "global_step": 287305, "epoch": 3461} {"train_loss": -25.785633087158203, "global_step": 287306, "epoch": 3461} {"train_loss": -25.49757194519043, "global_step": 287307, "epoch": 3461} {"train_loss": -25.394512176513672, "global_step": 287308, "epoch": 3461} {"train_loss": -25.523542404174805, "global_step": 287309, "epoch": 3461} {"train_loss": -25.246103286743164, "global_step": 287310, "epoch": 3461} {"train_loss": -25.344440460205078, "global_step": 287311, "epoch": 3461} {"train_loss": -25.526256561279297, "global_step": 287312, "epoch": 3461} {"train_loss": -25.845794677734375, "global_step": 287313, "epoch": 3461} {"train_loss": -25.60101318359375, "global_step": 287314, "epoch": 3461} {"train_loss": -25.633981704711914, "global_step": 287315, "epoch": 3461} {"train_loss": -25.417150497436523, "global_step": 287316, "epoch": 3461} {"train_loss": -25.32047462463379, "global_step": 287317, "epoch": 3461} {"train_loss": -25.573957443237305, "global_step": 287318, "epoch": 3461} {"train_loss": -25.480073928833008, "global_step": 287319, "epoch": 3461} {"train_loss": -25.882049560546875, "global_step": 287320, "epoch": 3461} {"train_loss": -25.523090362548828, "global_step": 287321, "epoch": 3461} {"train_loss": -25.717823028564453, "global_step": 287322, "epoch": 3461} {"train_loss": -25.552480697631836, "global_step": 287323, "epoch": 3461} {"train_loss": -24.852859497070312, "global_step": 287324, "epoch": 3461} {"train_loss": -24.91485595703125, "global_step": 287325, "epoch": 3461} {"train_loss": -25.41965103149414, "global_step": 287326, "epoch": 3461} {"train_loss": -25.320816040039062, "global_step": 287327, "epoch": 3461} {"train_loss": -25.280134201049805, "global_step": 287328, "epoch": 3461} {"train_loss": -25.1962890625, "global_step": 287329, "epoch": 3461} {"train_loss": -25.52518653869629, "global_step": 287330, "epoch": 3461} {"train_loss": -25.371156692504883, "global_step": 287331, "epoch": 3461} {"train_loss": -25.778549194335938, "global_step": 287332, "epoch": 3461} {"train_loss": -25.93463134765625, "global_step": 287333, "epoch": 3461} {"train_loss": -25.701202392578125, "global_step": 287334, "epoch": 3461} {"train_loss": -25.475555419921875, "global_step": 287335, "epoch": 3461} {"train_loss": -25.719892501831055, "global_step": 287336, "epoch": 3461} {"train_loss": -25.429014205932617, "global_step": 287337, "epoch": 3461} {"train_loss": -25.57586097717285, "global_step": 287338, "epoch": 3461} {"train_loss": -25.76094627380371, "global_step": 287339, "epoch": 3461} {"train_loss": -25.46381950378418, "global_step": 287340, "epoch": 3461} {"train_loss": -25.755517959594727, "global_step": 287341, "epoch": 3461} {"train_loss": -25.799097061157227, "global_step": 287342, "epoch": 3461} {"train_loss": -25.546579360961914, "global_step": 287343, "epoch": 3461} {"train_loss": -25.886682510375977, "global_step": 287344, "epoch": 3461} {"train_loss": -25.437987798667816, "global_step": 287345, "epoch": 3461, "val_loss": 7037781.0} {"train_loss": -25.08884620666504, "global_step": 287346, "epoch": 3462} {"train_loss": -24.968685150146484, "global_step": 287347, "epoch": 3462} {"train_loss": -25.68230628967285, "global_step": 287348, "epoch": 3462} {"train_loss": -25.18204689025879, "global_step": 287349, "epoch": 3462} {"train_loss": -25.502017974853516, "global_step": 287350, "epoch": 3462} {"train_loss": -25.174480438232422, "global_step": 287351, "epoch": 3462} {"train_loss": -24.946063995361328, "global_step": 287352, "epoch": 3462} {"train_loss": -25.522375106811523, "global_step": 287353, "epoch": 3462} {"train_loss": -24.975326538085938, "global_step": 287354, "epoch": 3462} {"train_loss": -25.166242599487305, "global_step": 287355, "epoch": 3462} {"train_loss": -25.436767578125, "global_step": 287356, "epoch": 3462} {"train_loss": -25.542469024658203, "global_step": 287357, "epoch": 3462} {"train_loss": -25.282367706298828, "global_step": 287358, "epoch": 3462} {"train_loss": -25.287155151367188, "global_step": 287359, "epoch": 3462} {"train_loss": -25.601736068725586, "global_step": 287360, "epoch": 3462} {"train_loss": -25.314966201782227, "global_step": 287361, "epoch": 3462} {"train_loss": -25.415283203125, "global_step": 287362, "epoch": 3462} {"train_loss": -25.395689010620117, "global_step": 287363, "epoch": 3462} {"train_loss": -25.400421142578125, "global_step": 287364, "epoch": 3462} {"train_loss": -25.529422760009766, "global_step": 287365, "epoch": 3462} {"train_loss": -25.5465145111084, "global_step": 287366, "epoch": 3462} {"train_loss": -25.590681076049805, "global_step": 287367, "epoch": 3462} {"train_loss": -25.47126007080078, "global_step": 287368, "epoch": 3462} {"train_loss": -25.599401473999023, "global_step": 287369, "epoch": 3462} {"train_loss": -25.575050354003906, "global_step": 287370, "epoch": 3462} {"train_loss": -25.552114486694336, "global_step": 287371, "epoch": 3462} {"train_loss": -25.843183517456055, "global_step": 287372, "epoch": 3462} {"train_loss": -25.456804275512695, "global_step": 287373, "epoch": 3462} {"train_loss": -26.050573348999023, "global_step": 287374, "epoch": 3462} {"train_loss": -25.717161178588867, "global_step": 287375, "epoch": 3462} {"train_loss": -25.6663875579834, "global_step": 287376, "epoch": 3462} {"train_loss": -25.646650314331055, "global_step": 287377, "epoch": 3462} {"train_loss": -25.84796714782715, "global_step": 287378, "epoch": 3462} {"train_loss": -25.694669723510742, "global_step": 287379, "epoch": 3462} {"train_loss": -26.022192001342773, "global_step": 287380, "epoch": 3462} {"train_loss": -25.52472496032715, "global_step": 287381, "epoch": 3462} {"train_loss": -25.884445190429688, "global_step": 287382, "epoch": 3462} {"train_loss": -25.967992782592773, "global_step": 287383, "epoch": 3462} {"train_loss": -25.69147300720215, "global_step": 287384, "epoch": 3462} {"train_loss": -25.52202796936035, "global_step": 287385, "epoch": 3462} {"train_loss": -25.482742309570312, "global_step": 287386, "epoch": 3462} {"train_loss": -25.243234634399414, "global_step": 287387, "epoch": 3462} {"train_loss": -25.272192001342773, "global_step": 287388, "epoch": 3462} {"train_loss": -25.17647361755371, "global_step": 287389, "epoch": 3462} {"train_loss": -25.776020050048828, "global_step": 287390, "epoch": 3462} {"train_loss": -25.03727149963379, "global_step": 287391, "epoch": 3462} {"train_loss": -25.241918563842773, "global_step": 287392, "epoch": 3462} {"train_loss": -25.46754264831543, "global_step": 287393, "epoch": 3462} {"train_loss": -25.719980239868164, "global_step": 287394, "epoch": 3462} {"train_loss": -25.462554931640625, "global_step": 287395, "epoch": 3462} {"train_loss": -25.52613639831543, "global_step": 287396, "epoch": 3462} {"train_loss": -25.966699600219727, "global_step": 287397, "epoch": 3462} {"train_loss": -25.748579025268555, "global_step": 287398, "epoch": 3462} {"train_loss": -25.51766014099121, "global_step": 287399, "epoch": 3462} {"train_loss": -25.541458129882812, "global_step": 287400, "epoch": 3462} {"train_loss": -24.878774642944336, "global_step": 287401, "epoch": 3462} {"train_loss": -25.15825653076172, "global_step": 287402, "epoch": 3462} {"train_loss": -25.11836814880371, "global_step": 287403, "epoch": 3462} {"train_loss": -25.381103515625, "global_step": 287404, "epoch": 3462} {"train_loss": -25.243635177612305, "global_step": 287405, "epoch": 3462} {"train_loss": -25.659393310546875, "global_step": 287406, "epoch": 3462} {"train_loss": -25.14168357849121, "global_step": 287407, "epoch": 3462} {"train_loss": -25.31825828552246, "global_step": 287408, "epoch": 3462} {"train_loss": -25.54064178466797, "global_step": 287409, "epoch": 3462} {"train_loss": -25.28555679321289, "global_step": 287410, "epoch": 3462} {"train_loss": -25.612781524658203, "global_step": 287411, "epoch": 3462} {"train_loss": -25.530920028686523, "global_step": 287412, "epoch": 3462} {"train_loss": -25.566823959350586, "global_step": 287413, "epoch": 3462} {"train_loss": -25.292598724365234, "global_step": 287414, "epoch": 3462} {"train_loss": -25.191076278686523, "global_step": 287415, "epoch": 3462} {"train_loss": -25.506052017211914, "global_step": 287416, "epoch": 3462} {"train_loss": -25.824848175048828, "global_step": 287417, "epoch": 3462} {"train_loss": -25.806669235229492, "global_step": 287418, "epoch": 3462} {"train_loss": -25.266725540161133, "global_step": 287419, "epoch": 3462} {"train_loss": -25.210102081298828, "global_step": 287420, "epoch": 3462} {"train_loss": -25.339820861816406, "global_step": 287421, "epoch": 3462} {"train_loss": -25.258474349975586, "global_step": 287422, "epoch": 3462} {"train_loss": -25.3778133392334, "global_step": 287423, "epoch": 3462} {"train_loss": -24.783578872680664, "global_step": 287424, "epoch": 3462} {"train_loss": -25.13919448852539, "global_step": 287425, "epoch": 3462} {"train_loss": -25.06520652770996, "global_step": 287426, "epoch": 3462} {"train_loss": -25.17793846130371, "global_step": 287427, "epoch": 3462} {"train_loss": -25.407329766147107, "global_step": 287428, "epoch": 3462, "val_loss": 7121573.0} {"train_loss": -24.836244583129883, "global_step": 287429, "epoch": 3463} {"train_loss": -24.47601318359375, "global_step": 287430, "epoch": 3463} {"train_loss": -24.966552734375, "global_step": 287431, "epoch": 3463} {"train_loss": -24.681074142456055, "global_step": 287432, "epoch": 3463} {"train_loss": -24.487295150756836, "global_step": 287433, "epoch": 3463} {"train_loss": -24.524869918823242, "global_step": 287434, "epoch": 3463} {"train_loss": -24.531021118164062, "global_step": 287435, "epoch": 3463} {"train_loss": -24.918519973754883, "global_step": 287436, "epoch": 3463} {"train_loss": -24.6517276763916, "global_step": 287437, "epoch": 3463} {"train_loss": -24.859792709350586, "global_step": 287438, "epoch": 3463} {"train_loss": -24.664716720581055, "global_step": 287439, "epoch": 3463} {"train_loss": -25.262332916259766, "global_step": 287440, "epoch": 3463} {"train_loss": -25.482717514038086, "global_step": 287441, "epoch": 3463} {"train_loss": -25.099884033203125, "global_step": 287442, "epoch": 3463} {"train_loss": -25.20248794555664, "global_step": 287443, "epoch": 3463} {"train_loss": -25.04010009765625, "global_step": 287444, "epoch": 3463} {"train_loss": -25.360599517822266, "global_step": 287445, "epoch": 3463} {"train_loss": -25.071218490600586, "global_step": 287446, "epoch": 3463} {"train_loss": -25.518922805786133, "global_step": 287447, "epoch": 3463} {"train_loss": -25.20844841003418, "global_step": 287448, "epoch": 3463} {"train_loss": -25.475488662719727, "global_step": 287449, "epoch": 3463} {"train_loss": -25.327272415161133, "global_step": 287450, "epoch": 3463} {"train_loss": -25.4993953704834, "global_step": 287451, "epoch": 3463} {"train_loss": -24.978675842285156, "global_step": 287452, "epoch": 3463} {"train_loss": -25.5351619720459, "global_step": 287453, "epoch": 3463} {"train_loss": -25.119497299194336, "global_step": 287454, "epoch": 3463} {"train_loss": -25.132192611694336, "global_step": 287455, "epoch": 3463} {"train_loss": -25.25139045715332, "global_step": 287456, "epoch": 3463} {"train_loss": -25.32024574279785, "global_step": 287457, "epoch": 3463} {"train_loss": -25.547138214111328, "global_step": 287458, "epoch": 3463} {"train_loss": -25.268613815307617, "global_step": 287459, "epoch": 3463} {"train_loss": -25.586523056030273, "global_step": 287460, "epoch": 3463} {"train_loss": -25.4548397064209, "global_step": 287461, "epoch": 3463} {"train_loss": -25.64644432067871, "global_step": 287462, "epoch": 3463} {"train_loss": -25.61165428161621, "global_step": 287463, "epoch": 3463} {"train_loss": -25.549604415893555, "global_step": 287464, "epoch": 3463} {"train_loss": -26.092870712280273, "global_step": 287465, "epoch": 3463} {"train_loss": -25.256378173828125, "global_step": 287466, "epoch": 3463} {"train_loss": -25.89815330505371, "global_step": 287467, "epoch": 3463} {"train_loss": -25.47943687438965, "global_step": 287468, "epoch": 3463} {"train_loss": -25.42778968811035, "global_step": 287469, "epoch": 3463} {"train_loss": -25.42671775817871, "global_step": 287470, "epoch": 3463} {"train_loss": -24.993309020996094, "global_step": 287471, "epoch": 3463} {"train_loss": -25.18117332458496, "global_step": 287472, "epoch": 3463} {"train_loss": -25.30916404724121, "global_step": 287473, "epoch": 3463} {"train_loss": -25.40638542175293, "global_step": 287474, "epoch": 3463} {"train_loss": -25.087080001831055, "global_step": 287475, "epoch": 3463} {"train_loss": -25.33386993408203, "global_step": 287476, "epoch": 3463} {"train_loss": -24.768131256103516, "global_step": 287477, "epoch": 3463} {"train_loss": -25.43025016784668, "global_step": 287478, "epoch": 3463} {"train_loss": -24.953983306884766, "global_step": 287479, "epoch": 3463} {"train_loss": -25.588838577270508, "global_step": 287480, "epoch": 3463} {"train_loss": -25.36101722717285, "global_step": 287481, "epoch": 3463} {"train_loss": -25.35464859008789, "global_step": 287482, "epoch": 3463} {"train_loss": -25.380084991455078, "global_step": 287483, "epoch": 3463} {"train_loss": -25.814855575561523, "global_step": 287484, "epoch": 3463} {"train_loss": -25.137256622314453, "global_step": 287485, "epoch": 3463} {"train_loss": -25.21759605407715, "global_step": 287486, "epoch": 3463} {"train_loss": -25.1732234954834, "global_step": 287487, "epoch": 3463} {"train_loss": -25.125490188598633, "global_step": 287488, "epoch": 3463} {"train_loss": -25.489347457885742, "global_step": 287489, "epoch": 3463} {"train_loss": -25.10447120666504, "global_step": 287490, "epoch": 3463} {"train_loss": -25.402328491210938, "global_step": 287491, "epoch": 3463} {"train_loss": -25.612567901611328, "global_step": 287492, "epoch": 3463} {"train_loss": -25.120004653930664, "global_step": 287493, "epoch": 3463} {"train_loss": -25.7393856048584, "global_step": 287494, "epoch": 3463} {"train_loss": -25.309541702270508, "global_step": 287495, "epoch": 3463} {"train_loss": -25.469942092895508, "global_step": 287496, "epoch": 3463} {"train_loss": -25.4505615234375, "global_step": 287497, "epoch": 3463} {"train_loss": -25.746427536010742, "global_step": 287498, "epoch": 3463} {"train_loss": -25.5308895111084, "global_step": 287499, "epoch": 3463} {"train_loss": -25.37363052368164, "global_step": 287500, "epoch": 3463} {"train_loss": -25.561983108520508, "global_step": 287501, "epoch": 3463} {"train_loss": -25.42067527770996, "global_step": 287502, "epoch": 3463} {"train_loss": -25.37843132019043, "global_step": 287503, "epoch": 3463} {"train_loss": -25.529470443725586, "global_step": 287504, "epoch": 3463} {"train_loss": -25.571622848510742, "global_step": 287505, "epoch": 3463} {"train_loss": -25.0036563873291, "global_step": 287506, "epoch": 3463} {"train_loss": -25.909000396728516, "global_step": 287507, "epoch": 3463} {"train_loss": -25.535783767700195, "global_step": 287508, "epoch": 3463} {"train_loss": -25.241910934448242, "global_step": 287509, "epoch": 3463} {"train_loss": -25.769987106323242, "global_step": 287510, "epoch": 3463} {"train_loss": -25.290822959807983, "global_step": 287511, "epoch": 3463, "val_loss": 7191401.0} {"train_loss": -25.066762924194336, "global_step": 287512, "epoch": 3464} {"train_loss": -24.75937271118164, "global_step": 287513, "epoch": 3464} {"train_loss": -25.019607543945312, "global_step": 287514, "epoch": 3464} {"train_loss": -25.216089248657227, "global_step": 287515, "epoch": 3464} {"train_loss": -24.81736946105957, "global_step": 287516, "epoch": 3464} {"train_loss": -25.07577896118164, "global_step": 287517, "epoch": 3464} {"train_loss": -25.137611389160156, "global_step": 287518, "epoch": 3464} {"train_loss": -25.1626033782959, "global_step": 287519, "epoch": 3464} {"train_loss": -25.014509201049805, "global_step": 287520, "epoch": 3464} {"train_loss": -24.222881317138672, "global_step": 287521, "epoch": 3464} {"train_loss": -24.2083740234375, "global_step": 287522, "epoch": 3464} {"train_loss": -25.49429702758789, "global_step": 287523, "epoch": 3464} {"train_loss": -24.839731216430664, "global_step": 287524, "epoch": 3464} {"train_loss": -25.34623146057129, "global_step": 287525, "epoch": 3464} {"train_loss": -24.957962036132812, "global_step": 287526, "epoch": 3464} {"train_loss": -24.911624908447266, "global_step": 287527, "epoch": 3464} {"train_loss": -24.7515811920166, "global_step": 287528, "epoch": 3464} {"train_loss": -25.434194564819336, "global_step": 287529, "epoch": 3464} {"train_loss": -24.912450790405273, "global_step": 287530, "epoch": 3464} {"train_loss": -25.254430770874023, "global_step": 287531, "epoch": 3464} {"train_loss": -25.113035202026367, "global_step": 287532, "epoch": 3464} {"train_loss": -25.36025047302246, "global_step": 287533, "epoch": 3464} {"train_loss": -25.214231491088867, "global_step": 287534, "epoch": 3464} {"train_loss": -24.88092613220215, "global_step": 287535, "epoch": 3464} {"train_loss": -25.16287612915039, "global_step": 287536, "epoch": 3464} {"train_loss": -25.488943099975586, "global_step": 287537, "epoch": 3464} {"train_loss": -25.104660034179688, "global_step": 287538, "epoch": 3464} {"train_loss": -25.426000595092773, "global_step": 287539, "epoch": 3464} {"train_loss": -25.281354904174805, "global_step": 287540, "epoch": 3464} {"train_loss": -25.55518913269043, "global_step": 287541, "epoch": 3464} {"train_loss": -25.681604385375977, "global_step": 287542, "epoch": 3464} {"train_loss": -25.331356048583984, "global_step": 287543, "epoch": 3464} {"train_loss": -25.21321678161621, "global_step": 287544, "epoch": 3464} {"train_loss": -25.462928771972656, "global_step": 287545, "epoch": 3464} {"train_loss": -25.31094741821289, "global_step": 287546, "epoch": 3464} {"train_loss": -25.550487518310547, "global_step": 287547, "epoch": 3464} {"train_loss": -25.334213256835938, "global_step": 287548, "epoch": 3464} {"train_loss": -25.66278648376465, "global_step": 287549, "epoch": 3464} {"train_loss": -25.44049072265625, "global_step": 287550, "epoch": 3464} {"train_loss": -25.534025192260742, "global_step": 287551, "epoch": 3464} {"train_loss": -25.7707462310791, "global_step": 287552, "epoch": 3464} {"train_loss": -25.341535568237305, "global_step": 287553, "epoch": 3464} {"train_loss": -25.61768913269043, "global_step": 287554, "epoch": 3464} {"train_loss": -25.046363830566406, "global_step": 287555, "epoch": 3464} {"train_loss": -25.77341079711914, "global_step": 287556, "epoch": 3464} {"train_loss": -25.504310607910156, "global_step": 287557, "epoch": 3464} {"train_loss": -25.584604263305664, "global_step": 287558, "epoch": 3464} {"train_loss": -25.69144630432129, "global_step": 287559, "epoch": 3464} {"train_loss": -25.75565528869629, "global_step": 287560, "epoch": 3464} {"train_loss": -25.613012313842773, "global_step": 287561, "epoch": 3464} {"train_loss": -25.618213653564453, "global_step": 287562, "epoch": 3464} {"train_loss": -25.68191909790039, "global_step": 287563, "epoch": 3464} {"train_loss": -25.09681510925293, "global_step": 287564, "epoch": 3464} {"train_loss": -25.491134643554688, "global_step": 287565, "epoch": 3464} {"train_loss": -25.403228759765625, "global_step": 287566, "epoch": 3464} {"train_loss": -25.491086959838867, "global_step": 287567, "epoch": 3464} {"train_loss": -25.520790100097656, "global_step": 287568, "epoch": 3464} {"train_loss": -25.47259521484375, "global_step": 287569, "epoch": 3464} {"train_loss": -25.556638717651367, "global_step": 287570, "epoch": 3464} {"train_loss": -25.64481544494629, "global_step": 287571, "epoch": 3464} {"train_loss": -25.6735782623291, "global_step": 287572, "epoch": 3464} {"train_loss": -25.546491622924805, "global_step": 287573, "epoch": 3464} {"train_loss": -25.169897079467773, "global_step": 287574, "epoch": 3464} {"train_loss": -25.95924186706543, "global_step": 287575, "epoch": 3464} {"train_loss": -25.495729446411133, "global_step": 287576, "epoch": 3464} {"train_loss": -25.504728317260742, "global_step": 287577, "epoch": 3464} {"train_loss": -26.13079833984375, "global_step": 287578, "epoch": 3464} {"train_loss": -25.8433780670166, "global_step": 287579, "epoch": 3464} {"train_loss": -25.394657135009766, "global_step": 287580, "epoch": 3464} {"train_loss": -26.07123374938965, "global_step": 287581, "epoch": 3464} {"train_loss": -25.288541793823242, "global_step": 287582, "epoch": 3464} {"train_loss": -25.406347274780273, "global_step": 287583, "epoch": 3464} {"train_loss": -25.343687057495117, "global_step": 287584, "epoch": 3464} {"train_loss": -25.6724853515625, "global_step": 287585, "epoch": 3464} {"train_loss": -25.536090850830078, "global_step": 287586, "epoch": 3464} {"train_loss": -25.761030197143555, "global_step": 287587, "epoch": 3464} {"train_loss": -25.2026424407959, "global_step": 287588, "epoch": 3464} {"train_loss": -25.431201934814453, "global_step": 287589, "epoch": 3464} {"train_loss": -25.670446395874023, "global_step": 287590, "epoch": 3464} {"train_loss": -25.41474723815918, "global_step": 287591, "epoch": 3464} {"train_loss": -25.383726119995117, "global_step": 287592, "epoch": 3464} {"train_loss": -25.31101417541504, "global_step": 287593, "epoch": 3464} {"train_loss": -25.36044715973268, "global_step": 287594, "epoch": 3464, "val_loss": 7012675.0} {"train_loss": -25.159578323364258, "global_step": 287595, "epoch": 3465} {"train_loss": -24.92447280883789, "global_step": 287596, "epoch": 3465} {"train_loss": -24.816295623779297, "global_step": 287597, "epoch": 3465} {"train_loss": -24.73335075378418, "global_step": 287598, "epoch": 3465} {"train_loss": -24.831823348999023, "global_step": 287599, "epoch": 3465} {"train_loss": -24.812427520751953, "global_step": 287600, "epoch": 3465} {"train_loss": -24.561771392822266, "global_step": 287601, "epoch": 3465} {"train_loss": -24.88324546813965, "global_step": 287602, "epoch": 3465} {"train_loss": -24.77315330505371, "global_step": 287603, "epoch": 3465} {"train_loss": -24.87308692932129, "global_step": 287604, "epoch": 3465} {"train_loss": -24.68645668029785, "global_step": 287605, "epoch": 3465} {"train_loss": -25.134244918823242, "global_step": 287606, "epoch": 3465} {"train_loss": -24.98694610595703, "global_step": 287607, "epoch": 3465} {"train_loss": -25.046552658081055, "global_step": 287608, "epoch": 3465} {"train_loss": -24.555814743041992, "global_step": 287609, "epoch": 3465} {"train_loss": -25.216779708862305, "global_step": 287610, "epoch": 3465} {"train_loss": -25.47432518005371, "global_step": 287611, "epoch": 3465} {"train_loss": -25.484813690185547, "global_step": 287612, "epoch": 3465} {"train_loss": -25.25161361694336, "global_step": 287613, "epoch": 3465} {"train_loss": -25.183637619018555, "global_step": 287614, "epoch": 3465} {"train_loss": -25.260061264038086, "global_step": 287615, "epoch": 3465} {"train_loss": -25.139667510986328, "global_step": 287616, "epoch": 3465} {"train_loss": -25.57625389099121, "global_step": 287617, "epoch": 3465} {"train_loss": -25.492313385009766, "global_step": 287618, "epoch": 3465} {"train_loss": -25.2961483001709, "global_step": 287619, "epoch": 3465} {"train_loss": -25.198373794555664, "global_step": 287620, "epoch": 3465} {"train_loss": -25.2960262298584, "global_step": 287621, "epoch": 3465} {"train_loss": -25.316503524780273, "global_step": 287622, "epoch": 3465} {"train_loss": -25.09902000427246, "global_step": 287623, "epoch": 3465} {"train_loss": -25.227827072143555, "global_step": 287624, "epoch": 3465} {"train_loss": -25.485523223876953, "global_step": 287625, "epoch": 3465} {"train_loss": -25.723302841186523, "global_step": 287626, "epoch": 3465} {"train_loss": -25.852497100830078, "global_step": 287627, "epoch": 3465} {"train_loss": -25.26080894470215, "global_step": 287628, "epoch": 3465} {"train_loss": -24.965774536132812, "global_step": 287629, "epoch": 3465} {"train_loss": -25.751325607299805, "global_step": 287630, "epoch": 3465} {"train_loss": -25.458364486694336, "global_step": 287631, "epoch": 3465} {"train_loss": -25.175888061523438, "global_step": 287632, "epoch": 3465} {"train_loss": -25.590404510498047, "global_step": 287633, "epoch": 3465} {"train_loss": -25.439741134643555, "global_step": 287634, "epoch": 3465} {"train_loss": -25.50992774963379, "global_step": 287635, "epoch": 3465} {"train_loss": -25.20979118347168, "global_step": 287636, "epoch": 3465} {"train_loss": -25.452190399169922, "global_step": 287637, "epoch": 3465} {"train_loss": -25.911727905273438, "global_step": 287638, "epoch": 3465} {"train_loss": -25.59328269958496, "global_step": 287639, "epoch": 3465} {"train_loss": -25.558168411254883, "global_step": 287640, "epoch": 3465} {"train_loss": -25.695419311523438, "global_step": 287641, "epoch": 3465} {"train_loss": -25.71673011779785, "global_step": 287642, "epoch": 3465} {"train_loss": -25.22141456604004, "global_step": 287643, "epoch": 3465} {"train_loss": -25.39080047607422, "global_step": 287644, "epoch": 3465} {"train_loss": -25.287120819091797, "global_step": 287645, "epoch": 3465} {"train_loss": -25.376970291137695, "global_step": 287646, "epoch": 3465} {"train_loss": -25.37599754333496, "global_step": 287647, "epoch": 3465} {"train_loss": -25.278045654296875, "global_step": 287648, "epoch": 3465} {"train_loss": -25.43191146850586, "global_step": 287649, "epoch": 3465} {"train_loss": -25.622852325439453, "global_step": 287650, "epoch": 3465} {"train_loss": -25.414505004882812, "global_step": 287651, "epoch": 3465} {"train_loss": -25.2910213470459, "global_step": 287652, "epoch": 3465} {"train_loss": -25.075916290283203, "global_step": 287653, "epoch": 3465} {"train_loss": -25.558347702026367, "global_step": 287654, "epoch": 3465} {"train_loss": -25.5635986328125, "global_step": 287655, "epoch": 3465} {"train_loss": -25.27680778503418, "global_step": 287656, "epoch": 3465} {"train_loss": -25.504241943359375, "global_step": 287657, "epoch": 3465} {"train_loss": -25.150287628173828, "global_step": 287658, "epoch": 3465} {"train_loss": -25.21815299987793, "global_step": 287659, "epoch": 3465} {"train_loss": -25.8050479888916, "global_step": 287660, "epoch": 3465} {"train_loss": -25.82295036315918, "global_step": 287661, "epoch": 3465} {"train_loss": -25.5794734954834, "global_step": 287662, "epoch": 3465} {"train_loss": -25.673187255859375, "global_step": 287663, "epoch": 3465} {"train_loss": -25.364280700683594, "global_step": 287664, "epoch": 3465} {"train_loss": -25.278928756713867, "global_step": 287665, "epoch": 3465} {"train_loss": -25.67603874206543, "global_step": 287666, "epoch": 3465} {"train_loss": -25.841571807861328, "global_step": 287667, "epoch": 3465} {"train_loss": -25.599809646606445, "global_step": 287668, "epoch": 3465} {"train_loss": -25.51276969909668, "global_step": 287669, "epoch": 3465} {"train_loss": -25.329872131347656, "global_step": 287670, "epoch": 3465} {"train_loss": -25.312665939331055, "global_step": 287671, "epoch": 3465} {"train_loss": -25.19108772277832, "global_step": 287672, "epoch": 3465} {"train_loss": -25.933984756469727, "global_step": 287673, "epoch": 3465} {"train_loss": -25.68100929260254, "global_step": 287674, "epoch": 3465} {"train_loss": -25.4146671295166, "global_step": 287675, "epoch": 3465} {"train_loss": -25.73046875, "global_step": 287676, "epoch": 3465} {"train_loss": -25.361143525824488, "global_step": 287677, "epoch": 3465, "val_loss": 7187209.0} {"train_loss": -25.34120750427246, "global_step": 287678, "epoch": 3466} {"train_loss": -25.11528205871582, "global_step": 287679, "epoch": 3466} {"train_loss": -25.258493423461914, "global_step": 287680, "epoch": 3466} {"train_loss": -25.063674926757812, "global_step": 287681, "epoch": 3466} {"train_loss": -25.392892837524414, "global_step": 287682, "epoch": 3466} {"train_loss": -25.3026180267334, "global_step": 287683, "epoch": 3466} {"train_loss": -25.635181427001953, "global_step": 287684, "epoch": 3466} {"train_loss": -25.481393814086914, "global_step": 287685, "epoch": 3466} {"train_loss": -25.624670028686523, "global_step": 287686, "epoch": 3466} {"train_loss": -25.477975845336914, "global_step": 287687, "epoch": 3466} {"train_loss": -25.415084838867188, "global_step": 287688, "epoch": 3466} {"train_loss": -24.89045524597168, "global_step": 287689, "epoch": 3466} {"train_loss": -25.056671142578125, "global_step": 287690, "epoch": 3466} {"train_loss": -24.972158432006836, "global_step": 287691, "epoch": 3466} {"train_loss": -25.32575798034668, "global_step": 287692, "epoch": 3466} {"train_loss": -25.667516708374023, "global_step": 287693, "epoch": 3466} {"train_loss": -24.865633010864258, "global_step": 287694, "epoch": 3466} {"train_loss": -25.06365966796875, "global_step": 287695, "epoch": 3466} {"train_loss": -25.135486602783203, "global_step": 287696, "epoch": 3466} {"train_loss": -25.334924697875977, "global_step": 287697, "epoch": 3466} {"train_loss": -25.361486434936523, "global_step": 287698, "epoch": 3466} {"train_loss": -25.641006469726562, "global_step": 287699, "epoch": 3466} {"train_loss": -24.755823135375977, "global_step": 287700, "epoch": 3466} {"train_loss": -25.038694381713867, "global_step": 287701, "epoch": 3466} {"train_loss": -25.507856369018555, "global_step": 287702, "epoch": 3466} {"train_loss": -25.48193359375, "global_step": 287703, "epoch": 3466} {"train_loss": -25.027694702148438, "global_step": 287704, "epoch": 3466} {"train_loss": -25.254831314086914, "global_step": 287705, "epoch": 3466} {"train_loss": -25.47174072265625, "global_step": 287706, "epoch": 3466} {"train_loss": -25.654510498046875, "global_step": 287707, "epoch": 3466} {"train_loss": -25.402137756347656, "global_step": 287708, "epoch": 3466} {"train_loss": -25.43199348449707, "global_step": 287709, "epoch": 3466} {"train_loss": -25.61752700805664, "global_step": 287710, "epoch": 3466} {"train_loss": -25.32173728942871, "global_step": 287711, "epoch": 3466} {"train_loss": -25.29840660095215, "global_step": 287712, "epoch": 3466} {"train_loss": -25.59540367126465, "global_step": 287713, "epoch": 3466} {"train_loss": -25.340085983276367, "global_step": 287714, "epoch": 3466} {"train_loss": -25.62628173828125, "global_step": 287715, "epoch": 3466} {"train_loss": -25.65277099609375, "global_step": 287716, "epoch": 3466} {"train_loss": -25.86502456665039, "global_step": 287717, "epoch": 3466} {"train_loss": -25.447723388671875, "global_step": 287718, "epoch": 3466} {"train_loss": -25.736948013305664, "global_step": 287719, "epoch": 3466} {"train_loss": -25.292198181152344, "global_step": 287720, "epoch": 3466} {"train_loss": -25.432668685913086, "global_step": 287721, "epoch": 3466} {"train_loss": -26.000244140625, "global_step": 287722, "epoch": 3466} {"train_loss": -25.59735870361328, "global_step": 287723, "epoch": 3466} {"train_loss": -25.464397430419922, "global_step": 287724, "epoch": 3466} {"train_loss": -25.7724552154541, "global_step": 287725, "epoch": 3466} {"train_loss": -25.632568359375, "global_step": 287726, "epoch": 3466} {"train_loss": -25.49492073059082, "global_step": 287727, "epoch": 3466} {"train_loss": -25.57960319519043, "global_step": 287728, "epoch": 3466} {"train_loss": -25.845197677612305, "global_step": 287729, "epoch": 3466} {"train_loss": -25.49009132385254, "global_step": 287730, "epoch": 3466} {"train_loss": -25.681655883789062, "global_step": 287731, "epoch": 3466} {"train_loss": -25.914020538330078, "global_step": 287732, "epoch": 3466} {"train_loss": -25.706588745117188, "global_step": 287733, "epoch": 3466} {"train_loss": -25.37603759765625, "global_step": 287734, "epoch": 3466} {"train_loss": -25.099042892456055, "global_step": 287735, "epoch": 3466} {"train_loss": -25.668973922729492, "global_step": 287736, "epoch": 3466} {"train_loss": -25.542898178100586, "global_step": 287737, "epoch": 3466} {"train_loss": -25.46099853515625, "global_step": 287738, "epoch": 3466} {"train_loss": -25.504384994506836, "global_step": 287739, "epoch": 3466} {"train_loss": -25.296117782592773, "global_step": 287740, "epoch": 3466} {"train_loss": -25.38797950744629, "global_step": 287741, "epoch": 3466} {"train_loss": -25.7971248626709, "global_step": 287742, "epoch": 3466} {"train_loss": -25.32179832458496, "global_step": 287743, "epoch": 3466} {"train_loss": -25.51192283630371, "global_step": 287744, "epoch": 3466} {"train_loss": -25.449827194213867, "global_step": 287745, "epoch": 3466} {"train_loss": -25.748035430908203, "global_step": 287746, "epoch": 3466} {"train_loss": -25.436420440673828, "global_step": 287747, "epoch": 3466} {"train_loss": -25.342655181884766, "global_step": 287748, "epoch": 3466} {"train_loss": -25.437318801879883, "global_step": 287749, "epoch": 3466} {"train_loss": -25.284826278686523, "global_step": 287750, "epoch": 3466} {"train_loss": -25.76474952697754, "global_step": 287751, "epoch": 3466} {"train_loss": -25.765546798706055, "global_step": 287752, "epoch": 3466} {"train_loss": -25.58089256286621, "global_step": 287753, "epoch": 3466} {"train_loss": -25.86646842956543, "global_step": 287754, "epoch": 3466} {"train_loss": -25.338071823120117, "global_step": 287755, "epoch": 3466} {"train_loss": -25.446203231811523, "global_step": 287756, "epoch": 3466} {"train_loss": -25.690595626831055, "global_step": 287757, "epoch": 3466} {"train_loss": -25.51421546936035, "global_step": 287758, "epoch": 3466} {"train_loss": -25.554365158081055, "global_step": 287759, "epoch": 3466} {"train_loss": -25.45052645579878, "global_step": 287760, "epoch": 3466, "val_loss": 7182563.0} {"train_loss": -25.167404174804688, "global_step": 287761, "epoch": 3467} {"train_loss": -23.921613693237305, "global_step": 287762, "epoch": 3467} {"train_loss": -22.626665115356445, "global_step": 287763, "epoch": 3467} {"train_loss": -25.2105770111084, "global_step": 287764, "epoch": 3467} {"train_loss": -24.7010498046875, "global_step": 287765, "epoch": 3467} {"train_loss": -24.680667877197266, "global_step": 287766, "epoch": 3467} {"train_loss": -24.753652572631836, "global_step": 287767, "epoch": 3467} {"train_loss": -24.452136993408203, "global_step": 287768, "epoch": 3467} {"train_loss": -24.741289138793945, "global_step": 287769, "epoch": 3467} {"train_loss": -25.405536651611328, "global_step": 287770, "epoch": 3467} {"train_loss": -24.83806610107422, "global_step": 287771, "epoch": 3467} {"train_loss": -24.826265335083008, "global_step": 287772, "epoch": 3467} {"train_loss": -24.85279655456543, "global_step": 287773, "epoch": 3467} {"train_loss": -25.29996109008789, "global_step": 287774, "epoch": 3467} {"train_loss": -24.76236915588379, "global_step": 287775, "epoch": 3467} {"train_loss": -25.345882415771484, "global_step": 287776, "epoch": 3467} {"train_loss": -24.883224487304688, "global_step": 287777, "epoch": 3467} {"train_loss": -25.238431930541992, "global_step": 287778, "epoch": 3467} {"train_loss": -25.25236701965332, "global_step": 287779, "epoch": 3467} {"train_loss": -25.317670822143555, "global_step": 287780, "epoch": 3467} {"train_loss": -25.1895751953125, "global_step": 287781, "epoch": 3467} {"train_loss": -25.161399841308594, "global_step": 287782, "epoch": 3467} {"train_loss": -24.89095687866211, "global_step": 287783, "epoch": 3467} {"train_loss": -25.0673885345459, "global_step": 287784, "epoch": 3467} {"train_loss": -25.64560890197754, "global_step": 287785, "epoch": 3467} {"train_loss": -25.4073486328125, "global_step": 287786, "epoch": 3467} {"train_loss": -25.625051498413086, "global_step": 287787, "epoch": 3467} {"train_loss": -25.299610137939453, "global_step": 287788, "epoch": 3467} {"train_loss": -25.6484375, "global_step": 287789, "epoch": 3467} {"train_loss": -25.31886863708496, "global_step": 287790, "epoch": 3467} {"train_loss": -25.173900604248047, "global_step": 287791, "epoch": 3467} {"train_loss": -25.222143173217773, "global_step": 287792, "epoch": 3467} {"train_loss": -25.585779190063477, "global_step": 287793, "epoch": 3467} {"train_loss": -25.6676082611084, "global_step": 287794, "epoch": 3467} {"train_loss": -25.303638458251953, "global_step": 287795, "epoch": 3467} {"train_loss": -25.481592178344727, "global_step": 287796, "epoch": 3467} {"train_loss": -25.445764541625977, "global_step": 287797, "epoch": 3467} {"train_loss": -25.431705474853516, "global_step": 287798, "epoch": 3467} {"train_loss": -25.26264762878418, "global_step": 287799, "epoch": 3467} {"train_loss": -25.371458053588867, "global_step": 287800, "epoch": 3467} {"train_loss": -25.775836944580078, "global_step": 287801, "epoch": 3467} {"train_loss": -25.242034912109375, "global_step": 287802, "epoch": 3467} {"train_loss": -25.335729598999023, "global_step": 287803, "epoch": 3467} {"train_loss": -25.59765625, "global_step": 287804, "epoch": 3467} {"train_loss": -25.305660247802734, "global_step": 287805, "epoch": 3467} {"train_loss": -25.42118263244629, "global_step": 287806, "epoch": 3467} {"train_loss": -25.55122947692871, "global_step": 287807, "epoch": 3467} {"train_loss": -25.357810974121094, "global_step": 287808, "epoch": 3467} {"train_loss": -25.68474769592285, "global_step": 287809, "epoch": 3467} {"train_loss": -25.679309844970703, "global_step": 287810, "epoch": 3467} {"train_loss": -25.5696964263916, "global_step": 287811, "epoch": 3467} {"train_loss": -25.35920524597168, "global_step": 287812, "epoch": 3467} {"train_loss": -25.33989143371582, "global_step": 287813, "epoch": 3467} {"train_loss": -25.212223052978516, "global_step": 287814, "epoch": 3467} {"train_loss": -25.29813575744629, "global_step": 287815, "epoch": 3467} {"train_loss": -25.54244041442871, "global_step": 287816, "epoch": 3467} {"train_loss": -25.6712703704834, "global_step": 287817, "epoch": 3467} {"train_loss": -25.538928985595703, "global_step": 287818, "epoch": 3467} {"train_loss": -25.63319969177246, "global_step": 287819, "epoch": 3467} {"train_loss": -25.48073959350586, "global_step": 287820, "epoch": 3467} {"train_loss": -25.25525665283203, "global_step": 287821, "epoch": 3467} {"train_loss": -25.682392120361328, "global_step": 287822, "epoch": 3467} {"train_loss": -25.60236167907715, "global_step": 287823, "epoch": 3467} {"train_loss": -25.44217300415039, "global_step": 287824, "epoch": 3467} {"train_loss": -25.557920455932617, "global_step": 287825, "epoch": 3467} {"train_loss": -25.32150650024414, "global_step": 287826, "epoch": 3467} {"train_loss": -25.570161819458008, "global_step": 287827, "epoch": 3467} {"train_loss": -25.604583740234375, "global_step": 287828, "epoch": 3467} {"train_loss": -25.578290939331055, "global_step": 287829, "epoch": 3467} {"train_loss": -25.51289939880371, "global_step": 287830, "epoch": 3467} {"train_loss": -25.720380783081055, "global_step": 287831, "epoch": 3467} {"train_loss": -25.6372127532959, "global_step": 287832, "epoch": 3467} {"train_loss": -25.589818954467773, "global_step": 287833, "epoch": 3467} {"train_loss": -25.704395294189453, "global_step": 287834, "epoch": 3467} {"train_loss": -25.291080474853516, "global_step": 287835, "epoch": 3467} {"train_loss": -25.46759796142578, "global_step": 287836, "epoch": 3467} {"train_loss": -25.50739860534668, "global_step": 287837, "epoch": 3467} {"train_loss": -25.23821449279785, "global_step": 287838, "epoch": 3467} {"train_loss": -25.641393661499023, "global_step": 287839, "epoch": 3467} {"train_loss": -25.90833854675293, "global_step": 287840, "epoch": 3467} {"train_loss": -25.650354385375977, "global_step": 287841, "epoch": 3467} {"train_loss": -25.82809829711914, "global_step": 287842, "epoch": 3467} {"train_loss": -25.31285835174193, "global_step": 287843, "epoch": 3467, "val_loss": 7125695.0} {"train_loss": -24.720266342163086, "global_step": 287844, "epoch": 3468} {"train_loss": -24.53531265258789, "global_step": 287845, "epoch": 3468} {"train_loss": -25.538618087768555, "global_step": 287846, "epoch": 3468} {"train_loss": -25.153135299682617, "global_step": 287847, "epoch": 3468} {"train_loss": -25.396512985229492, "global_step": 287848, "epoch": 3468} {"train_loss": -24.803909301757812, "global_step": 287849, "epoch": 3468} {"train_loss": -25.117277145385742, "global_step": 287850, "epoch": 3468} {"train_loss": -25.06411361694336, "global_step": 287851, "epoch": 3468} {"train_loss": -25.143064498901367, "global_step": 287852, "epoch": 3468} {"train_loss": -25.3253231048584, "global_step": 287853, "epoch": 3468} {"train_loss": -25.11946678161621, "global_step": 287854, "epoch": 3468} {"train_loss": -25.506895065307617, "global_step": 287855, "epoch": 3468} {"train_loss": -25.137901306152344, "global_step": 287856, "epoch": 3468} {"train_loss": -25.120285034179688, "global_step": 287857, "epoch": 3468} {"train_loss": -25.20005226135254, "global_step": 287858, "epoch": 3468} {"train_loss": -24.942052841186523, "global_step": 287859, "epoch": 3468} {"train_loss": -25.80645179748535, "global_step": 287860, "epoch": 3468} {"train_loss": -25.241247177124023, "global_step": 287861, "epoch": 3468} {"train_loss": -25.64680290222168, "global_step": 287862, "epoch": 3468} {"train_loss": -25.3233642578125, "global_step": 287863, "epoch": 3468} {"train_loss": -25.20111846923828, "global_step": 287864, "epoch": 3468} {"train_loss": -25.641889572143555, "global_step": 287865, "epoch": 3468} {"train_loss": -25.827838897705078, "global_step": 287866, "epoch": 3468} {"train_loss": -25.492429733276367, "global_step": 287867, "epoch": 3468} {"train_loss": -25.467313766479492, "global_step": 287868, "epoch": 3468} {"train_loss": -25.674951553344727, "global_step": 287869, "epoch": 3468} {"train_loss": -25.490055084228516, "global_step": 287870, "epoch": 3468} {"train_loss": -25.633214950561523, "global_step": 287871, "epoch": 3468} {"train_loss": -25.672765731811523, "global_step": 287872, "epoch": 3468} {"train_loss": -25.145631790161133, "global_step": 287873, "epoch": 3468} {"train_loss": -25.28949737548828, "global_step": 287874, "epoch": 3468} {"train_loss": -25.567893981933594, "global_step": 287875, "epoch": 3468} {"train_loss": -25.698209762573242, "global_step": 287876, "epoch": 3468} {"train_loss": -25.985431671142578, "global_step": 287877, "epoch": 3468} {"train_loss": -25.23850440979004, "global_step": 287878, "epoch": 3468} {"train_loss": -25.64328384399414, "global_step": 287879, "epoch": 3468} {"train_loss": -25.44025230407715, "global_step": 287880, "epoch": 3468} {"train_loss": -26.072208404541016, "global_step": 287881, "epoch": 3468} {"train_loss": -25.74065589904785, "global_step": 287882, "epoch": 3468} {"train_loss": -25.743066787719727, "global_step": 287883, "epoch": 3468} {"train_loss": -25.831281661987305, "global_step": 287884, "epoch": 3468} {"train_loss": -25.545787811279297, "global_step": 287885, "epoch": 3468} {"train_loss": -25.60744285583496, "global_step": 287886, "epoch": 3468} {"train_loss": -25.136003494262695, "global_step": 287887, "epoch": 3468} {"train_loss": -25.315311431884766, "global_step": 287888, "epoch": 3468} {"train_loss": -25.412662506103516, "global_step": 287889, "epoch": 3468} {"train_loss": -25.669574737548828, "global_step": 287890, "epoch": 3468} {"train_loss": -25.335037231445312, "global_step": 287891, "epoch": 3468} {"train_loss": -25.07084846496582, "global_step": 287892, "epoch": 3468} {"train_loss": -25.437105178833008, "global_step": 287893, "epoch": 3468} {"train_loss": -25.18283462524414, "global_step": 287894, "epoch": 3468} {"train_loss": -24.981094360351562, "global_step": 287895, "epoch": 3468} {"train_loss": -25.29659080505371, "global_step": 287896, "epoch": 3468} {"train_loss": -25.28407096862793, "global_step": 287897, "epoch": 3468} {"train_loss": -25.35526466369629, "global_step": 287898, "epoch": 3468} {"train_loss": -25.601505279541016, "global_step": 287899, "epoch": 3468} {"train_loss": -25.76104164123535, "global_step": 287900, "epoch": 3468} {"train_loss": -25.454952239990234, "global_step": 287901, "epoch": 3468} {"train_loss": -25.332172393798828, "global_step": 287902, "epoch": 3468} {"train_loss": -25.780780792236328, "global_step": 287903, "epoch": 3468} {"train_loss": -25.398115158081055, "global_step": 287904, "epoch": 3468} {"train_loss": -25.53746223449707, "global_step": 287905, "epoch": 3468} {"train_loss": -25.22022819519043, "global_step": 287906, "epoch": 3468} {"train_loss": -25.710010528564453, "global_step": 287907, "epoch": 3468} {"train_loss": -25.604475021362305, "global_step": 287908, "epoch": 3468} {"train_loss": -25.533374786376953, "global_step": 287909, "epoch": 3468} {"train_loss": -25.469831466674805, "global_step": 287910, "epoch": 3468} {"train_loss": -25.73089027404785, "global_step": 287911, "epoch": 3468} {"train_loss": -25.502168655395508, "global_step": 287912, "epoch": 3468} {"train_loss": -25.565690994262695, "global_step": 287913, "epoch": 3468} {"train_loss": -25.73430824279785, "global_step": 287914, "epoch": 3468} {"train_loss": -25.43118667602539, "global_step": 287915, "epoch": 3468} {"train_loss": -25.31053352355957, "global_step": 287916, "epoch": 3468} {"train_loss": -25.05287742614746, "global_step": 287917, "epoch": 3468} {"train_loss": -25.729162216186523, "global_step": 287918, "epoch": 3468} {"train_loss": -25.8107967376709, "global_step": 287919, "epoch": 3468} {"train_loss": -25.371994018554688, "global_step": 287920, "epoch": 3468} {"train_loss": -25.675867080688477, "global_step": 287921, "epoch": 3468} {"train_loss": -25.564834594726562, "global_step": 287922, "epoch": 3468} {"train_loss": -25.89936637878418, "global_step": 287923, "epoch": 3468} {"train_loss": -25.712915420532227, "global_step": 287924, "epoch": 3468} {"train_loss": -25.598852157592773, "global_step": 287925, "epoch": 3468} {"train_loss": -25.439857597810676, "global_step": 287926, "epoch": 3468, "val_loss": 7084999.0} {"train_loss": -24.881195068359375, "global_step": 287927, "epoch": 3469} {"train_loss": -25.196306228637695, "global_step": 287928, "epoch": 3469} {"train_loss": -25.438922882080078, "global_step": 287929, "epoch": 3469} {"train_loss": -25.177549362182617, "global_step": 287930, "epoch": 3469} {"train_loss": -25.42243194580078, "global_step": 287931, "epoch": 3469} {"train_loss": -25.349933624267578, "global_step": 287932, "epoch": 3469} {"train_loss": -25.594697952270508, "global_step": 287933, "epoch": 3469} {"train_loss": -25.33664894104004, "global_step": 287934, "epoch": 3469} {"train_loss": -25.30877113342285, "global_step": 287935, "epoch": 3469} {"train_loss": -25.224843978881836, "global_step": 287936, "epoch": 3469} {"train_loss": -25.53740119934082, "global_step": 287937, "epoch": 3469} {"train_loss": -25.381601333618164, "global_step": 287938, "epoch": 3469} {"train_loss": -25.207162857055664, "global_step": 287939, "epoch": 3469} {"train_loss": -25.486736297607422, "global_step": 287940, "epoch": 3469} {"train_loss": -25.51544189453125, "global_step": 287941, "epoch": 3469} {"train_loss": -25.3104305267334, "global_step": 287942, "epoch": 3469} {"train_loss": -25.32755470275879, "global_step": 287943, "epoch": 3469} {"train_loss": -25.428735733032227, "global_step": 287944, "epoch": 3469} {"train_loss": -25.697492599487305, "global_step": 287945, "epoch": 3469} {"train_loss": -25.5282039642334, "global_step": 287946, "epoch": 3469} {"train_loss": -25.498294830322266, "global_step": 287947, "epoch": 3469} {"train_loss": -25.265066146850586, "global_step": 287948, "epoch": 3469} {"train_loss": -25.4182071685791, "global_step": 287949, "epoch": 3469} {"train_loss": -25.726743698120117, "global_step": 287950, "epoch": 3469} {"train_loss": -25.421039581298828, "global_step": 287951, "epoch": 3469} {"train_loss": -25.597623825073242, "global_step": 287952, "epoch": 3469} {"train_loss": -25.41200828552246, "global_step": 287953, "epoch": 3469} {"train_loss": -25.504196166992188, "global_step": 287954, "epoch": 3469} {"train_loss": -25.623458862304688, "global_step": 287955, "epoch": 3469} {"train_loss": -25.561237335205078, "global_step": 287956, "epoch": 3469} {"train_loss": -25.879926681518555, "global_step": 287957, "epoch": 3469} {"train_loss": -25.86590003967285, "global_step": 287958, "epoch": 3469} {"train_loss": -25.10340118408203, "global_step": 287959, "epoch": 3469} {"train_loss": -26.0185546875, "global_step": 287960, "epoch": 3469} {"train_loss": -25.06232452392578, "global_step": 287961, "epoch": 3469} {"train_loss": -25.522993087768555, "global_step": 287962, "epoch": 3469} {"train_loss": -25.59791374206543, "global_step": 287963, "epoch": 3469} {"train_loss": -25.310636520385742, "global_step": 287964, "epoch": 3469} {"train_loss": -25.668121337890625, "global_step": 287965, "epoch": 3469} {"train_loss": -25.329442977905273, "global_step": 287966, "epoch": 3469} {"train_loss": -25.501996994018555, "global_step": 287967, "epoch": 3469} {"train_loss": -25.403423309326172, "global_step": 287968, "epoch": 3469} {"train_loss": -25.446874618530273, "global_step": 287969, "epoch": 3469} {"train_loss": -25.638456344604492, "global_step": 287970, "epoch": 3469} {"train_loss": -25.417579650878906, "global_step": 287971, "epoch": 3469} {"train_loss": -25.53781509399414, "global_step": 287972, "epoch": 3469} {"train_loss": -25.374744415283203, "global_step": 287973, "epoch": 3469} {"train_loss": -25.722707748413086, "global_step": 287974, "epoch": 3469} {"train_loss": -25.268861770629883, "global_step": 287975, "epoch": 3469} {"train_loss": -25.74738121032715, "global_step": 287976, "epoch": 3469} {"train_loss": -25.534317016601562, "global_step": 287977, "epoch": 3469} {"train_loss": -25.73581314086914, "global_step": 287978, "epoch": 3469} {"train_loss": -25.387718200683594, "global_step": 287979, "epoch": 3469} {"train_loss": -25.54044532775879, "global_step": 287980, "epoch": 3469} {"train_loss": -25.40254783630371, "global_step": 287981, "epoch": 3469} {"train_loss": -25.38967514038086, "global_step": 287982, "epoch": 3469} {"train_loss": -25.412220001220703, "global_step": 287983, "epoch": 3469} {"train_loss": -25.348012924194336, "global_step": 287984, "epoch": 3469} {"train_loss": -25.614185333251953, "global_step": 287985, "epoch": 3469} {"train_loss": -25.410032272338867, "global_step": 287986, "epoch": 3469} {"train_loss": -25.512022018432617, "global_step": 287987, "epoch": 3469} {"train_loss": -25.648609161376953, "global_step": 287988, "epoch": 3469} {"train_loss": -25.636783599853516, "global_step": 287989, "epoch": 3469} {"train_loss": -26.06853675842285, "global_step": 287990, "epoch": 3469} {"train_loss": -25.419544219970703, "global_step": 287991, "epoch": 3469} {"train_loss": -25.962238311767578, "global_step": 287992, "epoch": 3469} {"train_loss": -25.332361221313477, "global_step": 287993, "epoch": 3469} {"train_loss": -25.750635147094727, "global_step": 287994, "epoch": 3469} {"train_loss": -25.224393844604492, "global_step": 287995, "epoch": 3469} {"train_loss": -25.879846572875977, "global_step": 287996, "epoch": 3469} {"train_loss": -25.377822875976562, "global_step": 287997, "epoch": 3469} {"train_loss": -25.536766052246094, "global_step": 287998, "epoch": 3469} {"train_loss": -25.9993839263916, "global_step": 287999, "epoch": 3469} {"train_loss": -25.65479850769043, "global_step": 288000, "epoch": 3469} {"train_loss": -25.722265243530273, "global_step": 288001, "epoch": 3469} {"train_loss": -25.76783561706543, "global_step": 288002, "epoch": 3469} {"train_loss": -25.504220962524414, "global_step": 288003, "epoch": 3469} {"train_loss": -25.59366226196289, "global_step": 288004, "epoch": 3469} {"train_loss": -25.48404884338379, "global_step": 288005, "epoch": 3469} {"train_loss": -25.861499786376953, "global_step": 288006, "epoch": 3469} {"train_loss": -25.715045928955078, "global_step": 288007, "epoch": 3469} {"train_loss": -25.671430587768555, "global_step": 288008, "epoch": 3469} {"train_loss": -25.500084222081195, "global_step": 288009, "epoch": 3469, "val_loss": 7158603.0} {"train_loss": -25.112363815307617, "global_step": 288010, "epoch": 3470} {"train_loss": -23.643585205078125, "global_step": 288011, "epoch": 3470} {"train_loss": -24.38886833190918, "global_step": 288012, "epoch": 3470} {"train_loss": -24.714147567749023, "global_step": 288013, "epoch": 3470} {"train_loss": -24.91328239440918, "global_step": 288014, "epoch": 3470} {"train_loss": -24.43964958190918, "global_step": 288015, "epoch": 3470} {"train_loss": -25.21329116821289, "global_step": 288016, "epoch": 3470} {"train_loss": -25.095741271972656, "global_step": 288017, "epoch": 3470} {"train_loss": -24.994298934936523, "global_step": 288018, "epoch": 3470} {"train_loss": -24.787857055664062, "global_step": 288019, "epoch": 3470} {"train_loss": -24.902727127075195, "global_step": 288020, "epoch": 3470} {"train_loss": -24.969287872314453, "global_step": 288021, "epoch": 3470} {"train_loss": -25.10257911682129, "global_step": 288022, "epoch": 3470} {"train_loss": -24.84231948852539, "global_step": 288023, "epoch": 3470} {"train_loss": -24.805387496948242, "global_step": 288024, "epoch": 3470} {"train_loss": -25.112613677978516, "global_step": 288025, "epoch": 3470} {"train_loss": -24.942691802978516, "global_step": 288026, "epoch": 3470} {"train_loss": -25.286762237548828, "global_step": 288027, "epoch": 3470} {"train_loss": -25.356172561645508, "global_step": 288028, "epoch": 3470} {"train_loss": -25.242698669433594, "global_step": 288029, "epoch": 3470} {"train_loss": -25.327852249145508, "global_step": 288030, "epoch": 3470} {"train_loss": -25.261199951171875, "global_step": 288031, "epoch": 3470} {"train_loss": -25.232025146484375, "global_step": 288032, "epoch": 3470} {"train_loss": -25.13492202758789, "global_step": 288033, "epoch": 3470} {"train_loss": -24.846139907836914, "global_step": 288034, "epoch": 3470} {"train_loss": -25.423789978027344, "global_step": 288035, "epoch": 3470} {"train_loss": -25.310123443603516, "global_step": 288036, "epoch": 3470} {"train_loss": -25.312896728515625, "global_step": 288037, "epoch": 3470} {"train_loss": -25.1572322845459, "global_step": 288038, "epoch": 3470} {"train_loss": -25.18486785888672, "global_step": 288039, "epoch": 3470} {"train_loss": -25.470487594604492, "global_step": 288040, "epoch": 3470} {"train_loss": -25.339780807495117, "global_step": 288041, "epoch": 3470} {"train_loss": -25.60501480102539, "global_step": 288042, "epoch": 3470} {"train_loss": -25.17573356628418, "global_step": 288043, "epoch": 3470} {"train_loss": -25.287614822387695, "global_step": 288044, "epoch": 3470} {"train_loss": -25.6208438873291, "global_step": 288045, "epoch": 3470} {"train_loss": -25.29075050354004, "global_step": 288046, "epoch": 3470} {"train_loss": -25.44788932800293, "global_step": 288047, "epoch": 3470} {"train_loss": -25.855321884155273, "global_step": 288048, "epoch": 3470} {"train_loss": -25.801593780517578, "global_step": 288049, "epoch": 3470} {"train_loss": -25.7985782623291, "global_step": 288050, "epoch": 3470} {"train_loss": -25.426088333129883, "global_step": 288051, "epoch": 3470} {"train_loss": -25.72904396057129, "global_step": 288052, "epoch": 3470} {"train_loss": -25.606464385986328, "global_step": 288053, "epoch": 3470} {"train_loss": -25.468975067138672, "global_step": 288054, "epoch": 3470} {"train_loss": -25.40779685974121, "global_step": 288055, "epoch": 3470} {"train_loss": -25.733007431030273, "global_step": 288056, "epoch": 3470} {"train_loss": -25.757116317749023, "global_step": 288057, "epoch": 3470} {"train_loss": -25.37467384338379, "global_step": 288058, "epoch": 3470} {"train_loss": -25.30376434326172, "global_step": 288059, "epoch": 3470} {"train_loss": -25.389820098876953, "global_step": 288060, "epoch": 3470} {"train_loss": -25.532766342163086, "global_step": 288061, "epoch": 3470} {"train_loss": -25.518156051635742, "global_step": 288062, "epoch": 3470} {"train_loss": -25.66595458984375, "global_step": 288063, "epoch": 3470} {"train_loss": -25.9289608001709, "global_step": 288064, "epoch": 3470} {"train_loss": -25.47848892211914, "global_step": 288065, "epoch": 3470} {"train_loss": -25.625879287719727, "global_step": 288066, "epoch": 3470} {"train_loss": -25.280004501342773, "global_step": 288067, "epoch": 3470} {"train_loss": -25.262292861938477, "global_step": 288068, "epoch": 3470} {"train_loss": -25.178442001342773, "global_step": 288069, "epoch": 3470} {"train_loss": -25.30205535888672, "global_step": 288070, "epoch": 3470} {"train_loss": -25.403310775756836, "global_step": 288071, "epoch": 3470} {"train_loss": -25.058963775634766, "global_step": 288072, "epoch": 3470} {"train_loss": -25.536090850830078, "global_step": 288073, "epoch": 3470} {"train_loss": -25.22895622253418, "global_step": 288074, "epoch": 3470} {"train_loss": -25.284727096557617, "global_step": 288075, "epoch": 3470} {"train_loss": -25.621923446655273, "global_step": 288076, "epoch": 3470} {"train_loss": -25.2956600189209, "global_step": 288077, "epoch": 3470} {"train_loss": -25.564716339111328, "global_step": 288078, "epoch": 3470} {"train_loss": -25.59069061279297, "global_step": 288079, "epoch": 3470} {"train_loss": -25.57703399658203, "global_step": 288080, "epoch": 3470} {"train_loss": -25.447734832763672, "global_step": 288081, "epoch": 3470} {"train_loss": -25.89459228515625, "global_step": 288082, "epoch": 3470} {"train_loss": -25.448482513427734, "global_step": 288083, "epoch": 3470} {"train_loss": -25.946369171142578, "global_step": 288084, "epoch": 3470} {"train_loss": -25.600589752197266, "global_step": 288085, "epoch": 3470} {"train_loss": -25.519763946533203, "global_step": 288086, "epoch": 3470} {"train_loss": -25.46668815612793, "global_step": 288087, "epoch": 3470} {"train_loss": -25.812713623046875, "global_step": 288088, "epoch": 3470} {"train_loss": -25.433134078979492, "global_step": 288089, "epoch": 3470} {"train_loss": -25.77199363708496, "global_step": 288090, "epoch": 3470} {"train_loss": -25.378198623657227, "global_step": 288091, "epoch": 3470} {"train_loss": -25.337608957865154, "global_step": 288092, "epoch": 3470, "val_loss": 7068220.0} {"train_loss": -23.945566177368164, "global_step": 288093, "epoch": 3471} {"train_loss": -23.6956787109375, "global_step": 288094, "epoch": 3471} {"train_loss": -23.76107406616211, "global_step": 288095, "epoch": 3471} {"train_loss": -24.853158950805664, "global_step": 288096, "epoch": 3471} {"train_loss": -24.7099609375, "global_step": 288097, "epoch": 3471} {"train_loss": -24.401060104370117, "global_step": 288098, "epoch": 3471} {"train_loss": -24.84391212463379, "global_step": 288099, "epoch": 3471} {"train_loss": -24.66531753540039, "global_step": 288100, "epoch": 3471} {"train_loss": -24.990591049194336, "global_step": 288101, "epoch": 3471} {"train_loss": -25.04931640625, "global_step": 288102, "epoch": 3471} {"train_loss": -25.015583038330078, "global_step": 288103, "epoch": 3471} {"train_loss": -24.963071823120117, "global_step": 288104, "epoch": 3471} {"train_loss": -24.748104095458984, "global_step": 288105, "epoch": 3471} {"train_loss": -25.04151725769043, "global_step": 288106, "epoch": 3471} {"train_loss": -24.820322036743164, "global_step": 288107, "epoch": 3471} {"train_loss": -25.18433952331543, "global_step": 288108, "epoch": 3471} {"train_loss": -25.192625045776367, "global_step": 288109, "epoch": 3471} {"train_loss": -25.15909767150879, "global_step": 288110, "epoch": 3471} {"train_loss": -24.8612117767334, "global_step": 288111, "epoch": 3471} {"train_loss": -24.828298568725586, "global_step": 288112, "epoch": 3471} {"train_loss": -24.945398330688477, "global_step": 288113, "epoch": 3471} {"train_loss": -24.907310485839844, "global_step": 288114, "epoch": 3471} {"train_loss": -25.117055892944336, "global_step": 288115, "epoch": 3471} {"train_loss": -25.380746841430664, "global_step": 288116, "epoch": 3471} {"train_loss": -25.25656509399414, "global_step": 288117, "epoch": 3471} {"train_loss": -25.36509895324707, "global_step": 288118, "epoch": 3471} {"train_loss": -25.55875587463379, "global_step": 288119, "epoch": 3471} {"train_loss": -25.339683532714844, "global_step": 288120, "epoch": 3471} {"train_loss": -25.180776596069336, "global_step": 288121, "epoch": 3471} {"train_loss": -25.07025718688965, "global_step": 288122, "epoch": 3471} {"train_loss": -25.186016082763672, "global_step": 288123, "epoch": 3471} {"train_loss": -25.614917755126953, "global_step": 288124, "epoch": 3471} {"train_loss": -25.551023483276367, "global_step": 288125, "epoch": 3471} {"train_loss": -25.22806739807129, "global_step": 288126, "epoch": 3471} {"train_loss": -25.72574806213379, "global_step": 288127, "epoch": 3471} {"train_loss": -25.250925064086914, "global_step": 288128, "epoch": 3471} {"train_loss": -25.49249839782715, "global_step": 288129, "epoch": 3471} {"train_loss": -25.453561782836914, "global_step": 288130, "epoch": 3471} {"train_loss": -25.55525016784668, "global_step": 288131, "epoch": 3471} {"train_loss": -25.116931915283203, "global_step": 288132, "epoch": 3471} {"train_loss": -25.874622344970703, "global_step": 288133, "epoch": 3471} {"train_loss": -25.508331298828125, "global_step": 288134, "epoch": 3471} {"train_loss": -25.519298553466797, "global_step": 288135, "epoch": 3471} {"train_loss": -25.42898178100586, "global_step": 288136, "epoch": 3471} {"train_loss": -25.46990966796875, "global_step": 288137, "epoch": 3471} {"train_loss": -25.812246322631836, "global_step": 288138, "epoch": 3471} {"train_loss": -25.609378814697266, "global_step": 288139, "epoch": 3471} {"train_loss": -25.731733322143555, "global_step": 288140, "epoch": 3471} {"train_loss": -25.512798309326172, "global_step": 288141, "epoch": 3471} {"train_loss": -25.54542350769043, "global_step": 288142, "epoch": 3471} {"train_loss": -25.3621883392334, "global_step": 288143, "epoch": 3471} {"train_loss": -25.192707061767578, "global_step": 288144, "epoch": 3471} {"train_loss": -24.972640991210938, "global_step": 288145, "epoch": 3471} {"train_loss": -24.890762329101562, "global_step": 288146, "epoch": 3471} {"train_loss": -24.979415893554688, "global_step": 288147, "epoch": 3471} {"train_loss": -24.981836318969727, "global_step": 288148, "epoch": 3471} {"train_loss": -25.066091537475586, "global_step": 288149, "epoch": 3471} {"train_loss": -25.435928344726562, "global_step": 288150, "epoch": 3471} {"train_loss": -25.469247817993164, "global_step": 288151, "epoch": 3471} {"train_loss": -25.17976188659668, "global_step": 288152, "epoch": 3471} {"train_loss": -25.755573272705078, "global_step": 288153, "epoch": 3471} {"train_loss": -25.824472427368164, "global_step": 288154, "epoch": 3471} {"train_loss": -25.5889835357666, "global_step": 288155, "epoch": 3471} {"train_loss": -25.481143951416016, "global_step": 288156, "epoch": 3471} {"train_loss": -25.625320434570312, "global_step": 288157, "epoch": 3471} {"train_loss": -25.571033477783203, "global_step": 288158, "epoch": 3471} {"train_loss": -25.287036895751953, "global_step": 288159, "epoch": 3471} {"train_loss": -25.24496078491211, "global_step": 288160, "epoch": 3471} {"train_loss": -25.468412399291992, "global_step": 288161, "epoch": 3471} {"train_loss": -25.378284454345703, "global_step": 288162, "epoch": 3471} {"train_loss": -25.52543830871582, "global_step": 288163, "epoch": 3471} {"train_loss": -25.721689224243164, "global_step": 288164, "epoch": 3471} {"train_loss": -25.627307891845703, "global_step": 288165, "epoch": 3471} {"train_loss": -25.75443458557129, "global_step": 288166, "epoch": 3471} {"train_loss": -25.665002822875977, "global_step": 288167, "epoch": 3471} {"train_loss": -25.668292999267578, "global_step": 288168, "epoch": 3471} {"train_loss": -25.42031478881836, "global_step": 288169, "epoch": 3471} {"train_loss": -25.43411636352539, "global_step": 288170, "epoch": 3471} {"train_loss": -25.5828857421875, "global_step": 288171, "epoch": 3471} {"train_loss": -25.680500030517578, "global_step": 288172, "epoch": 3471} {"train_loss": -25.363428115844727, "global_step": 288173, "epoch": 3471} {"train_loss": -25.36079978942871, "global_step": 288174, "epoch": 3471} {"train_loss": -25.252423228987727, "global_step": 288175, "epoch": 3471, "val_loss": 7143695.0} {"train_loss": -24.766721725463867, "global_step": 288176, "epoch": 3472} {"train_loss": -24.730791091918945, "global_step": 288177, "epoch": 3472} {"train_loss": -25.0886287689209, "global_step": 288178, "epoch": 3472} {"train_loss": -24.9301815032959, "global_step": 288179, "epoch": 3472} {"train_loss": -24.802988052368164, "global_step": 288180, "epoch": 3472} {"train_loss": -25.04418182373047, "global_step": 288181, "epoch": 3472} {"train_loss": -24.951282501220703, "global_step": 288182, "epoch": 3472} {"train_loss": -25.583467483520508, "global_step": 288183, "epoch": 3472} {"train_loss": -25.124303817749023, "global_step": 288184, "epoch": 3472} {"train_loss": -25.24383544921875, "global_step": 288185, "epoch": 3472} {"train_loss": -25.04684066772461, "global_step": 288186, "epoch": 3472} {"train_loss": -25.525476455688477, "global_step": 288187, "epoch": 3472} {"train_loss": -25.045774459838867, "global_step": 288188, "epoch": 3472} {"train_loss": -24.98517608642578, "global_step": 288189, "epoch": 3472} {"train_loss": -25.09579849243164, "global_step": 288190, "epoch": 3472} {"train_loss": -25.135839462280273, "global_step": 288191, "epoch": 3472} {"train_loss": -24.788320541381836, "global_step": 288192, "epoch": 3472} {"train_loss": -25.341054916381836, "global_step": 288193, "epoch": 3472} {"train_loss": -25.181856155395508, "global_step": 288194, "epoch": 3472} {"train_loss": -25.354806900024414, "global_step": 288195, "epoch": 3472} {"train_loss": -25.32022476196289, "global_step": 288196, "epoch": 3472} {"train_loss": -25.295541763305664, "global_step": 288197, "epoch": 3472} {"train_loss": -25.16194725036621, "global_step": 288198, "epoch": 3472} {"train_loss": -25.251800537109375, "global_step": 288199, "epoch": 3472} {"train_loss": -25.112218856811523, "global_step": 288200, "epoch": 3472} {"train_loss": -25.51125144958496, "global_step": 288201, "epoch": 3472} {"train_loss": -25.210004806518555, "global_step": 288202, "epoch": 3472} {"train_loss": -25.1611385345459, "global_step": 288203, "epoch": 3472} {"train_loss": -25.4962158203125, "global_step": 288204, "epoch": 3472} {"train_loss": -25.35987663269043, "global_step": 288205, "epoch": 3472} {"train_loss": -25.43294334411621, "global_step": 288206, "epoch": 3472} {"train_loss": -25.634435653686523, "global_step": 288207, "epoch": 3472} {"train_loss": -25.301576614379883, "global_step": 288208, "epoch": 3472} {"train_loss": -25.232440948486328, "global_step": 288209, "epoch": 3472} {"train_loss": -25.60821533203125, "global_step": 288210, "epoch": 3472} {"train_loss": -25.5404109954834, "global_step": 288211, "epoch": 3472} {"train_loss": -25.60480308532715, "global_step": 288212, "epoch": 3472} {"train_loss": -25.383140563964844, "global_step": 288213, "epoch": 3472} {"train_loss": -25.150842666625977, "global_step": 288214, "epoch": 3472} {"train_loss": -25.518220901489258, "global_step": 288215, "epoch": 3472} {"train_loss": -25.549081802368164, "global_step": 288216, "epoch": 3472} {"train_loss": -25.619962692260742, "global_step": 288217, "epoch": 3472} {"train_loss": -25.954877853393555, "global_step": 288218, "epoch": 3472} {"train_loss": -25.67744255065918, "global_step": 288219, "epoch": 3472} {"train_loss": -25.456218719482422, "global_step": 288220, "epoch": 3472} {"train_loss": -25.548460006713867, "global_step": 288221, "epoch": 3472} {"train_loss": -25.478296279907227, "global_step": 288222, "epoch": 3472} {"train_loss": -25.554601669311523, "global_step": 288223, "epoch": 3472} {"train_loss": -25.506473541259766, "global_step": 288224, "epoch": 3472} {"train_loss": -25.60546875, "global_step": 288225, "epoch": 3472} {"train_loss": -25.79123306274414, "global_step": 288226, "epoch": 3472} {"train_loss": -25.671649932861328, "global_step": 288227, "epoch": 3472} {"train_loss": -25.92097282409668, "global_step": 288228, "epoch": 3472} {"train_loss": -25.59621238708496, "global_step": 288229, "epoch": 3472} {"train_loss": -25.831602096557617, "global_step": 288230, "epoch": 3472} {"train_loss": -25.681201934814453, "global_step": 288231, "epoch": 3472} {"train_loss": -25.81928825378418, "global_step": 288232, "epoch": 3472} {"train_loss": -25.73237419128418, "global_step": 288233, "epoch": 3472} {"train_loss": -26.087921142578125, "global_step": 288234, "epoch": 3472} {"train_loss": -25.74566078186035, "global_step": 288235, "epoch": 3472} {"train_loss": -25.952777862548828, "global_step": 288236, "epoch": 3472} {"train_loss": -25.76539421081543, "global_step": 288237, "epoch": 3472} {"train_loss": -25.467466354370117, "global_step": 288238, "epoch": 3472} {"train_loss": -25.83884048461914, "global_step": 288239, "epoch": 3472} {"train_loss": -25.63986587524414, "global_step": 288240, "epoch": 3472} {"train_loss": -25.49928855895996, "global_step": 288241, "epoch": 3472} {"train_loss": -25.176881790161133, "global_step": 288242, "epoch": 3472} {"train_loss": -25.427352905273438, "global_step": 288243, "epoch": 3472} {"train_loss": -25.67486572265625, "global_step": 288244, "epoch": 3472} {"train_loss": -25.570066452026367, "global_step": 288245, "epoch": 3472} {"train_loss": -25.18428611755371, "global_step": 288246, "epoch": 3472} {"train_loss": -25.399900436401367, "global_step": 288247, "epoch": 3472} {"train_loss": -25.050947189331055, "global_step": 288248, "epoch": 3472} {"train_loss": -24.663190841674805, "global_step": 288249, "epoch": 3472} {"train_loss": -24.986278533935547, "global_step": 288250, "epoch": 3472} {"train_loss": -25.58576011657715, "global_step": 288251, "epoch": 3472} {"train_loss": -24.888200759887695, "global_step": 288252, "epoch": 3472} {"train_loss": -25.2001953125, "global_step": 288253, "epoch": 3472} {"train_loss": -25.364044189453125, "global_step": 288254, "epoch": 3472} {"train_loss": -25.646331787109375, "global_step": 288255, "epoch": 3472} {"train_loss": -25.523893356323242, "global_step": 288256, "epoch": 3472} {"train_loss": -25.511474609375, "global_step": 288257, "epoch": 3472} {"train_loss": -25.37273997571095, "global_step": 288258, "epoch": 3472, "val_loss": 7094728.5} {"train_loss": -23.520408630371094, "global_step": 288259, "epoch": 3473} {"train_loss": -24.8518123626709, "global_step": 288260, "epoch": 3473} {"train_loss": -23.86350440979004, "global_step": 288261, "epoch": 3473} {"train_loss": -24.180301666259766, "global_step": 288262, "epoch": 3473} {"train_loss": -24.443490982055664, "global_step": 288263, "epoch": 3473} {"train_loss": -24.32067108154297, "global_step": 288264, "epoch": 3473} {"train_loss": -24.769912719726562, "global_step": 288265, "epoch": 3473} {"train_loss": -24.342817306518555, "global_step": 288266, "epoch": 3473} {"train_loss": -24.35647964477539, "global_step": 288267, "epoch": 3473} {"train_loss": -24.516637802124023, "global_step": 288268, "epoch": 3473} {"train_loss": -24.613880157470703, "global_step": 288269, "epoch": 3473} {"train_loss": -24.833335876464844, "global_step": 288270, "epoch": 3473} {"train_loss": -24.783735275268555, "global_step": 288271, "epoch": 3473} {"train_loss": -24.597810745239258, "global_step": 288272, "epoch": 3473} {"train_loss": -24.886028289794922, "global_step": 288273, "epoch": 3473} {"train_loss": -24.7542667388916, "global_step": 288274, "epoch": 3473} {"train_loss": -25.08003044128418, "global_step": 288275, "epoch": 3473} {"train_loss": -24.50591468811035, "global_step": 288276, "epoch": 3473} {"train_loss": -24.8754940032959, "global_step": 288277, "epoch": 3473} {"train_loss": -24.730792999267578, "global_step": 288278, "epoch": 3473} {"train_loss": -24.973609924316406, "global_step": 288279, "epoch": 3473} {"train_loss": -25.220935821533203, "global_step": 288280, "epoch": 3473} {"train_loss": -25.1107177734375, "global_step": 288281, "epoch": 3473} {"train_loss": -24.896852493286133, "global_step": 288282, "epoch": 3473} {"train_loss": -25.307287216186523, "global_step": 288283, "epoch": 3473} {"train_loss": -24.8388614654541, "global_step": 288284, "epoch": 3473} {"train_loss": -25.221637725830078, "global_step": 288285, "epoch": 3473} {"train_loss": -24.82362174987793, "global_step": 288286, "epoch": 3473} {"train_loss": -25.23603630065918, "global_step": 288287, "epoch": 3473} {"train_loss": -25.444141387939453, "global_step": 288288, "epoch": 3473} {"train_loss": -25.099332809448242, "global_step": 288289, "epoch": 3473} {"train_loss": -25.521453857421875, "global_step": 288290, "epoch": 3473} {"train_loss": -25.142606735229492, "global_step": 288291, "epoch": 3473} {"train_loss": -25.22515106201172, "global_step": 288292, "epoch": 3473} {"train_loss": -25.338376998901367, "global_step": 288293, "epoch": 3473} {"train_loss": -25.067691802978516, "global_step": 288294, "epoch": 3473} {"train_loss": -25.265527725219727, "global_step": 288295, "epoch": 3473} {"train_loss": -25.30611228942871, "global_step": 288296, "epoch": 3473} {"train_loss": -25.689483642578125, "global_step": 288297, "epoch": 3473} {"train_loss": -25.673582077026367, "global_step": 288298, "epoch": 3473} {"train_loss": -25.438867568969727, "global_step": 288299, "epoch": 3473} {"train_loss": -25.586084365844727, "global_step": 288300, "epoch": 3473} {"train_loss": -25.45119285583496, "global_step": 288301, "epoch": 3473} {"train_loss": -25.54509925842285, "global_step": 288302, "epoch": 3473} {"train_loss": -25.475894927978516, "global_step": 288303, "epoch": 3473} {"train_loss": -25.48813247680664, "global_step": 288304, "epoch": 3473} {"train_loss": -25.46851921081543, "global_step": 288305, "epoch": 3473} {"train_loss": -25.510164260864258, "global_step": 288306, "epoch": 3473} {"train_loss": -25.56364631652832, "global_step": 288307, "epoch": 3473} {"train_loss": -25.466333389282227, "global_step": 288308, "epoch": 3473} {"train_loss": -25.6202449798584, "global_step": 288309, "epoch": 3473} {"train_loss": -25.863143920898438, "global_step": 288310, "epoch": 3473} {"train_loss": -25.6999568939209, "global_step": 288311, "epoch": 3473} {"train_loss": -25.59293556213379, "global_step": 288312, "epoch": 3473} {"train_loss": -25.664533615112305, "global_step": 288313, "epoch": 3473} {"train_loss": -25.6806640625, "global_step": 288314, "epoch": 3473} {"train_loss": -25.549104690551758, "global_step": 288315, "epoch": 3473} {"train_loss": -25.416019439697266, "global_step": 288316, "epoch": 3473} {"train_loss": -25.13335609436035, "global_step": 288317, "epoch": 3473} {"train_loss": -25.385496139526367, "global_step": 288318, "epoch": 3473} {"train_loss": -25.48736572265625, "global_step": 288319, "epoch": 3473} {"train_loss": -25.508150100708008, "global_step": 288320, "epoch": 3473} {"train_loss": -25.757049560546875, "global_step": 288321, "epoch": 3473} {"train_loss": -25.44013786315918, "global_step": 288322, "epoch": 3473} {"train_loss": -25.677387237548828, "global_step": 288323, "epoch": 3473} {"train_loss": -25.736801147460938, "global_step": 288324, "epoch": 3473} {"train_loss": -25.622766494750977, "global_step": 288325, "epoch": 3473} {"train_loss": -25.392663955688477, "global_step": 288326, "epoch": 3473} {"train_loss": -25.654890060424805, "global_step": 288327, "epoch": 3473} {"train_loss": -25.913293838500977, "global_step": 288328, "epoch": 3473} {"train_loss": -25.7763729095459, "global_step": 288329, "epoch": 3473} {"train_loss": -25.58864974975586, "global_step": 288330, "epoch": 3473} {"train_loss": -25.468473434448242, "global_step": 288331, "epoch": 3473} {"train_loss": -25.08489227294922, "global_step": 288332, "epoch": 3473} {"train_loss": -25.57059669494629, "global_step": 288333, "epoch": 3473} {"train_loss": -25.740161895751953, "global_step": 288334, "epoch": 3473} {"train_loss": -25.42021942138672, "global_step": 288335, "epoch": 3473} {"train_loss": -25.036361694335938, "global_step": 288336, "epoch": 3473} {"train_loss": -25.39814567565918, "global_step": 288337, "epoch": 3473} {"train_loss": -25.829252243041992, "global_step": 288338, "epoch": 3473} {"train_loss": -25.408926010131836, "global_step": 288339, "epoch": 3473} {"train_loss": -25.502784729003906, "global_step": 288340, "epoch": 3473} {"train_loss": -25.209562209715326, "global_step": 288341, "epoch": 3473, "val_loss": 7119931.5} {"train_loss": -24.391904830932617, "global_step": 288342, "epoch": 3474} {"train_loss": -24.643022537231445, "global_step": 288343, "epoch": 3474} {"train_loss": -24.6491756439209, "global_step": 288344, "epoch": 3474} {"train_loss": -25.02760887145996, "global_step": 288345, "epoch": 3474} {"train_loss": -24.855045318603516, "global_step": 288346, "epoch": 3474} {"train_loss": -24.335683822631836, "global_step": 288347, "epoch": 3474} {"train_loss": -24.71701431274414, "global_step": 288348, "epoch": 3474} {"train_loss": -25.006067276000977, "global_step": 288349, "epoch": 3474} {"train_loss": -24.94623374938965, "global_step": 288350, "epoch": 3474} {"train_loss": -24.87871551513672, "global_step": 288351, "epoch": 3474} {"train_loss": -25.20519256591797, "global_step": 288352, "epoch": 3474} {"train_loss": -25.557886123657227, "global_step": 288353, "epoch": 3474} {"train_loss": -25.206863403320312, "global_step": 288354, "epoch": 3474} {"train_loss": -25.8879451751709, "global_step": 288355, "epoch": 3474} {"train_loss": -25.61968994140625, "global_step": 288356, "epoch": 3474} {"train_loss": -25.24051856994629, "global_step": 288357, "epoch": 3474} {"train_loss": -25.300676345825195, "global_step": 288358, "epoch": 3474} {"train_loss": -25.21221923828125, "global_step": 288359, "epoch": 3474} {"train_loss": -25.146530151367188, "global_step": 288360, "epoch": 3474} {"train_loss": -25.429645538330078, "global_step": 288361, "epoch": 3474} {"train_loss": -25.6490421295166, "global_step": 288362, "epoch": 3474} {"train_loss": -25.40742301940918, "global_step": 288363, "epoch": 3474} {"train_loss": -25.769641876220703, "global_step": 288364, "epoch": 3474} {"train_loss": -25.28474235534668, "global_step": 288365, "epoch": 3474} {"train_loss": -25.410390853881836, "global_step": 288366, "epoch": 3474} {"train_loss": -25.735260009765625, "global_step": 288367, "epoch": 3474} {"train_loss": -25.661291122436523, "global_step": 288368, "epoch": 3474} {"train_loss": -25.771570205688477, "global_step": 288369, "epoch": 3474} {"train_loss": -25.765979766845703, "global_step": 288370, "epoch": 3474} {"train_loss": -25.645709991455078, "global_step": 288371, "epoch": 3474} {"train_loss": -25.35336685180664, "global_step": 288372, "epoch": 3474} {"train_loss": -25.444433212280273, "global_step": 288373, "epoch": 3474} {"train_loss": -25.6074275970459, "global_step": 288374, "epoch": 3474} {"train_loss": -25.428701400756836, "global_step": 288375, "epoch": 3474} {"train_loss": -25.591842651367188, "global_step": 288376, "epoch": 3474} {"train_loss": -25.70454216003418, "global_step": 288377, "epoch": 3474} {"train_loss": -25.847015380859375, "global_step": 288378, "epoch": 3474} {"train_loss": -25.705570220947266, "global_step": 288379, "epoch": 3474} {"train_loss": -25.23968505859375, "global_step": 288380, "epoch": 3474} {"train_loss": -25.43647003173828, "global_step": 288381, "epoch": 3474} {"train_loss": -25.653318405151367, "global_step": 288382, "epoch": 3474} {"train_loss": -25.689783096313477, "global_step": 288383, "epoch": 3474} {"train_loss": -25.397357940673828, "global_step": 288384, "epoch": 3474} {"train_loss": -25.343841552734375, "global_step": 288385, "epoch": 3474} {"train_loss": -25.673864364624023, "global_step": 288386, "epoch": 3474} {"train_loss": -25.68682289123535, "global_step": 288387, "epoch": 3474} {"train_loss": -25.388446807861328, "global_step": 288388, "epoch": 3474} {"train_loss": -25.666736602783203, "global_step": 288389, "epoch": 3474} {"train_loss": -25.513113021850586, "global_step": 288390, "epoch": 3474} {"train_loss": -25.736753463745117, "global_step": 288391, "epoch": 3474} {"train_loss": -25.485883712768555, "global_step": 288392, "epoch": 3474} {"train_loss": -25.457937240600586, "global_step": 288393, "epoch": 3474} {"train_loss": -25.344167709350586, "global_step": 288394, "epoch": 3474} {"train_loss": -25.366493225097656, "global_step": 288395, "epoch": 3474} {"train_loss": -25.673437118530273, "global_step": 288396, "epoch": 3474} {"train_loss": -25.602087020874023, "global_step": 288397, "epoch": 3474} {"train_loss": -25.916379928588867, "global_step": 288398, "epoch": 3474} {"train_loss": -25.26943016052246, "global_step": 288399, "epoch": 3474} {"train_loss": -25.236112594604492, "global_step": 288400, "epoch": 3474} {"train_loss": -25.40873146057129, "global_step": 288401, "epoch": 3474} {"train_loss": -25.701583862304688, "global_step": 288402, "epoch": 3474} {"train_loss": -25.98927116394043, "global_step": 288403, "epoch": 3474} {"train_loss": -25.87566566467285, "global_step": 288404, "epoch": 3474} {"train_loss": -25.796232223510742, "global_step": 288405, "epoch": 3474} {"train_loss": -25.337589263916016, "global_step": 288406, "epoch": 3474} {"train_loss": -25.716550827026367, "global_step": 288407, "epoch": 3474} {"train_loss": -25.474605560302734, "global_step": 288408, "epoch": 3474} {"train_loss": -25.48596954345703, "global_step": 288409, "epoch": 3474} {"train_loss": -25.897796630859375, "global_step": 288410, "epoch": 3474} {"train_loss": -25.916730880737305, "global_step": 288411, "epoch": 3474} {"train_loss": -25.434717178344727, "global_step": 288412, "epoch": 3474} {"train_loss": -25.894006729125977, "global_step": 288413, "epoch": 3474} {"train_loss": -25.638036727905273, "global_step": 288414, "epoch": 3474} {"train_loss": -25.740137100219727, "global_step": 288415, "epoch": 3474} {"train_loss": -25.70745849609375, "global_step": 288416, "epoch": 3474} {"train_loss": -25.804107666015625, "global_step": 288417, "epoch": 3474} {"train_loss": -25.59840965270996, "global_step": 288418, "epoch": 3474} {"train_loss": -25.673337936401367, "global_step": 288419, "epoch": 3474} {"train_loss": -25.830305099487305, "global_step": 288420, "epoch": 3474} {"train_loss": -25.83631706237793, "global_step": 288421, "epoch": 3474} {"train_loss": -25.544231414794922, "global_step": 288422, "epoch": 3474} {"train_loss": -25.989322662353516, "global_step": 288423, "epoch": 3474} {"train_loss": -25.48445327023426, "global_step": 288424, "epoch": 3474, "val_loss": 7070168.0} {"train_loss": -25.149383544921875, "global_step": 288425, "epoch": 3475} {"train_loss": -25.7650146484375, "global_step": 288426, "epoch": 3475} {"train_loss": -25.69331932067871, "global_step": 288427, "epoch": 3475} {"train_loss": -25.47712516784668, "global_step": 288428, "epoch": 3475} {"train_loss": -25.305908203125, "global_step": 288429, "epoch": 3475} {"train_loss": -25.56106185913086, "global_step": 288430, "epoch": 3475} {"train_loss": -25.36528778076172, "global_step": 288431, "epoch": 3475} {"train_loss": -25.617328643798828, "global_step": 288432, "epoch": 3475} {"train_loss": -25.07038688659668, "global_step": 288433, "epoch": 3475} {"train_loss": -25.600584030151367, "global_step": 288434, "epoch": 3475} {"train_loss": -25.304025650024414, "global_step": 288435, "epoch": 3475} {"train_loss": -25.44893455505371, "global_step": 288436, "epoch": 3475} {"train_loss": -25.653411865234375, "global_step": 288437, "epoch": 3475} {"train_loss": -25.589385986328125, "global_step": 288438, "epoch": 3475} {"train_loss": -25.579599380493164, "global_step": 288439, "epoch": 3475} {"train_loss": -25.884784698486328, "global_step": 288440, "epoch": 3475} {"train_loss": -25.75356101989746, "global_step": 288441, "epoch": 3475} {"train_loss": -25.19947624206543, "global_step": 288442, "epoch": 3475} {"train_loss": -25.493839263916016, "global_step": 288443, "epoch": 3475} {"train_loss": -24.936548233032227, "global_step": 288444, "epoch": 3475} {"train_loss": -25.7841739654541, "global_step": 288445, "epoch": 3475} {"train_loss": -25.074270248413086, "global_step": 288446, "epoch": 3475} {"train_loss": -25.570499420166016, "global_step": 288447, "epoch": 3475} {"train_loss": -25.37632179260254, "global_step": 288448, "epoch": 3475} {"train_loss": -25.228010177612305, "global_step": 288449, "epoch": 3475} {"train_loss": -25.374908447265625, "global_step": 288450, "epoch": 3475} {"train_loss": -25.716405868530273, "global_step": 288451, "epoch": 3475} {"train_loss": -25.298559188842773, "global_step": 288452, "epoch": 3475} {"train_loss": -25.285175323486328, "global_step": 288453, "epoch": 3475} {"train_loss": -25.598257064819336, "global_step": 288454, "epoch": 3475} {"train_loss": -25.671875, "global_step": 288455, "epoch": 3475} {"train_loss": -25.726825714111328, "global_step": 288456, "epoch": 3475} {"train_loss": -25.558340072631836, "global_step": 288457, "epoch": 3475} {"train_loss": -25.5205135345459, "global_step": 288458, "epoch": 3475} {"train_loss": -25.80734634399414, "global_step": 288459, "epoch": 3475} {"train_loss": -25.47052001953125, "global_step": 288460, "epoch": 3475} {"train_loss": -25.786518096923828, "global_step": 288461, "epoch": 3475} {"train_loss": -25.544082641601562, "global_step": 288462, "epoch": 3475} {"train_loss": -25.743627548217773, "global_step": 288463, "epoch": 3475} {"train_loss": -25.445091247558594, "global_step": 288464, "epoch": 3475} {"train_loss": -25.383731842041016, "global_step": 288465, "epoch": 3475} {"train_loss": -25.736120223999023, "global_step": 288466, "epoch": 3475} {"train_loss": -25.665616989135742, "global_step": 288467, "epoch": 3475} {"train_loss": -25.603591918945312, "global_step": 288468, "epoch": 3475} {"train_loss": -25.684110641479492, "global_step": 288469, "epoch": 3475} {"train_loss": -25.58392333984375, "global_step": 288470, "epoch": 3475} {"train_loss": -25.5443115234375, "global_step": 288471, "epoch": 3475} {"train_loss": -25.449880599975586, "global_step": 288472, "epoch": 3475} {"train_loss": -25.537946701049805, "global_step": 288473, "epoch": 3475} {"train_loss": -25.40833854675293, "global_step": 288474, "epoch": 3475} {"train_loss": -25.714643478393555, "global_step": 288475, "epoch": 3475} {"train_loss": -25.661039352416992, "global_step": 288476, "epoch": 3475} {"train_loss": -25.790491104125977, "global_step": 288477, "epoch": 3475} {"train_loss": -25.95879554748535, "global_step": 288478, "epoch": 3475} {"train_loss": -25.81532859802246, "global_step": 288479, "epoch": 3475} {"train_loss": -25.28664207458496, "global_step": 288480, "epoch": 3475} {"train_loss": -25.728769302368164, "global_step": 288481, "epoch": 3475} {"train_loss": -25.6599178314209, "global_step": 288482, "epoch": 3475} {"train_loss": -25.877355575561523, "global_step": 288483, "epoch": 3475} {"train_loss": -25.76471519470215, "global_step": 288484, "epoch": 3475} {"train_loss": -25.676288604736328, "global_step": 288485, "epoch": 3475} {"train_loss": -25.54487419128418, "global_step": 288486, "epoch": 3475} {"train_loss": -25.828336715698242, "global_step": 288487, "epoch": 3475} {"train_loss": -25.59845733642578, "global_step": 288488, "epoch": 3475} {"train_loss": -26.1783390045166, "global_step": 288489, "epoch": 3475} {"train_loss": -25.500247955322266, "global_step": 288490, "epoch": 3475} {"train_loss": -25.852991104125977, "global_step": 288491, "epoch": 3475} {"train_loss": -25.33636474609375, "global_step": 288492, "epoch": 3475} {"train_loss": -24.833545684814453, "global_step": 288493, "epoch": 3475} {"train_loss": -25.047882080078125, "global_step": 288494, "epoch": 3475} {"train_loss": -24.00478172302246, "global_step": 288495, "epoch": 3475} {"train_loss": -25.170866012573242, "global_step": 288496, "epoch": 3475} {"train_loss": -25.4888973236084, "global_step": 288497, "epoch": 3475} {"train_loss": -24.457746505737305, "global_step": 288498, "epoch": 3475} {"train_loss": -25.493928909301758, "global_step": 288499, "epoch": 3475} {"train_loss": -25.002283096313477, "global_step": 288500, "epoch": 3475} {"train_loss": -25.490047454833984, "global_step": 288501, "epoch": 3475} {"train_loss": -24.953994750976562, "global_step": 288502, "epoch": 3475} {"train_loss": -25.10121726989746, "global_step": 288503, "epoch": 3475} {"train_loss": -25.4013729095459, "global_step": 288504, "epoch": 3475} {"train_loss": -24.991071701049805, "global_step": 288505, "epoch": 3475} {"train_loss": -24.901010513305664, "global_step": 288506, "epoch": 3475} {"train_loss": -25.46518337295716, "global_step": 288507, "epoch": 3475, "val_loss": 7200032.0} {"train_loss": -25.168701171875, "global_step": 288508, "epoch": 3476} {"train_loss": -25.11165428161621, "global_step": 288509, "epoch": 3476} {"train_loss": -25.382783889770508, "global_step": 288510, "epoch": 3476} {"train_loss": -25.13667869567871, "global_step": 288511, "epoch": 3476} {"train_loss": -24.76816749572754, "global_step": 288512, "epoch": 3476} {"train_loss": -25.1365966796875, "global_step": 288513, "epoch": 3476} {"train_loss": -25.018285751342773, "global_step": 288514, "epoch": 3476} {"train_loss": -24.962583541870117, "global_step": 288515, "epoch": 3476} {"train_loss": -25.299184799194336, "global_step": 288516, "epoch": 3476} {"train_loss": -24.924224853515625, "global_step": 288517, "epoch": 3476} {"train_loss": -25.00545310974121, "global_step": 288518, "epoch": 3476} {"train_loss": -25.32314109802246, "global_step": 288519, "epoch": 3476} {"train_loss": -25.379117965698242, "global_step": 288520, "epoch": 3476} {"train_loss": -24.713382720947266, "global_step": 288521, "epoch": 3476} {"train_loss": -25.36702537536621, "global_step": 288522, "epoch": 3476} {"train_loss": -25.4415340423584, "global_step": 288523, "epoch": 3476} {"train_loss": -25.1640682220459, "global_step": 288524, "epoch": 3476} {"train_loss": -25.400297164916992, "global_step": 288525, "epoch": 3476} {"train_loss": -25.2882137298584, "global_step": 288526, "epoch": 3476} {"train_loss": -25.04966163635254, "global_step": 288527, "epoch": 3476} {"train_loss": -25.148046493530273, "global_step": 288528, "epoch": 3476} {"train_loss": -25.157928466796875, "global_step": 288529, "epoch": 3476} {"train_loss": -24.992734909057617, "global_step": 288530, "epoch": 3476} {"train_loss": -24.93770408630371, "global_step": 288531, "epoch": 3476} {"train_loss": -25.3878116607666, "global_step": 288532, "epoch": 3476} {"train_loss": -25.11870765686035, "global_step": 288533, "epoch": 3476} {"train_loss": -25.521732330322266, "global_step": 288534, "epoch": 3476} {"train_loss": -25.822797775268555, "global_step": 288535, "epoch": 3476} {"train_loss": -25.473020553588867, "global_step": 288536, "epoch": 3476} {"train_loss": -25.442707061767578, "global_step": 288537, "epoch": 3476} {"train_loss": -25.21575355529785, "global_step": 288538, "epoch": 3476} {"train_loss": -25.501089096069336, "global_step": 288539, "epoch": 3476} {"train_loss": -25.30985450744629, "global_step": 288540, "epoch": 3476} {"train_loss": -25.442886352539062, "global_step": 288541, "epoch": 3476} {"train_loss": -25.569684982299805, "global_step": 288542, "epoch": 3476} {"train_loss": -25.489347457885742, "global_step": 288543, "epoch": 3476} {"train_loss": -25.499338150024414, "global_step": 288544, "epoch": 3476} {"train_loss": -25.41168785095215, "global_step": 288545, "epoch": 3476} {"train_loss": -25.82282066345215, "global_step": 288546, "epoch": 3476} {"train_loss": -25.67274284362793, "global_step": 288547, "epoch": 3476} {"train_loss": -25.6890869140625, "global_step": 288548, "epoch": 3476} {"train_loss": -25.449907302856445, "global_step": 288549, "epoch": 3476} {"train_loss": -25.92669677734375, "global_step": 288550, "epoch": 3476} {"train_loss": -25.799589157104492, "global_step": 288551, "epoch": 3476} {"train_loss": -25.92091178894043, "global_step": 288552, "epoch": 3476} {"train_loss": -25.472028732299805, "global_step": 288553, "epoch": 3476} {"train_loss": -25.516416549682617, "global_step": 288554, "epoch": 3476} {"train_loss": -25.67951011657715, "global_step": 288555, "epoch": 3476} {"train_loss": -25.346820831298828, "global_step": 288556, "epoch": 3476} {"train_loss": -25.441457748413086, "global_step": 288557, "epoch": 3476} {"train_loss": -25.613428115844727, "global_step": 288558, "epoch": 3476} {"train_loss": -25.143404006958008, "global_step": 288559, "epoch": 3476} {"train_loss": -25.06414031982422, "global_step": 288560, "epoch": 3476} {"train_loss": -25.878223419189453, "global_step": 288561, "epoch": 3476} {"train_loss": -25.360401153564453, "global_step": 288562, "epoch": 3476} {"train_loss": -25.428125381469727, "global_step": 288563, "epoch": 3476} {"train_loss": -25.1567440032959, "global_step": 288564, "epoch": 3476} {"train_loss": -25.37179946899414, "global_step": 288565, "epoch": 3476} {"train_loss": -25.624231338500977, "global_step": 288566, "epoch": 3476} {"train_loss": -25.455368041992188, "global_step": 288567, "epoch": 3476} {"train_loss": -25.420753479003906, "global_step": 288568, "epoch": 3476} {"train_loss": -25.773929595947266, "global_step": 288569, "epoch": 3476} {"train_loss": -25.355655670166016, "global_step": 288570, "epoch": 3476} {"train_loss": -25.599538803100586, "global_step": 288571, "epoch": 3476} {"train_loss": -25.887365341186523, "global_step": 288572, "epoch": 3476} {"train_loss": -25.69012451171875, "global_step": 288573, "epoch": 3476} {"train_loss": -25.79422950744629, "global_step": 288574, "epoch": 3476} {"train_loss": -25.26154136657715, "global_step": 288575, "epoch": 3476} {"train_loss": -25.591054916381836, "global_step": 288576, "epoch": 3476} {"train_loss": -25.61956787109375, "global_step": 288577, "epoch": 3476} {"train_loss": -25.392505645751953, "global_step": 288578, "epoch": 3476} {"train_loss": -25.827802658081055, "global_step": 288579, "epoch": 3476} {"train_loss": -25.17076301574707, "global_step": 288580, "epoch": 3476} {"train_loss": -25.53239631652832, "global_step": 288581, "epoch": 3476} {"train_loss": -25.58950424194336, "global_step": 288582, "epoch": 3476} {"train_loss": -25.063579559326172, "global_step": 288583, "epoch": 3476} {"train_loss": -25.59126853942871, "global_step": 288584, "epoch": 3476} {"train_loss": -25.41585922241211, "global_step": 288585, "epoch": 3476} {"train_loss": -25.755477905273438, "global_step": 288586, "epoch": 3476} {"train_loss": -25.609344482421875, "global_step": 288587, "epoch": 3476} {"train_loss": -25.817495346069336, "global_step": 288588, "epoch": 3476} {"train_loss": -25.48406219482422, "global_step": 288589, "epoch": 3476} {"train_loss": -25.39394920992564, "global_step": 288590, "epoch": 3476, "val_loss": 7072198.5} {"train_loss": -25.246492385864258, "global_step": 288591, "epoch": 3477} {"train_loss": -24.332923889160156, "global_step": 288592, "epoch": 3477} {"train_loss": -25.009700775146484, "global_step": 288593, "epoch": 3477} {"train_loss": -25.130462646484375, "global_step": 288594, "epoch": 3477} {"train_loss": -25.140464782714844, "global_step": 288595, "epoch": 3477} {"train_loss": -24.702993392944336, "global_step": 288596, "epoch": 3477} {"train_loss": -25.19826316833496, "global_step": 288597, "epoch": 3477} {"train_loss": -24.465072631835938, "global_step": 288598, "epoch": 3477} {"train_loss": -25.257905960083008, "global_step": 288599, "epoch": 3477} {"train_loss": -24.64224624633789, "global_step": 288600, "epoch": 3477} {"train_loss": -25.15334129333496, "global_step": 288601, "epoch": 3477} {"train_loss": -24.967498779296875, "global_step": 288602, "epoch": 3477} {"train_loss": -25.268726348876953, "global_step": 288603, "epoch": 3477} {"train_loss": -25.03755760192871, "global_step": 288604, "epoch": 3477} {"train_loss": -25.2917537689209, "global_step": 288605, "epoch": 3477} {"train_loss": -25.200830459594727, "global_step": 288606, "epoch": 3477} {"train_loss": -24.914682388305664, "global_step": 288607, "epoch": 3477} {"train_loss": -25.144399642944336, "global_step": 288608, "epoch": 3477} {"train_loss": -25.545530319213867, "global_step": 288609, "epoch": 3477} {"train_loss": -25.334327697753906, "global_step": 288610, "epoch": 3477} {"train_loss": -25.582069396972656, "global_step": 288611, "epoch": 3477} {"train_loss": -25.7044677734375, "global_step": 288612, "epoch": 3477} {"train_loss": -25.452146530151367, "global_step": 288613, "epoch": 3477} {"train_loss": -25.4780330657959, "global_step": 288614, "epoch": 3477} {"train_loss": -25.64434242248535, "global_step": 288615, "epoch": 3477} {"train_loss": -25.130170822143555, "global_step": 288616, "epoch": 3477} {"train_loss": -25.29286003112793, "global_step": 288617, "epoch": 3477} {"train_loss": -25.219125747680664, "global_step": 288618, "epoch": 3477} {"train_loss": -25.48601722717285, "global_step": 288619, "epoch": 3477} {"train_loss": -25.638599395751953, "global_step": 288620, "epoch": 3477} {"train_loss": -25.651533126831055, "global_step": 288621, "epoch": 3477} {"train_loss": -25.312244415283203, "global_step": 288622, "epoch": 3477} {"train_loss": -25.525760650634766, "global_step": 288623, "epoch": 3477} {"train_loss": -25.762420654296875, "global_step": 288624, "epoch": 3477} {"train_loss": -25.4664363861084, "global_step": 288625, "epoch": 3477} {"train_loss": -25.71492576599121, "global_step": 288626, "epoch": 3477} {"train_loss": -25.414142608642578, "global_step": 288627, "epoch": 3477} {"train_loss": -25.59145164489746, "global_step": 288628, "epoch": 3477} {"train_loss": -25.99224281311035, "global_step": 288629, "epoch": 3477} {"train_loss": -25.666955947875977, "global_step": 288630, "epoch": 3477} {"train_loss": -25.53879737854004, "global_step": 288631, "epoch": 3477} {"train_loss": -25.468734741210938, "global_step": 288632, "epoch": 3477} {"train_loss": -25.80183219909668, "global_step": 288633, "epoch": 3477} {"train_loss": -25.777999877929688, "global_step": 288634, "epoch": 3477} {"train_loss": -25.78887939453125, "global_step": 288635, "epoch": 3477} {"train_loss": -25.902402877807617, "global_step": 288636, "epoch": 3477} {"train_loss": -25.557409286499023, "global_step": 288637, "epoch": 3477} {"train_loss": -25.565876007080078, "global_step": 288638, "epoch": 3477} {"train_loss": -25.626728057861328, "global_step": 288639, "epoch": 3477} {"train_loss": -25.3044490814209, "global_step": 288640, "epoch": 3477} {"train_loss": -25.751331329345703, "global_step": 288641, "epoch": 3477} {"train_loss": -25.273550033569336, "global_step": 288642, "epoch": 3477} {"train_loss": -25.65958595275879, "global_step": 288643, "epoch": 3477} {"train_loss": -25.450515747070312, "global_step": 288644, "epoch": 3477} {"train_loss": -25.25266456604004, "global_step": 288645, "epoch": 3477} {"train_loss": -25.623022079467773, "global_step": 288646, "epoch": 3477} {"train_loss": -25.44002914428711, "global_step": 288647, "epoch": 3477} {"train_loss": -26.178388595581055, "global_step": 288648, "epoch": 3477} {"train_loss": -25.281068801879883, "global_step": 288649, "epoch": 3477} {"train_loss": -25.5593318939209, "global_step": 288650, "epoch": 3477} {"train_loss": -25.347951889038086, "global_step": 288651, "epoch": 3477} {"train_loss": -25.3056583404541, "global_step": 288652, "epoch": 3477} {"train_loss": -25.151203155517578, "global_step": 288653, "epoch": 3477} {"train_loss": -25.25432014465332, "global_step": 288654, "epoch": 3477} {"train_loss": -24.5346622467041, "global_step": 288655, "epoch": 3477} {"train_loss": -25.28445053100586, "global_step": 288656, "epoch": 3477} {"train_loss": -25.405969619750977, "global_step": 288657, "epoch": 3477} {"train_loss": -25.2308292388916, "global_step": 288658, "epoch": 3477} {"train_loss": -25.45550537109375, "global_step": 288659, "epoch": 3477} {"train_loss": -25.275705337524414, "global_step": 288660, "epoch": 3477} {"train_loss": -25.40631103515625, "global_step": 288661, "epoch": 3477} {"train_loss": -25.52444076538086, "global_step": 288662, "epoch": 3477} {"train_loss": -25.75927734375, "global_step": 288663, "epoch": 3477} {"train_loss": -25.60355567932129, "global_step": 288664, "epoch": 3477} {"train_loss": -25.629322052001953, "global_step": 288665, "epoch": 3477} {"train_loss": -25.607288360595703, "global_step": 288666, "epoch": 3477} {"train_loss": -25.567474365234375, "global_step": 288667, "epoch": 3477} {"train_loss": -25.25762367248535, "global_step": 288668, "epoch": 3477} {"train_loss": -25.536035537719727, "global_step": 288669, "epoch": 3477} {"train_loss": -25.40641212463379, "global_step": 288670, "epoch": 3477} {"train_loss": -25.43329429626465, "global_step": 288671, "epoch": 3477} {"train_loss": -25.629119873046875, "global_step": 288672, "epoch": 3477} {"train_loss": -25.383081780858788, "global_step": 288673, "epoch": 3477, "val_loss": 7051440.0} {"train_loss": -25.13053321838379, "global_step": 288674, "epoch": 3478} {"train_loss": -25.2327938079834, "global_step": 288675, "epoch": 3478} {"train_loss": -25.11490249633789, "global_step": 288676, "epoch": 3478} {"train_loss": -24.891996383666992, "global_step": 288677, "epoch": 3478} {"train_loss": -25.342838287353516, "global_step": 288678, "epoch": 3478} {"train_loss": -25.005878448486328, "global_step": 288679, "epoch": 3478} {"train_loss": -25.116613388061523, "global_step": 288680, "epoch": 3478} {"train_loss": -25.014501571655273, "global_step": 288681, "epoch": 3478} {"train_loss": -25.429508209228516, "global_step": 288682, "epoch": 3478} {"train_loss": -25.236547470092773, "global_step": 288683, "epoch": 3478} {"train_loss": -24.877042770385742, "global_step": 288684, "epoch": 3478} {"train_loss": -25.53682518005371, "global_step": 288685, "epoch": 3478} {"train_loss": -25.096542358398438, "global_step": 288686, "epoch": 3478} {"train_loss": -25.285743713378906, "global_step": 288687, "epoch": 3478} {"train_loss": -25.38311767578125, "global_step": 288688, "epoch": 3478} {"train_loss": -25.60964012145996, "global_step": 288689, "epoch": 3478} {"train_loss": -25.28412437438965, "global_step": 288690, "epoch": 3478} {"train_loss": -25.2670841217041, "global_step": 288691, "epoch": 3478} {"train_loss": -25.60706901550293, "global_step": 288692, "epoch": 3478} {"train_loss": -25.472665786743164, "global_step": 288693, "epoch": 3478} {"train_loss": -25.42898941040039, "global_step": 288694, "epoch": 3478} {"train_loss": -25.340490341186523, "global_step": 288695, "epoch": 3478} {"train_loss": -25.36075210571289, "global_step": 288696, "epoch": 3478} {"train_loss": -25.654800415039062, "global_step": 288697, "epoch": 3478} {"train_loss": -25.528076171875, "global_step": 288698, "epoch": 3478} {"train_loss": -25.33133316040039, "global_step": 288699, "epoch": 3478} {"train_loss": -25.520864486694336, "global_step": 288700, "epoch": 3478} {"train_loss": -25.7152099609375, "global_step": 288701, "epoch": 3478} {"train_loss": -25.86282730102539, "global_step": 288702, "epoch": 3478} {"train_loss": -25.83721923828125, "global_step": 288703, "epoch": 3478} {"train_loss": -25.317514419555664, "global_step": 288704, "epoch": 3478} {"train_loss": -25.48154640197754, "global_step": 288705, "epoch": 3478} {"train_loss": -25.622699737548828, "global_step": 288706, "epoch": 3478} {"train_loss": -25.6717586517334, "global_step": 288707, "epoch": 3478} {"train_loss": -25.79197120666504, "global_step": 288708, "epoch": 3478} {"train_loss": -25.38313102722168, "global_step": 288709, "epoch": 3478} {"train_loss": -25.443662643432617, "global_step": 288710, "epoch": 3478} {"train_loss": -25.575199127197266, "global_step": 288711, "epoch": 3478} {"train_loss": -25.72854995727539, "global_step": 288712, "epoch": 3478} {"train_loss": -25.305410385131836, "global_step": 288713, "epoch": 3478} {"train_loss": -25.752607345581055, "global_step": 288714, "epoch": 3478} {"train_loss": -25.428543090820312, "global_step": 288715, "epoch": 3478} {"train_loss": -25.652240753173828, "global_step": 288716, "epoch": 3478} {"train_loss": -26.11756706237793, "global_step": 288717, "epoch": 3478} {"train_loss": -25.597753524780273, "global_step": 288718, "epoch": 3478} {"train_loss": -25.302143096923828, "global_step": 288719, "epoch": 3478} {"train_loss": -25.8460693359375, "global_step": 288720, "epoch": 3478} {"train_loss": -25.336978912353516, "global_step": 288721, "epoch": 3478} {"train_loss": -25.586475372314453, "global_step": 288722, "epoch": 3478} {"train_loss": -25.294876098632812, "global_step": 288723, "epoch": 3478} {"train_loss": -25.66204261779785, "global_step": 288724, "epoch": 3478} {"train_loss": -25.899368286132812, "global_step": 288725, "epoch": 3478} {"train_loss": -25.723520278930664, "global_step": 288726, "epoch": 3478} {"train_loss": -25.574390411376953, "global_step": 288727, "epoch": 3478} {"train_loss": -25.859928131103516, "global_step": 288728, "epoch": 3478} {"train_loss": -25.832807540893555, "global_step": 288729, "epoch": 3478} {"train_loss": -25.474184036254883, "global_step": 288730, "epoch": 3478} {"train_loss": -25.86899185180664, "global_step": 288731, "epoch": 3478} {"train_loss": -25.648542404174805, "global_step": 288732, "epoch": 3478} {"train_loss": -25.790058135986328, "global_step": 288733, "epoch": 3478} {"train_loss": -25.477951049804688, "global_step": 288734, "epoch": 3478} {"train_loss": -25.31988525390625, "global_step": 288735, "epoch": 3478} {"train_loss": -25.172555923461914, "global_step": 288736, "epoch": 3478} {"train_loss": -25.364765167236328, "global_step": 288737, "epoch": 3478} {"train_loss": -25.21681785583496, "global_step": 288738, "epoch": 3478} {"train_loss": -25.181682586669922, "global_step": 288739, "epoch": 3478} {"train_loss": -25.43790626525879, "global_step": 288740, "epoch": 3478} {"train_loss": -25.844175338745117, "global_step": 288741, "epoch": 3478} {"train_loss": -25.083463668823242, "global_step": 288742, "epoch": 3478} {"train_loss": -25.564584732055664, "global_step": 288743, "epoch": 3478} {"train_loss": -25.05659294128418, "global_step": 288744, "epoch": 3478} {"train_loss": -25.581186294555664, "global_step": 288745, "epoch": 3478} {"train_loss": -25.39829444885254, "global_step": 288746, "epoch": 3478} {"train_loss": -25.72494888305664, "global_step": 288747, "epoch": 3478} {"train_loss": -25.583433151245117, "global_step": 288748, "epoch": 3478} {"train_loss": -25.498252868652344, "global_step": 288749, "epoch": 3478} {"train_loss": -25.76724624633789, "global_step": 288750, "epoch": 3478} {"train_loss": -25.786468505859375, "global_step": 288751, "epoch": 3478} {"train_loss": -25.44361114501953, "global_step": 288752, "epoch": 3478} {"train_loss": -25.65408706665039, "global_step": 288753, "epoch": 3478} {"train_loss": -25.890966415405273, "global_step": 288754, "epoch": 3478} {"train_loss": -25.595727920532227, "global_step": 288755, "epoch": 3478} {"train_loss": -25.477757603289135, "global_step": 288756, "epoch": 3478, "val_loss": 7132787.5} {"train_loss": -25.148866653442383, "global_step": 288757, "epoch": 3479} {"train_loss": -24.97711181640625, "global_step": 288758, "epoch": 3479} {"train_loss": -25.0814151763916, "global_step": 288759, "epoch": 3479} {"train_loss": -24.71516990661621, "global_step": 288760, "epoch": 3479} {"train_loss": -24.80498504638672, "global_step": 288761, "epoch": 3479} {"train_loss": -24.79457664489746, "global_step": 288762, "epoch": 3479} {"train_loss": -25.70361328125, "global_step": 288763, "epoch": 3479} {"train_loss": -24.9775447845459, "global_step": 288764, "epoch": 3479} {"train_loss": -25.26057243347168, "global_step": 288765, "epoch": 3479} {"train_loss": -25.16707420349121, "global_step": 288766, "epoch": 3479} {"train_loss": -25.558637619018555, "global_step": 288767, "epoch": 3479} {"train_loss": -24.96137809753418, "global_step": 288768, "epoch": 3479} {"train_loss": -25.6307373046875, "global_step": 288769, "epoch": 3479} {"train_loss": -25.123342514038086, "global_step": 288770, "epoch": 3479} {"train_loss": -25.1530818939209, "global_step": 288771, "epoch": 3479} {"train_loss": -25.63173484802246, "global_step": 288772, "epoch": 3479} {"train_loss": -25.51065444946289, "global_step": 288773, "epoch": 3479} {"train_loss": -25.21304702758789, "global_step": 288774, "epoch": 3479} {"train_loss": -25.661727905273438, "global_step": 288775, "epoch": 3479} {"train_loss": -25.47197151184082, "global_step": 288776, "epoch": 3479} {"train_loss": -25.208322525024414, "global_step": 288777, "epoch": 3479} {"train_loss": -25.2656307220459, "global_step": 288778, "epoch": 3479} {"train_loss": -25.705352783203125, "global_step": 288779, "epoch": 3479} {"train_loss": -25.247602462768555, "global_step": 288780, "epoch": 3479} {"train_loss": -25.6241512298584, "global_step": 288781, "epoch": 3479} {"train_loss": -25.6025447845459, "global_step": 288782, "epoch": 3479} {"train_loss": -25.527204513549805, "global_step": 288783, "epoch": 3479} {"train_loss": -25.529434204101562, "global_step": 288784, "epoch": 3479} {"train_loss": -25.811498641967773, "global_step": 288785, "epoch": 3479} {"train_loss": -25.53329849243164, "global_step": 288786, "epoch": 3479} {"train_loss": -25.53111457824707, "global_step": 288787, "epoch": 3479} {"train_loss": -25.310693740844727, "global_step": 288788, "epoch": 3479} {"train_loss": -25.696399688720703, "global_step": 288789, "epoch": 3479} {"train_loss": -25.249713897705078, "global_step": 288790, "epoch": 3479} {"train_loss": -25.622085571289062, "global_step": 288791, "epoch": 3479} {"train_loss": -25.51328468322754, "global_step": 288792, "epoch": 3479} {"train_loss": -25.972320556640625, "global_step": 288793, "epoch": 3479} {"train_loss": -25.586912155151367, "global_step": 288794, "epoch": 3479} {"train_loss": -25.525358200073242, "global_step": 288795, "epoch": 3479} {"train_loss": -25.458200454711914, "global_step": 288796, "epoch": 3479} {"train_loss": -25.819860458374023, "global_step": 288797, "epoch": 3479} {"train_loss": -25.56670379638672, "global_step": 288798, "epoch": 3479} {"train_loss": -25.92959976196289, "global_step": 288799, "epoch": 3479} {"train_loss": -25.537002563476562, "global_step": 288800, "epoch": 3479} {"train_loss": -25.593324661254883, "global_step": 288801, "epoch": 3479} {"train_loss": -25.396392822265625, "global_step": 288802, "epoch": 3479} {"train_loss": -25.499135971069336, "global_step": 288803, "epoch": 3479} {"train_loss": -26.090967178344727, "global_step": 288804, "epoch": 3479} {"train_loss": -25.6102237701416, "global_step": 288805, "epoch": 3479} {"train_loss": -25.533361434936523, "global_step": 288806, "epoch": 3479} {"train_loss": -25.472110748291016, "global_step": 288807, "epoch": 3479} {"train_loss": -25.304250717163086, "global_step": 288808, "epoch": 3479} {"train_loss": -25.267501831054688, "global_step": 288809, "epoch": 3479} {"train_loss": -25.41495132446289, "global_step": 288810, "epoch": 3479} {"train_loss": -25.734373092651367, "global_step": 288811, "epoch": 3479} {"train_loss": -25.801212310791016, "global_step": 288812, "epoch": 3479} {"train_loss": -25.217365264892578, "global_step": 288813, "epoch": 3479} {"train_loss": -25.70195960998535, "global_step": 288814, "epoch": 3479} {"train_loss": -25.463537216186523, "global_step": 288815, "epoch": 3479} {"train_loss": -25.41743278503418, "global_step": 288816, "epoch": 3479} {"train_loss": -25.055997848510742, "global_step": 288817, "epoch": 3479} {"train_loss": -25.335580825805664, "global_step": 288818, "epoch": 3479} {"train_loss": -25.656965255737305, "global_step": 288819, "epoch": 3479} {"train_loss": -25.707752227783203, "global_step": 288820, "epoch": 3479} {"train_loss": -25.328441619873047, "global_step": 288821, "epoch": 3479} {"train_loss": -25.16813087463379, "global_step": 288822, "epoch": 3479} {"train_loss": -25.39048194885254, "global_step": 288823, "epoch": 3479} {"train_loss": -25.650226593017578, "global_step": 288824, "epoch": 3479} {"train_loss": -25.088438034057617, "global_step": 288825, "epoch": 3479} {"train_loss": -25.215747833251953, "global_step": 288826, "epoch": 3479} {"train_loss": -25.456083297729492, "global_step": 288827, "epoch": 3479} {"train_loss": -25.602771759033203, "global_step": 288828, "epoch": 3479} {"train_loss": -25.41089630126953, "global_step": 288829, "epoch": 3479} {"train_loss": -25.354145050048828, "global_step": 288830, "epoch": 3479} {"train_loss": -25.088960647583008, "global_step": 288831, "epoch": 3479} {"train_loss": -25.375036239624023, "global_step": 288832, "epoch": 3479} {"train_loss": -25.91859245300293, "global_step": 288833, "epoch": 3479} {"train_loss": -25.957752227783203, "global_step": 288834, "epoch": 3479} {"train_loss": -25.86368179321289, "global_step": 288835, "epoch": 3479} {"train_loss": -25.7015323638916, "global_step": 288836, "epoch": 3479} {"train_loss": -25.674657821655273, "global_step": 288837, "epoch": 3479} {"train_loss": -25.259567260742188, "global_step": 288838, "epoch": 3479} {"train_loss": -25.436340309051147, "global_step": 288839, "epoch": 3479, "val_loss": 7192198.0} {"train_loss": -24.594776153564453, "global_step": 288840, "epoch": 3480} {"train_loss": -25.048410415649414, "global_step": 288841, "epoch": 3480} {"train_loss": -25.293132781982422, "global_step": 288842, "epoch": 3480} {"train_loss": -24.839513778686523, "global_step": 288843, "epoch": 3480} {"train_loss": -25.319854736328125, "global_step": 288844, "epoch": 3480} {"train_loss": -24.75754165649414, "global_step": 288845, "epoch": 3480} {"train_loss": -25.19513511657715, "global_step": 288846, "epoch": 3480} {"train_loss": -24.950193405151367, "global_step": 288847, "epoch": 3480} {"train_loss": -25.4166316986084, "global_step": 288848, "epoch": 3480} {"train_loss": -25.358121871948242, "global_step": 288849, "epoch": 3480} {"train_loss": -25.49063491821289, "global_step": 288850, "epoch": 3480} {"train_loss": -25.25922966003418, "global_step": 288851, "epoch": 3480} {"train_loss": -25.167692184448242, "global_step": 288852, "epoch": 3480} {"train_loss": -25.22810935974121, "global_step": 288853, "epoch": 3480} {"train_loss": -25.45125961303711, "global_step": 288854, "epoch": 3480} {"train_loss": -25.347782135009766, "global_step": 288855, "epoch": 3480} {"train_loss": -24.906091690063477, "global_step": 288856, "epoch": 3480} {"train_loss": -25.606718063354492, "global_step": 288857, "epoch": 3480} {"train_loss": -25.3546199798584, "global_step": 288858, "epoch": 3480} {"train_loss": -25.401113510131836, "global_step": 288859, "epoch": 3480} {"train_loss": -25.6436767578125, "global_step": 288860, "epoch": 3480} {"train_loss": -25.378433227539062, "global_step": 288861, "epoch": 3480} {"train_loss": -25.35041618347168, "global_step": 288862, "epoch": 3480} {"train_loss": -25.275774002075195, "global_step": 288863, "epoch": 3480} {"train_loss": -25.304853439331055, "global_step": 288864, "epoch": 3480} {"train_loss": -25.925952911376953, "global_step": 288865, "epoch": 3480} {"train_loss": -25.37471580505371, "global_step": 288866, "epoch": 3480} {"train_loss": -25.601842880249023, "global_step": 288867, "epoch": 3480} {"train_loss": -25.626733779907227, "global_step": 288868, "epoch": 3480} {"train_loss": -25.535717010498047, "global_step": 288869, "epoch": 3480} {"train_loss": -25.48250389099121, "global_step": 288870, "epoch": 3480} {"train_loss": -25.485855102539062, "global_step": 288871, "epoch": 3480} {"train_loss": -25.770925521850586, "global_step": 288872, "epoch": 3480} {"train_loss": -25.714527130126953, "global_step": 288873, "epoch": 3480} {"train_loss": -25.47218132019043, "global_step": 288874, "epoch": 3480} {"train_loss": -25.60025978088379, "global_step": 288875, "epoch": 3480} {"train_loss": -25.49565315246582, "global_step": 288876, "epoch": 3480} {"train_loss": -25.376996994018555, "global_step": 288877, "epoch": 3480} {"train_loss": -25.460012435913086, "global_step": 288878, "epoch": 3480} {"train_loss": -25.792484283447266, "global_step": 288879, "epoch": 3480} {"train_loss": -25.369129180908203, "global_step": 288880, "epoch": 3480} {"train_loss": -25.1518611907959, "global_step": 288881, "epoch": 3480} {"train_loss": -25.291685104370117, "global_step": 288882, "epoch": 3480} {"train_loss": -25.10498046875, "global_step": 288883, "epoch": 3480} {"train_loss": -25.401874542236328, "global_step": 288884, "epoch": 3480} {"train_loss": -25.326324462890625, "global_step": 288885, "epoch": 3480} {"train_loss": -25.471221923828125, "global_step": 288886, "epoch": 3480} {"train_loss": -25.51405906677246, "global_step": 288887, "epoch": 3480} {"train_loss": -25.66242027282715, "global_step": 288888, "epoch": 3480} {"train_loss": -25.501211166381836, "global_step": 288889, "epoch": 3480} {"train_loss": -25.77849769592285, "global_step": 288890, "epoch": 3480} {"train_loss": -25.47623062133789, "global_step": 288891, "epoch": 3480} {"train_loss": -25.6919002532959, "global_step": 288892, "epoch": 3480} {"train_loss": -25.4713134765625, "global_step": 288893, "epoch": 3480} {"train_loss": -25.7916259765625, "global_step": 288894, "epoch": 3480} {"train_loss": -25.115928649902344, "global_step": 288895, "epoch": 3480} {"train_loss": -25.096933364868164, "global_step": 288896, "epoch": 3480} {"train_loss": -25.481603622436523, "global_step": 288897, "epoch": 3480} {"train_loss": -25.740314483642578, "global_step": 288898, "epoch": 3480} {"train_loss": -25.189624786376953, "global_step": 288899, "epoch": 3480} {"train_loss": -25.38594627380371, "global_step": 288900, "epoch": 3480} {"train_loss": -25.737396240234375, "global_step": 288901, "epoch": 3480} {"train_loss": -25.537738800048828, "global_step": 288902, "epoch": 3480} {"train_loss": -25.522871017456055, "global_step": 288903, "epoch": 3480} {"train_loss": -25.6026668548584, "global_step": 288904, "epoch": 3480} {"train_loss": -25.630407333374023, "global_step": 288905, "epoch": 3480} {"train_loss": -25.736581802368164, "global_step": 288906, "epoch": 3480} {"train_loss": -25.649005889892578, "global_step": 288907, "epoch": 3480} {"train_loss": -25.672399520874023, "global_step": 288908, "epoch": 3480} {"train_loss": -25.522504806518555, "global_step": 288909, "epoch": 3480} {"train_loss": -25.632205963134766, "global_step": 288910, "epoch": 3480} {"train_loss": -25.98798179626465, "global_step": 288911, "epoch": 3480} {"train_loss": -25.771188735961914, "global_step": 288912, "epoch": 3480} {"train_loss": -25.9244384765625, "global_step": 288913, "epoch": 3480} {"train_loss": -25.46016502380371, "global_step": 288914, "epoch": 3480} {"train_loss": -25.667682647705078, "global_step": 288915, "epoch": 3480} {"train_loss": -25.475278854370117, "global_step": 288916, "epoch": 3480} {"train_loss": -25.830358505249023, "global_step": 288917, "epoch": 3480} {"train_loss": -25.317127227783203, "global_step": 288918, "epoch": 3480} {"train_loss": -25.452484130859375, "global_step": 288919, "epoch": 3480} {"train_loss": -25.599576950073242, "global_step": 288920, "epoch": 3480} {"train_loss": -25.431285858154297, "global_step": 288921, "epoch": 3480} {"train_loss": -25.465624912675604, "global_step": 288922, "epoch": 3480, "val_loss": 7237106.0} {"train_loss": -23.79157066345215, "global_step": 288923, "epoch": 3481} {"train_loss": -24.18075180053711, "global_step": 288924, "epoch": 3481} {"train_loss": -23.325897216796875, "global_step": 288925, "epoch": 3481} {"train_loss": -24.366397857666016, "global_step": 288926, "epoch": 3481} {"train_loss": -24.651275634765625, "global_step": 288927, "epoch": 3481} {"train_loss": -24.286773681640625, "global_step": 288928, "epoch": 3481} {"train_loss": -24.504573822021484, "global_step": 288929, "epoch": 3481} {"train_loss": -24.384429931640625, "global_step": 288930, "epoch": 3481} {"train_loss": -24.980010986328125, "global_step": 288931, "epoch": 3481} {"train_loss": -25.117263793945312, "global_step": 288932, "epoch": 3481} {"train_loss": -24.690181732177734, "global_step": 288933, "epoch": 3481} {"train_loss": -24.918533325195312, "global_step": 288934, "epoch": 3481} {"train_loss": -24.792638778686523, "global_step": 288935, "epoch": 3481} {"train_loss": -24.825407028198242, "global_step": 288936, "epoch": 3481} {"train_loss": -24.64045524597168, "global_step": 288937, "epoch": 3481} {"train_loss": -25.16254997253418, "global_step": 288938, "epoch": 3481} {"train_loss": -24.646087646484375, "global_step": 288939, "epoch": 3481} {"train_loss": -24.73746109008789, "global_step": 288940, "epoch": 3481} {"train_loss": -24.88787841796875, "global_step": 288941, "epoch": 3481} {"train_loss": -25.552743911743164, "global_step": 288942, "epoch": 3481} {"train_loss": -25.105981826782227, "global_step": 288943, "epoch": 3481} {"train_loss": -25.144519805908203, "global_step": 288944, "epoch": 3481} {"train_loss": -25.195314407348633, "global_step": 288945, "epoch": 3481} {"train_loss": -24.83855438232422, "global_step": 288946, "epoch": 3481} {"train_loss": -25.37018394470215, "global_step": 288947, "epoch": 3481} {"train_loss": -25.189077377319336, "global_step": 288948, "epoch": 3481} {"train_loss": -25.1121826171875, "global_step": 288949, "epoch": 3481} {"train_loss": -25.19075584411621, "global_step": 288950, "epoch": 3481} {"train_loss": -25.277698516845703, "global_step": 288951, "epoch": 3481} {"train_loss": -25.593454360961914, "global_step": 288952, "epoch": 3481} {"train_loss": -25.7900333404541, "global_step": 288953, "epoch": 3481} {"train_loss": -25.445676803588867, "global_step": 288954, "epoch": 3481} {"train_loss": -25.506458282470703, "global_step": 288955, "epoch": 3481} {"train_loss": -25.3767147064209, "global_step": 288956, "epoch": 3481} {"train_loss": -25.181625366210938, "global_step": 288957, "epoch": 3481} {"train_loss": -25.40256690979004, "global_step": 288958, "epoch": 3481} {"train_loss": -25.66913414001465, "global_step": 288959, "epoch": 3481} {"train_loss": -25.648334503173828, "global_step": 288960, "epoch": 3481} {"train_loss": -25.556669235229492, "global_step": 288961, "epoch": 3481} {"train_loss": -25.548036575317383, "global_step": 288962, "epoch": 3481} {"train_loss": -25.617162704467773, "global_step": 288963, "epoch": 3481} {"train_loss": -25.7174072265625, "global_step": 288964, "epoch": 3481} {"train_loss": -25.899511337280273, "global_step": 288965, "epoch": 3481} {"train_loss": -25.867462158203125, "global_step": 288966, "epoch": 3481} {"train_loss": -25.65608024597168, "global_step": 288967, "epoch": 3481} {"train_loss": -25.56987953186035, "global_step": 288968, "epoch": 3481} {"train_loss": -25.699722290039062, "global_step": 288969, "epoch": 3481} {"train_loss": -25.547351837158203, "global_step": 288970, "epoch": 3481} {"train_loss": -25.468416213989258, "global_step": 288971, "epoch": 3481} {"train_loss": -25.592700958251953, "global_step": 288972, "epoch": 3481} {"train_loss": -25.694482803344727, "global_step": 288973, "epoch": 3481} {"train_loss": -25.822484970092773, "global_step": 288974, "epoch": 3481} {"train_loss": -25.531232833862305, "global_step": 288975, "epoch": 3481} {"train_loss": -25.542524337768555, "global_step": 288976, "epoch": 3481} {"train_loss": -25.527402877807617, "global_step": 288977, "epoch": 3481} {"train_loss": -25.70289421081543, "global_step": 288978, "epoch": 3481} {"train_loss": -25.359853744506836, "global_step": 288979, "epoch": 3481} {"train_loss": -25.3076114654541, "global_step": 288980, "epoch": 3481} {"train_loss": -25.253320693969727, "global_step": 288981, "epoch": 3481} {"train_loss": -25.624237060546875, "global_step": 288982, "epoch": 3481} {"train_loss": -25.72900390625, "global_step": 288983, "epoch": 3481} {"train_loss": -25.54414939880371, "global_step": 288984, "epoch": 3481} {"train_loss": -25.731311798095703, "global_step": 288985, "epoch": 3481} {"train_loss": -25.44456672668457, "global_step": 288986, "epoch": 3481} {"train_loss": -25.444955825805664, "global_step": 288987, "epoch": 3481} {"train_loss": -25.6375789642334, "global_step": 288988, "epoch": 3481} {"train_loss": -25.323331832885742, "global_step": 288989, "epoch": 3481} {"train_loss": -25.440824508666992, "global_step": 288990, "epoch": 3481} {"train_loss": -25.552005767822266, "global_step": 288991, "epoch": 3481} {"train_loss": -25.5115909576416, "global_step": 288992, "epoch": 3481} {"train_loss": -25.5715274810791, "global_step": 288993, "epoch": 3481} {"train_loss": -25.6350040435791, "global_step": 288994, "epoch": 3481} {"train_loss": -25.688840866088867, "global_step": 288995, "epoch": 3481} {"train_loss": -25.61787223815918, "global_step": 288996, "epoch": 3481} {"train_loss": -25.481264114379883, "global_step": 288997, "epoch": 3481} {"train_loss": -25.431289672851562, "global_step": 288998, "epoch": 3481} {"train_loss": -25.850372314453125, "global_step": 288999, "epoch": 3481} {"train_loss": -25.337047576904297, "global_step": 289000, "epoch": 3481} {"train_loss": -25.57697868347168, "global_step": 289001, "epoch": 3481} {"train_loss": -25.400074005126953, "global_step": 289002, "epoch": 3481} {"train_loss": -25.580705642700195, "global_step": 289003, "epoch": 3481} {"train_loss": -25.16587257385254, "global_step": 289004, "epoch": 3481} {"train_loss": -25.266487650124425, "global_step": 289005, "epoch": 3481, "val_loss": 7065691.0} {"train_loss": -24.69478416442871, "global_step": 289006, "epoch": 3482} {"train_loss": -24.65633201599121, "global_step": 289007, "epoch": 3482} {"train_loss": -24.748449325561523, "global_step": 289008, "epoch": 3482} {"train_loss": -25.026691436767578, "global_step": 289009, "epoch": 3482} {"train_loss": -25.29077911376953, "global_step": 289010, "epoch": 3482} {"train_loss": -25.342206954956055, "global_step": 289011, "epoch": 3482} {"train_loss": -25.09200668334961, "global_step": 289012, "epoch": 3482} {"train_loss": -25.417911529541016, "global_step": 289013, "epoch": 3482} {"train_loss": -24.91200828552246, "global_step": 289014, "epoch": 3482} {"train_loss": -25.258319854736328, "global_step": 289015, "epoch": 3482} {"train_loss": -25.41451072692871, "global_step": 289016, "epoch": 3482} {"train_loss": -25.11392593383789, "global_step": 289017, "epoch": 3482} {"train_loss": -25.026596069335938, "global_step": 289018, "epoch": 3482} {"train_loss": -25.263565063476562, "global_step": 289019, "epoch": 3482} {"train_loss": -25.504043579101562, "global_step": 289020, "epoch": 3482} {"train_loss": -25.112478256225586, "global_step": 289021, "epoch": 3482} {"train_loss": -25.30029296875, "global_step": 289022, "epoch": 3482} {"train_loss": -25.25493812561035, "global_step": 289023, "epoch": 3482} {"train_loss": -25.471677780151367, "global_step": 289024, "epoch": 3482} {"train_loss": -25.790205001831055, "global_step": 289025, "epoch": 3482} {"train_loss": -25.3940372467041, "global_step": 289026, "epoch": 3482} {"train_loss": -25.8918399810791, "global_step": 289027, "epoch": 3482} {"train_loss": -25.689346313476562, "global_step": 289028, "epoch": 3482} {"train_loss": -25.68770408630371, "global_step": 289029, "epoch": 3482} {"train_loss": -25.47407341003418, "global_step": 289030, "epoch": 3482} {"train_loss": -25.790220260620117, "global_step": 289031, "epoch": 3482} {"train_loss": -25.299610137939453, "global_step": 289032, "epoch": 3482} {"train_loss": -25.898107528686523, "global_step": 289033, "epoch": 3482} {"train_loss": -25.54155731201172, "global_step": 289034, "epoch": 3482} {"train_loss": -25.648853302001953, "global_step": 289035, "epoch": 3482} {"train_loss": -25.44516944885254, "global_step": 289036, "epoch": 3482} {"train_loss": -25.611875534057617, "global_step": 289037, "epoch": 3482} {"train_loss": -25.50855827331543, "global_step": 289038, "epoch": 3482} {"train_loss": -25.493972778320312, "global_step": 289039, "epoch": 3482} {"train_loss": -25.50341033935547, "global_step": 289040, "epoch": 3482} {"train_loss": -25.604476928710938, "global_step": 289041, "epoch": 3482} {"train_loss": -25.61541175842285, "global_step": 289042, "epoch": 3482} {"train_loss": -25.465944290161133, "global_step": 289043, "epoch": 3482} {"train_loss": -26.023849487304688, "global_step": 289044, "epoch": 3482} {"train_loss": -25.70962905883789, "global_step": 289045, "epoch": 3482} {"train_loss": -25.222707748413086, "global_step": 289046, "epoch": 3482} {"train_loss": -25.688480377197266, "global_step": 289047, "epoch": 3482} {"train_loss": -25.803129196166992, "global_step": 289048, "epoch": 3482} {"train_loss": -25.85825538635254, "global_step": 289049, "epoch": 3482} {"train_loss": -25.622045516967773, "global_step": 289050, "epoch": 3482} {"train_loss": -25.424875259399414, "global_step": 289051, "epoch": 3482} {"train_loss": -25.629602432250977, "global_step": 289052, "epoch": 3482} {"train_loss": -25.727705001831055, "global_step": 289053, "epoch": 3482} {"train_loss": -25.414026260375977, "global_step": 289054, "epoch": 3482} {"train_loss": -25.492490768432617, "global_step": 289055, "epoch": 3482} {"train_loss": -25.473739624023438, "global_step": 289056, "epoch": 3482} {"train_loss": -25.836706161499023, "global_step": 289057, "epoch": 3482} {"train_loss": -25.099166870117188, "global_step": 289058, "epoch": 3482} {"train_loss": -25.279617309570312, "global_step": 289059, "epoch": 3482} {"train_loss": -25.570409774780273, "global_step": 289060, "epoch": 3482} {"train_loss": -25.495193481445312, "global_step": 289061, "epoch": 3482} {"train_loss": -25.456321716308594, "global_step": 289062, "epoch": 3482} {"train_loss": -25.158451080322266, "global_step": 289063, "epoch": 3482} {"train_loss": -25.32391357421875, "global_step": 289064, "epoch": 3482} {"train_loss": -25.38519859313965, "global_step": 289065, "epoch": 3482} {"train_loss": -25.081052780151367, "global_step": 289066, "epoch": 3482} {"train_loss": -25.550870895385742, "global_step": 289067, "epoch": 3482} {"train_loss": -25.622583389282227, "global_step": 289068, "epoch": 3482} {"train_loss": -24.6315975189209, "global_step": 289069, "epoch": 3482} {"train_loss": -25.394865036010742, "global_step": 289070, "epoch": 3482} {"train_loss": -25.06629753112793, "global_step": 289071, "epoch": 3482} {"train_loss": -24.659414291381836, "global_step": 289072, "epoch": 3482} {"train_loss": -25.05536460876465, "global_step": 289073, "epoch": 3482} {"train_loss": -25.31554412841797, "global_step": 289074, "epoch": 3482} {"train_loss": -25.283437728881836, "global_step": 289075, "epoch": 3482} {"train_loss": -25.66621971130371, "global_step": 289076, "epoch": 3482} {"train_loss": -25.296689987182617, "global_step": 289077, "epoch": 3482} {"train_loss": -25.746091842651367, "global_step": 289078, "epoch": 3482} {"train_loss": -25.28604507446289, "global_step": 289079, "epoch": 3482} {"train_loss": -25.46040153503418, "global_step": 289080, "epoch": 3482} {"train_loss": -25.42799949645996, "global_step": 289081, "epoch": 3482} {"train_loss": -25.390390396118164, "global_step": 289082, "epoch": 3482} {"train_loss": -25.52260398864746, "global_step": 289083, "epoch": 3482} {"train_loss": -25.411054611206055, "global_step": 289084, "epoch": 3482} {"train_loss": -25.864904403686523, "global_step": 289085, "epoch": 3482} {"train_loss": -25.50152587890625, "global_step": 289086, "epoch": 3482} {"train_loss": -25.328107833862305, "global_step": 289087, "epoch": 3482} {"train_loss": -25.401702122515943, "global_step": 289088, "epoch": 3482, "val_loss": 7069531.0} {"train_loss": -24.983444213867188, "global_step": 289089, "epoch": 3483} {"train_loss": -24.837018966674805, "global_step": 289090, "epoch": 3483} {"train_loss": -25.19478416442871, "global_step": 289091, "epoch": 3483} {"train_loss": -25.288068771362305, "global_step": 289092, "epoch": 3483} {"train_loss": -24.968412399291992, "global_step": 289093, "epoch": 3483} {"train_loss": -25.492252349853516, "global_step": 289094, "epoch": 3483} {"train_loss": -25.49338722229004, "global_step": 289095, "epoch": 3483} {"train_loss": -25.23752212524414, "global_step": 289096, "epoch": 3483} {"train_loss": -24.9481258392334, "global_step": 289097, "epoch": 3483} {"train_loss": -25.042470932006836, "global_step": 289098, "epoch": 3483} {"train_loss": -25.312036514282227, "global_step": 289099, "epoch": 3483} {"train_loss": -25.514760971069336, "global_step": 289100, "epoch": 3483} {"train_loss": -25.512224197387695, "global_step": 289101, "epoch": 3483} {"train_loss": -25.69766616821289, "global_step": 289102, "epoch": 3483} {"train_loss": -25.431005477905273, "global_step": 289103, "epoch": 3483} {"train_loss": -25.405942916870117, "global_step": 289104, "epoch": 3483} {"train_loss": -25.521041870117188, "global_step": 289105, "epoch": 3483} {"train_loss": -25.21552276611328, "global_step": 289106, "epoch": 3483} {"train_loss": -25.641077041625977, "global_step": 289107, "epoch": 3483} {"train_loss": -25.447757720947266, "global_step": 289108, "epoch": 3483} {"train_loss": -25.544692993164062, "global_step": 289109, "epoch": 3483} {"train_loss": -25.28466796875, "global_step": 289110, "epoch": 3483} {"train_loss": -25.334531784057617, "global_step": 289111, "epoch": 3483} {"train_loss": -25.510120391845703, "global_step": 289112, "epoch": 3483} {"train_loss": -25.289562225341797, "global_step": 289113, "epoch": 3483} {"train_loss": -25.193830490112305, "global_step": 289114, "epoch": 3483} {"train_loss": -25.357160568237305, "global_step": 289115, "epoch": 3483} {"train_loss": -25.18985366821289, "global_step": 289116, "epoch": 3483} {"train_loss": -25.38772201538086, "global_step": 289117, "epoch": 3483} {"train_loss": -25.555944442749023, "global_step": 289118, "epoch": 3483} {"train_loss": -24.952905654907227, "global_step": 289119, "epoch": 3483} {"train_loss": -25.641437530517578, "global_step": 289120, "epoch": 3483} {"train_loss": -25.384235382080078, "global_step": 289121, "epoch": 3483} {"train_loss": -25.57245445251465, "global_step": 289122, "epoch": 3483} {"train_loss": -25.378870010375977, "global_step": 289123, "epoch": 3483} {"train_loss": -25.755237579345703, "global_step": 289124, "epoch": 3483} {"train_loss": -25.58229637145996, "global_step": 289125, "epoch": 3483} {"train_loss": -25.848712921142578, "global_step": 289126, "epoch": 3483} {"train_loss": -25.274066925048828, "global_step": 289127, "epoch": 3483} {"train_loss": -25.609949111938477, "global_step": 289128, "epoch": 3483} {"train_loss": -25.3565673828125, "global_step": 289129, "epoch": 3483} {"train_loss": -25.5833683013916, "global_step": 289130, "epoch": 3483} {"train_loss": -25.655256271362305, "global_step": 289131, "epoch": 3483} {"train_loss": -25.757007598876953, "global_step": 289132, "epoch": 3483} {"train_loss": -25.286699295043945, "global_step": 289133, "epoch": 3483} {"train_loss": -25.390644073486328, "global_step": 289134, "epoch": 3483} {"train_loss": -25.54949951171875, "global_step": 289135, "epoch": 3483} {"train_loss": -25.730712890625, "global_step": 289136, "epoch": 3483} {"train_loss": -25.61675453186035, "global_step": 289137, "epoch": 3483} {"train_loss": -25.595861434936523, "global_step": 289138, "epoch": 3483} {"train_loss": -25.893198013305664, "global_step": 289139, "epoch": 3483} {"train_loss": -25.7623233795166, "global_step": 289140, "epoch": 3483} {"train_loss": -25.860013961791992, "global_step": 289141, "epoch": 3483} {"train_loss": -25.753253936767578, "global_step": 289142, "epoch": 3483} {"train_loss": -25.43583106994629, "global_step": 289143, "epoch": 3483} {"train_loss": -25.505435943603516, "global_step": 289144, "epoch": 3483} {"train_loss": -26.014678955078125, "global_step": 289145, "epoch": 3483} {"train_loss": -25.65675926208496, "global_step": 289146, "epoch": 3483} {"train_loss": -25.768476486206055, "global_step": 289147, "epoch": 3483} {"train_loss": -25.608673095703125, "global_step": 289148, "epoch": 3483} {"train_loss": -25.823453903198242, "global_step": 289149, "epoch": 3483} {"train_loss": -25.457828521728516, "global_step": 289150, "epoch": 3483} {"train_loss": -25.281692504882812, "global_step": 289151, "epoch": 3483} {"train_loss": -25.21997833251953, "global_step": 289152, "epoch": 3483} {"train_loss": -25.008609771728516, "global_step": 289153, "epoch": 3483} {"train_loss": -25.538183212280273, "global_step": 289154, "epoch": 3483} {"train_loss": -25.56741714477539, "global_step": 289155, "epoch": 3483} {"train_loss": -24.901304244995117, "global_step": 289156, "epoch": 3483} {"train_loss": -25.355302810668945, "global_step": 289157, "epoch": 3483} {"train_loss": -24.933164596557617, "global_step": 289158, "epoch": 3483} {"train_loss": -25.576065063476562, "global_step": 289159, "epoch": 3483} {"train_loss": -25.515974044799805, "global_step": 289160, "epoch": 3483} {"train_loss": -25.070877075195312, "global_step": 289161, "epoch": 3483} {"train_loss": -25.698963165283203, "global_step": 289162, "epoch": 3483} {"train_loss": -25.195194244384766, "global_step": 289163, "epoch": 3483} {"train_loss": -24.747297286987305, "global_step": 289164, "epoch": 3483} {"train_loss": -24.928024291992188, "global_step": 289165, "epoch": 3483} {"train_loss": -25.17381477355957, "global_step": 289166, "epoch": 3483} {"train_loss": -25.107807159423828, "global_step": 289167, "epoch": 3483} {"train_loss": -24.816648483276367, "global_step": 289168, "epoch": 3483} {"train_loss": -25.409521102905273, "global_step": 289169, "epoch": 3483} {"train_loss": -25.117551803588867, "global_step": 289170, "epoch": 3483} {"train_loss": -25.39366152200354, "global_step": 289171, "epoch": 3483, "val_loss": 7239694.0} {"train_loss": -24.954025268554688, "global_step": 289172, "epoch": 3484} {"train_loss": -25.073484420776367, "global_step": 289173, "epoch": 3484} {"train_loss": -24.84483528137207, "global_step": 289174, "epoch": 3484} {"train_loss": -24.926319122314453, "global_step": 289175, "epoch": 3484} {"train_loss": -24.775177001953125, "global_step": 289176, "epoch": 3484} {"train_loss": -24.983627319335938, "global_step": 289177, "epoch": 3484} {"train_loss": -25.00396728515625, "global_step": 289178, "epoch": 3484} {"train_loss": -25.297927856445312, "global_step": 289179, "epoch": 3484} {"train_loss": -25.14095115661621, "global_step": 289180, "epoch": 3484} {"train_loss": -25.061832427978516, "global_step": 289181, "epoch": 3484} {"train_loss": -25.120101928710938, "global_step": 289182, "epoch": 3484} {"train_loss": -25.315839767456055, "global_step": 289183, "epoch": 3484} {"train_loss": -25.599592208862305, "global_step": 289184, "epoch": 3484} {"train_loss": -25.154258728027344, "global_step": 289185, "epoch": 3484} {"train_loss": -25.624542236328125, "global_step": 289186, "epoch": 3484} {"train_loss": -25.21662712097168, "global_step": 289187, "epoch": 3484} {"train_loss": -25.052778244018555, "global_step": 289188, "epoch": 3484} {"train_loss": -25.369726181030273, "global_step": 289189, "epoch": 3484} {"train_loss": -25.415489196777344, "global_step": 289190, "epoch": 3484} {"train_loss": -25.55060386657715, "global_step": 289191, "epoch": 3484} {"train_loss": -25.48433494567871, "global_step": 289192, "epoch": 3484} {"train_loss": -25.7706298828125, "global_step": 289193, "epoch": 3484} {"train_loss": -25.542722702026367, "global_step": 289194, "epoch": 3484} {"train_loss": -25.422916412353516, "global_step": 289195, "epoch": 3484} {"train_loss": -25.407926559448242, "global_step": 289196, "epoch": 3484} {"train_loss": -25.70353126525879, "global_step": 289197, "epoch": 3484} {"train_loss": -25.387319564819336, "global_step": 289198, "epoch": 3484} {"train_loss": -25.3481502532959, "global_step": 289199, "epoch": 3484} {"train_loss": -24.84079933166504, "global_step": 289200, "epoch": 3484} {"train_loss": -25.240833282470703, "global_step": 289201, "epoch": 3484} {"train_loss": -25.335180282592773, "global_step": 289202, "epoch": 3484} {"train_loss": -25.481891632080078, "global_step": 289203, "epoch": 3484} {"train_loss": -25.480512619018555, "global_step": 289204, "epoch": 3484} {"train_loss": -25.380699157714844, "global_step": 289205, "epoch": 3484} {"train_loss": -25.54840660095215, "global_step": 289206, "epoch": 3484} {"train_loss": -25.750646591186523, "global_step": 289207, "epoch": 3484} {"train_loss": -25.38513946533203, "global_step": 289208, "epoch": 3484} {"train_loss": -25.768491744995117, "global_step": 289209, "epoch": 3484} {"train_loss": -25.56775665283203, "global_step": 289210, "epoch": 3484} {"train_loss": -25.59842300415039, "global_step": 289211, "epoch": 3484} {"train_loss": -25.59006118774414, "global_step": 289212, "epoch": 3484} {"train_loss": -25.64044189453125, "global_step": 289213, "epoch": 3484} {"train_loss": -25.783308029174805, "global_step": 289214, "epoch": 3484} {"train_loss": -25.528928756713867, "global_step": 289215, "epoch": 3484} {"train_loss": -25.623998641967773, "global_step": 289216, "epoch": 3484} {"train_loss": -25.62750244140625, "global_step": 289217, "epoch": 3484} {"train_loss": -25.378042221069336, "global_step": 289218, "epoch": 3484} {"train_loss": -26.11322021484375, "global_step": 289219, "epoch": 3484} {"train_loss": -25.90708351135254, "global_step": 289220, "epoch": 3484} {"train_loss": -25.212379455566406, "global_step": 289221, "epoch": 3484} {"train_loss": -25.350622177124023, "global_step": 289222, "epoch": 3484} {"train_loss": -24.954938888549805, "global_step": 289223, "epoch": 3484} {"train_loss": -25.212453842163086, "global_step": 289224, "epoch": 3484} {"train_loss": -25.815265655517578, "global_step": 289225, "epoch": 3484} {"train_loss": -24.963788986206055, "global_step": 289226, "epoch": 3484} {"train_loss": -25.262117385864258, "global_step": 289227, "epoch": 3484} {"train_loss": -25.85914421081543, "global_step": 289228, "epoch": 3484} {"train_loss": -24.687047958374023, "global_step": 289229, "epoch": 3484} {"train_loss": -25.10967254638672, "global_step": 289230, "epoch": 3484} {"train_loss": -25.389169692993164, "global_step": 289231, "epoch": 3484} {"train_loss": -25.26500701904297, "global_step": 289232, "epoch": 3484} {"train_loss": -24.963542938232422, "global_step": 289233, "epoch": 3484} {"train_loss": -25.34798240661621, "global_step": 289234, "epoch": 3484} {"train_loss": -25.303510665893555, "global_step": 289235, "epoch": 3484} {"train_loss": -24.9633846282959, "global_step": 289236, "epoch": 3484} {"train_loss": -25.357946395874023, "global_step": 289237, "epoch": 3484} {"train_loss": -25.411619186401367, "global_step": 289238, "epoch": 3484} {"train_loss": -25.443960189819336, "global_step": 289239, "epoch": 3484} {"train_loss": -25.522445678710938, "global_step": 289240, "epoch": 3484} {"train_loss": -25.166671752929688, "global_step": 289241, "epoch": 3484} {"train_loss": -25.10536766052246, "global_step": 289242, "epoch": 3484} {"train_loss": -25.11065673828125, "global_step": 289243, "epoch": 3484} {"train_loss": -25.669158935546875, "global_step": 289244, "epoch": 3484} {"train_loss": -25.4836483001709, "global_step": 289245, "epoch": 3484} {"train_loss": -25.51068687438965, "global_step": 289246, "epoch": 3484} {"train_loss": -25.396076202392578, "global_step": 289247, "epoch": 3484} {"train_loss": -25.570999145507812, "global_step": 289248, "epoch": 3484} {"train_loss": -25.345434188842773, "global_step": 289249, "epoch": 3484} {"train_loss": -25.646100997924805, "global_step": 289250, "epoch": 3484} {"train_loss": -25.845458984375, "global_step": 289251, "epoch": 3484} {"train_loss": -25.349475860595703, "global_step": 289252, "epoch": 3484} {"train_loss": -25.328168869018555, "global_step": 289253, "epoch": 3484} {"train_loss": -25.364625126482494, "global_step": 289254, "epoch": 3484, "val_loss": 7117674.0} {"train_loss": -25.075284957885742, "global_step": 289255, "epoch": 3485} {"train_loss": -25.044815063476562, "global_step": 289256, "epoch": 3485} {"train_loss": -25.47224998474121, "global_step": 289257, "epoch": 3485} {"train_loss": -24.897918701171875, "global_step": 289258, "epoch": 3485} {"train_loss": -24.886474609375, "global_step": 289259, "epoch": 3485} {"train_loss": -25.7251033782959, "global_step": 289260, "epoch": 3485} {"train_loss": -25.22171974182129, "global_step": 289261, "epoch": 3485} {"train_loss": -25.252155303955078, "global_step": 289262, "epoch": 3485} {"train_loss": -25.37676429748535, "global_step": 289263, "epoch": 3485} {"train_loss": -25.396621704101562, "global_step": 289264, "epoch": 3485} {"train_loss": -25.175817489624023, "global_step": 289265, "epoch": 3485} {"train_loss": -25.72344970703125, "global_step": 289266, "epoch": 3485} {"train_loss": -25.40571403503418, "global_step": 289267, "epoch": 3485} {"train_loss": -25.42127799987793, "global_step": 289268, "epoch": 3485} {"train_loss": -25.10292625427246, "global_step": 289269, "epoch": 3485} {"train_loss": -25.744836807250977, "global_step": 289270, "epoch": 3485} {"train_loss": -25.43549919128418, "global_step": 289271, "epoch": 3485} {"train_loss": -25.49993324279785, "global_step": 289272, "epoch": 3485} {"train_loss": -25.52730941772461, "global_step": 289273, "epoch": 3485} {"train_loss": -25.42005729675293, "global_step": 289274, "epoch": 3485} {"train_loss": -25.29292869567871, "global_step": 289275, "epoch": 3485} {"train_loss": -25.560697555541992, "global_step": 289276, "epoch": 3485} {"train_loss": -25.679590225219727, "global_step": 289277, "epoch": 3485} {"train_loss": -25.577054977416992, "global_step": 289278, "epoch": 3485} {"train_loss": -25.1827449798584, "global_step": 289279, "epoch": 3485} {"train_loss": -25.247074127197266, "global_step": 289280, "epoch": 3485} {"train_loss": -25.33464241027832, "global_step": 289281, "epoch": 3485} {"train_loss": -25.78155517578125, "global_step": 289282, "epoch": 3485} {"train_loss": -25.69010353088379, "global_step": 289283, "epoch": 3485} {"train_loss": -25.80183219909668, "global_step": 289284, "epoch": 3485} {"train_loss": -25.798959732055664, "global_step": 289285, "epoch": 3485} {"train_loss": -25.7044677734375, "global_step": 289286, "epoch": 3485} {"train_loss": -25.80182456970215, "global_step": 289287, "epoch": 3485} {"train_loss": -25.38649559020996, "global_step": 289288, "epoch": 3485} {"train_loss": -25.934858322143555, "global_step": 289289, "epoch": 3485} {"train_loss": -25.655384063720703, "global_step": 289290, "epoch": 3485} {"train_loss": -25.503559112548828, "global_step": 289291, "epoch": 3485} {"train_loss": -25.59504508972168, "global_step": 289292, "epoch": 3485} {"train_loss": -25.356836318969727, "global_step": 289293, "epoch": 3485} {"train_loss": -25.676481246948242, "global_step": 289294, "epoch": 3485} {"train_loss": -25.489953994750977, "global_step": 289295, "epoch": 3485} {"train_loss": -25.67963981628418, "global_step": 289296, "epoch": 3485} {"train_loss": -25.530067443847656, "global_step": 289297, "epoch": 3485} {"train_loss": -25.275365829467773, "global_step": 289298, "epoch": 3485} {"train_loss": -25.302778244018555, "global_step": 289299, "epoch": 3485} {"train_loss": -25.417524337768555, "global_step": 289300, "epoch": 3485} {"train_loss": -25.410400390625, "global_step": 289301, "epoch": 3485} {"train_loss": -25.545759201049805, "global_step": 289302, "epoch": 3485} {"train_loss": -25.512697219848633, "global_step": 289303, "epoch": 3485} {"train_loss": -25.860631942749023, "global_step": 289304, "epoch": 3485} {"train_loss": -25.566831588745117, "global_step": 289305, "epoch": 3485} {"train_loss": -25.274017333984375, "global_step": 289306, "epoch": 3485} {"train_loss": -25.652851104736328, "global_step": 289307, "epoch": 3485} {"train_loss": -25.130788803100586, "global_step": 289308, "epoch": 3485} {"train_loss": -25.24532699584961, "global_step": 289309, "epoch": 3485} {"train_loss": -25.295135498046875, "global_step": 289310, "epoch": 3485} {"train_loss": -25.906213760375977, "global_step": 289311, "epoch": 3485} {"train_loss": -25.383787155151367, "global_step": 289312, "epoch": 3485} {"train_loss": -25.19025421142578, "global_step": 289313, "epoch": 3485} {"train_loss": -25.706939697265625, "global_step": 289314, "epoch": 3485} {"train_loss": -25.517993927001953, "global_step": 289315, "epoch": 3485} {"train_loss": -25.766565322875977, "global_step": 289316, "epoch": 3485} {"train_loss": -25.381364822387695, "global_step": 289317, "epoch": 3485} {"train_loss": -24.97316551208496, "global_step": 289318, "epoch": 3485} {"train_loss": -25.405784606933594, "global_step": 289319, "epoch": 3485} {"train_loss": -25.371810913085938, "global_step": 289320, "epoch": 3485} {"train_loss": -25.027250289916992, "global_step": 289321, "epoch": 3485} {"train_loss": -25.556129455566406, "global_step": 289322, "epoch": 3485} {"train_loss": -25.32166862487793, "global_step": 289323, "epoch": 3485} {"train_loss": -24.89379119873047, "global_step": 289324, "epoch": 3485} {"train_loss": -26.095722198486328, "global_step": 289325, "epoch": 3485} {"train_loss": -25.34150505065918, "global_step": 289326, "epoch": 3485} {"train_loss": -25.416370391845703, "global_step": 289327, "epoch": 3485} {"train_loss": -25.8085880279541, "global_step": 289328, "epoch": 3485} {"train_loss": -25.56867027282715, "global_step": 289329, "epoch": 3485} {"train_loss": -25.687030792236328, "global_step": 289330, "epoch": 3485} {"train_loss": -25.401626586914062, "global_step": 289331, "epoch": 3485} {"train_loss": -25.386301040649414, "global_step": 289332, "epoch": 3485} {"train_loss": -25.27571678161621, "global_step": 289333, "epoch": 3485} {"train_loss": -25.547948837280273, "global_step": 289334, "epoch": 3485} {"train_loss": -25.497434616088867, "global_step": 289335, "epoch": 3485} {"train_loss": -25.782825469970703, "global_step": 289336, "epoch": 3485} {"train_loss": -25.45708104788539, "global_step": 289337, "epoch": 3485, "val_loss": 7169727.5} {"train_loss": -25.235074996948242, "global_step": 289338, "epoch": 3486} {"train_loss": -25.38334846496582, "global_step": 289339, "epoch": 3486} {"train_loss": -24.57710838317871, "global_step": 289340, "epoch": 3486} {"train_loss": -25.367523193359375, "global_step": 289341, "epoch": 3486} {"train_loss": -25.007429122924805, "global_step": 289342, "epoch": 3486} {"train_loss": -25.2701416015625, "global_step": 289343, "epoch": 3486} {"train_loss": -25.50813102722168, "global_step": 289344, "epoch": 3486} {"train_loss": -24.823217391967773, "global_step": 289345, "epoch": 3486} {"train_loss": -25.378095626831055, "global_step": 289346, "epoch": 3486} {"train_loss": -25.14829444885254, "global_step": 289347, "epoch": 3486} {"train_loss": -25.1339168548584, "global_step": 289348, "epoch": 3486} {"train_loss": -25.105022430419922, "global_step": 289349, "epoch": 3486} {"train_loss": -25.335012435913086, "global_step": 289350, "epoch": 3486} {"train_loss": -25.4561824798584, "global_step": 289351, "epoch": 3486} {"train_loss": -25.365571975708008, "global_step": 289352, "epoch": 3486} {"train_loss": -25.172101974487305, "global_step": 289353, "epoch": 3486} {"train_loss": -25.608266830444336, "global_step": 289354, "epoch": 3486} {"train_loss": -25.682363510131836, "global_step": 289355, "epoch": 3486} {"train_loss": -25.112476348876953, "global_step": 289356, "epoch": 3486} {"train_loss": -25.225156784057617, "global_step": 289357, "epoch": 3486} {"train_loss": -25.444353103637695, "global_step": 289358, "epoch": 3486} {"train_loss": -25.366992950439453, "global_step": 289359, "epoch": 3486} {"train_loss": -25.43062973022461, "global_step": 289360, "epoch": 3486} {"train_loss": -25.387454986572266, "global_step": 289361, "epoch": 3486} {"train_loss": -25.44287872314453, "global_step": 289362, "epoch": 3486} {"train_loss": -25.50046157836914, "global_step": 289363, "epoch": 3486} {"train_loss": -25.416669845581055, "global_step": 289364, "epoch": 3486} {"train_loss": -25.198148727416992, "global_step": 289365, "epoch": 3486} {"train_loss": -25.23519515991211, "global_step": 289366, "epoch": 3486} {"train_loss": -25.378171920776367, "global_step": 289367, "epoch": 3486} {"train_loss": -25.39055824279785, "global_step": 289368, "epoch": 3486} {"train_loss": -25.36610984802246, "global_step": 289369, "epoch": 3486} {"train_loss": -25.876667022705078, "global_step": 289370, "epoch": 3486} {"train_loss": -25.337278366088867, "global_step": 289371, "epoch": 3486} {"train_loss": -25.279361724853516, "global_step": 289372, "epoch": 3486} {"train_loss": -25.624662399291992, "global_step": 289373, "epoch": 3486} {"train_loss": -25.386005401611328, "global_step": 289374, "epoch": 3486} {"train_loss": -25.219301223754883, "global_step": 289375, "epoch": 3486} {"train_loss": -25.11294937133789, "global_step": 289376, "epoch": 3486} {"train_loss": -25.378389358520508, "global_step": 289377, "epoch": 3486} {"train_loss": -25.554885864257812, "global_step": 289378, "epoch": 3486} {"train_loss": -25.773162841796875, "global_step": 289379, "epoch": 3486} {"train_loss": -25.708332061767578, "global_step": 289380, "epoch": 3486} {"train_loss": -25.350690841674805, "global_step": 289381, "epoch": 3486} {"train_loss": -25.366933822631836, "global_step": 289382, "epoch": 3486} {"train_loss": -25.423019409179688, "global_step": 289383, "epoch": 3486} {"train_loss": -25.144773483276367, "global_step": 289384, "epoch": 3486} {"train_loss": -25.62952995300293, "global_step": 289385, "epoch": 3486} {"train_loss": -25.88276481628418, "global_step": 289386, "epoch": 3486} {"train_loss": -25.256092071533203, "global_step": 289387, "epoch": 3486} {"train_loss": -25.42658805847168, "global_step": 289388, "epoch": 3486} {"train_loss": -25.309999465942383, "global_step": 289389, "epoch": 3486} {"train_loss": -25.46605682373047, "global_step": 289390, "epoch": 3486} {"train_loss": -25.454763412475586, "global_step": 289391, "epoch": 3486} {"train_loss": -25.658573150634766, "global_step": 289392, "epoch": 3486} {"train_loss": -25.794126510620117, "global_step": 289393, "epoch": 3486} {"train_loss": -25.177255630493164, "global_step": 289394, "epoch": 3486} {"train_loss": -25.84817886352539, "global_step": 289395, "epoch": 3486} {"train_loss": -25.56540298461914, "global_step": 289396, "epoch": 3486} {"train_loss": -26.032041549682617, "global_step": 289397, "epoch": 3486} {"train_loss": -25.185527801513672, "global_step": 289398, "epoch": 3486} {"train_loss": -25.724714279174805, "global_step": 289399, "epoch": 3486} {"train_loss": -25.65989112854004, "global_step": 289400, "epoch": 3486} {"train_loss": -25.760135650634766, "global_step": 289401, "epoch": 3486} {"train_loss": -25.488889694213867, "global_step": 289402, "epoch": 3486} {"train_loss": -25.94300651550293, "global_step": 289403, "epoch": 3486} {"train_loss": -25.727294921875, "global_step": 289404, "epoch": 3486} {"train_loss": -25.704273223876953, "global_step": 289405, "epoch": 3486} {"train_loss": -26.20490074157715, "global_step": 289406, "epoch": 3486} {"train_loss": -25.734542846679688, "global_step": 289407, "epoch": 3486} {"train_loss": -25.8741397857666, "global_step": 289408, "epoch": 3486} {"train_loss": -25.463123321533203, "global_step": 289409, "epoch": 3486} {"train_loss": -25.965234756469727, "global_step": 289410, "epoch": 3486} {"train_loss": -25.99070167541504, "global_step": 289411, "epoch": 3486} {"train_loss": -25.300588607788086, "global_step": 289412, "epoch": 3486} {"train_loss": -26.129236221313477, "global_step": 289413, "epoch": 3486} {"train_loss": -25.802698135375977, "global_step": 289414, "epoch": 3486} {"train_loss": -25.70001792907715, "global_step": 289415, "epoch": 3486} {"train_loss": -25.68755531311035, "global_step": 289416, "epoch": 3486} {"train_loss": -25.388504028320312, "global_step": 289417, "epoch": 3486} {"train_loss": -25.65545654296875, "global_step": 289418, "epoch": 3486} {"train_loss": -25.55769157409668, "global_step": 289419, "epoch": 3486} {"train_loss": -25.49005168317312, "global_step": 289420, "epoch": 3486, "val_loss": 7061457.5} {"train_loss": -25.019113540649414, "global_step": 289421, "epoch": 3487} {"train_loss": -24.371261596679688, "global_step": 289422, "epoch": 3487} {"train_loss": -24.628612518310547, "global_step": 289423, "epoch": 3487} {"train_loss": -23.51279640197754, "global_step": 289424, "epoch": 3487} {"train_loss": -23.77791404724121, "global_step": 289425, "epoch": 3487} {"train_loss": -24.70875358581543, "global_step": 289426, "epoch": 3487} {"train_loss": -24.317716598510742, "global_step": 289427, "epoch": 3487} {"train_loss": -24.695571899414062, "global_step": 289428, "epoch": 3487} {"train_loss": -24.85637855529785, "global_step": 289429, "epoch": 3487} {"train_loss": -24.9114933013916, "global_step": 289430, "epoch": 3487} {"train_loss": -24.660375595092773, "global_step": 289431, "epoch": 3487} {"train_loss": -24.89467430114746, "global_step": 289432, "epoch": 3487} {"train_loss": -24.903459548950195, "global_step": 289433, "epoch": 3487} {"train_loss": -24.676271438598633, "global_step": 289434, "epoch": 3487} {"train_loss": -24.39191246032715, "global_step": 289435, "epoch": 3487} {"train_loss": -24.63071060180664, "global_step": 289436, "epoch": 3487} {"train_loss": -25.36281394958496, "global_step": 289437, "epoch": 3487} {"train_loss": -25.146848678588867, "global_step": 289438, "epoch": 3487} {"train_loss": -25.180448532104492, "global_step": 289439, "epoch": 3487} {"train_loss": -24.567211151123047, "global_step": 289440, "epoch": 3487} {"train_loss": -24.833484649658203, "global_step": 289441, "epoch": 3487} {"train_loss": -25.513906478881836, "global_step": 289442, "epoch": 3487} {"train_loss": -25.237512588500977, "global_step": 289443, "epoch": 3487} {"train_loss": -25.49123191833496, "global_step": 289444, "epoch": 3487} {"train_loss": -25.055944442749023, "global_step": 289445, "epoch": 3487} {"train_loss": -25.225553512573242, "global_step": 289446, "epoch": 3487} {"train_loss": -25.192691802978516, "global_step": 289447, "epoch": 3487} {"train_loss": -25.241872787475586, "global_step": 289448, "epoch": 3487} {"train_loss": -25.286945343017578, "global_step": 289449, "epoch": 3487} {"train_loss": -25.33949089050293, "global_step": 289450, "epoch": 3487} {"train_loss": -25.426237106323242, "global_step": 289451, "epoch": 3487} {"train_loss": -25.131437301635742, "global_step": 289452, "epoch": 3487} {"train_loss": -25.743778228759766, "global_step": 289453, "epoch": 3487} {"train_loss": -25.08995246887207, "global_step": 289454, "epoch": 3487} {"train_loss": -25.627206802368164, "global_step": 289455, "epoch": 3487} {"train_loss": -25.22589111328125, "global_step": 289456, "epoch": 3487} {"train_loss": -25.920068740844727, "global_step": 289457, "epoch": 3487} {"train_loss": -25.239320755004883, "global_step": 289458, "epoch": 3487} {"train_loss": -25.600305557250977, "global_step": 289459, "epoch": 3487} {"train_loss": -25.173786163330078, "global_step": 289460, "epoch": 3487} {"train_loss": -25.99019432067871, "global_step": 289461, "epoch": 3487} {"train_loss": -25.628082275390625, "global_step": 289462, "epoch": 3487} {"train_loss": -25.72762107849121, "global_step": 289463, "epoch": 3487} {"train_loss": -25.611265182495117, "global_step": 289464, "epoch": 3487} {"train_loss": -25.885364532470703, "global_step": 289465, "epoch": 3487} {"train_loss": -25.986425399780273, "global_step": 289466, "epoch": 3487} {"train_loss": -25.680261611938477, "global_step": 289467, "epoch": 3487} {"train_loss": -25.8637752532959, "global_step": 289468, "epoch": 3487} {"train_loss": -25.786985397338867, "global_step": 289469, "epoch": 3487} {"train_loss": -26.00288963317871, "global_step": 289470, "epoch": 3487} {"train_loss": -25.57847785949707, "global_step": 289471, "epoch": 3487} {"train_loss": -25.6940860748291, "global_step": 289472, "epoch": 3487} {"train_loss": -25.74369239807129, "global_step": 289473, "epoch": 3487} {"train_loss": -25.446269989013672, "global_step": 289474, "epoch": 3487} {"train_loss": -25.77962303161621, "global_step": 289475, "epoch": 3487} {"train_loss": -25.91951560974121, "global_step": 289476, "epoch": 3487} {"train_loss": -25.478010177612305, "global_step": 289477, "epoch": 3487} {"train_loss": -25.713159561157227, "global_step": 289478, "epoch": 3487} {"train_loss": -25.598064422607422, "global_step": 289479, "epoch": 3487} {"train_loss": -25.51870346069336, "global_step": 289480, "epoch": 3487} {"train_loss": -25.784887313842773, "global_step": 289481, "epoch": 3487} {"train_loss": -25.643295288085938, "global_step": 289482, "epoch": 3487} {"train_loss": -25.578407287597656, "global_step": 289483, "epoch": 3487} {"train_loss": -25.708179473876953, "global_step": 289484, "epoch": 3487} {"train_loss": -25.585432052612305, "global_step": 289485, "epoch": 3487} {"train_loss": -25.800989151000977, "global_step": 289486, "epoch": 3487} {"train_loss": -25.709293365478516, "global_step": 289487, "epoch": 3487} {"train_loss": -25.745670318603516, "global_step": 289488, "epoch": 3487} {"train_loss": -25.571069717407227, "global_step": 289489, "epoch": 3487} {"train_loss": -25.26863670349121, "global_step": 289490, "epoch": 3487} {"train_loss": -24.700910568237305, "global_step": 289491, "epoch": 3487} {"train_loss": -23.75558853149414, "global_step": 289492, "epoch": 3487} {"train_loss": -22.801416397094727, "global_step": 289493, "epoch": 3487} {"train_loss": -24.165800094604492, "global_step": 289494, "epoch": 3487} {"train_loss": -25.362668991088867, "global_step": 289495, "epoch": 3487} {"train_loss": -24.75205421447754, "global_step": 289496, "epoch": 3487} {"train_loss": -25.141931533813477, "global_step": 289497, "epoch": 3487} {"train_loss": -25.02235221862793, "global_step": 289498, "epoch": 3487} {"train_loss": -25.259429931640625, "global_step": 289499, "epoch": 3487} {"train_loss": -25.169464111328125, "global_step": 289500, "epoch": 3487} {"train_loss": -24.752197265625, "global_step": 289501, "epoch": 3487} {"train_loss": -25.260868072509766, "global_step": 289502, "epoch": 3487} {"train_loss": -25.215809672711842, "global_step": 289503, "epoch": 3487, "val_loss": 7171400.0} {"train_loss": -24.94960594177246, "global_step": 289504, "epoch": 3488} {"train_loss": -24.84893226623535, "global_step": 289505, "epoch": 3488} {"train_loss": -25.068227767944336, "global_step": 289506, "epoch": 3488} {"train_loss": -24.614572525024414, "global_step": 289507, "epoch": 3488} {"train_loss": -25.09181022644043, "global_step": 289508, "epoch": 3488} {"train_loss": -24.689929962158203, "global_step": 289509, "epoch": 3488} {"train_loss": -25.023223876953125, "global_step": 289510, "epoch": 3488} {"train_loss": -24.51664924621582, "global_step": 289511, "epoch": 3488} {"train_loss": -25.093820571899414, "global_step": 289512, "epoch": 3488} {"train_loss": -25.00416374206543, "global_step": 289513, "epoch": 3488} {"train_loss": -25.039640426635742, "global_step": 289514, "epoch": 3488} {"train_loss": -25.098054885864258, "global_step": 289515, "epoch": 3488} {"train_loss": -25.312192916870117, "global_step": 289516, "epoch": 3488} {"train_loss": -25.379968643188477, "global_step": 289517, "epoch": 3488} {"train_loss": -25.38355827331543, "global_step": 289518, "epoch": 3488} {"train_loss": -25.027864456176758, "global_step": 289519, "epoch": 3488} {"train_loss": -25.166040420532227, "global_step": 289520, "epoch": 3488} {"train_loss": -25.19823455810547, "global_step": 289521, "epoch": 3488} {"train_loss": -25.49074363708496, "global_step": 289522, "epoch": 3488} {"train_loss": -25.431753158569336, "global_step": 289523, "epoch": 3488} {"train_loss": -25.580368041992188, "global_step": 289524, "epoch": 3488} {"train_loss": -24.927820205688477, "global_step": 289525, "epoch": 3488} {"train_loss": -25.438323974609375, "global_step": 289526, "epoch": 3488} {"train_loss": -25.614309310913086, "global_step": 289527, "epoch": 3488} {"train_loss": -25.202943801879883, "global_step": 289528, "epoch": 3488} {"train_loss": -24.981040954589844, "global_step": 289529, "epoch": 3488} {"train_loss": -25.457687377929688, "global_step": 289530, "epoch": 3488} {"train_loss": -25.490095138549805, "global_step": 289531, "epoch": 3488} {"train_loss": -25.56097984313965, "global_step": 289532, "epoch": 3488} {"train_loss": -25.134328842163086, "global_step": 289533, "epoch": 3488} {"train_loss": -25.7614803314209, "global_step": 289534, "epoch": 3488} {"train_loss": -25.218339920043945, "global_step": 289535, "epoch": 3488} {"train_loss": -25.534196853637695, "global_step": 289536, "epoch": 3488} {"train_loss": -25.67276382446289, "global_step": 289537, "epoch": 3488} {"train_loss": -25.614912033081055, "global_step": 289538, "epoch": 3488} {"train_loss": -25.44801902770996, "global_step": 289539, "epoch": 3488} {"train_loss": -25.77947425842285, "global_step": 289540, "epoch": 3488} {"train_loss": -25.320322036743164, "global_step": 289541, "epoch": 3488} {"train_loss": -25.347923278808594, "global_step": 289542, "epoch": 3488} {"train_loss": -25.644012451171875, "global_step": 289543, "epoch": 3488} {"train_loss": -25.505647659301758, "global_step": 289544, "epoch": 3488} {"train_loss": -25.527708053588867, "global_step": 289545, "epoch": 3488} {"train_loss": -25.962738037109375, "global_step": 289546, "epoch": 3488} {"train_loss": -25.696990966796875, "global_step": 289547, "epoch": 3488} {"train_loss": -25.7050724029541, "global_step": 289548, "epoch": 3488} {"train_loss": -25.576936721801758, "global_step": 289549, "epoch": 3488} {"train_loss": -25.71895408630371, "global_step": 289550, "epoch": 3488} {"train_loss": -25.578535079956055, "global_step": 289551, "epoch": 3488} {"train_loss": -25.576887130737305, "global_step": 289552, "epoch": 3488} {"train_loss": -25.67829704284668, "global_step": 289553, "epoch": 3488} {"train_loss": -25.10112953186035, "global_step": 289554, "epoch": 3488} {"train_loss": -25.27471160888672, "global_step": 289555, "epoch": 3488} {"train_loss": -25.409809112548828, "global_step": 289556, "epoch": 3488} {"train_loss": -25.500232696533203, "global_step": 289557, "epoch": 3488} {"train_loss": -25.469240188598633, "global_step": 289558, "epoch": 3488} {"train_loss": -25.659971237182617, "global_step": 289559, "epoch": 3488} {"train_loss": -25.185415267944336, "global_step": 289560, "epoch": 3488} {"train_loss": -25.462430953979492, "global_step": 289561, "epoch": 3488} {"train_loss": -25.773868560791016, "global_step": 289562, "epoch": 3488} {"train_loss": -25.403982162475586, "global_step": 289563, "epoch": 3488} {"train_loss": -25.39139175415039, "global_step": 289564, "epoch": 3488} {"train_loss": -25.484586715698242, "global_step": 289565, "epoch": 3488} {"train_loss": -25.900287628173828, "global_step": 289566, "epoch": 3488} {"train_loss": -25.491287231445312, "global_step": 289567, "epoch": 3488} {"train_loss": -25.90911293029785, "global_step": 289568, "epoch": 3488} {"train_loss": -25.541894912719727, "global_step": 289569, "epoch": 3488} {"train_loss": -25.337600708007812, "global_step": 289570, "epoch": 3488} {"train_loss": -25.730009078979492, "global_step": 289571, "epoch": 3488} {"train_loss": -25.642911911010742, "global_step": 289572, "epoch": 3488} {"train_loss": -25.305150985717773, "global_step": 289573, "epoch": 3488} {"train_loss": -25.66338539123535, "global_step": 289574, "epoch": 3488} {"train_loss": -25.75690269470215, "global_step": 289575, "epoch": 3488} {"train_loss": -25.931995391845703, "global_step": 289576, "epoch": 3488} {"train_loss": -26.023221969604492, "global_step": 289577, "epoch": 3488} {"train_loss": -25.491989135742188, "global_step": 289578, "epoch": 3488} {"train_loss": -25.600448608398438, "global_step": 289579, "epoch": 3488} {"train_loss": -25.8527774810791, "global_step": 289580, "epoch": 3488} {"train_loss": -25.66193199157715, "global_step": 289581, "epoch": 3488} {"train_loss": -25.6326904296875, "global_step": 289582, "epoch": 3488} {"train_loss": -25.570974349975586, "global_step": 289583, "epoch": 3488} {"train_loss": -25.49899673461914, "global_step": 289584, "epoch": 3488} {"train_loss": -25.807819366455078, "global_step": 289585, "epoch": 3488} {"train_loss": -25.417662494153863, "global_step": 289586, "epoch": 3488, "val_loss": 7065050.0} {"train_loss": -24.65036964416504, "global_step": 289587, "epoch": 3489} {"train_loss": -23.684083938598633, "global_step": 289588, "epoch": 3489} {"train_loss": -23.323686599731445, "global_step": 289589, "epoch": 3489} {"train_loss": -24.01202392578125, "global_step": 289590, "epoch": 3489} {"train_loss": -24.970792770385742, "global_step": 289591, "epoch": 3489} {"train_loss": -24.091161727905273, "global_step": 289592, "epoch": 3489} {"train_loss": -24.393718719482422, "global_step": 289593, "epoch": 3489} {"train_loss": -25.16724395751953, "global_step": 289594, "epoch": 3489} {"train_loss": -24.847028732299805, "global_step": 289595, "epoch": 3489} {"train_loss": -24.836809158325195, "global_step": 289596, "epoch": 3489} {"train_loss": -24.844816207885742, "global_step": 289597, "epoch": 3489} {"train_loss": -25.156877517700195, "global_step": 289598, "epoch": 3489} {"train_loss": -24.861648559570312, "global_step": 289599, "epoch": 3489} {"train_loss": -24.758634567260742, "global_step": 289600, "epoch": 3489} {"train_loss": -25.057859420776367, "global_step": 289601, "epoch": 3489} {"train_loss": -24.669477462768555, "global_step": 289602, "epoch": 3489} {"train_loss": -25.227569580078125, "global_step": 289603, "epoch": 3489} {"train_loss": -24.735107421875, "global_step": 289604, "epoch": 3489} {"train_loss": -25.08851432800293, "global_step": 289605, "epoch": 3489} {"train_loss": -25.154569625854492, "global_step": 289606, "epoch": 3489} {"train_loss": -25.126636505126953, "global_step": 289607, "epoch": 3489} {"train_loss": -24.911922454833984, "global_step": 289608, "epoch": 3489} {"train_loss": -24.908370971679688, "global_step": 289609, "epoch": 3489} {"train_loss": -25.533172607421875, "global_step": 289610, "epoch": 3489} {"train_loss": -25.379030227661133, "global_step": 289611, "epoch": 3489} {"train_loss": -25.43017578125, "global_step": 289612, "epoch": 3489} {"train_loss": -24.993431091308594, "global_step": 289613, "epoch": 3489} {"train_loss": -25.439720153808594, "global_step": 289614, "epoch": 3489} {"train_loss": -25.266435623168945, "global_step": 289615, "epoch": 3489} {"train_loss": -25.37415885925293, "global_step": 289616, "epoch": 3489} {"train_loss": -25.352294921875, "global_step": 289617, "epoch": 3489} {"train_loss": -25.215585708618164, "global_step": 289618, "epoch": 3489} {"train_loss": -25.59287452697754, "global_step": 289619, "epoch": 3489} {"train_loss": -25.84327507019043, "global_step": 289620, "epoch": 3489} {"train_loss": -25.48967170715332, "global_step": 289621, "epoch": 3489} {"train_loss": -25.708341598510742, "global_step": 289622, "epoch": 3489} {"train_loss": -25.800031661987305, "global_step": 289623, "epoch": 3489} {"train_loss": -25.546052932739258, "global_step": 289624, "epoch": 3489} {"train_loss": -25.471330642700195, "global_step": 289625, "epoch": 3489} {"train_loss": -25.450735092163086, "global_step": 289626, "epoch": 3489} {"train_loss": -25.392139434814453, "global_step": 289627, "epoch": 3489} {"train_loss": -25.499916076660156, "global_step": 289628, "epoch": 3489} {"train_loss": -25.537464141845703, "global_step": 289629, "epoch": 3489} {"train_loss": -25.60721778869629, "global_step": 289630, "epoch": 3489} {"train_loss": -25.695877075195312, "global_step": 289631, "epoch": 3489} {"train_loss": -25.467222213745117, "global_step": 289632, "epoch": 3489} {"train_loss": -25.631223678588867, "global_step": 289633, "epoch": 3489} {"train_loss": -25.639938354492188, "global_step": 289634, "epoch": 3489} {"train_loss": -25.503564834594727, "global_step": 289635, "epoch": 3489} {"train_loss": -25.427762985229492, "global_step": 289636, "epoch": 3489} {"train_loss": -25.410432815551758, "global_step": 289637, "epoch": 3489} {"train_loss": -25.669363021850586, "global_step": 289638, "epoch": 3489} {"train_loss": -25.59795570373535, "global_step": 289639, "epoch": 3489} {"train_loss": -25.27104949951172, "global_step": 289640, "epoch": 3489} {"train_loss": -25.540958404541016, "global_step": 289641, "epoch": 3489} {"train_loss": -25.49736976623535, "global_step": 289642, "epoch": 3489} {"train_loss": -25.691436767578125, "global_step": 289643, "epoch": 3489} {"train_loss": -25.35414695739746, "global_step": 289644, "epoch": 3489} {"train_loss": -25.513025283813477, "global_step": 289645, "epoch": 3489} {"train_loss": -25.51308250427246, "global_step": 289646, "epoch": 3489} {"train_loss": -25.652740478515625, "global_step": 289647, "epoch": 3489} {"train_loss": -25.74134635925293, "global_step": 289648, "epoch": 3489} {"train_loss": -25.44575309753418, "global_step": 289649, "epoch": 3489} {"train_loss": -25.528310775756836, "global_step": 289650, "epoch": 3489} {"train_loss": -25.523595809936523, "global_step": 289651, "epoch": 3489} {"train_loss": -25.573728561401367, "global_step": 289652, "epoch": 3489} {"train_loss": -25.177505493164062, "global_step": 289653, "epoch": 3489} {"train_loss": -25.837421417236328, "global_step": 289654, "epoch": 3489} {"train_loss": -25.681177139282227, "global_step": 289655, "epoch": 3489} {"train_loss": -25.625598907470703, "global_step": 289656, "epoch": 3489} {"train_loss": -25.83881187438965, "global_step": 289657, "epoch": 3489} {"train_loss": -25.905166625976562, "global_step": 289658, "epoch": 3489} {"train_loss": -25.252933502197266, "global_step": 289659, "epoch": 3489} {"train_loss": -25.709747314453125, "global_step": 289660, "epoch": 3489} {"train_loss": -25.494117736816406, "global_step": 289661, "epoch": 3489} {"train_loss": -25.6894588470459, "global_step": 289662, "epoch": 3489} {"train_loss": -25.56375503540039, "global_step": 289663, "epoch": 3489} {"train_loss": -25.4786434173584, "global_step": 289664, "epoch": 3489} {"train_loss": -25.723569869995117, "global_step": 289665, "epoch": 3489} {"train_loss": -25.79859733581543, "global_step": 289666, "epoch": 3489} {"train_loss": -25.775711059570312, "global_step": 289667, "epoch": 3489} {"train_loss": -25.854516983032227, "global_step": 289668, "epoch": 3489} {"train_loss": -25.314226656074982, "global_step": 289669, "epoch": 3489, "val_loss": 7170602.0} {"train_loss": -23.257144927978516, "global_step": 289670, "epoch": 3490} {"train_loss": -22.360334396362305, "global_step": 289671, "epoch": 3490} {"train_loss": -22.65184211730957, "global_step": 289672, "epoch": 3490} {"train_loss": -24.217947006225586, "global_step": 289673, "epoch": 3490} {"train_loss": -22.764982223510742, "global_step": 289674, "epoch": 3490} {"train_loss": -22.95343589782715, "global_step": 289675, "epoch": 3490} {"train_loss": -24.139272689819336, "global_step": 289676, "epoch": 3490} {"train_loss": -23.832122802734375, "global_step": 289677, "epoch": 3490} {"train_loss": -24.01919937133789, "global_step": 289678, "epoch": 3490} {"train_loss": -23.992496490478516, "global_step": 289679, "epoch": 3490} {"train_loss": -23.628087997436523, "global_step": 289680, "epoch": 3490} {"train_loss": -24.10879135131836, "global_step": 289681, "epoch": 3490} {"train_loss": -24.26350975036621, "global_step": 289682, "epoch": 3490} {"train_loss": -23.89984130859375, "global_step": 289683, "epoch": 3490} {"train_loss": -24.398786544799805, "global_step": 289684, "epoch": 3490} {"train_loss": -24.525102615356445, "global_step": 289685, "epoch": 3490} {"train_loss": -24.370471954345703, "global_step": 289686, "epoch": 3490} {"train_loss": -24.584430694580078, "global_step": 289687, "epoch": 3490} {"train_loss": -24.301488876342773, "global_step": 289688, "epoch": 3490} {"train_loss": -24.474510192871094, "global_step": 289689, "epoch": 3490} {"train_loss": -24.80910301208496, "global_step": 289690, "epoch": 3490} {"train_loss": -24.72313117980957, "global_step": 289691, "epoch": 3490} {"train_loss": -24.614288330078125, "global_step": 289692, "epoch": 3490} {"train_loss": -24.486135482788086, "global_step": 289693, "epoch": 3490} {"train_loss": -25.004179000854492, "global_step": 289694, "epoch": 3490} {"train_loss": -25.070825576782227, "global_step": 289695, "epoch": 3490} {"train_loss": -24.861135482788086, "global_step": 289696, "epoch": 3490} {"train_loss": -24.749744415283203, "global_step": 289697, "epoch": 3490} {"train_loss": -24.904386520385742, "global_step": 289698, "epoch": 3490} {"train_loss": -25.06394386291504, "global_step": 289699, "epoch": 3490} {"train_loss": -24.874242782592773, "global_step": 289700, "epoch": 3490} {"train_loss": -25.18255043029785, "global_step": 289701, "epoch": 3490} {"train_loss": -25.265531539916992, "global_step": 289702, "epoch": 3490} {"train_loss": -25.33428192138672, "global_step": 289703, "epoch": 3490} {"train_loss": -25.31263542175293, "global_step": 289704, "epoch": 3490} {"train_loss": -24.96516227722168, "global_step": 289705, "epoch": 3490} {"train_loss": -25.1090145111084, "global_step": 289706, "epoch": 3490} {"train_loss": -25.32887077331543, "global_step": 289707, "epoch": 3490} {"train_loss": -25.164691925048828, "global_step": 289708, "epoch": 3490} {"train_loss": -25.52773094177246, "global_step": 289709, "epoch": 3490} {"train_loss": -25.346637725830078, "global_step": 289710, "epoch": 3490} {"train_loss": -25.51899528503418, "global_step": 289711, "epoch": 3490} {"train_loss": -25.448627471923828, "global_step": 289712, "epoch": 3490} {"train_loss": -25.482255935668945, "global_step": 289713, "epoch": 3490} {"train_loss": -25.606882095336914, "global_step": 289714, "epoch": 3490} {"train_loss": -25.441247940063477, "global_step": 289715, "epoch": 3490} {"train_loss": -25.826658248901367, "global_step": 289716, "epoch": 3490} {"train_loss": -25.3956356048584, "global_step": 289717, "epoch": 3490} {"train_loss": -25.627674102783203, "global_step": 289718, "epoch": 3490} {"train_loss": -25.53761863708496, "global_step": 289719, "epoch": 3490} {"train_loss": -25.35184097290039, "global_step": 289720, "epoch": 3490} {"train_loss": -25.709081649780273, "global_step": 289721, "epoch": 3490} {"train_loss": -25.639450073242188, "global_step": 289722, "epoch": 3490} {"train_loss": -25.624860763549805, "global_step": 289723, "epoch": 3490} {"train_loss": -25.385404586791992, "global_step": 289724, "epoch": 3490} {"train_loss": -25.478635787963867, "global_step": 289725, "epoch": 3490} {"train_loss": -25.44388198852539, "global_step": 289726, "epoch": 3490} {"train_loss": -25.2758731842041, "global_step": 289727, "epoch": 3490} {"train_loss": -25.229692459106445, "global_step": 289728, "epoch": 3490} {"train_loss": -25.468564987182617, "global_step": 289729, "epoch": 3490} {"train_loss": -25.747440338134766, "global_step": 289730, "epoch": 3490} {"train_loss": -25.78043556213379, "global_step": 289731, "epoch": 3490} {"train_loss": -25.31926727294922, "global_step": 289732, "epoch": 3490} {"train_loss": -25.344934463500977, "global_step": 289733, "epoch": 3490} {"train_loss": -25.490060806274414, "global_step": 289734, "epoch": 3490} {"train_loss": -25.7742977142334, "global_step": 289735, "epoch": 3490} {"train_loss": -25.43548583984375, "global_step": 289736, "epoch": 3490} {"train_loss": -25.62235450744629, "global_step": 289737, "epoch": 3490} {"train_loss": -25.60699462890625, "global_step": 289738, "epoch": 3490} {"train_loss": -25.6348934173584, "global_step": 289739, "epoch": 3490} {"train_loss": -25.87233543395996, "global_step": 289740, "epoch": 3490} {"train_loss": -25.49309730529785, "global_step": 289741, "epoch": 3490} {"train_loss": -25.635086059570312, "global_step": 289742, "epoch": 3490} {"train_loss": -25.64979362487793, "global_step": 289743, "epoch": 3490} {"train_loss": -25.6810359954834, "global_step": 289744, "epoch": 3490} {"train_loss": -25.707141876220703, "global_step": 289745, "epoch": 3490} {"train_loss": -25.27955436706543, "global_step": 289746, "epoch": 3490} {"train_loss": -25.73785400390625, "global_step": 289747, "epoch": 3490} {"train_loss": -25.54090118408203, "global_step": 289748, "epoch": 3490} {"train_loss": -25.35451889038086, "global_step": 289749, "epoch": 3490} {"train_loss": -25.19585418701172, "global_step": 289750, "epoch": 3490} {"train_loss": -25.842437744140625, "global_step": 289751, "epoch": 3490} {"train_loss": -25.007397663162415, "global_step": 289752, "epoch": 3490, "val_loss": 7124316.0} {"train_loss": -25.232263565063477, "global_step": 289753, "epoch": 3491} {"train_loss": -25.165058135986328, "global_step": 289754, "epoch": 3491} {"train_loss": -24.823505401611328, "global_step": 289755, "epoch": 3491} {"train_loss": -25.046613693237305, "global_step": 289756, "epoch": 3491} {"train_loss": -24.85186004638672, "global_step": 289757, "epoch": 3491} {"train_loss": -24.94025993347168, "global_step": 289758, "epoch": 3491} {"train_loss": -24.780590057373047, "global_step": 289759, "epoch": 3491} {"train_loss": -24.7257022857666, "global_step": 289760, "epoch": 3491} {"train_loss": -24.935773849487305, "global_step": 289761, "epoch": 3491} {"train_loss": -25.01740074157715, "global_step": 289762, "epoch": 3491} {"train_loss": -25.2689151763916, "global_step": 289763, "epoch": 3491} {"train_loss": -25.203163146972656, "global_step": 289764, "epoch": 3491} {"train_loss": -25.43756675720215, "global_step": 289765, "epoch": 3491} {"train_loss": -25.296741485595703, "global_step": 289766, "epoch": 3491} {"train_loss": -25.209680557250977, "global_step": 289767, "epoch": 3491} {"train_loss": -25.64312744140625, "global_step": 289768, "epoch": 3491} {"train_loss": -25.09199333190918, "global_step": 289769, "epoch": 3491} {"train_loss": -25.293272018432617, "global_step": 289770, "epoch": 3491} {"train_loss": -25.1315860748291, "global_step": 289771, "epoch": 3491} {"train_loss": -25.42410659790039, "global_step": 289772, "epoch": 3491} {"train_loss": -25.126516342163086, "global_step": 289773, "epoch": 3491} {"train_loss": -25.692779541015625, "global_step": 289774, "epoch": 3491} {"train_loss": -25.585124969482422, "global_step": 289775, "epoch": 3491} {"train_loss": -25.7047119140625, "global_step": 289776, "epoch": 3491} {"train_loss": -25.474042892456055, "global_step": 289777, "epoch": 3491} {"train_loss": -25.665979385375977, "global_step": 289778, "epoch": 3491} {"train_loss": -25.528125762939453, "global_step": 289779, "epoch": 3491} {"train_loss": -25.3972110748291, "global_step": 289780, "epoch": 3491} {"train_loss": -25.39876365661621, "global_step": 289781, "epoch": 3491} {"train_loss": -25.6265811920166, "global_step": 289782, "epoch": 3491} {"train_loss": -25.681995391845703, "global_step": 289783, "epoch": 3491} {"train_loss": -25.610822677612305, "global_step": 289784, "epoch": 3491} {"train_loss": -25.598468780517578, "global_step": 289785, "epoch": 3491} {"train_loss": -25.73783302307129, "global_step": 289786, "epoch": 3491} {"train_loss": -25.481224060058594, "global_step": 289787, "epoch": 3491} {"train_loss": -25.81414794921875, "global_step": 289788, "epoch": 3491} {"train_loss": -26.035444259643555, "global_step": 289789, "epoch": 3491} {"train_loss": -25.617650985717773, "global_step": 289790, "epoch": 3491} {"train_loss": -25.699033737182617, "global_step": 289791, "epoch": 3491} {"train_loss": -25.68778419494629, "global_step": 289792, "epoch": 3491} {"train_loss": -25.400861740112305, "global_step": 289793, "epoch": 3491} {"train_loss": -25.80165672302246, "global_step": 289794, "epoch": 3491} {"train_loss": -25.78241539001465, "global_step": 289795, "epoch": 3491} {"train_loss": -25.613157272338867, "global_step": 289796, "epoch": 3491} {"train_loss": -25.37406349182129, "global_step": 289797, "epoch": 3491} {"train_loss": -26.135456085205078, "global_step": 289798, "epoch": 3491} {"train_loss": -25.658109664916992, "global_step": 289799, "epoch": 3491} {"train_loss": -25.076812744140625, "global_step": 289800, "epoch": 3491} {"train_loss": -25.443912506103516, "global_step": 289801, "epoch": 3491} {"train_loss": -25.925825119018555, "global_step": 289802, "epoch": 3491} {"train_loss": -25.647314071655273, "global_step": 289803, "epoch": 3491} {"train_loss": -25.71644401550293, "global_step": 289804, "epoch": 3491} {"train_loss": -25.17447853088379, "global_step": 289805, "epoch": 3491} {"train_loss": -25.981266021728516, "global_step": 289806, "epoch": 3491} {"train_loss": -25.264997482299805, "global_step": 289807, "epoch": 3491} {"train_loss": -25.320999145507812, "global_step": 289808, "epoch": 3491} {"train_loss": -24.735309600830078, "global_step": 289809, "epoch": 3491} {"train_loss": -25.048208236694336, "global_step": 289810, "epoch": 3491} {"train_loss": -25.429777145385742, "global_step": 289811, "epoch": 3491} {"train_loss": -25.350873947143555, "global_step": 289812, "epoch": 3491} {"train_loss": -25.74778175354004, "global_step": 289813, "epoch": 3491} {"train_loss": -25.575796127319336, "global_step": 289814, "epoch": 3491} {"train_loss": -25.37306022644043, "global_step": 289815, "epoch": 3491} {"train_loss": -25.499113082885742, "global_step": 289816, "epoch": 3491} {"train_loss": -25.51614761352539, "global_step": 289817, "epoch": 3491} {"train_loss": -25.613218307495117, "global_step": 289818, "epoch": 3491} {"train_loss": -25.46295738220215, "global_step": 289819, "epoch": 3491} {"train_loss": -25.65239906311035, "global_step": 289820, "epoch": 3491} {"train_loss": -25.28682518005371, "global_step": 289821, "epoch": 3491} {"train_loss": -25.62060546875, "global_step": 289822, "epoch": 3491} {"train_loss": -25.38620376586914, "global_step": 289823, "epoch": 3491} {"train_loss": -25.770172119140625, "global_step": 289824, "epoch": 3491} {"train_loss": -25.646820068359375, "global_step": 289825, "epoch": 3491} {"train_loss": -25.351049423217773, "global_step": 289826, "epoch": 3491} {"train_loss": -25.73878288269043, "global_step": 289827, "epoch": 3491} {"train_loss": -25.39449119567871, "global_step": 289828, "epoch": 3491} {"train_loss": -25.531469345092773, "global_step": 289829, "epoch": 3491} {"train_loss": -25.4647159576416, "global_step": 289830, "epoch": 3491} {"train_loss": -24.840118408203125, "global_step": 289831, "epoch": 3491} {"train_loss": -25.301410675048828, "global_step": 289832, "epoch": 3491} {"train_loss": -25.021825790405273, "global_step": 289833, "epoch": 3491} {"train_loss": -25.866907119750977, "global_step": 289834, "epoch": 3491} {"train_loss": -25.415831278605634, "global_step": 289835, "epoch": 3491, "val_loss": 7021792.0} {"train_loss": -25.063344955444336, "global_step": 289836, "epoch": 3492} {"train_loss": -24.848602294921875, "global_step": 289837, "epoch": 3492} {"train_loss": -25.250181198120117, "global_step": 289838, "epoch": 3492} {"train_loss": -25.179405212402344, "global_step": 289839, "epoch": 3492} {"train_loss": -24.530122756958008, "global_step": 289840, "epoch": 3492} {"train_loss": -24.705846786499023, "global_step": 289841, "epoch": 3492} {"train_loss": -24.90134048461914, "global_step": 289842, "epoch": 3492} {"train_loss": -25.372024536132812, "global_step": 289843, "epoch": 3492} {"train_loss": -24.725515365600586, "global_step": 289844, "epoch": 3492} {"train_loss": -25.291311264038086, "global_step": 289845, "epoch": 3492} {"train_loss": -25.253841400146484, "global_step": 289846, "epoch": 3492} {"train_loss": -25.33915138244629, "global_step": 289847, "epoch": 3492} {"train_loss": -25.094083786010742, "global_step": 289848, "epoch": 3492} {"train_loss": -25.181245803833008, "global_step": 289849, "epoch": 3492} {"train_loss": -25.36917495727539, "global_step": 289850, "epoch": 3492} {"train_loss": -25.724050521850586, "global_step": 289851, "epoch": 3492} {"train_loss": -25.470142364501953, "global_step": 289852, "epoch": 3492} {"train_loss": -24.978670120239258, "global_step": 289853, "epoch": 3492} {"train_loss": -25.009891510009766, "global_step": 289854, "epoch": 3492} {"train_loss": -25.63726234436035, "global_step": 289855, "epoch": 3492} {"train_loss": -25.719091415405273, "global_step": 289856, "epoch": 3492} {"train_loss": -25.648229598999023, "global_step": 289857, "epoch": 3492} {"train_loss": -25.4738826751709, "global_step": 289858, "epoch": 3492} {"train_loss": -25.884689331054688, "global_step": 289859, "epoch": 3492} {"train_loss": -25.346847534179688, "global_step": 289860, "epoch": 3492} {"train_loss": -25.515422821044922, "global_step": 289861, "epoch": 3492} {"train_loss": -25.56032371520996, "global_step": 289862, "epoch": 3492} {"train_loss": -25.477291107177734, "global_step": 289863, "epoch": 3492} {"train_loss": -25.734533309936523, "global_step": 289864, "epoch": 3492} {"train_loss": -25.019500732421875, "global_step": 289865, "epoch": 3492} {"train_loss": -25.690811157226562, "global_step": 289866, "epoch": 3492} {"train_loss": -25.627187728881836, "global_step": 289867, "epoch": 3492} {"train_loss": -25.447132110595703, "global_step": 289868, "epoch": 3492} {"train_loss": -25.622541427612305, "global_step": 289869, "epoch": 3492} {"train_loss": -25.962787628173828, "global_step": 289870, "epoch": 3492} {"train_loss": -25.468521118164062, "global_step": 289871, "epoch": 3492} {"train_loss": -25.422622680664062, "global_step": 289872, "epoch": 3492} {"train_loss": -25.943410873413086, "global_step": 289873, "epoch": 3492} {"train_loss": -25.338977813720703, "global_step": 289874, "epoch": 3492} {"train_loss": -25.66935157775879, "global_step": 289875, "epoch": 3492} {"train_loss": -25.6854248046875, "global_step": 289876, "epoch": 3492} {"train_loss": -25.805524826049805, "global_step": 289877, "epoch": 3492} {"train_loss": -25.628026962280273, "global_step": 289878, "epoch": 3492} {"train_loss": -25.909809112548828, "global_step": 289879, "epoch": 3492} {"train_loss": -25.958606719970703, "global_step": 289880, "epoch": 3492} {"train_loss": -25.70624351501465, "global_step": 289881, "epoch": 3492} {"train_loss": -25.777830123901367, "global_step": 289882, "epoch": 3492} {"train_loss": -25.604246139526367, "global_step": 289883, "epoch": 3492} {"train_loss": -25.611392974853516, "global_step": 289884, "epoch": 3492} {"train_loss": -25.572744369506836, "global_step": 289885, "epoch": 3492} {"train_loss": -25.159757614135742, "global_step": 289886, "epoch": 3492} {"train_loss": -25.64813232421875, "global_step": 289887, "epoch": 3492} {"train_loss": -25.603239059448242, "global_step": 289888, "epoch": 3492} {"train_loss": -25.881467819213867, "global_step": 289889, "epoch": 3492} {"train_loss": -25.7701358795166, "global_step": 289890, "epoch": 3492} {"train_loss": -26.136505126953125, "global_step": 289891, "epoch": 3492} {"train_loss": -26.068700790405273, "global_step": 289892, "epoch": 3492} {"train_loss": -25.693567276000977, "global_step": 289893, "epoch": 3492} {"train_loss": -25.608556747436523, "global_step": 289894, "epoch": 3492} {"train_loss": -25.50865936279297, "global_step": 289895, "epoch": 3492} {"train_loss": -25.52861976623535, "global_step": 289896, "epoch": 3492} {"train_loss": -25.95440101623535, "global_step": 289897, "epoch": 3492} {"train_loss": -25.58631134033203, "global_step": 289898, "epoch": 3492} {"train_loss": -25.13364028930664, "global_step": 289899, "epoch": 3492} {"train_loss": -25.480655670166016, "global_step": 289900, "epoch": 3492} {"train_loss": -25.715591430664062, "global_step": 289901, "epoch": 3492} {"train_loss": -25.550268173217773, "global_step": 289902, "epoch": 3492} {"train_loss": -25.277555465698242, "global_step": 289903, "epoch": 3492} {"train_loss": -25.285873413085938, "global_step": 289904, "epoch": 3492} {"train_loss": -25.136844635009766, "global_step": 289905, "epoch": 3492} {"train_loss": -24.980695724487305, "global_step": 289906, "epoch": 3492} {"train_loss": -25.135826110839844, "global_step": 289907, "epoch": 3492} {"train_loss": -25.45393943786621, "global_step": 289908, "epoch": 3492} {"train_loss": -25.30391502380371, "global_step": 289909, "epoch": 3492} {"train_loss": -24.863290786743164, "global_step": 289910, "epoch": 3492} {"train_loss": -25.363393783569336, "global_step": 289911, "epoch": 3492} {"train_loss": -25.278867721557617, "global_step": 289912, "epoch": 3492} {"train_loss": -25.092649459838867, "global_step": 289913, "epoch": 3492} {"train_loss": -25.42291259765625, "global_step": 289914, "epoch": 3492} {"train_loss": -25.027273178100586, "global_step": 289915, "epoch": 3492} {"train_loss": -25.239316940307617, "global_step": 289916, "epoch": 3492} {"train_loss": -25.66143798828125, "global_step": 289917, "epoch": 3492} {"train_loss": -25.43712202324925, "global_step": 289918, "epoch": 3492, "val_loss": 7112240.5} {"train_loss": -25.27557373046875, "global_step": 289919, "epoch": 3493} {"train_loss": -25.328125, "global_step": 289920, "epoch": 3493} {"train_loss": -24.770164489746094, "global_step": 289921, "epoch": 3493} {"train_loss": -24.39666175842285, "global_step": 289922, "epoch": 3493} {"train_loss": -24.91792106628418, "global_step": 289923, "epoch": 3493} {"train_loss": -25.104040145874023, "global_step": 289924, "epoch": 3493} {"train_loss": -25.2269229888916, "global_step": 289925, "epoch": 3493} {"train_loss": -24.874948501586914, "global_step": 289926, "epoch": 3493} {"train_loss": -25.342113494873047, "global_step": 289927, "epoch": 3493} {"train_loss": -25.08466911315918, "global_step": 289928, "epoch": 3493} {"train_loss": -24.950239181518555, "global_step": 289929, "epoch": 3493} {"train_loss": -25.04989242553711, "global_step": 289930, "epoch": 3493} {"train_loss": -25.258947372436523, "global_step": 289931, "epoch": 3493} {"train_loss": -24.793041229248047, "global_step": 289932, "epoch": 3493} {"train_loss": -25.404691696166992, "global_step": 289933, "epoch": 3493} {"train_loss": -25.081884384155273, "global_step": 289934, "epoch": 3493} {"train_loss": -25.44103240966797, "global_step": 289935, "epoch": 3493} {"train_loss": -25.251192092895508, "global_step": 289936, "epoch": 3493} {"train_loss": -25.355789184570312, "global_step": 289937, "epoch": 3493} {"train_loss": -25.241567611694336, "global_step": 289938, "epoch": 3493} {"train_loss": -25.642187118530273, "global_step": 289939, "epoch": 3493} {"train_loss": -25.540071487426758, "global_step": 289940, "epoch": 3493} {"train_loss": -25.07727813720703, "global_step": 289941, "epoch": 3493} {"train_loss": -25.317310333251953, "global_step": 289942, "epoch": 3493} {"train_loss": -25.613113403320312, "global_step": 289943, "epoch": 3493} {"train_loss": -25.70208168029785, "global_step": 289944, "epoch": 3493} {"train_loss": -25.185287475585938, "global_step": 289945, "epoch": 3493} {"train_loss": -25.2918758392334, "global_step": 289946, "epoch": 3493} {"train_loss": -25.296100616455078, "global_step": 289947, "epoch": 3493} {"train_loss": -25.648069381713867, "global_step": 289948, "epoch": 3493} {"train_loss": -25.5487060546875, "global_step": 289949, "epoch": 3493} {"train_loss": -25.629596710205078, "global_step": 289950, "epoch": 3493} {"train_loss": -25.287595748901367, "global_step": 289951, "epoch": 3493} {"train_loss": -25.56207275390625, "global_step": 289952, "epoch": 3493} {"train_loss": -25.333377838134766, "global_step": 289953, "epoch": 3493} {"train_loss": -25.446853637695312, "global_step": 289954, "epoch": 3493} {"train_loss": -25.57672119140625, "global_step": 289955, "epoch": 3493} {"train_loss": -25.242647171020508, "global_step": 289956, "epoch": 3493} {"train_loss": -25.550111770629883, "global_step": 289957, "epoch": 3493} {"train_loss": -25.151029586791992, "global_step": 289958, "epoch": 3493} {"train_loss": -25.571517944335938, "global_step": 289959, "epoch": 3493} {"train_loss": -25.746490478515625, "global_step": 289960, "epoch": 3493} {"train_loss": -25.493677139282227, "global_step": 289961, "epoch": 3493} {"train_loss": -25.838842391967773, "global_step": 289962, "epoch": 3493} {"train_loss": -25.463666915893555, "global_step": 289963, "epoch": 3493} {"train_loss": -25.775156021118164, "global_step": 289964, "epoch": 3493} {"train_loss": -25.25313377380371, "global_step": 289965, "epoch": 3493} {"train_loss": -25.617069244384766, "global_step": 289966, "epoch": 3493} {"train_loss": -25.431148529052734, "global_step": 289967, "epoch": 3493} {"train_loss": -25.303979873657227, "global_step": 289968, "epoch": 3493} {"train_loss": -25.766141891479492, "global_step": 289969, "epoch": 3493} {"train_loss": -25.555213928222656, "global_step": 289970, "epoch": 3493} {"train_loss": -25.56634521484375, "global_step": 289971, "epoch": 3493} {"train_loss": -25.611032485961914, "global_step": 289972, "epoch": 3493} {"train_loss": -25.774581909179688, "global_step": 289973, "epoch": 3493} {"train_loss": -25.388813018798828, "global_step": 289974, "epoch": 3493} {"train_loss": -25.572946548461914, "global_step": 289975, "epoch": 3493} {"train_loss": -25.76853370666504, "global_step": 289976, "epoch": 3493} {"train_loss": -25.826547622680664, "global_step": 289977, "epoch": 3493} {"train_loss": -25.66448974609375, "global_step": 289978, "epoch": 3493} {"train_loss": -25.714893341064453, "global_step": 289979, "epoch": 3493} {"train_loss": -25.79567527770996, "global_step": 289980, "epoch": 3493} {"train_loss": -25.73555564880371, "global_step": 289981, "epoch": 3493} {"train_loss": -25.951135635375977, "global_step": 289982, "epoch": 3493} {"train_loss": -25.44085693359375, "global_step": 289983, "epoch": 3493} {"train_loss": -25.80011558532715, "global_step": 289984, "epoch": 3493} {"train_loss": -25.739532470703125, "global_step": 289985, "epoch": 3493} {"train_loss": -25.83917808532715, "global_step": 289986, "epoch": 3493} {"train_loss": -25.956357955932617, "global_step": 289987, "epoch": 3493} {"train_loss": -25.992374420166016, "global_step": 289988, "epoch": 3493} {"train_loss": -25.778675079345703, "global_step": 289989, "epoch": 3493} {"train_loss": -25.496774673461914, "global_step": 289990, "epoch": 3493} {"train_loss": -26.026411056518555, "global_step": 289991, "epoch": 3493} {"train_loss": -25.27779197692871, "global_step": 289992, "epoch": 3493} {"train_loss": -25.69658851623535, "global_step": 289993, "epoch": 3493} {"train_loss": -25.3385009765625, "global_step": 289994, "epoch": 3493} {"train_loss": -25.139541625976562, "global_step": 289995, "epoch": 3493} {"train_loss": -25.563079833984375, "global_step": 289996, "epoch": 3493} {"train_loss": -25.760046005249023, "global_step": 289997, "epoch": 3493} {"train_loss": -25.779714584350586, "global_step": 289998, "epoch": 3493} {"train_loss": -25.458467483520508, "global_step": 289999, "epoch": 3493} {"train_loss": -25.651020050048828, "global_step": 290000, "epoch": 3493} {"train_loss": -25.46259363013578, "global_step": 290001, "epoch": 3493, "val_loss": 7138657.0} {"train_loss": -25.18770980834961, "global_step": 290002, "epoch": 3494} {"train_loss": -24.425275802612305, "global_step": 290003, "epoch": 3494} {"train_loss": -24.55414390563965, "global_step": 290004, "epoch": 3494} {"train_loss": -25.298242568969727, "global_step": 290005, "epoch": 3494} {"train_loss": -25.456575393676758, "global_step": 290006, "epoch": 3494} {"train_loss": -25.40603256225586, "global_step": 290007, "epoch": 3494} {"train_loss": -25.414636611938477, "global_step": 290008, "epoch": 3494} {"train_loss": -25.142332077026367, "global_step": 290009, "epoch": 3494} {"train_loss": -25.487030029296875, "global_step": 290010, "epoch": 3494} {"train_loss": -25.304065704345703, "global_step": 290011, "epoch": 3494} {"train_loss": -25.694198608398438, "global_step": 290012, "epoch": 3494} {"train_loss": -25.36024284362793, "global_step": 290013, "epoch": 3494} {"train_loss": -25.643646240234375, "global_step": 290014, "epoch": 3494} {"train_loss": -25.62619400024414, "global_step": 290015, "epoch": 3494} {"train_loss": -25.40293312072754, "global_step": 290016, "epoch": 3494} {"train_loss": -25.201223373413086, "global_step": 290017, "epoch": 3494} {"train_loss": -25.439184188842773, "global_step": 290018, "epoch": 3494} {"train_loss": -25.136159896850586, "global_step": 290019, "epoch": 3494} {"train_loss": -25.575345993041992, "global_step": 290020, "epoch": 3494} {"train_loss": -25.516305923461914, "global_step": 290021, "epoch": 3494} {"train_loss": -25.436643600463867, "global_step": 290022, "epoch": 3494} {"train_loss": -25.457380294799805, "global_step": 290023, "epoch": 3494} {"train_loss": -25.405963897705078, "global_step": 290024, "epoch": 3494} {"train_loss": -25.950653076171875, "global_step": 290025, "epoch": 3494} {"train_loss": -25.16985511779785, "global_step": 290026, "epoch": 3494} {"train_loss": -25.597227096557617, "global_step": 290027, "epoch": 3494} {"train_loss": -25.515823364257812, "global_step": 290028, "epoch": 3494} {"train_loss": -25.431303024291992, "global_step": 290029, "epoch": 3494} {"train_loss": -25.39983558654785, "global_step": 290030, "epoch": 3494} {"train_loss": -25.237653732299805, "global_step": 290031, "epoch": 3494} {"train_loss": -25.512531280517578, "global_step": 290032, "epoch": 3494} {"train_loss": -25.442373275756836, "global_step": 290033, "epoch": 3494} {"train_loss": -25.720569610595703, "global_step": 290034, "epoch": 3494} {"train_loss": -25.67185401916504, "global_step": 290035, "epoch": 3494} {"train_loss": -25.93343162536621, "global_step": 290036, "epoch": 3494} {"train_loss": -25.66680908203125, "global_step": 290037, "epoch": 3494} {"train_loss": -25.373437881469727, "global_step": 290038, "epoch": 3494} {"train_loss": -25.48992347717285, "global_step": 290039, "epoch": 3494} {"train_loss": -25.5863094329834, "global_step": 290040, "epoch": 3494} {"train_loss": -25.802997589111328, "global_step": 290041, "epoch": 3494} {"train_loss": -25.55582046508789, "global_step": 290042, "epoch": 3494} {"train_loss": -25.585508346557617, "global_step": 290043, "epoch": 3494} {"train_loss": -25.600927352905273, "global_step": 290044, "epoch": 3494} {"train_loss": -25.79183006286621, "global_step": 290045, "epoch": 3494} {"train_loss": -25.7305850982666, "global_step": 290046, "epoch": 3494} {"train_loss": -25.543895721435547, "global_step": 290047, "epoch": 3494} {"train_loss": -25.48783302307129, "global_step": 290048, "epoch": 3494} {"train_loss": -25.51964569091797, "global_step": 290049, "epoch": 3494} {"train_loss": -25.9544620513916, "global_step": 290050, "epoch": 3494} {"train_loss": -25.462400436401367, "global_step": 290051, "epoch": 3494} {"train_loss": -25.4826717376709, "global_step": 290052, "epoch": 3494} {"train_loss": -25.49176025390625, "global_step": 290053, "epoch": 3494} {"train_loss": -25.626266479492188, "global_step": 290054, "epoch": 3494} {"train_loss": -25.568084716796875, "global_step": 290055, "epoch": 3494} {"train_loss": -25.98552894592285, "global_step": 290056, "epoch": 3494} {"train_loss": -26.09870719909668, "global_step": 290057, "epoch": 3494} {"train_loss": -25.730701446533203, "global_step": 290058, "epoch": 3494} {"train_loss": -25.4594783782959, "global_step": 290059, "epoch": 3494} {"train_loss": -25.86463737487793, "global_step": 290060, "epoch": 3494} {"train_loss": -25.031112670898438, "global_step": 290061, "epoch": 3494} {"train_loss": -25.7320613861084, "global_step": 290062, "epoch": 3494} {"train_loss": -25.336925506591797, "global_step": 290063, "epoch": 3494} {"train_loss": -25.77741813659668, "global_step": 290064, "epoch": 3494} {"train_loss": -25.768966674804688, "global_step": 290065, "epoch": 3494} {"train_loss": -25.54254722595215, "global_step": 290066, "epoch": 3494} {"train_loss": -25.307180404663086, "global_step": 290067, "epoch": 3494} {"train_loss": -25.774246215820312, "global_step": 290068, "epoch": 3494} {"train_loss": -25.535367965698242, "global_step": 290069, "epoch": 3494} {"train_loss": -25.597991943359375, "global_step": 290070, "epoch": 3494} {"train_loss": -25.30386734008789, "global_step": 290071, "epoch": 3494} {"train_loss": -25.391357421875, "global_step": 290072, "epoch": 3494} {"train_loss": -25.37148094177246, "global_step": 290073, "epoch": 3494} {"train_loss": -25.639423370361328, "global_step": 290074, "epoch": 3494} {"train_loss": -25.67445182800293, "global_step": 290075, "epoch": 3494} {"train_loss": -25.603973388671875, "global_step": 290076, "epoch": 3494} {"train_loss": -25.68535804748535, "global_step": 290077, "epoch": 3494} {"train_loss": -25.101991653442383, "global_step": 290078, "epoch": 3494} {"train_loss": -25.914926528930664, "global_step": 290079, "epoch": 3494} {"train_loss": -25.749929428100586, "global_step": 290080, "epoch": 3494} {"train_loss": -25.592966079711914, "global_step": 290081, "epoch": 3494} {"train_loss": -25.56771469116211, "global_step": 290082, "epoch": 3494} {"train_loss": -25.835437774658203, "global_step": 290083, "epoch": 3494} {"train_loss": -25.535492655742598, "global_step": 290084, "epoch": 3494, "val_loss": 7089343.0} {"train_loss": -24.179346084594727, "global_step": 290085, "epoch": 3495} {"train_loss": -24.9222412109375, "global_step": 290086, "epoch": 3495} {"train_loss": -24.5424747467041, "global_step": 290087, "epoch": 3495} {"train_loss": -25.399341583251953, "global_step": 290088, "epoch": 3495} {"train_loss": -24.758255004882812, "global_step": 290089, "epoch": 3495} {"train_loss": -25.61895179748535, "global_step": 290090, "epoch": 3495} {"train_loss": -25.43104362487793, "global_step": 290091, "epoch": 3495} {"train_loss": -25.097354888916016, "global_step": 290092, "epoch": 3495} {"train_loss": -25.393224716186523, "global_step": 290093, "epoch": 3495} {"train_loss": -24.998361587524414, "global_step": 290094, "epoch": 3495} {"train_loss": -25.388818740844727, "global_step": 290095, "epoch": 3495} {"train_loss": -24.814565658569336, "global_step": 290096, "epoch": 3495} {"train_loss": -25.23259925842285, "global_step": 290097, "epoch": 3495} {"train_loss": -25.55355453491211, "global_step": 290098, "epoch": 3495} {"train_loss": -25.461923599243164, "global_step": 290099, "epoch": 3495} {"train_loss": -25.0025634765625, "global_step": 290100, "epoch": 3495} {"train_loss": -25.42807388305664, "global_step": 290101, "epoch": 3495} {"train_loss": -25.435489654541016, "global_step": 290102, "epoch": 3495} {"train_loss": -24.879566192626953, "global_step": 290103, "epoch": 3495} {"train_loss": -25.23284912109375, "global_step": 290104, "epoch": 3495} {"train_loss": -25.318761825561523, "global_step": 290105, "epoch": 3495} {"train_loss": -25.16946029663086, "global_step": 290106, "epoch": 3495} {"train_loss": -25.784936904907227, "global_step": 290107, "epoch": 3495} {"train_loss": -25.1768798828125, "global_step": 290108, "epoch": 3495} {"train_loss": -25.305631637573242, "global_step": 290109, "epoch": 3495} {"train_loss": -25.703689575195312, "global_step": 290110, "epoch": 3495} {"train_loss": -25.174640655517578, "global_step": 290111, "epoch": 3495} {"train_loss": -25.674009323120117, "global_step": 290112, "epoch": 3495} {"train_loss": -25.526952743530273, "global_step": 290113, "epoch": 3495} {"train_loss": -25.344619750976562, "global_step": 290114, "epoch": 3495} {"train_loss": -25.209827423095703, "global_step": 290115, "epoch": 3495} {"train_loss": -25.464397430419922, "global_step": 290116, "epoch": 3495} {"train_loss": -25.585935592651367, "global_step": 290117, "epoch": 3495} {"train_loss": -25.656482696533203, "global_step": 290118, "epoch": 3495} {"train_loss": -25.778852462768555, "global_step": 290119, "epoch": 3495} {"train_loss": -25.626062393188477, "global_step": 290120, "epoch": 3495} {"train_loss": -25.557098388671875, "global_step": 290121, "epoch": 3495} {"train_loss": -25.8048038482666, "global_step": 290122, "epoch": 3495} {"train_loss": -25.2939395904541, "global_step": 290123, "epoch": 3495} {"train_loss": -25.77423667907715, "global_step": 290124, "epoch": 3495} {"train_loss": -25.81269645690918, "global_step": 290125, "epoch": 3495} {"train_loss": -25.57265281677246, "global_step": 290126, "epoch": 3495} {"train_loss": -25.795068740844727, "global_step": 290127, "epoch": 3495} {"train_loss": -25.620864868164062, "global_step": 290128, "epoch": 3495} {"train_loss": -25.8884220123291, "global_step": 290129, "epoch": 3495} {"train_loss": -25.67999839782715, "global_step": 290130, "epoch": 3495} {"train_loss": -25.7436580657959, "global_step": 290131, "epoch": 3495} {"train_loss": -25.745309829711914, "global_step": 290132, "epoch": 3495} {"train_loss": -25.816120147705078, "global_step": 290133, "epoch": 3495} {"train_loss": -25.463857650756836, "global_step": 290134, "epoch": 3495} {"train_loss": -25.42284393310547, "global_step": 290135, "epoch": 3495} {"train_loss": -25.525991439819336, "global_step": 290136, "epoch": 3495} {"train_loss": -25.328739166259766, "global_step": 290137, "epoch": 3495} {"train_loss": -25.548145294189453, "global_step": 290138, "epoch": 3495} {"train_loss": -25.447147369384766, "global_step": 290139, "epoch": 3495} {"train_loss": -25.253568649291992, "global_step": 290140, "epoch": 3495} {"train_loss": -25.34400749206543, "global_step": 290141, "epoch": 3495} {"train_loss": -25.48168182373047, "global_step": 290142, "epoch": 3495} {"train_loss": -25.391401290893555, "global_step": 290143, "epoch": 3495} {"train_loss": -25.367660522460938, "global_step": 290144, "epoch": 3495} {"train_loss": -25.276830673217773, "global_step": 290145, "epoch": 3495} {"train_loss": -25.223806381225586, "global_step": 290146, "epoch": 3495} {"train_loss": -25.233633041381836, "global_step": 290147, "epoch": 3495} {"train_loss": -25.23198127746582, "global_step": 290148, "epoch": 3495} {"train_loss": -25.694202423095703, "global_step": 290149, "epoch": 3495} {"train_loss": -25.3931827545166, "global_step": 290150, "epoch": 3495} {"train_loss": -25.29745864868164, "global_step": 290151, "epoch": 3495} {"train_loss": -25.28657341003418, "global_step": 290152, "epoch": 3495} {"train_loss": -25.394643783569336, "global_step": 290153, "epoch": 3495} {"train_loss": -25.502729415893555, "global_step": 290154, "epoch": 3495} {"train_loss": -25.260644912719727, "global_step": 290155, "epoch": 3495} {"train_loss": -25.51645851135254, "global_step": 290156, "epoch": 3495} {"train_loss": -25.3194580078125, "global_step": 290157, "epoch": 3495} {"train_loss": -25.975168228149414, "global_step": 290158, "epoch": 3495} {"train_loss": -25.46234703063965, "global_step": 290159, "epoch": 3495} {"train_loss": -25.613880157470703, "global_step": 290160, "epoch": 3495} {"train_loss": -25.42239761352539, "global_step": 290161, "epoch": 3495} {"train_loss": -25.970600128173828, "global_step": 290162, "epoch": 3495} {"train_loss": -25.5960636138916, "global_step": 290163, "epoch": 3495} {"train_loss": -25.570547103881836, "global_step": 290164, "epoch": 3495} {"train_loss": -25.327747344970703, "global_step": 290165, "epoch": 3495} {"train_loss": -25.481958389282227, "global_step": 290166, "epoch": 3495} {"train_loss": -25.4135879838323, "global_step": 290167, "epoch": 3495, "val_loss": 7137020.5} {"train_loss": -25.247743606567383, "global_step": 290168, "epoch": 3496} {"train_loss": -25.031360626220703, "global_step": 290169, "epoch": 3496} {"train_loss": -25.74262046813965, "global_step": 290170, "epoch": 3496} {"train_loss": -25.32240104675293, "global_step": 290171, "epoch": 3496} {"train_loss": -25.35548210144043, "global_step": 290172, "epoch": 3496} {"train_loss": -25.52252197265625, "global_step": 290173, "epoch": 3496} {"train_loss": -25.291099548339844, "global_step": 290174, "epoch": 3496} {"train_loss": -25.670251846313477, "global_step": 290175, "epoch": 3496} {"train_loss": -25.18814468383789, "global_step": 290176, "epoch": 3496} {"train_loss": -25.416608810424805, "global_step": 290177, "epoch": 3496} {"train_loss": -25.147294998168945, "global_step": 290178, "epoch": 3496} {"train_loss": -25.496511459350586, "global_step": 290179, "epoch": 3496} {"train_loss": -25.33795738220215, "global_step": 290180, "epoch": 3496} {"train_loss": -25.25704002380371, "global_step": 290181, "epoch": 3496} {"train_loss": -25.430234909057617, "global_step": 290182, "epoch": 3496} {"train_loss": -25.34125328063965, "global_step": 290183, "epoch": 3496} {"train_loss": -25.676294326782227, "global_step": 290184, "epoch": 3496} {"train_loss": -25.483945846557617, "global_step": 290185, "epoch": 3496} {"train_loss": -25.697620391845703, "global_step": 290186, "epoch": 3496} {"train_loss": -25.485992431640625, "global_step": 290187, "epoch": 3496} {"train_loss": -25.701648712158203, "global_step": 290188, "epoch": 3496} {"train_loss": -25.660369873046875, "global_step": 290189, "epoch": 3496} {"train_loss": -25.15100860595703, "global_step": 290190, "epoch": 3496} {"train_loss": -25.267372131347656, "global_step": 290191, "epoch": 3496} {"train_loss": -25.341930389404297, "global_step": 290192, "epoch": 3496} {"train_loss": -25.639867782592773, "global_step": 290193, "epoch": 3496} {"train_loss": -25.4105281829834, "global_step": 290194, "epoch": 3496} {"train_loss": -25.542896270751953, "global_step": 290195, "epoch": 3496} {"train_loss": -25.685718536376953, "global_step": 290196, "epoch": 3496} {"train_loss": -25.488794326782227, "global_step": 290197, "epoch": 3496} {"train_loss": -25.57916831970215, "global_step": 290198, "epoch": 3496} {"train_loss": -26.040334701538086, "global_step": 290199, "epoch": 3496} {"train_loss": -25.8458194732666, "global_step": 290200, "epoch": 3496} {"train_loss": -25.56104278564453, "global_step": 290201, "epoch": 3496} {"train_loss": -25.64444923400879, "global_step": 290202, "epoch": 3496} {"train_loss": -25.980920791625977, "global_step": 290203, "epoch": 3496} {"train_loss": -25.807941436767578, "global_step": 290204, "epoch": 3496} {"train_loss": -25.83281898498535, "global_step": 290205, "epoch": 3496} {"train_loss": -25.345256805419922, "global_step": 290206, "epoch": 3496} {"train_loss": -25.85181999206543, "global_step": 290207, "epoch": 3496} {"train_loss": -25.618366241455078, "global_step": 290208, "epoch": 3496} {"train_loss": -25.3355770111084, "global_step": 290209, "epoch": 3496} {"train_loss": -25.55922508239746, "global_step": 290210, "epoch": 3496} {"train_loss": -24.71259307861328, "global_step": 290211, "epoch": 3496} {"train_loss": -25.59195899963379, "global_step": 290212, "epoch": 3496} {"train_loss": -25.536184310913086, "global_step": 290213, "epoch": 3496} {"train_loss": -25.06540870666504, "global_step": 290214, "epoch": 3496} {"train_loss": -25.615814208984375, "global_step": 290215, "epoch": 3496} {"train_loss": -25.356931686401367, "global_step": 290216, "epoch": 3496} {"train_loss": -25.564184188842773, "global_step": 290217, "epoch": 3496} {"train_loss": -25.594194412231445, "global_step": 290218, "epoch": 3496} {"train_loss": -25.468793869018555, "global_step": 290219, "epoch": 3496} {"train_loss": -25.09248924255371, "global_step": 290220, "epoch": 3496} {"train_loss": -25.189491271972656, "global_step": 290221, "epoch": 3496} {"train_loss": -25.651838302612305, "global_step": 290222, "epoch": 3496} {"train_loss": -25.39669418334961, "global_step": 290223, "epoch": 3496} {"train_loss": -25.088560104370117, "global_step": 290224, "epoch": 3496} {"train_loss": -25.355297088623047, "global_step": 290225, "epoch": 3496} {"train_loss": -25.817060470581055, "global_step": 290226, "epoch": 3496} {"train_loss": -25.447866439819336, "global_step": 290227, "epoch": 3496} {"train_loss": -25.195308685302734, "global_step": 290228, "epoch": 3496} {"train_loss": -25.72904396057129, "global_step": 290229, "epoch": 3496} {"train_loss": -25.46841812133789, "global_step": 290230, "epoch": 3496} {"train_loss": -25.507566452026367, "global_step": 290231, "epoch": 3496} {"train_loss": -25.279178619384766, "global_step": 290232, "epoch": 3496} {"train_loss": -25.612390518188477, "global_step": 290233, "epoch": 3496} {"train_loss": -25.752328872680664, "global_step": 290234, "epoch": 3496} {"train_loss": -25.547700881958008, "global_step": 290235, "epoch": 3496} {"train_loss": -25.385793685913086, "global_step": 290236, "epoch": 3496} {"train_loss": -25.90863609313965, "global_step": 290237, "epoch": 3496} {"train_loss": -25.670392990112305, "global_step": 290238, "epoch": 3496} {"train_loss": -25.66908836364746, "global_step": 290239, "epoch": 3496} {"train_loss": -25.511089324951172, "global_step": 290240, "epoch": 3496} {"train_loss": -25.555282592773438, "global_step": 290241, "epoch": 3496} {"train_loss": -25.49843406677246, "global_step": 290242, "epoch": 3496} {"train_loss": -25.7567195892334, "global_step": 290243, "epoch": 3496} {"train_loss": -25.604324340820312, "global_step": 290244, "epoch": 3496} {"train_loss": -25.504364013671875, "global_step": 290245, "epoch": 3496} {"train_loss": -25.80978775024414, "global_step": 290246, "epoch": 3496} {"train_loss": -25.79584312438965, "global_step": 290247, "epoch": 3496} {"train_loss": -25.640527725219727, "global_step": 290248, "epoch": 3496} {"train_loss": -25.65765380859375, "global_step": 290249, "epoch": 3496} {"train_loss": -25.526629068765295, "global_step": 290250, "epoch": 3496, "val_loss": 7094700.0} {"train_loss": -21.094640731811523, "global_step": 290251, "epoch": 3497} {"train_loss": -22.10053253173828, "global_step": 290252, "epoch": 3497} {"train_loss": -24.034250259399414, "global_step": 290253, "epoch": 3497} {"train_loss": -23.672861099243164, "global_step": 290254, "epoch": 3497} {"train_loss": -23.983734130859375, "global_step": 290255, "epoch": 3497} {"train_loss": -24.366628646850586, "global_step": 290256, "epoch": 3497} {"train_loss": -24.347694396972656, "global_step": 290257, "epoch": 3497} {"train_loss": -24.367460250854492, "global_step": 290258, "epoch": 3497} {"train_loss": -24.282323837280273, "global_step": 290259, "epoch": 3497} {"train_loss": -24.388511657714844, "global_step": 290260, "epoch": 3497} {"train_loss": -24.776456832885742, "global_step": 290261, "epoch": 3497} {"train_loss": -24.487564086914062, "global_step": 290262, "epoch": 3497} {"train_loss": -24.625911712646484, "global_step": 290263, "epoch": 3497} {"train_loss": -24.34244728088379, "global_step": 290264, "epoch": 3497} {"train_loss": -24.898441314697266, "global_step": 290265, "epoch": 3497} {"train_loss": -24.467578887939453, "global_step": 290266, "epoch": 3497} {"train_loss": -24.6748046875, "global_step": 290267, "epoch": 3497} {"train_loss": -24.790517807006836, "global_step": 290268, "epoch": 3497} {"train_loss": -25.21738624572754, "global_step": 290269, "epoch": 3497} {"train_loss": -25.18366813659668, "global_step": 290270, "epoch": 3497} {"train_loss": -24.730606079101562, "global_step": 290271, "epoch": 3497} {"train_loss": -25.026561737060547, "global_step": 290272, "epoch": 3497} {"train_loss": -25.06909942626953, "global_step": 290273, "epoch": 3497} {"train_loss": -25.048391342163086, "global_step": 290274, "epoch": 3497} {"train_loss": -25.297719955444336, "global_step": 290275, "epoch": 3497} {"train_loss": -24.810609817504883, "global_step": 290276, "epoch": 3497} {"train_loss": -25.116796493530273, "global_step": 290277, "epoch": 3497} {"train_loss": -25.188451766967773, "global_step": 290278, "epoch": 3497} {"train_loss": -25.028867721557617, "global_step": 290279, "epoch": 3497} {"train_loss": -24.9190616607666, "global_step": 290280, "epoch": 3497} {"train_loss": -25.11138916015625, "global_step": 290281, "epoch": 3497} {"train_loss": -25.629444122314453, "global_step": 290282, "epoch": 3497} {"train_loss": -24.92183494567871, "global_step": 290283, "epoch": 3497} {"train_loss": -25.008106231689453, "global_step": 290284, "epoch": 3497} {"train_loss": -25.52045249938965, "global_step": 290285, "epoch": 3497} {"train_loss": -25.1629695892334, "global_step": 290286, "epoch": 3497} {"train_loss": -25.430919647216797, "global_step": 290287, "epoch": 3497} {"train_loss": -25.630752563476562, "global_step": 290288, "epoch": 3497} {"train_loss": -25.670242309570312, "global_step": 290289, "epoch": 3497} {"train_loss": -25.300840377807617, "global_step": 290290, "epoch": 3497} {"train_loss": -25.612600326538086, "global_step": 290291, "epoch": 3497} {"train_loss": -25.525007247924805, "global_step": 290292, "epoch": 3497} {"train_loss": -25.3701171875, "global_step": 290293, "epoch": 3497} {"train_loss": -25.406644821166992, "global_step": 290294, "epoch": 3497} {"train_loss": -25.517194747924805, "global_step": 290295, "epoch": 3497} {"train_loss": -25.329648971557617, "global_step": 290296, "epoch": 3497} {"train_loss": -25.49827003479004, "global_step": 290297, "epoch": 3497} {"train_loss": -25.352558135986328, "global_step": 290298, "epoch": 3497} {"train_loss": -25.686315536499023, "global_step": 290299, "epoch": 3497} {"train_loss": -25.745681762695312, "global_step": 290300, "epoch": 3497} {"train_loss": -25.491432189941406, "global_step": 290301, "epoch": 3497} {"train_loss": -25.65394401550293, "global_step": 290302, "epoch": 3497} {"train_loss": -25.502735137939453, "global_step": 290303, "epoch": 3497} {"train_loss": -25.63395118713379, "global_step": 290304, "epoch": 3497} {"train_loss": -25.749963760375977, "global_step": 290305, "epoch": 3497} {"train_loss": -25.520462036132812, "global_step": 290306, "epoch": 3497} {"train_loss": -25.97035789489746, "global_step": 290307, "epoch": 3497} {"train_loss": -25.386404037475586, "global_step": 290308, "epoch": 3497} {"train_loss": -25.73841667175293, "global_step": 290309, "epoch": 3497} {"train_loss": -25.781564712524414, "global_step": 290310, "epoch": 3497} {"train_loss": -25.432804107666016, "global_step": 290311, "epoch": 3497} {"train_loss": -25.594179153442383, "global_step": 290312, "epoch": 3497} {"train_loss": -25.480146408081055, "global_step": 290313, "epoch": 3497} {"train_loss": -25.387054443359375, "global_step": 290314, "epoch": 3497} {"train_loss": -25.722808837890625, "global_step": 290315, "epoch": 3497} {"train_loss": -25.333269119262695, "global_step": 290316, "epoch": 3497} {"train_loss": -25.8055362701416, "global_step": 290317, "epoch": 3497} {"train_loss": -25.110849380493164, "global_step": 290318, "epoch": 3497} {"train_loss": -25.56390953063965, "global_step": 290319, "epoch": 3497} {"train_loss": -25.743627548217773, "global_step": 290320, "epoch": 3497} {"train_loss": -25.593549728393555, "global_step": 290321, "epoch": 3497} {"train_loss": -25.60236167907715, "global_step": 290322, "epoch": 3497} {"train_loss": -25.530250549316406, "global_step": 290323, "epoch": 3497} {"train_loss": -25.532670974731445, "global_step": 290324, "epoch": 3497} {"train_loss": -25.63120460510254, "global_step": 290325, "epoch": 3497} {"train_loss": -25.291349411010742, "global_step": 290326, "epoch": 3497} {"train_loss": -25.851139068603516, "global_step": 290327, "epoch": 3497} {"train_loss": -25.748273849487305, "global_step": 290328, "epoch": 3497} {"train_loss": -25.7661075592041, "global_step": 290329, "epoch": 3497} {"train_loss": -25.751972198486328, "global_step": 290330, "epoch": 3497} {"train_loss": -25.706933975219727, "global_step": 290331, "epoch": 3497} {"train_loss": -25.476810455322266, "global_step": 290332, "epoch": 3497} {"train_loss": -25.14950140987534, "global_step": 290333, "epoch": 3497, "val_loss": 7114476.0} {"train_loss": -25.074045181274414, "global_step": 290334, "epoch": 3498} {"train_loss": -24.90522575378418, "global_step": 290335, "epoch": 3498} {"train_loss": -24.875917434692383, "global_step": 290336, "epoch": 3498} {"train_loss": -25.113107681274414, "global_step": 290337, "epoch": 3498} {"train_loss": -24.788129806518555, "global_step": 290338, "epoch": 3498} {"train_loss": -24.443696975708008, "global_step": 290339, "epoch": 3498} {"train_loss": -25.03362464904785, "global_step": 290340, "epoch": 3498} {"train_loss": -25.200180053710938, "global_step": 290341, "epoch": 3498} {"train_loss": -24.721410751342773, "global_step": 290342, "epoch": 3498} {"train_loss": -24.310382843017578, "global_step": 290343, "epoch": 3498} {"train_loss": -25.069700241088867, "global_step": 290344, "epoch": 3498} {"train_loss": -24.909536361694336, "global_step": 290345, "epoch": 3498} {"train_loss": -24.557037353515625, "global_step": 290346, "epoch": 3498} {"train_loss": -25.285011291503906, "global_step": 290347, "epoch": 3498} {"train_loss": -24.944934844970703, "global_step": 290348, "epoch": 3498} {"train_loss": -24.814517974853516, "global_step": 290349, "epoch": 3498} {"train_loss": -25.048397064208984, "global_step": 290350, "epoch": 3498} {"train_loss": -25.489797592163086, "global_step": 290351, "epoch": 3498} {"train_loss": -25.2779541015625, "global_step": 290352, "epoch": 3498} {"train_loss": -24.946874618530273, "global_step": 290353, "epoch": 3498} {"train_loss": -25.5296630859375, "global_step": 290354, "epoch": 3498} {"train_loss": -25.34551429748535, "global_step": 290355, "epoch": 3498} {"train_loss": -25.325918197631836, "global_step": 290356, "epoch": 3498} {"train_loss": -25.28531265258789, "global_step": 290357, "epoch": 3498} {"train_loss": -25.12383460998535, "global_step": 290358, "epoch": 3498} {"train_loss": -25.706838607788086, "global_step": 290359, "epoch": 3498} {"train_loss": -25.334348678588867, "global_step": 290360, "epoch": 3498} {"train_loss": -25.538137435913086, "global_step": 290361, "epoch": 3498} {"train_loss": -25.454486846923828, "global_step": 290362, "epoch": 3498} {"train_loss": -25.606246948242188, "global_step": 290363, "epoch": 3498} {"train_loss": -25.658721923828125, "global_step": 290364, "epoch": 3498} {"train_loss": -25.5484676361084, "global_step": 290365, "epoch": 3498} {"train_loss": -25.26373863220215, "global_step": 290366, "epoch": 3498} {"train_loss": -25.493879318237305, "global_step": 290367, "epoch": 3498} {"train_loss": -25.68574333190918, "global_step": 290368, "epoch": 3498} {"train_loss": -25.31932830810547, "global_step": 290369, "epoch": 3498} {"train_loss": -25.231260299682617, "global_step": 290370, "epoch": 3498} {"train_loss": -25.625890731811523, "global_step": 290371, "epoch": 3498} {"train_loss": -25.68429946899414, "global_step": 290372, "epoch": 3498} {"train_loss": -25.60698890686035, "global_step": 290373, "epoch": 3498} {"train_loss": -25.5019588470459, "global_step": 290374, "epoch": 3498} {"train_loss": -25.893827438354492, "global_step": 290375, "epoch": 3498} {"train_loss": -25.704578399658203, "global_step": 290376, "epoch": 3498} {"train_loss": -25.8117618560791, "global_step": 290377, "epoch": 3498} {"train_loss": -25.720312118530273, "global_step": 290378, "epoch": 3498} {"train_loss": -25.571619033813477, "global_step": 290379, "epoch": 3498} {"train_loss": -25.80509376525879, "global_step": 290380, "epoch": 3498} {"train_loss": -25.59956932067871, "global_step": 290381, "epoch": 3498} {"train_loss": -25.637800216674805, "global_step": 290382, "epoch": 3498} {"train_loss": -25.481067657470703, "global_step": 290383, "epoch": 3498} {"train_loss": -25.730499267578125, "global_step": 290384, "epoch": 3498} {"train_loss": -25.653289794921875, "global_step": 290385, "epoch": 3498} {"train_loss": -25.540939331054688, "global_step": 290386, "epoch": 3498} {"train_loss": -26.14679527282715, "global_step": 290387, "epoch": 3498} {"train_loss": -25.537900924682617, "global_step": 290388, "epoch": 3498} {"train_loss": -25.64349365234375, "global_step": 290389, "epoch": 3498} {"train_loss": -25.796340942382812, "global_step": 290390, "epoch": 3498} {"train_loss": -25.764814376831055, "global_step": 290391, "epoch": 3498} {"train_loss": -25.607648849487305, "global_step": 290392, "epoch": 3498} {"train_loss": -25.47871208190918, "global_step": 290393, "epoch": 3498} {"train_loss": -25.685998916625977, "global_step": 290394, "epoch": 3498} {"train_loss": -25.626676559448242, "global_step": 290395, "epoch": 3498} {"train_loss": -25.909748077392578, "global_step": 290396, "epoch": 3498} {"train_loss": -25.859643936157227, "global_step": 290397, "epoch": 3498} {"train_loss": -25.718809127807617, "global_step": 290398, "epoch": 3498} {"train_loss": -25.637929916381836, "global_step": 290399, "epoch": 3498} {"train_loss": -25.762481689453125, "global_step": 290400, "epoch": 3498} {"train_loss": -25.61736488342285, "global_step": 290401, "epoch": 3498} {"train_loss": -25.950641632080078, "global_step": 290402, "epoch": 3498} {"train_loss": -25.437965393066406, "global_step": 290403, "epoch": 3498} {"train_loss": -25.446447372436523, "global_step": 290404, "epoch": 3498} {"train_loss": -25.505374908447266, "global_step": 290405, "epoch": 3498} {"train_loss": -25.63970375061035, "global_step": 290406, "epoch": 3498} {"train_loss": -25.84018898010254, "global_step": 290407, "epoch": 3498} {"train_loss": -25.66889762878418, "global_step": 290408, "epoch": 3498} {"train_loss": -25.694732666015625, "global_step": 290409, "epoch": 3498} {"train_loss": -25.5024471282959, "global_step": 290410, "epoch": 3498} {"train_loss": -25.24273109436035, "global_step": 290411, "epoch": 3498} {"train_loss": -25.764326095581055, "global_step": 290412, "epoch": 3498} {"train_loss": -25.45282554626465, "global_step": 290413, "epoch": 3498} {"train_loss": -25.484039306640625, "global_step": 290414, "epoch": 3498} {"train_loss": -25.28627586364746, "global_step": 290415, "epoch": 3498} {"train_loss": -25.434255324214337, "global_step": 290416, "epoch": 3498, "val_loss": 7183605.0} {"train_loss": -24.412118911743164, "global_step": 290417, "epoch": 3499} {"train_loss": -23.737260818481445, "global_step": 290418, "epoch": 3499} {"train_loss": -24.577411651611328, "global_step": 290419, "epoch": 3499} {"train_loss": -24.75252342224121, "global_step": 290420, "epoch": 3499} {"train_loss": -24.34638214111328, "global_step": 290421, "epoch": 3499} {"train_loss": -24.74715232849121, "global_step": 290422, "epoch": 3499} {"train_loss": -24.758092880249023, "global_step": 290423, "epoch": 3499} {"train_loss": -24.720518112182617, "global_step": 290424, "epoch": 3499} {"train_loss": -24.84095001220703, "global_step": 290425, "epoch": 3499} {"train_loss": -24.73988914489746, "global_step": 290426, "epoch": 3499} {"train_loss": -24.908275604248047, "global_step": 290427, "epoch": 3499} {"train_loss": -24.913942337036133, "global_step": 290428, "epoch": 3499} {"train_loss": -25.118677139282227, "global_step": 290429, "epoch": 3499} {"train_loss": -24.743825912475586, "global_step": 290430, "epoch": 3499} {"train_loss": -25.152286529541016, "global_step": 290431, "epoch": 3499} {"train_loss": -24.78577423095703, "global_step": 290432, "epoch": 3499} {"train_loss": -25.375905990600586, "global_step": 290433, "epoch": 3499} {"train_loss": -24.98050308227539, "global_step": 290434, "epoch": 3499} {"train_loss": -25.17700958251953, "global_step": 290435, "epoch": 3499} {"train_loss": -25.140689849853516, "global_step": 290436, "epoch": 3499} {"train_loss": -24.979528427124023, "global_step": 290437, "epoch": 3499} {"train_loss": -25.715185165405273, "global_step": 290438, "epoch": 3499} {"train_loss": -25.295324325561523, "global_step": 290439, "epoch": 3499} {"train_loss": -25.474960327148438, "global_step": 290440, "epoch": 3499} {"train_loss": -25.2884578704834, "global_step": 290441, "epoch": 3499} {"train_loss": -25.517911911010742, "global_step": 290442, "epoch": 3499} {"train_loss": -25.26702308654785, "global_step": 290443, "epoch": 3499} {"train_loss": -25.44331169128418, "global_step": 290444, "epoch": 3499} {"train_loss": -25.45331573486328, "global_step": 290445, "epoch": 3499} {"train_loss": -25.02394676208496, "global_step": 290446, "epoch": 3499} {"train_loss": -25.615488052368164, "global_step": 290447, "epoch": 3499} {"train_loss": -25.810659408569336, "global_step": 290448, "epoch": 3499} {"train_loss": -24.967147827148438, "global_step": 290449, "epoch": 3499} {"train_loss": -25.192094802856445, "global_step": 290450, "epoch": 3499} {"train_loss": -25.174901962280273, "global_step": 290451, "epoch": 3499} {"train_loss": -25.29479217529297, "global_step": 290452, "epoch": 3499} {"train_loss": -25.69283103942871, "global_step": 290453, "epoch": 3499} {"train_loss": -25.68378257751465, "global_step": 290454, "epoch": 3499} {"train_loss": -25.72443199157715, "global_step": 290455, "epoch": 3499} {"train_loss": -25.433351516723633, "global_step": 290456, "epoch": 3499} {"train_loss": -25.540071487426758, "global_step": 290457, "epoch": 3499} {"train_loss": -25.427812576293945, "global_step": 290458, "epoch": 3499} {"train_loss": -25.83526611328125, "global_step": 290459, "epoch": 3499} {"train_loss": -25.432477951049805, "global_step": 290460, "epoch": 3499} {"train_loss": -25.50712013244629, "global_step": 290461, "epoch": 3499} {"train_loss": -25.734601974487305, "global_step": 290462, "epoch": 3499} {"train_loss": -25.7287654876709, "global_step": 290463, "epoch": 3499} {"train_loss": -25.549238204956055, "global_step": 290464, "epoch": 3499} {"train_loss": -25.411130905151367, "global_step": 290465, "epoch": 3499} {"train_loss": -25.5328426361084, "global_step": 290466, "epoch": 3499} {"train_loss": -25.36972999572754, "global_step": 290467, "epoch": 3499} {"train_loss": -25.66761589050293, "global_step": 290468, "epoch": 3499} {"train_loss": -25.75225830078125, "global_step": 290469, "epoch": 3499} {"train_loss": -25.755203247070312, "global_step": 290470, "epoch": 3499} {"train_loss": -25.469440460205078, "global_step": 290471, "epoch": 3499} {"train_loss": -24.957061767578125, "global_step": 290472, "epoch": 3499} {"train_loss": -25.67926597595215, "global_step": 290473, "epoch": 3499} {"train_loss": -25.685033798217773, "global_step": 290474, "epoch": 3499} {"train_loss": -25.78470230102539, "global_step": 290475, "epoch": 3499} {"train_loss": -25.569814682006836, "global_step": 290476, "epoch": 3499} {"train_loss": -25.452741622924805, "global_step": 290477, "epoch": 3499} {"train_loss": -25.834537506103516, "global_step": 290478, "epoch": 3499} {"train_loss": -25.668554306030273, "global_step": 290479, "epoch": 3499} {"train_loss": -25.53358268737793, "global_step": 290480, "epoch": 3499} {"train_loss": -25.78632926940918, "global_step": 290481, "epoch": 3499} {"train_loss": -25.361921310424805, "global_step": 290482, "epoch": 3499} {"train_loss": -25.977035522460938, "global_step": 290483, "epoch": 3499} {"train_loss": -25.736927032470703, "global_step": 290484, "epoch": 3499} {"train_loss": -25.2762508392334, "global_step": 290485, "epoch": 3499} {"train_loss": -25.057769775390625, "global_step": 290486, "epoch": 3499} {"train_loss": -25.07090187072754, "global_step": 290487, "epoch": 3499} {"train_loss": -25.809528350830078, "global_step": 290488, "epoch": 3499} {"train_loss": -25.827051162719727, "global_step": 290489, "epoch": 3499} {"train_loss": -25.00200653076172, "global_step": 290490, "epoch": 3499} {"train_loss": -25.525964736938477, "global_step": 290491, "epoch": 3499} {"train_loss": -25.71656608581543, "global_step": 290492, "epoch": 3499} {"train_loss": -25.562070846557617, "global_step": 290493, "epoch": 3499} {"train_loss": -25.544403076171875, "global_step": 290494, "epoch": 3499} {"train_loss": -25.712549209594727, "global_step": 290495, "epoch": 3499} {"train_loss": -25.65781021118164, "global_step": 290496, "epoch": 3499} {"train_loss": -25.629796981811523, "global_step": 290497, "epoch": 3499} {"train_loss": -25.693012237548828, "global_step": 290498, "epoch": 3499} {"train_loss": -25.333697491381542, "global_step": 290499, "epoch": 3499, "val_loss": 7186357.0} {"train_loss": -25.075117111206055, "global_step": 290500, "epoch": 3500} {"train_loss": -25.099021911621094, "global_step": 290501, "epoch": 3500} {"train_loss": -25.109220504760742, "global_step": 290502, "epoch": 3500} {"train_loss": -25.311044692993164, "global_step": 290503, "epoch": 3500} {"train_loss": -25.161527633666992, "global_step": 290504, "epoch": 3500} {"train_loss": -24.88199234008789, "global_step": 290505, "epoch": 3500} {"train_loss": -25.074371337890625, "global_step": 290506, "epoch": 3500} {"train_loss": -25.500749588012695, "global_step": 290507, "epoch": 3500} {"train_loss": -25.025726318359375, "global_step": 290508, "epoch": 3500} {"train_loss": -25.094951629638672, "global_step": 290509, "epoch": 3500} {"train_loss": -25.15406608581543, "global_step": 290510, "epoch": 3500} {"train_loss": -25.486858367919922, "global_step": 290511, "epoch": 3500} {"train_loss": -25.42451286315918, "global_step": 290512, "epoch": 3500} {"train_loss": -25.459875106811523, "global_step": 290513, "epoch": 3500} {"train_loss": -25.68240737915039, "global_step": 290514, "epoch": 3500} {"train_loss": -25.329477310180664, "global_step": 290515, "epoch": 3500} {"train_loss": -25.1257266998291, "global_step": 290516, "epoch": 3500} {"train_loss": -25.483259201049805, "global_step": 290517, "epoch": 3500} {"train_loss": -25.559606552124023, "global_step": 290518, "epoch": 3500} {"train_loss": -25.179218292236328, "global_step": 290519, "epoch": 3500} {"train_loss": -25.48451042175293, "global_step": 290520, "epoch": 3500} {"train_loss": -25.81198501586914, "global_step": 290521, "epoch": 3500} {"train_loss": -25.211965560913086, "global_step": 290522, "epoch": 3500} {"train_loss": -25.75885581970215, "global_step": 290523, "epoch": 3500} {"train_loss": -25.56954574584961, "global_step": 290524, "epoch": 3500} {"train_loss": -25.21937370300293, "global_step": 290525, "epoch": 3500} {"train_loss": -25.58107566833496, "global_step": 290526, "epoch": 3500} {"train_loss": -25.073841094970703, "global_step": 290527, "epoch": 3500} {"train_loss": -25.52048110961914, "global_step": 290528, "epoch": 3500} {"train_loss": -25.618057250976562, "global_step": 290529, "epoch": 3500} {"train_loss": -25.34397315979004, "global_step": 290530, "epoch": 3500} {"train_loss": -25.6361083984375, "global_step": 290531, "epoch": 3500} {"train_loss": -25.396163940429688, "global_step": 290532, "epoch": 3500} {"train_loss": -25.396320343017578, "global_step": 290533, "epoch": 3500} {"train_loss": -25.379514694213867, "global_step": 290534, "epoch": 3500} {"train_loss": -25.17995834350586, "global_step": 290535, "epoch": 3500} {"train_loss": -25.437358856201172, "global_step": 290536, "epoch": 3500} {"train_loss": -25.206802368164062, "global_step": 290537, "epoch": 3500} {"train_loss": -25.54550552368164, "global_step": 290538, "epoch": 3500} {"train_loss": -25.583206176757812, "global_step": 290539, "epoch": 3500} {"train_loss": -25.55727195739746, "global_step": 290540, "epoch": 3500} {"train_loss": -25.297208786010742, "global_step": 290541, "epoch": 3500} {"train_loss": -25.853307723999023, "global_step": 290542, "epoch": 3500} {"train_loss": -25.773208618164062, "global_step": 290543, "epoch": 3500} {"train_loss": -25.86524772644043, "global_step": 290544, "epoch": 3500} {"train_loss": -25.545639038085938, "global_step": 290545, "epoch": 3500} {"train_loss": -25.565784454345703, "global_step": 290546, "epoch": 3500} {"train_loss": -25.7525691986084, "global_step": 290547, "epoch": 3500} {"train_loss": -25.314985275268555, "global_step": 290548, "epoch": 3500} {"train_loss": -25.760623931884766, "global_step": 290549, "epoch": 3500} {"train_loss": -25.57288360595703, "global_step": 290550, "epoch": 3500} {"train_loss": -24.995351791381836, "global_step": 290551, "epoch": 3500} {"train_loss": -25.78474235534668, "global_step": 290552, "epoch": 3500} {"train_loss": -25.584369659423828, "global_step": 290553, "epoch": 3500} {"train_loss": -25.0188045501709, "global_step": 290554, "epoch": 3500} {"train_loss": -25.380176544189453, "global_step": 290555, "epoch": 3500} {"train_loss": -25.7039794921875, "global_step": 290556, "epoch": 3500} {"train_loss": -25.519643783569336, "global_step": 290557, "epoch": 3500} {"train_loss": -25.228384017944336, "global_step": 290558, "epoch": 3500} {"train_loss": -25.85141372680664, "global_step": 290559, "epoch": 3500} {"train_loss": -25.28627586364746, "global_step": 290560, "epoch": 3500} {"train_loss": -25.68670654296875, "global_step": 290561, "epoch": 3500} {"train_loss": -25.659536361694336, "global_step": 290562, "epoch": 3500} {"train_loss": -25.665258407592773, "global_step": 290563, "epoch": 3500} {"train_loss": -25.451934814453125, "global_step": 290564, "epoch": 3500} {"train_loss": -25.232648849487305, "global_step": 290565, "epoch": 3500} {"train_loss": -25.785232543945312, "global_step": 290566, "epoch": 3500} {"train_loss": -25.522598266601562, "global_step": 290567, "epoch": 3500} {"train_loss": -25.973127365112305, "global_step": 290568, "epoch": 3500} {"train_loss": -24.83906364440918, "global_step": 290569, "epoch": 3500} {"train_loss": -25.068065643310547, "global_step": 290570, "epoch": 3500} {"train_loss": -24.6540584564209, "global_step": 290571, "epoch": 3500} {"train_loss": -24.7076416015625, "global_step": 290572, "epoch": 3500} {"train_loss": -25.229637145996094, "global_step": 290573, "epoch": 3500} {"train_loss": -25.78388023376465, "global_step": 290574, "epoch": 3500} {"train_loss": -24.83119773864746, "global_step": 290575, "epoch": 3500} {"train_loss": -25.362388610839844, "global_step": 290576, "epoch": 3500} {"train_loss": -25.625614166259766, "global_step": 290577, "epoch": 3500} {"train_loss": -25.204092025756836, "global_step": 290578, "epoch": 3500} {"train_loss": -25.638769149780273, "global_step": 290579, "epoch": 3500} {"train_loss": -25.359989166259766, "global_step": 290580, "epoch": 3500} {"train_loss": -25.408201217651367, "global_step": 290581, "epoch": 3500} {"train_loss": -25.417955214718738, "global_step": 290582, "epoch": 3500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6998943.0} {"train_loss": -25.296585083007812, "global_step": 290583, "epoch": 3501} {"train_loss": -24.96623992919922, "global_step": 290584, "epoch": 3501} {"train_loss": -24.47776222229004, "global_step": 290585, "epoch": 3501} {"train_loss": -25.107084274291992, "global_step": 290586, "epoch": 3501} {"train_loss": -25.015552520751953, "global_step": 290587, "epoch": 3501} {"train_loss": -24.43567657470703, "global_step": 290588, "epoch": 3501} {"train_loss": -25.11362075805664, "global_step": 290589, "epoch": 3501} {"train_loss": -25.40353012084961, "global_step": 290590, "epoch": 3501} {"train_loss": -24.802942276000977, "global_step": 290591, "epoch": 3501} {"train_loss": -24.756298065185547, "global_step": 290592, "epoch": 3501} {"train_loss": -25.04265785217285, "global_step": 290593, "epoch": 3501} {"train_loss": -24.752796173095703, "global_step": 290594, "epoch": 3501} {"train_loss": -25.30083656311035, "global_step": 290595, "epoch": 3501} {"train_loss": -25.012910842895508, "global_step": 290596, "epoch": 3501} {"train_loss": -25.308725357055664, "global_step": 290597, "epoch": 3501} {"train_loss": -25.492265701293945, "global_step": 290598, "epoch": 3501} {"train_loss": -24.95059585571289, "global_step": 290599, "epoch": 3501} {"train_loss": -25.171995162963867, "global_step": 290600, "epoch": 3501} {"train_loss": -25.087186813354492, "global_step": 290601, "epoch": 3501} {"train_loss": -25.033023834228516, "global_step": 290602, "epoch": 3501} {"train_loss": -25.167654037475586, "global_step": 290603, "epoch": 3501} {"train_loss": -25.2487850189209, "global_step": 290604, "epoch": 3501} {"train_loss": -25.3382568359375, "global_step": 290605, "epoch": 3501} {"train_loss": -25.13248062133789, "global_step": 290606, "epoch": 3501} {"train_loss": -25.319242477416992, "global_step": 290607, "epoch": 3501} {"train_loss": -25.364591598510742, "global_step": 290608, "epoch": 3501} {"train_loss": -25.41262435913086, "global_step": 290609, "epoch": 3501} {"train_loss": -25.421213150024414, "global_step": 290610, "epoch": 3501} {"train_loss": -25.769622802734375, "global_step": 290611, "epoch": 3501} {"train_loss": -25.314756393432617, "global_step": 290612, "epoch": 3501} {"train_loss": -25.746356964111328, "global_step": 290613, "epoch": 3501} {"train_loss": -25.324005126953125, "global_step": 290614, "epoch": 3501} {"train_loss": -25.570964813232422, "global_step": 290615, "epoch": 3501} {"train_loss": -25.520505905151367, "global_step": 290616, "epoch": 3501} {"train_loss": -25.88361167907715, "global_step": 290617, "epoch": 3501} {"train_loss": -25.74176597595215, "global_step": 290618, "epoch": 3501} {"train_loss": -25.807310104370117, "global_step": 290619, "epoch": 3501} {"train_loss": -25.417478561401367, "global_step": 290620, "epoch": 3501} {"train_loss": -25.320709228515625, "global_step": 290621, "epoch": 3501} {"train_loss": -25.36659049987793, "global_step": 290622, "epoch": 3501} {"train_loss": -25.395767211914062, "global_step": 290623, "epoch": 3501} {"train_loss": -25.567611694335938, "global_step": 290624, "epoch": 3501} {"train_loss": -25.407190322875977, "global_step": 290625, "epoch": 3501} {"train_loss": -25.882160186767578, "global_step": 290626, "epoch": 3501} {"train_loss": -25.7236270904541, "global_step": 290627, "epoch": 3501} {"train_loss": -25.987842559814453, "global_step": 290628, "epoch": 3501} {"train_loss": -25.546165466308594, "global_step": 290629, "epoch": 3501} {"train_loss": -25.644474029541016, "global_step": 290630, "epoch": 3501} {"train_loss": -25.67146110534668, "global_step": 290631, "epoch": 3501} {"train_loss": -25.72468376159668, "global_step": 290632, "epoch": 3501} {"train_loss": -26.070409774780273, "global_step": 290633, "epoch": 3501} {"train_loss": -25.978002548217773, "global_step": 290634, "epoch": 3501} {"train_loss": -25.6152400970459, "global_step": 290635, "epoch": 3501} {"train_loss": -25.79461669921875, "global_step": 290636, "epoch": 3501} {"train_loss": -25.525651931762695, "global_step": 290637, "epoch": 3501} {"train_loss": -25.49521827697754, "global_step": 290638, "epoch": 3501} {"train_loss": -25.348539352416992, "global_step": 290639, "epoch": 3501} {"train_loss": -25.024072647094727, "global_step": 290640, "epoch": 3501} {"train_loss": -25.55611801147461, "global_step": 290641, "epoch": 3501} {"train_loss": -25.6562557220459, "global_step": 290642, "epoch": 3501} {"train_loss": -25.324951171875, "global_step": 290643, "epoch": 3501} {"train_loss": -25.129308700561523, "global_step": 290644, "epoch": 3501} {"train_loss": -25.84645652770996, "global_step": 290645, "epoch": 3501} {"train_loss": -25.64133071899414, "global_step": 290646, "epoch": 3501} {"train_loss": -25.185333251953125, "global_step": 290647, "epoch": 3501} {"train_loss": -25.634918212890625, "global_step": 290648, "epoch": 3501} {"train_loss": -25.510530471801758, "global_step": 290649, "epoch": 3501} {"train_loss": -24.949033737182617, "global_step": 290650, "epoch": 3501} {"train_loss": -25.609827041625977, "global_step": 290651, "epoch": 3501} {"train_loss": -25.16534996032715, "global_step": 290652, "epoch": 3501} {"train_loss": -25.214956283569336, "global_step": 290653, "epoch": 3501} {"train_loss": -25.433801651000977, "global_step": 290654, "epoch": 3501} {"train_loss": -25.615346908569336, "global_step": 290655, "epoch": 3501} {"train_loss": -24.898405075073242, "global_step": 290656, "epoch": 3501} {"train_loss": -24.88846206665039, "global_step": 290657, "epoch": 3501} {"train_loss": -25.75653076171875, "global_step": 290658, "epoch": 3501} {"train_loss": -25.20994758605957, "global_step": 290659, "epoch": 3501} {"train_loss": -25.6021671295166, "global_step": 290660, "epoch": 3501} {"train_loss": -25.395965576171875, "global_step": 290661, "epoch": 3501} {"train_loss": -25.44630241394043, "global_step": 290662, "epoch": 3501} {"train_loss": -25.016576766967773, "global_step": 290663, "epoch": 3501} {"train_loss": -25.54530143737793, "global_step": 290664, "epoch": 3501} {"train_loss": -25.371676732258624, "global_step": 290665, "epoch": 3501, "val_loss": 7175328.0} {"train_loss": -25.186708450317383, "global_step": 290666, "epoch": 3502} {"train_loss": -25.306697845458984, "global_step": 290667, "epoch": 3502} {"train_loss": -25.622968673706055, "global_step": 290668, "epoch": 3502} {"train_loss": -25.255901336669922, "global_step": 290669, "epoch": 3502} {"train_loss": -25.147993087768555, "global_step": 290670, "epoch": 3502} {"train_loss": -25.536975860595703, "global_step": 290671, "epoch": 3502} {"train_loss": -25.664411544799805, "global_step": 290672, "epoch": 3502} {"train_loss": -25.35675621032715, "global_step": 290673, "epoch": 3502} {"train_loss": -25.0638484954834, "global_step": 290674, "epoch": 3502} {"train_loss": -25.269962310791016, "global_step": 290675, "epoch": 3502} {"train_loss": -25.14548683166504, "global_step": 290676, "epoch": 3502} {"train_loss": -25.312589645385742, "global_step": 290677, "epoch": 3502} {"train_loss": -25.493602752685547, "global_step": 290678, "epoch": 3502} {"train_loss": -25.591598510742188, "global_step": 290679, "epoch": 3502} {"train_loss": -25.415266036987305, "global_step": 290680, "epoch": 3502} {"train_loss": -25.6436710357666, "global_step": 290681, "epoch": 3502} {"train_loss": -25.589448928833008, "global_step": 290682, "epoch": 3502} {"train_loss": -25.274688720703125, "global_step": 290683, "epoch": 3502} {"train_loss": -25.164920806884766, "global_step": 290684, "epoch": 3502} {"train_loss": -25.538049697875977, "global_step": 290685, "epoch": 3502} {"train_loss": -25.414052963256836, "global_step": 290686, "epoch": 3502} {"train_loss": -25.06138801574707, "global_step": 290687, "epoch": 3502} {"train_loss": -25.80584144592285, "global_step": 290688, "epoch": 3502} {"train_loss": -25.433799743652344, "global_step": 290689, "epoch": 3502} {"train_loss": -25.325895309448242, "global_step": 290690, "epoch": 3502} {"train_loss": -25.631200790405273, "global_step": 290691, "epoch": 3502} {"train_loss": -25.61789894104004, "global_step": 290692, "epoch": 3502} {"train_loss": -25.394742965698242, "global_step": 290693, "epoch": 3502} {"train_loss": -25.416400909423828, "global_step": 290694, "epoch": 3502} {"train_loss": -25.58002281188965, "global_step": 290695, "epoch": 3502} {"train_loss": -25.730148315429688, "global_step": 290696, "epoch": 3502} {"train_loss": -25.448287963867188, "global_step": 290697, "epoch": 3502} {"train_loss": -25.208293914794922, "global_step": 290698, "epoch": 3502} {"train_loss": -25.97031593322754, "global_step": 290699, "epoch": 3502} {"train_loss": -25.58461570739746, "global_step": 290700, "epoch": 3502} {"train_loss": -25.7530460357666, "global_step": 290701, "epoch": 3502} {"train_loss": -25.952268600463867, "global_step": 290702, "epoch": 3502} {"train_loss": -25.801008224487305, "global_step": 290703, "epoch": 3502} {"train_loss": -25.4425048828125, "global_step": 290704, "epoch": 3502} {"train_loss": -25.225778579711914, "global_step": 290705, "epoch": 3502} {"train_loss": -25.442853927612305, "global_step": 290706, "epoch": 3502} {"train_loss": -25.1541805267334, "global_step": 290707, "epoch": 3502} {"train_loss": -25.644052505493164, "global_step": 290708, "epoch": 3502} {"train_loss": -25.846654891967773, "global_step": 290709, "epoch": 3502} {"train_loss": -25.481321334838867, "global_step": 290710, "epoch": 3502} {"train_loss": -26.02058219909668, "global_step": 290711, "epoch": 3502} {"train_loss": -25.548934936523438, "global_step": 290712, "epoch": 3502} {"train_loss": -25.63673210144043, "global_step": 290713, "epoch": 3502} {"train_loss": -25.8752384185791, "global_step": 290714, "epoch": 3502} {"train_loss": -25.517698287963867, "global_step": 290715, "epoch": 3502} {"train_loss": -25.933486938476562, "global_step": 290716, "epoch": 3502} {"train_loss": -26.02849769592285, "global_step": 290717, "epoch": 3502} {"train_loss": -25.820526123046875, "global_step": 290718, "epoch": 3502} {"train_loss": -25.55818748474121, "global_step": 290719, "epoch": 3502} {"train_loss": -25.366539001464844, "global_step": 290720, "epoch": 3502} {"train_loss": -25.607528686523438, "global_step": 290721, "epoch": 3502} {"train_loss": -25.4803409576416, "global_step": 290722, "epoch": 3502} {"train_loss": -25.456281661987305, "global_step": 290723, "epoch": 3502} {"train_loss": -25.58784294128418, "global_step": 290724, "epoch": 3502} {"train_loss": -25.370849609375, "global_step": 290725, "epoch": 3502} {"train_loss": -25.553874969482422, "global_step": 290726, "epoch": 3502} {"train_loss": -25.344573974609375, "global_step": 290727, "epoch": 3502} {"train_loss": -25.686279296875, "global_step": 290728, "epoch": 3502} {"train_loss": -25.322433471679688, "global_step": 290729, "epoch": 3502} {"train_loss": -25.447656631469727, "global_step": 290730, "epoch": 3502} {"train_loss": -25.731977462768555, "global_step": 290731, "epoch": 3502} {"train_loss": -25.695743560791016, "global_step": 290732, "epoch": 3502} {"train_loss": -25.908750534057617, "global_step": 290733, "epoch": 3502} {"train_loss": -25.358606338500977, "global_step": 290734, "epoch": 3502} {"train_loss": -25.804157257080078, "global_step": 290735, "epoch": 3502} {"train_loss": -25.686355590820312, "global_step": 290736, "epoch": 3502} {"train_loss": -25.463958740234375, "global_step": 290737, "epoch": 3502} {"train_loss": -25.746261596679688, "global_step": 290738, "epoch": 3502} {"train_loss": -25.889514923095703, "global_step": 290739, "epoch": 3502} {"train_loss": -25.756940841674805, "global_step": 290740, "epoch": 3502} {"train_loss": -25.616912841796875, "global_step": 290741, "epoch": 3502} {"train_loss": -25.69744873046875, "global_step": 290742, "epoch": 3502} {"train_loss": -25.88832664489746, "global_step": 290743, "epoch": 3502} {"train_loss": -25.814956665039062, "global_step": 290744, "epoch": 3502} {"train_loss": -25.568899154663086, "global_step": 290745, "epoch": 3502} {"train_loss": -26.11577796936035, "global_step": 290746, "epoch": 3502} {"train_loss": -26.057485580444336, "global_step": 290747, "epoch": 3502} {"train_loss": -25.556672912046135, "global_step": 290748, "epoch": 3502, "val_loss": 7043794.5} {"train_loss": -25.547645568847656, "global_step": 290749, "epoch": 3503} {"train_loss": -25.11786460876465, "global_step": 290750, "epoch": 3503} {"train_loss": -24.613508224487305, "global_step": 290751, "epoch": 3503} {"train_loss": -23.759429931640625, "global_step": 290752, "epoch": 3503} {"train_loss": -23.792455673217773, "global_step": 290753, "epoch": 3503} {"train_loss": -24.95771026611328, "global_step": 290754, "epoch": 3503} {"train_loss": -25.47621726989746, "global_step": 290755, "epoch": 3503} {"train_loss": -24.921607971191406, "global_step": 290756, "epoch": 3503} {"train_loss": -25.18597412109375, "global_step": 290757, "epoch": 3503} {"train_loss": -25.541894912719727, "global_step": 290758, "epoch": 3503} {"train_loss": -25.261167526245117, "global_step": 290759, "epoch": 3503} {"train_loss": -25.55021858215332, "global_step": 290760, "epoch": 3503} {"train_loss": -25.413816452026367, "global_step": 290761, "epoch": 3503} {"train_loss": -25.49261474609375, "global_step": 290762, "epoch": 3503} {"train_loss": -25.235288619995117, "global_step": 290763, "epoch": 3503} {"train_loss": -25.140615463256836, "global_step": 290764, "epoch": 3503} {"train_loss": -25.11762237548828, "global_step": 290765, "epoch": 3503} {"train_loss": -24.938974380493164, "global_step": 290766, "epoch": 3503} {"train_loss": -25.64922523498535, "global_step": 290767, "epoch": 3503} {"train_loss": -25.050596237182617, "global_step": 290768, "epoch": 3503} {"train_loss": -25.311269760131836, "global_step": 290769, "epoch": 3503} {"train_loss": -25.062604904174805, "global_step": 290770, "epoch": 3503} {"train_loss": -25.57089614868164, "global_step": 290771, "epoch": 3503} {"train_loss": -25.52823257446289, "global_step": 290772, "epoch": 3503} {"train_loss": -25.43626594543457, "global_step": 290773, "epoch": 3503} {"train_loss": -25.095975875854492, "global_step": 290774, "epoch": 3503} {"train_loss": -25.38504409790039, "global_step": 290775, "epoch": 3503} {"train_loss": -25.487319946289062, "global_step": 290776, "epoch": 3503} {"train_loss": -25.76258659362793, "global_step": 290777, "epoch": 3503} {"train_loss": -25.760986328125, "global_step": 290778, "epoch": 3503} {"train_loss": -25.575246810913086, "global_step": 290779, "epoch": 3503} {"train_loss": -25.48246192932129, "global_step": 290780, "epoch": 3503} {"train_loss": -25.485872268676758, "global_step": 290781, "epoch": 3503} {"train_loss": -25.75790786743164, "global_step": 290782, "epoch": 3503} {"train_loss": -25.5587100982666, "global_step": 290783, "epoch": 3503} {"train_loss": -25.609365463256836, "global_step": 290784, "epoch": 3503} {"train_loss": -25.685993194580078, "global_step": 290785, "epoch": 3503} {"train_loss": -25.707605361938477, "global_step": 290786, "epoch": 3503} {"train_loss": -25.72391700744629, "global_step": 290787, "epoch": 3503} {"train_loss": -25.995996475219727, "global_step": 290788, "epoch": 3503} {"train_loss": -25.409122467041016, "global_step": 290789, "epoch": 3503} {"train_loss": -25.72407341003418, "global_step": 290790, "epoch": 3503} {"train_loss": -25.529815673828125, "global_step": 290791, "epoch": 3503} {"train_loss": -25.439769744873047, "global_step": 290792, "epoch": 3503} {"train_loss": -25.5384521484375, "global_step": 290793, "epoch": 3503} {"train_loss": -25.651350021362305, "global_step": 290794, "epoch": 3503} {"train_loss": -25.832901000976562, "global_step": 290795, "epoch": 3503} {"train_loss": -26.0410099029541, "global_step": 290796, "epoch": 3503} {"train_loss": -25.91672706604004, "global_step": 290797, "epoch": 3503} {"train_loss": -25.601911544799805, "global_step": 290798, "epoch": 3503} {"train_loss": -25.462858200073242, "global_step": 290799, "epoch": 3503} {"train_loss": -25.824499130249023, "global_step": 290800, "epoch": 3503} {"train_loss": -25.64910888671875, "global_step": 290801, "epoch": 3503} {"train_loss": -25.677499771118164, "global_step": 290802, "epoch": 3503} {"train_loss": -25.64131736755371, "global_step": 290803, "epoch": 3503} {"train_loss": -25.946104049682617, "global_step": 290804, "epoch": 3503} {"train_loss": -25.535993576049805, "global_step": 290805, "epoch": 3503} {"train_loss": -25.54746437072754, "global_step": 290806, "epoch": 3503} {"train_loss": -25.6235408782959, "global_step": 290807, "epoch": 3503} {"train_loss": -25.418272018432617, "global_step": 290808, "epoch": 3503} {"train_loss": -25.29884147644043, "global_step": 290809, "epoch": 3503} {"train_loss": -25.32913589477539, "global_step": 290810, "epoch": 3503} {"train_loss": -25.756210327148438, "global_step": 290811, "epoch": 3503} {"train_loss": -25.796707153320312, "global_step": 290812, "epoch": 3503} {"train_loss": -25.606428146362305, "global_step": 290813, "epoch": 3503} {"train_loss": -25.340499877929688, "global_step": 290814, "epoch": 3503} {"train_loss": -25.7126522064209, "global_step": 290815, "epoch": 3503} {"train_loss": -25.775793075561523, "global_step": 290816, "epoch": 3503} {"train_loss": -25.838468551635742, "global_step": 290817, "epoch": 3503} {"train_loss": -25.214460372924805, "global_step": 290818, "epoch": 3503} {"train_loss": -25.07240867614746, "global_step": 290819, "epoch": 3503} {"train_loss": -25.321191787719727, "global_step": 290820, "epoch": 3503} {"train_loss": -25.336639404296875, "global_step": 290821, "epoch": 3503} {"train_loss": -25.863431930541992, "global_step": 290822, "epoch": 3503} {"train_loss": -25.016576766967773, "global_step": 290823, "epoch": 3503} {"train_loss": -25.558950424194336, "global_step": 290824, "epoch": 3503} {"train_loss": -25.08447265625, "global_step": 290825, "epoch": 3503} {"train_loss": -25.45577049255371, "global_step": 290826, "epoch": 3503} {"train_loss": -25.327438354492188, "global_step": 290827, "epoch": 3503} {"train_loss": -25.320995330810547, "global_step": 290828, "epoch": 3503} {"train_loss": -25.24626922607422, "global_step": 290829, "epoch": 3503} {"train_loss": -25.3546199798584, "global_step": 290830, "epoch": 3503} {"train_loss": -25.421434264585198, "global_step": 290831, "epoch": 3503, "val_loss": 7154883.0} {"train_loss": -24.875680923461914, "global_step": 290832, "epoch": 3504} {"train_loss": -24.932952880859375, "global_step": 290833, "epoch": 3504} {"train_loss": -25.16592025756836, "global_step": 290834, "epoch": 3504} {"train_loss": -25.53938102722168, "global_step": 290835, "epoch": 3504} {"train_loss": -24.984283447265625, "global_step": 290836, "epoch": 3504} {"train_loss": -25.018213272094727, "global_step": 290837, "epoch": 3504} {"train_loss": -25.413984298706055, "global_step": 290838, "epoch": 3504} {"train_loss": -25.212289810180664, "global_step": 290839, "epoch": 3504} {"train_loss": -25.296812057495117, "global_step": 290840, "epoch": 3504} {"train_loss": -25.407196044921875, "global_step": 290841, "epoch": 3504} {"train_loss": -25.300535202026367, "global_step": 290842, "epoch": 3504} {"train_loss": -25.334402084350586, "global_step": 290843, "epoch": 3504} {"train_loss": -25.4471378326416, "global_step": 290844, "epoch": 3504} {"train_loss": -25.360567092895508, "global_step": 290845, "epoch": 3504} {"train_loss": -25.2404842376709, "global_step": 290846, "epoch": 3504} {"train_loss": -25.355255126953125, "global_step": 290847, "epoch": 3504} {"train_loss": -25.645145416259766, "global_step": 290848, "epoch": 3504} {"train_loss": -26.025821685791016, "global_step": 290849, "epoch": 3504} {"train_loss": -25.581254959106445, "global_step": 290850, "epoch": 3504} {"train_loss": -25.540470123291016, "global_step": 290851, "epoch": 3504} {"train_loss": -25.464834213256836, "global_step": 290852, "epoch": 3504} {"train_loss": -25.103971481323242, "global_step": 290853, "epoch": 3504} {"train_loss": -25.2886905670166, "global_step": 290854, "epoch": 3504} {"train_loss": -25.65805435180664, "global_step": 290855, "epoch": 3504} {"train_loss": -25.470752716064453, "global_step": 290856, "epoch": 3504} {"train_loss": -25.52216339111328, "global_step": 290857, "epoch": 3504} {"train_loss": -25.48226547241211, "global_step": 290858, "epoch": 3504} {"train_loss": -25.00452995300293, "global_step": 290859, "epoch": 3504} {"train_loss": -25.28531265258789, "global_step": 290860, "epoch": 3504} {"train_loss": -25.35746955871582, "global_step": 290861, "epoch": 3504} {"train_loss": -25.548261642456055, "global_step": 290862, "epoch": 3504} {"train_loss": -25.85744285583496, "global_step": 290863, "epoch": 3504} {"train_loss": -25.2136287689209, "global_step": 290864, "epoch": 3504} {"train_loss": -25.339630126953125, "global_step": 290865, "epoch": 3504} {"train_loss": -25.378694534301758, "global_step": 290866, "epoch": 3504} {"train_loss": -25.13075828552246, "global_step": 290867, "epoch": 3504} {"train_loss": -26.077362060546875, "global_step": 290868, "epoch": 3504} {"train_loss": -25.32440948486328, "global_step": 290869, "epoch": 3504} {"train_loss": -25.382186889648438, "global_step": 290870, "epoch": 3504} {"train_loss": -25.734994888305664, "global_step": 290871, "epoch": 3504} {"train_loss": -25.540136337280273, "global_step": 290872, "epoch": 3504} {"train_loss": -25.48969841003418, "global_step": 290873, "epoch": 3504} {"train_loss": -25.534191131591797, "global_step": 290874, "epoch": 3504} {"train_loss": -25.652502059936523, "global_step": 290875, "epoch": 3504} {"train_loss": -25.352767944335938, "global_step": 290876, "epoch": 3504} {"train_loss": -25.51987648010254, "global_step": 290877, "epoch": 3504} {"train_loss": -25.837339401245117, "global_step": 290878, "epoch": 3504} {"train_loss": -25.355512619018555, "global_step": 290879, "epoch": 3504} {"train_loss": -25.439748764038086, "global_step": 290880, "epoch": 3504} {"train_loss": -25.604536056518555, "global_step": 290881, "epoch": 3504} {"train_loss": -25.67827796936035, "global_step": 290882, "epoch": 3504} {"train_loss": -25.692441940307617, "global_step": 290883, "epoch": 3504} {"train_loss": -25.751453399658203, "global_step": 290884, "epoch": 3504} {"train_loss": -25.648468017578125, "global_step": 290885, "epoch": 3504} {"train_loss": -25.513141632080078, "global_step": 290886, "epoch": 3504} {"train_loss": -25.17852210998535, "global_step": 290887, "epoch": 3504} {"train_loss": -25.307748794555664, "global_step": 290888, "epoch": 3504} {"train_loss": -25.386938095092773, "global_step": 290889, "epoch": 3504} {"train_loss": -24.995849609375, "global_step": 290890, "epoch": 3504} {"train_loss": -24.768211364746094, "global_step": 290891, "epoch": 3504} {"train_loss": -24.980567932128906, "global_step": 290892, "epoch": 3504} {"train_loss": -25.19668960571289, "global_step": 290893, "epoch": 3504} {"train_loss": -25.232154846191406, "global_step": 290894, "epoch": 3504} {"train_loss": -25.57100486755371, "global_step": 290895, "epoch": 3504} {"train_loss": -25.56773567199707, "global_step": 290896, "epoch": 3504} {"train_loss": -25.952136993408203, "global_step": 290897, "epoch": 3504} {"train_loss": -25.381248474121094, "global_step": 290898, "epoch": 3504} {"train_loss": -25.707778930664062, "global_step": 290899, "epoch": 3504} {"train_loss": -25.374555587768555, "global_step": 290900, "epoch": 3504} {"train_loss": -25.46160888671875, "global_step": 290901, "epoch": 3504} {"train_loss": -25.307209014892578, "global_step": 290902, "epoch": 3504} {"train_loss": -25.58919334411621, "global_step": 290903, "epoch": 3504} {"train_loss": -25.32004737854004, "global_step": 290904, "epoch": 3504} {"train_loss": -25.43549919128418, "global_step": 290905, "epoch": 3504} {"train_loss": -25.49124526977539, "global_step": 290906, "epoch": 3504} {"train_loss": -25.35015869140625, "global_step": 290907, "epoch": 3504} {"train_loss": -25.61785888671875, "global_step": 290908, "epoch": 3504} {"train_loss": -25.536001205444336, "global_step": 290909, "epoch": 3504} {"train_loss": -25.214923858642578, "global_step": 290910, "epoch": 3504} {"train_loss": -25.436384201049805, "global_step": 290911, "epoch": 3504} {"train_loss": -25.64155387878418, "global_step": 290912, "epoch": 3504} {"train_loss": -25.442970275878906, "global_step": 290913, "epoch": 3504} {"train_loss": -25.430753340204078, "global_step": 290914, "epoch": 3504, "val_loss": 7250883.0} {"train_loss": -25.1193790435791, "global_step": 290915, "epoch": 3505} {"train_loss": -25.478137969970703, "global_step": 290916, "epoch": 3505} {"train_loss": -25.214757919311523, "global_step": 290917, "epoch": 3505} {"train_loss": -25.251405715942383, "global_step": 290918, "epoch": 3505} {"train_loss": -25.005895614624023, "global_step": 290919, "epoch": 3505} {"train_loss": -25.219696044921875, "global_step": 290920, "epoch": 3505} {"train_loss": -25.087345123291016, "global_step": 290921, "epoch": 3505} {"train_loss": -24.788679122924805, "global_step": 290922, "epoch": 3505} {"train_loss": -25.471893310546875, "global_step": 290923, "epoch": 3505} {"train_loss": -25.37323760986328, "global_step": 290924, "epoch": 3505} {"train_loss": -25.209409713745117, "global_step": 290925, "epoch": 3505} {"train_loss": -25.435300827026367, "global_step": 290926, "epoch": 3505} {"train_loss": -25.32762908935547, "global_step": 290927, "epoch": 3505} {"train_loss": -25.165544509887695, "global_step": 290928, "epoch": 3505} {"train_loss": -25.703842163085938, "global_step": 290929, "epoch": 3505} {"train_loss": -25.636022567749023, "global_step": 290930, "epoch": 3505} {"train_loss": -25.49356460571289, "global_step": 290931, "epoch": 3505} {"train_loss": -25.47767448425293, "global_step": 290932, "epoch": 3505} {"train_loss": -25.481220245361328, "global_step": 290933, "epoch": 3505} {"train_loss": -25.381961822509766, "global_step": 290934, "epoch": 3505} {"train_loss": -25.54047203063965, "global_step": 290935, "epoch": 3505} {"train_loss": -25.718399047851562, "global_step": 290936, "epoch": 3505} {"train_loss": -25.390356063842773, "global_step": 290937, "epoch": 3505} {"train_loss": -25.9298152923584, "global_step": 290938, "epoch": 3505} {"train_loss": -25.416574478149414, "global_step": 290939, "epoch": 3505} {"train_loss": -25.270965576171875, "global_step": 290940, "epoch": 3505} {"train_loss": -25.458908081054688, "global_step": 290941, "epoch": 3505} {"train_loss": -25.53382682800293, "global_step": 290942, "epoch": 3505} {"train_loss": -25.34198760986328, "global_step": 290943, "epoch": 3505} {"train_loss": -25.464731216430664, "global_step": 290944, "epoch": 3505} {"train_loss": -25.657642364501953, "global_step": 290945, "epoch": 3505} {"train_loss": -25.44673728942871, "global_step": 290946, "epoch": 3505} {"train_loss": -25.61797523498535, "global_step": 290947, "epoch": 3505} {"train_loss": -25.91839599609375, "global_step": 290948, "epoch": 3505} {"train_loss": -25.65302085876465, "global_step": 290949, "epoch": 3505} {"train_loss": -25.73459243774414, "global_step": 290950, "epoch": 3505} {"train_loss": -25.561691284179688, "global_step": 290951, "epoch": 3505} {"train_loss": -25.582138061523438, "global_step": 290952, "epoch": 3505} {"train_loss": -25.451099395751953, "global_step": 290953, "epoch": 3505} {"train_loss": -25.64566993713379, "global_step": 290954, "epoch": 3505} {"train_loss": -25.55023193359375, "global_step": 290955, "epoch": 3505} {"train_loss": -25.899351119995117, "global_step": 290956, "epoch": 3505} {"train_loss": -25.84331703186035, "global_step": 290957, "epoch": 3505} {"train_loss": -25.74614906311035, "global_step": 290958, "epoch": 3505} {"train_loss": -25.477025985717773, "global_step": 290959, "epoch": 3505} {"train_loss": -25.863080978393555, "global_step": 290960, "epoch": 3505} {"train_loss": -25.41082000732422, "global_step": 290961, "epoch": 3505} {"train_loss": -25.798147201538086, "global_step": 290962, "epoch": 3505} {"train_loss": -25.797452926635742, "global_step": 290963, "epoch": 3505} {"train_loss": -26.001073837280273, "global_step": 290964, "epoch": 3505} {"train_loss": -25.576419830322266, "global_step": 290965, "epoch": 3505} {"train_loss": -25.632007598876953, "global_step": 290966, "epoch": 3505} {"train_loss": -25.934009552001953, "global_step": 290967, "epoch": 3505} {"train_loss": -25.865808486938477, "global_step": 290968, "epoch": 3505} {"train_loss": -25.77520179748535, "global_step": 290969, "epoch": 3505} {"train_loss": -25.7928466796875, "global_step": 290970, "epoch": 3505} {"train_loss": -25.825103759765625, "global_step": 290971, "epoch": 3505} {"train_loss": -25.78566551208496, "global_step": 290972, "epoch": 3505} {"train_loss": -25.306610107421875, "global_step": 290973, "epoch": 3505} {"train_loss": -25.20832633972168, "global_step": 290974, "epoch": 3505} {"train_loss": -25.488143920898438, "global_step": 290975, "epoch": 3505} {"train_loss": -26.197132110595703, "global_step": 290976, "epoch": 3505} {"train_loss": -25.418865203857422, "global_step": 290977, "epoch": 3505} {"train_loss": -25.40437889099121, "global_step": 290978, "epoch": 3505} {"train_loss": -25.500612258911133, "global_step": 290979, "epoch": 3505} {"train_loss": -25.48518943786621, "global_step": 290980, "epoch": 3505} {"train_loss": -25.60003662109375, "global_step": 290981, "epoch": 3505} {"train_loss": -25.478307723999023, "global_step": 290982, "epoch": 3505} {"train_loss": -25.641361236572266, "global_step": 290983, "epoch": 3505} {"train_loss": -25.94110679626465, "global_step": 290984, "epoch": 3505} {"train_loss": -26.050561904907227, "global_step": 290985, "epoch": 3505} {"train_loss": -25.31378173828125, "global_step": 290986, "epoch": 3505} {"train_loss": -25.481733322143555, "global_step": 290987, "epoch": 3505} {"train_loss": -25.574796676635742, "global_step": 290988, "epoch": 3505} {"train_loss": -25.819852828979492, "global_step": 290989, "epoch": 3505} {"train_loss": -24.999269485473633, "global_step": 290990, "epoch": 3505} {"train_loss": -25.322769165039062, "global_step": 290991, "epoch": 3505} {"train_loss": -25.77728271484375, "global_step": 290992, "epoch": 3505} {"train_loss": -25.293113708496094, "global_step": 290993, "epoch": 3505} {"train_loss": -25.648473739624023, "global_step": 290994, "epoch": 3505} {"train_loss": -25.256500244140625, "global_step": 290995, "epoch": 3505} {"train_loss": -25.650365829467773, "global_step": 290996, "epoch": 3505} {"train_loss": -25.52443777796734, "global_step": 290997, "epoch": 3505, "val_loss": 7219152.0} {"train_loss": -24.476099014282227, "global_step": 290998, "epoch": 3506} {"train_loss": -23.69838523864746, "global_step": 290999, "epoch": 3506} {"train_loss": -25.05630874633789, "global_step": 291000, "epoch": 3506} {"train_loss": -24.36052131652832, "global_step": 291001, "epoch": 3506} {"train_loss": -24.433828353881836, "global_step": 291002, "epoch": 3506} {"train_loss": -25.16830825805664, "global_step": 291003, "epoch": 3506} {"train_loss": -23.722431182861328, "global_step": 291004, "epoch": 3506} {"train_loss": -24.517959594726562, "global_step": 291005, "epoch": 3506} {"train_loss": -24.888090133666992, "global_step": 291006, "epoch": 3506} {"train_loss": -24.816417694091797, "global_step": 291007, "epoch": 3506} {"train_loss": -24.915836334228516, "global_step": 291008, "epoch": 3506} {"train_loss": -24.70926856994629, "global_step": 291009, "epoch": 3506} {"train_loss": -25.33399772644043, "global_step": 291010, "epoch": 3506} {"train_loss": -24.63088607788086, "global_step": 291011, "epoch": 3506} {"train_loss": -24.979476928710938, "global_step": 291012, "epoch": 3506} {"train_loss": -25.045276641845703, "global_step": 291013, "epoch": 3506} {"train_loss": -24.862131118774414, "global_step": 291014, "epoch": 3506} {"train_loss": -24.900903701782227, "global_step": 291015, "epoch": 3506} {"train_loss": -24.608428955078125, "global_step": 291016, "epoch": 3506} {"train_loss": -24.913938522338867, "global_step": 291017, "epoch": 3506} {"train_loss": -25.322668075561523, "global_step": 291018, "epoch": 3506} {"train_loss": -25.26373291015625, "global_step": 291019, "epoch": 3506} {"train_loss": -25.44913673400879, "global_step": 291020, "epoch": 3506} {"train_loss": -25.32807731628418, "global_step": 291021, "epoch": 3506} {"train_loss": -25.139326095581055, "global_step": 291022, "epoch": 3506} {"train_loss": -25.150487899780273, "global_step": 291023, "epoch": 3506} {"train_loss": -25.61553955078125, "global_step": 291024, "epoch": 3506} {"train_loss": -25.442575454711914, "global_step": 291025, "epoch": 3506} {"train_loss": -25.335346221923828, "global_step": 291026, "epoch": 3506} {"train_loss": -25.633121490478516, "global_step": 291027, "epoch": 3506} {"train_loss": -25.773298263549805, "global_step": 291028, "epoch": 3506} {"train_loss": -25.10085105895996, "global_step": 291029, "epoch": 3506} {"train_loss": -25.508806228637695, "global_step": 291030, "epoch": 3506} {"train_loss": -25.566381454467773, "global_step": 291031, "epoch": 3506} {"train_loss": -25.565053939819336, "global_step": 291032, "epoch": 3506} {"train_loss": -25.472660064697266, "global_step": 291033, "epoch": 3506} {"train_loss": -25.44227409362793, "global_step": 291034, "epoch": 3506} {"train_loss": -25.392606735229492, "global_step": 291035, "epoch": 3506} {"train_loss": -25.41533088684082, "global_step": 291036, "epoch": 3506} {"train_loss": -25.18815040588379, "global_step": 291037, "epoch": 3506} {"train_loss": -25.482255935668945, "global_step": 291038, "epoch": 3506} {"train_loss": -25.80365562438965, "global_step": 291039, "epoch": 3506} {"train_loss": -25.438724517822266, "global_step": 291040, "epoch": 3506} {"train_loss": -25.895950317382812, "global_step": 291041, "epoch": 3506} {"train_loss": -25.507200241088867, "global_step": 291042, "epoch": 3506} {"train_loss": -25.652637481689453, "global_step": 291043, "epoch": 3506} {"train_loss": -25.67950439453125, "global_step": 291044, "epoch": 3506} {"train_loss": -25.35748863220215, "global_step": 291045, "epoch": 3506} {"train_loss": -25.909442901611328, "global_step": 291046, "epoch": 3506} {"train_loss": -25.46630859375, "global_step": 291047, "epoch": 3506} {"train_loss": -25.77387046813965, "global_step": 291048, "epoch": 3506} {"train_loss": -25.445837020874023, "global_step": 291049, "epoch": 3506} {"train_loss": -25.844669342041016, "global_step": 291050, "epoch": 3506} {"train_loss": -25.932968139648438, "global_step": 291051, "epoch": 3506} {"train_loss": -25.366180419921875, "global_step": 291052, "epoch": 3506} {"train_loss": -25.6966495513916, "global_step": 291053, "epoch": 3506} {"train_loss": -25.8853759765625, "global_step": 291054, "epoch": 3506} {"train_loss": -25.644269943237305, "global_step": 291055, "epoch": 3506} {"train_loss": -25.663190841674805, "global_step": 291056, "epoch": 3506} {"train_loss": -25.59351348876953, "global_step": 291057, "epoch": 3506} {"train_loss": -25.24224090576172, "global_step": 291058, "epoch": 3506} {"train_loss": -25.5568790435791, "global_step": 291059, "epoch": 3506} {"train_loss": -25.691736221313477, "global_step": 291060, "epoch": 3506} {"train_loss": -25.595449447631836, "global_step": 291061, "epoch": 3506} {"train_loss": -25.935293197631836, "global_step": 291062, "epoch": 3506} {"train_loss": -25.91370964050293, "global_step": 291063, "epoch": 3506} {"train_loss": -25.828428268432617, "global_step": 291064, "epoch": 3506} {"train_loss": -25.466049194335938, "global_step": 291065, "epoch": 3506} {"train_loss": -25.931812286376953, "global_step": 291066, "epoch": 3506} {"train_loss": -25.8886661529541, "global_step": 291067, "epoch": 3506} {"train_loss": -25.541851043701172, "global_step": 291068, "epoch": 3506} {"train_loss": -25.57282066345215, "global_step": 291069, "epoch": 3506} {"train_loss": -25.751089096069336, "global_step": 291070, "epoch": 3506} {"train_loss": -25.82856559753418, "global_step": 291071, "epoch": 3506} {"train_loss": -25.504690170288086, "global_step": 291072, "epoch": 3506} {"train_loss": -25.478992462158203, "global_step": 291073, "epoch": 3506} {"train_loss": -25.88435173034668, "global_step": 291074, "epoch": 3506} {"train_loss": -25.576190948486328, "global_step": 291075, "epoch": 3506} {"train_loss": -25.321170806884766, "global_step": 291076, "epoch": 3506} {"train_loss": -25.440139770507812, "global_step": 291077, "epoch": 3506} {"train_loss": -24.848350524902344, "global_step": 291078, "epoch": 3506} {"train_loss": -25.147912979125977, "global_step": 291079, "epoch": 3506} {"train_loss": -25.348859901887824, "global_step": 291080, "epoch": 3506, "val_loss": 7167821.0} {"train_loss": -24.829227447509766, "global_step": 291081, "epoch": 3507} {"train_loss": -23.7288875579834, "global_step": 291082, "epoch": 3507} {"train_loss": -24.3269100189209, "global_step": 291083, "epoch": 3507} {"train_loss": -24.544113159179688, "global_step": 291084, "epoch": 3507} {"train_loss": -24.87277603149414, "global_step": 291085, "epoch": 3507} {"train_loss": -24.484310150146484, "global_step": 291086, "epoch": 3507} {"train_loss": -24.46280288696289, "global_step": 291087, "epoch": 3507} {"train_loss": -24.742448806762695, "global_step": 291088, "epoch": 3507} {"train_loss": -24.85999870300293, "global_step": 291089, "epoch": 3507} {"train_loss": -24.596744537353516, "global_step": 291090, "epoch": 3507} {"train_loss": -24.712631225585938, "global_step": 291091, "epoch": 3507} {"train_loss": -24.616138458251953, "global_step": 291092, "epoch": 3507} {"train_loss": -24.70356559753418, "global_step": 291093, "epoch": 3507} {"train_loss": -24.84178924560547, "global_step": 291094, "epoch": 3507} {"train_loss": -24.85321044921875, "global_step": 291095, "epoch": 3507} {"train_loss": -24.85248374938965, "global_step": 291096, "epoch": 3507} {"train_loss": -24.770044326782227, "global_step": 291097, "epoch": 3507} {"train_loss": -24.948373794555664, "global_step": 291098, "epoch": 3507} {"train_loss": -24.592239379882812, "global_step": 291099, "epoch": 3507} {"train_loss": -25.0018310546875, "global_step": 291100, "epoch": 3507} {"train_loss": -25.146739959716797, "global_step": 291101, "epoch": 3507} {"train_loss": -25.099246978759766, "global_step": 291102, "epoch": 3507} {"train_loss": -25.251407623291016, "global_step": 291103, "epoch": 3507} {"train_loss": -25.106430053710938, "global_step": 291104, "epoch": 3507} {"train_loss": -25.030868530273438, "global_step": 291105, "epoch": 3507} {"train_loss": -25.23523712158203, "global_step": 291106, "epoch": 3507} {"train_loss": -24.918684005737305, "global_step": 291107, "epoch": 3507} {"train_loss": -25.13288688659668, "global_step": 291108, "epoch": 3507} {"train_loss": -25.221694946289062, "global_step": 291109, "epoch": 3507} {"train_loss": -25.4892520904541, "global_step": 291110, "epoch": 3507} {"train_loss": -25.027856826782227, "global_step": 291111, "epoch": 3507} {"train_loss": -25.7196102142334, "global_step": 291112, "epoch": 3507} {"train_loss": -25.22134780883789, "global_step": 291113, "epoch": 3507} {"train_loss": -25.388046264648438, "global_step": 291114, "epoch": 3507} {"train_loss": -25.481216430664062, "global_step": 291115, "epoch": 3507} {"train_loss": -25.401206970214844, "global_step": 291116, "epoch": 3507} {"train_loss": -25.766571044921875, "global_step": 291117, "epoch": 3507} {"train_loss": -25.73975944519043, "global_step": 291118, "epoch": 3507} {"train_loss": -25.685077667236328, "global_step": 291119, "epoch": 3507} {"train_loss": -25.563526153564453, "global_step": 291120, "epoch": 3507} {"train_loss": -25.422697067260742, "global_step": 291121, "epoch": 3507} {"train_loss": -25.80198097229004, "global_step": 291122, "epoch": 3507} {"train_loss": -26.112546920776367, "global_step": 291123, "epoch": 3507} {"train_loss": -25.3684139251709, "global_step": 291124, "epoch": 3507} {"train_loss": -25.70181655883789, "global_step": 291125, "epoch": 3507} {"train_loss": -25.78120231628418, "global_step": 291126, "epoch": 3507} {"train_loss": -25.501779556274414, "global_step": 291127, "epoch": 3507} {"train_loss": -25.418132781982422, "global_step": 291128, "epoch": 3507} {"train_loss": -25.255632400512695, "global_step": 291129, "epoch": 3507} {"train_loss": -25.8581485748291, "global_step": 291130, "epoch": 3507} {"train_loss": -25.761499404907227, "global_step": 291131, "epoch": 3507} {"train_loss": -25.697362899780273, "global_step": 291132, "epoch": 3507} {"train_loss": -25.587100982666016, "global_step": 291133, "epoch": 3507} {"train_loss": -25.41673469543457, "global_step": 291134, "epoch": 3507} {"train_loss": -25.977216720581055, "global_step": 291135, "epoch": 3507} {"train_loss": -25.40326690673828, "global_step": 291136, "epoch": 3507} {"train_loss": -25.762805938720703, "global_step": 291137, "epoch": 3507} {"train_loss": -25.591493606567383, "global_step": 291138, "epoch": 3507} {"train_loss": -25.512569427490234, "global_step": 291139, "epoch": 3507} {"train_loss": -25.62342643737793, "global_step": 291140, "epoch": 3507} {"train_loss": -25.767807006835938, "global_step": 291141, "epoch": 3507} {"train_loss": -25.775196075439453, "global_step": 291142, "epoch": 3507} {"train_loss": -25.528301239013672, "global_step": 291143, "epoch": 3507} {"train_loss": -25.21089744567871, "global_step": 291144, "epoch": 3507} {"train_loss": -25.70961570739746, "global_step": 291145, "epoch": 3507} {"train_loss": -25.3625545501709, "global_step": 291146, "epoch": 3507} {"train_loss": -25.96564292907715, "global_step": 291147, "epoch": 3507} {"train_loss": -25.872150421142578, "global_step": 291148, "epoch": 3507} {"train_loss": -25.49148178100586, "global_step": 291149, "epoch": 3507} {"train_loss": -25.906585693359375, "global_step": 291150, "epoch": 3507} {"train_loss": -25.5418701171875, "global_step": 291151, "epoch": 3507} {"train_loss": -25.69880485534668, "global_step": 291152, "epoch": 3507} {"train_loss": -25.409351348876953, "global_step": 291153, "epoch": 3507} {"train_loss": -25.919240951538086, "global_step": 291154, "epoch": 3507} {"train_loss": -25.664798736572266, "global_step": 291155, "epoch": 3507} {"train_loss": -25.82683753967285, "global_step": 291156, "epoch": 3507} {"train_loss": -25.83963966369629, "global_step": 291157, "epoch": 3507} {"train_loss": -25.688379287719727, "global_step": 291158, "epoch": 3507} {"train_loss": -25.397153854370117, "global_step": 291159, "epoch": 3507} {"train_loss": -25.882110595703125, "global_step": 291160, "epoch": 3507} {"train_loss": -25.36321449279785, "global_step": 291161, "epoch": 3507} {"train_loss": -25.568586349487305, "global_step": 291162, "epoch": 3507} {"train_loss": -25.3087226913636, "global_step": 291163, "epoch": 3507, "val_loss": 7062373.0} {"train_loss": -24.753469467163086, "global_step": 291164, "epoch": 3508} {"train_loss": -24.849496841430664, "global_step": 291165, "epoch": 3508} {"train_loss": -24.51157569885254, "global_step": 291166, "epoch": 3508} {"train_loss": -25.293384552001953, "global_step": 291167, "epoch": 3508} {"train_loss": -24.456632614135742, "global_step": 291168, "epoch": 3508} {"train_loss": -25.121234893798828, "global_step": 291169, "epoch": 3508} {"train_loss": -24.6617431640625, "global_step": 291170, "epoch": 3508} {"train_loss": -24.69783592224121, "global_step": 291171, "epoch": 3508} {"train_loss": -24.964624404907227, "global_step": 291172, "epoch": 3508} {"train_loss": -24.745807647705078, "global_step": 291173, "epoch": 3508} {"train_loss": -24.704256057739258, "global_step": 291174, "epoch": 3508} {"train_loss": -24.874832153320312, "global_step": 291175, "epoch": 3508} {"train_loss": -25.068511962890625, "global_step": 291176, "epoch": 3508} {"train_loss": -24.5155029296875, "global_step": 291177, "epoch": 3508} {"train_loss": -24.70167350769043, "global_step": 291178, "epoch": 3508} {"train_loss": -24.96302032470703, "global_step": 291179, "epoch": 3508} {"train_loss": -24.66261100769043, "global_step": 291180, "epoch": 3508} {"train_loss": -24.8062801361084, "global_step": 291181, "epoch": 3508} {"train_loss": -25.368589401245117, "global_step": 291182, "epoch": 3508} {"train_loss": -24.717201232910156, "global_step": 291183, "epoch": 3508} {"train_loss": -24.913286209106445, "global_step": 291184, "epoch": 3508} {"train_loss": -25.099763870239258, "global_step": 291185, "epoch": 3508} {"train_loss": -24.952611923217773, "global_step": 291186, "epoch": 3508} {"train_loss": -24.6966609954834, "global_step": 291187, "epoch": 3508} {"train_loss": -25.117176055908203, "global_step": 291188, "epoch": 3508} {"train_loss": -24.958837509155273, "global_step": 291189, "epoch": 3508} {"train_loss": -25.46630859375, "global_step": 291190, "epoch": 3508} {"train_loss": -25.282608032226562, "global_step": 291191, "epoch": 3508} {"train_loss": -25.432191848754883, "global_step": 291192, "epoch": 3508} {"train_loss": -25.262271881103516, "global_step": 291193, "epoch": 3508} {"train_loss": -25.399906158447266, "global_step": 291194, "epoch": 3508} {"train_loss": -25.31373405456543, "global_step": 291195, "epoch": 3508} {"train_loss": -25.489728927612305, "global_step": 291196, "epoch": 3508} {"train_loss": -25.26141929626465, "global_step": 291197, "epoch": 3508} {"train_loss": -25.181318283081055, "global_step": 291198, "epoch": 3508} {"train_loss": -25.062137603759766, "global_step": 291199, "epoch": 3508} {"train_loss": -25.377988815307617, "global_step": 291200, "epoch": 3508} {"train_loss": -25.115201950073242, "global_step": 291201, "epoch": 3508} {"train_loss": -25.562734603881836, "global_step": 291202, "epoch": 3508} {"train_loss": -25.520559310913086, "global_step": 291203, "epoch": 3508} {"train_loss": -25.600910186767578, "global_step": 291204, "epoch": 3508} {"train_loss": -25.402151107788086, "global_step": 291205, "epoch": 3508} {"train_loss": -25.90496253967285, "global_step": 291206, "epoch": 3508} {"train_loss": -25.738195419311523, "global_step": 291207, "epoch": 3508} {"train_loss": -25.643335342407227, "global_step": 291208, "epoch": 3508} {"train_loss": -25.654743194580078, "global_step": 291209, "epoch": 3508} {"train_loss": -25.375717163085938, "global_step": 291210, "epoch": 3508} {"train_loss": -25.6713809967041, "global_step": 291211, "epoch": 3508} {"train_loss": -25.379865646362305, "global_step": 291212, "epoch": 3508} {"train_loss": -25.44022560119629, "global_step": 291213, "epoch": 3508} {"train_loss": -25.717975616455078, "global_step": 291214, "epoch": 3508} {"train_loss": -25.48227882385254, "global_step": 291215, "epoch": 3508} {"train_loss": -25.52651023864746, "global_step": 291216, "epoch": 3508} {"train_loss": -25.601791381835938, "global_step": 291217, "epoch": 3508} {"train_loss": -25.234981536865234, "global_step": 291218, "epoch": 3508} {"train_loss": -25.594593048095703, "global_step": 291219, "epoch": 3508} {"train_loss": -25.529882431030273, "global_step": 291220, "epoch": 3508} {"train_loss": -25.384822845458984, "global_step": 291221, "epoch": 3508} {"train_loss": -25.67344093322754, "global_step": 291222, "epoch": 3508} {"train_loss": -25.970041275024414, "global_step": 291223, "epoch": 3508} {"train_loss": -25.3259334564209, "global_step": 291224, "epoch": 3508} {"train_loss": -25.75779151916504, "global_step": 291225, "epoch": 3508} {"train_loss": -25.858213424682617, "global_step": 291226, "epoch": 3508} {"train_loss": -25.884735107421875, "global_step": 291227, "epoch": 3508} {"train_loss": -25.559207916259766, "global_step": 291228, "epoch": 3508} {"train_loss": -25.667139053344727, "global_step": 291229, "epoch": 3508} {"train_loss": -25.740360260009766, "global_step": 291230, "epoch": 3508} {"train_loss": -25.708267211914062, "global_step": 291231, "epoch": 3508} {"train_loss": -25.962377548217773, "global_step": 291232, "epoch": 3508} {"train_loss": -25.734716415405273, "global_step": 291233, "epoch": 3508} {"train_loss": -25.397552490234375, "global_step": 291234, "epoch": 3508} {"train_loss": -25.633106231689453, "global_step": 291235, "epoch": 3508} {"train_loss": -25.595197677612305, "global_step": 291236, "epoch": 3508} {"train_loss": -25.74920082092285, "global_step": 291237, "epoch": 3508} {"train_loss": -25.5147762298584, "global_step": 291238, "epoch": 3508} {"train_loss": -25.518779754638672, "global_step": 291239, "epoch": 3508} {"train_loss": -25.72193717956543, "global_step": 291240, "epoch": 3508} {"train_loss": -25.455310821533203, "global_step": 291241, "epoch": 3508} {"train_loss": -25.798742294311523, "global_step": 291242, "epoch": 3508} {"train_loss": -25.369047164916992, "global_step": 291243, "epoch": 3508} {"train_loss": -25.6647891998291, "global_step": 291244, "epoch": 3508} {"train_loss": -25.627914428710938, "global_step": 291245, "epoch": 3508} {"train_loss": -25.331536810082124, "global_step": 291246, "epoch": 3508, "val_loss": 7043503.0} {"train_loss": -24.89539909362793, "global_step": 291247, "epoch": 3509} {"train_loss": -25.292661666870117, "global_step": 291248, "epoch": 3509} {"train_loss": -24.658445358276367, "global_step": 291249, "epoch": 3509} {"train_loss": -25.200923919677734, "global_step": 291250, "epoch": 3509} {"train_loss": -25.258094787597656, "global_step": 291251, "epoch": 3509} {"train_loss": -24.891164779663086, "global_step": 291252, "epoch": 3509} {"train_loss": -25.277652740478516, "global_step": 291253, "epoch": 3509} {"train_loss": -25.31621742248535, "global_step": 291254, "epoch": 3509} {"train_loss": -25.17864990234375, "global_step": 291255, "epoch": 3509} {"train_loss": -25.129112243652344, "global_step": 291256, "epoch": 3509} {"train_loss": -25.156503677368164, "global_step": 291257, "epoch": 3509} {"train_loss": -25.22676658630371, "global_step": 291258, "epoch": 3509} {"train_loss": -25.056747436523438, "global_step": 291259, "epoch": 3509} {"train_loss": -25.001056671142578, "global_step": 291260, "epoch": 3509} {"train_loss": -25.488943099975586, "global_step": 291261, "epoch": 3509} {"train_loss": -25.366891860961914, "global_step": 291262, "epoch": 3509} {"train_loss": -25.263696670532227, "global_step": 291263, "epoch": 3509} {"train_loss": -25.48666000366211, "global_step": 291264, "epoch": 3509} {"train_loss": -25.535634994506836, "global_step": 291265, "epoch": 3509} {"train_loss": -25.246213912963867, "global_step": 291266, "epoch": 3509} {"train_loss": -25.630414962768555, "global_step": 291267, "epoch": 3509} {"train_loss": -25.64923667907715, "global_step": 291268, "epoch": 3509} {"train_loss": -25.514951705932617, "global_step": 291269, "epoch": 3509} {"train_loss": -25.539892196655273, "global_step": 291270, "epoch": 3509} {"train_loss": -25.322322845458984, "global_step": 291271, "epoch": 3509} {"train_loss": -25.296934127807617, "global_step": 291272, "epoch": 3509} {"train_loss": -25.726551055908203, "global_step": 291273, "epoch": 3509} {"train_loss": -25.39944839477539, "global_step": 291274, "epoch": 3509} {"train_loss": -25.817045211791992, "global_step": 291275, "epoch": 3509} {"train_loss": -25.497739791870117, "global_step": 291276, "epoch": 3509} {"train_loss": -25.36825942993164, "global_step": 291277, "epoch": 3509} {"train_loss": -25.701025009155273, "global_step": 291278, "epoch": 3509} {"train_loss": -25.7764892578125, "global_step": 291279, "epoch": 3509} {"train_loss": -25.350618362426758, "global_step": 291280, "epoch": 3509} {"train_loss": -25.707111358642578, "global_step": 291281, "epoch": 3509} {"train_loss": -25.781789779663086, "global_step": 291282, "epoch": 3509} {"train_loss": -25.485830307006836, "global_step": 291283, "epoch": 3509} {"train_loss": -25.716510772705078, "global_step": 291284, "epoch": 3509} {"train_loss": -25.57464599609375, "global_step": 291285, "epoch": 3509} {"train_loss": -25.45616912841797, "global_step": 291286, "epoch": 3509} {"train_loss": -25.521196365356445, "global_step": 291287, "epoch": 3509} {"train_loss": -25.346763610839844, "global_step": 291288, "epoch": 3509} {"train_loss": -25.799152374267578, "global_step": 291289, "epoch": 3509} {"train_loss": -25.970916748046875, "global_step": 291290, "epoch": 3509} {"train_loss": -25.110361099243164, "global_step": 291291, "epoch": 3509} {"train_loss": -25.617502212524414, "global_step": 291292, "epoch": 3509} {"train_loss": -25.89008140563965, "global_step": 291293, "epoch": 3509} {"train_loss": -25.409887313842773, "global_step": 291294, "epoch": 3509} {"train_loss": -25.6501407623291, "global_step": 291295, "epoch": 3509} {"train_loss": -25.367807388305664, "global_step": 291296, "epoch": 3509} {"train_loss": -25.530776977539062, "global_step": 291297, "epoch": 3509} {"train_loss": -25.423734664916992, "global_step": 291298, "epoch": 3509} {"train_loss": -25.64719009399414, "global_step": 291299, "epoch": 3509} {"train_loss": -25.183202743530273, "global_step": 291300, "epoch": 3509} {"train_loss": -25.93184471130371, "global_step": 291301, "epoch": 3509} {"train_loss": -25.533506393432617, "global_step": 291302, "epoch": 3509} {"train_loss": -25.362306594848633, "global_step": 291303, "epoch": 3509} {"train_loss": -25.061389923095703, "global_step": 291304, "epoch": 3509} {"train_loss": -25.254135131835938, "global_step": 291305, "epoch": 3509} {"train_loss": -25.362648010253906, "global_step": 291306, "epoch": 3509} {"train_loss": -25.189319610595703, "global_step": 291307, "epoch": 3509} {"train_loss": -25.457778930664062, "global_step": 291308, "epoch": 3509} {"train_loss": -25.578306198120117, "global_step": 291309, "epoch": 3509} {"train_loss": -25.434354782104492, "global_step": 291310, "epoch": 3509} {"train_loss": -25.516666412353516, "global_step": 291311, "epoch": 3509} {"train_loss": -25.101865768432617, "global_step": 291312, "epoch": 3509} {"train_loss": -25.460355758666992, "global_step": 291313, "epoch": 3509} {"train_loss": -25.75861167907715, "global_step": 291314, "epoch": 3509} {"train_loss": -25.471033096313477, "global_step": 291315, "epoch": 3509} {"train_loss": -25.168500900268555, "global_step": 291316, "epoch": 3509} {"train_loss": -25.538862228393555, "global_step": 291317, "epoch": 3509} {"train_loss": -25.6606502532959, "global_step": 291318, "epoch": 3509} {"train_loss": -25.499414443969727, "global_step": 291319, "epoch": 3509} {"train_loss": -25.586408615112305, "global_step": 291320, "epoch": 3509} {"train_loss": -25.951629638671875, "global_step": 291321, "epoch": 3509} {"train_loss": -25.61099624633789, "global_step": 291322, "epoch": 3509} {"train_loss": -25.446680068969727, "global_step": 291323, "epoch": 3509} {"train_loss": -25.373363494873047, "global_step": 291324, "epoch": 3509} {"train_loss": -25.21364402770996, "global_step": 291325, "epoch": 3509} {"train_loss": -25.834964752197266, "global_step": 291326, "epoch": 3509} {"train_loss": -25.134756088256836, "global_step": 291327, "epoch": 3509} {"train_loss": -25.686491012573242, "global_step": 291328, "epoch": 3509} {"train_loss": -25.450725348598986, "global_step": 291329, "epoch": 3509, "val_loss": 7389215.0} {"train_loss": -24.819995880126953, "global_step": 291330, "epoch": 3510} {"train_loss": -25.460134506225586, "global_step": 291331, "epoch": 3510} {"train_loss": -24.914400100708008, "global_step": 291332, "epoch": 3510} {"train_loss": -25.30801773071289, "global_step": 291333, "epoch": 3510} {"train_loss": -25.380075454711914, "global_step": 291334, "epoch": 3510} {"train_loss": -25.120851516723633, "global_step": 291335, "epoch": 3510} {"train_loss": -24.991365432739258, "global_step": 291336, "epoch": 3510} {"train_loss": -25.001577377319336, "global_step": 291337, "epoch": 3510} {"train_loss": -25.201431274414062, "global_step": 291338, "epoch": 3510} {"train_loss": -25.0711669921875, "global_step": 291339, "epoch": 3510} {"train_loss": -25.24470329284668, "global_step": 291340, "epoch": 3510} {"train_loss": -25.15842056274414, "global_step": 291341, "epoch": 3510} {"train_loss": -25.311691284179688, "global_step": 291342, "epoch": 3510} {"train_loss": -25.37749671936035, "global_step": 291343, "epoch": 3510} {"train_loss": -25.31717300415039, "global_step": 291344, "epoch": 3510} {"train_loss": -24.871564865112305, "global_step": 291345, "epoch": 3510} {"train_loss": -25.384042739868164, "global_step": 291346, "epoch": 3510} {"train_loss": -24.943313598632812, "global_step": 291347, "epoch": 3510} {"train_loss": -25.298303604125977, "global_step": 291348, "epoch": 3510} {"train_loss": -24.993391036987305, "global_step": 291349, "epoch": 3510} {"train_loss": -25.4053955078125, "global_step": 291350, "epoch": 3510} {"train_loss": -25.64755630493164, "global_step": 291351, "epoch": 3510} {"train_loss": -25.147985458374023, "global_step": 291352, "epoch": 3510} {"train_loss": -25.397733688354492, "global_step": 291353, "epoch": 3510} {"train_loss": -25.694547653198242, "global_step": 291354, "epoch": 3510} {"train_loss": -25.243009567260742, "global_step": 291355, "epoch": 3510} {"train_loss": -25.667051315307617, "global_step": 291356, "epoch": 3510} {"train_loss": -25.651397705078125, "global_step": 291357, "epoch": 3510} {"train_loss": -25.443029403686523, "global_step": 291358, "epoch": 3510} {"train_loss": -25.751544952392578, "global_step": 291359, "epoch": 3510} {"train_loss": -25.718738555908203, "global_step": 291360, "epoch": 3510} {"train_loss": -25.45298194885254, "global_step": 291361, "epoch": 3510} {"train_loss": -25.60697364807129, "global_step": 291362, "epoch": 3510} {"train_loss": -25.62823486328125, "global_step": 291363, "epoch": 3510} {"train_loss": -25.598779678344727, "global_step": 291364, "epoch": 3510} {"train_loss": -25.6033935546875, "global_step": 291365, "epoch": 3510} {"train_loss": -25.949594497680664, "global_step": 291366, "epoch": 3510} {"train_loss": -26.030475616455078, "global_step": 291367, "epoch": 3510} {"train_loss": -25.64784049987793, "global_step": 291368, "epoch": 3510} {"train_loss": -25.853759765625, "global_step": 291369, "epoch": 3510} {"train_loss": -25.450347900390625, "global_step": 291370, "epoch": 3510} {"train_loss": -25.578161239624023, "global_step": 291371, "epoch": 3510} {"train_loss": -25.385940551757812, "global_step": 291372, "epoch": 3510} {"train_loss": -25.512332916259766, "global_step": 291373, "epoch": 3510} {"train_loss": -25.76539421081543, "global_step": 291374, "epoch": 3510} {"train_loss": -25.569107055664062, "global_step": 291375, "epoch": 3510} {"train_loss": -25.820865631103516, "global_step": 291376, "epoch": 3510} {"train_loss": -25.393091201782227, "global_step": 291377, "epoch": 3510} {"train_loss": -25.485145568847656, "global_step": 291378, "epoch": 3510} {"train_loss": -25.49836540222168, "global_step": 291379, "epoch": 3510} {"train_loss": -26.010000228881836, "global_step": 291380, "epoch": 3510} {"train_loss": -25.427658081054688, "global_step": 291381, "epoch": 3510} {"train_loss": -25.434675216674805, "global_step": 291382, "epoch": 3510} {"train_loss": -25.521902084350586, "global_step": 291383, "epoch": 3510} {"train_loss": -25.44180679321289, "global_step": 291384, "epoch": 3510} {"train_loss": -25.6888484954834, "global_step": 291385, "epoch": 3510} {"train_loss": -24.980253219604492, "global_step": 291386, "epoch": 3510} {"train_loss": -24.843074798583984, "global_step": 291387, "epoch": 3510} {"train_loss": -25.27728271484375, "global_step": 291388, "epoch": 3510} {"train_loss": -25.18049430847168, "global_step": 291389, "epoch": 3510} {"train_loss": -25.009780883789062, "global_step": 291390, "epoch": 3510} {"train_loss": -24.791948318481445, "global_step": 291391, "epoch": 3510} {"train_loss": -25.53743553161621, "global_step": 291392, "epoch": 3510} {"train_loss": -25.054128646850586, "global_step": 291393, "epoch": 3510} {"train_loss": -25.569229125976562, "global_step": 291394, "epoch": 3510} {"train_loss": -25.303787231445312, "global_step": 291395, "epoch": 3510} {"train_loss": -25.529333114624023, "global_step": 291396, "epoch": 3510} {"train_loss": -25.60116958618164, "global_step": 291397, "epoch": 3510} {"train_loss": -25.257625579833984, "global_step": 291398, "epoch": 3510} {"train_loss": -25.65801429748535, "global_step": 291399, "epoch": 3510} {"train_loss": -25.389631271362305, "global_step": 291400, "epoch": 3510} {"train_loss": -25.390514373779297, "global_step": 291401, "epoch": 3510} {"train_loss": -25.12276268005371, "global_step": 291402, "epoch": 3510} {"train_loss": -25.441776275634766, "global_step": 291403, "epoch": 3510} {"train_loss": -25.229211807250977, "global_step": 291404, "epoch": 3510} {"train_loss": -25.347448348999023, "global_step": 291405, "epoch": 3510} {"train_loss": -25.439491271972656, "global_step": 291406, "epoch": 3510} {"train_loss": -25.49550437927246, "global_step": 291407, "epoch": 3510} {"train_loss": -25.56350326538086, "global_step": 291408, "epoch": 3510} {"train_loss": -25.387292861938477, "global_step": 291409, "epoch": 3510} {"train_loss": -25.050527572631836, "global_step": 291410, "epoch": 3510} {"train_loss": -25.570676803588867, "global_step": 291411, "epoch": 3510} {"train_loss": -25.394643209066736, "global_step": 291412, "epoch": 3510, "val_loss": 7227917.5} {"train_loss": -25.13690757751465, "global_step": 291413, "epoch": 3511} {"train_loss": -25.20191192626953, "global_step": 291414, "epoch": 3511} {"train_loss": -25.236576080322266, "global_step": 291415, "epoch": 3511} {"train_loss": -25.449384689331055, "global_step": 291416, "epoch": 3511} {"train_loss": -24.542654037475586, "global_step": 291417, "epoch": 3511} {"train_loss": -25.1793270111084, "global_step": 291418, "epoch": 3511} {"train_loss": -25.086816787719727, "global_step": 291419, "epoch": 3511} {"train_loss": -24.92333984375, "global_step": 291420, "epoch": 3511} {"train_loss": -25.462621688842773, "global_step": 291421, "epoch": 3511} {"train_loss": -25.273147583007812, "global_step": 291422, "epoch": 3511} {"train_loss": -24.94771385192871, "global_step": 291423, "epoch": 3511} {"train_loss": -25.131345748901367, "global_step": 291424, "epoch": 3511} {"train_loss": -25.447126388549805, "global_step": 291425, "epoch": 3511} {"train_loss": -25.142871856689453, "global_step": 291426, "epoch": 3511} {"train_loss": -25.151817321777344, "global_step": 291427, "epoch": 3511} {"train_loss": -25.07803726196289, "global_step": 291428, "epoch": 3511} {"train_loss": -25.417818069458008, "global_step": 291429, "epoch": 3511} {"train_loss": -25.546737670898438, "global_step": 291430, "epoch": 3511} {"train_loss": -25.40780258178711, "global_step": 291431, "epoch": 3511} {"train_loss": -25.353384017944336, "global_step": 291432, "epoch": 3511} {"train_loss": -25.462526321411133, "global_step": 291433, "epoch": 3511} {"train_loss": -25.7990779876709, "global_step": 291434, "epoch": 3511} {"train_loss": -25.107290267944336, "global_step": 291435, "epoch": 3511} {"train_loss": -25.243249893188477, "global_step": 291436, "epoch": 3511} {"train_loss": -25.459823608398438, "global_step": 291437, "epoch": 3511} {"train_loss": -25.692224502563477, "global_step": 291438, "epoch": 3511} {"train_loss": -25.795368194580078, "global_step": 291439, "epoch": 3511} {"train_loss": -25.55478858947754, "global_step": 291440, "epoch": 3511} {"train_loss": -25.593368530273438, "global_step": 291441, "epoch": 3511} {"train_loss": -25.25079917907715, "global_step": 291442, "epoch": 3511} {"train_loss": -25.574331283569336, "global_step": 291443, "epoch": 3511} {"train_loss": -25.398910522460938, "global_step": 291444, "epoch": 3511} {"train_loss": -25.631927490234375, "global_step": 291445, "epoch": 3511} {"train_loss": -25.99993896484375, "global_step": 291446, "epoch": 3511} {"train_loss": -25.079004287719727, "global_step": 291447, "epoch": 3511} {"train_loss": -25.532115936279297, "global_step": 291448, "epoch": 3511} {"train_loss": -25.503114700317383, "global_step": 291449, "epoch": 3511} {"train_loss": -25.8746280670166, "global_step": 291450, "epoch": 3511} {"train_loss": -25.48893928527832, "global_step": 291451, "epoch": 3511} {"train_loss": -25.856082916259766, "global_step": 291452, "epoch": 3511} {"train_loss": -25.42120361328125, "global_step": 291453, "epoch": 3511} {"train_loss": -25.582595825195312, "global_step": 291454, "epoch": 3511} {"train_loss": -25.566120147705078, "global_step": 291455, "epoch": 3511} {"train_loss": -25.67176628112793, "global_step": 291456, "epoch": 3511} {"train_loss": -25.812421798706055, "global_step": 291457, "epoch": 3511} {"train_loss": -25.46742820739746, "global_step": 291458, "epoch": 3511} {"train_loss": -25.81878662109375, "global_step": 291459, "epoch": 3511} {"train_loss": -25.777570724487305, "global_step": 291460, "epoch": 3511} {"train_loss": -25.387113571166992, "global_step": 291461, "epoch": 3511} {"train_loss": -25.8303165435791, "global_step": 291462, "epoch": 3511} {"train_loss": -25.579421997070312, "global_step": 291463, "epoch": 3511} {"train_loss": -25.77129554748535, "global_step": 291464, "epoch": 3511} {"train_loss": -25.552841186523438, "global_step": 291465, "epoch": 3511} {"train_loss": -25.534255981445312, "global_step": 291466, "epoch": 3511} {"train_loss": -25.79275894165039, "global_step": 291467, "epoch": 3511} {"train_loss": -25.543323516845703, "global_step": 291468, "epoch": 3511} {"train_loss": -25.863574981689453, "global_step": 291469, "epoch": 3511} {"train_loss": -25.58506202697754, "global_step": 291470, "epoch": 3511} {"train_loss": -24.97794532775879, "global_step": 291471, "epoch": 3511} {"train_loss": -25.15890121459961, "global_step": 291472, "epoch": 3511} {"train_loss": -25.302169799804688, "global_step": 291473, "epoch": 3511} {"train_loss": -25.365802764892578, "global_step": 291474, "epoch": 3511} {"train_loss": -25.29722785949707, "global_step": 291475, "epoch": 3511} {"train_loss": -25.6058406829834, "global_step": 291476, "epoch": 3511} {"train_loss": -25.521326065063477, "global_step": 291477, "epoch": 3511} {"train_loss": -25.6343994140625, "global_step": 291478, "epoch": 3511} {"train_loss": -25.074588775634766, "global_step": 291479, "epoch": 3511} {"train_loss": -25.796945571899414, "global_step": 291480, "epoch": 3511} {"train_loss": -25.45787811279297, "global_step": 291481, "epoch": 3511} {"train_loss": -26.035755157470703, "global_step": 291482, "epoch": 3511} {"train_loss": -25.64881706237793, "global_step": 291483, "epoch": 3511} {"train_loss": -25.532861709594727, "global_step": 291484, "epoch": 3511} {"train_loss": -25.402341842651367, "global_step": 291485, "epoch": 3511} {"train_loss": -25.40225601196289, "global_step": 291486, "epoch": 3511} {"train_loss": -25.626550674438477, "global_step": 291487, "epoch": 3511} {"train_loss": -25.45069694519043, "global_step": 291488, "epoch": 3511} {"train_loss": -25.534536361694336, "global_step": 291489, "epoch": 3511} {"train_loss": -25.49354362487793, "global_step": 291490, "epoch": 3511} {"train_loss": -25.6707820892334, "global_step": 291491, "epoch": 3511} {"train_loss": -25.42415428161621, "global_step": 291492, "epoch": 3511} {"train_loss": -25.261587142944336, "global_step": 291493, "epoch": 3511} {"train_loss": -25.683584213256836, "global_step": 291494, "epoch": 3511} {"train_loss": -25.45681296199201, "global_step": 291495, "epoch": 3511, "val_loss": 7176374.0} {"train_loss": -25.3603458404541, "global_step": 291496, "epoch": 3512} {"train_loss": -25.700397491455078, "global_step": 291497, "epoch": 3512} {"train_loss": -25.301183700561523, "global_step": 291498, "epoch": 3512} {"train_loss": -25.43121910095215, "global_step": 291499, "epoch": 3512} {"train_loss": -25.71673011779785, "global_step": 291500, "epoch": 3512} {"train_loss": -25.081857681274414, "global_step": 291501, "epoch": 3512} {"train_loss": -25.32718849182129, "global_step": 291502, "epoch": 3512} {"train_loss": -25.460580825805664, "global_step": 291503, "epoch": 3512} {"train_loss": -25.489147186279297, "global_step": 291504, "epoch": 3512} {"train_loss": -25.404850006103516, "global_step": 291505, "epoch": 3512} {"train_loss": -25.221649169921875, "global_step": 291506, "epoch": 3512} {"train_loss": -25.328657150268555, "global_step": 291507, "epoch": 3512} {"train_loss": -25.063968658447266, "global_step": 291508, "epoch": 3512} {"train_loss": -25.313339233398438, "global_step": 291509, "epoch": 3512} {"train_loss": -25.15324592590332, "global_step": 291510, "epoch": 3512} {"train_loss": -25.072839736938477, "global_step": 291511, "epoch": 3512} {"train_loss": -25.59561538696289, "global_step": 291512, "epoch": 3512} {"train_loss": -25.330059051513672, "global_step": 291513, "epoch": 3512} {"train_loss": -25.590993881225586, "global_step": 291514, "epoch": 3512} {"train_loss": -25.712018966674805, "global_step": 291515, "epoch": 3512} {"train_loss": -25.770959854125977, "global_step": 291516, "epoch": 3512} {"train_loss": -25.676044464111328, "global_step": 291517, "epoch": 3512} {"train_loss": -25.475982666015625, "global_step": 291518, "epoch": 3512} {"train_loss": -25.62428855895996, "global_step": 291519, "epoch": 3512} {"train_loss": -26.1854248046875, "global_step": 291520, "epoch": 3512} {"train_loss": -25.518415451049805, "global_step": 291521, "epoch": 3512} {"train_loss": -25.41047477722168, "global_step": 291522, "epoch": 3512} {"train_loss": -26.02107048034668, "global_step": 291523, "epoch": 3512} {"train_loss": -25.70057487487793, "global_step": 291524, "epoch": 3512} {"train_loss": -25.785125732421875, "global_step": 291525, "epoch": 3512} {"train_loss": -25.807912826538086, "global_step": 291526, "epoch": 3512} {"train_loss": -25.7088565826416, "global_step": 291527, "epoch": 3512} {"train_loss": -25.906421661376953, "global_step": 291528, "epoch": 3512} {"train_loss": -25.378416061401367, "global_step": 291529, "epoch": 3512} {"train_loss": -25.705121994018555, "global_step": 291530, "epoch": 3512} {"train_loss": -25.3955020904541, "global_step": 291531, "epoch": 3512} {"train_loss": -25.484655380249023, "global_step": 291532, "epoch": 3512} {"train_loss": -25.453359603881836, "global_step": 291533, "epoch": 3512} {"train_loss": -25.623388290405273, "global_step": 291534, "epoch": 3512} {"train_loss": -25.574111938476562, "global_step": 291535, "epoch": 3512} {"train_loss": -25.291461944580078, "global_step": 291536, "epoch": 3512} {"train_loss": -25.23683738708496, "global_step": 291537, "epoch": 3512} {"train_loss": -25.448694229125977, "global_step": 291538, "epoch": 3512} {"train_loss": -25.91200065612793, "global_step": 291539, "epoch": 3512} {"train_loss": -25.73858070373535, "global_step": 291540, "epoch": 3512} {"train_loss": -25.64912986755371, "global_step": 291541, "epoch": 3512} {"train_loss": -25.76173210144043, "global_step": 291542, "epoch": 3512} {"train_loss": -25.585927963256836, "global_step": 291543, "epoch": 3512} {"train_loss": -25.276233673095703, "global_step": 291544, "epoch": 3512} {"train_loss": -25.72901725769043, "global_step": 291545, "epoch": 3512} {"train_loss": -25.5821475982666, "global_step": 291546, "epoch": 3512} {"train_loss": -25.279836654663086, "global_step": 291547, "epoch": 3512} {"train_loss": -25.8944034576416, "global_step": 291548, "epoch": 3512} {"train_loss": -25.47421646118164, "global_step": 291549, "epoch": 3512} {"train_loss": -25.1148624420166, "global_step": 291550, "epoch": 3512} {"train_loss": -25.447614669799805, "global_step": 291551, "epoch": 3512} {"train_loss": -25.62350845336914, "global_step": 291552, "epoch": 3512} {"train_loss": -25.734228134155273, "global_step": 291553, "epoch": 3512} {"train_loss": -25.839496612548828, "global_step": 291554, "epoch": 3512} {"train_loss": -26.0093994140625, "global_step": 291555, "epoch": 3512} {"train_loss": -25.44659996032715, "global_step": 291556, "epoch": 3512} {"train_loss": -25.782926559448242, "global_step": 291557, "epoch": 3512} {"train_loss": -25.52281951904297, "global_step": 291558, "epoch": 3512} {"train_loss": -25.35263442993164, "global_step": 291559, "epoch": 3512} {"train_loss": -25.789106369018555, "global_step": 291560, "epoch": 3512} {"train_loss": -25.871877670288086, "global_step": 291561, "epoch": 3512} {"train_loss": -25.4064998626709, "global_step": 291562, "epoch": 3512} {"train_loss": -25.312694549560547, "global_step": 291563, "epoch": 3512} {"train_loss": -25.307138442993164, "global_step": 291564, "epoch": 3512} {"train_loss": -25.476285934448242, "global_step": 291565, "epoch": 3512} {"train_loss": -25.410860061645508, "global_step": 291566, "epoch": 3512} {"train_loss": -25.12906837463379, "global_step": 291567, "epoch": 3512} {"train_loss": -26.05207633972168, "global_step": 291568, "epoch": 3512} {"train_loss": -25.477834701538086, "global_step": 291569, "epoch": 3512} {"train_loss": -25.76715660095215, "global_step": 291570, "epoch": 3512} {"train_loss": -25.479724884033203, "global_step": 291571, "epoch": 3512} {"train_loss": -25.38931655883789, "global_step": 291572, "epoch": 3512} {"train_loss": -25.4397029876709, "global_step": 291573, "epoch": 3512} {"train_loss": -25.731475830078125, "global_step": 291574, "epoch": 3512} {"train_loss": -25.51327896118164, "global_step": 291575, "epoch": 3512} {"train_loss": -25.864734649658203, "global_step": 291576, "epoch": 3512} {"train_loss": -25.672677993774414, "global_step": 291577, "epoch": 3512} {"train_loss": -25.557650117989045, "global_step": 291578, "epoch": 3512, "val_loss": 7029755.0} {"train_loss": -23.937509536743164, "global_step": 291579, "epoch": 3513} {"train_loss": -24.50663948059082, "global_step": 291580, "epoch": 3513} {"train_loss": -25.218692779541016, "global_step": 291581, "epoch": 3513} {"train_loss": -24.0012264251709, "global_step": 291582, "epoch": 3513} {"train_loss": -25.247459411621094, "global_step": 291583, "epoch": 3513} {"train_loss": -24.671390533447266, "global_step": 291584, "epoch": 3513} {"train_loss": -24.848114013671875, "global_step": 291585, "epoch": 3513} {"train_loss": -24.9171085357666, "global_step": 291586, "epoch": 3513} {"train_loss": -24.9532470703125, "global_step": 291587, "epoch": 3513} {"train_loss": -24.645122528076172, "global_step": 291588, "epoch": 3513} {"train_loss": -24.958799362182617, "global_step": 291589, "epoch": 3513} {"train_loss": -24.896743774414062, "global_step": 291590, "epoch": 3513} {"train_loss": -25.222043991088867, "global_step": 291591, "epoch": 3513} {"train_loss": -25.1302490234375, "global_step": 291592, "epoch": 3513} {"train_loss": -25.291751861572266, "global_step": 291593, "epoch": 3513} {"train_loss": -25.207674026489258, "global_step": 291594, "epoch": 3513} {"train_loss": -25.167373657226562, "global_step": 291595, "epoch": 3513} {"train_loss": -25.65925407409668, "global_step": 291596, "epoch": 3513} {"train_loss": -25.006452560424805, "global_step": 291597, "epoch": 3513} {"train_loss": -25.254308700561523, "global_step": 291598, "epoch": 3513} {"train_loss": -25.26412582397461, "global_step": 291599, "epoch": 3513} {"train_loss": -25.195804595947266, "global_step": 291600, "epoch": 3513} {"train_loss": -24.947776794433594, "global_step": 291601, "epoch": 3513} {"train_loss": -24.89887809753418, "global_step": 291602, "epoch": 3513} {"train_loss": -25.482345581054688, "global_step": 291603, "epoch": 3513} {"train_loss": -25.527957916259766, "global_step": 291604, "epoch": 3513} {"train_loss": -25.237064361572266, "global_step": 291605, "epoch": 3513} {"train_loss": -25.3468074798584, "global_step": 291606, "epoch": 3513} {"train_loss": -25.38517951965332, "global_step": 291607, "epoch": 3513} {"train_loss": -25.122974395751953, "global_step": 291608, "epoch": 3513} {"train_loss": -25.377685546875, "global_step": 291609, "epoch": 3513} {"train_loss": -25.15755271911621, "global_step": 291610, "epoch": 3513} {"train_loss": -25.373010635375977, "global_step": 291611, "epoch": 3513} {"train_loss": -25.524152755737305, "global_step": 291612, "epoch": 3513} {"train_loss": -25.67279624938965, "global_step": 291613, "epoch": 3513} {"train_loss": -25.77762222290039, "global_step": 291614, "epoch": 3513} {"train_loss": -25.204668045043945, "global_step": 291615, "epoch": 3513} {"train_loss": -25.020977020263672, "global_step": 291616, "epoch": 3513} {"train_loss": -25.238178253173828, "global_step": 291617, "epoch": 3513} {"train_loss": -25.659072875976562, "global_step": 291618, "epoch": 3513} {"train_loss": -25.47562026977539, "global_step": 291619, "epoch": 3513} {"train_loss": -25.55816078186035, "global_step": 291620, "epoch": 3513} {"train_loss": -25.463258743286133, "global_step": 291621, "epoch": 3513} {"train_loss": -25.466567993164062, "global_step": 291622, "epoch": 3513} {"train_loss": -25.607257843017578, "global_step": 291623, "epoch": 3513} {"train_loss": -25.445579528808594, "global_step": 291624, "epoch": 3513} {"train_loss": -25.793170928955078, "global_step": 291625, "epoch": 3513} {"train_loss": -25.409250259399414, "global_step": 291626, "epoch": 3513} {"train_loss": -25.55516242980957, "global_step": 291627, "epoch": 3513} {"train_loss": -26.05398941040039, "global_step": 291628, "epoch": 3513} {"train_loss": -25.753070831298828, "global_step": 291629, "epoch": 3513} {"train_loss": -25.66267204284668, "global_step": 291630, "epoch": 3513} {"train_loss": -25.45547866821289, "global_step": 291631, "epoch": 3513} {"train_loss": -25.716306686401367, "global_step": 291632, "epoch": 3513} {"train_loss": -25.559646606445312, "global_step": 291633, "epoch": 3513} {"train_loss": -25.194747924804688, "global_step": 291634, "epoch": 3513} {"train_loss": -25.556798934936523, "global_step": 291635, "epoch": 3513} {"train_loss": -25.44853401184082, "global_step": 291636, "epoch": 3513} {"train_loss": -25.414196014404297, "global_step": 291637, "epoch": 3513} {"train_loss": -25.62774658203125, "global_step": 291638, "epoch": 3513} {"train_loss": -25.359251022338867, "global_step": 291639, "epoch": 3513} {"train_loss": -25.61410903930664, "global_step": 291640, "epoch": 3513} {"train_loss": -25.683115005493164, "global_step": 291641, "epoch": 3513} {"train_loss": -25.741056442260742, "global_step": 291642, "epoch": 3513} {"train_loss": -25.646093368530273, "global_step": 291643, "epoch": 3513} {"train_loss": -25.443185806274414, "global_step": 291644, "epoch": 3513} {"train_loss": -25.188217163085938, "global_step": 291645, "epoch": 3513} {"train_loss": -25.11531639099121, "global_step": 291646, "epoch": 3513} {"train_loss": -25.36215591430664, "global_step": 291647, "epoch": 3513} {"train_loss": -26.004180908203125, "global_step": 291648, "epoch": 3513} {"train_loss": -25.51711082458496, "global_step": 291649, "epoch": 3513} {"train_loss": -25.69964027404785, "global_step": 291650, "epoch": 3513} {"train_loss": -25.825794219970703, "global_step": 291651, "epoch": 3513} {"train_loss": -25.543195724487305, "global_step": 291652, "epoch": 3513} {"train_loss": -25.4691104888916, "global_step": 291653, "epoch": 3513} {"train_loss": -25.627643585205078, "global_step": 291654, "epoch": 3513} {"train_loss": -25.91655921936035, "global_step": 291655, "epoch": 3513} {"train_loss": -25.57147789001465, "global_step": 291656, "epoch": 3513} {"train_loss": -25.38486099243164, "global_step": 291657, "epoch": 3513} {"train_loss": -25.54123878479004, "global_step": 291658, "epoch": 3513} {"train_loss": -25.707372665405273, "global_step": 291659, "epoch": 3513} {"train_loss": -25.775251388549805, "global_step": 291660, "epoch": 3513} {"train_loss": -25.373036579913403, "global_step": 291661, "epoch": 3513, "val_loss": 7071990.0} {"train_loss": -25.10023307800293, "global_step": 291662, "epoch": 3514} {"train_loss": -25.141386032104492, "global_step": 291663, "epoch": 3514} {"train_loss": -25.02931022644043, "global_step": 291664, "epoch": 3514} {"train_loss": -24.721410751342773, "global_step": 291665, "epoch": 3514} {"train_loss": -25.251222610473633, "global_step": 291666, "epoch": 3514} {"train_loss": -24.631925582885742, "global_step": 291667, "epoch": 3514} {"train_loss": -25.03037452697754, "global_step": 291668, "epoch": 3514} {"train_loss": -25.184091567993164, "global_step": 291669, "epoch": 3514} {"train_loss": -24.755245208740234, "global_step": 291670, "epoch": 3514} {"train_loss": -25.160449981689453, "global_step": 291671, "epoch": 3514} {"train_loss": -24.808012008666992, "global_step": 291672, "epoch": 3514} {"train_loss": -25.07915496826172, "global_step": 291673, "epoch": 3514} {"train_loss": -25.29691505432129, "global_step": 291674, "epoch": 3514} {"train_loss": -25.344650268554688, "global_step": 291675, "epoch": 3514} {"train_loss": -25.332223892211914, "global_step": 291676, "epoch": 3514} {"train_loss": -25.27699851989746, "global_step": 291677, "epoch": 3514} {"train_loss": -25.5111083984375, "global_step": 291678, "epoch": 3514} {"train_loss": -25.14192008972168, "global_step": 291679, "epoch": 3514} {"train_loss": -25.203393936157227, "global_step": 291680, "epoch": 3514} {"train_loss": -25.24721336364746, "global_step": 291681, "epoch": 3514} {"train_loss": -25.19169044494629, "global_step": 291682, "epoch": 3514} {"train_loss": -25.267953872680664, "global_step": 291683, "epoch": 3514} {"train_loss": -25.084665298461914, "global_step": 291684, "epoch": 3514} {"train_loss": -25.2846736907959, "global_step": 291685, "epoch": 3514} {"train_loss": -25.481826782226562, "global_step": 291686, "epoch": 3514} {"train_loss": -25.522096633911133, "global_step": 291687, "epoch": 3514} {"train_loss": -25.576522827148438, "global_step": 291688, "epoch": 3514} {"train_loss": -25.552295684814453, "global_step": 291689, "epoch": 3514} {"train_loss": -25.419605255126953, "global_step": 291690, "epoch": 3514} {"train_loss": -25.38396644592285, "global_step": 291691, "epoch": 3514} {"train_loss": -25.762378692626953, "global_step": 291692, "epoch": 3514} {"train_loss": -25.77033805847168, "global_step": 291693, "epoch": 3514} {"train_loss": -25.57257080078125, "global_step": 291694, "epoch": 3514} {"train_loss": -25.155061721801758, "global_step": 291695, "epoch": 3514} {"train_loss": -25.691925048828125, "global_step": 291696, "epoch": 3514} {"train_loss": -25.47829246520996, "global_step": 291697, "epoch": 3514} {"train_loss": -25.126888275146484, "global_step": 291698, "epoch": 3514} {"train_loss": -25.576086044311523, "global_step": 291699, "epoch": 3514} {"train_loss": -25.493009567260742, "global_step": 291700, "epoch": 3514} {"train_loss": -25.624364852905273, "global_step": 291701, "epoch": 3514} {"train_loss": -25.490219116210938, "global_step": 291702, "epoch": 3514} {"train_loss": -25.850000381469727, "global_step": 291703, "epoch": 3514} {"train_loss": -26.085987091064453, "global_step": 291704, "epoch": 3514} {"train_loss": -26.00398063659668, "global_step": 291705, "epoch": 3514} {"train_loss": -25.88492202758789, "global_step": 291706, "epoch": 3514} {"train_loss": -25.74810791015625, "global_step": 291707, "epoch": 3514} {"train_loss": -25.842756271362305, "global_step": 291708, "epoch": 3514} {"train_loss": -25.931711196899414, "global_step": 291709, "epoch": 3514} {"train_loss": -25.834314346313477, "global_step": 291710, "epoch": 3514} {"train_loss": -25.644668579101562, "global_step": 291711, "epoch": 3514} {"train_loss": -25.6676082611084, "global_step": 291712, "epoch": 3514} {"train_loss": -26.024433135986328, "global_step": 291713, "epoch": 3514} {"train_loss": -26.269941329956055, "global_step": 291714, "epoch": 3514} {"train_loss": -25.501277923583984, "global_step": 291715, "epoch": 3514} {"train_loss": -25.9135684967041, "global_step": 291716, "epoch": 3514} {"train_loss": -25.906232833862305, "global_step": 291717, "epoch": 3514} {"train_loss": -25.457014083862305, "global_step": 291718, "epoch": 3514} {"train_loss": -25.792755126953125, "global_step": 291719, "epoch": 3514} {"train_loss": -25.567792892456055, "global_step": 291720, "epoch": 3514} {"train_loss": -26.096023559570312, "global_step": 291721, "epoch": 3514} {"train_loss": -25.58980941772461, "global_step": 291722, "epoch": 3514} {"train_loss": -25.505496978759766, "global_step": 291723, "epoch": 3514} {"train_loss": -25.62507438659668, "global_step": 291724, "epoch": 3514} {"train_loss": -25.380172729492188, "global_step": 291725, "epoch": 3514} {"train_loss": -25.542524337768555, "global_step": 291726, "epoch": 3514} {"train_loss": -25.55812644958496, "global_step": 291727, "epoch": 3514} {"train_loss": -25.581707000732422, "global_step": 291728, "epoch": 3514} {"train_loss": -25.780475616455078, "global_step": 291729, "epoch": 3514} {"train_loss": -25.3717098236084, "global_step": 291730, "epoch": 3514} {"train_loss": -25.165760040283203, "global_step": 291731, "epoch": 3514} {"train_loss": -25.138620376586914, "global_step": 291732, "epoch": 3514} {"train_loss": -25.277923583984375, "global_step": 291733, "epoch": 3514} {"train_loss": -25.552143096923828, "global_step": 291734, "epoch": 3514} {"train_loss": -25.76458740234375, "global_step": 291735, "epoch": 3514} {"train_loss": -25.215608596801758, "global_step": 291736, "epoch": 3514} {"train_loss": -25.64361572265625, "global_step": 291737, "epoch": 3514} {"train_loss": -25.823461532592773, "global_step": 291738, "epoch": 3514} {"train_loss": -25.15679359436035, "global_step": 291739, "epoch": 3514} {"train_loss": -25.75538444519043, "global_step": 291740, "epoch": 3514} {"train_loss": -25.44756317138672, "global_step": 291741, "epoch": 3514} {"train_loss": -25.07630729675293, "global_step": 291742, "epoch": 3514} {"train_loss": -25.663488388061523, "global_step": 291743, "epoch": 3514} {"train_loss": -25.461395286651978, "global_step": 291744, "epoch": 3514, "val_loss": 7164257.0} {"train_loss": -25.210477828979492, "global_step": 291745, "epoch": 3515} {"train_loss": -24.47696876525879, "global_step": 291746, "epoch": 3515} {"train_loss": -25.519506454467773, "global_step": 291747, "epoch": 3515} {"train_loss": -24.813627243041992, "global_step": 291748, "epoch": 3515} {"train_loss": -25.195037841796875, "global_step": 291749, "epoch": 3515} {"train_loss": -24.90586280822754, "global_step": 291750, "epoch": 3515} {"train_loss": -25.05506706237793, "global_step": 291751, "epoch": 3515} {"train_loss": -25.05344009399414, "global_step": 291752, "epoch": 3515} {"train_loss": -25.288990020751953, "global_step": 291753, "epoch": 3515} {"train_loss": -24.94672203063965, "global_step": 291754, "epoch": 3515} {"train_loss": -25.342609405517578, "global_step": 291755, "epoch": 3515} {"train_loss": -24.79205894470215, "global_step": 291756, "epoch": 3515} {"train_loss": -25.48140525817871, "global_step": 291757, "epoch": 3515} {"train_loss": -25.332136154174805, "global_step": 291758, "epoch": 3515} {"train_loss": -25.197389602661133, "global_step": 291759, "epoch": 3515} {"train_loss": -25.215539932250977, "global_step": 291760, "epoch": 3515} {"train_loss": -25.30463981628418, "global_step": 291761, "epoch": 3515} {"train_loss": -25.287885665893555, "global_step": 291762, "epoch": 3515} {"train_loss": -25.42206382751465, "global_step": 291763, "epoch": 3515} {"train_loss": -25.681140899658203, "global_step": 291764, "epoch": 3515} {"train_loss": -25.567707061767578, "global_step": 291765, "epoch": 3515} {"train_loss": -25.3873291015625, "global_step": 291766, "epoch": 3515} {"train_loss": -25.631732940673828, "global_step": 291767, "epoch": 3515} {"train_loss": -25.71671485900879, "global_step": 291768, "epoch": 3515} {"train_loss": -25.232166290283203, "global_step": 291769, "epoch": 3515} {"train_loss": -25.34598731994629, "global_step": 291770, "epoch": 3515} {"train_loss": -25.54666519165039, "global_step": 291771, "epoch": 3515} {"train_loss": -25.536779403686523, "global_step": 291772, "epoch": 3515} {"train_loss": -25.307769775390625, "global_step": 291773, "epoch": 3515} {"train_loss": -25.64973258972168, "global_step": 291774, "epoch": 3515} {"train_loss": -25.8852481842041, "global_step": 291775, "epoch": 3515} {"train_loss": -25.67936134338379, "global_step": 291776, "epoch": 3515} {"train_loss": -25.566387176513672, "global_step": 291777, "epoch": 3515} {"train_loss": -25.488256454467773, "global_step": 291778, "epoch": 3515} {"train_loss": -25.192960739135742, "global_step": 291779, "epoch": 3515} {"train_loss": -25.560081481933594, "global_step": 291780, "epoch": 3515} {"train_loss": -25.602359771728516, "global_step": 291781, "epoch": 3515} {"train_loss": -25.298681259155273, "global_step": 291782, "epoch": 3515} {"train_loss": -25.336715698242188, "global_step": 291783, "epoch": 3515} {"train_loss": -25.444406509399414, "global_step": 291784, "epoch": 3515} {"train_loss": -25.73504638671875, "global_step": 291785, "epoch": 3515} {"train_loss": -25.174604415893555, "global_step": 291786, "epoch": 3515} {"train_loss": -25.28592872619629, "global_step": 291787, "epoch": 3515} {"train_loss": -25.414560317993164, "global_step": 291788, "epoch": 3515} {"train_loss": -25.416990280151367, "global_step": 291789, "epoch": 3515} {"train_loss": -25.472461700439453, "global_step": 291790, "epoch": 3515} {"train_loss": -25.2720890045166, "global_step": 291791, "epoch": 3515} {"train_loss": -25.277158737182617, "global_step": 291792, "epoch": 3515} {"train_loss": -25.052000045776367, "global_step": 291793, "epoch": 3515} {"train_loss": -25.464391708374023, "global_step": 291794, "epoch": 3515} {"train_loss": -25.60282325744629, "global_step": 291795, "epoch": 3515} {"train_loss": -25.328168869018555, "global_step": 291796, "epoch": 3515} {"train_loss": -25.305068969726562, "global_step": 291797, "epoch": 3515} {"train_loss": -25.24332046508789, "global_step": 291798, "epoch": 3515} {"train_loss": -25.553930282592773, "global_step": 291799, "epoch": 3515} {"train_loss": -25.35888671875, "global_step": 291800, "epoch": 3515} {"train_loss": -25.693450927734375, "global_step": 291801, "epoch": 3515} {"train_loss": -25.262893676757812, "global_step": 291802, "epoch": 3515} {"train_loss": -25.4344482421875, "global_step": 291803, "epoch": 3515} {"train_loss": -25.705137252807617, "global_step": 291804, "epoch": 3515} {"train_loss": -25.66596031188965, "global_step": 291805, "epoch": 3515} {"train_loss": -25.512121200561523, "global_step": 291806, "epoch": 3515} {"train_loss": -25.882709503173828, "global_step": 291807, "epoch": 3515} {"train_loss": -25.334985733032227, "global_step": 291808, "epoch": 3515} {"train_loss": -25.442363739013672, "global_step": 291809, "epoch": 3515} {"train_loss": -25.5714168548584, "global_step": 291810, "epoch": 3515} {"train_loss": -25.50506591796875, "global_step": 291811, "epoch": 3515} {"train_loss": -25.49989891052246, "global_step": 291812, "epoch": 3515} {"train_loss": -25.70159912109375, "global_step": 291813, "epoch": 3515} {"train_loss": -25.534656524658203, "global_step": 291814, "epoch": 3515} {"train_loss": -25.697601318359375, "global_step": 291815, "epoch": 3515} {"train_loss": -25.497318267822266, "global_step": 291816, "epoch": 3515} {"train_loss": -25.585988998413086, "global_step": 291817, "epoch": 3515} {"train_loss": -25.75689125061035, "global_step": 291818, "epoch": 3515} {"train_loss": -25.549131393432617, "global_step": 291819, "epoch": 3515} {"train_loss": -25.495040893554688, "global_step": 291820, "epoch": 3515} {"train_loss": -25.6077938079834, "global_step": 291821, "epoch": 3515} {"train_loss": -25.85235595703125, "global_step": 291822, "epoch": 3515} {"train_loss": -25.278512954711914, "global_step": 291823, "epoch": 3515} {"train_loss": -24.91678810119629, "global_step": 291824, "epoch": 3515} {"train_loss": -25.051353454589844, "global_step": 291825, "epoch": 3515} {"train_loss": -25.137449264526367, "global_step": 291826, "epoch": 3515} {"train_loss": -25.372941511223114, "global_step": 291827, "epoch": 3515, "val_loss": 7189494.5} {"train_loss": -24.727645874023438, "global_step": 291828, "epoch": 3516} {"train_loss": -25.112058639526367, "global_step": 291829, "epoch": 3516} {"train_loss": -25.04610252380371, "global_step": 291830, "epoch": 3516} {"train_loss": -24.929683685302734, "global_step": 291831, "epoch": 3516} {"train_loss": -24.7424259185791, "global_step": 291832, "epoch": 3516} {"train_loss": -24.941997528076172, "global_step": 291833, "epoch": 3516} {"train_loss": -25.318923950195312, "global_step": 291834, "epoch": 3516} {"train_loss": -25.104026794433594, "global_step": 291835, "epoch": 3516} {"train_loss": -25.06589698791504, "global_step": 291836, "epoch": 3516} {"train_loss": -24.754758834838867, "global_step": 291837, "epoch": 3516} {"train_loss": -25.323678970336914, "global_step": 291838, "epoch": 3516} {"train_loss": -25.256479263305664, "global_step": 291839, "epoch": 3516} {"train_loss": -25.35694694519043, "global_step": 291840, "epoch": 3516} {"train_loss": -25.61024284362793, "global_step": 291841, "epoch": 3516} {"train_loss": -25.05126953125, "global_step": 291842, "epoch": 3516} {"train_loss": -25.491233825683594, "global_step": 291843, "epoch": 3516} {"train_loss": -25.22478675842285, "global_step": 291844, "epoch": 3516} {"train_loss": -25.094181060791016, "global_step": 291845, "epoch": 3516} {"train_loss": -25.746973037719727, "global_step": 291846, "epoch": 3516} {"train_loss": -25.01753807067871, "global_step": 291847, "epoch": 3516} {"train_loss": -25.660314559936523, "global_step": 291848, "epoch": 3516} {"train_loss": -24.997875213623047, "global_step": 291849, "epoch": 3516} {"train_loss": -25.14212417602539, "global_step": 291850, "epoch": 3516} {"train_loss": -25.440793991088867, "global_step": 291851, "epoch": 3516} {"train_loss": -25.42852210998535, "global_step": 291852, "epoch": 3516} {"train_loss": -25.532052993774414, "global_step": 291853, "epoch": 3516} {"train_loss": -25.604833602905273, "global_step": 291854, "epoch": 3516} {"train_loss": -25.384475708007812, "global_step": 291855, "epoch": 3516} {"train_loss": -25.339263916015625, "global_step": 291856, "epoch": 3516} {"train_loss": -25.164880752563477, "global_step": 291857, "epoch": 3516} {"train_loss": -25.216506958007812, "global_step": 291858, "epoch": 3516} {"train_loss": -25.590091705322266, "global_step": 291859, "epoch": 3516} {"train_loss": -25.495147705078125, "global_step": 291860, "epoch": 3516} {"train_loss": -25.33314323425293, "global_step": 291861, "epoch": 3516} {"train_loss": -25.936792373657227, "global_step": 291862, "epoch": 3516} {"train_loss": -25.265207290649414, "global_step": 291863, "epoch": 3516} {"train_loss": -25.520071029663086, "global_step": 291864, "epoch": 3516} {"train_loss": -25.939544677734375, "global_step": 291865, "epoch": 3516} {"train_loss": -25.07721519470215, "global_step": 291866, "epoch": 3516} {"train_loss": -25.4211368560791, "global_step": 291867, "epoch": 3516} {"train_loss": -25.315784454345703, "global_step": 291868, "epoch": 3516} {"train_loss": -25.24210548400879, "global_step": 291869, "epoch": 3516} {"train_loss": -25.378192901611328, "global_step": 291870, "epoch": 3516} {"train_loss": -25.859540939331055, "global_step": 291871, "epoch": 3516} {"train_loss": -25.77607536315918, "global_step": 291872, "epoch": 3516} {"train_loss": -25.589643478393555, "global_step": 291873, "epoch": 3516} {"train_loss": -25.2672061920166, "global_step": 291874, "epoch": 3516} {"train_loss": -25.51871681213379, "global_step": 291875, "epoch": 3516} {"train_loss": -25.540937423706055, "global_step": 291876, "epoch": 3516} {"train_loss": -25.48990249633789, "global_step": 291877, "epoch": 3516} {"train_loss": -25.730731964111328, "global_step": 291878, "epoch": 3516} {"train_loss": -25.89228630065918, "global_step": 291879, "epoch": 3516} {"train_loss": -25.33488655090332, "global_step": 291880, "epoch": 3516} {"train_loss": -25.95757484436035, "global_step": 291881, "epoch": 3516} {"train_loss": -25.6917667388916, "global_step": 291882, "epoch": 3516} {"train_loss": -25.67594337463379, "global_step": 291883, "epoch": 3516} {"train_loss": -25.47096824645996, "global_step": 291884, "epoch": 3516} {"train_loss": -25.72406578063965, "global_step": 291885, "epoch": 3516} {"train_loss": -25.736053466796875, "global_step": 291886, "epoch": 3516} {"train_loss": -25.16899299621582, "global_step": 291887, "epoch": 3516} {"train_loss": -25.745885848999023, "global_step": 291888, "epoch": 3516} {"train_loss": -25.652603149414062, "global_step": 291889, "epoch": 3516} {"train_loss": -25.518644332885742, "global_step": 291890, "epoch": 3516} {"train_loss": -25.7065372467041, "global_step": 291891, "epoch": 3516} {"train_loss": -25.59478759765625, "global_step": 291892, "epoch": 3516} {"train_loss": -25.56227684020996, "global_step": 291893, "epoch": 3516} {"train_loss": -25.943302154541016, "global_step": 291894, "epoch": 3516} {"train_loss": -25.317028045654297, "global_step": 291895, "epoch": 3516} {"train_loss": -26.041288375854492, "global_step": 291896, "epoch": 3516} {"train_loss": -25.796613693237305, "global_step": 291897, "epoch": 3516} {"train_loss": -25.77886390686035, "global_step": 291898, "epoch": 3516} {"train_loss": -25.518035888671875, "global_step": 291899, "epoch": 3516} {"train_loss": -25.78949546813965, "global_step": 291900, "epoch": 3516} {"train_loss": -26.0245418548584, "global_step": 291901, "epoch": 3516} {"train_loss": -25.95644187927246, "global_step": 291902, "epoch": 3516} {"train_loss": -25.697925567626953, "global_step": 291903, "epoch": 3516} {"train_loss": -26.006534576416016, "global_step": 291904, "epoch": 3516} {"train_loss": -25.782617568969727, "global_step": 291905, "epoch": 3516} {"train_loss": -25.59930992126465, "global_step": 291906, "epoch": 3516} {"train_loss": -25.495946884155273, "global_step": 291907, "epoch": 3516} {"train_loss": -25.360885620117188, "global_step": 291908, "epoch": 3516} {"train_loss": -24.58588981628418, "global_step": 291909, "epoch": 3516} {"train_loss": -25.43274396873382, "global_step": 291910, "epoch": 3516, "val_loss": 7255582.0} {"train_loss": -23.2209529876709, "global_step": 291911, "epoch": 3517} {"train_loss": -24.496267318725586, "global_step": 291912, "epoch": 3517} {"train_loss": -23.163219451904297, "global_step": 291913, "epoch": 3517} {"train_loss": -24.343984603881836, "global_step": 291914, "epoch": 3517} {"train_loss": -23.320932388305664, "global_step": 291915, "epoch": 3517} {"train_loss": -24.08963394165039, "global_step": 291916, "epoch": 3517} {"train_loss": -24.84206199645996, "global_step": 291917, "epoch": 3517} {"train_loss": -24.811635971069336, "global_step": 291918, "epoch": 3517} {"train_loss": -24.668088912963867, "global_step": 291919, "epoch": 3517} {"train_loss": -24.363683700561523, "global_step": 291920, "epoch": 3517} {"train_loss": -25.021774291992188, "global_step": 291921, "epoch": 3517} {"train_loss": -25.09278678894043, "global_step": 291922, "epoch": 3517} {"train_loss": -24.522066116333008, "global_step": 291923, "epoch": 3517} {"train_loss": -24.852813720703125, "global_step": 291924, "epoch": 3517} {"train_loss": -24.424924850463867, "global_step": 291925, "epoch": 3517} {"train_loss": -25.28067398071289, "global_step": 291926, "epoch": 3517} {"train_loss": -24.966053009033203, "global_step": 291927, "epoch": 3517} {"train_loss": -25.2041072845459, "global_step": 291928, "epoch": 3517} {"train_loss": -24.92397117614746, "global_step": 291929, "epoch": 3517} {"train_loss": -25.142837524414062, "global_step": 291930, "epoch": 3517} {"train_loss": -24.938854217529297, "global_step": 291931, "epoch": 3517} {"train_loss": -25.259536743164062, "global_step": 291932, "epoch": 3517} {"train_loss": -25.065509796142578, "global_step": 291933, "epoch": 3517} {"train_loss": -25.188278198242188, "global_step": 291934, "epoch": 3517} {"train_loss": -25.348236083984375, "global_step": 291935, "epoch": 3517} {"train_loss": -25.331953048706055, "global_step": 291936, "epoch": 3517} {"train_loss": -25.346128463745117, "global_step": 291937, "epoch": 3517} {"train_loss": -25.269760131835938, "global_step": 291938, "epoch": 3517} {"train_loss": -25.24435806274414, "global_step": 291939, "epoch": 3517} {"train_loss": -25.591279983520508, "global_step": 291940, "epoch": 3517} {"train_loss": -25.63783073425293, "global_step": 291941, "epoch": 3517} {"train_loss": -25.39674186706543, "global_step": 291942, "epoch": 3517} {"train_loss": -25.4864559173584, "global_step": 291943, "epoch": 3517} {"train_loss": -25.221866607666016, "global_step": 291944, "epoch": 3517} {"train_loss": -25.570602416992188, "global_step": 291945, "epoch": 3517} {"train_loss": -25.626752853393555, "global_step": 291946, "epoch": 3517} {"train_loss": -25.445409774780273, "global_step": 291947, "epoch": 3517} {"train_loss": -25.595312118530273, "global_step": 291948, "epoch": 3517} {"train_loss": -25.50152587890625, "global_step": 291949, "epoch": 3517} {"train_loss": -25.431537628173828, "global_step": 291950, "epoch": 3517} {"train_loss": -25.390859603881836, "global_step": 291951, "epoch": 3517} {"train_loss": -25.664337158203125, "global_step": 291952, "epoch": 3517} {"train_loss": -25.45292854309082, "global_step": 291953, "epoch": 3517} {"train_loss": -25.63527488708496, "global_step": 291954, "epoch": 3517} {"train_loss": -25.148401260375977, "global_step": 291955, "epoch": 3517} {"train_loss": -25.55133628845215, "global_step": 291956, "epoch": 3517} {"train_loss": -25.5076847076416, "global_step": 291957, "epoch": 3517} {"train_loss": -25.68379020690918, "global_step": 291958, "epoch": 3517} {"train_loss": -25.148855209350586, "global_step": 291959, "epoch": 3517} {"train_loss": -25.291044235229492, "global_step": 291960, "epoch": 3517} {"train_loss": -25.284160614013672, "global_step": 291961, "epoch": 3517} {"train_loss": -25.458724975585938, "global_step": 291962, "epoch": 3517} {"train_loss": -25.482776641845703, "global_step": 291963, "epoch": 3517} {"train_loss": -25.440183639526367, "global_step": 291964, "epoch": 3517} {"train_loss": -25.9847412109375, "global_step": 291965, "epoch": 3517} {"train_loss": -25.319169998168945, "global_step": 291966, "epoch": 3517} {"train_loss": -25.155038833618164, "global_step": 291967, "epoch": 3517} {"train_loss": -25.413358688354492, "global_step": 291968, "epoch": 3517} {"train_loss": -25.435956954956055, "global_step": 291969, "epoch": 3517} {"train_loss": -25.722553253173828, "global_step": 291970, "epoch": 3517} {"train_loss": -25.22772789001465, "global_step": 291971, "epoch": 3517} {"train_loss": -25.580322265625, "global_step": 291972, "epoch": 3517} {"train_loss": -25.679916381835938, "global_step": 291973, "epoch": 3517} {"train_loss": -25.396467208862305, "global_step": 291974, "epoch": 3517} {"train_loss": -25.602664947509766, "global_step": 291975, "epoch": 3517} {"train_loss": -25.821090698242188, "global_step": 291976, "epoch": 3517} {"train_loss": -25.71722412109375, "global_step": 291977, "epoch": 3517} {"train_loss": -25.233125686645508, "global_step": 291978, "epoch": 3517} {"train_loss": -25.7017765045166, "global_step": 291979, "epoch": 3517} {"train_loss": -25.3976993560791, "global_step": 291980, "epoch": 3517} {"train_loss": -25.938983917236328, "global_step": 291981, "epoch": 3517} {"train_loss": -25.560726165771484, "global_step": 291982, "epoch": 3517} {"train_loss": -25.647764205932617, "global_step": 291983, "epoch": 3517} {"train_loss": -25.64422607421875, "global_step": 291984, "epoch": 3517} {"train_loss": -25.74554443359375, "global_step": 291985, "epoch": 3517} {"train_loss": -25.695056915283203, "global_step": 291986, "epoch": 3517} {"train_loss": -25.610509872436523, "global_step": 291987, "epoch": 3517} {"train_loss": -25.57537269592285, "global_step": 291988, "epoch": 3517} {"train_loss": -25.942983627319336, "global_step": 291989, "epoch": 3517} {"train_loss": -25.65146827697754, "global_step": 291990, "epoch": 3517} {"train_loss": -25.86341667175293, "global_step": 291991, "epoch": 3517} {"train_loss": -25.6181697845459, "global_step": 291992, "epoch": 3517} {"train_loss": -25.246255943574102, "global_step": 291993, "epoch": 3517, "val_loss": 7121015.0} {"train_loss": -24.914764404296875, "global_step": 291994, "epoch": 3518} {"train_loss": -24.932693481445312, "global_step": 291995, "epoch": 3518} {"train_loss": -25.07419776916504, "global_step": 291996, "epoch": 3518} {"train_loss": -24.339567184448242, "global_step": 291997, "epoch": 3518} {"train_loss": -25.33075523376465, "global_step": 291998, "epoch": 3518} {"train_loss": -24.808568954467773, "global_step": 291999, "epoch": 3518} {"train_loss": -25.186147689819336, "global_step": 292000, "epoch": 3518} {"train_loss": -24.959190368652344, "global_step": 292001, "epoch": 3518} {"train_loss": -25.363609313964844, "global_step": 292002, "epoch": 3518} {"train_loss": -25.164457321166992, "global_step": 292003, "epoch": 3518} {"train_loss": -25.173250198364258, "global_step": 292004, "epoch": 3518} {"train_loss": -25.174909591674805, "global_step": 292005, "epoch": 3518} {"train_loss": -24.985681533813477, "global_step": 292006, "epoch": 3518} {"train_loss": -25.372180938720703, "global_step": 292007, "epoch": 3518} {"train_loss": -25.46558952331543, "global_step": 292008, "epoch": 3518} {"train_loss": -25.220827102661133, "global_step": 292009, "epoch": 3518} {"train_loss": -25.420385360717773, "global_step": 292010, "epoch": 3518} {"train_loss": -25.530967712402344, "global_step": 292011, "epoch": 3518} {"train_loss": -25.604887008666992, "global_step": 292012, "epoch": 3518} {"train_loss": -25.171358108520508, "global_step": 292013, "epoch": 3518} {"train_loss": -25.428375244140625, "global_step": 292014, "epoch": 3518} {"train_loss": -24.795141220092773, "global_step": 292015, "epoch": 3518} {"train_loss": -25.390953063964844, "global_step": 292016, "epoch": 3518} {"train_loss": -25.401540756225586, "global_step": 292017, "epoch": 3518} {"train_loss": -25.456228256225586, "global_step": 292018, "epoch": 3518} {"train_loss": -25.48477554321289, "global_step": 292019, "epoch": 3518} {"train_loss": -25.527761459350586, "global_step": 292020, "epoch": 3518} {"train_loss": -25.485517501831055, "global_step": 292021, "epoch": 3518} {"train_loss": -25.732275009155273, "global_step": 292022, "epoch": 3518} {"train_loss": -25.225061416625977, "global_step": 292023, "epoch": 3518} {"train_loss": -25.876880645751953, "global_step": 292024, "epoch": 3518} {"train_loss": -25.681659698486328, "global_step": 292025, "epoch": 3518} {"train_loss": -25.33432388305664, "global_step": 292026, "epoch": 3518} {"train_loss": -25.738874435424805, "global_step": 292027, "epoch": 3518} {"train_loss": -25.46978187561035, "global_step": 292028, "epoch": 3518} {"train_loss": -25.580875396728516, "global_step": 292029, "epoch": 3518} {"train_loss": -25.370529174804688, "global_step": 292030, "epoch": 3518} {"train_loss": -25.571455001831055, "global_step": 292031, "epoch": 3518} {"train_loss": -25.702009201049805, "global_step": 292032, "epoch": 3518} {"train_loss": -25.426816940307617, "global_step": 292033, "epoch": 3518} {"train_loss": -25.527170181274414, "global_step": 292034, "epoch": 3518} {"train_loss": -25.71632194519043, "global_step": 292035, "epoch": 3518} {"train_loss": -25.621824264526367, "global_step": 292036, "epoch": 3518} {"train_loss": -25.5908260345459, "global_step": 292037, "epoch": 3518} {"train_loss": -25.702777862548828, "global_step": 292038, "epoch": 3518} {"train_loss": -25.669904708862305, "global_step": 292039, "epoch": 3518} {"train_loss": -25.47995376586914, "global_step": 292040, "epoch": 3518} {"train_loss": -26.0729923248291, "global_step": 292041, "epoch": 3518} {"train_loss": -25.55742645263672, "global_step": 292042, "epoch": 3518} {"train_loss": -25.522689819335938, "global_step": 292043, "epoch": 3518} {"train_loss": -25.480329513549805, "global_step": 292044, "epoch": 3518} {"train_loss": -25.686676025390625, "global_step": 292045, "epoch": 3518} {"train_loss": -25.55902099609375, "global_step": 292046, "epoch": 3518} {"train_loss": -25.303918838500977, "global_step": 292047, "epoch": 3518} {"train_loss": -25.306509017944336, "global_step": 292048, "epoch": 3518} {"train_loss": -25.297515869140625, "global_step": 292049, "epoch": 3518} {"train_loss": -25.75958824157715, "global_step": 292050, "epoch": 3518} {"train_loss": -25.351316452026367, "global_step": 292051, "epoch": 3518} {"train_loss": -25.621191024780273, "global_step": 292052, "epoch": 3518} {"train_loss": -25.431150436401367, "global_step": 292053, "epoch": 3518} {"train_loss": -25.029247283935547, "global_step": 292054, "epoch": 3518} {"train_loss": -24.663358688354492, "global_step": 292055, "epoch": 3518} {"train_loss": -24.171905517578125, "global_step": 292056, "epoch": 3518} {"train_loss": -24.673099517822266, "global_step": 292057, "epoch": 3518} {"train_loss": -25.73708152770996, "global_step": 292058, "epoch": 3518} {"train_loss": -25.023027420043945, "global_step": 292059, "epoch": 3518} {"train_loss": -25.06254768371582, "global_step": 292060, "epoch": 3518} {"train_loss": -25.262975692749023, "global_step": 292061, "epoch": 3518} {"train_loss": -25.241186141967773, "global_step": 292062, "epoch": 3518} {"train_loss": -25.114669799804688, "global_step": 292063, "epoch": 3518} {"train_loss": -25.584577560424805, "global_step": 292064, "epoch": 3518} {"train_loss": -25.430866241455078, "global_step": 292065, "epoch": 3518} {"train_loss": -25.7579345703125, "global_step": 292066, "epoch": 3518} {"train_loss": -25.412687301635742, "global_step": 292067, "epoch": 3518} {"train_loss": -25.418317794799805, "global_step": 292068, "epoch": 3518} {"train_loss": -25.289037704467773, "global_step": 292069, "epoch": 3518} {"train_loss": -25.42188262939453, "global_step": 292070, "epoch": 3518} {"train_loss": -25.764923095703125, "global_step": 292071, "epoch": 3518} {"train_loss": -25.122037887573242, "global_step": 292072, "epoch": 3518} {"train_loss": -25.712072372436523, "global_step": 292073, "epoch": 3518} {"train_loss": -25.35530662536621, "global_step": 292074, "epoch": 3518} {"train_loss": -25.274276733398438, "global_step": 292075, "epoch": 3518} {"train_loss": -25.371243856039392, "global_step": 292076, "epoch": 3518, "val_loss": 7220769.0} {"train_loss": -24.661041259765625, "global_step": 292077, "epoch": 3519} {"train_loss": -25.00798988342285, "global_step": 292078, "epoch": 3519} {"train_loss": -25.16474723815918, "global_step": 292079, "epoch": 3519} {"train_loss": -24.83418846130371, "global_step": 292080, "epoch": 3519} {"train_loss": -25.390403747558594, "global_step": 292081, "epoch": 3519} {"train_loss": -24.815261840820312, "global_step": 292082, "epoch": 3519} {"train_loss": -25.357702255249023, "global_step": 292083, "epoch": 3519} {"train_loss": -25.056549072265625, "global_step": 292084, "epoch": 3519} {"train_loss": -24.953344345092773, "global_step": 292085, "epoch": 3519} {"train_loss": -25.547361373901367, "global_step": 292086, "epoch": 3519} {"train_loss": -25.3558292388916, "global_step": 292087, "epoch": 3519} {"train_loss": -25.22924041748047, "global_step": 292088, "epoch": 3519} {"train_loss": -25.605621337890625, "global_step": 292089, "epoch": 3519} {"train_loss": -25.279998779296875, "global_step": 292090, "epoch": 3519} {"train_loss": -25.406822204589844, "global_step": 292091, "epoch": 3519} {"train_loss": -25.34791374206543, "global_step": 292092, "epoch": 3519} {"train_loss": -25.499893188476562, "global_step": 292093, "epoch": 3519} {"train_loss": -25.447357177734375, "global_step": 292094, "epoch": 3519} {"train_loss": -25.635583877563477, "global_step": 292095, "epoch": 3519} {"train_loss": -25.171995162963867, "global_step": 292096, "epoch": 3519} {"train_loss": -25.43848991394043, "global_step": 292097, "epoch": 3519} {"train_loss": -25.316913604736328, "global_step": 292098, "epoch": 3519} {"train_loss": -25.055883407592773, "global_step": 292099, "epoch": 3519} {"train_loss": -25.35922622680664, "global_step": 292100, "epoch": 3519} {"train_loss": -25.309614181518555, "global_step": 292101, "epoch": 3519} {"train_loss": -25.445270538330078, "global_step": 292102, "epoch": 3519} {"train_loss": -25.652210235595703, "global_step": 292103, "epoch": 3519} {"train_loss": -25.159032821655273, "global_step": 292104, "epoch": 3519} {"train_loss": -25.62000846862793, "global_step": 292105, "epoch": 3519} {"train_loss": -25.719806671142578, "global_step": 292106, "epoch": 3519} {"train_loss": -25.55072593688965, "global_step": 292107, "epoch": 3519} {"train_loss": -25.615070343017578, "global_step": 292108, "epoch": 3519} {"train_loss": -25.448654174804688, "global_step": 292109, "epoch": 3519} {"train_loss": -25.2632999420166, "global_step": 292110, "epoch": 3519} {"train_loss": -25.675445556640625, "global_step": 292111, "epoch": 3519} {"train_loss": -25.7054500579834, "global_step": 292112, "epoch": 3519} {"train_loss": -25.635528564453125, "global_step": 292113, "epoch": 3519} {"train_loss": -25.52621841430664, "global_step": 292114, "epoch": 3519} {"train_loss": -25.637638092041016, "global_step": 292115, "epoch": 3519} {"train_loss": -25.727405548095703, "global_step": 292116, "epoch": 3519} {"train_loss": -25.276992797851562, "global_step": 292117, "epoch": 3519} {"train_loss": -24.885068893432617, "global_step": 292118, "epoch": 3519} {"train_loss": -25.698434829711914, "global_step": 292119, "epoch": 3519} {"train_loss": -25.50242805480957, "global_step": 292120, "epoch": 3519} {"train_loss": -25.41023826599121, "global_step": 292121, "epoch": 3519} {"train_loss": -25.783884048461914, "global_step": 292122, "epoch": 3519} {"train_loss": -25.892990112304688, "global_step": 292123, "epoch": 3519} {"train_loss": -25.57971954345703, "global_step": 292124, "epoch": 3519} {"train_loss": -25.410724639892578, "global_step": 292125, "epoch": 3519} {"train_loss": -25.894123077392578, "global_step": 292126, "epoch": 3519} {"train_loss": -25.658554077148438, "global_step": 292127, "epoch": 3519} {"train_loss": -25.373403549194336, "global_step": 292128, "epoch": 3519} {"train_loss": -25.528348922729492, "global_step": 292129, "epoch": 3519} {"train_loss": -25.667043685913086, "global_step": 292130, "epoch": 3519} {"train_loss": -25.82242774963379, "global_step": 292131, "epoch": 3519} {"train_loss": -25.66574478149414, "global_step": 292132, "epoch": 3519} {"train_loss": -25.854583740234375, "global_step": 292133, "epoch": 3519} {"train_loss": -25.755142211914062, "global_step": 292134, "epoch": 3519} {"train_loss": -25.688520431518555, "global_step": 292135, "epoch": 3519} {"train_loss": -25.6903133392334, "global_step": 292136, "epoch": 3519} {"train_loss": -26.081445693969727, "global_step": 292137, "epoch": 3519} {"train_loss": -25.63673210144043, "global_step": 292138, "epoch": 3519} {"train_loss": -25.863677978515625, "global_step": 292139, "epoch": 3519} {"train_loss": -25.7268009185791, "global_step": 292140, "epoch": 3519} {"train_loss": -25.597747802734375, "global_step": 292141, "epoch": 3519} {"train_loss": -25.335590362548828, "global_step": 292142, "epoch": 3519} {"train_loss": -25.50714874267578, "global_step": 292143, "epoch": 3519} {"train_loss": -25.926416397094727, "global_step": 292144, "epoch": 3519} {"train_loss": -25.821996688842773, "global_step": 292145, "epoch": 3519} {"train_loss": -25.432180404663086, "global_step": 292146, "epoch": 3519} {"train_loss": -25.735565185546875, "global_step": 292147, "epoch": 3519} {"train_loss": -25.79743003845215, "global_step": 292148, "epoch": 3519} {"train_loss": -25.8836669921875, "global_step": 292149, "epoch": 3519} {"train_loss": -25.463911056518555, "global_step": 292150, "epoch": 3519} {"train_loss": -25.626693725585938, "global_step": 292151, "epoch": 3519} {"train_loss": -25.62660026550293, "global_step": 292152, "epoch": 3519} {"train_loss": -25.496824264526367, "global_step": 292153, "epoch": 3519} {"train_loss": -25.363021850585938, "global_step": 292154, "epoch": 3519} {"train_loss": -25.6215877532959, "global_step": 292155, "epoch": 3519} {"train_loss": -25.70391845703125, "global_step": 292156, "epoch": 3519} {"train_loss": -25.793365478515625, "global_step": 292157, "epoch": 3519} {"train_loss": -25.663888931274414, "global_step": 292158, "epoch": 3519} {"train_loss": -25.50747087777379, "global_step": 292159, "epoch": 3519, "val_loss": 7109828.5} {"train_loss": -25.21622085571289, "global_step": 292160, "epoch": 3520} {"train_loss": -24.53761863708496, "global_step": 292161, "epoch": 3520} {"train_loss": -24.888492584228516, "global_step": 292162, "epoch": 3520} {"train_loss": -24.73097801208496, "global_step": 292163, "epoch": 3520} {"train_loss": -24.728410720825195, "global_step": 292164, "epoch": 3520} {"train_loss": -25.044361114501953, "global_step": 292165, "epoch": 3520} {"train_loss": -25.260112762451172, "global_step": 292166, "epoch": 3520} {"train_loss": -25.29353141784668, "global_step": 292167, "epoch": 3520} {"train_loss": -25.102527618408203, "global_step": 292168, "epoch": 3520} {"train_loss": -24.945932388305664, "global_step": 292169, "epoch": 3520} {"train_loss": -24.97102928161621, "global_step": 292170, "epoch": 3520} {"train_loss": -24.80535125732422, "global_step": 292171, "epoch": 3520} {"train_loss": -25.74875259399414, "global_step": 292172, "epoch": 3520} {"train_loss": -24.90665054321289, "global_step": 292173, "epoch": 3520} {"train_loss": -25.445585250854492, "global_step": 292174, "epoch": 3520} {"train_loss": -24.973485946655273, "global_step": 292175, "epoch": 3520} {"train_loss": -25.43695640563965, "global_step": 292176, "epoch": 3520} {"train_loss": -25.399389266967773, "global_step": 292177, "epoch": 3520} {"train_loss": -25.58203125, "global_step": 292178, "epoch": 3520} {"train_loss": -25.285429000854492, "global_step": 292179, "epoch": 3520} {"train_loss": -25.54159927368164, "global_step": 292180, "epoch": 3520} {"train_loss": -25.819400787353516, "global_step": 292181, "epoch": 3520} {"train_loss": -25.61331558227539, "global_step": 292182, "epoch": 3520} {"train_loss": -25.241098403930664, "global_step": 292183, "epoch": 3520} {"train_loss": -25.329627990722656, "global_step": 292184, "epoch": 3520} {"train_loss": -25.494413375854492, "global_step": 292185, "epoch": 3520} {"train_loss": -25.7025146484375, "global_step": 292186, "epoch": 3520} {"train_loss": -25.2792911529541, "global_step": 292187, "epoch": 3520} {"train_loss": -25.486339569091797, "global_step": 292188, "epoch": 3520} {"train_loss": -25.618560791015625, "global_step": 292189, "epoch": 3520} {"train_loss": -25.897541046142578, "global_step": 292190, "epoch": 3520} {"train_loss": -25.540813446044922, "global_step": 292191, "epoch": 3520} {"train_loss": -25.770587921142578, "global_step": 292192, "epoch": 3520} {"train_loss": -25.639678955078125, "global_step": 292193, "epoch": 3520} {"train_loss": -26.002180099487305, "global_step": 292194, "epoch": 3520} {"train_loss": -25.637619018554688, "global_step": 292195, "epoch": 3520} {"train_loss": -25.558691024780273, "global_step": 292196, "epoch": 3520} {"train_loss": -25.454076766967773, "global_step": 292197, "epoch": 3520} {"train_loss": -25.3354549407959, "global_step": 292198, "epoch": 3520} {"train_loss": -25.661453247070312, "global_step": 292199, "epoch": 3520} {"train_loss": -25.749597549438477, "global_step": 292200, "epoch": 3520} {"train_loss": -25.92789649963379, "global_step": 292201, "epoch": 3520} {"train_loss": -25.68501091003418, "global_step": 292202, "epoch": 3520} {"train_loss": -25.835107803344727, "global_step": 292203, "epoch": 3520} {"train_loss": -25.3396053314209, "global_step": 292204, "epoch": 3520} {"train_loss": -25.74580192565918, "global_step": 292205, "epoch": 3520} {"train_loss": -25.80306053161621, "global_step": 292206, "epoch": 3520} {"train_loss": -25.344440460205078, "global_step": 292207, "epoch": 3520} {"train_loss": -25.587804794311523, "global_step": 292208, "epoch": 3520} {"train_loss": -25.388946533203125, "global_step": 292209, "epoch": 3520} {"train_loss": -25.67557716369629, "global_step": 292210, "epoch": 3520} {"train_loss": -25.57020378112793, "global_step": 292211, "epoch": 3520} {"train_loss": -25.627233505249023, "global_step": 292212, "epoch": 3520} {"train_loss": -25.70892333984375, "global_step": 292213, "epoch": 3520} {"train_loss": -25.267248153686523, "global_step": 292214, "epoch": 3520} {"train_loss": -25.524765014648438, "global_step": 292215, "epoch": 3520} {"train_loss": -25.89747428894043, "global_step": 292216, "epoch": 3520} {"train_loss": -25.59671401977539, "global_step": 292217, "epoch": 3520} {"train_loss": -25.37923240661621, "global_step": 292218, "epoch": 3520} {"train_loss": -25.717849731445312, "global_step": 292219, "epoch": 3520} {"train_loss": -25.446929931640625, "global_step": 292220, "epoch": 3520} {"train_loss": -25.24598503112793, "global_step": 292221, "epoch": 3520} {"train_loss": -25.447832107543945, "global_step": 292222, "epoch": 3520} {"train_loss": -25.738500595092773, "global_step": 292223, "epoch": 3520} {"train_loss": -25.073759078979492, "global_step": 292224, "epoch": 3520} {"train_loss": -25.376089096069336, "global_step": 292225, "epoch": 3520} {"train_loss": -25.40582847595215, "global_step": 292226, "epoch": 3520} {"train_loss": -25.603723526000977, "global_step": 292227, "epoch": 3520} {"train_loss": -25.334733963012695, "global_step": 292228, "epoch": 3520} {"train_loss": -25.199146270751953, "global_step": 292229, "epoch": 3520} {"train_loss": -25.762344360351562, "global_step": 292230, "epoch": 3520} {"train_loss": -25.402435302734375, "global_step": 292231, "epoch": 3520} {"train_loss": -25.340091705322266, "global_step": 292232, "epoch": 3520} {"train_loss": -25.397315979003906, "global_step": 292233, "epoch": 3520} {"train_loss": -25.119043350219727, "global_step": 292234, "epoch": 3520} {"train_loss": -25.60654640197754, "global_step": 292235, "epoch": 3520} {"train_loss": -25.47245216369629, "global_step": 292236, "epoch": 3520} {"train_loss": -25.28328514099121, "global_step": 292237, "epoch": 3520} {"train_loss": -25.23676872253418, "global_step": 292238, "epoch": 3520} {"train_loss": -25.56195640563965, "global_step": 292239, "epoch": 3520} {"train_loss": -25.21332550048828, "global_step": 292240, "epoch": 3520} {"train_loss": -25.25910186767578, "global_step": 292241, "epoch": 3520} {"train_loss": -25.434916714587843, "global_step": 292242, "epoch": 3520, "val_loss": 7151960.0} {"train_loss": -23.81821632385254, "global_step": 292243, "epoch": 3521} {"train_loss": -21.704181671142578, "global_step": 292244, "epoch": 3521} {"train_loss": -24.512056350708008, "global_step": 292245, "epoch": 3521} {"train_loss": -23.71793556213379, "global_step": 292246, "epoch": 3521} {"train_loss": -24.471893310546875, "global_step": 292247, "epoch": 3521} {"train_loss": -23.6290283203125, "global_step": 292248, "epoch": 3521} {"train_loss": -25.345922470092773, "global_step": 292249, "epoch": 3521} {"train_loss": -24.058317184448242, "global_step": 292250, "epoch": 3521} {"train_loss": -24.7005558013916, "global_step": 292251, "epoch": 3521} {"train_loss": -24.873859405517578, "global_step": 292252, "epoch": 3521} {"train_loss": -24.45535659790039, "global_step": 292253, "epoch": 3521} {"train_loss": -24.949949264526367, "global_step": 292254, "epoch": 3521} {"train_loss": -25.3252010345459, "global_step": 292255, "epoch": 3521} {"train_loss": -24.795656204223633, "global_step": 292256, "epoch": 3521} {"train_loss": -24.745235443115234, "global_step": 292257, "epoch": 3521} {"train_loss": -24.96293830871582, "global_step": 292258, "epoch": 3521} {"train_loss": -25.399084091186523, "global_step": 292259, "epoch": 3521} {"train_loss": -25.252973556518555, "global_step": 292260, "epoch": 3521} {"train_loss": -24.939332962036133, "global_step": 292261, "epoch": 3521} {"train_loss": -25.455917358398438, "global_step": 292262, "epoch": 3521} {"train_loss": -24.813329696655273, "global_step": 292263, "epoch": 3521} {"train_loss": -24.930397033691406, "global_step": 292264, "epoch": 3521} {"train_loss": -25.05617332458496, "global_step": 292265, "epoch": 3521} {"train_loss": -24.812030792236328, "global_step": 292266, "epoch": 3521} {"train_loss": -25.28817367553711, "global_step": 292267, "epoch": 3521} {"train_loss": -25.210712432861328, "global_step": 292268, "epoch": 3521} {"train_loss": -24.91423988342285, "global_step": 292269, "epoch": 3521} {"train_loss": -25.335037231445312, "global_step": 292270, "epoch": 3521} {"train_loss": -25.656232833862305, "global_step": 292271, "epoch": 3521} {"train_loss": -25.226070404052734, "global_step": 292272, "epoch": 3521} {"train_loss": -25.01641845703125, "global_step": 292273, "epoch": 3521} {"train_loss": -25.729312896728516, "global_step": 292274, "epoch": 3521} {"train_loss": -25.131269454956055, "global_step": 292275, "epoch": 3521} {"train_loss": -25.4443416595459, "global_step": 292276, "epoch": 3521} {"train_loss": -25.269819259643555, "global_step": 292277, "epoch": 3521} {"train_loss": -25.299711227416992, "global_step": 292278, "epoch": 3521} {"train_loss": -25.671255111694336, "global_step": 292279, "epoch": 3521} {"train_loss": -25.60721778869629, "global_step": 292280, "epoch": 3521} {"train_loss": -25.51163673400879, "global_step": 292281, "epoch": 3521} {"train_loss": -25.776525497436523, "global_step": 292282, "epoch": 3521} {"train_loss": -25.43623924255371, "global_step": 292283, "epoch": 3521} {"train_loss": -25.71455192565918, "global_step": 292284, "epoch": 3521} {"train_loss": -25.56826400756836, "global_step": 292285, "epoch": 3521} {"train_loss": -25.03468894958496, "global_step": 292286, "epoch": 3521} {"train_loss": -25.448339462280273, "global_step": 292287, "epoch": 3521} {"train_loss": -25.28955078125, "global_step": 292288, "epoch": 3521} {"train_loss": -25.83054542541504, "global_step": 292289, "epoch": 3521} {"train_loss": -25.754384994506836, "global_step": 292290, "epoch": 3521} {"train_loss": -25.38033103942871, "global_step": 292291, "epoch": 3521} {"train_loss": -25.323482513427734, "global_step": 292292, "epoch": 3521} {"train_loss": -25.232128143310547, "global_step": 292293, "epoch": 3521} {"train_loss": -25.477294921875, "global_step": 292294, "epoch": 3521} {"train_loss": -25.738073348999023, "global_step": 292295, "epoch": 3521} {"train_loss": -25.38627052307129, "global_step": 292296, "epoch": 3521} {"train_loss": -25.620121002197266, "global_step": 292297, "epoch": 3521} {"train_loss": -25.38531494140625, "global_step": 292298, "epoch": 3521} {"train_loss": -25.627912521362305, "global_step": 292299, "epoch": 3521} {"train_loss": -25.47418975830078, "global_step": 292300, "epoch": 3521} {"train_loss": -25.552356719970703, "global_step": 292301, "epoch": 3521} {"train_loss": -25.554540634155273, "global_step": 292302, "epoch": 3521} {"train_loss": -25.522125244140625, "global_step": 292303, "epoch": 3521} {"train_loss": -25.706390380859375, "global_step": 292304, "epoch": 3521} {"train_loss": -26.003772735595703, "global_step": 292305, "epoch": 3521} {"train_loss": -25.906158447265625, "global_step": 292306, "epoch": 3521} {"train_loss": -25.4815731048584, "global_step": 292307, "epoch": 3521} {"train_loss": -25.707304000854492, "global_step": 292308, "epoch": 3521} {"train_loss": -25.77949333190918, "global_step": 292309, "epoch": 3521} {"train_loss": -25.762714385986328, "global_step": 292310, "epoch": 3521} {"train_loss": -25.77783203125, "global_step": 292311, "epoch": 3521} {"train_loss": -25.616605758666992, "global_step": 292312, "epoch": 3521} {"train_loss": -25.773290634155273, "global_step": 292313, "epoch": 3521} {"train_loss": -25.938739776611328, "global_step": 292314, "epoch": 3521} {"train_loss": -25.779266357421875, "global_step": 292315, "epoch": 3521} {"train_loss": -25.837284088134766, "global_step": 292316, "epoch": 3521} {"train_loss": -25.768903732299805, "global_step": 292317, "epoch": 3521} {"train_loss": -25.71158218383789, "global_step": 292318, "epoch": 3521} {"train_loss": -25.909713745117188, "global_step": 292319, "epoch": 3521} {"train_loss": -25.792022705078125, "global_step": 292320, "epoch": 3521} {"train_loss": -25.842365264892578, "global_step": 292321, "epoch": 3521} {"train_loss": -25.844635009765625, "global_step": 292322, "epoch": 3521} {"train_loss": -25.60296630859375, "global_step": 292323, "epoch": 3521} {"train_loss": -25.402036666870117, "global_step": 292324, "epoch": 3521} {"train_loss": -25.286692975515344, "global_step": 292325, "epoch": 3521, "val_loss": 7050376.0} {"train_loss": -25.21491813659668, "global_step": 292326, "epoch": 3522} {"train_loss": -25.47818374633789, "global_step": 292327, "epoch": 3522} {"train_loss": -25.337268829345703, "global_step": 292328, "epoch": 3522} {"train_loss": -25.046918869018555, "global_step": 292329, "epoch": 3522} {"train_loss": -25.029464721679688, "global_step": 292330, "epoch": 3522} {"train_loss": -25.1591796875, "global_step": 292331, "epoch": 3522} {"train_loss": -25.25319480895996, "global_step": 292332, "epoch": 3522} {"train_loss": -24.916593551635742, "global_step": 292333, "epoch": 3522} {"train_loss": -25.437253952026367, "global_step": 292334, "epoch": 3522} {"train_loss": -25.239032745361328, "global_step": 292335, "epoch": 3522} {"train_loss": -25.381591796875, "global_step": 292336, "epoch": 3522} {"train_loss": -25.298364639282227, "global_step": 292337, "epoch": 3522} {"train_loss": -25.505590438842773, "global_step": 292338, "epoch": 3522} {"train_loss": -25.34189796447754, "global_step": 292339, "epoch": 3522} {"train_loss": -25.459232330322266, "global_step": 292340, "epoch": 3522} {"train_loss": -25.134305953979492, "global_step": 292341, "epoch": 3522} {"train_loss": -25.420806884765625, "global_step": 292342, "epoch": 3522} {"train_loss": -25.48420524597168, "global_step": 292343, "epoch": 3522} {"train_loss": -25.228824615478516, "global_step": 292344, "epoch": 3522} {"train_loss": -25.34656524658203, "global_step": 292345, "epoch": 3522} {"train_loss": -25.650251388549805, "global_step": 292346, "epoch": 3522} {"train_loss": -25.242084503173828, "global_step": 292347, "epoch": 3522} {"train_loss": -25.468502044677734, "global_step": 292348, "epoch": 3522} {"train_loss": -25.29007911682129, "global_step": 292349, "epoch": 3522} {"train_loss": -25.716567993164062, "global_step": 292350, "epoch": 3522} {"train_loss": -25.396652221679688, "global_step": 292351, "epoch": 3522} {"train_loss": -25.502119064331055, "global_step": 292352, "epoch": 3522} {"train_loss": -25.79510498046875, "global_step": 292353, "epoch": 3522} {"train_loss": -25.481903076171875, "global_step": 292354, "epoch": 3522} {"train_loss": -25.677549362182617, "global_step": 292355, "epoch": 3522} {"train_loss": -25.79183006286621, "global_step": 292356, "epoch": 3522} {"train_loss": -25.917041778564453, "global_step": 292357, "epoch": 3522} {"train_loss": -25.93779945373535, "global_step": 292358, "epoch": 3522} {"train_loss": -25.43953514099121, "global_step": 292359, "epoch": 3522} {"train_loss": -25.31941032409668, "global_step": 292360, "epoch": 3522} {"train_loss": -25.65618896484375, "global_step": 292361, "epoch": 3522} {"train_loss": -25.562116622924805, "global_step": 292362, "epoch": 3522} {"train_loss": -25.74781608581543, "global_step": 292363, "epoch": 3522} {"train_loss": -25.508089065551758, "global_step": 292364, "epoch": 3522} {"train_loss": -25.21756935119629, "global_step": 292365, "epoch": 3522} {"train_loss": -25.459346771240234, "global_step": 292366, "epoch": 3522} {"train_loss": -25.173269271850586, "global_step": 292367, "epoch": 3522} {"train_loss": -25.178319931030273, "global_step": 292368, "epoch": 3522} {"train_loss": -25.00836181640625, "global_step": 292369, "epoch": 3522} {"train_loss": -25.17703628540039, "global_step": 292370, "epoch": 3522} {"train_loss": -25.142841339111328, "global_step": 292371, "epoch": 3522} {"train_loss": -25.286663055419922, "global_step": 292372, "epoch": 3522} {"train_loss": -25.743789672851562, "global_step": 292373, "epoch": 3522} {"train_loss": -25.35927963256836, "global_step": 292374, "epoch": 3522} {"train_loss": -25.56954002380371, "global_step": 292375, "epoch": 3522} {"train_loss": -25.790607452392578, "global_step": 292376, "epoch": 3522} {"train_loss": -25.33809471130371, "global_step": 292377, "epoch": 3522} {"train_loss": -25.4877986907959, "global_step": 292378, "epoch": 3522} {"train_loss": -25.249114990234375, "global_step": 292379, "epoch": 3522} {"train_loss": -25.390823364257812, "global_step": 292380, "epoch": 3522} {"train_loss": -25.46687889099121, "global_step": 292381, "epoch": 3522} {"train_loss": -25.36260986328125, "global_step": 292382, "epoch": 3522} {"train_loss": -25.22627067565918, "global_step": 292383, "epoch": 3522} {"train_loss": -25.51061248779297, "global_step": 292384, "epoch": 3522} {"train_loss": -25.170026779174805, "global_step": 292385, "epoch": 3522} {"train_loss": -25.719818115234375, "global_step": 292386, "epoch": 3522} {"train_loss": -25.057605743408203, "global_step": 292387, "epoch": 3522} {"train_loss": -25.504722595214844, "global_step": 292388, "epoch": 3522} {"train_loss": -25.323266983032227, "global_step": 292389, "epoch": 3522} {"train_loss": -25.808988571166992, "global_step": 292390, "epoch": 3522} {"train_loss": -25.3262882232666, "global_step": 292391, "epoch": 3522} {"train_loss": -25.54237174987793, "global_step": 292392, "epoch": 3522} {"train_loss": -25.5681095123291, "global_step": 292393, "epoch": 3522} {"train_loss": -25.57549285888672, "global_step": 292394, "epoch": 3522} {"train_loss": -25.6961727142334, "global_step": 292395, "epoch": 3522} {"train_loss": -25.628774642944336, "global_step": 292396, "epoch": 3522} {"train_loss": -25.46237564086914, "global_step": 292397, "epoch": 3522} {"train_loss": -25.442106246948242, "global_step": 292398, "epoch": 3522} {"train_loss": -25.52461814880371, "global_step": 292399, "epoch": 3522} {"train_loss": -25.584793090820312, "global_step": 292400, "epoch": 3522} {"train_loss": -25.673669815063477, "global_step": 292401, "epoch": 3522} {"train_loss": -25.349348068237305, "global_step": 292402, "epoch": 3522} {"train_loss": -25.257904052734375, "global_step": 292403, "epoch": 3522} {"train_loss": -25.835296630859375, "global_step": 292404, "epoch": 3522} {"train_loss": -26.11775016784668, "global_step": 292405, "epoch": 3522} {"train_loss": -25.74888038635254, "global_step": 292406, "epoch": 3522} {"train_loss": -25.12106704711914, "global_step": 292407, "epoch": 3522} {"train_loss": -25.45720162449113, "global_step": 292408, "epoch": 3522, "val_loss": 6964187.0} {"train_loss": -25.202869415283203, "global_step": 292409, "epoch": 3523} {"train_loss": -24.72412109375, "global_step": 292410, "epoch": 3523} {"train_loss": -24.861051559448242, "global_step": 292411, "epoch": 3523} {"train_loss": -25.206815719604492, "global_step": 292412, "epoch": 3523} {"train_loss": -25.140417098999023, "global_step": 292413, "epoch": 3523} {"train_loss": -24.851150512695312, "global_step": 292414, "epoch": 3523} {"train_loss": -25.182905197143555, "global_step": 292415, "epoch": 3523} {"train_loss": -25.037029266357422, "global_step": 292416, "epoch": 3523} {"train_loss": -25.34724235534668, "global_step": 292417, "epoch": 3523} {"train_loss": -25.198606491088867, "global_step": 292418, "epoch": 3523} {"train_loss": -25.362089157104492, "global_step": 292419, "epoch": 3523} {"train_loss": -25.226232528686523, "global_step": 292420, "epoch": 3523} {"train_loss": -25.422903060913086, "global_step": 292421, "epoch": 3523} {"train_loss": -25.437103271484375, "global_step": 292422, "epoch": 3523} {"train_loss": -24.829130172729492, "global_step": 292423, "epoch": 3523} {"train_loss": -25.44851303100586, "global_step": 292424, "epoch": 3523} {"train_loss": -25.503686904907227, "global_step": 292425, "epoch": 3523} {"train_loss": -25.586708068847656, "global_step": 292426, "epoch": 3523} {"train_loss": -25.38068962097168, "global_step": 292427, "epoch": 3523} {"train_loss": -25.421375274658203, "global_step": 292428, "epoch": 3523} {"train_loss": -25.59786033630371, "global_step": 292429, "epoch": 3523} {"train_loss": -25.6624755859375, "global_step": 292430, "epoch": 3523} {"train_loss": -25.814573287963867, "global_step": 292431, "epoch": 3523} {"train_loss": -25.43734359741211, "global_step": 292432, "epoch": 3523} {"train_loss": -25.64491081237793, "global_step": 292433, "epoch": 3523} {"train_loss": -25.674619674682617, "global_step": 292434, "epoch": 3523} {"train_loss": -25.691913604736328, "global_step": 292435, "epoch": 3523} {"train_loss": -25.821149826049805, "global_step": 292436, "epoch": 3523} {"train_loss": -25.377195358276367, "global_step": 292437, "epoch": 3523} {"train_loss": -25.907011032104492, "global_step": 292438, "epoch": 3523} {"train_loss": -25.61749839782715, "global_step": 292439, "epoch": 3523} {"train_loss": -26.0275936126709, "global_step": 292440, "epoch": 3523} {"train_loss": -25.68155860900879, "global_step": 292441, "epoch": 3523} {"train_loss": -25.828580856323242, "global_step": 292442, "epoch": 3523} {"train_loss": -25.43265151977539, "global_step": 292443, "epoch": 3523} {"train_loss": -25.503400802612305, "global_step": 292444, "epoch": 3523} {"train_loss": -25.870758056640625, "global_step": 292445, "epoch": 3523} {"train_loss": -25.720975875854492, "global_step": 292446, "epoch": 3523} {"train_loss": -25.365909576416016, "global_step": 292447, "epoch": 3523} {"train_loss": -25.85378074645996, "global_step": 292448, "epoch": 3523} {"train_loss": -26.064376831054688, "global_step": 292449, "epoch": 3523} {"train_loss": -25.6300106048584, "global_step": 292450, "epoch": 3523} {"train_loss": -25.7231502532959, "global_step": 292451, "epoch": 3523} {"train_loss": -25.724884033203125, "global_step": 292452, "epoch": 3523} {"train_loss": -25.175785064697266, "global_step": 292453, "epoch": 3523} {"train_loss": -25.46445083618164, "global_step": 292454, "epoch": 3523} {"train_loss": -25.717544555664062, "global_step": 292455, "epoch": 3523} {"train_loss": -24.93669891357422, "global_step": 292456, "epoch": 3523} {"train_loss": -24.978429794311523, "global_step": 292457, "epoch": 3523} {"train_loss": -25.476425170898438, "global_step": 292458, "epoch": 3523} {"train_loss": -25.288288116455078, "global_step": 292459, "epoch": 3523} {"train_loss": -25.411314010620117, "global_step": 292460, "epoch": 3523} {"train_loss": -25.442241668701172, "global_step": 292461, "epoch": 3523} {"train_loss": -24.7083797454834, "global_step": 292462, "epoch": 3523} {"train_loss": -25.262632369995117, "global_step": 292463, "epoch": 3523} {"train_loss": -24.91324806213379, "global_step": 292464, "epoch": 3523} {"train_loss": -25.28431510925293, "global_step": 292465, "epoch": 3523} {"train_loss": -25.0358829498291, "global_step": 292466, "epoch": 3523} {"train_loss": -25.160554885864258, "global_step": 292467, "epoch": 3523} {"train_loss": -25.649005889892578, "global_step": 292468, "epoch": 3523} {"train_loss": -24.717201232910156, "global_step": 292469, "epoch": 3523} {"train_loss": -25.089590072631836, "global_step": 292470, "epoch": 3523} {"train_loss": -25.246536254882812, "global_step": 292471, "epoch": 3523} {"train_loss": -25.241058349609375, "global_step": 292472, "epoch": 3523} {"train_loss": -25.211029052734375, "global_step": 292473, "epoch": 3523} {"train_loss": -25.6409912109375, "global_step": 292474, "epoch": 3523} {"train_loss": -25.59900665283203, "global_step": 292475, "epoch": 3523} {"train_loss": -25.394840240478516, "global_step": 292476, "epoch": 3523} {"train_loss": -25.028554916381836, "global_step": 292477, "epoch": 3523} {"train_loss": -25.681655883789062, "global_step": 292478, "epoch": 3523} {"train_loss": -25.454303741455078, "global_step": 292479, "epoch": 3523} {"train_loss": -25.2484130859375, "global_step": 292480, "epoch": 3523} {"train_loss": -25.601346969604492, "global_step": 292481, "epoch": 3523} {"train_loss": -25.603729248046875, "global_step": 292482, "epoch": 3523} {"train_loss": -25.04498863220215, "global_step": 292483, "epoch": 3523} {"train_loss": -25.7280216217041, "global_step": 292484, "epoch": 3523} {"train_loss": -25.7578067779541, "global_step": 292485, "epoch": 3523} {"train_loss": -25.761579513549805, "global_step": 292486, "epoch": 3523} {"train_loss": -25.634977340698242, "global_step": 292487, "epoch": 3523} {"train_loss": -25.798934936523438, "global_step": 292488, "epoch": 3523} {"train_loss": -25.36708641052246, "global_step": 292489, "epoch": 3523} {"train_loss": -25.873037338256836, "global_step": 292490, "epoch": 3523} {"train_loss": -25.434212719101502, "global_step": 292491, "epoch": 3523, "val_loss": 7129325.5} {"train_loss": -25.306917190551758, "global_step": 292492, "epoch": 3524} {"train_loss": -25.332258224487305, "global_step": 292493, "epoch": 3524} {"train_loss": -25.38672637939453, "global_step": 292494, "epoch": 3524} {"train_loss": -25.41259002685547, "global_step": 292495, "epoch": 3524} {"train_loss": -25.065357208251953, "global_step": 292496, "epoch": 3524} {"train_loss": -25.25091552734375, "global_step": 292497, "epoch": 3524} {"train_loss": -25.583166122436523, "global_step": 292498, "epoch": 3524} {"train_loss": -25.296327590942383, "global_step": 292499, "epoch": 3524} {"train_loss": -25.649450302124023, "global_step": 292500, "epoch": 3524} {"train_loss": -25.589475631713867, "global_step": 292501, "epoch": 3524} {"train_loss": -25.820219039916992, "global_step": 292502, "epoch": 3524} {"train_loss": -25.278579711914062, "global_step": 292503, "epoch": 3524} {"train_loss": -25.635223388671875, "global_step": 292504, "epoch": 3524} {"train_loss": -25.5775203704834, "global_step": 292505, "epoch": 3524} {"train_loss": -25.355026245117188, "global_step": 292506, "epoch": 3524} {"train_loss": -25.8335018157959, "global_step": 292507, "epoch": 3524} {"train_loss": -25.518783569335938, "global_step": 292508, "epoch": 3524} {"train_loss": -25.1700496673584, "global_step": 292509, "epoch": 3524} {"train_loss": -25.523609161376953, "global_step": 292510, "epoch": 3524} {"train_loss": -25.835107803344727, "global_step": 292511, "epoch": 3524} {"train_loss": -25.351499557495117, "global_step": 292512, "epoch": 3524} {"train_loss": -25.392038345336914, "global_step": 292513, "epoch": 3524} {"train_loss": -25.384347915649414, "global_step": 292514, "epoch": 3524} {"train_loss": -25.722610473632812, "global_step": 292515, "epoch": 3524} {"train_loss": -25.407352447509766, "global_step": 292516, "epoch": 3524} {"train_loss": -25.65628433227539, "global_step": 292517, "epoch": 3524} {"train_loss": -25.654443740844727, "global_step": 292518, "epoch": 3524} {"train_loss": -25.790027618408203, "global_step": 292519, "epoch": 3524} {"train_loss": -25.80620765686035, "global_step": 292520, "epoch": 3524} {"train_loss": -25.574125289916992, "global_step": 292521, "epoch": 3524} {"train_loss": -25.42962074279785, "global_step": 292522, "epoch": 3524} {"train_loss": -25.58955955505371, "global_step": 292523, "epoch": 3524} {"train_loss": -25.899763107299805, "global_step": 292524, "epoch": 3524} {"train_loss": -25.679046630859375, "global_step": 292525, "epoch": 3524} {"train_loss": -25.920469284057617, "global_step": 292526, "epoch": 3524} {"train_loss": -25.601194381713867, "global_step": 292527, "epoch": 3524} {"train_loss": -25.87615394592285, "global_step": 292528, "epoch": 3524} {"train_loss": -25.379438400268555, "global_step": 292529, "epoch": 3524} {"train_loss": -25.751508712768555, "global_step": 292530, "epoch": 3524} {"train_loss": -25.62977409362793, "global_step": 292531, "epoch": 3524} {"train_loss": -25.627012252807617, "global_step": 292532, "epoch": 3524} {"train_loss": -25.71536636352539, "global_step": 292533, "epoch": 3524} {"train_loss": -25.800012588500977, "global_step": 292534, "epoch": 3524} {"train_loss": -25.622129440307617, "global_step": 292535, "epoch": 3524} {"train_loss": -25.751935958862305, "global_step": 292536, "epoch": 3524} {"train_loss": -25.606576919555664, "global_step": 292537, "epoch": 3524} {"train_loss": -25.66943359375, "global_step": 292538, "epoch": 3524} {"train_loss": -25.54630470275879, "global_step": 292539, "epoch": 3524} {"train_loss": -25.53264045715332, "global_step": 292540, "epoch": 3524} {"train_loss": -25.42410659790039, "global_step": 292541, "epoch": 3524} {"train_loss": -25.620798110961914, "global_step": 292542, "epoch": 3524} {"train_loss": -25.697641372680664, "global_step": 292543, "epoch": 3524} {"train_loss": -25.347782135009766, "global_step": 292544, "epoch": 3524} {"train_loss": -25.504379272460938, "global_step": 292545, "epoch": 3524} {"train_loss": -25.165800094604492, "global_step": 292546, "epoch": 3524} {"train_loss": -25.304141998291016, "global_step": 292547, "epoch": 3524} {"train_loss": -25.080886840820312, "global_step": 292548, "epoch": 3524} {"train_loss": -25.126169204711914, "global_step": 292549, "epoch": 3524} {"train_loss": -25.72320556640625, "global_step": 292550, "epoch": 3524} {"train_loss": -25.18442726135254, "global_step": 292551, "epoch": 3524} {"train_loss": -25.296592712402344, "global_step": 292552, "epoch": 3524} {"train_loss": -25.22528648376465, "global_step": 292553, "epoch": 3524} {"train_loss": -25.300168991088867, "global_step": 292554, "epoch": 3524} {"train_loss": -25.679563522338867, "global_step": 292555, "epoch": 3524} {"train_loss": -25.45794105529785, "global_step": 292556, "epoch": 3524} {"train_loss": -25.70452880859375, "global_step": 292557, "epoch": 3524} {"train_loss": -25.395793914794922, "global_step": 292558, "epoch": 3524} {"train_loss": -25.35805320739746, "global_step": 292559, "epoch": 3524} {"train_loss": -25.68866539001465, "global_step": 292560, "epoch": 3524} {"train_loss": -25.528669357299805, "global_step": 292561, "epoch": 3524} {"train_loss": -25.439908981323242, "global_step": 292562, "epoch": 3524} {"train_loss": -25.904722213745117, "global_step": 292563, "epoch": 3524} {"train_loss": -25.490644454956055, "global_step": 292564, "epoch": 3524} {"train_loss": -25.434080123901367, "global_step": 292565, "epoch": 3524} {"train_loss": -25.69642448425293, "global_step": 292566, "epoch": 3524} {"train_loss": -25.58559226989746, "global_step": 292567, "epoch": 3524} {"train_loss": -25.902292251586914, "global_step": 292568, "epoch": 3524} {"train_loss": -25.496362686157227, "global_step": 292569, "epoch": 3524} {"train_loss": -25.34573745727539, "global_step": 292570, "epoch": 3524} {"train_loss": -25.370115280151367, "global_step": 292571, "epoch": 3524} {"train_loss": -25.71587562561035, "global_step": 292572, "epoch": 3524} {"train_loss": -25.804052352905273, "global_step": 292573, "epoch": 3524} {"train_loss": -25.531862511692278, "global_step": 292574, "epoch": 3524, "val_loss": 7052011.0} {"train_loss": -24.38100242614746, "global_step": 292575, "epoch": 3525} {"train_loss": -24.112640380859375, "global_step": 292576, "epoch": 3525} {"train_loss": -23.991613388061523, "global_step": 292577, "epoch": 3525} {"train_loss": -24.799123764038086, "global_step": 292578, "epoch": 3525} {"train_loss": -24.9826602935791, "global_step": 292579, "epoch": 3525} {"train_loss": -24.90155601501465, "global_step": 292580, "epoch": 3525} {"train_loss": -24.46319007873535, "global_step": 292581, "epoch": 3525} {"train_loss": -24.377119064331055, "global_step": 292582, "epoch": 3525} {"train_loss": -24.761676788330078, "global_step": 292583, "epoch": 3525} {"train_loss": -24.934776306152344, "global_step": 292584, "epoch": 3525} {"train_loss": -24.951574325561523, "global_step": 292585, "epoch": 3525} {"train_loss": -24.96278953552246, "global_step": 292586, "epoch": 3525} {"train_loss": -24.93720245361328, "global_step": 292587, "epoch": 3525} {"train_loss": -24.984983444213867, "global_step": 292588, "epoch": 3525} {"train_loss": -24.86171531677246, "global_step": 292589, "epoch": 3525} {"train_loss": -25.4202938079834, "global_step": 292590, "epoch": 3525} {"train_loss": -25.09974479675293, "global_step": 292591, "epoch": 3525} {"train_loss": -25.0960693359375, "global_step": 292592, "epoch": 3525} {"train_loss": -25.52060317993164, "global_step": 292593, "epoch": 3525} {"train_loss": -25.202085494995117, "global_step": 292594, "epoch": 3525} {"train_loss": -25.619482040405273, "global_step": 292595, "epoch": 3525} {"train_loss": -25.269224166870117, "global_step": 292596, "epoch": 3525} {"train_loss": -25.05106544494629, "global_step": 292597, "epoch": 3525} {"train_loss": -25.106155395507812, "global_step": 292598, "epoch": 3525} {"train_loss": -25.374134063720703, "global_step": 292599, "epoch": 3525} {"train_loss": -25.103803634643555, "global_step": 292600, "epoch": 3525} {"train_loss": -25.29176139831543, "global_step": 292601, "epoch": 3525} {"train_loss": -25.171955108642578, "global_step": 292602, "epoch": 3525} {"train_loss": -25.262327194213867, "global_step": 292603, "epoch": 3525} {"train_loss": -24.919692993164062, "global_step": 292604, "epoch": 3525} {"train_loss": -25.134841918945312, "global_step": 292605, "epoch": 3525} {"train_loss": -25.274656295776367, "global_step": 292606, "epoch": 3525} {"train_loss": -25.5694522857666, "global_step": 292607, "epoch": 3525} {"train_loss": -25.636199951171875, "global_step": 292608, "epoch": 3525} {"train_loss": -25.60028076171875, "global_step": 292609, "epoch": 3525} {"train_loss": -25.301136016845703, "global_step": 292610, "epoch": 3525} {"train_loss": -25.264631271362305, "global_step": 292611, "epoch": 3525} {"train_loss": -25.121253967285156, "global_step": 292612, "epoch": 3525} {"train_loss": -25.322711944580078, "global_step": 292613, "epoch": 3525} {"train_loss": -25.51542091369629, "global_step": 292614, "epoch": 3525} {"train_loss": -25.457426071166992, "global_step": 292615, "epoch": 3525} {"train_loss": -25.62385368347168, "global_step": 292616, "epoch": 3525} {"train_loss": -25.745691299438477, "global_step": 292617, "epoch": 3525} {"train_loss": -25.8463077545166, "global_step": 292618, "epoch": 3525} {"train_loss": -25.303476333618164, "global_step": 292619, "epoch": 3525} {"train_loss": -25.81959342956543, "global_step": 292620, "epoch": 3525} {"train_loss": -25.696258544921875, "global_step": 292621, "epoch": 3525} {"train_loss": -25.31537628173828, "global_step": 292622, "epoch": 3525} {"train_loss": -25.7885684967041, "global_step": 292623, "epoch": 3525} {"train_loss": -25.916980743408203, "global_step": 292624, "epoch": 3525} {"train_loss": -25.717609405517578, "global_step": 292625, "epoch": 3525} {"train_loss": -25.64923095703125, "global_step": 292626, "epoch": 3525} {"train_loss": -26.210607528686523, "global_step": 292627, "epoch": 3525} {"train_loss": -25.701993942260742, "global_step": 292628, "epoch": 3525} {"train_loss": -25.557371139526367, "global_step": 292629, "epoch": 3525} {"train_loss": -25.94253921508789, "global_step": 292630, "epoch": 3525} {"train_loss": -25.941022872924805, "global_step": 292631, "epoch": 3525} {"train_loss": -25.856653213500977, "global_step": 292632, "epoch": 3525} {"train_loss": -25.756925582885742, "global_step": 292633, "epoch": 3525} {"train_loss": -25.442949295043945, "global_step": 292634, "epoch": 3525} {"train_loss": -25.671117782592773, "global_step": 292635, "epoch": 3525} {"train_loss": -25.39564323425293, "global_step": 292636, "epoch": 3525} {"train_loss": -25.635889053344727, "global_step": 292637, "epoch": 3525} {"train_loss": -25.774662017822266, "global_step": 292638, "epoch": 3525} {"train_loss": -25.8761043548584, "global_step": 292639, "epoch": 3525} {"train_loss": -25.918684005737305, "global_step": 292640, "epoch": 3525} {"train_loss": -25.563133239746094, "global_step": 292641, "epoch": 3525} {"train_loss": -25.089494705200195, "global_step": 292642, "epoch": 3525} {"train_loss": -25.269838333129883, "global_step": 292643, "epoch": 3525} {"train_loss": -25.47861099243164, "global_step": 292644, "epoch": 3525} {"train_loss": -25.631113052368164, "global_step": 292645, "epoch": 3525} {"train_loss": -24.962142944335938, "global_step": 292646, "epoch": 3525} {"train_loss": -24.678848266601562, "global_step": 292647, "epoch": 3525} {"train_loss": -25.518939971923828, "global_step": 292648, "epoch": 3525} {"train_loss": -25.244279861450195, "global_step": 292649, "epoch": 3525} {"train_loss": -25.600778579711914, "global_step": 292650, "epoch": 3525} {"train_loss": -25.119064331054688, "global_step": 292651, "epoch": 3525} {"train_loss": -25.28246307373047, "global_step": 292652, "epoch": 3525} {"train_loss": -25.590505599975586, "global_step": 292653, "epoch": 3525} {"train_loss": -24.917234420776367, "global_step": 292654, "epoch": 3525} {"train_loss": -25.301597595214844, "global_step": 292655, "epoch": 3525} {"train_loss": -25.597604751586914, "global_step": 292656, "epoch": 3525} {"train_loss": -25.311994093010224, "global_step": 292657, "epoch": 3525, "val_loss": 7110522.0} {"train_loss": -25.139554977416992, "global_step": 292658, "epoch": 3526} {"train_loss": -25.735620498657227, "global_step": 292659, "epoch": 3526} {"train_loss": -25.328495025634766, "global_step": 292660, "epoch": 3526} {"train_loss": -24.809255599975586, "global_step": 292661, "epoch": 3526} {"train_loss": -24.88104248046875, "global_step": 292662, "epoch": 3526} {"train_loss": -24.977943420410156, "global_step": 292663, "epoch": 3526} {"train_loss": -24.613523483276367, "global_step": 292664, "epoch": 3526} {"train_loss": -25.127771377563477, "global_step": 292665, "epoch": 3526} {"train_loss": -25.237180709838867, "global_step": 292666, "epoch": 3526} {"train_loss": -25.028289794921875, "global_step": 292667, "epoch": 3526} {"train_loss": -25.13405990600586, "global_step": 292668, "epoch": 3526} {"train_loss": -25.151819229125977, "global_step": 292669, "epoch": 3526} {"train_loss": -25.652450561523438, "global_step": 292670, "epoch": 3526} {"train_loss": -25.345556259155273, "global_step": 292671, "epoch": 3526} {"train_loss": -25.491971969604492, "global_step": 292672, "epoch": 3526} {"train_loss": -25.270959854125977, "global_step": 292673, "epoch": 3526} {"train_loss": -24.969928741455078, "global_step": 292674, "epoch": 3526} {"train_loss": -25.632156372070312, "global_step": 292675, "epoch": 3526} {"train_loss": -25.401487350463867, "global_step": 292676, "epoch": 3526} {"train_loss": -25.662107467651367, "global_step": 292677, "epoch": 3526} {"train_loss": -25.444414138793945, "global_step": 292678, "epoch": 3526} {"train_loss": -25.41693687438965, "global_step": 292679, "epoch": 3526} {"train_loss": -25.543325424194336, "global_step": 292680, "epoch": 3526} {"train_loss": -25.803852081298828, "global_step": 292681, "epoch": 3526} {"train_loss": -25.69291114807129, "global_step": 292682, "epoch": 3526} {"train_loss": -25.594966888427734, "global_step": 292683, "epoch": 3526} {"train_loss": -25.613391876220703, "global_step": 292684, "epoch": 3526} {"train_loss": -25.746509552001953, "global_step": 292685, "epoch": 3526} {"train_loss": -25.234634399414062, "global_step": 292686, "epoch": 3526} {"train_loss": -25.646713256835938, "global_step": 292687, "epoch": 3526} {"train_loss": -25.595190048217773, "global_step": 292688, "epoch": 3526} {"train_loss": -25.6342830657959, "global_step": 292689, "epoch": 3526} {"train_loss": -25.360288619995117, "global_step": 292690, "epoch": 3526} {"train_loss": -25.50499725341797, "global_step": 292691, "epoch": 3526} {"train_loss": -25.87176513671875, "global_step": 292692, "epoch": 3526} {"train_loss": -25.8837890625, "global_step": 292693, "epoch": 3526} {"train_loss": -25.858020782470703, "global_step": 292694, "epoch": 3526} {"train_loss": -25.41472816467285, "global_step": 292695, "epoch": 3526} {"train_loss": -25.448583602905273, "global_step": 292696, "epoch": 3526} {"train_loss": -25.515228271484375, "global_step": 292697, "epoch": 3526} {"train_loss": -25.7290096282959, "global_step": 292698, "epoch": 3526} {"train_loss": -25.504806518554688, "global_step": 292699, "epoch": 3526} {"train_loss": -25.609329223632812, "global_step": 292700, "epoch": 3526} {"train_loss": -25.631275177001953, "global_step": 292701, "epoch": 3526} {"train_loss": -25.45115089416504, "global_step": 292702, "epoch": 3526} {"train_loss": -25.417104721069336, "global_step": 292703, "epoch": 3526} {"train_loss": -25.07608413696289, "global_step": 292704, "epoch": 3526} {"train_loss": -25.49587059020996, "global_step": 292705, "epoch": 3526} {"train_loss": -25.686033248901367, "global_step": 292706, "epoch": 3526} {"train_loss": -25.6820068359375, "global_step": 292707, "epoch": 3526} {"train_loss": -25.48261260986328, "global_step": 292708, "epoch": 3526} {"train_loss": -25.879858016967773, "global_step": 292709, "epoch": 3526} {"train_loss": -25.735315322875977, "global_step": 292710, "epoch": 3526} {"train_loss": -25.717206954956055, "global_step": 292711, "epoch": 3526} {"train_loss": -25.649255752563477, "global_step": 292712, "epoch": 3526} {"train_loss": -25.218219757080078, "global_step": 292713, "epoch": 3526} {"train_loss": -25.428396224975586, "global_step": 292714, "epoch": 3526} {"train_loss": -25.809741973876953, "global_step": 292715, "epoch": 3526} {"train_loss": -25.750064849853516, "global_step": 292716, "epoch": 3526} {"train_loss": -25.327892303466797, "global_step": 292717, "epoch": 3526} {"train_loss": -25.438980102539062, "global_step": 292718, "epoch": 3526} {"train_loss": -25.24683952331543, "global_step": 292719, "epoch": 3526} {"train_loss": -25.870813369750977, "global_step": 292720, "epoch": 3526} {"train_loss": -25.631881713867188, "global_step": 292721, "epoch": 3526} {"train_loss": -25.561574935913086, "global_step": 292722, "epoch": 3526} {"train_loss": -25.79397964477539, "global_step": 292723, "epoch": 3526} {"train_loss": -25.452035903930664, "global_step": 292724, "epoch": 3526} {"train_loss": -25.527502059936523, "global_step": 292725, "epoch": 3526} {"train_loss": -25.311975479125977, "global_step": 292726, "epoch": 3526} {"train_loss": -25.724685668945312, "global_step": 292727, "epoch": 3526} {"train_loss": -25.403348922729492, "global_step": 292728, "epoch": 3526} {"train_loss": -25.507198333740234, "global_step": 292729, "epoch": 3526} {"train_loss": -25.82283592224121, "global_step": 292730, "epoch": 3526} {"train_loss": -25.476089477539062, "global_step": 292731, "epoch": 3526} {"train_loss": -25.925537109375, "global_step": 292732, "epoch": 3526} {"train_loss": -25.36656951904297, "global_step": 292733, "epoch": 3526} {"train_loss": -25.628339767456055, "global_step": 292734, "epoch": 3526} {"train_loss": -25.084949493408203, "global_step": 292735, "epoch": 3526} {"train_loss": -24.852787017822266, "global_step": 292736, "epoch": 3526} {"train_loss": -25.187255859375, "global_step": 292737, "epoch": 3526} {"train_loss": -25.437503814697266, "global_step": 292738, "epoch": 3526} {"train_loss": -25.113037109375, "global_step": 292739, "epoch": 3526} {"train_loss": -25.450953265270556, "global_step": 292740, "epoch": 3526, "val_loss": 7173059.0} {"train_loss": -25.0632381439209, "global_step": 292741, "epoch": 3527} {"train_loss": -24.599273681640625, "global_step": 292742, "epoch": 3527} {"train_loss": -24.873517990112305, "global_step": 292743, "epoch": 3527} {"train_loss": -24.495431900024414, "global_step": 292744, "epoch": 3527} {"train_loss": -24.389156341552734, "global_step": 292745, "epoch": 3527} {"train_loss": -24.99648094177246, "global_step": 292746, "epoch": 3527} {"train_loss": -25.134017944335938, "global_step": 292747, "epoch": 3527} {"train_loss": -25.016071319580078, "global_step": 292748, "epoch": 3527} {"train_loss": -24.763864517211914, "global_step": 292749, "epoch": 3527} {"train_loss": -25.05684471130371, "global_step": 292750, "epoch": 3527} {"train_loss": -24.994197845458984, "global_step": 292751, "epoch": 3527} {"train_loss": -25.370956420898438, "global_step": 292752, "epoch": 3527} {"train_loss": -25.395849227905273, "global_step": 292753, "epoch": 3527} {"train_loss": -24.88472557067871, "global_step": 292754, "epoch": 3527} {"train_loss": -25.14722442626953, "global_step": 292755, "epoch": 3527} {"train_loss": -25.238861083984375, "global_step": 292756, "epoch": 3527} {"train_loss": -25.395549774169922, "global_step": 292757, "epoch": 3527} {"train_loss": -24.924671173095703, "global_step": 292758, "epoch": 3527} {"train_loss": -24.987985610961914, "global_step": 292759, "epoch": 3527} {"train_loss": -25.06776237487793, "global_step": 292760, "epoch": 3527} {"train_loss": -25.639175415039062, "global_step": 292761, "epoch": 3527} {"train_loss": -25.28104591369629, "global_step": 292762, "epoch": 3527} {"train_loss": -25.072580337524414, "global_step": 292763, "epoch": 3527} {"train_loss": -25.333110809326172, "global_step": 292764, "epoch": 3527} {"train_loss": -25.297704696655273, "global_step": 292765, "epoch": 3527} {"train_loss": -25.355470657348633, "global_step": 292766, "epoch": 3527} {"train_loss": -25.695281982421875, "global_step": 292767, "epoch": 3527} {"train_loss": -25.288467407226562, "global_step": 292768, "epoch": 3527} {"train_loss": -25.47344398498535, "global_step": 292769, "epoch": 3527} {"train_loss": -25.118194580078125, "global_step": 292770, "epoch": 3527} {"train_loss": -25.700037002563477, "global_step": 292771, "epoch": 3527} {"train_loss": -25.403141021728516, "global_step": 292772, "epoch": 3527} {"train_loss": -25.7493896484375, "global_step": 292773, "epoch": 3527} {"train_loss": -25.038660049438477, "global_step": 292774, "epoch": 3527} {"train_loss": -25.336179733276367, "global_step": 292775, "epoch": 3527} {"train_loss": -25.687345504760742, "global_step": 292776, "epoch": 3527} {"train_loss": -25.274877548217773, "global_step": 292777, "epoch": 3527} {"train_loss": -25.616413116455078, "global_step": 292778, "epoch": 3527} {"train_loss": -25.906204223632812, "global_step": 292779, "epoch": 3527} {"train_loss": -25.69771385192871, "global_step": 292780, "epoch": 3527} {"train_loss": -25.517257690429688, "global_step": 292781, "epoch": 3527} {"train_loss": -25.94037437438965, "global_step": 292782, "epoch": 3527} {"train_loss": -25.966567993164062, "global_step": 292783, "epoch": 3527} {"train_loss": -25.19154167175293, "global_step": 292784, "epoch": 3527} {"train_loss": -25.676969528198242, "global_step": 292785, "epoch": 3527} {"train_loss": -25.73697280883789, "global_step": 292786, "epoch": 3527} {"train_loss": -25.827550888061523, "global_step": 292787, "epoch": 3527} {"train_loss": -25.608930587768555, "global_step": 292788, "epoch": 3527} {"train_loss": -25.529481887817383, "global_step": 292789, "epoch": 3527} {"train_loss": -26.082983016967773, "global_step": 292790, "epoch": 3527} {"train_loss": -25.638532638549805, "global_step": 292791, "epoch": 3527} {"train_loss": -25.87017822265625, "global_step": 292792, "epoch": 3527} {"train_loss": -25.717304229736328, "global_step": 292793, "epoch": 3527} {"train_loss": -25.61310386657715, "global_step": 292794, "epoch": 3527} {"train_loss": -25.398527145385742, "global_step": 292795, "epoch": 3527} {"train_loss": -25.67049217224121, "global_step": 292796, "epoch": 3527} {"train_loss": -25.21657371520996, "global_step": 292797, "epoch": 3527} {"train_loss": -25.575286865234375, "global_step": 292798, "epoch": 3527} {"train_loss": -25.574514389038086, "global_step": 292799, "epoch": 3527} {"train_loss": -25.985126495361328, "global_step": 292800, "epoch": 3527} {"train_loss": -25.536163330078125, "global_step": 292801, "epoch": 3527} {"train_loss": -25.100006103515625, "global_step": 292802, "epoch": 3527} {"train_loss": -24.851289749145508, "global_step": 292803, "epoch": 3527} {"train_loss": -25.144765853881836, "global_step": 292804, "epoch": 3527} {"train_loss": -25.626501083374023, "global_step": 292805, "epoch": 3527} {"train_loss": -25.657331466674805, "global_step": 292806, "epoch": 3527} {"train_loss": -25.926105499267578, "global_step": 292807, "epoch": 3527} {"train_loss": -25.26425552368164, "global_step": 292808, "epoch": 3527} {"train_loss": -25.406402587890625, "global_step": 292809, "epoch": 3527} {"train_loss": -25.170677185058594, "global_step": 292810, "epoch": 3527} {"train_loss": -25.314966201782227, "global_step": 292811, "epoch": 3527} {"train_loss": -25.181623458862305, "global_step": 292812, "epoch": 3527} {"train_loss": -25.420467376708984, "global_step": 292813, "epoch": 3527} {"train_loss": -25.642642974853516, "global_step": 292814, "epoch": 3527} {"train_loss": -25.465600967407227, "global_step": 292815, "epoch": 3527} {"train_loss": -25.718305587768555, "global_step": 292816, "epoch": 3527} {"train_loss": -25.25589370727539, "global_step": 292817, "epoch": 3527} {"train_loss": -25.377119064331055, "global_step": 292818, "epoch": 3527} {"train_loss": -25.73604393005371, "global_step": 292819, "epoch": 3527} {"train_loss": -25.202693939208984, "global_step": 292820, "epoch": 3527} {"train_loss": -25.31955337524414, "global_step": 292821, "epoch": 3527} {"train_loss": -25.93147087097168, "global_step": 292822, "epoch": 3527} {"train_loss": -25.375458315194372, "global_step": 292823, "epoch": 3527, "val_loss": 7119238.5} {"train_loss": -24.598520278930664, "global_step": 292824, "epoch": 3528} {"train_loss": -25.049545288085938, "global_step": 292825, "epoch": 3528} {"train_loss": -25.14419937133789, "global_step": 292826, "epoch": 3528} {"train_loss": -24.980806350708008, "global_step": 292827, "epoch": 3528} {"train_loss": -24.681116104125977, "global_step": 292828, "epoch": 3528} {"train_loss": -25.0288143157959, "global_step": 292829, "epoch": 3528} {"train_loss": -24.96974754333496, "global_step": 292830, "epoch": 3528} {"train_loss": -25.18405532836914, "global_step": 292831, "epoch": 3528} {"train_loss": -25.252460479736328, "global_step": 292832, "epoch": 3528} {"train_loss": -25.233549118041992, "global_step": 292833, "epoch": 3528} {"train_loss": -25.100528717041016, "global_step": 292834, "epoch": 3528} {"train_loss": -25.302154541015625, "global_step": 292835, "epoch": 3528} {"train_loss": -25.313404083251953, "global_step": 292836, "epoch": 3528} {"train_loss": -25.118133544921875, "global_step": 292837, "epoch": 3528} {"train_loss": -25.452430725097656, "global_step": 292838, "epoch": 3528} {"train_loss": -25.734466552734375, "global_step": 292839, "epoch": 3528} {"train_loss": -25.20716667175293, "global_step": 292840, "epoch": 3528} {"train_loss": -25.382537841796875, "global_step": 292841, "epoch": 3528} {"train_loss": -25.259017944335938, "global_step": 292842, "epoch": 3528} {"train_loss": -25.287113189697266, "global_step": 292843, "epoch": 3528} {"train_loss": -25.39701271057129, "global_step": 292844, "epoch": 3528} {"train_loss": -25.177017211914062, "global_step": 292845, "epoch": 3528} {"train_loss": -25.433115005493164, "global_step": 292846, "epoch": 3528} {"train_loss": -25.214834213256836, "global_step": 292847, "epoch": 3528} {"train_loss": -25.27708625793457, "global_step": 292848, "epoch": 3528} {"train_loss": -25.6723575592041, "global_step": 292849, "epoch": 3528} {"train_loss": -25.297250747680664, "global_step": 292850, "epoch": 3528} {"train_loss": -25.45438003540039, "global_step": 292851, "epoch": 3528} {"train_loss": -25.5958309173584, "global_step": 292852, "epoch": 3528} {"train_loss": -25.833724975585938, "global_step": 292853, "epoch": 3528} {"train_loss": -25.69645118713379, "global_step": 292854, "epoch": 3528} {"train_loss": -25.511295318603516, "global_step": 292855, "epoch": 3528} {"train_loss": -25.543787002563477, "global_step": 292856, "epoch": 3528} {"train_loss": -25.723312377929688, "global_step": 292857, "epoch": 3528} {"train_loss": -25.618701934814453, "global_step": 292858, "epoch": 3528} {"train_loss": -25.60715675354004, "global_step": 292859, "epoch": 3528} {"train_loss": -25.92232322692871, "global_step": 292860, "epoch": 3528} {"train_loss": -25.655746459960938, "global_step": 292861, "epoch": 3528} {"train_loss": -25.841718673706055, "global_step": 292862, "epoch": 3528} {"train_loss": -25.892688751220703, "global_step": 292863, "epoch": 3528} {"train_loss": -25.767105102539062, "global_step": 292864, "epoch": 3528} {"train_loss": -25.919729232788086, "global_step": 292865, "epoch": 3528} {"train_loss": -25.825361251831055, "global_step": 292866, "epoch": 3528} {"train_loss": -25.723129272460938, "global_step": 292867, "epoch": 3528} {"train_loss": -25.66583824157715, "global_step": 292868, "epoch": 3528} {"train_loss": -25.371767044067383, "global_step": 292869, "epoch": 3528} {"train_loss": -25.36934471130371, "global_step": 292870, "epoch": 3528} {"train_loss": -25.779382705688477, "global_step": 292871, "epoch": 3528} {"train_loss": -25.808258056640625, "global_step": 292872, "epoch": 3528} {"train_loss": -25.59266471862793, "global_step": 292873, "epoch": 3528} {"train_loss": -25.467016220092773, "global_step": 292874, "epoch": 3528} {"train_loss": -25.586341857910156, "global_step": 292875, "epoch": 3528} {"train_loss": -25.51593589782715, "global_step": 292876, "epoch": 3528} {"train_loss": -25.78714370727539, "global_step": 292877, "epoch": 3528} {"train_loss": -25.6119441986084, "global_step": 292878, "epoch": 3528} {"train_loss": -25.954776763916016, "global_step": 292879, "epoch": 3528} {"train_loss": -25.7520694732666, "global_step": 292880, "epoch": 3528} {"train_loss": -25.264537811279297, "global_step": 292881, "epoch": 3528} {"train_loss": -24.53419303894043, "global_step": 292882, "epoch": 3528} {"train_loss": -24.3475341796875, "global_step": 292883, "epoch": 3528} {"train_loss": -25.162805557250977, "global_step": 292884, "epoch": 3528} {"train_loss": -25.181028366088867, "global_step": 292885, "epoch": 3528} {"train_loss": -24.766883850097656, "global_step": 292886, "epoch": 3528} {"train_loss": -24.792837142944336, "global_step": 292887, "epoch": 3528} {"train_loss": -25.65862464904785, "global_step": 292888, "epoch": 3528} {"train_loss": -24.966585159301758, "global_step": 292889, "epoch": 3528} {"train_loss": -25.044876098632812, "global_step": 292890, "epoch": 3528} {"train_loss": -26.056339263916016, "global_step": 292891, "epoch": 3528} {"train_loss": -24.805770874023438, "global_step": 292892, "epoch": 3528} {"train_loss": -25.703886032104492, "global_step": 292893, "epoch": 3528} {"train_loss": -25.13038444519043, "global_step": 292894, "epoch": 3528} {"train_loss": -25.61525535583496, "global_step": 292895, "epoch": 3528} {"train_loss": -24.98130226135254, "global_step": 292896, "epoch": 3528} {"train_loss": -25.41363525390625, "global_step": 292897, "epoch": 3528} {"train_loss": -25.16086769104004, "global_step": 292898, "epoch": 3528} {"train_loss": -25.578292846679688, "global_step": 292899, "epoch": 3528} {"train_loss": -25.31244468688965, "global_step": 292900, "epoch": 3528} {"train_loss": -25.7346248626709, "global_step": 292901, "epoch": 3528} {"train_loss": -25.21230697631836, "global_step": 292902, "epoch": 3528} {"train_loss": -25.391958236694336, "global_step": 292903, "epoch": 3528} {"train_loss": -25.317838668823242, "global_step": 292904, "epoch": 3528} {"train_loss": -25.50813102722168, "global_step": 292905, "epoch": 3528} {"train_loss": -25.37018624271255, "global_step": 292906, "epoch": 3528, "val_loss": 7065993.0} {"train_loss": -25.6751766204834, "global_step": 292907, "epoch": 3529} {"train_loss": -25.354114532470703, "global_step": 292908, "epoch": 3529} {"train_loss": -25.501890182495117, "global_step": 292909, "epoch": 3529} {"train_loss": -25.74945068359375, "global_step": 292910, "epoch": 3529} {"train_loss": -26.13140869140625, "global_step": 292911, "epoch": 3529} {"train_loss": -25.32491111755371, "global_step": 292912, "epoch": 3529} {"train_loss": -25.677030563354492, "global_step": 292913, "epoch": 3529} {"train_loss": -25.738998413085938, "global_step": 292914, "epoch": 3529} {"train_loss": -25.325117111206055, "global_step": 292915, "epoch": 3529} {"train_loss": -25.472623825073242, "global_step": 292916, "epoch": 3529} {"train_loss": -25.392379760742188, "global_step": 292917, "epoch": 3529} {"train_loss": -25.38197898864746, "global_step": 292918, "epoch": 3529} {"train_loss": -25.531896591186523, "global_step": 292919, "epoch": 3529} {"train_loss": -25.07379150390625, "global_step": 292920, "epoch": 3529} {"train_loss": -25.640241622924805, "global_step": 292921, "epoch": 3529} {"train_loss": -25.591821670532227, "global_step": 292922, "epoch": 3529} {"train_loss": -25.708393096923828, "global_step": 292923, "epoch": 3529} {"train_loss": -25.568836212158203, "global_step": 292924, "epoch": 3529} {"train_loss": -25.415546417236328, "global_step": 292925, "epoch": 3529} {"train_loss": -25.619903564453125, "global_step": 292926, "epoch": 3529} {"train_loss": -25.529794692993164, "global_step": 292927, "epoch": 3529} {"train_loss": -25.703144073486328, "global_step": 292928, "epoch": 3529} {"train_loss": -25.387741088867188, "global_step": 292929, "epoch": 3529} {"train_loss": -25.565807342529297, "global_step": 292930, "epoch": 3529} {"train_loss": -25.51987075805664, "global_step": 292931, "epoch": 3529} {"train_loss": -25.369665145874023, "global_step": 292932, "epoch": 3529} {"train_loss": -25.373891830444336, "global_step": 292933, "epoch": 3529} {"train_loss": -25.63962745666504, "global_step": 292934, "epoch": 3529} {"train_loss": -25.271093368530273, "global_step": 292935, "epoch": 3529} {"train_loss": -25.52069664001465, "global_step": 292936, "epoch": 3529} {"train_loss": -25.51920509338379, "global_step": 292937, "epoch": 3529} {"train_loss": -25.22126579284668, "global_step": 292938, "epoch": 3529} {"train_loss": -25.66058349609375, "global_step": 292939, "epoch": 3529} {"train_loss": -25.50745964050293, "global_step": 292940, "epoch": 3529} {"train_loss": -25.712188720703125, "global_step": 292941, "epoch": 3529} {"train_loss": -25.224531173706055, "global_step": 292942, "epoch": 3529} {"train_loss": -25.599287033081055, "global_step": 292943, "epoch": 3529} {"train_loss": -25.499584197998047, "global_step": 292944, "epoch": 3529} {"train_loss": -25.45253562927246, "global_step": 292945, "epoch": 3529} {"train_loss": -25.244779586791992, "global_step": 292946, "epoch": 3529} {"train_loss": -25.20703125, "global_step": 292947, "epoch": 3529} {"train_loss": -25.42160987854004, "global_step": 292948, "epoch": 3529} {"train_loss": -25.54847526550293, "global_step": 292949, "epoch": 3529} {"train_loss": -25.8676700592041, "global_step": 292950, "epoch": 3529} {"train_loss": -25.83049964904785, "global_step": 292951, "epoch": 3529} {"train_loss": -25.630889892578125, "global_step": 292952, "epoch": 3529} {"train_loss": -25.28529167175293, "global_step": 292953, "epoch": 3529} {"train_loss": -25.392175674438477, "global_step": 292954, "epoch": 3529} {"train_loss": -25.523630142211914, "global_step": 292955, "epoch": 3529} {"train_loss": -25.692834854125977, "global_step": 292956, "epoch": 3529} {"train_loss": -25.88986587524414, "global_step": 292957, "epoch": 3529} {"train_loss": -25.518564224243164, "global_step": 292958, "epoch": 3529} {"train_loss": -25.37652587890625, "global_step": 292959, "epoch": 3529} {"train_loss": -25.88175392150879, "global_step": 292960, "epoch": 3529} {"train_loss": -25.8299560546875, "global_step": 292961, "epoch": 3529} {"train_loss": -25.710920333862305, "global_step": 292962, "epoch": 3529} {"train_loss": -25.759504318237305, "global_step": 292963, "epoch": 3529} {"train_loss": -25.40394401550293, "global_step": 292964, "epoch": 3529} {"train_loss": -25.731740951538086, "global_step": 292965, "epoch": 3529} {"train_loss": -25.842870712280273, "global_step": 292966, "epoch": 3529} {"train_loss": -25.245630264282227, "global_step": 292967, "epoch": 3529} {"train_loss": -25.541738510131836, "global_step": 292968, "epoch": 3529} {"train_loss": -25.49673080444336, "global_step": 292969, "epoch": 3529} {"train_loss": -25.528322219848633, "global_step": 292970, "epoch": 3529} {"train_loss": -25.533740997314453, "global_step": 292971, "epoch": 3529} {"train_loss": -25.774927139282227, "global_step": 292972, "epoch": 3529} {"train_loss": -26.14975929260254, "global_step": 292973, "epoch": 3529} {"train_loss": -25.7204647064209, "global_step": 292974, "epoch": 3529} {"train_loss": -25.507793426513672, "global_step": 292975, "epoch": 3529} {"train_loss": -25.341337203979492, "global_step": 292976, "epoch": 3529} {"train_loss": -25.75384521484375, "global_step": 292977, "epoch": 3529} {"train_loss": -25.719669342041016, "global_step": 292978, "epoch": 3529} {"train_loss": -25.200111389160156, "global_step": 292979, "epoch": 3529} {"train_loss": -25.707197189331055, "global_step": 292980, "epoch": 3529} {"train_loss": -25.6023006439209, "global_step": 292981, "epoch": 3529} {"train_loss": -25.44697380065918, "global_step": 292982, "epoch": 3529} {"train_loss": -25.766523361206055, "global_step": 292983, "epoch": 3529} {"train_loss": -25.758106231689453, "global_step": 292984, "epoch": 3529} {"train_loss": -25.62479591369629, "global_step": 292985, "epoch": 3529} {"train_loss": -25.733753204345703, "global_step": 292986, "epoch": 3529} {"train_loss": -25.557872772216797, "global_step": 292987, "epoch": 3529} {"train_loss": -25.830183029174805, "global_step": 292988, "epoch": 3529} {"train_loss": -25.537029978740645, "global_step": 292989, "epoch": 3529, "val_loss": 7212227.0} {"train_loss": -25.376794815063477, "global_step": 292990, "epoch": 3530} {"train_loss": -24.911884307861328, "global_step": 292991, "epoch": 3530} {"train_loss": -25.302087783813477, "global_step": 292992, "epoch": 3530} {"train_loss": -25.13959312438965, "global_step": 292993, "epoch": 3530} {"train_loss": -24.92770767211914, "global_step": 292994, "epoch": 3530} {"train_loss": -25.2329158782959, "global_step": 292995, "epoch": 3530} {"train_loss": -25.079252243041992, "global_step": 292996, "epoch": 3530} {"train_loss": -25.309066772460938, "global_step": 292997, "epoch": 3530} {"train_loss": -25.221342086791992, "global_step": 292998, "epoch": 3530} {"train_loss": -25.48784828186035, "global_step": 292999, "epoch": 3530} {"train_loss": -25.504199981689453, "global_step": 293000, "epoch": 3530} {"train_loss": -25.803634643554688, "global_step": 293001, "epoch": 3530} {"train_loss": -25.371042251586914, "global_step": 293002, "epoch": 3530} {"train_loss": -25.418193817138672, "global_step": 293003, "epoch": 3530} {"train_loss": -25.301193237304688, "global_step": 293004, "epoch": 3530} {"train_loss": -25.29668617248535, "global_step": 293005, "epoch": 3530} {"train_loss": -25.451013565063477, "global_step": 293006, "epoch": 3530} {"train_loss": -25.366640090942383, "global_step": 293007, "epoch": 3530} {"train_loss": -24.955236434936523, "global_step": 293008, "epoch": 3530} {"train_loss": -25.284439086914062, "global_step": 293009, "epoch": 3530} {"train_loss": -25.365459442138672, "global_step": 293010, "epoch": 3530} {"train_loss": -25.19000244140625, "global_step": 293011, "epoch": 3530} {"train_loss": -25.17917251586914, "global_step": 293012, "epoch": 3530} {"train_loss": -25.642200469970703, "global_step": 293013, "epoch": 3530} {"train_loss": -25.395904541015625, "global_step": 293014, "epoch": 3530} {"train_loss": -25.50577163696289, "global_step": 293015, "epoch": 3530} {"train_loss": -25.00822639465332, "global_step": 293016, "epoch": 3530} {"train_loss": -25.187314987182617, "global_step": 293017, "epoch": 3530} {"train_loss": -25.164167404174805, "global_step": 293018, "epoch": 3530} {"train_loss": -24.77068328857422, "global_step": 293019, "epoch": 3530} {"train_loss": -25.21556282043457, "global_step": 293020, "epoch": 3530} {"train_loss": -25.47986602783203, "global_step": 293021, "epoch": 3530} {"train_loss": -25.798120498657227, "global_step": 293022, "epoch": 3530} {"train_loss": -25.68787956237793, "global_step": 293023, "epoch": 3530} {"train_loss": -25.520891189575195, "global_step": 293024, "epoch": 3530} {"train_loss": -25.183639526367188, "global_step": 293025, "epoch": 3530} {"train_loss": -25.584007263183594, "global_step": 293026, "epoch": 3530} {"train_loss": -25.367055892944336, "global_step": 293027, "epoch": 3530} {"train_loss": -25.5546932220459, "global_step": 293028, "epoch": 3530} {"train_loss": -25.17665672302246, "global_step": 293029, "epoch": 3530} {"train_loss": -25.72194480895996, "global_step": 293030, "epoch": 3530} {"train_loss": -25.557937622070312, "global_step": 293031, "epoch": 3530} {"train_loss": -25.814428329467773, "global_step": 293032, "epoch": 3530} {"train_loss": -25.881189346313477, "global_step": 293033, "epoch": 3530} {"train_loss": -25.569799423217773, "global_step": 293034, "epoch": 3530} {"train_loss": -25.39714813232422, "global_step": 293035, "epoch": 3530} {"train_loss": -25.555633544921875, "global_step": 293036, "epoch": 3530} {"train_loss": -25.279541015625, "global_step": 293037, "epoch": 3530} {"train_loss": -25.66059684753418, "global_step": 293038, "epoch": 3530} {"train_loss": -25.47981071472168, "global_step": 293039, "epoch": 3530} {"train_loss": -25.48683738708496, "global_step": 293040, "epoch": 3530} {"train_loss": -25.796833038330078, "global_step": 293041, "epoch": 3530} {"train_loss": -25.76740074157715, "global_step": 293042, "epoch": 3530} {"train_loss": -25.683002471923828, "global_step": 293043, "epoch": 3530} {"train_loss": -25.417556762695312, "global_step": 293044, "epoch": 3530} {"train_loss": -25.769575119018555, "global_step": 293045, "epoch": 3530} {"train_loss": -25.803430557250977, "global_step": 293046, "epoch": 3530} {"train_loss": -25.40995216369629, "global_step": 293047, "epoch": 3530} {"train_loss": -25.80375099182129, "global_step": 293048, "epoch": 3530} {"train_loss": -25.6320743560791, "global_step": 293049, "epoch": 3530} {"train_loss": -25.751245498657227, "global_step": 293050, "epoch": 3530} {"train_loss": -25.609262466430664, "global_step": 293051, "epoch": 3530} {"train_loss": -25.762451171875, "global_step": 293052, "epoch": 3530} {"train_loss": -25.556167602539062, "global_step": 293053, "epoch": 3530} {"train_loss": -25.388545989990234, "global_step": 293054, "epoch": 3530} {"train_loss": -25.40142822265625, "global_step": 293055, "epoch": 3530} {"train_loss": -25.682584762573242, "global_step": 293056, "epoch": 3530} {"train_loss": -25.195688247680664, "global_step": 293057, "epoch": 3530} {"train_loss": -25.194852828979492, "global_step": 293058, "epoch": 3530} {"train_loss": -25.802026748657227, "global_step": 293059, "epoch": 3530} {"train_loss": -25.32587242126465, "global_step": 293060, "epoch": 3530} {"train_loss": -25.40232276916504, "global_step": 293061, "epoch": 3530} {"train_loss": -25.936338424682617, "global_step": 293062, "epoch": 3530} {"train_loss": -25.48440170288086, "global_step": 293063, "epoch": 3530} {"train_loss": -25.092212677001953, "global_step": 293064, "epoch": 3530} {"train_loss": -25.19904136657715, "global_step": 293065, "epoch": 3530} {"train_loss": -25.42738914489746, "global_step": 293066, "epoch": 3530} {"train_loss": -25.444860458374023, "global_step": 293067, "epoch": 3530} {"train_loss": -25.437944412231445, "global_step": 293068, "epoch": 3530} {"train_loss": -25.342832565307617, "global_step": 293069, "epoch": 3530} {"train_loss": -25.3541202545166, "global_step": 293070, "epoch": 3530} {"train_loss": -25.44777488708496, "global_step": 293071, "epoch": 3530} {"train_loss": -25.456060846167876, "global_step": 293072, "epoch": 3530, "val_loss": 7195227.0} {"train_loss": -25.151987075805664, "global_step": 293073, "epoch": 3531} {"train_loss": -25.307491302490234, "global_step": 293074, "epoch": 3531} {"train_loss": -25.492399215698242, "global_step": 293075, "epoch": 3531} {"train_loss": -25.527421951293945, "global_step": 293076, "epoch": 3531} {"train_loss": -25.385061264038086, "global_step": 293077, "epoch": 3531} {"train_loss": -25.17226219177246, "global_step": 293078, "epoch": 3531} {"train_loss": -25.518726348876953, "global_step": 293079, "epoch": 3531} {"train_loss": -25.430891036987305, "global_step": 293080, "epoch": 3531} {"train_loss": -25.326467514038086, "global_step": 293081, "epoch": 3531} {"train_loss": -25.620878219604492, "global_step": 293082, "epoch": 3531} {"train_loss": -25.65093994140625, "global_step": 293083, "epoch": 3531} {"train_loss": -25.724645614624023, "global_step": 293084, "epoch": 3531} {"train_loss": -25.559619903564453, "global_step": 293085, "epoch": 3531} {"train_loss": -25.433523178100586, "global_step": 293086, "epoch": 3531} {"train_loss": -25.216571807861328, "global_step": 293087, "epoch": 3531} {"train_loss": -25.668869018554688, "global_step": 293088, "epoch": 3531} {"train_loss": -25.707778930664062, "global_step": 293089, "epoch": 3531} {"train_loss": -25.88079261779785, "global_step": 293090, "epoch": 3531} {"train_loss": -25.820209503173828, "global_step": 293091, "epoch": 3531} {"train_loss": -25.12538719177246, "global_step": 293092, "epoch": 3531} {"train_loss": -25.77924156188965, "global_step": 293093, "epoch": 3531} {"train_loss": -25.27129364013672, "global_step": 293094, "epoch": 3531} {"train_loss": -25.552404403686523, "global_step": 293095, "epoch": 3531} {"train_loss": -25.121633529663086, "global_step": 293096, "epoch": 3531} {"train_loss": -25.590543746948242, "global_step": 293097, "epoch": 3531} {"train_loss": -25.812589645385742, "global_step": 293098, "epoch": 3531} {"train_loss": -25.555959701538086, "global_step": 293099, "epoch": 3531} {"train_loss": -25.6274471282959, "global_step": 293100, "epoch": 3531} {"train_loss": -25.33424949645996, "global_step": 293101, "epoch": 3531} {"train_loss": -25.393400192260742, "global_step": 293102, "epoch": 3531} {"train_loss": -25.8166561126709, "global_step": 293103, "epoch": 3531} {"train_loss": -24.97698402404785, "global_step": 293104, "epoch": 3531} {"train_loss": -25.41678237915039, "global_step": 293105, "epoch": 3531} {"train_loss": -25.537246704101562, "global_step": 293106, "epoch": 3531} {"train_loss": -25.561613082885742, "global_step": 293107, "epoch": 3531} {"train_loss": -25.518936157226562, "global_step": 293108, "epoch": 3531} {"train_loss": -25.65596580505371, "global_step": 293109, "epoch": 3531} {"train_loss": -25.815948486328125, "global_step": 293110, "epoch": 3531} {"train_loss": -25.788806915283203, "global_step": 293111, "epoch": 3531} {"train_loss": -25.731353759765625, "global_step": 293112, "epoch": 3531} {"train_loss": -25.322946548461914, "global_step": 293113, "epoch": 3531} {"train_loss": -25.3770694732666, "global_step": 293114, "epoch": 3531} {"train_loss": -25.383041381835938, "global_step": 293115, "epoch": 3531} {"train_loss": -25.882482528686523, "global_step": 293116, "epoch": 3531} {"train_loss": -25.807233810424805, "global_step": 293117, "epoch": 3531} {"train_loss": -25.760095596313477, "global_step": 293118, "epoch": 3531} {"train_loss": -25.43168067932129, "global_step": 293119, "epoch": 3531} {"train_loss": -25.927900314331055, "global_step": 293120, "epoch": 3531} {"train_loss": -25.96669578552246, "global_step": 293121, "epoch": 3531} {"train_loss": -25.640867233276367, "global_step": 293122, "epoch": 3531} {"train_loss": -25.71170425415039, "global_step": 293123, "epoch": 3531} {"train_loss": -25.749921798706055, "global_step": 293124, "epoch": 3531} {"train_loss": -25.69046974182129, "global_step": 293125, "epoch": 3531} {"train_loss": -25.574865341186523, "global_step": 293126, "epoch": 3531} {"train_loss": -25.324947357177734, "global_step": 293127, "epoch": 3531} {"train_loss": -25.647619247436523, "global_step": 293128, "epoch": 3531} {"train_loss": -25.565032958984375, "global_step": 293129, "epoch": 3531} {"train_loss": -25.30533218383789, "global_step": 293130, "epoch": 3531} {"train_loss": -25.536012649536133, "global_step": 293131, "epoch": 3531} {"train_loss": -25.16413688659668, "global_step": 293132, "epoch": 3531} {"train_loss": -24.491865158081055, "global_step": 293133, "epoch": 3531} {"train_loss": -24.24924659729004, "global_step": 293134, "epoch": 3531} {"train_loss": -24.903234481811523, "global_step": 293135, "epoch": 3531} {"train_loss": -25.615407943725586, "global_step": 293136, "epoch": 3531} {"train_loss": -25.20966911315918, "global_step": 293137, "epoch": 3531} {"train_loss": -25.438810348510742, "global_step": 293138, "epoch": 3531} {"train_loss": -25.278532028198242, "global_step": 293139, "epoch": 3531} {"train_loss": -25.24641990661621, "global_step": 293140, "epoch": 3531} {"train_loss": -25.626840591430664, "global_step": 293141, "epoch": 3531} {"train_loss": -25.66742515563965, "global_step": 293142, "epoch": 3531} {"train_loss": -25.463735580444336, "global_step": 293143, "epoch": 3531} {"train_loss": -25.535388946533203, "global_step": 293144, "epoch": 3531} {"train_loss": -25.508834838867188, "global_step": 293145, "epoch": 3531} {"train_loss": -24.711469650268555, "global_step": 293146, "epoch": 3531} {"train_loss": -25.2822322845459, "global_step": 293147, "epoch": 3531} {"train_loss": -25.322750091552734, "global_step": 293148, "epoch": 3531} {"train_loss": -25.76857566833496, "global_step": 293149, "epoch": 3531} {"train_loss": -25.74082374572754, "global_step": 293150, "epoch": 3531} {"train_loss": -25.263212203979492, "global_step": 293151, "epoch": 3531} {"train_loss": -25.172372817993164, "global_step": 293152, "epoch": 3531} {"train_loss": -25.342605590820312, "global_step": 293153, "epoch": 3531} {"train_loss": -25.706729888916016, "global_step": 293154, "epoch": 3531} {"train_loss": -25.48655215803399, "global_step": 293155, "epoch": 3531, "val_loss": 7182717.0} {"train_loss": -25.143156051635742, "global_step": 293156, "epoch": 3532} {"train_loss": -25.106739044189453, "global_step": 293157, "epoch": 3532} {"train_loss": -25.191801071166992, "global_step": 293158, "epoch": 3532} {"train_loss": -25.260238647460938, "global_step": 293159, "epoch": 3532} {"train_loss": -24.948965072631836, "global_step": 293160, "epoch": 3532} {"train_loss": -25.57057762145996, "global_step": 293161, "epoch": 3532} {"train_loss": -25.640640258789062, "global_step": 293162, "epoch": 3532} {"train_loss": -25.010746002197266, "global_step": 293163, "epoch": 3532} {"train_loss": -25.549001693725586, "global_step": 293164, "epoch": 3532} {"train_loss": -24.883481979370117, "global_step": 293165, "epoch": 3532} {"train_loss": -25.559377670288086, "global_step": 293166, "epoch": 3532} {"train_loss": -25.210779190063477, "global_step": 293167, "epoch": 3532} {"train_loss": -25.580995559692383, "global_step": 293168, "epoch": 3532} {"train_loss": -25.396888732910156, "global_step": 293169, "epoch": 3532} {"train_loss": -25.53955841064453, "global_step": 293170, "epoch": 3532} {"train_loss": -25.312931060791016, "global_step": 293171, "epoch": 3532} {"train_loss": -25.355398178100586, "global_step": 293172, "epoch": 3532} {"train_loss": -25.107168197631836, "global_step": 293173, "epoch": 3532} {"train_loss": -25.57452964782715, "global_step": 293174, "epoch": 3532} {"train_loss": -25.41254997253418, "global_step": 293175, "epoch": 3532} {"train_loss": -25.774250030517578, "global_step": 293176, "epoch": 3532} {"train_loss": -25.51141929626465, "global_step": 293177, "epoch": 3532} {"train_loss": -25.693342208862305, "global_step": 293178, "epoch": 3532} {"train_loss": -25.3956356048584, "global_step": 293179, "epoch": 3532} {"train_loss": -25.558277130126953, "global_step": 293180, "epoch": 3532} {"train_loss": -25.25894546508789, "global_step": 293181, "epoch": 3532} {"train_loss": -26.015411376953125, "global_step": 293182, "epoch": 3532} {"train_loss": -25.516162872314453, "global_step": 293183, "epoch": 3532} {"train_loss": -25.327653884887695, "global_step": 293184, "epoch": 3532} {"train_loss": -25.230478286743164, "global_step": 293185, "epoch": 3532} {"train_loss": -25.433622360229492, "global_step": 293186, "epoch": 3532} {"train_loss": -25.460012435913086, "global_step": 293187, "epoch": 3532} {"train_loss": -25.386951446533203, "global_step": 293188, "epoch": 3532} {"train_loss": -25.465702056884766, "global_step": 293189, "epoch": 3532} {"train_loss": -25.38579750061035, "global_step": 293190, "epoch": 3532} {"train_loss": -25.61115074157715, "global_step": 293191, "epoch": 3532} {"train_loss": -25.328947067260742, "global_step": 293192, "epoch": 3532} {"train_loss": -25.790283203125, "global_step": 293193, "epoch": 3532} {"train_loss": -25.511953353881836, "global_step": 293194, "epoch": 3532} {"train_loss": -25.359556198120117, "global_step": 293195, "epoch": 3532} {"train_loss": -25.243595123291016, "global_step": 293196, "epoch": 3532} {"train_loss": -25.87160301208496, "global_step": 293197, "epoch": 3532} {"train_loss": -25.755695343017578, "global_step": 293198, "epoch": 3532} {"train_loss": -25.530641555786133, "global_step": 293199, "epoch": 3532} {"train_loss": -25.4399471282959, "global_step": 293200, "epoch": 3532} {"train_loss": -25.775190353393555, "global_step": 293201, "epoch": 3532} {"train_loss": -25.2973690032959, "global_step": 293202, "epoch": 3532} {"train_loss": -25.556140899658203, "global_step": 293203, "epoch": 3532} {"train_loss": -25.591577529907227, "global_step": 293204, "epoch": 3532} {"train_loss": -25.643136978149414, "global_step": 293205, "epoch": 3532} {"train_loss": -25.582778930664062, "global_step": 293206, "epoch": 3532} {"train_loss": -25.268056869506836, "global_step": 293207, "epoch": 3532} {"train_loss": -25.549283981323242, "global_step": 293208, "epoch": 3532} {"train_loss": -25.849618911743164, "global_step": 293209, "epoch": 3532} {"train_loss": -25.59700584411621, "global_step": 293210, "epoch": 3532} {"train_loss": -25.06471061706543, "global_step": 293211, "epoch": 3532} {"train_loss": -25.78107261657715, "global_step": 293212, "epoch": 3532} {"train_loss": -25.478317260742188, "global_step": 293213, "epoch": 3532} {"train_loss": -25.618606567382812, "global_step": 293214, "epoch": 3532} {"train_loss": -25.624820709228516, "global_step": 293215, "epoch": 3532} {"train_loss": -25.587615966796875, "global_step": 293216, "epoch": 3532} {"train_loss": -26.24875259399414, "global_step": 293217, "epoch": 3532} {"train_loss": -26.034692764282227, "global_step": 293218, "epoch": 3532} {"train_loss": -25.82175064086914, "global_step": 293219, "epoch": 3532} {"train_loss": -25.806610107421875, "global_step": 293220, "epoch": 3532} {"train_loss": -25.616809844970703, "global_step": 293221, "epoch": 3532} {"train_loss": -25.654340744018555, "global_step": 293222, "epoch": 3532} {"train_loss": -25.430870056152344, "global_step": 293223, "epoch": 3532} {"train_loss": -25.80167579650879, "global_step": 293224, "epoch": 3532} {"train_loss": -25.71771240234375, "global_step": 293225, "epoch": 3532} {"train_loss": -25.673938751220703, "global_step": 293226, "epoch": 3532} {"train_loss": -25.743274688720703, "global_step": 293227, "epoch": 3532} {"train_loss": -25.792160034179688, "global_step": 293228, "epoch": 3532} {"train_loss": -25.547061920166016, "global_step": 293229, "epoch": 3532} {"train_loss": -25.802515029907227, "global_step": 293230, "epoch": 3532} {"train_loss": -25.769315719604492, "global_step": 293231, "epoch": 3532} {"train_loss": -25.704986572265625, "global_step": 293232, "epoch": 3532} {"train_loss": -26.055606842041016, "global_step": 293233, "epoch": 3532} {"train_loss": -25.722131729125977, "global_step": 293234, "epoch": 3532} {"train_loss": -25.328462600708008, "global_step": 293235, "epoch": 3532} {"train_loss": -25.543106079101562, "global_step": 293236, "epoch": 3532} {"train_loss": -25.80450439453125, "global_step": 293237, "epoch": 3532} {"train_loss": -25.530439560671887, "global_step": 293238, "epoch": 3532, "val_loss": 7181558.5} {"train_loss": -24.99977684020996, "global_step": 293239, "epoch": 3533} {"train_loss": -23.861204147338867, "global_step": 293240, "epoch": 3533} {"train_loss": -24.264123916625977, "global_step": 293241, "epoch": 3533} {"train_loss": -25.03851890563965, "global_step": 293242, "epoch": 3533} {"train_loss": -24.795568466186523, "global_step": 293243, "epoch": 3533} {"train_loss": -24.789674758911133, "global_step": 293244, "epoch": 3533} {"train_loss": -25.431745529174805, "global_step": 293245, "epoch": 3533} {"train_loss": -25.26546287536621, "global_step": 293246, "epoch": 3533} {"train_loss": -25.232236862182617, "global_step": 293247, "epoch": 3533} {"train_loss": -25.26564598083496, "global_step": 293248, "epoch": 3533} {"train_loss": -25.217348098754883, "global_step": 293249, "epoch": 3533} {"train_loss": -25.108469009399414, "global_step": 293250, "epoch": 3533} {"train_loss": -25.30698013305664, "global_step": 293251, "epoch": 3533} {"train_loss": -25.30229949951172, "global_step": 293252, "epoch": 3533} {"train_loss": -25.079675674438477, "global_step": 293253, "epoch": 3533} {"train_loss": -25.485736846923828, "global_step": 293254, "epoch": 3533} {"train_loss": -25.380929946899414, "global_step": 293255, "epoch": 3533} {"train_loss": -25.290205001831055, "global_step": 293256, "epoch": 3533} {"train_loss": -25.405813217163086, "global_step": 293257, "epoch": 3533} {"train_loss": -24.987781524658203, "global_step": 293258, "epoch": 3533} {"train_loss": -25.412952423095703, "global_step": 293259, "epoch": 3533} {"train_loss": -25.378862380981445, "global_step": 293260, "epoch": 3533} {"train_loss": -25.740503311157227, "global_step": 293261, "epoch": 3533} {"train_loss": -25.68865394592285, "global_step": 293262, "epoch": 3533} {"train_loss": -25.400983810424805, "global_step": 293263, "epoch": 3533} {"train_loss": -25.783472061157227, "global_step": 293264, "epoch": 3533} {"train_loss": -26.068328857421875, "global_step": 293265, "epoch": 3533} {"train_loss": -25.628585815429688, "global_step": 293266, "epoch": 3533} {"train_loss": -25.85931968688965, "global_step": 293267, "epoch": 3533} {"train_loss": -25.659549713134766, "global_step": 293268, "epoch": 3533} {"train_loss": -25.72749900817871, "global_step": 293269, "epoch": 3533} {"train_loss": -25.737171173095703, "global_step": 293270, "epoch": 3533} {"train_loss": -25.883544921875, "global_step": 293271, "epoch": 3533} {"train_loss": -25.39978790283203, "global_step": 293272, "epoch": 3533} {"train_loss": -25.743087768554688, "global_step": 293273, "epoch": 3533} {"train_loss": -26.04303550720215, "global_step": 293274, "epoch": 3533} {"train_loss": -26.09712028503418, "global_step": 293275, "epoch": 3533} {"train_loss": -25.34908103942871, "global_step": 293276, "epoch": 3533} {"train_loss": -25.496105194091797, "global_step": 293277, "epoch": 3533} {"train_loss": -25.40488052368164, "global_step": 293278, "epoch": 3533} {"train_loss": -25.557037353515625, "global_step": 293279, "epoch": 3533} {"train_loss": -25.69178581237793, "global_step": 293280, "epoch": 3533} {"train_loss": -25.434621810913086, "global_step": 293281, "epoch": 3533} {"train_loss": -25.61008071899414, "global_step": 293282, "epoch": 3533} {"train_loss": -25.72772216796875, "global_step": 293283, "epoch": 3533} {"train_loss": -25.503612518310547, "global_step": 293284, "epoch": 3533} {"train_loss": -25.945026397705078, "global_step": 293285, "epoch": 3533} {"train_loss": -25.591806411743164, "global_step": 293286, "epoch": 3533} {"train_loss": -25.179306030273438, "global_step": 293287, "epoch": 3533} {"train_loss": -25.393056869506836, "global_step": 293288, "epoch": 3533} {"train_loss": -26.2702693939209, "global_step": 293289, "epoch": 3533} {"train_loss": -25.888675689697266, "global_step": 293290, "epoch": 3533} {"train_loss": -25.735553741455078, "global_step": 293291, "epoch": 3533} {"train_loss": -25.602069854736328, "global_step": 293292, "epoch": 3533} {"train_loss": -25.68017578125, "global_step": 293293, "epoch": 3533} {"train_loss": -25.603668212890625, "global_step": 293294, "epoch": 3533} {"train_loss": -25.351505279541016, "global_step": 293295, "epoch": 3533} {"train_loss": -24.736183166503906, "global_step": 293296, "epoch": 3533} {"train_loss": -24.025259017944336, "global_step": 293297, "epoch": 3533} {"train_loss": -23.89741325378418, "global_step": 293298, "epoch": 3533} {"train_loss": -24.975692749023438, "global_step": 293299, "epoch": 3533} {"train_loss": -25.515954971313477, "global_step": 293300, "epoch": 3533} {"train_loss": -24.823667526245117, "global_step": 293301, "epoch": 3533} {"train_loss": -25.308204650878906, "global_step": 293302, "epoch": 3533} {"train_loss": -25.652883529663086, "global_step": 293303, "epoch": 3533} {"train_loss": -25.555837631225586, "global_step": 293304, "epoch": 3533} {"train_loss": -25.357336044311523, "global_step": 293305, "epoch": 3533} {"train_loss": -25.339872360229492, "global_step": 293306, "epoch": 3533} {"train_loss": -25.427766799926758, "global_step": 293307, "epoch": 3533} {"train_loss": -25.323673248291016, "global_step": 293308, "epoch": 3533} {"train_loss": -25.428043365478516, "global_step": 293309, "epoch": 3533} {"train_loss": -25.250614166259766, "global_step": 293310, "epoch": 3533} {"train_loss": -25.326658248901367, "global_step": 293311, "epoch": 3533} {"train_loss": -25.272733688354492, "global_step": 293312, "epoch": 3533} {"train_loss": -25.129383087158203, "global_step": 293313, "epoch": 3533} {"train_loss": -25.277589797973633, "global_step": 293314, "epoch": 3533} {"train_loss": -25.48175811767578, "global_step": 293315, "epoch": 3533} {"train_loss": -25.337099075317383, "global_step": 293316, "epoch": 3533} {"train_loss": -25.452329635620117, "global_step": 293317, "epoch": 3533} {"train_loss": -25.153959274291992, "global_step": 293318, "epoch": 3533} {"train_loss": -25.651920318603516, "global_step": 293319, "epoch": 3533} {"train_loss": -25.072683334350586, "global_step": 293320, "epoch": 3533} {"train_loss": -25.36036319043263, "global_step": 293321, "epoch": 3533, "val_loss": 7094106.0} {"train_loss": -25.396259307861328, "global_step": 293322, "epoch": 3534} {"train_loss": -25.443340301513672, "global_step": 293323, "epoch": 3534} {"train_loss": -25.13191032409668, "global_step": 293324, "epoch": 3534} {"train_loss": -25.48932456970215, "global_step": 293325, "epoch": 3534} {"train_loss": -25.344472885131836, "global_step": 293326, "epoch": 3534} {"train_loss": -25.521732330322266, "global_step": 293327, "epoch": 3534} {"train_loss": -25.297840118408203, "global_step": 293328, "epoch": 3534} {"train_loss": -25.133419036865234, "global_step": 293329, "epoch": 3534} {"train_loss": -25.086538314819336, "global_step": 293330, "epoch": 3534} {"train_loss": -25.494565963745117, "global_step": 293331, "epoch": 3534} {"train_loss": -25.20650291442871, "global_step": 293332, "epoch": 3534} {"train_loss": -25.146970748901367, "global_step": 293333, "epoch": 3534} {"train_loss": -25.55494499206543, "global_step": 293334, "epoch": 3534} {"train_loss": -25.3387508392334, "global_step": 293335, "epoch": 3534} {"train_loss": -25.007131576538086, "global_step": 293336, "epoch": 3534} {"train_loss": -25.383146286010742, "global_step": 293337, "epoch": 3534} {"train_loss": -25.334308624267578, "global_step": 293338, "epoch": 3534} {"train_loss": -25.7856502532959, "global_step": 293339, "epoch": 3534} {"train_loss": -25.454599380493164, "global_step": 293340, "epoch": 3534} {"train_loss": -25.426870346069336, "global_step": 293341, "epoch": 3534} {"train_loss": -25.387798309326172, "global_step": 293342, "epoch": 3534} {"train_loss": -25.67416763305664, "global_step": 293343, "epoch": 3534} {"train_loss": -24.910625457763672, "global_step": 293344, "epoch": 3534} {"train_loss": -25.605300903320312, "global_step": 293345, "epoch": 3534} {"train_loss": -25.264225006103516, "global_step": 293346, "epoch": 3534} {"train_loss": -25.86113929748535, "global_step": 293347, "epoch": 3534} {"train_loss": -25.86244773864746, "global_step": 293348, "epoch": 3534} {"train_loss": -25.34779930114746, "global_step": 293349, "epoch": 3534} {"train_loss": -25.511310577392578, "global_step": 293350, "epoch": 3534} {"train_loss": -25.7320556640625, "global_step": 293351, "epoch": 3534} {"train_loss": -25.602888107299805, "global_step": 293352, "epoch": 3534} {"train_loss": -25.502273559570312, "global_step": 293353, "epoch": 3534} {"train_loss": -25.35770606994629, "global_step": 293354, "epoch": 3534} {"train_loss": -25.452316284179688, "global_step": 293355, "epoch": 3534} {"train_loss": -25.532485961914062, "global_step": 293356, "epoch": 3534} {"train_loss": -25.858596801757812, "global_step": 293357, "epoch": 3534} {"train_loss": -25.599143981933594, "global_step": 293358, "epoch": 3534} {"train_loss": -25.786725997924805, "global_step": 293359, "epoch": 3534} {"train_loss": -25.777149200439453, "global_step": 293360, "epoch": 3534} {"train_loss": -25.783899307250977, "global_step": 293361, "epoch": 3534} {"train_loss": -25.61781883239746, "global_step": 293362, "epoch": 3534} {"train_loss": -25.640750885009766, "global_step": 293363, "epoch": 3534} {"train_loss": -25.372879028320312, "global_step": 293364, "epoch": 3534} {"train_loss": -25.827789306640625, "global_step": 293365, "epoch": 3534} {"train_loss": -25.86737060546875, "global_step": 293366, "epoch": 3534} {"train_loss": -25.952783584594727, "global_step": 293367, "epoch": 3534} {"train_loss": -25.837743759155273, "global_step": 293368, "epoch": 3534} {"train_loss": -25.534948348999023, "global_step": 293369, "epoch": 3534} {"train_loss": -25.8709716796875, "global_step": 293370, "epoch": 3534} {"train_loss": -25.4274845123291, "global_step": 293371, "epoch": 3534} {"train_loss": -25.604516983032227, "global_step": 293372, "epoch": 3534} {"train_loss": -25.656309127807617, "global_step": 293373, "epoch": 3534} {"train_loss": -25.7910099029541, "global_step": 293374, "epoch": 3534} {"train_loss": -25.98801040649414, "global_step": 293375, "epoch": 3534} {"train_loss": -25.84296989440918, "global_step": 293376, "epoch": 3534} {"train_loss": -25.651813507080078, "global_step": 293377, "epoch": 3534} {"train_loss": -25.70400047302246, "global_step": 293378, "epoch": 3534} {"train_loss": -25.57195472717285, "global_step": 293379, "epoch": 3534} {"train_loss": -25.721149444580078, "global_step": 293380, "epoch": 3534} {"train_loss": -25.634923934936523, "global_step": 293381, "epoch": 3534} {"train_loss": -25.366559982299805, "global_step": 293382, "epoch": 3534} {"train_loss": -25.03329086303711, "global_step": 293383, "epoch": 3534} {"train_loss": -25.870473861694336, "global_step": 293384, "epoch": 3534} {"train_loss": -25.599796295166016, "global_step": 293385, "epoch": 3534} {"train_loss": -25.1345272064209, "global_step": 293386, "epoch": 3534} {"train_loss": -25.548566818237305, "global_step": 293387, "epoch": 3534} {"train_loss": -25.51076889038086, "global_step": 293388, "epoch": 3534} {"train_loss": -25.21183967590332, "global_step": 293389, "epoch": 3534} {"train_loss": -25.66082763671875, "global_step": 293390, "epoch": 3534} {"train_loss": -25.28313636779785, "global_step": 293391, "epoch": 3534} {"train_loss": -25.194395065307617, "global_step": 293392, "epoch": 3534} {"train_loss": -25.067363739013672, "global_step": 293393, "epoch": 3534} {"train_loss": -24.69017219543457, "global_step": 293394, "epoch": 3534} {"train_loss": -25.251142501831055, "global_step": 293395, "epoch": 3534} {"train_loss": -25.395261764526367, "global_step": 293396, "epoch": 3534} {"train_loss": -24.899028778076172, "global_step": 293397, "epoch": 3534} {"train_loss": -25.06972312927246, "global_step": 293398, "epoch": 3534} {"train_loss": -25.4271183013916, "global_step": 293399, "epoch": 3534} {"train_loss": -25.23282241821289, "global_step": 293400, "epoch": 3534} {"train_loss": -25.187849044799805, "global_step": 293401, "epoch": 3534} {"train_loss": -25.282817840576172, "global_step": 293402, "epoch": 3534} {"train_loss": -25.128509521484375, "global_step": 293403, "epoch": 3534} {"train_loss": -25.46421912779291, "global_step": 293404, "epoch": 3534, "val_loss": 7167110.0} {"train_loss": -24.63947105407715, "global_step": 293405, "epoch": 3535} {"train_loss": -25.222631454467773, "global_step": 293406, "epoch": 3535} {"train_loss": -24.39919090270996, "global_step": 293407, "epoch": 3535} {"train_loss": -25.22456169128418, "global_step": 293408, "epoch": 3535} {"train_loss": -24.38724708557129, "global_step": 293409, "epoch": 3535} {"train_loss": -24.957487106323242, "global_step": 293410, "epoch": 3535} {"train_loss": -24.42432403564453, "global_step": 293411, "epoch": 3535} {"train_loss": -24.88433265686035, "global_step": 293412, "epoch": 3535} {"train_loss": -24.498502731323242, "global_step": 293413, "epoch": 3535} {"train_loss": -24.449365615844727, "global_step": 293414, "epoch": 3535} {"train_loss": -24.848892211914062, "global_step": 293415, "epoch": 3535} {"train_loss": -24.64292335510254, "global_step": 293416, "epoch": 3535} {"train_loss": -24.833356857299805, "global_step": 293417, "epoch": 3535} {"train_loss": -24.89546775817871, "global_step": 293418, "epoch": 3535} {"train_loss": -24.784507751464844, "global_step": 293419, "epoch": 3535} {"train_loss": -25.020145416259766, "global_step": 293420, "epoch": 3535} {"train_loss": -25.27992057800293, "global_step": 293421, "epoch": 3535} {"train_loss": -25.02314567565918, "global_step": 293422, "epoch": 3535} {"train_loss": -25.06385040283203, "global_step": 293423, "epoch": 3535} {"train_loss": -25.250349044799805, "global_step": 293424, "epoch": 3535} {"train_loss": -25.041269302368164, "global_step": 293425, "epoch": 3535} {"train_loss": -25.235549926757812, "global_step": 293426, "epoch": 3535} {"train_loss": -25.207117080688477, "global_step": 293427, "epoch": 3535} {"train_loss": -25.316877365112305, "global_step": 293428, "epoch": 3535} {"train_loss": -25.280231475830078, "global_step": 293429, "epoch": 3535} {"train_loss": -24.921377182006836, "global_step": 293430, "epoch": 3535} {"train_loss": -25.607080459594727, "global_step": 293431, "epoch": 3535} {"train_loss": -25.18059730529785, "global_step": 293432, "epoch": 3535} {"train_loss": -25.66567039489746, "global_step": 293433, "epoch": 3535} {"train_loss": -25.273386001586914, "global_step": 293434, "epoch": 3535} {"train_loss": -25.47331428527832, "global_step": 293435, "epoch": 3535} {"train_loss": -25.19173240661621, "global_step": 293436, "epoch": 3535} {"train_loss": -25.269039154052734, "global_step": 293437, "epoch": 3535} {"train_loss": -25.177631378173828, "global_step": 293438, "epoch": 3535} {"train_loss": -25.59499168395996, "global_step": 293439, "epoch": 3535} {"train_loss": -25.28035545349121, "global_step": 293440, "epoch": 3535} {"train_loss": -25.577123641967773, "global_step": 293441, "epoch": 3535} {"train_loss": -25.54922103881836, "global_step": 293442, "epoch": 3535} {"train_loss": -25.59291648864746, "global_step": 293443, "epoch": 3535} {"train_loss": -25.799238204956055, "global_step": 293444, "epoch": 3535} {"train_loss": -25.38956642150879, "global_step": 293445, "epoch": 3535} {"train_loss": -25.37050437927246, "global_step": 293446, "epoch": 3535} {"train_loss": -25.515121459960938, "global_step": 293447, "epoch": 3535} {"train_loss": -25.770217895507812, "global_step": 293448, "epoch": 3535} {"train_loss": -25.72564697265625, "global_step": 293449, "epoch": 3535} {"train_loss": -25.561330795288086, "global_step": 293450, "epoch": 3535} {"train_loss": -25.80291748046875, "global_step": 293451, "epoch": 3535} {"train_loss": -25.896432876586914, "global_step": 293452, "epoch": 3535} {"train_loss": -25.7961483001709, "global_step": 293453, "epoch": 3535} {"train_loss": -25.614049911499023, "global_step": 293454, "epoch": 3535} {"train_loss": -25.931787490844727, "global_step": 293455, "epoch": 3535} {"train_loss": -25.903675079345703, "global_step": 293456, "epoch": 3535} {"train_loss": -25.529132843017578, "global_step": 293457, "epoch": 3535} {"train_loss": -25.488739013671875, "global_step": 293458, "epoch": 3535} {"train_loss": -25.71973991394043, "global_step": 293459, "epoch": 3535} {"train_loss": -25.482595443725586, "global_step": 293460, "epoch": 3535} {"train_loss": -25.8719425201416, "global_step": 293461, "epoch": 3535} {"train_loss": -26.261335372924805, "global_step": 293462, "epoch": 3535} {"train_loss": -25.90329933166504, "global_step": 293463, "epoch": 3535} {"train_loss": -25.752685546875, "global_step": 293464, "epoch": 3535} {"train_loss": -25.614948272705078, "global_step": 293465, "epoch": 3535} {"train_loss": -25.766666412353516, "global_step": 293466, "epoch": 3535} {"train_loss": -25.7866153717041, "global_step": 293467, "epoch": 3535} {"train_loss": -25.646320343017578, "global_step": 293468, "epoch": 3535} {"train_loss": -25.774534225463867, "global_step": 293469, "epoch": 3535} {"train_loss": -25.94972038269043, "global_step": 293470, "epoch": 3535} {"train_loss": -25.079811096191406, "global_step": 293471, "epoch": 3535} {"train_loss": -25.452301025390625, "global_step": 293472, "epoch": 3535} {"train_loss": -25.60699462890625, "global_step": 293473, "epoch": 3535} {"train_loss": -25.316238403320312, "global_step": 293474, "epoch": 3535} {"train_loss": -25.773162841796875, "global_step": 293475, "epoch": 3535} {"train_loss": -25.8452205657959, "global_step": 293476, "epoch": 3535} {"train_loss": -25.64314842224121, "global_step": 293477, "epoch": 3535} {"train_loss": -26.00385093688965, "global_step": 293478, "epoch": 3535} {"train_loss": -25.246320724487305, "global_step": 293479, "epoch": 3535} {"train_loss": -25.541006088256836, "global_step": 293480, "epoch": 3535} {"train_loss": -25.486143112182617, "global_step": 293481, "epoch": 3535} {"train_loss": -25.592382431030273, "global_step": 293482, "epoch": 3535} {"train_loss": -26.0925235748291, "global_step": 293483, "epoch": 3535} {"train_loss": -25.925565719604492, "global_step": 293484, "epoch": 3535} {"train_loss": -25.784351348876953, "global_step": 293485, "epoch": 3535} {"train_loss": -25.646411895751953, "global_step": 293486, "epoch": 3535} {"train_loss": -25.403067324534955, "global_step": 293487, "epoch": 3535, "val_loss": 7140400.0} {"train_loss": -24.89821434020996, "global_step": 293488, "epoch": 3536} {"train_loss": -24.02736473083496, "global_step": 293489, "epoch": 3536} {"train_loss": -24.38730239868164, "global_step": 293490, "epoch": 3536} {"train_loss": -24.440031051635742, "global_step": 293491, "epoch": 3536} {"train_loss": -24.936620712280273, "global_step": 293492, "epoch": 3536} {"train_loss": -25.11458396911621, "global_step": 293493, "epoch": 3536} {"train_loss": -25.166202545166016, "global_step": 293494, "epoch": 3536} {"train_loss": -24.844646453857422, "global_step": 293495, "epoch": 3536} {"train_loss": -25.038450241088867, "global_step": 293496, "epoch": 3536} {"train_loss": -25.228713989257812, "global_step": 293497, "epoch": 3536} {"train_loss": -24.88365936279297, "global_step": 293498, "epoch": 3536} {"train_loss": -25.086503982543945, "global_step": 293499, "epoch": 3536} {"train_loss": -25.632436752319336, "global_step": 293500, "epoch": 3536} {"train_loss": -25.339977264404297, "global_step": 293501, "epoch": 3536} {"train_loss": -25.44243812561035, "global_step": 293502, "epoch": 3536} {"train_loss": -25.387128829956055, "global_step": 293503, "epoch": 3536} {"train_loss": -25.559051513671875, "global_step": 293504, "epoch": 3536} {"train_loss": -25.1048526763916, "global_step": 293505, "epoch": 3536} {"train_loss": -25.29302978515625, "global_step": 293506, "epoch": 3536} {"train_loss": -25.510726928710938, "global_step": 293507, "epoch": 3536} {"train_loss": -25.435150146484375, "global_step": 293508, "epoch": 3536} {"train_loss": -25.661609649658203, "global_step": 293509, "epoch": 3536} {"train_loss": -25.473630905151367, "global_step": 293510, "epoch": 3536} {"train_loss": -25.514081954956055, "global_step": 293511, "epoch": 3536} {"train_loss": -25.40365982055664, "global_step": 293512, "epoch": 3536} {"train_loss": -25.449888229370117, "global_step": 293513, "epoch": 3536} {"train_loss": -25.403257369995117, "global_step": 293514, "epoch": 3536} {"train_loss": -25.612934112548828, "global_step": 293515, "epoch": 3536} {"train_loss": -25.446548461914062, "global_step": 293516, "epoch": 3536} {"train_loss": -25.578914642333984, "global_step": 293517, "epoch": 3536} {"train_loss": -25.779699325561523, "global_step": 293518, "epoch": 3536} {"train_loss": -25.707712173461914, "global_step": 293519, "epoch": 3536} {"train_loss": -25.709259033203125, "global_step": 293520, "epoch": 3536} {"train_loss": -25.783918380737305, "global_step": 293521, "epoch": 3536} {"train_loss": -25.528465270996094, "global_step": 293522, "epoch": 3536} {"train_loss": -25.66437339782715, "global_step": 293523, "epoch": 3536} {"train_loss": -25.71630859375, "global_step": 293524, "epoch": 3536} {"train_loss": -25.660343170166016, "global_step": 293525, "epoch": 3536} {"train_loss": -25.750085830688477, "global_step": 293526, "epoch": 3536} {"train_loss": -25.72210693359375, "global_step": 293527, "epoch": 3536} {"train_loss": -25.405406951904297, "global_step": 293528, "epoch": 3536} {"train_loss": -25.412628173828125, "global_step": 293529, "epoch": 3536} {"train_loss": -25.610021591186523, "global_step": 293530, "epoch": 3536} {"train_loss": -25.414575576782227, "global_step": 293531, "epoch": 3536} {"train_loss": -25.664432525634766, "global_step": 293532, "epoch": 3536} {"train_loss": -25.561935424804688, "global_step": 293533, "epoch": 3536} {"train_loss": -25.639612197875977, "global_step": 293534, "epoch": 3536} {"train_loss": -25.43716812133789, "global_step": 293535, "epoch": 3536} {"train_loss": -25.597341537475586, "global_step": 293536, "epoch": 3536} {"train_loss": -25.75954246520996, "global_step": 293537, "epoch": 3536} {"train_loss": -25.99616050720215, "global_step": 293538, "epoch": 3536} {"train_loss": -26.080556869506836, "global_step": 293539, "epoch": 3536} {"train_loss": -25.854963302612305, "global_step": 293540, "epoch": 3536} {"train_loss": -25.50579261779785, "global_step": 293541, "epoch": 3536} {"train_loss": -25.696762084960938, "global_step": 293542, "epoch": 3536} {"train_loss": -25.268606185913086, "global_step": 293543, "epoch": 3536} {"train_loss": -25.685535430908203, "global_step": 293544, "epoch": 3536} {"train_loss": -25.63441276550293, "global_step": 293545, "epoch": 3536} {"train_loss": -26.075498580932617, "global_step": 293546, "epoch": 3536} {"train_loss": -25.873334884643555, "global_step": 293547, "epoch": 3536} {"train_loss": -25.721471786499023, "global_step": 293548, "epoch": 3536} {"train_loss": -25.516977310180664, "global_step": 293549, "epoch": 3536} {"train_loss": -25.772979736328125, "global_step": 293550, "epoch": 3536} {"train_loss": -25.449880599975586, "global_step": 293551, "epoch": 3536} {"train_loss": -25.989429473876953, "global_step": 293552, "epoch": 3536} {"train_loss": -25.517486572265625, "global_step": 293553, "epoch": 3536} {"train_loss": -25.537429809570312, "global_step": 293554, "epoch": 3536} {"train_loss": -25.619489669799805, "global_step": 293555, "epoch": 3536} {"train_loss": -25.510456085205078, "global_step": 293556, "epoch": 3536} {"train_loss": -25.41654396057129, "global_step": 293557, "epoch": 3536} {"train_loss": -25.685535430908203, "global_step": 293558, "epoch": 3536} {"train_loss": -26.030838012695312, "global_step": 293559, "epoch": 3536} {"train_loss": -25.332937240600586, "global_step": 293560, "epoch": 3536} {"train_loss": -25.571876525878906, "global_step": 293561, "epoch": 3536} {"train_loss": -25.575979232788086, "global_step": 293562, "epoch": 3536} {"train_loss": -25.507028579711914, "global_step": 293563, "epoch": 3536} {"train_loss": -25.556156158447266, "global_step": 293564, "epoch": 3536} {"train_loss": -25.379053115844727, "global_step": 293565, "epoch": 3536} {"train_loss": -25.645910263061523, "global_step": 293566, "epoch": 3536} {"train_loss": -25.651458740234375, "global_step": 293567, "epoch": 3536} {"train_loss": -25.41523551940918, "global_step": 293568, "epoch": 3536} {"train_loss": -25.159732818603516, "global_step": 293569, "epoch": 3536} {"train_loss": -25.483548221817937, "global_step": 293570, "epoch": 3536, "val_loss": 7173732.0} {"train_loss": -25.154539108276367, "global_step": 293571, "epoch": 3537} {"train_loss": -25.398082733154297, "global_step": 293572, "epoch": 3537} {"train_loss": -25.315736770629883, "global_step": 293573, "epoch": 3537} {"train_loss": -25.305818557739258, "global_step": 293574, "epoch": 3537} {"train_loss": -25.248308181762695, "global_step": 293575, "epoch": 3537} {"train_loss": -25.27345848083496, "global_step": 293576, "epoch": 3537} {"train_loss": -25.602630615234375, "global_step": 293577, "epoch": 3537} {"train_loss": -25.410465240478516, "global_step": 293578, "epoch": 3537} {"train_loss": -25.660974502563477, "global_step": 293579, "epoch": 3537} {"train_loss": -25.230422973632812, "global_step": 293580, "epoch": 3537} {"train_loss": -25.231842041015625, "global_step": 293581, "epoch": 3537} {"train_loss": -25.486652374267578, "global_step": 293582, "epoch": 3537} {"train_loss": -25.435144424438477, "global_step": 293583, "epoch": 3537} {"train_loss": -25.334491729736328, "global_step": 293584, "epoch": 3537} {"train_loss": -25.53181266784668, "global_step": 293585, "epoch": 3537} {"train_loss": -25.383052825927734, "global_step": 293586, "epoch": 3537} {"train_loss": -25.581369400024414, "global_step": 293587, "epoch": 3537} {"train_loss": -25.424060821533203, "global_step": 293588, "epoch": 3537} {"train_loss": -25.668899536132812, "global_step": 293589, "epoch": 3537} {"train_loss": -25.432077407836914, "global_step": 293590, "epoch": 3537} {"train_loss": -25.63385009765625, "global_step": 293591, "epoch": 3537} {"train_loss": -25.293119430541992, "global_step": 293592, "epoch": 3537} {"train_loss": -25.62489128112793, "global_step": 293593, "epoch": 3537} {"train_loss": -25.58931541442871, "global_step": 293594, "epoch": 3537} {"train_loss": -25.648223876953125, "global_step": 293595, "epoch": 3537} {"train_loss": -25.671964645385742, "global_step": 293596, "epoch": 3537} {"train_loss": -25.746967315673828, "global_step": 293597, "epoch": 3537} {"train_loss": -25.63172721862793, "global_step": 293598, "epoch": 3537} {"train_loss": -25.82217788696289, "global_step": 293599, "epoch": 3537} {"train_loss": -25.66193962097168, "global_step": 293600, "epoch": 3537} {"train_loss": -25.782888412475586, "global_step": 293601, "epoch": 3537} {"train_loss": -25.566198348999023, "global_step": 293602, "epoch": 3537} {"train_loss": -25.49447250366211, "global_step": 293603, "epoch": 3537} {"train_loss": -25.925613403320312, "global_step": 293604, "epoch": 3537} {"train_loss": -25.4965877532959, "global_step": 293605, "epoch": 3537} {"train_loss": -25.58622169494629, "global_step": 293606, "epoch": 3537} {"train_loss": -26.064868927001953, "global_step": 293607, "epoch": 3537} {"train_loss": -25.386343002319336, "global_step": 293608, "epoch": 3537} {"train_loss": -25.52581787109375, "global_step": 293609, "epoch": 3537} {"train_loss": -25.503969192504883, "global_step": 293610, "epoch": 3537} {"train_loss": -25.848901748657227, "global_step": 293611, "epoch": 3537} {"train_loss": -25.7415771484375, "global_step": 293612, "epoch": 3537} {"train_loss": -25.845300674438477, "global_step": 293613, "epoch": 3537} {"train_loss": -25.608783721923828, "global_step": 293614, "epoch": 3537} {"train_loss": -25.548933029174805, "global_step": 293615, "epoch": 3537} {"train_loss": -25.806079864501953, "global_step": 293616, "epoch": 3537} {"train_loss": -26.047149658203125, "global_step": 293617, "epoch": 3537} {"train_loss": -25.69353675842285, "global_step": 293618, "epoch": 3537} {"train_loss": -25.5207462310791, "global_step": 293619, "epoch": 3537} {"train_loss": -25.900320053100586, "global_step": 293620, "epoch": 3537} {"train_loss": -25.754592895507812, "global_step": 293621, "epoch": 3537} {"train_loss": -25.5175724029541, "global_step": 293622, "epoch": 3537} {"train_loss": -25.261133193969727, "global_step": 293623, "epoch": 3537} {"train_loss": -25.5836238861084, "global_step": 293624, "epoch": 3537} {"train_loss": -25.165283203125, "global_step": 293625, "epoch": 3537} {"train_loss": -26.307275772094727, "global_step": 293626, "epoch": 3537} {"train_loss": -25.228254318237305, "global_step": 293627, "epoch": 3537} {"train_loss": -25.734989166259766, "global_step": 293628, "epoch": 3537} {"train_loss": -25.201330184936523, "global_step": 293629, "epoch": 3537} {"train_loss": -25.650299072265625, "global_step": 293630, "epoch": 3537} {"train_loss": -25.661502838134766, "global_step": 293631, "epoch": 3537} {"train_loss": -25.73004722595215, "global_step": 293632, "epoch": 3537} {"train_loss": -25.631834030151367, "global_step": 293633, "epoch": 3537} {"train_loss": -25.53917694091797, "global_step": 293634, "epoch": 3537} {"train_loss": -25.33388900756836, "global_step": 293635, "epoch": 3537} {"train_loss": -26.07198143005371, "global_step": 293636, "epoch": 3537} {"train_loss": -25.24834442138672, "global_step": 293637, "epoch": 3537} {"train_loss": -25.713415145874023, "global_step": 293638, "epoch": 3537} {"train_loss": -25.968494415283203, "global_step": 293639, "epoch": 3537} {"train_loss": -25.660938262939453, "global_step": 293640, "epoch": 3537} {"train_loss": -24.90534782409668, "global_step": 293641, "epoch": 3537} {"train_loss": -25.32057762145996, "global_step": 293642, "epoch": 3537} {"train_loss": -25.76310157775879, "global_step": 293643, "epoch": 3537} {"train_loss": -25.228759765625, "global_step": 293644, "epoch": 3537} {"train_loss": -25.299184799194336, "global_step": 293645, "epoch": 3537} {"train_loss": -25.46805191040039, "global_step": 293646, "epoch": 3537} {"train_loss": -25.507598876953125, "global_step": 293647, "epoch": 3537} {"train_loss": -25.895559310913086, "global_step": 293648, "epoch": 3537} {"train_loss": -25.4276180267334, "global_step": 293649, "epoch": 3537} {"train_loss": -25.569828033447266, "global_step": 293650, "epoch": 3537} {"train_loss": -25.246854782104492, "global_step": 293651, "epoch": 3537} {"train_loss": -25.4005126953125, "global_step": 293652, "epoch": 3537} {"train_loss": -25.540968125125012, "global_step": 293653, "epoch": 3537, "val_loss": 7119946.0} {"train_loss": -25.04254150390625, "global_step": 293654, "epoch": 3538} {"train_loss": -25.348251342773438, "global_step": 293655, "epoch": 3538} {"train_loss": -25.6287784576416, "global_step": 293656, "epoch": 3538} {"train_loss": -25.27650260925293, "global_step": 293657, "epoch": 3538} {"train_loss": -25.278654098510742, "global_step": 293658, "epoch": 3538} {"train_loss": -25.22818946838379, "global_step": 293659, "epoch": 3538} {"train_loss": -25.738317489624023, "global_step": 293660, "epoch": 3538} {"train_loss": -25.41788101196289, "global_step": 293661, "epoch": 3538} {"train_loss": -25.200206756591797, "global_step": 293662, "epoch": 3538} {"train_loss": -25.211790084838867, "global_step": 293663, "epoch": 3538} {"train_loss": -25.30714225769043, "global_step": 293664, "epoch": 3538} {"train_loss": -25.525583267211914, "global_step": 293665, "epoch": 3538} {"train_loss": -25.844470977783203, "global_step": 293666, "epoch": 3538} {"train_loss": -25.484418869018555, "global_step": 293667, "epoch": 3538} {"train_loss": -25.35430145263672, "global_step": 293668, "epoch": 3538} {"train_loss": -25.488672256469727, "global_step": 293669, "epoch": 3538} {"train_loss": -25.403188705444336, "global_step": 293670, "epoch": 3538} {"train_loss": -25.500253677368164, "global_step": 293671, "epoch": 3538} {"train_loss": -25.321706771850586, "global_step": 293672, "epoch": 3538} {"train_loss": -25.593435287475586, "global_step": 293673, "epoch": 3538} {"train_loss": -25.785572052001953, "global_step": 293674, "epoch": 3538} {"train_loss": -25.551870346069336, "global_step": 293675, "epoch": 3538} {"train_loss": -25.11104393005371, "global_step": 293676, "epoch": 3538} {"train_loss": -25.630783081054688, "global_step": 293677, "epoch": 3538} {"train_loss": -25.686487197875977, "global_step": 293678, "epoch": 3538} {"train_loss": -25.688405990600586, "global_step": 293679, "epoch": 3538} {"train_loss": -25.26557159423828, "global_step": 293680, "epoch": 3538} {"train_loss": -25.707611083984375, "global_step": 293681, "epoch": 3538} {"train_loss": -25.9815731048584, "global_step": 293682, "epoch": 3538} {"train_loss": -25.71587562561035, "global_step": 293683, "epoch": 3538} {"train_loss": -25.712249755859375, "global_step": 293684, "epoch": 3538} {"train_loss": -25.692808151245117, "global_step": 293685, "epoch": 3538} {"train_loss": -25.687997817993164, "global_step": 293686, "epoch": 3538} {"train_loss": -25.718595504760742, "global_step": 293687, "epoch": 3538} {"train_loss": -25.62076759338379, "global_step": 293688, "epoch": 3538} {"train_loss": -25.7351131439209, "global_step": 293689, "epoch": 3538} {"train_loss": -25.572904586791992, "global_step": 293690, "epoch": 3538} {"train_loss": -25.629179000854492, "global_step": 293691, "epoch": 3538} {"train_loss": -25.34065818786621, "global_step": 293692, "epoch": 3538} {"train_loss": -25.226572036743164, "global_step": 293693, "epoch": 3538} {"train_loss": -25.39219856262207, "global_step": 293694, "epoch": 3538} {"train_loss": -25.592252731323242, "global_step": 293695, "epoch": 3538} {"train_loss": -25.533231735229492, "global_step": 293696, "epoch": 3538} {"train_loss": -24.976491928100586, "global_step": 293697, "epoch": 3538} {"train_loss": -25.758420944213867, "global_step": 293698, "epoch": 3538} {"train_loss": -25.68177604675293, "global_step": 293699, "epoch": 3538} {"train_loss": -25.618223190307617, "global_step": 293700, "epoch": 3538} {"train_loss": -25.579240798950195, "global_step": 293701, "epoch": 3538} {"train_loss": -25.112958908081055, "global_step": 293702, "epoch": 3538} {"train_loss": -25.505268096923828, "global_step": 293703, "epoch": 3538} {"train_loss": -25.633142471313477, "global_step": 293704, "epoch": 3538} {"train_loss": -25.75455093383789, "global_step": 293705, "epoch": 3538} {"train_loss": -25.440471649169922, "global_step": 293706, "epoch": 3538} {"train_loss": -25.471603393554688, "global_step": 293707, "epoch": 3538} {"train_loss": -25.43630027770996, "global_step": 293708, "epoch": 3538} {"train_loss": -25.500202178955078, "global_step": 293709, "epoch": 3538} {"train_loss": -25.643508911132812, "global_step": 293710, "epoch": 3538} {"train_loss": -25.36753273010254, "global_step": 293711, "epoch": 3538} {"train_loss": -25.71436882019043, "global_step": 293712, "epoch": 3538} {"train_loss": -25.766469955444336, "global_step": 293713, "epoch": 3538} {"train_loss": -25.43597984313965, "global_step": 293714, "epoch": 3538} {"train_loss": -25.61488914489746, "global_step": 293715, "epoch": 3538} {"train_loss": -25.60565757751465, "global_step": 293716, "epoch": 3538} {"train_loss": -25.78592872619629, "global_step": 293717, "epoch": 3538} {"train_loss": -24.76131248474121, "global_step": 293718, "epoch": 3538} {"train_loss": -25.16196060180664, "global_step": 293719, "epoch": 3538} {"train_loss": -25.304922103881836, "global_step": 293720, "epoch": 3538} {"train_loss": -25.31904411315918, "global_step": 293721, "epoch": 3538} {"train_loss": -25.717803955078125, "global_step": 293722, "epoch": 3538} {"train_loss": -25.64914894104004, "global_step": 293723, "epoch": 3538} {"train_loss": -25.515920639038086, "global_step": 293724, "epoch": 3538} {"train_loss": -25.407129287719727, "global_step": 293725, "epoch": 3538} {"train_loss": -25.589677810668945, "global_step": 293726, "epoch": 3538} {"train_loss": -25.423086166381836, "global_step": 293727, "epoch": 3538} {"train_loss": -25.655323028564453, "global_step": 293728, "epoch": 3538} {"train_loss": -25.267902374267578, "global_step": 293729, "epoch": 3538} {"train_loss": -25.175657272338867, "global_step": 293730, "epoch": 3538} {"train_loss": -25.315717697143555, "global_step": 293731, "epoch": 3538} {"train_loss": -25.60744285583496, "global_step": 293732, "epoch": 3538} {"train_loss": -25.353866577148438, "global_step": 293733, "epoch": 3538} {"train_loss": -25.408353805541992, "global_step": 293734, "epoch": 3538} {"train_loss": -25.55319595336914, "global_step": 293735, "epoch": 3538} {"train_loss": -25.497807468276427, "global_step": 293736, "epoch": 3538, "val_loss": 7208765.0} {"train_loss": -25.356229782104492, "global_step": 293737, "epoch": 3539} {"train_loss": -25.459415435791016, "global_step": 293738, "epoch": 3539} {"train_loss": -25.26943588256836, "global_step": 293739, "epoch": 3539} {"train_loss": -25.518415451049805, "global_step": 293740, "epoch": 3539} {"train_loss": -25.203977584838867, "global_step": 293741, "epoch": 3539} {"train_loss": -25.306365966796875, "global_step": 293742, "epoch": 3539} {"train_loss": -25.22601318359375, "global_step": 293743, "epoch": 3539} {"train_loss": -25.45108413696289, "global_step": 293744, "epoch": 3539} {"train_loss": -25.193429946899414, "global_step": 293745, "epoch": 3539} {"train_loss": -25.337459564208984, "global_step": 293746, "epoch": 3539} {"train_loss": -25.14424705505371, "global_step": 293747, "epoch": 3539} {"train_loss": -25.95673942565918, "global_step": 293748, "epoch": 3539} {"train_loss": -25.459932327270508, "global_step": 293749, "epoch": 3539} {"train_loss": -25.305044174194336, "global_step": 293750, "epoch": 3539} {"train_loss": -25.307851791381836, "global_step": 293751, "epoch": 3539} {"train_loss": -25.577964782714844, "global_step": 293752, "epoch": 3539} {"train_loss": -25.422101974487305, "global_step": 293753, "epoch": 3539} {"train_loss": -25.8062686920166, "global_step": 293754, "epoch": 3539} {"train_loss": -25.60165786743164, "global_step": 293755, "epoch": 3539} {"train_loss": -25.668867111206055, "global_step": 293756, "epoch": 3539} {"train_loss": -25.580982208251953, "global_step": 293757, "epoch": 3539} {"train_loss": -25.36895751953125, "global_step": 293758, "epoch": 3539} {"train_loss": -25.487783432006836, "global_step": 293759, "epoch": 3539} {"train_loss": -25.856603622436523, "global_step": 293760, "epoch": 3539} {"train_loss": -25.9688663482666, "global_step": 293761, "epoch": 3539} {"train_loss": -25.487398147583008, "global_step": 293762, "epoch": 3539} {"train_loss": -25.667133331298828, "global_step": 293763, "epoch": 3539} {"train_loss": -25.405412673950195, "global_step": 293764, "epoch": 3539} {"train_loss": -25.536531448364258, "global_step": 293765, "epoch": 3539} {"train_loss": -25.972089767456055, "global_step": 293766, "epoch": 3539} {"train_loss": -25.748815536499023, "global_step": 293767, "epoch": 3539} {"train_loss": -25.571945190429688, "global_step": 293768, "epoch": 3539} {"train_loss": -25.72735595703125, "global_step": 293769, "epoch": 3539} {"train_loss": -25.927093505859375, "global_step": 293770, "epoch": 3539} {"train_loss": -25.535337448120117, "global_step": 293771, "epoch": 3539} {"train_loss": -25.624902725219727, "global_step": 293772, "epoch": 3539} {"train_loss": -25.62442398071289, "global_step": 293773, "epoch": 3539} {"train_loss": -25.41888999938965, "global_step": 293774, "epoch": 3539} {"train_loss": -25.292362213134766, "global_step": 293775, "epoch": 3539} {"train_loss": -25.600696563720703, "global_step": 293776, "epoch": 3539} {"train_loss": -25.811559677124023, "global_step": 293777, "epoch": 3539} {"train_loss": -25.73463249206543, "global_step": 293778, "epoch": 3539} {"train_loss": -25.608814239501953, "global_step": 293779, "epoch": 3539} {"train_loss": -25.526193618774414, "global_step": 293780, "epoch": 3539} {"train_loss": -25.719470977783203, "global_step": 293781, "epoch": 3539} {"train_loss": -25.462154388427734, "global_step": 293782, "epoch": 3539} {"train_loss": -25.717105865478516, "global_step": 293783, "epoch": 3539} {"train_loss": -25.58686065673828, "global_step": 293784, "epoch": 3539} {"train_loss": -25.614154815673828, "global_step": 293785, "epoch": 3539} {"train_loss": -25.965290069580078, "global_step": 293786, "epoch": 3539} {"train_loss": -25.941394805908203, "global_step": 293787, "epoch": 3539} {"train_loss": -25.26466178894043, "global_step": 293788, "epoch": 3539} {"train_loss": -25.63803482055664, "global_step": 293789, "epoch": 3539} {"train_loss": -25.462453842163086, "global_step": 293790, "epoch": 3539} {"train_loss": -25.815481185913086, "global_step": 293791, "epoch": 3539} {"train_loss": -25.754545211791992, "global_step": 293792, "epoch": 3539} {"train_loss": -25.612756729125977, "global_step": 293793, "epoch": 3539} {"train_loss": -26.0553035736084, "global_step": 293794, "epoch": 3539} {"train_loss": -25.595245361328125, "global_step": 293795, "epoch": 3539} {"train_loss": -25.395889282226562, "global_step": 293796, "epoch": 3539} {"train_loss": -26.006702423095703, "global_step": 293797, "epoch": 3539} {"train_loss": -24.895902633666992, "global_step": 293798, "epoch": 3539} {"train_loss": -25.21774673461914, "global_step": 293799, "epoch": 3539} {"train_loss": -25.556272506713867, "global_step": 293800, "epoch": 3539} {"train_loss": -25.575124740600586, "global_step": 293801, "epoch": 3539} {"train_loss": -25.410144805908203, "global_step": 293802, "epoch": 3539} {"train_loss": -25.793212890625, "global_step": 293803, "epoch": 3539} {"train_loss": -25.716455459594727, "global_step": 293804, "epoch": 3539} {"train_loss": -25.739093780517578, "global_step": 293805, "epoch": 3539} {"train_loss": -25.33160972595215, "global_step": 293806, "epoch": 3539} {"train_loss": -25.74250602722168, "global_step": 293807, "epoch": 3539} {"train_loss": -25.537147521972656, "global_step": 293808, "epoch": 3539} {"train_loss": -25.634313583374023, "global_step": 293809, "epoch": 3539} {"train_loss": -25.603452682495117, "global_step": 293810, "epoch": 3539} {"train_loss": -25.7639217376709, "global_step": 293811, "epoch": 3539} {"train_loss": -25.76694679260254, "global_step": 293812, "epoch": 3539} {"train_loss": -25.850208282470703, "global_step": 293813, "epoch": 3539} {"train_loss": -25.536849975585938, "global_step": 293814, "epoch": 3539} {"train_loss": -25.510757446289062, "global_step": 293815, "epoch": 3539} {"train_loss": -25.399612426757812, "global_step": 293816, "epoch": 3539} {"train_loss": -25.340307235717773, "global_step": 293817, "epoch": 3539} {"train_loss": -25.66489028930664, "global_step": 293818, "epoch": 3539} {"train_loss": -25.58069449734975, "global_step": 293819, "epoch": 3539, "val_loss": 7182967.5} {"train_loss": -25.2841796875, "global_step": 293820, "epoch": 3540} {"train_loss": -25.354936599731445, "global_step": 293821, "epoch": 3540} {"train_loss": -24.813732147216797, "global_step": 293822, "epoch": 3540} {"train_loss": -25.788415908813477, "global_step": 293823, "epoch": 3540} {"train_loss": -25.368099212646484, "global_step": 293824, "epoch": 3540} {"train_loss": -25.593957901000977, "global_step": 293825, "epoch": 3540} {"train_loss": -25.120025634765625, "global_step": 293826, "epoch": 3540} {"train_loss": -25.14828109741211, "global_step": 293827, "epoch": 3540} {"train_loss": -25.657398223876953, "global_step": 293828, "epoch": 3540} {"train_loss": -25.41489601135254, "global_step": 293829, "epoch": 3540} {"train_loss": -25.49062156677246, "global_step": 293830, "epoch": 3540} {"train_loss": -25.386234283447266, "global_step": 293831, "epoch": 3540} {"train_loss": -25.20191764831543, "global_step": 293832, "epoch": 3540} {"train_loss": -25.39112091064453, "global_step": 293833, "epoch": 3540} {"train_loss": -25.766651153564453, "global_step": 293834, "epoch": 3540} {"train_loss": -25.457807540893555, "global_step": 293835, "epoch": 3540} {"train_loss": -25.289188385009766, "global_step": 293836, "epoch": 3540} {"train_loss": -25.85712242126465, "global_step": 293837, "epoch": 3540} {"train_loss": -25.60578727722168, "global_step": 293838, "epoch": 3540} {"train_loss": -25.736486434936523, "global_step": 293839, "epoch": 3540} {"train_loss": -25.425769805908203, "global_step": 293840, "epoch": 3540} {"train_loss": -25.63850212097168, "global_step": 293841, "epoch": 3540} {"train_loss": -25.586620330810547, "global_step": 293842, "epoch": 3540} {"train_loss": -25.938465118408203, "global_step": 293843, "epoch": 3540} {"train_loss": -25.90472412109375, "global_step": 293844, "epoch": 3540} {"train_loss": -25.626708984375, "global_step": 293845, "epoch": 3540} {"train_loss": -25.967145919799805, "global_step": 293846, "epoch": 3540} {"train_loss": -25.771697998046875, "global_step": 293847, "epoch": 3540} {"train_loss": -25.672805786132812, "global_step": 293848, "epoch": 3540} {"train_loss": -25.729496002197266, "global_step": 293849, "epoch": 3540} {"train_loss": -25.488189697265625, "global_step": 293850, "epoch": 3540} {"train_loss": -25.77984619140625, "global_step": 293851, "epoch": 3540} {"train_loss": -25.56050682067871, "global_step": 293852, "epoch": 3540} {"train_loss": -25.465444564819336, "global_step": 293853, "epoch": 3540} {"train_loss": -25.56914710998535, "global_step": 293854, "epoch": 3540} {"train_loss": -25.828659057617188, "global_step": 293855, "epoch": 3540} {"train_loss": -25.3414249420166, "global_step": 293856, "epoch": 3540} {"train_loss": -25.557302474975586, "global_step": 293857, "epoch": 3540} {"train_loss": -25.612598419189453, "global_step": 293858, "epoch": 3540} {"train_loss": -25.261077880859375, "global_step": 293859, "epoch": 3540} {"train_loss": -25.545774459838867, "global_step": 293860, "epoch": 3540} {"train_loss": -25.463476181030273, "global_step": 293861, "epoch": 3540} {"train_loss": -25.517786026000977, "global_step": 293862, "epoch": 3540} {"train_loss": -25.52155876159668, "global_step": 293863, "epoch": 3540} {"train_loss": -25.500749588012695, "global_step": 293864, "epoch": 3540} {"train_loss": -25.386749267578125, "global_step": 293865, "epoch": 3540} {"train_loss": -25.40846061706543, "global_step": 293866, "epoch": 3540} {"train_loss": -25.53037452697754, "global_step": 293867, "epoch": 3540} {"train_loss": -25.8746337890625, "global_step": 293868, "epoch": 3540} {"train_loss": -25.129077911376953, "global_step": 293869, "epoch": 3540} {"train_loss": -25.22690773010254, "global_step": 293870, "epoch": 3540} {"train_loss": -25.155025482177734, "global_step": 293871, "epoch": 3540} {"train_loss": -25.207523345947266, "global_step": 293872, "epoch": 3540} {"train_loss": -25.30307388305664, "global_step": 293873, "epoch": 3540} {"train_loss": -25.331756591796875, "global_step": 293874, "epoch": 3540} {"train_loss": -25.004833221435547, "global_step": 293875, "epoch": 3540} {"train_loss": -25.655963897705078, "global_step": 293876, "epoch": 3540} {"train_loss": -25.577985763549805, "global_step": 293877, "epoch": 3540} {"train_loss": -25.731184005737305, "global_step": 293878, "epoch": 3540} {"train_loss": -25.28400230407715, "global_step": 293879, "epoch": 3540} {"train_loss": -25.720916748046875, "global_step": 293880, "epoch": 3540} {"train_loss": -25.38681983947754, "global_step": 293881, "epoch": 3540} {"train_loss": -25.098682403564453, "global_step": 293882, "epoch": 3540} {"train_loss": -25.50441551208496, "global_step": 293883, "epoch": 3540} {"train_loss": -25.817529678344727, "global_step": 293884, "epoch": 3540} {"train_loss": -25.25050163269043, "global_step": 293885, "epoch": 3540} {"train_loss": -25.63446044921875, "global_step": 293886, "epoch": 3540} {"train_loss": -25.380939483642578, "global_step": 293887, "epoch": 3540} {"train_loss": -25.263166427612305, "global_step": 293888, "epoch": 3540} {"train_loss": -25.667083740234375, "global_step": 293889, "epoch": 3540} {"train_loss": -25.357826232910156, "global_step": 293890, "epoch": 3540} {"train_loss": -25.553150177001953, "global_step": 293891, "epoch": 3540} {"train_loss": -25.34718132019043, "global_step": 293892, "epoch": 3540} {"train_loss": -25.708328247070312, "global_step": 293893, "epoch": 3540} {"train_loss": -25.83137321472168, "global_step": 293894, "epoch": 3540} {"train_loss": -25.552181243896484, "global_step": 293895, "epoch": 3540} {"train_loss": -25.625080108642578, "global_step": 293896, "epoch": 3540} {"train_loss": -25.499479293823242, "global_step": 293897, "epoch": 3540} {"train_loss": -25.468952178955078, "global_step": 293898, "epoch": 3540} {"train_loss": -25.53584098815918, "global_step": 293899, "epoch": 3540} {"train_loss": -25.566076278686523, "global_step": 293900, "epoch": 3540} {"train_loss": -25.414892196655273, "global_step": 293901, "epoch": 3540} {"train_loss": -25.49167205626706, "global_step": 293902, "epoch": 3540, "val_loss": 7074430.5} {"train_loss": -24.615224838256836, "global_step": 293903, "epoch": 3541} {"train_loss": -24.961139678955078, "global_step": 293904, "epoch": 3541} {"train_loss": -24.637353897094727, "global_step": 293905, "epoch": 3541} {"train_loss": -25.01069450378418, "global_step": 293906, "epoch": 3541} {"train_loss": -24.77063751220703, "global_step": 293907, "epoch": 3541} {"train_loss": -24.947559356689453, "global_step": 293908, "epoch": 3541} {"train_loss": -25.300691604614258, "global_step": 293909, "epoch": 3541} {"train_loss": -25.3393611907959, "global_step": 293910, "epoch": 3541} {"train_loss": -25.338092803955078, "global_step": 293911, "epoch": 3541} {"train_loss": -25.398727416992188, "global_step": 293912, "epoch": 3541} {"train_loss": -25.284717559814453, "global_step": 293913, "epoch": 3541} {"train_loss": -25.081539154052734, "global_step": 293914, "epoch": 3541} {"train_loss": -25.351932525634766, "global_step": 293915, "epoch": 3541} {"train_loss": -25.328283309936523, "global_step": 293916, "epoch": 3541} {"train_loss": -25.300046920776367, "global_step": 293917, "epoch": 3541} {"train_loss": -25.522735595703125, "global_step": 293918, "epoch": 3541} {"train_loss": -25.34323501586914, "global_step": 293919, "epoch": 3541} {"train_loss": -25.216754913330078, "global_step": 293920, "epoch": 3541} {"train_loss": -25.58808135986328, "global_step": 293921, "epoch": 3541} {"train_loss": -25.6094970703125, "global_step": 293922, "epoch": 3541} {"train_loss": -25.8691349029541, "global_step": 293923, "epoch": 3541} {"train_loss": -25.559720993041992, "global_step": 293924, "epoch": 3541} {"train_loss": -25.47150230407715, "global_step": 293925, "epoch": 3541} {"train_loss": -25.40216827392578, "global_step": 293926, "epoch": 3541} {"train_loss": -25.518712997436523, "global_step": 293927, "epoch": 3541} {"train_loss": -25.636810302734375, "global_step": 293928, "epoch": 3541} {"train_loss": -25.680234909057617, "global_step": 293929, "epoch": 3541} {"train_loss": -25.356382369995117, "global_step": 293930, "epoch": 3541} {"train_loss": -25.87347412109375, "global_step": 293931, "epoch": 3541} {"train_loss": -25.74665641784668, "global_step": 293932, "epoch": 3541} {"train_loss": -25.519506454467773, "global_step": 293933, "epoch": 3541} {"train_loss": -25.54905891418457, "global_step": 293934, "epoch": 3541} {"train_loss": -25.689971923828125, "global_step": 293935, "epoch": 3541} {"train_loss": -25.479703903198242, "global_step": 293936, "epoch": 3541} {"train_loss": -25.55494499206543, "global_step": 293937, "epoch": 3541} {"train_loss": -25.146865844726562, "global_step": 293938, "epoch": 3541} {"train_loss": -25.668745040893555, "global_step": 293939, "epoch": 3541} {"train_loss": -25.569114685058594, "global_step": 293940, "epoch": 3541} {"train_loss": -25.782211303710938, "global_step": 293941, "epoch": 3541} {"train_loss": -25.321815490722656, "global_step": 293942, "epoch": 3541} {"train_loss": -25.736526489257812, "global_step": 293943, "epoch": 3541} {"train_loss": -26.070051193237305, "global_step": 293944, "epoch": 3541} {"train_loss": -25.705707550048828, "global_step": 293945, "epoch": 3541} {"train_loss": -25.838735580444336, "global_step": 293946, "epoch": 3541} {"train_loss": -25.815216064453125, "global_step": 293947, "epoch": 3541} {"train_loss": -25.39533042907715, "global_step": 293948, "epoch": 3541} {"train_loss": -25.66265296936035, "global_step": 293949, "epoch": 3541} {"train_loss": -25.637121200561523, "global_step": 293950, "epoch": 3541} {"train_loss": -25.497434616088867, "global_step": 293951, "epoch": 3541} {"train_loss": -26.048009872436523, "global_step": 293952, "epoch": 3541} {"train_loss": -25.634674072265625, "global_step": 293953, "epoch": 3541} {"train_loss": -25.539701461791992, "global_step": 293954, "epoch": 3541} {"train_loss": -25.45057487487793, "global_step": 293955, "epoch": 3541} {"train_loss": -25.58553123474121, "global_step": 293956, "epoch": 3541} {"train_loss": -26.0810546875, "global_step": 293957, "epoch": 3541} {"train_loss": -26.030323028564453, "global_step": 293958, "epoch": 3541} {"train_loss": -25.823535919189453, "global_step": 293959, "epoch": 3541} {"train_loss": -25.345243453979492, "global_step": 293960, "epoch": 3541} {"train_loss": -25.67365074157715, "global_step": 293961, "epoch": 3541} {"train_loss": -25.50881004333496, "global_step": 293962, "epoch": 3541} {"train_loss": -25.61903953552246, "global_step": 293963, "epoch": 3541} {"train_loss": -25.54923439025879, "global_step": 293964, "epoch": 3541} {"train_loss": -25.385730743408203, "global_step": 293965, "epoch": 3541} {"train_loss": -25.72151756286621, "global_step": 293966, "epoch": 3541} {"train_loss": -25.4149227142334, "global_step": 293967, "epoch": 3541} {"train_loss": -25.206378936767578, "global_step": 293968, "epoch": 3541} {"train_loss": -24.973499298095703, "global_step": 293969, "epoch": 3541} {"train_loss": -24.948633193969727, "global_step": 293970, "epoch": 3541} {"train_loss": -25.720972061157227, "global_step": 293971, "epoch": 3541} {"train_loss": -25.28342056274414, "global_step": 293972, "epoch": 3541} {"train_loss": -25.346811294555664, "global_step": 293973, "epoch": 3541} {"train_loss": -25.43401527404785, "global_step": 293974, "epoch": 3541} {"train_loss": -25.668798446655273, "global_step": 293975, "epoch": 3541} {"train_loss": -25.448270797729492, "global_step": 293976, "epoch": 3541} {"train_loss": -25.718164443969727, "global_step": 293977, "epoch": 3541} {"train_loss": -25.75274658203125, "global_step": 293978, "epoch": 3541} {"train_loss": -25.622251510620117, "global_step": 293979, "epoch": 3541} {"train_loss": -25.517091751098633, "global_step": 293980, "epoch": 3541} {"train_loss": -25.13627052307129, "global_step": 293981, "epoch": 3541} {"train_loss": -25.7856502532959, "global_step": 293982, "epoch": 3541} {"train_loss": -25.222726821899414, "global_step": 293983, "epoch": 3541} {"train_loss": -25.444782257080078, "global_step": 293984, "epoch": 3541} {"train_loss": -25.471982703151472, "global_step": 293985, "epoch": 3541, "val_loss": 7281711.0} {"train_loss": -25.053964614868164, "global_step": 293986, "epoch": 3542} {"train_loss": -24.403324127197266, "global_step": 293987, "epoch": 3542} {"train_loss": -24.593290328979492, "global_step": 293988, "epoch": 3542} {"train_loss": -24.5653076171875, "global_step": 293989, "epoch": 3542} {"train_loss": -24.537656784057617, "global_step": 293990, "epoch": 3542} {"train_loss": -24.7733211517334, "global_step": 293991, "epoch": 3542} {"train_loss": -25.034011840820312, "global_step": 293992, "epoch": 3542} {"train_loss": -24.58620262145996, "global_step": 293993, "epoch": 3542} {"train_loss": -25.435346603393555, "global_step": 293994, "epoch": 3542} {"train_loss": -24.588903427124023, "global_step": 293995, "epoch": 3542} {"train_loss": -24.757009506225586, "global_step": 293996, "epoch": 3542} {"train_loss": -24.86301040649414, "global_step": 293997, "epoch": 3542} {"train_loss": -24.957548141479492, "global_step": 293998, "epoch": 3542} {"train_loss": -25.050323486328125, "global_step": 293999, "epoch": 3542} {"train_loss": -24.835588455200195, "global_step": 294000, "epoch": 3542} {"train_loss": -25.12537956237793, "global_step": 294001, "epoch": 3542} {"train_loss": -24.711811065673828, "global_step": 294002, "epoch": 3542} {"train_loss": -25.096403121948242, "global_step": 294003, "epoch": 3542} {"train_loss": -25.015201568603516, "global_step": 294004, "epoch": 3542} {"train_loss": -25.054950714111328, "global_step": 294005, "epoch": 3542} {"train_loss": -25.173654556274414, "global_step": 294006, "epoch": 3542} {"train_loss": -25.009008407592773, "global_step": 294007, "epoch": 3542} {"train_loss": -25.330686569213867, "global_step": 294008, "epoch": 3542} {"train_loss": -25.01509666442871, "global_step": 294009, "epoch": 3542} {"train_loss": -25.720108032226562, "global_step": 294010, "epoch": 3542} {"train_loss": -25.120319366455078, "global_step": 294011, "epoch": 3542} {"train_loss": -25.371559143066406, "global_step": 294012, "epoch": 3542} {"train_loss": -25.79294776916504, "global_step": 294013, "epoch": 3542} {"train_loss": -25.421552658081055, "global_step": 294014, "epoch": 3542} {"train_loss": -25.465198516845703, "global_step": 294015, "epoch": 3542} {"train_loss": -25.955347061157227, "global_step": 294016, "epoch": 3542} {"train_loss": -25.472993850708008, "global_step": 294017, "epoch": 3542} {"train_loss": -25.766080856323242, "global_step": 294018, "epoch": 3542} {"train_loss": -25.518722534179688, "global_step": 294019, "epoch": 3542} {"train_loss": -25.378400802612305, "global_step": 294020, "epoch": 3542} {"train_loss": -25.428564071655273, "global_step": 294021, "epoch": 3542} {"train_loss": -25.82508659362793, "global_step": 294022, "epoch": 3542} {"train_loss": -25.527755737304688, "global_step": 294023, "epoch": 3542} {"train_loss": -25.91168785095215, "global_step": 294024, "epoch": 3542} {"train_loss": -25.42828941345215, "global_step": 294025, "epoch": 3542} {"train_loss": -25.976133346557617, "global_step": 294026, "epoch": 3542} {"train_loss": -25.27859878540039, "global_step": 294027, "epoch": 3542} {"train_loss": -25.621366500854492, "global_step": 294028, "epoch": 3542} {"train_loss": -25.641071319580078, "global_step": 294029, "epoch": 3542} {"train_loss": -25.762836456298828, "global_step": 294030, "epoch": 3542} {"train_loss": -25.6968936920166, "global_step": 294031, "epoch": 3542} {"train_loss": -25.7180233001709, "global_step": 294032, "epoch": 3542} {"train_loss": -25.626712799072266, "global_step": 294033, "epoch": 3542} {"train_loss": -25.87961769104004, "global_step": 294034, "epoch": 3542} {"train_loss": -26.252613067626953, "global_step": 294035, "epoch": 3542} {"train_loss": -25.651123046875, "global_step": 294036, "epoch": 3542} {"train_loss": -25.89874267578125, "global_step": 294037, "epoch": 3542} {"train_loss": -25.342538833618164, "global_step": 294038, "epoch": 3542} {"train_loss": -25.523767471313477, "global_step": 294039, "epoch": 3542} {"train_loss": -25.611860275268555, "global_step": 294040, "epoch": 3542} {"train_loss": -25.674970626831055, "global_step": 294041, "epoch": 3542} {"train_loss": -25.6462459564209, "global_step": 294042, "epoch": 3542} {"train_loss": -25.679733276367188, "global_step": 294043, "epoch": 3542} {"train_loss": -25.557104110717773, "global_step": 294044, "epoch": 3542} {"train_loss": -25.364765167236328, "global_step": 294045, "epoch": 3542} {"train_loss": -25.844619750976562, "global_step": 294046, "epoch": 3542} {"train_loss": -25.48274040222168, "global_step": 294047, "epoch": 3542} {"train_loss": -25.736968994140625, "global_step": 294048, "epoch": 3542} {"train_loss": -25.521656036376953, "global_step": 294049, "epoch": 3542} {"train_loss": -25.501916885375977, "global_step": 294050, "epoch": 3542} {"train_loss": -25.610204696655273, "global_step": 294051, "epoch": 3542} {"train_loss": -25.337968826293945, "global_step": 294052, "epoch": 3542} {"train_loss": -25.596927642822266, "global_step": 294053, "epoch": 3542} {"train_loss": -25.504352569580078, "global_step": 294054, "epoch": 3542} {"train_loss": -25.864896774291992, "global_step": 294055, "epoch": 3542} {"train_loss": -25.342317581176758, "global_step": 294056, "epoch": 3542} {"train_loss": -25.597496032714844, "global_step": 294057, "epoch": 3542} {"train_loss": -25.669692993164062, "global_step": 294058, "epoch": 3542} {"train_loss": -25.479040145874023, "global_step": 294059, "epoch": 3542} {"train_loss": -26.212072372436523, "global_step": 294060, "epoch": 3542} {"train_loss": -25.131866455078125, "global_step": 294061, "epoch": 3542} {"train_loss": -25.476978302001953, "global_step": 294062, "epoch": 3542} {"train_loss": -25.59067153930664, "global_step": 294063, "epoch": 3542} {"train_loss": -25.480504989624023, "global_step": 294064, "epoch": 3542} {"train_loss": -25.819965362548828, "global_step": 294065, "epoch": 3542} {"train_loss": -25.361980438232422, "global_step": 294066, "epoch": 3542} {"train_loss": -25.761022567749023, "global_step": 294067, "epoch": 3542} {"train_loss": -25.396333694458008, "global_step": 294068, "epoch": 3542, "val_loss": 7124387.0} {"train_loss": -23.00247573852539, "global_step": 294069, "epoch": 3543} {"train_loss": -22.94479751586914, "global_step": 294070, "epoch": 3543} {"train_loss": -23.602590560913086, "global_step": 294071, "epoch": 3543} {"train_loss": -22.975242614746094, "global_step": 294072, "epoch": 3543} {"train_loss": -23.590686798095703, "global_step": 294073, "epoch": 3543} {"train_loss": -24.19321632385254, "global_step": 294074, "epoch": 3543} {"train_loss": -22.9417781829834, "global_step": 294075, "epoch": 3543} {"train_loss": -24.29656982421875, "global_step": 294076, "epoch": 3543} {"train_loss": -24.218236923217773, "global_step": 294077, "epoch": 3543} {"train_loss": -23.848129272460938, "global_step": 294078, "epoch": 3543} {"train_loss": -24.489118576049805, "global_step": 294079, "epoch": 3543} {"train_loss": -24.372203826904297, "global_step": 294080, "epoch": 3543} {"train_loss": -24.66128921508789, "global_step": 294081, "epoch": 3543} {"train_loss": -24.434844970703125, "global_step": 294082, "epoch": 3543} {"train_loss": -24.30810546875, "global_step": 294083, "epoch": 3543} {"train_loss": -24.499427795410156, "global_step": 294084, "epoch": 3543} {"train_loss": -24.586151123046875, "global_step": 294085, "epoch": 3543} {"train_loss": -24.818235397338867, "global_step": 294086, "epoch": 3543} {"train_loss": -24.58194351196289, "global_step": 294087, "epoch": 3543} {"train_loss": -24.800413131713867, "global_step": 294088, "epoch": 3543} {"train_loss": -24.638341903686523, "global_step": 294089, "epoch": 3543} {"train_loss": -24.65720558166504, "global_step": 294090, "epoch": 3543} {"train_loss": -25.00777244567871, "global_step": 294091, "epoch": 3543} {"train_loss": -24.901960372924805, "global_step": 294092, "epoch": 3543} {"train_loss": -24.85472869873047, "global_step": 294093, "epoch": 3543} {"train_loss": -24.50577163696289, "global_step": 294094, "epoch": 3543} {"train_loss": -24.531713485717773, "global_step": 294095, "epoch": 3543} {"train_loss": -25.17759132385254, "global_step": 294096, "epoch": 3543} {"train_loss": -25.054662704467773, "global_step": 294097, "epoch": 3543} {"train_loss": -24.826993942260742, "global_step": 294098, "epoch": 3543} {"train_loss": -25.0220890045166, "global_step": 294099, "epoch": 3543} {"train_loss": -24.60872459411621, "global_step": 294100, "epoch": 3543} {"train_loss": -25.04195213317871, "global_step": 294101, "epoch": 3543} {"train_loss": -24.847352981567383, "global_step": 294102, "epoch": 3543} {"train_loss": -25.363309860229492, "global_step": 294103, "epoch": 3543} {"train_loss": -25.390792846679688, "global_step": 294104, "epoch": 3543} {"train_loss": -25.120126724243164, "global_step": 294105, "epoch": 3543} {"train_loss": -25.305627822875977, "global_step": 294106, "epoch": 3543} {"train_loss": -25.193737030029297, "global_step": 294107, "epoch": 3543} {"train_loss": -25.1629695892334, "global_step": 294108, "epoch": 3543} {"train_loss": -25.449783325195312, "global_step": 294109, "epoch": 3543} {"train_loss": -25.40695571899414, "global_step": 294110, "epoch": 3543} {"train_loss": -25.48662567138672, "global_step": 294111, "epoch": 3543} {"train_loss": -25.655120849609375, "global_step": 294112, "epoch": 3543} {"train_loss": -25.189483642578125, "global_step": 294113, "epoch": 3543} {"train_loss": -25.337385177612305, "global_step": 294114, "epoch": 3543} {"train_loss": -24.962854385375977, "global_step": 294115, "epoch": 3543} {"train_loss": -25.710357666015625, "global_step": 294116, "epoch": 3543} {"train_loss": -25.691198348999023, "global_step": 294117, "epoch": 3543} {"train_loss": -25.336915969848633, "global_step": 294118, "epoch": 3543} {"train_loss": -25.613855361938477, "global_step": 294119, "epoch": 3543} {"train_loss": -25.596920013427734, "global_step": 294120, "epoch": 3543} {"train_loss": -25.435056686401367, "global_step": 294121, "epoch": 3543} {"train_loss": -25.560880661010742, "global_step": 294122, "epoch": 3543} {"train_loss": -25.591772079467773, "global_step": 294123, "epoch": 3543} {"train_loss": -25.577457427978516, "global_step": 294124, "epoch": 3543} {"train_loss": -25.4529972076416, "global_step": 294125, "epoch": 3543} {"train_loss": -25.39015769958496, "global_step": 294126, "epoch": 3543} {"train_loss": -25.532657623291016, "global_step": 294127, "epoch": 3543} {"train_loss": -25.69056510925293, "global_step": 294128, "epoch": 3543} {"train_loss": -25.662084579467773, "global_step": 294129, "epoch": 3543} {"train_loss": -25.7056884765625, "global_step": 294130, "epoch": 3543} {"train_loss": -25.881912231445312, "global_step": 294131, "epoch": 3543} {"train_loss": -25.58416748046875, "global_step": 294132, "epoch": 3543} {"train_loss": -25.628082275390625, "global_step": 294133, "epoch": 3543} {"train_loss": -25.5184268951416, "global_step": 294134, "epoch": 3543} {"train_loss": -25.901269912719727, "global_step": 294135, "epoch": 3543} {"train_loss": -25.937164306640625, "global_step": 294136, "epoch": 3543} {"train_loss": -25.657880783081055, "global_step": 294137, "epoch": 3543} {"train_loss": -25.73418617248535, "global_step": 294138, "epoch": 3543} {"train_loss": -25.678525924682617, "global_step": 294139, "epoch": 3543} {"train_loss": -25.92987060546875, "global_step": 294140, "epoch": 3543} {"train_loss": -25.963117599487305, "global_step": 294141, "epoch": 3543} {"train_loss": -25.644367218017578, "global_step": 294142, "epoch": 3543} {"train_loss": -25.835729598999023, "global_step": 294143, "epoch": 3543} {"train_loss": -25.597097396850586, "global_step": 294144, "epoch": 3543} {"train_loss": -25.698331832885742, "global_step": 294145, "epoch": 3543} {"train_loss": -25.619892120361328, "global_step": 294146, "epoch": 3543} {"train_loss": -25.8568058013916, "global_step": 294147, "epoch": 3543} {"train_loss": -26.1904239654541, "global_step": 294148, "epoch": 3543} {"train_loss": -25.609704971313477, "global_step": 294149, "epoch": 3543} {"train_loss": -25.158227920532227, "global_step": 294150, "epoch": 3543} {"train_loss": -25.08325236676687, "global_step": 294151, "epoch": 3543, "val_loss": 7163080.0} {"train_loss": -25.10614013671875, "global_step": 294152, "epoch": 3544} {"train_loss": -23.65891456604004, "global_step": 294153, "epoch": 3544} {"train_loss": -24.314651489257812, "global_step": 294154, "epoch": 3544} {"train_loss": -25.109472274780273, "global_step": 294155, "epoch": 3544} {"train_loss": -24.64700698852539, "global_step": 294156, "epoch": 3544} {"train_loss": -24.283374786376953, "global_step": 294157, "epoch": 3544} {"train_loss": -24.750185012817383, "global_step": 294158, "epoch": 3544} {"train_loss": -24.43879508972168, "global_step": 294159, "epoch": 3544} {"train_loss": -24.783130645751953, "global_step": 294160, "epoch": 3544} {"train_loss": -25.18120002746582, "global_step": 294161, "epoch": 3544} {"train_loss": -24.913816452026367, "global_step": 294162, "epoch": 3544} {"train_loss": -25.245946884155273, "global_step": 294163, "epoch": 3544} {"train_loss": -24.900291442871094, "global_step": 294164, "epoch": 3544} {"train_loss": -25.070430755615234, "global_step": 294165, "epoch": 3544} {"train_loss": -24.73927116394043, "global_step": 294166, "epoch": 3544} {"train_loss": -24.828386306762695, "global_step": 294167, "epoch": 3544} {"train_loss": -25.497520446777344, "global_step": 294168, "epoch": 3544} {"train_loss": -25.173192977905273, "global_step": 294169, "epoch": 3544} {"train_loss": -25.3326358795166, "global_step": 294170, "epoch": 3544} {"train_loss": -24.902870178222656, "global_step": 294171, "epoch": 3544} {"train_loss": -25.362089157104492, "global_step": 294172, "epoch": 3544} {"train_loss": -24.87078857421875, "global_step": 294173, "epoch": 3544} {"train_loss": -25.31794548034668, "global_step": 294174, "epoch": 3544} {"train_loss": -25.42214584350586, "global_step": 294175, "epoch": 3544} {"train_loss": -25.25275230407715, "global_step": 294176, "epoch": 3544} {"train_loss": -25.55221939086914, "global_step": 294177, "epoch": 3544} {"train_loss": -25.404085159301758, "global_step": 294178, "epoch": 3544} {"train_loss": -25.490285873413086, "global_step": 294179, "epoch": 3544} {"train_loss": -25.487672805786133, "global_step": 294180, "epoch": 3544} {"train_loss": -25.575178146362305, "global_step": 294181, "epoch": 3544} {"train_loss": -25.431568145751953, "global_step": 294182, "epoch": 3544} {"train_loss": -25.295408248901367, "global_step": 294183, "epoch": 3544} {"train_loss": -25.48582649230957, "global_step": 294184, "epoch": 3544} {"train_loss": -25.483469009399414, "global_step": 294185, "epoch": 3544} {"train_loss": -25.589614868164062, "global_step": 294186, "epoch": 3544} {"train_loss": -26.03533363342285, "global_step": 294187, "epoch": 3544} {"train_loss": -25.351064682006836, "global_step": 294188, "epoch": 3544} {"train_loss": -25.663782119750977, "global_step": 294189, "epoch": 3544} {"train_loss": -25.58152961730957, "global_step": 294190, "epoch": 3544} {"train_loss": -25.407264709472656, "global_step": 294191, "epoch": 3544} {"train_loss": -25.548479080200195, "global_step": 294192, "epoch": 3544} {"train_loss": -25.527551651000977, "global_step": 294193, "epoch": 3544} {"train_loss": -25.56266212463379, "global_step": 294194, "epoch": 3544} {"train_loss": -25.84832191467285, "global_step": 294195, "epoch": 3544} {"train_loss": -25.515857696533203, "global_step": 294196, "epoch": 3544} {"train_loss": -25.536420822143555, "global_step": 294197, "epoch": 3544} {"train_loss": -25.779035568237305, "global_step": 294198, "epoch": 3544} {"train_loss": -25.675573348999023, "global_step": 294199, "epoch": 3544} {"train_loss": -25.450170516967773, "global_step": 294200, "epoch": 3544} {"train_loss": -26.014474868774414, "global_step": 294201, "epoch": 3544} {"train_loss": -25.60066032409668, "global_step": 294202, "epoch": 3544} {"train_loss": -25.796430587768555, "global_step": 294203, "epoch": 3544} {"train_loss": -25.779272079467773, "global_step": 294204, "epoch": 3544} {"train_loss": -25.426841735839844, "global_step": 294205, "epoch": 3544} {"train_loss": -25.510404586791992, "global_step": 294206, "epoch": 3544} {"train_loss": -25.523710250854492, "global_step": 294207, "epoch": 3544} {"train_loss": -25.712926864624023, "global_step": 294208, "epoch": 3544} {"train_loss": -25.667646408081055, "global_step": 294209, "epoch": 3544} {"train_loss": -25.460098266601562, "global_step": 294210, "epoch": 3544} {"train_loss": -25.880640029907227, "global_step": 294211, "epoch": 3544} {"train_loss": -25.59714698791504, "global_step": 294212, "epoch": 3544} {"train_loss": -25.895050048828125, "global_step": 294213, "epoch": 3544} {"train_loss": -25.78510856628418, "global_step": 294214, "epoch": 3544} {"train_loss": -25.752588272094727, "global_step": 294215, "epoch": 3544} {"train_loss": -25.932159423828125, "global_step": 294216, "epoch": 3544} {"train_loss": -25.648279190063477, "global_step": 294217, "epoch": 3544} {"train_loss": -26.01112174987793, "global_step": 294218, "epoch": 3544} {"train_loss": -25.6732177734375, "global_step": 294219, "epoch": 3544} {"train_loss": -25.334028244018555, "global_step": 294220, "epoch": 3544} {"train_loss": -26.008880615234375, "global_step": 294221, "epoch": 3544} {"train_loss": -26.130178451538086, "global_step": 294222, "epoch": 3544} {"train_loss": -25.37200927734375, "global_step": 294223, "epoch": 3544} {"train_loss": -25.189889907836914, "global_step": 294224, "epoch": 3544} {"train_loss": -25.055362701416016, "global_step": 294225, "epoch": 3544} {"train_loss": -24.87384033203125, "global_step": 294226, "epoch": 3544} {"train_loss": -25.076004028320312, "global_step": 294227, "epoch": 3544} {"train_loss": -25.341527938842773, "global_step": 294228, "epoch": 3544} {"train_loss": -25.409896850585938, "global_step": 294229, "epoch": 3544} {"train_loss": -25.56314468383789, "global_step": 294230, "epoch": 3544} {"train_loss": -25.94867515563965, "global_step": 294231, "epoch": 3544} {"train_loss": -25.6766300201416, "global_step": 294232, "epoch": 3544} {"train_loss": -25.413116455078125, "global_step": 294233, "epoch": 3544} {"train_loss": -25.396705788302135, "global_step": 294234, "epoch": 3544, "val_loss": 7250975.0} {"train_loss": -25.475616455078125, "global_step": 294235, "epoch": 3545} {"train_loss": -24.629003524780273, "global_step": 294236, "epoch": 3545} {"train_loss": -25.333633422851562, "global_step": 294237, "epoch": 3545} {"train_loss": -25.61002540588379, "global_step": 294238, "epoch": 3545} {"train_loss": -24.909027099609375, "global_step": 294239, "epoch": 3545} {"train_loss": -25.11476707458496, "global_step": 294240, "epoch": 3545} {"train_loss": -25.304025650024414, "global_step": 294241, "epoch": 3545} {"train_loss": -25.255945205688477, "global_step": 294242, "epoch": 3545} {"train_loss": -25.17860221862793, "global_step": 294243, "epoch": 3545} {"train_loss": -25.1169490814209, "global_step": 294244, "epoch": 3545} {"train_loss": -25.455413818359375, "global_step": 294245, "epoch": 3545} {"train_loss": -25.215166091918945, "global_step": 294246, "epoch": 3545} {"train_loss": -25.562536239624023, "global_step": 294247, "epoch": 3545} {"train_loss": -25.238218307495117, "global_step": 294248, "epoch": 3545} {"train_loss": -25.10883140563965, "global_step": 294249, "epoch": 3545} {"train_loss": -25.195484161376953, "global_step": 294250, "epoch": 3545} {"train_loss": -25.450416564941406, "global_step": 294251, "epoch": 3545} {"train_loss": -25.579442977905273, "global_step": 294252, "epoch": 3545} {"train_loss": -25.38362693786621, "global_step": 294253, "epoch": 3545} {"train_loss": -25.5533504486084, "global_step": 294254, "epoch": 3545} {"train_loss": -25.342926025390625, "global_step": 294255, "epoch": 3545} {"train_loss": -25.00355339050293, "global_step": 294256, "epoch": 3545} {"train_loss": -25.25437355041504, "global_step": 294257, "epoch": 3545} {"train_loss": -25.37973976135254, "global_step": 294258, "epoch": 3545} {"train_loss": -25.733060836791992, "global_step": 294259, "epoch": 3545} {"train_loss": -25.318286895751953, "global_step": 294260, "epoch": 3545} {"train_loss": -25.59799575805664, "global_step": 294261, "epoch": 3545} {"train_loss": -25.60651206970215, "global_step": 294262, "epoch": 3545} {"train_loss": -25.128469467163086, "global_step": 294263, "epoch": 3545} {"train_loss": -25.64069938659668, "global_step": 294264, "epoch": 3545} {"train_loss": -25.6396484375, "global_step": 294265, "epoch": 3545} {"train_loss": -25.244308471679688, "global_step": 294266, "epoch": 3545} {"train_loss": -25.62127685546875, "global_step": 294267, "epoch": 3545} {"train_loss": -25.730239868164062, "global_step": 294268, "epoch": 3545} {"train_loss": -25.609464645385742, "global_step": 294269, "epoch": 3545} {"train_loss": -25.861419677734375, "global_step": 294270, "epoch": 3545} {"train_loss": -25.700775146484375, "global_step": 294271, "epoch": 3545} {"train_loss": -25.700916290283203, "global_step": 294272, "epoch": 3545} {"train_loss": -25.467639923095703, "global_step": 294273, "epoch": 3545} {"train_loss": -25.505096435546875, "global_step": 294274, "epoch": 3545} {"train_loss": -25.52377700805664, "global_step": 294275, "epoch": 3545} {"train_loss": -25.826004028320312, "global_step": 294276, "epoch": 3545} {"train_loss": -25.44696807861328, "global_step": 294277, "epoch": 3545} {"train_loss": -25.92584800720215, "global_step": 294278, "epoch": 3545} {"train_loss": -25.59701156616211, "global_step": 294279, "epoch": 3545} {"train_loss": -25.316715240478516, "global_step": 294280, "epoch": 3545} {"train_loss": -25.350872039794922, "global_step": 294281, "epoch": 3545} {"train_loss": -25.661670684814453, "global_step": 294282, "epoch": 3545} {"train_loss": -25.79631996154785, "global_step": 294283, "epoch": 3545} {"train_loss": -25.938617706298828, "global_step": 294284, "epoch": 3545} {"train_loss": -25.557373046875, "global_step": 294285, "epoch": 3545} {"train_loss": -25.762134552001953, "global_step": 294286, "epoch": 3545} {"train_loss": -25.275747299194336, "global_step": 294287, "epoch": 3545} {"train_loss": -25.55960464477539, "global_step": 294288, "epoch": 3545} {"train_loss": -25.70611572265625, "global_step": 294289, "epoch": 3545} {"train_loss": -25.683629989624023, "global_step": 294290, "epoch": 3545} {"train_loss": -25.265289306640625, "global_step": 294291, "epoch": 3545} {"train_loss": -25.800260543823242, "global_step": 294292, "epoch": 3545} {"train_loss": -25.497533798217773, "global_step": 294293, "epoch": 3545} {"train_loss": -25.489587783813477, "global_step": 294294, "epoch": 3545} {"train_loss": -25.929794311523438, "global_step": 294295, "epoch": 3545} {"train_loss": -25.708877563476562, "global_step": 294296, "epoch": 3545} {"train_loss": -25.6702880859375, "global_step": 294297, "epoch": 3545} {"train_loss": -25.42537498474121, "global_step": 294298, "epoch": 3545} {"train_loss": -25.6865291595459, "global_step": 294299, "epoch": 3545} {"train_loss": -25.561037063598633, "global_step": 294300, "epoch": 3545} {"train_loss": -25.63594627380371, "global_step": 294301, "epoch": 3545} {"train_loss": -25.69698143005371, "global_step": 294302, "epoch": 3545} {"train_loss": -25.584333419799805, "global_step": 294303, "epoch": 3545} {"train_loss": -25.684926986694336, "global_step": 294304, "epoch": 3545} {"train_loss": -25.73929214477539, "global_step": 294305, "epoch": 3545} {"train_loss": -25.498342514038086, "global_step": 294306, "epoch": 3545} {"train_loss": -25.68486976623535, "global_step": 294307, "epoch": 3545} {"train_loss": -26.018707275390625, "global_step": 294308, "epoch": 3545} {"train_loss": -25.537097930908203, "global_step": 294309, "epoch": 3545} {"train_loss": -25.58806800842285, "global_step": 294310, "epoch": 3545} {"train_loss": -25.623950958251953, "global_step": 294311, "epoch": 3545} {"train_loss": -25.466176986694336, "global_step": 294312, "epoch": 3545} {"train_loss": -25.96257972717285, "global_step": 294313, "epoch": 3545} {"train_loss": -25.834157943725586, "global_step": 294314, "epoch": 3545} {"train_loss": -25.77846336364746, "global_step": 294315, "epoch": 3545} {"train_loss": -25.605798721313477, "global_step": 294316, "epoch": 3545} {"train_loss": -25.528092533709057, "global_step": 294317, "epoch": 3545, "val_loss": 7135799.0} {"train_loss": -24.956533432006836, "global_step": 294318, "epoch": 3546} {"train_loss": -24.444324493408203, "global_step": 294319, "epoch": 3546} {"train_loss": -24.600698471069336, "global_step": 294320, "epoch": 3546} {"train_loss": -24.59371566772461, "global_step": 294321, "epoch": 3546} {"train_loss": -24.862756729125977, "global_step": 294322, "epoch": 3546} {"train_loss": -25.522022247314453, "global_step": 294323, "epoch": 3546} {"train_loss": -25.2093563079834, "global_step": 294324, "epoch": 3546} {"train_loss": -24.660385131835938, "global_step": 294325, "epoch": 3546} {"train_loss": -25.4821720123291, "global_step": 294326, "epoch": 3546} {"train_loss": -25.13965606689453, "global_step": 294327, "epoch": 3546} {"train_loss": -25.32369041442871, "global_step": 294328, "epoch": 3546} {"train_loss": -24.93733024597168, "global_step": 294329, "epoch": 3546} {"train_loss": -25.370399475097656, "global_step": 294330, "epoch": 3546} {"train_loss": -24.697092056274414, "global_step": 294331, "epoch": 3546} {"train_loss": -25.125532150268555, "global_step": 294332, "epoch": 3546} {"train_loss": -25.40180015563965, "global_step": 294333, "epoch": 3546} {"train_loss": -24.9612979888916, "global_step": 294334, "epoch": 3546} {"train_loss": -25.15921401977539, "global_step": 294335, "epoch": 3546} {"train_loss": -25.114089965820312, "global_step": 294336, "epoch": 3546} {"train_loss": -24.896976470947266, "global_step": 294337, "epoch": 3546} {"train_loss": -25.2719783782959, "global_step": 294338, "epoch": 3546} {"train_loss": -25.353351593017578, "global_step": 294339, "epoch": 3546} {"train_loss": -25.28985595703125, "global_step": 294340, "epoch": 3546} {"train_loss": -25.26657485961914, "global_step": 294341, "epoch": 3546} {"train_loss": -24.73059844970703, "global_step": 294342, "epoch": 3546} {"train_loss": -25.302997589111328, "global_step": 294343, "epoch": 3546} {"train_loss": -25.017047882080078, "global_step": 294344, "epoch": 3546} {"train_loss": -25.76112174987793, "global_step": 294345, "epoch": 3546} {"train_loss": -25.375259399414062, "global_step": 294346, "epoch": 3546} {"train_loss": -25.62799644470215, "global_step": 294347, "epoch": 3546} {"train_loss": -25.309003829956055, "global_step": 294348, "epoch": 3546} {"train_loss": -25.87959098815918, "global_step": 294349, "epoch": 3546} {"train_loss": -25.36362648010254, "global_step": 294350, "epoch": 3546} {"train_loss": -25.4073486328125, "global_step": 294351, "epoch": 3546} {"train_loss": -25.487302780151367, "global_step": 294352, "epoch": 3546} {"train_loss": -25.686105728149414, "global_step": 294353, "epoch": 3546} {"train_loss": -25.242294311523438, "global_step": 294354, "epoch": 3546} {"train_loss": -25.723312377929688, "global_step": 294355, "epoch": 3546} {"train_loss": -25.15375518798828, "global_step": 294356, "epoch": 3546} {"train_loss": -25.588314056396484, "global_step": 294357, "epoch": 3546} {"train_loss": -25.733341217041016, "global_step": 294358, "epoch": 3546} {"train_loss": -25.546415328979492, "global_step": 294359, "epoch": 3546} {"train_loss": -25.6746826171875, "global_step": 294360, "epoch": 3546} {"train_loss": -25.647724151611328, "global_step": 294361, "epoch": 3546} {"train_loss": -25.28567123413086, "global_step": 294362, "epoch": 3546} {"train_loss": -25.343969345092773, "global_step": 294363, "epoch": 3546} {"train_loss": -25.408334732055664, "global_step": 294364, "epoch": 3546} {"train_loss": -25.847171783447266, "global_step": 294365, "epoch": 3546} {"train_loss": -25.457916259765625, "global_step": 294366, "epoch": 3546} {"train_loss": -25.298038482666016, "global_step": 294367, "epoch": 3546} {"train_loss": -25.85993766784668, "global_step": 294368, "epoch": 3546} {"train_loss": -25.506084442138672, "global_step": 294369, "epoch": 3546} {"train_loss": -25.140697479248047, "global_step": 294370, "epoch": 3546} {"train_loss": -25.45448112487793, "global_step": 294371, "epoch": 3546} {"train_loss": -25.535444259643555, "global_step": 294372, "epoch": 3546} {"train_loss": -25.757110595703125, "global_step": 294373, "epoch": 3546} {"train_loss": -25.254026412963867, "global_step": 294374, "epoch": 3546} {"train_loss": -25.550466537475586, "global_step": 294375, "epoch": 3546} {"train_loss": -25.642797470092773, "global_step": 294376, "epoch": 3546} {"train_loss": -25.47904396057129, "global_step": 294377, "epoch": 3546} {"train_loss": -25.559165954589844, "global_step": 294378, "epoch": 3546} {"train_loss": -25.683908462524414, "global_step": 294379, "epoch": 3546} {"train_loss": -25.613779067993164, "global_step": 294380, "epoch": 3546} {"train_loss": -25.272069931030273, "global_step": 294381, "epoch": 3546} {"train_loss": -25.5041561126709, "global_step": 294382, "epoch": 3546} {"train_loss": -25.31905174255371, "global_step": 294383, "epoch": 3546} {"train_loss": -25.12116813659668, "global_step": 294384, "epoch": 3546} {"train_loss": -25.238849639892578, "global_step": 294385, "epoch": 3546} {"train_loss": -25.239784240722656, "global_step": 294386, "epoch": 3546} {"train_loss": -25.63667106628418, "global_step": 294387, "epoch": 3546} {"train_loss": -24.888290405273438, "global_step": 294388, "epoch": 3546} {"train_loss": -25.401426315307617, "global_step": 294389, "epoch": 3546} {"train_loss": -25.046716690063477, "global_step": 294390, "epoch": 3546} {"train_loss": -25.566442489624023, "global_step": 294391, "epoch": 3546} {"train_loss": -25.314714431762695, "global_step": 294392, "epoch": 3546} {"train_loss": -25.266477584838867, "global_step": 294393, "epoch": 3546} {"train_loss": -25.479385375976562, "global_step": 294394, "epoch": 3546} {"train_loss": -25.815418243408203, "global_step": 294395, "epoch": 3546} {"train_loss": -25.415842056274414, "global_step": 294396, "epoch": 3546} {"train_loss": -25.41383934020996, "global_step": 294397, "epoch": 3546} {"train_loss": -25.386123657226562, "global_step": 294398, "epoch": 3546} {"train_loss": -25.706945419311523, "global_step": 294399, "epoch": 3546} {"train_loss": -25.31820784419416, "global_step": 294400, "epoch": 3546, "val_loss": 7082691.0} {"train_loss": -25.450742721557617, "global_step": 294401, "epoch": 3547} {"train_loss": -24.965158462524414, "global_step": 294402, "epoch": 3547} {"train_loss": -25.0980281829834, "global_step": 294403, "epoch": 3547} {"train_loss": -25.477577209472656, "global_step": 294404, "epoch": 3547} {"train_loss": -25.876474380493164, "global_step": 294405, "epoch": 3547} {"train_loss": -25.573410034179688, "global_step": 294406, "epoch": 3547} {"train_loss": -25.514493942260742, "global_step": 294407, "epoch": 3547} {"train_loss": -25.2529354095459, "global_step": 294408, "epoch": 3547} {"train_loss": -25.23348045349121, "global_step": 294409, "epoch": 3547} {"train_loss": -25.32086753845215, "global_step": 294410, "epoch": 3547} {"train_loss": -25.8094482421875, "global_step": 294411, "epoch": 3547} {"train_loss": -25.387069702148438, "global_step": 294412, "epoch": 3547} {"train_loss": -25.267423629760742, "global_step": 294413, "epoch": 3547} {"train_loss": -25.518980026245117, "global_step": 294414, "epoch": 3547} {"train_loss": -25.479618072509766, "global_step": 294415, "epoch": 3547} {"train_loss": -25.128162384033203, "global_step": 294416, "epoch": 3547} {"train_loss": -25.502397537231445, "global_step": 294417, "epoch": 3547} {"train_loss": -25.35637855529785, "global_step": 294418, "epoch": 3547} {"train_loss": -25.297006607055664, "global_step": 294419, "epoch": 3547} {"train_loss": -25.203039169311523, "global_step": 294420, "epoch": 3547} {"train_loss": -25.7062931060791, "global_step": 294421, "epoch": 3547} {"train_loss": -25.49086570739746, "global_step": 294422, "epoch": 3547} {"train_loss": -25.718338012695312, "global_step": 294423, "epoch": 3547} {"train_loss": -25.577245712280273, "global_step": 294424, "epoch": 3547} {"train_loss": -25.994916915893555, "global_step": 294425, "epoch": 3547} {"train_loss": -25.870746612548828, "global_step": 294426, "epoch": 3547} {"train_loss": -25.641876220703125, "global_step": 294427, "epoch": 3547} {"train_loss": -25.517578125, "global_step": 294428, "epoch": 3547} {"train_loss": -25.62932777404785, "global_step": 294429, "epoch": 3547} {"train_loss": -25.806171417236328, "global_step": 294430, "epoch": 3547} {"train_loss": -25.641544342041016, "global_step": 294431, "epoch": 3547} {"train_loss": -25.84014320373535, "global_step": 294432, "epoch": 3547} {"train_loss": -25.816043853759766, "global_step": 294433, "epoch": 3547} {"train_loss": -25.740880966186523, "global_step": 294434, "epoch": 3547} {"train_loss": -25.48821449279785, "global_step": 294435, "epoch": 3547} {"train_loss": -25.976825714111328, "global_step": 294436, "epoch": 3547} {"train_loss": -25.73221778869629, "global_step": 294437, "epoch": 3547} {"train_loss": -26.697711944580078, "global_step": 294438, "epoch": 3547} {"train_loss": -25.489540100097656, "global_step": 294439, "epoch": 3547} {"train_loss": -25.77558708190918, "global_step": 294440, "epoch": 3547} {"train_loss": -25.711339950561523, "global_step": 294441, "epoch": 3547} {"train_loss": -25.809864044189453, "global_step": 294442, "epoch": 3547} {"train_loss": -25.684545516967773, "global_step": 294443, "epoch": 3547} {"train_loss": -25.7006893157959, "global_step": 294444, "epoch": 3547} {"train_loss": -25.72519874572754, "global_step": 294445, "epoch": 3547} {"train_loss": -25.691625595092773, "global_step": 294446, "epoch": 3547} {"train_loss": -25.700321197509766, "global_step": 294447, "epoch": 3547} {"train_loss": -25.33428955078125, "global_step": 294448, "epoch": 3547} {"train_loss": -25.377429962158203, "global_step": 294449, "epoch": 3547} {"train_loss": -25.5894832611084, "global_step": 294450, "epoch": 3547} {"train_loss": -25.6953125, "global_step": 294451, "epoch": 3547} {"train_loss": -25.583555221557617, "global_step": 294452, "epoch": 3547} {"train_loss": -25.153274536132812, "global_step": 294453, "epoch": 3547} {"train_loss": -25.616186141967773, "global_step": 294454, "epoch": 3547} {"train_loss": -25.701745986938477, "global_step": 294455, "epoch": 3547} {"train_loss": -25.774127960205078, "global_step": 294456, "epoch": 3547} {"train_loss": -25.5258731842041, "global_step": 294457, "epoch": 3547} {"train_loss": -25.957067489624023, "global_step": 294458, "epoch": 3547} {"train_loss": -25.404088973999023, "global_step": 294459, "epoch": 3547} {"train_loss": -25.62495994567871, "global_step": 294460, "epoch": 3547} {"train_loss": -25.480588912963867, "global_step": 294461, "epoch": 3547} {"train_loss": -25.965417861938477, "global_step": 294462, "epoch": 3547} {"train_loss": -25.802961349487305, "global_step": 294463, "epoch": 3547} {"train_loss": -25.379724502563477, "global_step": 294464, "epoch": 3547} {"train_loss": -25.858896255493164, "global_step": 294465, "epoch": 3547} {"train_loss": -25.426366806030273, "global_step": 294466, "epoch": 3547} {"train_loss": -25.501956939697266, "global_step": 294467, "epoch": 3547} {"train_loss": -25.388071060180664, "global_step": 294468, "epoch": 3547} {"train_loss": -25.31759262084961, "global_step": 294469, "epoch": 3547} {"train_loss": -25.522390365600586, "global_step": 294470, "epoch": 3547} {"train_loss": -25.693450927734375, "global_step": 294471, "epoch": 3547} {"train_loss": -25.640872955322266, "global_step": 294472, "epoch": 3547} {"train_loss": -25.964933395385742, "global_step": 294473, "epoch": 3547} {"train_loss": -25.486379623413086, "global_step": 294474, "epoch": 3547} {"train_loss": -25.556968688964844, "global_step": 294475, "epoch": 3547} {"train_loss": -25.632658004760742, "global_step": 294476, "epoch": 3547} {"train_loss": -25.36521339416504, "global_step": 294477, "epoch": 3547} {"train_loss": -25.38252067565918, "global_step": 294478, "epoch": 3547} {"train_loss": -25.731781005859375, "global_step": 294479, "epoch": 3547} {"train_loss": -25.3411808013916, "global_step": 294480, "epoch": 3547} {"train_loss": -25.64059829711914, "global_step": 294481, "epoch": 3547} {"train_loss": -25.750049591064453, "global_step": 294482, "epoch": 3547} {"train_loss": -25.5911343815815, "global_step": 294483, "epoch": 3547, "val_loss": 7096441.0} {"train_loss": -25.472686767578125, "global_step": 294484, "epoch": 3548} {"train_loss": -25.37796974182129, "global_step": 294485, "epoch": 3548} {"train_loss": -25.132665634155273, "global_step": 294486, "epoch": 3548} {"train_loss": -25.634414672851562, "global_step": 294487, "epoch": 3548} {"train_loss": -25.319135665893555, "global_step": 294488, "epoch": 3548} {"train_loss": -25.186420440673828, "global_step": 294489, "epoch": 3548} {"train_loss": -25.265439987182617, "global_step": 294490, "epoch": 3548} {"train_loss": -25.614477157592773, "global_step": 294491, "epoch": 3548} {"train_loss": -25.239107131958008, "global_step": 294492, "epoch": 3548} {"train_loss": -25.214317321777344, "global_step": 294493, "epoch": 3548} {"train_loss": -24.95755386352539, "global_step": 294494, "epoch": 3548} {"train_loss": -25.30881690979004, "global_step": 294495, "epoch": 3548} {"train_loss": -25.2136173248291, "global_step": 294496, "epoch": 3548} {"train_loss": -25.13644790649414, "global_step": 294497, "epoch": 3548} {"train_loss": -25.634719848632812, "global_step": 294498, "epoch": 3548} {"train_loss": -25.37082290649414, "global_step": 294499, "epoch": 3548} {"train_loss": -25.20444107055664, "global_step": 294500, "epoch": 3548} {"train_loss": -25.407886505126953, "global_step": 294501, "epoch": 3548} {"train_loss": -25.54195785522461, "global_step": 294502, "epoch": 3548} {"train_loss": -25.608434677124023, "global_step": 294503, "epoch": 3548} {"train_loss": -25.70294189453125, "global_step": 294504, "epoch": 3548} {"train_loss": -25.332456588745117, "global_step": 294505, "epoch": 3548} {"train_loss": -25.24382972717285, "global_step": 294506, "epoch": 3548} {"train_loss": -25.465576171875, "global_step": 294507, "epoch": 3548} {"train_loss": -25.243391036987305, "global_step": 294508, "epoch": 3548} {"train_loss": -25.314220428466797, "global_step": 294509, "epoch": 3548} {"train_loss": -25.480504989624023, "global_step": 294510, "epoch": 3548} {"train_loss": -25.46600341796875, "global_step": 294511, "epoch": 3548} {"train_loss": -25.565059661865234, "global_step": 294512, "epoch": 3548} {"train_loss": -25.70875358581543, "global_step": 294513, "epoch": 3548} {"train_loss": -25.817167282104492, "global_step": 294514, "epoch": 3548} {"train_loss": -25.849817276000977, "global_step": 294515, "epoch": 3548} {"train_loss": -25.491214752197266, "global_step": 294516, "epoch": 3548} {"train_loss": -25.516895294189453, "global_step": 294517, "epoch": 3548} {"train_loss": -25.376859664916992, "global_step": 294518, "epoch": 3548} {"train_loss": -25.68759536743164, "global_step": 294519, "epoch": 3548} {"train_loss": -25.403911590576172, "global_step": 294520, "epoch": 3548} {"train_loss": -25.403751373291016, "global_step": 294521, "epoch": 3548} {"train_loss": -25.683643341064453, "global_step": 294522, "epoch": 3548} {"train_loss": -25.678857803344727, "global_step": 294523, "epoch": 3548} {"train_loss": -25.573589324951172, "global_step": 294524, "epoch": 3548} {"train_loss": -25.76985740661621, "global_step": 294525, "epoch": 3548} {"train_loss": -25.82197380065918, "global_step": 294526, "epoch": 3548} {"train_loss": -25.471887588500977, "global_step": 294527, "epoch": 3548} {"train_loss": -25.54754066467285, "global_step": 294528, "epoch": 3548} {"train_loss": -25.64340591430664, "global_step": 294529, "epoch": 3548} {"train_loss": -25.65789222717285, "global_step": 294530, "epoch": 3548} {"train_loss": -25.530057907104492, "global_step": 294531, "epoch": 3548} {"train_loss": -25.497411727905273, "global_step": 294532, "epoch": 3548} {"train_loss": -25.64011573791504, "global_step": 294533, "epoch": 3548} {"train_loss": -25.831165313720703, "global_step": 294534, "epoch": 3548} {"train_loss": -25.813642501831055, "global_step": 294535, "epoch": 3548} {"train_loss": -25.59908676147461, "global_step": 294536, "epoch": 3548} {"train_loss": -25.47498893737793, "global_step": 294537, "epoch": 3548} {"train_loss": -25.82034683227539, "global_step": 294538, "epoch": 3548} {"train_loss": -25.36100196838379, "global_step": 294539, "epoch": 3548} {"train_loss": -25.827014923095703, "global_step": 294540, "epoch": 3548} {"train_loss": -25.65203857421875, "global_step": 294541, "epoch": 3548} {"train_loss": -25.85928726196289, "global_step": 294542, "epoch": 3548} {"train_loss": -25.734663009643555, "global_step": 294543, "epoch": 3548} {"train_loss": -25.611454010009766, "global_step": 294544, "epoch": 3548} {"train_loss": -25.88232421875, "global_step": 294545, "epoch": 3548} {"train_loss": -25.47650146484375, "global_step": 294546, "epoch": 3548} {"train_loss": -25.2791805267334, "global_step": 294547, "epoch": 3548} {"train_loss": -25.764638900756836, "global_step": 294548, "epoch": 3548} {"train_loss": -25.351810455322266, "global_step": 294549, "epoch": 3548} {"train_loss": -25.52931022644043, "global_step": 294550, "epoch": 3548} {"train_loss": -26.013198852539062, "global_step": 294551, "epoch": 3548} {"train_loss": -25.284650802612305, "global_step": 294552, "epoch": 3548} {"train_loss": -25.802722930908203, "global_step": 294553, "epoch": 3548} {"train_loss": -25.72333335876465, "global_step": 294554, "epoch": 3548} {"train_loss": -26.180822372436523, "global_step": 294555, "epoch": 3548} {"train_loss": -25.909717559814453, "global_step": 294556, "epoch": 3548} {"train_loss": -25.312374114990234, "global_step": 294557, "epoch": 3548} {"train_loss": -25.825605392456055, "global_step": 294558, "epoch": 3548} {"train_loss": -25.6547794342041, "global_step": 294559, "epoch": 3548} {"train_loss": -25.66071128845215, "global_step": 294560, "epoch": 3548} {"train_loss": -25.684040069580078, "global_step": 294561, "epoch": 3548} {"train_loss": -25.547704696655273, "global_step": 294562, "epoch": 3548} {"train_loss": -25.67694664001465, "global_step": 294563, "epoch": 3548} {"train_loss": -25.492599487304688, "global_step": 294564, "epoch": 3548} {"train_loss": -25.918054580688477, "global_step": 294565, "epoch": 3548} {"train_loss": -25.547780530998505, "global_step": 294566, "epoch": 3548, "val_loss": 7183015.0} {"train_loss": -24.079782485961914, "global_step": 294567, "epoch": 3549} {"train_loss": -24.016036987304688, "global_step": 294568, "epoch": 3549} {"train_loss": -25.34906768798828, "global_step": 294569, "epoch": 3549} {"train_loss": -24.89728546142578, "global_step": 294570, "epoch": 3549} {"train_loss": -24.834585189819336, "global_step": 294571, "epoch": 3549} {"train_loss": -24.749370574951172, "global_step": 294572, "epoch": 3549} {"train_loss": -25.239912033081055, "global_step": 294573, "epoch": 3549} {"train_loss": -25.025190353393555, "global_step": 294574, "epoch": 3549} {"train_loss": -25.17506217956543, "global_step": 294575, "epoch": 3549} {"train_loss": -24.734649658203125, "global_step": 294576, "epoch": 3549} {"train_loss": -25.259641647338867, "global_step": 294577, "epoch": 3549} {"train_loss": -25.03189468383789, "global_step": 294578, "epoch": 3549} {"train_loss": -25.11762809753418, "global_step": 294579, "epoch": 3549} {"train_loss": -25.367956161499023, "global_step": 294580, "epoch": 3549} {"train_loss": -24.959156036376953, "global_step": 294581, "epoch": 3549} {"train_loss": -25.42486572265625, "global_step": 294582, "epoch": 3549} {"train_loss": -25.821094512939453, "global_step": 294583, "epoch": 3549} {"train_loss": -25.656356811523438, "global_step": 294584, "epoch": 3549} {"train_loss": -25.363969802856445, "global_step": 294585, "epoch": 3549} {"train_loss": -25.296682357788086, "global_step": 294586, "epoch": 3549} {"train_loss": -25.379331588745117, "global_step": 294587, "epoch": 3549} {"train_loss": -25.787281036376953, "global_step": 294588, "epoch": 3549} {"train_loss": -25.287906646728516, "global_step": 294589, "epoch": 3549} {"train_loss": -25.954193115234375, "global_step": 294590, "epoch": 3549} {"train_loss": -25.620716094970703, "global_step": 294591, "epoch": 3549} {"train_loss": -25.514196395874023, "global_step": 294592, "epoch": 3549} {"train_loss": -25.62159538269043, "global_step": 294593, "epoch": 3549} {"train_loss": -25.50344467163086, "global_step": 294594, "epoch": 3549} {"train_loss": -25.744251251220703, "global_step": 294595, "epoch": 3549} {"train_loss": -25.77376365661621, "global_step": 294596, "epoch": 3549} {"train_loss": -25.557422637939453, "global_step": 294597, "epoch": 3549} {"train_loss": -25.636703491210938, "global_step": 294598, "epoch": 3549} {"train_loss": -25.581287384033203, "global_step": 294599, "epoch": 3549} {"train_loss": -25.388776779174805, "global_step": 294600, "epoch": 3549} {"train_loss": -25.72235679626465, "global_step": 294601, "epoch": 3549} {"train_loss": -25.29646110534668, "global_step": 294602, "epoch": 3549} {"train_loss": -25.577030181884766, "global_step": 294603, "epoch": 3549} {"train_loss": -25.250776290893555, "global_step": 294604, "epoch": 3549} {"train_loss": -25.5096492767334, "global_step": 294605, "epoch": 3549} {"train_loss": -25.247770309448242, "global_step": 294606, "epoch": 3549} {"train_loss": -25.69318199157715, "global_step": 294607, "epoch": 3549} {"train_loss": -25.768280029296875, "global_step": 294608, "epoch": 3549} {"train_loss": -25.63140296936035, "global_step": 294609, "epoch": 3549} {"train_loss": -25.497663497924805, "global_step": 294610, "epoch": 3549} {"train_loss": -25.57393455505371, "global_step": 294611, "epoch": 3549} {"train_loss": -25.535409927368164, "global_step": 294612, "epoch": 3549} {"train_loss": -25.4770450592041, "global_step": 294613, "epoch": 3549} {"train_loss": -25.56853675842285, "global_step": 294614, "epoch": 3549} {"train_loss": -25.02778434753418, "global_step": 294615, "epoch": 3549} {"train_loss": -25.469558715820312, "global_step": 294616, "epoch": 3549} {"train_loss": -25.486265182495117, "global_step": 294617, "epoch": 3549} {"train_loss": -25.082870483398438, "global_step": 294618, "epoch": 3549} {"train_loss": -24.173635482788086, "global_step": 294619, "epoch": 3549} {"train_loss": -25.037382125854492, "global_step": 294620, "epoch": 3549} {"train_loss": -25.386072158813477, "global_step": 294621, "epoch": 3549} {"train_loss": -23.57533073425293, "global_step": 294622, "epoch": 3549} {"train_loss": -24.625732421875, "global_step": 294623, "epoch": 3549} {"train_loss": -24.587114334106445, "global_step": 294624, "epoch": 3549} {"train_loss": -24.893442153930664, "global_step": 294625, "epoch": 3549} {"train_loss": -24.526046752929688, "global_step": 294626, "epoch": 3549} {"train_loss": -24.777265548706055, "global_step": 294627, "epoch": 3549} {"train_loss": -25.01063346862793, "global_step": 294628, "epoch": 3549} {"train_loss": -25.10859489440918, "global_step": 294629, "epoch": 3549} {"train_loss": -24.813129425048828, "global_step": 294630, "epoch": 3549} {"train_loss": -25.323720932006836, "global_step": 294631, "epoch": 3549} {"train_loss": -25.04878807067871, "global_step": 294632, "epoch": 3549} {"train_loss": -24.780445098876953, "global_step": 294633, "epoch": 3549} {"train_loss": -25.17366600036621, "global_step": 294634, "epoch": 3549} {"train_loss": -24.855085372924805, "global_step": 294635, "epoch": 3549} {"train_loss": -25.132944107055664, "global_step": 294636, "epoch": 3549} {"train_loss": -25.21904945373535, "global_step": 294637, "epoch": 3549} {"train_loss": -25.2992000579834, "global_step": 294638, "epoch": 3549} {"train_loss": -25.548410415649414, "global_step": 294639, "epoch": 3549} {"train_loss": -25.569381713867188, "global_step": 294640, "epoch": 3549} {"train_loss": -25.182615280151367, "global_step": 294641, "epoch": 3549} {"train_loss": -25.11646842956543, "global_step": 294642, "epoch": 3549} {"train_loss": -25.716596603393555, "global_step": 294643, "epoch": 3549} {"train_loss": -25.401620864868164, "global_step": 294644, "epoch": 3549} {"train_loss": -25.534841537475586, "global_step": 294645, "epoch": 3549} {"train_loss": -25.233135223388672, "global_step": 294646, "epoch": 3549} {"train_loss": -25.372358322143555, "global_step": 294647, "epoch": 3549} {"train_loss": -25.26188087463379, "global_step": 294648, "epoch": 3549} {"train_loss": -25.23397680075772, "global_step": 294649, "epoch": 3549, "val_loss": 7099614.0} {"train_loss": -24.77570152282715, "global_step": 294650, "epoch": 3550} {"train_loss": -24.23813247680664, "global_step": 294651, "epoch": 3550} {"train_loss": -23.9530029296875, "global_step": 294652, "epoch": 3550} {"train_loss": -25.091781616210938, "global_step": 294653, "epoch": 3550} {"train_loss": -23.769201278686523, "global_step": 294654, "epoch": 3550} {"train_loss": -24.933164596557617, "global_step": 294655, "epoch": 3550} {"train_loss": -24.39467430114746, "global_step": 294656, "epoch": 3550} {"train_loss": -24.949371337890625, "global_step": 294657, "epoch": 3550} {"train_loss": -25.051101684570312, "global_step": 294658, "epoch": 3550} {"train_loss": -25.431659698486328, "global_step": 294659, "epoch": 3550} {"train_loss": -24.85822868347168, "global_step": 294660, "epoch": 3550} {"train_loss": -25.305856704711914, "global_step": 294661, "epoch": 3550} {"train_loss": -25.373916625976562, "global_step": 294662, "epoch": 3550} {"train_loss": -25.12502098083496, "global_step": 294663, "epoch": 3550} {"train_loss": -25.259122848510742, "global_step": 294664, "epoch": 3550} {"train_loss": -25.055267333984375, "global_step": 294665, "epoch": 3550} {"train_loss": -25.791440963745117, "global_step": 294666, "epoch": 3550} {"train_loss": -25.095178604125977, "global_step": 294667, "epoch": 3550} {"train_loss": -25.69902992248535, "global_step": 294668, "epoch": 3550} {"train_loss": -25.40357780456543, "global_step": 294669, "epoch": 3550} {"train_loss": -25.496137619018555, "global_step": 294670, "epoch": 3550} {"train_loss": -25.3109073638916, "global_step": 294671, "epoch": 3550} {"train_loss": -25.6556339263916, "global_step": 294672, "epoch": 3550} {"train_loss": -25.624486923217773, "global_step": 294673, "epoch": 3550} {"train_loss": -25.921804428100586, "global_step": 294674, "epoch": 3550} {"train_loss": -25.520599365234375, "global_step": 294675, "epoch": 3550} {"train_loss": -25.9134578704834, "global_step": 294676, "epoch": 3550} {"train_loss": -25.363208770751953, "global_step": 294677, "epoch": 3550} {"train_loss": -25.621448516845703, "global_step": 294678, "epoch": 3550} {"train_loss": -25.56926918029785, "global_step": 294679, "epoch": 3550} {"train_loss": -25.658355712890625, "global_step": 294680, "epoch": 3550} {"train_loss": -25.81800651550293, "global_step": 294681, "epoch": 3550} {"train_loss": -25.549428939819336, "global_step": 294682, "epoch": 3550} {"train_loss": -25.258081436157227, "global_step": 294683, "epoch": 3550} {"train_loss": -25.64845085144043, "global_step": 294684, "epoch": 3550} {"train_loss": -25.705312728881836, "global_step": 294685, "epoch": 3550} {"train_loss": -25.58839225769043, "global_step": 294686, "epoch": 3550} {"train_loss": -25.767276763916016, "global_step": 294687, "epoch": 3550} {"train_loss": -25.716283798217773, "global_step": 294688, "epoch": 3550} {"train_loss": -25.82874870300293, "global_step": 294689, "epoch": 3550} {"train_loss": -25.070592880249023, "global_step": 294690, "epoch": 3550} {"train_loss": -25.571956634521484, "global_step": 294691, "epoch": 3550} {"train_loss": -25.278451919555664, "global_step": 294692, "epoch": 3550} {"train_loss": -25.740365982055664, "global_step": 294693, "epoch": 3550} {"train_loss": -25.43971061706543, "global_step": 294694, "epoch": 3550} {"train_loss": -25.703876495361328, "global_step": 294695, "epoch": 3550} {"train_loss": -25.651533126831055, "global_step": 294696, "epoch": 3550} {"train_loss": -25.499404907226562, "global_step": 294697, "epoch": 3550} {"train_loss": -25.37495231628418, "global_step": 294698, "epoch": 3550} {"train_loss": -25.816131591796875, "global_step": 294699, "epoch": 3550} {"train_loss": -25.397598266601562, "global_step": 294700, "epoch": 3550} {"train_loss": -25.12994956970215, "global_step": 294701, "epoch": 3550} {"train_loss": -25.522985458374023, "global_step": 294702, "epoch": 3550} {"train_loss": -25.780271530151367, "global_step": 294703, "epoch": 3550} {"train_loss": -25.896154403686523, "global_step": 294704, "epoch": 3550} {"train_loss": -25.609012603759766, "global_step": 294705, "epoch": 3550} {"train_loss": -25.06418800354004, "global_step": 294706, "epoch": 3550} {"train_loss": -25.641340255737305, "global_step": 294707, "epoch": 3550} {"train_loss": -25.722990036010742, "global_step": 294708, "epoch": 3550} {"train_loss": -25.8095703125, "global_step": 294709, "epoch": 3550} {"train_loss": -25.406740188598633, "global_step": 294710, "epoch": 3550} {"train_loss": -25.376127243041992, "global_step": 294711, "epoch": 3550} {"train_loss": -25.489347457885742, "global_step": 294712, "epoch": 3550} {"train_loss": -25.384397506713867, "global_step": 294713, "epoch": 3550} {"train_loss": -25.404361724853516, "global_step": 294714, "epoch": 3550} {"train_loss": -25.83024024963379, "global_step": 294715, "epoch": 3550} {"train_loss": -25.552778244018555, "global_step": 294716, "epoch": 3550} {"train_loss": -25.671051025390625, "global_step": 294717, "epoch": 3550} {"train_loss": -25.518484115600586, "global_step": 294718, "epoch": 3550} {"train_loss": -25.461360931396484, "global_step": 294719, "epoch": 3550} {"train_loss": -25.58893585205078, "global_step": 294720, "epoch": 3550} {"train_loss": -25.8714599609375, "global_step": 294721, "epoch": 3550} {"train_loss": -25.739713668823242, "global_step": 294722, "epoch": 3550} {"train_loss": -25.401744842529297, "global_step": 294723, "epoch": 3550} {"train_loss": -25.49983024597168, "global_step": 294724, "epoch": 3550} {"train_loss": -25.50984764099121, "global_step": 294725, "epoch": 3550} {"train_loss": -25.668964385986328, "global_step": 294726, "epoch": 3550} {"train_loss": -25.136449813842773, "global_step": 294727, "epoch": 3550} {"train_loss": -25.38304901123047, "global_step": 294728, "epoch": 3550} {"train_loss": -25.770538330078125, "global_step": 294729, "epoch": 3550} {"train_loss": -25.429340362548828, "global_step": 294730, "epoch": 3550} {"train_loss": -25.5349178314209, "global_step": 294731, "epoch": 3550} {"train_loss": -25.425165498113056, "global_step": 294732, "epoch": 3550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 7187343.0} {"train_loss": -25.59578514099121, "global_step": 294733, "epoch": 3551} {"train_loss": -25.445016860961914, "global_step": 294734, "epoch": 3551} {"train_loss": -25.343172073364258, "global_step": 294735, "epoch": 3551} {"train_loss": -25.076187133789062, "global_step": 294736, "epoch": 3551} {"train_loss": -25.026641845703125, "global_step": 294737, "epoch": 3551} {"train_loss": -25.151470184326172, "global_step": 294738, "epoch": 3551} {"train_loss": -25.51373863220215, "global_step": 294739, "epoch": 3551} {"train_loss": -25.0045108795166, "global_step": 294740, "epoch": 3551} {"train_loss": -25.2683162689209, "global_step": 294741, "epoch": 3551} {"train_loss": -25.247106552124023, "global_step": 294742, "epoch": 3551} {"train_loss": -25.195096969604492, "global_step": 294743, "epoch": 3551} {"train_loss": -25.3294734954834, "global_step": 294744, "epoch": 3551} {"train_loss": -25.230831146240234, "global_step": 294745, "epoch": 3551} {"train_loss": -25.56727409362793, "global_step": 294746, "epoch": 3551} {"train_loss": -25.16566276550293, "global_step": 294747, "epoch": 3551} {"train_loss": -25.641326904296875, "global_step": 294748, "epoch": 3551} {"train_loss": -25.59040069580078, "global_step": 294749, "epoch": 3551} {"train_loss": -25.32704734802246, "global_step": 294750, "epoch": 3551} {"train_loss": -25.61930274963379, "global_step": 294751, "epoch": 3551} {"train_loss": -25.45318603515625, "global_step": 294752, "epoch": 3551} {"train_loss": -25.222614288330078, "global_step": 294753, "epoch": 3551} {"train_loss": -25.48124122619629, "global_step": 294754, "epoch": 3551} {"train_loss": -25.500343322753906, "global_step": 294755, "epoch": 3551} {"train_loss": -25.750226974487305, "global_step": 294756, "epoch": 3551} {"train_loss": -25.437946319580078, "global_step": 294757, "epoch": 3551} {"train_loss": -25.651769638061523, "global_step": 294758, "epoch": 3551} {"train_loss": -25.626394271850586, "global_step": 294759, "epoch": 3551} {"train_loss": -25.560178756713867, "global_step": 294760, "epoch": 3551} {"train_loss": -25.652069091796875, "global_step": 294761, "epoch": 3551} {"train_loss": -25.6253719329834, "global_step": 294762, "epoch": 3551} {"train_loss": -25.886993408203125, "global_step": 294763, "epoch": 3551} {"train_loss": -25.56890296936035, "global_step": 294764, "epoch": 3551} {"train_loss": -25.715789794921875, "global_step": 294765, "epoch": 3551} {"train_loss": -25.90447425842285, "global_step": 294766, "epoch": 3551} {"train_loss": -25.674713134765625, "global_step": 294767, "epoch": 3551} {"train_loss": -25.986719131469727, "global_step": 294768, "epoch": 3551} {"train_loss": -25.983184814453125, "global_step": 294769, "epoch": 3551} {"train_loss": -25.379695892333984, "global_step": 294770, "epoch": 3551} {"train_loss": -25.781482696533203, "global_step": 294771, "epoch": 3551} {"train_loss": -25.45377540588379, "global_step": 294772, "epoch": 3551} {"train_loss": -25.29815101623535, "global_step": 294773, "epoch": 3551} {"train_loss": -25.363006591796875, "global_step": 294774, "epoch": 3551} {"train_loss": -25.336429595947266, "global_step": 294775, "epoch": 3551} {"train_loss": -25.195560455322266, "global_step": 294776, "epoch": 3551} {"train_loss": -25.4713191986084, "global_step": 294777, "epoch": 3551} {"train_loss": -25.655012130737305, "global_step": 294778, "epoch": 3551} {"train_loss": -25.331701278686523, "global_step": 294779, "epoch": 3551} {"train_loss": -25.231077194213867, "global_step": 294780, "epoch": 3551} {"train_loss": -25.53078269958496, "global_step": 294781, "epoch": 3551} {"train_loss": -25.285673141479492, "global_step": 294782, "epoch": 3551} {"train_loss": -25.699995040893555, "global_step": 294783, "epoch": 3551} {"train_loss": -25.2813777923584, "global_step": 294784, "epoch": 3551} {"train_loss": -25.73720359802246, "global_step": 294785, "epoch": 3551} {"train_loss": -25.29681396484375, "global_step": 294786, "epoch": 3551} {"train_loss": -25.331649780273438, "global_step": 294787, "epoch": 3551} {"train_loss": -25.443754196166992, "global_step": 294788, "epoch": 3551} {"train_loss": -25.39556121826172, "global_step": 294789, "epoch": 3551} {"train_loss": -25.814136505126953, "global_step": 294790, "epoch": 3551} {"train_loss": -25.90107536315918, "global_step": 294791, "epoch": 3551} {"train_loss": -25.874835968017578, "global_step": 294792, "epoch": 3551} {"train_loss": -25.559589385986328, "global_step": 294793, "epoch": 3551} {"train_loss": -25.50518035888672, "global_step": 294794, "epoch": 3551} {"train_loss": -25.768798828125, "global_step": 294795, "epoch": 3551} {"train_loss": -25.20308494567871, "global_step": 294796, "epoch": 3551} {"train_loss": -25.871734619140625, "global_step": 294797, "epoch": 3551} {"train_loss": -25.41383171081543, "global_step": 294798, "epoch": 3551} {"train_loss": -25.557165145874023, "global_step": 294799, "epoch": 3551} {"train_loss": -25.78435707092285, "global_step": 294800, "epoch": 3551} {"train_loss": -25.41921615600586, "global_step": 294801, "epoch": 3551} {"train_loss": -25.401939392089844, "global_step": 294802, "epoch": 3551} {"train_loss": -25.59613037109375, "global_step": 294803, "epoch": 3551} {"train_loss": -25.801218032836914, "global_step": 294804, "epoch": 3551} {"train_loss": -25.7686767578125, "global_step": 294805, "epoch": 3551} {"train_loss": -25.408695220947266, "global_step": 294806, "epoch": 3551} {"train_loss": -25.742528915405273, "global_step": 294807, "epoch": 3551} {"train_loss": -25.368528366088867, "global_step": 294808, "epoch": 3551} {"train_loss": -25.53476905822754, "global_step": 294809, "epoch": 3551} {"train_loss": -25.724700927734375, "global_step": 294810, "epoch": 3551} {"train_loss": -25.56520652770996, "global_step": 294811, "epoch": 3551} {"train_loss": -26.02369499206543, "global_step": 294812, "epoch": 3551} {"train_loss": -25.557613372802734, "global_step": 294813, "epoch": 3551} {"train_loss": -25.573745727539062, "global_step": 294814, "epoch": 3551} {"train_loss": -25.513746468417615, "global_step": 294815, "epoch": 3551, "val_loss": 7192358.0} {"train_loss": -25.05613899230957, "global_step": 294816, "epoch": 3552} {"train_loss": -24.811553955078125, "global_step": 294817, "epoch": 3552} {"train_loss": -25.28955841064453, "global_step": 294818, "epoch": 3552} {"train_loss": -25.40195655822754, "global_step": 294819, "epoch": 3552} {"train_loss": -24.725584030151367, "global_step": 294820, "epoch": 3552} {"train_loss": -25.66798210144043, "global_step": 294821, "epoch": 3552} {"train_loss": -25.577810287475586, "global_step": 294822, "epoch": 3552} {"train_loss": -24.7995662689209, "global_step": 294823, "epoch": 3552} {"train_loss": -25.41366958618164, "global_step": 294824, "epoch": 3552} {"train_loss": -25.35921287536621, "global_step": 294825, "epoch": 3552} {"train_loss": -25.165353775024414, "global_step": 294826, "epoch": 3552} {"train_loss": -25.20490837097168, "global_step": 294827, "epoch": 3552} {"train_loss": -25.728193283081055, "global_step": 294828, "epoch": 3552} {"train_loss": -25.457216262817383, "global_step": 294829, "epoch": 3552} {"train_loss": -25.095670700073242, "global_step": 294830, "epoch": 3552} {"train_loss": -25.534147262573242, "global_step": 294831, "epoch": 3552} {"train_loss": -25.334829330444336, "global_step": 294832, "epoch": 3552} {"train_loss": -25.506696701049805, "global_step": 294833, "epoch": 3552} {"train_loss": -25.765623092651367, "global_step": 294834, "epoch": 3552} {"train_loss": -25.90159034729004, "global_step": 294835, "epoch": 3552} {"train_loss": -25.290220260620117, "global_step": 294836, "epoch": 3552} {"train_loss": -25.719457626342773, "global_step": 294837, "epoch": 3552} {"train_loss": -25.382558822631836, "global_step": 294838, "epoch": 3552} {"train_loss": -25.875431060791016, "global_step": 294839, "epoch": 3552} {"train_loss": -25.52402687072754, "global_step": 294840, "epoch": 3552} {"train_loss": -25.638776779174805, "global_step": 294841, "epoch": 3552} {"train_loss": -25.471168518066406, "global_step": 294842, "epoch": 3552} {"train_loss": -25.495718002319336, "global_step": 294843, "epoch": 3552} {"train_loss": -25.576631546020508, "global_step": 294844, "epoch": 3552} {"train_loss": -25.2514705657959, "global_step": 294845, "epoch": 3552} {"train_loss": -25.817041397094727, "global_step": 294846, "epoch": 3552} {"train_loss": -25.651031494140625, "global_step": 294847, "epoch": 3552} {"train_loss": -25.5488224029541, "global_step": 294848, "epoch": 3552} {"train_loss": -25.78683853149414, "global_step": 294849, "epoch": 3552} {"train_loss": -26.019611358642578, "global_step": 294850, "epoch": 3552} {"train_loss": -25.6774845123291, "global_step": 294851, "epoch": 3552} {"train_loss": -25.545936584472656, "global_step": 294852, "epoch": 3552} {"train_loss": -25.8364200592041, "global_step": 294853, "epoch": 3552} {"train_loss": -25.5073184967041, "global_step": 294854, "epoch": 3552} {"train_loss": -25.619155883789062, "global_step": 294855, "epoch": 3552} {"train_loss": -25.380126953125, "global_step": 294856, "epoch": 3552} {"train_loss": -25.983795166015625, "global_step": 294857, "epoch": 3552} {"train_loss": -25.95790672302246, "global_step": 294858, "epoch": 3552} {"train_loss": -25.753637313842773, "global_step": 294859, "epoch": 3552} {"train_loss": -25.69244956970215, "global_step": 294860, "epoch": 3552} {"train_loss": -25.36745262145996, "global_step": 294861, "epoch": 3552} {"train_loss": -26.152109146118164, "global_step": 294862, "epoch": 3552} {"train_loss": -25.837812423706055, "global_step": 294863, "epoch": 3552} {"train_loss": -25.8227481842041, "global_step": 294864, "epoch": 3552} {"train_loss": -25.32097053527832, "global_step": 294865, "epoch": 3552} {"train_loss": -25.60886573791504, "global_step": 294866, "epoch": 3552} {"train_loss": -25.882495880126953, "global_step": 294867, "epoch": 3552} {"train_loss": -25.58139419555664, "global_step": 294868, "epoch": 3552} {"train_loss": -25.570575714111328, "global_step": 294869, "epoch": 3552} {"train_loss": -26.01840591430664, "global_step": 294870, "epoch": 3552} {"train_loss": -25.64422607421875, "global_step": 294871, "epoch": 3552} {"train_loss": -25.823591232299805, "global_step": 294872, "epoch": 3552} {"train_loss": -24.78106689453125, "global_step": 294873, "epoch": 3552} {"train_loss": -24.343732833862305, "global_step": 294874, "epoch": 3552} {"train_loss": -24.376625061035156, "global_step": 294875, "epoch": 3552} {"train_loss": -24.921186447143555, "global_step": 294876, "epoch": 3552} {"train_loss": -25.220937728881836, "global_step": 294877, "epoch": 3552} {"train_loss": -25.071374893188477, "global_step": 294878, "epoch": 3552} {"train_loss": -25.715600967407227, "global_step": 294879, "epoch": 3552} {"train_loss": -25.23600196838379, "global_step": 294880, "epoch": 3552} {"train_loss": -25.34564208984375, "global_step": 294881, "epoch": 3552} {"train_loss": -25.21576499938965, "global_step": 294882, "epoch": 3552} {"train_loss": -25.304128646850586, "global_step": 294883, "epoch": 3552} {"train_loss": -25.9011287689209, "global_step": 294884, "epoch": 3552} {"train_loss": -25.509418487548828, "global_step": 294885, "epoch": 3552} {"train_loss": -25.405611038208008, "global_step": 294886, "epoch": 3552} {"train_loss": -25.66663932800293, "global_step": 294887, "epoch": 3552} {"train_loss": -25.881994247436523, "global_step": 294888, "epoch": 3552} {"train_loss": -25.382169723510742, "global_step": 294889, "epoch": 3552} {"train_loss": -25.973424911499023, "global_step": 294890, "epoch": 3552} {"train_loss": -25.82801628112793, "global_step": 294891, "epoch": 3552} {"train_loss": -25.46040916442871, "global_step": 294892, "epoch": 3552} {"train_loss": -25.497426986694336, "global_step": 294893, "epoch": 3552} {"train_loss": -25.651611328125, "global_step": 294894, "epoch": 3552} {"train_loss": -25.396076202392578, "global_step": 294895, "epoch": 3552} {"train_loss": -25.842742919921875, "global_step": 294896, "epoch": 3552} {"train_loss": -25.52729606628418, "global_step": 294897, "epoch": 3552} {"train_loss": -25.482857416911298, "global_step": 294898, "epoch": 3552, "val_loss": 7221450.0} {"train_loss": -25.405481338500977, "global_step": 294899, "epoch": 3553} {"train_loss": -25.366878509521484, "global_step": 294900, "epoch": 3553} {"train_loss": -25.095497131347656, "global_step": 294901, "epoch": 3553} {"train_loss": -25.326650619506836, "global_step": 294902, "epoch": 3553} {"train_loss": -25.46476936340332, "global_step": 294903, "epoch": 3553} {"train_loss": -25.303482055664062, "global_step": 294904, "epoch": 3553} {"train_loss": -25.267013549804688, "global_step": 294905, "epoch": 3553} {"train_loss": -25.66651725769043, "global_step": 294906, "epoch": 3553} {"train_loss": -25.54743194580078, "global_step": 294907, "epoch": 3553} {"train_loss": -25.32118034362793, "global_step": 294908, "epoch": 3553} {"train_loss": -25.40891456604004, "global_step": 294909, "epoch": 3553} {"train_loss": -25.387548446655273, "global_step": 294910, "epoch": 3553} {"train_loss": -25.606000900268555, "global_step": 294911, "epoch": 3553} {"train_loss": -25.404224395751953, "global_step": 294912, "epoch": 3553} {"train_loss": -25.251501083374023, "global_step": 294913, "epoch": 3553} {"train_loss": -25.408472061157227, "global_step": 294914, "epoch": 3553} {"train_loss": -25.71624755859375, "global_step": 294915, "epoch": 3553} {"train_loss": -25.4495849609375, "global_step": 294916, "epoch": 3553} {"train_loss": -24.914337158203125, "global_step": 294917, "epoch": 3553} {"train_loss": -25.8018856048584, "global_step": 294918, "epoch": 3553} {"train_loss": -25.519975662231445, "global_step": 294919, "epoch": 3553} {"train_loss": -25.70719337463379, "global_step": 294920, "epoch": 3553} {"train_loss": -25.6466007232666, "global_step": 294921, "epoch": 3553} {"train_loss": -25.666601181030273, "global_step": 294922, "epoch": 3553} {"train_loss": -25.448566436767578, "global_step": 294923, "epoch": 3553} {"train_loss": -26.13922119140625, "global_step": 294924, "epoch": 3553} {"train_loss": -25.65180015563965, "global_step": 294925, "epoch": 3553} {"train_loss": -25.458980560302734, "global_step": 294926, "epoch": 3553} {"train_loss": -25.723134994506836, "global_step": 294927, "epoch": 3553} {"train_loss": -25.501731872558594, "global_step": 294928, "epoch": 3553} {"train_loss": -25.770023345947266, "global_step": 294929, "epoch": 3553} {"train_loss": -25.750600814819336, "global_step": 294930, "epoch": 3553} {"train_loss": -26.0426082611084, "global_step": 294931, "epoch": 3553} {"train_loss": -25.426549911499023, "global_step": 294932, "epoch": 3553} {"train_loss": -25.601276397705078, "global_step": 294933, "epoch": 3553} {"train_loss": -25.710983276367188, "global_step": 294934, "epoch": 3553} {"train_loss": -25.680089950561523, "global_step": 294935, "epoch": 3553} {"train_loss": -25.6245174407959, "global_step": 294936, "epoch": 3553} {"train_loss": -25.5658016204834, "global_step": 294937, "epoch": 3553} {"train_loss": -25.7839298248291, "global_step": 294938, "epoch": 3553} {"train_loss": -25.787015914916992, "global_step": 294939, "epoch": 3553} {"train_loss": -26.03645133972168, "global_step": 294940, "epoch": 3553} {"train_loss": -25.473209381103516, "global_step": 294941, "epoch": 3553} {"train_loss": -25.47494888305664, "global_step": 294942, "epoch": 3553} {"train_loss": -25.693613052368164, "global_step": 294943, "epoch": 3553} {"train_loss": -25.48655128479004, "global_step": 294944, "epoch": 3553} {"train_loss": -25.459325790405273, "global_step": 294945, "epoch": 3553} {"train_loss": -25.20013999938965, "global_step": 294946, "epoch": 3553} {"train_loss": -25.478759765625, "global_step": 294947, "epoch": 3553} {"train_loss": -25.85272216796875, "global_step": 294948, "epoch": 3553} {"train_loss": -25.369369506835938, "global_step": 294949, "epoch": 3553} {"train_loss": -25.869739532470703, "global_step": 294950, "epoch": 3553} {"train_loss": -25.52907371520996, "global_step": 294951, "epoch": 3553} {"train_loss": -25.52034568786621, "global_step": 294952, "epoch": 3553} {"train_loss": -25.751911163330078, "global_step": 294953, "epoch": 3553} {"train_loss": -25.862091064453125, "global_step": 294954, "epoch": 3553} {"train_loss": -25.94624137878418, "global_step": 294955, "epoch": 3553} {"train_loss": -25.473648071289062, "global_step": 294956, "epoch": 3553} {"train_loss": -25.644575119018555, "global_step": 294957, "epoch": 3553} {"train_loss": -25.342823028564453, "global_step": 294958, "epoch": 3553} {"train_loss": -25.851261138916016, "global_step": 294959, "epoch": 3553} {"train_loss": -25.77654457092285, "global_step": 294960, "epoch": 3553} {"train_loss": -25.9952335357666, "global_step": 294961, "epoch": 3553} {"train_loss": -25.78717041015625, "global_step": 294962, "epoch": 3553} {"train_loss": -25.499534606933594, "global_step": 294963, "epoch": 3553} {"train_loss": -25.82978630065918, "global_step": 294964, "epoch": 3553} {"train_loss": -25.9482364654541, "global_step": 294965, "epoch": 3553} {"train_loss": -25.864538192749023, "global_step": 294966, "epoch": 3553} {"train_loss": -25.99661636352539, "global_step": 294967, "epoch": 3553} {"train_loss": -25.766759872436523, "global_step": 294968, "epoch": 3553} {"train_loss": -25.8727970123291, "global_step": 294969, "epoch": 3553} {"train_loss": -25.262104034423828, "global_step": 294970, "epoch": 3553} {"train_loss": -25.043167114257812, "global_step": 294971, "epoch": 3553} {"train_loss": -25.175567626953125, "global_step": 294972, "epoch": 3553} {"train_loss": -25.481670379638672, "global_step": 294973, "epoch": 3553} {"train_loss": -25.487714767456055, "global_step": 294974, "epoch": 3553} {"train_loss": -25.490453720092773, "global_step": 294975, "epoch": 3553} {"train_loss": -25.647907257080078, "global_step": 294976, "epoch": 3553} {"train_loss": -25.39299774169922, "global_step": 294977, "epoch": 3553} {"train_loss": -25.887338638305664, "global_step": 294978, "epoch": 3553} {"train_loss": -25.41309356689453, "global_step": 294979, "epoch": 3553} {"train_loss": -25.81568717956543, "global_step": 294980, "epoch": 3553} {"train_loss": -25.584275096295826, "global_step": 294981, "epoch": 3553, "val_loss": 7180513.0} {"train_loss": -24.946130752563477, "global_step": 294982, "epoch": 3554} {"train_loss": -24.520700454711914, "global_step": 294983, "epoch": 3554} {"train_loss": -24.376514434814453, "global_step": 294984, "epoch": 3554} {"train_loss": -24.88907241821289, "global_step": 294985, "epoch": 3554} {"train_loss": -24.578861236572266, "global_step": 294986, "epoch": 3554} {"train_loss": -25.150312423706055, "global_step": 294987, "epoch": 3554} {"train_loss": -25.3275146484375, "global_step": 294988, "epoch": 3554} {"train_loss": -25.0379581451416, "global_step": 294989, "epoch": 3554} {"train_loss": -25.24479866027832, "global_step": 294990, "epoch": 3554} {"train_loss": -24.96181297302246, "global_step": 294991, "epoch": 3554} {"train_loss": -25.63602638244629, "global_step": 294992, "epoch": 3554} {"train_loss": -25.305898666381836, "global_step": 294993, "epoch": 3554} {"train_loss": -25.454906463623047, "global_step": 294994, "epoch": 3554} {"train_loss": -25.366270065307617, "global_step": 294995, "epoch": 3554} {"train_loss": -25.228424072265625, "global_step": 294996, "epoch": 3554} {"train_loss": -25.323694229125977, "global_step": 294997, "epoch": 3554} {"train_loss": -25.293893814086914, "global_step": 294998, "epoch": 3554} {"train_loss": -25.346731185913086, "global_step": 294999, "epoch": 3554} {"train_loss": -25.243663787841797, "global_step": 295000, "epoch": 3554} {"train_loss": -25.400047302246094, "global_step": 295001, "epoch": 3554} {"train_loss": -25.23756980895996, "global_step": 295002, "epoch": 3554} {"train_loss": -25.43410301208496, "global_step": 295003, "epoch": 3554} {"train_loss": -25.85025978088379, "global_step": 295004, "epoch": 3554} {"train_loss": -25.60591697692871, "global_step": 295005, "epoch": 3554} {"train_loss": -25.663440704345703, "global_step": 295006, "epoch": 3554} {"train_loss": -25.394916534423828, "global_step": 295007, "epoch": 3554} {"train_loss": -25.367328643798828, "global_step": 295008, "epoch": 3554} {"train_loss": -25.850391387939453, "global_step": 295009, "epoch": 3554} {"train_loss": -25.69538688659668, "global_step": 295010, "epoch": 3554} {"train_loss": -25.67701530456543, "global_step": 295011, "epoch": 3554} {"train_loss": -25.71005630493164, "global_step": 295012, "epoch": 3554} {"train_loss": -25.544055938720703, "global_step": 295013, "epoch": 3554} {"train_loss": -25.647443771362305, "global_step": 295014, "epoch": 3554} {"train_loss": -25.874942779541016, "global_step": 295015, "epoch": 3554} {"train_loss": -26.0334529876709, "global_step": 295016, "epoch": 3554} {"train_loss": -25.46761703491211, "global_step": 295017, "epoch": 3554} {"train_loss": -25.77616310119629, "global_step": 295018, "epoch": 3554} {"train_loss": -25.885868072509766, "global_step": 295019, "epoch": 3554} {"train_loss": -25.698087692260742, "global_step": 295020, "epoch": 3554} {"train_loss": -25.518827438354492, "global_step": 295021, "epoch": 3554} {"train_loss": -26.005523681640625, "global_step": 295022, "epoch": 3554} {"train_loss": -25.66583824157715, "global_step": 295023, "epoch": 3554} {"train_loss": -25.694555282592773, "global_step": 295024, "epoch": 3554} {"train_loss": -26.121063232421875, "global_step": 295025, "epoch": 3554} {"train_loss": -25.7381534576416, "global_step": 295026, "epoch": 3554} {"train_loss": -25.462955474853516, "global_step": 295027, "epoch": 3554} {"train_loss": -25.896848678588867, "global_step": 295028, "epoch": 3554} {"train_loss": -25.717945098876953, "global_step": 295029, "epoch": 3554} {"train_loss": -25.48948097229004, "global_step": 295030, "epoch": 3554} {"train_loss": -25.80316162109375, "global_step": 295031, "epoch": 3554} {"train_loss": -25.819005966186523, "global_step": 295032, "epoch": 3554} {"train_loss": -25.31545066833496, "global_step": 295033, "epoch": 3554} {"train_loss": -24.369277954101562, "global_step": 295034, "epoch": 3554} {"train_loss": -24.336252212524414, "global_step": 295035, "epoch": 3554} {"train_loss": -23.191205978393555, "global_step": 295036, "epoch": 3554} {"train_loss": -24.504276275634766, "global_step": 295037, "epoch": 3554} {"train_loss": -25.277326583862305, "global_step": 295038, "epoch": 3554} {"train_loss": -24.55650520324707, "global_step": 295039, "epoch": 3554} {"train_loss": -24.682104110717773, "global_step": 295040, "epoch": 3554} {"train_loss": -25.089582443237305, "global_step": 295041, "epoch": 3554} {"train_loss": -24.824031829833984, "global_step": 295042, "epoch": 3554} {"train_loss": -24.96598243713379, "global_step": 295043, "epoch": 3554} {"train_loss": -24.73494529724121, "global_step": 295044, "epoch": 3554} {"train_loss": -25.10947036743164, "global_step": 295045, "epoch": 3554} {"train_loss": -25.023054122924805, "global_step": 295046, "epoch": 3554} {"train_loss": -25.214628219604492, "global_step": 295047, "epoch": 3554} {"train_loss": -25.304166793823242, "global_step": 295048, "epoch": 3554} {"train_loss": -24.73870277404785, "global_step": 295049, "epoch": 3554} {"train_loss": -25.171995162963867, "global_step": 295050, "epoch": 3554} {"train_loss": -25.187097549438477, "global_step": 295051, "epoch": 3554} {"train_loss": -25.67685317993164, "global_step": 295052, "epoch": 3554} {"train_loss": -25.320438385009766, "global_step": 295053, "epoch": 3554} {"train_loss": -25.137311935424805, "global_step": 295054, "epoch": 3554} {"train_loss": -24.805078506469727, "global_step": 295055, "epoch": 3554} {"train_loss": -25.241119384765625, "global_step": 295056, "epoch": 3554} {"train_loss": -25.214313507080078, "global_step": 295057, "epoch": 3554} {"train_loss": -25.56717300415039, "global_step": 295058, "epoch": 3554} {"train_loss": -25.32638931274414, "global_step": 295059, "epoch": 3554} {"train_loss": -25.0715274810791, "global_step": 295060, "epoch": 3554} {"train_loss": -25.374780654907227, "global_step": 295061, "epoch": 3554} {"train_loss": -25.45988655090332, "global_step": 295062, "epoch": 3554} {"train_loss": -25.496505737304688, "global_step": 295063, "epoch": 3554} {"train_loss": -25.306205404810157, "global_step": 295064, "epoch": 3554, "val_loss": 7235913.0} {"train_loss": -25.287275314331055, "global_step": 295065, "epoch": 3555} {"train_loss": -25.612171173095703, "global_step": 295066, "epoch": 3555} {"train_loss": -25.191120147705078, "global_step": 295067, "epoch": 3555} {"train_loss": -25.262540817260742, "global_step": 295068, "epoch": 3555} {"train_loss": -25.249217987060547, "global_step": 295069, "epoch": 3555} {"train_loss": -25.243635177612305, "global_step": 295070, "epoch": 3555} {"train_loss": -25.243207931518555, "global_step": 295071, "epoch": 3555} {"train_loss": -25.49245262145996, "global_step": 295072, "epoch": 3555} {"train_loss": -25.32061004638672, "global_step": 295073, "epoch": 3555} {"train_loss": -25.14590072631836, "global_step": 295074, "epoch": 3555} {"train_loss": -25.47491455078125, "global_step": 295075, "epoch": 3555} {"train_loss": -25.408498764038086, "global_step": 295076, "epoch": 3555} {"train_loss": -25.1066951751709, "global_step": 295077, "epoch": 3555} {"train_loss": -25.193037033081055, "global_step": 295078, "epoch": 3555} {"train_loss": -25.552173614501953, "global_step": 295079, "epoch": 3555} {"train_loss": -25.54728889465332, "global_step": 295080, "epoch": 3555} {"train_loss": -25.322250366210938, "global_step": 295081, "epoch": 3555} {"train_loss": -25.605993270874023, "global_step": 295082, "epoch": 3555} {"train_loss": -25.4166259765625, "global_step": 295083, "epoch": 3555} {"train_loss": -25.080215454101562, "global_step": 295084, "epoch": 3555} {"train_loss": -25.339035034179688, "global_step": 295085, "epoch": 3555} {"train_loss": -25.37507438659668, "global_step": 295086, "epoch": 3555} {"train_loss": -25.76153564453125, "global_step": 295087, "epoch": 3555} {"train_loss": -25.53655433654785, "global_step": 295088, "epoch": 3555} {"train_loss": -25.98407554626465, "global_step": 295089, "epoch": 3555} {"train_loss": -25.458528518676758, "global_step": 295090, "epoch": 3555} {"train_loss": -25.47455406188965, "global_step": 295091, "epoch": 3555} {"train_loss": -25.7225399017334, "global_step": 295092, "epoch": 3555} {"train_loss": -25.627105712890625, "global_step": 295093, "epoch": 3555} {"train_loss": -25.801258087158203, "global_step": 295094, "epoch": 3555} {"train_loss": -25.96036720275879, "global_step": 295095, "epoch": 3555} {"train_loss": -25.736555099487305, "global_step": 295096, "epoch": 3555} {"train_loss": -25.723556518554688, "global_step": 295097, "epoch": 3555} {"train_loss": -25.92551040649414, "global_step": 295098, "epoch": 3555} {"train_loss": -26.011722564697266, "global_step": 295099, "epoch": 3555} {"train_loss": -25.978973388671875, "global_step": 295100, "epoch": 3555} {"train_loss": -25.649023056030273, "global_step": 295101, "epoch": 3555} {"train_loss": -26.0183048248291, "global_step": 295102, "epoch": 3555} {"train_loss": -25.703876495361328, "global_step": 295103, "epoch": 3555} {"train_loss": -25.939374923706055, "global_step": 295104, "epoch": 3555} {"train_loss": -25.98797035217285, "global_step": 295105, "epoch": 3555} {"train_loss": -25.859216690063477, "global_step": 295106, "epoch": 3555} {"train_loss": -25.535036087036133, "global_step": 295107, "epoch": 3555} {"train_loss": -25.755475997924805, "global_step": 295108, "epoch": 3555} {"train_loss": -25.526975631713867, "global_step": 295109, "epoch": 3555} {"train_loss": -25.474367141723633, "global_step": 295110, "epoch": 3555} {"train_loss": -25.690576553344727, "global_step": 295111, "epoch": 3555} {"train_loss": -26.097461700439453, "global_step": 295112, "epoch": 3555} {"train_loss": -25.811208724975586, "global_step": 295113, "epoch": 3555} {"train_loss": -25.454710006713867, "global_step": 295114, "epoch": 3555} {"train_loss": -25.598814010620117, "global_step": 295115, "epoch": 3555} {"train_loss": -25.699216842651367, "global_step": 295116, "epoch": 3555} {"train_loss": -25.61406898498535, "global_step": 295117, "epoch": 3555} {"train_loss": -25.608539581298828, "global_step": 295118, "epoch": 3555} {"train_loss": -25.62151527404785, "global_step": 295119, "epoch": 3555} {"train_loss": -25.77994728088379, "global_step": 295120, "epoch": 3555} {"train_loss": -25.83945083618164, "global_step": 295121, "epoch": 3555} {"train_loss": -25.800891876220703, "global_step": 295122, "epoch": 3555} {"train_loss": -25.536495208740234, "global_step": 295123, "epoch": 3555} {"train_loss": -25.658369064331055, "global_step": 295124, "epoch": 3555} {"train_loss": -25.636194229125977, "global_step": 295125, "epoch": 3555} {"train_loss": -25.46868324279785, "global_step": 295126, "epoch": 3555} {"train_loss": -25.9862003326416, "global_step": 295127, "epoch": 3555} {"train_loss": -25.938053131103516, "global_step": 295128, "epoch": 3555} {"train_loss": -25.817758560180664, "global_step": 295129, "epoch": 3555} {"train_loss": -25.611927032470703, "global_step": 295130, "epoch": 3555} {"train_loss": -25.347761154174805, "global_step": 295131, "epoch": 3555} {"train_loss": -25.873212814331055, "global_step": 295132, "epoch": 3555} {"train_loss": -25.8057804107666, "global_step": 295133, "epoch": 3555} {"train_loss": -25.14252281188965, "global_step": 295134, "epoch": 3555} {"train_loss": -25.09418296813965, "global_step": 295135, "epoch": 3555} {"train_loss": -25.542551040649414, "global_step": 295136, "epoch": 3555} {"train_loss": -26.138660430908203, "global_step": 295137, "epoch": 3555} {"train_loss": -25.84795570373535, "global_step": 295138, "epoch": 3555} {"train_loss": -25.816741943359375, "global_step": 295139, "epoch": 3555} {"train_loss": -25.65789794921875, "global_step": 295140, "epoch": 3555} {"train_loss": -25.476032257080078, "global_step": 295141, "epoch": 3555} {"train_loss": -25.639846801757812, "global_step": 295142, "epoch": 3555} {"train_loss": -25.53663444519043, "global_step": 295143, "epoch": 3555} {"train_loss": -25.91444969177246, "global_step": 295144, "epoch": 3555} {"train_loss": -25.728967666625977, "global_step": 295145, "epoch": 3555} {"train_loss": -25.848926544189453, "global_step": 295146, "epoch": 3555} {"train_loss": -25.623696683401086, "global_step": 295147, "epoch": 3555, "val_loss": 7158417.5} {"train_loss": -23.776443481445312, "global_step": 295148, "epoch": 3556} {"train_loss": -23.28299903869629, "global_step": 295149, "epoch": 3556} {"train_loss": -24.354705810546875, "global_step": 295150, "epoch": 3556} {"train_loss": -24.7103328704834, "global_step": 295151, "epoch": 3556} {"train_loss": -24.817197799682617, "global_step": 295152, "epoch": 3556} {"train_loss": -25.07433319091797, "global_step": 295153, "epoch": 3556} {"train_loss": -24.595874786376953, "global_step": 295154, "epoch": 3556} {"train_loss": -25.046607971191406, "global_step": 295155, "epoch": 3556} {"train_loss": -24.87427520751953, "global_step": 295156, "epoch": 3556} {"train_loss": -25.084386825561523, "global_step": 295157, "epoch": 3556} {"train_loss": -25.438339233398438, "global_step": 295158, "epoch": 3556} {"train_loss": -24.92234230041504, "global_step": 295159, "epoch": 3556} {"train_loss": -24.779653549194336, "global_step": 295160, "epoch": 3556} {"train_loss": -24.625396728515625, "global_step": 295161, "epoch": 3556} {"train_loss": -24.83648681640625, "global_step": 295162, "epoch": 3556} {"train_loss": -25.44563102722168, "global_step": 295163, "epoch": 3556} {"train_loss": -24.838491439819336, "global_step": 295164, "epoch": 3556} {"train_loss": -25.39033317565918, "global_step": 295165, "epoch": 3556} {"train_loss": -24.969541549682617, "global_step": 295166, "epoch": 3556} {"train_loss": -25.473800659179688, "global_step": 295167, "epoch": 3556} {"train_loss": -25.574758529663086, "global_step": 295168, "epoch": 3556} {"train_loss": -25.167150497436523, "global_step": 295169, "epoch": 3556} {"train_loss": -25.063608169555664, "global_step": 295170, "epoch": 3556} {"train_loss": -25.00689697265625, "global_step": 295171, "epoch": 3556} {"train_loss": -25.4099178314209, "global_step": 295172, "epoch": 3556} {"train_loss": -25.713764190673828, "global_step": 295173, "epoch": 3556} {"train_loss": -24.919086456298828, "global_step": 295174, "epoch": 3556} {"train_loss": -26.16290283203125, "global_step": 295175, "epoch": 3556} {"train_loss": -25.422565460205078, "global_step": 295176, "epoch": 3556} {"train_loss": -25.534143447875977, "global_step": 295177, "epoch": 3556} {"train_loss": -25.555320739746094, "global_step": 295178, "epoch": 3556} {"train_loss": -25.523712158203125, "global_step": 295179, "epoch": 3556} {"train_loss": -25.4973201751709, "global_step": 295180, "epoch": 3556} {"train_loss": -25.6123104095459, "global_step": 295181, "epoch": 3556} {"train_loss": -25.79317283630371, "global_step": 295182, "epoch": 3556} {"train_loss": -25.88106346130371, "global_step": 295183, "epoch": 3556} {"train_loss": -25.596935272216797, "global_step": 295184, "epoch": 3556} {"train_loss": -25.897510528564453, "global_step": 295185, "epoch": 3556} {"train_loss": -25.41873550415039, "global_step": 295186, "epoch": 3556} {"train_loss": -25.497968673706055, "global_step": 295187, "epoch": 3556} {"train_loss": -25.6299991607666, "global_step": 295188, "epoch": 3556} {"train_loss": -25.657825469970703, "global_step": 295189, "epoch": 3556} {"train_loss": -25.923429489135742, "global_step": 295190, "epoch": 3556} {"train_loss": -25.446598052978516, "global_step": 295191, "epoch": 3556} {"train_loss": -25.6749267578125, "global_step": 295192, "epoch": 3556} {"train_loss": -25.849149703979492, "global_step": 295193, "epoch": 3556} {"train_loss": -25.973617553710938, "global_step": 295194, "epoch": 3556} {"train_loss": -25.35167121887207, "global_step": 295195, "epoch": 3556} {"train_loss": -25.51443099975586, "global_step": 295196, "epoch": 3556} {"train_loss": -25.689802169799805, "global_step": 295197, "epoch": 3556} {"train_loss": -25.709503173828125, "global_step": 295198, "epoch": 3556} {"train_loss": -25.576053619384766, "global_step": 295199, "epoch": 3556} {"train_loss": -25.938562393188477, "global_step": 295200, "epoch": 3556} {"train_loss": -25.4903564453125, "global_step": 295201, "epoch": 3556} {"train_loss": -25.37672233581543, "global_step": 295202, "epoch": 3556} {"train_loss": -25.906116485595703, "global_step": 295203, "epoch": 3556} {"train_loss": -25.60389518737793, "global_step": 295204, "epoch": 3556} {"train_loss": -25.171499252319336, "global_step": 295205, "epoch": 3556} {"train_loss": -25.438703536987305, "global_step": 295206, "epoch": 3556} {"train_loss": -25.558650970458984, "global_step": 295207, "epoch": 3556} {"train_loss": -25.188568115234375, "global_step": 295208, "epoch": 3556} {"train_loss": -25.644678115844727, "global_step": 295209, "epoch": 3556} {"train_loss": -25.60151481628418, "global_step": 295210, "epoch": 3556} {"train_loss": -25.304357528686523, "global_step": 295211, "epoch": 3556} {"train_loss": -25.814594268798828, "global_step": 295212, "epoch": 3556} {"train_loss": -25.376495361328125, "global_step": 295213, "epoch": 3556} {"train_loss": -25.51549530029297, "global_step": 295214, "epoch": 3556} {"train_loss": -25.6739559173584, "global_step": 295215, "epoch": 3556} {"train_loss": -25.824787139892578, "global_step": 295216, "epoch": 3556} {"train_loss": -25.487634658813477, "global_step": 295217, "epoch": 3556} {"train_loss": -25.33998680114746, "global_step": 295218, "epoch": 3556} {"train_loss": -25.189794540405273, "global_step": 295219, "epoch": 3556} {"train_loss": -25.458389282226562, "global_step": 295220, "epoch": 3556} {"train_loss": -25.352514266967773, "global_step": 295221, "epoch": 3556} {"train_loss": -25.61895751953125, "global_step": 295222, "epoch": 3556} {"train_loss": -25.364322662353516, "global_step": 295223, "epoch": 3556} {"train_loss": -25.304290771484375, "global_step": 295224, "epoch": 3556} {"train_loss": -26.00162696838379, "global_step": 295225, "epoch": 3556} {"train_loss": -25.45857048034668, "global_step": 295226, "epoch": 3556} {"train_loss": -25.625534057617188, "global_step": 295227, "epoch": 3556} {"train_loss": -25.821060180664062, "global_step": 295228, "epoch": 3556} {"train_loss": -25.542869567871094, "global_step": 295229, "epoch": 3556} {"train_loss": -25.387769836977302, "global_step": 295230, "epoch": 3556, "val_loss": 7076155.0} {"train_loss": -24.758756637573242, "global_step": 295231, "epoch": 3557} {"train_loss": -25.161542892456055, "global_step": 295232, "epoch": 3557} {"train_loss": -25.322263717651367, "global_step": 295233, "epoch": 3557} {"train_loss": -24.725788116455078, "global_step": 295234, "epoch": 3557} {"train_loss": -25.136796951293945, "global_step": 295235, "epoch": 3557} {"train_loss": -25.20012855529785, "global_step": 295236, "epoch": 3557} {"train_loss": -25.518512725830078, "global_step": 295237, "epoch": 3557} {"train_loss": -25.320255279541016, "global_step": 295238, "epoch": 3557} {"train_loss": -25.06719970703125, "global_step": 295239, "epoch": 3557} {"train_loss": -25.192581176757812, "global_step": 295240, "epoch": 3557} {"train_loss": -25.431642532348633, "global_step": 295241, "epoch": 3557} {"train_loss": -24.9269962310791, "global_step": 295242, "epoch": 3557} {"train_loss": -25.850919723510742, "global_step": 295243, "epoch": 3557} {"train_loss": -25.25746726989746, "global_step": 295244, "epoch": 3557} {"train_loss": -25.44064712524414, "global_step": 295245, "epoch": 3557} {"train_loss": -25.734426498413086, "global_step": 295246, "epoch": 3557} {"train_loss": -25.84099769592285, "global_step": 295247, "epoch": 3557} {"train_loss": -25.904340744018555, "global_step": 295248, "epoch": 3557} {"train_loss": -25.83515739440918, "global_step": 295249, "epoch": 3557} {"train_loss": -25.636489868164062, "global_step": 295250, "epoch": 3557} {"train_loss": -25.842742919921875, "global_step": 295251, "epoch": 3557} {"train_loss": -25.647857666015625, "global_step": 295252, "epoch": 3557} {"train_loss": -25.446308135986328, "global_step": 295253, "epoch": 3557} {"train_loss": -25.558961868286133, "global_step": 295254, "epoch": 3557} {"train_loss": -25.74444007873535, "global_step": 295255, "epoch": 3557} {"train_loss": -25.681074142456055, "global_step": 295256, "epoch": 3557} {"train_loss": -25.72625732421875, "global_step": 295257, "epoch": 3557} {"train_loss": -25.834857940673828, "global_step": 295258, "epoch": 3557} {"train_loss": -25.691192626953125, "global_step": 295259, "epoch": 3557} {"train_loss": -25.733915328979492, "global_step": 295260, "epoch": 3557} {"train_loss": -25.53073501586914, "global_step": 295261, "epoch": 3557} {"train_loss": -25.570775985717773, "global_step": 295262, "epoch": 3557} {"train_loss": -25.425153732299805, "global_step": 295263, "epoch": 3557} {"train_loss": -25.869827270507812, "global_step": 295264, "epoch": 3557} {"train_loss": -25.54603385925293, "global_step": 295265, "epoch": 3557} {"train_loss": -25.41242790222168, "global_step": 295266, "epoch": 3557} {"train_loss": -25.5024356842041, "global_step": 295267, "epoch": 3557} {"train_loss": -25.674238204956055, "global_step": 295268, "epoch": 3557} {"train_loss": -26.016254425048828, "global_step": 295269, "epoch": 3557} {"train_loss": -25.5231990814209, "global_step": 295270, "epoch": 3557} {"train_loss": -25.662525177001953, "global_step": 295271, "epoch": 3557} {"train_loss": -25.914026260375977, "global_step": 295272, "epoch": 3557} {"train_loss": -26.008163452148438, "global_step": 295273, "epoch": 3557} {"train_loss": -25.70827293395996, "global_step": 295274, "epoch": 3557} {"train_loss": -25.862537384033203, "global_step": 295275, "epoch": 3557} {"train_loss": -25.963150024414062, "global_step": 295276, "epoch": 3557} {"train_loss": -24.991315841674805, "global_step": 295277, "epoch": 3557} {"train_loss": -25.59463882446289, "global_step": 295278, "epoch": 3557} {"train_loss": -25.319690704345703, "global_step": 295279, "epoch": 3557} {"train_loss": -25.312286376953125, "global_step": 295280, "epoch": 3557} {"train_loss": -25.64837074279785, "global_step": 295281, "epoch": 3557} {"train_loss": -25.481679916381836, "global_step": 295282, "epoch": 3557} {"train_loss": -25.607084274291992, "global_step": 295283, "epoch": 3557} {"train_loss": -25.860727310180664, "global_step": 295284, "epoch": 3557} {"train_loss": -25.240713119506836, "global_step": 295285, "epoch": 3557} {"train_loss": -25.726591110229492, "global_step": 295286, "epoch": 3557} {"train_loss": -25.493986129760742, "global_step": 295287, "epoch": 3557} {"train_loss": -25.473773956298828, "global_step": 295288, "epoch": 3557} {"train_loss": -25.860885620117188, "global_step": 295289, "epoch": 3557} {"train_loss": -25.563461303710938, "global_step": 295290, "epoch": 3557} {"train_loss": -25.781721115112305, "global_step": 295291, "epoch": 3557} {"train_loss": -25.935529708862305, "global_step": 295292, "epoch": 3557} {"train_loss": -25.53316307067871, "global_step": 295293, "epoch": 3557} {"train_loss": -25.55371856689453, "global_step": 295294, "epoch": 3557} {"train_loss": -25.718778610229492, "global_step": 295295, "epoch": 3557} {"train_loss": -25.806970596313477, "global_step": 295296, "epoch": 3557} {"train_loss": -25.64607810974121, "global_step": 295297, "epoch": 3557} {"train_loss": -26.140369415283203, "global_step": 295298, "epoch": 3557} {"train_loss": -25.62872314453125, "global_step": 295299, "epoch": 3557} {"train_loss": -25.83330726623535, "global_step": 295300, "epoch": 3557} {"train_loss": -25.457212448120117, "global_step": 295301, "epoch": 3557} {"train_loss": -25.81180191040039, "global_step": 295302, "epoch": 3557} {"train_loss": -25.596704483032227, "global_step": 295303, "epoch": 3557} {"train_loss": -25.854175567626953, "global_step": 295304, "epoch": 3557} {"train_loss": -25.872344970703125, "global_step": 295305, "epoch": 3557} {"train_loss": -25.489185333251953, "global_step": 295306, "epoch": 3557} {"train_loss": -25.518476486206055, "global_step": 295307, "epoch": 3557} {"train_loss": -25.64617347717285, "global_step": 295308, "epoch": 3557} {"train_loss": -25.751611709594727, "global_step": 295309, "epoch": 3557} {"train_loss": -25.383769989013672, "global_step": 295310, "epoch": 3557} {"train_loss": -25.50417137145996, "global_step": 295311, "epoch": 3557} {"train_loss": -25.458219528198242, "global_step": 295312, "epoch": 3557} {"train_loss": -25.569891826215997, "global_step": 295313, "epoch": 3557, "val_loss": 7172353.0} {"train_loss": -24.686939239501953, "global_step": 295314, "epoch": 3558} {"train_loss": -24.35700035095215, "global_step": 295315, "epoch": 3558} {"train_loss": -25.095218658447266, "global_step": 295316, "epoch": 3558} {"train_loss": -25.153547286987305, "global_step": 295317, "epoch": 3558} {"train_loss": -24.660194396972656, "global_step": 295318, "epoch": 3558} {"train_loss": -24.749656677246094, "global_step": 295319, "epoch": 3558} {"train_loss": -25.20330810546875, "global_step": 295320, "epoch": 3558} {"train_loss": -24.952106475830078, "global_step": 295321, "epoch": 3558} {"train_loss": -24.97901725769043, "global_step": 295322, "epoch": 3558} {"train_loss": -25.22782325744629, "global_step": 295323, "epoch": 3558} {"train_loss": -25.386873245239258, "global_step": 295324, "epoch": 3558} {"train_loss": -25.199073791503906, "global_step": 295325, "epoch": 3558} {"train_loss": -25.01887321472168, "global_step": 295326, "epoch": 3558} {"train_loss": -25.10201072692871, "global_step": 295327, "epoch": 3558} {"train_loss": -25.184219360351562, "global_step": 295328, "epoch": 3558} {"train_loss": -25.0965576171875, "global_step": 295329, "epoch": 3558} {"train_loss": -25.403270721435547, "global_step": 295330, "epoch": 3558} {"train_loss": -25.28529167175293, "global_step": 295331, "epoch": 3558} {"train_loss": -25.29950714111328, "global_step": 295332, "epoch": 3558} {"train_loss": -25.182287216186523, "global_step": 295333, "epoch": 3558} {"train_loss": -25.09064292907715, "global_step": 295334, "epoch": 3558} {"train_loss": -25.136070251464844, "global_step": 295335, "epoch": 3558} {"train_loss": -25.32893180847168, "global_step": 295336, "epoch": 3558} {"train_loss": -25.39955711364746, "global_step": 295337, "epoch": 3558} {"train_loss": -25.468833923339844, "global_step": 295338, "epoch": 3558} {"train_loss": -25.752134323120117, "global_step": 295339, "epoch": 3558} {"train_loss": -25.5570125579834, "global_step": 295340, "epoch": 3558} {"train_loss": -25.651220321655273, "global_step": 295341, "epoch": 3558} {"train_loss": -25.43465232849121, "global_step": 295342, "epoch": 3558} {"train_loss": -25.59092140197754, "global_step": 295343, "epoch": 3558} {"train_loss": -25.314611434936523, "global_step": 295344, "epoch": 3558} {"train_loss": -25.72125244140625, "global_step": 295345, "epoch": 3558} {"train_loss": -25.37378692626953, "global_step": 295346, "epoch": 3558} {"train_loss": -25.300003051757812, "global_step": 295347, "epoch": 3558} {"train_loss": -25.4191837310791, "global_step": 295348, "epoch": 3558} {"train_loss": -25.36533546447754, "global_step": 295349, "epoch": 3558} {"train_loss": -26.075687408447266, "global_step": 295350, "epoch": 3558} {"train_loss": -25.8476619720459, "global_step": 295351, "epoch": 3558} {"train_loss": -25.75722312927246, "global_step": 295352, "epoch": 3558} {"train_loss": -25.570219039916992, "global_step": 295353, "epoch": 3558} {"train_loss": -25.6632080078125, "global_step": 295354, "epoch": 3558} {"train_loss": -25.72918128967285, "global_step": 295355, "epoch": 3558} {"train_loss": -25.84747314453125, "global_step": 295356, "epoch": 3558} {"train_loss": -25.409353256225586, "global_step": 295357, "epoch": 3558} {"train_loss": -25.442411422729492, "global_step": 295358, "epoch": 3558} {"train_loss": -25.489017486572266, "global_step": 295359, "epoch": 3558} {"train_loss": -25.74030113220215, "global_step": 295360, "epoch": 3558} {"train_loss": -26.025806427001953, "global_step": 295361, "epoch": 3558} {"train_loss": -25.54798698425293, "global_step": 295362, "epoch": 3558} {"train_loss": -25.83577537536621, "global_step": 295363, "epoch": 3558} {"train_loss": -25.6983699798584, "global_step": 295364, "epoch": 3558} {"train_loss": -25.177934646606445, "global_step": 295365, "epoch": 3558} {"train_loss": -25.796375274658203, "global_step": 295366, "epoch": 3558} {"train_loss": -25.302499771118164, "global_step": 295367, "epoch": 3558} {"train_loss": -25.83626365661621, "global_step": 295368, "epoch": 3558} {"train_loss": -25.616037368774414, "global_step": 295369, "epoch": 3558} {"train_loss": -26.009313583374023, "global_step": 295370, "epoch": 3558} {"train_loss": -25.320280075073242, "global_step": 295371, "epoch": 3558} {"train_loss": -25.460485458374023, "global_step": 295372, "epoch": 3558} {"train_loss": -25.567304611206055, "global_step": 295373, "epoch": 3558} {"train_loss": -25.578115463256836, "global_step": 295374, "epoch": 3558} {"train_loss": -25.750537872314453, "global_step": 295375, "epoch": 3558} {"train_loss": -25.378381729125977, "global_step": 295376, "epoch": 3558} {"train_loss": -25.377073287963867, "global_step": 295377, "epoch": 3558} {"train_loss": -25.574071884155273, "global_step": 295378, "epoch": 3558} {"train_loss": -25.623340606689453, "global_step": 295379, "epoch": 3558} {"train_loss": -25.541975021362305, "global_step": 295380, "epoch": 3558} {"train_loss": -25.9272518157959, "global_step": 295381, "epoch": 3558} {"train_loss": -25.841419219970703, "global_step": 295382, "epoch": 3558} {"train_loss": -25.46807098388672, "global_step": 295383, "epoch": 3558} {"train_loss": -25.58327293395996, "global_step": 295384, "epoch": 3558} {"train_loss": -25.53214454650879, "global_step": 295385, "epoch": 3558} {"train_loss": -25.83040428161621, "global_step": 295386, "epoch": 3558} {"train_loss": -25.769153594970703, "global_step": 295387, "epoch": 3558} {"train_loss": -26.04931640625, "global_step": 295388, "epoch": 3558} {"train_loss": -25.765745162963867, "global_step": 295389, "epoch": 3558} {"train_loss": -25.372333526611328, "global_step": 295390, "epoch": 3558} {"train_loss": -25.742996215820312, "global_step": 295391, "epoch": 3558} {"train_loss": -25.932403564453125, "global_step": 295392, "epoch": 3558} {"train_loss": -25.699909210205078, "global_step": 295393, "epoch": 3558} {"train_loss": -25.4589786529541, "global_step": 295394, "epoch": 3558} {"train_loss": -25.527862548828125, "global_step": 295395, "epoch": 3558} {"train_loss": -25.484387524156684, "global_step": 295396, "epoch": 3558, "val_loss": 7035276.0} {"train_loss": -21.409738540649414, "global_step": 295397, "epoch": 3559} {"train_loss": -23.12626838684082, "global_step": 295398, "epoch": 3559} {"train_loss": -24.014822006225586, "global_step": 295399, "epoch": 3559} {"train_loss": -23.2828311920166, "global_step": 295400, "epoch": 3559} {"train_loss": -23.991199493408203, "global_step": 295401, "epoch": 3559} {"train_loss": -24.0681209564209, "global_step": 295402, "epoch": 3559} {"train_loss": -24.3920841217041, "global_step": 295403, "epoch": 3559} {"train_loss": -23.98936653137207, "global_step": 295404, "epoch": 3559} {"train_loss": -24.506816864013672, "global_step": 295405, "epoch": 3559} {"train_loss": -24.240385055541992, "global_step": 295406, "epoch": 3559} {"train_loss": -24.504180908203125, "global_step": 295407, "epoch": 3559} {"train_loss": -24.556005477905273, "global_step": 295408, "epoch": 3559} {"train_loss": -24.562259674072266, "global_step": 295409, "epoch": 3559} {"train_loss": -24.744800567626953, "global_step": 295410, "epoch": 3559} {"train_loss": -24.70926856994629, "global_step": 295411, "epoch": 3559} {"train_loss": -24.5662899017334, "global_step": 295412, "epoch": 3559} {"train_loss": -24.766910552978516, "global_step": 295413, "epoch": 3559} {"train_loss": -24.55963706970215, "global_step": 295414, "epoch": 3559} {"train_loss": -24.700048446655273, "global_step": 295415, "epoch": 3559} {"train_loss": -24.57904052734375, "global_step": 295416, "epoch": 3559} {"train_loss": -24.84469985961914, "global_step": 295417, "epoch": 3559} {"train_loss": -24.908798217773438, "global_step": 295418, "epoch": 3559} {"train_loss": -25.181570053100586, "global_step": 295419, "epoch": 3559} {"train_loss": -24.997875213623047, "global_step": 295420, "epoch": 3559} {"train_loss": -24.907438278198242, "global_step": 295421, "epoch": 3559} {"train_loss": -25.029220581054688, "global_step": 295422, "epoch": 3559} {"train_loss": -25.07118797302246, "global_step": 295423, "epoch": 3559} {"train_loss": -24.698347091674805, "global_step": 295424, "epoch": 3559} {"train_loss": -24.910215377807617, "global_step": 295425, "epoch": 3559} {"train_loss": -24.823230743408203, "global_step": 295426, "epoch": 3559} {"train_loss": -25.029146194458008, "global_step": 295427, "epoch": 3559} {"train_loss": -25.195463180541992, "global_step": 295428, "epoch": 3559} {"train_loss": -25.325180053710938, "global_step": 295429, "epoch": 3559} {"train_loss": -25.324804306030273, "global_step": 295430, "epoch": 3559} {"train_loss": -25.099279403686523, "global_step": 295431, "epoch": 3559} {"train_loss": -25.190275192260742, "global_step": 295432, "epoch": 3559} {"train_loss": -25.474838256835938, "global_step": 295433, "epoch": 3559} {"train_loss": -25.06135368347168, "global_step": 295434, "epoch": 3559} {"train_loss": -25.441694259643555, "global_step": 295435, "epoch": 3559} {"train_loss": -25.224287033081055, "global_step": 295436, "epoch": 3559} {"train_loss": -25.343626022338867, "global_step": 295437, "epoch": 3559} {"train_loss": -25.23199462890625, "global_step": 295438, "epoch": 3559} {"train_loss": -25.5824031829834, "global_step": 295439, "epoch": 3559} {"train_loss": -25.152177810668945, "global_step": 295440, "epoch": 3559} {"train_loss": -25.295949935913086, "global_step": 295441, "epoch": 3559} {"train_loss": -25.419782638549805, "global_step": 295442, "epoch": 3559} {"train_loss": -25.48408317565918, "global_step": 295443, "epoch": 3559} {"train_loss": -25.21478843688965, "global_step": 295444, "epoch": 3559} {"train_loss": -25.20448875427246, "global_step": 295445, "epoch": 3559} {"train_loss": -25.110288619995117, "global_step": 295446, "epoch": 3559} {"train_loss": -25.25277328491211, "global_step": 295447, "epoch": 3559} {"train_loss": -25.235265731811523, "global_step": 295448, "epoch": 3559} {"train_loss": -25.171552658081055, "global_step": 295449, "epoch": 3559} {"train_loss": -25.294099807739258, "global_step": 295450, "epoch": 3559} {"train_loss": -25.36414909362793, "global_step": 295451, "epoch": 3559} {"train_loss": -25.668203353881836, "global_step": 295452, "epoch": 3559} {"train_loss": -25.636316299438477, "global_step": 295453, "epoch": 3559} {"train_loss": -25.583383560180664, "global_step": 295454, "epoch": 3559} {"train_loss": -25.351226806640625, "global_step": 295455, "epoch": 3559} {"train_loss": -24.885650634765625, "global_step": 295456, "epoch": 3559} {"train_loss": -25.4426326751709, "global_step": 295457, "epoch": 3559} {"train_loss": -25.728775024414062, "global_step": 295458, "epoch": 3559} {"train_loss": -25.424745559692383, "global_step": 295459, "epoch": 3559} {"train_loss": -25.306716918945312, "global_step": 295460, "epoch": 3559} {"train_loss": -25.594778060913086, "global_step": 295461, "epoch": 3559} {"train_loss": -25.69573402404785, "global_step": 295462, "epoch": 3559} {"train_loss": -25.274961471557617, "global_step": 295463, "epoch": 3559} {"train_loss": -25.753986358642578, "global_step": 295464, "epoch": 3559} {"train_loss": -25.59014892578125, "global_step": 295465, "epoch": 3559} {"train_loss": -25.451841354370117, "global_step": 295466, "epoch": 3559} {"train_loss": -25.272449493408203, "global_step": 295467, "epoch": 3559} {"train_loss": -25.36942481994629, "global_step": 295468, "epoch": 3559} {"train_loss": -25.696928024291992, "global_step": 295469, "epoch": 3559} {"train_loss": -25.56804847717285, "global_step": 295470, "epoch": 3559} {"train_loss": -25.880842208862305, "global_step": 295471, "epoch": 3559} {"train_loss": -25.456220626831055, "global_step": 295472, "epoch": 3559} {"train_loss": -25.705154418945312, "global_step": 295473, "epoch": 3559} {"train_loss": -25.777057647705078, "global_step": 295474, "epoch": 3559} {"train_loss": -25.815311431884766, "global_step": 295475, "epoch": 3559} {"train_loss": -25.718549728393555, "global_step": 295476, "epoch": 3559} {"train_loss": -25.573266983032227, "global_step": 295477, "epoch": 3559} {"train_loss": -25.767780303955078, "global_step": 295478, "epoch": 3559} {"train_loss": -25.036781173154534, "global_step": 295479, "epoch": 3559, "val_loss": 7189145.0} {"train_loss": -25.145071029663086, "global_step": 295480, "epoch": 3560} {"train_loss": -25.48487663269043, "global_step": 295481, "epoch": 3560} {"train_loss": -25.61488151550293, "global_step": 295482, "epoch": 3560} {"train_loss": -24.99647331237793, "global_step": 295483, "epoch": 3560} {"train_loss": -25.246715545654297, "global_step": 295484, "epoch": 3560} {"train_loss": -25.448591232299805, "global_step": 295485, "epoch": 3560} {"train_loss": -25.420291900634766, "global_step": 295486, "epoch": 3560} {"train_loss": -25.170902252197266, "global_step": 295487, "epoch": 3560} {"train_loss": -25.253070831298828, "global_step": 295488, "epoch": 3560} {"train_loss": -25.0413875579834, "global_step": 295489, "epoch": 3560} {"train_loss": -25.70395278930664, "global_step": 295490, "epoch": 3560} {"train_loss": -25.78034019470215, "global_step": 295491, "epoch": 3560} {"train_loss": -25.34380340576172, "global_step": 295492, "epoch": 3560} {"train_loss": -25.340988159179688, "global_step": 295493, "epoch": 3560} {"train_loss": -25.4475040435791, "global_step": 295494, "epoch": 3560} {"train_loss": -25.33821678161621, "global_step": 295495, "epoch": 3560} {"train_loss": -25.486785888671875, "global_step": 295496, "epoch": 3560} {"train_loss": -25.650232315063477, "global_step": 295497, "epoch": 3560} {"train_loss": -25.49281120300293, "global_step": 295498, "epoch": 3560} {"train_loss": -25.418954849243164, "global_step": 295499, "epoch": 3560} {"train_loss": -25.703399658203125, "global_step": 295500, "epoch": 3560} {"train_loss": -25.198333740234375, "global_step": 295501, "epoch": 3560} {"train_loss": -25.24671745300293, "global_step": 295502, "epoch": 3560} {"train_loss": -25.32552719116211, "global_step": 295503, "epoch": 3560} {"train_loss": -25.93106460571289, "global_step": 295504, "epoch": 3560} {"train_loss": -25.233596801757812, "global_step": 295505, "epoch": 3560} {"train_loss": -25.838830947875977, "global_step": 295506, "epoch": 3560} {"train_loss": -25.61842918395996, "global_step": 295507, "epoch": 3560} {"train_loss": -25.249313354492188, "global_step": 295508, "epoch": 3560} {"train_loss": -25.504358291625977, "global_step": 295509, "epoch": 3560} {"train_loss": -25.629858016967773, "global_step": 295510, "epoch": 3560} {"train_loss": -25.66704750061035, "global_step": 295511, "epoch": 3560} {"train_loss": -25.65814781188965, "global_step": 295512, "epoch": 3560} {"train_loss": -25.38168716430664, "global_step": 295513, "epoch": 3560} {"train_loss": -25.41021728515625, "global_step": 295514, "epoch": 3560} {"train_loss": -25.566980361938477, "global_step": 295515, "epoch": 3560} {"train_loss": -25.6284236907959, "global_step": 295516, "epoch": 3560} {"train_loss": -25.739688873291016, "global_step": 295517, "epoch": 3560} {"train_loss": -25.827075958251953, "global_step": 295518, "epoch": 3560} {"train_loss": -25.348331451416016, "global_step": 295519, "epoch": 3560} {"train_loss": -25.7108211517334, "global_step": 295520, "epoch": 3560} {"train_loss": -25.880115509033203, "global_step": 295521, "epoch": 3560} {"train_loss": -25.47036361694336, "global_step": 295522, "epoch": 3560} {"train_loss": -25.978979110717773, "global_step": 295523, "epoch": 3560} {"train_loss": -25.67976951599121, "global_step": 295524, "epoch": 3560} {"train_loss": -25.433696746826172, "global_step": 295525, "epoch": 3560} {"train_loss": -25.609323501586914, "global_step": 295526, "epoch": 3560} {"train_loss": -25.957250595092773, "global_step": 295527, "epoch": 3560} {"train_loss": -25.59842872619629, "global_step": 295528, "epoch": 3560} {"train_loss": -25.683109283447266, "global_step": 295529, "epoch": 3560} {"train_loss": -25.82834243774414, "global_step": 295530, "epoch": 3560} {"train_loss": -25.370176315307617, "global_step": 295531, "epoch": 3560} {"train_loss": -25.98431396484375, "global_step": 295532, "epoch": 3560} {"train_loss": -25.816213607788086, "global_step": 295533, "epoch": 3560} {"train_loss": -25.369300842285156, "global_step": 295534, "epoch": 3560} {"train_loss": -25.279226303100586, "global_step": 295535, "epoch": 3560} {"train_loss": -24.799280166625977, "global_step": 295536, "epoch": 3560} {"train_loss": -24.92998695373535, "global_step": 295537, "epoch": 3560} {"train_loss": -25.351062774658203, "global_step": 295538, "epoch": 3560} {"train_loss": -25.666889190673828, "global_step": 295539, "epoch": 3560} {"train_loss": -25.51685905456543, "global_step": 295540, "epoch": 3560} {"train_loss": -25.710479736328125, "global_step": 295541, "epoch": 3560} {"train_loss": -25.35321617126465, "global_step": 295542, "epoch": 3560} {"train_loss": -25.576448440551758, "global_step": 295543, "epoch": 3560} {"train_loss": -25.273359298706055, "global_step": 295544, "epoch": 3560} {"train_loss": -25.815170288085938, "global_step": 295545, "epoch": 3560} {"train_loss": -25.50431251525879, "global_step": 295546, "epoch": 3560} {"train_loss": -25.60211753845215, "global_step": 295547, "epoch": 3560} {"train_loss": -25.74226188659668, "global_step": 295548, "epoch": 3560} {"train_loss": -25.359792709350586, "global_step": 295549, "epoch": 3560} {"train_loss": -25.5097599029541, "global_step": 295550, "epoch": 3560} {"train_loss": -25.76369285583496, "global_step": 295551, "epoch": 3560} {"train_loss": -25.984106063842773, "global_step": 295552, "epoch": 3560} {"train_loss": -25.599096298217773, "global_step": 295553, "epoch": 3560} {"train_loss": -25.550580978393555, "global_step": 295554, "epoch": 3560} {"train_loss": -25.863061904907227, "global_step": 295555, "epoch": 3560} {"train_loss": -25.623443603515625, "global_step": 295556, "epoch": 3560} {"train_loss": -25.848154067993164, "global_step": 295557, "epoch": 3560} {"train_loss": -25.279584884643555, "global_step": 295558, "epoch": 3560} {"train_loss": -25.8509464263916, "global_step": 295559, "epoch": 3560} {"train_loss": -25.33729362487793, "global_step": 295560, "epoch": 3560} {"train_loss": -25.889572143554688, "global_step": 295561, "epoch": 3560} {"train_loss": -25.527893089386353, "global_step": 295562, "epoch": 3560, "val_loss": 7113485.0} {"train_loss": -25.028905868530273, "global_step": 295563, "epoch": 3561} {"train_loss": -24.99835968017578, "global_step": 295564, "epoch": 3561} {"train_loss": -25.208955764770508, "global_step": 295565, "epoch": 3561} {"train_loss": -25.07753562927246, "global_step": 295566, "epoch": 3561} {"train_loss": -25.17088508605957, "global_step": 295567, "epoch": 3561} {"train_loss": -25.128332138061523, "global_step": 295568, "epoch": 3561} {"train_loss": -25.039682388305664, "global_step": 295569, "epoch": 3561} {"train_loss": -25.578527450561523, "global_step": 295570, "epoch": 3561} {"train_loss": -25.449548721313477, "global_step": 295571, "epoch": 3561} {"train_loss": -25.53969383239746, "global_step": 295572, "epoch": 3561} {"train_loss": -25.674652099609375, "global_step": 295573, "epoch": 3561} {"train_loss": -25.23509979248047, "global_step": 295574, "epoch": 3561} {"train_loss": -25.2069149017334, "global_step": 295575, "epoch": 3561} {"train_loss": -25.35969352722168, "global_step": 295576, "epoch": 3561} {"train_loss": -25.310564041137695, "global_step": 295577, "epoch": 3561} {"train_loss": -25.64588737487793, "global_step": 295578, "epoch": 3561} {"train_loss": -25.48689842224121, "global_step": 295579, "epoch": 3561} {"train_loss": -25.541690826416016, "global_step": 295580, "epoch": 3561} {"train_loss": -25.70674705505371, "global_step": 295581, "epoch": 3561} {"train_loss": -25.6303653717041, "global_step": 295582, "epoch": 3561} {"train_loss": -25.692243576049805, "global_step": 295583, "epoch": 3561} {"train_loss": -25.77495765686035, "global_step": 295584, "epoch": 3561} {"train_loss": -25.532590866088867, "global_step": 295585, "epoch": 3561} {"train_loss": -25.464818954467773, "global_step": 295586, "epoch": 3561} {"train_loss": -25.67934226989746, "global_step": 295587, "epoch": 3561} {"train_loss": -25.864980697631836, "global_step": 295588, "epoch": 3561} {"train_loss": -25.422983169555664, "global_step": 295589, "epoch": 3561} {"train_loss": -26.025802612304688, "global_step": 295590, "epoch": 3561} {"train_loss": -25.773426055908203, "global_step": 295591, "epoch": 3561} {"train_loss": -25.504175186157227, "global_step": 295592, "epoch": 3561} {"train_loss": -26.019384384155273, "global_step": 295593, "epoch": 3561} {"train_loss": -25.87700843811035, "global_step": 295594, "epoch": 3561} {"train_loss": -25.902402877807617, "global_step": 295595, "epoch": 3561} {"train_loss": -25.362831115722656, "global_step": 295596, "epoch": 3561} {"train_loss": -25.763486862182617, "global_step": 295597, "epoch": 3561} {"train_loss": -25.510774612426758, "global_step": 295598, "epoch": 3561} {"train_loss": -25.335966110229492, "global_step": 295599, "epoch": 3561} {"train_loss": -25.484207153320312, "global_step": 295600, "epoch": 3561} {"train_loss": -25.80242347717285, "global_step": 295601, "epoch": 3561} {"train_loss": -25.76970863342285, "global_step": 295602, "epoch": 3561} {"train_loss": -25.833642959594727, "global_step": 295603, "epoch": 3561} {"train_loss": -26.00725746154785, "global_step": 295604, "epoch": 3561} {"train_loss": -25.722564697265625, "global_step": 295605, "epoch": 3561} {"train_loss": -25.598529815673828, "global_step": 295606, "epoch": 3561} {"train_loss": -25.641660690307617, "global_step": 295607, "epoch": 3561} {"train_loss": -25.349761962890625, "global_step": 295608, "epoch": 3561} {"train_loss": -25.48906898498535, "global_step": 295609, "epoch": 3561} {"train_loss": -26.011474609375, "global_step": 295610, "epoch": 3561} {"train_loss": -25.751432418823242, "global_step": 295611, "epoch": 3561} {"train_loss": -25.42769432067871, "global_step": 295612, "epoch": 3561} {"train_loss": -25.51694107055664, "global_step": 295613, "epoch": 3561} {"train_loss": -25.91864585876465, "global_step": 295614, "epoch": 3561} {"train_loss": -25.580698013305664, "global_step": 295615, "epoch": 3561} {"train_loss": -25.397470474243164, "global_step": 295616, "epoch": 3561} {"train_loss": -25.577301025390625, "global_step": 295617, "epoch": 3561} {"train_loss": -25.875274658203125, "global_step": 295618, "epoch": 3561} {"train_loss": -25.65467643737793, "global_step": 295619, "epoch": 3561} {"train_loss": -25.767532348632812, "global_step": 295620, "epoch": 3561} {"train_loss": -25.815963745117188, "global_step": 295621, "epoch": 3561} {"train_loss": -25.796762466430664, "global_step": 295622, "epoch": 3561} {"train_loss": -25.847543716430664, "global_step": 295623, "epoch": 3561} {"train_loss": -25.307668685913086, "global_step": 295624, "epoch": 3561} {"train_loss": -25.41961669921875, "global_step": 295625, "epoch": 3561} {"train_loss": -25.638593673706055, "global_step": 295626, "epoch": 3561} {"train_loss": -26.12360191345215, "global_step": 295627, "epoch": 3561} {"train_loss": -25.364904403686523, "global_step": 295628, "epoch": 3561} {"train_loss": -25.80586814880371, "global_step": 295629, "epoch": 3561} {"train_loss": -25.44473648071289, "global_step": 295630, "epoch": 3561} {"train_loss": -25.367076873779297, "global_step": 295631, "epoch": 3561} {"train_loss": -25.728687286376953, "global_step": 295632, "epoch": 3561} {"train_loss": -25.2437686920166, "global_step": 295633, "epoch": 3561} {"train_loss": -25.582361221313477, "global_step": 295634, "epoch": 3561} {"train_loss": -25.530481338500977, "global_step": 295635, "epoch": 3561} {"train_loss": -25.761022567749023, "global_step": 295636, "epoch": 3561} {"train_loss": -25.615156173706055, "global_step": 295637, "epoch": 3561} {"train_loss": -25.41244888305664, "global_step": 295638, "epoch": 3561} {"train_loss": -25.726110458374023, "global_step": 295639, "epoch": 3561} {"train_loss": -25.625146865844727, "global_step": 295640, "epoch": 3561} {"train_loss": -25.732105255126953, "global_step": 295641, "epoch": 3561} {"train_loss": -25.455799102783203, "global_step": 295642, "epoch": 3561} {"train_loss": -25.966367721557617, "global_step": 295643, "epoch": 3561} {"train_loss": -25.4063720703125, "global_step": 295644, "epoch": 3561} {"train_loss": -25.581278789474304, "global_step": 295645, "epoch": 3561, "val_loss": 7228267.0} {"train_loss": -24.209341049194336, "global_step": 295646, "epoch": 3562} {"train_loss": -24.680648803710938, "global_step": 295647, "epoch": 3562} {"train_loss": -25.118457794189453, "global_step": 295648, "epoch": 3562} {"train_loss": -24.210205078125, "global_step": 295649, "epoch": 3562} {"train_loss": -24.79193687438965, "global_step": 295650, "epoch": 3562} {"train_loss": -24.430110931396484, "global_step": 295651, "epoch": 3562} {"train_loss": -25.089200973510742, "global_step": 295652, "epoch": 3562} {"train_loss": -24.719802856445312, "global_step": 295653, "epoch": 3562} {"train_loss": -24.6796932220459, "global_step": 295654, "epoch": 3562} {"train_loss": -24.92637062072754, "global_step": 295655, "epoch": 3562} {"train_loss": -24.663156509399414, "global_step": 295656, "epoch": 3562} {"train_loss": -24.62140464782715, "global_step": 295657, "epoch": 3562} {"train_loss": -25.313894271850586, "global_step": 295658, "epoch": 3562} {"train_loss": -24.959745407104492, "global_step": 295659, "epoch": 3562} {"train_loss": -25.014375686645508, "global_step": 295660, "epoch": 3562} {"train_loss": -25.413257598876953, "global_step": 295661, "epoch": 3562} {"train_loss": -25.289886474609375, "global_step": 295662, "epoch": 3562} {"train_loss": -25.31281089782715, "global_step": 295663, "epoch": 3562} {"train_loss": -25.274351119995117, "global_step": 295664, "epoch": 3562} {"train_loss": -25.58475112915039, "global_step": 295665, "epoch": 3562} {"train_loss": -25.042539596557617, "global_step": 295666, "epoch": 3562} {"train_loss": -25.496801376342773, "global_step": 295667, "epoch": 3562} {"train_loss": -25.326553344726562, "global_step": 295668, "epoch": 3562} {"train_loss": -25.359832763671875, "global_step": 295669, "epoch": 3562} {"train_loss": -25.59116554260254, "global_step": 295670, "epoch": 3562} {"train_loss": -25.570035934448242, "global_step": 295671, "epoch": 3562} {"train_loss": -25.535409927368164, "global_step": 295672, "epoch": 3562} {"train_loss": -25.034820556640625, "global_step": 295673, "epoch": 3562} {"train_loss": -25.401214599609375, "global_step": 295674, "epoch": 3562} {"train_loss": -25.495254516601562, "global_step": 295675, "epoch": 3562} {"train_loss": -25.782501220703125, "global_step": 295676, "epoch": 3562} {"train_loss": -25.320327758789062, "global_step": 295677, "epoch": 3562} {"train_loss": -25.621191024780273, "global_step": 295678, "epoch": 3562} {"train_loss": -25.2585391998291, "global_step": 295679, "epoch": 3562} {"train_loss": -25.18491554260254, "global_step": 295680, "epoch": 3562} {"train_loss": -25.514667510986328, "global_step": 295681, "epoch": 3562} {"train_loss": -25.595043182373047, "global_step": 295682, "epoch": 3562} {"train_loss": -25.661792755126953, "global_step": 295683, "epoch": 3562} {"train_loss": -25.786941528320312, "global_step": 295684, "epoch": 3562} {"train_loss": -25.664499282836914, "global_step": 295685, "epoch": 3562} {"train_loss": -25.643884658813477, "global_step": 295686, "epoch": 3562} {"train_loss": -25.168058395385742, "global_step": 295687, "epoch": 3562} {"train_loss": -25.660720825195312, "global_step": 295688, "epoch": 3562} {"train_loss": -25.359479904174805, "global_step": 295689, "epoch": 3562} {"train_loss": -25.5201358795166, "global_step": 295690, "epoch": 3562} {"train_loss": -25.669702529907227, "global_step": 295691, "epoch": 3562} {"train_loss": -25.453899383544922, "global_step": 295692, "epoch": 3562} {"train_loss": -25.896320343017578, "global_step": 295693, "epoch": 3562} {"train_loss": -25.843719482421875, "global_step": 295694, "epoch": 3562} {"train_loss": -25.57608985900879, "global_step": 295695, "epoch": 3562} {"train_loss": -25.8470401763916, "global_step": 295696, "epoch": 3562} {"train_loss": -25.620718002319336, "global_step": 295697, "epoch": 3562} {"train_loss": -25.90247917175293, "global_step": 295698, "epoch": 3562} {"train_loss": -25.546369552612305, "global_step": 295699, "epoch": 3562} {"train_loss": -25.72513771057129, "global_step": 295700, "epoch": 3562} {"train_loss": -25.55498504638672, "global_step": 295701, "epoch": 3562} {"train_loss": -25.7862491607666, "global_step": 295702, "epoch": 3562} {"train_loss": -25.915658950805664, "global_step": 295703, "epoch": 3562} {"train_loss": -25.80078125, "global_step": 295704, "epoch": 3562} {"train_loss": -25.863134384155273, "global_step": 295705, "epoch": 3562} {"train_loss": -25.867053985595703, "global_step": 295706, "epoch": 3562} {"train_loss": -25.64630699157715, "global_step": 295707, "epoch": 3562} {"train_loss": -25.65407371520996, "global_step": 295708, "epoch": 3562} {"train_loss": -25.777509689331055, "global_step": 295709, "epoch": 3562} {"train_loss": -25.56606101989746, "global_step": 295710, "epoch": 3562} {"train_loss": -25.522911071777344, "global_step": 295711, "epoch": 3562} {"train_loss": -25.709192276000977, "global_step": 295712, "epoch": 3562} {"train_loss": -25.63720703125, "global_step": 295713, "epoch": 3562} {"train_loss": -25.809431076049805, "global_step": 295714, "epoch": 3562} {"train_loss": -25.839771270751953, "global_step": 295715, "epoch": 3562} {"train_loss": -25.710407257080078, "global_step": 295716, "epoch": 3562} {"train_loss": -25.261661529541016, "global_step": 295717, "epoch": 3562} {"train_loss": -25.198856353759766, "global_step": 295718, "epoch": 3562} {"train_loss": -25.672224044799805, "global_step": 295719, "epoch": 3562} {"train_loss": -25.93556022644043, "global_step": 295720, "epoch": 3562} {"train_loss": -25.50973129272461, "global_step": 295721, "epoch": 3562} {"train_loss": -25.714963912963867, "global_step": 295722, "epoch": 3562} {"train_loss": -25.525609970092773, "global_step": 295723, "epoch": 3562} {"train_loss": -25.2804012298584, "global_step": 295724, "epoch": 3562} {"train_loss": -25.19784927368164, "global_step": 295725, "epoch": 3562} {"train_loss": -25.45509147644043, "global_step": 295726, "epoch": 3562} {"train_loss": -25.300521850585938, "global_step": 295727, "epoch": 3562} {"train_loss": -25.41795739782862, "global_step": 295728, "epoch": 3562, "val_loss": 7060061.5} {"train_loss": -21.215810775756836, "global_step": 295729, "epoch": 3563} {"train_loss": -23.754905700683594, "global_step": 295730, "epoch": 3563} {"train_loss": -22.87874412536621, "global_step": 295731, "epoch": 3563} {"train_loss": -24.1146240234375, "global_step": 295732, "epoch": 3563} {"train_loss": -23.849369049072266, "global_step": 295733, "epoch": 3563} {"train_loss": -23.671371459960938, "global_step": 295734, "epoch": 3563} {"train_loss": -24.381702423095703, "global_step": 295735, "epoch": 3563} {"train_loss": -24.3537654876709, "global_step": 295736, "epoch": 3563} {"train_loss": -24.24213981628418, "global_step": 295737, "epoch": 3563} {"train_loss": -24.385358810424805, "global_step": 295738, "epoch": 3563} {"train_loss": -24.448213577270508, "global_step": 295739, "epoch": 3563} {"train_loss": -24.260093688964844, "global_step": 295740, "epoch": 3563} {"train_loss": -24.456235885620117, "global_step": 295741, "epoch": 3563} {"train_loss": -24.492807388305664, "global_step": 295742, "epoch": 3563} {"train_loss": -24.17107582092285, "global_step": 295743, "epoch": 3563} {"train_loss": -24.429250717163086, "global_step": 295744, "epoch": 3563} {"train_loss": -24.3627986907959, "global_step": 295745, "epoch": 3563} {"train_loss": -24.783187866210938, "global_step": 295746, "epoch": 3563} {"train_loss": -24.68669891357422, "global_step": 295747, "epoch": 3563} {"train_loss": -24.378787994384766, "global_step": 295748, "epoch": 3563} {"train_loss": -24.91187286376953, "global_step": 295749, "epoch": 3563} {"train_loss": -24.42416763305664, "global_step": 295750, "epoch": 3563} {"train_loss": -24.843679428100586, "global_step": 295751, "epoch": 3563} {"train_loss": -24.940961837768555, "global_step": 295752, "epoch": 3563} {"train_loss": -24.7957820892334, "global_step": 295753, "epoch": 3563} {"train_loss": -24.5376033782959, "global_step": 295754, "epoch": 3563} {"train_loss": -24.808063507080078, "global_step": 295755, "epoch": 3563} {"train_loss": -24.935197830200195, "global_step": 295756, "epoch": 3563} {"train_loss": -25.251283645629883, "global_step": 295757, "epoch": 3563} {"train_loss": -25.155668258666992, "global_step": 295758, "epoch": 3563} {"train_loss": -25.1380558013916, "global_step": 295759, "epoch": 3563} {"train_loss": -25.34707260131836, "global_step": 295760, "epoch": 3563} {"train_loss": -25.1778507232666, "global_step": 295761, "epoch": 3563} {"train_loss": -25.130361557006836, "global_step": 295762, "epoch": 3563} {"train_loss": -25.016401290893555, "global_step": 295763, "epoch": 3563} {"train_loss": -25.271343231201172, "global_step": 295764, "epoch": 3563} {"train_loss": -25.407337188720703, "global_step": 295765, "epoch": 3563} {"train_loss": -25.346622467041016, "global_step": 295766, "epoch": 3563} {"train_loss": -25.213239669799805, "global_step": 295767, "epoch": 3563} {"train_loss": -25.46503448486328, "global_step": 295768, "epoch": 3563} {"train_loss": -25.37997817993164, "global_step": 295769, "epoch": 3563} {"train_loss": -25.504907608032227, "global_step": 295770, "epoch": 3563} {"train_loss": -25.296689987182617, "global_step": 295771, "epoch": 3563} {"train_loss": -25.154027938842773, "global_step": 295772, "epoch": 3563} {"train_loss": -25.362966537475586, "global_step": 295773, "epoch": 3563} {"train_loss": -25.301542282104492, "global_step": 295774, "epoch": 3563} {"train_loss": -25.4455509185791, "global_step": 295775, "epoch": 3563} {"train_loss": -25.519412994384766, "global_step": 295776, "epoch": 3563} {"train_loss": -25.568649291992188, "global_step": 295777, "epoch": 3563} {"train_loss": -25.243518829345703, "global_step": 295778, "epoch": 3563} {"train_loss": -25.56325340270996, "global_step": 295779, "epoch": 3563} {"train_loss": -25.463083267211914, "global_step": 295780, "epoch": 3563} {"train_loss": -25.46087074279785, "global_step": 295781, "epoch": 3563} {"train_loss": -25.37217140197754, "global_step": 295782, "epoch": 3563} {"train_loss": -25.446353912353516, "global_step": 295783, "epoch": 3563} {"train_loss": -25.405332565307617, "global_step": 295784, "epoch": 3563} {"train_loss": -25.04107093811035, "global_step": 295785, "epoch": 3563} {"train_loss": -25.517560958862305, "global_step": 295786, "epoch": 3563} {"train_loss": -25.845279693603516, "global_step": 295787, "epoch": 3563} {"train_loss": -25.3856201171875, "global_step": 295788, "epoch": 3563} {"train_loss": -25.42652702331543, "global_step": 295789, "epoch": 3563} {"train_loss": -25.408849716186523, "global_step": 295790, "epoch": 3563} {"train_loss": -25.629425048828125, "global_step": 295791, "epoch": 3563} {"train_loss": -25.59292984008789, "global_step": 295792, "epoch": 3563} {"train_loss": -25.376285552978516, "global_step": 295793, "epoch": 3563} {"train_loss": -25.288373947143555, "global_step": 295794, "epoch": 3563} {"train_loss": -25.298837661743164, "global_step": 295795, "epoch": 3563} {"train_loss": -25.749286651611328, "global_step": 295796, "epoch": 3563} {"train_loss": -25.651569366455078, "global_step": 295797, "epoch": 3563} {"train_loss": -25.61090660095215, "global_step": 295798, "epoch": 3563} {"train_loss": -25.37550163269043, "global_step": 295799, "epoch": 3563} {"train_loss": -25.590044021606445, "global_step": 295800, "epoch": 3563} {"train_loss": -25.54176902770996, "global_step": 295801, "epoch": 3563} {"train_loss": -25.865192413330078, "global_step": 295802, "epoch": 3563} {"train_loss": -25.745376586914062, "global_step": 295803, "epoch": 3563} {"train_loss": -25.93330192565918, "global_step": 295804, "epoch": 3563} {"train_loss": -25.486162185668945, "global_step": 295805, "epoch": 3563} {"train_loss": -25.405603408813477, "global_step": 295806, "epoch": 3563} {"train_loss": -25.630615234375, "global_step": 295807, "epoch": 3563} {"train_loss": -26.01991844177246, "global_step": 295808, "epoch": 3563} {"train_loss": -25.75341796875, "global_step": 295809, "epoch": 3563} {"train_loss": -25.579368591308594, "global_step": 295810, "epoch": 3563} {"train_loss": -25.05171945870641, "global_step": 295811, "epoch": 3563, "val_loss": 7192118.0} {"train_loss": -24.78203582763672, "global_step": 295812, "epoch": 3564} {"train_loss": -24.741992950439453, "global_step": 295813, "epoch": 3564} {"train_loss": -25.035173416137695, "global_step": 295814, "epoch": 3564} {"train_loss": -25.122892379760742, "global_step": 295815, "epoch": 3564} {"train_loss": -25.49929428100586, "global_step": 295816, "epoch": 3564} {"train_loss": -24.7293701171875, "global_step": 295817, "epoch": 3564} {"train_loss": -24.97707176208496, "global_step": 295818, "epoch": 3564} {"train_loss": -24.862417221069336, "global_step": 295819, "epoch": 3564} {"train_loss": -25.423383712768555, "global_step": 295820, "epoch": 3564} {"train_loss": -24.767955780029297, "global_step": 295821, "epoch": 3564} {"train_loss": -25.4224853515625, "global_step": 295822, "epoch": 3564} {"train_loss": -25.2824764251709, "global_step": 295823, "epoch": 3564} {"train_loss": -24.90891456604004, "global_step": 295824, "epoch": 3564} {"train_loss": -25.006223678588867, "global_step": 295825, "epoch": 3564} {"train_loss": -25.026813507080078, "global_step": 295826, "epoch": 3564} {"train_loss": -25.238100051879883, "global_step": 295827, "epoch": 3564} {"train_loss": -25.444568634033203, "global_step": 295828, "epoch": 3564} {"train_loss": -25.630552291870117, "global_step": 295829, "epoch": 3564} {"train_loss": -25.021196365356445, "global_step": 295830, "epoch": 3564} {"train_loss": -25.311620712280273, "global_step": 295831, "epoch": 3564} {"train_loss": -25.576156616210938, "global_step": 295832, "epoch": 3564} {"train_loss": -25.367969512939453, "global_step": 295833, "epoch": 3564} {"train_loss": -25.430002212524414, "global_step": 295834, "epoch": 3564} {"train_loss": -25.56831932067871, "global_step": 295835, "epoch": 3564} {"train_loss": -25.48170280456543, "global_step": 295836, "epoch": 3564} {"train_loss": -25.907190322875977, "global_step": 295837, "epoch": 3564} {"train_loss": -25.418928146362305, "global_step": 295838, "epoch": 3564} {"train_loss": -25.60613441467285, "global_step": 295839, "epoch": 3564} {"train_loss": -25.569311141967773, "global_step": 295840, "epoch": 3564} {"train_loss": -25.327787399291992, "global_step": 295841, "epoch": 3564} {"train_loss": -25.394683837890625, "global_step": 295842, "epoch": 3564} {"train_loss": -25.86488151550293, "global_step": 295843, "epoch": 3564} {"train_loss": -25.430299758911133, "global_step": 295844, "epoch": 3564} {"train_loss": -26.13387107849121, "global_step": 295845, "epoch": 3564} {"train_loss": -25.446533203125, "global_step": 295846, "epoch": 3564} {"train_loss": -25.92521095275879, "global_step": 295847, "epoch": 3564} {"train_loss": -25.43465232849121, "global_step": 295848, "epoch": 3564} {"train_loss": -25.939966201782227, "global_step": 295849, "epoch": 3564} {"train_loss": -25.61627769470215, "global_step": 295850, "epoch": 3564} {"train_loss": -25.803451538085938, "global_step": 295851, "epoch": 3564} {"train_loss": -25.761194229125977, "global_step": 295852, "epoch": 3564} {"train_loss": -25.730268478393555, "global_step": 295853, "epoch": 3564} {"train_loss": -25.83969497680664, "global_step": 295854, "epoch": 3564} {"train_loss": -25.225614547729492, "global_step": 295855, "epoch": 3564} {"train_loss": -25.39548683166504, "global_step": 295856, "epoch": 3564} {"train_loss": -25.232757568359375, "global_step": 295857, "epoch": 3564} {"train_loss": -25.215576171875, "global_step": 295858, "epoch": 3564} {"train_loss": -26.157079696655273, "global_step": 295859, "epoch": 3564} {"train_loss": -25.976551055908203, "global_step": 295860, "epoch": 3564} {"train_loss": -25.418411254882812, "global_step": 295861, "epoch": 3564} {"train_loss": -25.607141494750977, "global_step": 295862, "epoch": 3564} {"train_loss": -25.735700607299805, "global_step": 295863, "epoch": 3564} {"train_loss": -25.588531494140625, "global_step": 295864, "epoch": 3564} {"train_loss": -26.247339248657227, "global_step": 295865, "epoch": 3564} {"train_loss": -26.021162033081055, "global_step": 295866, "epoch": 3564} {"train_loss": -25.344043731689453, "global_step": 295867, "epoch": 3564} {"train_loss": -25.372739791870117, "global_step": 295868, "epoch": 3564} {"train_loss": -25.812519073486328, "global_step": 295869, "epoch": 3564} {"train_loss": -25.694629669189453, "global_step": 295870, "epoch": 3564} {"train_loss": -25.057458877563477, "global_step": 295871, "epoch": 3564} {"train_loss": -25.507680892944336, "global_step": 295872, "epoch": 3564} {"train_loss": -25.57581329345703, "global_step": 295873, "epoch": 3564} {"train_loss": -25.38654136657715, "global_step": 295874, "epoch": 3564} {"train_loss": -25.36422348022461, "global_step": 295875, "epoch": 3564} {"train_loss": -25.366470336914062, "global_step": 295876, "epoch": 3564} {"train_loss": -25.487457275390625, "global_step": 295877, "epoch": 3564} {"train_loss": -25.595396041870117, "global_step": 295878, "epoch": 3564} {"train_loss": -25.573627471923828, "global_step": 295879, "epoch": 3564} {"train_loss": -25.562698364257812, "global_step": 295880, "epoch": 3564} {"train_loss": -25.728689193725586, "global_step": 295881, "epoch": 3564} {"train_loss": -25.73282814025879, "global_step": 295882, "epoch": 3564} {"train_loss": -25.56477165222168, "global_step": 295883, "epoch": 3564} {"train_loss": -25.24601173400879, "global_step": 295884, "epoch": 3564} {"train_loss": -25.880460739135742, "global_step": 295885, "epoch": 3564} {"train_loss": -25.54229164123535, "global_step": 295886, "epoch": 3564} {"train_loss": -25.762222290039062, "global_step": 295887, "epoch": 3564} {"train_loss": -25.523834228515625, "global_step": 295888, "epoch": 3564} {"train_loss": -25.94952392578125, "global_step": 295889, "epoch": 3564} {"train_loss": -25.55753517150879, "global_step": 295890, "epoch": 3564} {"train_loss": -25.864072799682617, "global_step": 295891, "epoch": 3564} {"train_loss": -25.8604736328125, "global_step": 295892, "epoch": 3564} {"train_loss": -25.440343856811523, "global_step": 295893, "epoch": 3564} {"train_loss": -25.503687410469514, "global_step": 295894, "epoch": 3564, "val_loss": 7141122.0} {"train_loss": -25.536651611328125, "global_step": 295895, "epoch": 3565} {"train_loss": -24.74941635131836, "global_step": 295896, "epoch": 3565} {"train_loss": -24.423887252807617, "global_step": 295897, "epoch": 3565} {"train_loss": -24.888385772705078, "global_step": 295898, "epoch": 3565} {"train_loss": -24.34813690185547, "global_step": 295899, "epoch": 3565} {"train_loss": -24.424680709838867, "global_step": 295900, "epoch": 3565} {"train_loss": -24.346378326416016, "global_step": 295901, "epoch": 3565} {"train_loss": -24.868623733520508, "global_step": 295902, "epoch": 3565} {"train_loss": -25.1016845703125, "global_step": 295903, "epoch": 3565} {"train_loss": -24.609683990478516, "global_step": 295904, "epoch": 3565} {"train_loss": -24.936368942260742, "global_step": 295905, "epoch": 3565} {"train_loss": -24.852672576904297, "global_step": 295906, "epoch": 3565} {"train_loss": -24.798368453979492, "global_step": 295907, "epoch": 3565} {"train_loss": -24.96907615661621, "global_step": 295908, "epoch": 3565} {"train_loss": -25.218107223510742, "global_step": 295909, "epoch": 3565} {"train_loss": -25.03731346130371, "global_step": 295910, "epoch": 3565} {"train_loss": -25.031902313232422, "global_step": 295911, "epoch": 3565} {"train_loss": -24.807634353637695, "global_step": 295912, "epoch": 3565} {"train_loss": -24.740575790405273, "global_step": 295913, "epoch": 3565} {"train_loss": -25.257904052734375, "global_step": 295914, "epoch": 3565} {"train_loss": -25.354942321777344, "global_step": 295915, "epoch": 3565} {"train_loss": -25.3316593170166, "global_step": 295916, "epoch": 3565} {"train_loss": -25.457067489624023, "global_step": 295917, "epoch": 3565} {"train_loss": -25.42622947692871, "global_step": 295918, "epoch": 3565} {"train_loss": -25.42180824279785, "global_step": 295919, "epoch": 3565} {"train_loss": -25.43458366394043, "global_step": 295920, "epoch": 3565} {"train_loss": -25.646207809448242, "global_step": 295921, "epoch": 3565} {"train_loss": -25.382455825805664, "global_step": 295922, "epoch": 3565} {"train_loss": -25.300390243530273, "global_step": 295923, "epoch": 3565} {"train_loss": -25.731164932250977, "global_step": 295924, "epoch": 3565} {"train_loss": -25.394184112548828, "global_step": 295925, "epoch": 3565} {"train_loss": -25.216012954711914, "global_step": 295926, "epoch": 3565} {"train_loss": -25.23761749267578, "global_step": 295927, "epoch": 3565} {"train_loss": -25.705123901367188, "global_step": 295928, "epoch": 3565} {"train_loss": -25.496301651000977, "global_step": 295929, "epoch": 3565} {"train_loss": -25.485462188720703, "global_step": 295930, "epoch": 3565} {"train_loss": -26.062021255493164, "global_step": 295931, "epoch": 3565} {"train_loss": -25.26398277282715, "global_step": 295932, "epoch": 3565} {"train_loss": -25.645599365234375, "global_step": 295933, "epoch": 3565} {"train_loss": -25.49615478515625, "global_step": 295934, "epoch": 3565} {"train_loss": -25.531713485717773, "global_step": 295935, "epoch": 3565} {"train_loss": -25.596799850463867, "global_step": 295936, "epoch": 3565} {"train_loss": -25.826074600219727, "global_step": 295937, "epoch": 3565} {"train_loss": -25.687891006469727, "global_step": 295938, "epoch": 3565} {"train_loss": -25.77044677734375, "global_step": 295939, "epoch": 3565} {"train_loss": -25.29288101196289, "global_step": 295940, "epoch": 3565} {"train_loss": -25.65093421936035, "global_step": 295941, "epoch": 3565} {"train_loss": -25.30708122253418, "global_step": 295942, "epoch": 3565} {"train_loss": -25.8543758392334, "global_step": 295943, "epoch": 3565} {"train_loss": -25.707178115844727, "global_step": 295944, "epoch": 3565} {"train_loss": -25.525575637817383, "global_step": 295945, "epoch": 3565} {"train_loss": -25.816181182861328, "global_step": 295946, "epoch": 3565} {"train_loss": -25.832849502563477, "global_step": 295947, "epoch": 3565} {"train_loss": -25.73048210144043, "global_step": 295948, "epoch": 3565} {"train_loss": -25.771865844726562, "global_step": 295949, "epoch": 3565} {"train_loss": -25.41951560974121, "global_step": 295950, "epoch": 3565} {"train_loss": -25.477710723876953, "global_step": 295951, "epoch": 3565} {"train_loss": -25.424341201782227, "global_step": 295952, "epoch": 3565} {"train_loss": -25.545867919921875, "global_step": 295953, "epoch": 3565} {"train_loss": -25.33131217956543, "global_step": 295954, "epoch": 3565} {"train_loss": -25.221813201904297, "global_step": 295955, "epoch": 3565} {"train_loss": -25.73529052734375, "global_step": 295956, "epoch": 3565} {"train_loss": -25.339441299438477, "global_step": 295957, "epoch": 3565} {"train_loss": -25.222431182861328, "global_step": 295958, "epoch": 3565} {"train_loss": -25.167816162109375, "global_step": 295959, "epoch": 3565} {"train_loss": -25.611867904663086, "global_step": 295960, "epoch": 3565} {"train_loss": -25.264432907104492, "global_step": 295961, "epoch": 3565} {"train_loss": -25.374536514282227, "global_step": 295962, "epoch": 3565} {"train_loss": -25.290807723999023, "global_step": 295963, "epoch": 3565} {"train_loss": -25.302051544189453, "global_step": 295964, "epoch": 3565} {"train_loss": -25.299816131591797, "global_step": 295965, "epoch": 3565} {"train_loss": -25.467100143432617, "global_step": 295966, "epoch": 3565} {"train_loss": -25.45111083984375, "global_step": 295967, "epoch": 3565} {"train_loss": -25.560787200927734, "global_step": 295968, "epoch": 3565} {"train_loss": -25.904296875, "global_step": 295969, "epoch": 3565} {"train_loss": -25.468338012695312, "global_step": 295970, "epoch": 3565} {"train_loss": -25.491168975830078, "global_step": 295971, "epoch": 3565} {"train_loss": -25.263879776000977, "global_step": 295972, "epoch": 3565} {"train_loss": -25.613910675048828, "global_step": 295973, "epoch": 3565} {"train_loss": -25.194305419921875, "global_step": 295974, "epoch": 3565} {"train_loss": -25.792617797851562, "global_step": 295975, "epoch": 3565} {"train_loss": -25.21872901916504, "global_step": 295976, "epoch": 3565} {"train_loss": -25.336120651428956, "global_step": 295977, "epoch": 3565, "val_loss": 7221252.0} {"train_loss": -24.346677780151367, "global_step": 295978, "epoch": 3566} {"train_loss": -25.11043357849121, "global_step": 295979, "epoch": 3566} {"train_loss": -25.48832893371582, "global_step": 295980, "epoch": 3566} {"train_loss": -25.10495376586914, "global_step": 295981, "epoch": 3566} {"train_loss": -24.693906784057617, "global_step": 295982, "epoch": 3566} {"train_loss": -25.600696563720703, "global_step": 295983, "epoch": 3566} {"train_loss": -25.675952911376953, "global_step": 295984, "epoch": 3566} {"train_loss": -25.42302131652832, "global_step": 295985, "epoch": 3566} {"train_loss": -25.3498477935791, "global_step": 295986, "epoch": 3566} {"train_loss": -25.230457305908203, "global_step": 295987, "epoch": 3566} {"train_loss": -25.786890029907227, "global_step": 295988, "epoch": 3566} {"train_loss": -25.570377349853516, "global_step": 295989, "epoch": 3566} {"train_loss": -25.437307357788086, "global_step": 295990, "epoch": 3566} {"train_loss": -25.635751724243164, "global_step": 295991, "epoch": 3566} {"train_loss": -25.502267837524414, "global_step": 295992, "epoch": 3566} {"train_loss": -25.653955459594727, "global_step": 295993, "epoch": 3566} {"train_loss": -25.615264892578125, "global_step": 295994, "epoch": 3566} {"train_loss": -25.655670166015625, "global_step": 295995, "epoch": 3566} {"train_loss": -25.712753295898438, "global_step": 295996, "epoch": 3566} {"train_loss": -25.462383270263672, "global_step": 295997, "epoch": 3566} {"train_loss": -25.845245361328125, "global_step": 295998, "epoch": 3566} {"train_loss": -25.517826080322266, "global_step": 295999, "epoch": 3566} {"train_loss": -25.542308807373047, "global_step": 296000, "epoch": 3566} {"train_loss": -25.757038116455078, "global_step": 296001, "epoch": 3566} {"train_loss": -25.94140625, "global_step": 296002, "epoch": 3566} {"train_loss": -25.830236434936523, "global_step": 296003, "epoch": 3566} {"train_loss": -25.851654052734375, "global_step": 296004, "epoch": 3566} {"train_loss": -25.9113712310791, "global_step": 296005, "epoch": 3566} {"train_loss": -25.31682586669922, "global_step": 296006, "epoch": 3566} {"train_loss": -25.54184913635254, "global_step": 296007, "epoch": 3566} {"train_loss": -25.76997184753418, "global_step": 296008, "epoch": 3566} {"train_loss": -25.69614028930664, "global_step": 296009, "epoch": 3566} {"train_loss": -25.668806076049805, "global_step": 296010, "epoch": 3566} {"train_loss": -25.984210968017578, "global_step": 296011, "epoch": 3566} {"train_loss": -25.33867073059082, "global_step": 296012, "epoch": 3566} {"train_loss": -25.971176147460938, "global_step": 296013, "epoch": 3566} {"train_loss": -25.314565658569336, "global_step": 296014, "epoch": 3566} {"train_loss": -25.65884780883789, "global_step": 296015, "epoch": 3566} {"train_loss": -25.501707077026367, "global_step": 296016, "epoch": 3566} {"train_loss": -25.5445499420166, "global_step": 296017, "epoch": 3566} {"train_loss": -25.6804256439209, "global_step": 296018, "epoch": 3566} {"train_loss": -25.66633415222168, "global_step": 296019, "epoch": 3566} {"train_loss": -25.683765411376953, "global_step": 296020, "epoch": 3566} {"train_loss": -25.60908317565918, "global_step": 296021, "epoch": 3566} {"train_loss": -25.385395050048828, "global_step": 296022, "epoch": 3566} {"train_loss": -25.175312042236328, "global_step": 296023, "epoch": 3566} {"train_loss": -25.511335372924805, "global_step": 296024, "epoch": 3566} {"train_loss": -25.6480712890625, "global_step": 296025, "epoch": 3566} {"train_loss": -25.46583366394043, "global_step": 296026, "epoch": 3566} {"train_loss": -25.667343139648438, "global_step": 296027, "epoch": 3566} {"train_loss": -25.79837989807129, "global_step": 296028, "epoch": 3566} {"train_loss": -25.305768966674805, "global_step": 296029, "epoch": 3566} {"train_loss": -25.41761589050293, "global_step": 296030, "epoch": 3566} {"train_loss": -25.682586669921875, "global_step": 296031, "epoch": 3566} {"train_loss": -25.740095138549805, "global_step": 296032, "epoch": 3566} {"train_loss": -25.834142684936523, "global_step": 296033, "epoch": 3566} {"train_loss": -25.315370559692383, "global_step": 296034, "epoch": 3566} {"train_loss": -25.586706161499023, "global_step": 296035, "epoch": 3566} {"train_loss": -25.693571090698242, "global_step": 296036, "epoch": 3566} {"train_loss": -25.808364868164062, "global_step": 296037, "epoch": 3566} {"train_loss": -25.7991943359375, "global_step": 296038, "epoch": 3566} {"train_loss": -25.7606143951416, "global_step": 296039, "epoch": 3566} {"train_loss": -25.708465576171875, "global_step": 296040, "epoch": 3566} {"train_loss": -25.612201690673828, "global_step": 296041, "epoch": 3566} {"train_loss": -25.81044578552246, "global_step": 296042, "epoch": 3566} {"train_loss": -25.77589225769043, "global_step": 296043, "epoch": 3566} {"train_loss": -25.839895248413086, "global_step": 296044, "epoch": 3566} {"train_loss": -25.628082275390625, "global_step": 296045, "epoch": 3566} {"train_loss": -25.69488525390625, "global_step": 296046, "epoch": 3566} {"train_loss": -25.57736587524414, "global_step": 296047, "epoch": 3566} {"train_loss": -25.62526512145996, "global_step": 296048, "epoch": 3566} {"train_loss": -25.74550437927246, "global_step": 296049, "epoch": 3566} {"train_loss": -26.179351806640625, "global_step": 296050, "epoch": 3566} {"train_loss": -25.81198501586914, "global_step": 296051, "epoch": 3566} {"train_loss": -25.66180992126465, "global_step": 296052, "epoch": 3566} {"train_loss": -25.9887752532959, "global_step": 296053, "epoch": 3566} {"train_loss": -25.82227897644043, "global_step": 296054, "epoch": 3566} {"train_loss": -25.543045043945312, "global_step": 296055, "epoch": 3566} {"train_loss": -25.666213989257812, "global_step": 296056, "epoch": 3566} {"train_loss": -25.724294662475586, "global_step": 296057, "epoch": 3566} {"train_loss": -26.024723052978516, "global_step": 296058, "epoch": 3566} {"train_loss": -25.681039810180664, "global_step": 296059, "epoch": 3566} {"train_loss": -25.601702977375812, "global_step": 296060, "epoch": 3566, "val_loss": 7157722.5} {"train_loss": -25.048171997070312, "global_step": 296061, "epoch": 3567} {"train_loss": -23.880874633789062, "global_step": 296062, "epoch": 3567} {"train_loss": -23.515308380126953, "global_step": 296063, "epoch": 3567} {"train_loss": -24.229949951171875, "global_step": 296064, "epoch": 3567} {"train_loss": -25.00282859802246, "global_step": 296065, "epoch": 3567} {"train_loss": -25.01540184020996, "global_step": 296066, "epoch": 3567} {"train_loss": -24.90119743347168, "global_step": 296067, "epoch": 3567} {"train_loss": -24.99366569519043, "global_step": 296068, "epoch": 3567} {"train_loss": -25.21175765991211, "global_step": 296069, "epoch": 3567} {"train_loss": -25.276527404785156, "global_step": 296070, "epoch": 3567} {"train_loss": -25.339506149291992, "global_step": 296071, "epoch": 3567} {"train_loss": -24.88016128540039, "global_step": 296072, "epoch": 3567} {"train_loss": -25.44010353088379, "global_step": 296073, "epoch": 3567} {"train_loss": -25.235464096069336, "global_step": 296074, "epoch": 3567} {"train_loss": -25.245853424072266, "global_step": 296075, "epoch": 3567} {"train_loss": -25.511362075805664, "global_step": 296076, "epoch": 3567} {"train_loss": -25.48982048034668, "global_step": 296077, "epoch": 3567} {"train_loss": -25.284635543823242, "global_step": 296078, "epoch": 3567} {"train_loss": -25.596038818359375, "global_step": 296079, "epoch": 3567} {"train_loss": -25.468276977539062, "global_step": 296080, "epoch": 3567} {"train_loss": -25.53595542907715, "global_step": 296081, "epoch": 3567} {"train_loss": -25.64301872253418, "global_step": 296082, "epoch": 3567} {"train_loss": -25.3365535736084, "global_step": 296083, "epoch": 3567} {"train_loss": -25.39823341369629, "global_step": 296084, "epoch": 3567} {"train_loss": -25.302467346191406, "global_step": 296085, "epoch": 3567} {"train_loss": -25.110435485839844, "global_step": 296086, "epoch": 3567} {"train_loss": -25.7220458984375, "global_step": 296087, "epoch": 3567} {"train_loss": -25.52680015563965, "global_step": 296088, "epoch": 3567} {"train_loss": -25.386178970336914, "global_step": 296089, "epoch": 3567} {"train_loss": -25.647480010986328, "global_step": 296090, "epoch": 3567} {"train_loss": -25.69915771484375, "global_step": 296091, "epoch": 3567} {"train_loss": -25.733325958251953, "global_step": 296092, "epoch": 3567} {"train_loss": -25.936613082885742, "global_step": 296093, "epoch": 3567} {"train_loss": -25.890445709228516, "global_step": 296094, "epoch": 3567} {"train_loss": -25.974842071533203, "global_step": 296095, "epoch": 3567} {"train_loss": -25.754507064819336, "global_step": 296096, "epoch": 3567} {"train_loss": -25.936941146850586, "global_step": 296097, "epoch": 3567} {"train_loss": -25.7221622467041, "global_step": 296098, "epoch": 3567} {"train_loss": -25.74603843688965, "global_step": 296099, "epoch": 3567} {"train_loss": -25.56447410583496, "global_step": 296100, "epoch": 3567} {"train_loss": -25.857816696166992, "global_step": 296101, "epoch": 3567} {"train_loss": -25.743228912353516, "global_step": 296102, "epoch": 3567} {"train_loss": -25.747522354125977, "global_step": 296103, "epoch": 3567} {"train_loss": -25.671850204467773, "global_step": 296104, "epoch": 3567} {"train_loss": -25.883710861206055, "global_step": 296105, "epoch": 3567} {"train_loss": -25.311996459960938, "global_step": 296106, "epoch": 3567} {"train_loss": -25.8035888671875, "global_step": 296107, "epoch": 3567} {"train_loss": -25.512556076049805, "global_step": 296108, "epoch": 3567} {"train_loss": -25.54817771911621, "global_step": 296109, "epoch": 3567} {"train_loss": -25.74614906311035, "global_step": 296110, "epoch": 3567} {"train_loss": -25.61712074279785, "global_step": 296111, "epoch": 3567} {"train_loss": -25.906213760375977, "global_step": 296112, "epoch": 3567} {"train_loss": -25.654407501220703, "global_step": 296113, "epoch": 3567} {"train_loss": -25.871753692626953, "global_step": 296114, "epoch": 3567} {"train_loss": -25.55483055114746, "global_step": 296115, "epoch": 3567} {"train_loss": -25.766448974609375, "global_step": 296116, "epoch": 3567} {"train_loss": -25.824155807495117, "global_step": 296117, "epoch": 3567} {"train_loss": -25.569110870361328, "global_step": 296118, "epoch": 3567} {"train_loss": -25.554798126220703, "global_step": 296119, "epoch": 3567} {"train_loss": -25.583518981933594, "global_step": 296120, "epoch": 3567} {"train_loss": -25.622943878173828, "global_step": 296121, "epoch": 3567} {"train_loss": -25.559864044189453, "global_step": 296122, "epoch": 3567} {"train_loss": -25.74628257751465, "global_step": 296123, "epoch": 3567} {"train_loss": -25.952590942382812, "global_step": 296124, "epoch": 3567} {"train_loss": -25.731613159179688, "global_step": 296125, "epoch": 3567} {"train_loss": -25.539403915405273, "global_step": 296126, "epoch": 3567} {"train_loss": -25.620319366455078, "global_step": 296127, "epoch": 3567} {"train_loss": -26.002649307250977, "global_step": 296128, "epoch": 3567} {"train_loss": -25.42520523071289, "global_step": 296129, "epoch": 3567} {"train_loss": -25.644412994384766, "global_step": 296130, "epoch": 3567} {"train_loss": -25.74251365661621, "global_step": 296131, "epoch": 3567} {"train_loss": -26.1422061920166, "global_step": 296132, "epoch": 3567} {"train_loss": -25.648574829101562, "global_step": 296133, "epoch": 3567} {"train_loss": -25.524518966674805, "global_step": 296134, "epoch": 3567} {"train_loss": -25.554304122924805, "global_step": 296135, "epoch": 3567} {"train_loss": -25.756793975830078, "global_step": 296136, "epoch": 3567} {"train_loss": -25.691679000854492, "global_step": 296137, "epoch": 3567} {"train_loss": -25.7242374420166, "global_step": 296138, "epoch": 3567} {"train_loss": -25.892820358276367, "global_step": 296139, "epoch": 3567} {"train_loss": -25.5233154296875, "global_step": 296140, "epoch": 3567} {"train_loss": -25.8154354095459, "global_step": 296141, "epoch": 3567} {"train_loss": -25.484891891479492, "global_step": 296142, "epoch": 3567} {"train_loss": -25.509322982236565, "global_step": 296143, "epoch": 3567, "val_loss": 7177200.0} {"train_loss": -25.322050094604492, "global_step": 296144, "epoch": 3568} {"train_loss": -24.712617874145508, "global_step": 296145, "epoch": 3568} {"train_loss": -25.20082664489746, "global_step": 296146, "epoch": 3568} {"train_loss": -25.51416015625, "global_step": 296147, "epoch": 3568} {"train_loss": -24.89958953857422, "global_step": 296148, "epoch": 3568} {"train_loss": -24.884151458740234, "global_step": 296149, "epoch": 3568} {"train_loss": -25.50632667541504, "global_step": 296150, "epoch": 3568} {"train_loss": -25.331512451171875, "global_step": 296151, "epoch": 3568} {"train_loss": -24.946321487426758, "global_step": 296152, "epoch": 3568} {"train_loss": -25.550819396972656, "global_step": 296153, "epoch": 3568} {"train_loss": -25.3084716796875, "global_step": 296154, "epoch": 3568} {"train_loss": -25.340946197509766, "global_step": 296155, "epoch": 3568} {"train_loss": -25.233036041259766, "global_step": 296156, "epoch": 3568} {"train_loss": -25.21197509765625, "global_step": 296157, "epoch": 3568} {"train_loss": -25.289663314819336, "global_step": 296158, "epoch": 3568} {"train_loss": -25.254545211791992, "global_step": 296159, "epoch": 3568} {"train_loss": -25.72993278503418, "global_step": 296160, "epoch": 3568} {"train_loss": -25.711029052734375, "global_step": 296161, "epoch": 3568} {"train_loss": -25.327505111694336, "global_step": 296162, "epoch": 3568} {"train_loss": -25.423826217651367, "global_step": 296163, "epoch": 3568} {"train_loss": -25.63982582092285, "global_step": 296164, "epoch": 3568} {"train_loss": -25.306432723999023, "global_step": 296165, "epoch": 3568} {"train_loss": -25.63746452331543, "global_step": 296166, "epoch": 3568} {"train_loss": -25.86445426940918, "global_step": 296167, "epoch": 3568} {"train_loss": -24.957921981811523, "global_step": 296168, "epoch": 3568} {"train_loss": -25.365324020385742, "global_step": 296169, "epoch": 3568} {"train_loss": -25.54218101501465, "global_step": 296170, "epoch": 3568} {"train_loss": -25.8408203125, "global_step": 296171, "epoch": 3568} {"train_loss": -25.45728302001953, "global_step": 296172, "epoch": 3568} {"train_loss": -25.54172134399414, "global_step": 296173, "epoch": 3568} {"train_loss": -25.467668533325195, "global_step": 296174, "epoch": 3568} {"train_loss": -25.432126998901367, "global_step": 296175, "epoch": 3568} {"train_loss": -25.45474624633789, "global_step": 296176, "epoch": 3568} {"train_loss": -25.661863327026367, "global_step": 296177, "epoch": 3568} {"train_loss": -25.5885066986084, "global_step": 296178, "epoch": 3568} {"train_loss": -25.58839988708496, "global_step": 296179, "epoch": 3568} {"train_loss": -25.80453872680664, "global_step": 296180, "epoch": 3568} {"train_loss": -25.580270767211914, "global_step": 296181, "epoch": 3568} {"train_loss": -25.505821228027344, "global_step": 296182, "epoch": 3568} {"train_loss": -25.406917572021484, "global_step": 296183, "epoch": 3568} {"train_loss": -25.7739200592041, "global_step": 296184, "epoch": 3568} {"train_loss": -25.15096092224121, "global_step": 296185, "epoch": 3568} {"train_loss": -25.7796630859375, "global_step": 296186, "epoch": 3568} {"train_loss": -25.506494522094727, "global_step": 296187, "epoch": 3568} {"train_loss": -25.327268600463867, "global_step": 296188, "epoch": 3568} {"train_loss": -25.84198570251465, "global_step": 296189, "epoch": 3568} {"train_loss": -25.391820907592773, "global_step": 296190, "epoch": 3568} {"train_loss": -25.627567291259766, "global_step": 296191, "epoch": 3568} {"train_loss": -25.583288192749023, "global_step": 296192, "epoch": 3568} {"train_loss": -25.730398178100586, "global_step": 296193, "epoch": 3568} {"train_loss": -25.93926429748535, "global_step": 296194, "epoch": 3568} {"train_loss": -25.673486709594727, "global_step": 296195, "epoch": 3568} {"train_loss": -25.64170265197754, "global_step": 296196, "epoch": 3568} {"train_loss": -26.198278427124023, "global_step": 296197, "epoch": 3568} {"train_loss": -25.810577392578125, "global_step": 296198, "epoch": 3568} {"train_loss": -25.55072593688965, "global_step": 296199, "epoch": 3568} {"train_loss": -25.49494743347168, "global_step": 296200, "epoch": 3568} {"train_loss": -25.437253952026367, "global_step": 296201, "epoch": 3568} {"train_loss": -25.6248836517334, "global_step": 296202, "epoch": 3568} {"train_loss": -25.87689208984375, "global_step": 296203, "epoch": 3568} {"train_loss": -25.938465118408203, "global_step": 296204, "epoch": 3568} {"train_loss": -25.60199546813965, "global_step": 296205, "epoch": 3568} {"train_loss": -25.885862350463867, "global_step": 296206, "epoch": 3568} {"train_loss": -25.53615379333496, "global_step": 296207, "epoch": 3568} {"train_loss": -25.413846969604492, "global_step": 296208, "epoch": 3568} {"train_loss": -25.730091094970703, "global_step": 296209, "epoch": 3568} {"train_loss": -25.536680221557617, "global_step": 296210, "epoch": 3568} {"train_loss": -26.022775650024414, "global_step": 296211, "epoch": 3568} {"train_loss": -25.570133209228516, "global_step": 296212, "epoch": 3568} {"train_loss": -25.763782501220703, "global_step": 296213, "epoch": 3568} {"train_loss": -25.97852897644043, "global_step": 296214, "epoch": 3568} {"train_loss": -25.537349700927734, "global_step": 296215, "epoch": 3568} {"train_loss": -25.8342342376709, "global_step": 296216, "epoch": 3568} {"train_loss": -25.62497901916504, "global_step": 296217, "epoch": 3568} {"train_loss": -25.565114974975586, "global_step": 296218, "epoch": 3568} {"train_loss": -25.877012252807617, "global_step": 296219, "epoch": 3568} {"train_loss": -25.1478214263916, "global_step": 296220, "epoch": 3568} {"train_loss": -25.55476951599121, "global_step": 296221, "epoch": 3568} {"train_loss": -25.555288314819336, "global_step": 296222, "epoch": 3568} {"train_loss": -26.092334747314453, "global_step": 296223, "epoch": 3568} {"train_loss": -25.885961532592773, "global_step": 296224, "epoch": 3568} {"train_loss": -25.583433151245117, "global_step": 296225, "epoch": 3568} {"train_loss": -25.557536343494093, "global_step": 296226, "epoch": 3568, "val_loss": 7241770.0} {"train_loss": -25.626489639282227, "global_step": 296227, "epoch": 3569} {"train_loss": -25.281919479370117, "global_step": 296228, "epoch": 3569} {"train_loss": -25.254676818847656, "global_step": 296229, "epoch": 3569} {"train_loss": -25.822101593017578, "global_step": 296230, "epoch": 3569} {"train_loss": -25.608875274658203, "global_step": 296231, "epoch": 3569} {"train_loss": -25.229225158691406, "global_step": 296232, "epoch": 3569} {"train_loss": -25.341238021850586, "global_step": 296233, "epoch": 3569} {"train_loss": -25.583097457885742, "global_step": 296234, "epoch": 3569} {"train_loss": -25.34109115600586, "global_step": 296235, "epoch": 3569} {"train_loss": -25.109315872192383, "global_step": 296236, "epoch": 3569} {"train_loss": -25.378210067749023, "global_step": 296237, "epoch": 3569} {"train_loss": -25.20973014831543, "global_step": 296238, "epoch": 3569} {"train_loss": -25.70833396911621, "global_step": 296239, "epoch": 3569} {"train_loss": -25.380481719970703, "global_step": 296240, "epoch": 3569} {"train_loss": -25.265321731567383, "global_step": 296241, "epoch": 3569} {"train_loss": -24.93046760559082, "global_step": 296242, "epoch": 3569} {"train_loss": -25.396116256713867, "global_step": 296243, "epoch": 3569} {"train_loss": -25.271930694580078, "global_step": 296244, "epoch": 3569} {"train_loss": -25.168180465698242, "global_step": 296245, "epoch": 3569} {"train_loss": -25.690418243408203, "global_step": 296246, "epoch": 3569} {"train_loss": -25.720197677612305, "global_step": 296247, "epoch": 3569} {"train_loss": -25.580148696899414, "global_step": 296248, "epoch": 3569} {"train_loss": -25.53139305114746, "global_step": 296249, "epoch": 3569} {"train_loss": -25.024978637695312, "global_step": 296250, "epoch": 3569} {"train_loss": -25.767057418823242, "global_step": 296251, "epoch": 3569} {"train_loss": -25.718393325805664, "global_step": 296252, "epoch": 3569} {"train_loss": -25.40813446044922, "global_step": 296253, "epoch": 3569} {"train_loss": -25.22113037109375, "global_step": 296254, "epoch": 3569} {"train_loss": -25.471467971801758, "global_step": 296255, "epoch": 3569} {"train_loss": -25.753732681274414, "global_step": 296256, "epoch": 3569} {"train_loss": -25.333765029907227, "global_step": 296257, "epoch": 3569} {"train_loss": -25.749963760375977, "global_step": 296258, "epoch": 3569} {"train_loss": -25.550655364990234, "global_step": 296259, "epoch": 3569} {"train_loss": -25.748289108276367, "global_step": 296260, "epoch": 3569} {"train_loss": -25.68458366394043, "global_step": 296261, "epoch": 3569} {"train_loss": -25.942325592041016, "global_step": 296262, "epoch": 3569} {"train_loss": -25.58726692199707, "global_step": 296263, "epoch": 3569} {"train_loss": -25.585546493530273, "global_step": 296264, "epoch": 3569} {"train_loss": -25.60401725769043, "global_step": 296265, "epoch": 3569} {"train_loss": -25.626911163330078, "global_step": 296266, "epoch": 3569} {"train_loss": -25.888294219970703, "global_step": 296267, "epoch": 3569} {"train_loss": -25.267261505126953, "global_step": 296268, "epoch": 3569} {"train_loss": -25.834426879882812, "global_step": 296269, "epoch": 3569} {"train_loss": -25.81143569946289, "global_step": 296270, "epoch": 3569} {"train_loss": -25.67390251159668, "global_step": 296271, "epoch": 3569} {"train_loss": -25.57781219482422, "global_step": 296272, "epoch": 3569} {"train_loss": -25.694717407226562, "global_step": 296273, "epoch": 3569} {"train_loss": -25.489547729492188, "global_step": 296274, "epoch": 3569} {"train_loss": -25.486743927001953, "global_step": 296275, "epoch": 3569} {"train_loss": -25.8681583404541, "global_step": 296276, "epoch": 3569} {"train_loss": -25.851110458374023, "global_step": 296277, "epoch": 3569} {"train_loss": -25.852371215820312, "global_step": 296278, "epoch": 3569} {"train_loss": -25.624658584594727, "global_step": 296279, "epoch": 3569} {"train_loss": -25.81671714782715, "global_step": 296280, "epoch": 3569} {"train_loss": -25.47450065612793, "global_step": 296281, "epoch": 3569} {"train_loss": -25.523923873901367, "global_step": 296282, "epoch": 3569} {"train_loss": -25.6002254486084, "global_step": 296283, "epoch": 3569} {"train_loss": -25.55620765686035, "global_step": 296284, "epoch": 3569} {"train_loss": -25.31491470336914, "global_step": 296285, "epoch": 3569} {"train_loss": -25.821063995361328, "global_step": 296286, "epoch": 3569} {"train_loss": -25.829498291015625, "global_step": 296287, "epoch": 3569} {"train_loss": -25.613574981689453, "global_step": 296288, "epoch": 3569} {"train_loss": -25.285146713256836, "global_step": 296289, "epoch": 3569} {"train_loss": -25.630863189697266, "global_step": 296290, "epoch": 3569} {"train_loss": -25.585411071777344, "global_step": 296291, "epoch": 3569} {"train_loss": -25.592981338500977, "global_step": 296292, "epoch": 3569} {"train_loss": -25.638708114624023, "global_step": 296293, "epoch": 3569} {"train_loss": -25.553638458251953, "global_step": 296294, "epoch": 3569} {"train_loss": -25.94138526916504, "global_step": 296295, "epoch": 3569} {"train_loss": -25.555641174316406, "global_step": 296296, "epoch": 3569} {"train_loss": -25.704862594604492, "global_step": 296297, "epoch": 3569} {"train_loss": -25.39322853088379, "global_step": 296298, "epoch": 3569} {"train_loss": -24.859594345092773, "global_step": 296299, "epoch": 3569} {"train_loss": -25.64761734008789, "global_step": 296300, "epoch": 3569} {"train_loss": -25.16823387145996, "global_step": 296301, "epoch": 3569} {"train_loss": -25.2435245513916, "global_step": 296302, "epoch": 3569} {"train_loss": -25.301206588745117, "global_step": 296303, "epoch": 3569} {"train_loss": -25.453950881958008, "global_step": 296304, "epoch": 3569} {"train_loss": -25.685842514038086, "global_step": 296305, "epoch": 3569} {"train_loss": -25.68927574157715, "global_step": 296306, "epoch": 3569} {"train_loss": -25.448883056640625, "global_step": 296307, "epoch": 3569} {"train_loss": -25.670089721679688, "global_step": 296308, "epoch": 3569} {"train_loss": -25.53985464716532, "global_step": 296309, "epoch": 3569, "val_loss": 7234942.0} {"train_loss": -25.07735252380371, "global_step": 296310, "epoch": 3570} {"train_loss": -24.74047088623047, "global_step": 296311, "epoch": 3570} {"train_loss": -25.05901527404785, "global_step": 296312, "epoch": 3570} {"train_loss": -24.857797622680664, "global_step": 296313, "epoch": 3570} {"train_loss": -25.342140197753906, "global_step": 296314, "epoch": 3570} {"train_loss": -25.192546844482422, "global_step": 296315, "epoch": 3570} {"train_loss": -25.707067489624023, "global_step": 296316, "epoch": 3570} {"train_loss": -25.43428611755371, "global_step": 296317, "epoch": 3570} {"train_loss": -25.0580997467041, "global_step": 296318, "epoch": 3570} {"train_loss": -25.397939682006836, "global_step": 296319, "epoch": 3570} {"train_loss": -25.333477020263672, "global_step": 296320, "epoch": 3570} {"train_loss": -25.43280601501465, "global_step": 296321, "epoch": 3570} {"train_loss": -25.957727432250977, "global_step": 296322, "epoch": 3570} {"train_loss": -25.570270538330078, "global_step": 296323, "epoch": 3570} {"train_loss": -25.74530601501465, "global_step": 296324, "epoch": 3570} {"train_loss": -25.6627140045166, "global_step": 296325, "epoch": 3570} {"train_loss": -25.61482048034668, "global_step": 296326, "epoch": 3570} {"train_loss": -25.48687171936035, "global_step": 296327, "epoch": 3570} {"train_loss": -25.590818405151367, "global_step": 296328, "epoch": 3570} {"train_loss": -25.04920768737793, "global_step": 296329, "epoch": 3570} {"train_loss": -25.599069595336914, "global_step": 296330, "epoch": 3570} {"train_loss": -25.641584396362305, "global_step": 296331, "epoch": 3570} {"train_loss": -24.97320556640625, "global_step": 296332, "epoch": 3570} {"train_loss": -25.4841365814209, "global_step": 296333, "epoch": 3570} {"train_loss": -25.042484283447266, "global_step": 296334, "epoch": 3570} {"train_loss": -25.508337020874023, "global_step": 296335, "epoch": 3570} {"train_loss": -25.05417251586914, "global_step": 296336, "epoch": 3570} {"train_loss": -25.22291374206543, "global_step": 296337, "epoch": 3570} {"train_loss": -25.33163833618164, "global_step": 296338, "epoch": 3570} {"train_loss": -25.643020629882812, "global_step": 296339, "epoch": 3570} {"train_loss": -25.439878463745117, "global_step": 296340, "epoch": 3570} {"train_loss": -25.670141220092773, "global_step": 296341, "epoch": 3570} {"train_loss": -25.634521484375, "global_step": 296342, "epoch": 3570} {"train_loss": -25.35116958618164, "global_step": 296343, "epoch": 3570} {"train_loss": -25.71453857421875, "global_step": 296344, "epoch": 3570} {"train_loss": -25.215253829956055, "global_step": 296345, "epoch": 3570} {"train_loss": -25.171899795532227, "global_step": 296346, "epoch": 3570} {"train_loss": -25.609262466430664, "global_step": 296347, "epoch": 3570} {"train_loss": -25.509714126586914, "global_step": 296348, "epoch": 3570} {"train_loss": -25.272167205810547, "global_step": 296349, "epoch": 3570} {"train_loss": -25.721731185913086, "global_step": 296350, "epoch": 3570} {"train_loss": -25.237268447875977, "global_step": 296351, "epoch": 3570} {"train_loss": -25.372488021850586, "global_step": 296352, "epoch": 3570} {"train_loss": -25.57892417907715, "global_step": 296353, "epoch": 3570} {"train_loss": -25.15993309020996, "global_step": 296354, "epoch": 3570} {"train_loss": -25.281484603881836, "global_step": 296355, "epoch": 3570} {"train_loss": -25.7059326171875, "global_step": 296356, "epoch": 3570} {"train_loss": -25.809528350830078, "global_step": 296357, "epoch": 3570} {"train_loss": -25.3779239654541, "global_step": 296358, "epoch": 3570} {"train_loss": -25.753387451171875, "global_step": 296359, "epoch": 3570} {"train_loss": -25.48573875427246, "global_step": 296360, "epoch": 3570} {"train_loss": -25.459186553955078, "global_step": 296361, "epoch": 3570} {"train_loss": -25.643665313720703, "global_step": 296362, "epoch": 3570} {"train_loss": -25.801116943359375, "global_step": 296363, "epoch": 3570} {"train_loss": -25.5240535736084, "global_step": 296364, "epoch": 3570} {"train_loss": -25.411231994628906, "global_step": 296365, "epoch": 3570} {"train_loss": -25.218976974487305, "global_step": 296366, "epoch": 3570} {"train_loss": -25.890731811523438, "global_step": 296367, "epoch": 3570} {"train_loss": -25.506481170654297, "global_step": 296368, "epoch": 3570} {"train_loss": -25.941232681274414, "global_step": 296369, "epoch": 3570} {"train_loss": -25.931690216064453, "global_step": 296370, "epoch": 3570} {"train_loss": -25.85107421875, "global_step": 296371, "epoch": 3570} {"train_loss": -25.82673454284668, "global_step": 296372, "epoch": 3570} {"train_loss": -25.740406036376953, "global_step": 296373, "epoch": 3570} {"train_loss": -26.050704956054688, "global_step": 296374, "epoch": 3570} {"train_loss": -25.974218368530273, "global_step": 296375, "epoch": 3570} {"train_loss": -25.7769775390625, "global_step": 296376, "epoch": 3570} {"train_loss": -25.931257247924805, "global_step": 296377, "epoch": 3570} {"train_loss": -25.98833656311035, "global_step": 296378, "epoch": 3570} {"train_loss": -25.816009521484375, "global_step": 296379, "epoch": 3570} {"train_loss": -25.661151885986328, "global_step": 296380, "epoch": 3570} {"train_loss": -25.71170425415039, "global_step": 296381, "epoch": 3570} {"train_loss": -25.637678146362305, "global_step": 296382, "epoch": 3570} {"train_loss": -25.42744255065918, "global_step": 296383, "epoch": 3570} {"train_loss": -25.48007583618164, "global_step": 296384, "epoch": 3570} {"train_loss": -25.595582962036133, "global_step": 296385, "epoch": 3570} {"train_loss": -25.369068145751953, "global_step": 296386, "epoch": 3570} {"train_loss": -25.72115135192871, "global_step": 296387, "epoch": 3570} {"train_loss": -25.618881225585938, "global_step": 296388, "epoch": 3570} {"train_loss": -26.009984970092773, "global_step": 296389, "epoch": 3570} {"train_loss": -25.629745483398438, "global_step": 296390, "epoch": 3570} {"train_loss": -25.28513526916504, "global_step": 296391, "epoch": 3570} {"train_loss": -25.504967999745563, "global_step": 296392, "epoch": 3570, "val_loss": 7081145.5} {"train_loss": -24.49946403503418, "global_step": 296393, "epoch": 3571} {"train_loss": -24.48557472229004, "global_step": 296394, "epoch": 3571} {"train_loss": -25.082014083862305, "global_step": 296395, "epoch": 3571} {"train_loss": -24.556211471557617, "global_step": 296396, "epoch": 3571} {"train_loss": -24.547204971313477, "global_step": 296397, "epoch": 3571} {"train_loss": -25.06190299987793, "global_step": 296398, "epoch": 3571} {"train_loss": -24.963895797729492, "global_step": 296399, "epoch": 3571} {"train_loss": -25.272247314453125, "global_step": 296400, "epoch": 3571} {"train_loss": -24.585981369018555, "global_step": 296401, "epoch": 3571} {"train_loss": -24.778362274169922, "global_step": 296402, "epoch": 3571} {"train_loss": -25.349328994750977, "global_step": 296403, "epoch": 3571} {"train_loss": -25.15590476989746, "global_step": 296404, "epoch": 3571} {"train_loss": -25.000314712524414, "global_step": 296405, "epoch": 3571} {"train_loss": -25.165969848632812, "global_step": 296406, "epoch": 3571} {"train_loss": -25.27638053894043, "global_step": 296407, "epoch": 3571} {"train_loss": -25.261137008666992, "global_step": 296408, "epoch": 3571} {"train_loss": -25.1335506439209, "global_step": 296409, "epoch": 3571} {"train_loss": -25.346342086791992, "global_step": 296410, "epoch": 3571} {"train_loss": -25.40877342224121, "global_step": 296411, "epoch": 3571} {"train_loss": -25.34698486328125, "global_step": 296412, "epoch": 3571} {"train_loss": -25.394641876220703, "global_step": 296413, "epoch": 3571} {"train_loss": -25.2420711517334, "global_step": 296414, "epoch": 3571} {"train_loss": -25.39337921142578, "global_step": 296415, "epoch": 3571} {"train_loss": -25.342527389526367, "global_step": 296416, "epoch": 3571} {"train_loss": -25.609277725219727, "global_step": 296417, "epoch": 3571} {"train_loss": -25.613525390625, "global_step": 296418, "epoch": 3571} {"train_loss": -25.188703536987305, "global_step": 296419, "epoch": 3571} {"train_loss": -25.94687843322754, "global_step": 296420, "epoch": 3571} {"train_loss": -25.570173263549805, "global_step": 296421, "epoch": 3571} {"train_loss": -25.79682731628418, "global_step": 296422, "epoch": 3571} {"train_loss": -25.743179321289062, "global_step": 296423, "epoch": 3571} {"train_loss": -25.668415069580078, "global_step": 296424, "epoch": 3571} {"train_loss": -25.7248592376709, "global_step": 296425, "epoch": 3571} {"train_loss": -25.49657440185547, "global_step": 296426, "epoch": 3571} {"train_loss": -25.558664321899414, "global_step": 296427, "epoch": 3571} {"train_loss": -25.654104232788086, "global_step": 296428, "epoch": 3571} {"train_loss": -25.958072662353516, "global_step": 296429, "epoch": 3571} {"train_loss": -25.704740524291992, "global_step": 296430, "epoch": 3571} {"train_loss": -25.59453773498535, "global_step": 296431, "epoch": 3571} {"train_loss": -25.868087768554688, "global_step": 296432, "epoch": 3571} {"train_loss": -25.67352294921875, "global_step": 296433, "epoch": 3571} {"train_loss": -25.859455108642578, "global_step": 296434, "epoch": 3571} {"train_loss": -25.860687255859375, "global_step": 296435, "epoch": 3571} {"train_loss": -25.790136337280273, "global_step": 296436, "epoch": 3571} {"train_loss": -25.7088680267334, "global_step": 296437, "epoch": 3571} {"train_loss": -25.742151260375977, "global_step": 296438, "epoch": 3571} {"train_loss": -25.51978302001953, "global_step": 296439, "epoch": 3571} {"train_loss": -25.604822158813477, "global_step": 296440, "epoch": 3571} {"train_loss": -25.742685317993164, "global_step": 296441, "epoch": 3571} {"train_loss": -25.955347061157227, "global_step": 296442, "epoch": 3571} {"train_loss": -25.955469131469727, "global_step": 296443, "epoch": 3571} {"train_loss": -25.485326766967773, "global_step": 296444, "epoch": 3571} {"train_loss": -25.687610626220703, "global_step": 296445, "epoch": 3571} {"train_loss": -25.763595581054688, "global_step": 296446, "epoch": 3571} {"train_loss": -25.866683959960938, "global_step": 296447, "epoch": 3571} {"train_loss": -25.349945068359375, "global_step": 296448, "epoch": 3571} {"train_loss": -25.10538101196289, "global_step": 296449, "epoch": 3571} {"train_loss": -25.426589965820312, "global_step": 296450, "epoch": 3571} {"train_loss": -25.22882652282715, "global_step": 296451, "epoch": 3571} {"train_loss": -25.610870361328125, "global_step": 296452, "epoch": 3571} {"train_loss": -25.470727920532227, "global_step": 296453, "epoch": 3571} {"train_loss": -25.90546989440918, "global_step": 296454, "epoch": 3571} {"train_loss": -25.62945556640625, "global_step": 296455, "epoch": 3571} {"train_loss": -25.617361068725586, "global_step": 296456, "epoch": 3571} {"train_loss": -25.443679809570312, "global_step": 296457, "epoch": 3571} {"train_loss": -25.587160110473633, "global_step": 296458, "epoch": 3571} {"train_loss": -25.57573699951172, "global_step": 296459, "epoch": 3571} {"train_loss": -25.72468376159668, "global_step": 296460, "epoch": 3571} {"train_loss": -26.005157470703125, "global_step": 296461, "epoch": 3571} {"train_loss": -26.2537899017334, "global_step": 296462, "epoch": 3571} {"train_loss": -25.393260955810547, "global_step": 296463, "epoch": 3571} {"train_loss": -25.445480346679688, "global_step": 296464, "epoch": 3571} {"train_loss": -25.54623031616211, "global_step": 296465, "epoch": 3571} {"train_loss": -26.121368408203125, "global_step": 296466, "epoch": 3571} {"train_loss": -25.793073654174805, "global_step": 296467, "epoch": 3571} {"train_loss": -25.63886070251465, "global_step": 296468, "epoch": 3571} {"train_loss": -25.49332046508789, "global_step": 296469, "epoch": 3571} {"train_loss": -25.575170516967773, "global_step": 296470, "epoch": 3571} {"train_loss": -25.240262985229492, "global_step": 296471, "epoch": 3571} {"train_loss": -25.443429946899414, "global_step": 296472, "epoch": 3571} {"train_loss": -25.788639068603516, "global_step": 296473, "epoch": 3571} {"train_loss": -25.837369918823242, "global_step": 296474, "epoch": 3571} {"train_loss": -25.47514596042863, "global_step": 296475, "epoch": 3571, "val_loss": 7176334.0} {"train_loss": -24.886564254760742, "global_step": 296476, "epoch": 3572} {"train_loss": -24.70232582092285, "global_step": 296477, "epoch": 3572} {"train_loss": -24.98384666442871, "global_step": 296478, "epoch": 3572} {"train_loss": -25.334142684936523, "global_step": 296479, "epoch": 3572} {"train_loss": -25.446733474731445, "global_step": 296480, "epoch": 3572} {"train_loss": -25.272192001342773, "global_step": 296481, "epoch": 3572} {"train_loss": -25.11655616760254, "global_step": 296482, "epoch": 3572} {"train_loss": -25.504825592041016, "global_step": 296483, "epoch": 3572} {"train_loss": -25.115070343017578, "global_step": 296484, "epoch": 3572} {"train_loss": -25.227203369140625, "global_step": 296485, "epoch": 3572} {"train_loss": -25.15376853942871, "global_step": 296486, "epoch": 3572} {"train_loss": -25.728612899780273, "global_step": 296487, "epoch": 3572} {"train_loss": -25.58548927307129, "global_step": 296488, "epoch": 3572} {"train_loss": -25.477079391479492, "global_step": 296489, "epoch": 3572} {"train_loss": -25.759521484375, "global_step": 296490, "epoch": 3572} {"train_loss": -25.572372436523438, "global_step": 296491, "epoch": 3572} {"train_loss": -25.618406295776367, "global_step": 296492, "epoch": 3572} {"train_loss": -25.592317581176758, "global_step": 296493, "epoch": 3572} {"train_loss": -25.68995475769043, "global_step": 296494, "epoch": 3572} {"train_loss": -25.615934371948242, "global_step": 296495, "epoch": 3572} {"train_loss": -25.609594345092773, "global_step": 296496, "epoch": 3572} {"train_loss": -25.470001220703125, "global_step": 296497, "epoch": 3572} {"train_loss": -25.49359703063965, "global_step": 296498, "epoch": 3572} {"train_loss": -25.565431594848633, "global_step": 296499, "epoch": 3572} {"train_loss": -25.42701530456543, "global_step": 296500, "epoch": 3572} {"train_loss": -25.247241973876953, "global_step": 296501, "epoch": 3572} {"train_loss": -25.658777236938477, "global_step": 296502, "epoch": 3572} {"train_loss": -25.71152114868164, "global_step": 296503, "epoch": 3572} {"train_loss": -25.58039665222168, "global_step": 296504, "epoch": 3572} {"train_loss": -25.788660049438477, "global_step": 296505, "epoch": 3572} {"train_loss": -25.482208251953125, "global_step": 296506, "epoch": 3572} {"train_loss": -25.335641860961914, "global_step": 296507, "epoch": 3572} {"train_loss": -25.406335830688477, "global_step": 296508, "epoch": 3572} {"train_loss": -25.584274291992188, "global_step": 296509, "epoch": 3572} {"train_loss": -25.801685333251953, "global_step": 296510, "epoch": 3572} {"train_loss": -25.618240356445312, "global_step": 296511, "epoch": 3572} {"train_loss": -25.856115341186523, "global_step": 296512, "epoch": 3572} {"train_loss": -25.649396896362305, "global_step": 296513, "epoch": 3572} {"train_loss": -25.770782470703125, "global_step": 296514, "epoch": 3572} {"train_loss": -25.419286727905273, "global_step": 296515, "epoch": 3572} {"train_loss": -25.742258071899414, "global_step": 296516, "epoch": 3572} {"train_loss": -25.58104705810547, "global_step": 296517, "epoch": 3572} {"train_loss": -26.13840675354004, "global_step": 296518, "epoch": 3572} {"train_loss": -25.888208389282227, "global_step": 296519, "epoch": 3572} {"train_loss": -25.775671005249023, "global_step": 296520, "epoch": 3572} {"train_loss": -25.53970718383789, "global_step": 296521, "epoch": 3572} {"train_loss": -25.41552734375, "global_step": 296522, "epoch": 3572} {"train_loss": -26.073333740234375, "global_step": 296523, "epoch": 3572} {"train_loss": -25.494314193725586, "global_step": 296524, "epoch": 3572} {"train_loss": -25.391141891479492, "global_step": 296525, "epoch": 3572} {"train_loss": -25.676376342773438, "global_step": 296526, "epoch": 3572} {"train_loss": -25.8122501373291, "global_step": 296527, "epoch": 3572} {"train_loss": -25.718231201171875, "global_step": 296528, "epoch": 3572} {"train_loss": -25.395965576171875, "global_step": 296529, "epoch": 3572} {"train_loss": -25.57913589477539, "global_step": 296530, "epoch": 3572} {"train_loss": -25.789154052734375, "global_step": 296531, "epoch": 3572} {"train_loss": -25.58234977722168, "global_step": 296532, "epoch": 3572} {"train_loss": -25.651639938354492, "global_step": 296533, "epoch": 3572} {"train_loss": -25.54610252380371, "global_step": 296534, "epoch": 3572} {"train_loss": -25.714130401611328, "global_step": 296535, "epoch": 3572} {"train_loss": -25.212512969970703, "global_step": 296536, "epoch": 3572} {"train_loss": -25.148351669311523, "global_step": 296537, "epoch": 3572} {"train_loss": -25.037336349487305, "global_step": 296538, "epoch": 3572} {"train_loss": -24.70384407043457, "global_step": 296539, "epoch": 3572} {"train_loss": -24.933780670166016, "global_step": 296540, "epoch": 3572} {"train_loss": -25.585283279418945, "global_step": 296541, "epoch": 3572} {"train_loss": -25.32887077331543, "global_step": 296542, "epoch": 3572} {"train_loss": -24.923246383666992, "global_step": 296543, "epoch": 3572} {"train_loss": -25.377300262451172, "global_step": 296544, "epoch": 3572} {"train_loss": -25.420578002929688, "global_step": 296545, "epoch": 3572} {"train_loss": -25.223936080932617, "global_step": 296546, "epoch": 3572} {"train_loss": -25.013593673706055, "global_step": 296547, "epoch": 3572} {"train_loss": -25.7105770111084, "global_step": 296548, "epoch": 3572} {"train_loss": -25.035737991333008, "global_step": 296549, "epoch": 3572} {"train_loss": -25.387155532836914, "global_step": 296550, "epoch": 3572} {"train_loss": -25.63813591003418, "global_step": 296551, "epoch": 3572} {"train_loss": -25.667800903320312, "global_step": 296552, "epoch": 3572} {"train_loss": -25.552717208862305, "global_step": 296553, "epoch": 3572} {"train_loss": -25.647541046142578, "global_step": 296554, "epoch": 3572} {"train_loss": -25.45477867126465, "global_step": 296555, "epoch": 3572} {"train_loss": -25.220197677612305, "global_step": 296556, "epoch": 3572} {"train_loss": -25.690032958984375, "global_step": 296557, "epoch": 3572} {"train_loss": -25.462709909462067, "global_step": 296558, "epoch": 3572, "val_loss": 7252288.0} {"train_loss": -25.155515670776367, "global_step": 296559, "epoch": 3573} {"train_loss": -25.1124324798584, "global_step": 296560, "epoch": 3573} {"train_loss": -24.989347457885742, "global_step": 296561, "epoch": 3573} {"train_loss": -25.49594497680664, "global_step": 296562, "epoch": 3573} {"train_loss": -24.83644676208496, "global_step": 296563, "epoch": 3573} {"train_loss": -25.26826286315918, "global_step": 296564, "epoch": 3573} {"train_loss": -25.61346435546875, "global_step": 296565, "epoch": 3573} {"train_loss": -25.033248901367188, "global_step": 296566, "epoch": 3573} {"train_loss": -25.311786651611328, "global_step": 296567, "epoch": 3573} {"train_loss": -25.244916915893555, "global_step": 296568, "epoch": 3573} {"train_loss": -25.292774200439453, "global_step": 296569, "epoch": 3573} {"train_loss": -25.12358856201172, "global_step": 296570, "epoch": 3573} {"train_loss": -25.26302146911621, "global_step": 296571, "epoch": 3573} {"train_loss": -25.30479621887207, "global_step": 296572, "epoch": 3573} {"train_loss": -25.34584617614746, "global_step": 296573, "epoch": 3573} {"train_loss": -25.44928550720215, "global_step": 296574, "epoch": 3573} {"train_loss": -25.32756233215332, "global_step": 296575, "epoch": 3573} {"train_loss": -25.3828067779541, "global_step": 296576, "epoch": 3573} {"train_loss": -25.714431762695312, "global_step": 296577, "epoch": 3573} {"train_loss": -25.7451114654541, "global_step": 296578, "epoch": 3573} {"train_loss": -25.660612106323242, "global_step": 296579, "epoch": 3573} {"train_loss": -25.633392333984375, "global_step": 296580, "epoch": 3573} {"train_loss": -25.7431697845459, "global_step": 296581, "epoch": 3573} {"train_loss": -25.45247459411621, "global_step": 296582, "epoch": 3573} {"train_loss": -25.59900665283203, "global_step": 296583, "epoch": 3573} {"train_loss": -25.618844985961914, "global_step": 296584, "epoch": 3573} {"train_loss": -25.53192710876465, "global_step": 296585, "epoch": 3573} {"train_loss": -25.71426773071289, "global_step": 296586, "epoch": 3573} {"train_loss": -25.521812438964844, "global_step": 296587, "epoch": 3573} {"train_loss": -25.59772300720215, "global_step": 296588, "epoch": 3573} {"train_loss": -25.850677490234375, "global_step": 296589, "epoch": 3573} {"train_loss": -25.72151756286621, "global_step": 296590, "epoch": 3573} {"train_loss": -25.543643951416016, "global_step": 296591, "epoch": 3573} {"train_loss": -25.67426872253418, "global_step": 296592, "epoch": 3573} {"train_loss": -25.491836547851562, "global_step": 296593, "epoch": 3573} {"train_loss": -25.437929153442383, "global_step": 296594, "epoch": 3573} {"train_loss": -25.76908302307129, "global_step": 296595, "epoch": 3573} {"train_loss": -25.831525802612305, "global_step": 296596, "epoch": 3573} {"train_loss": -25.882781982421875, "global_step": 296597, "epoch": 3573} {"train_loss": -25.534290313720703, "global_step": 296598, "epoch": 3573} {"train_loss": -25.506635665893555, "global_step": 296599, "epoch": 3573} {"train_loss": -25.741445541381836, "global_step": 296600, "epoch": 3573} {"train_loss": -25.473684310913086, "global_step": 296601, "epoch": 3573} {"train_loss": -25.73927116394043, "global_step": 296602, "epoch": 3573} {"train_loss": -25.980066299438477, "global_step": 296603, "epoch": 3573} {"train_loss": -25.72367286682129, "global_step": 296604, "epoch": 3573} {"train_loss": -25.70770835876465, "global_step": 296605, "epoch": 3573} {"train_loss": -25.469635009765625, "global_step": 296606, "epoch": 3573} {"train_loss": -25.6732120513916, "global_step": 296607, "epoch": 3573} {"train_loss": -25.67213249206543, "global_step": 296608, "epoch": 3573} {"train_loss": -26.036712646484375, "global_step": 296609, "epoch": 3573} {"train_loss": -25.71502113342285, "global_step": 296610, "epoch": 3573} {"train_loss": -25.72308349609375, "global_step": 296611, "epoch": 3573} {"train_loss": -25.425281524658203, "global_step": 296612, "epoch": 3573} {"train_loss": -25.678085327148438, "global_step": 296613, "epoch": 3573} {"train_loss": -25.632843017578125, "global_step": 296614, "epoch": 3573} {"train_loss": -25.670618057250977, "global_step": 296615, "epoch": 3573} {"train_loss": -25.8675537109375, "global_step": 296616, "epoch": 3573} {"train_loss": -26.1524658203125, "global_step": 296617, "epoch": 3573} {"train_loss": -25.814441680908203, "global_step": 296618, "epoch": 3573} {"train_loss": -25.843297958374023, "global_step": 296619, "epoch": 3573} {"train_loss": -25.712915420532227, "global_step": 296620, "epoch": 3573} {"train_loss": -25.457969665527344, "global_step": 296621, "epoch": 3573} {"train_loss": -25.7878475189209, "global_step": 296622, "epoch": 3573} {"train_loss": -25.969778060913086, "global_step": 296623, "epoch": 3573} {"train_loss": -25.888916015625, "global_step": 296624, "epoch": 3573} {"train_loss": -25.789770126342773, "global_step": 296625, "epoch": 3573} {"train_loss": -25.773681640625, "global_step": 296626, "epoch": 3573} {"train_loss": -25.36811065673828, "global_step": 296627, "epoch": 3573} {"train_loss": -25.598913192749023, "global_step": 296628, "epoch": 3573} {"train_loss": -25.55814552307129, "global_step": 296629, "epoch": 3573} {"train_loss": -25.401611328125, "global_step": 296630, "epoch": 3573} {"train_loss": -25.704259872436523, "global_step": 296631, "epoch": 3573} {"train_loss": -25.67598533630371, "global_step": 296632, "epoch": 3573} {"train_loss": -25.942005157470703, "global_step": 296633, "epoch": 3573} {"train_loss": -25.445384979248047, "global_step": 296634, "epoch": 3573} {"train_loss": -25.887914657592773, "global_step": 296635, "epoch": 3573} {"train_loss": -25.356481552124023, "global_step": 296636, "epoch": 3573} {"train_loss": -25.283910751342773, "global_step": 296637, "epoch": 3573} {"train_loss": -24.87623405456543, "global_step": 296638, "epoch": 3573} {"train_loss": -24.86607551574707, "global_step": 296639, "epoch": 3573} {"train_loss": -25.717803955078125, "global_step": 296640, "epoch": 3573} {"train_loss": -25.567961221717926, "global_step": 296641, "epoch": 3573, "val_loss": 7254762.0} {"train_loss": -25.126543045043945, "global_step": 296642, "epoch": 3574} {"train_loss": -24.264829635620117, "global_step": 296643, "epoch": 3574} {"train_loss": -24.40911293029785, "global_step": 296644, "epoch": 3574} {"train_loss": -24.48870086669922, "global_step": 296645, "epoch": 3574} {"train_loss": -24.663206100463867, "global_step": 296646, "epoch": 3574} {"train_loss": -24.1624813079834, "global_step": 296647, "epoch": 3574} {"train_loss": -24.105854034423828, "global_step": 296648, "epoch": 3574} {"train_loss": -24.666194915771484, "global_step": 296649, "epoch": 3574} {"train_loss": -24.008865356445312, "global_step": 296650, "epoch": 3574} {"train_loss": -24.83431625366211, "global_step": 296651, "epoch": 3574} {"train_loss": -24.624677658081055, "global_step": 296652, "epoch": 3574} {"train_loss": -24.547456741333008, "global_step": 296653, "epoch": 3574} {"train_loss": -25.393917083740234, "global_step": 296654, "epoch": 3574} {"train_loss": -24.84259605407715, "global_step": 296655, "epoch": 3574} {"train_loss": -24.7496395111084, "global_step": 296656, "epoch": 3574} {"train_loss": -24.547733306884766, "global_step": 296657, "epoch": 3574} {"train_loss": -24.791259765625, "global_step": 296658, "epoch": 3574} {"train_loss": -25.036230087280273, "global_step": 296659, "epoch": 3574} {"train_loss": -24.88627052307129, "global_step": 296660, "epoch": 3574} {"train_loss": -24.921356201171875, "global_step": 296661, "epoch": 3574} {"train_loss": -24.878822326660156, "global_step": 296662, "epoch": 3574} {"train_loss": -25.296361923217773, "global_step": 296663, "epoch": 3574} {"train_loss": -25.067218780517578, "global_step": 296664, "epoch": 3574} {"train_loss": -25.37354850769043, "global_step": 296665, "epoch": 3574} {"train_loss": -25.034847259521484, "global_step": 296666, "epoch": 3574} {"train_loss": -24.943796157836914, "global_step": 296667, "epoch": 3574} {"train_loss": -24.99527359008789, "global_step": 296668, "epoch": 3574} {"train_loss": -25.289838790893555, "global_step": 296669, "epoch": 3574} {"train_loss": -24.826475143432617, "global_step": 296670, "epoch": 3574} {"train_loss": -25.06251335144043, "global_step": 296671, "epoch": 3574} {"train_loss": -25.5093936920166, "global_step": 296672, "epoch": 3574} {"train_loss": -25.36202049255371, "global_step": 296673, "epoch": 3574} {"train_loss": -25.060932159423828, "global_step": 296674, "epoch": 3574} {"train_loss": -25.421987533569336, "global_step": 296675, "epoch": 3574} {"train_loss": -25.489477157592773, "global_step": 296676, "epoch": 3574} {"train_loss": -25.395889282226562, "global_step": 296677, "epoch": 3574} {"train_loss": -25.5645694732666, "global_step": 296678, "epoch": 3574} {"train_loss": -25.32820701599121, "global_step": 296679, "epoch": 3574} {"train_loss": -25.40430450439453, "global_step": 296680, "epoch": 3574} {"train_loss": -25.76348876953125, "global_step": 296681, "epoch": 3574} {"train_loss": -25.358158111572266, "global_step": 296682, "epoch": 3574} {"train_loss": -25.53156089782715, "global_step": 296683, "epoch": 3574} {"train_loss": -25.34418487548828, "global_step": 296684, "epoch": 3574} {"train_loss": -26.211013793945312, "global_step": 296685, "epoch": 3574} {"train_loss": -25.607257843017578, "global_step": 296686, "epoch": 3574} {"train_loss": -25.687124252319336, "global_step": 296687, "epoch": 3574} {"train_loss": -25.749876022338867, "global_step": 296688, "epoch": 3574} {"train_loss": -25.93202018737793, "global_step": 296689, "epoch": 3574} {"train_loss": -25.601974487304688, "global_step": 296690, "epoch": 3574} {"train_loss": -25.69515037536621, "global_step": 296691, "epoch": 3574} {"train_loss": -25.59661293029785, "global_step": 296692, "epoch": 3574} {"train_loss": -25.882822036743164, "global_step": 296693, "epoch": 3574} {"train_loss": -25.4061336517334, "global_step": 296694, "epoch": 3574} {"train_loss": -25.9921817779541, "global_step": 296695, "epoch": 3574} {"train_loss": -25.648412704467773, "global_step": 296696, "epoch": 3574} {"train_loss": -26.00068473815918, "global_step": 296697, "epoch": 3574} {"train_loss": -25.724180221557617, "global_step": 296698, "epoch": 3574} {"train_loss": -25.746015548706055, "global_step": 296699, "epoch": 3574} {"train_loss": -25.732954025268555, "global_step": 296700, "epoch": 3574} {"train_loss": -25.53165626525879, "global_step": 296701, "epoch": 3574} {"train_loss": -25.768665313720703, "global_step": 296702, "epoch": 3574} {"train_loss": -25.298948287963867, "global_step": 296703, "epoch": 3574} {"train_loss": -24.922658920288086, "global_step": 296704, "epoch": 3574} {"train_loss": -24.240455627441406, "global_step": 296705, "epoch": 3574} {"train_loss": -24.14857292175293, "global_step": 296706, "epoch": 3574} {"train_loss": -24.935136795043945, "global_step": 296707, "epoch": 3574} {"train_loss": -25.53779411315918, "global_step": 296708, "epoch": 3574} {"train_loss": -25.200841903686523, "global_step": 296709, "epoch": 3574} {"train_loss": -25.235734939575195, "global_step": 296710, "epoch": 3574} {"train_loss": -25.000585556030273, "global_step": 296711, "epoch": 3574} {"train_loss": -25.531164169311523, "global_step": 296712, "epoch": 3574} {"train_loss": -25.134014129638672, "global_step": 296713, "epoch": 3574} {"train_loss": -25.368093490600586, "global_step": 296714, "epoch": 3574} {"train_loss": -25.344253540039062, "global_step": 296715, "epoch": 3574} {"train_loss": -25.269880294799805, "global_step": 296716, "epoch": 3574} {"train_loss": -25.464136123657227, "global_step": 296717, "epoch": 3574} {"train_loss": -25.0933895111084, "global_step": 296718, "epoch": 3574} {"train_loss": -25.12384605407715, "global_step": 296719, "epoch": 3574} {"train_loss": -24.993091583251953, "global_step": 296720, "epoch": 3574} {"train_loss": -25.277524948120117, "global_step": 296721, "epoch": 3574} {"train_loss": -25.436376571655273, "global_step": 296722, "epoch": 3574} {"train_loss": -25.78350257873535, "global_step": 296723, "epoch": 3574} {"train_loss": -25.19751268409821, "global_step": 296724, "epoch": 3574, "val_loss": 7112960.0} {"train_loss": -22.604171752929688, "global_step": 296725, "epoch": 3575} {"train_loss": -24.958677291870117, "global_step": 296726, "epoch": 3575} {"train_loss": -23.414243698120117, "global_step": 296727, "epoch": 3575} {"train_loss": -23.760562896728516, "global_step": 296728, "epoch": 3575} {"train_loss": -24.408811569213867, "global_step": 296729, "epoch": 3575} {"train_loss": -24.266036987304688, "global_step": 296730, "epoch": 3575} {"train_loss": -24.569007873535156, "global_step": 296731, "epoch": 3575} {"train_loss": -25.02146339416504, "global_step": 296732, "epoch": 3575} {"train_loss": -24.738924026489258, "global_step": 296733, "epoch": 3575} {"train_loss": -24.772602081298828, "global_step": 296734, "epoch": 3575} {"train_loss": -24.711267471313477, "global_step": 296735, "epoch": 3575} {"train_loss": -24.764554977416992, "global_step": 296736, "epoch": 3575} {"train_loss": -24.642160415649414, "global_step": 296737, "epoch": 3575} {"train_loss": -24.96379280090332, "global_step": 296738, "epoch": 3575} {"train_loss": -24.61513328552246, "global_step": 296739, "epoch": 3575} {"train_loss": -25.171403884887695, "global_step": 296740, "epoch": 3575} {"train_loss": -24.63445281982422, "global_step": 296741, "epoch": 3575} {"train_loss": -24.88822364807129, "global_step": 296742, "epoch": 3575} {"train_loss": -25.2507381439209, "global_step": 296743, "epoch": 3575} {"train_loss": -24.95751953125, "global_step": 296744, "epoch": 3575} {"train_loss": -24.971830368041992, "global_step": 296745, "epoch": 3575} {"train_loss": -25.124942779541016, "global_step": 296746, "epoch": 3575} {"train_loss": -25.439661026000977, "global_step": 296747, "epoch": 3575} {"train_loss": -25.234342575073242, "global_step": 296748, "epoch": 3575} {"train_loss": -25.585905075073242, "global_step": 296749, "epoch": 3575} {"train_loss": -25.357275009155273, "global_step": 296750, "epoch": 3575} {"train_loss": -25.245742797851562, "global_step": 296751, "epoch": 3575} {"train_loss": -25.586990356445312, "global_step": 296752, "epoch": 3575} {"train_loss": -25.467077255249023, "global_step": 296753, "epoch": 3575} {"train_loss": -25.540393829345703, "global_step": 296754, "epoch": 3575} {"train_loss": -25.61686134338379, "global_step": 296755, "epoch": 3575} {"train_loss": -25.4375, "global_step": 296756, "epoch": 3575} {"train_loss": -25.5269832611084, "global_step": 296757, "epoch": 3575} {"train_loss": -25.646240234375, "global_step": 296758, "epoch": 3575} {"train_loss": -25.636503219604492, "global_step": 296759, "epoch": 3575} {"train_loss": -25.84620475769043, "global_step": 296760, "epoch": 3575} {"train_loss": -25.40486717224121, "global_step": 296761, "epoch": 3575} {"train_loss": -25.84205436706543, "global_step": 296762, "epoch": 3575} {"train_loss": -25.717126846313477, "global_step": 296763, "epoch": 3575} {"train_loss": -25.221210479736328, "global_step": 296764, "epoch": 3575} {"train_loss": -25.884016036987305, "global_step": 296765, "epoch": 3575} {"train_loss": -25.6568603515625, "global_step": 296766, "epoch": 3575} {"train_loss": -25.552541732788086, "global_step": 296767, "epoch": 3575} {"train_loss": -25.34010887145996, "global_step": 296768, "epoch": 3575} {"train_loss": -25.835744857788086, "global_step": 296769, "epoch": 3575} {"train_loss": -25.85352897644043, "global_step": 296770, "epoch": 3575} {"train_loss": -25.939865112304688, "global_step": 296771, "epoch": 3575} {"train_loss": -25.474166870117188, "global_step": 296772, "epoch": 3575} {"train_loss": -25.370498657226562, "global_step": 296773, "epoch": 3575} {"train_loss": -25.333486557006836, "global_step": 296774, "epoch": 3575} {"train_loss": -25.740148544311523, "global_step": 296775, "epoch": 3575} {"train_loss": -25.735177993774414, "global_step": 296776, "epoch": 3575} {"train_loss": -25.80645179748535, "global_step": 296777, "epoch": 3575} {"train_loss": -25.625686645507812, "global_step": 296778, "epoch": 3575} {"train_loss": -25.619022369384766, "global_step": 296779, "epoch": 3575} {"train_loss": -25.678970336914062, "global_step": 296780, "epoch": 3575} {"train_loss": -26.03840446472168, "global_step": 296781, "epoch": 3575} {"train_loss": -25.51686668395996, "global_step": 296782, "epoch": 3575} {"train_loss": -25.47979164123535, "global_step": 296783, "epoch": 3575} {"train_loss": -25.887664794921875, "global_step": 296784, "epoch": 3575} {"train_loss": -25.583349227905273, "global_step": 296785, "epoch": 3575} {"train_loss": -25.294832229614258, "global_step": 296786, "epoch": 3575} {"train_loss": -25.335712432861328, "global_step": 296787, "epoch": 3575} {"train_loss": -25.53645133972168, "global_step": 296788, "epoch": 3575} {"train_loss": -25.43280029296875, "global_step": 296789, "epoch": 3575} {"train_loss": -25.442020416259766, "global_step": 296790, "epoch": 3575} {"train_loss": -25.66425895690918, "global_step": 296791, "epoch": 3575} {"train_loss": -25.478836059570312, "global_step": 296792, "epoch": 3575} {"train_loss": -25.577619552612305, "global_step": 296793, "epoch": 3575} {"train_loss": -26.040754318237305, "global_step": 296794, "epoch": 3575} {"train_loss": -25.31339454650879, "global_step": 296795, "epoch": 3575} {"train_loss": -25.59102439880371, "global_step": 296796, "epoch": 3575} {"train_loss": -25.91110610961914, "global_step": 296797, "epoch": 3575} {"train_loss": -25.200429916381836, "global_step": 296798, "epoch": 3575} {"train_loss": -25.620559692382812, "global_step": 296799, "epoch": 3575} {"train_loss": -25.2767276763916, "global_step": 296800, "epoch": 3575} {"train_loss": -25.60626792907715, "global_step": 296801, "epoch": 3575} {"train_loss": -25.52015495300293, "global_step": 296802, "epoch": 3575} {"train_loss": -25.396581649780273, "global_step": 296803, "epoch": 3575} {"train_loss": -25.49012565612793, "global_step": 296804, "epoch": 3575} {"train_loss": -25.738880157470703, "global_step": 296805, "epoch": 3575} {"train_loss": -25.234088897705078, "global_step": 296806, "epoch": 3575} {"train_loss": -25.32777282990605, "global_step": 296807, "epoch": 3575, "val_loss": 7150889.0} {"train_loss": -25.719884872436523, "global_step": 296808, "epoch": 3576} {"train_loss": -25.358226776123047, "global_step": 296809, "epoch": 3576} {"train_loss": -25.117399215698242, "global_step": 296810, "epoch": 3576} {"train_loss": -25.344816207885742, "global_step": 296811, "epoch": 3576} {"train_loss": -25.372175216674805, "global_step": 296812, "epoch": 3576} {"train_loss": -25.727664947509766, "global_step": 296813, "epoch": 3576} {"train_loss": -25.28336524963379, "global_step": 296814, "epoch": 3576} {"train_loss": -25.037796020507812, "global_step": 296815, "epoch": 3576} {"train_loss": -25.735960006713867, "global_step": 296816, "epoch": 3576} {"train_loss": -25.435405731201172, "global_step": 296817, "epoch": 3576} {"train_loss": -25.2216739654541, "global_step": 296818, "epoch": 3576} {"train_loss": -25.408523559570312, "global_step": 296819, "epoch": 3576} {"train_loss": -25.549964904785156, "global_step": 296820, "epoch": 3576} {"train_loss": -25.676660537719727, "global_step": 296821, "epoch": 3576} {"train_loss": -25.47020149230957, "global_step": 296822, "epoch": 3576} {"train_loss": -25.544464111328125, "global_step": 296823, "epoch": 3576} {"train_loss": -25.679590225219727, "global_step": 296824, "epoch": 3576} {"train_loss": -25.84433364868164, "global_step": 296825, "epoch": 3576} {"train_loss": -25.291662216186523, "global_step": 296826, "epoch": 3576} {"train_loss": -25.541580200195312, "global_step": 296827, "epoch": 3576} {"train_loss": -25.51241111755371, "global_step": 296828, "epoch": 3576} {"train_loss": -25.193939208984375, "global_step": 296829, "epoch": 3576} {"train_loss": -25.52998161315918, "global_step": 296830, "epoch": 3576} {"train_loss": -25.51960563659668, "global_step": 296831, "epoch": 3576} {"train_loss": -25.666791915893555, "global_step": 296832, "epoch": 3576} {"train_loss": -25.272626876831055, "global_step": 296833, "epoch": 3576} {"train_loss": -25.482641220092773, "global_step": 296834, "epoch": 3576} {"train_loss": -25.36418342590332, "global_step": 296835, "epoch": 3576} {"train_loss": -25.444082260131836, "global_step": 296836, "epoch": 3576} {"train_loss": -25.360218048095703, "global_step": 296837, "epoch": 3576} {"train_loss": -25.681930541992188, "global_step": 296838, "epoch": 3576} {"train_loss": -25.83241081237793, "global_step": 296839, "epoch": 3576} {"train_loss": -25.84796714782715, "global_step": 296840, "epoch": 3576} {"train_loss": -25.531721115112305, "global_step": 296841, "epoch": 3576} {"train_loss": -25.513914108276367, "global_step": 296842, "epoch": 3576} {"train_loss": -25.44791603088379, "global_step": 296843, "epoch": 3576} {"train_loss": -25.442670822143555, "global_step": 296844, "epoch": 3576} {"train_loss": -25.693923950195312, "global_step": 296845, "epoch": 3576} {"train_loss": -25.917627334594727, "global_step": 296846, "epoch": 3576} {"train_loss": -25.47414207458496, "global_step": 296847, "epoch": 3576} {"train_loss": -25.515302658081055, "global_step": 296848, "epoch": 3576} {"train_loss": -25.522018432617188, "global_step": 296849, "epoch": 3576} {"train_loss": -25.411977767944336, "global_step": 296850, "epoch": 3576} {"train_loss": -25.357574462890625, "global_step": 296851, "epoch": 3576} {"train_loss": -25.630868911743164, "global_step": 296852, "epoch": 3576} {"train_loss": -25.699899673461914, "global_step": 296853, "epoch": 3576} {"train_loss": -25.777862548828125, "global_step": 296854, "epoch": 3576} {"train_loss": -25.717838287353516, "global_step": 296855, "epoch": 3576} {"train_loss": -25.779006958007812, "global_step": 296856, "epoch": 3576} {"train_loss": -25.83515739440918, "global_step": 296857, "epoch": 3576} {"train_loss": -25.713871002197266, "global_step": 296858, "epoch": 3576} {"train_loss": -25.96451759338379, "global_step": 296859, "epoch": 3576} {"train_loss": -25.808115005493164, "global_step": 296860, "epoch": 3576} {"train_loss": -25.654687881469727, "global_step": 296861, "epoch": 3576} {"train_loss": -25.75846290588379, "global_step": 296862, "epoch": 3576} {"train_loss": -25.975690841674805, "global_step": 296863, "epoch": 3576} {"train_loss": -25.641586303710938, "global_step": 296864, "epoch": 3576} {"train_loss": -25.6530818939209, "global_step": 296865, "epoch": 3576} {"train_loss": -25.588546752929688, "global_step": 296866, "epoch": 3576} {"train_loss": -25.982757568359375, "global_step": 296867, "epoch": 3576} {"train_loss": -25.69101905822754, "global_step": 296868, "epoch": 3576} {"train_loss": -25.427854537963867, "global_step": 296869, "epoch": 3576} {"train_loss": -25.479169845581055, "global_step": 296870, "epoch": 3576} {"train_loss": -25.711957931518555, "global_step": 296871, "epoch": 3576} {"train_loss": -25.493494033813477, "global_step": 296872, "epoch": 3576} {"train_loss": -25.721410751342773, "global_step": 296873, "epoch": 3576} {"train_loss": -25.50762939453125, "global_step": 296874, "epoch": 3576} {"train_loss": -25.585905075073242, "global_step": 296875, "epoch": 3576} {"train_loss": -25.13059425354004, "global_step": 296876, "epoch": 3576} {"train_loss": -25.36687660217285, "global_step": 296877, "epoch": 3576} {"train_loss": -25.08399772644043, "global_step": 296878, "epoch": 3576} {"train_loss": -25.493711471557617, "global_step": 296879, "epoch": 3576} {"train_loss": -25.70770263671875, "global_step": 296880, "epoch": 3576} {"train_loss": -25.491863250732422, "global_step": 296881, "epoch": 3576} {"train_loss": -25.342008590698242, "global_step": 296882, "epoch": 3576} {"train_loss": -25.32138442993164, "global_step": 296883, "epoch": 3576} {"train_loss": -25.45624351501465, "global_step": 296884, "epoch": 3576} {"train_loss": -25.652307510375977, "global_step": 296885, "epoch": 3576} {"train_loss": -25.68239402770996, "global_step": 296886, "epoch": 3576} {"train_loss": -25.45844078063965, "global_step": 296887, "epoch": 3576} {"train_loss": -25.703052520751953, "global_step": 296888, "epoch": 3576} {"train_loss": -25.334026336669922, "global_step": 296889, "epoch": 3576} {"train_loss": -25.561506685004176, "global_step": 296890, "epoch": 3576, "val_loss": 7219531.0} {"train_loss": -24.947484970092773, "global_step": 296891, "epoch": 3577} {"train_loss": -25.12669563293457, "global_step": 296892, "epoch": 3577} {"train_loss": -25.15049934387207, "global_step": 296893, "epoch": 3577} {"train_loss": -25.320606231689453, "global_step": 296894, "epoch": 3577} {"train_loss": -25.131549835205078, "global_step": 296895, "epoch": 3577} {"train_loss": -25.07388687133789, "global_step": 296896, "epoch": 3577} {"train_loss": -25.431049346923828, "global_step": 296897, "epoch": 3577} {"train_loss": -25.167577743530273, "global_step": 296898, "epoch": 3577} {"train_loss": -25.9033145904541, "global_step": 296899, "epoch": 3577} {"train_loss": -25.025808334350586, "global_step": 296900, "epoch": 3577} {"train_loss": -25.49339485168457, "global_step": 296901, "epoch": 3577} {"train_loss": -25.228784561157227, "global_step": 296902, "epoch": 3577} {"train_loss": -25.240802764892578, "global_step": 296903, "epoch": 3577} {"train_loss": -25.36162757873535, "global_step": 296904, "epoch": 3577} {"train_loss": -25.625995635986328, "global_step": 296905, "epoch": 3577} {"train_loss": -25.320676803588867, "global_step": 296906, "epoch": 3577} {"train_loss": -25.37116050720215, "global_step": 296907, "epoch": 3577} {"train_loss": -25.751630783081055, "global_step": 296908, "epoch": 3577} {"train_loss": -25.28700828552246, "global_step": 296909, "epoch": 3577} {"train_loss": -25.353805541992188, "global_step": 296910, "epoch": 3577} {"train_loss": -25.468257904052734, "global_step": 296911, "epoch": 3577} {"train_loss": -25.479780197143555, "global_step": 296912, "epoch": 3577} {"train_loss": -25.664587020874023, "global_step": 296913, "epoch": 3577} {"train_loss": -25.39832305908203, "global_step": 296914, "epoch": 3577} {"train_loss": -25.49273109436035, "global_step": 296915, "epoch": 3577} {"train_loss": -25.34925651550293, "global_step": 296916, "epoch": 3577} {"train_loss": -25.97673988342285, "global_step": 296917, "epoch": 3577} {"train_loss": -25.37939453125, "global_step": 296918, "epoch": 3577} {"train_loss": -25.70069694519043, "global_step": 296919, "epoch": 3577} {"train_loss": -25.583688735961914, "global_step": 296920, "epoch": 3577} {"train_loss": -25.808795928955078, "global_step": 296921, "epoch": 3577} {"train_loss": -25.60093116760254, "global_step": 296922, "epoch": 3577} {"train_loss": -25.864154815673828, "global_step": 296923, "epoch": 3577} {"train_loss": -25.467161178588867, "global_step": 296924, "epoch": 3577} {"train_loss": -25.733015060424805, "global_step": 296925, "epoch": 3577} {"train_loss": -25.532506942749023, "global_step": 296926, "epoch": 3577} {"train_loss": -25.501455307006836, "global_step": 296927, "epoch": 3577} {"train_loss": -25.79145622253418, "global_step": 296928, "epoch": 3577} {"train_loss": -26.11417579650879, "global_step": 296929, "epoch": 3577} {"train_loss": -25.80084228515625, "global_step": 296930, "epoch": 3577} {"train_loss": -25.395200729370117, "global_step": 296931, "epoch": 3577} {"train_loss": -26.118072509765625, "global_step": 296932, "epoch": 3577} {"train_loss": -25.441287994384766, "global_step": 296933, "epoch": 3577} {"train_loss": -25.417509078979492, "global_step": 296934, "epoch": 3577} {"train_loss": -25.150632858276367, "global_step": 296935, "epoch": 3577} {"train_loss": -24.62701416015625, "global_step": 296936, "epoch": 3577} {"train_loss": -24.31774139404297, "global_step": 296937, "epoch": 3577} {"train_loss": -24.552932739257812, "global_step": 296938, "epoch": 3577} {"train_loss": -25.729419708251953, "global_step": 296939, "epoch": 3577} {"train_loss": -25.14797019958496, "global_step": 296940, "epoch": 3577} {"train_loss": -25.113685607910156, "global_step": 296941, "epoch": 3577} {"train_loss": -25.6889705657959, "global_step": 296942, "epoch": 3577} {"train_loss": -24.66008949279785, "global_step": 296943, "epoch": 3577} {"train_loss": -25.407102584838867, "global_step": 296944, "epoch": 3577} {"train_loss": -25.390228271484375, "global_step": 296945, "epoch": 3577} {"train_loss": -24.7298583984375, "global_step": 296946, "epoch": 3577} {"train_loss": -25.089567184448242, "global_step": 296947, "epoch": 3577} {"train_loss": -24.899749755859375, "global_step": 296948, "epoch": 3577} {"train_loss": -25.512161254882812, "global_step": 296949, "epoch": 3577} {"train_loss": -24.90763282775879, "global_step": 296950, "epoch": 3577} {"train_loss": -25.594778060913086, "global_step": 296951, "epoch": 3577} {"train_loss": -25.51152801513672, "global_step": 296952, "epoch": 3577} {"train_loss": -25.062040328979492, "global_step": 296953, "epoch": 3577} {"train_loss": -25.442459106445312, "global_step": 296954, "epoch": 3577} {"train_loss": -25.217580795288086, "global_step": 296955, "epoch": 3577} {"train_loss": -25.398183822631836, "global_step": 296956, "epoch": 3577} {"train_loss": -25.60223388671875, "global_step": 296957, "epoch": 3577} {"train_loss": -25.173120498657227, "global_step": 296958, "epoch": 3577} {"train_loss": -25.205087661743164, "global_step": 296959, "epoch": 3577} {"train_loss": -25.111499786376953, "global_step": 296960, "epoch": 3577} {"train_loss": -25.634374618530273, "global_step": 296961, "epoch": 3577} {"train_loss": -25.42487907409668, "global_step": 296962, "epoch": 3577} {"train_loss": -25.46970558166504, "global_step": 296963, "epoch": 3577} {"train_loss": -25.638635635375977, "global_step": 296964, "epoch": 3577} {"train_loss": -25.371686935424805, "global_step": 296965, "epoch": 3577} {"train_loss": -25.51680564880371, "global_step": 296966, "epoch": 3577} {"train_loss": -25.491275787353516, "global_step": 296967, "epoch": 3577} {"train_loss": -25.475162506103516, "global_step": 296968, "epoch": 3577} {"train_loss": -25.671377182006836, "global_step": 296969, "epoch": 3577} {"train_loss": -25.492109298706055, "global_step": 296970, "epoch": 3577} {"train_loss": -25.461719512939453, "global_step": 296971, "epoch": 3577} {"train_loss": -25.64332389831543, "global_step": 296972, "epoch": 3577} {"train_loss": -25.39764748998435, "global_step": 296973, "epoch": 3577, "val_loss": 7161221.0} {"train_loss": -25.599462509155273, "global_step": 296974, "epoch": 3578} {"train_loss": -24.862133026123047, "global_step": 296975, "epoch": 3578} {"train_loss": -25.2302303314209, "global_step": 296976, "epoch": 3578} {"train_loss": -25.148935317993164, "global_step": 296977, "epoch": 3578} {"train_loss": -25.047067642211914, "global_step": 296978, "epoch": 3578} {"train_loss": -25.33407974243164, "global_step": 296979, "epoch": 3578} {"train_loss": -25.1505126953125, "global_step": 296980, "epoch": 3578} {"train_loss": -25.00157928466797, "global_step": 296981, "epoch": 3578} {"train_loss": -25.64930534362793, "global_step": 296982, "epoch": 3578} {"train_loss": -25.372167587280273, "global_step": 296983, "epoch": 3578} {"train_loss": -25.230112075805664, "global_step": 296984, "epoch": 3578} {"train_loss": -25.531835556030273, "global_step": 296985, "epoch": 3578} {"train_loss": -25.334657669067383, "global_step": 296986, "epoch": 3578} {"train_loss": -25.746051788330078, "global_step": 296987, "epoch": 3578} {"train_loss": -25.317920684814453, "global_step": 296988, "epoch": 3578} {"train_loss": -25.94099998474121, "global_step": 296989, "epoch": 3578} {"train_loss": -25.828786849975586, "global_step": 296990, "epoch": 3578} {"train_loss": -25.598995208740234, "global_step": 296991, "epoch": 3578} {"train_loss": -25.546415328979492, "global_step": 296992, "epoch": 3578} {"train_loss": -25.978464126586914, "global_step": 296993, "epoch": 3578} {"train_loss": -25.620874404907227, "global_step": 296994, "epoch": 3578} {"train_loss": -25.560705184936523, "global_step": 296995, "epoch": 3578} {"train_loss": -25.7581787109375, "global_step": 296996, "epoch": 3578} {"train_loss": -25.8778133392334, "global_step": 296997, "epoch": 3578} {"train_loss": -25.728961944580078, "global_step": 296998, "epoch": 3578} {"train_loss": -25.562633514404297, "global_step": 296999, "epoch": 3578} {"train_loss": -25.60227394104004, "global_step": 297000, "epoch": 3578} {"train_loss": -25.8480167388916, "global_step": 297001, "epoch": 3578} {"train_loss": -25.824054718017578, "global_step": 297002, "epoch": 3578} {"train_loss": -25.91102409362793, "global_step": 297003, "epoch": 3578} {"train_loss": -25.931859970092773, "global_step": 297004, "epoch": 3578} {"train_loss": -25.92176628112793, "global_step": 297005, "epoch": 3578} {"train_loss": -25.77227210998535, "global_step": 297006, "epoch": 3578} {"train_loss": -25.829736709594727, "global_step": 297007, "epoch": 3578} {"train_loss": -25.765644073486328, "global_step": 297008, "epoch": 3578} {"train_loss": -25.630468368530273, "global_step": 297009, "epoch": 3578} {"train_loss": -25.82108497619629, "global_step": 297010, "epoch": 3578} {"train_loss": -25.89998435974121, "global_step": 297011, "epoch": 3578} {"train_loss": -25.467350006103516, "global_step": 297012, "epoch": 3578} {"train_loss": -25.942737579345703, "global_step": 297013, "epoch": 3578} {"train_loss": -26.053516387939453, "global_step": 297014, "epoch": 3578} {"train_loss": -25.7364444732666, "global_step": 297015, "epoch": 3578} {"train_loss": -25.8634033203125, "global_step": 297016, "epoch": 3578} {"train_loss": -26.18556022644043, "global_step": 297017, "epoch": 3578} {"train_loss": -25.487415313720703, "global_step": 297018, "epoch": 3578} {"train_loss": -25.77841567993164, "global_step": 297019, "epoch": 3578} {"train_loss": -25.73426628112793, "global_step": 297020, "epoch": 3578} {"train_loss": -25.680509567260742, "global_step": 297021, "epoch": 3578} {"train_loss": -25.869199752807617, "global_step": 297022, "epoch": 3578} {"train_loss": -25.900297164916992, "global_step": 297023, "epoch": 3578} {"train_loss": -25.304325103759766, "global_step": 297024, "epoch": 3578} {"train_loss": -25.47028160095215, "global_step": 297025, "epoch": 3578} {"train_loss": -25.400558471679688, "global_step": 297026, "epoch": 3578} {"train_loss": -25.50758934020996, "global_step": 297027, "epoch": 3578} {"train_loss": -25.75971794128418, "global_step": 297028, "epoch": 3578} {"train_loss": -25.592002868652344, "global_step": 297029, "epoch": 3578} {"train_loss": -25.562746047973633, "global_step": 297030, "epoch": 3578} {"train_loss": -25.85053825378418, "global_step": 297031, "epoch": 3578} {"train_loss": -25.57390594482422, "global_step": 297032, "epoch": 3578} {"train_loss": -25.967390060424805, "global_step": 297033, "epoch": 3578} {"train_loss": -25.921009063720703, "global_step": 297034, "epoch": 3578} {"train_loss": -25.637714385986328, "global_step": 297035, "epoch": 3578} {"train_loss": -25.985708236694336, "global_step": 297036, "epoch": 3578} {"train_loss": -25.296918869018555, "global_step": 297037, "epoch": 3578} {"train_loss": -25.86370277404785, "global_step": 297038, "epoch": 3578} {"train_loss": -25.7347412109375, "global_step": 297039, "epoch": 3578} {"train_loss": -25.548856735229492, "global_step": 297040, "epoch": 3578} {"train_loss": -25.406436920166016, "global_step": 297041, "epoch": 3578} {"train_loss": -25.299497604370117, "global_step": 297042, "epoch": 3578} {"train_loss": -25.700021743774414, "global_step": 297043, "epoch": 3578} {"train_loss": -25.681476593017578, "global_step": 297044, "epoch": 3578} {"train_loss": -25.114877700805664, "global_step": 297045, "epoch": 3578} {"train_loss": -25.416406631469727, "global_step": 297046, "epoch": 3578} {"train_loss": -25.345317840576172, "global_step": 297047, "epoch": 3578} {"train_loss": -25.515356063842773, "global_step": 297048, "epoch": 3578} {"train_loss": -25.476760864257812, "global_step": 297049, "epoch": 3578} {"train_loss": -25.70088768005371, "global_step": 297050, "epoch": 3578} {"train_loss": -25.259000778198242, "global_step": 297051, "epoch": 3578} {"train_loss": -25.743356704711914, "global_step": 297052, "epoch": 3578} {"train_loss": -25.506223678588867, "global_step": 297053, "epoch": 3578} {"train_loss": -25.4815673828125, "global_step": 297054, "epoch": 3578} {"train_loss": -25.47772789001465, "global_step": 297055, "epoch": 3578} {"train_loss": -25.632586283856128, "global_step": 297056, "epoch": 3578, "val_loss": 7106203.0} {"train_loss": -25.261083602905273, "global_step": 297057, "epoch": 3579} {"train_loss": -25.08331871032715, "global_step": 297058, "epoch": 3579} {"train_loss": -25.228435516357422, "global_step": 297059, "epoch": 3579} {"train_loss": -25.210315704345703, "global_step": 297060, "epoch": 3579} {"train_loss": -25.5297908782959, "global_step": 297061, "epoch": 3579} {"train_loss": -25.337961196899414, "global_step": 297062, "epoch": 3579} {"train_loss": -25.03922462463379, "global_step": 297063, "epoch": 3579} {"train_loss": -24.901594161987305, "global_step": 297064, "epoch": 3579} {"train_loss": -25.60617446899414, "global_step": 297065, "epoch": 3579} {"train_loss": -25.464712142944336, "global_step": 297066, "epoch": 3579} {"train_loss": -25.540359497070312, "global_step": 297067, "epoch": 3579} {"train_loss": -25.157947540283203, "global_step": 297068, "epoch": 3579} {"train_loss": -25.638925552368164, "global_step": 297069, "epoch": 3579} {"train_loss": -25.7676944732666, "global_step": 297070, "epoch": 3579} {"train_loss": -25.856536865234375, "global_step": 297071, "epoch": 3579} {"train_loss": -25.643396377563477, "global_step": 297072, "epoch": 3579} {"train_loss": -25.4366455078125, "global_step": 297073, "epoch": 3579} {"train_loss": -25.391258239746094, "global_step": 297074, "epoch": 3579} {"train_loss": -25.495223999023438, "global_step": 297075, "epoch": 3579} {"train_loss": -25.94025993347168, "global_step": 297076, "epoch": 3579} {"train_loss": -25.313919067382812, "global_step": 297077, "epoch": 3579} {"train_loss": -25.370473861694336, "global_step": 297078, "epoch": 3579} {"train_loss": -25.210229873657227, "global_step": 297079, "epoch": 3579} {"train_loss": -25.465091705322266, "global_step": 297080, "epoch": 3579} {"train_loss": -25.48777198791504, "global_step": 297081, "epoch": 3579} {"train_loss": -25.439083099365234, "global_step": 297082, "epoch": 3579} {"train_loss": -25.553354263305664, "global_step": 297083, "epoch": 3579} {"train_loss": -25.485876083374023, "global_step": 297084, "epoch": 3579} {"train_loss": -25.416183471679688, "global_step": 297085, "epoch": 3579} {"train_loss": -25.20612144470215, "global_step": 297086, "epoch": 3579} {"train_loss": -25.46320152282715, "global_step": 297087, "epoch": 3579} {"train_loss": -25.523141860961914, "global_step": 297088, "epoch": 3579} {"train_loss": -25.84109878540039, "global_step": 297089, "epoch": 3579} {"train_loss": -26.001667022705078, "global_step": 297090, "epoch": 3579} {"train_loss": -25.421659469604492, "global_step": 297091, "epoch": 3579} {"train_loss": -25.368967056274414, "global_step": 297092, "epoch": 3579} {"train_loss": -25.295143127441406, "global_step": 297093, "epoch": 3579} {"train_loss": -25.672895431518555, "global_step": 297094, "epoch": 3579} {"train_loss": -25.59355926513672, "global_step": 297095, "epoch": 3579} {"train_loss": -25.42789649963379, "global_step": 297096, "epoch": 3579} {"train_loss": -25.475011825561523, "global_step": 297097, "epoch": 3579} {"train_loss": -25.585655212402344, "global_step": 297098, "epoch": 3579} {"train_loss": -25.293363571166992, "global_step": 297099, "epoch": 3579} {"train_loss": -25.899152755737305, "global_step": 297100, "epoch": 3579} {"train_loss": -25.373289108276367, "global_step": 297101, "epoch": 3579} {"train_loss": -25.3096923828125, "global_step": 297102, "epoch": 3579} {"train_loss": -25.473133087158203, "global_step": 297103, "epoch": 3579} {"train_loss": -25.166067123413086, "global_step": 297104, "epoch": 3579} {"train_loss": -25.402481079101562, "global_step": 297105, "epoch": 3579} {"train_loss": -25.593843460083008, "global_step": 297106, "epoch": 3579} {"train_loss": -25.52166175842285, "global_step": 297107, "epoch": 3579} {"train_loss": -24.92724609375, "global_step": 297108, "epoch": 3579} {"train_loss": -25.910364151000977, "global_step": 297109, "epoch": 3579} {"train_loss": -25.120159149169922, "global_step": 297110, "epoch": 3579} {"train_loss": -24.805471420288086, "global_step": 297111, "epoch": 3579} {"train_loss": -25.61127281188965, "global_step": 297112, "epoch": 3579} {"train_loss": -24.867773056030273, "global_step": 297113, "epoch": 3579} {"train_loss": -25.376811981201172, "global_step": 297114, "epoch": 3579} {"train_loss": -24.755664825439453, "global_step": 297115, "epoch": 3579} {"train_loss": -25.24073028564453, "global_step": 297116, "epoch": 3579} {"train_loss": -24.99774169921875, "global_step": 297117, "epoch": 3579} {"train_loss": -25.56800651550293, "global_step": 297118, "epoch": 3579} {"train_loss": -25.324148178100586, "global_step": 297119, "epoch": 3579} {"train_loss": -25.26594352722168, "global_step": 297120, "epoch": 3579} {"train_loss": -25.18565559387207, "global_step": 297121, "epoch": 3579} {"train_loss": -25.399688720703125, "global_step": 297122, "epoch": 3579} {"train_loss": -25.782957077026367, "global_step": 297123, "epoch": 3579} {"train_loss": -25.28329849243164, "global_step": 297124, "epoch": 3579} {"train_loss": -25.0513973236084, "global_step": 297125, "epoch": 3579} {"train_loss": -25.84983253479004, "global_step": 297126, "epoch": 3579} {"train_loss": -25.391752243041992, "global_step": 297127, "epoch": 3579} {"train_loss": -25.09865379333496, "global_step": 297128, "epoch": 3579} {"train_loss": -25.730615615844727, "global_step": 297129, "epoch": 3579} {"train_loss": -25.375940322875977, "global_step": 297130, "epoch": 3579} {"train_loss": -25.491802215576172, "global_step": 297131, "epoch": 3579} {"train_loss": -25.27581214904785, "global_step": 297132, "epoch": 3579} {"train_loss": -25.577436447143555, "global_step": 297133, "epoch": 3579} {"train_loss": -25.614206314086914, "global_step": 297134, "epoch": 3579} {"train_loss": -25.612701416015625, "global_step": 297135, "epoch": 3579} {"train_loss": -25.500043869018555, "global_step": 297136, "epoch": 3579} {"train_loss": -25.56897735595703, "global_step": 297137, "epoch": 3579} {"train_loss": -25.253477096557617, "global_step": 297138, "epoch": 3579} {"train_loss": -25.42541515396302, "global_step": 297139, "epoch": 3579, "val_loss": 7190678.0} {"train_loss": -25.494993209838867, "global_step": 297140, "epoch": 3580} {"train_loss": -25.247257232666016, "global_step": 297141, "epoch": 3580} {"train_loss": -25.581392288208008, "global_step": 297142, "epoch": 3580} {"train_loss": -25.455886840820312, "global_step": 297143, "epoch": 3580} {"train_loss": -25.4595890045166, "global_step": 297144, "epoch": 3580} {"train_loss": -25.670759201049805, "global_step": 297145, "epoch": 3580} {"train_loss": -25.659452438354492, "global_step": 297146, "epoch": 3580} {"train_loss": -25.50079917907715, "global_step": 297147, "epoch": 3580} {"train_loss": -25.493677139282227, "global_step": 297148, "epoch": 3580} {"train_loss": -25.794330596923828, "global_step": 297149, "epoch": 3580} {"train_loss": -25.366247177124023, "global_step": 297150, "epoch": 3580} {"train_loss": -25.4843807220459, "global_step": 297151, "epoch": 3580} {"train_loss": -25.602025985717773, "global_step": 297152, "epoch": 3580} {"train_loss": -25.659032821655273, "global_step": 297153, "epoch": 3580} {"train_loss": -25.33909034729004, "global_step": 297154, "epoch": 3580} {"train_loss": -25.754255294799805, "global_step": 297155, "epoch": 3580} {"train_loss": -25.601369857788086, "global_step": 297156, "epoch": 3580} {"train_loss": -25.59832191467285, "global_step": 297157, "epoch": 3580} {"train_loss": -25.5173282623291, "global_step": 297158, "epoch": 3580} {"train_loss": -25.68840980529785, "global_step": 297159, "epoch": 3580} {"train_loss": -25.811059951782227, "global_step": 297160, "epoch": 3580} {"train_loss": -25.556381225585938, "global_step": 297161, "epoch": 3580} {"train_loss": -25.762439727783203, "global_step": 297162, "epoch": 3580} {"train_loss": -25.93303871154785, "global_step": 297163, "epoch": 3580} {"train_loss": -25.833988189697266, "global_step": 297164, "epoch": 3580} {"train_loss": -25.7883358001709, "global_step": 297165, "epoch": 3580} {"train_loss": -25.676294326782227, "global_step": 297166, "epoch": 3580} {"train_loss": -25.86014175415039, "global_step": 297167, "epoch": 3580} {"train_loss": -25.82832145690918, "global_step": 297168, "epoch": 3580} {"train_loss": -25.624189376831055, "global_step": 297169, "epoch": 3580} {"train_loss": -25.58108901977539, "global_step": 297170, "epoch": 3580} {"train_loss": -25.50797462463379, "global_step": 297171, "epoch": 3580} {"train_loss": -25.261716842651367, "global_step": 297172, "epoch": 3580} {"train_loss": -25.46475601196289, "global_step": 297173, "epoch": 3580} {"train_loss": -25.54340171813965, "global_step": 297174, "epoch": 3580} {"train_loss": -25.661224365234375, "global_step": 297175, "epoch": 3580} {"train_loss": -25.827335357666016, "global_step": 297176, "epoch": 3580} {"train_loss": -25.30450439453125, "global_step": 297177, "epoch": 3580} {"train_loss": -25.28733253479004, "global_step": 297178, "epoch": 3580} {"train_loss": -25.503755569458008, "global_step": 297179, "epoch": 3580} {"train_loss": -25.47952651977539, "global_step": 297180, "epoch": 3580} {"train_loss": -25.636266708374023, "global_step": 297181, "epoch": 3580} {"train_loss": -25.9199161529541, "global_step": 297182, "epoch": 3580} {"train_loss": -25.705707550048828, "global_step": 297183, "epoch": 3580} {"train_loss": -25.91330337524414, "global_step": 297184, "epoch": 3580} {"train_loss": -25.89154052734375, "global_step": 297185, "epoch": 3580} {"train_loss": -25.53211784362793, "global_step": 297186, "epoch": 3580} {"train_loss": -25.843957901000977, "global_step": 297187, "epoch": 3580} {"train_loss": -25.910795211791992, "global_step": 297188, "epoch": 3580} {"train_loss": -25.355756759643555, "global_step": 297189, "epoch": 3580} {"train_loss": -25.608129501342773, "global_step": 297190, "epoch": 3580} {"train_loss": -25.789525985717773, "global_step": 297191, "epoch": 3580} {"train_loss": -25.368457794189453, "global_step": 297192, "epoch": 3580} {"train_loss": -25.694921493530273, "global_step": 297193, "epoch": 3580} {"train_loss": -25.741901397705078, "global_step": 297194, "epoch": 3580} {"train_loss": -25.553359985351562, "global_step": 297195, "epoch": 3580} {"train_loss": -25.27150535583496, "global_step": 297196, "epoch": 3580} {"train_loss": -25.436506271362305, "global_step": 297197, "epoch": 3580} {"train_loss": -25.52427101135254, "global_step": 297198, "epoch": 3580} {"train_loss": -25.76861572265625, "global_step": 297199, "epoch": 3580} {"train_loss": -25.692041397094727, "global_step": 297200, "epoch": 3580} {"train_loss": -25.385177612304688, "global_step": 297201, "epoch": 3580} {"train_loss": -25.745412826538086, "global_step": 297202, "epoch": 3580} {"train_loss": -25.777929306030273, "global_step": 297203, "epoch": 3580} {"train_loss": -26.03754997253418, "global_step": 297204, "epoch": 3580} {"train_loss": -25.523746490478516, "global_step": 297205, "epoch": 3580} {"train_loss": -25.76348876953125, "global_step": 297206, "epoch": 3580} {"train_loss": -25.5587100982666, "global_step": 297207, "epoch": 3580} {"train_loss": -25.389719009399414, "global_step": 297208, "epoch": 3580} {"train_loss": -25.71050453186035, "global_step": 297209, "epoch": 3580} {"train_loss": -25.481922149658203, "global_step": 297210, "epoch": 3580} {"train_loss": -25.577869415283203, "global_step": 297211, "epoch": 3580} {"train_loss": -25.815214157104492, "global_step": 297212, "epoch": 3580} {"train_loss": -25.864398956298828, "global_step": 297213, "epoch": 3580} {"train_loss": -25.82732582092285, "global_step": 297214, "epoch": 3580} {"train_loss": -25.892621994018555, "global_step": 297215, "epoch": 3580} {"train_loss": -25.427209854125977, "global_step": 297216, "epoch": 3580} {"train_loss": -25.490680694580078, "global_step": 297217, "epoch": 3580} {"train_loss": -25.443096160888672, "global_step": 297218, "epoch": 3580} {"train_loss": -25.55515480041504, "global_step": 297219, "epoch": 3580} {"train_loss": -25.598011016845703, "global_step": 297220, "epoch": 3580} {"train_loss": -25.387521743774414, "global_step": 297221, "epoch": 3580} {"train_loss": -25.611873764589607, "global_step": 297222, "epoch": 3580, "val_loss": 7366963.0} {"train_loss": -24.24390411376953, "global_step": 297223, "epoch": 3581} {"train_loss": -23.60922622680664, "global_step": 297224, "epoch": 3581} {"train_loss": -24.650678634643555, "global_step": 297225, "epoch": 3581} {"train_loss": -24.367979049682617, "global_step": 297226, "epoch": 3581} {"train_loss": -24.46137046813965, "global_step": 297227, "epoch": 3581} {"train_loss": -24.640655517578125, "global_step": 297228, "epoch": 3581} {"train_loss": -25.061914443969727, "global_step": 297229, "epoch": 3581} {"train_loss": -25.0975284576416, "global_step": 297230, "epoch": 3581} {"train_loss": -25.144826889038086, "global_step": 297231, "epoch": 3581} {"train_loss": -24.867868423461914, "global_step": 297232, "epoch": 3581} {"train_loss": -25.24492835998535, "global_step": 297233, "epoch": 3581} {"train_loss": -24.813751220703125, "global_step": 297234, "epoch": 3581} {"train_loss": -25.391603469848633, "global_step": 297235, "epoch": 3581} {"train_loss": -24.881757736206055, "global_step": 297236, "epoch": 3581} {"train_loss": -25.1066951751709, "global_step": 297237, "epoch": 3581} {"train_loss": -25.26339340209961, "global_step": 297238, "epoch": 3581} {"train_loss": -24.912498474121094, "global_step": 297239, "epoch": 3581} {"train_loss": -25.240978240966797, "global_step": 297240, "epoch": 3581} {"train_loss": -25.190576553344727, "global_step": 297241, "epoch": 3581} {"train_loss": -25.133371353149414, "global_step": 297242, "epoch": 3581} {"train_loss": -25.154895782470703, "global_step": 297243, "epoch": 3581} {"train_loss": -25.3293514251709, "global_step": 297244, "epoch": 3581} {"train_loss": -25.158573150634766, "global_step": 297245, "epoch": 3581} {"train_loss": -25.494855880737305, "global_step": 297246, "epoch": 3581} {"train_loss": -24.973447799682617, "global_step": 297247, "epoch": 3581} {"train_loss": -25.6036319732666, "global_step": 297248, "epoch": 3581} {"train_loss": -25.520496368408203, "global_step": 297249, "epoch": 3581} {"train_loss": -25.476913452148438, "global_step": 297250, "epoch": 3581} {"train_loss": -25.589990615844727, "global_step": 297251, "epoch": 3581} {"train_loss": -25.464994430541992, "global_step": 297252, "epoch": 3581} {"train_loss": -25.650243759155273, "global_step": 297253, "epoch": 3581} {"train_loss": -25.55014991760254, "global_step": 297254, "epoch": 3581} {"train_loss": -25.291488647460938, "global_step": 297255, "epoch": 3581} {"train_loss": -25.401355743408203, "global_step": 297256, "epoch": 3581} {"train_loss": -25.900653839111328, "global_step": 297257, "epoch": 3581} {"train_loss": -25.29977035522461, "global_step": 297258, "epoch": 3581} {"train_loss": -25.689716339111328, "global_step": 297259, "epoch": 3581} {"train_loss": -25.89112663269043, "global_step": 297260, "epoch": 3581} {"train_loss": -25.665037155151367, "global_step": 297261, "epoch": 3581} {"train_loss": -25.494781494140625, "global_step": 297262, "epoch": 3581} {"train_loss": -25.367685317993164, "global_step": 297263, "epoch": 3581} {"train_loss": -25.910736083984375, "global_step": 297264, "epoch": 3581} {"train_loss": -25.65864372253418, "global_step": 297265, "epoch": 3581} {"train_loss": -25.8710880279541, "global_step": 297266, "epoch": 3581} {"train_loss": -25.588088989257812, "global_step": 297267, "epoch": 3581} {"train_loss": -25.40683364868164, "global_step": 297268, "epoch": 3581} {"train_loss": -25.76481056213379, "global_step": 297269, "epoch": 3581} {"train_loss": -25.64908790588379, "global_step": 297270, "epoch": 3581} {"train_loss": -25.260221481323242, "global_step": 297271, "epoch": 3581} {"train_loss": -25.91517448425293, "global_step": 297272, "epoch": 3581} {"train_loss": -25.916852951049805, "global_step": 297273, "epoch": 3581} {"train_loss": -25.64215087890625, "global_step": 297274, "epoch": 3581} {"train_loss": -26.23126220703125, "global_step": 297275, "epoch": 3581} {"train_loss": -25.96282958984375, "global_step": 297276, "epoch": 3581} {"train_loss": -25.76468849182129, "global_step": 297277, "epoch": 3581} {"train_loss": -25.8038387298584, "global_step": 297278, "epoch": 3581} {"train_loss": -25.546573638916016, "global_step": 297279, "epoch": 3581} {"train_loss": -25.85357666015625, "global_step": 297280, "epoch": 3581} {"train_loss": -25.83588218688965, "global_step": 297281, "epoch": 3581} {"train_loss": -25.576839447021484, "global_step": 297282, "epoch": 3581} {"train_loss": -25.537382125854492, "global_step": 297283, "epoch": 3581} {"train_loss": -25.521692276000977, "global_step": 297284, "epoch": 3581} {"train_loss": -25.7282772064209, "global_step": 297285, "epoch": 3581} {"train_loss": -25.54981803894043, "global_step": 297286, "epoch": 3581} {"train_loss": -25.746618270874023, "global_step": 297287, "epoch": 3581} {"train_loss": -25.794116973876953, "global_step": 297288, "epoch": 3581} {"train_loss": -26.027944564819336, "global_step": 297289, "epoch": 3581} {"train_loss": -25.54195213317871, "global_step": 297290, "epoch": 3581} {"train_loss": -25.709171295166016, "global_step": 297291, "epoch": 3581} {"train_loss": -25.760299682617188, "global_step": 297292, "epoch": 3581} {"train_loss": -25.54049301147461, "global_step": 297293, "epoch": 3581} {"train_loss": -25.792312622070312, "global_step": 297294, "epoch": 3581} {"train_loss": -25.599153518676758, "global_step": 297295, "epoch": 3581} {"train_loss": -25.658660888671875, "global_step": 297296, "epoch": 3581} {"train_loss": -25.805517196655273, "global_step": 297297, "epoch": 3581} {"train_loss": -25.621261596679688, "global_step": 297298, "epoch": 3581} {"train_loss": -25.594606399536133, "global_step": 297299, "epoch": 3581} {"train_loss": -26.14642333984375, "global_step": 297300, "epoch": 3581} {"train_loss": -25.475751876831055, "global_step": 297301, "epoch": 3581} {"train_loss": -25.364377975463867, "global_step": 297302, "epoch": 3581} {"train_loss": -25.204233169555664, "global_step": 297303, "epoch": 3581} {"train_loss": -25.233224868774414, "global_step": 297304, "epoch": 3581} {"train_loss": -25.430114378412085, "global_step": 297305, "epoch": 3581, "val_loss": 7091621.0} {"train_loss": -25.331872940063477, "global_step": 297306, "epoch": 3582} {"train_loss": -24.8123722076416, "global_step": 297307, "epoch": 3582} {"train_loss": -24.766374588012695, "global_step": 297308, "epoch": 3582} {"train_loss": -25.276071548461914, "global_step": 297309, "epoch": 3582} {"train_loss": -24.96567726135254, "global_step": 297310, "epoch": 3582} {"train_loss": -24.29351806640625, "global_step": 297311, "epoch": 3582} {"train_loss": -25.26303482055664, "global_step": 297312, "epoch": 3582} {"train_loss": -25.02444839477539, "global_step": 297313, "epoch": 3582} {"train_loss": -25.331151962280273, "global_step": 297314, "epoch": 3582} {"train_loss": -25.270648956298828, "global_step": 297315, "epoch": 3582} {"train_loss": -24.985275268554688, "global_step": 297316, "epoch": 3582} {"train_loss": -25.07406997680664, "global_step": 297317, "epoch": 3582} {"train_loss": -25.070768356323242, "global_step": 297318, "epoch": 3582} {"train_loss": -25.200153350830078, "global_step": 297319, "epoch": 3582} {"train_loss": -25.06572723388672, "global_step": 297320, "epoch": 3582} {"train_loss": -25.38606834411621, "global_step": 297321, "epoch": 3582} {"train_loss": -25.44374656677246, "global_step": 297322, "epoch": 3582} {"train_loss": -25.101821899414062, "global_step": 297323, "epoch": 3582} {"train_loss": -25.360092163085938, "global_step": 297324, "epoch": 3582} {"train_loss": -25.243783950805664, "global_step": 297325, "epoch": 3582} {"train_loss": -25.25071907043457, "global_step": 297326, "epoch": 3582} {"train_loss": -25.48150062561035, "global_step": 297327, "epoch": 3582} {"train_loss": -25.678089141845703, "global_step": 297328, "epoch": 3582} {"train_loss": -25.550275802612305, "global_step": 297329, "epoch": 3582} {"train_loss": -25.39609146118164, "global_step": 297330, "epoch": 3582} {"train_loss": -25.612842559814453, "global_step": 297331, "epoch": 3582} {"train_loss": -25.730554580688477, "global_step": 297332, "epoch": 3582} {"train_loss": -25.65936279296875, "global_step": 297333, "epoch": 3582} {"train_loss": -25.24370765686035, "global_step": 297334, "epoch": 3582} {"train_loss": -25.35512351989746, "global_step": 297335, "epoch": 3582} {"train_loss": -26.184675216674805, "global_step": 297336, "epoch": 3582} {"train_loss": -25.779367446899414, "global_step": 297337, "epoch": 3582} {"train_loss": -25.49342155456543, "global_step": 297338, "epoch": 3582} {"train_loss": -26.038732528686523, "global_step": 297339, "epoch": 3582} {"train_loss": -25.325315475463867, "global_step": 297340, "epoch": 3582} {"train_loss": -25.51741600036621, "global_step": 297341, "epoch": 3582} {"train_loss": -25.31941032409668, "global_step": 297342, "epoch": 3582} {"train_loss": -25.65631103515625, "global_step": 297343, "epoch": 3582} {"train_loss": -25.781309127807617, "global_step": 297344, "epoch": 3582} {"train_loss": -25.428030014038086, "global_step": 297345, "epoch": 3582} {"train_loss": -25.623310089111328, "global_step": 297346, "epoch": 3582} {"train_loss": -25.790115356445312, "global_step": 297347, "epoch": 3582} {"train_loss": -25.71185302734375, "global_step": 297348, "epoch": 3582} {"train_loss": -25.8998966217041, "global_step": 297349, "epoch": 3582} {"train_loss": -25.47102165222168, "global_step": 297350, "epoch": 3582} {"train_loss": -25.79535484313965, "global_step": 297351, "epoch": 3582} {"train_loss": -25.521133422851562, "global_step": 297352, "epoch": 3582} {"train_loss": -26.155492782592773, "global_step": 297353, "epoch": 3582} {"train_loss": -25.53739356994629, "global_step": 297354, "epoch": 3582} {"train_loss": -25.891050338745117, "global_step": 297355, "epoch": 3582} {"train_loss": -25.65364646911621, "global_step": 297356, "epoch": 3582} {"train_loss": -25.464109420776367, "global_step": 297357, "epoch": 3582} {"train_loss": -25.748859405517578, "global_step": 297358, "epoch": 3582} {"train_loss": -25.755517959594727, "global_step": 297359, "epoch": 3582} {"train_loss": -25.93873405456543, "global_step": 297360, "epoch": 3582} {"train_loss": -25.370817184448242, "global_step": 297361, "epoch": 3582} {"train_loss": -25.830810546875, "global_step": 297362, "epoch": 3582} {"train_loss": -25.493371963500977, "global_step": 297363, "epoch": 3582} {"train_loss": -25.57057762145996, "global_step": 297364, "epoch": 3582} {"train_loss": -25.60218620300293, "global_step": 297365, "epoch": 3582} {"train_loss": -25.84311294555664, "global_step": 297366, "epoch": 3582} {"train_loss": -25.638059616088867, "global_step": 297367, "epoch": 3582} {"train_loss": -25.007658004760742, "global_step": 297368, "epoch": 3582} {"train_loss": -25.164764404296875, "global_step": 297369, "epoch": 3582} {"train_loss": -24.763465881347656, "global_step": 297370, "epoch": 3582} {"train_loss": -25.483123779296875, "global_step": 297371, "epoch": 3582} {"train_loss": -25.926794052124023, "global_step": 297372, "epoch": 3582} {"train_loss": -25.5571346282959, "global_step": 297373, "epoch": 3582} {"train_loss": -25.341917037963867, "global_step": 297374, "epoch": 3582} {"train_loss": -24.960357666015625, "global_step": 297375, "epoch": 3582} {"train_loss": -25.44563102722168, "global_step": 297376, "epoch": 3582} {"train_loss": -25.447853088378906, "global_step": 297377, "epoch": 3582} {"train_loss": -25.355056762695312, "global_step": 297378, "epoch": 3582} {"train_loss": -25.390609741210938, "global_step": 297379, "epoch": 3582} {"train_loss": -25.25164794921875, "global_step": 297380, "epoch": 3582} {"train_loss": -25.63555335998535, "global_step": 297381, "epoch": 3582} {"train_loss": -25.391422271728516, "global_step": 297382, "epoch": 3582} {"train_loss": -25.843961715698242, "global_step": 297383, "epoch": 3582} {"train_loss": -25.373472213745117, "global_step": 297384, "epoch": 3582} {"train_loss": -25.68939781188965, "global_step": 297385, "epoch": 3582} {"train_loss": -25.56833839416504, "global_step": 297386, "epoch": 3582} {"train_loss": -25.824792861938477, "global_step": 297387, "epoch": 3582} {"train_loss": -25.444681420383684, "global_step": 297388, "epoch": 3582, "val_loss": 7122274.0} {"train_loss": -25.237226486206055, "global_step": 297389, "epoch": 3583} {"train_loss": -25.171295166015625, "global_step": 297390, "epoch": 3583} {"train_loss": -25.604528427124023, "global_step": 297391, "epoch": 3583} {"train_loss": -25.272958755493164, "global_step": 297392, "epoch": 3583} {"train_loss": -24.88826560974121, "global_step": 297393, "epoch": 3583} {"train_loss": -25.14876937866211, "global_step": 297394, "epoch": 3583} {"train_loss": -25.107040405273438, "global_step": 297395, "epoch": 3583} {"train_loss": -25.182926177978516, "global_step": 297396, "epoch": 3583} {"train_loss": -25.103025436401367, "global_step": 297397, "epoch": 3583} {"train_loss": -25.60938835144043, "global_step": 297398, "epoch": 3583} {"train_loss": -25.040864944458008, "global_step": 297399, "epoch": 3583} {"train_loss": -25.595844268798828, "global_step": 297400, "epoch": 3583} {"train_loss": -25.365325927734375, "global_step": 297401, "epoch": 3583} {"train_loss": -25.5068359375, "global_step": 297402, "epoch": 3583} {"train_loss": -25.488386154174805, "global_step": 297403, "epoch": 3583} {"train_loss": -25.528533935546875, "global_step": 297404, "epoch": 3583} {"train_loss": -25.9567813873291, "global_step": 297405, "epoch": 3583} {"train_loss": -25.602216720581055, "global_step": 297406, "epoch": 3583} {"train_loss": -25.769805908203125, "global_step": 297407, "epoch": 3583} {"train_loss": -25.7269344329834, "global_step": 297408, "epoch": 3583} {"train_loss": -25.283720016479492, "global_step": 297409, "epoch": 3583} {"train_loss": -25.282958984375, "global_step": 297410, "epoch": 3583} {"train_loss": -25.743488311767578, "global_step": 297411, "epoch": 3583} {"train_loss": -25.432477951049805, "global_step": 297412, "epoch": 3583} {"train_loss": -25.666120529174805, "global_step": 297413, "epoch": 3583} {"train_loss": -25.47491455078125, "global_step": 297414, "epoch": 3583} {"train_loss": -25.623937606811523, "global_step": 297415, "epoch": 3583} {"train_loss": -25.626211166381836, "global_step": 297416, "epoch": 3583} {"train_loss": -25.5577335357666, "global_step": 297417, "epoch": 3583} {"train_loss": -25.636962890625, "global_step": 297418, "epoch": 3583} {"train_loss": -25.488332748413086, "global_step": 297419, "epoch": 3583} {"train_loss": -25.587644577026367, "global_step": 297420, "epoch": 3583} {"train_loss": -25.7733097076416, "global_step": 297421, "epoch": 3583} {"train_loss": -25.362028121948242, "global_step": 297422, "epoch": 3583} {"train_loss": -26.037677764892578, "global_step": 297423, "epoch": 3583} {"train_loss": -25.544513702392578, "global_step": 297424, "epoch": 3583} {"train_loss": -25.564556121826172, "global_step": 297425, "epoch": 3583} {"train_loss": -25.53608512878418, "global_step": 297426, "epoch": 3583} {"train_loss": -25.36700439453125, "global_step": 297427, "epoch": 3583} {"train_loss": -25.6667423248291, "global_step": 297428, "epoch": 3583} {"train_loss": -25.705249786376953, "global_step": 297429, "epoch": 3583} {"train_loss": -25.801794052124023, "global_step": 297430, "epoch": 3583} {"train_loss": -25.58078384399414, "global_step": 297431, "epoch": 3583} {"train_loss": -25.526269912719727, "global_step": 297432, "epoch": 3583} {"train_loss": -25.3955020904541, "global_step": 297433, "epoch": 3583} {"train_loss": -25.7803897857666, "global_step": 297434, "epoch": 3583} {"train_loss": -25.64419937133789, "global_step": 297435, "epoch": 3583} {"train_loss": -25.768192291259766, "global_step": 297436, "epoch": 3583} {"train_loss": -25.487751007080078, "global_step": 297437, "epoch": 3583} {"train_loss": -25.738805770874023, "global_step": 297438, "epoch": 3583} {"train_loss": -25.88960075378418, "global_step": 297439, "epoch": 3583} {"train_loss": -25.8587703704834, "global_step": 297440, "epoch": 3583} {"train_loss": -25.645246505737305, "global_step": 297441, "epoch": 3583} {"train_loss": -25.728403091430664, "global_step": 297442, "epoch": 3583} {"train_loss": -25.78931999206543, "global_step": 297443, "epoch": 3583} {"train_loss": -25.689924240112305, "global_step": 297444, "epoch": 3583} {"train_loss": -25.63886070251465, "global_step": 297445, "epoch": 3583} {"train_loss": -25.971906661987305, "global_step": 297446, "epoch": 3583} {"train_loss": -25.653701782226562, "global_step": 297447, "epoch": 3583} {"train_loss": -24.88318634033203, "global_step": 297448, "epoch": 3583} {"train_loss": -25.328580856323242, "global_step": 297449, "epoch": 3583} {"train_loss": -25.601049423217773, "global_step": 297450, "epoch": 3583} {"train_loss": -25.556007385253906, "global_step": 297451, "epoch": 3583} {"train_loss": -25.509422302246094, "global_step": 297452, "epoch": 3583} {"train_loss": -25.48824119567871, "global_step": 297453, "epoch": 3583} {"train_loss": -25.578556060791016, "global_step": 297454, "epoch": 3583} {"train_loss": -25.718320846557617, "global_step": 297455, "epoch": 3583} {"train_loss": -25.435699462890625, "global_step": 297456, "epoch": 3583} {"train_loss": -25.341001510620117, "global_step": 297457, "epoch": 3583} {"train_loss": -25.677045822143555, "global_step": 297458, "epoch": 3583} {"train_loss": -25.744659423828125, "global_step": 297459, "epoch": 3583} {"train_loss": -25.33273696899414, "global_step": 297460, "epoch": 3583} {"train_loss": -25.900800704956055, "global_step": 297461, "epoch": 3583} {"train_loss": -25.151514053344727, "global_step": 297462, "epoch": 3583} {"train_loss": -25.355480194091797, "global_step": 297463, "epoch": 3583} {"train_loss": -25.366498947143555, "global_step": 297464, "epoch": 3583} {"train_loss": -25.431976318359375, "global_step": 297465, "epoch": 3583} {"train_loss": -25.445812225341797, "global_step": 297466, "epoch": 3583} {"train_loss": -25.679096221923828, "global_step": 297467, "epoch": 3583} {"train_loss": -25.41195297241211, "global_step": 297468, "epoch": 3583} {"train_loss": -25.9211483001709, "global_step": 297469, "epoch": 3583} {"train_loss": -25.5660457611084, "global_step": 297470, "epoch": 3583} {"train_loss": -25.551584933177534, "global_step": 297471, "epoch": 3583, "val_loss": 7204413.0} {"train_loss": -24.963836669921875, "global_step": 297472, "epoch": 3584} {"train_loss": -24.8946533203125, "global_step": 297473, "epoch": 3584} {"train_loss": -25.37618064880371, "global_step": 297474, "epoch": 3584} {"train_loss": -24.7086124420166, "global_step": 297475, "epoch": 3584} {"train_loss": -25.2386531829834, "global_step": 297476, "epoch": 3584} {"train_loss": -25.243558883666992, "global_step": 297477, "epoch": 3584} {"train_loss": -25.01089859008789, "global_step": 297478, "epoch": 3584} {"train_loss": -25.054325103759766, "global_step": 297479, "epoch": 3584} {"train_loss": -25.06277847290039, "global_step": 297480, "epoch": 3584} {"train_loss": -25.46426773071289, "global_step": 297481, "epoch": 3584} {"train_loss": -25.35135841369629, "global_step": 297482, "epoch": 3584} {"train_loss": -25.24129867553711, "global_step": 297483, "epoch": 3584} {"train_loss": -25.432382583618164, "global_step": 297484, "epoch": 3584} {"train_loss": -25.65937614440918, "global_step": 297485, "epoch": 3584} {"train_loss": -25.479494094848633, "global_step": 297486, "epoch": 3584} {"train_loss": -25.52570152282715, "global_step": 297487, "epoch": 3584} {"train_loss": -25.636585235595703, "global_step": 297488, "epoch": 3584} {"train_loss": -25.50589370727539, "global_step": 297489, "epoch": 3584} {"train_loss": -25.706863403320312, "global_step": 297490, "epoch": 3584} {"train_loss": -25.33761978149414, "global_step": 297491, "epoch": 3584} {"train_loss": -25.524450302124023, "global_step": 297492, "epoch": 3584} {"train_loss": -25.325544357299805, "global_step": 297493, "epoch": 3584} {"train_loss": -25.189151763916016, "global_step": 297494, "epoch": 3584} {"train_loss": -25.149423599243164, "global_step": 297495, "epoch": 3584} {"train_loss": -25.50021743774414, "global_step": 297496, "epoch": 3584} {"train_loss": -25.251285552978516, "global_step": 297497, "epoch": 3584} {"train_loss": -25.6283016204834, "global_step": 297498, "epoch": 3584} {"train_loss": -25.66571617126465, "global_step": 297499, "epoch": 3584} {"train_loss": -25.506591796875, "global_step": 297500, "epoch": 3584} {"train_loss": -25.300504684448242, "global_step": 297501, "epoch": 3584} {"train_loss": -26.09381675720215, "global_step": 297502, "epoch": 3584} {"train_loss": -25.7598934173584, "global_step": 297503, "epoch": 3584} {"train_loss": -25.835025787353516, "global_step": 297504, "epoch": 3584} {"train_loss": -25.9071044921875, "global_step": 297505, "epoch": 3584} {"train_loss": -25.686044692993164, "global_step": 297506, "epoch": 3584} {"train_loss": -25.813995361328125, "global_step": 297507, "epoch": 3584} {"train_loss": -26.058624267578125, "global_step": 297508, "epoch": 3584} {"train_loss": -25.674222946166992, "global_step": 297509, "epoch": 3584} {"train_loss": -25.69233512878418, "global_step": 297510, "epoch": 3584} {"train_loss": -25.97127342224121, "global_step": 297511, "epoch": 3584} {"train_loss": -25.778289794921875, "global_step": 297512, "epoch": 3584} {"train_loss": -25.8764591217041, "global_step": 297513, "epoch": 3584} {"train_loss": -25.674840927124023, "global_step": 297514, "epoch": 3584} {"train_loss": -25.419593811035156, "global_step": 297515, "epoch": 3584} {"train_loss": -25.462787628173828, "global_step": 297516, "epoch": 3584} {"train_loss": -25.766183853149414, "global_step": 297517, "epoch": 3584} {"train_loss": -25.991317749023438, "global_step": 297518, "epoch": 3584} {"train_loss": -25.753477096557617, "global_step": 297519, "epoch": 3584} {"train_loss": -25.572330474853516, "global_step": 297520, "epoch": 3584} {"train_loss": -25.88804054260254, "global_step": 297521, "epoch": 3584} {"train_loss": -25.699140548706055, "global_step": 297522, "epoch": 3584} {"train_loss": -26.090158462524414, "global_step": 297523, "epoch": 3584} {"train_loss": -25.716501235961914, "global_step": 297524, "epoch": 3584} {"train_loss": -25.600421905517578, "global_step": 297525, "epoch": 3584} {"train_loss": -25.695465087890625, "global_step": 297526, "epoch": 3584} {"train_loss": -25.954614639282227, "global_step": 297527, "epoch": 3584} {"train_loss": -25.632556915283203, "global_step": 297528, "epoch": 3584} {"train_loss": -25.64849853515625, "global_step": 297529, "epoch": 3584} {"train_loss": -26.16946792602539, "global_step": 297530, "epoch": 3584} {"train_loss": -25.852054595947266, "global_step": 297531, "epoch": 3584} {"train_loss": -25.958927154541016, "global_step": 297532, "epoch": 3584} {"train_loss": -25.6115665435791, "global_step": 297533, "epoch": 3584} {"train_loss": -26.1957950592041, "global_step": 297534, "epoch": 3584} {"train_loss": -25.832412719726562, "global_step": 297535, "epoch": 3584} {"train_loss": -25.49165916442871, "global_step": 297536, "epoch": 3584} {"train_loss": -25.861820220947266, "global_step": 297537, "epoch": 3584} {"train_loss": -25.600873947143555, "global_step": 297538, "epoch": 3584} {"train_loss": -25.47414779663086, "global_step": 297539, "epoch": 3584} {"train_loss": -25.785297393798828, "global_step": 297540, "epoch": 3584} {"train_loss": -25.525358200073242, "global_step": 297541, "epoch": 3584} {"train_loss": -25.862201690673828, "global_step": 297542, "epoch": 3584} {"train_loss": -26.032297134399414, "global_step": 297543, "epoch": 3584} {"train_loss": -25.815887451171875, "global_step": 297544, "epoch": 3584} {"train_loss": -25.316593170166016, "global_step": 297545, "epoch": 3584} {"train_loss": -25.400039672851562, "global_step": 297546, "epoch": 3584} {"train_loss": -25.089462280273438, "global_step": 297547, "epoch": 3584} {"train_loss": -24.993925094604492, "global_step": 297548, "epoch": 3584} {"train_loss": -25.304691314697266, "global_step": 297549, "epoch": 3584} {"train_loss": -25.522199630737305, "global_step": 297550, "epoch": 3584} {"train_loss": -25.760452270507812, "global_step": 297551, "epoch": 3584} {"train_loss": -25.255945205688477, "global_step": 297552, "epoch": 3584} {"train_loss": -25.667865753173828, "global_step": 297553, "epoch": 3584} {"train_loss": -25.559494409216455, "global_step": 297554, "epoch": 3584, "val_loss": 7276675.0} {"train_loss": -23.763914108276367, "global_step": 297555, "epoch": 3585} {"train_loss": -23.825241088867188, "global_step": 297556, "epoch": 3585} {"train_loss": -24.119909286499023, "global_step": 297557, "epoch": 3585} {"train_loss": -23.458999633789062, "global_step": 297558, "epoch": 3585} {"train_loss": -24.43372917175293, "global_step": 297559, "epoch": 3585} {"train_loss": -24.2286376953125, "global_step": 297560, "epoch": 3585} {"train_loss": -23.43121337890625, "global_step": 297561, "epoch": 3585} {"train_loss": -23.990522384643555, "global_step": 297562, "epoch": 3585} {"train_loss": -24.389781951904297, "global_step": 297563, "epoch": 3585} {"train_loss": -24.150562286376953, "global_step": 297564, "epoch": 3585} {"train_loss": -23.804655075073242, "global_step": 297565, "epoch": 3585} {"train_loss": -24.345218658447266, "global_step": 297566, "epoch": 3585} {"train_loss": -24.14165687561035, "global_step": 297567, "epoch": 3585} {"train_loss": -24.493711471557617, "global_step": 297568, "epoch": 3585} {"train_loss": -24.496286392211914, "global_step": 297569, "epoch": 3585} {"train_loss": -24.682628631591797, "global_step": 297570, "epoch": 3585} {"train_loss": -24.517255783081055, "global_step": 297571, "epoch": 3585} {"train_loss": -25.10686683654785, "global_step": 297572, "epoch": 3585} {"train_loss": -24.28041648864746, "global_step": 297573, "epoch": 3585} {"train_loss": -24.895219802856445, "global_step": 297574, "epoch": 3585} {"train_loss": -24.85838508605957, "global_step": 297575, "epoch": 3585} {"train_loss": -25.217092514038086, "global_step": 297576, "epoch": 3585} {"train_loss": -24.83283233642578, "global_step": 297577, "epoch": 3585} {"train_loss": -24.87495994567871, "global_step": 297578, "epoch": 3585} {"train_loss": -24.748737335205078, "global_step": 297579, "epoch": 3585} {"train_loss": -25.258045196533203, "global_step": 297580, "epoch": 3585} {"train_loss": -25.061735153198242, "global_step": 297581, "epoch": 3585} {"train_loss": -25.082860946655273, "global_step": 297582, "epoch": 3585} {"train_loss": -25.15556526184082, "global_step": 297583, "epoch": 3585} {"train_loss": -25.220670700073242, "global_step": 297584, "epoch": 3585} {"train_loss": -24.87291145324707, "global_step": 297585, "epoch": 3585} {"train_loss": -25.23198127746582, "global_step": 297586, "epoch": 3585} {"train_loss": -25.460025787353516, "global_step": 297587, "epoch": 3585} {"train_loss": -25.03272819519043, "global_step": 297588, "epoch": 3585} {"train_loss": -25.236331939697266, "global_step": 297589, "epoch": 3585} {"train_loss": -25.555419921875, "global_step": 297590, "epoch": 3585} {"train_loss": -25.14191246032715, "global_step": 297591, "epoch": 3585} {"train_loss": -25.315807342529297, "global_step": 297592, "epoch": 3585} {"train_loss": -25.48323631286621, "global_step": 297593, "epoch": 3585} {"train_loss": -25.417646408081055, "global_step": 297594, "epoch": 3585} {"train_loss": -25.07592010498047, "global_step": 297595, "epoch": 3585} {"train_loss": -25.394824981689453, "global_step": 297596, "epoch": 3585} {"train_loss": -25.534194946289062, "global_step": 297597, "epoch": 3585} {"train_loss": -25.66971206665039, "global_step": 297598, "epoch": 3585} {"train_loss": -25.820852279663086, "global_step": 297599, "epoch": 3585} {"train_loss": -25.501707077026367, "global_step": 297600, "epoch": 3585} {"train_loss": -25.35655975341797, "global_step": 297601, "epoch": 3585} {"train_loss": -25.644302368164062, "global_step": 297602, "epoch": 3585} {"train_loss": -26.35700798034668, "global_step": 297603, "epoch": 3585} {"train_loss": -25.765588760375977, "global_step": 297604, "epoch": 3585} {"train_loss": -26.03687858581543, "global_step": 297605, "epoch": 3585} {"train_loss": -25.87298011779785, "global_step": 297606, "epoch": 3585} {"train_loss": -25.461883544921875, "global_step": 297607, "epoch": 3585} {"train_loss": -25.580293655395508, "global_step": 297608, "epoch": 3585} {"train_loss": -25.487287521362305, "global_step": 297609, "epoch": 3585} {"train_loss": -25.4464168548584, "global_step": 297610, "epoch": 3585} {"train_loss": -25.854841232299805, "global_step": 297611, "epoch": 3585} {"train_loss": -25.668848037719727, "global_step": 297612, "epoch": 3585} {"train_loss": -25.882959365844727, "global_step": 297613, "epoch": 3585} {"train_loss": -25.477365493774414, "global_step": 297614, "epoch": 3585} {"train_loss": -25.467954635620117, "global_step": 297615, "epoch": 3585} {"train_loss": -25.534921646118164, "global_step": 297616, "epoch": 3585} {"train_loss": -25.531797409057617, "global_step": 297617, "epoch": 3585} {"train_loss": -25.48710060119629, "global_step": 297618, "epoch": 3585} {"train_loss": -25.6505184173584, "global_step": 297619, "epoch": 3585} {"train_loss": -25.421100616455078, "global_step": 297620, "epoch": 3585} {"train_loss": -25.61322021484375, "global_step": 297621, "epoch": 3585} {"train_loss": -25.588134765625, "global_step": 297622, "epoch": 3585} {"train_loss": -25.4003849029541, "global_step": 297623, "epoch": 3585} {"train_loss": -25.6027889251709, "global_step": 297624, "epoch": 3585} {"train_loss": -25.48280906677246, "global_step": 297625, "epoch": 3585} {"train_loss": -25.847578048706055, "global_step": 297626, "epoch": 3585} {"train_loss": -25.746387481689453, "global_step": 297627, "epoch": 3585} {"train_loss": -25.68896484375, "global_step": 297628, "epoch": 3585} {"train_loss": -25.755340576171875, "global_step": 297629, "epoch": 3585} {"train_loss": -25.685413360595703, "global_step": 297630, "epoch": 3585} {"train_loss": -25.396902084350586, "global_step": 297631, "epoch": 3585} {"train_loss": -25.740161895751953, "global_step": 297632, "epoch": 3585} {"train_loss": -25.6785945892334, "global_step": 297633, "epoch": 3585} {"train_loss": -25.313928604125977, "global_step": 297634, "epoch": 3585} {"train_loss": -25.22617530822754, "global_step": 297635, "epoch": 3585} {"train_loss": -25.50289535522461, "global_step": 297636, "epoch": 3585} {"train_loss": -25.144003511911414, "global_step": 297637, "epoch": 3585, "val_loss": 7251849.0} {"train_loss": -25.246028900146484, "global_step": 297638, "epoch": 3586} {"train_loss": -25.15834617614746, "global_step": 297639, "epoch": 3586} {"train_loss": -25.486276626586914, "global_step": 297640, "epoch": 3586} {"train_loss": -24.896263122558594, "global_step": 297641, "epoch": 3586} {"train_loss": -25.408845901489258, "global_step": 297642, "epoch": 3586} {"train_loss": -25.195926666259766, "global_step": 297643, "epoch": 3586} {"train_loss": -25.666126251220703, "global_step": 297644, "epoch": 3586} {"train_loss": -25.8153076171875, "global_step": 297645, "epoch": 3586} {"train_loss": -25.386276245117188, "global_step": 297646, "epoch": 3586} {"train_loss": -25.30160903930664, "global_step": 297647, "epoch": 3586} {"train_loss": -25.791473388671875, "global_step": 297648, "epoch": 3586} {"train_loss": -24.926034927368164, "global_step": 297649, "epoch": 3586} {"train_loss": -25.65675926208496, "global_step": 297650, "epoch": 3586} {"train_loss": -25.167461395263672, "global_step": 297651, "epoch": 3586} {"train_loss": -25.42596435546875, "global_step": 297652, "epoch": 3586} {"train_loss": -25.34128761291504, "global_step": 297653, "epoch": 3586} {"train_loss": -25.836530685424805, "global_step": 297654, "epoch": 3586} {"train_loss": -25.36142921447754, "global_step": 297655, "epoch": 3586} {"train_loss": -25.613922119140625, "global_step": 297656, "epoch": 3586} {"train_loss": -25.441593170166016, "global_step": 297657, "epoch": 3586} {"train_loss": -25.7677059173584, "global_step": 297658, "epoch": 3586} {"train_loss": -25.360519409179688, "global_step": 297659, "epoch": 3586} {"train_loss": -25.132720947265625, "global_step": 297660, "epoch": 3586} {"train_loss": -25.82366943359375, "global_step": 297661, "epoch": 3586} {"train_loss": -25.583662033081055, "global_step": 297662, "epoch": 3586} {"train_loss": -25.421079635620117, "global_step": 297663, "epoch": 3586} {"train_loss": -25.210962295532227, "global_step": 297664, "epoch": 3586} {"train_loss": -25.799732208251953, "global_step": 297665, "epoch": 3586} {"train_loss": -25.773883819580078, "global_step": 297666, "epoch": 3586} {"train_loss": -25.514814376831055, "global_step": 297667, "epoch": 3586} {"train_loss": -25.23176383972168, "global_step": 297668, "epoch": 3586} {"train_loss": -25.75542640686035, "global_step": 297669, "epoch": 3586} {"train_loss": -25.726593017578125, "global_step": 297670, "epoch": 3586} {"train_loss": -25.32489585876465, "global_step": 297671, "epoch": 3586} {"train_loss": -25.966171264648438, "global_step": 297672, "epoch": 3586} {"train_loss": -25.501361846923828, "global_step": 297673, "epoch": 3586} {"train_loss": -26.044843673706055, "global_step": 297674, "epoch": 3586} {"train_loss": -25.90462303161621, "global_step": 297675, "epoch": 3586} {"train_loss": -25.989103317260742, "global_step": 297676, "epoch": 3586} {"train_loss": -25.567285537719727, "global_step": 297677, "epoch": 3586} {"train_loss": -25.926904678344727, "global_step": 297678, "epoch": 3586} {"train_loss": -25.9303035736084, "global_step": 297679, "epoch": 3586} {"train_loss": -25.727888107299805, "global_step": 297680, "epoch": 3586} {"train_loss": -25.949054718017578, "global_step": 297681, "epoch": 3586} {"train_loss": -25.611236572265625, "global_step": 297682, "epoch": 3586} {"train_loss": -26.070829391479492, "global_step": 297683, "epoch": 3586} {"train_loss": -25.623462677001953, "global_step": 297684, "epoch": 3586} {"train_loss": -25.543031692504883, "global_step": 297685, "epoch": 3586} {"train_loss": -25.716968536376953, "global_step": 297686, "epoch": 3586} {"train_loss": -25.640838623046875, "global_step": 297687, "epoch": 3586} {"train_loss": -25.702951431274414, "global_step": 297688, "epoch": 3586} {"train_loss": -25.802860260009766, "global_step": 297689, "epoch": 3586} {"train_loss": -25.515666961669922, "global_step": 297690, "epoch": 3586} {"train_loss": -25.256839752197266, "global_step": 297691, "epoch": 3586} {"train_loss": -25.116287231445312, "global_step": 297692, "epoch": 3586} {"train_loss": -25.298795700073242, "global_step": 297693, "epoch": 3586} {"train_loss": -25.88136100769043, "global_step": 297694, "epoch": 3586} {"train_loss": -26.174039840698242, "global_step": 297695, "epoch": 3586} {"train_loss": -25.455759048461914, "global_step": 297696, "epoch": 3586} {"train_loss": -24.86078453063965, "global_step": 297697, "epoch": 3586} {"train_loss": -25.666959762573242, "global_step": 297698, "epoch": 3586} {"train_loss": -25.41864013671875, "global_step": 297699, "epoch": 3586} {"train_loss": -26.221298217773438, "global_step": 297700, "epoch": 3586} {"train_loss": -25.83808708190918, "global_step": 297701, "epoch": 3586} {"train_loss": -25.540725708007812, "global_step": 297702, "epoch": 3586} {"train_loss": -25.885059356689453, "global_step": 297703, "epoch": 3586} {"train_loss": -25.166210174560547, "global_step": 297704, "epoch": 3586} {"train_loss": -25.27322769165039, "global_step": 297705, "epoch": 3586} {"train_loss": -25.83563804626465, "global_step": 297706, "epoch": 3586} {"train_loss": -25.66315269470215, "global_step": 297707, "epoch": 3586} {"train_loss": -25.801044464111328, "global_step": 297708, "epoch": 3586} {"train_loss": -25.3594913482666, "global_step": 297709, "epoch": 3586} {"train_loss": -25.53940773010254, "global_step": 297710, "epoch": 3586} {"train_loss": -25.566444396972656, "global_step": 297711, "epoch": 3586} {"train_loss": -25.52878189086914, "global_step": 297712, "epoch": 3586} {"train_loss": -25.483144760131836, "global_step": 297713, "epoch": 3586} {"train_loss": -25.444162368774414, "global_step": 297714, "epoch": 3586} {"train_loss": -25.70810317993164, "global_step": 297715, "epoch": 3586} {"train_loss": -25.45441246032715, "global_step": 297716, "epoch": 3586} {"train_loss": -25.619083404541016, "global_step": 297717, "epoch": 3586} {"train_loss": -25.553836822509766, "global_step": 297718, "epoch": 3586} {"train_loss": -25.69156265258789, "global_step": 297719, "epoch": 3586} {"train_loss": -25.56536361970097, "global_step": 297720, "epoch": 3586, "val_loss": 7172807.0} {"train_loss": -25.342233657836914, "global_step": 297721, "epoch": 3587} {"train_loss": -24.69052505493164, "global_step": 297722, "epoch": 3587} {"train_loss": -25.303844451904297, "global_step": 297723, "epoch": 3587} {"train_loss": -24.37580680847168, "global_step": 297724, "epoch": 3587} {"train_loss": -24.932300567626953, "global_step": 297725, "epoch": 3587} {"train_loss": -24.54543113708496, "global_step": 297726, "epoch": 3587} {"train_loss": -24.968496322631836, "global_step": 297727, "epoch": 3587} {"train_loss": -24.872007369995117, "global_step": 297728, "epoch": 3587} {"train_loss": -25.247695922851562, "global_step": 297729, "epoch": 3587} {"train_loss": -24.922637939453125, "global_step": 297730, "epoch": 3587} {"train_loss": -25.1973876953125, "global_step": 297731, "epoch": 3587} {"train_loss": -25.202760696411133, "global_step": 297732, "epoch": 3587} {"train_loss": -25.016019821166992, "global_step": 297733, "epoch": 3587} {"train_loss": -25.28553581237793, "global_step": 297734, "epoch": 3587} {"train_loss": -25.369274139404297, "global_step": 297735, "epoch": 3587} {"train_loss": -25.08613395690918, "global_step": 297736, "epoch": 3587} {"train_loss": -25.384992599487305, "global_step": 297737, "epoch": 3587} {"train_loss": -25.608306884765625, "global_step": 297738, "epoch": 3587} {"train_loss": -25.227636337280273, "global_step": 297739, "epoch": 3587} {"train_loss": -25.61958122253418, "global_step": 297740, "epoch": 3587} {"train_loss": -25.306074142456055, "global_step": 297741, "epoch": 3587} {"train_loss": -25.455699920654297, "global_step": 297742, "epoch": 3587} {"train_loss": -25.236515045166016, "global_step": 297743, "epoch": 3587} {"train_loss": -25.7707576751709, "global_step": 297744, "epoch": 3587} {"train_loss": -25.579273223876953, "global_step": 297745, "epoch": 3587} {"train_loss": -25.51165199279785, "global_step": 297746, "epoch": 3587} {"train_loss": -25.464006423950195, "global_step": 297747, "epoch": 3587} {"train_loss": -25.29719352722168, "global_step": 297748, "epoch": 3587} {"train_loss": -25.92645263671875, "global_step": 297749, "epoch": 3587} {"train_loss": -25.82818603515625, "global_step": 297750, "epoch": 3587} {"train_loss": -25.35772705078125, "global_step": 297751, "epoch": 3587} {"train_loss": -25.485065460205078, "global_step": 297752, "epoch": 3587} {"train_loss": -25.321958541870117, "global_step": 297753, "epoch": 3587} {"train_loss": -25.94775390625, "global_step": 297754, "epoch": 3587} {"train_loss": -25.584993362426758, "global_step": 297755, "epoch": 3587} {"train_loss": -25.534353256225586, "global_step": 297756, "epoch": 3587} {"train_loss": -25.646942138671875, "global_step": 297757, "epoch": 3587} {"train_loss": -25.820789337158203, "global_step": 297758, "epoch": 3587} {"train_loss": -25.36714744567871, "global_step": 297759, "epoch": 3587} {"train_loss": -25.386198043823242, "global_step": 297760, "epoch": 3587} {"train_loss": -25.706655502319336, "global_step": 297761, "epoch": 3587} {"train_loss": -25.791105270385742, "global_step": 297762, "epoch": 3587} {"train_loss": -25.683446884155273, "global_step": 297763, "epoch": 3587} {"train_loss": -25.702289581298828, "global_step": 297764, "epoch": 3587} {"train_loss": -25.66607093811035, "global_step": 297765, "epoch": 3587} {"train_loss": -26.05860710144043, "global_step": 297766, "epoch": 3587} {"train_loss": -25.554548263549805, "global_step": 297767, "epoch": 3587} {"train_loss": -25.929662704467773, "global_step": 297768, "epoch": 3587} {"train_loss": -25.78700828552246, "global_step": 297769, "epoch": 3587} {"train_loss": -25.90106201171875, "global_step": 297770, "epoch": 3587} {"train_loss": -25.730520248413086, "global_step": 297771, "epoch": 3587} {"train_loss": -25.883337020874023, "global_step": 297772, "epoch": 3587} {"train_loss": -26.1801700592041, "global_step": 297773, "epoch": 3587} {"train_loss": -25.6685791015625, "global_step": 297774, "epoch": 3587} {"train_loss": -25.486207962036133, "global_step": 297775, "epoch": 3587} {"train_loss": -25.266958236694336, "global_step": 297776, "epoch": 3587} {"train_loss": -25.396404266357422, "global_step": 297777, "epoch": 3587} {"train_loss": -25.492448806762695, "global_step": 297778, "epoch": 3587} {"train_loss": -25.6113338470459, "global_step": 297779, "epoch": 3587} {"train_loss": -25.85280418395996, "global_step": 297780, "epoch": 3587} {"train_loss": -25.906726837158203, "global_step": 297781, "epoch": 3587} {"train_loss": -25.928918838500977, "global_step": 297782, "epoch": 3587} {"train_loss": -25.849225997924805, "global_step": 297783, "epoch": 3587} {"train_loss": -25.630887985229492, "global_step": 297784, "epoch": 3587} {"train_loss": -25.3441104888916, "global_step": 297785, "epoch": 3587} {"train_loss": -25.485807418823242, "global_step": 297786, "epoch": 3587} {"train_loss": -25.615528106689453, "global_step": 297787, "epoch": 3587} {"train_loss": -25.365161895751953, "global_step": 297788, "epoch": 3587} {"train_loss": -25.339895248413086, "global_step": 297789, "epoch": 3587} {"train_loss": -25.246068954467773, "global_step": 297790, "epoch": 3587} {"train_loss": -25.72687339782715, "global_step": 297791, "epoch": 3587} {"train_loss": -25.500608444213867, "global_step": 297792, "epoch": 3587} {"train_loss": -25.71742820739746, "global_step": 297793, "epoch": 3587} {"train_loss": -25.453184127807617, "global_step": 297794, "epoch": 3587} {"train_loss": -25.573139190673828, "global_step": 297795, "epoch": 3587} {"train_loss": -25.77821159362793, "global_step": 297796, "epoch": 3587} {"train_loss": -25.71234130859375, "global_step": 297797, "epoch": 3587} {"train_loss": -25.859256744384766, "global_step": 297798, "epoch": 3587} {"train_loss": -25.60187339782715, "global_step": 297799, "epoch": 3587} {"train_loss": -25.90703773498535, "global_step": 297800, "epoch": 3587} {"train_loss": -25.935571670532227, "global_step": 297801, "epoch": 3587} {"train_loss": -26.150146484375, "global_step": 297802, "epoch": 3587} {"train_loss": -25.50136432877506, "global_step": 297803, "epoch": 3587, "val_loss": 7217636.0} {"train_loss": -25.273221969604492, "global_step": 297804, "epoch": 3588} {"train_loss": -24.693357467651367, "global_step": 297805, "epoch": 3588} {"train_loss": -24.9908504486084, "global_step": 297806, "epoch": 3588} {"train_loss": -24.8671932220459, "global_step": 297807, "epoch": 3588} {"train_loss": -24.867677688598633, "global_step": 297808, "epoch": 3588} {"train_loss": -25.403671264648438, "global_step": 297809, "epoch": 3588} {"train_loss": -24.67365074157715, "global_step": 297810, "epoch": 3588} {"train_loss": -24.807950973510742, "global_step": 297811, "epoch": 3588} {"train_loss": -24.94489288330078, "global_step": 297812, "epoch": 3588} {"train_loss": -25.357017517089844, "global_step": 297813, "epoch": 3588} {"train_loss": -25.521718978881836, "global_step": 297814, "epoch": 3588} {"train_loss": -25.373437881469727, "global_step": 297815, "epoch": 3588} {"train_loss": -25.52483367919922, "global_step": 297816, "epoch": 3588} {"train_loss": -25.279396057128906, "global_step": 297817, "epoch": 3588} {"train_loss": -25.300121307373047, "global_step": 297818, "epoch": 3588} {"train_loss": -25.293045043945312, "global_step": 297819, "epoch": 3588} {"train_loss": -25.403615951538086, "global_step": 297820, "epoch": 3588} {"train_loss": -25.146718978881836, "global_step": 297821, "epoch": 3588} {"train_loss": -25.403501510620117, "global_step": 297822, "epoch": 3588} {"train_loss": -25.582563400268555, "global_step": 297823, "epoch": 3588} {"train_loss": -25.186979293823242, "global_step": 297824, "epoch": 3588} {"train_loss": -25.213552474975586, "global_step": 297825, "epoch": 3588} {"train_loss": -25.18050765991211, "global_step": 297826, "epoch": 3588} {"train_loss": -25.231338500976562, "global_step": 297827, "epoch": 3588} {"train_loss": -25.363845825195312, "global_step": 297828, "epoch": 3588} {"train_loss": -25.436477661132812, "global_step": 297829, "epoch": 3588} {"train_loss": -25.55301284790039, "global_step": 297830, "epoch": 3588} {"train_loss": -25.762435913085938, "global_step": 297831, "epoch": 3588} {"train_loss": -25.584680557250977, "global_step": 297832, "epoch": 3588} {"train_loss": -25.62776756286621, "global_step": 297833, "epoch": 3588} {"train_loss": -25.426321029663086, "global_step": 297834, "epoch": 3588} {"train_loss": -25.475168228149414, "global_step": 297835, "epoch": 3588} {"train_loss": -25.391572952270508, "global_step": 297836, "epoch": 3588} {"train_loss": -25.513952255249023, "global_step": 297837, "epoch": 3588} {"train_loss": -25.731372833251953, "global_step": 297838, "epoch": 3588} {"train_loss": -25.767166137695312, "global_step": 297839, "epoch": 3588} {"train_loss": -25.302732467651367, "global_step": 297840, "epoch": 3588} {"train_loss": -25.77797508239746, "global_step": 297841, "epoch": 3588} {"train_loss": -25.578784942626953, "global_step": 297842, "epoch": 3588} {"train_loss": -25.532470703125, "global_step": 297843, "epoch": 3588} {"train_loss": -25.61939811706543, "global_step": 297844, "epoch": 3588} {"train_loss": -25.7276554107666, "global_step": 297845, "epoch": 3588} {"train_loss": -25.52166175842285, "global_step": 297846, "epoch": 3588} {"train_loss": -25.932758331298828, "global_step": 297847, "epoch": 3588} {"train_loss": -25.442556381225586, "global_step": 297848, "epoch": 3588} {"train_loss": -25.927692413330078, "global_step": 297849, "epoch": 3588} {"train_loss": -25.794097900390625, "global_step": 297850, "epoch": 3588} {"train_loss": -25.402862548828125, "global_step": 297851, "epoch": 3588} {"train_loss": -25.661130905151367, "global_step": 297852, "epoch": 3588} {"train_loss": -25.553396224975586, "global_step": 297853, "epoch": 3588} {"train_loss": -25.858539581298828, "global_step": 297854, "epoch": 3588} {"train_loss": -26.06849479675293, "global_step": 297855, "epoch": 3588} {"train_loss": -25.673065185546875, "global_step": 297856, "epoch": 3588} {"train_loss": -25.63641929626465, "global_step": 297857, "epoch": 3588} {"train_loss": -25.681354522705078, "global_step": 297858, "epoch": 3588} {"train_loss": -26.046621322631836, "global_step": 297859, "epoch": 3588} {"train_loss": -25.8869686126709, "global_step": 297860, "epoch": 3588} {"train_loss": -25.803974151611328, "global_step": 297861, "epoch": 3588} {"train_loss": -25.54029655456543, "global_step": 297862, "epoch": 3588} {"train_loss": -25.56318473815918, "global_step": 297863, "epoch": 3588} {"train_loss": -25.64546775817871, "global_step": 297864, "epoch": 3588} {"train_loss": -25.52247428894043, "global_step": 297865, "epoch": 3588} {"train_loss": -25.879322052001953, "global_step": 297866, "epoch": 3588} {"train_loss": -26.13600730895996, "global_step": 297867, "epoch": 3588} {"train_loss": -25.852014541625977, "global_step": 297868, "epoch": 3588} {"train_loss": -26.076425552368164, "global_step": 297869, "epoch": 3588} {"train_loss": -25.761877059936523, "global_step": 297870, "epoch": 3588} {"train_loss": -25.58743667602539, "global_step": 297871, "epoch": 3588} {"train_loss": -25.398218154907227, "global_step": 297872, "epoch": 3588} {"train_loss": -25.764318466186523, "global_step": 297873, "epoch": 3588} {"train_loss": -25.410083770751953, "global_step": 297874, "epoch": 3588} {"train_loss": -25.779592514038086, "global_step": 297875, "epoch": 3588} {"train_loss": -25.55344581604004, "global_step": 297876, "epoch": 3588} {"train_loss": -25.55010986328125, "global_step": 297877, "epoch": 3588} {"train_loss": -25.48673439025879, "global_step": 297878, "epoch": 3588} {"train_loss": -25.560827255249023, "global_step": 297879, "epoch": 3588} {"train_loss": -25.409957885742188, "global_step": 297880, "epoch": 3588} {"train_loss": -25.434364318847656, "global_step": 297881, "epoch": 3588} {"train_loss": -25.48811149597168, "global_step": 297882, "epoch": 3588} {"train_loss": -25.786569595336914, "global_step": 297883, "epoch": 3588} {"train_loss": -25.4383487701416, "global_step": 297884, "epoch": 3588} {"train_loss": -25.437726974487305, "global_step": 297885, "epoch": 3588} {"train_loss": -25.495041008455207, "global_step": 297886, "epoch": 3588, "val_loss": 7213978.0} {"train_loss": -24.975446701049805, "global_step": 297887, "epoch": 3589} {"train_loss": -25.30727195739746, "global_step": 297888, "epoch": 3589} {"train_loss": -24.897171020507812, "global_step": 297889, "epoch": 3589} {"train_loss": -25.23666763305664, "global_step": 297890, "epoch": 3589} {"train_loss": -25.275287628173828, "global_step": 297891, "epoch": 3589} {"train_loss": -25.75225830078125, "global_step": 297892, "epoch": 3589} {"train_loss": -25.44649314880371, "global_step": 297893, "epoch": 3589} {"train_loss": -25.536718368530273, "global_step": 297894, "epoch": 3589} {"train_loss": -25.509763717651367, "global_step": 297895, "epoch": 3589} {"train_loss": -25.666391372680664, "global_step": 297896, "epoch": 3589} {"train_loss": -26.056615829467773, "global_step": 297897, "epoch": 3589} {"train_loss": -25.680932998657227, "global_step": 297898, "epoch": 3589} {"train_loss": -25.57197380065918, "global_step": 297899, "epoch": 3589} {"train_loss": -25.499954223632812, "global_step": 297900, "epoch": 3589} {"train_loss": -25.711130142211914, "global_step": 297901, "epoch": 3589} {"train_loss": -25.17121696472168, "global_step": 297902, "epoch": 3589} {"train_loss": -25.451147079467773, "global_step": 297903, "epoch": 3589} {"train_loss": -25.486934661865234, "global_step": 297904, "epoch": 3589} {"train_loss": -25.537656784057617, "global_step": 297905, "epoch": 3589} {"train_loss": -25.286401748657227, "global_step": 297906, "epoch": 3589} {"train_loss": -25.616613388061523, "global_step": 297907, "epoch": 3589} {"train_loss": -25.460386276245117, "global_step": 297908, "epoch": 3589} {"train_loss": -25.751789093017578, "global_step": 297909, "epoch": 3589} {"train_loss": -25.71388053894043, "global_step": 297910, "epoch": 3589} {"train_loss": -25.672880172729492, "global_step": 297911, "epoch": 3589} {"train_loss": -25.95758628845215, "global_step": 297912, "epoch": 3589} {"train_loss": -25.914398193359375, "global_step": 297913, "epoch": 3589} {"train_loss": -25.466594696044922, "global_step": 297914, "epoch": 3589} {"train_loss": -25.79861831665039, "global_step": 297915, "epoch": 3589} {"train_loss": -25.594463348388672, "global_step": 297916, "epoch": 3589} {"train_loss": -25.493528366088867, "global_step": 297917, "epoch": 3589} {"train_loss": -25.694686889648438, "global_step": 297918, "epoch": 3589} {"train_loss": -25.57992935180664, "global_step": 297919, "epoch": 3589} {"train_loss": -25.780370712280273, "global_step": 297920, "epoch": 3589} {"train_loss": -25.762990951538086, "global_step": 297921, "epoch": 3589} {"train_loss": -25.638641357421875, "global_step": 297922, "epoch": 3589} {"train_loss": -25.985700607299805, "global_step": 297923, "epoch": 3589} {"train_loss": -25.752607345581055, "global_step": 297924, "epoch": 3589} {"train_loss": -25.489173889160156, "global_step": 297925, "epoch": 3589} {"train_loss": -25.25270652770996, "global_step": 297926, "epoch": 3589} {"train_loss": -25.853961944580078, "global_step": 297927, "epoch": 3589} {"train_loss": -25.601613998413086, "global_step": 297928, "epoch": 3589} {"train_loss": -25.649816513061523, "global_step": 297929, "epoch": 3589} {"train_loss": -25.390220642089844, "global_step": 297930, "epoch": 3589} {"train_loss": -25.431177139282227, "global_step": 297931, "epoch": 3589} {"train_loss": -25.596384048461914, "global_step": 297932, "epoch": 3589} {"train_loss": -25.752918243408203, "global_step": 297933, "epoch": 3589} {"train_loss": -25.77533531188965, "global_step": 297934, "epoch": 3589} {"train_loss": -25.73383903503418, "global_step": 297935, "epoch": 3589} {"train_loss": -25.356199264526367, "global_step": 297936, "epoch": 3589} {"train_loss": -25.775854110717773, "global_step": 297937, "epoch": 3589} {"train_loss": -25.47709846496582, "global_step": 297938, "epoch": 3589} {"train_loss": -25.7948055267334, "global_step": 297939, "epoch": 3589} {"train_loss": -25.565889358520508, "global_step": 297940, "epoch": 3589} {"train_loss": -25.65726089477539, "global_step": 297941, "epoch": 3589} {"train_loss": -25.52725601196289, "global_step": 297942, "epoch": 3589} {"train_loss": -25.428180694580078, "global_step": 297943, "epoch": 3589} {"train_loss": -25.35761833190918, "global_step": 297944, "epoch": 3589} {"train_loss": -25.63832664489746, "global_step": 297945, "epoch": 3589} {"train_loss": -25.86004638671875, "global_step": 297946, "epoch": 3589} {"train_loss": -25.6118106842041, "global_step": 297947, "epoch": 3589} {"train_loss": -25.6495418548584, "global_step": 297948, "epoch": 3589} {"train_loss": -25.687631607055664, "global_step": 297949, "epoch": 3589} {"train_loss": -25.954442977905273, "global_step": 297950, "epoch": 3589} {"train_loss": -25.852575302124023, "global_step": 297951, "epoch": 3589} {"train_loss": -25.722583770751953, "global_step": 297952, "epoch": 3589} {"train_loss": -25.49652099609375, "global_step": 297953, "epoch": 3589} {"train_loss": -25.880084991455078, "global_step": 297954, "epoch": 3589} {"train_loss": -25.351917266845703, "global_step": 297955, "epoch": 3589} {"train_loss": -25.808887481689453, "global_step": 297956, "epoch": 3589} {"train_loss": -25.812040328979492, "global_step": 297957, "epoch": 3589} {"train_loss": -25.6614933013916, "global_step": 297958, "epoch": 3589} {"train_loss": -25.90166664123535, "global_step": 297959, "epoch": 3589} {"train_loss": -25.56611442565918, "global_step": 297960, "epoch": 3589} {"train_loss": -25.684329986572266, "global_step": 297961, "epoch": 3589} {"train_loss": -25.699325561523438, "global_step": 297962, "epoch": 3589} {"train_loss": -25.225080490112305, "global_step": 297963, "epoch": 3589} {"train_loss": -25.244434356689453, "global_step": 297964, "epoch": 3589} {"train_loss": -25.50713539123535, "global_step": 297965, "epoch": 3589} {"train_loss": -25.050140380859375, "global_step": 297966, "epoch": 3589} {"train_loss": -25.903045654296875, "global_step": 297967, "epoch": 3589} {"train_loss": -25.85675048828125, "global_step": 297968, "epoch": 3589} {"train_loss": -25.593982076070393, "global_step": 297969, "epoch": 3589, "val_loss": 7133491.0} {"train_loss": -24.737756729125977, "global_step": 297970, "epoch": 3590} {"train_loss": -24.577110290527344, "global_step": 297971, "epoch": 3590} {"train_loss": -25.290924072265625, "global_step": 297972, "epoch": 3590} {"train_loss": -24.411474227905273, "global_step": 297973, "epoch": 3590} {"train_loss": -25.428144454956055, "global_step": 297974, "epoch": 3590} {"train_loss": -25.019466400146484, "global_step": 297975, "epoch": 3590} {"train_loss": -24.902433395385742, "global_step": 297976, "epoch": 3590} {"train_loss": -24.976850509643555, "global_step": 297977, "epoch": 3590} {"train_loss": -25.753559112548828, "global_step": 297978, "epoch": 3590} {"train_loss": -25.262048721313477, "global_step": 297979, "epoch": 3590} {"train_loss": -25.3150577545166, "global_step": 297980, "epoch": 3590} {"train_loss": -25.311323165893555, "global_step": 297981, "epoch": 3590} {"train_loss": -25.37338638305664, "global_step": 297982, "epoch": 3590} {"train_loss": -25.199613571166992, "global_step": 297983, "epoch": 3590} {"train_loss": -25.20306968688965, "global_step": 297984, "epoch": 3590} {"train_loss": -25.42325210571289, "global_step": 297985, "epoch": 3590} {"train_loss": -25.042234420776367, "global_step": 297986, "epoch": 3590} {"train_loss": -25.237682342529297, "global_step": 297987, "epoch": 3590} {"train_loss": -25.301773071289062, "global_step": 297988, "epoch": 3590} {"train_loss": -25.5471134185791, "global_step": 297989, "epoch": 3590} {"train_loss": -25.311338424682617, "global_step": 297990, "epoch": 3590} {"train_loss": -25.403295516967773, "global_step": 297991, "epoch": 3590} {"train_loss": -25.81266212463379, "global_step": 297992, "epoch": 3590} {"train_loss": -25.540353775024414, "global_step": 297993, "epoch": 3590} {"train_loss": -25.464155197143555, "global_step": 297994, "epoch": 3590} {"train_loss": -25.67740249633789, "global_step": 297995, "epoch": 3590} {"train_loss": -25.48855972290039, "global_step": 297996, "epoch": 3590} {"train_loss": -25.297178268432617, "global_step": 297997, "epoch": 3590} {"train_loss": -25.661420822143555, "global_step": 297998, "epoch": 3590} {"train_loss": -25.89356803894043, "global_step": 297999, "epoch": 3590} {"train_loss": -25.436594009399414, "global_step": 298000, "epoch": 3590} {"train_loss": -25.716445922851562, "global_step": 298001, "epoch": 3590} {"train_loss": -25.83990478515625, "global_step": 298002, "epoch": 3590} {"train_loss": -25.51552391052246, "global_step": 298003, "epoch": 3590} {"train_loss": -25.892333984375, "global_step": 298004, "epoch": 3590} {"train_loss": -25.545612335205078, "global_step": 298005, "epoch": 3590} {"train_loss": -25.592086791992188, "global_step": 298006, "epoch": 3590} {"train_loss": -25.36784553527832, "global_step": 298007, "epoch": 3590} {"train_loss": -25.54109001159668, "global_step": 298008, "epoch": 3590} {"train_loss": -25.694868087768555, "global_step": 298009, "epoch": 3590} {"train_loss": -25.58425521850586, "global_step": 298010, "epoch": 3590} {"train_loss": -25.05289077758789, "global_step": 298011, "epoch": 3590} {"train_loss": -25.852018356323242, "global_step": 298012, "epoch": 3590} {"train_loss": -25.639753341674805, "global_step": 298013, "epoch": 3590} {"train_loss": -25.429128646850586, "global_step": 298014, "epoch": 3590} {"train_loss": -25.577011108398438, "global_step": 298015, "epoch": 3590} {"train_loss": -25.981225967407227, "global_step": 298016, "epoch": 3590} {"train_loss": -25.523305892944336, "global_step": 298017, "epoch": 3590} {"train_loss": -25.495325088500977, "global_step": 298018, "epoch": 3590} {"train_loss": -25.19097328186035, "global_step": 298019, "epoch": 3590} {"train_loss": -25.926620483398438, "global_step": 298020, "epoch": 3590} {"train_loss": -25.732421875, "global_step": 298021, "epoch": 3590} {"train_loss": -25.22775650024414, "global_step": 298022, "epoch": 3590} {"train_loss": -25.76626968383789, "global_step": 298023, "epoch": 3590} {"train_loss": -25.284271240234375, "global_step": 298024, "epoch": 3590} {"train_loss": -25.423782348632812, "global_step": 298025, "epoch": 3590} {"train_loss": -25.42609977722168, "global_step": 298026, "epoch": 3590} {"train_loss": -25.332632064819336, "global_step": 298027, "epoch": 3590} {"train_loss": -25.818836212158203, "global_step": 298028, "epoch": 3590} {"train_loss": -25.7188777923584, "global_step": 298029, "epoch": 3590} {"train_loss": -25.217050552368164, "global_step": 298030, "epoch": 3590} {"train_loss": -25.760282516479492, "global_step": 298031, "epoch": 3590} {"train_loss": -25.009437561035156, "global_step": 298032, "epoch": 3590} {"train_loss": -26.008756637573242, "global_step": 298033, "epoch": 3590} {"train_loss": -25.3154354095459, "global_step": 298034, "epoch": 3590} {"train_loss": -25.87158203125, "global_step": 298035, "epoch": 3590} {"train_loss": -25.533140182495117, "global_step": 298036, "epoch": 3590} {"train_loss": -25.744482040405273, "global_step": 298037, "epoch": 3590} {"train_loss": -25.80135154724121, "global_step": 298038, "epoch": 3590} {"train_loss": -25.452463150024414, "global_step": 298039, "epoch": 3590} {"train_loss": -25.734745025634766, "global_step": 298040, "epoch": 3590} {"train_loss": -25.801786422729492, "global_step": 298041, "epoch": 3590} {"train_loss": -25.21234893798828, "global_step": 298042, "epoch": 3590} {"train_loss": -25.96248435974121, "global_step": 298043, "epoch": 3590} {"train_loss": -25.686269760131836, "global_step": 298044, "epoch": 3590} {"train_loss": -25.798391342163086, "global_step": 298045, "epoch": 3590} {"train_loss": -25.663776397705078, "global_step": 298046, "epoch": 3590} {"train_loss": -25.781885147094727, "global_step": 298047, "epoch": 3590} {"train_loss": -25.808155059814453, "global_step": 298048, "epoch": 3590} {"train_loss": -25.703369140625, "global_step": 298049, "epoch": 3590} {"train_loss": -25.61191177368164, "global_step": 298050, "epoch": 3590} {"train_loss": -25.693899154663086, "global_step": 298051, "epoch": 3590} {"train_loss": -25.499153114226928, "global_step": 298052, "epoch": 3590, "val_loss": 7253625.0} {"train_loss": -25.232084274291992, "global_step": 298053, "epoch": 3591} {"train_loss": -25.37384033203125, "global_step": 298054, "epoch": 3591} {"train_loss": -25.45154571533203, "global_step": 298055, "epoch": 3591} {"train_loss": -25.549217224121094, "global_step": 298056, "epoch": 3591} {"train_loss": -25.181615829467773, "global_step": 298057, "epoch": 3591} {"train_loss": -25.505313873291016, "global_step": 298058, "epoch": 3591} {"train_loss": -25.711078643798828, "global_step": 298059, "epoch": 3591} {"train_loss": -25.422317504882812, "global_step": 298060, "epoch": 3591} {"train_loss": -24.90444564819336, "global_step": 298061, "epoch": 3591} {"train_loss": -25.244909286499023, "global_step": 298062, "epoch": 3591} {"train_loss": -25.509830474853516, "global_step": 298063, "epoch": 3591} {"train_loss": -25.373159408569336, "global_step": 298064, "epoch": 3591} {"train_loss": -25.519046783447266, "global_step": 298065, "epoch": 3591} {"train_loss": -25.44841194152832, "global_step": 298066, "epoch": 3591} {"train_loss": -25.087182998657227, "global_step": 298067, "epoch": 3591} {"train_loss": -25.317686080932617, "global_step": 298068, "epoch": 3591} {"train_loss": -25.719709396362305, "global_step": 298069, "epoch": 3591} {"train_loss": -25.30472183227539, "global_step": 298070, "epoch": 3591} {"train_loss": -25.596881866455078, "global_step": 298071, "epoch": 3591} {"train_loss": -25.6102294921875, "global_step": 298072, "epoch": 3591} {"train_loss": -25.127643585205078, "global_step": 298073, "epoch": 3591} {"train_loss": -25.800281524658203, "global_step": 298074, "epoch": 3591} {"train_loss": -25.819442749023438, "global_step": 298075, "epoch": 3591} {"train_loss": -25.198118209838867, "global_step": 298076, "epoch": 3591} {"train_loss": -25.300046920776367, "global_step": 298077, "epoch": 3591} {"train_loss": -25.894657135009766, "global_step": 298078, "epoch": 3591} {"train_loss": -25.977771759033203, "global_step": 298079, "epoch": 3591} {"train_loss": -25.23533058166504, "global_step": 298080, "epoch": 3591} {"train_loss": -25.688623428344727, "global_step": 298081, "epoch": 3591} {"train_loss": -25.51374626159668, "global_step": 298082, "epoch": 3591} {"train_loss": -25.876728057861328, "global_step": 298083, "epoch": 3591} {"train_loss": -25.294479370117188, "global_step": 298084, "epoch": 3591} {"train_loss": -25.624662399291992, "global_step": 298085, "epoch": 3591} {"train_loss": -25.399768829345703, "global_step": 298086, "epoch": 3591} {"train_loss": -25.77178382873535, "global_step": 298087, "epoch": 3591} {"train_loss": -25.71563148498535, "global_step": 298088, "epoch": 3591} {"train_loss": -25.517677307128906, "global_step": 298089, "epoch": 3591} {"train_loss": -25.650426864624023, "global_step": 298090, "epoch": 3591} {"train_loss": -25.51749038696289, "global_step": 298091, "epoch": 3591} {"train_loss": -25.429136276245117, "global_step": 298092, "epoch": 3591} {"train_loss": -25.351163864135742, "global_step": 298093, "epoch": 3591} {"train_loss": -25.42146873474121, "global_step": 298094, "epoch": 3591} {"train_loss": -25.510684967041016, "global_step": 298095, "epoch": 3591} {"train_loss": -25.58799934387207, "global_step": 298096, "epoch": 3591} {"train_loss": -25.6641845703125, "global_step": 298097, "epoch": 3591} {"train_loss": -25.538320541381836, "global_step": 298098, "epoch": 3591} {"train_loss": -25.82305335998535, "global_step": 298099, "epoch": 3591} {"train_loss": -25.664045333862305, "global_step": 298100, "epoch": 3591} {"train_loss": -25.736913681030273, "global_step": 298101, "epoch": 3591} {"train_loss": -25.516780853271484, "global_step": 298102, "epoch": 3591} {"train_loss": -25.544414520263672, "global_step": 298103, "epoch": 3591} {"train_loss": -25.729461669921875, "global_step": 298104, "epoch": 3591} {"train_loss": -25.984149932861328, "global_step": 298105, "epoch": 3591} {"train_loss": -25.58367347717285, "global_step": 298106, "epoch": 3591} {"train_loss": -25.698837280273438, "global_step": 298107, "epoch": 3591} {"train_loss": -25.946582794189453, "global_step": 298108, "epoch": 3591} {"train_loss": -25.38204002380371, "global_step": 298109, "epoch": 3591} {"train_loss": -25.73465347290039, "global_step": 298110, "epoch": 3591} {"train_loss": -25.583871841430664, "global_step": 298111, "epoch": 3591} {"train_loss": -25.161237716674805, "global_step": 298112, "epoch": 3591} {"train_loss": -25.477514266967773, "global_step": 298113, "epoch": 3591} {"train_loss": -25.73054313659668, "global_step": 298114, "epoch": 3591} {"train_loss": -25.70295524597168, "global_step": 298115, "epoch": 3591} {"train_loss": -25.379987716674805, "global_step": 298116, "epoch": 3591} {"train_loss": -25.55316162109375, "global_step": 298117, "epoch": 3591} {"train_loss": -25.377241134643555, "global_step": 298118, "epoch": 3591} {"train_loss": -25.736318588256836, "global_step": 298119, "epoch": 3591} {"train_loss": -25.806964874267578, "global_step": 298120, "epoch": 3591} {"train_loss": -25.76962661743164, "global_step": 298121, "epoch": 3591} {"train_loss": -25.774967193603516, "global_step": 298122, "epoch": 3591} {"train_loss": -25.93037223815918, "global_step": 298123, "epoch": 3591} {"train_loss": -25.412263870239258, "global_step": 298124, "epoch": 3591} {"train_loss": -25.480091094970703, "global_step": 298125, "epoch": 3591} {"train_loss": -25.574888229370117, "global_step": 298126, "epoch": 3591} {"train_loss": -25.576658248901367, "global_step": 298127, "epoch": 3591} {"train_loss": -25.24676513671875, "global_step": 298128, "epoch": 3591} {"train_loss": -25.497270584106445, "global_step": 298129, "epoch": 3591} {"train_loss": -25.68122673034668, "global_step": 298130, "epoch": 3591} {"train_loss": -25.731321334838867, "global_step": 298131, "epoch": 3591} {"train_loss": -25.939746856689453, "global_step": 298132, "epoch": 3591} {"train_loss": -25.46671485900879, "global_step": 298133, "epoch": 3591} {"train_loss": -25.673871994018555, "global_step": 298134, "epoch": 3591} {"train_loss": -25.544958459325585, "global_step": 298135, "epoch": 3591, "val_loss": 7059835.0} {"train_loss": -24.905887603759766, "global_step": 298136, "epoch": 3592} {"train_loss": -25.08109474182129, "global_step": 298137, "epoch": 3592} {"train_loss": -25.371585845947266, "global_step": 298138, "epoch": 3592} {"train_loss": -25.158397674560547, "global_step": 298139, "epoch": 3592} {"train_loss": -25.340351104736328, "global_step": 298140, "epoch": 3592} {"train_loss": -25.59838104248047, "global_step": 298141, "epoch": 3592} {"train_loss": -25.160619735717773, "global_step": 298142, "epoch": 3592} {"train_loss": -25.207712173461914, "global_step": 298143, "epoch": 3592} {"train_loss": -25.436494827270508, "global_step": 298144, "epoch": 3592} {"train_loss": -25.8435001373291, "global_step": 298145, "epoch": 3592} {"train_loss": -25.51984214782715, "global_step": 298146, "epoch": 3592} {"train_loss": -25.83271598815918, "global_step": 298147, "epoch": 3592} {"train_loss": -25.28904151916504, "global_step": 298148, "epoch": 3592} {"train_loss": -25.541208267211914, "global_step": 298149, "epoch": 3592} {"train_loss": -25.56136131286621, "global_step": 298150, "epoch": 3592} {"train_loss": -25.46024513244629, "global_step": 298151, "epoch": 3592} {"train_loss": -25.655261993408203, "global_step": 298152, "epoch": 3592} {"train_loss": -25.673938751220703, "global_step": 298153, "epoch": 3592} {"train_loss": -25.682764053344727, "global_step": 298154, "epoch": 3592} {"train_loss": -25.582584381103516, "global_step": 298155, "epoch": 3592} {"train_loss": -25.43987464904785, "global_step": 298156, "epoch": 3592} {"train_loss": -25.53618621826172, "global_step": 298157, "epoch": 3592} {"train_loss": -25.485681533813477, "global_step": 298158, "epoch": 3592} {"train_loss": -25.875354766845703, "global_step": 298159, "epoch": 3592} {"train_loss": -25.658315658569336, "global_step": 298160, "epoch": 3592} {"train_loss": -25.467336654663086, "global_step": 298161, "epoch": 3592} {"train_loss": -25.651498794555664, "global_step": 298162, "epoch": 3592} {"train_loss": -25.8754825592041, "global_step": 298163, "epoch": 3592} {"train_loss": -25.85324478149414, "global_step": 298164, "epoch": 3592} {"train_loss": -25.779626846313477, "global_step": 298165, "epoch": 3592} {"train_loss": -25.523548126220703, "global_step": 298166, "epoch": 3592} {"train_loss": -25.74236488342285, "global_step": 298167, "epoch": 3592} {"train_loss": -25.922208786010742, "global_step": 298168, "epoch": 3592} {"train_loss": -25.74226188659668, "global_step": 298169, "epoch": 3592} {"train_loss": -25.668729782104492, "global_step": 298170, "epoch": 3592} {"train_loss": -25.397947311401367, "global_step": 298171, "epoch": 3592} {"train_loss": -25.292348861694336, "global_step": 298172, "epoch": 3592} {"train_loss": -25.14055824279785, "global_step": 298173, "epoch": 3592} {"train_loss": -25.170957565307617, "global_step": 298174, "epoch": 3592} {"train_loss": -25.32010269165039, "global_step": 298175, "epoch": 3592} {"train_loss": -25.559762954711914, "global_step": 298176, "epoch": 3592} {"train_loss": -25.034568786621094, "global_step": 298177, "epoch": 3592} {"train_loss": -25.099069595336914, "global_step": 298178, "epoch": 3592} {"train_loss": -25.48550796508789, "global_step": 298179, "epoch": 3592} {"train_loss": -25.2202091217041, "global_step": 298180, "epoch": 3592} {"train_loss": -25.429428100585938, "global_step": 298181, "epoch": 3592} {"train_loss": -25.770780563354492, "global_step": 298182, "epoch": 3592} {"train_loss": -25.679824829101562, "global_step": 298183, "epoch": 3592} {"train_loss": -25.298730850219727, "global_step": 298184, "epoch": 3592} {"train_loss": -25.55961036682129, "global_step": 298185, "epoch": 3592} {"train_loss": -24.915241241455078, "global_step": 298186, "epoch": 3592} {"train_loss": -25.517911911010742, "global_step": 298187, "epoch": 3592} {"train_loss": -25.768457412719727, "global_step": 298188, "epoch": 3592} {"train_loss": -25.55723762512207, "global_step": 298189, "epoch": 3592} {"train_loss": -25.65662956237793, "global_step": 298190, "epoch": 3592} {"train_loss": -25.40669059753418, "global_step": 298191, "epoch": 3592} {"train_loss": -26.026914596557617, "global_step": 298192, "epoch": 3592} {"train_loss": -25.643823623657227, "global_step": 298193, "epoch": 3592} {"train_loss": -25.322921752929688, "global_step": 298194, "epoch": 3592} {"train_loss": -25.52028465270996, "global_step": 298195, "epoch": 3592} {"train_loss": -25.574481964111328, "global_step": 298196, "epoch": 3592} {"train_loss": -25.830677032470703, "global_step": 298197, "epoch": 3592} {"train_loss": -25.44133949279785, "global_step": 298198, "epoch": 3592} {"train_loss": -25.541339874267578, "global_step": 298199, "epoch": 3592} {"train_loss": -25.359455108642578, "global_step": 298200, "epoch": 3592} {"train_loss": -25.82259178161621, "global_step": 298201, "epoch": 3592} {"train_loss": -25.850452423095703, "global_step": 298202, "epoch": 3592} {"train_loss": -25.696985244750977, "global_step": 298203, "epoch": 3592} {"train_loss": -25.883188247680664, "global_step": 298204, "epoch": 3592} {"train_loss": -25.6010799407959, "global_step": 298205, "epoch": 3592} {"train_loss": -25.869129180908203, "global_step": 298206, "epoch": 3592} {"train_loss": -26.068586349487305, "global_step": 298207, "epoch": 3592} {"train_loss": -26.002948760986328, "global_step": 298208, "epoch": 3592} {"train_loss": -25.8326473236084, "global_step": 298209, "epoch": 3592} {"train_loss": -25.820037841796875, "global_step": 298210, "epoch": 3592} {"train_loss": -25.7594051361084, "global_step": 298211, "epoch": 3592} {"train_loss": -26.07525062561035, "global_step": 298212, "epoch": 3592} {"train_loss": -25.6981258392334, "global_step": 298213, "epoch": 3592} {"train_loss": -25.461780548095703, "global_step": 298214, "epoch": 3592} {"train_loss": -24.606374740600586, "global_step": 298215, "epoch": 3592} {"train_loss": -25.152738571166992, "global_step": 298216, "epoch": 3592} {"train_loss": -24.79958152770996, "global_step": 298217, "epoch": 3592} {"train_loss": -25.532661644809217, "global_step": 298218, "epoch": 3592, "val_loss": 7215637.5} {"train_loss": -24.547060012817383, "global_step": 298219, "epoch": 3593} {"train_loss": -24.798185348510742, "global_step": 298220, "epoch": 3593} {"train_loss": -23.690587997436523, "global_step": 298221, "epoch": 3593} {"train_loss": -24.970569610595703, "global_step": 298222, "epoch": 3593} {"train_loss": -24.567312240600586, "global_step": 298223, "epoch": 3593} {"train_loss": -24.023771286010742, "global_step": 298224, "epoch": 3593} {"train_loss": -24.877206802368164, "global_step": 298225, "epoch": 3593} {"train_loss": -24.69346046447754, "global_step": 298226, "epoch": 3593} {"train_loss": -24.405960083007812, "global_step": 298227, "epoch": 3593} {"train_loss": -24.781339645385742, "global_step": 298228, "epoch": 3593} {"train_loss": -24.907318115234375, "global_step": 298229, "epoch": 3593} {"train_loss": -24.541839599609375, "global_step": 298230, "epoch": 3593} {"train_loss": -24.972244262695312, "global_step": 298231, "epoch": 3593} {"train_loss": -24.832334518432617, "global_step": 298232, "epoch": 3593} {"train_loss": -25.04388999938965, "global_step": 298233, "epoch": 3593} {"train_loss": -24.867694854736328, "global_step": 298234, "epoch": 3593} {"train_loss": -24.66510009765625, "global_step": 298235, "epoch": 3593} {"train_loss": -25.37624168395996, "global_step": 298236, "epoch": 3593} {"train_loss": -25.134469985961914, "global_step": 298237, "epoch": 3593} {"train_loss": -24.808645248413086, "global_step": 298238, "epoch": 3593} {"train_loss": -25.470579147338867, "global_step": 298239, "epoch": 3593} {"train_loss": -25.203107833862305, "global_step": 298240, "epoch": 3593} {"train_loss": -25.178741455078125, "global_step": 298241, "epoch": 3593} {"train_loss": -25.208078384399414, "global_step": 298242, "epoch": 3593} {"train_loss": -25.076690673828125, "global_step": 298243, "epoch": 3593} {"train_loss": -25.434446334838867, "global_step": 298244, "epoch": 3593} {"train_loss": -25.48787498474121, "global_step": 298245, "epoch": 3593} {"train_loss": -25.59667205810547, "global_step": 298246, "epoch": 3593} {"train_loss": -25.247379302978516, "global_step": 298247, "epoch": 3593} {"train_loss": -25.522998809814453, "global_step": 298248, "epoch": 3593} {"train_loss": -24.83916664123535, "global_step": 298249, "epoch": 3593} {"train_loss": -25.31135368347168, "global_step": 298250, "epoch": 3593} {"train_loss": -24.99806022644043, "global_step": 298251, "epoch": 3593} {"train_loss": -25.42296028137207, "global_step": 298252, "epoch": 3593} {"train_loss": -25.684650421142578, "global_step": 298253, "epoch": 3593} {"train_loss": -25.61405372619629, "global_step": 298254, "epoch": 3593} {"train_loss": -25.7413272857666, "global_step": 298255, "epoch": 3593} {"train_loss": -25.264272689819336, "global_step": 298256, "epoch": 3593} {"train_loss": -24.96110725402832, "global_step": 298257, "epoch": 3593} {"train_loss": -25.39776611328125, "global_step": 298258, "epoch": 3593} {"train_loss": -25.669004440307617, "global_step": 298259, "epoch": 3593} {"train_loss": -25.247644424438477, "global_step": 298260, "epoch": 3593} {"train_loss": -25.393512725830078, "global_step": 298261, "epoch": 3593} {"train_loss": -25.790937423706055, "global_step": 298262, "epoch": 3593} {"train_loss": -25.9068660736084, "global_step": 298263, "epoch": 3593} {"train_loss": -25.628080368041992, "global_step": 298264, "epoch": 3593} {"train_loss": -25.6378231048584, "global_step": 298265, "epoch": 3593} {"train_loss": -25.55182456970215, "global_step": 298266, "epoch": 3593} {"train_loss": -25.373167037963867, "global_step": 298267, "epoch": 3593} {"train_loss": -25.628620147705078, "global_step": 298268, "epoch": 3593} {"train_loss": -25.73078727722168, "global_step": 298269, "epoch": 3593} {"train_loss": -25.8380069732666, "global_step": 298270, "epoch": 3593} {"train_loss": -25.60342788696289, "global_step": 298271, "epoch": 3593} {"train_loss": -25.811725616455078, "global_step": 298272, "epoch": 3593} {"train_loss": -25.665985107421875, "global_step": 298273, "epoch": 3593} {"train_loss": -25.588592529296875, "global_step": 298274, "epoch": 3593} {"train_loss": -25.61689567565918, "global_step": 298275, "epoch": 3593} {"train_loss": -25.263826370239258, "global_step": 298276, "epoch": 3593} {"train_loss": -25.478960037231445, "global_step": 298277, "epoch": 3593} {"train_loss": -25.650089263916016, "global_step": 298278, "epoch": 3593} {"train_loss": -25.771503448486328, "global_step": 298279, "epoch": 3593} {"train_loss": -25.58625602722168, "global_step": 298280, "epoch": 3593} {"train_loss": -25.689050674438477, "global_step": 298281, "epoch": 3593} {"train_loss": -25.630615234375, "global_step": 298282, "epoch": 3593} {"train_loss": -25.644643783569336, "global_step": 298283, "epoch": 3593} {"train_loss": -25.570209503173828, "global_step": 298284, "epoch": 3593} {"train_loss": -25.99435806274414, "global_step": 298285, "epoch": 3593} {"train_loss": -25.985107421875, "global_step": 298286, "epoch": 3593} {"train_loss": -25.66596031188965, "global_step": 298287, "epoch": 3593} {"train_loss": -25.717742919921875, "global_step": 298288, "epoch": 3593} {"train_loss": -25.80860710144043, "global_step": 298289, "epoch": 3593} {"train_loss": -25.856109619140625, "global_step": 298290, "epoch": 3593} {"train_loss": -25.68141746520996, "global_step": 298291, "epoch": 3593} {"train_loss": -25.410066604614258, "global_step": 298292, "epoch": 3593} {"train_loss": -25.535524368286133, "global_step": 298293, "epoch": 3593} {"train_loss": -25.67547607421875, "global_step": 298294, "epoch": 3593} {"train_loss": -25.77666664123535, "global_step": 298295, "epoch": 3593} {"train_loss": -26.018768310546875, "global_step": 298296, "epoch": 3593} {"train_loss": -25.598121643066406, "global_step": 298297, "epoch": 3593} {"train_loss": -25.71736717224121, "global_step": 298298, "epoch": 3593} {"train_loss": -25.50194549560547, "global_step": 298299, "epoch": 3593} {"train_loss": -25.74117088317871, "global_step": 298300, "epoch": 3593} {"train_loss": -25.370522234813276, "global_step": 298301, "epoch": 3593, "val_loss": 7233695.5} {"train_loss": -24.33524513244629, "global_step": 298302, "epoch": 3594} {"train_loss": -24.0698184967041, "global_step": 298303, "epoch": 3594} {"train_loss": -24.551542282104492, "global_step": 298304, "epoch": 3594} {"train_loss": -25.507043838500977, "global_step": 298305, "epoch": 3594} {"train_loss": -24.56178855895996, "global_step": 298306, "epoch": 3594} {"train_loss": -24.660795211791992, "global_step": 298307, "epoch": 3594} {"train_loss": -25.596481323242188, "global_step": 298308, "epoch": 3594} {"train_loss": -24.449066162109375, "global_step": 298309, "epoch": 3594} {"train_loss": -25.13978385925293, "global_step": 298310, "epoch": 3594} {"train_loss": -25.024024963378906, "global_step": 298311, "epoch": 3594} {"train_loss": -25.223480224609375, "global_step": 298312, "epoch": 3594} {"train_loss": -24.673561096191406, "global_step": 298313, "epoch": 3594} {"train_loss": -24.92209815979004, "global_step": 298314, "epoch": 3594} {"train_loss": -25.026357650756836, "global_step": 298315, "epoch": 3594} {"train_loss": -25.31471061706543, "global_step": 298316, "epoch": 3594} {"train_loss": -24.94165802001953, "global_step": 298317, "epoch": 3594} {"train_loss": -25.096969604492188, "global_step": 298318, "epoch": 3594} {"train_loss": -25.3906192779541, "global_step": 298319, "epoch": 3594} {"train_loss": -25.175119400024414, "global_step": 298320, "epoch": 3594} {"train_loss": -25.061853408813477, "global_step": 298321, "epoch": 3594} {"train_loss": -24.839094161987305, "global_step": 298322, "epoch": 3594} {"train_loss": -25.31007957458496, "global_step": 298323, "epoch": 3594} {"train_loss": -25.14830207824707, "global_step": 298324, "epoch": 3594} {"train_loss": -25.463674545288086, "global_step": 298325, "epoch": 3594} {"train_loss": -25.550048828125, "global_step": 298326, "epoch": 3594} {"train_loss": -25.714740753173828, "global_step": 298327, "epoch": 3594} {"train_loss": -25.019201278686523, "global_step": 298328, "epoch": 3594} {"train_loss": -25.491504669189453, "global_step": 298329, "epoch": 3594} {"train_loss": -25.245458602905273, "global_step": 298330, "epoch": 3594} {"train_loss": -25.536705017089844, "global_step": 298331, "epoch": 3594} {"train_loss": -25.542423248291016, "global_step": 298332, "epoch": 3594} {"train_loss": -25.447467803955078, "global_step": 298333, "epoch": 3594} {"train_loss": -25.935449600219727, "global_step": 298334, "epoch": 3594} {"train_loss": -25.577245712280273, "global_step": 298335, "epoch": 3594} {"train_loss": -25.449522018432617, "global_step": 298336, "epoch": 3594} {"train_loss": -25.729246139526367, "global_step": 298337, "epoch": 3594} {"train_loss": -25.528894424438477, "global_step": 298338, "epoch": 3594} {"train_loss": -25.439233779907227, "global_step": 298339, "epoch": 3594} {"train_loss": -25.588361740112305, "global_step": 298340, "epoch": 3594} {"train_loss": -25.784921646118164, "global_step": 298341, "epoch": 3594} {"train_loss": -25.624969482421875, "global_step": 298342, "epoch": 3594} {"train_loss": -25.69944190979004, "global_step": 298343, "epoch": 3594} {"train_loss": -25.828283309936523, "global_step": 298344, "epoch": 3594} {"train_loss": -26.16304588317871, "global_step": 298345, "epoch": 3594} {"train_loss": -25.7115421295166, "global_step": 298346, "epoch": 3594} {"train_loss": -25.467496871948242, "global_step": 298347, "epoch": 3594} {"train_loss": -25.229461669921875, "global_step": 298348, "epoch": 3594} {"train_loss": -25.497465133666992, "global_step": 298349, "epoch": 3594} {"train_loss": -25.816495895385742, "global_step": 298350, "epoch": 3594} {"train_loss": -25.64794921875, "global_step": 298351, "epoch": 3594} {"train_loss": -25.855817794799805, "global_step": 298352, "epoch": 3594} {"train_loss": -25.362424850463867, "global_step": 298353, "epoch": 3594} {"train_loss": -25.45638084411621, "global_step": 298354, "epoch": 3594} {"train_loss": -25.716785430908203, "global_step": 298355, "epoch": 3594} {"train_loss": -25.383581161499023, "global_step": 298356, "epoch": 3594} {"train_loss": -25.304832458496094, "global_step": 298357, "epoch": 3594} {"train_loss": -25.61005973815918, "global_step": 298358, "epoch": 3594} {"train_loss": -26.127195358276367, "global_step": 298359, "epoch": 3594} {"train_loss": -25.499658584594727, "global_step": 298360, "epoch": 3594} {"train_loss": -25.827838897705078, "global_step": 298361, "epoch": 3594} {"train_loss": -25.8531551361084, "global_step": 298362, "epoch": 3594} {"train_loss": -25.283658981323242, "global_step": 298363, "epoch": 3594} {"train_loss": -25.212522506713867, "global_step": 298364, "epoch": 3594} {"train_loss": -25.636667251586914, "global_step": 298365, "epoch": 3594} {"train_loss": -25.575414657592773, "global_step": 298366, "epoch": 3594} {"train_loss": -25.856061935424805, "global_step": 298367, "epoch": 3594} {"train_loss": -25.464889526367188, "global_step": 298368, "epoch": 3594} {"train_loss": -25.498376846313477, "global_step": 298369, "epoch": 3594} {"train_loss": -25.31511688232422, "global_step": 298370, "epoch": 3594} {"train_loss": -25.62204360961914, "global_step": 298371, "epoch": 3594} {"train_loss": -25.905797958374023, "global_step": 298372, "epoch": 3594} {"train_loss": -25.276493072509766, "global_step": 298373, "epoch": 3594} {"train_loss": -24.89628791809082, "global_step": 298374, "epoch": 3594} {"train_loss": -24.956825256347656, "global_step": 298375, "epoch": 3594} {"train_loss": -25.61359977722168, "global_step": 298376, "epoch": 3594} {"train_loss": -26.094831466674805, "global_step": 298377, "epoch": 3594} {"train_loss": -25.272024154663086, "global_step": 298378, "epoch": 3594} {"train_loss": -26.03729820251465, "global_step": 298379, "epoch": 3594} {"train_loss": -25.523670196533203, "global_step": 298380, "epoch": 3594} {"train_loss": -25.464073181152344, "global_step": 298381, "epoch": 3594} {"train_loss": -25.48505973815918, "global_step": 298382, "epoch": 3594} {"train_loss": -25.642297744750977, "global_step": 298383, "epoch": 3594} {"train_loss": -25.399270184068794, "global_step": 298384, "epoch": 3594, "val_loss": 7101676.0} {"train_loss": -25.0753116607666, "global_step": 298385, "epoch": 3595} {"train_loss": -25.05190086364746, "global_step": 298386, "epoch": 3595} {"train_loss": -25.38545799255371, "global_step": 298387, "epoch": 3595} {"train_loss": -24.97612953186035, "global_step": 298388, "epoch": 3595} {"train_loss": -25.029678344726562, "global_step": 298389, "epoch": 3595} {"train_loss": -25.153955459594727, "global_step": 298390, "epoch": 3595} {"train_loss": -25.414539337158203, "global_step": 298391, "epoch": 3595} {"train_loss": -24.947467803955078, "global_step": 298392, "epoch": 3595} {"train_loss": -25.501331329345703, "global_step": 298393, "epoch": 3595} {"train_loss": -25.33442497253418, "global_step": 298394, "epoch": 3595} {"train_loss": -25.191823959350586, "global_step": 298395, "epoch": 3595} {"train_loss": -25.175195693969727, "global_step": 298396, "epoch": 3595} {"train_loss": -25.667932510375977, "global_step": 298397, "epoch": 3595} {"train_loss": -25.243391036987305, "global_step": 298398, "epoch": 3595} {"train_loss": -25.541584014892578, "global_step": 298399, "epoch": 3595} {"train_loss": -25.472415924072266, "global_step": 298400, "epoch": 3595} {"train_loss": -25.126117706298828, "global_step": 298401, "epoch": 3595} {"train_loss": -25.2071590423584, "global_step": 298402, "epoch": 3595} {"train_loss": -25.48948097229004, "global_step": 298403, "epoch": 3595} {"train_loss": -25.148561477661133, "global_step": 298404, "epoch": 3595} {"train_loss": -25.358083724975586, "global_step": 298405, "epoch": 3595} {"train_loss": -25.856048583984375, "global_step": 298406, "epoch": 3595} {"train_loss": -25.488245010375977, "global_step": 298407, "epoch": 3595} {"train_loss": -25.546100616455078, "global_step": 298408, "epoch": 3595} {"train_loss": -25.179885864257812, "global_step": 298409, "epoch": 3595} {"train_loss": -25.774534225463867, "global_step": 298410, "epoch": 3595} {"train_loss": -25.663541793823242, "global_step": 298411, "epoch": 3595} {"train_loss": -25.5234317779541, "global_step": 298412, "epoch": 3595} {"train_loss": -25.668684005737305, "global_step": 298413, "epoch": 3595} {"train_loss": -25.716888427734375, "global_step": 298414, "epoch": 3595} {"train_loss": -25.482269287109375, "global_step": 298415, "epoch": 3595} {"train_loss": -25.788787841796875, "global_step": 298416, "epoch": 3595} {"train_loss": -25.686767578125, "global_step": 298417, "epoch": 3595} {"train_loss": -25.9788818359375, "global_step": 298418, "epoch": 3595} {"train_loss": -26.234838485717773, "global_step": 298419, "epoch": 3595} {"train_loss": -25.615747451782227, "global_step": 298420, "epoch": 3595} {"train_loss": -25.733991622924805, "global_step": 298421, "epoch": 3595} {"train_loss": -25.67997169494629, "global_step": 298422, "epoch": 3595} {"train_loss": -25.7096004486084, "global_step": 298423, "epoch": 3595} {"train_loss": -25.70172119140625, "global_step": 298424, "epoch": 3595} {"train_loss": -25.874197006225586, "global_step": 298425, "epoch": 3595} {"train_loss": -25.2491512298584, "global_step": 298426, "epoch": 3595} {"train_loss": -25.788389205932617, "global_step": 298427, "epoch": 3595} {"train_loss": -25.196033477783203, "global_step": 298428, "epoch": 3595} {"train_loss": -25.40256118774414, "global_step": 298429, "epoch": 3595} {"train_loss": -25.111448287963867, "global_step": 298430, "epoch": 3595} {"train_loss": -25.21956443786621, "global_step": 298431, "epoch": 3595} {"train_loss": -25.551258087158203, "global_step": 298432, "epoch": 3595} {"train_loss": -25.330535888671875, "global_step": 298433, "epoch": 3595} {"train_loss": -25.586917877197266, "global_step": 298434, "epoch": 3595} {"train_loss": -25.603979110717773, "global_step": 298435, "epoch": 3595} {"train_loss": -25.634374618530273, "global_step": 298436, "epoch": 3595} {"train_loss": -25.512041091918945, "global_step": 298437, "epoch": 3595} {"train_loss": -25.554943084716797, "global_step": 298438, "epoch": 3595} {"train_loss": -25.591690063476562, "global_step": 298439, "epoch": 3595} {"train_loss": -25.54128646850586, "global_step": 298440, "epoch": 3595} {"train_loss": -25.839893341064453, "global_step": 298441, "epoch": 3595} {"train_loss": -25.638029098510742, "global_step": 298442, "epoch": 3595} {"train_loss": -25.8311824798584, "global_step": 298443, "epoch": 3595} {"train_loss": -25.28275489807129, "global_step": 298444, "epoch": 3595} {"train_loss": -25.8387393951416, "global_step": 298445, "epoch": 3595} {"train_loss": -25.564403533935547, "global_step": 298446, "epoch": 3595} {"train_loss": -25.544363021850586, "global_step": 298447, "epoch": 3595} {"train_loss": -25.5257511138916, "global_step": 298448, "epoch": 3595} {"train_loss": -25.413984298706055, "global_step": 298449, "epoch": 3595} {"train_loss": -25.681488037109375, "global_step": 298450, "epoch": 3595} {"train_loss": -25.858997344970703, "global_step": 298451, "epoch": 3595} {"train_loss": -25.671131134033203, "global_step": 298452, "epoch": 3595} {"train_loss": -25.53316307067871, "global_step": 298453, "epoch": 3595} {"train_loss": -25.62080955505371, "global_step": 298454, "epoch": 3595} {"train_loss": -25.47857093811035, "global_step": 298455, "epoch": 3595} {"train_loss": -25.523168563842773, "global_step": 298456, "epoch": 3595} {"train_loss": -25.49873924255371, "global_step": 298457, "epoch": 3595} {"train_loss": -25.793302536010742, "global_step": 298458, "epoch": 3595} {"train_loss": -25.765745162963867, "global_step": 298459, "epoch": 3595} {"train_loss": -25.663110733032227, "global_step": 298460, "epoch": 3595} {"train_loss": -25.48639488220215, "global_step": 298461, "epoch": 3595} {"train_loss": -25.45694923400879, "global_step": 298462, "epoch": 3595} {"train_loss": -25.684009552001953, "global_step": 298463, "epoch": 3595} {"train_loss": -25.24873161315918, "global_step": 298464, "epoch": 3595} {"train_loss": -25.82086753845215, "global_step": 298465, "epoch": 3595} {"train_loss": -25.634033203125, "global_step": 298466, "epoch": 3595} {"train_loss": -25.511797939438416, "global_step": 298467, "epoch": 3595, "val_loss": 7197682.5} {"train_loss": -25.45737075805664, "global_step": 298468, "epoch": 3596} {"train_loss": -25.55573081970215, "global_step": 298469, "epoch": 3596} {"train_loss": -25.478378295898438, "global_step": 298470, "epoch": 3596} {"train_loss": -25.654027938842773, "global_step": 298471, "epoch": 3596} {"train_loss": -25.289091110229492, "global_step": 298472, "epoch": 3596} {"train_loss": -25.40997886657715, "global_step": 298473, "epoch": 3596} {"train_loss": -25.303165435791016, "global_step": 298474, "epoch": 3596} {"train_loss": -25.32714080810547, "global_step": 298475, "epoch": 3596} {"train_loss": -25.60808753967285, "global_step": 298476, "epoch": 3596} {"train_loss": -25.4031982421875, "global_step": 298477, "epoch": 3596} {"train_loss": -25.260591506958008, "global_step": 298478, "epoch": 3596} {"train_loss": -25.14044761657715, "global_step": 298479, "epoch": 3596} {"train_loss": -25.670541763305664, "global_step": 298480, "epoch": 3596} {"train_loss": -25.274093627929688, "global_step": 298481, "epoch": 3596} {"train_loss": -24.959108352661133, "global_step": 298482, "epoch": 3596} {"train_loss": -25.206073760986328, "global_step": 298483, "epoch": 3596} {"train_loss": -25.855947494506836, "global_step": 298484, "epoch": 3596} {"train_loss": -25.315004348754883, "global_step": 298485, "epoch": 3596} {"train_loss": -25.315061569213867, "global_step": 298486, "epoch": 3596} {"train_loss": -25.577272415161133, "global_step": 298487, "epoch": 3596} {"train_loss": -25.86805534362793, "global_step": 298488, "epoch": 3596} {"train_loss": -25.58246421813965, "global_step": 298489, "epoch": 3596} {"train_loss": -25.354190826416016, "global_step": 298490, "epoch": 3596} {"train_loss": -25.70171546936035, "global_step": 298491, "epoch": 3596} {"train_loss": -25.41069793701172, "global_step": 298492, "epoch": 3596} {"train_loss": -25.880910873413086, "global_step": 298493, "epoch": 3596} {"train_loss": -25.63441276550293, "global_step": 298494, "epoch": 3596} {"train_loss": -25.942564010620117, "global_step": 298495, "epoch": 3596} {"train_loss": -25.8332462310791, "global_step": 298496, "epoch": 3596} {"train_loss": -25.573272705078125, "global_step": 298497, "epoch": 3596} {"train_loss": -25.63592529296875, "global_step": 298498, "epoch": 3596} {"train_loss": -25.578004837036133, "global_step": 298499, "epoch": 3596} {"train_loss": -25.258529663085938, "global_step": 298500, "epoch": 3596} {"train_loss": -26.042280197143555, "global_step": 298501, "epoch": 3596} {"train_loss": -25.77888298034668, "global_step": 298502, "epoch": 3596} {"train_loss": -25.93739128112793, "global_step": 298503, "epoch": 3596} {"train_loss": -25.711835861206055, "global_step": 298504, "epoch": 3596} {"train_loss": -25.493057250976562, "global_step": 298505, "epoch": 3596} {"train_loss": -25.63117790222168, "global_step": 298506, "epoch": 3596} {"train_loss": -25.701099395751953, "global_step": 298507, "epoch": 3596} {"train_loss": -25.621723175048828, "global_step": 298508, "epoch": 3596} {"train_loss": -26.049591064453125, "global_step": 298509, "epoch": 3596} {"train_loss": -25.728734970092773, "global_step": 298510, "epoch": 3596} {"train_loss": -25.740142822265625, "global_step": 298511, "epoch": 3596} {"train_loss": -25.91609001159668, "global_step": 298512, "epoch": 3596} {"train_loss": -25.613813400268555, "global_step": 298513, "epoch": 3596} {"train_loss": -25.56081199645996, "global_step": 298514, "epoch": 3596} {"train_loss": -25.708288192749023, "global_step": 298515, "epoch": 3596} {"train_loss": -26.057300567626953, "global_step": 298516, "epoch": 3596} {"train_loss": -25.419065475463867, "global_step": 298517, "epoch": 3596} {"train_loss": -25.433822631835938, "global_step": 298518, "epoch": 3596} {"train_loss": -25.92896842956543, "global_step": 298519, "epoch": 3596} {"train_loss": -25.485801696777344, "global_step": 298520, "epoch": 3596} {"train_loss": -25.417478561401367, "global_step": 298521, "epoch": 3596} {"train_loss": -25.806243896484375, "global_step": 298522, "epoch": 3596} {"train_loss": -25.718774795532227, "global_step": 298523, "epoch": 3596} {"train_loss": -25.477468490600586, "global_step": 298524, "epoch": 3596} {"train_loss": -25.439239501953125, "global_step": 298525, "epoch": 3596} {"train_loss": -25.704797744750977, "global_step": 298526, "epoch": 3596} {"train_loss": -25.75275993347168, "global_step": 298527, "epoch": 3596} {"train_loss": -25.41657257080078, "global_step": 298528, "epoch": 3596} {"train_loss": -25.12087059020996, "global_step": 298529, "epoch": 3596} {"train_loss": -25.284879684448242, "global_step": 298530, "epoch": 3596} {"train_loss": -25.910785675048828, "global_step": 298531, "epoch": 3596} {"train_loss": -25.928726196289062, "global_step": 298532, "epoch": 3596} {"train_loss": -25.399763107299805, "global_step": 298533, "epoch": 3596} {"train_loss": -25.516523361206055, "global_step": 298534, "epoch": 3596} {"train_loss": -25.588645935058594, "global_step": 298535, "epoch": 3596} {"train_loss": -25.422090530395508, "global_step": 298536, "epoch": 3596} {"train_loss": -25.871301651000977, "global_step": 298537, "epoch": 3596} {"train_loss": -25.549118041992188, "global_step": 298538, "epoch": 3596} {"train_loss": -25.9086971282959, "global_step": 298539, "epoch": 3596} {"train_loss": -25.83056640625, "global_step": 298540, "epoch": 3596} {"train_loss": -25.561193466186523, "global_step": 298541, "epoch": 3596} {"train_loss": -25.48261260986328, "global_step": 298542, "epoch": 3596} {"train_loss": -25.906641006469727, "global_step": 298543, "epoch": 3596} {"train_loss": -25.779327392578125, "global_step": 298544, "epoch": 3596} {"train_loss": -26.071186065673828, "global_step": 298545, "epoch": 3596} {"train_loss": -25.533702850341797, "global_step": 298546, "epoch": 3596} {"train_loss": -25.47786521911621, "global_step": 298547, "epoch": 3596} {"train_loss": -25.672590255737305, "global_step": 298548, "epoch": 3596} {"train_loss": -25.588491439819336, "global_step": 298549, "epoch": 3596} {"train_loss": -25.622643114572547, "global_step": 298550, "epoch": 3596, "val_loss": 7280945.5} {"train_loss": -23.50895881652832, "global_step": 298551, "epoch": 3597} {"train_loss": -22.71506118774414, "global_step": 298552, "epoch": 3597} {"train_loss": -23.98892593383789, "global_step": 298553, "epoch": 3597} {"train_loss": -24.830276489257812, "global_step": 298554, "epoch": 3597} {"train_loss": -23.663373947143555, "global_step": 298555, "epoch": 3597} {"train_loss": -24.8034725189209, "global_step": 298556, "epoch": 3597} {"train_loss": -24.537431716918945, "global_step": 298557, "epoch": 3597} {"train_loss": -24.78644371032715, "global_step": 298558, "epoch": 3597} {"train_loss": -24.67096519470215, "global_step": 298559, "epoch": 3597} {"train_loss": -24.864084243774414, "global_step": 298560, "epoch": 3597} {"train_loss": -24.770801544189453, "global_step": 298561, "epoch": 3597} {"train_loss": -24.748077392578125, "global_step": 298562, "epoch": 3597} {"train_loss": -25.031890869140625, "global_step": 298563, "epoch": 3597} {"train_loss": -24.79766082763672, "global_step": 298564, "epoch": 3597} {"train_loss": -25.093631744384766, "global_step": 298565, "epoch": 3597} {"train_loss": -25.21527671813965, "global_step": 298566, "epoch": 3597} {"train_loss": -25.103055953979492, "global_step": 298567, "epoch": 3597} {"train_loss": -25.030887603759766, "global_step": 298568, "epoch": 3597} {"train_loss": -25.066495895385742, "global_step": 298569, "epoch": 3597} {"train_loss": -25.059297561645508, "global_step": 298570, "epoch": 3597} {"train_loss": -25.230289459228516, "global_step": 298571, "epoch": 3597} {"train_loss": -25.303129196166992, "global_step": 298572, "epoch": 3597} {"train_loss": -25.407278060913086, "global_step": 298573, "epoch": 3597} {"train_loss": -24.937271118164062, "global_step": 298574, "epoch": 3597} {"train_loss": -25.53810691833496, "global_step": 298575, "epoch": 3597} {"train_loss": -25.497434616088867, "global_step": 298576, "epoch": 3597} {"train_loss": -25.172780990600586, "global_step": 298577, "epoch": 3597} {"train_loss": -25.169010162353516, "global_step": 298578, "epoch": 3597} {"train_loss": -25.664794921875, "global_step": 298579, "epoch": 3597} {"train_loss": -25.298908233642578, "global_step": 298580, "epoch": 3597} {"train_loss": -25.323022842407227, "global_step": 298581, "epoch": 3597} {"train_loss": -25.637571334838867, "global_step": 298582, "epoch": 3597} {"train_loss": -25.365718841552734, "global_step": 298583, "epoch": 3597} {"train_loss": -25.75265884399414, "global_step": 298584, "epoch": 3597} {"train_loss": -25.326868057250977, "global_step": 298585, "epoch": 3597} {"train_loss": -25.646331787109375, "global_step": 298586, "epoch": 3597} {"train_loss": -25.713403701782227, "global_step": 298587, "epoch": 3597} {"train_loss": -25.54869270324707, "global_step": 298588, "epoch": 3597} {"train_loss": -25.38242530822754, "global_step": 298589, "epoch": 3597} {"train_loss": -25.25739288330078, "global_step": 298590, "epoch": 3597} {"train_loss": -25.51411247253418, "global_step": 298591, "epoch": 3597} {"train_loss": -25.642837524414062, "global_step": 298592, "epoch": 3597} {"train_loss": -25.483631134033203, "global_step": 298593, "epoch": 3597} {"train_loss": -25.642786026000977, "global_step": 298594, "epoch": 3597} {"train_loss": -25.64801025390625, "global_step": 298595, "epoch": 3597} {"train_loss": -25.479598999023438, "global_step": 298596, "epoch": 3597} {"train_loss": -25.5567684173584, "global_step": 298597, "epoch": 3597} {"train_loss": -25.59173583984375, "global_step": 298598, "epoch": 3597} {"train_loss": -25.6206111907959, "global_step": 298599, "epoch": 3597} {"train_loss": -25.99354362487793, "global_step": 298600, "epoch": 3597} {"train_loss": -25.941869735717773, "global_step": 298601, "epoch": 3597} {"train_loss": -25.478694915771484, "global_step": 298602, "epoch": 3597} {"train_loss": -25.82048988342285, "global_step": 298603, "epoch": 3597} {"train_loss": -25.91775894165039, "global_step": 298604, "epoch": 3597} {"train_loss": -25.601593017578125, "global_step": 298605, "epoch": 3597} {"train_loss": -26.242034912109375, "global_step": 298606, "epoch": 3597} {"train_loss": -25.769453048706055, "global_step": 298607, "epoch": 3597} {"train_loss": -26.136962890625, "global_step": 298608, "epoch": 3597} {"train_loss": -25.65419578552246, "global_step": 298609, "epoch": 3597} {"train_loss": -25.836414337158203, "global_step": 298610, "epoch": 3597} {"train_loss": -25.113874435424805, "global_step": 298611, "epoch": 3597} {"train_loss": -25.369186401367188, "global_step": 298612, "epoch": 3597} {"train_loss": -25.11134147644043, "global_step": 298613, "epoch": 3597} {"train_loss": -25.5881404876709, "global_step": 298614, "epoch": 3597} {"train_loss": -26.31171226501465, "global_step": 298615, "epoch": 3597} {"train_loss": -25.79425621032715, "global_step": 298616, "epoch": 3597} {"train_loss": -25.603107452392578, "global_step": 298617, "epoch": 3597} {"train_loss": -25.686813354492188, "global_step": 298618, "epoch": 3597} {"train_loss": -25.345239639282227, "global_step": 298619, "epoch": 3597} {"train_loss": -25.686010360717773, "global_step": 298620, "epoch": 3597} {"train_loss": -25.271757125854492, "global_step": 298621, "epoch": 3597} {"train_loss": -25.527259826660156, "global_step": 298622, "epoch": 3597} {"train_loss": -26.0069522857666, "global_step": 298623, "epoch": 3597} {"train_loss": -25.594085693359375, "global_step": 298624, "epoch": 3597} {"train_loss": -25.51767349243164, "global_step": 298625, "epoch": 3597} {"train_loss": -26.12737464904785, "global_step": 298626, "epoch": 3597} {"train_loss": -25.55438232421875, "global_step": 298627, "epoch": 3597} {"train_loss": -25.530057907104492, "global_step": 298628, "epoch": 3597} {"train_loss": -25.412357330322266, "global_step": 298629, "epoch": 3597} {"train_loss": -26.08582878112793, "global_step": 298630, "epoch": 3597} {"train_loss": -25.54178810119629, "global_step": 298631, "epoch": 3597} {"train_loss": -25.8369197845459, "global_step": 298632, "epoch": 3597} {"train_loss": -25.366004461265472, "global_step": 298633, "epoch": 3597, "val_loss": 7224127.5} {"train_loss": -25.041748046875, "global_step": 298634, "epoch": 3598} {"train_loss": -25.21146583557129, "global_step": 298635, "epoch": 3598} {"train_loss": -25.00700569152832, "global_step": 298636, "epoch": 3598} {"train_loss": -25.71270751953125, "global_step": 298637, "epoch": 3598} {"train_loss": -25.7575626373291, "global_step": 298638, "epoch": 3598} {"train_loss": -25.29638671875, "global_step": 298639, "epoch": 3598} {"train_loss": -25.480268478393555, "global_step": 298640, "epoch": 3598} {"train_loss": -25.13357925415039, "global_step": 298641, "epoch": 3598} {"train_loss": -25.06874656677246, "global_step": 298642, "epoch": 3598} {"train_loss": -25.623767852783203, "global_step": 298643, "epoch": 3598} {"train_loss": -25.37225914001465, "global_step": 298644, "epoch": 3598} {"train_loss": -25.611722946166992, "global_step": 298645, "epoch": 3598} {"train_loss": -25.358442306518555, "global_step": 298646, "epoch": 3598} {"train_loss": -25.391372680664062, "global_step": 298647, "epoch": 3598} {"train_loss": -25.624608993530273, "global_step": 298648, "epoch": 3598} {"train_loss": -25.728925704956055, "global_step": 298649, "epoch": 3598} {"train_loss": -25.28009033203125, "global_step": 298650, "epoch": 3598} {"train_loss": -25.520933151245117, "global_step": 298651, "epoch": 3598} {"train_loss": -25.9821720123291, "global_step": 298652, "epoch": 3598} {"train_loss": -25.690845489501953, "global_step": 298653, "epoch": 3598} {"train_loss": -25.5463809967041, "global_step": 298654, "epoch": 3598} {"train_loss": -25.709753036499023, "global_step": 298655, "epoch": 3598} {"train_loss": -25.65824317932129, "global_step": 298656, "epoch": 3598} {"train_loss": -25.619993209838867, "global_step": 298657, "epoch": 3598} {"train_loss": -25.9090633392334, "global_step": 298658, "epoch": 3598} {"train_loss": -25.832868576049805, "global_step": 298659, "epoch": 3598} {"train_loss": -25.750951766967773, "global_step": 298660, "epoch": 3598} {"train_loss": -25.448850631713867, "global_step": 298661, "epoch": 3598} {"train_loss": -25.3168888092041, "global_step": 298662, "epoch": 3598} {"train_loss": -25.54293441772461, "global_step": 298663, "epoch": 3598} {"train_loss": -25.822011947631836, "global_step": 298664, "epoch": 3598} {"train_loss": -25.38405418395996, "global_step": 298665, "epoch": 3598} {"train_loss": -25.5759334564209, "global_step": 298666, "epoch": 3598} {"train_loss": -25.90093421936035, "global_step": 298667, "epoch": 3598} {"train_loss": -25.749069213867188, "global_step": 298668, "epoch": 3598} {"train_loss": -25.713266372680664, "global_step": 298669, "epoch": 3598} {"train_loss": -25.752944946289062, "global_step": 298670, "epoch": 3598} {"train_loss": -25.473712921142578, "global_step": 298671, "epoch": 3598} {"train_loss": -25.699670791625977, "global_step": 298672, "epoch": 3598} {"train_loss": -25.281288146972656, "global_step": 298673, "epoch": 3598} {"train_loss": -25.534276962280273, "global_step": 298674, "epoch": 3598} {"train_loss": -25.348791122436523, "global_step": 298675, "epoch": 3598} {"train_loss": -25.753192901611328, "global_step": 298676, "epoch": 3598} {"train_loss": -25.54430389404297, "global_step": 298677, "epoch": 3598} {"train_loss": -25.494190216064453, "global_step": 298678, "epoch": 3598} {"train_loss": -25.424345016479492, "global_step": 298679, "epoch": 3598} {"train_loss": -25.492591857910156, "global_step": 298680, "epoch": 3598} {"train_loss": -25.51276206970215, "global_step": 298681, "epoch": 3598} {"train_loss": -25.490278244018555, "global_step": 298682, "epoch": 3598} {"train_loss": -25.848041534423828, "global_step": 298683, "epoch": 3598} {"train_loss": -25.701892852783203, "global_step": 298684, "epoch": 3598} {"train_loss": -25.48613929748535, "global_step": 298685, "epoch": 3598} {"train_loss": -25.74942398071289, "global_step": 298686, "epoch": 3598} {"train_loss": -25.738805770874023, "global_step": 298687, "epoch": 3598} {"train_loss": -25.705978393554688, "global_step": 298688, "epoch": 3598} {"train_loss": -25.343290328979492, "global_step": 298689, "epoch": 3598} {"train_loss": -25.735177993774414, "global_step": 298690, "epoch": 3598} {"train_loss": -25.68988609313965, "global_step": 298691, "epoch": 3598} {"train_loss": -25.294931411743164, "global_step": 298692, "epoch": 3598} {"train_loss": -25.234134674072266, "global_step": 298693, "epoch": 3598} {"train_loss": -25.706485748291016, "global_step": 298694, "epoch": 3598} {"train_loss": -25.247888565063477, "global_step": 298695, "epoch": 3598} {"train_loss": -25.461759567260742, "global_step": 298696, "epoch": 3598} {"train_loss": -25.438350677490234, "global_step": 298697, "epoch": 3598} {"train_loss": -25.346315383911133, "global_step": 298698, "epoch": 3598} {"train_loss": -25.725576400756836, "global_step": 298699, "epoch": 3598} {"train_loss": -25.324478149414062, "global_step": 298700, "epoch": 3598} {"train_loss": -26.114831924438477, "global_step": 298701, "epoch": 3598} {"train_loss": -25.333433151245117, "global_step": 298702, "epoch": 3598} {"train_loss": -25.497426986694336, "global_step": 298703, "epoch": 3598} {"train_loss": -25.766864776611328, "global_step": 298704, "epoch": 3598} {"train_loss": -25.650909423828125, "global_step": 298705, "epoch": 3598} {"train_loss": -25.75252342224121, "global_step": 298706, "epoch": 3598} {"train_loss": -25.740924835205078, "global_step": 298707, "epoch": 3598} {"train_loss": -25.394407272338867, "global_step": 298708, "epoch": 3598} {"train_loss": -25.11093521118164, "global_step": 298709, "epoch": 3598} {"train_loss": -25.299169540405273, "global_step": 298710, "epoch": 3598} {"train_loss": -25.547897338867188, "global_step": 298711, "epoch": 3598} {"train_loss": -25.909320831298828, "global_step": 298712, "epoch": 3598} {"train_loss": -25.46017074584961, "global_step": 298713, "epoch": 3598} {"train_loss": -25.740497589111328, "global_step": 298714, "epoch": 3598} {"train_loss": -25.0560359954834, "global_step": 298715, "epoch": 3598} {"train_loss": -25.523165484508837, "global_step": 298716, "epoch": 3598, "val_loss": 7193384.0} {"train_loss": -25.311599731445312, "global_step": 298717, "epoch": 3599} {"train_loss": -24.984508514404297, "global_step": 298718, "epoch": 3599} {"train_loss": -25.225500106811523, "global_step": 298719, "epoch": 3599} {"train_loss": -24.67893409729004, "global_step": 298720, "epoch": 3599} {"train_loss": -25.23670768737793, "global_step": 298721, "epoch": 3599} {"train_loss": -25.12223243713379, "global_step": 298722, "epoch": 3599} {"train_loss": -24.995840072631836, "global_step": 298723, "epoch": 3599} {"train_loss": -24.914236068725586, "global_step": 298724, "epoch": 3599} {"train_loss": -24.89964485168457, "global_step": 298725, "epoch": 3599} {"train_loss": -25.071659088134766, "global_step": 298726, "epoch": 3599} {"train_loss": -25.278226852416992, "global_step": 298727, "epoch": 3599} {"train_loss": -25.052810668945312, "global_step": 298728, "epoch": 3599} {"train_loss": -25.47804069519043, "global_step": 298729, "epoch": 3599} {"train_loss": -24.97647476196289, "global_step": 298730, "epoch": 3599} {"train_loss": -25.32187843322754, "global_step": 298731, "epoch": 3599} {"train_loss": -25.44266128540039, "global_step": 298732, "epoch": 3599} {"train_loss": -25.29085922241211, "global_step": 298733, "epoch": 3599} {"train_loss": -25.631427764892578, "global_step": 298734, "epoch": 3599} {"train_loss": -25.56523895263672, "global_step": 298735, "epoch": 3599} {"train_loss": -25.771148681640625, "global_step": 298736, "epoch": 3599} {"train_loss": -25.27716064453125, "global_step": 298737, "epoch": 3599} {"train_loss": -25.58045768737793, "global_step": 298738, "epoch": 3599} {"train_loss": -25.281024932861328, "global_step": 298739, "epoch": 3599} {"train_loss": -25.55159568786621, "global_step": 298740, "epoch": 3599} {"train_loss": -25.7839412689209, "global_step": 298741, "epoch": 3599} {"train_loss": -25.490299224853516, "global_step": 298742, "epoch": 3599} {"train_loss": -25.215789794921875, "global_step": 298743, "epoch": 3599} {"train_loss": -25.588712692260742, "global_step": 298744, "epoch": 3599} {"train_loss": -25.526527404785156, "global_step": 298745, "epoch": 3599} {"train_loss": -25.44500160217285, "global_step": 298746, "epoch": 3599} {"train_loss": -25.586288452148438, "global_step": 298747, "epoch": 3599} {"train_loss": -25.848236083984375, "global_step": 298748, "epoch": 3599} {"train_loss": -25.693134307861328, "global_step": 298749, "epoch": 3599} {"train_loss": -25.703250885009766, "global_step": 298750, "epoch": 3599} {"train_loss": -25.828840255737305, "global_step": 298751, "epoch": 3599} {"train_loss": -25.525583267211914, "global_step": 298752, "epoch": 3599} {"train_loss": -26.1479434967041, "global_step": 298753, "epoch": 3599} {"train_loss": -25.6047420501709, "global_step": 298754, "epoch": 3599} {"train_loss": -25.724353790283203, "global_step": 298755, "epoch": 3599} {"train_loss": -25.213340759277344, "global_step": 298756, "epoch": 3599} {"train_loss": -25.81903648376465, "global_step": 298757, "epoch": 3599} {"train_loss": -25.640527725219727, "global_step": 298758, "epoch": 3599} {"train_loss": -25.582937240600586, "global_step": 298759, "epoch": 3599} {"train_loss": -25.47739028930664, "global_step": 298760, "epoch": 3599} {"train_loss": -25.556039810180664, "global_step": 298761, "epoch": 3599} {"train_loss": -25.93182373046875, "global_step": 298762, "epoch": 3599} {"train_loss": -25.479032516479492, "global_step": 298763, "epoch": 3599} {"train_loss": -25.122983932495117, "global_step": 298764, "epoch": 3599} {"train_loss": -24.356523513793945, "global_step": 298765, "epoch": 3599} {"train_loss": -25.253662109375, "global_step": 298766, "epoch": 3599} {"train_loss": -25.259984970092773, "global_step": 298767, "epoch": 3599} {"train_loss": -25.343841552734375, "global_step": 298768, "epoch": 3599} {"train_loss": -25.74421501159668, "global_step": 298769, "epoch": 3599} {"train_loss": -25.390018463134766, "global_step": 298770, "epoch": 3599} {"train_loss": -25.425395965576172, "global_step": 298771, "epoch": 3599} {"train_loss": -25.28729820251465, "global_step": 298772, "epoch": 3599} {"train_loss": -25.464981079101562, "global_step": 298773, "epoch": 3599} {"train_loss": -25.389860153198242, "global_step": 298774, "epoch": 3599} {"train_loss": -25.7897891998291, "global_step": 298775, "epoch": 3599} {"train_loss": -25.622150421142578, "global_step": 298776, "epoch": 3599} {"train_loss": -25.377399444580078, "global_step": 298777, "epoch": 3599} {"train_loss": -25.30217933654785, "global_step": 298778, "epoch": 3599} {"train_loss": -25.79689598083496, "global_step": 298779, "epoch": 3599} {"train_loss": -25.866668701171875, "global_step": 298780, "epoch": 3599} {"train_loss": -25.495994567871094, "global_step": 298781, "epoch": 3599} {"train_loss": -25.425596237182617, "global_step": 298782, "epoch": 3599} {"train_loss": -25.39459228515625, "global_step": 298783, "epoch": 3599} {"train_loss": -25.42414665222168, "global_step": 298784, "epoch": 3599} {"train_loss": -25.38691520690918, "global_step": 298785, "epoch": 3599} {"train_loss": -25.705738067626953, "global_step": 298786, "epoch": 3599} {"train_loss": -25.644134521484375, "global_step": 298787, "epoch": 3599} {"train_loss": -25.299163818359375, "global_step": 298788, "epoch": 3599} {"train_loss": -25.441715240478516, "global_step": 298789, "epoch": 3599} {"train_loss": -25.631805419921875, "global_step": 298790, "epoch": 3599} {"train_loss": -25.97992515563965, "global_step": 298791, "epoch": 3599} {"train_loss": -25.718414306640625, "global_step": 298792, "epoch": 3599} {"train_loss": -25.782978057861328, "global_step": 298793, "epoch": 3599} {"train_loss": -25.9716854095459, "global_step": 298794, "epoch": 3599} {"train_loss": -26.24945068359375, "global_step": 298795, "epoch": 3599} {"train_loss": -25.817584991455078, "global_step": 298796, "epoch": 3599} {"train_loss": -25.7016658782959, "global_step": 298797, "epoch": 3599} {"train_loss": -25.945188522338867, "global_step": 298798, "epoch": 3599} {"train_loss": -25.474713727652308, "global_step": 298799, "epoch": 3599, "val_loss": 7165002.0} {"train_loss": -25.114402770996094, "global_step": 298800, "epoch": 3600} {"train_loss": -25.16816520690918, "global_step": 298801, "epoch": 3600} {"train_loss": -25.09384536743164, "global_step": 298802, "epoch": 3600} {"train_loss": -24.92544174194336, "global_step": 298803, "epoch": 3600} {"train_loss": -25.351974487304688, "global_step": 298804, "epoch": 3600} {"train_loss": -25.27854347229004, "global_step": 298805, "epoch": 3600} {"train_loss": -25.37862205505371, "global_step": 298806, "epoch": 3600} {"train_loss": -25.075300216674805, "global_step": 298807, "epoch": 3600} {"train_loss": -25.148910522460938, "global_step": 298808, "epoch": 3600} {"train_loss": -25.4339656829834, "global_step": 298809, "epoch": 3600} {"train_loss": -25.448461532592773, "global_step": 298810, "epoch": 3600} {"train_loss": -25.16925621032715, "global_step": 298811, "epoch": 3600} {"train_loss": -25.387107849121094, "global_step": 298812, "epoch": 3600} {"train_loss": -25.226913452148438, "global_step": 298813, "epoch": 3600} {"train_loss": -25.445585250854492, "global_step": 298814, "epoch": 3600} {"train_loss": -25.1395263671875, "global_step": 298815, "epoch": 3600} {"train_loss": -25.038118362426758, "global_step": 298816, "epoch": 3600} {"train_loss": -25.614734649658203, "global_step": 298817, "epoch": 3600} {"train_loss": -25.433826446533203, "global_step": 298818, "epoch": 3600} {"train_loss": -25.472272872924805, "global_step": 298819, "epoch": 3600} {"train_loss": -25.37335777282715, "global_step": 298820, "epoch": 3600} {"train_loss": -25.466527938842773, "global_step": 298821, "epoch": 3600} {"train_loss": -25.263076782226562, "global_step": 298822, "epoch": 3600} {"train_loss": -25.155445098876953, "global_step": 298823, "epoch": 3600} {"train_loss": -25.276803970336914, "global_step": 298824, "epoch": 3600} {"train_loss": -25.51357078552246, "global_step": 298825, "epoch": 3600} {"train_loss": -25.427011489868164, "global_step": 298826, "epoch": 3600} {"train_loss": -25.639347076416016, "global_step": 298827, "epoch": 3600} {"train_loss": -25.40814781188965, "global_step": 298828, "epoch": 3600} {"train_loss": -25.2836856842041, "global_step": 298829, "epoch": 3600} {"train_loss": -25.7435245513916, "global_step": 298830, "epoch": 3600} {"train_loss": -25.67352294921875, "global_step": 298831, "epoch": 3600} {"train_loss": -25.92412757873535, "global_step": 298832, "epoch": 3600} {"train_loss": -25.56979751586914, "global_step": 298833, "epoch": 3600} {"train_loss": -25.328418731689453, "global_step": 298834, "epoch": 3600} {"train_loss": -25.511098861694336, "global_step": 298835, "epoch": 3600} {"train_loss": -25.719221115112305, "global_step": 298836, "epoch": 3600} {"train_loss": -25.492664337158203, "global_step": 298837, "epoch": 3600} {"train_loss": -25.41619300842285, "global_step": 298838, "epoch": 3600} {"train_loss": -25.455480575561523, "global_step": 298839, "epoch": 3600} {"train_loss": -25.933996200561523, "global_step": 298840, "epoch": 3600} {"train_loss": -25.739837646484375, "global_step": 298841, "epoch": 3600} {"train_loss": -25.73248863220215, "global_step": 298842, "epoch": 3600} {"train_loss": -25.695825576782227, "global_step": 298843, "epoch": 3600} {"train_loss": -25.062143325805664, "global_step": 298844, "epoch": 3600} {"train_loss": -25.210098266601562, "global_step": 298845, "epoch": 3600} {"train_loss": -25.75422477722168, "global_step": 298846, "epoch": 3600} {"train_loss": -25.13236427307129, "global_step": 298847, "epoch": 3600} {"train_loss": -25.3512020111084, "global_step": 298848, "epoch": 3600} {"train_loss": -25.94635009765625, "global_step": 298849, "epoch": 3600} {"train_loss": -25.735885620117188, "global_step": 298850, "epoch": 3600} {"train_loss": -25.442859649658203, "global_step": 298851, "epoch": 3600} {"train_loss": -25.77084732055664, "global_step": 298852, "epoch": 3600} {"train_loss": -25.864606857299805, "global_step": 298853, "epoch": 3600} {"train_loss": -25.6358699798584, "global_step": 298854, "epoch": 3600} {"train_loss": -25.780624389648438, "global_step": 298855, "epoch": 3600} {"train_loss": -25.397422790527344, "global_step": 298856, "epoch": 3600} {"train_loss": -25.702014923095703, "global_step": 298857, "epoch": 3600} {"train_loss": -25.655317306518555, "global_step": 298858, "epoch": 3600} {"train_loss": -25.25728416442871, "global_step": 298859, "epoch": 3600} {"train_loss": -25.865209579467773, "global_step": 298860, "epoch": 3600} {"train_loss": -25.589696884155273, "global_step": 298861, "epoch": 3600} {"train_loss": -25.833972930908203, "global_step": 298862, "epoch": 3600} {"train_loss": -25.460832595825195, "global_step": 298863, "epoch": 3600} {"train_loss": -25.698511123657227, "global_step": 298864, "epoch": 3600} {"train_loss": -25.309833526611328, "global_step": 298865, "epoch": 3600} {"train_loss": -25.775619506835938, "global_step": 298866, "epoch": 3600} {"train_loss": -25.56509780883789, "global_step": 298867, "epoch": 3600} {"train_loss": -25.428680419921875, "global_step": 298868, "epoch": 3600} {"train_loss": -25.75623893737793, "global_step": 298869, "epoch": 3600} {"train_loss": -25.880741119384766, "global_step": 298870, "epoch": 3600} {"train_loss": -25.809009552001953, "global_step": 298871, "epoch": 3600} {"train_loss": -25.569961547851562, "global_step": 298872, "epoch": 3600} {"train_loss": -25.493545532226562, "global_step": 298873, "epoch": 3600} {"train_loss": -25.729373931884766, "global_step": 298874, "epoch": 3600} {"train_loss": -25.695459365844727, "global_step": 298875, "epoch": 3600} {"train_loss": -25.887210845947266, "global_step": 298876, "epoch": 3600} {"train_loss": -25.499393463134766, "global_step": 298877, "epoch": 3600} {"train_loss": -25.88797950744629, "global_step": 298878, "epoch": 3600} {"train_loss": -25.543485641479492, "global_step": 298879, "epoch": 3600} {"train_loss": -25.829599380493164, "global_step": 298880, "epoch": 3600} {"train_loss": -25.64352798461914, "global_step": 298881, "epoch": 3600} {"train_loss": -25.49414653088673, "global_step": 298882, "epoch": 3600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 7351678.0} {"train_loss": -25.09711265563965, "global_step": 298883, "epoch": 3601} {"train_loss": -24.96320915222168, "global_step": 298884, "epoch": 3601} {"train_loss": -25.320819854736328, "global_step": 298885, "epoch": 3601} {"train_loss": -25.070859909057617, "global_step": 298886, "epoch": 3601} {"train_loss": -25.275487899780273, "global_step": 298887, "epoch": 3601} {"train_loss": -25.189498901367188, "global_step": 298888, "epoch": 3601} {"train_loss": -25.611303329467773, "global_step": 298889, "epoch": 3601} {"train_loss": -25.354633331298828, "global_step": 298890, "epoch": 3601} {"train_loss": -25.113174438476562, "global_step": 298891, "epoch": 3601} {"train_loss": -25.4379825592041, "global_step": 298892, "epoch": 3601} {"train_loss": -25.296226501464844, "global_step": 298893, "epoch": 3601} {"train_loss": -25.691320419311523, "global_step": 298894, "epoch": 3601} {"train_loss": -25.749832153320312, "global_step": 298895, "epoch": 3601} {"train_loss": -25.220659255981445, "global_step": 298896, "epoch": 3601} {"train_loss": -25.8858699798584, "global_step": 298897, "epoch": 3601} {"train_loss": -25.194875717163086, "global_step": 298898, "epoch": 3601} {"train_loss": -25.742399215698242, "global_step": 298899, "epoch": 3601} {"train_loss": -25.280149459838867, "global_step": 298900, "epoch": 3601} {"train_loss": -25.346471786499023, "global_step": 298901, "epoch": 3601} {"train_loss": -25.67715835571289, "global_step": 298902, "epoch": 3601} {"train_loss": -25.65264892578125, "global_step": 298903, "epoch": 3601} {"train_loss": -25.232873916625977, "global_step": 298904, "epoch": 3601} {"train_loss": -25.218360900878906, "global_step": 298905, "epoch": 3601} {"train_loss": -25.600513458251953, "global_step": 298906, "epoch": 3601} {"train_loss": -25.511930465698242, "global_step": 298907, "epoch": 3601} {"train_loss": -25.238489151000977, "global_step": 298908, "epoch": 3601} {"train_loss": -25.484514236450195, "global_step": 298909, "epoch": 3601} {"train_loss": -25.523807525634766, "global_step": 298910, "epoch": 3601} {"train_loss": -25.263748168945312, "global_step": 298911, "epoch": 3601} {"train_loss": -25.503286361694336, "global_step": 298912, "epoch": 3601} {"train_loss": -25.270654678344727, "global_step": 298913, "epoch": 3601} {"train_loss": -25.281850814819336, "global_step": 298914, "epoch": 3601} {"train_loss": -25.267412185668945, "global_step": 298915, "epoch": 3601} {"train_loss": -25.734283447265625, "global_step": 298916, "epoch": 3601} {"train_loss": -25.477231979370117, "global_step": 298917, "epoch": 3601} {"train_loss": -25.953601837158203, "global_step": 298918, "epoch": 3601} {"train_loss": -25.617095947265625, "global_step": 298919, "epoch": 3601} {"train_loss": -25.49312400817871, "global_step": 298920, "epoch": 3601} {"train_loss": -25.782001495361328, "global_step": 298921, "epoch": 3601} {"train_loss": -25.652515411376953, "global_step": 298922, "epoch": 3601} {"train_loss": -25.472553253173828, "global_step": 298923, "epoch": 3601} {"train_loss": -25.844167709350586, "global_step": 298924, "epoch": 3601} {"train_loss": -25.551654815673828, "global_step": 298925, "epoch": 3601} {"train_loss": -25.532978057861328, "global_step": 298926, "epoch": 3601} {"train_loss": -25.690732955932617, "global_step": 298927, "epoch": 3601} {"train_loss": -25.8393611907959, "global_step": 298928, "epoch": 3601} {"train_loss": -25.65395164489746, "global_step": 298929, "epoch": 3601} {"train_loss": -25.92945671081543, "global_step": 298930, "epoch": 3601} {"train_loss": -26.278806686401367, "global_step": 298931, "epoch": 3601} {"train_loss": -25.78510093688965, "global_step": 298932, "epoch": 3601} {"train_loss": -25.45840835571289, "global_step": 298933, "epoch": 3601} {"train_loss": -25.729419708251953, "global_step": 298934, "epoch": 3601} {"train_loss": -25.927194595336914, "global_step": 298935, "epoch": 3601} {"train_loss": -25.893896102905273, "global_step": 298936, "epoch": 3601} {"train_loss": -25.946945190429688, "global_step": 298937, "epoch": 3601} {"train_loss": -25.597707748413086, "global_step": 298938, "epoch": 3601} {"train_loss": -25.773630142211914, "global_step": 298939, "epoch": 3601} {"train_loss": -25.94745445251465, "global_step": 298940, "epoch": 3601} {"train_loss": -25.247215270996094, "global_step": 298941, "epoch": 3601} {"train_loss": -25.6028995513916, "global_step": 298942, "epoch": 3601} {"train_loss": -25.386585235595703, "global_step": 298943, "epoch": 3601} {"train_loss": -25.7259578704834, "global_step": 298944, "epoch": 3601} {"train_loss": -25.3586368560791, "global_step": 298945, "epoch": 3601} {"train_loss": -25.506134033203125, "global_step": 298946, "epoch": 3601} {"train_loss": -25.94426918029785, "global_step": 298947, "epoch": 3601} {"train_loss": -25.401330947875977, "global_step": 298948, "epoch": 3601} {"train_loss": -25.55831527709961, "global_step": 298949, "epoch": 3601} {"train_loss": -25.811370849609375, "global_step": 298950, "epoch": 3601} {"train_loss": -25.90452003479004, "global_step": 298951, "epoch": 3601} {"train_loss": -25.964990615844727, "global_step": 298952, "epoch": 3601} {"train_loss": -25.812353134155273, "global_step": 298953, "epoch": 3601} {"train_loss": -26.15576171875, "global_step": 298954, "epoch": 3601} {"train_loss": -25.611459732055664, "global_step": 298955, "epoch": 3601} {"train_loss": -25.956289291381836, "global_step": 298956, "epoch": 3601} {"train_loss": -25.704227447509766, "global_step": 298957, "epoch": 3601} {"train_loss": -25.769628524780273, "global_step": 298958, "epoch": 3601} {"train_loss": -25.751501083374023, "global_step": 298959, "epoch": 3601} {"train_loss": -25.888599395751953, "global_step": 298960, "epoch": 3601} {"train_loss": -25.825708389282227, "global_step": 298961, "epoch": 3601} {"train_loss": -25.038002014160156, "global_step": 298962, "epoch": 3601} {"train_loss": -24.71437644958496, "global_step": 298963, "epoch": 3601} {"train_loss": -24.868017196655273, "global_step": 298964, "epoch": 3601} {"train_loss": -25.545650068535863, "global_step": 298965, "epoch": 3601, "val_loss": 7196545.5} {"train_loss": -25.247949600219727, "global_step": 298966, "epoch": 3602} {"train_loss": -24.355417251586914, "global_step": 298967, "epoch": 3602} {"train_loss": -23.661487579345703, "global_step": 298968, "epoch": 3602} {"train_loss": -24.46734046936035, "global_step": 298969, "epoch": 3602} {"train_loss": -24.128332138061523, "global_step": 298970, "epoch": 3602} {"train_loss": -24.39883041381836, "global_step": 298971, "epoch": 3602} {"train_loss": -24.95955467224121, "global_step": 298972, "epoch": 3602} {"train_loss": -25.044347763061523, "global_step": 298973, "epoch": 3602} {"train_loss": -24.873519897460938, "global_step": 298974, "epoch": 3602} {"train_loss": -25.06549072265625, "global_step": 298975, "epoch": 3602} {"train_loss": -24.951215744018555, "global_step": 298976, "epoch": 3602} {"train_loss": -25.29183006286621, "global_step": 298977, "epoch": 3602} {"train_loss": -24.93089485168457, "global_step": 298978, "epoch": 3602} {"train_loss": -25.189559936523438, "global_step": 298979, "epoch": 3602} {"train_loss": -25.287487030029297, "global_step": 298980, "epoch": 3602} {"train_loss": -25.003948211669922, "global_step": 298981, "epoch": 3602} {"train_loss": -24.88595199584961, "global_step": 298982, "epoch": 3602} {"train_loss": -25.138032913208008, "global_step": 298983, "epoch": 3602} {"train_loss": -25.23060417175293, "global_step": 298984, "epoch": 3602} {"train_loss": -25.227828979492188, "global_step": 298985, "epoch": 3602} {"train_loss": -25.278194427490234, "global_step": 298986, "epoch": 3602} {"train_loss": -25.227825164794922, "global_step": 298987, "epoch": 3602} {"train_loss": -25.284133911132812, "global_step": 298988, "epoch": 3602} {"train_loss": -25.545509338378906, "global_step": 298989, "epoch": 3602} {"train_loss": -24.771636962890625, "global_step": 298990, "epoch": 3602} {"train_loss": -25.447179794311523, "global_step": 298991, "epoch": 3602} {"train_loss": -25.34661293029785, "global_step": 298992, "epoch": 3602} {"train_loss": -25.619970321655273, "global_step": 298993, "epoch": 3602} {"train_loss": -25.158506393432617, "global_step": 298994, "epoch": 3602} {"train_loss": -25.477712631225586, "global_step": 298995, "epoch": 3602} {"train_loss": -25.480365753173828, "global_step": 298996, "epoch": 3602} {"train_loss": -25.566999435424805, "global_step": 298997, "epoch": 3602} {"train_loss": -25.439626693725586, "global_step": 298998, "epoch": 3602} {"train_loss": -25.964887619018555, "global_step": 298999, "epoch": 3602} {"train_loss": -25.968870162963867, "global_step": 299000, "epoch": 3602} {"train_loss": -25.4384765625, "global_step": 299001, "epoch": 3602} {"train_loss": -25.618494033813477, "global_step": 299002, "epoch": 3602} {"train_loss": -25.641889572143555, "global_step": 299003, "epoch": 3602} {"train_loss": -25.533313751220703, "global_step": 299004, "epoch": 3602} {"train_loss": -25.656347274780273, "global_step": 299005, "epoch": 3602} {"train_loss": -25.540170669555664, "global_step": 299006, "epoch": 3602} {"train_loss": -25.51376724243164, "global_step": 299007, "epoch": 3602} {"train_loss": -25.72678565979004, "global_step": 299008, "epoch": 3602} {"train_loss": -25.797271728515625, "global_step": 299009, "epoch": 3602} {"train_loss": -25.479656219482422, "global_step": 299010, "epoch": 3602} {"train_loss": -25.49723243713379, "global_step": 299011, "epoch": 3602} {"train_loss": -25.65024185180664, "global_step": 299012, "epoch": 3602} {"train_loss": -25.944381713867188, "global_step": 299013, "epoch": 3602} {"train_loss": -25.848188400268555, "global_step": 299014, "epoch": 3602} {"train_loss": -25.65277671813965, "global_step": 299015, "epoch": 3602} {"train_loss": -25.71085548400879, "global_step": 299016, "epoch": 3602} {"train_loss": -26.23126220703125, "global_step": 299017, "epoch": 3602} {"train_loss": -25.75055503845215, "global_step": 299018, "epoch": 3602} {"train_loss": -25.82168960571289, "global_step": 299019, "epoch": 3602} {"train_loss": -25.701202392578125, "global_step": 299020, "epoch": 3602} {"train_loss": -25.839853286743164, "global_step": 299021, "epoch": 3602} {"train_loss": -25.543121337890625, "global_step": 299022, "epoch": 3602} {"train_loss": -25.908750534057617, "global_step": 299023, "epoch": 3602} {"train_loss": -25.611408233642578, "global_step": 299024, "epoch": 3602} {"train_loss": -25.444217681884766, "global_step": 299025, "epoch": 3602} {"train_loss": -25.683273315429688, "global_step": 299026, "epoch": 3602} {"train_loss": -25.533994674682617, "global_step": 299027, "epoch": 3602} {"train_loss": -26.01258659362793, "global_step": 299028, "epoch": 3602} {"train_loss": -25.682331085205078, "global_step": 299029, "epoch": 3602} {"train_loss": -25.959867477416992, "global_step": 299030, "epoch": 3602} {"train_loss": -26.007904052734375, "global_step": 299031, "epoch": 3602} {"train_loss": -26.10149574279785, "global_step": 299032, "epoch": 3602} {"train_loss": -25.42316246032715, "global_step": 299033, "epoch": 3602} {"train_loss": -25.572141647338867, "global_step": 299034, "epoch": 3602} {"train_loss": -25.977319717407227, "global_step": 299035, "epoch": 3602} {"train_loss": -25.671384811401367, "global_step": 299036, "epoch": 3602} {"train_loss": -25.6945743560791, "global_step": 299037, "epoch": 3602} {"train_loss": -25.6614933013916, "global_step": 299038, "epoch": 3602} {"train_loss": -25.550378799438477, "global_step": 299039, "epoch": 3602} {"train_loss": -25.741275787353516, "global_step": 299040, "epoch": 3602} {"train_loss": -26.037755966186523, "global_step": 299041, "epoch": 3602} {"train_loss": -25.572734832763672, "global_step": 299042, "epoch": 3602} {"train_loss": -26.0904483795166, "global_step": 299043, "epoch": 3602} {"train_loss": -25.404218673706055, "global_step": 299044, "epoch": 3602} {"train_loss": -25.038822174072266, "global_step": 299045, "epoch": 3602} {"train_loss": -25.496063232421875, "global_step": 299046, "epoch": 3602} {"train_loss": -25.602399826049805, "global_step": 299047, "epoch": 3602} {"train_loss": -25.430061133511096, "global_step": 299048, "epoch": 3602, "val_loss": 7205459.5} {"train_loss": -24.352508544921875, "global_step": 299049, "epoch": 3603} {"train_loss": -24.349552154541016, "global_step": 299050, "epoch": 3603} {"train_loss": -25.073627471923828, "global_step": 299051, "epoch": 3603} {"train_loss": -24.621076583862305, "global_step": 299052, "epoch": 3603} {"train_loss": -25.48980712890625, "global_step": 299053, "epoch": 3603} {"train_loss": -24.753591537475586, "global_step": 299054, "epoch": 3603} {"train_loss": -25.264217376708984, "global_step": 299055, "epoch": 3603} {"train_loss": -25.09965705871582, "global_step": 299056, "epoch": 3603} {"train_loss": -25.0124568939209, "global_step": 299057, "epoch": 3603} {"train_loss": -25.070030212402344, "global_step": 299058, "epoch": 3603} {"train_loss": -25.251480102539062, "global_step": 299059, "epoch": 3603} {"train_loss": -25.065006256103516, "global_step": 299060, "epoch": 3603} {"train_loss": -25.712329864501953, "global_step": 299061, "epoch": 3603} {"train_loss": -24.956464767456055, "global_step": 299062, "epoch": 3603} {"train_loss": -24.875812530517578, "global_step": 299063, "epoch": 3603} {"train_loss": -25.430044174194336, "global_step": 299064, "epoch": 3603} {"train_loss": -25.0376033782959, "global_step": 299065, "epoch": 3603} {"train_loss": -25.813196182250977, "global_step": 299066, "epoch": 3603} {"train_loss": -25.36931037902832, "global_step": 299067, "epoch": 3603} {"train_loss": -25.542617797851562, "global_step": 299068, "epoch": 3603} {"train_loss": -25.279983520507812, "global_step": 299069, "epoch": 3603} {"train_loss": -25.74079704284668, "global_step": 299070, "epoch": 3603} {"train_loss": -25.869428634643555, "global_step": 299071, "epoch": 3603} {"train_loss": -25.359813690185547, "global_step": 299072, "epoch": 3603} {"train_loss": -25.42335319519043, "global_step": 299073, "epoch": 3603} {"train_loss": -25.743085861206055, "global_step": 299074, "epoch": 3603} {"train_loss": -25.6639404296875, "global_step": 299075, "epoch": 3603} {"train_loss": -25.498685836791992, "global_step": 299076, "epoch": 3603} {"train_loss": -25.201345443725586, "global_step": 299077, "epoch": 3603} {"train_loss": -25.61672019958496, "global_step": 299078, "epoch": 3603} {"train_loss": -25.97454833984375, "global_step": 299079, "epoch": 3603} {"train_loss": -25.618921279907227, "global_step": 299080, "epoch": 3603} {"train_loss": -25.448820114135742, "global_step": 299081, "epoch": 3603} {"train_loss": -25.609546661376953, "global_step": 299082, "epoch": 3603} {"train_loss": -25.752527236938477, "global_step": 299083, "epoch": 3603} {"train_loss": -25.60658073425293, "global_step": 299084, "epoch": 3603} {"train_loss": -25.693384170532227, "global_step": 299085, "epoch": 3603} {"train_loss": -25.914596557617188, "global_step": 299086, "epoch": 3603} {"train_loss": -25.795654296875, "global_step": 299087, "epoch": 3603} {"train_loss": -25.584264755249023, "global_step": 299088, "epoch": 3603} {"train_loss": -25.536466598510742, "global_step": 299089, "epoch": 3603} {"train_loss": -26.001508712768555, "global_step": 299090, "epoch": 3603} {"train_loss": -25.97540855407715, "global_step": 299091, "epoch": 3603} {"train_loss": -25.6983642578125, "global_step": 299092, "epoch": 3603} {"train_loss": -25.979101181030273, "global_step": 299093, "epoch": 3603} {"train_loss": -25.929031372070312, "global_step": 299094, "epoch": 3603} {"train_loss": -26.098041534423828, "global_step": 299095, "epoch": 3603} {"train_loss": -25.831701278686523, "global_step": 299096, "epoch": 3603} {"train_loss": -25.779706954956055, "global_step": 299097, "epoch": 3603} {"train_loss": -25.50571060180664, "global_step": 299098, "epoch": 3603} {"train_loss": -25.7943115234375, "global_step": 299099, "epoch": 3603} {"train_loss": -25.7316951751709, "global_step": 299100, "epoch": 3603} {"train_loss": -25.738508224487305, "global_step": 299101, "epoch": 3603} {"train_loss": -25.439899444580078, "global_step": 299102, "epoch": 3603} {"train_loss": -25.119176864624023, "global_step": 299103, "epoch": 3603} {"train_loss": -25.339656829833984, "global_step": 299104, "epoch": 3603} {"train_loss": -25.383079528808594, "global_step": 299105, "epoch": 3603} {"train_loss": -25.03999900817871, "global_step": 299106, "epoch": 3603} {"train_loss": -25.040128707885742, "global_step": 299107, "epoch": 3603} {"train_loss": -24.859182357788086, "global_step": 299108, "epoch": 3603} {"train_loss": -25.067886352539062, "global_step": 299109, "epoch": 3603} {"train_loss": -25.42206382751465, "global_step": 299110, "epoch": 3603} {"train_loss": -25.21710777282715, "global_step": 299111, "epoch": 3603} {"train_loss": -25.841711044311523, "global_step": 299112, "epoch": 3603} {"train_loss": -25.45391273498535, "global_step": 299113, "epoch": 3603} {"train_loss": -25.439565658569336, "global_step": 299114, "epoch": 3603} {"train_loss": -25.4207820892334, "global_step": 299115, "epoch": 3603} {"train_loss": -25.62354850769043, "global_step": 299116, "epoch": 3603} {"train_loss": -25.2921142578125, "global_step": 299117, "epoch": 3603} {"train_loss": -25.779272079467773, "global_step": 299118, "epoch": 3603} {"train_loss": -25.433338165283203, "global_step": 299119, "epoch": 3603} {"train_loss": -25.521289825439453, "global_step": 299120, "epoch": 3603} {"train_loss": -25.886371612548828, "global_step": 299121, "epoch": 3603} {"train_loss": -25.7482967376709, "global_step": 299122, "epoch": 3603} {"train_loss": -25.5418643951416, "global_step": 299123, "epoch": 3603} {"train_loss": -25.52696990966797, "global_step": 299124, "epoch": 3603} {"train_loss": -25.682153701782227, "global_step": 299125, "epoch": 3603} {"train_loss": -25.36354637145996, "global_step": 299126, "epoch": 3603} {"train_loss": -25.701818466186523, "global_step": 299127, "epoch": 3603} {"train_loss": -25.58835220336914, "global_step": 299128, "epoch": 3603} {"train_loss": -25.91632080078125, "global_step": 299129, "epoch": 3603} {"train_loss": -25.679182052612305, "global_step": 299130, "epoch": 3603} {"train_loss": -25.46178498325578, "global_step": 299131, "epoch": 3603, "val_loss": 7131869.0} {"train_loss": -25.567594528198242, "global_step": 299132, "epoch": 3604} {"train_loss": -25.028066635131836, "global_step": 299133, "epoch": 3604} {"train_loss": -25.505918502807617, "global_step": 299134, "epoch": 3604} {"train_loss": -24.8637752532959, "global_step": 299135, "epoch": 3604} {"train_loss": -24.949003219604492, "global_step": 299136, "epoch": 3604} {"train_loss": -25.74457359313965, "global_step": 299137, "epoch": 3604} {"train_loss": -25.028560638427734, "global_step": 299138, "epoch": 3604} {"train_loss": -24.962812423706055, "global_step": 299139, "epoch": 3604} {"train_loss": -25.457189559936523, "global_step": 299140, "epoch": 3604} {"train_loss": -25.043928146362305, "global_step": 299141, "epoch": 3604} {"train_loss": -25.3165283203125, "global_step": 299142, "epoch": 3604} {"train_loss": -25.26265525817871, "global_step": 299143, "epoch": 3604} {"train_loss": -25.241273880004883, "global_step": 299144, "epoch": 3604} {"train_loss": -25.794204711914062, "global_step": 299145, "epoch": 3604} {"train_loss": -25.420839309692383, "global_step": 299146, "epoch": 3604} {"train_loss": -25.157459259033203, "global_step": 299147, "epoch": 3604} {"train_loss": -25.320066452026367, "global_step": 299148, "epoch": 3604} {"train_loss": -25.415298461914062, "global_step": 299149, "epoch": 3604} {"train_loss": -25.52542495727539, "global_step": 299150, "epoch": 3604} {"train_loss": -25.475046157836914, "global_step": 299151, "epoch": 3604} {"train_loss": -25.755475997924805, "global_step": 299152, "epoch": 3604} {"train_loss": -25.336368560791016, "global_step": 299153, "epoch": 3604} {"train_loss": -25.80615234375, "global_step": 299154, "epoch": 3604} {"train_loss": -25.660755157470703, "global_step": 299155, "epoch": 3604} {"train_loss": -25.73090171813965, "global_step": 299156, "epoch": 3604} {"train_loss": -25.581279754638672, "global_step": 299157, "epoch": 3604} {"train_loss": -25.431556701660156, "global_step": 299158, "epoch": 3604} {"train_loss": -25.88762855529785, "global_step": 299159, "epoch": 3604} {"train_loss": -25.940338134765625, "global_step": 299160, "epoch": 3604} {"train_loss": -25.65103530883789, "global_step": 299161, "epoch": 3604} {"train_loss": -25.44623565673828, "global_step": 299162, "epoch": 3604} {"train_loss": -25.456911087036133, "global_step": 299163, "epoch": 3604} {"train_loss": -25.712976455688477, "global_step": 299164, "epoch": 3604} {"train_loss": -25.979856491088867, "global_step": 299165, "epoch": 3604} {"train_loss": -25.87567710876465, "global_step": 299166, "epoch": 3604} {"train_loss": -25.609601974487305, "global_step": 299167, "epoch": 3604} {"train_loss": -25.605825424194336, "global_step": 299168, "epoch": 3604} {"train_loss": -26.088409423828125, "global_step": 299169, "epoch": 3604} {"train_loss": -25.79755973815918, "global_step": 299170, "epoch": 3604} {"train_loss": -25.6094970703125, "global_step": 299171, "epoch": 3604} {"train_loss": -25.7600154876709, "global_step": 299172, "epoch": 3604} {"train_loss": -25.459388732910156, "global_step": 299173, "epoch": 3604} {"train_loss": -25.821043014526367, "global_step": 299174, "epoch": 3604} {"train_loss": -25.783761978149414, "global_step": 299175, "epoch": 3604} {"train_loss": -25.843469619750977, "global_step": 299176, "epoch": 3604} {"train_loss": -25.64374351501465, "global_step": 299177, "epoch": 3604} {"train_loss": -25.607513427734375, "global_step": 299178, "epoch": 3604} {"train_loss": -25.744434356689453, "global_step": 299179, "epoch": 3604} {"train_loss": -25.543010711669922, "global_step": 299180, "epoch": 3604} {"train_loss": -25.743345260620117, "global_step": 299181, "epoch": 3604} {"train_loss": -25.26626968383789, "global_step": 299182, "epoch": 3604} {"train_loss": -25.465240478515625, "global_step": 299183, "epoch": 3604} {"train_loss": -24.982290267944336, "global_step": 299184, "epoch": 3604} {"train_loss": -24.209653854370117, "global_step": 299185, "epoch": 3604} {"train_loss": -24.526527404785156, "global_step": 299186, "epoch": 3604} {"train_loss": -25.880462646484375, "global_step": 299187, "epoch": 3604} {"train_loss": -24.92103385925293, "global_step": 299188, "epoch": 3604} {"train_loss": -25.141647338867188, "global_step": 299189, "epoch": 3604} {"train_loss": -25.2996826171875, "global_step": 299190, "epoch": 3604} {"train_loss": -24.903076171875, "global_step": 299191, "epoch": 3604} {"train_loss": -25.37289810180664, "global_step": 299192, "epoch": 3604} {"train_loss": -25.259431838989258, "global_step": 299193, "epoch": 3604} {"train_loss": -25.353017807006836, "global_step": 299194, "epoch": 3604} {"train_loss": -25.643924713134766, "global_step": 299195, "epoch": 3604} {"train_loss": -25.232059478759766, "global_step": 299196, "epoch": 3604} {"train_loss": -25.585262298583984, "global_step": 299197, "epoch": 3604} {"train_loss": -25.427059173583984, "global_step": 299198, "epoch": 3604} {"train_loss": -25.311967849731445, "global_step": 299199, "epoch": 3604} {"train_loss": -25.87681007385254, "global_step": 299200, "epoch": 3604} {"train_loss": -25.50585174560547, "global_step": 299201, "epoch": 3604} {"train_loss": -25.55641746520996, "global_step": 299202, "epoch": 3604} {"train_loss": -25.532896041870117, "global_step": 299203, "epoch": 3604} {"train_loss": -25.7232723236084, "global_step": 299204, "epoch": 3604} {"train_loss": -25.64265251159668, "global_step": 299205, "epoch": 3604} {"train_loss": -26.051584243774414, "global_step": 299206, "epoch": 3604} {"train_loss": -25.700794219970703, "global_step": 299207, "epoch": 3604} {"train_loss": -25.609455108642578, "global_step": 299208, "epoch": 3604} {"train_loss": -25.694721221923828, "global_step": 299209, "epoch": 3604} {"train_loss": -25.82781410217285, "global_step": 299210, "epoch": 3604} {"train_loss": -25.294361114501953, "global_step": 299211, "epoch": 3604} {"train_loss": -25.800140380859375, "global_step": 299212, "epoch": 3604} {"train_loss": -25.658222198486328, "global_step": 299213, "epoch": 3604} {"train_loss": -25.49385459164539, "global_step": 299214, "epoch": 3604, "val_loss": 7109950.0} {"train_loss": -24.813282012939453, "global_step": 299215, "epoch": 3605} {"train_loss": -24.96516227722168, "global_step": 299216, "epoch": 3605} {"train_loss": -24.933317184448242, "global_step": 299217, "epoch": 3605} {"train_loss": -25.131418228149414, "global_step": 299218, "epoch": 3605} {"train_loss": -24.856054306030273, "global_step": 299219, "epoch": 3605} {"train_loss": -25.316055297851562, "global_step": 299220, "epoch": 3605} {"train_loss": -25.16921043395996, "global_step": 299221, "epoch": 3605} {"train_loss": -24.906892776489258, "global_step": 299222, "epoch": 3605} {"train_loss": -25.305286407470703, "global_step": 299223, "epoch": 3605} {"train_loss": -25.04526710510254, "global_step": 299224, "epoch": 3605} {"train_loss": -25.200654983520508, "global_step": 299225, "epoch": 3605} {"train_loss": -24.795820236206055, "global_step": 299226, "epoch": 3605} {"train_loss": -25.107934951782227, "global_step": 299227, "epoch": 3605} {"train_loss": -25.208057403564453, "global_step": 299228, "epoch": 3605} {"train_loss": -25.41678237915039, "global_step": 299229, "epoch": 3605} {"train_loss": -25.59889030456543, "global_step": 299230, "epoch": 3605} {"train_loss": -25.526151657104492, "global_step": 299231, "epoch": 3605} {"train_loss": -25.034608840942383, "global_step": 299232, "epoch": 3605} {"train_loss": -25.17841911315918, "global_step": 299233, "epoch": 3605} {"train_loss": -25.139623641967773, "global_step": 299234, "epoch": 3605} {"train_loss": -25.291091918945312, "global_step": 299235, "epoch": 3605} {"train_loss": -25.464080810546875, "global_step": 299236, "epoch": 3605} {"train_loss": -25.699115753173828, "global_step": 299237, "epoch": 3605} {"train_loss": -25.57998275756836, "global_step": 299238, "epoch": 3605} {"train_loss": -25.402040481567383, "global_step": 299239, "epoch": 3605} {"train_loss": -25.76495933532715, "global_step": 299240, "epoch": 3605} {"train_loss": -25.727930068969727, "global_step": 299241, "epoch": 3605} {"train_loss": -25.4910888671875, "global_step": 299242, "epoch": 3605} {"train_loss": -25.904691696166992, "global_step": 299243, "epoch": 3605} {"train_loss": -25.720746994018555, "global_step": 299244, "epoch": 3605} {"train_loss": -25.72141456604004, "global_step": 299245, "epoch": 3605} {"train_loss": -25.59510612487793, "global_step": 299246, "epoch": 3605} {"train_loss": -25.697528839111328, "global_step": 299247, "epoch": 3605} {"train_loss": -25.78496742248535, "global_step": 299248, "epoch": 3605} {"train_loss": -25.46965789794922, "global_step": 299249, "epoch": 3605} {"train_loss": -25.704557418823242, "global_step": 299250, "epoch": 3605} {"train_loss": -25.81313133239746, "global_step": 299251, "epoch": 3605} {"train_loss": -25.861051559448242, "global_step": 299252, "epoch": 3605} {"train_loss": -25.5413875579834, "global_step": 299253, "epoch": 3605} {"train_loss": -25.45893669128418, "global_step": 299254, "epoch": 3605} {"train_loss": -25.857954025268555, "global_step": 299255, "epoch": 3605} {"train_loss": -25.488178253173828, "global_step": 299256, "epoch": 3605} {"train_loss": -25.597848892211914, "global_step": 299257, "epoch": 3605} {"train_loss": -25.059667587280273, "global_step": 299258, "epoch": 3605} {"train_loss": -25.006330490112305, "global_step": 299259, "epoch": 3605} {"train_loss": -25.302221298217773, "global_step": 299260, "epoch": 3605} {"train_loss": -25.292173385620117, "global_step": 299261, "epoch": 3605} {"train_loss": -25.04743194580078, "global_step": 299262, "epoch": 3605} {"train_loss": -25.498380661010742, "global_step": 299263, "epoch": 3605} {"train_loss": -25.7026424407959, "global_step": 299264, "epoch": 3605} {"train_loss": -25.29905128479004, "global_step": 299265, "epoch": 3605} {"train_loss": -25.1780948638916, "global_step": 299266, "epoch": 3605} {"train_loss": -25.485578536987305, "global_step": 299267, "epoch": 3605} {"train_loss": -25.642120361328125, "global_step": 299268, "epoch": 3605} {"train_loss": -25.579126358032227, "global_step": 299269, "epoch": 3605} {"train_loss": -25.487781524658203, "global_step": 299270, "epoch": 3605} {"train_loss": -25.36408805847168, "global_step": 299271, "epoch": 3605} {"train_loss": -25.32560920715332, "global_step": 299272, "epoch": 3605} {"train_loss": -25.60540199279785, "global_step": 299273, "epoch": 3605} {"train_loss": -25.595121383666992, "global_step": 299274, "epoch": 3605} {"train_loss": -25.163795471191406, "global_step": 299275, "epoch": 3605} {"train_loss": -25.469213485717773, "global_step": 299276, "epoch": 3605} {"train_loss": -25.60053825378418, "global_step": 299277, "epoch": 3605} {"train_loss": -25.350950241088867, "global_step": 299278, "epoch": 3605} {"train_loss": -25.64284324645996, "global_step": 299279, "epoch": 3605} {"train_loss": -25.496240615844727, "global_step": 299280, "epoch": 3605} {"train_loss": -25.518075942993164, "global_step": 299281, "epoch": 3605} {"train_loss": -25.16056251525879, "global_step": 299282, "epoch": 3605} {"train_loss": -26.05865478515625, "global_step": 299283, "epoch": 3605} {"train_loss": -25.930017471313477, "global_step": 299284, "epoch": 3605} {"train_loss": -25.44500160217285, "global_step": 299285, "epoch": 3605} {"train_loss": -25.79242515563965, "global_step": 299286, "epoch": 3605} {"train_loss": -25.800048828125, "global_step": 299287, "epoch": 3605} {"train_loss": -25.985218048095703, "global_step": 299288, "epoch": 3605} {"train_loss": -25.6219482421875, "global_step": 299289, "epoch": 3605} {"train_loss": -25.710159301757812, "global_step": 299290, "epoch": 3605} {"train_loss": -25.5573787689209, "global_step": 299291, "epoch": 3605} {"train_loss": -25.962881088256836, "global_step": 299292, "epoch": 3605} {"train_loss": -25.63027000427246, "global_step": 299293, "epoch": 3605} {"train_loss": -25.853626251220703, "global_step": 299294, "epoch": 3605} {"train_loss": -25.91111183166504, "global_step": 299295, "epoch": 3605} {"train_loss": -25.76251792907715, "global_step": 299296, "epoch": 3605} {"train_loss": -25.481849532529534, "global_step": 299297, "epoch": 3605, "val_loss": 7170065.0} {"train_loss": -25.692106246948242, "global_step": 299298, "epoch": 3606} {"train_loss": -25.507396697998047, "global_step": 299299, "epoch": 3606} {"train_loss": -25.39137077331543, "global_step": 299300, "epoch": 3606} {"train_loss": -25.308088302612305, "global_step": 299301, "epoch": 3606} {"train_loss": -25.104434967041016, "global_step": 299302, "epoch": 3606} {"train_loss": -25.21436882019043, "global_step": 299303, "epoch": 3606} {"train_loss": -25.671218872070312, "global_step": 299304, "epoch": 3606} {"train_loss": -25.627979278564453, "global_step": 299305, "epoch": 3606} {"train_loss": -25.720096588134766, "global_step": 299306, "epoch": 3606} {"train_loss": -25.363784790039062, "global_step": 299307, "epoch": 3606} {"train_loss": -25.281064987182617, "global_step": 299308, "epoch": 3606} {"train_loss": -25.26922607421875, "global_step": 299309, "epoch": 3606} {"train_loss": -25.336822509765625, "global_step": 299310, "epoch": 3606} {"train_loss": -25.203237533569336, "global_step": 299311, "epoch": 3606} {"train_loss": -25.022424697875977, "global_step": 299312, "epoch": 3606} {"train_loss": -25.733795166015625, "global_step": 299313, "epoch": 3606} {"train_loss": -25.328672409057617, "global_step": 299314, "epoch": 3606} {"train_loss": -25.534860610961914, "global_step": 299315, "epoch": 3606} {"train_loss": -25.801406860351562, "global_step": 299316, "epoch": 3606} {"train_loss": -25.932586669921875, "global_step": 299317, "epoch": 3606} {"train_loss": -25.338485717773438, "global_step": 299318, "epoch": 3606} {"train_loss": -25.646093368530273, "global_step": 299319, "epoch": 3606} {"train_loss": -25.783308029174805, "global_step": 299320, "epoch": 3606} {"train_loss": -25.587852478027344, "global_step": 299321, "epoch": 3606} {"train_loss": -25.52614402770996, "global_step": 299322, "epoch": 3606} {"train_loss": -25.82074546813965, "global_step": 299323, "epoch": 3606} {"train_loss": -25.59272575378418, "global_step": 299324, "epoch": 3606} {"train_loss": -25.49427604675293, "global_step": 299325, "epoch": 3606} {"train_loss": -25.727285385131836, "global_step": 299326, "epoch": 3606} {"train_loss": -25.607004165649414, "global_step": 299327, "epoch": 3606} {"train_loss": -25.334457397460938, "global_step": 299328, "epoch": 3606} {"train_loss": -25.7319393157959, "global_step": 299329, "epoch": 3606} {"train_loss": -25.615461349487305, "global_step": 299330, "epoch": 3606} {"train_loss": -25.958383560180664, "global_step": 299331, "epoch": 3606} {"train_loss": -25.682790756225586, "global_step": 299332, "epoch": 3606} {"train_loss": -25.315744400024414, "global_step": 299333, "epoch": 3606} {"train_loss": -25.652511596679688, "global_step": 299334, "epoch": 3606} {"train_loss": -25.93098258972168, "global_step": 299335, "epoch": 3606} {"train_loss": -25.7718563079834, "global_step": 299336, "epoch": 3606} {"train_loss": -25.723936080932617, "global_step": 299337, "epoch": 3606} {"train_loss": -26.013158798217773, "global_step": 299338, "epoch": 3606} {"train_loss": -25.438081741333008, "global_step": 299339, "epoch": 3606} {"train_loss": -25.687353134155273, "global_step": 299340, "epoch": 3606} {"train_loss": -25.775236129760742, "global_step": 299341, "epoch": 3606} {"train_loss": -25.7452449798584, "global_step": 299342, "epoch": 3606} {"train_loss": -25.63467788696289, "global_step": 299343, "epoch": 3606} {"train_loss": -25.757471084594727, "global_step": 299344, "epoch": 3606} {"train_loss": -25.89314079284668, "global_step": 299345, "epoch": 3606} {"train_loss": -25.688617706298828, "global_step": 299346, "epoch": 3606} {"train_loss": -25.543624877929688, "global_step": 299347, "epoch": 3606} {"train_loss": -25.401891708374023, "global_step": 299348, "epoch": 3606} {"train_loss": -25.8223934173584, "global_step": 299349, "epoch": 3606} {"train_loss": -25.7883358001709, "global_step": 299350, "epoch": 3606} {"train_loss": -25.588956832885742, "global_step": 299351, "epoch": 3606} {"train_loss": -25.93143653869629, "global_step": 299352, "epoch": 3606} {"train_loss": -25.919397354125977, "global_step": 299353, "epoch": 3606} {"train_loss": -26.025354385375977, "global_step": 299354, "epoch": 3606} {"train_loss": -25.68132972717285, "global_step": 299355, "epoch": 3606} {"train_loss": -25.790729522705078, "global_step": 299356, "epoch": 3606} {"train_loss": -25.823871612548828, "global_step": 299357, "epoch": 3606} {"train_loss": -25.37491798400879, "global_step": 299358, "epoch": 3606} {"train_loss": -25.671417236328125, "global_step": 299359, "epoch": 3606} {"train_loss": -25.047637939453125, "global_step": 299360, "epoch": 3606} {"train_loss": -25.388996124267578, "global_step": 299361, "epoch": 3606} {"train_loss": -25.28362274169922, "global_step": 299362, "epoch": 3606} {"train_loss": -25.608251571655273, "global_step": 299363, "epoch": 3606} {"train_loss": -25.416215896606445, "global_step": 299364, "epoch": 3606} {"train_loss": -25.614013671875, "global_step": 299365, "epoch": 3606} {"train_loss": -25.761144638061523, "global_step": 299366, "epoch": 3606} {"train_loss": -25.936460494995117, "global_step": 299367, "epoch": 3606} {"train_loss": -25.77737808227539, "global_step": 299368, "epoch": 3606} {"train_loss": -25.21352195739746, "global_step": 299369, "epoch": 3606} {"train_loss": -25.83335304260254, "global_step": 299370, "epoch": 3606} {"train_loss": -25.6907958984375, "global_step": 299371, "epoch": 3606} {"train_loss": -25.9263916015625, "global_step": 299372, "epoch": 3606} {"train_loss": -25.54783058166504, "global_step": 299373, "epoch": 3606} {"train_loss": -25.149072647094727, "global_step": 299374, "epoch": 3606} {"train_loss": -25.615217208862305, "global_step": 299375, "epoch": 3606} {"train_loss": -25.60324478149414, "global_step": 299376, "epoch": 3606} {"train_loss": -25.844802856445312, "global_step": 299377, "epoch": 3606} {"train_loss": -25.72330665588379, "global_step": 299378, "epoch": 3606} {"train_loss": -25.532176971435547, "global_step": 299379, "epoch": 3606} {"train_loss": -25.595952229327466, "global_step": 299380, "epoch": 3606, "val_loss": 7234677.0} {"train_loss": -25.337461471557617, "global_step": 299381, "epoch": 3607} {"train_loss": -25.796283721923828, "global_step": 299382, "epoch": 3607} {"train_loss": -25.304636001586914, "global_step": 299383, "epoch": 3607} {"train_loss": -25.24493980407715, "global_step": 299384, "epoch": 3607} {"train_loss": -25.127227783203125, "global_step": 299385, "epoch": 3607} {"train_loss": -25.31990623474121, "global_step": 299386, "epoch": 3607} {"train_loss": -25.187849044799805, "global_step": 299387, "epoch": 3607} {"train_loss": -25.38612937927246, "global_step": 299388, "epoch": 3607} {"train_loss": -25.347497940063477, "global_step": 299389, "epoch": 3607} {"train_loss": -25.26864242553711, "global_step": 299390, "epoch": 3607} {"train_loss": -25.38539695739746, "global_step": 299391, "epoch": 3607} {"train_loss": -25.151620864868164, "global_step": 299392, "epoch": 3607} {"train_loss": -25.611251831054688, "global_step": 299393, "epoch": 3607} {"train_loss": -25.130399703979492, "global_step": 299394, "epoch": 3607} {"train_loss": -26.131484985351562, "global_step": 299395, "epoch": 3607} {"train_loss": -25.70212745666504, "global_step": 299396, "epoch": 3607} {"train_loss": -25.781757354736328, "global_step": 299397, "epoch": 3607} {"train_loss": -25.58173179626465, "global_step": 299398, "epoch": 3607} {"train_loss": -25.630701065063477, "global_step": 299399, "epoch": 3607} {"train_loss": -25.32029914855957, "global_step": 299400, "epoch": 3607} {"train_loss": -25.7718448638916, "global_step": 299401, "epoch": 3607} {"train_loss": -25.637542724609375, "global_step": 299402, "epoch": 3607} {"train_loss": -25.370803833007812, "global_step": 299403, "epoch": 3607} {"train_loss": -25.582860946655273, "global_step": 299404, "epoch": 3607} {"train_loss": -25.819122314453125, "global_step": 299405, "epoch": 3607} {"train_loss": -25.69208335876465, "global_step": 299406, "epoch": 3607} {"train_loss": -25.787982940673828, "global_step": 299407, "epoch": 3607} {"train_loss": -25.59270477294922, "global_step": 299408, "epoch": 3607} {"train_loss": -25.80305290222168, "global_step": 299409, "epoch": 3607} {"train_loss": -25.706989288330078, "global_step": 299410, "epoch": 3607} {"train_loss": -25.762271881103516, "global_step": 299411, "epoch": 3607} {"train_loss": -25.621652603149414, "global_step": 299412, "epoch": 3607} {"train_loss": -25.30452537536621, "global_step": 299413, "epoch": 3607} {"train_loss": -25.77105140686035, "global_step": 299414, "epoch": 3607} {"train_loss": -25.92009925842285, "global_step": 299415, "epoch": 3607} {"train_loss": -25.539487838745117, "global_step": 299416, "epoch": 3607} {"train_loss": -25.33029556274414, "global_step": 299417, "epoch": 3607} {"train_loss": -25.496540069580078, "global_step": 299418, "epoch": 3607} {"train_loss": -25.529924392700195, "global_step": 299419, "epoch": 3607} {"train_loss": -25.744359970092773, "global_step": 299420, "epoch": 3607} {"train_loss": -25.90654945373535, "global_step": 299421, "epoch": 3607} {"train_loss": -25.712915420532227, "global_step": 299422, "epoch": 3607} {"train_loss": -26.069040298461914, "global_step": 299423, "epoch": 3607} {"train_loss": -25.36848258972168, "global_step": 299424, "epoch": 3607} {"train_loss": -25.299972534179688, "global_step": 299425, "epoch": 3607} {"train_loss": -25.682889938354492, "global_step": 299426, "epoch": 3607} {"train_loss": -26.10706901550293, "global_step": 299427, "epoch": 3607} {"train_loss": -25.743057250976562, "global_step": 299428, "epoch": 3607} {"train_loss": -25.93314552307129, "global_step": 299429, "epoch": 3607} {"train_loss": -25.433658599853516, "global_step": 299430, "epoch": 3607} {"train_loss": -25.852828979492188, "global_step": 299431, "epoch": 3607} {"train_loss": -25.621591567993164, "global_step": 299432, "epoch": 3607} {"train_loss": -25.368186950683594, "global_step": 299433, "epoch": 3607} {"train_loss": -25.925825119018555, "global_step": 299434, "epoch": 3607} {"train_loss": -25.8583927154541, "global_step": 299435, "epoch": 3607} {"train_loss": -25.37667465209961, "global_step": 299436, "epoch": 3607} {"train_loss": -25.369871139526367, "global_step": 299437, "epoch": 3607} {"train_loss": -25.31208038330078, "global_step": 299438, "epoch": 3607} {"train_loss": -25.57883644104004, "global_step": 299439, "epoch": 3607} {"train_loss": -25.45343017578125, "global_step": 299440, "epoch": 3607} {"train_loss": -25.559452056884766, "global_step": 299441, "epoch": 3607} {"train_loss": -25.585289001464844, "global_step": 299442, "epoch": 3607} {"train_loss": -25.508468627929688, "global_step": 299443, "epoch": 3607} {"train_loss": -25.211278915405273, "global_step": 299444, "epoch": 3607} {"train_loss": -25.760129928588867, "global_step": 299445, "epoch": 3607} {"train_loss": -25.418941497802734, "global_step": 299446, "epoch": 3607} {"train_loss": -25.429685592651367, "global_step": 299447, "epoch": 3607} {"train_loss": -25.60222816467285, "global_step": 299448, "epoch": 3607} {"train_loss": -25.394880294799805, "global_step": 299449, "epoch": 3607} {"train_loss": -26.01578712463379, "global_step": 299450, "epoch": 3607} {"train_loss": -25.432865142822266, "global_step": 299451, "epoch": 3607} {"train_loss": -25.59443473815918, "global_step": 299452, "epoch": 3607} {"train_loss": -25.393463134765625, "global_step": 299453, "epoch": 3607} {"train_loss": -25.430334091186523, "global_step": 299454, "epoch": 3607} {"train_loss": -25.654138565063477, "global_step": 299455, "epoch": 3607} {"train_loss": -25.481189727783203, "global_step": 299456, "epoch": 3607} {"train_loss": -25.726598739624023, "global_step": 299457, "epoch": 3607} {"train_loss": -25.74592399597168, "global_step": 299458, "epoch": 3607} {"train_loss": -25.91077995300293, "global_step": 299459, "epoch": 3607} {"train_loss": -25.28976821899414, "global_step": 299460, "epoch": 3607} {"train_loss": -25.490514755249023, "global_step": 299461, "epoch": 3607} {"train_loss": -25.34712791442871, "global_step": 299462, "epoch": 3607} {"train_loss": -25.574330548206007, "global_step": 299463, "epoch": 3607, "val_loss": 7141255.0} {"train_loss": -25.169553756713867, "global_step": 299464, "epoch": 3608} {"train_loss": -24.750619888305664, "global_step": 299465, "epoch": 3608} {"train_loss": -24.993499755859375, "global_step": 299466, "epoch": 3608} {"train_loss": -25.26051139831543, "global_step": 299467, "epoch": 3608} {"train_loss": -25.0670166015625, "global_step": 299468, "epoch": 3608} {"train_loss": -24.753074645996094, "global_step": 299469, "epoch": 3608} {"train_loss": -25.3591251373291, "global_step": 299470, "epoch": 3608} {"train_loss": -25.192724227905273, "global_step": 299471, "epoch": 3608} {"train_loss": -25.323945999145508, "global_step": 299472, "epoch": 3608} {"train_loss": -25.397422790527344, "global_step": 299473, "epoch": 3608} {"train_loss": -25.197885513305664, "global_step": 299474, "epoch": 3608} {"train_loss": -25.120580673217773, "global_step": 299475, "epoch": 3608} {"train_loss": -25.81209373474121, "global_step": 299476, "epoch": 3608} {"train_loss": -25.62933349609375, "global_step": 299477, "epoch": 3608} {"train_loss": -25.21883201599121, "global_step": 299478, "epoch": 3608} {"train_loss": -25.329647064208984, "global_step": 299479, "epoch": 3608} {"train_loss": -25.21974754333496, "global_step": 299480, "epoch": 3608} {"train_loss": -26.109731674194336, "global_step": 299481, "epoch": 3608} {"train_loss": -25.737924575805664, "global_step": 299482, "epoch": 3608} {"train_loss": -25.317068099975586, "global_step": 299483, "epoch": 3608} {"train_loss": -25.51106071472168, "global_step": 299484, "epoch": 3608} {"train_loss": -25.43134117126465, "global_step": 299485, "epoch": 3608} {"train_loss": -25.22573471069336, "global_step": 299486, "epoch": 3608} {"train_loss": -25.857999801635742, "global_step": 299487, "epoch": 3608} {"train_loss": -25.43585777282715, "global_step": 299488, "epoch": 3608} {"train_loss": -25.734237670898438, "global_step": 299489, "epoch": 3608} {"train_loss": -25.6046142578125, "global_step": 299490, "epoch": 3608} {"train_loss": -25.186017990112305, "global_step": 299491, "epoch": 3608} {"train_loss": -25.76873779296875, "global_step": 299492, "epoch": 3608} {"train_loss": -25.501493453979492, "global_step": 299493, "epoch": 3608} {"train_loss": -25.589313507080078, "global_step": 299494, "epoch": 3608} {"train_loss": -25.14451026916504, "global_step": 299495, "epoch": 3608} {"train_loss": -25.75652503967285, "global_step": 299496, "epoch": 3608} {"train_loss": -25.633115768432617, "global_step": 299497, "epoch": 3608} {"train_loss": -25.651159286499023, "global_step": 299498, "epoch": 3608} {"train_loss": -25.421842575073242, "global_step": 299499, "epoch": 3608} {"train_loss": -25.862173080444336, "global_step": 299500, "epoch": 3608} {"train_loss": -25.79180335998535, "global_step": 299501, "epoch": 3608} {"train_loss": -25.645780563354492, "global_step": 299502, "epoch": 3608} {"train_loss": -25.637388229370117, "global_step": 299503, "epoch": 3608} {"train_loss": -25.575292587280273, "global_step": 299504, "epoch": 3608} {"train_loss": -25.491392135620117, "global_step": 299505, "epoch": 3608} {"train_loss": -25.680822372436523, "global_step": 299506, "epoch": 3608} {"train_loss": -25.425308227539062, "global_step": 299507, "epoch": 3608} {"train_loss": -25.87200927734375, "global_step": 299508, "epoch": 3608} {"train_loss": -25.4700870513916, "global_step": 299509, "epoch": 3608} {"train_loss": -26.035419464111328, "global_step": 299510, "epoch": 3608} {"train_loss": -25.81348991394043, "global_step": 299511, "epoch": 3608} {"train_loss": -25.92652702331543, "global_step": 299512, "epoch": 3608} {"train_loss": -25.850162506103516, "global_step": 299513, "epoch": 3608} {"train_loss": -25.560758590698242, "global_step": 299514, "epoch": 3608} {"train_loss": -25.519392013549805, "global_step": 299515, "epoch": 3608} {"train_loss": -25.440818786621094, "global_step": 299516, "epoch": 3608} {"train_loss": -25.576566696166992, "global_step": 299517, "epoch": 3608} {"train_loss": -25.759851455688477, "global_step": 299518, "epoch": 3608} {"train_loss": -26.034809112548828, "global_step": 299519, "epoch": 3608} {"train_loss": -26.05877685546875, "global_step": 299520, "epoch": 3608} {"train_loss": -25.7672176361084, "global_step": 299521, "epoch": 3608} {"train_loss": -26.26114845275879, "global_step": 299522, "epoch": 3608} {"train_loss": -25.520721435546875, "global_step": 299523, "epoch": 3608} {"train_loss": -25.939971923828125, "global_step": 299524, "epoch": 3608} {"train_loss": -25.580162048339844, "global_step": 299525, "epoch": 3608} {"train_loss": -25.680410385131836, "global_step": 299526, "epoch": 3608} {"train_loss": -25.00762367248535, "global_step": 299527, "epoch": 3608} {"train_loss": -24.985185623168945, "global_step": 299528, "epoch": 3608} {"train_loss": -24.969388961791992, "global_step": 299529, "epoch": 3608} {"train_loss": -25.058103561401367, "global_step": 299530, "epoch": 3608} {"train_loss": -25.735288619995117, "global_step": 299531, "epoch": 3608} {"train_loss": -25.50090980529785, "global_step": 299532, "epoch": 3608} {"train_loss": -25.70025634765625, "global_step": 299533, "epoch": 3608} {"train_loss": -25.74957275390625, "global_step": 299534, "epoch": 3608} {"train_loss": -25.593303680419922, "global_step": 299535, "epoch": 3608} {"train_loss": -25.7493839263916, "global_step": 299536, "epoch": 3608} {"train_loss": -25.532852172851562, "global_step": 299537, "epoch": 3608} {"train_loss": -25.291296005249023, "global_step": 299538, "epoch": 3608} {"train_loss": -25.711761474609375, "global_step": 299539, "epoch": 3608} {"train_loss": -25.86957359313965, "global_step": 299540, "epoch": 3608} {"train_loss": -25.41316032409668, "global_step": 299541, "epoch": 3608} {"train_loss": -25.30421257019043, "global_step": 299542, "epoch": 3608} {"train_loss": -25.525020599365234, "global_step": 299543, "epoch": 3608} {"train_loss": -25.16545295715332, "global_step": 299544, "epoch": 3608} {"train_loss": -25.691608428955078, "global_step": 299545, "epoch": 3608} {"train_loss": -25.53116609964026, "global_step": 299546, "epoch": 3608, "val_loss": 7263428.0} {"train_loss": -25.100479125976562, "global_step": 299547, "epoch": 3609} {"train_loss": -24.84272003173828, "global_step": 299548, "epoch": 3609} {"train_loss": -24.573625564575195, "global_step": 299549, "epoch": 3609} {"train_loss": -25.02546501159668, "global_step": 299550, "epoch": 3609} {"train_loss": -25.066694259643555, "global_step": 299551, "epoch": 3609} {"train_loss": -24.88693618774414, "global_step": 299552, "epoch": 3609} {"train_loss": -24.882070541381836, "global_step": 299553, "epoch": 3609} {"train_loss": -25.11343765258789, "global_step": 299554, "epoch": 3609} {"train_loss": -25.524702072143555, "global_step": 299555, "epoch": 3609} {"train_loss": -25.25795555114746, "global_step": 299556, "epoch": 3609} {"train_loss": -25.31639289855957, "global_step": 299557, "epoch": 3609} {"train_loss": -24.988698959350586, "global_step": 299558, "epoch": 3609} {"train_loss": -25.196252822875977, "global_step": 299559, "epoch": 3609} {"train_loss": -25.30899429321289, "global_step": 299560, "epoch": 3609} {"train_loss": -25.516666412353516, "global_step": 299561, "epoch": 3609} {"train_loss": -25.146564483642578, "global_step": 299562, "epoch": 3609} {"train_loss": -25.197345733642578, "global_step": 299563, "epoch": 3609} {"train_loss": -25.281814575195312, "global_step": 299564, "epoch": 3609} {"train_loss": -25.337635040283203, "global_step": 299565, "epoch": 3609} {"train_loss": -25.39274024963379, "global_step": 299566, "epoch": 3609} {"train_loss": -25.396669387817383, "global_step": 299567, "epoch": 3609} {"train_loss": -25.30354118347168, "global_step": 299568, "epoch": 3609} {"train_loss": -25.735288619995117, "global_step": 299569, "epoch": 3609} {"train_loss": -25.776594161987305, "global_step": 299570, "epoch": 3609} {"train_loss": -25.328603744506836, "global_step": 299571, "epoch": 3609} {"train_loss": -25.7171630859375, "global_step": 299572, "epoch": 3609} {"train_loss": -25.707361221313477, "global_step": 299573, "epoch": 3609} {"train_loss": -25.83709716796875, "global_step": 299574, "epoch": 3609} {"train_loss": -25.9810791015625, "global_step": 299575, "epoch": 3609} {"train_loss": -25.833404541015625, "global_step": 299576, "epoch": 3609} {"train_loss": -26.0481014251709, "global_step": 299577, "epoch": 3609} {"train_loss": -25.702489852905273, "global_step": 299578, "epoch": 3609} {"train_loss": -25.737680435180664, "global_step": 299579, "epoch": 3609} {"train_loss": -25.872678756713867, "global_step": 299580, "epoch": 3609} {"train_loss": -25.84476089477539, "global_step": 299581, "epoch": 3609} {"train_loss": -25.671619415283203, "global_step": 299582, "epoch": 3609} {"train_loss": -25.878894805908203, "global_step": 299583, "epoch": 3609} {"train_loss": -25.894479751586914, "global_step": 299584, "epoch": 3609} {"train_loss": -25.60858154296875, "global_step": 299585, "epoch": 3609} {"train_loss": -25.7523136138916, "global_step": 299586, "epoch": 3609} {"train_loss": -25.810922622680664, "global_step": 299587, "epoch": 3609} {"train_loss": -25.756027221679688, "global_step": 299588, "epoch": 3609} {"train_loss": -25.830219268798828, "global_step": 299589, "epoch": 3609} {"train_loss": -25.415237426757812, "global_step": 299590, "epoch": 3609} {"train_loss": -25.999353408813477, "global_step": 299591, "epoch": 3609} {"train_loss": -25.826801300048828, "global_step": 299592, "epoch": 3609} {"train_loss": -25.717639923095703, "global_step": 299593, "epoch": 3609} {"train_loss": -25.595958709716797, "global_step": 299594, "epoch": 3609} {"train_loss": -25.721471786499023, "global_step": 299595, "epoch": 3609} {"train_loss": -25.821014404296875, "global_step": 299596, "epoch": 3609} {"train_loss": -25.727619171142578, "global_step": 299597, "epoch": 3609} {"train_loss": -25.399633407592773, "global_step": 299598, "epoch": 3609} {"train_loss": -25.669355392456055, "global_step": 299599, "epoch": 3609} {"train_loss": -25.05910301208496, "global_step": 299600, "epoch": 3609} {"train_loss": -24.8409481048584, "global_step": 299601, "epoch": 3609} {"train_loss": -24.642101287841797, "global_step": 299602, "epoch": 3609} {"train_loss": -24.85860824584961, "global_step": 299603, "epoch": 3609} {"train_loss": -25.354162216186523, "global_step": 299604, "epoch": 3609} {"train_loss": -25.63462257385254, "global_step": 299605, "epoch": 3609} {"train_loss": -25.277402877807617, "global_step": 299606, "epoch": 3609} {"train_loss": -25.411012649536133, "global_step": 299607, "epoch": 3609} {"train_loss": -25.12399673461914, "global_step": 299608, "epoch": 3609} {"train_loss": -25.425321578979492, "global_step": 299609, "epoch": 3609} {"train_loss": -25.246530532836914, "global_step": 299610, "epoch": 3609} {"train_loss": -25.23787498474121, "global_step": 299611, "epoch": 3609} {"train_loss": -25.516599655151367, "global_step": 299612, "epoch": 3609} {"train_loss": -25.660186767578125, "global_step": 299613, "epoch": 3609} {"train_loss": -25.44972801208496, "global_step": 299614, "epoch": 3609} {"train_loss": -25.326704025268555, "global_step": 299615, "epoch": 3609} {"train_loss": -25.539762496948242, "global_step": 299616, "epoch": 3609} {"train_loss": -25.542356491088867, "global_step": 299617, "epoch": 3609} {"train_loss": -25.756378173828125, "global_step": 299618, "epoch": 3609} {"train_loss": -25.431888580322266, "global_step": 299619, "epoch": 3609} {"train_loss": -25.777099609375, "global_step": 299620, "epoch": 3609} {"train_loss": -25.40448570251465, "global_step": 299621, "epoch": 3609} {"train_loss": -25.503990173339844, "global_step": 299622, "epoch": 3609} {"train_loss": -25.707962036132812, "global_step": 299623, "epoch": 3609} {"train_loss": -25.408048629760742, "global_step": 299624, "epoch": 3609} {"train_loss": -25.495033264160156, "global_step": 299625, "epoch": 3609} {"train_loss": -25.251188278198242, "global_step": 299626, "epoch": 3609} {"train_loss": -25.6605224609375, "global_step": 299627, "epoch": 3609} {"train_loss": -25.85481071472168, "global_step": 299628, "epoch": 3609} {"train_loss": -25.463570859058795, "global_step": 299629, "epoch": 3609, "val_loss": 7129990.5} {"train_loss": -25.36897087097168, "global_step": 299630, "epoch": 3610} {"train_loss": -25.677988052368164, "global_step": 299631, "epoch": 3610} {"train_loss": -25.941980361938477, "global_step": 299632, "epoch": 3610} {"train_loss": -25.59657096862793, "global_step": 299633, "epoch": 3610} {"train_loss": -25.37242317199707, "global_step": 299634, "epoch": 3610} {"train_loss": -25.39387321472168, "global_step": 299635, "epoch": 3610} {"train_loss": -25.048891067504883, "global_step": 299636, "epoch": 3610} {"train_loss": -25.63813591003418, "global_step": 299637, "epoch": 3610} {"train_loss": -25.301469802856445, "global_step": 299638, "epoch": 3610} {"train_loss": -25.261545181274414, "global_step": 299639, "epoch": 3610} {"train_loss": -25.366941452026367, "global_step": 299640, "epoch": 3610} {"train_loss": -25.395559310913086, "global_step": 299641, "epoch": 3610} {"train_loss": -25.45362663269043, "global_step": 299642, "epoch": 3610} {"train_loss": -25.519603729248047, "global_step": 299643, "epoch": 3610} {"train_loss": -25.323415756225586, "global_step": 299644, "epoch": 3610} {"train_loss": -26.330015182495117, "global_step": 299645, "epoch": 3610} {"train_loss": -25.636579513549805, "global_step": 299646, "epoch": 3610} {"train_loss": -25.391992568969727, "global_step": 299647, "epoch": 3610} {"train_loss": -25.183515548706055, "global_step": 299648, "epoch": 3610} {"train_loss": -25.319351196289062, "global_step": 299649, "epoch": 3610} {"train_loss": -25.561939239501953, "global_step": 299650, "epoch": 3610} {"train_loss": -25.553207397460938, "global_step": 299651, "epoch": 3610} {"train_loss": -25.6966609954834, "global_step": 299652, "epoch": 3610} {"train_loss": -25.7126522064209, "global_step": 299653, "epoch": 3610} {"train_loss": -25.68092918395996, "global_step": 299654, "epoch": 3610} {"train_loss": -25.869314193725586, "global_step": 299655, "epoch": 3610} {"train_loss": -25.7318115234375, "global_step": 299656, "epoch": 3610} {"train_loss": -25.294296264648438, "global_step": 299657, "epoch": 3610} {"train_loss": -25.446048736572266, "global_step": 299658, "epoch": 3610} {"train_loss": -25.578149795532227, "global_step": 299659, "epoch": 3610} {"train_loss": -25.65390968322754, "global_step": 299660, "epoch": 3610} {"train_loss": -25.829675674438477, "global_step": 299661, "epoch": 3610} {"train_loss": -25.58757209777832, "global_step": 299662, "epoch": 3610} {"train_loss": -25.600671768188477, "global_step": 299663, "epoch": 3610} {"train_loss": -25.459808349609375, "global_step": 299664, "epoch": 3610} {"train_loss": -25.74078369140625, "global_step": 299665, "epoch": 3610} {"train_loss": -25.55689811706543, "global_step": 299666, "epoch": 3610} {"train_loss": -25.31252098083496, "global_step": 299667, "epoch": 3610} {"train_loss": -25.717864990234375, "global_step": 299668, "epoch": 3610} {"train_loss": -25.87070655822754, "global_step": 299669, "epoch": 3610} {"train_loss": -26.06685447692871, "global_step": 299670, "epoch": 3610} {"train_loss": -25.536481857299805, "global_step": 299671, "epoch": 3610} {"train_loss": -25.573047637939453, "global_step": 299672, "epoch": 3610} {"train_loss": -25.931882858276367, "global_step": 299673, "epoch": 3610} {"train_loss": -25.808408737182617, "global_step": 299674, "epoch": 3610} {"train_loss": -25.055999755859375, "global_step": 299675, "epoch": 3610} {"train_loss": -25.20461082458496, "global_step": 299676, "epoch": 3610} {"train_loss": -25.779829025268555, "global_step": 299677, "epoch": 3610} {"train_loss": -25.4329891204834, "global_step": 299678, "epoch": 3610} {"train_loss": -25.5156307220459, "global_step": 299679, "epoch": 3610} {"train_loss": -25.23690414428711, "global_step": 299680, "epoch": 3610} {"train_loss": -25.792560577392578, "global_step": 299681, "epoch": 3610} {"train_loss": -25.591014862060547, "global_step": 299682, "epoch": 3610} {"train_loss": -25.317392349243164, "global_step": 299683, "epoch": 3610} {"train_loss": -25.716541290283203, "global_step": 299684, "epoch": 3610} {"train_loss": -25.6334228515625, "global_step": 299685, "epoch": 3610} {"train_loss": -25.575626373291016, "global_step": 299686, "epoch": 3610} {"train_loss": -26.034910202026367, "global_step": 299687, "epoch": 3610} {"train_loss": -25.43147850036621, "global_step": 299688, "epoch": 3610} {"train_loss": -25.35951805114746, "global_step": 299689, "epoch": 3610} {"train_loss": -25.6086368560791, "global_step": 299690, "epoch": 3610} {"train_loss": -25.78985595703125, "global_step": 299691, "epoch": 3610} {"train_loss": -25.350217819213867, "global_step": 299692, "epoch": 3610} {"train_loss": -25.339923858642578, "global_step": 299693, "epoch": 3610} {"train_loss": -25.53226661682129, "global_step": 299694, "epoch": 3610} {"train_loss": -25.709304809570312, "global_step": 299695, "epoch": 3610} {"train_loss": -25.829547882080078, "global_step": 299696, "epoch": 3610} {"train_loss": -25.272022247314453, "global_step": 299697, "epoch": 3610} {"train_loss": -25.791919708251953, "global_step": 299698, "epoch": 3610} {"train_loss": -25.975637435913086, "global_step": 299699, "epoch": 3610} {"train_loss": -25.76654624938965, "global_step": 299700, "epoch": 3610} {"train_loss": -25.597253799438477, "global_step": 299701, "epoch": 3610} {"train_loss": -25.446420669555664, "global_step": 299702, "epoch": 3610} {"train_loss": -25.363536834716797, "global_step": 299703, "epoch": 3610} {"train_loss": -25.5738468170166, "global_step": 299704, "epoch": 3610} {"train_loss": -25.93031883239746, "global_step": 299705, "epoch": 3610} {"train_loss": -25.6456298828125, "global_step": 299706, "epoch": 3610} {"train_loss": -25.760766983032227, "global_step": 299707, "epoch": 3610} {"train_loss": -25.384685516357422, "global_step": 299708, "epoch": 3610} {"train_loss": -25.9615421295166, "global_step": 299709, "epoch": 3610} {"train_loss": -25.7175235748291, "global_step": 299710, "epoch": 3610} {"train_loss": -25.967609405517578, "global_step": 299711, "epoch": 3610} {"train_loss": -25.59509203807417, "global_step": 299712, "epoch": 3610, "val_loss": 7287057.0} {"train_loss": -25.720264434814453, "global_step": 299713, "epoch": 3611} {"train_loss": -25.642892837524414, "global_step": 299714, "epoch": 3611} {"train_loss": -25.80483055114746, "global_step": 299715, "epoch": 3611} {"train_loss": -25.63326072692871, "global_step": 299716, "epoch": 3611} {"train_loss": -25.8736572265625, "global_step": 299717, "epoch": 3611} {"train_loss": -25.77320671081543, "global_step": 299718, "epoch": 3611} {"train_loss": -25.78325843811035, "global_step": 299719, "epoch": 3611} {"train_loss": -25.616790771484375, "global_step": 299720, "epoch": 3611} {"train_loss": -25.651336669921875, "global_step": 299721, "epoch": 3611} {"train_loss": -25.157535552978516, "global_step": 299722, "epoch": 3611} {"train_loss": -25.590877532958984, "global_step": 299723, "epoch": 3611} {"train_loss": -25.48491668701172, "global_step": 299724, "epoch": 3611} {"train_loss": -25.652008056640625, "global_step": 299725, "epoch": 3611} {"train_loss": -25.787128448486328, "global_step": 299726, "epoch": 3611} {"train_loss": -25.68842887878418, "global_step": 299727, "epoch": 3611} {"train_loss": -25.655927658081055, "global_step": 299728, "epoch": 3611} {"train_loss": -25.571491241455078, "global_step": 299729, "epoch": 3611} {"train_loss": -25.301916122436523, "global_step": 299730, "epoch": 3611} {"train_loss": -25.569808959960938, "global_step": 299731, "epoch": 3611} {"train_loss": -25.72653579711914, "global_step": 299732, "epoch": 3611} {"train_loss": -25.433691024780273, "global_step": 299733, "epoch": 3611} {"train_loss": -25.22267723083496, "global_step": 299734, "epoch": 3611} {"train_loss": -25.58426284790039, "global_step": 299735, "epoch": 3611} {"train_loss": -25.48811149597168, "global_step": 299736, "epoch": 3611} {"train_loss": -25.45180892944336, "global_step": 299737, "epoch": 3611} {"train_loss": -25.626401901245117, "global_step": 299738, "epoch": 3611} {"train_loss": -25.60761070251465, "global_step": 299739, "epoch": 3611} {"train_loss": -25.7845401763916, "global_step": 299740, "epoch": 3611} {"train_loss": -25.239242553710938, "global_step": 299741, "epoch": 3611} {"train_loss": -25.157367706298828, "global_step": 299742, "epoch": 3611} {"train_loss": -25.500064849853516, "global_step": 299743, "epoch": 3611} {"train_loss": -25.459278106689453, "global_step": 299744, "epoch": 3611} {"train_loss": -25.447240829467773, "global_step": 299745, "epoch": 3611} {"train_loss": -25.265058517456055, "global_step": 299746, "epoch": 3611} {"train_loss": -25.046142578125, "global_step": 299747, "epoch": 3611} {"train_loss": -25.19463348388672, "global_step": 299748, "epoch": 3611} {"train_loss": -25.78314208984375, "global_step": 299749, "epoch": 3611} {"train_loss": -25.475961685180664, "global_step": 299750, "epoch": 3611} {"train_loss": -25.44375991821289, "global_step": 299751, "epoch": 3611} {"train_loss": -25.5875186920166, "global_step": 299752, "epoch": 3611} {"train_loss": -25.49725914001465, "global_step": 299753, "epoch": 3611} {"train_loss": -25.282697677612305, "global_step": 299754, "epoch": 3611} {"train_loss": -25.42932891845703, "global_step": 299755, "epoch": 3611} {"train_loss": -25.791187286376953, "global_step": 299756, "epoch": 3611} {"train_loss": -25.82741355895996, "global_step": 299757, "epoch": 3611} {"train_loss": -25.90067481994629, "global_step": 299758, "epoch": 3611} {"train_loss": -25.508190155029297, "global_step": 299759, "epoch": 3611} {"train_loss": -25.365278244018555, "global_step": 299760, "epoch": 3611} {"train_loss": -25.45674705505371, "global_step": 299761, "epoch": 3611} {"train_loss": -25.606664657592773, "global_step": 299762, "epoch": 3611} {"train_loss": -25.80743980407715, "global_step": 299763, "epoch": 3611} {"train_loss": -25.78346061706543, "global_step": 299764, "epoch": 3611} {"train_loss": -25.73085594177246, "global_step": 299765, "epoch": 3611} {"train_loss": -25.772504806518555, "global_step": 299766, "epoch": 3611} {"train_loss": -25.84039878845215, "global_step": 299767, "epoch": 3611} {"train_loss": -26.088281631469727, "global_step": 299768, "epoch": 3611} {"train_loss": -25.678680419921875, "global_step": 299769, "epoch": 3611} {"train_loss": -25.785186767578125, "global_step": 299770, "epoch": 3611} {"train_loss": -25.73421287536621, "global_step": 299771, "epoch": 3611} {"train_loss": -26.06910514831543, "global_step": 299772, "epoch": 3611} {"train_loss": -25.55387306213379, "global_step": 299773, "epoch": 3611} {"train_loss": -25.548154830932617, "global_step": 299774, "epoch": 3611} {"train_loss": -25.95419692993164, "global_step": 299775, "epoch": 3611} {"train_loss": -25.799270629882812, "global_step": 299776, "epoch": 3611} {"train_loss": -25.887632369995117, "global_step": 299777, "epoch": 3611} {"train_loss": -25.802448272705078, "global_step": 299778, "epoch": 3611} {"train_loss": -25.661645889282227, "global_step": 299779, "epoch": 3611} {"train_loss": -25.491912841796875, "global_step": 299780, "epoch": 3611} {"train_loss": -25.651941299438477, "global_step": 299781, "epoch": 3611} {"train_loss": -25.740121841430664, "global_step": 299782, "epoch": 3611} {"train_loss": -25.49880027770996, "global_step": 299783, "epoch": 3611} {"train_loss": -25.91116714477539, "global_step": 299784, "epoch": 3611} {"train_loss": -25.732284545898438, "global_step": 299785, "epoch": 3611} {"train_loss": -25.450895309448242, "global_step": 299786, "epoch": 3611} {"train_loss": -25.00092315673828, "global_step": 299787, "epoch": 3611} {"train_loss": -25.542268753051758, "global_step": 299788, "epoch": 3611} {"train_loss": -25.70947265625, "global_step": 299789, "epoch": 3611} {"train_loss": -25.704547882080078, "global_step": 299790, "epoch": 3611} {"train_loss": -25.6130428314209, "global_step": 299791, "epoch": 3611} {"train_loss": -25.41395378112793, "global_step": 299792, "epoch": 3611} {"train_loss": -25.152297973632812, "global_step": 299793, "epoch": 3611} {"train_loss": -25.346466064453125, "global_step": 299794, "epoch": 3611} {"train_loss": -25.609732938100056, "global_step": 299795, "epoch": 3611, "val_loss": 7234859.0} {"train_loss": -24.797317504882812, "global_step": 299796, "epoch": 3612} {"train_loss": -24.78048324584961, "global_step": 299797, "epoch": 3612} {"train_loss": -25.080127716064453, "global_step": 299798, "epoch": 3612} {"train_loss": -24.970239639282227, "global_step": 299799, "epoch": 3612} {"train_loss": -25.008527755737305, "global_step": 299800, "epoch": 3612} {"train_loss": -25.06138038635254, "global_step": 299801, "epoch": 3612} {"train_loss": -24.850906372070312, "global_step": 299802, "epoch": 3612} {"train_loss": -25.30634117126465, "global_step": 299803, "epoch": 3612} {"train_loss": -25.119871139526367, "global_step": 299804, "epoch": 3612} {"train_loss": -25.188007354736328, "global_step": 299805, "epoch": 3612} {"train_loss": -25.339521408081055, "global_step": 299806, "epoch": 3612} {"train_loss": -25.357040405273438, "global_step": 299807, "epoch": 3612} {"train_loss": -25.62885093688965, "global_step": 299808, "epoch": 3612} {"train_loss": -25.12660789489746, "global_step": 299809, "epoch": 3612} {"train_loss": -25.511632919311523, "global_step": 299810, "epoch": 3612} {"train_loss": -25.50400161743164, "global_step": 299811, "epoch": 3612} {"train_loss": -25.571853637695312, "global_step": 299812, "epoch": 3612} {"train_loss": -25.4479923248291, "global_step": 299813, "epoch": 3612} {"train_loss": -25.357131958007812, "global_step": 299814, "epoch": 3612} {"train_loss": -25.6490535736084, "global_step": 299815, "epoch": 3612} {"train_loss": -25.442537307739258, "global_step": 299816, "epoch": 3612} {"train_loss": -25.942047119140625, "global_step": 299817, "epoch": 3612} {"train_loss": -25.67591667175293, "global_step": 299818, "epoch": 3612} {"train_loss": -25.296186447143555, "global_step": 299819, "epoch": 3612} {"train_loss": -25.51193618774414, "global_step": 299820, "epoch": 3612} {"train_loss": -25.8648681640625, "global_step": 299821, "epoch": 3612} {"train_loss": -25.743635177612305, "global_step": 299822, "epoch": 3612} {"train_loss": -25.54901695251465, "global_step": 299823, "epoch": 3612} {"train_loss": -26.2156925201416, "global_step": 299824, "epoch": 3612} {"train_loss": -25.81854248046875, "global_step": 299825, "epoch": 3612} {"train_loss": -26.010969161987305, "global_step": 299826, "epoch": 3612} {"train_loss": -25.8298282623291, "global_step": 299827, "epoch": 3612} {"train_loss": -25.671478271484375, "global_step": 299828, "epoch": 3612} {"train_loss": -25.771839141845703, "global_step": 299829, "epoch": 3612} {"train_loss": -25.670560836791992, "global_step": 299830, "epoch": 3612} {"train_loss": -25.718412399291992, "global_step": 299831, "epoch": 3612} {"train_loss": -25.568891525268555, "global_step": 299832, "epoch": 3612} {"train_loss": -25.757349014282227, "global_step": 299833, "epoch": 3612} {"train_loss": -26.069477081298828, "global_step": 299834, "epoch": 3612} {"train_loss": -26.139698028564453, "global_step": 299835, "epoch": 3612} {"train_loss": -25.7183780670166, "global_step": 299836, "epoch": 3612} {"train_loss": -25.947772979736328, "global_step": 299837, "epoch": 3612} {"train_loss": -25.826217651367188, "global_step": 299838, "epoch": 3612} {"train_loss": -25.23570442199707, "global_step": 299839, "epoch": 3612} {"train_loss": -25.214841842651367, "global_step": 299840, "epoch": 3612} {"train_loss": -26.001251220703125, "global_step": 299841, "epoch": 3612} {"train_loss": -25.974227905273438, "global_step": 299842, "epoch": 3612} {"train_loss": -25.650922775268555, "global_step": 299843, "epoch": 3612} {"train_loss": -24.964628219604492, "global_step": 299844, "epoch": 3612} {"train_loss": -25.29374885559082, "global_step": 299845, "epoch": 3612} {"train_loss": -25.064300537109375, "global_step": 299846, "epoch": 3612} {"train_loss": -25.15321159362793, "global_step": 299847, "epoch": 3612} {"train_loss": -25.64896011352539, "global_step": 299848, "epoch": 3612} {"train_loss": -25.38814353942871, "global_step": 299849, "epoch": 3612} {"train_loss": -25.493738174438477, "global_step": 299850, "epoch": 3612} {"train_loss": -25.73219108581543, "global_step": 299851, "epoch": 3612} {"train_loss": -25.076889038085938, "global_step": 299852, "epoch": 3612} {"train_loss": -25.77828025817871, "global_step": 299853, "epoch": 3612} {"train_loss": -25.433256149291992, "global_step": 299854, "epoch": 3612} {"train_loss": -25.74100685119629, "global_step": 299855, "epoch": 3612} {"train_loss": -25.37005615234375, "global_step": 299856, "epoch": 3612} {"train_loss": -25.55021095275879, "global_step": 299857, "epoch": 3612} {"train_loss": -25.669464111328125, "global_step": 299858, "epoch": 3612} {"train_loss": -25.544782638549805, "global_step": 299859, "epoch": 3612} {"train_loss": -25.378759384155273, "global_step": 299860, "epoch": 3612} {"train_loss": -25.42890739440918, "global_step": 299861, "epoch": 3612} {"train_loss": -25.462017059326172, "global_step": 299862, "epoch": 3612} {"train_loss": -25.27058982849121, "global_step": 299863, "epoch": 3612} {"train_loss": -25.109724044799805, "global_step": 299864, "epoch": 3612} {"train_loss": -25.11102294921875, "global_step": 299865, "epoch": 3612} {"train_loss": -25.27356719970703, "global_step": 299866, "epoch": 3612} {"train_loss": -25.44973373413086, "global_step": 299867, "epoch": 3612} {"train_loss": -25.07526206970215, "global_step": 299868, "epoch": 3612} {"train_loss": -25.697065353393555, "global_step": 299869, "epoch": 3612} {"train_loss": -25.862232208251953, "global_step": 299870, "epoch": 3612} {"train_loss": -25.655744552612305, "global_step": 299871, "epoch": 3612} {"train_loss": -25.797590255737305, "global_step": 299872, "epoch": 3612} {"train_loss": -25.34427833557129, "global_step": 299873, "epoch": 3612} {"train_loss": -25.882238388061523, "global_step": 299874, "epoch": 3612} {"train_loss": -25.680822372436523, "global_step": 299875, "epoch": 3612} {"train_loss": -25.830371856689453, "global_step": 299876, "epoch": 3612} {"train_loss": -25.544702529907227, "global_step": 299877, "epoch": 3612} {"train_loss": -25.51868684607816, "global_step": 299878, "epoch": 3612, "val_loss": 7225287.0} {"train_loss": -25.284177780151367, "global_step": 299879, "epoch": 3613} {"train_loss": -25.56117057800293, "global_step": 299880, "epoch": 3613} {"train_loss": -25.4724178314209, "global_step": 299881, "epoch": 3613} {"train_loss": -25.704315185546875, "global_step": 299882, "epoch": 3613} {"train_loss": -25.114145278930664, "global_step": 299883, "epoch": 3613} {"train_loss": -25.61581802368164, "global_step": 299884, "epoch": 3613} {"train_loss": -25.584501266479492, "global_step": 299885, "epoch": 3613} {"train_loss": -25.886005401611328, "global_step": 299886, "epoch": 3613} {"train_loss": -25.3822078704834, "global_step": 299887, "epoch": 3613} {"train_loss": -25.459096908569336, "global_step": 299888, "epoch": 3613} {"train_loss": -25.55201530456543, "global_step": 299889, "epoch": 3613} {"train_loss": -25.645360946655273, "global_step": 299890, "epoch": 3613} {"train_loss": -25.747949600219727, "global_step": 299891, "epoch": 3613} {"train_loss": -25.7707462310791, "global_step": 299892, "epoch": 3613} {"train_loss": -25.513330459594727, "global_step": 299893, "epoch": 3613} {"train_loss": -25.704938888549805, "global_step": 299894, "epoch": 3613} {"train_loss": -25.8638916015625, "global_step": 299895, "epoch": 3613} {"train_loss": -25.949731826782227, "global_step": 299896, "epoch": 3613} {"train_loss": -25.459732055664062, "global_step": 299897, "epoch": 3613} {"train_loss": -25.7346248626709, "global_step": 299898, "epoch": 3613} {"train_loss": -25.58858299255371, "global_step": 299899, "epoch": 3613} {"train_loss": -25.738889694213867, "global_step": 299900, "epoch": 3613} {"train_loss": -25.301706314086914, "global_step": 299901, "epoch": 3613} {"train_loss": -25.707273483276367, "global_step": 299902, "epoch": 3613} {"train_loss": -25.51905632019043, "global_step": 299903, "epoch": 3613} {"train_loss": -25.206161499023438, "global_step": 299904, "epoch": 3613} {"train_loss": -25.08367919921875, "global_step": 299905, "epoch": 3613} {"train_loss": -24.969268798828125, "global_step": 299906, "epoch": 3613} {"train_loss": -25.48941421508789, "global_step": 299907, "epoch": 3613} {"train_loss": -25.680871963500977, "global_step": 299908, "epoch": 3613} {"train_loss": -25.16221809387207, "global_step": 299909, "epoch": 3613} {"train_loss": -24.95864486694336, "global_step": 299910, "epoch": 3613} {"train_loss": -24.652090072631836, "global_step": 299911, "epoch": 3613} {"train_loss": -25.506778717041016, "global_step": 299912, "epoch": 3613} {"train_loss": -24.7103214263916, "global_step": 299913, "epoch": 3613} {"train_loss": -25.271024703979492, "global_step": 299914, "epoch": 3613} {"train_loss": -24.892988204956055, "global_step": 299915, "epoch": 3613} {"train_loss": -25.425832748413086, "global_step": 299916, "epoch": 3613} {"train_loss": -25.142547607421875, "global_step": 299917, "epoch": 3613} {"train_loss": -25.30986976623535, "global_step": 299918, "epoch": 3613} {"train_loss": -25.54360580444336, "global_step": 299919, "epoch": 3613} {"train_loss": -25.600324630737305, "global_step": 299920, "epoch": 3613} {"train_loss": -25.513254165649414, "global_step": 299921, "epoch": 3613} {"train_loss": -25.286792755126953, "global_step": 299922, "epoch": 3613} {"train_loss": -25.451078414916992, "global_step": 299923, "epoch": 3613} {"train_loss": -25.5978946685791, "global_step": 299924, "epoch": 3613} {"train_loss": -25.724332809448242, "global_step": 299925, "epoch": 3613} {"train_loss": -25.523330688476562, "global_step": 299926, "epoch": 3613} {"train_loss": -25.73748779296875, "global_step": 299927, "epoch": 3613} {"train_loss": -25.60000991821289, "global_step": 299928, "epoch": 3613} {"train_loss": -25.770658493041992, "global_step": 299929, "epoch": 3613} {"train_loss": -25.29176902770996, "global_step": 299930, "epoch": 3613} {"train_loss": -25.7119083404541, "global_step": 299931, "epoch": 3613} {"train_loss": -25.758316040039062, "global_step": 299932, "epoch": 3613} {"train_loss": -25.749998092651367, "global_step": 299933, "epoch": 3613} {"train_loss": -25.847070693969727, "global_step": 299934, "epoch": 3613} {"train_loss": -25.944168090820312, "global_step": 299935, "epoch": 3613} {"train_loss": -25.54959487915039, "global_step": 299936, "epoch": 3613} {"train_loss": -25.885669708251953, "global_step": 299937, "epoch": 3613} {"train_loss": -25.857776641845703, "global_step": 299938, "epoch": 3613} {"train_loss": -25.799985885620117, "global_step": 299939, "epoch": 3613} {"train_loss": -25.825586318969727, "global_step": 299940, "epoch": 3613} {"train_loss": -26.09478187561035, "global_step": 299941, "epoch": 3613} {"train_loss": -25.761945724487305, "global_step": 299942, "epoch": 3613} {"train_loss": -26.02650260925293, "global_step": 299943, "epoch": 3613} {"train_loss": -25.875707626342773, "global_step": 299944, "epoch": 3613} {"train_loss": -25.69232177734375, "global_step": 299945, "epoch": 3613} {"train_loss": -25.563156127929688, "global_step": 299946, "epoch": 3613} {"train_loss": -25.808185577392578, "global_step": 299947, "epoch": 3613} {"train_loss": -25.569744110107422, "global_step": 299948, "epoch": 3613} {"train_loss": -25.868112564086914, "global_step": 299949, "epoch": 3613} {"train_loss": -25.849994659423828, "global_step": 299950, "epoch": 3613} {"train_loss": -25.760746002197266, "global_step": 299951, "epoch": 3613} {"train_loss": -25.768360137939453, "global_step": 299952, "epoch": 3613} {"train_loss": -25.829944610595703, "global_step": 299953, "epoch": 3613} {"train_loss": -25.572181701660156, "global_step": 299954, "epoch": 3613} {"train_loss": -25.86326026916504, "global_step": 299955, "epoch": 3613} {"train_loss": -25.58370590209961, "global_step": 299956, "epoch": 3613} {"train_loss": -25.653736114501953, "global_step": 299957, "epoch": 3613} {"train_loss": -25.76302146911621, "global_step": 299958, "epoch": 3613} {"train_loss": -25.87396240234375, "global_step": 299959, "epoch": 3613} {"train_loss": -25.641586303710938, "global_step": 299960, "epoch": 3613} {"train_loss": -25.577495023428675, "global_step": 299961, "epoch": 3613, "val_loss": 7159987.0} {"train_loss": -25.699750900268555, "global_step": 299962, "epoch": 3614} {"train_loss": -24.70984649658203, "global_step": 299963, "epoch": 3614} {"train_loss": -25.446823120117188, "global_step": 299964, "epoch": 3614} {"train_loss": -24.867225646972656, "global_step": 299965, "epoch": 3614} {"train_loss": -25.470510482788086, "global_step": 299966, "epoch": 3614} {"train_loss": -25.552566528320312, "global_step": 299967, "epoch": 3614} {"train_loss": -25.11785316467285, "global_step": 299968, "epoch": 3614} {"train_loss": -25.280122756958008, "global_step": 299969, "epoch": 3614} {"train_loss": -25.127094268798828, "global_step": 299970, "epoch": 3614} {"train_loss": -25.47802734375, "global_step": 299971, "epoch": 3614} {"train_loss": -24.94428062438965, "global_step": 299972, "epoch": 3614} {"train_loss": -25.40742301940918, "global_step": 299973, "epoch": 3614} {"train_loss": -25.553638458251953, "global_step": 299974, "epoch": 3614} {"train_loss": -25.036518096923828, "global_step": 299975, "epoch": 3614} {"train_loss": -25.15520668029785, "global_step": 299976, "epoch": 3614} {"train_loss": -25.232526779174805, "global_step": 299977, "epoch": 3614} {"train_loss": -25.63047218322754, "global_step": 299978, "epoch": 3614} {"train_loss": -25.31218719482422, "global_step": 299979, "epoch": 3614} {"train_loss": -25.203012466430664, "global_step": 299980, "epoch": 3614} {"train_loss": -25.190494537353516, "global_step": 299981, "epoch": 3614} {"train_loss": -25.420530319213867, "global_step": 299982, "epoch": 3614} {"train_loss": -24.731494903564453, "global_step": 299983, "epoch": 3614} {"train_loss": -25.5267276763916, "global_step": 299984, "epoch": 3614} {"train_loss": -25.070999145507812, "global_step": 299985, "epoch": 3614} {"train_loss": -25.609195709228516, "global_step": 299986, "epoch": 3614} {"train_loss": -25.260879516601562, "global_step": 299987, "epoch": 3614} {"train_loss": -25.347625732421875, "global_step": 299988, "epoch": 3614} {"train_loss": -25.37808609008789, "global_step": 299989, "epoch": 3614} {"train_loss": -25.170957565307617, "global_step": 299990, "epoch": 3614} {"train_loss": -25.512990951538086, "global_step": 299991, "epoch": 3614} {"train_loss": -25.47299575805664, "global_step": 299992, "epoch": 3614} {"train_loss": -25.625843048095703, "global_step": 299993, "epoch": 3614} {"train_loss": -25.639142990112305, "global_step": 299994, "epoch": 3614} {"train_loss": -25.654043197631836, "global_step": 299995, "epoch": 3614} {"train_loss": -25.24449348449707, "global_step": 299996, "epoch": 3614} {"train_loss": -25.5803279876709, "global_step": 299997, "epoch": 3614} {"train_loss": -25.56448745727539, "global_step": 299998, "epoch": 3614} {"train_loss": -25.68079948425293, "global_step": 299999, "epoch": 3614} {"train_loss": -25.7011661529541, "global_step": 300000, "epoch": 3614} {"train_loss": -25.83378028869629, "global_step": 300001, "epoch": 3614} {"train_loss": -25.556509017944336, "global_step": 300002, "epoch": 3614} {"train_loss": -25.816999435424805, "global_step": 300003, "epoch": 3614} {"train_loss": -25.690052032470703, "global_step": 300004, "epoch": 3614} {"train_loss": -25.709014892578125, "global_step": 300005, "epoch": 3614} {"train_loss": -25.789335250854492, "global_step": 300006, "epoch": 3614} {"train_loss": -25.850921630859375, "global_step": 300007, "epoch": 3614} {"train_loss": -25.992145538330078, "global_step": 300008, "epoch": 3614} {"train_loss": -26.0413875579834, "global_step": 300009, "epoch": 3614} {"train_loss": -25.93499183654785, "global_step": 300010, "epoch": 3614} {"train_loss": -25.854780197143555, "global_step": 300011, "epoch": 3614} {"train_loss": -25.682981491088867, "global_step": 300012, "epoch": 3614} {"train_loss": -25.96451187133789, "global_step": 300013, "epoch": 3614} {"train_loss": -25.8753662109375, "global_step": 300014, "epoch": 3614} {"train_loss": -25.47372817993164, "global_step": 300015, "epoch": 3614} {"train_loss": -25.955493927001953, "global_step": 300016, "epoch": 3614} {"train_loss": -25.41853904724121, "global_step": 300017, "epoch": 3614} {"train_loss": -26.012174606323242, "global_step": 300018, "epoch": 3614} {"train_loss": -25.863271713256836, "global_step": 300019, "epoch": 3614} {"train_loss": -25.655332565307617, "global_step": 300020, "epoch": 3614} {"train_loss": -25.606740951538086, "global_step": 300021, "epoch": 3614} {"train_loss": -25.318710327148438, "global_step": 300022, "epoch": 3614} {"train_loss": -25.745508193969727, "global_step": 300023, "epoch": 3614} {"train_loss": -25.896240234375, "global_step": 300024, "epoch": 3614} {"train_loss": -25.446916580200195, "global_step": 300025, "epoch": 3614} {"train_loss": -25.56638526916504, "global_step": 300026, "epoch": 3614} {"train_loss": -25.944814682006836, "global_step": 300027, "epoch": 3614} {"train_loss": -25.70479393005371, "global_step": 300028, "epoch": 3614} {"train_loss": -25.747756958007812, "global_step": 300029, "epoch": 3614} {"train_loss": -26.050922393798828, "global_step": 300030, "epoch": 3614} {"train_loss": -25.225797653198242, "global_step": 300031, "epoch": 3614} {"train_loss": -25.7952880859375, "global_step": 300032, "epoch": 3614} {"train_loss": -25.350048065185547, "global_step": 300033, "epoch": 3614} {"train_loss": -25.268346786499023, "global_step": 300034, "epoch": 3614} {"train_loss": -24.872602462768555, "global_step": 300035, "epoch": 3614} {"train_loss": -25.700559616088867, "global_step": 300036, "epoch": 3614} {"train_loss": -25.57499885559082, "global_step": 300037, "epoch": 3614} {"train_loss": -25.106197357177734, "global_step": 300038, "epoch": 3614} {"train_loss": -25.804563522338867, "global_step": 300039, "epoch": 3614} {"train_loss": -25.640783309936523, "global_step": 300040, "epoch": 3614} {"train_loss": -25.7510986328125, "global_step": 300041, "epoch": 3614} {"train_loss": -26.1441650390625, "global_step": 300042, "epoch": 3614} {"train_loss": -25.348880767822266, "global_step": 300043, "epoch": 3614} {"train_loss": -25.5360840946795, "global_step": 300044, "epoch": 3614, "val_loss": 7143246.5} {"train_loss": -24.438749313354492, "global_step": 300045, "epoch": 3615} {"train_loss": -24.692983627319336, "global_step": 300046, "epoch": 3615} {"train_loss": -24.685932159423828, "global_step": 300047, "epoch": 3615} {"train_loss": -24.829347610473633, "global_step": 300048, "epoch": 3615} {"train_loss": -24.80405044555664, "global_step": 300049, "epoch": 3615} {"train_loss": -24.46919059753418, "global_step": 300050, "epoch": 3615} {"train_loss": -24.823572158813477, "global_step": 300051, "epoch": 3615} {"train_loss": -25.302474975585938, "global_step": 300052, "epoch": 3615} {"train_loss": -24.940061569213867, "global_step": 300053, "epoch": 3615} {"train_loss": -25.168701171875, "global_step": 300054, "epoch": 3615} {"train_loss": -25.243106842041016, "global_step": 300055, "epoch": 3615} {"train_loss": -25.298242568969727, "global_step": 300056, "epoch": 3615} {"train_loss": -25.484806060791016, "global_step": 300057, "epoch": 3615} {"train_loss": -25.308652877807617, "global_step": 300058, "epoch": 3615} {"train_loss": -25.47683334350586, "global_step": 300059, "epoch": 3615} {"train_loss": -25.247787475585938, "global_step": 300060, "epoch": 3615} {"train_loss": -25.384544372558594, "global_step": 300061, "epoch": 3615} {"train_loss": -25.439697265625, "global_step": 300062, "epoch": 3615} {"train_loss": -25.34650993347168, "global_step": 300063, "epoch": 3615} {"train_loss": -25.135055541992188, "global_step": 300064, "epoch": 3615} {"train_loss": -25.041542053222656, "global_step": 300065, "epoch": 3615} {"train_loss": -25.843358993530273, "global_step": 300066, "epoch": 3615} {"train_loss": -25.368946075439453, "global_step": 300067, "epoch": 3615} {"train_loss": -25.196054458618164, "global_step": 300068, "epoch": 3615} {"train_loss": -25.33282470703125, "global_step": 300069, "epoch": 3615} {"train_loss": -25.894763946533203, "global_step": 300070, "epoch": 3615} {"train_loss": -25.344999313354492, "global_step": 300071, "epoch": 3615} {"train_loss": -25.600278854370117, "global_step": 300072, "epoch": 3615} {"train_loss": -25.804443359375, "global_step": 300073, "epoch": 3615} {"train_loss": -25.82038688659668, "global_step": 300074, "epoch": 3615} {"train_loss": -25.539945602416992, "global_step": 300075, "epoch": 3615} {"train_loss": -25.73927116394043, "global_step": 300076, "epoch": 3615} {"train_loss": -26.030004501342773, "global_step": 300077, "epoch": 3615} {"train_loss": -25.7414493560791, "global_step": 300078, "epoch": 3615} {"train_loss": -25.61988639831543, "global_step": 300079, "epoch": 3615} {"train_loss": -25.576297760009766, "global_step": 300080, "epoch": 3615} {"train_loss": -25.523136138916016, "global_step": 300081, "epoch": 3615} {"train_loss": -26.01124382019043, "global_step": 300082, "epoch": 3615} {"train_loss": -25.492263793945312, "global_step": 300083, "epoch": 3615} {"train_loss": -25.482898712158203, "global_step": 300084, "epoch": 3615} {"train_loss": -25.845800399780273, "global_step": 300085, "epoch": 3615} {"train_loss": -25.995569229125977, "global_step": 300086, "epoch": 3615} {"train_loss": -26.054357528686523, "global_step": 300087, "epoch": 3615} {"train_loss": -25.669897079467773, "global_step": 300088, "epoch": 3615} {"train_loss": -25.693769454956055, "global_step": 300089, "epoch": 3615} {"train_loss": -25.695636749267578, "global_step": 300090, "epoch": 3615} {"train_loss": -26.12421989440918, "global_step": 300091, "epoch": 3615} {"train_loss": -25.781909942626953, "global_step": 300092, "epoch": 3615} {"train_loss": -25.785730361938477, "global_step": 300093, "epoch": 3615} {"train_loss": -25.896759033203125, "global_step": 300094, "epoch": 3615} {"train_loss": -26.099042892456055, "global_step": 300095, "epoch": 3615} {"train_loss": -25.613737106323242, "global_step": 300096, "epoch": 3615} {"train_loss": -26.057443618774414, "global_step": 300097, "epoch": 3615} {"train_loss": -25.887338638305664, "global_step": 300098, "epoch": 3615} {"train_loss": -25.6295166015625, "global_step": 300099, "epoch": 3615} {"train_loss": -25.564044952392578, "global_step": 300100, "epoch": 3615} {"train_loss": -25.513599395751953, "global_step": 300101, "epoch": 3615} {"train_loss": -25.516300201416016, "global_step": 300102, "epoch": 3615} {"train_loss": -25.142484664916992, "global_step": 300103, "epoch": 3615} {"train_loss": -25.140445709228516, "global_step": 300104, "epoch": 3615} {"train_loss": -25.7265625, "global_step": 300105, "epoch": 3615} {"train_loss": -25.25025177001953, "global_step": 300106, "epoch": 3615} {"train_loss": -25.552518844604492, "global_step": 300107, "epoch": 3615} {"train_loss": -25.772382736206055, "global_step": 300108, "epoch": 3615} {"train_loss": -26.132307052612305, "global_step": 300109, "epoch": 3615} {"train_loss": -25.69874382019043, "global_step": 300110, "epoch": 3615} {"train_loss": -25.623151779174805, "global_step": 300111, "epoch": 3615} {"train_loss": -25.642370223999023, "global_step": 300112, "epoch": 3615} {"train_loss": -25.746774673461914, "global_step": 300113, "epoch": 3615} {"train_loss": -25.841161727905273, "global_step": 300114, "epoch": 3615} {"train_loss": -25.487531661987305, "global_step": 300115, "epoch": 3615} {"train_loss": -25.352548599243164, "global_step": 300116, "epoch": 3615} {"train_loss": -25.668827056884766, "global_step": 300117, "epoch": 3615} {"train_loss": -25.59396743774414, "global_step": 300118, "epoch": 3615} {"train_loss": -25.7799129486084, "global_step": 300119, "epoch": 3615} {"train_loss": -25.542333602905273, "global_step": 300120, "epoch": 3615} {"train_loss": -25.72604751586914, "global_step": 300121, "epoch": 3615} {"train_loss": -25.970062255859375, "global_step": 300122, "epoch": 3615} {"train_loss": -25.7208194732666, "global_step": 300123, "epoch": 3615} {"train_loss": -25.715810775756836, "global_step": 300124, "epoch": 3615} {"train_loss": -25.863723754882812, "global_step": 300125, "epoch": 3615} {"train_loss": -26.184782028198242, "global_step": 300126, "epoch": 3615} {"train_loss": -25.537766468094055, "global_step": 300127, "epoch": 3615, "val_loss": 7202739.0} {"train_loss": -25.2086124420166, "global_step": 300128, "epoch": 3616} {"train_loss": -25.190597534179688, "global_step": 300129, "epoch": 3616} {"train_loss": -25.499683380126953, "global_step": 300130, "epoch": 3616} {"train_loss": -25.23146629333496, "global_step": 300131, "epoch": 3616} {"train_loss": -25.039316177368164, "global_step": 300132, "epoch": 3616} {"train_loss": -25.67034339904785, "global_step": 300133, "epoch": 3616} {"train_loss": -25.196378707885742, "global_step": 300134, "epoch": 3616} {"train_loss": -25.42795181274414, "global_step": 300135, "epoch": 3616} {"train_loss": -25.110692977905273, "global_step": 300136, "epoch": 3616} {"train_loss": -25.495338439941406, "global_step": 300137, "epoch": 3616} {"train_loss": -25.439565658569336, "global_step": 300138, "epoch": 3616} {"train_loss": -25.53364372253418, "global_step": 300139, "epoch": 3616} {"train_loss": -25.4489688873291, "global_step": 300140, "epoch": 3616} {"train_loss": -25.48526954650879, "global_step": 300141, "epoch": 3616} {"train_loss": -25.48936653137207, "global_step": 300142, "epoch": 3616} {"train_loss": -25.581340789794922, "global_step": 300143, "epoch": 3616} {"train_loss": -25.53289794921875, "global_step": 300144, "epoch": 3616} {"train_loss": -25.788074493408203, "global_step": 300145, "epoch": 3616} {"train_loss": -25.666990280151367, "global_step": 300146, "epoch": 3616} {"train_loss": -25.53095817565918, "global_step": 300147, "epoch": 3616} {"train_loss": -25.98550796508789, "global_step": 300148, "epoch": 3616} {"train_loss": -25.572324752807617, "global_step": 300149, "epoch": 3616} {"train_loss": -25.515605926513672, "global_step": 300150, "epoch": 3616} {"train_loss": -25.62200927734375, "global_step": 300151, "epoch": 3616} {"train_loss": -25.65394401550293, "global_step": 300152, "epoch": 3616} {"train_loss": -25.727415084838867, "global_step": 300153, "epoch": 3616} {"train_loss": -25.9720401763916, "global_step": 300154, "epoch": 3616} {"train_loss": -25.86457633972168, "global_step": 300155, "epoch": 3616} {"train_loss": -25.754117965698242, "global_step": 300156, "epoch": 3616} {"train_loss": -25.892505645751953, "global_step": 300157, "epoch": 3616} {"train_loss": -25.481191635131836, "global_step": 300158, "epoch": 3616} {"train_loss": -26.09808349609375, "global_step": 300159, "epoch": 3616} {"train_loss": -25.527734756469727, "global_step": 300160, "epoch": 3616} {"train_loss": -25.9245548248291, "global_step": 300161, "epoch": 3616} {"train_loss": -25.56781768798828, "global_step": 300162, "epoch": 3616} {"train_loss": -25.71394157409668, "global_step": 300163, "epoch": 3616} {"train_loss": -25.677581787109375, "global_step": 300164, "epoch": 3616} {"train_loss": -25.969091415405273, "global_step": 300165, "epoch": 3616} {"train_loss": -25.872150421142578, "global_step": 300166, "epoch": 3616} {"train_loss": -25.763235092163086, "global_step": 300167, "epoch": 3616} {"train_loss": -25.731983184814453, "global_step": 300168, "epoch": 3616} {"train_loss": -25.60663414001465, "global_step": 300169, "epoch": 3616} {"train_loss": -25.842273712158203, "global_step": 300170, "epoch": 3616} {"train_loss": -25.7305965423584, "global_step": 300171, "epoch": 3616} {"train_loss": -25.54414939880371, "global_step": 300172, "epoch": 3616} {"train_loss": -25.95747184753418, "global_step": 300173, "epoch": 3616} {"train_loss": -25.835790634155273, "global_step": 300174, "epoch": 3616} {"train_loss": -26.235595703125, "global_step": 300175, "epoch": 3616} {"train_loss": -25.906042098999023, "global_step": 300176, "epoch": 3616} {"train_loss": -25.507793426513672, "global_step": 300177, "epoch": 3616} {"train_loss": -25.849334716796875, "global_step": 300178, "epoch": 3616} {"train_loss": -25.982593536376953, "global_step": 300179, "epoch": 3616} {"train_loss": -25.714557647705078, "global_step": 300180, "epoch": 3616} {"train_loss": -25.89443016052246, "global_step": 300181, "epoch": 3616} {"train_loss": -25.50372886657715, "global_step": 300182, "epoch": 3616} {"train_loss": -25.536991119384766, "global_step": 300183, "epoch": 3616} {"train_loss": -25.51312255859375, "global_step": 300184, "epoch": 3616} {"train_loss": -25.693571090698242, "global_step": 300185, "epoch": 3616} {"train_loss": -25.865875244140625, "global_step": 300186, "epoch": 3616} {"train_loss": -25.537866592407227, "global_step": 300187, "epoch": 3616} {"train_loss": -25.960397720336914, "global_step": 300188, "epoch": 3616} {"train_loss": -25.494714736938477, "global_step": 300189, "epoch": 3616} {"train_loss": -25.365478515625, "global_step": 300190, "epoch": 3616} {"train_loss": -25.909711837768555, "global_step": 300191, "epoch": 3616} {"train_loss": -25.60882568359375, "global_step": 300192, "epoch": 3616} {"train_loss": -25.3220157623291, "global_step": 300193, "epoch": 3616} {"train_loss": -25.705322265625, "global_step": 300194, "epoch": 3616} {"train_loss": -25.263038635253906, "global_step": 300195, "epoch": 3616} {"train_loss": -25.754789352416992, "global_step": 300196, "epoch": 3616} {"train_loss": -25.889612197875977, "global_step": 300197, "epoch": 3616} {"train_loss": -25.972753524780273, "global_step": 300198, "epoch": 3616} {"train_loss": -25.478771209716797, "global_step": 300199, "epoch": 3616} {"train_loss": -25.542617797851562, "global_step": 300200, "epoch": 3616} {"train_loss": -25.339353561401367, "global_step": 300201, "epoch": 3616} {"train_loss": -25.75603675842285, "global_step": 300202, "epoch": 3616} {"train_loss": -26.237028121948242, "global_step": 300203, "epoch": 3616} {"train_loss": -25.7070255279541, "global_step": 300204, "epoch": 3616} {"train_loss": -25.555707931518555, "global_step": 300205, "epoch": 3616} {"train_loss": -25.546297073364258, "global_step": 300206, "epoch": 3616} {"train_loss": -25.278667449951172, "global_step": 300207, "epoch": 3616} {"train_loss": -26.009017944335938, "global_step": 300208, "epoch": 3616} {"train_loss": -25.573949813842773, "global_step": 300209, "epoch": 3616} {"train_loss": -25.638466547770673, "global_step": 300210, "epoch": 3616, "val_loss": 7063491.0} {"train_loss": -25.291107177734375, "global_step": 300211, "epoch": 3617} {"train_loss": -24.36628532409668, "global_step": 300212, "epoch": 3617} {"train_loss": -23.766311645507812, "global_step": 300213, "epoch": 3617} {"train_loss": -24.46412467956543, "global_step": 300214, "epoch": 3617} {"train_loss": -25.468008041381836, "global_step": 300215, "epoch": 3617} {"train_loss": -24.074138641357422, "global_step": 300216, "epoch": 3617} {"train_loss": -24.72048568725586, "global_step": 300217, "epoch": 3617} {"train_loss": -25.451038360595703, "global_step": 300218, "epoch": 3617} {"train_loss": -24.647470474243164, "global_step": 300219, "epoch": 3617} {"train_loss": -25.198959350585938, "global_step": 300220, "epoch": 3617} {"train_loss": -25.061819076538086, "global_step": 300221, "epoch": 3617} {"train_loss": -25.08924674987793, "global_step": 300222, "epoch": 3617} {"train_loss": -25.204370498657227, "global_step": 300223, "epoch": 3617} {"train_loss": -25.07778549194336, "global_step": 300224, "epoch": 3617} {"train_loss": -25.715240478515625, "global_step": 300225, "epoch": 3617} {"train_loss": -25.12293815612793, "global_step": 300226, "epoch": 3617} {"train_loss": -25.05781364440918, "global_step": 300227, "epoch": 3617} {"train_loss": -25.422842025756836, "global_step": 300228, "epoch": 3617} {"train_loss": -25.35053062438965, "global_step": 300229, "epoch": 3617} {"train_loss": -25.1435604095459, "global_step": 300230, "epoch": 3617} {"train_loss": -25.259191513061523, "global_step": 300231, "epoch": 3617} {"train_loss": -25.464902877807617, "global_step": 300232, "epoch": 3617} {"train_loss": -25.467592239379883, "global_step": 300233, "epoch": 3617} {"train_loss": -25.4094295501709, "global_step": 300234, "epoch": 3617} {"train_loss": -25.422948837280273, "global_step": 300235, "epoch": 3617} {"train_loss": -25.537952423095703, "global_step": 300236, "epoch": 3617} {"train_loss": -25.687978744506836, "global_step": 300237, "epoch": 3617} {"train_loss": -25.86806297302246, "global_step": 300238, "epoch": 3617} {"train_loss": -25.19024658203125, "global_step": 300239, "epoch": 3617} {"train_loss": -25.263595581054688, "global_step": 300240, "epoch": 3617} {"train_loss": -25.74688720703125, "global_step": 300241, "epoch": 3617} {"train_loss": -25.685504913330078, "global_step": 300242, "epoch": 3617} {"train_loss": -25.21870994567871, "global_step": 300243, "epoch": 3617} {"train_loss": -25.532848358154297, "global_step": 300244, "epoch": 3617} {"train_loss": -25.417837142944336, "global_step": 300245, "epoch": 3617} {"train_loss": -25.65150260925293, "global_step": 300246, "epoch": 3617} {"train_loss": -25.73211669921875, "global_step": 300247, "epoch": 3617} {"train_loss": -25.132959365844727, "global_step": 300248, "epoch": 3617} {"train_loss": -25.645116806030273, "global_step": 300249, "epoch": 3617} {"train_loss": -25.816741943359375, "global_step": 300250, "epoch": 3617} {"train_loss": -25.61228370666504, "global_step": 300251, "epoch": 3617} {"train_loss": -25.29792594909668, "global_step": 300252, "epoch": 3617} {"train_loss": -25.43738555908203, "global_step": 300253, "epoch": 3617} {"train_loss": -25.735605239868164, "global_step": 300254, "epoch": 3617} {"train_loss": -25.61138343811035, "global_step": 300255, "epoch": 3617} {"train_loss": -25.445348739624023, "global_step": 300256, "epoch": 3617} {"train_loss": -25.61126136779785, "global_step": 300257, "epoch": 3617} {"train_loss": -25.51120948791504, "global_step": 300258, "epoch": 3617} {"train_loss": -25.51266860961914, "global_step": 300259, "epoch": 3617} {"train_loss": -25.456262588500977, "global_step": 300260, "epoch": 3617} {"train_loss": -25.597946166992188, "global_step": 300261, "epoch": 3617} {"train_loss": -25.55500602722168, "global_step": 300262, "epoch": 3617} {"train_loss": -25.732885360717773, "global_step": 300263, "epoch": 3617} {"train_loss": -25.420166015625, "global_step": 300264, "epoch": 3617} {"train_loss": -25.687414169311523, "global_step": 300265, "epoch": 3617} {"train_loss": -26.16963005065918, "global_step": 300266, "epoch": 3617} {"train_loss": -25.512187957763672, "global_step": 300267, "epoch": 3617} {"train_loss": -25.62006187438965, "global_step": 300268, "epoch": 3617} {"train_loss": -25.754520416259766, "global_step": 300269, "epoch": 3617} {"train_loss": -25.688764572143555, "global_step": 300270, "epoch": 3617} {"train_loss": -25.546104431152344, "global_step": 300271, "epoch": 3617} {"train_loss": -25.872472763061523, "global_step": 300272, "epoch": 3617} {"train_loss": -25.512454986572266, "global_step": 300273, "epoch": 3617} {"train_loss": -25.38313865661621, "global_step": 300274, "epoch": 3617} {"train_loss": -25.243650436401367, "global_step": 300275, "epoch": 3617} {"train_loss": -25.094520568847656, "global_step": 300276, "epoch": 3617} {"train_loss": -24.821687698364258, "global_step": 300277, "epoch": 3617} {"train_loss": -25.53799819946289, "global_step": 300278, "epoch": 3617} {"train_loss": -25.7613582611084, "global_step": 300279, "epoch": 3617} {"train_loss": -24.932159423828125, "global_step": 300280, "epoch": 3617} {"train_loss": -25.214096069335938, "global_step": 300281, "epoch": 3617} {"train_loss": -25.914569854736328, "global_step": 300282, "epoch": 3617} {"train_loss": -25.86783218383789, "global_step": 300283, "epoch": 3617} {"train_loss": -25.796003341674805, "global_step": 300284, "epoch": 3617} {"train_loss": -25.414892196655273, "global_step": 300285, "epoch": 3617} {"train_loss": -25.38770866394043, "global_step": 300286, "epoch": 3617} {"train_loss": -26.032562255859375, "global_step": 300287, "epoch": 3617} {"train_loss": -25.794361114501953, "global_step": 300288, "epoch": 3617} {"train_loss": -26.05487632751465, "global_step": 300289, "epoch": 3617} {"train_loss": -25.6987361907959, "global_step": 300290, "epoch": 3617} {"train_loss": -25.87082862854004, "global_step": 300291, "epoch": 3617} {"train_loss": -25.910261154174805, "global_step": 300292, "epoch": 3617} {"train_loss": -25.414333274565546, "global_step": 300293, "epoch": 3617, "val_loss": 7136691.0} {"train_loss": -24.897924423217773, "global_step": 300294, "epoch": 3618} {"train_loss": -25.080127716064453, "global_step": 300295, "epoch": 3618} {"train_loss": -25.052621841430664, "global_step": 300296, "epoch": 3618} {"train_loss": -25.543981552124023, "global_step": 300297, "epoch": 3618} {"train_loss": -24.82818603515625, "global_step": 300298, "epoch": 3618} {"train_loss": -24.744321823120117, "global_step": 300299, "epoch": 3618} {"train_loss": -24.943058013916016, "global_step": 300300, "epoch": 3618} {"train_loss": -25.2959041595459, "global_step": 300301, "epoch": 3618} {"train_loss": -24.831077575683594, "global_step": 300302, "epoch": 3618} {"train_loss": -25.118755340576172, "global_step": 300303, "epoch": 3618} {"train_loss": -25.492895126342773, "global_step": 300304, "epoch": 3618} {"train_loss": -25.33050537109375, "global_step": 300305, "epoch": 3618} {"train_loss": -25.126684188842773, "global_step": 300306, "epoch": 3618} {"train_loss": -25.452787399291992, "global_step": 300307, "epoch": 3618} {"train_loss": -25.674230575561523, "global_step": 300308, "epoch": 3618} {"train_loss": -25.33631706237793, "global_step": 300309, "epoch": 3618} {"train_loss": -25.384546279907227, "global_step": 300310, "epoch": 3618} {"train_loss": -25.455530166625977, "global_step": 300311, "epoch": 3618} {"train_loss": -25.37569236755371, "global_step": 300312, "epoch": 3618} {"train_loss": -25.41788673400879, "global_step": 300313, "epoch": 3618} {"train_loss": -25.255828857421875, "global_step": 300314, "epoch": 3618} {"train_loss": -25.580215454101562, "global_step": 300315, "epoch": 3618} {"train_loss": -25.438156127929688, "global_step": 300316, "epoch": 3618} {"train_loss": -25.336444854736328, "global_step": 300317, "epoch": 3618} {"train_loss": -26.245920181274414, "global_step": 300318, "epoch": 3618} {"train_loss": -25.46596336364746, "global_step": 300319, "epoch": 3618} {"train_loss": -25.50691032409668, "global_step": 300320, "epoch": 3618} {"train_loss": -25.98023796081543, "global_step": 300321, "epoch": 3618} {"train_loss": -25.994375228881836, "global_step": 300322, "epoch": 3618} {"train_loss": -25.458911895751953, "global_step": 300323, "epoch": 3618} {"train_loss": -25.60701560974121, "global_step": 300324, "epoch": 3618} {"train_loss": -26.065214157104492, "global_step": 300325, "epoch": 3618} {"train_loss": -26.0313720703125, "global_step": 300326, "epoch": 3618} {"train_loss": -25.414398193359375, "global_step": 300327, "epoch": 3618} {"train_loss": -25.927602767944336, "global_step": 300328, "epoch": 3618} {"train_loss": -25.587921142578125, "global_step": 300329, "epoch": 3618} {"train_loss": -26.161712646484375, "global_step": 300330, "epoch": 3618} {"train_loss": -25.22355079650879, "global_step": 300331, "epoch": 3618} {"train_loss": -25.711414337158203, "global_step": 300332, "epoch": 3618} {"train_loss": -25.934431076049805, "global_step": 300333, "epoch": 3618} {"train_loss": -25.17762565612793, "global_step": 300334, "epoch": 3618} {"train_loss": -25.542142868041992, "global_step": 300335, "epoch": 3618} {"train_loss": -25.603195190429688, "global_step": 300336, "epoch": 3618} {"train_loss": -25.785512924194336, "global_step": 300337, "epoch": 3618} {"train_loss": -25.367528915405273, "global_step": 300338, "epoch": 3618} {"train_loss": -25.904285430908203, "global_step": 300339, "epoch": 3618} {"train_loss": -25.820281982421875, "global_step": 300340, "epoch": 3618} {"train_loss": -25.7139835357666, "global_step": 300341, "epoch": 3618} {"train_loss": -25.63492202758789, "global_step": 300342, "epoch": 3618} {"train_loss": -25.912885665893555, "global_step": 300343, "epoch": 3618} {"train_loss": -25.560340881347656, "global_step": 300344, "epoch": 3618} {"train_loss": -25.631610870361328, "global_step": 300345, "epoch": 3618} {"train_loss": -25.4692440032959, "global_step": 300346, "epoch": 3618} {"train_loss": -25.7418212890625, "global_step": 300347, "epoch": 3618} {"train_loss": -25.81935691833496, "global_step": 300348, "epoch": 3618} {"train_loss": -25.777524948120117, "global_step": 300349, "epoch": 3618} {"train_loss": -25.232473373413086, "global_step": 300350, "epoch": 3618} {"train_loss": -25.54156494140625, "global_step": 300351, "epoch": 3618} {"train_loss": -25.837615966796875, "global_step": 300352, "epoch": 3618} {"train_loss": -25.405685424804688, "global_step": 300353, "epoch": 3618} {"train_loss": -25.715717315673828, "global_step": 300354, "epoch": 3618} {"train_loss": -25.475509643554688, "global_step": 300355, "epoch": 3618} {"train_loss": -25.572067260742188, "global_step": 300356, "epoch": 3618} {"train_loss": -25.585596084594727, "global_step": 300357, "epoch": 3618} {"train_loss": -25.230016708374023, "global_step": 300358, "epoch": 3618} {"train_loss": -25.107685089111328, "global_step": 300359, "epoch": 3618} {"train_loss": -25.236495971679688, "global_step": 300360, "epoch": 3618} {"train_loss": -25.221023559570312, "global_step": 300361, "epoch": 3618} {"train_loss": -25.678781509399414, "global_step": 300362, "epoch": 3618} {"train_loss": -25.65614128112793, "global_step": 300363, "epoch": 3618} {"train_loss": -25.195425033569336, "global_step": 300364, "epoch": 3618} {"train_loss": -25.527318954467773, "global_step": 300365, "epoch": 3618} {"train_loss": -25.403905868530273, "global_step": 300366, "epoch": 3618} {"train_loss": -25.647876739501953, "global_step": 300367, "epoch": 3618} {"train_loss": -25.264179229736328, "global_step": 300368, "epoch": 3618} {"train_loss": -25.445850372314453, "global_step": 300369, "epoch": 3618} {"train_loss": -25.771270751953125, "global_step": 300370, "epoch": 3618} {"train_loss": -25.511493682861328, "global_step": 300371, "epoch": 3618} {"train_loss": -25.2642765045166, "global_step": 300372, "epoch": 3618} {"train_loss": -25.837936401367188, "global_step": 300373, "epoch": 3618} {"train_loss": -25.422636032104492, "global_step": 300374, "epoch": 3618} {"train_loss": -25.390893936157227, "global_step": 300375, "epoch": 3618} {"train_loss": -25.499555587768555, "global_step": 300376, "epoch": 3618, "val_loss": 7261477.0} {"train_loss": -24.73069190979004, "global_step": 300377, "epoch": 3619} {"train_loss": -25.216455459594727, "global_step": 300378, "epoch": 3619} {"train_loss": -24.993892669677734, "global_step": 300379, "epoch": 3619} {"train_loss": -24.391103744506836, "global_step": 300380, "epoch": 3619} {"train_loss": -25.603717803955078, "global_step": 300381, "epoch": 3619} {"train_loss": -25.178186416625977, "global_step": 300382, "epoch": 3619} {"train_loss": -25.137025833129883, "global_step": 300383, "epoch": 3619} {"train_loss": -25.251541137695312, "global_step": 300384, "epoch": 3619} {"train_loss": -25.758228302001953, "global_step": 300385, "epoch": 3619} {"train_loss": -25.386781692504883, "global_step": 300386, "epoch": 3619} {"train_loss": -25.400165557861328, "global_step": 300387, "epoch": 3619} {"train_loss": -25.5446720123291, "global_step": 300388, "epoch": 3619} {"train_loss": -25.22629737854004, "global_step": 300389, "epoch": 3619} {"train_loss": -25.005979537963867, "global_step": 300390, "epoch": 3619} {"train_loss": -25.51542091369629, "global_step": 300391, "epoch": 3619} {"train_loss": -25.696603775024414, "global_step": 300392, "epoch": 3619} {"train_loss": -25.329801559448242, "global_step": 300393, "epoch": 3619} {"train_loss": -25.393775939941406, "global_step": 300394, "epoch": 3619} {"train_loss": -25.696680068969727, "global_step": 300395, "epoch": 3619} {"train_loss": -25.562522888183594, "global_step": 300396, "epoch": 3619} {"train_loss": -25.060596466064453, "global_step": 300397, "epoch": 3619} {"train_loss": -25.193220138549805, "global_step": 300398, "epoch": 3619} {"train_loss": -25.644678115844727, "global_step": 300399, "epoch": 3619} {"train_loss": -25.855224609375, "global_step": 300400, "epoch": 3619} {"train_loss": -25.947681427001953, "global_step": 300401, "epoch": 3619} {"train_loss": -25.46881103515625, "global_step": 300402, "epoch": 3619} {"train_loss": -25.469701766967773, "global_step": 300403, "epoch": 3619} {"train_loss": -25.800817489624023, "global_step": 300404, "epoch": 3619} {"train_loss": -25.513532638549805, "global_step": 300405, "epoch": 3619} {"train_loss": -25.8028564453125, "global_step": 300406, "epoch": 3619} {"train_loss": -25.81507682800293, "global_step": 300407, "epoch": 3619} {"train_loss": -25.538442611694336, "global_step": 300408, "epoch": 3619} {"train_loss": -25.83623695373535, "global_step": 300409, "epoch": 3619} {"train_loss": -25.903711318969727, "global_step": 300410, "epoch": 3619} {"train_loss": -25.551002502441406, "global_step": 300411, "epoch": 3619} {"train_loss": -25.698474884033203, "global_step": 300412, "epoch": 3619} {"train_loss": -25.641820907592773, "global_step": 300413, "epoch": 3619} {"train_loss": -25.550378799438477, "global_step": 300414, "epoch": 3619} {"train_loss": -25.8253231048584, "global_step": 300415, "epoch": 3619} {"train_loss": -25.40488624572754, "global_step": 300416, "epoch": 3619} {"train_loss": -25.88852882385254, "global_step": 300417, "epoch": 3619} {"train_loss": -25.469038009643555, "global_step": 300418, "epoch": 3619} {"train_loss": -25.669940948486328, "global_step": 300419, "epoch": 3619} {"train_loss": -25.919281005859375, "global_step": 300420, "epoch": 3619} {"train_loss": -25.760549545288086, "global_step": 300421, "epoch": 3619} {"train_loss": -25.415437698364258, "global_step": 300422, "epoch": 3619} {"train_loss": -25.783166885375977, "global_step": 300423, "epoch": 3619} {"train_loss": -25.973636627197266, "global_step": 300424, "epoch": 3619} {"train_loss": -25.532236099243164, "global_step": 300425, "epoch": 3619} {"train_loss": -25.96135902404785, "global_step": 300426, "epoch": 3619} {"train_loss": -25.49201011657715, "global_step": 300427, "epoch": 3619} {"train_loss": -25.552627563476562, "global_step": 300428, "epoch": 3619} {"train_loss": -25.570240020751953, "global_step": 300429, "epoch": 3619} {"train_loss": -25.93511390686035, "global_step": 300430, "epoch": 3619} {"train_loss": -25.470361709594727, "global_step": 300431, "epoch": 3619} {"train_loss": -25.607330322265625, "global_step": 300432, "epoch": 3619} {"train_loss": -25.670764923095703, "global_step": 300433, "epoch": 3619} {"train_loss": -25.840103149414062, "global_step": 300434, "epoch": 3619} {"train_loss": -25.528112411499023, "global_step": 300435, "epoch": 3619} {"train_loss": -25.82195472717285, "global_step": 300436, "epoch": 3619} {"train_loss": -25.9466552734375, "global_step": 300437, "epoch": 3619} {"train_loss": -25.758481979370117, "global_step": 300438, "epoch": 3619} {"train_loss": -25.878387451171875, "global_step": 300439, "epoch": 3619} {"train_loss": -25.613676071166992, "global_step": 300440, "epoch": 3619} {"train_loss": -25.582056045532227, "global_step": 300441, "epoch": 3619} {"train_loss": -25.172964096069336, "global_step": 300442, "epoch": 3619} {"train_loss": -25.795337677001953, "global_step": 300443, "epoch": 3619} {"train_loss": -25.82611656188965, "global_step": 300444, "epoch": 3619} {"train_loss": -25.7742862701416, "global_step": 300445, "epoch": 3619} {"train_loss": -25.5428409576416, "global_step": 300446, "epoch": 3619} {"train_loss": -25.61053466796875, "global_step": 300447, "epoch": 3619} {"train_loss": -25.145490646362305, "global_step": 300448, "epoch": 3619} {"train_loss": -25.69417381286621, "global_step": 300449, "epoch": 3619} {"train_loss": -25.722253799438477, "global_step": 300450, "epoch": 3619} {"train_loss": -25.63433265686035, "global_step": 300451, "epoch": 3619} {"train_loss": -25.58698081970215, "global_step": 300452, "epoch": 3619} {"train_loss": -25.74854850769043, "global_step": 300453, "epoch": 3619} {"train_loss": -25.456226348876953, "global_step": 300454, "epoch": 3619} {"train_loss": -25.696409225463867, "global_step": 300455, "epoch": 3619} {"train_loss": -25.7705020904541, "global_step": 300456, "epoch": 3619} {"train_loss": -25.891202926635742, "global_step": 300457, "epoch": 3619} {"train_loss": -25.76603126525879, "global_step": 300458, "epoch": 3619} {"train_loss": -25.559668000922144, "global_step": 300459, "epoch": 3619, "val_loss": 7300882.0} {"train_loss": -24.925601959228516, "global_step": 300460, "epoch": 3620} {"train_loss": -24.6489315032959, "global_step": 300461, "epoch": 3620} {"train_loss": -24.85198402404785, "global_step": 300462, "epoch": 3620} {"train_loss": -25.324390411376953, "global_step": 300463, "epoch": 3620} {"train_loss": -25.227619171142578, "global_step": 300464, "epoch": 3620} {"train_loss": -25.2644100189209, "global_step": 300465, "epoch": 3620} {"train_loss": -25.274580001831055, "global_step": 300466, "epoch": 3620} {"train_loss": -25.745996475219727, "global_step": 300467, "epoch": 3620} {"train_loss": -24.904159545898438, "global_step": 300468, "epoch": 3620} {"train_loss": -25.087202072143555, "global_step": 300469, "epoch": 3620} {"train_loss": -25.427785873413086, "global_step": 300470, "epoch": 3620} {"train_loss": -25.465848922729492, "global_step": 300471, "epoch": 3620} {"train_loss": -25.366905212402344, "global_step": 300472, "epoch": 3620} {"train_loss": -25.080371856689453, "global_step": 300473, "epoch": 3620} {"train_loss": -25.220943450927734, "global_step": 300474, "epoch": 3620} {"train_loss": -25.634729385375977, "global_step": 300475, "epoch": 3620} {"train_loss": -25.65528678894043, "global_step": 300476, "epoch": 3620} {"train_loss": -25.515867233276367, "global_step": 300477, "epoch": 3620} {"train_loss": -25.6339111328125, "global_step": 300478, "epoch": 3620} {"train_loss": -25.534900665283203, "global_step": 300479, "epoch": 3620} {"train_loss": -25.723718643188477, "global_step": 300480, "epoch": 3620} {"train_loss": -25.44854164123535, "global_step": 300481, "epoch": 3620} {"train_loss": -25.7274112701416, "global_step": 300482, "epoch": 3620} {"train_loss": -25.375415802001953, "global_step": 300483, "epoch": 3620} {"train_loss": -25.71988868713379, "global_step": 300484, "epoch": 3620} {"train_loss": -25.5304012298584, "global_step": 300485, "epoch": 3620} {"train_loss": -25.82221031188965, "global_step": 300486, "epoch": 3620} {"train_loss": -25.812376022338867, "global_step": 300487, "epoch": 3620} {"train_loss": -25.86246681213379, "global_step": 300488, "epoch": 3620} {"train_loss": -25.705337524414062, "global_step": 300489, "epoch": 3620} {"train_loss": -25.79840087890625, "global_step": 300490, "epoch": 3620} {"train_loss": -25.81156349182129, "global_step": 300491, "epoch": 3620} {"train_loss": -25.840560913085938, "global_step": 300492, "epoch": 3620} {"train_loss": -26.03114128112793, "global_step": 300493, "epoch": 3620} {"train_loss": -25.318740844726562, "global_step": 300494, "epoch": 3620} {"train_loss": -25.691314697265625, "global_step": 300495, "epoch": 3620} {"train_loss": -25.770116806030273, "global_step": 300496, "epoch": 3620} {"train_loss": -25.92438316345215, "global_step": 300497, "epoch": 3620} {"train_loss": -25.933624267578125, "global_step": 300498, "epoch": 3620} {"train_loss": -25.469213485717773, "global_step": 300499, "epoch": 3620} {"train_loss": -25.790735244750977, "global_step": 300500, "epoch": 3620} {"train_loss": -25.953861236572266, "global_step": 300501, "epoch": 3620} {"train_loss": -25.770177841186523, "global_step": 300502, "epoch": 3620} {"train_loss": -25.616241455078125, "global_step": 300503, "epoch": 3620} {"train_loss": -25.901952743530273, "global_step": 300504, "epoch": 3620} {"train_loss": -25.736404418945312, "global_step": 300505, "epoch": 3620} {"train_loss": -25.96670913696289, "global_step": 300506, "epoch": 3620} {"train_loss": -25.707870483398438, "global_step": 300507, "epoch": 3620} {"train_loss": -25.694787979125977, "global_step": 300508, "epoch": 3620} {"train_loss": -25.69978141784668, "global_step": 300509, "epoch": 3620} {"train_loss": -24.7135066986084, "global_step": 300510, "epoch": 3620} {"train_loss": -24.653522491455078, "global_step": 300511, "epoch": 3620} {"train_loss": -24.226842880249023, "global_step": 300512, "epoch": 3620} {"train_loss": -25.38887596130371, "global_step": 300513, "epoch": 3620} {"train_loss": -25.56943130493164, "global_step": 300514, "epoch": 3620} {"train_loss": -25.316518783569336, "global_step": 300515, "epoch": 3620} {"train_loss": -25.427703857421875, "global_step": 300516, "epoch": 3620} {"train_loss": -25.772891998291016, "global_step": 300517, "epoch": 3620} {"train_loss": -25.762121200561523, "global_step": 300518, "epoch": 3620} {"train_loss": -25.67146873474121, "global_step": 300519, "epoch": 3620} {"train_loss": -25.64313316345215, "global_step": 300520, "epoch": 3620} {"train_loss": -25.9492244720459, "global_step": 300521, "epoch": 3620} {"train_loss": -25.610471725463867, "global_step": 300522, "epoch": 3620} {"train_loss": -25.409162521362305, "global_step": 300523, "epoch": 3620} {"train_loss": -25.033414840698242, "global_step": 300524, "epoch": 3620} {"train_loss": -25.803442001342773, "global_step": 300525, "epoch": 3620} {"train_loss": -25.531768798828125, "global_step": 300526, "epoch": 3620} {"train_loss": -25.68267250061035, "global_step": 300527, "epoch": 3620} {"train_loss": -25.442462921142578, "global_step": 300528, "epoch": 3620} {"train_loss": -25.3944149017334, "global_step": 300529, "epoch": 3620} {"train_loss": -25.76079750061035, "global_step": 300530, "epoch": 3620} {"train_loss": -25.257978439331055, "global_step": 300531, "epoch": 3620} {"train_loss": -25.59549903869629, "global_step": 300532, "epoch": 3620} {"train_loss": -25.582998275756836, "global_step": 300533, "epoch": 3620} {"train_loss": -25.47413444519043, "global_step": 300534, "epoch": 3620} {"train_loss": -25.762470245361328, "global_step": 300535, "epoch": 3620} {"train_loss": -25.468652725219727, "global_step": 300536, "epoch": 3620} {"train_loss": -25.724105834960938, "global_step": 300537, "epoch": 3620} {"train_loss": -25.807449340820312, "global_step": 300538, "epoch": 3620} {"train_loss": -25.726964950561523, "global_step": 300539, "epoch": 3620} {"train_loss": -25.895954132080078, "global_step": 300540, "epoch": 3620} {"train_loss": -26.01189613342285, "global_step": 300541, "epoch": 3620} {"train_loss": -25.545402067253388, "global_step": 300542, "epoch": 3620, "val_loss": 7217411.0} {"train_loss": -25.136106491088867, "global_step": 300543, "epoch": 3621} {"train_loss": -24.2469539642334, "global_step": 300544, "epoch": 3621} {"train_loss": -25.116474151611328, "global_step": 300545, "epoch": 3621} {"train_loss": -25.295093536376953, "global_step": 300546, "epoch": 3621} {"train_loss": -25.084402084350586, "global_step": 300547, "epoch": 3621} {"train_loss": -25.78999137878418, "global_step": 300548, "epoch": 3621} {"train_loss": -25.533538818359375, "global_step": 300549, "epoch": 3621} {"train_loss": -25.412277221679688, "global_step": 300550, "epoch": 3621} {"train_loss": -25.342758178710938, "global_step": 300551, "epoch": 3621} {"train_loss": -25.515594482421875, "global_step": 300552, "epoch": 3621} {"train_loss": -25.410751342773438, "global_step": 300553, "epoch": 3621} {"train_loss": -25.472110748291016, "global_step": 300554, "epoch": 3621} {"train_loss": -25.15236473083496, "global_step": 300555, "epoch": 3621} {"train_loss": -25.52436065673828, "global_step": 300556, "epoch": 3621} {"train_loss": -25.332626342773438, "global_step": 300557, "epoch": 3621} {"train_loss": -25.354150772094727, "global_step": 300558, "epoch": 3621} {"train_loss": -25.573759078979492, "global_step": 300559, "epoch": 3621} {"train_loss": -25.986114501953125, "global_step": 300560, "epoch": 3621} {"train_loss": -25.671920776367188, "global_step": 300561, "epoch": 3621} {"train_loss": -25.24195098876953, "global_step": 300562, "epoch": 3621} {"train_loss": -25.2780818939209, "global_step": 300563, "epoch": 3621} {"train_loss": -25.02070426940918, "global_step": 300564, "epoch": 3621} {"train_loss": -25.520084381103516, "global_step": 300565, "epoch": 3621} {"train_loss": -25.428478240966797, "global_step": 300566, "epoch": 3621} {"train_loss": -25.826440811157227, "global_step": 300567, "epoch": 3621} {"train_loss": -25.529184341430664, "global_step": 300568, "epoch": 3621} {"train_loss": -25.13795280456543, "global_step": 300569, "epoch": 3621} {"train_loss": -25.640995025634766, "global_step": 300570, "epoch": 3621} {"train_loss": -25.277084350585938, "global_step": 300571, "epoch": 3621} {"train_loss": -25.41257667541504, "global_step": 300572, "epoch": 3621} {"train_loss": -25.4827938079834, "global_step": 300573, "epoch": 3621} {"train_loss": -25.4575252532959, "global_step": 300574, "epoch": 3621} {"train_loss": -25.302303314208984, "global_step": 300575, "epoch": 3621} {"train_loss": -25.557205200195312, "global_step": 300576, "epoch": 3621} {"train_loss": -25.665119171142578, "global_step": 300577, "epoch": 3621} {"train_loss": -25.828611373901367, "global_step": 300578, "epoch": 3621} {"train_loss": -25.381017684936523, "global_step": 300579, "epoch": 3621} {"train_loss": -25.77802848815918, "global_step": 300580, "epoch": 3621} {"train_loss": -25.92341423034668, "global_step": 300581, "epoch": 3621} {"train_loss": -25.41510772705078, "global_step": 300582, "epoch": 3621} {"train_loss": -25.63447380065918, "global_step": 300583, "epoch": 3621} {"train_loss": -25.630695343017578, "global_step": 300584, "epoch": 3621} {"train_loss": -25.92897605895996, "global_step": 300585, "epoch": 3621} {"train_loss": -26.0889892578125, "global_step": 300586, "epoch": 3621} {"train_loss": -25.922040939331055, "global_step": 300587, "epoch": 3621} {"train_loss": -25.791906356811523, "global_step": 300588, "epoch": 3621} {"train_loss": -25.87354850769043, "global_step": 300589, "epoch": 3621} {"train_loss": -26.179855346679688, "global_step": 300590, "epoch": 3621} {"train_loss": -25.857267379760742, "global_step": 300591, "epoch": 3621} {"train_loss": -25.386882781982422, "global_step": 300592, "epoch": 3621} {"train_loss": -25.932804107666016, "global_step": 300593, "epoch": 3621} {"train_loss": -25.450204849243164, "global_step": 300594, "epoch": 3621} {"train_loss": -25.706134796142578, "global_step": 300595, "epoch": 3621} {"train_loss": -25.57744026184082, "global_step": 300596, "epoch": 3621} {"train_loss": -25.588132858276367, "global_step": 300597, "epoch": 3621} {"train_loss": -25.435623168945312, "global_step": 300598, "epoch": 3621} {"train_loss": -25.915014266967773, "global_step": 300599, "epoch": 3621} {"train_loss": -25.730443954467773, "global_step": 300600, "epoch": 3621} {"train_loss": -25.980224609375, "global_step": 300601, "epoch": 3621} {"train_loss": -25.313583374023438, "global_step": 300602, "epoch": 3621} {"train_loss": -26.1708927154541, "global_step": 300603, "epoch": 3621} {"train_loss": -26.04444694519043, "global_step": 300604, "epoch": 3621} {"train_loss": -25.31599998474121, "global_step": 300605, "epoch": 3621} {"train_loss": -25.98929786682129, "global_step": 300606, "epoch": 3621} {"train_loss": -25.893064498901367, "global_step": 300607, "epoch": 3621} {"train_loss": -25.50351333618164, "global_step": 300608, "epoch": 3621} {"train_loss": -25.721487045288086, "global_step": 300609, "epoch": 3621} {"train_loss": -25.740690231323242, "global_step": 300610, "epoch": 3621} {"train_loss": -25.436555862426758, "global_step": 300611, "epoch": 3621} {"train_loss": -25.454120635986328, "global_step": 300612, "epoch": 3621} {"train_loss": -25.592737197875977, "global_step": 300613, "epoch": 3621} {"train_loss": -25.49952507019043, "global_step": 300614, "epoch": 3621} {"train_loss": -25.69772720336914, "global_step": 300615, "epoch": 3621} {"train_loss": -25.904449462890625, "global_step": 300616, "epoch": 3621} {"train_loss": -25.77631950378418, "global_step": 300617, "epoch": 3621} {"train_loss": -25.56341552734375, "global_step": 300618, "epoch": 3621} {"train_loss": -25.763341903686523, "global_step": 300619, "epoch": 3621} {"train_loss": -25.2750244140625, "global_step": 300620, "epoch": 3621} {"train_loss": -25.359943389892578, "global_step": 300621, "epoch": 3621} {"train_loss": -25.792814254760742, "global_step": 300622, "epoch": 3621} {"train_loss": -25.420373916625977, "global_step": 300623, "epoch": 3621} {"train_loss": -25.175979614257812, "global_step": 300624, "epoch": 3621} {"train_loss": -25.566132212259685, "global_step": 300625, "epoch": 3621, "val_loss": 7332977.5} {"train_loss": -23.105819702148438, "global_step": 300626, "epoch": 3622} {"train_loss": -23.86350440979004, "global_step": 300627, "epoch": 3622} {"train_loss": -23.8817138671875, "global_step": 300628, "epoch": 3622} {"train_loss": -24.893142700195312, "global_step": 300629, "epoch": 3622} {"train_loss": -24.839908599853516, "global_step": 300630, "epoch": 3622} {"train_loss": -23.9381160736084, "global_step": 300631, "epoch": 3622} {"train_loss": -25.006498336791992, "global_step": 300632, "epoch": 3622} {"train_loss": -24.628833770751953, "global_step": 300633, "epoch": 3622} {"train_loss": -24.92958641052246, "global_step": 300634, "epoch": 3622} {"train_loss": -24.944917678833008, "global_step": 300635, "epoch": 3622} {"train_loss": -24.785663604736328, "global_step": 300636, "epoch": 3622} {"train_loss": -25.127784729003906, "global_step": 300637, "epoch": 3622} {"train_loss": -25.212682723999023, "global_step": 300638, "epoch": 3622} {"train_loss": -25.125993728637695, "global_step": 300639, "epoch": 3622} {"train_loss": -25.3261775970459, "global_step": 300640, "epoch": 3622} {"train_loss": -24.959518432617188, "global_step": 300641, "epoch": 3622} {"train_loss": -24.9392147064209, "global_step": 300642, "epoch": 3622} {"train_loss": -25.25691032409668, "global_step": 300643, "epoch": 3622} {"train_loss": -24.990997314453125, "global_step": 300644, "epoch": 3622} {"train_loss": -25.48080062866211, "global_step": 300645, "epoch": 3622} {"train_loss": -25.429216384887695, "global_step": 300646, "epoch": 3622} {"train_loss": -25.645252227783203, "global_step": 300647, "epoch": 3622} {"train_loss": -25.537561416625977, "global_step": 300648, "epoch": 3622} {"train_loss": -25.388490676879883, "global_step": 300649, "epoch": 3622} {"train_loss": -25.270925521850586, "global_step": 300650, "epoch": 3622} {"train_loss": -25.868301391601562, "global_step": 300651, "epoch": 3622} {"train_loss": -25.71382713317871, "global_step": 300652, "epoch": 3622} {"train_loss": -25.667306900024414, "global_step": 300653, "epoch": 3622} {"train_loss": -25.491668701171875, "global_step": 300654, "epoch": 3622} {"train_loss": -25.69327735900879, "global_step": 300655, "epoch": 3622} {"train_loss": -25.415130615234375, "global_step": 300656, "epoch": 3622} {"train_loss": -25.652135848999023, "global_step": 300657, "epoch": 3622} {"train_loss": -25.453859329223633, "global_step": 300658, "epoch": 3622} {"train_loss": -25.68745994567871, "global_step": 300659, "epoch": 3622} {"train_loss": -25.67523765563965, "global_step": 300660, "epoch": 3622} {"train_loss": -25.717010498046875, "global_step": 300661, "epoch": 3622} {"train_loss": -25.21176528930664, "global_step": 300662, "epoch": 3622} {"train_loss": -25.586843490600586, "global_step": 300663, "epoch": 3622} {"train_loss": -25.480222702026367, "global_step": 300664, "epoch": 3622} {"train_loss": -25.263580322265625, "global_step": 300665, "epoch": 3622} {"train_loss": -25.529630661010742, "global_step": 300666, "epoch": 3622} {"train_loss": -25.468929290771484, "global_step": 300667, "epoch": 3622} {"train_loss": -25.578580856323242, "global_step": 300668, "epoch": 3622} {"train_loss": -25.564802169799805, "global_step": 300669, "epoch": 3622} {"train_loss": -25.43656349182129, "global_step": 300670, "epoch": 3622} {"train_loss": -25.639572143554688, "global_step": 300671, "epoch": 3622} {"train_loss": -25.466571807861328, "global_step": 300672, "epoch": 3622} {"train_loss": -25.52764320373535, "global_step": 300673, "epoch": 3622} {"train_loss": -25.66766929626465, "global_step": 300674, "epoch": 3622} {"train_loss": -25.22798728942871, "global_step": 300675, "epoch": 3622} {"train_loss": -25.471054077148438, "global_step": 300676, "epoch": 3622} {"train_loss": -25.220731735229492, "global_step": 300677, "epoch": 3622} {"train_loss": -25.772851943969727, "global_step": 300678, "epoch": 3622} {"train_loss": -25.545494079589844, "global_step": 300679, "epoch": 3622} {"train_loss": -25.425262451171875, "global_step": 300680, "epoch": 3622} {"train_loss": -25.501829147338867, "global_step": 300681, "epoch": 3622} {"train_loss": -25.447296142578125, "global_step": 300682, "epoch": 3622} {"train_loss": -25.52552604675293, "global_step": 300683, "epoch": 3622} {"train_loss": -25.191631317138672, "global_step": 300684, "epoch": 3622} {"train_loss": -25.55854606628418, "global_step": 300685, "epoch": 3622} {"train_loss": -25.602148056030273, "global_step": 300686, "epoch": 3622} {"train_loss": -25.455923080444336, "global_step": 300687, "epoch": 3622} {"train_loss": -25.616867065429688, "global_step": 300688, "epoch": 3622} {"train_loss": -25.303823471069336, "global_step": 300689, "epoch": 3622} {"train_loss": -25.956897735595703, "global_step": 300690, "epoch": 3622} {"train_loss": -25.544719696044922, "global_step": 300691, "epoch": 3622} {"train_loss": -25.411985397338867, "global_step": 300692, "epoch": 3622} {"train_loss": -25.46132469177246, "global_step": 300693, "epoch": 3622} {"train_loss": -25.676136016845703, "global_step": 300694, "epoch": 3622} {"train_loss": -25.527984619140625, "global_step": 300695, "epoch": 3622} {"train_loss": -25.405410766601562, "global_step": 300696, "epoch": 3622} {"train_loss": -25.898578643798828, "global_step": 300697, "epoch": 3622} {"train_loss": -25.591970443725586, "global_step": 300698, "epoch": 3622} {"train_loss": -25.231372833251953, "global_step": 300699, "epoch": 3622} {"train_loss": -25.5390682220459, "global_step": 300700, "epoch": 3622} {"train_loss": -25.822973251342773, "global_step": 300701, "epoch": 3622} {"train_loss": -25.897192001342773, "global_step": 300702, "epoch": 3622} {"train_loss": -26.13898277282715, "global_step": 300703, "epoch": 3622} {"train_loss": -25.868139266967773, "global_step": 300704, "epoch": 3622} {"train_loss": -25.447769165039062, "global_step": 300705, "epoch": 3622} {"train_loss": -25.948566436767578, "global_step": 300706, "epoch": 3622} {"train_loss": -25.84918785095215, "global_step": 300707, "epoch": 3622} {"train_loss": -25.371804202895568, "global_step": 300708, "epoch": 3622, "val_loss": 7031520.0} {"train_loss": -25.258787155151367, "global_step": 300709, "epoch": 3623} {"train_loss": -25.26815414428711, "global_step": 300710, "epoch": 3623} {"train_loss": -25.051559448242188, "global_step": 300711, "epoch": 3623} {"train_loss": -25.243438720703125, "global_step": 300712, "epoch": 3623} {"train_loss": -25.50653648376465, "global_step": 300713, "epoch": 3623} {"train_loss": -25.273401260375977, "global_step": 300714, "epoch": 3623} {"train_loss": -24.694997787475586, "global_step": 300715, "epoch": 3623} {"train_loss": -25.0170955657959, "global_step": 300716, "epoch": 3623} {"train_loss": -25.502588272094727, "global_step": 300717, "epoch": 3623} {"train_loss": -24.961599349975586, "global_step": 300718, "epoch": 3623} {"train_loss": -25.036418914794922, "global_step": 300719, "epoch": 3623} {"train_loss": -25.515398025512695, "global_step": 300720, "epoch": 3623} {"train_loss": -25.505643844604492, "global_step": 300721, "epoch": 3623} {"train_loss": -25.546703338623047, "global_step": 300722, "epoch": 3623} {"train_loss": -25.16826629638672, "global_step": 300723, "epoch": 3623} {"train_loss": -25.710376739501953, "global_step": 300724, "epoch": 3623} {"train_loss": -25.583995819091797, "global_step": 300725, "epoch": 3623} {"train_loss": -25.838794708251953, "global_step": 300726, "epoch": 3623} {"train_loss": -25.519298553466797, "global_step": 300727, "epoch": 3623} {"train_loss": -25.560373306274414, "global_step": 300728, "epoch": 3623} {"train_loss": -25.691003799438477, "global_step": 300729, "epoch": 3623} {"train_loss": -25.40732192993164, "global_step": 300730, "epoch": 3623} {"train_loss": -25.6509952545166, "global_step": 300731, "epoch": 3623} {"train_loss": -25.55119514465332, "global_step": 300732, "epoch": 3623} {"train_loss": -26.046125411987305, "global_step": 300733, "epoch": 3623} {"train_loss": -26.04755210876465, "global_step": 300734, "epoch": 3623} {"train_loss": -25.57568359375, "global_step": 300735, "epoch": 3623} {"train_loss": -25.643497467041016, "global_step": 300736, "epoch": 3623} {"train_loss": -25.67853355407715, "global_step": 300737, "epoch": 3623} {"train_loss": -25.499128341674805, "global_step": 300738, "epoch": 3623} {"train_loss": -25.834821701049805, "global_step": 300739, "epoch": 3623} {"train_loss": -25.445171356201172, "global_step": 300740, "epoch": 3623} {"train_loss": -25.50298500061035, "global_step": 300741, "epoch": 3623} {"train_loss": -25.7020320892334, "global_step": 300742, "epoch": 3623} {"train_loss": -25.467496871948242, "global_step": 300743, "epoch": 3623} {"train_loss": -25.751733779907227, "global_step": 300744, "epoch": 3623} {"train_loss": -25.7404842376709, "global_step": 300745, "epoch": 3623} {"train_loss": -26.124343872070312, "global_step": 300746, "epoch": 3623} {"train_loss": -25.3981990814209, "global_step": 300747, "epoch": 3623} {"train_loss": -25.418203353881836, "global_step": 300748, "epoch": 3623} {"train_loss": -25.55801010131836, "global_step": 300749, "epoch": 3623} {"train_loss": -25.6727352142334, "global_step": 300750, "epoch": 3623} {"train_loss": -25.106359481811523, "global_step": 300751, "epoch": 3623} {"train_loss": -25.50686264038086, "global_step": 300752, "epoch": 3623} {"train_loss": -25.636144638061523, "global_step": 300753, "epoch": 3623} {"train_loss": -25.724756240844727, "global_step": 300754, "epoch": 3623} {"train_loss": -25.248516082763672, "global_step": 300755, "epoch": 3623} {"train_loss": -25.7296085357666, "global_step": 300756, "epoch": 3623} {"train_loss": -25.57539176940918, "global_step": 300757, "epoch": 3623} {"train_loss": -25.964801788330078, "global_step": 300758, "epoch": 3623} {"train_loss": -25.363027572631836, "global_step": 300759, "epoch": 3623} {"train_loss": -25.602649688720703, "global_step": 300760, "epoch": 3623} {"train_loss": -26.059497833251953, "global_step": 300761, "epoch": 3623} {"train_loss": -25.23457908630371, "global_step": 300762, "epoch": 3623} {"train_loss": -25.78726577758789, "global_step": 300763, "epoch": 3623} {"train_loss": -25.361053466796875, "global_step": 300764, "epoch": 3623} {"train_loss": -25.647836685180664, "global_step": 300765, "epoch": 3623} {"train_loss": -25.429868698120117, "global_step": 300766, "epoch": 3623} {"train_loss": -25.7608642578125, "global_step": 300767, "epoch": 3623} {"train_loss": -25.507822036743164, "global_step": 300768, "epoch": 3623} {"train_loss": -25.691431045532227, "global_step": 300769, "epoch": 3623} {"train_loss": -25.6850528717041, "global_step": 300770, "epoch": 3623} {"train_loss": -25.654699325561523, "global_step": 300771, "epoch": 3623} {"train_loss": -25.68485450744629, "global_step": 300772, "epoch": 3623} {"train_loss": -25.680768966674805, "global_step": 300773, "epoch": 3623} {"train_loss": -25.903446197509766, "global_step": 300774, "epoch": 3623} {"train_loss": -25.481903076171875, "global_step": 300775, "epoch": 3623} {"train_loss": -25.732004165649414, "global_step": 300776, "epoch": 3623} {"train_loss": -25.824132919311523, "global_step": 300777, "epoch": 3623} {"train_loss": -25.480161666870117, "global_step": 300778, "epoch": 3623} {"train_loss": -25.984485626220703, "global_step": 300779, "epoch": 3623} {"train_loss": -25.692996978759766, "global_step": 300780, "epoch": 3623} {"train_loss": -25.32596206665039, "global_step": 300781, "epoch": 3623} {"train_loss": -25.60613441467285, "global_step": 300782, "epoch": 3623} {"train_loss": -25.642271041870117, "global_step": 300783, "epoch": 3623} {"train_loss": -25.643152236938477, "global_step": 300784, "epoch": 3623} {"train_loss": -25.61561393737793, "global_step": 300785, "epoch": 3623} {"train_loss": -26.013376235961914, "global_step": 300786, "epoch": 3623} {"train_loss": -25.72101402282715, "global_step": 300787, "epoch": 3623} {"train_loss": -25.635061264038086, "global_step": 300788, "epoch": 3623} {"train_loss": -25.541873931884766, "global_step": 300789, "epoch": 3623} {"train_loss": -25.495059967041016, "global_step": 300790, "epoch": 3623} {"train_loss": -25.548720233411675, "global_step": 300791, "epoch": 3623, "val_loss": 7234895.5} {"train_loss": -24.63702964782715, "global_step": 300792, "epoch": 3624} {"train_loss": -24.861791610717773, "global_step": 300793, "epoch": 3624} {"train_loss": -25.247703552246094, "global_step": 300794, "epoch": 3624} {"train_loss": -25.018049240112305, "global_step": 300795, "epoch": 3624} {"train_loss": -24.847929000854492, "global_step": 300796, "epoch": 3624} {"train_loss": -25.507282257080078, "global_step": 300797, "epoch": 3624} {"train_loss": -24.520179748535156, "global_step": 300798, "epoch": 3624} {"train_loss": -25.092832565307617, "global_step": 300799, "epoch": 3624} {"train_loss": -25.037702560424805, "global_step": 300800, "epoch": 3624} {"train_loss": -25.35146141052246, "global_step": 300801, "epoch": 3624} {"train_loss": -25.661407470703125, "global_step": 300802, "epoch": 3624} {"train_loss": -25.49329948425293, "global_step": 300803, "epoch": 3624} {"train_loss": -25.56475067138672, "global_step": 300804, "epoch": 3624} {"train_loss": -25.623825073242188, "global_step": 300805, "epoch": 3624} {"train_loss": -25.311359405517578, "global_step": 300806, "epoch": 3624} {"train_loss": -25.399492263793945, "global_step": 300807, "epoch": 3624} {"train_loss": -25.563230514526367, "global_step": 300808, "epoch": 3624} {"train_loss": -25.41168212890625, "global_step": 300809, "epoch": 3624} {"train_loss": -25.258150100708008, "global_step": 300810, "epoch": 3624} {"train_loss": -25.506521224975586, "global_step": 300811, "epoch": 3624} {"train_loss": -25.352922439575195, "global_step": 300812, "epoch": 3624} {"train_loss": -25.458412170410156, "global_step": 300813, "epoch": 3624} {"train_loss": -25.160917282104492, "global_step": 300814, "epoch": 3624} {"train_loss": -25.121898651123047, "global_step": 300815, "epoch": 3624} {"train_loss": -25.308820724487305, "global_step": 300816, "epoch": 3624} {"train_loss": -25.29009437561035, "global_step": 300817, "epoch": 3624} {"train_loss": -25.57577133178711, "global_step": 300818, "epoch": 3624} {"train_loss": -25.205835342407227, "global_step": 300819, "epoch": 3624} {"train_loss": -25.630664825439453, "global_step": 300820, "epoch": 3624} {"train_loss": -25.31865882873535, "global_step": 300821, "epoch": 3624} {"train_loss": -25.5580997467041, "global_step": 300822, "epoch": 3624} {"train_loss": -25.7746524810791, "global_step": 300823, "epoch": 3624} {"train_loss": -25.779052734375, "global_step": 300824, "epoch": 3624} {"train_loss": -25.224441528320312, "global_step": 300825, "epoch": 3624} {"train_loss": -25.557226181030273, "global_step": 300826, "epoch": 3624} {"train_loss": -25.653059005737305, "global_step": 300827, "epoch": 3624} {"train_loss": -25.91339683532715, "global_step": 300828, "epoch": 3624} {"train_loss": -25.999359130859375, "global_step": 300829, "epoch": 3624} {"train_loss": -25.572412490844727, "global_step": 300830, "epoch": 3624} {"train_loss": -25.637012481689453, "global_step": 300831, "epoch": 3624} {"train_loss": -26.010669708251953, "global_step": 300832, "epoch": 3624} {"train_loss": -25.759145736694336, "global_step": 300833, "epoch": 3624} {"train_loss": -25.774250030517578, "global_step": 300834, "epoch": 3624} {"train_loss": -25.7554874420166, "global_step": 300835, "epoch": 3624} {"train_loss": -25.925201416015625, "global_step": 300836, "epoch": 3624} {"train_loss": -25.446321487426758, "global_step": 300837, "epoch": 3624} {"train_loss": -25.847082138061523, "global_step": 300838, "epoch": 3624} {"train_loss": -25.968597412109375, "global_step": 300839, "epoch": 3624} {"train_loss": -25.822031021118164, "global_step": 300840, "epoch": 3624} {"train_loss": -25.7203369140625, "global_step": 300841, "epoch": 3624} {"train_loss": -25.881505966186523, "global_step": 300842, "epoch": 3624} {"train_loss": -25.492048263549805, "global_step": 300843, "epoch": 3624} {"train_loss": -25.622888565063477, "global_step": 300844, "epoch": 3624} {"train_loss": -25.46124267578125, "global_step": 300845, "epoch": 3624} {"train_loss": -25.50107765197754, "global_step": 300846, "epoch": 3624} {"train_loss": -26.049779891967773, "global_step": 300847, "epoch": 3624} {"train_loss": -25.521106719970703, "global_step": 300848, "epoch": 3624} {"train_loss": -25.570159912109375, "global_step": 300849, "epoch": 3624} {"train_loss": -25.640262603759766, "global_step": 300850, "epoch": 3624} {"train_loss": -25.703062057495117, "global_step": 300851, "epoch": 3624} {"train_loss": -25.620624542236328, "global_step": 300852, "epoch": 3624} {"train_loss": -25.58717155456543, "global_step": 300853, "epoch": 3624} {"train_loss": -25.293567657470703, "global_step": 300854, "epoch": 3624} {"train_loss": -25.69269371032715, "global_step": 300855, "epoch": 3624} {"train_loss": -25.591405868530273, "global_step": 300856, "epoch": 3624} {"train_loss": -25.15165138244629, "global_step": 300857, "epoch": 3624} {"train_loss": -25.34815788269043, "global_step": 300858, "epoch": 3624} {"train_loss": -25.337844848632812, "global_step": 300859, "epoch": 3624} {"train_loss": -25.52499771118164, "global_step": 300860, "epoch": 3624} {"train_loss": -25.769697189331055, "global_step": 300861, "epoch": 3624} {"train_loss": -25.583539962768555, "global_step": 300862, "epoch": 3624} {"train_loss": -25.57377052307129, "global_step": 300863, "epoch": 3624} {"train_loss": -25.754369735717773, "global_step": 300864, "epoch": 3624} {"train_loss": -25.58287239074707, "global_step": 300865, "epoch": 3624} {"train_loss": -25.670923233032227, "global_step": 300866, "epoch": 3624} {"train_loss": -25.724002838134766, "global_step": 300867, "epoch": 3624} {"train_loss": -25.776458740234375, "global_step": 300868, "epoch": 3624} {"train_loss": -25.49085235595703, "global_step": 300869, "epoch": 3624} {"train_loss": -25.51474952697754, "global_step": 300870, "epoch": 3624} {"train_loss": -25.683990478515625, "global_step": 300871, "epoch": 3624} {"train_loss": -25.86395263671875, "global_step": 300872, "epoch": 3624} {"train_loss": -25.412879943847656, "global_step": 300873, "epoch": 3624} {"train_loss": -25.530962220157484, "global_step": 300874, "epoch": 3624, "val_loss": 7156045.0} {"train_loss": -25.614490509033203, "global_step": 300875, "epoch": 3625} {"train_loss": -25.249452590942383, "global_step": 300876, "epoch": 3625} {"train_loss": -25.343948364257812, "global_step": 300877, "epoch": 3625} {"train_loss": -25.182737350463867, "global_step": 300878, "epoch": 3625} {"train_loss": -25.206403732299805, "global_step": 300879, "epoch": 3625} {"train_loss": -25.113492965698242, "global_step": 300880, "epoch": 3625} {"train_loss": -25.64314842224121, "global_step": 300881, "epoch": 3625} {"train_loss": -25.193485260009766, "global_step": 300882, "epoch": 3625} {"train_loss": -25.306577682495117, "global_step": 300883, "epoch": 3625} {"train_loss": -25.967050552368164, "global_step": 300884, "epoch": 3625} {"train_loss": -25.271703720092773, "global_step": 300885, "epoch": 3625} {"train_loss": -25.623743057250977, "global_step": 300886, "epoch": 3625} {"train_loss": -25.61935806274414, "global_step": 300887, "epoch": 3625} {"train_loss": -25.44124412536621, "global_step": 300888, "epoch": 3625} {"train_loss": -25.985126495361328, "global_step": 300889, "epoch": 3625} {"train_loss": -25.40522003173828, "global_step": 300890, "epoch": 3625} {"train_loss": -25.632165908813477, "global_step": 300891, "epoch": 3625} {"train_loss": -25.544458389282227, "global_step": 300892, "epoch": 3625} {"train_loss": -25.479150772094727, "global_step": 300893, "epoch": 3625} {"train_loss": -25.68284034729004, "global_step": 300894, "epoch": 3625} {"train_loss": -25.485197067260742, "global_step": 300895, "epoch": 3625} {"train_loss": -25.73064613342285, "global_step": 300896, "epoch": 3625} {"train_loss": -25.441457748413086, "global_step": 300897, "epoch": 3625} {"train_loss": -25.527944564819336, "global_step": 300898, "epoch": 3625} {"train_loss": -25.474782943725586, "global_step": 300899, "epoch": 3625} {"train_loss": -25.59018898010254, "global_step": 300900, "epoch": 3625} {"train_loss": -25.781396865844727, "global_step": 300901, "epoch": 3625} {"train_loss": -25.76704216003418, "global_step": 300902, "epoch": 3625} {"train_loss": -25.668439865112305, "global_step": 300903, "epoch": 3625} {"train_loss": -25.799823760986328, "global_step": 300904, "epoch": 3625} {"train_loss": -25.621702194213867, "global_step": 300905, "epoch": 3625} {"train_loss": -26.12741470336914, "global_step": 300906, "epoch": 3625} {"train_loss": -26.13315200805664, "global_step": 300907, "epoch": 3625} {"train_loss": -25.654804229736328, "global_step": 300908, "epoch": 3625} {"train_loss": -25.6384220123291, "global_step": 300909, "epoch": 3625} {"train_loss": -25.912158966064453, "global_step": 300910, "epoch": 3625} {"train_loss": -26.04463768005371, "global_step": 300911, "epoch": 3625} {"train_loss": -25.976842880249023, "global_step": 300912, "epoch": 3625} {"train_loss": -25.810949325561523, "global_step": 300913, "epoch": 3625} {"train_loss": -25.836050033569336, "global_step": 300914, "epoch": 3625} {"train_loss": -25.573606491088867, "global_step": 300915, "epoch": 3625} {"train_loss": -25.6471004486084, "global_step": 300916, "epoch": 3625} {"train_loss": -25.77301597595215, "global_step": 300917, "epoch": 3625} {"train_loss": -25.921741485595703, "global_step": 300918, "epoch": 3625} {"train_loss": -25.375699996948242, "global_step": 300919, "epoch": 3625} {"train_loss": -25.6357479095459, "global_step": 300920, "epoch": 3625} {"train_loss": -25.451889038085938, "global_step": 300921, "epoch": 3625} {"train_loss": -25.71494483947754, "global_step": 300922, "epoch": 3625} {"train_loss": -25.35831642150879, "global_step": 300923, "epoch": 3625} {"train_loss": -25.559494018554688, "global_step": 300924, "epoch": 3625} {"train_loss": -25.810626983642578, "global_step": 300925, "epoch": 3625} {"train_loss": -25.80494499206543, "global_step": 300926, "epoch": 3625} {"train_loss": -25.358951568603516, "global_step": 300927, "epoch": 3625} {"train_loss": -25.561172485351562, "global_step": 300928, "epoch": 3625} {"train_loss": -25.907379150390625, "global_step": 300929, "epoch": 3625} {"train_loss": -25.697967529296875, "global_step": 300930, "epoch": 3625} {"train_loss": -25.625823974609375, "global_step": 300931, "epoch": 3625} {"train_loss": -26.072729110717773, "global_step": 300932, "epoch": 3625} {"train_loss": -25.869293212890625, "global_step": 300933, "epoch": 3625} {"train_loss": -25.5483455657959, "global_step": 300934, "epoch": 3625} {"train_loss": -25.746891021728516, "global_step": 300935, "epoch": 3625} {"train_loss": -26.052770614624023, "global_step": 300936, "epoch": 3625} {"train_loss": -25.23193359375, "global_step": 300937, "epoch": 3625} {"train_loss": -25.470117568969727, "global_step": 300938, "epoch": 3625} {"train_loss": -25.852941513061523, "global_step": 300939, "epoch": 3625} {"train_loss": -25.494247436523438, "global_step": 300940, "epoch": 3625} {"train_loss": -25.823062896728516, "global_step": 300941, "epoch": 3625} {"train_loss": -25.750226974487305, "global_step": 300942, "epoch": 3625} {"train_loss": -25.97723960876465, "global_step": 300943, "epoch": 3625} {"train_loss": -25.74590492248535, "global_step": 300944, "epoch": 3625} {"train_loss": -26.1307430267334, "global_step": 300945, "epoch": 3625} {"train_loss": -25.478031158447266, "global_step": 300946, "epoch": 3625} {"train_loss": -25.604965209960938, "global_step": 300947, "epoch": 3625} {"train_loss": -25.864709854125977, "global_step": 300948, "epoch": 3625} {"train_loss": -26.179121017456055, "global_step": 300949, "epoch": 3625} {"train_loss": -25.756772994995117, "global_step": 300950, "epoch": 3625} {"train_loss": -25.74616050720215, "global_step": 300951, "epoch": 3625} {"train_loss": -26.013568878173828, "global_step": 300952, "epoch": 3625} {"train_loss": -25.834461212158203, "global_step": 300953, "epoch": 3625} {"train_loss": -25.520193099975586, "global_step": 300954, "epoch": 3625} {"train_loss": -24.93794059753418, "global_step": 300955, "epoch": 3625} {"train_loss": -23.93973731994629, "global_step": 300956, "epoch": 3625} {"train_loss": -25.627690211836114, "global_step": 300957, "epoch": 3625, "val_loss": 7280396.0} {"train_loss": -22.643800735473633, "global_step": 300958, "epoch": 3626} {"train_loss": -23.10104751586914, "global_step": 300959, "epoch": 3626} {"train_loss": -23.111717224121094, "global_step": 300960, "epoch": 3626} {"train_loss": -22.536598205566406, "global_step": 300961, "epoch": 3626} {"train_loss": -23.772966384887695, "global_step": 300962, "epoch": 3626} {"train_loss": -23.516820907592773, "global_step": 300963, "epoch": 3626} {"train_loss": -23.689298629760742, "global_step": 300964, "epoch": 3626} {"train_loss": -23.724124908447266, "global_step": 300965, "epoch": 3626} {"train_loss": -24.27397346496582, "global_step": 300966, "epoch": 3626} {"train_loss": -23.552066802978516, "global_step": 300967, "epoch": 3626} {"train_loss": -24.19977378845215, "global_step": 300968, "epoch": 3626} {"train_loss": -24.43739891052246, "global_step": 300969, "epoch": 3626} {"train_loss": -23.85273551940918, "global_step": 300970, "epoch": 3626} {"train_loss": -24.02912712097168, "global_step": 300971, "epoch": 3626} {"train_loss": -24.453458786010742, "global_step": 300972, "epoch": 3626} {"train_loss": -24.431346893310547, "global_step": 300973, "epoch": 3626} {"train_loss": -25.098907470703125, "global_step": 300974, "epoch": 3626} {"train_loss": -24.60398292541504, "global_step": 300975, "epoch": 3626} {"train_loss": -24.240713119506836, "global_step": 300976, "epoch": 3626} {"train_loss": -24.38886070251465, "global_step": 300977, "epoch": 3626} {"train_loss": -24.601537704467773, "global_step": 300978, "epoch": 3626} {"train_loss": -24.8861141204834, "global_step": 300979, "epoch": 3626} {"train_loss": -24.71781349182129, "global_step": 300980, "epoch": 3626} {"train_loss": -24.938650131225586, "global_step": 300981, "epoch": 3626} {"train_loss": -24.788978576660156, "global_step": 300982, "epoch": 3626} {"train_loss": -24.731597900390625, "global_step": 300983, "epoch": 3626} {"train_loss": -25.004161834716797, "global_step": 300984, "epoch": 3626} {"train_loss": -24.98225212097168, "global_step": 300985, "epoch": 3626} {"train_loss": -24.92889976501465, "global_step": 300986, "epoch": 3626} {"train_loss": -24.83378791809082, "global_step": 300987, "epoch": 3626} {"train_loss": -24.980098724365234, "global_step": 300988, "epoch": 3626} {"train_loss": -25.199697494506836, "global_step": 300989, "epoch": 3626} {"train_loss": -24.934812545776367, "global_step": 300990, "epoch": 3626} {"train_loss": -25.31599998474121, "global_step": 300991, "epoch": 3626} {"train_loss": -25.21786880493164, "global_step": 300992, "epoch": 3626} {"train_loss": -24.91783905029297, "global_step": 300993, "epoch": 3626} {"train_loss": -25.360342025756836, "global_step": 300994, "epoch": 3626} {"train_loss": -25.032337188720703, "global_step": 300995, "epoch": 3626} {"train_loss": -25.26373291015625, "global_step": 300996, "epoch": 3626} {"train_loss": -25.3604736328125, "global_step": 300997, "epoch": 3626} {"train_loss": -25.752521514892578, "global_step": 300998, "epoch": 3626} {"train_loss": -25.60178565979004, "global_step": 300999, "epoch": 3626} {"train_loss": -24.86615753173828, "global_step": 301000, "epoch": 3626} {"train_loss": -26.035507202148438, "global_step": 301001, "epoch": 3626} {"train_loss": -25.571203231811523, "global_step": 301002, "epoch": 3626} {"train_loss": -25.414621353149414, "global_step": 301003, "epoch": 3626} {"train_loss": -25.7077693939209, "global_step": 301004, "epoch": 3626} {"train_loss": -25.759321212768555, "global_step": 301005, "epoch": 3626} {"train_loss": -25.846332550048828, "global_step": 301006, "epoch": 3626} {"train_loss": -25.567838668823242, "global_step": 301007, "epoch": 3626} {"train_loss": -25.635852813720703, "global_step": 301008, "epoch": 3626} {"train_loss": -25.295902252197266, "global_step": 301009, "epoch": 3626} {"train_loss": -25.833938598632812, "global_step": 301010, "epoch": 3626} {"train_loss": -25.720922470092773, "global_step": 301011, "epoch": 3626} {"train_loss": -25.743467330932617, "global_step": 301012, "epoch": 3626} {"train_loss": -25.736658096313477, "global_step": 301013, "epoch": 3626} {"train_loss": -25.950342178344727, "global_step": 301014, "epoch": 3626} {"train_loss": -25.6715087890625, "global_step": 301015, "epoch": 3626} {"train_loss": -25.708723068237305, "global_step": 301016, "epoch": 3626} {"train_loss": -25.550968170166016, "global_step": 301017, "epoch": 3626} {"train_loss": -25.628686904907227, "global_step": 301018, "epoch": 3626} {"train_loss": -25.328088760375977, "global_step": 301019, "epoch": 3626} {"train_loss": -25.75201416015625, "global_step": 301020, "epoch": 3626} {"train_loss": -25.44212532043457, "global_step": 301021, "epoch": 3626} {"train_loss": -25.31599235534668, "global_step": 301022, "epoch": 3626} {"train_loss": -25.285951614379883, "global_step": 301023, "epoch": 3626} {"train_loss": -25.430234909057617, "global_step": 301024, "epoch": 3626} {"train_loss": -25.429096221923828, "global_step": 301025, "epoch": 3626} {"train_loss": -25.23066520690918, "global_step": 301026, "epoch": 3626} {"train_loss": -25.07306480407715, "global_step": 301027, "epoch": 3626} {"train_loss": -25.52781105041504, "global_step": 301028, "epoch": 3626} {"train_loss": -25.351957321166992, "global_step": 301029, "epoch": 3626} {"train_loss": -25.26458740234375, "global_step": 301030, "epoch": 3626} {"train_loss": -25.50202751159668, "global_step": 301031, "epoch": 3626} {"train_loss": -25.58268928527832, "global_step": 301032, "epoch": 3626} {"train_loss": -25.975040435791016, "global_step": 301033, "epoch": 3626} {"train_loss": -25.498027801513672, "global_step": 301034, "epoch": 3626} {"train_loss": -25.89118766784668, "global_step": 301035, "epoch": 3626} {"train_loss": -25.514476776123047, "global_step": 301036, "epoch": 3626} {"train_loss": -25.31215476989746, "global_step": 301037, "epoch": 3626} {"train_loss": -25.653411865234375, "global_step": 301038, "epoch": 3626} {"train_loss": -25.603561401367188, "global_step": 301039, "epoch": 3626} {"train_loss": -25.018731059798274, "global_step": 301040, "epoch": 3626, "val_loss": 7067262.5} {"train_loss": -24.820051193237305, "global_step": 301041, "epoch": 3627} {"train_loss": -25.10761070251465, "global_step": 301042, "epoch": 3627} {"train_loss": -24.910184860229492, "global_step": 301043, "epoch": 3627} {"train_loss": -25.222261428833008, "global_step": 301044, "epoch": 3627} {"train_loss": -25.165935516357422, "global_step": 301045, "epoch": 3627} {"train_loss": -24.76519775390625, "global_step": 301046, "epoch": 3627} {"train_loss": -25.070920944213867, "global_step": 301047, "epoch": 3627} {"train_loss": -24.977384567260742, "global_step": 301048, "epoch": 3627} {"train_loss": -25.10023307800293, "global_step": 301049, "epoch": 3627} {"train_loss": -25.382984161376953, "global_step": 301050, "epoch": 3627} {"train_loss": -24.92640495300293, "global_step": 301051, "epoch": 3627} {"train_loss": -25.29865837097168, "global_step": 301052, "epoch": 3627} {"train_loss": -25.02451515197754, "global_step": 301053, "epoch": 3627} {"train_loss": -25.204633712768555, "global_step": 301054, "epoch": 3627} {"train_loss": -25.20967674255371, "global_step": 301055, "epoch": 3627} {"train_loss": -25.073301315307617, "global_step": 301056, "epoch": 3627} {"train_loss": -25.54159927368164, "global_step": 301057, "epoch": 3627} {"train_loss": -25.68653678894043, "global_step": 301058, "epoch": 3627} {"train_loss": -25.54994010925293, "global_step": 301059, "epoch": 3627} {"train_loss": -25.617895126342773, "global_step": 301060, "epoch": 3627} {"train_loss": -25.022216796875, "global_step": 301061, "epoch": 3627} {"train_loss": -25.180524826049805, "global_step": 301062, "epoch": 3627} {"train_loss": -25.292261123657227, "global_step": 301063, "epoch": 3627} {"train_loss": -25.472291946411133, "global_step": 301064, "epoch": 3627} {"train_loss": -25.37140464782715, "global_step": 301065, "epoch": 3627} {"train_loss": -25.40359878540039, "global_step": 301066, "epoch": 3627} {"train_loss": -25.844104766845703, "global_step": 301067, "epoch": 3627} {"train_loss": -25.738361358642578, "global_step": 301068, "epoch": 3627} {"train_loss": -26.0754337310791, "global_step": 301069, "epoch": 3627} {"train_loss": -25.56499481201172, "global_step": 301070, "epoch": 3627} {"train_loss": -25.390233993530273, "global_step": 301071, "epoch": 3627} {"train_loss": -25.381446838378906, "global_step": 301072, "epoch": 3627} {"train_loss": -25.65729331970215, "global_step": 301073, "epoch": 3627} {"train_loss": -25.782211303710938, "global_step": 301074, "epoch": 3627} {"train_loss": -25.62555503845215, "global_step": 301075, "epoch": 3627} {"train_loss": -25.631362915039062, "global_step": 301076, "epoch": 3627} {"train_loss": -25.47909927368164, "global_step": 301077, "epoch": 3627} {"train_loss": -25.56770896911621, "global_step": 301078, "epoch": 3627} {"train_loss": -25.674467086791992, "global_step": 301079, "epoch": 3627} {"train_loss": -25.314558029174805, "global_step": 301080, "epoch": 3627} {"train_loss": -25.52730369567871, "global_step": 301081, "epoch": 3627} {"train_loss": -25.43739128112793, "global_step": 301082, "epoch": 3627} {"train_loss": -25.751239776611328, "global_step": 301083, "epoch": 3627} {"train_loss": -25.1174259185791, "global_step": 301084, "epoch": 3627} {"train_loss": -25.631214141845703, "global_step": 301085, "epoch": 3627} {"train_loss": -25.304285049438477, "global_step": 301086, "epoch": 3627} {"train_loss": -25.564315795898438, "global_step": 301087, "epoch": 3627} {"train_loss": -25.41730308532715, "global_step": 301088, "epoch": 3627} {"train_loss": -25.7034854888916, "global_step": 301089, "epoch": 3627} {"train_loss": -25.71596336364746, "global_step": 301090, "epoch": 3627} {"train_loss": -25.540279388427734, "global_step": 301091, "epoch": 3627} {"train_loss": -25.456939697265625, "global_step": 301092, "epoch": 3627} {"train_loss": -25.527881622314453, "global_step": 301093, "epoch": 3627} {"train_loss": -25.934579849243164, "global_step": 301094, "epoch": 3627} {"train_loss": -25.629446029663086, "global_step": 301095, "epoch": 3627} {"train_loss": -25.7100887298584, "global_step": 301096, "epoch": 3627} {"train_loss": -25.859241485595703, "global_step": 301097, "epoch": 3627} {"train_loss": -25.873764038085938, "global_step": 301098, "epoch": 3627} {"train_loss": -26.044294357299805, "global_step": 301099, "epoch": 3627} {"train_loss": -25.689016342163086, "global_step": 301100, "epoch": 3627} {"train_loss": -25.91269302368164, "global_step": 301101, "epoch": 3627} {"train_loss": -25.454320907592773, "global_step": 301102, "epoch": 3627} {"train_loss": -25.494361877441406, "global_step": 301103, "epoch": 3627} {"train_loss": -25.409324645996094, "global_step": 301104, "epoch": 3627} {"train_loss": -25.644128799438477, "global_step": 301105, "epoch": 3627} {"train_loss": -25.6693115234375, "global_step": 301106, "epoch": 3627} {"train_loss": -25.74072265625, "global_step": 301107, "epoch": 3627} {"train_loss": -25.55524253845215, "global_step": 301108, "epoch": 3627} {"train_loss": -25.7464542388916, "global_step": 301109, "epoch": 3627} {"train_loss": -25.6047420501709, "global_step": 301110, "epoch": 3627} {"train_loss": -25.9921817779541, "global_step": 301111, "epoch": 3627} {"train_loss": -25.981098175048828, "global_step": 301112, "epoch": 3627} {"train_loss": -25.2866268157959, "global_step": 301113, "epoch": 3627} {"train_loss": -25.8212890625, "global_step": 301114, "epoch": 3627} {"train_loss": -25.644779205322266, "global_step": 301115, "epoch": 3627} {"train_loss": -25.7786808013916, "global_step": 301116, "epoch": 3627} {"train_loss": -25.92388916015625, "global_step": 301117, "epoch": 3627} {"train_loss": -25.861669540405273, "global_step": 301118, "epoch": 3627} {"train_loss": -26.010351181030273, "global_step": 301119, "epoch": 3627} {"train_loss": -26.08490562438965, "global_step": 301120, "epoch": 3627} {"train_loss": -25.499046325683594, "global_step": 301121, "epoch": 3627} {"train_loss": -26.16779136657715, "global_step": 301122, "epoch": 3627} {"train_loss": -25.511043043021697, "global_step": 301123, "epoch": 3627, "val_loss": 7203217.5} {"train_loss": -24.42799949645996, "global_step": 301124, "epoch": 3628} {"train_loss": -24.9985408782959, "global_step": 301125, "epoch": 3628} {"train_loss": -25.03720474243164, "global_step": 301126, "epoch": 3628} {"train_loss": -24.952646255493164, "global_step": 301127, "epoch": 3628} {"train_loss": -25.222288131713867, "global_step": 301128, "epoch": 3628} {"train_loss": -25.233976364135742, "global_step": 301129, "epoch": 3628} {"train_loss": -25.573627471923828, "global_step": 301130, "epoch": 3628} {"train_loss": -25.331878662109375, "global_step": 301131, "epoch": 3628} {"train_loss": -25.188520431518555, "global_step": 301132, "epoch": 3628} {"train_loss": -25.139272689819336, "global_step": 301133, "epoch": 3628} {"train_loss": -25.30294418334961, "global_step": 301134, "epoch": 3628} {"train_loss": -25.21632194519043, "global_step": 301135, "epoch": 3628} {"train_loss": -25.15992546081543, "global_step": 301136, "epoch": 3628} {"train_loss": -25.6248836517334, "global_step": 301137, "epoch": 3628} {"train_loss": -25.166147232055664, "global_step": 301138, "epoch": 3628} {"train_loss": -25.416561126708984, "global_step": 301139, "epoch": 3628} {"train_loss": -24.9564266204834, "global_step": 301140, "epoch": 3628} {"train_loss": -25.388948440551758, "global_step": 301141, "epoch": 3628} {"train_loss": -24.938356399536133, "global_step": 301142, "epoch": 3628} {"train_loss": -25.45332145690918, "global_step": 301143, "epoch": 3628} {"train_loss": -25.2523193359375, "global_step": 301144, "epoch": 3628} {"train_loss": -25.466123580932617, "global_step": 301145, "epoch": 3628} {"train_loss": -25.164146423339844, "global_step": 301146, "epoch": 3628} {"train_loss": -25.426237106323242, "global_step": 301147, "epoch": 3628} {"train_loss": -25.09819984436035, "global_step": 301148, "epoch": 3628} {"train_loss": -25.738611221313477, "global_step": 301149, "epoch": 3628} {"train_loss": -25.407958984375, "global_step": 301150, "epoch": 3628} {"train_loss": -25.258291244506836, "global_step": 301151, "epoch": 3628} {"train_loss": -25.442529678344727, "global_step": 301152, "epoch": 3628} {"train_loss": -26.032861709594727, "global_step": 301153, "epoch": 3628} {"train_loss": -25.7228946685791, "global_step": 301154, "epoch": 3628} {"train_loss": -25.80845069885254, "global_step": 301155, "epoch": 3628} {"train_loss": -25.488800048828125, "global_step": 301156, "epoch": 3628} {"train_loss": -26.0137996673584, "global_step": 301157, "epoch": 3628} {"train_loss": -25.642667770385742, "global_step": 301158, "epoch": 3628} {"train_loss": -25.470684051513672, "global_step": 301159, "epoch": 3628} {"train_loss": -25.627838134765625, "global_step": 301160, "epoch": 3628} {"train_loss": -25.261037826538086, "global_step": 301161, "epoch": 3628} {"train_loss": -25.530651092529297, "global_step": 301162, "epoch": 3628} {"train_loss": -25.476673126220703, "global_step": 301163, "epoch": 3628} {"train_loss": -25.22857093811035, "global_step": 301164, "epoch": 3628} {"train_loss": -25.39255714416504, "global_step": 301165, "epoch": 3628} {"train_loss": -25.718313217163086, "global_step": 301166, "epoch": 3628} {"train_loss": -25.964975357055664, "global_step": 301167, "epoch": 3628} {"train_loss": -25.834033966064453, "global_step": 301168, "epoch": 3628} {"train_loss": -25.51362419128418, "global_step": 301169, "epoch": 3628} {"train_loss": -25.578481674194336, "global_step": 301170, "epoch": 3628} {"train_loss": -25.479976654052734, "global_step": 301171, "epoch": 3628} {"train_loss": -25.869924545288086, "global_step": 301172, "epoch": 3628} {"train_loss": -25.8211727142334, "global_step": 301173, "epoch": 3628} {"train_loss": -25.879648208618164, "global_step": 301174, "epoch": 3628} {"train_loss": -25.80771255493164, "global_step": 301175, "epoch": 3628} {"train_loss": -25.9536190032959, "global_step": 301176, "epoch": 3628} {"train_loss": -26.04920768737793, "global_step": 301177, "epoch": 3628} {"train_loss": -25.92140769958496, "global_step": 301178, "epoch": 3628} {"train_loss": -25.445859909057617, "global_step": 301179, "epoch": 3628} {"train_loss": -25.577661514282227, "global_step": 301180, "epoch": 3628} {"train_loss": -25.871173858642578, "global_step": 301181, "epoch": 3628} {"train_loss": -25.487791061401367, "global_step": 301182, "epoch": 3628} {"train_loss": -25.92542839050293, "global_step": 301183, "epoch": 3628} {"train_loss": -25.6925048828125, "global_step": 301184, "epoch": 3628} {"train_loss": -25.78840446472168, "global_step": 301185, "epoch": 3628} {"train_loss": -25.814538955688477, "global_step": 301186, "epoch": 3628} {"train_loss": -25.695972442626953, "global_step": 301187, "epoch": 3628} {"train_loss": -25.879438400268555, "global_step": 301188, "epoch": 3628} {"train_loss": -25.613882064819336, "global_step": 301189, "epoch": 3628} {"train_loss": -25.33650016784668, "global_step": 301190, "epoch": 3628} {"train_loss": -25.63666343688965, "global_step": 301191, "epoch": 3628} {"train_loss": -25.87188720703125, "global_step": 301192, "epoch": 3628} {"train_loss": -25.683130264282227, "global_step": 301193, "epoch": 3628} {"train_loss": -25.780548095703125, "global_step": 301194, "epoch": 3628} {"train_loss": -25.85733985900879, "global_step": 301195, "epoch": 3628} {"train_loss": -25.7127742767334, "global_step": 301196, "epoch": 3628} {"train_loss": -25.722776412963867, "global_step": 301197, "epoch": 3628} {"train_loss": -25.680561065673828, "global_step": 301198, "epoch": 3628} {"train_loss": -25.632837295532227, "global_step": 301199, "epoch": 3628} {"train_loss": -25.470027923583984, "global_step": 301200, "epoch": 3628} {"train_loss": -26.00380516052246, "global_step": 301201, "epoch": 3628} {"train_loss": -25.617359161376953, "global_step": 301202, "epoch": 3628} {"train_loss": -25.672754287719727, "global_step": 301203, "epoch": 3628} {"train_loss": -25.628393173217773, "global_step": 301204, "epoch": 3628} {"train_loss": -25.86799430847168, "global_step": 301205, "epoch": 3628} {"train_loss": -25.54447107429964, "global_step": 301206, "epoch": 3628, "val_loss": 7481993.0} {"train_loss": -24.42140007019043, "global_step": 301207, "epoch": 3629} {"train_loss": -24.31928062438965, "global_step": 301208, "epoch": 3629} {"train_loss": -24.80537986755371, "global_step": 301209, "epoch": 3629} {"train_loss": -23.819875717163086, "global_step": 301210, "epoch": 3629} {"train_loss": -24.736095428466797, "global_step": 301211, "epoch": 3629} {"train_loss": -24.52332878112793, "global_step": 301212, "epoch": 3629} {"train_loss": -24.544754028320312, "global_step": 301213, "epoch": 3629} {"train_loss": -24.86090660095215, "global_step": 301214, "epoch": 3629} {"train_loss": -25.0321102142334, "global_step": 301215, "epoch": 3629} {"train_loss": -24.66771125793457, "global_step": 301216, "epoch": 3629} {"train_loss": -25.543922424316406, "global_step": 301217, "epoch": 3629} {"train_loss": -24.977100372314453, "global_step": 301218, "epoch": 3629} {"train_loss": -24.829254150390625, "global_step": 301219, "epoch": 3629} {"train_loss": -24.74030303955078, "global_step": 301220, "epoch": 3629} {"train_loss": -25.134387969970703, "global_step": 301221, "epoch": 3629} {"train_loss": -25.019943237304688, "global_step": 301222, "epoch": 3629} {"train_loss": -25.397724151611328, "global_step": 301223, "epoch": 3629} {"train_loss": -25.416101455688477, "global_step": 301224, "epoch": 3629} {"train_loss": -25.141010284423828, "global_step": 301225, "epoch": 3629} {"train_loss": -25.204166412353516, "global_step": 301226, "epoch": 3629} {"train_loss": -24.745817184448242, "global_step": 301227, "epoch": 3629} {"train_loss": -25.83078384399414, "global_step": 301228, "epoch": 3629} {"train_loss": -25.137069702148438, "global_step": 301229, "epoch": 3629} {"train_loss": -25.447376251220703, "global_step": 301230, "epoch": 3629} {"train_loss": -25.582347869873047, "global_step": 301231, "epoch": 3629} {"train_loss": -24.861648559570312, "global_step": 301232, "epoch": 3629} {"train_loss": -25.58540153503418, "global_step": 301233, "epoch": 3629} {"train_loss": -25.596281051635742, "global_step": 301234, "epoch": 3629} {"train_loss": -25.53255271911621, "global_step": 301235, "epoch": 3629} {"train_loss": -25.590234756469727, "global_step": 301236, "epoch": 3629} {"train_loss": -25.63688087463379, "global_step": 301237, "epoch": 3629} {"train_loss": -25.680490493774414, "global_step": 301238, "epoch": 3629} {"train_loss": -25.674697875976562, "global_step": 301239, "epoch": 3629} {"train_loss": -25.606231689453125, "global_step": 301240, "epoch": 3629} {"train_loss": -25.734594345092773, "global_step": 301241, "epoch": 3629} {"train_loss": -26.029266357421875, "global_step": 301242, "epoch": 3629} {"train_loss": -25.735315322875977, "global_step": 301243, "epoch": 3629} {"train_loss": -25.615766525268555, "global_step": 301244, "epoch": 3629} {"train_loss": -25.80517578125, "global_step": 301245, "epoch": 3629} {"train_loss": -25.737995147705078, "global_step": 301246, "epoch": 3629} {"train_loss": -26.060047149658203, "global_step": 301247, "epoch": 3629} {"train_loss": -26.1060791015625, "global_step": 301248, "epoch": 3629} {"train_loss": -25.55988883972168, "global_step": 301249, "epoch": 3629} {"train_loss": -25.693164825439453, "global_step": 301250, "epoch": 3629} {"train_loss": -25.693988800048828, "global_step": 301251, "epoch": 3629} {"train_loss": -25.773426055908203, "global_step": 301252, "epoch": 3629} {"train_loss": -25.824588775634766, "global_step": 301253, "epoch": 3629} {"train_loss": -25.76922607421875, "global_step": 301254, "epoch": 3629} {"train_loss": -25.909265518188477, "global_step": 301255, "epoch": 3629} {"train_loss": -25.462812423706055, "global_step": 301256, "epoch": 3629} {"train_loss": -26.074628829956055, "global_step": 301257, "epoch": 3629} {"train_loss": -25.702428817749023, "global_step": 301258, "epoch": 3629} {"train_loss": -26.028705596923828, "global_step": 301259, "epoch": 3629} {"train_loss": -25.908796310424805, "global_step": 301260, "epoch": 3629} {"train_loss": -25.877634048461914, "global_step": 301261, "epoch": 3629} {"train_loss": -25.914459228515625, "global_step": 301262, "epoch": 3629} {"train_loss": -25.656574249267578, "global_step": 301263, "epoch": 3629} {"train_loss": -25.68079948425293, "global_step": 301264, "epoch": 3629} {"train_loss": -25.25376319885254, "global_step": 301265, "epoch": 3629} {"train_loss": -25.517183303833008, "global_step": 301266, "epoch": 3629} {"train_loss": -25.10471534729004, "global_step": 301267, "epoch": 3629} {"train_loss": -25.42995262145996, "global_step": 301268, "epoch": 3629} {"train_loss": -24.821258544921875, "global_step": 301269, "epoch": 3629} {"train_loss": -25.349111557006836, "global_step": 301270, "epoch": 3629} {"train_loss": -25.524620056152344, "global_step": 301271, "epoch": 3629} {"train_loss": -25.42630386352539, "global_step": 301272, "epoch": 3629} {"train_loss": -25.746856689453125, "global_step": 301273, "epoch": 3629} {"train_loss": -25.460901260375977, "global_step": 301274, "epoch": 3629} {"train_loss": -25.494733810424805, "global_step": 301275, "epoch": 3629} {"train_loss": -25.76853370666504, "global_step": 301276, "epoch": 3629} {"train_loss": -25.39399528503418, "global_step": 301277, "epoch": 3629} {"train_loss": -25.48569107055664, "global_step": 301278, "epoch": 3629} {"train_loss": -25.92191505432129, "global_step": 301279, "epoch": 3629} {"train_loss": -25.79014015197754, "global_step": 301280, "epoch": 3629} {"train_loss": -25.392484664916992, "global_step": 301281, "epoch": 3629} {"train_loss": -25.86859703063965, "global_step": 301282, "epoch": 3629} {"train_loss": -25.088632583618164, "global_step": 301283, "epoch": 3629} {"train_loss": -25.561742782592773, "global_step": 301284, "epoch": 3629} {"train_loss": -25.46992301940918, "global_step": 301285, "epoch": 3629} {"train_loss": -25.575437545776367, "global_step": 301286, "epoch": 3629} {"train_loss": -25.53717613220215, "global_step": 301287, "epoch": 3629} {"train_loss": -25.412778854370117, "global_step": 301288, "epoch": 3629} {"train_loss": -25.402512286082807, "global_step": 301289, "epoch": 3629, "val_loss": 7170045.0} {"train_loss": -25.40435218811035, "global_step": 301290, "epoch": 3630} {"train_loss": -24.243873596191406, "global_step": 301291, "epoch": 3630} {"train_loss": -25.274072647094727, "global_step": 301292, "epoch": 3630} {"train_loss": -25.0184268951416, "global_step": 301293, "epoch": 3630} {"train_loss": -24.864221572875977, "global_step": 301294, "epoch": 3630} {"train_loss": -24.86768341064453, "global_step": 301295, "epoch": 3630} {"train_loss": -25.100400924682617, "global_step": 301296, "epoch": 3630} {"train_loss": -25.462806701660156, "global_step": 301297, "epoch": 3630} {"train_loss": -25.709264755249023, "global_step": 301298, "epoch": 3630} {"train_loss": -24.9697322845459, "global_step": 301299, "epoch": 3630} {"train_loss": -25.415441513061523, "global_step": 301300, "epoch": 3630} {"train_loss": -24.982160568237305, "global_step": 301301, "epoch": 3630} {"train_loss": -25.52280044555664, "global_step": 301302, "epoch": 3630} {"train_loss": -25.271915435791016, "global_step": 301303, "epoch": 3630} {"train_loss": -25.320585250854492, "global_step": 301304, "epoch": 3630} {"train_loss": -25.547086715698242, "global_step": 301305, "epoch": 3630} {"train_loss": -25.54267692565918, "global_step": 301306, "epoch": 3630} {"train_loss": -25.44452476501465, "global_step": 301307, "epoch": 3630} {"train_loss": -25.537906646728516, "global_step": 301308, "epoch": 3630} {"train_loss": -25.49741554260254, "global_step": 301309, "epoch": 3630} {"train_loss": -25.377201080322266, "global_step": 301310, "epoch": 3630} {"train_loss": -25.688093185424805, "global_step": 301311, "epoch": 3630} {"train_loss": -25.564783096313477, "global_step": 301312, "epoch": 3630} {"train_loss": -25.310407638549805, "global_step": 301313, "epoch": 3630} {"train_loss": -25.616758346557617, "global_step": 301314, "epoch": 3630} {"train_loss": -25.496326446533203, "global_step": 301315, "epoch": 3630} {"train_loss": -25.722827911376953, "global_step": 301316, "epoch": 3630} {"train_loss": -25.78000259399414, "global_step": 301317, "epoch": 3630} {"train_loss": -25.445783615112305, "global_step": 301318, "epoch": 3630} {"train_loss": -25.698287963867188, "global_step": 301319, "epoch": 3630} {"train_loss": -25.688114166259766, "global_step": 301320, "epoch": 3630} {"train_loss": -25.827173233032227, "global_step": 301321, "epoch": 3630} {"train_loss": -25.46135711669922, "global_step": 301322, "epoch": 3630} {"train_loss": -25.77068519592285, "global_step": 301323, "epoch": 3630} {"train_loss": -25.87590980529785, "global_step": 301324, "epoch": 3630} {"train_loss": -25.860767364501953, "global_step": 301325, "epoch": 3630} {"train_loss": -25.773603439331055, "global_step": 301326, "epoch": 3630} {"train_loss": -25.855634689331055, "global_step": 301327, "epoch": 3630} {"train_loss": -26.154998779296875, "global_step": 301328, "epoch": 3630} {"train_loss": -25.85751724243164, "global_step": 301329, "epoch": 3630} {"train_loss": -25.382095336914062, "global_step": 301330, "epoch": 3630} {"train_loss": -25.928226470947266, "global_step": 301331, "epoch": 3630} {"train_loss": -25.812301635742188, "global_step": 301332, "epoch": 3630} {"train_loss": -25.402746200561523, "global_step": 301333, "epoch": 3630} {"train_loss": -25.7476806640625, "global_step": 301334, "epoch": 3630} {"train_loss": -25.598819732666016, "global_step": 301335, "epoch": 3630} {"train_loss": -25.474267959594727, "global_step": 301336, "epoch": 3630} {"train_loss": -25.281326293945312, "global_step": 301337, "epoch": 3630} {"train_loss": -25.00300407409668, "global_step": 301338, "epoch": 3630} {"train_loss": -24.11004638671875, "global_step": 301339, "epoch": 3630} {"train_loss": -24.40511131286621, "global_step": 301340, "epoch": 3630} {"train_loss": -25.176651000976562, "global_step": 301341, "epoch": 3630} {"train_loss": -25.030622482299805, "global_step": 301342, "epoch": 3630} {"train_loss": -24.75007438659668, "global_step": 301343, "epoch": 3630} {"train_loss": -25.48681640625, "global_step": 301344, "epoch": 3630} {"train_loss": -25.202898025512695, "global_step": 301345, "epoch": 3630} {"train_loss": -25.472084045410156, "global_step": 301346, "epoch": 3630} {"train_loss": -25.32785415649414, "global_step": 301347, "epoch": 3630} {"train_loss": -24.404813766479492, "global_step": 301348, "epoch": 3630} {"train_loss": -25.482263565063477, "global_step": 301349, "epoch": 3630} {"train_loss": -24.78683853149414, "global_step": 301350, "epoch": 3630} {"train_loss": -25.504430770874023, "global_step": 301351, "epoch": 3630} {"train_loss": -25.22256851196289, "global_step": 301352, "epoch": 3630} {"train_loss": -25.752538681030273, "global_step": 301353, "epoch": 3630} {"train_loss": -25.288082122802734, "global_step": 301354, "epoch": 3630} {"train_loss": -25.6087589263916, "global_step": 301355, "epoch": 3630} {"train_loss": -25.410900115966797, "global_step": 301356, "epoch": 3630} {"train_loss": -25.04530143737793, "global_step": 301357, "epoch": 3630} {"train_loss": -25.67305564880371, "global_step": 301358, "epoch": 3630} {"train_loss": -25.764806747436523, "global_step": 301359, "epoch": 3630} {"train_loss": -25.331071853637695, "global_step": 301360, "epoch": 3630} {"train_loss": -25.840600967407227, "global_step": 301361, "epoch": 3630} {"train_loss": -25.137182235717773, "global_step": 301362, "epoch": 3630} {"train_loss": -25.547136306762695, "global_step": 301363, "epoch": 3630} {"train_loss": -25.273040771484375, "global_step": 301364, "epoch": 3630} {"train_loss": -25.509654998779297, "global_step": 301365, "epoch": 3630} {"train_loss": -25.540311813354492, "global_step": 301366, "epoch": 3630} {"train_loss": -25.432132720947266, "global_step": 301367, "epoch": 3630} {"train_loss": -25.338844299316406, "global_step": 301368, "epoch": 3630} {"train_loss": -25.607553482055664, "global_step": 301369, "epoch": 3630} {"train_loss": -25.794208526611328, "global_step": 301370, "epoch": 3630} {"train_loss": -26.103796005249023, "global_step": 301371, "epoch": 3630} {"train_loss": -25.411963796041096, "global_step": 301372, "epoch": 3630, "val_loss": 7215016.0} {"train_loss": -24.731809616088867, "global_step": 301373, "epoch": 3631} {"train_loss": -24.87386131286621, "global_step": 301374, "epoch": 3631} {"train_loss": -25.28830337524414, "global_step": 301375, "epoch": 3631} {"train_loss": -25.07447624206543, "global_step": 301376, "epoch": 3631} {"train_loss": -25.299673080444336, "global_step": 301377, "epoch": 3631} {"train_loss": -25.045547485351562, "global_step": 301378, "epoch": 3631} {"train_loss": -24.712236404418945, "global_step": 301379, "epoch": 3631} {"train_loss": -24.995126724243164, "global_step": 301380, "epoch": 3631} {"train_loss": -25.27524757385254, "global_step": 301381, "epoch": 3631} {"train_loss": -24.887680053710938, "global_step": 301382, "epoch": 3631} {"train_loss": -25.09665870666504, "global_step": 301383, "epoch": 3631} {"train_loss": -25.050851821899414, "global_step": 301384, "epoch": 3631} {"train_loss": -25.33415412902832, "global_step": 301385, "epoch": 3631} {"train_loss": -25.337081909179688, "global_step": 301386, "epoch": 3631} {"train_loss": -25.346233367919922, "global_step": 301387, "epoch": 3631} {"train_loss": -25.414691925048828, "global_step": 301388, "epoch": 3631} {"train_loss": -25.28175926208496, "global_step": 301389, "epoch": 3631} {"train_loss": -25.627683639526367, "global_step": 301390, "epoch": 3631} {"train_loss": -25.488956451416016, "global_step": 301391, "epoch": 3631} {"train_loss": -25.68505859375, "global_step": 301392, "epoch": 3631} {"train_loss": -25.114978790283203, "global_step": 301393, "epoch": 3631} {"train_loss": -25.719409942626953, "global_step": 301394, "epoch": 3631} {"train_loss": -25.466583251953125, "global_step": 301395, "epoch": 3631} {"train_loss": -25.6909236907959, "global_step": 301396, "epoch": 3631} {"train_loss": -25.46978759765625, "global_step": 301397, "epoch": 3631} {"train_loss": -25.445430755615234, "global_step": 301398, "epoch": 3631} {"train_loss": -25.591655731201172, "global_step": 301399, "epoch": 3631} {"train_loss": -25.7862606048584, "global_step": 301400, "epoch": 3631} {"train_loss": -25.152023315429688, "global_step": 301401, "epoch": 3631} {"train_loss": -25.8424129486084, "global_step": 301402, "epoch": 3631} {"train_loss": -25.744464874267578, "global_step": 301403, "epoch": 3631} {"train_loss": -25.43862533569336, "global_step": 301404, "epoch": 3631} {"train_loss": -25.799274444580078, "global_step": 301405, "epoch": 3631} {"train_loss": -25.523855209350586, "global_step": 301406, "epoch": 3631} {"train_loss": -25.8243465423584, "global_step": 301407, "epoch": 3631} {"train_loss": -25.627904891967773, "global_step": 301408, "epoch": 3631} {"train_loss": -25.808765411376953, "global_step": 301409, "epoch": 3631} {"train_loss": -26.27076530456543, "global_step": 301410, "epoch": 3631} {"train_loss": -25.86279296875, "global_step": 301411, "epoch": 3631} {"train_loss": -26.08758544921875, "global_step": 301412, "epoch": 3631} {"train_loss": -25.623144149780273, "global_step": 301413, "epoch": 3631} {"train_loss": -26.02260398864746, "global_step": 301414, "epoch": 3631} {"train_loss": -25.7110652923584, "global_step": 301415, "epoch": 3631} {"train_loss": -26.007740020751953, "global_step": 301416, "epoch": 3631} {"train_loss": -26.014667510986328, "global_step": 301417, "epoch": 3631} {"train_loss": -25.745344161987305, "global_step": 301418, "epoch": 3631} {"train_loss": -25.964330673217773, "global_step": 301419, "epoch": 3631} {"train_loss": -25.39364242553711, "global_step": 301420, "epoch": 3631} {"train_loss": -26.105823516845703, "global_step": 301421, "epoch": 3631} {"train_loss": -25.307815551757812, "global_step": 301422, "epoch": 3631} {"train_loss": -25.834604263305664, "global_step": 301423, "epoch": 3631} {"train_loss": -25.730255126953125, "global_step": 301424, "epoch": 3631} {"train_loss": -25.860736846923828, "global_step": 301425, "epoch": 3631} {"train_loss": -25.882007598876953, "global_step": 301426, "epoch": 3631} {"train_loss": -25.437910079956055, "global_step": 301427, "epoch": 3631} {"train_loss": -25.732995986938477, "global_step": 301428, "epoch": 3631} {"train_loss": -25.865758895874023, "global_step": 301429, "epoch": 3631} {"train_loss": -25.37016487121582, "global_step": 301430, "epoch": 3631} {"train_loss": -25.51812744140625, "global_step": 301431, "epoch": 3631} {"train_loss": -25.098691940307617, "global_step": 301432, "epoch": 3631} {"train_loss": -25.594768524169922, "global_step": 301433, "epoch": 3631} {"train_loss": -25.67868423461914, "global_step": 301434, "epoch": 3631} {"train_loss": -25.77069091796875, "global_step": 301435, "epoch": 3631} {"train_loss": -25.996923446655273, "global_step": 301436, "epoch": 3631} {"train_loss": -25.570358276367188, "global_step": 301437, "epoch": 3631} {"train_loss": -25.59547996520996, "global_step": 301438, "epoch": 3631} {"train_loss": -25.881549835205078, "global_step": 301439, "epoch": 3631} {"train_loss": -25.604766845703125, "global_step": 301440, "epoch": 3631} {"train_loss": -25.711286544799805, "global_step": 301441, "epoch": 3631} {"train_loss": -25.932098388671875, "global_step": 301442, "epoch": 3631} {"train_loss": -25.381750106811523, "global_step": 301443, "epoch": 3631} {"train_loss": -26.01336669921875, "global_step": 301444, "epoch": 3631} {"train_loss": -25.552772521972656, "global_step": 301445, "epoch": 3631} {"train_loss": -25.84168815612793, "global_step": 301446, "epoch": 3631} {"train_loss": -25.49643898010254, "global_step": 301447, "epoch": 3631} {"train_loss": -25.811925888061523, "global_step": 301448, "epoch": 3631} {"train_loss": -25.691226959228516, "global_step": 301449, "epoch": 3631} {"train_loss": -25.539796829223633, "global_step": 301450, "epoch": 3631} {"train_loss": -26.015287399291992, "global_step": 301451, "epoch": 3631} {"train_loss": -25.7861328125, "global_step": 301452, "epoch": 3631} {"train_loss": -25.488889694213867, "global_step": 301453, "epoch": 3631} {"train_loss": -25.622465133666992, "global_step": 301454, "epoch": 3631} {"train_loss": -25.597514600638885, "global_step": 301455, "epoch": 3631, "val_loss": 7143631.0} {"train_loss": -24.807044982910156, "global_step": 301456, "epoch": 3632} {"train_loss": -24.77992820739746, "global_step": 301457, "epoch": 3632} {"train_loss": -24.513141632080078, "global_step": 301458, "epoch": 3632} {"train_loss": -25.253280639648438, "global_step": 301459, "epoch": 3632} {"train_loss": -25.20323371887207, "global_step": 301460, "epoch": 3632} {"train_loss": -25.104108810424805, "global_step": 301461, "epoch": 3632} {"train_loss": -25.01727294921875, "global_step": 301462, "epoch": 3632} {"train_loss": -25.195920944213867, "global_step": 301463, "epoch": 3632} {"train_loss": -25.513500213623047, "global_step": 301464, "epoch": 3632} {"train_loss": -25.386686325073242, "global_step": 301465, "epoch": 3632} {"train_loss": -25.279020309448242, "global_step": 301466, "epoch": 3632} {"train_loss": -25.466840744018555, "global_step": 301467, "epoch": 3632} {"train_loss": -25.783105850219727, "global_step": 301468, "epoch": 3632} {"train_loss": -25.403837203979492, "global_step": 301469, "epoch": 3632} {"train_loss": -25.691694259643555, "global_step": 301470, "epoch": 3632} {"train_loss": -25.740467071533203, "global_step": 301471, "epoch": 3632} {"train_loss": -25.87308692932129, "global_step": 301472, "epoch": 3632} {"train_loss": -25.69679832458496, "global_step": 301473, "epoch": 3632} {"train_loss": -25.50489616394043, "global_step": 301474, "epoch": 3632} {"train_loss": -25.596479415893555, "global_step": 301475, "epoch": 3632} {"train_loss": -25.585651397705078, "global_step": 301476, "epoch": 3632} {"train_loss": -25.970792770385742, "global_step": 301477, "epoch": 3632} {"train_loss": -25.4841365814209, "global_step": 301478, "epoch": 3632} {"train_loss": -25.64980125427246, "global_step": 301479, "epoch": 3632} {"train_loss": -25.84271812438965, "global_step": 301480, "epoch": 3632} {"train_loss": -25.755781173706055, "global_step": 301481, "epoch": 3632} {"train_loss": -25.58315086364746, "global_step": 301482, "epoch": 3632} {"train_loss": -25.784894943237305, "global_step": 301483, "epoch": 3632} {"train_loss": -25.68134117126465, "global_step": 301484, "epoch": 3632} {"train_loss": -25.929046630859375, "global_step": 301485, "epoch": 3632} {"train_loss": -25.425657272338867, "global_step": 301486, "epoch": 3632} {"train_loss": -25.91509437561035, "global_step": 301487, "epoch": 3632} {"train_loss": -25.49074363708496, "global_step": 301488, "epoch": 3632} {"train_loss": -25.605894088745117, "global_step": 301489, "epoch": 3632} {"train_loss": -26.148029327392578, "global_step": 301490, "epoch": 3632} {"train_loss": -25.47987937927246, "global_step": 301491, "epoch": 3632} {"train_loss": -25.903303146362305, "global_step": 301492, "epoch": 3632} {"train_loss": -25.534439086914062, "global_step": 301493, "epoch": 3632} {"train_loss": -25.8359432220459, "global_step": 301494, "epoch": 3632} {"train_loss": -25.512741088867188, "global_step": 301495, "epoch": 3632} {"train_loss": -25.4539852142334, "global_step": 301496, "epoch": 3632} {"train_loss": -25.404773712158203, "global_step": 301497, "epoch": 3632} {"train_loss": -25.717370986938477, "global_step": 301498, "epoch": 3632} {"train_loss": -25.805261611938477, "global_step": 301499, "epoch": 3632} {"train_loss": -25.3606014251709, "global_step": 301500, "epoch": 3632} {"train_loss": -25.499435424804688, "global_step": 301501, "epoch": 3632} {"train_loss": -25.56965446472168, "global_step": 301502, "epoch": 3632} {"train_loss": -25.256921768188477, "global_step": 301503, "epoch": 3632} {"train_loss": -26.092573165893555, "global_step": 301504, "epoch": 3632} {"train_loss": -25.780048370361328, "global_step": 301505, "epoch": 3632} {"train_loss": -25.362201690673828, "global_step": 301506, "epoch": 3632} {"train_loss": -25.63496208190918, "global_step": 301507, "epoch": 3632} {"train_loss": -25.762481689453125, "global_step": 301508, "epoch": 3632} {"train_loss": -25.508289337158203, "global_step": 301509, "epoch": 3632} {"train_loss": -25.91326904296875, "global_step": 301510, "epoch": 3632} {"train_loss": -25.912673950195312, "global_step": 301511, "epoch": 3632} {"train_loss": -26.2624568939209, "global_step": 301512, "epoch": 3632} {"train_loss": -24.9121150970459, "global_step": 301513, "epoch": 3632} {"train_loss": -25.668792724609375, "global_step": 301514, "epoch": 3632} {"train_loss": -25.205799102783203, "global_step": 301515, "epoch": 3632} {"train_loss": -25.651010513305664, "global_step": 301516, "epoch": 3632} {"train_loss": -25.68780517578125, "global_step": 301517, "epoch": 3632} {"train_loss": -25.806264877319336, "global_step": 301518, "epoch": 3632} {"train_loss": -25.64155387878418, "global_step": 301519, "epoch": 3632} {"train_loss": -25.616851806640625, "global_step": 301520, "epoch": 3632} {"train_loss": -25.72174644470215, "global_step": 301521, "epoch": 3632} {"train_loss": -25.84122657775879, "global_step": 301522, "epoch": 3632} {"train_loss": -25.730077743530273, "global_step": 301523, "epoch": 3632} {"train_loss": -25.571592330932617, "global_step": 301524, "epoch": 3632} {"train_loss": -25.646474838256836, "global_step": 301525, "epoch": 3632} {"train_loss": -25.661529541015625, "global_step": 301526, "epoch": 3632} {"train_loss": -25.259464263916016, "global_step": 301527, "epoch": 3632} {"train_loss": -25.980077743530273, "global_step": 301528, "epoch": 3632} {"train_loss": -25.472475051879883, "global_step": 301529, "epoch": 3632} {"train_loss": -25.65159034729004, "global_step": 301530, "epoch": 3632} {"train_loss": -25.339191436767578, "global_step": 301531, "epoch": 3632} {"train_loss": -25.417612075805664, "global_step": 301532, "epoch": 3632} {"train_loss": -25.149641036987305, "global_step": 301533, "epoch": 3632} {"train_loss": -25.54458999633789, "global_step": 301534, "epoch": 3632} {"train_loss": -25.890867233276367, "global_step": 301535, "epoch": 3632} {"train_loss": -25.475698471069336, "global_step": 301536, "epoch": 3632} {"train_loss": -26.0726261138916, "global_step": 301537, "epoch": 3632} {"train_loss": -25.567704763757177, "global_step": 301538, "epoch": 3632, "val_loss": 7222712.0} {"train_loss": -25.340579986572266, "global_step": 301539, "epoch": 3633} {"train_loss": -25.286779403686523, "global_step": 301540, "epoch": 3633} {"train_loss": -25.28248405456543, "global_step": 301541, "epoch": 3633} {"train_loss": -25.387359619140625, "global_step": 301542, "epoch": 3633} {"train_loss": -25.378936767578125, "global_step": 301543, "epoch": 3633} {"train_loss": -25.52292251586914, "global_step": 301544, "epoch": 3633} {"train_loss": -25.461368560791016, "global_step": 301545, "epoch": 3633} {"train_loss": -25.38600730895996, "global_step": 301546, "epoch": 3633} {"train_loss": -25.74159049987793, "global_step": 301547, "epoch": 3633} {"train_loss": -25.523557662963867, "global_step": 301548, "epoch": 3633} {"train_loss": -25.237722396850586, "global_step": 301549, "epoch": 3633} {"train_loss": -25.26429557800293, "global_step": 301550, "epoch": 3633} {"train_loss": -25.365564346313477, "global_step": 301551, "epoch": 3633} {"train_loss": -25.4814453125, "global_step": 301552, "epoch": 3633} {"train_loss": -25.4019775390625, "global_step": 301553, "epoch": 3633} {"train_loss": -25.175189971923828, "global_step": 301554, "epoch": 3633} {"train_loss": -26.024566650390625, "global_step": 301555, "epoch": 3633} {"train_loss": -25.6503849029541, "global_step": 301556, "epoch": 3633} {"train_loss": -25.501569747924805, "global_step": 301557, "epoch": 3633} {"train_loss": -25.4011173248291, "global_step": 301558, "epoch": 3633} {"train_loss": -25.54347801208496, "global_step": 301559, "epoch": 3633} {"train_loss": -25.861494064331055, "global_step": 301560, "epoch": 3633} {"train_loss": -25.838476181030273, "global_step": 301561, "epoch": 3633} {"train_loss": -25.73805809020996, "global_step": 301562, "epoch": 3633} {"train_loss": -25.76795768737793, "global_step": 301563, "epoch": 3633} {"train_loss": -25.666107177734375, "global_step": 301564, "epoch": 3633} {"train_loss": -25.686254501342773, "global_step": 301565, "epoch": 3633} {"train_loss": -25.781030654907227, "global_step": 301566, "epoch": 3633} {"train_loss": -25.85890007019043, "global_step": 301567, "epoch": 3633} {"train_loss": -25.75684928894043, "global_step": 301568, "epoch": 3633} {"train_loss": -25.837284088134766, "global_step": 301569, "epoch": 3633} {"train_loss": -25.8933048248291, "global_step": 301570, "epoch": 3633} {"train_loss": -25.277740478515625, "global_step": 301571, "epoch": 3633} {"train_loss": -25.185537338256836, "global_step": 301572, "epoch": 3633} {"train_loss": -25.719640731811523, "global_step": 301573, "epoch": 3633} {"train_loss": -26.038848876953125, "global_step": 301574, "epoch": 3633} {"train_loss": -26.115026473999023, "global_step": 301575, "epoch": 3633} {"train_loss": -25.96940040588379, "global_step": 301576, "epoch": 3633} {"train_loss": -25.75943374633789, "global_step": 301577, "epoch": 3633} {"train_loss": -25.719806671142578, "global_step": 301578, "epoch": 3633} {"train_loss": -25.526782989501953, "global_step": 301579, "epoch": 3633} {"train_loss": -25.62639808654785, "global_step": 301580, "epoch": 3633} {"train_loss": -25.9318904876709, "global_step": 301581, "epoch": 3633} {"train_loss": -25.626752853393555, "global_step": 301582, "epoch": 3633} {"train_loss": -25.724090576171875, "global_step": 301583, "epoch": 3633} {"train_loss": -25.635822296142578, "global_step": 301584, "epoch": 3633} {"train_loss": -25.71929359436035, "global_step": 301585, "epoch": 3633} {"train_loss": -25.971158981323242, "global_step": 301586, "epoch": 3633} {"train_loss": -25.5875186920166, "global_step": 301587, "epoch": 3633} {"train_loss": -25.628767013549805, "global_step": 301588, "epoch": 3633} {"train_loss": -25.818878173828125, "global_step": 301589, "epoch": 3633} {"train_loss": -25.604816436767578, "global_step": 301590, "epoch": 3633} {"train_loss": -25.99639320373535, "global_step": 301591, "epoch": 3633} {"train_loss": -25.692996978759766, "global_step": 301592, "epoch": 3633} {"train_loss": -25.526962280273438, "global_step": 301593, "epoch": 3633} {"train_loss": -25.587343215942383, "global_step": 301594, "epoch": 3633} {"train_loss": -25.920560836791992, "global_step": 301595, "epoch": 3633} {"train_loss": -25.68204689025879, "global_step": 301596, "epoch": 3633} {"train_loss": -25.420631408691406, "global_step": 301597, "epoch": 3633} {"train_loss": -25.762598037719727, "global_step": 301598, "epoch": 3633} {"train_loss": -25.663593292236328, "global_step": 301599, "epoch": 3633} {"train_loss": -25.970335006713867, "global_step": 301600, "epoch": 3633} {"train_loss": -25.75861167907715, "global_step": 301601, "epoch": 3633} {"train_loss": -25.548818588256836, "global_step": 301602, "epoch": 3633} {"train_loss": -26.195770263671875, "global_step": 301603, "epoch": 3633} {"train_loss": -25.75333595275879, "global_step": 301604, "epoch": 3633} {"train_loss": -25.714365005493164, "global_step": 301605, "epoch": 3633} {"train_loss": -25.54947280883789, "global_step": 301606, "epoch": 3633} {"train_loss": -25.681671142578125, "global_step": 301607, "epoch": 3633} {"train_loss": -25.62965202331543, "global_step": 301608, "epoch": 3633} {"train_loss": -25.882049560546875, "global_step": 301609, "epoch": 3633} {"train_loss": -25.911706924438477, "global_step": 301610, "epoch": 3633} {"train_loss": -25.679534912109375, "global_step": 301611, "epoch": 3633} {"train_loss": -25.733930587768555, "global_step": 301612, "epoch": 3633} {"train_loss": -25.608814239501953, "global_step": 301613, "epoch": 3633} {"train_loss": -25.323545455932617, "global_step": 301614, "epoch": 3633} {"train_loss": -25.932828903198242, "global_step": 301615, "epoch": 3633} {"train_loss": -25.508325576782227, "global_step": 301616, "epoch": 3633} {"train_loss": -25.80695152282715, "global_step": 301617, "epoch": 3633} {"train_loss": -25.305967330932617, "global_step": 301618, "epoch": 3633} {"train_loss": -25.8455810546875, "global_step": 301619, "epoch": 3633} {"train_loss": -25.86468505859375, "global_step": 301620, "epoch": 3633} {"train_loss": -25.666666697306805, "global_step": 301621, "epoch": 3633, "val_loss": 7099139.0} {"train_loss": -23.390485763549805, "global_step": 301622, "epoch": 3634} {"train_loss": -24.241544723510742, "global_step": 301623, "epoch": 3634} {"train_loss": -24.697866439819336, "global_step": 301624, "epoch": 3634} {"train_loss": -24.463300704956055, "global_step": 301625, "epoch": 3634} {"train_loss": -25.086843490600586, "global_step": 301626, "epoch": 3634} {"train_loss": -24.744062423706055, "global_step": 301627, "epoch": 3634} {"train_loss": -24.799243927001953, "global_step": 301628, "epoch": 3634} {"train_loss": -25.713088989257812, "global_step": 301629, "epoch": 3634} {"train_loss": -24.979713439941406, "global_step": 301630, "epoch": 3634} {"train_loss": -25.005754470825195, "global_step": 301631, "epoch": 3634} {"train_loss": -25.406333923339844, "global_step": 301632, "epoch": 3634} {"train_loss": -24.760339736938477, "global_step": 301633, "epoch": 3634} {"train_loss": -25.141584396362305, "global_step": 301634, "epoch": 3634} {"train_loss": -24.930471420288086, "global_step": 301635, "epoch": 3634} {"train_loss": -25.86446189880371, "global_step": 301636, "epoch": 3634} {"train_loss": -25.386377334594727, "global_step": 301637, "epoch": 3634} {"train_loss": -24.929780960083008, "global_step": 301638, "epoch": 3634} {"train_loss": -25.668752670288086, "global_step": 301639, "epoch": 3634} {"train_loss": -25.405738830566406, "global_step": 301640, "epoch": 3634} {"train_loss": -25.666046142578125, "global_step": 301641, "epoch": 3634} {"train_loss": -25.546171188354492, "global_step": 301642, "epoch": 3634} {"train_loss": -25.274051666259766, "global_step": 301643, "epoch": 3634} {"train_loss": -25.25201416015625, "global_step": 301644, "epoch": 3634} {"train_loss": -25.723495483398438, "global_step": 301645, "epoch": 3634} {"train_loss": -25.40928840637207, "global_step": 301646, "epoch": 3634} {"train_loss": -25.367822647094727, "global_step": 301647, "epoch": 3634} {"train_loss": -25.806793212890625, "global_step": 301648, "epoch": 3634} {"train_loss": -25.22087287902832, "global_step": 301649, "epoch": 3634} {"train_loss": -25.31163787841797, "global_step": 301650, "epoch": 3634} {"train_loss": -25.368362426757812, "global_step": 301651, "epoch": 3634} {"train_loss": -25.525074005126953, "global_step": 301652, "epoch": 3634} {"train_loss": -25.70383071899414, "global_step": 301653, "epoch": 3634} {"train_loss": -26.065185546875, "global_step": 301654, "epoch": 3634} {"train_loss": -25.71986198425293, "global_step": 301655, "epoch": 3634} {"train_loss": -26.017547607421875, "global_step": 301656, "epoch": 3634} {"train_loss": -25.81208610534668, "global_step": 301657, "epoch": 3634} {"train_loss": -25.615142822265625, "global_step": 301658, "epoch": 3634} {"train_loss": -25.763580322265625, "global_step": 301659, "epoch": 3634} {"train_loss": -25.953393936157227, "global_step": 301660, "epoch": 3634} {"train_loss": -25.545589447021484, "global_step": 301661, "epoch": 3634} {"train_loss": -25.70707130432129, "global_step": 301662, "epoch": 3634} {"train_loss": -25.62733268737793, "global_step": 301663, "epoch": 3634} {"train_loss": -25.776044845581055, "global_step": 301664, "epoch": 3634} {"train_loss": -25.744476318359375, "global_step": 301665, "epoch": 3634} {"train_loss": -25.78449821472168, "global_step": 301666, "epoch": 3634} {"train_loss": -25.720947265625, "global_step": 301667, "epoch": 3634} {"train_loss": -25.59615707397461, "global_step": 301668, "epoch": 3634} {"train_loss": -25.41278648376465, "global_step": 301669, "epoch": 3634} {"train_loss": -25.799596786499023, "global_step": 301670, "epoch": 3634} {"train_loss": -25.84674072265625, "global_step": 301671, "epoch": 3634} {"train_loss": -25.840673446655273, "global_step": 301672, "epoch": 3634} {"train_loss": -25.986984252929688, "global_step": 301673, "epoch": 3634} {"train_loss": -25.456119537353516, "global_step": 301674, "epoch": 3634} {"train_loss": -25.53371810913086, "global_step": 301675, "epoch": 3634} {"train_loss": -25.531021118164062, "global_step": 301676, "epoch": 3634} {"train_loss": -25.983381271362305, "global_step": 301677, "epoch": 3634} {"train_loss": -25.671735763549805, "global_step": 301678, "epoch": 3634} {"train_loss": -25.851179122924805, "global_step": 301679, "epoch": 3634} {"train_loss": -25.760839462280273, "global_step": 301680, "epoch": 3634} {"train_loss": -25.693099975585938, "global_step": 301681, "epoch": 3634} {"train_loss": -25.419593811035156, "global_step": 301682, "epoch": 3634} {"train_loss": -25.188251495361328, "global_step": 301683, "epoch": 3634} {"train_loss": -25.063817977905273, "global_step": 301684, "epoch": 3634} {"train_loss": -25.7347469329834, "global_step": 301685, "epoch": 3634} {"train_loss": -25.315698623657227, "global_step": 301686, "epoch": 3634} {"train_loss": -25.72540283203125, "global_step": 301687, "epoch": 3634} {"train_loss": -25.4704647064209, "global_step": 301688, "epoch": 3634} {"train_loss": -25.509817123413086, "global_step": 301689, "epoch": 3634} {"train_loss": -25.61441993713379, "global_step": 301690, "epoch": 3634} {"train_loss": -25.571102142333984, "global_step": 301691, "epoch": 3634} {"train_loss": -25.681970596313477, "global_step": 301692, "epoch": 3634} {"train_loss": -25.685861587524414, "global_step": 301693, "epoch": 3634} {"train_loss": -25.34662437438965, "global_step": 301694, "epoch": 3634} {"train_loss": -25.180925369262695, "global_step": 301695, "epoch": 3634} {"train_loss": -25.435855865478516, "global_step": 301696, "epoch": 3634} {"train_loss": -25.36261749267578, "global_step": 301697, "epoch": 3634} {"train_loss": -25.132139205932617, "global_step": 301698, "epoch": 3634} {"train_loss": -25.053688049316406, "global_step": 301699, "epoch": 3634} {"train_loss": -24.894147872924805, "global_step": 301700, "epoch": 3634} {"train_loss": -25.46573257446289, "global_step": 301701, "epoch": 3634} {"train_loss": -25.225515365600586, "global_step": 301702, "epoch": 3634} {"train_loss": -25.167295455932617, "global_step": 301703, "epoch": 3634} {"train_loss": -25.435664785913673, "global_step": 301704, "epoch": 3634, "val_loss": 7163263.0} {"train_loss": -23.84348487854004, "global_step": 301705, "epoch": 3635} {"train_loss": -24.922039031982422, "global_step": 301706, "epoch": 3635} {"train_loss": -24.918691635131836, "global_step": 301707, "epoch": 3635} {"train_loss": -24.472654342651367, "global_step": 301708, "epoch": 3635} {"train_loss": -25.16999053955078, "global_step": 301709, "epoch": 3635} {"train_loss": -24.372556686401367, "global_step": 301710, "epoch": 3635} {"train_loss": -24.804731369018555, "global_step": 301711, "epoch": 3635} {"train_loss": -25.038803100585938, "global_step": 301712, "epoch": 3635} {"train_loss": -25.23487091064453, "global_step": 301713, "epoch": 3635} {"train_loss": -25.038358688354492, "global_step": 301714, "epoch": 3635} {"train_loss": -25.11399269104004, "global_step": 301715, "epoch": 3635} {"train_loss": -25.02153778076172, "global_step": 301716, "epoch": 3635} {"train_loss": -24.989973068237305, "global_step": 301717, "epoch": 3635} {"train_loss": -25.016895294189453, "global_step": 301718, "epoch": 3635} {"train_loss": -25.08332633972168, "global_step": 301719, "epoch": 3635} {"train_loss": -25.28404426574707, "global_step": 301720, "epoch": 3635} {"train_loss": -25.43927001953125, "global_step": 301721, "epoch": 3635} {"train_loss": -25.00468635559082, "global_step": 301722, "epoch": 3635} {"train_loss": -25.660919189453125, "global_step": 301723, "epoch": 3635} {"train_loss": -24.969491958618164, "global_step": 301724, "epoch": 3635} {"train_loss": -25.43950653076172, "global_step": 301725, "epoch": 3635} {"train_loss": -25.434906005859375, "global_step": 301726, "epoch": 3635} {"train_loss": -25.585285186767578, "global_step": 301727, "epoch": 3635} {"train_loss": -25.46787452697754, "global_step": 301728, "epoch": 3635} {"train_loss": -25.811542510986328, "global_step": 301729, "epoch": 3635} {"train_loss": -26.006216049194336, "global_step": 301730, "epoch": 3635} {"train_loss": -25.70758056640625, "global_step": 301731, "epoch": 3635} {"train_loss": -25.528257369995117, "global_step": 301732, "epoch": 3635} {"train_loss": -25.83758544921875, "global_step": 301733, "epoch": 3635} {"train_loss": -25.95173454284668, "global_step": 301734, "epoch": 3635} {"train_loss": -25.6071834564209, "global_step": 301735, "epoch": 3635} {"train_loss": -25.482112884521484, "global_step": 301736, "epoch": 3635} {"train_loss": -25.84706687927246, "global_step": 301737, "epoch": 3635} {"train_loss": -25.775800704956055, "global_step": 301738, "epoch": 3635} {"train_loss": -26.0147762298584, "global_step": 301739, "epoch": 3635} {"train_loss": -25.843427658081055, "global_step": 301740, "epoch": 3635} {"train_loss": -25.857929229736328, "global_step": 301741, "epoch": 3635} {"train_loss": -25.8885498046875, "global_step": 301742, "epoch": 3635} {"train_loss": -25.644941329956055, "global_step": 301743, "epoch": 3635} {"train_loss": -25.72434425354004, "global_step": 301744, "epoch": 3635} {"train_loss": -26.11763572692871, "global_step": 301745, "epoch": 3635} {"train_loss": -25.578449249267578, "global_step": 301746, "epoch": 3635} {"train_loss": -25.972009658813477, "global_step": 301747, "epoch": 3635} {"train_loss": -26.294769287109375, "global_step": 301748, "epoch": 3635} {"train_loss": -25.78826904296875, "global_step": 301749, "epoch": 3635} {"train_loss": -25.558897018432617, "global_step": 301750, "epoch": 3635} {"train_loss": -25.764331817626953, "global_step": 301751, "epoch": 3635} {"train_loss": -25.9387264251709, "global_step": 301752, "epoch": 3635} {"train_loss": -25.693082809448242, "global_step": 301753, "epoch": 3635} {"train_loss": -25.832416534423828, "global_step": 301754, "epoch": 3635} {"train_loss": -25.660551071166992, "global_step": 301755, "epoch": 3635} {"train_loss": -25.674468994140625, "global_step": 301756, "epoch": 3635} {"train_loss": -25.362382888793945, "global_step": 301757, "epoch": 3635} {"train_loss": -25.311199188232422, "global_step": 301758, "epoch": 3635} {"train_loss": -25.392526626586914, "global_step": 301759, "epoch": 3635} {"train_loss": -25.174474716186523, "global_step": 301760, "epoch": 3635} {"train_loss": -25.2598876953125, "global_step": 301761, "epoch": 3635} {"train_loss": -25.6044979095459, "global_step": 301762, "epoch": 3635} {"train_loss": -25.667804718017578, "global_step": 301763, "epoch": 3635} {"train_loss": -25.65125846862793, "global_step": 301764, "epoch": 3635} {"train_loss": -25.6059513092041, "global_step": 301765, "epoch": 3635} {"train_loss": -25.60611915588379, "global_step": 301766, "epoch": 3635} {"train_loss": -25.881805419921875, "global_step": 301767, "epoch": 3635} {"train_loss": -26.00127601623535, "global_step": 301768, "epoch": 3635} {"train_loss": -26.322885513305664, "global_step": 301769, "epoch": 3635} {"train_loss": -25.675622940063477, "global_step": 301770, "epoch": 3635} {"train_loss": -25.6541748046875, "global_step": 301771, "epoch": 3635} {"train_loss": -25.636798858642578, "global_step": 301772, "epoch": 3635} {"train_loss": -26.162445068359375, "global_step": 301773, "epoch": 3635} {"train_loss": -25.81247901916504, "global_step": 301774, "epoch": 3635} {"train_loss": -25.723535537719727, "global_step": 301775, "epoch": 3635} {"train_loss": -25.27712631225586, "global_step": 301776, "epoch": 3635} {"train_loss": -25.89959716796875, "global_step": 301777, "epoch": 3635} {"train_loss": -25.499910354614258, "global_step": 301778, "epoch": 3635} {"train_loss": -25.30669593811035, "global_step": 301779, "epoch": 3635} {"train_loss": -25.755695343017578, "global_step": 301780, "epoch": 3635} {"train_loss": -25.736265182495117, "global_step": 301781, "epoch": 3635} {"train_loss": -25.55258560180664, "global_step": 301782, "epoch": 3635} {"train_loss": -26.170978546142578, "global_step": 301783, "epoch": 3635} {"train_loss": -25.689573287963867, "global_step": 301784, "epoch": 3635} {"train_loss": -25.624725341796875, "global_step": 301785, "epoch": 3635} {"train_loss": -26.00408935546875, "global_step": 301786, "epoch": 3635} {"train_loss": -25.541953994567137, "global_step": 301787, "epoch": 3635, "val_loss": 7202010.0} {"train_loss": -25.05995750427246, "global_step": 301788, "epoch": 3636} {"train_loss": -25.516176223754883, "global_step": 301789, "epoch": 3636} {"train_loss": -25.332935333251953, "global_step": 301790, "epoch": 3636} {"train_loss": -25.783185958862305, "global_step": 301791, "epoch": 3636} {"train_loss": -25.279253005981445, "global_step": 301792, "epoch": 3636} {"train_loss": -25.299320220947266, "global_step": 301793, "epoch": 3636} {"train_loss": -24.799848556518555, "global_step": 301794, "epoch": 3636} {"train_loss": -25.64093017578125, "global_step": 301795, "epoch": 3636} {"train_loss": -25.290273666381836, "global_step": 301796, "epoch": 3636} {"train_loss": -25.566871643066406, "global_step": 301797, "epoch": 3636} {"train_loss": -25.614606857299805, "global_step": 301798, "epoch": 3636} {"train_loss": -25.376583099365234, "global_step": 301799, "epoch": 3636} {"train_loss": -25.288206100463867, "global_step": 301800, "epoch": 3636} {"train_loss": -25.696638107299805, "global_step": 301801, "epoch": 3636} {"train_loss": -25.690433502197266, "global_step": 301802, "epoch": 3636} {"train_loss": -25.0697078704834, "global_step": 301803, "epoch": 3636} {"train_loss": -25.347610473632812, "global_step": 301804, "epoch": 3636} {"train_loss": -25.587446212768555, "global_step": 301805, "epoch": 3636} {"train_loss": -25.650009155273438, "global_step": 301806, "epoch": 3636} {"train_loss": -25.28255271911621, "global_step": 301807, "epoch": 3636} {"train_loss": -25.582395553588867, "global_step": 301808, "epoch": 3636} {"train_loss": -25.525959014892578, "global_step": 301809, "epoch": 3636} {"train_loss": -25.37272071838379, "global_step": 301810, "epoch": 3636} {"train_loss": -25.879621505737305, "global_step": 301811, "epoch": 3636} {"train_loss": -25.623899459838867, "global_step": 301812, "epoch": 3636} {"train_loss": -25.485456466674805, "global_step": 301813, "epoch": 3636} {"train_loss": -25.726327896118164, "global_step": 301814, "epoch": 3636} {"train_loss": -25.596527099609375, "global_step": 301815, "epoch": 3636} {"train_loss": -25.85793113708496, "global_step": 301816, "epoch": 3636} {"train_loss": -25.288002014160156, "global_step": 301817, "epoch": 3636} {"train_loss": -25.720504760742188, "global_step": 301818, "epoch": 3636} {"train_loss": -25.686742782592773, "global_step": 301819, "epoch": 3636} {"train_loss": -25.555932998657227, "global_step": 301820, "epoch": 3636} {"train_loss": -25.8006591796875, "global_step": 301821, "epoch": 3636} {"train_loss": -25.7592830657959, "global_step": 301822, "epoch": 3636} {"train_loss": -25.818151473999023, "global_step": 301823, "epoch": 3636} {"train_loss": -25.7158260345459, "global_step": 301824, "epoch": 3636} {"train_loss": -26.068021774291992, "global_step": 301825, "epoch": 3636} {"train_loss": -25.639728546142578, "global_step": 301826, "epoch": 3636} {"train_loss": -25.81965446472168, "global_step": 301827, "epoch": 3636} {"train_loss": -25.686628341674805, "global_step": 301828, "epoch": 3636} {"train_loss": -25.715545654296875, "global_step": 301829, "epoch": 3636} {"train_loss": -25.589296340942383, "global_step": 301830, "epoch": 3636} {"train_loss": -25.652618408203125, "global_step": 301831, "epoch": 3636} {"train_loss": -25.978864669799805, "global_step": 301832, "epoch": 3636} {"train_loss": -25.607004165649414, "global_step": 301833, "epoch": 3636} {"train_loss": -25.374662399291992, "global_step": 301834, "epoch": 3636} {"train_loss": -25.379201889038086, "global_step": 301835, "epoch": 3636} {"train_loss": -25.762617111206055, "global_step": 301836, "epoch": 3636} {"train_loss": -25.634082794189453, "global_step": 301837, "epoch": 3636} {"train_loss": -25.31325340270996, "global_step": 301838, "epoch": 3636} {"train_loss": -25.675216674804688, "global_step": 301839, "epoch": 3636} {"train_loss": -26.25776481628418, "global_step": 301840, "epoch": 3636} {"train_loss": -25.5843563079834, "global_step": 301841, "epoch": 3636} {"train_loss": -25.542591094970703, "global_step": 301842, "epoch": 3636} {"train_loss": -25.548316955566406, "global_step": 301843, "epoch": 3636} {"train_loss": -25.925512313842773, "global_step": 301844, "epoch": 3636} {"train_loss": -25.590595245361328, "global_step": 301845, "epoch": 3636} {"train_loss": -25.648468017578125, "global_step": 301846, "epoch": 3636} {"train_loss": -25.597814559936523, "global_step": 301847, "epoch": 3636} {"train_loss": -25.5595760345459, "global_step": 301848, "epoch": 3636} {"train_loss": -25.586130142211914, "global_step": 301849, "epoch": 3636} {"train_loss": -25.7337589263916, "global_step": 301850, "epoch": 3636} {"train_loss": -25.758508682250977, "global_step": 301851, "epoch": 3636} {"train_loss": -25.518077850341797, "global_step": 301852, "epoch": 3636} {"train_loss": -25.852766036987305, "global_step": 301853, "epoch": 3636} {"train_loss": -25.50213050842285, "global_step": 301854, "epoch": 3636} {"train_loss": -25.655691146850586, "global_step": 301855, "epoch": 3636} {"train_loss": -25.701786041259766, "global_step": 301856, "epoch": 3636} {"train_loss": -25.671661376953125, "global_step": 301857, "epoch": 3636} {"train_loss": -25.752470016479492, "global_step": 301858, "epoch": 3636} {"train_loss": -25.684375762939453, "global_step": 301859, "epoch": 3636} {"train_loss": -25.21190071105957, "global_step": 301860, "epoch": 3636} {"train_loss": -25.908185958862305, "global_step": 301861, "epoch": 3636} {"train_loss": -25.715457916259766, "global_step": 301862, "epoch": 3636} {"train_loss": -25.537179946899414, "global_step": 301863, "epoch": 3636} {"train_loss": -25.63881492614746, "global_step": 301864, "epoch": 3636} {"train_loss": -25.504283905029297, "global_step": 301865, "epoch": 3636} {"train_loss": -25.810144424438477, "global_step": 301866, "epoch": 3636} {"train_loss": -25.872638702392578, "global_step": 301867, "epoch": 3636} {"train_loss": -25.796314239501953, "global_step": 301868, "epoch": 3636} {"train_loss": -25.690977096557617, "global_step": 301869, "epoch": 3636} {"train_loss": -25.597405720906085, "global_step": 301870, "epoch": 3636, "val_loss": 7163904.0} {"train_loss": -25.40962791442871, "global_step": 301871, "epoch": 3637} {"train_loss": -24.883298873901367, "global_step": 301872, "epoch": 3637} {"train_loss": -25.474071502685547, "global_step": 301873, "epoch": 3637} {"train_loss": -25.27228355407715, "global_step": 301874, "epoch": 3637} {"train_loss": -25.24131202697754, "global_step": 301875, "epoch": 3637} {"train_loss": -24.96712303161621, "global_step": 301876, "epoch": 3637} {"train_loss": -24.906490325927734, "global_step": 301877, "epoch": 3637} {"train_loss": -25.060882568359375, "global_step": 301878, "epoch": 3637} {"train_loss": -25.221725463867188, "global_step": 301879, "epoch": 3637} {"train_loss": -25.31890869140625, "global_step": 301880, "epoch": 3637} {"train_loss": -25.566871643066406, "global_step": 301881, "epoch": 3637} {"train_loss": -25.35148811340332, "global_step": 301882, "epoch": 3637} {"train_loss": -25.995086669921875, "global_step": 301883, "epoch": 3637} {"train_loss": -25.584646224975586, "global_step": 301884, "epoch": 3637} {"train_loss": -25.70102310180664, "global_step": 301885, "epoch": 3637} {"train_loss": -25.305011749267578, "global_step": 301886, "epoch": 3637} {"train_loss": -25.593902587890625, "global_step": 301887, "epoch": 3637} {"train_loss": -25.548675537109375, "global_step": 301888, "epoch": 3637} {"train_loss": -25.714841842651367, "global_step": 301889, "epoch": 3637} {"train_loss": -25.65346336364746, "global_step": 301890, "epoch": 3637} {"train_loss": -25.457963943481445, "global_step": 301891, "epoch": 3637} {"train_loss": -25.513490676879883, "global_step": 301892, "epoch": 3637} {"train_loss": -25.725183486938477, "global_step": 301893, "epoch": 3637} {"train_loss": -25.99993896484375, "global_step": 301894, "epoch": 3637} {"train_loss": -25.384544372558594, "global_step": 301895, "epoch": 3637} {"train_loss": -26.10206413269043, "global_step": 301896, "epoch": 3637} {"train_loss": -25.41703224182129, "global_step": 301897, "epoch": 3637} {"train_loss": -25.459318161010742, "global_step": 301898, "epoch": 3637} {"train_loss": -25.59464454650879, "global_step": 301899, "epoch": 3637} {"train_loss": -25.44476318359375, "global_step": 301900, "epoch": 3637} {"train_loss": -25.997095108032227, "global_step": 301901, "epoch": 3637} {"train_loss": -25.789335250854492, "global_step": 301902, "epoch": 3637} {"train_loss": -25.482454299926758, "global_step": 301903, "epoch": 3637} {"train_loss": -25.37429428100586, "global_step": 301904, "epoch": 3637} {"train_loss": -25.64292335510254, "global_step": 301905, "epoch": 3637} {"train_loss": -25.652362823486328, "global_step": 301906, "epoch": 3637} {"train_loss": -25.8685359954834, "global_step": 301907, "epoch": 3637} {"train_loss": -25.549022674560547, "global_step": 301908, "epoch": 3637} {"train_loss": -25.811742782592773, "global_step": 301909, "epoch": 3637} {"train_loss": -25.887327194213867, "global_step": 301910, "epoch": 3637} {"train_loss": -25.659311294555664, "global_step": 301911, "epoch": 3637} {"train_loss": -25.574480056762695, "global_step": 301912, "epoch": 3637} {"train_loss": -25.657230377197266, "global_step": 301913, "epoch": 3637} {"train_loss": -25.680532455444336, "global_step": 301914, "epoch": 3637} {"train_loss": -25.986730575561523, "global_step": 301915, "epoch": 3637} {"train_loss": -25.765295028686523, "global_step": 301916, "epoch": 3637} {"train_loss": -25.479768753051758, "global_step": 301917, "epoch": 3637} {"train_loss": -25.524995803833008, "global_step": 301918, "epoch": 3637} {"train_loss": -25.51064682006836, "global_step": 301919, "epoch": 3637} {"train_loss": -25.8817195892334, "global_step": 301920, "epoch": 3637} {"train_loss": -25.582616806030273, "global_step": 301921, "epoch": 3637} {"train_loss": -25.530323028564453, "global_step": 301922, "epoch": 3637} {"train_loss": -25.80021095275879, "global_step": 301923, "epoch": 3637} {"train_loss": -25.437164306640625, "global_step": 301924, "epoch": 3637} {"train_loss": -25.858417510986328, "global_step": 301925, "epoch": 3637} {"train_loss": -25.658721923828125, "global_step": 301926, "epoch": 3637} {"train_loss": -25.678375244140625, "global_step": 301927, "epoch": 3637} {"train_loss": -25.778406143188477, "global_step": 301928, "epoch": 3637} {"train_loss": -26.07814598083496, "global_step": 301929, "epoch": 3637} {"train_loss": -25.317075729370117, "global_step": 301930, "epoch": 3637} {"train_loss": -25.631040573120117, "global_step": 301931, "epoch": 3637} {"train_loss": -26.007177352905273, "global_step": 301932, "epoch": 3637} {"train_loss": -25.486188888549805, "global_step": 301933, "epoch": 3637} {"train_loss": -25.7366886138916, "global_step": 301934, "epoch": 3637} {"train_loss": -25.645849227905273, "global_step": 301935, "epoch": 3637} {"train_loss": -25.707275390625, "global_step": 301936, "epoch": 3637} {"train_loss": -25.687362670898438, "global_step": 301937, "epoch": 3637} {"train_loss": -25.65598487854004, "global_step": 301938, "epoch": 3637} {"train_loss": -25.675556182861328, "global_step": 301939, "epoch": 3637} {"train_loss": -25.245649337768555, "global_step": 301940, "epoch": 3637} {"train_loss": -26.113733291625977, "global_step": 301941, "epoch": 3637} {"train_loss": -25.8209285736084, "global_step": 301942, "epoch": 3637} {"train_loss": -25.61652946472168, "global_step": 301943, "epoch": 3637} {"train_loss": -26.048559188842773, "global_step": 301944, "epoch": 3637} {"train_loss": -25.8057861328125, "global_step": 301945, "epoch": 3637} {"train_loss": -25.993215560913086, "global_step": 301946, "epoch": 3637} {"train_loss": -25.6577205657959, "global_step": 301947, "epoch": 3637} {"train_loss": -25.67690086364746, "global_step": 301948, "epoch": 3637} {"train_loss": -25.877294540405273, "global_step": 301949, "epoch": 3637} {"train_loss": -25.882566452026367, "global_step": 301950, "epoch": 3637} {"train_loss": -25.83180809020996, "global_step": 301951, "epoch": 3637} {"train_loss": -25.74301528930664, "global_step": 301952, "epoch": 3637} {"train_loss": -25.615975988916603, "global_step": 301953, "epoch": 3637, "val_loss": 7224867.5} {"train_loss": -25.44367790222168, "global_step": 301954, "epoch": 3638} {"train_loss": -25.373708724975586, "global_step": 301955, "epoch": 3638} {"train_loss": -25.372182846069336, "global_step": 301956, "epoch": 3638} {"train_loss": -25.071035385131836, "global_step": 301957, "epoch": 3638} {"train_loss": -25.090396881103516, "global_step": 301958, "epoch": 3638} {"train_loss": -25.637060165405273, "global_step": 301959, "epoch": 3638} {"train_loss": -24.972782135009766, "global_step": 301960, "epoch": 3638} {"train_loss": -25.205291748046875, "global_step": 301961, "epoch": 3638} {"train_loss": -25.28493309020996, "global_step": 301962, "epoch": 3638} {"train_loss": -25.40305519104004, "global_step": 301963, "epoch": 3638} {"train_loss": -25.227848052978516, "global_step": 301964, "epoch": 3638} {"train_loss": -25.223346710205078, "global_step": 301965, "epoch": 3638} {"train_loss": -25.2470703125, "global_step": 301966, "epoch": 3638} {"train_loss": -25.002063751220703, "global_step": 301967, "epoch": 3638} {"train_loss": -25.35696792602539, "global_step": 301968, "epoch": 3638} {"train_loss": -25.26930809020996, "global_step": 301969, "epoch": 3638} {"train_loss": -25.16938591003418, "global_step": 301970, "epoch": 3638} {"train_loss": -25.41945457458496, "global_step": 301971, "epoch": 3638} {"train_loss": -24.939916610717773, "global_step": 301972, "epoch": 3638} {"train_loss": -25.676105499267578, "global_step": 301973, "epoch": 3638} {"train_loss": -25.35610008239746, "global_step": 301974, "epoch": 3638} {"train_loss": -25.183591842651367, "global_step": 301975, "epoch": 3638} {"train_loss": -25.279775619506836, "global_step": 301976, "epoch": 3638} {"train_loss": -25.570919036865234, "global_step": 301977, "epoch": 3638} {"train_loss": -25.74386978149414, "global_step": 301978, "epoch": 3638} {"train_loss": -25.669904708862305, "global_step": 301979, "epoch": 3638} {"train_loss": -25.795074462890625, "global_step": 301980, "epoch": 3638} {"train_loss": -25.234970092773438, "global_step": 301981, "epoch": 3638} {"train_loss": -25.730030059814453, "global_step": 301982, "epoch": 3638} {"train_loss": -25.8189697265625, "global_step": 301983, "epoch": 3638} {"train_loss": -25.316543579101562, "global_step": 301984, "epoch": 3638} {"train_loss": -25.672388076782227, "global_step": 301985, "epoch": 3638} {"train_loss": -25.492786407470703, "global_step": 301986, "epoch": 3638} {"train_loss": -25.595195770263672, "global_step": 301987, "epoch": 3638} {"train_loss": -25.77678871154785, "global_step": 301988, "epoch": 3638} {"train_loss": -25.64592933654785, "global_step": 301989, "epoch": 3638} {"train_loss": -25.873077392578125, "global_step": 301990, "epoch": 3638} {"train_loss": -25.68316078186035, "global_step": 301991, "epoch": 3638} {"train_loss": -25.688201904296875, "global_step": 301992, "epoch": 3638} {"train_loss": -25.825841903686523, "global_step": 301993, "epoch": 3638} {"train_loss": -25.678308486938477, "global_step": 301994, "epoch": 3638} {"train_loss": -26.10528564453125, "global_step": 301995, "epoch": 3638} {"train_loss": -25.498998641967773, "global_step": 301996, "epoch": 3638} {"train_loss": -25.674041748046875, "global_step": 301997, "epoch": 3638} {"train_loss": -25.52826499938965, "global_step": 301998, "epoch": 3638} {"train_loss": -25.6162109375, "global_step": 301999, "epoch": 3638} {"train_loss": -25.8671875, "global_step": 302000, "epoch": 3638} {"train_loss": -26.04549217224121, "global_step": 302001, "epoch": 3638} {"train_loss": -25.649499893188477, "global_step": 302002, "epoch": 3638} {"train_loss": -25.812103271484375, "global_step": 302003, "epoch": 3638} {"train_loss": -26.018798828125, "global_step": 302004, "epoch": 3638} {"train_loss": -25.848285675048828, "global_step": 302005, "epoch": 3638} {"train_loss": -25.932464599609375, "global_step": 302006, "epoch": 3638} {"train_loss": -25.403276443481445, "global_step": 302007, "epoch": 3638} {"train_loss": -25.68011474609375, "global_step": 302008, "epoch": 3638} {"train_loss": -25.76779556274414, "global_step": 302009, "epoch": 3638} {"train_loss": -25.38570785522461, "global_step": 302010, "epoch": 3638} {"train_loss": -25.887027740478516, "global_step": 302011, "epoch": 3638} {"train_loss": -25.987323760986328, "global_step": 302012, "epoch": 3638} {"train_loss": -25.57377815246582, "global_step": 302013, "epoch": 3638} {"train_loss": -25.710119247436523, "global_step": 302014, "epoch": 3638} {"train_loss": -25.896484375, "global_step": 302015, "epoch": 3638} {"train_loss": -25.493087768554688, "global_step": 302016, "epoch": 3638} {"train_loss": -25.68014907836914, "global_step": 302017, "epoch": 3638} {"train_loss": -25.79788589477539, "global_step": 302018, "epoch": 3638} {"train_loss": -26.039255142211914, "global_step": 302019, "epoch": 3638} {"train_loss": -25.889129638671875, "global_step": 302020, "epoch": 3638} {"train_loss": -25.481260299682617, "global_step": 302021, "epoch": 3638} {"train_loss": -25.6527042388916, "global_step": 302022, "epoch": 3638} {"train_loss": -25.502769470214844, "global_step": 302023, "epoch": 3638} {"train_loss": -25.13325309753418, "global_step": 302024, "epoch": 3638} {"train_loss": -25.34689712524414, "global_step": 302025, "epoch": 3638} {"train_loss": -25.447696685791016, "global_step": 302026, "epoch": 3638} {"train_loss": -25.16065788269043, "global_step": 302027, "epoch": 3638} {"train_loss": -25.37570571899414, "global_step": 302028, "epoch": 3638} {"train_loss": -25.297107696533203, "global_step": 302029, "epoch": 3638} {"train_loss": -25.462020874023438, "global_step": 302030, "epoch": 3638} {"train_loss": -25.30107879638672, "global_step": 302031, "epoch": 3638} {"train_loss": -25.638458251953125, "global_step": 302032, "epoch": 3638} {"train_loss": -25.58005714416504, "global_step": 302033, "epoch": 3638} {"train_loss": -25.42401695251465, "global_step": 302034, "epoch": 3638} {"train_loss": -26.021703720092773, "global_step": 302035, "epoch": 3638} {"train_loss": -25.54026341725545, "global_step": 302036, "epoch": 3638, "val_loss": 7155412.0} {"train_loss": -24.799413681030273, "global_step": 302037, "epoch": 3639} {"train_loss": -25.060993194580078, "global_step": 302038, "epoch": 3639} {"train_loss": -25.255046844482422, "global_step": 302039, "epoch": 3639} {"train_loss": -25.438446044921875, "global_step": 302040, "epoch": 3639} {"train_loss": -25.686767578125, "global_step": 302041, "epoch": 3639} {"train_loss": -25.380264282226562, "global_step": 302042, "epoch": 3639} {"train_loss": -25.245019912719727, "global_step": 302043, "epoch": 3639} {"train_loss": -25.231008529663086, "global_step": 302044, "epoch": 3639} {"train_loss": -25.13819694519043, "global_step": 302045, "epoch": 3639} {"train_loss": -25.565736770629883, "global_step": 302046, "epoch": 3639} {"train_loss": -25.7076473236084, "global_step": 302047, "epoch": 3639} {"train_loss": -25.922779083251953, "global_step": 302048, "epoch": 3639} {"train_loss": -25.9570369720459, "global_step": 302049, "epoch": 3639} {"train_loss": -25.4493465423584, "global_step": 302050, "epoch": 3639} {"train_loss": -25.75823402404785, "global_step": 302051, "epoch": 3639} {"train_loss": -25.48011589050293, "global_step": 302052, "epoch": 3639} {"train_loss": -25.625085830688477, "global_step": 302053, "epoch": 3639} {"train_loss": -25.609350204467773, "global_step": 302054, "epoch": 3639} {"train_loss": -25.929885864257812, "global_step": 302055, "epoch": 3639} {"train_loss": -25.680089950561523, "global_step": 302056, "epoch": 3639} {"train_loss": -25.7559871673584, "global_step": 302057, "epoch": 3639} {"train_loss": -25.558794021606445, "global_step": 302058, "epoch": 3639} {"train_loss": -25.590951919555664, "global_step": 302059, "epoch": 3639} {"train_loss": -25.431692123413086, "global_step": 302060, "epoch": 3639} {"train_loss": -25.840179443359375, "global_step": 302061, "epoch": 3639} {"train_loss": -25.929269790649414, "global_step": 302062, "epoch": 3639} {"train_loss": -26.104583740234375, "global_step": 302063, "epoch": 3639} {"train_loss": -25.755292892456055, "global_step": 302064, "epoch": 3639} {"train_loss": -26.000507354736328, "global_step": 302065, "epoch": 3639} {"train_loss": -25.780414581298828, "global_step": 302066, "epoch": 3639} {"train_loss": -26.0894775390625, "global_step": 302067, "epoch": 3639} {"train_loss": -25.95539665222168, "global_step": 302068, "epoch": 3639} {"train_loss": -25.8640079498291, "global_step": 302069, "epoch": 3639} {"train_loss": -25.8826847076416, "global_step": 302070, "epoch": 3639} {"train_loss": -25.78387451171875, "global_step": 302071, "epoch": 3639} {"train_loss": -26.024946212768555, "global_step": 302072, "epoch": 3639} {"train_loss": -25.78550148010254, "global_step": 302073, "epoch": 3639} {"train_loss": -25.991119384765625, "global_step": 302074, "epoch": 3639} {"train_loss": -25.978635787963867, "global_step": 302075, "epoch": 3639} {"train_loss": -26.040210723876953, "global_step": 302076, "epoch": 3639} {"train_loss": -25.880300521850586, "global_step": 302077, "epoch": 3639} {"train_loss": -26.12507438659668, "global_step": 302078, "epoch": 3639} {"train_loss": -25.866907119750977, "global_step": 302079, "epoch": 3639} {"train_loss": -25.493833541870117, "global_step": 302080, "epoch": 3639} {"train_loss": -25.515077590942383, "global_step": 302081, "epoch": 3639} {"train_loss": -25.442657470703125, "global_step": 302082, "epoch": 3639} {"train_loss": -25.871084213256836, "global_step": 302083, "epoch": 3639} {"train_loss": -25.62107276916504, "global_step": 302084, "epoch": 3639} {"train_loss": -25.589658737182617, "global_step": 302085, "epoch": 3639} {"train_loss": -25.628381729125977, "global_step": 302086, "epoch": 3639} {"train_loss": -25.387788772583008, "global_step": 302087, "epoch": 3639} {"train_loss": -25.62641716003418, "global_step": 302088, "epoch": 3639} {"train_loss": -25.423925399780273, "global_step": 302089, "epoch": 3639} {"train_loss": -26.211536407470703, "global_step": 302090, "epoch": 3639} {"train_loss": -25.839120864868164, "global_step": 302091, "epoch": 3639} {"train_loss": -25.829315185546875, "global_step": 302092, "epoch": 3639} {"train_loss": -25.7828369140625, "global_step": 302093, "epoch": 3639} {"train_loss": -25.74830436706543, "global_step": 302094, "epoch": 3639} {"train_loss": -25.61444664001465, "global_step": 302095, "epoch": 3639} {"train_loss": -25.875295639038086, "global_step": 302096, "epoch": 3639} {"train_loss": -25.64984130859375, "global_step": 302097, "epoch": 3639} {"train_loss": -25.795928955078125, "global_step": 302098, "epoch": 3639} {"train_loss": -25.879602432250977, "global_step": 302099, "epoch": 3639} {"train_loss": -25.656763076782227, "global_step": 302100, "epoch": 3639} {"train_loss": -25.39572525024414, "global_step": 302101, "epoch": 3639} {"train_loss": -25.498538970947266, "global_step": 302102, "epoch": 3639} {"train_loss": -25.792051315307617, "global_step": 302103, "epoch": 3639} {"train_loss": -26.069183349609375, "global_step": 302104, "epoch": 3639} {"train_loss": -25.698144912719727, "global_step": 302105, "epoch": 3639} {"train_loss": -25.598339080810547, "global_step": 302106, "epoch": 3639} {"train_loss": -25.734054565429688, "global_step": 302107, "epoch": 3639} {"train_loss": -25.75349235534668, "global_step": 302108, "epoch": 3639} {"train_loss": -25.850860595703125, "global_step": 302109, "epoch": 3639} {"train_loss": -25.548200607299805, "global_step": 302110, "epoch": 3639} {"train_loss": -25.72598648071289, "global_step": 302111, "epoch": 3639} {"train_loss": -25.904748916625977, "global_step": 302112, "epoch": 3639} {"train_loss": -25.504148483276367, "global_step": 302113, "epoch": 3639} {"train_loss": -25.982385635375977, "global_step": 302114, "epoch": 3639} {"train_loss": -25.544584274291992, "global_step": 302115, "epoch": 3639} {"train_loss": -25.884824752807617, "global_step": 302116, "epoch": 3639} {"train_loss": -25.87489891052246, "global_step": 302117, "epoch": 3639} {"train_loss": -25.658823013305664, "global_step": 302118, "epoch": 3639} {"train_loss": -25.686063490718244, "global_step": 302119, "epoch": 3639, "val_loss": 7143552.0} {"train_loss": -22.363431930541992, "global_step": 302120, "epoch": 3640} {"train_loss": -22.626630783081055, "global_step": 302121, "epoch": 3640} {"train_loss": -24.849721908569336, "global_step": 302122, "epoch": 3640} {"train_loss": -22.74083709716797, "global_step": 302123, "epoch": 3640} {"train_loss": -23.996862411499023, "global_step": 302124, "epoch": 3640} {"train_loss": -23.478097915649414, "global_step": 302125, "epoch": 3640} {"train_loss": -22.80173110961914, "global_step": 302126, "epoch": 3640} {"train_loss": -24.451059341430664, "global_step": 302127, "epoch": 3640} {"train_loss": -23.758056640625, "global_step": 302128, "epoch": 3640} {"train_loss": -24.672754287719727, "global_step": 302129, "epoch": 3640} {"train_loss": -24.499658584594727, "global_step": 302130, "epoch": 3640} {"train_loss": -24.431425094604492, "global_step": 302131, "epoch": 3640} {"train_loss": -24.335004806518555, "global_step": 302132, "epoch": 3640} {"train_loss": -24.769773483276367, "global_step": 302133, "epoch": 3640} {"train_loss": -24.476947784423828, "global_step": 302134, "epoch": 3640} {"train_loss": -24.890905380249023, "global_step": 302135, "epoch": 3640} {"train_loss": -25.041881561279297, "global_step": 302136, "epoch": 3640} {"train_loss": -24.82015037536621, "global_step": 302137, "epoch": 3640} {"train_loss": -24.578927993774414, "global_step": 302138, "epoch": 3640} {"train_loss": -24.953012466430664, "global_step": 302139, "epoch": 3640} {"train_loss": -24.93633460998535, "global_step": 302140, "epoch": 3640} {"train_loss": -25.113821029663086, "global_step": 302141, "epoch": 3640} {"train_loss": -25.136350631713867, "global_step": 302142, "epoch": 3640} {"train_loss": -24.93111228942871, "global_step": 302143, "epoch": 3640} {"train_loss": -25.022296905517578, "global_step": 302144, "epoch": 3640} {"train_loss": -25.00408363342285, "global_step": 302145, "epoch": 3640} {"train_loss": -24.883386611938477, "global_step": 302146, "epoch": 3640} {"train_loss": -25.10013198852539, "global_step": 302147, "epoch": 3640} {"train_loss": -25.170103073120117, "global_step": 302148, "epoch": 3640} {"train_loss": -25.410831451416016, "global_step": 302149, "epoch": 3640} {"train_loss": -25.106304168701172, "global_step": 302150, "epoch": 3640} {"train_loss": -25.302099227905273, "global_step": 302151, "epoch": 3640} {"train_loss": -25.435327529907227, "global_step": 302152, "epoch": 3640} {"train_loss": -25.490222930908203, "global_step": 302153, "epoch": 3640} {"train_loss": -25.59769058227539, "global_step": 302154, "epoch": 3640} {"train_loss": -25.7711181640625, "global_step": 302155, "epoch": 3640} {"train_loss": -25.48828125, "global_step": 302156, "epoch": 3640} {"train_loss": -25.662458419799805, "global_step": 302157, "epoch": 3640} {"train_loss": -25.141620635986328, "global_step": 302158, "epoch": 3640} {"train_loss": -25.36460304260254, "global_step": 302159, "epoch": 3640} {"train_loss": -25.44723892211914, "global_step": 302160, "epoch": 3640} {"train_loss": -25.40066909790039, "global_step": 302161, "epoch": 3640} {"train_loss": -25.656591415405273, "global_step": 302162, "epoch": 3640} {"train_loss": -25.50986671447754, "global_step": 302163, "epoch": 3640} {"train_loss": -25.752222061157227, "global_step": 302164, "epoch": 3640} {"train_loss": -25.731800079345703, "global_step": 302165, "epoch": 3640} {"train_loss": -25.6195068359375, "global_step": 302166, "epoch": 3640} {"train_loss": -25.61669921875, "global_step": 302167, "epoch": 3640} {"train_loss": -25.05576515197754, "global_step": 302168, "epoch": 3640} {"train_loss": -25.873565673828125, "global_step": 302169, "epoch": 3640} {"train_loss": -25.580053329467773, "global_step": 302170, "epoch": 3640} {"train_loss": -25.420164108276367, "global_step": 302171, "epoch": 3640} {"train_loss": -25.735950469970703, "global_step": 302172, "epoch": 3640} {"train_loss": -25.955215454101562, "global_step": 302173, "epoch": 3640} {"train_loss": -25.902048110961914, "global_step": 302174, "epoch": 3640} {"train_loss": -25.61696434020996, "global_step": 302175, "epoch": 3640} {"train_loss": -25.652332305908203, "global_step": 302176, "epoch": 3640} {"train_loss": -25.567386627197266, "global_step": 302177, "epoch": 3640} {"train_loss": -25.694711685180664, "global_step": 302178, "epoch": 3640} {"train_loss": -25.87860107421875, "global_step": 302179, "epoch": 3640} {"train_loss": -25.717304229736328, "global_step": 302180, "epoch": 3640} {"train_loss": -25.347387313842773, "global_step": 302181, "epoch": 3640} {"train_loss": -25.69862937927246, "global_step": 302182, "epoch": 3640} {"train_loss": -25.641407012939453, "global_step": 302183, "epoch": 3640} {"train_loss": -25.76690101623535, "global_step": 302184, "epoch": 3640} {"train_loss": -25.832101821899414, "global_step": 302185, "epoch": 3640} {"train_loss": -25.277326583862305, "global_step": 302186, "epoch": 3640} {"train_loss": -25.47768211364746, "global_step": 302187, "epoch": 3640} {"train_loss": -25.61604118347168, "global_step": 302188, "epoch": 3640} {"train_loss": -25.46636390686035, "global_step": 302189, "epoch": 3640} {"train_loss": -26.159849166870117, "global_step": 302190, "epoch": 3640} {"train_loss": -26.085546493530273, "global_step": 302191, "epoch": 3640} {"train_loss": -25.23028564453125, "global_step": 302192, "epoch": 3640} {"train_loss": -25.848575592041016, "global_step": 302193, "epoch": 3640} {"train_loss": -25.611236572265625, "global_step": 302194, "epoch": 3640} {"train_loss": -25.85267448425293, "global_step": 302195, "epoch": 3640} {"train_loss": -25.653079986572266, "global_step": 302196, "epoch": 3640} {"train_loss": -25.53990936279297, "global_step": 302197, "epoch": 3640} {"train_loss": -25.708465576171875, "global_step": 302198, "epoch": 3640} {"train_loss": -25.85438346862793, "global_step": 302199, "epoch": 3640} {"train_loss": -25.85512351989746, "global_step": 302200, "epoch": 3640} {"train_loss": -25.9880428314209, "global_step": 302201, "epoch": 3640} {"train_loss": -25.204873556114105, "global_step": 302202, "epoch": 3640, "val_loss": 7221411.0} {"train_loss": -25.32356834411621, "global_step": 302203, "epoch": 3641} {"train_loss": -24.968751907348633, "global_step": 302204, "epoch": 3641} {"train_loss": -25.43825340270996, "global_step": 302205, "epoch": 3641} {"train_loss": -25.385303497314453, "global_step": 302206, "epoch": 3641} {"train_loss": -25.347562789916992, "global_step": 302207, "epoch": 3641} {"train_loss": -25.394163131713867, "global_step": 302208, "epoch": 3641} {"train_loss": -25.2587947845459, "global_step": 302209, "epoch": 3641} {"train_loss": -25.33578109741211, "global_step": 302210, "epoch": 3641} {"train_loss": -25.617874145507812, "global_step": 302211, "epoch": 3641} {"train_loss": -25.540178298950195, "global_step": 302212, "epoch": 3641} {"train_loss": -24.870811462402344, "global_step": 302213, "epoch": 3641} {"train_loss": -24.97775650024414, "global_step": 302214, "epoch": 3641} {"train_loss": -25.421594619750977, "global_step": 302215, "epoch": 3641} {"train_loss": -25.493947982788086, "global_step": 302216, "epoch": 3641} {"train_loss": -25.153209686279297, "global_step": 302217, "epoch": 3641} {"train_loss": -25.656347274780273, "global_step": 302218, "epoch": 3641} {"train_loss": -25.192596435546875, "global_step": 302219, "epoch": 3641} {"train_loss": -25.478368759155273, "global_step": 302220, "epoch": 3641} {"train_loss": -25.55109977722168, "global_step": 302221, "epoch": 3641} {"train_loss": -25.530317306518555, "global_step": 302222, "epoch": 3641} {"train_loss": -25.67099380493164, "global_step": 302223, "epoch": 3641} {"train_loss": -25.353361129760742, "global_step": 302224, "epoch": 3641} {"train_loss": -25.611011505126953, "global_step": 302225, "epoch": 3641} {"train_loss": -25.812665939331055, "global_step": 302226, "epoch": 3641} {"train_loss": -25.126480102539062, "global_step": 302227, "epoch": 3641} {"train_loss": -25.50762367248535, "global_step": 302228, "epoch": 3641} {"train_loss": -25.551599502563477, "global_step": 302229, "epoch": 3641} {"train_loss": -25.471601486206055, "global_step": 302230, "epoch": 3641} {"train_loss": -25.394657135009766, "global_step": 302231, "epoch": 3641} {"train_loss": -25.573837280273438, "global_step": 302232, "epoch": 3641} {"train_loss": -25.41019058227539, "global_step": 302233, "epoch": 3641} {"train_loss": -25.902393341064453, "global_step": 302234, "epoch": 3641} {"train_loss": -25.749134063720703, "global_step": 302235, "epoch": 3641} {"train_loss": -25.517822265625, "global_step": 302236, "epoch": 3641} {"train_loss": -25.46515464782715, "global_step": 302237, "epoch": 3641} {"train_loss": -25.44036293029785, "global_step": 302238, "epoch": 3641} {"train_loss": -25.53196144104004, "global_step": 302239, "epoch": 3641} {"train_loss": -25.758533477783203, "global_step": 302240, "epoch": 3641} {"train_loss": -25.289535522460938, "global_step": 302241, "epoch": 3641} {"train_loss": -25.42317771911621, "global_step": 302242, "epoch": 3641} {"train_loss": -25.48158073425293, "global_step": 302243, "epoch": 3641} {"train_loss": -25.601825714111328, "global_step": 302244, "epoch": 3641} {"train_loss": -25.523916244506836, "global_step": 302245, "epoch": 3641} {"train_loss": -25.160802841186523, "global_step": 302246, "epoch": 3641} {"train_loss": -25.359756469726562, "global_step": 302247, "epoch": 3641} {"train_loss": -25.45284080505371, "global_step": 302248, "epoch": 3641} {"train_loss": -25.43514060974121, "global_step": 302249, "epoch": 3641} {"train_loss": -25.804121017456055, "global_step": 302250, "epoch": 3641} {"train_loss": -25.652841567993164, "global_step": 302251, "epoch": 3641} {"train_loss": -25.674701690673828, "global_step": 302252, "epoch": 3641} {"train_loss": -25.889490127563477, "global_step": 302253, "epoch": 3641} {"train_loss": -25.745716094970703, "global_step": 302254, "epoch": 3641} {"train_loss": -25.985595703125, "global_step": 302255, "epoch": 3641} {"train_loss": -25.600727081298828, "global_step": 302256, "epoch": 3641} {"train_loss": -25.770360946655273, "global_step": 302257, "epoch": 3641} {"train_loss": -25.534236907958984, "global_step": 302258, "epoch": 3641} {"train_loss": -25.856582641601562, "global_step": 302259, "epoch": 3641} {"train_loss": -25.55885124206543, "global_step": 302260, "epoch": 3641} {"train_loss": -25.75837516784668, "global_step": 302261, "epoch": 3641} {"train_loss": -25.713546752929688, "global_step": 302262, "epoch": 3641} {"train_loss": -25.398775100708008, "global_step": 302263, "epoch": 3641} {"train_loss": -25.859607696533203, "global_step": 302264, "epoch": 3641} {"train_loss": -25.963144302368164, "global_step": 302265, "epoch": 3641} {"train_loss": -26.04026222229004, "global_step": 302266, "epoch": 3641} {"train_loss": -26.080957412719727, "global_step": 302267, "epoch": 3641} {"train_loss": -25.715662002563477, "global_step": 302268, "epoch": 3641} {"train_loss": -25.978046417236328, "global_step": 302269, "epoch": 3641} {"train_loss": -25.71799087524414, "global_step": 302270, "epoch": 3641} {"train_loss": -26.03240966796875, "global_step": 302271, "epoch": 3641} {"train_loss": -25.6660099029541, "global_step": 302272, "epoch": 3641} {"train_loss": -25.6683349609375, "global_step": 302273, "epoch": 3641} {"train_loss": -25.707080841064453, "global_step": 302274, "epoch": 3641} {"train_loss": -26.02265739440918, "global_step": 302275, "epoch": 3641} {"train_loss": -25.87339210510254, "global_step": 302276, "epoch": 3641} {"train_loss": -25.199872970581055, "global_step": 302277, "epoch": 3641} {"train_loss": -25.600629806518555, "global_step": 302278, "epoch": 3641} {"train_loss": -25.812055587768555, "global_step": 302279, "epoch": 3641} {"train_loss": -25.79294776916504, "global_step": 302280, "epoch": 3641} {"train_loss": -25.79595947265625, "global_step": 302281, "epoch": 3641} {"train_loss": -25.83062171936035, "global_step": 302282, "epoch": 3641} {"train_loss": -25.41360855102539, "global_step": 302283, "epoch": 3641} {"train_loss": -25.8057804107666, "global_step": 302284, "epoch": 3641} {"train_loss": -25.55688046834555, "global_step": 302285, "epoch": 3641, "val_loss": 7244354.0} {"train_loss": -25.290449142456055, "global_step": 302286, "epoch": 3642} {"train_loss": -25.09366226196289, "global_step": 302287, "epoch": 3642} {"train_loss": -25.084407806396484, "global_step": 302288, "epoch": 3642} {"train_loss": -24.723777770996094, "global_step": 302289, "epoch": 3642} {"train_loss": -25.387907028198242, "global_step": 302290, "epoch": 3642} {"train_loss": -25.15898895263672, "global_step": 302291, "epoch": 3642} {"train_loss": -24.90983009338379, "global_step": 302292, "epoch": 3642} {"train_loss": -24.949064254760742, "global_step": 302293, "epoch": 3642} {"train_loss": -25.8812198638916, "global_step": 302294, "epoch": 3642} {"train_loss": -25.06861686706543, "global_step": 302295, "epoch": 3642} {"train_loss": -24.832984924316406, "global_step": 302296, "epoch": 3642} {"train_loss": -25.388248443603516, "global_step": 302297, "epoch": 3642} {"train_loss": -25.100488662719727, "global_step": 302298, "epoch": 3642} {"train_loss": -24.984281539916992, "global_step": 302299, "epoch": 3642} {"train_loss": -25.313777923583984, "global_step": 302300, "epoch": 3642} {"train_loss": -25.34328269958496, "global_step": 302301, "epoch": 3642} {"train_loss": -25.9188289642334, "global_step": 302302, "epoch": 3642} {"train_loss": -25.45220375061035, "global_step": 302303, "epoch": 3642} {"train_loss": -25.318954467773438, "global_step": 302304, "epoch": 3642} {"train_loss": -25.533967971801758, "global_step": 302305, "epoch": 3642} {"train_loss": -25.284683227539062, "global_step": 302306, "epoch": 3642} {"train_loss": -25.532148361206055, "global_step": 302307, "epoch": 3642} {"train_loss": -25.372867584228516, "global_step": 302308, "epoch": 3642} {"train_loss": -25.67822265625, "global_step": 302309, "epoch": 3642} {"train_loss": -25.153852462768555, "global_step": 302310, "epoch": 3642} {"train_loss": -25.8361759185791, "global_step": 302311, "epoch": 3642} {"train_loss": -25.78915786743164, "global_step": 302312, "epoch": 3642} {"train_loss": -25.5123348236084, "global_step": 302313, "epoch": 3642} {"train_loss": -25.482778549194336, "global_step": 302314, "epoch": 3642} {"train_loss": -25.59433364868164, "global_step": 302315, "epoch": 3642} {"train_loss": -25.80873680114746, "global_step": 302316, "epoch": 3642} {"train_loss": -25.51309585571289, "global_step": 302317, "epoch": 3642} {"train_loss": -25.924819946289062, "global_step": 302318, "epoch": 3642} {"train_loss": -25.77540397644043, "global_step": 302319, "epoch": 3642} {"train_loss": -25.887287139892578, "global_step": 302320, "epoch": 3642} {"train_loss": -25.483659744262695, "global_step": 302321, "epoch": 3642} {"train_loss": -26.028120040893555, "global_step": 302322, "epoch": 3642} {"train_loss": -25.673574447631836, "global_step": 302323, "epoch": 3642} {"train_loss": -25.102100372314453, "global_step": 302324, "epoch": 3642} {"train_loss": -25.345212936401367, "global_step": 302325, "epoch": 3642} {"train_loss": -25.76338005065918, "global_step": 302326, "epoch": 3642} {"train_loss": -26.052906036376953, "global_step": 302327, "epoch": 3642} {"train_loss": -25.419692993164062, "global_step": 302328, "epoch": 3642} {"train_loss": -25.90087890625, "global_step": 302329, "epoch": 3642} {"train_loss": -25.631717681884766, "global_step": 302330, "epoch": 3642} {"train_loss": -25.72063636779785, "global_step": 302331, "epoch": 3642} {"train_loss": -26.05615234375, "global_step": 302332, "epoch": 3642} {"train_loss": -25.968372344970703, "global_step": 302333, "epoch": 3642} {"train_loss": -25.83674430847168, "global_step": 302334, "epoch": 3642} {"train_loss": -25.646020889282227, "global_step": 302335, "epoch": 3642} {"train_loss": -25.844867706298828, "global_step": 302336, "epoch": 3642} {"train_loss": -25.97796630859375, "global_step": 302337, "epoch": 3642} {"train_loss": -25.93906021118164, "global_step": 302338, "epoch": 3642} {"train_loss": -26.15866470336914, "global_step": 302339, "epoch": 3642} {"train_loss": -25.796646118164062, "global_step": 302340, "epoch": 3642} {"train_loss": -26.129241943359375, "global_step": 302341, "epoch": 3642} {"train_loss": -25.7142276763916, "global_step": 302342, "epoch": 3642} {"train_loss": -25.474775314331055, "global_step": 302343, "epoch": 3642} {"train_loss": -25.294315338134766, "global_step": 302344, "epoch": 3642} {"train_loss": -25.795080184936523, "global_step": 302345, "epoch": 3642} {"train_loss": -26.007734298706055, "global_step": 302346, "epoch": 3642} {"train_loss": -25.877573013305664, "global_step": 302347, "epoch": 3642} {"train_loss": -25.663175582885742, "global_step": 302348, "epoch": 3642} {"train_loss": -25.718381881713867, "global_step": 302349, "epoch": 3642} {"train_loss": -25.58810043334961, "global_step": 302350, "epoch": 3642} {"train_loss": -26.135913848876953, "global_step": 302351, "epoch": 3642} {"train_loss": -26.172901153564453, "global_step": 302352, "epoch": 3642} {"train_loss": -25.52257537841797, "global_step": 302353, "epoch": 3642} {"train_loss": -25.41355323791504, "global_step": 302354, "epoch": 3642} {"train_loss": -26.124195098876953, "global_step": 302355, "epoch": 3642} {"train_loss": -25.568288803100586, "global_step": 302356, "epoch": 3642} {"train_loss": -25.672515869140625, "global_step": 302357, "epoch": 3642} {"train_loss": -25.939748764038086, "global_step": 302358, "epoch": 3642} {"train_loss": -25.295717239379883, "global_step": 302359, "epoch": 3642} {"train_loss": -25.6518611907959, "global_step": 302360, "epoch": 3642} {"train_loss": -25.71577262878418, "global_step": 302361, "epoch": 3642} {"train_loss": -25.976545333862305, "global_step": 302362, "epoch": 3642} {"train_loss": -26.069812774658203, "global_step": 302363, "epoch": 3642} {"train_loss": -25.63221549987793, "global_step": 302364, "epoch": 3642} {"train_loss": -25.669748306274414, "global_step": 302365, "epoch": 3642} {"train_loss": -25.489927291870117, "global_step": 302366, "epoch": 3642} {"train_loss": -25.61875343322754, "global_step": 302367, "epoch": 3642} {"train_loss": -25.604406241911004, "global_step": 302368, "epoch": 3642, "val_loss": 7236591.0} {"train_loss": -25.046579360961914, "global_step": 302369, "epoch": 3643} {"train_loss": -24.474889755249023, "global_step": 302370, "epoch": 3643} {"train_loss": -23.69434928894043, "global_step": 302371, "epoch": 3643} {"train_loss": -25.10996437072754, "global_step": 302372, "epoch": 3643} {"train_loss": -25.342660903930664, "global_step": 302373, "epoch": 3643} {"train_loss": -25.065305709838867, "global_step": 302374, "epoch": 3643} {"train_loss": -24.891284942626953, "global_step": 302375, "epoch": 3643} {"train_loss": -24.694599151611328, "global_step": 302376, "epoch": 3643} {"train_loss": -25.382108688354492, "global_step": 302377, "epoch": 3643} {"train_loss": -25.184865951538086, "global_step": 302378, "epoch": 3643} {"train_loss": -25.230031967163086, "global_step": 302379, "epoch": 3643} {"train_loss": -25.291501998901367, "global_step": 302380, "epoch": 3643} {"train_loss": -24.861886978149414, "global_step": 302381, "epoch": 3643} {"train_loss": -25.316911697387695, "global_step": 302382, "epoch": 3643} {"train_loss": -25.27223014831543, "global_step": 302383, "epoch": 3643} {"train_loss": -25.394031524658203, "global_step": 302384, "epoch": 3643} {"train_loss": -25.01197624206543, "global_step": 302385, "epoch": 3643} {"train_loss": -25.14575958251953, "global_step": 302386, "epoch": 3643} {"train_loss": -25.545690536499023, "global_step": 302387, "epoch": 3643} {"train_loss": -25.450963973999023, "global_step": 302388, "epoch": 3643} {"train_loss": -25.235870361328125, "global_step": 302389, "epoch": 3643} {"train_loss": -24.995290756225586, "global_step": 302390, "epoch": 3643} {"train_loss": -25.03603172302246, "global_step": 302391, "epoch": 3643} {"train_loss": -25.743040084838867, "global_step": 302392, "epoch": 3643} {"train_loss": -25.507556915283203, "global_step": 302393, "epoch": 3643} {"train_loss": -25.32292938232422, "global_step": 302394, "epoch": 3643} {"train_loss": -25.626895904541016, "global_step": 302395, "epoch": 3643} {"train_loss": -25.757909774780273, "global_step": 302396, "epoch": 3643} {"train_loss": -25.810544967651367, "global_step": 302397, "epoch": 3643} {"train_loss": -25.662153244018555, "global_step": 302398, "epoch": 3643} {"train_loss": -25.500274658203125, "global_step": 302399, "epoch": 3643} {"train_loss": -25.733930587768555, "global_step": 302400, "epoch": 3643} {"train_loss": -25.8593807220459, "global_step": 302401, "epoch": 3643} {"train_loss": -25.581636428833008, "global_step": 302402, "epoch": 3643} {"train_loss": -25.876834869384766, "global_step": 302403, "epoch": 3643} {"train_loss": -25.530603408813477, "global_step": 302404, "epoch": 3643} {"train_loss": -25.74940299987793, "global_step": 302405, "epoch": 3643} {"train_loss": -25.843475341796875, "global_step": 302406, "epoch": 3643} {"train_loss": -26.136474609375, "global_step": 302407, "epoch": 3643} {"train_loss": -26.300634384155273, "global_step": 302408, "epoch": 3643} {"train_loss": -25.772912979125977, "global_step": 302409, "epoch": 3643} {"train_loss": -25.478239059448242, "global_step": 302410, "epoch": 3643} {"train_loss": -25.920276641845703, "global_step": 302411, "epoch": 3643} {"train_loss": -25.544200897216797, "global_step": 302412, "epoch": 3643} {"train_loss": -25.752212524414062, "global_step": 302413, "epoch": 3643} {"train_loss": -26.092893600463867, "global_step": 302414, "epoch": 3643} {"train_loss": -25.232040405273438, "global_step": 302415, "epoch": 3643} {"train_loss": -25.611474990844727, "global_step": 302416, "epoch": 3643} {"train_loss": -25.51352310180664, "global_step": 302417, "epoch": 3643} {"train_loss": -25.986297607421875, "global_step": 302418, "epoch": 3643} {"train_loss": -25.855268478393555, "global_step": 302419, "epoch": 3643} {"train_loss": -26.190692901611328, "global_step": 302420, "epoch": 3643} {"train_loss": -25.58846092224121, "global_step": 302421, "epoch": 3643} {"train_loss": -25.924549102783203, "global_step": 302422, "epoch": 3643} {"train_loss": -25.774038314819336, "global_step": 302423, "epoch": 3643} {"train_loss": -25.714025497436523, "global_step": 302424, "epoch": 3643} {"train_loss": -25.86334800720215, "global_step": 302425, "epoch": 3643} {"train_loss": -25.55885887145996, "global_step": 302426, "epoch": 3643} {"train_loss": -25.80475425720215, "global_step": 302427, "epoch": 3643} {"train_loss": -25.549270629882812, "global_step": 302428, "epoch": 3643} {"train_loss": -25.91114616394043, "global_step": 302429, "epoch": 3643} {"train_loss": -25.889068603515625, "global_step": 302430, "epoch": 3643} {"train_loss": -25.619953155517578, "global_step": 302431, "epoch": 3643} {"train_loss": -25.891494750976562, "global_step": 302432, "epoch": 3643} {"train_loss": -26.025165557861328, "global_step": 302433, "epoch": 3643} {"train_loss": -25.71188735961914, "global_step": 302434, "epoch": 3643} {"train_loss": -25.400753021240234, "global_step": 302435, "epoch": 3643} {"train_loss": -25.726898193359375, "global_step": 302436, "epoch": 3643} {"train_loss": -25.69367027282715, "global_step": 302437, "epoch": 3643} {"train_loss": -25.998489379882812, "global_step": 302438, "epoch": 3643} {"train_loss": -25.724445343017578, "global_step": 302439, "epoch": 3643} {"train_loss": -25.691303253173828, "global_step": 302440, "epoch": 3643} {"train_loss": -25.666807174682617, "global_step": 302441, "epoch": 3643} {"train_loss": -25.444936752319336, "global_step": 302442, "epoch": 3643} {"train_loss": -25.843276977539062, "global_step": 302443, "epoch": 3643} {"train_loss": -25.567548751831055, "global_step": 302444, "epoch": 3643} {"train_loss": -25.73811149597168, "global_step": 302445, "epoch": 3643} {"train_loss": -25.68536376953125, "global_step": 302446, "epoch": 3643} {"train_loss": -25.557723999023438, "global_step": 302447, "epoch": 3643} {"train_loss": -25.74843406677246, "global_step": 302448, "epoch": 3643} {"train_loss": -25.723913192749023, "global_step": 302449, "epoch": 3643} {"train_loss": -25.802265167236328, "global_step": 302450, "epoch": 3643} {"train_loss": -25.57072294763772, "global_step": 302451, "epoch": 3643, "val_loss": 7286671.0} {"train_loss": -25.131561279296875, "global_step": 302452, "epoch": 3644} {"train_loss": -24.460859298706055, "global_step": 302453, "epoch": 3644} {"train_loss": -24.951496124267578, "global_step": 302454, "epoch": 3644} {"train_loss": -24.793224334716797, "global_step": 302455, "epoch": 3644} {"train_loss": -24.582843780517578, "global_step": 302456, "epoch": 3644} {"train_loss": -24.592496871948242, "global_step": 302457, "epoch": 3644} {"train_loss": -25.70674705505371, "global_step": 302458, "epoch": 3644} {"train_loss": -25.113889694213867, "global_step": 302459, "epoch": 3644} {"train_loss": -24.928211212158203, "global_step": 302460, "epoch": 3644} {"train_loss": -25.686084747314453, "global_step": 302461, "epoch": 3644} {"train_loss": -24.666641235351562, "global_step": 302462, "epoch": 3644} {"train_loss": -25.352523803710938, "global_step": 302463, "epoch": 3644} {"train_loss": -24.950836181640625, "global_step": 302464, "epoch": 3644} {"train_loss": -25.32415771484375, "global_step": 302465, "epoch": 3644} {"train_loss": -25.48317527770996, "global_step": 302466, "epoch": 3644} {"train_loss": -25.584684371948242, "global_step": 302467, "epoch": 3644} {"train_loss": -25.453847885131836, "global_step": 302468, "epoch": 3644} {"train_loss": -25.220190048217773, "global_step": 302469, "epoch": 3644} {"train_loss": -25.328399658203125, "global_step": 302470, "epoch": 3644} {"train_loss": -25.451040267944336, "global_step": 302471, "epoch": 3644} {"train_loss": -25.2943172454834, "global_step": 302472, "epoch": 3644} {"train_loss": -25.537607192993164, "global_step": 302473, "epoch": 3644} {"train_loss": -25.523208618164062, "global_step": 302474, "epoch": 3644} {"train_loss": -25.742185592651367, "global_step": 302475, "epoch": 3644} {"train_loss": -25.577787399291992, "global_step": 302476, "epoch": 3644} {"train_loss": -25.485197067260742, "global_step": 302477, "epoch": 3644} {"train_loss": -25.63918113708496, "global_step": 302478, "epoch": 3644} {"train_loss": -25.8422794342041, "global_step": 302479, "epoch": 3644} {"train_loss": -25.254117965698242, "global_step": 302480, "epoch": 3644} {"train_loss": -25.589513778686523, "global_step": 302481, "epoch": 3644} {"train_loss": -25.509403228759766, "global_step": 302482, "epoch": 3644} {"train_loss": -25.672794342041016, "global_step": 302483, "epoch": 3644} {"train_loss": -26.19668960571289, "global_step": 302484, "epoch": 3644} {"train_loss": -26.024396896362305, "global_step": 302485, "epoch": 3644} {"train_loss": -25.91986656188965, "global_step": 302486, "epoch": 3644} {"train_loss": -25.61517333984375, "global_step": 302487, "epoch": 3644} {"train_loss": -25.825809478759766, "global_step": 302488, "epoch": 3644} {"train_loss": -26.16257095336914, "global_step": 302489, "epoch": 3644} {"train_loss": -25.54817008972168, "global_step": 302490, "epoch": 3644} {"train_loss": -25.6534481048584, "global_step": 302491, "epoch": 3644} {"train_loss": -25.791976928710938, "global_step": 302492, "epoch": 3644} {"train_loss": -25.55733299255371, "global_step": 302493, "epoch": 3644} {"train_loss": -25.907745361328125, "global_step": 302494, "epoch": 3644} {"train_loss": -25.513648986816406, "global_step": 302495, "epoch": 3644} {"train_loss": -25.409210205078125, "global_step": 302496, "epoch": 3644} {"train_loss": -25.895034790039062, "global_step": 302497, "epoch": 3644} {"train_loss": -25.22964096069336, "global_step": 302498, "epoch": 3644} {"train_loss": -25.87822914123535, "global_step": 302499, "epoch": 3644} {"train_loss": -25.817169189453125, "global_step": 302500, "epoch": 3644} {"train_loss": -25.712982177734375, "global_step": 302501, "epoch": 3644} {"train_loss": -25.736408233642578, "global_step": 302502, "epoch": 3644} {"train_loss": -25.968891143798828, "global_step": 302503, "epoch": 3644} {"train_loss": -25.12153434753418, "global_step": 302504, "epoch": 3644} {"train_loss": -25.789321899414062, "global_step": 302505, "epoch": 3644} {"train_loss": -25.747922897338867, "global_step": 302506, "epoch": 3644} {"train_loss": -25.899999618530273, "global_step": 302507, "epoch": 3644} {"train_loss": -25.776777267456055, "global_step": 302508, "epoch": 3644} {"train_loss": -25.834814071655273, "global_step": 302509, "epoch": 3644} {"train_loss": -25.687591552734375, "global_step": 302510, "epoch": 3644} {"train_loss": -25.837820053100586, "global_step": 302511, "epoch": 3644} {"train_loss": -25.368871688842773, "global_step": 302512, "epoch": 3644} {"train_loss": -25.516035079956055, "global_step": 302513, "epoch": 3644} {"train_loss": -25.61440086364746, "global_step": 302514, "epoch": 3644} {"train_loss": -25.75324821472168, "global_step": 302515, "epoch": 3644} {"train_loss": -25.7651309967041, "global_step": 302516, "epoch": 3644} {"train_loss": -25.673105239868164, "global_step": 302517, "epoch": 3644} {"train_loss": -25.451250076293945, "global_step": 302518, "epoch": 3644} {"train_loss": -25.637842178344727, "global_step": 302519, "epoch": 3644} {"train_loss": -25.560108184814453, "global_step": 302520, "epoch": 3644} {"train_loss": -25.546493530273438, "global_step": 302521, "epoch": 3644} {"train_loss": -25.293272018432617, "global_step": 302522, "epoch": 3644} {"train_loss": -25.48723602294922, "global_step": 302523, "epoch": 3644} {"train_loss": -25.962446212768555, "global_step": 302524, "epoch": 3644} {"train_loss": -25.64447593688965, "global_step": 302525, "epoch": 3644} {"train_loss": -25.817340850830078, "global_step": 302526, "epoch": 3644} {"train_loss": -25.915363311767578, "global_step": 302527, "epoch": 3644} {"train_loss": -25.65174674987793, "global_step": 302528, "epoch": 3644} {"train_loss": -25.640140533447266, "global_step": 302529, "epoch": 3644} {"train_loss": -25.870471954345703, "global_step": 302530, "epoch": 3644} {"train_loss": -25.526668548583984, "global_step": 302531, "epoch": 3644} {"train_loss": -25.793237686157227, "global_step": 302532, "epoch": 3644} {"train_loss": -25.56322479248047, "global_step": 302533, "epoch": 3644} {"train_loss": -25.536255756056452, "global_step": 302534, "epoch": 3644, "val_loss": 7132102.0} {"train_loss": -25.01845359802246, "global_step": 302535, "epoch": 3645} {"train_loss": -24.85711669921875, "global_step": 302536, "epoch": 3645} {"train_loss": -24.480558395385742, "global_step": 302537, "epoch": 3645} {"train_loss": -25.070756912231445, "global_step": 302538, "epoch": 3645} {"train_loss": -25.07923126220703, "global_step": 302539, "epoch": 3645} {"train_loss": -25.237165451049805, "global_step": 302540, "epoch": 3645} {"train_loss": -24.953983306884766, "global_step": 302541, "epoch": 3645} {"train_loss": -25.244674682617188, "global_step": 302542, "epoch": 3645} {"train_loss": -24.919485092163086, "global_step": 302543, "epoch": 3645} {"train_loss": -25.171194076538086, "global_step": 302544, "epoch": 3645} {"train_loss": -25.153778076171875, "global_step": 302545, "epoch": 3645} {"train_loss": -24.573856353759766, "global_step": 302546, "epoch": 3645} {"train_loss": -25.238859176635742, "global_step": 302547, "epoch": 3645} {"train_loss": -24.816884994506836, "global_step": 302548, "epoch": 3645} {"train_loss": -25.417194366455078, "global_step": 302549, "epoch": 3645} {"train_loss": -25.162391662597656, "global_step": 302550, "epoch": 3645} {"train_loss": -25.333280563354492, "global_step": 302551, "epoch": 3645} {"train_loss": -24.705358505249023, "global_step": 302552, "epoch": 3645} {"train_loss": -25.573423385620117, "global_step": 302553, "epoch": 3645} {"train_loss": -25.804523468017578, "global_step": 302554, "epoch": 3645} {"train_loss": -25.482099533081055, "global_step": 302555, "epoch": 3645} {"train_loss": -25.6326961517334, "global_step": 302556, "epoch": 3645} {"train_loss": -24.990562438964844, "global_step": 302557, "epoch": 3645} {"train_loss": -25.167640686035156, "global_step": 302558, "epoch": 3645} {"train_loss": -25.373350143432617, "global_step": 302559, "epoch": 3645} {"train_loss": -25.53476333618164, "global_step": 302560, "epoch": 3645} {"train_loss": -25.214086532592773, "global_step": 302561, "epoch": 3645} {"train_loss": -25.55141830444336, "global_step": 302562, "epoch": 3645} {"train_loss": -25.566797256469727, "global_step": 302563, "epoch": 3645} {"train_loss": -25.56971549987793, "global_step": 302564, "epoch": 3645} {"train_loss": -25.395687103271484, "global_step": 302565, "epoch": 3645} {"train_loss": -25.619537353515625, "global_step": 302566, "epoch": 3645} {"train_loss": -25.673603057861328, "global_step": 302567, "epoch": 3645} {"train_loss": -25.5305233001709, "global_step": 302568, "epoch": 3645} {"train_loss": -25.168848037719727, "global_step": 302569, "epoch": 3645} {"train_loss": -25.870969772338867, "global_step": 302570, "epoch": 3645} {"train_loss": -25.528779983520508, "global_step": 302571, "epoch": 3645} {"train_loss": -25.5412654876709, "global_step": 302572, "epoch": 3645} {"train_loss": -25.76194190979004, "global_step": 302573, "epoch": 3645} {"train_loss": -25.820981979370117, "global_step": 302574, "epoch": 3645} {"train_loss": -25.483823776245117, "global_step": 302575, "epoch": 3645} {"train_loss": -25.86623191833496, "global_step": 302576, "epoch": 3645} {"train_loss": -25.90846061706543, "global_step": 302577, "epoch": 3645} {"train_loss": -25.907133102416992, "global_step": 302578, "epoch": 3645} {"train_loss": -25.71164894104004, "global_step": 302579, "epoch": 3645} {"train_loss": -26.159900665283203, "global_step": 302580, "epoch": 3645} {"train_loss": -26.023624420166016, "global_step": 302581, "epoch": 3645} {"train_loss": -25.486642837524414, "global_step": 302582, "epoch": 3645} {"train_loss": -26.025991439819336, "global_step": 302583, "epoch": 3645} {"train_loss": -25.676050186157227, "global_step": 302584, "epoch": 3645} {"train_loss": -25.79536247253418, "global_step": 302585, "epoch": 3645} {"train_loss": -25.927474975585938, "global_step": 302586, "epoch": 3645} {"train_loss": -25.98102378845215, "global_step": 302587, "epoch": 3645} {"train_loss": -25.919116973876953, "global_step": 302588, "epoch": 3645} {"train_loss": -26.09405517578125, "global_step": 302589, "epoch": 3645} {"train_loss": -25.372406005859375, "global_step": 302590, "epoch": 3645} {"train_loss": -25.958471298217773, "global_step": 302591, "epoch": 3645} {"train_loss": -25.941883087158203, "global_step": 302592, "epoch": 3645} {"train_loss": -25.905797958374023, "global_step": 302593, "epoch": 3645} {"train_loss": -25.668542861938477, "global_step": 302594, "epoch": 3645} {"train_loss": -25.9183349609375, "global_step": 302595, "epoch": 3645} {"train_loss": -25.80598258972168, "global_step": 302596, "epoch": 3645} {"train_loss": -25.821491241455078, "global_step": 302597, "epoch": 3645} {"train_loss": -25.787418365478516, "global_step": 302598, "epoch": 3645} {"train_loss": -25.90394401550293, "global_step": 302599, "epoch": 3645} {"train_loss": -25.66969871520996, "global_step": 302600, "epoch": 3645} {"train_loss": -25.961170196533203, "global_step": 302601, "epoch": 3645} {"train_loss": -25.9084415435791, "global_step": 302602, "epoch": 3645} {"train_loss": -25.698339462280273, "global_step": 302603, "epoch": 3645} {"train_loss": -25.672718048095703, "global_step": 302604, "epoch": 3645} {"train_loss": -25.89240074157715, "global_step": 302605, "epoch": 3645} {"train_loss": -25.836095809936523, "global_step": 302606, "epoch": 3645} {"train_loss": -25.448537826538086, "global_step": 302607, "epoch": 3645} {"train_loss": -25.837263107299805, "global_step": 302608, "epoch": 3645} {"train_loss": -26.00823974609375, "global_step": 302609, "epoch": 3645} {"train_loss": -25.462148666381836, "global_step": 302610, "epoch": 3645} {"train_loss": -25.52178192138672, "global_step": 302611, "epoch": 3645} {"train_loss": -25.119083404541016, "global_step": 302612, "epoch": 3645} {"train_loss": -24.78384780883789, "global_step": 302613, "epoch": 3645} {"train_loss": -25.217954635620117, "global_step": 302614, "epoch": 3645} {"train_loss": -25.27052879333496, "global_step": 302615, "epoch": 3645} {"train_loss": -25.630573272705078, "global_step": 302616, "epoch": 3645} {"train_loss": -25.539533155510224, "global_step": 302617, "epoch": 3645, "val_loss": 7209594.0} {"train_loss": -22.042314529418945, "global_step": 302618, "epoch": 3646} {"train_loss": -23.921491622924805, "global_step": 302619, "epoch": 3646} {"train_loss": -23.346296310424805, "global_step": 302620, "epoch": 3646} {"train_loss": -23.983083724975586, "global_step": 302621, "epoch": 3646} {"train_loss": -24.28891372680664, "global_step": 302622, "epoch": 3646} {"train_loss": -24.5101375579834, "global_step": 302623, "epoch": 3646} {"train_loss": -24.348764419555664, "global_step": 302624, "epoch": 3646} {"train_loss": -24.605329513549805, "global_step": 302625, "epoch": 3646} {"train_loss": -24.106571197509766, "global_step": 302626, "epoch": 3646} {"train_loss": -25.00517463684082, "global_step": 302627, "epoch": 3646} {"train_loss": -24.430055618286133, "global_step": 302628, "epoch": 3646} {"train_loss": -24.620487213134766, "global_step": 302629, "epoch": 3646} {"train_loss": -24.922449111938477, "global_step": 302630, "epoch": 3646} {"train_loss": -24.78514289855957, "global_step": 302631, "epoch": 3646} {"train_loss": -24.6165828704834, "global_step": 302632, "epoch": 3646} {"train_loss": -24.441099166870117, "global_step": 302633, "epoch": 3646} {"train_loss": -24.776752471923828, "global_step": 302634, "epoch": 3646} {"train_loss": -25.154706954956055, "global_step": 302635, "epoch": 3646} {"train_loss": -25.03226661682129, "global_step": 302636, "epoch": 3646} {"train_loss": -24.760330200195312, "global_step": 302637, "epoch": 3646} {"train_loss": -25.073877334594727, "global_step": 302638, "epoch": 3646} {"train_loss": -25.273181915283203, "global_step": 302639, "epoch": 3646} {"train_loss": -25.353357315063477, "global_step": 302640, "epoch": 3646} {"train_loss": -24.78693199157715, "global_step": 302641, "epoch": 3646} {"train_loss": -25.35126495361328, "global_step": 302642, "epoch": 3646} {"train_loss": -25.099489212036133, "global_step": 302643, "epoch": 3646} {"train_loss": -25.17781639099121, "global_step": 302644, "epoch": 3646} {"train_loss": -25.28544044494629, "global_step": 302645, "epoch": 3646} {"train_loss": -25.623464584350586, "global_step": 302646, "epoch": 3646} {"train_loss": -25.551254272460938, "global_step": 302647, "epoch": 3646} {"train_loss": -25.562345504760742, "global_step": 302648, "epoch": 3646} {"train_loss": -25.553802490234375, "global_step": 302649, "epoch": 3646} {"train_loss": -25.575773239135742, "global_step": 302650, "epoch": 3646} {"train_loss": -25.296401977539062, "global_step": 302651, "epoch": 3646} {"train_loss": -25.233362197875977, "global_step": 302652, "epoch": 3646} {"train_loss": -25.450050354003906, "global_step": 302653, "epoch": 3646} {"train_loss": -25.753406524658203, "global_step": 302654, "epoch": 3646} {"train_loss": -25.756956100463867, "global_step": 302655, "epoch": 3646} {"train_loss": -25.66336441040039, "global_step": 302656, "epoch": 3646} {"train_loss": -25.7930965423584, "global_step": 302657, "epoch": 3646} {"train_loss": -25.767114639282227, "global_step": 302658, "epoch": 3646} {"train_loss": -25.4591007232666, "global_step": 302659, "epoch": 3646} {"train_loss": -25.200925827026367, "global_step": 302660, "epoch": 3646} {"train_loss": -25.709348678588867, "global_step": 302661, "epoch": 3646} {"train_loss": -25.377124786376953, "global_step": 302662, "epoch": 3646} {"train_loss": -25.525415420532227, "global_step": 302663, "epoch": 3646} {"train_loss": -25.851348876953125, "global_step": 302664, "epoch": 3646} {"train_loss": -25.683643341064453, "global_step": 302665, "epoch": 3646} {"train_loss": -25.621896743774414, "global_step": 302666, "epoch": 3646} {"train_loss": -25.631153106689453, "global_step": 302667, "epoch": 3646} {"train_loss": -25.8006649017334, "global_step": 302668, "epoch": 3646} {"train_loss": -25.4586124420166, "global_step": 302669, "epoch": 3646} {"train_loss": -25.51790428161621, "global_step": 302670, "epoch": 3646} {"train_loss": -25.878162384033203, "global_step": 302671, "epoch": 3646} {"train_loss": -25.801801681518555, "global_step": 302672, "epoch": 3646} {"train_loss": -25.825307846069336, "global_step": 302673, "epoch": 3646} {"train_loss": -25.675983428955078, "global_step": 302674, "epoch": 3646} {"train_loss": -25.650150299072266, "global_step": 302675, "epoch": 3646} {"train_loss": -25.710607528686523, "global_step": 302676, "epoch": 3646} {"train_loss": -25.515209197998047, "global_step": 302677, "epoch": 3646} {"train_loss": -25.875843048095703, "global_step": 302678, "epoch": 3646} {"train_loss": -25.80141258239746, "global_step": 302679, "epoch": 3646} {"train_loss": -25.704181671142578, "global_step": 302680, "epoch": 3646} {"train_loss": -25.38054847717285, "global_step": 302681, "epoch": 3646} {"train_loss": -25.858291625976562, "global_step": 302682, "epoch": 3646} {"train_loss": -25.526748657226562, "global_step": 302683, "epoch": 3646} {"train_loss": -25.827960968017578, "global_step": 302684, "epoch": 3646} {"train_loss": -25.657669067382812, "global_step": 302685, "epoch": 3646} {"train_loss": -25.78021812438965, "global_step": 302686, "epoch": 3646} {"train_loss": -25.681806564331055, "global_step": 302687, "epoch": 3646} {"train_loss": -26.08022117614746, "global_step": 302688, "epoch": 3646} {"train_loss": -25.363767623901367, "global_step": 302689, "epoch": 3646} {"train_loss": -25.456892013549805, "global_step": 302690, "epoch": 3646} {"train_loss": -25.575698852539062, "global_step": 302691, "epoch": 3646} {"train_loss": -25.5515193939209, "global_step": 302692, "epoch": 3646} {"train_loss": -25.600391387939453, "global_step": 302693, "epoch": 3646} {"train_loss": -25.96199607849121, "global_step": 302694, "epoch": 3646} {"train_loss": -25.567913055419922, "global_step": 302695, "epoch": 3646} {"train_loss": -25.232423782348633, "global_step": 302696, "epoch": 3646} {"train_loss": -25.512611389160156, "global_step": 302697, "epoch": 3646} {"train_loss": -25.702966690063477, "global_step": 302698, "epoch": 3646} {"train_loss": -25.8067569732666, "global_step": 302699, "epoch": 3646} {"train_loss": -25.295675990093184, "global_step": 302700, "epoch": 3646, "val_loss": 7197013.0} {"train_loss": -25.49711036682129, "global_step": 302701, "epoch": 3647} {"train_loss": -25.133020401000977, "global_step": 302702, "epoch": 3647} {"train_loss": -25.369783401489258, "global_step": 302703, "epoch": 3647} {"train_loss": -25.219266891479492, "global_step": 302704, "epoch": 3647} {"train_loss": -25.574384689331055, "global_step": 302705, "epoch": 3647} {"train_loss": -25.913440704345703, "global_step": 302706, "epoch": 3647} {"train_loss": -25.394145965576172, "global_step": 302707, "epoch": 3647} {"train_loss": -25.281005859375, "global_step": 302708, "epoch": 3647} {"train_loss": -25.00998306274414, "global_step": 302709, "epoch": 3647} {"train_loss": -25.8294734954834, "global_step": 302710, "epoch": 3647} {"train_loss": -24.962772369384766, "global_step": 302711, "epoch": 3647} {"train_loss": -25.486879348754883, "global_step": 302712, "epoch": 3647} {"train_loss": -25.390911102294922, "global_step": 302713, "epoch": 3647} {"train_loss": -25.633813858032227, "global_step": 302714, "epoch": 3647} {"train_loss": -25.918811798095703, "global_step": 302715, "epoch": 3647} {"train_loss": -24.815073013305664, "global_step": 302716, "epoch": 3647} {"train_loss": -25.200149536132812, "global_step": 302717, "epoch": 3647} {"train_loss": -25.371612548828125, "global_step": 302718, "epoch": 3647} {"train_loss": -25.393903732299805, "global_step": 302719, "epoch": 3647} {"train_loss": -25.438161849975586, "global_step": 302720, "epoch": 3647} {"train_loss": -25.72503662109375, "global_step": 302721, "epoch": 3647} {"train_loss": -25.583698272705078, "global_step": 302722, "epoch": 3647} {"train_loss": -25.35915184020996, "global_step": 302723, "epoch": 3647} {"train_loss": -25.548017501831055, "global_step": 302724, "epoch": 3647} {"train_loss": -25.6009464263916, "global_step": 302725, "epoch": 3647} {"train_loss": -25.45503807067871, "global_step": 302726, "epoch": 3647} {"train_loss": -25.497461318969727, "global_step": 302727, "epoch": 3647} {"train_loss": -25.986255645751953, "global_step": 302728, "epoch": 3647} {"train_loss": -25.55072021484375, "global_step": 302729, "epoch": 3647} {"train_loss": -25.65021324157715, "global_step": 302730, "epoch": 3647} {"train_loss": -25.56385612487793, "global_step": 302731, "epoch": 3647} {"train_loss": -26.141769409179688, "global_step": 302732, "epoch": 3647} {"train_loss": -25.713764190673828, "global_step": 302733, "epoch": 3647} {"train_loss": -25.684921264648438, "global_step": 302734, "epoch": 3647} {"train_loss": -25.654394149780273, "global_step": 302735, "epoch": 3647} {"train_loss": -25.7135009765625, "global_step": 302736, "epoch": 3647} {"train_loss": -25.90155601501465, "global_step": 302737, "epoch": 3647} {"train_loss": -25.8989200592041, "global_step": 302738, "epoch": 3647} {"train_loss": -26.057159423828125, "global_step": 302739, "epoch": 3647} {"train_loss": -25.585569381713867, "global_step": 302740, "epoch": 3647} {"train_loss": -25.844196319580078, "global_step": 302741, "epoch": 3647} {"train_loss": -26.045318603515625, "global_step": 302742, "epoch": 3647} {"train_loss": -25.151844024658203, "global_step": 302743, "epoch": 3647} {"train_loss": -25.533096313476562, "global_step": 302744, "epoch": 3647} {"train_loss": -25.57648277282715, "global_step": 302745, "epoch": 3647} {"train_loss": -25.306108474731445, "global_step": 302746, "epoch": 3647} {"train_loss": -25.84296989440918, "global_step": 302747, "epoch": 3647} {"train_loss": -25.67986488342285, "global_step": 302748, "epoch": 3647} {"train_loss": -26.189123153686523, "global_step": 302749, "epoch": 3647} {"train_loss": -26.006916046142578, "global_step": 302750, "epoch": 3647} {"train_loss": -25.56216812133789, "global_step": 302751, "epoch": 3647} {"train_loss": -26.05324363708496, "global_step": 302752, "epoch": 3647} {"train_loss": -25.708486557006836, "global_step": 302753, "epoch": 3647} {"train_loss": -25.631616592407227, "global_step": 302754, "epoch": 3647} {"train_loss": -24.98413848876953, "global_step": 302755, "epoch": 3647} {"train_loss": -25.897974014282227, "global_step": 302756, "epoch": 3647} {"train_loss": -25.48598289489746, "global_step": 302757, "epoch": 3647} {"train_loss": -25.528200149536133, "global_step": 302758, "epoch": 3647} {"train_loss": -25.221769332885742, "global_step": 302759, "epoch": 3647} {"train_loss": -25.728626251220703, "global_step": 302760, "epoch": 3647} {"train_loss": -25.8559513092041, "global_step": 302761, "epoch": 3647} {"train_loss": -25.619436264038086, "global_step": 302762, "epoch": 3647} {"train_loss": -25.663488388061523, "global_step": 302763, "epoch": 3647} {"train_loss": -25.731708526611328, "global_step": 302764, "epoch": 3647} {"train_loss": -25.710620880126953, "global_step": 302765, "epoch": 3647} {"train_loss": -25.46062469482422, "global_step": 302766, "epoch": 3647} {"train_loss": -25.84807777404785, "global_step": 302767, "epoch": 3647} {"train_loss": -25.703256607055664, "global_step": 302768, "epoch": 3647} {"train_loss": -25.424428939819336, "global_step": 302769, "epoch": 3647} {"train_loss": -26.363534927368164, "global_step": 302770, "epoch": 3647} {"train_loss": -26.182209014892578, "global_step": 302771, "epoch": 3647} {"train_loss": -25.6442813873291, "global_step": 302772, "epoch": 3647} {"train_loss": -25.7768497467041, "global_step": 302773, "epoch": 3647} {"train_loss": -26.048904418945312, "global_step": 302774, "epoch": 3647} {"train_loss": -26.157766342163086, "global_step": 302775, "epoch": 3647} {"train_loss": -25.69471549987793, "global_step": 302776, "epoch": 3647} {"train_loss": -25.97052001953125, "global_step": 302777, "epoch": 3647} {"train_loss": -25.860883712768555, "global_step": 302778, "epoch": 3647} {"train_loss": -25.787830352783203, "global_step": 302779, "epoch": 3647} {"train_loss": -25.983396530151367, "global_step": 302780, "epoch": 3647} {"train_loss": -25.697126388549805, "global_step": 302781, "epoch": 3647} {"train_loss": -25.906885147094727, "global_step": 302782, "epoch": 3647} {"train_loss": -25.63991195035268, "global_step": 302783, "epoch": 3647, "val_loss": 7284916.5} {"train_loss": -23.599889755249023, "global_step": 302784, "epoch": 3648} {"train_loss": -22.51025390625, "global_step": 302785, "epoch": 3648} {"train_loss": -25.000896453857422, "global_step": 302786, "epoch": 3648} {"train_loss": -23.159456253051758, "global_step": 302787, "epoch": 3648} {"train_loss": -24.72015953063965, "global_step": 302788, "epoch": 3648} {"train_loss": -23.659780502319336, "global_step": 302789, "epoch": 3648} {"train_loss": -24.349044799804688, "global_step": 302790, "epoch": 3648} {"train_loss": -24.169530868530273, "global_step": 302791, "epoch": 3648} {"train_loss": -24.171361923217773, "global_step": 302792, "epoch": 3648} {"train_loss": -24.92860984802246, "global_step": 302793, "epoch": 3648} {"train_loss": -24.666418075561523, "global_step": 302794, "epoch": 3648} {"train_loss": -24.6999568939209, "global_step": 302795, "epoch": 3648} {"train_loss": -24.697988510131836, "global_step": 302796, "epoch": 3648} {"train_loss": -25.639923095703125, "global_step": 302797, "epoch": 3648} {"train_loss": -24.74799919128418, "global_step": 302798, "epoch": 3648} {"train_loss": -25.098003387451172, "global_step": 302799, "epoch": 3648} {"train_loss": -25.020034790039062, "global_step": 302800, "epoch": 3648} {"train_loss": -25.217754364013672, "global_step": 302801, "epoch": 3648} {"train_loss": -24.850971221923828, "global_step": 302802, "epoch": 3648} {"train_loss": -25.143007278442383, "global_step": 302803, "epoch": 3648} {"train_loss": -24.815731048583984, "global_step": 302804, "epoch": 3648} {"train_loss": -25.39609718322754, "global_step": 302805, "epoch": 3648} {"train_loss": -24.88679313659668, "global_step": 302806, "epoch": 3648} {"train_loss": -25.10466766357422, "global_step": 302807, "epoch": 3648} {"train_loss": -25.44593620300293, "global_step": 302808, "epoch": 3648} {"train_loss": -25.7471923828125, "global_step": 302809, "epoch": 3648} {"train_loss": -25.26531982421875, "global_step": 302810, "epoch": 3648} {"train_loss": -25.423906326293945, "global_step": 302811, "epoch": 3648} {"train_loss": -25.188444137573242, "global_step": 302812, "epoch": 3648} {"train_loss": -25.11884307861328, "global_step": 302813, "epoch": 3648} {"train_loss": -25.4249324798584, "global_step": 302814, "epoch": 3648} {"train_loss": -25.001022338867188, "global_step": 302815, "epoch": 3648} {"train_loss": -26.007984161376953, "global_step": 302816, "epoch": 3648} {"train_loss": -25.524036407470703, "global_step": 302817, "epoch": 3648} {"train_loss": -25.314435958862305, "global_step": 302818, "epoch": 3648} {"train_loss": -25.69268226623535, "global_step": 302819, "epoch": 3648} {"train_loss": -25.530414581298828, "global_step": 302820, "epoch": 3648} {"train_loss": -25.330490112304688, "global_step": 302821, "epoch": 3648} {"train_loss": -25.5079345703125, "global_step": 302822, "epoch": 3648} {"train_loss": -25.683364868164062, "global_step": 302823, "epoch": 3648} {"train_loss": -25.830896377563477, "global_step": 302824, "epoch": 3648} {"train_loss": -25.382295608520508, "global_step": 302825, "epoch": 3648} {"train_loss": -25.521894454956055, "global_step": 302826, "epoch": 3648} {"train_loss": -25.85357666015625, "global_step": 302827, "epoch": 3648} {"train_loss": -25.754697799682617, "global_step": 302828, "epoch": 3648} {"train_loss": -25.197696685791016, "global_step": 302829, "epoch": 3648} {"train_loss": -25.83832359313965, "global_step": 302830, "epoch": 3648} {"train_loss": -25.45255470275879, "global_step": 302831, "epoch": 3648} {"train_loss": -25.559171676635742, "global_step": 302832, "epoch": 3648} {"train_loss": -25.352378845214844, "global_step": 302833, "epoch": 3648} {"train_loss": -25.7661075592041, "global_step": 302834, "epoch": 3648} {"train_loss": -25.53226661682129, "global_step": 302835, "epoch": 3648} {"train_loss": -25.724233627319336, "global_step": 302836, "epoch": 3648} {"train_loss": -25.20481300354004, "global_step": 302837, "epoch": 3648} {"train_loss": -25.65939712524414, "global_step": 302838, "epoch": 3648} {"train_loss": -25.288389205932617, "global_step": 302839, "epoch": 3648} {"train_loss": -25.883039474487305, "global_step": 302840, "epoch": 3648} {"train_loss": -25.223379135131836, "global_step": 302841, "epoch": 3648} {"train_loss": -25.709003448486328, "global_step": 302842, "epoch": 3648} {"train_loss": -25.5069580078125, "global_step": 302843, "epoch": 3648} {"train_loss": -25.70273780822754, "global_step": 302844, "epoch": 3648} {"train_loss": -25.755451202392578, "global_step": 302845, "epoch": 3648} {"train_loss": -25.645727157592773, "global_step": 302846, "epoch": 3648} {"train_loss": -25.754535675048828, "global_step": 302847, "epoch": 3648} {"train_loss": -25.946935653686523, "global_step": 302848, "epoch": 3648} {"train_loss": -25.598356246948242, "global_step": 302849, "epoch": 3648} {"train_loss": -26.00113296508789, "global_step": 302850, "epoch": 3648} {"train_loss": -25.7165470123291, "global_step": 302851, "epoch": 3648} {"train_loss": -25.58316993713379, "global_step": 302852, "epoch": 3648} {"train_loss": -25.718713760375977, "global_step": 302853, "epoch": 3648} {"train_loss": -25.502304077148438, "global_step": 302854, "epoch": 3648} {"train_loss": -25.53380584716797, "global_step": 302855, "epoch": 3648} {"train_loss": -25.981958389282227, "global_step": 302856, "epoch": 3648} {"train_loss": -25.292699813842773, "global_step": 302857, "epoch": 3648} {"train_loss": -25.812803268432617, "global_step": 302858, "epoch": 3648} {"train_loss": -25.664051055908203, "global_step": 302859, "epoch": 3648} {"train_loss": -25.8942813873291, "global_step": 302860, "epoch": 3648} {"train_loss": -25.901477813720703, "global_step": 302861, "epoch": 3648} {"train_loss": -25.650375366210938, "global_step": 302862, "epoch": 3648} {"train_loss": -26.20868492126465, "global_step": 302863, "epoch": 3648} {"train_loss": -25.68839454650879, "global_step": 302864, "epoch": 3648} {"train_loss": -25.750463485717773, "global_step": 302865, "epoch": 3648} {"train_loss": -25.314237318843244, "global_step": 302866, "epoch": 3648, "val_loss": 7255312.0} {"train_loss": -24.31572914123535, "global_step": 302867, "epoch": 3649} {"train_loss": -24.914535522460938, "global_step": 302868, "epoch": 3649} {"train_loss": -23.338590621948242, "global_step": 302869, "epoch": 3649} {"train_loss": -24.79073143005371, "global_step": 302870, "epoch": 3649} {"train_loss": -24.87067985534668, "global_step": 302871, "epoch": 3649} {"train_loss": -25.483169555664062, "global_step": 302872, "epoch": 3649} {"train_loss": -24.544076919555664, "global_step": 302873, "epoch": 3649} {"train_loss": -24.801071166992188, "global_step": 302874, "epoch": 3649} {"train_loss": -24.88468360900879, "global_step": 302875, "epoch": 3649} {"train_loss": -25.290332794189453, "global_step": 302876, "epoch": 3649} {"train_loss": -24.781408309936523, "global_step": 302877, "epoch": 3649} {"train_loss": -24.96607780456543, "global_step": 302878, "epoch": 3649} {"train_loss": -24.986865997314453, "global_step": 302879, "epoch": 3649} {"train_loss": -25.634729385375977, "global_step": 302880, "epoch": 3649} {"train_loss": -24.837034225463867, "global_step": 302881, "epoch": 3649} {"train_loss": -25.00982666015625, "global_step": 302882, "epoch": 3649} {"train_loss": -25.4599552154541, "global_step": 302883, "epoch": 3649} {"train_loss": -24.899641036987305, "global_step": 302884, "epoch": 3649} {"train_loss": -25.03228187561035, "global_step": 302885, "epoch": 3649} {"train_loss": -25.24652099609375, "global_step": 302886, "epoch": 3649} {"train_loss": -25.116857528686523, "global_step": 302887, "epoch": 3649} {"train_loss": -25.274641036987305, "global_step": 302888, "epoch": 3649} {"train_loss": -25.338281631469727, "global_step": 302889, "epoch": 3649} {"train_loss": -25.46246910095215, "global_step": 302890, "epoch": 3649} {"train_loss": -25.45639991760254, "global_step": 302891, "epoch": 3649} {"train_loss": -25.6838436126709, "global_step": 302892, "epoch": 3649} {"train_loss": -25.60377311706543, "global_step": 302893, "epoch": 3649} {"train_loss": -25.70832633972168, "global_step": 302894, "epoch": 3649} {"train_loss": -25.208515167236328, "global_step": 302895, "epoch": 3649} {"train_loss": -25.477813720703125, "global_step": 302896, "epoch": 3649} {"train_loss": -25.630207061767578, "global_step": 302897, "epoch": 3649} {"train_loss": -25.31001853942871, "global_step": 302898, "epoch": 3649} {"train_loss": -25.191665649414062, "global_step": 302899, "epoch": 3649} {"train_loss": -25.372854232788086, "global_step": 302900, "epoch": 3649} {"train_loss": -25.63028907775879, "global_step": 302901, "epoch": 3649} {"train_loss": -25.760894775390625, "global_step": 302902, "epoch": 3649} {"train_loss": -25.7547664642334, "global_step": 302903, "epoch": 3649} {"train_loss": -25.580333709716797, "global_step": 302904, "epoch": 3649} {"train_loss": -25.518123626708984, "global_step": 302905, "epoch": 3649} {"train_loss": -25.82598304748535, "global_step": 302906, "epoch": 3649} {"train_loss": -25.6053466796875, "global_step": 302907, "epoch": 3649} {"train_loss": -26.02534294128418, "global_step": 302908, "epoch": 3649} {"train_loss": -25.579044342041016, "global_step": 302909, "epoch": 3649} {"train_loss": -25.76444435119629, "global_step": 302910, "epoch": 3649} {"train_loss": -25.646686553955078, "global_step": 302911, "epoch": 3649} {"train_loss": -25.358612060546875, "global_step": 302912, "epoch": 3649} {"train_loss": -25.42696189880371, "global_step": 302913, "epoch": 3649} {"train_loss": -25.703083038330078, "global_step": 302914, "epoch": 3649} {"train_loss": -25.810138702392578, "global_step": 302915, "epoch": 3649} {"train_loss": -25.731733322143555, "global_step": 302916, "epoch": 3649} {"train_loss": -25.785388946533203, "global_step": 302917, "epoch": 3649} {"train_loss": -25.74006462097168, "global_step": 302918, "epoch": 3649} {"train_loss": -25.746923446655273, "global_step": 302919, "epoch": 3649} {"train_loss": -25.799118041992188, "global_step": 302920, "epoch": 3649} {"train_loss": -25.685712814331055, "global_step": 302921, "epoch": 3649} {"train_loss": -25.72954750061035, "global_step": 302922, "epoch": 3649} {"train_loss": -25.83976173400879, "global_step": 302923, "epoch": 3649} {"train_loss": -25.708486557006836, "global_step": 302924, "epoch": 3649} {"train_loss": -25.676761627197266, "global_step": 302925, "epoch": 3649} {"train_loss": -25.772077560424805, "global_step": 302926, "epoch": 3649} {"train_loss": -25.646127700805664, "global_step": 302927, "epoch": 3649} {"train_loss": -25.933380126953125, "global_step": 302928, "epoch": 3649} {"train_loss": -25.898351669311523, "global_step": 302929, "epoch": 3649} {"train_loss": -25.474950790405273, "global_step": 302930, "epoch": 3649} {"train_loss": -25.518381118774414, "global_step": 302931, "epoch": 3649} {"train_loss": -25.222869873046875, "global_step": 302932, "epoch": 3649} {"train_loss": -25.71435546875, "global_step": 302933, "epoch": 3649} {"train_loss": -25.70734977722168, "global_step": 302934, "epoch": 3649} {"train_loss": -25.178680419921875, "global_step": 302935, "epoch": 3649} {"train_loss": -25.131452560424805, "global_step": 302936, "epoch": 3649} {"train_loss": -25.595273971557617, "global_step": 302937, "epoch": 3649} {"train_loss": -25.142066955566406, "global_step": 302938, "epoch": 3649} {"train_loss": -25.447036743164062, "global_step": 302939, "epoch": 3649} {"train_loss": -25.016454696655273, "global_step": 302940, "epoch": 3649} {"train_loss": -25.74959373474121, "global_step": 302941, "epoch": 3649} {"train_loss": -25.28833770751953, "global_step": 302942, "epoch": 3649} {"train_loss": -25.029626846313477, "global_step": 302943, "epoch": 3649} {"train_loss": -25.01772117614746, "global_step": 302944, "epoch": 3649} {"train_loss": -25.572805404663086, "global_step": 302945, "epoch": 3649} {"train_loss": -24.988224029541016, "global_step": 302946, "epoch": 3649} {"train_loss": -25.059066772460938, "global_step": 302947, "epoch": 3649} {"train_loss": -25.673725128173828, "global_step": 302948, "epoch": 3649} {"train_loss": -25.371099288205066, "global_step": 302949, "epoch": 3649, "val_loss": 7187938.5} {"train_loss": -24.5465145111084, "global_step": 302950, "epoch": 3650} {"train_loss": -25.38026237487793, "global_step": 302951, "epoch": 3650} {"train_loss": -24.617990493774414, "global_step": 302952, "epoch": 3650} {"train_loss": -25.03882598876953, "global_step": 302953, "epoch": 3650} {"train_loss": -25.10194969177246, "global_step": 302954, "epoch": 3650} {"train_loss": -24.616140365600586, "global_step": 302955, "epoch": 3650} {"train_loss": -25.510713577270508, "global_step": 302956, "epoch": 3650} {"train_loss": -24.98468017578125, "global_step": 302957, "epoch": 3650} {"train_loss": -25.3524227142334, "global_step": 302958, "epoch": 3650} {"train_loss": -25.19209098815918, "global_step": 302959, "epoch": 3650} {"train_loss": -25.36185073852539, "global_step": 302960, "epoch": 3650} {"train_loss": -25.21651268005371, "global_step": 302961, "epoch": 3650} {"train_loss": -25.2961483001709, "global_step": 302962, "epoch": 3650} {"train_loss": -25.380674362182617, "global_step": 302963, "epoch": 3650} {"train_loss": -25.248685836791992, "global_step": 302964, "epoch": 3650} {"train_loss": -25.823963165283203, "global_step": 302965, "epoch": 3650} {"train_loss": -25.383625030517578, "global_step": 302966, "epoch": 3650} {"train_loss": -25.269010543823242, "global_step": 302967, "epoch": 3650} {"train_loss": -25.447675704956055, "global_step": 302968, "epoch": 3650} {"train_loss": -25.688888549804688, "global_step": 302969, "epoch": 3650} {"train_loss": -25.749670028686523, "global_step": 302970, "epoch": 3650} {"train_loss": -25.288192749023438, "global_step": 302971, "epoch": 3650} {"train_loss": -25.55921745300293, "global_step": 302972, "epoch": 3650} {"train_loss": -25.188060760498047, "global_step": 302973, "epoch": 3650} {"train_loss": -25.39244842529297, "global_step": 302974, "epoch": 3650} {"train_loss": -25.485517501831055, "global_step": 302975, "epoch": 3650} {"train_loss": -25.894567489624023, "global_step": 302976, "epoch": 3650} {"train_loss": -25.754125595092773, "global_step": 302977, "epoch": 3650} {"train_loss": -25.802404403686523, "global_step": 302978, "epoch": 3650} {"train_loss": -25.497299194335938, "global_step": 302979, "epoch": 3650} {"train_loss": -25.472148895263672, "global_step": 302980, "epoch": 3650} {"train_loss": -25.61297035217285, "global_step": 302981, "epoch": 3650} {"train_loss": -25.310083389282227, "global_step": 302982, "epoch": 3650} {"train_loss": -25.372251510620117, "global_step": 302983, "epoch": 3650} {"train_loss": -25.47093391418457, "global_step": 302984, "epoch": 3650} {"train_loss": -26.1234073638916, "global_step": 302985, "epoch": 3650} {"train_loss": -25.795236587524414, "global_step": 302986, "epoch": 3650} {"train_loss": -25.89287757873535, "global_step": 302987, "epoch": 3650} {"train_loss": -25.949203491210938, "global_step": 302988, "epoch": 3650} {"train_loss": -25.689451217651367, "global_step": 302989, "epoch": 3650} {"train_loss": -25.66033363342285, "global_step": 302990, "epoch": 3650} {"train_loss": -25.583450317382812, "global_step": 302991, "epoch": 3650} {"train_loss": -25.523134231567383, "global_step": 302992, "epoch": 3650} {"train_loss": -25.85027503967285, "global_step": 302993, "epoch": 3650} {"train_loss": -25.78775405883789, "global_step": 302994, "epoch": 3650} {"train_loss": -26.09748649597168, "global_step": 302995, "epoch": 3650} {"train_loss": -25.739973068237305, "global_step": 302996, "epoch": 3650} {"train_loss": -25.704187393188477, "global_step": 302997, "epoch": 3650} {"train_loss": -25.761859893798828, "global_step": 302998, "epoch": 3650} {"train_loss": -25.89216423034668, "global_step": 302999, "epoch": 3650} {"train_loss": -25.770246505737305, "global_step": 303000, "epoch": 3650} {"train_loss": -25.45949363708496, "global_step": 303001, "epoch": 3650} {"train_loss": -26.158496856689453, "global_step": 303002, "epoch": 3650} {"train_loss": -25.761474609375, "global_step": 303003, "epoch": 3650} {"train_loss": -25.73042869567871, "global_step": 303004, "epoch": 3650} {"train_loss": -26.007944107055664, "global_step": 303005, "epoch": 3650} {"train_loss": -25.62375259399414, "global_step": 303006, "epoch": 3650} {"train_loss": -25.538497924804688, "global_step": 303007, "epoch": 3650} {"train_loss": -25.760395050048828, "global_step": 303008, "epoch": 3650} {"train_loss": -26.10409927368164, "global_step": 303009, "epoch": 3650} {"train_loss": -25.999542236328125, "global_step": 303010, "epoch": 3650} {"train_loss": -25.936017990112305, "global_step": 303011, "epoch": 3650} {"train_loss": -25.92420768737793, "global_step": 303012, "epoch": 3650} {"train_loss": -26.162626266479492, "global_step": 303013, "epoch": 3650} {"train_loss": -25.764135360717773, "global_step": 303014, "epoch": 3650} {"train_loss": -25.788379669189453, "global_step": 303015, "epoch": 3650} {"train_loss": -25.60951042175293, "global_step": 303016, "epoch": 3650} {"train_loss": -25.674072265625, "global_step": 303017, "epoch": 3650} {"train_loss": -25.59427833557129, "global_step": 303018, "epoch": 3650} {"train_loss": -25.67001724243164, "global_step": 303019, "epoch": 3650} {"train_loss": -25.838987350463867, "global_step": 303020, "epoch": 3650} {"train_loss": -25.611112594604492, "global_step": 303021, "epoch": 3650} {"train_loss": -25.802433013916016, "global_step": 303022, "epoch": 3650} {"train_loss": -25.721906661987305, "global_step": 303023, "epoch": 3650} {"train_loss": -26.171598434448242, "global_step": 303024, "epoch": 3650} {"train_loss": -25.55811882019043, "global_step": 303025, "epoch": 3650} {"train_loss": -25.817960739135742, "global_step": 303026, "epoch": 3650} {"train_loss": -25.71291160583496, "global_step": 303027, "epoch": 3650} {"train_loss": -25.57840919494629, "global_step": 303028, "epoch": 3650} {"train_loss": -25.651126861572266, "global_step": 303029, "epoch": 3650} {"train_loss": -25.988311767578125, "global_step": 303030, "epoch": 3650} {"train_loss": -25.784687042236328, "global_step": 303031, "epoch": 3650} {"train_loss": -25.6033551549337, "global_step": 303032, "epoch": 3650, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 7279795.0} {"train_loss": -24.887685775756836, "global_step": 303033, "epoch": 3651} {"train_loss": -24.75965690612793, "global_step": 303034, "epoch": 3651} {"train_loss": -24.2664852142334, "global_step": 303035, "epoch": 3651} {"train_loss": -24.832786560058594, "global_step": 303036, "epoch": 3651} {"train_loss": -25.416074752807617, "global_step": 303037, "epoch": 3651} {"train_loss": -25.42165756225586, "global_step": 303038, "epoch": 3651} {"train_loss": -25.291561126708984, "global_step": 303039, "epoch": 3651} {"train_loss": -25.3617000579834, "global_step": 303040, "epoch": 3651} {"train_loss": -25.14165496826172, "global_step": 303041, "epoch": 3651} {"train_loss": -25.6460018157959, "global_step": 303042, "epoch": 3651} {"train_loss": -25.386661529541016, "global_step": 303043, "epoch": 3651} {"train_loss": -25.535934448242188, "global_step": 303044, "epoch": 3651} {"train_loss": -26.09438133239746, "global_step": 303045, "epoch": 3651} {"train_loss": -25.386096954345703, "global_step": 303046, "epoch": 3651} {"train_loss": -25.389890670776367, "global_step": 303047, "epoch": 3651} {"train_loss": -25.84470558166504, "global_step": 303048, "epoch": 3651} {"train_loss": -25.61530876159668, "global_step": 303049, "epoch": 3651} {"train_loss": -25.57712745666504, "global_step": 303050, "epoch": 3651} {"train_loss": -25.680526733398438, "global_step": 303051, "epoch": 3651} {"train_loss": -25.44283103942871, "global_step": 303052, "epoch": 3651} {"train_loss": -25.576404571533203, "global_step": 303053, "epoch": 3651} {"train_loss": -25.395816802978516, "global_step": 303054, "epoch": 3651} {"train_loss": -25.19004249572754, "global_step": 303055, "epoch": 3651} {"train_loss": -25.463727951049805, "global_step": 303056, "epoch": 3651} {"train_loss": -25.758365631103516, "global_step": 303057, "epoch": 3651} {"train_loss": -25.45260238647461, "global_step": 303058, "epoch": 3651} {"train_loss": -25.615583419799805, "global_step": 303059, "epoch": 3651} {"train_loss": -25.41499900817871, "global_step": 303060, "epoch": 3651} {"train_loss": -26.00588035583496, "global_step": 303061, "epoch": 3651} {"train_loss": -26.03788185119629, "global_step": 303062, "epoch": 3651} {"train_loss": -26.022546768188477, "global_step": 303063, "epoch": 3651} {"train_loss": -25.722309112548828, "global_step": 303064, "epoch": 3651} {"train_loss": -25.584394454956055, "global_step": 303065, "epoch": 3651} {"train_loss": -26.084142684936523, "global_step": 303066, "epoch": 3651} {"train_loss": -25.8266658782959, "global_step": 303067, "epoch": 3651} {"train_loss": -25.541141510009766, "global_step": 303068, "epoch": 3651} {"train_loss": -25.830291748046875, "global_step": 303069, "epoch": 3651} {"train_loss": -25.432621002197266, "global_step": 303070, "epoch": 3651} {"train_loss": -25.78460121154785, "global_step": 303071, "epoch": 3651} {"train_loss": -25.813812255859375, "global_step": 303072, "epoch": 3651} {"train_loss": -25.99001121520996, "global_step": 303073, "epoch": 3651} {"train_loss": -25.78058433532715, "global_step": 303074, "epoch": 3651} {"train_loss": -25.808700561523438, "global_step": 303075, "epoch": 3651} {"train_loss": -25.568708419799805, "global_step": 303076, "epoch": 3651} {"train_loss": -26.0775146484375, "global_step": 303077, "epoch": 3651} {"train_loss": -25.889759063720703, "global_step": 303078, "epoch": 3651} {"train_loss": -26.088897705078125, "global_step": 303079, "epoch": 3651} {"train_loss": -25.54457664489746, "global_step": 303080, "epoch": 3651} {"train_loss": -25.609668731689453, "global_step": 303081, "epoch": 3651} {"train_loss": -25.610681533813477, "global_step": 303082, "epoch": 3651} {"train_loss": -25.5346736907959, "global_step": 303083, "epoch": 3651} {"train_loss": -25.8521728515625, "global_step": 303084, "epoch": 3651} {"train_loss": -25.766332626342773, "global_step": 303085, "epoch": 3651} {"train_loss": -25.942975997924805, "global_step": 303086, "epoch": 3651} {"train_loss": -25.98956871032715, "global_step": 303087, "epoch": 3651} {"train_loss": -25.985034942626953, "global_step": 303088, "epoch": 3651} {"train_loss": -25.627527236938477, "global_step": 303089, "epoch": 3651} {"train_loss": -25.11225700378418, "global_step": 303090, "epoch": 3651} {"train_loss": -25.825122833251953, "global_step": 303091, "epoch": 3651} {"train_loss": -25.77248191833496, "global_step": 303092, "epoch": 3651} {"train_loss": -25.44463539123535, "global_step": 303093, "epoch": 3651} {"train_loss": -25.09422492980957, "global_step": 303094, "epoch": 3651} {"train_loss": -25.13252830505371, "global_step": 303095, "epoch": 3651} {"train_loss": -25.83740234375, "global_step": 303096, "epoch": 3651} {"train_loss": -25.52273941040039, "global_step": 303097, "epoch": 3651} {"train_loss": -25.537227630615234, "global_step": 303098, "epoch": 3651} {"train_loss": -25.634607315063477, "global_step": 303099, "epoch": 3651} {"train_loss": -25.560245513916016, "global_step": 303100, "epoch": 3651} {"train_loss": -25.776132583618164, "global_step": 303101, "epoch": 3651} {"train_loss": -25.138362884521484, "global_step": 303102, "epoch": 3651} {"train_loss": -25.716094970703125, "global_step": 303103, "epoch": 3651} {"train_loss": -26.171558380126953, "global_step": 303104, "epoch": 3651} {"train_loss": -25.430204391479492, "global_step": 303105, "epoch": 3651} {"train_loss": -25.82952308654785, "global_step": 303106, "epoch": 3651} {"train_loss": -25.77393913269043, "global_step": 303107, "epoch": 3651} {"train_loss": -25.3861083984375, "global_step": 303108, "epoch": 3651} {"train_loss": -25.387117385864258, "global_step": 303109, "epoch": 3651} {"train_loss": -25.347726821899414, "global_step": 303110, "epoch": 3651} {"train_loss": -25.92762565612793, "global_step": 303111, "epoch": 3651} {"train_loss": -25.712549209594727, "global_step": 303112, "epoch": 3651} {"train_loss": -25.6295166015625, "global_step": 303113, "epoch": 3651} {"train_loss": -25.568408966064453, "global_step": 303114, "epoch": 3651} {"train_loss": -25.587224891386835, "global_step": 303115, "epoch": 3651, "val_loss": 7222489.0} {"train_loss": -25.661712646484375, "global_step": 303116, "epoch": 3652} {"train_loss": -25.182981491088867, "global_step": 303117, "epoch": 3652} {"train_loss": -25.54218101501465, "global_step": 303118, "epoch": 3652} {"train_loss": -25.4449520111084, "global_step": 303119, "epoch": 3652} {"train_loss": -25.043161392211914, "global_step": 303120, "epoch": 3652} {"train_loss": -24.987878799438477, "global_step": 303121, "epoch": 3652} {"train_loss": -25.03310203552246, "global_step": 303122, "epoch": 3652} {"train_loss": -25.75510597229004, "global_step": 303123, "epoch": 3652} {"train_loss": -24.984375, "global_step": 303124, "epoch": 3652} {"train_loss": -25.266096115112305, "global_step": 303125, "epoch": 3652} {"train_loss": -25.241575241088867, "global_step": 303126, "epoch": 3652} {"train_loss": -25.219989776611328, "global_step": 303127, "epoch": 3652} {"train_loss": -25.09902000427246, "global_step": 303128, "epoch": 3652} {"train_loss": -25.58403968811035, "global_step": 303129, "epoch": 3652} {"train_loss": -25.24603843688965, "global_step": 303130, "epoch": 3652} {"train_loss": -25.403583526611328, "global_step": 303131, "epoch": 3652} {"train_loss": -25.42141342163086, "global_step": 303132, "epoch": 3652} {"train_loss": -25.512042999267578, "global_step": 303133, "epoch": 3652} {"train_loss": -25.972126007080078, "global_step": 303134, "epoch": 3652} {"train_loss": -25.420080184936523, "global_step": 303135, "epoch": 3652} {"train_loss": -25.924386978149414, "global_step": 303136, "epoch": 3652} {"train_loss": -25.840261459350586, "global_step": 303137, "epoch": 3652} {"train_loss": -25.548246383666992, "global_step": 303138, "epoch": 3652} {"train_loss": -25.747516632080078, "global_step": 303139, "epoch": 3652} {"train_loss": -25.50294303894043, "global_step": 303140, "epoch": 3652} {"train_loss": -25.594141006469727, "global_step": 303141, "epoch": 3652} {"train_loss": -25.44110679626465, "global_step": 303142, "epoch": 3652} {"train_loss": -25.78403663635254, "global_step": 303143, "epoch": 3652} {"train_loss": -25.893552780151367, "global_step": 303144, "epoch": 3652} {"train_loss": -25.651670455932617, "global_step": 303145, "epoch": 3652} {"train_loss": -25.429773330688477, "global_step": 303146, "epoch": 3652} {"train_loss": -25.83880615234375, "global_step": 303147, "epoch": 3652} {"train_loss": -25.592092514038086, "global_step": 303148, "epoch": 3652} {"train_loss": -25.785409927368164, "global_step": 303149, "epoch": 3652} {"train_loss": -25.829736709594727, "global_step": 303150, "epoch": 3652} {"train_loss": -26.052793502807617, "global_step": 303151, "epoch": 3652} {"train_loss": -25.58530044555664, "global_step": 303152, "epoch": 3652} {"train_loss": -25.656784057617188, "global_step": 303153, "epoch": 3652} {"train_loss": -25.971647262573242, "global_step": 303154, "epoch": 3652} {"train_loss": -26.040618896484375, "global_step": 303155, "epoch": 3652} {"train_loss": -25.748571395874023, "global_step": 303156, "epoch": 3652} {"train_loss": -25.90352439880371, "global_step": 303157, "epoch": 3652} {"train_loss": -26.020126342773438, "global_step": 303158, "epoch": 3652} {"train_loss": -25.78154945373535, "global_step": 303159, "epoch": 3652} {"train_loss": -25.877288818359375, "global_step": 303160, "epoch": 3652} {"train_loss": -25.785734176635742, "global_step": 303161, "epoch": 3652} {"train_loss": -25.717838287353516, "global_step": 303162, "epoch": 3652} {"train_loss": -25.59238624572754, "global_step": 303163, "epoch": 3652} {"train_loss": -25.793289184570312, "global_step": 303164, "epoch": 3652} {"train_loss": -25.83330726623535, "global_step": 303165, "epoch": 3652} {"train_loss": -25.756103515625, "global_step": 303166, "epoch": 3652} {"train_loss": -25.841928482055664, "global_step": 303167, "epoch": 3652} {"train_loss": -25.185733795166016, "global_step": 303168, "epoch": 3652} {"train_loss": -25.74964714050293, "global_step": 303169, "epoch": 3652} {"train_loss": -25.680912017822266, "global_step": 303170, "epoch": 3652} {"train_loss": -25.917728424072266, "global_step": 303171, "epoch": 3652} {"train_loss": -25.762664794921875, "global_step": 303172, "epoch": 3652} {"train_loss": -25.867563247680664, "global_step": 303173, "epoch": 3652} {"train_loss": -25.337574005126953, "global_step": 303174, "epoch": 3652} {"train_loss": -25.890562057495117, "global_step": 303175, "epoch": 3652} {"train_loss": -25.958349227905273, "global_step": 303176, "epoch": 3652} {"train_loss": -25.259424209594727, "global_step": 303177, "epoch": 3652} {"train_loss": -25.16096305847168, "global_step": 303178, "epoch": 3652} {"train_loss": -24.768447875976562, "global_step": 303179, "epoch": 3652} {"train_loss": -24.94209861755371, "global_step": 303180, "epoch": 3652} {"train_loss": -25.31171989440918, "global_step": 303181, "epoch": 3652} {"train_loss": -25.480016708374023, "global_step": 303182, "epoch": 3652} {"train_loss": -24.967493057250977, "global_step": 303183, "epoch": 3652} {"train_loss": -25.632761001586914, "global_step": 303184, "epoch": 3652} {"train_loss": -25.632368087768555, "global_step": 303185, "epoch": 3652} {"train_loss": -25.3284912109375, "global_step": 303186, "epoch": 3652} {"train_loss": -25.657651901245117, "global_step": 303187, "epoch": 3652} {"train_loss": -25.409854888916016, "global_step": 303188, "epoch": 3652} {"train_loss": -25.91988182067871, "global_step": 303189, "epoch": 3652} {"train_loss": -25.6389217376709, "global_step": 303190, "epoch": 3652} {"train_loss": -25.711557388305664, "global_step": 303191, "epoch": 3652} {"train_loss": -25.751861572265625, "global_step": 303192, "epoch": 3652} {"train_loss": -25.582914352416992, "global_step": 303193, "epoch": 3652} {"train_loss": -26.00641441345215, "global_step": 303194, "epoch": 3652} {"train_loss": -25.718481063842773, "global_step": 303195, "epoch": 3652} {"train_loss": -25.790746688842773, "global_step": 303196, "epoch": 3652} {"train_loss": -25.68216323852539, "global_step": 303197, "epoch": 3652} {"train_loss": -25.56462867001453, "global_step": 303198, "epoch": 3652, "val_loss": 7227156.0} {"train_loss": -25.37385368347168, "global_step": 303199, "epoch": 3653} {"train_loss": -24.957334518432617, "global_step": 303200, "epoch": 3653} {"train_loss": -25.36972427368164, "global_step": 303201, "epoch": 3653} {"train_loss": -25.45249366760254, "global_step": 303202, "epoch": 3653} {"train_loss": -24.92689323425293, "global_step": 303203, "epoch": 3653} {"train_loss": -24.976825714111328, "global_step": 303204, "epoch": 3653} {"train_loss": -25.291444778442383, "global_step": 303205, "epoch": 3653} {"train_loss": -25.31898307800293, "global_step": 303206, "epoch": 3653} {"train_loss": -25.092756271362305, "global_step": 303207, "epoch": 3653} {"train_loss": -25.51957130432129, "global_step": 303208, "epoch": 3653} {"train_loss": -25.656641006469727, "global_step": 303209, "epoch": 3653} {"train_loss": -24.858396530151367, "global_step": 303210, "epoch": 3653} {"train_loss": -25.546279907226562, "global_step": 303211, "epoch": 3653} {"train_loss": -25.432931900024414, "global_step": 303212, "epoch": 3653} {"train_loss": -25.829477310180664, "global_step": 303213, "epoch": 3653} {"train_loss": -25.169010162353516, "global_step": 303214, "epoch": 3653} {"train_loss": -25.675857543945312, "global_step": 303215, "epoch": 3653} {"train_loss": -25.5869083404541, "global_step": 303216, "epoch": 3653} {"train_loss": -25.552719116210938, "global_step": 303217, "epoch": 3653} {"train_loss": -25.4310359954834, "global_step": 303218, "epoch": 3653} {"train_loss": -25.37617301940918, "global_step": 303219, "epoch": 3653} {"train_loss": -25.547359466552734, "global_step": 303220, "epoch": 3653} {"train_loss": -25.402360916137695, "global_step": 303221, "epoch": 3653} {"train_loss": -25.66459083557129, "global_step": 303222, "epoch": 3653} {"train_loss": -25.7402400970459, "global_step": 303223, "epoch": 3653} {"train_loss": -25.84476661682129, "global_step": 303224, "epoch": 3653} {"train_loss": -25.41059112548828, "global_step": 303225, "epoch": 3653} {"train_loss": -25.616910934448242, "global_step": 303226, "epoch": 3653} {"train_loss": -25.568592071533203, "global_step": 303227, "epoch": 3653} {"train_loss": -25.842178344726562, "global_step": 303228, "epoch": 3653} {"train_loss": -25.621129989624023, "global_step": 303229, "epoch": 3653} {"train_loss": -25.729999542236328, "global_step": 303230, "epoch": 3653} {"train_loss": -25.270389556884766, "global_step": 303231, "epoch": 3653} {"train_loss": -25.735885620117188, "global_step": 303232, "epoch": 3653} {"train_loss": -25.48692512512207, "global_step": 303233, "epoch": 3653} {"train_loss": -26.031463623046875, "global_step": 303234, "epoch": 3653} {"train_loss": -25.474262237548828, "global_step": 303235, "epoch": 3653} {"train_loss": -25.861520767211914, "global_step": 303236, "epoch": 3653} {"train_loss": -25.69709587097168, "global_step": 303237, "epoch": 3653} {"train_loss": -25.670129776000977, "global_step": 303238, "epoch": 3653} {"train_loss": -25.759613037109375, "global_step": 303239, "epoch": 3653} {"train_loss": -25.52497673034668, "global_step": 303240, "epoch": 3653} {"train_loss": -25.906408309936523, "global_step": 303241, "epoch": 3653} {"train_loss": -25.639575958251953, "global_step": 303242, "epoch": 3653} {"train_loss": -25.361818313598633, "global_step": 303243, "epoch": 3653} {"train_loss": -25.789142608642578, "global_step": 303244, "epoch": 3653} {"train_loss": -25.71473503112793, "global_step": 303245, "epoch": 3653} {"train_loss": -25.80364990234375, "global_step": 303246, "epoch": 3653} {"train_loss": -25.680225372314453, "global_step": 303247, "epoch": 3653} {"train_loss": -25.86176109313965, "global_step": 303248, "epoch": 3653} {"train_loss": -25.511072158813477, "global_step": 303249, "epoch": 3653} {"train_loss": -25.944421768188477, "global_step": 303250, "epoch": 3653} {"train_loss": -25.713459014892578, "global_step": 303251, "epoch": 3653} {"train_loss": -25.836856842041016, "global_step": 303252, "epoch": 3653} {"train_loss": -25.772205352783203, "global_step": 303253, "epoch": 3653} {"train_loss": -25.831974029541016, "global_step": 303254, "epoch": 3653} {"train_loss": -25.29792022705078, "global_step": 303255, "epoch": 3653} {"train_loss": -25.933563232421875, "global_step": 303256, "epoch": 3653} {"train_loss": -25.430524826049805, "global_step": 303257, "epoch": 3653} {"train_loss": -25.738208770751953, "global_step": 303258, "epoch": 3653} {"train_loss": -25.53826904296875, "global_step": 303259, "epoch": 3653} {"train_loss": -25.328140258789062, "global_step": 303260, "epoch": 3653} {"train_loss": -25.54873275756836, "global_step": 303261, "epoch": 3653} {"train_loss": -25.58405303955078, "global_step": 303262, "epoch": 3653} {"train_loss": -25.50783348083496, "global_step": 303263, "epoch": 3653} {"train_loss": -25.1298770904541, "global_step": 303264, "epoch": 3653} {"train_loss": -25.509183883666992, "global_step": 303265, "epoch": 3653} {"train_loss": -25.76600456237793, "global_step": 303266, "epoch": 3653} {"train_loss": -25.691986083984375, "global_step": 303267, "epoch": 3653} {"train_loss": -25.498065948486328, "global_step": 303268, "epoch": 3653} {"train_loss": -25.607465744018555, "global_step": 303269, "epoch": 3653} {"train_loss": -25.71014976501465, "global_step": 303270, "epoch": 3653} {"train_loss": -25.414243698120117, "global_step": 303271, "epoch": 3653} {"train_loss": -25.599559783935547, "global_step": 303272, "epoch": 3653} {"train_loss": -25.544811248779297, "global_step": 303273, "epoch": 3653} {"train_loss": -25.89996337890625, "global_step": 303274, "epoch": 3653} {"train_loss": -25.775598526000977, "global_step": 303275, "epoch": 3653} {"train_loss": -25.35220718383789, "global_step": 303276, "epoch": 3653} {"train_loss": -25.918659210205078, "global_step": 303277, "epoch": 3653} {"train_loss": -25.7662410736084, "global_step": 303278, "epoch": 3653} {"train_loss": -25.588790893554688, "global_step": 303279, "epoch": 3653} {"train_loss": -25.888427734375, "global_step": 303280, "epoch": 3653} {"train_loss": -25.579806752951747, "global_step": 303281, "epoch": 3653, "val_loss": 7189191.5} {"train_loss": -24.933069229125977, "global_step": 303282, "epoch": 3654} {"train_loss": -24.080440521240234, "global_step": 303283, "epoch": 3654} {"train_loss": -24.727415084838867, "global_step": 303284, "epoch": 3654} {"train_loss": -25.262380599975586, "global_step": 303285, "epoch": 3654} {"train_loss": -24.81439208984375, "global_step": 303286, "epoch": 3654} {"train_loss": -25.67695426940918, "global_step": 303287, "epoch": 3654} {"train_loss": -24.94965171813965, "global_step": 303288, "epoch": 3654} {"train_loss": -24.785934448242188, "global_step": 303289, "epoch": 3654} {"train_loss": -25.33526039123535, "global_step": 303290, "epoch": 3654} {"train_loss": -25.3573055267334, "global_step": 303291, "epoch": 3654} {"train_loss": -25.286746978759766, "global_step": 303292, "epoch": 3654} {"train_loss": -25.36885643005371, "global_step": 303293, "epoch": 3654} {"train_loss": -25.397979736328125, "global_step": 303294, "epoch": 3654} {"train_loss": -25.85938835144043, "global_step": 303295, "epoch": 3654} {"train_loss": -25.267332077026367, "global_step": 303296, "epoch": 3654} {"train_loss": -25.75687026977539, "global_step": 303297, "epoch": 3654} {"train_loss": -25.793664932250977, "global_step": 303298, "epoch": 3654} {"train_loss": -25.45592498779297, "global_step": 303299, "epoch": 3654} {"train_loss": -25.783767700195312, "global_step": 303300, "epoch": 3654} {"train_loss": -25.645465850830078, "global_step": 303301, "epoch": 3654} {"train_loss": -25.520639419555664, "global_step": 303302, "epoch": 3654} {"train_loss": -25.36020278930664, "global_step": 303303, "epoch": 3654} {"train_loss": -25.192371368408203, "global_step": 303304, "epoch": 3654} {"train_loss": -25.345882415771484, "global_step": 303305, "epoch": 3654} {"train_loss": -25.8381404876709, "global_step": 303306, "epoch": 3654} {"train_loss": -25.70416831970215, "global_step": 303307, "epoch": 3654} {"train_loss": -25.647130966186523, "global_step": 303308, "epoch": 3654} {"train_loss": -25.4611873626709, "global_step": 303309, "epoch": 3654} {"train_loss": -25.582616806030273, "global_step": 303310, "epoch": 3654} {"train_loss": -25.696807861328125, "global_step": 303311, "epoch": 3654} {"train_loss": -25.526042938232422, "global_step": 303312, "epoch": 3654} {"train_loss": -25.620548248291016, "global_step": 303313, "epoch": 3654} {"train_loss": -25.634124755859375, "global_step": 303314, "epoch": 3654} {"train_loss": -25.842924118041992, "global_step": 303315, "epoch": 3654} {"train_loss": -25.7766170501709, "global_step": 303316, "epoch": 3654} {"train_loss": -25.279338836669922, "global_step": 303317, "epoch": 3654} {"train_loss": -25.457128524780273, "global_step": 303318, "epoch": 3654} {"train_loss": -25.74587059020996, "global_step": 303319, "epoch": 3654} {"train_loss": -25.793537139892578, "global_step": 303320, "epoch": 3654} {"train_loss": -25.48491668701172, "global_step": 303321, "epoch": 3654} {"train_loss": -25.306272506713867, "global_step": 303322, "epoch": 3654} {"train_loss": -25.86799430847168, "global_step": 303323, "epoch": 3654} {"train_loss": -25.765531539916992, "global_step": 303324, "epoch": 3654} {"train_loss": -25.31829261779785, "global_step": 303325, "epoch": 3654} {"train_loss": -25.721216201782227, "global_step": 303326, "epoch": 3654} {"train_loss": -25.448835372924805, "global_step": 303327, "epoch": 3654} {"train_loss": -25.717350006103516, "global_step": 303328, "epoch": 3654} {"train_loss": -25.389402389526367, "global_step": 303329, "epoch": 3654} {"train_loss": -25.506567001342773, "global_step": 303330, "epoch": 3654} {"train_loss": -25.7053165435791, "global_step": 303331, "epoch": 3654} {"train_loss": -25.242294311523438, "global_step": 303332, "epoch": 3654} {"train_loss": -25.70210838317871, "global_step": 303333, "epoch": 3654} {"train_loss": -25.781494140625, "global_step": 303334, "epoch": 3654} {"train_loss": -25.190799713134766, "global_step": 303335, "epoch": 3654} {"train_loss": -25.549501419067383, "global_step": 303336, "epoch": 3654} {"train_loss": -25.7581787109375, "global_step": 303337, "epoch": 3654} {"train_loss": -25.48337745666504, "global_step": 303338, "epoch": 3654} {"train_loss": -25.75, "global_step": 303339, "epoch": 3654} {"train_loss": -25.726903915405273, "global_step": 303340, "epoch": 3654} {"train_loss": -25.67919921875, "global_step": 303341, "epoch": 3654} {"train_loss": -25.62993812561035, "global_step": 303342, "epoch": 3654} {"train_loss": -25.350141525268555, "global_step": 303343, "epoch": 3654} {"train_loss": -25.820356369018555, "global_step": 303344, "epoch": 3654} {"train_loss": -25.7501277923584, "global_step": 303345, "epoch": 3654} {"train_loss": -25.959213256835938, "global_step": 303346, "epoch": 3654} {"train_loss": -25.41977310180664, "global_step": 303347, "epoch": 3654} {"train_loss": -25.80689811706543, "global_step": 303348, "epoch": 3654} {"train_loss": -25.80890464782715, "global_step": 303349, "epoch": 3654} {"train_loss": -25.32035255432129, "global_step": 303350, "epoch": 3654} {"train_loss": -25.515289306640625, "global_step": 303351, "epoch": 3654} {"train_loss": -25.7596378326416, "global_step": 303352, "epoch": 3654} {"train_loss": -25.87697410583496, "global_step": 303353, "epoch": 3654} {"train_loss": -25.80122184753418, "global_step": 303354, "epoch": 3654} {"train_loss": -25.760129928588867, "global_step": 303355, "epoch": 3654} {"train_loss": -25.280080795288086, "global_step": 303356, "epoch": 3654} {"train_loss": -25.5084285736084, "global_step": 303357, "epoch": 3654} {"train_loss": -25.751447677612305, "global_step": 303358, "epoch": 3654} {"train_loss": -25.424562454223633, "global_step": 303359, "epoch": 3654} {"train_loss": -25.828332901000977, "global_step": 303360, "epoch": 3654} {"train_loss": -25.800668716430664, "global_step": 303361, "epoch": 3654} {"train_loss": -25.36582374572754, "global_step": 303362, "epoch": 3654} {"train_loss": -25.763364791870117, "global_step": 303363, "epoch": 3654} {"train_loss": -25.531785781124988, "global_step": 303364, "epoch": 3654, "val_loss": 7170901.5} {"train_loss": -25.519102096557617, "global_step": 303365, "epoch": 3655} {"train_loss": -24.451814651489258, "global_step": 303366, "epoch": 3655} {"train_loss": -24.69891929626465, "global_step": 303367, "epoch": 3655} {"train_loss": -25.657773971557617, "global_step": 303368, "epoch": 3655} {"train_loss": -25.556503295898438, "global_step": 303369, "epoch": 3655} {"train_loss": -25.27178192138672, "global_step": 303370, "epoch": 3655} {"train_loss": -25.462121963500977, "global_step": 303371, "epoch": 3655} {"train_loss": -25.059783935546875, "global_step": 303372, "epoch": 3655} {"train_loss": -25.683385848999023, "global_step": 303373, "epoch": 3655} {"train_loss": -25.521451950073242, "global_step": 303374, "epoch": 3655} {"train_loss": -25.423847198486328, "global_step": 303375, "epoch": 3655} {"train_loss": -25.455947875976562, "global_step": 303376, "epoch": 3655} {"train_loss": -25.691381454467773, "global_step": 303377, "epoch": 3655} {"train_loss": -25.73882484436035, "global_step": 303378, "epoch": 3655} {"train_loss": -25.142057418823242, "global_step": 303379, "epoch": 3655} {"train_loss": -25.528303146362305, "global_step": 303380, "epoch": 3655} {"train_loss": -25.42304801940918, "global_step": 303381, "epoch": 3655} {"train_loss": -26.04400062561035, "global_step": 303382, "epoch": 3655} {"train_loss": -25.554903030395508, "global_step": 303383, "epoch": 3655} {"train_loss": -25.680471420288086, "global_step": 303384, "epoch": 3655} {"train_loss": -25.373870849609375, "global_step": 303385, "epoch": 3655} {"train_loss": -25.578289031982422, "global_step": 303386, "epoch": 3655} {"train_loss": -25.832809448242188, "global_step": 303387, "epoch": 3655} {"train_loss": -25.96232032775879, "global_step": 303388, "epoch": 3655} {"train_loss": -25.871862411499023, "global_step": 303389, "epoch": 3655} {"train_loss": -25.86195182800293, "global_step": 303390, "epoch": 3655} {"train_loss": -25.794416427612305, "global_step": 303391, "epoch": 3655} {"train_loss": -25.75020408630371, "global_step": 303392, "epoch": 3655} {"train_loss": -25.918914794921875, "global_step": 303393, "epoch": 3655} {"train_loss": -25.892536163330078, "global_step": 303394, "epoch": 3655} {"train_loss": -25.835615158081055, "global_step": 303395, "epoch": 3655} {"train_loss": -25.69135093688965, "global_step": 303396, "epoch": 3655} {"train_loss": -25.767972946166992, "global_step": 303397, "epoch": 3655} {"train_loss": -25.537607192993164, "global_step": 303398, "epoch": 3655} {"train_loss": -25.19345474243164, "global_step": 303399, "epoch": 3655} {"train_loss": -25.68840980529785, "global_step": 303400, "epoch": 3655} {"train_loss": -25.507240295410156, "global_step": 303401, "epoch": 3655} {"train_loss": -25.571569442749023, "global_step": 303402, "epoch": 3655} {"train_loss": -25.455322265625, "global_step": 303403, "epoch": 3655} {"train_loss": -25.235097885131836, "global_step": 303404, "epoch": 3655} {"train_loss": -25.66096305847168, "global_step": 303405, "epoch": 3655} {"train_loss": -25.224287033081055, "global_step": 303406, "epoch": 3655} {"train_loss": -25.396814346313477, "global_step": 303407, "epoch": 3655} {"train_loss": -25.420503616333008, "global_step": 303408, "epoch": 3655} {"train_loss": -25.54566764831543, "global_step": 303409, "epoch": 3655} {"train_loss": -25.343494415283203, "global_step": 303410, "epoch": 3655} {"train_loss": -25.455764770507812, "global_step": 303411, "epoch": 3655} {"train_loss": -25.796545028686523, "global_step": 303412, "epoch": 3655} {"train_loss": -25.361541748046875, "global_step": 303413, "epoch": 3655} {"train_loss": -25.358083724975586, "global_step": 303414, "epoch": 3655} {"train_loss": -25.421836853027344, "global_step": 303415, "epoch": 3655} {"train_loss": -25.342639923095703, "global_step": 303416, "epoch": 3655} {"train_loss": -25.08856773376465, "global_step": 303417, "epoch": 3655} {"train_loss": -25.82697105407715, "global_step": 303418, "epoch": 3655} {"train_loss": -25.42267608642578, "global_step": 303419, "epoch": 3655} {"train_loss": -25.768054962158203, "global_step": 303420, "epoch": 3655} {"train_loss": -26.158971786499023, "global_step": 303421, "epoch": 3655} {"train_loss": -25.6015625, "global_step": 303422, "epoch": 3655} {"train_loss": -25.57159996032715, "global_step": 303423, "epoch": 3655} {"train_loss": -25.575889587402344, "global_step": 303424, "epoch": 3655} {"train_loss": -25.757678985595703, "global_step": 303425, "epoch": 3655} {"train_loss": -26.042280197143555, "global_step": 303426, "epoch": 3655} {"train_loss": -25.4818115234375, "global_step": 303427, "epoch": 3655} {"train_loss": -25.65583610534668, "global_step": 303428, "epoch": 3655} {"train_loss": -25.746280670166016, "global_step": 303429, "epoch": 3655} {"train_loss": -25.779409408569336, "global_step": 303430, "epoch": 3655} {"train_loss": -25.627668380737305, "global_step": 303431, "epoch": 3655} {"train_loss": -26.04090690612793, "global_step": 303432, "epoch": 3655} {"train_loss": -25.822189331054688, "global_step": 303433, "epoch": 3655} {"train_loss": -25.56025505065918, "global_step": 303434, "epoch": 3655} {"train_loss": -25.955657958984375, "global_step": 303435, "epoch": 3655} {"train_loss": -26.00118064880371, "global_step": 303436, "epoch": 3655} {"train_loss": -25.8889217376709, "global_step": 303437, "epoch": 3655} {"train_loss": -25.604583740234375, "global_step": 303438, "epoch": 3655} {"train_loss": -25.700361251831055, "global_step": 303439, "epoch": 3655} {"train_loss": -25.59998893737793, "global_step": 303440, "epoch": 3655} {"train_loss": -25.359140396118164, "global_step": 303441, "epoch": 3655} {"train_loss": -25.837743759155273, "global_step": 303442, "epoch": 3655} {"train_loss": -26.0606632232666, "global_step": 303443, "epoch": 3655} {"train_loss": -25.45819854736328, "global_step": 303444, "epoch": 3655} {"train_loss": -25.702096939086914, "global_step": 303445, "epoch": 3655} {"train_loss": -25.644428253173828, "global_step": 303446, "epoch": 3655} {"train_loss": -25.58605292906244, "global_step": 303447, "epoch": 3655, "val_loss": 7140909.0} {"train_loss": -25.556577682495117, "global_step": 303448, "epoch": 3656} {"train_loss": -25.57776641845703, "global_step": 303449, "epoch": 3656} {"train_loss": -25.30051612854004, "global_step": 303450, "epoch": 3656} {"train_loss": -25.129093170166016, "global_step": 303451, "epoch": 3656} {"train_loss": -24.93342399597168, "global_step": 303452, "epoch": 3656} {"train_loss": -25.34510612487793, "global_step": 303453, "epoch": 3656} {"train_loss": -25.62238121032715, "global_step": 303454, "epoch": 3656} {"train_loss": -25.359411239624023, "global_step": 303455, "epoch": 3656} {"train_loss": -25.580644607543945, "global_step": 303456, "epoch": 3656} {"train_loss": -25.337430953979492, "global_step": 303457, "epoch": 3656} {"train_loss": -25.544950485229492, "global_step": 303458, "epoch": 3656} {"train_loss": -25.416839599609375, "global_step": 303459, "epoch": 3656} {"train_loss": -25.16063690185547, "global_step": 303460, "epoch": 3656} {"train_loss": -25.533748626708984, "global_step": 303461, "epoch": 3656} {"train_loss": -25.35884666442871, "global_step": 303462, "epoch": 3656} {"train_loss": -25.492908477783203, "global_step": 303463, "epoch": 3656} {"train_loss": -25.78948402404785, "global_step": 303464, "epoch": 3656} {"train_loss": -25.366060256958008, "global_step": 303465, "epoch": 3656} {"train_loss": -25.110925674438477, "global_step": 303466, "epoch": 3656} {"train_loss": -25.685775756835938, "global_step": 303467, "epoch": 3656} {"train_loss": -25.545318603515625, "global_step": 303468, "epoch": 3656} {"train_loss": -25.70660400390625, "global_step": 303469, "epoch": 3656} {"train_loss": -25.563825607299805, "global_step": 303470, "epoch": 3656} {"train_loss": -25.815046310424805, "global_step": 303471, "epoch": 3656} {"train_loss": -25.641082763671875, "global_step": 303472, "epoch": 3656} {"train_loss": -25.661245346069336, "global_step": 303473, "epoch": 3656} {"train_loss": -25.698835372924805, "global_step": 303474, "epoch": 3656} {"train_loss": -25.55568504333496, "global_step": 303475, "epoch": 3656} {"train_loss": -25.983978271484375, "global_step": 303476, "epoch": 3656} {"train_loss": -25.4041690826416, "global_step": 303477, "epoch": 3656} {"train_loss": -25.966001510620117, "global_step": 303478, "epoch": 3656} {"train_loss": -25.658416748046875, "global_step": 303479, "epoch": 3656} {"train_loss": -25.6064395904541, "global_step": 303480, "epoch": 3656} {"train_loss": -25.504804611206055, "global_step": 303481, "epoch": 3656} {"train_loss": -25.776519775390625, "global_step": 303482, "epoch": 3656} {"train_loss": -25.999677658081055, "global_step": 303483, "epoch": 3656} {"train_loss": -25.37598991394043, "global_step": 303484, "epoch": 3656} {"train_loss": -25.563512802124023, "global_step": 303485, "epoch": 3656} {"train_loss": -25.76137351989746, "global_step": 303486, "epoch": 3656} {"train_loss": -25.76038932800293, "global_step": 303487, "epoch": 3656} {"train_loss": -25.281665802001953, "global_step": 303488, "epoch": 3656} {"train_loss": -25.443464279174805, "global_step": 303489, "epoch": 3656} {"train_loss": -25.62982749938965, "global_step": 303490, "epoch": 3656} {"train_loss": -25.400657653808594, "global_step": 303491, "epoch": 3656} {"train_loss": -25.60800552368164, "global_step": 303492, "epoch": 3656} {"train_loss": -25.9220027923584, "global_step": 303493, "epoch": 3656} {"train_loss": -25.91644287109375, "global_step": 303494, "epoch": 3656} {"train_loss": -25.96686363220215, "global_step": 303495, "epoch": 3656} {"train_loss": -25.7626895904541, "global_step": 303496, "epoch": 3656} {"train_loss": -25.631567001342773, "global_step": 303497, "epoch": 3656} {"train_loss": -26.0093936920166, "global_step": 303498, "epoch": 3656} {"train_loss": -25.715051651000977, "global_step": 303499, "epoch": 3656} {"train_loss": -25.358890533447266, "global_step": 303500, "epoch": 3656} {"train_loss": -25.69736099243164, "global_step": 303501, "epoch": 3656} {"train_loss": -25.70707130432129, "global_step": 303502, "epoch": 3656} {"train_loss": -25.897693634033203, "global_step": 303503, "epoch": 3656} {"train_loss": -25.581462860107422, "global_step": 303504, "epoch": 3656} {"train_loss": -25.943490982055664, "global_step": 303505, "epoch": 3656} {"train_loss": -25.650476455688477, "global_step": 303506, "epoch": 3656} {"train_loss": -26.083715438842773, "global_step": 303507, "epoch": 3656} {"train_loss": -25.679336547851562, "global_step": 303508, "epoch": 3656} {"train_loss": -25.8735294342041, "global_step": 303509, "epoch": 3656} {"train_loss": -25.631250381469727, "global_step": 303510, "epoch": 3656} {"train_loss": -25.70246696472168, "global_step": 303511, "epoch": 3656} {"train_loss": -25.844329833984375, "global_step": 303512, "epoch": 3656} {"train_loss": -25.71963882446289, "global_step": 303513, "epoch": 3656} {"train_loss": -25.946945190429688, "global_step": 303514, "epoch": 3656} {"train_loss": -25.984588623046875, "global_step": 303515, "epoch": 3656} {"train_loss": -25.982389450073242, "global_step": 303516, "epoch": 3656} {"train_loss": -25.6071720123291, "global_step": 303517, "epoch": 3656} {"train_loss": -26.13053321838379, "global_step": 303518, "epoch": 3656} {"train_loss": -25.674304962158203, "global_step": 303519, "epoch": 3656} {"train_loss": -25.66733741760254, "global_step": 303520, "epoch": 3656} {"train_loss": -25.51645851135254, "global_step": 303521, "epoch": 3656} {"train_loss": -25.093564987182617, "global_step": 303522, "epoch": 3656} {"train_loss": -25.445642471313477, "global_step": 303523, "epoch": 3656} {"train_loss": -25.058324813842773, "global_step": 303524, "epoch": 3656} {"train_loss": -24.984329223632812, "global_step": 303525, "epoch": 3656} {"train_loss": -25.138818740844727, "global_step": 303526, "epoch": 3656} {"train_loss": -25.72785758972168, "global_step": 303527, "epoch": 3656} {"train_loss": -25.42486000061035, "global_step": 303528, "epoch": 3656} {"train_loss": -25.543033599853516, "global_step": 303529, "epoch": 3656} {"train_loss": -25.603826430906732, "global_step": 303530, "epoch": 3656, "val_loss": 7232840.0} {"train_loss": -25.228717803955078, "global_step": 303531, "epoch": 3657} {"train_loss": -25.297285079956055, "global_step": 303532, "epoch": 3657} {"train_loss": -24.698835372924805, "global_step": 303533, "epoch": 3657} {"train_loss": -25.16364097595215, "global_step": 303534, "epoch": 3657} {"train_loss": -25.503957748413086, "global_step": 303535, "epoch": 3657} {"train_loss": -24.968839645385742, "global_step": 303536, "epoch": 3657} {"train_loss": -25.46327018737793, "global_step": 303537, "epoch": 3657} {"train_loss": -25.573026657104492, "global_step": 303538, "epoch": 3657} {"train_loss": -25.28277587890625, "global_step": 303539, "epoch": 3657} {"train_loss": -25.054296493530273, "global_step": 303540, "epoch": 3657} {"train_loss": -25.114805221557617, "global_step": 303541, "epoch": 3657} {"train_loss": -25.283828735351562, "global_step": 303542, "epoch": 3657} {"train_loss": -25.24245834350586, "global_step": 303543, "epoch": 3657} {"train_loss": -25.912322998046875, "global_step": 303544, "epoch": 3657} {"train_loss": -25.569501876831055, "global_step": 303545, "epoch": 3657} {"train_loss": -25.37798500061035, "global_step": 303546, "epoch": 3657} {"train_loss": -25.58614730834961, "global_step": 303547, "epoch": 3657} {"train_loss": -25.370960235595703, "global_step": 303548, "epoch": 3657} {"train_loss": -25.186695098876953, "global_step": 303549, "epoch": 3657} {"train_loss": -25.53718376159668, "global_step": 303550, "epoch": 3657} {"train_loss": -25.736194610595703, "global_step": 303551, "epoch": 3657} {"train_loss": -25.56792640686035, "global_step": 303552, "epoch": 3657} {"train_loss": -25.42055320739746, "global_step": 303553, "epoch": 3657} {"train_loss": -25.25946617126465, "global_step": 303554, "epoch": 3657} {"train_loss": -25.811796188354492, "global_step": 303555, "epoch": 3657} {"train_loss": -25.538410186767578, "global_step": 303556, "epoch": 3657} {"train_loss": -25.5300350189209, "global_step": 303557, "epoch": 3657} {"train_loss": -25.14601707458496, "global_step": 303558, "epoch": 3657} {"train_loss": -25.81612205505371, "global_step": 303559, "epoch": 3657} {"train_loss": -25.48898696899414, "global_step": 303560, "epoch": 3657} {"train_loss": -25.6077938079834, "global_step": 303561, "epoch": 3657} {"train_loss": -25.763214111328125, "global_step": 303562, "epoch": 3657} {"train_loss": -25.28200340270996, "global_step": 303563, "epoch": 3657} {"train_loss": -25.610197067260742, "global_step": 303564, "epoch": 3657} {"train_loss": -25.891681671142578, "global_step": 303565, "epoch": 3657} {"train_loss": -25.662036895751953, "global_step": 303566, "epoch": 3657} {"train_loss": -25.696456909179688, "global_step": 303567, "epoch": 3657} {"train_loss": -25.368711471557617, "global_step": 303568, "epoch": 3657} {"train_loss": -25.576309204101562, "global_step": 303569, "epoch": 3657} {"train_loss": -25.949493408203125, "global_step": 303570, "epoch": 3657} {"train_loss": -25.616195678710938, "global_step": 303571, "epoch": 3657} {"train_loss": -25.904966354370117, "global_step": 303572, "epoch": 3657} {"train_loss": -26.19172477722168, "global_step": 303573, "epoch": 3657} {"train_loss": -26.01361083984375, "global_step": 303574, "epoch": 3657} {"train_loss": -25.501670837402344, "global_step": 303575, "epoch": 3657} {"train_loss": -26.042774200439453, "global_step": 303576, "epoch": 3657} {"train_loss": -25.67584800720215, "global_step": 303577, "epoch": 3657} {"train_loss": -25.989538192749023, "global_step": 303578, "epoch": 3657} {"train_loss": -25.556161880493164, "global_step": 303579, "epoch": 3657} {"train_loss": -25.81992530822754, "global_step": 303580, "epoch": 3657} {"train_loss": -25.761808395385742, "global_step": 303581, "epoch": 3657} {"train_loss": -25.6381893157959, "global_step": 303582, "epoch": 3657} {"train_loss": -25.864011764526367, "global_step": 303583, "epoch": 3657} {"train_loss": -25.86561393737793, "global_step": 303584, "epoch": 3657} {"train_loss": -26.094497680664062, "global_step": 303585, "epoch": 3657} {"train_loss": -25.665197372436523, "global_step": 303586, "epoch": 3657} {"train_loss": -25.861591339111328, "global_step": 303587, "epoch": 3657} {"train_loss": -25.571563720703125, "global_step": 303588, "epoch": 3657} {"train_loss": -25.781824111938477, "global_step": 303589, "epoch": 3657} {"train_loss": -25.236242294311523, "global_step": 303590, "epoch": 3657} {"train_loss": -26.206823348999023, "global_step": 303591, "epoch": 3657} {"train_loss": -25.555044174194336, "global_step": 303592, "epoch": 3657} {"train_loss": -25.65523338317871, "global_step": 303593, "epoch": 3657} {"train_loss": -25.503009796142578, "global_step": 303594, "epoch": 3657} {"train_loss": -25.999006271362305, "global_step": 303595, "epoch": 3657} {"train_loss": -25.741262435913086, "global_step": 303596, "epoch": 3657} {"train_loss": -25.399410247802734, "global_step": 303597, "epoch": 3657} {"train_loss": -25.6663818359375, "global_step": 303598, "epoch": 3657} {"train_loss": -25.538501739501953, "global_step": 303599, "epoch": 3657} {"train_loss": -25.70672607421875, "global_step": 303600, "epoch": 3657} {"train_loss": -25.5164794921875, "global_step": 303601, "epoch": 3657} {"train_loss": -25.526294708251953, "global_step": 303602, "epoch": 3657} {"train_loss": -25.63943862915039, "global_step": 303603, "epoch": 3657} {"train_loss": -25.94803810119629, "global_step": 303604, "epoch": 3657} {"train_loss": -26.03033447265625, "global_step": 303605, "epoch": 3657} {"train_loss": -25.53513526916504, "global_step": 303606, "epoch": 3657} {"train_loss": -25.859130859375, "global_step": 303607, "epoch": 3657} {"train_loss": -25.7534122467041, "global_step": 303608, "epoch": 3657} {"train_loss": -25.79377555847168, "global_step": 303609, "epoch": 3657} {"train_loss": -25.68140983581543, "global_step": 303610, "epoch": 3657} {"train_loss": -26.041492462158203, "global_step": 303611, "epoch": 3657} {"train_loss": -25.383630752563477, "global_step": 303612, "epoch": 3657} {"train_loss": -25.586684100599175, "global_step": 303613, "epoch": 3657, "val_loss": 7181193.5} {"train_loss": -25.53461456298828, "global_step": 303614, "epoch": 3658} {"train_loss": -25.00830078125, "global_step": 303615, "epoch": 3658} {"train_loss": -25.25656509399414, "global_step": 303616, "epoch": 3658} {"train_loss": -25.1275691986084, "global_step": 303617, "epoch": 3658} {"train_loss": -25.155654907226562, "global_step": 303618, "epoch": 3658} {"train_loss": -25.346189498901367, "global_step": 303619, "epoch": 3658} {"train_loss": -25.468156814575195, "global_step": 303620, "epoch": 3658} {"train_loss": -25.22137451171875, "global_step": 303621, "epoch": 3658} {"train_loss": -25.348054885864258, "global_step": 303622, "epoch": 3658} {"train_loss": -25.220571517944336, "global_step": 303623, "epoch": 3658} {"train_loss": -25.451215744018555, "global_step": 303624, "epoch": 3658} {"train_loss": -25.79151725769043, "global_step": 303625, "epoch": 3658} {"train_loss": -25.277801513671875, "global_step": 303626, "epoch": 3658} {"train_loss": -25.419490814208984, "global_step": 303627, "epoch": 3658} {"train_loss": -25.300457000732422, "global_step": 303628, "epoch": 3658} {"train_loss": -25.9796199798584, "global_step": 303629, "epoch": 3658} {"train_loss": -25.661523818969727, "global_step": 303630, "epoch": 3658} {"train_loss": -25.199626922607422, "global_step": 303631, "epoch": 3658} {"train_loss": -25.662267684936523, "global_step": 303632, "epoch": 3658} {"train_loss": -25.521474838256836, "global_step": 303633, "epoch": 3658} {"train_loss": -25.185028076171875, "global_step": 303634, "epoch": 3658} {"train_loss": -25.445972442626953, "global_step": 303635, "epoch": 3658} {"train_loss": -25.954914093017578, "global_step": 303636, "epoch": 3658} {"train_loss": -25.442609786987305, "global_step": 303637, "epoch": 3658} {"train_loss": -25.65231704711914, "global_step": 303638, "epoch": 3658} {"train_loss": -25.823627471923828, "global_step": 303639, "epoch": 3658} {"train_loss": -25.66419792175293, "global_step": 303640, "epoch": 3658} {"train_loss": -25.75701904296875, "global_step": 303641, "epoch": 3658} {"train_loss": -25.316862106323242, "global_step": 303642, "epoch": 3658} {"train_loss": -25.57254409790039, "global_step": 303643, "epoch": 3658} {"train_loss": -25.735107421875, "global_step": 303644, "epoch": 3658} {"train_loss": -25.917264938354492, "global_step": 303645, "epoch": 3658} {"train_loss": -25.713531494140625, "global_step": 303646, "epoch": 3658} {"train_loss": -25.775390625, "global_step": 303647, "epoch": 3658} {"train_loss": -25.795751571655273, "global_step": 303648, "epoch": 3658} {"train_loss": -26.122426986694336, "global_step": 303649, "epoch": 3658} {"train_loss": -25.64812660217285, "global_step": 303650, "epoch": 3658} {"train_loss": -25.875030517578125, "global_step": 303651, "epoch": 3658} {"train_loss": -25.68499755859375, "global_step": 303652, "epoch": 3658} {"train_loss": -25.322031021118164, "global_step": 303653, "epoch": 3658} {"train_loss": -25.95949363708496, "global_step": 303654, "epoch": 3658} {"train_loss": -26.10945701599121, "global_step": 303655, "epoch": 3658} {"train_loss": -25.196157455444336, "global_step": 303656, "epoch": 3658} {"train_loss": -25.341501235961914, "global_step": 303657, "epoch": 3658} {"train_loss": -25.498443603515625, "global_step": 303658, "epoch": 3658} {"train_loss": -25.164052963256836, "global_step": 303659, "epoch": 3658} {"train_loss": -25.7794132232666, "global_step": 303660, "epoch": 3658} {"train_loss": -25.750202178955078, "global_step": 303661, "epoch": 3658} {"train_loss": -25.81048583984375, "global_step": 303662, "epoch": 3658} {"train_loss": -25.711353302001953, "global_step": 303663, "epoch": 3658} {"train_loss": -25.678634643554688, "global_step": 303664, "epoch": 3658} {"train_loss": -25.55491828918457, "global_step": 303665, "epoch": 3658} {"train_loss": -25.687610626220703, "global_step": 303666, "epoch": 3658} {"train_loss": -25.831998825073242, "global_step": 303667, "epoch": 3658} {"train_loss": -25.8475284576416, "global_step": 303668, "epoch": 3658} {"train_loss": -25.480575561523438, "global_step": 303669, "epoch": 3658} {"train_loss": -25.643131256103516, "global_step": 303670, "epoch": 3658} {"train_loss": -25.569299697875977, "global_step": 303671, "epoch": 3658} {"train_loss": -25.253494262695312, "global_step": 303672, "epoch": 3658} {"train_loss": -25.088674545288086, "global_step": 303673, "epoch": 3658} {"train_loss": -25.859649658203125, "global_step": 303674, "epoch": 3658} {"train_loss": -25.500776290893555, "global_step": 303675, "epoch": 3658} {"train_loss": -25.406646728515625, "global_step": 303676, "epoch": 3658} {"train_loss": -25.70354652404785, "global_step": 303677, "epoch": 3658} {"train_loss": -25.54802894592285, "global_step": 303678, "epoch": 3658} {"train_loss": -25.4145565032959, "global_step": 303679, "epoch": 3658} {"train_loss": -25.55374526977539, "global_step": 303680, "epoch": 3658} {"train_loss": -25.697519302368164, "global_step": 303681, "epoch": 3658} {"train_loss": -25.831003189086914, "global_step": 303682, "epoch": 3658} {"train_loss": -25.847381591796875, "global_step": 303683, "epoch": 3658} {"train_loss": -25.315013885498047, "global_step": 303684, "epoch": 3658} {"train_loss": -25.865209579467773, "global_step": 303685, "epoch": 3658} {"train_loss": -25.891742706298828, "global_step": 303686, "epoch": 3658} {"train_loss": -25.3209228515625, "global_step": 303687, "epoch": 3658} {"train_loss": -26.24806022644043, "global_step": 303688, "epoch": 3658} {"train_loss": -25.4331111907959, "global_step": 303689, "epoch": 3658} {"train_loss": -24.862003326416016, "global_step": 303690, "epoch": 3658} {"train_loss": -25.63368034362793, "global_step": 303691, "epoch": 3658} {"train_loss": -25.594539642333984, "global_step": 303692, "epoch": 3658} {"train_loss": -25.058759689331055, "global_step": 303693, "epoch": 3658} {"train_loss": -25.7725830078125, "global_step": 303694, "epoch": 3658} {"train_loss": -25.720916748046875, "global_step": 303695, "epoch": 3658} {"train_loss": -25.552972402917334, "global_step": 303696, "epoch": 3658, "val_loss": 7255034.0} {"train_loss": -25.56160545349121, "global_step": 303697, "epoch": 3659} {"train_loss": -25.648117065429688, "global_step": 303698, "epoch": 3659} {"train_loss": -25.156957626342773, "global_step": 303699, "epoch": 3659} {"train_loss": -25.611557006835938, "global_step": 303700, "epoch": 3659} {"train_loss": -25.674978256225586, "global_step": 303701, "epoch": 3659} {"train_loss": -25.35573387145996, "global_step": 303702, "epoch": 3659} {"train_loss": -25.705121994018555, "global_step": 303703, "epoch": 3659} {"train_loss": -25.684255599975586, "global_step": 303704, "epoch": 3659} {"train_loss": -25.493362426757812, "global_step": 303705, "epoch": 3659} {"train_loss": -25.72870445251465, "global_step": 303706, "epoch": 3659} {"train_loss": -25.773344039916992, "global_step": 303707, "epoch": 3659} {"train_loss": -25.191980361938477, "global_step": 303708, "epoch": 3659} {"train_loss": -25.598302841186523, "global_step": 303709, "epoch": 3659} {"train_loss": -25.329086303710938, "global_step": 303710, "epoch": 3659} {"train_loss": -25.253890991210938, "global_step": 303711, "epoch": 3659} {"train_loss": -25.438077926635742, "global_step": 303712, "epoch": 3659} {"train_loss": -25.745441436767578, "global_step": 303713, "epoch": 3659} {"train_loss": -25.673215866088867, "global_step": 303714, "epoch": 3659} {"train_loss": -25.688827514648438, "global_step": 303715, "epoch": 3659} {"train_loss": -25.752466201782227, "global_step": 303716, "epoch": 3659} {"train_loss": -25.477872848510742, "global_step": 303717, "epoch": 3659} {"train_loss": -25.695728302001953, "global_step": 303718, "epoch": 3659} {"train_loss": -25.651838302612305, "global_step": 303719, "epoch": 3659} {"train_loss": -25.465152740478516, "global_step": 303720, "epoch": 3659} {"train_loss": -25.666101455688477, "global_step": 303721, "epoch": 3659} {"train_loss": -25.89479637145996, "global_step": 303722, "epoch": 3659} {"train_loss": -25.68277359008789, "global_step": 303723, "epoch": 3659} {"train_loss": -25.581079483032227, "global_step": 303724, "epoch": 3659} {"train_loss": -25.877552032470703, "global_step": 303725, "epoch": 3659} {"train_loss": -25.641586303710938, "global_step": 303726, "epoch": 3659} {"train_loss": -25.79715919494629, "global_step": 303727, "epoch": 3659} {"train_loss": -25.986133575439453, "global_step": 303728, "epoch": 3659} {"train_loss": -25.97612953186035, "global_step": 303729, "epoch": 3659} {"train_loss": -25.713632583618164, "global_step": 303730, "epoch": 3659} {"train_loss": -25.642414093017578, "global_step": 303731, "epoch": 3659} {"train_loss": -25.89463233947754, "global_step": 303732, "epoch": 3659} {"train_loss": -25.858642578125, "global_step": 303733, "epoch": 3659} {"train_loss": -25.84575843811035, "global_step": 303734, "epoch": 3659} {"train_loss": -25.467634201049805, "global_step": 303735, "epoch": 3659} {"train_loss": -25.6322021484375, "global_step": 303736, "epoch": 3659} {"train_loss": -25.81585121154785, "global_step": 303737, "epoch": 3659} {"train_loss": -25.9934139251709, "global_step": 303738, "epoch": 3659} {"train_loss": -25.880130767822266, "global_step": 303739, "epoch": 3659} {"train_loss": -25.546186447143555, "global_step": 303740, "epoch": 3659} {"train_loss": -25.7308406829834, "global_step": 303741, "epoch": 3659} {"train_loss": -25.81941032409668, "global_step": 303742, "epoch": 3659} {"train_loss": -25.304433822631836, "global_step": 303743, "epoch": 3659} {"train_loss": -25.942914962768555, "global_step": 303744, "epoch": 3659} {"train_loss": -25.59726333618164, "global_step": 303745, "epoch": 3659} {"train_loss": -25.69978141784668, "global_step": 303746, "epoch": 3659} {"train_loss": -25.888059616088867, "global_step": 303747, "epoch": 3659} {"train_loss": -26.060144424438477, "global_step": 303748, "epoch": 3659} {"train_loss": -25.719385147094727, "global_step": 303749, "epoch": 3659} {"train_loss": -26.0512638092041, "global_step": 303750, "epoch": 3659} {"train_loss": -25.758625030517578, "global_step": 303751, "epoch": 3659} {"train_loss": -25.401477813720703, "global_step": 303752, "epoch": 3659} {"train_loss": -25.78243064880371, "global_step": 303753, "epoch": 3659} {"train_loss": -25.634326934814453, "global_step": 303754, "epoch": 3659} {"train_loss": -25.53667449951172, "global_step": 303755, "epoch": 3659} {"train_loss": -25.668928146362305, "global_step": 303756, "epoch": 3659} {"train_loss": -25.601728439331055, "global_step": 303757, "epoch": 3659} {"train_loss": -26.14324378967285, "global_step": 303758, "epoch": 3659} {"train_loss": -25.682764053344727, "global_step": 303759, "epoch": 3659} {"train_loss": -26.147748947143555, "global_step": 303760, "epoch": 3659} {"train_loss": -26.13563346862793, "global_step": 303761, "epoch": 3659} {"train_loss": -25.73365592956543, "global_step": 303762, "epoch": 3659} {"train_loss": -25.597902297973633, "global_step": 303763, "epoch": 3659} {"train_loss": -25.789642333984375, "global_step": 303764, "epoch": 3659} {"train_loss": -25.677831649780273, "global_step": 303765, "epoch": 3659} {"train_loss": -25.77430534362793, "global_step": 303766, "epoch": 3659} {"train_loss": -25.47083854675293, "global_step": 303767, "epoch": 3659} {"train_loss": -25.537199020385742, "global_step": 303768, "epoch": 3659} {"train_loss": -25.75941276550293, "global_step": 303769, "epoch": 3659} {"train_loss": -25.54656219482422, "global_step": 303770, "epoch": 3659} {"train_loss": -25.826704025268555, "global_step": 303771, "epoch": 3659} {"train_loss": -25.143028259277344, "global_step": 303772, "epoch": 3659} {"train_loss": -25.497344970703125, "global_step": 303773, "epoch": 3659} {"train_loss": -25.51593017578125, "global_step": 303774, "epoch": 3659} {"train_loss": -25.38777732849121, "global_step": 303775, "epoch": 3659} {"train_loss": -25.482654571533203, "global_step": 303776, "epoch": 3659} {"train_loss": -25.69654655456543, "global_step": 303777, "epoch": 3659} {"train_loss": -25.826583862304688, "global_step": 303778, "epoch": 3659} {"train_loss": -25.680904526308357, "global_step": 303779, "epoch": 3659, "val_loss": 7126467.0} {"train_loss": -24.776443481445312, "global_step": 303780, "epoch": 3660} {"train_loss": -24.384801864624023, "global_step": 303781, "epoch": 3660} {"train_loss": -25.57335090637207, "global_step": 303782, "epoch": 3660} {"train_loss": -24.846511840820312, "global_step": 303783, "epoch": 3660} {"train_loss": -24.58387565612793, "global_step": 303784, "epoch": 3660} {"train_loss": -25.19585609436035, "global_step": 303785, "epoch": 3660} {"train_loss": -24.642847061157227, "global_step": 303786, "epoch": 3660} {"train_loss": -25.284238815307617, "global_step": 303787, "epoch": 3660} {"train_loss": -25.144346237182617, "global_step": 303788, "epoch": 3660} {"train_loss": -25.00617027282715, "global_step": 303789, "epoch": 3660} {"train_loss": -25.096479415893555, "global_step": 303790, "epoch": 3660} {"train_loss": -25.24874496459961, "global_step": 303791, "epoch": 3660} {"train_loss": -24.981237411499023, "global_step": 303792, "epoch": 3660} {"train_loss": -25.28900909423828, "global_step": 303793, "epoch": 3660} {"train_loss": -24.859304428100586, "global_step": 303794, "epoch": 3660} {"train_loss": -25.043392181396484, "global_step": 303795, "epoch": 3660} {"train_loss": -25.329504013061523, "global_step": 303796, "epoch": 3660} {"train_loss": -25.187070846557617, "global_step": 303797, "epoch": 3660} {"train_loss": -25.373701095581055, "global_step": 303798, "epoch": 3660} {"train_loss": -25.317256927490234, "global_step": 303799, "epoch": 3660} {"train_loss": -25.57422637939453, "global_step": 303800, "epoch": 3660} {"train_loss": -25.547849655151367, "global_step": 303801, "epoch": 3660} {"train_loss": -25.46052360534668, "global_step": 303802, "epoch": 3660} {"train_loss": -25.344654083251953, "global_step": 303803, "epoch": 3660} {"train_loss": -25.247392654418945, "global_step": 303804, "epoch": 3660} {"train_loss": -25.72216796875, "global_step": 303805, "epoch": 3660} {"train_loss": -25.78072166442871, "global_step": 303806, "epoch": 3660} {"train_loss": -25.605121612548828, "global_step": 303807, "epoch": 3660} {"train_loss": -25.526105880737305, "global_step": 303808, "epoch": 3660} {"train_loss": -25.835376739501953, "global_step": 303809, "epoch": 3660} {"train_loss": -25.240644454956055, "global_step": 303810, "epoch": 3660} {"train_loss": -25.676599502563477, "global_step": 303811, "epoch": 3660} {"train_loss": -25.710447311401367, "global_step": 303812, "epoch": 3660} {"train_loss": -25.523527145385742, "global_step": 303813, "epoch": 3660} {"train_loss": -25.6525936126709, "global_step": 303814, "epoch": 3660} {"train_loss": -25.780548095703125, "global_step": 303815, "epoch": 3660} {"train_loss": -25.47021484375, "global_step": 303816, "epoch": 3660} {"train_loss": -25.740203857421875, "global_step": 303817, "epoch": 3660} {"train_loss": -25.97722816467285, "global_step": 303818, "epoch": 3660} {"train_loss": -25.7124080657959, "global_step": 303819, "epoch": 3660} {"train_loss": -25.762372970581055, "global_step": 303820, "epoch": 3660} {"train_loss": -26.030370712280273, "global_step": 303821, "epoch": 3660} {"train_loss": -25.825773239135742, "global_step": 303822, "epoch": 3660} {"train_loss": -25.871545791625977, "global_step": 303823, "epoch": 3660} {"train_loss": -26.095996856689453, "global_step": 303824, "epoch": 3660} {"train_loss": -25.7979793548584, "global_step": 303825, "epoch": 3660} {"train_loss": -26.04387855529785, "global_step": 303826, "epoch": 3660} {"train_loss": -25.50412940979004, "global_step": 303827, "epoch": 3660} {"train_loss": -25.7874755859375, "global_step": 303828, "epoch": 3660} {"train_loss": -25.960546493530273, "global_step": 303829, "epoch": 3660} {"train_loss": -25.954389572143555, "global_step": 303830, "epoch": 3660} {"train_loss": -25.88953971862793, "global_step": 303831, "epoch": 3660} {"train_loss": -25.757949829101562, "global_step": 303832, "epoch": 3660} {"train_loss": -25.499330520629883, "global_step": 303833, "epoch": 3660} {"train_loss": -25.951465606689453, "global_step": 303834, "epoch": 3660} {"train_loss": -25.830280303955078, "global_step": 303835, "epoch": 3660} {"train_loss": -25.884021759033203, "global_step": 303836, "epoch": 3660} {"train_loss": -25.92286491394043, "global_step": 303837, "epoch": 3660} {"train_loss": -25.8057918548584, "global_step": 303838, "epoch": 3660} {"train_loss": -25.989826202392578, "global_step": 303839, "epoch": 3660} {"train_loss": -25.446474075317383, "global_step": 303840, "epoch": 3660} {"train_loss": -26.313573837280273, "global_step": 303841, "epoch": 3660} {"train_loss": -25.9867000579834, "global_step": 303842, "epoch": 3660} {"train_loss": -25.564193725585938, "global_step": 303843, "epoch": 3660} {"train_loss": -25.24859046936035, "global_step": 303844, "epoch": 3660} {"train_loss": -25.36287498474121, "global_step": 303845, "epoch": 3660} {"train_loss": -25.54728126525879, "global_step": 303846, "epoch": 3660} {"train_loss": -25.597211837768555, "global_step": 303847, "epoch": 3660} {"train_loss": -25.50703239440918, "global_step": 303848, "epoch": 3660} {"train_loss": -25.644607543945312, "global_step": 303849, "epoch": 3660} {"train_loss": -25.02423095703125, "global_step": 303850, "epoch": 3660} {"train_loss": -25.2930908203125, "global_step": 303851, "epoch": 3660} {"train_loss": -25.813756942749023, "global_step": 303852, "epoch": 3660} {"train_loss": -25.361404418945312, "global_step": 303853, "epoch": 3660} {"train_loss": -25.462610244750977, "global_step": 303854, "epoch": 3660} {"train_loss": -25.574193954467773, "global_step": 303855, "epoch": 3660} {"train_loss": -25.586841583251953, "global_step": 303856, "epoch": 3660} {"train_loss": -25.533843994140625, "global_step": 303857, "epoch": 3660} {"train_loss": -25.16107940673828, "global_step": 303858, "epoch": 3660} {"train_loss": -25.418670654296875, "global_step": 303859, "epoch": 3660} {"train_loss": -25.591144561767578, "global_step": 303860, "epoch": 3660} {"train_loss": -26.020776748657227, "global_step": 303861, "epoch": 3660} {"train_loss": -25.534893380590233, "global_step": 303862, "epoch": 3660, "val_loss": 7247570.0} {"train_loss": -25.298444747924805, "global_step": 303863, "epoch": 3661} {"train_loss": -25.22176170349121, "global_step": 303864, "epoch": 3661} {"train_loss": -25.287874221801758, "global_step": 303865, "epoch": 3661} {"train_loss": -25.144811630249023, "global_step": 303866, "epoch": 3661} {"train_loss": -25.387598037719727, "global_step": 303867, "epoch": 3661} {"train_loss": -25.345169067382812, "global_step": 303868, "epoch": 3661} {"train_loss": -25.125532150268555, "global_step": 303869, "epoch": 3661} {"train_loss": -25.7631778717041, "global_step": 303870, "epoch": 3661} {"train_loss": -25.17767906188965, "global_step": 303871, "epoch": 3661} {"train_loss": -25.592330932617188, "global_step": 303872, "epoch": 3661} {"train_loss": -25.31107521057129, "global_step": 303873, "epoch": 3661} {"train_loss": -25.63457679748535, "global_step": 303874, "epoch": 3661} {"train_loss": -25.159265518188477, "global_step": 303875, "epoch": 3661} {"train_loss": -25.393253326416016, "global_step": 303876, "epoch": 3661} {"train_loss": -25.653797149658203, "global_step": 303877, "epoch": 3661} {"train_loss": -25.318506240844727, "global_step": 303878, "epoch": 3661} {"train_loss": -25.375255584716797, "global_step": 303879, "epoch": 3661} {"train_loss": -25.85546875, "global_step": 303880, "epoch": 3661} {"train_loss": -25.181421279907227, "global_step": 303881, "epoch": 3661} {"train_loss": -25.32870101928711, "global_step": 303882, "epoch": 3661} {"train_loss": -25.88714027404785, "global_step": 303883, "epoch": 3661} {"train_loss": -26.023731231689453, "global_step": 303884, "epoch": 3661} {"train_loss": -25.798429489135742, "global_step": 303885, "epoch": 3661} {"train_loss": -25.886123657226562, "global_step": 303886, "epoch": 3661} {"train_loss": -25.464262008666992, "global_step": 303887, "epoch": 3661} {"train_loss": -25.735349655151367, "global_step": 303888, "epoch": 3661} {"train_loss": -25.852909088134766, "global_step": 303889, "epoch": 3661} {"train_loss": -25.670459747314453, "global_step": 303890, "epoch": 3661} {"train_loss": -25.321908950805664, "global_step": 303891, "epoch": 3661} {"train_loss": -25.478376388549805, "global_step": 303892, "epoch": 3661} {"train_loss": -25.57002067565918, "global_step": 303893, "epoch": 3661} {"train_loss": -25.8823299407959, "global_step": 303894, "epoch": 3661} {"train_loss": -25.633926391601562, "global_step": 303895, "epoch": 3661} {"train_loss": -25.418920516967773, "global_step": 303896, "epoch": 3661} {"train_loss": -25.408653259277344, "global_step": 303897, "epoch": 3661} {"train_loss": -25.9646053314209, "global_step": 303898, "epoch": 3661} {"train_loss": -26.130075454711914, "global_step": 303899, "epoch": 3661} {"train_loss": -25.677173614501953, "global_step": 303900, "epoch": 3661} {"train_loss": -25.716379165649414, "global_step": 303901, "epoch": 3661} {"train_loss": -26.019195556640625, "global_step": 303902, "epoch": 3661} {"train_loss": -25.8026065826416, "global_step": 303903, "epoch": 3661} {"train_loss": -25.807682037353516, "global_step": 303904, "epoch": 3661} {"train_loss": -25.932605743408203, "global_step": 303905, "epoch": 3661} {"train_loss": -26.064289093017578, "global_step": 303906, "epoch": 3661} {"train_loss": -25.528776168823242, "global_step": 303907, "epoch": 3661} {"train_loss": -26.09750747680664, "global_step": 303908, "epoch": 3661} {"train_loss": -25.895099639892578, "global_step": 303909, "epoch": 3661} {"train_loss": -25.694730758666992, "global_step": 303910, "epoch": 3661} {"train_loss": -25.886865615844727, "global_step": 303911, "epoch": 3661} {"train_loss": -25.47747802734375, "global_step": 303912, "epoch": 3661} {"train_loss": -25.510656356811523, "global_step": 303913, "epoch": 3661} {"train_loss": -25.44285011291504, "global_step": 303914, "epoch": 3661} {"train_loss": -25.70725440979004, "global_step": 303915, "epoch": 3661} {"train_loss": -25.717294692993164, "global_step": 303916, "epoch": 3661} {"train_loss": -25.673980712890625, "global_step": 303917, "epoch": 3661} {"train_loss": -25.632038116455078, "global_step": 303918, "epoch": 3661} {"train_loss": -25.97102165222168, "global_step": 303919, "epoch": 3661} {"train_loss": -25.930295944213867, "global_step": 303920, "epoch": 3661} {"train_loss": -25.772052764892578, "global_step": 303921, "epoch": 3661} {"train_loss": -25.812063217163086, "global_step": 303922, "epoch": 3661} {"train_loss": -25.9547061920166, "global_step": 303923, "epoch": 3661} {"train_loss": -25.894540786743164, "global_step": 303924, "epoch": 3661} {"train_loss": -26.068403244018555, "global_step": 303925, "epoch": 3661} {"train_loss": -25.755640029907227, "global_step": 303926, "epoch": 3661} {"train_loss": -25.717126846313477, "global_step": 303927, "epoch": 3661} {"train_loss": -25.506765365600586, "global_step": 303928, "epoch": 3661} {"train_loss": -26.026220321655273, "global_step": 303929, "epoch": 3661} {"train_loss": -25.9072265625, "global_step": 303930, "epoch": 3661} {"train_loss": -25.580106735229492, "global_step": 303931, "epoch": 3661} {"train_loss": -26.000402450561523, "global_step": 303932, "epoch": 3661} {"train_loss": -25.998029708862305, "global_step": 303933, "epoch": 3661} {"train_loss": -25.433135986328125, "global_step": 303934, "epoch": 3661} {"train_loss": -25.897077560424805, "global_step": 303935, "epoch": 3661} {"train_loss": -25.652517318725586, "global_step": 303936, "epoch": 3661} {"train_loss": -25.44697380065918, "global_step": 303937, "epoch": 3661} {"train_loss": -25.461944580078125, "global_step": 303938, "epoch": 3661} {"train_loss": -25.100500106811523, "global_step": 303939, "epoch": 3661} {"train_loss": -25.620054244995117, "global_step": 303940, "epoch": 3661} {"train_loss": -25.697980880737305, "global_step": 303941, "epoch": 3661} {"train_loss": -24.98263931274414, "global_step": 303942, "epoch": 3661} {"train_loss": -25.1472225189209, "global_step": 303943, "epoch": 3661} {"train_loss": -25.400592803955078, "global_step": 303944, "epoch": 3661} {"train_loss": -25.605932810220374, "global_step": 303945, "epoch": 3661, "val_loss": 7109952.0} {"train_loss": -23.387203216552734, "global_step": 303946, "epoch": 3662} {"train_loss": -25.13423728942871, "global_step": 303947, "epoch": 3662} {"train_loss": -24.32767105102539, "global_step": 303948, "epoch": 3662} {"train_loss": -24.79951286315918, "global_step": 303949, "epoch": 3662} {"train_loss": -24.1625919342041, "global_step": 303950, "epoch": 3662} {"train_loss": -24.4725341796875, "global_step": 303951, "epoch": 3662} {"train_loss": -24.5018253326416, "global_step": 303952, "epoch": 3662} {"train_loss": -24.32831573486328, "global_step": 303953, "epoch": 3662} {"train_loss": -24.473834991455078, "global_step": 303954, "epoch": 3662} {"train_loss": -24.82893943786621, "global_step": 303955, "epoch": 3662} {"train_loss": -24.40673828125, "global_step": 303956, "epoch": 3662} {"train_loss": -24.85029411315918, "global_step": 303957, "epoch": 3662} {"train_loss": -24.31656837463379, "global_step": 303958, "epoch": 3662} {"train_loss": -25.013137817382812, "global_step": 303959, "epoch": 3662} {"train_loss": -25.30449104309082, "global_step": 303960, "epoch": 3662} {"train_loss": -24.861257553100586, "global_step": 303961, "epoch": 3662} {"train_loss": -25.298383712768555, "global_step": 303962, "epoch": 3662} {"train_loss": -24.536113739013672, "global_step": 303963, "epoch": 3662} {"train_loss": -25.06448745727539, "global_step": 303964, "epoch": 3662} {"train_loss": -25.04024314880371, "global_step": 303965, "epoch": 3662} {"train_loss": -25.02131462097168, "global_step": 303966, "epoch": 3662} {"train_loss": -24.86702537536621, "global_step": 303967, "epoch": 3662} {"train_loss": -25.24171257019043, "global_step": 303968, "epoch": 3662} {"train_loss": -24.98476219177246, "global_step": 303969, "epoch": 3662} {"train_loss": -25.152555465698242, "global_step": 303970, "epoch": 3662} {"train_loss": -25.25998878479004, "global_step": 303971, "epoch": 3662} {"train_loss": -24.88702964782715, "global_step": 303972, "epoch": 3662} {"train_loss": -25.239912033081055, "global_step": 303973, "epoch": 3662} {"train_loss": -25.542390823364258, "global_step": 303974, "epoch": 3662} {"train_loss": -25.03421974182129, "global_step": 303975, "epoch": 3662} {"train_loss": -25.488128662109375, "global_step": 303976, "epoch": 3662} {"train_loss": -25.714689254760742, "global_step": 303977, "epoch": 3662} {"train_loss": -24.90425682067871, "global_step": 303978, "epoch": 3662} {"train_loss": -25.125110626220703, "global_step": 303979, "epoch": 3662} {"train_loss": -25.3754940032959, "global_step": 303980, "epoch": 3662} {"train_loss": -25.893390655517578, "global_step": 303981, "epoch": 3662} {"train_loss": -25.46788787841797, "global_step": 303982, "epoch": 3662} {"train_loss": -25.52812957763672, "global_step": 303983, "epoch": 3662} {"train_loss": -25.591825485229492, "global_step": 303984, "epoch": 3662} {"train_loss": -25.479923248291016, "global_step": 303985, "epoch": 3662} {"train_loss": -25.2781925201416, "global_step": 303986, "epoch": 3662} {"train_loss": -25.420019149780273, "global_step": 303987, "epoch": 3662} {"train_loss": -25.46904754638672, "global_step": 303988, "epoch": 3662} {"train_loss": -25.497669219970703, "global_step": 303989, "epoch": 3662} {"train_loss": -25.391944885253906, "global_step": 303990, "epoch": 3662} {"train_loss": -25.813461303710938, "global_step": 303991, "epoch": 3662} {"train_loss": -25.5130615234375, "global_step": 303992, "epoch": 3662} {"train_loss": -25.73541259765625, "global_step": 303993, "epoch": 3662} {"train_loss": -25.38533592224121, "global_step": 303994, "epoch": 3662} {"train_loss": -25.797719955444336, "global_step": 303995, "epoch": 3662} {"train_loss": -26.133869171142578, "global_step": 303996, "epoch": 3662} {"train_loss": -25.607532501220703, "global_step": 303997, "epoch": 3662} {"train_loss": -25.823095321655273, "global_step": 303998, "epoch": 3662} {"train_loss": -26.070819854736328, "global_step": 303999, "epoch": 3662} {"train_loss": -25.774276733398438, "global_step": 304000, "epoch": 3662} {"train_loss": -26.093103408813477, "global_step": 304001, "epoch": 3662} {"train_loss": -25.882965087890625, "global_step": 304002, "epoch": 3662} {"train_loss": -25.844608306884766, "global_step": 304003, "epoch": 3662} {"train_loss": -25.92426872253418, "global_step": 304004, "epoch": 3662} {"train_loss": -25.591398239135742, "global_step": 304005, "epoch": 3662} {"train_loss": -25.860244750976562, "global_step": 304006, "epoch": 3662} {"train_loss": -25.46466064453125, "global_step": 304007, "epoch": 3662} {"train_loss": -25.814868927001953, "global_step": 304008, "epoch": 3662} {"train_loss": -25.493465423583984, "global_step": 304009, "epoch": 3662} {"train_loss": -25.408048629760742, "global_step": 304010, "epoch": 3662} {"train_loss": -25.9574031829834, "global_step": 304011, "epoch": 3662} {"train_loss": -25.950674057006836, "global_step": 304012, "epoch": 3662} {"train_loss": -25.515501022338867, "global_step": 304013, "epoch": 3662} {"train_loss": -25.622098922729492, "global_step": 304014, "epoch": 3662} {"train_loss": -26.025732040405273, "global_step": 304015, "epoch": 3662} {"train_loss": -25.5413875579834, "global_step": 304016, "epoch": 3662} {"train_loss": -25.79373550415039, "global_step": 304017, "epoch": 3662} {"train_loss": -25.280658721923828, "global_step": 304018, "epoch": 3662} {"train_loss": -25.62180519104004, "global_step": 304019, "epoch": 3662} {"train_loss": -25.562490463256836, "global_step": 304020, "epoch": 3662} {"train_loss": -25.97797203063965, "global_step": 304021, "epoch": 3662} {"train_loss": -25.502315521240234, "global_step": 304022, "epoch": 3662} {"train_loss": -25.93317222595215, "global_step": 304023, "epoch": 3662} {"train_loss": -26.129730224609375, "global_step": 304024, "epoch": 3662} {"train_loss": -25.838199615478516, "global_step": 304025, "epoch": 3662} {"train_loss": -26.363037109375, "global_step": 304026, "epoch": 3662} {"train_loss": -25.63538932800293, "global_step": 304027, "epoch": 3662} {"train_loss": -25.355460477162556, "global_step": 304028, "epoch": 3662, "val_loss": 7315066.5} {"train_loss": -24.501428604125977, "global_step": 304029, "epoch": 3663} {"train_loss": -23.803730010986328, "global_step": 304030, "epoch": 3663} {"train_loss": -24.471450805664062, "global_step": 304031, "epoch": 3663} {"train_loss": -24.837278366088867, "global_step": 304032, "epoch": 3663} {"train_loss": -24.897489547729492, "global_step": 304033, "epoch": 3663} {"train_loss": -25.099863052368164, "global_step": 304034, "epoch": 3663} {"train_loss": -25.146286010742188, "global_step": 304035, "epoch": 3663} {"train_loss": -24.976770401000977, "global_step": 304036, "epoch": 3663} {"train_loss": -25.13008689880371, "global_step": 304037, "epoch": 3663} {"train_loss": -25.386295318603516, "global_step": 304038, "epoch": 3663} {"train_loss": -25.210866928100586, "global_step": 304039, "epoch": 3663} {"train_loss": -25.098417282104492, "global_step": 304040, "epoch": 3663} {"train_loss": -25.60382652282715, "global_step": 304041, "epoch": 3663} {"train_loss": -24.948837280273438, "global_step": 304042, "epoch": 3663} {"train_loss": -24.98846435546875, "global_step": 304043, "epoch": 3663} {"train_loss": -25.411100387573242, "global_step": 304044, "epoch": 3663} {"train_loss": -25.323688507080078, "global_step": 304045, "epoch": 3663} {"train_loss": -25.596738815307617, "global_step": 304046, "epoch": 3663} {"train_loss": -25.016340255737305, "global_step": 304047, "epoch": 3663} {"train_loss": -25.312437057495117, "global_step": 304048, "epoch": 3663} {"train_loss": -25.298337936401367, "global_step": 304049, "epoch": 3663} {"train_loss": -25.44941520690918, "global_step": 304050, "epoch": 3663} {"train_loss": -25.084936141967773, "global_step": 304051, "epoch": 3663} {"train_loss": -25.30620765686035, "global_step": 304052, "epoch": 3663} {"train_loss": -25.317508697509766, "global_step": 304053, "epoch": 3663} {"train_loss": -24.989608764648438, "global_step": 304054, "epoch": 3663} {"train_loss": -25.372608184814453, "global_step": 304055, "epoch": 3663} {"train_loss": -25.498550415039062, "global_step": 304056, "epoch": 3663} {"train_loss": -25.522558212280273, "global_step": 304057, "epoch": 3663} {"train_loss": -25.446775436401367, "global_step": 304058, "epoch": 3663} {"train_loss": -25.205839157104492, "global_step": 304059, "epoch": 3663} {"train_loss": -25.714618682861328, "global_step": 304060, "epoch": 3663} {"train_loss": -25.644535064697266, "global_step": 304061, "epoch": 3663} {"train_loss": -25.285879135131836, "global_step": 304062, "epoch": 3663} {"train_loss": -25.455392837524414, "global_step": 304063, "epoch": 3663} {"train_loss": -26.049036026000977, "global_step": 304064, "epoch": 3663} {"train_loss": -25.918991088867188, "global_step": 304065, "epoch": 3663} {"train_loss": -26.22385597229004, "global_step": 304066, "epoch": 3663} {"train_loss": -25.49860191345215, "global_step": 304067, "epoch": 3663} {"train_loss": -26.04140281677246, "global_step": 304068, "epoch": 3663} {"train_loss": -25.680875778198242, "global_step": 304069, "epoch": 3663} {"train_loss": -25.772357940673828, "global_step": 304070, "epoch": 3663} {"train_loss": -25.415443420410156, "global_step": 304071, "epoch": 3663} {"train_loss": -25.320863723754883, "global_step": 304072, "epoch": 3663} {"train_loss": -25.41315269470215, "global_step": 304073, "epoch": 3663} {"train_loss": -25.811269760131836, "global_step": 304074, "epoch": 3663} {"train_loss": -25.90349769592285, "global_step": 304075, "epoch": 3663} {"train_loss": -25.840625762939453, "global_step": 304076, "epoch": 3663} {"train_loss": -25.556699752807617, "global_step": 304077, "epoch": 3663} {"train_loss": -25.57662010192871, "global_step": 304078, "epoch": 3663} {"train_loss": -26.059797286987305, "global_step": 304079, "epoch": 3663} {"train_loss": -25.910425186157227, "global_step": 304080, "epoch": 3663} {"train_loss": -25.655012130737305, "global_step": 304081, "epoch": 3663} {"train_loss": -25.73200798034668, "global_step": 304082, "epoch": 3663} {"train_loss": -25.770200729370117, "global_step": 304083, "epoch": 3663} {"train_loss": -25.39107894897461, "global_step": 304084, "epoch": 3663} {"train_loss": -25.505441665649414, "global_step": 304085, "epoch": 3663} {"train_loss": -25.28099822998047, "global_step": 304086, "epoch": 3663} {"train_loss": -25.675207138061523, "global_step": 304087, "epoch": 3663} {"train_loss": -25.917001724243164, "global_step": 304088, "epoch": 3663} {"train_loss": -25.991546630859375, "global_step": 304089, "epoch": 3663} {"train_loss": -25.616666793823242, "global_step": 304090, "epoch": 3663} {"train_loss": -26.1309814453125, "global_step": 304091, "epoch": 3663} {"train_loss": -25.5300235748291, "global_step": 304092, "epoch": 3663} {"train_loss": -25.715057373046875, "global_step": 304093, "epoch": 3663} {"train_loss": -25.799917221069336, "global_step": 304094, "epoch": 3663} {"train_loss": -25.82508659362793, "global_step": 304095, "epoch": 3663} {"train_loss": -25.95693016052246, "global_step": 304096, "epoch": 3663} {"train_loss": -25.881271362304688, "global_step": 304097, "epoch": 3663} {"train_loss": -25.627460479736328, "global_step": 304098, "epoch": 3663} {"train_loss": -25.557632446289062, "global_step": 304099, "epoch": 3663} {"train_loss": -25.812957763671875, "global_step": 304100, "epoch": 3663} {"train_loss": -25.57594108581543, "global_step": 304101, "epoch": 3663} {"train_loss": -25.765338897705078, "global_step": 304102, "epoch": 3663} {"train_loss": -25.45531463623047, "global_step": 304103, "epoch": 3663} {"train_loss": -25.354877471923828, "global_step": 304104, "epoch": 3663} {"train_loss": -25.564258575439453, "global_step": 304105, "epoch": 3663} {"train_loss": -25.758222579956055, "global_step": 304106, "epoch": 3663} {"train_loss": -25.71479606628418, "global_step": 304107, "epoch": 3663} {"train_loss": -25.9565372467041, "global_step": 304108, "epoch": 3663} {"train_loss": -25.65655517578125, "global_step": 304109, "epoch": 3663} {"train_loss": -25.927799224853516, "global_step": 304110, "epoch": 3663} {"train_loss": -25.49176661939506, "global_step": 304111, "epoch": 3663, "val_loss": 7253121.5} {"train_loss": -24.82521629333496, "global_step": 304112, "epoch": 3664} {"train_loss": -25.115028381347656, "global_step": 304113, "epoch": 3664} {"train_loss": -25.7115421295166, "global_step": 304114, "epoch": 3664} {"train_loss": -25.118667602539062, "global_step": 304115, "epoch": 3664} {"train_loss": -25.36543083190918, "global_step": 304116, "epoch": 3664} {"train_loss": -25.459749221801758, "global_step": 304117, "epoch": 3664} {"train_loss": -24.764677047729492, "global_step": 304118, "epoch": 3664} {"train_loss": -25.442407608032227, "global_step": 304119, "epoch": 3664} {"train_loss": -25.32090187072754, "global_step": 304120, "epoch": 3664} {"train_loss": -25.49412727355957, "global_step": 304121, "epoch": 3664} {"train_loss": -25.31806755065918, "global_step": 304122, "epoch": 3664} {"train_loss": -25.58912467956543, "global_step": 304123, "epoch": 3664} {"train_loss": -25.83832359313965, "global_step": 304124, "epoch": 3664} {"train_loss": -25.67762565612793, "global_step": 304125, "epoch": 3664} {"train_loss": -25.405895233154297, "global_step": 304126, "epoch": 3664} {"train_loss": -25.569753646850586, "global_step": 304127, "epoch": 3664} {"train_loss": -25.711828231811523, "global_step": 304128, "epoch": 3664} {"train_loss": -25.65934181213379, "global_step": 304129, "epoch": 3664} {"train_loss": -25.525455474853516, "global_step": 304130, "epoch": 3664} {"train_loss": -25.443340301513672, "global_step": 304131, "epoch": 3664} {"train_loss": -25.6160888671875, "global_step": 304132, "epoch": 3664} {"train_loss": -25.681726455688477, "global_step": 304133, "epoch": 3664} {"train_loss": -25.74456787109375, "global_step": 304134, "epoch": 3664} {"train_loss": -25.376523971557617, "global_step": 304135, "epoch": 3664} {"train_loss": -25.6976261138916, "global_step": 304136, "epoch": 3664} {"train_loss": -26.169300079345703, "global_step": 304137, "epoch": 3664} {"train_loss": -25.835546493530273, "global_step": 304138, "epoch": 3664} {"train_loss": -25.227643966674805, "global_step": 304139, "epoch": 3664} {"train_loss": -25.73394775390625, "global_step": 304140, "epoch": 3664} {"train_loss": -25.65654945373535, "global_step": 304141, "epoch": 3664} {"train_loss": -25.87106704711914, "global_step": 304142, "epoch": 3664} {"train_loss": -25.869958877563477, "global_step": 304143, "epoch": 3664} {"train_loss": -25.82758140563965, "global_step": 304144, "epoch": 3664} {"train_loss": -25.616931915283203, "global_step": 304145, "epoch": 3664} {"train_loss": -25.817296981811523, "global_step": 304146, "epoch": 3664} {"train_loss": -25.82981300354004, "global_step": 304147, "epoch": 3664} {"train_loss": -25.668867111206055, "global_step": 304148, "epoch": 3664} {"train_loss": -25.633560180664062, "global_step": 304149, "epoch": 3664} {"train_loss": -26.161224365234375, "global_step": 304150, "epoch": 3664} {"train_loss": -25.76698112487793, "global_step": 304151, "epoch": 3664} {"train_loss": -25.831308364868164, "global_step": 304152, "epoch": 3664} {"train_loss": -25.805496215820312, "global_step": 304153, "epoch": 3664} {"train_loss": -25.944717407226562, "global_step": 304154, "epoch": 3664} {"train_loss": -25.7639102935791, "global_step": 304155, "epoch": 3664} {"train_loss": -25.77528190612793, "global_step": 304156, "epoch": 3664} {"train_loss": -25.62640953063965, "global_step": 304157, "epoch": 3664} {"train_loss": -25.68853759765625, "global_step": 304158, "epoch": 3664} {"train_loss": -25.999357223510742, "global_step": 304159, "epoch": 3664} {"train_loss": -25.803943634033203, "global_step": 304160, "epoch": 3664} {"train_loss": -25.901987075805664, "global_step": 304161, "epoch": 3664} {"train_loss": -25.8955135345459, "global_step": 304162, "epoch": 3664} {"train_loss": -25.940168380737305, "global_step": 304163, "epoch": 3664} {"train_loss": -25.522418975830078, "global_step": 304164, "epoch": 3664} {"train_loss": -25.357423782348633, "global_step": 304165, "epoch": 3664} {"train_loss": -25.63027000427246, "global_step": 304166, "epoch": 3664} {"train_loss": -25.959735870361328, "global_step": 304167, "epoch": 3664} {"train_loss": -25.700040817260742, "global_step": 304168, "epoch": 3664} {"train_loss": -25.636510848999023, "global_step": 304169, "epoch": 3664} {"train_loss": -25.22666358947754, "global_step": 304170, "epoch": 3664} {"train_loss": -25.51873207092285, "global_step": 304171, "epoch": 3664} {"train_loss": -25.457304000854492, "global_step": 304172, "epoch": 3664} {"train_loss": -25.900257110595703, "global_step": 304173, "epoch": 3664} {"train_loss": -25.714508056640625, "global_step": 304174, "epoch": 3664} {"train_loss": -25.746723175048828, "global_step": 304175, "epoch": 3664} {"train_loss": -25.51575469970703, "global_step": 304176, "epoch": 3664} {"train_loss": -25.776681900024414, "global_step": 304177, "epoch": 3664} {"train_loss": -25.6656494140625, "global_step": 304178, "epoch": 3664} {"train_loss": -25.8067569732666, "global_step": 304179, "epoch": 3664} {"train_loss": -25.879444122314453, "global_step": 304180, "epoch": 3664} {"train_loss": -25.9100341796875, "global_step": 304181, "epoch": 3664} {"train_loss": -26.037586212158203, "global_step": 304182, "epoch": 3664} {"train_loss": -25.631189346313477, "global_step": 304183, "epoch": 3664} {"train_loss": -25.875274658203125, "global_step": 304184, "epoch": 3664} {"train_loss": -26.04888343811035, "global_step": 304185, "epoch": 3664} {"train_loss": -25.942840576171875, "global_step": 304186, "epoch": 3664} {"train_loss": -26.072296142578125, "global_step": 304187, "epoch": 3664} {"train_loss": -26.1213436126709, "global_step": 304188, "epoch": 3664} {"train_loss": -25.744611740112305, "global_step": 304189, "epoch": 3664} {"train_loss": -25.637250900268555, "global_step": 304190, "epoch": 3664} {"train_loss": -25.609689712524414, "global_step": 304191, "epoch": 3664} {"train_loss": -25.991247177124023, "global_step": 304192, "epoch": 3664} {"train_loss": -25.713653564453125, "global_step": 304193, "epoch": 3664} {"train_loss": -25.67771458913045, "global_step": 304194, "epoch": 3664, "val_loss": 7237700.0} {"train_loss": -25.157251358032227, "global_step": 304195, "epoch": 3665} {"train_loss": -25.4746036529541, "global_step": 304196, "epoch": 3665} {"train_loss": -24.671340942382812, "global_step": 304197, "epoch": 3665} {"train_loss": -23.95655632019043, "global_step": 304198, "epoch": 3665} {"train_loss": -23.83222007751465, "global_step": 304199, "epoch": 3665} {"train_loss": -24.589595794677734, "global_step": 304200, "epoch": 3665} {"train_loss": -24.846454620361328, "global_step": 304201, "epoch": 3665} {"train_loss": -24.652252197265625, "global_step": 304202, "epoch": 3665} {"train_loss": -25.055702209472656, "global_step": 304203, "epoch": 3665} {"train_loss": -25.1734676361084, "global_step": 304204, "epoch": 3665} {"train_loss": -24.32416343688965, "global_step": 304205, "epoch": 3665} {"train_loss": -25.477006912231445, "global_step": 304206, "epoch": 3665} {"train_loss": -24.706396102905273, "global_step": 304207, "epoch": 3665} {"train_loss": -25.629514694213867, "global_step": 304208, "epoch": 3665} {"train_loss": -25.02979850769043, "global_step": 304209, "epoch": 3665} {"train_loss": -25.544370651245117, "global_step": 304210, "epoch": 3665} {"train_loss": -25.02937889099121, "global_step": 304211, "epoch": 3665} {"train_loss": -25.06186294555664, "global_step": 304212, "epoch": 3665} {"train_loss": -25.149948120117188, "global_step": 304213, "epoch": 3665} {"train_loss": -25.369869232177734, "global_step": 304214, "epoch": 3665} {"train_loss": -25.231245040893555, "global_step": 304215, "epoch": 3665} {"train_loss": -25.212881088256836, "global_step": 304216, "epoch": 3665} {"train_loss": -25.53690528869629, "global_step": 304217, "epoch": 3665} {"train_loss": -25.4664249420166, "global_step": 304218, "epoch": 3665} {"train_loss": -25.216611862182617, "global_step": 304219, "epoch": 3665} {"train_loss": -25.788599014282227, "global_step": 304220, "epoch": 3665} {"train_loss": -25.024511337280273, "global_step": 304221, "epoch": 3665} {"train_loss": -25.57098960876465, "global_step": 304222, "epoch": 3665} {"train_loss": -25.794851303100586, "global_step": 304223, "epoch": 3665} {"train_loss": -25.617197036743164, "global_step": 304224, "epoch": 3665} {"train_loss": -25.372535705566406, "global_step": 304225, "epoch": 3665} {"train_loss": -25.529630661010742, "global_step": 304226, "epoch": 3665} {"train_loss": -25.54816436767578, "global_step": 304227, "epoch": 3665} {"train_loss": -25.577102661132812, "global_step": 304228, "epoch": 3665} {"train_loss": -25.4299259185791, "global_step": 304229, "epoch": 3665} {"train_loss": -25.735422134399414, "global_step": 304230, "epoch": 3665} {"train_loss": -26.01826286315918, "global_step": 304231, "epoch": 3665} {"train_loss": -25.58481216430664, "global_step": 304232, "epoch": 3665} {"train_loss": -25.426679611206055, "global_step": 304233, "epoch": 3665} {"train_loss": -25.46359634399414, "global_step": 304234, "epoch": 3665} {"train_loss": -25.789396286010742, "global_step": 304235, "epoch": 3665} {"train_loss": -25.772573471069336, "global_step": 304236, "epoch": 3665} {"train_loss": -26.000843048095703, "global_step": 304237, "epoch": 3665} {"train_loss": -25.659961700439453, "global_step": 304238, "epoch": 3665} {"train_loss": -25.77642822265625, "global_step": 304239, "epoch": 3665} {"train_loss": -25.711267471313477, "global_step": 304240, "epoch": 3665} {"train_loss": -25.642847061157227, "global_step": 304241, "epoch": 3665} {"train_loss": -25.732141494750977, "global_step": 304242, "epoch": 3665} {"train_loss": -25.812149047851562, "global_step": 304243, "epoch": 3665} {"train_loss": -25.809513092041016, "global_step": 304244, "epoch": 3665} {"train_loss": -25.37240982055664, "global_step": 304245, "epoch": 3665} {"train_loss": -26.153579711914062, "global_step": 304246, "epoch": 3665} {"train_loss": -25.80691909790039, "global_step": 304247, "epoch": 3665} {"train_loss": -25.918500900268555, "global_step": 304248, "epoch": 3665} {"train_loss": -25.38800048828125, "global_step": 304249, "epoch": 3665} {"train_loss": -25.8942813873291, "global_step": 304250, "epoch": 3665} {"train_loss": -25.793567657470703, "global_step": 304251, "epoch": 3665} {"train_loss": -25.471975326538086, "global_step": 304252, "epoch": 3665} {"train_loss": -26.332538604736328, "global_step": 304253, "epoch": 3665} {"train_loss": -25.616849899291992, "global_step": 304254, "epoch": 3665} {"train_loss": -25.60895347595215, "global_step": 304255, "epoch": 3665} {"train_loss": -26.03986930847168, "global_step": 304256, "epoch": 3665} {"train_loss": -25.782033920288086, "global_step": 304257, "epoch": 3665} {"train_loss": -25.766448974609375, "global_step": 304258, "epoch": 3665} {"train_loss": -24.96527671813965, "global_step": 304259, "epoch": 3665} {"train_loss": -25.500612258911133, "global_step": 304260, "epoch": 3665} {"train_loss": -25.79693603515625, "global_step": 304261, "epoch": 3665} {"train_loss": -25.698902130126953, "global_step": 304262, "epoch": 3665} {"train_loss": -25.582853317260742, "global_step": 304263, "epoch": 3665} {"train_loss": -25.511695861816406, "global_step": 304264, "epoch": 3665} {"train_loss": -25.49782371520996, "global_step": 304265, "epoch": 3665} {"train_loss": -25.264081954956055, "global_step": 304266, "epoch": 3665} {"train_loss": -25.476633071899414, "global_step": 304267, "epoch": 3665} {"train_loss": -25.747488021850586, "global_step": 304268, "epoch": 3665} {"train_loss": -25.63067054748535, "global_step": 304269, "epoch": 3665} {"train_loss": -25.268823623657227, "global_step": 304270, "epoch": 3665} {"train_loss": -25.887619018554688, "global_step": 304271, "epoch": 3665} {"train_loss": -25.42629623413086, "global_step": 304272, "epoch": 3665} {"train_loss": -25.662805557250977, "global_step": 304273, "epoch": 3665} {"train_loss": -26.12579917907715, "global_step": 304274, "epoch": 3665} {"train_loss": -25.311477661132812, "global_step": 304275, "epoch": 3665} {"train_loss": -25.87799644470215, "global_step": 304276, "epoch": 3665} {"train_loss": -25.451050057468645, "global_step": 304277, "epoch": 3665, "val_loss": 7284469.0} {"train_loss": -25.416181564331055, "global_step": 304278, "epoch": 3666} {"train_loss": -24.836185455322266, "global_step": 304279, "epoch": 3666} {"train_loss": -25.5887451171875, "global_step": 304280, "epoch": 3666} {"train_loss": -25.228620529174805, "global_step": 304281, "epoch": 3666} {"train_loss": -25.173505783081055, "global_step": 304282, "epoch": 3666} {"train_loss": -25.52484703063965, "global_step": 304283, "epoch": 3666} {"train_loss": -25.544071197509766, "global_step": 304284, "epoch": 3666} {"train_loss": -25.515159606933594, "global_step": 304285, "epoch": 3666} {"train_loss": -25.28339958190918, "global_step": 304286, "epoch": 3666} {"train_loss": -25.26392936706543, "global_step": 304287, "epoch": 3666} {"train_loss": -25.294458389282227, "global_step": 304288, "epoch": 3666} {"train_loss": -25.33688735961914, "global_step": 304289, "epoch": 3666} {"train_loss": -25.54315948486328, "global_step": 304290, "epoch": 3666} {"train_loss": -25.81245231628418, "global_step": 304291, "epoch": 3666} {"train_loss": -25.87812614440918, "global_step": 304292, "epoch": 3666} {"train_loss": -25.696508407592773, "global_step": 304293, "epoch": 3666} {"train_loss": -25.805011749267578, "global_step": 304294, "epoch": 3666} {"train_loss": -25.823774337768555, "global_step": 304295, "epoch": 3666} {"train_loss": -25.946569442749023, "global_step": 304296, "epoch": 3666} {"train_loss": -25.6250057220459, "global_step": 304297, "epoch": 3666} {"train_loss": -26.031522750854492, "global_step": 304298, "epoch": 3666} {"train_loss": -25.67755126953125, "global_step": 304299, "epoch": 3666} {"train_loss": -25.791385650634766, "global_step": 304300, "epoch": 3666} {"train_loss": -25.605224609375, "global_step": 304301, "epoch": 3666} {"train_loss": -25.978479385375977, "global_step": 304302, "epoch": 3666} {"train_loss": -25.406932830810547, "global_step": 304303, "epoch": 3666} {"train_loss": -25.607202529907227, "global_step": 304304, "epoch": 3666} {"train_loss": -25.906421661376953, "global_step": 304305, "epoch": 3666} {"train_loss": -25.59894371032715, "global_step": 304306, "epoch": 3666} {"train_loss": -25.703495025634766, "global_step": 304307, "epoch": 3666} {"train_loss": -25.660070419311523, "global_step": 304308, "epoch": 3666} {"train_loss": -25.465240478515625, "global_step": 304309, "epoch": 3666} {"train_loss": -25.622526168823242, "global_step": 304310, "epoch": 3666} {"train_loss": -25.540258407592773, "global_step": 304311, "epoch": 3666} {"train_loss": -25.705612182617188, "global_step": 304312, "epoch": 3666} {"train_loss": -25.436141967773438, "global_step": 304313, "epoch": 3666} {"train_loss": -25.518178939819336, "global_step": 304314, "epoch": 3666} {"train_loss": -25.752368927001953, "global_step": 304315, "epoch": 3666} {"train_loss": -25.876834869384766, "global_step": 304316, "epoch": 3666} {"train_loss": -25.819095611572266, "global_step": 304317, "epoch": 3666} {"train_loss": -25.522035598754883, "global_step": 304318, "epoch": 3666} {"train_loss": -26.04558753967285, "global_step": 304319, "epoch": 3666} {"train_loss": -25.834644317626953, "global_step": 304320, "epoch": 3666} {"train_loss": -25.98052406311035, "global_step": 304321, "epoch": 3666} {"train_loss": -25.7294921875, "global_step": 304322, "epoch": 3666} {"train_loss": -25.59177589416504, "global_step": 304323, "epoch": 3666} {"train_loss": -25.62894630432129, "global_step": 304324, "epoch": 3666} {"train_loss": -25.56119728088379, "global_step": 304325, "epoch": 3666} {"train_loss": -25.846296310424805, "global_step": 304326, "epoch": 3666} {"train_loss": -25.700727462768555, "global_step": 304327, "epoch": 3666} {"train_loss": -25.700098037719727, "global_step": 304328, "epoch": 3666} {"train_loss": -25.747989654541016, "global_step": 304329, "epoch": 3666} {"train_loss": -25.881040573120117, "global_step": 304330, "epoch": 3666} {"train_loss": -25.78006935119629, "global_step": 304331, "epoch": 3666} {"train_loss": -25.56955337524414, "global_step": 304332, "epoch": 3666} {"train_loss": -25.5781307220459, "global_step": 304333, "epoch": 3666} {"train_loss": -25.655048370361328, "global_step": 304334, "epoch": 3666} {"train_loss": -25.852445602416992, "global_step": 304335, "epoch": 3666} {"train_loss": -26.053516387939453, "global_step": 304336, "epoch": 3666} {"train_loss": -25.71119499206543, "global_step": 304337, "epoch": 3666} {"train_loss": -25.87148094177246, "global_step": 304338, "epoch": 3666} {"train_loss": -25.662012100219727, "global_step": 304339, "epoch": 3666} {"train_loss": -25.35386085510254, "global_step": 304340, "epoch": 3666} {"train_loss": -25.709793090820312, "global_step": 304341, "epoch": 3666} {"train_loss": -25.583465576171875, "global_step": 304342, "epoch": 3666} {"train_loss": -25.59734535217285, "global_step": 304343, "epoch": 3666} {"train_loss": -25.854969024658203, "global_step": 304344, "epoch": 3666} {"train_loss": -25.927490234375, "global_step": 304345, "epoch": 3666} {"train_loss": -25.355270385742188, "global_step": 304346, "epoch": 3666} {"train_loss": -25.873416900634766, "global_step": 304347, "epoch": 3666} {"train_loss": -25.388036727905273, "global_step": 304348, "epoch": 3666} {"train_loss": -25.582067489624023, "global_step": 304349, "epoch": 3666} {"train_loss": -26.0649356842041, "global_step": 304350, "epoch": 3666} {"train_loss": -25.501934051513672, "global_step": 304351, "epoch": 3666} {"train_loss": -25.211105346679688, "global_step": 304352, "epoch": 3666} {"train_loss": -25.595792770385742, "global_step": 304353, "epoch": 3666} {"train_loss": -25.58635902404785, "global_step": 304354, "epoch": 3666} {"train_loss": -25.8389949798584, "global_step": 304355, "epoch": 3666} {"train_loss": -25.89592933654785, "global_step": 304356, "epoch": 3666} {"train_loss": -25.686094284057617, "global_step": 304357, "epoch": 3666} {"train_loss": -25.259000778198242, "global_step": 304358, "epoch": 3666} {"train_loss": -25.34767723083496, "global_step": 304359, "epoch": 3666} {"train_loss": -25.628858221582618, "global_step": 304360, "epoch": 3666, "val_loss": 7224576.5} {"train_loss": -25.376073837280273, "global_step": 304361, "epoch": 3667} {"train_loss": -25.40842056274414, "global_step": 304362, "epoch": 3667} {"train_loss": -25.36055564880371, "global_step": 304363, "epoch": 3667} {"train_loss": -25.8278751373291, "global_step": 304364, "epoch": 3667} {"train_loss": -25.407255172729492, "global_step": 304365, "epoch": 3667} {"train_loss": -25.431493759155273, "global_step": 304366, "epoch": 3667} {"train_loss": -25.343997955322266, "global_step": 304367, "epoch": 3667} {"train_loss": -25.3405818939209, "global_step": 304368, "epoch": 3667} {"train_loss": -25.78836441040039, "global_step": 304369, "epoch": 3667} {"train_loss": -25.580366134643555, "global_step": 304370, "epoch": 3667} {"train_loss": -26.038787841796875, "global_step": 304371, "epoch": 3667} {"train_loss": -25.459787368774414, "global_step": 304372, "epoch": 3667} {"train_loss": -25.92156410217285, "global_step": 304373, "epoch": 3667} {"train_loss": -25.814075469970703, "global_step": 304374, "epoch": 3667} {"train_loss": -25.69899559020996, "global_step": 304375, "epoch": 3667} {"train_loss": -25.858463287353516, "global_step": 304376, "epoch": 3667} {"train_loss": -25.729894638061523, "global_step": 304377, "epoch": 3667} {"train_loss": -25.533935546875, "global_step": 304378, "epoch": 3667} {"train_loss": -25.864612579345703, "global_step": 304379, "epoch": 3667} {"train_loss": -25.59571647644043, "global_step": 304380, "epoch": 3667} {"train_loss": -25.805511474609375, "global_step": 304381, "epoch": 3667} {"train_loss": -25.508102416992188, "global_step": 304382, "epoch": 3667} {"train_loss": -25.7221736907959, "global_step": 304383, "epoch": 3667} {"train_loss": -25.754362106323242, "global_step": 304384, "epoch": 3667} {"train_loss": -25.372182846069336, "global_step": 304385, "epoch": 3667} {"train_loss": -25.57569694519043, "global_step": 304386, "epoch": 3667} {"train_loss": -25.566482543945312, "global_step": 304387, "epoch": 3667} {"train_loss": -26.240375518798828, "global_step": 304388, "epoch": 3667} {"train_loss": -25.687149047851562, "global_step": 304389, "epoch": 3667} {"train_loss": -25.533843994140625, "global_step": 304390, "epoch": 3667} {"train_loss": -25.7578067779541, "global_step": 304391, "epoch": 3667} {"train_loss": -25.949813842773438, "global_step": 304392, "epoch": 3667} {"train_loss": -25.63117790222168, "global_step": 304393, "epoch": 3667} {"train_loss": -25.945356369018555, "global_step": 304394, "epoch": 3667} {"train_loss": -25.603391647338867, "global_step": 304395, "epoch": 3667} {"train_loss": -25.69122886657715, "global_step": 304396, "epoch": 3667} {"train_loss": -26.06687355041504, "global_step": 304397, "epoch": 3667} {"train_loss": -25.92730140686035, "global_step": 304398, "epoch": 3667} {"train_loss": -26.109928131103516, "global_step": 304399, "epoch": 3667} {"train_loss": -25.95875358581543, "global_step": 304400, "epoch": 3667} {"train_loss": -25.7585506439209, "global_step": 304401, "epoch": 3667} {"train_loss": -25.843591690063477, "global_step": 304402, "epoch": 3667} {"train_loss": -25.830060958862305, "global_step": 304403, "epoch": 3667} {"train_loss": -25.66912841796875, "global_step": 304404, "epoch": 3667} {"train_loss": -25.600873947143555, "global_step": 304405, "epoch": 3667} {"train_loss": -25.603071212768555, "global_step": 304406, "epoch": 3667} {"train_loss": -25.777713775634766, "global_step": 304407, "epoch": 3667} {"train_loss": -25.3785400390625, "global_step": 304408, "epoch": 3667} {"train_loss": -25.917190551757812, "global_step": 304409, "epoch": 3667} {"train_loss": -25.844623565673828, "global_step": 304410, "epoch": 3667} {"train_loss": -25.55824851989746, "global_step": 304411, "epoch": 3667} {"train_loss": -25.543363571166992, "global_step": 304412, "epoch": 3667} {"train_loss": -25.62395668029785, "global_step": 304413, "epoch": 3667} {"train_loss": -25.83030128479004, "global_step": 304414, "epoch": 3667} {"train_loss": -25.664871215820312, "global_step": 304415, "epoch": 3667} {"train_loss": -25.238197326660156, "global_step": 304416, "epoch": 3667} {"train_loss": -25.071496963500977, "global_step": 304417, "epoch": 3667} {"train_loss": -25.80060386657715, "global_step": 304418, "epoch": 3667} {"train_loss": -25.504730224609375, "global_step": 304419, "epoch": 3667} {"train_loss": -25.539514541625977, "global_step": 304420, "epoch": 3667} {"train_loss": -25.174213409423828, "global_step": 304421, "epoch": 3667} {"train_loss": -25.299657821655273, "global_step": 304422, "epoch": 3667} {"train_loss": -25.772842407226562, "global_step": 304423, "epoch": 3667} {"train_loss": -25.96119499206543, "global_step": 304424, "epoch": 3667} {"train_loss": -25.79290199279785, "global_step": 304425, "epoch": 3667} {"train_loss": -25.876331329345703, "global_step": 304426, "epoch": 3667} {"train_loss": -25.738916397094727, "global_step": 304427, "epoch": 3667} {"train_loss": -25.54528045654297, "global_step": 304428, "epoch": 3667} {"train_loss": -25.800954818725586, "global_step": 304429, "epoch": 3667} {"train_loss": -25.845117568969727, "global_step": 304430, "epoch": 3667} {"train_loss": -25.70745849609375, "global_step": 304431, "epoch": 3667} {"train_loss": -25.979734420776367, "global_step": 304432, "epoch": 3667} {"train_loss": -25.820098876953125, "global_step": 304433, "epoch": 3667} {"train_loss": -25.332073211669922, "global_step": 304434, "epoch": 3667} {"train_loss": -25.938138961791992, "global_step": 304435, "epoch": 3667} {"train_loss": -25.56671714782715, "global_step": 304436, "epoch": 3667} {"train_loss": -25.612756729125977, "global_step": 304437, "epoch": 3667} {"train_loss": -25.782285690307617, "global_step": 304438, "epoch": 3667} {"train_loss": -25.722339630126953, "global_step": 304439, "epoch": 3667} {"train_loss": -25.62650489807129, "global_step": 304440, "epoch": 3667} {"train_loss": -25.762510299682617, "global_step": 304441, "epoch": 3667} {"train_loss": -25.564006805419922, "global_step": 304442, "epoch": 3667} {"train_loss": -25.676095847623895, "global_step": 304443, "epoch": 3667, "val_loss": 7345452.0} {"train_loss": -25.02630043029785, "global_step": 304444, "epoch": 3668} {"train_loss": -25.2071475982666, "global_step": 304445, "epoch": 3668} {"train_loss": -25.449949264526367, "global_step": 304446, "epoch": 3668} {"train_loss": -25.561756134033203, "global_step": 304447, "epoch": 3668} {"train_loss": -25.25050163269043, "global_step": 304448, "epoch": 3668} {"train_loss": -25.119455337524414, "global_step": 304449, "epoch": 3668} {"train_loss": -25.482534408569336, "global_step": 304450, "epoch": 3668} {"train_loss": -25.760324478149414, "global_step": 304451, "epoch": 3668} {"train_loss": -25.199918746948242, "global_step": 304452, "epoch": 3668} {"train_loss": -25.592273712158203, "global_step": 304453, "epoch": 3668} {"train_loss": -25.42841148376465, "global_step": 304454, "epoch": 3668} {"train_loss": -25.644636154174805, "global_step": 304455, "epoch": 3668} {"train_loss": -25.711261749267578, "global_step": 304456, "epoch": 3668} {"train_loss": -25.322057723999023, "global_step": 304457, "epoch": 3668} {"train_loss": -25.757837295532227, "global_step": 304458, "epoch": 3668} {"train_loss": -25.477445602416992, "global_step": 304459, "epoch": 3668} {"train_loss": -25.570266723632812, "global_step": 304460, "epoch": 3668} {"train_loss": -25.864797592163086, "global_step": 304461, "epoch": 3668} {"train_loss": -25.823999404907227, "global_step": 304462, "epoch": 3668} {"train_loss": -25.504871368408203, "global_step": 304463, "epoch": 3668} {"train_loss": -25.843505859375, "global_step": 304464, "epoch": 3668} {"train_loss": -25.742612838745117, "global_step": 304465, "epoch": 3668} {"train_loss": -25.56778335571289, "global_step": 304466, "epoch": 3668} {"train_loss": -25.521581649780273, "global_step": 304467, "epoch": 3668} {"train_loss": -25.74271011352539, "global_step": 304468, "epoch": 3668} {"train_loss": -25.42194175720215, "global_step": 304469, "epoch": 3668} {"train_loss": -25.45228385925293, "global_step": 304470, "epoch": 3668} {"train_loss": -25.1506404876709, "global_step": 304471, "epoch": 3668} {"train_loss": -25.976776123046875, "global_step": 304472, "epoch": 3668} {"train_loss": -25.703384399414062, "global_step": 304473, "epoch": 3668} {"train_loss": -25.702701568603516, "global_step": 304474, "epoch": 3668} {"train_loss": -25.52555274963379, "global_step": 304475, "epoch": 3668} {"train_loss": -25.652252197265625, "global_step": 304476, "epoch": 3668} {"train_loss": -25.360246658325195, "global_step": 304477, "epoch": 3668} {"train_loss": -25.840320587158203, "global_step": 304478, "epoch": 3668} {"train_loss": -25.798725128173828, "global_step": 304479, "epoch": 3668} {"train_loss": -25.64564323425293, "global_step": 304480, "epoch": 3668} {"train_loss": -25.853134155273438, "global_step": 304481, "epoch": 3668} {"train_loss": -25.318334579467773, "global_step": 304482, "epoch": 3668} {"train_loss": -25.740966796875, "global_step": 304483, "epoch": 3668} {"train_loss": -25.5494441986084, "global_step": 304484, "epoch": 3668} {"train_loss": -25.7855167388916, "global_step": 304485, "epoch": 3668} {"train_loss": -25.660919189453125, "global_step": 304486, "epoch": 3668} {"train_loss": -25.8748722076416, "global_step": 304487, "epoch": 3668} {"train_loss": -25.929235458374023, "global_step": 304488, "epoch": 3668} {"train_loss": -25.609018325805664, "global_step": 304489, "epoch": 3668} {"train_loss": -25.581090927124023, "global_step": 304490, "epoch": 3668} {"train_loss": -26.086734771728516, "global_step": 304491, "epoch": 3668} {"train_loss": -25.79584312438965, "global_step": 304492, "epoch": 3668} {"train_loss": -26.077747344970703, "global_step": 304493, "epoch": 3668} {"train_loss": -25.907087326049805, "global_step": 304494, "epoch": 3668} {"train_loss": -25.99298095703125, "global_step": 304495, "epoch": 3668} {"train_loss": -25.803943634033203, "global_step": 304496, "epoch": 3668} {"train_loss": -25.966665267944336, "global_step": 304497, "epoch": 3668} {"train_loss": -25.94183921813965, "global_step": 304498, "epoch": 3668} {"train_loss": -26.028440475463867, "global_step": 304499, "epoch": 3668} {"train_loss": -26.099889755249023, "global_step": 304500, "epoch": 3668} {"train_loss": -25.693439483642578, "global_step": 304501, "epoch": 3668} {"train_loss": -26.11712646484375, "global_step": 304502, "epoch": 3668} {"train_loss": -26.043745040893555, "global_step": 304503, "epoch": 3668} {"train_loss": -25.78779411315918, "global_step": 304504, "epoch": 3668} {"train_loss": -26.022357940673828, "global_step": 304505, "epoch": 3668} {"train_loss": -25.44294548034668, "global_step": 304506, "epoch": 3668} {"train_loss": -25.291732788085938, "global_step": 304507, "epoch": 3668} {"train_loss": -24.415735244750977, "global_step": 304508, "epoch": 3668} {"train_loss": -22.9501953125, "global_step": 304509, "epoch": 3668} {"train_loss": -23.974103927612305, "global_step": 304510, "epoch": 3668} {"train_loss": -24.237483978271484, "global_step": 304511, "epoch": 3668} {"train_loss": -25.14568328857422, "global_step": 304512, "epoch": 3668} {"train_loss": -24.176706314086914, "global_step": 304513, "epoch": 3668} {"train_loss": -25.203327178955078, "global_step": 304514, "epoch": 3668} {"train_loss": -24.821557998657227, "global_step": 304515, "epoch": 3668} {"train_loss": -24.948379516601562, "global_step": 304516, "epoch": 3668} {"train_loss": -25.149154663085938, "global_step": 304517, "epoch": 3668} {"train_loss": -24.734018325805664, "global_step": 304518, "epoch": 3668} {"train_loss": -25.101831436157227, "global_step": 304519, "epoch": 3668} {"train_loss": -25.553274154663086, "global_step": 304520, "epoch": 3668} {"train_loss": -24.559093475341797, "global_step": 304521, "epoch": 3668} {"train_loss": -25.62384605407715, "global_step": 304522, "epoch": 3668} {"train_loss": -25.159704208374023, "global_step": 304523, "epoch": 3668} {"train_loss": -25.35552215576172, "global_step": 304524, "epoch": 3668} {"train_loss": -25.41876220703125, "global_step": 304525, "epoch": 3668} {"train_loss": -25.479986052915276, "global_step": 304526, "epoch": 3668, "val_loss": 7190203.5} {"train_loss": -25.212326049804688, "global_step": 304527, "epoch": 3669} {"train_loss": -25.131328582763672, "global_step": 304528, "epoch": 3669} {"train_loss": -24.827817916870117, "global_step": 304529, "epoch": 3669} {"train_loss": -24.887075424194336, "global_step": 304530, "epoch": 3669} {"train_loss": -25.31869888305664, "global_step": 304531, "epoch": 3669} {"train_loss": -24.84417152404785, "global_step": 304532, "epoch": 3669} {"train_loss": -25.09848403930664, "global_step": 304533, "epoch": 3669} {"train_loss": -24.9321231842041, "global_step": 304534, "epoch": 3669} {"train_loss": -25.190427780151367, "global_step": 304535, "epoch": 3669} {"train_loss": -25.089956283569336, "global_step": 304536, "epoch": 3669} {"train_loss": -25.646570205688477, "global_step": 304537, "epoch": 3669} {"train_loss": -25.41632652282715, "global_step": 304538, "epoch": 3669} {"train_loss": -25.353090286254883, "global_step": 304539, "epoch": 3669} {"train_loss": -25.36305809020996, "global_step": 304540, "epoch": 3669} {"train_loss": -25.24271011352539, "global_step": 304541, "epoch": 3669} {"train_loss": -25.694990158081055, "global_step": 304542, "epoch": 3669} {"train_loss": -25.375537872314453, "global_step": 304543, "epoch": 3669} {"train_loss": -25.303640365600586, "global_step": 304544, "epoch": 3669} {"train_loss": -25.5965633392334, "global_step": 304545, "epoch": 3669} {"train_loss": -25.63992691040039, "global_step": 304546, "epoch": 3669} {"train_loss": -25.43897819519043, "global_step": 304547, "epoch": 3669} {"train_loss": -25.857694625854492, "global_step": 304548, "epoch": 3669} {"train_loss": -25.485820770263672, "global_step": 304549, "epoch": 3669} {"train_loss": -25.84856605529785, "global_step": 304550, "epoch": 3669} {"train_loss": -25.962615966796875, "global_step": 304551, "epoch": 3669} {"train_loss": -25.63345718383789, "global_step": 304552, "epoch": 3669} {"train_loss": -25.824588775634766, "global_step": 304553, "epoch": 3669} {"train_loss": -25.830204010009766, "global_step": 304554, "epoch": 3669} {"train_loss": -25.830280303955078, "global_step": 304555, "epoch": 3669} {"train_loss": -25.69256019592285, "global_step": 304556, "epoch": 3669} {"train_loss": -25.658349990844727, "global_step": 304557, "epoch": 3669} {"train_loss": -25.72784423828125, "global_step": 304558, "epoch": 3669} {"train_loss": -25.880971908569336, "global_step": 304559, "epoch": 3669} {"train_loss": -25.575117111206055, "global_step": 304560, "epoch": 3669} {"train_loss": -25.723636627197266, "global_step": 304561, "epoch": 3669} {"train_loss": -25.359479904174805, "global_step": 304562, "epoch": 3669} {"train_loss": -26.082300186157227, "global_step": 304563, "epoch": 3669} {"train_loss": -25.67329216003418, "global_step": 304564, "epoch": 3669} {"train_loss": -25.640365600585938, "global_step": 304565, "epoch": 3669} {"train_loss": -25.780393600463867, "global_step": 304566, "epoch": 3669} {"train_loss": -25.588151931762695, "global_step": 304567, "epoch": 3669} {"train_loss": -25.90928077697754, "global_step": 304568, "epoch": 3669} {"train_loss": -25.970993041992188, "global_step": 304569, "epoch": 3669} {"train_loss": -25.674579620361328, "global_step": 304570, "epoch": 3669} {"train_loss": -25.351987838745117, "global_step": 304571, "epoch": 3669} {"train_loss": -25.556373596191406, "global_step": 304572, "epoch": 3669} {"train_loss": -25.6058406829834, "global_step": 304573, "epoch": 3669} {"train_loss": -25.77736473083496, "global_step": 304574, "epoch": 3669} {"train_loss": -25.894872665405273, "global_step": 304575, "epoch": 3669} {"train_loss": -25.603940963745117, "global_step": 304576, "epoch": 3669} {"train_loss": -25.40431785583496, "global_step": 304577, "epoch": 3669} {"train_loss": -25.763647079467773, "global_step": 304578, "epoch": 3669} {"train_loss": -25.474088668823242, "global_step": 304579, "epoch": 3669} {"train_loss": -25.705570220947266, "global_step": 304580, "epoch": 3669} {"train_loss": -25.17586326599121, "global_step": 304581, "epoch": 3669} {"train_loss": -25.9222469329834, "global_step": 304582, "epoch": 3669} {"train_loss": -25.683944702148438, "global_step": 304583, "epoch": 3669} {"train_loss": -25.7353572845459, "global_step": 304584, "epoch": 3669} {"train_loss": -25.482629776000977, "global_step": 304585, "epoch": 3669} {"train_loss": -25.615177154541016, "global_step": 304586, "epoch": 3669} {"train_loss": -25.88294792175293, "global_step": 304587, "epoch": 3669} {"train_loss": -25.771020889282227, "global_step": 304588, "epoch": 3669} {"train_loss": -25.888141632080078, "global_step": 304589, "epoch": 3669} {"train_loss": -25.74342918395996, "global_step": 304590, "epoch": 3669} {"train_loss": -25.583660125732422, "global_step": 304591, "epoch": 3669} {"train_loss": -25.70962905883789, "global_step": 304592, "epoch": 3669} {"train_loss": -25.275068283081055, "global_step": 304593, "epoch": 3669} {"train_loss": -25.503324508666992, "global_step": 304594, "epoch": 3669} {"train_loss": -25.6564884185791, "global_step": 304595, "epoch": 3669} {"train_loss": -25.76076316833496, "global_step": 304596, "epoch": 3669} {"train_loss": -25.888904571533203, "global_step": 304597, "epoch": 3669} {"train_loss": -25.643198013305664, "global_step": 304598, "epoch": 3669} {"train_loss": -25.883005142211914, "global_step": 304599, "epoch": 3669} {"train_loss": -25.666128158569336, "global_step": 304600, "epoch": 3669} {"train_loss": -25.7337646484375, "global_step": 304601, "epoch": 3669} {"train_loss": -25.778369903564453, "global_step": 304602, "epoch": 3669} {"train_loss": -25.804792404174805, "global_step": 304603, "epoch": 3669} {"train_loss": -25.927846908569336, "global_step": 304604, "epoch": 3669} {"train_loss": -25.921850204467773, "global_step": 304605, "epoch": 3669} {"train_loss": -25.97828483581543, "global_step": 304606, "epoch": 3669} {"train_loss": -25.455623626708984, "global_step": 304607, "epoch": 3669} {"train_loss": -25.718841552734375, "global_step": 304608, "epoch": 3669} {"train_loss": -25.587251915989153, "global_step": 304609, "epoch": 3669, "val_loss": 7166329.5} {"train_loss": -24.80125617980957, "global_step": 304610, "epoch": 3670} {"train_loss": -24.220788955688477, "global_step": 304611, "epoch": 3670} {"train_loss": -25.10453224182129, "global_step": 304612, "epoch": 3670} {"train_loss": -25.526805877685547, "global_step": 304613, "epoch": 3670} {"train_loss": -25.034366607666016, "global_step": 304614, "epoch": 3670} {"train_loss": -25.433385848999023, "global_step": 304615, "epoch": 3670} {"train_loss": -25.165159225463867, "global_step": 304616, "epoch": 3670} {"train_loss": -24.848630905151367, "global_step": 304617, "epoch": 3670} {"train_loss": -24.892131805419922, "global_step": 304618, "epoch": 3670} {"train_loss": -25.3994083404541, "global_step": 304619, "epoch": 3670} {"train_loss": -25.708311080932617, "global_step": 304620, "epoch": 3670} {"train_loss": -25.40384864807129, "global_step": 304621, "epoch": 3670} {"train_loss": -25.380014419555664, "global_step": 304622, "epoch": 3670} {"train_loss": -25.43590545654297, "global_step": 304623, "epoch": 3670} {"train_loss": -25.503068923950195, "global_step": 304624, "epoch": 3670} {"train_loss": -25.66241455078125, "global_step": 304625, "epoch": 3670} {"train_loss": -25.612390518188477, "global_step": 304626, "epoch": 3670} {"train_loss": -25.67762565612793, "global_step": 304627, "epoch": 3670} {"train_loss": -25.91021156311035, "global_step": 304628, "epoch": 3670} {"train_loss": -25.662927627563477, "global_step": 304629, "epoch": 3670} {"train_loss": -25.53253936767578, "global_step": 304630, "epoch": 3670} {"train_loss": -25.482961654663086, "global_step": 304631, "epoch": 3670} {"train_loss": -25.70025062561035, "global_step": 304632, "epoch": 3670} {"train_loss": -25.76946449279785, "global_step": 304633, "epoch": 3670} {"train_loss": -25.548969268798828, "global_step": 304634, "epoch": 3670} {"train_loss": -25.656103134155273, "global_step": 304635, "epoch": 3670} {"train_loss": -25.672183990478516, "global_step": 304636, "epoch": 3670} {"train_loss": -25.345300674438477, "global_step": 304637, "epoch": 3670} {"train_loss": -25.45222282409668, "global_step": 304638, "epoch": 3670} {"train_loss": -25.351476669311523, "global_step": 304639, "epoch": 3670} {"train_loss": -25.6792049407959, "global_step": 304640, "epoch": 3670} {"train_loss": -25.542255401611328, "global_step": 304641, "epoch": 3670} {"train_loss": -25.360681533813477, "global_step": 304642, "epoch": 3670} {"train_loss": -26.058185577392578, "global_step": 304643, "epoch": 3670} {"train_loss": -25.886960983276367, "global_step": 304644, "epoch": 3670} {"train_loss": -25.96689224243164, "global_step": 304645, "epoch": 3670} {"train_loss": -25.544904708862305, "global_step": 304646, "epoch": 3670} {"train_loss": -25.97871971130371, "global_step": 304647, "epoch": 3670} {"train_loss": -25.752126693725586, "global_step": 304648, "epoch": 3670} {"train_loss": -25.554000854492188, "global_step": 304649, "epoch": 3670} {"train_loss": -25.529449462890625, "global_step": 304650, "epoch": 3670} {"train_loss": -25.965717315673828, "global_step": 304651, "epoch": 3670} {"train_loss": -25.86991310119629, "global_step": 304652, "epoch": 3670} {"train_loss": -26.15203857421875, "global_step": 304653, "epoch": 3670} {"train_loss": -25.6195068359375, "global_step": 304654, "epoch": 3670} {"train_loss": -25.95859718322754, "global_step": 304655, "epoch": 3670} {"train_loss": -26.089078903198242, "global_step": 304656, "epoch": 3670} {"train_loss": -25.865652084350586, "global_step": 304657, "epoch": 3670} {"train_loss": -25.807815551757812, "global_step": 304658, "epoch": 3670} {"train_loss": -25.763456344604492, "global_step": 304659, "epoch": 3670} {"train_loss": -25.644567489624023, "global_step": 304660, "epoch": 3670} {"train_loss": -25.787153244018555, "global_step": 304661, "epoch": 3670} {"train_loss": -25.524328231811523, "global_step": 304662, "epoch": 3670} {"train_loss": -25.973785400390625, "global_step": 304663, "epoch": 3670} {"train_loss": -25.582304000854492, "global_step": 304664, "epoch": 3670} {"train_loss": -25.35179901123047, "global_step": 304665, "epoch": 3670} {"train_loss": -25.459766387939453, "global_step": 304666, "epoch": 3670} {"train_loss": -25.549728393554688, "global_step": 304667, "epoch": 3670} {"train_loss": -25.584470748901367, "global_step": 304668, "epoch": 3670} {"train_loss": -25.632471084594727, "global_step": 304669, "epoch": 3670} {"train_loss": -25.66389274597168, "global_step": 304670, "epoch": 3670} {"train_loss": -25.585844039916992, "global_step": 304671, "epoch": 3670} {"train_loss": -25.8861083984375, "global_step": 304672, "epoch": 3670} {"train_loss": -26.029027938842773, "global_step": 304673, "epoch": 3670} {"train_loss": -25.605966567993164, "global_step": 304674, "epoch": 3670} {"train_loss": -25.51685905456543, "global_step": 304675, "epoch": 3670} {"train_loss": -25.667133331298828, "global_step": 304676, "epoch": 3670} {"train_loss": -25.538705825805664, "global_step": 304677, "epoch": 3670} {"train_loss": -25.620426177978516, "global_step": 304678, "epoch": 3670} {"train_loss": -25.55902862548828, "global_step": 304679, "epoch": 3670} {"train_loss": -25.63551902770996, "global_step": 304680, "epoch": 3670} {"train_loss": -25.743188858032227, "global_step": 304681, "epoch": 3670} {"train_loss": -25.875654220581055, "global_step": 304682, "epoch": 3670} {"train_loss": -25.43146514892578, "global_step": 304683, "epoch": 3670} {"train_loss": -26.048492431640625, "global_step": 304684, "epoch": 3670} {"train_loss": -25.5297908782959, "global_step": 304685, "epoch": 3670} {"train_loss": -25.58957862854004, "global_step": 304686, "epoch": 3670} {"train_loss": -25.74679946899414, "global_step": 304687, "epoch": 3670} {"train_loss": -25.987287521362305, "global_step": 304688, "epoch": 3670} {"train_loss": -25.85274314880371, "global_step": 304689, "epoch": 3670} {"train_loss": -25.64761734008789, "global_step": 304690, "epoch": 3670} {"train_loss": -25.608911514282227, "global_step": 304691, "epoch": 3670} {"train_loss": -25.610297099653497, "global_step": 304692, "epoch": 3670, "val_loss": 7340056.0} {"train_loss": -24.800031661987305, "global_step": 304693, "epoch": 3671} {"train_loss": -24.848026275634766, "global_step": 304694, "epoch": 3671} {"train_loss": -24.911487579345703, "global_step": 304695, "epoch": 3671} {"train_loss": -25.254098892211914, "global_step": 304696, "epoch": 3671} {"train_loss": -24.77176856994629, "global_step": 304697, "epoch": 3671} {"train_loss": -25.4993896484375, "global_step": 304698, "epoch": 3671} {"train_loss": -25.020254135131836, "global_step": 304699, "epoch": 3671} {"train_loss": -25.201868057250977, "global_step": 304700, "epoch": 3671} {"train_loss": -25.45332908630371, "global_step": 304701, "epoch": 3671} {"train_loss": -25.68511962890625, "global_step": 304702, "epoch": 3671} {"train_loss": -25.633691787719727, "global_step": 304703, "epoch": 3671} {"train_loss": -25.2448787689209, "global_step": 304704, "epoch": 3671} {"train_loss": -25.655364990234375, "global_step": 304705, "epoch": 3671} {"train_loss": -25.51626205444336, "global_step": 304706, "epoch": 3671} {"train_loss": -25.380395889282227, "global_step": 304707, "epoch": 3671} {"train_loss": -25.889326095581055, "global_step": 304708, "epoch": 3671} {"train_loss": -25.069177627563477, "global_step": 304709, "epoch": 3671} {"train_loss": -25.412195205688477, "global_step": 304710, "epoch": 3671} {"train_loss": -25.388080596923828, "global_step": 304711, "epoch": 3671} {"train_loss": -25.672758102416992, "global_step": 304712, "epoch": 3671} {"train_loss": -25.453393936157227, "global_step": 304713, "epoch": 3671} {"train_loss": -25.3421688079834, "global_step": 304714, "epoch": 3671} {"train_loss": -25.220596313476562, "global_step": 304715, "epoch": 3671} {"train_loss": -25.200851440429688, "global_step": 304716, "epoch": 3671} {"train_loss": -25.57721710205078, "global_step": 304717, "epoch": 3671} {"train_loss": -25.290985107421875, "global_step": 304718, "epoch": 3671} {"train_loss": -25.137685775756836, "global_step": 304719, "epoch": 3671} {"train_loss": -25.335670471191406, "global_step": 304720, "epoch": 3671} {"train_loss": -25.314077377319336, "global_step": 304721, "epoch": 3671} {"train_loss": -25.522428512573242, "global_step": 304722, "epoch": 3671} {"train_loss": -25.315237045288086, "global_step": 304723, "epoch": 3671} {"train_loss": -25.764989852905273, "global_step": 304724, "epoch": 3671} {"train_loss": -25.41156578063965, "global_step": 304725, "epoch": 3671} {"train_loss": -24.989168167114258, "global_step": 304726, "epoch": 3671} {"train_loss": -25.47001838684082, "global_step": 304727, "epoch": 3671} {"train_loss": -25.314144134521484, "global_step": 304728, "epoch": 3671} {"train_loss": -25.291975021362305, "global_step": 304729, "epoch": 3671} {"train_loss": -25.65582275390625, "global_step": 304730, "epoch": 3671} {"train_loss": -25.37762451171875, "global_step": 304731, "epoch": 3671} {"train_loss": -25.669540405273438, "global_step": 304732, "epoch": 3671} {"train_loss": -25.724262237548828, "global_step": 304733, "epoch": 3671} {"train_loss": -25.605670928955078, "global_step": 304734, "epoch": 3671} {"train_loss": -25.63814353942871, "global_step": 304735, "epoch": 3671} {"train_loss": -25.68037223815918, "global_step": 304736, "epoch": 3671} {"train_loss": -25.733346939086914, "global_step": 304737, "epoch": 3671} {"train_loss": -25.815088272094727, "global_step": 304738, "epoch": 3671} {"train_loss": -25.93806266784668, "global_step": 304739, "epoch": 3671} {"train_loss": -25.415800094604492, "global_step": 304740, "epoch": 3671} {"train_loss": -25.684568405151367, "global_step": 304741, "epoch": 3671} {"train_loss": -25.599546432495117, "global_step": 304742, "epoch": 3671} {"train_loss": -25.523252487182617, "global_step": 304743, "epoch": 3671} {"train_loss": -25.575153350830078, "global_step": 304744, "epoch": 3671} {"train_loss": -25.632043838500977, "global_step": 304745, "epoch": 3671} {"train_loss": -25.921735763549805, "global_step": 304746, "epoch": 3671} {"train_loss": -25.824365615844727, "global_step": 304747, "epoch": 3671} {"train_loss": -26.273883819580078, "global_step": 304748, "epoch": 3671} {"train_loss": -25.48320198059082, "global_step": 304749, "epoch": 3671} {"train_loss": -25.8287296295166, "global_step": 304750, "epoch": 3671} {"train_loss": -26.018686294555664, "global_step": 304751, "epoch": 3671} {"train_loss": -25.827112197875977, "global_step": 304752, "epoch": 3671} {"train_loss": -25.973316192626953, "global_step": 304753, "epoch": 3671} {"train_loss": -26.130624771118164, "global_step": 304754, "epoch": 3671} {"train_loss": -25.781538009643555, "global_step": 304755, "epoch": 3671} {"train_loss": -25.72064208984375, "global_step": 304756, "epoch": 3671} {"train_loss": -25.76922035217285, "global_step": 304757, "epoch": 3671} {"train_loss": -25.99000358581543, "global_step": 304758, "epoch": 3671} {"train_loss": -26.024885177612305, "global_step": 304759, "epoch": 3671} {"train_loss": -25.96424674987793, "global_step": 304760, "epoch": 3671} {"train_loss": -25.74948501586914, "global_step": 304761, "epoch": 3671} {"train_loss": -25.680938720703125, "global_step": 304762, "epoch": 3671} {"train_loss": -25.555051803588867, "global_step": 304763, "epoch": 3671} {"train_loss": -25.318201065063477, "global_step": 304764, "epoch": 3671} {"train_loss": -25.469711303710938, "global_step": 304765, "epoch": 3671} {"train_loss": -25.34156608581543, "global_step": 304766, "epoch": 3671} {"train_loss": -25.492727279663086, "global_step": 304767, "epoch": 3671} {"train_loss": -25.331100463867188, "global_step": 304768, "epoch": 3671} {"train_loss": -25.60892677307129, "global_step": 304769, "epoch": 3671} {"train_loss": -25.472177505493164, "global_step": 304770, "epoch": 3671} {"train_loss": -25.19158363342285, "global_step": 304771, "epoch": 3671} {"train_loss": -25.99604606628418, "global_step": 304772, "epoch": 3671} {"train_loss": -25.496826171875, "global_step": 304773, "epoch": 3671} {"train_loss": -25.6939640045166, "global_step": 304774, "epoch": 3671} {"train_loss": -25.522350931742107, "global_step": 304775, "epoch": 3671, "val_loss": 7200278.0} {"train_loss": -25.040555953979492, "global_step": 304776, "epoch": 3672} {"train_loss": -24.43964958190918, "global_step": 304777, "epoch": 3672} {"train_loss": -25.0400447845459, "global_step": 304778, "epoch": 3672} {"train_loss": -25.257251739501953, "global_step": 304779, "epoch": 3672} {"train_loss": -24.79175567626953, "global_step": 304780, "epoch": 3672} {"train_loss": -24.666608810424805, "global_step": 304781, "epoch": 3672} {"train_loss": -25.106735229492188, "global_step": 304782, "epoch": 3672} {"train_loss": -25.133100509643555, "global_step": 304783, "epoch": 3672} {"train_loss": -25.64362144470215, "global_step": 304784, "epoch": 3672} {"train_loss": -25.47562599182129, "global_step": 304785, "epoch": 3672} {"train_loss": -25.451684951782227, "global_step": 304786, "epoch": 3672} {"train_loss": -24.99323081970215, "global_step": 304787, "epoch": 3672} {"train_loss": -25.143020629882812, "global_step": 304788, "epoch": 3672} {"train_loss": -25.16556167602539, "global_step": 304789, "epoch": 3672} {"train_loss": -25.35519027709961, "global_step": 304790, "epoch": 3672} {"train_loss": -25.407438278198242, "global_step": 304791, "epoch": 3672} {"train_loss": -25.202728271484375, "global_step": 304792, "epoch": 3672} {"train_loss": -25.411352157592773, "global_step": 304793, "epoch": 3672} {"train_loss": -25.421789169311523, "global_step": 304794, "epoch": 3672} {"train_loss": -25.672962188720703, "global_step": 304795, "epoch": 3672} {"train_loss": -25.85208511352539, "global_step": 304796, "epoch": 3672} {"train_loss": -25.713363647460938, "global_step": 304797, "epoch": 3672} {"train_loss": -25.704055786132812, "global_step": 304798, "epoch": 3672} {"train_loss": -25.534839630126953, "global_step": 304799, "epoch": 3672} {"train_loss": -25.72271156311035, "global_step": 304800, "epoch": 3672} {"train_loss": -25.913177490234375, "global_step": 304801, "epoch": 3672} {"train_loss": -25.593088150024414, "global_step": 304802, "epoch": 3672} {"train_loss": -25.680286407470703, "global_step": 304803, "epoch": 3672} {"train_loss": -25.61441993713379, "global_step": 304804, "epoch": 3672} {"train_loss": -25.676544189453125, "global_step": 304805, "epoch": 3672} {"train_loss": -25.469085693359375, "global_step": 304806, "epoch": 3672} {"train_loss": -25.99045753479004, "global_step": 304807, "epoch": 3672} {"train_loss": -25.359527587890625, "global_step": 304808, "epoch": 3672} {"train_loss": -26.0516357421875, "global_step": 304809, "epoch": 3672} {"train_loss": -25.735578536987305, "global_step": 304810, "epoch": 3672} {"train_loss": -25.629547119140625, "global_step": 304811, "epoch": 3672} {"train_loss": -25.826345443725586, "global_step": 304812, "epoch": 3672} {"train_loss": -25.521509170532227, "global_step": 304813, "epoch": 3672} {"train_loss": -25.7059383392334, "global_step": 304814, "epoch": 3672} {"train_loss": -26.030384063720703, "global_step": 304815, "epoch": 3672} {"train_loss": -25.52493667602539, "global_step": 304816, "epoch": 3672} {"train_loss": -25.574935913085938, "global_step": 304817, "epoch": 3672} {"train_loss": -25.679365158081055, "global_step": 304818, "epoch": 3672} {"train_loss": -26.042016983032227, "global_step": 304819, "epoch": 3672} {"train_loss": -25.951648712158203, "global_step": 304820, "epoch": 3672} {"train_loss": -25.771259307861328, "global_step": 304821, "epoch": 3672} {"train_loss": -25.91840171813965, "global_step": 304822, "epoch": 3672} {"train_loss": -25.755298614501953, "global_step": 304823, "epoch": 3672} {"train_loss": -25.824060440063477, "global_step": 304824, "epoch": 3672} {"train_loss": -25.55951690673828, "global_step": 304825, "epoch": 3672} {"train_loss": -25.986719131469727, "global_step": 304826, "epoch": 3672} {"train_loss": -25.71973991394043, "global_step": 304827, "epoch": 3672} {"train_loss": -26.15399742126465, "global_step": 304828, "epoch": 3672} {"train_loss": -25.730758666992188, "global_step": 304829, "epoch": 3672} {"train_loss": -25.907367706298828, "global_step": 304830, "epoch": 3672} {"train_loss": -25.745624542236328, "global_step": 304831, "epoch": 3672} {"train_loss": -25.74454689025879, "global_step": 304832, "epoch": 3672} {"train_loss": -25.87811279296875, "global_step": 304833, "epoch": 3672} {"train_loss": -25.490203857421875, "global_step": 304834, "epoch": 3672} {"train_loss": -25.550683975219727, "global_step": 304835, "epoch": 3672} {"train_loss": -25.62293815612793, "global_step": 304836, "epoch": 3672} {"train_loss": -25.538808822631836, "global_step": 304837, "epoch": 3672} {"train_loss": -25.395160675048828, "global_step": 304838, "epoch": 3672} {"train_loss": -25.438573837280273, "global_step": 304839, "epoch": 3672} {"train_loss": -25.952871322631836, "global_step": 304840, "epoch": 3672} {"train_loss": -25.503583908081055, "global_step": 304841, "epoch": 3672} {"train_loss": -25.8845157623291, "global_step": 304842, "epoch": 3672} {"train_loss": -25.390329360961914, "global_step": 304843, "epoch": 3672} {"train_loss": -26.017364501953125, "global_step": 304844, "epoch": 3672} {"train_loss": -25.612720489501953, "global_step": 304845, "epoch": 3672} {"train_loss": -25.6761531829834, "global_step": 304846, "epoch": 3672} {"train_loss": -25.097354888916016, "global_step": 304847, "epoch": 3672} {"train_loss": -25.310523986816406, "global_step": 304848, "epoch": 3672} {"train_loss": -25.576190948486328, "global_step": 304849, "epoch": 3672} {"train_loss": -25.35662841796875, "global_step": 304850, "epoch": 3672} {"train_loss": -25.52062225341797, "global_step": 304851, "epoch": 3672} {"train_loss": -25.22391128540039, "global_step": 304852, "epoch": 3672} {"train_loss": -25.306814193725586, "global_step": 304853, "epoch": 3672} {"train_loss": -25.560693740844727, "global_step": 304854, "epoch": 3672} {"train_loss": -25.497608184814453, "global_step": 304855, "epoch": 3672} {"train_loss": -25.533830642700195, "global_step": 304856, "epoch": 3672} {"train_loss": -25.30487632751465, "global_step": 304857, "epoch": 3672} {"train_loss": -25.554438464612847, "global_step": 304858, "epoch": 3672, "val_loss": 7118257.5} {"train_loss": -25.003080368041992, "global_step": 304859, "epoch": 3673} {"train_loss": -25.106801986694336, "global_step": 304860, "epoch": 3673} {"train_loss": -25.217382431030273, "global_step": 304861, "epoch": 3673} {"train_loss": -24.95396614074707, "global_step": 304862, "epoch": 3673} {"train_loss": -25.145084381103516, "global_step": 304863, "epoch": 3673} {"train_loss": -25.173307418823242, "global_step": 304864, "epoch": 3673} {"train_loss": -24.868167877197266, "global_step": 304865, "epoch": 3673} {"train_loss": -25.09079933166504, "global_step": 304866, "epoch": 3673} {"train_loss": -25.42195701599121, "global_step": 304867, "epoch": 3673} {"train_loss": -24.823083877563477, "global_step": 304868, "epoch": 3673} {"train_loss": -25.215394973754883, "global_step": 304869, "epoch": 3673} {"train_loss": -24.997634887695312, "global_step": 304870, "epoch": 3673} {"train_loss": -25.394405364990234, "global_step": 304871, "epoch": 3673} {"train_loss": -25.01604652404785, "global_step": 304872, "epoch": 3673} {"train_loss": -25.419519424438477, "global_step": 304873, "epoch": 3673} {"train_loss": -25.305891036987305, "global_step": 304874, "epoch": 3673} {"train_loss": -25.34836769104004, "global_step": 304875, "epoch": 3673} {"train_loss": -25.840808868408203, "global_step": 304876, "epoch": 3673} {"train_loss": -25.48872947692871, "global_step": 304877, "epoch": 3673} {"train_loss": -25.40767478942871, "global_step": 304878, "epoch": 3673} {"train_loss": -25.522083282470703, "global_step": 304879, "epoch": 3673} {"train_loss": -25.674306869506836, "global_step": 304880, "epoch": 3673} {"train_loss": -25.381189346313477, "global_step": 304881, "epoch": 3673} {"train_loss": -25.352474212646484, "global_step": 304882, "epoch": 3673} {"train_loss": -25.816247940063477, "global_step": 304883, "epoch": 3673} {"train_loss": -25.66423988342285, "global_step": 304884, "epoch": 3673} {"train_loss": -25.506650924682617, "global_step": 304885, "epoch": 3673} {"train_loss": -25.29994773864746, "global_step": 304886, "epoch": 3673} {"train_loss": -25.484609603881836, "global_step": 304887, "epoch": 3673} {"train_loss": -25.72759437561035, "global_step": 304888, "epoch": 3673} {"train_loss": -25.927988052368164, "global_step": 304889, "epoch": 3673} {"train_loss": -25.646894454956055, "global_step": 304890, "epoch": 3673} {"train_loss": -25.607587814331055, "global_step": 304891, "epoch": 3673} {"train_loss": -25.82936668395996, "global_step": 304892, "epoch": 3673} {"train_loss": -25.910507202148438, "global_step": 304893, "epoch": 3673} {"train_loss": -25.868976593017578, "global_step": 304894, "epoch": 3673} {"train_loss": -25.794260025024414, "global_step": 304895, "epoch": 3673} {"train_loss": -25.864587783813477, "global_step": 304896, "epoch": 3673} {"train_loss": -25.779926300048828, "global_step": 304897, "epoch": 3673} {"train_loss": -26.136144638061523, "global_step": 304898, "epoch": 3673} {"train_loss": -26.156845092773438, "global_step": 304899, "epoch": 3673} {"train_loss": -26.067113876342773, "global_step": 304900, "epoch": 3673} {"train_loss": -26.102020263671875, "global_step": 304901, "epoch": 3673} {"train_loss": -25.803363800048828, "global_step": 304902, "epoch": 3673} {"train_loss": -25.462949752807617, "global_step": 304903, "epoch": 3673} {"train_loss": -25.98702049255371, "global_step": 304904, "epoch": 3673} {"train_loss": -25.771474838256836, "global_step": 304905, "epoch": 3673} {"train_loss": -25.82977294921875, "global_step": 304906, "epoch": 3673} {"train_loss": -25.832416534423828, "global_step": 304907, "epoch": 3673} {"train_loss": -25.557374954223633, "global_step": 304908, "epoch": 3673} {"train_loss": -25.507442474365234, "global_step": 304909, "epoch": 3673} {"train_loss": -25.719953536987305, "global_step": 304910, "epoch": 3673} {"train_loss": -25.469514846801758, "global_step": 304911, "epoch": 3673} {"train_loss": -25.640899658203125, "global_step": 304912, "epoch": 3673} {"train_loss": -25.602224349975586, "global_step": 304913, "epoch": 3673} {"train_loss": -25.66139793395996, "global_step": 304914, "epoch": 3673} {"train_loss": -25.621164321899414, "global_step": 304915, "epoch": 3673} {"train_loss": -25.716938018798828, "global_step": 304916, "epoch": 3673} {"train_loss": -25.828222274780273, "global_step": 304917, "epoch": 3673} {"train_loss": -25.94009780883789, "global_step": 304918, "epoch": 3673} {"train_loss": -25.52484130859375, "global_step": 304919, "epoch": 3673} {"train_loss": -25.491249084472656, "global_step": 304920, "epoch": 3673} {"train_loss": -25.95073890686035, "global_step": 304921, "epoch": 3673} {"train_loss": -25.647581100463867, "global_step": 304922, "epoch": 3673} {"train_loss": -25.86480712890625, "global_step": 304923, "epoch": 3673} {"train_loss": -25.7384033203125, "global_step": 304924, "epoch": 3673} {"train_loss": -26.074453353881836, "global_step": 304925, "epoch": 3673} {"train_loss": -25.59885025024414, "global_step": 304926, "epoch": 3673} {"train_loss": -26.059499740600586, "global_step": 304927, "epoch": 3673} {"train_loss": -25.390026092529297, "global_step": 304928, "epoch": 3673} {"train_loss": -25.494510650634766, "global_step": 304929, "epoch": 3673} {"train_loss": -25.666227340698242, "global_step": 304930, "epoch": 3673} {"train_loss": -25.139530181884766, "global_step": 304931, "epoch": 3673} {"train_loss": -25.589384078979492, "global_step": 304932, "epoch": 3673} {"train_loss": -25.357803344726562, "global_step": 304933, "epoch": 3673} {"train_loss": -25.83489418029785, "global_step": 304934, "epoch": 3673} {"train_loss": -25.22065544128418, "global_step": 304935, "epoch": 3673} {"train_loss": -25.680761337280273, "global_step": 304936, "epoch": 3673} {"train_loss": -25.730030059814453, "global_step": 304937, "epoch": 3673} {"train_loss": -25.58748435974121, "global_step": 304938, "epoch": 3673} {"train_loss": -25.86162757873535, "global_step": 304939, "epoch": 3673} {"train_loss": -25.67743492126465, "global_step": 304940, "epoch": 3673} {"train_loss": -25.590554846338478, "global_step": 304941, "epoch": 3673, "val_loss": 7019732.0} {"train_loss": -24.51019287109375, "global_step": 304942, "epoch": 3674} {"train_loss": -24.346153259277344, "global_step": 304943, "epoch": 3674} {"train_loss": -24.882944107055664, "global_step": 304944, "epoch": 3674} {"train_loss": -24.92059326171875, "global_step": 304945, "epoch": 3674} {"train_loss": -24.8432559967041, "global_step": 304946, "epoch": 3674} {"train_loss": -25.427221298217773, "global_step": 304947, "epoch": 3674} {"train_loss": -25.196170806884766, "global_step": 304948, "epoch": 3674} {"train_loss": -25.177982330322266, "global_step": 304949, "epoch": 3674} {"train_loss": -25.37436866760254, "global_step": 304950, "epoch": 3674} {"train_loss": -25.386083602905273, "global_step": 304951, "epoch": 3674} {"train_loss": -25.448001861572266, "global_step": 304952, "epoch": 3674} {"train_loss": -25.220975875854492, "global_step": 304953, "epoch": 3674} {"train_loss": -25.81495475769043, "global_step": 304954, "epoch": 3674} {"train_loss": -24.830778121948242, "global_step": 304955, "epoch": 3674} {"train_loss": -25.55750846862793, "global_step": 304956, "epoch": 3674} {"train_loss": -25.18832015991211, "global_step": 304957, "epoch": 3674} {"train_loss": -25.463537216186523, "global_step": 304958, "epoch": 3674} {"train_loss": -25.617170333862305, "global_step": 304959, "epoch": 3674} {"train_loss": -25.53314781188965, "global_step": 304960, "epoch": 3674} {"train_loss": -25.590316772460938, "global_step": 304961, "epoch": 3674} {"train_loss": -25.442136764526367, "global_step": 304962, "epoch": 3674} {"train_loss": -25.259077072143555, "global_step": 304963, "epoch": 3674} {"train_loss": -24.863019943237305, "global_step": 304964, "epoch": 3674} {"train_loss": -25.830692291259766, "global_step": 304965, "epoch": 3674} {"train_loss": -25.51313591003418, "global_step": 304966, "epoch": 3674} {"train_loss": -25.265323638916016, "global_step": 304967, "epoch": 3674} {"train_loss": -25.632186889648438, "global_step": 304968, "epoch": 3674} {"train_loss": -25.579364776611328, "global_step": 304969, "epoch": 3674} {"train_loss": -25.524662017822266, "global_step": 304970, "epoch": 3674} {"train_loss": -25.63300895690918, "global_step": 304971, "epoch": 3674} {"train_loss": -25.844873428344727, "global_step": 304972, "epoch": 3674} {"train_loss": -25.962894439697266, "global_step": 304973, "epoch": 3674} {"train_loss": -25.89699363708496, "global_step": 304974, "epoch": 3674} {"train_loss": -25.6700496673584, "global_step": 304975, "epoch": 3674} {"train_loss": -25.73127555847168, "global_step": 304976, "epoch": 3674} {"train_loss": -26.123138427734375, "global_step": 304977, "epoch": 3674} {"train_loss": -25.90032958984375, "global_step": 304978, "epoch": 3674} {"train_loss": -25.517560958862305, "global_step": 304979, "epoch": 3674} {"train_loss": -25.830764770507812, "global_step": 304980, "epoch": 3674} {"train_loss": -25.7353458404541, "global_step": 304981, "epoch": 3674} {"train_loss": -25.729400634765625, "global_step": 304982, "epoch": 3674} {"train_loss": -25.972076416015625, "global_step": 304983, "epoch": 3674} {"train_loss": -25.545778274536133, "global_step": 304984, "epoch": 3674} {"train_loss": -25.768049240112305, "global_step": 304985, "epoch": 3674} {"train_loss": -25.715890884399414, "global_step": 304986, "epoch": 3674} {"train_loss": -26.14279556274414, "global_step": 304987, "epoch": 3674} {"train_loss": -25.732519149780273, "global_step": 304988, "epoch": 3674} {"train_loss": -25.664289474487305, "global_step": 304989, "epoch": 3674} {"train_loss": -25.78925132751465, "global_step": 304990, "epoch": 3674} {"train_loss": -25.744909286499023, "global_step": 304991, "epoch": 3674} {"train_loss": -25.894397735595703, "global_step": 304992, "epoch": 3674} {"train_loss": -25.59613609313965, "global_step": 304993, "epoch": 3674} {"train_loss": -25.9177188873291, "global_step": 304994, "epoch": 3674} {"train_loss": -25.913236618041992, "global_step": 304995, "epoch": 3674} {"train_loss": -25.743438720703125, "global_step": 304996, "epoch": 3674} {"train_loss": -25.849592208862305, "global_step": 304997, "epoch": 3674} {"train_loss": -26.170373916625977, "global_step": 304998, "epoch": 3674} {"train_loss": -25.63858413696289, "global_step": 304999, "epoch": 3674} {"train_loss": -25.702377319335938, "global_step": 305000, "epoch": 3674} {"train_loss": -25.920557022094727, "global_step": 305001, "epoch": 3674} {"train_loss": -25.868976593017578, "global_step": 305002, "epoch": 3674} {"train_loss": -26.08953857421875, "global_step": 305003, "epoch": 3674} {"train_loss": -25.830307006835938, "global_step": 305004, "epoch": 3674} {"train_loss": -25.701129913330078, "global_step": 305005, "epoch": 3674} {"train_loss": -25.773523330688477, "global_step": 305006, "epoch": 3674} {"train_loss": -25.258316040039062, "global_step": 305007, "epoch": 3674} {"train_loss": -24.84897232055664, "global_step": 305008, "epoch": 3674} {"train_loss": -25.010766983032227, "global_step": 305009, "epoch": 3674} {"train_loss": -25.33615493774414, "global_step": 305010, "epoch": 3674} {"train_loss": -25.7015323638916, "global_step": 305011, "epoch": 3674} {"train_loss": -25.701980590820312, "global_step": 305012, "epoch": 3674} {"train_loss": -25.505844116210938, "global_step": 305013, "epoch": 3674} {"train_loss": -25.29574966430664, "global_step": 305014, "epoch": 3674} {"train_loss": -25.834125518798828, "global_step": 305015, "epoch": 3674} {"train_loss": -25.604022979736328, "global_step": 305016, "epoch": 3674} {"train_loss": -25.389156341552734, "global_step": 305017, "epoch": 3674} {"train_loss": -25.633167266845703, "global_step": 305018, "epoch": 3674} {"train_loss": -25.554147720336914, "global_step": 305019, "epoch": 3674} {"train_loss": -25.370012283325195, "global_step": 305020, "epoch": 3674} {"train_loss": -25.51763153076172, "global_step": 305021, "epoch": 3674} {"train_loss": -25.876386642456055, "global_step": 305022, "epoch": 3674} {"train_loss": -25.3900089263916, "global_step": 305023, "epoch": 3674} {"train_loss": -25.554595211902296, "global_step": 305024, "epoch": 3674, "val_loss": 7257492.0} {"train_loss": -25.731937408447266, "global_step": 305025, "epoch": 3675} {"train_loss": -25.06227684020996, "global_step": 305026, "epoch": 3675} {"train_loss": -25.71843910217285, "global_step": 305027, "epoch": 3675} {"train_loss": -25.21235466003418, "global_step": 305028, "epoch": 3675} {"train_loss": -25.503238677978516, "global_step": 305029, "epoch": 3675} {"train_loss": -25.543134689331055, "global_step": 305030, "epoch": 3675} {"train_loss": -25.572744369506836, "global_step": 305031, "epoch": 3675} {"train_loss": -25.152633666992188, "global_step": 305032, "epoch": 3675} {"train_loss": -25.62177085876465, "global_step": 305033, "epoch": 3675} {"train_loss": -25.559349060058594, "global_step": 305034, "epoch": 3675} {"train_loss": -25.35405158996582, "global_step": 305035, "epoch": 3675} {"train_loss": -25.747421264648438, "global_step": 305036, "epoch": 3675} {"train_loss": -25.401243209838867, "global_step": 305037, "epoch": 3675} {"train_loss": -25.645841598510742, "global_step": 305038, "epoch": 3675} {"train_loss": -25.516515731811523, "global_step": 305039, "epoch": 3675} {"train_loss": -25.760900497436523, "global_step": 305040, "epoch": 3675} {"train_loss": -25.56669044494629, "global_step": 305041, "epoch": 3675} {"train_loss": -25.799108505249023, "global_step": 305042, "epoch": 3675} {"train_loss": -25.468957901000977, "global_step": 305043, "epoch": 3675} {"train_loss": -25.32975196838379, "global_step": 305044, "epoch": 3675} {"train_loss": -25.432600021362305, "global_step": 305045, "epoch": 3675} {"train_loss": -25.584487915039062, "global_step": 305046, "epoch": 3675} {"train_loss": -25.532865524291992, "global_step": 305047, "epoch": 3675} {"train_loss": -25.256723403930664, "global_step": 305048, "epoch": 3675} {"train_loss": -25.85614013671875, "global_step": 305049, "epoch": 3675} {"train_loss": -25.748611450195312, "global_step": 305050, "epoch": 3675} {"train_loss": -25.928531646728516, "global_step": 305051, "epoch": 3675} {"train_loss": -25.566692352294922, "global_step": 305052, "epoch": 3675} {"train_loss": -25.558950424194336, "global_step": 305053, "epoch": 3675} {"train_loss": -25.352968215942383, "global_step": 305054, "epoch": 3675} {"train_loss": -25.686620712280273, "global_step": 305055, "epoch": 3675} {"train_loss": -25.999692916870117, "global_step": 305056, "epoch": 3675} {"train_loss": -25.810977935791016, "global_step": 305057, "epoch": 3675} {"train_loss": -25.758962631225586, "global_step": 305058, "epoch": 3675} {"train_loss": -25.686344146728516, "global_step": 305059, "epoch": 3675} {"train_loss": -25.4376220703125, "global_step": 305060, "epoch": 3675} {"train_loss": -25.709243774414062, "global_step": 305061, "epoch": 3675} {"train_loss": -25.75457191467285, "global_step": 305062, "epoch": 3675} {"train_loss": -25.6561336517334, "global_step": 305063, "epoch": 3675} {"train_loss": -25.96952247619629, "global_step": 305064, "epoch": 3675} {"train_loss": -26.16458511352539, "global_step": 305065, "epoch": 3675} {"train_loss": -25.875268936157227, "global_step": 305066, "epoch": 3675} {"train_loss": -25.272994995117188, "global_step": 305067, "epoch": 3675} {"train_loss": -25.286840438842773, "global_step": 305068, "epoch": 3675} {"train_loss": -25.55964469909668, "global_step": 305069, "epoch": 3675} {"train_loss": -25.805908203125, "global_step": 305070, "epoch": 3675} {"train_loss": -25.79608726501465, "global_step": 305071, "epoch": 3675} {"train_loss": -25.850854873657227, "global_step": 305072, "epoch": 3675} {"train_loss": -25.23876190185547, "global_step": 305073, "epoch": 3675} {"train_loss": -25.893009185791016, "global_step": 305074, "epoch": 3675} {"train_loss": -25.941486358642578, "global_step": 305075, "epoch": 3675} {"train_loss": -25.779678344726562, "global_step": 305076, "epoch": 3675} {"train_loss": -25.526172637939453, "global_step": 305077, "epoch": 3675} {"train_loss": -25.8516788482666, "global_step": 305078, "epoch": 3675} {"train_loss": -25.714588165283203, "global_step": 305079, "epoch": 3675} {"train_loss": -25.558218002319336, "global_step": 305080, "epoch": 3675} {"train_loss": -25.088388442993164, "global_step": 305081, "epoch": 3675} {"train_loss": -25.70829200744629, "global_step": 305082, "epoch": 3675} {"train_loss": -25.793304443359375, "global_step": 305083, "epoch": 3675} {"train_loss": -25.535797119140625, "global_step": 305084, "epoch": 3675} {"train_loss": -25.341272354125977, "global_step": 305085, "epoch": 3675} {"train_loss": -25.476655960083008, "global_step": 305086, "epoch": 3675} {"train_loss": -25.861719131469727, "global_step": 305087, "epoch": 3675} {"train_loss": -26.17091178894043, "global_step": 305088, "epoch": 3675} {"train_loss": -25.007736206054688, "global_step": 305089, "epoch": 3675} {"train_loss": -25.82770347595215, "global_step": 305090, "epoch": 3675} {"train_loss": -25.55281639099121, "global_step": 305091, "epoch": 3675} {"train_loss": -25.596817016601562, "global_step": 305092, "epoch": 3675} {"train_loss": -25.410568237304688, "global_step": 305093, "epoch": 3675} {"train_loss": -25.243188858032227, "global_step": 305094, "epoch": 3675} {"train_loss": -25.46440887451172, "global_step": 305095, "epoch": 3675} {"train_loss": -25.357702255249023, "global_step": 305096, "epoch": 3675} {"train_loss": -25.326007843017578, "global_step": 305097, "epoch": 3675} {"train_loss": -25.628250122070312, "global_step": 305098, "epoch": 3675} {"train_loss": -25.12674331665039, "global_step": 305099, "epoch": 3675} {"train_loss": -25.7303409576416, "global_step": 305100, "epoch": 3675} {"train_loss": -25.29046630859375, "global_step": 305101, "epoch": 3675} {"train_loss": -25.655553817749023, "global_step": 305102, "epoch": 3675} {"train_loss": -25.551462173461914, "global_step": 305103, "epoch": 3675} {"train_loss": -25.552810668945312, "global_step": 305104, "epoch": 3675} {"train_loss": -25.56845474243164, "global_step": 305105, "epoch": 3675} {"train_loss": -25.512304306030273, "global_step": 305106, "epoch": 3675} {"train_loss": -25.576040681586207, "global_step": 305107, "epoch": 3675, "val_loss": 7313368.0} {"train_loss": -25.15849494934082, "global_step": 305108, "epoch": 3676} {"train_loss": -25.568090438842773, "global_step": 305109, "epoch": 3676} {"train_loss": -25.242813110351562, "global_step": 305110, "epoch": 3676} {"train_loss": -25.456045150756836, "global_step": 305111, "epoch": 3676} {"train_loss": -25.7774600982666, "global_step": 305112, "epoch": 3676} {"train_loss": -24.910207748413086, "global_step": 305113, "epoch": 3676} {"train_loss": -25.714435577392578, "global_step": 305114, "epoch": 3676} {"train_loss": -25.621801376342773, "global_step": 305115, "epoch": 3676} {"train_loss": -25.403085708618164, "global_step": 305116, "epoch": 3676} {"train_loss": -24.760833740234375, "global_step": 305117, "epoch": 3676} {"train_loss": -25.222808837890625, "global_step": 305118, "epoch": 3676} {"train_loss": -25.6669979095459, "global_step": 305119, "epoch": 3676} {"train_loss": -25.543790817260742, "global_step": 305120, "epoch": 3676} {"train_loss": -25.034887313842773, "global_step": 305121, "epoch": 3676} {"train_loss": -25.655548095703125, "global_step": 305122, "epoch": 3676} {"train_loss": -25.527587890625, "global_step": 305123, "epoch": 3676} {"train_loss": -25.208532333374023, "global_step": 305124, "epoch": 3676} {"train_loss": -25.610553741455078, "global_step": 305125, "epoch": 3676} {"train_loss": -25.6329288482666, "global_step": 305126, "epoch": 3676} {"train_loss": -25.667280197143555, "global_step": 305127, "epoch": 3676} {"train_loss": -25.8460636138916, "global_step": 305128, "epoch": 3676} {"train_loss": -25.261428833007812, "global_step": 305129, "epoch": 3676} {"train_loss": -25.842252731323242, "global_step": 305130, "epoch": 3676} {"train_loss": -25.743505477905273, "global_step": 305131, "epoch": 3676} {"train_loss": -25.591333389282227, "global_step": 305132, "epoch": 3676} {"train_loss": -26.0427188873291, "global_step": 305133, "epoch": 3676} {"train_loss": -25.55403709411621, "global_step": 305134, "epoch": 3676} {"train_loss": -25.77228355407715, "global_step": 305135, "epoch": 3676} {"train_loss": -25.7331485748291, "global_step": 305136, "epoch": 3676} {"train_loss": -25.9919376373291, "global_step": 305137, "epoch": 3676} {"train_loss": -25.323440551757812, "global_step": 305138, "epoch": 3676} {"train_loss": -25.64015007019043, "global_step": 305139, "epoch": 3676} {"train_loss": -25.929731369018555, "global_step": 305140, "epoch": 3676} {"train_loss": -25.66387367248535, "global_step": 305141, "epoch": 3676} {"train_loss": -25.78696060180664, "global_step": 305142, "epoch": 3676} {"train_loss": -25.560535430908203, "global_step": 305143, "epoch": 3676} {"train_loss": -25.975727081298828, "global_step": 305144, "epoch": 3676} {"train_loss": -25.52564811706543, "global_step": 305145, "epoch": 3676} {"train_loss": -25.86359214782715, "global_step": 305146, "epoch": 3676} {"train_loss": -25.5523624420166, "global_step": 305147, "epoch": 3676} {"train_loss": -25.914823532104492, "global_step": 305148, "epoch": 3676} {"train_loss": -25.98439598083496, "global_step": 305149, "epoch": 3676} {"train_loss": -25.731473922729492, "global_step": 305150, "epoch": 3676} {"train_loss": -25.85869789123535, "global_step": 305151, "epoch": 3676} {"train_loss": -26.092559814453125, "global_step": 305152, "epoch": 3676} {"train_loss": -25.678068161010742, "global_step": 305153, "epoch": 3676} {"train_loss": -25.71852684020996, "global_step": 305154, "epoch": 3676} {"train_loss": -25.627185821533203, "global_step": 305155, "epoch": 3676} {"train_loss": -25.739288330078125, "global_step": 305156, "epoch": 3676} {"train_loss": -25.58365821838379, "global_step": 305157, "epoch": 3676} {"train_loss": -25.827783584594727, "global_step": 305158, "epoch": 3676} {"train_loss": -25.871091842651367, "global_step": 305159, "epoch": 3676} {"train_loss": -25.75992774963379, "global_step": 305160, "epoch": 3676} {"train_loss": -25.867008209228516, "global_step": 305161, "epoch": 3676} {"train_loss": -25.823322296142578, "global_step": 305162, "epoch": 3676} {"train_loss": -25.784345626831055, "global_step": 305163, "epoch": 3676} {"train_loss": -25.687841415405273, "global_step": 305164, "epoch": 3676} {"train_loss": -25.970922470092773, "global_step": 305165, "epoch": 3676} {"train_loss": -26.1365909576416, "global_step": 305166, "epoch": 3676} {"train_loss": -25.664398193359375, "global_step": 305167, "epoch": 3676} {"train_loss": -25.705936431884766, "global_step": 305168, "epoch": 3676} {"train_loss": -25.73048973083496, "global_step": 305169, "epoch": 3676} {"train_loss": -25.86989402770996, "global_step": 305170, "epoch": 3676} {"train_loss": -25.54945182800293, "global_step": 305171, "epoch": 3676} {"train_loss": -25.412443161010742, "global_step": 305172, "epoch": 3676} {"train_loss": -25.477109909057617, "global_step": 305173, "epoch": 3676} {"train_loss": -25.83631706237793, "global_step": 305174, "epoch": 3676} {"train_loss": -25.377140045166016, "global_step": 305175, "epoch": 3676} {"train_loss": -26.05364990234375, "global_step": 305176, "epoch": 3676} {"train_loss": -25.834339141845703, "global_step": 305177, "epoch": 3676} {"train_loss": -25.41135025024414, "global_step": 305178, "epoch": 3676} {"train_loss": -25.60715103149414, "global_step": 305179, "epoch": 3676} {"train_loss": -25.761240005493164, "global_step": 305180, "epoch": 3676} {"train_loss": -25.627588272094727, "global_step": 305181, "epoch": 3676} {"train_loss": -25.496923446655273, "global_step": 305182, "epoch": 3676} {"train_loss": -25.625991821289062, "global_step": 305183, "epoch": 3676} {"train_loss": -25.793701171875, "global_step": 305184, "epoch": 3676} {"train_loss": -25.866247177124023, "global_step": 305185, "epoch": 3676} {"train_loss": -25.804471969604492, "global_step": 305186, "epoch": 3676} {"train_loss": -25.447011947631836, "global_step": 305187, "epoch": 3676} {"train_loss": -25.847354888916016, "global_step": 305188, "epoch": 3676} {"train_loss": -25.225711822509766, "global_step": 305189, "epoch": 3676} {"train_loss": -25.657097092594007, "global_step": 305190, "epoch": 3676, "val_loss": 7240075.0} {"train_loss": -25.397342681884766, "global_step": 305191, "epoch": 3677} {"train_loss": -25.414339065551758, "global_step": 305192, "epoch": 3677} {"train_loss": -25.445125579833984, "global_step": 305193, "epoch": 3677} {"train_loss": -25.315792083740234, "global_step": 305194, "epoch": 3677} {"train_loss": -25.471410751342773, "global_step": 305195, "epoch": 3677} {"train_loss": -25.430238723754883, "global_step": 305196, "epoch": 3677} {"train_loss": -25.323606491088867, "global_step": 305197, "epoch": 3677} {"train_loss": -25.45653533935547, "global_step": 305198, "epoch": 3677} {"train_loss": -25.576047897338867, "global_step": 305199, "epoch": 3677} {"train_loss": -25.73148536682129, "global_step": 305200, "epoch": 3677} {"train_loss": -25.35479736328125, "global_step": 305201, "epoch": 3677} {"train_loss": -25.580045700073242, "global_step": 305202, "epoch": 3677} {"train_loss": -25.50824546813965, "global_step": 305203, "epoch": 3677} {"train_loss": -25.880823135375977, "global_step": 305204, "epoch": 3677} {"train_loss": -25.585107803344727, "global_step": 305205, "epoch": 3677} {"train_loss": -25.709203720092773, "global_step": 305206, "epoch": 3677} {"train_loss": -25.484867095947266, "global_step": 305207, "epoch": 3677} {"train_loss": -26.02048683166504, "global_step": 305208, "epoch": 3677} {"train_loss": -25.601150512695312, "global_step": 305209, "epoch": 3677} {"train_loss": -25.76320457458496, "global_step": 305210, "epoch": 3677} {"train_loss": -25.930999755859375, "global_step": 305211, "epoch": 3677} {"train_loss": -25.92693519592285, "global_step": 305212, "epoch": 3677} {"train_loss": -26.332502365112305, "global_step": 305213, "epoch": 3677} {"train_loss": -25.8204402923584, "global_step": 305214, "epoch": 3677} {"train_loss": -25.7253360748291, "global_step": 305215, "epoch": 3677} {"train_loss": -25.488309860229492, "global_step": 305216, "epoch": 3677} {"train_loss": -25.591873168945312, "global_step": 305217, "epoch": 3677} {"train_loss": -26.144256591796875, "global_step": 305218, "epoch": 3677} {"train_loss": -25.733617782592773, "global_step": 305219, "epoch": 3677} {"train_loss": -25.786062240600586, "global_step": 305220, "epoch": 3677} {"train_loss": -25.81784439086914, "global_step": 305221, "epoch": 3677} {"train_loss": -26.172321319580078, "global_step": 305222, "epoch": 3677} {"train_loss": -25.580039978027344, "global_step": 305223, "epoch": 3677} {"train_loss": -25.722021102905273, "global_step": 305224, "epoch": 3677} {"train_loss": -25.791112899780273, "global_step": 305225, "epoch": 3677} {"train_loss": -26.092809677124023, "global_step": 305226, "epoch": 3677} {"train_loss": -25.916818618774414, "global_step": 305227, "epoch": 3677} {"train_loss": -25.9505615234375, "global_step": 305228, "epoch": 3677} {"train_loss": -25.8409366607666, "global_step": 305229, "epoch": 3677} {"train_loss": -25.816314697265625, "global_step": 305230, "epoch": 3677} {"train_loss": -25.713666915893555, "global_step": 305231, "epoch": 3677} {"train_loss": -26.120258331298828, "global_step": 305232, "epoch": 3677} {"train_loss": -25.900379180908203, "global_step": 305233, "epoch": 3677} {"train_loss": -25.846088409423828, "global_step": 305234, "epoch": 3677} {"train_loss": -26.002416610717773, "global_step": 305235, "epoch": 3677} {"train_loss": -25.602514266967773, "global_step": 305236, "epoch": 3677} {"train_loss": -26.09942626953125, "global_step": 305237, "epoch": 3677} {"train_loss": -25.898096084594727, "global_step": 305238, "epoch": 3677} {"train_loss": -25.855615615844727, "global_step": 305239, "epoch": 3677} {"train_loss": -25.942108154296875, "global_step": 305240, "epoch": 3677} {"train_loss": -25.788135528564453, "global_step": 305241, "epoch": 3677} {"train_loss": -25.638751983642578, "global_step": 305242, "epoch": 3677} {"train_loss": -25.508834838867188, "global_step": 305243, "epoch": 3677} {"train_loss": -25.349645614624023, "global_step": 305244, "epoch": 3677} {"train_loss": -25.267257690429688, "global_step": 305245, "epoch": 3677} {"train_loss": -25.586820602416992, "global_step": 305246, "epoch": 3677} {"train_loss": -25.03986167907715, "global_step": 305247, "epoch": 3677} {"train_loss": -25.883142471313477, "global_step": 305248, "epoch": 3677} {"train_loss": -25.43183708190918, "global_step": 305249, "epoch": 3677} {"train_loss": -25.25372886657715, "global_step": 305250, "epoch": 3677} {"train_loss": -25.868854522705078, "global_step": 305251, "epoch": 3677} {"train_loss": -25.5476016998291, "global_step": 305252, "epoch": 3677} {"train_loss": -25.44565773010254, "global_step": 305253, "epoch": 3677} {"train_loss": -25.87244987487793, "global_step": 305254, "epoch": 3677} {"train_loss": -25.521188735961914, "global_step": 305255, "epoch": 3677} {"train_loss": -25.935760498046875, "global_step": 305256, "epoch": 3677} {"train_loss": -25.87861442565918, "global_step": 305257, "epoch": 3677} {"train_loss": -25.41853904724121, "global_step": 305258, "epoch": 3677} {"train_loss": -25.27656364440918, "global_step": 305259, "epoch": 3677} {"train_loss": -25.193662643432617, "global_step": 305260, "epoch": 3677} {"train_loss": -25.684066772460938, "global_step": 305261, "epoch": 3677} {"train_loss": -25.73748779296875, "global_step": 305262, "epoch": 3677} {"train_loss": -25.839954376220703, "global_step": 305263, "epoch": 3677} {"train_loss": -25.628528594970703, "global_step": 305264, "epoch": 3677} {"train_loss": -25.752538681030273, "global_step": 305265, "epoch": 3677} {"train_loss": -25.331716537475586, "global_step": 305266, "epoch": 3677} {"train_loss": -25.818872451782227, "global_step": 305267, "epoch": 3677} {"train_loss": -25.89240074157715, "global_step": 305268, "epoch": 3677} {"train_loss": -25.964818954467773, "global_step": 305269, "epoch": 3677} {"train_loss": -25.87619972229004, "global_step": 305270, "epoch": 3677} {"train_loss": -25.93867301940918, "global_step": 305271, "epoch": 3677} {"train_loss": -25.626432418823242, "global_step": 305272, "epoch": 3677} {"train_loss": -25.696096856910064, "global_step": 305273, "epoch": 3677, "val_loss": 7233973.0} {"train_loss": -25.318267822265625, "global_step": 305274, "epoch": 3678} {"train_loss": -25.430463790893555, "global_step": 305275, "epoch": 3678} {"train_loss": -25.469593048095703, "global_step": 305276, "epoch": 3678} {"train_loss": -25.149494171142578, "global_step": 305277, "epoch": 3678} {"train_loss": -25.17708969116211, "global_step": 305278, "epoch": 3678} {"train_loss": -25.403335571289062, "global_step": 305279, "epoch": 3678} {"train_loss": -24.994455337524414, "global_step": 305280, "epoch": 3678} {"train_loss": -25.511302947998047, "global_step": 305281, "epoch": 3678} {"train_loss": -25.140798568725586, "global_step": 305282, "epoch": 3678} {"train_loss": -25.1814022064209, "global_step": 305283, "epoch": 3678} {"train_loss": -25.336374282836914, "global_step": 305284, "epoch": 3678} {"train_loss": -25.721179962158203, "global_step": 305285, "epoch": 3678} {"train_loss": -25.60888671875, "global_step": 305286, "epoch": 3678} {"train_loss": -25.379186630249023, "global_step": 305287, "epoch": 3678} {"train_loss": -25.772497177124023, "global_step": 305288, "epoch": 3678} {"train_loss": -25.6964054107666, "global_step": 305289, "epoch": 3678} {"train_loss": -25.109222412109375, "global_step": 305290, "epoch": 3678} {"train_loss": -25.62826919555664, "global_step": 305291, "epoch": 3678} {"train_loss": -25.417892456054688, "global_step": 305292, "epoch": 3678} {"train_loss": -25.60821533203125, "global_step": 305293, "epoch": 3678} {"train_loss": -25.45924949645996, "global_step": 305294, "epoch": 3678} {"train_loss": -25.807676315307617, "global_step": 305295, "epoch": 3678} {"train_loss": -25.26058006286621, "global_step": 305296, "epoch": 3678} {"train_loss": -25.656843185424805, "global_step": 305297, "epoch": 3678} {"train_loss": -25.745084762573242, "global_step": 305298, "epoch": 3678} {"train_loss": -25.5832576751709, "global_step": 305299, "epoch": 3678} {"train_loss": -25.8482666015625, "global_step": 305300, "epoch": 3678} {"train_loss": -25.688756942749023, "global_step": 305301, "epoch": 3678} {"train_loss": -26.03143310546875, "global_step": 305302, "epoch": 3678} {"train_loss": -25.90945816040039, "global_step": 305303, "epoch": 3678} {"train_loss": -25.722503662109375, "global_step": 305304, "epoch": 3678} {"train_loss": -25.963626861572266, "global_step": 305305, "epoch": 3678} {"train_loss": -25.86163330078125, "global_step": 305306, "epoch": 3678} {"train_loss": -25.708593368530273, "global_step": 305307, "epoch": 3678} {"train_loss": -25.753082275390625, "global_step": 305308, "epoch": 3678} {"train_loss": -25.931447982788086, "global_step": 305309, "epoch": 3678} {"train_loss": -26.246234893798828, "global_step": 305310, "epoch": 3678} {"train_loss": -25.847339630126953, "global_step": 305311, "epoch": 3678} {"train_loss": -25.80231285095215, "global_step": 305312, "epoch": 3678} {"train_loss": -25.800312042236328, "global_step": 305313, "epoch": 3678} {"train_loss": -25.680456161499023, "global_step": 305314, "epoch": 3678} {"train_loss": -25.652616500854492, "global_step": 305315, "epoch": 3678} {"train_loss": -25.636545181274414, "global_step": 305316, "epoch": 3678} {"train_loss": -25.76690101623535, "global_step": 305317, "epoch": 3678} {"train_loss": -25.969501495361328, "global_step": 305318, "epoch": 3678} {"train_loss": -25.43648338317871, "global_step": 305319, "epoch": 3678} {"train_loss": -25.55864906311035, "global_step": 305320, "epoch": 3678} {"train_loss": -25.674707412719727, "global_step": 305321, "epoch": 3678} {"train_loss": -25.386964797973633, "global_step": 305322, "epoch": 3678} {"train_loss": -25.523847579956055, "global_step": 305323, "epoch": 3678} {"train_loss": -25.860082626342773, "global_step": 305324, "epoch": 3678} {"train_loss": -26.079498291015625, "global_step": 305325, "epoch": 3678} {"train_loss": -26.198028564453125, "global_step": 305326, "epoch": 3678} {"train_loss": -25.74749183654785, "global_step": 305327, "epoch": 3678} {"train_loss": -26.049030303955078, "global_step": 305328, "epoch": 3678} {"train_loss": -25.97995376586914, "global_step": 305329, "epoch": 3678} {"train_loss": -25.884870529174805, "global_step": 305330, "epoch": 3678} {"train_loss": -25.475894927978516, "global_step": 305331, "epoch": 3678} {"train_loss": -25.581655502319336, "global_step": 305332, "epoch": 3678} {"train_loss": -25.59488296508789, "global_step": 305333, "epoch": 3678} {"train_loss": -26.136138916015625, "global_step": 305334, "epoch": 3678} {"train_loss": -25.734683990478516, "global_step": 305335, "epoch": 3678} {"train_loss": -25.608121871948242, "global_step": 305336, "epoch": 3678} {"train_loss": -25.700132369995117, "global_step": 305337, "epoch": 3678} {"train_loss": -25.722599029541016, "global_step": 305338, "epoch": 3678} {"train_loss": -25.50922966003418, "global_step": 305339, "epoch": 3678} {"train_loss": -25.967575073242188, "global_step": 305340, "epoch": 3678} {"train_loss": -25.91212272644043, "global_step": 305341, "epoch": 3678} {"train_loss": -25.570459365844727, "global_step": 305342, "epoch": 3678} {"train_loss": -25.799057006835938, "global_step": 305343, "epoch": 3678} {"train_loss": -25.46009635925293, "global_step": 305344, "epoch": 3678} {"train_loss": -25.44554901123047, "global_step": 305345, "epoch": 3678} {"train_loss": -25.829755783081055, "global_step": 305346, "epoch": 3678} {"train_loss": -25.6342830657959, "global_step": 305347, "epoch": 3678} {"train_loss": -25.612714767456055, "global_step": 305348, "epoch": 3678} {"train_loss": -25.565351486206055, "global_step": 305349, "epoch": 3678} {"train_loss": -25.344633102416992, "global_step": 305350, "epoch": 3678} {"train_loss": -25.8580265045166, "global_step": 305351, "epoch": 3678} {"train_loss": -25.8994083404541, "global_step": 305352, "epoch": 3678} {"train_loss": -25.825605392456055, "global_step": 305353, "epoch": 3678} {"train_loss": -26.037057876586914, "global_step": 305354, "epoch": 3678} {"train_loss": -25.6656494140625, "global_step": 305355, "epoch": 3678} {"train_loss": -25.666885330016356, "global_step": 305356, "epoch": 3678, "val_loss": 7331265.0} {"train_loss": -25.37628746032715, "global_step": 305357, "epoch": 3679} {"train_loss": -24.51398277282715, "global_step": 305358, "epoch": 3679} {"train_loss": -24.224767684936523, "global_step": 305359, "epoch": 3679} {"train_loss": -25.08173179626465, "global_step": 305360, "epoch": 3679} {"train_loss": -24.7471981048584, "global_step": 305361, "epoch": 3679} {"train_loss": -25.252653121948242, "global_step": 305362, "epoch": 3679} {"train_loss": -25.107717514038086, "global_step": 305363, "epoch": 3679} {"train_loss": -25.040163040161133, "global_step": 305364, "epoch": 3679} {"train_loss": -25.025484085083008, "global_step": 305365, "epoch": 3679} {"train_loss": -25.294940948486328, "global_step": 305366, "epoch": 3679} {"train_loss": -25.34596824645996, "global_step": 305367, "epoch": 3679} {"train_loss": -25.200475692749023, "global_step": 305368, "epoch": 3679} {"train_loss": -25.06589698791504, "global_step": 305369, "epoch": 3679} {"train_loss": -25.162668228149414, "global_step": 305370, "epoch": 3679} {"train_loss": -25.287521362304688, "global_step": 305371, "epoch": 3679} {"train_loss": -25.351669311523438, "global_step": 305372, "epoch": 3679} {"train_loss": -25.339841842651367, "global_step": 305373, "epoch": 3679} {"train_loss": -25.7901611328125, "global_step": 305374, "epoch": 3679} {"train_loss": -25.741708755493164, "global_step": 305375, "epoch": 3679} {"train_loss": -25.300100326538086, "global_step": 305376, "epoch": 3679} {"train_loss": -25.890090942382812, "global_step": 305377, "epoch": 3679} {"train_loss": -25.608047485351562, "global_step": 305378, "epoch": 3679} {"train_loss": -25.682538986206055, "global_step": 305379, "epoch": 3679} {"train_loss": -24.83045768737793, "global_step": 305380, "epoch": 3679} {"train_loss": -25.526885986328125, "global_step": 305381, "epoch": 3679} {"train_loss": -25.293664932250977, "global_step": 305382, "epoch": 3679} {"train_loss": -25.743350982666016, "global_step": 305383, "epoch": 3679} {"train_loss": -25.48390007019043, "global_step": 305384, "epoch": 3679} {"train_loss": -25.806110382080078, "global_step": 305385, "epoch": 3679} {"train_loss": -25.21075439453125, "global_step": 305386, "epoch": 3679} {"train_loss": -25.443912506103516, "global_step": 305387, "epoch": 3679} {"train_loss": -25.34541130065918, "global_step": 305388, "epoch": 3679} {"train_loss": -25.197784423828125, "global_step": 305389, "epoch": 3679} {"train_loss": -25.475061416625977, "global_step": 305390, "epoch": 3679} {"train_loss": -25.304716110229492, "global_step": 305391, "epoch": 3679} {"train_loss": -25.725133895874023, "global_step": 305392, "epoch": 3679} {"train_loss": -25.323789596557617, "global_step": 305393, "epoch": 3679} {"train_loss": -25.600934982299805, "global_step": 305394, "epoch": 3679} {"train_loss": -25.809362411499023, "global_step": 305395, "epoch": 3679} {"train_loss": -25.49226951599121, "global_step": 305396, "epoch": 3679} {"train_loss": -25.411367416381836, "global_step": 305397, "epoch": 3679} {"train_loss": -25.651227951049805, "global_step": 305398, "epoch": 3679} {"train_loss": -25.752124786376953, "global_step": 305399, "epoch": 3679} {"train_loss": -25.68756103515625, "global_step": 305400, "epoch": 3679} {"train_loss": -25.937015533447266, "global_step": 305401, "epoch": 3679} {"train_loss": -26.041784286499023, "global_step": 305402, "epoch": 3679} {"train_loss": -25.754520416259766, "global_step": 305403, "epoch": 3679} {"train_loss": -25.771814346313477, "global_step": 305404, "epoch": 3679} {"train_loss": -25.636411666870117, "global_step": 305405, "epoch": 3679} {"train_loss": -25.81683921813965, "global_step": 305406, "epoch": 3679} {"train_loss": -25.47810935974121, "global_step": 305407, "epoch": 3679} {"train_loss": -25.558612823486328, "global_step": 305408, "epoch": 3679} {"train_loss": -25.81672477722168, "global_step": 305409, "epoch": 3679} {"train_loss": -26.112024307250977, "global_step": 305410, "epoch": 3679} {"train_loss": -25.816679000854492, "global_step": 305411, "epoch": 3679} {"train_loss": -25.787097930908203, "global_step": 305412, "epoch": 3679} {"train_loss": -25.704008102416992, "global_step": 305413, "epoch": 3679} {"train_loss": -25.55731773376465, "global_step": 305414, "epoch": 3679} {"train_loss": -25.844675064086914, "global_step": 305415, "epoch": 3679} {"train_loss": -25.999902725219727, "global_step": 305416, "epoch": 3679} {"train_loss": -25.7675838470459, "global_step": 305417, "epoch": 3679} {"train_loss": -25.651426315307617, "global_step": 305418, "epoch": 3679} {"train_loss": -25.676618576049805, "global_step": 305419, "epoch": 3679} {"train_loss": -25.78748893737793, "global_step": 305420, "epoch": 3679} {"train_loss": -25.56454849243164, "global_step": 305421, "epoch": 3679} {"train_loss": -25.781171798706055, "global_step": 305422, "epoch": 3679} {"train_loss": -25.846435546875, "global_step": 305423, "epoch": 3679} {"train_loss": -25.474761962890625, "global_step": 305424, "epoch": 3679} {"train_loss": -25.625320434570312, "global_step": 305425, "epoch": 3679} {"train_loss": -25.675085067749023, "global_step": 305426, "epoch": 3679} {"train_loss": -25.626708984375, "global_step": 305427, "epoch": 3679} {"train_loss": -25.776721954345703, "global_step": 305428, "epoch": 3679} {"train_loss": -25.836750030517578, "global_step": 305429, "epoch": 3679} {"train_loss": -25.48414421081543, "global_step": 305430, "epoch": 3679} {"train_loss": -26.124204635620117, "global_step": 305431, "epoch": 3679} {"train_loss": -25.826826095581055, "global_step": 305432, "epoch": 3679} {"train_loss": -25.91617774963379, "global_step": 305433, "epoch": 3679} {"train_loss": -26.052997589111328, "global_step": 305434, "epoch": 3679} {"train_loss": -25.831640243530273, "global_step": 305435, "epoch": 3679} {"train_loss": -25.737506866455078, "global_step": 305436, "epoch": 3679} {"train_loss": -25.693042755126953, "global_step": 305437, "epoch": 3679} {"train_loss": -26.26877784729004, "global_step": 305438, "epoch": 3679} {"train_loss": -25.540079921124928, "global_step": 305439, "epoch": 3679, "val_loss": 7274378.0} {"train_loss": -24.825841903686523, "global_step": 305440, "epoch": 3680} {"train_loss": -24.589879989624023, "global_step": 305441, "epoch": 3680} {"train_loss": -23.499292373657227, "global_step": 305442, "epoch": 3680} {"train_loss": -23.744237899780273, "global_step": 305443, "epoch": 3680} {"train_loss": -25.202802658081055, "global_step": 305444, "epoch": 3680} {"train_loss": -24.640188217163086, "global_step": 305445, "epoch": 3680} {"train_loss": -24.857824325561523, "global_step": 305446, "epoch": 3680} {"train_loss": -25.113039016723633, "global_step": 305447, "epoch": 3680} {"train_loss": -25.05723762512207, "global_step": 305448, "epoch": 3680} {"train_loss": -24.923160552978516, "global_step": 305449, "epoch": 3680} {"train_loss": -25.532636642456055, "global_step": 305450, "epoch": 3680} {"train_loss": -25.09112548828125, "global_step": 305451, "epoch": 3680} {"train_loss": -25.5843505859375, "global_step": 305452, "epoch": 3680} {"train_loss": -24.93280601501465, "global_step": 305453, "epoch": 3680} {"train_loss": -25.214481353759766, "global_step": 305454, "epoch": 3680} {"train_loss": -24.920011520385742, "global_step": 305455, "epoch": 3680} {"train_loss": -25.112564086914062, "global_step": 305456, "epoch": 3680} {"train_loss": -25.448339462280273, "global_step": 305457, "epoch": 3680} {"train_loss": -25.039358139038086, "global_step": 305458, "epoch": 3680} {"train_loss": -25.28441619873047, "global_step": 305459, "epoch": 3680} {"train_loss": -25.089828491210938, "global_step": 305460, "epoch": 3680} {"train_loss": -25.235036849975586, "global_step": 305461, "epoch": 3680} {"train_loss": -25.58843421936035, "global_step": 305462, "epoch": 3680} {"train_loss": -25.109712600708008, "global_step": 305463, "epoch": 3680} {"train_loss": -25.54875946044922, "global_step": 305464, "epoch": 3680} {"train_loss": -25.461002349853516, "global_step": 305465, "epoch": 3680} {"train_loss": -25.74884605407715, "global_step": 305466, "epoch": 3680} {"train_loss": -25.646093368530273, "global_step": 305467, "epoch": 3680} {"train_loss": -25.806049346923828, "global_step": 305468, "epoch": 3680} {"train_loss": -25.50296974182129, "global_step": 305469, "epoch": 3680} {"train_loss": -25.488916397094727, "global_step": 305470, "epoch": 3680} {"train_loss": -25.644489288330078, "global_step": 305471, "epoch": 3680} {"train_loss": -25.718164443969727, "global_step": 305472, "epoch": 3680} {"train_loss": -25.86182975769043, "global_step": 305473, "epoch": 3680} {"train_loss": -25.7078914642334, "global_step": 305474, "epoch": 3680} {"train_loss": -25.854267120361328, "global_step": 305475, "epoch": 3680} {"train_loss": -25.845129013061523, "global_step": 305476, "epoch": 3680} {"train_loss": -25.513452529907227, "global_step": 305477, "epoch": 3680} {"train_loss": -25.675573348999023, "global_step": 305478, "epoch": 3680} {"train_loss": -25.45871353149414, "global_step": 305479, "epoch": 3680} {"train_loss": -26.09161949157715, "global_step": 305480, "epoch": 3680} {"train_loss": -25.661619186401367, "global_step": 305481, "epoch": 3680} {"train_loss": -25.70773696899414, "global_step": 305482, "epoch": 3680} {"train_loss": -25.662246704101562, "global_step": 305483, "epoch": 3680} {"train_loss": -26.112945556640625, "global_step": 305484, "epoch": 3680} {"train_loss": -25.894617080688477, "global_step": 305485, "epoch": 3680} {"train_loss": -25.79815101623535, "global_step": 305486, "epoch": 3680} {"train_loss": -25.532442092895508, "global_step": 305487, "epoch": 3680} {"train_loss": -25.723342895507812, "global_step": 305488, "epoch": 3680} {"train_loss": -25.63273048400879, "global_step": 305489, "epoch": 3680} {"train_loss": -25.740400314331055, "global_step": 305490, "epoch": 3680} {"train_loss": -25.928075790405273, "global_step": 305491, "epoch": 3680} {"train_loss": -26.007795333862305, "global_step": 305492, "epoch": 3680} {"train_loss": -26.11090087890625, "global_step": 305493, "epoch": 3680} {"train_loss": -25.7852783203125, "global_step": 305494, "epoch": 3680} {"train_loss": -25.938642501831055, "global_step": 305495, "epoch": 3680} {"train_loss": -25.654775619506836, "global_step": 305496, "epoch": 3680} {"train_loss": -25.986433029174805, "global_step": 305497, "epoch": 3680} {"train_loss": -25.765195846557617, "global_step": 305498, "epoch": 3680} {"train_loss": -25.949331283569336, "global_step": 305499, "epoch": 3680} {"train_loss": -25.6112060546875, "global_step": 305500, "epoch": 3680} {"train_loss": -25.96290397644043, "global_step": 305501, "epoch": 3680} {"train_loss": -25.375913619995117, "global_step": 305502, "epoch": 3680} {"train_loss": -24.772716522216797, "global_step": 305503, "epoch": 3680} {"train_loss": -25.24285316467285, "global_step": 305504, "epoch": 3680} {"train_loss": -25.211624145507812, "global_step": 305505, "epoch": 3680} {"train_loss": -24.552154541015625, "global_step": 305506, "epoch": 3680} {"train_loss": -25.379358291625977, "global_step": 305507, "epoch": 3680} {"train_loss": -24.830524444580078, "global_step": 305508, "epoch": 3680} {"train_loss": -25.467208862304688, "global_step": 305509, "epoch": 3680} {"train_loss": -24.718360900878906, "global_step": 305510, "epoch": 3680} {"train_loss": -25.81512451171875, "global_step": 305511, "epoch": 3680} {"train_loss": -24.535940170288086, "global_step": 305512, "epoch": 3680} {"train_loss": -25.600723266601562, "global_step": 305513, "epoch": 3680} {"train_loss": -24.977991104125977, "global_step": 305514, "epoch": 3680} {"train_loss": -25.30109214782715, "global_step": 305515, "epoch": 3680} {"train_loss": -25.18452262878418, "global_step": 305516, "epoch": 3680} {"train_loss": -25.413827896118164, "global_step": 305517, "epoch": 3680} {"train_loss": -25.465179443359375, "global_step": 305518, "epoch": 3680} {"train_loss": -25.183425903320312, "global_step": 305519, "epoch": 3680} {"train_loss": -25.496362686157227, "global_step": 305520, "epoch": 3680} {"train_loss": -25.503341674804688, "global_step": 305521, "epoch": 3680} {"train_loss": -25.380243439272224, "global_step": 305522, "epoch": 3680, "val_loss": 7027657.5} {"train_loss": -24.35170555114746, "global_step": 305523, "epoch": 3681} {"train_loss": -24.247095108032227, "global_step": 305524, "epoch": 3681} {"train_loss": -23.810022354125977, "global_step": 305525, "epoch": 3681} {"train_loss": -25.1039981842041, "global_step": 305526, "epoch": 3681} {"train_loss": -24.928396224975586, "global_step": 305527, "epoch": 3681} {"train_loss": -24.689279556274414, "global_step": 305528, "epoch": 3681} {"train_loss": -24.9422550201416, "global_step": 305529, "epoch": 3681} {"train_loss": -24.9930419921875, "global_step": 305530, "epoch": 3681} {"train_loss": -24.990140914916992, "global_step": 305531, "epoch": 3681} {"train_loss": -25.156375885009766, "global_step": 305532, "epoch": 3681} {"train_loss": -25.480690002441406, "global_step": 305533, "epoch": 3681} {"train_loss": -24.878965377807617, "global_step": 305534, "epoch": 3681} {"train_loss": -25.345991134643555, "global_step": 305535, "epoch": 3681} {"train_loss": -25.644235610961914, "global_step": 305536, "epoch": 3681} {"train_loss": -25.340862274169922, "global_step": 305537, "epoch": 3681} {"train_loss": -24.812259674072266, "global_step": 305538, "epoch": 3681} {"train_loss": -25.402606964111328, "global_step": 305539, "epoch": 3681} {"train_loss": -25.26666831970215, "global_step": 305540, "epoch": 3681} {"train_loss": -25.594417572021484, "global_step": 305541, "epoch": 3681} {"train_loss": -25.132944107055664, "global_step": 305542, "epoch": 3681} {"train_loss": -25.236948013305664, "global_step": 305543, "epoch": 3681} {"train_loss": -25.428476333618164, "global_step": 305544, "epoch": 3681} {"train_loss": -25.507173538208008, "global_step": 305545, "epoch": 3681} {"train_loss": -25.67725944519043, "global_step": 305546, "epoch": 3681} {"train_loss": -25.666217803955078, "global_step": 305547, "epoch": 3681} {"train_loss": -25.550539016723633, "global_step": 305548, "epoch": 3681} {"train_loss": -25.392696380615234, "global_step": 305549, "epoch": 3681} {"train_loss": -25.75518798828125, "global_step": 305550, "epoch": 3681} {"train_loss": -25.896203994750977, "global_step": 305551, "epoch": 3681} {"train_loss": -25.554094314575195, "global_step": 305552, "epoch": 3681} {"train_loss": -25.609725952148438, "global_step": 305553, "epoch": 3681} {"train_loss": -25.841184616088867, "global_step": 305554, "epoch": 3681} {"train_loss": -25.830896377563477, "global_step": 305555, "epoch": 3681} {"train_loss": -25.593351364135742, "global_step": 305556, "epoch": 3681} {"train_loss": -25.908905029296875, "global_step": 305557, "epoch": 3681} {"train_loss": -25.844518661499023, "global_step": 305558, "epoch": 3681} {"train_loss": -25.746891021728516, "global_step": 305559, "epoch": 3681} {"train_loss": -26.096405029296875, "global_step": 305560, "epoch": 3681} {"train_loss": -25.95185661315918, "global_step": 305561, "epoch": 3681} {"train_loss": -26.31631851196289, "global_step": 305562, "epoch": 3681} {"train_loss": -25.927112579345703, "global_step": 305563, "epoch": 3681} {"train_loss": -26.0560302734375, "global_step": 305564, "epoch": 3681} {"train_loss": -25.66037940979004, "global_step": 305565, "epoch": 3681} {"train_loss": -25.842695236206055, "global_step": 305566, "epoch": 3681} {"train_loss": -25.692365646362305, "global_step": 305567, "epoch": 3681} {"train_loss": -25.379281997680664, "global_step": 305568, "epoch": 3681} {"train_loss": -25.6153621673584, "global_step": 305569, "epoch": 3681} {"train_loss": -25.29587745666504, "global_step": 305570, "epoch": 3681} {"train_loss": -25.775726318359375, "global_step": 305571, "epoch": 3681} {"train_loss": -25.80230140686035, "global_step": 305572, "epoch": 3681} {"train_loss": -25.7050838470459, "global_step": 305573, "epoch": 3681} {"train_loss": -25.784351348876953, "global_step": 305574, "epoch": 3681} {"train_loss": -25.82305908203125, "global_step": 305575, "epoch": 3681} {"train_loss": -25.537805557250977, "global_step": 305576, "epoch": 3681} {"train_loss": -26.05167007446289, "global_step": 305577, "epoch": 3681} {"train_loss": -25.67017936706543, "global_step": 305578, "epoch": 3681} {"train_loss": -25.629255294799805, "global_step": 305579, "epoch": 3681} {"train_loss": -25.424667358398438, "global_step": 305580, "epoch": 3681} {"train_loss": -25.406126022338867, "global_step": 305581, "epoch": 3681} {"train_loss": -25.7861270904541, "global_step": 305582, "epoch": 3681} {"train_loss": -25.812467575073242, "global_step": 305583, "epoch": 3681} {"train_loss": -25.9774227142334, "global_step": 305584, "epoch": 3681} {"train_loss": -25.583404541015625, "global_step": 305585, "epoch": 3681} {"train_loss": -26.06912612915039, "global_step": 305586, "epoch": 3681} {"train_loss": -25.62019157409668, "global_step": 305587, "epoch": 3681} {"train_loss": -26.19548988342285, "global_step": 305588, "epoch": 3681} {"train_loss": -26.044546127319336, "global_step": 305589, "epoch": 3681} {"train_loss": -25.709203720092773, "global_step": 305590, "epoch": 3681} {"train_loss": -25.83966064453125, "global_step": 305591, "epoch": 3681} {"train_loss": -25.701383590698242, "global_step": 305592, "epoch": 3681} {"train_loss": -25.73463249206543, "global_step": 305593, "epoch": 3681} {"train_loss": -25.45041275024414, "global_step": 305594, "epoch": 3681} {"train_loss": -25.616256713867188, "global_step": 305595, "epoch": 3681} {"train_loss": -25.762042999267578, "global_step": 305596, "epoch": 3681} {"train_loss": -25.363666534423828, "global_step": 305597, "epoch": 3681} {"train_loss": -25.865079879760742, "global_step": 305598, "epoch": 3681} {"train_loss": -25.4591121673584, "global_step": 305599, "epoch": 3681} {"train_loss": -25.624496459960938, "global_step": 305600, "epoch": 3681} {"train_loss": -25.73955726623535, "global_step": 305601, "epoch": 3681} {"train_loss": -25.795629501342773, "global_step": 305602, "epoch": 3681} {"train_loss": -25.48160743713379, "global_step": 305603, "epoch": 3681} {"train_loss": -25.7906436920166, "global_step": 305604, "epoch": 3681} {"train_loss": -25.542826824877636, "global_step": 305605, "epoch": 3681, "val_loss": 7191502.0} {"train_loss": -25.396976470947266, "global_step": 305606, "epoch": 3682} {"train_loss": -25.314411163330078, "global_step": 305607, "epoch": 3682} {"train_loss": -25.391681671142578, "global_step": 305608, "epoch": 3682} {"train_loss": -25.345834732055664, "global_step": 305609, "epoch": 3682} {"train_loss": -25.335758209228516, "global_step": 305610, "epoch": 3682} {"train_loss": -25.43636131286621, "global_step": 305611, "epoch": 3682} {"train_loss": -25.516483306884766, "global_step": 305612, "epoch": 3682} {"train_loss": -25.404081344604492, "global_step": 305613, "epoch": 3682} {"train_loss": -25.5651798248291, "global_step": 305614, "epoch": 3682} {"train_loss": -25.8492374420166, "global_step": 305615, "epoch": 3682} {"train_loss": -25.82305908203125, "global_step": 305616, "epoch": 3682} {"train_loss": -25.47186851501465, "global_step": 305617, "epoch": 3682} {"train_loss": -25.584091186523438, "global_step": 305618, "epoch": 3682} {"train_loss": -25.65778923034668, "global_step": 305619, "epoch": 3682} {"train_loss": -25.0387020111084, "global_step": 305620, "epoch": 3682} {"train_loss": -25.068510055541992, "global_step": 305621, "epoch": 3682} {"train_loss": -25.597082138061523, "global_step": 305622, "epoch": 3682} {"train_loss": -25.572683334350586, "global_step": 305623, "epoch": 3682} {"train_loss": -25.844970703125, "global_step": 305624, "epoch": 3682} {"train_loss": -25.89678382873535, "global_step": 305625, "epoch": 3682} {"train_loss": -25.46708106994629, "global_step": 305626, "epoch": 3682} {"train_loss": -25.48189926147461, "global_step": 305627, "epoch": 3682} {"train_loss": -25.348913192749023, "global_step": 305628, "epoch": 3682} {"train_loss": -25.145214080810547, "global_step": 305629, "epoch": 3682} {"train_loss": -25.54990005493164, "global_step": 305630, "epoch": 3682} {"train_loss": -25.655975341796875, "global_step": 305631, "epoch": 3682} {"train_loss": -25.66000747680664, "global_step": 305632, "epoch": 3682} {"train_loss": -25.99917984008789, "global_step": 305633, "epoch": 3682} {"train_loss": -25.49226951599121, "global_step": 305634, "epoch": 3682} {"train_loss": -25.51823616027832, "global_step": 305635, "epoch": 3682} {"train_loss": -25.44445037841797, "global_step": 305636, "epoch": 3682} {"train_loss": -25.31548500061035, "global_step": 305637, "epoch": 3682} {"train_loss": -25.433547973632812, "global_step": 305638, "epoch": 3682} {"train_loss": -25.683856964111328, "global_step": 305639, "epoch": 3682} {"train_loss": -25.544937133789062, "global_step": 305640, "epoch": 3682} {"train_loss": -25.53969383239746, "global_step": 305641, "epoch": 3682} {"train_loss": -25.550947189331055, "global_step": 305642, "epoch": 3682} {"train_loss": -25.830854415893555, "global_step": 305643, "epoch": 3682} {"train_loss": -25.592844009399414, "global_step": 305644, "epoch": 3682} {"train_loss": -25.395505905151367, "global_step": 305645, "epoch": 3682} {"train_loss": -25.725387573242188, "global_step": 305646, "epoch": 3682} {"train_loss": -25.663915634155273, "global_step": 305647, "epoch": 3682} {"train_loss": -25.593595504760742, "global_step": 305648, "epoch": 3682} {"train_loss": -25.632434844970703, "global_step": 305649, "epoch": 3682} {"train_loss": -25.626615524291992, "global_step": 305650, "epoch": 3682} {"train_loss": -25.334211349487305, "global_step": 305651, "epoch": 3682} {"train_loss": -25.676620483398438, "global_step": 305652, "epoch": 3682} {"train_loss": -25.944091796875, "global_step": 305653, "epoch": 3682} {"train_loss": -25.786609649658203, "global_step": 305654, "epoch": 3682} {"train_loss": -25.743066787719727, "global_step": 305655, "epoch": 3682} {"train_loss": -25.894351959228516, "global_step": 305656, "epoch": 3682} {"train_loss": -25.62420082092285, "global_step": 305657, "epoch": 3682} {"train_loss": -26.353315353393555, "global_step": 305658, "epoch": 3682} {"train_loss": -25.618167877197266, "global_step": 305659, "epoch": 3682} {"train_loss": -25.690916061401367, "global_step": 305660, "epoch": 3682} {"train_loss": -25.757892608642578, "global_step": 305661, "epoch": 3682} {"train_loss": -25.51738739013672, "global_step": 305662, "epoch": 3682} {"train_loss": -25.438617706298828, "global_step": 305663, "epoch": 3682} {"train_loss": -25.59251594543457, "global_step": 305664, "epoch": 3682} {"train_loss": -26.126602172851562, "global_step": 305665, "epoch": 3682} {"train_loss": -25.61203384399414, "global_step": 305666, "epoch": 3682} {"train_loss": -25.88533592224121, "global_step": 305667, "epoch": 3682} {"train_loss": -25.657983779907227, "global_step": 305668, "epoch": 3682} {"train_loss": -25.860671997070312, "global_step": 305669, "epoch": 3682} {"train_loss": -25.646900177001953, "global_step": 305670, "epoch": 3682} {"train_loss": -25.774457931518555, "global_step": 305671, "epoch": 3682} {"train_loss": -25.33024787902832, "global_step": 305672, "epoch": 3682} {"train_loss": -25.505788803100586, "global_step": 305673, "epoch": 3682} {"train_loss": -25.139503479003906, "global_step": 305674, "epoch": 3682} {"train_loss": -25.736249923706055, "global_step": 305675, "epoch": 3682} {"train_loss": -25.44439125061035, "global_step": 305676, "epoch": 3682} {"train_loss": -25.596799850463867, "global_step": 305677, "epoch": 3682} {"train_loss": -25.6484432220459, "global_step": 305678, "epoch": 3682} {"train_loss": -25.59956169128418, "global_step": 305679, "epoch": 3682} {"train_loss": -25.783971786499023, "global_step": 305680, "epoch": 3682} {"train_loss": -25.591201782226562, "global_step": 305681, "epoch": 3682} {"train_loss": -25.66451072692871, "global_step": 305682, "epoch": 3682} {"train_loss": -26.015884399414062, "global_step": 305683, "epoch": 3682} {"train_loss": -25.887805938720703, "global_step": 305684, "epoch": 3682} {"train_loss": -25.482789993286133, "global_step": 305685, "epoch": 3682} {"train_loss": -25.93873405456543, "global_step": 305686, "epoch": 3682} {"train_loss": -25.689477920532227, "global_step": 305687, "epoch": 3682} {"train_loss": -25.592675450336504, "global_step": 305688, "epoch": 3682, "val_loss": 7048120.0} {"train_loss": -24.808652877807617, "global_step": 305689, "epoch": 3683} {"train_loss": -24.491994857788086, "global_step": 305690, "epoch": 3683} {"train_loss": -24.73287010192871, "global_step": 305691, "epoch": 3683} {"train_loss": -25.01955223083496, "global_step": 305692, "epoch": 3683} {"train_loss": -25.251815795898438, "global_step": 305693, "epoch": 3683} {"train_loss": -24.475549697875977, "global_step": 305694, "epoch": 3683} {"train_loss": -25.53581428527832, "global_step": 305695, "epoch": 3683} {"train_loss": -24.667922973632812, "global_step": 305696, "epoch": 3683} {"train_loss": -25.385622024536133, "global_step": 305697, "epoch": 3683} {"train_loss": -25.31381607055664, "global_step": 305698, "epoch": 3683} {"train_loss": -24.932024002075195, "global_step": 305699, "epoch": 3683} {"train_loss": -25.28424644470215, "global_step": 305700, "epoch": 3683} {"train_loss": -25.0557861328125, "global_step": 305701, "epoch": 3683} {"train_loss": -25.583459854125977, "global_step": 305702, "epoch": 3683} {"train_loss": -25.01873779296875, "global_step": 305703, "epoch": 3683} {"train_loss": -25.444461822509766, "global_step": 305704, "epoch": 3683} {"train_loss": -25.58696937561035, "global_step": 305705, "epoch": 3683} {"train_loss": -25.606958389282227, "global_step": 305706, "epoch": 3683} {"train_loss": -25.372663497924805, "global_step": 305707, "epoch": 3683} {"train_loss": -25.285810470581055, "global_step": 305708, "epoch": 3683} {"train_loss": -25.826452255249023, "global_step": 305709, "epoch": 3683} {"train_loss": -25.650043487548828, "global_step": 305710, "epoch": 3683} {"train_loss": -25.377962112426758, "global_step": 305711, "epoch": 3683} {"train_loss": -25.746877670288086, "global_step": 305712, "epoch": 3683} {"train_loss": -25.820653915405273, "global_step": 305713, "epoch": 3683} {"train_loss": -25.871967315673828, "global_step": 305714, "epoch": 3683} {"train_loss": -25.387800216674805, "global_step": 305715, "epoch": 3683} {"train_loss": -25.869998931884766, "global_step": 305716, "epoch": 3683} {"train_loss": -25.6295166015625, "global_step": 305717, "epoch": 3683} {"train_loss": -25.79025650024414, "global_step": 305718, "epoch": 3683} {"train_loss": -25.646915435791016, "global_step": 305719, "epoch": 3683} {"train_loss": -25.574148178100586, "global_step": 305720, "epoch": 3683} {"train_loss": -25.282079696655273, "global_step": 305721, "epoch": 3683} {"train_loss": -25.652517318725586, "global_step": 305722, "epoch": 3683} {"train_loss": -26.06593132019043, "global_step": 305723, "epoch": 3683} {"train_loss": -25.546586990356445, "global_step": 305724, "epoch": 3683} {"train_loss": -25.238969802856445, "global_step": 305725, "epoch": 3683} {"train_loss": -25.871259689331055, "global_step": 305726, "epoch": 3683} {"train_loss": -25.273529052734375, "global_step": 305727, "epoch": 3683} {"train_loss": -25.681690216064453, "global_step": 305728, "epoch": 3683} {"train_loss": -25.802417755126953, "global_step": 305729, "epoch": 3683} {"train_loss": -25.50288963317871, "global_step": 305730, "epoch": 3683} {"train_loss": -25.9224853515625, "global_step": 305731, "epoch": 3683} {"train_loss": -25.802885055541992, "global_step": 305732, "epoch": 3683} {"train_loss": -25.91656494140625, "global_step": 305733, "epoch": 3683} {"train_loss": -25.33558464050293, "global_step": 305734, "epoch": 3683} {"train_loss": -25.558576583862305, "global_step": 305735, "epoch": 3683} {"train_loss": -25.715259552001953, "global_step": 305736, "epoch": 3683} {"train_loss": -25.852758407592773, "global_step": 305737, "epoch": 3683} {"train_loss": -26.142492294311523, "global_step": 305738, "epoch": 3683} {"train_loss": -25.57185173034668, "global_step": 305739, "epoch": 3683} {"train_loss": -25.929340362548828, "global_step": 305740, "epoch": 3683} {"train_loss": -25.46003532409668, "global_step": 305741, "epoch": 3683} {"train_loss": -26.02985191345215, "global_step": 305742, "epoch": 3683} {"train_loss": -25.489927291870117, "global_step": 305743, "epoch": 3683} {"train_loss": -25.418781280517578, "global_step": 305744, "epoch": 3683} {"train_loss": -25.68973731994629, "global_step": 305745, "epoch": 3683} {"train_loss": -25.902618408203125, "global_step": 305746, "epoch": 3683} {"train_loss": -25.440414428710938, "global_step": 305747, "epoch": 3683} {"train_loss": -26.006845474243164, "global_step": 305748, "epoch": 3683} {"train_loss": -25.6239013671875, "global_step": 305749, "epoch": 3683} {"train_loss": -25.423856735229492, "global_step": 305750, "epoch": 3683} {"train_loss": -25.39366340637207, "global_step": 305751, "epoch": 3683} {"train_loss": -25.537752151489258, "global_step": 305752, "epoch": 3683} {"train_loss": -25.65375328063965, "global_step": 305753, "epoch": 3683} {"train_loss": -25.7530574798584, "global_step": 305754, "epoch": 3683} {"train_loss": -25.47218894958496, "global_step": 305755, "epoch": 3683} {"train_loss": -25.531599044799805, "global_step": 305756, "epoch": 3683} {"train_loss": -25.880325317382812, "global_step": 305757, "epoch": 3683} {"train_loss": -25.842269897460938, "global_step": 305758, "epoch": 3683} {"train_loss": -25.71439552307129, "global_step": 305759, "epoch": 3683} {"train_loss": -25.627490997314453, "global_step": 305760, "epoch": 3683} {"train_loss": -25.525442123413086, "global_step": 305761, "epoch": 3683} {"train_loss": -25.39841079711914, "global_step": 305762, "epoch": 3683} {"train_loss": -25.755889892578125, "global_step": 305763, "epoch": 3683} {"train_loss": -25.71540641784668, "global_step": 305764, "epoch": 3683} {"train_loss": -25.669301986694336, "global_step": 305765, "epoch": 3683} {"train_loss": -25.76740074157715, "global_step": 305766, "epoch": 3683} {"train_loss": -26.028751373291016, "global_step": 305767, "epoch": 3683} {"train_loss": -25.74393653869629, "global_step": 305768, "epoch": 3683} {"train_loss": -26.01704216003418, "global_step": 305769, "epoch": 3683} {"train_loss": -26.133596420288086, "global_step": 305770, "epoch": 3683} {"train_loss": -25.561753169599786, "global_step": 305771, "epoch": 3683, "val_loss": 7241242.0} {"train_loss": -25.491119384765625, "global_step": 305772, "epoch": 3684} {"train_loss": -25.53706169128418, "global_step": 305773, "epoch": 3684} {"train_loss": -25.450069427490234, "global_step": 305774, "epoch": 3684} {"train_loss": -25.689807891845703, "global_step": 305775, "epoch": 3684} {"train_loss": -25.430496215820312, "global_step": 305776, "epoch": 3684} {"train_loss": -25.680810928344727, "global_step": 305777, "epoch": 3684} {"train_loss": -25.842487335205078, "global_step": 305778, "epoch": 3684} {"train_loss": -25.683002471923828, "global_step": 305779, "epoch": 3684} {"train_loss": -25.350433349609375, "global_step": 305780, "epoch": 3684} {"train_loss": -25.48872947692871, "global_step": 305781, "epoch": 3684} {"train_loss": -25.67818260192871, "global_step": 305782, "epoch": 3684} {"train_loss": -25.872034072875977, "global_step": 305783, "epoch": 3684} {"train_loss": -25.59819793701172, "global_step": 305784, "epoch": 3684} {"train_loss": -26.116546630859375, "global_step": 305785, "epoch": 3684} {"train_loss": -25.616846084594727, "global_step": 305786, "epoch": 3684} {"train_loss": -25.860309600830078, "global_step": 305787, "epoch": 3684} {"train_loss": -25.562530517578125, "global_step": 305788, "epoch": 3684} {"train_loss": -25.8035945892334, "global_step": 305789, "epoch": 3684} {"train_loss": -25.606420516967773, "global_step": 305790, "epoch": 3684} {"train_loss": -25.705169677734375, "global_step": 305791, "epoch": 3684} {"train_loss": -25.92484474182129, "global_step": 305792, "epoch": 3684} {"train_loss": -26.048297882080078, "global_step": 305793, "epoch": 3684} {"train_loss": -25.574644088745117, "global_step": 305794, "epoch": 3684} {"train_loss": -25.528289794921875, "global_step": 305795, "epoch": 3684} {"train_loss": -25.89751625061035, "global_step": 305796, "epoch": 3684} {"train_loss": -25.675214767456055, "global_step": 305797, "epoch": 3684} {"train_loss": -25.70453453063965, "global_step": 305798, "epoch": 3684} {"train_loss": -26.03464126586914, "global_step": 305799, "epoch": 3684} {"train_loss": -25.518800735473633, "global_step": 305800, "epoch": 3684} {"train_loss": -25.687314987182617, "global_step": 305801, "epoch": 3684} {"train_loss": -25.966150283813477, "global_step": 305802, "epoch": 3684} {"train_loss": -25.71567726135254, "global_step": 305803, "epoch": 3684} {"train_loss": -25.716379165649414, "global_step": 305804, "epoch": 3684} {"train_loss": -25.784814834594727, "global_step": 305805, "epoch": 3684} {"train_loss": -26.004108428955078, "global_step": 305806, "epoch": 3684} {"train_loss": -25.552030563354492, "global_step": 305807, "epoch": 3684} {"train_loss": -25.601856231689453, "global_step": 305808, "epoch": 3684} {"train_loss": -25.479339599609375, "global_step": 305809, "epoch": 3684} {"train_loss": -25.808927536010742, "global_step": 305810, "epoch": 3684} {"train_loss": -25.537212371826172, "global_step": 305811, "epoch": 3684} {"train_loss": -25.441144943237305, "global_step": 305812, "epoch": 3684} {"train_loss": -25.437360763549805, "global_step": 305813, "epoch": 3684} {"train_loss": -25.874914169311523, "global_step": 305814, "epoch": 3684} {"train_loss": -25.826574325561523, "global_step": 305815, "epoch": 3684} {"train_loss": -25.561534881591797, "global_step": 305816, "epoch": 3684} {"train_loss": -25.94748878479004, "global_step": 305817, "epoch": 3684} {"train_loss": -25.846200942993164, "global_step": 305818, "epoch": 3684} {"train_loss": -25.97292137145996, "global_step": 305819, "epoch": 3684} {"train_loss": -25.85807228088379, "global_step": 305820, "epoch": 3684} {"train_loss": -25.738357543945312, "global_step": 305821, "epoch": 3684} {"train_loss": -25.97579002380371, "global_step": 305822, "epoch": 3684} {"train_loss": -25.642276763916016, "global_step": 305823, "epoch": 3684} {"train_loss": -25.456600189208984, "global_step": 305824, "epoch": 3684} {"train_loss": -25.633087158203125, "global_step": 305825, "epoch": 3684} {"train_loss": -25.30771827697754, "global_step": 305826, "epoch": 3684} {"train_loss": -25.825468063354492, "global_step": 305827, "epoch": 3684} {"train_loss": -25.45219612121582, "global_step": 305828, "epoch": 3684} {"train_loss": -25.703033447265625, "global_step": 305829, "epoch": 3684} {"train_loss": -26.153589248657227, "global_step": 305830, "epoch": 3684} {"train_loss": -25.677549362182617, "global_step": 305831, "epoch": 3684} {"train_loss": -25.9068603515625, "global_step": 305832, "epoch": 3684} {"train_loss": -25.72519302368164, "global_step": 305833, "epoch": 3684} {"train_loss": -25.710683822631836, "global_step": 305834, "epoch": 3684} {"train_loss": -26.236860275268555, "global_step": 305835, "epoch": 3684} {"train_loss": -25.41156768798828, "global_step": 305836, "epoch": 3684} {"train_loss": -25.763187408447266, "global_step": 305837, "epoch": 3684} {"train_loss": -25.89788818359375, "global_step": 305838, "epoch": 3684} {"train_loss": -25.589014053344727, "global_step": 305839, "epoch": 3684} {"train_loss": -25.68208122253418, "global_step": 305840, "epoch": 3684} {"train_loss": -25.86897087097168, "global_step": 305841, "epoch": 3684} {"train_loss": -25.945966720581055, "global_step": 305842, "epoch": 3684} {"train_loss": -25.53667640686035, "global_step": 305843, "epoch": 3684} {"train_loss": -25.574419021606445, "global_step": 305844, "epoch": 3684} {"train_loss": -25.625980377197266, "global_step": 305845, "epoch": 3684} {"train_loss": -25.880239486694336, "global_step": 305846, "epoch": 3684} {"train_loss": -25.69422721862793, "global_step": 305847, "epoch": 3684} {"train_loss": -25.71632194519043, "global_step": 305848, "epoch": 3684} {"train_loss": -25.60886001586914, "global_step": 305849, "epoch": 3684} {"train_loss": -25.905210494995117, "global_step": 305850, "epoch": 3684} {"train_loss": -25.785367965698242, "global_step": 305851, "epoch": 3684} {"train_loss": -25.642200469970703, "global_step": 305852, "epoch": 3684} {"train_loss": -25.79888343811035, "global_step": 305853, "epoch": 3684} {"train_loss": -25.70523264321936, "global_step": 305854, "epoch": 3684, "val_loss": 7267787.0} {"train_loss": -25.53859519958496, "global_step": 305855, "epoch": 3685} {"train_loss": -25.6053524017334, "global_step": 305856, "epoch": 3685} {"train_loss": -24.877206802368164, "global_step": 305857, "epoch": 3685} {"train_loss": -25.40670394897461, "global_step": 305858, "epoch": 3685} {"train_loss": -25.065446853637695, "global_step": 305859, "epoch": 3685} {"train_loss": -25.15593147277832, "global_step": 305860, "epoch": 3685} {"train_loss": -25.37476348876953, "global_step": 305861, "epoch": 3685} {"train_loss": -25.30264663696289, "global_step": 305862, "epoch": 3685} {"train_loss": -25.098112106323242, "global_step": 305863, "epoch": 3685} {"train_loss": -25.10149574279785, "global_step": 305864, "epoch": 3685} {"train_loss": -25.598129272460938, "global_step": 305865, "epoch": 3685} {"train_loss": -25.48287582397461, "global_step": 305866, "epoch": 3685} {"train_loss": -25.087339401245117, "global_step": 305867, "epoch": 3685} {"train_loss": -25.556760787963867, "global_step": 305868, "epoch": 3685} {"train_loss": -25.413528442382812, "global_step": 305869, "epoch": 3685} {"train_loss": -25.392126083374023, "global_step": 305870, "epoch": 3685} {"train_loss": -25.4381160736084, "global_step": 305871, "epoch": 3685} {"train_loss": -25.522438049316406, "global_step": 305872, "epoch": 3685} {"train_loss": -25.453353881835938, "global_step": 305873, "epoch": 3685} {"train_loss": -25.311426162719727, "global_step": 305874, "epoch": 3685} {"train_loss": -25.229507446289062, "global_step": 305875, "epoch": 3685} {"train_loss": -25.361082077026367, "global_step": 305876, "epoch": 3685} {"train_loss": -25.216283798217773, "global_step": 305877, "epoch": 3685} {"train_loss": -25.65863609313965, "global_step": 305878, "epoch": 3685} {"train_loss": -25.484098434448242, "global_step": 305879, "epoch": 3685} {"train_loss": -25.38044548034668, "global_step": 305880, "epoch": 3685} {"train_loss": -25.54190444946289, "global_step": 305881, "epoch": 3685} {"train_loss": -25.61299705505371, "global_step": 305882, "epoch": 3685} {"train_loss": -25.583921432495117, "global_step": 305883, "epoch": 3685} {"train_loss": -25.555578231811523, "global_step": 305884, "epoch": 3685} {"train_loss": -25.309207916259766, "global_step": 305885, "epoch": 3685} {"train_loss": -25.381261825561523, "global_step": 305886, "epoch": 3685} {"train_loss": -25.323135375976562, "global_step": 305887, "epoch": 3685} {"train_loss": -25.808319091796875, "global_step": 305888, "epoch": 3685} {"train_loss": -26.025039672851562, "global_step": 305889, "epoch": 3685} {"train_loss": -25.679838180541992, "global_step": 305890, "epoch": 3685} {"train_loss": -25.324298858642578, "global_step": 305891, "epoch": 3685} {"train_loss": -25.766515731811523, "global_step": 305892, "epoch": 3685} {"train_loss": -25.812183380126953, "global_step": 305893, "epoch": 3685} {"train_loss": -25.361528396606445, "global_step": 305894, "epoch": 3685} {"train_loss": -25.781686782836914, "global_step": 305895, "epoch": 3685} {"train_loss": -25.6616268157959, "global_step": 305896, "epoch": 3685} {"train_loss": -25.890411376953125, "global_step": 305897, "epoch": 3685} {"train_loss": -25.970947265625, "global_step": 305898, "epoch": 3685} {"train_loss": -25.790435791015625, "global_step": 305899, "epoch": 3685} {"train_loss": -25.7425537109375, "global_step": 305900, "epoch": 3685} {"train_loss": -25.544275283813477, "global_step": 305901, "epoch": 3685} {"train_loss": -25.87122917175293, "global_step": 305902, "epoch": 3685} {"train_loss": -25.91077995300293, "global_step": 305903, "epoch": 3685} {"train_loss": -25.769094467163086, "global_step": 305904, "epoch": 3685} {"train_loss": -25.780441284179688, "global_step": 305905, "epoch": 3685} {"train_loss": -25.35396385192871, "global_step": 305906, "epoch": 3685} {"train_loss": -25.917478561401367, "global_step": 305907, "epoch": 3685} {"train_loss": -25.88107681274414, "global_step": 305908, "epoch": 3685} {"train_loss": -25.96881675720215, "global_step": 305909, "epoch": 3685} {"train_loss": -25.74469566345215, "global_step": 305910, "epoch": 3685} {"train_loss": -26.363330841064453, "global_step": 305911, "epoch": 3685} {"train_loss": -25.738306045532227, "global_step": 305912, "epoch": 3685} {"train_loss": -25.730405807495117, "global_step": 305913, "epoch": 3685} {"train_loss": -25.845273971557617, "global_step": 305914, "epoch": 3685} {"train_loss": -25.985916137695312, "global_step": 305915, "epoch": 3685} {"train_loss": -25.702030181884766, "global_step": 305916, "epoch": 3685} {"train_loss": -25.397621154785156, "global_step": 305917, "epoch": 3685} {"train_loss": -25.788782119750977, "global_step": 305918, "epoch": 3685} {"train_loss": -25.93204116821289, "global_step": 305919, "epoch": 3685} {"train_loss": -25.703094482421875, "global_step": 305920, "epoch": 3685} {"train_loss": -25.929615020751953, "global_step": 305921, "epoch": 3685} {"train_loss": -25.644811630249023, "global_step": 305922, "epoch": 3685} {"train_loss": -25.8579158782959, "global_step": 305923, "epoch": 3685} {"train_loss": -26.140518188476562, "global_step": 305924, "epoch": 3685} {"train_loss": -25.672758102416992, "global_step": 305925, "epoch": 3685} {"train_loss": -25.8297061920166, "global_step": 305926, "epoch": 3685} {"train_loss": -25.696142196655273, "global_step": 305927, "epoch": 3685} {"train_loss": -25.879150390625, "global_step": 305928, "epoch": 3685} {"train_loss": -25.8721866607666, "global_step": 305929, "epoch": 3685} {"train_loss": -25.843994140625, "global_step": 305930, "epoch": 3685} {"train_loss": -26.012378692626953, "global_step": 305931, "epoch": 3685} {"train_loss": -25.698169708251953, "global_step": 305932, "epoch": 3685} {"train_loss": -25.818206787109375, "global_step": 305933, "epoch": 3685} {"train_loss": -25.8068790435791, "global_step": 305934, "epoch": 3685} {"train_loss": -25.874786376953125, "global_step": 305935, "epoch": 3685} {"train_loss": -25.546894073486328, "global_step": 305936, "epoch": 3685} {"train_loss": -25.60920719928052, "global_step": 305937, "epoch": 3685, "val_loss": 7106903.0} {"train_loss": -22.74260902404785, "global_step": 305938, "epoch": 3686} {"train_loss": -23.573209762573242, "global_step": 305939, "epoch": 3686} {"train_loss": -24.183874130249023, "global_step": 305940, "epoch": 3686} {"train_loss": -24.104536056518555, "global_step": 305941, "epoch": 3686} {"train_loss": -24.109546661376953, "global_step": 305942, "epoch": 3686} {"train_loss": -24.574304580688477, "global_step": 305943, "epoch": 3686} {"train_loss": -24.652084350585938, "global_step": 305944, "epoch": 3686} {"train_loss": -24.7925968170166, "global_step": 305945, "epoch": 3686} {"train_loss": -25.01150894165039, "global_step": 305946, "epoch": 3686} {"train_loss": -24.12886619567871, "global_step": 305947, "epoch": 3686} {"train_loss": -24.782522201538086, "global_step": 305948, "epoch": 3686} {"train_loss": -24.771282196044922, "global_step": 305949, "epoch": 3686} {"train_loss": -24.923755645751953, "global_step": 305950, "epoch": 3686} {"train_loss": -24.821287155151367, "global_step": 305951, "epoch": 3686} {"train_loss": -24.865070343017578, "global_step": 305952, "epoch": 3686} {"train_loss": -24.9503231048584, "global_step": 305953, "epoch": 3686} {"train_loss": -24.983102798461914, "global_step": 305954, "epoch": 3686} {"train_loss": -24.949430465698242, "global_step": 305955, "epoch": 3686} {"train_loss": -25.211536407470703, "global_step": 305956, "epoch": 3686} {"train_loss": -25.174474716186523, "global_step": 305957, "epoch": 3686} {"train_loss": -25.32184410095215, "global_step": 305958, "epoch": 3686} {"train_loss": -25.499542236328125, "global_step": 305959, "epoch": 3686} {"train_loss": -25.069700241088867, "global_step": 305960, "epoch": 3686} {"train_loss": -25.24443244934082, "global_step": 305961, "epoch": 3686} {"train_loss": -25.406539916992188, "global_step": 305962, "epoch": 3686} {"train_loss": -25.266660690307617, "global_step": 305963, "epoch": 3686} {"train_loss": -25.275693893432617, "global_step": 305964, "epoch": 3686} {"train_loss": -25.71860694885254, "global_step": 305965, "epoch": 3686} {"train_loss": -25.127817153930664, "global_step": 305966, "epoch": 3686} {"train_loss": -25.322126388549805, "global_step": 305967, "epoch": 3686} {"train_loss": -25.496967315673828, "global_step": 305968, "epoch": 3686} {"train_loss": -25.240360260009766, "global_step": 305969, "epoch": 3686} {"train_loss": -25.459131240844727, "global_step": 305970, "epoch": 3686} {"train_loss": -25.3063907623291, "global_step": 305971, "epoch": 3686} {"train_loss": -25.752002716064453, "global_step": 305972, "epoch": 3686} {"train_loss": -25.59808921813965, "global_step": 305973, "epoch": 3686} {"train_loss": -25.803497314453125, "global_step": 305974, "epoch": 3686} {"train_loss": -25.833646774291992, "global_step": 305975, "epoch": 3686} {"train_loss": -25.775196075439453, "global_step": 305976, "epoch": 3686} {"train_loss": -25.725616455078125, "global_step": 305977, "epoch": 3686} {"train_loss": -25.46409034729004, "global_step": 305978, "epoch": 3686} {"train_loss": -25.727890014648438, "global_step": 305979, "epoch": 3686} {"train_loss": -25.88591957092285, "global_step": 305980, "epoch": 3686} {"train_loss": -25.789630889892578, "global_step": 305981, "epoch": 3686} {"train_loss": -26.088153839111328, "global_step": 305982, "epoch": 3686} {"train_loss": -26.109704971313477, "global_step": 305983, "epoch": 3686} {"train_loss": -25.872472763061523, "global_step": 305984, "epoch": 3686} {"train_loss": -25.444263458251953, "global_step": 305985, "epoch": 3686} {"train_loss": -25.671192169189453, "global_step": 305986, "epoch": 3686} {"train_loss": -25.437915802001953, "global_step": 305987, "epoch": 3686} {"train_loss": -25.73347282409668, "global_step": 305988, "epoch": 3686} {"train_loss": -25.547805786132812, "global_step": 305989, "epoch": 3686} {"train_loss": -26.209638595581055, "global_step": 305990, "epoch": 3686} {"train_loss": -25.951465606689453, "global_step": 305991, "epoch": 3686} {"train_loss": -26.052631378173828, "global_step": 305992, "epoch": 3686} {"train_loss": -26.265729904174805, "global_step": 305993, "epoch": 3686} {"train_loss": -25.904632568359375, "global_step": 305994, "epoch": 3686} {"train_loss": -25.935138702392578, "global_step": 305995, "epoch": 3686} {"train_loss": -25.618133544921875, "global_step": 305996, "epoch": 3686} {"train_loss": -25.902082443237305, "global_step": 305997, "epoch": 3686} {"train_loss": -25.703414916992188, "global_step": 305998, "epoch": 3686} {"train_loss": -26.0404109954834, "global_step": 305999, "epoch": 3686} {"train_loss": -24.95265769958496, "global_step": 306000, "epoch": 3686} {"train_loss": -25.347549438476562, "global_step": 306001, "epoch": 3686} {"train_loss": -25.69867515563965, "global_step": 306002, "epoch": 3686} {"train_loss": -24.829748153686523, "global_step": 306003, "epoch": 3686} {"train_loss": -25.2792911529541, "global_step": 306004, "epoch": 3686} {"train_loss": -25.441936492919922, "global_step": 306005, "epoch": 3686} {"train_loss": -25.55504608154297, "global_step": 306006, "epoch": 3686} {"train_loss": -25.736007690429688, "global_step": 306007, "epoch": 3686} {"train_loss": -25.56599235534668, "global_step": 306008, "epoch": 3686} {"train_loss": -25.591968536376953, "global_step": 306009, "epoch": 3686} {"train_loss": -25.325246810913086, "global_step": 306010, "epoch": 3686} {"train_loss": -25.600631713867188, "global_step": 306011, "epoch": 3686} {"train_loss": -25.5933895111084, "global_step": 306012, "epoch": 3686} {"train_loss": -25.287399291992188, "global_step": 306013, "epoch": 3686} {"train_loss": -25.9212589263916, "global_step": 306014, "epoch": 3686} {"train_loss": -25.462215423583984, "global_step": 306015, "epoch": 3686} {"train_loss": -25.58561134338379, "global_step": 306016, "epoch": 3686} {"train_loss": -25.804859161376953, "global_step": 306017, "epoch": 3686} {"train_loss": -25.702808380126953, "global_step": 306018, "epoch": 3686} {"train_loss": -25.817895889282227, "global_step": 306019, "epoch": 3686} {"train_loss": -25.35850129644555, "global_step": 306020, "epoch": 3686, "val_loss": 7159267.0} {"train_loss": -24.87141990661621, "global_step": 306021, "epoch": 3687} {"train_loss": -25.380231857299805, "global_step": 306022, "epoch": 3687} {"train_loss": -25.46397590637207, "global_step": 306023, "epoch": 3687} {"train_loss": -25.408309936523438, "global_step": 306024, "epoch": 3687} {"train_loss": -25.257734298706055, "global_step": 306025, "epoch": 3687} {"train_loss": -25.668542861938477, "global_step": 306026, "epoch": 3687} {"train_loss": -25.248825073242188, "global_step": 306027, "epoch": 3687} {"train_loss": -25.208791732788086, "global_step": 306028, "epoch": 3687} {"train_loss": -24.79390525817871, "global_step": 306029, "epoch": 3687} {"train_loss": -25.18744468688965, "global_step": 306030, "epoch": 3687} {"train_loss": -25.25823974609375, "global_step": 306031, "epoch": 3687} {"train_loss": -25.89723777770996, "global_step": 306032, "epoch": 3687} {"train_loss": -25.189722061157227, "global_step": 306033, "epoch": 3687} {"train_loss": -25.183517456054688, "global_step": 306034, "epoch": 3687} {"train_loss": -25.33013153076172, "global_step": 306035, "epoch": 3687} {"train_loss": -25.45258903503418, "global_step": 306036, "epoch": 3687} {"train_loss": -25.61097526550293, "global_step": 306037, "epoch": 3687} {"train_loss": -26.01578712463379, "global_step": 306038, "epoch": 3687} {"train_loss": -25.650104522705078, "global_step": 306039, "epoch": 3687} {"train_loss": -25.459308624267578, "global_step": 306040, "epoch": 3687} {"train_loss": -25.660140991210938, "global_step": 306041, "epoch": 3687} {"train_loss": -26.007110595703125, "global_step": 306042, "epoch": 3687} {"train_loss": -25.65743064880371, "global_step": 306043, "epoch": 3687} {"train_loss": -25.663043975830078, "global_step": 306044, "epoch": 3687} {"train_loss": -25.331928253173828, "global_step": 306045, "epoch": 3687} {"train_loss": -25.7023983001709, "global_step": 306046, "epoch": 3687} {"train_loss": -25.39340591430664, "global_step": 306047, "epoch": 3687} {"train_loss": -25.54374122619629, "global_step": 306048, "epoch": 3687} {"train_loss": -25.774621963500977, "global_step": 306049, "epoch": 3687} {"train_loss": -25.49800682067871, "global_step": 306050, "epoch": 3687} {"train_loss": -25.566221237182617, "global_step": 306051, "epoch": 3687} {"train_loss": -25.8208065032959, "global_step": 306052, "epoch": 3687} {"train_loss": -25.91016960144043, "global_step": 306053, "epoch": 3687} {"train_loss": -25.705860137939453, "global_step": 306054, "epoch": 3687} {"train_loss": -25.504484176635742, "global_step": 306055, "epoch": 3687} {"train_loss": -25.672021865844727, "global_step": 306056, "epoch": 3687} {"train_loss": -25.783384323120117, "global_step": 306057, "epoch": 3687} {"train_loss": -25.791595458984375, "global_step": 306058, "epoch": 3687} {"train_loss": -25.797651290893555, "global_step": 306059, "epoch": 3687} {"train_loss": -25.774988174438477, "global_step": 306060, "epoch": 3687} {"train_loss": -25.759973526000977, "global_step": 306061, "epoch": 3687} {"train_loss": -26.00345802307129, "global_step": 306062, "epoch": 3687} {"train_loss": -25.654428482055664, "global_step": 306063, "epoch": 3687} {"train_loss": -25.7395076751709, "global_step": 306064, "epoch": 3687} {"train_loss": -25.744367599487305, "global_step": 306065, "epoch": 3687} {"train_loss": -25.815128326416016, "global_step": 306066, "epoch": 3687} {"train_loss": -25.777313232421875, "global_step": 306067, "epoch": 3687} {"train_loss": -25.713979721069336, "global_step": 306068, "epoch": 3687} {"train_loss": -26.009321212768555, "global_step": 306069, "epoch": 3687} {"train_loss": -25.747512817382812, "global_step": 306070, "epoch": 3687} {"train_loss": -25.924909591674805, "global_step": 306071, "epoch": 3687} {"train_loss": -26.3348388671875, "global_step": 306072, "epoch": 3687} {"train_loss": -26.043432235717773, "global_step": 306073, "epoch": 3687} {"train_loss": -25.588735580444336, "global_step": 306074, "epoch": 3687} {"train_loss": -25.605224609375, "global_step": 306075, "epoch": 3687} {"train_loss": -25.675378799438477, "global_step": 306076, "epoch": 3687} {"train_loss": -25.964323043823242, "global_step": 306077, "epoch": 3687} {"train_loss": -25.2386531829834, "global_step": 306078, "epoch": 3687} {"train_loss": -25.909772872924805, "global_step": 306079, "epoch": 3687} {"train_loss": -25.792890548706055, "global_step": 306080, "epoch": 3687} {"train_loss": -25.699569702148438, "global_step": 306081, "epoch": 3687} {"train_loss": -25.667083740234375, "global_step": 306082, "epoch": 3687} {"train_loss": -25.67513084411621, "global_step": 306083, "epoch": 3687} {"train_loss": -26.013681411743164, "global_step": 306084, "epoch": 3687} {"train_loss": -25.670581817626953, "global_step": 306085, "epoch": 3687} {"train_loss": -26.005868911743164, "global_step": 306086, "epoch": 3687} {"train_loss": -25.670072555541992, "global_step": 306087, "epoch": 3687} {"train_loss": -25.618682861328125, "global_step": 306088, "epoch": 3687} {"train_loss": -25.744556427001953, "global_step": 306089, "epoch": 3687} {"train_loss": -25.7437801361084, "global_step": 306090, "epoch": 3687} {"train_loss": -25.848974227905273, "global_step": 306091, "epoch": 3687} {"train_loss": -25.869565963745117, "global_step": 306092, "epoch": 3687} {"train_loss": -25.867216110229492, "global_step": 306093, "epoch": 3687} {"train_loss": -25.928455352783203, "global_step": 306094, "epoch": 3687} {"train_loss": -25.672636032104492, "global_step": 306095, "epoch": 3687} {"train_loss": -25.382566452026367, "global_step": 306096, "epoch": 3687} {"train_loss": -25.9414119720459, "global_step": 306097, "epoch": 3687} {"train_loss": -25.873815536499023, "global_step": 306098, "epoch": 3687} {"train_loss": -26.0048885345459, "global_step": 306099, "epoch": 3687} {"train_loss": -26.183786392211914, "global_step": 306100, "epoch": 3687} {"train_loss": -25.82954978942871, "global_step": 306101, "epoch": 3687} {"train_loss": -25.824115753173828, "global_step": 306102, "epoch": 3687} {"train_loss": -25.66831129143037, "global_step": 306103, "epoch": 3687, "val_loss": 7177275.0} {"train_loss": -25.400819778442383, "global_step": 306104, "epoch": 3688} {"train_loss": -24.826889038085938, "global_step": 306105, "epoch": 3688} {"train_loss": -24.562612533569336, "global_step": 306106, "epoch": 3688} {"train_loss": -24.91428565979004, "global_step": 306107, "epoch": 3688} {"train_loss": -25.257156372070312, "global_step": 306108, "epoch": 3688} {"train_loss": -25.570642471313477, "global_step": 306109, "epoch": 3688} {"train_loss": -25.223392486572266, "global_step": 306110, "epoch": 3688} {"train_loss": -25.35694694519043, "global_step": 306111, "epoch": 3688} {"train_loss": -25.57192039489746, "global_step": 306112, "epoch": 3688} {"train_loss": -25.253847122192383, "global_step": 306113, "epoch": 3688} {"train_loss": -25.6097469329834, "global_step": 306114, "epoch": 3688} {"train_loss": -25.635761260986328, "global_step": 306115, "epoch": 3688} {"train_loss": -25.452014923095703, "global_step": 306116, "epoch": 3688} {"train_loss": -25.786909103393555, "global_step": 306117, "epoch": 3688} {"train_loss": -25.621658325195312, "global_step": 306118, "epoch": 3688} {"train_loss": -25.249582290649414, "global_step": 306119, "epoch": 3688} {"train_loss": -25.388208389282227, "global_step": 306120, "epoch": 3688} {"train_loss": -25.50349235534668, "global_step": 306121, "epoch": 3688} {"train_loss": -25.346372604370117, "global_step": 306122, "epoch": 3688} {"train_loss": -25.427122116088867, "global_step": 306123, "epoch": 3688} {"train_loss": -25.649133682250977, "global_step": 306124, "epoch": 3688} {"train_loss": -25.733423233032227, "global_step": 306125, "epoch": 3688} {"train_loss": -25.144990921020508, "global_step": 306126, "epoch": 3688} {"train_loss": -25.63972282409668, "global_step": 306127, "epoch": 3688} {"train_loss": -25.31263542175293, "global_step": 306128, "epoch": 3688} {"train_loss": -25.736352920532227, "global_step": 306129, "epoch": 3688} {"train_loss": -25.69391441345215, "global_step": 306130, "epoch": 3688} {"train_loss": -25.593961715698242, "global_step": 306131, "epoch": 3688} {"train_loss": -25.3947811126709, "global_step": 306132, "epoch": 3688} {"train_loss": -25.811933517456055, "global_step": 306133, "epoch": 3688} {"train_loss": -25.256824493408203, "global_step": 306134, "epoch": 3688} {"train_loss": -25.724720001220703, "global_step": 306135, "epoch": 3688} {"train_loss": -25.637786865234375, "global_step": 306136, "epoch": 3688} {"train_loss": -25.857709884643555, "global_step": 306137, "epoch": 3688} {"train_loss": -25.59633445739746, "global_step": 306138, "epoch": 3688} {"train_loss": -25.333967208862305, "global_step": 306139, "epoch": 3688} {"train_loss": -25.5906982421875, "global_step": 306140, "epoch": 3688} {"train_loss": -25.64570426940918, "global_step": 306141, "epoch": 3688} {"train_loss": -25.917438507080078, "global_step": 306142, "epoch": 3688} {"train_loss": -25.688650131225586, "global_step": 306143, "epoch": 3688} {"train_loss": -25.6507511138916, "global_step": 306144, "epoch": 3688} {"train_loss": -25.969995498657227, "global_step": 306145, "epoch": 3688} {"train_loss": -25.78330421447754, "global_step": 306146, "epoch": 3688} {"train_loss": -25.740400314331055, "global_step": 306147, "epoch": 3688} {"train_loss": -25.547388076782227, "global_step": 306148, "epoch": 3688} {"train_loss": -25.6418399810791, "global_step": 306149, "epoch": 3688} {"train_loss": -25.94024085998535, "global_step": 306150, "epoch": 3688} {"train_loss": -25.839208602905273, "global_step": 306151, "epoch": 3688} {"train_loss": -25.459495544433594, "global_step": 306152, "epoch": 3688} {"train_loss": -25.734710693359375, "global_step": 306153, "epoch": 3688} {"train_loss": -25.825653076171875, "global_step": 306154, "epoch": 3688} {"train_loss": -25.45381736755371, "global_step": 306155, "epoch": 3688} {"train_loss": -25.841663360595703, "global_step": 306156, "epoch": 3688} {"train_loss": -25.594892501831055, "global_step": 306157, "epoch": 3688} {"train_loss": -25.81144142150879, "global_step": 306158, "epoch": 3688} {"train_loss": -25.93006706237793, "global_step": 306159, "epoch": 3688} {"train_loss": -25.85438346862793, "global_step": 306160, "epoch": 3688} {"train_loss": -25.398778915405273, "global_step": 306161, "epoch": 3688} {"train_loss": -25.661304473876953, "global_step": 306162, "epoch": 3688} {"train_loss": -25.7709903717041, "global_step": 306163, "epoch": 3688} {"train_loss": -25.545345306396484, "global_step": 306164, "epoch": 3688} {"train_loss": -25.842529296875, "global_step": 306165, "epoch": 3688} {"train_loss": -25.898839950561523, "global_step": 306166, "epoch": 3688} {"train_loss": -25.58237075805664, "global_step": 306167, "epoch": 3688} {"train_loss": -25.596622467041016, "global_step": 306168, "epoch": 3688} {"train_loss": -26.134479522705078, "global_step": 306169, "epoch": 3688} {"train_loss": -25.51654624938965, "global_step": 306170, "epoch": 3688} {"train_loss": -26.144460678100586, "global_step": 306171, "epoch": 3688} {"train_loss": -25.41632652282715, "global_step": 306172, "epoch": 3688} {"train_loss": -25.580429077148438, "global_step": 306173, "epoch": 3688} {"train_loss": -25.53053092956543, "global_step": 306174, "epoch": 3688} {"train_loss": -25.4542293548584, "global_step": 306175, "epoch": 3688} {"train_loss": -25.75152015686035, "global_step": 306176, "epoch": 3688} {"train_loss": -25.945587158203125, "global_step": 306177, "epoch": 3688} {"train_loss": -25.966955184936523, "global_step": 306178, "epoch": 3688} {"train_loss": -25.84902000427246, "global_step": 306179, "epoch": 3688} {"train_loss": -25.61395835876465, "global_step": 306180, "epoch": 3688} {"train_loss": -25.90411949157715, "global_step": 306181, "epoch": 3688} {"train_loss": -25.53741455078125, "global_step": 306182, "epoch": 3688} {"train_loss": -25.402082443237305, "global_step": 306183, "epoch": 3688} {"train_loss": -25.991437911987305, "global_step": 306184, "epoch": 3688} {"train_loss": -26.04059410095215, "global_step": 306185, "epoch": 3688} {"train_loss": -25.606477484645612, "global_step": 306186, "epoch": 3688, "val_loss": 7141223.0} {"train_loss": -25.101308822631836, "global_step": 306187, "epoch": 3689} {"train_loss": -25.201379776000977, "global_step": 306188, "epoch": 3689} {"train_loss": -25.27107048034668, "global_step": 306189, "epoch": 3689} {"train_loss": -24.815702438354492, "global_step": 306190, "epoch": 3689} {"train_loss": -24.608837127685547, "global_step": 306191, "epoch": 3689} {"train_loss": -25.297016143798828, "global_step": 306192, "epoch": 3689} {"train_loss": -24.568439483642578, "global_step": 306193, "epoch": 3689} {"train_loss": -25.131624221801758, "global_step": 306194, "epoch": 3689} {"train_loss": -25.2929744720459, "global_step": 306195, "epoch": 3689} {"train_loss": -25.1090087890625, "global_step": 306196, "epoch": 3689} {"train_loss": -25.53254508972168, "global_step": 306197, "epoch": 3689} {"train_loss": -25.322952270507812, "global_step": 306198, "epoch": 3689} {"train_loss": -25.306583404541016, "global_step": 306199, "epoch": 3689} {"train_loss": -25.3594970703125, "global_step": 306200, "epoch": 3689} {"train_loss": -25.316003799438477, "global_step": 306201, "epoch": 3689} {"train_loss": -25.25667381286621, "global_step": 306202, "epoch": 3689} {"train_loss": -25.116910934448242, "global_step": 306203, "epoch": 3689} {"train_loss": -25.236730575561523, "global_step": 306204, "epoch": 3689} {"train_loss": -25.18899917602539, "global_step": 306205, "epoch": 3689} {"train_loss": -25.305925369262695, "global_step": 306206, "epoch": 3689} {"train_loss": -25.629175186157227, "global_step": 306207, "epoch": 3689} {"train_loss": -25.9457950592041, "global_step": 306208, "epoch": 3689} {"train_loss": -25.4466609954834, "global_step": 306209, "epoch": 3689} {"train_loss": -25.619129180908203, "global_step": 306210, "epoch": 3689} {"train_loss": -25.993804931640625, "global_step": 306211, "epoch": 3689} {"train_loss": -25.611181259155273, "global_step": 306212, "epoch": 3689} {"train_loss": -25.375293731689453, "global_step": 306213, "epoch": 3689} {"train_loss": -25.824689865112305, "global_step": 306214, "epoch": 3689} {"train_loss": -25.488754272460938, "global_step": 306215, "epoch": 3689} {"train_loss": -25.76947593688965, "global_step": 306216, "epoch": 3689} {"train_loss": -25.532623291015625, "global_step": 306217, "epoch": 3689} {"train_loss": -25.98499870300293, "global_step": 306218, "epoch": 3689} {"train_loss": -25.973011016845703, "global_step": 306219, "epoch": 3689} {"train_loss": -25.664642333984375, "global_step": 306220, "epoch": 3689} {"train_loss": -25.574844360351562, "global_step": 306221, "epoch": 3689} {"train_loss": -25.832401275634766, "global_step": 306222, "epoch": 3689} {"train_loss": -25.659698486328125, "global_step": 306223, "epoch": 3689} {"train_loss": -26.149845123291016, "global_step": 306224, "epoch": 3689} {"train_loss": -26.008407592773438, "global_step": 306225, "epoch": 3689} {"train_loss": -26.134765625, "global_step": 306226, "epoch": 3689} {"train_loss": -25.45771026611328, "global_step": 306227, "epoch": 3689} {"train_loss": -25.887510299682617, "global_step": 306228, "epoch": 3689} {"train_loss": -25.58684539794922, "global_step": 306229, "epoch": 3689} {"train_loss": -26.0578670501709, "global_step": 306230, "epoch": 3689} {"train_loss": -26.094085693359375, "global_step": 306231, "epoch": 3689} {"train_loss": -25.815832138061523, "global_step": 306232, "epoch": 3689} {"train_loss": -26.13385581970215, "global_step": 306233, "epoch": 3689} {"train_loss": -26.189483642578125, "global_step": 306234, "epoch": 3689} {"train_loss": -25.8392333984375, "global_step": 306235, "epoch": 3689} {"train_loss": -25.814817428588867, "global_step": 306236, "epoch": 3689} {"train_loss": -25.538740158081055, "global_step": 306237, "epoch": 3689} {"train_loss": -25.77589225769043, "global_step": 306238, "epoch": 3689} {"train_loss": -26.3253231048584, "global_step": 306239, "epoch": 3689} {"train_loss": -25.912128448486328, "global_step": 306240, "epoch": 3689} {"train_loss": -25.632160186767578, "global_step": 306241, "epoch": 3689} {"train_loss": -25.514291763305664, "global_step": 306242, "epoch": 3689} {"train_loss": -25.289703369140625, "global_step": 306243, "epoch": 3689} {"train_loss": -25.140581130981445, "global_step": 306244, "epoch": 3689} {"train_loss": -25.636621475219727, "global_step": 306245, "epoch": 3689} {"train_loss": -25.82630729675293, "global_step": 306246, "epoch": 3689} {"train_loss": -25.9403076171875, "global_step": 306247, "epoch": 3689} {"train_loss": -25.751407623291016, "global_step": 306248, "epoch": 3689} {"train_loss": -25.254924774169922, "global_step": 306249, "epoch": 3689} {"train_loss": -25.50153160095215, "global_step": 306250, "epoch": 3689} {"train_loss": -25.64006996154785, "global_step": 306251, "epoch": 3689} {"train_loss": -25.233407974243164, "global_step": 306252, "epoch": 3689} {"train_loss": -25.54781723022461, "global_step": 306253, "epoch": 3689} {"train_loss": -25.959522247314453, "global_step": 306254, "epoch": 3689} {"train_loss": -25.404001235961914, "global_step": 306255, "epoch": 3689} {"train_loss": -25.35892677307129, "global_step": 306256, "epoch": 3689} {"train_loss": -25.809345245361328, "global_step": 306257, "epoch": 3689} {"train_loss": -25.882307052612305, "global_step": 306258, "epoch": 3689} {"train_loss": -25.7108097076416, "global_step": 306259, "epoch": 3689} {"train_loss": -25.565969467163086, "global_step": 306260, "epoch": 3689} {"train_loss": -25.666275024414062, "global_step": 306261, "epoch": 3689} {"train_loss": -25.988744735717773, "global_step": 306262, "epoch": 3689} {"train_loss": -25.851789474487305, "global_step": 306263, "epoch": 3689} {"train_loss": -25.676000595092773, "global_step": 306264, "epoch": 3689} {"train_loss": -25.47858238220215, "global_step": 306265, "epoch": 3689} {"train_loss": -25.609134674072266, "global_step": 306266, "epoch": 3689} {"train_loss": -25.85865592956543, "global_step": 306267, "epoch": 3689} {"train_loss": -25.649179458618164, "global_step": 306268, "epoch": 3689} {"train_loss": -25.602250133652284, "global_step": 306269, "epoch": 3689, "val_loss": 7320654.0} {"train_loss": -25.215539932250977, "global_step": 306270, "epoch": 3690} {"train_loss": -25.24814796447754, "global_step": 306271, "epoch": 3690} {"train_loss": -25.183744430541992, "global_step": 306272, "epoch": 3690} {"train_loss": -24.907264709472656, "global_step": 306273, "epoch": 3690} {"train_loss": -25.071439743041992, "global_step": 306274, "epoch": 3690} {"train_loss": -24.94407844543457, "global_step": 306275, "epoch": 3690} {"train_loss": -25.618122100830078, "global_step": 306276, "epoch": 3690} {"train_loss": -25.336896896362305, "global_step": 306277, "epoch": 3690} {"train_loss": -25.341472625732422, "global_step": 306278, "epoch": 3690} {"train_loss": -25.24440574645996, "global_step": 306279, "epoch": 3690} {"train_loss": -25.6241512298584, "global_step": 306280, "epoch": 3690} {"train_loss": -25.172536849975586, "global_step": 306281, "epoch": 3690} {"train_loss": -25.53165626525879, "global_step": 306282, "epoch": 3690} {"train_loss": -25.545759201049805, "global_step": 306283, "epoch": 3690} {"train_loss": -25.413999557495117, "global_step": 306284, "epoch": 3690} {"train_loss": -25.57563591003418, "global_step": 306285, "epoch": 3690} {"train_loss": -25.475814819335938, "global_step": 306286, "epoch": 3690} {"train_loss": -25.462350845336914, "global_step": 306287, "epoch": 3690} {"train_loss": -25.61635398864746, "global_step": 306288, "epoch": 3690} {"train_loss": -25.16987419128418, "global_step": 306289, "epoch": 3690} {"train_loss": -25.646982192993164, "global_step": 306290, "epoch": 3690} {"train_loss": -25.693090438842773, "global_step": 306291, "epoch": 3690} {"train_loss": -26.078815460205078, "global_step": 306292, "epoch": 3690} {"train_loss": -25.778371810913086, "global_step": 306293, "epoch": 3690} {"train_loss": -25.38978385925293, "global_step": 306294, "epoch": 3690} {"train_loss": -25.593563079833984, "global_step": 306295, "epoch": 3690} {"train_loss": -25.490554809570312, "global_step": 306296, "epoch": 3690} {"train_loss": -25.687774658203125, "global_step": 306297, "epoch": 3690} {"train_loss": -25.764495849609375, "global_step": 306298, "epoch": 3690} {"train_loss": -25.6898136138916, "global_step": 306299, "epoch": 3690} {"train_loss": -25.848169326782227, "global_step": 306300, "epoch": 3690} {"train_loss": -25.611663818359375, "global_step": 306301, "epoch": 3690} {"train_loss": -25.372705459594727, "global_step": 306302, "epoch": 3690} {"train_loss": -25.878461837768555, "global_step": 306303, "epoch": 3690} {"train_loss": -25.6196231842041, "global_step": 306304, "epoch": 3690} {"train_loss": -26.006757736206055, "global_step": 306305, "epoch": 3690} {"train_loss": -25.38201904296875, "global_step": 306306, "epoch": 3690} {"train_loss": -25.619770050048828, "global_step": 306307, "epoch": 3690} {"train_loss": -25.48723793029785, "global_step": 306308, "epoch": 3690} {"train_loss": -25.590539932250977, "global_step": 306309, "epoch": 3690} {"train_loss": -25.498022079467773, "global_step": 306310, "epoch": 3690} {"train_loss": -25.640064239501953, "global_step": 306311, "epoch": 3690} {"train_loss": -25.601415634155273, "global_step": 306312, "epoch": 3690} {"train_loss": -25.9511775970459, "global_step": 306313, "epoch": 3690} {"train_loss": -25.89007568359375, "global_step": 306314, "epoch": 3690} {"train_loss": -25.666868209838867, "global_step": 306315, "epoch": 3690} {"train_loss": -25.808942794799805, "global_step": 306316, "epoch": 3690} {"train_loss": -25.74350929260254, "global_step": 306317, "epoch": 3690} {"train_loss": -25.93108558654785, "global_step": 306318, "epoch": 3690} {"train_loss": -26.042844772338867, "global_step": 306319, "epoch": 3690} {"train_loss": -25.64300537109375, "global_step": 306320, "epoch": 3690} {"train_loss": -25.847217559814453, "global_step": 306321, "epoch": 3690} {"train_loss": -25.60548210144043, "global_step": 306322, "epoch": 3690} {"train_loss": -25.56591033935547, "global_step": 306323, "epoch": 3690} {"train_loss": -26.182580947875977, "global_step": 306324, "epoch": 3690} {"train_loss": -25.97674560546875, "global_step": 306325, "epoch": 3690} {"train_loss": -25.685102462768555, "global_step": 306326, "epoch": 3690} {"train_loss": -25.972326278686523, "global_step": 306327, "epoch": 3690} {"train_loss": -25.79157829284668, "global_step": 306328, "epoch": 3690} {"train_loss": -25.80419921875, "global_step": 306329, "epoch": 3690} {"train_loss": -25.943445205688477, "global_step": 306330, "epoch": 3690} {"train_loss": -25.599355697631836, "global_step": 306331, "epoch": 3690} {"train_loss": -25.55572509765625, "global_step": 306332, "epoch": 3690} {"train_loss": -25.801959991455078, "global_step": 306333, "epoch": 3690} {"train_loss": -25.00996971130371, "global_step": 306334, "epoch": 3690} {"train_loss": -25.6651611328125, "global_step": 306335, "epoch": 3690} {"train_loss": -25.8194637298584, "global_step": 306336, "epoch": 3690} {"train_loss": -25.78387451171875, "global_step": 306337, "epoch": 3690} {"train_loss": -25.72995376586914, "global_step": 306338, "epoch": 3690} {"train_loss": -25.825626373291016, "global_step": 306339, "epoch": 3690} {"train_loss": -25.576255798339844, "global_step": 306340, "epoch": 3690} {"train_loss": -25.74894142150879, "global_step": 306341, "epoch": 3690} {"train_loss": -25.41449546813965, "global_step": 306342, "epoch": 3690} {"train_loss": -25.57048988342285, "global_step": 306343, "epoch": 3690} {"train_loss": -26.01649284362793, "global_step": 306344, "epoch": 3690} {"train_loss": -25.678144454956055, "global_step": 306345, "epoch": 3690} {"train_loss": -26.029306411743164, "global_step": 306346, "epoch": 3690} {"train_loss": -25.63685417175293, "global_step": 306347, "epoch": 3690} {"train_loss": -26.064990997314453, "global_step": 306348, "epoch": 3690} {"train_loss": -25.657724380493164, "global_step": 306349, "epoch": 3690} {"train_loss": -25.993005752563477, "global_step": 306350, "epoch": 3690} {"train_loss": -25.70467185974121, "global_step": 306351, "epoch": 3690} {"train_loss": -25.651020532631012, "global_step": 306352, "epoch": 3690, "val_loss": 7214007.0} {"train_loss": -25.260353088378906, "global_step": 306353, "epoch": 3691} {"train_loss": -25.300642013549805, "global_step": 306354, "epoch": 3691} {"train_loss": -25.44343376159668, "global_step": 306355, "epoch": 3691} {"train_loss": -25.4103946685791, "global_step": 306356, "epoch": 3691} {"train_loss": -25.339374542236328, "global_step": 306357, "epoch": 3691} {"train_loss": -25.196348190307617, "global_step": 306358, "epoch": 3691} {"train_loss": -25.408090591430664, "global_step": 306359, "epoch": 3691} {"train_loss": -25.322336196899414, "global_step": 306360, "epoch": 3691} {"train_loss": -25.4161434173584, "global_step": 306361, "epoch": 3691} {"train_loss": -26.01641273498535, "global_step": 306362, "epoch": 3691} {"train_loss": -25.542707443237305, "global_step": 306363, "epoch": 3691} {"train_loss": -25.782529830932617, "global_step": 306364, "epoch": 3691} {"train_loss": -25.29816246032715, "global_step": 306365, "epoch": 3691} {"train_loss": -25.674335479736328, "global_step": 306366, "epoch": 3691} {"train_loss": -25.6271915435791, "global_step": 306367, "epoch": 3691} {"train_loss": -25.3045597076416, "global_step": 306368, "epoch": 3691} {"train_loss": -25.4805908203125, "global_step": 306369, "epoch": 3691} {"train_loss": -25.95393180847168, "global_step": 306370, "epoch": 3691} {"train_loss": -25.379440307617188, "global_step": 306371, "epoch": 3691} {"train_loss": -25.847524642944336, "global_step": 306372, "epoch": 3691} {"train_loss": -25.588491439819336, "global_step": 306373, "epoch": 3691} {"train_loss": -25.539844512939453, "global_step": 306374, "epoch": 3691} {"train_loss": -26.126483917236328, "global_step": 306375, "epoch": 3691} {"train_loss": -25.596464157104492, "global_step": 306376, "epoch": 3691} {"train_loss": -25.5784854888916, "global_step": 306377, "epoch": 3691} {"train_loss": -25.38983726501465, "global_step": 306378, "epoch": 3691} {"train_loss": -25.663349151611328, "global_step": 306379, "epoch": 3691} {"train_loss": -25.857892990112305, "global_step": 306380, "epoch": 3691} {"train_loss": -25.742938995361328, "global_step": 306381, "epoch": 3691} {"train_loss": -25.64874839782715, "global_step": 306382, "epoch": 3691} {"train_loss": -25.84716796875, "global_step": 306383, "epoch": 3691} {"train_loss": -25.923843383789062, "global_step": 306384, "epoch": 3691} {"train_loss": -25.78468132019043, "global_step": 306385, "epoch": 3691} {"train_loss": -25.511947631835938, "global_step": 306386, "epoch": 3691} {"train_loss": -25.27943992614746, "global_step": 306387, "epoch": 3691} {"train_loss": -25.710840225219727, "global_step": 306388, "epoch": 3691} {"train_loss": -25.382858276367188, "global_step": 306389, "epoch": 3691} {"train_loss": -25.920673370361328, "global_step": 306390, "epoch": 3691} {"train_loss": -25.805328369140625, "global_step": 306391, "epoch": 3691} {"train_loss": -25.62175941467285, "global_step": 306392, "epoch": 3691} {"train_loss": -25.3559627532959, "global_step": 306393, "epoch": 3691} {"train_loss": -25.41336441040039, "global_step": 306394, "epoch": 3691} {"train_loss": -25.67701530456543, "global_step": 306395, "epoch": 3691} {"train_loss": -25.874486923217773, "global_step": 306396, "epoch": 3691} {"train_loss": -25.136133193969727, "global_step": 306397, "epoch": 3691} {"train_loss": -25.538394927978516, "global_step": 306398, "epoch": 3691} {"train_loss": -25.3319091796875, "global_step": 306399, "epoch": 3691} {"train_loss": -25.572221755981445, "global_step": 306400, "epoch": 3691} {"train_loss": -25.345979690551758, "global_step": 306401, "epoch": 3691} {"train_loss": -25.41029930114746, "global_step": 306402, "epoch": 3691} {"train_loss": -25.95606803894043, "global_step": 306403, "epoch": 3691} {"train_loss": -25.267385482788086, "global_step": 306404, "epoch": 3691} {"train_loss": -25.53987693786621, "global_step": 306405, "epoch": 3691} {"train_loss": -25.926944732666016, "global_step": 306406, "epoch": 3691} {"train_loss": -25.49393081665039, "global_step": 306407, "epoch": 3691} {"train_loss": -25.560237884521484, "global_step": 306408, "epoch": 3691} {"train_loss": -25.90412712097168, "global_step": 306409, "epoch": 3691} {"train_loss": -25.79123306274414, "global_step": 306410, "epoch": 3691} {"train_loss": -25.973569869995117, "global_step": 306411, "epoch": 3691} {"train_loss": -25.834857940673828, "global_step": 306412, "epoch": 3691} {"train_loss": -25.683429718017578, "global_step": 306413, "epoch": 3691} {"train_loss": -25.81998062133789, "global_step": 306414, "epoch": 3691} {"train_loss": -25.497339248657227, "global_step": 306415, "epoch": 3691} {"train_loss": -25.964405059814453, "global_step": 306416, "epoch": 3691} {"train_loss": -25.69693946838379, "global_step": 306417, "epoch": 3691} {"train_loss": -25.702314376831055, "global_step": 306418, "epoch": 3691} {"train_loss": -26.118871688842773, "global_step": 306419, "epoch": 3691} {"train_loss": -26.056262969970703, "global_step": 306420, "epoch": 3691} {"train_loss": -25.70427894592285, "global_step": 306421, "epoch": 3691} {"train_loss": -25.65690040588379, "global_step": 306422, "epoch": 3691} {"train_loss": -25.885730743408203, "global_step": 306423, "epoch": 3691} {"train_loss": -25.564714431762695, "global_step": 306424, "epoch": 3691} {"train_loss": -25.569334030151367, "global_step": 306425, "epoch": 3691} {"train_loss": -25.749591827392578, "global_step": 306426, "epoch": 3691} {"train_loss": -25.653228759765625, "global_step": 306427, "epoch": 3691} {"train_loss": -25.233413696289062, "global_step": 306428, "epoch": 3691} {"train_loss": -25.846710205078125, "global_step": 306429, "epoch": 3691} {"train_loss": -25.702316284179688, "global_step": 306430, "epoch": 3691} {"train_loss": -25.863861083984375, "global_step": 306431, "epoch": 3691} {"train_loss": -25.6109619140625, "global_step": 306432, "epoch": 3691} {"train_loss": -25.791229248046875, "global_step": 306433, "epoch": 3691} {"train_loss": -25.929468154907227, "global_step": 306434, "epoch": 3691} {"train_loss": -25.638671875, "global_step": 306435, "epoch": 3691, "val_loss": 7147223.5} {"train_loss": -25.377403259277344, "global_step": 306436, "epoch": 3692} {"train_loss": -25.30000114440918, "global_step": 306437, "epoch": 3692} {"train_loss": -25.60291862487793, "global_step": 306438, "epoch": 3692} {"train_loss": -25.33318328857422, "global_step": 306439, "epoch": 3692} {"train_loss": -25.140974044799805, "global_step": 306440, "epoch": 3692} {"train_loss": -25.19894027709961, "global_step": 306441, "epoch": 3692} {"train_loss": -25.061735153198242, "global_step": 306442, "epoch": 3692} {"train_loss": -25.590978622436523, "global_step": 306443, "epoch": 3692} {"train_loss": -25.220457077026367, "global_step": 306444, "epoch": 3692} {"train_loss": -25.13903045654297, "global_step": 306445, "epoch": 3692} {"train_loss": -24.992568969726562, "global_step": 306446, "epoch": 3692} {"train_loss": -25.47657585144043, "global_step": 306447, "epoch": 3692} {"train_loss": -25.198789596557617, "global_step": 306448, "epoch": 3692} {"train_loss": -25.47490882873535, "global_step": 306449, "epoch": 3692} {"train_loss": -25.900115966796875, "global_step": 306450, "epoch": 3692} {"train_loss": -25.570180892944336, "global_step": 306451, "epoch": 3692} {"train_loss": -25.356361389160156, "global_step": 306452, "epoch": 3692} {"train_loss": -25.238483428955078, "global_step": 306453, "epoch": 3692} {"train_loss": -25.508258819580078, "global_step": 306454, "epoch": 3692} {"train_loss": -25.593320846557617, "global_step": 306455, "epoch": 3692} {"train_loss": -25.433679580688477, "global_step": 306456, "epoch": 3692} {"train_loss": -25.242019653320312, "global_step": 306457, "epoch": 3692} {"train_loss": -25.332136154174805, "global_step": 306458, "epoch": 3692} {"train_loss": -25.1818904876709, "global_step": 306459, "epoch": 3692} {"train_loss": -25.682287216186523, "global_step": 306460, "epoch": 3692} {"train_loss": -25.32948875427246, "global_step": 306461, "epoch": 3692} {"train_loss": -25.19766616821289, "global_step": 306462, "epoch": 3692} {"train_loss": -25.729093551635742, "global_step": 306463, "epoch": 3692} {"train_loss": -25.467144012451172, "global_step": 306464, "epoch": 3692} {"train_loss": -25.536190032958984, "global_step": 306465, "epoch": 3692} {"train_loss": -25.148427963256836, "global_step": 306466, "epoch": 3692} {"train_loss": -25.548480987548828, "global_step": 306467, "epoch": 3692} {"train_loss": -25.518569946289062, "global_step": 306468, "epoch": 3692} {"train_loss": -25.40976905822754, "global_step": 306469, "epoch": 3692} {"train_loss": -25.12225914001465, "global_step": 306470, "epoch": 3692} {"train_loss": -25.78509521484375, "global_step": 306471, "epoch": 3692} {"train_loss": -25.66144371032715, "global_step": 306472, "epoch": 3692} {"train_loss": -25.40821647644043, "global_step": 306473, "epoch": 3692} {"train_loss": -25.99188232421875, "global_step": 306474, "epoch": 3692} {"train_loss": -25.626718521118164, "global_step": 306475, "epoch": 3692} {"train_loss": -25.603952407836914, "global_step": 306476, "epoch": 3692} {"train_loss": -25.818588256835938, "global_step": 306477, "epoch": 3692} {"train_loss": -25.362844467163086, "global_step": 306478, "epoch": 3692} {"train_loss": -25.400196075439453, "global_step": 306479, "epoch": 3692} {"train_loss": -25.990234375, "global_step": 306480, "epoch": 3692} {"train_loss": -25.526405334472656, "global_step": 306481, "epoch": 3692} {"train_loss": -25.810333251953125, "global_step": 306482, "epoch": 3692} {"train_loss": -25.314332962036133, "global_step": 306483, "epoch": 3692} {"train_loss": -25.688730239868164, "global_step": 306484, "epoch": 3692} {"train_loss": -25.925342559814453, "global_step": 306485, "epoch": 3692} {"train_loss": -26.13262939453125, "global_step": 306486, "epoch": 3692} {"train_loss": -25.667593002319336, "global_step": 306487, "epoch": 3692} {"train_loss": -25.637170791625977, "global_step": 306488, "epoch": 3692} {"train_loss": -25.637939453125, "global_step": 306489, "epoch": 3692} {"train_loss": -25.96192741394043, "global_step": 306490, "epoch": 3692} {"train_loss": -25.81319236755371, "global_step": 306491, "epoch": 3692} {"train_loss": -25.62652015686035, "global_step": 306492, "epoch": 3692} {"train_loss": -25.73931884765625, "global_step": 306493, "epoch": 3692} {"train_loss": -25.78466796875, "global_step": 306494, "epoch": 3692} {"train_loss": -25.8898983001709, "global_step": 306495, "epoch": 3692} {"train_loss": -25.88144874572754, "global_step": 306496, "epoch": 3692} {"train_loss": -25.970062255859375, "global_step": 306497, "epoch": 3692} {"train_loss": -25.308916091918945, "global_step": 306498, "epoch": 3692} {"train_loss": -25.34417152404785, "global_step": 306499, "epoch": 3692} {"train_loss": -25.504087448120117, "global_step": 306500, "epoch": 3692} {"train_loss": -26.016284942626953, "global_step": 306501, "epoch": 3692} {"train_loss": -25.542932510375977, "global_step": 306502, "epoch": 3692} {"train_loss": -25.36838722229004, "global_step": 306503, "epoch": 3692} {"train_loss": -25.9184513092041, "global_step": 306504, "epoch": 3692} {"train_loss": -25.30776023864746, "global_step": 306505, "epoch": 3692} {"train_loss": -25.582399368286133, "global_step": 306506, "epoch": 3692} {"train_loss": -25.541967391967773, "global_step": 306507, "epoch": 3692} {"train_loss": -25.86832618713379, "global_step": 306508, "epoch": 3692} {"train_loss": -25.690221786499023, "global_step": 306509, "epoch": 3692} {"train_loss": -25.666894912719727, "global_step": 306510, "epoch": 3692} {"train_loss": -25.538724899291992, "global_step": 306511, "epoch": 3692} {"train_loss": -25.32138442993164, "global_step": 306512, "epoch": 3692} {"train_loss": -25.405902862548828, "global_step": 306513, "epoch": 3692} {"train_loss": -25.875349044799805, "global_step": 306514, "epoch": 3692} {"train_loss": -25.57613182067871, "global_step": 306515, "epoch": 3692} {"train_loss": -24.771121978759766, "global_step": 306516, "epoch": 3692} {"train_loss": -25.336790084838867, "global_step": 306517, "epoch": 3692} {"train_loss": -25.53524210366858, "global_step": 306518, "epoch": 3692, "val_loss": 7330159.0} {"train_loss": -24.71306800842285, "global_step": 306519, "epoch": 3693} {"train_loss": -25.555822372436523, "global_step": 306520, "epoch": 3693} {"train_loss": -24.892038345336914, "global_step": 306521, "epoch": 3693} {"train_loss": -25.24698829650879, "global_step": 306522, "epoch": 3693} {"train_loss": -24.759849548339844, "global_step": 306523, "epoch": 3693} {"train_loss": -25.22644805908203, "global_step": 306524, "epoch": 3693} {"train_loss": -24.903186798095703, "global_step": 306525, "epoch": 3693} {"train_loss": -25.59400749206543, "global_step": 306526, "epoch": 3693} {"train_loss": -25.2153377532959, "global_step": 306527, "epoch": 3693} {"train_loss": -25.308841705322266, "global_step": 306528, "epoch": 3693} {"train_loss": -25.57706069946289, "global_step": 306529, "epoch": 3693} {"train_loss": -25.37709617614746, "global_step": 306530, "epoch": 3693} {"train_loss": -25.322830200195312, "global_step": 306531, "epoch": 3693} {"train_loss": -25.224769592285156, "global_step": 306532, "epoch": 3693} {"train_loss": -25.694183349609375, "global_step": 306533, "epoch": 3693} {"train_loss": -25.61713218688965, "global_step": 306534, "epoch": 3693} {"train_loss": -25.512027740478516, "global_step": 306535, "epoch": 3693} {"train_loss": -25.874500274658203, "global_step": 306536, "epoch": 3693} {"train_loss": -25.96736717224121, "global_step": 306537, "epoch": 3693} {"train_loss": -25.613630294799805, "global_step": 306538, "epoch": 3693} {"train_loss": -25.728666305541992, "global_step": 306539, "epoch": 3693} {"train_loss": -25.603927612304688, "global_step": 306540, "epoch": 3693} {"train_loss": -25.50658416748047, "global_step": 306541, "epoch": 3693} {"train_loss": -25.552719116210938, "global_step": 306542, "epoch": 3693} {"train_loss": -25.630849838256836, "global_step": 306543, "epoch": 3693} {"train_loss": -25.35615348815918, "global_step": 306544, "epoch": 3693} {"train_loss": -26.046110153198242, "global_step": 306545, "epoch": 3693} {"train_loss": -25.95277214050293, "global_step": 306546, "epoch": 3693} {"train_loss": -25.85328483581543, "global_step": 306547, "epoch": 3693} {"train_loss": -25.534177780151367, "global_step": 306548, "epoch": 3693} {"train_loss": -26.008026123046875, "global_step": 306549, "epoch": 3693} {"train_loss": -25.883237838745117, "global_step": 306550, "epoch": 3693} {"train_loss": -25.721166610717773, "global_step": 306551, "epoch": 3693} {"train_loss": -25.779972076416016, "global_step": 306552, "epoch": 3693} {"train_loss": -25.858530044555664, "global_step": 306553, "epoch": 3693} {"train_loss": -25.699460983276367, "global_step": 306554, "epoch": 3693} {"train_loss": -25.45039939880371, "global_step": 306555, "epoch": 3693} {"train_loss": -25.612890243530273, "global_step": 306556, "epoch": 3693} {"train_loss": -25.658954620361328, "global_step": 306557, "epoch": 3693} {"train_loss": -26.032690048217773, "global_step": 306558, "epoch": 3693} {"train_loss": -25.39448356628418, "global_step": 306559, "epoch": 3693} {"train_loss": -25.73479652404785, "global_step": 306560, "epoch": 3693} {"train_loss": -26.012128829956055, "global_step": 306561, "epoch": 3693} {"train_loss": -25.898853302001953, "global_step": 306562, "epoch": 3693} {"train_loss": -25.952774047851562, "global_step": 306563, "epoch": 3693} {"train_loss": -25.763158798217773, "global_step": 306564, "epoch": 3693} {"train_loss": -26.159677505493164, "global_step": 306565, "epoch": 3693} {"train_loss": -25.54739761352539, "global_step": 306566, "epoch": 3693} {"train_loss": -25.779218673706055, "global_step": 306567, "epoch": 3693} {"train_loss": -26.095930099487305, "global_step": 306568, "epoch": 3693} {"train_loss": -25.737775802612305, "global_step": 306569, "epoch": 3693} {"train_loss": -25.948749542236328, "global_step": 306570, "epoch": 3693} {"train_loss": -25.438535690307617, "global_step": 306571, "epoch": 3693} {"train_loss": -25.579633712768555, "global_step": 306572, "epoch": 3693} {"train_loss": -25.75457191467285, "global_step": 306573, "epoch": 3693} {"train_loss": -25.585790634155273, "global_step": 306574, "epoch": 3693} {"train_loss": -25.862462997436523, "global_step": 306575, "epoch": 3693} {"train_loss": -25.45471954345703, "global_step": 306576, "epoch": 3693} {"train_loss": -25.732929229736328, "global_step": 306577, "epoch": 3693} {"train_loss": -25.81809425354004, "global_step": 306578, "epoch": 3693} {"train_loss": -25.613622665405273, "global_step": 306579, "epoch": 3693} {"train_loss": -25.83656883239746, "global_step": 306580, "epoch": 3693} {"train_loss": -25.82552146911621, "global_step": 306581, "epoch": 3693} {"train_loss": -25.6896915435791, "global_step": 306582, "epoch": 3693} {"train_loss": -25.473636627197266, "global_step": 306583, "epoch": 3693} {"train_loss": -26.171356201171875, "global_step": 306584, "epoch": 3693} {"train_loss": -25.42078971862793, "global_step": 306585, "epoch": 3693} {"train_loss": -25.763446807861328, "global_step": 306586, "epoch": 3693} {"train_loss": -26.099328994750977, "global_step": 306587, "epoch": 3693} {"train_loss": -25.564958572387695, "global_step": 306588, "epoch": 3693} {"train_loss": -25.80020523071289, "global_step": 306589, "epoch": 3693} {"train_loss": -25.945148468017578, "global_step": 306590, "epoch": 3693} {"train_loss": -25.915618896484375, "global_step": 306591, "epoch": 3693} {"train_loss": -25.79107093811035, "global_step": 306592, "epoch": 3693} {"train_loss": -25.476402282714844, "global_step": 306593, "epoch": 3693} {"train_loss": -25.852069854736328, "global_step": 306594, "epoch": 3693} {"train_loss": -25.7576961517334, "global_step": 306595, "epoch": 3693} {"train_loss": -25.571533203125, "global_step": 306596, "epoch": 3693} {"train_loss": -25.554386138916016, "global_step": 306597, "epoch": 3693} {"train_loss": -25.673410415649414, "global_step": 306598, "epoch": 3693} {"train_loss": -25.930713653564453, "global_step": 306599, "epoch": 3693} {"train_loss": -26.078580856323242, "global_step": 306600, "epoch": 3693} {"train_loss": -25.6550430619573, "global_step": 306601, "epoch": 3693, "val_loss": 7291693.0} {"train_loss": -25.781614303588867, "global_step": 306602, "epoch": 3694} {"train_loss": -25.31495475769043, "global_step": 306603, "epoch": 3694} {"train_loss": -25.330947875976562, "global_step": 306604, "epoch": 3694} {"train_loss": -25.449182510375977, "global_step": 306605, "epoch": 3694} {"train_loss": -25.350065231323242, "global_step": 306606, "epoch": 3694} {"train_loss": -25.635400772094727, "global_step": 306607, "epoch": 3694} {"train_loss": -25.911840438842773, "global_step": 306608, "epoch": 3694} {"train_loss": -25.61835289001465, "global_step": 306609, "epoch": 3694} {"train_loss": -25.435836791992188, "global_step": 306610, "epoch": 3694} {"train_loss": -25.391435623168945, "global_step": 306611, "epoch": 3694} {"train_loss": -25.817182540893555, "global_step": 306612, "epoch": 3694} {"train_loss": -25.44212532043457, "global_step": 306613, "epoch": 3694} {"train_loss": -25.760282516479492, "global_step": 306614, "epoch": 3694} {"train_loss": -25.895666122436523, "global_step": 306615, "epoch": 3694} {"train_loss": -25.405317306518555, "global_step": 306616, "epoch": 3694} {"train_loss": -25.83477783203125, "global_step": 306617, "epoch": 3694} {"train_loss": -25.576078414916992, "global_step": 306618, "epoch": 3694} {"train_loss": -25.929441452026367, "global_step": 306619, "epoch": 3694} {"train_loss": -26.04465103149414, "global_step": 306620, "epoch": 3694} {"train_loss": -25.298574447631836, "global_step": 306621, "epoch": 3694} {"train_loss": -25.251577377319336, "global_step": 306622, "epoch": 3694} {"train_loss": -25.7206974029541, "global_step": 306623, "epoch": 3694} {"train_loss": -25.532855987548828, "global_step": 306624, "epoch": 3694} {"train_loss": -25.676929473876953, "global_step": 306625, "epoch": 3694} {"train_loss": -25.6954345703125, "global_step": 306626, "epoch": 3694} {"train_loss": -26.005023956298828, "global_step": 306627, "epoch": 3694} {"train_loss": -25.742023468017578, "global_step": 306628, "epoch": 3694} {"train_loss": -26.149341583251953, "global_step": 306629, "epoch": 3694} {"train_loss": -25.832244873046875, "global_step": 306630, "epoch": 3694} {"train_loss": -25.7020263671875, "global_step": 306631, "epoch": 3694} {"train_loss": -25.480844497680664, "global_step": 306632, "epoch": 3694} {"train_loss": -25.700361251831055, "global_step": 306633, "epoch": 3694} {"train_loss": -25.93367576599121, "global_step": 306634, "epoch": 3694} {"train_loss": -25.748523712158203, "global_step": 306635, "epoch": 3694} {"train_loss": -25.53501319885254, "global_step": 306636, "epoch": 3694} {"train_loss": -25.657968521118164, "global_step": 306637, "epoch": 3694} {"train_loss": -25.430166244506836, "global_step": 306638, "epoch": 3694} {"train_loss": -25.885251998901367, "global_step": 306639, "epoch": 3694} {"train_loss": -25.849607467651367, "global_step": 306640, "epoch": 3694} {"train_loss": -25.59038543701172, "global_step": 306641, "epoch": 3694} {"train_loss": -26.066192626953125, "global_step": 306642, "epoch": 3694} {"train_loss": -25.950397491455078, "global_step": 306643, "epoch": 3694} {"train_loss": -25.812353134155273, "global_step": 306644, "epoch": 3694} {"train_loss": -25.776641845703125, "global_step": 306645, "epoch": 3694} {"train_loss": -25.783823013305664, "global_step": 306646, "epoch": 3694} {"train_loss": -25.85560417175293, "global_step": 306647, "epoch": 3694} {"train_loss": -26.141626358032227, "global_step": 306648, "epoch": 3694} {"train_loss": -25.52669334411621, "global_step": 306649, "epoch": 3694} {"train_loss": -25.515541076660156, "global_step": 306650, "epoch": 3694} {"train_loss": -25.5732479095459, "global_step": 306651, "epoch": 3694} {"train_loss": -25.46500587463379, "global_step": 306652, "epoch": 3694} {"train_loss": -24.809152603149414, "global_step": 306653, "epoch": 3694} {"train_loss": -25.213363647460938, "global_step": 306654, "epoch": 3694} {"train_loss": -25.72559928894043, "global_step": 306655, "epoch": 3694} {"train_loss": -25.499624252319336, "global_step": 306656, "epoch": 3694} {"train_loss": -24.8017578125, "global_step": 306657, "epoch": 3694} {"train_loss": -25.595378875732422, "global_step": 306658, "epoch": 3694} {"train_loss": -25.433778762817383, "global_step": 306659, "epoch": 3694} {"train_loss": -24.93988609313965, "global_step": 306660, "epoch": 3694} {"train_loss": -25.196643829345703, "global_step": 306661, "epoch": 3694} {"train_loss": -25.740442276000977, "global_step": 306662, "epoch": 3694} {"train_loss": -25.49808120727539, "global_step": 306663, "epoch": 3694} {"train_loss": -25.346769332885742, "global_step": 306664, "epoch": 3694} {"train_loss": -25.53401756286621, "global_step": 306665, "epoch": 3694} {"train_loss": -25.928503036499023, "global_step": 306666, "epoch": 3694} {"train_loss": -25.640121459960938, "global_step": 306667, "epoch": 3694} {"train_loss": -25.722675323486328, "global_step": 306668, "epoch": 3694} {"train_loss": -25.71257972717285, "global_step": 306669, "epoch": 3694} {"train_loss": -25.87933349609375, "global_step": 306670, "epoch": 3694} {"train_loss": -25.67323112487793, "global_step": 306671, "epoch": 3694} {"train_loss": -25.79554557800293, "global_step": 306672, "epoch": 3694} {"train_loss": -25.622953414916992, "global_step": 306673, "epoch": 3694} {"train_loss": -25.760828018188477, "global_step": 306674, "epoch": 3694} {"train_loss": -25.952930450439453, "global_step": 306675, "epoch": 3694} {"train_loss": -25.79715919494629, "global_step": 306676, "epoch": 3694} {"train_loss": -25.705108642578125, "global_step": 306677, "epoch": 3694} {"train_loss": -25.995756149291992, "global_step": 306678, "epoch": 3694} {"train_loss": -25.78901481628418, "global_step": 306679, "epoch": 3694} {"train_loss": -25.595407485961914, "global_step": 306680, "epoch": 3694} {"train_loss": -25.943115234375, "global_step": 306681, "epoch": 3694} {"train_loss": -25.932226181030273, "global_step": 306682, "epoch": 3694} {"train_loss": -25.962329864501953, "global_step": 306683, "epoch": 3694} {"train_loss": -25.66382506956537, "global_step": 306684, "epoch": 3694, "val_loss": 7204949.0} {"train_loss": -25.25830078125, "global_step": 306685, "epoch": 3695} {"train_loss": -25.526124954223633, "global_step": 306686, "epoch": 3695} {"train_loss": -25.29593849182129, "global_step": 306687, "epoch": 3695} {"train_loss": -25.39668846130371, "global_step": 306688, "epoch": 3695} {"train_loss": -25.60700798034668, "global_step": 306689, "epoch": 3695} {"train_loss": -25.70484733581543, "global_step": 306690, "epoch": 3695} {"train_loss": -25.441709518432617, "global_step": 306691, "epoch": 3695} {"train_loss": -25.6750545501709, "global_step": 306692, "epoch": 3695} {"train_loss": -25.59168815612793, "global_step": 306693, "epoch": 3695} {"train_loss": -25.53831672668457, "global_step": 306694, "epoch": 3695} {"train_loss": -25.333860397338867, "global_step": 306695, "epoch": 3695} {"train_loss": -25.90860366821289, "global_step": 306696, "epoch": 3695} {"train_loss": -25.3686580657959, "global_step": 306697, "epoch": 3695} {"train_loss": -25.563840866088867, "global_step": 306698, "epoch": 3695} {"train_loss": -25.869434356689453, "global_step": 306699, "epoch": 3695} {"train_loss": -25.549442291259766, "global_step": 306700, "epoch": 3695} {"train_loss": -25.49703025817871, "global_step": 306701, "epoch": 3695} {"train_loss": -25.87293815612793, "global_step": 306702, "epoch": 3695} {"train_loss": -26.050703048706055, "global_step": 306703, "epoch": 3695} {"train_loss": -25.829574584960938, "global_step": 306704, "epoch": 3695} {"train_loss": -25.577688217163086, "global_step": 306705, "epoch": 3695} {"train_loss": -25.840978622436523, "global_step": 306706, "epoch": 3695} {"train_loss": -25.456600189208984, "global_step": 306707, "epoch": 3695} {"train_loss": -25.86395263671875, "global_step": 306708, "epoch": 3695} {"train_loss": -25.737354278564453, "global_step": 306709, "epoch": 3695} {"train_loss": -25.584314346313477, "global_step": 306710, "epoch": 3695} {"train_loss": -26.103036880493164, "global_step": 306711, "epoch": 3695} {"train_loss": -25.704792022705078, "global_step": 306712, "epoch": 3695} {"train_loss": -25.62222671508789, "global_step": 306713, "epoch": 3695} {"train_loss": -26.027170181274414, "global_step": 306714, "epoch": 3695} {"train_loss": -25.675397872924805, "global_step": 306715, "epoch": 3695} {"train_loss": -25.535524368286133, "global_step": 306716, "epoch": 3695} {"train_loss": -25.636693954467773, "global_step": 306717, "epoch": 3695} {"train_loss": -25.57769775390625, "global_step": 306718, "epoch": 3695} {"train_loss": -25.715341567993164, "global_step": 306719, "epoch": 3695} {"train_loss": -25.513992309570312, "global_step": 306720, "epoch": 3695} {"train_loss": -25.7825870513916, "global_step": 306721, "epoch": 3695} {"train_loss": -25.472238540649414, "global_step": 306722, "epoch": 3695} {"train_loss": -25.70819664001465, "global_step": 306723, "epoch": 3695} {"train_loss": -25.7662410736084, "global_step": 306724, "epoch": 3695} {"train_loss": -24.918224334716797, "global_step": 306725, "epoch": 3695} {"train_loss": -25.20531463623047, "global_step": 306726, "epoch": 3695} {"train_loss": -25.985553741455078, "global_step": 306727, "epoch": 3695} {"train_loss": -25.40877342224121, "global_step": 306728, "epoch": 3695} {"train_loss": -25.7252197265625, "global_step": 306729, "epoch": 3695} {"train_loss": -25.69915771484375, "global_step": 306730, "epoch": 3695} {"train_loss": -25.212289810180664, "global_step": 306731, "epoch": 3695} {"train_loss": -25.600492477416992, "global_step": 306732, "epoch": 3695} {"train_loss": -25.250865936279297, "global_step": 306733, "epoch": 3695} {"train_loss": -25.651981353759766, "global_step": 306734, "epoch": 3695} {"train_loss": -25.480253219604492, "global_step": 306735, "epoch": 3695} {"train_loss": -25.63071632385254, "global_step": 306736, "epoch": 3695} {"train_loss": -25.482900619506836, "global_step": 306737, "epoch": 3695} {"train_loss": -25.60489845275879, "global_step": 306738, "epoch": 3695} {"train_loss": -25.52518081665039, "global_step": 306739, "epoch": 3695} {"train_loss": -25.517423629760742, "global_step": 306740, "epoch": 3695} {"train_loss": -25.60660743713379, "global_step": 306741, "epoch": 3695} {"train_loss": -25.843341827392578, "global_step": 306742, "epoch": 3695} {"train_loss": -25.86411476135254, "global_step": 306743, "epoch": 3695} {"train_loss": -25.48992347717285, "global_step": 306744, "epoch": 3695} {"train_loss": -25.268125534057617, "global_step": 306745, "epoch": 3695} {"train_loss": -25.84391212463379, "global_step": 306746, "epoch": 3695} {"train_loss": -25.569150924682617, "global_step": 306747, "epoch": 3695} {"train_loss": -25.9638671875, "global_step": 306748, "epoch": 3695} {"train_loss": -25.569334030151367, "global_step": 306749, "epoch": 3695} {"train_loss": -25.6561222076416, "global_step": 306750, "epoch": 3695} {"train_loss": -26.048603057861328, "global_step": 306751, "epoch": 3695} {"train_loss": -25.498205184936523, "global_step": 306752, "epoch": 3695} {"train_loss": -26.11676597595215, "global_step": 306753, "epoch": 3695} {"train_loss": -25.542997360229492, "global_step": 306754, "epoch": 3695} {"train_loss": -25.9864501953125, "global_step": 306755, "epoch": 3695} {"train_loss": -25.73907470703125, "global_step": 306756, "epoch": 3695} {"train_loss": -25.639062881469727, "global_step": 306757, "epoch": 3695} {"train_loss": -25.602060317993164, "global_step": 306758, "epoch": 3695} {"train_loss": -25.815866470336914, "global_step": 306759, "epoch": 3695} {"train_loss": -25.823835372924805, "global_step": 306760, "epoch": 3695} {"train_loss": -25.785419464111328, "global_step": 306761, "epoch": 3695} {"train_loss": -25.641315460205078, "global_step": 306762, "epoch": 3695} {"train_loss": -25.654184341430664, "global_step": 306763, "epoch": 3695} {"train_loss": -25.75653648376465, "global_step": 306764, "epoch": 3695} {"train_loss": -25.94696044921875, "global_step": 306765, "epoch": 3695} {"train_loss": -25.65673828125, "global_step": 306766, "epoch": 3695} {"train_loss": -25.655399414430182, "global_step": 306767, "epoch": 3695, "val_loss": 7250679.0} {"train_loss": -25.05649185180664, "global_step": 306768, "epoch": 3696} {"train_loss": -24.072067260742188, "global_step": 306769, "epoch": 3696} {"train_loss": -24.119359970092773, "global_step": 306770, "epoch": 3696} {"train_loss": -24.490097045898438, "global_step": 306771, "epoch": 3696} {"train_loss": -24.799001693725586, "global_step": 306772, "epoch": 3696} {"train_loss": -24.1075382232666, "global_step": 306773, "epoch": 3696} {"train_loss": -25.01898193359375, "global_step": 306774, "epoch": 3696} {"train_loss": -24.70466423034668, "global_step": 306775, "epoch": 3696} {"train_loss": -25.37810707092285, "global_step": 306776, "epoch": 3696} {"train_loss": -24.554004669189453, "global_step": 306777, "epoch": 3696} {"train_loss": -25.194425582885742, "global_step": 306778, "epoch": 3696} {"train_loss": -24.86439323425293, "global_step": 306779, "epoch": 3696} {"train_loss": -25.20779800415039, "global_step": 306780, "epoch": 3696} {"train_loss": -25.097909927368164, "global_step": 306781, "epoch": 3696} {"train_loss": -25.197683334350586, "global_step": 306782, "epoch": 3696} {"train_loss": -25.08277702331543, "global_step": 306783, "epoch": 3696} {"train_loss": -25.57282066345215, "global_step": 306784, "epoch": 3696} {"train_loss": -25.2618408203125, "global_step": 306785, "epoch": 3696} {"train_loss": -25.30364990234375, "global_step": 306786, "epoch": 3696} {"train_loss": -25.683547973632812, "global_step": 306787, "epoch": 3696} {"train_loss": -25.397825241088867, "global_step": 306788, "epoch": 3696} {"train_loss": -25.09571647644043, "global_step": 306789, "epoch": 3696} {"train_loss": -25.742639541625977, "global_step": 306790, "epoch": 3696} {"train_loss": -25.39552116394043, "global_step": 306791, "epoch": 3696} {"train_loss": -25.44312858581543, "global_step": 306792, "epoch": 3696} {"train_loss": -25.457937240600586, "global_step": 306793, "epoch": 3696} {"train_loss": -25.345203399658203, "global_step": 306794, "epoch": 3696} {"train_loss": -25.765478134155273, "global_step": 306795, "epoch": 3696} {"train_loss": -25.80653190612793, "global_step": 306796, "epoch": 3696} {"train_loss": -25.617780685424805, "global_step": 306797, "epoch": 3696} {"train_loss": -25.987995147705078, "global_step": 306798, "epoch": 3696} {"train_loss": -25.852792739868164, "global_step": 306799, "epoch": 3696} {"train_loss": -25.76910972595215, "global_step": 306800, "epoch": 3696} {"train_loss": -25.817060470581055, "global_step": 306801, "epoch": 3696} {"train_loss": -25.390722274780273, "global_step": 306802, "epoch": 3696} {"train_loss": -25.81062126159668, "global_step": 306803, "epoch": 3696} {"train_loss": -26.171873092651367, "global_step": 306804, "epoch": 3696} {"train_loss": -25.618762969970703, "global_step": 306805, "epoch": 3696} {"train_loss": -26.0115909576416, "global_step": 306806, "epoch": 3696} {"train_loss": -25.77577018737793, "global_step": 306807, "epoch": 3696} {"train_loss": -25.96640396118164, "global_step": 306808, "epoch": 3696} {"train_loss": -25.79690933227539, "global_step": 306809, "epoch": 3696} {"train_loss": -25.932209014892578, "global_step": 306810, "epoch": 3696} {"train_loss": -25.87192153930664, "global_step": 306811, "epoch": 3696} {"train_loss": -25.72437858581543, "global_step": 306812, "epoch": 3696} {"train_loss": -25.581274032592773, "global_step": 306813, "epoch": 3696} {"train_loss": -26.0289306640625, "global_step": 306814, "epoch": 3696} {"train_loss": -25.987028121948242, "global_step": 306815, "epoch": 3696} {"train_loss": -25.92365074157715, "global_step": 306816, "epoch": 3696} {"train_loss": -25.5472412109375, "global_step": 306817, "epoch": 3696} {"train_loss": -25.848058700561523, "global_step": 306818, "epoch": 3696} {"train_loss": -26.08416748046875, "global_step": 306819, "epoch": 3696} {"train_loss": -25.945104598999023, "global_step": 306820, "epoch": 3696} {"train_loss": -26.057348251342773, "global_step": 306821, "epoch": 3696} {"train_loss": -25.84345054626465, "global_step": 306822, "epoch": 3696} {"train_loss": -26.142248153686523, "global_step": 306823, "epoch": 3696} {"train_loss": -25.543411254882812, "global_step": 306824, "epoch": 3696} {"train_loss": -25.659515380859375, "global_step": 306825, "epoch": 3696} {"train_loss": -25.563323974609375, "global_step": 306826, "epoch": 3696} {"train_loss": -25.99993324279785, "global_step": 306827, "epoch": 3696} {"train_loss": -25.68214225769043, "global_step": 306828, "epoch": 3696} {"train_loss": -25.987340927124023, "global_step": 306829, "epoch": 3696} {"train_loss": -25.605222702026367, "global_step": 306830, "epoch": 3696} {"train_loss": -25.61441421508789, "global_step": 306831, "epoch": 3696} {"train_loss": -25.057403564453125, "global_step": 306832, "epoch": 3696} {"train_loss": -25.548051834106445, "global_step": 306833, "epoch": 3696} {"train_loss": -25.451196670532227, "global_step": 306834, "epoch": 3696} {"train_loss": -25.548105239868164, "global_step": 306835, "epoch": 3696} {"train_loss": -25.405685424804688, "global_step": 306836, "epoch": 3696} {"train_loss": -25.659427642822266, "global_step": 306837, "epoch": 3696} {"train_loss": -25.35396385192871, "global_step": 306838, "epoch": 3696} {"train_loss": -25.30640983581543, "global_step": 306839, "epoch": 3696} {"train_loss": -25.513980865478516, "global_step": 306840, "epoch": 3696} {"train_loss": -24.935428619384766, "global_step": 306841, "epoch": 3696} {"train_loss": -25.39935874938965, "global_step": 306842, "epoch": 3696} {"train_loss": -25.641986846923828, "global_step": 306843, "epoch": 3696} {"train_loss": -25.73357582092285, "global_step": 306844, "epoch": 3696} {"train_loss": -25.53461265563965, "global_step": 306845, "epoch": 3696} {"train_loss": -25.541894912719727, "global_step": 306846, "epoch": 3696} {"train_loss": -25.704965591430664, "global_step": 306847, "epoch": 3696} {"train_loss": -25.359228134155273, "global_step": 306848, "epoch": 3696} {"train_loss": -25.88470458984375, "global_step": 306849, "epoch": 3696} {"train_loss": -25.50201289625053, "global_step": 306850, "epoch": 3696, "val_loss": 7237872.0} {"train_loss": -25.368616104125977, "global_step": 306851, "epoch": 3697} {"train_loss": -25.722415924072266, "global_step": 306852, "epoch": 3697} {"train_loss": -25.594953536987305, "global_step": 306853, "epoch": 3697} {"train_loss": -25.498212814331055, "global_step": 306854, "epoch": 3697} {"train_loss": -25.01374053955078, "global_step": 306855, "epoch": 3697} {"train_loss": -25.628753662109375, "global_step": 306856, "epoch": 3697} {"train_loss": -25.7051944732666, "global_step": 306857, "epoch": 3697} {"train_loss": -25.144346237182617, "global_step": 306858, "epoch": 3697} {"train_loss": -25.508745193481445, "global_step": 306859, "epoch": 3697} {"train_loss": -25.372987747192383, "global_step": 306860, "epoch": 3697} {"train_loss": -25.060256958007812, "global_step": 306861, "epoch": 3697} {"train_loss": -25.28087615966797, "global_step": 306862, "epoch": 3697} {"train_loss": -25.51224136352539, "global_step": 306863, "epoch": 3697} {"train_loss": -25.44574546813965, "global_step": 306864, "epoch": 3697} {"train_loss": -25.47566032409668, "global_step": 306865, "epoch": 3697} {"train_loss": -25.667856216430664, "global_step": 306866, "epoch": 3697} {"train_loss": -25.805410385131836, "global_step": 306867, "epoch": 3697} {"train_loss": -25.249298095703125, "global_step": 306868, "epoch": 3697} {"train_loss": -25.484155654907227, "global_step": 306869, "epoch": 3697} {"train_loss": -25.505666732788086, "global_step": 306870, "epoch": 3697} {"train_loss": -25.33600616455078, "global_step": 306871, "epoch": 3697} {"train_loss": -25.5058536529541, "global_step": 306872, "epoch": 3697} {"train_loss": -25.80354118347168, "global_step": 306873, "epoch": 3697} {"train_loss": -25.257295608520508, "global_step": 306874, "epoch": 3697} {"train_loss": -25.57261848449707, "global_step": 306875, "epoch": 3697} {"train_loss": -25.51493263244629, "global_step": 306876, "epoch": 3697} {"train_loss": -25.329586029052734, "global_step": 306877, "epoch": 3697} {"train_loss": -25.636926651000977, "global_step": 306878, "epoch": 3697} {"train_loss": -25.563215255737305, "global_step": 306879, "epoch": 3697} {"train_loss": -25.461044311523438, "global_step": 306880, "epoch": 3697} {"train_loss": -25.683094024658203, "global_step": 306881, "epoch": 3697} {"train_loss": -25.27714729309082, "global_step": 306882, "epoch": 3697} {"train_loss": -25.5867919921875, "global_step": 306883, "epoch": 3697} {"train_loss": -25.30539321899414, "global_step": 306884, "epoch": 3697} {"train_loss": -25.824506759643555, "global_step": 306885, "epoch": 3697} {"train_loss": -25.51960563659668, "global_step": 306886, "epoch": 3697} {"train_loss": -25.573026657104492, "global_step": 306887, "epoch": 3697} {"train_loss": -25.710241317749023, "global_step": 306888, "epoch": 3697} {"train_loss": -25.70541763305664, "global_step": 306889, "epoch": 3697} {"train_loss": -25.986133575439453, "global_step": 306890, "epoch": 3697} {"train_loss": -25.586902618408203, "global_step": 306891, "epoch": 3697} {"train_loss": -25.104692459106445, "global_step": 306892, "epoch": 3697} {"train_loss": -25.719058990478516, "global_step": 306893, "epoch": 3697} {"train_loss": -25.740705490112305, "global_step": 306894, "epoch": 3697} {"train_loss": -25.901264190673828, "global_step": 306895, "epoch": 3697} {"train_loss": -25.86703872680664, "global_step": 306896, "epoch": 3697} {"train_loss": -25.786273956298828, "global_step": 306897, "epoch": 3697} {"train_loss": -25.56904411315918, "global_step": 306898, "epoch": 3697} {"train_loss": -25.92767906188965, "global_step": 306899, "epoch": 3697} {"train_loss": -25.72028923034668, "global_step": 306900, "epoch": 3697} {"train_loss": -25.873981475830078, "global_step": 306901, "epoch": 3697} {"train_loss": -26.229883193969727, "global_step": 306902, "epoch": 3697} {"train_loss": -25.84747886657715, "global_step": 306903, "epoch": 3697} {"train_loss": -25.738666534423828, "global_step": 306904, "epoch": 3697} {"train_loss": -25.72783851623535, "global_step": 306905, "epoch": 3697} {"train_loss": -25.753055572509766, "global_step": 306906, "epoch": 3697} {"train_loss": -26.002897262573242, "global_step": 306907, "epoch": 3697} {"train_loss": -25.965805053710938, "global_step": 306908, "epoch": 3697} {"train_loss": -25.8114013671875, "global_step": 306909, "epoch": 3697} {"train_loss": -25.90873146057129, "global_step": 306910, "epoch": 3697} {"train_loss": -25.815475463867188, "global_step": 306911, "epoch": 3697} {"train_loss": -26.0483341217041, "global_step": 306912, "epoch": 3697} {"train_loss": -25.328351974487305, "global_step": 306913, "epoch": 3697} {"train_loss": -25.78407096862793, "global_step": 306914, "epoch": 3697} {"train_loss": -25.543664932250977, "global_step": 306915, "epoch": 3697} {"train_loss": -25.66187858581543, "global_step": 306916, "epoch": 3697} {"train_loss": -25.643186569213867, "global_step": 306917, "epoch": 3697} {"train_loss": -25.586427688598633, "global_step": 306918, "epoch": 3697} {"train_loss": -26.031055450439453, "global_step": 306919, "epoch": 3697} {"train_loss": -25.668350219726562, "global_step": 306920, "epoch": 3697} {"train_loss": -25.40216636657715, "global_step": 306921, "epoch": 3697} {"train_loss": -25.73773193359375, "global_step": 306922, "epoch": 3697} {"train_loss": -25.413293838500977, "global_step": 306923, "epoch": 3697} {"train_loss": -25.64130210876465, "global_step": 306924, "epoch": 3697} {"train_loss": -25.940185546875, "global_step": 306925, "epoch": 3697} {"train_loss": -25.3504695892334, "global_step": 306926, "epoch": 3697} {"train_loss": -24.663719177246094, "global_step": 306927, "epoch": 3697} {"train_loss": -25.02816390991211, "global_step": 306928, "epoch": 3697} {"train_loss": -25.514867782592773, "global_step": 306929, "epoch": 3697} {"train_loss": -25.20854949951172, "global_step": 306930, "epoch": 3697} {"train_loss": -24.41718101501465, "global_step": 306931, "epoch": 3697} {"train_loss": -25.157474517822266, "global_step": 306932, "epoch": 3697} {"train_loss": -25.561543200389448, "global_step": 306933, "epoch": 3697, "val_loss": 7217899.0} {"train_loss": -24.592243194580078, "global_step": 306934, "epoch": 3698} {"train_loss": -24.92386245727539, "global_step": 306935, "epoch": 3698} {"train_loss": -24.30226707458496, "global_step": 306936, "epoch": 3698} {"train_loss": -24.18684959411621, "global_step": 306937, "epoch": 3698} {"train_loss": -24.81110954284668, "global_step": 306938, "epoch": 3698} {"train_loss": -24.220870971679688, "global_step": 306939, "epoch": 3698} {"train_loss": -24.62146759033203, "global_step": 306940, "epoch": 3698} {"train_loss": -24.912179946899414, "global_step": 306941, "epoch": 3698} {"train_loss": -24.915071487426758, "global_step": 306942, "epoch": 3698} {"train_loss": -24.910253524780273, "global_step": 306943, "epoch": 3698} {"train_loss": -24.998872756958008, "global_step": 306944, "epoch": 3698} {"train_loss": -24.762100219726562, "global_step": 306945, "epoch": 3698} {"train_loss": -25.164995193481445, "global_step": 306946, "epoch": 3698} {"train_loss": -25.210596084594727, "global_step": 306947, "epoch": 3698} {"train_loss": -24.81909942626953, "global_step": 306948, "epoch": 3698} {"train_loss": -25.206937789916992, "global_step": 306949, "epoch": 3698} {"train_loss": -24.713794708251953, "global_step": 306950, "epoch": 3698} {"train_loss": -25.395109176635742, "global_step": 306951, "epoch": 3698} {"train_loss": -25.11627769470215, "global_step": 306952, "epoch": 3698} {"train_loss": -25.028783798217773, "global_step": 306953, "epoch": 3698} {"train_loss": -25.452423095703125, "global_step": 306954, "epoch": 3698} {"train_loss": -24.78632926940918, "global_step": 306955, "epoch": 3698} {"train_loss": -25.017820358276367, "global_step": 306956, "epoch": 3698} {"train_loss": -25.173702239990234, "global_step": 306957, "epoch": 3698} {"train_loss": -25.486968994140625, "global_step": 306958, "epoch": 3698} {"train_loss": -25.770166397094727, "global_step": 306959, "epoch": 3698} {"train_loss": -25.249631881713867, "global_step": 306960, "epoch": 3698} {"train_loss": -25.310569763183594, "global_step": 306961, "epoch": 3698} {"train_loss": -25.521100997924805, "global_step": 306962, "epoch": 3698} {"train_loss": -25.53192710876465, "global_step": 306963, "epoch": 3698} {"train_loss": -25.366079330444336, "global_step": 306964, "epoch": 3698} {"train_loss": -25.566999435424805, "global_step": 306965, "epoch": 3698} {"train_loss": -25.5787296295166, "global_step": 306966, "epoch": 3698} {"train_loss": -25.761219024658203, "global_step": 306967, "epoch": 3698} {"train_loss": -25.432771682739258, "global_step": 306968, "epoch": 3698} {"train_loss": -25.685840606689453, "global_step": 306969, "epoch": 3698} {"train_loss": -25.954797744750977, "global_step": 306970, "epoch": 3698} {"train_loss": -25.810224533081055, "global_step": 306971, "epoch": 3698} {"train_loss": -25.71711540222168, "global_step": 306972, "epoch": 3698} {"train_loss": -25.7080135345459, "global_step": 306973, "epoch": 3698} {"train_loss": -25.89918327331543, "global_step": 306974, "epoch": 3698} {"train_loss": -25.940387725830078, "global_step": 306975, "epoch": 3698} {"train_loss": -25.8524112701416, "global_step": 306976, "epoch": 3698} {"train_loss": -25.832239151000977, "global_step": 306977, "epoch": 3698} {"train_loss": -25.724924087524414, "global_step": 306978, "epoch": 3698} {"train_loss": -26.054031372070312, "global_step": 306979, "epoch": 3698} {"train_loss": -26.1757755279541, "global_step": 306980, "epoch": 3698} {"train_loss": -25.511823654174805, "global_step": 306981, "epoch": 3698} {"train_loss": -26.06748390197754, "global_step": 306982, "epoch": 3698} {"train_loss": -25.928251266479492, "global_step": 306983, "epoch": 3698} {"train_loss": -26.14208984375, "global_step": 306984, "epoch": 3698} {"train_loss": -26.077564239501953, "global_step": 306985, "epoch": 3698} {"train_loss": -25.872785568237305, "global_step": 306986, "epoch": 3698} {"train_loss": -25.6434326171875, "global_step": 306987, "epoch": 3698} {"train_loss": -25.989789962768555, "global_step": 306988, "epoch": 3698} {"train_loss": -25.428525924682617, "global_step": 306989, "epoch": 3698} {"train_loss": -25.638967514038086, "global_step": 306990, "epoch": 3698} {"train_loss": -25.76901626586914, "global_step": 306991, "epoch": 3698} {"train_loss": -25.78822135925293, "global_step": 306992, "epoch": 3698} {"train_loss": -25.7893009185791, "global_step": 306993, "epoch": 3698} {"train_loss": -25.523181915283203, "global_step": 306994, "epoch": 3698} {"train_loss": -25.651294708251953, "global_step": 306995, "epoch": 3698} {"train_loss": -25.5579833984375, "global_step": 306996, "epoch": 3698} {"train_loss": -26.08685302734375, "global_step": 306997, "epoch": 3698} {"train_loss": -25.542837142944336, "global_step": 306998, "epoch": 3698} {"train_loss": -25.700361251831055, "global_step": 306999, "epoch": 3698} {"train_loss": -25.86042594909668, "global_step": 307000, "epoch": 3698} {"train_loss": -25.75644874572754, "global_step": 307001, "epoch": 3698} {"train_loss": -25.484487533569336, "global_step": 307002, "epoch": 3698} {"train_loss": -25.97344398498535, "global_step": 307003, "epoch": 3698} {"train_loss": -25.813159942626953, "global_step": 307004, "epoch": 3698} {"train_loss": -25.510845184326172, "global_step": 307005, "epoch": 3698} {"train_loss": -25.613492965698242, "global_step": 307006, "epoch": 3698} {"train_loss": -25.988523483276367, "global_step": 307007, "epoch": 3698} {"train_loss": -25.587902069091797, "global_step": 307008, "epoch": 3698} {"train_loss": -25.45149803161621, "global_step": 307009, "epoch": 3698} {"train_loss": -25.630615234375, "global_step": 307010, "epoch": 3698} {"train_loss": -25.41468620300293, "global_step": 307011, "epoch": 3698} {"train_loss": -26.198657989501953, "global_step": 307012, "epoch": 3698} {"train_loss": -25.751951217651367, "global_step": 307013, "epoch": 3698} {"train_loss": -25.613544464111328, "global_step": 307014, "epoch": 3698} {"train_loss": -25.3740291595459, "global_step": 307015, "epoch": 3698} {"train_loss": -25.488546900002355, "global_step": 307016, "epoch": 3698, "val_loss": 7252669.0} {"train_loss": -24.209733963012695, "global_step": 307017, "epoch": 3699} {"train_loss": -25.28835105895996, "global_step": 307018, "epoch": 3699} {"train_loss": -24.95806312561035, "global_step": 307019, "epoch": 3699} {"train_loss": -25.129667282104492, "global_step": 307020, "epoch": 3699} {"train_loss": -25.09351921081543, "global_step": 307021, "epoch": 3699} {"train_loss": -25.361343383789062, "global_step": 307022, "epoch": 3699} {"train_loss": -25.066242218017578, "global_step": 307023, "epoch": 3699} {"train_loss": -25.159303665161133, "global_step": 307024, "epoch": 3699} {"train_loss": -25.51952362060547, "global_step": 307025, "epoch": 3699} {"train_loss": -25.349233627319336, "global_step": 307026, "epoch": 3699} {"train_loss": -25.27113914489746, "global_step": 307027, "epoch": 3699} {"train_loss": -25.34670066833496, "global_step": 307028, "epoch": 3699} {"train_loss": -25.637826919555664, "global_step": 307029, "epoch": 3699} {"train_loss": -25.528980255126953, "global_step": 307030, "epoch": 3699} {"train_loss": -25.409082412719727, "global_step": 307031, "epoch": 3699} {"train_loss": -25.759244918823242, "global_step": 307032, "epoch": 3699} {"train_loss": -25.575101852416992, "global_step": 307033, "epoch": 3699} {"train_loss": -25.19776725769043, "global_step": 307034, "epoch": 3699} {"train_loss": -25.701404571533203, "global_step": 307035, "epoch": 3699} {"train_loss": -25.546104431152344, "global_step": 307036, "epoch": 3699} {"train_loss": -25.8651180267334, "global_step": 307037, "epoch": 3699} {"train_loss": -25.590713500976562, "global_step": 307038, "epoch": 3699} {"train_loss": -25.81812858581543, "global_step": 307039, "epoch": 3699} {"train_loss": -25.401447296142578, "global_step": 307040, "epoch": 3699} {"train_loss": -25.64307975769043, "global_step": 307041, "epoch": 3699} {"train_loss": -25.520526885986328, "global_step": 307042, "epoch": 3699} {"train_loss": -25.386877059936523, "global_step": 307043, "epoch": 3699} {"train_loss": -25.519746780395508, "global_step": 307044, "epoch": 3699} {"train_loss": -25.938983917236328, "global_step": 307045, "epoch": 3699} {"train_loss": -26.062963485717773, "global_step": 307046, "epoch": 3699} {"train_loss": -25.883970260620117, "global_step": 307047, "epoch": 3699} {"train_loss": -25.613489151000977, "global_step": 307048, "epoch": 3699} {"train_loss": -26.022613525390625, "global_step": 307049, "epoch": 3699} {"train_loss": -25.923383712768555, "global_step": 307050, "epoch": 3699} {"train_loss": -25.690662384033203, "global_step": 307051, "epoch": 3699} {"train_loss": -25.87088394165039, "global_step": 307052, "epoch": 3699} {"train_loss": -25.727643966674805, "global_step": 307053, "epoch": 3699} {"train_loss": -25.5397891998291, "global_step": 307054, "epoch": 3699} {"train_loss": -25.571935653686523, "global_step": 307055, "epoch": 3699} {"train_loss": -25.841815948486328, "global_step": 307056, "epoch": 3699} {"train_loss": -25.992704391479492, "global_step": 307057, "epoch": 3699} {"train_loss": -26.162580490112305, "global_step": 307058, "epoch": 3699} {"train_loss": -25.880802154541016, "global_step": 307059, "epoch": 3699} {"train_loss": -25.8737850189209, "global_step": 307060, "epoch": 3699} {"train_loss": -25.829090118408203, "global_step": 307061, "epoch": 3699} {"train_loss": -25.889225006103516, "global_step": 307062, "epoch": 3699} {"train_loss": -25.872411727905273, "global_step": 307063, "epoch": 3699} {"train_loss": -25.950336456298828, "global_step": 307064, "epoch": 3699} {"train_loss": -26.084196090698242, "global_step": 307065, "epoch": 3699} {"train_loss": -25.63408851623535, "global_step": 307066, "epoch": 3699} {"train_loss": -25.977874755859375, "global_step": 307067, "epoch": 3699} {"train_loss": -26.050146102905273, "global_step": 307068, "epoch": 3699} {"train_loss": -25.7215518951416, "global_step": 307069, "epoch": 3699} {"train_loss": -26.084686279296875, "global_step": 307070, "epoch": 3699} {"train_loss": -25.48617935180664, "global_step": 307071, "epoch": 3699} {"train_loss": -26.22791862487793, "global_step": 307072, "epoch": 3699} {"train_loss": -25.55610466003418, "global_step": 307073, "epoch": 3699} {"train_loss": -25.44083595275879, "global_step": 307074, "epoch": 3699} {"train_loss": -25.385284423828125, "global_step": 307075, "epoch": 3699} {"train_loss": -25.489782333374023, "global_step": 307076, "epoch": 3699} {"train_loss": -25.497037887573242, "global_step": 307077, "epoch": 3699} {"train_loss": -25.830307006835938, "global_step": 307078, "epoch": 3699} {"train_loss": -26.023096084594727, "global_step": 307079, "epoch": 3699} {"train_loss": -25.547224044799805, "global_step": 307080, "epoch": 3699} {"train_loss": -25.77168846130371, "global_step": 307081, "epoch": 3699} {"train_loss": -25.889633178710938, "global_step": 307082, "epoch": 3699} {"train_loss": -26.103708267211914, "global_step": 307083, "epoch": 3699} {"train_loss": -25.9829158782959, "global_step": 307084, "epoch": 3699} {"train_loss": -25.712881088256836, "global_step": 307085, "epoch": 3699} {"train_loss": -25.396610260009766, "global_step": 307086, "epoch": 3699} {"train_loss": -25.536956787109375, "global_step": 307087, "epoch": 3699} {"train_loss": -25.604629516601562, "global_step": 307088, "epoch": 3699} {"train_loss": -25.85174560546875, "global_step": 307089, "epoch": 3699} {"train_loss": -25.442594528198242, "global_step": 307090, "epoch": 3699} {"train_loss": -25.59093475341797, "global_step": 307091, "epoch": 3699} {"train_loss": -25.69049644470215, "global_step": 307092, "epoch": 3699} {"train_loss": -25.722692489624023, "global_step": 307093, "epoch": 3699} {"train_loss": -25.55786895751953, "global_step": 307094, "epoch": 3699} {"train_loss": -26.016437530517578, "global_step": 307095, "epoch": 3699} {"train_loss": -25.99112892150879, "global_step": 307096, "epoch": 3699} {"train_loss": -25.83042335510254, "global_step": 307097, "epoch": 3699} {"train_loss": -25.759002685546875, "global_step": 307098, "epoch": 3699} {"train_loss": -25.65907200273261, "global_step": 307099, "epoch": 3699, "val_loss": 7225201.0} {"train_loss": -25.143909454345703, "global_step": 307100, "epoch": 3700} {"train_loss": -25.620222091674805, "global_step": 307101, "epoch": 3700} {"train_loss": -24.89181900024414, "global_step": 307102, "epoch": 3700} {"train_loss": -25.458602905273438, "global_step": 307103, "epoch": 3700} {"train_loss": -25.150894165039062, "global_step": 307104, "epoch": 3700} {"train_loss": -24.991735458374023, "global_step": 307105, "epoch": 3700} {"train_loss": -25.806066513061523, "global_step": 307106, "epoch": 3700} {"train_loss": -25.585500717163086, "global_step": 307107, "epoch": 3700} {"train_loss": -25.560232162475586, "global_step": 307108, "epoch": 3700} {"train_loss": -25.611169815063477, "global_step": 307109, "epoch": 3700} {"train_loss": -25.475927352905273, "global_step": 307110, "epoch": 3700} {"train_loss": -25.500446319580078, "global_step": 307111, "epoch": 3700} {"train_loss": -25.445159912109375, "global_step": 307112, "epoch": 3700} {"train_loss": -25.5255069732666, "global_step": 307113, "epoch": 3700} {"train_loss": -25.589637756347656, "global_step": 307114, "epoch": 3700} {"train_loss": -25.641204833984375, "global_step": 307115, "epoch": 3700} {"train_loss": -25.495162963867188, "global_step": 307116, "epoch": 3700} {"train_loss": -25.833959579467773, "global_step": 307117, "epoch": 3700} {"train_loss": -25.412567138671875, "global_step": 307118, "epoch": 3700} {"train_loss": -25.481115341186523, "global_step": 307119, "epoch": 3700} {"train_loss": -25.331552505493164, "global_step": 307120, "epoch": 3700} {"train_loss": -25.430387496948242, "global_step": 307121, "epoch": 3700} {"train_loss": -25.669681549072266, "global_step": 307122, "epoch": 3700} {"train_loss": -25.287076950073242, "global_step": 307123, "epoch": 3700} {"train_loss": -25.3907527923584, "global_step": 307124, "epoch": 3700} {"train_loss": -25.97319984436035, "global_step": 307125, "epoch": 3700} {"train_loss": -25.747949600219727, "global_step": 307126, "epoch": 3700} {"train_loss": -25.869598388671875, "global_step": 307127, "epoch": 3700} {"train_loss": -25.305770874023438, "global_step": 307128, "epoch": 3700} {"train_loss": -25.734638214111328, "global_step": 307129, "epoch": 3700} {"train_loss": -25.499595642089844, "global_step": 307130, "epoch": 3700} {"train_loss": -25.81892204284668, "global_step": 307131, "epoch": 3700} {"train_loss": -25.486968994140625, "global_step": 307132, "epoch": 3700} {"train_loss": -25.641172409057617, "global_step": 307133, "epoch": 3700} {"train_loss": -25.91847801208496, "global_step": 307134, "epoch": 3700} {"train_loss": -25.681787490844727, "global_step": 307135, "epoch": 3700} {"train_loss": -26.043811798095703, "global_step": 307136, "epoch": 3700} {"train_loss": -25.853271484375, "global_step": 307137, "epoch": 3700} {"train_loss": -25.734155654907227, "global_step": 307138, "epoch": 3700} {"train_loss": -25.785980224609375, "global_step": 307139, "epoch": 3700} {"train_loss": -26.06117057800293, "global_step": 307140, "epoch": 3700} {"train_loss": -25.74593162536621, "global_step": 307141, "epoch": 3700} {"train_loss": -25.71430015563965, "global_step": 307142, "epoch": 3700} {"train_loss": -26.011627197265625, "global_step": 307143, "epoch": 3700} {"train_loss": -25.625537872314453, "global_step": 307144, "epoch": 3700} {"train_loss": -26.05177879333496, "global_step": 307145, "epoch": 3700} {"train_loss": -25.977954864501953, "global_step": 307146, "epoch": 3700} {"train_loss": -25.7503604888916, "global_step": 307147, "epoch": 3700} {"train_loss": -25.923816680908203, "global_step": 307148, "epoch": 3700} {"train_loss": -25.637928009033203, "global_step": 307149, "epoch": 3700} {"train_loss": -25.932615280151367, "global_step": 307150, "epoch": 3700} {"train_loss": -25.706464767456055, "global_step": 307151, "epoch": 3700} {"train_loss": -25.41908073425293, "global_step": 307152, "epoch": 3700} {"train_loss": -25.134519577026367, "global_step": 307153, "epoch": 3700} {"train_loss": -25.797107696533203, "global_step": 307154, "epoch": 3700} {"train_loss": -25.240076065063477, "global_step": 307155, "epoch": 3700} {"train_loss": -25.909912109375, "global_step": 307156, "epoch": 3700} {"train_loss": -25.843708038330078, "global_step": 307157, "epoch": 3700} {"train_loss": -25.556907653808594, "global_step": 307158, "epoch": 3700} {"train_loss": -25.629480361938477, "global_step": 307159, "epoch": 3700} {"train_loss": -24.95656394958496, "global_step": 307160, "epoch": 3700} {"train_loss": -24.841489791870117, "global_step": 307161, "epoch": 3700} {"train_loss": -25.230466842651367, "global_step": 307162, "epoch": 3700} {"train_loss": -25.4898624420166, "global_step": 307163, "epoch": 3700} {"train_loss": -25.33173370361328, "global_step": 307164, "epoch": 3700} {"train_loss": -25.748706817626953, "global_step": 307165, "epoch": 3700} {"train_loss": -25.451841354370117, "global_step": 307166, "epoch": 3700} {"train_loss": -25.821441650390625, "global_step": 307167, "epoch": 3700} {"train_loss": -25.827810287475586, "global_step": 307168, "epoch": 3700} {"train_loss": -25.21285057067871, "global_step": 307169, "epoch": 3700} {"train_loss": -25.757251739501953, "global_step": 307170, "epoch": 3700} {"train_loss": -25.535720825195312, "global_step": 307171, "epoch": 3700} {"train_loss": -25.283592224121094, "global_step": 307172, "epoch": 3700} {"train_loss": -25.315900802612305, "global_step": 307173, "epoch": 3700} {"train_loss": -25.802682876586914, "global_step": 307174, "epoch": 3700} {"train_loss": -25.66329002380371, "global_step": 307175, "epoch": 3700} {"train_loss": -25.778051376342773, "global_step": 307176, "epoch": 3700} {"train_loss": -25.87299919128418, "global_step": 307177, "epoch": 3700} {"train_loss": -25.427207946777344, "global_step": 307178, "epoch": 3700} {"train_loss": -25.8089656829834, "global_step": 307179, "epoch": 3700} {"train_loss": -25.719018936157227, "global_step": 307180, "epoch": 3700} {"train_loss": -25.751468658447266, "global_step": 307181, "epoch": 3700} {"train_loss": -25.600124106349714, "global_step": 307182, "epoch": 3700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 7178392.5} {"train_loss": -25.805419921875, "global_step": 307183, "epoch": 3701} {"train_loss": -25.40799903869629, "global_step": 307184, "epoch": 3701} {"train_loss": -25.631973266601562, "global_step": 307185, "epoch": 3701} {"train_loss": -25.255170822143555, "global_step": 307186, "epoch": 3701} {"train_loss": -26.04598045349121, "global_step": 307187, "epoch": 3701} {"train_loss": -25.74199867248535, "global_step": 307188, "epoch": 3701} {"train_loss": -25.40284538269043, "global_step": 307189, "epoch": 3701} {"train_loss": -25.58319854736328, "global_step": 307190, "epoch": 3701} {"train_loss": -25.478485107421875, "global_step": 307191, "epoch": 3701} {"train_loss": -25.22467613220215, "global_step": 307192, "epoch": 3701} {"train_loss": -25.676578521728516, "global_step": 307193, "epoch": 3701} {"train_loss": -25.162626266479492, "global_step": 307194, "epoch": 3701} {"train_loss": -25.72987174987793, "global_step": 307195, "epoch": 3701} {"train_loss": -25.615371704101562, "global_step": 307196, "epoch": 3701} {"train_loss": -25.593692779541016, "global_step": 307197, "epoch": 3701} {"train_loss": -25.969165802001953, "global_step": 307198, "epoch": 3701} {"train_loss": -25.56138038635254, "global_step": 307199, "epoch": 3701} {"train_loss": -25.747360229492188, "global_step": 307200, "epoch": 3701} {"train_loss": -25.924463272094727, "global_step": 307201, "epoch": 3701} {"train_loss": -25.74213218688965, "global_step": 307202, "epoch": 3701} {"train_loss": -26.369709014892578, "global_step": 307203, "epoch": 3701} {"train_loss": -25.51749038696289, "global_step": 307204, "epoch": 3701} {"train_loss": -25.40559959411621, "global_step": 307205, "epoch": 3701} {"train_loss": -25.544401168823242, "global_step": 307206, "epoch": 3701} {"train_loss": -25.492568969726562, "global_step": 307207, "epoch": 3701} {"train_loss": -25.597532272338867, "global_step": 307208, "epoch": 3701} {"train_loss": -25.647130966186523, "global_step": 307209, "epoch": 3701} {"train_loss": -25.651391983032227, "global_step": 307210, "epoch": 3701} {"train_loss": -25.641830444335938, "global_step": 307211, "epoch": 3701} {"train_loss": -25.126787185668945, "global_step": 307212, "epoch": 3701} {"train_loss": -25.738611221313477, "global_step": 307213, "epoch": 3701} {"train_loss": -25.748014450073242, "global_step": 307214, "epoch": 3701} {"train_loss": -25.8707332611084, "global_step": 307215, "epoch": 3701} {"train_loss": -25.49783706665039, "global_step": 307216, "epoch": 3701} {"train_loss": -25.570777893066406, "global_step": 307217, "epoch": 3701} {"train_loss": -25.884801864624023, "global_step": 307218, "epoch": 3701} {"train_loss": -25.59039306640625, "global_step": 307219, "epoch": 3701} {"train_loss": -25.847187042236328, "global_step": 307220, "epoch": 3701} {"train_loss": -25.499738693237305, "global_step": 307221, "epoch": 3701} {"train_loss": -25.407106399536133, "global_step": 307222, "epoch": 3701} {"train_loss": -25.323287963867188, "global_step": 307223, "epoch": 3701} {"train_loss": -25.512346267700195, "global_step": 307224, "epoch": 3701} {"train_loss": -25.68484878540039, "global_step": 307225, "epoch": 3701} {"train_loss": -25.57110023498535, "global_step": 307226, "epoch": 3701} {"train_loss": -26.266162872314453, "global_step": 307227, "epoch": 3701} {"train_loss": -25.691181182861328, "global_step": 307228, "epoch": 3701} {"train_loss": -26.12811279296875, "global_step": 307229, "epoch": 3701} {"train_loss": -25.50995635986328, "global_step": 307230, "epoch": 3701} {"train_loss": -25.785736083984375, "global_step": 307231, "epoch": 3701} {"train_loss": -25.696197509765625, "global_step": 307232, "epoch": 3701} {"train_loss": -25.8502140045166, "global_step": 307233, "epoch": 3701} {"train_loss": -25.533605575561523, "global_step": 307234, "epoch": 3701} {"train_loss": -25.717914581298828, "global_step": 307235, "epoch": 3701} {"train_loss": -25.80426597595215, "global_step": 307236, "epoch": 3701} {"train_loss": -26.175817489624023, "global_step": 307237, "epoch": 3701} {"train_loss": -25.570056915283203, "global_step": 307238, "epoch": 3701} {"train_loss": -25.856861114501953, "global_step": 307239, "epoch": 3701} {"train_loss": -25.930761337280273, "global_step": 307240, "epoch": 3701} {"train_loss": -26.021215438842773, "global_step": 307241, "epoch": 3701} {"train_loss": -25.8038387298584, "global_step": 307242, "epoch": 3701} {"train_loss": -25.56863021850586, "global_step": 307243, "epoch": 3701} {"train_loss": -25.58222007751465, "global_step": 307244, "epoch": 3701} {"train_loss": -25.586950302124023, "global_step": 307245, "epoch": 3701} {"train_loss": -25.248510360717773, "global_step": 307246, "epoch": 3701} {"train_loss": -25.944049835205078, "global_step": 307247, "epoch": 3701} {"train_loss": -25.59259605407715, "global_step": 307248, "epoch": 3701} {"train_loss": -25.502979278564453, "global_step": 307249, "epoch": 3701} {"train_loss": -25.5556583404541, "global_step": 307250, "epoch": 3701} {"train_loss": -25.787351608276367, "global_step": 307251, "epoch": 3701} {"train_loss": -25.540334701538086, "global_step": 307252, "epoch": 3701} {"train_loss": -25.95391273498535, "global_step": 307253, "epoch": 3701} {"train_loss": -25.57622718811035, "global_step": 307254, "epoch": 3701} {"train_loss": -25.7067928314209, "global_step": 307255, "epoch": 3701} {"train_loss": -25.955657958984375, "global_step": 307256, "epoch": 3701} {"train_loss": -25.955902099609375, "global_step": 307257, "epoch": 3701} {"train_loss": -26.127012252807617, "global_step": 307258, "epoch": 3701} {"train_loss": -25.5747127532959, "global_step": 307259, "epoch": 3701} {"train_loss": -26.109399795532227, "global_step": 307260, "epoch": 3701} {"train_loss": -25.80881118774414, "global_step": 307261, "epoch": 3701} {"train_loss": -26.075239181518555, "global_step": 307262, "epoch": 3701} {"train_loss": -25.6152286529541, "global_step": 307263, "epoch": 3701} {"train_loss": -25.614065170288086, "global_step": 307264, "epoch": 3701} {"train_loss": -25.683258814984057, "global_step": 307265, "epoch": 3701, "val_loss": 7220923.0} {"train_loss": -24.373727798461914, "global_step": 307266, "epoch": 3702} {"train_loss": -23.027753829956055, "global_step": 307267, "epoch": 3702} {"train_loss": -24.875141143798828, "global_step": 307268, "epoch": 3702} {"train_loss": -24.40779685974121, "global_step": 307269, "epoch": 3702} {"train_loss": -23.996623992919922, "global_step": 307270, "epoch": 3702} {"train_loss": -24.051904678344727, "global_step": 307271, "epoch": 3702} {"train_loss": -24.358049392700195, "global_step": 307272, "epoch": 3702} {"train_loss": -24.258792877197266, "global_step": 307273, "epoch": 3702} {"train_loss": -25.193546295166016, "global_step": 307274, "epoch": 3702} {"train_loss": -24.793746948242188, "global_step": 307275, "epoch": 3702} {"train_loss": -24.88077163696289, "global_step": 307276, "epoch": 3702} {"train_loss": -24.825057983398438, "global_step": 307277, "epoch": 3702} {"train_loss": -24.982397079467773, "global_step": 307278, "epoch": 3702} {"train_loss": -25.0412654876709, "global_step": 307279, "epoch": 3702} {"train_loss": -25.377819061279297, "global_step": 307280, "epoch": 3702} {"train_loss": -24.754425048828125, "global_step": 307281, "epoch": 3702} {"train_loss": -24.971879959106445, "global_step": 307282, "epoch": 3702} {"train_loss": -25.56374168395996, "global_step": 307283, "epoch": 3702} {"train_loss": -24.8656005859375, "global_step": 307284, "epoch": 3702} {"train_loss": -25.197172164916992, "global_step": 307285, "epoch": 3702} {"train_loss": -25.3011531829834, "global_step": 307286, "epoch": 3702} {"train_loss": -25.42597007751465, "global_step": 307287, "epoch": 3702} {"train_loss": -24.977798461914062, "global_step": 307288, "epoch": 3702} {"train_loss": -24.910961151123047, "global_step": 307289, "epoch": 3702} {"train_loss": -24.97138023376465, "global_step": 307290, "epoch": 3702} {"train_loss": -25.51923942565918, "global_step": 307291, "epoch": 3702} {"train_loss": -25.5052547454834, "global_step": 307292, "epoch": 3702} {"train_loss": -25.41143226623535, "global_step": 307293, "epoch": 3702} {"train_loss": -25.604963302612305, "global_step": 307294, "epoch": 3702} {"train_loss": -25.084152221679688, "global_step": 307295, "epoch": 3702} {"train_loss": -25.581697463989258, "global_step": 307296, "epoch": 3702} {"train_loss": -25.204986572265625, "global_step": 307297, "epoch": 3702} {"train_loss": -25.229412078857422, "global_step": 307298, "epoch": 3702} {"train_loss": -25.55039405822754, "global_step": 307299, "epoch": 3702} {"train_loss": -25.77021598815918, "global_step": 307300, "epoch": 3702} {"train_loss": -25.531600952148438, "global_step": 307301, "epoch": 3702} {"train_loss": -25.285871505737305, "global_step": 307302, "epoch": 3702} {"train_loss": -25.350133895874023, "global_step": 307303, "epoch": 3702} {"train_loss": -25.605411529541016, "global_step": 307304, "epoch": 3702} {"train_loss": -25.485204696655273, "global_step": 307305, "epoch": 3702} {"train_loss": -25.838275909423828, "global_step": 307306, "epoch": 3702} {"train_loss": -26.07630729675293, "global_step": 307307, "epoch": 3702} {"train_loss": -25.731815338134766, "global_step": 307308, "epoch": 3702} {"train_loss": -25.982648849487305, "global_step": 307309, "epoch": 3702} {"train_loss": -25.856000900268555, "global_step": 307310, "epoch": 3702} {"train_loss": -25.750280380249023, "global_step": 307311, "epoch": 3702} {"train_loss": -25.587173461914062, "global_step": 307312, "epoch": 3702} {"train_loss": -25.806243896484375, "global_step": 307313, "epoch": 3702} {"train_loss": -25.593454360961914, "global_step": 307314, "epoch": 3702} {"train_loss": -25.31022071838379, "global_step": 307315, "epoch": 3702} {"train_loss": -25.791549682617188, "global_step": 307316, "epoch": 3702} {"train_loss": -25.870832443237305, "global_step": 307317, "epoch": 3702} {"train_loss": -25.89631462097168, "global_step": 307318, "epoch": 3702} {"train_loss": -26.00472068786621, "global_step": 307319, "epoch": 3702} {"train_loss": -25.754261016845703, "global_step": 307320, "epoch": 3702} {"train_loss": -25.480016708374023, "global_step": 307321, "epoch": 3702} {"train_loss": -25.6096248626709, "global_step": 307322, "epoch": 3702} {"train_loss": -25.7459774017334, "global_step": 307323, "epoch": 3702} {"train_loss": -25.5362606048584, "global_step": 307324, "epoch": 3702} {"train_loss": -25.822004318237305, "global_step": 307325, "epoch": 3702} {"train_loss": -25.778339385986328, "global_step": 307326, "epoch": 3702} {"train_loss": -25.57944107055664, "global_step": 307327, "epoch": 3702} {"train_loss": -25.705053329467773, "global_step": 307328, "epoch": 3702} {"train_loss": -26.25754165649414, "global_step": 307329, "epoch": 3702} {"train_loss": -25.633771896362305, "global_step": 307330, "epoch": 3702} {"train_loss": -25.73286247253418, "global_step": 307331, "epoch": 3702} {"train_loss": -25.887243270874023, "global_step": 307332, "epoch": 3702} {"train_loss": -25.708608627319336, "global_step": 307333, "epoch": 3702} {"train_loss": -25.663471221923828, "global_step": 307334, "epoch": 3702} {"train_loss": -25.55622673034668, "global_step": 307335, "epoch": 3702} {"train_loss": -25.801298141479492, "global_step": 307336, "epoch": 3702} {"train_loss": -25.793426513671875, "global_step": 307337, "epoch": 3702} {"train_loss": -25.829187393188477, "global_step": 307338, "epoch": 3702} {"train_loss": -26.09315299987793, "global_step": 307339, "epoch": 3702} {"train_loss": -25.759693145751953, "global_step": 307340, "epoch": 3702} {"train_loss": -26.1663761138916, "global_step": 307341, "epoch": 3702} {"train_loss": -25.851953506469727, "global_step": 307342, "epoch": 3702} {"train_loss": -25.679279327392578, "global_step": 307343, "epoch": 3702} {"train_loss": -25.83283042907715, "global_step": 307344, "epoch": 3702} {"train_loss": -26.22226905822754, "global_step": 307345, "epoch": 3702} {"train_loss": -25.38043785095215, "global_step": 307346, "epoch": 3702} {"train_loss": -25.6059627532959, "global_step": 307347, "epoch": 3702} {"train_loss": -25.4184931329934, "global_step": 307348, "epoch": 3702, "val_loss": 7316505.0} {"train_loss": -25.474611282348633, "global_step": 307349, "epoch": 3703} {"train_loss": -25.248197555541992, "global_step": 307350, "epoch": 3703} {"train_loss": -24.850496292114258, "global_step": 307351, "epoch": 3703} {"train_loss": -24.8701229095459, "global_step": 307352, "epoch": 3703} {"train_loss": -25.141061782836914, "global_step": 307353, "epoch": 3703} {"train_loss": -25.255126953125, "global_step": 307354, "epoch": 3703} {"train_loss": -25.026262283325195, "global_step": 307355, "epoch": 3703} {"train_loss": -25.518014907836914, "global_step": 307356, "epoch": 3703} {"train_loss": -25.451459884643555, "global_step": 307357, "epoch": 3703} {"train_loss": -25.86322021484375, "global_step": 307358, "epoch": 3703} {"train_loss": -25.625295639038086, "global_step": 307359, "epoch": 3703} {"train_loss": -25.307117462158203, "global_step": 307360, "epoch": 3703} {"train_loss": -25.526803970336914, "global_step": 307361, "epoch": 3703} {"train_loss": -25.10860252380371, "global_step": 307362, "epoch": 3703} {"train_loss": -24.841733932495117, "global_step": 307363, "epoch": 3703} {"train_loss": -25.579036712646484, "global_step": 307364, "epoch": 3703} {"train_loss": -25.512088775634766, "global_step": 307365, "epoch": 3703} {"train_loss": -25.536136627197266, "global_step": 307366, "epoch": 3703} {"train_loss": -25.716938018798828, "global_step": 307367, "epoch": 3703} {"train_loss": -25.37557029724121, "global_step": 307368, "epoch": 3703} {"train_loss": -25.66611099243164, "global_step": 307369, "epoch": 3703} {"train_loss": -25.46371841430664, "global_step": 307370, "epoch": 3703} {"train_loss": -26.073469161987305, "global_step": 307371, "epoch": 3703} {"train_loss": -25.189422607421875, "global_step": 307372, "epoch": 3703} {"train_loss": -25.60249137878418, "global_step": 307373, "epoch": 3703} {"train_loss": -25.434507369995117, "global_step": 307374, "epoch": 3703} {"train_loss": -25.610471725463867, "global_step": 307375, "epoch": 3703} {"train_loss": -25.274852752685547, "global_step": 307376, "epoch": 3703} {"train_loss": -25.805185317993164, "global_step": 307377, "epoch": 3703} {"train_loss": -26.225366592407227, "global_step": 307378, "epoch": 3703} {"train_loss": -25.682586669921875, "global_step": 307379, "epoch": 3703} {"train_loss": -25.70204734802246, "global_step": 307380, "epoch": 3703} {"train_loss": -26.00625991821289, "global_step": 307381, "epoch": 3703} {"train_loss": -25.885839462280273, "global_step": 307382, "epoch": 3703} {"train_loss": -25.889423370361328, "global_step": 307383, "epoch": 3703} {"train_loss": -25.56268310546875, "global_step": 307384, "epoch": 3703} {"train_loss": -25.478599548339844, "global_step": 307385, "epoch": 3703} {"train_loss": -25.642324447631836, "global_step": 307386, "epoch": 3703} {"train_loss": -25.6158390045166, "global_step": 307387, "epoch": 3703} {"train_loss": -25.56625747680664, "global_step": 307388, "epoch": 3703} {"train_loss": -25.913930892944336, "global_step": 307389, "epoch": 3703} {"train_loss": -25.672637939453125, "global_step": 307390, "epoch": 3703} {"train_loss": -25.56553840637207, "global_step": 307391, "epoch": 3703} {"train_loss": -25.93890380859375, "global_step": 307392, "epoch": 3703} {"train_loss": -25.91929054260254, "global_step": 307393, "epoch": 3703} {"train_loss": -25.93340492248535, "global_step": 307394, "epoch": 3703} {"train_loss": -25.82362174987793, "global_step": 307395, "epoch": 3703} {"train_loss": -25.428150177001953, "global_step": 307396, "epoch": 3703} {"train_loss": -25.60992431640625, "global_step": 307397, "epoch": 3703} {"train_loss": -26.050947189331055, "global_step": 307398, "epoch": 3703} {"train_loss": -25.832929611206055, "global_step": 307399, "epoch": 3703} {"train_loss": -25.734176635742188, "global_step": 307400, "epoch": 3703} {"train_loss": -25.54743766784668, "global_step": 307401, "epoch": 3703} {"train_loss": -25.942157745361328, "global_step": 307402, "epoch": 3703} {"train_loss": -25.81292724609375, "global_step": 307403, "epoch": 3703} {"train_loss": -25.513654708862305, "global_step": 307404, "epoch": 3703} {"train_loss": -25.605899810791016, "global_step": 307405, "epoch": 3703} {"train_loss": -25.994049072265625, "global_step": 307406, "epoch": 3703} {"train_loss": -26.384143829345703, "global_step": 307407, "epoch": 3703} {"train_loss": -25.884506225585938, "global_step": 307408, "epoch": 3703} {"train_loss": -25.543827056884766, "global_step": 307409, "epoch": 3703} {"train_loss": -25.59622573852539, "global_step": 307410, "epoch": 3703} {"train_loss": -25.629486083984375, "global_step": 307411, "epoch": 3703} {"train_loss": -25.78790283203125, "global_step": 307412, "epoch": 3703} {"train_loss": -26.055456161499023, "global_step": 307413, "epoch": 3703} {"train_loss": -25.989484786987305, "global_step": 307414, "epoch": 3703} {"train_loss": -25.820270538330078, "global_step": 307415, "epoch": 3703} {"train_loss": -25.847217559814453, "global_step": 307416, "epoch": 3703} {"train_loss": -26.131479263305664, "global_step": 307417, "epoch": 3703} {"train_loss": -25.809492111206055, "global_step": 307418, "epoch": 3703} {"train_loss": -25.638507843017578, "global_step": 307419, "epoch": 3703} {"train_loss": -25.736303329467773, "global_step": 307420, "epoch": 3703} {"train_loss": -26.0, "global_step": 307421, "epoch": 3703} {"train_loss": -25.784162521362305, "global_step": 307422, "epoch": 3703} {"train_loss": -26.02445411682129, "global_step": 307423, "epoch": 3703} {"train_loss": -25.93842887878418, "global_step": 307424, "epoch": 3703} {"train_loss": -25.58469581604004, "global_step": 307425, "epoch": 3703} {"train_loss": -25.920169830322266, "global_step": 307426, "epoch": 3703} {"train_loss": -25.95014762878418, "global_step": 307427, "epoch": 3703} {"train_loss": -25.748151779174805, "global_step": 307428, "epoch": 3703} {"train_loss": -25.330778121948242, "global_step": 307429, "epoch": 3703} {"train_loss": -25.940357208251953, "global_step": 307430, "epoch": 3703} {"train_loss": -25.67323484765478, "global_step": 307431, "epoch": 3703, "val_loss": 7236900.5} {"train_loss": -23.19516944885254, "global_step": 307432, "epoch": 3704} {"train_loss": -23.991971969604492, "global_step": 307433, "epoch": 3704} {"train_loss": -24.343494415283203, "global_step": 307434, "epoch": 3704} {"train_loss": -24.35108184814453, "global_step": 307435, "epoch": 3704} {"train_loss": -24.908096313476562, "global_step": 307436, "epoch": 3704} {"train_loss": -24.996854782104492, "global_step": 307437, "epoch": 3704} {"train_loss": -24.778167724609375, "global_step": 307438, "epoch": 3704} {"train_loss": -24.595134735107422, "global_step": 307439, "epoch": 3704} {"train_loss": -24.80702018737793, "global_step": 307440, "epoch": 3704} {"train_loss": -25.29818344116211, "global_step": 307441, "epoch": 3704} {"train_loss": -25.305557250976562, "global_step": 307442, "epoch": 3704} {"train_loss": -25.366287231445312, "global_step": 307443, "epoch": 3704} {"train_loss": -25.424402236938477, "global_step": 307444, "epoch": 3704} {"train_loss": -24.943052291870117, "global_step": 307445, "epoch": 3704} {"train_loss": -25.127304077148438, "global_step": 307446, "epoch": 3704} {"train_loss": -25.07100486755371, "global_step": 307447, "epoch": 3704} {"train_loss": -25.102773666381836, "global_step": 307448, "epoch": 3704} {"train_loss": -25.16489028930664, "global_step": 307449, "epoch": 3704} {"train_loss": -25.419681549072266, "global_step": 307450, "epoch": 3704} {"train_loss": -25.43693733215332, "global_step": 307451, "epoch": 3704} {"train_loss": -25.12186050415039, "global_step": 307452, "epoch": 3704} {"train_loss": -25.512067794799805, "global_step": 307453, "epoch": 3704} {"train_loss": -25.78724479675293, "global_step": 307454, "epoch": 3704} {"train_loss": -25.133621215820312, "global_step": 307455, "epoch": 3704} {"train_loss": -25.369781494140625, "global_step": 307456, "epoch": 3704} {"train_loss": -25.554651260375977, "global_step": 307457, "epoch": 3704} {"train_loss": -25.41314125061035, "global_step": 307458, "epoch": 3704} {"train_loss": -25.42441177368164, "global_step": 307459, "epoch": 3704} {"train_loss": -25.532197952270508, "global_step": 307460, "epoch": 3704} {"train_loss": -25.465776443481445, "global_step": 307461, "epoch": 3704} {"train_loss": -25.40564727783203, "global_step": 307462, "epoch": 3704} {"train_loss": -25.646774291992188, "global_step": 307463, "epoch": 3704} {"train_loss": -25.632902145385742, "global_step": 307464, "epoch": 3704} {"train_loss": -25.890851974487305, "global_step": 307465, "epoch": 3704} {"train_loss": -25.500286102294922, "global_step": 307466, "epoch": 3704} {"train_loss": -25.696069717407227, "global_step": 307467, "epoch": 3704} {"train_loss": -25.579090118408203, "global_step": 307468, "epoch": 3704} {"train_loss": -25.99273109436035, "global_step": 307469, "epoch": 3704} {"train_loss": -25.662872314453125, "global_step": 307470, "epoch": 3704} {"train_loss": -25.689077377319336, "global_step": 307471, "epoch": 3704} {"train_loss": -25.721872329711914, "global_step": 307472, "epoch": 3704} {"train_loss": -25.75302505493164, "global_step": 307473, "epoch": 3704} {"train_loss": -25.942792892456055, "global_step": 307474, "epoch": 3704} {"train_loss": -25.8348331451416, "global_step": 307475, "epoch": 3704} {"train_loss": -25.971830368041992, "global_step": 307476, "epoch": 3704} {"train_loss": -25.674238204956055, "global_step": 307477, "epoch": 3704} {"train_loss": -25.484067916870117, "global_step": 307478, "epoch": 3704} {"train_loss": -25.982519149780273, "global_step": 307479, "epoch": 3704} {"train_loss": -25.958280563354492, "global_step": 307480, "epoch": 3704} {"train_loss": -26.106094360351562, "global_step": 307481, "epoch": 3704} {"train_loss": -25.4223690032959, "global_step": 307482, "epoch": 3704} {"train_loss": -25.850133895874023, "global_step": 307483, "epoch": 3704} {"train_loss": -25.84551429748535, "global_step": 307484, "epoch": 3704} {"train_loss": -25.775888442993164, "global_step": 307485, "epoch": 3704} {"train_loss": -25.621931076049805, "global_step": 307486, "epoch": 3704} {"train_loss": -25.913867950439453, "global_step": 307487, "epoch": 3704} {"train_loss": -25.801345825195312, "global_step": 307488, "epoch": 3704} {"train_loss": -26.29799461364746, "global_step": 307489, "epoch": 3704} {"train_loss": -26.016773223876953, "global_step": 307490, "epoch": 3704} {"train_loss": -26.021026611328125, "global_step": 307491, "epoch": 3704} {"train_loss": -26.11405372619629, "global_step": 307492, "epoch": 3704} {"train_loss": -25.663049697875977, "global_step": 307493, "epoch": 3704} {"train_loss": -25.85384178161621, "global_step": 307494, "epoch": 3704} {"train_loss": -25.63984489440918, "global_step": 307495, "epoch": 3704} {"train_loss": -25.543081283569336, "global_step": 307496, "epoch": 3704} {"train_loss": -25.612380981445312, "global_step": 307497, "epoch": 3704} {"train_loss": -25.82855224609375, "global_step": 307498, "epoch": 3704} {"train_loss": -26.113927841186523, "global_step": 307499, "epoch": 3704} {"train_loss": -25.314573287963867, "global_step": 307500, "epoch": 3704} {"train_loss": -25.886474609375, "global_step": 307501, "epoch": 3704} {"train_loss": -25.57442283630371, "global_step": 307502, "epoch": 3704} {"train_loss": -25.75152587890625, "global_step": 307503, "epoch": 3704} {"train_loss": -25.890899658203125, "global_step": 307504, "epoch": 3704} {"train_loss": -25.795740127563477, "global_step": 307505, "epoch": 3704} {"train_loss": -25.571945190429688, "global_step": 307506, "epoch": 3704} {"train_loss": -26.118881225585938, "global_step": 307507, "epoch": 3704} {"train_loss": -26.067228317260742, "global_step": 307508, "epoch": 3704} {"train_loss": -25.342132568359375, "global_step": 307509, "epoch": 3704} {"train_loss": -25.361921310424805, "global_step": 307510, "epoch": 3704} {"train_loss": -25.785202026367188, "global_step": 307511, "epoch": 3704} {"train_loss": -25.57013702392578, "global_step": 307512, "epoch": 3704} {"train_loss": -25.197877883911133, "global_step": 307513, "epoch": 3704} {"train_loss": -25.51384519094444, "global_step": 307514, "epoch": 3704, "val_loss": 7222495.0} {"train_loss": -25.37030601501465, "global_step": 307515, "epoch": 3705} {"train_loss": -25.015005111694336, "global_step": 307516, "epoch": 3705} {"train_loss": -25.463651657104492, "global_step": 307517, "epoch": 3705} {"train_loss": -25.03639793395996, "global_step": 307518, "epoch": 3705} {"train_loss": -25.540973663330078, "global_step": 307519, "epoch": 3705} {"train_loss": -24.825056076049805, "global_step": 307520, "epoch": 3705} {"train_loss": -25.608966827392578, "global_step": 307521, "epoch": 3705} {"train_loss": -25.23486328125, "global_step": 307522, "epoch": 3705} {"train_loss": -25.423810958862305, "global_step": 307523, "epoch": 3705} {"train_loss": -25.57309913635254, "global_step": 307524, "epoch": 3705} {"train_loss": -25.59405517578125, "global_step": 307525, "epoch": 3705} {"train_loss": -25.433223724365234, "global_step": 307526, "epoch": 3705} {"train_loss": -25.883813858032227, "global_step": 307527, "epoch": 3705} {"train_loss": -25.213056564331055, "global_step": 307528, "epoch": 3705} {"train_loss": -25.66547966003418, "global_step": 307529, "epoch": 3705} {"train_loss": -25.428190231323242, "global_step": 307530, "epoch": 3705} {"train_loss": -25.667285919189453, "global_step": 307531, "epoch": 3705} {"train_loss": -25.431930541992188, "global_step": 307532, "epoch": 3705} {"train_loss": -25.953704833984375, "global_step": 307533, "epoch": 3705} {"train_loss": -25.94841957092285, "global_step": 307534, "epoch": 3705} {"train_loss": -25.714628219604492, "global_step": 307535, "epoch": 3705} {"train_loss": -25.676544189453125, "global_step": 307536, "epoch": 3705} {"train_loss": -25.627134323120117, "global_step": 307537, "epoch": 3705} {"train_loss": -25.675601959228516, "global_step": 307538, "epoch": 3705} {"train_loss": -25.710617065429688, "global_step": 307539, "epoch": 3705} {"train_loss": -25.661184310913086, "global_step": 307540, "epoch": 3705} {"train_loss": -25.846765518188477, "global_step": 307541, "epoch": 3705} {"train_loss": -25.54843521118164, "global_step": 307542, "epoch": 3705} {"train_loss": -25.607818603515625, "global_step": 307543, "epoch": 3705} {"train_loss": -25.519378662109375, "global_step": 307544, "epoch": 3705} {"train_loss": -25.64597511291504, "global_step": 307545, "epoch": 3705} {"train_loss": -25.904138565063477, "global_step": 307546, "epoch": 3705} {"train_loss": -25.984500885009766, "global_step": 307547, "epoch": 3705} {"train_loss": -26.13593101501465, "global_step": 307548, "epoch": 3705} {"train_loss": -25.6884765625, "global_step": 307549, "epoch": 3705} {"train_loss": -25.41944694519043, "global_step": 307550, "epoch": 3705} {"train_loss": -25.72979736328125, "global_step": 307551, "epoch": 3705} {"train_loss": -25.160429000854492, "global_step": 307552, "epoch": 3705} {"train_loss": -25.50113296508789, "global_step": 307553, "epoch": 3705} {"train_loss": -25.722517013549805, "global_step": 307554, "epoch": 3705} {"train_loss": -25.770231246948242, "global_step": 307555, "epoch": 3705} {"train_loss": -25.570322036743164, "global_step": 307556, "epoch": 3705} {"train_loss": -25.448453903198242, "global_step": 307557, "epoch": 3705} {"train_loss": -25.748245239257812, "global_step": 307558, "epoch": 3705} {"train_loss": -25.55401039123535, "global_step": 307559, "epoch": 3705} {"train_loss": -25.689228057861328, "global_step": 307560, "epoch": 3705} {"train_loss": -25.69817543029785, "global_step": 307561, "epoch": 3705} {"train_loss": -25.611597061157227, "global_step": 307562, "epoch": 3705} {"train_loss": -25.433801651000977, "global_step": 307563, "epoch": 3705} {"train_loss": -25.758956909179688, "global_step": 307564, "epoch": 3705} {"train_loss": -25.525392532348633, "global_step": 307565, "epoch": 3705} {"train_loss": -26.0521183013916, "global_step": 307566, "epoch": 3705} {"train_loss": -25.839874267578125, "global_step": 307567, "epoch": 3705} {"train_loss": -25.9930419921875, "global_step": 307568, "epoch": 3705} {"train_loss": -25.546131134033203, "global_step": 307569, "epoch": 3705} {"train_loss": -25.639490127563477, "global_step": 307570, "epoch": 3705} {"train_loss": -25.53951072692871, "global_step": 307571, "epoch": 3705} {"train_loss": -25.466161727905273, "global_step": 307572, "epoch": 3705} {"train_loss": -25.99098014831543, "global_step": 307573, "epoch": 3705} {"train_loss": -25.789581298828125, "global_step": 307574, "epoch": 3705} {"train_loss": -25.744298934936523, "global_step": 307575, "epoch": 3705} {"train_loss": -25.78790855407715, "global_step": 307576, "epoch": 3705} {"train_loss": -25.975391387939453, "global_step": 307577, "epoch": 3705} {"train_loss": -25.902769088745117, "global_step": 307578, "epoch": 3705} {"train_loss": -25.558454513549805, "global_step": 307579, "epoch": 3705} {"train_loss": -26.244556427001953, "global_step": 307580, "epoch": 3705} {"train_loss": -25.739103317260742, "global_step": 307581, "epoch": 3705} {"train_loss": -25.994775772094727, "global_step": 307582, "epoch": 3705} {"train_loss": -25.753250122070312, "global_step": 307583, "epoch": 3705} {"train_loss": -25.64015007019043, "global_step": 307584, "epoch": 3705} {"train_loss": -26.18745231628418, "global_step": 307585, "epoch": 3705} {"train_loss": -25.58101463317871, "global_step": 307586, "epoch": 3705} {"train_loss": -25.78167152404785, "global_step": 307587, "epoch": 3705} {"train_loss": -25.701074600219727, "global_step": 307588, "epoch": 3705} {"train_loss": -25.67401695251465, "global_step": 307589, "epoch": 3705} {"train_loss": -25.669591903686523, "global_step": 307590, "epoch": 3705} {"train_loss": -25.630340576171875, "global_step": 307591, "epoch": 3705} {"train_loss": -25.990278244018555, "global_step": 307592, "epoch": 3705} {"train_loss": -25.761777877807617, "global_step": 307593, "epoch": 3705} {"train_loss": -25.997522354125977, "global_step": 307594, "epoch": 3705} {"train_loss": -25.587814331054688, "global_step": 307595, "epoch": 3705} {"train_loss": -25.582185745239258, "global_step": 307596, "epoch": 3705} {"train_loss": -25.66212245067918, "global_step": 307597, "epoch": 3705, "val_loss": 7278070.0} {"train_loss": -23.48813247680664, "global_step": 307598, "epoch": 3706} {"train_loss": -23.01841926574707, "global_step": 307599, "epoch": 3706} {"train_loss": -24.414695739746094, "global_step": 307600, "epoch": 3706} {"train_loss": -24.311731338500977, "global_step": 307601, "epoch": 3706} {"train_loss": -23.802297592163086, "global_step": 307602, "epoch": 3706} {"train_loss": -25.0526180267334, "global_step": 307603, "epoch": 3706} {"train_loss": -24.652700424194336, "global_step": 307604, "epoch": 3706} {"train_loss": -25.2117862701416, "global_step": 307605, "epoch": 3706} {"train_loss": -24.74580192565918, "global_step": 307606, "epoch": 3706} {"train_loss": -24.78218650817871, "global_step": 307607, "epoch": 3706} {"train_loss": -24.81498908996582, "global_step": 307608, "epoch": 3706} {"train_loss": -24.768112182617188, "global_step": 307609, "epoch": 3706} {"train_loss": -24.93606948852539, "global_step": 307610, "epoch": 3706} {"train_loss": -24.8580265045166, "global_step": 307611, "epoch": 3706} {"train_loss": -24.671188354492188, "global_step": 307612, "epoch": 3706} {"train_loss": -25.035419464111328, "global_step": 307613, "epoch": 3706} {"train_loss": -25.241687774658203, "global_step": 307614, "epoch": 3706} {"train_loss": -24.71658706665039, "global_step": 307615, "epoch": 3706} {"train_loss": -25.28411102294922, "global_step": 307616, "epoch": 3706} {"train_loss": -25.14018440246582, "global_step": 307617, "epoch": 3706} {"train_loss": -24.601581573486328, "global_step": 307618, "epoch": 3706} {"train_loss": -24.902482986450195, "global_step": 307619, "epoch": 3706} {"train_loss": -25.219297409057617, "global_step": 307620, "epoch": 3706} {"train_loss": -25.350751876831055, "global_step": 307621, "epoch": 3706} {"train_loss": -25.5297794342041, "global_step": 307622, "epoch": 3706} {"train_loss": -24.934375762939453, "global_step": 307623, "epoch": 3706} {"train_loss": -25.354225158691406, "global_step": 307624, "epoch": 3706} {"train_loss": -25.28086280822754, "global_step": 307625, "epoch": 3706} {"train_loss": -25.27375030517578, "global_step": 307626, "epoch": 3706} {"train_loss": -25.1554012298584, "global_step": 307627, "epoch": 3706} {"train_loss": -25.585065841674805, "global_step": 307628, "epoch": 3706} {"train_loss": -25.586523056030273, "global_step": 307629, "epoch": 3706} {"train_loss": -25.496610641479492, "global_step": 307630, "epoch": 3706} {"train_loss": -25.66709327697754, "global_step": 307631, "epoch": 3706} {"train_loss": -26.057025909423828, "global_step": 307632, "epoch": 3706} {"train_loss": -25.587873458862305, "global_step": 307633, "epoch": 3706} {"train_loss": -25.51605224609375, "global_step": 307634, "epoch": 3706} {"train_loss": -25.561735153198242, "global_step": 307635, "epoch": 3706} {"train_loss": -25.704565048217773, "global_step": 307636, "epoch": 3706} {"train_loss": -25.8369140625, "global_step": 307637, "epoch": 3706} {"train_loss": -25.56707763671875, "global_step": 307638, "epoch": 3706} {"train_loss": -25.79779052734375, "global_step": 307639, "epoch": 3706} {"train_loss": -25.936628341674805, "global_step": 307640, "epoch": 3706} {"train_loss": -25.94402503967285, "global_step": 307641, "epoch": 3706} {"train_loss": -25.59852409362793, "global_step": 307642, "epoch": 3706} {"train_loss": -25.803546905517578, "global_step": 307643, "epoch": 3706} {"train_loss": -25.56251335144043, "global_step": 307644, "epoch": 3706} {"train_loss": -25.45263671875, "global_step": 307645, "epoch": 3706} {"train_loss": -26.032251358032227, "global_step": 307646, "epoch": 3706} {"train_loss": -25.770490646362305, "global_step": 307647, "epoch": 3706} {"train_loss": -26.045934677124023, "global_step": 307648, "epoch": 3706} {"train_loss": -26.0002498626709, "global_step": 307649, "epoch": 3706} {"train_loss": -25.9329776763916, "global_step": 307650, "epoch": 3706} {"train_loss": -25.727985382080078, "global_step": 307651, "epoch": 3706} {"train_loss": -25.762897491455078, "global_step": 307652, "epoch": 3706} {"train_loss": -25.869522094726562, "global_step": 307653, "epoch": 3706} {"train_loss": -26.097583770751953, "global_step": 307654, "epoch": 3706} {"train_loss": -25.68533706665039, "global_step": 307655, "epoch": 3706} {"train_loss": -25.481109619140625, "global_step": 307656, "epoch": 3706} {"train_loss": -25.838300704956055, "global_step": 307657, "epoch": 3706} {"train_loss": -25.970386505126953, "global_step": 307658, "epoch": 3706} {"train_loss": -26.16285514831543, "global_step": 307659, "epoch": 3706} {"train_loss": -25.874853134155273, "global_step": 307660, "epoch": 3706} {"train_loss": -25.87519645690918, "global_step": 307661, "epoch": 3706} {"train_loss": -25.668262481689453, "global_step": 307662, "epoch": 3706} {"train_loss": -25.5692138671875, "global_step": 307663, "epoch": 3706} {"train_loss": -25.899808883666992, "global_step": 307664, "epoch": 3706} {"train_loss": -25.832828521728516, "global_step": 307665, "epoch": 3706} {"train_loss": -25.90867042541504, "global_step": 307666, "epoch": 3706} {"train_loss": -25.866748809814453, "global_step": 307667, "epoch": 3706} {"train_loss": -25.963165283203125, "global_step": 307668, "epoch": 3706} {"train_loss": -26.015151977539062, "global_step": 307669, "epoch": 3706} {"train_loss": -25.940332412719727, "global_step": 307670, "epoch": 3706} {"train_loss": -25.441246032714844, "global_step": 307671, "epoch": 3706} {"train_loss": -24.290475845336914, "global_step": 307672, "epoch": 3706} {"train_loss": -23.820661544799805, "global_step": 307673, "epoch": 3706} {"train_loss": -23.46538734436035, "global_step": 307674, "epoch": 3706} {"train_loss": -25.390657424926758, "global_step": 307675, "epoch": 3706} {"train_loss": -24.806800842285156, "global_step": 307676, "epoch": 3706} {"train_loss": -24.05491065979004, "global_step": 307677, "epoch": 3706} {"train_loss": -25.471527099609375, "global_step": 307678, "epoch": 3706} {"train_loss": -24.97850799560547, "global_step": 307679, "epoch": 3706} {"train_loss": -25.301700431180286, "global_step": 307680, "epoch": 3706, "val_loss": 7269362.5} {"train_loss": -24.36318016052246, "global_step": 307681, "epoch": 3707} {"train_loss": -24.810245513916016, "global_step": 307682, "epoch": 3707} {"train_loss": -25.00476837158203, "global_step": 307683, "epoch": 3707} {"train_loss": -24.822551727294922, "global_step": 307684, "epoch": 3707} {"train_loss": -25.22452163696289, "global_step": 307685, "epoch": 3707} {"train_loss": -24.853681564331055, "global_step": 307686, "epoch": 3707} {"train_loss": -24.946277618408203, "global_step": 307687, "epoch": 3707} {"train_loss": -25.29781150817871, "global_step": 307688, "epoch": 3707} {"train_loss": -25.023466110229492, "global_step": 307689, "epoch": 3707} {"train_loss": -25.00831413269043, "global_step": 307690, "epoch": 3707} {"train_loss": -25.18076515197754, "global_step": 307691, "epoch": 3707} {"train_loss": -25.135282516479492, "global_step": 307692, "epoch": 3707} {"train_loss": -25.199867248535156, "global_step": 307693, "epoch": 3707} {"train_loss": -25.044326782226562, "global_step": 307694, "epoch": 3707} {"train_loss": -25.051469802856445, "global_step": 307695, "epoch": 3707} {"train_loss": -25.39401626586914, "global_step": 307696, "epoch": 3707} {"train_loss": -24.835161209106445, "global_step": 307697, "epoch": 3707} {"train_loss": -25.448034286499023, "global_step": 307698, "epoch": 3707} {"train_loss": -25.252683639526367, "global_step": 307699, "epoch": 3707} {"train_loss": -25.49762535095215, "global_step": 307700, "epoch": 3707} {"train_loss": -25.572481155395508, "global_step": 307701, "epoch": 3707} {"train_loss": -25.51275062561035, "global_step": 307702, "epoch": 3707} {"train_loss": -25.348556518554688, "global_step": 307703, "epoch": 3707} {"train_loss": -25.499868392944336, "global_step": 307704, "epoch": 3707} {"train_loss": -25.24776268005371, "global_step": 307705, "epoch": 3707} {"train_loss": -25.869848251342773, "global_step": 307706, "epoch": 3707} {"train_loss": -25.487478256225586, "global_step": 307707, "epoch": 3707} {"train_loss": -25.355527877807617, "global_step": 307708, "epoch": 3707} {"train_loss": -25.53438377380371, "global_step": 307709, "epoch": 3707} {"train_loss": -25.368253707885742, "global_step": 307710, "epoch": 3707} {"train_loss": -25.871301651000977, "global_step": 307711, "epoch": 3707} {"train_loss": -25.810352325439453, "global_step": 307712, "epoch": 3707} {"train_loss": -25.813018798828125, "global_step": 307713, "epoch": 3707} {"train_loss": -25.580778121948242, "global_step": 307714, "epoch": 3707} {"train_loss": -25.92816734313965, "global_step": 307715, "epoch": 3707} {"train_loss": -25.778242111206055, "global_step": 307716, "epoch": 3707} {"train_loss": -25.53163719177246, "global_step": 307717, "epoch": 3707} {"train_loss": -26.014968872070312, "global_step": 307718, "epoch": 3707} {"train_loss": -25.540563583374023, "global_step": 307719, "epoch": 3707} {"train_loss": -25.8095645904541, "global_step": 307720, "epoch": 3707} {"train_loss": -25.58449363708496, "global_step": 307721, "epoch": 3707} {"train_loss": -25.864294052124023, "global_step": 307722, "epoch": 3707} {"train_loss": -25.902353286743164, "global_step": 307723, "epoch": 3707} {"train_loss": -25.978321075439453, "global_step": 307724, "epoch": 3707} {"train_loss": -26.233564376831055, "global_step": 307725, "epoch": 3707} {"train_loss": -26.037763595581055, "global_step": 307726, "epoch": 3707} {"train_loss": -26.033599853515625, "global_step": 307727, "epoch": 3707} {"train_loss": -25.995779037475586, "global_step": 307728, "epoch": 3707} {"train_loss": -25.606836318969727, "global_step": 307729, "epoch": 3707} {"train_loss": -25.792295455932617, "global_step": 307730, "epoch": 3707} {"train_loss": -25.999704360961914, "global_step": 307731, "epoch": 3707} {"train_loss": -26.117650985717773, "global_step": 307732, "epoch": 3707} {"train_loss": -26.100988388061523, "global_step": 307733, "epoch": 3707} {"train_loss": -25.780683517456055, "global_step": 307734, "epoch": 3707} {"train_loss": -25.73902702331543, "global_step": 307735, "epoch": 3707} {"train_loss": -25.4986515045166, "global_step": 307736, "epoch": 3707} {"train_loss": -25.801502227783203, "global_step": 307737, "epoch": 3707} {"train_loss": -26.196395874023438, "global_step": 307738, "epoch": 3707} {"train_loss": -25.677703857421875, "global_step": 307739, "epoch": 3707} {"train_loss": -25.715930938720703, "global_step": 307740, "epoch": 3707} {"train_loss": -25.348031997680664, "global_step": 307741, "epoch": 3707} {"train_loss": -25.45076560974121, "global_step": 307742, "epoch": 3707} {"train_loss": -25.486759185791016, "global_step": 307743, "epoch": 3707} {"train_loss": -26.3176212310791, "global_step": 307744, "epoch": 3707} {"train_loss": -25.236433029174805, "global_step": 307745, "epoch": 3707} {"train_loss": -25.773340225219727, "global_step": 307746, "epoch": 3707} {"train_loss": -25.808141708374023, "global_step": 307747, "epoch": 3707} {"train_loss": -25.899778366088867, "global_step": 307748, "epoch": 3707} {"train_loss": -25.759679794311523, "global_step": 307749, "epoch": 3707} {"train_loss": -25.648975372314453, "global_step": 307750, "epoch": 3707} {"train_loss": -25.548660278320312, "global_step": 307751, "epoch": 3707} {"train_loss": -25.366479873657227, "global_step": 307752, "epoch": 3707} {"train_loss": -25.973255157470703, "global_step": 307753, "epoch": 3707} {"train_loss": -25.686079025268555, "global_step": 307754, "epoch": 3707} {"train_loss": -25.642004013061523, "global_step": 307755, "epoch": 3707} {"train_loss": -25.502765655517578, "global_step": 307756, "epoch": 3707} {"train_loss": -25.617673873901367, "global_step": 307757, "epoch": 3707} {"train_loss": -25.8159236907959, "global_step": 307758, "epoch": 3707} {"train_loss": -25.770227432250977, "global_step": 307759, "epoch": 3707} {"train_loss": -25.523595809936523, "global_step": 307760, "epoch": 3707} {"train_loss": -25.848920822143555, "global_step": 307761, "epoch": 3707} {"train_loss": -25.7459774017334, "global_step": 307762, "epoch": 3707} {"train_loss": -25.570221337927393, "global_step": 307763, "epoch": 3707, "val_loss": 7329815.0} {"train_loss": -25.27206802368164, "global_step": 307764, "epoch": 3708} {"train_loss": -25.49953269958496, "global_step": 307765, "epoch": 3708} {"train_loss": -25.673538208007812, "global_step": 307766, "epoch": 3708} {"train_loss": -25.111034393310547, "global_step": 307767, "epoch": 3708} {"train_loss": -25.10255241394043, "global_step": 307768, "epoch": 3708} {"train_loss": -25.574012756347656, "global_step": 307769, "epoch": 3708} {"train_loss": -25.039846420288086, "global_step": 307770, "epoch": 3708} {"train_loss": -25.707509994506836, "global_step": 307771, "epoch": 3708} {"train_loss": -25.758787155151367, "global_step": 307772, "epoch": 3708} {"train_loss": -25.455198287963867, "global_step": 307773, "epoch": 3708} {"train_loss": -25.29695701599121, "global_step": 307774, "epoch": 3708} {"train_loss": -26.02044105529785, "global_step": 307775, "epoch": 3708} {"train_loss": -25.33707618713379, "global_step": 307776, "epoch": 3708} {"train_loss": -25.7119140625, "global_step": 307777, "epoch": 3708} {"train_loss": -25.6300106048584, "global_step": 307778, "epoch": 3708} {"train_loss": -25.49811363220215, "global_step": 307779, "epoch": 3708} {"train_loss": -25.850494384765625, "global_step": 307780, "epoch": 3708} {"train_loss": -25.445119857788086, "global_step": 307781, "epoch": 3708} {"train_loss": -25.601226806640625, "global_step": 307782, "epoch": 3708} {"train_loss": -25.502485275268555, "global_step": 307783, "epoch": 3708} {"train_loss": -25.748517990112305, "global_step": 307784, "epoch": 3708} {"train_loss": -25.885114669799805, "global_step": 307785, "epoch": 3708} {"train_loss": -25.67852783203125, "global_step": 307786, "epoch": 3708} {"train_loss": -25.46551513671875, "global_step": 307787, "epoch": 3708} {"train_loss": -25.77943229675293, "global_step": 307788, "epoch": 3708} {"train_loss": -25.58490562438965, "global_step": 307789, "epoch": 3708} {"train_loss": -26.119672775268555, "global_step": 307790, "epoch": 3708} {"train_loss": -25.627782821655273, "global_step": 307791, "epoch": 3708} {"train_loss": -25.492961883544922, "global_step": 307792, "epoch": 3708} {"train_loss": -26.389667510986328, "global_step": 307793, "epoch": 3708} {"train_loss": -26.0283260345459, "global_step": 307794, "epoch": 3708} {"train_loss": -25.825891494750977, "global_step": 307795, "epoch": 3708} {"train_loss": -25.989850997924805, "global_step": 307796, "epoch": 3708} {"train_loss": -25.81035804748535, "global_step": 307797, "epoch": 3708} {"train_loss": -26.05280113220215, "global_step": 307798, "epoch": 3708} {"train_loss": -25.981164932250977, "global_step": 307799, "epoch": 3708} {"train_loss": -25.60528564453125, "global_step": 307800, "epoch": 3708} {"train_loss": -26.222579956054688, "global_step": 307801, "epoch": 3708} {"train_loss": -26.24143409729004, "global_step": 307802, "epoch": 3708} {"train_loss": -25.740026473999023, "global_step": 307803, "epoch": 3708} {"train_loss": -25.89027976989746, "global_step": 307804, "epoch": 3708} {"train_loss": -25.677709579467773, "global_step": 307805, "epoch": 3708} {"train_loss": -25.748884201049805, "global_step": 307806, "epoch": 3708} {"train_loss": -25.732629776000977, "global_step": 307807, "epoch": 3708} {"train_loss": -25.913427352905273, "global_step": 307808, "epoch": 3708} {"train_loss": -26.0485897064209, "global_step": 307809, "epoch": 3708} {"train_loss": -25.676483154296875, "global_step": 307810, "epoch": 3708} {"train_loss": -25.711429595947266, "global_step": 307811, "epoch": 3708} {"train_loss": -25.40656089782715, "global_step": 307812, "epoch": 3708} {"train_loss": -25.6893253326416, "global_step": 307813, "epoch": 3708} {"train_loss": -25.780359268188477, "global_step": 307814, "epoch": 3708} {"train_loss": -25.264423370361328, "global_step": 307815, "epoch": 3708} {"train_loss": -25.27471160888672, "global_step": 307816, "epoch": 3708} {"train_loss": -25.808124542236328, "global_step": 307817, "epoch": 3708} {"train_loss": -25.897674560546875, "global_step": 307818, "epoch": 3708} {"train_loss": -25.71009635925293, "global_step": 307819, "epoch": 3708} {"train_loss": -26.0889949798584, "global_step": 307820, "epoch": 3708} {"train_loss": -25.643911361694336, "global_step": 307821, "epoch": 3708} {"train_loss": -25.930774688720703, "global_step": 307822, "epoch": 3708} {"train_loss": -25.46223258972168, "global_step": 307823, "epoch": 3708} {"train_loss": -25.92138671875, "global_step": 307824, "epoch": 3708} {"train_loss": -25.665979385375977, "global_step": 307825, "epoch": 3708} {"train_loss": -25.965774536132812, "global_step": 307826, "epoch": 3708} {"train_loss": -25.69561767578125, "global_step": 307827, "epoch": 3708} {"train_loss": -25.890485763549805, "global_step": 307828, "epoch": 3708} {"train_loss": -25.6863956451416, "global_step": 307829, "epoch": 3708} {"train_loss": -25.978652954101562, "global_step": 307830, "epoch": 3708} {"train_loss": -25.933990478515625, "global_step": 307831, "epoch": 3708} {"train_loss": -25.778982162475586, "global_step": 307832, "epoch": 3708} {"train_loss": -26.109542846679688, "global_step": 307833, "epoch": 3708} {"train_loss": -25.624099731445312, "global_step": 307834, "epoch": 3708} {"train_loss": -26.22852897644043, "global_step": 307835, "epoch": 3708} {"train_loss": -25.8969669342041, "global_step": 307836, "epoch": 3708} {"train_loss": -25.567480087280273, "global_step": 307837, "epoch": 3708} {"train_loss": -25.7544002532959, "global_step": 307838, "epoch": 3708} {"train_loss": -26.165021896362305, "global_step": 307839, "epoch": 3708} {"train_loss": -25.643590927124023, "global_step": 307840, "epoch": 3708} {"train_loss": -25.9981689453125, "global_step": 307841, "epoch": 3708} {"train_loss": -25.81150245666504, "global_step": 307842, "epoch": 3708} {"train_loss": -25.955646514892578, "global_step": 307843, "epoch": 3708} {"train_loss": -25.720518112182617, "global_step": 307844, "epoch": 3708} {"train_loss": -25.73386573791504, "global_step": 307845, "epoch": 3708} {"train_loss": -25.74647473714438, "global_step": 307846, "epoch": 3708, "val_loss": 7165179.0} {"train_loss": -25.20929718017578, "global_step": 307847, "epoch": 3709} {"train_loss": -24.889570236206055, "global_step": 307848, "epoch": 3709} {"train_loss": -24.591262817382812, "global_step": 307849, "epoch": 3709} {"train_loss": -24.49943733215332, "global_step": 307850, "epoch": 3709} {"train_loss": -25.08812141418457, "global_step": 307851, "epoch": 3709} {"train_loss": -25.505102157592773, "global_step": 307852, "epoch": 3709} {"train_loss": -25.268972396850586, "global_step": 307853, "epoch": 3709} {"train_loss": -25.141036987304688, "global_step": 307854, "epoch": 3709} {"train_loss": -25.205768585205078, "global_step": 307855, "epoch": 3709} {"train_loss": -25.328269958496094, "global_step": 307856, "epoch": 3709} {"train_loss": -25.361846923828125, "global_step": 307857, "epoch": 3709} {"train_loss": -25.636335372924805, "global_step": 307858, "epoch": 3709} {"train_loss": -25.40683364868164, "global_step": 307859, "epoch": 3709} {"train_loss": -25.296295166015625, "global_step": 307860, "epoch": 3709} {"train_loss": -25.9366397857666, "global_step": 307861, "epoch": 3709} {"train_loss": -25.574377059936523, "global_step": 307862, "epoch": 3709} {"train_loss": -25.494369506835938, "global_step": 307863, "epoch": 3709} {"train_loss": -25.91767692565918, "global_step": 307864, "epoch": 3709} {"train_loss": -25.669544219970703, "global_step": 307865, "epoch": 3709} {"train_loss": -25.880170822143555, "global_step": 307866, "epoch": 3709} {"train_loss": -25.43440818786621, "global_step": 307867, "epoch": 3709} {"train_loss": -25.389789581298828, "global_step": 307868, "epoch": 3709} {"train_loss": -25.568296432495117, "global_step": 307869, "epoch": 3709} {"train_loss": -25.63602638244629, "global_step": 307870, "epoch": 3709} {"train_loss": -25.701221466064453, "global_step": 307871, "epoch": 3709} {"train_loss": -25.93902015686035, "global_step": 307872, "epoch": 3709} {"train_loss": -26.07258415222168, "global_step": 307873, "epoch": 3709} {"train_loss": -25.969818115234375, "global_step": 307874, "epoch": 3709} {"train_loss": -25.890111923217773, "global_step": 307875, "epoch": 3709} {"train_loss": -25.650060653686523, "global_step": 307876, "epoch": 3709} {"train_loss": -25.58017349243164, "global_step": 307877, "epoch": 3709} {"train_loss": -25.826282501220703, "global_step": 307878, "epoch": 3709} {"train_loss": -25.9686336517334, "global_step": 307879, "epoch": 3709} {"train_loss": -26.131662368774414, "global_step": 307880, "epoch": 3709} {"train_loss": -25.84906005859375, "global_step": 307881, "epoch": 3709} {"train_loss": -25.88055992126465, "global_step": 307882, "epoch": 3709} {"train_loss": -25.82343864440918, "global_step": 307883, "epoch": 3709} {"train_loss": -25.608854293823242, "global_step": 307884, "epoch": 3709} {"train_loss": -25.718442916870117, "global_step": 307885, "epoch": 3709} {"train_loss": -26.131864547729492, "global_step": 307886, "epoch": 3709} {"train_loss": -25.846393585205078, "global_step": 307887, "epoch": 3709} {"train_loss": -25.88602638244629, "global_step": 307888, "epoch": 3709} {"train_loss": -25.967792510986328, "global_step": 307889, "epoch": 3709} {"train_loss": -25.9456729888916, "global_step": 307890, "epoch": 3709} {"train_loss": -25.8397216796875, "global_step": 307891, "epoch": 3709} {"train_loss": -25.882535934448242, "global_step": 307892, "epoch": 3709} {"train_loss": -25.70553970336914, "global_step": 307893, "epoch": 3709} {"train_loss": -25.7109317779541, "global_step": 307894, "epoch": 3709} {"train_loss": -25.878067016601562, "global_step": 307895, "epoch": 3709} {"train_loss": -25.688928604125977, "global_step": 307896, "epoch": 3709} {"train_loss": -25.52313232421875, "global_step": 307897, "epoch": 3709} {"train_loss": -25.6401309967041, "global_step": 307898, "epoch": 3709} {"train_loss": -25.117145538330078, "global_step": 307899, "epoch": 3709} {"train_loss": -24.996639251708984, "global_step": 307900, "epoch": 3709} {"train_loss": -25.34748649597168, "global_step": 307901, "epoch": 3709} {"train_loss": -25.329957962036133, "global_step": 307902, "epoch": 3709} {"train_loss": -25.847257614135742, "global_step": 307903, "epoch": 3709} {"train_loss": -25.473073959350586, "global_step": 307904, "epoch": 3709} {"train_loss": -25.813562393188477, "global_step": 307905, "epoch": 3709} {"train_loss": -25.376426696777344, "global_step": 307906, "epoch": 3709} {"train_loss": -25.845935821533203, "global_step": 307907, "epoch": 3709} {"train_loss": -25.44879722595215, "global_step": 307908, "epoch": 3709} {"train_loss": -25.383024215698242, "global_step": 307909, "epoch": 3709} {"train_loss": -25.64875602722168, "global_step": 307910, "epoch": 3709} {"train_loss": -25.877466201782227, "global_step": 307911, "epoch": 3709} {"train_loss": -25.7338809967041, "global_step": 307912, "epoch": 3709} {"train_loss": -25.249128341674805, "global_step": 307913, "epoch": 3709} {"train_loss": -25.275846481323242, "global_step": 307914, "epoch": 3709} {"train_loss": -25.520856857299805, "global_step": 307915, "epoch": 3709} {"train_loss": -25.58429527282715, "global_step": 307916, "epoch": 3709} {"train_loss": -25.890228271484375, "global_step": 307917, "epoch": 3709} {"train_loss": -25.653778076171875, "global_step": 307918, "epoch": 3709} {"train_loss": -25.50703239440918, "global_step": 307919, "epoch": 3709} {"train_loss": -25.683202743530273, "global_step": 307920, "epoch": 3709} {"train_loss": -25.4139347076416, "global_step": 307921, "epoch": 3709} {"train_loss": -25.30976104736328, "global_step": 307922, "epoch": 3709} {"train_loss": -25.662860870361328, "global_step": 307923, "epoch": 3709} {"train_loss": -25.63954734802246, "global_step": 307924, "epoch": 3709} {"train_loss": -25.11875343322754, "global_step": 307925, "epoch": 3709} {"train_loss": -25.67725944519043, "global_step": 307926, "epoch": 3709} {"train_loss": -25.70892333984375, "global_step": 307927, "epoch": 3709} {"train_loss": -25.9068603515625, "global_step": 307928, "epoch": 3709} {"train_loss": -25.58613011923181, "global_step": 307929, "epoch": 3709, "val_loss": 7231914.0} {"train_loss": -25.165895462036133, "global_step": 307930, "epoch": 3710} {"train_loss": -25.544052124023438, "global_step": 307931, "epoch": 3710} {"train_loss": -25.23726463317871, "global_step": 307932, "epoch": 3710} {"train_loss": -25.14934730529785, "global_step": 307933, "epoch": 3710} {"train_loss": -25.305654525756836, "global_step": 307934, "epoch": 3710} {"train_loss": -25.404470443725586, "global_step": 307935, "epoch": 3710} {"train_loss": -25.30817985534668, "global_step": 307936, "epoch": 3710} {"train_loss": -25.927661895751953, "global_step": 307937, "epoch": 3710} {"train_loss": -25.11134147644043, "global_step": 307938, "epoch": 3710} {"train_loss": -25.81199073791504, "global_step": 307939, "epoch": 3710} {"train_loss": -25.59976577758789, "global_step": 307940, "epoch": 3710} {"train_loss": -25.506250381469727, "global_step": 307941, "epoch": 3710} {"train_loss": -25.300878524780273, "global_step": 307942, "epoch": 3710} {"train_loss": -25.242069244384766, "global_step": 307943, "epoch": 3710} {"train_loss": -25.6046142578125, "global_step": 307944, "epoch": 3710} {"train_loss": -25.200931549072266, "global_step": 307945, "epoch": 3710} {"train_loss": -25.716482162475586, "global_step": 307946, "epoch": 3710} {"train_loss": -25.7142391204834, "global_step": 307947, "epoch": 3710} {"train_loss": -25.573001861572266, "global_step": 307948, "epoch": 3710} {"train_loss": -25.857004165649414, "global_step": 307949, "epoch": 3710} {"train_loss": -25.609344482421875, "global_step": 307950, "epoch": 3710} {"train_loss": -25.390594482421875, "global_step": 307951, "epoch": 3710} {"train_loss": -25.73665428161621, "global_step": 307952, "epoch": 3710} {"train_loss": -25.789722442626953, "global_step": 307953, "epoch": 3710} {"train_loss": -25.629587173461914, "global_step": 307954, "epoch": 3710} {"train_loss": -25.486373901367188, "global_step": 307955, "epoch": 3710} {"train_loss": -25.59671401977539, "global_step": 307956, "epoch": 3710} {"train_loss": -25.647184371948242, "global_step": 307957, "epoch": 3710} {"train_loss": -25.429176330566406, "global_step": 307958, "epoch": 3710} {"train_loss": -25.644994735717773, "global_step": 307959, "epoch": 3710} {"train_loss": -25.389331817626953, "global_step": 307960, "epoch": 3710} {"train_loss": -25.464250564575195, "global_step": 307961, "epoch": 3710} {"train_loss": -25.603422164916992, "global_step": 307962, "epoch": 3710} {"train_loss": -25.46405601501465, "global_step": 307963, "epoch": 3710} {"train_loss": -25.507326126098633, "global_step": 307964, "epoch": 3710} {"train_loss": -25.634815216064453, "global_step": 307965, "epoch": 3710} {"train_loss": -25.523662567138672, "global_step": 307966, "epoch": 3710} {"train_loss": -25.638471603393555, "global_step": 307967, "epoch": 3710} {"train_loss": -25.667098999023438, "global_step": 307968, "epoch": 3710} {"train_loss": -25.48187255859375, "global_step": 307969, "epoch": 3710} {"train_loss": -25.668210983276367, "global_step": 307970, "epoch": 3710} {"train_loss": -25.893707275390625, "global_step": 307971, "epoch": 3710} {"train_loss": -25.690473556518555, "global_step": 307972, "epoch": 3710} {"train_loss": -25.69314956665039, "global_step": 307973, "epoch": 3710} {"train_loss": -25.36756706237793, "global_step": 307974, "epoch": 3710} {"train_loss": -25.561941146850586, "global_step": 307975, "epoch": 3710} {"train_loss": -25.38187599182129, "global_step": 307976, "epoch": 3710} {"train_loss": -25.88083839416504, "global_step": 307977, "epoch": 3710} {"train_loss": -25.898223876953125, "global_step": 307978, "epoch": 3710} {"train_loss": -25.8127498626709, "global_step": 307979, "epoch": 3710} {"train_loss": -26.1664981842041, "global_step": 307980, "epoch": 3710} {"train_loss": -25.916229248046875, "global_step": 307981, "epoch": 3710} {"train_loss": -25.792768478393555, "global_step": 307982, "epoch": 3710} {"train_loss": -25.269805908203125, "global_step": 307983, "epoch": 3710} {"train_loss": -25.499347686767578, "global_step": 307984, "epoch": 3710} {"train_loss": -25.61106300354004, "global_step": 307985, "epoch": 3710} {"train_loss": -25.74384117126465, "global_step": 307986, "epoch": 3710} {"train_loss": -24.942245483398438, "global_step": 307987, "epoch": 3710} {"train_loss": -25.635211944580078, "global_step": 307988, "epoch": 3710} {"train_loss": -25.36335563659668, "global_step": 307989, "epoch": 3710} {"train_loss": -25.327682495117188, "global_step": 307990, "epoch": 3710} {"train_loss": -25.528345108032227, "global_step": 307991, "epoch": 3710} {"train_loss": -25.613378524780273, "global_step": 307992, "epoch": 3710} {"train_loss": -25.51721954345703, "global_step": 307993, "epoch": 3710} {"train_loss": -25.960498809814453, "global_step": 307994, "epoch": 3710} {"train_loss": -25.33854866027832, "global_step": 307995, "epoch": 3710} {"train_loss": -25.930856704711914, "global_step": 307996, "epoch": 3710} {"train_loss": -25.248809814453125, "global_step": 307997, "epoch": 3710} {"train_loss": -25.743322372436523, "global_step": 307998, "epoch": 3710} {"train_loss": -25.906951904296875, "global_step": 307999, "epoch": 3710} {"train_loss": -25.91069984436035, "global_step": 308000, "epoch": 3710} {"train_loss": -25.746530532836914, "global_step": 308001, "epoch": 3710} {"train_loss": -25.55525016784668, "global_step": 308002, "epoch": 3710} {"train_loss": -25.60601806640625, "global_step": 308003, "epoch": 3710} {"train_loss": -25.65081787109375, "global_step": 308004, "epoch": 3710} {"train_loss": -25.919645309448242, "global_step": 308005, "epoch": 3710} {"train_loss": -25.958423614501953, "global_step": 308006, "epoch": 3710} {"train_loss": -25.749042510986328, "global_step": 308007, "epoch": 3710} {"train_loss": -25.86722755432129, "global_step": 308008, "epoch": 3710} {"train_loss": -26.05411148071289, "global_step": 308009, "epoch": 3710} {"train_loss": -25.888992309570312, "global_step": 308010, "epoch": 3710} {"train_loss": -25.743711471557617, "global_step": 308011, "epoch": 3710} {"train_loss": -25.60225100689624, "global_step": 308012, "epoch": 3710, "val_loss": 7214920.0} {"train_loss": -25.70814323425293, "global_step": 308013, "epoch": 3711} {"train_loss": -24.957176208496094, "global_step": 308014, "epoch": 3711} {"train_loss": -25.312597274780273, "global_step": 308015, "epoch": 3711} {"train_loss": -25.564889907836914, "global_step": 308016, "epoch": 3711} {"train_loss": -25.474687576293945, "global_step": 308017, "epoch": 3711} {"train_loss": -25.446626663208008, "global_step": 308018, "epoch": 3711} {"train_loss": -25.831710815429688, "global_step": 308019, "epoch": 3711} {"train_loss": -25.43160057067871, "global_step": 308020, "epoch": 3711} {"train_loss": -25.407363891601562, "global_step": 308021, "epoch": 3711} {"train_loss": -25.30841064453125, "global_step": 308022, "epoch": 3711} {"train_loss": -25.35470962524414, "global_step": 308023, "epoch": 3711} {"train_loss": -25.43546485900879, "global_step": 308024, "epoch": 3711} {"train_loss": -25.479177474975586, "global_step": 308025, "epoch": 3711} {"train_loss": -25.70790672302246, "global_step": 308026, "epoch": 3711} {"train_loss": -25.408214569091797, "global_step": 308027, "epoch": 3711} {"train_loss": -25.62909507751465, "global_step": 308028, "epoch": 3711} {"train_loss": -25.817188262939453, "global_step": 308029, "epoch": 3711} {"train_loss": -25.730060577392578, "global_step": 308030, "epoch": 3711} {"train_loss": -25.905317306518555, "global_step": 308031, "epoch": 3711} {"train_loss": -25.596845626831055, "global_step": 308032, "epoch": 3711} {"train_loss": -25.95185661315918, "global_step": 308033, "epoch": 3711} {"train_loss": -25.55986785888672, "global_step": 308034, "epoch": 3711} {"train_loss": -25.653797149658203, "global_step": 308035, "epoch": 3711} {"train_loss": -26.025318145751953, "global_step": 308036, "epoch": 3711} {"train_loss": -26.017990112304688, "global_step": 308037, "epoch": 3711} {"train_loss": -25.446645736694336, "global_step": 308038, "epoch": 3711} {"train_loss": -25.75922203063965, "global_step": 308039, "epoch": 3711} {"train_loss": -25.98353385925293, "global_step": 308040, "epoch": 3711} {"train_loss": -25.839996337890625, "global_step": 308041, "epoch": 3711} {"train_loss": -25.866422653198242, "global_step": 308042, "epoch": 3711} {"train_loss": -26.199926376342773, "global_step": 308043, "epoch": 3711} {"train_loss": -25.50464630126953, "global_step": 308044, "epoch": 3711} {"train_loss": -25.098438262939453, "global_step": 308045, "epoch": 3711} {"train_loss": -25.888696670532227, "global_step": 308046, "epoch": 3711} {"train_loss": -26.20366859436035, "global_step": 308047, "epoch": 3711} {"train_loss": -25.32249641418457, "global_step": 308048, "epoch": 3711} {"train_loss": -25.691089630126953, "global_step": 308049, "epoch": 3711} {"train_loss": -25.60824966430664, "global_step": 308050, "epoch": 3711} {"train_loss": -25.64084815979004, "global_step": 308051, "epoch": 3711} {"train_loss": -25.666309356689453, "global_step": 308052, "epoch": 3711} {"train_loss": -25.456418991088867, "global_step": 308053, "epoch": 3711} {"train_loss": -25.444915771484375, "global_step": 308054, "epoch": 3711} {"train_loss": -25.755521774291992, "global_step": 308055, "epoch": 3711} {"train_loss": -25.552762985229492, "global_step": 308056, "epoch": 3711} {"train_loss": -25.809158325195312, "global_step": 308057, "epoch": 3711} {"train_loss": -25.92051124572754, "global_step": 308058, "epoch": 3711} {"train_loss": -25.5438289642334, "global_step": 308059, "epoch": 3711} {"train_loss": -25.7897891998291, "global_step": 308060, "epoch": 3711} {"train_loss": -26.11248779296875, "global_step": 308061, "epoch": 3711} {"train_loss": -25.394264221191406, "global_step": 308062, "epoch": 3711} {"train_loss": -25.696338653564453, "global_step": 308063, "epoch": 3711} {"train_loss": -26.440702438354492, "global_step": 308064, "epoch": 3711} {"train_loss": -25.797317504882812, "global_step": 308065, "epoch": 3711} {"train_loss": -25.674280166625977, "global_step": 308066, "epoch": 3711} {"train_loss": -25.76837158203125, "global_step": 308067, "epoch": 3711} {"train_loss": -25.62346839904785, "global_step": 308068, "epoch": 3711} {"train_loss": -25.410858154296875, "global_step": 308069, "epoch": 3711} {"train_loss": -25.722394943237305, "global_step": 308070, "epoch": 3711} {"train_loss": -25.86155128479004, "global_step": 308071, "epoch": 3711} {"train_loss": -26.042938232421875, "global_step": 308072, "epoch": 3711} {"train_loss": -25.818653106689453, "global_step": 308073, "epoch": 3711} {"train_loss": -25.84979248046875, "global_step": 308074, "epoch": 3711} {"train_loss": -25.765295028686523, "global_step": 308075, "epoch": 3711} {"train_loss": -25.9470272064209, "global_step": 308076, "epoch": 3711} {"train_loss": -25.837987899780273, "global_step": 308077, "epoch": 3711} {"train_loss": -25.998876571655273, "global_step": 308078, "epoch": 3711} {"train_loss": -25.730377197265625, "global_step": 308079, "epoch": 3711} {"train_loss": -25.69947624206543, "global_step": 308080, "epoch": 3711} {"train_loss": -25.858173370361328, "global_step": 308081, "epoch": 3711} {"train_loss": -25.72577476501465, "global_step": 308082, "epoch": 3711} {"train_loss": -25.629718780517578, "global_step": 308083, "epoch": 3711} {"train_loss": -25.876535415649414, "global_step": 308084, "epoch": 3711} {"train_loss": -26.00787353515625, "global_step": 308085, "epoch": 3711} {"train_loss": -25.90559196472168, "global_step": 308086, "epoch": 3711} {"train_loss": -26.11774253845215, "global_step": 308087, "epoch": 3711} {"train_loss": -25.668338775634766, "global_step": 308088, "epoch": 3711} {"train_loss": -25.9024600982666, "global_step": 308089, "epoch": 3711} {"train_loss": -25.83038330078125, "global_step": 308090, "epoch": 3711} {"train_loss": -25.983036041259766, "global_step": 308091, "epoch": 3711} {"train_loss": -25.911609649658203, "global_step": 308092, "epoch": 3711} {"train_loss": -25.967803955078125, "global_step": 308093, "epoch": 3711} {"train_loss": -25.707128524780273, "global_step": 308094, "epoch": 3711} {"train_loss": -25.727014127984106, "global_step": 308095, "epoch": 3711, "val_loss": 7264355.0} {"train_loss": -25.364652633666992, "global_step": 308096, "epoch": 3712} {"train_loss": -24.9543514251709, "global_step": 308097, "epoch": 3712} {"train_loss": -24.651010513305664, "global_step": 308098, "epoch": 3712} {"train_loss": -25.171483993530273, "global_step": 308099, "epoch": 3712} {"train_loss": -25.013946533203125, "global_step": 308100, "epoch": 3712} {"train_loss": -25.19868278503418, "global_step": 308101, "epoch": 3712} {"train_loss": -25.6761417388916, "global_step": 308102, "epoch": 3712} {"train_loss": -25.108539581298828, "global_step": 308103, "epoch": 3712} {"train_loss": -25.536046981811523, "global_step": 308104, "epoch": 3712} {"train_loss": -25.47173309326172, "global_step": 308105, "epoch": 3712} {"train_loss": -25.057476043701172, "global_step": 308106, "epoch": 3712} {"train_loss": -25.246076583862305, "global_step": 308107, "epoch": 3712} {"train_loss": -25.47479248046875, "global_step": 308108, "epoch": 3712} {"train_loss": -25.7779541015625, "global_step": 308109, "epoch": 3712} {"train_loss": -25.12263298034668, "global_step": 308110, "epoch": 3712} {"train_loss": -25.623626708984375, "global_step": 308111, "epoch": 3712} {"train_loss": -25.644947052001953, "global_step": 308112, "epoch": 3712} {"train_loss": -25.4304256439209, "global_step": 308113, "epoch": 3712} {"train_loss": -25.80951499938965, "global_step": 308114, "epoch": 3712} {"train_loss": -25.870532989501953, "global_step": 308115, "epoch": 3712} {"train_loss": -25.522802352905273, "global_step": 308116, "epoch": 3712} {"train_loss": -25.381824493408203, "global_step": 308117, "epoch": 3712} {"train_loss": -25.78257179260254, "global_step": 308118, "epoch": 3712} {"train_loss": -26.056228637695312, "global_step": 308119, "epoch": 3712} {"train_loss": -25.491239547729492, "global_step": 308120, "epoch": 3712} {"train_loss": -25.617807388305664, "global_step": 308121, "epoch": 3712} {"train_loss": -25.780248641967773, "global_step": 308122, "epoch": 3712} {"train_loss": -25.375455856323242, "global_step": 308123, "epoch": 3712} {"train_loss": -25.394468307495117, "global_step": 308124, "epoch": 3712} {"train_loss": -25.603912353515625, "global_step": 308125, "epoch": 3712} {"train_loss": -25.79974365234375, "global_step": 308126, "epoch": 3712} {"train_loss": -25.557266235351562, "global_step": 308127, "epoch": 3712} {"train_loss": -25.59391212463379, "global_step": 308128, "epoch": 3712} {"train_loss": -25.944019317626953, "global_step": 308129, "epoch": 3712} {"train_loss": -25.678247451782227, "global_step": 308130, "epoch": 3712} {"train_loss": -26.029159545898438, "global_step": 308131, "epoch": 3712} {"train_loss": -25.970264434814453, "global_step": 308132, "epoch": 3712} {"train_loss": -25.88227653503418, "global_step": 308133, "epoch": 3712} {"train_loss": -26.03455924987793, "global_step": 308134, "epoch": 3712} {"train_loss": -25.889301300048828, "global_step": 308135, "epoch": 3712} {"train_loss": -25.702930450439453, "global_step": 308136, "epoch": 3712} {"train_loss": -25.18779945373535, "global_step": 308137, "epoch": 3712} {"train_loss": -25.947900772094727, "global_step": 308138, "epoch": 3712} {"train_loss": -25.90007972717285, "global_step": 308139, "epoch": 3712} {"train_loss": -26.194232940673828, "global_step": 308140, "epoch": 3712} {"train_loss": -25.8087215423584, "global_step": 308141, "epoch": 3712} {"train_loss": -25.345867156982422, "global_step": 308142, "epoch": 3712} {"train_loss": -25.99379539489746, "global_step": 308143, "epoch": 3712} {"train_loss": -25.36820411682129, "global_step": 308144, "epoch": 3712} {"train_loss": -25.603809356689453, "global_step": 308145, "epoch": 3712} {"train_loss": -25.876880645751953, "global_step": 308146, "epoch": 3712} {"train_loss": -25.407190322875977, "global_step": 308147, "epoch": 3712} {"train_loss": -25.913549423217773, "global_step": 308148, "epoch": 3712} {"train_loss": -25.360767364501953, "global_step": 308149, "epoch": 3712} {"train_loss": -24.92833709716797, "global_step": 308150, "epoch": 3712} {"train_loss": -25.275625228881836, "global_step": 308151, "epoch": 3712} {"train_loss": -25.811986923217773, "global_step": 308152, "epoch": 3712} {"train_loss": -25.468595504760742, "global_step": 308153, "epoch": 3712} {"train_loss": -25.716089248657227, "global_step": 308154, "epoch": 3712} {"train_loss": -25.358476638793945, "global_step": 308155, "epoch": 3712} {"train_loss": -25.682043075561523, "global_step": 308156, "epoch": 3712} {"train_loss": -25.101972579956055, "global_step": 308157, "epoch": 3712} {"train_loss": -25.263513565063477, "global_step": 308158, "epoch": 3712} {"train_loss": -25.360937118530273, "global_step": 308159, "epoch": 3712} {"train_loss": -25.446958541870117, "global_step": 308160, "epoch": 3712} {"train_loss": -25.388694763183594, "global_step": 308161, "epoch": 3712} {"train_loss": -25.59800148010254, "global_step": 308162, "epoch": 3712} {"train_loss": -25.36896324157715, "global_step": 308163, "epoch": 3712} {"train_loss": -25.475234985351562, "global_step": 308164, "epoch": 3712} {"train_loss": -25.932397842407227, "global_step": 308165, "epoch": 3712} {"train_loss": -25.705463409423828, "global_step": 308166, "epoch": 3712} {"train_loss": -25.998580932617188, "global_step": 308167, "epoch": 3712} {"train_loss": -25.809675216674805, "global_step": 308168, "epoch": 3712} {"train_loss": -26.09577751159668, "global_step": 308169, "epoch": 3712} {"train_loss": -25.568124771118164, "global_step": 308170, "epoch": 3712} {"train_loss": -26.051191329956055, "global_step": 308171, "epoch": 3712} {"train_loss": -25.77850341796875, "global_step": 308172, "epoch": 3712} {"train_loss": -25.789844512939453, "global_step": 308173, "epoch": 3712} {"train_loss": -25.58962631225586, "global_step": 308174, "epoch": 3712} {"train_loss": -25.882192611694336, "global_step": 308175, "epoch": 3712} {"train_loss": -26.032794952392578, "global_step": 308176, "epoch": 3712} {"train_loss": -26.04840087890625, "global_step": 308177, "epoch": 3712} {"train_loss": -25.60820715111422, "global_step": 308178, "epoch": 3712, "val_loss": 7227619.0} {"train_loss": -25.35469627380371, "global_step": 308179, "epoch": 3713} {"train_loss": -25.18963050842285, "global_step": 308180, "epoch": 3713} {"train_loss": -25.134546279907227, "global_step": 308181, "epoch": 3713} {"train_loss": -25.30735206604004, "global_step": 308182, "epoch": 3713} {"train_loss": -25.235448837280273, "global_step": 308183, "epoch": 3713} {"train_loss": -25.04019546508789, "global_step": 308184, "epoch": 3713} {"train_loss": -25.320161819458008, "global_step": 308185, "epoch": 3713} {"train_loss": -25.878759384155273, "global_step": 308186, "epoch": 3713} {"train_loss": -25.537458419799805, "global_step": 308187, "epoch": 3713} {"train_loss": -25.321462631225586, "global_step": 308188, "epoch": 3713} {"train_loss": -25.546003341674805, "global_step": 308189, "epoch": 3713} {"train_loss": -25.21599006652832, "global_step": 308190, "epoch": 3713} {"train_loss": -25.23434066772461, "global_step": 308191, "epoch": 3713} {"train_loss": -25.763837814331055, "global_step": 308192, "epoch": 3713} {"train_loss": -25.80463981628418, "global_step": 308193, "epoch": 3713} {"train_loss": -25.228431701660156, "global_step": 308194, "epoch": 3713} {"train_loss": -25.45252799987793, "global_step": 308195, "epoch": 3713} {"train_loss": -25.632099151611328, "global_step": 308196, "epoch": 3713} {"train_loss": -25.5750789642334, "global_step": 308197, "epoch": 3713} {"train_loss": -25.526769638061523, "global_step": 308198, "epoch": 3713} {"train_loss": -25.77044677734375, "global_step": 308199, "epoch": 3713} {"train_loss": -25.70773696899414, "global_step": 308200, "epoch": 3713} {"train_loss": -25.797117233276367, "global_step": 308201, "epoch": 3713} {"train_loss": -25.846881866455078, "global_step": 308202, "epoch": 3713} {"train_loss": -25.80079460144043, "global_step": 308203, "epoch": 3713} {"train_loss": -25.73807716369629, "global_step": 308204, "epoch": 3713} {"train_loss": -25.641712188720703, "global_step": 308205, "epoch": 3713} {"train_loss": -26.387781143188477, "global_step": 308206, "epoch": 3713} {"train_loss": -26.106069564819336, "global_step": 308207, "epoch": 3713} {"train_loss": -25.566511154174805, "global_step": 308208, "epoch": 3713} {"train_loss": -25.735998153686523, "global_step": 308209, "epoch": 3713} {"train_loss": -25.981725692749023, "global_step": 308210, "epoch": 3713} {"train_loss": -25.63718032836914, "global_step": 308211, "epoch": 3713} {"train_loss": -25.909475326538086, "global_step": 308212, "epoch": 3713} {"train_loss": -25.625640869140625, "global_step": 308213, "epoch": 3713} {"train_loss": -25.846288681030273, "global_step": 308214, "epoch": 3713} {"train_loss": -25.830942153930664, "global_step": 308215, "epoch": 3713} {"train_loss": -26.216400146484375, "global_step": 308216, "epoch": 3713} {"train_loss": -25.320524215698242, "global_step": 308217, "epoch": 3713} {"train_loss": -25.86859130859375, "global_step": 308218, "epoch": 3713} {"train_loss": -25.759626388549805, "global_step": 308219, "epoch": 3713} {"train_loss": -26.243488311767578, "global_step": 308220, "epoch": 3713} {"train_loss": -25.545015335083008, "global_step": 308221, "epoch": 3713} {"train_loss": -26.01972007751465, "global_step": 308222, "epoch": 3713} {"train_loss": -26.078245162963867, "global_step": 308223, "epoch": 3713} {"train_loss": -26.05341911315918, "global_step": 308224, "epoch": 3713} {"train_loss": -25.605005264282227, "global_step": 308225, "epoch": 3713} {"train_loss": -25.807575225830078, "global_step": 308226, "epoch": 3713} {"train_loss": -25.75660514831543, "global_step": 308227, "epoch": 3713} {"train_loss": -25.622095108032227, "global_step": 308228, "epoch": 3713} {"train_loss": -25.507389068603516, "global_step": 308229, "epoch": 3713} {"train_loss": -25.23134422302246, "global_step": 308230, "epoch": 3713} {"train_loss": -25.63936424255371, "global_step": 308231, "epoch": 3713} {"train_loss": -25.88663673400879, "global_step": 308232, "epoch": 3713} {"train_loss": -25.64227867126465, "global_step": 308233, "epoch": 3713} {"train_loss": -25.859724044799805, "global_step": 308234, "epoch": 3713} {"train_loss": -26.136754989624023, "global_step": 308235, "epoch": 3713} {"train_loss": -25.73514175415039, "global_step": 308236, "epoch": 3713} {"train_loss": -25.65652847290039, "global_step": 308237, "epoch": 3713} {"train_loss": -25.466087341308594, "global_step": 308238, "epoch": 3713} {"train_loss": -25.685766220092773, "global_step": 308239, "epoch": 3713} {"train_loss": -25.71026039123535, "global_step": 308240, "epoch": 3713} {"train_loss": -25.589521408081055, "global_step": 308241, "epoch": 3713} {"train_loss": -25.65437126159668, "global_step": 308242, "epoch": 3713} {"train_loss": -26.003589630126953, "global_step": 308243, "epoch": 3713} {"train_loss": -25.705520629882812, "global_step": 308244, "epoch": 3713} {"train_loss": -25.226694107055664, "global_step": 308245, "epoch": 3713} {"train_loss": -25.941335678100586, "global_step": 308246, "epoch": 3713} {"train_loss": -25.349355697631836, "global_step": 308247, "epoch": 3713} {"train_loss": -25.710718154907227, "global_step": 308248, "epoch": 3713} {"train_loss": -25.729089736938477, "global_step": 308249, "epoch": 3713} {"train_loss": -25.62702751159668, "global_step": 308250, "epoch": 3713} {"train_loss": -25.417577743530273, "global_step": 308251, "epoch": 3713} {"train_loss": -25.5911922454834, "global_step": 308252, "epoch": 3713} {"train_loss": -25.97944450378418, "global_step": 308253, "epoch": 3713} {"train_loss": -25.620569229125977, "global_step": 308254, "epoch": 3713} {"train_loss": -25.588857650756836, "global_step": 308255, "epoch": 3713} {"train_loss": -25.31894302368164, "global_step": 308256, "epoch": 3713} {"train_loss": -26.01656150817871, "global_step": 308257, "epoch": 3713} {"train_loss": -25.788320541381836, "global_step": 308258, "epoch": 3713} {"train_loss": -25.494802474975586, "global_step": 308259, "epoch": 3713} {"train_loss": -25.41855812072754, "global_step": 308260, "epoch": 3713} {"train_loss": -25.65580494432564, "global_step": 308261, "epoch": 3713, "val_loss": 7149951.0} {"train_loss": -24.929357528686523, "global_step": 308262, "epoch": 3714} {"train_loss": -25.465314865112305, "global_step": 308263, "epoch": 3714} {"train_loss": -24.83249855041504, "global_step": 308264, "epoch": 3714} {"train_loss": -25.156339645385742, "global_step": 308265, "epoch": 3714} {"train_loss": -25.397687911987305, "global_step": 308266, "epoch": 3714} {"train_loss": -25.27096939086914, "global_step": 308267, "epoch": 3714} {"train_loss": -25.544525146484375, "global_step": 308268, "epoch": 3714} {"train_loss": -25.095911026000977, "global_step": 308269, "epoch": 3714} {"train_loss": -24.95884132385254, "global_step": 308270, "epoch": 3714} {"train_loss": -25.120563507080078, "global_step": 308271, "epoch": 3714} {"train_loss": -25.726606369018555, "global_step": 308272, "epoch": 3714} {"train_loss": -25.718917846679688, "global_step": 308273, "epoch": 3714} {"train_loss": -25.6153621673584, "global_step": 308274, "epoch": 3714} {"train_loss": -25.280141830444336, "global_step": 308275, "epoch": 3714} {"train_loss": -25.79633903503418, "global_step": 308276, "epoch": 3714} {"train_loss": -25.58778190612793, "global_step": 308277, "epoch": 3714} {"train_loss": -25.270591735839844, "global_step": 308278, "epoch": 3714} {"train_loss": -25.544065475463867, "global_step": 308279, "epoch": 3714} {"train_loss": -25.676023483276367, "global_step": 308280, "epoch": 3714} {"train_loss": -25.342504501342773, "global_step": 308281, "epoch": 3714} {"train_loss": -25.818439483642578, "global_step": 308282, "epoch": 3714} {"train_loss": -25.85590934753418, "global_step": 308283, "epoch": 3714} {"train_loss": -25.445714950561523, "global_step": 308284, "epoch": 3714} {"train_loss": -25.807785034179688, "global_step": 308285, "epoch": 3714} {"train_loss": -25.751312255859375, "global_step": 308286, "epoch": 3714} {"train_loss": -25.788854598999023, "global_step": 308287, "epoch": 3714} {"train_loss": -25.685087203979492, "global_step": 308288, "epoch": 3714} {"train_loss": -25.57406997680664, "global_step": 308289, "epoch": 3714} {"train_loss": -25.539091110229492, "global_step": 308290, "epoch": 3714} {"train_loss": -25.546133041381836, "global_step": 308291, "epoch": 3714} {"train_loss": -25.375959396362305, "global_step": 308292, "epoch": 3714} {"train_loss": -25.840967178344727, "global_step": 308293, "epoch": 3714} {"train_loss": -25.761707305908203, "global_step": 308294, "epoch": 3714} {"train_loss": -25.866947174072266, "global_step": 308295, "epoch": 3714} {"train_loss": -26.146808624267578, "global_step": 308296, "epoch": 3714} {"train_loss": -26.331247329711914, "global_step": 308297, "epoch": 3714} {"train_loss": -25.867658615112305, "global_step": 308298, "epoch": 3714} {"train_loss": -25.89893913269043, "global_step": 308299, "epoch": 3714} {"train_loss": -25.792865753173828, "global_step": 308300, "epoch": 3714} {"train_loss": -25.61138343811035, "global_step": 308301, "epoch": 3714} {"train_loss": -25.722564697265625, "global_step": 308302, "epoch": 3714} {"train_loss": -25.8160400390625, "global_step": 308303, "epoch": 3714} {"train_loss": -26.06623649597168, "global_step": 308304, "epoch": 3714} {"train_loss": -25.747547149658203, "global_step": 308305, "epoch": 3714} {"train_loss": -25.56098747253418, "global_step": 308306, "epoch": 3714} {"train_loss": -25.78780174255371, "global_step": 308307, "epoch": 3714} {"train_loss": -25.844968795776367, "global_step": 308308, "epoch": 3714} {"train_loss": -25.48721694946289, "global_step": 308309, "epoch": 3714} {"train_loss": -25.803918838500977, "global_step": 308310, "epoch": 3714} {"train_loss": -25.437026977539062, "global_step": 308311, "epoch": 3714} {"train_loss": -25.57517433166504, "global_step": 308312, "epoch": 3714} {"train_loss": -25.844806671142578, "global_step": 308313, "epoch": 3714} {"train_loss": -25.782602310180664, "global_step": 308314, "epoch": 3714} {"train_loss": -25.58401107788086, "global_step": 308315, "epoch": 3714} {"train_loss": -25.70379066467285, "global_step": 308316, "epoch": 3714} {"train_loss": -25.7371768951416, "global_step": 308317, "epoch": 3714} {"train_loss": -25.77048683166504, "global_step": 308318, "epoch": 3714} {"train_loss": -25.883813858032227, "global_step": 308319, "epoch": 3714} {"train_loss": -25.688098907470703, "global_step": 308320, "epoch": 3714} {"train_loss": -25.65744400024414, "global_step": 308321, "epoch": 3714} {"train_loss": -25.555509567260742, "global_step": 308322, "epoch": 3714} {"train_loss": -25.835962295532227, "global_step": 308323, "epoch": 3714} {"train_loss": -25.659992218017578, "global_step": 308324, "epoch": 3714} {"train_loss": -25.670501708984375, "global_step": 308325, "epoch": 3714} {"train_loss": -25.385648727416992, "global_step": 308326, "epoch": 3714} {"train_loss": -25.884475708007812, "global_step": 308327, "epoch": 3714} {"train_loss": -26.029813766479492, "global_step": 308328, "epoch": 3714} {"train_loss": -25.714879989624023, "global_step": 308329, "epoch": 3714} {"train_loss": -26.283044815063477, "global_step": 308330, "epoch": 3714} {"train_loss": -26.138137817382812, "global_step": 308331, "epoch": 3714} {"train_loss": -26.071369171142578, "global_step": 308332, "epoch": 3714} {"train_loss": -26.17245864868164, "global_step": 308333, "epoch": 3714} {"train_loss": -25.972797393798828, "global_step": 308334, "epoch": 3714} {"train_loss": -26.06485366821289, "global_step": 308335, "epoch": 3714} {"train_loss": -25.71974754333496, "global_step": 308336, "epoch": 3714} {"train_loss": -25.90981101989746, "global_step": 308337, "epoch": 3714} {"train_loss": -25.81650161743164, "global_step": 308338, "epoch": 3714} {"train_loss": -26.159927368164062, "global_step": 308339, "epoch": 3714} {"train_loss": -26.020828247070312, "global_step": 308340, "epoch": 3714} {"train_loss": -25.650461196899414, "global_step": 308341, "epoch": 3714} {"train_loss": -25.79868507385254, "global_step": 308342, "epoch": 3714} {"train_loss": -25.69462013244629, "global_step": 308343, "epoch": 3714} {"train_loss": -25.69965463661286, "global_step": 308344, "epoch": 3714, "val_loss": 7133908.0} {"train_loss": -25.579561233520508, "global_step": 308345, "epoch": 3715} {"train_loss": -25.36521339416504, "global_step": 308346, "epoch": 3715} {"train_loss": -25.397165298461914, "global_step": 308347, "epoch": 3715} {"train_loss": -25.491561889648438, "global_step": 308348, "epoch": 3715} {"train_loss": -25.514123916625977, "global_step": 308349, "epoch": 3715} {"train_loss": -25.600561141967773, "global_step": 308350, "epoch": 3715} {"train_loss": -25.672101974487305, "global_step": 308351, "epoch": 3715} {"train_loss": -25.390634536743164, "global_step": 308352, "epoch": 3715} {"train_loss": -25.093481063842773, "global_step": 308353, "epoch": 3715} {"train_loss": -25.615524291992188, "global_step": 308354, "epoch": 3715} {"train_loss": -25.26677894592285, "global_step": 308355, "epoch": 3715} {"train_loss": -25.465261459350586, "global_step": 308356, "epoch": 3715} {"train_loss": -25.754657745361328, "global_step": 308357, "epoch": 3715} {"train_loss": -25.525358200073242, "global_step": 308358, "epoch": 3715} {"train_loss": -25.678485870361328, "global_step": 308359, "epoch": 3715} {"train_loss": -25.5032958984375, "global_step": 308360, "epoch": 3715} {"train_loss": -25.68703269958496, "global_step": 308361, "epoch": 3715} {"train_loss": -25.707380294799805, "global_step": 308362, "epoch": 3715} {"train_loss": -25.843246459960938, "global_step": 308363, "epoch": 3715} {"train_loss": -25.8397216796875, "global_step": 308364, "epoch": 3715} {"train_loss": -25.63202476501465, "global_step": 308365, "epoch": 3715} {"train_loss": -25.51361083984375, "global_step": 308366, "epoch": 3715} {"train_loss": -25.561386108398438, "global_step": 308367, "epoch": 3715} {"train_loss": -25.821537017822266, "global_step": 308368, "epoch": 3715} {"train_loss": -25.7530460357666, "global_step": 308369, "epoch": 3715} {"train_loss": -25.784116744995117, "global_step": 308370, "epoch": 3715} {"train_loss": -25.718311309814453, "global_step": 308371, "epoch": 3715} {"train_loss": -25.268524169921875, "global_step": 308372, "epoch": 3715} {"train_loss": -26.031469345092773, "global_step": 308373, "epoch": 3715} {"train_loss": -25.782459259033203, "global_step": 308374, "epoch": 3715} {"train_loss": -25.958606719970703, "global_step": 308375, "epoch": 3715} {"train_loss": -25.920446395874023, "global_step": 308376, "epoch": 3715} {"train_loss": -26.035200119018555, "global_step": 308377, "epoch": 3715} {"train_loss": -25.943012237548828, "global_step": 308378, "epoch": 3715} {"train_loss": -25.485702514648438, "global_step": 308379, "epoch": 3715} {"train_loss": -25.83426856994629, "global_step": 308380, "epoch": 3715} {"train_loss": -25.58038330078125, "global_step": 308381, "epoch": 3715} {"train_loss": -26.16273307800293, "global_step": 308382, "epoch": 3715} {"train_loss": -25.72308921813965, "global_step": 308383, "epoch": 3715} {"train_loss": -26.053680419921875, "global_step": 308384, "epoch": 3715} {"train_loss": -26.046106338500977, "global_step": 308385, "epoch": 3715} {"train_loss": -25.648941040039062, "global_step": 308386, "epoch": 3715} {"train_loss": -25.94954490661621, "global_step": 308387, "epoch": 3715} {"train_loss": -25.835025787353516, "global_step": 308388, "epoch": 3715} {"train_loss": -26.017126083374023, "global_step": 308389, "epoch": 3715} {"train_loss": -25.945371627807617, "global_step": 308390, "epoch": 3715} {"train_loss": -25.67095375061035, "global_step": 308391, "epoch": 3715} {"train_loss": -25.636367797851562, "global_step": 308392, "epoch": 3715} {"train_loss": -25.738128662109375, "global_step": 308393, "epoch": 3715} {"train_loss": -25.5438232421875, "global_step": 308394, "epoch": 3715} {"train_loss": -25.85822105407715, "global_step": 308395, "epoch": 3715} {"train_loss": -25.662689208984375, "global_step": 308396, "epoch": 3715} {"train_loss": -25.281448364257812, "global_step": 308397, "epoch": 3715} {"train_loss": -25.83880043029785, "global_step": 308398, "epoch": 3715} {"train_loss": -25.676441192626953, "global_step": 308399, "epoch": 3715} {"train_loss": -25.5322322845459, "global_step": 308400, "epoch": 3715} {"train_loss": -24.964689254760742, "global_step": 308401, "epoch": 3715} {"train_loss": -25.56036949157715, "global_step": 308402, "epoch": 3715} {"train_loss": -25.870990753173828, "global_step": 308403, "epoch": 3715} {"train_loss": -25.484619140625, "global_step": 308404, "epoch": 3715} {"train_loss": -25.66061782836914, "global_step": 308405, "epoch": 3715} {"train_loss": -25.38041114807129, "global_step": 308406, "epoch": 3715} {"train_loss": -25.564023971557617, "global_step": 308407, "epoch": 3715} {"train_loss": -25.72333335876465, "global_step": 308408, "epoch": 3715} {"train_loss": -25.559425354003906, "global_step": 308409, "epoch": 3715} {"train_loss": -25.72393798828125, "global_step": 308410, "epoch": 3715} {"train_loss": -25.70252799987793, "global_step": 308411, "epoch": 3715} {"train_loss": -25.44849967956543, "global_step": 308412, "epoch": 3715} {"train_loss": -25.96113395690918, "global_step": 308413, "epoch": 3715} {"train_loss": -25.63215446472168, "global_step": 308414, "epoch": 3715} {"train_loss": -25.85468101501465, "global_step": 308415, "epoch": 3715} {"train_loss": -25.899282455444336, "global_step": 308416, "epoch": 3715} {"train_loss": -25.775344848632812, "global_step": 308417, "epoch": 3715} {"train_loss": -25.787031173706055, "global_step": 308418, "epoch": 3715} {"train_loss": -26.177642822265625, "global_step": 308419, "epoch": 3715} {"train_loss": -26.06768798828125, "global_step": 308420, "epoch": 3715} {"train_loss": -25.840356826782227, "global_step": 308421, "epoch": 3715} {"train_loss": -25.893634796142578, "global_step": 308422, "epoch": 3715} {"train_loss": -25.831195831298828, "global_step": 308423, "epoch": 3715} {"train_loss": -26.507383346557617, "global_step": 308424, "epoch": 3715} {"train_loss": -25.959552764892578, "global_step": 308425, "epoch": 3715} {"train_loss": -25.885583877563477, "global_step": 308426, "epoch": 3715} {"train_loss": -25.696343272565358, "global_step": 308427, "epoch": 3715, "val_loss": 7201090.0} {"train_loss": -24.383031845092773, "global_step": 308428, "epoch": 3716} {"train_loss": -24.136520385742188, "global_step": 308429, "epoch": 3716} {"train_loss": -24.656566619873047, "global_step": 308430, "epoch": 3716} {"train_loss": -25.64565086364746, "global_step": 308431, "epoch": 3716} {"train_loss": -24.915443420410156, "global_step": 308432, "epoch": 3716} {"train_loss": -24.99372673034668, "global_step": 308433, "epoch": 3716} {"train_loss": -25.350126266479492, "global_step": 308434, "epoch": 3716} {"train_loss": -25.16120719909668, "global_step": 308435, "epoch": 3716} {"train_loss": -25.07495880126953, "global_step": 308436, "epoch": 3716} {"train_loss": -25.17323112487793, "global_step": 308437, "epoch": 3716} {"train_loss": -25.21177864074707, "global_step": 308438, "epoch": 3716} {"train_loss": -24.9180965423584, "global_step": 308439, "epoch": 3716} {"train_loss": -25.613632202148438, "global_step": 308440, "epoch": 3716} {"train_loss": -25.160846710205078, "global_step": 308441, "epoch": 3716} {"train_loss": -25.934362411499023, "global_step": 308442, "epoch": 3716} {"train_loss": -25.683456420898438, "global_step": 308443, "epoch": 3716} {"train_loss": -25.513580322265625, "global_step": 308444, "epoch": 3716} {"train_loss": -25.511762619018555, "global_step": 308445, "epoch": 3716} {"train_loss": -25.644811630249023, "global_step": 308446, "epoch": 3716} {"train_loss": -25.597705841064453, "global_step": 308447, "epoch": 3716} {"train_loss": -25.42875099182129, "global_step": 308448, "epoch": 3716} {"train_loss": -25.603605270385742, "global_step": 308449, "epoch": 3716} {"train_loss": -25.524738311767578, "global_step": 308450, "epoch": 3716} {"train_loss": -25.367328643798828, "global_step": 308451, "epoch": 3716} {"train_loss": -25.69618797302246, "global_step": 308452, "epoch": 3716} {"train_loss": -25.498580932617188, "global_step": 308453, "epoch": 3716} {"train_loss": -25.655160903930664, "global_step": 308454, "epoch": 3716} {"train_loss": -25.792102813720703, "global_step": 308455, "epoch": 3716} {"train_loss": -25.47941017150879, "global_step": 308456, "epoch": 3716} {"train_loss": -25.479841232299805, "global_step": 308457, "epoch": 3716} {"train_loss": -25.636173248291016, "global_step": 308458, "epoch": 3716} {"train_loss": -25.8586483001709, "global_step": 308459, "epoch": 3716} {"train_loss": -25.431684494018555, "global_step": 308460, "epoch": 3716} {"train_loss": -25.62183952331543, "global_step": 308461, "epoch": 3716} {"train_loss": -25.624103546142578, "global_step": 308462, "epoch": 3716} {"train_loss": -25.76388931274414, "global_step": 308463, "epoch": 3716} {"train_loss": -25.719196319580078, "global_step": 308464, "epoch": 3716} {"train_loss": -26.036344528198242, "global_step": 308465, "epoch": 3716} {"train_loss": -25.684919357299805, "global_step": 308466, "epoch": 3716} {"train_loss": -26.083114624023438, "global_step": 308467, "epoch": 3716} {"train_loss": -25.88751220703125, "global_step": 308468, "epoch": 3716} {"train_loss": -25.908151626586914, "global_step": 308469, "epoch": 3716} {"train_loss": -25.9346923828125, "global_step": 308470, "epoch": 3716} {"train_loss": -26.03938102722168, "global_step": 308471, "epoch": 3716} {"train_loss": -25.79339027404785, "global_step": 308472, "epoch": 3716} {"train_loss": -25.733869552612305, "global_step": 308473, "epoch": 3716} {"train_loss": -25.48664665222168, "global_step": 308474, "epoch": 3716} {"train_loss": -25.557233810424805, "global_step": 308475, "epoch": 3716} {"train_loss": -25.590375900268555, "global_step": 308476, "epoch": 3716} {"train_loss": -25.635236740112305, "global_step": 308477, "epoch": 3716} {"train_loss": -25.453372955322266, "global_step": 308478, "epoch": 3716} {"train_loss": -25.231273651123047, "global_step": 308479, "epoch": 3716} {"train_loss": -25.65277671813965, "global_step": 308480, "epoch": 3716} {"train_loss": -25.49176597595215, "global_step": 308481, "epoch": 3716} {"train_loss": -25.252859115600586, "global_step": 308482, "epoch": 3716} {"train_loss": -25.267560958862305, "global_step": 308483, "epoch": 3716} {"train_loss": -25.722431182861328, "global_step": 308484, "epoch": 3716} {"train_loss": -25.797285079956055, "global_step": 308485, "epoch": 3716} {"train_loss": -25.524999618530273, "global_step": 308486, "epoch": 3716} {"train_loss": -25.453710556030273, "global_step": 308487, "epoch": 3716} {"train_loss": -25.553449630737305, "global_step": 308488, "epoch": 3716} {"train_loss": -25.646085739135742, "global_step": 308489, "epoch": 3716} {"train_loss": -25.586036682128906, "global_step": 308490, "epoch": 3716} {"train_loss": -25.640283584594727, "global_step": 308491, "epoch": 3716} {"train_loss": -25.364118576049805, "global_step": 308492, "epoch": 3716} {"train_loss": -25.437095642089844, "global_step": 308493, "epoch": 3716} {"train_loss": -25.604272842407227, "global_step": 308494, "epoch": 3716} {"train_loss": -25.922119140625, "global_step": 308495, "epoch": 3716} {"train_loss": -25.529380798339844, "global_step": 308496, "epoch": 3716} {"train_loss": -25.71592140197754, "global_step": 308497, "epoch": 3716} {"train_loss": -25.935199737548828, "global_step": 308498, "epoch": 3716} {"train_loss": -25.60416603088379, "global_step": 308499, "epoch": 3716} {"train_loss": -26.09870719909668, "global_step": 308500, "epoch": 3716} {"train_loss": -25.7086181640625, "global_step": 308501, "epoch": 3716} {"train_loss": -26.000247955322266, "global_step": 308502, "epoch": 3716} {"train_loss": -25.652929306030273, "global_step": 308503, "epoch": 3716} {"train_loss": -25.785993576049805, "global_step": 308504, "epoch": 3716} {"train_loss": -25.941699981689453, "global_step": 308505, "epoch": 3716} {"train_loss": -26.00168228149414, "global_step": 308506, "epoch": 3716} {"train_loss": -25.901525497436523, "global_step": 308507, "epoch": 3716} {"train_loss": -25.9167423248291, "global_step": 308508, "epoch": 3716} {"train_loss": -26.037256240844727, "global_step": 308509, "epoch": 3716} {"train_loss": -25.57103076613093, "global_step": 308510, "epoch": 3716, "val_loss": 7262634.0} {"train_loss": -25.15083885192871, "global_step": 308511, "epoch": 3717} {"train_loss": -23.716495513916016, "global_step": 308512, "epoch": 3717} {"train_loss": -24.119840621948242, "global_step": 308513, "epoch": 3717} {"train_loss": -25.05323600769043, "global_step": 308514, "epoch": 3717} {"train_loss": -25.039052963256836, "global_step": 308515, "epoch": 3717} {"train_loss": -25.27337074279785, "global_step": 308516, "epoch": 3717} {"train_loss": -24.55575942993164, "global_step": 308517, "epoch": 3717} {"train_loss": -25.377981185913086, "global_step": 308518, "epoch": 3717} {"train_loss": -25.0264949798584, "global_step": 308519, "epoch": 3717} {"train_loss": -24.942960739135742, "global_step": 308520, "epoch": 3717} {"train_loss": -25.228008270263672, "global_step": 308521, "epoch": 3717} {"train_loss": -24.62529754638672, "global_step": 308522, "epoch": 3717} {"train_loss": -25.054229736328125, "global_step": 308523, "epoch": 3717} {"train_loss": -25.02786636352539, "global_step": 308524, "epoch": 3717} {"train_loss": -25.287982940673828, "global_step": 308525, "epoch": 3717} {"train_loss": -24.908164978027344, "global_step": 308526, "epoch": 3717} {"train_loss": -25.07455062866211, "global_step": 308527, "epoch": 3717} {"train_loss": -25.101526260375977, "global_step": 308528, "epoch": 3717} {"train_loss": -24.789812088012695, "global_step": 308529, "epoch": 3717} {"train_loss": -25.629011154174805, "global_step": 308530, "epoch": 3717} {"train_loss": -25.309982299804688, "global_step": 308531, "epoch": 3717} {"train_loss": -25.3453426361084, "global_step": 308532, "epoch": 3717} {"train_loss": -25.34372901916504, "global_step": 308533, "epoch": 3717} {"train_loss": -25.33308982849121, "global_step": 308534, "epoch": 3717} {"train_loss": -25.346969604492188, "global_step": 308535, "epoch": 3717} {"train_loss": -25.24523162841797, "global_step": 308536, "epoch": 3717} {"train_loss": -25.602664947509766, "global_step": 308537, "epoch": 3717} {"train_loss": -25.41036605834961, "global_step": 308538, "epoch": 3717} {"train_loss": -25.1888484954834, "global_step": 308539, "epoch": 3717} {"train_loss": -25.50238609313965, "global_step": 308540, "epoch": 3717} {"train_loss": -25.51239013671875, "global_step": 308541, "epoch": 3717} {"train_loss": -25.19742202758789, "global_step": 308542, "epoch": 3717} {"train_loss": -25.51092529296875, "global_step": 308543, "epoch": 3717} {"train_loss": -25.375553131103516, "global_step": 308544, "epoch": 3717} {"train_loss": -25.391929626464844, "global_step": 308545, "epoch": 3717} {"train_loss": -25.83441734313965, "global_step": 308546, "epoch": 3717} {"train_loss": -25.684728622436523, "global_step": 308547, "epoch": 3717} {"train_loss": -25.39560317993164, "global_step": 308548, "epoch": 3717} {"train_loss": -25.410110473632812, "global_step": 308549, "epoch": 3717} {"train_loss": -25.570158004760742, "global_step": 308550, "epoch": 3717} {"train_loss": -25.39246940612793, "global_step": 308551, "epoch": 3717} {"train_loss": -25.685632705688477, "global_step": 308552, "epoch": 3717} {"train_loss": -25.735294342041016, "global_step": 308553, "epoch": 3717} {"train_loss": -25.78375244140625, "global_step": 308554, "epoch": 3717} {"train_loss": -25.406753540039062, "global_step": 308555, "epoch": 3717} {"train_loss": -25.47873306274414, "global_step": 308556, "epoch": 3717} {"train_loss": -25.89023208618164, "global_step": 308557, "epoch": 3717} {"train_loss": -25.63754653930664, "global_step": 308558, "epoch": 3717} {"train_loss": -25.877887725830078, "global_step": 308559, "epoch": 3717} {"train_loss": -25.879240036010742, "global_step": 308560, "epoch": 3717} {"train_loss": -25.616168975830078, "global_step": 308561, "epoch": 3717} {"train_loss": -25.692840576171875, "global_step": 308562, "epoch": 3717} {"train_loss": -25.868024826049805, "global_step": 308563, "epoch": 3717} {"train_loss": -25.734418869018555, "global_step": 308564, "epoch": 3717} {"train_loss": -25.9510555267334, "global_step": 308565, "epoch": 3717} {"train_loss": -25.760883331298828, "global_step": 308566, "epoch": 3717} {"train_loss": -25.54315185546875, "global_step": 308567, "epoch": 3717} {"train_loss": -25.879852294921875, "global_step": 308568, "epoch": 3717} {"train_loss": -25.802892684936523, "global_step": 308569, "epoch": 3717} {"train_loss": -26.056604385375977, "global_step": 308570, "epoch": 3717} {"train_loss": -25.897180557250977, "global_step": 308571, "epoch": 3717} {"train_loss": -25.855566024780273, "global_step": 308572, "epoch": 3717} {"train_loss": -25.771869659423828, "global_step": 308573, "epoch": 3717} {"train_loss": -25.741125106811523, "global_step": 308574, "epoch": 3717} {"train_loss": -26.292627334594727, "global_step": 308575, "epoch": 3717} {"train_loss": -25.937963485717773, "global_step": 308576, "epoch": 3717} {"train_loss": -25.704980850219727, "global_step": 308577, "epoch": 3717} {"train_loss": -25.864835739135742, "global_step": 308578, "epoch": 3717} {"train_loss": -25.814306259155273, "global_step": 308579, "epoch": 3717} {"train_loss": -26.095752716064453, "global_step": 308580, "epoch": 3717} {"train_loss": -25.918811798095703, "global_step": 308581, "epoch": 3717} {"train_loss": -25.864093780517578, "global_step": 308582, "epoch": 3717} {"train_loss": -25.797870635986328, "global_step": 308583, "epoch": 3717} {"train_loss": -26.027963638305664, "global_step": 308584, "epoch": 3717} {"train_loss": -25.887792587280273, "global_step": 308585, "epoch": 3717} {"train_loss": -26.058324813842773, "global_step": 308586, "epoch": 3717} {"train_loss": -26.01901626586914, "global_step": 308587, "epoch": 3717} {"train_loss": -25.94487953186035, "global_step": 308588, "epoch": 3717} {"train_loss": -25.54806137084961, "global_step": 308589, "epoch": 3717} {"train_loss": -25.870447158813477, "global_step": 308590, "epoch": 3717} {"train_loss": -25.71112060546875, "global_step": 308591, "epoch": 3717} {"train_loss": -26.014856338500977, "global_step": 308592, "epoch": 3717} {"train_loss": -25.515637478196478, "global_step": 308593, "epoch": 3717, "val_loss": 7228012.0} {"train_loss": -25.412734985351562, "global_step": 308594, "epoch": 3718} {"train_loss": -25.468393325805664, "global_step": 308595, "epoch": 3718} {"train_loss": -25.383695602416992, "global_step": 308596, "epoch": 3718} {"train_loss": -26.0280818939209, "global_step": 308597, "epoch": 3718} {"train_loss": -25.381654739379883, "global_step": 308598, "epoch": 3718} {"train_loss": -25.681665420532227, "global_step": 308599, "epoch": 3718} {"train_loss": -25.851285934448242, "global_step": 308600, "epoch": 3718} {"train_loss": -25.21455955505371, "global_step": 308601, "epoch": 3718} {"train_loss": -25.6141300201416, "global_step": 308602, "epoch": 3718} {"train_loss": -25.6455020904541, "global_step": 308603, "epoch": 3718} {"train_loss": -25.57320213317871, "global_step": 308604, "epoch": 3718} {"train_loss": -25.33113670349121, "global_step": 308605, "epoch": 3718} {"train_loss": -25.620466232299805, "global_step": 308606, "epoch": 3718} {"train_loss": -25.302566528320312, "global_step": 308607, "epoch": 3718} {"train_loss": -25.7059383392334, "global_step": 308608, "epoch": 3718} {"train_loss": -25.726470947265625, "global_step": 308609, "epoch": 3718} {"train_loss": -25.51783561706543, "global_step": 308610, "epoch": 3718} {"train_loss": -25.85635757446289, "global_step": 308611, "epoch": 3718} {"train_loss": -25.45838737487793, "global_step": 308612, "epoch": 3718} {"train_loss": -25.637500762939453, "global_step": 308613, "epoch": 3718} {"train_loss": -25.7796688079834, "global_step": 308614, "epoch": 3718} {"train_loss": -25.58854103088379, "global_step": 308615, "epoch": 3718} {"train_loss": -25.468875885009766, "global_step": 308616, "epoch": 3718} {"train_loss": -25.808618545532227, "global_step": 308617, "epoch": 3718} {"train_loss": -25.868671417236328, "global_step": 308618, "epoch": 3718} {"train_loss": -25.66050148010254, "global_step": 308619, "epoch": 3718} {"train_loss": -25.205942153930664, "global_step": 308620, "epoch": 3718} {"train_loss": -25.730712890625, "global_step": 308621, "epoch": 3718} {"train_loss": -25.702560424804688, "global_step": 308622, "epoch": 3718} {"train_loss": -26.006261825561523, "global_step": 308623, "epoch": 3718} {"train_loss": -25.926132202148438, "global_step": 308624, "epoch": 3718} {"train_loss": -25.573627471923828, "global_step": 308625, "epoch": 3718} {"train_loss": -25.9747314453125, "global_step": 308626, "epoch": 3718} {"train_loss": -25.855030059814453, "global_step": 308627, "epoch": 3718} {"train_loss": -25.942935943603516, "global_step": 308628, "epoch": 3718} {"train_loss": -25.54144859313965, "global_step": 308629, "epoch": 3718} {"train_loss": -26.367353439331055, "global_step": 308630, "epoch": 3718} {"train_loss": -25.738723754882812, "global_step": 308631, "epoch": 3718} {"train_loss": -25.21808433532715, "global_step": 308632, "epoch": 3718} {"train_loss": -25.25795555114746, "global_step": 308633, "epoch": 3718} {"train_loss": -25.674713134765625, "global_step": 308634, "epoch": 3718} {"train_loss": -26.04300308227539, "global_step": 308635, "epoch": 3718} {"train_loss": -26.058195114135742, "global_step": 308636, "epoch": 3718} {"train_loss": -25.540611267089844, "global_step": 308637, "epoch": 3718} {"train_loss": -25.70442771911621, "global_step": 308638, "epoch": 3718} {"train_loss": -25.996938705444336, "global_step": 308639, "epoch": 3718} {"train_loss": -26.04011344909668, "global_step": 308640, "epoch": 3718} {"train_loss": -25.989337921142578, "global_step": 308641, "epoch": 3718} {"train_loss": -25.569538116455078, "global_step": 308642, "epoch": 3718} {"train_loss": -25.49195671081543, "global_step": 308643, "epoch": 3718} {"train_loss": -25.46872329711914, "global_step": 308644, "epoch": 3718} {"train_loss": -25.931812286376953, "global_step": 308645, "epoch": 3718} {"train_loss": -25.8531494140625, "global_step": 308646, "epoch": 3718} {"train_loss": -25.937625885009766, "global_step": 308647, "epoch": 3718} {"train_loss": -25.53382110595703, "global_step": 308648, "epoch": 3718} {"train_loss": -25.875268936157227, "global_step": 308649, "epoch": 3718} {"train_loss": -26.080291748046875, "global_step": 308650, "epoch": 3718} {"train_loss": -26.05301856994629, "global_step": 308651, "epoch": 3718} {"train_loss": -25.81587028503418, "global_step": 308652, "epoch": 3718} {"train_loss": -25.444665908813477, "global_step": 308653, "epoch": 3718} {"train_loss": -25.78876304626465, "global_step": 308654, "epoch": 3718} {"train_loss": -25.970081329345703, "global_step": 308655, "epoch": 3718} {"train_loss": -25.97279167175293, "global_step": 308656, "epoch": 3718} {"train_loss": -25.939783096313477, "global_step": 308657, "epoch": 3718} {"train_loss": -26.127485275268555, "global_step": 308658, "epoch": 3718} {"train_loss": -25.509296417236328, "global_step": 308659, "epoch": 3718} {"train_loss": -25.67576026916504, "global_step": 308660, "epoch": 3718} {"train_loss": -25.550649642944336, "global_step": 308661, "epoch": 3718} {"train_loss": -25.6544189453125, "global_step": 308662, "epoch": 3718} {"train_loss": -26.282440185546875, "global_step": 308663, "epoch": 3718} {"train_loss": -25.753738403320312, "global_step": 308664, "epoch": 3718} {"train_loss": -25.70374870300293, "global_step": 308665, "epoch": 3718} {"train_loss": -25.62871742248535, "global_step": 308666, "epoch": 3718} {"train_loss": -25.171939849853516, "global_step": 308667, "epoch": 3718} {"train_loss": -25.051822662353516, "global_step": 308668, "epoch": 3718} {"train_loss": -25.380516052246094, "global_step": 308669, "epoch": 3718} {"train_loss": -25.478662490844727, "global_step": 308670, "epoch": 3718} {"train_loss": -25.355085372924805, "global_step": 308671, "epoch": 3718} {"train_loss": -25.65424156188965, "global_step": 308672, "epoch": 3718} {"train_loss": -25.497413635253906, "global_step": 308673, "epoch": 3718} {"train_loss": -25.96868896484375, "global_step": 308674, "epoch": 3718} {"train_loss": -25.596832275390625, "global_step": 308675, "epoch": 3718} {"train_loss": -25.680456919842456, "global_step": 308676, "epoch": 3718, "val_loss": 7251102.0} {"train_loss": -24.436473846435547, "global_step": 308677, "epoch": 3719} {"train_loss": -25.00007438659668, "global_step": 308678, "epoch": 3719} {"train_loss": -25.02115249633789, "global_step": 308679, "epoch": 3719} {"train_loss": -25.169313430786133, "global_step": 308680, "epoch": 3719} {"train_loss": -25.001632690429688, "global_step": 308681, "epoch": 3719} {"train_loss": -25.379362106323242, "global_step": 308682, "epoch": 3719} {"train_loss": -24.743993759155273, "global_step": 308683, "epoch": 3719} {"train_loss": -25.638671875, "global_step": 308684, "epoch": 3719} {"train_loss": -25.366256713867188, "global_step": 308685, "epoch": 3719} {"train_loss": -25.35872459411621, "global_step": 308686, "epoch": 3719} {"train_loss": -25.44345474243164, "global_step": 308687, "epoch": 3719} {"train_loss": -25.115076065063477, "global_step": 308688, "epoch": 3719} {"train_loss": -25.627689361572266, "global_step": 308689, "epoch": 3719} {"train_loss": -25.519441604614258, "global_step": 308690, "epoch": 3719} {"train_loss": -25.451194763183594, "global_step": 308691, "epoch": 3719} {"train_loss": -25.7205753326416, "global_step": 308692, "epoch": 3719} {"train_loss": -25.356830596923828, "global_step": 308693, "epoch": 3719} {"train_loss": -25.49911117553711, "global_step": 308694, "epoch": 3719} {"train_loss": -26.185022354125977, "global_step": 308695, "epoch": 3719} {"train_loss": -25.50214195251465, "global_step": 308696, "epoch": 3719} {"train_loss": -25.806564331054688, "global_step": 308697, "epoch": 3719} {"train_loss": -25.710636138916016, "global_step": 308698, "epoch": 3719} {"train_loss": -25.407548904418945, "global_step": 308699, "epoch": 3719} {"train_loss": -25.539175033569336, "global_step": 308700, "epoch": 3719} {"train_loss": -25.770750045776367, "global_step": 308701, "epoch": 3719} {"train_loss": -25.70112419128418, "global_step": 308702, "epoch": 3719} {"train_loss": -25.946735382080078, "global_step": 308703, "epoch": 3719} {"train_loss": -25.458057403564453, "global_step": 308704, "epoch": 3719} {"train_loss": -25.448074340820312, "global_step": 308705, "epoch": 3719} {"train_loss": -25.669647216796875, "global_step": 308706, "epoch": 3719} {"train_loss": -25.58313751220703, "global_step": 308707, "epoch": 3719} {"train_loss": -25.14112663269043, "global_step": 308708, "epoch": 3719} {"train_loss": -25.917844772338867, "global_step": 308709, "epoch": 3719} {"train_loss": -25.906097412109375, "global_step": 308710, "epoch": 3719} {"train_loss": -25.768863677978516, "global_step": 308711, "epoch": 3719} {"train_loss": -25.9014949798584, "global_step": 308712, "epoch": 3719} {"train_loss": -25.526081085205078, "global_step": 308713, "epoch": 3719} {"train_loss": -25.719650268554688, "global_step": 308714, "epoch": 3719} {"train_loss": -25.7689266204834, "global_step": 308715, "epoch": 3719} {"train_loss": -25.80866813659668, "global_step": 308716, "epoch": 3719} {"train_loss": -26.073795318603516, "global_step": 308717, "epoch": 3719} {"train_loss": -25.85553550720215, "global_step": 308718, "epoch": 3719} {"train_loss": -25.74639892578125, "global_step": 308719, "epoch": 3719} {"train_loss": -25.947492599487305, "global_step": 308720, "epoch": 3719} {"train_loss": -25.865365982055664, "global_step": 308721, "epoch": 3719} {"train_loss": -26.25067138671875, "global_step": 308722, "epoch": 3719} {"train_loss": -25.931045532226562, "global_step": 308723, "epoch": 3719} {"train_loss": -25.6524715423584, "global_step": 308724, "epoch": 3719} {"train_loss": -25.792016983032227, "global_step": 308725, "epoch": 3719} {"train_loss": -25.71723747253418, "global_step": 308726, "epoch": 3719} {"train_loss": -25.585676193237305, "global_step": 308727, "epoch": 3719} {"train_loss": -25.5513973236084, "global_step": 308728, "epoch": 3719} {"train_loss": -25.81743812561035, "global_step": 308729, "epoch": 3719} {"train_loss": -25.96502685546875, "global_step": 308730, "epoch": 3719} {"train_loss": -25.791229248046875, "global_step": 308731, "epoch": 3719} {"train_loss": -25.497299194335938, "global_step": 308732, "epoch": 3719} {"train_loss": -25.551389694213867, "global_step": 308733, "epoch": 3719} {"train_loss": -25.29103660583496, "global_step": 308734, "epoch": 3719} {"train_loss": -25.63128662109375, "global_step": 308735, "epoch": 3719} {"train_loss": -25.92140007019043, "global_step": 308736, "epoch": 3719} {"train_loss": -25.8759765625, "global_step": 308737, "epoch": 3719} {"train_loss": -25.10040855407715, "global_step": 308738, "epoch": 3719} {"train_loss": -25.6914119720459, "global_step": 308739, "epoch": 3719} {"train_loss": -25.382888793945312, "global_step": 308740, "epoch": 3719} {"train_loss": -25.664535522460938, "global_step": 308741, "epoch": 3719} {"train_loss": -25.410675048828125, "global_step": 308742, "epoch": 3719} {"train_loss": -25.47496223449707, "global_step": 308743, "epoch": 3719} {"train_loss": -25.51252555847168, "global_step": 308744, "epoch": 3719} {"train_loss": -25.673322677612305, "global_step": 308745, "epoch": 3719} {"train_loss": -25.358169555664062, "global_step": 308746, "epoch": 3719} {"train_loss": -25.391559600830078, "global_step": 308747, "epoch": 3719} {"train_loss": -25.422502517700195, "global_step": 308748, "epoch": 3719} {"train_loss": -25.32049560546875, "global_step": 308749, "epoch": 3719} {"train_loss": -25.453184127807617, "global_step": 308750, "epoch": 3719} {"train_loss": -25.60491371154785, "global_step": 308751, "epoch": 3719} {"train_loss": -25.646915435791016, "global_step": 308752, "epoch": 3719} {"train_loss": -25.87765884399414, "global_step": 308753, "epoch": 3719} {"train_loss": -25.650053024291992, "global_step": 308754, "epoch": 3719} {"train_loss": -25.60797119140625, "global_step": 308755, "epoch": 3719} {"train_loss": -25.75809669494629, "global_step": 308756, "epoch": 3719} {"train_loss": -25.807010650634766, "global_step": 308757, "epoch": 3719} {"train_loss": -25.74658203125, "global_step": 308758, "epoch": 3719} {"train_loss": -25.606233803622693, "global_step": 308759, "epoch": 3719, "val_loss": 7160397.0} {"train_loss": -25.536909103393555, "global_step": 308760, "epoch": 3720} {"train_loss": -25.633426666259766, "global_step": 308761, "epoch": 3720} {"train_loss": -25.40327262878418, "global_step": 308762, "epoch": 3720} {"train_loss": -25.219074249267578, "global_step": 308763, "epoch": 3720} {"train_loss": -25.6759090423584, "global_step": 308764, "epoch": 3720} {"train_loss": -25.32862091064453, "global_step": 308765, "epoch": 3720} {"train_loss": -25.58901023864746, "global_step": 308766, "epoch": 3720} {"train_loss": -25.54803466796875, "global_step": 308767, "epoch": 3720} {"train_loss": -25.519323348999023, "global_step": 308768, "epoch": 3720} {"train_loss": -25.291004180908203, "global_step": 308769, "epoch": 3720} {"train_loss": -25.745258331298828, "global_step": 308770, "epoch": 3720} {"train_loss": -25.734272003173828, "global_step": 308771, "epoch": 3720} {"train_loss": -25.702402114868164, "global_step": 308772, "epoch": 3720} {"train_loss": -25.482404708862305, "global_step": 308773, "epoch": 3720} {"train_loss": -25.411090850830078, "global_step": 308774, "epoch": 3720} {"train_loss": -25.82488441467285, "global_step": 308775, "epoch": 3720} {"train_loss": -25.96524429321289, "global_step": 308776, "epoch": 3720} {"train_loss": -25.88376808166504, "global_step": 308777, "epoch": 3720} {"train_loss": -25.657058715820312, "global_step": 308778, "epoch": 3720} {"train_loss": -25.9890079498291, "global_step": 308779, "epoch": 3720} {"train_loss": -25.793073654174805, "global_step": 308780, "epoch": 3720} {"train_loss": -25.954120635986328, "global_step": 308781, "epoch": 3720} {"train_loss": -25.682851791381836, "global_step": 308782, "epoch": 3720} {"train_loss": -25.981664657592773, "global_step": 308783, "epoch": 3720} {"train_loss": -25.845020294189453, "global_step": 308784, "epoch": 3720} {"train_loss": -26.085538864135742, "global_step": 308785, "epoch": 3720} {"train_loss": -25.857999801635742, "global_step": 308786, "epoch": 3720} {"train_loss": -25.7507381439209, "global_step": 308787, "epoch": 3720} {"train_loss": -25.66474723815918, "global_step": 308788, "epoch": 3720} {"train_loss": -25.859943389892578, "global_step": 308789, "epoch": 3720} {"train_loss": -26.179401397705078, "global_step": 308790, "epoch": 3720} {"train_loss": -25.703048706054688, "global_step": 308791, "epoch": 3720} {"train_loss": -25.531084060668945, "global_step": 308792, "epoch": 3720} {"train_loss": -25.710418701171875, "global_step": 308793, "epoch": 3720} {"train_loss": -25.7729549407959, "global_step": 308794, "epoch": 3720} {"train_loss": -25.941822052001953, "global_step": 308795, "epoch": 3720} {"train_loss": -25.6422176361084, "global_step": 308796, "epoch": 3720} {"train_loss": -25.564697265625, "global_step": 308797, "epoch": 3720} {"train_loss": -26.010950088500977, "global_step": 308798, "epoch": 3720} {"train_loss": -26.064977645874023, "global_step": 308799, "epoch": 3720} {"train_loss": -25.44940757751465, "global_step": 308800, "epoch": 3720} {"train_loss": -25.283599853515625, "global_step": 308801, "epoch": 3720} {"train_loss": -25.23160171508789, "global_step": 308802, "epoch": 3720} {"train_loss": -25.749038696289062, "global_step": 308803, "epoch": 3720} {"train_loss": -25.415904998779297, "global_step": 308804, "epoch": 3720} {"train_loss": -25.53325843811035, "global_step": 308805, "epoch": 3720} {"train_loss": -25.5275936126709, "global_step": 308806, "epoch": 3720} {"train_loss": -25.590641021728516, "global_step": 308807, "epoch": 3720} {"train_loss": -25.594480514526367, "global_step": 308808, "epoch": 3720} {"train_loss": -25.804189682006836, "global_step": 308809, "epoch": 3720} {"train_loss": -25.604095458984375, "global_step": 308810, "epoch": 3720} {"train_loss": -25.985998153686523, "global_step": 308811, "epoch": 3720} {"train_loss": -25.948169708251953, "global_step": 308812, "epoch": 3720} {"train_loss": -26.077285766601562, "global_step": 308813, "epoch": 3720} {"train_loss": -25.530187606811523, "global_step": 308814, "epoch": 3720} {"train_loss": -26.0379638671875, "global_step": 308815, "epoch": 3720} {"train_loss": -25.977375030517578, "global_step": 308816, "epoch": 3720} {"train_loss": -25.840559005737305, "global_step": 308817, "epoch": 3720} {"train_loss": -26.20582389831543, "global_step": 308818, "epoch": 3720} {"train_loss": -25.718753814697266, "global_step": 308819, "epoch": 3720} {"train_loss": -25.928022384643555, "global_step": 308820, "epoch": 3720} {"train_loss": -25.7154598236084, "global_step": 308821, "epoch": 3720} {"train_loss": -25.886823654174805, "global_step": 308822, "epoch": 3720} {"train_loss": -25.72654151916504, "global_step": 308823, "epoch": 3720} {"train_loss": -25.716510772705078, "global_step": 308824, "epoch": 3720} {"train_loss": -25.530851364135742, "global_step": 308825, "epoch": 3720} {"train_loss": -25.585933685302734, "global_step": 308826, "epoch": 3720} {"train_loss": -26.141651153564453, "global_step": 308827, "epoch": 3720} {"train_loss": -26.123807907104492, "global_step": 308828, "epoch": 3720} {"train_loss": -25.821386337280273, "global_step": 308829, "epoch": 3720} {"train_loss": -25.915678024291992, "global_step": 308830, "epoch": 3720} {"train_loss": -25.622854232788086, "global_step": 308831, "epoch": 3720} {"train_loss": -26.157419204711914, "global_step": 308832, "epoch": 3720} {"train_loss": -25.952533721923828, "global_step": 308833, "epoch": 3720} {"train_loss": -25.94757652282715, "global_step": 308834, "epoch": 3720} {"train_loss": -26.084625244140625, "global_step": 308835, "epoch": 3720} {"train_loss": -25.883337020874023, "global_step": 308836, "epoch": 3720} {"train_loss": -25.51785659790039, "global_step": 308837, "epoch": 3720} {"train_loss": -25.214038848876953, "global_step": 308838, "epoch": 3720} {"train_loss": -25.145164489746094, "global_step": 308839, "epoch": 3720} {"train_loss": -25.756010055541992, "global_step": 308840, "epoch": 3720} {"train_loss": -25.512088775634766, "global_step": 308841, "epoch": 3720} {"train_loss": -25.727688502116376, "global_step": 308842, "epoch": 3720, "val_loss": 7421643.5} {"train_loss": -23.008275985717773, "global_step": 308843, "epoch": 3721} {"train_loss": -24.646718978881836, "global_step": 308844, "epoch": 3721} {"train_loss": -23.810415267944336, "global_step": 308845, "epoch": 3721} {"train_loss": -24.541532516479492, "global_step": 308846, "epoch": 3721} {"train_loss": -24.82383155822754, "global_step": 308847, "epoch": 3721} {"train_loss": -24.234085083007812, "global_step": 308848, "epoch": 3721} {"train_loss": -24.86841583251953, "global_step": 308849, "epoch": 3721} {"train_loss": -24.8183650970459, "global_step": 308850, "epoch": 3721} {"train_loss": -25.40582847595215, "global_step": 308851, "epoch": 3721} {"train_loss": -24.673320770263672, "global_step": 308852, "epoch": 3721} {"train_loss": -25.21169090270996, "global_step": 308853, "epoch": 3721} {"train_loss": -24.5677547454834, "global_step": 308854, "epoch": 3721} {"train_loss": -24.863662719726562, "global_step": 308855, "epoch": 3721} {"train_loss": -25.13118553161621, "global_step": 308856, "epoch": 3721} {"train_loss": -25.13727378845215, "global_step": 308857, "epoch": 3721} {"train_loss": -25.52158546447754, "global_step": 308858, "epoch": 3721} {"train_loss": -25.4350643157959, "global_step": 308859, "epoch": 3721} {"train_loss": -25.194746017456055, "global_step": 308860, "epoch": 3721} {"train_loss": -24.989242553710938, "global_step": 308861, "epoch": 3721} {"train_loss": -25.336151123046875, "global_step": 308862, "epoch": 3721} {"train_loss": -25.240802764892578, "global_step": 308863, "epoch": 3721} {"train_loss": -25.466703414916992, "global_step": 308864, "epoch": 3721} {"train_loss": -24.73077964782715, "global_step": 308865, "epoch": 3721} {"train_loss": -25.469751358032227, "global_step": 308866, "epoch": 3721} {"train_loss": -25.227420806884766, "global_step": 308867, "epoch": 3721} {"train_loss": -25.33283042907715, "global_step": 308868, "epoch": 3721} {"train_loss": -25.376550674438477, "global_step": 308869, "epoch": 3721} {"train_loss": -25.488306045532227, "global_step": 308870, "epoch": 3721} {"train_loss": -25.278596878051758, "global_step": 308871, "epoch": 3721} {"train_loss": -25.569665908813477, "global_step": 308872, "epoch": 3721} {"train_loss": -25.687122344970703, "global_step": 308873, "epoch": 3721} {"train_loss": -26.080188751220703, "global_step": 308874, "epoch": 3721} {"train_loss": -25.647008895874023, "global_step": 308875, "epoch": 3721} {"train_loss": -25.525388717651367, "global_step": 308876, "epoch": 3721} {"train_loss": -25.45536231994629, "global_step": 308877, "epoch": 3721} {"train_loss": -25.583433151245117, "global_step": 308878, "epoch": 3721} {"train_loss": -25.554492950439453, "global_step": 308879, "epoch": 3721} {"train_loss": -25.615039825439453, "global_step": 308880, "epoch": 3721} {"train_loss": -25.86787223815918, "global_step": 308881, "epoch": 3721} {"train_loss": -25.700580596923828, "global_step": 308882, "epoch": 3721} {"train_loss": -25.86433219909668, "global_step": 308883, "epoch": 3721} {"train_loss": -26.053009033203125, "global_step": 308884, "epoch": 3721} {"train_loss": -26.064624786376953, "global_step": 308885, "epoch": 3721} {"train_loss": -25.68221092224121, "global_step": 308886, "epoch": 3721} {"train_loss": -26.076169967651367, "global_step": 308887, "epoch": 3721} {"train_loss": -25.949384689331055, "global_step": 308888, "epoch": 3721} {"train_loss": -26.37607765197754, "global_step": 308889, "epoch": 3721} {"train_loss": -25.789749145507812, "global_step": 308890, "epoch": 3721} {"train_loss": -25.696125030517578, "global_step": 308891, "epoch": 3721} {"train_loss": -25.950550079345703, "global_step": 308892, "epoch": 3721} {"train_loss": -26.23347282409668, "global_step": 308893, "epoch": 3721} {"train_loss": -26.024551391601562, "global_step": 308894, "epoch": 3721} {"train_loss": -25.785934448242188, "global_step": 308895, "epoch": 3721} {"train_loss": -25.9072208404541, "global_step": 308896, "epoch": 3721} {"train_loss": -26.057584762573242, "global_step": 308897, "epoch": 3721} {"train_loss": -25.7397518157959, "global_step": 308898, "epoch": 3721} {"train_loss": -26.073837280273438, "global_step": 308899, "epoch": 3721} {"train_loss": -25.68109130859375, "global_step": 308900, "epoch": 3721} {"train_loss": -26.09278678894043, "global_step": 308901, "epoch": 3721} {"train_loss": -25.939868927001953, "global_step": 308902, "epoch": 3721} {"train_loss": -26.05994987487793, "global_step": 308903, "epoch": 3721} {"train_loss": -25.559423446655273, "global_step": 308904, "epoch": 3721} {"train_loss": -25.355289459228516, "global_step": 308905, "epoch": 3721} {"train_loss": -25.916107177734375, "global_step": 308906, "epoch": 3721} {"train_loss": -25.454870223999023, "global_step": 308907, "epoch": 3721} {"train_loss": -25.90106773376465, "global_step": 308908, "epoch": 3721} {"train_loss": -25.53394889831543, "global_step": 308909, "epoch": 3721} {"train_loss": -25.758237838745117, "global_step": 308910, "epoch": 3721} {"train_loss": -25.90205192565918, "global_step": 308911, "epoch": 3721} {"train_loss": -25.99969482421875, "global_step": 308912, "epoch": 3721} {"train_loss": -25.5451602935791, "global_step": 308913, "epoch": 3721} {"train_loss": -25.42603874206543, "global_step": 308914, "epoch": 3721} {"train_loss": -26.002471923828125, "global_step": 308915, "epoch": 3721} {"train_loss": -25.5459041595459, "global_step": 308916, "epoch": 3721} {"train_loss": -25.779401779174805, "global_step": 308917, "epoch": 3721} {"train_loss": -25.93344497680664, "global_step": 308918, "epoch": 3721} {"train_loss": -25.556764602661133, "global_step": 308919, "epoch": 3721} {"train_loss": -25.614965438842773, "global_step": 308920, "epoch": 3721} {"train_loss": -25.994464874267578, "global_step": 308921, "epoch": 3721} {"train_loss": -25.87554931640625, "global_step": 308922, "epoch": 3721} {"train_loss": -25.691761016845703, "global_step": 308923, "epoch": 3721} {"train_loss": -26.112751007080078, "global_step": 308924, "epoch": 3721} {"train_loss": -25.513328828007342, "global_step": 308925, "epoch": 3721, "val_loss": 7332399.5} {"train_loss": -25.69754409790039, "global_step": 308926, "epoch": 3722} {"train_loss": -25.43848991394043, "global_step": 308927, "epoch": 3722} {"train_loss": -25.839054107666016, "global_step": 308928, "epoch": 3722} {"train_loss": -25.08669090270996, "global_step": 308929, "epoch": 3722} {"train_loss": -25.37710952758789, "global_step": 308930, "epoch": 3722} {"train_loss": -25.45577621459961, "global_step": 308931, "epoch": 3722} {"train_loss": -25.531301498413086, "global_step": 308932, "epoch": 3722} {"train_loss": -25.397993087768555, "global_step": 308933, "epoch": 3722} {"train_loss": -25.8262996673584, "global_step": 308934, "epoch": 3722} {"train_loss": -25.0967960357666, "global_step": 308935, "epoch": 3722} {"train_loss": -25.607925415039062, "global_step": 308936, "epoch": 3722} {"train_loss": -25.476438522338867, "global_step": 308937, "epoch": 3722} {"train_loss": -25.176176071166992, "global_step": 308938, "epoch": 3722} {"train_loss": -25.876068115234375, "global_step": 308939, "epoch": 3722} {"train_loss": -25.03182029724121, "global_step": 308940, "epoch": 3722} {"train_loss": -25.683643341064453, "global_step": 308941, "epoch": 3722} {"train_loss": -25.460010528564453, "global_step": 308942, "epoch": 3722} {"train_loss": -25.71860122680664, "global_step": 308943, "epoch": 3722} {"train_loss": -25.45023536682129, "global_step": 308944, "epoch": 3722} {"train_loss": -25.570112228393555, "global_step": 308945, "epoch": 3722} {"train_loss": -25.450796127319336, "global_step": 308946, "epoch": 3722} {"train_loss": -25.953344345092773, "global_step": 308947, "epoch": 3722} {"train_loss": -25.79755973815918, "global_step": 308948, "epoch": 3722} {"train_loss": -25.546554565429688, "global_step": 308949, "epoch": 3722} {"train_loss": -25.958932876586914, "global_step": 308950, "epoch": 3722} {"train_loss": -25.83865737915039, "global_step": 308951, "epoch": 3722} {"train_loss": -25.76718521118164, "global_step": 308952, "epoch": 3722} {"train_loss": -25.7393741607666, "global_step": 308953, "epoch": 3722} {"train_loss": -25.564929962158203, "global_step": 308954, "epoch": 3722} {"train_loss": -25.6658992767334, "global_step": 308955, "epoch": 3722} {"train_loss": -25.95859718322754, "global_step": 308956, "epoch": 3722} {"train_loss": -25.484058380126953, "global_step": 308957, "epoch": 3722} {"train_loss": -25.534513473510742, "global_step": 308958, "epoch": 3722} {"train_loss": -25.505033493041992, "global_step": 308959, "epoch": 3722} {"train_loss": -25.536209106445312, "global_step": 308960, "epoch": 3722} {"train_loss": -25.9912052154541, "global_step": 308961, "epoch": 3722} {"train_loss": -25.579191207885742, "global_step": 308962, "epoch": 3722} {"train_loss": -25.818262100219727, "global_step": 308963, "epoch": 3722} {"train_loss": -26.051258087158203, "global_step": 308964, "epoch": 3722} {"train_loss": -25.500913619995117, "global_step": 308965, "epoch": 3722} {"train_loss": -25.54792594909668, "global_step": 308966, "epoch": 3722} {"train_loss": -25.408823013305664, "global_step": 308967, "epoch": 3722} {"train_loss": -25.52132225036621, "global_step": 308968, "epoch": 3722} {"train_loss": -25.50179100036621, "global_step": 308969, "epoch": 3722} {"train_loss": -25.491382598876953, "global_step": 308970, "epoch": 3722} {"train_loss": -26.049299240112305, "global_step": 308971, "epoch": 3722} {"train_loss": -25.938495635986328, "global_step": 308972, "epoch": 3722} {"train_loss": -25.586008071899414, "global_step": 308973, "epoch": 3722} {"train_loss": -25.583791732788086, "global_step": 308974, "epoch": 3722} {"train_loss": -25.283571243286133, "global_step": 308975, "epoch": 3722} {"train_loss": -25.204954147338867, "global_step": 308976, "epoch": 3722} {"train_loss": -25.49752426147461, "global_step": 308977, "epoch": 3722} {"train_loss": -26.141876220703125, "global_step": 308978, "epoch": 3722} {"train_loss": -25.658008575439453, "global_step": 308979, "epoch": 3722} {"train_loss": -25.785200119018555, "global_step": 308980, "epoch": 3722} {"train_loss": -25.998254776000977, "global_step": 308981, "epoch": 3722} {"train_loss": -25.865354537963867, "global_step": 308982, "epoch": 3722} {"train_loss": -25.8492431640625, "global_step": 308983, "epoch": 3722} {"train_loss": -25.691572189331055, "global_step": 308984, "epoch": 3722} {"train_loss": -25.651350021362305, "global_step": 308985, "epoch": 3722} {"train_loss": -25.46097183227539, "global_step": 308986, "epoch": 3722} {"train_loss": -25.48935317993164, "global_step": 308987, "epoch": 3722} {"train_loss": -25.93875503540039, "global_step": 308988, "epoch": 3722} {"train_loss": -25.85004234313965, "global_step": 308989, "epoch": 3722} {"train_loss": -25.502628326416016, "global_step": 308990, "epoch": 3722} {"train_loss": -25.728031158447266, "global_step": 308991, "epoch": 3722} {"train_loss": -25.918439865112305, "global_step": 308992, "epoch": 3722} {"train_loss": -26.052438735961914, "global_step": 308993, "epoch": 3722} {"train_loss": -25.37026596069336, "global_step": 308994, "epoch": 3722} {"train_loss": -25.411575317382812, "global_step": 308995, "epoch": 3722} {"train_loss": -25.554311752319336, "global_step": 308996, "epoch": 3722} {"train_loss": -25.617956161499023, "global_step": 308997, "epoch": 3722} {"train_loss": -25.886762619018555, "global_step": 308998, "epoch": 3722} {"train_loss": -25.654022216796875, "global_step": 308999, "epoch": 3722} {"train_loss": -25.899789810180664, "global_step": 309000, "epoch": 3722} {"train_loss": -25.641937255859375, "global_step": 309001, "epoch": 3722} {"train_loss": -26.137165069580078, "global_step": 309002, "epoch": 3722} {"train_loss": -25.837499618530273, "global_step": 309003, "epoch": 3722} {"train_loss": -25.945127487182617, "global_step": 309004, "epoch": 3722} {"train_loss": -25.402095794677734, "global_step": 309005, "epoch": 3722} {"train_loss": -25.782520294189453, "global_step": 309006, "epoch": 3722} {"train_loss": -25.61152458190918, "global_step": 309007, "epoch": 3722} {"train_loss": -25.63964000380183, "global_step": 309008, "epoch": 3722, "val_loss": 7239754.0} {"train_loss": -25.121906280517578, "global_step": 309009, "epoch": 3723} {"train_loss": -24.936328887939453, "global_step": 309010, "epoch": 3723} {"train_loss": -25.503080368041992, "global_step": 309011, "epoch": 3723} {"train_loss": -24.8592529296875, "global_step": 309012, "epoch": 3723} {"train_loss": -25.41933250427246, "global_step": 309013, "epoch": 3723} {"train_loss": -24.881423950195312, "global_step": 309014, "epoch": 3723} {"train_loss": -25.304462432861328, "global_step": 309015, "epoch": 3723} {"train_loss": -25.098386764526367, "global_step": 309016, "epoch": 3723} {"train_loss": -25.308719635009766, "global_step": 309017, "epoch": 3723} {"train_loss": -25.427845001220703, "global_step": 309018, "epoch": 3723} {"train_loss": -25.493703842163086, "global_step": 309019, "epoch": 3723} {"train_loss": -25.16046714782715, "global_step": 309020, "epoch": 3723} {"train_loss": -25.800092697143555, "global_step": 309021, "epoch": 3723} {"train_loss": -25.23676109313965, "global_step": 309022, "epoch": 3723} {"train_loss": -25.551206588745117, "global_step": 309023, "epoch": 3723} {"train_loss": -25.628881454467773, "global_step": 309024, "epoch": 3723} {"train_loss": -25.270736694335938, "global_step": 309025, "epoch": 3723} {"train_loss": -25.093799591064453, "global_step": 309026, "epoch": 3723} {"train_loss": -25.77039909362793, "global_step": 309027, "epoch": 3723} {"train_loss": -25.60016441345215, "global_step": 309028, "epoch": 3723} {"train_loss": -25.505970001220703, "global_step": 309029, "epoch": 3723} {"train_loss": -25.319623947143555, "global_step": 309030, "epoch": 3723} {"train_loss": -25.738662719726562, "global_step": 309031, "epoch": 3723} {"train_loss": -26.010873794555664, "global_step": 309032, "epoch": 3723} {"train_loss": -25.175535202026367, "global_step": 309033, "epoch": 3723} {"train_loss": -25.675466537475586, "global_step": 309034, "epoch": 3723} {"train_loss": -25.433279037475586, "global_step": 309035, "epoch": 3723} {"train_loss": -25.350778579711914, "global_step": 309036, "epoch": 3723} {"train_loss": -26.304279327392578, "global_step": 309037, "epoch": 3723} {"train_loss": -25.499469757080078, "global_step": 309038, "epoch": 3723} {"train_loss": -25.931615829467773, "global_step": 309039, "epoch": 3723} {"train_loss": -25.644546508789062, "global_step": 309040, "epoch": 3723} {"train_loss": -25.923995971679688, "global_step": 309041, "epoch": 3723} {"train_loss": -25.714941024780273, "global_step": 309042, "epoch": 3723} {"train_loss": -25.660261154174805, "global_step": 309043, "epoch": 3723} {"train_loss": -25.91164207458496, "global_step": 309044, "epoch": 3723} {"train_loss": -25.94623374938965, "global_step": 309045, "epoch": 3723} {"train_loss": -25.785293579101562, "global_step": 309046, "epoch": 3723} {"train_loss": -25.843841552734375, "global_step": 309047, "epoch": 3723} {"train_loss": -25.861541748046875, "global_step": 309048, "epoch": 3723} {"train_loss": -25.701501846313477, "global_step": 309049, "epoch": 3723} {"train_loss": -25.93596839904785, "global_step": 309050, "epoch": 3723} {"train_loss": -25.85053062438965, "global_step": 309051, "epoch": 3723} {"train_loss": -25.98465347290039, "global_step": 309052, "epoch": 3723} {"train_loss": -25.901044845581055, "global_step": 309053, "epoch": 3723} {"train_loss": -26.136962890625, "global_step": 309054, "epoch": 3723} {"train_loss": -25.778242111206055, "global_step": 309055, "epoch": 3723} {"train_loss": -26.049482345581055, "global_step": 309056, "epoch": 3723} {"train_loss": -25.97456932067871, "global_step": 309057, "epoch": 3723} {"train_loss": -25.770557403564453, "global_step": 309058, "epoch": 3723} {"train_loss": -25.118144989013672, "global_step": 309059, "epoch": 3723} {"train_loss": -25.39515495300293, "global_step": 309060, "epoch": 3723} {"train_loss": -25.67024040222168, "global_step": 309061, "epoch": 3723} {"train_loss": -25.469099044799805, "global_step": 309062, "epoch": 3723} {"train_loss": -25.930124282836914, "global_step": 309063, "epoch": 3723} {"train_loss": -26.196765899658203, "global_step": 309064, "epoch": 3723} {"train_loss": -25.466161727905273, "global_step": 309065, "epoch": 3723} {"train_loss": -25.884002685546875, "global_step": 309066, "epoch": 3723} {"train_loss": -25.56100845336914, "global_step": 309067, "epoch": 3723} {"train_loss": -25.84266471862793, "global_step": 309068, "epoch": 3723} {"train_loss": -25.657800674438477, "global_step": 309069, "epoch": 3723} {"train_loss": -25.650928497314453, "global_step": 309070, "epoch": 3723} {"train_loss": -25.86834144592285, "global_step": 309071, "epoch": 3723} {"train_loss": -25.512372970581055, "global_step": 309072, "epoch": 3723} {"train_loss": -26.095840454101562, "global_step": 309073, "epoch": 3723} {"train_loss": -25.705087661743164, "global_step": 309074, "epoch": 3723} {"train_loss": -25.707534790039062, "global_step": 309075, "epoch": 3723} {"train_loss": -25.53569221496582, "global_step": 309076, "epoch": 3723} {"train_loss": -25.540042877197266, "global_step": 309077, "epoch": 3723} {"train_loss": -25.814130783081055, "global_step": 309078, "epoch": 3723} {"train_loss": -26.007261276245117, "global_step": 309079, "epoch": 3723} {"train_loss": -25.906110763549805, "global_step": 309080, "epoch": 3723} {"train_loss": -26.20869255065918, "global_step": 309081, "epoch": 3723} {"train_loss": -25.981830596923828, "global_step": 309082, "epoch": 3723} {"train_loss": -26.158557891845703, "global_step": 309083, "epoch": 3723} {"train_loss": -26.029239654541016, "global_step": 309084, "epoch": 3723} {"train_loss": -25.580169677734375, "global_step": 309085, "epoch": 3723} {"train_loss": -26.171234130859375, "global_step": 309086, "epoch": 3723} {"train_loss": -26.0805721282959, "global_step": 309087, "epoch": 3723} {"train_loss": -26.072004318237305, "global_step": 309088, "epoch": 3723} {"train_loss": -25.415048599243164, "global_step": 309089, "epoch": 3723} {"train_loss": -26.098356246948242, "global_step": 309090, "epoch": 3723} {"train_loss": -25.680310812341162, "global_step": 309091, "epoch": 3723, "val_loss": 7272750.0} {"train_loss": -25.380277633666992, "global_step": 309092, "epoch": 3724} {"train_loss": -24.34280776977539, "global_step": 309093, "epoch": 3724} {"train_loss": -25.29006004333496, "global_step": 309094, "epoch": 3724} {"train_loss": -25.23613929748535, "global_step": 309095, "epoch": 3724} {"train_loss": -25.23979949951172, "global_step": 309096, "epoch": 3724} {"train_loss": -25.091711044311523, "global_step": 309097, "epoch": 3724} {"train_loss": -25.305105209350586, "global_step": 309098, "epoch": 3724} {"train_loss": -25.596609115600586, "global_step": 309099, "epoch": 3724} {"train_loss": -25.548349380493164, "global_step": 309100, "epoch": 3724} {"train_loss": -24.895612716674805, "global_step": 309101, "epoch": 3724} {"train_loss": -25.389150619506836, "global_step": 309102, "epoch": 3724} {"train_loss": -25.583072662353516, "global_step": 309103, "epoch": 3724} {"train_loss": -25.57769775390625, "global_step": 309104, "epoch": 3724} {"train_loss": -25.101484298706055, "global_step": 309105, "epoch": 3724} {"train_loss": -25.478731155395508, "global_step": 309106, "epoch": 3724} {"train_loss": -24.76230239868164, "global_step": 309107, "epoch": 3724} {"train_loss": -25.213274002075195, "global_step": 309108, "epoch": 3724} {"train_loss": -25.7047061920166, "global_step": 309109, "epoch": 3724} {"train_loss": -25.156248092651367, "global_step": 309110, "epoch": 3724} {"train_loss": -25.56588363647461, "global_step": 309111, "epoch": 3724} {"train_loss": -25.555755615234375, "global_step": 309112, "epoch": 3724} {"train_loss": -25.096887588500977, "global_step": 309113, "epoch": 3724} {"train_loss": -25.490522384643555, "global_step": 309114, "epoch": 3724} {"train_loss": -25.67344093322754, "global_step": 309115, "epoch": 3724} {"train_loss": -25.346820831298828, "global_step": 309116, "epoch": 3724} {"train_loss": -25.307077407836914, "global_step": 309117, "epoch": 3724} {"train_loss": -25.852811813354492, "global_step": 309118, "epoch": 3724} {"train_loss": -25.927356719970703, "global_step": 309119, "epoch": 3724} {"train_loss": -25.403478622436523, "global_step": 309120, "epoch": 3724} {"train_loss": -25.9351806640625, "global_step": 309121, "epoch": 3724} {"train_loss": -25.636627197265625, "global_step": 309122, "epoch": 3724} {"train_loss": -25.470640182495117, "global_step": 309123, "epoch": 3724} {"train_loss": -26.040014266967773, "global_step": 309124, "epoch": 3724} {"train_loss": -25.777069091796875, "global_step": 309125, "epoch": 3724} {"train_loss": -25.797815322875977, "global_step": 309126, "epoch": 3724} {"train_loss": -25.60555076599121, "global_step": 309127, "epoch": 3724} {"train_loss": -25.758895874023438, "global_step": 309128, "epoch": 3724} {"train_loss": -25.682697296142578, "global_step": 309129, "epoch": 3724} {"train_loss": -25.969635009765625, "global_step": 309130, "epoch": 3724} {"train_loss": -26.182580947875977, "global_step": 309131, "epoch": 3724} {"train_loss": -25.982492446899414, "global_step": 309132, "epoch": 3724} {"train_loss": -25.355772018432617, "global_step": 309133, "epoch": 3724} {"train_loss": -25.84577751159668, "global_step": 309134, "epoch": 3724} {"train_loss": -25.825525283813477, "global_step": 309135, "epoch": 3724} {"train_loss": -25.798070907592773, "global_step": 309136, "epoch": 3724} {"train_loss": -25.85009765625, "global_step": 309137, "epoch": 3724} {"train_loss": -25.98516273498535, "global_step": 309138, "epoch": 3724} {"train_loss": -25.796350479125977, "global_step": 309139, "epoch": 3724} {"train_loss": -25.480051040649414, "global_step": 309140, "epoch": 3724} {"train_loss": -25.645368576049805, "global_step": 309141, "epoch": 3724} {"train_loss": -24.831783294677734, "global_step": 309142, "epoch": 3724} {"train_loss": -25.2123966217041, "global_step": 309143, "epoch": 3724} {"train_loss": -25.158761978149414, "global_step": 309144, "epoch": 3724} {"train_loss": -25.556678771972656, "global_step": 309145, "epoch": 3724} {"train_loss": -25.971811294555664, "global_step": 309146, "epoch": 3724} {"train_loss": -25.859222412109375, "global_step": 309147, "epoch": 3724} {"train_loss": -25.781696319580078, "global_step": 309148, "epoch": 3724} {"train_loss": -25.759937286376953, "global_step": 309149, "epoch": 3724} {"train_loss": -25.727087020874023, "global_step": 309150, "epoch": 3724} {"train_loss": -25.71280288696289, "global_step": 309151, "epoch": 3724} {"train_loss": -25.53193473815918, "global_step": 309152, "epoch": 3724} {"train_loss": -25.6041259765625, "global_step": 309153, "epoch": 3724} {"train_loss": -25.722869873046875, "global_step": 309154, "epoch": 3724} {"train_loss": -26.187641143798828, "global_step": 309155, "epoch": 3724} {"train_loss": -25.784107208251953, "global_step": 309156, "epoch": 3724} {"train_loss": -25.629446029663086, "global_step": 309157, "epoch": 3724} {"train_loss": -25.755157470703125, "global_step": 309158, "epoch": 3724} {"train_loss": -25.73396110534668, "global_step": 309159, "epoch": 3724} {"train_loss": -25.705493927001953, "global_step": 309160, "epoch": 3724} {"train_loss": -25.689016342163086, "global_step": 309161, "epoch": 3724} {"train_loss": -26.181915283203125, "global_step": 309162, "epoch": 3724} {"train_loss": -25.718103408813477, "global_step": 309163, "epoch": 3724} {"train_loss": -25.776538848876953, "global_step": 309164, "epoch": 3724} {"train_loss": -25.56690788269043, "global_step": 309165, "epoch": 3724} {"train_loss": -26.1470947265625, "global_step": 309166, "epoch": 3724} {"train_loss": -25.794097900390625, "global_step": 309167, "epoch": 3724} {"train_loss": -25.45560073852539, "global_step": 309168, "epoch": 3724} {"train_loss": -25.659265518188477, "global_step": 309169, "epoch": 3724} {"train_loss": -25.670644760131836, "global_step": 309170, "epoch": 3724} {"train_loss": -25.956327438354492, "global_step": 309171, "epoch": 3724} {"train_loss": -25.728199005126953, "global_step": 309172, "epoch": 3724} {"train_loss": -26.23578453063965, "global_step": 309173, "epoch": 3724} {"train_loss": -25.59314943796181, "global_step": 309174, "epoch": 3724, "val_loss": 7154166.0} {"train_loss": -25.192052841186523, "global_step": 309175, "epoch": 3725} {"train_loss": -25.219907760620117, "global_step": 309176, "epoch": 3725} {"train_loss": -25.063220977783203, "global_step": 309177, "epoch": 3725} {"train_loss": -25.329225540161133, "global_step": 309178, "epoch": 3725} {"train_loss": -25.34037208557129, "global_step": 309179, "epoch": 3725} {"train_loss": -25.245161056518555, "global_step": 309180, "epoch": 3725} {"train_loss": -25.61126136779785, "global_step": 309181, "epoch": 3725} {"train_loss": -25.19573402404785, "global_step": 309182, "epoch": 3725} {"train_loss": -25.2396297454834, "global_step": 309183, "epoch": 3725} {"train_loss": -25.13170051574707, "global_step": 309184, "epoch": 3725} {"train_loss": -25.450702667236328, "global_step": 309185, "epoch": 3725} {"train_loss": -25.799909591674805, "global_step": 309186, "epoch": 3725} {"train_loss": -25.08782386779785, "global_step": 309187, "epoch": 3725} {"train_loss": -25.842138290405273, "global_step": 309188, "epoch": 3725} {"train_loss": -24.954538345336914, "global_step": 309189, "epoch": 3725} {"train_loss": -25.432130813598633, "global_step": 309190, "epoch": 3725} {"train_loss": -25.3583927154541, "global_step": 309191, "epoch": 3725} {"train_loss": -25.7846622467041, "global_step": 309192, "epoch": 3725} {"train_loss": -25.4871826171875, "global_step": 309193, "epoch": 3725} {"train_loss": -25.534183502197266, "global_step": 309194, "epoch": 3725} {"train_loss": -25.304845809936523, "global_step": 309195, "epoch": 3725} {"train_loss": -25.19486427307129, "global_step": 309196, "epoch": 3725} {"train_loss": -25.806379318237305, "global_step": 309197, "epoch": 3725} {"train_loss": -25.621885299682617, "global_step": 309198, "epoch": 3725} {"train_loss": -25.430028915405273, "global_step": 309199, "epoch": 3725} {"train_loss": -25.6125545501709, "global_step": 309200, "epoch": 3725} {"train_loss": -25.489669799804688, "global_step": 309201, "epoch": 3725} {"train_loss": -25.903417587280273, "global_step": 309202, "epoch": 3725} {"train_loss": -25.715713500976562, "global_step": 309203, "epoch": 3725} {"train_loss": -25.27621078491211, "global_step": 309204, "epoch": 3725} {"train_loss": -25.727664947509766, "global_step": 309205, "epoch": 3725} {"train_loss": -25.479934692382812, "global_step": 309206, "epoch": 3725} {"train_loss": -25.420591354370117, "global_step": 309207, "epoch": 3725} {"train_loss": -25.060651779174805, "global_step": 309208, "epoch": 3725} {"train_loss": -25.8090877532959, "global_step": 309209, "epoch": 3725} {"train_loss": -25.449243545532227, "global_step": 309210, "epoch": 3725} {"train_loss": -25.9918212890625, "global_step": 309211, "epoch": 3725} {"train_loss": -25.499738693237305, "global_step": 309212, "epoch": 3725} {"train_loss": -25.995946884155273, "global_step": 309213, "epoch": 3725} {"train_loss": -26.021142959594727, "global_step": 309214, "epoch": 3725} {"train_loss": -25.648160934448242, "global_step": 309215, "epoch": 3725} {"train_loss": -25.7292537689209, "global_step": 309216, "epoch": 3725} {"train_loss": -25.3454647064209, "global_step": 309217, "epoch": 3725} {"train_loss": -25.876245498657227, "global_step": 309218, "epoch": 3725} {"train_loss": -25.976850509643555, "global_step": 309219, "epoch": 3725} {"train_loss": -25.89991569519043, "global_step": 309220, "epoch": 3725} {"train_loss": -25.643339157104492, "global_step": 309221, "epoch": 3725} {"train_loss": -25.792749404907227, "global_step": 309222, "epoch": 3725} {"train_loss": -26.166250228881836, "global_step": 309223, "epoch": 3725} {"train_loss": -26.057987213134766, "global_step": 309224, "epoch": 3725} {"train_loss": -25.9984073638916, "global_step": 309225, "epoch": 3725} {"train_loss": -25.745458602905273, "global_step": 309226, "epoch": 3725} {"train_loss": -25.840229034423828, "global_step": 309227, "epoch": 3725} {"train_loss": -25.586240768432617, "global_step": 309228, "epoch": 3725} {"train_loss": -26.10003089904785, "global_step": 309229, "epoch": 3725} {"train_loss": -25.752674102783203, "global_step": 309230, "epoch": 3725} {"train_loss": -26.158496856689453, "global_step": 309231, "epoch": 3725} {"train_loss": -26.10255241394043, "global_step": 309232, "epoch": 3725} {"train_loss": -25.985898971557617, "global_step": 309233, "epoch": 3725} {"train_loss": -26.276418685913086, "global_step": 309234, "epoch": 3725} {"train_loss": -26.231603622436523, "global_step": 309235, "epoch": 3725} {"train_loss": -25.806446075439453, "global_step": 309236, "epoch": 3725} {"train_loss": -25.618619918823242, "global_step": 309237, "epoch": 3725} {"train_loss": -26.352466583251953, "global_step": 309238, "epoch": 3725} {"train_loss": -25.7557373046875, "global_step": 309239, "epoch": 3725} {"train_loss": -25.784666061401367, "global_step": 309240, "epoch": 3725} {"train_loss": -25.764850616455078, "global_step": 309241, "epoch": 3725} {"train_loss": -25.629531860351562, "global_step": 309242, "epoch": 3725} {"train_loss": -25.581567764282227, "global_step": 309243, "epoch": 3725} {"train_loss": -25.28939437866211, "global_step": 309244, "epoch": 3725} {"train_loss": -25.29567527770996, "global_step": 309245, "epoch": 3725} {"train_loss": -25.34958267211914, "global_step": 309246, "epoch": 3725} {"train_loss": -26.160078048706055, "global_step": 309247, "epoch": 3725} {"train_loss": -25.762008666992188, "global_step": 309248, "epoch": 3725} {"train_loss": -25.420888900756836, "global_step": 309249, "epoch": 3725} {"train_loss": -26.061552047729492, "global_step": 309250, "epoch": 3725} {"train_loss": -25.73211669921875, "global_step": 309251, "epoch": 3725} {"train_loss": -25.709081649780273, "global_step": 309252, "epoch": 3725} {"train_loss": -25.44663429260254, "global_step": 309253, "epoch": 3725} {"train_loss": -25.464750289916992, "global_step": 309254, "epoch": 3725} {"train_loss": -25.652359008789062, "global_step": 309255, "epoch": 3725} {"train_loss": -25.800352096557617, "global_step": 309256, "epoch": 3725} {"train_loss": -25.650869921029333, "global_step": 309257, "epoch": 3725, "val_loss": 7337676.5} {"train_loss": -25.377731323242188, "global_step": 309258, "epoch": 3726} {"train_loss": -24.749441146850586, "global_step": 309259, "epoch": 3726} {"train_loss": -25.249998092651367, "global_step": 309260, "epoch": 3726} {"train_loss": -25.062047958374023, "global_step": 309261, "epoch": 3726} {"train_loss": -24.866165161132812, "global_step": 309262, "epoch": 3726} {"train_loss": -25.21063804626465, "global_step": 309263, "epoch": 3726} {"train_loss": -25.355249404907227, "global_step": 309264, "epoch": 3726} {"train_loss": -25.580108642578125, "global_step": 309265, "epoch": 3726} {"train_loss": -25.273080825805664, "global_step": 309266, "epoch": 3726} {"train_loss": -25.50666618347168, "global_step": 309267, "epoch": 3726} {"train_loss": -25.24458122253418, "global_step": 309268, "epoch": 3726} {"train_loss": -24.7631893157959, "global_step": 309269, "epoch": 3726} {"train_loss": -25.66131591796875, "global_step": 309270, "epoch": 3726} {"train_loss": -25.466875076293945, "global_step": 309271, "epoch": 3726} {"train_loss": -25.595266342163086, "global_step": 309272, "epoch": 3726} {"train_loss": -25.281892776489258, "global_step": 309273, "epoch": 3726} {"train_loss": -25.7423095703125, "global_step": 309274, "epoch": 3726} {"train_loss": -25.45261573791504, "global_step": 309275, "epoch": 3726} {"train_loss": -25.394453048706055, "global_step": 309276, "epoch": 3726} {"train_loss": -25.56304931640625, "global_step": 309277, "epoch": 3726} {"train_loss": -25.92185401916504, "global_step": 309278, "epoch": 3726} {"train_loss": -25.423105239868164, "global_step": 309279, "epoch": 3726} {"train_loss": -25.81418228149414, "global_step": 309280, "epoch": 3726} {"train_loss": -25.20384407043457, "global_step": 309281, "epoch": 3726} {"train_loss": -25.61090087890625, "global_step": 309282, "epoch": 3726} {"train_loss": -25.68701171875, "global_step": 309283, "epoch": 3726} {"train_loss": -25.59775161743164, "global_step": 309284, "epoch": 3726} {"train_loss": -25.495378494262695, "global_step": 309285, "epoch": 3726} {"train_loss": -25.380271911621094, "global_step": 309286, "epoch": 3726} {"train_loss": -25.75811767578125, "global_step": 309287, "epoch": 3726} {"train_loss": -25.862775802612305, "global_step": 309288, "epoch": 3726} {"train_loss": -25.69843101501465, "global_step": 309289, "epoch": 3726} {"train_loss": -25.73517417907715, "global_step": 309290, "epoch": 3726} {"train_loss": -25.7439022064209, "global_step": 309291, "epoch": 3726} {"train_loss": -26.056623458862305, "global_step": 309292, "epoch": 3726} {"train_loss": -26.014368057250977, "global_step": 309293, "epoch": 3726} {"train_loss": -26.163183212280273, "global_step": 309294, "epoch": 3726} {"train_loss": -26.345205307006836, "global_step": 309295, "epoch": 3726} {"train_loss": -25.71564292907715, "global_step": 309296, "epoch": 3726} {"train_loss": -25.925079345703125, "global_step": 309297, "epoch": 3726} {"train_loss": -25.92522621154785, "global_step": 309298, "epoch": 3726} {"train_loss": -25.75809669494629, "global_step": 309299, "epoch": 3726} {"train_loss": -26.1015625, "global_step": 309300, "epoch": 3726} {"train_loss": -25.856170654296875, "global_step": 309301, "epoch": 3726} {"train_loss": -25.98577880859375, "global_step": 309302, "epoch": 3726} {"train_loss": -25.8625545501709, "global_step": 309303, "epoch": 3726} {"train_loss": -25.828536987304688, "global_step": 309304, "epoch": 3726} {"train_loss": -26.067224502563477, "global_step": 309305, "epoch": 3726} {"train_loss": -25.8371639251709, "global_step": 309306, "epoch": 3726} {"train_loss": -25.788984298706055, "global_step": 309307, "epoch": 3726} {"train_loss": -25.632726669311523, "global_step": 309308, "epoch": 3726} {"train_loss": -26.052331924438477, "global_step": 309309, "epoch": 3726} {"train_loss": -26.008350372314453, "global_step": 309310, "epoch": 3726} {"train_loss": -26.054235458374023, "global_step": 309311, "epoch": 3726} {"train_loss": -25.784717559814453, "global_step": 309312, "epoch": 3726} {"train_loss": -25.736581802368164, "global_step": 309313, "epoch": 3726} {"train_loss": -25.836475372314453, "global_step": 309314, "epoch": 3726} {"train_loss": -25.628223419189453, "global_step": 309315, "epoch": 3726} {"train_loss": -25.173540115356445, "global_step": 309316, "epoch": 3726} {"train_loss": -25.59604835510254, "global_step": 309317, "epoch": 3726} {"train_loss": -25.477676391601562, "global_step": 309318, "epoch": 3726} {"train_loss": -25.8923282623291, "global_step": 309319, "epoch": 3726} {"train_loss": -25.4477481842041, "global_step": 309320, "epoch": 3726} {"train_loss": -25.173913955688477, "global_step": 309321, "epoch": 3726} {"train_loss": -25.466760635375977, "global_step": 309322, "epoch": 3726} {"train_loss": -25.5819091796875, "global_step": 309323, "epoch": 3726} {"train_loss": -25.606494903564453, "global_step": 309324, "epoch": 3726} {"train_loss": -25.5543270111084, "global_step": 309325, "epoch": 3726} {"train_loss": -25.56337547302246, "global_step": 309326, "epoch": 3726} {"train_loss": -25.59609031677246, "global_step": 309327, "epoch": 3726} {"train_loss": -25.606494903564453, "global_step": 309328, "epoch": 3726} {"train_loss": -25.68744468688965, "global_step": 309329, "epoch": 3726} {"train_loss": -25.592275619506836, "global_step": 309330, "epoch": 3726} {"train_loss": -25.872358322143555, "global_step": 309331, "epoch": 3726} {"train_loss": -25.712177276611328, "global_step": 309332, "epoch": 3726} {"train_loss": -25.902036666870117, "global_step": 309333, "epoch": 3726} {"train_loss": -26.198781967163086, "global_step": 309334, "epoch": 3726} {"train_loss": -26.060806274414062, "global_step": 309335, "epoch": 3726} {"train_loss": -25.830480575561523, "global_step": 309336, "epoch": 3726} {"train_loss": -25.925647735595703, "global_step": 309337, "epoch": 3726} {"train_loss": -25.885892868041992, "global_step": 309338, "epoch": 3726} {"train_loss": -25.693994522094727, "global_step": 309339, "epoch": 3726} {"train_loss": -25.656647486859057, "global_step": 309340, "epoch": 3726, "val_loss": 7218824.0} {"train_loss": -25.040456771850586, "global_step": 309341, "epoch": 3727} {"train_loss": -25.4752140045166, "global_step": 309342, "epoch": 3727} {"train_loss": -25.56876564025879, "global_step": 309343, "epoch": 3727} {"train_loss": -24.969486236572266, "global_step": 309344, "epoch": 3727} {"train_loss": -24.88831901550293, "global_step": 309345, "epoch": 3727} {"train_loss": -25.272401809692383, "global_step": 309346, "epoch": 3727} {"train_loss": -24.931692123413086, "global_step": 309347, "epoch": 3727} {"train_loss": -25.636320114135742, "global_step": 309348, "epoch": 3727} {"train_loss": -25.00165367126465, "global_step": 309349, "epoch": 3727} {"train_loss": -25.80177116394043, "global_step": 309350, "epoch": 3727} {"train_loss": -25.152969360351562, "global_step": 309351, "epoch": 3727} {"train_loss": -25.5643367767334, "global_step": 309352, "epoch": 3727} {"train_loss": -25.137683868408203, "global_step": 309353, "epoch": 3727} {"train_loss": -25.697656631469727, "global_step": 309354, "epoch": 3727} {"train_loss": -25.59912109375, "global_step": 309355, "epoch": 3727} {"train_loss": -25.255077362060547, "global_step": 309356, "epoch": 3727} {"train_loss": -25.45352554321289, "global_step": 309357, "epoch": 3727} {"train_loss": -25.096439361572266, "global_step": 309358, "epoch": 3727} {"train_loss": -25.549413681030273, "global_step": 309359, "epoch": 3727} {"train_loss": -25.505399703979492, "global_step": 309360, "epoch": 3727} {"train_loss": -25.069272994995117, "global_step": 309361, "epoch": 3727} {"train_loss": -25.557910919189453, "global_step": 309362, "epoch": 3727} {"train_loss": -25.52390480041504, "global_step": 309363, "epoch": 3727} {"train_loss": -25.305700302124023, "global_step": 309364, "epoch": 3727} {"train_loss": -25.778919219970703, "global_step": 309365, "epoch": 3727} {"train_loss": -25.7864990234375, "global_step": 309366, "epoch": 3727} {"train_loss": -25.73282241821289, "global_step": 309367, "epoch": 3727} {"train_loss": -25.53023338317871, "global_step": 309368, "epoch": 3727} {"train_loss": -25.326242446899414, "global_step": 309369, "epoch": 3727} {"train_loss": -25.653112411499023, "global_step": 309370, "epoch": 3727} {"train_loss": -25.602222442626953, "global_step": 309371, "epoch": 3727} {"train_loss": -25.850690841674805, "global_step": 309372, "epoch": 3727} {"train_loss": -25.612470626831055, "global_step": 309373, "epoch": 3727} {"train_loss": -25.60150146484375, "global_step": 309374, "epoch": 3727} {"train_loss": -25.839313507080078, "global_step": 309375, "epoch": 3727} {"train_loss": -26.0779972076416, "global_step": 309376, "epoch": 3727} {"train_loss": -25.629077911376953, "global_step": 309377, "epoch": 3727} {"train_loss": -25.605056762695312, "global_step": 309378, "epoch": 3727} {"train_loss": -25.475566864013672, "global_step": 309379, "epoch": 3727} {"train_loss": -25.705732345581055, "global_step": 309380, "epoch": 3727} {"train_loss": -26.05266761779785, "global_step": 309381, "epoch": 3727} {"train_loss": -25.450986862182617, "global_step": 309382, "epoch": 3727} {"train_loss": -25.325368881225586, "global_step": 309383, "epoch": 3727} {"train_loss": -25.532155990600586, "global_step": 309384, "epoch": 3727} {"train_loss": -25.810972213745117, "global_step": 309385, "epoch": 3727} {"train_loss": -25.427339553833008, "global_step": 309386, "epoch": 3727} {"train_loss": -25.293888092041016, "global_step": 309387, "epoch": 3727} {"train_loss": -25.47090721130371, "global_step": 309388, "epoch": 3727} {"train_loss": -25.8160457611084, "global_step": 309389, "epoch": 3727} {"train_loss": -25.689640045166016, "global_step": 309390, "epoch": 3727} {"train_loss": -25.088716506958008, "global_step": 309391, "epoch": 3727} {"train_loss": -25.615249633789062, "global_step": 309392, "epoch": 3727} {"train_loss": -25.30940055847168, "global_step": 309393, "epoch": 3727} {"train_loss": -25.64655113220215, "global_step": 309394, "epoch": 3727} {"train_loss": -25.742658615112305, "global_step": 309395, "epoch": 3727} {"train_loss": -25.693805694580078, "global_step": 309396, "epoch": 3727} {"train_loss": -25.8436279296875, "global_step": 309397, "epoch": 3727} {"train_loss": -26.132923126220703, "global_step": 309398, "epoch": 3727} {"train_loss": -25.245849609375, "global_step": 309399, "epoch": 3727} {"train_loss": -25.45745849609375, "global_step": 309400, "epoch": 3727} {"train_loss": -25.350400924682617, "global_step": 309401, "epoch": 3727} {"train_loss": -25.323530197143555, "global_step": 309402, "epoch": 3727} {"train_loss": -25.735517501831055, "global_step": 309403, "epoch": 3727} {"train_loss": -25.4984188079834, "global_step": 309404, "epoch": 3727} {"train_loss": -25.491300582885742, "global_step": 309405, "epoch": 3727} {"train_loss": -25.882568359375, "global_step": 309406, "epoch": 3727} {"train_loss": -25.67486572265625, "global_step": 309407, "epoch": 3727} {"train_loss": -25.503276824951172, "global_step": 309408, "epoch": 3727} {"train_loss": -25.5639705657959, "global_step": 309409, "epoch": 3727} {"train_loss": -26.011930465698242, "global_step": 309410, "epoch": 3727} {"train_loss": -25.393896102905273, "global_step": 309411, "epoch": 3727} {"train_loss": -25.713077545166016, "global_step": 309412, "epoch": 3727} {"train_loss": -25.992101669311523, "global_step": 309413, "epoch": 3727} {"train_loss": -25.696258544921875, "global_step": 309414, "epoch": 3727} {"train_loss": -25.9492130279541, "global_step": 309415, "epoch": 3727} {"train_loss": -25.621082305908203, "global_step": 309416, "epoch": 3727} {"train_loss": -25.76873207092285, "global_step": 309417, "epoch": 3727} {"train_loss": -25.91571044921875, "global_step": 309418, "epoch": 3727} {"train_loss": -25.973718643188477, "global_step": 309419, "epoch": 3727} {"train_loss": -26.0438175201416, "global_step": 309420, "epoch": 3727} {"train_loss": -25.481428146362305, "global_step": 309421, "epoch": 3727} {"train_loss": -25.86603355407715, "global_step": 309422, "epoch": 3727} {"train_loss": -25.569329549031085, "global_step": 309423, "epoch": 3727, "val_loss": 7235421.0} {"train_loss": -25.027257919311523, "global_step": 309424, "epoch": 3728} {"train_loss": -25.615753173828125, "global_step": 309425, "epoch": 3728} {"train_loss": -25.0777530670166, "global_step": 309426, "epoch": 3728} {"train_loss": -25.079381942749023, "global_step": 309427, "epoch": 3728} {"train_loss": -25.15888786315918, "global_step": 309428, "epoch": 3728} {"train_loss": -25.374719619750977, "global_step": 309429, "epoch": 3728} {"train_loss": -25.54413414001465, "global_step": 309430, "epoch": 3728} {"train_loss": -25.186092376708984, "global_step": 309431, "epoch": 3728} {"train_loss": -25.443357467651367, "global_step": 309432, "epoch": 3728} {"train_loss": -24.67061424255371, "global_step": 309433, "epoch": 3728} {"train_loss": -25.544979095458984, "global_step": 309434, "epoch": 3728} {"train_loss": -25.17872428894043, "global_step": 309435, "epoch": 3728} {"train_loss": -25.13523292541504, "global_step": 309436, "epoch": 3728} {"train_loss": -25.347658157348633, "global_step": 309437, "epoch": 3728} {"train_loss": -25.569747924804688, "global_step": 309438, "epoch": 3728} {"train_loss": -25.48762321472168, "global_step": 309439, "epoch": 3728} {"train_loss": -25.295591354370117, "global_step": 309440, "epoch": 3728} {"train_loss": -25.554113388061523, "global_step": 309441, "epoch": 3728} {"train_loss": -25.68402671813965, "global_step": 309442, "epoch": 3728} {"train_loss": -25.685041427612305, "global_step": 309443, "epoch": 3728} {"train_loss": -25.498050689697266, "global_step": 309444, "epoch": 3728} {"train_loss": -25.835590362548828, "global_step": 309445, "epoch": 3728} {"train_loss": -25.957502365112305, "global_step": 309446, "epoch": 3728} {"train_loss": -26.135684967041016, "global_step": 309447, "epoch": 3728} {"train_loss": -25.296613693237305, "global_step": 309448, "epoch": 3728} {"train_loss": -25.391775131225586, "global_step": 309449, "epoch": 3728} {"train_loss": -25.68436050415039, "global_step": 309450, "epoch": 3728} {"train_loss": -25.8801326751709, "global_step": 309451, "epoch": 3728} {"train_loss": -25.597143173217773, "global_step": 309452, "epoch": 3728} {"train_loss": -25.912519454956055, "global_step": 309453, "epoch": 3728} {"train_loss": -25.78114128112793, "global_step": 309454, "epoch": 3728} {"train_loss": -25.892683029174805, "global_step": 309455, "epoch": 3728} {"train_loss": -25.604629516601562, "global_step": 309456, "epoch": 3728} {"train_loss": -25.668920516967773, "global_step": 309457, "epoch": 3728} {"train_loss": -25.93397331237793, "global_step": 309458, "epoch": 3728} {"train_loss": -25.984073638916016, "global_step": 309459, "epoch": 3728} {"train_loss": -25.890790939331055, "global_step": 309460, "epoch": 3728} {"train_loss": -26.014434814453125, "global_step": 309461, "epoch": 3728} {"train_loss": -25.938663482666016, "global_step": 309462, "epoch": 3728} {"train_loss": -25.50214958190918, "global_step": 309463, "epoch": 3728} {"train_loss": -25.8770694732666, "global_step": 309464, "epoch": 3728} {"train_loss": -25.915205001831055, "global_step": 309465, "epoch": 3728} {"train_loss": -25.68716812133789, "global_step": 309466, "epoch": 3728} {"train_loss": -25.809843063354492, "global_step": 309467, "epoch": 3728} {"train_loss": -25.758392333984375, "global_step": 309468, "epoch": 3728} {"train_loss": -25.713550567626953, "global_step": 309469, "epoch": 3728} {"train_loss": -25.839771270751953, "global_step": 309470, "epoch": 3728} {"train_loss": -25.444110870361328, "global_step": 309471, "epoch": 3728} {"train_loss": -25.920825958251953, "global_step": 309472, "epoch": 3728} {"train_loss": -25.966650009155273, "global_step": 309473, "epoch": 3728} {"train_loss": -25.666532516479492, "global_step": 309474, "epoch": 3728} {"train_loss": -26.26934242248535, "global_step": 309475, "epoch": 3728} {"train_loss": -26.1519718170166, "global_step": 309476, "epoch": 3728} {"train_loss": -26.234973907470703, "global_step": 309477, "epoch": 3728} {"train_loss": -25.89625358581543, "global_step": 309478, "epoch": 3728} {"train_loss": -25.532739639282227, "global_step": 309479, "epoch": 3728} {"train_loss": -25.60693359375, "global_step": 309480, "epoch": 3728} {"train_loss": -25.0579833984375, "global_step": 309481, "epoch": 3728} {"train_loss": -24.393604278564453, "global_step": 309482, "epoch": 3728} {"train_loss": -24.54034996032715, "global_step": 309483, "epoch": 3728} {"train_loss": -25.571279525756836, "global_step": 309484, "epoch": 3728} {"train_loss": -25.082138061523438, "global_step": 309485, "epoch": 3728} {"train_loss": -24.521984100341797, "global_step": 309486, "epoch": 3728} {"train_loss": -25.643402099609375, "global_step": 309487, "epoch": 3728} {"train_loss": -24.873214721679688, "global_step": 309488, "epoch": 3728} {"train_loss": -25.113563537597656, "global_step": 309489, "epoch": 3728} {"train_loss": -25.50942039489746, "global_step": 309490, "epoch": 3728} {"train_loss": -25.46636962890625, "global_step": 309491, "epoch": 3728} {"train_loss": -25.33272361755371, "global_step": 309492, "epoch": 3728} {"train_loss": -25.442169189453125, "global_step": 309493, "epoch": 3728} {"train_loss": -25.710615158081055, "global_step": 309494, "epoch": 3728} {"train_loss": -25.36525535583496, "global_step": 309495, "epoch": 3728} {"train_loss": -25.488325119018555, "global_step": 309496, "epoch": 3728} {"train_loss": -25.56068992614746, "global_step": 309497, "epoch": 3728} {"train_loss": -25.74586296081543, "global_step": 309498, "epoch": 3728} {"train_loss": -25.750280380249023, "global_step": 309499, "epoch": 3728} {"train_loss": -25.487897872924805, "global_step": 309500, "epoch": 3728} {"train_loss": -25.504013061523438, "global_step": 309501, "epoch": 3728} {"train_loss": -25.607160568237305, "global_step": 309502, "epoch": 3728} {"train_loss": -25.25785255432129, "global_step": 309503, "epoch": 3728} {"train_loss": -25.38521385192871, "global_step": 309504, "epoch": 3728} {"train_loss": -25.80043601989746, "global_step": 309505, "epoch": 3728} {"train_loss": -25.559454171054334, "global_step": 309506, "epoch": 3728, "val_loss": 7242265.5} {"train_loss": -25.644601821899414, "global_step": 309507, "epoch": 3729} {"train_loss": -25.665313720703125, "global_step": 309508, "epoch": 3729} {"train_loss": -25.36174964904785, "global_step": 309509, "epoch": 3729} {"train_loss": -25.391475677490234, "global_step": 309510, "epoch": 3729} {"train_loss": -25.233280181884766, "global_step": 309511, "epoch": 3729} {"train_loss": -25.4887752532959, "global_step": 309512, "epoch": 3729} {"train_loss": -25.36880874633789, "global_step": 309513, "epoch": 3729} {"train_loss": -25.68426513671875, "global_step": 309514, "epoch": 3729} {"train_loss": -25.539348602294922, "global_step": 309515, "epoch": 3729} {"train_loss": -25.757232666015625, "global_step": 309516, "epoch": 3729} {"train_loss": -25.366140365600586, "global_step": 309517, "epoch": 3729} {"train_loss": -25.931293487548828, "global_step": 309518, "epoch": 3729} {"train_loss": -25.541950225830078, "global_step": 309519, "epoch": 3729} {"train_loss": -25.662445068359375, "global_step": 309520, "epoch": 3729} {"train_loss": -25.48395347595215, "global_step": 309521, "epoch": 3729} {"train_loss": -25.333114624023438, "global_step": 309522, "epoch": 3729} {"train_loss": -25.612201690673828, "global_step": 309523, "epoch": 3729} {"train_loss": -25.729196548461914, "global_step": 309524, "epoch": 3729} {"train_loss": -25.706212997436523, "global_step": 309525, "epoch": 3729} {"train_loss": -25.502330780029297, "global_step": 309526, "epoch": 3729} {"train_loss": -25.363006591796875, "global_step": 309527, "epoch": 3729} {"train_loss": -26.0234317779541, "global_step": 309528, "epoch": 3729} {"train_loss": -25.46115493774414, "global_step": 309529, "epoch": 3729} {"train_loss": -26.077747344970703, "global_step": 309530, "epoch": 3729} {"train_loss": -25.355337142944336, "global_step": 309531, "epoch": 3729} {"train_loss": -25.52461814880371, "global_step": 309532, "epoch": 3729} {"train_loss": -26.024206161499023, "global_step": 309533, "epoch": 3729} {"train_loss": -25.77065086364746, "global_step": 309534, "epoch": 3729} {"train_loss": -25.560688018798828, "global_step": 309535, "epoch": 3729} {"train_loss": -25.759496688842773, "global_step": 309536, "epoch": 3729} {"train_loss": -25.6403751373291, "global_step": 309537, "epoch": 3729} {"train_loss": -25.936559677124023, "global_step": 309538, "epoch": 3729} {"train_loss": -25.57575798034668, "global_step": 309539, "epoch": 3729} {"train_loss": -25.63376808166504, "global_step": 309540, "epoch": 3729} {"train_loss": -25.902694702148438, "global_step": 309541, "epoch": 3729} {"train_loss": -25.79237174987793, "global_step": 309542, "epoch": 3729} {"train_loss": -25.248226165771484, "global_step": 309543, "epoch": 3729} {"train_loss": -25.57379722595215, "global_step": 309544, "epoch": 3729} {"train_loss": -25.597026824951172, "global_step": 309545, "epoch": 3729} {"train_loss": -25.895307540893555, "global_step": 309546, "epoch": 3729} {"train_loss": -25.956729888916016, "global_step": 309547, "epoch": 3729} {"train_loss": -25.76806640625, "global_step": 309548, "epoch": 3729} {"train_loss": -25.78510093688965, "global_step": 309549, "epoch": 3729} {"train_loss": -26.01087760925293, "global_step": 309550, "epoch": 3729} {"train_loss": -25.87045669555664, "global_step": 309551, "epoch": 3729} {"train_loss": -25.6213321685791, "global_step": 309552, "epoch": 3729} {"train_loss": -25.963037490844727, "global_step": 309553, "epoch": 3729} {"train_loss": -26.1357364654541, "global_step": 309554, "epoch": 3729} {"train_loss": -25.702911376953125, "global_step": 309555, "epoch": 3729} {"train_loss": -26.29583168029785, "global_step": 309556, "epoch": 3729} {"train_loss": -25.771961212158203, "global_step": 309557, "epoch": 3729} {"train_loss": -26.044193267822266, "global_step": 309558, "epoch": 3729} {"train_loss": -26.22418785095215, "global_step": 309559, "epoch": 3729} {"train_loss": -25.261877059936523, "global_step": 309560, "epoch": 3729} {"train_loss": -25.56892204284668, "global_step": 309561, "epoch": 3729} {"train_loss": -25.596240997314453, "global_step": 309562, "epoch": 3729} {"train_loss": -25.512964248657227, "global_step": 309563, "epoch": 3729} {"train_loss": -25.96961784362793, "global_step": 309564, "epoch": 3729} {"train_loss": -25.623693466186523, "global_step": 309565, "epoch": 3729} {"train_loss": -25.679136276245117, "global_step": 309566, "epoch": 3729} {"train_loss": -25.637868881225586, "global_step": 309567, "epoch": 3729} {"train_loss": -25.43667221069336, "global_step": 309568, "epoch": 3729} {"train_loss": -25.663602828979492, "global_step": 309569, "epoch": 3729} {"train_loss": -25.731678009033203, "global_step": 309570, "epoch": 3729} {"train_loss": -26.01214599609375, "global_step": 309571, "epoch": 3729} {"train_loss": -25.753164291381836, "global_step": 309572, "epoch": 3729} {"train_loss": -25.751996994018555, "global_step": 309573, "epoch": 3729} {"train_loss": -25.666284561157227, "global_step": 309574, "epoch": 3729} {"train_loss": -25.850461959838867, "global_step": 309575, "epoch": 3729} {"train_loss": -25.76275634765625, "global_step": 309576, "epoch": 3729} {"train_loss": -25.8337345123291, "global_step": 309577, "epoch": 3729} {"train_loss": -25.76173210144043, "global_step": 309578, "epoch": 3729} {"train_loss": -25.891021728515625, "global_step": 309579, "epoch": 3729} {"train_loss": -25.574905395507812, "global_step": 309580, "epoch": 3729} {"train_loss": -25.992517471313477, "global_step": 309581, "epoch": 3729} {"train_loss": -26.344409942626953, "global_step": 309582, "epoch": 3729} {"train_loss": -25.7773494720459, "global_step": 309583, "epoch": 3729} {"train_loss": -26.093774795532227, "global_step": 309584, "epoch": 3729} {"train_loss": -25.444110870361328, "global_step": 309585, "epoch": 3729} {"train_loss": -25.876571655273438, "global_step": 309586, "epoch": 3729} {"train_loss": -25.779159545898438, "global_step": 309587, "epoch": 3729} {"train_loss": -25.812915802001953, "global_step": 309588, "epoch": 3729} {"train_loss": -25.725566335471278, "global_step": 309589, "epoch": 3729, "val_loss": 7202031.0} {"train_loss": -25.171573638916016, "global_step": 309590, "epoch": 3730} {"train_loss": -24.582483291625977, "global_step": 309591, "epoch": 3730} {"train_loss": -25.400876998901367, "global_step": 309592, "epoch": 3730} {"train_loss": -24.827590942382812, "global_step": 309593, "epoch": 3730} {"train_loss": -25.368053436279297, "global_step": 309594, "epoch": 3730} {"train_loss": -25.036514282226562, "global_step": 309595, "epoch": 3730} {"train_loss": -24.875226974487305, "global_step": 309596, "epoch": 3730} {"train_loss": -25.290067672729492, "global_step": 309597, "epoch": 3730} {"train_loss": -25.152896881103516, "global_step": 309598, "epoch": 3730} {"train_loss": -25.229246139526367, "global_step": 309599, "epoch": 3730} {"train_loss": -25.210159301757812, "global_step": 309600, "epoch": 3730} {"train_loss": -25.371469497680664, "global_step": 309601, "epoch": 3730} {"train_loss": -25.375158309936523, "global_step": 309602, "epoch": 3730} {"train_loss": -25.6877498626709, "global_step": 309603, "epoch": 3730} {"train_loss": -25.30293846130371, "global_step": 309604, "epoch": 3730} {"train_loss": -25.412595748901367, "global_step": 309605, "epoch": 3730} {"train_loss": -25.10171890258789, "global_step": 309606, "epoch": 3730} {"train_loss": -25.686059951782227, "global_step": 309607, "epoch": 3730} {"train_loss": -25.508033752441406, "global_step": 309608, "epoch": 3730} {"train_loss": -25.4420108795166, "global_step": 309609, "epoch": 3730} {"train_loss": -25.78177261352539, "global_step": 309610, "epoch": 3730} {"train_loss": -25.653493881225586, "global_step": 309611, "epoch": 3730} {"train_loss": -25.514127731323242, "global_step": 309612, "epoch": 3730} {"train_loss": -25.600393295288086, "global_step": 309613, "epoch": 3730} {"train_loss": -25.335723876953125, "global_step": 309614, "epoch": 3730} {"train_loss": -25.607467651367188, "global_step": 309615, "epoch": 3730} {"train_loss": -25.810184478759766, "global_step": 309616, "epoch": 3730} {"train_loss": -25.86322021484375, "global_step": 309617, "epoch": 3730} {"train_loss": -25.6401309967041, "global_step": 309618, "epoch": 3730} {"train_loss": -25.857080459594727, "global_step": 309619, "epoch": 3730} {"train_loss": -25.461265563964844, "global_step": 309620, "epoch": 3730} {"train_loss": -25.99090576171875, "global_step": 309621, "epoch": 3730} {"train_loss": -26.044116973876953, "global_step": 309622, "epoch": 3730} {"train_loss": -25.94080924987793, "global_step": 309623, "epoch": 3730} {"train_loss": -25.186120986938477, "global_step": 309624, "epoch": 3730} {"train_loss": -25.94891929626465, "global_step": 309625, "epoch": 3730} {"train_loss": -26.079160690307617, "global_step": 309626, "epoch": 3730} {"train_loss": -25.749893188476562, "global_step": 309627, "epoch": 3730} {"train_loss": -25.90448570251465, "global_step": 309628, "epoch": 3730} {"train_loss": -25.696613311767578, "global_step": 309629, "epoch": 3730} {"train_loss": -25.67496681213379, "global_step": 309630, "epoch": 3730} {"train_loss": -25.75868797302246, "global_step": 309631, "epoch": 3730} {"train_loss": -25.72296714782715, "global_step": 309632, "epoch": 3730} {"train_loss": -25.68717384338379, "global_step": 309633, "epoch": 3730} {"train_loss": -25.85172462463379, "global_step": 309634, "epoch": 3730} {"train_loss": -25.979032516479492, "global_step": 309635, "epoch": 3730} {"train_loss": -25.67716407775879, "global_step": 309636, "epoch": 3730} {"train_loss": -25.556949615478516, "global_step": 309637, "epoch": 3730} {"train_loss": -26.09695816040039, "global_step": 309638, "epoch": 3730} {"train_loss": -26.282602310180664, "global_step": 309639, "epoch": 3730} {"train_loss": -25.268695831298828, "global_step": 309640, "epoch": 3730} {"train_loss": -25.308698654174805, "global_step": 309641, "epoch": 3730} {"train_loss": -25.42726707458496, "global_step": 309642, "epoch": 3730} {"train_loss": -25.584684371948242, "global_step": 309643, "epoch": 3730} {"train_loss": -25.244417190551758, "global_step": 309644, "epoch": 3730} {"train_loss": -25.28030776977539, "global_step": 309645, "epoch": 3730} {"train_loss": -25.75934410095215, "global_step": 309646, "epoch": 3730} {"train_loss": -25.57012939453125, "global_step": 309647, "epoch": 3730} {"train_loss": -25.558908462524414, "global_step": 309648, "epoch": 3730} {"train_loss": -25.688888549804688, "global_step": 309649, "epoch": 3730} {"train_loss": -25.69135093688965, "global_step": 309650, "epoch": 3730} {"train_loss": -26.051267623901367, "global_step": 309651, "epoch": 3730} {"train_loss": -25.663358688354492, "global_step": 309652, "epoch": 3730} {"train_loss": -25.608322143554688, "global_step": 309653, "epoch": 3730} {"train_loss": -25.842004776000977, "global_step": 309654, "epoch": 3730} {"train_loss": -25.76564598083496, "global_step": 309655, "epoch": 3730} {"train_loss": -25.659887313842773, "global_step": 309656, "epoch": 3730} {"train_loss": -25.580102920532227, "global_step": 309657, "epoch": 3730} {"train_loss": -25.63408851623535, "global_step": 309658, "epoch": 3730} {"train_loss": -25.785720825195312, "global_step": 309659, "epoch": 3730} {"train_loss": -25.804946899414062, "global_step": 309660, "epoch": 3730} {"train_loss": -25.974210739135742, "global_step": 309661, "epoch": 3730} {"train_loss": -25.744953155517578, "global_step": 309662, "epoch": 3730} {"train_loss": -25.8080997467041, "global_step": 309663, "epoch": 3730} {"train_loss": -26.056854248046875, "global_step": 309664, "epoch": 3730} {"train_loss": -25.86907958984375, "global_step": 309665, "epoch": 3730} {"train_loss": -25.956090927124023, "global_step": 309666, "epoch": 3730} {"train_loss": -25.747665405273438, "global_step": 309667, "epoch": 3730} {"train_loss": -25.732410430908203, "global_step": 309668, "epoch": 3730} {"train_loss": -25.77567481994629, "global_step": 309669, "epoch": 3730} {"train_loss": -25.8242244720459, "global_step": 309670, "epoch": 3730} {"train_loss": -25.691303253173828, "global_step": 309671, "epoch": 3730} {"train_loss": -25.605336913143297, "global_step": 309672, "epoch": 3730, "val_loss": 7209433.0} {"train_loss": -25.342269897460938, "global_step": 309673, "epoch": 3731} {"train_loss": -25.21700096130371, "global_step": 309674, "epoch": 3731} {"train_loss": -25.651620864868164, "global_step": 309675, "epoch": 3731} {"train_loss": -25.257429122924805, "global_step": 309676, "epoch": 3731} {"train_loss": -25.49649429321289, "global_step": 309677, "epoch": 3731} {"train_loss": -25.16400718688965, "global_step": 309678, "epoch": 3731} {"train_loss": -25.1234188079834, "global_step": 309679, "epoch": 3731} {"train_loss": -25.45611572265625, "global_step": 309680, "epoch": 3731} {"train_loss": -25.205190658569336, "global_step": 309681, "epoch": 3731} {"train_loss": -25.498441696166992, "global_step": 309682, "epoch": 3731} {"train_loss": -25.044376373291016, "global_step": 309683, "epoch": 3731} {"train_loss": -25.577306747436523, "global_step": 309684, "epoch": 3731} {"train_loss": -25.828372955322266, "global_step": 309685, "epoch": 3731} {"train_loss": -25.51676368713379, "global_step": 309686, "epoch": 3731} {"train_loss": -25.356754302978516, "global_step": 309687, "epoch": 3731} {"train_loss": -25.60613441467285, "global_step": 309688, "epoch": 3731} {"train_loss": -25.66655921936035, "global_step": 309689, "epoch": 3731} {"train_loss": -25.50864601135254, "global_step": 309690, "epoch": 3731} {"train_loss": -25.55447769165039, "global_step": 309691, "epoch": 3731} {"train_loss": -25.28779411315918, "global_step": 309692, "epoch": 3731} {"train_loss": -25.820444107055664, "global_step": 309693, "epoch": 3731} {"train_loss": -25.84454345703125, "global_step": 309694, "epoch": 3731} {"train_loss": -25.570703506469727, "global_step": 309695, "epoch": 3731} {"train_loss": -25.734771728515625, "global_step": 309696, "epoch": 3731} {"train_loss": -25.88848304748535, "global_step": 309697, "epoch": 3731} {"train_loss": -25.43140411376953, "global_step": 309698, "epoch": 3731} {"train_loss": -25.995935440063477, "global_step": 309699, "epoch": 3731} {"train_loss": -25.756118774414062, "global_step": 309700, "epoch": 3731} {"train_loss": -25.736276626586914, "global_step": 309701, "epoch": 3731} {"train_loss": -26.06477928161621, "global_step": 309702, "epoch": 3731} {"train_loss": -25.837024688720703, "global_step": 309703, "epoch": 3731} {"train_loss": -26.183088302612305, "global_step": 309704, "epoch": 3731} {"train_loss": -25.733362197875977, "global_step": 309705, "epoch": 3731} {"train_loss": -25.824934005737305, "global_step": 309706, "epoch": 3731} {"train_loss": -25.80817222595215, "global_step": 309707, "epoch": 3731} {"train_loss": -25.965656280517578, "global_step": 309708, "epoch": 3731} {"train_loss": -25.96829605102539, "global_step": 309709, "epoch": 3731} {"train_loss": -25.838348388671875, "global_step": 309710, "epoch": 3731} {"train_loss": -26.09639549255371, "global_step": 309711, "epoch": 3731} {"train_loss": -25.722919464111328, "global_step": 309712, "epoch": 3731} {"train_loss": -25.8554744720459, "global_step": 309713, "epoch": 3731} {"train_loss": -25.85365867614746, "global_step": 309714, "epoch": 3731} {"train_loss": -25.741317749023438, "global_step": 309715, "epoch": 3731} {"train_loss": -25.14832878112793, "global_step": 309716, "epoch": 3731} {"train_loss": -25.87070655822754, "global_step": 309717, "epoch": 3731} {"train_loss": -25.48373794555664, "global_step": 309718, "epoch": 3731} {"train_loss": -25.4939022064209, "global_step": 309719, "epoch": 3731} {"train_loss": -25.812097549438477, "global_step": 309720, "epoch": 3731} {"train_loss": -25.73774528503418, "global_step": 309721, "epoch": 3731} {"train_loss": -25.68830680847168, "global_step": 309722, "epoch": 3731} {"train_loss": -25.533666610717773, "global_step": 309723, "epoch": 3731} {"train_loss": -25.75481605529785, "global_step": 309724, "epoch": 3731} {"train_loss": -25.864032745361328, "global_step": 309725, "epoch": 3731} {"train_loss": -25.651960372924805, "global_step": 309726, "epoch": 3731} {"train_loss": -25.4872989654541, "global_step": 309727, "epoch": 3731} {"train_loss": -25.797651290893555, "global_step": 309728, "epoch": 3731} {"train_loss": -26.127355575561523, "global_step": 309729, "epoch": 3731} {"train_loss": -25.33619499206543, "global_step": 309730, "epoch": 3731} {"train_loss": -25.26039695739746, "global_step": 309731, "epoch": 3731} {"train_loss": -25.65595817565918, "global_step": 309732, "epoch": 3731} {"train_loss": -25.71502685546875, "global_step": 309733, "epoch": 3731} {"train_loss": -25.515634536743164, "global_step": 309734, "epoch": 3731} {"train_loss": -25.633533477783203, "global_step": 309735, "epoch": 3731} {"train_loss": -25.444717407226562, "global_step": 309736, "epoch": 3731} {"train_loss": -25.76629066467285, "global_step": 309737, "epoch": 3731} {"train_loss": -25.765869140625, "global_step": 309738, "epoch": 3731} {"train_loss": -24.75429344177246, "global_step": 309739, "epoch": 3731} {"train_loss": -25.44137191772461, "global_step": 309740, "epoch": 3731} {"train_loss": -25.245738983154297, "global_step": 309741, "epoch": 3731} {"train_loss": -25.36342430114746, "global_step": 309742, "epoch": 3731} {"train_loss": -25.896717071533203, "global_step": 309743, "epoch": 3731} {"train_loss": -25.48952865600586, "global_step": 309744, "epoch": 3731} {"train_loss": -25.724945068359375, "global_step": 309745, "epoch": 3731} {"train_loss": -25.3446102142334, "global_step": 309746, "epoch": 3731} {"train_loss": -25.782140731811523, "global_step": 309747, "epoch": 3731} {"train_loss": -25.990345001220703, "global_step": 309748, "epoch": 3731} {"train_loss": -25.66603660583496, "global_step": 309749, "epoch": 3731} {"train_loss": -25.55767822265625, "global_step": 309750, "epoch": 3731} {"train_loss": -26.056594848632812, "global_step": 309751, "epoch": 3731} {"train_loss": -25.52650260925293, "global_step": 309752, "epoch": 3731} {"train_loss": -25.754928588867188, "global_step": 309753, "epoch": 3731} {"train_loss": -26.0272159576416, "global_step": 309754, "epoch": 3731} {"train_loss": -25.61855054188924, "global_step": 309755, "epoch": 3731, "val_loss": 7178507.0} {"train_loss": -25.611902236938477, "global_step": 309756, "epoch": 3732} {"train_loss": -25.552518844604492, "global_step": 309757, "epoch": 3732} {"train_loss": -25.490032196044922, "global_step": 309758, "epoch": 3732} {"train_loss": -25.708724975585938, "global_step": 309759, "epoch": 3732} {"train_loss": -25.816064834594727, "global_step": 309760, "epoch": 3732} {"train_loss": -25.656599044799805, "global_step": 309761, "epoch": 3732} {"train_loss": -25.671894073486328, "global_step": 309762, "epoch": 3732} {"train_loss": -25.39536476135254, "global_step": 309763, "epoch": 3732} {"train_loss": -25.925113677978516, "global_step": 309764, "epoch": 3732} {"train_loss": -25.38575553894043, "global_step": 309765, "epoch": 3732} {"train_loss": -25.73836326599121, "global_step": 309766, "epoch": 3732} {"train_loss": -25.897314071655273, "global_step": 309767, "epoch": 3732} {"train_loss": -25.60418701171875, "global_step": 309768, "epoch": 3732} {"train_loss": -25.69051170349121, "global_step": 309769, "epoch": 3732} {"train_loss": -26.146020889282227, "global_step": 309770, "epoch": 3732} {"train_loss": -26.360998153686523, "global_step": 309771, "epoch": 3732} {"train_loss": -25.475528717041016, "global_step": 309772, "epoch": 3732} {"train_loss": -25.977697372436523, "global_step": 309773, "epoch": 3732} {"train_loss": -25.837858200073242, "global_step": 309774, "epoch": 3732} {"train_loss": -25.892297744750977, "global_step": 309775, "epoch": 3732} {"train_loss": -25.3157901763916, "global_step": 309776, "epoch": 3732} {"train_loss": -25.747852325439453, "global_step": 309777, "epoch": 3732} {"train_loss": -25.510921478271484, "global_step": 309778, "epoch": 3732} {"train_loss": -25.808576583862305, "global_step": 309779, "epoch": 3732} {"train_loss": -25.597274780273438, "global_step": 309780, "epoch": 3732} {"train_loss": -25.972227096557617, "global_step": 309781, "epoch": 3732} {"train_loss": -25.6921329498291, "global_step": 309782, "epoch": 3732} {"train_loss": -25.57791519165039, "global_step": 309783, "epoch": 3732} {"train_loss": -25.528501510620117, "global_step": 309784, "epoch": 3732} {"train_loss": -25.56734848022461, "global_step": 309785, "epoch": 3732} {"train_loss": -25.378009796142578, "global_step": 309786, "epoch": 3732} {"train_loss": -25.027053833007812, "global_step": 309787, "epoch": 3732} {"train_loss": -24.828882217407227, "global_step": 309788, "epoch": 3732} {"train_loss": -25.69852066040039, "global_step": 309789, "epoch": 3732} {"train_loss": -25.614171981811523, "global_step": 309790, "epoch": 3732} {"train_loss": -25.537641525268555, "global_step": 309791, "epoch": 3732} {"train_loss": -25.91166114807129, "global_step": 309792, "epoch": 3732} {"train_loss": -26.021087646484375, "global_step": 309793, "epoch": 3732} {"train_loss": -25.798818588256836, "global_step": 309794, "epoch": 3732} {"train_loss": -25.554704666137695, "global_step": 309795, "epoch": 3732} {"train_loss": -25.7564697265625, "global_step": 309796, "epoch": 3732} {"train_loss": -25.736148834228516, "global_step": 309797, "epoch": 3732} {"train_loss": -25.675256729125977, "global_step": 309798, "epoch": 3732} {"train_loss": -25.627887725830078, "global_step": 309799, "epoch": 3732} {"train_loss": -25.656095504760742, "global_step": 309800, "epoch": 3732} {"train_loss": -25.59288215637207, "global_step": 309801, "epoch": 3732} {"train_loss": -25.610828399658203, "global_step": 309802, "epoch": 3732} {"train_loss": -25.807174682617188, "global_step": 309803, "epoch": 3732} {"train_loss": -25.581811904907227, "global_step": 309804, "epoch": 3732} {"train_loss": -26.18366813659668, "global_step": 309805, "epoch": 3732} {"train_loss": -26.103071212768555, "global_step": 309806, "epoch": 3732} {"train_loss": -25.710187911987305, "global_step": 309807, "epoch": 3732} {"train_loss": -25.67097282409668, "global_step": 309808, "epoch": 3732} {"train_loss": -25.824939727783203, "global_step": 309809, "epoch": 3732} {"train_loss": -25.537841796875, "global_step": 309810, "epoch": 3732} {"train_loss": -25.423505783081055, "global_step": 309811, "epoch": 3732} {"train_loss": -26.053268432617188, "global_step": 309812, "epoch": 3732} {"train_loss": -25.78162956237793, "global_step": 309813, "epoch": 3732} {"train_loss": -25.79996109008789, "global_step": 309814, "epoch": 3732} {"train_loss": -25.7730655670166, "global_step": 309815, "epoch": 3732} {"train_loss": -26.0731258392334, "global_step": 309816, "epoch": 3732} {"train_loss": -25.677404403686523, "global_step": 309817, "epoch": 3732} {"train_loss": -25.39351463317871, "global_step": 309818, "epoch": 3732} {"train_loss": -25.939239501953125, "global_step": 309819, "epoch": 3732} {"train_loss": -26.1328125, "global_step": 309820, "epoch": 3732} {"train_loss": -25.4825496673584, "global_step": 309821, "epoch": 3732} {"train_loss": -25.893285751342773, "global_step": 309822, "epoch": 3732} {"train_loss": -26.17632484436035, "global_step": 309823, "epoch": 3732} {"train_loss": -25.409711837768555, "global_step": 309824, "epoch": 3732} {"train_loss": -25.28803253173828, "global_step": 309825, "epoch": 3732} {"train_loss": -25.42765998840332, "global_step": 309826, "epoch": 3732} {"train_loss": -25.988861083984375, "global_step": 309827, "epoch": 3732} {"train_loss": -25.838443756103516, "global_step": 309828, "epoch": 3732} {"train_loss": -25.745141983032227, "global_step": 309829, "epoch": 3732} {"train_loss": -26.004730224609375, "global_step": 309830, "epoch": 3732} {"train_loss": -25.860458374023438, "global_step": 309831, "epoch": 3732} {"train_loss": -25.74616050720215, "global_step": 309832, "epoch": 3732} {"train_loss": -25.784448623657227, "global_step": 309833, "epoch": 3732} {"train_loss": -25.90409278869629, "global_step": 309834, "epoch": 3732} {"train_loss": -25.804351806640625, "global_step": 309835, "epoch": 3732} {"train_loss": -25.742883682250977, "global_step": 309836, "epoch": 3732} {"train_loss": -26.011444091796875, "global_step": 309837, "epoch": 3732} {"train_loss": -25.712464481951244, "global_step": 309838, "epoch": 3732, "val_loss": 7179441.0} {"train_loss": -25.41901206970215, "global_step": 309839, "epoch": 3733} {"train_loss": -25.243215560913086, "global_step": 309840, "epoch": 3733} {"train_loss": -25.086652755737305, "global_step": 309841, "epoch": 3733} {"train_loss": -24.705434799194336, "global_step": 309842, "epoch": 3733} {"train_loss": -24.807483673095703, "global_step": 309843, "epoch": 3733} {"train_loss": -25.333873748779297, "global_step": 309844, "epoch": 3733} {"train_loss": -25.213359832763672, "global_step": 309845, "epoch": 3733} {"train_loss": -25.210241317749023, "global_step": 309846, "epoch": 3733} {"train_loss": -25.16130828857422, "global_step": 309847, "epoch": 3733} {"train_loss": -25.423715591430664, "global_step": 309848, "epoch": 3733} {"train_loss": -25.766864776611328, "global_step": 309849, "epoch": 3733} {"train_loss": -25.081859588623047, "global_step": 309850, "epoch": 3733} {"train_loss": -25.59634780883789, "global_step": 309851, "epoch": 3733} {"train_loss": -25.236127853393555, "global_step": 309852, "epoch": 3733} {"train_loss": -25.651044845581055, "global_step": 309853, "epoch": 3733} {"train_loss": -25.368579864501953, "global_step": 309854, "epoch": 3733} {"train_loss": -25.638132095336914, "global_step": 309855, "epoch": 3733} {"train_loss": -25.522558212280273, "global_step": 309856, "epoch": 3733} {"train_loss": -26.0626277923584, "global_step": 309857, "epoch": 3733} {"train_loss": -25.897140502929688, "global_step": 309858, "epoch": 3733} {"train_loss": -25.511186599731445, "global_step": 309859, "epoch": 3733} {"train_loss": -25.719024658203125, "global_step": 309860, "epoch": 3733} {"train_loss": -25.476688385009766, "global_step": 309861, "epoch": 3733} {"train_loss": -25.608057022094727, "global_step": 309862, "epoch": 3733} {"train_loss": -25.544477462768555, "global_step": 309863, "epoch": 3733} {"train_loss": -25.72881507873535, "global_step": 309864, "epoch": 3733} {"train_loss": -25.457904815673828, "global_step": 309865, "epoch": 3733} {"train_loss": -25.617584228515625, "global_step": 309866, "epoch": 3733} {"train_loss": -25.48931312561035, "global_step": 309867, "epoch": 3733} {"train_loss": -25.61187171936035, "global_step": 309868, "epoch": 3733} {"train_loss": -25.489042282104492, "global_step": 309869, "epoch": 3733} {"train_loss": -25.885007858276367, "global_step": 309870, "epoch": 3733} {"train_loss": -25.86652946472168, "global_step": 309871, "epoch": 3733} {"train_loss": -25.90101432800293, "global_step": 309872, "epoch": 3733} {"train_loss": -25.911115646362305, "global_step": 309873, "epoch": 3733} {"train_loss": -25.593265533447266, "global_step": 309874, "epoch": 3733} {"train_loss": -25.517290115356445, "global_step": 309875, "epoch": 3733} {"train_loss": -25.81080436706543, "global_step": 309876, "epoch": 3733} {"train_loss": -26.14741325378418, "global_step": 309877, "epoch": 3733} {"train_loss": -25.54654884338379, "global_step": 309878, "epoch": 3733} {"train_loss": -25.643756866455078, "global_step": 309879, "epoch": 3733} {"train_loss": -25.840261459350586, "global_step": 309880, "epoch": 3733} {"train_loss": -25.883453369140625, "global_step": 309881, "epoch": 3733} {"train_loss": -25.480224609375, "global_step": 309882, "epoch": 3733} {"train_loss": -25.166706085205078, "global_step": 309883, "epoch": 3733} {"train_loss": -25.700469970703125, "global_step": 309884, "epoch": 3733} {"train_loss": -25.150503158569336, "global_step": 309885, "epoch": 3733} {"train_loss": -25.9495906829834, "global_step": 309886, "epoch": 3733} {"train_loss": -25.523120880126953, "global_step": 309887, "epoch": 3733} {"train_loss": -25.892309188842773, "global_step": 309888, "epoch": 3733} {"train_loss": -25.930688858032227, "global_step": 309889, "epoch": 3733} {"train_loss": -25.954833984375, "global_step": 309890, "epoch": 3733} {"train_loss": -25.835269927978516, "global_step": 309891, "epoch": 3733} {"train_loss": -25.682819366455078, "global_step": 309892, "epoch": 3733} {"train_loss": -25.877119064331055, "global_step": 309893, "epoch": 3733} {"train_loss": -26.0950927734375, "global_step": 309894, "epoch": 3733} {"train_loss": -25.851123809814453, "global_step": 309895, "epoch": 3733} {"train_loss": -26.01667594909668, "global_step": 309896, "epoch": 3733} {"train_loss": -25.687183380126953, "global_step": 309897, "epoch": 3733} {"train_loss": -25.8156681060791, "global_step": 309898, "epoch": 3733} {"train_loss": -25.770843505859375, "global_step": 309899, "epoch": 3733} {"train_loss": -25.84803581237793, "global_step": 309900, "epoch": 3733} {"train_loss": -25.774560928344727, "global_step": 309901, "epoch": 3733} {"train_loss": -25.713668823242188, "global_step": 309902, "epoch": 3733} {"train_loss": -25.88410758972168, "global_step": 309903, "epoch": 3733} {"train_loss": -25.836029052734375, "global_step": 309904, "epoch": 3733} {"train_loss": -25.842853546142578, "global_step": 309905, "epoch": 3733} {"train_loss": -25.43242835998535, "global_step": 309906, "epoch": 3733} {"train_loss": -25.849349975585938, "global_step": 309907, "epoch": 3733} {"train_loss": -25.518198013305664, "global_step": 309908, "epoch": 3733} {"train_loss": -25.6098690032959, "global_step": 309909, "epoch": 3733} {"train_loss": -25.917463302612305, "global_step": 309910, "epoch": 3733} {"train_loss": -25.58119773864746, "global_step": 309911, "epoch": 3733} {"train_loss": -25.653818130493164, "global_step": 309912, "epoch": 3733} {"train_loss": -25.89961051940918, "global_step": 309913, "epoch": 3733} {"train_loss": -25.724353790283203, "global_step": 309914, "epoch": 3733} {"train_loss": -25.83642578125, "global_step": 309915, "epoch": 3733} {"train_loss": -25.603973388671875, "global_step": 309916, "epoch": 3733} {"train_loss": -25.93002700805664, "global_step": 309917, "epoch": 3733} {"train_loss": -25.835681915283203, "global_step": 309918, "epoch": 3733} {"train_loss": -25.989572525024414, "global_step": 309919, "epoch": 3733} {"train_loss": -25.86075782775879, "global_step": 309920, "epoch": 3733} {"train_loss": -25.640209979321583, "global_step": 309921, "epoch": 3733, "val_loss": 7202044.0} {"train_loss": -25.46289825439453, "global_step": 309922, "epoch": 3734} {"train_loss": -25.526058197021484, "global_step": 309923, "epoch": 3734} {"train_loss": -25.613107681274414, "global_step": 309924, "epoch": 3734} {"train_loss": -25.593843460083008, "global_step": 309925, "epoch": 3734} {"train_loss": -25.51095962524414, "global_step": 309926, "epoch": 3734} {"train_loss": -25.8460750579834, "global_step": 309927, "epoch": 3734} {"train_loss": -25.403350830078125, "global_step": 309928, "epoch": 3734} {"train_loss": -25.067996978759766, "global_step": 309929, "epoch": 3734} {"train_loss": -25.723922729492188, "global_step": 309930, "epoch": 3734} {"train_loss": -25.363237380981445, "global_step": 309931, "epoch": 3734} {"train_loss": -25.428518295288086, "global_step": 309932, "epoch": 3734} {"train_loss": -25.46565055847168, "global_step": 309933, "epoch": 3734} {"train_loss": -25.331632614135742, "global_step": 309934, "epoch": 3734} {"train_loss": -25.587308883666992, "global_step": 309935, "epoch": 3734} {"train_loss": -25.753055572509766, "global_step": 309936, "epoch": 3734} {"train_loss": -25.517751693725586, "global_step": 309937, "epoch": 3734} {"train_loss": -25.458433151245117, "global_step": 309938, "epoch": 3734} {"train_loss": -25.5177059173584, "global_step": 309939, "epoch": 3734} {"train_loss": -25.780786514282227, "global_step": 309940, "epoch": 3734} {"train_loss": -25.46750259399414, "global_step": 309941, "epoch": 3734} {"train_loss": -25.313037872314453, "global_step": 309942, "epoch": 3734} {"train_loss": -25.87428092956543, "global_step": 309943, "epoch": 3734} {"train_loss": -25.7965145111084, "global_step": 309944, "epoch": 3734} {"train_loss": -25.632593154907227, "global_step": 309945, "epoch": 3734} {"train_loss": -25.774328231811523, "global_step": 309946, "epoch": 3734} {"train_loss": -26.045740127563477, "global_step": 309947, "epoch": 3734} {"train_loss": -25.703327178955078, "global_step": 309948, "epoch": 3734} {"train_loss": -26.14972496032715, "global_step": 309949, "epoch": 3734} {"train_loss": -25.638635635375977, "global_step": 309950, "epoch": 3734} {"train_loss": -25.852493286132812, "global_step": 309951, "epoch": 3734} {"train_loss": -25.723325729370117, "global_step": 309952, "epoch": 3734} {"train_loss": -25.702533721923828, "global_step": 309953, "epoch": 3734} {"train_loss": -25.785139083862305, "global_step": 309954, "epoch": 3734} {"train_loss": -26.230627059936523, "global_step": 309955, "epoch": 3734} {"train_loss": -25.980329513549805, "global_step": 309956, "epoch": 3734} {"train_loss": -25.637481689453125, "global_step": 309957, "epoch": 3734} {"train_loss": -25.78399085998535, "global_step": 309958, "epoch": 3734} {"train_loss": -25.853296279907227, "global_step": 309959, "epoch": 3734} {"train_loss": -25.790847778320312, "global_step": 309960, "epoch": 3734} {"train_loss": -26.14657974243164, "global_step": 309961, "epoch": 3734} {"train_loss": -25.798429489135742, "global_step": 309962, "epoch": 3734} {"train_loss": -25.58638572692871, "global_step": 309963, "epoch": 3734} {"train_loss": -25.873327255249023, "global_step": 309964, "epoch": 3734} {"train_loss": -25.44927978515625, "global_step": 309965, "epoch": 3734} {"train_loss": -25.821435928344727, "global_step": 309966, "epoch": 3734} {"train_loss": -25.644454956054688, "global_step": 309967, "epoch": 3734} {"train_loss": -25.62308120727539, "global_step": 309968, "epoch": 3734} {"train_loss": -25.73491859436035, "global_step": 309969, "epoch": 3734} {"train_loss": -25.1429500579834, "global_step": 309970, "epoch": 3734} {"train_loss": -25.62184715270996, "global_step": 309971, "epoch": 3734} {"train_loss": -25.967365264892578, "global_step": 309972, "epoch": 3734} {"train_loss": -25.37566566467285, "global_step": 309973, "epoch": 3734} {"train_loss": -25.409910202026367, "global_step": 309974, "epoch": 3734} {"train_loss": -25.64229393005371, "global_step": 309975, "epoch": 3734} {"train_loss": -25.5548038482666, "global_step": 309976, "epoch": 3734} {"train_loss": -25.68324089050293, "global_step": 309977, "epoch": 3734} {"train_loss": -25.405027389526367, "global_step": 309978, "epoch": 3734} {"train_loss": -25.32640838623047, "global_step": 309979, "epoch": 3734} {"train_loss": -25.8059139251709, "global_step": 309980, "epoch": 3734} {"train_loss": -25.39949607849121, "global_step": 309981, "epoch": 3734} {"train_loss": -25.713821411132812, "global_step": 309982, "epoch": 3734} {"train_loss": -25.82024574279785, "global_step": 309983, "epoch": 3734} {"train_loss": -25.43193817138672, "global_step": 309984, "epoch": 3734} {"train_loss": -25.540353775024414, "global_step": 309985, "epoch": 3734} {"train_loss": -25.509510040283203, "global_step": 309986, "epoch": 3734} {"train_loss": -25.536468505859375, "global_step": 309987, "epoch": 3734} {"train_loss": -25.745330810546875, "global_step": 309988, "epoch": 3734} {"train_loss": -25.9292049407959, "global_step": 309989, "epoch": 3734} {"train_loss": -25.72528076171875, "global_step": 309990, "epoch": 3734} {"train_loss": -25.671899795532227, "global_step": 309991, "epoch": 3734} {"train_loss": -25.653024673461914, "global_step": 309992, "epoch": 3734} {"train_loss": -25.463415145874023, "global_step": 309993, "epoch": 3734} {"train_loss": -25.180322647094727, "global_step": 309994, "epoch": 3734} {"train_loss": -25.905200958251953, "global_step": 309995, "epoch": 3734} {"train_loss": -25.48003578186035, "global_step": 309996, "epoch": 3734} {"train_loss": -25.936132431030273, "global_step": 309997, "epoch": 3734} {"train_loss": -25.80425453186035, "global_step": 309998, "epoch": 3734} {"train_loss": -25.922391891479492, "global_step": 309999, "epoch": 3734} {"train_loss": -25.710569381713867, "global_step": 310000, "epoch": 3734} {"train_loss": -26.03360939025879, "global_step": 310001, "epoch": 3734} {"train_loss": -25.624670028686523, "global_step": 310002, "epoch": 3734} {"train_loss": -26.093297958374023, "global_step": 310003, "epoch": 3734} {"train_loss": -25.646946849593196, "global_step": 310004, "epoch": 3734, "val_loss": 7258869.0} {"train_loss": -25.132898330688477, "global_step": 310005, "epoch": 3735} {"train_loss": -24.372900009155273, "global_step": 310006, "epoch": 3735} {"train_loss": -25.0102596282959, "global_step": 310007, "epoch": 3735} {"train_loss": -25.42101287841797, "global_step": 310008, "epoch": 3735} {"train_loss": -24.63405418395996, "global_step": 310009, "epoch": 3735} {"train_loss": -25.034400939941406, "global_step": 310010, "epoch": 3735} {"train_loss": -25.149948120117188, "global_step": 310011, "epoch": 3735} {"train_loss": -25.56169319152832, "global_step": 310012, "epoch": 3735} {"train_loss": -25.55386734008789, "global_step": 310013, "epoch": 3735} {"train_loss": -24.95661735534668, "global_step": 310014, "epoch": 3735} {"train_loss": -25.71931266784668, "global_step": 310015, "epoch": 3735} {"train_loss": -25.107080459594727, "global_step": 310016, "epoch": 3735} {"train_loss": -25.328594207763672, "global_step": 310017, "epoch": 3735} {"train_loss": -25.2385311126709, "global_step": 310018, "epoch": 3735} {"train_loss": -25.592599868774414, "global_step": 310019, "epoch": 3735} {"train_loss": -25.241058349609375, "global_step": 310020, "epoch": 3735} {"train_loss": -25.470195770263672, "global_step": 310021, "epoch": 3735} {"train_loss": -25.435108184814453, "global_step": 310022, "epoch": 3735} {"train_loss": -25.836090087890625, "global_step": 310023, "epoch": 3735} {"train_loss": -25.712873458862305, "global_step": 310024, "epoch": 3735} {"train_loss": -25.455568313598633, "global_step": 310025, "epoch": 3735} {"train_loss": -26.06900405883789, "global_step": 310026, "epoch": 3735} {"train_loss": -25.442829132080078, "global_step": 310027, "epoch": 3735} {"train_loss": -25.42856788635254, "global_step": 310028, "epoch": 3735} {"train_loss": -25.618383407592773, "global_step": 310029, "epoch": 3735} {"train_loss": -25.76710319519043, "global_step": 310030, "epoch": 3735} {"train_loss": -25.56353759765625, "global_step": 310031, "epoch": 3735} {"train_loss": -25.756546020507812, "global_step": 310032, "epoch": 3735} {"train_loss": -25.725534439086914, "global_step": 310033, "epoch": 3735} {"train_loss": -25.739789962768555, "global_step": 310034, "epoch": 3735} {"train_loss": -25.702966690063477, "global_step": 310035, "epoch": 3735} {"train_loss": -25.638471603393555, "global_step": 310036, "epoch": 3735} {"train_loss": -25.7559757232666, "global_step": 310037, "epoch": 3735} {"train_loss": -25.994733810424805, "global_step": 310038, "epoch": 3735} {"train_loss": -25.717987060546875, "global_step": 310039, "epoch": 3735} {"train_loss": -25.519309997558594, "global_step": 310040, "epoch": 3735} {"train_loss": -26.127582550048828, "global_step": 310041, "epoch": 3735} {"train_loss": -26.0039119720459, "global_step": 310042, "epoch": 3735} {"train_loss": -25.645404815673828, "global_step": 310043, "epoch": 3735} {"train_loss": -26.267194747924805, "global_step": 310044, "epoch": 3735} {"train_loss": -25.836706161499023, "global_step": 310045, "epoch": 3735} {"train_loss": -26.040502548217773, "global_step": 310046, "epoch": 3735} {"train_loss": -25.547866821289062, "global_step": 310047, "epoch": 3735} {"train_loss": -25.820043563842773, "global_step": 310048, "epoch": 3735} {"train_loss": -25.928857803344727, "global_step": 310049, "epoch": 3735} {"train_loss": -25.616806030273438, "global_step": 310050, "epoch": 3735} {"train_loss": -25.51181983947754, "global_step": 310051, "epoch": 3735} {"train_loss": -26.157026290893555, "global_step": 310052, "epoch": 3735} {"train_loss": -25.7279052734375, "global_step": 310053, "epoch": 3735} {"train_loss": -25.97027587890625, "global_step": 310054, "epoch": 3735} {"train_loss": -25.59847068786621, "global_step": 310055, "epoch": 3735} {"train_loss": -25.822797775268555, "global_step": 310056, "epoch": 3735} {"train_loss": -25.743799209594727, "global_step": 310057, "epoch": 3735} {"train_loss": -25.680511474609375, "global_step": 310058, "epoch": 3735} {"train_loss": -25.721078872680664, "global_step": 310059, "epoch": 3735} {"train_loss": -25.782699584960938, "global_step": 310060, "epoch": 3735} {"train_loss": -26.03473472595215, "global_step": 310061, "epoch": 3735} {"train_loss": -25.661474227905273, "global_step": 310062, "epoch": 3735} {"train_loss": -25.875280380249023, "global_step": 310063, "epoch": 3735} {"train_loss": -25.63288688659668, "global_step": 310064, "epoch": 3735} {"train_loss": -25.857608795166016, "global_step": 310065, "epoch": 3735} {"train_loss": -25.49995231628418, "global_step": 310066, "epoch": 3735} {"train_loss": -25.758615493774414, "global_step": 310067, "epoch": 3735} {"train_loss": -25.652368545532227, "global_step": 310068, "epoch": 3735} {"train_loss": -25.735177993774414, "global_step": 310069, "epoch": 3735} {"train_loss": -25.791736602783203, "global_step": 310070, "epoch": 3735} {"train_loss": -25.75874137878418, "global_step": 310071, "epoch": 3735} {"train_loss": -26.034902572631836, "global_step": 310072, "epoch": 3735} {"train_loss": -25.66766357421875, "global_step": 310073, "epoch": 3735} {"train_loss": -25.904722213745117, "global_step": 310074, "epoch": 3735} {"train_loss": -25.924863815307617, "global_step": 310075, "epoch": 3735} {"train_loss": -25.667831420898438, "global_step": 310076, "epoch": 3735} {"train_loss": -25.91070556640625, "global_step": 310077, "epoch": 3735} {"train_loss": -25.769689559936523, "global_step": 310078, "epoch": 3735} {"train_loss": -25.98709487915039, "global_step": 310079, "epoch": 3735} {"train_loss": -25.516874313354492, "global_step": 310080, "epoch": 3735} {"train_loss": -25.26575469970703, "global_step": 310081, "epoch": 3735} {"train_loss": -25.512418746948242, "global_step": 310082, "epoch": 3735} {"train_loss": -25.905136108398438, "global_step": 310083, "epoch": 3735} {"train_loss": -25.325571060180664, "global_step": 310084, "epoch": 3735} {"train_loss": -25.5377254486084, "global_step": 310085, "epoch": 3735} {"train_loss": -25.46638298034668, "global_step": 310086, "epoch": 3735} {"train_loss": -25.629159651606916, "global_step": 310087, "epoch": 3735, "val_loss": 7167240.0} {"train_loss": -24.898027420043945, "global_step": 310088, "epoch": 3736} {"train_loss": -25.49163246154785, "global_step": 310089, "epoch": 3736} {"train_loss": -24.949016571044922, "global_step": 310090, "epoch": 3736} {"train_loss": -24.86741065979004, "global_step": 310091, "epoch": 3736} {"train_loss": -25.314096450805664, "global_step": 310092, "epoch": 3736} {"train_loss": -24.88054847717285, "global_step": 310093, "epoch": 3736} {"train_loss": -25.18723487854004, "global_step": 310094, "epoch": 3736} {"train_loss": -25.301084518432617, "global_step": 310095, "epoch": 3736} {"train_loss": -25.01853370666504, "global_step": 310096, "epoch": 3736} {"train_loss": -25.471206665039062, "global_step": 310097, "epoch": 3736} {"train_loss": -25.17842674255371, "global_step": 310098, "epoch": 3736} {"train_loss": -25.467588424682617, "global_step": 310099, "epoch": 3736} {"train_loss": -24.84821128845215, "global_step": 310100, "epoch": 3736} {"train_loss": -25.334692001342773, "global_step": 310101, "epoch": 3736} {"train_loss": -25.33624267578125, "global_step": 310102, "epoch": 3736} {"train_loss": -25.284231185913086, "global_step": 310103, "epoch": 3736} {"train_loss": -25.099720001220703, "global_step": 310104, "epoch": 3736} {"train_loss": -25.39883804321289, "global_step": 310105, "epoch": 3736} {"train_loss": -25.73774528503418, "global_step": 310106, "epoch": 3736} {"train_loss": -25.27933692932129, "global_step": 310107, "epoch": 3736} {"train_loss": -25.591541290283203, "global_step": 310108, "epoch": 3736} {"train_loss": -25.28799819946289, "global_step": 310109, "epoch": 3736} {"train_loss": -25.552953720092773, "global_step": 310110, "epoch": 3736} {"train_loss": -25.638330459594727, "global_step": 310111, "epoch": 3736} {"train_loss": -25.465734481811523, "global_step": 310112, "epoch": 3736} {"train_loss": -25.82485008239746, "global_step": 310113, "epoch": 3736} {"train_loss": -25.68509864807129, "global_step": 310114, "epoch": 3736} {"train_loss": -25.975051879882812, "global_step": 310115, "epoch": 3736} {"train_loss": -25.385608673095703, "global_step": 310116, "epoch": 3736} {"train_loss": -25.494285583496094, "global_step": 310117, "epoch": 3736} {"train_loss": -25.82234001159668, "global_step": 310118, "epoch": 3736} {"train_loss": -25.680145263671875, "global_step": 310119, "epoch": 3736} {"train_loss": -25.440414428710938, "global_step": 310120, "epoch": 3736} {"train_loss": -25.53810691833496, "global_step": 310121, "epoch": 3736} {"train_loss": -25.439912796020508, "global_step": 310122, "epoch": 3736} {"train_loss": -25.181360244750977, "global_step": 310123, "epoch": 3736} {"train_loss": -25.45881462097168, "global_step": 310124, "epoch": 3736} {"train_loss": -25.671056747436523, "global_step": 310125, "epoch": 3736} {"train_loss": -25.429475784301758, "global_step": 310126, "epoch": 3736} {"train_loss": -25.839481353759766, "global_step": 310127, "epoch": 3736} {"train_loss": -25.692157745361328, "global_step": 310128, "epoch": 3736} {"train_loss": -25.57813262939453, "global_step": 310129, "epoch": 3736} {"train_loss": -25.861011505126953, "global_step": 310130, "epoch": 3736} {"train_loss": -25.8169002532959, "global_step": 310131, "epoch": 3736} {"train_loss": -25.8810977935791, "global_step": 310132, "epoch": 3736} {"train_loss": -25.698978424072266, "global_step": 310133, "epoch": 3736} {"train_loss": -25.785049438476562, "global_step": 310134, "epoch": 3736} {"train_loss": -25.91285514831543, "global_step": 310135, "epoch": 3736} {"train_loss": -25.771650314331055, "global_step": 310136, "epoch": 3736} {"train_loss": -26.097415924072266, "global_step": 310137, "epoch": 3736} {"train_loss": -26.016494750976562, "global_step": 310138, "epoch": 3736} {"train_loss": -25.923192977905273, "global_step": 310139, "epoch": 3736} {"train_loss": -26.008609771728516, "global_step": 310140, "epoch": 3736} {"train_loss": -25.793039321899414, "global_step": 310141, "epoch": 3736} {"train_loss": -25.928918838500977, "global_step": 310142, "epoch": 3736} {"train_loss": -25.866254806518555, "global_step": 310143, "epoch": 3736} {"train_loss": -26.168853759765625, "global_step": 310144, "epoch": 3736} {"train_loss": -25.82020378112793, "global_step": 310145, "epoch": 3736} {"train_loss": -26.007619857788086, "global_step": 310146, "epoch": 3736} {"train_loss": -25.884321212768555, "global_step": 310147, "epoch": 3736} {"train_loss": -26.000659942626953, "global_step": 310148, "epoch": 3736} {"train_loss": -25.9827880859375, "global_step": 310149, "epoch": 3736} {"train_loss": -25.79511833190918, "global_step": 310150, "epoch": 3736} {"train_loss": -26.01166343688965, "global_step": 310151, "epoch": 3736} {"train_loss": -25.780780792236328, "global_step": 310152, "epoch": 3736} {"train_loss": -25.605670928955078, "global_step": 310153, "epoch": 3736} {"train_loss": -25.545324325561523, "global_step": 310154, "epoch": 3736} {"train_loss": -25.853910446166992, "global_step": 310155, "epoch": 3736} {"train_loss": -25.636123657226562, "global_step": 310156, "epoch": 3736} {"train_loss": -25.47352409362793, "global_step": 310157, "epoch": 3736} {"train_loss": -26.110143661499023, "global_step": 310158, "epoch": 3736} {"train_loss": -25.490217208862305, "global_step": 310159, "epoch": 3736} {"train_loss": -25.889362335205078, "global_step": 310160, "epoch": 3736} {"train_loss": -25.988794326782227, "global_step": 310161, "epoch": 3736} {"train_loss": -26.0286808013916, "global_step": 310162, "epoch": 3736} {"train_loss": -25.824705123901367, "global_step": 310163, "epoch": 3736} {"train_loss": -26.349842071533203, "global_step": 310164, "epoch": 3736} {"train_loss": -25.742523193359375, "global_step": 310165, "epoch": 3736} {"train_loss": -25.658222198486328, "global_step": 310166, "epoch": 3736} {"train_loss": -25.32675552368164, "global_step": 310167, "epoch": 3736} {"train_loss": -25.60395622253418, "global_step": 310168, "epoch": 3736} {"train_loss": -25.83565330505371, "global_step": 310169, "epoch": 3736} {"train_loss": -25.622451690306146, "global_step": 310170, "epoch": 3736, "val_loss": 7354087.0} {"train_loss": -23.50727653503418, "global_step": 310171, "epoch": 3737} {"train_loss": -24.974241256713867, "global_step": 310172, "epoch": 3737} {"train_loss": -24.327299118041992, "global_step": 310173, "epoch": 3737} {"train_loss": -25.142309188842773, "global_step": 310174, "epoch": 3737} {"train_loss": -25.127788543701172, "global_step": 310175, "epoch": 3737} {"train_loss": -25.561010360717773, "global_step": 310176, "epoch": 3737} {"train_loss": -25.07562255859375, "global_step": 310177, "epoch": 3737} {"train_loss": -25.32866096496582, "global_step": 310178, "epoch": 3737} {"train_loss": -25.28529167175293, "global_step": 310179, "epoch": 3737} {"train_loss": -25.57381248474121, "global_step": 310180, "epoch": 3737} {"train_loss": -25.486526489257812, "global_step": 310181, "epoch": 3737} {"train_loss": -25.48036766052246, "global_step": 310182, "epoch": 3737} {"train_loss": -25.529163360595703, "global_step": 310183, "epoch": 3737} {"train_loss": -25.597105026245117, "global_step": 310184, "epoch": 3737} {"train_loss": -25.701025009155273, "global_step": 310185, "epoch": 3737} {"train_loss": -25.31149673461914, "global_step": 310186, "epoch": 3737} {"train_loss": -25.116891860961914, "global_step": 310187, "epoch": 3737} {"train_loss": -25.472339630126953, "global_step": 310188, "epoch": 3737} {"train_loss": -25.188644409179688, "global_step": 310189, "epoch": 3737} {"train_loss": -25.802261352539062, "global_step": 310190, "epoch": 3737} {"train_loss": -25.78433609008789, "global_step": 310191, "epoch": 3737} {"train_loss": -25.507436752319336, "global_step": 310192, "epoch": 3737} {"train_loss": -25.729358673095703, "global_step": 310193, "epoch": 3737} {"train_loss": -25.928699493408203, "global_step": 310194, "epoch": 3737} {"train_loss": -25.865034103393555, "global_step": 310195, "epoch": 3737} {"train_loss": -25.798913955688477, "global_step": 310196, "epoch": 3737} {"train_loss": -25.766254425048828, "global_step": 310197, "epoch": 3737} {"train_loss": -26.148391723632812, "global_step": 310198, "epoch": 3737} {"train_loss": -25.814777374267578, "global_step": 310199, "epoch": 3737} {"train_loss": -25.75506591796875, "global_step": 310200, "epoch": 3737} {"train_loss": -25.591463088989258, "global_step": 310201, "epoch": 3737} {"train_loss": -25.477615356445312, "global_step": 310202, "epoch": 3737} {"train_loss": -25.580326080322266, "global_step": 310203, "epoch": 3737} {"train_loss": -25.606042861938477, "global_step": 310204, "epoch": 3737} {"train_loss": -25.9010009765625, "global_step": 310205, "epoch": 3737} {"train_loss": -25.96173095703125, "global_step": 310206, "epoch": 3737} {"train_loss": -25.708093643188477, "global_step": 310207, "epoch": 3737} {"train_loss": -25.812681198120117, "global_step": 310208, "epoch": 3737} {"train_loss": -25.638946533203125, "global_step": 310209, "epoch": 3737} {"train_loss": -25.74944496154785, "global_step": 310210, "epoch": 3737} {"train_loss": -25.777862548828125, "global_step": 310211, "epoch": 3737} {"train_loss": -25.959924697875977, "global_step": 310212, "epoch": 3737} {"train_loss": -25.77662467956543, "global_step": 310213, "epoch": 3737} {"train_loss": -25.999744415283203, "global_step": 310214, "epoch": 3737} {"train_loss": -25.596261978149414, "global_step": 310215, "epoch": 3737} {"train_loss": -26.018115997314453, "global_step": 310216, "epoch": 3737} {"train_loss": -25.71192741394043, "global_step": 310217, "epoch": 3737} {"train_loss": -25.830825805664062, "global_step": 310218, "epoch": 3737} {"train_loss": -25.448694229125977, "global_step": 310219, "epoch": 3737} {"train_loss": -25.530132293701172, "global_step": 310220, "epoch": 3737} {"train_loss": -25.33601188659668, "global_step": 310221, "epoch": 3737} {"train_loss": -25.44539451599121, "global_step": 310222, "epoch": 3737} {"train_loss": -25.7779598236084, "global_step": 310223, "epoch": 3737} {"train_loss": -26.0009822845459, "global_step": 310224, "epoch": 3737} {"train_loss": -25.749679565429688, "global_step": 310225, "epoch": 3737} {"train_loss": -25.42185401916504, "global_step": 310226, "epoch": 3737} {"train_loss": -25.381023406982422, "global_step": 310227, "epoch": 3737} {"train_loss": -25.839651107788086, "global_step": 310228, "epoch": 3737} {"train_loss": -25.67830467224121, "global_step": 310229, "epoch": 3737} {"train_loss": -26.00127601623535, "global_step": 310230, "epoch": 3737} {"train_loss": -25.371994018554688, "global_step": 310231, "epoch": 3737} {"train_loss": -25.650968551635742, "global_step": 310232, "epoch": 3737} {"train_loss": -25.54670524597168, "global_step": 310233, "epoch": 3737} {"train_loss": -25.64571189880371, "global_step": 310234, "epoch": 3737} {"train_loss": -25.830759048461914, "global_step": 310235, "epoch": 3737} {"train_loss": -25.467378616333008, "global_step": 310236, "epoch": 3737} {"train_loss": -25.6357479095459, "global_step": 310237, "epoch": 3737} {"train_loss": -26.205163955688477, "global_step": 310238, "epoch": 3737} {"train_loss": -26.001007080078125, "global_step": 310239, "epoch": 3737} {"train_loss": -25.396121978759766, "global_step": 310240, "epoch": 3737} {"train_loss": -25.5703125, "global_step": 310241, "epoch": 3737} {"train_loss": -25.79804801940918, "global_step": 310242, "epoch": 3737} {"train_loss": -25.969335556030273, "global_step": 310243, "epoch": 3737} {"train_loss": -25.7310733795166, "global_step": 310244, "epoch": 3737} {"train_loss": -25.793970108032227, "global_step": 310245, "epoch": 3737} {"train_loss": -25.56241226196289, "global_step": 310246, "epoch": 3737} {"train_loss": -25.712371826171875, "global_step": 310247, "epoch": 3737} {"train_loss": -25.589860916137695, "global_step": 310248, "epoch": 3737} {"train_loss": -25.929401397705078, "global_step": 310249, "epoch": 3737} {"train_loss": -25.746021270751953, "global_step": 310250, "epoch": 3737} {"train_loss": -25.84086036682129, "global_step": 310251, "epoch": 3737} {"train_loss": -25.9880313873291, "global_step": 310252, "epoch": 3737} {"train_loss": -25.620800431952418, "global_step": 310253, "epoch": 3737, "val_loss": 7242772.0} {"train_loss": -26.069578170776367, "global_step": 310254, "epoch": 3738} {"train_loss": -25.68218994140625, "global_step": 310255, "epoch": 3738} {"train_loss": -25.45613670349121, "global_step": 310256, "epoch": 3738} {"train_loss": -25.546483993530273, "global_step": 310257, "epoch": 3738} {"train_loss": -26.125091552734375, "global_step": 310258, "epoch": 3738} {"train_loss": -25.640029907226562, "global_step": 310259, "epoch": 3738} {"train_loss": -25.914854049682617, "global_step": 310260, "epoch": 3738} {"train_loss": -25.404865264892578, "global_step": 310261, "epoch": 3738} {"train_loss": -25.3869686126709, "global_step": 310262, "epoch": 3738} {"train_loss": -25.7209529876709, "global_step": 310263, "epoch": 3738} {"train_loss": -25.394132614135742, "global_step": 310264, "epoch": 3738} {"train_loss": -25.397069931030273, "global_step": 310265, "epoch": 3738} {"train_loss": -25.71931266784668, "global_step": 310266, "epoch": 3738} {"train_loss": -25.74529457092285, "global_step": 310267, "epoch": 3738} {"train_loss": -25.109357833862305, "global_step": 310268, "epoch": 3738} {"train_loss": -25.7176456451416, "global_step": 310269, "epoch": 3738} {"train_loss": -25.473005294799805, "global_step": 310270, "epoch": 3738} {"train_loss": -25.21634864807129, "global_step": 310271, "epoch": 3738} {"train_loss": -25.349367141723633, "global_step": 310272, "epoch": 3738} {"train_loss": -26.09492301940918, "global_step": 310273, "epoch": 3738} {"train_loss": -25.888952255249023, "global_step": 310274, "epoch": 3738} {"train_loss": -25.581174850463867, "global_step": 310275, "epoch": 3738} {"train_loss": -25.682727813720703, "global_step": 310276, "epoch": 3738} {"train_loss": -25.903100967407227, "global_step": 310277, "epoch": 3738} {"train_loss": -25.73969078063965, "global_step": 310278, "epoch": 3738} {"train_loss": -26.00361442565918, "global_step": 310279, "epoch": 3738} {"train_loss": -25.65323829650879, "global_step": 310280, "epoch": 3738} {"train_loss": -25.976058959960938, "global_step": 310281, "epoch": 3738} {"train_loss": -25.992578506469727, "global_step": 310282, "epoch": 3738} {"train_loss": -25.319032669067383, "global_step": 310283, "epoch": 3738} {"train_loss": -25.461965560913086, "global_step": 310284, "epoch": 3738} {"train_loss": -25.731689453125, "global_step": 310285, "epoch": 3738} {"train_loss": -25.754194259643555, "global_step": 310286, "epoch": 3738} {"train_loss": -25.657806396484375, "global_step": 310287, "epoch": 3738} {"train_loss": -25.99555778503418, "global_step": 310288, "epoch": 3738} {"train_loss": -25.92791748046875, "global_step": 310289, "epoch": 3738} {"train_loss": -25.545021057128906, "global_step": 310290, "epoch": 3738} {"train_loss": -25.70759391784668, "global_step": 310291, "epoch": 3738} {"train_loss": -26.088266372680664, "global_step": 310292, "epoch": 3738} {"train_loss": -25.86368179321289, "global_step": 310293, "epoch": 3738} {"train_loss": -26.004425048828125, "global_step": 310294, "epoch": 3738} {"train_loss": -25.940176010131836, "global_step": 310295, "epoch": 3738} {"train_loss": -25.951007843017578, "global_step": 310296, "epoch": 3738} {"train_loss": -25.966272354125977, "global_step": 310297, "epoch": 3738} {"train_loss": -25.719266891479492, "global_step": 310298, "epoch": 3738} {"train_loss": -26.184101104736328, "global_step": 310299, "epoch": 3738} {"train_loss": -25.89031982421875, "global_step": 310300, "epoch": 3738} {"train_loss": -25.707345962524414, "global_step": 310301, "epoch": 3738} {"train_loss": -25.698444366455078, "global_step": 310302, "epoch": 3738} {"train_loss": -25.7674617767334, "global_step": 310303, "epoch": 3738} {"train_loss": -26.086267471313477, "global_step": 310304, "epoch": 3738} {"train_loss": -25.60944175720215, "global_step": 310305, "epoch": 3738} {"train_loss": -25.716577529907227, "global_step": 310306, "epoch": 3738} {"train_loss": -25.803640365600586, "global_step": 310307, "epoch": 3738} {"train_loss": -25.7283935546875, "global_step": 310308, "epoch": 3738} {"train_loss": -25.243574142456055, "global_step": 310309, "epoch": 3738} {"train_loss": -25.47673988342285, "global_step": 310310, "epoch": 3738} {"train_loss": -25.27512550354004, "global_step": 310311, "epoch": 3738} {"train_loss": -25.254114151000977, "global_step": 310312, "epoch": 3738} {"train_loss": -24.902463912963867, "global_step": 310313, "epoch": 3738} {"train_loss": -25.6630802154541, "global_step": 310314, "epoch": 3738} {"train_loss": -25.540908813476562, "global_step": 310315, "epoch": 3738} {"train_loss": -25.153738021850586, "global_step": 310316, "epoch": 3738} {"train_loss": -25.483642578125, "global_step": 310317, "epoch": 3738} {"train_loss": -25.8343563079834, "global_step": 310318, "epoch": 3738} {"train_loss": -25.44178581237793, "global_step": 310319, "epoch": 3738} {"train_loss": -25.8242244720459, "global_step": 310320, "epoch": 3738} {"train_loss": -25.475698471069336, "global_step": 310321, "epoch": 3738} {"train_loss": -25.62747573852539, "global_step": 310322, "epoch": 3738} {"train_loss": -25.648786544799805, "global_step": 310323, "epoch": 3738} {"train_loss": -25.735111236572266, "global_step": 310324, "epoch": 3738} {"train_loss": -25.450403213500977, "global_step": 310325, "epoch": 3738} {"train_loss": -25.916227340698242, "global_step": 310326, "epoch": 3738} {"train_loss": -25.940998077392578, "global_step": 310327, "epoch": 3738} {"train_loss": -26.073047637939453, "global_step": 310328, "epoch": 3738} {"train_loss": -25.536787033081055, "global_step": 310329, "epoch": 3738} {"train_loss": -25.781538009643555, "global_step": 310330, "epoch": 3738} {"train_loss": -25.76410484313965, "global_step": 310331, "epoch": 3738} {"train_loss": -25.767414093017578, "global_step": 310332, "epoch": 3738} {"train_loss": -25.928546905517578, "global_step": 310333, "epoch": 3738} {"train_loss": -25.619665145874023, "global_step": 310334, "epoch": 3738} {"train_loss": -25.844852447509766, "global_step": 310335, "epoch": 3738} {"train_loss": -25.705800987151733, "global_step": 310336, "epoch": 3738, "val_loss": 7222023.0} {"train_loss": -25.51561164855957, "global_step": 310337, "epoch": 3739} {"train_loss": -25.62788200378418, "global_step": 310338, "epoch": 3739} {"train_loss": -25.34717559814453, "global_step": 310339, "epoch": 3739} {"train_loss": -25.5965633392334, "global_step": 310340, "epoch": 3739} {"train_loss": -25.851980209350586, "global_step": 310341, "epoch": 3739} {"train_loss": -25.51300811767578, "global_step": 310342, "epoch": 3739} {"train_loss": -25.7464599609375, "global_step": 310343, "epoch": 3739} {"train_loss": -25.47867774963379, "global_step": 310344, "epoch": 3739} {"train_loss": -25.593677520751953, "global_step": 310345, "epoch": 3739} {"train_loss": -25.6197452545166, "global_step": 310346, "epoch": 3739} {"train_loss": -25.651586532592773, "global_step": 310347, "epoch": 3739} {"train_loss": -25.695453643798828, "global_step": 310348, "epoch": 3739} {"train_loss": -25.90585708618164, "global_step": 310349, "epoch": 3739} {"train_loss": -25.81304931640625, "global_step": 310350, "epoch": 3739} {"train_loss": -25.9261417388916, "global_step": 310351, "epoch": 3739} {"train_loss": -25.566226959228516, "global_step": 310352, "epoch": 3739} {"train_loss": -25.742273330688477, "global_step": 310353, "epoch": 3739} {"train_loss": -26.09771156311035, "global_step": 310354, "epoch": 3739} {"train_loss": -25.747516632080078, "global_step": 310355, "epoch": 3739} {"train_loss": -25.65955924987793, "global_step": 310356, "epoch": 3739} {"train_loss": -25.573455810546875, "global_step": 310357, "epoch": 3739} {"train_loss": -26.160598754882812, "global_step": 310358, "epoch": 3739} {"train_loss": -25.97914695739746, "global_step": 310359, "epoch": 3739} {"train_loss": -25.75614356994629, "global_step": 310360, "epoch": 3739} {"train_loss": -25.618057250976562, "global_step": 310361, "epoch": 3739} {"train_loss": -25.872323989868164, "global_step": 310362, "epoch": 3739} {"train_loss": -25.931671142578125, "global_step": 310363, "epoch": 3739} {"train_loss": -26.12811851501465, "global_step": 310364, "epoch": 3739} {"train_loss": -25.578651428222656, "global_step": 310365, "epoch": 3739} {"train_loss": -25.89141273498535, "global_step": 310366, "epoch": 3739} {"train_loss": -25.634252548217773, "global_step": 310367, "epoch": 3739} {"train_loss": -25.930097579956055, "global_step": 310368, "epoch": 3739} {"train_loss": -26.25225830078125, "global_step": 310369, "epoch": 3739} {"train_loss": -25.7683048248291, "global_step": 310370, "epoch": 3739} {"train_loss": -25.817296981811523, "global_step": 310371, "epoch": 3739} {"train_loss": -25.623004913330078, "global_step": 310372, "epoch": 3739} {"train_loss": -25.5279483795166, "global_step": 310373, "epoch": 3739} {"train_loss": -25.850177764892578, "global_step": 310374, "epoch": 3739} {"train_loss": -26.101171493530273, "global_step": 310375, "epoch": 3739} {"train_loss": -26.060251235961914, "global_step": 310376, "epoch": 3739} {"train_loss": -25.65537452697754, "global_step": 310377, "epoch": 3739} {"train_loss": -25.768285751342773, "global_step": 310378, "epoch": 3739} {"train_loss": -25.6259708404541, "global_step": 310379, "epoch": 3739} {"train_loss": -25.772756576538086, "global_step": 310380, "epoch": 3739} {"train_loss": -25.703229904174805, "global_step": 310381, "epoch": 3739} {"train_loss": -25.49959373474121, "global_step": 310382, "epoch": 3739} {"train_loss": -26.020090103149414, "global_step": 310383, "epoch": 3739} {"train_loss": -25.588836669921875, "global_step": 310384, "epoch": 3739} {"train_loss": -25.421926498413086, "global_step": 310385, "epoch": 3739} {"train_loss": -25.48142433166504, "global_step": 310386, "epoch": 3739} {"train_loss": -25.9681453704834, "global_step": 310387, "epoch": 3739} {"train_loss": -25.55314826965332, "global_step": 310388, "epoch": 3739} {"train_loss": -25.370397567749023, "global_step": 310389, "epoch": 3739} {"train_loss": -25.348674774169922, "global_step": 310390, "epoch": 3739} {"train_loss": -24.991514205932617, "global_step": 310391, "epoch": 3739} {"train_loss": -25.54547691345215, "global_step": 310392, "epoch": 3739} {"train_loss": -25.472835540771484, "global_step": 310393, "epoch": 3739} {"train_loss": -25.55079460144043, "global_step": 310394, "epoch": 3739} {"train_loss": -25.469398498535156, "global_step": 310395, "epoch": 3739} {"train_loss": -25.587114334106445, "global_step": 310396, "epoch": 3739} {"train_loss": -25.753564834594727, "global_step": 310397, "epoch": 3739} {"train_loss": -25.671018600463867, "global_step": 310398, "epoch": 3739} {"train_loss": -25.534711837768555, "global_step": 310399, "epoch": 3739} {"train_loss": -25.791563034057617, "global_step": 310400, "epoch": 3739} {"train_loss": -25.954206466674805, "global_step": 310401, "epoch": 3739} {"train_loss": -26.091583251953125, "global_step": 310402, "epoch": 3739} {"train_loss": -26.08021354675293, "global_step": 310403, "epoch": 3739} {"train_loss": -25.793752670288086, "global_step": 310404, "epoch": 3739} {"train_loss": -25.838836669921875, "global_step": 310405, "epoch": 3739} {"train_loss": -25.557809829711914, "global_step": 310406, "epoch": 3739} {"train_loss": -25.675790786743164, "global_step": 310407, "epoch": 3739} {"train_loss": -26.0063419342041, "global_step": 310408, "epoch": 3739} {"train_loss": -25.794004440307617, "global_step": 310409, "epoch": 3739} {"train_loss": -25.62013053894043, "global_step": 310410, "epoch": 3739} {"train_loss": -25.941925048828125, "global_step": 310411, "epoch": 3739} {"train_loss": -26.06284523010254, "global_step": 310412, "epoch": 3739} {"train_loss": -25.8056640625, "global_step": 310413, "epoch": 3739} {"train_loss": -25.83357810974121, "global_step": 310414, "epoch": 3739} {"train_loss": -26.122602462768555, "global_step": 310415, "epoch": 3739} {"train_loss": -25.879846572875977, "global_step": 310416, "epoch": 3739} {"train_loss": -26.042728424072266, "global_step": 310417, "epoch": 3739} {"train_loss": -25.692276000976562, "global_step": 310418, "epoch": 3739} {"train_loss": -25.743277216532146, "global_step": 310419, "epoch": 3739, "val_loss": 7244913.0} {"train_loss": -25.22029685974121, "global_step": 310420, "epoch": 3740} {"train_loss": -25.063215255737305, "global_step": 310421, "epoch": 3740} {"train_loss": -24.469867706298828, "global_step": 310422, "epoch": 3740} {"train_loss": -25.524621963500977, "global_step": 310423, "epoch": 3740} {"train_loss": -25.5163631439209, "global_step": 310424, "epoch": 3740} {"train_loss": -24.75143051147461, "global_step": 310425, "epoch": 3740} {"train_loss": -25.106225967407227, "global_step": 310426, "epoch": 3740} {"train_loss": -25.39926528930664, "global_step": 310427, "epoch": 3740} {"train_loss": -25.086645126342773, "global_step": 310428, "epoch": 3740} {"train_loss": -25.41579818725586, "global_step": 310429, "epoch": 3740} {"train_loss": -25.4597110748291, "global_step": 310430, "epoch": 3740} {"train_loss": -25.63239097595215, "global_step": 310431, "epoch": 3740} {"train_loss": -25.28663444519043, "global_step": 310432, "epoch": 3740} {"train_loss": -25.987279891967773, "global_step": 310433, "epoch": 3740} {"train_loss": -25.62795066833496, "global_step": 310434, "epoch": 3740} {"train_loss": -25.83205223083496, "global_step": 310435, "epoch": 3740} {"train_loss": -25.578304290771484, "global_step": 310436, "epoch": 3740} {"train_loss": -25.575103759765625, "global_step": 310437, "epoch": 3740} {"train_loss": -25.986438751220703, "global_step": 310438, "epoch": 3740} {"train_loss": -25.526504516601562, "global_step": 310439, "epoch": 3740} {"train_loss": -25.88917350769043, "global_step": 310440, "epoch": 3740} {"train_loss": -25.566837310791016, "global_step": 310441, "epoch": 3740} {"train_loss": -25.772327423095703, "global_step": 310442, "epoch": 3740} {"train_loss": -25.631933212280273, "global_step": 310443, "epoch": 3740} {"train_loss": -25.716093063354492, "global_step": 310444, "epoch": 3740} {"train_loss": -25.52841567993164, "global_step": 310445, "epoch": 3740} {"train_loss": -25.538976669311523, "global_step": 310446, "epoch": 3740} {"train_loss": -25.68899917602539, "global_step": 310447, "epoch": 3740} {"train_loss": -25.411489486694336, "global_step": 310448, "epoch": 3740} {"train_loss": -25.477502822875977, "global_step": 310449, "epoch": 3740} {"train_loss": -25.712570190429688, "global_step": 310450, "epoch": 3740} {"train_loss": -25.314857482910156, "global_step": 310451, "epoch": 3740} {"train_loss": -25.49348258972168, "global_step": 310452, "epoch": 3740} {"train_loss": -26.0091552734375, "global_step": 310453, "epoch": 3740} {"train_loss": -25.89295768737793, "global_step": 310454, "epoch": 3740} {"train_loss": -25.935571670532227, "global_step": 310455, "epoch": 3740} {"train_loss": -25.736230850219727, "global_step": 310456, "epoch": 3740} {"train_loss": -25.705474853515625, "global_step": 310457, "epoch": 3740} {"train_loss": -25.672266006469727, "global_step": 310458, "epoch": 3740} {"train_loss": -25.952932357788086, "global_step": 310459, "epoch": 3740} {"train_loss": -25.493017196655273, "global_step": 310460, "epoch": 3740} {"train_loss": -25.76629638671875, "global_step": 310461, "epoch": 3740} {"train_loss": -25.278921127319336, "global_step": 310462, "epoch": 3740} {"train_loss": -25.89235496520996, "global_step": 310463, "epoch": 3740} {"train_loss": -25.698246002197266, "global_step": 310464, "epoch": 3740} {"train_loss": -25.8665714263916, "global_step": 310465, "epoch": 3740} {"train_loss": -25.96632194519043, "global_step": 310466, "epoch": 3740} {"train_loss": -25.910873413085938, "global_step": 310467, "epoch": 3740} {"train_loss": -25.400548934936523, "global_step": 310468, "epoch": 3740} {"train_loss": -26.049488067626953, "global_step": 310469, "epoch": 3740} {"train_loss": -25.597585678100586, "global_step": 310470, "epoch": 3740} {"train_loss": -25.63315773010254, "global_step": 310471, "epoch": 3740} {"train_loss": -25.54036521911621, "global_step": 310472, "epoch": 3740} {"train_loss": -25.530216217041016, "global_step": 310473, "epoch": 3740} {"train_loss": -25.870595932006836, "global_step": 310474, "epoch": 3740} {"train_loss": -25.553068161010742, "global_step": 310475, "epoch": 3740} {"train_loss": -25.626020431518555, "global_step": 310476, "epoch": 3740} {"train_loss": -26.0140380859375, "global_step": 310477, "epoch": 3740} {"train_loss": -25.938068389892578, "global_step": 310478, "epoch": 3740} {"train_loss": -25.367664337158203, "global_step": 310479, "epoch": 3740} {"train_loss": -25.970266342163086, "global_step": 310480, "epoch": 3740} {"train_loss": -25.47532081604004, "global_step": 310481, "epoch": 3740} {"train_loss": -25.16090965270996, "global_step": 310482, "epoch": 3740} {"train_loss": -25.107444763183594, "global_step": 310483, "epoch": 3740} {"train_loss": -25.578649520874023, "global_step": 310484, "epoch": 3740} {"train_loss": -25.340604782104492, "global_step": 310485, "epoch": 3740} {"train_loss": -25.89264488220215, "global_step": 310486, "epoch": 3740} {"train_loss": -25.448877334594727, "global_step": 310487, "epoch": 3740} {"train_loss": -25.82973289489746, "global_step": 310488, "epoch": 3740} {"train_loss": -25.443693161010742, "global_step": 310489, "epoch": 3740} {"train_loss": -25.809240341186523, "global_step": 310490, "epoch": 3740} {"train_loss": -25.93891716003418, "global_step": 310491, "epoch": 3740} {"train_loss": -25.616851806640625, "global_step": 310492, "epoch": 3740} {"train_loss": -25.596961975097656, "global_step": 310493, "epoch": 3740} {"train_loss": -25.72200584411621, "global_step": 310494, "epoch": 3740} {"train_loss": -25.3873233795166, "global_step": 310495, "epoch": 3740} {"train_loss": -25.579084396362305, "global_step": 310496, "epoch": 3740} {"train_loss": -25.683307647705078, "global_step": 310497, "epoch": 3740} {"train_loss": -25.195796966552734, "global_step": 310498, "epoch": 3740} {"train_loss": -25.661123275756836, "global_step": 310499, "epoch": 3740} {"train_loss": -25.530460357666016, "global_step": 310500, "epoch": 3740} {"train_loss": -25.621002197265625, "global_step": 310501, "epoch": 3740} {"train_loss": -25.5995990569333, "global_step": 310502, "epoch": 3740, "val_loss": 7294171.0} {"train_loss": -25.41391944885254, "global_step": 310503, "epoch": 3741} {"train_loss": -24.62070655822754, "global_step": 310504, "epoch": 3741} {"train_loss": -25.474332809448242, "global_step": 310505, "epoch": 3741} {"train_loss": -24.834148406982422, "global_step": 310506, "epoch": 3741} {"train_loss": -24.826276779174805, "global_step": 310507, "epoch": 3741} {"train_loss": -24.57191276550293, "global_step": 310508, "epoch": 3741} {"train_loss": -24.726490020751953, "global_step": 310509, "epoch": 3741} {"train_loss": -25.255701065063477, "global_step": 310510, "epoch": 3741} {"train_loss": -25.190595626831055, "global_step": 310511, "epoch": 3741} {"train_loss": -25.370357513427734, "global_step": 310512, "epoch": 3741} {"train_loss": -25.702667236328125, "global_step": 310513, "epoch": 3741} {"train_loss": -25.160436630249023, "global_step": 310514, "epoch": 3741} {"train_loss": -25.097293853759766, "global_step": 310515, "epoch": 3741} {"train_loss": -25.01561164855957, "global_step": 310516, "epoch": 3741} {"train_loss": -25.684423446655273, "global_step": 310517, "epoch": 3741} {"train_loss": -25.57354736328125, "global_step": 310518, "epoch": 3741} {"train_loss": -25.3380184173584, "global_step": 310519, "epoch": 3741} {"train_loss": -25.6226863861084, "global_step": 310520, "epoch": 3741} {"train_loss": -26.063329696655273, "global_step": 310521, "epoch": 3741} {"train_loss": -25.10451316833496, "global_step": 310522, "epoch": 3741} {"train_loss": -25.484922409057617, "global_step": 310523, "epoch": 3741} {"train_loss": -25.682905197143555, "global_step": 310524, "epoch": 3741} {"train_loss": -25.404722213745117, "global_step": 310525, "epoch": 3741} {"train_loss": -25.49774742126465, "global_step": 310526, "epoch": 3741} {"train_loss": -25.7578182220459, "global_step": 310527, "epoch": 3741} {"train_loss": -25.635305404663086, "global_step": 310528, "epoch": 3741} {"train_loss": -25.42165184020996, "global_step": 310529, "epoch": 3741} {"train_loss": -25.669458389282227, "global_step": 310530, "epoch": 3741} {"train_loss": -25.50202178955078, "global_step": 310531, "epoch": 3741} {"train_loss": -25.836627960205078, "global_step": 310532, "epoch": 3741} {"train_loss": -25.790740966796875, "global_step": 310533, "epoch": 3741} {"train_loss": -25.685047149658203, "global_step": 310534, "epoch": 3741} {"train_loss": -25.798669815063477, "global_step": 310535, "epoch": 3741} {"train_loss": -26.014184951782227, "global_step": 310536, "epoch": 3741} {"train_loss": -25.451936721801758, "global_step": 310537, "epoch": 3741} {"train_loss": -25.869962692260742, "global_step": 310538, "epoch": 3741} {"train_loss": -25.686246871948242, "global_step": 310539, "epoch": 3741} {"train_loss": -26.05438232421875, "global_step": 310540, "epoch": 3741} {"train_loss": -25.947126388549805, "global_step": 310541, "epoch": 3741} {"train_loss": -25.8618106842041, "global_step": 310542, "epoch": 3741} {"train_loss": -25.631961822509766, "global_step": 310543, "epoch": 3741} {"train_loss": -25.952713012695312, "global_step": 310544, "epoch": 3741} {"train_loss": -25.855276107788086, "global_step": 310545, "epoch": 3741} {"train_loss": -25.689828872680664, "global_step": 310546, "epoch": 3741} {"train_loss": -25.742345809936523, "global_step": 310547, "epoch": 3741} {"train_loss": -26.16337013244629, "global_step": 310548, "epoch": 3741} {"train_loss": -25.618581771850586, "global_step": 310549, "epoch": 3741} {"train_loss": -25.968931198120117, "global_step": 310550, "epoch": 3741} {"train_loss": -25.76637840270996, "global_step": 310551, "epoch": 3741} {"train_loss": -25.605854034423828, "global_step": 310552, "epoch": 3741} {"train_loss": -25.604141235351562, "global_step": 310553, "epoch": 3741} {"train_loss": -25.758991241455078, "global_step": 310554, "epoch": 3741} {"train_loss": -25.667715072631836, "global_step": 310555, "epoch": 3741} {"train_loss": -25.887027740478516, "global_step": 310556, "epoch": 3741} {"train_loss": -25.942214965820312, "global_step": 310557, "epoch": 3741} {"train_loss": -25.910358428955078, "global_step": 310558, "epoch": 3741} {"train_loss": -25.627195358276367, "global_step": 310559, "epoch": 3741} {"train_loss": -25.9880313873291, "global_step": 310560, "epoch": 3741} {"train_loss": -26.01951026916504, "global_step": 310561, "epoch": 3741} {"train_loss": -25.273000717163086, "global_step": 310562, "epoch": 3741} {"train_loss": -25.526304244995117, "global_step": 310563, "epoch": 3741} {"train_loss": -25.6954288482666, "global_step": 310564, "epoch": 3741} {"train_loss": -25.43714714050293, "global_step": 310565, "epoch": 3741} {"train_loss": -25.409841537475586, "global_step": 310566, "epoch": 3741} {"train_loss": -25.515085220336914, "global_step": 310567, "epoch": 3741} {"train_loss": -25.213272094726562, "global_step": 310568, "epoch": 3741} {"train_loss": -25.489871978759766, "global_step": 310569, "epoch": 3741} {"train_loss": -25.802881240844727, "global_step": 310570, "epoch": 3741} {"train_loss": -25.886640548706055, "global_step": 310571, "epoch": 3741} {"train_loss": -25.39110565185547, "global_step": 310572, "epoch": 3741} {"train_loss": -25.62953758239746, "global_step": 310573, "epoch": 3741} {"train_loss": -25.6015567779541, "global_step": 310574, "epoch": 3741} {"train_loss": -25.64765739440918, "global_step": 310575, "epoch": 3741} {"train_loss": -25.856128692626953, "global_step": 310576, "epoch": 3741} {"train_loss": -26.056833267211914, "global_step": 310577, "epoch": 3741} {"train_loss": -25.943700790405273, "global_step": 310578, "epoch": 3741} {"train_loss": -26.065509796142578, "global_step": 310579, "epoch": 3741} {"train_loss": -26.081439971923828, "global_step": 310580, "epoch": 3741} {"train_loss": -25.798559188842773, "global_step": 310581, "epoch": 3741} {"train_loss": -26.351926803588867, "global_step": 310582, "epoch": 3741} {"train_loss": -25.87442398071289, "global_step": 310583, "epoch": 3741} {"train_loss": -25.749805450439453, "global_step": 310584, "epoch": 3741} {"train_loss": -25.617061178368257, "global_step": 310585, "epoch": 3741, "val_loss": 7291391.5} {"train_loss": -25.21546745300293, "global_step": 310586, "epoch": 3742} {"train_loss": -24.924455642700195, "global_step": 310587, "epoch": 3742} {"train_loss": -25.643787384033203, "global_step": 310588, "epoch": 3742} {"train_loss": -25.430713653564453, "global_step": 310589, "epoch": 3742} {"train_loss": -25.263776779174805, "global_step": 310590, "epoch": 3742} {"train_loss": -25.186582565307617, "global_step": 310591, "epoch": 3742} {"train_loss": -25.41031837463379, "global_step": 310592, "epoch": 3742} {"train_loss": -25.389570236206055, "global_step": 310593, "epoch": 3742} {"train_loss": -25.380170822143555, "global_step": 310594, "epoch": 3742} {"train_loss": -24.844303131103516, "global_step": 310595, "epoch": 3742} {"train_loss": -25.391544342041016, "global_step": 310596, "epoch": 3742} {"train_loss": -25.690185546875, "global_step": 310597, "epoch": 3742} {"train_loss": -25.75054931640625, "global_step": 310598, "epoch": 3742} {"train_loss": -25.240177154541016, "global_step": 310599, "epoch": 3742} {"train_loss": -25.407541275024414, "global_step": 310600, "epoch": 3742} {"train_loss": -25.570966720581055, "global_step": 310601, "epoch": 3742} {"train_loss": -25.663105010986328, "global_step": 310602, "epoch": 3742} {"train_loss": -25.728010177612305, "global_step": 310603, "epoch": 3742} {"train_loss": -25.878583908081055, "global_step": 310604, "epoch": 3742} {"train_loss": -25.3750057220459, "global_step": 310605, "epoch": 3742} {"train_loss": -25.8963565826416, "global_step": 310606, "epoch": 3742} {"train_loss": -25.520763397216797, "global_step": 310607, "epoch": 3742} {"train_loss": -25.6630802154541, "global_step": 310608, "epoch": 3742} {"train_loss": -25.91054344177246, "global_step": 310609, "epoch": 3742} {"train_loss": -25.7506103515625, "global_step": 310610, "epoch": 3742} {"train_loss": -25.515958786010742, "global_step": 310611, "epoch": 3742} {"train_loss": -25.90498924255371, "global_step": 310612, "epoch": 3742} {"train_loss": -25.33837890625, "global_step": 310613, "epoch": 3742} {"train_loss": -25.783390045166016, "global_step": 310614, "epoch": 3742} {"train_loss": -25.76471519470215, "global_step": 310615, "epoch": 3742} {"train_loss": -25.824981689453125, "global_step": 310616, "epoch": 3742} {"train_loss": -25.866064071655273, "global_step": 310617, "epoch": 3742} {"train_loss": -26.10440444946289, "global_step": 310618, "epoch": 3742} {"train_loss": -25.942590713500977, "global_step": 310619, "epoch": 3742} {"train_loss": -25.542722702026367, "global_step": 310620, "epoch": 3742} {"train_loss": -26.0648193359375, "global_step": 310621, "epoch": 3742} {"train_loss": -25.913898468017578, "global_step": 310622, "epoch": 3742} {"train_loss": -25.291053771972656, "global_step": 310623, "epoch": 3742} {"train_loss": -25.64850425720215, "global_step": 310624, "epoch": 3742} {"train_loss": -25.6015682220459, "global_step": 310625, "epoch": 3742} {"train_loss": -26.08839225769043, "global_step": 310626, "epoch": 3742} {"train_loss": -25.60719108581543, "global_step": 310627, "epoch": 3742} {"train_loss": -25.807416915893555, "global_step": 310628, "epoch": 3742} {"train_loss": -26.295948028564453, "global_step": 310629, "epoch": 3742} {"train_loss": -26.288129806518555, "global_step": 310630, "epoch": 3742} {"train_loss": -25.661569595336914, "global_step": 310631, "epoch": 3742} {"train_loss": -25.6727352142334, "global_step": 310632, "epoch": 3742} {"train_loss": -25.647708892822266, "global_step": 310633, "epoch": 3742} {"train_loss": -25.616947174072266, "global_step": 310634, "epoch": 3742} {"train_loss": -25.41656494140625, "global_step": 310635, "epoch": 3742} {"train_loss": -25.807403564453125, "global_step": 310636, "epoch": 3742} {"train_loss": -25.963773727416992, "global_step": 310637, "epoch": 3742} {"train_loss": -25.567670822143555, "global_step": 310638, "epoch": 3742} {"train_loss": -25.818090438842773, "global_step": 310639, "epoch": 3742} {"train_loss": -25.80828857421875, "global_step": 310640, "epoch": 3742} {"train_loss": -25.715988159179688, "global_step": 310641, "epoch": 3742} {"train_loss": -26.036901473999023, "global_step": 310642, "epoch": 3742} {"train_loss": -26.051084518432617, "global_step": 310643, "epoch": 3742} {"train_loss": -25.7387638092041, "global_step": 310644, "epoch": 3742} {"train_loss": -25.703784942626953, "global_step": 310645, "epoch": 3742} {"train_loss": -25.45649528503418, "global_step": 310646, "epoch": 3742} {"train_loss": -25.31357192993164, "global_step": 310647, "epoch": 3742} {"train_loss": -25.206069946289062, "global_step": 310648, "epoch": 3742} {"train_loss": -25.75465202331543, "global_step": 310649, "epoch": 3742} {"train_loss": -25.391956329345703, "global_step": 310650, "epoch": 3742} {"train_loss": -25.511747360229492, "global_step": 310651, "epoch": 3742} {"train_loss": -25.659635543823242, "global_step": 310652, "epoch": 3742} {"train_loss": -25.113693237304688, "global_step": 310653, "epoch": 3742} {"train_loss": -25.7076416015625, "global_step": 310654, "epoch": 3742} {"train_loss": -25.104772567749023, "global_step": 310655, "epoch": 3742} {"train_loss": -25.469274520874023, "global_step": 310656, "epoch": 3742} {"train_loss": -25.73630714416504, "global_step": 310657, "epoch": 3742} {"train_loss": -25.601552963256836, "global_step": 310658, "epoch": 3742} {"train_loss": -25.349472045898438, "global_step": 310659, "epoch": 3742} {"train_loss": -25.483474731445312, "global_step": 310660, "epoch": 3742} {"train_loss": -26.018590927124023, "global_step": 310661, "epoch": 3742} {"train_loss": -25.62356948852539, "global_step": 310662, "epoch": 3742} {"train_loss": -25.491605758666992, "global_step": 310663, "epoch": 3742} {"train_loss": -25.62556266784668, "global_step": 310664, "epoch": 3742} {"train_loss": -25.65865135192871, "global_step": 310665, "epoch": 3742} {"train_loss": -25.789030075073242, "global_step": 310666, "epoch": 3742} {"train_loss": -25.695297241210938, "global_step": 310667, "epoch": 3742} {"train_loss": -25.61984657379518, "global_step": 310668, "epoch": 3742, "val_loss": 7384659.5} {"train_loss": -25.357982635498047, "global_step": 310669, "epoch": 3743} {"train_loss": -25.69207763671875, "global_step": 310670, "epoch": 3743} {"train_loss": -25.603330612182617, "global_step": 310671, "epoch": 3743} {"train_loss": -25.417129516601562, "global_step": 310672, "epoch": 3743} {"train_loss": -25.40608787536621, "global_step": 310673, "epoch": 3743} {"train_loss": -25.451980590820312, "global_step": 310674, "epoch": 3743} {"train_loss": -25.904052734375, "global_step": 310675, "epoch": 3743} {"train_loss": -25.6673526763916, "global_step": 310676, "epoch": 3743} {"train_loss": -25.858261108398438, "global_step": 310677, "epoch": 3743} {"train_loss": -25.92172622680664, "global_step": 310678, "epoch": 3743} {"train_loss": -25.733062744140625, "global_step": 310679, "epoch": 3743} {"train_loss": -26.02857780456543, "global_step": 310680, "epoch": 3743} {"train_loss": -26.242822647094727, "global_step": 310681, "epoch": 3743} {"train_loss": -25.788867950439453, "global_step": 310682, "epoch": 3743} {"train_loss": -25.57758903503418, "global_step": 310683, "epoch": 3743} {"train_loss": -25.834508895874023, "global_step": 310684, "epoch": 3743} {"train_loss": -26.14691734313965, "global_step": 310685, "epoch": 3743} {"train_loss": -26.041656494140625, "global_step": 310686, "epoch": 3743} {"train_loss": -25.746618270874023, "global_step": 310687, "epoch": 3743} {"train_loss": -25.43387794494629, "global_step": 310688, "epoch": 3743} {"train_loss": -25.9531307220459, "global_step": 310689, "epoch": 3743} {"train_loss": -25.70170021057129, "global_step": 310690, "epoch": 3743} {"train_loss": -26.105268478393555, "global_step": 310691, "epoch": 3743} {"train_loss": -25.601469039916992, "global_step": 310692, "epoch": 3743} {"train_loss": -25.770551681518555, "global_step": 310693, "epoch": 3743} {"train_loss": -25.52399253845215, "global_step": 310694, "epoch": 3743} {"train_loss": -25.873767852783203, "global_step": 310695, "epoch": 3743} {"train_loss": -25.81318473815918, "global_step": 310696, "epoch": 3743} {"train_loss": -25.856735229492188, "global_step": 310697, "epoch": 3743} {"train_loss": -25.813867568969727, "global_step": 310698, "epoch": 3743} {"train_loss": -25.60333251953125, "global_step": 310699, "epoch": 3743} {"train_loss": -25.557523727416992, "global_step": 310700, "epoch": 3743} {"train_loss": -25.334016799926758, "global_step": 310701, "epoch": 3743} {"train_loss": -25.651641845703125, "global_step": 310702, "epoch": 3743} {"train_loss": -25.9403018951416, "global_step": 310703, "epoch": 3743} {"train_loss": -25.596391677856445, "global_step": 310704, "epoch": 3743} {"train_loss": -25.451446533203125, "global_step": 310705, "epoch": 3743} {"train_loss": -25.585988998413086, "global_step": 310706, "epoch": 3743} {"train_loss": -25.8359317779541, "global_step": 310707, "epoch": 3743} {"train_loss": -25.745954513549805, "global_step": 310708, "epoch": 3743} {"train_loss": -26.263687133789062, "global_step": 310709, "epoch": 3743} {"train_loss": -25.686857223510742, "global_step": 310710, "epoch": 3743} {"train_loss": -25.920886993408203, "global_step": 310711, "epoch": 3743} {"train_loss": -25.268461227416992, "global_step": 310712, "epoch": 3743} {"train_loss": -25.63404655456543, "global_step": 310713, "epoch": 3743} {"train_loss": -26.050745010375977, "global_step": 310714, "epoch": 3743} {"train_loss": -25.799768447875977, "global_step": 310715, "epoch": 3743} {"train_loss": -25.664508819580078, "global_step": 310716, "epoch": 3743} {"train_loss": -25.27425193786621, "global_step": 310717, "epoch": 3743} {"train_loss": -25.476226806640625, "global_step": 310718, "epoch": 3743} {"train_loss": -25.789764404296875, "global_step": 310719, "epoch": 3743} {"train_loss": -25.95761489868164, "global_step": 310720, "epoch": 3743} {"train_loss": -25.842004776000977, "global_step": 310721, "epoch": 3743} {"train_loss": -25.743467330932617, "global_step": 310722, "epoch": 3743} {"train_loss": -25.565174102783203, "global_step": 310723, "epoch": 3743} {"train_loss": -25.784290313720703, "global_step": 310724, "epoch": 3743} {"train_loss": -25.57794761657715, "global_step": 310725, "epoch": 3743} {"train_loss": -25.8789005279541, "global_step": 310726, "epoch": 3743} {"train_loss": -25.710599899291992, "global_step": 310727, "epoch": 3743} {"train_loss": -26.245758056640625, "global_step": 310728, "epoch": 3743} {"train_loss": -25.891164779663086, "global_step": 310729, "epoch": 3743} {"train_loss": -25.467514038085938, "global_step": 310730, "epoch": 3743} {"train_loss": -25.631622314453125, "global_step": 310731, "epoch": 3743} {"train_loss": -25.78302574157715, "global_step": 310732, "epoch": 3743} {"train_loss": -25.845922470092773, "global_step": 310733, "epoch": 3743} {"train_loss": -26.22992515563965, "global_step": 310734, "epoch": 3743} {"train_loss": -25.86821937561035, "global_step": 310735, "epoch": 3743} {"train_loss": -25.703271865844727, "global_step": 310736, "epoch": 3743} {"train_loss": -25.874958038330078, "global_step": 310737, "epoch": 3743} {"train_loss": -25.851713180541992, "global_step": 310738, "epoch": 3743} {"train_loss": -25.95911979675293, "global_step": 310739, "epoch": 3743} {"train_loss": -26.1954345703125, "global_step": 310740, "epoch": 3743} {"train_loss": -26.21600914001465, "global_step": 310741, "epoch": 3743} {"train_loss": -25.67413902282715, "global_step": 310742, "epoch": 3743} {"train_loss": -25.92047691345215, "global_step": 310743, "epoch": 3743} {"train_loss": -25.69244956970215, "global_step": 310744, "epoch": 3743} {"train_loss": -25.189435958862305, "global_step": 310745, "epoch": 3743} {"train_loss": -25.16127586364746, "global_step": 310746, "epoch": 3743} {"train_loss": -25.113161087036133, "global_step": 310747, "epoch": 3743} {"train_loss": -25.937612533569336, "global_step": 310748, "epoch": 3743} {"train_loss": -25.172317504882812, "global_step": 310749, "epoch": 3743} {"train_loss": -24.94148826599121, "global_step": 310750, "epoch": 3743} {"train_loss": -25.70183117418404, "global_step": 310751, "epoch": 3743, "val_loss": 7263442.0} {"train_loss": -19.292978286743164, "global_step": 310752, "epoch": 3744} {"train_loss": -23.24641990661621, "global_step": 310753, "epoch": 3744} {"train_loss": -22.573972702026367, "global_step": 310754, "epoch": 3744} {"train_loss": -23.37526512145996, "global_step": 310755, "epoch": 3744} {"train_loss": -23.720043182373047, "global_step": 310756, "epoch": 3744} {"train_loss": -23.53938865661621, "global_step": 310757, "epoch": 3744} {"train_loss": -24.21540641784668, "global_step": 310758, "epoch": 3744} {"train_loss": -24.144126892089844, "global_step": 310759, "epoch": 3744} {"train_loss": -23.28073501586914, "global_step": 310760, "epoch": 3744} {"train_loss": -24.004610061645508, "global_step": 310761, "epoch": 3744} {"train_loss": -24.318098068237305, "global_step": 310762, "epoch": 3744} {"train_loss": -24.221221923828125, "global_step": 310763, "epoch": 3744} {"train_loss": -24.165613174438477, "global_step": 310764, "epoch": 3744} {"train_loss": -24.376903533935547, "global_step": 310765, "epoch": 3744} {"train_loss": -24.66322898864746, "global_step": 310766, "epoch": 3744} {"train_loss": -24.45218849182129, "global_step": 310767, "epoch": 3744} {"train_loss": -24.4542179107666, "global_step": 310768, "epoch": 3744} {"train_loss": -24.40410041809082, "global_step": 310769, "epoch": 3744} {"train_loss": -24.314838409423828, "global_step": 310770, "epoch": 3744} {"train_loss": -24.416349411010742, "global_step": 310771, "epoch": 3744} {"train_loss": -25.01410484313965, "global_step": 310772, "epoch": 3744} {"train_loss": -24.703290939331055, "global_step": 310773, "epoch": 3744} {"train_loss": -25.137908935546875, "global_step": 310774, "epoch": 3744} {"train_loss": -25.16969108581543, "global_step": 310775, "epoch": 3744} {"train_loss": -24.9569034576416, "global_step": 310776, "epoch": 3744} {"train_loss": -24.683000564575195, "global_step": 310777, "epoch": 3744} {"train_loss": -24.56904411315918, "global_step": 310778, "epoch": 3744} {"train_loss": -25.246673583984375, "global_step": 310779, "epoch": 3744} {"train_loss": -25.059368133544922, "global_step": 310780, "epoch": 3744} {"train_loss": -25.012182235717773, "global_step": 310781, "epoch": 3744} {"train_loss": -25.148405075073242, "global_step": 310782, "epoch": 3744} {"train_loss": -25.03914451599121, "global_step": 310783, "epoch": 3744} {"train_loss": -25.11359977722168, "global_step": 310784, "epoch": 3744} {"train_loss": -25.61248779296875, "global_step": 310785, "epoch": 3744} {"train_loss": -25.106647491455078, "global_step": 310786, "epoch": 3744} {"train_loss": -25.2874813079834, "global_step": 310787, "epoch": 3744} {"train_loss": -25.39356803894043, "global_step": 310788, "epoch": 3744} {"train_loss": -25.611682891845703, "global_step": 310789, "epoch": 3744} {"train_loss": -25.30301284790039, "global_step": 310790, "epoch": 3744} {"train_loss": -25.54151725769043, "global_step": 310791, "epoch": 3744} {"train_loss": -25.60517692565918, "global_step": 310792, "epoch": 3744} {"train_loss": -25.348119735717773, "global_step": 310793, "epoch": 3744} {"train_loss": -25.170726776123047, "global_step": 310794, "epoch": 3744} {"train_loss": -25.361473083496094, "global_step": 310795, "epoch": 3744} {"train_loss": -25.79911231994629, "global_step": 310796, "epoch": 3744} {"train_loss": -25.905920028686523, "global_step": 310797, "epoch": 3744} {"train_loss": -25.66474723815918, "global_step": 310798, "epoch": 3744} {"train_loss": -25.419870376586914, "global_step": 310799, "epoch": 3744} {"train_loss": -25.810138702392578, "global_step": 310800, "epoch": 3744} {"train_loss": -25.750274658203125, "global_step": 310801, "epoch": 3744} {"train_loss": -25.600574493408203, "global_step": 310802, "epoch": 3744} {"train_loss": -25.700637817382812, "global_step": 310803, "epoch": 3744} {"train_loss": -25.76739501953125, "global_step": 310804, "epoch": 3744} {"train_loss": -25.356842041015625, "global_step": 310805, "epoch": 3744} {"train_loss": -25.577388763427734, "global_step": 310806, "epoch": 3744} {"train_loss": -25.187259674072266, "global_step": 310807, "epoch": 3744} {"train_loss": -25.814102172851562, "global_step": 310808, "epoch": 3744} {"train_loss": -25.5421199798584, "global_step": 310809, "epoch": 3744} {"train_loss": -25.63056755065918, "global_step": 310810, "epoch": 3744} {"train_loss": -25.84132194519043, "global_step": 310811, "epoch": 3744} {"train_loss": -25.58795738220215, "global_step": 310812, "epoch": 3744} {"train_loss": -25.3538875579834, "global_step": 310813, "epoch": 3744} {"train_loss": -25.977664947509766, "global_step": 310814, "epoch": 3744} {"train_loss": -26.008420944213867, "global_step": 310815, "epoch": 3744} {"train_loss": -25.76301383972168, "global_step": 310816, "epoch": 3744} {"train_loss": -25.615156173706055, "global_step": 310817, "epoch": 3744} {"train_loss": -25.397106170654297, "global_step": 310818, "epoch": 3744} {"train_loss": -25.164785385131836, "global_step": 310819, "epoch": 3744} {"train_loss": -25.537158966064453, "global_step": 310820, "epoch": 3744} {"train_loss": -25.598676681518555, "global_step": 310821, "epoch": 3744} {"train_loss": -25.598487854003906, "global_step": 310822, "epoch": 3744} {"train_loss": -25.48463249206543, "global_step": 310823, "epoch": 3744} {"train_loss": -25.9589900970459, "global_step": 310824, "epoch": 3744} {"train_loss": -25.671630859375, "global_step": 310825, "epoch": 3744} {"train_loss": -25.663116455078125, "global_step": 310826, "epoch": 3744} {"train_loss": -25.722339630126953, "global_step": 310827, "epoch": 3744} {"train_loss": -25.610952377319336, "global_step": 310828, "epoch": 3744} {"train_loss": -25.451568603515625, "global_step": 310829, "epoch": 3744} {"train_loss": -25.570114135742188, "global_step": 310830, "epoch": 3744} {"train_loss": -25.68313980102539, "global_step": 310831, "epoch": 3744} {"train_loss": -25.58453369140625, "global_step": 310832, "epoch": 3744} {"train_loss": -25.823972702026367, "global_step": 310833, "epoch": 3744} {"train_loss": -25.06577275747276, "global_step": 310834, "epoch": 3744, "val_loss": 7424552.5} {"train_loss": -23.53238868713379, "global_step": 310835, "epoch": 3745} {"train_loss": -24.051849365234375, "global_step": 310836, "epoch": 3745} {"train_loss": -25.10092544555664, "global_step": 310837, "epoch": 3745} {"train_loss": -24.298246383666992, "global_step": 310838, "epoch": 3745} {"train_loss": -24.639225006103516, "global_step": 310839, "epoch": 3745} {"train_loss": -24.922204971313477, "global_step": 310840, "epoch": 3745} {"train_loss": -24.839990615844727, "global_step": 310841, "epoch": 3745} {"train_loss": -25.32325553894043, "global_step": 310842, "epoch": 3745} {"train_loss": -24.58744239807129, "global_step": 310843, "epoch": 3745} {"train_loss": -25.08328628540039, "global_step": 310844, "epoch": 3745} {"train_loss": -24.99985694885254, "global_step": 310845, "epoch": 3745} {"train_loss": -25.28849220275879, "global_step": 310846, "epoch": 3745} {"train_loss": -25.045629501342773, "global_step": 310847, "epoch": 3745} {"train_loss": -25.48262596130371, "global_step": 310848, "epoch": 3745} {"train_loss": -25.506372451782227, "global_step": 310849, "epoch": 3745} {"train_loss": -25.33318328857422, "global_step": 310850, "epoch": 3745} {"train_loss": -25.30097007751465, "global_step": 310851, "epoch": 3745} {"train_loss": -25.359838485717773, "global_step": 310852, "epoch": 3745} {"train_loss": -24.85721778869629, "global_step": 310853, "epoch": 3745} {"train_loss": -25.367963790893555, "global_step": 310854, "epoch": 3745} {"train_loss": -25.424955368041992, "global_step": 310855, "epoch": 3745} {"train_loss": -25.702661514282227, "global_step": 310856, "epoch": 3745} {"train_loss": -25.854475021362305, "global_step": 310857, "epoch": 3745} {"train_loss": -25.635541915893555, "global_step": 310858, "epoch": 3745} {"train_loss": -25.65458106994629, "global_step": 310859, "epoch": 3745} {"train_loss": -25.500080108642578, "global_step": 310860, "epoch": 3745} {"train_loss": -25.523401260375977, "global_step": 310861, "epoch": 3745} {"train_loss": -25.574289321899414, "global_step": 310862, "epoch": 3745} {"train_loss": -25.748249053955078, "global_step": 310863, "epoch": 3745} {"train_loss": -25.861806869506836, "global_step": 310864, "epoch": 3745} {"train_loss": -25.981586456298828, "global_step": 310865, "epoch": 3745} {"train_loss": -25.628284454345703, "global_step": 310866, "epoch": 3745} {"train_loss": -25.972278594970703, "global_step": 310867, "epoch": 3745} {"train_loss": -25.53447914123535, "global_step": 310868, "epoch": 3745} {"train_loss": -25.664541244506836, "global_step": 310869, "epoch": 3745} {"train_loss": -25.780426025390625, "global_step": 310870, "epoch": 3745} {"train_loss": -25.27998924255371, "global_step": 310871, "epoch": 3745} {"train_loss": -25.511003494262695, "global_step": 310872, "epoch": 3745} {"train_loss": -25.594717025756836, "global_step": 310873, "epoch": 3745} {"train_loss": -26.001317977905273, "global_step": 310874, "epoch": 3745} {"train_loss": -25.928375244140625, "global_step": 310875, "epoch": 3745} {"train_loss": -25.741968154907227, "global_step": 310876, "epoch": 3745} {"train_loss": -25.551984786987305, "global_step": 310877, "epoch": 3745} {"train_loss": -25.8811092376709, "global_step": 310878, "epoch": 3745} {"train_loss": -25.985563278198242, "global_step": 310879, "epoch": 3745} {"train_loss": -25.84492301940918, "global_step": 310880, "epoch": 3745} {"train_loss": -25.8308048248291, "global_step": 310881, "epoch": 3745} {"train_loss": -25.940637588500977, "global_step": 310882, "epoch": 3745} {"train_loss": -25.915998458862305, "global_step": 310883, "epoch": 3745} {"train_loss": -26.019454956054688, "global_step": 310884, "epoch": 3745} {"train_loss": -25.708959579467773, "global_step": 310885, "epoch": 3745} {"train_loss": -26.02986717224121, "global_step": 310886, "epoch": 3745} {"train_loss": -25.8526668548584, "global_step": 310887, "epoch": 3745} {"train_loss": -25.624631881713867, "global_step": 310888, "epoch": 3745} {"train_loss": -26.2325382232666, "global_step": 310889, "epoch": 3745} {"train_loss": -26.005414962768555, "global_step": 310890, "epoch": 3745} {"train_loss": -25.97486686706543, "global_step": 310891, "epoch": 3745} {"train_loss": -25.9164981842041, "global_step": 310892, "epoch": 3745} {"train_loss": -26.12640380859375, "global_step": 310893, "epoch": 3745} {"train_loss": -25.484338760375977, "global_step": 310894, "epoch": 3745} {"train_loss": -25.691974639892578, "global_step": 310895, "epoch": 3745} {"train_loss": -25.93134880065918, "global_step": 310896, "epoch": 3745} {"train_loss": -25.756668090820312, "global_step": 310897, "epoch": 3745} {"train_loss": -25.594789505004883, "global_step": 310898, "epoch": 3745} {"train_loss": -26.091739654541016, "global_step": 310899, "epoch": 3745} {"train_loss": -26.078689575195312, "global_step": 310900, "epoch": 3745} {"train_loss": -25.90768814086914, "global_step": 310901, "epoch": 3745} {"train_loss": -25.416709899902344, "global_step": 310902, "epoch": 3745} {"train_loss": -25.623701095581055, "global_step": 310903, "epoch": 3745} {"train_loss": -25.525876998901367, "global_step": 310904, "epoch": 3745} {"train_loss": -25.4666805267334, "global_step": 310905, "epoch": 3745} {"train_loss": -25.244443893432617, "global_step": 310906, "epoch": 3745} {"train_loss": -25.726858139038086, "global_step": 310907, "epoch": 3745} {"train_loss": -25.740400314331055, "global_step": 310908, "epoch": 3745} {"train_loss": -25.41067886352539, "global_step": 310909, "epoch": 3745} {"train_loss": -25.374311447143555, "global_step": 310910, "epoch": 3745} {"train_loss": -25.86322593688965, "global_step": 310911, "epoch": 3745} {"train_loss": -25.746973037719727, "global_step": 310912, "epoch": 3745} {"train_loss": -25.29594612121582, "global_step": 310913, "epoch": 3745} {"train_loss": -25.946369171142578, "global_step": 310914, "epoch": 3745} {"train_loss": -25.584537506103516, "global_step": 310915, "epoch": 3745} {"train_loss": -25.79534339904785, "global_step": 310916, "epoch": 3745} {"train_loss": -25.53564476105104, "global_step": 310917, "epoch": 3745, "val_loss": 7343459.0} {"train_loss": -25.201562881469727, "global_step": 310918, "epoch": 3746} {"train_loss": -25.376564025878906, "global_step": 310919, "epoch": 3746} {"train_loss": -25.274133682250977, "global_step": 310920, "epoch": 3746} {"train_loss": -25.06468391418457, "global_step": 310921, "epoch": 3746} {"train_loss": -25.218460083007812, "global_step": 310922, "epoch": 3746} {"train_loss": -25.558712005615234, "global_step": 310923, "epoch": 3746} {"train_loss": -25.197248458862305, "global_step": 310924, "epoch": 3746} {"train_loss": -25.26906394958496, "global_step": 310925, "epoch": 3746} {"train_loss": -25.340627670288086, "global_step": 310926, "epoch": 3746} {"train_loss": -25.86501121520996, "global_step": 310927, "epoch": 3746} {"train_loss": -25.8763484954834, "global_step": 310928, "epoch": 3746} {"train_loss": -25.392353057861328, "global_step": 310929, "epoch": 3746} {"train_loss": -25.72736930847168, "global_step": 310930, "epoch": 3746} {"train_loss": -25.61567497253418, "global_step": 310931, "epoch": 3746} {"train_loss": -25.455102920532227, "global_step": 310932, "epoch": 3746} {"train_loss": -25.535205841064453, "global_step": 310933, "epoch": 3746} {"train_loss": -25.753503799438477, "global_step": 310934, "epoch": 3746} {"train_loss": -25.67527198791504, "global_step": 310935, "epoch": 3746} {"train_loss": -25.57659149169922, "global_step": 310936, "epoch": 3746} {"train_loss": -25.88825035095215, "global_step": 310937, "epoch": 3746} {"train_loss": -26.061420440673828, "global_step": 310938, "epoch": 3746} {"train_loss": -25.618314743041992, "global_step": 310939, "epoch": 3746} {"train_loss": -25.831480026245117, "global_step": 310940, "epoch": 3746} {"train_loss": -25.986602783203125, "global_step": 310941, "epoch": 3746} {"train_loss": -25.712677001953125, "global_step": 310942, "epoch": 3746} {"train_loss": -25.5873966217041, "global_step": 310943, "epoch": 3746} {"train_loss": -26.034149169921875, "global_step": 310944, "epoch": 3746} {"train_loss": -25.84034538269043, "global_step": 310945, "epoch": 3746} {"train_loss": -25.481523513793945, "global_step": 310946, "epoch": 3746} {"train_loss": -25.9780216217041, "global_step": 310947, "epoch": 3746} {"train_loss": -25.976896286010742, "global_step": 310948, "epoch": 3746} {"train_loss": -25.977645874023438, "global_step": 310949, "epoch": 3746} {"train_loss": -25.971418380737305, "global_step": 310950, "epoch": 3746} {"train_loss": -25.58310890197754, "global_step": 310951, "epoch": 3746} {"train_loss": -25.688617706298828, "global_step": 310952, "epoch": 3746} {"train_loss": -25.866968154907227, "global_step": 310953, "epoch": 3746} {"train_loss": -25.798114776611328, "global_step": 310954, "epoch": 3746} {"train_loss": -25.8365421295166, "global_step": 310955, "epoch": 3746} {"train_loss": -25.89668846130371, "global_step": 310956, "epoch": 3746} {"train_loss": -25.840576171875, "global_step": 310957, "epoch": 3746} {"train_loss": -25.7023983001709, "global_step": 310958, "epoch": 3746} {"train_loss": -26.008106231689453, "global_step": 310959, "epoch": 3746} {"train_loss": -25.699934005737305, "global_step": 310960, "epoch": 3746} {"train_loss": -26.00318717956543, "global_step": 310961, "epoch": 3746} {"train_loss": -25.925434112548828, "global_step": 310962, "epoch": 3746} {"train_loss": -25.82504653930664, "global_step": 310963, "epoch": 3746} {"train_loss": -25.7370548248291, "global_step": 310964, "epoch": 3746} {"train_loss": -25.915220260620117, "global_step": 310965, "epoch": 3746} {"train_loss": -26.06707191467285, "global_step": 310966, "epoch": 3746} {"train_loss": -25.939924240112305, "global_step": 310967, "epoch": 3746} {"train_loss": -25.79912757873535, "global_step": 310968, "epoch": 3746} {"train_loss": -25.48381996154785, "global_step": 310969, "epoch": 3746} {"train_loss": -25.629636764526367, "global_step": 310970, "epoch": 3746} {"train_loss": -25.95889663696289, "global_step": 310971, "epoch": 3746} {"train_loss": -25.53398895263672, "global_step": 310972, "epoch": 3746} {"train_loss": -25.868457794189453, "global_step": 310973, "epoch": 3746} {"train_loss": -25.7407169342041, "global_step": 310974, "epoch": 3746} {"train_loss": -26.127782821655273, "global_step": 310975, "epoch": 3746} {"train_loss": -26.00420570373535, "global_step": 310976, "epoch": 3746} {"train_loss": -25.85072135925293, "global_step": 310977, "epoch": 3746} {"train_loss": -25.43854331970215, "global_step": 310978, "epoch": 3746} {"train_loss": -25.752859115600586, "global_step": 310979, "epoch": 3746} {"train_loss": -25.630868911743164, "global_step": 310980, "epoch": 3746} {"train_loss": -25.960309982299805, "global_step": 310981, "epoch": 3746} {"train_loss": -25.798383712768555, "global_step": 310982, "epoch": 3746} {"train_loss": -25.948993682861328, "global_step": 310983, "epoch": 3746} {"train_loss": -25.64019775390625, "global_step": 310984, "epoch": 3746} {"train_loss": -25.905649185180664, "global_step": 310985, "epoch": 3746} {"train_loss": -25.73172378540039, "global_step": 310986, "epoch": 3746} {"train_loss": -25.72931480407715, "global_step": 310987, "epoch": 3746} {"train_loss": -25.818185806274414, "global_step": 310988, "epoch": 3746} {"train_loss": -25.856836318969727, "global_step": 310989, "epoch": 3746} {"train_loss": -25.763687133789062, "global_step": 310990, "epoch": 3746} {"train_loss": -25.873483657836914, "global_step": 310991, "epoch": 3746} {"train_loss": -25.89381980895996, "global_step": 310992, "epoch": 3746} {"train_loss": -25.554218292236328, "global_step": 310993, "epoch": 3746} {"train_loss": -26.014760971069336, "global_step": 310994, "epoch": 3746} {"train_loss": -25.74574089050293, "global_step": 310995, "epoch": 3746} {"train_loss": -25.898218154907227, "global_step": 310996, "epoch": 3746} {"train_loss": -25.679548263549805, "global_step": 310997, "epoch": 3746} {"train_loss": -25.938825607299805, "global_step": 310998, "epoch": 3746} {"train_loss": -26.130842208862305, "global_step": 310999, "epoch": 3746} {"train_loss": -25.746913197528887, "global_step": 311000, "epoch": 3746, "val_loss": 7254222.0} {"train_loss": -25.3836727142334, "global_step": 311001, "epoch": 3747} {"train_loss": -24.81904411315918, "global_step": 311002, "epoch": 3747} {"train_loss": -25.13976287841797, "global_step": 311003, "epoch": 3747} {"train_loss": -24.920543670654297, "global_step": 311004, "epoch": 3747} {"train_loss": -25.46225929260254, "global_step": 311005, "epoch": 3747} {"train_loss": -24.81103515625, "global_step": 311006, "epoch": 3747} {"train_loss": -24.29041862487793, "global_step": 311007, "epoch": 3747} {"train_loss": -24.9757137298584, "global_step": 311008, "epoch": 3747} {"train_loss": -25.322357177734375, "global_step": 311009, "epoch": 3747} {"train_loss": -24.984220504760742, "global_step": 311010, "epoch": 3747} {"train_loss": -25.228872299194336, "global_step": 311011, "epoch": 3747} {"train_loss": -25.554052352905273, "global_step": 311012, "epoch": 3747} {"train_loss": -25.258447647094727, "global_step": 311013, "epoch": 3747} {"train_loss": -25.27651596069336, "global_step": 311014, "epoch": 3747} {"train_loss": -25.264982223510742, "global_step": 311015, "epoch": 3747} {"train_loss": -25.120927810668945, "global_step": 311016, "epoch": 3747} {"train_loss": -25.450300216674805, "global_step": 311017, "epoch": 3747} {"train_loss": -25.763254165649414, "global_step": 311018, "epoch": 3747} {"train_loss": -25.408111572265625, "global_step": 311019, "epoch": 3747} {"train_loss": -25.436389923095703, "global_step": 311020, "epoch": 3747} {"train_loss": -25.75909423828125, "global_step": 311021, "epoch": 3747} {"train_loss": -25.519433975219727, "global_step": 311022, "epoch": 3747} {"train_loss": -25.737924575805664, "global_step": 311023, "epoch": 3747} {"train_loss": -25.66071891784668, "global_step": 311024, "epoch": 3747} {"train_loss": -25.594789505004883, "global_step": 311025, "epoch": 3747} {"train_loss": -26.027631759643555, "global_step": 311026, "epoch": 3747} {"train_loss": -25.5430908203125, "global_step": 311027, "epoch": 3747} {"train_loss": -25.777515411376953, "global_step": 311028, "epoch": 3747} {"train_loss": -26.075414657592773, "global_step": 311029, "epoch": 3747} {"train_loss": -25.898151397705078, "global_step": 311030, "epoch": 3747} {"train_loss": -25.527692794799805, "global_step": 311031, "epoch": 3747} {"train_loss": -25.933887481689453, "global_step": 311032, "epoch": 3747} {"train_loss": -25.89900016784668, "global_step": 311033, "epoch": 3747} {"train_loss": -25.392385482788086, "global_step": 311034, "epoch": 3747} {"train_loss": -25.750812530517578, "global_step": 311035, "epoch": 3747} {"train_loss": -25.601486206054688, "global_step": 311036, "epoch": 3747} {"train_loss": -26.15570068359375, "global_step": 311037, "epoch": 3747} {"train_loss": -25.910648345947266, "global_step": 311038, "epoch": 3747} {"train_loss": -25.85151481628418, "global_step": 311039, "epoch": 3747} {"train_loss": -25.76971435546875, "global_step": 311040, "epoch": 3747} {"train_loss": -25.95073890686035, "global_step": 311041, "epoch": 3747} {"train_loss": -25.630529403686523, "global_step": 311042, "epoch": 3747} {"train_loss": -26.153844833374023, "global_step": 311043, "epoch": 3747} {"train_loss": -25.73438835144043, "global_step": 311044, "epoch": 3747} {"train_loss": -25.741689682006836, "global_step": 311045, "epoch": 3747} {"train_loss": -25.881601333618164, "global_step": 311046, "epoch": 3747} {"train_loss": -26.108154296875, "global_step": 311047, "epoch": 3747} {"train_loss": -25.985395431518555, "global_step": 311048, "epoch": 3747} {"train_loss": -25.804105758666992, "global_step": 311049, "epoch": 3747} {"train_loss": -25.762134552001953, "global_step": 311050, "epoch": 3747} {"train_loss": -25.71967887878418, "global_step": 311051, "epoch": 3747} {"train_loss": -25.83025550842285, "global_step": 311052, "epoch": 3747} {"train_loss": -25.64007568359375, "global_step": 311053, "epoch": 3747} {"train_loss": -25.872425079345703, "global_step": 311054, "epoch": 3747} {"train_loss": -25.8543701171875, "global_step": 311055, "epoch": 3747} {"train_loss": -25.463397979736328, "global_step": 311056, "epoch": 3747} {"train_loss": -25.7088680267334, "global_step": 311057, "epoch": 3747} {"train_loss": -25.42762565612793, "global_step": 311058, "epoch": 3747} {"train_loss": -26.183425903320312, "global_step": 311059, "epoch": 3747} {"train_loss": -25.74065589904785, "global_step": 311060, "epoch": 3747} {"train_loss": -25.535261154174805, "global_step": 311061, "epoch": 3747} {"train_loss": -25.56749153137207, "global_step": 311062, "epoch": 3747} {"train_loss": -25.691577911376953, "global_step": 311063, "epoch": 3747} {"train_loss": -26.111698150634766, "global_step": 311064, "epoch": 3747} {"train_loss": -25.97014808654785, "global_step": 311065, "epoch": 3747} {"train_loss": -25.756824493408203, "global_step": 311066, "epoch": 3747} {"train_loss": -25.177165985107422, "global_step": 311067, "epoch": 3747} {"train_loss": -25.364166259765625, "global_step": 311068, "epoch": 3747} {"train_loss": -25.9996395111084, "global_step": 311069, "epoch": 3747} {"train_loss": -25.72975730895996, "global_step": 311070, "epoch": 3747} {"train_loss": -25.8041934967041, "global_step": 311071, "epoch": 3747} {"train_loss": -25.938323974609375, "global_step": 311072, "epoch": 3747} {"train_loss": -25.498010635375977, "global_step": 311073, "epoch": 3747} {"train_loss": -25.877103805541992, "global_step": 311074, "epoch": 3747} {"train_loss": -25.62537956237793, "global_step": 311075, "epoch": 3747} {"train_loss": -25.90138816833496, "global_step": 311076, "epoch": 3747} {"train_loss": -26.32159996032715, "global_step": 311077, "epoch": 3747} {"train_loss": -25.600988388061523, "global_step": 311078, "epoch": 3747} {"train_loss": -25.232831954956055, "global_step": 311079, "epoch": 3747} {"train_loss": -25.69817543029785, "global_step": 311080, "epoch": 3747} {"train_loss": -25.892414093017578, "global_step": 311081, "epoch": 3747} {"train_loss": -25.61115837097168, "global_step": 311082, "epoch": 3747} {"train_loss": -25.641886033207538, "global_step": 311083, "epoch": 3747, "val_loss": 7255119.5} {"train_loss": -25.411672592163086, "global_step": 311084, "epoch": 3748} {"train_loss": -25.433658599853516, "global_step": 311085, "epoch": 3748} {"train_loss": -25.525793075561523, "global_step": 311086, "epoch": 3748} {"train_loss": -25.401447296142578, "global_step": 311087, "epoch": 3748} {"train_loss": -25.436405181884766, "global_step": 311088, "epoch": 3748} {"train_loss": -25.5079402923584, "global_step": 311089, "epoch": 3748} {"train_loss": -25.381929397583008, "global_step": 311090, "epoch": 3748} {"train_loss": -25.51216697692871, "global_step": 311091, "epoch": 3748} {"train_loss": -25.8430118560791, "global_step": 311092, "epoch": 3748} {"train_loss": -25.808277130126953, "global_step": 311093, "epoch": 3748} {"train_loss": -25.83259391784668, "global_step": 311094, "epoch": 3748} {"train_loss": -25.753009796142578, "global_step": 311095, "epoch": 3748} {"train_loss": -25.865385055541992, "global_step": 311096, "epoch": 3748} {"train_loss": -25.850433349609375, "global_step": 311097, "epoch": 3748} {"train_loss": -25.79254150390625, "global_step": 311098, "epoch": 3748} {"train_loss": -26.001449584960938, "global_step": 311099, "epoch": 3748} {"train_loss": -26.024276733398438, "global_step": 311100, "epoch": 3748} {"train_loss": -25.9910831451416, "global_step": 311101, "epoch": 3748} {"train_loss": -26.03350830078125, "global_step": 311102, "epoch": 3748} {"train_loss": -26.058307647705078, "global_step": 311103, "epoch": 3748} {"train_loss": -25.80428123474121, "global_step": 311104, "epoch": 3748} {"train_loss": -25.89991569519043, "global_step": 311105, "epoch": 3748} {"train_loss": -25.808950424194336, "global_step": 311106, "epoch": 3748} {"train_loss": -25.722064971923828, "global_step": 311107, "epoch": 3748} {"train_loss": -26.143238067626953, "global_step": 311108, "epoch": 3748} {"train_loss": -25.796951293945312, "global_step": 311109, "epoch": 3748} {"train_loss": -26.1455078125, "global_step": 311110, "epoch": 3748} {"train_loss": -25.808576583862305, "global_step": 311111, "epoch": 3748} {"train_loss": -25.801788330078125, "global_step": 311112, "epoch": 3748} {"train_loss": -26.16455078125, "global_step": 311113, "epoch": 3748} {"train_loss": -25.5806827545166, "global_step": 311114, "epoch": 3748} {"train_loss": -25.673816680908203, "global_step": 311115, "epoch": 3748} {"train_loss": -25.228595733642578, "global_step": 311116, "epoch": 3748} {"train_loss": -25.31156349182129, "global_step": 311117, "epoch": 3748} {"train_loss": -25.97723388671875, "global_step": 311118, "epoch": 3748} {"train_loss": -25.340286254882812, "global_step": 311119, "epoch": 3748} {"train_loss": -25.27829933166504, "global_step": 311120, "epoch": 3748} {"train_loss": -25.818998336791992, "global_step": 311121, "epoch": 3748} {"train_loss": -25.305492401123047, "global_step": 311122, "epoch": 3748} {"train_loss": -25.3250789642334, "global_step": 311123, "epoch": 3748} {"train_loss": -25.403812408447266, "global_step": 311124, "epoch": 3748} {"train_loss": -25.387365341186523, "global_step": 311125, "epoch": 3748} {"train_loss": -25.127824783325195, "global_step": 311126, "epoch": 3748} {"train_loss": -25.29334831237793, "global_step": 311127, "epoch": 3748} {"train_loss": -25.874237060546875, "global_step": 311128, "epoch": 3748} {"train_loss": -25.287322998046875, "global_step": 311129, "epoch": 3748} {"train_loss": -25.687177658081055, "global_step": 311130, "epoch": 3748} {"train_loss": -25.435205459594727, "global_step": 311131, "epoch": 3748} {"train_loss": -25.59247589111328, "global_step": 311132, "epoch": 3748} {"train_loss": -25.46563148498535, "global_step": 311133, "epoch": 3748} {"train_loss": -26.04750633239746, "global_step": 311134, "epoch": 3748} {"train_loss": -25.470932006835938, "global_step": 311135, "epoch": 3748} {"train_loss": -25.731708526611328, "global_step": 311136, "epoch": 3748} {"train_loss": -25.807926177978516, "global_step": 311137, "epoch": 3748} {"train_loss": -25.36746597290039, "global_step": 311138, "epoch": 3748} {"train_loss": -25.862497329711914, "global_step": 311139, "epoch": 3748} {"train_loss": -25.697229385375977, "global_step": 311140, "epoch": 3748} {"train_loss": -25.65608024597168, "global_step": 311141, "epoch": 3748} {"train_loss": -25.766584396362305, "global_step": 311142, "epoch": 3748} {"train_loss": -25.653356552124023, "global_step": 311143, "epoch": 3748} {"train_loss": -25.256895065307617, "global_step": 311144, "epoch": 3748} {"train_loss": -25.922897338867188, "global_step": 311145, "epoch": 3748} {"train_loss": -25.71213150024414, "global_step": 311146, "epoch": 3748} {"train_loss": -25.726181030273438, "global_step": 311147, "epoch": 3748} {"train_loss": -25.765045166015625, "global_step": 311148, "epoch": 3748} {"train_loss": -25.929004669189453, "global_step": 311149, "epoch": 3748} {"train_loss": -25.982725143432617, "global_step": 311150, "epoch": 3748} {"train_loss": -25.952960968017578, "global_step": 311151, "epoch": 3748} {"train_loss": -25.837249755859375, "global_step": 311152, "epoch": 3748} {"train_loss": -25.70208168029785, "global_step": 311153, "epoch": 3748} {"train_loss": -25.96795654296875, "global_step": 311154, "epoch": 3748} {"train_loss": -25.91855239868164, "global_step": 311155, "epoch": 3748} {"train_loss": -25.74407958984375, "global_step": 311156, "epoch": 3748} {"train_loss": -26.064237594604492, "global_step": 311157, "epoch": 3748} {"train_loss": -25.86054801940918, "global_step": 311158, "epoch": 3748} {"train_loss": -25.883930206298828, "global_step": 311159, "epoch": 3748} {"train_loss": -25.757282257080078, "global_step": 311160, "epoch": 3748} {"train_loss": -26.020532608032227, "global_step": 311161, "epoch": 3748} {"train_loss": -25.993452072143555, "global_step": 311162, "epoch": 3748} {"train_loss": -25.8644962310791, "global_step": 311163, "epoch": 3748} {"train_loss": -25.777048110961914, "global_step": 311164, "epoch": 3748} {"train_loss": -25.681386947631836, "global_step": 311165, "epoch": 3748} {"train_loss": -25.709805660937207, "global_step": 311166, "epoch": 3748, "val_loss": 7222625.0} {"train_loss": -24.79341697692871, "global_step": 311167, "epoch": 3749} {"train_loss": -24.77899169921875, "global_step": 311168, "epoch": 3749} {"train_loss": -25.008115768432617, "global_step": 311169, "epoch": 3749} {"train_loss": -25.32977294921875, "global_step": 311170, "epoch": 3749} {"train_loss": -25.507102966308594, "global_step": 311171, "epoch": 3749} {"train_loss": -25.210004806518555, "global_step": 311172, "epoch": 3749} {"train_loss": -25.510650634765625, "global_step": 311173, "epoch": 3749} {"train_loss": -25.499570846557617, "global_step": 311174, "epoch": 3749} {"train_loss": -25.58123016357422, "global_step": 311175, "epoch": 3749} {"train_loss": -25.133499145507812, "global_step": 311176, "epoch": 3749} {"train_loss": -25.334630966186523, "global_step": 311177, "epoch": 3749} {"train_loss": -25.690229415893555, "global_step": 311178, "epoch": 3749} {"train_loss": -25.367630004882812, "global_step": 311179, "epoch": 3749} {"train_loss": -24.998126983642578, "global_step": 311180, "epoch": 3749} {"train_loss": -25.614856719970703, "global_step": 311181, "epoch": 3749} {"train_loss": -25.305187225341797, "global_step": 311182, "epoch": 3749} {"train_loss": -25.333805084228516, "global_step": 311183, "epoch": 3749} {"train_loss": -25.629501342773438, "global_step": 311184, "epoch": 3749} {"train_loss": -25.573957443237305, "global_step": 311185, "epoch": 3749} {"train_loss": -25.425247192382812, "global_step": 311186, "epoch": 3749} {"train_loss": -25.618209838867188, "global_step": 311187, "epoch": 3749} {"train_loss": -25.9632568359375, "global_step": 311188, "epoch": 3749} {"train_loss": -25.819738388061523, "global_step": 311189, "epoch": 3749} {"train_loss": -25.853124618530273, "global_step": 311190, "epoch": 3749} {"train_loss": -25.8669490814209, "global_step": 311191, "epoch": 3749} {"train_loss": -25.73919677734375, "global_step": 311192, "epoch": 3749} {"train_loss": -25.651885986328125, "global_step": 311193, "epoch": 3749} {"train_loss": -25.85059928894043, "global_step": 311194, "epoch": 3749} {"train_loss": -25.574735641479492, "global_step": 311195, "epoch": 3749} {"train_loss": -25.536359786987305, "global_step": 311196, "epoch": 3749} {"train_loss": -25.79490089416504, "global_step": 311197, "epoch": 3749} {"train_loss": -25.646848678588867, "global_step": 311198, "epoch": 3749} {"train_loss": -26.044031143188477, "global_step": 311199, "epoch": 3749} {"train_loss": -25.70939064025879, "global_step": 311200, "epoch": 3749} {"train_loss": -25.99555015563965, "global_step": 311201, "epoch": 3749} {"train_loss": -25.641733169555664, "global_step": 311202, "epoch": 3749} {"train_loss": -25.980939865112305, "global_step": 311203, "epoch": 3749} {"train_loss": -25.731372833251953, "global_step": 311204, "epoch": 3749} {"train_loss": -26.121906280517578, "global_step": 311205, "epoch": 3749} {"train_loss": -26.035964965820312, "global_step": 311206, "epoch": 3749} {"train_loss": -25.784162521362305, "global_step": 311207, "epoch": 3749} {"train_loss": -25.931171417236328, "global_step": 311208, "epoch": 3749} {"train_loss": -25.966400146484375, "global_step": 311209, "epoch": 3749} {"train_loss": -26.499921798706055, "global_step": 311210, "epoch": 3749} {"train_loss": -25.56523323059082, "global_step": 311211, "epoch": 3749} {"train_loss": -25.803497314453125, "global_step": 311212, "epoch": 3749} {"train_loss": -25.43697166442871, "global_step": 311213, "epoch": 3749} {"train_loss": -26.2219181060791, "global_step": 311214, "epoch": 3749} {"train_loss": -25.806787490844727, "global_step": 311215, "epoch": 3749} {"train_loss": -25.927509307861328, "global_step": 311216, "epoch": 3749} {"train_loss": -25.979888916015625, "global_step": 311217, "epoch": 3749} {"train_loss": -25.93231201171875, "global_step": 311218, "epoch": 3749} {"train_loss": -26.053953170776367, "global_step": 311219, "epoch": 3749} {"train_loss": -25.966522216796875, "global_step": 311220, "epoch": 3749} {"train_loss": -25.558238983154297, "global_step": 311221, "epoch": 3749} {"train_loss": -25.549402236938477, "global_step": 311222, "epoch": 3749} {"train_loss": -25.570213317871094, "global_step": 311223, "epoch": 3749} {"train_loss": -25.76708984375, "global_step": 311224, "epoch": 3749} {"train_loss": -25.595266342163086, "global_step": 311225, "epoch": 3749} {"train_loss": -25.88935661315918, "global_step": 311226, "epoch": 3749} {"train_loss": -25.886749267578125, "global_step": 311227, "epoch": 3749} {"train_loss": -26.217702865600586, "global_step": 311228, "epoch": 3749} {"train_loss": -25.67928123474121, "global_step": 311229, "epoch": 3749} {"train_loss": -26.307275772094727, "global_step": 311230, "epoch": 3749} {"train_loss": -25.74808692932129, "global_step": 311231, "epoch": 3749} {"train_loss": -25.764310836791992, "global_step": 311232, "epoch": 3749} {"train_loss": -25.50966453552246, "global_step": 311233, "epoch": 3749} {"train_loss": -25.200429916381836, "global_step": 311234, "epoch": 3749} {"train_loss": -25.559751510620117, "global_step": 311235, "epoch": 3749} {"train_loss": -25.791324615478516, "global_step": 311236, "epoch": 3749} {"train_loss": -25.52239227294922, "global_step": 311237, "epoch": 3749} {"train_loss": -25.797809600830078, "global_step": 311238, "epoch": 3749} {"train_loss": -25.492231369018555, "global_step": 311239, "epoch": 3749} {"train_loss": -25.506362915039062, "global_step": 311240, "epoch": 3749} {"train_loss": -25.526426315307617, "global_step": 311241, "epoch": 3749} {"train_loss": -25.54952049255371, "global_step": 311242, "epoch": 3749} {"train_loss": -25.954015731811523, "global_step": 311243, "epoch": 3749} {"train_loss": -25.67427635192871, "global_step": 311244, "epoch": 3749} {"train_loss": -25.97429847717285, "global_step": 311245, "epoch": 3749} {"train_loss": -25.249135971069336, "global_step": 311246, "epoch": 3749} {"train_loss": -25.922958374023438, "global_step": 311247, "epoch": 3749} {"train_loss": -26.01202964782715, "global_step": 311248, "epoch": 3749} {"train_loss": -25.681905930300793, "global_step": 311249, "epoch": 3749, "val_loss": 7506331.5} {"train_loss": -23.373849868774414, "global_step": 311250, "epoch": 3750} {"train_loss": -24.712514877319336, "global_step": 311251, "epoch": 3750} {"train_loss": -24.06146812438965, "global_step": 311252, "epoch": 3750} {"train_loss": -24.276182174682617, "global_step": 311253, "epoch": 3750} {"train_loss": -23.753568649291992, "global_step": 311254, "epoch": 3750} {"train_loss": -25.11289405822754, "global_step": 311255, "epoch": 3750} {"train_loss": -24.676069259643555, "global_step": 311256, "epoch": 3750} {"train_loss": -24.935199737548828, "global_step": 311257, "epoch": 3750} {"train_loss": -25.050973892211914, "global_step": 311258, "epoch": 3750} {"train_loss": -24.795690536499023, "global_step": 311259, "epoch": 3750} {"train_loss": -25.377662658691406, "global_step": 311260, "epoch": 3750} {"train_loss": -24.6861515045166, "global_step": 311261, "epoch": 3750} {"train_loss": -24.99900245666504, "global_step": 311262, "epoch": 3750} {"train_loss": -24.967227935791016, "global_step": 311263, "epoch": 3750} {"train_loss": -25.043954849243164, "global_step": 311264, "epoch": 3750} {"train_loss": -25.009389877319336, "global_step": 311265, "epoch": 3750} {"train_loss": -25.262725830078125, "global_step": 311266, "epoch": 3750} {"train_loss": -25.106327056884766, "global_step": 311267, "epoch": 3750} {"train_loss": -25.435659408569336, "global_step": 311268, "epoch": 3750} {"train_loss": -25.440271377563477, "global_step": 311269, "epoch": 3750} {"train_loss": -25.538604736328125, "global_step": 311270, "epoch": 3750} {"train_loss": -25.695056915283203, "global_step": 311271, "epoch": 3750} {"train_loss": -25.527387619018555, "global_step": 311272, "epoch": 3750} {"train_loss": -25.345090866088867, "global_step": 311273, "epoch": 3750} {"train_loss": -25.428970336914062, "global_step": 311274, "epoch": 3750} {"train_loss": -25.431589126586914, "global_step": 311275, "epoch": 3750} {"train_loss": -25.415077209472656, "global_step": 311276, "epoch": 3750} {"train_loss": -25.539464950561523, "global_step": 311277, "epoch": 3750} {"train_loss": -25.45659828186035, "global_step": 311278, "epoch": 3750} {"train_loss": -25.62029457092285, "global_step": 311279, "epoch": 3750} {"train_loss": -25.544153213500977, "global_step": 311280, "epoch": 3750} {"train_loss": -25.22344398498535, "global_step": 311281, "epoch": 3750} {"train_loss": -25.62396812438965, "global_step": 311282, "epoch": 3750} {"train_loss": -25.58802032470703, "global_step": 311283, "epoch": 3750} {"train_loss": -25.826618194580078, "global_step": 311284, "epoch": 3750} {"train_loss": -25.674182891845703, "global_step": 311285, "epoch": 3750} {"train_loss": -25.90093994140625, "global_step": 311286, "epoch": 3750} {"train_loss": -25.91948890686035, "global_step": 311287, "epoch": 3750} {"train_loss": -25.296798706054688, "global_step": 311288, "epoch": 3750} {"train_loss": -25.48172378540039, "global_step": 311289, "epoch": 3750} {"train_loss": -26.05769157409668, "global_step": 311290, "epoch": 3750} {"train_loss": -25.939411163330078, "global_step": 311291, "epoch": 3750} {"train_loss": -25.822004318237305, "global_step": 311292, "epoch": 3750} {"train_loss": -25.308008193969727, "global_step": 311293, "epoch": 3750} {"train_loss": -25.609830856323242, "global_step": 311294, "epoch": 3750} {"train_loss": -25.438955307006836, "global_step": 311295, "epoch": 3750} {"train_loss": -25.6042423248291, "global_step": 311296, "epoch": 3750} {"train_loss": -25.931854248046875, "global_step": 311297, "epoch": 3750} {"train_loss": -25.788732528686523, "global_step": 311298, "epoch": 3750} {"train_loss": -25.938602447509766, "global_step": 311299, "epoch": 3750} {"train_loss": -25.916101455688477, "global_step": 311300, "epoch": 3750} {"train_loss": -26.025699615478516, "global_step": 311301, "epoch": 3750} {"train_loss": -25.95551872253418, "global_step": 311302, "epoch": 3750} {"train_loss": -25.875654220581055, "global_step": 311303, "epoch": 3750} {"train_loss": -25.962018966674805, "global_step": 311304, "epoch": 3750} {"train_loss": -26.138151168823242, "global_step": 311305, "epoch": 3750} {"train_loss": -26.060169219970703, "global_step": 311306, "epoch": 3750} {"train_loss": -25.735986709594727, "global_step": 311307, "epoch": 3750} {"train_loss": -25.89031982421875, "global_step": 311308, "epoch": 3750} {"train_loss": -25.539113998413086, "global_step": 311309, "epoch": 3750} {"train_loss": -25.704456329345703, "global_step": 311310, "epoch": 3750} {"train_loss": -25.87841796875, "global_step": 311311, "epoch": 3750} {"train_loss": -25.75494384765625, "global_step": 311312, "epoch": 3750} {"train_loss": -25.82318687438965, "global_step": 311313, "epoch": 3750} {"train_loss": -26.027923583984375, "global_step": 311314, "epoch": 3750} {"train_loss": -25.683286666870117, "global_step": 311315, "epoch": 3750} {"train_loss": -25.945514678955078, "global_step": 311316, "epoch": 3750} {"train_loss": -25.819080352783203, "global_step": 311317, "epoch": 3750} {"train_loss": -25.94427490234375, "global_step": 311318, "epoch": 3750} {"train_loss": -25.436731338500977, "global_step": 311319, "epoch": 3750} {"train_loss": -25.814090728759766, "global_step": 311320, "epoch": 3750} {"train_loss": -25.26651954650879, "global_step": 311321, "epoch": 3750} {"train_loss": -25.479841232299805, "global_step": 311322, "epoch": 3750} {"train_loss": -25.733779907226562, "global_step": 311323, "epoch": 3750} {"train_loss": -26.2059268951416, "global_step": 311324, "epoch": 3750} {"train_loss": -25.857709884643555, "global_step": 311325, "epoch": 3750} {"train_loss": -26.003448486328125, "global_step": 311326, "epoch": 3750} {"train_loss": -26.26581382751465, "global_step": 311327, "epoch": 3750} {"train_loss": -25.8255558013916, "global_step": 311328, "epoch": 3750} {"train_loss": -26.32379722595215, "global_step": 311329, "epoch": 3750} {"train_loss": -25.957660675048828, "global_step": 311330, "epoch": 3750} {"train_loss": -26.00677490234375, "global_step": 311331, "epoch": 3750} {"train_loss": -25.51448826617505, "global_step": 311332, "epoch": 3750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.7727272727272727, "val_loss": 7174589.5} {"train_loss": -25.7133731842041, "global_step": 311333, "epoch": 3751} {"train_loss": -25.6796932220459, "global_step": 311334, "epoch": 3751} {"train_loss": -25.78474235534668, "global_step": 311335, "epoch": 3751} {"train_loss": -25.318029403686523, "global_step": 311336, "epoch": 3751} {"train_loss": -25.54583168029785, "global_step": 311337, "epoch": 3751} {"train_loss": -25.040719985961914, "global_step": 311338, "epoch": 3751} {"train_loss": -25.773191452026367, "global_step": 311339, "epoch": 3751} {"train_loss": -25.222148895263672, "global_step": 311340, "epoch": 3751} {"train_loss": -25.800220489501953, "global_step": 311341, "epoch": 3751} {"train_loss": -25.37896728515625, "global_step": 311342, "epoch": 3751} {"train_loss": -25.217138290405273, "global_step": 311343, "epoch": 3751} {"train_loss": -25.25684928894043, "global_step": 311344, "epoch": 3751} {"train_loss": -25.611555099487305, "global_step": 311345, "epoch": 3751} {"train_loss": -25.8686580657959, "global_step": 311346, "epoch": 3751} {"train_loss": -25.360807418823242, "global_step": 311347, "epoch": 3751} {"train_loss": -25.418371200561523, "global_step": 311348, "epoch": 3751} {"train_loss": -25.7054500579834, "global_step": 311349, "epoch": 3751} {"train_loss": -25.670690536499023, "global_step": 311350, "epoch": 3751} {"train_loss": -25.99358558654785, "global_step": 311351, "epoch": 3751} {"train_loss": -25.459096908569336, "global_step": 311352, "epoch": 3751} {"train_loss": -25.797971725463867, "global_step": 311353, "epoch": 3751} {"train_loss": -25.691946029663086, "global_step": 311354, "epoch": 3751} {"train_loss": -25.89114761352539, "global_step": 311355, "epoch": 3751} {"train_loss": -26.022443771362305, "global_step": 311356, "epoch": 3751} {"train_loss": -25.546545028686523, "global_step": 311357, "epoch": 3751} {"train_loss": -25.881027221679688, "global_step": 311358, "epoch": 3751} {"train_loss": -25.534854888916016, "global_step": 311359, "epoch": 3751} {"train_loss": -25.76828956604004, "global_step": 311360, "epoch": 3751} {"train_loss": -25.928308486938477, "global_step": 311361, "epoch": 3751} {"train_loss": -25.4869327545166, "global_step": 311362, "epoch": 3751} {"train_loss": -25.582469940185547, "global_step": 311363, "epoch": 3751} {"train_loss": -25.732406616210938, "global_step": 311364, "epoch": 3751} {"train_loss": -25.413780212402344, "global_step": 311365, "epoch": 3751} {"train_loss": -25.882644653320312, "global_step": 311366, "epoch": 3751} {"train_loss": -25.807601928710938, "global_step": 311367, "epoch": 3751} {"train_loss": -25.8297119140625, "global_step": 311368, "epoch": 3751} {"train_loss": -26.003860473632812, "global_step": 311369, "epoch": 3751} {"train_loss": -25.719207763671875, "global_step": 311370, "epoch": 3751} {"train_loss": -25.77569007873535, "global_step": 311371, "epoch": 3751} {"train_loss": -25.853185653686523, "global_step": 311372, "epoch": 3751} {"train_loss": -25.750165939331055, "global_step": 311373, "epoch": 3751} {"train_loss": -25.956892013549805, "global_step": 311374, "epoch": 3751} {"train_loss": -25.64243507385254, "global_step": 311375, "epoch": 3751} {"train_loss": -25.498199462890625, "global_step": 311376, "epoch": 3751} {"train_loss": -25.60162925720215, "global_step": 311377, "epoch": 3751} {"train_loss": -26.066980361938477, "global_step": 311378, "epoch": 3751} {"train_loss": -26.38718032836914, "global_step": 311379, "epoch": 3751} {"train_loss": -25.645217895507812, "global_step": 311380, "epoch": 3751} {"train_loss": -25.488203048706055, "global_step": 311381, "epoch": 3751} {"train_loss": -26.059247970581055, "global_step": 311382, "epoch": 3751} {"train_loss": -25.5252685546875, "global_step": 311383, "epoch": 3751} {"train_loss": -25.689167022705078, "global_step": 311384, "epoch": 3751} {"train_loss": -26.1004638671875, "global_step": 311385, "epoch": 3751} {"train_loss": -26.018096923828125, "global_step": 311386, "epoch": 3751} {"train_loss": -25.7120304107666, "global_step": 311387, "epoch": 3751} {"train_loss": -25.589447021484375, "global_step": 311388, "epoch": 3751} {"train_loss": -25.61907386779785, "global_step": 311389, "epoch": 3751} {"train_loss": -25.68934440612793, "global_step": 311390, "epoch": 3751} {"train_loss": -25.788543701171875, "global_step": 311391, "epoch": 3751} {"train_loss": -25.704965591430664, "global_step": 311392, "epoch": 3751} {"train_loss": -25.733596801757812, "global_step": 311393, "epoch": 3751} {"train_loss": -26.019514083862305, "global_step": 311394, "epoch": 3751} {"train_loss": -25.82305335998535, "global_step": 311395, "epoch": 3751} {"train_loss": -25.2691707611084, "global_step": 311396, "epoch": 3751} {"train_loss": -25.551380157470703, "global_step": 311397, "epoch": 3751} {"train_loss": -25.993078231811523, "global_step": 311398, "epoch": 3751} {"train_loss": -26.023731231689453, "global_step": 311399, "epoch": 3751} {"train_loss": -25.288488388061523, "global_step": 311400, "epoch": 3751} {"train_loss": -26.0531005859375, "global_step": 311401, "epoch": 3751} {"train_loss": -25.671323776245117, "global_step": 311402, "epoch": 3751} {"train_loss": -25.519134521484375, "global_step": 311403, "epoch": 3751} {"train_loss": -25.58674430847168, "global_step": 311404, "epoch": 3751} {"train_loss": -25.309757232666016, "global_step": 311405, "epoch": 3751} {"train_loss": -25.702075958251953, "global_step": 311406, "epoch": 3751} {"train_loss": -25.518285751342773, "global_step": 311407, "epoch": 3751} {"train_loss": -25.520156860351562, "global_step": 311408, "epoch": 3751} {"train_loss": -25.71710205078125, "global_step": 311409, "epoch": 3751} {"train_loss": -25.41175079345703, "global_step": 311410, "epoch": 3751} {"train_loss": -25.8526611328125, "global_step": 311411, "epoch": 3751} {"train_loss": -25.74769401550293, "global_step": 311412, "epoch": 3751} {"train_loss": -25.824298858642578, "global_step": 311413, "epoch": 3751} {"train_loss": -25.8211727142334, "global_step": 311414, "epoch": 3751} {"train_loss": -25.683436106486493, "global_step": 311415, "epoch": 3751, "val_loss": 7372649.0} {"train_loss": -25.341373443603516, "global_step": 311416, "epoch": 3752} {"train_loss": -25.346866607666016, "global_step": 311417, "epoch": 3752} {"train_loss": -24.918272018432617, "global_step": 311418, "epoch": 3752} {"train_loss": -25.26488494873047, "global_step": 311419, "epoch": 3752} {"train_loss": -25.33030128479004, "global_step": 311420, "epoch": 3752} {"train_loss": -25.131383895874023, "global_step": 311421, "epoch": 3752} {"train_loss": -25.36405372619629, "global_step": 311422, "epoch": 3752} {"train_loss": -25.65537452697754, "global_step": 311423, "epoch": 3752} {"train_loss": -25.48920440673828, "global_step": 311424, "epoch": 3752} {"train_loss": -25.101938247680664, "global_step": 311425, "epoch": 3752} {"train_loss": -25.322446823120117, "global_step": 311426, "epoch": 3752} {"train_loss": -25.191253662109375, "global_step": 311427, "epoch": 3752} {"train_loss": -25.43143653869629, "global_step": 311428, "epoch": 3752} {"train_loss": -25.499113082885742, "global_step": 311429, "epoch": 3752} {"train_loss": -25.77808952331543, "global_step": 311430, "epoch": 3752} {"train_loss": -25.651639938354492, "global_step": 311431, "epoch": 3752} {"train_loss": -25.546178817749023, "global_step": 311432, "epoch": 3752} {"train_loss": -25.705520629882812, "global_step": 311433, "epoch": 3752} {"train_loss": -25.54212760925293, "global_step": 311434, "epoch": 3752} {"train_loss": -25.815570831298828, "global_step": 311435, "epoch": 3752} {"train_loss": -25.8091983795166, "global_step": 311436, "epoch": 3752} {"train_loss": -25.552032470703125, "global_step": 311437, "epoch": 3752} {"train_loss": -25.58728790283203, "global_step": 311438, "epoch": 3752} {"train_loss": -25.932233810424805, "global_step": 311439, "epoch": 3752} {"train_loss": -25.70664405822754, "global_step": 311440, "epoch": 3752} {"train_loss": -25.80169677734375, "global_step": 311441, "epoch": 3752} {"train_loss": -25.473417282104492, "global_step": 311442, "epoch": 3752} {"train_loss": -25.814176559448242, "global_step": 311443, "epoch": 3752} {"train_loss": -25.82234001159668, "global_step": 311444, "epoch": 3752} {"train_loss": -25.789371490478516, "global_step": 311445, "epoch": 3752} {"train_loss": -25.39909553527832, "global_step": 311446, "epoch": 3752} {"train_loss": -25.75058937072754, "global_step": 311447, "epoch": 3752} {"train_loss": -25.685407638549805, "global_step": 311448, "epoch": 3752} {"train_loss": -25.71219825744629, "global_step": 311449, "epoch": 3752} {"train_loss": -26.375402450561523, "global_step": 311450, "epoch": 3752} {"train_loss": -26.239749908447266, "global_step": 311451, "epoch": 3752} {"train_loss": -25.878223419189453, "global_step": 311452, "epoch": 3752} {"train_loss": -25.78057861328125, "global_step": 311453, "epoch": 3752} {"train_loss": -25.876972198486328, "global_step": 311454, "epoch": 3752} {"train_loss": -25.996992111206055, "global_step": 311455, "epoch": 3752} {"train_loss": -25.79665184020996, "global_step": 311456, "epoch": 3752} {"train_loss": -26.107709884643555, "global_step": 311457, "epoch": 3752} {"train_loss": -26.310331344604492, "global_step": 311458, "epoch": 3752} {"train_loss": -26.152257919311523, "global_step": 311459, "epoch": 3752} {"train_loss": -25.896787643432617, "global_step": 311460, "epoch": 3752} {"train_loss": -25.791364669799805, "global_step": 311461, "epoch": 3752} {"train_loss": -26.023374557495117, "global_step": 311462, "epoch": 3752} {"train_loss": -25.92250633239746, "global_step": 311463, "epoch": 3752} {"train_loss": -26.069690704345703, "global_step": 311464, "epoch": 3752} {"train_loss": -26.159576416015625, "global_step": 311465, "epoch": 3752} {"train_loss": -26.17514991760254, "global_step": 311466, "epoch": 3752} {"train_loss": -25.828699111938477, "global_step": 311467, "epoch": 3752} {"train_loss": -25.631399154663086, "global_step": 311468, "epoch": 3752} {"train_loss": -25.609882354736328, "global_step": 311469, "epoch": 3752} {"train_loss": -25.009119033813477, "global_step": 311470, "epoch": 3752} {"train_loss": -25.296527862548828, "global_step": 311471, "epoch": 3752} {"train_loss": -25.931049346923828, "global_step": 311472, "epoch": 3752} {"train_loss": -25.73565101623535, "global_step": 311473, "epoch": 3752} {"train_loss": -25.824039459228516, "global_step": 311474, "epoch": 3752} {"train_loss": -25.69740104675293, "global_step": 311475, "epoch": 3752} {"train_loss": -25.394485473632812, "global_step": 311476, "epoch": 3752} {"train_loss": -25.61406898498535, "global_step": 311477, "epoch": 3752} {"train_loss": -25.84328269958496, "global_step": 311478, "epoch": 3752} {"train_loss": -25.870447158813477, "global_step": 311479, "epoch": 3752} {"train_loss": -25.77424430847168, "global_step": 311480, "epoch": 3752} {"train_loss": -25.61557388305664, "global_step": 311481, "epoch": 3752} {"train_loss": -26.1734676361084, "global_step": 311482, "epoch": 3752} {"train_loss": -26.103946685791016, "global_step": 311483, "epoch": 3752} {"train_loss": -25.849838256835938, "global_step": 311484, "epoch": 3752} {"train_loss": -26.0751953125, "global_step": 311485, "epoch": 3752} {"train_loss": -25.989160537719727, "global_step": 311486, "epoch": 3752} {"train_loss": -25.55891990661621, "global_step": 311487, "epoch": 3752} {"train_loss": -25.4559383392334, "global_step": 311488, "epoch": 3752} {"train_loss": -25.600866317749023, "global_step": 311489, "epoch": 3752} {"train_loss": -25.978235244750977, "global_step": 311490, "epoch": 3752} {"train_loss": -25.965070724487305, "global_step": 311491, "epoch": 3752} {"train_loss": -25.783292770385742, "global_step": 311492, "epoch": 3752} {"train_loss": -25.682035446166992, "global_step": 311493, "epoch": 3752} {"train_loss": -25.669971466064453, "global_step": 311494, "epoch": 3752} {"train_loss": -25.492177963256836, "global_step": 311495, "epoch": 3752} {"train_loss": -25.8402099609375, "global_step": 311496, "epoch": 3752} {"train_loss": -26.00189781188965, "global_step": 311497, "epoch": 3752} {"train_loss": -25.715060475360918, "global_step": 311498, "epoch": 3752, "val_loss": 7332119.0} {"train_loss": -25.1474609375, "global_step": 311499, "epoch": 3753} {"train_loss": -25.030166625976562, "global_step": 311500, "epoch": 3753} {"train_loss": -24.919734954833984, "global_step": 311501, "epoch": 3753} {"train_loss": -24.996139526367188, "global_step": 311502, "epoch": 3753} {"train_loss": -24.722806930541992, "global_step": 311503, "epoch": 3753} {"train_loss": -25.076969146728516, "global_step": 311504, "epoch": 3753} {"train_loss": -25.19826316833496, "global_step": 311505, "epoch": 3753} {"train_loss": -25.15399742126465, "global_step": 311506, "epoch": 3753} {"train_loss": -25.290225982666016, "global_step": 311507, "epoch": 3753} {"train_loss": -25.473281860351562, "global_step": 311508, "epoch": 3753} {"train_loss": -25.27738380432129, "global_step": 311509, "epoch": 3753} {"train_loss": -25.543119430541992, "global_step": 311510, "epoch": 3753} {"train_loss": -25.372743606567383, "global_step": 311511, "epoch": 3753} {"train_loss": -25.377744674682617, "global_step": 311512, "epoch": 3753} {"train_loss": -25.426782608032227, "global_step": 311513, "epoch": 3753} {"train_loss": -25.119789123535156, "global_step": 311514, "epoch": 3753} {"train_loss": -25.559995651245117, "global_step": 311515, "epoch": 3753} {"train_loss": -25.563152313232422, "global_step": 311516, "epoch": 3753} {"train_loss": -25.876327514648438, "global_step": 311517, "epoch": 3753} {"train_loss": -25.312192916870117, "global_step": 311518, "epoch": 3753} {"train_loss": -25.821542739868164, "global_step": 311519, "epoch": 3753} {"train_loss": -25.60161781311035, "global_step": 311520, "epoch": 3753} {"train_loss": -25.452091217041016, "global_step": 311521, "epoch": 3753} {"train_loss": -25.36323356628418, "global_step": 311522, "epoch": 3753} {"train_loss": -25.928791046142578, "global_step": 311523, "epoch": 3753} {"train_loss": -25.6731014251709, "global_step": 311524, "epoch": 3753} {"train_loss": -25.76984977722168, "global_step": 311525, "epoch": 3753} {"train_loss": -25.54166603088379, "global_step": 311526, "epoch": 3753} {"train_loss": -25.968219757080078, "global_step": 311527, "epoch": 3753} {"train_loss": -25.972564697265625, "global_step": 311528, "epoch": 3753} {"train_loss": -25.545602798461914, "global_step": 311529, "epoch": 3753} {"train_loss": -25.824234008789062, "global_step": 311530, "epoch": 3753} {"train_loss": -25.819852828979492, "global_step": 311531, "epoch": 3753} {"train_loss": -25.903152465820312, "global_step": 311532, "epoch": 3753} {"train_loss": -25.98567771911621, "global_step": 311533, "epoch": 3753} {"train_loss": -25.73853874206543, "global_step": 311534, "epoch": 3753} {"train_loss": -25.8542537689209, "global_step": 311535, "epoch": 3753} {"train_loss": -25.781665802001953, "global_step": 311536, "epoch": 3753} {"train_loss": -25.312055587768555, "global_step": 311537, "epoch": 3753} {"train_loss": -25.65056800842285, "global_step": 311538, "epoch": 3753} {"train_loss": -26.030969619750977, "global_step": 311539, "epoch": 3753} {"train_loss": -25.478124618530273, "global_step": 311540, "epoch": 3753} {"train_loss": -25.529197692871094, "global_step": 311541, "epoch": 3753} {"train_loss": -25.76690673828125, "global_step": 311542, "epoch": 3753} {"train_loss": -25.54443359375, "global_step": 311543, "epoch": 3753} {"train_loss": -25.34416961669922, "global_step": 311544, "epoch": 3753} {"train_loss": -25.897409439086914, "global_step": 311545, "epoch": 3753} {"train_loss": -25.381744384765625, "global_step": 311546, "epoch": 3753} {"train_loss": -25.733930587768555, "global_step": 311547, "epoch": 3753} {"train_loss": -25.772592544555664, "global_step": 311548, "epoch": 3753} {"train_loss": -25.453433990478516, "global_step": 311549, "epoch": 3753} {"train_loss": -25.819477081298828, "global_step": 311550, "epoch": 3753} {"train_loss": -25.833541870117188, "global_step": 311551, "epoch": 3753} {"train_loss": -25.594440460205078, "global_step": 311552, "epoch": 3753} {"train_loss": -25.77046012878418, "global_step": 311553, "epoch": 3753} {"train_loss": -25.82869529724121, "global_step": 311554, "epoch": 3753} {"train_loss": -25.59880828857422, "global_step": 311555, "epoch": 3753} {"train_loss": -25.746801376342773, "global_step": 311556, "epoch": 3753} {"train_loss": -25.801349639892578, "global_step": 311557, "epoch": 3753} {"train_loss": -25.5390682220459, "global_step": 311558, "epoch": 3753} {"train_loss": -26.22199821472168, "global_step": 311559, "epoch": 3753} {"train_loss": -25.988004684448242, "global_step": 311560, "epoch": 3753} {"train_loss": -26.004980087280273, "global_step": 311561, "epoch": 3753} {"train_loss": -25.85438346862793, "global_step": 311562, "epoch": 3753} {"train_loss": -25.7611141204834, "global_step": 311563, "epoch": 3753} {"train_loss": -25.960193634033203, "global_step": 311564, "epoch": 3753} {"train_loss": -25.97858238220215, "global_step": 311565, "epoch": 3753} {"train_loss": -25.932647705078125, "global_step": 311566, "epoch": 3753} {"train_loss": -25.72959327697754, "global_step": 311567, "epoch": 3753} {"train_loss": -26.086368560791016, "global_step": 311568, "epoch": 3753} {"train_loss": -26.004446029663086, "global_step": 311569, "epoch": 3753} {"train_loss": -25.90705680847168, "global_step": 311570, "epoch": 3753} {"train_loss": -25.55138397216797, "global_step": 311571, "epoch": 3753} {"train_loss": -26.035736083984375, "global_step": 311572, "epoch": 3753} {"train_loss": -25.861791610717773, "global_step": 311573, "epoch": 3753} {"train_loss": -25.550424575805664, "global_step": 311574, "epoch": 3753} {"train_loss": -25.611358642578125, "global_step": 311575, "epoch": 3753} {"train_loss": -26.023466110229492, "global_step": 311576, "epoch": 3753} {"train_loss": -25.541519165039062, "global_step": 311577, "epoch": 3753} {"train_loss": -25.556005477905273, "global_step": 311578, "epoch": 3753} {"train_loss": -25.64863395690918, "global_step": 311579, "epoch": 3753} {"train_loss": -25.90616226196289, "global_step": 311580, "epoch": 3753} {"train_loss": -25.63359359373529, "global_step": 311581, "epoch": 3753, "val_loss": 7357975.5} {"train_loss": -24.9042911529541, "global_step": 311582, "epoch": 3754} {"train_loss": -25.152528762817383, "global_step": 311583, "epoch": 3754} {"train_loss": -25.252883911132812, "global_step": 311584, "epoch": 3754} {"train_loss": -24.896793365478516, "global_step": 311585, "epoch": 3754} {"train_loss": -25.67138671875, "global_step": 311586, "epoch": 3754} {"train_loss": -25.2586727142334, "global_step": 311587, "epoch": 3754} {"train_loss": -25.37188148498535, "global_step": 311588, "epoch": 3754} {"train_loss": -25.12563133239746, "global_step": 311589, "epoch": 3754} {"train_loss": -25.428754806518555, "global_step": 311590, "epoch": 3754} {"train_loss": -25.515623092651367, "global_step": 311591, "epoch": 3754} {"train_loss": -25.65053367614746, "global_step": 311592, "epoch": 3754} {"train_loss": -25.639570236206055, "global_step": 311593, "epoch": 3754} {"train_loss": -25.35455322265625, "global_step": 311594, "epoch": 3754} {"train_loss": -25.598596572875977, "global_step": 311595, "epoch": 3754} {"train_loss": -25.331205368041992, "global_step": 311596, "epoch": 3754} {"train_loss": -25.68158531188965, "global_step": 311597, "epoch": 3754} {"train_loss": -25.60330581665039, "global_step": 311598, "epoch": 3754} {"train_loss": -25.272754669189453, "global_step": 311599, "epoch": 3754} {"train_loss": -25.31532096862793, "global_step": 311600, "epoch": 3754} {"train_loss": -25.618148803710938, "global_step": 311601, "epoch": 3754} {"train_loss": -25.090551376342773, "global_step": 311602, "epoch": 3754} {"train_loss": -24.967405319213867, "global_step": 311603, "epoch": 3754} {"train_loss": -25.4338321685791, "global_step": 311604, "epoch": 3754} {"train_loss": -25.82919692993164, "global_step": 311605, "epoch": 3754} {"train_loss": -25.55646324157715, "global_step": 311606, "epoch": 3754} {"train_loss": -25.58492088317871, "global_step": 311607, "epoch": 3754} {"train_loss": -25.459718704223633, "global_step": 311608, "epoch": 3754} {"train_loss": -25.59162712097168, "global_step": 311609, "epoch": 3754} {"train_loss": -25.73943519592285, "global_step": 311610, "epoch": 3754} {"train_loss": -25.411664962768555, "global_step": 311611, "epoch": 3754} {"train_loss": -25.109045028686523, "global_step": 311612, "epoch": 3754} {"train_loss": -25.811811447143555, "global_step": 311613, "epoch": 3754} {"train_loss": -25.582448959350586, "global_step": 311614, "epoch": 3754} {"train_loss": -26.07183265686035, "global_step": 311615, "epoch": 3754} {"train_loss": -25.474157333374023, "global_step": 311616, "epoch": 3754} {"train_loss": -25.94764518737793, "global_step": 311617, "epoch": 3754} {"train_loss": -25.838415145874023, "global_step": 311618, "epoch": 3754} {"train_loss": -25.632688522338867, "global_step": 311619, "epoch": 3754} {"train_loss": -25.650415420532227, "global_step": 311620, "epoch": 3754} {"train_loss": -25.912622451782227, "global_step": 311621, "epoch": 3754} {"train_loss": -25.766897201538086, "global_step": 311622, "epoch": 3754} {"train_loss": -25.728748321533203, "global_step": 311623, "epoch": 3754} {"train_loss": -25.569988250732422, "global_step": 311624, "epoch": 3754} {"train_loss": -26.202138900756836, "global_step": 311625, "epoch": 3754} {"train_loss": -25.683944702148438, "global_step": 311626, "epoch": 3754} {"train_loss": -25.711776733398438, "global_step": 311627, "epoch": 3754} {"train_loss": -25.77618408203125, "global_step": 311628, "epoch": 3754} {"train_loss": -26.0355281829834, "global_step": 311629, "epoch": 3754} {"train_loss": -25.76605796813965, "global_step": 311630, "epoch": 3754} {"train_loss": -25.838775634765625, "global_step": 311631, "epoch": 3754} {"train_loss": -26.072378158569336, "global_step": 311632, "epoch": 3754} {"train_loss": -25.728559494018555, "global_step": 311633, "epoch": 3754} {"train_loss": -26.09687614440918, "global_step": 311634, "epoch": 3754} {"train_loss": -26.41754722595215, "global_step": 311635, "epoch": 3754} {"train_loss": -25.762426376342773, "global_step": 311636, "epoch": 3754} {"train_loss": -25.97413444519043, "global_step": 311637, "epoch": 3754} {"train_loss": -25.829700469970703, "global_step": 311638, "epoch": 3754} {"train_loss": -25.854690551757812, "global_step": 311639, "epoch": 3754} {"train_loss": -26.268014907836914, "global_step": 311640, "epoch": 3754} {"train_loss": -25.69852066040039, "global_step": 311641, "epoch": 3754} {"train_loss": -26.07655906677246, "global_step": 311642, "epoch": 3754} {"train_loss": -25.784040451049805, "global_step": 311643, "epoch": 3754} {"train_loss": -25.64192008972168, "global_step": 311644, "epoch": 3754} {"train_loss": -25.92333984375, "global_step": 311645, "epoch": 3754} {"train_loss": -25.410419464111328, "global_step": 311646, "epoch": 3754} {"train_loss": -25.82430076599121, "global_step": 311647, "epoch": 3754} {"train_loss": -26.112567901611328, "global_step": 311648, "epoch": 3754} {"train_loss": -26.048627853393555, "global_step": 311649, "epoch": 3754} {"train_loss": -26.08905601501465, "global_step": 311650, "epoch": 3754} {"train_loss": -25.82083511352539, "global_step": 311651, "epoch": 3754} {"train_loss": -25.59962272644043, "global_step": 311652, "epoch": 3754} {"train_loss": -25.700448989868164, "global_step": 311653, "epoch": 3754} {"train_loss": -25.817691802978516, "global_step": 311654, "epoch": 3754} {"train_loss": -25.969863891601562, "global_step": 311655, "epoch": 3754} {"train_loss": -26.018024444580078, "global_step": 311656, "epoch": 3754} {"train_loss": -26.170881271362305, "global_step": 311657, "epoch": 3754} {"train_loss": -25.891111373901367, "global_step": 311658, "epoch": 3754} {"train_loss": -25.981815338134766, "global_step": 311659, "epoch": 3754} {"train_loss": -26.0129337310791, "global_step": 311660, "epoch": 3754} {"train_loss": -25.994800567626953, "global_step": 311661, "epoch": 3754} {"train_loss": -25.81379508972168, "global_step": 311662, "epoch": 3754} {"train_loss": -26.043704986572266, "global_step": 311663, "epoch": 3754} {"train_loss": -25.680987415543523, "global_step": 311664, "epoch": 3754, "val_loss": 7317064.0} {"train_loss": -25.034318923950195, "global_step": 311665, "epoch": 3755} {"train_loss": -25.069591522216797, "global_step": 311666, "epoch": 3755} {"train_loss": -24.89967918395996, "global_step": 311667, "epoch": 3755} {"train_loss": -25.382780075073242, "global_step": 311668, "epoch": 3755} {"train_loss": -25.21187400817871, "global_step": 311669, "epoch": 3755} {"train_loss": -25.67755126953125, "global_step": 311670, "epoch": 3755} {"train_loss": -25.552597045898438, "global_step": 311671, "epoch": 3755} {"train_loss": -25.553131103515625, "global_step": 311672, "epoch": 3755} {"train_loss": -25.271623611450195, "global_step": 311673, "epoch": 3755} {"train_loss": -25.08763885498047, "global_step": 311674, "epoch": 3755} {"train_loss": -25.25150489807129, "global_step": 311675, "epoch": 3755} {"train_loss": -25.54999351501465, "global_step": 311676, "epoch": 3755} {"train_loss": -25.528730392456055, "global_step": 311677, "epoch": 3755} {"train_loss": -25.288949966430664, "global_step": 311678, "epoch": 3755} {"train_loss": -25.363143920898438, "global_step": 311679, "epoch": 3755} {"train_loss": -25.192432403564453, "global_step": 311680, "epoch": 3755} {"train_loss": -25.514524459838867, "global_step": 311681, "epoch": 3755} {"train_loss": -25.690027236938477, "global_step": 311682, "epoch": 3755} {"train_loss": -25.82642936706543, "global_step": 311683, "epoch": 3755} {"train_loss": -25.526094436645508, "global_step": 311684, "epoch": 3755} {"train_loss": -25.683475494384766, "global_step": 311685, "epoch": 3755} {"train_loss": -25.888599395751953, "global_step": 311686, "epoch": 3755} {"train_loss": -25.680957794189453, "global_step": 311687, "epoch": 3755} {"train_loss": -25.514928817749023, "global_step": 311688, "epoch": 3755} {"train_loss": -25.781827926635742, "global_step": 311689, "epoch": 3755} {"train_loss": -25.64689064025879, "global_step": 311690, "epoch": 3755} {"train_loss": -25.60674476623535, "global_step": 311691, "epoch": 3755} {"train_loss": -25.662580490112305, "global_step": 311692, "epoch": 3755} {"train_loss": -25.360443115234375, "global_step": 311693, "epoch": 3755} {"train_loss": -25.555593490600586, "global_step": 311694, "epoch": 3755} {"train_loss": -25.69428825378418, "global_step": 311695, "epoch": 3755} {"train_loss": -25.9755859375, "global_step": 311696, "epoch": 3755} {"train_loss": -25.510791778564453, "global_step": 311697, "epoch": 3755} {"train_loss": -25.720386505126953, "global_step": 311698, "epoch": 3755} {"train_loss": -25.637006759643555, "global_step": 311699, "epoch": 3755} {"train_loss": -26.058324813842773, "global_step": 311700, "epoch": 3755} {"train_loss": -26.002180099487305, "global_step": 311701, "epoch": 3755} {"train_loss": -25.641803741455078, "global_step": 311702, "epoch": 3755} {"train_loss": -26.018522262573242, "global_step": 311703, "epoch": 3755} {"train_loss": -25.690805435180664, "global_step": 311704, "epoch": 3755} {"train_loss": -26.050338745117188, "global_step": 311705, "epoch": 3755} {"train_loss": -25.72686767578125, "global_step": 311706, "epoch": 3755} {"train_loss": -25.986371994018555, "global_step": 311707, "epoch": 3755} {"train_loss": -25.927539825439453, "global_step": 311708, "epoch": 3755} {"train_loss": -26.017194747924805, "global_step": 311709, "epoch": 3755} {"train_loss": -25.975568771362305, "global_step": 311710, "epoch": 3755} {"train_loss": -25.867252349853516, "global_step": 311711, "epoch": 3755} {"train_loss": -25.898080825805664, "global_step": 311712, "epoch": 3755} {"train_loss": -25.96262550354004, "global_step": 311713, "epoch": 3755} {"train_loss": -26.042112350463867, "global_step": 311714, "epoch": 3755} {"train_loss": -26.10931968688965, "global_step": 311715, "epoch": 3755} {"train_loss": -25.759336471557617, "global_step": 311716, "epoch": 3755} {"train_loss": -25.9154109954834, "global_step": 311717, "epoch": 3755} {"train_loss": -25.684879302978516, "global_step": 311718, "epoch": 3755} {"train_loss": -25.459209442138672, "global_step": 311719, "epoch": 3755} {"train_loss": -25.544912338256836, "global_step": 311720, "epoch": 3755} {"train_loss": -25.384401321411133, "global_step": 311721, "epoch": 3755} {"train_loss": -25.54062271118164, "global_step": 311722, "epoch": 3755} {"train_loss": -26.07269287109375, "global_step": 311723, "epoch": 3755} {"train_loss": -26.01397132873535, "global_step": 311724, "epoch": 3755} {"train_loss": -25.873584747314453, "global_step": 311725, "epoch": 3755} {"train_loss": -25.850576400756836, "global_step": 311726, "epoch": 3755} {"train_loss": -26.15473747253418, "global_step": 311727, "epoch": 3755} {"train_loss": -25.851179122924805, "global_step": 311728, "epoch": 3755} {"train_loss": -25.476333618164062, "global_step": 311729, "epoch": 3755} {"train_loss": -25.668975830078125, "global_step": 311730, "epoch": 3755} {"train_loss": -25.851606369018555, "global_step": 311731, "epoch": 3755} {"train_loss": -25.950536727905273, "global_step": 311732, "epoch": 3755} {"train_loss": -25.693273544311523, "global_step": 311733, "epoch": 3755} {"train_loss": -26.1584529876709, "global_step": 311734, "epoch": 3755} {"train_loss": -25.462148666381836, "global_step": 311735, "epoch": 3755} {"train_loss": -25.71537208557129, "global_step": 311736, "epoch": 3755} {"train_loss": -25.7957763671875, "global_step": 311737, "epoch": 3755} {"train_loss": -25.936187744140625, "global_step": 311738, "epoch": 3755} {"train_loss": -25.379140853881836, "global_step": 311739, "epoch": 3755} {"train_loss": -25.194629669189453, "global_step": 311740, "epoch": 3755} {"train_loss": -25.882482528686523, "global_step": 311741, "epoch": 3755} {"train_loss": -25.655792236328125, "global_step": 311742, "epoch": 3755} {"train_loss": -25.687210083007812, "global_step": 311743, "epoch": 3755} {"train_loss": -25.79268455505371, "global_step": 311744, "epoch": 3755} {"train_loss": -25.71053123474121, "global_step": 311745, "epoch": 3755} {"train_loss": -25.89192008972168, "global_step": 311746, "epoch": 3755} {"train_loss": -25.67788859447801, "global_step": 311747, "epoch": 3755, "val_loss": 7375255.0} {"train_loss": -25.490602493286133, "global_step": 311748, "epoch": 3756} {"train_loss": -25.035884857177734, "global_step": 311749, "epoch": 3756} {"train_loss": -24.856332778930664, "global_step": 311750, "epoch": 3756} {"train_loss": -25.07151985168457, "global_step": 311751, "epoch": 3756} {"train_loss": -25.72174072265625, "global_step": 311752, "epoch": 3756} {"train_loss": -25.175695419311523, "global_step": 311753, "epoch": 3756} {"train_loss": -25.44955825805664, "global_step": 311754, "epoch": 3756} {"train_loss": -25.70790672302246, "global_step": 311755, "epoch": 3756} {"train_loss": -25.446943283081055, "global_step": 311756, "epoch": 3756} {"train_loss": -25.410131454467773, "global_step": 311757, "epoch": 3756} {"train_loss": -25.768239974975586, "global_step": 311758, "epoch": 3756} {"train_loss": -25.431461334228516, "global_step": 311759, "epoch": 3756} {"train_loss": -25.621484756469727, "global_step": 311760, "epoch": 3756} {"train_loss": -25.7451229095459, "global_step": 311761, "epoch": 3756} {"train_loss": -25.667333602905273, "global_step": 311762, "epoch": 3756} {"train_loss": -25.696552276611328, "global_step": 311763, "epoch": 3756} {"train_loss": -25.67377281188965, "global_step": 311764, "epoch": 3756} {"train_loss": -25.639148712158203, "global_step": 311765, "epoch": 3756} {"train_loss": -25.81751823425293, "global_step": 311766, "epoch": 3756} {"train_loss": -25.747943878173828, "global_step": 311767, "epoch": 3756} {"train_loss": -25.829938888549805, "global_step": 311768, "epoch": 3756} {"train_loss": -25.71026611328125, "global_step": 311769, "epoch": 3756} {"train_loss": -25.781721115112305, "global_step": 311770, "epoch": 3756} {"train_loss": -25.87582778930664, "global_step": 311771, "epoch": 3756} {"train_loss": -25.88254737854004, "global_step": 311772, "epoch": 3756} {"train_loss": -25.870532989501953, "global_step": 311773, "epoch": 3756} {"train_loss": -25.796125411987305, "global_step": 311774, "epoch": 3756} {"train_loss": -26.014617919921875, "global_step": 311775, "epoch": 3756} {"train_loss": -25.776508331298828, "global_step": 311776, "epoch": 3756} {"train_loss": -25.622053146362305, "global_step": 311777, "epoch": 3756} {"train_loss": -25.83176040649414, "global_step": 311778, "epoch": 3756} {"train_loss": -26.004812240600586, "global_step": 311779, "epoch": 3756} {"train_loss": -25.547222137451172, "global_step": 311780, "epoch": 3756} {"train_loss": -25.588977813720703, "global_step": 311781, "epoch": 3756} {"train_loss": -25.470230102539062, "global_step": 311782, "epoch": 3756} {"train_loss": -25.90059471130371, "global_step": 311783, "epoch": 3756} {"train_loss": -25.694143295288086, "global_step": 311784, "epoch": 3756} {"train_loss": -25.337804794311523, "global_step": 311785, "epoch": 3756} {"train_loss": -25.43657684326172, "global_step": 311786, "epoch": 3756} {"train_loss": -25.578479766845703, "global_step": 311787, "epoch": 3756} {"train_loss": -25.6393985748291, "global_step": 311788, "epoch": 3756} {"train_loss": -24.714426040649414, "global_step": 311789, "epoch": 3756} {"train_loss": -25.66346549987793, "global_step": 311790, "epoch": 3756} {"train_loss": -25.77240562438965, "global_step": 311791, "epoch": 3756} {"train_loss": -25.263147354125977, "global_step": 311792, "epoch": 3756} {"train_loss": -25.304407119750977, "global_step": 311793, "epoch": 3756} {"train_loss": -25.085556030273438, "global_step": 311794, "epoch": 3756} {"train_loss": -25.789793014526367, "global_step": 311795, "epoch": 3756} {"train_loss": -25.101539611816406, "global_step": 311796, "epoch": 3756} {"train_loss": -25.785892486572266, "global_step": 311797, "epoch": 3756} {"train_loss": -25.566272735595703, "global_step": 311798, "epoch": 3756} {"train_loss": -25.9709415435791, "global_step": 311799, "epoch": 3756} {"train_loss": -25.24762535095215, "global_step": 311800, "epoch": 3756} {"train_loss": -25.4848690032959, "global_step": 311801, "epoch": 3756} {"train_loss": -25.898792266845703, "global_step": 311802, "epoch": 3756} {"train_loss": -25.951770782470703, "global_step": 311803, "epoch": 3756} {"train_loss": -25.75044822692871, "global_step": 311804, "epoch": 3756} {"train_loss": -25.8020076751709, "global_step": 311805, "epoch": 3756} {"train_loss": -25.40336036682129, "global_step": 311806, "epoch": 3756} {"train_loss": -25.383481979370117, "global_step": 311807, "epoch": 3756} {"train_loss": -25.8288516998291, "global_step": 311808, "epoch": 3756} {"train_loss": -25.811521530151367, "global_step": 311809, "epoch": 3756} {"train_loss": -25.517635345458984, "global_step": 311810, "epoch": 3756} {"train_loss": -25.86146354675293, "global_step": 311811, "epoch": 3756} {"train_loss": -25.54762077331543, "global_step": 311812, "epoch": 3756} {"train_loss": -25.9606990814209, "global_step": 311813, "epoch": 3756} {"train_loss": -25.777395248413086, "global_step": 311814, "epoch": 3756} {"train_loss": -25.829410552978516, "global_step": 311815, "epoch": 3756} {"train_loss": -25.7236328125, "global_step": 311816, "epoch": 3756} {"train_loss": -25.89251136779785, "global_step": 311817, "epoch": 3756} {"train_loss": -25.95624351501465, "global_step": 311818, "epoch": 3756} {"train_loss": -26.012252807617188, "global_step": 311819, "epoch": 3756} {"train_loss": -25.845605850219727, "global_step": 311820, "epoch": 3756} {"train_loss": -26.098814010620117, "global_step": 311821, "epoch": 3756} {"train_loss": -25.69021987915039, "global_step": 311822, "epoch": 3756} {"train_loss": -26.110334396362305, "global_step": 311823, "epoch": 3756} {"train_loss": -25.9846248626709, "global_step": 311824, "epoch": 3756} {"train_loss": -25.628387451171875, "global_step": 311825, "epoch": 3756} {"train_loss": -25.92758560180664, "global_step": 311826, "epoch": 3756} {"train_loss": -26.012882232666016, "global_step": 311827, "epoch": 3756} {"train_loss": -26.171295166015625, "global_step": 311828, "epoch": 3756} {"train_loss": -26.02864646911621, "global_step": 311829, "epoch": 3756} {"train_loss": -25.67358805185341, "global_step": 311830, "epoch": 3756, "val_loss": 7181902.0} {"train_loss": -24.983144760131836, "global_step": 311831, "epoch": 3757} {"train_loss": -26.04664421081543, "global_step": 311832, "epoch": 3757} {"train_loss": -25.640872955322266, "global_step": 311833, "epoch": 3757} {"train_loss": -25.349475860595703, "global_step": 311834, "epoch": 3757} {"train_loss": -25.187307357788086, "global_step": 311835, "epoch": 3757} {"train_loss": -25.172706604003906, "global_step": 311836, "epoch": 3757} {"train_loss": -25.397645950317383, "global_step": 311837, "epoch": 3757} {"train_loss": -25.331584930419922, "global_step": 311838, "epoch": 3757} {"train_loss": -25.719751358032227, "global_step": 311839, "epoch": 3757} {"train_loss": -25.893726348876953, "global_step": 311840, "epoch": 3757} {"train_loss": -25.499256134033203, "global_step": 311841, "epoch": 3757} {"train_loss": -25.389554977416992, "global_step": 311842, "epoch": 3757} {"train_loss": -25.569852828979492, "global_step": 311843, "epoch": 3757} {"train_loss": -25.6789608001709, "global_step": 311844, "epoch": 3757} {"train_loss": -25.329753875732422, "global_step": 311845, "epoch": 3757} {"train_loss": -25.634658813476562, "global_step": 311846, "epoch": 3757} {"train_loss": -25.57745933532715, "global_step": 311847, "epoch": 3757} {"train_loss": -25.472684860229492, "global_step": 311848, "epoch": 3757} {"train_loss": -25.859899520874023, "global_step": 311849, "epoch": 3757} {"train_loss": -25.760974884033203, "global_step": 311850, "epoch": 3757} {"train_loss": -25.75270652770996, "global_step": 311851, "epoch": 3757} {"train_loss": -25.922149658203125, "global_step": 311852, "epoch": 3757} {"train_loss": -25.538877487182617, "global_step": 311853, "epoch": 3757} {"train_loss": -25.81601333618164, "global_step": 311854, "epoch": 3757} {"train_loss": -26.00274085998535, "global_step": 311855, "epoch": 3757} {"train_loss": -25.552946090698242, "global_step": 311856, "epoch": 3757} {"train_loss": -25.732641220092773, "global_step": 311857, "epoch": 3757} {"train_loss": -25.622207641601562, "global_step": 311858, "epoch": 3757} {"train_loss": -25.777502059936523, "global_step": 311859, "epoch": 3757} {"train_loss": -25.66619873046875, "global_step": 311860, "epoch": 3757} {"train_loss": -25.6700382232666, "global_step": 311861, "epoch": 3757} {"train_loss": -25.59394645690918, "global_step": 311862, "epoch": 3757} {"train_loss": -25.86492347717285, "global_step": 311863, "epoch": 3757} {"train_loss": -25.9078369140625, "global_step": 311864, "epoch": 3757} {"train_loss": -25.707311630249023, "global_step": 311865, "epoch": 3757} {"train_loss": -26.402301788330078, "global_step": 311866, "epoch": 3757} {"train_loss": -25.959827423095703, "global_step": 311867, "epoch": 3757} {"train_loss": -25.843713760375977, "global_step": 311868, "epoch": 3757} {"train_loss": -25.829328536987305, "global_step": 311869, "epoch": 3757} {"train_loss": -26.1617374420166, "global_step": 311870, "epoch": 3757} {"train_loss": -25.22157859802246, "global_step": 311871, "epoch": 3757} {"train_loss": -25.290639877319336, "global_step": 311872, "epoch": 3757} {"train_loss": -25.32547950744629, "global_step": 311873, "epoch": 3757} {"train_loss": -25.360776901245117, "global_step": 311874, "epoch": 3757} {"train_loss": -25.74947166442871, "global_step": 311875, "epoch": 3757} {"train_loss": -25.253023147583008, "global_step": 311876, "epoch": 3757} {"train_loss": -25.282073974609375, "global_step": 311877, "epoch": 3757} {"train_loss": -25.51666831970215, "global_step": 311878, "epoch": 3757} {"train_loss": -25.257516860961914, "global_step": 311879, "epoch": 3757} {"train_loss": -25.948205947875977, "global_step": 311880, "epoch": 3757} {"train_loss": -25.4731388092041, "global_step": 311881, "epoch": 3757} {"train_loss": -25.82663917541504, "global_step": 311882, "epoch": 3757} {"train_loss": -25.635787963867188, "global_step": 311883, "epoch": 3757} {"train_loss": -25.9160099029541, "global_step": 311884, "epoch": 3757} {"train_loss": -25.848230361938477, "global_step": 311885, "epoch": 3757} {"train_loss": -25.51114845275879, "global_step": 311886, "epoch": 3757} {"train_loss": -25.852359771728516, "global_step": 311887, "epoch": 3757} {"train_loss": -26.027585983276367, "global_step": 311888, "epoch": 3757} {"train_loss": -26.03838539123535, "global_step": 311889, "epoch": 3757} {"train_loss": -25.996871948242188, "global_step": 311890, "epoch": 3757} {"train_loss": -25.7586612701416, "global_step": 311891, "epoch": 3757} {"train_loss": -25.51827049255371, "global_step": 311892, "epoch": 3757} {"train_loss": -25.922605514526367, "global_step": 311893, "epoch": 3757} {"train_loss": -25.881505966186523, "global_step": 311894, "epoch": 3757} {"train_loss": -25.6187801361084, "global_step": 311895, "epoch": 3757} {"train_loss": -25.862401962280273, "global_step": 311896, "epoch": 3757} {"train_loss": -25.9594783782959, "global_step": 311897, "epoch": 3757} {"train_loss": -25.859785079956055, "global_step": 311898, "epoch": 3757} {"train_loss": -25.901540756225586, "global_step": 311899, "epoch": 3757} {"train_loss": -25.949695587158203, "global_step": 311900, "epoch": 3757} {"train_loss": -25.717863082885742, "global_step": 311901, "epoch": 3757} {"train_loss": -25.680301666259766, "global_step": 311902, "epoch": 3757} {"train_loss": -25.71842384338379, "global_step": 311903, "epoch": 3757} {"train_loss": -25.633691787719727, "global_step": 311904, "epoch": 3757} {"train_loss": -25.66521644592285, "global_step": 311905, "epoch": 3757} {"train_loss": -25.561912536621094, "global_step": 311906, "epoch": 3757} {"train_loss": -25.63862419128418, "global_step": 311907, "epoch": 3757} {"train_loss": -25.4572696685791, "global_step": 311908, "epoch": 3757} {"train_loss": -26.107221603393555, "global_step": 311909, "epoch": 3757} {"train_loss": -25.61457633972168, "global_step": 311910, "epoch": 3757} {"train_loss": -25.84132194519043, "global_step": 311911, "epoch": 3757} {"train_loss": -25.736923217773438, "global_step": 311912, "epoch": 3757} {"train_loss": -25.68180934492364, "global_step": 311913, "epoch": 3757, "val_loss": 7266321.0} {"train_loss": -25.936811447143555, "global_step": 311914, "epoch": 3758} {"train_loss": -25.350418090820312, "global_step": 311915, "epoch": 3758} {"train_loss": -25.496225357055664, "global_step": 311916, "epoch": 3758} {"train_loss": -25.544574737548828, "global_step": 311917, "epoch": 3758} {"train_loss": -25.80695152282715, "global_step": 311918, "epoch": 3758} {"train_loss": -25.3295841217041, "global_step": 311919, "epoch": 3758} {"train_loss": -25.767410278320312, "global_step": 311920, "epoch": 3758} {"train_loss": -25.347238540649414, "global_step": 311921, "epoch": 3758} {"train_loss": -25.649127960205078, "global_step": 311922, "epoch": 3758} {"train_loss": -25.373567581176758, "global_step": 311923, "epoch": 3758} {"train_loss": -25.325790405273438, "global_step": 311924, "epoch": 3758} {"train_loss": -25.81306266784668, "global_step": 311925, "epoch": 3758} {"train_loss": -25.90589714050293, "global_step": 311926, "epoch": 3758} {"train_loss": -25.212554931640625, "global_step": 311927, "epoch": 3758} {"train_loss": -25.23628807067871, "global_step": 311928, "epoch": 3758} {"train_loss": -25.262592315673828, "global_step": 311929, "epoch": 3758} {"train_loss": -25.50702476501465, "global_step": 311930, "epoch": 3758} {"train_loss": -25.40389060974121, "global_step": 311931, "epoch": 3758} {"train_loss": -25.506601333618164, "global_step": 311932, "epoch": 3758} {"train_loss": -25.770526885986328, "global_step": 311933, "epoch": 3758} {"train_loss": -25.882476806640625, "global_step": 311934, "epoch": 3758} {"train_loss": -25.85896110534668, "global_step": 311935, "epoch": 3758} {"train_loss": -25.555500030517578, "global_step": 311936, "epoch": 3758} {"train_loss": -25.650867462158203, "global_step": 311937, "epoch": 3758} {"train_loss": -25.30093765258789, "global_step": 311938, "epoch": 3758} {"train_loss": -25.71408462524414, "global_step": 311939, "epoch": 3758} {"train_loss": -26.04034423828125, "global_step": 311940, "epoch": 3758} {"train_loss": -26.039264678955078, "global_step": 311941, "epoch": 3758} {"train_loss": -25.74191665649414, "global_step": 311942, "epoch": 3758} {"train_loss": -25.783227920532227, "global_step": 311943, "epoch": 3758} {"train_loss": -25.962116241455078, "global_step": 311944, "epoch": 3758} {"train_loss": -26.120712280273438, "global_step": 311945, "epoch": 3758} {"train_loss": -26.006616592407227, "global_step": 311946, "epoch": 3758} {"train_loss": -25.7266788482666, "global_step": 311947, "epoch": 3758} {"train_loss": -26.002079010009766, "global_step": 311948, "epoch": 3758} {"train_loss": -25.677032470703125, "global_step": 311949, "epoch": 3758} {"train_loss": -25.93048095703125, "global_step": 311950, "epoch": 3758} {"train_loss": -25.840240478515625, "global_step": 311951, "epoch": 3758} {"train_loss": -25.850433349609375, "global_step": 311952, "epoch": 3758} {"train_loss": -25.955862045288086, "global_step": 311953, "epoch": 3758} {"train_loss": -25.83064079284668, "global_step": 311954, "epoch": 3758} {"train_loss": -25.960113525390625, "global_step": 311955, "epoch": 3758} {"train_loss": -25.77117919921875, "global_step": 311956, "epoch": 3758} {"train_loss": -25.853193283081055, "global_step": 311957, "epoch": 3758} {"train_loss": -26.263952255249023, "global_step": 311958, "epoch": 3758} {"train_loss": -26.00715446472168, "global_step": 311959, "epoch": 3758} {"train_loss": -25.68172264099121, "global_step": 311960, "epoch": 3758} {"train_loss": -25.767318725585938, "global_step": 311961, "epoch": 3758} {"train_loss": -25.475770950317383, "global_step": 311962, "epoch": 3758} {"train_loss": -25.932275772094727, "global_step": 311963, "epoch": 3758} {"train_loss": -25.824228286743164, "global_step": 311964, "epoch": 3758} {"train_loss": -25.770999908447266, "global_step": 311965, "epoch": 3758} {"train_loss": -25.74904441833496, "global_step": 311966, "epoch": 3758} {"train_loss": -25.083759307861328, "global_step": 311967, "epoch": 3758} {"train_loss": -24.824981689453125, "global_step": 311968, "epoch": 3758} {"train_loss": -25.34761619567871, "global_step": 311969, "epoch": 3758} {"train_loss": -25.628223419189453, "global_step": 311970, "epoch": 3758} {"train_loss": -25.967483520507812, "global_step": 311971, "epoch": 3758} {"train_loss": -25.573606491088867, "global_step": 311972, "epoch": 3758} {"train_loss": -25.443557739257812, "global_step": 311973, "epoch": 3758} {"train_loss": -25.862232208251953, "global_step": 311974, "epoch": 3758} {"train_loss": -25.66216468811035, "global_step": 311975, "epoch": 3758} {"train_loss": -25.524871826171875, "global_step": 311976, "epoch": 3758} {"train_loss": -25.931262969970703, "global_step": 311977, "epoch": 3758} {"train_loss": -25.337894439697266, "global_step": 311978, "epoch": 3758} {"train_loss": -25.237873077392578, "global_step": 311979, "epoch": 3758} {"train_loss": -25.494308471679688, "global_step": 311980, "epoch": 3758} {"train_loss": -25.840045928955078, "global_step": 311981, "epoch": 3758} {"train_loss": -26.020360946655273, "global_step": 311982, "epoch": 3758} {"train_loss": -25.73395347595215, "global_step": 311983, "epoch": 3758} {"train_loss": -25.644567489624023, "global_step": 311984, "epoch": 3758} {"train_loss": -25.753278732299805, "global_step": 311985, "epoch": 3758} {"train_loss": -25.694528579711914, "global_step": 311986, "epoch": 3758} {"train_loss": -26.201080322265625, "global_step": 311987, "epoch": 3758} {"train_loss": -25.7227840423584, "global_step": 311988, "epoch": 3758} {"train_loss": -25.97950553894043, "global_step": 311989, "epoch": 3758} {"train_loss": -25.618627548217773, "global_step": 311990, "epoch": 3758} {"train_loss": -25.690214157104492, "global_step": 311991, "epoch": 3758} {"train_loss": -25.703872680664062, "global_step": 311992, "epoch": 3758} {"train_loss": -25.386905670166016, "global_step": 311993, "epoch": 3758} {"train_loss": -25.6238956451416, "global_step": 311994, "epoch": 3758} {"train_loss": -26.46839714050293, "global_step": 311995, "epoch": 3758} {"train_loss": -25.685240021671156, "global_step": 311996, "epoch": 3758, "val_loss": 7122173.0} {"train_loss": -25.624998092651367, "global_step": 311997, "epoch": 3759} {"train_loss": -25.63044548034668, "global_step": 311998, "epoch": 3759} {"train_loss": -25.392261505126953, "global_step": 311999, "epoch": 3759} {"train_loss": -25.052698135375977, "global_step": 312000, "epoch": 3759} {"train_loss": -25.572120666503906, "global_step": 312001, "epoch": 3759} {"train_loss": -25.313344955444336, "global_step": 312002, "epoch": 3759} {"train_loss": -25.32069206237793, "global_step": 312003, "epoch": 3759} {"train_loss": -25.386024475097656, "global_step": 312004, "epoch": 3759} {"train_loss": -25.127134323120117, "global_step": 312005, "epoch": 3759} {"train_loss": -25.1834716796875, "global_step": 312006, "epoch": 3759} {"train_loss": -25.52326774597168, "global_step": 312007, "epoch": 3759} {"train_loss": -25.45794105529785, "global_step": 312008, "epoch": 3759} {"train_loss": -25.589975357055664, "global_step": 312009, "epoch": 3759} {"train_loss": -25.473064422607422, "global_step": 312010, "epoch": 3759} {"train_loss": -25.988630294799805, "global_step": 312011, "epoch": 3759} {"train_loss": -25.7216796875, "global_step": 312012, "epoch": 3759} {"train_loss": -25.614276885986328, "global_step": 312013, "epoch": 3759} {"train_loss": -25.765981674194336, "global_step": 312014, "epoch": 3759} {"train_loss": -25.93194007873535, "global_step": 312015, "epoch": 3759} {"train_loss": -25.550642013549805, "global_step": 312016, "epoch": 3759} {"train_loss": -25.7387752532959, "global_step": 312017, "epoch": 3759} {"train_loss": -25.456501007080078, "global_step": 312018, "epoch": 3759} {"train_loss": -25.457332611083984, "global_step": 312019, "epoch": 3759} {"train_loss": -25.86471939086914, "global_step": 312020, "epoch": 3759} {"train_loss": -25.7801513671875, "global_step": 312021, "epoch": 3759} {"train_loss": -25.56395149230957, "global_step": 312022, "epoch": 3759} {"train_loss": -25.867828369140625, "global_step": 312023, "epoch": 3759} {"train_loss": -25.897510528564453, "global_step": 312024, "epoch": 3759} {"train_loss": -25.70542335510254, "global_step": 312025, "epoch": 3759} {"train_loss": -25.597339630126953, "global_step": 312026, "epoch": 3759} {"train_loss": -25.61847496032715, "global_step": 312027, "epoch": 3759} {"train_loss": -25.7253360748291, "global_step": 312028, "epoch": 3759} {"train_loss": -25.713315963745117, "global_step": 312029, "epoch": 3759} {"train_loss": -25.9219970703125, "global_step": 312030, "epoch": 3759} {"train_loss": -25.666000366210938, "global_step": 312031, "epoch": 3759} {"train_loss": -25.890729904174805, "global_step": 312032, "epoch": 3759} {"train_loss": -25.898548126220703, "global_step": 312033, "epoch": 3759} {"train_loss": -25.818134307861328, "global_step": 312034, "epoch": 3759} {"train_loss": -25.641504287719727, "global_step": 312035, "epoch": 3759} {"train_loss": -25.84220314025879, "global_step": 312036, "epoch": 3759} {"train_loss": -26.032384872436523, "global_step": 312037, "epoch": 3759} {"train_loss": -26.038633346557617, "global_step": 312038, "epoch": 3759} {"train_loss": -25.847888946533203, "global_step": 312039, "epoch": 3759} {"train_loss": -25.77094078063965, "global_step": 312040, "epoch": 3759} {"train_loss": -25.81760597229004, "global_step": 312041, "epoch": 3759} {"train_loss": -25.440906524658203, "global_step": 312042, "epoch": 3759} {"train_loss": -25.67679214477539, "global_step": 312043, "epoch": 3759} {"train_loss": -25.657079696655273, "global_step": 312044, "epoch": 3759} {"train_loss": -25.866697311401367, "global_step": 312045, "epoch": 3759} {"train_loss": -25.977252960205078, "global_step": 312046, "epoch": 3759} {"train_loss": -25.315444946289062, "global_step": 312047, "epoch": 3759} {"train_loss": -25.927396774291992, "global_step": 312048, "epoch": 3759} {"train_loss": -26.097183227539062, "global_step": 312049, "epoch": 3759} {"train_loss": -25.511831283569336, "global_step": 312050, "epoch": 3759} {"train_loss": -25.86799430847168, "global_step": 312051, "epoch": 3759} {"train_loss": -25.779626846313477, "global_step": 312052, "epoch": 3759} {"train_loss": -25.502578735351562, "global_step": 312053, "epoch": 3759} {"train_loss": -25.922224044799805, "global_step": 312054, "epoch": 3759} {"train_loss": -26.1440372467041, "global_step": 312055, "epoch": 3759} {"train_loss": -26.08575439453125, "global_step": 312056, "epoch": 3759} {"train_loss": -25.804162979125977, "global_step": 312057, "epoch": 3759} {"train_loss": -26.08835220336914, "global_step": 312058, "epoch": 3759} {"train_loss": -26.2707462310791, "global_step": 312059, "epoch": 3759} {"train_loss": -25.73105812072754, "global_step": 312060, "epoch": 3759} {"train_loss": -25.977375030517578, "global_step": 312061, "epoch": 3759} {"train_loss": -26.238727569580078, "global_step": 312062, "epoch": 3759} {"train_loss": -25.86821937561035, "global_step": 312063, "epoch": 3759} {"train_loss": -26.123014450073242, "global_step": 312064, "epoch": 3759} {"train_loss": -26.075342178344727, "global_step": 312065, "epoch": 3759} {"train_loss": -25.861108779907227, "global_step": 312066, "epoch": 3759} {"train_loss": -25.946317672729492, "global_step": 312067, "epoch": 3759} {"train_loss": -25.859670639038086, "global_step": 312068, "epoch": 3759} {"train_loss": -25.62619400024414, "global_step": 312069, "epoch": 3759} {"train_loss": -25.767568588256836, "global_step": 312070, "epoch": 3759} {"train_loss": -25.650861740112305, "global_step": 312071, "epoch": 3759} {"train_loss": -26.024723052978516, "global_step": 312072, "epoch": 3759} {"train_loss": -25.85394859313965, "global_step": 312073, "epoch": 3759} {"train_loss": -25.81402587890625, "global_step": 312074, "epoch": 3759} {"train_loss": -25.553537368774414, "global_step": 312075, "epoch": 3759} {"train_loss": -25.893396377563477, "global_step": 312076, "epoch": 3759} {"train_loss": -25.918970108032227, "global_step": 312077, "epoch": 3759} {"train_loss": -26.028024673461914, "global_step": 312078, "epoch": 3759} {"train_loss": -25.738089044410064, "global_step": 312079, "epoch": 3759, "val_loss": 7321868.5} {"train_loss": -25.32389259338379, "global_step": 312080, "epoch": 3760} {"train_loss": -25.648334503173828, "global_step": 312081, "epoch": 3760} {"train_loss": -25.214780807495117, "global_step": 312082, "epoch": 3760} {"train_loss": -25.1055908203125, "global_step": 312083, "epoch": 3760} {"train_loss": -25.373680114746094, "global_step": 312084, "epoch": 3760} {"train_loss": -25.152761459350586, "global_step": 312085, "epoch": 3760} {"train_loss": -25.248672485351562, "global_step": 312086, "epoch": 3760} {"train_loss": -25.429115295410156, "global_step": 312087, "epoch": 3760} {"train_loss": -25.159399032592773, "global_step": 312088, "epoch": 3760} {"train_loss": -25.487192153930664, "global_step": 312089, "epoch": 3760} {"train_loss": -25.7439022064209, "global_step": 312090, "epoch": 3760} {"train_loss": -25.542638778686523, "global_step": 312091, "epoch": 3760} {"train_loss": -25.740991592407227, "global_step": 312092, "epoch": 3760} {"train_loss": -25.044713973999023, "global_step": 312093, "epoch": 3760} {"train_loss": -25.678674697875977, "global_step": 312094, "epoch": 3760} {"train_loss": -25.50689125061035, "global_step": 312095, "epoch": 3760} {"train_loss": -25.329914093017578, "global_step": 312096, "epoch": 3760} {"train_loss": -25.506986618041992, "global_step": 312097, "epoch": 3760} {"train_loss": -25.8044490814209, "global_step": 312098, "epoch": 3760} {"train_loss": -25.461084365844727, "global_step": 312099, "epoch": 3760} {"train_loss": -25.85845375061035, "global_step": 312100, "epoch": 3760} {"train_loss": -25.9713077545166, "global_step": 312101, "epoch": 3760} {"train_loss": -25.54279136657715, "global_step": 312102, "epoch": 3760} {"train_loss": -25.57181167602539, "global_step": 312103, "epoch": 3760} {"train_loss": -25.481048583984375, "global_step": 312104, "epoch": 3760} {"train_loss": -25.6767520904541, "global_step": 312105, "epoch": 3760} {"train_loss": -25.575458526611328, "global_step": 312106, "epoch": 3760} {"train_loss": -25.66851234436035, "global_step": 312107, "epoch": 3760} {"train_loss": -26.036558151245117, "global_step": 312108, "epoch": 3760} {"train_loss": -25.734344482421875, "global_step": 312109, "epoch": 3760} {"train_loss": -25.42558479309082, "global_step": 312110, "epoch": 3760} {"train_loss": -25.845773696899414, "global_step": 312111, "epoch": 3760} {"train_loss": -25.868146896362305, "global_step": 312112, "epoch": 3760} {"train_loss": -25.806989669799805, "global_step": 312113, "epoch": 3760} {"train_loss": -25.93228530883789, "global_step": 312114, "epoch": 3760} {"train_loss": -25.943836212158203, "global_step": 312115, "epoch": 3760} {"train_loss": -25.924997329711914, "global_step": 312116, "epoch": 3760} {"train_loss": -25.67609214782715, "global_step": 312117, "epoch": 3760} {"train_loss": -25.802988052368164, "global_step": 312118, "epoch": 3760} {"train_loss": -25.513647079467773, "global_step": 312119, "epoch": 3760} {"train_loss": -25.9381160736084, "global_step": 312120, "epoch": 3760} {"train_loss": -25.369131088256836, "global_step": 312121, "epoch": 3760} {"train_loss": -25.09208869934082, "global_step": 312122, "epoch": 3760} {"train_loss": -24.969114303588867, "global_step": 312123, "epoch": 3760} {"train_loss": -25.37038230895996, "global_step": 312124, "epoch": 3760} {"train_loss": -25.504911422729492, "global_step": 312125, "epoch": 3760} {"train_loss": -25.8703670501709, "global_step": 312126, "epoch": 3760} {"train_loss": -25.695032119750977, "global_step": 312127, "epoch": 3760} {"train_loss": -25.520124435424805, "global_step": 312128, "epoch": 3760} {"train_loss": -26.006580352783203, "global_step": 312129, "epoch": 3760} {"train_loss": -25.97759437561035, "global_step": 312130, "epoch": 3760} {"train_loss": -25.497488021850586, "global_step": 312131, "epoch": 3760} {"train_loss": -25.635883331298828, "global_step": 312132, "epoch": 3760} {"train_loss": -25.830093383789062, "global_step": 312133, "epoch": 3760} {"train_loss": -26.242996215820312, "global_step": 312134, "epoch": 3760} {"train_loss": -25.677322387695312, "global_step": 312135, "epoch": 3760} {"train_loss": -26.02143669128418, "global_step": 312136, "epoch": 3760} {"train_loss": -25.849164962768555, "global_step": 312137, "epoch": 3760} {"train_loss": -25.54132652282715, "global_step": 312138, "epoch": 3760} {"train_loss": -26.15435218811035, "global_step": 312139, "epoch": 3760} {"train_loss": -25.89716148376465, "global_step": 312140, "epoch": 3760} {"train_loss": -25.82086753845215, "global_step": 312141, "epoch": 3760} {"train_loss": -26.16261100769043, "global_step": 312142, "epoch": 3760} {"train_loss": -26.181203842163086, "global_step": 312143, "epoch": 3760} {"train_loss": -25.816877365112305, "global_step": 312144, "epoch": 3760} {"train_loss": -25.921466827392578, "global_step": 312145, "epoch": 3760} {"train_loss": -25.882299423217773, "global_step": 312146, "epoch": 3760} {"train_loss": -25.579322814941406, "global_step": 312147, "epoch": 3760} {"train_loss": -26.10333824157715, "global_step": 312148, "epoch": 3760} {"train_loss": -25.825735092163086, "global_step": 312149, "epoch": 3760} {"train_loss": -25.409868240356445, "global_step": 312150, "epoch": 3760} {"train_loss": -25.88003921508789, "global_step": 312151, "epoch": 3760} {"train_loss": -25.856069564819336, "global_step": 312152, "epoch": 3760} {"train_loss": -25.581892013549805, "global_step": 312153, "epoch": 3760} {"train_loss": -26.006711959838867, "global_step": 312154, "epoch": 3760} {"train_loss": -25.76932144165039, "global_step": 312155, "epoch": 3760} {"train_loss": -25.963483810424805, "global_step": 312156, "epoch": 3760} {"train_loss": -25.764175415039062, "global_step": 312157, "epoch": 3760} {"train_loss": -25.719640731811523, "global_step": 312158, "epoch": 3760} {"train_loss": -25.660131454467773, "global_step": 312159, "epoch": 3760} {"train_loss": -25.7563533782959, "global_step": 312160, "epoch": 3760} {"train_loss": -25.807174682617188, "global_step": 312161, "epoch": 3760} {"train_loss": -25.665340998086585, "global_step": 312162, "epoch": 3760, "val_loss": 7332818.0} {"train_loss": -24.686826705932617, "global_step": 312163, "epoch": 3761} {"train_loss": -24.949060440063477, "global_step": 312164, "epoch": 3761} {"train_loss": -25.11771583557129, "global_step": 312165, "epoch": 3761} {"train_loss": -24.96160888671875, "global_step": 312166, "epoch": 3761} {"train_loss": -25.583703994750977, "global_step": 312167, "epoch": 3761} {"train_loss": -25.09785270690918, "global_step": 312168, "epoch": 3761} {"train_loss": -25.446971893310547, "global_step": 312169, "epoch": 3761} {"train_loss": -25.41503143310547, "global_step": 312170, "epoch": 3761} {"train_loss": -25.849185943603516, "global_step": 312171, "epoch": 3761} {"train_loss": -25.255340576171875, "global_step": 312172, "epoch": 3761} {"train_loss": -25.08539581298828, "global_step": 312173, "epoch": 3761} {"train_loss": -25.353363037109375, "global_step": 312174, "epoch": 3761} {"train_loss": -25.197935104370117, "global_step": 312175, "epoch": 3761} {"train_loss": -25.416879653930664, "global_step": 312176, "epoch": 3761} {"train_loss": -25.416763305664062, "global_step": 312177, "epoch": 3761} {"train_loss": -25.50335121154785, "global_step": 312178, "epoch": 3761} {"train_loss": -25.552444458007812, "global_step": 312179, "epoch": 3761} {"train_loss": -25.52854347229004, "global_step": 312180, "epoch": 3761} {"train_loss": -25.713903427124023, "global_step": 312181, "epoch": 3761} {"train_loss": -25.459300994873047, "global_step": 312182, "epoch": 3761} {"train_loss": -25.611059188842773, "global_step": 312183, "epoch": 3761} {"train_loss": -25.57002830505371, "global_step": 312184, "epoch": 3761} {"train_loss": -25.66941261291504, "global_step": 312185, "epoch": 3761} {"train_loss": -25.930999755859375, "global_step": 312186, "epoch": 3761} {"train_loss": -26.07035255432129, "global_step": 312187, "epoch": 3761} {"train_loss": -25.753690719604492, "global_step": 312188, "epoch": 3761} {"train_loss": -25.608386993408203, "global_step": 312189, "epoch": 3761} {"train_loss": -25.9183292388916, "global_step": 312190, "epoch": 3761} {"train_loss": -25.9296817779541, "global_step": 312191, "epoch": 3761} {"train_loss": -25.49578857421875, "global_step": 312192, "epoch": 3761} {"train_loss": -25.935651779174805, "global_step": 312193, "epoch": 3761} {"train_loss": -25.86378288269043, "global_step": 312194, "epoch": 3761} {"train_loss": -25.736083984375, "global_step": 312195, "epoch": 3761} {"train_loss": -25.906158447265625, "global_step": 312196, "epoch": 3761} {"train_loss": -25.670743942260742, "global_step": 312197, "epoch": 3761} {"train_loss": -25.75262451171875, "global_step": 312198, "epoch": 3761} {"train_loss": -25.8546142578125, "global_step": 312199, "epoch": 3761} {"train_loss": -25.863767623901367, "global_step": 312200, "epoch": 3761} {"train_loss": -26.15266227722168, "global_step": 312201, "epoch": 3761} {"train_loss": -25.930084228515625, "global_step": 312202, "epoch": 3761} {"train_loss": -26.014081954956055, "global_step": 312203, "epoch": 3761} {"train_loss": -25.674488067626953, "global_step": 312204, "epoch": 3761} {"train_loss": -25.271757125854492, "global_step": 312205, "epoch": 3761} {"train_loss": -25.972753524780273, "global_step": 312206, "epoch": 3761} {"train_loss": -25.375404357910156, "global_step": 312207, "epoch": 3761} {"train_loss": -25.714929580688477, "global_step": 312208, "epoch": 3761} {"train_loss": -25.870996475219727, "global_step": 312209, "epoch": 3761} {"train_loss": -26.054040908813477, "global_step": 312210, "epoch": 3761} {"train_loss": -25.49092674255371, "global_step": 312211, "epoch": 3761} {"train_loss": -25.402950286865234, "global_step": 312212, "epoch": 3761} {"train_loss": -25.270721435546875, "global_step": 312213, "epoch": 3761} {"train_loss": -25.445301055908203, "global_step": 312214, "epoch": 3761} {"train_loss": -25.52146339416504, "global_step": 312215, "epoch": 3761} {"train_loss": -25.483470916748047, "global_step": 312216, "epoch": 3761} {"train_loss": -25.36568260192871, "global_step": 312217, "epoch": 3761} {"train_loss": -25.381860733032227, "global_step": 312218, "epoch": 3761} {"train_loss": -25.131681442260742, "global_step": 312219, "epoch": 3761} {"train_loss": -25.037036895751953, "global_step": 312220, "epoch": 3761} {"train_loss": -25.900217056274414, "global_step": 312221, "epoch": 3761} {"train_loss": -25.09022331237793, "global_step": 312222, "epoch": 3761} {"train_loss": -25.27211570739746, "global_step": 312223, "epoch": 3761} {"train_loss": -25.37619972229004, "global_step": 312224, "epoch": 3761} {"train_loss": -25.969329833984375, "global_step": 312225, "epoch": 3761} {"train_loss": -25.563283920288086, "global_step": 312226, "epoch": 3761} {"train_loss": -25.707014083862305, "global_step": 312227, "epoch": 3761} {"train_loss": -25.480796813964844, "global_step": 312228, "epoch": 3761} {"train_loss": -25.750314712524414, "global_step": 312229, "epoch": 3761} {"train_loss": -25.914106369018555, "global_step": 312230, "epoch": 3761} {"train_loss": -25.281349182128906, "global_step": 312231, "epoch": 3761} {"train_loss": -25.630399703979492, "global_step": 312232, "epoch": 3761} {"train_loss": -25.645044326782227, "global_step": 312233, "epoch": 3761} {"train_loss": -25.412145614624023, "global_step": 312234, "epoch": 3761} {"train_loss": -25.936853408813477, "global_step": 312235, "epoch": 3761} {"train_loss": -25.708913803100586, "global_step": 312236, "epoch": 3761} {"train_loss": -25.573162078857422, "global_step": 312237, "epoch": 3761} {"train_loss": -25.823974609375, "global_step": 312238, "epoch": 3761} {"train_loss": -25.963764190673828, "global_step": 312239, "epoch": 3761} {"train_loss": -25.942358016967773, "global_step": 312240, "epoch": 3761} {"train_loss": -25.960859298706055, "global_step": 312241, "epoch": 3761} {"train_loss": -25.902790069580078, "global_step": 312242, "epoch": 3761} {"train_loss": -25.886199951171875, "global_step": 312243, "epoch": 3761} {"train_loss": -25.7152156829834, "global_step": 312244, "epoch": 3761} {"train_loss": -25.60382801653391, "global_step": 312245, "epoch": 3761, "val_loss": 7233875.0} {"train_loss": -25.21173858642578, "global_step": 312246, "epoch": 3762} {"train_loss": -25.401729583740234, "global_step": 312247, "epoch": 3762} {"train_loss": -25.560720443725586, "global_step": 312248, "epoch": 3762} {"train_loss": -25.932886123657227, "global_step": 312249, "epoch": 3762} {"train_loss": -25.9047794342041, "global_step": 312250, "epoch": 3762} {"train_loss": -25.419511795043945, "global_step": 312251, "epoch": 3762} {"train_loss": -25.481266021728516, "global_step": 312252, "epoch": 3762} {"train_loss": -25.108509063720703, "global_step": 312253, "epoch": 3762} {"train_loss": -25.640470504760742, "global_step": 312254, "epoch": 3762} {"train_loss": -25.933332443237305, "global_step": 312255, "epoch": 3762} {"train_loss": -25.938373565673828, "global_step": 312256, "epoch": 3762} {"train_loss": -25.6821231842041, "global_step": 312257, "epoch": 3762} {"train_loss": -25.919830322265625, "global_step": 312258, "epoch": 3762} {"train_loss": -25.539087295532227, "global_step": 312259, "epoch": 3762} {"train_loss": -25.952436447143555, "global_step": 312260, "epoch": 3762} {"train_loss": -25.73602294921875, "global_step": 312261, "epoch": 3762} {"train_loss": -25.774946212768555, "global_step": 312262, "epoch": 3762} {"train_loss": -26.062519073486328, "global_step": 312263, "epoch": 3762} {"train_loss": -26.232473373413086, "global_step": 312264, "epoch": 3762} {"train_loss": -25.721155166625977, "global_step": 312265, "epoch": 3762} {"train_loss": -25.88347816467285, "global_step": 312266, "epoch": 3762} {"train_loss": -25.873754501342773, "global_step": 312267, "epoch": 3762} {"train_loss": -25.91963005065918, "global_step": 312268, "epoch": 3762} {"train_loss": -25.802448272705078, "global_step": 312269, "epoch": 3762} {"train_loss": -25.775659561157227, "global_step": 312270, "epoch": 3762} {"train_loss": -25.807205200195312, "global_step": 312271, "epoch": 3762} {"train_loss": -25.723188400268555, "global_step": 312272, "epoch": 3762} {"train_loss": -25.672840118408203, "global_step": 312273, "epoch": 3762} {"train_loss": -25.99051856994629, "global_step": 312274, "epoch": 3762} {"train_loss": -26.180500030517578, "global_step": 312275, "epoch": 3762} {"train_loss": -26.36858558654785, "global_step": 312276, "epoch": 3762} {"train_loss": -25.72336769104004, "global_step": 312277, "epoch": 3762} {"train_loss": -25.994068145751953, "global_step": 312278, "epoch": 3762} {"train_loss": -25.75492286682129, "global_step": 312279, "epoch": 3762} {"train_loss": -26.019256591796875, "global_step": 312280, "epoch": 3762} {"train_loss": -26.045429229736328, "global_step": 312281, "epoch": 3762} {"train_loss": -25.653295516967773, "global_step": 312282, "epoch": 3762} {"train_loss": -25.96559715270996, "global_step": 312283, "epoch": 3762} {"train_loss": -26.103612899780273, "global_step": 312284, "epoch": 3762} {"train_loss": -25.83086585998535, "global_step": 312285, "epoch": 3762} {"train_loss": -25.922170639038086, "global_step": 312286, "epoch": 3762} {"train_loss": -25.95216178894043, "global_step": 312287, "epoch": 3762} {"train_loss": -25.815521240234375, "global_step": 312288, "epoch": 3762} {"train_loss": -26.031280517578125, "global_step": 312289, "epoch": 3762} {"train_loss": -25.65960693359375, "global_step": 312290, "epoch": 3762} {"train_loss": -25.873693466186523, "global_step": 312291, "epoch": 3762} {"train_loss": -25.84724998474121, "global_step": 312292, "epoch": 3762} {"train_loss": -25.292634963989258, "global_step": 312293, "epoch": 3762} {"train_loss": -25.839908599853516, "global_step": 312294, "epoch": 3762} {"train_loss": -24.929853439331055, "global_step": 312295, "epoch": 3762} {"train_loss": -25.176355361938477, "global_step": 312296, "epoch": 3762} {"train_loss": -25.387792587280273, "global_step": 312297, "epoch": 3762} {"train_loss": -25.183271408081055, "global_step": 312298, "epoch": 3762} {"train_loss": -25.005781173706055, "global_step": 312299, "epoch": 3762} {"train_loss": -25.441923141479492, "global_step": 312300, "epoch": 3762} {"train_loss": -25.842945098876953, "global_step": 312301, "epoch": 3762} {"train_loss": -25.633712768554688, "global_step": 312302, "epoch": 3762} {"train_loss": -25.430673599243164, "global_step": 312303, "epoch": 3762} {"train_loss": -25.90680503845215, "global_step": 312304, "epoch": 3762} {"train_loss": -25.33477210998535, "global_step": 312305, "epoch": 3762} {"train_loss": -25.496559143066406, "global_step": 312306, "epoch": 3762} {"train_loss": -25.512096405029297, "global_step": 312307, "epoch": 3762} {"train_loss": -25.640233993530273, "global_step": 312308, "epoch": 3762} {"train_loss": -25.281627655029297, "global_step": 312309, "epoch": 3762} {"train_loss": -25.709630966186523, "global_step": 312310, "epoch": 3762} {"train_loss": -25.450178146362305, "global_step": 312311, "epoch": 3762} {"train_loss": -25.790088653564453, "global_step": 312312, "epoch": 3762} {"train_loss": -25.332212448120117, "global_step": 312313, "epoch": 3762} {"train_loss": -25.935577392578125, "global_step": 312314, "epoch": 3762} {"train_loss": -25.891754150390625, "global_step": 312315, "epoch": 3762} {"train_loss": -25.259540557861328, "global_step": 312316, "epoch": 3762} {"train_loss": -25.351266860961914, "global_step": 312317, "epoch": 3762} {"train_loss": -25.334476470947266, "global_step": 312318, "epoch": 3762} {"train_loss": -25.19944190979004, "global_step": 312319, "epoch": 3762} {"train_loss": -25.86090660095215, "global_step": 312320, "epoch": 3762} {"train_loss": -25.496931076049805, "global_step": 312321, "epoch": 3762} {"train_loss": -25.407209396362305, "global_step": 312322, "epoch": 3762} {"train_loss": -25.379150390625, "global_step": 312323, "epoch": 3762} {"train_loss": -25.537527084350586, "global_step": 312324, "epoch": 3762} {"train_loss": -25.66432762145996, "global_step": 312325, "epoch": 3762} {"train_loss": -25.841779708862305, "global_step": 312326, "epoch": 3762} {"train_loss": -25.70100212097168, "global_step": 312327, "epoch": 3762} {"train_loss": -25.678697632019777, "global_step": 312328, "epoch": 3762, "val_loss": 7294131.0} {"train_loss": -25.329959869384766, "global_step": 312329, "epoch": 3763} {"train_loss": -25.369640350341797, "global_step": 312330, "epoch": 3763} {"train_loss": -25.527297973632812, "global_step": 312331, "epoch": 3763} {"train_loss": -25.660568237304688, "global_step": 312332, "epoch": 3763} {"train_loss": -25.881479263305664, "global_step": 312333, "epoch": 3763} {"train_loss": -25.451486587524414, "global_step": 312334, "epoch": 3763} {"train_loss": -25.739429473876953, "global_step": 312335, "epoch": 3763} {"train_loss": -26.044174194335938, "global_step": 312336, "epoch": 3763} {"train_loss": -25.577871322631836, "global_step": 312337, "epoch": 3763} {"train_loss": -25.666065216064453, "global_step": 312338, "epoch": 3763} {"train_loss": -25.538192749023438, "global_step": 312339, "epoch": 3763} {"train_loss": -25.559125900268555, "global_step": 312340, "epoch": 3763} {"train_loss": -25.865097045898438, "global_step": 312341, "epoch": 3763} {"train_loss": -25.915918350219727, "global_step": 312342, "epoch": 3763} {"train_loss": -25.76668357849121, "global_step": 312343, "epoch": 3763} {"train_loss": -25.6599178314209, "global_step": 312344, "epoch": 3763} {"train_loss": -25.309661865234375, "global_step": 312345, "epoch": 3763} {"train_loss": -25.6110897064209, "global_step": 312346, "epoch": 3763} {"train_loss": -25.704145431518555, "global_step": 312347, "epoch": 3763} {"train_loss": -25.77887535095215, "global_step": 312348, "epoch": 3763} {"train_loss": -25.80191993713379, "global_step": 312349, "epoch": 3763} {"train_loss": -25.802778244018555, "global_step": 312350, "epoch": 3763} {"train_loss": -26.18487548828125, "global_step": 312351, "epoch": 3763} {"train_loss": -25.961349487304688, "global_step": 312352, "epoch": 3763} {"train_loss": -25.608530044555664, "global_step": 312353, "epoch": 3763} {"train_loss": -25.34791374206543, "global_step": 312354, "epoch": 3763} {"train_loss": -26.082965850830078, "global_step": 312355, "epoch": 3763} {"train_loss": -25.59879493713379, "global_step": 312356, "epoch": 3763} {"train_loss": -25.82236671447754, "global_step": 312357, "epoch": 3763} {"train_loss": -25.83270835876465, "global_step": 312358, "epoch": 3763} {"train_loss": -26.288253784179688, "global_step": 312359, "epoch": 3763} {"train_loss": -25.600194931030273, "global_step": 312360, "epoch": 3763} {"train_loss": -25.747852325439453, "global_step": 312361, "epoch": 3763} {"train_loss": -25.602643966674805, "global_step": 312362, "epoch": 3763} {"train_loss": -26.002490997314453, "global_step": 312363, "epoch": 3763} {"train_loss": -25.754749298095703, "global_step": 312364, "epoch": 3763} {"train_loss": -26.267465591430664, "global_step": 312365, "epoch": 3763} {"train_loss": -26.2117977142334, "global_step": 312366, "epoch": 3763} {"train_loss": -25.62129020690918, "global_step": 312367, "epoch": 3763} {"train_loss": -25.966537475585938, "global_step": 312368, "epoch": 3763} {"train_loss": -25.98221206665039, "global_step": 312369, "epoch": 3763} {"train_loss": -25.662952423095703, "global_step": 312370, "epoch": 3763} {"train_loss": -25.54499626159668, "global_step": 312371, "epoch": 3763} {"train_loss": -26.14469337463379, "global_step": 312372, "epoch": 3763} {"train_loss": -25.856048583984375, "global_step": 312373, "epoch": 3763} {"train_loss": -25.991357803344727, "global_step": 312374, "epoch": 3763} {"train_loss": -25.962268829345703, "global_step": 312375, "epoch": 3763} {"train_loss": -26.30670166015625, "global_step": 312376, "epoch": 3763} {"train_loss": -26.053869247436523, "global_step": 312377, "epoch": 3763} {"train_loss": -25.775989532470703, "global_step": 312378, "epoch": 3763} {"train_loss": -26.2116756439209, "global_step": 312379, "epoch": 3763} {"train_loss": -25.81715202331543, "global_step": 312380, "epoch": 3763} {"train_loss": -25.73774528503418, "global_step": 312381, "epoch": 3763} {"train_loss": -25.810470581054688, "global_step": 312382, "epoch": 3763} {"train_loss": -25.76495361328125, "global_step": 312383, "epoch": 3763} {"train_loss": -25.5748233795166, "global_step": 312384, "epoch": 3763} {"train_loss": -25.83414649963379, "global_step": 312385, "epoch": 3763} {"train_loss": -25.810287475585938, "global_step": 312386, "epoch": 3763} {"train_loss": -26.09861183166504, "global_step": 312387, "epoch": 3763} {"train_loss": -25.534534454345703, "global_step": 312388, "epoch": 3763} {"train_loss": -26.08821678161621, "global_step": 312389, "epoch": 3763} {"train_loss": -26.0308837890625, "global_step": 312390, "epoch": 3763} {"train_loss": -25.843652725219727, "global_step": 312391, "epoch": 3763} {"train_loss": -25.88785171508789, "global_step": 312392, "epoch": 3763} {"train_loss": -25.707921981811523, "global_step": 312393, "epoch": 3763} {"train_loss": -26.18690299987793, "global_step": 312394, "epoch": 3763} {"train_loss": -25.97039794921875, "global_step": 312395, "epoch": 3763} {"train_loss": -25.757421493530273, "global_step": 312396, "epoch": 3763} {"train_loss": -26.282007217407227, "global_step": 312397, "epoch": 3763} {"train_loss": -26.2955265045166, "global_step": 312398, "epoch": 3763} {"train_loss": -25.56451416015625, "global_step": 312399, "epoch": 3763} {"train_loss": -25.928424835205078, "global_step": 312400, "epoch": 3763} {"train_loss": -26.254541397094727, "global_step": 312401, "epoch": 3763} {"train_loss": -25.833160400390625, "global_step": 312402, "epoch": 3763} {"train_loss": -25.939105987548828, "global_step": 312403, "epoch": 3763} {"train_loss": -25.81757164001465, "global_step": 312404, "epoch": 3763} {"train_loss": -25.865705490112305, "global_step": 312405, "epoch": 3763} {"train_loss": -25.557369232177734, "global_step": 312406, "epoch": 3763} {"train_loss": -25.616291046142578, "global_step": 312407, "epoch": 3763} {"train_loss": -25.859176635742188, "global_step": 312408, "epoch": 3763} {"train_loss": -26.0007381439209, "global_step": 312409, "epoch": 3763} {"train_loss": -25.62141990661621, "global_step": 312410, "epoch": 3763} {"train_loss": -25.831301769578314, "global_step": 312411, "epoch": 3763, "val_loss": 7239462.0} {"train_loss": -24.646718978881836, "global_step": 312412, "epoch": 3764} {"train_loss": -23.772043228149414, "global_step": 312413, "epoch": 3764} {"train_loss": -24.5119686126709, "global_step": 312414, "epoch": 3764} {"train_loss": -23.70351219177246, "global_step": 312415, "epoch": 3764} {"train_loss": -24.786930084228516, "global_step": 312416, "epoch": 3764} {"train_loss": -24.994964599609375, "global_step": 312417, "epoch": 3764} {"train_loss": -24.893157958984375, "global_step": 312418, "epoch": 3764} {"train_loss": -24.94736099243164, "global_step": 312419, "epoch": 3764} {"train_loss": -25.117177963256836, "global_step": 312420, "epoch": 3764} {"train_loss": -24.804441452026367, "global_step": 312421, "epoch": 3764} {"train_loss": -24.242218017578125, "global_step": 312422, "epoch": 3764} {"train_loss": -25.084814071655273, "global_step": 312423, "epoch": 3764} {"train_loss": -24.97628402709961, "global_step": 312424, "epoch": 3764} {"train_loss": -24.993515014648438, "global_step": 312425, "epoch": 3764} {"train_loss": -25.10413932800293, "global_step": 312426, "epoch": 3764} {"train_loss": -24.73129653930664, "global_step": 312427, "epoch": 3764} {"train_loss": -25.159671783447266, "global_step": 312428, "epoch": 3764} {"train_loss": -24.669626235961914, "global_step": 312429, "epoch": 3764} {"train_loss": -24.998029708862305, "global_step": 312430, "epoch": 3764} {"train_loss": -25.20319938659668, "global_step": 312431, "epoch": 3764} {"train_loss": -25.619129180908203, "global_step": 312432, "epoch": 3764} {"train_loss": -24.843204498291016, "global_step": 312433, "epoch": 3764} {"train_loss": -25.251956939697266, "global_step": 312434, "epoch": 3764} {"train_loss": -25.29950523376465, "global_step": 312435, "epoch": 3764} {"train_loss": -25.445819854736328, "global_step": 312436, "epoch": 3764} {"train_loss": -25.393640518188477, "global_step": 312437, "epoch": 3764} {"train_loss": -25.6318416595459, "global_step": 312438, "epoch": 3764} {"train_loss": -24.92992401123047, "global_step": 312439, "epoch": 3764} {"train_loss": -25.208663940429688, "global_step": 312440, "epoch": 3764} {"train_loss": -25.327404022216797, "global_step": 312441, "epoch": 3764} {"train_loss": -25.569042205810547, "global_step": 312442, "epoch": 3764} {"train_loss": -25.21123504638672, "global_step": 312443, "epoch": 3764} {"train_loss": -25.71992301940918, "global_step": 312444, "epoch": 3764} {"train_loss": -25.709875106811523, "global_step": 312445, "epoch": 3764} {"train_loss": -25.492298126220703, "global_step": 312446, "epoch": 3764} {"train_loss": -25.8106632232666, "global_step": 312447, "epoch": 3764} {"train_loss": -25.7007999420166, "global_step": 312448, "epoch": 3764} {"train_loss": -26.019742965698242, "global_step": 312449, "epoch": 3764} {"train_loss": -25.566659927368164, "global_step": 312450, "epoch": 3764} {"train_loss": -25.56796646118164, "global_step": 312451, "epoch": 3764} {"train_loss": -25.668628692626953, "global_step": 312452, "epoch": 3764} {"train_loss": -25.70100212097168, "global_step": 312453, "epoch": 3764} {"train_loss": -25.6594295501709, "global_step": 312454, "epoch": 3764} {"train_loss": -25.84796714782715, "global_step": 312455, "epoch": 3764} {"train_loss": -25.826452255249023, "global_step": 312456, "epoch": 3764} {"train_loss": -26.2659854888916, "global_step": 312457, "epoch": 3764} {"train_loss": -25.812314987182617, "global_step": 312458, "epoch": 3764} {"train_loss": -26.06610679626465, "global_step": 312459, "epoch": 3764} {"train_loss": -26.005294799804688, "global_step": 312460, "epoch": 3764} {"train_loss": -25.9180850982666, "global_step": 312461, "epoch": 3764} {"train_loss": -25.534006118774414, "global_step": 312462, "epoch": 3764} {"train_loss": -25.94990348815918, "global_step": 312463, "epoch": 3764} {"train_loss": -26.128955841064453, "global_step": 312464, "epoch": 3764} {"train_loss": -25.672155380249023, "global_step": 312465, "epoch": 3764} {"train_loss": -25.75593376159668, "global_step": 312466, "epoch": 3764} {"train_loss": -25.763019561767578, "global_step": 312467, "epoch": 3764} {"train_loss": -25.8204288482666, "global_step": 312468, "epoch": 3764} {"train_loss": -26.309213638305664, "global_step": 312469, "epoch": 3764} {"train_loss": -25.69677734375, "global_step": 312470, "epoch": 3764} {"train_loss": -25.719465255737305, "global_step": 312471, "epoch": 3764} {"train_loss": -25.630767822265625, "global_step": 312472, "epoch": 3764} {"train_loss": -25.35226821899414, "global_step": 312473, "epoch": 3764} {"train_loss": -25.399494171142578, "global_step": 312474, "epoch": 3764} {"train_loss": -25.267196655273438, "global_step": 312475, "epoch": 3764} {"train_loss": -25.09528923034668, "global_step": 312476, "epoch": 3764} {"train_loss": -25.081480026245117, "global_step": 312477, "epoch": 3764} {"train_loss": -25.567401885986328, "global_step": 312478, "epoch": 3764} {"train_loss": -26.007970809936523, "global_step": 312479, "epoch": 3764} {"train_loss": -25.704975128173828, "global_step": 312480, "epoch": 3764} {"train_loss": -25.14141082763672, "global_step": 312481, "epoch": 3764} {"train_loss": -25.8629207611084, "global_step": 312482, "epoch": 3764} {"train_loss": -25.71942138671875, "global_step": 312483, "epoch": 3764} {"train_loss": -25.483915328979492, "global_step": 312484, "epoch": 3764} {"train_loss": -25.861194610595703, "global_step": 312485, "epoch": 3764} {"train_loss": -25.448545455932617, "global_step": 312486, "epoch": 3764} {"train_loss": -25.506593704223633, "global_step": 312487, "epoch": 3764} {"train_loss": -25.593841552734375, "global_step": 312488, "epoch": 3764} {"train_loss": -25.33042335510254, "global_step": 312489, "epoch": 3764} {"train_loss": -25.64859390258789, "global_step": 312490, "epoch": 3764} {"train_loss": -25.65812110900879, "global_step": 312491, "epoch": 3764} {"train_loss": -25.591449737548828, "global_step": 312492, "epoch": 3764} {"train_loss": -25.345449447631836, "global_step": 312493, "epoch": 3764} {"train_loss": -25.408908315451747, "global_step": 312494, "epoch": 3764, "val_loss": 7309648.0} {"train_loss": -24.85272216796875, "global_step": 312495, "epoch": 3765} {"train_loss": -24.41305923461914, "global_step": 312496, "epoch": 3765} {"train_loss": -24.601791381835938, "global_step": 312497, "epoch": 3765} {"train_loss": -25.345548629760742, "global_step": 312498, "epoch": 3765} {"train_loss": -23.905786514282227, "global_step": 312499, "epoch": 3765} {"train_loss": -25.4205379486084, "global_step": 312500, "epoch": 3765} {"train_loss": -24.817493438720703, "global_step": 312501, "epoch": 3765} {"train_loss": -24.790395736694336, "global_step": 312502, "epoch": 3765} {"train_loss": -24.70015525817871, "global_step": 312503, "epoch": 3765} {"train_loss": -25.456344604492188, "global_step": 312504, "epoch": 3765} {"train_loss": -24.92681312561035, "global_step": 312505, "epoch": 3765} {"train_loss": -25.02034568786621, "global_step": 312506, "epoch": 3765} {"train_loss": -25.09076499938965, "global_step": 312507, "epoch": 3765} {"train_loss": -25.414995193481445, "global_step": 312508, "epoch": 3765} {"train_loss": -25.311954498291016, "global_step": 312509, "epoch": 3765} {"train_loss": -25.365081787109375, "global_step": 312510, "epoch": 3765} {"train_loss": -25.06355857849121, "global_step": 312511, "epoch": 3765} {"train_loss": -25.458724975585938, "global_step": 312512, "epoch": 3765} {"train_loss": -25.03572654724121, "global_step": 312513, "epoch": 3765} {"train_loss": -25.521604537963867, "global_step": 312514, "epoch": 3765} {"train_loss": -24.92637825012207, "global_step": 312515, "epoch": 3765} {"train_loss": -25.41037940979004, "global_step": 312516, "epoch": 3765} {"train_loss": -25.07512855529785, "global_step": 312517, "epoch": 3765} {"train_loss": -25.144235610961914, "global_step": 312518, "epoch": 3765} {"train_loss": -25.227340698242188, "global_step": 312519, "epoch": 3765} {"train_loss": -25.373533248901367, "global_step": 312520, "epoch": 3765} {"train_loss": -25.386722564697266, "global_step": 312521, "epoch": 3765} {"train_loss": -25.803333282470703, "global_step": 312522, "epoch": 3765} {"train_loss": -25.42628288269043, "global_step": 312523, "epoch": 3765} {"train_loss": -25.431730270385742, "global_step": 312524, "epoch": 3765} {"train_loss": -25.217832565307617, "global_step": 312525, "epoch": 3765} {"train_loss": -25.61195182800293, "global_step": 312526, "epoch": 3765} {"train_loss": -25.211441040039062, "global_step": 312527, "epoch": 3765} {"train_loss": -25.829999923706055, "global_step": 312528, "epoch": 3765} {"train_loss": -25.294095993041992, "global_step": 312529, "epoch": 3765} {"train_loss": -25.478853225708008, "global_step": 312530, "epoch": 3765} {"train_loss": -25.90631103515625, "global_step": 312531, "epoch": 3765} {"train_loss": -25.760242462158203, "global_step": 312532, "epoch": 3765} {"train_loss": -25.8249568939209, "global_step": 312533, "epoch": 3765} {"train_loss": -25.848730087280273, "global_step": 312534, "epoch": 3765} {"train_loss": -25.872909545898438, "global_step": 312535, "epoch": 3765} {"train_loss": -25.747655868530273, "global_step": 312536, "epoch": 3765} {"train_loss": -25.509855270385742, "global_step": 312537, "epoch": 3765} {"train_loss": -25.914127349853516, "global_step": 312538, "epoch": 3765} {"train_loss": -25.83827018737793, "global_step": 312539, "epoch": 3765} {"train_loss": -25.8591251373291, "global_step": 312540, "epoch": 3765} {"train_loss": -25.8156795501709, "global_step": 312541, "epoch": 3765} {"train_loss": -25.89511489868164, "global_step": 312542, "epoch": 3765} {"train_loss": -25.81780433654785, "global_step": 312543, "epoch": 3765} {"train_loss": -26.138385772705078, "global_step": 312544, "epoch": 3765} {"train_loss": -26.127471923828125, "global_step": 312545, "epoch": 3765} {"train_loss": -26.024494171142578, "global_step": 312546, "epoch": 3765} {"train_loss": -25.925397872924805, "global_step": 312547, "epoch": 3765} {"train_loss": -25.660276412963867, "global_step": 312548, "epoch": 3765} {"train_loss": -25.99529457092285, "global_step": 312549, "epoch": 3765} {"train_loss": -25.90284538269043, "global_step": 312550, "epoch": 3765} {"train_loss": -25.944732666015625, "global_step": 312551, "epoch": 3765} {"train_loss": -25.982391357421875, "global_step": 312552, "epoch": 3765} {"train_loss": -25.68275260925293, "global_step": 312553, "epoch": 3765} {"train_loss": -25.658432006835938, "global_step": 312554, "epoch": 3765} {"train_loss": -25.84012222290039, "global_step": 312555, "epoch": 3765} {"train_loss": -25.795576095581055, "global_step": 312556, "epoch": 3765} {"train_loss": -25.84735107421875, "global_step": 312557, "epoch": 3765} {"train_loss": -25.81231689453125, "global_step": 312558, "epoch": 3765} {"train_loss": -25.79652214050293, "global_step": 312559, "epoch": 3765} {"train_loss": -25.9278564453125, "global_step": 312560, "epoch": 3765} {"train_loss": -25.8005428314209, "global_step": 312561, "epoch": 3765} {"train_loss": -25.812204360961914, "global_step": 312562, "epoch": 3765} {"train_loss": -25.578441619873047, "global_step": 312563, "epoch": 3765} {"train_loss": -25.177749633789062, "global_step": 312564, "epoch": 3765} {"train_loss": -25.113065719604492, "global_step": 312565, "epoch": 3765} {"train_loss": -25.38149070739746, "global_step": 312566, "epoch": 3765} {"train_loss": -25.6386661529541, "global_step": 312567, "epoch": 3765} {"train_loss": -25.458669662475586, "global_step": 312568, "epoch": 3765} {"train_loss": -25.76462173461914, "global_step": 312569, "epoch": 3765} {"train_loss": -25.68019676208496, "global_step": 312570, "epoch": 3765} {"train_loss": -25.575119018554688, "global_step": 312571, "epoch": 3765} {"train_loss": -25.693866729736328, "global_step": 312572, "epoch": 3765} {"train_loss": -25.831079483032227, "global_step": 312573, "epoch": 3765} {"train_loss": -26.02423667907715, "global_step": 312574, "epoch": 3765} {"train_loss": -25.7147274017334, "global_step": 312575, "epoch": 3765} {"train_loss": -25.576255798339844, "global_step": 312576, "epoch": 3765} {"train_loss": -25.523438626025097, "global_step": 312577, "epoch": 3765, "val_loss": 7253583.0} {"train_loss": -25.206174850463867, "global_step": 312578, "epoch": 3766} {"train_loss": -24.54213523864746, "global_step": 312579, "epoch": 3766} {"train_loss": -24.77485466003418, "global_step": 312580, "epoch": 3766} {"train_loss": -25.50905990600586, "global_step": 312581, "epoch": 3766} {"train_loss": -24.99972915649414, "global_step": 312582, "epoch": 3766} {"train_loss": -25.212671279907227, "global_step": 312583, "epoch": 3766} {"train_loss": -25.363037109375, "global_step": 312584, "epoch": 3766} {"train_loss": -25.099634170532227, "global_step": 312585, "epoch": 3766} {"train_loss": -25.349210739135742, "global_step": 312586, "epoch": 3766} {"train_loss": -25.009679794311523, "global_step": 312587, "epoch": 3766} {"train_loss": -25.214365005493164, "global_step": 312588, "epoch": 3766} {"train_loss": -25.306468963623047, "global_step": 312589, "epoch": 3766} {"train_loss": -25.29556655883789, "global_step": 312590, "epoch": 3766} {"train_loss": -25.358327865600586, "global_step": 312591, "epoch": 3766} {"train_loss": -25.37448501586914, "global_step": 312592, "epoch": 3766} {"train_loss": -25.58518409729004, "global_step": 312593, "epoch": 3766} {"train_loss": -25.46064567565918, "global_step": 312594, "epoch": 3766} {"train_loss": -25.331689834594727, "global_step": 312595, "epoch": 3766} {"train_loss": -25.420202255249023, "global_step": 312596, "epoch": 3766} {"train_loss": -25.577001571655273, "global_step": 312597, "epoch": 3766} {"train_loss": -25.524816513061523, "global_step": 312598, "epoch": 3766} {"train_loss": -25.966466903686523, "global_step": 312599, "epoch": 3766} {"train_loss": -25.98044776916504, "global_step": 312600, "epoch": 3766} {"train_loss": -25.903600692749023, "global_step": 312601, "epoch": 3766} {"train_loss": -25.816762924194336, "global_step": 312602, "epoch": 3766} {"train_loss": -25.914785385131836, "global_step": 312603, "epoch": 3766} {"train_loss": -25.716550827026367, "global_step": 312604, "epoch": 3766} {"train_loss": -25.906705856323242, "global_step": 312605, "epoch": 3766} {"train_loss": -25.97389793395996, "global_step": 312606, "epoch": 3766} {"train_loss": -25.57334327697754, "global_step": 312607, "epoch": 3766} {"train_loss": -25.878992080688477, "global_step": 312608, "epoch": 3766} {"train_loss": -25.843103408813477, "global_step": 312609, "epoch": 3766} {"train_loss": -25.9335880279541, "global_step": 312610, "epoch": 3766} {"train_loss": -25.955114364624023, "global_step": 312611, "epoch": 3766} {"train_loss": -25.993106842041016, "global_step": 312612, "epoch": 3766} {"train_loss": -25.8409366607666, "global_step": 312613, "epoch": 3766} {"train_loss": -25.868366241455078, "global_step": 312614, "epoch": 3766} {"train_loss": -26.199838638305664, "global_step": 312615, "epoch": 3766} {"train_loss": -25.95088005065918, "global_step": 312616, "epoch": 3766} {"train_loss": -25.943342208862305, "global_step": 312617, "epoch": 3766} {"train_loss": -25.988605499267578, "global_step": 312618, "epoch": 3766} {"train_loss": -26.220800399780273, "global_step": 312619, "epoch": 3766} {"train_loss": -25.881855010986328, "global_step": 312620, "epoch": 3766} {"train_loss": -26.023197174072266, "global_step": 312621, "epoch": 3766} {"train_loss": -25.740863800048828, "global_step": 312622, "epoch": 3766} {"train_loss": -25.92975425720215, "global_step": 312623, "epoch": 3766} {"train_loss": -25.927209854125977, "global_step": 312624, "epoch": 3766} {"train_loss": -25.606678009033203, "global_step": 312625, "epoch": 3766} {"train_loss": -25.976566314697266, "global_step": 312626, "epoch": 3766} {"train_loss": -25.797521591186523, "global_step": 312627, "epoch": 3766} {"train_loss": -25.6683349609375, "global_step": 312628, "epoch": 3766} {"train_loss": -25.71367835998535, "global_step": 312629, "epoch": 3766} {"train_loss": -25.529821395874023, "global_step": 312630, "epoch": 3766} {"train_loss": -25.820465087890625, "global_step": 312631, "epoch": 3766} {"train_loss": -25.88360023498535, "global_step": 312632, "epoch": 3766} {"train_loss": -25.860544204711914, "global_step": 312633, "epoch": 3766} {"train_loss": -25.65813636779785, "global_step": 312634, "epoch": 3766} {"train_loss": -25.864883422851562, "global_step": 312635, "epoch": 3766} {"train_loss": -25.420400619506836, "global_step": 312636, "epoch": 3766} {"train_loss": -25.384511947631836, "global_step": 312637, "epoch": 3766} {"train_loss": -25.67913818359375, "global_step": 312638, "epoch": 3766} {"train_loss": -25.861465454101562, "global_step": 312639, "epoch": 3766} {"train_loss": -25.659704208374023, "global_step": 312640, "epoch": 3766} {"train_loss": -25.701068878173828, "global_step": 312641, "epoch": 3766} {"train_loss": -25.675628662109375, "global_step": 312642, "epoch": 3766} {"train_loss": -25.707366943359375, "global_step": 312643, "epoch": 3766} {"train_loss": -25.419544219970703, "global_step": 312644, "epoch": 3766} {"train_loss": -25.683088302612305, "global_step": 312645, "epoch": 3766} {"train_loss": -25.64459228515625, "global_step": 312646, "epoch": 3766} {"train_loss": -25.496137619018555, "global_step": 312647, "epoch": 3766} {"train_loss": -25.894433975219727, "global_step": 312648, "epoch": 3766} {"train_loss": -25.334901809692383, "global_step": 312649, "epoch": 3766} {"train_loss": -25.451189041137695, "global_step": 312650, "epoch": 3766} {"train_loss": -25.564729690551758, "global_step": 312651, "epoch": 3766} {"train_loss": -25.41754913330078, "global_step": 312652, "epoch": 3766} {"train_loss": -25.90506935119629, "global_step": 312653, "epoch": 3766} {"train_loss": -25.893293380737305, "global_step": 312654, "epoch": 3766} {"train_loss": -25.79032325744629, "global_step": 312655, "epoch": 3766} {"train_loss": -25.615209579467773, "global_step": 312656, "epoch": 3766} {"train_loss": -25.614614486694336, "global_step": 312657, "epoch": 3766} {"train_loss": -25.55878257751465, "global_step": 312658, "epoch": 3766} {"train_loss": -25.744043350219727, "global_step": 312659, "epoch": 3766} {"train_loss": -25.61833627539945, "global_step": 312660, "epoch": 3766, "val_loss": 7183741.0} {"train_loss": -25.230300903320312, "global_step": 312661, "epoch": 3767} {"train_loss": -25.73807144165039, "global_step": 312662, "epoch": 3767} {"train_loss": -25.288419723510742, "global_step": 312663, "epoch": 3767} {"train_loss": -26.008045196533203, "global_step": 312664, "epoch": 3767} {"train_loss": -25.3575382232666, "global_step": 312665, "epoch": 3767} {"train_loss": -25.704065322875977, "global_step": 312666, "epoch": 3767} {"train_loss": -25.57091522216797, "global_step": 312667, "epoch": 3767} {"train_loss": -25.814619064331055, "global_step": 312668, "epoch": 3767} {"train_loss": -25.684309005737305, "global_step": 312669, "epoch": 3767} {"train_loss": -25.704090118408203, "global_step": 312670, "epoch": 3767} {"train_loss": -25.987060546875, "global_step": 312671, "epoch": 3767} {"train_loss": -25.585296630859375, "global_step": 312672, "epoch": 3767} {"train_loss": -25.9482479095459, "global_step": 312673, "epoch": 3767} {"train_loss": -25.85346794128418, "global_step": 312674, "epoch": 3767} {"train_loss": -26.002838134765625, "global_step": 312675, "epoch": 3767} {"train_loss": -26.059186935424805, "global_step": 312676, "epoch": 3767} {"train_loss": -25.134267807006836, "global_step": 312677, "epoch": 3767} {"train_loss": -25.585947036743164, "global_step": 312678, "epoch": 3767} {"train_loss": -25.76678466796875, "global_step": 312679, "epoch": 3767} {"train_loss": -25.510295867919922, "global_step": 312680, "epoch": 3767} {"train_loss": -25.878381729125977, "global_step": 312681, "epoch": 3767} {"train_loss": -25.978775024414062, "global_step": 312682, "epoch": 3767} {"train_loss": -25.819135665893555, "global_step": 312683, "epoch": 3767} {"train_loss": -25.84295654296875, "global_step": 312684, "epoch": 3767} {"train_loss": -25.77625846862793, "global_step": 312685, "epoch": 3767} {"train_loss": -25.655466079711914, "global_step": 312686, "epoch": 3767} {"train_loss": -25.669126510620117, "global_step": 312687, "epoch": 3767} {"train_loss": -25.799671173095703, "global_step": 312688, "epoch": 3767} {"train_loss": -25.96174430847168, "global_step": 312689, "epoch": 3767} {"train_loss": -25.742420196533203, "global_step": 312690, "epoch": 3767} {"train_loss": -25.81585693359375, "global_step": 312691, "epoch": 3767} {"train_loss": -25.437585830688477, "global_step": 312692, "epoch": 3767} {"train_loss": -25.70338249206543, "global_step": 312693, "epoch": 3767} {"train_loss": -25.735090255737305, "global_step": 312694, "epoch": 3767} {"train_loss": -25.825952529907227, "global_step": 312695, "epoch": 3767} {"train_loss": -25.783203125, "global_step": 312696, "epoch": 3767} {"train_loss": -25.8031005859375, "global_step": 312697, "epoch": 3767} {"train_loss": -25.747379302978516, "global_step": 312698, "epoch": 3767} {"train_loss": -25.892805099487305, "global_step": 312699, "epoch": 3767} {"train_loss": -25.965442657470703, "global_step": 312700, "epoch": 3767} {"train_loss": -25.564268112182617, "global_step": 312701, "epoch": 3767} {"train_loss": -25.694107055664062, "global_step": 312702, "epoch": 3767} {"train_loss": -26.025781631469727, "global_step": 312703, "epoch": 3767} {"train_loss": -25.7808837890625, "global_step": 312704, "epoch": 3767} {"train_loss": -25.7667293548584, "global_step": 312705, "epoch": 3767} {"train_loss": -25.852380752563477, "global_step": 312706, "epoch": 3767} {"train_loss": -25.805389404296875, "global_step": 312707, "epoch": 3767} {"train_loss": -25.716522216796875, "global_step": 312708, "epoch": 3767} {"train_loss": -26.031736373901367, "global_step": 312709, "epoch": 3767} {"train_loss": -25.370901107788086, "global_step": 312710, "epoch": 3767} {"train_loss": -25.76519775390625, "global_step": 312711, "epoch": 3767} {"train_loss": -25.870996475219727, "global_step": 312712, "epoch": 3767} {"train_loss": -25.388978958129883, "global_step": 312713, "epoch": 3767} {"train_loss": -25.583425521850586, "global_step": 312714, "epoch": 3767} {"train_loss": -25.989959716796875, "global_step": 312715, "epoch": 3767} {"train_loss": -25.564559936523438, "global_step": 312716, "epoch": 3767} {"train_loss": -25.412656784057617, "global_step": 312717, "epoch": 3767} {"train_loss": -25.902179718017578, "global_step": 312718, "epoch": 3767} {"train_loss": -25.89910316467285, "global_step": 312719, "epoch": 3767} {"train_loss": -25.618558883666992, "global_step": 312720, "epoch": 3767} {"train_loss": -25.793115615844727, "global_step": 312721, "epoch": 3767} {"train_loss": -25.77534294128418, "global_step": 312722, "epoch": 3767} {"train_loss": -25.86916160583496, "global_step": 312723, "epoch": 3767} {"train_loss": -26.016489028930664, "global_step": 312724, "epoch": 3767} {"train_loss": -25.662525177001953, "global_step": 312725, "epoch": 3767} {"train_loss": -25.387226104736328, "global_step": 312726, "epoch": 3767} {"train_loss": -25.77131462097168, "global_step": 312727, "epoch": 3767} {"train_loss": -25.504444122314453, "global_step": 312728, "epoch": 3767} {"train_loss": -25.888120651245117, "global_step": 312729, "epoch": 3767} {"train_loss": -25.417545318603516, "global_step": 312730, "epoch": 3767} {"train_loss": -25.34504508972168, "global_step": 312731, "epoch": 3767} {"train_loss": -25.60684585571289, "global_step": 312732, "epoch": 3767} {"train_loss": -25.610671997070312, "global_step": 312733, "epoch": 3767} {"train_loss": -25.648239135742188, "global_step": 312734, "epoch": 3767} {"train_loss": -25.686080932617188, "global_step": 312735, "epoch": 3767} {"train_loss": -25.3853702545166, "global_step": 312736, "epoch": 3767} {"train_loss": -26.02680015563965, "global_step": 312737, "epoch": 3767} {"train_loss": -25.946685791015625, "global_step": 312738, "epoch": 3767} {"train_loss": -25.29947280883789, "global_step": 312739, "epoch": 3767} {"train_loss": -25.689558029174805, "global_step": 312740, "epoch": 3767} {"train_loss": -25.37678337097168, "global_step": 312741, "epoch": 3767} {"train_loss": -25.511980056762695, "global_step": 312742, "epoch": 3767} {"train_loss": -25.690473280757306, "global_step": 312743, "epoch": 3767, "val_loss": 7164575.0} {"train_loss": -25.607227325439453, "global_step": 312744, "epoch": 3768} {"train_loss": -25.032087326049805, "global_step": 312745, "epoch": 3768} {"train_loss": -25.222776412963867, "global_step": 312746, "epoch": 3768} {"train_loss": -25.275527954101562, "global_step": 312747, "epoch": 3768} {"train_loss": -25.063289642333984, "global_step": 312748, "epoch": 3768} {"train_loss": -25.322057723999023, "global_step": 312749, "epoch": 3768} {"train_loss": -25.11545753479004, "global_step": 312750, "epoch": 3768} {"train_loss": -25.556997299194336, "global_step": 312751, "epoch": 3768} {"train_loss": -25.18894386291504, "global_step": 312752, "epoch": 3768} {"train_loss": -25.383268356323242, "global_step": 312753, "epoch": 3768} {"train_loss": -25.675504684448242, "global_step": 312754, "epoch": 3768} {"train_loss": -26.136966705322266, "global_step": 312755, "epoch": 3768} {"train_loss": -25.458541870117188, "global_step": 312756, "epoch": 3768} {"train_loss": -25.428546905517578, "global_step": 312757, "epoch": 3768} {"train_loss": -25.47133445739746, "global_step": 312758, "epoch": 3768} {"train_loss": -25.734268188476562, "global_step": 312759, "epoch": 3768} {"train_loss": -25.643905639648438, "global_step": 312760, "epoch": 3768} {"train_loss": -25.772174835205078, "global_step": 312761, "epoch": 3768} {"train_loss": -25.4516544342041, "global_step": 312762, "epoch": 3768} {"train_loss": -25.54776954650879, "global_step": 312763, "epoch": 3768} {"train_loss": -25.96136474609375, "global_step": 312764, "epoch": 3768} {"train_loss": -26.179046630859375, "global_step": 312765, "epoch": 3768} {"train_loss": -25.563072204589844, "global_step": 312766, "epoch": 3768} {"train_loss": -25.834577560424805, "global_step": 312767, "epoch": 3768} {"train_loss": -25.548568725585938, "global_step": 312768, "epoch": 3768} {"train_loss": -26.032140731811523, "global_step": 312769, "epoch": 3768} {"train_loss": -25.573863983154297, "global_step": 312770, "epoch": 3768} {"train_loss": -25.521963119506836, "global_step": 312771, "epoch": 3768} {"train_loss": -25.672504425048828, "global_step": 312772, "epoch": 3768} {"train_loss": -26.090742111206055, "global_step": 312773, "epoch": 3768} {"train_loss": -25.556516647338867, "global_step": 312774, "epoch": 3768} {"train_loss": -26.01283073425293, "global_step": 312775, "epoch": 3768} {"train_loss": -25.640857696533203, "global_step": 312776, "epoch": 3768} {"train_loss": -25.748367309570312, "global_step": 312777, "epoch": 3768} {"train_loss": -25.646987915039062, "global_step": 312778, "epoch": 3768} {"train_loss": -25.663869857788086, "global_step": 312779, "epoch": 3768} {"train_loss": -25.835180282592773, "global_step": 312780, "epoch": 3768} {"train_loss": -25.505704879760742, "global_step": 312781, "epoch": 3768} {"train_loss": -25.909189224243164, "global_step": 312782, "epoch": 3768} {"train_loss": -25.68653678894043, "global_step": 312783, "epoch": 3768} {"train_loss": -25.39705467224121, "global_step": 312784, "epoch": 3768} {"train_loss": -25.76373291015625, "global_step": 312785, "epoch": 3768} {"train_loss": -25.984479904174805, "global_step": 312786, "epoch": 3768} {"train_loss": -25.639814376831055, "global_step": 312787, "epoch": 3768} {"train_loss": -25.857275009155273, "global_step": 312788, "epoch": 3768} {"train_loss": -25.59792709350586, "global_step": 312789, "epoch": 3768} {"train_loss": -25.784229278564453, "global_step": 312790, "epoch": 3768} {"train_loss": -25.9138126373291, "global_step": 312791, "epoch": 3768} {"train_loss": -25.574512481689453, "global_step": 312792, "epoch": 3768} {"train_loss": -25.71497917175293, "global_step": 312793, "epoch": 3768} {"train_loss": -25.511377334594727, "global_step": 312794, "epoch": 3768} {"train_loss": -25.666717529296875, "global_step": 312795, "epoch": 3768} {"train_loss": -25.952850341796875, "global_step": 312796, "epoch": 3768} {"train_loss": -26.187210083007812, "global_step": 312797, "epoch": 3768} {"train_loss": -25.60691261291504, "global_step": 312798, "epoch": 3768} {"train_loss": -25.912429809570312, "global_step": 312799, "epoch": 3768} {"train_loss": -25.943159103393555, "global_step": 312800, "epoch": 3768} {"train_loss": -25.609296798706055, "global_step": 312801, "epoch": 3768} {"train_loss": -25.919666290283203, "global_step": 312802, "epoch": 3768} {"train_loss": -25.728870391845703, "global_step": 312803, "epoch": 3768} {"train_loss": -25.97157096862793, "global_step": 312804, "epoch": 3768} {"train_loss": -26.09944725036621, "global_step": 312805, "epoch": 3768} {"train_loss": -26.078359603881836, "global_step": 312806, "epoch": 3768} {"train_loss": -25.91189956665039, "global_step": 312807, "epoch": 3768} {"train_loss": -26.167713165283203, "global_step": 312808, "epoch": 3768} {"train_loss": -25.7974796295166, "global_step": 312809, "epoch": 3768} {"train_loss": -25.82935905456543, "global_step": 312810, "epoch": 3768} {"train_loss": -25.844928741455078, "global_step": 312811, "epoch": 3768} {"train_loss": -26.141401290893555, "global_step": 312812, "epoch": 3768} {"train_loss": -25.6633243560791, "global_step": 312813, "epoch": 3768} {"train_loss": -25.63995933532715, "global_step": 312814, "epoch": 3768} {"train_loss": -25.709674835205078, "global_step": 312815, "epoch": 3768} {"train_loss": -25.673614501953125, "global_step": 312816, "epoch": 3768} {"train_loss": -25.67689323425293, "global_step": 312817, "epoch": 3768} {"train_loss": -25.621068954467773, "global_step": 312818, "epoch": 3768} {"train_loss": -25.782245635986328, "global_step": 312819, "epoch": 3768} {"train_loss": -26.2341251373291, "global_step": 312820, "epoch": 3768} {"train_loss": -25.599279403686523, "global_step": 312821, "epoch": 3768} {"train_loss": -25.97565269470215, "global_step": 312822, "epoch": 3768} {"train_loss": -25.64772605895996, "global_step": 312823, "epoch": 3768} {"train_loss": -26.03690528869629, "global_step": 312824, "epoch": 3768} {"train_loss": -25.674240112304688, "global_step": 312825, "epoch": 3768} {"train_loss": -25.709959972335632, "global_step": 312826, "epoch": 3768, "val_loss": 7324810.0} {"train_loss": -25.087350845336914, "global_step": 312827, "epoch": 3769} {"train_loss": -24.027225494384766, "global_step": 312828, "epoch": 3769} {"train_loss": -24.440420150756836, "global_step": 312829, "epoch": 3769} {"train_loss": -24.73668670654297, "global_step": 312830, "epoch": 3769} {"train_loss": -25.247724533081055, "global_step": 312831, "epoch": 3769} {"train_loss": -24.86469841003418, "global_step": 312832, "epoch": 3769} {"train_loss": -24.929357528686523, "global_step": 312833, "epoch": 3769} {"train_loss": -25.39141273498535, "global_step": 312834, "epoch": 3769} {"train_loss": -25.524261474609375, "global_step": 312835, "epoch": 3769} {"train_loss": -25.309167861938477, "global_step": 312836, "epoch": 3769} {"train_loss": -25.009361267089844, "global_step": 312837, "epoch": 3769} {"train_loss": -25.216846466064453, "global_step": 312838, "epoch": 3769} {"train_loss": -25.446510314941406, "global_step": 312839, "epoch": 3769} {"train_loss": -25.217273712158203, "global_step": 312840, "epoch": 3769} {"train_loss": -25.155790328979492, "global_step": 312841, "epoch": 3769} {"train_loss": -25.145906448364258, "global_step": 312842, "epoch": 3769} {"train_loss": -25.414697647094727, "global_step": 312843, "epoch": 3769} {"train_loss": -25.0849609375, "global_step": 312844, "epoch": 3769} {"train_loss": -25.450681686401367, "global_step": 312845, "epoch": 3769} {"train_loss": -25.484146118164062, "global_step": 312846, "epoch": 3769} {"train_loss": -25.244468688964844, "global_step": 312847, "epoch": 3769} {"train_loss": -25.370227813720703, "global_step": 312848, "epoch": 3769} {"train_loss": -25.574819564819336, "global_step": 312849, "epoch": 3769} {"train_loss": -25.62640380859375, "global_step": 312850, "epoch": 3769} {"train_loss": -25.669696807861328, "global_step": 312851, "epoch": 3769} {"train_loss": -25.684528350830078, "global_step": 312852, "epoch": 3769} {"train_loss": -25.493255615234375, "global_step": 312853, "epoch": 3769} {"train_loss": -25.890844345092773, "global_step": 312854, "epoch": 3769} {"train_loss": -26.2718563079834, "global_step": 312855, "epoch": 3769} {"train_loss": -25.801969528198242, "global_step": 312856, "epoch": 3769} {"train_loss": -25.729528427124023, "global_step": 312857, "epoch": 3769} {"train_loss": -25.454355239868164, "global_step": 312858, "epoch": 3769} {"train_loss": -25.84295654296875, "global_step": 312859, "epoch": 3769} {"train_loss": -26.119516372680664, "global_step": 312860, "epoch": 3769} {"train_loss": -25.985157012939453, "global_step": 312861, "epoch": 3769} {"train_loss": -25.7392635345459, "global_step": 312862, "epoch": 3769} {"train_loss": -25.774768829345703, "global_step": 312863, "epoch": 3769} {"train_loss": -25.303991317749023, "global_step": 312864, "epoch": 3769} {"train_loss": -25.84429359436035, "global_step": 312865, "epoch": 3769} {"train_loss": -25.80497169494629, "global_step": 312866, "epoch": 3769} {"train_loss": -26.186132431030273, "global_step": 312867, "epoch": 3769} {"train_loss": -25.83221435546875, "global_step": 312868, "epoch": 3769} {"train_loss": -25.84473991394043, "global_step": 312869, "epoch": 3769} {"train_loss": -25.516218185424805, "global_step": 312870, "epoch": 3769} {"train_loss": -25.796710968017578, "global_step": 312871, "epoch": 3769} {"train_loss": -26.223026275634766, "global_step": 312872, "epoch": 3769} {"train_loss": -25.832584381103516, "global_step": 312873, "epoch": 3769} {"train_loss": -25.878814697265625, "global_step": 312874, "epoch": 3769} {"train_loss": -25.806049346923828, "global_step": 312875, "epoch": 3769} {"train_loss": -25.889474868774414, "global_step": 312876, "epoch": 3769} {"train_loss": -25.689191818237305, "global_step": 312877, "epoch": 3769} {"train_loss": -25.695341110229492, "global_step": 312878, "epoch": 3769} {"train_loss": -25.907958984375, "global_step": 312879, "epoch": 3769} {"train_loss": -25.507238388061523, "global_step": 312880, "epoch": 3769} {"train_loss": -25.78497886657715, "global_step": 312881, "epoch": 3769} {"train_loss": -25.68818473815918, "global_step": 312882, "epoch": 3769} {"train_loss": -25.587934494018555, "global_step": 312883, "epoch": 3769} {"train_loss": -25.581838607788086, "global_step": 312884, "epoch": 3769} {"train_loss": -26.2796573638916, "global_step": 312885, "epoch": 3769} {"train_loss": -25.445226669311523, "global_step": 312886, "epoch": 3769} {"train_loss": -25.81341552734375, "global_step": 312887, "epoch": 3769} {"train_loss": -25.918310165405273, "global_step": 312888, "epoch": 3769} {"train_loss": -25.55885887145996, "global_step": 312889, "epoch": 3769} {"train_loss": -25.653778076171875, "global_step": 312890, "epoch": 3769} {"train_loss": -25.569339752197266, "global_step": 312891, "epoch": 3769} {"train_loss": -26.05194664001465, "global_step": 312892, "epoch": 3769} {"train_loss": -25.899023056030273, "global_step": 312893, "epoch": 3769} {"train_loss": -26.172138214111328, "global_step": 312894, "epoch": 3769} {"train_loss": -26.106698989868164, "global_step": 312895, "epoch": 3769} {"train_loss": -25.657352447509766, "global_step": 312896, "epoch": 3769} {"train_loss": -25.585031509399414, "global_step": 312897, "epoch": 3769} {"train_loss": -26.0764102935791, "global_step": 312898, "epoch": 3769} {"train_loss": -25.8960018157959, "global_step": 312899, "epoch": 3769} {"train_loss": -25.808805465698242, "global_step": 312900, "epoch": 3769} {"train_loss": -26.142642974853516, "global_step": 312901, "epoch": 3769} {"train_loss": -26.03668212890625, "global_step": 312902, "epoch": 3769} {"train_loss": -25.911725997924805, "global_step": 312903, "epoch": 3769} {"train_loss": -25.960540771484375, "global_step": 312904, "epoch": 3769} {"train_loss": -25.9351863861084, "global_step": 312905, "epoch": 3769} {"train_loss": -26.174177169799805, "global_step": 312906, "epoch": 3769} {"train_loss": -25.782663345336914, "global_step": 312907, "epoch": 3769} {"train_loss": -26.196752548217773, "global_step": 312908, "epoch": 3769} {"train_loss": -25.620212738772473, "global_step": 312909, "epoch": 3769, "val_loss": 7241068.5} {"train_loss": -24.94709587097168, "global_step": 312910, "epoch": 3770} {"train_loss": -24.795194625854492, "global_step": 312911, "epoch": 3770} {"train_loss": -24.784910202026367, "global_step": 312912, "epoch": 3770} {"train_loss": -25.60601234436035, "global_step": 312913, "epoch": 3770} {"train_loss": -25.227313995361328, "global_step": 312914, "epoch": 3770} {"train_loss": -24.615177154541016, "global_step": 312915, "epoch": 3770} {"train_loss": -25.88091468811035, "global_step": 312916, "epoch": 3770} {"train_loss": -25.318178176879883, "global_step": 312917, "epoch": 3770} {"train_loss": -25.26899528503418, "global_step": 312918, "epoch": 3770} {"train_loss": -25.44899559020996, "global_step": 312919, "epoch": 3770} {"train_loss": -25.47504997253418, "global_step": 312920, "epoch": 3770} {"train_loss": -25.315839767456055, "global_step": 312921, "epoch": 3770} {"train_loss": -25.75994300842285, "global_step": 312922, "epoch": 3770} {"train_loss": -25.390125274658203, "global_step": 312923, "epoch": 3770} {"train_loss": -25.172788619995117, "global_step": 312924, "epoch": 3770} {"train_loss": -25.2911376953125, "global_step": 312925, "epoch": 3770} {"train_loss": -25.823505401611328, "global_step": 312926, "epoch": 3770} {"train_loss": -25.793912887573242, "global_step": 312927, "epoch": 3770} {"train_loss": -25.734663009643555, "global_step": 312928, "epoch": 3770} {"train_loss": -25.595436096191406, "global_step": 312929, "epoch": 3770} {"train_loss": -25.7037410736084, "global_step": 312930, "epoch": 3770} {"train_loss": -25.722497940063477, "global_step": 312931, "epoch": 3770} {"train_loss": -25.381065368652344, "global_step": 312932, "epoch": 3770} {"train_loss": -25.9941463470459, "global_step": 312933, "epoch": 3770} {"train_loss": -25.48169708251953, "global_step": 312934, "epoch": 3770} {"train_loss": -25.62837028503418, "global_step": 312935, "epoch": 3770} {"train_loss": -25.60407829284668, "global_step": 312936, "epoch": 3770} {"train_loss": -25.7653865814209, "global_step": 312937, "epoch": 3770} {"train_loss": -25.796329498291016, "global_step": 312938, "epoch": 3770} {"train_loss": -25.87293815612793, "global_step": 312939, "epoch": 3770} {"train_loss": -25.8813533782959, "global_step": 312940, "epoch": 3770} {"train_loss": -25.689329147338867, "global_step": 312941, "epoch": 3770} {"train_loss": -25.537120819091797, "global_step": 312942, "epoch": 3770} {"train_loss": -25.561864852905273, "global_step": 312943, "epoch": 3770} {"train_loss": -25.61383056640625, "global_step": 312944, "epoch": 3770} {"train_loss": -26.01824951171875, "global_step": 312945, "epoch": 3770} {"train_loss": -25.801267623901367, "global_step": 312946, "epoch": 3770} {"train_loss": -25.441720962524414, "global_step": 312947, "epoch": 3770} {"train_loss": -25.981855392456055, "global_step": 312948, "epoch": 3770} {"train_loss": -26.01557731628418, "global_step": 312949, "epoch": 3770} {"train_loss": -25.55295753479004, "global_step": 312950, "epoch": 3770} {"train_loss": -25.588865280151367, "global_step": 312951, "epoch": 3770} {"train_loss": -25.763092041015625, "global_step": 312952, "epoch": 3770} {"train_loss": -26.338123321533203, "global_step": 312953, "epoch": 3770} {"train_loss": -25.95542335510254, "global_step": 312954, "epoch": 3770} {"train_loss": -25.472745895385742, "global_step": 312955, "epoch": 3770} {"train_loss": -25.3315486907959, "global_step": 312956, "epoch": 3770} {"train_loss": -25.426212310791016, "global_step": 312957, "epoch": 3770} {"train_loss": -24.640853881835938, "global_step": 312958, "epoch": 3770} {"train_loss": -25.106412887573242, "global_step": 312959, "epoch": 3770} {"train_loss": -25.79303550720215, "global_step": 312960, "epoch": 3770} {"train_loss": -26.113208770751953, "global_step": 312961, "epoch": 3770} {"train_loss": -25.473548889160156, "global_step": 312962, "epoch": 3770} {"train_loss": -26.175251007080078, "global_step": 312963, "epoch": 3770} {"train_loss": -25.649831771850586, "global_step": 312964, "epoch": 3770} {"train_loss": -25.8951358795166, "global_step": 312965, "epoch": 3770} {"train_loss": -26.176671981811523, "global_step": 312966, "epoch": 3770} {"train_loss": -26.029821395874023, "global_step": 312967, "epoch": 3770} {"train_loss": -25.751087188720703, "global_step": 312968, "epoch": 3770} {"train_loss": -25.40472984313965, "global_step": 312969, "epoch": 3770} {"train_loss": -25.76297950744629, "global_step": 312970, "epoch": 3770} {"train_loss": -25.71674156188965, "global_step": 312971, "epoch": 3770} {"train_loss": -25.929244995117188, "global_step": 312972, "epoch": 3770} {"train_loss": -25.713037490844727, "global_step": 312973, "epoch": 3770} {"train_loss": -26.231855392456055, "global_step": 312974, "epoch": 3770} {"train_loss": -25.839466094970703, "global_step": 312975, "epoch": 3770} {"train_loss": -25.79073143005371, "global_step": 312976, "epoch": 3770} {"train_loss": -25.881153106689453, "global_step": 312977, "epoch": 3770} {"train_loss": -25.645715713500977, "global_step": 312978, "epoch": 3770} {"train_loss": -25.676488876342773, "global_step": 312979, "epoch": 3770} {"train_loss": -26.099027633666992, "global_step": 312980, "epoch": 3770} {"train_loss": -25.790571212768555, "global_step": 312981, "epoch": 3770} {"train_loss": -26.072614669799805, "global_step": 312982, "epoch": 3770} {"train_loss": -26.007980346679688, "global_step": 312983, "epoch": 3770} {"train_loss": -25.681365966796875, "global_step": 312984, "epoch": 3770} {"train_loss": -25.993783950805664, "global_step": 312985, "epoch": 3770} {"train_loss": -25.74016761779785, "global_step": 312986, "epoch": 3770} {"train_loss": -26.226728439331055, "global_step": 312987, "epoch": 3770} {"train_loss": -25.64210319519043, "global_step": 312988, "epoch": 3770} {"train_loss": -26.034626007080078, "global_step": 312989, "epoch": 3770} {"train_loss": -26.10296058654785, "global_step": 312990, "epoch": 3770} {"train_loss": -25.90907096862793, "global_step": 312991, "epoch": 3770} {"train_loss": -25.65720128438559, "global_step": 312992, "epoch": 3770, "val_loss": 7264909.5} {"train_loss": -25.377593994140625, "global_step": 312993, "epoch": 3771} {"train_loss": -25.611547470092773, "global_step": 312994, "epoch": 3771} {"train_loss": -25.04981803894043, "global_step": 312995, "epoch": 3771} {"train_loss": -25.321781158447266, "global_step": 312996, "epoch": 3771} {"train_loss": -25.286184310913086, "global_step": 312997, "epoch": 3771} {"train_loss": -25.386133193969727, "global_step": 312998, "epoch": 3771} {"train_loss": -25.27419090270996, "global_step": 312999, "epoch": 3771} {"train_loss": -25.771753311157227, "global_step": 313000, "epoch": 3771} {"train_loss": -24.139265060424805, "global_step": 313001, "epoch": 3771} {"train_loss": -25.528730392456055, "global_step": 313002, "epoch": 3771} {"train_loss": -25.376609802246094, "global_step": 313003, "epoch": 3771} {"train_loss": -25.5156307220459, "global_step": 313004, "epoch": 3771} {"train_loss": -25.586578369140625, "global_step": 313005, "epoch": 3771} {"train_loss": -25.60023307800293, "global_step": 313006, "epoch": 3771} {"train_loss": -25.14849853515625, "global_step": 313007, "epoch": 3771} {"train_loss": -25.2701358795166, "global_step": 313008, "epoch": 3771} {"train_loss": -25.434961318969727, "global_step": 313009, "epoch": 3771} {"train_loss": -25.35405921936035, "global_step": 313010, "epoch": 3771} {"train_loss": -25.379793167114258, "global_step": 313011, "epoch": 3771} {"train_loss": -25.47265625, "global_step": 313012, "epoch": 3771} {"train_loss": -25.36733627319336, "global_step": 313013, "epoch": 3771} {"train_loss": -25.878713607788086, "global_step": 313014, "epoch": 3771} {"train_loss": -25.710845947265625, "global_step": 313015, "epoch": 3771} {"train_loss": -25.280553817749023, "global_step": 313016, "epoch": 3771} {"train_loss": -25.711029052734375, "global_step": 313017, "epoch": 3771} {"train_loss": -25.45576286315918, "global_step": 313018, "epoch": 3771} {"train_loss": -25.6912899017334, "global_step": 313019, "epoch": 3771} {"train_loss": -25.8042049407959, "global_step": 313020, "epoch": 3771} {"train_loss": -25.593481063842773, "global_step": 313021, "epoch": 3771} {"train_loss": -25.438589096069336, "global_step": 313022, "epoch": 3771} {"train_loss": -25.597326278686523, "global_step": 313023, "epoch": 3771} {"train_loss": -25.741559982299805, "global_step": 313024, "epoch": 3771} {"train_loss": -25.821760177612305, "global_step": 313025, "epoch": 3771} {"train_loss": -25.719009399414062, "global_step": 313026, "epoch": 3771} {"train_loss": -25.907703399658203, "global_step": 313027, "epoch": 3771} {"train_loss": -25.947141647338867, "global_step": 313028, "epoch": 3771} {"train_loss": -25.941608428955078, "global_step": 313029, "epoch": 3771} {"train_loss": -26.050939559936523, "global_step": 313030, "epoch": 3771} {"train_loss": -26.420089721679688, "global_step": 313031, "epoch": 3771} {"train_loss": -25.758544921875, "global_step": 313032, "epoch": 3771} {"train_loss": -25.859943389892578, "global_step": 313033, "epoch": 3771} {"train_loss": -26.053348541259766, "global_step": 313034, "epoch": 3771} {"train_loss": -26.1602725982666, "global_step": 313035, "epoch": 3771} {"train_loss": -25.924718856811523, "global_step": 313036, "epoch": 3771} {"train_loss": -25.214290618896484, "global_step": 313037, "epoch": 3771} {"train_loss": -26.0030574798584, "global_step": 313038, "epoch": 3771} {"train_loss": -26.092182159423828, "global_step": 313039, "epoch": 3771} {"train_loss": -25.93951416015625, "global_step": 313040, "epoch": 3771} {"train_loss": -26.061664581298828, "global_step": 313041, "epoch": 3771} {"train_loss": -26.1281681060791, "global_step": 313042, "epoch": 3771} {"train_loss": -26.004749298095703, "global_step": 313043, "epoch": 3771} {"train_loss": -26.087743759155273, "global_step": 313044, "epoch": 3771} {"train_loss": -25.89693260192871, "global_step": 313045, "epoch": 3771} {"train_loss": -25.8890380859375, "global_step": 313046, "epoch": 3771} {"train_loss": -26.081323623657227, "global_step": 313047, "epoch": 3771} {"train_loss": -26.157941818237305, "global_step": 313048, "epoch": 3771} {"train_loss": -26.154062271118164, "global_step": 313049, "epoch": 3771} {"train_loss": -25.87204933166504, "global_step": 313050, "epoch": 3771} {"train_loss": -25.96942710876465, "global_step": 313051, "epoch": 3771} {"train_loss": -25.80445671081543, "global_step": 313052, "epoch": 3771} {"train_loss": -25.587514877319336, "global_step": 313053, "epoch": 3771} {"train_loss": -26.221250534057617, "global_step": 313054, "epoch": 3771} {"train_loss": -26.22291374206543, "global_step": 313055, "epoch": 3771} {"train_loss": -26.03266716003418, "global_step": 313056, "epoch": 3771} {"train_loss": -25.795379638671875, "global_step": 313057, "epoch": 3771} {"train_loss": -25.905460357666016, "global_step": 313058, "epoch": 3771} {"train_loss": -25.95545768737793, "global_step": 313059, "epoch": 3771} {"train_loss": -26.12737464904785, "global_step": 313060, "epoch": 3771} {"train_loss": -25.765817642211914, "global_step": 313061, "epoch": 3771} {"train_loss": -25.7186222076416, "global_step": 313062, "epoch": 3771} {"train_loss": -25.700143814086914, "global_step": 313063, "epoch": 3771} {"train_loss": -25.853042602539062, "global_step": 313064, "epoch": 3771} {"train_loss": -25.77711296081543, "global_step": 313065, "epoch": 3771} {"train_loss": -25.328603744506836, "global_step": 313066, "epoch": 3771} {"train_loss": -25.490982055664062, "global_step": 313067, "epoch": 3771} {"train_loss": -25.344322204589844, "global_step": 313068, "epoch": 3771} {"train_loss": -25.858203887939453, "global_step": 313069, "epoch": 3771} {"train_loss": -25.439470291137695, "global_step": 313070, "epoch": 3771} {"train_loss": -25.149188995361328, "global_step": 313071, "epoch": 3771} {"train_loss": -25.107145309448242, "global_step": 313072, "epoch": 3771} {"train_loss": -26.178424835205078, "global_step": 313073, "epoch": 3771} {"train_loss": -25.413911819458008, "global_step": 313074, "epoch": 3771} {"train_loss": -25.689697863107703, "global_step": 313075, "epoch": 3771, "val_loss": 7268130.0} {"train_loss": -24.750574111938477, "global_step": 313076, "epoch": 3772} {"train_loss": -25.07566261291504, "global_step": 313077, "epoch": 3772} {"train_loss": -24.561697006225586, "global_step": 313078, "epoch": 3772} {"train_loss": -23.82048225402832, "global_step": 313079, "epoch": 3772} {"train_loss": -25.274202346801758, "global_step": 313080, "epoch": 3772} {"train_loss": -25.07466697692871, "global_step": 313081, "epoch": 3772} {"train_loss": -25.060516357421875, "global_step": 313082, "epoch": 3772} {"train_loss": -24.794095993041992, "global_step": 313083, "epoch": 3772} {"train_loss": -24.86846351623535, "global_step": 313084, "epoch": 3772} {"train_loss": -25.308277130126953, "global_step": 313085, "epoch": 3772} {"train_loss": -25.458723068237305, "global_step": 313086, "epoch": 3772} {"train_loss": -25.086898803710938, "global_step": 313087, "epoch": 3772} {"train_loss": -24.629323959350586, "global_step": 313088, "epoch": 3772} {"train_loss": -25.22344970703125, "global_step": 313089, "epoch": 3772} {"train_loss": -25.20146942138672, "global_step": 313090, "epoch": 3772} {"train_loss": -25.44536781311035, "global_step": 313091, "epoch": 3772} {"train_loss": -25.195968627929688, "global_step": 313092, "epoch": 3772} {"train_loss": -25.523035049438477, "global_step": 313093, "epoch": 3772} {"train_loss": -25.449554443359375, "global_step": 313094, "epoch": 3772} {"train_loss": -25.444992065429688, "global_step": 313095, "epoch": 3772} {"train_loss": -25.564817428588867, "global_step": 313096, "epoch": 3772} {"train_loss": -25.055959701538086, "global_step": 313097, "epoch": 3772} {"train_loss": -25.440723419189453, "global_step": 313098, "epoch": 3772} {"train_loss": -25.55682945251465, "global_step": 313099, "epoch": 3772} {"train_loss": -25.677661895751953, "global_step": 313100, "epoch": 3772} {"train_loss": -25.490209579467773, "global_step": 313101, "epoch": 3772} {"train_loss": -25.77555274963379, "global_step": 313102, "epoch": 3772} {"train_loss": -25.555130004882812, "global_step": 313103, "epoch": 3772} {"train_loss": -25.7498722076416, "global_step": 313104, "epoch": 3772} {"train_loss": -25.708703994750977, "global_step": 313105, "epoch": 3772} {"train_loss": -25.629873275756836, "global_step": 313106, "epoch": 3772} {"train_loss": -25.8675594329834, "global_step": 313107, "epoch": 3772} {"train_loss": -25.719680786132812, "global_step": 313108, "epoch": 3772} {"train_loss": -25.887903213500977, "global_step": 313109, "epoch": 3772} {"train_loss": -25.522958755493164, "global_step": 313110, "epoch": 3772} {"train_loss": -26.088165283203125, "global_step": 313111, "epoch": 3772} {"train_loss": -25.5535945892334, "global_step": 313112, "epoch": 3772} {"train_loss": -25.665555953979492, "global_step": 313113, "epoch": 3772} {"train_loss": -25.901386260986328, "global_step": 313114, "epoch": 3772} {"train_loss": -25.753828048706055, "global_step": 313115, "epoch": 3772} {"train_loss": -25.7913761138916, "global_step": 313116, "epoch": 3772} {"train_loss": -26.131696701049805, "global_step": 313117, "epoch": 3772} {"train_loss": -25.904199600219727, "global_step": 313118, "epoch": 3772} {"train_loss": -26.049030303955078, "global_step": 313119, "epoch": 3772} {"train_loss": -25.8565616607666, "global_step": 313120, "epoch": 3772} {"train_loss": -25.603864669799805, "global_step": 313121, "epoch": 3772} {"train_loss": -25.98939323425293, "global_step": 313122, "epoch": 3772} {"train_loss": -25.926420211791992, "global_step": 313123, "epoch": 3772} {"train_loss": -26.107345581054688, "global_step": 313124, "epoch": 3772} {"train_loss": -25.85833168029785, "global_step": 313125, "epoch": 3772} {"train_loss": -25.975818634033203, "global_step": 313126, "epoch": 3772} {"train_loss": -25.984525680541992, "global_step": 313127, "epoch": 3772} {"train_loss": -25.772985458374023, "global_step": 313128, "epoch": 3772} {"train_loss": -25.675939559936523, "global_step": 313129, "epoch": 3772} {"train_loss": -25.520666122436523, "global_step": 313130, "epoch": 3772} {"train_loss": -26.086471557617188, "global_step": 313131, "epoch": 3772} {"train_loss": -25.789581298828125, "global_step": 313132, "epoch": 3772} {"train_loss": -25.506107330322266, "global_step": 313133, "epoch": 3772} {"train_loss": -25.8270206451416, "global_step": 313134, "epoch": 3772} {"train_loss": -25.51470184326172, "global_step": 313135, "epoch": 3772} {"train_loss": -25.660694122314453, "global_step": 313136, "epoch": 3772} {"train_loss": -25.9619197845459, "global_step": 313137, "epoch": 3772} {"train_loss": -26.115985870361328, "global_step": 313138, "epoch": 3772} {"train_loss": -25.64887046813965, "global_step": 313139, "epoch": 3772} {"train_loss": -25.67473793029785, "global_step": 313140, "epoch": 3772} {"train_loss": -25.734426498413086, "global_step": 313141, "epoch": 3772} {"train_loss": -25.816198348999023, "global_step": 313142, "epoch": 3772} {"train_loss": -26.10013771057129, "global_step": 313143, "epoch": 3772} {"train_loss": -25.715940475463867, "global_step": 313144, "epoch": 3772} {"train_loss": -25.439565658569336, "global_step": 313145, "epoch": 3772} {"train_loss": -25.930164337158203, "global_step": 313146, "epoch": 3772} {"train_loss": -25.496417999267578, "global_step": 313147, "epoch": 3772} {"train_loss": -25.335315704345703, "global_step": 313148, "epoch": 3772} {"train_loss": -25.1895751953125, "global_step": 313149, "epoch": 3772} {"train_loss": -25.355554580688477, "global_step": 313150, "epoch": 3772} {"train_loss": -25.475055694580078, "global_step": 313151, "epoch": 3772} {"train_loss": -25.370588302612305, "global_step": 313152, "epoch": 3772} {"train_loss": -25.63031578063965, "global_step": 313153, "epoch": 3772} {"train_loss": -25.27262306213379, "global_step": 313154, "epoch": 3772} {"train_loss": -25.436172485351562, "global_step": 313155, "epoch": 3772} {"train_loss": -25.277334213256836, "global_step": 313156, "epoch": 3772} {"train_loss": -25.668630599975586, "global_step": 313157, "epoch": 3772} {"train_loss": -25.551663387252624, "global_step": 313158, "epoch": 3772, "val_loss": 7218403.0} {"train_loss": -24.644596099853516, "global_step": 313159, "epoch": 3773} {"train_loss": -24.884571075439453, "global_step": 313160, "epoch": 3773} {"train_loss": -24.935697555541992, "global_step": 313161, "epoch": 3773} {"train_loss": -25.14946937561035, "global_step": 313162, "epoch": 3773} {"train_loss": -24.746850967407227, "global_step": 313163, "epoch": 3773} {"train_loss": -25.364856719970703, "global_step": 313164, "epoch": 3773} {"train_loss": -24.815155029296875, "global_step": 313165, "epoch": 3773} {"train_loss": -25.56109046936035, "global_step": 313166, "epoch": 3773} {"train_loss": -24.891510009765625, "global_step": 313167, "epoch": 3773} {"train_loss": -24.939680099487305, "global_step": 313168, "epoch": 3773} {"train_loss": -25.46084213256836, "global_step": 313169, "epoch": 3773} {"train_loss": -25.383647918701172, "global_step": 313170, "epoch": 3773} {"train_loss": -25.272836685180664, "global_step": 313171, "epoch": 3773} {"train_loss": -25.34011459350586, "global_step": 313172, "epoch": 3773} {"train_loss": -25.492183685302734, "global_step": 313173, "epoch": 3773} {"train_loss": -25.546611785888672, "global_step": 313174, "epoch": 3773} {"train_loss": -25.292112350463867, "global_step": 313175, "epoch": 3773} {"train_loss": -25.355960845947266, "global_step": 313176, "epoch": 3773} {"train_loss": -25.270050048828125, "global_step": 313177, "epoch": 3773} {"train_loss": -25.283666610717773, "global_step": 313178, "epoch": 3773} {"train_loss": -25.532438278198242, "global_step": 313179, "epoch": 3773} {"train_loss": -25.48719596862793, "global_step": 313180, "epoch": 3773} {"train_loss": -25.501516342163086, "global_step": 313181, "epoch": 3773} {"train_loss": -25.614850997924805, "global_step": 313182, "epoch": 3773} {"train_loss": -25.382848739624023, "global_step": 313183, "epoch": 3773} {"train_loss": -25.618408203125, "global_step": 313184, "epoch": 3773} {"train_loss": -25.521825790405273, "global_step": 313185, "epoch": 3773} {"train_loss": -25.7047176361084, "global_step": 313186, "epoch": 3773} {"train_loss": -25.161836624145508, "global_step": 313187, "epoch": 3773} {"train_loss": -25.82191276550293, "global_step": 313188, "epoch": 3773} {"train_loss": -25.57741355895996, "global_step": 313189, "epoch": 3773} {"train_loss": -25.678192138671875, "global_step": 313190, "epoch": 3773} {"train_loss": -25.651945114135742, "global_step": 313191, "epoch": 3773} {"train_loss": -25.737186431884766, "global_step": 313192, "epoch": 3773} {"train_loss": -25.1076717376709, "global_step": 313193, "epoch": 3773} {"train_loss": -25.93233299255371, "global_step": 313194, "epoch": 3773} {"train_loss": -25.925962448120117, "global_step": 313195, "epoch": 3773} {"train_loss": -25.6350040435791, "global_step": 313196, "epoch": 3773} {"train_loss": -26.181476593017578, "global_step": 313197, "epoch": 3773} {"train_loss": -25.699445724487305, "global_step": 313198, "epoch": 3773} {"train_loss": -25.78717613220215, "global_step": 313199, "epoch": 3773} {"train_loss": -25.66753578186035, "global_step": 313200, "epoch": 3773} {"train_loss": -25.725570678710938, "global_step": 313201, "epoch": 3773} {"train_loss": -25.71425437927246, "global_step": 313202, "epoch": 3773} {"train_loss": -25.79098892211914, "global_step": 313203, "epoch": 3773} {"train_loss": -25.617511749267578, "global_step": 313204, "epoch": 3773} {"train_loss": -26.064855575561523, "global_step": 313205, "epoch": 3773} {"train_loss": -26.023880004882812, "global_step": 313206, "epoch": 3773} {"train_loss": -25.413267135620117, "global_step": 313207, "epoch": 3773} {"train_loss": -25.7224178314209, "global_step": 313208, "epoch": 3773} {"train_loss": -25.637866973876953, "global_step": 313209, "epoch": 3773} {"train_loss": -25.8659725189209, "global_step": 313210, "epoch": 3773} {"train_loss": -26.075927734375, "global_step": 313211, "epoch": 3773} {"train_loss": -25.640172958374023, "global_step": 313212, "epoch": 3773} {"train_loss": -26.119125366210938, "global_step": 313213, "epoch": 3773} {"train_loss": -25.468557357788086, "global_step": 313214, "epoch": 3773} {"train_loss": -25.63620948791504, "global_step": 313215, "epoch": 3773} {"train_loss": -25.591888427734375, "global_step": 313216, "epoch": 3773} {"train_loss": -25.51242446899414, "global_step": 313217, "epoch": 3773} {"train_loss": -25.920028686523438, "global_step": 313218, "epoch": 3773} {"train_loss": -25.54465103149414, "global_step": 313219, "epoch": 3773} {"train_loss": -25.96591567993164, "global_step": 313220, "epoch": 3773} {"train_loss": -25.927587509155273, "global_step": 313221, "epoch": 3773} {"train_loss": -25.783803939819336, "global_step": 313222, "epoch": 3773} {"train_loss": -25.85322380065918, "global_step": 313223, "epoch": 3773} {"train_loss": -25.807971954345703, "global_step": 313224, "epoch": 3773} {"train_loss": -25.877050399780273, "global_step": 313225, "epoch": 3773} {"train_loss": -25.580148696899414, "global_step": 313226, "epoch": 3773} {"train_loss": -25.466459274291992, "global_step": 313227, "epoch": 3773} {"train_loss": -25.84348487854004, "global_step": 313228, "epoch": 3773} {"train_loss": -25.67288589477539, "global_step": 313229, "epoch": 3773} {"train_loss": -26.0700626373291, "global_step": 313230, "epoch": 3773} {"train_loss": -25.810937881469727, "global_step": 313231, "epoch": 3773} {"train_loss": -25.831323623657227, "global_step": 313232, "epoch": 3773} {"train_loss": -25.899398803710938, "global_step": 313233, "epoch": 3773} {"train_loss": -26.2056941986084, "global_step": 313234, "epoch": 3773} {"train_loss": -25.666025161743164, "global_step": 313235, "epoch": 3773} {"train_loss": -25.787694931030273, "global_step": 313236, "epoch": 3773} {"train_loss": -26.022626876831055, "global_step": 313237, "epoch": 3773} {"train_loss": -25.661474227905273, "global_step": 313238, "epoch": 3773} {"train_loss": -26.001325607299805, "global_step": 313239, "epoch": 3773} {"train_loss": -25.981225967407227, "global_step": 313240, "epoch": 3773} {"train_loss": -25.583411825708595, "global_step": 313241, "epoch": 3773, "val_loss": 7348402.0} {"train_loss": -24.785938262939453, "global_step": 313242, "epoch": 3774} {"train_loss": -24.140012741088867, "global_step": 313243, "epoch": 3774} {"train_loss": -25.170326232910156, "global_step": 313244, "epoch": 3774} {"train_loss": -24.976749420166016, "global_step": 313245, "epoch": 3774} {"train_loss": -24.8275089263916, "global_step": 313246, "epoch": 3774} {"train_loss": -25.11039161682129, "global_step": 313247, "epoch": 3774} {"train_loss": -25.073596954345703, "global_step": 313248, "epoch": 3774} {"train_loss": -25.14116859436035, "global_step": 313249, "epoch": 3774} {"train_loss": -25.348905563354492, "global_step": 313250, "epoch": 3774} {"train_loss": -25.405492782592773, "global_step": 313251, "epoch": 3774} {"train_loss": -25.36144256591797, "global_step": 313252, "epoch": 3774} {"train_loss": -25.114194869995117, "global_step": 313253, "epoch": 3774} {"train_loss": -25.05928611755371, "global_step": 313254, "epoch": 3774} {"train_loss": -25.22883415222168, "global_step": 313255, "epoch": 3774} {"train_loss": -25.453641891479492, "global_step": 313256, "epoch": 3774} {"train_loss": -25.27450942993164, "global_step": 313257, "epoch": 3774} {"train_loss": -25.524181365966797, "global_step": 313258, "epoch": 3774} {"train_loss": -25.61344337463379, "global_step": 313259, "epoch": 3774} {"train_loss": -25.519086837768555, "global_step": 313260, "epoch": 3774} {"train_loss": -25.568906784057617, "global_step": 313261, "epoch": 3774} {"train_loss": -25.31569480895996, "global_step": 313262, "epoch": 3774} {"train_loss": -25.97078514099121, "global_step": 313263, "epoch": 3774} {"train_loss": -25.335603713989258, "global_step": 313264, "epoch": 3774} {"train_loss": -25.79877281188965, "global_step": 313265, "epoch": 3774} {"train_loss": -25.32693099975586, "global_step": 313266, "epoch": 3774} {"train_loss": -25.871793746948242, "global_step": 313267, "epoch": 3774} {"train_loss": -25.591434478759766, "global_step": 313268, "epoch": 3774} {"train_loss": -25.58064079284668, "global_step": 313269, "epoch": 3774} {"train_loss": -25.958621978759766, "global_step": 313270, "epoch": 3774} {"train_loss": -25.4672794342041, "global_step": 313271, "epoch": 3774} {"train_loss": -25.852426528930664, "global_step": 313272, "epoch": 3774} {"train_loss": -25.98555564880371, "global_step": 313273, "epoch": 3774} {"train_loss": -25.484577178955078, "global_step": 313274, "epoch": 3774} {"train_loss": -25.759504318237305, "global_step": 313275, "epoch": 3774} {"train_loss": -26.01742935180664, "global_step": 313276, "epoch": 3774} {"train_loss": -25.930286407470703, "global_step": 313277, "epoch": 3774} {"train_loss": -25.707056045532227, "global_step": 313278, "epoch": 3774} {"train_loss": -25.63553237915039, "global_step": 313279, "epoch": 3774} {"train_loss": -25.6571102142334, "global_step": 313280, "epoch": 3774} {"train_loss": -25.866107940673828, "global_step": 313281, "epoch": 3774} {"train_loss": -25.699859619140625, "global_step": 313282, "epoch": 3774} {"train_loss": -25.639972686767578, "global_step": 313283, "epoch": 3774} {"train_loss": -25.726505279541016, "global_step": 313284, "epoch": 3774} {"train_loss": -25.771718978881836, "global_step": 313285, "epoch": 3774} {"train_loss": -25.69257926940918, "global_step": 313286, "epoch": 3774} {"train_loss": -26.043445587158203, "global_step": 313287, "epoch": 3774} {"train_loss": -25.700763702392578, "global_step": 313288, "epoch": 3774} {"train_loss": -25.945831298828125, "global_step": 313289, "epoch": 3774} {"train_loss": -25.95453453063965, "global_step": 313290, "epoch": 3774} {"train_loss": -26.081151962280273, "global_step": 313291, "epoch": 3774} {"train_loss": -25.517475128173828, "global_step": 313292, "epoch": 3774} {"train_loss": -25.631906509399414, "global_step": 313293, "epoch": 3774} {"train_loss": -25.48002052307129, "global_step": 313294, "epoch": 3774} {"train_loss": -25.797956466674805, "global_step": 313295, "epoch": 3774} {"train_loss": -26.234180450439453, "global_step": 313296, "epoch": 3774} {"train_loss": -25.652570724487305, "global_step": 313297, "epoch": 3774} {"train_loss": -25.763263702392578, "global_step": 313298, "epoch": 3774} {"train_loss": -25.776636123657227, "global_step": 313299, "epoch": 3774} {"train_loss": -25.88741111755371, "global_step": 313300, "epoch": 3774} {"train_loss": -25.95783805847168, "global_step": 313301, "epoch": 3774} {"train_loss": -25.7636775970459, "global_step": 313302, "epoch": 3774} {"train_loss": -25.605756759643555, "global_step": 313303, "epoch": 3774} {"train_loss": -25.805017471313477, "global_step": 313304, "epoch": 3774} {"train_loss": -26.019983291625977, "global_step": 313305, "epoch": 3774} {"train_loss": -25.8651123046875, "global_step": 313306, "epoch": 3774} {"train_loss": -25.77268409729004, "global_step": 313307, "epoch": 3774} {"train_loss": -25.966022491455078, "global_step": 313308, "epoch": 3774} {"train_loss": -26.000732421875, "global_step": 313309, "epoch": 3774} {"train_loss": -25.8592529296875, "global_step": 313310, "epoch": 3774} {"train_loss": -26.132892608642578, "global_step": 313311, "epoch": 3774} {"train_loss": -25.905698776245117, "global_step": 313312, "epoch": 3774} {"train_loss": -25.69904899597168, "global_step": 313313, "epoch": 3774} {"train_loss": -25.49545669555664, "global_step": 313314, "epoch": 3774} {"train_loss": -25.396915435791016, "global_step": 313315, "epoch": 3774} {"train_loss": -25.454736709594727, "global_step": 313316, "epoch": 3774} {"train_loss": -25.83632469177246, "global_step": 313317, "epoch": 3774} {"train_loss": -25.963321685791016, "global_step": 313318, "epoch": 3774} {"train_loss": -25.705636978149414, "global_step": 313319, "epoch": 3774} {"train_loss": -26.169818878173828, "global_step": 313320, "epoch": 3774} {"train_loss": -25.864892959594727, "global_step": 313321, "epoch": 3774} {"train_loss": -25.88449478149414, "global_step": 313322, "epoch": 3774} {"train_loss": -25.87580680847168, "global_step": 313323, "epoch": 3774} {"train_loss": -25.627712387636482, "global_step": 313324, "epoch": 3774, "val_loss": 7284061.5} {"train_loss": -25.62642478942871, "global_step": 313325, "epoch": 3775} {"train_loss": -25.57660484313965, "global_step": 313326, "epoch": 3775} {"train_loss": -25.48674964904785, "global_step": 313327, "epoch": 3775} {"train_loss": -25.52047348022461, "global_step": 313328, "epoch": 3775} {"train_loss": -24.815067291259766, "global_step": 313329, "epoch": 3775} {"train_loss": -25.404470443725586, "global_step": 313330, "epoch": 3775} {"train_loss": -24.794034957885742, "global_step": 313331, "epoch": 3775} {"train_loss": -25.24659538269043, "global_step": 313332, "epoch": 3775} {"train_loss": -24.889760971069336, "global_step": 313333, "epoch": 3775} {"train_loss": -25.20940589904785, "global_step": 313334, "epoch": 3775} {"train_loss": -25.3337345123291, "global_step": 313335, "epoch": 3775} {"train_loss": -25.5363826751709, "global_step": 313336, "epoch": 3775} {"train_loss": -24.9977970123291, "global_step": 313337, "epoch": 3775} {"train_loss": -25.703857421875, "global_step": 313338, "epoch": 3775} {"train_loss": -25.829486846923828, "global_step": 313339, "epoch": 3775} {"train_loss": -25.451507568359375, "global_step": 313340, "epoch": 3775} {"train_loss": -25.733991622924805, "global_step": 313341, "epoch": 3775} {"train_loss": -26.075586318969727, "global_step": 313342, "epoch": 3775} {"train_loss": -25.4877872467041, "global_step": 313343, "epoch": 3775} {"train_loss": -25.644561767578125, "global_step": 313344, "epoch": 3775} {"train_loss": -25.716482162475586, "global_step": 313345, "epoch": 3775} {"train_loss": -25.56494903564453, "global_step": 313346, "epoch": 3775} {"train_loss": -25.622974395751953, "global_step": 313347, "epoch": 3775} {"train_loss": -25.61212158203125, "global_step": 313348, "epoch": 3775} {"train_loss": -25.840805053710938, "global_step": 313349, "epoch": 3775} {"train_loss": -25.58542251586914, "global_step": 313350, "epoch": 3775} {"train_loss": -25.625568389892578, "global_step": 313351, "epoch": 3775} {"train_loss": -25.318851470947266, "global_step": 313352, "epoch": 3775} {"train_loss": -25.57779312133789, "global_step": 313353, "epoch": 3775} {"train_loss": -25.711267471313477, "global_step": 313354, "epoch": 3775} {"train_loss": -25.79905128479004, "global_step": 313355, "epoch": 3775} {"train_loss": -25.587604522705078, "global_step": 313356, "epoch": 3775} {"train_loss": -25.571081161499023, "global_step": 313357, "epoch": 3775} {"train_loss": -25.769392013549805, "global_step": 313358, "epoch": 3775} {"train_loss": -25.62940788269043, "global_step": 313359, "epoch": 3775} {"train_loss": -25.654367446899414, "global_step": 313360, "epoch": 3775} {"train_loss": -25.43851661682129, "global_step": 313361, "epoch": 3775} {"train_loss": -25.764728546142578, "global_step": 313362, "epoch": 3775} {"train_loss": -25.630762100219727, "global_step": 313363, "epoch": 3775} {"train_loss": -25.748844146728516, "global_step": 313364, "epoch": 3775} {"train_loss": -25.657331466674805, "global_step": 313365, "epoch": 3775} {"train_loss": -25.754474639892578, "global_step": 313366, "epoch": 3775} {"train_loss": -25.817285537719727, "global_step": 313367, "epoch": 3775} {"train_loss": -25.712568283081055, "global_step": 313368, "epoch": 3775} {"train_loss": -25.819122314453125, "global_step": 313369, "epoch": 3775} {"train_loss": -25.918121337890625, "global_step": 313370, "epoch": 3775} {"train_loss": -25.580543518066406, "global_step": 313371, "epoch": 3775} {"train_loss": -25.662302017211914, "global_step": 313372, "epoch": 3775} {"train_loss": -25.863662719726562, "global_step": 313373, "epoch": 3775} {"train_loss": -25.97174072265625, "global_step": 313374, "epoch": 3775} {"train_loss": -25.908050537109375, "global_step": 313375, "epoch": 3775} {"train_loss": -25.45881462097168, "global_step": 313376, "epoch": 3775} {"train_loss": -25.71860122680664, "global_step": 313377, "epoch": 3775} {"train_loss": -26.1298770904541, "global_step": 313378, "epoch": 3775} {"train_loss": -25.807531356811523, "global_step": 313379, "epoch": 3775} {"train_loss": -25.33282470703125, "global_step": 313380, "epoch": 3775} {"train_loss": -25.873960494995117, "global_step": 313381, "epoch": 3775} {"train_loss": -25.787275314331055, "global_step": 313382, "epoch": 3775} {"train_loss": -25.29052734375, "global_step": 313383, "epoch": 3775} {"train_loss": -25.744354248046875, "global_step": 313384, "epoch": 3775} {"train_loss": -25.85089111328125, "global_step": 313385, "epoch": 3775} {"train_loss": -25.791034698486328, "global_step": 313386, "epoch": 3775} {"train_loss": -25.937957763671875, "global_step": 313387, "epoch": 3775} {"train_loss": -25.833881378173828, "global_step": 313388, "epoch": 3775} {"train_loss": -25.990400314331055, "global_step": 313389, "epoch": 3775} {"train_loss": -25.6652774810791, "global_step": 313390, "epoch": 3775} {"train_loss": -25.5167293548584, "global_step": 313391, "epoch": 3775} {"train_loss": -25.54804801940918, "global_step": 313392, "epoch": 3775} {"train_loss": -25.419530868530273, "global_step": 313393, "epoch": 3775} {"train_loss": -25.747915267944336, "global_step": 313394, "epoch": 3775} {"train_loss": -25.732105255126953, "global_step": 313395, "epoch": 3775} {"train_loss": -25.444896697998047, "global_step": 313396, "epoch": 3775} {"train_loss": -25.762170791625977, "global_step": 313397, "epoch": 3775} {"train_loss": -25.855487823486328, "global_step": 313398, "epoch": 3775} {"train_loss": -25.596052169799805, "global_step": 313399, "epoch": 3775} {"train_loss": -25.76917839050293, "global_step": 313400, "epoch": 3775} {"train_loss": -25.602466583251953, "global_step": 313401, "epoch": 3775} {"train_loss": -25.891727447509766, "global_step": 313402, "epoch": 3775} {"train_loss": -25.64034080505371, "global_step": 313403, "epoch": 3775} {"train_loss": -25.281248092651367, "global_step": 313404, "epoch": 3775} {"train_loss": -25.6766357421875, "global_step": 313405, "epoch": 3775} {"train_loss": -25.886707305908203, "global_step": 313406, "epoch": 3775} {"train_loss": -25.646666377423756, "global_step": 313407, "epoch": 3775, "val_loss": 7285995.0} {"train_loss": -25.275365829467773, "global_step": 313408, "epoch": 3776} {"train_loss": -25.413440704345703, "global_step": 313409, "epoch": 3776} {"train_loss": -24.88098907470703, "global_step": 313410, "epoch": 3776} {"train_loss": -25.03076934814453, "global_step": 313411, "epoch": 3776} {"train_loss": -25.538557052612305, "global_step": 313412, "epoch": 3776} {"train_loss": -24.713459014892578, "global_step": 313413, "epoch": 3776} {"train_loss": -25.370742797851562, "global_step": 313414, "epoch": 3776} {"train_loss": -25.2402286529541, "global_step": 313415, "epoch": 3776} {"train_loss": -24.94160270690918, "global_step": 313416, "epoch": 3776} {"train_loss": -25.540363311767578, "global_step": 313417, "epoch": 3776} {"train_loss": -25.17795753479004, "global_step": 313418, "epoch": 3776} {"train_loss": -25.52439308166504, "global_step": 313419, "epoch": 3776} {"train_loss": -25.246341705322266, "global_step": 313420, "epoch": 3776} {"train_loss": -25.49103355407715, "global_step": 313421, "epoch": 3776} {"train_loss": -25.6955509185791, "global_step": 313422, "epoch": 3776} {"train_loss": -25.623273849487305, "global_step": 313423, "epoch": 3776} {"train_loss": -25.555078506469727, "global_step": 313424, "epoch": 3776} {"train_loss": -25.378175735473633, "global_step": 313425, "epoch": 3776} {"train_loss": -25.507797241210938, "global_step": 313426, "epoch": 3776} {"train_loss": -25.630294799804688, "global_step": 313427, "epoch": 3776} {"train_loss": -25.82851219177246, "global_step": 313428, "epoch": 3776} {"train_loss": -25.61482048034668, "global_step": 313429, "epoch": 3776} {"train_loss": -25.538116455078125, "global_step": 313430, "epoch": 3776} {"train_loss": -25.290876388549805, "global_step": 313431, "epoch": 3776} {"train_loss": -25.38265037536621, "global_step": 313432, "epoch": 3776} {"train_loss": -25.745086669921875, "global_step": 313433, "epoch": 3776} {"train_loss": -25.91425132751465, "global_step": 313434, "epoch": 3776} {"train_loss": -25.429731369018555, "global_step": 313435, "epoch": 3776} {"train_loss": -25.638092041015625, "global_step": 313436, "epoch": 3776} {"train_loss": -25.696552276611328, "global_step": 313437, "epoch": 3776} {"train_loss": -25.350412368774414, "global_step": 313438, "epoch": 3776} {"train_loss": -25.801435470581055, "global_step": 313439, "epoch": 3776} {"train_loss": -26.001779556274414, "global_step": 313440, "epoch": 3776} {"train_loss": -26.069040298461914, "global_step": 313441, "epoch": 3776} {"train_loss": -25.571609497070312, "global_step": 313442, "epoch": 3776} {"train_loss": -25.769254684448242, "global_step": 313443, "epoch": 3776} {"train_loss": -25.727758407592773, "global_step": 313444, "epoch": 3776} {"train_loss": -26.003870010375977, "global_step": 313445, "epoch": 3776} {"train_loss": -25.847721099853516, "global_step": 313446, "epoch": 3776} {"train_loss": -25.7222957611084, "global_step": 313447, "epoch": 3776} {"train_loss": -26.14470863342285, "global_step": 313448, "epoch": 3776} {"train_loss": -25.786985397338867, "global_step": 313449, "epoch": 3776} {"train_loss": -25.881427764892578, "global_step": 313450, "epoch": 3776} {"train_loss": -25.7329158782959, "global_step": 313451, "epoch": 3776} {"train_loss": -25.81744956970215, "global_step": 313452, "epoch": 3776} {"train_loss": -26.06000328063965, "global_step": 313453, "epoch": 3776} {"train_loss": -26.049457550048828, "global_step": 313454, "epoch": 3776} {"train_loss": -25.894927978515625, "global_step": 313455, "epoch": 3776} {"train_loss": -25.816329956054688, "global_step": 313456, "epoch": 3776} {"train_loss": -26.03714370727539, "global_step": 313457, "epoch": 3776} {"train_loss": -25.919143676757812, "global_step": 313458, "epoch": 3776} {"train_loss": -25.727859497070312, "global_step": 313459, "epoch": 3776} {"train_loss": -25.878040313720703, "global_step": 313460, "epoch": 3776} {"train_loss": -25.965734481811523, "global_step": 313461, "epoch": 3776} {"train_loss": -25.801889419555664, "global_step": 313462, "epoch": 3776} {"train_loss": -25.533222198486328, "global_step": 313463, "epoch": 3776} {"train_loss": -25.411680221557617, "global_step": 313464, "epoch": 3776} {"train_loss": -25.64794921875, "global_step": 313465, "epoch": 3776} {"train_loss": -26.023706436157227, "global_step": 313466, "epoch": 3776} {"train_loss": -25.781982421875, "global_step": 313467, "epoch": 3776} {"train_loss": -25.637720108032227, "global_step": 313468, "epoch": 3776} {"train_loss": -25.860519409179688, "global_step": 313469, "epoch": 3776} {"train_loss": -25.948627471923828, "global_step": 313470, "epoch": 3776} {"train_loss": -25.746185302734375, "global_step": 313471, "epoch": 3776} {"train_loss": -26.017744064331055, "global_step": 313472, "epoch": 3776} {"train_loss": -26.092573165893555, "global_step": 313473, "epoch": 3776} {"train_loss": -25.328067779541016, "global_step": 313474, "epoch": 3776} {"train_loss": -25.577116012573242, "global_step": 313475, "epoch": 3776} {"train_loss": -25.601011276245117, "global_step": 313476, "epoch": 3776} {"train_loss": -25.82012939453125, "global_step": 313477, "epoch": 3776} {"train_loss": -25.64740562438965, "global_step": 313478, "epoch": 3776} {"train_loss": -26.120153427124023, "global_step": 313479, "epoch": 3776} {"train_loss": -25.781299591064453, "global_step": 313480, "epoch": 3776} {"train_loss": -25.815656661987305, "global_step": 313481, "epoch": 3776} {"train_loss": -25.600482940673828, "global_step": 313482, "epoch": 3776} {"train_loss": -25.36832618713379, "global_step": 313483, "epoch": 3776} {"train_loss": -25.99176597595215, "global_step": 313484, "epoch": 3776} {"train_loss": -26.271154403686523, "global_step": 313485, "epoch": 3776} {"train_loss": -25.931238174438477, "global_step": 313486, "epoch": 3776} {"train_loss": -25.916223526000977, "global_step": 313487, "epoch": 3776} {"train_loss": -25.79839515686035, "global_step": 313488, "epoch": 3776} {"train_loss": -25.773290634155273, "global_step": 313489, "epoch": 3776} {"train_loss": -25.677257078239716, "global_step": 313490, "epoch": 3776, "val_loss": 7251053.0} {"train_loss": -25.16623878479004, "global_step": 313491, "epoch": 3777} {"train_loss": -25.598453521728516, "global_step": 313492, "epoch": 3777} {"train_loss": -25.639286041259766, "global_step": 313493, "epoch": 3777} {"train_loss": -25.388795852661133, "global_step": 313494, "epoch": 3777} {"train_loss": -25.17656707763672, "global_step": 313495, "epoch": 3777} {"train_loss": -25.375835418701172, "global_step": 313496, "epoch": 3777} {"train_loss": -25.208641052246094, "global_step": 313497, "epoch": 3777} {"train_loss": -25.441089630126953, "global_step": 313498, "epoch": 3777} {"train_loss": -25.621652603149414, "global_step": 313499, "epoch": 3777} {"train_loss": -25.721149444580078, "global_step": 313500, "epoch": 3777} {"train_loss": -25.803808212280273, "global_step": 313501, "epoch": 3777} {"train_loss": -25.727115631103516, "global_step": 313502, "epoch": 3777} {"train_loss": -25.725427627563477, "global_step": 313503, "epoch": 3777} {"train_loss": -25.380704879760742, "global_step": 313504, "epoch": 3777} {"train_loss": -25.787912368774414, "global_step": 313505, "epoch": 3777} {"train_loss": -25.66190528869629, "global_step": 313506, "epoch": 3777} {"train_loss": -25.605005264282227, "global_step": 313507, "epoch": 3777} {"train_loss": -25.788137435913086, "global_step": 313508, "epoch": 3777} {"train_loss": -26.022953033447266, "global_step": 313509, "epoch": 3777} {"train_loss": -26.12872314453125, "global_step": 313510, "epoch": 3777} {"train_loss": -25.90395164489746, "global_step": 313511, "epoch": 3777} {"train_loss": -26.014087677001953, "global_step": 313512, "epoch": 3777} {"train_loss": -25.901935577392578, "global_step": 313513, "epoch": 3777} {"train_loss": -25.686933517456055, "global_step": 313514, "epoch": 3777} {"train_loss": -26.112472534179688, "global_step": 313515, "epoch": 3777} {"train_loss": -25.72193717956543, "global_step": 313516, "epoch": 3777} {"train_loss": -25.86201286315918, "global_step": 313517, "epoch": 3777} {"train_loss": -25.718219757080078, "global_step": 313518, "epoch": 3777} {"train_loss": -26.20978355407715, "global_step": 313519, "epoch": 3777} {"train_loss": -25.937707901000977, "global_step": 313520, "epoch": 3777} {"train_loss": -26.22125816345215, "global_step": 313521, "epoch": 3777} {"train_loss": -25.957120895385742, "global_step": 313522, "epoch": 3777} {"train_loss": -26.04176139831543, "global_step": 313523, "epoch": 3777} {"train_loss": -26.219709396362305, "global_step": 313524, "epoch": 3777} {"train_loss": -25.8841495513916, "global_step": 313525, "epoch": 3777} {"train_loss": -26.177478790283203, "global_step": 313526, "epoch": 3777} {"train_loss": -25.70847511291504, "global_step": 313527, "epoch": 3777} {"train_loss": -25.846466064453125, "global_step": 313528, "epoch": 3777} {"train_loss": -25.83832359313965, "global_step": 313529, "epoch": 3777} {"train_loss": -25.974706649780273, "global_step": 313530, "epoch": 3777} {"train_loss": -25.800262451171875, "global_step": 313531, "epoch": 3777} {"train_loss": -26.038043975830078, "global_step": 313532, "epoch": 3777} {"train_loss": -25.490142822265625, "global_step": 313533, "epoch": 3777} {"train_loss": -25.67835807800293, "global_step": 313534, "epoch": 3777} {"train_loss": -26.3653621673584, "global_step": 313535, "epoch": 3777} {"train_loss": -25.4998722076416, "global_step": 313536, "epoch": 3777} {"train_loss": -25.391157150268555, "global_step": 313537, "epoch": 3777} {"train_loss": -24.18891716003418, "global_step": 313538, "epoch": 3777} {"train_loss": -20.798479080200195, "global_step": 313539, "epoch": 3777} {"train_loss": -23.62979507446289, "global_step": 313540, "epoch": 3777} {"train_loss": -25.233917236328125, "global_step": 313541, "epoch": 3777} {"train_loss": -25.02231216430664, "global_step": 313542, "epoch": 3777} {"train_loss": -25.00435447692871, "global_step": 313543, "epoch": 3777} {"train_loss": -24.969240188598633, "global_step": 313544, "epoch": 3777} {"train_loss": -24.722576141357422, "global_step": 313545, "epoch": 3777} {"train_loss": -25.294004440307617, "global_step": 313546, "epoch": 3777} {"train_loss": -25.195714950561523, "global_step": 313547, "epoch": 3777} {"train_loss": -25.348506927490234, "global_step": 313548, "epoch": 3777} {"train_loss": -25.54560661315918, "global_step": 313549, "epoch": 3777} {"train_loss": -25.39338493347168, "global_step": 313550, "epoch": 3777} {"train_loss": -25.345266342163086, "global_step": 313551, "epoch": 3777} {"train_loss": -25.08285140991211, "global_step": 313552, "epoch": 3777} {"train_loss": -25.27452850341797, "global_step": 313553, "epoch": 3777} {"train_loss": -25.05982208251953, "global_step": 313554, "epoch": 3777} {"train_loss": -25.33302879333496, "global_step": 313555, "epoch": 3777} {"train_loss": -25.0435848236084, "global_step": 313556, "epoch": 3777} {"train_loss": -25.488744735717773, "global_step": 313557, "epoch": 3777} {"train_loss": -25.34528160095215, "global_step": 313558, "epoch": 3777} {"train_loss": -25.253578186035156, "global_step": 313559, "epoch": 3777} {"train_loss": -25.58698844909668, "global_step": 313560, "epoch": 3777} {"train_loss": -25.6473445892334, "global_step": 313561, "epoch": 3777} {"train_loss": -25.473831176757812, "global_step": 313562, "epoch": 3777} {"train_loss": -25.059879302978516, "global_step": 313563, "epoch": 3777} {"train_loss": -25.35733985900879, "global_step": 313564, "epoch": 3777} {"train_loss": -25.994428634643555, "global_step": 313565, "epoch": 3777} {"train_loss": -25.424118041992188, "global_step": 313566, "epoch": 3777} {"train_loss": -25.48874855041504, "global_step": 313567, "epoch": 3777} {"train_loss": -25.540979385375977, "global_step": 313568, "epoch": 3777} {"train_loss": -25.94935417175293, "global_step": 313569, "epoch": 3777} {"train_loss": -25.275405883789062, "global_step": 313570, "epoch": 3777} {"train_loss": -25.81650733947754, "global_step": 313571, "epoch": 3777} {"train_loss": -25.585737228393555, "global_step": 313572, "epoch": 3777} {"train_loss": -25.49746644353292, "global_step": 313573, "epoch": 3777, "val_loss": 7197757.0} {"train_loss": -25.308542251586914, "global_step": 313574, "epoch": 3778} {"train_loss": -25.617507934570312, "global_step": 313575, "epoch": 3778} {"train_loss": -25.466293334960938, "global_step": 313576, "epoch": 3778} {"train_loss": -25.366357803344727, "global_step": 313577, "epoch": 3778} {"train_loss": -25.808130264282227, "global_step": 313578, "epoch": 3778} {"train_loss": -25.56985092163086, "global_step": 313579, "epoch": 3778} {"train_loss": -25.50290298461914, "global_step": 313580, "epoch": 3778} {"train_loss": -25.765928268432617, "global_step": 313581, "epoch": 3778} {"train_loss": -25.731201171875, "global_step": 313582, "epoch": 3778} {"train_loss": -25.38158416748047, "global_step": 313583, "epoch": 3778} {"train_loss": -25.64887809753418, "global_step": 313584, "epoch": 3778} {"train_loss": -25.93283462524414, "global_step": 313585, "epoch": 3778} {"train_loss": -25.54841423034668, "global_step": 313586, "epoch": 3778} {"train_loss": -26.25800895690918, "global_step": 313587, "epoch": 3778} {"train_loss": -25.858753204345703, "global_step": 313588, "epoch": 3778} {"train_loss": -25.943817138671875, "global_step": 313589, "epoch": 3778} {"train_loss": -25.77229118347168, "global_step": 313590, "epoch": 3778} {"train_loss": -26.1888484954834, "global_step": 313591, "epoch": 3778} {"train_loss": -25.674030303955078, "global_step": 313592, "epoch": 3778} {"train_loss": -25.896780014038086, "global_step": 313593, "epoch": 3778} {"train_loss": -25.790119171142578, "global_step": 313594, "epoch": 3778} {"train_loss": -25.98453712463379, "global_step": 313595, "epoch": 3778} {"train_loss": -26.21088981628418, "global_step": 313596, "epoch": 3778} {"train_loss": -25.796051025390625, "global_step": 313597, "epoch": 3778} {"train_loss": -25.6738338470459, "global_step": 313598, "epoch": 3778} {"train_loss": -26.005414962768555, "global_step": 313599, "epoch": 3778} {"train_loss": -26.032758712768555, "global_step": 313600, "epoch": 3778} {"train_loss": -25.927961349487305, "global_step": 313601, "epoch": 3778} {"train_loss": -25.88966178894043, "global_step": 313602, "epoch": 3778} {"train_loss": -25.4610538482666, "global_step": 313603, "epoch": 3778} {"train_loss": -26.116931915283203, "global_step": 313604, "epoch": 3778} {"train_loss": -25.769392013549805, "global_step": 313605, "epoch": 3778} {"train_loss": -25.946630477905273, "global_step": 313606, "epoch": 3778} {"train_loss": -26.157007217407227, "global_step": 313607, "epoch": 3778} {"train_loss": -25.8687686920166, "global_step": 313608, "epoch": 3778} {"train_loss": -26.169355392456055, "global_step": 313609, "epoch": 3778} {"train_loss": -26.075946807861328, "global_step": 313610, "epoch": 3778} {"train_loss": -26.08711051940918, "global_step": 313611, "epoch": 3778} {"train_loss": -25.93301773071289, "global_step": 313612, "epoch": 3778} {"train_loss": -25.934545516967773, "global_step": 313613, "epoch": 3778} {"train_loss": -25.579532623291016, "global_step": 313614, "epoch": 3778} {"train_loss": -26.222991943359375, "global_step": 313615, "epoch": 3778} {"train_loss": -25.9370174407959, "global_step": 313616, "epoch": 3778} {"train_loss": -25.750213623046875, "global_step": 313617, "epoch": 3778} {"train_loss": -26.089834213256836, "global_step": 313618, "epoch": 3778} {"train_loss": -25.914392471313477, "global_step": 313619, "epoch": 3778} {"train_loss": -26.008874893188477, "global_step": 313620, "epoch": 3778} {"train_loss": -25.66170310974121, "global_step": 313621, "epoch": 3778} {"train_loss": -25.6630802154541, "global_step": 313622, "epoch": 3778} {"train_loss": -25.733911514282227, "global_step": 313623, "epoch": 3778} {"train_loss": -25.680368423461914, "global_step": 313624, "epoch": 3778} {"train_loss": -25.738927841186523, "global_step": 313625, "epoch": 3778} {"train_loss": -25.363134384155273, "global_step": 313626, "epoch": 3778} {"train_loss": -25.802244186401367, "global_step": 313627, "epoch": 3778} {"train_loss": -25.91997718811035, "global_step": 313628, "epoch": 3778} {"train_loss": -25.808286666870117, "global_step": 313629, "epoch": 3778} {"train_loss": -25.595548629760742, "global_step": 313630, "epoch": 3778} {"train_loss": -25.838260650634766, "global_step": 313631, "epoch": 3778} {"train_loss": -25.524993896484375, "global_step": 313632, "epoch": 3778} {"train_loss": -25.78883171081543, "global_step": 313633, "epoch": 3778} {"train_loss": -26.053787231445312, "global_step": 313634, "epoch": 3778} {"train_loss": -25.78755760192871, "global_step": 313635, "epoch": 3778} {"train_loss": -25.942626953125, "global_step": 313636, "epoch": 3778} {"train_loss": -25.91961097717285, "global_step": 313637, "epoch": 3778} {"train_loss": -25.48414421081543, "global_step": 313638, "epoch": 3778} {"train_loss": -25.830108642578125, "global_step": 313639, "epoch": 3778} {"train_loss": -26.221088409423828, "global_step": 313640, "epoch": 3778} {"train_loss": -25.891462326049805, "global_step": 313641, "epoch": 3778} {"train_loss": -26.035058975219727, "global_step": 313642, "epoch": 3778} {"train_loss": -25.665552139282227, "global_step": 313643, "epoch": 3778} {"train_loss": -25.58896827697754, "global_step": 313644, "epoch": 3778} {"train_loss": -25.692258834838867, "global_step": 313645, "epoch": 3778} {"train_loss": -26.030149459838867, "global_step": 313646, "epoch": 3778} {"train_loss": -26.05695152282715, "global_step": 313647, "epoch": 3778} {"train_loss": -25.631322860717773, "global_step": 313648, "epoch": 3778} {"train_loss": -25.869810104370117, "global_step": 313649, "epoch": 3778} {"train_loss": -25.85638999938965, "global_step": 313650, "epoch": 3778} {"train_loss": -25.81914710998535, "global_step": 313651, "epoch": 3778} {"train_loss": -25.67213249206543, "global_step": 313652, "epoch": 3778} {"train_loss": -25.58624839782715, "global_step": 313653, "epoch": 3778} {"train_loss": -26.514245986938477, "global_step": 313654, "epoch": 3778} {"train_loss": -25.78350257873535, "global_step": 313655, "epoch": 3778} {"train_loss": -25.838286641132402, "global_step": 313656, "epoch": 3778, "val_loss": 7283251.0} {"train_loss": -23.672815322875977, "global_step": 313657, "epoch": 3779} {"train_loss": -25.005084991455078, "global_step": 313658, "epoch": 3779} {"train_loss": -24.809776306152344, "global_step": 313659, "epoch": 3779} {"train_loss": -24.869050979614258, "global_step": 313660, "epoch": 3779} {"train_loss": -24.841886520385742, "global_step": 313661, "epoch": 3779} {"train_loss": -25.322650909423828, "global_step": 313662, "epoch": 3779} {"train_loss": -24.86884117126465, "global_step": 313663, "epoch": 3779} {"train_loss": -25.103958129882812, "global_step": 313664, "epoch": 3779} {"train_loss": -25.306814193725586, "global_step": 313665, "epoch": 3779} {"train_loss": -25.073179244995117, "global_step": 313666, "epoch": 3779} {"train_loss": -25.039562225341797, "global_step": 313667, "epoch": 3779} {"train_loss": -25.050939559936523, "global_step": 313668, "epoch": 3779} {"train_loss": -25.480392456054688, "global_step": 313669, "epoch": 3779} {"train_loss": -25.141809463500977, "global_step": 313670, "epoch": 3779} {"train_loss": -25.045820236206055, "global_step": 313671, "epoch": 3779} {"train_loss": -25.321508407592773, "global_step": 313672, "epoch": 3779} {"train_loss": -25.247730255126953, "global_step": 313673, "epoch": 3779} {"train_loss": -24.946264266967773, "global_step": 313674, "epoch": 3779} {"train_loss": -25.379108428955078, "global_step": 313675, "epoch": 3779} {"train_loss": -25.172292709350586, "global_step": 313676, "epoch": 3779} {"train_loss": -25.29538917541504, "global_step": 313677, "epoch": 3779} {"train_loss": -25.338178634643555, "global_step": 313678, "epoch": 3779} {"train_loss": -25.106674194335938, "global_step": 313679, "epoch": 3779} {"train_loss": -25.59108543395996, "global_step": 313680, "epoch": 3779} {"train_loss": -25.271352767944336, "global_step": 313681, "epoch": 3779} {"train_loss": -25.360309600830078, "global_step": 313682, "epoch": 3779} {"train_loss": -25.738431930541992, "global_step": 313683, "epoch": 3779} {"train_loss": -25.70020866394043, "global_step": 313684, "epoch": 3779} {"train_loss": -25.60381507873535, "global_step": 313685, "epoch": 3779} {"train_loss": -25.47933578491211, "global_step": 313686, "epoch": 3779} {"train_loss": -25.840656280517578, "global_step": 313687, "epoch": 3779} {"train_loss": -25.953168869018555, "global_step": 313688, "epoch": 3779} {"train_loss": -25.54240608215332, "global_step": 313689, "epoch": 3779} {"train_loss": -25.86627769470215, "global_step": 313690, "epoch": 3779} {"train_loss": -25.716882705688477, "global_step": 313691, "epoch": 3779} {"train_loss": -25.557769775390625, "global_step": 313692, "epoch": 3779} {"train_loss": -25.606464385986328, "global_step": 313693, "epoch": 3779} {"train_loss": -25.541423797607422, "global_step": 313694, "epoch": 3779} {"train_loss": -26.002227783203125, "global_step": 313695, "epoch": 3779} {"train_loss": -25.451786041259766, "global_step": 313696, "epoch": 3779} {"train_loss": -25.762649536132812, "global_step": 313697, "epoch": 3779} {"train_loss": -26.041248321533203, "global_step": 313698, "epoch": 3779} {"train_loss": -25.86630630493164, "global_step": 313699, "epoch": 3779} {"train_loss": -25.668792724609375, "global_step": 313700, "epoch": 3779} {"train_loss": -25.631855010986328, "global_step": 313701, "epoch": 3779} {"train_loss": -25.452972412109375, "global_step": 313702, "epoch": 3779} {"train_loss": -26.089019775390625, "global_step": 313703, "epoch": 3779} {"train_loss": -26.156076431274414, "global_step": 313704, "epoch": 3779} {"train_loss": -26.13248634338379, "global_step": 313705, "epoch": 3779} {"train_loss": -25.865583419799805, "global_step": 313706, "epoch": 3779} {"train_loss": -25.858121871948242, "global_step": 313707, "epoch": 3779} {"train_loss": -25.66019058227539, "global_step": 313708, "epoch": 3779} {"train_loss": -25.6639347076416, "global_step": 313709, "epoch": 3779} {"train_loss": -25.578754425048828, "global_step": 313710, "epoch": 3779} {"train_loss": -25.988412857055664, "global_step": 313711, "epoch": 3779} {"train_loss": -25.858112335205078, "global_step": 313712, "epoch": 3779} {"train_loss": -25.76901626586914, "global_step": 313713, "epoch": 3779} {"train_loss": -25.739883422851562, "global_step": 313714, "epoch": 3779} {"train_loss": -25.753585815429688, "global_step": 313715, "epoch": 3779} {"train_loss": -25.7650089263916, "global_step": 313716, "epoch": 3779} {"train_loss": -26.08980369567871, "global_step": 313717, "epoch": 3779} {"train_loss": -26.026269912719727, "global_step": 313718, "epoch": 3779} {"train_loss": -25.757658004760742, "global_step": 313719, "epoch": 3779} {"train_loss": -25.69584083557129, "global_step": 313720, "epoch": 3779} {"train_loss": -25.71381187438965, "global_step": 313721, "epoch": 3779} {"train_loss": -25.723920822143555, "global_step": 313722, "epoch": 3779} {"train_loss": -25.93806266784668, "global_step": 313723, "epoch": 3779} {"train_loss": -25.75701332092285, "global_step": 313724, "epoch": 3779} {"train_loss": -25.83514404296875, "global_step": 313725, "epoch": 3779} {"train_loss": -25.843931198120117, "global_step": 313726, "epoch": 3779} {"train_loss": -25.89373207092285, "global_step": 313727, "epoch": 3779} {"train_loss": -25.79730224609375, "global_step": 313728, "epoch": 3779} {"train_loss": -25.903690338134766, "global_step": 313729, "epoch": 3779} {"train_loss": -25.868494033813477, "global_step": 313730, "epoch": 3779} {"train_loss": -25.999557495117188, "global_step": 313731, "epoch": 3779} {"train_loss": -25.715330123901367, "global_step": 313732, "epoch": 3779} {"train_loss": -25.740942001342773, "global_step": 313733, "epoch": 3779} {"train_loss": -25.71803855895996, "global_step": 313734, "epoch": 3779} {"train_loss": -25.99256706237793, "global_step": 313735, "epoch": 3779} {"train_loss": -25.94716453552246, "global_step": 313736, "epoch": 3779} {"train_loss": -25.499324798583984, "global_step": 313737, "epoch": 3779} {"train_loss": -25.744291305541992, "global_step": 313738, "epoch": 3779} {"train_loss": -25.555869251848705, "global_step": 313739, "epoch": 3779, "val_loss": 7191264.0} {"train_loss": -25.60196876525879, "global_step": 313740, "epoch": 3780} {"train_loss": -25.353906631469727, "global_step": 313741, "epoch": 3780} {"train_loss": -24.47719955444336, "global_step": 313742, "epoch": 3780} {"train_loss": -24.61627769470215, "global_step": 313743, "epoch": 3780} {"train_loss": -25.439350128173828, "global_step": 313744, "epoch": 3780} {"train_loss": -24.51888656616211, "global_step": 313745, "epoch": 3780} {"train_loss": -23.96486473083496, "global_step": 313746, "epoch": 3780} {"train_loss": -25.15709114074707, "global_step": 313747, "epoch": 3780} {"train_loss": -25.334543228149414, "global_step": 313748, "epoch": 3780} {"train_loss": -25.126873016357422, "global_step": 313749, "epoch": 3780} {"train_loss": -25.592397689819336, "global_step": 313750, "epoch": 3780} {"train_loss": -25.674793243408203, "global_step": 313751, "epoch": 3780} {"train_loss": -25.45131492614746, "global_step": 313752, "epoch": 3780} {"train_loss": -25.337034225463867, "global_step": 313753, "epoch": 3780} {"train_loss": -25.296329498291016, "global_step": 313754, "epoch": 3780} {"train_loss": -25.444894790649414, "global_step": 313755, "epoch": 3780} {"train_loss": -25.23525047302246, "global_step": 313756, "epoch": 3780} {"train_loss": -25.330543518066406, "global_step": 313757, "epoch": 3780} {"train_loss": -25.64755630493164, "global_step": 313758, "epoch": 3780} {"train_loss": -25.626188278198242, "global_step": 313759, "epoch": 3780} {"train_loss": -25.5526180267334, "global_step": 313760, "epoch": 3780} {"train_loss": -25.334430694580078, "global_step": 313761, "epoch": 3780} {"train_loss": -25.559946060180664, "global_step": 313762, "epoch": 3780} {"train_loss": -25.44697380065918, "global_step": 313763, "epoch": 3780} {"train_loss": -25.489776611328125, "global_step": 313764, "epoch": 3780} {"train_loss": -25.592304229736328, "global_step": 313765, "epoch": 3780} {"train_loss": -25.55585289001465, "global_step": 313766, "epoch": 3780} {"train_loss": -25.498477935791016, "global_step": 313767, "epoch": 3780} {"train_loss": -25.73978042602539, "global_step": 313768, "epoch": 3780} {"train_loss": -25.733551025390625, "global_step": 313769, "epoch": 3780} {"train_loss": -25.80243492126465, "global_step": 313770, "epoch": 3780} {"train_loss": -25.86163902282715, "global_step": 313771, "epoch": 3780} {"train_loss": -25.79119300842285, "global_step": 313772, "epoch": 3780} {"train_loss": -25.832563400268555, "global_step": 313773, "epoch": 3780} {"train_loss": -25.459125518798828, "global_step": 313774, "epoch": 3780} {"train_loss": -25.59053611755371, "global_step": 313775, "epoch": 3780} {"train_loss": -25.693235397338867, "global_step": 313776, "epoch": 3780} {"train_loss": -25.792606353759766, "global_step": 313777, "epoch": 3780} {"train_loss": -25.8264102935791, "global_step": 313778, "epoch": 3780} {"train_loss": -26.064453125, "global_step": 313779, "epoch": 3780} {"train_loss": -25.759241104125977, "global_step": 313780, "epoch": 3780} {"train_loss": -26.462467193603516, "global_step": 313781, "epoch": 3780} {"train_loss": -25.914443969726562, "global_step": 313782, "epoch": 3780} {"train_loss": -25.898147583007812, "global_step": 313783, "epoch": 3780} {"train_loss": -25.899688720703125, "global_step": 313784, "epoch": 3780} {"train_loss": -25.693485260009766, "global_step": 313785, "epoch": 3780} {"train_loss": -26.0993709564209, "global_step": 313786, "epoch": 3780} {"train_loss": -25.619604110717773, "global_step": 313787, "epoch": 3780} {"train_loss": -25.45304298400879, "global_step": 313788, "epoch": 3780} {"train_loss": -25.87739372253418, "global_step": 313789, "epoch": 3780} {"train_loss": -26.017728805541992, "global_step": 313790, "epoch": 3780} {"train_loss": -26.086383819580078, "global_step": 313791, "epoch": 3780} {"train_loss": -25.82850456237793, "global_step": 313792, "epoch": 3780} {"train_loss": -25.994009017944336, "global_step": 313793, "epoch": 3780} {"train_loss": -25.9126033782959, "global_step": 313794, "epoch": 3780} {"train_loss": -26.112945556640625, "global_step": 313795, "epoch": 3780} {"train_loss": -25.977340698242188, "global_step": 313796, "epoch": 3780} {"train_loss": -25.692779541015625, "global_step": 313797, "epoch": 3780} {"train_loss": -25.912525177001953, "global_step": 313798, "epoch": 3780} {"train_loss": -26.114171981811523, "global_step": 313799, "epoch": 3780} {"train_loss": -26.02662467956543, "global_step": 313800, "epoch": 3780} {"train_loss": -25.964740753173828, "global_step": 313801, "epoch": 3780} {"train_loss": -25.962879180908203, "global_step": 313802, "epoch": 3780} {"train_loss": -26.234220504760742, "global_step": 313803, "epoch": 3780} {"train_loss": -26.093948364257812, "global_step": 313804, "epoch": 3780} {"train_loss": -26.374530792236328, "global_step": 313805, "epoch": 3780} {"train_loss": -25.75481605529785, "global_step": 313806, "epoch": 3780} {"train_loss": -25.995824813842773, "global_step": 313807, "epoch": 3780} {"train_loss": -25.981433868408203, "global_step": 313808, "epoch": 3780} {"train_loss": -25.73659324645996, "global_step": 313809, "epoch": 3780} {"train_loss": -25.824054718017578, "global_step": 313810, "epoch": 3780} {"train_loss": -26.24041175842285, "global_step": 313811, "epoch": 3780} {"train_loss": -25.58194923400879, "global_step": 313812, "epoch": 3780} {"train_loss": -24.93982696533203, "global_step": 313813, "epoch": 3780} {"train_loss": -25.014686584472656, "global_step": 313814, "epoch": 3780} {"train_loss": -25.12334442138672, "global_step": 313815, "epoch": 3780} {"train_loss": -25.713586807250977, "global_step": 313816, "epoch": 3780} {"train_loss": -25.749332427978516, "global_step": 313817, "epoch": 3780} {"train_loss": -25.321516036987305, "global_step": 313818, "epoch": 3780} {"train_loss": -25.07451629638672, "global_step": 313819, "epoch": 3780} {"train_loss": -25.507688522338867, "global_step": 313820, "epoch": 3780} {"train_loss": -25.439437866210938, "global_step": 313821, "epoch": 3780} {"train_loss": -25.62753029329231, "global_step": 313822, "epoch": 3780, "val_loss": 7203705.0} {"train_loss": -25.368873596191406, "global_step": 313823, "epoch": 3781} {"train_loss": -24.84916114807129, "global_step": 313824, "epoch": 3781} {"train_loss": -25.32540512084961, "global_step": 313825, "epoch": 3781} {"train_loss": -24.9630069732666, "global_step": 313826, "epoch": 3781} {"train_loss": -24.836122512817383, "global_step": 313827, "epoch": 3781} {"train_loss": -25.195592880249023, "global_step": 313828, "epoch": 3781} {"train_loss": -25.26629638671875, "global_step": 313829, "epoch": 3781} {"train_loss": -25.322832107543945, "global_step": 313830, "epoch": 3781} {"train_loss": -25.25855827331543, "global_step": 313831, "epoch": 3781} {"train_loss": -25.55108642578125, "global_step": 313832, "epoch": 3781} {"train_loss": -25.500957489013672, "global_step": 313833, "epoch": 3781} {"train_loss": -25.181848526000977, "global_step": 313834, "epoch": 3781} {"train_loss": -25.809661865234375, "global_step": 313835, "epoch": 3781} {"train_loss": -25.501951217651367, "global_step": 313836, "epoch": 3781} {"train_loss": -25.556875228881836, "global_step": 313837, "epoch": 3781} {"train_loss": -25.285615921020508, "global_step": 313838, "epoch": 3781} {"train_loss": -25.35577964782715, "global_step": 313839, "epoch": 3781} {"train_loss": -25.747732162475586, "global_step": 313840, "epoch": 3781} {"train_loss": -25.731901168823242, "global_step": 313841, "epoch": 3781} {"train_loss": -25.33936882019043, "global_step": 313842, "epoch": 3781} {"train_loss": -25.549240112304688, "global_step": 313843, "epoch": 3781} {"train_loss": -25.661590576171875, "global_step": 313844, "epoch": 3781} {"train_loss": -25.846607208251953, "global_step": 313845, "epoch": 3781} {"train_loss": -26.043365478515625, "global_step": 313846, "epoch": 3781} {"train_loss": -25.876562118530273, "global_step": 313847, "epoch": 3781} {"train_loss": -25.777875900268555, "global_step": 313848, "epoch": 3781} {"train_loss": -25.440061569213867, "global_step": 313849, "epoch": 3781} {"train_loss": -25.7801570892334, "global_step": 313850, "epoch": 3781} {"train_loss": -25.740692138671875, "global_step": 313851, "epoch": 3781} {"train_loss": -25.58339500427246, "global_step": 313852, "epoch": 3781} {"train_loss": -26.085865020751953, "global_step": 313853, "epoch": 3781} {"train_loss": -25.933149337768555, "global_step": 313854, "epoch": 3781} {"train_loss": -25.739856719970703, "global_step": 313855, "epoch": 3781} {"train_loss": -26.05620765686035, "global_step": 313856, "epoch": 3781} {"train_loss": -25.9647216796875, "global_step": 313857, "epoch": 3781} {"train_loss": -25.83237648010254, "global_step": 313858, "epoch": 3781} {"train_loss": -26.0274600982666, "global_step": 313859, "epoch": 3781} {"train_loss": -25.749679565429688, "global_step": 313860, "epoch": 3781} {"train_loss": -25.67695426940918, "global_step": 313861, "epoch": 3781} {"train_loss": -25.856616973876953, "global_step": 313862, "epoch": 3781} {"train_loss": -25.99445152282715, "global_step": 313863, "epoch": 3781} {"train_loss": -25.558853149414062, "global_step": 313864, "epoch": 3781} {"train_loss": -25.46463966369629, "global_step": 313865, "epoch": 3781} {"train_loss": -25.999094009399414, "global_step": 313866, "epoch": 3781} {"train_loss": -25.876306533813477, "global_step": 313867, "epoch": 3781} {"train_loss": -25.657236099243164, "global_step": 313868, "epoch": 3781} {"train_loss": -26.193485260009766, "global_step": 313869, "epoch": 3781} {"train_loss": -25.833234786987305, "global_step": 313870, "epoch": 3781} {"train_loss": -25.359914779663086, "global_step": 313871, "epoch": 3781} {"train_loss": -25.932998657226562, "global_step": 313872, "epoch": 3781} {"train_loss": -25.76239585876465, "global_step": 313873, "epoch": 3781} {"train_loss": -25.85871696472168, "global_step": 313874, "epoch": 3781} {"train_loss": -26.106504440307617, "global_step": 313875, "epoch": 3781} {"train_loss": -25.675817489624023, "global_step": 313876, "epoch": 3781} {"train_loss": -25.984891891479492, "global_step": 313877, "epoch": 3781} {"train_loss": -25.697662353515625, "global_step": 313878, "epoch": 3781} {"train_loss": -25.458627700805664, "global_step": 313879, "epoch": 3781} {"train_loss": -25.866498947143555, "global_step": 313880, "epoch": 3781} {"train_loss": -25.52128028869629, "global_step": 313881, "epoch": 3781} {"train_loss": -25.86337661743164, "global_step": 313882, "epoch": 3781} {"train_loss": -25.98872947692871, "global_step": 313883, "epoch": 3781} {"train_loss": -25.985986709594727, "global_step": 313884, "epoch": 3781} {"train_loss": -25.97767448425293, "global_step": 313885, "epoch": 3781} {"train_loss": -25.585590362548828, "global_step": 313886, "epoch": 3781} {"train_loss": -26.1131591796875, "global_step": 313887, "epoch": 3781} {"train_loss": -25.78656578063965, "global_step": 313888, "epoch": 3781} {"train_loss": -26.081298828125, "global_step": 313889, "epoch": 3781} {"train_loss": -25.7236270904541, "global_step": 313890, "epoch": 3781} {"train_loss": -25.8109188079834, "global_step": 313891, "epoch": 3781} {"train_loss": -25.52764892578125, "global_step": 313892, "epoch": 3781} {"train_loss": -26.113035202026367, "global_step": 313893, "epoch": 3781} {"train_loss": -26.066247940063477, "global_step": 313894, "epoch": 3781} {"train_loss": -25.7371826171875, "global_step": 313895, "epoch": 3781} {"train_loss": -26.12714958190918, "global_step": 313896, "epoch": 3781} {"train_loss": -26.132537841796875, "global_step": 313897, "epoch": 3781} {"train_loss": -26.364439010620117, "global_step": 313898, "epoch": 3781} {"train_loss": -26.0091609954834, "global_step": 313899, "epoch": 3781} {"train_loss": -25.771398544311523, "global_step": 313900, "epoch": 3781} {"train_loss": -25.7066593170166, "global_step": 313901, "epoch": 3781} {"train_loss": -25.75098991394043, "global_step": 313902, "epoch": 3781} {"train_loss": -26.116668701171875, "global_step": 313903, "epoch": 3781} {"train_loss": -25.901945114135742, "global_step": 313904, "epoch": 3781} {"train_loss": -25.746370361511964, "global_step": 313905, "epoch": 3781, "val_loss": 7275034.5} {"train_loss": -24.502119064331055, "global_step": 313906, "epoch": 3782} {"train_loss": -23.428281784057617, "global_step": 313907, "epoch": 3782} {"train_loss": -23.583024978637695, "global_step": 313908, "epoch": 3782} {"train_loss": -24.5098819732666, "global_step": 313909, "epoch": 3782} {"train_loss": -24.488021850585938, "global_step": 313910, "epoch": 3782} {"train_loss": -24.605756759643555, "global_step": 313911, "epoch": 3782} {"train_loss": -24.638526916503906, "global_step": 313912, "epoch": 3782} {"train_loss": -25.34166717529297, "global_step": 313913, "epoch": 3782} {"train_loss": -25.44506072998047, "global_step": 313914, "epoch": 3782} {"train_loss": -25.07814598083496, "global_step": 313915, "epoch": 3782} {"train_loss": -25.27406883239746, "global_step": 313916, "epoch": 3782} {"train_loss": -25.28484535217285, "global_step": 313917, "epoch": 3782} {"train_loss": -25.300539016723633, "global_step": 313918, "epoch": 3782} {"train_loss": -25.13104248046875, "global_step": 313919, "epoch": 3782} {"train_loss": -25.4122371673584, "global_step": 313920, "epoch": 3782} {"train_loss": -25.442529678344727, "global_step": 313921, "epoch": 3782} {"train_loss": -25.4304141998291, "global_step": 313922, "epoch": 3782} {"train_loss": -25.3878231048584, "global_step": 313923, "epoch": 3782} {"train_loss": -25.233097076416016, "global_step": 313924, "epoch": 3782} {"train_loss": -25.763174057006836, "global_step": 313925, "epoch": 3782} {"train_loss": -25.766708374023438, "global_step": 313926, "epoch": 3782} {"train_loss": -25.528409957885742, "global_step": 313927, "epoch": 3782} {"train_loss": -25.3316650390625, "global_step": 313928, "epoch": 3782} {"train_loss": -25.2591552734375, "global_step": 313929, "epoch": 3782} {"train_loss": -25.455459594726562, "global_step": 313930, "epoch": 3782} {"train_loss": -25.295591354370117, "global_step": 313931, "epoch": 3782} {"train_loss": -25.63882827758789, "global_step": 313932, "epoch": 3782} {"train_loss": -25.866363525390625, "global_step": 313933, "epoch": 3782} {"train_loss": -25.74774169921875, "global_step": 313934, "epoch": 3782} {"train_loss": -25.64539909362793, "global_step": 313935, "epoch": 3782} {"train_loss": -25.543357849121094, "global_step": 313936, "epoch": 3782} {"train_loss": -25.873098373413086, "global_step": 313937, "epoch": 3782} {"train_loss": -25.675464630126953, "global_step": 313938, "epoch": 3782} {"train_loss": -25.585206985473633, "global_step": 313939, "epoch": 3782} {"train_loss": -25.481613159179688, "global_step": 313940, "epoch": 3782} {"train_loss": -25.33711051940918, "global_step": 313941, "epoch": 3782} {"train_loss": -25.888843536376953, "global_step": 313942, "epoch": 3782} {"train_loss": -25.91971778869629, "global_step": 313943, "epoch": 3782} {"train_loss": -25.656660079956055, "global_step": 313944, "epoch": 3782} {"train_loss": -25.90386962890625, "global_step": 313945, "epoch": 3782} {"train_loss": -25.960147857666016, "global_step": 313946, "epoch": 3782} {"train_loss": -26.0279541015625, "global_step": 313947, "epoch": 3782} {"train_loss": -25.96573257446289, "global_step": 313948, "epoch": 3782} {"train_loss": -26.247303009033203, "global_step": 313949, "epoch": 3782} {"train_loss": -26.306110382080078, "global_step": 313950, "epoch": 3782} {"train_loss": -25.82086753845215, "global_step": 313951, "epoch": 3782} {"train_loss": -25.678791046142578, "global_step": 313952, "epoch": 3782} {"train_loss": -25.769229888916016, "global_step": 313953, "epoch": 3782} {"train_loss": -26.259206771850586, "global_step": 313954, "epoch": 3782} {"train_loss": -25.842618942260742, "global_step": 313955, "epoch": 3782} {"train_loss": -26.085912704467773, "global_step": 313956, "epoch": 3782} {"train_loss": -26.075397491455078, "global_step": 313957, "epoch": 3782} {"train_loss": -26.029218673706055, "global_step": 313958, "epoch": 3782} {"train_loss": -26.019155502319336, "global_step": 313959, "epoch": 3782} {"train_loss": -25.73114013671875, "global_step": 313960, "epoch": 3782} {"train_loss": -25.484661102294922, "global_step": 313961, "epoch": 3782} {"train_loss": -25.8418025970459, "global_step": 313962, "epoch": 3782} {"train_loss": -25.816614151000977, "global_step": 313963, "epoch": 3782} {"train_loss": -25.943078994750977, "global_step": 313964, "epoch": 3782} {"train_loss": -25.37042808532715, "global_step": 313965, "epoch": 3782} {"train_loss": -26.031965255737305, "global_step": 313966, "epoch": 3782} {"train_loss": -25.709552764892578, "global_step": 313967, "epoch": 3782} {"train_loss": -26.2097110748291, "global_step": 313968, "epoch": 3782} {"train_loss": -25.985639572143555, "global_step": 313969, "epoch": 3782} {"train_loss": -26.277606964111328, "global_step": 313970, "epoch": 3782} {"train_loss": -25.941503524780273, "global_step": 313971, "epoch": 3782} {"train_loss": -25.445764541625977, "global_step": 313972, "epoch": 3782} {"train_loss": -25.80978775024414, "global_step": 313973, "epoch": 3782} {"train_loss": -25.817670822143555, "global_step": 313974, "epoch": 3782} {"train_loss": -25.605438232421875, "global_step": 313975, "epoch": 3782} {"train_loss": -25.66390037536621, "global_step": 313976, "epoch": 3782} {"train_loss": -25.663461685180664, "global_step": 313977, "epoch": 3782} {"train_loss": -25.85603141784668, "global_step": 313978, "epoch": 3782} {"train_loss": -25.704212188720703, "global_step": 313979, "epoch": 3782} {"train_loss": -25.89276123046875, "global_step": 313980, "epoch": 3782} {"train_loss": -26.02997398376465, "global_step": 313981, "epoch": 3782} {"train_loss": -25.87005615234375, "global_step": 313982, "epoch": 3782} {"train_loss": -25.91668701171875, "global_step": 313983, "epoch": 3782} {"train_loss": -25.679920196533203, "global_step": 313984, "epoch": 3782} {"train_loss": -26.085525512695312, "global_step": 313985, "epoch": 3782} {"train_loss": -25.769384384155273, "global_step": 313986, "epoch": 3782} {"train_loss": -25.748071670532227, "global_step": 313987, "epoch": 3782} {"train_loss": -25.60363151366452, "global_step": 313988, "epoch": 3782, "val_loss": 7223695.0} {"train_loss": -25.08510398864746, "global_step": 313989, "epoch": 3783} {"train_loss": -25.62692642211914, "global_step": 313990, "epoch": 3783} {"train_loss": -25.262508392333984, "global_step": 313991, "epoch": 3783} {"train_loss": -25.61384391784668, "global_step": 313992, "epoch": 3783} {"train_loss": -25.434921264648438, "global_step": 313993, "epoch": 3783} {"train_loss": -25.661575317382812, "global_step": 313994, "epoch": 3783} {"train_loss": -25.516826629638672, "global_step": 313995, "epoch": 3783} {"train_loss": -25.43393325805664, "global_step": 313996, "epoch": 3783} {"train_loss": -25.223081588745117, "global_step": 313997, "epoch": 3783} {"train_loss": -25.241987228393555, "global_step": 313998, "epoch": 3783} {"train_loss": -25.758752822875977, "global_step": 313999, "epoch": 3783} {"train_loss": -25.253061294555664, "global_step": 314000, "epoch": 3783} {"train_loss": -25.23640251159668, "global_step": 314001, "epoch": 3783} {"train_loss": -25.689855575561523, "global_step": 314002, "epoch": 3783} {"train_loss": -25.37482261657715, "global_step": 314003, "epoch": 3783} {"train_loss": -25.595687866210938, "global_step": 314004, "epoch": 3783} {"train_loss": -25.57257652282715, "global_step": 314005, "epoch": 3783} {"train_loss": -26.010684967041016, "global_step": 314006, "epoch": 3783} {"train_loss": -25.81546401977539, "global_step": 314007, "epoch": 3783} {"train_loss": -25.41046905517578, "global_step": 314008, "epoch": 3783} {"train_loss": -25.4835262298584, "global_step": 314009, "epoch": 3783} {"train_loss": -25.495145797729492, "global_step": 314010, "epoch": 3783} {"train_loss": -25.878360748291016, "global_step": 314011, "epoch": 3783} {"train_loss": -25.690855026245117, "global_step": 314012, "epoch": 3783} {"train_loss": -26.10902976989746, "global_step": 314013, "epoch": 3783} {"train_loss": -25.786550521850586, "global_step": 314014, "epoch": 3783} {"train_loss": -25.514596939086914, "global_step": 314015, "epoch": 3783} {"train_loss": -25.337310791015625, "global_step": 314016, "epoch": 3783} {"train_loss": -25.787988662719727, "global_step": 314017, "epoch": 3783} {"train_loss": -25.817182540893555, "global_step": 314018, "epoch": 3783} {"train_loss": -25.770587921142578, "global_step": 314019, "epoch": 3783} {"train_loss": -25.899478912353516, "global_step": 314020, "epoch": 3783} {"train_loss": -25.798633575439453, "global_step": 314021, "epoch": 3783} {"train_loss": -25.75434684753418, "global_step": 314022, "epoch": 3783} {"train_loss": -25.936044692993164, "global_step": 314023, "epoch": 3783} {"train_loss": -25.96003532409668, "global_step": 314024, "epoch": 3783} {"train_loss": -26.106130599975586, "global_step": 314025, "epoch": 3783} {"train_loss": -25.583742141723633, "global_step": 314026, "epoch": 3783} {"train_loss": -25.857595443725586, "global_step": 314027, "epoch": 3783} {"train_loss": -26.304433822631836, "global_step": 314028, "epoch": 3783} {"train_loss": -25.77545738220215, "global_step": 314029, "epoch": 3783} {"train_loss": -26.1395263671875, "global_step": 314030, "epoch": 3783} {"train_loss": -25.8990421295166, "global_step": 314031, "epoch": 3783} {"train_loss": -26.215499877929688, "global_step": 314032, "epoch": 3783} {"train_loss": -25.777780532836914, "global_step": 314033, "epoch": 3783} {"train_loss": -25.850805282592773, "global_step": 314034, "epoch": 3783} {"train_loss": -25.86895179748535, "global_step": 314035, "epoch": 3783} {"train_loss": -25.305816650390625, "global_step": 314036, "epoch": 3783} {"train_loss": -24.96027946472168, "global_step": 314037, "epoch": 3783} {"train_loss": -25.165658950805664, "global_step": 314038, "epoch": 3783} {"train_loss": -26.149145126342773, "global_step": 314039, "epoch": 3783} {"train_loss": -25.79391860961914, "global_step": 314040, "epoch": 3783} {"train_loss": -25.515714645385742, "global_step": 314041, "epoch": 3783} {"train_loss": -26.155736923217773, "global_step": 314042, "epoch": 3783} {"train_loss": -25.737091064453125, "global_step": 314043, "epoch": 3783} {"train_loss": -25.355314254760742, "global_step": 314044, "epoch": 3783} {"train_loss": -25.8255615234375, "global_step": 314045, "epoch": 3783} {"train_loss": -25.64987564086914, "global_step": 314046, "epoch": 3783} {"train_loss": -25.53888511657715, "global_step": 314047, "epoch": 3783} {"train_loss": -25.987457275390625, "global_step": 314048, "epoch": 3783} {"train_loss": -25.765100479125977, "global_step": 314049, "epoch": 3783} {"train_loss": -25.54670524597168, "global_step": 314050, "epoch": 3783} {"train_loss": -25.866424560546875, "global_step": 314051, "epoch": 3783} {"train_loss": -25.418825149536133, "global_step": 314052, "epoch": 3783} {"train_loss": -25.916418075561523, "global_step": 314053, "epoch": 3783} {"train_loss": -26.175506591796875, "global_step": 314054, "epoch": 3783} {"train_loss": -25.447391510009766, "global_step": 314055, "epoch": 3783} {"train_loss": -25.811941146850586, "global_step": 314056, "epoch": 3783} {"train_loss": -25.705591201782227, "global_step": 314057, "epoch": 3783} {"train_loss": -25.49582290649414, "global_step": 314058, "epoch": 3783} {"train_loss": -25.366357803344727, "global_step": 314059, "epoch": 3783} {"train_loss": -25.246658325195312, "global_step": 314060, "epoch": 3783} {"train_loss": -25.904449462890625, "global_step": 314061, "epoch": 3783} {"train_loss": -26.407978057861328, "global_step": 314062, "epoch": 3783} {"train_loss": -25.65498161315918, "global_step": 314063, "epoch": 3783} {"train_loss": -26.106473922729492, "global_step": 314064, "epoch": 3783} {"train_loss": -25.880035400390625, "global_step": 314065, "epoch": 3783} {"train_loss": -25.573598861694336, "global_step": 314066, "epoch": 3783} {"train_loss": -26.041309356689453, "global_step": 314067, "epoch": 3783} {"train_loss": -25.749608993530273, "global_step": 314068, "epoch": 3783} {"train_loss": -25.648679733276367, "global_step": 314069, "epoch": 3783} {"train_loss": -25.96915626525879, "global_step": 314070, "epoch": 3783} {"train_loss": -25.69794634164098, "global_step": 314071, "epoch": 3783, "val_loss": 7260881.0} {"train_loss": -24.924909591674805, "global_step": 314072, "epoch": 3784} {"train_loss": -24.616436004638672, "global_step": 314073, "epoch": 3784} {"train_loss": -25.39850425720215, "global_step": 314074, "epoch": 3784} {"train_loss": -25.352720260620117, "global_step": 314075, "epoch": 3784} {"train_loss": -25.35999870300293, "global_step": 314076, "epoch": 3784} {"train_loss": -24.869617462158203, "global_step": 314077, "epoch": 3784} {"train_loss": -25.537769317626953, "global_step": 314078, "epoch": 3784} {"train_loss": -25.480127334594727, "global_step": 314079, "epoch": 3784} {"train_loss": -25.27351951599121, "global_step": 314080, "epoch": 3784} {"train_loss": -25.576162338256836, "global_step": 314081, "epoch": 3784} {"train_loss": -25.058298110961914, "global_step": 314082, "epoch": 3784} {"train_loss": -25.498708724975586, "global_step": 314083, "epoch": 3784} {"train_loss": -25.83949851989746, "global_step": 314084, "epoch": 3784} {"train_loss": -25.642688751220703, "global_step": 314085, "epoch": 3784} {"train_loss": -25.488544464111328, "global_step": 314086, "epoch": 3784} {"train_loss": -25.582550048828125, "global_step": 314087, "epoch": 3784} {"train_loss": -25.749408721923828, "global_step": 314088, "epoch": 3784} {"train_loss": -25.2432918548584, "global_step": 314089, "epoch": 3784} {"train_loss": -25.630084991455078, "global_step": 314090, "epoch": 3784} {"train_loss": -25.405738830566406, "global_step": 314091, "epoch": 3784} {"train_loss": -25.370962142944336, "global_step": 314092, "epoch": 3784} {"train_loss": -26.013778686523438, "global_step": 314093, "epoch": 3784} {"train_loss": -25.601362228393555, "global_step": 314094, "epoch": 3784} {"train_loss": -25.39755630493164, "global_step": 314095, "epoch": 3784} {"train_loss": -25.57759666442871, "global_step": 314096, "epoch": 3784} {"train_loss": -26.052038192749023, "global_step": 314097, "epoch": 3784} {"train_loss": -25.910444259643555, "global_step": 314098, "epoch": 3784} {"train_loss": -25.84356117248535, "global_step": 314099, "epoch": 3784} {"train_loss": -25.632675170898438, "global_step": 314100, "epoch": 3784} {"train_loss": -25.75710105895996, "global_step": 314101, "epoch": 3784} {"train_loss": -25.49148941040039, "global_step": 314102, "epoch": 3784} {"train_loss": -25.87203025817871, "global_step": 314103, "epoch": 3784} {"train_loss": -25.99286460876465, "global_step": 314104, "epoch": 3784} {"train_loss": -25.633289337158203, "global_step": 314105, "epoch": 3784} {"train_loss": -26.28750991821289, "global_step": 314106, "epoch": 3784} {"train_loss": -25.85999870300293, "global_step": 314107, "epoch": 3784} {"train_loss": -25.929428100585938, "global_step": 314108, "epoch": 3784} {"train_loss": -25.658538818359375, "global_step": 314109, "epoch": 3784} {"train_loss": -25.796430587768555, "global_step": 314110, "epoch": 3784} {"train_loss": -25.992084503173828, "global_step": 314111, "epoch": 3784} {"train_loss": -26.269651412963867, "global_step": 314112, "epoch": 3784} {"train_loss": -25.68794059753418, "global_step": 314113, "epoch": 3784} {"train_loss": -25.96877098083496, "global_step": 314114, "epoch": 3784} {"train_loss": -25.659931182861328, "global_step": 314115, "epoch": 3784} {"train_loss": -26.064428329467773, "global_step": 314116, "epoch": 3784} {"train_loss": -25.996448516845703, "global_step": 314117, "epoch": 3784} {"train_loss": -25.86200523376465, "global_step": 314118, "epoch": 3784} {"train_loss": -26.147674560546875, "global_step": 314119, "epoch": 3784} {"train_loss": -25.97870445251465, "global_step": 314120, "epoch": 3784} {"train_loss": -25.9058895111084, "global_step": 314121, "epoch": 3784} {"train_loss": -26.131683349609375, "global_step": 314122, "epoch": 3784} {"train_loss": -26.172409057617188, "global_step": 314123, "epoch": 3784} {"train_loss": -25.995834350585938, "global_step": 314124, "epoch": 3784} {"train_loss": -25.95795249938965, "global_step": 314125, "epoch": 3784} {"train_loss": -26.426435470581055, "global_step": 314126, "epoch": 3784} {"train_loss": -26.074689865112305, "global_step": 314127, "epoch": 3784} {"train_loss": -26.170629501342773, "global_step": 314128, "epoch": 3784} {"train_loss": -26.078489303588867, "global_step": 314129, "epoch": 3784} {"train_loss": -25.267385482788086, "global_step": 314130, "epoch": 3784} {"train_loss": -26.0594425201416, "global_step": 314131, "epoch": 3784} {"train_loss": -25.720060348510742, "global_step": 314132, "epoch": 3784} {"train_loss": -25.789770126342773, "global_step": 314133, "epoch": 3784} {"train_loss": -25.730518341064453, "global_step": 314134, "epoch": 3784} {"train_loss": -26.260818481445312, "global_step": 314135, "epoch": 3784} {"train_loss": -25.50122833251953, "global_step": 314136, "epoch": 3784} {"train_loss": -26.087133407592773, "global_step": 314137, "epoch": 3784} {"train_loss": -25.346866607666016, "global_step": 314138, "epoch": 3784} {"train_loss": -25.030302047729492, "global_step": 314139, "epoch": 3784} {"train_loss": -25.574506759643555, "global_step": 314140, "epoch": 3784} {"train_loss": -25.784473419189453, "global_step": 314141, "epoch": 3784} {"train_loss": -25.438400268554688, "global_step": 314142, "epoch": 3784} {"train_loss": -25.596744537353516, "global_step": 314143, "epoch": 3784} {"train_loss": -25.609411239624023, "global_step": 314144, "epoch": 3784} {"train_loss": -25.714248657226562, "global_step": 314145, "epoch": 3784} {"train_loss": -25.5762882232666, "global_step": 314146, "epoch": 3784} {"train_loss": -25.90631103515625, "global_step": 314147, "epoch": 3784} {"train_loss": -25.945770263671875, "global_step": 314148, "epoch": 3784} {"train_loss": -25.475095748901367, "global_step": 314149, "epoch": 3784} {"train_loss": -25.40765380859375, "global_step": 314150, "epoch": 3784} {"train_loss": -25.50845718383789, "global_step": 314151, "epoch": 3784} {"train_loss": -25.10049819946289, "global_step": 314152, "epoch": 3784} {"train_loss": -25.76519203186035, "global_step": 314153, "epoch": 3784} {"train_loss": -25.69545180539051, "global_step": 314154, "epoch": 3784, "val_loss": 7265318.5} {"train_loss": -25.52149772644043, "global_step": 314155, "epoch": 3785} {"train_loss": -25.60230827331543, "global_step": 314156, "epoch": 3785} {"train_loss": -25.488191604614258, "global_step": 314157, "epoch": 3785} {"train_loss": -25.67588233947754, "global_step": 314158, "epoch": 3785} {"train_loss": -25.446821212768555, "global_step": 314159, "epoch": 3785} {"train_loss": -25.4318790435791, "global_step": 314160, "epoch": 3785} {"train_loss": -25.50469970703125, "global_step": 314161, "epoch": 3785} {"train_loss": -25.545303344726562, "global_step": 314162, "epoch": 3785} {"train_loss": -25.461536407470703, "global_step": 314163, "epoch": 3785} {"train_loss": -25.46050453186035, "global_step": 314164, "epoch": 3785} {"train_loss": -25.740793228149414, "global_step": 314165, "epoch": 3785} {"train_loss": -25.37395668029785, "global_step": 314166, "epoch": 3785} {"train_loss": -25.599590301513672, "global_step": 314167, "epoch": 3785} {"train_loss": -25.627765655517578, "global_step": 314168, "epoch": 3785} {"train_loss": -25.592382431030273, "global_step": 314169, "epoch": 3785} {"train_loss": -25.802148818969727, "global_step": 314170, "epoch": 3785} {"train_loss": -25.501361846923828, "global_step": 314171, "epoch": 3785} {"train_loss": -25.39696502685547, "global_step": 314172, "epoch": 3785} {"train_loss": -25.810998916625977, "global_step": 314173, "epoch": 3785} {"train_loss": -25.769168853759766, "global_step": 314174, "epoch": 3785} {"train_loss": -25.200559616088867, "global_step": 314175, "epoch": 3785} {"train_loss": -26.04608154296875, "global_step": 314176, "epoch": 3785} {"train_loss": -25.890607833862305, "global_step": 314177, "epoch": 3785} {"train_loss": -25.780719757080078, "global_step": 314178, "epoch": 3785} {"train_loss": -25.49977684020996, "global_step": 314179, "epoch": 3785} {"train_loss": -25.53249168395996, "global_step": 314180, "epoch": 3785} {"train_loss": -25.7179012298584, "global_step": 314181, "epoch": 3785} {"train_loss": -25.989526748657227, "global_step": 314182, "epoch": 3785} {"train_loss": -25.90359878540039, "global_step": 314183, "epoch": 3785} {"train_loss": -25.641345977783203, "global_step": 314184, "epoch": 3785} {"train_loss": -26.00071144104004, "global_step": 314185, "epoch": 3785} {"train_loss": -25.934701919555664, "global_step": 314186, "epoch": 3785} {"train_loss": -25.607839584350586, "global_step": 314187, "epoch": 3785} {"train_loss": -25.678180694580078, "global_step": 314188, "epoch": 3785} {"train_loss": -25.842472076416016, "global_step": 314189, "epoch": 3785} {"train_loss": -25.724985122680664, "global_step": 314190, "epoch": 3785} {"train_loss": -25.810522079467773, "global_step": 314191, "epoch": 3785} {"train_loss": -25.886219024658203, "global_step": 314192, "epoch": 3785} {"train_loss": -25.78704833984375, "global_step": 314193, "epoch": 3785} {"train_loss": -25.853864669799805, "global_step": 314194, "epoch": 3785} {"train_loss": -25.56679344177246, "global_step": 314195, "epoch": 3785} {"train_loss": -25.8658390045166, "global_step": 314196, "epoch": 3785} {"train_loss": -25.95343589782715, "global_step": 314197, "epoch": 3785} {"train_loss": -25.57754898071289, "global_step": 314198, "epoch": 3785} {"train_loss": -25.49964714050293, "global_step": 314199, "epoch": 3785} {"train_loss": -25.34262466430664, "global_step": 314200, "epoch": 3785} {"train_loss": -25.737707138061523, "global_step": 314201, "epoch": 3785} {"train_loss": -25.87787437438965, "global_step": 314202, "epoch": 3785} {"train_loss": -26.019947052001953, "global_step": 314203, "epoch": 3785} {"train_loss": -25.656604766845703, "global_step": 314204, "epoch": 3785} {"train_loss": -26.033447265625, "global_step": 314205, "epoch": 3785} {"train_loss": -26.1016788482666, "global_step": 314206, "epoch": 3785} {"train_loss": -25.738134384155273, "global_step": 314207, "epoch": 3785} {"train_loss": -25.428455352783203, "global_step": 314208, "epoch": 3785} {"train_loss": -26.19464683532715, "global_step": 314209, "epoch": 3785} {"train_loss": -26.00239372253418, "global_step": 314210, "epoch": 3785} {"train_loss": -25.925006866455078, "global_step": 314211, "epoch": 3785} {"train_loss": -26.00381851196289, "global_step": 314212, "epoch": 3785} {"train_loss": -25.718435287475586, "global_step": 314213, "epoch": 3785} {"train_loss": -25.750751495361328, "global_step": 314214, "epoch": 3785} {"train_loss": -26.33563804626465, "global_step": 314215, "epoch": 3785} {"train_loss": -25.850128173828125, "global_step": 314216, "epoch": 3785} {"train_loss": -25.6656494140625, "global_step": 314217, "epoch": 3785} {"train_loss": -26.034381866455078, "global_step": 314218, "epoch": 3785} {"train_loss": -25.73095703125, "global_step": 314219, "epoch": 3785} {"train_loss": -25.701711654663086, "global_step": 314220, "epoch": 3785} {"train_loss": -25.7481746673584, "global_step": 314221, "epoch": 3785} {"train_loss": -25.975875854492188, "global_step": 314222, "epoch": 3785} {"train_loss": -26.011173248291016, "global_step": 314223, "epoch": 3785} {"train_loss": -25.915311813354492, "global_step": 314224, "epoch": 3785} {"train_loss": -25.49287986755371, "global_step": 314225, "epoch": 3785} {"train_loss": -25.717910766601562, "global_step": 314226, "epoch": 3785} {"train_loss": -26.012853622436523, "global_step": 314227, "epoch": 3785} {"train_loss": -25.293752670288086, "global_step": 314228, "epoch": 3785} {"train_loss": -26.055387496948242, "global_step": 314229, "epoch": 3785} {"train_loss": -25.330514907836914, "global_step": 314230, "epoch": 3785} {"train_loss": -25.89519691467285, "global_step": 314231, "epoch": 3785} {"train_loss": -25.740066528320312, "global_step": 314232, "epoch": 3785} {"train_loss": -25.67274284362793, "global_step": 314233, "epoch": 3785} {"train_loss": -25.5474910736084, "global_step": 314234, "epoch": 3785} {"train_loss": -25.92521095275879, "global_step": 314235, "epoch": 3785} {"train_loss": -25.785364151000977, "global_step": 314236, "epoch": 3785} {"train_loss": -25.730249060205665, "global_step": 314237, "epoch": 3785, "val_loss": 7309502.0} {"train_loss": -25.086841583251953, "global_step": 314238, "epoch": 3786} {"train_loss": -23.684425354003906, "global_step": 314239, "epoch": 3786} {"train_loss": -23.02126693725586, "global_step": 314240, "epoch": 3786} {"train_loss": -25.125608444213867, "global_step": 314241, "epoch": 3786} {"train_loss": -24.48543357849121, "global_step": 314242, "epoch": 3786} {"train_loss": -24.773998260498047, "global_step": 314243, "epoch": 3786} {"train_loss": -24.477781295776367, "global_step": 314244, "epoch": 3786} {"train_loss": -25.199262619018555, "global_step": 314245, "epoch": 3786} {"train_loss": -24.52687644958496, "global_step": 314246, "epoch": 3786} {"train_loss": -24.854217529296875, "global_step": 314247, "epoch": 3786} {"train_loss": -25.039628982543945, "global_step": 314248, "epoch": 3786} {"train_loss": -24.851415634155273, "global_step": 314249, "epoch": 3786} {"train_loss": -24.592397689819336, "global_step": 314250, "epoch": 3786} {"train_loss": -25.24973487854004, "global_step": 314251, "epoch": 3786} {"train_loss": -25.2402400970459, "global_step": 314252, "epoch": 3786} {"train_loss": -24.81831169128418, "global_step": 314253, "epoch": 3786} {"train_loss": -25.198843002319336, "global_step": 314254, "epoch": 3786} {"train_loss": -25.139142990112305, "global_step": 314255, "epoch": 3786} {"train_loss": -25.36696434020996, "global_step": 314256, "epoch": 3786} {"train_loss": -25.05169105529785, "global_step": 314257, "epoch": 3786} {"train_loss": -25.1325740814209, "global_step": 314258, "epoch": 3786} {"train_loss": -25.28431510925293, "global_step": 314259, "epoch": 3786} {"train_loss": -25.26189613342285, "global_step": 314260, "epoch": 3786} {"train_loss": -25.326719284057617, "global_step": 314261, "epoch": 3786} {"train_loss": -25.60601234436035, "global_step": 314262, "epoch": 3786} {"train_loss": -25.5636043548584, "global_step": 314263, "epoch": 3786} {"train_loss": -25.43377113342285, "global_step": 314264, "epoch": 3786} {"train_loss": -25.79669761657715, "global_step": 314265, "epoch": 3786} {"train_loss": -25.37520408630371, "global_step": 314266, "epoch": 3786} {"train_loss": -25.201383590698242, "global_step": 314267, "epoch": 3786} {"train_loss": -25.693771362304688, "global_step": 314268, "epoch": 3786} {"train_loss": -25.326858520507812, "global_step": 314269, "epoch": 3786} {"train_loss": -25.357160568237305, "global_step": 314270, "epoch": 3786} {"train_loss": -25.460081100463867, "global_step": 314271, "epoch": 3786} {"train_loss": -25.56031608581543, "global_step": 314272, "epoch": 3786} {"train_loss": -25.549673080444336, "global_step": 314273, "epoch": 3786} {"train_loss": -25.271183013916016, "global_step": 314274, "epoch": 3786} {"train_loss": -25.854694366455078, "global_step": 314275, "epoch": 3786} {"train_loss": -25.53541374206543, "global_step": 314276, "epoch": 3786} {"train_loss": -25.744613647460938, "global_step": 314277, "epoch": 3786} {"train_loss": -25.665525436401367, "global_step": 314278, "epoch": 3786} {"train_loss": -25.898427963256836, "global_step": 314279, "epoch": 3786} {"train_loss": -25.716535568237305, "global_step": 314280, "epoch": 3786} {"train_loss": -25.672941207885742, "global_step": 314281, "epoch": 3786} {"train_loss": -25.626020431518555, "global_step": 314282, "epoch": 3786} {"train_loss": -25.9002742767334, "global_step": 314283, "epoch": 3786} {"train_loss": -26.074878692626953, "global_step": 314284, "epoch": 3786} {"train_loss": -25.703201293945312, "global_step": 314285, "epoch": 3786} {"train_loss": -26.012500762939453, "global_step": 314286, "epoch": 3786} {"train_loss": -26.11909294128418, "global_step": 314287, "epoch": 3786} {"train_loss": -25.996826171875, "global_step": 314288, "epoch": 3786} {"train_loss": -25.81119155883789, "global_step": 314289, "epoch": 3786} {"train_loss": -25.81145668029785, "global_step": 314290, "epoch": 3786} {"train_loss": -25.922245025634766, "global_step": 314291, "epoch": 3786} {"train_loss": -25.751483917236328, "global_step": 314292, "epoch": 3786} {"train_loss": -26.25446128845215, "global_step": 314293, "epoch": 3786} {"train_loss": -25.8520450592041, "global_step": 314294, "epoch": 3786} {"train_loss": -26.05259132385254, "global_step": 314295, "epoch": 3786} {"train_loss": -25.940637588500977, "global_step": 314296, "epoch": 3786} {"train_loss": -25.549537658691406, "global_step": 314297, "epoch": 3786} {"train_loss": -25.9556884765625, "global_step": 314298, "epoch": 3786} {"train_loss": -26.075281143188477, "global_step": 314299, "epoch": 3786} {"train_loss": -25.685895919799805, "global_step": 314300, "epoch": 3786} {"train_loss": -26.068073272705078, "global_step": 314301, "epoch": 3786} {"train_loss": -25.752405166625977, "global_step": 314302, "epoch": 3786} {"train_loss": -25.8808536529541, "global_step": 314303, "epoch": 3786} {"train_loss": -26.206872940063477, "global_step": 314304, "epoch": 3786} {"train_loss": -26.110177993774414, "global_step": 314305, "epoch": 3786} {"train_loss": -25.8698673248291, "global_step": 314306, "epoch": 3786} {"train_loss": -26.081663131713867, "global_step": 314307, "epoch": 3786} {"train_loss": -26.232770919799805, "global_step": 314308, "epoch": 3786} {"train_loss": -25.90899085998535, "global_step": 314309, "epoch": 3786} {"train_loss": -25.735736846923828, "global_step": 314310, "epoch": 3786} {"train_loss": -26.107349395751953, "global_step": 314311, "epoch": 3786} {"train_loss": -26.087066650390625, "global_step": 314312, "epoch": 3786} {"train_loss": -26.17173194885254, "global_step": 314313, "epoch": 3786} {"train_loss": -25.53974723815918, "global_step": 314314, "epoch": 3786} {"train_loss": -25.73261833190918, "global_step": 314315, "epoch": 3786} {"train_loss": -25.8734073638916, "global_step": 314316, "epoch": 3786} {"train_loss": -25.199857711791992, "global_step": 314317, "epoch": 3786} {"train_loss": -25.39177703857422, "global_step": 314318, "epoch": 3786} {"train_loss": -25.189952850341797, "global_step": 314319, "epoch": 3786} {"train_loss": -25.49880698790033, "global_step": 314320, "epoch": 3786, "val_loss": 7286469.0} {"train_loss": -24.831212997436523, "global_step": 314321, "epoch": 3787} {"train_loss": -24.502731323242188, "global_step": 314322, "epoch": 3787} {"train_loss": -24.327909469604492, "global_step": 314323, "epoch": 3787} {"train_loss": -25.404443740844727, "global_step": 314324, "epoch": 3787} {"train_loss": -25.142284393310547, "global_step": 314325, "epoch": 3787} {"train_loss": -25.41964340209961, "global_step": 314326, "epoch": 3787} {"train_loss": -25.269384384155273, "global_step": 314327, "epoch": 3787} {"train_loss": -25.37727165222168, "global_step": 314328, "epoch": 3787} {"train_loss": -25.739953994750977, "global_step": 314329, "epoch": 3787} {"train_loss": -25.25640296936035, "global_step": 314330, "epoch": 3787} {"train_loss": -25.158376693725586, "global_step": 314331, "epoch": 3787} {"train_loss": -25.425992965698242, "global_step": 314332, "epoch": 3787} {"train_loss": -24.858312606811523, "global_step": 314333, "epoch": 3787} {"train_loss": -25.57489585876465, "global_step": 314334, "epoch": 3787} {"train_loss": -25.18843650817871, "global_step": 314335, "epoch": 3787} {"train_loss": -25.297388076782227, "global_step": 314336, "epoch": 3787} {"train_loss": -25.284311294555664, "global_step": 314337, "epoch": 3787} {"train_loss": -25.22201919555664, "global_step": 314338, "epoch": 3787} {"train_loss": -25.552614212036133, "global_step": 314339, "epoch": 3787} {"train_loss": -25.270532608032227, "global_step": 314340, "epoch": 3787} {"train_loss": -25.23432731628418, "global_step": 314341, "epoch": 3787} {"train_loss": -25.70914649963379, "global_step": 314342, "epoch": 3787} {"train_loss": -25.660293579101562, "global_step": 314343, "epoch": 3787} {"train_loss": -25.651813507080078, "global_step": 314344, "epoch": 3787} {"train_loss": -25.38711929321289, "global_step": 314345, "epoch": 3787} {"train_loss": -25.6268310546875, "global_step": 314346, "epoch": 3787} {"train_loss": -25.609054565429688, "global_step": 314347, "epoch": 3787} {"train_loss": -25.811126708984375, "global_step": 314348, "epoch": 3787} {"train_loss": -25.803335189819336, "global_step": 314349, "epoch": 3787} {"train_loss": -25.588672637939453, "global_step": 314350, "epoch": 3787} {"train_loss": -25.335439682006836, "global_step": 314351, "epoch": 3787} {"train_loss": -25.70285415649414, "global_step": 314352, "epoch": 3787} {"train_loss": -25.930490493774414, "global_step": 314353, "epoch": 3787} {"train_loss": -25.57541847229004, "global_step": 314354, "epoch": 3787} {"train_loss": -25.716028213500977, "global_step": 314355, "epoch": 3787} {"train_loss": -25.70905113220215, "global_step": 314356, "epoch": 3787} {"train_loss": -25.906097412109375, "global_step": 314357, "epoch": 3787} {"train_loss": -25.9028377532959, "global_step": 314358, "epoch": 3787} {"train_loss": -25.803760528564453, "global_step": 314359, "epoch": 3787} {"train_loss": -25.927474975585938, "global_step": 314360, "epoch": 3787} {"train_loss": -25.771408081054688, "global_step": 314361, "epoch": 3787} {"train_loss": -25.86872673034668, "global_step": 314362, "epoch": 3787} {"train_loss": -25.800323486328125, "global_step": 314363, "epoch": 3787} {"train_loss": -25.886213302612305, "global_step": 314364, "epoch": 3787} {"train_loss": -25.716588973999023, "global_step": 314365, "epoch": 3787} {"train_loss": -25.895877838134766, "global_step": 314366, "epoch": 3787} {"train_loss": -25.889312744140625, "global_step": 314367, "epoch": 3787} {"train_loss": -26.0859317779541, "global_step": 314368, "epoch": 3787} {"train_loss": -25.5042781829834, "global_step": 314369, "epoch": 3787} {"train_loss": -25.71514320373535, "global_step": 314370, "epoch": 3787} {"train_loss": -25.846912384033203, "global_step": 314371, "epoch": 3787} {"train_loss": -25.878385543823242, "global_step": 314372, "epoch": 3787} {"train_loss": -25.68769645690918, "global_step": 314373, "epoch": 3787} {"train_loss": -25.82563591003418, "global_step": 314374, "epoch": 3787} {"train_loss": -25.944766998291016, "global_step": 314375, "epoch": 3787} {"train_loss": -25.930334091186523, "global_step": 314376, "epoch": 3787} {"train_loss": -25.578847885131836, "global_step": 314377, "epoch": 3787} {"train_loss": -25.748815536499023, "global_step": 314378, "epoch": 3787} {"train_loss": -25.583513259887695, "global_step": 314379, "epoch": 3787} {"train_loss": -25.800983428955078, "global_step": 314380, "epoch": 3787} {"train_loss": -25.747278213500977, "global_step": 314381, "epoch": 3787} {"train_loss": -26.417804718017578, "global_step": 314382, "epoch": 3787} {"train_loss": -25.476057052612305, "global_step": 314383, "epoch": 3787} {"train_loss": -25.935321807861328, "global_step": 314384, "epoch": 3787} {"train_loss": -25.8067684173584, "global_step": 314385, "epoch": 3787} {"train_loss": -25.742048263549805, "global_step": 314386, "epoch": 3787} {"train_loss": -25.487247467041016, "global_step": 314387, "epoch": 3787} {"train_loss": -25.58355712890625, "global_step": 314388, "epoch": 3787} {"train_loss": -25.63465690612793, "global_step": 314389, "epoch": 3787} {"train_loss": -25.873062133789062, "global_step": 314390, "epoch": 3787} {"train_loss": -25.894977569580078, "global_step": 314391, "epoch": 3787} {"train_loss": -25.27315330505371, "global_step": 314392, "epoch": 3787} {"train_loss": -25.38497543334961, "global_step": 314393, "epoch": 3787} {"train_loss": -25.447460174560547, "global_step": 314394, "epoch": 3787} {"train_loss": -25.697065353393555, "global_step": 314395, "epoch": 3787} {"train_loss": -25.597097396850586, "global_step": 314396, "epoch": 3787} {"train_loss": -25.826765060424805, "global_step": 314397, "epoch": 3787} {"train_loss": -26.19807243347168, "global_step": 314398, "epoch": 3787} {"train_loss": -25.75640296936035, "global_step": 314399, "epoch": 3787} {"train_loss": -26.1425838470459, "global_step": 314400, "epoch": 3787} {"train_loss": -25.94794273376465, "global_step": 314401, "epoch": 3787} {"train_loss": -25.628942489624023, "global_step": 314402, "epoch": 3787} {"train_loss": -25.621949712914155, "global_step": 314403, "epoch": 3787, "val_loss": 7299916.0} {"train_loss": -25.35335350036621, "global_step": 314404, "epoch": 3788} {"train_loss": -25.349782943725586, "global_step": 314405, "epoch": 3788} {"train_loss": -25.614990234375, "global_step": 314406, "epoch": 3788} {"train_loss": -25.10902214050293, "global_step": 314407, "epoch": 3788} {"train_loss": -25.502851486206055, "global_step": 314408, "epoch": 3788} {"train_loss": -25.26618003845215, "global_step": 314409, "epoch": 3788} {"train_loss": -25.228979110717773, "global_step": 314410, "epoch": 3788} {"train_loss": -25.65011978149414, "global_step": 314411, "epoch": 3788} {"train_loss": -25.11414909362793, "global_step": 314412, "epoch": 3788} {"train_loss": -25.521448135375977, "global_step": 314413, "epoch": 3788} {"train_loss": -25.28486442565918, "global_step": 314414, "epoch": 3788} {"train_loss": -25.738998413085938, "global_step": 314415, "epoch": 3788} {"train_loss": -25.46294593811035, "global_step": 314416, "epoch": 3788} {"train_loss": -25.544631958007812, "global_step": 314417, "epoch": 3788} {"train_loss": -25.922931671142578, "global_step": 314418, "epoch": 3788} {"train_loss": -25.482738494873047, "global_step": 314419, "epoch": 3788} {"train_loss": -25.419649124145508, "global_step": 314420, "epoch": 3788} {"train_loss": -25.435367584228516, "global_step": 314421, "epoch": 3788} {"train_loss": -25.351810455322266, "global_step": 314422, "epoch": 3788} {"train_loss": -25.331769943237305, "global_step": 314423, "epoch": 3788} {"train_loss": -25.717626571655273, "global_step": 314424, "epoch": 3788} {"train_loss": -25.553138732910156, "global_step": 314425, "epoch": 3788} {"train_loss": -25.641889572143555, "global_step": 314426, "epoch": 3788} {"train_loss": -26.070755004882812, "global_step": 314427, "epoch": 3788} {"train_loss": -25.477338790893555, "global_step": 314428, "epoch": 3788} {"train_loss": -25.655179977416992, "global_step": 314429, "epoch": 3788} {"train_loss": -25.897491455078125, "global_step": 314430, "epoch": 3788} {"train_loss": -25.56747055053711, "global_step": 314431, "epoch": 3788} {"train_loss": -26.050031661987305, "global_step": 314432, "epoch": 3788} {"train_loss": -25.763158798217773, "global_step": 314433, "epoch": 3788} {"train_loss": -25.70315933227539, "global_step": 314434, "epoch": 3788} {"train_loss": -25.8950252532959, "global_step": 314435, "epoch": 3788} {"train_loss": -25.584928512573242, "global_step": 314436, "epoch": 3788} {"train_loss": -25.886030197143555, "global_step": 314437, "epoch": 3788} {"train_loss": -25.87982749938965, "global_step": 314438, "epoch": 3788} {"train_loss": -25.7713680267334, "global_step": 314439, "epoch": 3788} {"train_loss": -26.042875289916992, "global_step": 314440, "epoch": 3788} {"train_loss": -25.769189834594727, "global_step": 314441, "epoch": 3788} {"train_loss": -25.75495719909668, "global_step": 314442, "epoch": 3788} {"train_loss": -25.89155387878418, "global_step": 314443, "epoch": 3788} {"train_loss": -26.09003257751465, "global_step": 314444, "epoch": 3788} {"train_loss": -25.668045043945312, "global_step": 314445, "epoch": 3788} {"train_loss": -25.56083106994629, "global_step": 314446, "epoch": 3788} {"train_loss": -25.849889755249023, "global_step": 314447, "epoch": 3788} {"train_loss": -26.085983276367188, "global_step": 314448, "epoch": 3788} {"train_loss": -25.683963775634766, "global_step": 314449, "epoch": 3788} {"train_loss": -26.059045791625977, "global_step": 314450, "epoch": 3788} {"train_loss": -25.840784072875977, "global_step": 314451, "epoch": 3788} {"train_loss": -25.928815841674805, "global_step": 314452, "epoch": 3788} {"train_loss": -25.789026260375977, "global_step": 314453, "epoch": 3788} {"train_loss": -26.22761344909668, "global_step": 314454, "epoch": 3788} {"train_loss": -25.862939834594727, "global_step": 314455, "epoch": 3788} {"train_loss": -25.876737594604492, "global_step": 314456, "epoch": 3788} {"train_loss": -25.966032028198242, "global_step": 314457, "epoch": 3788} {"train_loss": -26.12277603149414, "global_step": 314458, "epoch": 3788} {"train_loss": -25.533132553100586, "global_step": 314459, "epoch": 3788} {"train_loss": -26.000207901000977, "global_step": 314460, "epoch": 3788} {"train_loss": -25.23262596130371, "global_step": 314461, "epoch": 3788} {"train_loss": -25.418060302734375, "global_step": 314462, "epoch": 3788} {"train_loss": -26.29559898376465, "global_step": 314463, "epoch": 3788} {"train_loss": -25.925748825073242, "global_step": 314464, "epoch": 3788} {"train_loss": -25.730276107788086, "global_step": 314465, "epoch": 3788} {"train_loss": -25.380264282226562, "global_step": 314466, "epoch": 3788} {"train_loss": -25.884078979492188, "global_step": 314467, "epoch": 3788} {"train_loss": -25.737546920776367, "global_step": 314468, "epoch": 3788} {"train_loss": -25.792407989501953, "global_step": 314469, "epoch": 3788} {"train_loss": -25.443405151367188, "global_step": 314470, "epoch": 3788} {"train_loss": -25.905858993530273, "global_step": 314471, "epoch": 3788} {"train_loss": -25.90409278869629, "global_step": 314472, "epoch": 3788} {"train_loss": -25.659082412719727, "global_step": 314473, "epoch": 3788} {"train_loss": -25.89288902282715, "global_step": 314474, "epoch": 3788} {"train_loss": -26.079681396484375, "global_step": 314475, "epoch": 3788} {"train_loss": -25.87911033630371, "global_step": 314476, "epoch": 3788} {"train_loss": -25.727643966674805, "global_step": 314477, "epoch": 3788} {"train_loss": -26.008686065673828, "global_step": 314478, "epoch": 3788} {"train_loss": -25.760168075561523, "global_step": 314479, "epoch": 3788} {"train_loss": -25.518800735473633, "global_step": 314480, "epoch": 3788} {"train_loss": -25.489713668823242, "global_step": 314481, "epoch": 3788} {"train_loss": -26.042814254760742, "global_step": 314482, "epoch": 3788} {"train_loss": -26.08466148376465, "global_step": 314483, "epoch": 3788} {"train_loss": -25.718143463134766, "global_step": 314484, "epoch": 3788} {"train_loss": -25.648160934448242, "global_step": 314485, "epoch": 3788} {"train_loss": -25.729621496545263, "global_step": 314486, "epoch": 3788, "val_loss": 7136103.0} {"train_loss": -25.653432846069336, "global_step": 314487, "epoch": 3789} {"train_loss": -25.356481552124023, "global_step": 314488, "epoch": 3789} {"train_loss": -25.269865036010742, "global_step": 314489, "epoch": 3789} {"train_loss": -25.472837448120117, "global_step": 314490, "epoch": 3789} {"train_loss": -25.527177810668945, "global_step": 314491, "epoch": 3789} {"train_loss": -25.106550216674805, "global_step": 314492, "epoch": 3789} {"train_loss": -25.627399444580078, "global_step": 314493, "epoch": 3789} {"train_loss": -25.681243896484375, "global_step": 314494, "epoch": 3789} {"train_loss": -25.411596298217773, "global_step": 314495, "epoch": 3789} {"train_loss": -25.478029251098633, "global_step": 314496, "epoch": 3789} {"train_loss": -25.856855392456055, "global_step": 314497, "epoch": 3789} {"train_loss": -25.771360397338867, "global_step": 314498, "epoch": 3789} {"train_loss": -25.71773338317871, "global_step": 314499, "epoch": 3789} {"train_loss": -25.651382446289062, "global_step": 314500, "epoch": 3789} {"train_loss": -25.492084503173828, "global_step": 314501, "epoch": 3789} {"train_loss": -25.529375076293945, "global_step": 314502, "epoch": 3789} {"train_loss": -25.433504104614258, "global_step": 314503, "epoch": 3789} {"train_loss": -25.3549861907959, "global_step": 314504, "epoch": 3789} {"train_loss": -25.639301300048828, "global_step": 314505, "epoch": 3789} {"train_loss": -25.2557373046875, "global_step": 314506, "epoch": 3789} {"train_loss": -25.451675415039062, "global_step": 314507, "epoch": 3789} {"train_loss": -25.662939071655273, "global_step": 314508, "epoch": 3789} {"train_loss": -25.770465850830078, "global_step": 314509, "epoch": 3789} {"train_loss": -25.56108283996582, "global_step": 314510, "epoch": 3789} {"train_loss": -25.8271427154541, "global_step": 314511, "epoch": 3789} {"train_loss": -25.757186889648438, "global_step": 314512, "epoch": 3789} {"train_loss": -26.154382705688477, "global_step": 314513, "epoch": 3789} {"train_loss": -25.526731491088867, "global_step": 314514, "epoch": 3789} {"train_loss": -25.569387435913086, "global_step": 314515, "epoch": 3789} {"train_loss": -25.85127830505371, "global_step": 314516, "epoch": 3789} {"train_loss": -25.6414737701416, "global_step": 314517, "epoch": 3789} {"train_loss": -25.85824966430664, "global_step": 314518, "epoch": 3789} {"train_loss": -25.638416290283203, "global_step": 314519, "epoch": 3789} {"train_loss": -26.00684928894043, "global_step": 314520, "epoch": 3789} {"train_loss": -25.896692276000977, "global_step": 314521, "epoch": 3789} {"train_loss": -25.88932228088379, "global_step": 314522, "epoch": 3789} {"train_loss": -25.579614639282227, "global_step": 314523, "epoch": 3789} {"train_loss": -26.03995132446289, "global_step": 314524, "epoch": 3789} {"train_loss": -25.9822998046875, "global_step": 314525, "epoch": 3789} {"train_loss": -25.849103927612305, "global_step": 314526, "epoch": 3789} {"train_loss": -25.798994064331055, "global_step": 314527, "epoch": 3789} {"train_loss": -25.691486358642578, "global_step": 314528, "epoch": 3789} {"train_loss": -25.95827293395996, "global_step": 314529, "epoch": 3789} {"train_loss": -26.039220809936523, "global_step": 314530, "epoch": 3789} {"train_loss": -25.97931480407715, "global_step": 314531, "epoch": 3789} {"train_loss": -25.66263198852539, "global_step": 314532, "epoch": 3789} {"train_loss": -25.835922241210938, "global_step": 314533, "epoch": 3789} {"train_loss": -25.6731014251709, "global_step": 314534, "epoch": 3789} {"train_loss": -25.649850845336914, "global_step": 314535, "epoch": 3789} {"train_loss": -25.666738510131836, "global_step": 314536, "epoch": 3789} {"train_loss": -25.673376083374023, "global_step": 314537, "epoch": 3789} {"train_loss": -25.854307174682617, "global_step": 314538, "epoch": 3789} {"train_loss": -25.699878692626953, "global_step": 314539, "epoch": 3789} {"train_loss": -25.888647079467773, "global_step": 314540, "epoch": 3789} {"train_loss": -25.798566818237305, "global_step": 314541, "epoch": 3789} {"train_loss": -25.60370445251465, "global_step": 314542, "epoch": 3789} {"train_loss": -25.48824691772461, "global_step": 314543, "epoch": 3789} {"train_loss": -25.592641830444336, "global_step": 314544, "epoch": 3789} {"train_loss": -25.805837631225586, "global_step": 314545, "epoch": 3789} {"train_loss": -25.575332641601562, "global_step": 314546, "epoch": 3789} {"train_loss": -25.978857040405273, "global_step": 314547, "epoch": 3789} {"train_loss": -25.35871696472168, "global_step": 314548, "epoch": 3789} {"train_loss": -25.60103416442871, "global_step": 314549, "epoch": 3789} {"train_loss": -25.723196029663086, "global_step": 314550, "epoch": 3789} {"train_loss": -25.62053871154785, "global_step": 314551, "epoch": 3789} {"train_loss": -25.5815372467041, "global_step": 314552, "epoch": 3789} {"train_loss": -25.996063232421875, "global_step": 314553, "epoch": 3789} {"train_loss": -25.696823120117188, "global_step": 314554, "epoch": 3789} {"train_loss": -25.950098037719727, "global_step": 314555, "epoch": 3789} {"train_loss": -25.545373916625977, "global_step": 314556, "epoch": 3789} {"train_loss": -26.17401695251465, "global_step": 314557, "epoch": 3789} {"train_loss": -25.79534912109375, "global_step": 314558, "epoch": 3789} {"train_loss": -25.512128829956055, "global_step": 314559, "epoch": 3789} {"train_loss": -25.448118209838867, "global_step": 314560, "epoch": 3789} {"train_loss": -25.801855087280273, "global_step": 314561, "epoch": 3789} {"train_loss": -25.7884521484375, "global_step": 314562, "epoch": 3789} {"train_loss": -25.565692901611328, "global_step": 314563, "epoch": 3789} {"train_loss": -26.0496883392334, "global_step": 314564, "epoch": 3789} {"train_loss": -26.11279296875, "global_step": 314565, "epoch": 3789} {"train_loss": -25.425861358642578, "global_step": 314566, "epoch": 3789} {"train_loss": -25.84486198425293, "global_step": 314567, "epoch": 3789} {"train_loss": -25.576587677001953, "global_step": 314568, "epoch": 3789} {"train_loss": -25.70332295061594, "global_step": 314569, "epoch": 3789, "val_loss": 7256427.0} {"train_loss": -25.924320220947266, "global_step": 314570, "epoch": 3790} {"train_loss": -25.37870216369629, "global_step": 314571, "epoch": 3790} {"train_loss": -25.71211814880371, "global_step": 314572, "epoch": 3790} {"train_loss": -25.925338745117188, "global_step": 314573, "epoch": 3790} {"train_loss": -25.358198165893555, "global_step": 314574, "epoch": 3790} {"train_loss": -25.414915084838867, "global_step": 314575, "epoch": 3790} {"train_loss": -25.791486740112305, "global_step": 314576, "epoch": 3790} {"train_loss": -25.690277099609375, "global_step": 314577, "epoch": 3790} {"train_loss": -25.581090927124023, "global_step": 314578, "epoch": 3790} {"train_loss": -25.542896270751953, "global_step": 314579, "epoch": 3790} {"train_loss": -25.764495849609375, "global_step": 314580, "epoch": 3790} {"train_loss": -25.950366973876953, "global_step": 314581, "epoch": 3790} {"train_loss": -25.79483413696289, "global_step": 314582, "epoch": 3790} {"train_loss": -26.10674476623535, "global_step": 314583, "epoch": 3790} {"train_loss": -25.86260414123535, "global_step": 314584, "epoch": 3790} {"train_loss": -25.488788604736328, "global_step": 314585, "epoch": 3790} {"train_loss": -25.843603134155273, "global_step": 314586, "epoch": 3790} {"train_loss": -26.034290313720703, "global_step": 314587, "epoch": 3790} {"train_loss": -25.8144474029541, "global_step": 314588, "epoch": 3790} {"train_loss": -25.9103946685791, "global_step": 314589, "epoch": 3790} {"train_loss": -25.825439453125, "global_step": 314590, "epoch": 3790} {"train_loss": -26.0571231842041, "global_step": 314591, "epoch": 3790} {"train_loss": -25.54249382019043, "global_step": 314592, "epoch": 3790} {"train_loss": -25.9172306060791, "global_step": 314593, "epoch": 3790} {"train_loss": -25.808561325073242, "global_step": 314594, "epoch": 3790} {"train_loss": -25.575071334838867, "global_step": 314595, "epoch": 3790} {"train_loss": -25.66086769104004, "global_step": 314596, "epoch": 3790} {"train_loss": -25.661911010742188, "global_step": 314597, "epoch": 3790} {"train_loss": -26.023969650268555, "global_step": 314598, "epoch": 3790} {"train_loss": -26.015167236328125, "global_step": 314599, "epoch": 3790} {"train_loss": -25.780359268188477, "global_step": 314600, "epoch": 3790} {"train_loss": -25.902856826782227, "global_step": 314601, "epoch": 3790} {"train_loss": -25.855085372924805, "global_step": 314602, "epoch": 3790} {"train_loss": -25.762731552124023, "global_step": 314603, "epoch": 3790} {"train_loss": -25.71906852722168, "global_step": 314604, "epoch": 3790} {"train_loss": -25.710424423217773, "global_step": 314605, "epoch": 3790} {"train_loss": -25.787307739257812, "global_step": 314606, "epoch": 3790} {"train_loss": -25.613101959228516, "global_step": 314607, "epoch": 3790} {"train_loss": -25.699615478515625, "global_step": 314608, "epoch": 3790} {"train_loss": -26.016910552978516, "global_step": 314609, "epoch": 3790} {"train_loss": -25.760046005249023, "global_step": 314610, "epoch": 3790} {"train_loss": -25.728836059570312, "global_step": 314611, "epoch": 3790} {"train_loss": -25.75689697265625, "global_step": 314612, "epoch": 3790} {"train_loss": -25.512670516967773, "global_step": 314613, "epoch": 3790} {"train_loss": -25.464035034179688, "global_step": 314614, "epoch": 3790} {"train_loss": -25.579797744750977, "global_step": 314615, "epoch": 3790} {"train_loss": -25.7947998046875, "global_step": 314616, "epoch": 3790} {"train_loss": -25.966299057006836, "global_step": 314617, "epoch": 3790} {"train_loss": -25.488420486450195, "global_step": 314618, "epoch": 3790} {"train_loss": -25.396499633789062, "global_step": 314619, "epoch": 3790} {"train_loss": -25.515323638916016, "global_step": 314620, "epoch": 3790} {"train_loss": -25.424314498901367, "global_step": 314621, "epoch": 3790} {"train_loss": -25.430622100830078, "global_step": 314622, "epoch": 3790} {"train_loss": -25.906614303588867, "global_step": 314623, "epoch": 3790} {"train_loss": -25.751514434814453, "global_step": 314624, "epoch": 3790} {"train_loss": -25.141115188598633, "global_step": 314625, "epoch": 3790} {"train_loss": -25.958271026611328, "global_step": 314626, "epoch": 3790} {"train_loss": -25.842914581298828, "global_step": 314627, "epoch": 3790} {"train_loss": -25.852935791015625, "global_step": 314628, "epoch": 3790} {"train_loss": -25.523212432861328, "global_step": 314629, "epoch": 3790} {"train_loss": -25.263168334960938, "global_step": 314630, "epoch": 3790} {"train_loss": -25.83990478515625, "global_step": 314631, "epoch": 3790} {"train_loss": -26.055822372436523, "global_step": 314632, "epoch": 3790} {"train_loss": -25.88239860534668, "global_step": 314633, "epoch": 3790} {"train_loss": -25.764978408813477, "global_step": 314634, "epoch": 3790} {"train_loss": -25.61067771911621, "global_step": 314635, "epoch": 3790} {"train_loss": -25.8526611328125, "global_step": 314636, "epoch": 3790} {"train_loss": -25.65215492248535, "global_step": 314637, "epoch": 3790} {"train_loss": -26.128576278686523, "global_step": 314638, "epoch": 3790} {"train_loss": -25.977310180664062, "global_step": 314639, "epoch": 3790} {"train_loss": -25.97083854675293, "global_step": 314640, "epoch": 3790} {"train_loss": -25.97015380859375, "global_step": 314641, "epoch": 3790} {"train_loss": -25.762914657592773, "global_step": 314642, "epoch": 3790} {"train_loss": -25.824710845947266, "global_step": 314643, "epoch": 3790} {"train_loss": -25.74238395690918, "global_step": 314644, "epoch": 3790} {"train_loss": -25.69550895690918, "global_step": 314645, "epoch": 3790} {"train_loss": -26.12430763244629, "global_step": 314646, "epoch": 3790} {"train_loss": -25.817041397094727, "global_step": 314647, "epoch": 3790} {"train_loss": -25.691043853759766, "global_step": 314648, "epoch": 3790} {"train_loss": -25.543935775756836, "global_step": 314649, "epoch": 3790} {"train_loss": -25.165380477905273, "global_step": 314650, "epoch": 3790} {"train_loss": -25.57564353942871, "global_step": 314651, "epoch": 3790} {"train_loss": -25.713109165789135, "global_step": 314652, "epoch": 3790, "val_loss": 7282723.0} {"train_loss": -23.347219467163086, "global_step": 314653, "epoch": 3791} {"train_loss": -23.88714027404785, "global_step": 314654, "epoch": 3791} {"train_loss": -24.918256759643555, "global_step": 314655, "epoch": 3791} {"train_loss": -24.200241088867188, "global_step": 314656, "epoch": 3791} {"train_loss": -25.02448844909668, "global_step": 314657, "epoch": 3791} {"train_loss": -25.070127487182617, "global_step": 314658, "epoch": 3791} {"train_loss": -25.220874786376953, "global_step": 314659, "epoch": 3791} {"train_loss": -25.167587280273438, "global_step": 314660, "epoch": 3791} {"train_loss": -24.879669189453125, "global_step": 314661, "epoch": 3791} {"train_loss": -25.362367630004883, "global_step": 314662, "epoch": 3791} {"train_loss": -25.249401092529297, "global_step": 314663, "epoch": 3791} {"train_loss": -25.23590850830078, "global_step": 314664, "epoch": 3791} {"train_loss": -25.02908706665039, "global_step": 314665, "epoch": 3791} {"train_loss": -25.134815216064453, "global_step": 314666, "epoch": 3791} {"train_loss": -25.096527099609375, "global_step": 314667, "epoch": 3791} {"train_loss": -25.226341247558594, "global_step": 314668, "epoch": 3791} {"train_loss": -25.093679428100586, "global_step": 314669, "epoch": 3791} {"train_loss": -25.8289737701416, "global_step": 314670, "epoch": 3791} {"train_loss": -25.18657875061035, "global_step": 314671, "epoch": 3791} {"train_loss": -25.237266540527344, "global_step": 314672, "epoch": 3791} {"train_loss": -25.660083770751953, "global_step": 314673, "epoch": 3791} {"train_loss": -25.248483657836914, "global_step": 314674, "epoch": 3791} {"train_loss": -25.433320999145508, "global_step": 314675, "epoch": 3791} {"train_loss": -25.126819610595703, "global_step": 314676, "epoch": 3791} {"train_loss": -25.426427841186523, "global_step": 314677, "epoch": 3791} {"train_loss": -25.452869415283203, "global_step": 314678, "epoch": 3791} {"train_loss": -25.325450897216797, "global_step": 314679, "epoch": 3791} {"train_loss": -25.480125427246094, "global_step": 314680, "epoch": 3791} {"train_loss": -25.412710189819336, "global_step": 314681, "epoch": 3791} {"train_loss": -25.76214027404785, "global_step": 314682, "epoch": 3791} {"train_loss": -25.287500381469727, "global_step": 314683, "epoch": 3791} {"train_loss": -25.378284454345703, "global_step": 314684, "epoch": 3791} {"train_loss": -25.762243270874023, "global_step": 314685, "epoch": 3791} {"train_loss": -25.603424072265625, "global_step": 314686, "epoch": 3791} {"train_loss": -25.81739616394043, "global_step": 314687, "epoch": 3791} {"train_loss": -25.520355224609375, "global_step": 314688, "epoch": 3791} {"train_loss": -25.853515625, "global_step": 314689, "epoch": 3791} {"train_loss": -25.71854591369629, "global_step": 314690, "epoch": 3791} {"train_loss": -25.662622451782227, "global_step": 314691, "epoch": 3791} {"train_loss": -25.85500144958496, "global_step": 314692, "epoch": 3791} {"train_loss": -25.7432861328125, "global_step": 314693, "epoch": 3791} {"train_loss": -26.032094955444336, "global_step": 314694, "epoch": 3791} {"train_loss": -25.908674240112305, "global_step": 314695, "epoch": 3791} {"train_loss": -25.50551986694336, "global_step": 314696, "epoch": 3791} {"train_loss": -25.539615631103516, "global_step": 314697, "epoch": 3791} {"train_loss": -25.65594482421875, "global_step": 314698, "epoch": 3791} {"train_loss": -25.547826766967773, "global_step": 314699, "epoch": 3791} {"train_loss": -25.97869873046875, "global_step": 314700, "epoch": 3791} {"train_loss": -25.79212760925293, "global_step": 314701, "epoch": 3791} {"train_loss": -26.06660270690918, "global_step": 314702, "epoch": 3791} {"train_loss": -26.005359649658203, "global_step": 314703, "epoch": 3791} {"train_loss": -25.89202880859375, "global_step": 314704, "epoch": 3791} {"train_loss": -25.85158348083496, "global_step": 314705, "epoch": 3791} {"train_loss": -26.0996036529541, "global_step": 314706, "epoch": 3791} {"train_loss": -26.095380783081055, "global_step": 314707, "epoch": 3791} {"train_loss": -25.995777130126953, "global_step": 314708, "epoch": 3791} {"train_loss": -26.139892578125, "global_step": 314709, "epoch": 3791} {"train_loss": -25.78626823425293, "global_step": 314710, "epoch": 3791} {"train_loss": -25.793701171875, "global_step": 314711, "epoch": 3791} {"train_loss": -26.195180892944336, "global_step": 314712, "epoch": 3791} {"train_loss": -25.851520538330078, "global_step": 314713, "epoch": 3791} {"train_loss": -25.614383697509766, "global_step": 314714, "epoch": 3791} {"train_loss": -25.825164794921875, "global_step": 314715, "epoch": 3791} {"train_loss": -26.319311141967773, "global_step": 314716, "epoch": 3791} {"train_loss": -25.82842445373535, "global_step": 314717, "epoch": 3791} {"train_loss": -26.00830078125, "global_step": 314718, "epoch": 3791} {"train_loss": -25.776611328125, "global_step": 314719, "epoch": 3791} {"train_loss": -25.829700469970703, "global_step": 314720, "epoch": 3791} {"train_loss": -25.732885360717773, "global_step": 314721, "epoch": 3791} {"train_loss": -25.741931915283203, "global_step": 314722, "epoch": 3791} {"train_loss": -25.819372177124023, "global_step": 314723, "epoch": 3791} {"train_loss": -26.06843376159668, "global_step": 314724, "epoch": 3791} {"train_loss": -25.90388298034668, "global_step": 314725, "epoch": 3791} {"train_loss": -25.874982833862305, "global_step": 314726, "epoch": 3791} {"train_loss": -25.80719566345215, "global_step": 314727, "epoch": 3791} {"train_loss": -25.880847930908203, "global_step": 314728, "epoch": 3791} {"train_loss": -26.149282455444336, "global_step": 314729, "epoch": 3791} {"train_loss": -25.920166015625, "global_step": 314730, "epoch": 3791} {"train_loss": -25.944700241088867, "global_step": 314731, "epoch": 3791} {"train_loss": -25.824018478393555, "global_step": 314732, "epoch": 3791} {"train_loss": -25.912824630737305, "global_step": 314733, "epoch": 3791} {"train_loss": -25.915084838867188, "global_step": 314734, "epoch": 3791} {"train_loss": -25.580125211233117, "global_step": 314735, "epoch": 3791, "val_loss": 7433335.5} {"train_loss": -25.268360137939453, "global_step": 314736, "epoch": 3792} {"train_loss": -24.925931930541992, "global_step": 314737, "epoch": 3792} {"train_loss": -25.3792667388916, "global_step": 314738, "epoch": 3792} {"train_loss": -25.168848037719727, "global_step": 314739, "epoch": 3792} {"train_loss": -25.721975326538086, "global_step": 314740, "epoch": 3792} {"train_loss": -25.29454231262207, "global_step": 314741, "epoch": 3792} {"train_loss": -25.636987686157227, "global_step": 314742, "epoch": 3792} {"train_loss": -25.456222534179688, "global_step": 314743, "epoch": 3792} {"train_loss": -25.37513542175293, "global_step": 314744, "epoch": 3792} {"train_loss": -25.414348602294922, "global_step": 314745, "epoch": 3792} {"train_loss": -25.1995792388916, "global_step": 314746, "epoch": 3792} {"train_loss": -25.579980850219727, "global_step": 314747, "epoch": 3792} {"train_loss": -25.584121704101562, "global_step": 314748, "epoch": 3792} {"train_loss": -25.04058265686035, "global_step": 314749, "epoch": 3792} {"train_loss": -25.67572593688965, "global_step": 314750, "epoch": 3792} {"train_loss": -26.14794921875, "global_step": 314751, "epoch": 3792} {"train_loss": -25.98138999938965, "global_step": 314752, "epoch": 3792} {"train_loss": -25.451274871826172, "global_step": 314753, "epoch": 3792} {"train_loss": -26.37884521484375, "global_step": 314754, "epoch": 3792} {"train_loss": -25.861820220947266, "global_step": 314755, "epoch": 3792} {"train_loss": -25.844953536987305, "global_step": 314756, "epoch": 3792} {"train_loss": -25.8301944732666, "global_step": 314757, "epoch": 3792} {"train_loss": -25.977771759033203, "global_step": 314758, "epoch": 3792} {"train_loss": -25.890884399414062, "global_step": 314759, "epoch": 3792} {"train_loss": -25.616369247436523, "global_step": 314760, "epoch": 3792} {"train_loss": -25.77621841430664, "global_step": 314761, "epoch": 3792} {"train_loss": -25.6897029876709, "global_step": 314762, "epoch": 3792} {"train_loss": -25.916278839111328, "global_step": 314763, "epoch": 3792} {"train_loss": -25.914785385131836, "global_step": 314764, "epoch": 3792} {"train_loss": -25.955591201782227, "global_step": 314765, "epoch": 3792} {"train_loss": -26.149667739868164, "global_step": 314766, "epoch": 3792} {"train_loss": -25.896869659423828, "global_step": 314767, "epoch": 3792} {"train_loss": -26.18250846862793, "global_step": 314768, "epoch": 3792} {"train_loss": -25.8038330078125, "global_step": 314769, "epoch": 3792} {"train_loss": -25.903797149658203, "global_step": 314770, "epoch": 3792} {"train_loss": -25.976123809814453, "global_step": 314771, "epoch": 3792} {"train_loss": -26.001157760620117, "global_step": 314772, "epoch": 3792} {"train_loss": -25.958301544189453, "global_step": 314773, "epoch": 3792} {"train_loss": -25.95582389831543, "global_step": 314774, "epoch": 3792} {"train_loss": -25.666040420532227, "global_step": 314775, "epoch": 3792} {"train_loss": -25.975080490112305, "global_step": 314776, "epoch": 3792} {"train_loss": -26.127044677734375, "global_step": 314777, "epoch": 3792} {"train_loss": -25.830829620361328, "global_step": 314778, "epoch": 3792} {"train_loss": -25.749841690063477, "global_step": 314779, "epoch": 3792} {"train_loss": -25.496591567993164, "global_step": 314780, "epoch": 3792} {"train_loss": -25.939443588256836, "global_step": 314781, "epoch": 3792} {"train_loss": -25.9266414642334, "global_step": 314782, "epoch": 3792} {"train_loss": -25.834842681884766, "global_step": 314783, "epoch": 3792} {"train_loss": -25.936689376831055, "global_step": 314784, "epoch": 3792} {"train_loss": -25.641386032104492, "global_step": 314785, "epoch": 3792} {"train_loss": -25.41436767578125, "global_step": 314786, "epoch": 3792} {"train_loss": -25.925037384033203, "global_step": 314787, "epoch": 3792} {"train_loss": -25.9423770904541, "global_step": 314788, "epoch": 3792} {"train_loss": -26.101806640625, "global_step": 314789, "epoch": 3792} {"train_loss": -25.71632957458496, "global_step": 314790, "epoch": 3792} {"train_loss": -25.767807006835938, "global_step": 314791, "epoch": 3792} {"train_loss": -25.589717864990234, "global_step": 314792, "epoch": 3792} {"train_loss": -25.84320068359375, "global_step": 314793, "epoch": 3792} {"train_loss": -26.096805572509766, "global_step": 314794, "epoch": 3792} {"train_loss": -25.700002670288086, "global_step": 314795, "epoch": 3792} {"train_loss": -25.214792251586914, "global_step": 314796, "epoch": 3792} {"train_loss": -25.15720558166504, "global_step": 314797, "epoch": 3792} {"train_loss": -25.640058517456055, "global_step": 314798, "epoch": 3792} {"train_loss": -25.752771377563477, "global_step": 314799, "epoch": 3792} {"train_loss": -25.619155883789062, "global_step": 314800, "epoch": 3792} {"train_loss": -25.208362579345703, "global_step": 314801, "epoch": 3792} {"train_loss": -24.708932876586914, "global_step": 314802, "epoch": 3792} {"train_loss": -25.55408477783203, "global_step": 314803, "epoch": 3792} {"train_loss": -25.6893310546875, "global_step": 314804, "epoch": 3792} {"train_loss": -25.238412857055664, "global_step": 314805, "epoch": 3792} {"train_loss": -25.029733657836914, "global_step": 314806, "epoch": 3792} {"train_loss": -25.849811553955078, "global_step": 314807, "epoch": 3792} {"train_loss": -25.360868453979492, "global_step": 314808, "epoch": 3792} {"train_loss": -25.11653709411621, "global_step": 314809, "epoch": 3792} {"train_loss": -25.638324737548828, "global_step": 314810, "epoch": 3792} {"train_loss": -25.519411087036133, "global_step": 314811, "epoch": 3792} {"train_loss": -25.5748348236084, "global_step": 314812, "epoch": 3792} {"train_loss": -25.37141227722168, "global_step": 314813, "epoch": 3792} {"train_loss": -25.756467819213867, "global_step": 314814, "epoch": 3792} {"train_loss": -25.595966339111328, "global_step": 314815, "epoch": 3792} {"train_loss": -25.49176597595215, "global_step": 314816, "epoch": 3792} {"train_loss": -25.499835968017578, "global_step": 314817, "epoch": 3792} {"train_loss": -25.663918690509107, "global_step": 314818, "epoch": 3792, "val_loss": 7251089.0} {"train_loss": -25.81085777282715, "global_step": 314819, "epoch": 3793} {"train_loss": -25.466842651367188, "global_step": 314820, "epoch": 3793} {"train_loss": -25.601388931274414, "global_step": 314821, "epoch": 3793} {"train_loss": -25.145753860473633, "global_step": 314822, "epoch": 3793} {"train_loss": -25.339998245239258, "global_step": 314823, "epoch": 3793} {"train_loss": -25.504499435424805, "global_step": 314824, "epoch": 3793} {"train_loss": -25.42478370666504, "global_step": 314825, "epoch": 3793} {"train_loss": -25.721792221069336, "global_step": 314826, "epoch": 3793} {"train_loss": -25.781341552734375, "global_step": 314827, "epoch": 3793} {"train_loss": -25.74566078186035, "global_step": 314828, "epoch": 3793} {"train_loss": -25.598793029785156, "global_step": 314829, "epoch": 3793} {"train_loss": -25.837326049804688, "global_step": 314830, "epoch": 3793} {"train_loss": -25.753889083862305, "global_step": 314831, "epoch": 3793} {"train_loss": -25.636335372924805, "global_step": 314832, "epoch": 3793} {"train_loss": -25.9801025390625, "global_step": 314833, "epoch": 3793} {"train_loss": -25.51920509338379, "global_step": 314834, "epoch": 3793} {"train_loss": -25.88623046875, "global_step": 314835, "epoch": 3793} {"train_loss": -25.482528686523438, "global_step": 314836, "epoch": 3793} {"train_loss": -25.48719596862793, "global_step": 314837, "epoch": 3793} {"train_loss": -25.645944595336914, "global_step": 314838, "epoch": 3793} {"train_loss": -25.689111709594727, "global_step": 314839, "epoch": 3793} {"train_loss": -25.402942657470703, "global_step": 314840, "epoch": 3793} {"train_loss": -25.840234756469727, "global_step": 314841, "epoch": 3793} {"train_loss": -25.894256591796875, "global_step": 314842, "epoch": 3793} {"train_loss": -25.7650146484375, "global_step": 314843, "epoch": 3793} {"train_loss": -25.844013214111328, "global_step": 314844, "epoch": 3793} {"train_loss": -25.78693199157715, "global_step": 314845, "epoch": 3793} {"train_loss": -25.697834014892578, "global_step": 314846, "epoch": 3793} {"train_loss": -25.9184513092041, "global_step": 314847, "epoch": 3793} {"train_loss": -25.82110595703125, "global_step": 314848, "epoch": 3793} {"train_loss": -25.968114852905273, "global_step": 314849, "epoch": 3793} {"train_loss": -25.91229248046875, "global_step": 314850, "epoch": 3793} {"train_loss": -26.0620174407959, "global_step": 314851, "epoch": 3793} {"train_loss": -25.850589752197266, "global_step": 314852, "epoch": 3793} {"train_loss": -26.00139808654785, "global_step": 314853, "epoch": 3793} {"train_loss": -25.77350425720215, "global_step": 314854, "epoch": 3793} {"train_loss": -25.78792381286621, "global_step": 314855, "epoch": 3793} {"train_loss": -25.74591064453125, "global_step": 314856, "epoch": 3793} {"train_loss": -25.94679069519043, "global_step": 314857, "epoch": 3793} {"train_loss": -25.61665916442871, "global_step": 314858, "epoch": 3793} {"train_loss": -25.8872127532959, "global_step": 314859, "epoch": 3793} {"train_loss": -25.8166446685791, "global_step": 314860, "epoch": 3793} {"train_loss": -26.12299919128418, "global_step": 314861, "epoch": 3793} {"train_loss": -25.818811416625977, "global_step": 314862, "epoch": 3793} {"train_loss": -25.8267879486084, "global_step": 314863, "epoch": 3793} {"train_loss": -26.33489990234375, "global_step": 314864, "epoch": 3793} {"train_loss": -25.773345947265625, "global_step": 314865, "epoch": 3793} {"train_loss": -25.61153221130371, "global_step": 314866, "epoch": 3793} {"train_loss": -25.944982528686523, "global_step": 314867, "epoch": 3793} {"train_loss": -25.837568283081055, "global_step": 314868, "epoch": 3793} {"train_loss": -26.11348533630371, "global_step": 314869, "epoch": 3793} {"train_loss": -25.606536865234375, "global_step": 314870, "epoch": 3793} {"train_loss": -26.04215431213379, "global_step": 314871, "epoch": 3793} {"train_loss": -25.401309967041016, "global_step": 314872, "epoch": 3793} {"train_loss": -25.564741134643555, "global_step": 314873, "epoch": 3793} {"train_loss": -25.182268142700195, "global_step": 314874, "epoch": 3793} {"train_loss": -25.852338790893555, "global_step": 314875, "epoch": 3793} {"train_loss": -25.46932601928711, "global_step": 314876, "epoch": 3793} {"train_loss": -26.205291748046875, "global_step": 314877, "epoch": 3793} {"train_loss": -25.68221092224121, "global_step": 314878, "epoch": 3793} {"train_loss": -25.401487350463867, "global_step": 314879, "epoch": 3793} {"train_loss": -25.8597469329834, "global_step": 314880, "epoch": 3793} {"train_loss": -25.448291778564453, "global_step": 314881, "epoch": 3793} {"train_loss": -25.4989070892334, "global_step": 314882, "epoch": 3793} {"train_loss": -25.544967651367188, "global_step": 314883, "epoch": 3793} {"train_loss": -25.730487823486328, "global_step": 314884, "epoch": 3793} {"train_loss": -25.496286392211914, "global_step": 314885, "epoch": 3793} {"train_loss": -25.148378372192383, "global_step": 314886, "epoch": 3793} {"train_loss": -25.916492462158203, "global_step": 314887, "epoch": 3793} {"train_loss": -25.492557525634766, "global_step": 314888, "epoch": 3793} {"train_loss": -25.717493057250977, "global_step": 314889, "epoch": 3793} {"train_loss": -25.227685928344727, "global_step": 314890, "epoch": 3793} {"train_loss": -25.74798011779785, "global_step": 314891, "epoch": 3793} {"train_loss": -25.749069213867188, "global_step": 314892, "epoch": 3793} {"train_loss": -25.68585777282715, "global_step": 314893, "epoch": 3793} {"train_loss": -25.832233428955078, "global_step": 314894, "epoch": 3793} {"train_loss": -25.826257705688477, "global_step": 314895, "epoch": 3793} {"train_loss": -26.09510612487793, "global_step": 314896, "epoch": 3793} {"train_loss": -25.835744857788086, "global_step": 314897, "epoch": 3793} {"train_loss": -26.233301162719727, "global_step": 314898, "epoch": 3793} {"train_loss": -26.280073165893555, "global_step": 314899, "epoch": 3793} {"train_loss": -26.30716323852539, "global_step": 314900, "epoch": 3793} {"train_loss": -25.743643358529333, "global_step": 314901, "epoch": 3793, "val_loss": 7328435.5} {"train_loss": -25.496505737304688, "global_step": 314902, "epoch": 3794} {"train_loss": -25.415699005126953, "global_step": 314903, "epoch": 3794} {"train_loss": -25.513822555541992, "global_step": 314904, "epoch": 3794} {"train_loss": -25.516769409179688, "global_step": 314905, "epoch": 3794} {"train_loss": -25.361690521240234, "global_step": 314906, "epoch": 3794} {"train_loss": -25.199316024780273, "global_step": 314907, "epoch": 3794} {"train_loss": -25.595319747924805, "global_step": 314908, "epoch": 3794} {"train_loss": -25.349822998046875, "global_step": 314909, "epoch": 3794} {"train_loss": -25.17717933654785, "global_step": 314910, "epoch": 3794} {"train_loss": -25.588594436645508, "global_step": 314911, "epoch": 3794} {"train_loss": -25.387895584106445, "global_step": 314912, "epoch": 3794} {"train_loss": -25.45882225036621, "global_step": 314913, "epoch": 3794} {"train_loss": -25.789478302001953, "global_step": 314914, "epoch": 3794} {"train_loss": -25.88165283203125, "global_step": 314915, "epoch": 3794} {"train_loss": -25.36273765563965, "global_step": 314916, "epoch": 3794} {"train_loss": -25.45745277404785, "global_step": 314917, "epoch": 3794} {"train_loss": -25.88162612915039, "global_step": 314918, "epoch": 3794} {"train_loss": -25.45853614807129, "global_step": 314919, "epoch": 3794} {"train_loss": -25.954208374023438, "global_step": 314920, "epoch": 3794} {"train_loss": -25.64987564086914, "global_step": 314921, "epoch": 3794} {"train_loss": -25.44127655029297, "global_step": 314922, "epoch": 3794} {"train_loss": -25.7258358001709, "global_step": 314923, "epoch": 3794} {"train_loss": -25.898305892944336, "global_step": 314924, "epoch": 3794} {"train_loss": -25.434579849243164, "global_step": 314925, "epoch": 3794} {"train_loss": -25.659399032592773, "global_step": 314926, "epoch": 3794} {"train_loss": -25.729175567626953, "global_step": 314927, "epoch": 3794} {"train_loss": -25.494308471679688, "global_step": 314928, "epoch": 3794} {"train_loss": -25.65793228149414, "global_step": 314929, "epoch": 3794} {"train_loss": -25.677169799804688, "global_step": 314930, "epoch": 3794} {"train_loss": -25.547794342041016, "global_step": 314931, "epoch": 3794} {"train_loss": -25.730859756469727, "global_step": 314932, "epoch": 3794} {"train_loss": -25.607776641845703, "global_step": 314933, "epoch": 3794} {"train_loss": -26.081350326538086, "global_step": 314934, "epoch": 3794} {"train_loss": -25.832752227783203, "global_step": 314935, "epoch": 3794} {"train_loss": -25.538726806640625, "global_step": 314936, "epoch": 3794} {"train_loss": -25.978906631469727, "global_step": 314937, "epoch": 3794} {"train_loss": -25.859027862548828, "global_step": 314938, "epoch": 3794} {"train_loss": -25.947797775268555, "global_step": 314939, "epoch": 3794} {"train_loss": -25.883691787719727, "global_step": 314940, "epoch": 3794} {"train_loss": -26.122655868530273, "global_step": 314941, "epoch": 3794} {"train_loss": -25.728708267211914, "global_step": 314942, "epoch": 3794} {"train_loss": -26.1180362701416, "global_step": 314943, "epoch": 3794} {"train_loss": -26.120086669921875, "global_step": 314944, "epoch": 3794} {"train_loss": -25.518875122070312, "global_step": 314945, "epoch": 3794} {"train_loss": -26.114362716674805, "global_step": 314946, "epoch": 3794} {"train_loss": -26.086606979370117, "global_step": 314947, "epoch": 3794} {"train_loss": -25.891162872314453, "global_step": 314948, "epoch": 3794} {"train_loss": -26.094785690307617, "global_step": 314949, "epoch": 3794} {"train_loss": -25.95037841796875, "global_step": 314950, "epoch": 3794} {"train_loss": -25.867630004882812, "global_step": 314951, "epoch": 3794} {"train_loss": -26.074731826782227, "global_step": 314952, "epoch": 3794} {"train_loss": -25.75469970703125, "global_step": 314953, "epoch": 3794} {"train_loss": -25.80010986328125, "global_step": 314954, "epoch": 3794} {"train_loss": -26.120380401611328, "global_step": 314955, "epoch": 3794} {"train_loss": -26.117706298828125, "global_step": 314956, "epoch": 3794} {"train_loss": -25.885242462158203, "global_step": 314957, "epoch": 3794} {"train_loss": -25.975004196166992, "global_step": 314958, "epoch": 3794} {"train_loss": -25.560155868530273, "global_step": 314959, "epoch": 3794} {"train_loss": -26.08057975769043, "global_step": 314960, "epoch": 3794} {"train_loss": -25.932144165039062, "global_step": 314961, "epoch": 3794} {"train_loss": -25.83967399597168, "global_step": 314962, "epoch": 3794} {"train_loss": -25.558706283569336, "global_step": 314963, "epoch": 3794} {"train_loss": -25.752765655517578, "global_step": 314964, "epoch": 3794} {"train_loss": -26.072601318359375, "global_step": 314965, "epoch": 3794} {"train_loss": -25.988235473632812, "global_step": 314966, "epoch": 3794} {"train_loss": -25.88405418395996, "global_step": 314967, "epoch": 3794} {"train_loss": -26.098840713500977, "global_step": 314968, "epoch": 3794} {"train_loss": -25.86566162109375, "global_step": 314969, "epoch": 3794} {"train_loss": -26.06702995300293, "global_step": 314970, "epoch": 3794} {"train_loss": -25.867950439453125, "global_step": 314971, "epoch": 3794} {"train_loss": -25.690185546875, "global_step": 314972, "epoch": 3794} {"train_loss": -25.82037925720215, "global_step": 314973, "epoch": 3794} {"train_loss": -25.50018310546875, "global_step": 314974, "epoch": 3794} {"train_loss": -25.575214385986328, "global_step": 314975, "epoch": 3794} {"train_loss": -25.937849044799805, "global_step": 314976, "epoch": 3794} {"train_loss": -25.705005645751953, "global_step": 314977, "epoch": 3794} {"train_loss": -25.464879989624023, "global_step": 314978, "epoch": 3794} {"train_loss": -25.570585250854492, "global_step": 314979, "epoch": 3794} {"train_loss": -26.18464469909668, "global_step": 314980, "epoch": 3794} {"train_loss": -26.041671752929688, "global_step": 314981, "epoch": 3794} {"train_loss": -25.877553939819336, "global_step": 314982, "epoch": 3794} {"train_loss": -25.9713077545166, "global_step": 314983, "epoch": 3794} {"train_loss": -25.768119628170886, "global_step": 314984, "epoch": 3794, "val_loss": 7341221.0} {"train_loss": -25.64261245727539, "global_step": 314985, "epoch": 3795} {"train_loss": -25.4257869720459, "global_step": 314986, "epoch": 3795} {"train_loss": -24.926603317260742, "global_step": 314987, "epoch": 3795} {"train_loss": -25.132360458374023, "global_step": 314988, "epoch": 3795} {"train_loss": -25.015531539916992, "global_step": 314989, "epoch": 3795} {"train_loss": -25.22004508972168, "global_step": 314990, "epoch": 3795} {"train_loss": -25.923673629760742, "global_step": 314991, "epoch": 3795} {"train_loss": -24.66861915588379, "global_step": 314992, "epoch": 3795} {"train_loss": -25.465621948242188, "global_step": 314993, "epoch": 3795} {"train_loss": -25.203784942626953, "global_step": 314994, "epoch": 3795} {"train_loss": -25.851398468017578, "global_step": 314995, "epoch": 3795} {"train_loss": -25.58009147644043, "global_step": 314996, "epoch": 3795} {"train_loss": -25.489948272705078, "global_step": 314997, "epoch": 3795} {"train_loss": -25.440204620361328, "global_step": 314998, "epoch": 3795} {"train_loss": -25.78724479675293, "global_step": 314999, "epoch": 3795} {"train_loss": -25.972482681274414, "global_step": 315000, "epoch": 3795} {"train_loss": -25.48139762878418, "global_step": 315001, "epoch": 3795} {"train_loss": -25.389341354370117, "global_step": 315002, "epoch": 3795} {"train_loss": -25.926111221313477, "global_step": 315003, "epoch": 3795} {"train_loss": -25.621076583862305, "global_step": 315004, "epoch": 3795} {"train_loss": -25.92384147644043, "global_step": 315005, "epoch": 3795} {"train_loss": -25.428457260131836, "global_step": 315006, "epoch": 3795} {"train_loss": -25.6982364654541, "global_step": 315007, "epoch": 3795} {"train_loss": -25.878259658813477, "global_step": 315008, "epoch": 3795} {"train_loss": -25.702878952026367, "global_step": 315009, "epoch": 3795} {"train_loss": -25.752246856689453, "global_step": 315010, "epoch": 3795} {"train_loss": -25.688650131225586, "global_step": 315011, "epoch": 3795} {"train_loss": -26.067707061767578, "global_step": 315012, "epoch": 3795} {"train_loss": -25.6851863861084, "global_step": 315013, "epoch": 3795} {"train_loss": -25.70553970336914, "global_step": 315014, "epoch": 3795} {"train_loss": -25.74232292175293, "global_step": 315015, "epoch": 3795} {"train_loss": -25.911840438842773, "global_step": 315016, "epoch": 3795} {"train_loss": -25.87057876586914, "global_step": 315017, "epoch": 3795} {"train_loss": -25.778873443603516, "global_step": 315018, "epoch": 3795} {"train_loss": -25.95170021057129, "global_step": 315019, "epoch": 3795} {"train_loss": -25.641555786132812, "global_step": 315020, "epoch": 3795} {"train_loss": -25.5506649017334, "global_step": 315021, "epoch": 3795} {"train_loss": -25.863372802734375, "global_step": 315022, "epoch": 3795} {"train_loss": -25.833093643188477, "global_step": 315023, "epoch": 3795} {"train_loss": -25.941425323486328, "global_step": 315024, "epoch": 3795} {"train_loss": -26.0546875, "global_step": 315025, "epoch": 3795} {"train_loss": -25.60870361328125, "global_step": 315026, "epoch": 3795} {"train_loss": -25.81072425842285, "global_step": 315027, "epoch": 3795} {"train_loss": -25.983478546142578, "global_step": 315028, "epoch": 3795} {"train_loss": -26.112045288085938, "global_step": 315029, "epoch": 3795} {"train_loss": -26.00638198852539, "global_step": 315030, "epoch": 3795} {"train_loss": -25.921478271484375, "global_step": 315031, "epoch": 3795} {"train_loss": -26.09229850769043, "global_step": 315032, "epoch": 3795} {"train_loss": -25.996204376220703, "global_step": 315033, "epoch": 3795} {"train_loss": -25.8375244140625, "global_step": 315034, "epoch": 3795} {"train_loss": -25.76824951171875, "global_step": 315035, "epoch": 3795} {"train_loss": -25.894550323486328, "global_step": 315036, "epoch": 3795} {"train_loss": -26.15205192565918, "global_step": 315037, "epoch": 3795} {"train_loss": -26.3177433013916, "global_step": 315038, "epoch": 3795} {"train_loss": -25.85141372680664, "global_step": 315039, "epoch": 3795} {"train_loss": -25.805103302001953, "global_step": 315040, "epoch": 3795} {"train_loss": -26.369510650634766, "global_step": 315041, "epoch": 3795} {"train_loss": -25.632404327392578, "global_step": 315042, "epoch": 3795} {"train_loss": -25.728546142578125, "global_step": 315043, "epoch": 3795} {"train_loss": -25.952808380126953, "global_step": 315044, "epoch": 3795} {"train_loss": -25.827407836914062, "global_step": 315045, "epoch": 3795} {"train_loss": -26.050947189331055, "global_step": 315046, "epoch": 3795} {"train_loss": -25.93244743347168, "global_step": 315047, "epoch": 3795} {"train_loss": -26.067005157470703, "global_step": 315048, "epoch": 3795} {"train_loss": -25.492456436157227, "global_step": 315049, "epoch": 3795} {"train_loss": -25.39778709411621, "global_step": 315050, "epoch": 3795} {"train_loss": -25.129098892211914, "global_step": 315051, "epoch": 3795} {"train_loss": -25.395307540893555, "global_step": 315052, "epoch": 3795} {"train_loss": -25.6171817779541, "global_step": 315053, "epoch": 3795} {"train_loss": -25.382125854492188, "global_step": 315054, "epoch": 3795} {"train_loss": -25.410871505737305, "global_step": 315055, "epoch": 3795} {"train_loss": -25.976520538330078, "global_step": 315056, "epoch": 3795} {"train_loss": -25.586578369140625, "global_step": 315057, "epoch": 3795} {"train_loss": -25.917627334594727, "global_step": 315058, "epoch": 3795} {"train_loss": -25.953540802001953, "global_step": 315059, "epoch": 3795} {"train_loss": -25.532880783081055, "global_step": 315060, "epoch": 3795} {"train_loss": -25.785907745361328, "global_step": 315061, "epoch": 3795} {"train_loss": -25.969013214111328, "global_step": 315062, "epoch": 3795} {"train_loss": -25.448814392089844, "global_step": 315063, "epoch": 3795} {"train_loss": -26.148054122924805, "global_step": 315064, "epoch": 3795} {"train_loss": -25.776290893554688, "global_step": 315065, "epoch": 3795} {"train_loss": -25.914356231689453, "global_step": 315066, "epoch": 3795} {"train_loss": -25.72451400756836, "global_step": 315067, "epoch": 3795, "val_loss": 7344425.0} {"train_loss": -25.257953643798828, "global_step": 315068, "epoch": 3796} {"train_loss": -25.269052505493164, "global_step": 315069, "epoch": 3796} {"train_loss": -25.7703857421875, "global_step": 315070, "epoch": 3796} {"train_loss": -25.43760871887207, "global_step": 315071, "epoch": 3796} {"train_loss": -25.400821685791016, "global_step": 315072, "epoch": 3796} {"train_loss": -24.96036148071289, "global_step": 315073, "epoch": 3796} {"train_loss": -25.27583885192871, "global_step": 315074, "epoch": 3796} {"train_loss": -25.434709548950195, "global_step": 315075, "epoch": 3796} {"train_loss": -25.725065231323242, "global_step": 315076, "epoch": 3796} {"train_loss": -25.579002380371094, "global_step": 315077, "epoch": 3796} {"train_loss": -25.590560913085938, "global_step": 315078, "epoch": 3796} {"train_loss": -25.351652145385742, "global_step": 315079, "epoch": 3796} {"train_loss": -25.08802604675293, "global_step": 315080, "epoch": 3796} {"train_loss": -25.594085693359375, "global_step": 315081, "epoch": 3796} {"train_loss": -25.23193359375, "global_step": 315082, "epoch": 3796} {"train_loss": -25.538393020629883, "global_step": 315083, "epoch": 3796} {"train_loss": -25.572607040405273, "global_step": 315084, "epoch": 3796} {"train_loss": -25.4600772857666, "global_step": 315085, "epoch": 3796} {"train_loss": -25.225017547607422, "global_step": 315086, "epoch": 3796} {"train_loss": -25.71857261657715, "global_step": 315087, "epoch": 3796} {"train_loss": -25.661788940429688, "global_step": 315088, "epoch": 3796} {"train_loss": -25.84149742126465, "global_step": 315089, "epoch": 3796} {"train_loss": -25.31007194519043, "global_step": 315090, "epoch": 3796} {"train_loss": -26.113983154296875, "global_step": 315091, "epoch": 3796} {"train_loss": -25.39479637145996, "global_step": 315092, "epoch": 3796} {"train_loss": -25.814411163330078, "global_step": 315093, "epoch": 3796} {"train_loss": -26.0405216217041, "global_step": 315094, "epoch": 3796} {"train_loss": -26.144479751586914, "global_step": 315095, "epoch": 3796} {"train_loss": -25.374221801757812, "global_step": 315096, "epoch": 3796} {"train_loss": -25.969648361206055, "global_step": 315097, "epoch": 3796} {"train_loss": -25.46640396118164, "global_step": 315098, "epoch": 3796} {"train_loss": -25.882604598999023, "global_step": 315099, "epoch": 3796} {"train_loss": -26.21476173400879, "global_step": 315100, "epoch": 3796} {"train_loss": -25.56862449645996, "global_step": 315101, "epoch": 3796} {"train_loss": -25.924657821655273, "global_step": 315102, "epoch": 3796} {"train_loss": -26.08786964416504, "global_step": 315103, "epoch": 3796} {"train_loss": -25.771560668945312, "global_step": 315104, "epoch": 3796} {"train_loss": -25.721343994140625, "global_step": 315105, "epoch": 3796} {"train_loss": -25.8227596282959, "global_step": 315106, "epoch": 3796} {"train_loss": -26.123510360717773, "global_step": 315107, "epoch": 3796} {"train_loss": -25.947433471679688, "global_step": 315108, "epoch": 3796} {"train_loss": -25.913925170898438, "global_step": 315109, "epoch": 3796} {"train_loss": -26.043188095092773, "global_step": 315110, "epoch": 3796} {"train_loss": -26.20853042602539, "global_step": 315111, "epoch": 3796} {"train_loss": -25.718801498413086, "global_step": 315112, "epoch": 3796} {"train_loss": -25.8066463470459, "global_step": 315113, "epoch": 3796} {"train_loss": -25.736846923828125, "global_step": 315114, "epoch": 3796} {"train_loss": -25.897802352905273, "global_step": 315115, "epoch": 3796} {"train_loss": -26.194196701049805, "global_step": 315116, "epoch": 3796} {"train_loss": -25.374061584472656, "global_step": 315117, "epoch": 3796} {"train_loss": -26.050128936767578, "global_step": 315118, "epoch": 3796} {"train_loss": -25.719074249267578, "global_step": 315119, "epoch": 3796} {"train_loss": -25.85316276550293, "global_step": 315120, "epoch": 3796} {"train_loss": -25.6839542388916, "global_step": 315121, "epoch": 3796} {"train_loss": -25.747873306274414, "global_step": 315122, "epoch": 3796} {"train_loss": -25.908740997314453, "global_step": 315123, "epoch": 3796} {"train_loss": -25.800464630126953, "global_step": 315124, "epoch": 3796} {"train_loss": -25.71554946899414, "global_step": 315125, "epoch": 3796} {"train_loss": -26.044132232666016, "global_step": 315126, "epoch": 3796} {"train_loss": -25.782312393188477, "global_step": 315127, "epoch": 3796} {"train_loss": -25.677173614501953, "global_step": 315128, "epoch": 3796} {"train_loss": -25.615238189697266, "global_step": 315129, "epoch": 3796} {"train_loss": -25.752500534057617, "global_step": 315130, "epoch": 3796} {"train_loss": -25.529582977294922, "global_step": 315131, "epoch": 3796} {"train_loss": -25.885635375976562, "global_step": 315132, "epoch": 3796} {"train_loss": -25.827268600463867, "global_step": 315133, "epoch": 3796} {"train_loss": -25.7476806640625, "global_step": 315134, "epoch": 3796} {"train_loss": -26.1868896484375, "global_step": 315135, "epoch": 3796} {"train_loss": -25.628009796142578, "global_step": 315136, "epoch": 3796} {"train_loss": -26.04725456237793, "global_step": 315137, "epoch": 3796} {"train_loss": -25.8922119140625, "global_step": 315138, "epoch": 3796} {"train_loss": -25.338001251220703, "global_step": 315139, "epoch": 3796} {"train_loss": -25.316991806030273, "global_step": 315140, "epoch": 3796} {"train_loss": -25.775634765625, "global_step": 315141, "epoch": 3796} {"train_loss": -26.014484405517578, "global_step": 315142, "epoch": 3796} {"train_loss": -26.098575592041016, "global_step": 315143, "epoch": 3796} {"train_loss": -25.821130752563477, "global_step": 315144, "epoch": 3796} {"train_loss": -25.654882431030273, "global_step": 315145, "epoch": 3796} {"train_loss": -25.886823654174805, "global_step": 315146, "epoch": 3796} {"train_loss": -25.85291862487793, "global_step": 315147, "epoch": 3796} {"train_loss": -25.7043399810791, "global_step": 315148, "epoch": 3796} {"train_loss": -25.504703521728516, "global_step": 315149, "epoch": 3796} {"train_loss": -25.71237832954131, "global_step": 315150, "epoch": 3796, "val_loss": 7248801.0} {"train_loss": -25.423948287963867, "global_step": 315151, "epoch": 3797} {"train_loss": -25.65155601501465, "global_step": 315152, "epoch": 3797} {"train_loss": -25.54518699645996, "global_step": 315153, "epoch": 3797} {"train_loss": -25.592880249023438, "global_step": 315154, "epoch": 3797} {"train_loss": -25.38330078125, "global_step": 315155, "epoch": 3797} {"train_loss": -25.79932975769043, "global_step": 315156, "epoch": 3797} {"train_loss": -26.020435333251953, "global_step": 315157, "epoch": 3797} {"train_loss": -25.618627548217773, "global_step": 315158, "epoch": 3797} {"train_loss": -25.744827270507812, "global_step": 315159, "epoch": 3797} {"train_loss": -25.861913681030273, "global_step": 315160, "epoch": 3797} {"train_loss": -25.53364372253418, "global_step": 315161, "epoch": 3797} {"train_loss": -25.13405418395996, "global_step": 315162, "epoch": 3797} {"train_loss": -25.437673568725586, "global_step": 315163, "epoch": 3797} {"train_loss": -25.33876609802246, "global_step": 315164, "epoch": 3797} {"train_loss": -25.97671890258789, "global_step": 315165, "epoch": 3797} {"train_loss": -25.6224365234375, "global_step": 315166, "epoch": 3797} {"train_loss": -25.805648803710938, "global_step": 315167, "epoch": 3797} {"train_loss": -25.71735191345215, "global_step": 315168, "epoch": 3797} {"train_loss": -25.779062271118164, "global_step": 315169, "epoch": 3797} {"train_loss": -25.751087188720703, "global_step": 315170, "epoch": 3797} {"train_loss": -25.592554092407227, "global_step": 315171, "epoch": 3797} {"train_loss": -25.903106689453125, "global_step": 315172, "epoch": 3797} {"train_loss": -26.16620445251465, "global_step": 315173, "epoch": 3797} {"train_loss": -25.806028366088867, "global_step": 315174, "epoch": 3797} {"train_loss": -25.941104888916016, "global_step": 315175, "epoch": 3797} {"train_loss": -26.127044677734375, "global_step": 315176, "epoch": 3797} {"train_loss": -25.694116592407227, "global_step": 315177, "epoch": 3797} {"train_loss": -25.852313995361328, "global_step": 315178, "epoch": 3797} {"train_loss": -26.392499923706055, "global_step": 315179, "epoch": 3797} {"train_loss": -25.933889389038086, "global_step": 315180, "epoch": 3797} {"train_loss": -25.583892822265625, "global_step": 315181, "epoch": 3797} {"train_loss": -25.810041427612305, "global_step": 315182, "epoch": 3797} {"train_loss": -25.704126358032227, "global_step": 315183, "epoch": 3797} {"train_loss": -25.8233699798584, "global_step": 315184, "epoch": 3797} {"train_loss": -25.922657012939453, "global_step": 315185, "epoch": 3797} {"train_loss": -25.765430450439453, "global_step": 315186, "epoch": 3797} {"train_loss": -25.869434356689453, "global_step": 315187, "epoch": 3797} {"train_loss": -26.15106773376465, "global_step": 315188, "epoch": 3797} {"train_loss": -26.077381134033203, "global_step": 315189, "epoch": 3797} {"train_loss": -25.96241569519043, "global_step": 315190, "epoch": 3797} {"train_loss": -25.700658798217773, "global_step": 315191, "epoch": 3797} {"train_loss": -26.07814598083496, "global_step": 315192, "epoch": 3797} {"train_loss": -25.631128311157227, "global_step": 315193, "epoch": 3797} {"train_loss": -25.953399658203125, "global_step": 315194, "epoch": 3797} {"train_loss": -25.94050407409668, "global_step": 315195, "epoch": 3797} {"train_loss": -25.758779525756836, "global_step": 315196, "epoch": 3797} {"train_loss": -25.481449127197266, "global_step": 315197, "epoch": 3797} {"train_loss": -26.27430534362793, "global_step": 315198, "epoch": 3797} {"train_loss": -26.192731857299805, "global_step": 315199, "epoch": 3797} {"train_loss": -25.947223663330078, "global_step": 315200, "epoch": 3797} {"train_loss": -25.63539695739746, "global_step": 315201, "epoch": 3797} {"train_loss": -25.94890785217285, "global_step": 315202, "epoch": 3797} {"train_loss": -26.09730339050293, "global_step": 315203, "epoch": 3797} {"train_loss": -25.68715476989746, "global_step": 315204, "epoch": 3797} {"train_loss": -25.502939224243164, "global_step": 315205, "epoch": 3797} {"train_loss": -25.903244018554688, "global_step": 315206, "epoch": 3797} {"train_loss": -26.21565055847168, "global_step": 315207, "epoch": 3797} {"train_loss": -25.63652992248535, "global_step": 315208, "epoch": 3797} {"train_loss": -25.534564971923828, "global_step": 315209, "epoch": 3797} {"train_loss": -25.500585556030273, "global_step": 315210, "epoch": 3797} {"train_loss": -25.66278648376465, "global_step": 315211, "epoch": 3797} {"train_loss": -25.44351577758789, "global_step": 315212, "epoch": 3797} {"train_loss": -25.717321395874023, "global_step": 315213, "epoch": 3797} {"train_loss": -25.512531280517578, "global_step": 315214, "epoch": 3797} {"train_loss": -25.30633544921875, "global_step": 315215, "epoch": 3797} {"train_loss": -24.61101722717285, "global_step": 315216, "epoch": 3797} {"train_loss": -25.712411880493164, "global_step": 315217, "epoch": 3797} {"train_loss": -25.540119171142578, "global_step": 315218, "epoch": 3797} {"train_loss": -25.846006393432617, "global_step": 315219, "epoch": 3797} {"train_loss": -25.361154556274414, "global_step": 315220, "epoch": 3797} {"train_loss": -25.269861221313477, "global_step": 315221, "epoch": 3797} {"train_loss": -25.646514892578125, "global_step": 315222, "epoch": 3797} {"train_loss": -25.839874267578125, "global_step": 315223, "epoch": 3797} {"train_loss": -25.888418197631836, "global_step": 315224, "epoch": 3797} {"train_loss": -26.0511417388916, "global_step": 315225, "epoch": 3797} {"train_loss": -25.73138999938965, "global_step": 315226, "epoch": 3797} {"train_loss": -25.730539321899414, "global_step": 315227, "epoch": 3797} {"train_loss": -25.69081687927246, "global_step": 315228, "epoch": 3797} {"train_loss": -25.804269790649414, "global_step": 315229, "epoch": 3797} {"train_loss": -25.695682525634766, "global_step": 315230, "epoch": 3797} {"train_loss": -25.934263229370117, "global_step": 315231, "epoch": 3797} {"train_loss": -25.6591739654541, "global_step": 315232, "epoch": 3797} {"train_loss": -25.75968606787992, "global_step": 315233, "epoch": 3797, "val_loss": 7335462.0} {"train_loss": -25.388376235961914, "global_step": 315234, "epoch": 3798} {"train_loss": -25.06519317626953, "global_step": 315235, "epoch": 3798} {"train_loss": -25.380043029785156, "global_step": 315236, "epoch": 3798} {"train_loss": -25.36575698852539, "global_step": 315237, "epoch": 3798} {"train_loss": -25.224018096923828, "global_step": 315238, "epoch": 3798} {"train_loss": -25.023035049438477, "global_step": 315239, "epoch": 3798} {"train_loss": -24.963041305541992, "global_step": 315240, "epoch": 3798} {"train_loss": -25.253747940063477, "global_step": 315241, "epoch": 3798} {"train_loss": -25.37177848815918, "global_step": 315242, "epoch": 3798} {"train_loss": -25.14961814880371, "global_step": 315243, "epoch": 3798} {"train_loss": -25.138856887817383, "global_step": 315244, "epoch": 3798} {"train_loss": -25.341646194458008, "global_step": 315245, "epoch": 3798} {"train_loss": -25.142684936523438, "global_step": 315246, "epoch": 3798} {"train_loss": -25.532474517822266, "global_step": 315247, "epoch": 3798} {"train_loss": -25.362333297729492, "global_step": 315248, "epoch": 3798} {"train_loss": -25.707748413085938, "global_step": 315249, "epoch": 3798} {"train_loss": -25.27701759338379, "global_step": 315250, "epoch": 3798} {"train_loss": -25.592609405517578, "global_step": 315251, "epoch": 3798} {"train_loss": -25.612974166870117, "global_step": 315252, "epoch": 3798} {"train_loss": -25.654953002929688, "global_step": 315253, "epoch": 3798} {"train_loss": -25.664234161376953, "global_step": 315254, "epoch": 3798} {"train_loss": -25.625335693359375, "global_step": 315255, "epoch": 3798} {"train_loss": -25.776203155517578, "global_step": 315256, "epoch": 3798} {"train_loss": -25.560171127319336, "global_step": 315257, "epoch": 3798} {"train_loss": -25.624555587768555, "global_step": 315258, "epoch": 3798} {"train_loss": -25.90217399597168, "global_step": 315259, "epoch": 3798} {"train_loss": -25.71596336364746, "global_step": 315260, "epoch": 3798} {"train_loss": -25.788007736206055, "global_step": 315261, "epoch": 3798} {"train_loss": -25.428876876831055, "global_step": 315262, "epoch": 3798} {"train_loss": -26.002349853515625, "global_step": 315263, "epoch": 3798} {"train_loss": -25.887470245361328, "global_step": 315264, "epoch": 3798} {"train_loss": -25.916166305541992, "global_step": 315265, "epoch": 3798} {"train_loss": -25.6015682220459, "global_step": 315266, "epoch": 3798} {"train_loss": -25.74827003479004, "global_step": 315267, "epoch": 3798} {"train_loss": -26.049535751342773, "global_step": 315268, "epoch": 3798} {"train_loss": -25.955921173095703, "global_step": 315269, "epoch": 3798} {"train_loss": -25.51200294494629, "global_step": 315270, "epoch": 3798} {"train_loss": -25.791101455688477, "global_step": 315271, "epoch": 3798} {"train_loss": -26.0732364654541, "global_step": 315272, "epoch": 3798} {"train_loss": -25.442964553833008, "global_step": 315273, "epoch": 3798} {"train_loss": -25.85207176208496, "global_step": 315274, "epoch": 3798} {"train_loss": -26.191869735717773, "global_step": 315275, "epoch": 3798} {"train_loss": -25.768224716186523, "global_step": 315276, "epoch": 3798} {"train_loss": -25.905261993408203, "global_step": 315277, "epoch": 3798} {"train_loss": -25.881759643554688, "global_step": 315278, "epoch": 3798} {"train_loss": -25.907506942749023, "global_step": 315279, "epoch": 3798} {"train_loss": -25.927082061767578, "global_step": 315280, "epoch": 3798} {"train_loss": -25.696857452392578, "global_step": 315281, "epoch": 3798} {"train_loss": -25.754175186157227, "global_step": 315282, "epoch": 3798} {"train_loss": -26.059423446655273, "global_step": 315283, "epoch": 3798} {"train_loss": -25.56526756286621, "global_step": 315284, "epoch": 3798} {"train_loss": -26.148151397705078, "global_step": 315285, "epoch": 3798} {"train_loss": -26.104455947875977, "global_step": 315286, "epoch": 3798} {"train_loss": -25.90537452697754, "global_step": 315287, "epoch": 3798} {"train_loss": -25.81135368347168, "global_step": 315288, "epoch": 3798} {"train_loss": -25.917734146118164, "global_step": 315289, "epoch": 3798} {"train_loss": -25.835996627807617, "global_step": 315290, "epoch": 3798} {"train_loss": -26.095251083374023, "global_step": 315291, "epoch": 3798} {"train_loss": -25.592529296875, "global_step": 315292, "epoch": 3798} {"train_loss": -25.840219497680664, "global_step": 315293, "epoch": 3798} {"train_loss": -25.928695678710938, "global_step": 315294, "epoch": 3798} {"train_loss": -25.906951904296875, "global_step": 315295, "epoch": 3798} {"train_loss": -25.653827667236328, "global_step": 315296, "epoch": 3798} {"train_loss": -25.60284423828125, "global_step": 315297, "epoch": 3798} {"train_loss": -25.862531661987305, "global_step": 315298, "epoch": 3798} {"train_loss": -26.057022094726562, "global_step": 315299, "epoch": 3798} {"train_loss": -25.8551082611084, "global_step": 315300, "epoch": 3798} {"train_loss": -25.95673942565918, "global_step": 315301, "epoch": 3798} {"train_loss": -25.814624786376953, "global_step": 315302, "epoch": 3798} {"train_loss": -26.0717716217041, "global_step": 315303, "epoch": 3798} {"train_loss": -25.925466537475586, "global_step": 315304, "epoch": 3798} {"train_loss": -25.93051528930664, "global_step": 315305, "epoch": 3798} {"train_loss": -25.537010192871094, "global_step": 315306, "epoch": 3798} {"train_loss": -25.867273330688477, "global_step": 315307, "epoch": 3798} {"train_loss": -26.225982666015625, "global_step": 315308, "epoch": 3798} {"train_loss": -26.052433013916016, "global_step": 315309, "epoch": 3798} {"train_loss": -25.819046020507812, "global_step": 315310, "epoch": 3798} {"train_loss": -26.0485897064209, "global_step": 315311, "epoch": 3798} {"train_loss": -25.7923641204834, "global_step": 315312, "epoch": 3798} {"train_loss": -26.27619743347168, "global_step": 315313, "epoch": 3798} {"train_loss": -25.969167709350586, "global_step": 315314, "epoch": 3798} {"train_loss": -25.99909019470215, "global_step": 315315, "epoch": 3798} {"train_loss": -25.724073501954596, "global_step": 315316, "epoch": 3798, "val_loss": 7404247.5} {"train_loss": -25.716184616088867, "global_step": 315317, "epoch": 3799} {"train_loss": -25.088470458984375, "global_step": 315318, "epoch": 3799} {"train_loss": -25.311481475830078, "global_step": 315319, "epoch": 3799} {"train_loss": -25.377716064453125, "global_step": 315320, "epoch": 3799} {"train_loss": -25.2002010345459, "global_step": 315321, "epoch": 3799} {"train_loss": -25.41816520690918, "global_step": 315322, "epoch": 3799} {"train_loss": -25.19996452331543, "global_step": 315323, "epoch": 3799} {"train_loss": -25.15370750427246, "global_step": 315324, "epoch": 3799} {"train_loss": -25.392879486083984, "global_step": 315325, "epoch": 3799} {"train_loss": -25.440799713134766, "global_step": 315326, "epoch": 3799} {"train_loss": -25.74017906188965, "global_step": 315327, "epoch": 3799} {"train_loss": -25.36482048034668, "global_step": 315328, "epoch": 3799} {"train_loss": -25.28009605407715, "global_step": 315329, "epoch": 3799} {"train_loss": -25.576248168945312, "global_step": 315330, "epoch": 3799} {"train_loss": -25.785053253173828, "global_step": 315331, "epoch": 3799} {"train_loss": -25.6715030670166, "global_step": 315332, "epoch": 3799} {"train_loss": -25.421842575073242, "global_step": 315333, "epoch": 3799} {"train_loss": -25.696561813354492, "global_step": 315334, "epoch": 3799} {"train_loss": -25.827655792236328, "global_step": 315335, "epoch": 3799} {"train_loss": -25.955968856811523, "global_step": 315336, "epoch": 3799} {"train_loss": -25.34486961364746, "global_step": 315337, "epoch": 3799} {"train_loss": -25.734479904174805, "global_step": 315338, "epoch": 3799} {"train_loss": -25.720600128173828, "global_step": 315339, "epoch": 3799} {"train_loss": -25.735380172729492, "global_step": 315340, "epoch": 3799} {"train_loss": -26.06789207458496, "global_step": 315341, "epoch": 3799} {"train_loss": -25.773725509643555, "global_step": 315342, "epoch": 3799} {"train_loss": -25.973745346069336, "global_step": 315343, "epoch": 3799} {"train_loss": -25.55965232849121, "global_step": 315344, "epoch": 3799} {"train_loss": -25.83233070373535, "global_step": 315345, "epoch": 3799} {"train_loss": -25.194347381591797, "global_step": 315346, "epoch": 3799} {"train_loss": -25.836719512939453, "global_step": 315347, "epoch": 3799} {"train_loss": -25.965192794799805, "global_step": 315348, "epoch": 3799} {"train_loss": -25.861164093017578, "global_step": 315349, "epoch": 3799} {"train_loss": -25.73981285095215, "global_step": 315350, "epoch": 3799} {"train_loss": -25.677249908447266, "global_step": 315351, "epoch": 3799} {"train_loss": -25.97918701171875, "global_step": 315352, "epoch": 3799} {"train_loss": -25.734891891479492, "global_step": 315353, "epoch": 3799} {"train_loss": -25.28412628173828, "global_step": 315354, "epoch": 3799} {"train_loss": -25.841989517211914, "global_step": 315355, "epoch": 3799} {"train_loss": -26.097309112548828, "global_step": 315356, "epoch": 3799} {"train_loss": -25.683704376220703, "global_step": 315357, "epoch": 3799} {"train_loss": -25.872175216674805, "global_step": 315358, "epoch": 3799} {"train_loss": -25.831039428710938, "global_step": 315359, "epoch": 3799} {"train_loss": -25.827930450439453, "global_step": 315360, "epoch": 3799} {"train_loss": -25.964649200439453, "global_step": 315361, "epoch": 3799} {"train_loss": -25.74958610534668, "global_step": 315362, "epoch": 3799} {"train_loss": -25.7367000579834, "global_step": 315363, "epoch": 3799} {"train_loss": -25.837209701538086, "global_step": 315364, "epoch": 3799} {"train_loss": -25.854467391967773, "global_step": 315365, "epoch": 3799} {"train_loss": -25.341398239135742, "global_step": 315366, "epoch": 3799} {"train_loss": -26.0325870513916, "global_step": 315367, "epoch": 3799} {"train_loss": -26.017126083374023, "global_step": 315368, "epoch": 3799} {"train_loss": -25.697101593017578, "global_step": 315369, "epoch": 3799} {"train_loss": -25.630659103393555, "global_step": 315370, "epoch": 3799} {"train_loss": -25.801111221313477, "global_step": 315371, "epoch": 3799} {"train_loss": -25.72235107421875, "global_step": 315372, "epoch": 3799} {"train_loss": -25.905231475830078, "global_step": 315373, "epoch": 3799} {"train_loss": -25.73736000061035, "global_step": 315374, "epoch": 3799} {"train_loss": -25.784658432006836, "global_step": 315375, "epoch": 3799} {"train_loss": -25.53760528564453, "global_step": 315376, "epoch": 3799} {"train_loss": -26.013574600219727, "global_step": 315377, "epoch": 3799} {"train_loss": -26.039026260375977, "global_step": 315378, "epoch": 3799} {"train_loss": -26.23200798034668, "global_step": 315379, "epoch": 3799} {"train_loss": -26.00864601135254, "global_step": 315380, "epoch": 3799} {"train_loss": -25.620929718017578, "global_step": 315381, "epoch": 3799} {"train_loss": -25.52137565612793, "global_step": 315382, "epoch": 3799} {"train_loss": -25.918731689453125, "global_step": 315383, "epoch": 3799} {"train_loss": -26.0154972076416, "global_step": 315384, "epoch": 3799} {"train_loss": -25.904815673828125, "global_step": 315385, "epoch": 3799} {"train_loss": -25.53158950805664, "global_step": 315386, "epoch": 3799} {"train_loss": -26.02615737915039, "global_step": 315387, "epoch": 3799} {"train_loss": -25.708765029907227, "global_step": 315388, "epoch": 3799} {"train_loss": -26.171173095703125, "global_step": 315389, "epoch": 3799} {"train_loss": -25.782739639282227, "global_step": 315390, "epoch": 3799} {"train_loss": -25.8560791015625, "global_step": 315391, "epoch": 3799} {"train_loss": -25.82065773010254, "global_step": 315392, "epoch": 3799} {"train_loss": -25.97356605529785, "global_step": 315393, "epoch": 3799} {"train_loss": -25.74836540222168, "global_step": 315394, "epoch": 3799} {"train_loss": -25.890607833862305, "global_step": 315395, "epoch": 3799} {"train_loss": -25.659265518188477, "global_step": 315396, "epoch": 3799} {"train_loss": -25.90228271484375, "global_step": 315397, "epoch": 3799} {"train_loss": -25.9594669342041, "global_step": 315398, "epoch": 3799} {"train_loss": -25.73378590503371, "global_step": 315399, "epoch": 3799, "val_loss": 7265060.0} {"train_loss": -24.74065589904785, "global_step": 315400, "epoch": 3800} {"train_loss": -24.38614273071289, "global_step": 315401, "epoch": 3800} {"train_loss": -24.456754684448242, "global_step": 315402, "epoch": 3800} {"train_loss": -24.780752182006836, "global_step": 315403, "epoch": 3800} {"train_loss": -25.07957649230957, "global_step": 315404, "epoch": 3800} {"train_loss": -25.10591697692871, "global_step": 315405, "epoch": 3800} {"train_loss": -25.437681198120117, "global_step": 315406, "epoch": 3800} {"train_loss": -25.437692642211914, "global_step": 315407, "epoch": 3800} {"train_loss": -24.98993492126465, "global_step": 315408, "epoch": 3800} {"train_loss": -25.249759674072266, "global_step": 315409, "epoch": 3800} {"train_loss": -25.207225799560547, "global_step": 315410, "epoch": 3800} {"train_loss": -25.121496200561523, "global_step": 315411, "epoch": 3800} {"train_loss": -25.386396408081055, "global_step": 315412, "epoch": 3800} {"train_loss": -25.6668758392334, "global_step": 315413, "epoch": 3800} {"train_loss": -25.344058990478516, "global_step": 315414, "epoch": 3800} {"train_loss": -25.423351287841797, "global_step": 315415, "epoch": 3800} {"train_loss": -25.801010131835938, "global_step": 315416, "epoch": 3800} {"train_loss": -25.335615158081055, "global_step": 315417, "epoch": 3800} {"train_loss": -25.47271156311035, "global_step": 315418, "epoch": 3800} {"train_loss": -25.647443771362305, "global_step": 315419, "epoch": 3800} {"train_loss": -25.383380889892578, "global_step": 315420, "epoch": 3800} {"train_loss": -25.577905654907227, "global_step": 315421, "epoch": 3800} {"train_loss": -25.648101806640625, "global_step": 315422, "epoch": 3800} {"train_loss": -25.670881271362305, "global_step": 315423, "epoch": 3800} {"train_loss": -25.27848243713379, "global_step": 315424, "epoch": 3800} {"train_loss": -25.58587646484375, "global_step": 315425, "epoch": 3800} {"train_loss": -25.764699935913086, "global_step": 315426, "epoch": 3800} {"train_loss": -25.5444278717041, "global_step": 315427, "epoch": 3800} {"train_loss": -25.779956817626953, "global_step": 315428, "epoch": 3800} {"train_loss": -25.94435691833496, "global_step": 315429, "epoch": 3800} {"train_loss": -25.5966739654541, "global_step": 315430, "epoch": 3800} {"train_loss": -25.63071060180664, "global_step": 315431, "epoch": 3800} {"train_loss": -25.300146102905273, "global_step": 315432, "epoch": 3800} {"train_loss": -25.97395133972168, "global_step": 315433, "epoch": 3800} {"train_loss": -26.05344581604004, "global_step": 315434, "epoch": 3800} {"train_loss": -25.6220703125, "global_step": 315435, "epoch": 3800} {"train_loss": -25.775964736938477, "global_step": 315436, "epoch": 3800} {"train_loss": -25.82752799987793, "global_step": 315437, "epoch": 3800} {"train_loss": -25.830707550048828, "global_step": 315438, "epoch": 3800} {"train_loss": -25.78700828552246, "global_step": 315439, "epoch": 3800} {"train_loss": -25.805789947509766, "global_step": 315440, "epoch": 3800} {"train_loss": -26.17364501953125, "global_step": 315441, "epoch": 3800} {"train_loss": -25.79249382019043, "global_step": 315442, "epoch": 3800} {"train_loss": -25.962987899780273, "global_step": 315443, "epoch": 3800} {"train_loss": -25.867273330688477, "global_step": 315444, "epoch": 3800} {"train_loss": -26.106664657592773, "global_step": 315445, "epoch": 3800} {"train_loss": -26.1549129486084, "global_step": 315446, "epoch": 3800} {"train_loss": -25.643238067626953, "global_step": 315447, "epoch": 3800} {"train_loss": -25.738727569580078, "global_step": 315448, "epoch": 3800} {"train_loss": -25.43625259399414, "global_step": 315449, "epoch": 3800} {"train_loss": -26.101552963256836, "global_step": 315450, "epoch": 3800} {"train_loss": -25.7205810546875, "global_step": 315451, "epoch": 3800} {"train_loss": -25.757049560546875, "global_step": 315452, "epoch": 3800} {"train_loss": -25.287322998046875, "global_step": 315453, "epoch": 3800} {"train_loss": -25.984882354736328, "global_step": 315454, "epoch": 3800} {"train_loss": -25.59469223022461, "global_step": 315455, "epoch": 3800} {"train_loss": -25.822101593017578, "global_step": 315456, "epoch": 3800} {"train_loss": -25.779682159423828, "global_step": 315457, "epoch": 3800} {"train_loss": -25.774280548095703, "global_step": 315458, "epoch": 3800} {"train_loss": -25.824365615844727, "global_step": 315459, "epoch": 3800} {"train_loss": -25.8013858795166, "global_step": 315460, "epoch": 3800} {"train_loss": -25.687891006469727, "global_step": 315461, "epoch": 3800} {"train_loss": -25.389204025268555, "global_step": 315462, "epoch": 3800} {"train_loss": -25.735647201538086, "global_step": 315463, "epoch": 3800} {"train_loss": -25.856901168823242, "global_step": 315464, "epoch": 3800} {"train_loss": -25.817991256713867, "global_step": 315465, "epoch": 3800} {"train_loss": -25.10146141052246, "global_step": 315466, "epoch": 3800} {"train_loss": -25.474088668823242, "global_step": 315467, "epoch": 3800} {"train_loss": -25.45406150817871, "global_step": 315468, "epoch": 3800} {"train_loss": -25.575042724609375, "global_step": 315469, "epoch": 3800} {"train_loss": -25.431140899658203, "global_step": 315470, "epoch": 3800} {"train_loss": -25.278493881225586, "global_step": 315471, "epoch": 3800} {"train_loss": -25.40528678894043, "global_step": 315472, "epoch": 3800} {"train_loss": -25.49183464050293, "global_step": 315473, "epoch": 3800} {"train_loss": -25.369604110717773, "global_step": 315474, "epoch": 3800} {"train_loss": -25.804885864257812, "global_step": 315475, "epoch": 3800} {"train_loss": -25.514448165893555, "global_step": 315476, "epoch": 3800} {"train_loss": -25.492650985717773, "global_step": 315477, "epoch": 3800} {"train_loss": -26.13506507873535, "global_step": 315478, "epoch": 3800} {"train_loss": -25.509567260742188, "global_step": 315479, "epoch": 3800} {"train_loss": -25.706512451171875, "global_step": 315480, "epoch": 3800} {"train_loss": -26.19366455078125, "global_step": 315481, "epoch": 3800} {"train_loss": -25.553910818444677, "global_step": 315482, "epoch": 3800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 7340399.0} {"train_loss": -24.164648056030273, "global_step": 315483, "epoch": 3801} {"train_loss": -24.391433715820312, "global_step": 315484, "epoch": 3801} {"train_loss": -25.16995620727539, "global_step": 315485, "epoch": 3801} {"train_loss": -24.60706901550293, "global_step": 315486, "epoch": 3801} {"train_loss": -24.938840866088867, "global_step": 315487, "epoch": 3801} {"train_loss": -25.007516860961914, "global_step": 315488, "epoch": 3801} {"train_loss": -24.815574645996094, "global_step": 315489, "epoch": 3801} {"train_loss": -25.095083236694336, "global_step": 315490, "epoch": 3801} {"train_loss": -25.10384750366211, "global_step": 315491, "epoch": 3801} {"train_loss": -25.210758209228516, "global_step": 315492, "epoch": 3801} {"train_loss": -25.53103256225586, "global_step": 315493, "epoch": 3801} {"train_loss": -25.150981903076172, "global_step": 315494, "epoch": 3801} {"train_loss": -24.98793601989746, "global_step": 315495, "epoch": 3801} {"train_loss": -25.063261032104492, "global_step": 315496, "epoch": 3801} {"train_loss": -25.439105987548828, "global_step": 315497, "epoch": 3801} {"train_loss": -25.489582061767578, "global_step": 315498, "epoch": 3801} {"train_loss": -25.55597496032715, "global_step": 315499, "epoch": 3801} {"train_loss": -25.261816024780273, "global_step": 315500, "epoch": 3801} {"train_loss": -25.345190048217773, "global_step": 315501, "epoch": 3801} {"train_loss": -25.739953994750977, "global_step": 315502, "epoch": 3801} {"train_loss": -25.634296417236328, "global_step": 315503, "epoch": 3801} {"train_loss": -25.977447509765625, "global_step": 315504, "epoch": 3801} {"train_loss": -25.63010597229004, "global_step": 315505, "epoch": 3801} {"train_loss": -25.896642684936523, "global_step": 315506, "epoch": 3801} {"train_loss": -25.615234375, "global_step": 315507, "epoch": 3801} {"train_loss": -25.288227081298828, "global_step": 315508, "epoch": 3801} {"train_loss": -26.022323608398438, "global_step": 315509, "epoch": 3801} {"train_loss": -25.763181686401367, "global_step": 315510, "epoch": 3801} {"train_loss": -25.8529109954834, "global_step": 315511, "epoch": 3801} {"train_loss": -25.7540283203125, "global_step": 315512, "epoch": 3801} {"train_loss": -26.042041778564453, "global_step": 315513, "epoch": 3801} {"train_loss": -25.97916603088379, "global_step": 315514, "epoch": 3801} {"train_loss": -26.09671974182129, "global_step": 315515, "epoch": 3801} {"train_loss": -26.03785514831543, "global_step": 315516, "epoch": 3801} {"train_loss": -25.9222469329834, "global_step": 315517, "epoch": 3801} {"train_loss": -26.091766357421875, "global_step": 315518, "epoch": 3801} {"train_loss": -25.499685287475586, "global_step": 315519, "epoch": 3801} {"train_loss": -25.610776901245117, "global_step": 315520, "epoch": 3801} {"train_loss": -25.648365020751953, "global_step": 315521, "epoch": 3801} {"train_loss": -26.091917037963867, "global_step": 315522, "epoch": 3801} {"train_loss": -26.0549259185791, "global_step": 315523, "epoch": 3801} {"train_loss": -25.66510009765625, "global_step": 315524, "epoch": 3801} {"train_loss": -26.053014755249023, "global_step": 315525, "epoch": 3801} {"train_loss": -25.9468994140625, "global_step": 315526, "epoch": 3801} {"train_loss": -25.939573287963867, "global_step": 315527, "epoch": 3801} {"train_loss": -26.13176918029785, "global_step": 315528, "epoch": 3801} {"train_loss": -26.22822380065918, "global_step": 315529, "epoch": 3801} {"train_loss": -26.182971954345703, "global_step": 315530, "epoch": 3801} {"train_loss": -26.04811668395996, "global_step": 315531, "epoch": 3801} {"train_loss": -26.051366806030273, "global_step": 315532, "epoch": 3801} {"train_loss": -26.14231300354004, "global_step": 315533, "epoch": 3801} {"train_loss": -25.869464874267578, "global_step": 315534, "epoch": 3801} {"train_loss": -25.8430118560791, "global_step": 315535, "epoch": 3801} {"train_loss": -26.19791603088379, "global_step": 315536, "epoch": 3801} {"train_loss": -25.9399356842041, "global_step": 315537, "epoch": 3801} {"train_loss": -25.746540069580078, "global_step": 315538, "epoch": 3801} {"train_loss": -25.890745162963867, "global_step": 315539, "epoch": 3801} {"train_loss": -25.883228302001953, "global_step": 315540, "epoch": 3801} {"train_loss": -25.84246826171875, "global_step": 315541, "epoch": 3801} {"train_loss": -26.1068115234375, "global_step": 315542, "epoch": 3801} {"train_loss": -25.754322052001953, "global_step": 315543, "epoch": 3801} {"train_loss": -25.81598472595215, "global_step": 315544, "epoch": 3801} {"train_loss": -25.943302154541016, "global_step": 315545, "epoch": 3801} {"train_loss": -25.733015060424805, "global_step": 315546, "epoch": 3801} {"train_loss": -25.9027156829834, "global_step": 315547, "epoch": 3801} {"train_loss": -26.066259384155273, "global_step": 315548, "epoch": 3801} {"train_loss": -25.70330238342285, "global_step": 315549, "epoch": 3801} {"train_loss": -25.719236373901367, "global_step": 315550, "epoch": 3801} {"train_loss": -26.02463150024414, "global_step": 315551, "epoch": 3801} {"train_loss": -25.784381866455078, "global_step": 315552, "epoch": 3801} {"train_loss": -25.8836612701416, "global_step": 315553, "epoch": 3801} {"train_loss": -25.68170166015625, "global_step": 315554, "epoch": 3801} {"train_loss": -25.92002296447754, "global_step": 315555, "epoch": 3801} {"train_loss": -25.959625244140625, "global_step": 315556, "epoch": 3801} {"train_loss": -26.201171875, "global_step": 315557, "epoch": 3801} {"train_loss": -25.836456298828125, "global_step": 315558, "epoch": 3801} {"train_loss": -26.008686065673828, "global_step": 315559, "epoch": 3801} {"train_loss": -25.404804229736328, "global_step": 315560, "epoch": 3801} {"train_loss": -25.69174575805664, "global_step": 315561, "epoch": 3801} {"train_loss": -25.55931282043457, "global_step": 315562, "epoch": 3801} {"train_loss": -25.68543815612793, "global_step": 315563, "epoch": 3801} {"train_loss": -25.782880783081055, "global_step": 315564, "epoch": 3801} {"train_loss": -25.683781221688513, "global_step": 315565, "epoch": 3801, "val_loss": 7229339.0} {"train_loss": -25.109134674072266, "global_step": 315566, "epoch": 3802} {"train_loss": -25.144697189331055, "global_step": 315567, "epoch": 3802} {"train_loss": -24.988805770874023, "global_step": 315568, "epoch": 3802} {"train_loss": -25.3961124420166, "global_step": 315569, "epoch": 3802} {"train_loss": -24.944717407226562, "global_step": 315570, "epoch": 3802} {"train_loss": -25.870391845703125, "global_step": 315571, "epoch": 3802} {"train_loss": -25.11865997314453, "global_step": 315572, "epoch": 3802} {"train_loss": -25.504825592041016, "global_step": 315573, "epoch": 3802} {"train_loss": -25.337814331054688, "global_step": 315574, "epoch": 3802} {"train_loss": -25.54091453552246, "global_step": 315575, "epoch": 3802} {"train_loss": -25.622289657592773, "global_step": 315576, "epoch": 3802} {"train_loss": -25.025754928588867, "global_step": 315577, "epoch": 3802} {"train_loss": -25.602203369140625, "global_step": 315578, "epoch": 3802} {"train_loss": -25.092374801635742, "global_step": 315579, "epoch": 3802} {"train_loss": -25.341230392456055, "global_step": 315580, "epoch": 3802} {"train_loss": -25.815185546875, "global_step": 315581, "epoch": 3802} {"train_loss": -25.076459884643555, "global_step": 315582, "epoch": 3802} {"train_loss": -25.930688858032227, "global_step": 315583, "epoch": 3802} {"train_loss": -25.514419555664062, "global_step": 315584, "epoch": 3802} {"train_loss": -25.48980140686035, "global_step": 315585, "epoch": 3802} {"train_loss": -25.62603187561035, "global_step": 315586, "epoch": 3802} {"train_loss": -25.502857208251953, "global_step": 315587, "epoch": 3802} {"train_loss": -25.305335998535156, "global_step": 315588, "epoch": 3802} {"train_loss": -25.836923599243164, "global_step": 315589, "epoch": 3802} {"train_loss": -25.78899574279785, "global_step": 315590, "epoch": 3802} {"train_loss": -25.811416625976562, "global_step": 315591, "epoch": 3802} {"train_loss": -25.57297134399414, "global_step": 315592, "epoch": 3802} {"train_loss": -25.634662628173828, "global_step": 315593, "epoch": 3802} {"train_loss": -26.052997589111328, "global_step": 315594, "epoch": 3802} {"train_loss": -25.90687370300293, "global_step": 315595, "epoch": 3802} {"train_loss": -25.710351943969727, "global_step": 315596, "epoch": 3802} {"train_loss": -25.832630157470703, "global_step": 315597, "epoch": 3802} {"train_loss": -25.758991241455078, "global_step": 315598, "epoch": 3802} {"train_loss": -25.668500900268555, "global_step": 315599, "epoch": 3802} {"train_loss": -25.83609390258789, "global_step": 315600, "epoch": 3802} {"train_loss": -25.52367401123047, "global_step": 315601, "epoch": 3802} {"train_loss": -26.10699462890625, "global_step": 315602, "epoch": 3802} {"train_loss": -26.04170036315918, "global_step": 315603, "epoch": 3802} {"train_loss": -25.923751831054688, "global_step": 315604, "epoch": 3802} {"train_loss": -26.067859649658203, "global_step": 315605, "epoch": 3802} {"train_loss": -25.84113883972168, "global_step": 315606, "epoch": 3802} {"train_loss": -25.7349796295166, "global_step": 315607, "epoch": 3802} {"train_loss": -26.074304580688477, "global_step": 315608, "epoch": 3802} {"train_loss": -26.492172241210938, "global_step": 315609, "epoch": 3802} {"train_loss": -25.534400939941406, "global_step": 315610, "epoch": 3802} {"train_loss": -25.851154327392578, "global_step": 315611, "epoch": 3802} {"train_loss": -25.80112075805664, "global_step": 315612, "epoch": 3802} {"train_loss": -26.208881378173828, "global_step": 315613, "epoch": 3802} {"train_loss": -26.005231857299805, "global_step": 315614, "epoch": 3802} {"train_loss": -26.04176139831543, "global_step": 315615, "epoch": 3802} {"train_loss": -25.87701416015625, "global_step": 315616, "epoch": 3802} {"train_loss": -26.027067184448242, "global_step": 315617, "epoch": 3802} {"train_loss": -25.479612350463867, "global_step": 315618, "epoch": 3802} {"train_loss": -26.22285270690918, "global_step": 315619, "epoch": 3802} {"train_loss": -25.66269874572754, "global_step": 315620, "epoch": 3802} {"train_loss": -25.96305274963379, "global_step": 315621, "epoch": 3802} {"train_loss": -25.72028923034668, "global_step": 315622, "epoch": 3802} {"train_loss": -25.730207443237305, "global_step": 315623, "epoch": 3802} {"train_loss": -26.034381866455078, "global_step": 315624, "epoch": 3802} {"train_loss": -25.6627140045166, "global_step": 315625, "epoch": 3802} {"train_loss": -25.867101669311523, "global_step": 315626, "epoch": 3802} {"train_loss": -25.720483779907227, "global_step": 315627, "epoch": 3802} {"train_loss": -25.95804214477539, "global_step": 315628, "epoch": 3802} {"train_loss": -25.880268096923828, "global_step": 315629, "epoch": 3802} {"train_loss": -25.56333351135254, "global_step": 315630, "epoch": 3802} {"train_loss": -24.868391036987305, "global_step": 315631, "epoch": 3802} {"train_loss": -23.999326705932617, "global_step": 315632, "epoch": 3802} {"train_loss": -22.635482788085938, "global_step": 315633, "epoch": 3802} {"train_loss": -22.931943893432617, "global_step": 315634, "epoch": 3802} {"train_loss": -24.562305450439453, "global_step": 315635, "epoch": 3802} {"train_loss": -24.07994842529297, "global_step": 315636, "epoch": 3802} {"train_loss": -24.940305709838867, "global_step": 315637, "epoch": 3802} {"train_loss": -24.640995025634766, "global_step": 315638, "epoch": 3802} {"train_loss": -24.636152267456055, "global_step": 315639, "epoch": 3802} {"train_loss": -25.545698165893555, "global_step": 315640, "epoch": 3802} {"train_loss": -25.246633529663086, "global_step": 315641, "epoch": 3802} {"train_loss": -25.241762161254883, "global_step": 315642, "epoch": 3802} {"train_loss": -25.268260955810547, "global_step": 315643, "epoch": 3802} {"train_loss": -25.46196174621582, "global_step": 315644, "epoch": 3802} {"train_loss": -24.8789119720459, "global_step": 315645, "epoch": 3802} {"train_loss": -25.710874557495117, "global_step": 315646, "epoch": 3802} {"train_loss": -25.550128936767578, "global_step": 315647, "epoch": 3802} {"train_loss": -25.481923436544026, "global_step": 315648, "epoch": 3802, "val_loss": 7223915.0} {"train_loss": -24.623329162597656, "global_step": 315649, "epoch": 3803} {"train_loss": -25.21681022644043, "global_step": 315650, "epoch": 3803} {"train_loss": -25.282522201538086, "global_step": 315651, "epoch": 3803} {"train_loss": -25.115400314331055, "global_step": 315652, "epoch": 3803} {"train_loss": -24.845842361450195, "global_step": 315653, "epoch": 3803} {"train_loss": -24.790714263916016, "global_step": 315654, "epoch": 3803} {"train_loss": -25.152681350708008, "global_step": 315655, "epoch": 3803} {"train_loss": -25.380252838134766, "global_step": 315656, "epoch": 3803} {"train_loss": -25.111379623413086, "global_step": 315657, "epoch": 3803} {"train_loss": -25.01234245300293, "global_step": 315658, "epoch": 3803} {"train_loss": -25.046222686767578, "global_step": 315659, "epoch": 3803} {"train_loss": -25.429813385009766, "global_step": 315660, "epoch": 3803} {"train_loss": -25.192655563354492, "global_step": 315661, "epoch": 3803} {"train_loss": -25.35761070251465, "global_step": 315662, "epoch": 3803} {"train_loss": -25.12816047668457, "global_step": 315663, "epoch": 3803} {"train_loss": -25.271873474121094, "global_step": 315664, "epoch": 3803} {"train_loss": -25.672468185424805, "global_step": 315665, "epoch": 3803} {"train_loss": -25.462953567504883, "global_step": 315666, "epoch": 3803} {"train_loss": -25.746976852416992, "global_step": 315667, "epoch": 3803} {"train_loss": -25.234739303588867, "global_step": 315668, "epoch": 3803} {"train_loss": -25.159854888916016, "global_step": 315669, "epoch": 3803} {"train_loss": -25.560012817382812, "global_step": 315670, "epoch": 3803} {"train_loss": -25.535764694213867, "global_step": 315671, "epoch": 3803} {"train_loss": -25.292240142822266, "global_step": 315672, "epoch": 3803} {"train_loss": -25.704877853393555, "global_step": 315673, "epoch": 3803} {"train_loss": -25.53449821472168, "global_step": 315674, "epoch": 3803} {"train_loss": -25.49306297302246, "global_step": 315675, "epoch": 3803} {"train_loss": -25.889606475830078, "global_step": 315676, "epoch": 3803} {"train_loss": -25.356494903564453, "global_step": 315677, "epoch": 3803} {"train_loss": -25.460878372192383, "global_step": 315678, "epoch": 3803} {"train_loss": -25.874128341674805, "global_step": 315679, "epoch": 3803} {"train_loss": -25.935041427612305, "global_step": 315680, "epoch": 3803} {"train_loss": -25.861352920532227, "global_step": 315681, "epoch": 3803} {"train_loss": -25.57840347290039, "global_step": 315682, "epoch": 3803} {"train_loss": -25.998035430908203, "global_step": 315683, "epoch": 3803} {"train_loss": -25.504125595092773, "global_step": 315684, "epoch": 3803} {"train_loss": -25.645292282104492, "global_step": 315685, "epoch": 3803} {"train_loss": -26.02848243713379, "global_step": 315686, "epoch": 3803} {"train_loss": -25.78272819519043, "global_step": 315687, "epoch": 3803} {"train_loss": -25.539487838745117, "global_step": 315688, "epoch": 3803} {"train_loss": -25.631031036376953, "global_step": 315689, "epoch": 3803} {"train_loss": -25.78376579284668, "global_step": 315690, "epoch": 3803} {"train_loss": -25.937158584594727, "global_step": 315691, "epoch": 3803} {"train_loss": -25.44142723083496, "global_step": 315692, "epoch": 3803} {"train_loss": -25.60527992248535, "global_step": 315693, "epoch": 3803} {"train_loss": -25.348899841308594, "global_step": 315694, "epoch": 3803} {"train_loss": -25.95588493347168, "global_step": 315695, "epoch": 3803} {"train_loss": -26.0020809173584, "global_step": 315696, "epoch": 3803} {"train_loss": -25.947614669799805, "global_step": 315697, "epoch": 3803} {"train_loss": -25.540685653686523, "global_step": 315698, "epoch": 3803} {"train_loss": -25.678436279296875, "global_step": 315699, "epoch": 3803} {"train_loss": -25.584564208984375, "global_step": 315700, "epoch": 3803} {"train_loss": -26.175556182861328, "global_step": 315701, "epoch": 3803} {"train_loss": -25.731006622314453, "global_step": 315702, "epoch": 3803} {"train_loss": -25.78546142578125, "global_step": 315703, "epoch": 3803} {"train_loss": -25.982452392578125, "global_step": 315704, "epoch": 3803} {"train_loss": -25.711700439453125, "global_step": 315705, "epoch": 3803} {"train_loss": -25.747995376586914, "global_step": 315706, "epoch": 3803} {"train_loss": -25.65366554260254, "global_step": 315707, "epoch": 3803} {"train_loss": -25.6363525390625, "global_step": 315708, "epoch": 3803} {"train_loss": -25.946807861328125, "global_step": 315709, "epoch": 3803} {"train_loss": -25.95009422302246, "global_step": 315710, "epoch": 3803} {"train_loss": -26.157669067382812, "global_step": 315711, "epoch": 3803} {"train_loss": -25.94219970703125, "global_step": 315712, "epoch": 3803} {"train_loss": -25.960906982421875, "global_step": 315713, "epoch": 3803} {"train_loss": -26.052520751953125, "global_step": 315714, "epoch": 3803} {"train_loss": -25.86641502380371, "global_step": 315715, "epoch": 3803} {"train_loss": -25.87054443359375, "global_step": 315716, "epoch": 3803} {"train_loss": -25.930408477783203, "global_step": 315717, "epoch": 3803} {"train_loss": -25.755041122436523, "global_step": 315718, "epoch": 3803} {"train_loss": -26.06801414489746, "global_step": 315719, "epoch": 3803} {"train_loss": -25.864948272705078, "global_step": 315720, "epoch": 3803} {"train_loss": -25.957767486572266, "global_step": 315721, "epoch": 3803} {"train_loss": -25.860931396484375, "global_step": 315722, "epoch": 3803} {"train_loss": -26.06040382385254, "global_step": 315723, "epoch": 3803} {"train_loss": -26.444507598876953, "global_step": 315724, "epoch": 3803} {"train_loss": -26.243762969970703, "global_step": 315725, "epoch": 3803} {"train_loss": -26.301366806030273, "global_step": 315726, "epoch": 3803} {"train_loss": -26.49842643737793, "global_step": 315727, "epoch": 3803} {"train_loss": -25.881072998046875, "global_step": 315728, "epoch": 3803} {"train_loss": -25.970243453979492, "global_step": 315729, "epoch": 3803} {"train_loss": -25.883832931518555, "global_step": 315730, "epoch": 3803} {"train_loss": -25.672441781285297, "global_step": 315731, "epoch": 3803, "val_loss": 7416019.0} {"train_loss": -25.04872703552246, "global_step": 315732, "epoch": 3804} {"train_loss": -24.16470718383789, "global_step": 315733, "epoch": 3804} {"train_loss": -25.36977195739746, "global_step": 315734, "epoch": 3804} {"train_loss": -25.136459350585938, "global_step": 315735, "epoch": 3804} {"train_loss": -24.853971481323242, "global_step": 315736, "epoch": 3804} {"train_loss": -25.283761978149414, "global_step": 315737, "epoch": 3804} {"train_loss": -25.6834774017334, "global_step": 315738, "epoch": 3804} {"train_loss": -25.547582626342773, "global_step": 315739, "epoch": 3804} {"train_loss": -24.86756706237793, "global_step": 315740, "epoch": 3804} {"train_loss": -25.482913970947266, "global_step": 315741, "epoch": 3804} {"train_loss": -25.48615264892578, "global_step": 315742, "epoch": 3804} {"train_loss": -25.48656463623047, "global_step": 315743, "epoch": 3804} {"train_loss": -25.231748580932617, "global_step": 315744, "epoch": 3804} {"train_loss": -25.200963973999023, "global_step": 315745, "epoch": 3804} {"train_loss": -25.32331657409668, "global_step": 315746, "epoch": 3804} {"train_loss": -25.226591110229492, "global_step": 315747, "epoch": 3804} {"train_loss": -25.35260581970215, "global_step": 315748, "epoch": 3804} {"train_loss": -25.286239624023438, "global_step": 315749, "epoch": 3804} {"train_loss": -25.85310173034668, "global_step": 315750, "epoch": 3804} {"train_loss": -25.32206916809082, "global_step": 315751, "epoch": 3804} {"train_loss": -25.462583541870117, "global_step": 315752, "epoch": 3804} {"train_loss": -25.403228759765625, "global_step": 315753, "epoch": 3804} {"train_loss": -25.472063064575195, "global_step": 315754, "epoch": 3804} {"train_loss": -25.825031280517578, "global_step": 315755, "epoch": 3804} {"train_loss": -25.575193405151367, "global_step": 315756, "epoch": 3804} {"train_loss": -25.470458984375, "global_step": 315757, "epoch": 3804} {"train_loss": -25.52956199645996, "global_step": 315758, "epoch": 3804} {"train_loss": -25.448257446289062, "global_step": 315759, "epoch": 3804} {"train_loss": -25.457908630371094, "global_step": 315760, "epoch": 3804} {"train_loss": -25.508543014526367, "global_step": 315761, "epoch": 3804} {"train_loss": -25.480148315429688, "global_step": 315762, "epoch": 3804} {"train_loss": -25.74233055114746, "global_step": 315763, "epoch": 3804} {"train_loss": -25.34768295288086, "global_step": 315764, "epoch": 3804} {"train_loss": -25.50301170349121, "global_step": 315765, "epoch": 3804} {"train_loss": -25.756061553955078, "global_step": 315766, "epoch": 3804} {"train_loss": -25.698637008666992, "global_step": 315767, "epoch": 3804} {"train_loss": -25.738983154296875, "global_step": 315768, "epoch": 3804} {"train_loss": -26.15729331970215, "global_step": 315769, "epoch": 3804} {"train_loss": -26.413253784179688, "global_step": 315770, "epoch": 3804} {"train_loss": -26.130666732788086, "global_step": 315771, "epoch": 3804} {"train_loss": -25.436763763427734, "global_step": 315772, "epoch": 3804} {"train_loss": -25.813140869140625, "global_step": 315773, "epoch": 3804} {"train_loss": -25.97466468811035, "global_step": 315774, "epoch": 3804} {"train_loss": -25.848590850830078, "global_step": 315775, "epoch": 3804} {"train_loss": -25.948078155517578, "global_step": 315776, "epoch": 3804} {"train_loss": -25.81684684753418, "global_step": 315777, "epoch": 3804} {"train_loss": -25.60123634338379, "global_step": 315778, "epoch": 3804} {"train_loss": -25.60627555847168, "global_step": 315779, "epoch": 3804} {"train_loss": -26.042280197143555, "global_step": 315780, "epoch": 3804} {"train_loss": -26.11134147644043, "global_step": 315781, "epoch": 3804} {"train_loss": -25.438344955444336, "global_step": 315782, "epoch": 3804} {"train_loss": -26.115753173828125, "global_step": 315783, "epoch": 3804} {"train_loss": -25.93013572692871, "global_step": 315784, "epoch": 3804} {"train_loss": -25.81125831604004, "global_step": 315785, "epoch": 3804} {"train_loss": -26.102954864501953, "global_step": 315786, "epoch": 3804} {"train_loss": -25.900312423706055, "global_step": 315787, "epoch": 3804} {"train_loss": -25.78081703186035, "global_step": 315788, "epoch": 3804} {"train_loss": -26.139148712158203, "global_step": 315789, "epoch": 3804} {"train_loss": -25.9664363861084, "global_step": 315790, "epoch": 3804} {"train_loss": -25.8823299407959, "global_step": 315791, "epoch": 3804} {"train_loss": -25.651050567626953, "global_step": 315792, "epoch": 3804} {"train_loss": -25.4033260345459, "global_step": 315793, "epoch": 3804} {"train_loss": -25.65791893005371, "global_step": 315794, "epoch": 3804} {"train_loss": -26.230253219604492, "global_step": 315795, "epoch": 3804} {"train_loss": -25.902387619018555, "global_step": 315796, "epoch": 3804} {"train_loss": -25.6796817779541, "global_step": 315797, "epoch": 3804} {"train_loss": -25.714685440063477, "global_step": 315798, "epoch": 3804} {"train_loss": -25.896833419799805, "global_step": 315799, "epoch": 3804} {"train_loss": -26.030868530273438, "global_step": 315800, "epoch": 3804} {"train_loss": -25.794967651367188, "global_step": 315801, "epoch": 3804} {"train_loss": -25.078182220458984, "global_step": 315802, "epoch": 3804} {"train_loss": -24.876462936401367, "global_step": 315803, "epoch": 3804} {"train_loss": -25.50129508972168, "global_step": 315804, "epoch": 3804} {"train_loss": -25.950849533081055, "global_step": 315805, "epoch": 3804} {"train_loss": -25.892621994018555, "global_step": 315806, "epoch": 3804} {"train_loss": -25.622251510620117, "global_step": 315807, "epoch": 3804} {"train_loss": -25.86378288269043, "global_step": 315808, "epoch": 3804} {"train_loss": -25.63108253479004, "global_step": 315809, "epoch": 3804} {"train_loss": -26.040258407592773, "global_step": 315810, "epoch": 3804} {"train_loss": -25.6656436920166, "global_step": 315811, "epoch": 3804} {"train_loss": -25.84343910217285, "global_step": 315812, "epoch": 3804} {"train_loss": -25.794937133789062, "global_step": 315813, "epoch": 3804} {"train_loss": -25.636615546352893, "global_step": 315814, "epoch": 3804, "val_loss": 7259798.0} {"train_loss": -24.351255416870117, "global_step": 315815, "epoch": 3805} {"train_loss": -24.960878372192383, "global_step": 315816, "epoch": 3805} {"train_loss": -24.926868438720703, "global_step": 315817, "epoch": 3805} {"train_loss": -24.929487228393555, "global_step": 315818, "epoch": 3805} {"train_loss": -25.47556495666504, "global_step": 315819, "epoch": 3805} {"train_loss": -24.986846923828125, "global_step": 315820, "epoch": 3805} {"train_loss": -25.37027359008789, "global_step": 315821, "epoch": 3805} {"train_loss": -25.331228256225586, "global_step": 315822, "epoch": 3805} {"train_loss": -25.497434616088867, "global_step": 315823, "epoch": 3805} {"train_loss": -25.49375343322754, "global_step": 315824, "epoch": 3805} {"train_loss": -25.311538696289062, "global_step": 315825, "epoch": 3805} {"train_loss": -25.325231552124023, "global_step": 315826, "epoch": 3805} {"train_loss": -25.2470703125, "global_step": 315827, "epoch": 3805} {"train_loss": -25.30047607421875, "global_step": 315828, "epoch": 3805} {"train_loss": -25.609622955322266, "global_step": 315829, "epoch": 3805} {"train_loss": -25.632917404174805, "global_step": 315830, "epoch": 3805} {"train_loss": -25.699609756469727, "global_step": 315831, "epoch": 3805} {"train_loss": -25.570636749267578, "global_step": 315832, "epoch": 3805} {"train_loss": -25.641342163085938, "global_step": 315833, "epoch": 3805} {"train_loss": -25.505895614624023, "global_step": 315834, "epoch": 3805} {"train_loss": -25.739078521728516, "global_step": 315835, "epoch": 3805} {"train_loss": -25.538612365722656, "global_step": 315836, "epoch": 3805} {"train_loss": -25.592021942138672, "global_step": 315837, "epoch": 3805} {"train_loss": -25.603139877319336, "global_step": 315838, "epoch": 3805} {"train_loss": -25.720569610595703, "global_step": 315839, "epoch": 3805} {"train_loss": -25.186023712158203, "global_step": 315840, "epoch": 3805} {"train_loss": -25.704870223999023, "global_step": 315841, "epoch": 3805} {"train_loss": -25.67298698425293, "global_step": 315842, "epoch": 3805} {"train_loss": -25.68817710876465, "global_step": 315843, "epoch": 3805} {"train_loss": -25.57333755493164, "global_step": 315844, "epoch": 3805} {"train_loss": -25.390045166015625, "global_step": 315845, "epoch": 3805} {"train_loss": -25.61323356628418, "global_step": 315846, "epoch": 3805} {"train_loss": -25.80779457092285, "global_step": 315847, "epoch": 3805} {"train_loss": -26.01133155822754, "global_step": 315848, "epoch": 3805} {"train_loss": -25.991138458251953, "global_step": 315849, "epoch": 3805} {"train_loss": -25.367393493652344, "global_step": 315850, "epoch": 3805} {"train_loss": -25.865880966186523, "global_step": 315851, "epoch": 3805} {"train_loss": -25.832447052001953, "global_step": 315852, "epoch": 3805} {"train_loss": -25.6601619720459, "global_step": 315853, "epoch": 3805} {"train_loss": -25.677392959594727, "global_step": 315854, "epoch": 3805} {"train_loss": -26.322248458862305, "global_step": 315855, "epoch": 3805} {"train_loss": -25.5899600982666, "global_step": 315856, "epoch": 3805} {"train_loss": -25.689966201782227, "global_step": 315857, "epoch": 3805} {"train_loss": -26.139144897460938, "global_step": 315858, "epoch": 3805} {"train_loss": -26.077972412109375, "global_step": 315859, "epoch": 3805} {"train_loss": -25.67255210876465, "global_step": 315860, "epoch": 3805} {"train_loss": -25.9130916595459, "global_step": 315861, "epoch": 3805} {"train_loss": -26.0229434967041, "global_step": 315862, "epoch": 3805} {"train_loss": -25.51744270324707, "global_step": 315863, "epoch": 3805} {"train_loss": -25.898523330688477, "global_step": 315864, "epoch": 3805} {"train_loss": -26.270099639892578, "global_step": 315865, "epoch": 3805} {"train_loss": -25.995664596557617, "global_step": 315866, "epoch": 3805} {"train_loss": -25.79048728942871, "global_step": 315867, "epoch": 3805} {"train_loss": -25.81300163269043, "global_step": 315868, "epoch": 3805} {"train_loss": -25.7356014251709, "global_step": 315869, "epoch": 3805} {"train_loss": -26.076740264892578, "global_step": 315870, "epoch": 3805} {"train_loss": -25.769433975219727, "global_step": 315871, "epoch": 3805} {"train_loss": -25.63077163696289, "global_step": 315872, "epoch": 3805} {"train_loss": -25.834012985229492, "global_step": 315873, "epoch": 3805} {"train_loss": -25.829833984375, "global_step": 315874, "epoch": 3805} {"train_loss": -25.91794204711914, "global_step": 315875, "epoch": 3805} {"train_loss": -25.904882431030273, "global_step": 315876, "epoch": 3805} {"train_loss": -25.74750328063965, "global_step": 315877, "epoch": 3805} {"train_loss": -25.86516761779785, "global_step": 315878, "epoch": 3805} {"train_loss": -25.9039249420166, "global_step": 315879, "epoch": 3805} {"train_loss": -25.733640670776367, "global_step": 315880, "epoch": 3805} {"train_loss": -26.015974044799805, "global_step": 315881, "epoch": 3805} {"train_loss": -26.21392822265625, "global_step": 315882, "epoch": 3805} {"train_loss": -25.96477699279785, "global_step": 315883, "epoch": 3805} {"train_loss": -25.7220458984375, "global_step": 315884, "epoch": 3805} {"train_loss": -25.753223419189453, "global_step": 315885, "epoch": 3805} {"train_loss": -25.61187744140625, "global_step": 315886, "epoch": 3805} {"train_loss": -26.18231201171875, "global_step": 315887, "epoch": 3805} {"train_loss": -25.95416831970215, "global_step": 315888, "epoch": 3805} {"train_loss": -25.71880531311035, "global_step": 315889, "epoch": 3805} {"train_loss": -25.736597061157227, "global_step": 315890, "epoch": 3805} {"train_loss": -25.499357223510742, "global_step": 315891, "epoch": 3805} {"train_loss": -25.76194190979004, "global_step": 315892, "epoch": 3805} {"train_loss": -25.6384334564209, "global_step": 315893, "epoch": 3805} {"train_loss": -25.872587203979492, "global_step": 315894, "epoch": 3805} {"train_loss": -25.73801612854004, "global_step": 315895, "epoch": 3805} {"train_loss": -25.962045669555664, "global_step": 315896, "epoch": 3805} {"train_loss": -25.66298098736499, "global_step": 315897, "epoch": 3805, "val_loss": 7201940.5} {"train_loss": -24.766071319580078, "global_step": 315898, "epoch": 3806} {"train_loss": -24.993362426757812, "global_step": 315899, "epoch": 3806} {"train_loss": -24.53437614440918, "global_step": 315900, "epoch": 3806} {"train_loss": -24.872724533081055, "global_step": 315901, "epoch": 3806} {"train_loss": -25.155813217163086, "global_step": 315902, "epoch": 3806} {"train_loss": -24.702627182006836, "global_step": 315903, "epoch": 3806} {"train_loss": -25.41457748413086, "global_step": 315904, "epoch": 3806} {"train_loss": -25.44928550720215, "global_step": 315905, "epoch": 3806} {"train_loss": -25.449995040893555, "global_step": 315906, "epoch": 3806} {"train_loss": -25.187789916992188, "global_step": 315907, "epoch": 3806} {"train_loss": -25.686864852905273, "global_step": 315908, "epoch": 3806} {"train_loss": -25.26675796508789, "global_step": 315909, "epoch": 3806} {"train_loss": -25.267974853515625, "global_step": 315910, "epoch": 3806} {"train_loss": -25.44750213623047, "global_step": 315911, "epoch": 3806} {"train_loss": -25.172330856323242, "global_step": 315912, "epoch": 3806} {"train_loss": -25.21209144592285, "global_step": 315913, "epoch": 3806} {"train_loss": -25.151391983032227, "global_step": 315914, "epoch": 3806} {"train_loss": -25.512882232666016, "global_step": 315915, "epoch": 3806} {"train_loss": -25.706384658813477, "global_step": 315916, "epoch": 3806} {"train_loss": -25.204923629760742, "global_step": 315917, "epoch": 3806} {"train_loss": -25.292089462280273, "global_step": 315918, "epoch": 3806} {"train_loss": -25.7633056640625, "global_step": 315919, "epoch": 3806} {"train_loss": -25.573009490966797, "global_step": 315920, "epoch": 3806} {"train_loss": -25.73150634765625, "global_step": 315921, "epoch": 3806} {"train_loss": -25.2452449798584, "global_step": 315922, "epoch": 3806} {"train_loss": -25.46376609802246, "global_step": 315923, "epoch": 3806} {"train_loss": -25.782697677612305, "global_step": 315924, "epoch": 3806} {"train_loss": -25.593168258666992, "global_step": 315925, "epoch": 3806} {"train_loss": -25.526952743530273, "global_step": 315926, "epoch": 3806} {"train_loss": -25.807641983032227, "global_step": 315927, "epoch": 3806} {"train_loss": -25.69862174987793, "global_step": 315928, "epoch": 3806} {"train_loss": -25.74320411682129, "global_step": 315929, "epoch": 3806} {"train_loss": -25.81007957458496, "global_step": 315930, "epoch": 3806} {"train_loss": -25.54923439025879, "global_step": 315931, "epoch": 3806} {"train_loss": -25.93292236328125, "global_step": 315932, "epoch": 3806} {"train_loss": -25.3287410736084, "global_step": 315933, "epoch": 3806} {"train_loss": -26.15180015563965, "global_step": 315934, "epoch": 3806} {"train_loss": -25.94498634338379, "global_step": 315935, "epoch": 3806} {"train_loss": -25.9316349029541, "global_step": 315936, "epoch": 3806} {"train_loss": -25.744571685791016, "global_step": 315937, "epoch": 3806} {"train_loss": -25.80324363708496, "global_step": 315938, "epoch": 3806} {"train_loss": -25.73472023010254, "global_step": 315939, "epoch": 3806} {"train_loss": -25.80303382873535, "global_step": 315940, "epoch": 3806} {"train_loss": -25.806360244750977, "global_step": 315941, "epoch": 3806} {"train_loss": -25.811664581298828, "global_step": 315942, "epoch": 3806} {"train_loss": -25.93817710876465, "global_step": 315943, "epoch": 3806} {"train_loss": -25.365129470825195, "global_step": 315944, "epoch": 3806} {"train_loss": -25.52796173095703, "global_step": 315945, "epoch": 3806} {"train_loss": -25.9135684967041, "global_step": 315946, "epoch": 3806} {"train_loss": -25.698835372924805, "global_step": 315947, "epoch": 3806} {"train_loss": -25.66932487487793, "global_step": 315948, "epoch": 3806} {"train_loss": -25.784149169921875, "global_step": 315949, "epoch": 3806} {"train_loss": -25.7273006439209, "global_step": 315950, "epoch": 3806} {"train_loss": -25.07655906677246, "global_step": 315951, "epoch": 3806} {"train_loss": -25.575056076049805, "global_step": 315952, "epoch": 3806} {"train_loss": -25.493810653686523, "global_step": 315953, "epoch": 3806} {"train_loss": -25.422021865844727, "global_step": 315954, "epoch": 3806} {"train_loss": -25.510568618774414, "global_step": 315955, "epoch": 3806} {"train_loss": -25.656599044799805, "global_step": 315956, "epoch": 3806} {"train_loss": -25.545961380004883, "global_step": 315957, "epoch": 3806} {"train_loss": -24.854312896728516, "global_step": 315958, "epoch": 3806} {"train_loss": -25.722946166992188, "global_step": 315959, "epoch": 3806} {"train_loss": -25.552061080932617, "global_step": 315960, "epoch": 3806} {"train_loss": -25.222349166870117, "global_step": 315961, "epoch": 3806} {"train_loss": -25.861587524414062, "global_step": 315962, "epoch": 3806} {"train_loss": -25.401775360107422, "global_step": 315963, "epoch": 3806} {"train_loss": -25.682209014892578, "global_step": 315964, "epoch": 3806} {"train_loss": -25.474760055541992, "global_step": 315965, "epoch": 3806} {"train_loss": -25.951385498046875, "global_step": 315966, "epoch": 3806} {"train_loss": -25.778156280517578, "global_step": 315967, "epoch": 3806} {"train_loss": -25.835981369018555, "global_step": 315968, "epoch": 3806} {"train_loss": -25.685338973999023, "global_step": 315969, "epoch": 3806} {"train_loss": -26.028852462768555, "global_step": 315970, "epoch": 3806} {"train_loss": -25.582843780517578, "global_step": 315971, "epoch": 3806} {"train_loss": -25.922338485717773, "global_step": 315972, "epoch": 3806} {"train_loss": -25.592084884643555, "global_step": 315973, "epoch": 3806} {"train_loss": -25.766468048095703, "global_step": 315974, "epoch": 3806} {"train_loss": -25.856897354125977, "global_step": 315975, "epoch": 3806} {"train_loss": -25.684371948242188, "global_step": 315976, "epoch": 3806} {"train_loss": -26.063568115234375, "global_step": 315977, "epoch": 3806} {"train_loss": -25.94856834411621, "global_step": 315978, "epoch": 3806} {"train_loss": -25.259313583374023, "global_step": 315979, "epoch": 3806} {"train_loss": -25.577134580497283, "global_step": 315980, "epoch": 3806, "val_loss": 7372406.0} {"train_loss": -25.277759552001953, "global_step": 315981, "epoch": 3807} {"train_loss": -25.465856552124023, "global_step": 315982, "epoch": 3807} {"train_loss": -25.85297966003418, "global_step": 315983, "epoch": 3807} {"train_loss": -25.0601863861084, "global_step": 315984, "epoch": 3807} {"train_loss": -25.522809982299805, "global_step": 315985, "epoch": 3807} {"train_loss": -25.03767967224121, "global_step": 315986, "epoch": 3807} {"train_loss": -25.59898567199707, "global_step": 315987, "epoch": 3807} {"train_loss": -25.066078186035156, "global_step": 315988, "epoch": 3807} {"train_loss": -25.539459228515625, "global_step": 315989, "epoch": 3807} {"train_loss": -25.357648849487305, "global_step": 315990, "epoch": 3807} {"train_loss": -25.591459274291992, "global_step": 315991, "epoch": 3807} {"train_loss": -25.75602149963379, "global_step": 315992, "epoch": 3807} {"train_loss": -25.412588119506836, "global_step": 315993, "epoch": 3807} {"train_loss": -25.608793258666992, "global_step": 315994, "epoch": 3807} {"train_loss": -25.849761962890625, "global_step": 315995, "epoch": 3807} {"train_loss": -25.5328426361084, "global_step": 315996, "epoch": 3807} {"train_loss": -25.327938079833984, "global_step": 315997, "epoch": 3807} {"train_loss": -25.58937644958496, "global_step": 315998, "epoch": 3807} {"train_loss": -25.746198654174805, "global_step": 315999, "epoch": 3807} {"train_loss": -25.987173080444336, "global_step": 316000, "epoch": 3807} {"train_loss": -25.697589874267578, "global_step": 316001, "epoch": 3807} {"train_loss": -25.676624298095703, "global_step": 316002, "epoch": 3807} {"train_loss": -26.100311279296875, "global_step": 316003, "epoch": 3807} {"train_loss": -26.007888793945312, "global_step": 316004, "epoch": 3807} {"train_loss": -25.90411376953125, "global_step": 316005, "epoch": 3807} {"train_loss": -25.938007354736328, "global_step": 316006, "epoch": 3807} {"train_loss": -25.686716079711914, "global_step": 316007, "epoch": 3807} {"train_loss": -25.6673583984375, "global_step": 316008, "epoch": 3807} {"train_loss": -25.427936553955078, "global_step": 316009, "epoch": 3807} {"train_loss": -26.03667640686035, "global_step": 316010, "epoch": 3807} {"train_loss": -25.705060958862305, "global_step": 316011, "epoch": 3807} {"train_loss": -25.740741729736328, "global_step": 316012, "epoch": 3807} {"train_loss": -25.63302993774414, "global_step": 316013, "epoch": 3807} {"train_loss": -25.99384880065918, "global_step": 316014, "epoch": 3807} {"train_loss": -26.0762882232666, "global_step": 316015, "epoch": 3807} {"train_loss": -25.883142471313477, "global_step": 316016, "epoch": 3807} {"train_loss": -25.794095993041992, "global_step": 316017, "epoch": 3807} {"train_loss": -26.238264083862305, "global_step": 316018, "epoch": 3807} {"train_loss": -25.79046630859375, "global_step": 316019, "epoch": 3807} {"train_loss": -25.900129318237305, "global_step": 316020, "epoch": 3807} {"train_loss": -25.82462501525879, "global_step": 316021, "epoch": 3807} {"train_loss": -26.090341567993164, "global_step": 316022, "epoch": 3807} {"train_loss": -25.57773780822754, "global_step": 316023, "epoch": 3807} {"train_loss": -25.76544189453125, "global_step": 316024, "epoch": 3807} {"train_loss": -26.346357345581055, "global_step": 316025, "epoch": 3807} {"train_loss": -25.636449813842773, "global_step": 316026, "epoch": 3807} {"train_loss": -25.57295036315918, "global_step": 316027, "epoch": 3807} {"train_loss": -25.491939544677734, "global_step": 316028, "epoch": 3807} {"train_loss": -25.86708641052246, "global_step": 316029, "epoch": 3807} {"train_loss": -25.978412628173828, "global_step": 316030, "epoch": 3807} {"train_loss": -25.888824462890625, "global_step": 316031, "epoch": 3807} {"train_loss": -25.785144805908203, "global_step": 316032, "epoch": 3807} {"train_loss": -26.141193389892578, "global_step": 316033, "epoch": 3807} {"train_loss": -26.02241325378418, "global_step": 316034, "epoch": 3807} {"train_loss": -26.018299102783203, "global_step": 316035, "epoch": 3807} {"train_loss": -25.907623291015625, "global_step": 316036, "epoch": 3807} {"train_loss": -25.909971237182617, "global_step": 316037, "epoch": 3807} {"train_loss": -26.1807804107666, "global_step": 316038, "epoch": 3807} {"train_loss": -25.869903564453125, "global_step": 316039, "epoch": 3807} {"train_loss": -25.7285213470459, "global_step": 316040, "epoch": 3807} {"train_loss": -25.900711059570312, "global_step": 316041, "epoch": 3807} {"train_loss": -25.874860763549805, "global_step": 316042, "epoch": 3807} {"train_loss": -25.8421688079834, "global_step": 316043, "epoch": 3807} {"train_loss": -25.945728302001953, "global_step": 316044, "epoch": 3807} {"train_loss": -26.0642032623291, "global_step": 316045, "epoch": 3807} {"train_loss": -25.625146865844727, "global_step": 316046, "epoch": 3807} {"train_loss": -25.750751495361328, "global_step": 316047, "epoch": 3807} {"train_loss": -25.677326202392578, "global_step": 316048, "epoch": 3807} {"train_loss": -26.15015983581543, "global_step": 316049, "epoch": 3807} {"train_loss": -25.817981719970703, "global_step": 316050, "epoch": 3807} {"train_loss": -25.951862335205078, "global_step": 316051, "epoch": 3807} {"train_loss": -25.968103408813477, "global_step": 316052, "epoch": 3807} {"train_loss": -26.1292781829834, "global_step": 316053, "epoch": 3807} {"train_loss": -25.91107749938965, "global_step": 316054, "epoch": 3807} {"train_loss": -25.86794090270996, "global_step": 316055, "epoch": 3807} {"train_loss": -25.97579002380371, "global_step": 316056, "epoch": 3807} {"train_loss": -25.81694984436035, "global_step": 316057, "epoch": 3807} {"train_loss": -25.889331817626953, "global_step": 316058, "epoch": 3807} {"train_loss": -25.50621795654297, "global_step": 316059, "epoch": 3807} {"train_loss": -25.584827423095703, "global_step": 316060, "epoch": 3807} {"train_loss": -25.52756118774414, "global_step": 316061, "epoch": 3807} {"train_loss": -25.535642623901367, "global_step": 316062, "epoch": 3807} {"train_loss": -25.76618667970221, "global_step": 316063, "epoch": 3807, "val_loss": 7322344.0} {"train_loss": -24.491535186767578, "global_step": 316064, "epoch": 3808} {"train_loss": -24.166139602661133, "global_step": 316065, "epoch": 3808} {"train_loss": -25.2003173828125, "global_step": 316066, "epoch": 3808} {"train_loss": -24.526830673217773, "global_step": 316067, "epoch": 3808} {"train_loss": -24.5644588470459, "global_step": 316068, "epoch": 3808} {"train_loss": -25.00817108154297, "global_step": 316069, "epoch": 3808} {"train_loss": -25.20949363708496, "global_step": 316070, "epoch": 3808} {"train_loss": -25.1027774810791, "global_step": 316071, "epoch": 3808} {"train_loss": -25.552213668823242, "global_step": 316072, "epoch": 3808} {"train_loss": -25.23583984375, "global_step": 316073, "epoch": 3808} {"train_loss": -25.406740188598633, "global_step": 316074, "epoch": 3808} {"train_loss": -25.323163986206055, "global_step": 316075, "epoch": 3808} {"train_loss": -25.57765007019043, "global_step": 316076, "epoch": 3808} {"train_loss": -25.6850528717041, "global_step": 316077, "epoch": 3808} {"train_loss": -25.27501678466797, "global_step": 316078, "epoch": 3808} {"train_loss": -25.572187423706055, "global_step": 316079, "epoch": 3808} {"train_loss": -25.438390731811523, "global_step": 316080, "epoch": 3808} {"train_loss": -25.914081573486328, "global_step": 316081, "epoch": 3808} {"train_loss": -25.29527473449707, "global_step": 316082, "epoch": 3808} {"train_loss": -25.6712703704834, "global_step": 316083, "epoch": 3808} {"train_loss": -25.5814208984375, "global_step": 316084, "epoch": 3808} {"train_loss": -25.246000289916992, "global_step": 316085, "epoch": 3808} {"train_loss": -25.52080726623535, "global_step": 316086, "epoch": 3808} {"train_loss": -25.726215362548828, "global_step": 316087, "epoch": 3808} {"train_loss": -25.27039909362793, "global_step": 316088, "epoch": 3808} {"train_loss": -25.958480834960938, "global_step": 316089, "epoch": 3808} {"train_loss": -25.80527687072754, "global_step": 316090, "epoch": 3808} {"train_loss": -25.581985473632812, "global_step": 316091, "epoch": 3808} {"train_loss": -25.56157875061035, "global_step": 316092, "epoch": 3808} {"train_loss": -25.7761173248291, "global_step": 316093, "epoch": 3808} {"train_loss": -25.694299697875977, "global_step": 316094, "epoch": 3808} {"train_loss": -25.767210006713867, "global_step": 316095, "epoch": 3808} {"train_loss": -25.751440048217773, "global_step": 316096, "epoch": 3808} {"train_loss": -25.46775245666504, "global_step": 316097, "epoch": 3808} {"train_loss": -25.902088165283203, "global_step": 316098, "epoch": 3808} {"train_loss": -25.876184463500977, "global_step": 316099, "epoch": 3808} {"train_loss": -25.715673446655273, "global_step": 316100, "epoch": 3808} {"train_loss": -25.63861083984375, "global_step": 316101, "epoch": 3808} {"train_loss": -25.786279678344727, "global_step": 316102, "epoch": 3808} {"train_loss": -25.65488052368164, "global_step": 316103, "epoch": 3808} {"train_loss": -25.84832191467285, "global_step": 316104, "epoch": 3808} {"train_loss": -25.68229103088379, "global_step": 316105, "epoch": 3808} {"train_loss": -25.68893814086914, "global_step": 316106, "epoch": 3808} {"train_loss": -25.928394317626953, "global_step": 316107, "epoch": 3808} {"train_loss": -25.56159210205078, "global_step": 316108, "epoch": 3808} {"train_loss": -25.469039916992188, "global_step": 316109, "epoch": 3808} {"train_loss": -25.608917236328125, "global_step": 316110, "epoch": 3808} {"train_loss": -25.720813751220703, "global_step": 316111, "epoch": 3808} {"train_loss": -25.921527862548828, "global_step": 316112, "epoch": 3808} {"train_loss": -25.51740074157715, "global_step": 316113, "epoch": 3808} {"train_loss": -25.907779693603516, "global_step": 316114, "epoch": 3808} {"train_loss": -25.841642379760742, "global_step": 316115, "epoch": 3808} {"train_loss": -26.015058517456055, "global_step": 316116, "epoch": 3808} {"train_loss": -25.8297176361084, "global_step": 316117, "epoch": 3808} {"train_loss": -25.742156982421875, "global_step": 316118, "epoch": 3808} {"train_loss": -25.68975830078125, "global_step": 316119, "epoch": 3808} {"train_loss": -25.97258949279785, "global_step": 316120, "epoch": 3808} {"train_loss": -26.17291831970215, "global_step": 316121, "epoch": 3808} {"train_loss": -25.826868057250977, "global_step": 316122, "epoch": 3808} {"train_loss": -25.390108108520508, "global_step": 316123, "epoch": 3808} {"train_loss": -25.60068130493164, "global_step": 316124, "epoch": 3808} {"train_loss": -25.984411239624023, "global_step": 316125, "epoch": 3808} {"train_loss": -25.775503158569336, "global_step": 316126, "epoch": 3808} {"train_loss": -25.91341209411621, "global_step": 316127, "epoch": 3808} {"train_loss": -26.058658599853516, "global_step": 316128, "epoch": 3808} {"train_loss": -25.725561141967773, "global_step": 316129, "epoch": 3808} {"train_loss": -26.034442901611328, "global_step": 316130, "epoch": 3808} {"train_loss": -25.9334774017334, "global_step": 316131, "epoch": 3808} {"train_loss": -26.117761611938477, "global_step": 316132, "epoch": 3808} {"train_loss": -25.6859188079834, "global_step": 316133, "epoch": 3808} {"train_loss": -26.220569610595703, "global_step": 316134, "epoch": 3808} {"train_loss": -25.59885025024414, "global_step": 316135, "epoch": 3808} {"train_loss": -25.819061279296875, "global_step": 316136, "epoch": 3808} {"train_loss": -25.718931198120117, "global_step": 316137, "epoch": 3808} {"train_loss": -26.006793975830078, "global_step": 316138, "epoch": 3808} {"train_loss": -26.060382843017578, "global_step": 316139, "epoch": 3808} {"train_loss": -25.493986129760742, "global_step": 316140, "epoch": 3808} {"train_loss": -25.60346794128418, "global_step": 316141, "epoch": 3808} {"train_loss": -25.895740509033203, "global_step": 316142, "epoch": 3808} {"train_loss": -25.875385284423828, "global_step": 316143, "epoch": 3808} {"train_loss": -25.950580596923828, "global_step": 316144, "epoch": 3808} {"train_loss": -26.1423397064209, "global_step": 316145, "epoch": 3808} {"train_loss": -25.621106044355646, "global_step": 316146, "epoch": 3808, "val_loss": 7281763.0} {"train_loss": -24.495502471923828, "global_step": 316147, "epoch": 3809} {"train_loss": -25.395544052124023, "global_step": 316148, "epoch": 3809} {"train_loss": -24.863203048706055, "global_step": 316149, "epoch": 3809} {"train_loss": -24.698596954345703, "global_step": 316150, "epoch": 3809} {"train_loss": -25.044092178344727, "global_step": 316151, "epoch": 3809} {"train_loss": -24.993045806884766, "global_step": 316152, "epoch": 3809} {"train_loss": -25.11042594909668, "global_step": 316153, "epoch": 3809} {"train_loss": -25.501203536987305, "global_step": 316154, "epoch": 3809} {"train_loss": -25.158437728881836, "global_step": 316155, "epoch": 3809} {"train_loss": -25.366941452026367, "global_step": 316156, "epoch": 3809} {"train_loss": -24.976898193359375, "global_step": 316157, "epoch": 3809} {"train_loss": -25.39844512939453, "global_step": 316158, "epoch": 3809} {"train_loss": -25.8890438079834, "global_step": 316159, "epoch": 3809} {"train_loss": -25.299671173095703, "global_step": 316160, "epoch": 3809} {"train_loss": -25.59914207458496, "global_step": 316161, "epoch": 3809} {"train_loss": -25.21112632751465, "global_step": 316162, "epoch": 3809} {"train_loss": -25.559415817260742, "global_step": 316163, "epoch": 3809} {"train_loss": -25.412601470947266, "global_step": 316164, "epoch": 3809} {"train_loss": -25.222623825073242, "global_step": 316165, "epoch": 3809} {"train_loss": -25.23884391784668, "global_step": 316166, "epoch": 3809} {"train_loss": -25.646947860717773, "global_step": 316167, "epoch": 3809} {"train_loss": -25.667932510375977, "global_step": 316168, "epoch": 3809} {"train_loss": -25.957660675048828, "global_step": 316169, "epoch": 3809} {"train_loss": -25.18644142150879, "global_step": 316170, "epoch": 3809} {"train_loss": -25.678955078125, "global_step": 316171, "epoch": 3809} {"train_loss": -25.45686149597168, "global_step": 316172, "epoch": 3809} {"train_loss": -25.9260311126709, "global_step": 316173, "epoch": 3809} {"train_loss": -25.57423210144043, "global_step": 316174, "epoch": 3809} {"train_loss": -25.833465576171875, "global_step": 316175, "epoch": 3809} {"train_loss": -25.891773223876953, "global_step": 316176, "epoch": 3809} {"train_loss": -25.920873641967773, "global_step": 316177, "epoch": 3809} {"train_loss": -25.70516014099121, "global_step": 316178, "epoch": 3809} {"train_loss": -25.743558883666992, "global_step": 316179, "epoch": 3809} {"train_loss": -25.798553466796875, "global_step": 316180, "epoch": 3809} {"train_loss": -25.92755699157715, "global_step": 316181, "epoch": 3809} {"train_loss": -26.07721519470215, "global_step": 316182, "epoch": 3809} {"train_loss": -26.060455322265625, "global_step": 316183, "epoch": 3809} {"train_loss": -25.681325912475586, "global_step": 316184, "epoch": 3809} {"train_loss": -26.03780174255371, "global_step": 316185, "epoch": 3809} {"train_loss": -26.0312442779541, "global_step": 316186, "epoch": 3809} {"train_loss": -26.05791664123535, "global_step": 316187, "epoch": 3809} {"train_loss": -25.88787269592285, "global_step": 316188, "epoch": 3809} {"train_loss": -25.801523208618164, "global_step": 316189, "epoch": 3809} {"train_loss": -25.64306640625, "global_step": 316190, "epoch": 3809} {"train_loss": -25.615686416625977, "global_step": 316191, "epoch": 3809} {"train_loss": -26.0546817779541, "global_step": 316192, "epoch": 3809} {"train_loss": -26.08497428894043, "global_step": 316193, "epoch": 3809} {"train_loss": -25.560951232910156, "global_step": 316194, "epoch": 3809} {"train_loss": -25.42494010925293, "global_step": 316195, "epoch": 3809} {"train_loss": -26.092130661010742, "global_step": 316196, "epoch": 3809} {"train_loss": -25.65799331665039, "global_step": 316197, "epoch": 3809} {"train_loss": -26.1907958984375, "global_step": 316198, "epoch": 3809} {"train_loss": -25.763891220092773, "global_step": 316199, "epoch": 3809} {"train_loss": -25.42313575744629, "global_step": 316200, "epoch": 3809} {"train_loss": -25.361717224121094, "global_step": 316201, "epoch": 3809} {"train_loss": -25.40770721435547, "global_step": 316202, "epoch": 3809} {"train_loss": -25.707380294799805, "global_step": 316203, "epoch": 3809} {"train_loss": -25.996763229370117, "global_step": 316204, "epoch": 3809} {"train_loss": -25.657556533813477, "global_step": 316205, "epoch": 3809} {"train_loss": -25.53092384338379, "global_step": 316206, "epoch": 3809} {"train_loss": -25.785232543945312, "global_step": 316207, "epoch": 3809} {"train_loss": -25.903472900390625, "global_step": 316208, "epoch": 3809} {"train_loss": -25.669279098510742, "global_step": 316209, "epoch": 3809} {"train_loss": -26.02022361755371, "global_step": 316210, "epoch": 3809} {"train_loss": -25.57025909423828, "global_step": 316211, "epoch": 3809} {"train_loss": -25.6904354095459, "global_step": 316212, "epoch": 3809} {"train_loss": -25.793508529663086, "global_step": 316213, "epoch": 3809} {"train_loss": -26.10736656188965, "global_step": 316214, "epoch": 3809} {"train_loss": -25.720478057861328, "global_step": 316215, "epoch": 3809} {"train_loss": -25.810205459594727, "global_step": 316216, "epoch": 3809} {"train_loss": -25.817285537719727, "global_step": 316217, "epoch": 3809} {"train_loss": -25.714929580688477, "global_step": 316218, "epoch": 3809} {"train_loss": -25.536865234375, "global_step": 316219, "epoch": 3809} {"train_loss": -25.759662628173828, "global_step": 316220, "epoch": 3809} {"train_loss": -25.836217880249023, "global_step": 316221, "epoch": 3809} {"train_loss": -25.67807388305664, "global_step": 316222, "epoch": 3809} {"train_loss": -25.9112606048584, "global_step": 316223, "epoch": 3809} {"train_loss": -25.90470314025879, "global_step": 316224, "epoch": 3809} {"train_loss": -26.016584396362305, "global_step": 316225, "epoch": 3809} {"train_loss": -25.81013298034668, "global_step": 316226, "epoch": 3809} {"train_loss": -25.844221115112305, "global_step": 316227, "epoch": 3809} {"train_loss": -25.801488876342773, "global_step": 316228, "epoch": 3809} {"train_loss": -25.634397024131683, "global_step": 316229, "epoch": 3809, "val_loss": 7261100.0} {"train_loss": -24.994836807250977, "global_step": 316230, "epoch": 3810} {"train_loss": -25.39299201965332, "global_step": 316231, "epoch": 3810} {"train_loss": -25.3875789642334, "global_step": 316232, "epoch": 3810} {"train_loss": -25.419395446777344, "global_step": 316233, "epoch": 3810} {"train_loss": -25.420486450195312, "global_step": 316234, "epoch": 3810} {"train_loss": -24.68180274963379, "global_step": 316235, "epoch": 3810} {"train_loss": -25.42461585998535, "global_step": 316236, "epoch": 3810} {"train_loss": -25.35916519165039, "global_step": 316237, "epoch": 3810} {"train_loss": -25.469526290893555, "global_step": 316238, "epoch": 3810} {"train_loss": -25.42513084411621, "global_step": 316239, "epoch": 3810} {"train_loss": -25.86359977722168, "global_step": 316240, "epoch": 3810} {"train_loss": -25.951812744140625, "global_step": 316241, "epoch": 3810} {"train_loss": -25.343894958496094, "global_step": 316242, "epoch": 3810} {"train_loss": -25.52691078186035, "global_step": 316243, "epoch": 3810} {"train_loss": -25.836517333984375, "global_step": 316244, "epoch": 3810} {"train_loss": -25.599782943725586, "global_step": 316245, "epoch": 3810} {"train_loss": -25.84393882751465, "global_step": 316246, "epoch": 3810} {"train_loss": -25.825220108032227, "global_step": 316247, "epoch": 3810} {"train_loss": -25.960500717163086, "global_step": 316248, "epoch": 3810} {"train_loss": -25.80999755859375, "global_step": 316249, "epoch": 3810} {"train_loss": -25.724409103393555, "global_step": 316250, "epoch": 3810} {"train_loss": -26.01505470275879, "global_step": 316251, "epoch": 3810} {"train_loss": -25.519760131835938, "global_step": 316252, "epoch": 3810} {"train_loss": -25.899633407592773, "global_step": 316253, "epoch": 3810} {"train_loss": -25.759984970092773, "global_step": 316254, "epoch": 3810} {"train_loss": -25.59524917602539, "global_step": 316255, "epoch": 3810} {"train_loss": -25.519378662109375, "global_step": 316256, "epoch": 3810} {"train_loss": -25.444692611694336, "global_step": 316257, "epoch": 3810} {"train_loss": -25.6530818939209, "global_step": 316258, "epoch": 3810} {"train_loss": -25.64119529724121, "global_step": 316259, "epoch": 3810} {"train_loss": -25.938159942626953, "global_step": 316260, "epoch": 3810} {"train_loss": -25.993680953979492, "global_step": 316261, "epoch": 3810} {"train_loss": -26.011350631713867, "global_step": 316262, "epoch": 3810} {"train_loss": -25.859180450439453, "global_step": 316263, "epoch": 3810} {"train_loss": -26.0838623046875, "global_step": 316264, "epoch": 3810} {"train_loss": -26.06388282775879, "global_step": 316265, "epoch": 3810} {"train_loss": -25.79315185546875, "global_step": 316266, "epoch": 3810} {"train_loss": -25.788238525390625, "global_step": 316267, "epoch": 3810} {"train_loss": -25.954303741455078, "global_step": 316268, "epoch": 3810} {"train_loss": -26.19636344909668, "global_step": 316269, "epoch": 3810} {"train_loss": -25.706220626831055, "global_step": 316270, "epoch": 3810} {"train_loss": -25.767728805541992, "global_step": 316271, "epoch": 3810} {"train_loss": -25.885639190673828, "global_step": 316272, "epoch": 3810} {"train_loss": -25.657880783081055, "global_step": 316273, "epoch": 3810} {"train_loss": -25.755231857299805, "global_step": 316274, "epoch": 3810} {"train_loss": -25.776647567749023, "global_step": 316275, "epoch": 3810} {"train_loss": -25.979063034057617, "global_step": 316276, "epoch": 3810} {"train_loss": -25.679853439331055, "global_step": 316277, "epoch": 3810} {"train_loss": -25.974348068237305, "global_step": 316278, "epoch": 3810} {"train_loss": -25.940185546875, "global_step": 316279, "epoch": 3810} {"train_loss": -25.5887451171875, "global_step": 316280, "epoch": 3810} {"train_loss": -25.61850929260254, "global_step": 316281, "epoch": 3810} {"train_loss": -25.63972282409668, "global_step": 316282, "epoch": 3810} {"train_loss": -25.64369010925293, "global_step": 316283, "epoch": 3810} {"train_loss": -25.74653434753418, "global_step": 316284, "epoch": 3810} {"train_loss": -25.961706161499023, "global_step": 316285, "epoch": 3810} {"train_loss": -25.889713287353516, "global_step": 316286, "epoch": 3810} {"train_loss": -25.976654052734375, "global_step": 316287, "epoch": 3810} {"train_loss": -26.097471237182617, "global_step": 316288, "epoch": 3810} {"train_loss": -26.120542526245117, "global_step": 316289, "epoch": 3810} {"train_loss": -26.038604736328125, "global_step": 316290, "epoch": 3810} {"train_loss": -26.126331329345703, "global_step": 316291, "epoch": 3810} {"train_loss": -26.16733741760254, "global_step": 316292, "epoch": 3810} {"train_loss": -25.95417594909668, "global_step": 316293, "epoch": 3810} {"train_loss": -25.983509063720703, "global_step": 316294, "epoch": 3810} {"train_loss": -25.891448974609375, "global_step": 316295, "epoch": 3810} {"train_loss": -26.139362335205078, "global_step": 316296, "epoch": 3810} {"train_loss": -25.738439559936523, "global_step": 316297, "epoch": 3810} {"train_loss": -25.81158447265625, "global_step": 316298, "epoch": 3810} {"train_loss": -25.93317222595215, "global_step": 316299, "epoch": 3810} {"train_loss": -25.68975830078125, "global_step": 316300, "epoch": 3810} {"train_loss": -26.166982650756836, "global_step": 316301, "epoch": 3810} {"train_loss": -25.89361572265625, "global_step": 316302, "epoch": 3810} {"train_loss": -25.90805435180664, "global_step": 316303, "epoch": 3810} {"train_loss": -25.809057235717773, "global_step": 316304, "epoch": 3810} {"train_loss": -26.303314208984375, "global_step": 316305, "epoch": 3810} {"train_loss": -26.12570571899414, "global_step": 316306, "epoch": 3810} {"train_loss": -25.676939010620117, "global_step": 316307, "epoch": 3810} {"train_loss": -25.812671661376953, "global_step": 316308, "epoch": 3810} {"train_loss": -25.88543128967285, "global_step": 316309, "epoch": 3810} {"train_loss": -25.910266876220703, "global_step": 316310, "epoch": 3810} {"train_loss": -25.83286476135254, "global_step": 316311, "epoch": 3810} {"train_loss": -25.77516962533974, "global_step": 316312, "epoch": 3810, "val_loss": 7231012.0} {"train_loss": -24.52675437927246, "global_step": 316313, "epoch": 3811} {"train_loss": -23.493452072143555, "global_step": 316314, "epoch": 3811} {"train_loss": -24.77889060974121, "global_step": 316315, "epoch": 3811} {"train_loss": -24.249479293823242, "global_step": 316316, "epoch": 3811} {"train_loss": -24.383634567260742, "global_step": 316317, "epoch": 3811} {"train_loss": -24.587900161743164, "global_step": 316318, "epoch": 3811} {"train_loss": -24.940032958984375, "global_step": 316319, "epoch": 3811} {"train_loss": -24.9129638671875, "global_step": 316320, "epoch": 3811} {"train_loss": -24.690027236938477, "global_step": 316321, "epoch": 3811} {"train_loss": -24.58103370666504, "global_step": 316322, "epoch": 3811} {"train_loss": -25.011138916015625, "global_step": 316323, "epoch": 3811} {"train_loss": -24.99942970275879, "global_step": 316324, "epoch": 3811} {"train_loss": -24.8758544921875, "global_step": 316325, "epoch": 3811} {"train_loss": -25.160898208618164, "global_step": 316326, "epoch": 3811} {"train_loss": -25.392425537109375, "global_step": 316327, "epoch": 3811} {"train_loss": -25.336877822875977, "global_step": 316328, "epoch": 3811} {"train_loss": -25.278736114501953, "global_step": 316329, "epoch": 3811} {"train_loss": -25.206205368041992, "global_step": 316330, "epoch": 3811} {"train_loss": -25.26544761657715, "global_step": 316331, "epoch": 3811} {"train_loss": -25.2315673828125, "global_step": 316332, "epoch": 3811} {"train_loss": -25.19342041015625, "global_step": 316333, "epoch": 3811} {"train_loss": -25.750699996948242, "global_step": 316334, "epoch": 3811} {"train_loss": -25.46795082092285, "global_step": 316335, "epoch": 3811} {"train_loss": -25.309545516967773, "global_step": 316336, "epoch": 3811} {"train_loss": -25.484149932861328, "global_step": 316337, "epoch": 3811} {"train_loss": -25.711423873901367, "global_step": 316338, "epoch": 3811} {"train_loss": -25.791711807250977, "global_step": 316339, "epoch": 3811} {"train_loss": -25.317840576171875, "global_step": 316340, "epoch": 3811} {"train_loss": -25.364866256713867, "global_step": 316341, "epoch": 3811} {"train_loss": -25.957101821899414, "global_step": 316342, "epoch": 3811} {"train_loss": -25.65921401977539, "global_step": 316343, "epoch": 3811} {"train_loss": -25.726110458374023, "global_step": 316344, "epoch": 3811} {"train_loss": -25.7308349609375, "global_step": 316345, "epoch": 3811} {"train_loss": -25.739484786987305, "global_step": 316346, "epoch": 3811} {"train_loss": -26.053150177001953, "global_step": 316347, "epoch": 3811} {"train_loss": -25.451459884643555, "global_step": 316348, "epoch": 3811} {"train_loss": -25.589031219482422, "global_step": 316349, "epoch": 3811} {"train_loss": -26.0233211517334, "global_step": 316350, "epoch": 3811} {"train_loss": -25.893110275268555, "global_step": 316351, "epoch": 3811} {"train_loss": -25.65865135192871, "global_step": 316352, "epoch": 3811} {"train_loss": -25.728302001953125, "global_step": 316353, "epoch": 3811} {"train_loss": -25.641759872436523, "global_step": 316354, "epoch": 3811} {"train_loss": -25.680328369140625, "global_step": 316355, "epoch": 3811} {"train_loss": -25.939483642578125, "global_step": 316356, "epoch": 3811} {"train_loss": -26.03435707092285, "global_step": 316357, "epoch": 3811} {"train_loss": -25.547025680541992, "global_step": 316358, "epoch": 3811} {"train_loss": -26.059925079345703, "global_step": 316359, "epoch": 3811} {"train_loss": -26.146472930908203, "global_step": 316360, "epoch": 3811} {"train_loss": -25.93548011779785, "global_step": 316361, "epoch": 3811} {"train_loss": -25.848663330078125, "global_step": 316362, "epoch": 3811} {"train_loss": -26.02357292175293, "global_step": 316363, "epoch": 3811} {"train_loss": -25.772336959838867, "global_step": 316364, "epoch": 3811} {"train_loss": -25.69227409362793, "global_step": 316365, "epoch": 3811} {"train_loss": -26.052228927612305, "global_step": 316366, "epoch": 3811} {"train_loss": -25.569578170776367, "global_step": 316367, "epoch": 3811} {"train_loss": -26.323415756225586, "global_step": 316368, "epoch": 3811} {"train_loss": -25.99481773376465, "global_step": 316369, "epoch": 3811} {"train_loss": -26.14407730102539, "global_step": 316370, "epoch": 3811} {"train_loss": -25.592756271362305, "global_step": 316371, "epoch": 3811} {"train_loss": -26.307844161987305, "global_step": 316372, "epoch": 3811} {"train_loss": -26.14539909362793, "global_step": 316373, "epoch": 3811} {"train_loss": -25.9136905670166, "global_step": 316374, "epoch": 3811} {"train_loss": -25.874460220336914, "global_step": 316375, "epoch": 3811} {"train_loss": -25.476430892944336, "global_step": 316376, "epoch": 3811} {"train_loss": -25.94783592224121, "global_step": 316377, "epoch": 3811} {"train_loss": -25.723669052124023, "global_step": 316378, "epoch": 3811} {"train_loss": -25.830907821655273, "global_step": 316379, "epoch": 3811} {"train_loss": -25.970935821533203, "global_step": 316380, "epoch": 3811} {"train_loss": -26.230335235595703, "global_step": 316381, "epoch": 3811} {"train_loss": -25.824539184570312, "global_step": 316382, "epoch": 3811} {"train_loss": -25.937305450439453, "global_step": 316383, "epoch": 3811} {"train_loss": -25.73065757751465, "global_step": 316384, "epoch": 3811} {"train_loss": -25.918262481689453, "global_step": 316385, "epoch": 3811} {"train_loss": -25.408782958984375, "global_step": 316386, "epoch": 3811} {"train_loss": -25.870752334594727, "global_step": 316387, "epoch": 3811} {"train_loss": -25.87978172302246, "global_step": 316388, "epoch": 3811} {"train_loss": -25.53139305114746, "global_step": 316389, "epoch": 3811} {"train_loss": -25.725982666015625, "global_step": 316390, "epoch": 3811} {"train_loss": -25.896732330322266, "global_step": 316391, "epoch": 3811} {"train_loss": -25.409469604492188, "global_step": 316392, "epoch": 3811} {"train_loss": -25.737491607666016, "global_step": 316393, "epoch": 3811} {"train_loss": -25.570951461791992, "global_step": 316394, "epoch": 3811} {"train_loss": -25.550099016672156, "global_step": 316395, "epoch": 3811, "val_loss": 7290013.0} {"train_loss": -25.366601943969727, "global_step": 316396, "epoch": 3812} {"train_loss": -25.721515655517578, "global_step": 316397, "epoch": 3812} {"train_loss": -25.584455490112305, "global_step": 316398, "epoch": 3812} {"train_loss": -25.553348541259766, "global_step": 316399, "epoch": 3812} {"train_loss": -26.2536678314209, "global_step": 316400, "epoch": 3812} {"train_loss": -25.25739288330078, "global_step": 316401, "epoch": 3812} {"train_loss": -25.476436614990234, "global_step": 316402, "epoch": 3812} {"train_loss": -25.798688888549805, "global_step": 316403, "epoch": 3812} {"train_loss": -25.311344146728516, "global_step": 316404, "epoch": 3812} {"train_loss": -25.59906768798828, "global_step": 316405, "epoch": 3812} {"train_loss": -25.300180435180664, "global_step": 316406, "epoch": 3812} {"train_loss": -25.890180587768555, "global_step": 316407, "epoch": 3812} {"train_loss": -25.400253295898438, "global_step": 316408, "epoch": 3812} {"train_loss": -25.40107536315918, "global_step": 316409, "epoch": 3812} {"train_loss": -25.95293617248535, "global_step": 316410, "epoch": 3812} {"train_loss": -25.52018165588379, "global_step": 316411, "epoch": 3812} {"train_loss": -25.50178337097168, "global_step": 316412, "epoch": 3812} {"train_loss": -25.47466278076172, "global_step": 316413, "epoch": 3812} {"train_loss": -25.33058738708496, "global_step": 316414, "epoch": 3812} {"train_loss": -25.942062377929688, "global_step": 316415, "epoch": 3812} {"train_loss": -25.755615234375, "global_step": 316416, "epoch": 3812} {"train_loss": -25.615570068359375, "global_step": 316417, "epoch": 3812} {"train_loss": -25.62747573852539, "global_step": 316418, "epoch": 3812} {"train_loss": -25.58599281311035, "global_step": 316419, "epoch": 3812} {"train_loss": -25.540040969848633, "global_step": 316420, "epoch": 3812} {"train_loss": -25.878406524658203, "global_step": 316421, "epoch": 3812} {"train_loss": -25.939361572265625, "global_step": 316422, "epoch": 3812} {"train_loss": -25.806720733642578, "global_step": 316423, "epoch": 3812} {"train_loss": -25.827716827392578, "global_step": 316424, "epoch": 3812} {"train_loss": -26.07283592224121, "global_step": 316425, "epoch": 3812} {"train_loss": -25.780567169189453, "global_step": 316426, "epoch": 3812} {"train_loss": -25.949447631835938, "global_step": 316427, "epoch": 3812} {"train_loss": -25.812671661376953, "global_step": 316428, "epoch": 3812} {"train_loss": -26.331968307495117, "global_step": 316429, "epoch": 3812} {"train_loss": -25.6796817779541, "global_step": 316430, "epoch": 3812} {"train_loss": -26.282800674438477, "global_step": 316431, "epoch": 3812} {"train_loss": -25.873748779296875, "global_step": 316432, "epoch": 3812} {"train_loss": -25.91596031188965, "global_step": 316433, "epoch": 3812} {"train_loss": -25.900217056274414, "global_step": 316434, "epoch": 3812} {"train_loss": -25.7231388092041, "global_step": 316435, "epoch": 3812} {"train_loss": -25.623682022094727, "global_step": 316436, "epoch": 3812} {"train_loss": -25.882522583007812, "global_step": 316437, "epoch": 3812} {"train_loss": -26.056074142456055, "global_step": 316438, "epoch": 3812} {"train_loss": -25.8743896484375, "global_step": 316439, "epoch": 3812} {"train_loss": -25.404409408569336, "global_step": 316440, "epoch": 3812} {"train_loss": -25.84443473815918, "global_step": 316441, "epoch": 3812} {"train_loss": -25.742401123046875, "global_step": 316442, "epoch": 3812} {"train_loss": -25.98862075805664, "global_step": 316443, "epoch": 3812} {"train_loss": -25.762378692626953, "global_step": 316444, "epoch": 3812} {"train_loss": -25.69733238220215, "global_step": 316445, "epoch": 3812} {"train_loss": -25.901227951049805, "global_step": 316446, "epoch": 3812} {"train_loss": -25.95208740234375, "global_step": 316447, "epoch": 3812} {"train_loss": -25.85527992248535, "global_step": 316448, "epoch": 3812} {"train_loss": -25.46748161315918, "global_step": 316449, "epoch": 3812} {"train_loss": -25.7880916595459, "global_step": 316450, "epoch": 3812} {"train_loss": -25.791730880737305, "global_step": 316451, "epoch": 3812} {"train_loss": -25.9493465423584, "global_step": 316452, "epoch": 3812} {"train_loss": -25.871442794799805, "global_step": 316453, "epoch": 3812} {"train_loss": -25.679264068603516, "global_step": 316454, "epoch": 3812} {"train_loss": -25.6104793548584, "global_step": 316455, "epoch": 3812} {"train_loss": -25.942243576049805, "global_step": 316456, "epoch": 3812} {"train_loss": -25.651838302612305, "global_step": 316457, "epoch": 3812} {"train_loss": -25.81293296813965, "global_step": 316458, "epoch": 3812} {"train_loss": -25.522573471069336, "global_step": 316459, "epoch": 3812} {"train_loss": -25.822607040405273, "global_step": 316460, "epoch": 3812} {"train_loss": -25.65138053894043, "global_step": 316461, "epoch": 3812} {"train_loss": -25.990345001220703, "global_step": 316462, "epoch": 3812} {"train_loss": -25.57331085205078, "global_step": 316463, "epoch": 3812} {"train_loss": -26.047119140625, "global_step": 316464, "epoch": 3812} {"train_loss": -26.03107261657715, "global_step": 316465, "epoch": 3812} {"train_loss": -25.670148849487305, "global_step": 316466, "epoch": 3812} {"train_loss": -25.562570571899414, "global_step": 316467, "epoch": 3812} {"train_loss": -25.611902236938477, "global_step": 316468, "epoch": 3812} {"train_loss": -25.474885940551758, "global_step": 316469, "epoch": 3812} {"train_loss": -25.8250675201416, "global_step": 316470, "epoch": 3812} {"train_loss": -26.057947158813477, "global_step": 316471, "epoch": 3812} {"train_loss": -25.831281661987305, "global_step": 316472, "epoch": 3812} {"train_loss": -25.891895294189453, "global_step": 316473, "epoch": 3812} {"train_loss": -25.7205867767334, "global_step": 316474, "epoch": 3812} {"train_loss": -26.10957145690918, "global_step": 316475, "epoch": 3812} {"train_loss": -25.776111602783203, "global_step": 316476, "epoch": 3812} {"train_loss": -25.650043487548828, "global_step": 316477, "epoch": 3812} {"train_loss": -25.715453159378235, "global_step": 316478, "epoch": 3812, "val_loss": 7187835.0} {"train_loss": -25.575773239135742, "global_step": 316479, "epoch": 3813} {"train_loss": -25.729887008666992, "global_step": 316480, "epoch": 3813} {"train_loss": -25.290767669677734, "global_step": 316481, "epoch": 3813} {"train_loss": -25.411935806274414, "global_step": 316482, "epoch": 3813} {"train_loss": -25.85837173461914, "global_step": 316483, "epoch": 3813} {"train_loss": -25.839502334594727, "global_step": 316484, "epoch": 3813} {"train_loss": -25.380542755126953, "global_step": 316485, "epoch": 3813} {"train_loss": -25.922483444213867, "global_step": 316486, "epoch": 3813} {"train_loss": -25.491384506225586, "global_step": 316487, "epoch": 3813} {"train_loss": -26.040424346923828, "global_step": 316488, "epoch": 3813} {"train_loss": -25.7767391204834, "global_step": 316489, "epoch": 3813} {"train_loss": -26.35694694519043, "global_step": 316490, "epoch": 3813} {"train_loss": -25.773061752319336, "global_step": 316491, "epoch": 3813} {"train_loss": -25.82145118713379, "global_step": 316492, "epoch": 3813} {"train_loss": -25.97597312927246, "global_step": 316493, "epoch": 3813} {"train_loss": -26.217060089111328, "global_step": 316494, "epoch": 3813} {"train_loss": -25.50996971130371, "global_step": 316495, "epoch": 3813} {"train_loss": -25.46381187438965, "global_step": 316496, "epoch": 3813} {"train_loss": -25.651611328125, "global_step": 316497, "epoch": 3813} {"train_loss": -25.449325561523438, "global_step": 316498, "epoch": 3813} {"train_loss": -25.143325805664062, "global_step": 316499, "epoch": 3813} {"train_loss": -25.269372940063477, "global_step": 316500, "epoch": 3813} {"train_loss": -25.692453384399414, "global_step": 316501, "epoch": 3813} {"train_loss": -26.128747940063477, "global_step": 316502, "epoch": 3813} {"train_loss": -25.552221298217773, "global_step": 316503, "epoch": 3813} {"train_loss": -25.389074325561523, "global_step": 316504, "epoch": 3813} {"train_loss": -25.432451248168945, "global_step": 316505, "epoch": 3813} {"train_loss": -25.708526611328125, "global_step": 316506, "epoch": 3813} {"train_loss": -25.85719871520996, "global_step": 316507, "epoch": 3813} {"train_loss": -25.66652488708496, "global_step": 316508, "epoch": 3813} {"train_loss": -26.087438583374023, "global_step": 316509, "epoch": 3813} {"train_loss": -26.239013671875, "global_step": 316510, "epoch": 3813} {"train_loss": -25.43623161315918, "global_step": 316511, "epoch": 3813} {"train_loss": -25.85573387145996, "global_step": 316512, "epoch": 3813} {"train_loss": -25.60793113708496, "global_step": 316513, "epoch": 3813} {"train_loss": -26.119144439697266, "global_step": 316514, "epoch": 3813} {"train_loss": -25.426427841186523, "global_step": 316515, "epoch": 3813} {"train_loss": -26.03394889831543, "global_step": 316516, "epoch": 3813} {"train_loss": -25.714651107788086, "global_step": 316517, "epoch": 3813} {"train_loss": -26.123523712158203, "global_step": 316518, "epoch": 3813} {"train_loss": -25.79242515563965, "global_step": 316519, "epoch": 3813} {"train_loss": -25.76372718811035, "global_step": 316520, "epoch": 3813} {"train_loss": -26.106725692749023, "global_step": 316521, "epoch": 3813} {"train_loss": -25.85029411315918, "global_step": 316522, "epoch": 3813} {"train_loss": -25.938526153564453, "global_step": 316523, "epoch": 3813} {"train_loss": -26.136728286743164, "global_step": 316524, "epoch": 3813} {"train_loss": -25.70562744140625, "global_step": 316525, "epoch": 3813} {"train_loss": -25.852893829345703, "global_step": 316526, "epoch": 3813} {"train_loss": -26.18829917907715, "global_step": 316527, "epoch": 3813} {"train_loss": -25.519460678100586, "global_step": 316528, "epoch": 3813} {"train_loss": -25.421756744384766, "global_step": 316529, "epoch": 3813} {"train_loss": -25.90885353088379, "global_step": 316530, "epoch": 3813} {"train_loss": -26.389911651611328, "global_step": 316531, "epoch": 3813} {"train_loss": -25.867782592773438, "global_step": 316532, "epoch": 3813} {"train_loss": -25.814416885375977, "global_step": 316533, "epoch": 3813} {"train_loss": -26.31280517578125, "global_step": 316534, "epoch": 3813} {"train_loss": -26.003931045532227, "global_step": 316535, "epoch": 3813} {"train_loss": -26.047632217407227, "global_step": 316536, "epoch": 3813} {"train_loss": -25.812103271484375, "global_step": 316537, "epoch": 3813} {"train_loss": -25.719694137573242, "global_step": 316538, "epoch": 3813} {"train_loss": -25.5690975189209, "global_step": 316539, "epoch": 3813} {"train_loss": -25.990951538085938, "global_step": 316540, "epoch": 3813} {"train_loss": -25.848520278930664, "global_step": 316541, "epoch": 3813} {"train_loss": -25.74188232421875, "global_step": 316542, "epoch": 3813} {"train_loss": -25.648481369018555, "global_step": 316543, "epoch": 3813} {"train_loss": -26.171300888061523, "global_step": 316544, "epoch": 3813} {"train_loss": -25.79083251953125, "global_step": 316545, "epoch": 3813} {"train_loss": -25.77861976623535, "global_step": 316546, "epoch": 3813} {"train_loss": -25.972341537475586, "global_step": 316547, "epoch": 3813} {"train_loss": -25.86037254333496, "global_step": 316548, "epoch": 3813} {"train_loss": -25.761993408203125, "global_step": 316549, "epoch": 3813} {"train_loss": -26.015289306640625, "global_step": 316550, "epoch": 3813} {"train_loss": -25.490272521972656, "global_step": 316551, "epoch": 3813} {"train_loss": -25.832962036132812, "global_step": 316552, "epoch": 3813} {"train_loss": -25.421985626220703, "global_step": 316553, "epoch": 3813} {"train_loss": -25.49817657470703, "global_step": 316554, "epoch": 3813} {"train_loss": -25.73824119567871, "global_step": 316555, "epoch": 3813} {"train_loss": -25.344785690307617, "global_step": 316556, "epoch": 3813} {"train_loss": -25.66510009765625, "global_step": 316557, "epoch": 3813} {"train_loss": -25.68522071838379, "global_step": 316558, "epoch": 3813} {"train_loss": -25.504316329956055, "global_step": 316559, "epoch": 3813} {"train_loss": -25.786924362182617, "global_step": 316560, "epoch": 3813} {"train_loss": -25.772769904998412, "global_step": 316561, "epoch": 3813, "val_loss": 7302469.0} {"train_loss": -25.087299346923828, "global_step": 316562, "epoch": 3814} {"train_loss": -25.13669204711914, "global_step": 316563, "epoch": 3814} {"train_loss": -25.051939010620117, "global_step": 316564, "epoch": 3814} {"train_loss": -25.119123458862305, "global_step": 316565, "epoch": 3814} {"train_loss": -25.318906784057617, "global_step": 316566, "epoch": 3814} {"train_loss": -25.10962677001953, "global_step": 316567, "epoch": 3814} {"train_loss": -25.077613830566406, "global_step": 316568, "epoch": 3814} {"train_loss": -25.128498077392578, "global_step": 316569, "epoch": 3814} {"train_loss": -25.656436920166016, "global_step": 316570, "epoch": 3814} {"train_loss": -25.580387115478516, "global_step": 316571, "epoch": 3814} {"train_loss": -25.699817657470703, "global_step": 316572, "epoch": 3814} {"train_loss": -25.187536239624023, "global_step": 316573, "epoch": 3814} {"train_loss": -25.194812774658203, "global_step": 316574, "epoch": 3814} {"train_loss": -25.470911026000977, "global_step": 316575, "epoch": 3814} {"train_loss": -25.081552505493164, "global_step": 316576, "epoch": 3814} {"train_loss": -24.99032211303711, "global_step": 316577, "epoch": 3814} {"train_loss": -25.590818405151367, "global_step": 316578, "epoch": 3814} {"train_loss": -25.61494255065918, "global_step": 316579, "epoch": 3814} {"train_loss": -25.331783294677734, "global_step": 316580, "epoch": 3814} {"train_loss": -25.8021240234375, "global_step": 316581, "epoch": 3814} {"train_loss": -25.750532150268555, "global_step": 316582, "epoch": 3814} {"train_loss": -25.615894317626953, "global_step": 316583, "epoch": 3814} {"train_loss": -25.468122482299805, "global_step": 316584, "epoch": 3814} {"train_loss": -26.018634796142578, "global_step": 316585, "epoch": 3814} {"train_loss": -25.82999038696289, "global_step": 316586, "epoch": 3814} {"train_loss": -26.07122802734375, "global_step": 316587, "epoch": 3814} {"train_loss": -25.790714263916016, "global_step": 316588, "epoch": 3814} {"train_loss": -25.651620864868164, "global_step": 316589, "epoch": 3814} {"train_loss": -26.300052642822266, "global_step": 316590, "epoch": 3814} {"train_loss": -25.93304443359375, "global_step": 316591, "epoch": 3814} {"train_loss": -26.07354736328125, "global_step": 316592, "epoch": 3814} {"train_loss": -25.54532241821289, "global_step": 316593, "epoch": 3814} {"train_loss": -25.854162216186523, "global_step": 316594, "epoch": 3814} {"train_loss": -26.052978515625, "global_step": 316595, "epoch": 3814} {"train_loss": -25.785810470581055, "global_step": 316596, "epoch": 3814} {"train_loss": -25.899612426757812, "global_step": 316597, "epoch": 3814} {"train_loss": -25.814844131469727, "global_step": 316598, "epoch": 3814} {"train_loss": -25.984893798828125, "global_step": 316599, "epoch": 3814} {"train_loss": -26.12406349182129, "global_step": 316600, "epoch": 3814} {"train_loss": -26.27857780456543, "global_step": 316601, "epoch": 3814} {"train_loss": -25.836034774780273, "global_step": 316602, "epoch": 3814} {"train_loss": -25.538360595703125, "global_step": 316603, "epoch": 3814} {"train_loss": -25.682790756225586, "global_step": 316604, "epoch": 3814} {"train_loss": -25.78008460998535, "global_step": 316605, "epoch": 3814} {"train_loss": -26.10474967956543, "global_step": 316606, "epoch": 3814} {"train_loss": -25.700668334960938, "global_step": 316607, "epoch": 3814} {"train_loss": -25.36798095703125, "global_step": 316608, "epoch": 3814} {"train_loss": -25.5323543548584, "global_step": 316609, "epoch": 3814} {"train_loss": -25.854177474975586, "global_step": 316610, "epoch": 3814} {"train_loss": -25.7098388671875, "global_step": 316611, "epoch": 3814} {"train_loss": -25.78720474243164, "global_step": 316612, "epoch": 3814} {"train_loss": -25.561920166015625, "global_step": 316613, "epoch": 3814} {"train_loss": -25.619977951049805, "global_step": 316614, "epoch": 3814} {"train_loss": -25.8085880279541, "global_step": 316615, "epoch": 3814} {"train_loss": -25.5018310546875, "global_step": 316616, "epoch": 3814} {"train_loss": -26.17913246154785, "global_step": 316617, "epoch": 3814} {"train_loss": -25.555665969848633, "global_step": 316618, "epoch": 3814} {"train_loss": -25.636459350585938, "global_step": 316619, "epoch": 3814} {"train_loss": -25.95509147644043, "global_step": 316620, "epoch": 3814} {"train_loss": -26.134702682495117, "global_step": 316621, "epoch": 3814} {"train_loss": -25.749608993530273, "global_step": 316622, "epoch": 3814} {"train_loss": -25.987613677978516, "global_step": 316623, "epoch": 3814} {"train_loss": -25.804794311523438, "global_step": 316624, "epoch": 3814} {"train_loss": -25.685094833374023, "global_step": 316625, "epoch": 3814} {"train_loss": -25.748327255249023, "global_step": 316626, "epoch": 3814} {"train_loss": -25.745899200439453, "global_step": 316627, "epoch": 3814} {"train_loss": -26.145788192749023, "global_step": 316628, "epoch": 3814} {"train_loss": -26.365659713745117, "global_step": 316629, "epoch": 3814} {"train_loss": -25.78652000427246, "global_step": 316630, "epoch": 3814} {"train_loss": -26.074115753173828, "global_step": 316631, "epoch": 3814} {"train_loss": -26.100849151611328, "global_step": 316632, "epoch": 3814} {"train_loss": -26.063806533813477, "global_step": 316633, "epoch": 3814} {"train_loss": -25.52989959716797, "global_step": 316634, "epoch": 3814} {"train_loss": -25.94159507751465, "global_step": 316635, "epoch": 3814} {"train_loss": -26.038599014282227, "global_step": 316636, "epoch": 3814} {"train_loss": -25.811010360717773, "global_step": 316637, "epoch": 3814} {"train_loss": -25.936172485351562, "global_step": 316638, "epoch": 3814} {"train_loss": -26.121063232421875, "global_step": 316639, "epoch": 3814} {"train_loss": -25.757551193237305, "global_step": 316640, "epoch": 3814} {"train_loss": -26.046979904174805, "global_step": 316641, "epoch": 3814} {"train_loss": -25.757322311401367, "global_step": 316642, "epoch": 3814} {"train_loss": -26.054697036743164, "global_step": 316643, "epoch": 3814} {"train_loss": -25.73283976819142, "global_step": 316644, "epoch": 3814, "val_loss": 7304228.0} {"train_loss": -25.44064712524414, "global_step": 316645, "epoch": 3815} {"train_loss": -24.450597763061523, "global_step": 316646, "epoch": 3815} {"train_loss": -24.881080627441406, "global_step": 316647, "epoch": 3815} {"train_loss": -24.799978256225586, "global_step": 316648, "epoch": 3815} {"train_loss": -24.478225708007812, "global_step": 316649, "epoch": 3815} {"train_loss": -24.824237823486328, "global_step": 316650, "epoch": 3815} {"train_loss": -25.133657455444336, "global_step": 316651, "epoch": 3815} {"train_loss": -25.33854866027832, "global_step": 316652, "epoch": 3815} {"train_loss": -24.851354598999023, "global_step": 316653, "epoch": 3815} {"train_loss": -25.323436737060547, "global_step": 316654, "epoch": 3815} {"train_loss": -25.434833526611328, "global_step": 316655, "epoch": 3815} {"train_loss": -25.23438835144043, "global_step": 316656, "epoch": 3815} {"train_loss": -25.556324005126953, "global_step": 316657, "epoch": 3815} {"train_loss": -25.574604034423828, "global_step": 316658, "epoch": 3815} {"train_loss": -25.613439559936523, "global_step": 316659, "epoch": 3815} {"train_loss": -25.531949996948242, "global_step": 316660, "epoch": 3815} {"train_loss": -25.309864044189453, "global_step": 316661, "epoch": 3815} {"train_loss": -25.655012130737305, "global_step": 316662, "epoch": 3815} {"train_loss": -25.54534339904785, "global_step": 316663, "epoch": 3815} {"train_loss": -25.684873580932617, "global_step": 316664, "epoch": 3815} {"train_loss": -25.35268211364746, "global_step": 316665, "epoch": 3815} {"train_loss": -25.4951229095459, "global_step": 316666, "epoch": 3815} {"train_loss": -25.71467399597168, "global_step": 316667, "epoch": 3815} {"train_loss": -25.549535751342773, "global_step": 316668, "epoch": 3815} {"train_loss": -25.615402221679688, "global_step": 316669, "epoch": 3815} {"train_loss": -25.9962215423584, "global_step": 316670, "epoch": 3815} {"train_loss": -25.69769859313965, "global_step": 316671, "epoch": 3815} {"train_loss": -25.862777709960938, "global_step": 316672, "epoch": 3815} {"train_loss": -25.752517700195312, "global_step": 316673, "epoch": 3815} {"train_loss": -26.1905574798584, "global_step": 316674, "epoch": 3815} {"train_loss": -25.35879898071289, "global_step": 316675, "epoch": 3815} {"train_loss": -25.917455673217773, "global_step": 316676, "epoch": 3815} {"train_loss": -25.707067489624023, "global_step": 316677, "epoch": 3815} {"train_loss": -25.73719596862793, "global_step": 316678, "epoch": 3815} {"train_loss": -25.99224281311035, "global_step": 316679, "epoch": 3815} {"train_loss": -25.506607055664062, "global_step": 316680, "epoch": 3815} {"train_loss": -25.863082885742188, "global_step": 316681, "epoch": 3815} {"train_loss": -26.1014347076416, "global_step": 316682, "epoch": 3815} {"train_loss": -25.944494247436523, "global_step": 316683, "epoch": 3815} {"train_loss": -26.128143310546875, "global_step": 316684, "epoch": 3815} {"train_loss": -26.238027572631836, "global_step": 316685, "epoch": 3815} {"train_loss": -25.758686065673828, "global_step": 316686, "epoch": 3815} {"train_loss": -25.986474990844727, "global_step": 316687, "epoch": 3815} {"train_loss": -25.83503532409668, "global_step": 316688, "epoch": 3815} {"train_loss": -26.04810905456543, "global_step": 316689, "epoch": 3815} {"train_loss": -25.95989990234375, "global_step": 316690, "epoch": 3815} {"train_loss": -26.017908096313477, "global_step": 316691, "epoch": 3815} {"train_loss": -25.55129051208496, "global_step": 316692, "epoch": 3815} {"train_loss": -26.05511474609375, "global_step": 316693, "epoch": 3815} {"train_loss": -25.8052921295166, "global_step": 316694, "epoch": 3815} {"train_loss": -25.896717071533203, "global_step": 316695, "epoch": 3815} {"train_loss": -26.1397762298584, "global_step": 316696, "epoch": 3815} {"train_loss": -25.971654891967773, "global_step": 316697, "epoch": 3815} {"train_loss": -25.8935604095459, "global_step": 316698, "epoch": 3815} {"train_loss": -25.142974853515625, "global_step": 316699, "epoch": 3815} {"train_loss": -25.875364303588867, "global_step": 316700, "epoch": 3815} {"train_loss": -26.432096481323242, "global_step": 316701, "epoch": 3815} {"train_loss": -25.832895278930664, "global_step": 316702, "epoch": 3815} {"train_loss": -26.141340255737305, "global_step": 316703, "epoch": 3815} {"train_loss": -26.18842887878418, "global_step": 316704, "epoch": 3815} {"train_loss": -25.95180320739746, "global_step": 316705, "epoch": 3815} {"train_loss": -25.648588180541992, "global_step": 316706, "epoch": 3815} {"train_loss": -25.99445152282715, "global_step": 316707, "epoch": 3815} {"train_loss": -26.254119873046875, "global_step": 316708, "epoch": 3815} {"train_loss": -25.547868728637695, "global_step": 316709, "epoch": 3815} {"train_loss": -25.581045150756836, "global_step": 316710, "epoch": 3815} {"train_loss": -26.05136489868164, "global_step": 316711, "epoch": 3815} {"train_loss": -25.72198486328125, "global_step": 316712, "epoch": 3815} {"train_loss": -25.81853675842285, "global_step": 316713, "epoch": 3815} {"train_loss": -25.653894424438477, "global_step": 316714, "epoch": 3815} {"train_loss": -25.730594635009766, "global_step": 316715, "epoch": 3815} {"train_loss": -26.279809951782227, "global_step": 316716, "epoch": 3815} {"train_loss": -26.124963760375977, "global_step": 316717, "epoch": 3815} {"train_loss": -25.722492218017578, "global_step": 316718, "epoch": 3815} {"train_loss": -25.895172119140625, "global_step": 316719, "epoch": 3815} {"train_loss": -25.95350456237793, "global_step": 316720, "epoch": 3815} {"train_loss": -25.5858097076416, "global_step": 316721, "epoch": 3815} {"train_loss": -25.394834518432617, "global_step": 316722, "epoch": 3815} {"train_loss": -25.462623596191406, "global_step": 316723, "epoch": 3815} {"train_loss": -25.538131713867188, "global_step": 316724, "epoch": 3815} {"train_loss": -25.14471435546875, "global_step": 316725, "epoch": 3815} {"train_loss": -25.881479263305664, "global_step": 316726, "epoch": 3815} {"train_loss": -25.670287419514484, "global_step": 316727, "epoch": 3815, "val_loss": 7284266.0} {"train_loss": -23.932083129882812, "global_step": 316728, "epoch": 3816} {"train_loss": -25.11651611328125, "global_step": 316729, "epoch": 3816} {"train_loss": -25.090763092041016, "global_step": 316730, "epoch": 3816} {"train_loss": -24.837434768676758, "global_step": 316731, "epoch": 3816} {"train_loss": -25.03512954711914, "global_step": 316732, "epoch": 3816} {"train_loss": -24.917375564575195, "global_step": 316733, "epoch": 3816} {"train_loss": -24.822614669799805, "global_step": 316734, "epoch": 3816} {"train_loss": -25.21803092956543, "global_step": 316735, "epoch": 3816} {"train_loss": -25.371017456054688, "global_step": 316736, "epoch": 3816} {"train_loss": -25.079214096069336, "global_step": 316737, "epoch": 3816} {"train_loss": -25.3916072845459, "global_step": 316738, "epoch": 3816} {"train_loss": -25.121068954467773, "global_step": 316739, "epoch": 3816} {"train_loss": -25.626562118530273, "global_step": 316740, "epoch": 3816} {"train_loss": -25.700143814086914, "global_step": 316741, "epoch": 3816} {"train_loss": -25.35247802734375, "global_step": 316742, "epoch": 3816} {"train_loss": -25.322948455810547, "global_step": 316743, "epoch": 3816} {"train_loss": -25.209306716918945, "global_step": 316744, "epoch": 3816} {"train_loss": -25.462635040283203, "global_step": 316745, "epoch": 3816} {"train_loss": -25.8049373626709, "global_step": 316746, "epoch": 3816} {"train_loss": -25.653539657592773, "global_step": 316747, "epoch": 3816} {"train_loss": -25.47963523864746, "global_step": 316748, "epoch": 3816} {"train_loss": -25.686338424682617, "global_step": 316749, "epoch": 3816} {"train_loss": -25.875516891479492, "global_step": 316750, "epoch": 3816} {"train_loss": -25.33759880065918, "global_step": 316751, "epoch": 3816} {"train_loss": -25.349300384521484, "global_step": 316752, "epoch": 3816} {"train_loss": -25.915563583374023, "global_step": 316753, "epoch": 3816} {"train_loss": -26.11065101623535, "global_step": 316754, "epoch": 3816} {"train_loss": -25.922719955444336, "global_step": 316755, "epoch": 3816} {"train_loss": -26.10508155822754, "global_step": 316756, "epoch": 3816} {"train_loss": -25.782556533813477, "global_step": 316757, "epoch": 3816} {"train_loss": -25.829015731811523, "global_step": 316758, "epoch": 3816} {"train_loss": -25.2890682220459, "global_step": 316759, "epoch": 3816} {"train_loss": -25.916290283203125, "global_step": 316760, "epoch": 3816} {"train_loss": -25.641027450561523, "global_step": 316761, "epoch": 3816} {"train_loss": -25.58432960510254, "global_step": 316762, "epoch": 3816} {"train_loss": -26.00458335876465, "global_step": 316763, "epoch": 3816} {"train_loss": -25.81287956237793, "global_step": 316764, "epoch": 3816} {"train_loss": -25.7954044342041, "global_step": 316765, "epoch": 3816} {"train_loss": -25.501256942749023, "global_step": 316766, "epoch": 3816} {"train_loss": -25.914655685424805, "global_step": 316767, "epoch": 3816} {"train_loss": -26.147052764892578, "global_step": 316768, "epoch": 3816} {"train_loss": -25.58646011352539, "global_step": 316769, "epoch": 3816} {"train_loss": -25.657791137695312, "global_step": 316770, "epoch": 3816} {"train_loss": -25.544984817504883, "global_step": 316771, "epoch": 3816} {"train_loss": -26.180959701538086, "global_step": 316772, "epoch": 3816} {"train_loss": -25.75443458557129, "global_step": 316773, "epoch": 3816} {"train_loss": -25.625879287719727, "global_step": 316774, "epoch": 3816} {"train_loss": -26.096771240234375, "global_step": 316775, "epoch": 3816} {"train_loss": -25.846158981323242, "global_step": 316776, "epoch": 3816} {"train_loss": -25.420682907104492, "global_step": 316777, "epoch": 3816} {"train_loss": -25.39164161682129, "global_step": 316778, "epoch": 3816} {"train_loss": -25.560171127319336, "global_step": 316779, "epoch": 3816} {"train_loss": -25.55242156982422, "global_step": 316780, "epoch": 3816} {"train_loss": -25.83930778503418, "global_step": 316781, "epoch": 3816} {"train_loss": -25.86328125, "global_step": 316782, "epoch": 3816} {"train_loss": -25.6905517578125, "global_step": 316783, "epoch": 3816} {"train_loss": -25.35447120666504, "global_step": 316784, "epoch": 3816} {"train_loss": -26.169443130493164, "global_step": 316785, "epoch": 3816} {"train_loss": -25.624799728393555, "global_step": 316786, "epoch": 3816} {"train_loss": -25.823740005493164, "global_step": 316787, "epoch": 3816} {"train_loss": -25.390724182128906, "global_step": 316788, "epoch": 3816} {"train_loss": -25.52400779724121, "global_step": 316789, "epoch": 3816} {"train_loss": -25.714017868041992, "global_step": 316790, "epoch": 3816} {"train_loss": -25.831144332885742, "global_step": 316791, "epoch": 3816} {"train_loss": -25.911712646484375, "global_step": 316792, "epoch": 3816} {"train_loss": -25.54703712463379, "global_step": 316793, "epoch": 3816} {"train_loss": -25.898319244384766, "global_step": 316794, "epoch": 3816} {"train_loss": -26.260671615600586, "global_step": 316795, "epoch": 3816} {"train_loss": -25.371912002563477, "global_step": 316796, "epoch": 3816} {"train_loss": -25.67573356628418, "global_step": 316797, "epoch": 3816} {"train_loss": -25.726993560791016, "global_step": 316798, "epoch": 3816} {"train_loss": -26.11427116394043, "global_step": 316799, "epoch": 3816} {"train_loss": -26.260272979736328, "global_step": 316800, "epoch": 3816} {"train_loss": -25.81471061706543, "global_step": 316801, "epoch": 3816} {"train_loss": -26.166563034057617, "global_step": 316802, "epoch": 3816} {"train_loss": -25.819711685180664, "global_step": 316803, "epoch": 3816} {"train_loss": -26.025060653686523, "global_step": 316804, "epoch": 3816} {"train_loss": -26.1403865814209, "global_step": 316805, "epoch": 3816} {"train_loss": -26.032825469970703, "global_step": 316806, "epoch": 3816} {"train_loss": -25.829023361206055, "global_step": 316807, "epoch": 3816} {"train_loss": -26.14497184753418, "global_step": 316808, "epoch": 3816} {"train_loss": -25.924652099609375, "global_step": 316809, "epoch": 3816} {"train_loss": -25.633572865681476, "global_step": 316810, "epoch": 3816, "val_loss": 7242323.0} {"train_loss": -24.805583953857422, "global_step": 316811, "epoch": 3817} {"train_loss": -24.80475425720215, "global_step": 316812, "epoch": 3817} {"train_loss": -24.978408813476562, "global_step": 316813, "epoch": 3817} {"train_loss": -24.942373275756836, "global_step": 316814, "epoch": 3817} {"train_loss": -25.362165451049805, "global_step": 316815, "epoch": 3817} {"train_loss": -25.013137817382812, "global_step": 316816, "epoch": 3817} {"train_loss": -25.092376708984375, "global_step": 316817, "epoch": 3817} {"train_loss": -25.69426918029785, "global_step": 316818, "epoch": 3817} {"train_loss": -25.11647605895996, "global_step": 316819, "epoch": 3817} {"train_loss": -24.80141258239746, "global_step": 316820, "epoch": 3817} {"train_loss": -25.20768165588379, "global_step": 316821, "epoch": 3817} {"train_loss": -25.02213478088379, "global_step": 316822, "epoch": 3817} {"train_loss": -25.484207153320312, "global_step": 316823, "epoch": 3817} {"train_loss": -25.527034759521484, "global_step": 316824, "epoch": 3817} {"train_loss": -25.524280548095703, "global_step": 316825, "epoch": 3817} {"train_loss": -25.579465866088867, "global_step": 316826, "epoch": 3817} {"train_loss": -25.67120933532715, "global_step": 316827, "epoch": 3817} {"train_loss": -25.035799026489258, "global_step": 316828, "epoch": 3817} {"train_loss": -25.372228622436523, "global_step": 316829, "epoch": 3817} {"train_loss": -26.039636611938477, "global_step": 316830, "epoch": 3817} {"train_loss": -25.67183494567871, "global_step": 316831, "epoch": 3817} {"train_loss": -25.71970558166504, "global_step": 316832, "epoch": 3817} {"train_loss": -25.321622848510742, "global_step": 316833, "epoch": 3817} {"train_loss": -26.033605575561523, "global_step": 316834, "epoch": 3817} {"train_loss": -25.82842445373535, "global_step": 316835, "epoch": 3817} {"train_loss": -25.826507568359375, "global_step": 316836, "epoch": 3817} {"train_loss": -25.61612892150879, "global_step": 316837, "epoch": 3817} {"train_loss": -25.642414093017578, "global_step": 316838, "epoch": 3817} {"train_loss": -25.79058837890625, "global_step": 316839, "epoch": 3817} {"train_loss": -25.77020263671875, "global_step": 316840, "epoch": 3817} {"train_loss": -25.939748764038086, "global_step": 316841, "epoch": 3817} {"train_loss": -25.821557998657227, "global_step": 316842, "epoch": 3817} {"train_loss": -25.624942779541016, "global_step": 316843, "epoch": 3817} {"train_loss": -25.723615646362305, "global_step": 316844, "epoch": 3817} {"train_loss": -25.898191452026367, "global_step": 316845, "epoch": 3817} {"train_loss": -26.124637603759766, "global_step": 316846, "epoch": 3817} {"train_loss": -26.070337295532227, "global_step": 316847, "epoch": 3817} {"train_loss": -25.749902725219727, "global_step": 316848, "epoch": 3817} {"train_loss": -25.92792320251465, "global_step": 316849, "epoch": 3817} {"train_loss": -25.98682975769043, "global_step": 316850, "epoch": 3817} {"train_loss": -25.602985382080078, "global_step": 316851, "epoch": 3817} {"train_loss": -25.53486442565918, "global_step": 316852, "epoch": 3817} {"train_loss": -26.128864288330078, "global_step": 316853, "epoch": 3817} {"train_loss": -26.343414306640625, "global_step": 316854, "epoch": 3817} {"train_loss": -25.681121826171875, "global_step": 316855, "epoch": 3817} {"train_loss": -25.854084014892578, "global_step": 316856, "epoch": 3817} {"train_loss": -25.860187530517578, "global_step": 316857, "epoch": 3817} {"train_loss": -25.786102294921875, "global_step": 316858, "epoch": 3817} {"train_loss": -26.0207576751709, "global_step": 316859, "epoch": 3817} {"train_loss": -25.989566802978516, "global_step": 316860, "epoch": 3817} {"train_loss": -25.322656631469727, "global_step": 316861, "epoch": 3817} {"train_loss": -25.789539337158203, "global_step": 316862, "epoch": 3817} {"train_loss": -26.01300048828125, "global_step": 316863, "epoch": 3817} {"train_loss": -25.747119903564453, "global_step": 316864, "epoch": 3817} {"train_loss": -25.393573760986328, "global_step": 316865, "epoch": 3817} {"train_loss": -25.846399307250977, "global_step": 316866, "epoch": 3817} {"train_loss": -25.675006866455078, "global_step": 316867, "epoch": 3817} {"train_loss": -26.065282821655273, "global_step": 316868, "epoch": 3817} {"train_loss": -25.76593589782715, "global_step": 316869, "epoch": 3817} {"train_loss": -25.707365036010742, "global_step": 316870, "epoch": 3817} {"train_loss": -25.981897354125977, "global_step": 316871, "epoch": 3817} {"train_loss": -25.816144943237305, "global_step": 316872, "epoch": 3817} {"train_loss": -25.770355224609375, "global_step": 316873, "epoch": 3817} {"train_loss": -26.189682006835938, "global_step": 316874, "epoch": 3817} {"train_loss": -25.941675186157227, "global_step": 316875, "epoch": 3817} {"train_loss": -25.6340274810791, "global_step": 316876, "epoch": 3817} {"train_loss": -25.653974533081055, "global_step": 316877, "epoch": 3817} {"train_loss": -25.60546875, "global_step": 316878, "epoch": 3817} {"train_loss": -25.632678985595703, "global_step": 316879, "epoch": 3817} {"train_loss": -25.769880294799805, "global_step": 316880, "epoch": 3817} {"train_loss": -26.114166259765625, "global_step": 316881, "epoch": 3817} {"train_loss": -25.85524559020996, "global_step": 316882, "epoch": 3817} {"train_loss": -25.753347396850586, "global_step": 316883, "epoch": 3817} {"train_loss": -25.884443283081055, "global_step": 316884, "epoch": 3817} {"train_loss": -25.795547485351562, "global_step": 316885, "epoch": 3817} {"train_loss": -25.38010597229004, "global_step": 316886, "epoch": 3817} {"train_loss": -25.146848678588867, "global_step": 316887, "epoch": 3817} {"train_loss": -25.556671142578125, "global_step": 316888, "epoch": 3817} {"train_loss": -25.6502685546875, "global_step": 316889, "epoch": 3817} {"train_loss": -25.45406150817871, "global_step": 316890, "epoch": 3817} {"train_loss": -25.13332176208496, "global_step": 316891, "epoch": 3817} {"train_loss": -25.609663009643555, "global_step": 316892, "epoch": 3817} {"train_loss": -25.647479988006225, "global_step": 316893, "epoch": 3817, "val_loss": 7351289.0} {"train_loss": -25.234636306762695, "global_step": 316894, "epoch": 3818} {"train_loss": -25.35367774963379, "global_step": 316895, "epoch": 3818} {"train_loss": -25.461599349975586, "global_step": 316896, "epoch": 3818} {"train_loss": -25.309492111206055, "global_step": 316897, "epoch": 3818} {"train_loss": -25.6468563079834, "global_step": 316898, "epoch": 3818} {"train_loss": -25.271154403686523, "global_step": 316899, "epoch": 3818} {"train_loss": -25.278608322143555, "global_step": 316900, "epoch": 3818} {"train_loss": -25.661096572875977, "global_step": 316901, "epoch": 3818} {"train_loss": -25.640222549438477, "global_step": 316902, "epoch": 3818} {"train_loss": -25.658628463745117, "global_step": 316903, "epoch": 3818} {"train_loss": -25.798227310180664, "global_step": 316904, "epoch": 3818} {"train_loss": -25.764068603515625, "global_step": 316905, "epoch": 3818} {"train_loss": -25.60161781311035, "global_step": 316906, "epoch": 3818} {"train_loss": -25.800092697143555, "global_step": 316907, "epoch": 3818} {"train_loss": -25.999481201171875, "global_step": 316908, "epoch": 3818} {"train_loss": -25.57170295715332, "global_step": 316909, "epoch": 3818} {"train_loss": -25.404069900512695, "global_step": 316910, "epoch": 3818} {"train_loss": -25.68289566040039, "global_step": 316911, "epoch": 3818} {"train_loss": -25.536447525024414, "global_step": 316912, "epoch": 3818} {"train_loss": -25.7095947265625, "global_step": 316913, "epoch": 3818} {"train_loss": -25.585668563842773, "global_step": 316914, "epoch": 3818} {"train_loss": -26.33709144592285, "global_step": 316915, "epoch": 3818} {"train_loss": -25.622995376586914, "global_step": 316916, "epoch": 3818} {"train_loss": -25.836740493774414, "global_step": 316917, "epoch": 3818} {"train_loss": -25.38169288635254, "global_step": 316918, "epoch": 3818} {"train_loss": -26.015594482421875, "global_step": 316919, "epoch": 3818} {"train_loss": -25.527616500854492, "global_step": 316920, "epoch": 3818} {"train_loss": -26.029895782470703, "global_step": 316921, "epoch": 3818} {"train_loss": -25.9810848236084, "global_step": 316922, "epoch": 3818} {"train_loss": -25.905719757080078, "global_step": 316923, "epoch": 3818} {"train_loss": -25.41965675354004, "global_step": 316924, "epoch": 3818} {"train_loss": -26.122568130493164, "global_step": 316925, "epoch": 3818} {"train_loss": -25.905298233032227, "global_step": 316926, "epoch": 3818} {"train_loss": -25.87616539001465, "global_step": 316927, "epoch": 3818} {"train_loss": -25.716907501220703, "global_step": 316928, "epoch": 3818} {"train_loss": -25.830942153930664, "global_step": 316929, "epoch": 3818} {"train_loss": -25.765762329101562, "global_step": 316930, "epoch": 3818} {"train_loss": -25.660486221313477, "global_step": 316931, "epoch": 3818} {"train_loss": -25.848020553588867, "global_step": 316932, "epoch": 3818} {"train_loss": -26.00602149963379, "global_step": 316933, "epoch": 3818} {"train_loss": -25.552831649780273, "global_step": 316934, "epoch": 3818} {"train_loss": -25.787290573120117, "global_step": 316935, "epoch": 3818} {"train_loss": -25.635761260986328, "global_step": 316936, "epoch": 3818} {"train_loss": -25.957767486572266, "global_step": 316937, "epoch": 3818} {"train_loss": -26.0305118560791, "global_step": 316938, "epoch": 3818} {"train_loss": -25.660898208618164, "global_step": 316939, "epoch": 3818} {"train_loss": -25.582748413085938, "global_step": 316940, "epoch": 3818} {"train_loss": -25.935321807861328, "global_step": 316941, "epoch": 3818} {"train_loss": -25.781599044799805, "global_step": 316942, "epoch": 3818} {"train_loss": -25.831069946289062, "global_step": 316943, "epoch": 3818} {"train_loss": -25.840484619140625, "global_step": 316944, "epoch": 3818} {"train_loss": -26.025304794311523, "global_step": 316945, "epoch": 3818} {"train_loss": -25.7186279296875, "global_step": 316946, "epoch": 3818} {"train_loss": -25.452512741088867, "global_step": 316947, "epoch": 3818} {"train_loss": -26.1058349609375, "global_step": 316948, "epoch": 3818} {"train_loss": -25.963958740234375, "global_step": 316949, "epoch": 3818} {"train_loss": -25.947668075561523, "global_step": 316950, "epoch": 3818} {"train_loss": -25.697330474853516, "global_step": 316951, "epoch": 3818} {"train_loss": -25.723596572875977, "global_step": 316952, "epoch": 3818} {"train_loss": -25.845178604125977, "global_step": 316953, "epoch": 3818} {"train_loss": -25.59700584411621, "global_step": 316954, "epoch": 3818} {"train_loss": -25.699737548828125, "global_step": 316955, "epoch": 3818} {"train_loss": -25.2748966217041, "global_step": 316956, "epoch": 3818} {"train_loss": -25.927032470703125, "global_step": 316957, "epoch": 3818} {"train_loss": -25.707677841186523, "global_step": 316958, "epoch": 3818} {"train_loss": -25.8553466796875, "global_step": 316959, "epoch": 3818} {"train_loss": -25.887887954711914, "global_step": 316960, "epoch": 3818} {"train_loss": -25.584280014038086, "global_step": 316961, "epoch": 3818} {"train_loss": -25.576581954956055, "global_step": 316962, "epoch": 3818} {"train_loss": -25.89631462097168, "global_step": 316963, "epoch": 3818} {"train_loss": -25.80194091796875, "global_step": 316964, "epoch": 3818} {"train_loss": -25.7842960357666, "global_step": 316965, "epoch": 3818} {"train_loss": -25.83475685119629, "global_step": 316966, "epoch": 3818} {"train_loss": -26.112186431884766, "global_step": 316967, "epoch": 3818} {"train_loss": -25.541213989257812, "global_step": 316968, "epoch": 3818} {"train_loss": -25.53389549255371, "global_step": 316969, "epoch": 3818} {"train_loss": -25.798049926757812, "global_step": 316970, "epoch": 3818} {"train_loss": -25.362295150756836, "global_step": 316971, "epoch": 3818} {"train_loss": -25.876428604125977, "global_step": 316972, "epoch": 3818} {"train_loss": -25.85023307800293, "global_step": 316973, "epoch": 3818} {"train_loss": -25.92389488220215, "global_step": 316974, "epoch": 3818} {"train_loss": -25.72345542907715, "global_step": 316975, "epoch": 3818} {"train_loss": -25.744408940694417, "global_step": 316976, "epoch": 3818, "val_loss": 7352411.0} {"train_loss": -25.454626083374023, "global_step": 316977, "epoch": 3819} {"train_loss": -25.3048095703125, "global_step": 316978, "epoch": 3819} {"train_loss": -25.595291137695312, "global_step": 316979, "epoch": 3819} {"train_loss": -25.65122413635254, "global_step": 316980, "epoch": 3819} {"train_loss": -25.439950942993164, "global_step": 316981, "epoch": 3819} {"train_loss": -25.13984489440918, "global_step": 316982, "epoch": 3819} {"train_loss": -25.563459396362305, "global_step": 316983, "epoch": 3819} {"train_loss": -25.674835205078125, "global_step": 316984, "epoch": 3819} {"train_loss": -25.60968589782715, "global_step": 316985, "epoch": 3819} {"train_loss": -25.12618064880371, "global_step": 316986, "epoch": 3819} {"train_loss": -25.734731674194336, "global_step": 316987, "epoch": 3819} {"train_loss": -25.47382926940918, "global_step": 316988, "epoch": 3819} {"train_loss": -25.509967803955078, "global_step": 316989, "epoch": 3819} {"train_loss": -25.568666458129883, "global_step": 316990, "epoch": 3819} {"train_loss": -25.68124771118164, "global_step": 316991, "epoch": 3819} {"train_loss": -25.550737380981445, "global_step": 316992, "epoch": 3819} {"train_loss": -25.346540451049805, "global_step": 316993, "epoch": 3819} {"train_loss": -25.30491065979004, "global_step": 316994, "epoch": 3819} {"train_loss": -25.418466567993164, "global_step": 316995, "epoch": 3819} {"train_loss": -25.338449478149414, "global_step": 316996, "epoch": 3819} {"train_loss": -26.08016014099121, "global_step": 316997, "epoch": 3819} {"train_loss": -25.789447784423828, "global_step": 316998, "epoch": 3819} {"train_loss": -25.864362716674805, "global_step": 316999, "epoch": 3819} {"train_loss": -26.237539291381836, "global_step": 317000, "epoch": 3819} {"train_loss": -25.7810115814209, "global_step": 317001, "epoch": 3819} {"train_loss": -25.514440536499023, "global_step": 317002, "epoch": 3819} {"train_loss": -25.8625431060791, "global_step": 317003, "epoch": 3819} {"train_loss": -25.63532066345215, "global_step": 317004, "epoch": 3819} {"train_loss": -25.984304428100586, "global_step": 317005, "epoch": 3819} {"train_loss": -26.023889541625977, "global_step": 317006, "epoch": 3819} {"train_loss": -25.895370483398438, "global_step": 317007, "epoch": 3819} {"train_loss": -25.943603515625, "global_step": 317008, "epoch": 3819} {"train_loss": -25.8325252532959, "global_step": 317009, "epoch": 3819} {"train_loss": -25.80496597290039, "global_step": 317010, "epoch": 3819} {"train_loss": -25.825559616088867, "global_step": 317011, "epoch": 3819} {"train_loss": -26.123865127563477, "global_step": 317012, "epoch": 3819} {"train_loss": -25.734298706054688, "global_step": 317013, "epoch": 3819} {"train_loss": -25.71194839477539, "global_step": 317014, "epoch": 3819} {"train_loss": -25.744428634643555, "global_step": 317015, "epoch": 3819} {"train_loss": -26.065006256103516, "global_step": 317016, "epoch": 3819} {"train_loss": -25.77808952331543, "global_step": 317017, "epoch": 3819} {"train_loss": -25.649160385131836, "global_step": 317018, "epoch": 3819} {"train_loss": -25.848499298095703, "global_step": 317019, "epoch": 3819} {"train_loss": -26.43448257446289, "global_step": 317020, "epoch": 3819} {"train_loss": -26.213346481323242, "global_step": 317021, "epoch": 3819} {"train_loss": -25.84476661682129, "global_step": 317022, "epoch": 3819} {"train_loss": -25.94491958618164, "global_step": 317023, "epoch": 3819} {"train_loss": -26.113813400268555, "global_step": 317024, "epoch": 3819} {"train_loss": -26.03900146484375, "global_step": 317025, "epoch": 3819} {"train_loss": -26.055133819580078, "global_step": 317026, "epoch": 3819} {"train_loss": -25.649438858032227, "global_step": 317027, "epoch": 3819} {"train_loss": -25.82443618774414, "global_step": 317028, "epoch": 3819} {"train_loss": -25.805288314819336, "global_step": 317029, "epoch": 3819} {"train_loss": -25.6756534576416, "global_step": 317030, "epoch": 3819} {"train_loss": -26.077871322631836, "global_step": 317031, "epoch": 3819} {"train_loss": -25.950952529907227, "global_step": 317032, "epoch": 3819} {"train_loss": -25.989978790283203, "global_step": 317033, "epoch": 3819} {"train_loss": -25.269235610961914, "global_step": 317034, "epoch": 3819} {"train_loss": -25.26091957092285, "global_step": 317035, "epoch": 3819} {"train_loss": -25.46231460571289, "global_step": 317036, "epoch": 3819} {"train_loss": -25.29464340209961, "global_step": 317037, "epoch": 3819} {"train_loss": -25.699878692626953, "global_step": 317038, "epoch": 3819} {"train_loss": -25.785627365112305, "global_step": 317039, "epoch": 3819} {"train_loss": -25.0462703704834, "global_step": 317040, "epoch": 3819} {"train_loss": -25.82198143005371, "global_step": 317041, "epoch": 3819} {"train_loss": -25.718534469604492, "global_step": 317042, "epoch": 3819} {"train_loss": -25.835437774658203, "global_step": 317043, "epoch": 3819} {"train_loss": -25.734060287475586, "global_step": 317044, "epoch": 3819} {"train_loss": -25.986364364624023, "global_step": 317045, "epoch": 3819} {"train_loss": -25.825464248657227, "global_step": 317046, "epoch": 3819} {"train_loss": -25.654855728149414, "global_step": 317047, "epoch": 3819} {"train_loss": -25.831689834594727, "global_step": 317048, "epoch": 3819} {"train_loss": -25.913129806518555, "global_step": 317049, "epoch": 3819} {"train_loss": -25.76141929626465, "global_step": 317050, "epoch": 3819} {"train_loss": -25.665451049804688, "global_step": 317051, "epoch": 3819} {"train_loss": -26.03643798828125, "global_step": 317052, "epoch": 3819} {"train_loss": -26.07996940612793, "global_step": 317053, "epoch": 3819} {"train_loss": -25.847700119018555, "global_step": 317054, "epoch": 3819} {"train_loss": -25.970855712890625, "global_step": 317055, "epoch": 3819} {"train_loss": -25.517414093017578, "global_step": 317056, "epoch": 3819} {"train_loss": -25.908588409423828, "global_step": 317057, "epoch": 3819} {"train_loss": -25.945276260375977, "global_step": 317058, "epoch": 3819} {"train_loss": -25.74759115655738, "global_step": 317059, "epoch": 3819, "val_loss": 7323072.5} {"train_loss": -25.523101806640625, "global_step": 317060, "epoch": 3820} {"train_loss": -25.535125732421875, "global_step": 317061, "epoch": 3820} {"train_loss": -25.042051315307617, "global_step": 317062, "epoch": 3820} {"train_loss": -25.367380142211914, "global_step": 317063, "epoch": 3820} {"train_loss": -25.655542373657227, "global_step": 317064, "epoch": 3820} {"train_loss": -25.459407806396484, "global_step": 317065, "epoch": 3820} {"train_loss": -25.50281524658203, "global_step": 317066, "epoch": 3820} {"train_loss": -25.80751609802246, "global_step": 317067, "epoch": 3820} {"train_loss": -25.558170318603516, "global_step": 317068, "epoch": 3820} {"train_loss": -25.395658493041992, "global_step": 317069, "epoch": 3820} {"train_loss": -25.354825973510742, "global_step": 317070, "epoch": 3820} {"train_loss": -25.242658615112305, "global_step": 317071, "epoch": 3820} {"train_loss": -25.89821434020996, "global_step": 317072, "epoch": 3820} {"train_loss": -25.5009822845459, "global_step": 317073, "epoch": 3820} {"train_loss": -25.236120223999023, "global_step": 317074, "epoch": 3820} {"train_loss": -25.6500186920166, "global_step": 317075, "epoch": 3820} {"train_loss": -25.756162643432617, "global_step": 317076, "epoch": 3820} {"train_loss": -25.214344024658203, "global_step": 317077, "epoch": 3820} {"train_loss": -25.75831413269043, "global_step": 317078, "epoch": 3820} {"train_loss": -25.55449104309082, "global_step": 317079, "epoch": 3820} {"train_loss": -25.73309326171875, "global_step": 317080, "epoch": 3820} {"train_loss": -25.652099609375, "global_step": 317081, "epoch": 3820} {"train_loss": -26.119007110595703, "global_step": 317082, "epoch": 3820} {"train_loss": -25.432693481445312, "global_step": 317083, "epoch": 3820} {"train_loss": -25.574234008789062, "global_step": 317084, "epoch": 3820} {"train_loss": -25.61517333984375, "global_step": 317085, "epoch": 3820} {"train_loss": -25.653730392456055, "global_step": 317086, "epoch": 3820} {"train_loss": -26.057104110717773, "global_step": 317087, "epoch": 3820} {"train_loss": -25.71405601501465, "global_step": 317088, "epoch": 3820} {"train_loss": -25.897260665893555, "global_step": 317089, "epoch": 3820} {"train_loss": -25.652057647705078, "global_step": 317090, "epoch": 3820} {"train_loss": -26.30341148376465, "global_step": 317091, "epoch": 3820} {"train_loss": -26.143049240112305, "global_step": 317092, "epoch": 3820} {"train_loss": -25.983158111572266, "global_step": 317093, "epoch": 3820} {"train_loss": -25.780786514282227, "global_step": 317094, "epoch": 3820} {"train_loss": -25.906482696533203, "global_step": 317095, "epoch": 3820} {"train_loss": -26.000873565673828, "global_step": 317096, "epoch": 3820} {"train_loss": -25.76862907409668, "global_step": 317097, "epoch": 3820} {"train_loss": -26.00892448425293, "global_step": 317098, "epoch": 3820} {"train_loss": -25.872709274291992, "global_step": 317099, "epoch": 3820} {"train_loss": -25.794958114624023, "global_step": 317100, "epoch": 3820} {"train_loss": -25.88124656677246, "global_step": 317101, "epoch": 3820} {"train_loss": -25.945566177368164, "global_step": 317102, "epoch": 3820} {"train_loss": -25.81414222717285, "global_step": 317103, "epoch": 3820} {"train_loss": -25.809528350830078, "global_step": 317104, "epoch": 3820} {"train_loss": -25.684152603149414, "global_step": 317105, "epoch": 3820} {"train_loss": -25.554819107055664, "global_step": 317106, "epoch": 3820} {"train_loss": -26.147388458251953, "global_step": 317107, "epoch": 3820} {"train_loss": -25.84307861328125, "global_step": 317108, "epoch": 3820} {"train_loss": -25.747175216674805, "global_step": 317109, "epoch": 3820} {"train_loss": -26.1938419342041, "global_step": 317110, "epoch": 3820} {"train_loss": -26.214624404907227, "global_step": 317111, "epoch": 3820} {"train_loss": -25.653329849243164, "global_step": 317112, "epoch": 3820} {"train_loss": -25.461688995361328, "global_step": 317113, "epoch": 3820} {"train_loss": -25.397878646850586, "global_step": 317114, "epoch": 3820} {"train_loss": -26.10735511779785, "global_step": 317115, "epoch": 3820} {"train_loss": -26.039264678955078, "global_step": 317116, "epoch": 3820} {"train_loss": -25.557758331298828, "global_step": 317117, "epoch": 3820} {"train_loss": -25.74603843688965, "global_step": 317118, "epoch": 3820} {"train_loss": -25.92921257019043, "global_step": 317119, "epoch": 3820} {"train_loss": -25.89727210998535, "global_step": 317120, "epoch": 3820} {"train_loss": -26.064727783203125, "global_step": 317121, "epoch": 3820} {"train_loss": -25.848346710205078, "global_step": 317122, "epoch": 3820} {"train_loss": -26.011579513549805, "global_step": 317123, "epoch": 3820} {"train_loss": -26.070043563842773, "global_step": 317124, "epoch": 3820} {"train_loss": -25.9548397064209, "global_step": 317125, "epoch": 3820} {"train_loss": -25.65277099609375, "global_step": 317126, "epoch": 3820} {"train_loss": -25.640975952148438, "global_step": 317127, "epoch": 3820} {"train_loss": -25.974950790405273, "global_step": 317128, "epoch": 3820} {"train_loss": -25.961246490478516, "global_step": 317129, "epoch": 3820} {"train_loss": -25.619897842407227, "global_step": 317130, "epoch": 3820} {"train_loss": -25.950092315673828, "global_step": 317131, "epoch": 3820} {"train_loss": -25.385848999023438, "global_step": 317132, "epoch": 3820} {"train_loss": -25.990283966064453, "global_step": 317133, "epoch": 3820} {"train_loss": -25.7255916595459, "global_step": 317134, "epoch": 3820} {"train_loss": -25.69295310974121, "global_step": 317135, "epoch": 3820} {"train_loss": -25.95220375061035, "global_step": 317136, "epoch": 3820} {"train_loss": -26.069995880126953, "global_step": 317137, "epoch": 3820} {"train_loss": -25.46224021911621, "global_step": 317138, "epoch": 3820} {"train_loss": -25.58131980895996, "global_step": 317139, "epoch": 3820} {"train_loss": -25.7020206451416, "global_step": 317140, "epoch": 3820} {"train_loss": -26.021203994750977, "global_step": 317141, "epoch": 3820} {"train_loss": -25.751623682228917, "global_step": 317142, "epoch": 3820, "val_loss": 7114161.0} {"train_loss": -25.631702423095703, "global_step": 317143, "epoch": 3821} {"train_loss": -25.083600997924805, "global_step": 317144, "epoch": 3821} {"train_loss": -25.877277374267578, "global_step": 317145, "epoch": 3821} {"train_loss": -25.72452163696289, "global_step": 317146, "epoch": 3821} {"train_loss": -25.1743221282959, "global_step": 317147, "epoch": 3821} {"train_loss": -25.430057525634766, "global_step": 317148, "epoch": 3821} {"train_loss": -25.46438980102539, "global_step": 317149, "epoch": 3821} {"train_loss": -25.202367782592773, "global_step": 317150, "epoch": 3821} {"train_loss": -25.221128463745117, "global_step": 317151, "epoch": 3821} {"train_loss": -25.15737533569336, "global_step": 317152, "epoch": 3821} {"train_loss": -25.474157333374023, "global_step": 317153, "epoch": 3821} {"train_loss": -25.808639526367188, "global_step": 317154, "epoch": 3821} {"train_loss": -25.063472747802734, "global_step": 317155, "epoch": 3821} {"train_loss": -25.657556533813477, "global_step": 317156, "epoch": 3821} {"train_loss": -25.015254974365234, "global_step": 317157, "epoch": 3821} {"train_loss": -25.338058471679688, "global_step": 317158, "epoch": 3821} {"train_loss": -25.77606773376465, "global_step": 317159, "epoch": 3821} {"train_loss": -25.54191017150879, "global_step": 317160, "epoch": 3821} {"train_loss": -25.623991012573242, "global_step": 317161, "epoch": 3821} {"train_loss": -26.13205909729004, "global_step": 317162, "epoch": 3821} {"train_loss": -25.75080680847168, "global_step": 317163, "epoch": 3821} {"train_loss": -25.624958038330078, "global_step": 317164, "epoch": 3821} {"train_loss": -25.459671020507812, "global_step": 317165, "epoch": 3821} {"train_loss": -25.716419219970703, "global_step": 317166, "epoch": 3821} {"train_loss": -25.58680534362793, "global_step": 317167, "epoch": 3821} {"train_loss": -25.75935935974121, "global_step": 317168, "epoch": 3821} {"train_loss": -25.74662208557129, "global_step": 317169, "epoch": 3821} {"train_loss": -25.746173858642578, "global_step": 317170, "epoch": 3821} {"train_loss": -25.67929458618164, "global_step": 317171, "epoch": 3821} {"train_loss": -25.799436569213867, "global_step": 317172, "epoch": 3821} {"train_loss": -25.85286521911621, "global_step": 317173, "epoch": 3821} {"train_loss": -25.900043487548828, "global_step": 317174, "epoch": 3821} {"train_loss": -26.164505004882812, "global_step": 317175, "epoch": 3821} {"train_loss": -25.62380027770996, "global_step": 317176, "epoch": 3821} {"train_loss": -25.898656845092773, "global_step": 317177, "epoch": 3821} {"train_loss": -26.012195587158203, "global_step": 317178, "epoch": 3821} {"train_loss": -25.87774085998535, "global_step": 317179, "epoch": 3821} {"train_loss": -25.99143409729004, "global_step": 317180, "epoch": 3821} {"train_loss": -26.115768432617188, "global_step": 317181, "epoch": 3821} {"train_loss": -26.340707778930664, "global_step": 317182, "epoch": 3821} {"train_loss": -26.00006675720215, "global_step": 317183, "epoch": 3821} {"train_loss": -25.978195190429688, "global_step": 317184, "epoch": 3821} {"train_loss": -25.84183120727539, "global_step": 317185, "epoch": 3821} {"train_loss": -26.075809478759766, "global_step": 317186, "epoch": 3821} {"train_loss": -25.9860782623291, "global_step": 317187, "epoch": 3821} {"train_loss": -26.004087448120117, "global_step": 317188, "epoch": 3821} {"train_loss": -25.9027156829834, "global_step": 317189, "epoch": 3821} {"train_loss": -25.570371627807617, "global_step": 317190, "epoch": 3821} {"train_loss": -25.896442413330078, "global_step": 317191, "epoch": 3821} {"train_loss": -26.21622085571289, "global_step": 317192, "epoch": 3821} {"train_loss": -25.764179229736328, "global_step": 317193, "epoch": 3821} {"train_loss": -26.06546974182129, "global_step": 317194, "epoch": 3821} {"train_loss": -25.90931510925293, "global_step": 317195, "epoch": 3821} {"train_loss": -25.922626495361328, "global_step": 317196, "epoch": 3821} {"train_loss": -25.840208053588867, "global_step": 317197, "epoch": 3821} {"train_loss": -25.886444091796875, "global_step": 317198, "epoch": 3821} {"train_loss": -25.722135543823242, "global_step": 317199, "epoch": 3821} {"train_loss": -25.611066818237305, "global_step": 317200, "epoch": 3821} {"train_loss": -25.807584762573242, "global_step": 317201, "epoch": 3821} {"train_loss": -25.84869956970215, "global_step": 317202, "epoch": 3821} {"train_loss": -25.513093948364258, "global_step": 317203, "epoch": 3821} {"train_loss": -25.892169952392578, "global_step": 317204, "epoch": 3821} {"train_loss": -25.983325958251953, "global_step": 317205, "epoch": 3821} {"train_loss": -25.666748046875, "global_step": 317206, "epoch": 3821} {"train_loss": -25.699493408203125, "global_step": 317207, "epoch": 3821} {"train_loss": -25.367774963378906, "global_step": 317208, "epoch": 3821} {"train_loss": -24.453176498413086, "global_step": 317209, "epoch": 3821} {"train_loss": -24.33930206298828, "global_step": 317210, "epoch": 3821} {"train_loss": -25.230871200561523, "global_step": 317211, "epoch": 3821} {"train_loss": -25.321081161499023, "global_step": 317212, "epoch": 3821} {"train_loss": -25.383220672607422, "global_step": 317213, "epoch": 3821} {"train_loss": -25.507843017578125, "global_step": 317214, "epoch": 3821} {"train_loss": -25.230520248413086, "global_step": 317215, "epoch": 3821} {"train_loss": -25.92657470703125, "global_step": 317216, "epoch": 3821} {"train_loss": -25.176183700561523, "global_step": 317217, "epoch": 3821} {"train_loss": -25.683881759643555, "global_step": 317218, "epoch": 3821} {"train_loss": -25.883533477783203, "global_step": 317219, "epoch": 3821} {"train_loss": -25.70149803161621, "global_step": 317220, "epoch": 3821} {"train_loss": -25.713912963867188, "global_step": 317221, "epoch": 3821} {"train_loss": -25.981367111206055, "global_step": 317222, "epoch": 3821} {"train_loss": -26.034671783447266, "global_step": 317223, "epoch": 3821} {"train_loss": -25.685712814331055, "global_step": 317224, "epoch": 3821} {"train_loss": -25.658633381487377, "global_step": 317225, "epoch": 3821, "val_loss": 7262125.0} {"train_loss": -25.699844360351562, "global_step": 317226, "epoch": 3822} {"train_loss": -25.504589080810547, "global_step": 317227, "epoch": 3822} {"train_loss": -25.445892333984375, "global_step": 317228, "epoch": 3822} {"train_loss": -25.5526123046875, "global_step": 317229, "epoch": 3822} {"train_loss": -25.51421356201172, "global_step": 317230, "epoch": 3822} {"train_loss": -25.842554092407227, "global_step": 317231, "epoch": 3822} {"train_loss": -25.202239990234375, "global_step": 317232, "epoch": 3822} {"train_loss": -25.94325828552246, "global_step": 317233, "epoch": 3822} {"train_loss": -25.496599197387695, "global_step": 317234, "epoch": 3822} {"train_loss": -25.75160026550293, "global_step": 317235, "epoch": 3822} {"train_loss": -25.462064743041992, "global_step": 317236, "epoch": 3822} {"train_loss": -25.670927047729492, "global_step": 317237, "epoch": 3822} {"train_loss": -25.95454216003418, "global_step": 317238, "epoch": 3822} {"train_loss": -25.797170639038086, "global_step": 317239, "epoch": 3822} {"train_loss": -25.692035675048828, "global_step": 317240, "epoch": 3822} {"train_loss": -26.044355392456055, "global_step": 317241, "epoch": 3822} {"train_loss": -25.933454513549805, "global_step": 317242, "epoch": 3822} {"train_loss": -26.13838768005371, "global_step": 317243, "epoch": 3822} {"train_loss": -25.730512619018555, "global_step": 317244, "epoch": 3822} {"train_loss": -25.58382225036621, "global_step": 317245, "epoch": 3822} {"train_loss": -25.772314071655273, "global_step": 317246, "epoch": 3822} {"train_loss": -25.77241325378418, "global_step": 317247, "epoch": 3822} {"train_loss": -25.880756378173828, "global_step": 317248, "epoch": 3822} {"train_loss": -26.062559127807617, "global_step": 317249, "epoch": 3822} {"train_loss": -25.848480224609375, "global_step": 317250, "epoch": 3822} {"train_loss": -25.773954391479492, "global_step": 317251, "epoch": 3822} {"train_loss": -25.7762508392334, "global_step": 317252, "epoch": 3822} {"train_loss": -25.76112937927246, "global_step": 317253, "epoch": 3822} {"train_loss": -25.87836265563965, "global_step": 317254, "epoch": 3822} {"train_loss": -25.909473419189453, "global_step": 317255, "epoch": 3822} {"train_loss": -26.187292098999023, "global_step": 317256, "epoch": 3822} {"train_loss": -25.915517807006836, "global_step": 317257, "epoch": 3822} {"train_loss": -26.048267364501953, "global_step": 317258, "epoch": 3822} {"train_loss": -25.79056167602539, "global_step": 317259, "epoch": 3822} {"train_loss": -25.784564971923828, "global_step": 317260, "epoch": 3822} {"train_loss": -25.763051986694336, "global_step": 317261, "epoch": 3822} {"train_loss": -26.1680908203125, "global_step": 317262, "epoch": 3822} {"train_loss": -25.89320182800293, "global_step": 317263, "epoch": 3822} {"train_loss": -25.669727325439453, "global_step": 317264, "epoch": 3822} {"train_loss": -25.821557998657227, "global_step": 317265, "epoch": 3822} {"train_loss": -25.70948600769043, "global_step": 317266, "epoch": 3822} {"train_loss": -26.003265380859375, "global_step": 317267, "epoch": 3822} {"train_loss": -25.896076202392578, "global_step": 317268, "epoch": 3822} {"train_loss": -25.426084518432617, "global_step": 317269, "epoch": 3822} {"train_loss": -25.485143661499023, "global_step": 317270, "epoch": 3822} {"train_loss": -26.208240509033203, "global_step": 317271, "epoch": 3822} {"train_loss": -26.106409072875977, "global_step": 317272, "epoch": 3822} {"train_loss": -25.9421329498291, "global_step": 317273, "epoch": 3822} {"train_loss": -25.580812454223633, "global_step": 317274, "epoch": 3822} {"train_loss": -25.797016143798828, "global_step": 317275, "epoch": 3822} {"train_loss": -25.76265525817871, "global_step": 317276, "epoch": 3822} {"train_loss": -25.991413116455078, "global_step": 317277, "epoch": 3822} {"train_loss": -26.206451416015625, "global_step": 317278, "epoch": 3822} {"train_loss": -25.69733238220215, "global_step": 317279, "epoch": 3822} {"train_loss": -25.79541015625, "global_step": 317280, "epoch": 3822} {"train_loss": -25.723556518554688, "global_step": 317281, "epoch": 3822} {"train_loss": -25.92194938659668, "global_step": 317282, "epoch": 3822} {"train_loss": -26.09397315979004, "global_step": 317283, "epoch": 3822} {"train_loss": -26.130462646484375, "global_step": 317284, "epoch": 3822} {"train_loss": -25.87764549255371, "global_step": 317285, "epoch": 3822} {"train_loss": -25.96701431274414, "global_step": 317286, "epoch": 3822} {"train_loss": -25.948556900024414, "global_step": 317287, "epoch": 3822} {"train_loss": -26.241199493408203, "global_step": 317288, "epoch": 3822} {"train_loss": -25.797250747680664, "global_step": 317289, "epoch": 3822} {"train_loss": -25.920995712280273, "global_step": 317290, "epoch": 3822} {"train_loss": -25.762592315673828, "global_step": 317291, "epoch": 3822} {"train_loss": -25.793737411499023, "global_step": 317292, "epoch": 3822} {"train_loss": -25.572975158691406, "global_step": 317293, "epoch": 3822} {"train_loss": -25.827611923217773, "global_step": 317294, "epoch": 3822} {"train_loss": -25.9996337890625, "global_step": 317295, "epoch": 3822} {"train_loss": -25.801782608032227, "global_step": 317296, "epoch": 3822} {"train_loss": -26.035877227783203, "global_step": 317297, "epoch": 3822} {"train_loss": -25.8320369720459, "global_step": 317298, "epoch": 3822} {"train_loss": -25.748550415039062, "global_step": 317299, "epoch": 3822} {"train_loss": -25.280750274658203, "global_step": 317300, "epoch": 3822} {"train_loss": -26.003219604492188, "global_step": 317301, "epoch": 3822} {"train_loss": -25.941511154174805, "global_step": 317302, "epoch": 3822} {"train_loss": -26.061323165893555, "global_step": 317303, "epoch": 3822} {"train_loss": -25.79084587097168, "global_step": 317304, "epoch": 3822} {"train_loss": -26.072067260742188, "global_step": 317305, "epoch": 3822} {"train_loss": -25.811695098876953, "global_step": 317306, "epoch": 3822} {"train_loss": -25.727096557617188, "global_step": 317307, "epoch": 3822} {"train_loss": -25.85534599028438, "global_step": 317308, "epoch": 3822, "val_loss": 7329771.0} {"train_loss": -24.675495147705078, "global_step": 317309, "epoch": 3823} {"train_loss": -24.720808029174805, "global_step": 317310, "epoch": 3823} {"train_loss": -25.18636131286621, "global_step": 317311, "epoch": 3823} {"train_loss": -25.058820724487305, "global_step": 317312, "epoch": 3823} {"train_loss": -25.493759155273438, "global_step": 317313, "epoch": 3823} {"train_loss": -24.94287109375, "global_step": 317314, "epoch": 3823} {"train_loss": -25.662084579467773, "global_step": 317315, "epoch": 3823} {"train_loss": -25.324676513671875, "global_step": 317316, "epoch": 3823} {"train_loss": -25.24271011352539, "global_step": 317317, "epoch": 3823} {"train_loss": -25.22188949584961, "global_step": 317318, "epoch": 3823} {"train_loss": -25.855411529541016, "global_step": 317319, "epoch": 3823} {"train_loss": -25.54684066772461, "global_step": 317320, "epoch": 3823} {"train_loss": -25.16774559020996, "global_step": 317321, "epoch": 3823} {"train_loss": -25.359817504882812, "global_step": 317322, "epoch": 3823} {"train_loss": -25.401803970336914, "global_step": 317323, "epoch": 3823} {"train_loss": -25.55716896057129, "global_step": 317324, "epoch": 3823} {"train_loss": -25.566850662231445, "global_step": 317325, "epoch": 3823} {"train_loss": -25.10199546813965, "global_step": 317326, "epoch": 3823} {"train_loss": -25.394750595092773, "global_step": 317327, "epoch": 3823} {"train_loss": -25.774145126342773, "global_step": 317328, "epoch": 3823} {"train_loss": -25.3966007232666, "global_step": 317329, "epoch": 3823} {"train_loss": -25.62908363342285, "global_step": 317330, "epoch": 3823} {"train_loss": -25.7684268951416, "global_step": 317331, "epoch": 3823} {"train_loss": -25.86688232421875, "global_step": 317332, "epoch": 3823} {"train_loss": -25.498254776000977, "global_step": 317333, "epoch": 3823} {"train_loss": -25.797651290893555, "global_step": 317334, "epoch": 3823} {"train_loss": -25.752416610717773, "global_step": 317335, "epoch": 3823} {"train_loss": -25.950586318969727, "global_step": 317336, "epoch": 3823} {"train_loss": -25.853240966796875, "global_step": 317337, "epoch": 3823} {"train_loss": -25.6047306060791, "global_step": 317338, "epoch": 3823} {"train_loss": -25.95624351501465, "global_step": 317339, "epoch": 3823} {"train_loss": -25.507436752319336, "global_step": 317340, "epoch": 3823} {"train_loss": -25.8084716796875, "global_step": 317341, "epoch": 3823} {"train_loss": -25.471220016479492, "global_step": 317342, "epoch": 3823} {"train_loss": -25.456655502319336, "global_step": 317343, "epoch": 3823} {"train_loss": -25.712614059448242, "global_step": 317344, "epoch": 3823} {"train_loss": -25.431583404541016, "global_step": 317345, "epoch": 3823} {"train_loss": -25.227678298950195, "global_step": 317346, "epoch": 3823} {"train_loss": -25.88653564453125, "global_step": 317347, "epoch": 3823} {"train_loss": -25.665246963500977, "global_step": 317348, "epoch": 3823} {"train_loss": -25.664093017578125, "global_step": 317349, "epoch": 3823} {"train_loss": -25.878137588500977, "global_step": 317350, "epoch": 3823} {"train_loss": -25.816059112548828, "global_step": 317351, "epoch": 3823} {"train_loss": -25.904865264892578, "global_step": 317352, "epoch": 3823} {"train_loss": -25.735767364501953, "global_step": 317353, "epoch": 3823} {"train_loss": -25.654006958007812, "global_step": 317354, "epoch": 3823} {"train_loss": -26.06330680847168, "global_step": 317355, "epoch": 3823} {"train_loss": -25.860214233398438, "global_step": 317356, "epoch": 3823} {"train_loss": -26.14462661743164, "global_step": 317357, "epoch": 3823} {"train_loss": -26.19056510925293, "global_step": 317358, "epoch": 3823} {"train_loss": -25.774627685546875, "global_step": 317359, "epoch": 3823} {"train_loss": -25.423171997070312, "global_step": 317360, "epoch": 3823} {"train_loss": -25.956348419189453, "global_step": 317361, "epoch": 3823} {"train_loss": -25.689453125, "global_step": 317362, "epoch": 3823} {"train_loss": -26.015424728393555, "global_step": 317363, "epoch": 3823} {"train_loss": -25.567718505859375, "global_step": 317364, "epoch": 3823} {"train_loss": -26.057605743408203, "global_step": 317365, "epoch": 3823} {"train_loss": -26.098072052001953, "global_step": 317366, "epoch": 3823} {"train_loss": -26.117170333862305, "global_step": 317367, "epoch": 3823} {"train_loss": -26.058307647705078, "global_step": 317368, "epoch": 3823} {"train_loss": -25.76190185546875, "global_step": 317369, "epoch": 3823} {"train_loss": -25.8266658782959, "global_step": 317370, "epoch": 3823} {"train_loss": -25.622970581054688, "global_step": 317371, "epoch": 3823} {"train_loss": -25.639123916625977, "global_step": 317372, "epoch": 3823} {"train_loss": -25.74725341796875, "global_step": 317373, "epoch": 3823} {"train_loss": -25.57059669494629, "global_step": 317374, "epoch": 3823} {"train_loss": -26.09964942932129, "global_step": 317375, "epoch": 3823} {"train_loss": -25.918598175048828, "global_step": 317376, "epoch": 3823} {"train_loss": -25.85042381286621, "global_step": 317377, "epoch": 3823} {"train_loss": -25.589296340942383, "global_step": 317378, "epoch": 3823} {"train_loss": -26.078229904174805, "global_step": 317379, "epoch": 3823} {"train_loss": -25.950275421142578, "global_step": 317380, "epoch": 3823} {"train_loss": -25.525121688842773, "global_step": 317381, "epoch": 3823} {"train_loss": -25.872034072875977, "global_step": 317382, "epoch": 3823} {"train_loss": -25.66766929626465, "global_step": 317383, "epoch": 3823} {"train_loss": -25.8456974029541, "global_step": 317384, "epoch": 3823} {"train_loss": -25.985675811767578, "global_step": 317385, "epoch": 3823} {"train_loss": -25.62225914001465, "global_step": 317386, "epoch": 3823} {"train_loss": -25.67705726623535, "global_step": 317387, "epoch": 3823} {"train_loss": -25.540922164916992, "global_step": 317388, "epoch": 3823} {"train_loss": -25.33302116394043, "global_step": 317389, "epoch": 3823} {"train_loss": -25.83368492126465, "global_step": 317390, "epoch": 3823} {"train_loss": -25.672832489013672, "global_step": 317391, "epoch": 3823, "val_loss": 7429377.0} {"train_loss": -24.82940673828125, "global_step": 317392, "epoch": 3824} {"train_loss": -24.621549606323242, "global_step": 317393, "epoch": 3824} {"train_loss": -25.21681785583496, "global_step": 317394, "epoch": 3824} {"train_loss": -25.358396530151367, "global_step": 317395, "epoch": 3824} {"train_loss": -25.089426040649414, "global_step": 317396, "epoch": 3824} {"train_loss": -25.04833984375, "global_step": 317397, "epoch": 3824} {"train_loss": -25.15677833557129, "global_step": 317398, "epoch": 3824} {"train_loss": -24.900257110595703, "global_step": 317399, "epoch": 3824} {"train_loss": -25.26045799255371, "global_step": 317400, "epoch": 3824} {"train_loss": -25.14714241027832, "global_step": 317401, "epoch": 3824} {"train_loss": -25.112478256225586, "global_step": 317402, "epoch": 3824} {"train_loss": -25.507614135742188, "global_step": 317403, "epoch": 3824} {"train_loss": -25.64004898071289, "global_step": 317404, "epoch": 3824} {"train_loss": -25.643604278564453, "global_step": 317405, "epoch": 3824} {"train_loss": -25.402301788330078, "global_step": 317406, "epoch": 3824} {"train_loss": -25.39849281311035, "global_step": 317407, "epoch": 3824} {"train_loss": -25.409032821655273, "global_step": 317408, "epoch": 3824} {"train_loss": -25.507299423217773, "global_step": 317409, "epoch": 3824} {"train_loss": -25.698883056640625, "global_step": 317410, "epoch": 3824} {"train_loss": -25.3875789642334, "global_step": 317411, "epoch": 3824} {"train_loss": -25.4530029296875, "global_step": 317412, "epoch": 3824} {"train_loss": -25.911407470703125, "global_step": 317413, "epoch": 3824} {"train_loss": -25.57258415222168, "global_step": 317414, "epoch": 3824} {"train_loss": -25.686487197875977, "global_step": 317415, "epoch": 3824} {"train_loss": -25.51850700378418, "global_step": 317416, "epoch": 3824} {"train_loss": -25.829320907592773, "global_step": 317417, "epoch": 3824} {"train_loss": -25.75660514831543, "global_step": 317418, "epoch": 3824} {"train_loss": -25.7310791015625, "global_step": 317419, "epoch": 3824} {"train_loss": -25.738317489624023, "global_step": 317420, "epoch": 3824} {"train_loss": -25.84653091430664, "global_step": 317421, "epoch": 3824} {"train_loss": -25.829864501953125, "global_step": 317422, "epoch": 3824} {"train_loss": -26.191919326782227, "global_step": 317423, "epoch": 3824} {"train_loss": -25.800907135009766, "global_step": 317424, "epoch": 3824} {"train_loss": -26.0980167388916, "global_step": 317425, "epoch": 3824} {"train_loss": -25.8892879486084, "global_step": 317426, "epoch": 3824} {"train_loss": -25.9625301361084, "global_step": 317427, "epoch": 3824} {"train_loss": -26.050628662109375, "global_step": 317428, "epoch": 3824} {"train_loss": -25.72504234313965, "global_step": 317429, "epoch": 3824} {"train_loss": -26.012542724609375, "global_step": 317430, "epoch": 3824} {"train_loss": -26.304824829101562, "global_step": 317431, "epoch": 3824} {"train_loss": -25.90586280822754, "global_step": 317432, "epoch": 3824} {"train_loss": -26.046344757080078, "global_step": 317433, "epoch": 3824} {"train_loss": -25.941577911376953, "global_step": 317434, "epoch": 3824} {"train_loss": -26.052366256713867, "global_step": 317435, "epoch": 3824} {"train_loss": -25.56409454345703, "global_step": 317436, "epoch": 3824} {"train_loss": -26.293079376220703, "global_step": 317437, "epoch": 3824} {"train_loss": -25.851428985595703, "global_step": 317438, "epoch": 3824} {"train_loss": -25.987384796142578, "global_step": 317439, "epoch": 3824} {"train_loss": -25.953128814697266, "global_step": 317440, "epoch": 3824} {"train_loss": -25.6466121673584, "global_step": 317441, "epoch": 3824} {"train_loss": -25.920135498046875, "global_step": 317442, "epoch": 3824} {"train_loss": -26.535663604736328, "global_step": 317443, "epoch": 3824} {"train_loss": -25.897375106811523, "global_step": 317444, "epoch": 3824} {"train_loss": -25.676313400268555, "global_step": 317445, "epoch": 3824} {"train_loss": -25.791086196899414, "global_step": 317446, "epoch": 3824} {"train_loss": -25.85784912109375, "global_step": 317447, "epoch": 3824} {"train_loss": -26.189905166625977, "global_step": 317448, "epoch": 3824} {"train_loss": -25.83026123046875, "global_step": 317449, "epoch": 3824} {"train_loss": -25.658483505249023, "global_step": 317450, "epoch": 3824} {"train_loss": -25.9903564453125, "global_step": 317451, "epoch": 3824} {"train_loss": -25.889606475830078, "global_step": 317452, "epoch": 3824} {"train_loss": -26.2146053314209, "global_step": 317453, "epoch": 3824} {"train_loss": -26.4003849029541, "global_step": 317454, "epoch": 3824} {"train_loss": -26.04957389831543, "global_step": 317455, "epoch": 3824} {"train_loss": -25.830228805541992, "global_step": 317456, "epoch": 3824} {"train_loss": -25.570125579833984, "global_step": 317457, "epoch": 3824} {"train_loss": -25.46698570251465, "global_step": 317458, "epoch": 3824} {"train_loss": -25.7689151763916, "global_step": 317459, "epoch": 3824} {"train_loss": -26.140653610229492, "global_step": 317460, "epoch": 3824} {"train_loss": -25.865772247314453, "global_step": 317461, "epoch": 3824} {"train_loss": -26.146177291870117, "global_step": 317462, "epoch": 3824} {"train_loss": -25.62702751159668, "global_step": 317463, "epoch": 3824} {"train_loss": -26.202661514282227, "global_step": 317464, "epoch": 3824} {"train_loss": -25.56534767150879, "global_step": 317465, "epoch": 3824} {"train_loss": -25.758243560791016, "global_step": 317466, "epoch": 3824} {"train_loss": -25.675756454467773, "global_step": 317467, "epoch": 3824} {"train_loss": -25.709753036499023, "global_step": 317468, "epoch": 3824} {"train_loss": -25.508230209350586, "global_step": 317469, "epoch": 3824} {"train_loss": -25.85614013671875, "global_step": 317470, "epoch": 3824} {"train_loss": -25.877477645874023, "global_step": 317471, "epoch": 3824} {"train_loss": -25.630002975463867, "global_step": 317472, "epoch": 3824} {"train_loss": -25.9169921875, "global_step": 317473, "epoch": 3824} {"train_loss": -25.744032342749907, "global_step": 317474, "epoch": 3824, "val_loss": 7411103.5} {"train_loss": -24.05263328552246, "global_step": 317475, "epoch": 3825} {"train_loss": -24.724889755249023, "global_step": 317476, "epoch": 3825} {"train_loss": -24.068601608276367, "global_step": 317477, "epoch": 3825} {"train_loss": -24.016483306884766, "global_step": 317478, "epoch": 3825} {"train_loss": -23.704511642456055, "global_step": 317479, "epoch": 3825} {"train_loss": -24.30487632751465, "global_step": 317480, "epoch": 3825} {"train_loss": -24.092741012573242, "global_step": 317481, "epoch": 3825} {"train_loss": -24.178205490112305, "global_step": 317482, "epoch": 3825} {"train_loss": -24.398508071899414, "global_step": 317483, "epoch": 3825} {"train_loss": -24.687255859375, "global_step": 317484, "epoch": 3825} {"train_loss": -24.53397560119629, "global_step": 317485, "epoch": 3825} {"train_loss": -24.46465492248535, "global_step": 317486, "epoch": 3825} {"train_loss": -24.69587516784668, "global_step": 317487, "epoch": 3825} {"train_loss": -24.2011775970459, "global_step": 317488, "epoch": 3825} {"train_loss": -24.77630043029785, "global_step": 317489, "epoch": 3825} {"train_loss": -24.69232177734375, "global_step": 317490, "epoch": 3825} {"train_loss": -24.640724182128906, "global_step": 317491, "epoch": 3825} {"train_loss": -24.580692291259766, "global_step": 317492, "epoch": 3825} {"train_loss": -24.30483055114746, "global_step": 317493, "epoch": 3825} {"train_loss": -24.733016967773438, "global_step": 317494, "epoch": 3825} {"train_loss": -24.955005645751953, "global_step": 317495, "epoch": 3825} {"train_loss": -24.75552749633789, "global_step": 317496, "epoch": 3825} {"train_loss": -25.063106536865234, "global_step": 317497, "epoch": 3825} {"train_loss": -25.131818771362305, "global_step": 317498, "epoch": 3825} {"train_loss": -25.396203994750977, "global_step": 317499, "epoch": 3825} {"train_loss": -25.027698516845703, "global_step": 317500, "epoch": 3825} {"train_loss": -25.458803176879883, "global_step": 317501, "epoch": 3825} {"train_loss": -25.1313533782959, "global_step": 317502, "epoch": 3825} {"train_loss": -25.513328552246094, "global_step": 317503, "epoch": 3825} {"train_loss": -25.26177978515625, "global_step": 317504, "epoch": 3825} {"train_loss": -25.212167739868164, "global_step": 317505, "epoch": 3825} {"train_loss": -25.616674423217773, "global_step": 317506, "epoch": 3825} {"train_loss": -25.50758934020996, "global_step": 317507, "epoch": 3825} {"train_loss": -25.603174209594727, "global_step": 317508, "epoch": 3825} {"train_loss": -25.28696060180664, "global_step": 317509, "epoch": 3825} {"train_loss": -25.465532302856445, "global_step": 317510, "epoch": 3825} {"train_loss": -25.429304122924805, "global_step": 317511, "epoch": 3825} {"train_loss": -25.6224365234375, "global_step": 317512, "epoch": 3825} {"train_loss": -25.53487205505371, "global_step": 317513, "epoch": 3825} {"train_loss": -25.656644821166992, "global_step": 317514, "epoch": 3825} {"train_loss": -25.95145034790039, "global_step": 317515, "epoch": 3825} {"train_loss": -25.543851852416992, "global_step": 317516, "epoch": 3825} {"train_loss": -25.86960792541504, "global_step": 317517, "epoch": 3825} {"train_loss": -26.3109130859375, "global_step": 317518, "epoch": 3825} {"train_loss": -25.818933486938477, "global_step": 317519, "epoch": 3825} {"train_loss": -25.859045028686523, "global_step": 317520, "epoch": 3825} {"train_loss": -25.82557487487793, "global_step": 317521, "epoch": 3825} {"train_loss": -26.005359649658203, "global_step": 317522, "epoch": 3825} {"train_loss": -25.753164291381836, "global_step": 317523, "epoch": 3825} {"train_loss": -25.82073974609375, "global_step": 317524, "epoch": 3825} {"train_loss": -25.426050186157227, "global_step": 317525, "epoch": 3825} {"train_loss": -26.1312255859375, "global_step": 317526, "epoch": 3825} {"train_loss": -25.79901123046875, "global_step": 317527, "epoch": 3825} {"train_loss": -25.781946182250977, "global_step": 317528, "epoch": 3825} {"train_loss": -26.024763107299805, "global_step": 317529, "epoch": 3825} {"train_loss": -25.95733070373535, "global_step": 317530, "epoch": 3825} {"train_loss": -26.09588050842285, "global_step": 317531, "epoch": 3825} {"train_loss": -25.71384620666504, "global_step": 317532, "epoch": 3825} {"train_loss": -25.961652755737305, "global_step": 317533, "epoch": 3825} {"train_loss": -25.843170166015625, "global_step": 317534, "epoch": 3825} {"train_loss": -25.636083602905273, "global_step": 317535, "epoch": 3825} {"train_loss": -26.484546661376953, "global_step": 317536, "epoch": 3825} {"train_loss": -25.726163864135742, "global_step": 317537, "epoch": 3825} {"train_loss": -25.53376579284668, "global_step": 317538, "epoch": 3825} {"train_loss": -25.517322540283203, "global_step": 317539, "epoch": 3825} {"train_loss": -26.05152702331543, "global_step": 317540, "epoch": 3825} {"train_loss": -26.027606964111328, "global_step": 317541, "epoch": 3825} {"train_loss": -25.610626220703125, "global_step": 317542, "epoch": 3825} {"train_loss": -26.017465591430664, "global_step": 317543, "epoch": 3825} {"train_loss": -25.91891860961914, "global_step": 317544, "epoch": 3825} {"train_loss": -25.641942977905273, "global_step": 317545, "epoch": 3825} {"train_loss": -25.5450439453125, "global_step": 317546, "epoch": 3825} {"train_loss": -25.530691146850586, "global_step": 317547, "epoch": 3825} {"train_loss": -25.651992797851562, "global_step": 317548, "epoch": 3825} {"train_loss": -25.694904327392578, "global_step": 317549, "epoch": 3825} {"train_loss": -26.284555435180664, "global_step": 317550, "epoch": 3825} {"train_loss": -25.95777702331543, "global_step": 317551, "epoch": 3825} {"train_loss": -26.2127628326416, "global_step": 317552, "epoch": 3825} {"train_loss": -25.98929786682129, "global_step": 317553, "epoch": 3825} {"train_loss": -26.18121910095215, "global_step": 317554, "epoch": 3825} {"train_loss": -26.142902374267578, "global_step": 317555, "epoch": 3825} {"train_loss": -25.891162872314453, "global_step": 317556, "epoch": 3825} {"train_loss": -25.39971409073795, "global_step": 317557, "epoch": 3825, "val_loss": 7323157.0} {"train_loss": -25.392127990722656, "global_step": 317558, "epoch": 3826} {"train_loss": -25.614948272705078, "global_step": 317559, "epoch": 3826} {"train_loss": -25.317718505859375, "global_step": 317560, "epoch": 3826} {"train_loss": -25.165693283081055, "global_step": 317561, "epoch": 3826} {"train_loss": -25.57948112487793, "global_step": 317562, "epoch": 3826} {"train_loss": -25.610960006713867, "global_step": 317563, "epoch": 3826} {"train_loss": -25.46307945251465, "global_step": 317564, "epoch": 3826} {"train_loss": -25.679229736328125, "global_step": 317565, "epoch": 3826} {"train_loss": -26.154876708984375, "global_step": 317566, "epoch": 3826} {"train_loss": -25.828771591186523, "global_step": 317567, "epoch": 3826} {"train_loss": -25.581520080566406, "global_step": 317568, "epoch": 3826} {"train_loss": -25.454021453857422, "global_step": 317569, "epoch": 3826} {"train_loss": -25.826725006103516, "global_step": 317570, "epoch": 3826} {"train_loss": -25.63224220275879, "global_step": 317571, "epoch": 3826} {"train_loss": -25.927448272705078, "global_step": 317572, "epoch": 3826} {"train_loss": -25.72247886657715, "global_step": 317573, "epoch": 3826} {"train_loss": -26.115671157836914, "global_step": 317574, "epoch": 3826} {"train_loss": -25.733362197875977, "global_step": 317575, "epoch": 3826} {"train_loss": -25.75177574157715, "global_step": 317576, "epoch": 3826} {"train_loss": -25.6453857421875, "global_step": 317577, "epoch": 3826} {"train_loss": -26.112768173217773, "global_step": 317578, "epoch": 3826} {"train_loss": -26.207107543945312, "global_step": 317579, "epoch": 3826} {"train_loss": -26.059843063354492, "global_step": 317580, "epoch": 3826} {"train_loss": -25.839340209960938, "global_step": 317581, "epoch": 3826} {"train_loss": -25.9423885345459, "global_step": 317582, "epoch": 3826} {"train_loss": -25.572471618652344, "global_step": 317583, "epoch": 3826} {"train_loss": -25.915725708007812, "global_step": 317584, "epoch": 3826} {"train_loss": -25.8343448638916, "global_step": 317585, "epoch": 3826} {"train_loss": -26.064014434814453, "global_step": 317586, "epoch": 3826} {"train_loss": -26.08279800415039, "global_step": 317587, "epoch": 3826} {"train_loss": -25.745040893554688, "global_step": 317588, "epoch": 3826} {"train_loss": -25.45064353942871, "global_step": 317589, "epoch": 3826} {"train_loss": -25.936059951782227, "global_step": 317590, "epoch": 3826} {"train_loss": -25.669677734375, "global_step": 317591, "epoch": 3826} {"train_loss": -25.443214416503906, "global_step": 317592, "epoch": 3826} {"train_loss": -25.750019073486328, "global_step": 317593, "epoch": 3826} {"train_loss": -25.721927642822266, "global_step": 317594, "epoch": 3826} {"train_loss": -25.79621696472168, "global_step": 317595, "epoch": 3826} {"train_loss": -25.519058227539062, "global_step": 317596, "epoch": 3826} {"train_loss": -25.51873016357422, "global_step": 317597, "epoch": 3826} {"train_loss": -25.6789493560791, "global_step": 317598, "epoch": 3826} {"train_loss": -25.824966430664062, "global_step": 317599, "epoch": 3826} {"train_loss": -25.849328994750977, "global_step": 317600, "epoch": 3826} {"train_loss": -25.608976364135742, "global_step": 317601, "epoch": 3826} {"train_loss": -25.654279708862305, "global_step": 317602, "epoch": 3826} {"train_loss": -25.836139678955078, "global_step": 317603, "epoch": 3826} {"train_loss": -25.860614776611328, "global_step": 317604, "epoch": 3826} {"train_loss": -25.935956954956055, "global_step": 317605, "epoch": 3826} {"train_loss": -25.602502822875977, "global_step": 317606, "epoch": 3826} {"train_loss": -25.932178497314453, "global_step": 317607, "epoch": 3826} {"train_loss": -26.212305068969727, "global_step": 317608, "epoch": 3826} {"train_loss": -26.23016929626465, "global_step": 317609, "epoch": 3826} {"train_loss": -25.867948532104492, "global_step": 317610, "epoch": 3826} {"train_loss": -25.581884384155273, "global_step": 317611, "epoch": 3826} {"train_loss": -25.716495513916016, "global_step": 317612, "epoch": 3826} {"train_loss": -26.181360244750977, "global_step": 317613, "epoch": 3826} {"train_loss": -25.69977378845215, "global_step": 317614, "epoch": 3826} {"train_loss": -25.98652458190918, "global_step": 317615, "epoch": 3826} {"train_loss": -26.109649658203125, "global_step": 317616, "epoch": 3826} {"train_loss": -26.008817672729492, "global_step": 317617, "epoch": 3826} {"train_loss": -25.957355499267578, "global_step": 317618, "epoch": 3826} {"train_loss": -25.67535400390625, "global_step": 317619, "epoch": 3826} {"train_loss": -25.904829025268555, "global_step": 317620, "epoch": 3826} {"train_loss": -25.59458351135254, "global_step": 317621, "epoch": 3826} {"train_loss": -25.888708114624023, "global_step": 317622, "epoch": 3826} {"train_loss": -26.031814575195312, "global_step": 317623, "epoch": 3826} {"train_loss": -26.0494327545166, "global_step": 317624, "epoch": 3826} {"train_loss": -25.83306312561035, "global_step": 317625, "epoch": 3826} {"train_loss": -25.669925689697266, "global_step": 317626, "epoch": 3826} {"train_loss": -25.86602210998535, "global_step": 317627, "epoch": 3826} {"train_loss": -26.104543685913086, "global_step": 317628, "epoch": 3826} {"train_loss": -25.5988826751709, "global_step": 317629, "epoch": 3826} {"train_loss": -25.659875869750977, "global_step": 317630, "epoch": 3826} {"train_loss": -25.677505493164062, "global_step": 317631, "epoch": 3826} {"train_loss": -25.81158447265625, "global_step": 317632, "epoch": 3826} {"train_loss": -25.865568161010742, "global_step": 317633, "epoch": 3826} {"train_loss": -26.044189453125, "global_step": 317634, "epoch": 3826} {"train_loss": -25.74302101135254, "global_step": 317635, "epoch": 3826} {"train_loss": -25.82014274597168, "global_step": 317636, "epoch": 3826} {"train_loss": -25.551050186157227, "global_step": 317637, "epoch": 3826} {"train_loss": -25.8848876953125, "global_step": 317638, "epoch": 3826} {"train_loss": -25.867511749267578, "global_step": 317639, "epoch": 3826} {"train_loss": -25.791676831532673, "global_step": 317640, "epoch": 3826, "val_loss": 7349864.5} {"train_loss": -25.168045043945312, "global_step": 317641, "epoch": 3827} {"train_loss": -25.447954177856445, "global_step": 317642, "epoch": 3827} {"train_loss": -25.08803367614746, "global_step": 317643, "epoch": 3827} {"train_loss": -24.807411193847656, "global_step": 317644, "epoch": 3827} {"train_loss": -25.12240219116211, "global_step": 317645, "epoch": 3827} {"train_loss": -25.0040340423584, "global_step": 317646, "epoch": 3827} {"train_loss": -25.271177291870117, "global_step": 317647, "epoch": 3827} {"train_loss": -25.095813751220703, "global_step": 317648, "epoch": 3827} {"train_loss": -25.59267234802246, "global_step": 317649, "epoch": 3827} {"train_loss": -25.220911026000977, "global_step": 317650, "epoch": 3827} {"train_loss": -25.247129440307617, "global_step": 317651, "epoch": 3827} {"train_loss": -25.73660659790039, "global_step": 317652, "epoch": 3827} {"train_loss": -25.322734832763672, "global_step": 317653, "epoch": 3827} {"train_loss": -25.58123779296875, "global_step": 317654, "epoch": 3827} {"train_loss": -25.586395263671875, "global_step": 317655, "epoch": 3827} {"train_loss": -25.21564483642578, "global_step": 317656, "epoch": 3827} {"train_loss": -25.476715087890625, "global_step": 317657, "epoch": 3827} {"train_loss": -25.263713836669922, "global_step": 317658, "epoch": 3827} {"train_loss": -25.786779403686523, "global_step": 317659, "epoch": 3827} {"train_loss": -25.337867736816406, "global_step": 317660, "epoch": 3827} {"train_loss": -25.57736587524414, "global_step": 317661, "epoch": 3827} {"train_loss": -25.00909423828125, "global_step": 317662, "epoch": 3827} {"train_loss": -25.829334259033203, "global_step": 317663, "epoch": 3827} {"train_loss": -25.80169105529785, "global_step": 317664, "epoch": 3827} {"train_loss": -25.652633666992188, "global_step": 317665, "epoch": 3827} {"train_loss": -25.384870529174805, "global_step": 317666, "epoch": 3827} {"train_loss": -25.69073486328125, "global_step": 317667, "epoch": 3827} {"train_loss": -26.154376983642578, "global_step": 317668, "epoch": 3827} {"train_loss": -25.401611328125, "global_step": 317669, "epoch": 3827} {"train_loss": -26.121673583984375, "global_step": 317670, "epoch": 3827} {"train_loss": -25.768203735351562, "global_step": 317671, "epoch": 3827} {"train_loss": -25.854772567749023, "global_step": 317672, "epoch": 3827} {"train_loss": -25.751981735229492, "global_step": 317673, "epoch": 3827} {"train_loss": -26.11387062072754, "global_step": 317674, "epoch": 3827} {"train_loss": -26.007612228393555, "global_step": 317675, "epoch": 3827} {"train_loss": -26.132028579711914, "global_step": 317676, "epoch": 3827} {"train_loss": -25.772165298461914, "global_step": 317677, "epoch": 3827} {"train_loss": -25.893400192260742, "global_step": 317678, "epoch": 3827} {"train_loss": -25.79367446899414, "global_step": 317679, "epoch": 3827} {"train_loss": -26.01814842224121, "global_step": 317680, "epoch": 3827} {"train_loss": -26.277814865112305, "global_step": 317681, "epoch": 3827} {"train_loss": -25.857013702392578, "global_step": 317682, "epoch": 3827} {"train_loss": -25.947965621948242, "global_step": 317683, "epoch": 3827} {"train_loss": -26.269287109375, "global_step": 317684, "epoch": 3827} {"train_loss": -25.593673706054688, "global_step": 317685, "epoch": 3827} {"train_loss": -25.886022567749023, "global_step": 317686, "epoch": 3827} {"train_loss": -26.252405166625977, "global_step": 317687, "epoch": 3827} {"train_loss": -26.109012603759766, "global_step": 317688, "epoch": 3827} {"train_loss": -25.831073760986328, "global_step": 317689, "epoch": 3827} {"train_loss": -25.90212059020996, "global_step": 317690, "epoch": 3827} {"train_loss": -25.73789405822754, "global_step": 317691, "epoch": 3827} {"train_loss": -25.788827896118164, "global_step": 317692, "epoch": 3827} {"train_loss": -25.41897964477539, "global_step": 317693, "epoch": 3827} {"train_loss": -25.35321617126465, "global_step": 317694, "epoch": 3827} {"train_loss": -25.674619674682617, "global_step": 317695, "epoch": 3827} {"train_loss": -24.992046356201172, "global_step": 317696, "epoch": 3827} {"train_loss": -24.85628318786621, "global_step": 317697, "epoch": 3827} {"train_loss": -25.064924240112305, "global_step": 317698, "epoch": 3827} {"train_loss": -25.128555297851562, "global_step": 317699, "epoch": 3827} {"train_loss": -25.988855361938477, "global_step": 317700, "epoch": 3827} {"train_loss": -25.369136810302734, "global_step": 317701, "epoch": 3827} {"train_loss": -25.565624237060547, "global_step": 317702, "epoch": 3827} {"train_loss": -25.555789947509766, "global_step": 317703, "epoch": 3827} {"train_loss": -25.636266708374023, "global_step": 317704, "epoch": 3827} {"train_loss": -25.690053939819336, "global_step": 317705, "epoch": 3827} {"train_loss": -25.643247604370117, "global_step": 317706, "epoch": 3827} {"train_loss": -25.618749618530273, "global_step": 317707, "epoch": 3827} {"train_loss": -25.59656524658203, "global_step": 317708, "epoch": 3827} {"train_loss": -25.8348331451416, "global_step": 317709, "epoch": 3827} {"train_loss": -25.440052032470703, "global_step": 317710, "epoch": 3827} {"train_loss": -25.8654842376709, "global_step": 317711, "epoch": 3827} {"train_loss": -25.892526626586914, "global_step": 317712, "epoch": 3827} {"train_loss": -25.86944007873535, "global_step": 317713, "epoch": 3827} {"train_loss": -25.73798942565918, "global_step": 317714, "epoch": 3827} {"train_loss": -25.765710830688477, "global_step": 317715, "epoch": 3827} {"train_loss": -25.865314483642578, "global_step": 317716, "epoch": 3827} {"train_loss": -25.70012855529785, "global_step": 317717, "epoch": 3827} {"train_loss": -25.767934799194336, "global_step": 317718, "epoch": 3827} {"train_loss": -25.655317306518555, "global_step": 317719, "epoch": 3827} {"train_loss": -25.97519874572754, "global_step": 317720, "epoch": 3827} {"train_loss": -25.684101104736328, "global_step": 317721, "epoch": 3827} {"train_loss": -26.06072998046875, "global_step": 317722, "epoch": 3827} {"train_loss": -25.633513898734588, "global_step": 317723, "epoch": 3827, "val_loss": 7258899.0} {"train_loss": -25.82185935974121, "global_step": 317724, "epoch": 3828} {"train_loss": -25.993741989135742, "global_step": 317725, "epoch": 3828} {"train_loss": -26.007837295532227, "global_step": 317726, "epoch": 3828} {"train_loss": -26.297351837158203, "global_step": 317727, "epoch": 3828} {"train_loss": -26.020017623901367, "global_step": 317728, "epoch": 3828} {"train_loss": -25.67621421813965, "global_step": 317729, "epoch": 3828} {"train_loss": -25.819177627563477, "global_step": 317730, "epoch": 3828} {"train_loss": -26.024667739868164, "global_step": 317731, "epoch": 3828} {"train_loss": -25.509662628173828, "global_step": 317732, "epoch": 3828} {"train_loss": -25.762983322143555, "global_step": 317733, "epoch": 3828} {"train_loss": -25.97732925415039, "global_step": 317734, "epoch": 3828} {"train_loss": -25.698877334594727, "global_step": 317735, "epoch": 3828} {"train_loss": -26.191497802734375, "global_step": 317736, "epoch": 3828} {"train_loss": -25.703561782836914, "global_step": 317737, "epoch": 3828} {"train_loss": -25.59102439880371, "global_step": 317738, "epoch": 3828} {"train_loss": -25.914234161376953, "global_step": 317739, "epoch": 3828} {"train_loss": -25.518178939819336, "global_step": 317740, "epoch": 3828} {"train_loss": -25.65581703186035, "global_step": 317741, "epoch": 3828} {"train_loss": -26.100875854492188, "global_step": 317742, "epoch": 3828} {"train_loss": -26.034692764282227, "global_step": 317743, "epoch": 3828} {"train_loss": -25.74909019470215, "global_step": 317744, "epoch": 3828} {"train_loss": -26.204437255859375, "global_step": 317745, "epoch": 3828} {"train_loss": -26.015090942382812, "global_step": 317746, "epoch": 3828} {"train_loss": -26.306211471557617, "global_step": 317747, "epoch": 3828} {"train_loss": -26.271005630493164, "global_step": 317748, "epoch": 3828} {"train_loss": -25.9675350189209, "global_step": 317749, "epoch": 3828} {"train_loss": -25.595407485961914, "global_step": 317750, "epoch": 3828} {"train_loss": -26.07379150390625, "global_step": 317751, "epoch": 3828} {"train_loss": -26.12408447265625, "global_step": 317752, "epoch": 3828} {"train_loss": -25.958240509033203, "global_step": 317753, "epoch": 3828} {"train_loss": -26.05079460144043, "global_step": 317754, "epoch": 3828} {"train_loss": -25.87196922302246, "global_step": 317755, "epoch": 3828} {"train_loss": -25.6021785736084, "global_step": 317756, "epoch": 3828} {"train_loss": -26.115392684936523, "global_step": 317757, "epoch": 3828} {"train_loss": -25.82158851623535, "global_step": 317758, "epoch": 3828} {"train_loss": -25.225738525390625, "global_step": 317759, "epoch": 3828} {"train_loss": -25.762975692749023, "global_step": 317760, "epoch": 3828} {"train_loss": -25.730222702026367, "global_step": 317761, "epoch": 3828} {"train_loss": -25.787399291992188, "global_step": 317762, "epoch": 3828} {"train_loss": -25.63981056213379, "global_step": 317763, "epoch": 3828} {"train_loss": -25.241918563842773, "global_step": 317764, "epoch": 3828} {"train_loss": -25.136762619018555, "global_step": 317765, "epoch": 3828} {"train_loss": -26.158838272094727, "global_step": 317766, "epoch": 3828} {"train_loss": -25.611148834228516, "global_step": 317767, "epoch": 3828} {"train_loss": -25.366613388061523, "global_step": 317768, "epoch": 3828} {"train_loss": -25.6080379486084, "global_step": 317769, "epoch": 3828} {"train_loss": -25.24553871154785, "global_step": 317770, "epoch": 3828} {"train_loss": -25.840442657470703, "global_step": 317771, "epoch": 3828} {"train_loss": -25.42887306213379, "global_step": 317772, "epoch": 3828} {"train_loss": -25.97869873046875, "global_step": 317773, "epoch": 3828} {"train_loss": -25.679712295532227, "global_step": 317774, "epoch": 3828} {"train_loss": -25.256994247436523, "global_step": 317775, "epoch": 3828} {"train_loss": -25.779560089111328, "global_step": 317776, "epoch": 3828} {"train_loss": -25.645673751831055, "global_step": 317777, "epoch": 3828} {"train_loss": -25.940692901611328, "global_step": 317778, "epoch": 3828} {"train_loss": -25.3950252532959, "global_step": 317779, "epoch": 3828} {"train_loss": -25.796842575073242, "global_step": 317780, "epoch": 3828} {"train_loss": -26.081125259399414, "global_step": 317781, "epoch": 3828} {"train_loss": -25.695226669311523, "global_step": 317782, "epoch": 3828} {"train_loss": -25.3833065032959, "global_step": 317783, "epoch": 3828} {"train_loss": -25.71467399597168, "global_step": 317784, "epoch": 3828} {"train_loss": -25.89588737487793, "global_step": 317785, "epoch": 3828} {"train_loss": -25.670795440673828, "global_step": 317786, "epoch": 3828} {"train_loss": -25.870563507080078, "global_step": 317787, "epoch": 3828} {"train_loss": -26.06699562072754, "global_step": 317788, "epoch": 3828} {"train_loss": -25.607572555541992, "global_step": 317789, "epoch": 3828} {"train_loss": -25.630720138549805, "global_step": 317790, "epoch": 3828} {"train_loss": -25.965234756469727, "global_step": 317791, "epoch": 3828} {"train_loss": -25.520631790161133, "global_step": 317792, "epoch": 3828} {"train_loss": -25.520450592041016, "global_step": 317793, "epoch": 3828} {"train_loss": -25.478940963745117, "global_step": 317794, "epoch": 3828} {"train_loss": -25.963226318359375, "global_step": 317795, "epoch": 3828} {"train_loss": -25.276729583740234, "global_step": 317796, "epoch": 3828} {"train_loss": -25.789688110351562, "global_step": 317797, "epoch": 3828} {"train_loss": -25.739965438842773, "global_step": 317798, "epoch": 3828} {"train_loss": -26.052539825439453, "global_step": 317799, "epoch": 3828} {"train_loss": -25.755441665649414, "global_step": 317800, "epoch": 3828} {"train_loss": -25.384702682495117, "global_step": 317801, "epoch": 3828} {"train_loss": -26.122211456298828, "global_step": 317802, "epoch": 3828} {"train_loss": -25.903966903686523, "global_step": 317803, "epoch": 3828} {"train_loss": -25.714086532592773, "global_step": 317804, "epoch": 3828} {"train_loss": -25.58622932434082, "global_step": 317805, "epoch": 3828} {"train_loss": -25.756400878170886, "global_step": 317806, "epoch": 3828, "val_loss": 7189934.5} {"train_loss": -25.14681053161621, "global_step": 317807, "epoch": 3829} {"train_loss": -24.917037963867188, "global_step": 317808, "epoch": 3829} {"train_loss": -25.595413208007812, "global_step": 317809, "epoch": 3829} {"train_loss": -25.1422119140625, "global_step": 317810, "epoch": 3829} {"train_loss": -25.448781967163086, "global_step": 317811, "epoch": 3829} {"train_loss": -25.316238403320312, "global_step": 317812, "epoch": 3829} {"train_loss": -24.955188751220703, "global_step": 317813, "epoch": 3829} {"train_loss": -25.617639541625977, "global_step": 317814, "epoch": 3829} {"train_loss": -25.679285049438477, "global_step": 317815, "epoch": 3829} {"train_loss": -25.56390953063965, "global_step": 317816, "epoch": 3829} {"train_loss": -25.501522064208984, "global_step": 317817, "epoch": 3829} {"train_loss": -25.846261978149414, "global_step": 317818, "epoch": 3829} {"train_loss": -25.523462295532227, "global_step": 317819, "epoch": 3829} {"train_loss": -25.727869033813477, "global_step": 317820, "epoch": 3829} {"train_loss": -25.838764190673828, "global_step": 317821, "epoch": 3829} {"train_loss": -25.616540908813477, "global_step": 317822, "epoch": 3829} {"train_loss": -25.623905181884766, "global_step": 317823, "epoch": 3829} {"train_loss": -25.940723419189453, "global_step": 317824, "epoch": 3829} {"train_loss": -25.70768165588379, "global_step": 317825, "epoch": 3829} {"train_loss": -25.670446395874023, "global_step": 317826, "epoch": 3829} {"train_loss": -25.75339698791504, "global_step": 317827, "epoch": 3829} {"train_loss": -26.0640926361084, "global_step": 317828, "epoch": 3829} {"train_loss": -25.50864028930664, "global_step": 317829, "epoch": 3829} {"train_loss": -25.61940574645996, "global_step": 317830, "epoch": 3829} {"train_loss": -25.543455123901367, "global_step": 317831, "epoch": 3829} {"train_loss": -25.748334884643555, "global_step": 317832, "epoch": 3829} {"train_loss": -25.926111221313477, "global_step": 317833, "epoch": 3829} {"train_loss": -25.6525936126709, "global_step": 317834, "epoch": 3829} {"train_loss": -26.11398696899414, "global_step": 317835, "epoch": 3829} {"train_loss": -26.091520309448242, "global_step": 317836, "epoch": 3829} {"train_loss": -26.109729766845703, "global_step": 317837, "epoch": 3829} {"train_loss": -26.31328773498535, "global_step": 317838, "epoch": 3829} {"train_loss": -25.631200790405273, "global_step": 317839, "epoch": 3829} {"train_loss": -25.93812370300293, "global_step": 317840, "epoch": 3829} {"train_loss": -25.96378517150879, "global_step": 317841, "epoch": 3829} {"train_loss": -25.979032516479492, "global_step": 317842, "epoch": 3829} {"train_loss": -26.141096115112305, "global_step": 317843, "epoch": 3829} {"train_loss": -26.209638595581055, "global_step": 317844, "epoch": 3829} {"train_loss": -26.06842613220215, "global_step": 317845, "epoch": 3829} {"train_loss": -26.12285804748535, "global_step": 317846, "epoch": 3829} {"train_loss": -26.070220947265625, "global_step": 317847, "epoch": 3829} {"train_loss": -25.919925689697266, "global_step": 317848, "epoch": 3829} {"train_loss": -25.90705680847168, "global_step": 317849, "epoch": 3829} {"train_loss": -25.633153915405273, "global_step": 317850, "epoch": 3829} {"train_loss": -26.214231491088867, "global_step": 317851, "epoch": 3829} {"train_loss": -26.0366153717041, "global_step": 317852, "epoch": 3829} {"train_loss": -25.765674591064453, "global_step": 317853, "epoch": 3829} {"train_loss": -25.452423095703125, "global_step": 317854, "epoch": 3829} {"train_loss": -25.914167404174805, "global_step": 317855, "epoch": 3829} {"train_loss": -25.478025436401367, "global_step": 317856, "epoch": 3829} {"train_loss": -25.745227813720703, "global_step": 317857, "epoch": 3829} {"train_loss": -25.3249568939209, "global_step": 317858, "epoch": 3829} {"train_loss": -25.78106689453125, "global_step": 317859, "epoch": 3829} {"train_loss": -25.59426498413086, "global_step": 317860, "epoch": 3829} {"train_loss": -25.606491088867188, "global_step": 317861, "epoch": 3829} {"train_loss": -25.418581008911133, "global_step": 317862, "epoch": 3829} {"train_loss": -25.507583618164062, "global_step": 317863, "epoch": 3829} {"train_loss": -25.610395431518555, "global_step": 317864, "epoch": 3829} {"train_loss": -25.687030792236328, "global_step": 317865, "epoch": 3829} {"train_loss": -25.25670051574707, "global_step": 317866, "epoch": 3829} {"train_loss": -25.407724380493164, "global_step": 317867, "epoch": 3829} {"train_loss": -25.3407039642334, "global_step": 317868, "epoch": 3829} {"train_loss": -25.55450439453125, "global_step": 317869, "epoch": 3829} {"train_loss": -25.177490234375, "global_step": 317870, "epoch": 3829} {"train_loss": -25.8981990814209, "global_step": 317871, "epoch": 3829} {"train_loss": -25.475234985351562, "global_step": 317872, "epoch": 3829} {"train_loss": -25.635690689086914, "global_step": 317873, "epoch": 3829} {"train_loss": -25.998716354370117, "global_step": 317874, "epoch": 3829} {"train_loss": -25.435216903686523, "global_step": 317875, "epoch": 3829} {"train_loss": -25.709253311157227, "global_step": 317876, "epoch": 3829} {"train_loss": -25.52156639099121, "global_step": 317877, "epoch": 3829} {"train_loss": -25.762292861938477, "global_step": 317878, "epoch": 3829} {"train_loss": -25.66334342956543, "global_step": 317879, "epoch": 3829} {"train_loss": -25.57056999206543, "global_step": 317880, "epoch": 3829} {"train_loss": -25.825403213500977, "global_step": 317881, "epoch": 3829} {"train_loss": -25.531457901000977, "global_step": 317882, "epoch": 3829} {"train_loss": -25.445781707763672, "global_step": 317883, "epoch": 3829} {"train_loss": -25.749897003173828, "global_step": 317884, "epoch": 3829} {"train_loss": -25.54479217529297, "global_step": 317885, "epoch": 3829} {"train_loss": -25.887741088867188, "global_step": 317886, "epoch": 3829} {"train_loss": -25.371673583984375, "global_step": 317887, "epoch": 3829} {"train_loss": -25.551212310791016, "global_step": 317888, "epoch": 3829} {"train_loss": -25.674292460981622, "global_step": 317889, "epoch": 3829, "val_loss": 7340149.5} {"train_loss": -25.473730087280273, "global_step": 317890, "epoch": 3830} {"train_loss": -25.75941276550293, "global_step": 317891, "epoch": 3830} {"train_loss": -25.38458824157715, "global_step": 317892, "epoch": 3830} {"train_loss": -25.324359893798828, "global_step": 317893, "epoch": 3830} {"train_loss": -25.490812301635742, "global_step": 317894, "epoch": 3830} {"train_loss": -25.540081024169922, "global_step": 317895, "epoch": 3830} {"train_loss": -25.38475799560547, "global_step": 317896, "epoch": 3830} {"train_loss": -23.981088638305664, "global_step": 317897, "epoch": 3830} {"train_loss": -25.554609298706055, "global_step": 317898, "epoch": 3830} {"train_loss": -25.411584854125977, "global_step": 317899, "epoch": 3830} {"train_loss": -25.511398315429688, "global_step": 317900, "epoch": 3830} {"train_loss": -25.504047393798828, "global_step": 317901, "epoch": 3830} {"train_loss": -25.779394149780273, "global_step": 317902, "epoch": 3830} {"train_loss": -25.43756103515625, "global_step": 317903, "epoch": 3830} {"train_loss": -25.553863525390625, "global_step": 317904, "epoch": 3830} {"train_loss": -25.497146606445312, "global_step": 317905, "epoch": 3830} {"train_loss": -25.651702880859375, "global_step": 317906, "epoch": 3830} {"train_loss": -25.24713706970215, "global_step": 317907, "epoch": 3830} {"train_loss": -25.311017990112305, "global_step": 317908, "epoch": 3830} {"train_loss": -25.734790802001953, "global_step": 317909, "epoch": 3830} {"train_loss": -25.445220947265625, "global_step": 317910, "epoch": 3830} {"train_loss": -26.023046493530273, "global_step": 317911, "epoch": 3830} {"train_loss": -25.54550552368164, "global_step": 317912, "epoch": 3830} {"train_loss": -25.77088737487793, "global_step": 317913, "epoch": 3830} {"train_loss": -25.144983291625977, "global_step": 317914, "epoch": 3830} {"train_loss": -25.72651481628418, "global_step": 317915, "epoch": 3830} {"train_loss": -25.628620147705078, "global_step": 317916, "epoch": 3830} {"train_loss": -25.65887451171875, "global_step": 317917, "epoch": 3830} {"train_loss": -25.826730728149414, "global_step": 317918, "epoch": 3830} {"train_loss": -25.58267593383789, "global_step": 317919, "epoch": 3830} {"train_loss": -25.689483642578125, "global_step": 317920, "epoch": 3830} {"train_loss": -25.264142990112305, "global_step": 317921, "epoch": 3830} {"train_loss": -25.985692977905273, "global_step": 317922, "epoch": 3830} {"train_loss": -25.36172866821289, "global_step": 317923, "epoch": 3830} {"train_loss": -25.71809196472168, "global_step": 317924, "epoch": 3830} {"train_loss": -25.843793869018555, "global_step": 317925, "epoch": 3830} {"train_loss": -26.358367919921875, "global_step": 317926, "epoch": 3830} {"train_loss": -25.570226669311523, "global_step": 317927, "epoch": 3830} {"train_loss": -25.697986602783203, "global_step": 317928, "epoch": 3830} {"train_loss": -25.849475860595703, "global_step": 317929, "epoch": 3830} {"train_loss": -26.055936813354492, "global_step": 317930, "epoch": 3830} {"train_loss": -26.037519454956055, "global_step": 317931, "epoch": 3830} {"train_loss": -25.624591827392578, "global_step": 317932, "epoch": 3830} {"train_loss": -25.9294376373291, "global_step": 317933, "epoch": 3830} {"train_loss": -25.978199005126953, "global_step": 317934, "epoch": 3830} {"train_loss": -26.1218318939209, "global_step": 317935, "epoch": 3830} {"train_loss": -25.62613868713379, "global_step": 317936, "epoch": 3830} {"train_loss": -25.747629165649414, "global_step": 317937, "epoch": 3830} {"train_loss": -25.713117599487305, "global_step": 317938, "epoch": 3830} {"train_loss": -25.6392765045166, "global_step": 317939, "epoch": 3830} {"train_loss": -25.7585391998291, "global_step": 317940, "epoch": 3830} {"train_loss": -26.236059188842773, "global_step": 317941, "epoch": 3830} {"train_loss": -25.81941032409668, "global_step": 317942, "epoch": 3830} {"train_loss": -25.9141845703125, "global_step": 317943, "epoch": 3830} {"train_loss": -25.70855712890625, "global_step": 317944, "epoch": 3830} {"train_loss": -25.943988800048828, "global_step": 317945, "epoch": 3830} {"train_loss": -25.07660484313965, "global_step": 317946, "epoch": 3830} {"train_loss": -25.429479598999023, "global_step": 317947, "epoch": 3830} {"train_loss": -25.096771240234375, "global_step": 317948, "epoch": 3830} {"train_loss": -25.061426162719727, "global_step": 317949, "epoch": 3830} {"train_loss": -25.571096420288086, "global_step": 317950, "epoch": 3830} {"train_loss": -26.270801544189453, "global_step": 317951, "epoch": 3830} {"train_loss": -25.178180694580078, "global_step": 317952, "epoch": 3830} {"train_loss": -25.344223022460938, "global_step": 317953, "epoch": 3830} {"train_loss": -25.819095611572266, "global_step": 317954, "epoch": 3830} {"train_loss": -25.44584083557129, "global_step": 317955, "epoch": 3830} {"train_loss": -24.891820907592773, "global_step": 317956, "epoch": 3830} {"train_loss": -25.7867374420166, "global_step": 317957, "epoch": 3830} {"train_loss": -25.631757736206055, "global_step": 317958, "epoch": 3830} {"train_loss": -25.453767776489258, "global_step": 317959, "epoch": 3830} {"train_loss": -26.263843536376953, "global_step": 317960, "epoch": 3830} {"train_loss": -25.410276412963867, "global_step": 317961, "epoch": 3830} {"train_loss": -25.6508731842041, "global_step": 317962, "epoch": 3830} {"train_loss": -25.74334716796875, "global_step": 317963, "epoch": 3830} {"train_loss": -25.615798950195312, "global_step": 317964, "epoch": 3830} {"train_loss": -25.586807250976562, "global_step": 317965, "epoch": 3830} {"train_loss": -25.60137939453125, "global_step": 317966, "epoch": 3830} {"train_loss": -26.303152084350586, "global_step": 317967, "epoch": 3830} {"train_loss": -25.807897567749023, "global_step": 317968, "epoch": 3830} {"train_loss": -25.47383689880371, "global_step": 317969, "epoch": 3830} {"train_loss": -26.335229873657227, "global_step": 317970, "epoch": 3830} {"train_loss": -25.909154891967773, "global_step": 317971, "epoch": 3830} {"train_loss": -25.61458900175899, "global_step": 317972, "epoch": 3830, "val_loss": 7289454.0} {"train_loss": -25.31580352783203, "global_step": 317973, "epoch": 3831} {"train_loss": -25.202228546142578, "global_step": 317974, "epoch": 3831} {"train_loss": -25.156518936157227, "global_step": 317975, "epoch": 3831} {"train_loss": -25.44902229309082, "global_step": 317976, "epoch": 3831} {"train_loss": -25.217952728271484, "global_step": 317977, "epoch": 3831} {"train_loss": -25.290023803710938, "global_step": 317978, "epoch": 3831} {"train_loss": -25.3995304107666, "global_step": 317979, "epoch": 3831} {"train_loss": -25.769495010375977, "global_step": 317980, "epoch": 3831} {"train_loss": -25.222126007080078, "global_step": 317981, "epoch": 3831} {"train_loss": -25.440696716308594, "global_step": 317982, "epoch": 3831} {"train_loss": -25.55596351623535, "global_step": 317983, "epoch": 3831} {"train_loss": -25.403669357299805, "global_step": 317984, "epoch": 3831} {"train_loss": -25.52589988708496, "global_step": 317985, "epoch": 3831} {"train_loss": -25.431913375854492, "global_step": 317986, "epoch": 3831} {"train_loss": -25.57622718811035, "global_step": 317987, "epoch": 3831} {"train_loss": -25.723285675048828, "global_step": 317988, "epoch": 3831} {"train_loss": -25.72397232055664, "global_step": 317989, "epoch": 3831} {"train_loss": -25.698627471923828, "global_step": 317990, "epoch": 3831} {"train_loss": -25.96393394470215, "global_step": 317991, "epoch": 3831} {"train_loss": -25.669391632080078, "global_step": 317992, "epoch": 3831} {"train_loss": -25.665363311767578, "global_step": 317993, "epoch": 3831} {"train_loss": -25.828718185424805, "global_step": 317994, "epoch": 3831} {"train_loss": -25.59193229675293, "global_step": 317995, "epoch": 3831} {"train_loss": -25.97052001953125, "global_step": 317996, "epoch": 3831} {"train_loss": -25.60062599182129, "global_step": 317997, "epoch": 3831} {"train_loss": -25.9180908203125, "global_step": 317998, "epoch": 3831} {"train_loss": -25.838354110717773, "global_step": 317999, "epoch": 3831} {"train_loss": -25.847991943359375, "global_step": 318000, "epoch": 3831} {"train_loss": -25.927820205688477, "global_step": 318001, "epoch": 3831} {"train_loss": -26.082258224487305, "global_step": 318002, "epoch": 3831} {"train_loss": -26.010934829711914, "global_step": 318003, "epoch": 3831} {"train_loss": -25.86329460144043, "global_step": 318004, "epoch": 3831} {"train_loss": -25.741540908813477, "global_step": 318005, "epoch": 3831} {"train_loss": -25.82769203186035, "global_step": 318006, "epoch": 3831} {"train_loss": -25.458227157592773, "global_step": 318007, "epoch": 3831} {"train_loss": -25.843204498291016, "global_step": 318008, "epoch": 3831} {"train_loss": -25.97767448425293, "global_step": 318009, "epoch": 3831} {"train_loss": -25.59195327758789, "global_step": 318010, "epoch": 3831} {"train_loss": -25.42673683166504, "global_step": 318011, "epoch": 3831} {"train_loss": -25.72474479675293, "global_step": 318012, "epoch": 3831} {"train_loss": -25.70362663269043, "global_step": 318013, "epoch": 3831} {"train_loss": -25.93726921081543, "global_step": 318014, "epoch": 3831} {"train_loss": -25.67469596862793, "global_step": 318015, "epoch": 3831} {"train_loss": -25.627317428588867, "global_step": 318016, "epoch": 3831} {"train_loss": -25.13722801208496, "global_step": 318017, "epoch": 3831} {"train_loss": -25.746694564819336, "global_step": 318018, "epoch": 3831} {"train_loss": -25.7603816986084, "global_step": 318019, "epoch": 3831} {"train_loss": -25.485517501831055, "global_step": 318020, "epoch": 3831} {"train_loss": -25.16547393798828, "global_step": 318021, "epoch": 3831} {"train_loss": -25.696807861328125, "global_step": 318022, "epoch": 3831} {"train_loss": -25.498754501342773, "global_step": 318023, "epoch": 3831} {"train_loss": -25.825925827026367, "global_step": 318024, "epoch": 3831} {"train_loss": -25.518924713134766, "global_step": 318025, "epoch": 3831} {"train_loss": -25.43708610534668, "global_step": 318026, "epoch": 3831} {"train_loss": -25.205490112304688, "global_step": 318027, "epoch": 3831} {"train_loss": -25.703989028930664, "global_step": 318028, "epoch": 3831} {"train_loss": -25.49561309814453, "global_step": 318029, "epoch": 3831} {"train_loss": -26.08949089050293, "global_step": 318030, "epoch": 3831} {"train_loss": -25.727386474609375, "global_step": 318031, "epoch": 3831} {"train_loss": -25.395387649536133, "global_step": 318032, "epoch": 3831} {"train_loss": -25.7783203125, "global_step": 318033, "epoch": 3831} {"train_loss": -25.277822494506836, "global_step": 318034, "epoch": 3831} {"train_loss": -26.058673858642578, "global_step": 318035, "epoch": 3831} {"train_loss": -25.487445831298828, "global_step": 318036, "epoch": 3831} {"train_loss": -26.02351188659668, "global_step": 318037, "epoch": 3831} {"train_loss": -25.88958168029785, "global_step": 318038, "epoch": 3831} {"train_loss": -25.814237594604492, "global_step": 318039, "epoch": 3831} {"train_loss": -25.948881149291992, "global_step": 318040, "epoch": 3831} {"train_loss": -25.77471923828125, "global_step": 318041, "epoch": 3831} {"train_loss": -25.51397132873535, "global_step": 318042, "epoch": 3831} {"train_loss": -25.670331954956055, "global_step": 318043, "epoch": 3831} {"train_loss": -25.78081703186035, "global_step": 318044, "epoch": 3831} {"train_loss": -26.00372314453125, "global_step": 318045, "epoch": 3831} {"train_loss": -25.652734756469727, "global_step": 318046, "epoch": 3831} {"train_loss": -25.7144775390625, "global_step": 318047, "epoch": 3831} {"train_loss": -26.112085342407227, "global_step": 318048, "epoch": 3831} {"train_loss": -25.76129722595215, "global_step": 318049, "epoch": 3831} {"train_loss": -25.709442138671875, "global_step": 318050, "epoch": 3831} {"train_loss": -25.71119499206543, "global_step": 318051, "epoch": 3831} {"train_loss": -25.81085777282715, "global_step": 318052, "epoch": 3831} {"train_loss": -26.108081817626953, "global_step": 318053, "epoch": 3831} {"train_loss": -25.939773559570312, "global_step": 318054, "epoch": 3831} {"train_loss": -25.67095014273402, "global_step": 318055, "epoch": 3831, "val_loss": 7377490.0} {"train_loss": -24.848491668701172, "global_step": 318056, "epoch": 3832} {"train_loss": -25.10111427307129, "global_step": 318057, "epoch": 3832} {"train_loss": -24.875158309936523, "global_step": 318058, "epoch": 3832} {"train_loss": -25.419036865234375, "global_step": 318059, "epoch": 3832} {"train_loss": -24.695751190185547, "global_step": 318060, "epoch": 3832} {"train_loss": -25.216297149658203, "global_step": 318061, "epoch": 3832} {"train_loss": -25.124990463256836, "global_step": 318062, "epoch": 3832} {"train_loss": -25.36178207397461, "global_step": 318063, "epoch": 3832} {"train_loss": -25.010709762573242, "global_step": 318064, "epoch": 3832} {"train_loss": -25.50339126586914, "global_step": 318065, "epoch": 3832} {"train_loss": -24.962669372558594, "global_step": 318066, "epoch": 3832} {"train_loss": -25.20659828186035, "global_step": 318067, "epoch": 3832} {"train_loss": -25.66340446472168, "global_step": 318068, "epoch": 3832} {"train_loss": -25.302440643310547, "global_step": 318069, "epoch": 3832} {"train_loss": -25.35005760192871, "global_step": 318070, "epoch": 3832} {"train_loss": -25.933109283447266, "global_step": 318071, "epoch": 3832} {"train_loss": -25.738962173461914, "global_step": 318072, "epoch": 3832} {"train_loss": -25.373624801635742, "global_step": 318073, "epoch": 3832} {"train_loss": -25.682722091674805, "global_step": 318074, "epoch": 3832} {"train_loss": -25.55470085144043, "global_step": 318075, "epoch": 3832} {"train_loss": -25.59579086303711, "global_step": 318076, "epoch": 3832} {"train_loss": -25.727787017822266, "global_step": 318077, "epoch": 3832} {"train_loss": -25.658843994140625, "global_step": 318078, "epoch": 3832} {"train_loss": -25.56015396118164, "global_step": 318079, "epoch": 3832} {"train_loss": -25.35675048828125, "global_step": 318080, "epoch": 3832} {"train_loss": -25.60953140258789, "global_step": 318081, "epoch": 3832} {"train_loss": -25.713397979736328, "global_step": 318082, "epoch": 3832} {"train_loss": -25.7785701751709, "global_step": 318083, "epoch": 3832} {"train_loss": -25.918676376342773, "global_step": 318084, "epoch": 3832} {"train_loss": -25.56716537475586, "global_step": 318085, "epoch": 3832} {"train_loss": -25.80427360534668, "global_step": 318086, "epoch": 3832} {"train_loss": -26.02606201171875, "global_step": 318087, "epoch": 3832} {"train_loss": -25.400707244873047, "global_step": 318088, "epoch": 3832} {"train_loss": -25.832141876220703, "global_step": 318089, "epoch": 3832} {"train_loss": -25.5750732421875, "global_step": 318090, "epoch": 3832} {"train_loss": -25.56985855102539, "global_step": 318091, "epoch": 3832} {"train_loss": -26.049457550048828, "global_step": 318092, "epoch": 3832} {"train_loss": -25.67340660095215, "global_step": 318093, "epoch": 3832} {"train_loss": -25.798965454101562, "global_step": 318094, "epoch": 3832} {"train_loss": -25.640066146850586, "global_step": 318095, "epoch": 3832} {"train_loss": -25.73557472229004, "global_step": 318096, "epoch": 3832} {"train_loss": -25.853271484375, "global_step": 318097, "epoch": 3832} {"train_loss": -26.27223777770996, "global_step": 318098, "epoch": 3832} {"train_loss": -25.981266021728516, "global_step": 318099, "epoch": 3832} {"train_loss": -26.083709716796875, "global_step": 318100, "epoch": 3832} {"train_loss": -26.117481231689453, "global_step": 318101, "epoch": 3832} {"train_loss": -25.568603515625, "global_step": 318102, "epoch": 3832} {"train_loss": -25.53017807006836, "global_step": 318103, "epoch": 3832} {"train_loss": -25.960119247436523, "global_step": 318104, "epoch": 3832} {"train_loss": -25.777057647705078, "global_step": 318105, "epoch": 3832} {"train_loss": -25.847631454467773, "global_step": 318106, "epoch": 3832} {"train_loss": -26.2652587890625, "global_step": 318107, "epoch": 3832} {"train_loss": -25.60141944885254, "global_step": 318108, "epoch": 3832} {"train_loss": -25.950550079345703, "global_step": 318109, "epoch": 3832} {"train_loss": -25.835874557495117, "global_step": 318110, "epoch": 3832} {"train_loss": -26.11224365234375, "global_step": 318111, "epoch": 3832} {"train_loss": -26.066272735595703, "global_step": 318112, "epoch": 3832} {"train_loss": -25.907819747924805, "global_step": 318113, "epoch": 3832} {"train_loss": -25.912763595581055, "global_step": 318114, "epoch": 3832} {"train_loss": -26.296018600463867, "global_step": 318115, "epoch": 3832} {"train_loss": -25.90492057800293, "global_step": 318116, "epoch": 3832} {"train_loss": -26.3271484375, "global_step": 318117, "epoch": 3832} {"train_loss": -25.64129066467285, "global_step": 318118, "epoch": 3832} {"train_loss": -26.14918327331543, "global_step": 318119, "epoch": 3832} {"train_loss": -26.091821670532227, "global_step": 318120, "epoch": 3832} {"train_loss": -25.901371002197266, "global_step": 318121, "epoch": 3832} {"train_loss": -26.08127212524414, "global_step": 318122, "epoch": 3832} {"train_loss": -25.78360939025879, "global_step": 318123, "epoch": 3832} {"train_loss": -26.08868980407715, "global_step": 318124, "epoch": 3832} {"train_loss": -25.66845703125, "global_step": 318125, "epoch": 3832} {"train_loss": -25.8917236328125, "global_step": 318126, "epoch": 3832} {"train_loss": -25.798498153686523, "global_step": 318127, "epoch": 3832} {"train_loss": -26.052051544189453, "global_step": 318128, "epoch": 3832} {"train_loss": -26.132938385009766, "global_step": 318129, "epoch": 3832} {"train_loss": -26.011341094970703, "global_step": 318130, "epoch": 3832} {"train_loss": -25.73419189453125, "global_step": 318131, "epoch": 3832} {"train_loss": -25.864704132080078, "global_step": 318132, "epoch": 3832} {"train_loss": -25.904714584350586, "global_step": 318133, "epoch": 3832} {"train_loss": -25.666213989257812, "global_step": 318134, "epoch": 3832} {"train_loss": -25.796911239624023, "global_step": 318135, "epoch": 3832} {"train_loss": -25.50471305847168, "global_step": 318136, "epoch": 3832} {"train_loss": -24.98607635498047, "global_step": 318137, "epoch": 3832} {"train_loss": -25.69686234715473, "global_step": 318138, "epoch": 3832, "val_loss": 7336316.0} {"train_loss": -25.14221954345703, "global_step": 318139, "epoch": 3833} {"train_loss": -25.336904525756836, "global_step": 318140, "epoch": 3833} {"train_loss": -25.230703353881836, "global_step": 318141, "epoch": 3833} {"train_loss": -25.48980140686035, "global_step": 318142, "epoch": 3833} {"train_loss": -25.372554779052734, "global_step": 318143, "epoch": 3833} {"train_loss": -25.287220001220703, "global_step": 318144, "epoch": 3833} {"train_loss": -25.073293685913086, "global_step": 318145, "epoch": 3833} {"train_loss": -25.094425201416016, "global_step": 318146, "epoch": 3833} {"train_loss": -25.119903564453125, "global_step": 318147, "epoch": 3833} {"train_loss": -25.226041793823242, "global_step": 318148, "epoch": 3833} {"train_loss": -25.5413875579834, "global_step": 318149, "epoch": 3833} {"train_loss": -24.90308952331543, "global_step": 318150, "epoch": 3833} {"train_loss": -25.45990562438965, "global_step": 318151, "epoch": 3833} {"train_loss": -25.573694229125977, "global_step": 318152, "epoch": 3833} {"train_loss": -25.639089584350586, "global_step": 318153, "epoch": 3833} {"train_loss": -25.59590721130371, "global_step": 318154, "epoch": 3833} {"train_loss": -25.6497802734375, "global_step": 318155, "epoch": 3833} {"train_loss": -25.6452693939209, "global_step": 318156, "epoch": 3833} {"train_loss": -25.364227294921875, "global_step": 318157, "epoch": 3833} {"train_loss": -25.8470401763916, "global_step": 318158, "epoch": 3833} {"train_loss": -26.005456924438477, "global_step": 318159, "epoch": 3833} {"train_loss": -25.68577003479004, "global_step": 318160, "epoch": 3833} {"train_loss": -25.775678634643555, "global_step": 318161, "epoch": 3833} {"train_loss": -25.379364013671875, "global_step": 318162, "epoch": 3833} {"train_loss": -25.834531784057617, "global_step": 318163, "epoch": 3833} {"train_loss": -25.619525909423828, "global_step": 318164, "epoch": 3833} {"train_loss": -25.6326961517334, "global_step": 318165, "epoch": 3833} {"train_loss": -25.85444450378418, "global_step": 318166, "epoch": 3833} {"train_loss": -25.856842041015625, "global_step": 318167, "epoch": 3833} {"train_loss": -26.066802978515625, "global_step": 318168, "epoch": 3833} {"train_loss": -26.129440307617188, "global_step": 318169, "epoch": 3833} {"train_loss": -25.91301918029785, "global_step": 318170, "epoch": 3833} {"train_loss": -25.700836181640625, "global_step": 318171, "epoch": 3833} {"train_loss": -26.218809127807617, "global_step": 318172, "epoch": 3833} {"train_loss": -26.075946807861328, "global_step": 318173, "epoch": 3833} {"train_loss": -25.99066162109375, "global_step": 318174, "epoch": 3833} {"train_loss": -25.84608268737793, "global_step": 318175, "epoch": 3833} {"train_loss": -25.910184860229492, "global_step": 318176, "epoch": 3833} {"train_loss": -25.681833267211914, "global_step": 318177, "epoch": 3833} {"train_loss": -25.875736236572266, "global_step": 318178, "epoch": 3833} {"train_loss": -26.02410316467285, "global_step": 318179, "epoch": 3833} {"train_loss": -26.121435165405273, "global_step": 318180, "epoch": 3833} {"train_loss": -26.326826095581055, "global_step": 318181, "epoch": 3833} {"train_loss": -26.313373565673828, "global_step": 318182, "epoch": 3833} {"train_loss": -25.761816024780273, "global_step": 318183, "epoch": 3833} {"train_loss": -26.190820693969727, "global_step": 318184, "epoch": 3833} {"train_loss": -26.163419723510742, "global_step": 318185, "epoch": 3833} {"train_loss": -26.007551193237305, "global_step": 318186, "epoch": 3833} {"train_loss": -26.027685165405273, "global_step": 318187, "epoch": 3833} {"train_loss": -25.925445556640625, "global_step": 318188, "epoch": 3833} {"train_loss": -25.973886489868164, "global_step": 318189, "epoch": 3833} {"train_loss": -25.918302536010742, "global_step": 318190, "epoch": 3833} {"train_loss": -25.9266414642334, "global_step": 318191, "epoch": 3833} {"train_loss": -25.85145378112793, "global_step": 318192, "epoch": 3833} {"train_loss": -25.630578994750977, "global_step": 318193, "epoch": 3833} {"train_loss": -25.965322494506836, "global_step": 318194, "epoch": 3833} {"train_loss": -25.841846466064453, "global_step": 318195, "epoch": 3833} {"train_loss": -25.80712890625, "global_step": 318196, "epoch": 3833} {"train_loss": -25.73517417907715, "global_step": 318197, "epoch": 3833} {"train_loss": -25.7074031829834, "global_step": 318198, "epoch": 3833} {"train_loss": -26.060810089111328, "global_step": 318199, "epoch": 3833} {"train_loss": -25.835559844970703, "global_step": 318200, "epoch": 3833} {"train_loss": -25.7134952545166, "global_step": 318201, "epoch": 3833} {"train_loss": -25.973697662353516, "global_step": 318202, "epoch": 3833} {"train_loss": -25.402860641479492, "global_step": 318203, "epoch": 3833} {"train_loss": -25.799240112304688, "global_step": 318204, "epoch": 3833} {"train_loss": -25.990676879882812, "global_step": 318205, "epoch": 3833} {"train_loss": -26.029895782470703, "global_step": 318206, "epoch": 3833} {"train_loss": -25.708993911743164, "global_step": 318207, "epoch": 3833} {"train_loss": -25.825841903686523, "global_step": 318208, "epoch": 3833} {"train_loss": -25.831710815429688, "global_step": 318209, "epoch": 3833} {"train_loss": -25.962247848510742, "global_step": 318210, "epoch": 3833} {"train_loss": -25.3531494140625, "global_step": 318211, "epoch": 3833} {"train_loss": -25.9799747467041, "global_step": 318212, "epoch": 3833} {"train_loss": -25.479421615600586, "global_step": 318213, "epoch": 3833} {"train_loss": -25.71072769165039, "global_step": 318214, "epoch": 3833} {"train_loss": -25.6145076751709, "global_step": 318215, "epoch": 3833} {"train_loss": -25.830366134643555, "global_step": 318216, "epoch": 3833} {"train_loss": -26.178668975830078, "global_step": 318217, "epoch": 3833} {"train_loss": -25.808216094970703, "global_step": 318218, "epoch": 3833} {"train_loss": -26.057355880737305, "global_step": 318219, "epoch": 3833} {"train_loss": -26.237333297729492, "global_step": 318220, "epoch": 3833} {"train_loss": -25.766909358013105, "global_step": 318221, "epoch": 3833, "val_loss": 7285950.0} {"train_loss": -25.535892486572266, "global_step": 318222, "epoch": 3834} {"train_loss": -25.357629776000977, "global_step": 318223, "epoch": 3834} {"train_loss": -25.016704559326172, "global_step": 318224, "epoch": 3834} {"train_loss": -25.472919464111328, "global_step": 318225, "epoch": 3834} {"train_loss": -25.854114532470703, "global_step": 318226, "epoch": 3834} {"train_loss": -25.449298858642578, "global_step": 318227, "epoch": 3834} {"train_loss": -25.4307918548584, "global_step": 318228, "epoch": 3834} {"train_loss": -25.103734970092773, "global_step": 318229, "epoch": 3834} {"train_loss": -25.76447868347168, "global_step": 318230, "epoch": 3834} {"train_loss": -25.650516510009766, "global_step": 318231, "epoch": 3834} {"train_loss": -25.732213973999023, "global_step": 318232, "epoch": 3834} {"train_loss": -25.559772491455078, "global_step": 318233, "epoch": 3834} {"train_loss": -25.65083122253418, "global_step": 318234, "epoch": 3834} {"train_loss": -25.683582305908203, "global_step": 318235, "epoch": 3834} {"train_loss": -25.706939697265625, "global_step": 318236, "epoch": 3834} {"train_loss": -25.302814483642578, "global_step": 318237, "epoch": 3834} {"train_loss": -26.070453643798828, "global_step": 318238, "epoch": 3834} {"train_loss": -25.690078735351562, "global_step": 318239, "epoch": 3834} {"train_loss": -25.94158935546875, "global_step": 318240, "epoch": 3834} {"train_loss": -25.56354522705078, "global_step": 318241, "epoch": 3834} {"train_loss": -25.69596290588379, "global_step": 318242, "epoch": 3834} {"train_loss": -25.900541305541992, "global_step": 318243, "epoch": 3834} {"train_loss": -26.02861976623535, "global_step": 318244, "epoch": 3834} {"train_loss": -26.24112892150879, "global_step": 318245, "epoch": 3834} {"train_loss": -25.737110137939453, "global_step": 318246, "epoch": 3834} {"train_loss": -26.03401756286621, "global_step": 318247, "epoch": 3834} {"train_loss": -25.521427154541016, "global_step": 318248, "epoch": 3834} {"train_loss": -25.92181968688965, "global_step": 318249, "epoch": 3834} {"train_loss": -26.028303146362305, "global_step": 318250, "epoch": 3834} {"train_loss": -25.645980834960938, "global_step": 318251, "epoch": 3834} {"train_loss": -26.01559829711914, "global_step": 318252, "epoch": 3834} {"train_loss": -26.011621475219727, "global_step": 318253, "epoch": 3834} {"train_loss": -26.073644638061523, "global_step": 318254, "epoch": 3834} {"train_loss": -25.68220329284668, "global_step": 318255, "epoch": 3834} {"train_loss": -25.753278732299805, "global_step": 318256, "epoch": 3834} {"train_loss": -26.240949630737305, "global_step": 318257, "epoch": 3834} {"train_loss": -25.449298858642578, "global_step": 318258, "epoch": 3834} {"train_loss": -25.915729522705078, "global_step": 318259, "epoch": 3834} {"train_loss": -26.046567916870117, "global_step": 318260, "epoch": 3834} {"train_loss": -25.956695556640625, "global_step": 318261, "epoch": 3834} {"train_loss": -25.869800567626953, "global_step": 318262, "epoch": 3834} {"train_loss": -25.87432861328125, "global_step": 318263, "epoch": 3834} {"train_loss": -26.040800094604492, "global_step": 318264, "epoch": 3834} {"train_loss": -26.085941314697266, "global_step": 318265, "epoch": 3834} {"train_loss": -25.85919189453125, "global_step": 318266, "epoch": 3834} {"train_loss": -25.685407638549805, "global_step": 318267, "epoch": 3834} {"train_loss": -24.74417495727539, "global_step": 318268, "epoch": 3834} {"train_loss": -25.7755126953125, "global_step": 318269, "epoch": 3834} {"train_loss": -24.601646423339844, "global_step": 318270, "epoch": 3834} {"train_loss": -25.511587142944336, "global_step": 318271, "epoch": 3834} {"train_loss": -25.246353149414062, "global_step": 318272, "epoch": 3834} {"train_loss": -25.4786434173584, "global_step": 318273, "epoch": 3834} {"train_loss": -24.88148307800293, "global_step": 318274, "epoch": 3834} {"train_loss": -25.48634147644043, "global_step": 318275, "epoch": 3834} {"train_loss": -25.32697868347168, "global_step": 318276, "epoch": 3834} {"train_loss": -25.23728370666504, "global_step": 318277, "epoch": 3834} {"train_loss": -25.499313354492188, "global_step": 318278, "epoch": 3834} {"train_loss": -25.311792373657227, "global_step": 318279, "epoch": 3834} {"train_loss": -25.85025978088379, "global_step": 318280, "epoch": 3834} {"train_loss": -25.562124252319336, "global_step": 318281, "epoch": 3834} {"train_loss": -25.56545066833496, "global_step": 318282, "epoch": 3834} {"train_loss": -25.56612777709961, "global_step": 318283, "epoch": 3834} {"train_loss": -25.642120361328125, "global_step": 318284, "epoch": 3834} {"train_loss": -25.5716495513916, "global_step": 318285, "epoch": 3834} {"train_loss": -25.848127365112305, "global_step": 318286, "epoch": 3834} {"train_loss": -25.80242347717285, "global_step": 318287, "epoch": 3834} {"train_loss": -25.958776473999023, "global_step": 318288, "epoch": 3834} {"train_loss": -25.439041137695312, "global_step": 318289, "epoch": 3834} {"train_loss": -25.66192626953125, "global_step": 318290, "epoch": 3834} {"train_loss": -25.741376876831055, "global_step": 318291, "epoch": 3834} {"train_loss": -26.288549423217773, "global_step": 318292, "epoch": 3834} {"train_loss": -25.79896354675293, "global_step": 318293, "epoch": 3834} {"train_loss": -25.6904239654541, "global_step": 318294, "epoch": 3834} {"train_loss": -25.712324142456055, "global_step": 318295, "epoch": 3834} {"train_loss": -26.045515060424805, "global_step": 318296, "epoch": 3834} {"train_loss": -25.83546257019043, "global_step": 318297, "epoch": 3834} {"train_loss": -25.9206485748291, "global_step": 318298, "epoch": 3834} {"train_loss": -26.02174186706543, "global_step": 318299, "epoch": 3834} {"train_loss": -25.9332275390625, "global_step": 318300, "epoch": 3834} {"train_loss": -25.84622573852539, "global_step": 318301, "epoch": 3834} {"train_loss": -26.02031898498535, "global_step": 318302, "epoch": 3834} {"train_loss": -26.022846221923828, "global_step": 318303, "epoch": 3834} {"train_loss": -25.712527585316852, "global_step": 318304, "epoch": 3834, "val_loss": 7297334.0} {"train_loss": -25.622900009155273, "global_step": 318305, "epoch": 3835} {"train_loss": -25.16987419128418, "global_step": 318306, "epoch": 3835} {"train_loss": -25.639678955078125, "global_step": 318307, "epoch": 3835} {"train_loss": -25.57779884338379, "global_step": 318308, "epoch": 3835} {"train_loss": -25.122968673706055, "global_step": 318309, "epoch": 3835} {"train_loss": -25.328998565673828, "global_step": 318310, "epoch": 3835} {"train_loss": -25.689252853393555, "global_step": 318311, "epoch": 3835} {"train_loss": -25.437345504760742, "global_step": 318312, "epoch": 3835} {"train_loss": -25.523862838745117, "global_step": 318313, "epoch": 3835} {"train_loss": -25.496395111083984, "global_step": 318314, "epoch": 3835} {"train_loss": -25.577232360839844, "global_step": 318315, "epoch": 3835} {"train_loss": -25.678312301635742, "global_step": 318316, "epoch": 3835} {"train_loss": -25.487525939941406, "global_step": 318317, "epoch": 3835} {"train_loss": -25.340246200561523, "global_step": 318318, "epoch": 3835} {"train_loss": -24.8116512298584, "global_step": 318319, "epoch": 3835} {"train_loss": -25.412246704101562, "global_step": 318320, "epoch": 3835} {"train_loss": -25.66507339477539, "global_step": 318321, "epoch": 3835} {"train_loss": -25.634912490844727, "global_step": 318322, "epoch": 3835} {"train_loss": -25.28525733947754, "global_step": 318323, "epoch": 3835} {"train_loss": -25.69727897644043, "global_step": 318324, "epoch": 3835} {"train_loss": -25.672195434570312, "global_step": 318325, "epoch": 3835} {"train_loss": -25.915653228759766, "global_step": 318326, "epoch": 3835} {"train_loss": -25.625385284423828, "global_step": 318327, "epoch": 3835} {"train_loss": -25.628753662109375, "global_step": 318328, "epoch": 3835} {"train_loss": -25.95035743713379, "global_step": 318329, "epoch": 3835} {"train_loss": -25.662445068359375, "global_step": 318330, "epoch": 3835} {"train_loss": -26.043731689453125, "global_step": 318331, "epoch": 3835} {"train_loss": -25.7812557220459, "global_step": 318332, "epoch": 3835} {"train_loss": -25.819644927978516, "global_step": 318333, "epoch": 3835} {"train_loss": -25.66225242614746, "global_step": 318334, "epoch": 3835} {"train_loss": -26.098724365234375, "global_step": 318335, "epoch": 3835} {"train_loss": -25.779150009155273, "global_step": 318336, "epoch": 3835} {"train_loss": -25.964801788330078, "global_step": 318337, "epoch": 3835} {"train_loss": -25.859609603881836, "global_step": 318338, "epoch": 3835} {"train_loss": -25.906457901000977, "global_step": 318339, "epoch": 3835} {"train_loss": -25.679141998291016, "global_step": 318340, "epoch": 3835} {"train_loss": -25.7310848236084, "global_step": 318341, "epoch": 3835} {"train_loss": -25.9632625579834, "global_step": 318342, "epoch": 3835} {"train_loss": -26.09320640563965, "global_step": 318343, "epoch": 3835} {"train_loss": -25.952062606811523, "global_step": 318344, "epoch": 3835} {"train_loss": -25.9867000579834, "global_step": 318345, "epoch": 3835} {"train_loss": -25.9582462310791, "global_step": 318346, "epoch": 3835} {"train_loss": -25.712390899658203, "global_step": 318347, "epoch": 3835} {"train_loss": -25.885473251342773, "global_step": 318348, "epoch": 3835} {"train_loss": -25.83615493774414, "global_step": 318349, "epoch": 3835} {"train_loss": -26.098196029663086, "global_step": 318350, "epoch": 3835} {"train_loss": -26.116117477416992, "global_step": 318351, "epoch": 3835} {"train_loss": -26.017393112182617, "global_step": 318352, "epoch": 3835} {"train_loss": -25.905420303344727, "global_step": 318353, "epoch": 3835} {"train_loss": -26.188634872436523, "global_step": 318354, "epoch": 3835} {"train_loss": -25.740217208862305, "global_step": 318355, "epoch": 3835} {"train_loss": -25.925384521484375, "global_step": 318356, "epoch": 3835} {"train_loss": -26.025028228759766, "global_step": 318357, "epoch": 3835} {"train_loss": -25.7844295501709, "global_step": 318358, "epoch": 3835} {"train_loss": -25.9696102142334, "global_step": 318359, "epoch": 3835} {"train_loss": -25.8673095703125, "global_step": 318360, "epoch": 3835} {"train_loss": -26.065343856811523, "global_step": 318361, "epoch": 3835} {"train_loss": -25.843524932861328, "global_step": 318362, "epoch": 3835} {"train_loss": -25.743738174438477, "global_step": 318363, "epoch": 3835} {"train_loss": -25.8822078704834, "global_step": 318364, "epoch": 3835} {"train_loss": -25.893835067749023, "global_step": 318365, "epoch": 3835} {"train_loss": -24.95261573791504, "global_step": 318366, "epoch": 3835} {"train_loss": -24.5233097076416, "global_step": 318367, "epoch": 3835} {"train_loss": -24.714248657226562, "global_step": 318368, "epoch": 3835} {"train_loss": -25.428571701049805, "global_step": 318369, "epoch": 3835} {"train_loss": -25.741357803344727, "global_step": 318370, "epoch": 3835} {"train_loss": -25.520856857299805, "global_step": 318371, "epoch": 3835} {"train_loss": -24.96399688720703, "global_step": 318372, "epoch": 3835} {"train_loss": -25.709463119506836, "global_step": 318373, "epoch": 3835} {"train_loss": -25.049667358398438, "global_step": 318374, "epoch": 3835} {"train_loss": -25.255218505859375, "global_step": 318375, "epoch": 3835} {"train_loss": -25.541330337524414, "global_step": 318376, "epoch": 3835} {"train_loss": -25.05829429626465, "global_step": 318377, "epoch": 3835} {"train_loss": -25.601423263549805, "global_step": 318378, "epoch": 3835} {"train_loss": -25.63425064086914, "global_step": 318379, "epoch": 3835} {"train_loss": -25.660276412963867, "global_step": 318380, "epoch": 3835} {"train_loss": -25.406259536743164, "global_step": 318381, "epoch": 3835} {"train_loss": -25.606225967407227, "global_step": 318382, "epoch": 3835} {"train_loss": -25.464418411254883, "global_step": 318383, "epoch": 3835} {"train_loss": -25.736539840698242, "global_step": 318384, "epoch": 3835} {"train_loss": -25.297544479370117, "global_step": 318385, "epoch": 3835} {"train_loss": -25.80391502380371, "global_step": 318386, "epoch": 3835} {"train_loss": -25.6526411814862, "global_step": 318387, "epoch": 3835, "val_loss": 7326239.0} {"train_loss": -25.534276962280273, "global_step": 318388, "epoch": 3836} {"train_loss": -25.241413116455078, "global_step": 318389, "epoch": 3836} {"train_loss": -25.262792587280273, "global_step": 318390, "epoch": 3836} {"train_loss": -25.16781997680664, "global_step": 318391, "epoch": 3836} {"train_loss": -25.13559341430664, "global_step": 318392, "epoch": 3836} {"train_loss": -25.225116729736328, "global_step": 318393, "epoch": 3836} {"train_loss": -25.201642990112305, "global_step": 318394, "epoch": 3836} {"train_loss": -25.152551651000977, "global_step": 318395, "epoch": 3836} {"train_loss": -25.46039390563965, "global_step": 318396, "epoch": 3836} {"train_loss": -25.559574127197266, "global_step": 318397, "epoch": 3836} {"train_loss": -25.129405975341797, "global_step": 318398, "epoch": 3836} {"train_loss": -25.428525924682617, "global_step": 318399, "epoch": 3836} {"train_loss": -25.492963790893555, "global_step": 318400, "epoch": 3836} {"train_loss": -24.784101486206055, "global_step": 318401, "epoch": 3836} {"train_loss": -25.53704833984375, "global_step": 318402, "epoch": 3836} {"train_loss": -25.738452911376953, "global_step": 318403, "epoch": 3836} {"train_loss": -25.480886459350586, "global_step": 318404, "epoch": 3836} {"train_loss": -25.619253158569336, "global_step": 318405, "epoch": 3836} {"train_loss": -25.673017501831055, "global_step": 318406, "epoch": 3836} {"train_loss": -25.72832679748535, "global_step": 318407, "epoch": 3836} {"train_loss": -26.10243034362793, "global_step": 318408, "epoch": 3836} {"train_loss": -25.61490249633789, "global_step": 318409, "epoch": 3836} {"train_loss": -25.7586612701416, "global_step": 318410, "epoch": 3836} {"train_loss": -25.789377212524414, "global_step": 318411, "epoch": 3836} {"train_loss": -25.784595489501953, "global_step": 318412, "epoch": 3836} {"train_loss": -25.94691276550293, "global_step": 318413, "epoch": 3836} {"train_loss": -25.738861083984375, "global_step": 318414, "epoch": 3836} {"train_loss": -25.913101196289062, "global_step": 318415, "epoch": 3836} {"train_loss": -25.565547943115234, "global_step": 318416, "epoch": 3836} {"train_loss": -26.32271385192871, "global_step": 318417, "epoch": 3836} {"train_loss": -26.05976676940918, "global_step": 318418, "epoch": 3836} {"train_loss": -26.187551498413086, "global_step": 318419, "epoch": 3836} {"train_loss": -26.264249801635742, "global_step": 318420, "epoch": 3836} {"train_loss": -25.992130279541016, "global_step": 318421, "epoch": 3836} {"train_loss": -25.910572052001953, "global_step": 318422, "epoch": 3836} {"train_loss": -25.814096450805664, "global_step": 318423, "epoch": 3836} {"train_loss": -25.573423385620117, "global_step": 318424, "epoch": 3836} {"train_loss": -26.2402400970459, "global_step": 318425, "epoch": 3836} {"train_loss": -26.018341064453125, "global_step": 318426, "epoch": 3836} {"train_loss": -25.562576293945312, "global_step": 318427, "epoch": 3836} {"train_loss": -26.280227661132812, "global_step": 318428, "epoch": 3836} {"train_loss": -25.89661979675293, "global_step": 318429, "epoch": 3836} {"train_loss": -25.512826919555664, "global_step": 318430, "epoch": 3836} {"train_loss": -26.293378829956055, "global_step": 318431, "epoch": 3836} {"train_loss": -25.855276107788086, "global_step": 318432, "epoch": 3836} {"train_loss": -25.79414176940918, "global_step": 318433, "epoch": 3836} {"train_loss": -25.75730323791504, "global_step": 318434, "epoch": 3836} {"train_loss": -26.30267333984375, "global_step": 318435, "epoch": 3836} {"train_loss": -25.290071487426758, "global_step": 318436, "epoch": 3836} {"train_loss": -25.941633224487305, "global_step": 318437, "epoch": 3836} {"train_loss": -26.22500991821289, "global_step": 318438, "epoch": 3836} {"train_loss": -25.883718490600586, "global_step": 318439, "epoch": 3836} {"train_loss": -25.66118812561035, "global_step": 318440, "epoch": 3836} {"train_loss": -26.151456832885742, "global_step": 318441, "epoch": 3836} {"train_loss": -25.79193115234375, "global_step": 318442, "epoch": 3836} {"train_loss": -25.88446044921875, "global_step": 318443, "epoch": 3836} {"train_loss": -25.794403076171875, "global_step": 318444, "epoch": 3836} {"train_loss": -26.028356552124023, "global_step": 318445, "epoch": 3836} {"train_loss": -25.958066940307617, "global_step": 318446, "epoch": 3836} {"train_loss": -25.55341911315918, "global_step": 318447, "epoch": 3836} {"train_loss": -25.779428482055664, "global_step": 318448, "epoch": 3836} {"train_loss": -25.8422794342041, "global_step": 318449, "epoch": 3836} {"train_loss": -25.675785064697266, "global_step": 318450, "epoch": 3836} {"train_loss": -25.75098991394043, "global_step": 318451, "epoch": 3836} {"train_loss": -25.583641052246094, "global_step": 318452, "epoch": 3836} {"train_loss": -25.591960906982422, "global_step": 318453, "epoch": 3836} {"train_loss": -26.116302490234375, "global_step": 318454, "epoch": 3836} {"train_loss": -25.840009689331055, "global_step": 318455, "epoch": 3836} {"train_loss": -26.178403854370117, "global_step": 318456, "epoch": 3836} {"train_loss": -25.51833152770996, "global_step": 318457, "epoch": 3836} {"train_loss": -25.825708389282227, "global_step": 318458, "epoch": 3836} {"train_loss": -25.643152236938477, "global_step": 318459, "epoch": 3836} {"train_loss": -25.58310890197754, "global_step": 318460, "epoch": 3836} {"train_loss": -26.01093864440918, "global_step": 318461, "epoch": 3836} {"train_loss": -25.8705997467041, "global_step": 318462, "epoch": 3836} {"train_loss": -25.685565948486328, "global_step": 318463, "epoch": 3836} {"train_loss": -25.834339141845703, "global_step": 318464, "epoch": 3836} {"train_loss": -26.098957061767578, "global_step": 318465, "epoch": 3836} {"train_loss": -25.80975914001465, "global_step": 318466, "epoch": 3836} {"train_loss": -26.000516891479492, "global_step": 318467, "epoch": 3836} {"train_loss": -25.611072540283203, "global_step": 318468, "epoch": 3836} {"train_loss": -26.009170532226562, "global_step": 318469, "epoch": 3836} {"train_loss": -25.744502469717737, "global_step": 318470, "epoch": 3836, "val_loss": 7349235.0} {"train_loss": -25.666040420532227, "global_step": 318471, "epoch": 3837} {"train_loss": -25.22430419921875, "global_step": 318472, "epoch": 3837} {"train_loss": -25.091466903686523, "global_step": 318473, "epoch": 3837} {"train_loss": -25.292720794677734, "global_step": 318474, "epoch": 3837} {"train_loss": -25.773193359375, "global_step": 318475, "epoch": 3837} {"train_loss": -25.11946678161621, "global_step": 318476, "epoch": 3837} {"train_loss": -25.568031311035156, "global_step": 318477, "epoch": 3837} {"train_loss": -25.369449615478516, "global_step": 318478, "epoch": 3837} {"train_loss": -24.986555099487305, "global_step": 318479, "epoch": 3837} {"train_loss": -25.645383834838867, "global_step": 318480, "epoch": 3837} {"train_loss": -25.21234130859375, "global_step": 318481, "epoch": 3837} {"train_loss": -25.70405387878418, "global_step": 318482, "epoch": 3837} {"train_loss": -26.0396671295166, "global_step": 318483, "epoch": 3837} {"train_loss": -25.83115005493164, "global_step": 318484, "epoch": 3837} {"train_loss": -25.347990036010742, "global_step": 318485, "epoch": 3837} {"train_loss": -25.789236068725586, "global_step": 318486, "epoch": 3837} {"train_loss": -25.85894775390625, "global_step": 318487, "epoch": 3837} {"train_loss": -25.716978073120117, "global_step": 318488, "epoch": 3837} {"train_loss": -25.93950843811035, "global_step": 318489, "epoch": 3837} {"train_loss": -25.665800094604492, "global_step": 318490, "epoch": 3837} {"train_loss": -25.222936630249023, "global_step": 318491, "epoch": 3837} {"train_loss": -26.051366806030273, "global_step": 318492, "epoch": 3837} {"train_loss": -25.82429313659668, "global_step": 318493, "epoch": 3837} {"train_loss": -25.263437271118164, "global_step": 318494, "epoch": 3837} {"train_loss": -25.66680908203125, "global_step": 318495, "epoch": 3837} {"train_loss": -26.009159088134766, "global_step": 318496, "epoch": 3837} {"train_loss": -26.212865829467773, "global_step": 318497, "epoch": 3837} {"train_loss": -25.732940673828125, "global_step": 318498, "epoch": 3837} {"train_loss": -25.798492431640625, "global_step": 318499, "epoch": 3837} {"train_loss": -25.944726943969727, "global_step": 318500, "epoch": 3837} {"train_loss": -26.153501510620117, "global_step": 318501, "epoch": 3837} {"train_loss": -25.899728775024414, "global_step": 318502, "epoch": 3837} {"train_loss": -25.6862735748291, "global_step": 318503, "epoch": 3837} {"train_loss": -26.17343521118164, "global_step": 318504, "epoch": 3837} {"train_loss": -26.026798248291016, "global_step": 318505, "epoch": 3837} {"train_loss": -25.656070709228516, "global_step": 318506, "epoch": 3837} {"train_loss": -25.906187057495117, "global_step": 318507, "epoch": 3837} {"train_loss": -25.918188095092773, "global_step": 318508, "epoch": 3837} {"train_loss": -26.077896118164062, "global_step": 318509, "epoch": 3837} {"train_loss": -26.10894203186035, "global_step": 318510, "epoch": 3837} {"train_loss": -25.873929977416992, "global_step": 318511, "epoch": 3837} {"train_loss": -25.705896377563477, "global_step": 318512, "epoch": 3837} {"train_loss": -26.050708770751953, "global_step": 318513, "epoch": 3837} {"train_loss": -25.8687801361084, "global_step": 318514, "epoch": 3837} {"train_loss": -26.054386138916016, "global_step": 318515, "epoch": 3837} {"train_loss": -25.980215072631836, "global_step": 318516, "epoch": 3837} {"train_loss": -25.729450225830078, "global_step": 318517, "epoch": 3837} {"train_loss": -26.106964111328125, "global_step": 318518, "epoch": 3837} {"train_loss": -25.790985107421875, "global_step": 318519, "epoch": 3837} {"train_loss": -25.9727783203125, "global_step": 318520, "epoch": 3837} {"train_loss": -26.110034942626953, "global_step": 318521, "epoch": 3837} {"train_loss": -25.761951446533203, "global_step": 318522, "epoch": 3837} {"train_loss": -26.46356201171875, "global_step": 318523, "epoch": 3837} {"train_loss": -26.067520141601562, "global_step": 318524, "epoch": 3837} {"train_loss": -25.782672882080078, "global_step": 318525, "epoch": 3837} {"train_loss": -25.885406494140625, "global_step": 318526, "epoch": 3837} {"train_loss": -25.81522560119629, "global_step": 318527, "epoch": 3837} {"train_loss": -26.00752067565918, "global_step": 318528, "epoch": 3837} {"train_loss": -26.288654327392578, "global_step": 318529, "epoch": 3837} {"train_loss": -25.86067008972168, "global_step": 318530, "epoch": 3837} {"train_loss": -25.95810890197754, "global_step": 318531, "epoch": 3837} {"train_loss": -25.698150634765625, "global_step": 318532, "epoch": 3837} {"train_loss": -25.97770118713379, "global_step": 318533, "epoch": 3837} {"train_loss": -25.927518844604492, "global_step": 318534, "epoch": 3837} {"train_loss": -25.784513473510742, "global_step": 318535, "epoch": 3837} {"train_loss": -25.330488204956055, "global_step": 318536, "epoch": 3837} {"train_loss": -26.150409698486328, "global_step": 318537, "epoch": 3837} {"train_loss": -25.962331771850586, "global_step": 318538, "epoch": 3837} {"train_loss": -25.865890502929688, "global_step": 318539, "epoch": 3837} {"train_loss": -26.14328384399414, "global_step": 318540, "epoch": 3837} {"train_loss": -25.2789306640625, "global_step": 318541, "epoch": 3837} {"train_loss": -25.35670280456543, "global_step": 318542, "epoch": 3837} {"train_loss": -25.223989486694336, "global_step": 318543, "epoch": 3837} {"train_loss": -25.429706573486328, "global_step": 318544, "epoch": 3837} {"train_loss": -25.738269805908203, "global_step": 318545, "epoch": 3837} {"train_loss": -25.859952926635742, "global_step": 318546, "epoch": 3837} {"train_loss": -25.539209365844727, "global_step": 318547, "epoch": 3837} {"train_loss": -25.750120162963867, "global_step": 318548, "epoch": 3837} {"train_loss": -25.95023536682129, "global_step": 318549, "epoch": 3837} {"train_loss": -25.583147048950195, "global_step": 318550, "epoch": 3837} {"train_loss": -25.70556640625, "global_step": 318551, "epoch": 3837} {"train_loss": -26.096881866455078, "global_step": 318552, "epoch": 3837} {"train_loss": -25.787840785750422, "global_step": 318553, "epoch": 3837, "val_loss": 7265452.5} {"train_loss": -24.87476921081543, "global_step": 318554, "epoch": 3838} {"train_loss": -24.36134147644043, "global_step": 318555, "epoch": 3838} {"train_loss": -25.323410034179688, "global_step": 318556, "epoch": 3838} {"train_loss": -25.33705711364746, "global_step": 318557, "epoch": 3838} {"train_loss": -24.905431747436523, "global_step": 318558, "epoch": 3838} {"train_loss": -25.146337509155273, "global_step": 318559, "epoch": 3838} {"train_loss": -25.643878936767578, "global_step": 318560, "epoch": 3838} {"train_loss": -24.97123146057129, "global_step": 318561, "epoch": 3838} {"train_loss": -25.884618759155273, "global_step": 318562, "epoch": 3838} {"train_loss": -25.24416160583496, "global_step": 318563, "epoch": 3838} {"train_loss": -25.680835723876953, "global_step": 318564, "epoch": 3838} {"train_loss": -25.570966720581055, "global_step": 318565, "epoch": 3838} {"train_loss": -25.33758544921875, "global_step": 318566, "epoch": 3838} {"train_loss": -25.488813400268555, "global_step": 318567, "epoch": 3838} {"train_loss": -25.81888198852539, "global_step": 318568, "epoch": 3838} {"train_loss": -25.639123916625977, "global_step": 318569, "epoch": 3838} {"train_loss": -25.637653350830078, "global_step": 318570, "epoch": 3838} {"train_loss": -25.605260848999023, "global_step": 318571, "epoch": 3838} {"train_loss": -25.717060089111328, "global_step": 318572, "epoch": 3838} {"train_loss": -25.662656784057617, "global_step": 318573, "epoch": 3838} {"train_loss": -26.03220558166504, "global_step": 318574, "epoch": 3838} {"train_loss": -26.122394561767578, "global_step": 318575, "epoch": 3838} {"train_loss": -25.907672882080078, "global_step": 318576, "epoch": 3838} {"train_loss": -25.49458122253418, "global_step": 318577, "epoch": 3838} {"train_loss": -25.526365280151367, "global_step": 318578, "epoch": 3838} {"train_loss": -25.760217666625977, "global_step": 318579, "epoch": 3838} {"train_loss": -26.22188377380371, "global_step": 318580, "epoch": 3838} {"train_loss": -26.12700843811035, "global_step": 318581, "epoch": 3838} {"train_loss": -25.6210994720459, "global_step": 318582, "epoch": 3838} {"train_loss": -26.355588912963867, "global_step": 318583, "epoch": 3838} {"train_loss": -26.008779525756836, "global_step": 318584, "epoch": 3838} {"train_loss": -25.85489845275879, "global_step": 318585, "epoch": 3838} {"train_loss": -26.0197696685791, "global_step": 318586, "epoch": 3838} {"train_loss": -25.85758399963379, "global_step": 318587, "epoch": 3838} {"train_loss": -25.960296630859375, "global_step": 318588, "epoch": 3838} {"train_loss": -25.888757705688477, "global_step": 318589, "epoch": 3838} {"train_loss": -25.648773193359375, "global_step": 318590, "epoch": 3838} {"train_loss": -25.853622436523438, "global_step": 318591, "epoch": 3838} {"train_loss": -25.381210327148438, "global_step": 318592, "epoch": 3838} {"train_loss": -25.709156036376953, "global_step": 318593, "epoch": 3838} {"train_loss": -25.996789932250977, "global_step": 318594, "epoch": 3838} {"train_loss": -26.122312545776367, "global_step": 318595, "epoch": 3838} {"train_loss": -25.95160484313965, "global_step": 318596, "epoch": 3838} {"train_loss": -25.89383316040039, "global_step": 318597, "epoch": 3838} {"train_loss": -25.9283447265625, "global_step": 318598, "epoch": 3838} {"train_loss": -25.857473373413086, "global_step": 318599, "epoch": 3838} {"train_loss": -26.142850875854492, "global_step": 318600, "epoch": 3838} {"train_loss": -25.99909782409668, "global_step": 318601, "epoch": 3838} {"train_loss": -25.925403594970703, "global_step": 318602, "epoch": 3838} {"train_loss": -25.814477920532227, "global_step": 318603, "epoch": 3838} {"train_loss": -26.07364273071289, "global_step": 318604, "epoch": 3838} {"train_loss": -25.866535186767578, "global_step": 318605, "epoch": 3838} {"train_loss": -25.97760581970215, "global_step": 318606, "epoch": 3838} {"train_loss": -26.135068893432617, "global_step": 318607, "epoch": 3838} {"train_loss": -25.930028915405273, "global_step": 318608, "epoch": 3838} {"train_loss": -25.8681583404541, "global_step": 318609, "epoch": 3838} {"train_loss": -25.9115047454834, "global_step": 318610, "epoch": 3838} {"train_loss": -25.325321197509766, "global_step": 318611, "epoch": 3838} {"train_loss": -25.729034423828125, "global_step": 318612, "epoch": 3838} {"train_loss": -26.102615356445312, "global_step": 318613, "epoch": 3838} {"train_loss": -26.1044921875, "global_step": 318614, "epoch": 3838} {"train_loss": -25.590497970581055, "global_step": 318615, "epoch": 3838} {"train_loss": -26.13386344909668, "global_step": 318616, "epoch": 3838} {"train_loss": -25.74991798400879, "global_step": 318617, "epoch": 3838} {"train_loss": -25.812488555908203, "global_step": 318618, "epoch": 3838} {"train_loss": -25.765045166015625, "global_step": 318619, "epoch": 3838} {"train_loss": -25.80730628967285, "global_step": 318620, "epoch": 3838} {"train_loss": -25.822101593017578, "global_step": 318621, "epoch": 3838} {"train_loss": -25.69318199157715, "global_step": 318622, "epoch": 3838} {"train_loss": -26.03912925720215, "global_step": 318623, "epoch": 3838} {"train_loss": -25.760862350463867, "global_step": 318624, "epoch": 3838} {"train_loss": -26.052526473999023, "global_step": 318625, "epoch": 3838} {"train_loss": -26.315738677978516, "global_step": 318626, "epoch": 3838} {"train_loss": -26.0167179107666, "global_step": 318627, "epoch": 3838} {"train_loss": -26.135425567626953, "global_step": 318628, "epoch": 3838} {"train_loss": -26.224409103393555, "global_step": 318629, "epoch": 3838} {"train_loss": -25.68854331970215, "global_step": 318630, "epoch": 3838} {"train_loss": -26.05901527404785, "global_step": 318631, "epoch": 3838} {"train_loss": -25.86863136291504, "global_step": 318632, "epoch": 3838} {"train_loss": -26.1898136138916, "global_step": 318633, "epoch": 3838} {"train_loss": -25.992151260375977, "global_step": 318634, "epoch": 3838} {"train_loss": -25.887182235717773, "global_step": 318635, "epoch": 3838} {"train_loss": -25.789777916598034, "global_step": 318636, "epoch": 3838, "val_loss": 7287903.0} {"train_loss": -25.788618087768555, "global_step": 318637, "epoch": 3839} {"train_loss": -25.502758026123047, "global_step": 318638, "epoch": 3839} {"train_loss": -25.7386474609375, "global_step": 318639, "epoch": 3839} {"train_loss": -25.49803352355957, "global_step": 318640, "epoch": 3839} {"train_loss": -25.260574340820312, "global_step": 318641, "epoch": 3839} {"train_loss": -25.912643432617188, "global_step": 318642, "epoch": 3839} {"train_loss": -25.544523239135742, "global_step": 318643, "epoch": 3839} {"train_loss": -25.661956787109375, "global_step": 318644, "epoch": 3839} {"train_loss": -25.846662521362305, "global_step": 318645, "epoch": 3839} {"train_loss": -25.688222885131836, "global_step": 318646, "epoch": 3839} {"train_loss": -25.90692138671875, "global_step": 318647, "epoch": 3839} {"train_loss": -25.83981704711914, "global_step": 318648, "epoch": 3839} {"train_loss": -25.637073516845703, "global_step": 318649, "epoch": 3839} {"train_loss": -25.800678253173828, "global_step": 318650, "epoch": 3839} {"train_loss": -25.16225242614746, "global_step": 318651, "epoch": 3839} {"train_loss": -25.82489013671875, "global_step": 318652, "epoch": 3839} {"train_loss": -25.752643585205078, "global_step": 318653, "epoch": 3839} {"train_loss": -25.291105270385742, "global_step": 318654, "epoch": 3839} {"train_loss": -25.737491607666016, "global_step": 318655, "epoch": 3839} {"train_loss": -25.622421264648438, "global_step": 318656, "epoch": 3839} {"train_loss": -25.4880428314209, "global_step": 318657, "epoch": 3839} {"train_loss": -25.34287452697754, "global_step": 318658, "epoch": 3839} {"train_loss": -25.486417770385742, "global_step": 318659, "epoch": 3839} {"train_loss": -25.84100914001465, "global_step": 318660, "epoch": 3839} {"train_loss": -25.700321197509766, "global_step": 318661, "epoch": 3839} {"train_loss": -25.757492065429688, "global_step": 318662, "epoch": 3839} {"train_loss": -25.766998291015625, "global_step": 318663, "epoch": 3839} {"train_loss": -26.263671875, "global_step": 318664, "epoch": 3839} {"train_loss": -25.87640380859375, "global_step": 318665, "epoch": 3839} {"train_loss": -26.49611473083496, "global_step": 318666, "epoch": 3839} {"train_loss": -25.52398109436035, "global_step": 318667, "epoch": 3839} {"train_loss": -25.42388916015625, "global_step": 318668, "epoch": 3839} {"train_loss": -25.49962043762207, "global_step": 318669, "epoch": 3839} {"train_loss": -25.70517921447754, "global_step": 318670, "epoch": 3839} {"train_loss": -25.316282272338867, "global_step": 318671, "epoch": 3839} {"train_loss": -25.991662979125977, "global_step": 318672, "epoch": 3839} {"train_loss": -26.109174728393555, "global_step": 318673, "epoch": 3839} {"train_loss": -25.855838775634766, "global_step": 318674, "epoch": 3839} {"train_loss": -26.107702255249023, "global_step": 318675, "epoch": 3839} {"train_loss": -26.047327041625977, "global_step": 318676, "epoch": 3839} {"train_loss": -25.920331954956055, "global_step": 318677, "epoch": 3839} {"train_loss": -25.7313289642334, "global_step": 318678, "epoch": 3839} {"train_loss": -25.754819869995117, "global_step": 318679, "epoch": 3839} {"train_loss": -25.731449127197266, "global_step": 318680, "epoch": 3839} {"train_loss": -25.882843017578125, "global_step": 318681, "epoch": 3839} {"train_loss": -25.702228546142578, "global_step": 318682, "epoch": 3839} {"train_loss": -25.754674911499023, "global_step": 318683, "epoch": 3839} {"train_loss": -25.776464462280273, "global_step": 318684, "epoch": 3839} {"train_loss": -25.89887046813965, "global_step": 318685, "epoch": 3839} {"train_loss": -26.0788631439209, "global_step": 318686, "epoch": 3839} {"train_loss": -25.649749755859375, "global_step": 318687, "epoch": 3839} {"train_loss": -25.846221923828125, "global_step": 318688, "epoch": 3839} {"train_loss": -25.192214965820312, "global_step": 318689, "epoch": 3839} {"train_loss": -25.62355613708496, "global_step": 318690, "epoch": 3839} {"train_loss": -25.34102439880371, "global_step": 318691, "epoch": 3839} {"train_loss": -25.59812355041504, "global_step": 318692, "epoch": 3839} {"train_loss": -25.761396408081055, "global_step": 318693, "epoch": 3839} {"train_loss": -25.511337280273438, "global_step": 318694, "epoch": 3839} {"train_loss": -25.706451416015625, "global_step": 318695, "epoch": 3839} {"train_loss": -25.940536499023438, "global_step": 318696, "epoch": 3839} {"train_loss": -25.48866081237793, "global_step": 318697, "epoch": 3839} {"train_loss": -25.7185115814209, "global_step": 318698, "epoch": 3839} {"train_loss": -25.930912017822266, "global_step": 318699, "epoch": 3839} {"train_loss": -25.543466567993164, "global_step": 318700, "epoch": 3839} {"train_loss": -25.87099266052246, "global_step": 318701, "epoch": 3839} {"train_loss": -25.34944725036621, "global_step": 318702, "epoch": 3839} {"train_loss": -25.958852767944336, "global_step": 318703, "epoch": 3839} {"train_loss": -25.956384658813477, "global_step": 318704, "epoch": 3839} {"train_loss": -26.093887329101562, "global_step": 318705, "epoch": 3839} {"train_loss": -25.940353393554688, "global_step": 318706, "epoch": 3839} {"train_loss": -25.392431259155273, "global_step": 318707, "epoch": 3839} {"train_loss": -25.834463119506836, "global_step": 318708, "epoch": 3839} {"train_loss": -25.587146759033203, "global_step": 318709, "epoch": 3839} {"train_loss": -26.104480743408203, "global_step": 318710, "epoch": 3839} {"train_loss": -25.532617568969727, "global_step": 318711, "epoch": 3839} {"train_loss": -25.500858306884766, "global_step": 318712, "epoch": 3839} {"train_loss": -25.65207862854004, "global_step": 318713, "epoch": 3839} {"train_loss": -25.371885299682617, "global_step": 318714, "epoch": 3839} {"train_loss": -25.589345932006836, "global_step": 318715, "epoch": 3839} {"train_loss": -25.608625411987305, "global_step": 318716, "epoch": 3839} {"train_loss": -25.950916290283203, "global_step": 318717, "epoch": 3839} {"train_loss": -25.495792388916016, "global_step": 318718, "epoch": 3839} {"train_loss": -25.734502723418085, "global_step": 318719, "epoch": 3839, "val_loss": 7329019.0} {"train_loss": -24.9877986907959, "global_step": 318720, "epoch": 3840} {"train_loss": -25.076719284057617, "global_step": 318721, "epoch": 3840} {"train_loss": -25.156356811523438, "global_step": 318722, "epoch": 3840} {"train_loss": -24.6789608001709, "global_step": 318723, "epoch": 3840} {"train_loss": -25.176620483398438, "global_step": 318724, "epoch": 3840} {"train_loss": -25.20387840270996, "global_step": 318725, "epoch": 3840} {"train_loss": -25.43844223022461, "global_step": 318726, "epoch": 3840} {"train_loss": -25.47194480895996, "global_step": 318727, "epoch": 3840} {"train_loss": -25.527700424194336, "global_step": 318728, "epoch": 3840} {"train_loss": -25.25847816467285, "global_step": 318729, "epoch": 3840} {"train_loss": -25.442140579223633, "global_step": 318730, "epoch": 3840} {"train_loss": -25.44463539123535, "global_step": 318731, "epoch": 3840} {"train_loss": -25.510074615478516, "global_step": 318732, "epoch": 3840} {"train_loss": -25.443058013916016, "global_step": 318733, "epoch": 3840} {"train_loss": -25.616117477416992, "global_step": 318734, "epoch": 3840} {"train_loss": -25.531085968017578, "global_step": 318735, "epoch": 3840} {"train_loss": -25.97330665588379, "global_step": 318736, "epoch": 3840} {"train_loss": -25.358577728271484, "global_step": 318737, "epoch": 3840} {"train_loss": -25.91410255432129, "global_step": 318738, "epoch": 3840} {"train_loss": -25.4363956451416, "global_step": 318739, "epoch": 3840} {"train_loss": -25.788721084594727, "global_step": 318740, "epoch": 3840} {"train_loss": -25.8729190826416, "global_step": 318741, "epoch": 3840} {"train_loss": -25.679113388061523, "global_step": 318742, "epoch": 3840} {"train_loss": -25.968305587768555, "global_step": 318743, "epoch": 3840} {"train_loss": -25.620758056640625, "global_step": 318744, "epoch": 3840} {"train_loss": -25.881006240844727, "global_step": 318745, "epoch": 3840} {"train_loss": -26.12564468383789, "global_step": 318746, "epoch": 3840} {"train_loss": -26.071210861206055, "global_step": 318747, "epoch": 3840} {"train_loss": -25.850019454956055, "global_step": 318748, "epoch": 3840} {"train_loss": -26.27691650390625, "global_step": 318749, "epoch": 3840} {"train_loss": -25.199235916137695, "global_step": 318750, "epoch": 3840} {"train_loss": -26.1280517578125, "global_step": 318751, "epoch": 3840} {"train_loss": -25.9356746673584, "global_step": 318752, "epoch": 3840} {"train_loss": -26.471601486206055, "global_step": 318753, "epoch": 3840} {"train_loss": -26.095212936401367, "global_step": 318754, "epoch": 3840} {"train_loss": -26.05952262878418, "global_step": 318755, "epoch": 3840} {"train_loss": -25.9704647064209, "global_step": 318756, "epoch": 3840} {"train_loss": -26.00874900817871, "global_step": 318757, "epoch": 3840} {"train_loss": -25.952070236206055, "global_step": 318758, "epoch": 3840} {"train_loss": -25.917266845703125, "global_step": 318759, "epoch": 3840} {"train_loss": -26.063461303710938, "global_step": 318760, "epoch": 3840} {"train_loss": -25.678974151611328, "global_step": 318761, "epoch": 3840} {"train_loss": -26.202255249023438, "global_step": 318762, "epoch": 3840} {"train_loss": -25.905139923095703, "global_step": 318763, "epoch": 3840} {"train_loss": -25.713077545166016, "global_step": 318764, "epoch": 3840} {"train_loss": -25.87332534790039, "global_step": 318765, "epoch": 3840} {"train_loss": -26.34881019592285, "global_step": 318766, "epoch": 3840} {"train_loss": -26.182920455932617, "global_step": 318767, "epoch": 3840} {"train_loss": -26.118408203125, "global_step": 318768, "epoch": 3840} {"train_loss": -26.0113525390625, "global_step": 318769, "epoch": 3840} {"train_loss": -26.11370277404785, "global_step": 318770, "epoch": 3840} {"train_loss": -26.150562286376953, "global_step": 318771, "epoch": 3840} {"train_loss": -26.49793815612793, "global_step": 318772, "epoch": 3840} {"train_loss": -25.89751625061035, "global_step": 318773, "epoch": 3840} {"train_loss": -25.30275535583496, "global_step": 318774, "epoch": 3840} {"train_loss": -23.568878173828125, "global_step": 318775, "epoch": 3840} {"train_loss": -22.699975967407227, "global_step": 318776, "epoch": 3840} {"train_loss": -23.981552124023438, "global_step": 318777, "epoch": 3840} {"train_loss": -24.652799606323242, "global_step": 318778, "epoch": 3840} {"train_loss": -24.780302047729492, "global_step": 318779, "epoch": 3840} {"train_loss": -24.059528350830078, "global_step": 318780, "epoch": 3840} {"train_loss": -25.15825080871582, "global_step": 318781, "epoch": 3840} {"train_loss": -24.466909408569336, "global_step": 318782, "epoch": 3840} {"train_loss": -25.060497283935547, "global_step": 318783, "epoch": 3840} {"train_loss": -24.843198776245117, "global_step": 318784, "epoch": 3840} {"train_loss": -25.236024856567383, "global_step": 318785, "epoch": 3840} {"train_loss": -24.945261001586914, "global_step": 318786, "epoch": 3840} {"train_loss": -24.5760440826416, "global_step": 318787, "epoch": 3840} {"train_loss": -24.898239135742188, "global_step": 318788, "epoch": 3840} {"train_loss": -25.294479370117188, "global_step": 318789, "epoch": 3840} {"train_loss": -25.153512954711914, "global_step": 318790, "epoch": 3840} {"train_loss": -25.20224952697754, "global_step": 318791, "epoch": 3840} {"train_loss": -25.6447696685791, "global_step": 318792, "epoch": 3840} {"train_loss": -25.285629272460938, "global_step": 318793, "epoch": 3840} {"train_loss": -25.156232833862305, "global_step": 318794, "epoch": 3840} {"train_loss": -25.23782730102539, "global_step": 318795, "epoch": 3840} {"train_loss": -25.46689796447754, "global_step": 318796, "epoch": 3840} {"train_loss": -25.584199905395508, "global_step": 318797, "epoch": 3840} {"train_loss": -25.3746337890625, "global_step": 318798, "epoch": 3840} {"train_loss": -25.17817497253418, "global_step": 318799, "epoch": 3840} {"train_loss": -25.246517181396484, "global_step": 318800, "epoch": 3840} {"train_loss": -25.156906127929688, "global_step": 318801, "epoch": 3840} {"train_loss": -25.462149516645685, "global_step": 318802, "epoch": 3840, "val_loss": 7352660.0} {"train_loss": -25.53975486755371, "global_step": 318803, "epoch": 3841} {"train_loss": -25.82069206237793, "global_step": 318804, "epoch": 3841} {"train_loss": -25.585851669311523, "global_step": 318805, "epoch": 3841} {"train_loss": -25.53998374938965, "global_step": 318806, "epoch": 3841} {"train_loss": -25.585302352905273, "global_step": 318807, "epoch": 3841} {"train_loss": -25.527780532836914, "global_step": 318808, "epoch": 3841} {"train_loss": -25.20005226135254, "global_step": 318809, "epoch": 3841} {"train_loss": -25.55008316040039, "global_step": 318810, "epoch": 3841} {"train_loss": -25.821691513061523, "global_step": 318811, "epoch": 3841} {"train_loss": -25.713281631469727, "global_step": 318812, "epoch": 3841} {"train_loss": -25.645706176757812, "global_step": 318813, "epoch": 3841} {"train_loss": -25.58517837524414, "global_step": 318814, "epoch": 3841} {"train_loss": -25.144569396972656, "global_step": 318815, "epoch": 3841} {"train_loss": -25.426671981811523, "global_step": 318816, "epoch": 3841} {"train_loss": -26.041650772094727, "global_step": 318817, "epoch": 3841} {"train_loss": -25.635284423828125, "global_step": 318818, "epoch": 3841} {"train_loss": -26.080413818359375, "global_step": 318819, "epoch": 3841} {"train_loss": -26.020788192749023, "global_step": 318820, "epoch": 3841} {"train_loss": -25.905323028564453, "global_step": 318821, "epoch": 3841} {"train_loss": -25.8984317779541, "global_step": 318822, "epoch": 3841} {"train_loss": -25.400360107421875, "global_step": 318823, "epoch": 3841} {"train_loss": -26.339941024780273, "global_step": 318824, "epoch": 3841} {"train_loss": -26.034530639648438, "global_step": 318825, "epoch": 3841} {"train_loss": -25.9932804107666, "global_step": 318826, "epoch": 3841} {"train_loss": -26.081384658813477, "global_step": 318827, "epoch": 3841} {"train_loss": -25.936140060424805, "global_step": 318828, "epoch": 3841} {"train_loss": -25.92169189453125, "global_step": 318829, "epoch": 3841} {"train_loss": -25.878314971923828, "global_step": 318830, "epoch": 3841} {"train_loss": -25.94158935546875, "global_step": 318831, "epoch": 3841} {"train_loss": -26.193567276000977, "global_step": 318832, "epoch": 3841} {"train_loss": -26.116613388061523, "global_step": 318833, "epoch": 3841} {"train_loss": -25.996688842773438, "global_step": 318834, "epoch": 3841} {"train_loss": -25.871801376342773, "global_step": 318835, "epoch": 3841} {"train_loss": -26.087331771850586, "global_step": 318836, "epoch": 3841} {"train_loss": -25.931249618530273, "global_step": 318837, "epoch": 3841} {"train_loss": -25.970172882080078, "global_step": 318838, "epoch": 3841} {"train_loss": -26.054677963256836, "global_step": 318839, "epoch": 3841} {"train_loss": -25.6125545501709, "global_step": 318840, "epoch": 3841} {"train_loss": -25.437088012695312, "global_step": 318841, "epoch": 3841} {"train_loss": -25.1077938079834, "global_step": 318842, "epoch": 3841} {"train_loss": -25.492542266845703, "global_step": 318843, "epoch": 3841} {"train_loss": -25.12114143371582, "global_step": 318844, "epoch": 3841} {"train_loss": -25.59345054626465, "global_step": 318845, "epoch": 3841} {"train_loss": -25.799976348876953, "global_step": 318846, "epoch": 3841} {"train_loss": -25.3182430267334, "global_step": 318847, "epoch": 3841} {"train_loss": -25.358732223510742, "global_step": 318848, "epoch": 3841} {"train_loss": -25.575754165649414, "global_step": 318849, "epoch": 3841} {"train_loss": -25.69037437438965, "global_step": 318850, "epoch": 3841} {"train_loss": -25.635297775268555, "global_step": 318851, "epoch": 3841} {"train_loss": -25.87824821472168, "global_step": 318852, "epoch": 3841} {"train_loss": -25.34108543395996, "global_step": 318853, "epoch": 3841} {"train_loss": -25.894140243530273, "global_step": 318854, "epoch": 3841} {"train_loss": -26.23164176940918, "global_step": 318855, "epoch": 3841} {"train_loss": -26.0836238861084, "global_step": 318856, "epoch": 3841} {"train_loss": -25.8809814453125, "global_step": 318857, "epoch": 3841} {"train_loss": -26.247928619384766, "global_step": 318858, "epoch": 3841} {"train_loss": -25.756650924682617, "global_step": 318859, "epoch": 3841} {"train_loss": -26.002225875854492, "global_step": 318860, "epoch": 3841} {"train_loss": -26.03130531311035, "global_step": 318861, "epoch": 3841} {"train_loss": -25.87733268737793, "global_step": 318862, "epoch": 3841} {"train_loss": -25.714075088500977, "global_step": 318863, "epoch": 3841} {"train_loss": -25.944671630859375, "global_step": 318864, "epoch": 3841} {"train_loss": -25.83709716796875, "global_step": 318865, "epoch": 3841} {"train_loss": -26.186019897460938, "global_step": 318866, "epoch": 3841} {"train_loss": -26.17791175842285, "global_step": 318867, "epoch": 3841} {"train_loss": -25.62908363342285, "global_step": 318868, "epoch": 3841} {"train_loss": -25.81683921813965, "global_step": 318869, "epoch": 3841} {"train_loss": -25.740924835205078, "global_step": 318870, "epoch": 3841} {"train_loss": -26.051267623901367, "global_step": 318871, "epoch": 3841} {"train_loss": -26.089635848999023, "global_step": 318872, "epoch": 3841} {"train_loss": -25.712085723876953, "global_step": 318873, "epoch": 3841} {"train_loss": -25.69300651550293, "global_step": 318874, "epoch": 3841} {"train_loss": -26.08441734313965, "global_step": 318875, "epoch": 3841} {"train_loss": -25.67328453063965, "global_step": 318876, "epoch": 3841} {"train_loss": -25.833826065063477, "global_step": 318877, "epoch": 3841} {"train_loss": -25.67840003967285, "global_step": 318878, "epoch": 3841} {"train_loss": -26.02727699279785, "global_step": 318879, "epoch": 3841} {"train_loss": -26.093530654907227, "global_step": 318880, "epoch": 3841} {"train_loss": -26.018451690673828, "global_step": 318881, "epoch": 3841} {"train_loss": -26.337621688842773, "global_step": 318882, "epoch": 3841} {"train_loss": -25.778196334838867, "global_step": 318883, "epoch": 3841} {"train_loss": -25.744359970092773, "global_step": 318884, "epoch": 3841} {"train_loss": -25.80894316248147, "global_step": 318885, "epoch": 3841, "val_loss": 7334216.0} {"train_loss": -25.550880432128906, "global_step": 318886, "epoch": 3842} {"train_loss": -25.157785415649414, "global_step": 318887, "epoch": 3842} {"train_loss": -24.762388229370117, "global_step": 318888, "epoch": 3842} {"train_loss": -24.893381118774414, "global_step": 318889, "epoch": 3842} {"train_loss": -24.848148345947266, "global_step": 318890, "epoch": 3842} {"train_loss": -25.186574935913086, "global_step": 318891, "epoch": 3842} {"train_loss": -25.407794952392578, "global_step": 318892, "epoch": 3842} {"train_loss": -25.119230270385742, "global_step": 318893, "epoch": 3842} {"train_loss": -25.13153076171875, "global_step": 318894, "epoch": 3842} {"train_loss": -25.383413314819336, "global_step": 318895, "epoch": 3842} {"train_loss": -25.575531005859375, "global_step": 318896, "epoch": 3842} {"train_loss": -25.50269889831543, "global_step": 318897, "epoch": 3842} {"train_loss": -25.37896156311035, "global_step": 318898, "epoch": 3842} {"train_loss": -25.484468460083008, "global_step": 318899, "epoch": 3842} {"train_loss": -25.222026824951172, "global_step": 318900, "epoch": 3842} {"train_loss": -25.753223419189453, "global_step": 318901, "epoch": 3842} {"train_loss": -25.289955139160156, "global_step": 318902, "epoch": 3842} {"train_loss": -25.7880802154541, "global_step": 318903, "epoch": 3842} {"train_loss": -25.488492965698242, "global_step": 318904, "epoch": 3842} {"train_loss": -25.764780044555664, "global_step": 318905, "epoch": 3842} {"train_loss": -25.782516479492188, "global_step": 318906, "epoch": 3842} {"train_loss": -25.426725387573242, "global_step": 318907, "epoch": 3842} {"train_loss": -25.453039169311523, "global_step": 318908, "epoch": 3842} {"train_loss": -25.695331573486328, "global_step": 318909, "epoch": 3842} {"train_loss": -25.70185661315918, "global_step": 318910, "epoch": 3842} {"train_loss": -25.863828659057617, "global_step": 318911, "epoch": 3842} {"train_loss": -25.57386589050293, "global_step": 318912, "epoch": 3842} {"train_loss": -26.115753173828125, "global_step": 318913, "epoch": 3842} {"train_loss": -25.842437744140625, "global_step": 318914, "epoch": 3842} {"train_loss": -25.8675537109375, "global_step": 318915, "epoch": 3842} {"train_loss": -25.674177169799805, "global_step": 318916, "epoch": 3842} {"train_loss": -25.870092391967773, "global_step": 318917, "epoch": 3842} {"train_loss": -26.092565536499023, "global_step": 318918, "epoch": 3842} {"train_loss": -25.888336181640625, "global_step": 318919, "epoch": 3842} {"train_loss": -25.799314498901367, "global_step": 318920, "epoch": 3842} {"train_loss": -25.909971237182617, "global_step": 318921, "epoch": 3842} {"train_loss": -25.954015731811523, "global_step": 318922, "epoch": 3842} {"train_loss": -26.448278427124023, "global_step": 318923, "epoch": 3842} {"train_loss": -25.81780433654785, "global_step": 318924, "epoch": 3842} {"train_loss": -25.532657623291016, "global_step": 318925, "epoch": 3842} {"train_loss": -25.7968807220459, "global_step": 318926, "epoch": 3842} {"train_loss": -25.926267623901367, "global_step": 318927, "epoch": 3842} {"train_loss": -26.078521728515625, "global_step": 318928, "epoch": 3842} {"train_loss": -25.735321044921875, "global_step": 318929, "epoch": 3842} {"train_loss": -25.989057540893555, "global_step": 318930, "epoch": 3842} {"train_loss": -26.0078182220459, "global_step": 318931, "epoch": 3842} {"train_loss": -25.96607780456543, "global_step": 318932, "epoch": 3842} {"train_loss": -26.314130783081055, "global_step": 318933, "epoch": 3842} {"train_loss": -25.72989845275879, "global_step": 318934, "epoch": 3842} {"train_loss": -26.244049072265625, "global_step": 318935, "epoch": 3842} {"train_loss": -25.89436912536621, "global_step": 318936, "epoch": 3842} {"train_loss": -26.073638916015625, "global_step": 318937, "epoch": 3842} {"train_loss": -26.490503311157227, "global_step": 318938, "epoch": 3842} {"train_loss": -26.01397132873535, "global_step": 318939, "epoch": 3842} {"train_loss": -25.71143913269043, "global_step": 318940, "epoch": 3842} {"train_loss": -26.0988712310791, "global_step": 318941, "epoch": 3842} {"train_loss": -25.908655166625977, "global_step": 318942, "epoch": 3842} {"train_loss": -26.139312744140625, "global_step": 318943, "epoch": 3842} {"train_loss": -25.67536735534668, "global_step": 318944, "epoch": 3842} {"train_loss": -25.9489803314209, "global_step": 318945, "epoch": 3842} {"train_loss": -25.968366622924805, "global_step": 318946, "epoch": 3842} {"train_loss": -25.73579216003418, "global_step": 318947, "epoch": 3842} {"train_loss": -25.9285888671875, "global_step": 318948, "epoch": 3842} {"train_loss": -26.46286964416504, "global_step": 318949, "epoch": 3842} {"train_loss": -26.137710571289062, "global_step": 318950, "epoch": 3842} {"train_loss": -25.96354103088379, "global_step": 318951, "epoch": 3842} {"train_loss": -25.983844757080078, "global_step": 318952, "epoch": 3842} {"train_loss": -26.007226943969727, "global_step": 318953, "epoch": 3842} {"train_loss": -25.599653244018555, "global_step": 318954, "epoch": 3842} {"train_loss": -25.793100357055664, "global_step": 318955, "epoch": 3842} {"train_loss": -26.1369571685791, "global_step": 318956, "epoch": 3842} {"train_loss": -26.3040828704834, "global_step": 318957, "epoch": 3842} {"train_loss": -26.036314010620117, "global_step": 318958, "epoch": 3842} {"train_loss": -26.3919677734375, "global_step": 318959, "epoch": 3842} {"train_loss": -26.260364532470703, "global_step": 318960, "epoch": 3842} {"train_loss": -25.87668800354004, "global_step": 318961, "epoch": 3842} {"train_loss": -26.178409576416016, "global_step": 318962, "epoch": 3842} {"train_loss": -25.837743759155273, "global_step": 318963, "epoch": 3842} {"train_loss": -25.786865234375, "global_step": 318964, "epoch": 3842} {"train_loss": -25.46529197692871, "global_step": 318965, "epoch": 3842} {"train_loss": -25.3084716796875, "global_step": 318966, "epoch": 3842} {"train_loss": -25.690412521362305, "global_step": 318967, "epoch": 3842} {"train_loss": -25.777757667633423, "global_step": 318968, "epoch": 3842, "val_loss": 7277047.0} {"train_loss": -24.835309982299805, "global_step": 318969, "epoch": 3843} {"train_loss": -24.054529190063477, "global_step": 318970, "epoch": 3843} {"train_loss": -24.89705467224121, "global_step": 318971, "epoch": 3843} {"train_loss": -25.116483688354492, "global_step": 318972, "epoch": 3843} {"train_loss": -25.35780143737793, "global_step": 318973, "epoch": 3843} {"train_loss": -25.008920669555664, "global_step": 318974, "epoch": 3843} {"train_loss": -25.78013038635254, "global_step": 318975, "epoch": 3843} {"train_loss": -25.511037826538086, "global_step": 318976, "epoch": 3843} {"train_loss": -25.291364669799805, "global_step": 318977, "epoch": 3843} {"train_loss": -25.229291915893555, "global_step": 318978, "epoch": 3843} {"train_loss": -25.731225967407227, "global_step": 318979, "epoch": 3843} {"train_loss": -25.7778263092041, "global_step": 318980, "epoch": 3843} {"train_loss": -25.4619197845459, "global_step": 318981, "epoch": 3843} {"train_loss": -25.251419067382812, "global_step": 318982, "epoch": 3843} {"train_loss": -25.424150466918945, "global_step": 318983, "epoch": 3843} {"train_loss": -25.440725326538086, "global_step": 318984, "epoch": 3843} {"train_loss": -25.483068466186523, "global_step": 318985, "epoch": 3843} {"train_loss": -25.52182960510254, "global_step": 318986, "epoch": 3843} {"train_loss": -25.553571701049805, "global_step": 318987, "epoch": 3843} {"train_loss": -25.462690353393555, "global_step": 318988, "epoch": 3843} {"train_loss": -25.214994430541992, "global_step": 318989, "epoch": 3843} {"train_loss": -25.588850021362305, "global_step": 318990, "epoch": 3843} {"train_loss": -25.6578426361084, "global_step": 318991, "epoch": 3843} {"train_loss": -25.853845596313477, "global_step": 318992, "epoch": 3843} {"train_loss": -25.993499755859375, "global_step": 318993, "epoch": 3843} {"train_loss": -25.72413444519043, "global_step": 318994, "epoch": 3843} {"train_loss": -25.930633544921875, "global_step": 318995, "epoch": 3843} {"train_loss": -26.1601505279541, "global_step": 318996, "epoch": 3843} {"train_loss": -25.791351318359375, "global_step": 318997, "epoch": 3843} {"train_loss": -26.0289249420166, "global_step": 318998, "epoch": 3843} {"train_loss": -26.164875030517578, "global_step": 318999, "epoch": 3843} {"train_loss": -25.6441593170166, "global_step": 319000, "epoch": 3843} {"train_loss": -25.7840576171875, "global_step": 319001, "epoch": 3843} {"train_loss": -25.795551300048828, "global_step": 319002, "epoch": 3843} {"train_loss": -25.975004196166992, "global_step": 319003, "epoch": 3843} {"train_loss": -25.874792098999023, "global_step": 319004, "epoch": 3843} {"train_loss": -26.034809112548828, "global_step": 319005, "epoch": 3843} {"train_loss": -25.944995880126953, "global_step": 319006, "epoch": 3843} {"train_loss": -26.108976364135742, "global_step": 319007, "epoch": 3843} {"train_loss": -26.09433364868164, "global_step": 319008, "epoch": 3843} {"train_loss": -26.118122100830078, "global_step": 319009, "epoch": 3843} {"train_loss": -25.893835067749023, "global_step": 319010, "epoch": 3843} {"train_loss": -25.900802612304688, "global_step": 319011, "epoch": 3843} {"train_loss": -26.196945190429688, "global_step": 319012, "epoch": 3843} {"train_loss": -26.114593505859375, "global_step": 319013, "epoch": 3843} {"train_loss": -25.944110870361328, "global_step": 319014, "epoch": 3843} {"train_loss": -25.833044052124023, "global_step": 319015, "epoch": 3843} {"train_loss": -26.12799644470215, "global_step": 319016, "epoch": 3843} {"train_loss": -25.58675193786621, "global_step": 319017, "epoch": 3843} {"train_loss": -25.936176300048828, "global_step": 319018, "epoch": 3843} {"train_loss": -26.043048858642578, "global_step": 319019, "epoch": 3843} {"train_loss": -26.13311195373535, "global_step": 319020, "epoch": 3843} {"train_loss": -25.98305320739746, "global_step": 319021, "epoch": 3843} {"train_loss": -25.900665283203125, "global_step": 319022, "epoch": 3843} {"train_loss": -26.00443458557129, "global_step": 319023, "epoch": 3843} {"train_loss": -25.93720054626465, "global_step": 319024, "epoch": 3843} {"train_loss": -25.94087028503418, "global_step": 319025, "epoch": 3843} {"train_loss": -25.56459617614746, "global_step": 319026, "epoch": 3843} {"train_loss": -25.98233985900879, "global_step": 319027, "epoch": 3843} {"train_loss": -26.139448165893555, "global_step": 319028, "epoch": 3843} {"train_loss": -25.977136611938477, "global_step": 319029, "epoch": 3843} {"train_loss": -25.352294921875, "global_step": 319030, "epoch": 3843} {"train_loss": -25.668676376342773, "global_step": 319031, "epoch": 3843} {"train_loss": -26.130142211914062, "global_step": 319032, "epoch": 3843} {"train_loss": -25.750165939331055, "global_step": 319033, "epoch": 3843} {"train_loss": -26.094879150390625, "global_step": 319034, "epoch": 3843} {"train_loss": -25.75440788269043, "global_step": 319035, "epoch": 3843} {"train_loss": -26.0311336517334, "global_step": 319036, "epoch": 3843} {"train_loss": -26.010690689086914, "global_step": 319037, "epoch": 3843} {"train_loss": -26.108718872070312, "global_step": 319038, "epoch": 3843} {"train_loss": -25.868305206298828, "global_step": 319039, "epoch": 3843} {"train_loss": -25.330129623413086, "global_step": 319040, "epoch": 3843} {"train_loss": -25.68169593811035, "global_step": 319041, "epoch": 3843} {"train_loss": -26.070005416870117, "global_step": 319042, "epoch": 3843} {"train_loss": -25.907745361328125, "global_step": 319043, "epoch": 3843} {"train_loss": -26.008960723876953, "global_step": 319044, "epoch": 3843} {"train_loss": -25.7972354888916, "global_step": 319045, "epoch": 3843} {"train_loss": -25.90949058532715, "global_step": 319046, "epoch": 3843} {"train_loss": -26.02411460876465, "global_step": 319047, "epoch": 3843} {"train_loss": -25.981616973876953, "global_step": 319048, "epoch": 3843} {"train_loss": -25.948522567749023, "global_step": 319049, "epoch": 3843} {"train_loss": -25.925695419311523, "global_step": 319050, "epoch": 3843} {"train_loss": -25.750831144401825, "global_step": 319051, "epoch": 3843, "val_loss": 7243625.0} {"train_loss": -25.458545684814453, "global_step": 319052, "epoch": 3844} {"train_loss": -25.605823516845703, "global_step": 319053, "epoch": 3844} {"train_loss": -25.905359268188477, "global_step": 319054, "epoch": 3844} {"train_loss": -25.436140060424805, "global_step": 319055, "epoch": 3844} {"train_loss": -25.48213768005371, "global_step": 319056, "epoch": 3844} {"train_loss": -25.860614776611328, "global_step": 319057, "epoch": 3844} {"train_loss": -25.374765396118164, "global_step": 319058, "epoch": 3844} {"train_loss": -25.389142990112305, "global_step": 319059, "epoch": 3844} {"train_loss": -25.527023315429688, "global_step": 319060, "epoch": 3844} {"train_loss": -25.6348934173584, "global_step": 319061, "epoch": 3844} {"train_loss": -25.72214126586914, "global_step": 319062, "epoch": 3844} {"train_loss": -25.890913009643555, "global_step": 319063, "epoch": 3844} {"train_loss": -25.618749618530273, "global_step": 319064, "epoch": 3844} {"train_loss": -25.520483016967773, "global_step": 319065, "epoch": 3844} {"train_loss": -25.690549850463867, "global_step": 319066, "epoch": 3844} {"train_loss": -25.74220085144043, "global_step": 319067, "epoch": 3844} {"train_loss": -24.923444747924805, "global_step": 319068, "epoch": 3844} {"train_loss": -25.838659286499023, "global_step": 319069, "epoch": 3844} {"train_loss": -25.829309463500977, "global_step": 319070, "epoch": 3844} {"train_loss": -25.842687606811523, "global_step": 319071, "epoch": 3844} {"train_loss": -25.470340728759766, "global_step": 319072, "epoch": 3844} {"train_loss": -26.072240829467773, "global_step": 319073, "epoch": 3844} {"train_loss": -25.764551162719727, "global_step": 319074, "epoch": 3844} {"train_loss": -25.935407638549805, "global_step": 319075, "epoch": 3844} {"train_loss": -25.679670333862305, "global_step": 319076, "epoch": 3844} {"train_loss": -25.56770896911621, "global_step": 319077, "epoch": 3844} {"train_loss": -25.773822784423828, "global_step": 319078, "epoch": 3844} {"train_loss": -26.031545639038086, "global_step": 319079, "epoch": 3844} {"train_loss": -25.939722061157227, "global_step": 319080, "epoch": 3844} {"train_loss": -25.777545928955078, "global_step": 319081, "epoch": 3844} {"train_loss": -25.897663116455078, "global_step": 319082, "epoch": 3844} {"train_loss": -26.132665634155273, "global_step": 319083, "epoch": 3844} {"train_loss": -26.170978546142578, "global_step": 319084, "epoch": 3844} {"train_loss": -26.00752830505371, "global_step": 319085, "epoch": 3844} {"train_loss": -25.8410701751709, "global_step": 319086, "epoch": 3844} {"train_loss": -25.82990074157715, "global_step": 319087, "epoch": 3844} {"train_loss": -26.041492462158203, "global_step": 319088, "epoch": 3844} {"train_loss": -25.900449752807617, "global_step": 319089, "epoch": 3844} {"train_loss": -26.132970809936523, "global_step": 319090, "epoch": 3844} {"train_loss": -26.100330352783203, "global_step": 319091, "epoch": 3844} {"train_loss": -26.067148208618164, "global_step": 319092, "epoch": 3844} {"train_loss": -26.096349716186523, "global_step": 319093, "epoch": 3844} {"train_loss": -26.14295768737793, "global_step": 319094, "epoch": 3844} {"train_loss": -26.135944366455078, "global_step": 319095, "epoch": 3844} {"train_loss": -26.229629516601562, "global_step": 319096, "epoch": 3844} {"train_loss": -25.991043090820312, "global_step": 319097, "epoch": 3844} {"train_loss": -25.804731369018555, "global_step": 319098, "epoch": 3844} {"train_loss": -25.9678897857666, "global_step": 319099, "epoch": 3844} {"train_loss": -25.964752197265625, "global_step": 319100, "epoch": 3844} {"train_loss": -25.802228927612305, "global_step": 319101, "epoch": 3844} {"train_loss": -25.264455795288086, "global_step": 319102, "epoch": 3844} {"train_loss": -25.751691818237305, "global_step": 319103, "epoch": 3844} {"train_loss": -25.119186401367188, "global_step": 319104, "epoch": 3844} {"train_loss": -25.45685577392578, "global_step": 319105, "epoch": 3844} {"train_loss": -25.736968994140625, "global_step": 319106, "epoch": 3844} {"train_loss": -25.725311279296875, "global_step": 319107, "epoch": 3844} {"train_loss": -25.4381160736084, "global_step": 319108, "epoch": 3844} {"train_loss": -25.32649803161621, "global_step": 319109, "epoch": 3844} {"train_loss": -25.269418716430664, "global_step": 319110, "epoch": 3844} {"train_loss": -25.758487701416016, "global_step": 319111, "epoch": 3844} {"train_loss": -25.604337692260742, "global_step": 319112, "epoch": 3844} {"train_loss": -25.8643856048584, "global_step": 319113, "epoch": 3844} {"train_loss": -25.590457916259766, "global_step": 319114, "epoch": 3844} {"train_loss": -25.827993392944336, "global_step": 319115, "epoch": 3844} {"train_loss": -25.782501220703125, "global_step": 319116, "epoch": 3844} {"train_loss": -25.9046573638916, "global_step": 319117, "epoch": 3844} {"train_loss": -25.582841873168945, "global_step": 319118, "epoch": 3844} {"train_loss": -25.19431495666504, "global_step": 319119, "epoch": 3844} {"train_loss": -25.678409576416016, "global_step": 319120, "epoch": 3844} {"train_loss": -25.994375228881836, "global_step": 319121, "epoch": 3844} {"train_loss": -25.6236629486084, "global_step": 319122, "epoch": 3844} {"train_loss": -25.502676010131836, "global_step": 319123, "epoch": 3844} {"train_loss": -25.393911361694336, "global_step": 319124, "epoch": 3844} {"train_loss": -25.72047996520996, "global_step": 319125, "epoch": 3844} {"train_loss": -25.623666763305664, "global_step": 319126, "epoch": 3844} {"train_loss": -25.76228141784668, "global_step": 319127, "epoch": 3844} {"train_loss": -25.868810653686523, "global_step": 319128, "epoch": 3844} {"train_loss": -25.713407516479492, "global_step": 319129, "epoch": 3844} {"train_loss": -26.113800048828125, "global_step": 319130, "epoch": 3844} {"train_loss": -25.871984481811523, "global_step": 319131, "epoch": 3844} {"train_loss": -26.156543731689453, "global_step": 319132, "epoch": 3844} {"train_loss": -25.695758819580078, "global_step": 319133, "epoch": 3844} {"train_loss": -25.736984804452185, "global_step": 319134, "epoch": 3844, "val_loss": 7185468.5} {"train_loss": -25.354215621948242, "global_step": 319135, "epoch": 3845} {"train_loss": -25.62255859375, "global_step": 319136, "epoch": 3845} {"train_loss": -25.68079948425293, "global_step": 319137, "epoch": 3845} {"train_loss": -25.528274536132812, "global_step": 319138, "epoch": 3845} {"train_loss": -26.029951095581055, "global_step": 319139, "epoch": 3845} {"train_loss": -25.782941818237305, "global_step": 319140, "epoch": 3845} {"train_loss": -25.601348876953125, "global_step": 319141, "epoch": 3845} {"train_loss": -25.623559951782227, "global_step": 319142, "epoch": 3845} {"train_loss": -25.662067413330078, "global_step": 319143, "epoch": 3845} {"train_loss": -25.602033615112305, "global_step": 319144, "epoch": 3845} {"train_loss": -25.697891235351562, "global_step": 319145, "epoch": 3845} {"train_loss": -25.886871337890625, "global_step": 319146, "epoch": 3845} {"train_loss": -25.9849910736084, "global_step": 319147, "epoch": 3845} {"train_loss": -25.842864990234375, "global_step": 319148, "epoch": 3845} {"train_loss": -25.95416831970215, "global_step": 319149, "epoch": 3845} {"train_loss": -25.66303825378418, "global_step": 319150, "epoch": 3845} {"train_loss": -26.013843536376953, "global_step": 319151, "epoch": 3845} {"train_loss": -25.967905044555664, "global_step": 319152, "epoch": 3845} {"train_loss": -25.85357093811035, "global_step": 319153, "epoch": 3845} {"train_loss": -25.75732421875, "global_step": 319154, "epoch": 3845} {"train_loss": -25.887693405151367, "global_step": 319155, "epoch": 3845} {"train_loss": -25.95670509338379, "global_step": 319156, "epoch": 3845} {"train_loss": -25.554738998413086, "global_step": 319157, "epoch": 3845} {"train_loss": -25.7632999420166, "global_step": 319158, "epoch": 3845} {"train_loss": -25.794696807861328, "global_step": 319159, "epoch": 3845} {"train_loss": -25.74725914001465, "global_step": 319160, "epoch": 3845} {"train_loss": -25.231922149658203, "global_step": 319161, "epoch": 3845} {"train_loss": -25.778837203979492, "global_step": 319162, "epoch": 3845} {"train_loss": -25.97043228149414, "global_step": 319163, "epoch": 3845} {"train_loss": -25.94382667541504, "global_step": 319164, "epoch": 3845} {"train_loss": -25.53645896911621, "global_step": 319165, "epoch": 3845} {"train_loss": -25.666339874267578, "global_step": 319166, "epoch": 3845} {"train_loss": -25.600988388061523, "global_step": 319167, "epoch": 3845} {"train_loss": -25.769622802734375, "global_step": 319168, "epoch": 3845} {"train_loss": -26.16420555114746, "global_step": 319169, "epoch": 3845} {"train_loss": -25.552488327026367, "global_step": 319170, "epoch": 3845} {"train_loss": -25.2724666595459, "global_step": 319171, "epoch": 3845} {"train_loss": -25.6619815826416, "global_step": 319172, "epoch": 3845} {"train_loss": -25.125730514526367, "global_step": 319173, "epoch": 3845} {"train_loss": -25.24524688720703, "global_step": 319174, "epoch": 3845} {"train_loss": -25.565515518188477, "global_step": 319175, "epoch": 3845} {"train_loss": -25.6138916015625, "global_step": 319176, "epoch": 3845} {"train_loss": -25.56924819946289, "global_step": 319177, "epoch": 3845} {"train_loss": -26.0540714263916, "global_step": 319178, "epoch": 3845} {"train_loss": -25.612564086914062, "global_step": 319179, "epoch": 3845} {"train_loss": -25.869245529174805, "global_step": 319180, "epoch": 3845} {"train_loss": -25.822301864624023, "global_step": 319181, "epoch": 3845} {"train_loss": -26.180908203125, "global_step": 319182, "epoch": 3845} {"train_loss": -25.608503341674805, "global_step": 319183, "epoch": 3845} {"train_loss": -26.026233673095703, "global_step": 319184, "epoch": 3845} {"train_loss": -25.725757598876953, "global_step": 319185, "epoch": 3845} {"train_loss": -25.607263565063477, "global_step": 319186, "epoch": 3845} {"train_loss": -26.200220108032227, "global_step": 319187, "epoch": 3845} {"train_loss": -26.086339950561523, "global_step": 319188, "epoch": 3845} {"train_loss": -26.136951446533203, "global_step": 319189, "epoch": 3845} {"train_loss": -25.86086082458496, "global_step": 319190, "epoch": 3845} {"train_loss": -26.079687118530273, "global_step": 319191, "epoch": 3845} {"train_loss": -25.729736328125, "global_step": 319192, "epoch": 3845} {"train_loss": -25.986669540405273, "global_step": 319193, "epoch": 3845} {"train_loss": -25.7147274017334, "global_step": 319194, "epoch": 3845} {"train_loss": -26.09998893737793, "global_step": 319195, "epoch": 3845} {"train_loss": -25.952680587768555, "global_step": 319196, "epoch": 3845} {"train_loss": -25.975753784179688, "global_step": 319197, "epoch": 3845} {"train_loss": -25.84039878845215, "global_step": 319198, "epoch": 3845} {"train_loss": -26.41609001159668, "global_step": 319199, "epoch": 3845} {"train_loss": -26.168170928955078, "global_step": 319200, "epoch": 3845} {"train_loss": -25.93731117248535, "global_step": 319201, "epoch": 3845} {"train_loss": -25.811233520507812, "global_step": 319202, "epoch": 3845} {"train_loss": -26.3444881439209, "global_step": 319203, "epoch": 3845} {"train_loss": -26.024051666259766, "global_step": 319204, "epoch": 3845} {"train_loss": -25.85736656188965, "global_step": 319205, "epoch": 3845} {"train_loss": -25.679250717163086, "global_step": 319206, "epoch": 3845} {"train_loss": -25.646020889282227, "global_step": 319207, "epoch": 3845} {"train_loss": -25.70467185974121, "global_step": 319208, "epoch": 3845} {"train_loss": -25.7589054107666, "global_step": 319209, "epoch": 3845} {"train_loss": -25.85181999206543, "global_step": 319210, "epoch": 3845} {"train_loss": -25.91214942932129, "global_step": 319211, "epoch": 3845} {"train_loss": -25.853906631469727, "global_step": 319212, "epoch": 3845} {"train_loss": -25.54396629333496, "global_step": 319213, "epoch": 3845} {"train_loss": -26.208295822143555, "global_step": 319214, "epoch": 3845} {"train_loss": -25.584510803222656, "global_step": 319215, "epoch": 3845} {"train_loss": -25.901355743408203, "global_step": 319216, "epoch": 3845} {"train_loss": -25.814642251256, "global_step": 319217, "epoch": 3845, "val_loss": 7407406.0} {"train_loss": -25.222305297851562, "global_step": 319218, "epoch": 3846} {"train_loss": -25.35076332092285, "global_step": 319219, "epoch": 3846} {"train_loss": -25.4121036529541, "global_step": 319220, "epoch": 3846} {"train_loss": -25.12895393371582, "global_step": 319221, "epoch": 3846} {"train_loss": -25.587162017822266, "global_step": 319222, "epoch": 3846} {"train_loss": -25.692001342773438, "global_step": 319223, "epoch": 3846} {"train_loss": -25.631576538085938, "global_step": 319224, "epoch": 3846} {"train_loss": -25.72661781311035, "global_step": 319225, "epoch": 3846} {"train_loss": -25.6144962310791, "global_step": 319226, "epoch": 3846} {"train_loss": -25.704267501831055, "global_step": 319227, "epoch": 3846} {"train_loss": -25.980915069580078, "global_step": 319228, "epoch": 3846} {"train_loss": -25.911914825439453, "global_step": 319229, "epoch": 3846} {"train_loss": -25.91407585144043, "global_step": 319230, "epoch": 3846} {"train_loss": -25.7066650390625, "global_step": 319231, "epoch": 3846} {"train_loss": -26.1275577545166, "global_step": 319232, "epoch": 3846} {"train_loss": -25.792463302612305, "global_step": 319233, "epoch": 3846} {"train_loss": -25.627307891845703, "global_step": 319234, "epoch": 3846} {"train_loss": -25.756057739257812, "global_step": 319235, "epoch": 3846} {"train_loss": -25.568552017211914, "global_step": 319236, "epoch": 3846} {"train_loss": -25.724262237548828, "global_step": 319237, "epoch": 3846} {"train_loss": -25.7005558013916, "global_step": 319238, "epoch": 3846} {"train_loss": -25.83563804626465, "global_step": 319239, "epoch": 3846} {"train_loss": -25.537757873535156, "global_step": 319240, "epoch": 3846} {"train_loss": -26.003488540649414, "global_step": 319241, "epoch": 3846} {"train_loss": -25.664716720581055, "global_step": 319242, "epoch": 3846} {"train_loss": -25.993518829345703, "global_step": 319243, "epoch": 3846} {"train_loss": -26.2202091217041, "global_step": 319244, "epoch": 3846} {"train_loss": -26.15481948852539, "global_step": 319245, "epoch": 3846} {"train_loss": -25.694717407226562, "global_step": 319246, "epoch": 3846} {"train_loss": -25.813690185546875, "global_step": 319247, "epoch": 3846} {"train_loss": -25.9593563079834, "global_step": 319248, "epoch": 3846} {"train_loss": -25.492141723632812, "global_step": 319249, "epoch": 3846} {"train_loss": -26.13435173034668, "global_step": 319250, "epoch": 3846} {"train_loss": -25.378263473510742, "global_step": 319251, "epoch": 3846} {"train_loss": -25.968185424804688, "global_step": 319252, "epoch": 3846} {"train_loss": -25.83282470703125, "global_step": 319253, "epoch": 3846} {"train_loss": -26.0939884185791, "global_step": 319254, "epoch": 3846} {"train_loss": -25.822101593017578, "global_step": 319255, "epoch": 3846} {"train_loss": -25.82756996154785, "global_step": 319256, "epoch": 3846} {"train_loss": -25.7762393951416, "global_step": 319257, "epoch": 3846} {"train_loss": -26.025604248046875, "global_step": 319258, "epoch": 3846} {"train_loss": -25.838529586791992, "global_step": 319259, "epoch": 3846} {"train_loss": -26.097721099853516, "global_step": 319260, "epoch": 3846} {"train_loss": -26.2200984954834, "global_step": 319261, "epoch": 3846} {"train_loss": -25.924230575561523, "global_step": 319262, "epoch": 3846} {"train_loss": -26.001890182495117, "global_step": 319263, "epoch": 3846} {"train_loss": -26.115232467651367, "global_step": 319264, "epoch": 3846} {"train_loss": -25.96992301940918, "global_step": 319265, "epoch": 3846} {"train_loss": -26.00783348083496, "global_step": 319266, "epoch": 3846} {"train_loss": -25.890851974487305, "global_step": 319267, "epoch": 3846} {"train_loss": -26.182214736938477, "global_step": 319268, "epoch": 3846} {"train_loss": -25.986541748046875, "global_step": 319269, "epoch": 3846} {"train_loss": -25.594858169555664, "global_step": 319270, "epoch": 3846} {"train_loss": -25.51662254333496, "global_step": 319271, "epoch": 3846} {"train_loss": -26.04511833190918, "global_step": 319272, "epoch": 3846} {"train_loss": -25.89954948425293, "global_step": 319273, "epoch": 3846} {"train_loss": -25.182920455932617, "global_step": 319274, "epoch": 3846} {"train_loss": -25.993549346923828, "global_step": 319275, "epoch": 3846} {"train_loss": -25.324670791625977, "global_step": 319276, "epoch": 3846} {"train_loss": -25.364986419677734, "global_step": 319277, "epoch": 3846} {"train_loss": -25.816070556640625, "global_step": 319278, "epoch": 3846} {"train_loss": -25.8328800201416, "global_step": 319279, "epoch": 3846} {"train_loss": -25.489408493041992, "global_step": 319280, "epoch": 3846} {"train_loss": -25.712982177734375, "global_step": 319281, "epoch": 3846} {"train_loss": -25.48712921142578, "global_step": 319282, "epoch": 3846} {"train_loss": -26.004627227783203, "global_step": 319283, "epoch": 3846} {"train_loss": -25.63368034362793, "global_step": 319284, "epoch": 3846} {"train_loss": -25.685529708862305, "global_step": 319285, "epoch": 3846} {"train_loss": -25.269533157348633, "global_step": 319286, "epoch": 3846} {"train_loss": -26.106046676635742, "global_step": 319287, "epoch": 3846} {"train_loss": -25.884784698486328, "global_step": 319288, "epoch": 3846} {"train_loss": -25.75501823425293, "global_step": 319289, "epoch": 3846} {"train_loss": -26.5128116607666, "global_step": 319290, "epoch": 3846} {"train_loss": -25.58124351501465, "global_step": 319291, "epoch": 3846} {"train_loss": -25.67266273498535, "global_step": 319292, "epoch": 3846} {"train_loss": -25.917516708374023, "global_step": 319293, "epoch": 3846} {"train_loss": -25.893722534179688, "global_step": 319294, "epoch": 3846} {"train_loss": -26.060148239135742, "global_step": 319295, "epoch": 3846} {"train_loss": -25.70965576171875, "global_step": 319296, "epoch": 3846} {"train_loss": -25.93121910095215, "global_step": 319297, "epoch": 3846} {"train_loss": -25.657190322875977, "global_step": 319298, "epoch": 3846} {"train_loss": -25.88726806640625, "global_step": 319299, "epoch": 3846} {"train_loss": -25.784503683986433, "global_step": 319300, "epoch": 3846, "val_loss": 7323670.0} {"train_loss": -25.17305564880371, "global_step": 319301, "epoch": 3847} {"train_loss": -24.43817138671875, "global_step": 319302, "epoch": 3847} {"train_loss": -25.088050842285156, "global_step": 319303, "epoch": 3847} {"train_loss": -25.332365036010742, "global_step": 319304, "epoch": 3847} {"train_loss": -25.019397735595703, "global_step": 319305, "epoch": 3847} {"train_loss": -25.103818893432617, "global_step": 319306, "epoch": 3847} {"train_loss": -25.18259620666504, "global_step": 319307, "epoch": 3847} {"train_loss": -25.266799926757812, "global_step": 319308, "epoch": 3847} {"train_loss": -26.13434410095215, "global_step": 319309, "epoch": 3847} {"train_loss": -25.547592163085938, "global_step": 319310, "epoch": 3847} {"train_loss": -25.393980026245117, "global_step": 319311, "epoch": 3847} {"train_loss": -25.495702743530273, "global_step": 319312, "epoch": 3847} {"train_loss": -25.5222225189209, "global_step": 319313, "epoch": 3847} {"train_loss": -25.25080108642578, "global_step": 319314, "epoch": 3847} {"train_loss": -25.398273468017578, "global_step": 319315, "epoch": 3847} {"train_loss": -25.620166778564453, "global_step": 319316, "epoch": 3847} {"train_loss": -25.952533721923828, "global_step": 319317, "epoch": 3847} {"train_loss": -25.433805465698242, "global_step": 319318, "epoch": 3847} {"train_loss": -25.748138427734375, "global_step": 319319, "epoch": 3847} {"train_loss": -25.593769073486328, "global_step": 319320, "epoch": 3847} {"train_loss": -25.659870147705078, "global_step": 319321, "epoch": 3847} {"train_loss": -25.74709129333496, "global_step": 319322, "epoch": 3847} {"train_loss": -25.942398071289062, "global_step": 319323, "epoch": 3847} {"train_loss": -25.92374610900879, "global_step": 319324, "epoch": 3847} {"train_loss": -25.331960678100586, "global_step": 319325, "epoch": 3847} {"train_loss": -25.31654167175293, "global_step": 319326, "epoch": 3847} {"train_loss": -25.738483428955078, "global_step": 319327, "epoch": 3847} {"train_loss": -26.01871681213379, "global_step": 319328, "epoch": 3847} {"train_loss": -25.933643341064453, "global_step": 319329, "epoch": 3847} {"train_loss": -26.0064640045166, "global_step": 319330, "epoch": 3847} {"train_loss": -25.983245849609375, "global_step": 319331, "epoch": 3847} {"train_loss": -25.8783016204834, "global_step": 319332, "epoch": 3847} {"train_loss": -25.895954132080078, "global_step": 319333, "epoch": 3847} {"train_loss": -25.872085571289062, "global_step": 319334, "epoch": 3847} {"train_loss": -26.389312744140625, "global_step": 319335, "epoch": 3847} {"train_loss": -25.890029907226562, "global_step": 319336, "epoch": 3847} {"train_loss": -26.222986221313477, "global_step": 319337, "epoch": 3847} {"train_loss": -26.08247947692871, "global_step": 319338, "epoch": 3847} {"train_loss": -26.202295303344727, "global_step": 319339, "epoch": 3847} {"train_loss": -26.085275650024414, "global_step": 319340, "epoch": 3847} {"train_loss": -26.17719841003418, "global_step": 319341, "epoch": 3847} {"train_loss": -26.149702072143555, "global_step": 319342, "epoch": 3847} {"train_loss": -26.3349609375, "global_step": 319343, "epoch": 3847} {"train_loss": -25.995880126953125, "global_step": 319344, "epoch": 3847} {"train_loss": -25.65262222290039, "global_step": 319345, "epoch": 3847} {"train_loss": -26.262388229370117, "global_step": 319346, "epoch": 3847} {"train_loss": -26.294525146484375, "global_step": 319347, "epoch": 3847} {"train_loss": -25.777816772460938, "global_step": 319348, "epoch": 3847} {"train_loss": -26.05419921875, "global_step": 319349, "epoch": 3847} {"train_loss": -25.714902877807617, "global_step": 319350, "epoch": 3847} {"train_loss": -25.92616844177246, "global_step": 319351, "epoch": 3847} {"train_loss": -26.323657989501953, "global_step": 319352, "epoch": 3847} {"train_loss": -25.642805099487305, "global_step": 319353, "epoch": 3847} {"train_loss": -25.375003814697266, "global_step": 319354, "epoch": 3847} {"train_loss": -25.216367721557617, "global_step": 319355, "epoch": 3847} {"train_loss": -25.877216339111328, "global_step": 319356, "epoch": 3847} {"train_loss": -25.58094024658203, "global_step": 319357, "epoch": 3847} {"train_loss": -25.927968978881836, "global_step": 319358, "epoch": 3847} {"train_loss": -25.81625747680664, "global_step": 319359, "epoch": 3847} {"train_loss": -25.06073570251465, "global_step": 319360, "epoch": 3847} {"train_loss": -24.75685691833496, "global_step": 319361, "epoch": 3847} {"train_loss": -24.991971969604492, "global_step": 319362, "epoch": 3847} {"train_loss": -25.80329704284668, "global_step": 319363, "epoch": 3847} {"train_loss": -25.6826229095459, "global_step": 319364, "epoch": 3847} {"train_loss": -25.253870010375977, "global_step": 319365, "epoch": 3847} {"train_loss": -25.639362335205078, "global_step": 319366, "epoch": 3847} {"train_loss": -25.886518478393555, "global_step": 319367, "epoch": 3847} {"train_loss": -25.492286682128906, "global_step": 319368, "epoch": 3847} {"train_loss": -25.881643295288086, "global_step": 319369, "epoch": 3847} {"train_loss": -25.3317813873291, "global_step": 319370, "epoch": 3847} {"train_loss": -25.65024757385254, "global_step": 319371, "epoch": 3847} {"train_loss": -26.096054077148438, "global_step": 319372, "epoch": 3847} {"train_loss": -25.35072898864746, "global_step": 319373, "epoch": 3847} {"train_loss": -25.83135986328125, "global_step": 319374, "epoch": 3847} {"train_loss": -25.630985260009766, "global_step": 319375, "epoch": 3847} {"train_loss": -25.751562118530273, "global_step": 319376, "epoch": 3847} {"train_loss": -25.592214584350586, "global_step": 319377, "epoch": 3847} {"train_loss": -25.7349853515625, "global_step": 319378, "epoch": 3847} {"train_loss": -25.840795516967773, "global_step": 319379, "epoch": 3847} {"train_loss": -25.458539962768555, "global_step": 319380, "epoch": 3847} {"train_loss": -25.999561309814453, "global_step": 319381, "epoch": 3847} {"train_loss": -25.76471519470215, "global_step": 319382, "epoch": 3847} {"train_loss": -25.676403597176794, "global_step": 319383, "epoch": 3847, "val_loss": 7340115.0} {"train_loss": -25.107330322265625, "global_step": 319384, "epoch": 3848} {"train_loss": -25.50284194946289, "global_step": 319385, "epoch": 3848} {"train_loss": -25.216476440429688, "global_step": 319386, "epoch": 3848} {"train_loss": -25.201627731323242, "global_step": 319387, "epoch": 3848} {"train_loss": -25.51419448852539, "global_step": 319388, "epoch": 3848} {"train_loss": -25.287113189697266, "global_step": 319389, "epoch": 3848} {"train_loss": -25.390684127807617, "global_step": 319390, "epoch": 3848} {"train_loss": -25.288999557495117, "global_step": 319391, "epoch": 3848} {"train_loss": -25.52737808227539, "global_step": 319392, "epoch": 3848} {"train_loss": -25.26765251159668, "global_step": 319393, "epoch": 3848} {"train_loss": -25.961383819580078, "global_step": 319394, "epoch": 3848} {"train_loss": -25.594303131103516, "global_step": 319395, "epoch": 3848} {"train_loss": -25.503076553344727, "global_step": 319396, "epoch": 3848} {"train_loss": -25.48550796508789, "global_step": 319397, "epoch": 3848} {"train_loss": -25.7033748626709, "global_step": 319398, "epoch": 3848} {"train_loss": -25.314176559448242, "global_step": 319399, "epoch": 3848} {"train_loss": -25.883548736572266, "global_step": 319400, "epoch": 3848} {"train_loss": -25.622024536132812, "global_step": 319401, "epoch": 3848} {"train_loss": -25.9102725982666, "global_step": 319402, "epoch": 3848} {"train_loss": -25.595693588256836, "global_step": 319403, "epoch": 3848} {"train_loss": -25.911148071289062, "global_step": 319404, "epoch": 3848} {"train_loss": -25.355472564697266, "global_step": 319405, "epoch": 3848} {"train_loss": -25.488605499267578, "global_step": 319406, "epoch": 3848} {"train_loss": -25.677953720092773, "global_step": 319407, "epoch": 3848} {"train_loss": -25.861371994018555, "global_step": 319408, "epoch": 3848} {"train_loss": -25.687585830688477, "global_step": 319409, "epoch": 3848} {"train_loss": -26.078657150268555, "global_step": 319410, "epoch": 3848} {"train_loss": -26.160425186157227, "global_step": 319411, "epoch": 3848} {"train_loss": -25.8902645111084, "global_step": 319412, "epoch": 3848} {"train_loss": -25.800207138061523, "global_step": 319413, "epoch": 3848} {"train_loss": -26.152753829956055, "global_step": 319414, "epoch": 3848} {"train_loss": -25.81035804748535, "global_step": 319415, "epoch": 3848} {"train_loss": -25.994522094726562, "global_step": 319416, "epoch": 3848} {"train_loss": -25.716962814331055, "global_step": 319417, "epoch": 3848} {"train_loss": -25.80421257019043, "global_step": 319418, "epoch": 3848} {"train_loss": -25.948200225830078, "global_step": 319419, "epoch": 3848} {"train_loss": -26.233875274658203, "global_step": 319420, "epoch": 3848} {"train_loss": -25.90326499938965, "global_step": 319421, "epoch": 3848} {"train_loss": -25.886093139648438, "global_step": 319422, "epoch": 3848} {"train_loss": -26.215795516967773, "global_step": 319423, "epoch": 3848} {"train_loss": -25.85883903503418, "global_step": 319424, "epoch": 3848} {"train_loss": -26.113025665283203, "global_step": 319425, "epoch": 3848} {"train_loss": -25.879392623901367, "global_step": 319426, "epoch": 3848} {"train_loss": -25.692731857299805, "global_step": 319427, "epoch": 3848} {"train_loss": -25.56894874572754, "global_step": 319428, "epoch": 3848} {"train_loss": -25.818222045898438, "global_step": 319429, "epoch": 3848} {"train_loss": -25.58374786376953, "global_step": 319430, "epoch": 3848} {"train_loss": -25.95361328125, "global_step": 319431, "epoch": 3848} {"train_loss": -25.562793731689453, "global_step": 319432, "epoch": 3848} {"train_loss": -25.731237411499023, "global_step": 319433, "epoch": 3848} {"train_loss": -25.568130493164062, "global_step": 319434, "epoch": 3848} {"train_loss": -25.639102935791016, "global_step": 319435, "epoch": 3848} {"train_loss": -25.866119384765625, "global_step": 319436, "epoch": 3848} {"train_loss": -25.92164421081543, "global_step": 319437, "epoch": 3848} {"train_loss": -25.88739585876465, "global_step": 319438, "epoch": 3848} {"train_loss": -25.943164825439453, "global_step": 319439, "epoch": 3848} {"train_loss": -25.9140625, "global_step": 319440, "epoch": 3848} {"train_loss": -26.105802536010742, "global_step": 319441, "epoch": 3848} {"train_loss": -26.119901657104492, "global_step": 319442, "epoch": 3848} {"train_loss": -26.28297233581543, "global_step": 319443, "epoch": 3848} {"train_loss": -26.082477569580078, "global_step": 319444, "epoch": 3848} {"train_loss": -25.82465934753418, "global_step": 319445, "epoch": 3848} {"train_loss": -26.35273551940918, "global_step": 319446, "epoch": 3848} {"train_loss": -26.03858757019043, "global_step": 319447, "epoch": 3848} {"train_loss": -25.949838638305664, "global_step": 319448, "epoch": 3848} {"train_loss": -26.005767822265625, "global_step": 319449, "epoch": 3848} {"train_loss": -25.824377059936523, "global_step": 319450, "epoch": 3848} {"train_loss": -26.204023361206055, "global_step": 319451, "epoch": 3848} {"train_loss": -26.319793701171875, "global_step": 319452, "epoch": 3848} {"train_loss": -26.26112174987793, "global_step": 319453, "epoch": 3848} {"train_loss": -26.126117706298828, "global_step": 319454, "epoch": 3848} {"train_loss": -26.07366943359375, "global_step": 319455, "epoch": 3848} {"train_loss": -26.131179809570312, "global_step": 319456, "epoch": 3848} {"train_loss": -26.01883316040039, "global_step": 319457, "epoch": 3848} {"train_loss": -26.138137817382812, "global_step": 319458, "epoch": 3848} {"train_loss": -25.835737228393555, "global_step": 319459, "epoch": 3848} {"train_loss": -25.934152603149414, "global_step": 319460, "epoch": 3848} {"train_loss": -26.0035457611084, "global_step": 319461, "epoch": 3848} {"train_loss": -26.019025802612305, "global_step": 319462, "epoch": 3848} {"train_loss": -25.992145538330078, "global_step": 319463, "epoch": 3848} {"train_loss": -25.877099990844727, "global_step": 319464, "epoch": 3848} {"train_loss": -25.943531036376953, "global_step": 319465, "epoch": 3848} {"train_loss": -25.82727324244488, "global_step": 319466, "epoch": 3848, "val_loss": 7319419.5} {"train_loss": -26.2166690826416, "global_step": 319467, "epoch": 3849} {"train_loss": -25.35957908630371, "global_step": 319468, "epoch": 3849} {"train_loss": -25.288883209228516, "global_step": 319469, "epoch": 3849} {"train_loss": -25.84754753112793, "global_step": 319470, "epoch": 3849} {"train_loss": -25.541275024414062, "global_step": 319471, "epoch": 3849} {"train_loss": -26.005517959594727, "global_step": 319472, "epoch": 3849} {"train_loss": -25.672582626342773, "global_step": 319473, "epoch": 3849} {"train_loss": -25.49068260192871, "global_step": 319474, "epoch": 3849} {"train_loss": -25.556650161743164, "global_step": 319475, "epoch": 3849} {"train_loss": -25.86578941345215, "global_step": 319476, "epoch": 3849} {"train_loss": -25.89406394958496, "global_step": 319477, "epoch": 3849} {"train_loss": -26.317535400390625, "global_step": 319478, "epoch": 3849} {"train_loss": -25.79603385925293, "global_step": 319479, "epoch": 3849} {"train_loss": -25.871702194213867, "global_step": 319480, "epoch": 3849} {"train_loss": -26.2099552154541, "global_step": 319481, "epoch": 3849} {"train_loss": -25.465274810791016, "global_step": 319482, "epoch": 3849} {"train_loss": -25.77667808532715, "global_step": 319483, "epoch": 3849} {"train_loss": -26.12660026550293, "global_step": 319484, "epoch": 3849} {"train_loss": -25.808080673217773, "global_step": 319485, "epoch": 3849} {"train_loss": -26.012985229492188, "global_step": 319486, "epoch": 3849} {"train_loss": -25.854726791381836, "global_step": 319487, "epoch": 3849} {"train_loss": -25.676084518432617, "global_step": 319488, "epoch": 3849} {"train_loss": -25.60735511779785, "global_step": 319489, "epoch": 3849} {"train_loss": -25.832006454467773, "global_step": 319490, "epoch": 3849} {"train_loss": -26.11004066467285, "global_step": 319491, "epoch": 3849} {"train_loss": -26.16265296936035, "global_step": 319492, "epoch": 3849} {"train_loss": -25.974090576171875, "global_step": 319493, "epoch": 3849} {"train_loss": -25.77805519104004, "global_step": 319494, "epoch": 3849} {"train_loss": -25.85346031188965, "global_step": 319495, "epoch": 3849} {"train_loss": -26.11651039123535, "global_step": 319496, "epoch": 3849} {"train_loss": -26.231592178344727, "global_step": 319497, "epoch": 3849} {"train_loss": -25.7841796875, "global_step": 319498, "epoch": 3849} {"train_loss": -26.377716064453125, "global_step": 319499, "epoch": 3849} {"train_loss": -26.3854923248291, "global_step": 319500, "epoch": 3849} {"train_loss": -26.000202178955078, "global_step": 319501, "epoch": 3849} {"train_loss": -25.913028717041016, "global_step": 319502, "epoch": 3849} {"train_loss": -25.92704200744629, "global_step": 319503, "epoch": 3849} {"train_loss": -25.87623405456543, "global_step": 319504, "epoch": 3849} {"train_loss": -25.923294067382812, "global_step": 319505, "epoch": 3849} {"train_loss": -26.177045822143555, "global_step": 319506, "epoch": 3849} {"train_loss": -25.888141632080078, "global_step": 319507, "epoch": 3849} {"train_loss": -25.821826934814453, "global_step": 319508, "epoch": 3849} {"train_loss": -25.70210838317871, "global_step": 319509, "epoch": 3849} {"train_loss": -26.0747013092041, "global_step": 319510, "epoch": 3849} {"train_loss": -26.14324378967285, "global_step": 319511, "epoch": 3849} {"train_loss": -25.94300651550293, "global_step": 319512, "epoch": 3849} {"train_loss": -25.994089126586914, "global_step": 319513, "epoch": 3849} {"train_loss": -25.96246337890625, "global_step": 319514, "epoch": 3849} {"train_loss": -25.629404067993164, "global_step": 319515, "epoch": 3849} {"train_loss": -25.611291885375977, "global_step": 319516, "epoch": 3849} {"train_loss": -25.08360481262207, "global_step": 319517, "epoch": 3849} {"train_loss": -25.71087074279785, "global_step": 319518, "epoch": 3849} {"train_loss": -25.921010971069336, "global_step": 319519, "epoch": 3849} {"train_loss": -25.689733505249023, "global_step": 319520, "epoch": 3849} {"train_loss": -26.0003719329834, "global_step": 319521, "epoch": 3849} {"train_loss": -25.934864044189453, "global_step": 319522, "epoch": 3849} {"train_loss": -25.745222091674805, "global_step": 319523, "epoch": 3849} {"train_loss": -25.958459854125977, "global_step": 319524, "epoch": 3849} {"train_loss": -25.858076095581055, "global_step": 319525, "epoch": 3849} {"train_loss": -25.926589965820312, "global_step": 319526, "epoch": 3849} {"train_loss": -25.586851119995117, "global_step": 319527, "epoch": 3849} {"train_loss": -25.889774322509766, "global_step": 319528, "epoch": 3849} {"train_loss": -25.854724884033203, "global_step": 319529, "epoch": 3849} {"train_loss": -25.561019897460938, "global_step": 319530, "epoch": 3849} {"train_loss": -25.270368576049805, "global_step": 319531, "epoch": 3849} {"train_loss": -25.61481285095215, "global_step": 319532, "epoch": 3849} {"train_loss": -25.368310928344727, "global_step": 319533, "epoch": 3849} {"train_loss": -25.918012619018555, "global_step": 319534, "epoch": 3849} {"train_loss": -25.66961669921875, "global_step": 319535, "epoch": 3849} {"train_loss": -25.7601375579834, "global_step": 319536, "epoch": 3849} {"train_loss": -25.787677764892578, "global_step": 319537, "epoch": 3849} {"train_loss": -25.709020614624023, "global_step": 319538, "epoch": 3849} {"train_loss": -25.590896606445312, "global_step": 319539, "epoch": 3849} {"train_loss": -25.634611129760742, "global_step": 319540, "epoch": 3849} {"train_loss": -26.199954986572266, "global_step": 319541, "epoch": 3849} {"train_loss": -25.74186134338379, "global_step": 319542, "epoch": 3849} {"train_loss": -25.862436294555664, "global_step": 319543, "epoch": 3849} {"train_loss": -25.791366577148438, "global_step": 319544, "epoch": 3849} {"train_loss": -25.733808517456055, "global_step": 319545, "epoch": 3849} {"train_loss": -25.5987491607666, "global_step": 319546, "epoch": 3849} {"train_loss": -25.939420700073242, "global_step": 319547, "epoch": 3849} {"train_loss": -25.7503719329834, "global_step": 319548, "epoch": 3849} {"train_loss": -25.833491313888366, "global_step": 319549, "epoch": 3849, "val_loss": 7434917.0} {"train_loss": -24.97132682800293, "global_step": 319550, "epoch": 3850} {"train_loss": -24.893997192382812, "global_step": 319551, "epoch": 3850} {"train_loss": -24.98784828186035, "global_step": 319552, "epoch": 3850} {"train_loss": -24.538349151611328, "global_step": 319553, "epoch": 3850} {"train_loss": -24.821701049804688, "global_step": 319554, "epoch": 3850} {"train_loss": -24.93279266357422, "global_step": 319555, "epoch": 3850} {"train_loss": -25.308256149291992, "global_step": 319556, "epoch": 3850} {"train_loss": -25.32932472229004, "global_step": 319557, "epoch": 3850} {"train_loss": -25.610828399658203, "global_step": 319558, "epoch": 3850} {"train_loss": -25.24405860900879, "global_step": 319559, "epoch": 3850} {"train_loss": -25.28432273864746, "global_step": 319560, "epoch": 3850} {"train_loss": -25.25103187561035, "global_step": 319561, "epoch": 3850} {"train_loss": -25.423307418823242, "global_step": 319562, "epoch": 3850} {"train_loss": -25.383045196533203, "global_step": 319563, "epoch": 3850} {"train_loss": -26.143590927124023, "global_step": 319564, "epoch": 3850} {"train_loss": -25.2688045501709, "global_step": 319565, "epoch": 3850} {"train_loss": -25.605573654174805, "global_step": 319566, "epoch": 3850} {"train_loss": -25.735687255859375, "global_step": 319567, "epoch": 3850} {"train_loss": -25.439002990722656, "global_step": 319568, "epoch": 3850} {"train_loss": -25.637958526611328, "global_step": 319569, "epoch": 3850} {"train_loss": -25.724822998046875, "global_step": 319570, "epoch": 3850} {"train_loss": -25.880712509155273, "global_step": 319571, "epoch": 3850} {"train_loss": -25.77520751953125, "global_step": 319572, "epoch": 3850} {"train_loss": -25.48957633972168, "global_step": 319573, "epoch": 3850} {"train_loss": -25.647785186767578, "global_step": 319574, "epoch": 3850} {"train_loss": -25.57343864440918, "global_step": 319575, "epoch": 3850} {"train_loss": -25.6473445892334, "global_step": 319576, "epoch": 3850} {"train_loss": -25.664350509643555, "global_step": 319577, "epoch": 3850} {"train_loss": -25.6032772064209, "global_step": 319578, "epoch": 3850} {"train_loss": -25.775196075439453, "global_step": 319579, "epoch": 3850} {"train_loss": -25.859451293945312, "global_step": 319580, "epoch": 3850} {"train_loss": -25.89914321899414, "global_step": 319581, "epoch": 3850} {"train_loss": -25.7211856842041, "global_step": 319582, "epoch": 3850} {"train_loss": -25.747522354125977, "global_step": 319583, "epoch": 3850} {"train_loss": -25.620624542236328, "global_step": 319584, "epoch": 3850} {"train_loss": -25.666467666625977, "global_step": 319585, "epoch": 3850} {"train_loss": -25.942407608032227, "global_step": 319586, "epoch": 3850} {"train_loss": -25.546558380126953, "global_step": 319587, "epoch": 3850} {"train_loss": -25.8919734954834, "global_step": 319588, "epoch": 3850} {"train_loss": -25.910343170166016, "global_step": 319589, "epoch": 3850} {"train_loss": -26.220426559448242, "global_step": 319590, "epoch": 3850} {"train_loss": -25.84617042541504, "global_step": 319591, "epoch": 3850} {"train_loss": -26.140399932861328, "global_step": 319592, "epoch": 3850} {"train_loss": -26.318151473999023, "global_step": 319593, "epoch": 3850} {"train_loss": -26.081710815429688, "global_step": 319594, "epoch": 3850} {"train_loss": -25.82032585144043, "global_step": 319595, "epoch": 3850} {"train_loss": -26.090906143188477, "global_step": 319596, "epoch": 3850} {"train_loss": -26.0277042388916, "global_step": 319597, "epoch": 3850} {"train_loss": -26.141332626342773, "global_step": 319598, "epoch": 3850} {"train_loss": -26.196943283081055, "global_step": 319599, "epoch": 3850} {"train_loss": -25.83904457092285, "global_step": 319600, "epoch": 3850} {"train_loss": -25.773603439331055, "global_step": 319601, "epoch": 3850} {"train_loss": -25.989200592041016, "global_step": 319602, "epoch": 3850} {"train_loss": -25.708515167236328, "global_step": 319603, "epoch": 3850} {"train_loss": -26.313018798828125, "global_step": 319604, "epoch": 3850} {"train_loss": -25.64448356628418, "global_step": 319605, "epoch": 3850} {"train_loss": -26.244232177734375, "global_step": 319606, "epoch": 3850} {"train_loss": -25.82758903503418, "global_step": 319607, "epoch": 3850} {"train_loss": -25.993743896484375, "global_step": 319608, "epoch": 3850} {"train_loss": -26.32158851623535, "global_step": 319609, "epoch": 3850} {"train_loss": -25.966123580932617, "global_step": 319610, "epoch": 3850} {"train_loss": -25.87744140625, "global_step": 319611, "epoch": 3850} {"train_loss": -25.741241455078125, "global_step": 319612, "epoch": 3850} {"train_loss": -25.239397048950195, "global_step": 319613, "epoch": 3850} {"train_loss": -25.095834732055664, "global_step": 319614, "epoch": 3850} {"train_loss": -25.004196166992188, "global_step": 319615, "epoch": 3850} {"train_loss": -25.501937866210938, "global_step": 319616, "epoch": 3850} {"train_loss": -25.784238815307617, "global_step": 319617, "epoch": 3850} {"train_loss": -25.572099685668945, "global_step": 319618, "epoch": 3850} {"train_loss": -25.488019943237305, "global_step": 319619, "epoch": 3850} {"train_loss": -25.43941307067871, "global_step": 319620, "epoch": 3850} {"train_loss": -25.83460807800293, "global_step": 319621, "epoch": 3850} {"train_loss": -26.450489044189453, "global_step": 319622, "epoch": 3850} {"train_loss": -26.0585880279541, "global_step": 319623, "epoch": 3850} {"train_loss": -25.995023727416992, "global_step": 319624, "epoch": 3850} {"train_loss": -25.88323974609375, "global_step": 319625, "epoch": 3850} {"train_loss": -25.82905387878418, "global_step": 319626, "epoch": 3850} {"train_loss": -26.133939743041992, "global_step": 319627, "epoch": 3850} {"train_loss": -25.85968017578125, "global_step": 319628, "epoch": 3850} {"train_loss": -26.020944595336914, "global_step": 319629, "epoch": 3850} {"train_loss": -25.774200439453125, "global_step": 319630, "epoch": 3850} {"train_loss": -25.52692222595215, "global_step": 319631, "epoch": 3850} {"train_loss": -25.704645294740974, "global_step": 319632, "epoch": 3850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 7188919.5} {"train_loss": -25.95707130432129, "global_step": 319633, "epoch": 3851} {"train_loss": -25.912256240844727, "global_step": 319634, "epoch": 3851} {"train_loss": -25.72344398498535, "global_step": 319635, "epoch": 3851} {"train_loss": -25.399946212768555, "global_step": 319636, "epoch": 3851} {"train_loss": -25.556427001953125, "global_step": 319637, "epoch": 3851} {"train_loss": -25.742761611938477, "global_step": 319638, "epoch": 3851} {"train_loss": -25.54709243774414, "global_step": 319639, "epoch": 3851} {"train_loss": -25.491479873657227, "global_step": 319640, "epoch": 3851} {"train_loss": -25.560705184936523, "global_step": 319641, "epoch": 3851} {"train_loss": -25.654626846313477, "global_step": 319642, "epoch": 3851} {"train_loss": -25.9211368560791, "global_step": 319643, "epoch": 3851} {"train_loss": -25.45691680908203, "global_step": 319644, "epoch": 3851} {"train_loss": -25.552228927612305, "global_step": 319645, "epoch": 3851} {"train_loss": -25.488422393798828, "global_step": 319646, "epoch": 3851} {"train_loss": -25.940113067626953, "global_step": 319647, "epoch": 3851} {"train_loss": -25.804931640625, "global_step": 319648, "epoch": 3851} {"train_loss": -25.842239379882812, "global_step": 319649, "epoch": 3851} {"train_loss": -25.74462890625, "global_step": 319650, "epoch": 3851} {"train_loss": -25.81682777404785, "global_step": 319651, "epoch": 3851} {"train_loss": -25.802236557006836, "global_step": 319652, "epoch": 3851} {"train_loss": -26.088748931884766, "global_step": 319653, "epoch": 3851} {"train_loss": -25.73841667175293, "global_step": 319654, "epoch": 3851} {"train_loss": -26.019611358642578, "global_step": 319655, "epoch": 3851} {"train_loss": -25.971036911010742, "global_step": 319656, "epoch": 3851} {"train_loss": -26.189908981323242, "global_step": 319657, "epoch": 3851} {"train_loss": -25.7004451751709, "global_step": 319658, "epoch": 3851} {"train_loss": -25.443466186523438, "global_step": 319659, "epoch": 3851} {"train_loss": -26.157947540283203, "global_step": 319660, "epoch": 3851} {"train_loss": -26.00897216796875, "global_step": 319661, "epoch": 3851} {"train_loss": -25.824655532836914, "global_step": 319662, "epoch": 3851} {"train_loss": -25.895246505737305, "global_step": 319663, "epoch": 3851} {"train_loss": -25.676477432250977, "global_step": 319664, "epoch": 3851} {"train_loss": -26.160139083862305, "global_step": 319665, "epoch": 3851} {"train_loss": -25.977325439453125, "global_step": 319666, "epoch": 3851} {"train_loss": -25.81460952758789, "global_step": 319667, "epoch": 3851} {"train_loss": -25.752622604370117, "global_step": 319668, "epoch": 3851} {"train_loss": -25.864301681518555, "global_step": 319669, "epoch": 3851} {"train_loss": -25.449705123901367, "global_step": 319670, "epoch": 3851} {"train_loss": -25.826562881469727, "global_step": 319671, "epoch": 3851} {"train_loss": -25.48568344116211, "global_step": 319672, "epoch": 3851} {"train_loss": -25.65182876586914, "global_step": 319673, "epoch": 3851} {"train_loss": -25.885339736938477, "global_step": 319674, "epoch": 3851} {"train_loss": -25.368486404418945, "global_step": 319675, "epoch": 3851} {"train_loss": -25.741098403930664, "global_step": 319676, "epoch": 3851} {"train_loss": -25.910593032836914, "global_step": 319677, "epoch": 3851} {"train_loss": -26.152860641479492, "global_step": 319678, "epoch": 3851} {"train_loss": -26.044692993164062, "global_step": 319679, "epoch": 3851} {"train_loss": -25.6754093170166, "global_step": 319680, "epoch": 3851} {"train_loss": -25.836856842041016, "global_step": 319681, "epoch": 3851} {"train_loss": -26.15144157409668, "global_step": 319682, "epoch": 3851} {"train_loss": -25.85662841796875, "global_step": 319683, "epoch": 3851} {"train_loss": -25.440420150756836, "global_step": 319684, "epoch": 3851} {"train_loss": -25.34577751159668, "global_step": 319685, "epoch": 3851} {"train_loss": -25.452733993530273, "global_step": 319686, "epoch": 3851} {"train_loss": -25.18907928466797, "global_step": 319687, "epoch": 3851} {"train_loss": -25.802631378173828, "global_step": 319688, "epoch": 3851} {"train_loss": -26.0035457611084, "global_step": 319689, "epoch": 3851} {"train_loss": -25.194658279418945, "global_step": 319690, "epoch": 3851} {"train_loss": -25.922399520874023, "global_step": 319691, "epoch": 3851} {"train_loss": -25.752765655517578, "global_step": 319692, "epoch": 3851} {"train_loss": -25.82322120666504, "global_step": 319693, "epoch": 3851} {"train_loss": -26.1099910736084, "global_step": 319694, "epoch": 3851} {"train_loss": -25.896820068359375, "global_step": 319695, "epoch": 3851} {"train_loss": -25.811664581298828, "global_step": 319696, "epoch": 3851} {"train_loss": -25.998031616210938, "global_step": 319697, "epoch": 3851} {"train_loss": -25.799030303955078, "global_step": 319698, "epoch": 3851} {"train_loss": -26.0532169342041, "global_step": 319699, "epoch": 3851} {"train_loss": -26.02546501159668, "global_step": 319700, "epoch": 3851} {"train_loss": -25.784652709960938, "global_step": 319701, "epoch": 3851} {"train_loss": -26.226856231689453, "global_step": 319702, "epoch": 3851} {"train_loss": -25.95468521118164, "global_step": 319703, "epoch": 3851} {"train_loss": -25.545639038085938, "global_step": 319704, "epoch": 3851} {"train_loss": -25.436025619506836, "global_step": 319705, "epoch": 3851} {"train_loss": -26.492223739624023, "global_step": 319706, "epoch": 3851} {"train_loss": -25.355167388916016, "global_step": 319707, "epoch": 3851} {"train_loss": -25.42317771911621, "global_step": 319708, "epoch": 3851} {"train_loss": -25.941238403320312, "global_step": 319709, "epoch": 3851} {"train_loss": -25.66004753112793, "global_step": 319710, "epoch": 3851} {"train_loss": -26.0665283203125, "global_step": 319711, "epoch": 3851} {"train_loss": -25.643268585205078, "global_step": 319712, "epoch": 3851} {"train_loss": -25.549057006835938, "global_step": 319713, "epoch": 3851} {"train_loss": -26.00140953063965, "global_step": 319714, "epoch": 3851} {"train_loss": -25.78289181353098, "global_step": 319715, "epoch": 3851, "val_loss": 7351242.0} {"train_loss": -25.199100494384766, "global_step": 319716, "epoch": 3852} {"train_loss": -24.94803810119629, "global_step": 319717, "epoch": 3852} {"train_loss": -25.38433265686035, "global_step": 319718, "epoch": 3852} {"train_loss": -25.612714767456055, "global_step": 319719, "epoch": 3852} {"train_loss": -25.51496696472168, "global_step": 319720, "epoch": 3852} {"train_loss": -25.239187240600586, "global_step": 319721, "epoch": 3852} {"train_loss": -25.400449752807617, "global_step": 319722, "epoch": 3852} {"train_loss": -25.13301658630371, "global_step": 319723, "epoch": 3852} {"train_loss": -25.445409774780273, "global_step": 319724, "epoch": 3852} {"train_loss": -25.567808151245117, "global_step": 319725, "epoch": 3852} {"train_loss": -25.745981216430664, "global_step": 319726, "epoch": 3852} {"train_loss": -25.42177391052246, "global_step": 319727, "epoch": 3852} {"train_loss": -25.587125778198242, "global_step": 319728, "epoch": 3852} {"train_loss": -25.61138343811035, "global_step": 319729, "epoch": 3852} {"train_loss": -24.853559494018555, "global_step": 319730, "epoch": 3852} {"train_loss": -25.908252716064453, "global_step": 319731, "epoch": 3852} {"train_loss": -25.496742248535156, "global_step": 319732, "epoch": 3852} {"train_loss": -25.752676010131836, "global_step": 319733, "epoch": 3852} {"train_loss": -26.00898551940918, "global_step": 319734, "epoch": 3852} {"train_loss": -25.78850746154785, "global_step": 319735, "epoch": 3852} {"train_loss": -25.900854110717773, "global_step": 319736, "epoch": 3852} {"train_loss": -25.608911514282227, "global_step": 319737, "epoch": 3852} {"train_loss": -25.20993995666504, "global_step": 319738, "epoch": 3852} {"train_loss": -25.50995445251465, "global_step": 319739, "epoch": 3852} {"train_loss": -25.932180404663086, "global_step": 319740, "epoch": 3852} {"train_loss": -25.94862937927246, "global_step": 319741, "epoch": 3852} {"train_loss": -25.971479415893555, "global_step": 319742, "epoch": 3852} {"train_loss": -26.179990768432617, "global_step": 319743, "epoch": 3852} {"train_loss": -26.0054931640625, "global_step": 319744, "epoch": 3852} {"train_loss": -25.722043991088867, "global_step": 319745, "epoch": 3852} {"train_loss": -26.1784725189209, "global_step": 319746, "epoch": 3852} {"train_loss": -25.95293617248535, "global_step": 319747, "epoch": 3852} {"train_loss": -25.870885848999023, "global_step": 319748, "epoch": 3852} {"train_loss": -25.741352081298828, "global_step": 319749, "epoch": 3852} {"train_loss": -26.030231475830078, "global_step": 319750, "epoch": 3852} {"train_loss": -25.9238338470459, "global_step": 319751, "epoch": 3852} {"train_loss": -25.89243507385254, "global_step": 319752, "epoch": 3852} {"train_loss": -25.788156509399414, "global_step": 319753, "epoch": 3852} {"train_loss": -26.003583908081055, "global_step": 319754, "epoch": 3852} {"train_loss": -26.0421199798584, "global_step": 319755, "epoch": 3852} {"train_loss": -25.739736557006836, "global_step": 319756, "epoch": 3852} {"train_loss": -25.95662498474121, "global_step": 319757, "epoch": 3852} {"train_loss": -25.899555206298828, "global_step": 319758, "epoch": 3852} {"train_loss": -25.830276489257812, "global_step": 319759, "epoch": 3852} {"train_loss": -26.0898380279541, "global_step": 319760, "epoch": 3852} {"train_loss": -25.803586959838867, "global_step": 319761, "epoch": 3852} {"train_loss": -25.842945098876953, "global_step": 319762, "epoch": 3852} {"train_loss": -25.48870849609375, "global_step": 319763, "epoch": 3852} {"train_loss": -25.93140983581543, "global_step": 319764, "epoch": 3852} {"train_loss": -25.852624893188477, "global_step": 319765, "epoch": 3852} {"train_loss": -26.212848663330078, "global_step": 319766, "epoch": 3852} {"train_loss": -26.1423397064209, "global_step": 319767, "epoch": 3852} {"train_loss": -25.6850643157959, "global_step": 319768, "epoch": 3852} {"train_loss": -25.73615074157715, "global_step": 319769, "epoch": 3852} {"train_loss": -25.857284545898438, "global_step": 319770, "epoch": 3852} {"train_loss": -25.78242301940918, "global_step": 319771, "epoch": 3852} {"train_loss": -26.3555965423584, "global_step": 319772, "epoch": 3852} {"train_loss": -26.037519454956055, "global_step": 319773, "epoch": 3852} {"train_loss": -25.64935302734375, "global_step": 319774, "epoch": 3852} {"train_loss": -25.54543685913086, "global_step": 319775, "epoch": 3852} {"train_loss": -25.619308471679688, "global_step": 319776, "epoch": 3852} {"train_loss": -25.679473876953125, "global_step": 319777, "epoch": 3852} {"train_loss": -25.933134078979492, "global_step": 319778, "epoch": 3852} {"train_loss": -25.987186431884766, "global_step": 319779, "epoch": 3852} {"train_loss": -26.261737823486328, "global_step": 319780, "epoch": 3852} {"train_loss": -26.023908615112305, "global_step": 319781, "epoch": 3852} {"train_loss": -25.978918075561523, "global_step": 319782, "epoch": 3852} {"train_loss": -26.085498809814453, "global_step": 319783, "epoch": 3852} {"train_loss": -26.154830932617188, "global_step": 319784, "epoch": 3852} {"train_loss": -25.765186309814453, "global_step": 319785, "epoch": 3852} {"train_loss": -26.13228416442871, "global_step": 319786, "epoch": 3852} {"train_loss": -25.980712890625, "global_step": 319787, "epoch": 3852} {"train_loss": -25.78150749206543, "global_step": 319788, "epoch": 3852} {"train_loss": -25.38471031188965, "global_step": 319789, "epoch": 3852} {"train_loss": -25.254465103149414, "global_step": 319790, "epoch": 3852} {"train_loss": -25.72491455078125, "global_step": 319791, "epoch": 3852} {"train_loss": -25.96311378479004, "global_step": 319792, "epoch": 3852} {"train_loss": -25.410306930541992, "global_step": 319793, "epoch": 3852} {"train_loss": -25.675262451171875, "global_step": 319794, "epoch": 3852} {"train_loss": -25.92776870727539, "global_step": 319795, "epoch": 3852} {"train_loss": -26.498228073120117, "global_step": 319796, "epoch": 3852} {"train_loss": -25.873966217041016, "global_step": 319797, "epoch": 3852} {"train_loss": -25.79647691565824, "global_step": 319798, "epoch": 3852, "val_loss": 7288056.0} {"train_loss": -25.172134399414062, "global_step": 319799, "epoch": 3853} {"train_loss": -25.238367080688477, "global_step": 319800, "epoch": 3853} {"train_loss": -24.485397338867188, "global_step": 319801, "epoch": 3853} {"train_loss": -24.501983642578125, "global_step": 319802, "epoch": 3853} {"train_loss": -25.445255279541016, "global_step": 319803, "epoch": 3853} {"train_loss": -25.1119384765625, "global_step": 319804, "epoch": 3853} {"train_loss": -25.416610717773438, "global_step": 319805, "epoch": 3853} {"train_loss": -25.71222496032715, "global_step": 319806, "epoch": 3853} {"train_loss": -25.47161865234375, "global_step": 319807, "epoch": 3853} {"train_loss": -25.47043228149414, "global_step": 319808, "epoch": 3853} {"train_loss": -25.176803588867188, "global_step": 319809, "epoch": 3853} {"train_loss": -25.703378677368164, "global_step": 319810, "epoch": 3853} {"train_loss": -25.43826675415039, "global_step": 319811, "epoch": 3853} {"train_loss": -25.547788619995117, "global_step": 319812, "epoch": 3853} {"train_loss": -25.87265968322754, "global_step": 319813, "epoch": 3853} {"train_loss": -25.477087020874023, "global_step": 319814, "epoch": 3853} {"train_loss": -25.7763671875, "global_step": 319815, "epoch": 3853} {"train_loss": -25.77845573425293, "global_step": 319816, "epoch": 3853} {"train_loss": -25.740354537963867, "global_step": 319817, "epoch": 3853} {"train_loss": -25.551979064941406, "global_step": 319818, "epoch": 3853} {"train_loss": -25.189626693725586, "global_step": 319819, "epoch": 3853} {"train_loss": -25.99488639831543, "global_step": 319820, "epoch": 3853} {"train_loss": -25.703527450561523, "global_step": 319821, "epoch": 3853} {"train_loss": -25.7629337310791, "global_step": 319822, "epoch": 3853} {"train_loss": -25.739673614501953, "global_step": 319823, "epoch": 3853} {"train_loss": -25.96363639831543, "global_step": 319824, "epoch": 3853} {"train_loss": -25.63749122619629, "global_step": 319825, "epoch": 3853} {"train_loss": -25.741138458251953, "global_step": 319826, "epoch": 3853} {"train_loss": -26.23013687133789, "global_step": 319827, "epoch": 3853} {"train_loss": -25.518346786499023, "global_step": 319828, "epoch": 3853} {"train_loss": -25.826391220092773, "global_step": 319829, "epoch": 3853} {"train_loss": -26.242761611938477, "global_step": 319830, "epoch": 3853} {"train_loss": -25.987201690673828, "global_step": 319831, "epoch": 3853} {"train_loss": -26.009016036987305, "global_step": 319832, "epoch": 3853} {"train_loss": -25.720380783081055, "global_step": 319833, "epoch": 3853} {"train_loss": -26.311115264892578, "global_step": 319834, "epoch": 3853} {"train_loss": -26.030460357666016, "global_step": 319835, "epoch": 3853} {"train_loss": -25.872867584228516, "global_step": 319836, "epoch": 3853} {"train_loss": -26.224470138549805, "global_step": 319837, "epoch": 3853} {"train_loss": -26.03082847595215, "global_step": 319838, "epoch": 3853} {"train_loss": -26.0212345123291, "global_step": 319839, "epoch": 3853} {"train_loss": -26.0499267578125, "global_step": 319840, "epoch": 3853} {"train_loss": -26.011005401611328, "global_step": 319841, "epoch": 3853} {"train_loss": -25.918323516845703, "global_step": 319842, "epoch": 3853} {"train_loss": -25.897363662719727, "global_step": 319843, "epoch": 3853} {"train_loss": -25.883691787719727, "global_step": 319844, "epoch": 3853} {"train_loss": -25.62454605102539, "global_step": 319845, "epoch": 3853} {"train_loss": -25.824731826782227, "global_step": 319846, "epoch": 3853} {"train_loss": -25.841644287109375, "global_step": 319847, "epoch": 3853} {"train_loss": -25.98943519592285, "global_step": 319848, "epoch": 3853} {"train_loss": -25.757080078125, "global_step": 319849, "epoch": 3853} {"train_loss": -25.60028076171875, "global_step": 319850, "epoch": 3853} {"train_loss": -25.848953247070312, "global_step": 319851, "epoch": 3853} {"train_loss": -26.153345108032227, "global_step": 319852, "epoch": 3853} {"train_loss": -25.785131454467773, "global_step": 319853, "epoch": 3853} {"train_loss": -25.883651733398438, "global_step": 319854, "epoch": 3853} {"train_loss": -26.167316436767578, "global_step": 319855, "epoch": 3853} {"train_loss": -25.96339988708496, "global_step": 319856, "epoch": 3853} {"train_loss": -25.909414291381836, "global_step": 319857, "epoch": 3853} {"train_loss": -26.353254318237305, "global_step": 319858, "epoch": 3853} {"train_loss": -26.33295249938965, "global_step": 319859, "epoch": 3853} {"train_loss": -26.1315860748291, "global_step": 319860, "epoch": 3853} {"train_loss": -25.706024169921875, "global_step": 319861, "epoch": 3853} {"train_loss": -26.03167724609375, "global_step": 319862, "epoch": 3853} {"train_loss": -26.20111656188965, "global_step": 319863, "epoch": 3853} {"train_loss": -26.055944442749023, "global_step": 319864, "epoch": 3853} {"train_loss": -26.00198745727539, "global_step": 319865, "epoch": 3853} {"train_loss": -25.785791397094727, "global_step": 319866, "epoch": 3853} {"train_loss": -26.036468505859375, "global_step": 319867, "epoch": 3853} {"train_loss": -26.311878204345703, "global_step": 319868, "epoch": 3853} {"train_loss": -25.560850143432617, "global_step": 319869, "epoch": 3853} {"train_loss": -25.32503318786621, "global_step": 319870, "epoch": 3853} {"train_loss": -24.936832427978516, "global_step": 319871, "epoch": 3853} {"train_loss": -25.18050193786621, "global_step": 319872, "epoch": 3853} {"train_loss": -25.945844650268555, "global_step": 319873, "epoch": 3853} {"train_loss": -25.60589599609375, "global_step": 319874, "epoch": 3853} {"train_loss": -25.283205032348633, "global_step": 319875, "epoch": 3853} {"train_loss": -25.941064834594727, "global_step": 319876, "epoch": 3853} {"train_loss": -25.50844383239746, "global_step": 319877, "epoch": 3853} {"train_loss": -25.649383544921875, "global_step": 319878, "epoch": 3853} {"train_loss": -25.599334716796875, "global_step": 319879, "epoch": 3853} {"train_loss": -25.765094757080078, "global_step": 319880, "epoch": 3853} {"train_loss": -25.73634696868529, "global_step": 319881, "epoch": 3853, "val_loss": 7279366.0} {"train_loss": -25.067188262939453, "global_step": 319882, "epoch": 3854} {"train_loss": -24.252120971679688, "global_step": 319883, "epoch": 3854} {"train_loss": -25.072660446166992, "global_step": 319884, "epoch": 3854} {"train_loss": -24.645736694335938, "global_step": 319885, "epoch": 3854} {"train_loss": -24.4613037109375, "global_step": 319886, "epoch": 3854} {"train_loss": -25.42989158630371, "global_step": 319887, "epoch": 3854} {"train_loss": -24.194055557250977, "global_step": 319888, "epoch": 3854} {"train_loss": -24.775665283203125, "global_step": 319889, "epoch": 3854} {"train_loss": -24.998291015625, "global_step": 319890, "epoch": 3854} {"train_loss": -25.094120025634766, "global_step": 319891, "epoch": 3854} {"train_loss": -24.73053550720215, "global_step": 319892, "epoch": 3854} {"train_loss": -25.44134521484375, "global_step": 319893, "epoch": 3854} {"train_loss": -25.01968002319336, "global_step": 319894, "epoch": 3854} {"train_loss": -25.132278442382812, "global_step": 319895, "epoch": 3854} {"train_loss": -24.980846405029297, "global_step": 319896, "epoch": 3854} {"train_loss": -25.141849517822266, "global_step": 319897, "epoch": 3854} {"train_loss": -25.458036422729492, "global_step": 319898, "epoch": 3854} {"train_loss": -25.244871139526367, "global_step": 319899, "epoch": 3854} {"train_loss": -25.4287166595459, "global_step": 319900, "epoch": 3854} {"train_loss": -25.091466903686523, "global_step": 319901, "epoch": 3854} {"train_loss": -25.18158531188965, "global_step": 319902, "epoch": 3854} {"train_loss": -25.372549057006836, "global_step": 319903, "epoch": 3854} {"train_loss": -25.668989181518555, "global_step": 319904, "epoch": 3854} {"train_loss": -25.706756591796875, "global_step": 319905, "epoch": 3854} {"train_loss": -25.36443519592285, "global_step": 319906, "epoch": 3854} {"train_loss": -25.7305965423584, "global_step": 319907, "epoch": 3854} {"train_loss": -25.2263240814209, "global_step": 319908, "epoch": 3854} {"train_loss": -25.828100204467773, "global_step": 319909, "epoch": 3854} {"train_loss": -25.473365783691406, "global_step": 319910, "epoch": 3854} {"train_loss": -25.830839157104492, "global_step": 319911, "epoch": 3854} {"train_loss": -25.93302345275879, "global_step": 319912, "epoch": 3854} {"train_loss": -25.51850700378418, "global_step": 319913, "epoch": 3854} {"train_loss": -25.8171329498291, "global_step": 319914, "epoch": 3854} {"train_loss": -25.774494171142578, "global_step": 319915, "epoch": 3854} {"train_loss": -25.948694229125977, "global_step": 319916, "epoch": 3854} {"train_loss": -25.756494522094727, "global_step": 319917, "epoch": 3854} {"train_loss": -25.657501220703125, "global_step": 319918, "epoch": 3854} {"train_loss": -26.31971549987793, "global_step": 319919, "epoch": 3854} {"train_loss": -25.95527458190918, "global_step": 319920, "epoch": 3854} {"train_loss": -25.959287643432617, "global_step": 319921, "epoch": 3854} {"train_loss": -26.245365142822266, "global_step": 319922, "epoch": 3854} {"train_loss": -26.586761474609375, "global_step": 319923, "epoch": 3854} {"train_loss": -25.812198638916016, "global_step": 319924, "epoch": 3854} {"train_loss": -26.15289878845215, "global_step": 319925, "epoch": 3854} {"train_loss": -25.81329917907715, "global_step": 319926, "epoch": 3854} {"train_loss": -26.206573486328125, "global_step": 319927, "epoch": 3854} {"train_loss": -25.91953468322754, "global_step": 319928, "epoch": 3854} {"train_loss": -25.9523868560791, "global_step": 319929, "epoch": 3854} {"train_loss": -26.020761489868164, "global_step": 319930, "epoch": 3854} {"train_loss": -25.66585350036621, "global_step": 319931, "epoch": 3854} {"train_loss": -25.38640594482422, "global_step": 319932, "epoch": 3854} {"train_loss": -24.700132369995117, "global_step": 319933, "epoch": 3854} {"train_loss": -24.739490509033203, "global_step": 319934, "epoch": 3854} {"train_loss": -24.851240158081055, "global_step": 319935, "epoch": 3854} {"train_loss": -25.208723068237305, "global_step": 319936, "epoch": 3854} {"train_loss": -25.562808990478516, "global_step": 319937, "epoch": 3854} {"train_loss": -25.49502944946289, "global_step": 319938, "epoch": 3854} {"train_loss": -25.60732078552246, "global_step": 319939, "epoch": 3854} {"train_loss": -25.524999618530273, "global_step": 319940, "epoch": 3854} {"train_loss": -25.716693878173828, "global_step": 319941, "epoch": 3854} {"train_loss": -25.6348934173584, "global_step": 319942, "epoch": 3854} {"train_loss": -25.688343048095703, "global_step": 319943, "epoch": 3854} {"train_loss": -25.7839298248291, "global_step": 319944, "epoch": 3854} {"train_loss": -25.956945419311523, "global_step": 319945, "epoch": 3854} {"train_loss": -25.643674850463867, "global_step": 319946, "epoch": 3854} {"train_loss": -25.598052978515625, "global_step": 319947, "epoch": 3854} {"train_loss": -25.99444007873535, "global_step": 319948, "epoch": 3854} {"train_loss": -25.942358016967773, "global_step": 319949, "epoch": 3854} {"train_loss": -25.520462036132812, "global_step": 319950, "epoch": 3854} {"train_loss": -25.488908767700195, "global_step": 319951, "epoch": 3854} {"train_loss": -25.93312644958496, "global_step": 319952, "epoch": 3854} {"train_loss": -26.10177993774414, "global_step": 319953, "epoch": 3854} {"train_loss": -25.964160919189453, "global_step": 319954, "epoch": 3854} {"train_loss": -25.958465576171875, "global_step": 319955, "epoch": 3854} {"train_loss": -25.960554122924805, "global_step": 319956, "epoch": 3854} {"train_loss": -25.640798568725586, "global_step": 319957, "epoch": 3854} {"train_loss": -25.894514083862305, "global_step": 319958, "epoch": 3854} {"train_loss": -25.922910690307617, "global_step": 319959, "epoch": 3854} {"train_loss": -25.803876876831055, "global_step": 319960, "epoch": 3854} {"train_loss": -26.3529052734375, "global_step": 319961, "epoch": 3854} {"train_loss": -25.706607818603516, "global_step": 319962, "epoch": 3854} {"train_loss": -26.1988468170166, "global_step": 319963, "epoch": 3854} {"train_loss": -25.556771496692335, "global_step": 319964, "epoch": 3854, "val_loss": 7281960.0} {"train_loss": -25.609792709350586, "global_step": 319965, "epoch": 3855} {"train_loss": -25.46599769592285, "global_step": 319966, "epoch": 3855} {"train_loss": -25.162832260131836, "global_step": 319967, "epoch": 3855} {"train_loss": -24.87555503845215, "global_step": 319968, "epoch": 3855} {"train_loss": -25.14282989501953, "global_step": 319969, "epoch": 3855} {"train_loss": -25.937402725219727, "global_step": 319970, "epoch": 3855} {"train_loss": -25.304712295532227, "global_step": 319971, "epoch": 3855} {"train_loss": -25.277570724487305, "global_step": 319972, "epoch": 3855} {"train_loss": -25.573143005371094, "global_step": 319973, "epoch": 3855} {"train_loss": -25.324554443359375, "global_step": 319974, "epoch": 3855} {"train_loss": -25.864715576171875, "global_step": 319975, "epoch": 3855} {"train_loss": -25.657346725463867, "global_step": 319976, "epoch": 3855} {"train_loss": -25.55191993713379, "global_step": 319977, "epoch": 3855} {"train_loss": -25.6444034576416, "global_step": 319978, "epoch": 3855} {"train_loss": -25.379297256469727, "global_step": 319979, "epoch": 3855} {"train_loss": -26.223241806030273, "global_step": 319980, "epoch": 3855} {"train_loss": -25.87885093688965, "global_step": 319981, "epoch": 3855} {"train_loss": -25.816877365112305, "global_step": 319982, "epoch": 3855} {"train_loss": -25.616474151611328, "global_step": 319983, "epoch": 3855} {"train_loss": -25.292646408081055, "global_step": 319984, "epoch": 3855} {"train_loss": -25.3835506439209, "global_step": 319985, "epoch": 3855} {"train_loss": -25.97116470336914, "global_step": 319986, "epoch": 3855} {"train_loss": -25.362119674682617, "global_step": 319987, "epoch": 3855} {"train_loss": -25.8593692779541, "global_step": 319988, "epoch": 3855} {"train_loss": -25.985300064086914, "global_step": 319989, "epoch": 3855} {"train_loss": -25.95802116394043, "global_step": 319990, "epoch": 3855} {"train_loss": -25.963911056518555, "global_step": 319991, "epoch": 3855} {"train_loss": -25.715734481811523, "global_step": 319992, "epoch": 3855} {"train_loss": -25.984851837158203, "global_step": 319993, "epoch": 3855} {"train_loss": -26.049863815307617, "global_step": 319994, "epoch": 3855} {"train_loss": -26.011371612548828, "global_step": 319995, "epoch": 3855} {"train_loss": -26.500944137573242, "global_step": 319996, "epoch": 3855} {"train_loss": -25.816389083862305, "global_step": 319997, "epoch": 3855} {"train_loss": -25.427608489990234, "global_step": 319998, "epoch": 3855} {"train_loss": -25.518312454223633, "global_step": 319999, "epoch": 3855} {"train_loss": -26.081043243408203, "global_step": 320000, "epoch": 3855} {"train_loss": -25.607349395751953, "global_step": 320001, "epoch": 3855} {"train_loss": -25.441293716430664, "global_step": 320002, "epoch": 3855} {"train_loss": -25.55633544921875, "global_step": 320003, "epoch": 3855} {"train_loss": -25.543071746826172, "global_step": 320004, "epoch": 3855} {"train_loss": -25.5136775970459, "global_step": 320005, "epoch": 3855} {"train_loss": -25.77131462097168, "global_step": 320006, "epoch": 3855} {"train_loss": -25.702686309814453, "global_step": 320007, "epoch": 3855} {"train_loss": -25.792951583862305, "global_step": 320008, "epoch": 3855} {"train_loss": -25.7589054107666, "global_step": 320009, "epoch": 3855} {"train_loss": -25.571918487548828, "global_step": 320010, "epoch": 3855} {"train_loss": -26.236618041992188, "global_step": 320011, "epoch": 3855} {"train_loss": -25.838003158569336, "global_step": 320012, "epoch": 3855} {"train_loss": -26.115406036376953, "global_step": 320013, "epoch": 3855} {"train_loss": -25.672901153564453, "global_step": 320014, "epoch": 3855} {"train_loss": -25.897308349609375, "global_step": 320015, "epoch": 3855} {"train_loss": -25.99179458618164, "global_step": 320016, "epoch": 3855} {"train_loss": -26.280242919921875, "global_step": 320017, "epoch": 3855} {"train_loss": -25.83564567565918, "global_step": 320018, "epoch": 3855} {"train_loss": -25.75263786315918, "global_step": 320019, "epoch": 3855} {"train_loss": -25.991308212280273, "global_step": 320020, "epoch": 3855} {"train_loss": -25.994802474975586, "global_step": 320021, "epoch": 3855} {"train_loss": -25.840576171875, "global_step": 320022, "epoch": 3855} {"train_loss": -25.985681533813477, "global_step": 320023, "epoch": 3855} {"train_loss": -26.131372451782227, "global_step": 320024, "epoch": 3855} {"train_loss": -25.790668487548828, "global_step": 320025, "epoch": 3855} {"train_loss": -26.021265029907227, "global_step": 320026, "epoch": 3855} {"train_loss": -25.58160972595215, "global_step": 320027, "epoch": 3855} {"train_loss": -25.95003318786621, "global_step": 320028, "epoch": 3855} {"train_loss": -25.867414474487305, "global_step": 320029, "epoch": 3855} {"train_loss": -25.871496200561523, "global_step": 320030, "epoch": 3855} {"train_loss": -26.239704132080078, "global_step": 320031, "epoch": 3855} {"train_loss": -26.190526962280273, "global_step": 320032, "epoch": 3855} {"train_loss": -25.96529197692871, "global_step": 320033, "epoch": 3855} {"train_loss": -26.120044708251953, "global_step": 320034, "epoch": 3855} {"train_loss": -25.80720329284668, "global_step": 320035, "epoch": 3855} {"train_loss": -25.84515953063965, "global_step": 320036, "epoch": 3855} {"train_loss": -26.09938621520996, "global_step": 320037, "epoch": 3855} {"train_loss": -26.025781631469727, "global_step": 320038, "epoch": 3855} {"train_loss": -26.153797149658203, "global_step": 320039, "epoch": 3855} {"train_loss": -26.31031608581543, "global_step": 320040, "epoch": 3855} {"train_loss": -26.270734786987305, "global_step": 320041, "epoch": 3855} {"train_loss": -26.163610458374023, "global_step": 320042, "epoch": 3855} {"train_loss": -26.08656120300293, "global_step": 320043, "epoch": 3855} {"train_loss": -25.819772720336914, "global_step": 320044, "epoch": 3855} {"train_loss": -25.886859893798828, "global_step": 320045, "epoch": 3855} {"train_loss": -25.890289306640625, "global_step": 320046, "epoch": 3855} {"train_loss": -25.8266956834908, "global_step": 320047, "epoch": 3855, "val_loss": 7341376.5} {"train_loss": -25.04629898071289, "global_step": 320048, "epoch": 3856} {"train_loss": -23.44144630432129, "global_step": 320049, "epoch": 3856} {"train_loss": -22.24888801574707, "global_step": 320050, "epoch": 3856} {"train_loss": -23.017431259155273, "global_step": 320051, "epoch": 3856} {"train_loss": -24.643579483032227, "global_step": 320052, "epoch": 3856} {"train_loss": -24.819854736328125, "global_step": 320053, "epoch": 3856} {"train_loss": -24.3070068359375, "global_step": 320054, "epoch": 3856} {"train_loss": -25.395854949951172, "global_step": 320055, "epoch": 3856} {"train_loss": -24.80606460571289, "global_step": 320056, "epoch": 3856} {"train_loss": -24.908674240112305, "global_step": 320057, "epoch": 3856} {"train_loss": -25.182523727416992, "global_step": 320058, "epoch": 3856} {"train_loss": -24.93942642211914, "global_step": 320059, "epoch": 3856} {"train_loss": -25.130857467651367, "global_step": 320060, "epoch": 3856} {"train_loss": -25.02048683166504, "global_step": 320061, "epoch": 3856} {"train_loss": -25.2032470703125, "global_step": 320062, "epoch": 3856} {"train_loss": -24.712610244750977, "global_step": 320063, "epoch": 3856} {"train_loss": -25.015771865844727, "global_step": 320064, "epoch": 3856} {"train_loss": -25.15228271484375, "global_step": 320065, "epoch": 3856} {"train_loss": -25.39078140258789, "global_step": 320066, "epoch": 3856} {"train_loss": -25.322858810424805, "global_step": 320067, "epoch": 3856} {"train_loss": -25.43660545349121, "global_step": 320068, "epoch": 3856} {"train_loss": -25.44423484802246, "global_step": 320069, "epoch": 3856} {"train_loss": -25.492883682250977, "global_step": 320070, "epoch": 3856} {"train_loss": -25.29117202758789, "global_step": 320071, "epoch": 3856} {"train_loss": -25.567947387695312, "global_step": 320072, "epoch": 3856} {"train_loss": -25.547475814819336, "global_step": 320073, "epoch": 3856} {"train_loss": -25.67582130432129, "global_step": 320074, "epoch": 3856} {"train_loss": -25.1173095703125, "global_step": 320075, "epoch": 3856} {"train_loss": -25.599599838256836, "global_step": 320076, "epoch": 3856} {"train_loss": -25.90158462524414, "global_step": 320077, "epoch": 3856} {"train_loss": -25.6160945892334, "global_step": 320078, "epoch": 3856} {"train_loss": -25.714889526367188, "global_step": 320079, "epoch": 3856} {"train_loss": -25.72747230529785, "global_step": 320080, "epoch": 3856} {"train_loss": -25.970569610595703, "global_step": 320081, "epoch": 3856} {"train_loss": -25.524877548217773, "global_step": 320082, "epoch": 3856} {"train_loss": -25.857868194580078, "global_step": 320083, "epoch": 3856} {"train_loss": -25.92378044128418, "global_step": 320084, "epoch": 3856} {"train_loss": -25.766864776611328, "global_step": 320085, "epoch": 3856} {"train_loss": -25.67144203186035, "global_step": 320086, "epoch": 3856} {"train_loss": -25.847082138061523, "global_step": 320087, "epoch": 3856} {"train_loss": -26.239990234375, "global_step": 320088, "epoch": 3856} {"train_loss": -26.053373336791992, "global_step": 320089, "epoch": 3856} {"train_loss": -25.706945419311523, "global_step": 320090, "epoch": 3856} {"train_loss": -25.813451766967773, "global_step": 320091, "epoch": 3856} {"train_loss": -26.001026153564453, "global_step": 320092, "epoch": 3856} {"train_loss": -25.580860137939453, "global_step": 320093, "epoch": 3856} {"train_loss": -25.862884521484375, "global_step": 320094, "epoch": 3856} {"train_loss": -25.90396499633789, "global_step": 320095, "epoch": 3856} {"train_loss": -25.793729782104492, "global_step": 320096, "epoch": 3856} {"train_loss": -25.576671600341797, "global_step": 320097, "epoch": 3856} {"train_loss": -25.422574996948242, "global_step": 320098, "epoch": 3856} {"train_loss": -25.76801872253418, "global_step": 320099, "epoch": 3856} {"train_loss": -25.835952758789062, "global_step": 320100, "epoch": 3856} {"train_loss": -25.89066505432129, "global_step": 320101, "epoch": 3856} {"train_loss": -25.843017578125, "global_step": 320102, "epoch": 3856} {"train_loss": -25.6418514251709, "global_step": 320103, "epoch": 3856} {"train_loss": -26.055410385131836, "global_step": 320104, "epoch": 3856} {"train_loss": -26.28888511657715, "global_step": 320105, "epoch": 3856} {"train_loss": -25.654083251953125, "global_step": 320106, "epoch": 3856} {"train_loss": -25.75052833557129, "global_step": 320107, "epoch": 3856} {"train_loss": -25.86707878112793, "global_step": 320108, "epoch": 3856} {"train_loss": -25.80372428894043, "global_step": 320109, "epoch": 3856} {"train_loss": -26.44205093383789, "global_step": 320110, "epoch": 3856} {"train_loss": -25.727527618408203, "global_step": 320111, "epoch": 3856} {"train_loss": -26.2120361328125, "global_step": 320112, "epoch": 3856} {"train_loss": -26.091388702392578, "global_step": 320113, "epoch": 3856} {"train_loss": -25.900115966796875, "global_step": 320114, "epoch": 3856} {"train_loss": -26.310169219970703, "global_step": 320115, "epoch": 3856} {"train_loss": -26.308704376220703, "global_step": 320116, "epoch": 3856} {"train_loss": -25.916339874267578, "global_step": 320117, "epoch": 3856} {"train_loss": -25.85438346862793, "global_step": 320118, "epoch": 3856} {"train_loss": -26.1513729095459, "global_step": 320119, "epoch": 3856} {"train_loss": -25.60822105407715, "global_step": 320120, "epoch": 3856} {"train_loss": -26.06149673461914, "global_step": 320121, "epoch": 3856} {"train_loss": -26.044401168823242, "global_step": 320122, "epoch": 3856} {"train_loss": -25.756027221679688, "global_step": 320123, "epoch": 3856} {"train_loss": -26.169397354125977, "global_step": 320124, "epoch": 3856} {"train_loss": -26.1387882232666, "global_step": 320125, "epoch": 3856} {"train_loss": -26.265735626220703, "global_step": 320126, "epoch": 3856} {"train_loss": -25.852832794189453, "global_step": 320127, "epoch": 3856} {"train_loss": -26.2562198638916, "global_step": 320128, "epoch": 3856} {"train_loss": -25.696985244750977, "global_step": 320129, "epoch": 3856} {"train_loss": -25.572996874889697, "global_step": 320130, "epoch": 3856, "val_loss": 7338673.0} {"train_loss": -25.215259552001953, "global_step": 320131, "epoch": 3857} {"train_loss": -25.054885864257812, "global_step": 320132, "epoch": 3857} {"train_loss": -24.392902374267578, "global_step": 320133, "epoch": 3857} {"train_loss": -24.833829879760742, "global_step": 320134, "epoch": 3857} {"train_loss": -24.74615478515625, "global_step": 320135, "epoch": 3857} {"train_loss": -25.419878005981445, "global_step": 320136, "epoch": 3857} {"train_loss": -24.642057418823242, "global_step": 320137, "epoch": 3857} {"train_loss": -24.878393173217773, "global_step": 320138, "epoch": 3857} {"train_loss": -25.372243881225586, "global_step": 320139, "epoch": 3857} {"train_loss": -25.16438102722168, "global_step": 320140, "epoch": 3857} {"train_loss": -25.343544006347656, "global_step": 320141, "epoch": 3857} {"train_loss": -25.422882080078125, "global_step": 320142, "epoch": 3857} {"train_loss": -24.792316436767578, "global_step": 320143, "epoch": 3857} {"train_loss": -25.24878692626953, "global_step": 320144, "epoch": 3857} {"train_loss": -25.59943199157715, "global_step": 320145, "epoch": 3857} {"train_loss": -25.307052612304688, "global_step": 320146, "epoch": 3857} {"train_loss": -25.3364315032959, "global_step": 320147, "epoch": 3857} {"train_loss": -25.67002296447754, "global_step": 320148, "epoch": 3857} {"train_loss": -25.427749633789062, "global_step": 320149, "epoch": 3857} {"train_loss": -25.182086944580078, "global_step": 320150, "epoch": 3857} {"train_loss": -25.3018741607666, "global_step": 320151, "epoch": 3857} {"train_loss": -25.385656356811523, "global_step": 320152, "epoch": 3857} {"train_loss": -25.95440673828125, "global_step": 320153, "epoch": 3857} {"train_loss": -25.600021362304688, "global_step": 320154, "epoch": 3857} {"train_loss": -25.61982536315918, "global_step": 320155, "epoch": 3857} {"train_loss": -25.751346588134766, "global_step": 320156, "epoch": 3857} {"train_loss": -25.699377059936523, "global_step": 320157, "epoch": 3857} {"train_loss": -25.56646728515625, "global_step": 320158, "epoch": 3857} {"train_loss": -25.865753173828125, "global_step": 320159, "epoch": 3857} {"train_loss": -25.514944076538086, "global_step": 320160, "epoch": 3857} {"train_loss": -25.814233779907227, "global_step": 320161, "epoch": 3857} {"train_loss": -25.952747344970703, "global_step": 320162, "epoch": 3857} {"train_loss": -25.983901977539062, "global_step": 320163, "epoch": 3857} {"train_loss": -25.72391128540039, "global_step": 320164, "epoch": 3857} {"train_loss": -25.651411056518555, "global_step": 320165, "epoch": 3857} {"train_loss": -25.72369956970215, "global_step": 320166, "epoch": 3857} {"train_loss": -25.9190616607666, "global_step": 320167, "epoch": 3857} {"train_loss": -26.086746215820312, "global_step": 320168, "epoch": 3857} {"train_loss": -25.806720733642578, "global_step": 320169, "epoch": 3857} {"train_loss": -25.737106323242188, "global_step": 320170, "epoch": 3857} {"train_loss": -25.69732093811035, "global_step": 320171, "epoch": 3857} {"train_loss": -26.018787384033203, "global_step": 320172, "epoch": 3857} {"train_loss": -25.725278854370117, "global_step": 320173, "epoch": 3857} {"train_loss": -25.8193359375, "global_step": 320174, "epoch": 3857} {"train_loss": -26.137022018432617, "global_step": 320175, "epoch": 3857} {"train_loss": -25.834339141845703, "global_step": 320176, "epoch": 3857} {"train_loss": -25.6898136138916, "global_step": 320177, "epoch": 3857} {"train_loss": -26.282697677612305, "global_step": 320178, "epoch": 3857} {"train_loss": -26.410968780517578, "global_step": 320179, "epoch": 3857} {"train_loss": -26.18848991394043, "global_step": 320180, "epoch": 3857} {"train_loss": -26.3057804107666, "global_step": 320181, "epoch": 3857} {"train_loss": -26.240127563476562, "global_step": 320182, "epoch": 3857} {"train_loss": -26.39033317565918, "global_step": 320183, "epoch": 3857} {"train_loss": -25.790449142456055, "global_step": 320184, "epoch": 3857} {"train_loss": -26.243762969970703, "global_step": 320185, "epoch": 3857} {"train_loss": -25.74042320251465, "global_step": 320186, "epoch": 3857} {"train_loss": -26.47233009338379, "global_step": 320187, "epoch": 3857} {"train_loss": -25.942243576049805, "global_step": 320188, "epoch": 3857} {"train_loss": -26.342809677124023, "global_step": 320189, "epoch": 3857} {"train_loss": -26.315444946289062, "global_step": 320190, "epoch": 3857} {"train_loss": -26.112030029296875, "global_step": 320191, "epoch": 3857} {"train_loss": -25.950916290283203, "global_step": 320192, "epoch": 3857} {"train_loss": -26.046661376953125, "global_step": 320193, "epoch": 3857} {"train_loss": -25.788572311401367, "global_step": 320194, "epoch": 3857} {"train_loss": -26.201452255249023, "global_step": 320195, "epoch": 3857} {"train_loss": -25.966405868530273, "global_step": 320196, "epoch": 3857} {"train_loss": -26.177570343017578, "global_step": 320197, "epoch": 3857} {"train_loss": -26.152082443237305, "global_step": 320198, "epoch": 3857} {"train_loss": -25.922422409057617, "global_step": 320199, "epoch": 3857} {"train_loss": -26.1297550201416, "global_step": 320200, "epoch": 3857} {"train_loss": -25.883752822875977, "global_step": 320201, "epoch": 3857} {"train_loss": -26.07899284362793, "global_step": 320202, "epoch": 3857} {"train_loss": -25.986083984375, "global_step": 320203, "epoch": 3857} {"train_loss": -25.8746280670166, "global_step": 320204, "epoch": 3857} {"train_loss": -25.63665199279785, "global_step": 320205, "epoch": 3857} {"train_loss": -25.714502334594727, "global_step": 320206, "epoch": 3857} {"train_loss": -25.818769454956055, "global_step": 320207, "epoch": 3857} {"train_loss": -25.624786376953125, "global_step": 320208, "epoch": 3857} {"train_loss": -25.171396255493164, "global_step": 320209, "epoch": 3857} {"train_loss": -25.065595626831055, "global_step": 320210, "epoch": 3857} {"train_loss": -25.207609176635742, "global_step": 320211, "epoch": 3857} {"train_loss": -25.552419662475586, "global_step": 320212, "epoch": 3857} {"train_loss": -25.69327352133142, "global_step": 320213, "epoch": 3857, "val_loss": 7313476.5} {"train_loss": -25.177309036254883, "global_step": 320214, "epoch": 3858} {"train_loss": -25.2362117767334, "global_step": 320215, "epoch": 3858} {"train_loss": -25.565494537353516, "global_step": 320216, "epoch": 3858} {"train_loss": -25.191679000854492, "global_step": 320217, "epoch": 3858} {"train_loss": -25.560747146606445, "global_step": 320218, "epoch": 3858} {"train_loss": -25.138872146606445, "global_step": 320219, "epoch": 3858} {"train_loss": -25.43393325805664, "global_step": 320220, "epoch": 3858} {"train_loss": -25.216352462768555, "global_step": 320221, "epoch": 3858} {"train_loss": -25.497365951538086, "global_step": 320222, "epoch": 3858} {"train_loss": -25.359594345092773, "global_step": 320223, "epoch": 3858} {"train_loss": -25.677900314331055, "global_step": 320224, "epoch": 3858} {"train_loss": -25.138402938842773, "global_step": 320225, "epoch": 3858} {"train_loss": -25.5830135345459, "global_step": 320226, "epoch": 3858} {"train_loss": -25.429569244384766, "global_step": 320227, "epoch": 3858} {"train_loss": -25.784820556640625, "global_step": 320228, "epoch": 3858} {"train_loss": -25.9156436920166, "global_step": 320229, "epoch": 3858} {"train_loss": -25.097558975219727, "global_step": 320230, "epoch": 3858} {"train_loss": -25.703445434570312, "global_step": 320231, "epoch": 3858} {"train_loss": -25.2998104095459, "global_step": 320232, "epoch": 3858} {"train_loss": -25.879980087280273, "global_step": 320233, "epoch": 3858} {"train_loss": -25.8803768157959, "global_step": 320234, "epoch": 3858} {"train_loss": -25.823028564453125, "global_step": 320235, "epoch": 3858} {"train_loss": -25.518980026245117, "global_step": 320236, "epoch": 3858} {"train_loss": -25.59147071838379, "global_step": 320237, "epoch": 3858} {"train_loss": -25.877166748046875, "global_step": 320238, "epoch": 3858} {"train_loss": -25.925012588500977, "global_step": 320239, "epoch": 3858} {"train_loss": -25.85691261291504, "global_step": 320240, "epoch": 3858} {"train_loss": -25.785261154174805, "global_step": 320241, "epoch": 3858} {"train_loss": -25.866912841796875, "global_step": 320242, "epoch": 3858} {"train_loss": -25.85470962524414, "global_step": 320243, "epoch": 3858} {"train_loss": -26.07474136352539, "global_step": 320244, "epoch": 3858} {"train_loss": -25.890905380249023, "global_step": 320245, "epoch": 3858} {"train_loss": -25.567615509033203, "global_step": 320246, "epoch": 3858} {"train_loss": -26.086774826049805, "global_step": 320247, "epoch": 3858} {"train_loss": -25.550121307373047, "global_step": 320248, "epoch": 3858} {"train_loss": -25.612695693969727, "global_step": 320249, "epoch": 3858} {"train_loss": -25.78264808654785, "global_step": 320250, "epoch": 3858} {"train_loss": -25.919599533081055, "global_step": 320251, "epoch": 3858} {"train_loss": -25.721820831298828, "global_step": 320252, "epoch": 3858} {"train_loss": -25.687097549438477, "global_step": 320253, "epoch": 3858} {"train_loss": -25.242626190185547, "global_step": 320254, "epoch": 3858} {"train_loss": -26.083093643188477, "global_step": 320255, "epoch": 3858} {"train_loss": -25.64458656311035, "global_step": 320256, "epoch": 3858} {"train_loss": -25.733016967773438, "global_step": 320257, "epoch": 3858} {"train_loss": -26.154937744140625, "global_step": 320258, "epoch": 3858} {"train_loss": -25.744123458862305, "global_step": 320259, "epoch": 3858} {"train_loss": -25.798572540283203, "global_step": 320260, "epoch": 3858} {"train_loss": -25.667917251586914, "global_step": 320261, "epoch": 3858} {"train_loss": -25.59433937072754, "global_step": 320262, "epoch": 3858} {"train_loss": -26.110797882080078, "global_step": 320263, "epoch": 3858} {"train_loss": -25.896900177001953, "global_step": 320264, "epoch": 3858} {"train_loss": -25.835037231445312, "global_step": 320265, "epoch": 3858} {"train_loss": -25.7452335357666, "global_step": 320266, "epoch": 3858} {"train_loss": -25.616790771484375, "global_step": 320267, "epoch": 3858} {"train_loss": -25.971967697143555, "global_step": 320268, "epoch": 3858} {"train_loss": -25.807058334350586, "global_step": 320269, "epoch": 3858} {"train_loss": -25.803394317626953, "global_step": 320270, "epoch": 3858} {"train_loss": -25.960657119750977, "global_step": 320271, "epoch": 3858} {"train_loss": -25.7721004486084, "global_step": 320272, "epoch": 3858} {"train_loss": -25.89655876159668, "global_step": 320273, "epoch": 3858} {"train_loss": -26.020099639892578, "global_step": 320274, "epoch": 3858} {"train_loss": -26.260974884033203, "global_step": 320275, "epoch": 3858} {"train_loss": -25.866918563842773, "global_step": 320276, "epoch": 3858} {"train_loss": -25.694135665893555, "global_step": 320277, "epoch": 3858} {"train_loss": -25.76350212097168, "global_step": 320278, "epoch": 3858} {"train_loss": -25.325468063354492, "global_step": 320279, "epoch": 3858} {"train_loss": -25.559980392456055, "global_step": 320280, "epoch": 3858} {"train_loss": -25.65595054626465, "global_step": 320281, "epoch": 3858} {"train_loss": -25.684417724609375, "global_step": 320282, "epoch": 3858} {"train_loss": -25.9627628326416, "global_step": 320283, "epoch": 3858} {"train_loss": -26.367843627929688, "global_step": 320284, "epoch": 3858} {"train_loss": -26.316547393798828, "global_step": 320285, "epoch": 3858} {"train_loss": -25.93631935119629, "global_step": 320286, "epoch": 3858} {"train_loss": -26.141416549682617, "global_step": 320287, "epoch": 3858} {"train_loss": -26.13421058654785, "global_step": 320288, "epoch": 3858} {"train_loss": -25.709228515625, "global_step": 320289, "epoch": 3858} {"train_loss": -25.962690353393555, "global_step": 320290, "epoch": 3858} {"train_loss": -25.817312240600586, "global_step": 320291, "epoch": 3858} {"train_loss": -25.9420166015625, "global_step": 320292, "epoch": 3858} {"train_loss": -26.430566787719727, "global_step": 320293, "epoch": 3858} {"train_loss": -25.8823184967041, "global_step": 320294, "epoch": 3858} {"train_loss": -26.076065063476562, "global_step": 320295, "epoch": 3858} {"train_loss": -25.767807167696667, "global_step": 320296, "epoch": 3858, "val_loss": 7331186.5} {"train_loss": -25.50518226623535, "global_step": 320297, "epoch": 3859} {"train_loss": -25.18023109436035, "global_step": 320298, "epoch": 3859} {"train_loss": -25.001583099365234, "global_step": 320299, "epoch": 3859} {"train_loss": -24.68869972229004, "global_step": 320300, "epoch": 3859} {"train_loss": -24.336484909057617, "global_step": 320301, "epoch": 3859} {"train_loss": -24.964256286621094, "global_step": 320302, "epoch": 3859} {"train_loss": -25.43892478942871, "global_step": 320303, "epoch": 3859} {"train_loss": -25.171279907226562, "global_step": 320304, "epoch": 3859} {"train_loss": -24.9566650390625, "global_step": 320305, "epoch": 3859} {"train_loss": -25.609350204467773, "global_step": 320306, "epoch": 3859} {"train_loss": -25.531553268432617, "global_step": 320307, "epoch": 3859} {"train_loss": -25.74201774597168, "global_step": 320308, "epoch": 3859} {"train_loss": -25.54315948486328, "global_step": 320309, "epoch": 3859} {"train_loss": -25.908004760742188, "global_step": 320310, "epoch": 3859} {"train_loss": -25.865116119384766, "global_step": 320311, "epoch": 3859} {"train_loss": -25.707406997680664, "global_step": 320312, "epoch": 3859} {"train_loss": -25.301239013671875, "global_step": 320313, "epoch": 3859} {"train_loss": -25.336776733398438, "global_step": 320314, "epoch": 3859} {"train_loss": -25.730573654174805, "global_step": 320315, "epoch": 3859} {"train_loss": -25.690704345703125, "global_step": 320316, "epoch": 3859} {"train_loss": -25.9068660736084, "global_step": 320317, "epoch": 3859} {"train_loss": -25.493642807006836, "global_step": 320318, "epoch": 3859} {"train_loss": -25.82024574279785, "global_step": 320319, "epoch": 3859} {"train_loss": -25.638952255249023, "global_step": 320320, "epoch": 3859} {"train_loss": -25.547122955322266, "global_step": 320321, "epoch": 3859} {"train_loss": -25.751419067382812, "global_step": 320322, "epoch": 3859} {"train_loss": -25.898923873901367, "global_step": 320323, "epoch": 3859} {"train_loss": -25.665246963500977, "global_step": 320324, "epoch": 3859} {"train_loss": -25.77996253967285, "global_step": 320325, "epoch": 3859} {"train_loss": -26.0380916595459, "global_step": 320326, "epoch": 3859} {"train_loss": -26.268482208251953, "global_step": 320327, "epoch": 3859} {"train_loss": -26.413272857666016, "global_step": 320328, "epoch": 3859} {"train_loss": -26.170001983642578, "global_step": 320329, "epoch": 3859} {"train_loss": -26.374235153198242, "global_step": 320330, "epoch": 3859} {"train_loss": -25.833911895751953, "global_step": 320331, "epoch": 3859} {"train_loss": -25.845123291015625, "global_step": 320332, "epoch": 3859} {"train_loss": -25.529027938842773, "global_step": 320333, "epoch": 3859} {"train_loss": -25.782611846923828, "global_step": 320334, "epoch": 3859} {"train_loss": -26.14752197265625, "global_step": 320335, "epoch": 3859} {"train_loss": -25.818639755249023, "global_step": 320336, "epoch": 3859} {"train_loss": -26.047962188720703, "global_step": 320337, "epoch": 3859} {"train_loss": -26.028369903564453, "global_step": 320338, "epoch": 3859} {"train_loss": -26.299274444580078, "global_step": 320339, "epoch": 3859} {"train_loss": -25.949237823486328, "global_step": 320340, "epoch": 3859} {"train_loss": -26.204885482788086, "global_step": 320341, "epoch": 3859} {"train_loss": -26.222259521484375, "global_step": 320342, "epoch": 3859} {"train_loss": -26.062814712524414, "global_step": 320343, "epoch": 3859} {"train_loss": -25.68475914001465, "global_step": 320344, "epoch": 3859} {"train_loss": -26.324682235717773, "global_step": 320345, "epoch": 3859} {"train_loss": -26.067127227783203, "global_step": 320346, "epoch": 3859} {"train_loss": -26.019765853881836, "global_step": 320347, "epoch": 3859} {"train_loss": -25.68048667907715, "global_step": 320348, "epoch": 3859} {"train_loss": -26.06170082092285, "global_step": 320349, "epoch": 3859} {"train_loss": -25.99152946472168, "global_step": 320350, "epoch": 3859} {"train_loss": -25.811017990112305, "global_step": 320351, "epoch": 3859} {"train_loss": -26.058246612548828, "global_step": 320352, "epoch": 3859} {"train_loss": -26.101160049438477, "global_step": 320353, "epoch": 3859} {"train_loss": -26.222858428955078, "global_step": 320354, "epoch": 3859} {"train_loss": -25.850549697875977, "global_step": 320355, "epoch": 3859} {"train_loss": -26.165433883666992, "global_step": 320356, "epoch": 3859} {"train_loss": -26.04630470275879, "global_step": 320357, "epoch": 3859} {"train_loss": -25.77370262145996, "global_step": 320358, "epoch": 3859} {"train_loss": -25.704761505126953, "global_step": 320359, "epoch": 3859} {"train_loss": -25.602813720703125, "global_step": 320360, "epoch": 3859} {"train_loss": -25.606733322143555, "global_step": 320361, "epoch": 3859} {"train_loss": -25.875141143798828, "global_step": 320362, "epoch": 3859} {"train_loss": -25.718774795532227, "global_step": 320363, "epoch": 3859} {"train_loss": -26.244220733642578, "global_step": 320364, "epoch": 3859} {"train_loss": -25.862409591674805, "global_step": 320365, "epoch": 3859} {"train_loss": -25.88618278503418, "global_step": 320366, "epoch": 3859} {"train_loss": -25.8801326751709, "global_step": 320367, "epoch": 3859} {"train_loss": -25.92806053161621, "global_step": 320368, "epoch": 3859} {"train_loss": -26.155309677124023, "global_step": 320369, "epoch": 3859} {"train_loss": -25.587825775146484, "global_step": 320370, "epoch": 3859} {"train_loss": -25.629377365112305, "global_step": 320371, "epoch": 3859} {"train_loss": -25.632160186767578, "global_step": 320372, "epoch": 3859} {"train_loss": -25.66975975036621, "global_step": 320373, "epoch": 3859} {"train_loss": -25.73135757446289, "global_step": 320374, "epoch": 3859} {"train_loss": -25.724878311157227, "global_step": 320375, "epoch": 3859} {"train_loss": -25.634326934814453, "global_step": 320376, "epoch": 3859} {"train_loss": -25.822275161743164, "global_step": 320377, "epoch": 3859} {"train_loss": -25.9637451171875, "global_step": 320378, "epoch": 3859} {"train_loss": -25.774740586797876, "global_step": 320379, "epoch": 3859, "val_loss": 7120617.0} {"train_loss": -25.656675338745117, "global_step": 320380, "epoch": 3860} {"train_loss": -25.62737464904785, "global_step": 320381, "epoch": 3860} {"train_loss": -25.438343048095703, "global_step": 320382, "epoch": 3860} {"train_loss": -25.5579776763916, "global_step": 320383, "epoch": 3860} {"train_loss": -25.3216609954834, "global_step": 320384, "epoch": 3860} {"train_loss": -25.84657096862793, "global_step": 320385, "epoch": 3860} {"train_loss": -25.49660301208496, "global_step": 320386, "epoch": 3860} {"train_loss": -25.551124572753906, "global_step": 320387, "epoch": 3860} {"train_loss": -25.97357749938965, "global_step": 320388, "epoch": 3860} {"train_loss": -25.356245040893555, "global_step": 320389, "epoch": 3860} {"train_loss": -25.45359992980957, "global_step": 320390, "epoch": 3860} {"train_loss": -25.931623458862305, "global_step": 320391, "epoch": 3860} {"train_loss": -26.2445011138916, "global_step": 320392, "epoch": 3860} {"train_loss": -25.956281661987305, "global_step": 320393, "epoch": 3860} {"train_loss": -25.924930572509766, "global_step": 320394, "epoch": 3860} {"train_loss": -25.733320236206055, "global_step": 320395, "epoch": 3860} {"train_loss": -25.8795223236084, "global_step": 320396, "epoch": 3860} {"train_loss": -25.920637130737305, "global_step": 320397, "epoch": 3860} {"train_loss": -25.830976486206055, "global_step": 320398, "epoch": 3860} {"train_loss": -25.726301193237305, "global_step": 320399, "epoch": 3860} {"train_loss": -25.649551391601562, "global_step": 320400, "epoch": 3860} {"train_loss": -25.987497329711914, "global_step": 320401, "epoch": 3860} {"train_loss": -25.58176612854004, "global_step": 320402, "epoch": 3860} {"train_loss": -25.574247360229492, "global_step": 320403, "epoch": 3860} {"train_loss": -25.75237464904785, "global_step": 320404, "epoch": 3860} {"train_loss": -25.9445743560791, "global_step": 320405, "epoch": 3860} {"train_loss": -26.195703506469727, "global_step": 320406, "epoch": 3860} {"train_loss": -25.8210506439209, "global_step": 320407, "epoch": 3860} {"train_loss": -25.70086669921875, "global_step": 320408, "epoch": 3860} {"train_loss": -25.79422950744629, "global_step": 320409, "epoch": 3860} {"train_loss": -25.581571578979492, "global_step": 320410, "epoch": 3860} {"train_loss": -25.650320053100586, "global_step": 320411, "epoch": 3860} {"train_loss": -25.92083168029785, "global_step": 320412, "epoch": 3860} {"train_loss": -25.884613037109375, "global_step": 320413, "epoch": 3860} {"train_loss": -26.085723876953125, "global_step": 320414, "epoch": 3860} {"train_loss": -25.79218101501465, "global_step": 320415, "epoch": 3860} {"train_loss": -25.79277992248535, "global_step": 320416, "epoch": 3860} {"train_loss": -25.818429946899414, "global_step": 320417, "epoch": 3860} {"train_loss": -25.8622989654541, "global_step": 320418, "epoch": 3860} {"train_loss": -26.137048721313477, "global_step": 320419, "epoch": 3860} {"train_loss": -25.84600830078125, "global_step": 320420, "epoch": 3860} {"train_loss": -26.001794815063477, "global_step": 320421, "epoch": 3860} {"train_loss": -25.835851669311523, "global_step": 320422, "epoch": 3860} {"train_loss": -25.99410057067871, "global_step": 320423, "epoch": 3860} {"train_loss": -25.365909576416016, "global_step": 320424, "epoch": 3860} {"train_loss": -25.70115089416504, "global_step": 320425, "epoch": 3860} {"train_loss": -26.05597496032715, "global_step": 320426, "epoch": 3860} {"train_loss": -26.094892501831055, "global_step": 320427, "epoch": 3860} {"train_loss": -25.545272827148438, "global_step": 320428, "epoch": 3860} {"train_loss": -25.789377212524414, "global_step": 320429, "epoch": 3860} {"train_loss": -25.640186309814453, "global_step": 320430, "epoch": 3860} {"train_loss": -25.806354522705078, "global_step": 320431, "epoch": 3860} {"train_loss": -26.066205978393555, "global_step": 320432, "epoch": 3860} {"train_loss": -25.177268981933594, "global_step": 320433, "epoch": 3860} {"train_loss": -25.397594451904297, "global_step": 320434, "epoch": 3860} {"train_loss": -25.95265007019043, "global_step": 320435, "epoch": 3860} {"train_loss": -25.626819610595703, "global_step": 320436, "epoch": 3860} {"train_loss": -26.10357093811035, "global_step": 320437, "epoch": 3860} {"train_loss": -25.751510620117188, "global_step": 320438, "epoch": 3860} {"train_loss": -25.767850875854492, "global_step": 320439, "epoch": 3860} {"train_loss": -25.747802734375, "global_step": 320440, "epoch": 3860} {"train_loss": -25.751989364624023, "global_step": 320441, "epoch": 3860} {"train_loss": -25.642385482788086, "global_step": 320442, "epoch": 3860} {"train_loss": -26.00214195251465, "global_step": 320443, "epoch": 3860} {"train_loss": -25.82941246032715, "global_step": 320444, "epoch": 3860} {"train_loss": -25.78040885925293, "global_step": 320445, "epoch": 3860} {"train_loss": -25.53390884399414, "global_step": 320446, "epoch": 3860} {"train_loss": -25.81525230407715, "global_step": 320447, "epoch": 3860} {"train_loss": -25.94961929321289, "global_step": 320448, "epoch": 3860} {"train_loss": -25.921772003173828, "global_step": 320449, "epoch": 3860} {"train_loss": -26.135404586791992, "global_step": 320450, "epoch": 3860} {"train_loss": -25.758527755737305, "global_step": 320451, "epoch": 3860} {"train_loss": -25.93692398071289, "global_step": 320452, "epoch": 3860} {"train_loss": -26.23447036743164, "global_step": 320453, "epoch": 3860} {"train_loss": -25.920080184936523, "global_step": 320454, "epoch": 3860} {"train_loss": -25.8937931060791, "global_step": 320455, "epoch": 3860} {"train_loss": -25.76204490661621, "global_step": 320456, "epoch": 3860} {"train_loss": -26.072301864624023, "global_step": 320457, "epoch": 3860} {"train_loss": -25.89166259765625, "global_step": 320458, "epoch": 3860} {"train_loss": -26.157135009765625, "global_step": 320459, "epoch": 3860} {"train_loss": -25.988941192626953, "global_step": 320460, "epoch": 3860} {"train_loss": -25.935382843017578, "global_step": 320461, "epoch": 3860} {"train_loss": -25.811642980001057, "global_step": 320462, "epoch": 3860, "val_loss": 7145618.0} {"train_loss": -24.162282943725586, "global_step": 320463, "epoch": 3861} {"train_loss": -24.041154861450195, "global_step": 320464, "epoch": 3861} {"train_loss": -25.2602481842041, "global_step": 320465, "epoch": 3861} {"train_loss": -24.975126266479492, "global_step": 320466, "epoch": 3861} {"train_loss": -24.33041763305664, "global_step": 320467, "epoch": 3861} {"train_loss": -25.487380981445312, "global_step": 320468, "epoch": 3861} {"train_loss": -25.274267196655273, "global_step": 320469, "epoch": 3861} {"train_loss": -25.263296127319336, "global_step": 320470, "epoch": 3861} {"train_loss": -25.63714599609375, "global_step": 320471, "epoch": 3861} {"train_loss": -25.870283126831055, "global_step": 320472, "epoch": 3861} {"train_loss": -25.410730361938477, "global_step": 320473, "epoch": 3861} {"train_loss": -25.43608856201172, "global_step": 320474, "epoch": 3861} {"train_loss": -25.26167869567871, "global_step": 320475, "epoch": 3861} {"train_loss": -25.28584098815918, "global_step": 320476, "epoch": 3861} {"train_loss": -25.506925582885742, "global_step": 320477, "epoch": 3861} {"train_loss": -25.301687240600586, "global_step": 320478, "epoch": 3861} {"train_loss": -25.948780059814453, "global_step": 320479, "epoch": 3861} {"train_loss": -25.441333770751953, "global_step": 320480, "epoch": 3861} {"train_loss": -25.850006103515625, "global_step": 320481, "epoch": 3861} {"train_loss": -25.587364196777344, "global_step": 320482, "epoch": 3861} {"train_loss": -26.06007957458496, "global_step": 320483, "epoch": 3861} {"train_loss": -26.232471466064453, "global_step": 320484, "epoch": 3861} {"train_loss": -25.508546829223633, "global_step": 320485, "epoch": 3861} {"train_loss": -25.604318618774414, "global_step": 320486, "epoch": 3861} {"train_loss": -25.539447784423828, "global_step": 320487, "epoch": 3861} {"train_loss": -25.9622859954834, "global_step": 320488, "epoch": 3861} {"train_loss": -25.681140899658203, "global_step": 320489, "epoch": 3861} {"train_loss": -25.9531192779541, "global_step": 320490, "epoch": 3861} {"train_loss": -25.899805068969727, "global_step": 320491, "epoch": 3861} {"train_loss": -26.00994873046875, "global_step": 320492, "epoch": 3861} {"train_loss": -25.577190399169922, "global_step": 320493, "epoch": 3861} {"train_loss": -25.76105308532715, "global_step": 320494, "epoch": 3861} {"train_loss": -25.9852352142334, "global_step": 320495, "epoch": 3861} {"train_loss": -25.687803268432617, "global_step": 320496, "epoch": 3861} {"train_loss": -25.90351676940918, "global_step": 320497, "epoch": 3861} {"train_loss": -26.345998764038086, "global_step": 320498, "epoch": 3861} {"train_loss": -25.678281784057617, "global_step": 320499, "epoch": 3861} {"train_loss": -25.9755802154541, "global_step": 320500, "epoch": 3861} {"train_loss": -25.76856803894043, "global_step": 320501, "epoch": 3861} {"train_loss": -25.923864364624023, "global_step": 320502, "epoch": 3861} {"train_loss": -26.120458602905273, "global_step": 320503, "epoch": 3861} {"train_loss": -25.996662139892578, "global_step": 320504, "epoch": 3861} {"train_loss": -25.657413482666016, "global_step": 320505, "epoch": 3861} {"train_loss": -25.74346351623535, "global_step": 320506, "epoch": 3861} {"train_loss": -25.97052574157715, "global_step": 320507, "epoch": 3861} {"train_loss": -25.81446647644043, "global_step": 320508, "epoch": 3861} {"train_loss": -25.83436393737793, "global_step": 320509, "epoch": 3861} {"train_loss": -25.811553955078125, "global_step": 320510, "epoch": 3861} {"train_loss": -26.129302978515625, "global_step": 320511, "epoch": 3861} {"train_loss": -25.74493408203125, "global_step": 320512, "epoch": 3861} {"train_loss": -26.357938766479492, "global_step": 320513, "epoch": 3861} {"train_loss": -25.968006134033203, "global_step": 320514, "epoch": 3861} {"train_loss": -25.61627197265625, "global_step": 320515, "epoch": 3861} {"train_loss": -26.024267196655273, "global_step": 320516, "epoch": 3861} {"train_loss": -25.690732955932617, "global_step": 320517, "epoch": 3861} {"train_loss": -25.605819702148438, "global_step": 320518, "epoch": 3861} {"train_loss": -26.039770126342773, "global_step": 320519, "epoch": 3861} {"train_loss": -26.228952407836914, "global_step": 320520, "epoch": 3861} {"train_loss": -26.31202507019043, "global_step": 320521, "epoch": 3861} {"train_loss": -26.153751373291016, "global_step": 320522, "epoch": 3861} {"train_loss": -26.144474029541016, "global_step": 320523, "epoch": 3861} {"train_loss": -26.319944381713867, "global_step": 320524, "epoch": 3861} {"train_loss": -25.955997467041016, "global_step": 320525, "epoch": 3861} {"train_loss": -26.143091201782227, "global_step": 320526, "epoch": 3861} {"train_loss": -26.392160415649414, "global_step": 320527, "epoch": 3861} {"train_loss": -25.87680435180664, "global_step": 320528, "epoch": 3861} {"train_loss": -25.915494918823242, "global_step": 320529, "epoch": 3861} {"train_loss": -26.09930992126465, "global_step": 320530, "epoch": 3861} {"train_loss": -26.084836959838867, "global_step": 320531, "epoch": 3861} {"train_loss": -26.026052474975586, "global_step": 320532, "epoch": 3861} {"train_loss": -26.03912353515625, "global_step": 320533, "epoch": 3861} {"train_loss": -25.83949089050293, "global_step": 320534, "epoch": 3861} {"train_loss": -25.892688751220703, "global_step": 320535, "epoch": 3861} {"train_loss": -25.977970123291016, "global_step": 320536, "epoch": 3861} {"train_loss": -26.036285400390625, "global_step": 320537, "epoch": 3861} {"train_loss": -25.800931930541992, "global_step": 320538, "epoch": 3861} {"train_loss": -26.05457878112793, "global_step": 320539, "epoch": 3861} {"train_loss": -26.10341453552246, "global_step": 320540, "epoch": 3861} {"train_loss": -25.90472412109375, "global_step": 320541, "epoch": 3861} {"train_loss": -25.626306533813477, "global_step": 320542, "epoch": 3861} {"train_loss": -26.127161026000977, "global_step": 320543, "epoch": 3861} {"train_loss": -25.64039421081543, "global_step": 320544, "epoch": 3861} {"train_loss": -25.78119859350733, "global_step": 320545, "epoch": 3861, "val_loss": 7222374.0} {"train_loss": -25.59002685546875, "global_step": 320546, "epoch": 3862} {"train_loss": -25.851364135742188, "global_step": 320547, "epoch": 3862} {"train_loss": -25.756101608276367, "global_step": 320548, "epoch": 3862} {"train_loss": -25.5067081451416, "global_step": 320549, "epoch": 3862} {"train_loss": -25.329587936401367, "global_step": 320550, "epoch": 3862} {"train_loss": -25.631086349487305, "global_step": 320551, "epoch": 3862} {"train_loss": -25.535892486572266, "global_step": 320552, "epoch": 3862} {"train_loss": -25.74165153503418, "global_step": 320553, "epoch": 3862} {"train_loss": -25.567623138427734, "global_step": 320554, "epoch": 3862} {"train_loss": -25.390594482421875, "global_step": 320555, "epoch": 3862} {"train_loss": -25.97273063659668, "global_step": 320556, "epoch": 3862} {"train_loss": -25.605335235595703, "global_step": 320557, "epoch": 3862} {"train_loss": -26.023828506469727, "global_step": 320558, "epoch": 3862} {"train_loss": -25.663129806518555, "global_step": 320559, "epoch": 3862} {"train_loss": -25.55019187927246, "global_step": 320560, "epoch": 3862} {"train_loss": -25.960540771484375, "global_step": 320561, "epoch": 3862} {"train_loss": -25.844501495361328, "global_step": 320562, "epoch": 3862} {"train_loss": -25.85361671447754, "global_step": 320563, "epoch": 3862} {"train_loss": -25.8118839263916, "global_step": 320564, "epoch": 3862} {"train_loss": -25.79206657409668, "global_step": 320565, "epoch": 3862} {"train_loss": -25.911645889282227, "global_step": 320566, "epoch": 3862} {"train_loss": -25.812719345092773, "global_step": 320567, "epoch": 3862} {"train_loss": -25.66868019104004, "global_step": 320568, "epoch": 3862} {"train_loss": -26.117528915405273, "global_step": 320569, "epoch": 3862} {"train_loss": -25.47262954711914, "global_step": 320570, "epoch": 3862} {"train_loss": -25.60797119140625, "global_step": 320571, "epoch": 3862} {"train_loss": -25.70541763305664, "global_step": 320572, "epoch": 3862} {"train_loss": -25.6315860748291, "global_step": 320573, "epoch": 3862} {"train_loss": -26.20490074157715, "global_step": 320574, "epoch": 3862} {"train_loss": -25.989065170288086, "global_step": 320575, "epoch": 3862} {"train_loss": -25.771230697631836, "global_step": 320576, "epoch": 3862} {"train_loss": -25.9638614654541, "global_step": 320577, "epoch": 3862} {"train_loss": -26.05274772644043, "global_step": 320578, "epoch": 3862} {"train_loss": -26.261499404907227, "global_step": 320579, "epoch": 3862} {"train_loss": -26.148212432861328, "global_step": 320580, "epoch": 3862} {"train_loss": -25.722824096679688, "global_step": 320581, "epoch": 3862} {"train_loss": -25.61188316345215, "global_step": 320582, "epoch": 3862} {"train_loss": -25.999914169311523, "global_step": 320583, "epoch": 3862} {"train_loss": -25.94251823425293, "global_step": 320584, "epoch": 3862} {"train_loss": -25.7928524017334, "global_step": 320585, "epoch": 3862} {"train_loss": -25.868513107299805, "global_step": 320586, "epoch": 3862} {"train_loss": -25.51822853088379, "global_step": 320587, "epoch": 3862} {"train_loss": -25.777036666870117, "global_step": 320588, "epoch": 3862} {"train_loss": -25.897748947143555, "global_step": 320589, "epoch": 3862} {"train_loss": -26.149982452392578, "global_step": 320590, "epoch": 3862} {"train_loss": -25.897932052612305, "global_step": 320591, "epoch": 3862} {"train_loss": -25.861591339111328, "global_step": 320592, "epoch": 3862} {"train_loss": -25.904977798461914, "global_step": 320593, "epoch": 3862} {"train_loss": -26.157093048095703, "global_step": 320594, "epoch": 3862} {"train_loss": -25.74920654296875, "global_step": 320595, "epoch": 3862} {"train_loss": -25.715879440307617, "global_step": 320596, "epoch": 3862} {"train_loss": -25.559946060180664, "global_step": 320597, "epoch": 3862} {"train_loss": -25.852270126342773, "global_step": 320598, "epoch": 3862} {"train_loss": -25.493459701538086, "global_step": 320599, "epoch": 3862} {"train_loss": -25.90704345703125, "global_step": 320600, "epoch": 3862} {"train_loss": -25.7368221282959, "global_step": 320601, "epoch": 3862} {"train_loss": -26.061933517456055, "global_step": 320602, "epoch": 3862} {"train_loss": -26.1127986907959, "global_step": 320603, "epoch": 3862} {"train_loss": -25.9200382232666, "global_step": 320604, "epoch": 3862} {"train_loss": -25.932815551757812, "global_step": 320605, "epoch": 3862} {"train_loss": -26.083642959594727, "global_step": 320606, "epoch": 3862} {"train_loss": -26.03483009338379, "global_step": 320607, "epoch": 3862} {"train_loss": -25.891483306884766, "global_step": 320608, "epoch": 3862} {"train_loss": -25.790048599243164, "global_step": 320609, "epoch": 3862} {"train_loss": -25.86850929260254, "global_step": 320610, "epoch": 3862} {"train_loss": -25.982181549072266, "global_step": 320611, "epoch": 3862} {"train_loss": -26.1087646484375, "global_step": 320612, "epoch": 3862} {"train_loss": -25.9612979888916, "global_step": 320613, "epoch": 3862} {"train_loss": -25.926816940307617, "global_step": 320614, "epoch": 3862} {"train_loss": -26.13226318359375, "global_step": 320615, "epoch": 3862} {"train_loss": -26.27070426940918, "global_step": 320616, "epoch": 3862} {"train_loss": -25.54515838623047, "global_step": 320617, "epoch": 3862} {"train_loss": -25.905115127563477, "global_step": 320618, "epoch": 3862} {"train_loss": -26.230199813842773, "global_step": 320619, "epoch": 3862} {"train_loss": -26.22356605529785, "global_step": 320620, "epoch": 3862} {"train_loss": -25.56197166442871, "global_step": 320621, "epoch": 3862} {"train_loss": -26.025165557861328, "global_step": 320622, "epoch": 3862} {"train_loss": -25.752017974853516, "global_step": 320623, "epoch": 3862} {"train_loss": -25.556289672851562, "global_step": 320624, "epoch": 3862} {"train_loss": -25.640241622924805, "global_step": 320625, "epoch": 3862} {"train_loss": -25.92803955078125, "global_step": 320626, "epoch": 3862} {"train_loss": -25.6569766998291, "global_step": 320627, "epoch": 3862} {"train_loss": -25.832697695996387, "global_step": 320628, "epoch": 3862, "val_loss": 7197095.0} {"train_loss": -25.502046585083008, "global_step": 320629, "epoch": 3863} {"train_loss": -24.611297607421875, "global_step": 320630, "epoch": 3863} {"train_loss": -25.832189559936523, "global_step": 320631, "epoch": 3863} {"train_loss": -25.58810806274414, "global_step": 320632, "epoch": 3863} {"train_loss": -26.068012237548828, "global_step": 320633, "epoch": 3863} {"train_loss": -25.677600860595703, "global_step": 320634, "epoch": 3863} {"train_loss": -25.71150016784668, "global_step": 320635, "epoch": 3863} {"train_loss": -25.73076820373535, "global_step": 320636, "epoch": 3863} {"train_loss": -25.7510929107666, "global_step": 320637, "epoch": 3863} {"train_loss": -25.8516845703125, "global_step": 320638, "epoch": 3863} {"train_loss": -25.96803092956543, "global_step": 320639, "epoch": 3863} {"train_loss": -25.852792739868164, "global_step": 320640, "epoch": 3863} {"train_loss": -25.788379669189453, "global_step": 320641, "epoch": 3863} {"train_loss": -25.97083854675293, "global_step": 320642, "epoch": 3863} {"train_loss": -25.692392349243164, "global_step": 320643, "epoch": 3863} {"train_loss": -25.708209991455078, "global_step": 320644, "epoch": 3863} {"train_loss": -25.561742782592773, "global_step": 320645, "epoch": 3863} {"train_loss": -25.680429458618164, "global_step": 320646, "epoch": 3863} {"train_loss": -26.076568603515625, "global_step": 320647, "epoch": 3863} {"train_loss": -25.807636260986328, "global_step": 320648, "epoch": 3863} {"train_loss": -26.062421798706055, "global_step": 320649, "epoch": 3863} {"train_loss": -25.99982261657715, "global_step": 320650, "epoch": 3863} {"train_loss": -26.16999626159668, "global_step": 320651, "epoch": 3863} {"train_loss": -26.147705078125, "global_step": 320652, "epoch": 3863} {"train_loss": -25.897388458251953, "global_step": 320653, "epoch": 3863} {"train_loss": -25.547361373901367, "global_step": 320654, "epoch": 3863} {"train_loss": -25.748193740844727, "global_step": 320655, "epoch": 3863} {"train_loss": -25.856882095336914, "global_step": 320656, "epoch": 3863} {"train_loss": -25.996967315673828, "global_step": 320657, "epoch": 3863} {"train_loss": -25.908557891845703, "global_step": 320658, "epoch": 3863} {"train_loss": -25.88630485534668, "global_step": 320659, "epoch": 3863} {"train_loss": -25.90443229675293, "global_step": 320660, "epoch": 3863} {"train_loss": -26.123199462890625, "global_step": 320661, "epoch": 3863} {"train_loss": -26.1129150390625, "global_step": 320662, "epoch": 3863} {"train_loss": -25.74336051940918, "global_step": 320663, "epoch": 3863} {"train_loss": -25.855005264282227, "global_step": 320664, "epoch": 3863} {"train_loss": -26.140594482421875, "global_step": 320665, "epoch": 3863} {"train_loss": -26.15532875061035, "global_step": 320666, "epoch": 3863} {"train_loss": -25.901762008666992, "global_step": 320667, "epoch": 3863} {"train_loss": -26.29495620727539, "global_step": 320668, "epoch": 3863} {"train_loss": -26.356292724609375, "global_step": 320669, "epoch": 3863} {"train_loss": -25.942798614501953, "global_step": 320670, "epoch": 3863} {"train_loss": -25.929636001586914, "global_step": 320671, "epoch": 3863} {"train_loss": -26.064184188842773, "global_step": 320672, "epoch": 3863} {"train_loss": -25.88323974609375, "global_step": 320673, "epoch": 3863} {"train_loss": -26.098669052124023, "global_step": 320674, "epoch": 3863} {"train_loss": -26.352142333984375, "global_step": 320675, "epoch": 3863} {"train_loss": -26.29328727722168, "global_step": 320676, "epoch": 3863} {"train_loss": -26.396942138671875, "global_step": 320677, "epoch": 3863} {"train_loss": -26.155752182006836, "global_step": 320678, "epoch": 3863} {"train_loss": -26.051908493041992, "global_step": 320679, "epoch": 3863} {"train_loss": -25.843820571899414, "global_step": 320680, "epoch": 3863} {"train_loss": -25.731061935424805, "global_step": 320681, "epoch": 3863} {"train_loss": -26.19325828552246, "global_step": 320682, "epoch": 3863} {"train_loss": -25.97186851501465, "global_step": 320683, "epoch": 3863} {"train_loss": -25.863622665405273, "global_step": 320684, "epoch": 3863} {"train_loss": -25.800519943237305, "global_step": 320685, "epoch": 3863} {"train_loss": -25.650989532470703, "global_step": 320686, "epoch": 3863} {"train_loss": -25.635656356811523, "global_step": 320687, "epoch": 3863} {"train_loss": -25.624282836914062, "global_step": 320688, "epoch": 3863} {"train_loss": -26.011640548706055, "global_step": 320689, "epoch": 3863} {"train_loss": -25.852460861206055, "global_step": 320690, "epoch": 3863} {"train_loss": -25.32927894592285, "global_step": 320691, "epoch": 3863} {"train_loss": -24.383628845214844, "global_step": 320692, "epoch": 3863} {"train_loss": -24.369504928588867, "global_step": 320693, "epoch": 3863} {"train_loss": -24.062864303588867, "global_step": 320694, "epoch": 3863} {"train_loss": -24.941125869750977, "global_step": 320695, "epoch": 3863} {"train_loss": -25.49197769165039, "global_step": 320696, "epoch": 3863} {"train_loss": -25.391782760620117, "global_step": 320697, "epoch": 3863} {"train_loss": -25.507766723632812, "global_step": 320698, "epoch": 3863} {"train_loss": -25.727584838867188, "global_step": 320699, "epoch": 3863} {"train_loss": -25.659942626953125, "global_step": 320700, "epoch": 3863} {"train_loss": -25.285099029541016, "global_step": 320701, "epoch": 3863} {"train_loss": -25.88014030456543, "global_step": 320702, "epoch": 3863} {"train_loss": -25.073490142822266, "global_step": 320703, "epoch": 3863} {"train_loss": -25.513904571533203, "global_step": 320704, "epoch": 3863} {"train_loss": -25.652759552001953, "global_step": 320705, "epoch": 3863} {"train_loss": -25.70295524597168, "global_step": 320706, "epoch": 3863} {"train_loss": -25.46840476989746, "global_step": 320707, "epoch": 3863} {"train_loss": -25.062480926513672, "global_step": 320708, "epoch": 3863} {"train_loss": -25.68536949157715, "global_step": 320709, "epoch": 3863} {"train_loss": -25.583118438720703, "global_step": 320710, "epoch": 3863} {"train_loss": -25.742242996951184, "global_step": 320711, "epoch": 3863, "val_loss": 7155019.0} {"train_loss": -25.25289535522461, "global_step": 320712, "epoch": 3864} {"train_loss": -25.179716110229492, "global_step": 320713, "epoch": 3864} {"train_loss": -25.08758544921875, "global_step": 320714, "epoch": 3864} {"train_loss": -25.17162322998047, "global_step": 320715, "epoch": 3864} {"train_loss": -25.593923568725586, "global_step": 320716, "epoch": 3864} {"train_loss": -25.73712730407715, "global_step": 320717, "epoch": 3864} {"train_loss": -25.477252960205078, "global_step": 320718, "epoch": 3864} {"train_loss": -25.954925537109375, "global_step": 320719, "epoch": 3864} {"train_loss": -25.16164207458496, "global_step": 320720, "epoch": 3864} {"train_loss": -25.57798957824707, "global_step": 320721, "epoch": 3864} {"train_loss": -25.55154800415039, "global_step": 320722, "epoch": 3864} {"train_loss": -25.666173934936523, "global_step": 320723, "epoch": 3864} {"train_loss": -25.244346618652344, "global_step": 320724, "epoch": 3864} {"train_loss": -25.33441734313965, "global_step": 320725, "epoch": 3864} {"train_loss": -25.857013702392578, "global_step": 320726, "epoch": 3864} {"train_loss": -25.558252334594727, "global_step": 320727, "epoch": 3864} {"train_loss": -25.558761596679688, "global_step": 320728, "epoch": 3864} {"train_loss": -25.54291343688965, "global_step": 320729, "epoch": 3864} {"train_loss": -25.56039810180664, "global_step": 320730, "epoch": 3864} {"train_loss": -25.71243667602539, "global_step": 320731, "epoch": 3864} {"train_loss": -25.977224349975586, "global_step": 320732, "epoch": 3864} {"train_loss": -25.939594268798828, "global_step": 320733, "epoch": 3864} {"train_loss": -25.786855697631836, "global_step": 320734, "epoch": 3864} {"train_loss": -25.661752700805664, "global_step": 320735, "epoch": 3864} {"train_loss": -25.73639488220215, "global_step": 320736, "epoch": 3864} {"train_loss": -25.89631462097168, "global_step": 320737, "epoch": 3864} {"train_loss": -25.71268081665039, "global_step": 320738, "epoch": 3864} {"train_loss": -25.770984649658203, "global_step": 320739, "epoch": 3864} {"train_loss": -25.83660888671875, "global_step": 320740, "epoch": 3864} {"train_loss": -25.92787742614746, "global_step": 320741, "epoch": 3864} {"train_loss": -26.100317001342773, "global_step": 320742, "epoch": 3864} {"train_loss": -25.5788631439209, "global_step": 320743, "epoch": 3864} {"train_loss": -25.687713623046875, "global_step": 320744, "epoch": 3864} {"train_loss": -25.866357803344727, "global_step": 320745, "epoch": 3864} {"train_loss": -25.86655616760254, "global_step": 320746, "epoch": 3864} {"train_loss": -25.858661651611328, "global_step": 320747, "epoch": 3864} {"train_loss": -25.76814079284668, "global_step": 320748, "epoch": 3864} {"train_loss": -25.9742431640625, "global_step": 320749, "epoch": 3864} {"train_loss": -26.4560604095459, "global_step": 320750, "epoch": 3864} {"train_loss": -25.961389541625977, "global_step": 320751, "epoch": 3864} {"train_loss": -26.269250869750977, "global_step": 320752, "epoch": 3864} {"train_loss": -25.854406356811523, "global_step": 320753, "epoch": 3864} {"train_loss": -26.422595977783203, "global_step": 320754, "epoch": 3864} {"train_loss": -25.877145767211914, "global_step": 320755, "epoch": 3864} {"train_loss": -26.135910034179688, "global_step": 320756, "epoch": 3864} {"train_loss": -25.544803619384766, "global_step": 320757, "epoch": 3864} {"train_loss": -25.84644889831543, "global_step": 320758, "epoch": 3864} {"train_loss": -25.86737060546875, "global_step": 320759, "epoch": 3864} {"train_loss": -26.19253921508789, "global_step": 320760, "epoch": 3864} {"train_loss": -25.77268409729004, "global_step": 320761, "epoch": 3864} {"train_loss": -25.930612564086914, "global_step": 320762, "epoch": 3864} {"train_loss": -25.87152671813965, "global_step": 320763, "epoch": 3864} {"train_loss": -25.998926162719727, "global_step": 320764, "epoch": 3864} {"train_loss": -26.118335723876953, "global_step": 320765, "epoch": 3864} {"train_loss": -25.638517379760742, "global_step": 320766, "epoch": 3864} {"train_loss": -25.13193702697754, "global_step": 320767, "epoch": 3864} {"train_loss": -24.631168365478516, "global_step": 320768, "epoch": 3864} {"train_loss": -24.474748611450195, "global_step": 320769, "epoch": 3864} {"train_loss": -24.36431312561035, "global_step": 320770, "epoch": 3864} {"train_loss": -25.45956802368164, "global_step": 320771, "epoch": 3864} {"train_loss": -25.52187156677246, "global_step": 320772, "epoch": 3864} {"train_loss": -24.665815353393555, "global_step": 320773, "epoch": 3864} {"train_loss": -25.672941207885742, "global_step": 320774, "epoch": 3864} {"train_loss": -25.137781143188477, "global_step": 320775, "epoch": 3864} {"train_loss": -25.458120346069336, "global_step": 320776, "epoch": 3864} {"train_loss": -25.64106559753418, "global_step": 320777, "epoch": 3864} {"train_loss": -25.58490753173828, "global_step": 320778, "epoch": 3864} {"train_loss": -25.471975326538086, "global_step": 320779, "epoch": 3864} {"train_loss": -25.660037994384766, "global_step": 320780, "epoch": 3864} {"train_loss": -25.787927627563477, "global_step": 320781, "epoch": 3864} {"train_loss": -25.902149200439453, "global_step": 320782, "epoch": 3864} {"train_loss": -25.8126277923584, "global_step": 320783, "epoch": 3864} {"train_loss": -25.75947380065918, "global_step": 320784, "epoch": 3864} {"train_loss": -25.74749755859375, "global_step": 320785, "epoch": 3864} {"train_loss": -25.5257625579834, "global_step": 320786, "epoch": 3864} {"train_loss": -25.868391036987305, "global_step": 320787, "epoch": 3864} {"train_loss": -25.917449951171875, "global_step": 320788, "epoch": 3864} {"train_loss": -25.660825729370117, "global_step": 320789, "epoch": 3864} {"train_loss": -26.094816207885742, "global_step": 320790, "epoch": 3864} {"train_loss": -25.812702178955078, "global_step": 320791, "epoch": 3864} {"train_loss": -25.88482666015625, "global_step": 320792, "epoch": 3864} {"train_loss": -26.20171546936035, "global_step": 320793, "epoch": 3864} {"train_loss": -25.694703228502387, "global_step": 320794, "epoch": 3864, "val_loss": 7193143.0} {"train_loss": -24.49364471435547, "global_step": 320795, "epoch": 3865} {"train_loss": -25.004745483398438, "global_step": 320796, "epoch": 3865} {"train_loss": -25.174442291259766, "global_step": 320797, "epoch": 3865} {"train_loss": -25.287803649902344, "global_step": 320798, "epoch": 3865} {"train_loss": -25.206083297729492, "global_step": 320799, "epoch": 3865} {"train_loss": -25.298940658569336, "global_step": 320800, "epoch": 3865} {"train_loss": -25.388675689697266, "global_step": 320801, "epoch": 3865} {"train_loss": -25.41944694519043, "global_step": 320802, "epoch": 3865} {"train_loss": -25.19729995727539, "global_step": 320803, "epoch": 3865} {"train_loss": -25.693225860595703, "global_step": 320804, "epoch": 3865} {"train_loss": -25.089231491088867, "global_step": 320805, "epoch": 3865} {"train_loss": -25.318021774291992, "global_step": 320806, "epoch": 3865} {"train_loss": -25.53491973876953, "global_step": 320807, "epoch": 3865} {"train_loss": -25.328277587890625, "global_step": 320808, "epoch": 3865} {"train_loss": -25.33928680419922, "global_step": 320809, "epoch": 3865} {"train_loss": -25.662994384765625, "global_step": 320810, "epoch": 3865} {"train_loss": -25.5231990814209, "global_step": 320811, "epoch": 3865} {"train_loss": -25.069379806518555, "global_step": 320812, "epoch": 3865} {"train_loss": -25.659894943237305, "global_step": 320813, "epoch": 3865} {"train_loss": -25.937763214111328, "global_step": 320814, "epoch": 3865} {"train_loss": -25.480682373046875, "global_step": 320815, "epoch": 3865} {"train_loss": -25.731342315673828, "global_step": 320816, "epoch": 3865} {"train_loss": -25.643463134765625, "global_step": 320817, "epoch": 3865} {"train_loss": -25.733264923095703, "global_step": 320818, "epoch": 3865} {"train_loss": -25.856830596923828, "global_step": 320819, "epoch": 3865} {"train_loss": -25.477262496948242, "global_step": 320820, "epoch": 3865} {"train_loss": -26.016681671142578, "global_step": 320821, "epoch": 3865} {"train_loss": -25.867786407470703, "global_step": 320822, "epoch": 3865} {"train_loss": -25.814252853393555, "global_step": 320823, "epoch": 3865} {"train_loss": -25.953144073486328, "global_step": 320824, "epoch": 3865} {"train_loss": -25.659290313720703, "global_step": 320825, "epoch": 3865} {"train_loss": -25.71051597595215, "global_step": 320826, "epoch": 3865} {"train_loss": -26.056568145751953, "global_step": 320827, "epoch": 3865} {"train_loss": -25.875761032104492, "global_step": 320828, "epoch": 3865} {"train_loss": -25.757410049438477, "global_step": 320829, "epoch": 3865} {"train_loss": -25.869281768798828, "global_step": 320830, "epoch": 3865} {"train_loss": -25.917896270751953, "global_step": 320831, "epoch": 3865} {"train_loss": -25.95698356628418, "global_step": 320832, "epoch": 3865} {"train_loss": -25.717456817626953, "global_step": 320833, "epoch": 3865} {"train_loss": -25.832111358642578, "global_step": 320834, "epoch": 3865} {"train_loss": -25.809255599975586, "global_step": 320835, "epoch": 3865} {"train_loss": -25.4562931060791, "global_step": 320836, "epoch": 3865} {"train_loss": -25.451873779296875, "global_step": 320837, "epoch": 3865} {"train_loss": -25.980005264282227, "global_step": 320838, "epoch": 3865} {"train_loss": -26.1328125, "global_step": 320839, "epoch": 3865} {"train_loss": -26.243932723999023, "global_step": 320840, "epoch": 3865} {"train_loss": -26.054956436157227, "global_step": 320841, "epoch": 3865} {"train_loss": -25.915491104125977, "global_step": 320842, "epoch": 3865} {"train_loss": -25.517629623413086, "global_step": 320843, "epoch": 3865} {"train_loss": -26.009052276611328, "global_step": 320844, "epoch": 3865} {"train_loss": -25.89076042175293, "global_step": 320845, "epoch": 3865} {"train_loss": -25.628549575805664, "global_step": 320846, "epoch": 3865} {"train_loss": -25.839929580688477, "global_step": 320847, "epoch": 3865} {"train_loss": -26.219175338745117, "global_step": 320848, "epoch": 3865} {"train_loss": -26.1207332611084, "global_step": 320849, "epoch": 3865} {"train_loss": -26.54290199279785, "global_step": 320850, "epoch": 3865} {"train_loss": -25.50129508972168, "global_step": 320851, "epoch": 3865} {"train_loss": -25.82752799987793, "global_step": 320852, "epoch": 3865} {"train_loss": -26.268613815307617, "global_step": 320853, "epoch": 3865} {"train_loss": -25.8505859375, "global_step": 320854, "epoch": 3865} {"train_loss": -25.656835556030273, "global_step": 320855, "epoch": 3865} {"train_loss": -26.120941162109375, "global_step": 320856, "epoch": 3865} {"train_loss": -26.166975021362305, "global_step": 320857, "epoch": 3865} {"train_loss": -26.05059814453125, "global_step": 320858, "epoch": 3865} {"train_loss": -26.0141658782959, "global_step": 320859, "epoch": 3865} {"train_loss": -26.050092697143555, "global_step": 320860, "epoch": 3865} {"train_loss": -26.185718536376953, "global_step": 320861, "epoch": 3865} {"train_loss": -26.098682403564453, "global_step": 320862, "epoch": 3865} {"train_loss": -26.18929100036621, "global_step": 320863, "epoch": 3865} {"train_loss": -25.9884090423584, "global_step": 320864, "epoch": 3865} {"train_loss": -26.473535537719727, "global_step": 320865, "epoch": 3865} {"train_loss": -26.131916046142578, "global_step": 320866, "epoch": 3865} {"train_loss": -26.172056198120117, "global_step": 320867, "epoch": 3865} {"train_loss": -25.692129135131836, "global_step": 320868, "epoch": 3865} {"train_loss": -25.484291076660156, "global_step": 320869, "epoch": 3865} {"train_loss": -25.441686630249023, "global_step": 320870, "epoch": 3865} {"train_loss": -25.487192153930664, "global_step": 320871, "epoch": 3865} {"train_loss": -25.8773193359375, "global_step": 320872, "epoch": 3865} {"train_loss": -25.884841918945312, "global_step": 320873, "epoch": 3865} {"train_loss": -25.90236473083496, "global_step": 320874, "epoch": 3865} {"train_loss": -26.434951782226562, "global_step": 320875, "epoch": 3865} {"train_loss": -25.94111442565918, "global_step": 320876, "epoch": 3865} {"train_loss": -25.74850231768137, "global_step": 320877, "epoch": 3865, "val_loss": 7118961.0} {"train_loss": -25.721820831298828, "global_step": 320878, "epoch": 3866} {"train_loss": -23.749509811401367, "global_step": 320879, "epoch": 3866} {"train_loss": -23.91766357421875, "global_step": 320880, "epoch": 3866} {"train_loss": -25.250669479370117, "global_step": 320881, "epoch": 3866} {"train_loss": -24.62669563293457, "global_step": 320882, "epoch": 3866} {"train_loss": -25.28757095336914, "global_step": 320883, "epoch": 3866} {"train_loss": -24.947113037109375, "global_step": 320884, "epoch": 3866} {"train_loss": -25.280759811401367, "global_step": 320885, "epoch": 3866} {"train_loss": -25.004941940307617, "global_step": 320886, "epoch": 3866} {"train_loss": -25.150821685791016, "global_step": 320887, "epoch": 3866} {"train_loss": -25.524290084838867, "global_step": 320888, "epoch": 3866} {"train_loss": -25.00828742980957, "global_step": 320889, "epoch": 3866} {"train_loss": -24.90235710144043, "global_step": 320890, "epoch": 3866} {"train_loss": -25.398221969604492, "global_step": 320891, "epoch": 3866} {"train_loss": -25.493934631347656, "global_step": 320892, "epoch": 3866} {"train_loss": -25.05779457092285, "global_step": 320893, "epoch": 3866} {"train_loss": -25.3878231048584, "global_step": 320894, "epoch": 3866} {"train_loss": -25.40158462524414, "global_step": 320895, "epoch": 3866} {"train_loss": -25.342248916625977, "global_step": 320896, "epoch": 3866} {"train_loss": -25.44855308532715, "global_step": 320897, "epoch": 3866} {"train_loss": -25.50263023376465, "global_step": 320898, "epoch": 3866} {"train_loss": -25.65096092224121, "global_step": 320899, "epoch": 3866} {"train_loss": -25.626882553100586, "global_step": 320900, "epoch": 3866} {"train_loss": -25.559682846069336, "global_step": 320901, "epoch": 3866} {"train_loss": -25.141950607299805, "global_step": 320902, "epoch": 3866} {"train_loss": -25.880279541015625, "global_step": 320903, "epoch": 3866} {"train_loss": -25.65654945373535, "global_step": 320904, "epoch": 3866} {"train_loss": -25.6866512298584, "global_step": 320905, "epoch": 3866} {"train_loss": -26.20001220703125, "global_step": 320906, "epoch": 3866} {"train_loss": -25.817285537719727, "global_step": 320907, "epoch": 3866} {"train_loss": -25.583911895751953, "global_step": 320908, "epoch": 3866} {"train_loss": -25.7786808013916, "global_step": 320909, "epoch": 3866} {"train_loss": -25.788461685180664, "global_step": 320910, "epoch": 3866} {"train_loss": -26.00809097290039, "global_step": 320911, "epoch": 3866} {"train_loss": -25.377193450927734, "global_step": 320912, "epoch": 3866} {"train_loss": -25.878095626831055, "global_step": 320913, "epoch": 3866} {"train_loss": -26.126434326171875, "global_step": 320914, "epoch": 3866} {"train_loss": -25.79147720336914, "global_step": 320915, "epoch": 3866} {"train_loss": -25.659198760986328, "global_step": 320916, "epoch": 3866} {"train_loss": -26.145431518554688, "global_step": 320917, "epoch": 3866} {"train_loss": -26.157373428344727, "global_step": 320918, "epoch": 3866} {"train_loss": -25.600296020507812, "global_step": 320919, "epoch": 3866} {"train_loss": -25.75762939453125, "global_step": 320920, "epoch": 3866} {"train_loss": -25.74110221862793, "global_step": 320921, "epoch": 3866} {"train_loss": -25.97100257873535, "global_step": 320922, "epoch": 3866} {"train_loss": -25.72119140625, "global_step": 320923, "epoch": 3866} {"train_loss": -26.088781356811523, "global_step": 320924, "epoch": 3866} {"train_loss": -25.592092514038086, "global_step": 320925, "epoch": 3866} {"train_loss": -25.863067626953125, "global_step": 320926, "epoch": 3866} {"train_loss": -26.137842178344727, "global_step": 320927, "epoch": 3866} {"train_loss": -26.02100944519043, "global_step": 320928, "epoch": 3866} {"train_loss": -25.84467124938965, "global_step": 320929, "epoch": 3866} {"train_loss": -26.0033016204834, "global_step": 320930, "epoch": 3866} {"train_loss": -26.020431518554688, "global_step": 320931, "epoch": 3866} {"train_loss": -26.13410758972168, "global_step": 320932, "epoch": 3866} {"train_loss": -26.047327041625977, "global_step": 320933, "epoch": 3866} {"train_loss": -26.060998916625977, "global_step": 320934, "epoch": 3866} {"train_loss": -25.795740127563477, "global_step": 320935, "epoch": 3866} {"train_loss": -26.014270782470703, "global_step": 320936, "epoch": 3866} {"train_loss": -25.854352951049805, "global_step": 320937, "epoch": 3866} {"train_loss": -25.9892635345459, "global_step": 320938, "epoch": 3866} {"train_loss": -25.92473793029785, "global_step": 320939, "epoch": 3866} {"train_loss": -25.834836959838867, "global_step": 320940, "epoch": 3866} {"train_loss": -26.15155601501465, "global_step": 320941, "epoch": 3866} {"train_loss": -26.12748146057129, "global_step": 320942, "epoch": 3866} {"train_loss": -25.84375, "global_step": 320943, "epoch": 3866} {"train_loss": -25.9062442779541, "global_step": 320944, "epoch": 3866} {"train_loss": -26.273298263549805, "global_step": 320945, "epoch": 3866} {"train_loss": -25.700830459594727, "global_step": 320946, "epoch": 3866} {"train_loss": -25.731842041015625, "global_step": 320947, "epoch": 3866} {"train_loss": -25.617694854736328, "global_step": 320948, "epoch": 3866} {"train_loss": -26.27070426940918, "global_step": 320949, "epoch": 3866} {"train_loss": -25.604734420776367, "global_step": 320950, "epoch": 3866} {"train_loss": -26.107534408569336, "global_step": 320951, "epoch": 3866} {"train_loss": -25.991992950439453, "global_step": 320952, "epoch": 3866} {"train_loss": -25.886625289916992, "global_step": 320953, "epoch": 3866} {"train_loss": -25.982315063476562, "global_step": 320954, "epoch": 3866} {"train_loss": -25.87116050720215, "global_step": 320955, "epoch": 3866} {"train_loss": -26.013940811157227, "global_step": 320956, "epoch": 3866} {"train_loss": -26.037189483642578, "global_step": 320957, "epoch": 3866} {"train_loss": -25.762609481811523, "global_step": 320958, "epoch": 3866} {"train_loss": -25.88995361328125, "global_step": 320959, "epoch": 3866} {"train_loss": -25.68234147221209, "global_step": 320960, "epoch": 3866, "val_loss": 7235641.0} {"train_loss": -26.07364845275879, "global_step": 320961, "epoch": 3867} {"train_loss": -25.616498947143555, "global_step": 320962, "epoch": 3867} {"train_loss": -25.70599937438965, "global_step": 320963, "epoch": 3867} {"train_loss": -25.697656631469727, "global_step": 320964, "epoch": 3867} {"train_loss": -25.451162338256836, "global_step": 320965, "epoch": 3867} {"train_loss": -25.658166885375977, "global_step": 320966, "epoch": 3867} {"train_loss": -25.747425079345703, "global_step": 320967, "epoch": 3867} {"train_loss": -25.59440040588379, "global_step": 320968, "epoch": 3867} {"train_loss": -25.497724533081055, "global_step": 320969, "epoch": 3867} {"train_loss": -25.663604736328125, "global_step": 320970, "epoch": 3867} {"train_loss": -25.639957427978516, "global_step": 320971, "epoch": 3867} {"train_loss": -25.678165435791016, "global_step": 320972, "epoch": 3867} {"train_loss": -25.474998474121094, "global_step": 320973, "epoch": 3867} {"train_loss": -25.42343521118164, "global_step": 320974, "epoch": 3867} {"train_loss": -25.44020652770996, "global_step": 320975, "epoch": 3867} {"train_loss": -25.38795280456543, "global_step": 320976, "epoch": 3867} {"train_loss": -25.32448387145996, "global_step": 320977, "epoch": 3867} {"train_loss": -25.471267700195312, "global_step": 320978, "epoch": 3867} {"train_loss": -25.560312271118164, "global_step": 320979, "epoch": 3867} {"train_loss": -25.582822799682617, "global_step": 320980, "epoch": 3867} {"train_loss": -25.316526412963867, "global_step": 320981, "epoch": 3867} {"train_loss": -25.6826114654541, "global_step": 320982, "epoch": 3867} {"train_loss": -25.857873916625977, "global_step": 320983, "epoch": 3867} {"train_loss": -25.438215255737305, "global_step": 320984, "epoch": 3867} {"train_loss": -25.528860092163086, "global_step": 320985, "epoch": 3867} {"train_loss": -25.845703125, "global_step": 320986, "epoch": 3867} {"train_loss": -25.75432777404785, "global_step": 320987, "epoch": 3867} {"train_loss": -25.737287521362305, "global_step": 320988, "epoch": 3867} {"train_loss": -25.88361930847168, "global_step": 320989, "epoch": 3867} {"train_loss": -25.688138961791992, "global_step": 320990, "epoch": 3867} {"train_loss": -25.544889450073242, "global_step": 320991, "epoch": 3867} {"train_loss": -25.586149215698242, "global_step": 320992, "epoch": 3867} {"train_loss": -25.900110244750977, "global_step": 320993, "epoch": 3867} {"train_loss": -25.702014923095703, "global_step": 320994, "epoch": 3867} {"train_loss": -25.618640899658203, "global_step": 320995, "epoch": 3867} {"train_loss": -25.999683380126953, "global_step": 320996, "epoch": 3867} {"train_loss": -25.62353515625, "global_step": 320997, "epoch": 3867} {"train_loss": -25.934301376342773, "global_step": 320998, "epoch": 3867} {"train_loss": -26.152729034423828, "global_step": 320999, "epoch": 3867} {"train_loss": -25.64495849609375, "global_step": 321000, "epoch": 3867} {"train_loss": -25.8623046875, "global_step": 321001, "epoch": 3867} {"train_loss": -26.025049209594727, "global_step": 321002, "epoch": 3867} {"train_loss": -26.087736129760742, "global_step": 321003, "epoch": 3867} {"train_loss": -25.781003952026367, "global_step": 321004, "epoch": 3867} {"train_loss": -25.932783126831055, "global_step": 321005, "epoch": 3867} {"train_loss": -26.274267196655273, "global_step": 321006, "epoch": 3867} {"train_loss": -26.269180297851562, "global_step": 321007, "epoch": 3867} {"train_loss": -25.958967208862305, "global_step": 321008, "epoch": 3867} {"train_loss": -25.865188598632812, "global_step": 321009, "epoch": 3867} {"train_loss": -25.849451065063477, "global_step": 321010, "epoch": 3867} {"train_loss": -26.05692481994629, "global_step": 321011, "epoch": 3867} {"train_loss": -26.217382431030273, "global_step": 321012, "epoch": 3867} {"train_loss": -26.269556045532227, "global_step": 321013, "epoch": 3867} {"train_loss": -26.01126480102539, "global_step": 321014, "epoch": 3867} {"train_loss": -26.3470401763916, "global_step": 321015, "epoch": 3867} {"train_loss": -25.809171676635742, "global_step": 321016, "epoch": 3867} {"train_loss": -25.843793869018555, "global_step": 321017, "epoch": 3867} {"train_loss": -25.938886642456055, "global_step": 321018, "epoch": 3867} {"train_loss": -25.89899253845215, "global_step": 321019, "epoch": 3867} {"train_loss": -26.00909996032715, "global_step": 321020, "epoch": 3867} {"train_loss": -26.25440788269043, "global_step": 321021, "epoch": 3867} {"train_loss": -25.978601455688477, "global_step": 321022, "epoch": 3867} {"train_loss": -25.9593563079834, "global_step": 321023, "epoch": 3867} {"train_loss": -25.812292098999023, "global_step": 321024, "epoch": 3867} {"train_loss": -25.704633712768555, "global_step": 321025, "epoch": 3867} {"train_loss": -25.80519676208496, "global_step": 321026, "epoch": 3867} {"train_loss": -25.962848663330078, "global_step": 321027, "epoch": 3867} {"train_loss": -25.435443878173828, "global_step": 321028, "epoch": 3867} {"train_loss": -25.661884307861328, "global_step": 321029, "epoch": 3867} {"train_loss": -24.878820419311523, "global_step": 321030, "epoch": 3867} {"train_loss": -25.78908348083496, "global_step": 321031, "epoch": 3867} {"train_loss": -25.915470123291016, "global_step": 321032, "epoch": 3867} {"train_loss": -25.791593551635742, "global_step": 321033, "epoch": 3867} {"train_loss": -25.414236068725586, "global_step": 321034, "epoch": 3867} {"train_loss": -25.739898681640625, "global_step": 321035, "epoch": 3867} {"train_loss": -25.6334228515625, "global_step": 321036, "epoch": 3867} {"train_loss": -25.778827667236328, "global_step": 321037, "epoch": 3867} {"train_loss": -25.9398193359375, "global_step": 321038, "epoch": 3867} {"train_loss": -25.599050521850586, "global_step": 321039, "epoch": 3867} {"train_loss": -25.52242660522461, "global_step": 321040, "epoch": 3867} {"train_loss": -25.945165634155273, "global_step": 321041, "epoch": 3867} {"train_loss": -26.01910400390625, "global_step": 321042, "epoch": 3867} {"train_loss": -25.771112005394624, "global_step": 321043, "epoch": 3867, "val_loss": 7336735.0} {"train_loss": -25.575716018676758, "global_step": 321044, "epoch": 3868} {"train_loss": -25.73150634765625, "global_step": 321045, "epoch": 3868} {"train_loss": -25.433324813842773, "global_step": 321046, "epoch": 3868} {"train_loss": -25.263038635253906, "global_step": 321047, "epoch": 3868} {"train_loss": -25.71808433532715, "global_step": 321048, "epoch": 3868} {"train_loss": -25.31730842590332, "global_step": 321049, "epoch": 3868} {"train_loss": -25.79458999633789, "global_step": 321050, "epoch": 3868} {"train_loss": -25.17584800720215, "global_step": 321051, "epoch": 3868} {"train_loss": -26.03128433227539, "global_step": 321052, "epoch": 3868} {"train_loss": -25.569171905517578, "global_step": 321053, "epoch": 3868} {"train_loss": -25.68462562561035, "global_step": 321054, "epoch": 3868} {"train_loss": -25.564008712768555, "global_step": 321055, "epoch": 3868} {"train_loss": -25.886648178100586, "global_step": 321056, "epoch": 3868} {"train_loss": -25.797138214111328, "global_step": 321057, "epoch": 3868} {"train_loss": -25.530866622924805, "global_step": 321058, "epoch": 3868} {"train_loss": -25.615354537963867, "global_step": 321059, "epoch": 3868} {"train_loss": -25.49201202392578, "global_step": 321060, "epoch": 3868} {"train_loss": -25.86771011352539, "global_step": 321061, "epoch": 3868} {"train_loss": -25.66128921508789, "global_step": 321062, "epoch": 3868} {"train_loss": -25.87238121032715, "global_step": 321063, "epoch": 3868} {"train_loss": -25.76820182800293, "global_step": 321064, "epoch": 3868} {"train_loss": -26.012292861938477, "global_step": 321065, "epoch": 3868} {"train_loss": -25.727161407470703, "global_step": 321066, "epoch": 3868} {"train_loss": -25.107454299926758, "global_step": 321067, "epoch": 3868} {"train_loss": -25.411968231201172, "global_step": 321068, "epoch": 3868} {"train_loss": -25.550222396850586, "global_step": 321069, "epoch": 3868} {"train_loss": -25.89237403869629, "global_step": 321070, "epoch": 3868} {"train_loss": -25.371315002441406, "global_step": 321071, "epoch": 3868} {"train_loss": -25.25501823425293, "global_step": 321072, "epoch": 3868} {"train_loss": -25.565326690673828, "global_step": 321073, "epoch": 3868} {"train_loss": -25.62860679626465, "global_step": 321074, "epoch": 3868} {"train_loss": -25.777774810791016, "global_step": 321075, "epoch": 3868} {"train_loss": -26.00177574157715, "global_step": 321076, "epoch": 3868} {"train_loss": -26.241857528686523, "global_step": 321077, "epoch": 3868} {"train_loss": -26.070056915283203, "global_step": 321078, "epoch": 3868} {"train_loss": -26.125776290893555, "global_step": 321079, "epoch": 3868} {"train_loss": -25.733322143554688, "global_step": 321080, "epoch": 3868} {"train_loss": -26.4300479888916, "global_step": 321081, "epoch": 3868} {"train_loss": -25.798017501831055, "global_step": 321082, "epoch": 3868} {"train_loss": -25.9222469329834, "global_step": 321083, "epoch": 3868} {"train_loss": -25.957624435424805, "global_step": 321084, "epoch": 3868} {"train_loss": -26.024494171142578, "global_step": 321085, "epoch": 3868} {"train_loss": -26.10808753967285, "global_step": 321086, "epoch": 3868} {"train_loss": -26.24680519104004, "global_step": 321087, "epoch": 3868} {"train_loss": -25.953454971313477, "global_step": 321088, "epoch": 3868} {"train_loss": -25.393232345581055, "global_step": 321089, "epoch": 3868} {"train_loss": -26.098209381103516, "global_step": 321090, "epoch": 3868} {"train_loss": -26.198270797729492, "global_step": 321091, "epoch": 3868} {"train_loss": -25.775165557861328, "global_step": 321092, "epoch": 3868} {"train_loss": -25.915435791015625, "global_step": 321093, "epoch": 3868} {"train_loss": -26.0172061920166, "global_step": 321094, "epoch": 3868} {"train_loss": -25.956018447875977, "global_step": 321095, "epoch": 3868} {"train_loss": -25.8617000579834, "global_step": 321096, "epoch": 3868} {"train_loss": -25.948827743530273, "global_step": 321097, "epoch": 3868} {"train_loss": -25.982074737548828, "global_step": 321098, "epoch": 3868} {"train_loss": -25.799535751342773, "global_step": 321099, "epoch": 3868} {"train_loss": -25.7314510345459, "global_step": 321100, "epoch": 3868} {"train_loss": -26.04878044128418, "global_step": 321101, "epoch": 3868} {"train_loss": -26.405380249023438, "global_step": 321102, "epoch": 3868} {"train_loss": -26.00982666015625, "global_step": 321103, "epoch": 3868} {"train_loss": -26.01123046875, "global_step": 321104, "epoch": 3868} {"train_loss": -25.890974044799805, "global_step": 321105, "epoch": 3868} {"train_loss": -25.74863624572754, "global_step": 321106, "epoch": 3868} {"train_loss": -25.539825439453125, "global_step": 321107, "epoch": 3868} {"train_loss": -25.169519424438477, "global_step": 321108, "epoch": 3868} {"train_loss": -25.352584838867188, "global_step": 321109, "epoch": 3868} {"train_loss": -25.575708389282227, "global_step": 321110, "epoch": 3868} {"train_loss": -25.63140296936035, "global_step": 321111, "epoch": 3868} {"train_loss": -25.637771606445312, "global_step": 321112, "epoch": 3868} {"train_loss": -25.756912231445312, "global_step": 321113, "epoch": 3868} {"train_loss": -25.806203842163086, "global_step": 321114, "epoch": 3868} {"train_loss": -25.77432632446289, "global_step": 321115, "epoch": 3868} {"train_loss": -26.064929962158203, "global_step": 321116, "epoch": 3868} {"train_loss": -25.910608291625977, "global_step": 321117, "epoch": 3868} {"train_loss": -25.820392608642578, "global_step": 321118, "epoch": 3868} {"train_loss": -25.93868064880371, "global_step": 321119, "epoch": 3868} {"train_loss": -25.929031372070312, "global_step": 321120, "epoch": 3868} {"train_loss": -25.584135055541992, "global_step": 321121, "epoch": 3868} {"train_loss": -25.864850997924805, "global_step": 321122, "epoch": 3868} {"train_loss": -25.75996208190918, "global_step": 321123, "epoch": 3868} {"train_loss": -25.807355880737305, "global_step": 321124, "epoch": 3868} {"train_loss": -25.62091636657715, "global_step": 321125, "epoch": 3868} {"train_loss": -25.76677630321089, "global_step": 321126, "epoch": 3868, "val_loss": 7197145.5} {"train_loss": -25.268545150756836, "global_step": 321127, "epoch": 3869} {"train_loss": -25.7237491607666, "global_step": 321128, "epoch": 3869} {"train_loss": -25.218595504760742, "global_step": 321129, "epoch": 3869} {"train_loss": -25.575254440307617, "global_step": 321130, "epoch": 3869} {"train_loss": -25.521177291870117, "global_step": 321131, "epoch": 3869} {"train_loss": -25.429908752441406, "global_step": 321132, "epoch": 3869} {"train_loss": -25.772008895874023, "global_step": 321133, "epoch": 3869} {"train_loss": -25.44582176208496, "global_step": 321134, "epoch": 3869} {"train_loss": -25.987411499023438, "global_step": 321135, "epoch": 3869} {"train_loss": -25.731409072875977, "global_step": 321136, "epoch": 3869} {"train_loss": -25.722387313842773, "global_step": 321137, "epoch": 3869} {"train_loss": -25.326129913330078, "global_step": 321138, "epoch": 3869} {"train_loss": -25.161649703979492, "global_step": 321139, "epoch": 3869} {"train_loss": -25.73810386657715, "global_step": 321140, "epoch": 3869} {"train_loss": -25.756711959838867, "global_step": 321141, "epoch": 3869} {"train_loss": -25.373668670654297, "global_step": 321142, "epoch": 3869} {"train_loss": -25.802936553955078, "global_step": 321143, "epoch": 3869} {"train_loss": -25.92792320251465, "global_step": 321144, "epoch": 3869} {"train_loss": -26.248334884643555, "global_step": 321145, "epoch": 3869} {"train_loss": -25.91175651550293, "global_step": 321146, "epoch": 3869} {"train_loss": -25.869155883789062, "global_step": 321147, "epoch": 3869} {"train_loss": -25.641422271728516, "global_step": 321148, "epoch": 3869} {"train_loss": -26.01943016052246, "global_step": 321149, "epoch": 3869} {"train_loss": -25.902379989624023, "global_step": 321150, "epoch": 3869} {"train_loss": -25.823226928710938, "global_step": 321151, "epoch": 3869} {"train_loss": -25.91916847229004, "global_step": 321152, "epoch": 3869} {"train_loss": -26.14703941345215, "global_step": 321153, "epoch": 3869} {"train_loss": -26.100330352783203, "global_step": 321154, "epoch": 3869} {"train_loss": -25.948471069335938, "global_step": 321155, "epoch": 3869} {"train_loss": -25.999298095703125, "global_step": 321156, "epoch": 3869} {"train_loss": -25.71188735961914, "global_step": 321157, "epoch": 3869} {"train_loss": -25.662572860717773, "global_step": 321158, "epoch": 3869} {"train_loss": -25.977741241455078, "global_step": 321159, "epoch": 3869} {"train_loss": -26.2891902923584, "global_step": 321160, "epoch": 3869} {"train_loss": -25.765836715698242, "global_step": 321161, "epoch": 3869} {"train_loss": -26.186445236206055, "global_step": 321162, "epoch": 3869} {"train_loss": -26.18720054626465, "global_step": 321163, "epoch": 3869} {"train_loss": -26.42989158630371, "global_step": 321164, "epoch": 3869} {"train_loss": -26.200626373291016, "global_step": 321165, "epoch": 3869} {"train_loss": -26.029211044311523, "global_step": 321166, "epoch": 3869} {"train_loss": -25.667322158813477, "global_step": 321167, "epoch": 3869} {"train_loss": -25.816198348999023, "global_step": 321168, "epoch": 3869} {"train_loss": -26.023590087890625, "global_step": 321169, "epoch": 3869} {"train_loss": -25.83637809753418, "global_step": 321170, "epoch": 3869} {"train_loss": -25.9000186920166, "global_step": 321171, "epoch": 3869} {"train_loss": -25.919239044189453, "global_step": 321172, "epoch": 3869} {"train_loss": -25.83731460571289, "global_step": 321173, "epoch": 3869} {"train_loss": -26.242719650268555, "global_step": 321174, "epoch": 3869} {"train_loss": -25.94597816467285, "global_step": 321175, "epoch": 3869} {"train_loss": -25.766462326049805, "global_step": 321176, "epoch": 3869} {"train_loss": -25.870710372924805, "global_step": 321177, "epoch": 3869} {"train_loss": -25.710834503173828, "global_step": 321178, "epoch": 3869} {"train_loss": -25.955001831054688, "global_step": 321179, "epoch": 3869} {"train_loss": -25.736555099487305, "global_step": 321180, "epoch": 3869} {"train_loss": -26.22084617614746, "global_step": 321181, "epoch": 3869} {"train_loss": -26.146329879760742, "global_step": 321182, "epoch": 3869} {"train_loss": -25.835926055908203, "global_step": 321183, "epoch": 3869} {"train_loss": -25.723020553588867, "global_step": 321184, "epoch": 3869} {"train_loss": -25.904565811157227, "global_step": 321185, "epoch": 3869} {"train_loss": -26.23963737487793, "global_step": 321186, "epoch": 3869} {"train_loss": -25.79473876953125, "global_step": 321187, "epoch": 3869} {"train_loss": -25.9955997467041, "global_step": 321188, "epoch": 3869} {"train_loss": -25.718215942382812, "global_step": 321189, "epoch": 3869} {"train_loss": -26.098142623901367, "global_step": 321190, "epoch": 3869} {"train_loss": -25.900293350219727, "global_step": 321191, "epoch": 3869} {"train_loss": -26.110116958618164, "global_step": 321192, "epoch": 3869} {"train_loss": -25.240558624267578, "global_step": 321193, "epoch": 3869} {"train_loss": -25.525110244750977, "global_step": 321194, "epoch": 3869} {"train_loss": -25.9184627532959, "global_step": 321195, "epoch": 3869} {"train_loss": -26.0457820892334, "global_step": 321196, "epoch": 3869} {"train_loss": -25.609516143798828, "global_step": 321197, "epoch": 3869} {"train_loss": -25.694074630737305, "global_step": 321198, "epoch": 3869} {"train_loss": -26.02127456665039, "global_step": 321199, "epoch": 3869} {"train_loss": -25.73628044128418, "global_step": 321200, "epoch": 3869} {"train_loss": -25.767446517944336, "global_step": 321201, "epoch": 3869} {"train_loss": -25.977569580078125, "global_step": 321202, "epoch": 3869} {"train_loss": -25.90447425842285, "global_step": 321203, "epoch": 3869} {"train_loss": -25.698654174804688, "global_step": 321204, "epoch": 3869} {"train_loss": -25.619434356689453, "global_step": 321205, "epoch": 3869} {"train_loss": -25.642887115478516, "global_step": 321206, "epoch": 3869} {"train_loss": -25.846826553344727, "global_step": 321207, "epoch": 3869} {"train_loss": -25.723590850830078, "global_step": 321208, "epoch": 3869} {"train_loss": -25.84860397246947, "global_step": 321209, "epoch": 3869, "val_loss": 7085199.0} {"train_loss": -24.982175827026367, "global_step": 321210, "epoch": 3870} {"train_loss": -25.70001792907715, "global_step": 321211, "epoch": 3870} {"train_loss": -25.379043579101562, "global_step": 321212, "epoch": 3870} {"train_loss": -25.27769660949707, "global_step": 321213, "epoch": 3870} {"train_loss": -25.6375675201416, "global_step": 321214, "epoch": 3870} {"train_loss": -25.77143669128418, "global_step": 321215, "epoch": 3870} {"train_loss": -25.085824966430664, "global_step": 321216, "epoch": 3870} {"train_loss": -25.501829147338867, "global_step": 321217, "epoch": 3870} {"train_loss": -25.815505981445312, "global_step": 321218, "epoch": 3870} {"train_loss": -25.541217803955078, "global_step": 321219, "epoch": 3870} {"train_loss": -25.439077377319336, "global_step": 321220, "epoch": 3870} {"train_loss": -25.7027645111084, "global_step": 321221, "epoch": 3870} {"train_loss": -25.626663208007812, "global_step": 321222, "epoch": 3870} {"train_loss": -25.93208122253418, "global_step": 321223, "epoch": 3870} {"train_loss": -25.719345092773438, "global_step": 321224, "epoch": 3870} {"train_loss": -25.804569244384766, "global_step": 321225, "epoch": 3870} {"train_loss": -25.168079376220703, "global_step": 321226, "epoch": 3870} {"train_loss": -25.8201847076416, "global_step": 321227, "epoch": 3870} {"train_loss": -25.6483211517334, "global_step": 321228, "epoch": 3870} {"train_loss": -25.46161460876465, "global_step": 321229, "epoch": 3870} {"train_loss": -25.5482177734375, "global_step": 321230, "epoch": 3870} {"train_loss": -25.769550323486328, "global_step": 321231, "epoch": 3870} {"train_loss": -26.061065673828125, "global_step": 321232, "epoch": 3870} {"train_loss": -25.66718101501465, "global_step": 321233, "epoch": 3870} {"train_loss": -25.60967445373535, "global_step": 321234, "epoch": 3870} {"train_loss": -25.751012802124023, "global_step": 321235, "epoch": 3870} {"train_loss": -25.911130905151367, "global_step": 321236, "epoch": 3870} {"train_loss": -26.05133056640625, "global_step": 321237, "epoch": 3870} {"train_loss": -25.586483001708984, "global_step": 321238, "epoch": 3870} {"train_loss": -25.794824600219727, "global_step": 321239, "epoch": 3870} {"train_loss": -25.91070556640625, "global_step": 321240, "epoch": 3870} {"train_loss": -26.0151309967041, "global_step": 321241, "epoch": 3870} {"train_loss": -26.04056739807129, "global_step": 321242, "epoch": 3870} {"train_loss": -25.61533546447754, "global_step": 321243, "epoch": 3870} {"train_loss": -25.58009910583496, "global_step": 321244, "epoch": 3870} {"train_loss": -26.037124633789062, "global_step": 321245, "epoch": 3870} {"train_loss": -26.10589599609375, "global_step": 321246, "epoch": 3870} {"train_loss": -25.9445858001709, "global_step": 321247, "epoch": 3870} {"train_loss": -26.062549591064453, "global_step": 321248, "epoch": 3870} {"train_loss": -25.506977081298828, "global_step": 321249, "epoch": 3870} {"train_loss": -25.98261833190918, "global_step": 321250, "epoch": 3870} {"train_loss": -25.73777198791504, "global_step": 321251, "epoch": 3870} {"train_loss": -25.73322868347168, "global_step": 321252, "epoch": 3870} {"train_loss": -26.332828521728516, "global_step": 321253, "epoch": 3870} {"train_loss": -25.942182540893555, "global_step": 321254, "epoch": 3870} {"train_loss": -26.000747680664062, "global_step": 321255, "epoch": 3870} {"train_loss": -26.108442306518555, "global_step": 321256, "epoch": 3870} {"train_loss": -25.964929580688477, "global_step": 321257, "epoch": 3870} {"train_loss": -26.152639389038086, "global_step": 321258, "epoch": 3870} {"train_loss": -26.02560806274414, "global_step": 321259, "epoch": 3870} {"train_loss": -26.22566032409668, "global_step": 321260, "epoch": 3870} {"train_loss": -26.222265243530273, "global_step": 321261, "epoch": 3870} {"train_loss": -25.943281173706055, "global_step": 321262, "epoch": 3870} {"train_loss": -26.08228874206543, "global_step": 321263, "epoch": 3870} {"train_loss": -25.7669620513916, "global_step": 321264, "epoch": 3870} {"train_loss": -25.788253784179688, "global_step": 321265, "epoch": 3870} {"train_loss": -25.800922393798828, "global_step": 321266, "epoch": 3870} {"train_loss": -26.249113082885742, "global_step": 321267, "epoch": 3870} {"train_loss": -25.9846134185791, "global_step": 321268, "epoch": 3870} {"train_loss": -26.228443145751953, "global_step": 321269, "epoch": 3870} {"train_loss": -26.196775436401367, "global_step": 321270, "epoch": 3870} {"train_loss": -25.878034591674805, "global_step": 321271, "epoch": 3870} {"train_loss": -25.5366268157959, "global_step": 321272, "epoch": 3870} {"train_loss": -26.0412540435791, "global_step": 321273, "epoch": 3870} {"train_loss": -25.853229522705078, "global_step": 321274, "epoch": 3870} {"train_loss": -26.20380210876465, "global_step": 321275, "epoch": 3870} {"train_loss": -26.137048721313477, "global_step": 321276, "epoch": 3870} {"train_loss": -25.34812355041504, "global_step": 321277, "epoch": 3870} {"train_loss": -24.809741973876953, "global_step": 321278, "epoch": 3870} {"train_loss": -25.767179489135742, "global_step": 321279, "epoch": 3870} {"train_loss": -25.49787712097168, "global_step": 321280, "epoch": 3870} {"train_loss": -25.7854061126709, "global_step": 321281, "epoch": 3870} {"train_loss": -25.466577529907227, "global_step": 321282, "epoch": 3870} {"train_loss": -25.440732955932617, "global_step": 321283, "epoch": 3870} {"train_loss": -25.850982666015625, "global_step": 321284, "epoch": 3870} {"train_loss": -26.030553817749023, "global_step": 321285, "epoch": 3870} {"train_loss": -25.75209617614746, "global_step": 321286, "epoch": 3870} {"train_loss": -25.959081649780273, "global_step": 321287, "epoch": 3870} {"train_loss": -25.86622428894043, "global_step": 321288, "epoch": 3870} {"train_loss": -25.887487411499023, "global_step": 321289, "epoch": 3870} {"train_loss": -25.7214412689209, "global_step": 321290, "epoch": 3870} {"train_loss": -25.815357208251953, "global_step": 321291, "epoch": 3870} {"train_loss": -25.773467879697503, "global_step": 321292, "epoch": 3870, "val_loss": 7267880.0} {"train_loss": -24.898107528686523, "global_step": 321293, "epoch": 3871} {"train_loss": -24.60548210144043, "global_step": 321294, "epoch": 3871} {"train_loss": -24.988187789916992, "global_step": 321295, "epoch": 3871} {"train_loss": -24.904199600219727, "global_step": 321296, "epoch": 3871} {"train_loss": -24.088308334350586, "global_step": 321297, "epoch": 3871} {"train_loss": -24.70975685119629, "global_step": 321298, "epoch": 3871} {"train_loss": -25.263151168823242, "global_step": 321299, "epoch": 3871} {"train_loss": -25.024534225463867, "global_step": 321300, "epoch": 3871} {"train_loss": -24.76230239868164, "global_step": 321301, "epoch": 3871} {"train_loss": -25.394067764282227, "global_step": 321302, "epoch": 3871} {"train_loss": -24.850187301635742, "global_step": 321303, "epoch": 3871} {"train_loss": -25.41287612915039, "global_step": 321304, "epoch": 3871} {"train_loss": -25.12662124633789, "global_step": 321305, "epoch": 3871} {"train_loss": -25.318601608276367, "global_step": 321306, "epoch": 3871} {"train_loss": -25.18828010559082, "global_step": 321307, "epoch": 3871} {"train_loss": -25.197450637817383, "global_step": 321308, "epoch": 3871} {"train_loss": -25.67058753967285, "global_step": 321309, "epoch": 3871} {"train_loss": -25.54863166809082, "global_step": 321310, "epoch": 3871} {"train_loss": -25.53577995300293, "global_step": 321311, "epoch": 3871} {"train_loss": -25.770557403564453, "global_step": 321312, "epoch": 3871} {"train_loss": -25.54194450378418, "global_step": 321313, "epoch": 3871} {"train_loss": -25.406614303588867, "global_step": 321314, "epoch": 3871} {"train_loss": -25.7247314453125, "global_step": 321315, "epoch": 3871} {"train_loss": -25.924482345581055, "global_step": 321316, "epoch": 3871} {"train_loss": -26.043426513671875, "global_step": 321317, "epoch": 3871} {"train_loss": -25.97321891784668, "global_step": 321318, "epoch": 3871} {"train_loss": -25.54733657836914, "global_step": 321319, "epoch": 3871} {"train_loss": -25.98585319519043, "global_step": 321320, "epoch": 3871} {"train_loss": -25.881763458251953, "global_step": 321321, "epoch": 3871} {"train_loss": -26.004703521728516, "global_step": 321322, "epoch": 3871} {"train_loss": -25.758625030517578, "global_step": 321323, "epoch": 3871} {"train_loss": -25.83717155456543, "global_step": 321324, "epoch": 3871} {"train_loss": -25.866230010986328, "global_step": 321325, "epoch": 3871} {"train_loss": -25.646875381469727, "global_step": 321326, "epoch": 3871} {"train_loss": -25.53012466430664, "global_step": 321327, "epoch": 3871} {"train_loss": -26.005712509155273, "global_step": 321328, "epoch": 3871} {"train_loss": -25.564102172851562, "global_step": 321329, "epoch": 3871} {"train_loss": -26.30573081970215, "global_step": 321330, "epoch": 3871} {"train_loss": -25.55124855041504, "global_step": 321331, "epoch": 3871} {"train_loss": -25.911081314086914, "global_step": 321332, "epoch": 3871} {"train_loss": -25.97415542602539, "global_step": 321333, "epoch": 3871} {"train_loss": -25.766386032104492, "global_step": 321334, "epoch": 3871} {"train_loss": -26.103490829467773, "global_step": 321335, "epoch": 3871} {"train_loss": -25.970563888549805, "global_step": 321336, "epoch": 3871} {"train_loss": -25.826581954956055, "global_step": 321337, "epoch": 3871} {"train_loss": -25.925399780273438, "global_step": 321338, "epoch": 3871} {"train_loss": -25.883228302001953, "global_step": 321339, "epoch": 3871} {"train_loss": -26.24342155456543, "global_step": 321340, "epoch": 3871} {"train_loss": -25.666522979736328, "global_step": 321341, "epoch": 3871} {"train_loss": -26.07169532775879, "global_step": 321342, "epoch": 3871} {"train_loss": -26.03682518005371, "global_step": 321343, "epoch": 3871} {"train_loss": -25.849905014038086, "global_step": 321344, "epoch": 3871} {"train_loss": -25.97528076171875, "global_step": 321345, "epoch": 3871} {"train_loss": -25.60981559753418, "global_step": 321346, "epoch": 3871} {"train_loss": -25.889829635620117, "global_step": 321347, "epoch": 3871} {"train_loss": -25.748395919799805, "global_step": 321348, "epoch": 3871} {"train_loss": -26.19703483581543, "global_step": 321349, "epoch": 3871} {"train_loss": -26.155963897705078, "global_step": 321350, "epoch": 3871} {"train_loss": -26.2589054107666, "global_step": 321351, "epoch": 3871} {"train_loss": -25.952600479125977, "global_step": 321352, "epoch": 3871} {"train_loss": -26.215774536132812, "global_step": 321353, "epoch": 3871} {"train_loss": -26.04742431640625, "global_step": 321354, "epoch": 3871} {"train_loss": -25.88165283203125, "global_step": 321355, "epoch": 3871} {"train_loss": -26.009241104125977, "global_step": 321356, "epoch": 3871} {"train_loss": -26.21089744567871, "global_step": 321357, "epoch": 3871} {"train_loss": -25.9489688873291, "global_step": 321358, "epoch": 3871} {"train_loss": -26.031280517578125, "global_step": 321359, "epoch": 3871} {"train_loss": -26.318134307861328, "global_step": 321360, "epoch": 3871} {"train_loss": -26.32614517211914, "global_step": 321361, "epoch": 3871} {"train_loss": -26.09038734436035, "global_step": 321362, "epoch": 3871} {"train_loss": -25.980854034423828, "global_step": 321363, "epoch": 3871} {"train_loss": -25.9985294342041, "global_step": 321364, "epoch": 3871} {"train_loss": -26.023529052734375, "global_step": 321365, "epoch": 3871} {"train_loss": -25.433828353881836, "global_step": 321366, "epoch": 3871} {"train_loss": -25.789926528930664, "global_step": 321367, "epoch": 3871} {"train_loss": -25.577823638916016, "global_step": 321368, "epoch": 3871} {"train_loss": -25.590417861938477, "global_step": 321369, "epoch": 3871} {"train_loss": -26.28375816345215, "global_step": 321370, "epoch": 3871} {"train_loss": -25.761850357055664, "global_step": 321371, "epoch": 3871} {"train_loss": -25.860193252563477, "global_step": 321372, "epoch": 3871} {"train_loss": -25.7717342376709, "global_step": 321373, "epoch": 3871} {"train_loss": -26.091867446899414, "global_step": 321374, "epoch": 3871} {"train_loss": -25.717776907495704, "global_step": 321375, "epoch": 3871, "val_loss": 7391926.5} {"train_loss": -25.50777816772461, "global_step": 321376, "epoch": 3872} {"train_loss": -25.3908634185791, "global_step": 321377, "epoch": 3872} {"train_loss": -25.419281005859375, "global_step": 321378, "epoch": 3872} {"train_loss": -25.507402420043945, "global_step": 321379, "epoch": 3872} {"train_loss": -25.53163719177246, "global_step": 321380, "epoch": 3872} {"train_loss": -25.483978271484375, "global_step": 321381, "epoch": 3872} {"train_loss": -25.786474227905273, "global_step": 321382, "epoch": 3872} {"train_loss": -25.556354522705078, "global_step": 321383, "epoch": 3872} {"train_loss": -25.6474609375, "global_step": 321384, "epoch": 3872} {"train_loss": -25.46195411682129, "global_step": 321385, "epoch": 3872} {"train_loss": -25.843891143798828, "global_step": 321386, "epoch": 3872} {"train_loss": -25.33843994140625, "global_step": 321387, "epoch": 3872} {"train_loss": -25.806013107299805, "global_step": 321388, "epoch": 3872} {"train_loss": -25.91412353515625, "global_step": 321389, "epoch": 3872} {"train_loss": -25.8128662109375, "global_step": 321390, "epoch": 3872} {"train_loss": -25.512060165405273, "global_step": 321391, "epoch": 3872} {"train_loss": -25.776662826538086, "global_step": 321392, "epoch": 3872} {"train_loss": -25.7604923248291, "global_step": 321393, "epoch": 3872} {"train_loss": -26.049848556518555, "global_step": 321394, "epoch": 3872} {"train_loss": -25.56683349609375, "global_step": 321395, "epoch": 3872} {"train_loss": -26.255529403686523, "global_step": 321396, "epoch": 3872} {"train_loss": -25.8360652923584, "global_step": 321397, "epoch": 3872} {"train_loss": -25.81463050842285, "global_step": 321398, "epoch": 3872} {"train_loss": -26.03742027282715, "global_step": 321399, "epoch": 3872} {"train_loss": -26.113412857055664, "global_step": 321400, "epoch": 3872} {"train_loss": -25.856739044189453, "global_step": 321401, "epoch": 3872} {"train_loss": -25.450191497802734, "global_step": 321402, "epoch": 3872} {"train_loss": -26.10028648376465, "global_step": 321403, "epoch": 3872} {"train_loss": -25.930103302001953, "global_step": 321404, "epoch": 3872} {"train_loss": -25.767560958862305, "global_step": 321405, "epoch": 3872} {"train_loss": -26.0949649810791, "global_step": 321406, "epoch": 3872} {"train_loss": -26.03889274597168, "global_step": 321407, "epoch": 3872} {"train_loss": -25.9084415435791, "global_step": 321408, "epoch": 3872} {"train_loss": -25.854639053344727, "global_step": 321409, "epoch": 3872} {"train_loss": -26.11591148376465, "global_step": 321410, "epoch": 3872} {"train_loss": -26.454090118408203, "global_step": 321411, "epoch": 3872} {"train_loss": -25.933515548706055, "global_step": 321412, "epoch": 3872} {"train_loss": -26.146787643432617, "global_step": 321413, "epoch": 3872} {"train_loss": -26.316802978515625, "global_step": 321414, "epoch": 3872} {"train_loss": -25.64507484436035, "global_step": 321415, "epoch": 3872} {"train_loss": -26.473007202148438, "global_step": 321416, "epoch": 3872} {"train_loss": -25.91444206237793, "global_step": 321417, "epoch": 3872} {"train_loss": -25.956998825073242, "global_step": 321418, "epoch": 3872} {"train_loss": -25.576242446899414, "global_step": 321419, "epoch": 3872} {"train_loss": -25.786945343017578, "global_step": 321420, "epoch": 3872} {"train_loss": -25.604440689086914, "global_step": 321421, "epoch": 3872} {"train_loss": -25.799213409423828, "global_step": 321422, "epoch": 3872} {"train_loss": -25.932865142822266, "global_step": 321423, "epoch": 3872} {"train_loss": -25.94949722290039, "global_step": 321424, "epoch": 3872} {"train_loss": -26.595138549804688, "global_step": 321425, "epoch": 3872} {"train_loss": -25.552915573120117, "global_step": 321426, "epoch": 3872} {"train_loss": -25.703821182250977, "global_step": 321427, "epoch": 3872} {"train_loss": -25.716562271118164, "global_step": 321428, "epoch": 3872} {"train_loss": -25.578153610229492, "global_step": 321429, "epoch": 3872} {"train_loss": -25.32526206970215, "global_step": 321430, "epoch": 3872} {"train_loss": -26.00933265686035, "global_step": 321431, "epoch": 3872} {"train_loss": -26.23638343811035, "global_step": 321432, "epoch": 3872} {"train_loss": -25.780363082885742, "global_step": 321433, "epoch": 3872} {"train_loss": -25.81484031677246, "global_step": 321434, "epoch": 3872} {"train_loss": -25.809921264648438, "global_step": 321435, "epoch": 3872} {"train_loss": -25.96681785583496, "global_step": 321436, "epoch": 3872} {"train_loss": -26.08880043029785, "global_step": 321437, "epoch": 3872} {"train_loss": -26.02894401550293, "global_step": 321438, "epoch": 3872} {"train_loss": -25.905057907104492, "global_step": 321439, "epoch": 3872} {"train_loss": -25.806798934936523, "global_step": 321440, "epoch": 3872} {"train_loss": -25.814193725585938, "global_step": 321441, "epoch": 3872} {"train_loss": -25.58025550842285, "global_step": 321442, "epoch": 3872} {"train_loss": -25.767353057861328, "global_step": 321443, "epoch": 3872} {"train_loss": -25.92803382873535, "global_step": 321444, "epoch": 3872} {"train_loss": -25.84750747680664, "global_step": 321445, "epoch": 3872} {"train_loss": -25.780384063720703, "global_step": 321446, "epoch": 3872} {"train_loss": -25.60890007019043, "global_step": 321447, "epoch": 3872} {"train_loss": -25.7353515625, "global_step": 321448, "epoch": 3872} {"train_loss": -25.77131462097168, "global_step": 321449, "epoch": 3872} {"train_loss": -26.05428123474121, "global_step": 321450, "epoch": 3872} {"train_loss": -25.805490493774414, "global_step": 321451, "epoch": 3872} {"train_loss": -25.80608558654785, "global_step": 321452, "epoch": 3872} {"train_loss": -25.80824851989746, "global_step": 321453, "epoch": 3872} {"train_loss": -25.90525245666504, "global_step": 321454, "epoch": 3872} {"train_loss": -26.228281021118164, "global_step": 321455, "epoch": 3872} {"train_loss": -25.464643478393555, "global_step": 321456, "epoch": 3872} {"train_loss": -25.71510124206543, "global_step": 321457, "epoch": 3872} {"train_loss": -25.82031523463238, "global_step": 321458, "epoch": 3872, "val_loss": 7261348.0} {"train_loss": -25.27645492553711, "global_step": 321459, "epoch": 3873} {"train_loss": -25.144657135009766, "global_step": 321460, "epoch": 3873} {"train_loss": -25.30977439880371, "global_step": 321461, "epoch": 3873} {"train_loss": -25.056541442871094, "global_step": 321462, "epoch": 3873} {"train_loss": -25.330551147460938, "global_step": 321463, "epoch": 3873} {"train_loss": -25.211896896362305, "global_step": 321464, "epoch": 3873} {"train_loss": -25.53580665588379, "global_step": 321465, "epoch": 3873} {"train_loss": -25.342914581298828, "global_step": 321466, "epoch": 3873} {"train_loss": -24.063703536987305, "global_step": 321467, "epoch": 3873} {"train_loss": -25.343982696533203, "global_step": 321468, "epoch": 3873} {"train_loss": -25.29301643371582, "global_step": 321469, "epoch": 3873} {"train_loss": -25.536733627319336, "global_step": 321470, "epoch": 3873} {"train_loss": -25.185171127319336, "global_step": 321471, "epoch": 3873} {"train_loss": -25.211477279663086, "global_step": 321472, "epoch": 3873} {"train_loss": -25.193649291992188, "global_step": 321473, "epoch": 3873} {"train_loss": -25.791446685791016, "global_step": 321474, "epoch": 3873} {"train_loss": -25.8159236907959, "global_step": 321475, "epoch": 3873} {"train_loss": -25.381736755371094, "global_step": 321476, "epoch": 3873} {"train_loss": -25.549625396728516, "global_step": 321477, "epoch": 3873} {"train_loss": -25.665082931518555, "global_step": 321478, "epoch": 3873} {"train_loss": -25.841012954711914, "global_step": 321479, "epoch": 3873} {"train_loss": -25.796295166015625, "global_step": 321480, "epoch": 3873} {"train_loss": -25.66731071472168, "global_step": 321481, "epoch": 3873} {"train_loss": -26.108142852783203, "global_step": 321482, "epoch": 3873} {"train_loss": -25.50370216369629, "global_step": 321483, "epoch": 3873} {"train_loss": -25.769180297851562, "global_step": 321484, "epoch": 3873} {"train_loss": -26.022689819335938, "global_step": 321485, "epoch": 3873} {"train_loss": -25.51382827758789, "global_step": 321486, "epoch": 3873} {"train_loss": -25.562856674194336, "global_step": 321487, "epoch": 3873} {"train_loss": -25.705190658569336, "global_step": 321488, "epoch": 3873} {"train_loss": -25.816587448120117, "global_step": 321489, "epoch": 3873} {"train_loss": -25.836505889892578, "global_step": 321490, "epoch": 3873} {"train_loss": -26.178075790405273, "global_step": 321491, "epoch": 3873} {"train_loss": -26.060373306274414, "global_step": 321492, "epoch": 3873} {"train_loss": -25.797544479370117, "global_step": 321493, "epoch": 3873} {"train_loss": -26.206769943237305, "global_step": 321494, "epoch": 3873} {"train_loss": -25.717798233032227, "global_step": 321495, "epoch": 3873} {"train_loss": -25.962865829467773, "global_step": 321496, "epoch": 3873} {"train_loss": -26.183958053588867, "global_step": 321497, "epoch": 3873} {"train_loss": -25.997638702392578, "global_step": 321498, "epoch": 3873} {"train_loss": -25.642683029174805, "global_step": 321499, "epoch": 3873} {"train_loss": -25.85249900817871, "global_step": 321500, "epoch": 3873} {"train_loss": -25.330385208129883, "global_step": 321501, "epoch": 3873} {"train_loss": -25.883182525634766, "global_step": 321502, "epoch": 3873} {"train_loss": -26.1177921295166, "global_step": 321503, "epoch": 3873} {"train_loss": -25.859766006469727, "global_step": 321504, "epoch": 3873} {"train_loss": -25.688465118408203, "global_step": 321505, "epoch": 3873} {"train_loss": -25.94929313659668, "global_step": 321506, "epoch": 3873} {"train_loss": -26.038471221923828, "global_step": 321507, "epoch": 3873} {"train_loss": -25.698944091796875, "global_step": 321508, "epoch": 3873} {"train_loss": -25.247995376586914, "global_step": 321509, "epoch": 3873} {"train_loss": -25.290407180786133, "global_step": 321510, "epoch": 3873} {"train_loss": -25.712360382080078, "global_step": 321511, "epoch": 3873} {"train_loss": -25.881366729736328, "global_step": 321512, "epoch": 3873} {"train_loss": -25.54829216003418, "global_step": 321513, "epoch": 3873} {"train_loss": -25.742755889892578, "global_step": 321514, "epoch": 3873} {"train_loss": -25.856006622314453, "global_step": 321515, "epoch": 3873} {"train_loss": -25.954345703125, "global_step": 321516, "epoch": 3873} {"train_loss": -25.42091941833496, "global_step": 321517, "epoch": 3873} {"train_loss": -25.456552505493164, "global_step": 321518, "epoch": 3873} {"train_loss": -25.81989860534668, "global_step": 321519, "epoch": 3873} {"train_loss": -26.018020629882812, "global_step": 321520, "epoch": 3873} {"train_loss": -25.745458602905273, "global_step": 321521, "epoch": 3873} {"train_loss": -25.87900733947754, "global_step": 321522, "epoch": 3873} {"train_loss": -25.839147567749023, "global_step": 321523, "epoch": 3873} {"train_loss": -25.774002075195312, "global_step": 321524, "epoch": 3873} {"train_loss": -25.686552047729492, "global_step": 321525, "epoch": 3873} {"train_loss": -25.793750762939453, "global_step": 321526, "epoch": 3873} {"train_loss": -25.664627075195312, "global_step": 321527, "epoch": 3873} {"train_loss": -25.5864200592041, "global_step": 321528, "epoch": 3873} {"train_loss": -25.786203384399414, "global_step": 321529, "epoch": 3873} {"train_loss": -25.030027389526367, "global_step": 321530, "epoch": 3873} {"train_loss": -25.710973739624023, "global_step": 321531, "epoch": 3873} {"train_loss": -25.830968856811523, "global_step": 321532, "epoch": 3873} {"train_loss": -25.966705322265625, "global_step": 321533, "epoch": 3873} {"train_loss": -25.70863151550293, "global_step": 321534, "epoch": 3873} {"train_loss": -25.693267822265625, "global_step": 321535, "epoch": 3873} {"train_loss": -25.736364364624023, "global_step": 321536, "epoch": 3873} {"train_loss": -25.805377960205078, "global_step": 321537, "epoch": 3873} {"train_loss": -25.89272117614746, "global_step": 321538, "epoch": 3873} {"train_loss": -26.114837646484375, "global_step": 321539, "epoch": 3873} {"train_loss": -25.564151763916016, "global_step": 321540, "epoch": 3873} {"train_loss": -25.62911490934441, "global_step": 321541, "epoch": 3873, "val_loss": 7229612.0} {"train_loss": -25.279821395874023, "global_step": 321542, "epoch": 3874} {"train_loss": -25.174251556396484, "global_step": 321543, "epoch": 3874} {"train_loss": -25.07182502746582, "global_step": 321544, "epoch": 3874} {"train_loss": -25.344518661499023, "global_step": 321545, "epoch": 3874} {"train_loss": -25.530439376831055, "global_step": 321546, "epoch": 3874} {"train_loss": -25.052907943725586, "global_step": 321547, "epoch": 3874} {"train_loss": -25.1878719329834, "global_step": 321548, "epoch": 3874} {"train_loss": -25.513734817504883, "global_step": 321549, "epoch": 3874} {"train_loss": -25.452411651611328, "global_step": 321550, "epoch": 3874} {"train_loss": -25.552066802978516, "global_step": 321551, "epoch": 3874} {"train_loss": -25.360069274902344, "global_step": 321552, "epoch": 3874} {"train_loss": -25.455976486206055, "global_step": 321553, "epoch": 3874} {"train_loss": -25.606306076049805, "global_step": 321554, "epoch": 3874} {"train_loss": -25.581449508666992, "global_step": 321555, "epoch": 3874} {"train_loss": -25.50592041015625, "global_step": 321556, "epoch": 3874} {"train_loss": -25.32257080078125, "global_step": 321557, "epoch": 3874} {"train_loss": -25.6679630279541, "global_step": 321558, "epoch": 3874} {"train_loss": -25.26252555847168, "global_step": 321559, "epoch": 3874} {"train_loss": -25.407207489013672, "global_step": 321560, "epoch": 3874} {"train_loss": -25.445465087890625, "global_step": 321561, "epoch": 3874} {"train_loss": -25.84697914123535, "global_step": 321562, "epoch": 3874} {"train_loss": -25.558006286621094, "global_step": 321563, "epoch": 3874} {"train_loss": -25.796117782592773, "global_step": 321564, "epoch": 3874} {"train_loss": -25.73443603515625, "global_step": 321565, "epoch": 3874} {"train_loss": -25.543996810913086, "global_step": 321566, "epoch": 3874} {"train_loss": -25.652685165405273, "global_step": 321567, "epoch": 3874} {"train_loss": -25.634140014648438, "global_step": 321568, "epoch": 3874} {"train_loss": -25.89651870727539, "global_step": 321569, "epoch": 3874} {"train_loss": -25.63252830505371, "global_step": 321570, "epoch": 3874} {"train_loss": -25.855321884155273, "global_step": 321571, "epoch": 3874} {"train_loss": -25.861921310424805, "global_step": 321572, "epoch": 3874} {"train_loss": -26.216894149780273, "global_step": 321573, "epoch": 3874} {"train_loss": -25.940616607666016, "global_step": 321574, "epoch": 3874} {"train_loss": -25.957412719726562, "global_step": 321575, "epoch": 3874} {"train_loss": -25.67266273498535, "global_step": 321576, "epoch": 3874} {"train_loss": -25.903242111206055, "global_step": 321577, "epoch": 3874} {"train_loss": -25.81984519958496, "global_step": 321578, "epoch": 3874} {"train_loss": -25.566802978515625, "global_step": 321579, "epoch": 3874} {"train_loss": -25.52593994140625, "global_step": 321580, "epoch": 3874} {"train_loss": -25.82253074645996, "global_step": 321581, "epoch": 3874} {"train_loss": -25.561918258666992, "global_step": 321582, "epoch": 3874} {"train_loss": -25.924970626831055, "global_step": 321583, "epoch": 3874} {"train_loss": -26.070905685424805, "global_step": 321584, "epoch": 3874} {"train_loss": -26.16409683227539, "global_step": 321585, "epoch": 3874} {"train_loss": -26.102415084838867, "global_step": 321586, "epoch": 3874} {"train_loss": -25.88739013671875, "global_step": 321587, "epoch": 3874} {"train_loss": -26.15171241760254, "global_step": 321588, "epoch": 3874} {"train_loss": -25.673648834228516, "global_step": 321589, "epoch": 3874} {"train_loss": -25.684772491455078, "global_step": 321590, "epoch": 3874} {"train_loss": -25.91594886779785, "global_step": 321591, "epoch": 3874} {"train_loss": -25.7391357421875, "global_step": 321592, "epoch": 3874} {"train_loss": -25.53306007385254, "global_step": 321593, "epoch": 3874} {"train_loss": -25.817340850830078, "global_step": 321594, "epoch": 3874} {"train_loss": -25.530237197875977, "global_step": 321595, "epoch": 3874} {"train_loss": -26.065185546875, "global_step": 321596, "epoch": 3874} {"train_loss": -25.975393295288086, "global_step": 321597, "epoch": 3874} {"train_loss": -26.26837158203125, "global_step": 321598, "epoch": 3874} {"train_loss": -26.003265380859375, "global_step": 321599, "epoch": 3874} {"train_loss": -26.0494384765625, "global_step": 321600, "epoch": 3874} {"train_loss": -25.91096305847168, "global_step": 321601, "epoch": 3874} {"train_loss": -25.861785888671875, "global_step": 321602, "epoch": 3874} {"train_loss": -25.788330078125, "global_step": 321603, "epoch": 3874} {"train_loss": -26.23020362854004, "global_step": 321604, "epoch": 3874} {"train_loss": -25.935468673706055, "global_step": 321605, "epoch": 3874} {"train_loss": -26.137571334838867, "global_step": 321606, "epoch": 3874} {"train_loss": -25.918737411499023, "global_step": 321607, "epoch": 3874} {"train_loss": -26.185943603515625, "global_step": 321608, "epoch": 3874} {"train_loss": -25.879499435424805, "global_step": 321609, "epoch": 3874} {"train_loss": -25.598072052001953, "global_step": 321610, "epoch": 3874} {"train_loss": -25.790420532226562, "global_step": 321611, "epoch": 3874} {"train_loss": -25.90692138671875, "global_step": 321612, "epoch": 3874} {"train_loss": -25.82843017578125, "global_step": 321613, "epoch": 3874} {"train_loss": -25.84893226623535, "global_step": 321614, "epoch": 3874} {"train_loss": -25.711225509643555, "global_step": 321615, "epoch": 3874} {"train_loss": -25.936721801757812, "global_step": 321616, "epoch": 3874} {"train_loss": -25.631591796875, "global_step": 321617, "epoch": 3874} {"train_loss": -25.846332550048828, "global_step": 321618, "epoch": 3874} {"train_loss": -25.720014572143555, "global_step": 321619, "epoch": 3874} {"train_loss": -26.1724910736084, "global_step": 321620, "epoch": 3874} {"train_loss": -25.89324951171875, "global_step": 321621, "epoch": 3874} {"train_loss": -25.945117950439453, "global_step": 321622, "epoch": 3874} {"train_loss": -26.095855712890625, "global_step": 321623, "epoch": 3874} {"train_loss": -25.764786249183746, "global_step": 321624, "epoch": 3874, "val_loss": 7165698.0} {"train_loss": -25.139421463012695, "global_step": 321625, "epoch": 3875} {"train_loss": -24.391143798828125, "global_step": 321626, "epoch": 3875} {"train_loss": -25.12983512878418, "global_step": 321627, "epoch": 3875} {"train_loss": -25.175718307495117, "global_step": 321628, "epoch": 3875} {"train_loss": -25.241886138916016, "global_step": 321629, "epoch": 3875} {"train_loss": -25.263044357299805, "global_step": 321630, "epoch": 3875} {"train_loss": -25.256572723388672, "global_step": 321631, "epoch": 3875} {"train_loss": -25.360977172851562, "global_step": 321632, "epoch": 3875} {"train_loss": -25.425994873046875, "global_step": 321633, "epoch": 3875} {"train_loss": -25.354555130004883, "global_step": 321634, "epoch": 3875} {"train_loss": -25.56056785583496, "global_step": 321635, "epoch": 3875} {"train_loss": -25.564239501953125, "global_step": 321636, "epoch": 3875} {"train_loss": -25.537153244018555, "global_step": 321637, "epoch": 3875} {"train_loss": -25.269319534301758, "global_step": 321638, "epoch": 3875} {"train_loss": -25.728717803955078, "global_step": 321639, "epoch": 3875} {"train_loss": -25.580495834350586, "global_step": 321640, "epoch": 3875} {"train_loss": -25.835927963256836, "global_step": 321641, "epoch": 3875} {"train_loss": -25.509672164916992, "global_step": 321642, "epoch": 3875} {"train_loss": -25.918935775756836, "global_step": 321643, "epoch": 3875} {"train_loss": -25.549930572509766, "global_step": 321644, "epoch": 3875} {"train_loss": -25.722583770751953, "global_step": 321645, "epoch": 3875} {"train_loss": -25.570302963256836, "global_step": 321646, "epoch": 3875} {"train_loss": -26.026819229125977, "global_step": 321647, "epoch": 3875} {"train_loss": -25.801321029663086, "global_step": 321648, "epoch": 3875} {"train_loss": -25.786645889282227, "global_step": 321649, "epoch": 3875} {"train_loss": -25.69618034362793, "global_step": 321650, "epoch": 3875} {"train_loss": -25.716665267944336, "global_step": 321651, "epoch": 3875} {"train_loss": -25.67426109313965, "global_step": 321652, "epoch": 3875} {"train_loss": -25.93192481994629, "global_step": 321653, "epoch": 3875} {"train_loss": -25.906095504760742, "global_step": 321654, "epoch": 3875} {"train_loss": -25.944509506225586, "global_step": 321655, "epoch": 3875} {"train_loss": -25.859216690063477, "global_step": 321656, "epoch": 3875} {"train_loss": -25.999719619750977, "global_step": 321657, "epoch": 3875} {"train_loss": -26.193695068359375, "global_step": 321658, "epoch": 3875} {"train_loss": -25.885740280151367, "global_step": 321659, "epoch": 3875} {"train_loss": -26.077341079711914, "global_step": 321660, "epoch": 3875} {"train_loss": -25.879648208618164, "global_step": 321661, "epoch": 3875} {"train_loss": -25.91657066345215, "global_step": 321662, "epoch": 3875} {"train_loss": -26.039175033569336, "global_step": 321663, "epoch": 3875} {"train_loss": -26.16977882385254, "global_step": 321664, "epoch": 3875} {"train_loss": -25.777292251586914, "global_step": 321665, "epoch": 3875} {"train_loss": -26.238117218017578, "global_step": 321666, "epoch": 3875} {"train_loss": -26.17866325378418, "global_step": 321667, "epoch": 3875} {"train_loss": -26.260725021362305, "global_step": 321668, "epoch": 3875} {"train_loss": -25.9801082611084, "global_step": 321669, "epoch": 3875} {"train_loss": -26.356582641601562, "global_step": 321670, "epoch": 3875} {"train_loss": -26.326642990112305, "global_step": 321671, "epoch": 3875} {"train_loss": -25.906797409057617, "global_step": 321672, "epoch": 3875} {"train_loss": -26.163949966430664, "global_step": 321673, "epoch": 3875} {"train_loss": -26.09840202331543, "global_step": 321674, "epoch": 3875} {"train_loss": -25.81842041015625, "global_step": 321675, "epoch": 3875} {"train_loss": -25.882028579711914, "global_step": 321676, "epoch": 3875} {"train_loss": -26.196943283081055, "global_step": 321677, "epoch": 3875} {"train_loss": -26.123579025268555, "global_step": 321678, "epoch": 3875} {"train_loss": -25.84819984436035, "global_step": 321679, "epoch": 3875} {"train_loss": -26.29775047302246, "global_step": 321680, "epoch": 3875} {"train_loss": -26.06868553161621, "global_step": 321681, "epoch": 3875} {"train_loss": -25.588539123535156, "global_step": 321682, "epoch": 3875} {"train_loss": -25.89533805847168, "global_step": 321683, "epoch": 3875} {"train_loss": -25.827463150024414, "global_step": 321684, "epoch": 3875} {"train_loss": -25.49652671813965, "global_step": 321685, "epoch": 3875} {"train_loss": -25.41843032836914, "global_step": 321686, "epoch": 3875} {"train_loss": -25.397584915161133, "global_step": 321687, "epoch": 3875} {"train_loss": -25.402448654174805, "global_step": 321688, "epoch": 3875} {"train_loss": -25.04524803161621, "global_step": 321689, "epoch": 3875} {"train_loss": -25.7737979888916, "global_step": 321690, "epoch": 3875} {"train_loss": -25.826129913330078, "global_step": 321691, "epoch": 3875} {"train_loss": -25.725996017456055, "global_step": 321692, "epoch": 3875} {"train_loss": -25.600461959838867, "global_step": 321693, "epoch": 3875} {"train_loss": -25.973852157592773, "global_step": 321694, "epoch": 3875} {"train_loss": -25.78326988220215, "global_step": 321695, "epoch": 3875} {"train_loss": -25.9215030670166, "global_step": 321696, "epoch": 3875} {"train_loss": -26.237411499023438, "global_step": 321697, "epoch": 3875} {"train_loss": -25.450042724609375, "global_step": 321698, "epoch": 3875} {"train_loss": -26.07380485534668, "global_step": 321699, "epoch": 3875} {"train_loss": -25.996667861938477, "global_step": 321700, "epoch": 3875} {"train_loss": -25.97053337097168, "global_step": 321701, "epoch": 3875} {"train_loss": -26.02182960510254, "global_step": 321702, "epoch": 3875} {"train_loss": -25.65511131286621, "global_step": 321703, "epoch": 3875} {"train_loss": -25.797941207885742, "global_step": 321704, "epoch": 3875} {"train_loss": -25.983642578125, "global_step": 321705, "epoch": 3875} {"train_loss": -26.033599853515625, "global_step": 321706, "epoch": 3875} {"train_loss": -25.79362662441759, "global_step": 321707, "epoch": 3875, "val_loss": 7197735.0} {"train_loss": -25.19724464416504, "global_step": 321708, "epoch": 3876} {"train_loss": -25.5234317779541, "global_step": 321709, "epoch": 3876} {"train_loss": -25.68310546875, "global_step": 321710, "epoch": 3876} {"train_loss": -25.90447425842285, "global_step": 321711, "epoch": 3876} {"train_loss": -25.800634384155273, "global_step": 321712, "epoch": 3876} {"train_loss": -25.643163681030273, "global_step": 321713, "epoch": 3876} {"train_loss": -25.841842651367188, "global_step": 321714, "epoch": 3876} {"train_loss": -25.58453369140625, "global_step": 321715, "epoch": 3876} {"train_loss": -26.090421676635742, "global_step": 321716, "epoch": 3876} {"train_loss": -25.913623809814453, "global_step": 321717, "epoch": 3876} {"train_loss": -25.923681259155273, "global_step": 321718, "epoch": 3876} {"train_loss": -25.870031356811523, "global_step": 321719, "epoch": 3876} {"train_loss": -25.896015167236328, "global_step": 321720, "epoch": 3876} {"train_loss": -26.429555892944336, "global_step": 321721, "epoch": 3876} {"train_loss": -25.719818115234375, "global_step": 321722, "epoch": 3876} {"train_loss": -26.21082878112793, "global_step": 321723, "epoch": 3876} {"train_loss": -25.806623458862305, "global_step": 321724, "epoch": 3876} {"train_loss": -26.052066802978516, "global_step": 321725, "epoch": 3876} {"train_loss": -25.787708282470703, "global_step": 321726, "epoch": 3876} {"train_loss": -25.746061325073242, "global_step": 321727, "epoch": 3876} {"train_loss": -26.054580688476562, "global_step": 321728, "epoch": 3876} {"train_loss": -25.9364013671875, "global_step": 321729, "epoch": 3876} {"train_loss": -25.850271224975586, "global_step": 321730, "epoch": 3876} {"train_loss": -26.10346794128418, "global_step": 321731, "epoch": 3876} {"train_loss": -25.82984733581543, "global_step": 321732, "epoch": 3876} {"train_loss": -25.89487648010254, "global_step": 321733, "epoch": 3876} {"train_loss": -26.106510162353516, "global_step": 321734, "epoch": 3876} {"train_loss": -26.25547218322754, "global_step": 321735, "epoch": 3876} {"train_loss": -25.970712661743164, "global_step": 321736, "epoch": 3876} {"train_loss": -26.1025390625, "global_step": 321737, "epoch": 3876} {"train_loss": -25.823705673217773, "global_step": 321738, "epoch": 3876} {"train_loss": -26.287405014038086, "global_step": 321739, "epoch": 3876} {"train_loss": -25.563024520874023, "global_step": 321740, "epoch": 3876} {"train_loss": -25.696020126342773, "global_step": 321741, "epoch": 3876} {"train_loss": -25.820392608642578, "global_step": 321742, "epoch": 3876} {"train_loss": -25.56171226501465, "global_step": 321743, "epoch": 3876} {"train_loss": -25.751386642456055, "global_step": 321744, "epoch": 3876} {"train_loss": -26.021825790405273, "global_step": 321745, "epoch": 3876} {"train_loss": -26.05194664001465, "global_step": 321746, "epoch": 3876} {"train_loss": -26.24061393737793, "global_step": 321747, "epoch": 3876} {"train_loss": -25.849655151367188, "global_step": 321748, "epoch": 3876} {"train_loss": -26.039785385131836, "global_step": 321749, "epoch": 3876} {"train_loss": -25.934894561767578, "global_step": 321750, "epoch": 3876} {"train_loss": -26.197101593017578, "global_step": 321751, "epoch": 3876} {"train_loss": -25.877548217773438, "global_step": 321752, "epoch": 3876} {"train_loss": -25.512760162353516, "global_step": 321753, "epoch": 3876} {"train_loss": -25.847944259643555, "global_step": 321754, "epoch": 3876} {"train_loss": -25.740039825439453, "global_step": 321755, "epoch": 3876} {"train_loss": -25.58064842224121, "global_step": 321756, "epoch": 3876} {"train_loss": -25.67854118347168, "global_step": 321757, "epoch": 3876} {"train_loss": -25.327068328857422, "global_step": 321758, "epoch": 3876} {"train_loss": -25.50058364868164, "global_step": 321759, "epoch": 3876} {"train_loss": -25.357309341430664, "global_step": 321760, "epoch": 3876} {"train_loss": -25.913589477539062, "global_step": 321761, "epoch": 3876} {"train_loss": -25.663129806518555, "global_step": 321762, "epoch": 3876} {"train_loss": -25.991926193237305, "global_step": 321763, "epoch": 3876} {"train_loss": -25.998126983642578, "global_step": 321764, "epoch": 3876} {"train_loss": -26.29998779296875, "global_step": 321765, "epoch": 3876} {"train_loss": -25.602680206298828, "global_step": 321766, "epoch": 3876} {"train_loss": -25.45069694519043, "global_step": 321767, "epoch": 3876} {"train_loss": -25.92803955078125, "global_step": 321768, "epoch": 3876} {"train_loss": -25.924484252929688, "global_step": 321769, "epoch": 3876} {"train_loss": -25.965072631835938, "global_step": 321770, "epoch": 3876} {"train_loss": -26.1199893951416, "global_step": 321771, "epoch": 3876} {"train_loss": -26.005157470703125, "global_step": 321772, "epoch": 3876} {"train_loss": -25.631223678588867, "global_step": 321773, "epoch": 3876} {"train_loss": -25.907251358032227, "global_step": 321774, "epoch": 3876} {"train_loss": -26.092992782592773, "global_step": 321775, "epoch": 3876} {"train_loss": -25.960941314697266, "global_step": 321776, "epoch": 3876} {"train_loss": -25.881820678710938, "global_step": 321777, "epoch": 3876} {"train_loss": -25.736286163330078, "global_step": 321778, "epoch": 3876} {"train_loss": -25.612985610961914, "global_step": 321779, "epoch": 3876} {"train_loss": -26.219696044921875, "global_step": 321780, "epoch": 3876} {"train_loss": -26.22153091430664, "global_step": 321781, "epoch": 3876} {"train_loss": -26.014646530151367, "global_step": 321782, "epoch": 3876} {"train_loss": -25.95111656188965, "global_step": 321783, "epoch": 3876} {"train_loss": -25.9182071685791, "global_step": 321784, "epoch": 3876} {"train_loss": -25.555797576904297, "global_step": 321785, "epoch": 3876} {"train_loss": -26.027563095092773, "global_step": 321786, "epoch": 3876} {"train_loss": -26.2487735748291, "global_step": 321787, "epoch": 3876} {"train_loss": -26.0004940032959, "global_step": 321788, "epoch": 3876} {"train_loss": -26.094440460205078, "global_step": 321789, "epoch": 3876} {"train_loss": -25.879782596266413, "global_step": 321790, "epoch": 3876, "val_loss": 7168097.0} {"train_loss": -25.817724227905273, "global_step": 321791, "epoch": 3877} {"train_loss": -25.18220329284668, "global_step": 321792, "epoch": 3877} {"train_loss": -25.667438507080078, "global_step": 321793, "epoch": 3877} {"train_loss": -25.771728515625, "global_step": 321794, "epoch": 3877} {"train_loss": -25.639814376831055, "global_step": 321795, "epoch": 3877} {"train_loss": -25.027807235717773, "global_step": 321796, "epoch": 3877} {"train_loss": -25.16408348083496, "global_step": 321797, "epoch": 3877} {"train_loss": -25.540267944335938, "global_step": 321798, "epoch": 3877} {"train_loss": -25.9322509765625, "global_step": 321799, "epoch": 3877} {"train_loss": -25.039813995361328, "global_step": 321800, "epoch": 3877} {"train_loss": -25.761783599853516, "global_step": 321801, "epoch": 3877} {"train_loss": -25.734052658081055, "global_step": 321802, "epoch": 3877} {"train_loss": -25.732946395874023, "global_step": 321803, "epoch": 3877} {"train_loss": -25.76544189453125, "global_step": 321804, "epoch": 3877} {"train_loss": -25.46650505065918, "global_step": 321805, "epoch": 3877} {"train_loss": -25.648710250854492, "global_step": 321806, "epoch": 3877} {"train_loss": -25.88667106628418, "global_step": 321807, "epoch": 3877} {"train_loss": -25.799718856811523, "global_step": 321808, "epoch": 3877} {"train_loss": -25.726255416870117, "global_step": 321809, "epoch": 3877} {"train_loss": -25.68903923034668, "global_step": 321810, "epoch": 3877} {"train_loss": -25.74180030822754, "global_step": 321811, "epoch": 3877} {"train_loss": -25.984399795532227, "global_step": 321812, "epoch": 3877} {"train_loss": -25.66497230529785, "global_step": 321813, "epoch": 3877} {"train_loss": -25.807641983032227, "global_step": 321814, "epoch": 3877} {"train_loss": -25.69999122619629, "global_step": 321815, "epoch": 3877} {"train_loss": -25.95830726623535, "global_step": 321816, "epoch": 3877} {"train_loss": -25.679807662963867, "global_step": 321817, "epoch": 3877} {"train_loss": -25.76456642150879, "global_step": 321818, "epoch": 3877} {"train_loss": -26.144140243530273, "global_step": 321819, "epoch": 3877} {"train_loss": -25.8867130279541, "global_step": 321820, "epoch": 3877} {"train_loss": -25.980947494506836, "global_step": 321821, "epoch": 3877} {"train_loss": -26.129362106323242, "global_step": 321822, "epoch": 3877} {"train_loss": -25.993844985961914, "global_step": 321823, "epoch": 3877} {"train_loss": -25.673925399780273, "global_step": 321824, "epoch": 3877} {"train_loss": -26.014982223510742, "global_step": 321825, "epoch": 3877} {"train_loss": -26.11187171936035, "global_step": 321826, "epoch": 3877} {"train_loss": -25.940088272094727, "global_step": 321827, "epoch": 3877} {"train_loss": -26.106964111328125, "global_step": 321828, "epoch": 3877} {"train_loss": -26.100311279296875, "global_step": 321829, "epoch": 3877} {"train_loss": -25.91815185546875, "global_step": 321830, "epoch": 3877} {"train_loss": -26.23142433166504, "global_step": 321831, "epoch": 3877} {"train_loss": -25.984521865844727, "global_step": 321832, "epoch": 3877} {"train_loss": -26.140684127807617, "global_step": 321833, "epoch": 3877} {"train_loss": -26.078039169311523, "global_step": 321834, "epoch": 3877} {"train_loss": -25.838672637939453, "global_step": 321835, "epoch": 3877} {"train_loss": -25.991384506225586, "global_step": 321836, "epoch": 3877} {"train_loss": -26.266279220581055, "global_step": 321837, "epoch": 3877} {"train_loss": -26.240936279296875, "global_step": 321838, "epoch": 3877} {"train_loss": -26.31123161315918, "global_step": 321839, "epoch": 3877} {"train_loss": -25.899991989135742, "global_step": 321840, "epoch": 3877} {"train_loss": -25.848682403564453, "global_step": 321841, "epoch": 3877} {"train_loss": -26.37929344177246, "global_step": 321842, "epoch": 3877} {"train_loss": -25.82087516784668, "global_step": 321843, "epoch": 3877} {"train_loss": -25.867877960205078, "global_step": 321844, "epoch": 3877} {"train_loss": -25.485898971557617, "global_step": 321845, "epoch": 3877} {"train_loss": -25.307092666625977, "global_step": 321846, "epoch": 3877} {"train_loss": -25.53255271911621, "global_step": 321847, "epoch": 3877} {"train_loss": -25.34172821044922, "global_step": 321848, "epoch": 3877} {"train_loss": -26.066679000854492, "global_step": 321849, "epoch": 3877} {"train_loss": -25.77203369140625, "global_step": 321850, "epoch": 3877} {"train_loss": -25.618011474609375, "global_step": 321851, "epoch": 3877} {"train_loss": -25.630157470703125, "global_step": 321852, "epoch": 3877} {"train_loss": -26.199783325195312, "global_step": 321853, "epoch": 3877} {"train_loss": -25.686248779296875, "global_step": 321854, "epoch": 3877} {"train_loss": -26.06917381286621, "global_step": 321855, "epoch": 3877} {"train_loss": -26.207361221313477, "global_step": 321856, "epoch": 3877} {"train_loss": -25.7611026763916, "global_step": 321857, "epoch": 3877} {"train_loss": -25.939844131469727, "global_step": 321858, "epoch": 3877} {"train_loss": -25.864233016967773, "global_step": 321859, "epoch": 3877} {"train_loss": -25.723737716674805, "global_step": 321860, "epoch": 3877} {"train_loss": -25.69415855407715, "global_step": 321861, "epoch": 3877} {"train_loss": -25.862628936767578, "global_step": 321862, "epoch": 3877} {"train_loss": -25.7628173828125, "global_step": 321863, "epoch": 3877} {"train_loss": -25.66377067565918, "global_step": 321864, "epoch": 3877} {"train_loss": -25.677234649658203, "global_step": 321865, "epoch": 3877} {"train_loss": -25.611927032470703, "global_step": 321866, "epoch": 3877} {"train_loss": -25.7031192779541, "global_step": 321867, "epoch": 3877} {"train_loss": -25.40873908996582, "global_step": 321868, "epoch": 3877} {"train_loss": -25.92433738708496, "global_step": 321869, "epoch": 3877} {"train_loss": -25.77739906311035, "global_step": 321870, "epoch": 3877} {"train_loss": -25.87346839904785, "global_step": 321871, "epoch": 3877} {"train_loss": -25.91408348083496, "global_step": 321872, "epoch": 3877} {"train_loss": -25.815644114850514, "global_step": 321873, "epoch": 3877, "val_loss": 7071725.0} {"train_loss": -24.73185157775879, "global_step": 321874, "epoch": 3878} {"train_loss": -24.81966209411621, "global_step": 321875, "epoch": 3878} {"train_loss": -25.220672607421875, "global_step": 321876, "epoch": 3878} {"train_loss": -24.855369567871094, "global_step": 321877, "epoch": 3878} {"train_loss": -25.335063934326172, "global_step": 321878, "epoch": 3878} {"train_loss": -24.6756649017334, "global_step": 321879, "epoch": 3878} {"train_loss": -25.628286361694336, "global_step": 321880, "epoch": 3878} {"train_loss": -25.216957092285156, "global_step": 321881, "epoch": 3878} {"train_loss": -25.231016159057617, "global_step": 321882, "epoch": 3878} {"train_loss": -25.123884201049805, "global_step": 321883, "epoch": 3878} {"train_loss": -24.984882354736328, "global_step": 321884, "epoch": 3878} {"train_loss": -24.763774871826172, "global_step": 321885, "epoch": 3878} {"train_loss": -25.4021053314209, "global_step": 321886, "epoch": 3878} {"train_loss": -25.159772872924805, "global_step": 321887, "epoch": 3878} {"train_loss": -24.798694610595703, "global_step": 321888, "epoch": 3878} {"train_loss": -25.53117561340332, "global_step": 321889, "epoch": 3878} {"train_loss": -25.209978103637695, "global_step": 321890, "epoch": 3878} {"train_loss": -25.21946144104004, "global_step": 321891, "epoch": 3878} {"train_loss": -25.60306167602539, "global_step": 321892, "epoch": 3878} {"train_loss": -25.287229537963867, "global_step": 321893, "epoch": 3878} {"train_loss": -25.290891647338867, "global_step": 321894, "epoch": 3878} {"train_loss": -25.703405380249023, "global_step": 321895, "epoch": 3878} {"train_loss": -25.76936912536621, "global_step": 321896, "epoch": 3878} {"train_loss": -25.30630111694336, "global_step": 321897, "epoch": 3878} {"train_loss": -25.586021423339844, "global_step": 321898, "epoch": 3878} {"train_loss": -25.900609970092773, "global_step": 321899, "epoch": 3878} {"train_loss": -25.767364501953125, "global_step": 321900, "epoch": 3878} {"train_loss": -25.93092155456543, "global_step": 321901, "epoch": 3878} {"train_loss": -25.55197525024414, "global_step": 321902, "epoch": 3878} {"train_loss": -25.842899322509766, "global_step": 321903, "epoch": 3878} {"train_loss": -25.462553024291992, "global_step": 321904, "epoch": 3878} {"train_loss": -25.85666275024414, "global_step": 321905, "epoch": 3878} {"train_loss": -25.602924346923828, "global_step": 321906, "epoch": 3878} {"train_loss": -25.586938858032227, "global_step": 321907, "epoch": 3878} {"train_loss": -25.677845001220703, "global_step": 321908, "epoch": 3878} {"train_loss": -25.784696578979492, "global_step": 321909, "epoch": 3878} {"train_loss": -25.68263053894043, "global_step": 321910, "epoch": 3878} {"train_loss": -25.827930450439453, "global_step": 321911, "epoch": 3878} {"train_loss": -25.9940185546875, "global_step": 321912, "epoch": 3878} {"train_loss": -25.736759185791016, "global_step": 321913, "epoch": 3878} {"train_loss": -25.746877670288086, "global_step": 321914, "epoch": 3878} {"train_loss": -25.856199264526367, "global_step": 321915, "epoch": 3878} {"train_loss": -26.076215744018555, "global_step": 321916, "epoch": 3878} {"train_loss": -26.084882736206055, "global_step": 321917, "epoch": 3878} {"train_loss": -26.043455123901367, "global_step": 321918, "epoch": 3878} {"train_loss": -25.523550033569336, "global_step": 321919, "epoch": 3878} {"train_loss": -25.96258544921875, "global_step": 321920, "epoch": 3878} {"train_loss": -25.800207138061523, "global_step": 321921, "epoch": 3878} {"train_loss": -25.9477481842041, "global_step": 321922, "epoch": 3878} {"train_loss": -25.901214599609375, "global_step": 321923, "epoch": 3878} {"train_loss": -25.72269058227539, "global_step": 321924, "epoch": 3878} {"train_loss": -25.932769775390625, "global_step": 321925, "epoch": 3878} {"train_loss": -26.31269645690918, "global_step": 321926, "epoch": 3878} {"train_loss": -26.05177116394043, "global_step": 321927, "epoch": 3878} {"train_loss": -26.17494010925293, "global_step": 321928, "epoch": 3878} {"train_loss": -25.94880485534668, "global_step": 321929, "epoch": 3878} {"train_loss": -26.211957931518555, "global_step": 321930, "epoch": 3878} {"train_loss": -26.18963050842285, "global_step": 321931, "epoch": 3878} {"train_loss": -25.96607780456543, "global_step": 321932, "epoch": 3878} {"train_loss": -25.63484764099121, "global_step": 321933, "epoch": 3878} {"train_loss": -25.999570846557617, "global_step": 321934, "epoch": 3878} {"train_loss": -25.663650512695312, "global_step": 321935, "epoch": 3878} {"train_loss": -26.176746368408203, "global_step": 321936, "epoch": 3878} {"train_loss": -25.651203155517578, "global_step": 321937, "epoch": 3878} {"train_loss": -26.038602828979492, "global_step": 321938, "epoch": 3878} {"train_loss": -25.76889991760254, "global_step": 321939, "epoch": 3878} {"train_loss": -25.60706901550293, "global_step": 321940, "epoch": 3878} {"train_loss": -25.37190055847168, "global_step": 321941, "epoch": 3878} {"train_loss": -25.875120162963867, "global_step": 321942, "epoch": 3878} {"train_loss": -25.883380889892578, "global_step": 321943, "epoch": 3878} {"train_loss": -25.509288787841797, "global_step": 321944, "epoch": 3878} {"train_loss": -25.386281967163086, "global_step": 321945, "epoch": 3878} {"train_loss": -25.95672035217285, "global_step": 321946, "epoch": 3878} {"train_loss": -25.604272842407227, "global_step": 321947, "epoch": 3878} {"train_loss": -25.884714126586914, "global_step": 321948, "epoch": 3878} {"train_loss": -26.1956787109375, "global_step": 321949, "epoch": 3878} {"train_loss": -26.1409854888916, "global_step": 321950, "epoch": 3878} {"train_loss": -26.07354164123535, "global_step": 321951, "epoch": 3878} {"train_loss": -26.26129722595215, "global_step": 321952, "epoch": 3878} {"train_loss": -26.131011962890625, "global_step": 321953, "epoch": 3878} {"train_loss": -26.07952880859375, "global_step": 321954, "epoch": 3878} {"train_loss": -25.88422203063965, "global_step": 321955, "epoch": 3878} {"train_loss": -25.68262780430805, "global_step": 321956, "epoch": 3878, "val_loss": 7300343.0} {"train_loss": -24.872783660888672, "global_step": 321957, "epoch": 3879} {"train_loss": -25.69415855407715, "global_step": 321958, "epoch": 3879} {"train_loss": -25.437299728393555, "global_step": 321959, "epoch": 3879} {"train_loss": -25.37704849243164, "global_step": 321960, "epoch": 3879} {"train_loss": -25.47182846069336, "global_step": 321961, "epoch": 3879} {"train_loss": -25.741403579711914, "global_step": 321962, "epoch": 3879} {"train_loss": -25.058719635009766, "global_step": 321963, "epoch": 3879} {"train_loss": -25.64320182800293, "global_step": 321964, "epoch": 3879} {"train_loss": -25.4547176361084, "global_step": 321965, "epoch": 3879} {"train_loss": -25.90166664123535, "global_step": 321966, "epoch": 3879} {"train_loss": -26.10989761352539, "global_step": 321967, "epoch": 3879} {"train_loss": -25.860675811767578, "global_step": 321968, "epoch": 3879} {"train_loss": -25.60394287109375, "global_step": 321969, "epoch": 3879} {"train_loss": -25.927093505859375, "global_step": 321970, "epoch": 3879} {"train_loss": -25.944074630737305, "global_step": 321971, "epoch": 3879} {"train_loss": -25.533010482788086, "global_step": 321972, "epoch": 3879} {"train_loss": -25.68012809753418, "global_step": 321973, "epoch": 3879} {"train_loss": -25.906888961791992, "global_step": 321974, "epoch": 3879} {"train_loss": -25.5220947265625, "global_step": 321975, "epoch": 3879} {"train_loss": -25.722492218017578, "global_step": 321976, "epoch": 3879} {"train_loss": -25.584884643554688, "global_step": 321977, "epoch": 3879} {"train_loss": -25.87786293029785, "global_step": 321978, "epoch": 3879} {"train_loss": -26.012182235717773, "global_step": 321979, "epoch": 3879} {"train_loss": -26.017438888549805, "global_step": 321980, "epoch": 3879} {"train_loss": -25.707868576049805, "global_step": 321981, "epoch": 3879} {"train_loss": -25.617664337158203, "global_step": 321982, "epoch": 3879} {"train_loss": -25.710037231445312, "global_step": 321983, "epoch": 3879} {"train_loss": -25.8342227935791, "global_step": 321984, "epoch": 3879} {"train_loss": -25.766021728515625, "global_step": 321985, "epoch": 3879} {"train_loss": -25.70891761779785, "global_step": 321986, "epoch": 3879} {"train_loss": -25.566316604614258, "global_step": 321987, "epoch": 3879} {"train_loss": -25.800323486328125, "global_step": 321988, "epoch": 3879} {"train_loss": -26.011737823486328, "global_step": 321989, "epoch": 3879} {"train_loss": -25.69784927368164, "global_step": 321990, "epoch": 3879} {"train_loss": -26.0751895904541, "global_step": 321991, "epoch": 3879} {"train_loss": -26.226062774658203, "global_step": 321992, "epoch": 3879} {"train_loss": -26.385498046875, "global_step": 321993, "epoch": 3879} {"train_loss": -25.803558349609375, "global_step": 321994, "epoch": 3879} {"train_loss": -25.730731964111328, "global_step": 321995, "epoch": 3879} {"train_loss": -25.667804718017578, "global_step": 321996, "epoch": 3879} {"train_loss": -26.162906646728516, "global_step": 321997, "epoch": 3879} {"train_loss": -25.8577938079834, "global_step": 321998, "epoch": 3879} {"train_loss": -25.79184913635254, "global_step": 321999, "epoch": 3879} {"train_loss": -25.703857421875, "global_step": 322000, "epoch": 3879} {"train_loss": -25.885297775268555, "global_step": 322001, "epoch": 3879} {"train_loss": -26.105817794799805, "global_step": 322002, "epoch": 3879} {"train_loss": -26.085046768188477, "global_step": 322003, "epoch": 3879} {"train_loss": -25.94062614440918, "global_step": 322004, "epoch": 3879} {"train_loss": -25.75018310546875, "global_step": 322005, "epoch": 3879} {"train_loss": -25.85843276977539, "global_step": 322006, "epoch": 3879} {"train_loss": -25.930908203125, "global_step": 322007, "epoch": 3879} {"train_loss": -26.226455688476562, "global_step": 322008, "epoch": 3879} {"train_loss": -26.064773559570312, "global_step": 322009, "epoch": 3879} {"train_loss": -26.041223526000977, "global_step": 322010, "epoch": 3879} {"train_loss": -26.077869415283203, "global_step": 322011, "epoch": 3879} {"train_loss": -25.886295318603516, "global_step": 322012, "epoch": 3879} {"train_loss": -25.794544219970703, "global_step": 322013, "epoch": 3879} {"train_loss": -26.29762077331543, "global_step": 322014, "epoch": 3879} {"train_loss": -26.37184715270996, "global_step": 322015, "epoch": 3879} {"train_loss": -26.081390380859375, "global_step": 322016, "epoch": 3879} {"train_loss": -26.17170524597168, "global_step": 322017, "epoch": 3879} {"train_loss": -26.195449829101562, "global_step": 322018, "epoch": 3879} {"train_loss": -26.386188507080078, "global_step": 322019, "epoch": 3879} {"train_loss": -26.262311935424805, "global_step": 322020, "epoch": 3879} {"train_loss": -25.65852165222168, "global_step": 322021, "epoch": 3879} {"train_loss": -25.944730758666992, "global_step": 322022, "epoch": 3879} {"train_loss": -25.736221313476562, "global_step": 322023, "epoch": 3879} {"train_loss": -25.64116859436035, "global_step": 322024, "epoch": 3879} {"train_loss": -25.997394561767578, "global_step": 322025, "epoch": 3879} {"train_loss": -25.532339096069336, "global_step": 322026, "epoch": 3879} {"train_loss": -25.914703369140625, "global_step": 322027, "epoch": 3879} {"train_loss": -25.880664825439453, "global_step": 322028, "epoch": 3879} {"train_loss": -25.889789581298828, "global_step": 322029, "epoch": 3879} {"train_loss": -25.808950424194336, "global_step": 322030, "epoch": 3879} {"train_loss": -26.10589599609375, "global_step": 322031, "epoch": 3879} {"train_loss": -25.865070343017578, "global_step": 322032, "epoch": 3879} {"train_loss": -25.7315731048584, "global_step": 322033, "epoch": 3879} {"train_loss": -25.942523956298828, "global_step": 322034, "epoch": 3879} {"train_loss": -26.191146850585938, "global_step": 322035, "epoch": 3879} {"train_loss": -25.970355987548828, "global_step": 322036, "epoch": 3879} {"train_loss": -26.059736251831055, "global_step": 322037, "epoch": 3879} {"train_loss": -25.86616325378418, "global_step": 322038, "epoch": 3879} {"train_loss": -25.85678704962673, "global_step": 322039, "epoch": 3879, "val_loss": 7224112.0} {"train_loss": -25.714990615844727, "global_step": 322040, "epoch": 3880} {"train_loss": -25.023115158081055, "global_step": 322041, "epoch": 3880} {"train_loss": -25.741846084594727, "global_step": 322042, "epoch": 3880} {"train_loss": -25.714679718017578, "global_step": 322043, "epoch": 3880} {"train_loss": -25.462491989135742, "global_step": 322044, "epoch": 3880} {"train_loss": -25.452299118041992, "global_step": 322045, "epoch": 3880} {"train_loss": -25.77752113342285, "global_step": 322046, "epoch": 3880} {"train_loss": -25.464542388916016, "global_step": 322047, "epoch": 3880} {"train_loss": -25.42333984375, "global_step": 322048, "epoch": 3880} {"train_loss": -25.53539276123047, "global_step": 322049, "epoch": 3880} {"train_loss": -24.92536735534668, "global_step": 322050, "epoch": 3880} {"train_loss": -25.663171768188477, "global_step": 322051, "epoch": 3880} {"train_loss": -25.280431747436523, "global_step": 322052, "epoch": 3880} {"train_loss": -25.692419052124023, "global_step": 322053, "epoch": 3880} {"train_loss": -25.37677001953125, "global_step": 322054, "epoch": 3880} {"train_loss": -25.610370635986328, "global_step": 322055, "epoch": 3880} {"train_loss": -25.54793357849121, "global_step": 322056, "epoch": 3880} {"train_loss": -25.6989803314209, "global_step": 322057, "epoch": 3880} {"train_loss": -25.506677627563477, "global_step": 322058, "epoch": 3880} {"train_loss": -25.655805587768555, "global_step": 322059, "epoch": 3880} {"train_loss": -25.971302032470703, "global_step": 322060, "epoch": 3880} {"train_loss": -25.928668975830078, "global_step": 322061, "epoch": 3880} {"train_loss": -25.564041137695312, "global_step": 322062, "epoch": 3880} {"train_loss": -25.899221420288086, "global_step": 322063, "epoch": 3880} {"train_loss": -25.698261260986328, "global_step": 322064, "epoch": 3880} {"train_loss": -26.058074951171875, "global_step": 322065, "epoch": 3880} {"train_loss": -25.56366729736328, "global_step": 322066, "epoch": 3880} {"train_loss": -25.92181396484375, "global_step": 322067, "epoch": 3880} {"train_loss": -26.075347900390625, "global_step": 322068, "epoch": 3880} {"train_loss": -25.858020782470703, "global_step": 322069, "epoch": 3880} {"train_loss": -26.168283462524414, "global_step": 322070, "epoch": 3880} {"train_loss": -25.659595489501953, "global_step": 322071, "epoch": 3880} {"train_loss": -26.147216796875, "global_step": 322072, "epoch": 3880} {"train_loss": -26.00506591796875, "global_step": 322073, "epoch": 3880} {"train_loss": -25.821182250976562, "global_step": 322074, "epoch": 3880} {"train_loss": -26.235126495361328, "global_step": 322075, "epoch": 3880} {"train_loss": -25.751123428344727, "global_step": 322076, "epoch": 3880} {"train_loss": -26.045459747314453, "global_step": 322077, "epoch": 3880} {"train_loss": -26.10845947265625, "global_step": 322078, "epoch": 3880} {"train_loss": -26.096576690673828, "global_step": 322079, "epoch": 3880} {"train_loss": -25.73921012878418, "global_step": 322080, "epoch": 3880} {"train_loss": -25.9294490814209, "global_step": 322081, "epoch": 3880} {"train_loss": -25.82073974609375, "global_step": 322082, "epoch": 3880} {"train_loss": -25.827289581298828, "global_step": 322083, "epoch": 3880} {"train_loss": -26.18487548828125, "global_step": 322084, "epoch": 3880} {"train_loss": -25.7506160736084, "global_step": 322085, "epoch": 3880} {"train_loss": -25.447967529296875, "global_step": 322086, "epoch": 3880} {"train_loss": -25.888843536376953, "global_step": 322087, "epoch": 3880} {"train_loss": -25.354902267456055, "global_step": 322088, "epoch": 3880} {"train_loss": -25.97589111328125, "global_step": 322089, "epoch": 3880} {"train_loss": -25.996793746948242, "global_step": 322090, "epoch": 3880} {"train_loss": -25.595529556274414, "global_step": 322091, "epoch": 3880} {"train_loss": -25.949735641479492, "global_step": 322092, "epoch": 3880} {"train_loss": -25.685455322265625, "global_step": 322093, "epoch": 3880} {"train_loss": -26.20440673828125, "global_step": 322094, "epoch": 3880} {"train_loss": -25.70383644104004, "global_step": 322095, "epoch": 3880} {"train_loss": -26.23158073425293, "global_step": 322096, "epoch": 3880} {"train_loss": -25.903104782104492, "global_step": 322097, "epoch": 3880} {"train_loss": -26.059600830078125, "global_step": 322098, "epoch": 3880} {"train_loss": -26.265792846679688, "global_step": 322099, "epoch": 3880} {"train_loss": -26.0316162109375, "global_step": 322100, "epoch": 3880} {"train_loss": -25.685209274291992, "global_step": 322101, "epoch": 3880} {"train_loss": -26.085294723510742, "global_step": 322102, "epoch": 3880} {"train_loss": -25.793577194213867, "global_step": 322103, "epoch": 3880} {"train_loss": -26.010303497314453, "global_step": 322104, "epoch": 3880} {"train_loss": -25.860395431518555, "global_step": 322105, "epoch": 3880} {"train_loss": -26.1010799407959, "global_step": 322106, "epoch": 3880} {"train_loss": -25.893844604492188, "global_step": 322107, "epoch": 3880} {"train_loss": -26.333850860595703, "global_step": 322108, "epoch": 3880} {"train_loss": -25.814489364624023, "global_step": 322109, "epoch": 3880} {"train_loss": -25.512407302856445, "global_step": 322110, "epoch": 3880} {"train_loss": -25.682668685913086, "global_step": 322111, "epoch": 3880} {"train_loss": -26.11115837097168, "global_step": 322112, "epoch": 3880} {"train_loss": -25.852863311767578, "global_step": 322113, "epoch": 3880} {"train_loss": -25.756818771362305, "global_step": 322114, "epoch": 3880} {"train_loss": -25.81868553161621, "global_step": 322115, "epoch": 3880} {"train_loss": -25.820709228515625, "global_step": 322116, "epoch": 3880} {"train_loss": -25.82488441467285, "global_step": 322117, "epoch": 3880} {"train_loss": -26.091520309448242, "global_step": 322118, "epoch": 3880} {"train_loss": -25.81593132019043, "global_step": 322119, "epoch": 3880} {"train_loss": -26.00983238220215, "global_step": 322120, "epoch": 3880} {"train_loss": -26.12812614440918, "global_step": 322121, "epoch": 3880} {"train_loss": -25.833301383328724, "global_step": 322122, "epoch": 3880, "val_loss": 7209133.0} {"train_loss": -24.800582885742188, "global_step": 322123, "epoch": 3881} {"train_loss": -25.48139762878418, "global_step": 322124, "epoch": 3881} {"train_loss": -25.24587631225586, "global_step": 322125, "epoch": 3881} {"train_loss": -25.518394470214844, "global_step": 322126, "epoch": 3881} {"train_loss": -25.197799682617188, "global_step": 322127, "epoch": 3881} {"train_loss": -25.030614852905273, "global_step": 322128, "epoch": 3881} {"train_loss": -24.97316551208496, "global_step": 322129, "epoch": 3881} {"train_loss": -25.688522338867188, "global_step": 322130, "epoch": 3881} {"train_loss": -25.338729858398438, "global_step": 322131, "epoch": 3881} {"train_loss": -25.526914596557617, "global_step": 322132, "epoch": 3881} {"train_loss": -25.451765060424805, "global_step": 322133, "epoch": 3881} {"train_loss": -25.495832443237305, "global_step": 322134, "epoch": 3881} {"train_loss": -25.549039840698242, "global_step": 322135, "epoch": 3881} {"train_loss": -25.703954696655273, "global_step": 322136, "epoch": 3881} {"train_loss": -25.354785919189453, "global_step": 322137, "epoch": 3881} {"train_loss": -25.669172286987305, "global_step": 322138, "epoch": 3881} {"train_loss": -25.477325439453125, "global_step": 322139, "epoch": 3881} {"train_loss": -25.7479190826416, "global_step": 322140, "epoch": 3881} {"train_loss": -25.74494743347168, "global_step": 322141, "epoch": 3881} {"train_loss": -25.357709884643555, "global_step": 322142, "epoch": 3881} {"train_loss": -25.8924617767334, "global_step": 322143, "epoch": 3881} {"train_loss": -25.805377960205078, "global_step": 322144, "epoch": 3881} {"train_loss": -25.388471603393555, "global_step": 322145, "epoch": 3881} {"train_loss": -25.620349884033203, "global_step": 322146, "epoch": 3881} {"train_loss": -25.74627113342285, "global_step": 322147, "epoch": 3881} {"train_loss": -25.911087036132812, "global_step": 322148, "epoch": 3881} {"train_loss": -25.639785766601562, "global_step": 322149, "epoch": 3881} {"train_loss": -26.224645614624023, "global_step": 322150, "epoch": 3881} {"train_loss": -25.851001739501953, "global_step": 322151, "epoch": 3881} {"train_loss": -25.703994750976562, "global_step": 322152, "epoch": 3881} {"train_loss": -25.865402221679688, "global_step": 322153, "epoch": 3881} {"train_loss": -26.133747100830078, "global_step": 322154, "epoch": 3881} {"train_loss": -25.92569351196289, "global_step": 322155, "epoch": 3881} {"train_loss": -25.79871940612793, "global_step": 322156, "epoch": 3881} {"train_loss": -25.861509323120117, "global_step": 322157, "epoch": 3881} {"train_loss": -25.901823043823242, "global_step": 322158, "epoch": 3881} {"train_loss": -26.113361358642578, "global_step": 322159, "epoch": 3881} {"train_loss": -26.0939998626709, "global_step": 322160, "epoch": 3881} {"train_loss": -26.160781860351562, "global_step": 322161, "epoch": 3881} {"train_loss": -25.81117057800293, "global_step": 322162, "epoch": 3881} {"train_loss": -26.130054473876953, "global_step": 322163, "epoch": 3881} {"train_loss": -25.80031394958496, "global_step": 322164, "epoch": 3881} {"train_loss": -25.649377822875977, "global_step": 322165, "epoch": 3881} {"train_loss": -25.855600357055664, "global_step": 322166, "epoch": 3881} {"train_loss": -26.03125, "global_step": 322167, "epoch": 3881} {"train_loss": -26.072513580322266, "global_step": 322168, "epoch": 3881} {"train_loss": -26.065082550048828, "global_step": 322169, "epoch": 3881} {"train_loss": -25.879058837890625, "global_step": 322170, "epoch": 3881} {"train_loss": -25.763126373291016, "global_step": 322171, "epoch": 3881} {"train_loss": -26.08331298828125, "global_step": 322172, "epoch": 3881} {"train_loss": -26.189443588256836, "global_step": 322173, "epoch": 3881} {"train_loss": -25.893850326538086, "global_step": 322174, "epoch": 3881} {"train_loss": -25.943647384643555, "global_step": 322175, "epoch": 3881} {"train_loss": -26.0195369720459, "global_step": 322176, "epoch": 3881} {"train_loss": -25.910978317260742, "global_step": 322177, "epoch": 3881} {"train_loss": -26.15252113342285, "global_step": 322178, "epoch": 3881} {"train_loss": -25.767810821533203, "global_step": 322179, "epoch": 3881} {"train_loss": -25.876361846923828, "global_step": 322180, "epoch": 3881} {"train_loss": -26.252613067626953, "global_step": 322181, "epoch": 3881} {"train_loss": -26.264860153198242, "global_step": 322182, "epoch": 3881} {"train_loss": -26.017444610595703, "global_step": 322183, "epoch": 3881} {"train_loss": -25.75324821472168, "global_step": 322184, "epoch": 3881} {"train_loss": -25.6699275970459, "global_step": 322185, "epoch": 3881} {"train_loss": -25.77723503112793, "global_step": 322186, "epoch": 3881} {"train_loss": -26.112289428710938, "global_step": 322187, "epoch": 3881} {"train_loss": -25.639699935913086, "global_step": 322188, "epoch": 3881} {"train_loss": -26.011798858642578, "global_step": 322189, "epoch": 3881} {"train_loss": -25.53260612487793, "global_step": 322190, "epoch": 3881} {"train_loss": -25.742633819580078, "global_step": 322191, "epoch": 3881} {"train_loss": -25.803314208984375, "global_step": 322192, "epoch": 3881} {"train_loss": -26.003503799438477, "global_step": 322193, "epoch": 3881} {"train_loss": -25.752897262573242, "global_step": 322194, "epoch": 3881} {"train_loss": -25.912778854370117, "global_step": 322195, "epoch": 3881} {"train_loss": -25.671833038330078, "global_step": 322196, "epoch": 3881} {"train_loss": -26.225217819213867, "global_step": 322197, "epoch": 3881} {"train_loss": -25.6981258392334, "global_step": 322198, "epoch": 3881} {"train_loss": -25.72733497619629, "global_step": 322199, "epoch": 3881} {"train_loss": -26.109149932861328, "global_step": 322200, "epoch": 3881} {"train_loss": -25.785160064697266, "global_step": 322201, "epoch": 3881} {"train_loss": -25.752120971679688, "global_step": 322202, "epoch": 3881} {"train_loss": -25.511722564697266, "global_step": 322203, "epoch": 3881} {"train_loss": -26.048450469970703, "global_step": 322204, "epoch": 3881} {"train_loss": -25.774680631706513, "global_step": 322205, "epoch": 3881, "val_loss": 7242866.0} {"train_loss": -25.621784210205078, "global_step": 322206, "epoch": 3882} {"train_loss": -25.065126419067383, "global_step": 322207, "epoch": 3882} {"train_loss": -24.760622024536133, "global_step": 322208, "epoch": 3882} {"train_loss": -25.41884994506836, "global_step": 322209, "epoch": 3882} {"train_loss": -25.437463760375977, "global_step": 322210, "epoch": 3882} {"train_loss": -25.676040649414062, "global_step": 322211, "epoch": 3882} {"train_loss": -25.08563804626465, "global_step": 322212, "epoch": 3882} {"train_loss": -25.780115127563477, "global_step": 322213, "epoch": 3882} {"train_loss": -25.299148559570312, "global_step": 322214, "epoch": 3882} {"train_loss": -25.754453659057617, "global_step": 322215, "epoch": 3882} {"train_loss": -25.970245361328125, "global_step": 322216, "epoch": 3882} {"train_loss": -25.69724464416504, "global_step": 322217, "epoch": 3882} {"train_loss": -25.868946075439453, "global_step": 322218, "epoch": 3882} {"train_loss": -25.58358383178711, "global_step": 322219, "epoch": 3882} {"train_loss": -26.00190544128418, "global_step": 322220, "epoch": 3882} {"train_loss": -25.45865821838379, "global_step": 322221, "epoch": 3882} {"train_loss": -25.581146240234375, "global_step": 322222, "epoch": 3882} {"train_loss": -25.720975875854492, "global_step": 322223, "epoch": 3882} {"train_loss": -26.1497859954834, "global_step": 322224, "epoch": 3882} {"train_loss": -25.740869522094727, "global_step": 322225, "epoch": 3882} {"train_loss": -25.898862838745117, "global_step": 322226, "epoch": 3882} {"train_loss": -26.243000030517578, "global_step": 322227, "epoch": 3882} {"train_loss": -25.822498321533203, "global_step": 322228, "epoch": 3882} {"train_loss": -25.8181095123291, "global_step": 322229, "epoch": 3882} {"train_loss": -26.042407989501953, "global_step": 322230, "epoch": 3882} {"train_loss": -25.632205963134766, "global_step": 322231, "epoch": 3882} {"train_loss": -25.935260772705078, "global_step": 322232, "epoch": 3882} {"train_loss": -25.65513038635254, "global_step": 322233, "epoch": 3882} {"train_loss": -25.898908615112305, "global_step": 322234, "epoch": 3882} {"train_loss": -26.017969131469727, "global_step": 322235, "epoch": 3882} {"train_loss": -26.29593849182129, "global_step": 322236, "epoch": 3882} {"train_loss": -25.938873291015625, "global_step": 322237, "epoch": 3882} {"train_loss": -26.292993545532227, "global_step": 322238, "epoch": 3882} {"train_loss": -26.051977157592773, "global_step": 322239, "epoch": 3882} {"train_loss": -26.031164169311523, "global_step": 322240, "epoch": 3882} {"train_loss": -25.795780181884766, "global_step": 322241, "epoch": 3882} {"train_loss": -25.59052085876465, "global_step": 322242, "epoch": 3882} {"train_loss": -25.393888473510742, "global_step": 322243, "epoch": 3882} {"train_loss": -25.276601791381836, "global_step": 322244, "epoch": 3882} {"train_loss": -25.883563995361328, "global_step": 322245, "epoch": 3882} {"train_loss": -25.69855308532715, "global_step": 322246, "epoch": 3882} {"train_loss": -25.06561279296875, "global_step": 322247, "epoch": 3882} {"train_loss": -24.463714599609375, "global_step": 322248, "epoch": 3882} {"train_loss": -25.642292022705078, "global_step": 322249, "epoch": 3882} {"train_loss": -25.449289321899414, "global_step": 322250, "epoch": 3882} {"train_loss": -25.319623947143555, "global_step": 322251, "epoch": 3882} {"train_loss": -25.39802360534668, "global_step": 322252, "epoch": 3882} {"train_loss": -25.45021629333496, "global_step": 322253, "epoch": 3882} {"train_loss": -25.626361846923828, "global_step": 322254, "epoch": 3882} {"train_loss": -25.119680404663086, "global_step": 322255, "epoch": 3882} {"train_loss": -25.48529624938965, "global_step": 322256, "epoch": 3882} {"train_loss": -25.803842544555664, "global_step": 322257, "epoch": 3882} {"train_loss": -25.572792053222656, "global_step": 322258, "epoch": 3882} {"train_loss": -25.758588790893555, "global_step": 322259, "epoch": 3882} {"train_loss": -25.76625633239746, "global_step": 322260, "epoch": 3882} {"train_loss": -25.662235260009766, "global_step": 322261, "epoch": 3882} {"train_loss": -25.538314819335938, "global_step": 322262, "epoch": 3882} {"train_loss": -25.617816925048828, "global_step": 322263, "epoch": 3882} {"train_loss": -25.281553268432617, "global_step": 322264, "epoch": 3882} {"train_loss": -25.402502059936523, "global_step": 322265, "epoch": 3882} {"train_loss": -25.42093849182129, "global_step": 322266, "epoch": 3882} {"train_loss": -25.587020874023438, "global_step": 322267, "epoch": 3882} {"train_loss": -25.444421768188477, "global_step": 322268, "epoch": 3882} {"train_loss": -25.604324340820312, "global_step": 322269, "epoch": 3882} {"train_loss": -25.9879093170166, "global_step": 322270, "epoch": 3882} {"train_loss": -26.04498291015625, "global_step": 322271, "epoch": 3882} {"train_loss": -25.59209632873535, "global_step": 322272, "epoch": 3882} {"train_loss": -26.328088760375977, "global_step": 322273, "epoch": 3882} {"train_loss": -26.244482040405273, "global_step": 322274, "epoch": 3882} {"train_loss": -25.84321403503418, "global_step": 322275, "epoch": 3882} {"train_loss": -25.88724708557129, "global_step": 322276, "epoch": 3882} {"train_loss": -25.95098876953125, "global_step": 322277, "epoch": 3882} {"train_loss": -26.153528213500977, "global_step": 322278, "epoch": 3882} {"train_loss": -25.817731857299805, "global_step": 322279, "epoch": 3882} {"train_loss": -25.973058700561523, "global_step": 322280, "epoch": 3882} {"train_loss": -25.768512725830078, "global_step": 322281, "epoch": 3882} {"train_loss": -25.939136505126953, "global_step": 322282, "epoch": 3882} {"train_loss": -25.938953399658203, "global_step": 322283, "epoch": 3882} {"train_loss": -26.097564697265625, "global_step": 322284, "epoch": 3882} {"train_loss": -26.108556747436523, "global_step": 322285, "epoch": 3882} {"train_loss": -25.867599487304688, "global_step": 322286, "epoch": 3882} {"train_loss": -25.85150146484375, "global_step": 322287, "epoch": 3882} {"train_loss": -25.70104739177658, "global_step": 322288, "epoch": 3882, "val_loss": 7137747.0} {"train_loss": -25.57867431640625, "global_step": 322289, "epoch": 3883} {"train_loss": -25.51314353942871, "global_step": 322290, "epoch": 3883} {"train_loss": -25.180953979492188, "global_step": 322291, "epoch": 3883} {"train_loss": -24.636838912963867, "global_step": 322292, "epoch": 3883} {"train_loss": -24.58858299255371, "global_step": 322293, "epoch": 3883} {"train_loss": -25.1846981048584, "global_step": 322294, "epoch": 3883} {"train_loss": -25.476394653320312, "global_step": 322295, "epoch": 3883} {"train_loss": -24.8848934173584, "global_step": 322296, "epoch": 3883} {"train_loss": -25.56511878967285, "global_step": 322297, "epoch": 3883} {"train_loss": -25.467679977416992, "global_step": 322298, "epoch": 3883} {"train_loss": -25.506620407104492, "global_step": 322299, "epoch": 3883} {"train_loss": -25.388151168823242, "global_step": 322300, "epoch": 3883} {"train_loss": -25.289573669433594, "global_step": 322301, "epoch": 3883} {"train_loss": -25.014774322509766, "global_step": 322302, "epoch": 3883} {"train_loss": -25.07761001586914, "global_step": 322303, "epoch": 3883} {"train_loss": -25.23445701599121, "global_step": 322304, "epoch": 3883} {"train_loss": -25.345426559448242, "global_step": 322305, "epoch": 3883} {"train_loss": -25.40822410583496, "global_step": 322306, "epoch": 3883} {"train_loss": -25.51014518737793, "global_step": 322307, "epoch": 3883} {"train_loss": -25.682037353515625, "global_step": 322308, "epoch": 3883} {"train_loss": -25.858585357666016, "global_step": 322309, "epoch": 3883} {"train_loss": -26.07546043395996, "global_step": 322310, "epoch": 3883} {"train_loss": -25.775598526000977, "global_step": 322311, "epoch": 3883} {"train_loss": -26.060312271118164, "global_step": 322312, "epoch": 3883} {"train_loss": -25.368946075439453, "global_step": 322313, "epoch": 3883} {"train_loss": -25.68861198425293, "global_step": 322314, "epoch": 3883} {"train_loss": -25.807947158813477, "global_step": 322315, "epoch": 3883} {"train_loss": -25.9281005859375, "global_step": 322316, "epoch": 3883} {"train_loss": -25.814376831054688, "global_step": 322317, "epoch": 3883} {"train_loss": -25.896371841430664, "global_step": 322318, "epoch": 3883} {"train_loss": -25.725881576538086, "global_step": 322319, "epoch": 3883} {"train_loss": -25.50334930419922, "global_step": 322320, "epoch": 3883} {"train_loss": -25.89002799987793, "global_step": 322321, "epoch": 3883} {"train_loss": -25.81501579284668, "global_step": 322322, "epoch": 3883} {"train_loss": -25.90229606628418, "global_step": 322323, "epoch": 3883} {"train_loss": -25.87702751159668, "global_step": 322324, "epoch": 3883} {"train_loss": -25.798742294311523, "global_step": 322325, "epoch": 3883} {"train_loss": -26.090576171875, "global_step": 322326, "epoch": 3883} {"train_loss": -26.072879791259766, "global_step": 322327, "epoch": 3883} {"train_loss": -26.20432472229004, "global_step": 322328, "epoch": 3883} {"train_loss": -25.794763565063477, "global_step": 322329, "epoch": 3883} {"train_loss": -25.79566764831543, "global_step": 322330, "epoch": 3883} {"train_loss": -25.479394912719727, "global_step": 322331, "epoch": 3883} {"train_loss": -25.442060470581055, "global_step": 322332, "epoch": 3883} {"train_loss": -25.427595138549805, "global_step": 322333, "epoch": 3883} {"train_loss": -26.05047035217285, "global_step": 322334, "epoch": 3883} {"train_loss": -25.75958251953125, "global_step": 322335, "epoch": 3883} {"train_loss": -25.817890167236328, "global_step": 322336, "epoch": 3883} {"train_loss": -26.119251251220703, "global_step": 322337, "epoch": 3883} {"train_loss": -25.853803634643555, "global_step": 322338, "epoch": 3883} {"train_loss": -25.816436767578125, "global_step": 322339, "epoch": 3883} {"train_loss": -25.968915939331055, "global_step": 322340, "epoch": 3883} {"train_loss": -25.802478790283203, "global_step": 322341, "epoch": 3883} {"train_loss": -25.511104583740234, "global_step": 322342, "epoch": 3883} {"train_loss": -25.744897842407227, "global_step": 322343, "epoch": 3883} {"train_loss": -25.93281364440918, "global_step": 322344, "epoch": 3883} {"train_loss": -26.267318725585938, "global_step": 322345, "epoch": 3883} {"train_loss": -25.47205924987793, "global_step": 322346, "epoch": 3883} {"train_loss": -26.095172882080078, "global_step": 322347, "epoch": 3883} {"train_loss": -25.623767852783203, "global_step": 322348, "epoch": 3883} {"train_loss": -26.362783432006836, "global_step": 322349, "epoch": 3883} {"train_loss": -26.0572509765625, "global_step": 322350, "epoch": 3883} {"train_loss": -25.90329933166504, "global_step": 322351, "epoch": 3883} {"train_loss": -26.121740341186523, "global_step": 322352, "epoch": 3883} {"train_loss": -26.045190811157227, "global_step": 322353, "epoch": 3883} {"train_loss": -25.7126407623291, "global_step": 322354, "epoch": 3883} {"train_loss": -25.99655532836914, "global_step": 322355, "epoch": 3883} {"train_loss": -25.99042320251465, "global_step": 322356, "epoch": 3883} {"train_loss": -25.913822174072266, "global_step": 322357, "epoch": 3883} {"train_loss": -25.73731803894043, "global_step": 322358, "epoch": 3883} {"train_loss": -25.51122283935547, "global_step": 322359, "epoch": 3883} {"train_loss": -25.856842041015625, "global_step": 322360, "epoch": 3883} {"train_loss": -26.022680282592773, "global_step": 322361, "epoch": 3883} {"train_loss": -25.81145668029785, "global_step": 322362, "epoch": 3883} {"train_loss": -25.206897735595703, "global_step": 322363, "epoch": 3883} {"train_loss": -25.515432357788086, "global_step": 322364, "epoch": 3883} {"train_loss": -25.6130313873291, "global_step": 322365, "epoch": 3883} {"train_loss": -25.238235473632812, "global_step": 322366, "epoch": 3883} {"train_loss": -25.461585998535156, "global_step": 322367, "epoch": 3883} {"train_loss": -25.55485725402832, "global_step": 322368, "epoch": 3883} {"train_loss": -26.294513702392578, "global_step": 322369, "epoch": 3883} {"train_loss": -25.592588424682617, "global_step": 322370, "epoch": 3883} {"train_loss": -25.689818738454797, "global_step": 322371, "epoch": 3883, "val_loss": 7237523.0} {"train_loss": -25.144521713256836, "global_step": 322372, "epoch": 3884} {"train_loss": -25.64347267150879, "global_step": 322373, "epoch": 3884} {"train_loss": -25.233625411987305, "global_step": 322374, "epoch": 3884} {"train_loss": -25.684667587280273, "global_step": 322375, "epoch": 3884} {"train_loss": -24.904075622558594, "global_step": 322376, "epoch": 3884} {"train_loss": -25.92121696472168, "global_step": 322377, "epoch": 3884} {"train_loss": -25.7779598236084, "global_step": 322378, "epoch": 3884} {"train_loss": -25.718006134033203, "global_step": 322379, "epoch": 3884} {"train_loss": -25.780664443969727, "global_step": 322380, "epoch": 3884} {"train_loss": -25.6853084564209, "global_step": 322381, "epoch": 3884} {"train_loss": -25.67624282836914, "global_step": 322382, "epoch": 3884} {"train_loss": -25.83439064025879, "global_step": 322383, "epoch": 3884} {"train_loss": -25.912769317626953, "global_step": 322384, "epoch": 3884} {"train_loss": -25.606510162353516, "global_step": 322385, "epoch": 3884} {"train_loss": -25.48344612121582, "global_step": 322386, "epoch": 3884} {"train_loss": -26.094955444335938, "global_step": 322387, "epoch": 3884} {"train_loss": -25.631580352783203, "global_step": 322388, "epoch": 3884} {"train_loss": -26.349075317382812, "global_step": 322389, "epoch": 3884} {"train_loss": -25.774755477905273, "global_step": 322390, "epoch": 3884} {"train_loss": -25.493961334228516, "global_step": 322391, "epoch": 3884} {"train_loss": -25.868677139282227, "global_step": 322392, "epoch": 3884} {"train_loss": -25.606815338134766, "global_step": 322393, "epoch": 3884} {"train_loss": -26.0472354888916, "global_step": 322394, "epoch": 3884} {"train_loss": -25.98538589477539, "global_step": 322395, "epoch": 3884} {"train_loss": -25.90286636352539, "global_step": 322396, "epoch": 3884} {"train_loss": -25.79127311706543, "global_step": 322397, "epoch": 3884} {"train_loss": -26.1387882232666, "global_step": 322398, "epoch": 3884} {"train_loss": -25.840301513671875, "global_step": 322399, "epoch": 3884} {"train_loss": -26.231769561767578, "global_step": 322400, "epoch": 3884} {"train_loss": -26.113880157470703, "global_step": 322401, "epoch": 3884} {"train_loss": -25.8718204498291, "global_step": 322402, "epoch": 3884} {"train_loss": -25.57370376586914, "global_step": 322403, "epoch": 3884} {"train_loss": -25.901203155517578, "global_step": 322404, "epoch": 3884} {"train_loss": -25.821430206298828, "global_step": 322405, "epoch": 3884} {"train_loss": -26.057348251342773, "global_step": 322406, "epoch": 3884} {"train_loss": -26.215702056884766, "global_step": 322407, "epoch": 3884} {"train_loss": -26.186609268188477, "global_step": 322408, "epoch": 3884} {"train_loss": -25.9765682220459, "global_step": 322409, "epoch": 3884} {"train_loss": -26.27524185180664, "global_step": 322410, "epoch": 3884} {"train_loss": -26.01617431640625, "global_step": 322411, "epoch": 3884} {"train_loss": -25.86044692993164, "global_step": 322412, "epoch": 3884} {"train_loss": -25.52461051940918, "global_step": 322413, "epoch": 3884} {"train_loss": -25.74574851989746, "global_step": 322414, "epoch": 3884} {"train_loss": -25.495277404785156, "global_step": 322415, "epoch": 3884} {"train_loss": -25.506467819213867, "global_step": 322416, "epoch": 3884} {"train_loss": -25.569913864135742, "global_step": 322417, "epoch": 3884} {"train_loss": -25.905054092407227, "global_step": 322418, "epoch": 3884} {"train_loss": -25.980939865112305, "global_step": 322419, "epoch": 3884} {"train_loss": -25.692413330078125, "global_step": 322420, "epoch": 3884} {"train_loss": -25.656265258789062, "global_step": 322421, "epoch": 3884} {"train_loss": -25.808561325073242, "global_step": 322422, "epoch": 3884} {"train_loss": -25.386245727539062, "global_step": 322423, "epoch": 3884} {"train_loss": -25.422027587890625, "global_step": 322424, "epoch": 3884} {"train_loss": -25.834232330322266, "global_step": 322425, "epoch": 3884} {"train_loss": -25.297414779663086, "global_step": 322426, "epoch": 3884} {"train_loss": -26.070178985595703, "global_step": 322427, "epoch": 3884} {"train_loss": -26.0931396484375, "global_step": 322428, "epoch": 3884} {"train_loss": -25.731307983398438, "global_step": 322429, "epoch": 3884} {"train_loss": -25.973108291625977, "global_step": 322430, "epoch": 3884} {"train_loss": -25.87411880493164, "global_step": 322431, "epoch": 3884} {"train_loss": -26.08806800842285, "global_step": 322432, "epoch": 3884} {"train_loss": -25.528606414794922, "global_step": 322433, "epoch": 3884} {"train_loss": -25.7620792388916, "global_step": 322434, "epoch": 3884} {"train_loss": -25.891096115112305, "global_step": 322435, "epoch": 3884} {"train_loss": -25.751428604125977, "global_step": 322436, "epoch": 3884} {"train_loss": -26.076074600219727, "global_step": 322437, "epoch": 3884} {"train_loss": -25.56161880493164, "global_step": 322438, "epoch": 3884} {"train_loss": -26.204435348510742, "global_step": 322439, "epoch": 3884} {"train_loss": -25.801443099975586, "global_step": 322440, "epoch": 3884} {"train_loss": -25.864471435546875, "global_step": 322441, "epoch": 3884} {"train_loss": -25.78653907775879, "global_step": 322442, "epoch": 3884} {"train_loss": -26.13335609436035, "global_step": 322443, "epoch": 3884} {"train_loss": -25.92081069946289, "global_step": 322444, "epoch": 3884} {"train_loss": -25.996923446655273, "global_step": 322445, "epoch": 3884} {"train_loss": -25.842025756835938, "global_step": 322446, "epoch": 3884} {"train_loss": -25.892852783203125, "global_step": 322447, "epoch": 3884} {"train_loss": -26.249963760375977, "global_step": 322448, "epoch": 3884} {"train_loss": -25.689559936523438, "global_step": 322449, "epoch": 3884} {"train_loss": -25.98762321472168, "global_step": 322450, "epoch": 3884} {"train_loss": -25.712987899780273, "global_step": 322451, "epoch": 3884} {"train_loss": -25.954254150390625, "global_step": 322452, "epoch": 3884} {"train_loss": -25.717178344726562, "global_step": 322453, "epoch": 3884} {"train_loss": -25.83104855181223, "global_step": 322454, "epoch": 3884, "val_loss": 7182722.0} {"train_loss": -24.46074676513672, "global_step": 322455, "epoch": 3885} {"train_loss": -24.53757095336914, "global_step": 322456, "epoch": 3885} {"train_loss": -24.719839096069336, "global_step": 322457, "epoch": 3885} {"train_loss": -24.19881820678711, "global_step": 322458, "epoch": 3885} {"train_loss": -25.946088790893555, "global_step": 322459, "epoch": 3885} {"train_loss": -24.58760643005371, "global_step": 322460, "epoch": 3885} {"train_loss": -25.676773071289062, "global_step": 322461, "epoch": 3885} {"train_loss": -24.683774948120117, "global_step": 322462, "epoch": 3885} {"train_loss": -25.024280548095703, "global_step": 322463, "epoch": 3885} {"train_loss": -25.1458797454834, "global_step": 322464, "epoch": 3885} {"train_loss": -24.891733169555664, "global_step": 322465, "epoch": 3885} {"train_loss": -25.537208557128906, "global_step": 322466, "epoch": 3885} {"train_loss": -25.257963180541992, "global_step": 322467, "epoch": 3885} {"train_loss": -25.241300582885742, "global_step": 322468, "epoch": 3885} {"train_loss": -25.638891220092773, "global_step": 322469, "epoch": 3885} {"train_loss": -25.365087509155273, "global_step": 322470, "epoch": 3885} {"train_loss": -25.418468475341797, "global_step": 322471, "epoch": 3885} {"train_loss": -25.56941032409668, "global_step": 322472, "epoch": 3885} {"train_loss": -25.668012619018555, "global_step": 322473, "epoch": 3885} {"train_loss": -25.668231964111328, "global_step": 322474, "epoch": 3885} {"train_loss": -25.32845115661621, "global_step": 322475, "epoch": 3885} {"train_loss": -25.63532066345215, "global_step": 322476, "epoch": 3885} {"train_loss": -25.7218017578125, "global_step": 322477, "epoch": 3885} {"train_loss": -25.517444610595703, "global_step": 322478, "epoch": 3885} {"train_loss": -25.574630737304688, "global_step": 322479, "epoch": 3885} {"train_loss": -25.74102783203125, "global_step": 322480, "epoch": 3885} {"train_loss": -25.44063949584961, "global_step": 322481, "epoch": 3885} {"train_loss": -25.6021671295166, "global_step": 322482, "epoch": 3885} {"train_loss": -25.91559410095215, "global_step": 322483, "epoch": 3885} {"train_loss": -25.873931884765625, "global_step": 322484, "epoch": 3885} {"train_loss": -25.649221420288086, "global_step": 322485, "epoch": 3885} {"train_loss": -26.134862899780273, "global_step": 322486, "epoch": 3885} {"train_loss": -25.67255210876465, "global_step": 322487, "epoch": 3885} {"train_loss": -26.0330867767334, "global_step": 322488, "epoch": 3885} {"train_loss": -25.822980880737305, "global_step": 322489, "epoch": 3885} {"train_loss": -25.619754791259766, "global_step": 322490, "epoch": 3885} {"train_loss": -25.801061630249023, "global_step": 322491, "epoch": 3885} {"train_loss": -25.479890823364258, "global_step": 322492, "epoch": 3885} {"train_loss": -26.199064254760742, "global_step": 322493, "epoch": 3885} {"train_loss": -25.185848236083984, "global_step": 322494, "epoch": 3885} {"train_loss": -25.75555419921875, "global_step": 322495, "epoch": 3885} {"train_loss": -25.720258712768555, "global_step": 322496, "epoch": 3885} {"train_loss": -25.811664581298828, "global_step": 322497, "epoch": 3885} {"train_loss": -25.655078887939453, "global_step": 322498, "epoch": 3885} {"train_loss": -25.525684356689453, "global_step": 322499, "epoch": 3885} {"train_loss": -25.901081085205078, "global_step": 322500, "epoch": 3885} {"train_loss": -25.981542587280273, "global_step": 322501, "epoch": 3885} {"train_loss": -25.63789176940918, "global_step": 322502, "epoch": 3885} {"train_loss": -25.808313369750977, "global_step": 322503, "epoch": 3885} {"train_loss": -25.527814865112305, "global_step": 322504, "epoch": 3885} {"train_loss": -25.660083770751953, "global_step": 322505, "epoch": 3885} {"train_loss": -25.641468048095703, "global_step": 322506, "epoch": 3885} {"train_loss": -25.558279037475586, "global_step": 322507, "epoch": 3885} {"train_loss": -25.91036033630371, "global_step": 322508, "epoch": 3885} {"train_loss": -26.150074005126953, "global_step": 322509, "epoch": 3885} {"train_loss": -26.027545928955078, "global_step": 322510, "epoch": 3885} {"train_loss": -25.923221588134766, "global_step": 322511, "epoch": 3885} {"train_loss": -25.5185604095459, "global_step": 322512, "epoch": 3885} {"train_loss": -25.7492618560791, "global_step": 322513, "epoch": 3885} {"train_loss": -25.742050170898438, "global_step": 322514, "epoch": 3885} {"train_loss": -25.97748374938965, "global_step": 322515, "epoch": 3885} {"train_loss": -25.85919189453125, "global_step": 322516, "epoch": 3885} {"train_loss": -25.969696044921875, "global_step": 322517, "epoch": 3885} {"train_loss": -26.067352294921875, "global_step": 322518, "epoch": 3885} {"train_loss": -25.955493927001953, "global_step": 322519, "epoch": 3885} {"train_loss": -25.783843994140625, "global_step": 322520, "epoch": 3885} {"train_loss": -25.804901123046875, "global_step": 322521, "epoch": 3885} {"train_loss": -25.319059371948242, "global_step": 322522, "epoch": 3885} {"train_loss": -25.55573844909668, "global_step": 322523, "epoch": 3885} {"train_loss": -25.75531578063965, "global_step": 322524, "epoch": 3885} {"train_loss": -25.740758895874023, "global_step": 322525, "epoch": 3885} {"train_loss": -25.519880294799805, "global_step": 322526, "epoch": 3885} {"train_loss": -25.563993453979492, "global_step": 322527, "epoch": 3885} {"train_loss": -26.069822311401367, "global_step": 322528, "epoch": 3885} {"train_loss": -25.52834129333496, "global_step": 322529, "epoch": 3885} {"train_loss": -25.880273818969727, "global_step": 322530, "epoch": 3885} {"train_loss": -25.777984619140625, "global_step": 322531, "epoch": 3885} {"train_loss": -26.231231689453125, "global_step": 322532, "epoch": 3885} {"train_loss": -25.71095085144043, "global_step": 322533, "epoch": 3885} {"train_loss": -25.9698486328125, "global_step": 322534, "epoch": 3885} {"train_loss": -25.960895538330078, "global_step": 322535, "epoch": 3885} {"train_loss": -25.87188148498535, "global_step": 322536, "epoch": 3885} {"train_loss": -25.616288954953113, "global_step": 322537, "epoch": 3885, "val_loss": 7318026.0} {"train_loss": -24.935102462768555, "global_step": 322538, "epoch": 3886} {"train_loss": -24.91192626953125, "global_step": 322539, "epoch": 3886} {"train_loss": -25.26009178161621, "global_step": 322540, "epoch": 3886} {"train_loss": -25.70734214782715, "global_step": 322541, "epoch": 3886} {"train_loss": -24.887407302856445, "global_step": 322542, "epoch": 3886} {"train_loss": -25.461421966552734, "global_step": 322543, "epoch": 3886} {"train_loss": -24.545774459838867, "global_step": 322544, "epoch": 3886} {"train_loss": -25.39426040649414, "global_step": 322545, "epoch": 3886} {"train_loss": -25.343975067138672, "global_step": 322546, "epoch": 3886} {"train_loss": -25.406539916992188, "global_step": 322547, "epoch": 3886} {"train_loss": -25.247711181640625, "global_step": 322548, "epoch": 3886} {"train_loss": -25.387042999267578, "global_step": 322549, "epoch": 3886} {"train_loss": -25.41594123840332, "global_step": 322550, "epoch": 3886} {"train_loss": -25.311561584472656, "global_step": 322551, "epoch": 3886} {"train_loss": -25.36067771911621, "global_step": 322552, "epoch": 3886} {"train_loss": -25.497472763061523, "global_step": 322553, "epoch": 3886} {"train_loss": -25.528440475463867, "global_step": 322554, "epoch": 3886} {"train_loss": -25.6765193939209, "global_step": 322555, "epoch": 3886} {"train_loss": -25.512435913085938, "global_step": 322556, "epoch": 3886} {"train_loss": -25.434995651245117, "global_step": 322557, "epoch": 3886} {"train_loss": -25.477462768554688, "global_step": 322558, "epoch": 3886} {"train_loss": -25.292207717895508, "global_step": 322559, "epoch": 3886} {"train_loss": -25.842620849609375, "global_step": 322560, "epoch": 3886} {"train_loss": -25.38856315612793, "global_step": 322561, "epoch": 3886} {"train_loss": -25.624160766601562, "global_step": 322562, "epoch": 3886} {"train_loss": -25.8172607421875, "global_step": 322563, "epoch": 3886} {"train_loss": -25.818939208984375, "global_step": 322564, "epoch": 3886} {"train_loss": -25.805557250976562, "global_step": 322565, "epoch": 3886} {"train_loss": -25.675403594970703, "global_step": 322566, "epoch": 3886} {"train_loss": -25.590635299682617, "global_step": 322567, "epoch": 3886} {"train_loss": -25.758386611938477, "global_step": 322568, "epoch": 3886} {"train_loss": -25.507644653320312, "global_step": 322569, "epoch": 3886} {"train_loss": -25.888519287109375, "global_step": 322570, "epoch": 3886} {"train_loss": -25.703327178955078, "global_step": 322571, "epoch": 3886} {"train_loss": -25.45865249633789, "global_step": 322572, "epoch": 3886} {"train_loss": -25.7828369140625, "global_step": 322573, "epoch": 3886} {"train_loss": -25.58884620666504, "global_step": 322574, "epoch": 3886} {"train_loss": -26.262653350830078, "global_step": 322575, "epoch": 3886} {"train_loss": -25.677717208862305, "global_step": 322576, "epoch": 3886} {"train_loss": -26.048044204711914, "global_step": 322577, "epoch": 3886} {"train_loss": -25.830060958862305, "global_step": 322578, "epoch": 3886} {"train_loss": -25.79596519470215, "global_step": 322579, "epoch": 3886} {"train_loss": -25.865768432617188, "global_step": 322580, "epoch": 3886} {"train_loss": -25.985382080078125, "global_step": 322581, "epoch": 3886} {"train_loss": -25.779577255249023, "global_step": 322582, "epoch": 3886} {"train_loss": -25.551477432250977, "global_step": 322583, "epoch": 3886} {"train_loss": -26.206811904907227, "global_step": 322584, "epoch": 3886} {"train_loss": -25.50250816345215, "global_step": 322585, "epoch": 3886} {"train_loss": -26.014755249023438, "global_step": 322586, "epoch": 3886} {"train_loss": -25.77292251586914, "global_step": 322587, "epoch": 3886} {"train_loss": -25.855215072631836, "global_step": 322588, "epoch": 3886} {"train_loss": -25.624719619750977, "global_step": 322589, "epoch": 3886} {"train_loss": -25.80156898498535, "global_step": 322590, "epoch": 3886} {"train_loss": -26.077850341796875, "global_step": 322591, "epoch": 3886} {"train_loss": -26.07215690612793, "global_step": 322592, "epoch": 3886} {"train_loss": -26.171966552734375, "global_step": 322593, "epoch": 3886} {"train_loss": -25.882659912109375, "global_step": 322594, "epoch": 3886} {"train_loss": -25.929380416870117, "global_step": 322595, "epoch": 3886} {"train_loss": -26.133237838745117, "global_step": 322596, "epoch": 3886} {"train_loss": -25.827096939086914, "global_step": 322597, "epoch": 3886} {"train_loss": -25.915979385375977, "global_step": 322598, "epoch": 3886} {"train_loss": -26.097537994384766, "global_step": 322599, "epoch": 3886} {"train_loss": -26.312427520751953, "global_step": 322600, "epoch": 3886} {"train_loss": -26.0505313873291, "global_step": 322601, "epoch": 3886} {"train_loss": -26.272626876831055, "global_step": 322602, "epoch": 3886} {"train_loss": -25.976675033569336, "global_step": 322603, "epoch": 3886} {"train_loss": -26.062910079956055, "global_step": 322604, "epoch": 3886} {"train_loss": -26.3109073638916, "global_step": 322605, "epoch": 3886} {"train_loss": -25.656171798706055, "global_step": 322606, "epoch": 3886} {"train_loss": -25.916229248046875, "global_step": 322607, "epoch": 3886} {"train_loss": -25.8985538482666, "global_step": 322608, "epoch": 3886} {"train_loss": -26.15394401550293, "global_step": 322609, "epoch": 3886} {"train_loss": -26.0564022064209, "global_step": 322610, "epoch": 3886} {"train_loss": -26.121692657470703, "global_step": 322611, "epoch": 3886} {"train_loss": -25.660558700561523, "global_step": 322612, "epoch": 3886} {"train_loss": -25.332048416137695, "global_step": 322613, "epoch": 3886} {"train_loss": -25.593219757080078, "global_step": 322614, "epoch": 3886} {"train_loss": -25.861286163330078, "global_step": 322615, "epoch": 3886} {"train_loss": -25.645822525024414, "global_step": 322616, "epoch": 3886} {"train_loss": -25.335895538330078, "global_step": 322617, "epoch": 3886} {"train_loss": -25.952472686767578, "global_step": 322618, "epoch": 3886} {"train_loss": -25.47195053100586, "global_step": 322619, "epoch": 3886} {"train_loss": -25.692782712269977, "global_step": 322620, "epoch": 3886, "val_loss": 7142896.0} {"train_loss": -24.37446403503418, "global_step": 322621, "epoch": 3887} {"train_loss": -23.761962890625, "global_step": 322622, "epoch": 3887} {"train_loss": -24.81683921813965, "global_step": 322623, "epoch": 3887} {"train_loss": -24.817813873291016, "global_step": 322624, "epoch": 3887} {"train_loss": -24.75753402709961, "global_step": 322625, "epoch": 3887} {"train_loss": -25.082468032836914, "global_step": 322626, "epoch": 3887} {"train_loss": -25.460105895996094, "global_step": 322627, "epoch": 3887} {"train_loss": -24.679609298706055, "global_step": 322628, "epoch": 3887} {"train_loss": -25.274717330932617, "global_step": 322629, "epoch": 3887} {"train_loss": -24.83987808227539, "global_step": 322630, "epoch": 3887} {"train_loss": -25.18717384338379, "global_step": 322631, "epoch": 3887} {"train_loss": -25.290719985961914, "global_step": 322632, "epoch": 3887} {"train_loss": -25.069074630737305, "global_step": 322633, "epoch": 3887} {"train_loss": -25.079252243041992, "global_step": 322634, "epoch": 3887} {"train_loss": -25.500919342041016, "global_step": 322635, "epoch": 3887} {"train_loss": -25.059738159179688, "global_step": 322636, "epoch": 3887} {"train_loss": -25.62918472290039, "global_step": 322637, "epoch": 3887} {"train_loss": -25.399045944213867, "global_step": 322638, "epoch": 3887} {"train_loss": -24.954612731933594, "global_step": 322639, "epoch": 3887} {"train_loss": -25.37017822265625, "global_step": 322640, "epoch": 3887} {"train_loss": -25.753690719604492, "global_step": 322641, "epoch": 3887} {"train_loss": -25.36465835571289, "global_step": 322642, "epoch": 3887} {"train_loss": -25.529592514038086, "global_step": 322643, "epoch": 3887} {"train_loss": -25.491943359375, "global_step": 322644, "epoch": 3887} {"train_loss": -25.23027992248535, "global_step": 322645, "epoch": 3887} {"train_loss": -25.471792221069336, "global_step": 322646, "epoch": 3887} {"train_loss": -25.706134796142578, "global_step": 322647, "epoch": 3887} {"train_loss": -25.481582641601562, "global_step": 322648, "epoch": 3887} {"train_loss": -25.662784576416016, "global_step": 322649, "epoch": 3887} {"train_loss": -25.401382446289062, "global_step": 322650, "epoch": 3887} {"train_loss": -25.71164894104004, "global_step": 322651, "epoch": 3887} {"train_loss": -25.36512565612793, "global_step": 322652, "epoch": 3887} {"train_loss": -25.56145668029785, "global_step": 322653, "epoch": 3887} {"train_loss": -26.19849967956543, "global_step": 322654, "epoch": 3887} {"train_loss": -25.706384658813477, "global_step": 322655, "epoch": 3887} {"train_loss": -25.684873580932617, "global_step": 322656, "epoch": 3887} {"train_loss": -25.6217098236084, "global_step": 322657, "epoch": 3887} {"train_loss": -25.741003036499023, "global_step": 322658, "epoch": 3887} {"train_loss": -25.531017303466797, "global_step": 322659, "epoch": 3887} {"train_loss": -26.0296688079834, "global_step": 322660, "epoch": 3887} {"train_loss": -25.901891708374023, "global_step": 322661, "epoch": 3887} {"train_loss": -25.890615463256836, "global_step": 322662, "epoch": 3887} {"train_loss": -25.837751388549805, "global_step": 322663, "epoch": 3887} {"train_loss": -26.153076171875, "global_step": 322664, "epoch": 3887} {"train_loss": -25.654455184936523, "global_step": 322665, "epoch": 3887} {"train_loss": -25.761560440063477, "global_step": 322666, "epoch": 3887} {"train_loss": -26.2574520111084, "global_step": 322667, "epoch": 3887} {"train_loss": -25.971216201782227, "global_step": 322668, "epoch": 3887} {"train_loss": -25.911834716796875, "global_step": 322669, "epoch": 3887} {"train_loss": -25.671478271484375, "global_step": 322670, "epoch": 3887} {"train_loss": -25.740192413330078, "global_step": 322671, "epoch": 3887} {"train_loss": -25.912933349609375, "global_step": 322672, "epoch": 3887} {"train_loss": -25.667724609375, "global_step": 322673, "epoch": 3887} {"train_loss": -25.685667037963867, "global_step": 322674, "epoch": 3887} {"train_loss": -26.1510066986084, "global_step": 322675, "epoch": 3887} {"train_loss": -25.9149112701416, "global_step": 322676, "epoch": 3887} {"train_loss": -25.78956413269043, "global_step": 322677, "epoch": 3887} {"train_loss": -25.679733276367188, "global_step": 322678, "epoch": 3887} {"train_loss": -25.79754638671875, "global_step": 322679, "epoch": 3887} {"train_loss": -25.82850456237793, "global_step": 322680, "epoch": 3887} {"train_loss": -25.822498321533203, "global_step": 322681, "epoch": 3887} {"train_loss": -25.705169677734375, "global_step": 322682, "epoch": 3887} {"train_loss": -25.657794952392578, "global_step": 322683, "epoch": 3887} {"train_loss": -26.019681930541992, "global_step": 322684, "epoch": 3887} {"train_loss": -25.945941925048828, "global_step": 322685, "epoch": 3887} {"train_loss": -25.917882919311523, "global_step": 322686, "epoch": 3887} {"train_loss": -26.463855743408203, "global_step": 322687, "epoch": 3887} {"train_loss": -26.262500762939453, "global_step": 322688, "epoch": 3887} {"train_loss": -26.007892608642578, "global_step": 322689, "epoch": 3887} {"train_loss": -26.100072860717773, "global_step": 322690, "epoch": 3887} {"train_loss": -25.950244903564453, "global_step": 322691, "epoch": 3887} {"train_loss": -26.082605361938477, "global_step": 322692, "epoch": 3887} {"train_loss": -25.942426681518555, "global_step": 322693, "epoch": 3887} {"train_loss": -25.974653244018555, "global_step": 322694, "epoch": 3887} {"train_loss": -26.123294830322266, "global_step": 322695, "epoch": 3887} {"train_loss": -25.85572624206543, "global_step": 322696, "epoch": 3887} {"train_loss": -25.675634384155273, "global_step": 322697, "epoch": 3887} {"train_loss": -25.761280059814453, "global_step": 322698, "epoch": 3887} {"train_loss": -25.635400772094727, "global_step": 322699, "epoch": 3887} {"train_loss": -26.334003448486328, "global_step": 322700, "epoch": 3887} {"train_loss": -26.20659828186035, "global_step": 322701, "epoch": 3887} {"train_loss": -26.403451919555664, "global_step": 322702, "epoch": 3887} {"train_loss": -25.631981033876716, "global_step": 322703, "epoch": 3887, "val_loss": 7191229.0} {"train_loss": -25.04059410095215, "global_step": 322704, "epoch": 3888} {"train_loss": -25.275938034057617, "global_step": 322705, "epoch": 3888} {"train_loss": -25.774505615234375, "global_step": 322706, "epoch": 3888} {"train_loss": -25.56800651550293, "global_step": 322707, "epoch": 3888} {"train_loss": -25.44949722290039, "global_step": 322708, "epoch": 3888} {"train_loss": -25.60516929626465, "global_step": 322709, "epoch": 3888} {"train_loss": -25.8735408782959, "global_step": 322710, "epoch": 3888} {"train_loss": -25.5394344329834, "global_step": 322711, "epoch": 3888} {"train_loss": -25.443649291992188, "global_step": 322712, "epoch": 3888} {"train_loss": -25.65931510925293, "global_step": 322713, "epoch": 3888} {"train_loss": -25.94476318359375, "global_step": 322714, "epoch": 3888} {"train_loss": -25.67889404296875, "global_step": 322715, "epoch": 3888} {"train_loss": -25.88372802734375, "global_step": 322716, "epoch": 3888} {"train_loss": -25.64519691467285, "global_step": 322717, "epoch": 3888} {"train_loss": -25.54719352722168, "global_step": 322718, "epoch": 3888} {"train_loss": -25.872650146484375, "global_step": 322719, "epoch": 3888} {"train_loss": -25.779163360595703, "global_step": 322720, "epoch": 3888} {"train_loss": -25.677778244018555, "global_step": 322721, "epoch": 3888} {"train_loss": -25.7365665435791, "global_step": 322722, "epoch": 3888} {"train_loss": -25.921167373657227, "global_step": 322723, "epoch": 3888} {"train_loss": -26.280088424682617, "global_step": 322724, "epoch": 3888} {"train_loss": -26.205860137939453, "global_step": 322725, "epoch": 3888} {"train_loss": -25.752721786499023, "global_step": 322726, "epoch": 3888} {"train_loss": -26.049488067626953, "global_step": 322727, "epoch": 3888} {"train_loss": -26.1236515045166, "global_step": 322728, "epoch": 3888} {"train_loss": -26.056732177734375, "global_step": 322729, "epoch": 3888} {"train_loss": -25.866941452026367, "global_step": 322730, "epoch": 3888} {"train_loss": -26.09286880493164, "global_step": 322731, "epoch": 3888} {"train_loss": -26.107099533081055, "global_step": 322732, "epoch": 3888} {"train_loss": -25.862594604492188, "global_step": 322733, "epoch": 3888} {"train_loss": -26.005878448486328, "global_step": 322734, "epoch": 3888} {"train_loss": -26.077871322631836, "global_step": 322735, "epoch": 3888} {"train_loss": -26.113340377807617, "global_step": 322736, "epoch": 3888} {"train_loss": -26.27316665649414, "global_step": 322737, "epoch": 3888} {"train_loss": -25.6376895904541, "global_step": 322738, "epoch": 3888} {"train_loss": -25.827960968017578, "global_step": 322739, "epoch": 3888} {"train_loss": -25.922513961791992, "global_step": 322740, "epoch": 3888} {"train_loss": -25.87418556213379, "global_step": 322741, "epoch": 3888} {"train_loss": -25.645307540893555, "global_step": 322742, "epoch": 3888} {"train_loss": -25.549657821655273, "global_step": 322743, "epoch": 3888} {"train_loss": -25.795621871948242, "global_step": 322744, "epoch": 3888} {"train_loss": -26.23261070251465, "global_step": 322745, "epoch": 3888} {"train_loss": -25.749713897705078, "global_step": 322746, "epoch": 3888} {"train_loss": -25.975299835205078, "global_step": 322747, "epoch": 3888} {"train_loss": -26.028833389282227, "global_step": 322748, "epoch": 3888} {"train_loss": -25.921979904174805, "global_step": 322749, "epoch": 3888} {"train_loss": -25.93963050842285, "global_step": 322750, "epoch": 3888} {"train_loss": -26.313730239868164, "global_step": 322751, "epoch": 3888} {"train_loss": -25.579450607299805, "global_step": 322752, "epoch": 3888} {"train_loss": -25.914386749267578, "global_step": 322753, "epoch": 3888} {"train_loss": -25.14290428161621, "global_step": 322754, "epoch": 3888} {"train_loss": -25.49811363220215, "global_step": 322755, "epoch": 3888} {"train_loss": -26.00190544128418, "global_step": 322756, "epoch": 3888} {"train_loss": -25.0733699798584, "global_step": 322757, "epoch": 3888} {"train_loss": -25.770496368408203, "global_step": 322758, "epoch": 3888} {"train_loss": -25.244909286499023, "global_step": 322759, "epoch": 3888} {"train_loss": -25.823423385620117, "global_step": 322760, "epoch": 3888} {"train_loss": -25.667139053344727, "global_step": 322761, "epoch": 3888} {"train_loss": -25.83637809753418, "global_step": 322762, "epoch": 3888} {"train_loss": -25.6746768951416, "global_step": 322763, "epoch": 3888} {"train_loss": -26.082019805908203, "global_step": 322764, "epoch": 3888} {"train_loss": -26.12626075744629, "global_step": 322765, "epoch": 3888} {"train_loss": -25.845727920532227, "global_step": 322766, "epoch": 3888} {"train_loss": -25.696197509765625, "global_step": 322767, "epoch": 3888} {"train_loss": -26.170141220092773, "global_step": 322768, "epoch": 3888} {"train_loss": -25.92628288269043, "global_step": 322769, "epoch": 3888} {"train_loss": -25.94199562072754, "global_step": 322770, "epoch": 3888} {"train_loss": -25.8940372467041, "global_step": 322771, "epoch": 3888} {"train_loss": -25.816450119018555, "global_step": 322772, "epoch": 3888} {"train_loss": -25.811603546142578, "global_step": 322773, "epoch": 3888} {"train_loss": -26.100759506225586, "global_step": 322774, "epoch": 3888} {"train_loss": -25.855443954467773, "global_step": 322775, "epoch": 3888} {"train_loss": -25.83144187927246, "global_step": 322776, "epoch": 3888} {"train_loss": -25.868005752563477, "global_step": 322777, "epoch": 3888} {"train_loss": -25.985748291015625, "global_step": 322778, "epoch": 3888} {"train_loss": -26.168298721313477, "global_step": 322779, "epoch": 3888} {"train_loss": -25.8931827545166, "global_step": 322780, "epoch": 3888} {"train_loss": -26.13326072692871, "global_step": 322781, "epoch": 3888} {"train_loss": -25.884862899780273, "global_step": 322782, "epoch": 3888} {"train_loss": -25.70673942565918, "global_step": 322783, "epoch": 3888} {"train_loss": -26.05048942565918, "global_step": 322784, "epoch": 3888} {"train_loss": -26.13340187072754, "global_step": 322785, "epoch": 3888} {"train_loss": -25.82154958793916, "global_step": 322786, "epoch": 3888, "val_loss": 7260005.0} {"train_loss": -25.455829620361328, "global_step": 322787, "epoch": 3889} {"train_loss": -25.816564559936523, "global_step": 322788, "epoch": 3889} {"train_loss": -25.1785831451416, "global_step": 322789, "epoch": 3889} {"train_loss": -25.728025436401367, "global_step": 322790, "epoch": 3889} {"train_loss": -25.914081573486328, "global_step": 322791, "epoch": 3889} {"train_loss": -25.901899337768555, "global_step": 322792, "epoch": 3889} {"train_loss": -25.638839721679688, "global_step": 322793, "epoch": 3889} {"train_loss": -25.514240264892578, "global_step": 322794, "epoch": 3889} {"train_loss": -25.757755279541016, "global_step": 322795, "epoch": 3889} {"train_loss": -26.02048110961914, "global_step": 322796, "epoch": 3889} {"train_loss": -25.874357223510742, "global_step": 322797, "epoch": 3889} {"train_loss": -25.796106338500977, "global_step": 322798, "epoch": 3889} {"train_loss": -25.77249526977539, "global_step": 322799, "epoch": 3889} {"train_loss": -26.059839248657227, "global_step": 322800, "epoch": 3889} {"train_loss": -25.830610275268555, "global_step": 322801, "epoch": 3889} {"train_loss": -25.8951358795166, "global_step": 322802, "epoch": 3889} {"train_loss": -25.90455436706543, "global_step": 322803, "epoch": 3889} {"train_loss": -25.84500503540039, "global_step": 322804, "epoch": 3889} {"train_loss": -26.10194969177246, "global_step": 322805, "epoch": 3889} {"train_loss": -25.761316299438477, "global_step": 322806, "epoch": 3889} {"train_loss": -25.707639694213867, "global_step": 322807, "epoch": 3889} {"train_loss": -25.810270309448242, "global_step": 322808, "epoch": 3889} {"train_loss": -25.707855224609375, "global_step": 322809, "epoch": 3889} {"train_loss": -25.695220947265625, "global_step": 322810, "epoch": 3889} {"train_loss": -26.051837921142578, "global_step": 322811, "epoch": 3889} {"train_loss": -25.593067169189453, "global_step": 322812, "epoch": 3889} {"train_loss": -25.6492919921875, "global_step": 322813, "epoch": 3889} {"train_loss": -25.591642379760742, "global_step": 322814, "epoch": 3889} {"train_loss": -25.837980270385742, "global_step": 322815, "epoch": 3889} {"train_loss": -25.502273559570312, "global_step": 322816, "epoch": 3889} {"train_loss": -25.927968978881836, "global_step": 322817, "epoch": 3889} {"train_loss": -25.635053634643555, "global_step": 322818, "epoch": 3889} {"train_loss": -25.656986236572266, "global_step": 322819, "epoch": 3889} {"train_loss": -25.32554054260254, "global_step": 322820, "epoch": 3889} {"train_loss": -25.489540100097656, "global_step": 322821, "epoch": 3889} {"train_loss": -25.990835189819336, "global_step": 322822, "epoch": 3889} {"train_loss": -25.761926651000977, "global_step": 322823, "epoch": 3889} {"train_loss": -25.57699966430664, "global_step": 322824, "epoch": 3889} {"train_loss": -25.906005859375, "global_step": 322825, "epoch": 3889} {"train_loss": -25.5341796875, "global_step": 322826, "epoch": 3889} {"train_loss": -26.191059112548828, "global_step": 322827, "epoch": 3889} {"train_loss": -26.003467559814453, "global_step": 322828, "epoch": 3889} {"train_loss": -26.230716705322266, "global_step": 322829, "epoch": 3889} {"train_loss": -25.7811279296875, "global_step": 322830, "epoch": 3889} {"train_loss": -26.179916381835938, "global_step": 322831, "epoch": 3889} {"train_loss": -25.75811195373535, "global_step": 322832, "epoch": 3889} {"train_loss": -26.01104164123535, "global_step": 322833, "epoch": 3889} {"train_loss": -25.687280654907227, "global_step": 322834, "epoch": 3889} {"train_loss": -25.49822425842285, "global_step": 322835, "epoch": 3889} {"train_loss": -26.221954345703125, "global_step": 322836, "epoch": 3889} {"train_loss": -25.919363021850586, "global_step": 322837, "epoch": 3889} {"train_loss": -26.15290641784668, "global_step": 322838, "epoch": 3889} {"train_loss": -26.10888671875, "global_step": 322839, "epoch": 3889} {"train_loss": -26.368825912475586, "global_step": 322840, "epoch": 3889} {"train_loss": -25.64094352722168, "global_step": 322841, "epoch": 3889} {"train_loss": -26.345991134643555, "global_step": 322842, "epoch": 3889} {"train_loss": -26.121200561523438, "global_step": 322843, "epoch": 3889} {"train_loss": -25.783843994140625, "global_step": 322844, "epoch": 3889} {"train_loss": -26.050281524658203, "global_step": 322845, "epoch": 3889} {"train_loss": -26.31756591796875, "global_step": 322846, "epoch": 3889} {"train_loss": -25.881122589111328, "global_step": 322847, "epoch": 3889} {"train_loss": -25.782297134399414, "global_step": 322848, "epoch": 3889} {"train_loss": -25.906721115112305, "global_step": 322849, "epoch": 3889} {"train_loss": -25.917367935180664, "global_step": 322850, "epoch": 3889} {"train_loss": -25.43849754333496, "global_step": 322851, "epoch": 3889} {"train_loss": -25.646747589111328, "global_step": 322852, "epoch": 3889} {"train_loss": -25.880767822265625, "global_step": 322853, "epoch": 3889} {"train_loss": -26.388715744018555, "global_step": 322854, "epoch": 3889} {"train_loss": -26.024084091186523, "global_step": 322855, "epoch": 3889} {"train_loss": -25.78521156311035, "global_step": 322856, "epoch": 3889} {"train_loss": -25.623029708862305, "global_step": 322857, "epoch": 3889} {"train_loss": -25.65545654296875, "global_step": 322858, "epoch": 3889} {"train_loss": -26.09025001525879, "global_step": 322859, "epoch": 3889} {"train_loss": -25.721120834350586, "global_step": 322860, "epoch": 3889} {"train_loss": -25.575830459594727, "global_step": 322861, "epoch": 3889} {"train_loss": -25.804443359375, "global_step": 322862, "epoch": 3889} {"train_loss": -25.459928512573242, "global_step": 322863, "epoch": 3889} {"train_loss": -25.507312774658203, "global_step": 322864, "epoch": 3889} {"train_loss": -25.574193954467773, "global_step": 322865, "epoch": 3889} {"train_loss": -25.533828735351562, "global_step": 322866, "epoch": 3889} {"train_loss": -25.88972282409668, "global_step": 322867, "epoch": 3889} {"train_loss": -25.835498809814453, "global_step": 322868, "epoch": 3889} {"train_loss": -25.826234013201244, "global_step": 322869, "epoch": 3889, "val_loss": 7213600.0} {"train_loss": -24.655834197998047, "global_step": 322870, "epoch": 3890} {"train_loss": -25.46428680419922, "global_step": 322871, "epoch": 3890} {"train_loss": -25.006826400756836, "global_step": 322872, "epoch": 3890} {"train_loss": -25.02530860900879, "global_step": 322873, "epoch": 3890} {"train_loss": -25.06084632873535, "global_step": 322874, "epoch": 3890} {"train_loss": -25.3531436920166, "global_step": 322875, "epoch": 3890} {"train_loss": -25.112234115600586, "global_step": 322876, "epoch": 3890} {"train_loss": -25.18955421447754, "global_step": 322877, "epoch": 3890} {"train_loss": -25.28220558166504, "global_step": 322878, "epoch": 3890} {"train_loss": -25.393156051635742, "global_step": 322879, "epoch": 3890} {"train_loss": -25.586624145507812, "global_step": 322880, "epoch": 3890} {"train_loss": -24.92566680908203, "global_step": 322881, "epoch": 3890} {"train_loss": -25.25213050842285, "global_step": 322882, "epoch": 3890} {"train_loss": -25.2545223236084, "global_step": 322883, "epoch": 3890} {"train_loss": -25.48251724243164, "global_step": 322884, "epoch": 3890} {"train_loss": -25.632400512695312, "global_step": 322885, "epoch": 3890} {"train_loss": -25.464887619018555, "global_step": 322886, "epoch": 3890} {"train_loss": -25.4627628326416, "global_step": 322887, "epoch": 3890} {"train_loss": -25.809356689453125, "global_step": 322888, "epoch": 3890} {"train_loss": -25.471994400024414, "global_step": 322889, "epoch": 3890} {"train_loss": -25.873579025268555, "global_step": 322890, "epoch": 3890} {"train_loss": -25.662128448486328, "global_step": 322891, "epoch": 3890} {"train_loss": -25.4764347076416, "global_step": 322892, "epoch": 3890} {"train_loss": -25.560239791870117, "global_step": 322893, "epoch": 3890} {"train_loss": -25.963796615600586, "global_step": 322894, "epoch": 3890} {"train_loss": -25.536664962768555, "global_step": 322895, "epoch": 3890} {"train_loss": -25.63398551940918, "global_step": 322896, "epoch": 3890} {"train_loss": -25.6042537689209, "global_step": 322897, "epoch": 3890} {"train_loss": -25.826282501220703, "global_step": 322898, "epoch": 3890} {"train_loss": -25.80556297302246, "global_step": 322899, "epoch": 3890} {"train_loss": -25.965085983276367, "global_step": 322900, "epoch": 3890} {"train_loss": -25.531217575073242, "global_step": 322901, "epoch": 3890} {"train_loss": -25.634641647338867, "global_step": 322902, "epoch": 3890} {"train_loss": -25.796955108642578, "global_step": 322903, "epoch": 3890} {"train_loss": -25.650012969970703, "global_step": 322904, "epoch": 3890} {"train_loss": -26.386856079101562, "global_step": 322905, "epoch": 3890} {"train_loss": -26.032190322875977, "global_step": 322906, "epoch": 3890} {"train_loss": -25.97959327697754, "global_step": 322907, "epoch": 3890} {"train_loss": -26.069534301757812, "global_step": 322908, "epoch": 3890} {"train_loss": -26.171422958374023, "global_step": 322909, "epoch": 3890} {"train_loss": -25.74346351623535, "global_step": 322910, "epoch": 3890} {"train_loss": -25.90541648864746, "global_step": 322911, "epoch": 3890} {"train_loss": -26.194326400756836, "global_step": 322912, "epoch": 3890} {"train_loss": -26.204660415649414, "global_step": 322913, "epoch": 3890} {"train_loss": -26.13128662109375, "global_step": 322914, "epoch": 3890} {"train_loss": -26.09339714050293, "global_step": 322915, "epoch": 3890} {"train_loss": -25.947223663330078, "global_step": 322916, "epoch": 3890} {"train_loss": -25.831527709960938, "global_step": 322917, "epoch": 3890} {"train_loss": -25.840906143188477, "global_step": 322918, "epoch": 3890} {"train_loss": -25.95170021057129, "global_step": 322919, "epoch": 3890} {"train_loss": -26.065805435180664, "global_step": 322920, "epoch": 3890} {"train_loss": -25.906152725219727, "global_step": 322921, "epoch": 3890} {"train_loss": -25.943613052368164, "global_step": 322922, "epoch": 3890} {"train_loss": -26.24336814880371, "global_step": 322923, "epoch": 3890} {"train_loss": -25.694610595703125, "global_step": 322924, "epoch": 3890} {"train_loss": -25.762746810913086, "global_step": 322925, "epoch": 3890} {"train_loss": -25.403974533081055, "global_step": 322926, "epoch": 3890} {"train_loss": -25.864124298095703, "global_step": 322927, "epoch": 3890} {"train_loss": -25.929784774780273, "global_step": 322928, "epoch": 3890} {"train_loss": -25.91872215270996, "global_step": 322929, "epoch": 3890} {"train_loss": -25.988296508789062, "global_step": 322930, "epoch": 3890} {"train_loss": -25.900726318359375, "global_step": 322931, "epoch": 3890} {"train_loss": -26.126440048217773, "global_step": 322932, "epoch": 3890} {"train_loss": -25.544286727905273, "global_step": 322933, "epoch": 3890} {"train_loss": -26.179950714111328, "global_step": 322934, "epoch": 3890} {"train_loss": -25.674795150756836, "global_step": 322935, "epoch": 3890} {"train_loss": -25.334238052368164, "global_step": 322936, "epoch": 3890} {"train_loss": -25.694000244140625, "global_step": 322937, "epoch": 3890} {"train_loss": -25.71540641784668, "global_step": 322938, "epoch": 3890} {"train_loss": -25.85194206237793, "global_step": 322939, "epoch": 3890} {"train_loss": -25.75575065612793, "global_step": 322940, "epoch": 3890} {"train_loss": -25.748477935791016, "global_step": 322941, "epoch": 3890} {"train_loss": -25.996740341186523, "global_step": 322942, "epoch": 3890} {"train_loss": -25.67466163635254, "global_step": 322943, "epoch": 3890} {"train_loss": -25.67140769958496, "global_step": 322944, "epoch": 3890} {"train_loss": -25.567861557006836, "global_step": 322945, "epoch": 3890} {"train_loss": -25.58447265625, "global_step": 322946, "epoch": 3890} {"train_loss": -25.789331436157227, "global_step": 322947, "epoch": 3890} {"train_loss": -25.930749893188477, "global_step": 322948, "epoch": 3890} {"train_loss": -25.723968505859375, "global_step": 322949, "epoch": 3890} {"train_loss": -25.790449142456055, "global_step": 322950, "epoch": 3890} {"train_loss": -26.062488555908203, "global_step": 322951, "epoch": 3890} {"train_loss": -25.718731179294817, "global_step": 322952, "epoch": 3890, "val_loss": 7200184.0} {"train_loss": -25.64487648010254, "global_step": 322953, "epoch": 3891} {"train_loss": -24.928438186645508, "global_step": 322954, "epoch": 3891} {"train_loss": -25.2977237701416, "global_step": 322955, "epoch": 3891} {"train_loss": -25.705596923828125, "global_step": 322956, "epoch": 3891} {"train_loss": -25.154706954956055, "global_step": 322957, "epoch": 3891} {"train_loss": -25.900455474853516, "global_step": 322958, "epoch": 3891} {"train_loss": -25.79425621032715, "global_step": 322959, "epoch": 3891} {"train_loss": -25.27998161315918, "global_step": 322960, "epoch": 3891} {"train_loss": -25.438459396362305, "global_step": 322961, "epoch": 3891} {"train_loss": -25.60791015625, "global_step": 322962, "epoch": 3891} {"train_loss": -25.418554306030273, "global_step": 322963, "epoch": 3891} {"train_loss": -25.51840591430664, "global_step": 322964, "epoch": 3891} {"train_loss": -25.7445125579834, "global_step": 322965, "epoch": 3891} {"train_loss": -25.53917121887207, "global_step": 322966, "epoch": 3891} {"train_loss": -25.892414093017578, "global_step": 322967, "epoch": 3891} {"train_loss": -26.12885093688965, "global_step": 322968, "epoch": 3891} {"train_loss": -25.5164852142334, "global_step": 322969, "epoch": 3891} {"train_loss": -25.985082626342773, "global_step": 322970, "epoch": 3891} {"train_loss": -25.921100616455078, "global_step": 322971, "epoch": 3891} {"train_loss": -25.9875545501709, "global_step": 322972, "epoch": 3891} {"train_loss": -25.925769805908203, "global_step": 322973, "epoch": 3891} {"train_loss": -25.902740478515625, "global_step": 322974, "epoch": 3891} {"train_loss": -26.121841430664062, "global_step": 322975, "epoch": 3891} {"train_loss": -26.170761108398438, "global_step": 322976, "epoch": 3891} {"train_loss": -25.813520431518555, "global_step": 322977, "epoch": 3891} {"train_loss": -25.867725372314453, "global_step": 322978, "epoch": 3891} {"train_loss": -25.91068458557129, "global_step": 322979, "epoch": 3891} {"train_loss": -26.02703285217285, "global_step": 322980, "epoch": 3891} {"train_loss": -25.864246368408203, "global_step": 322981, "epoch": 3891} {"train_loss": -26.0572452545166, "global_step": 322982, "epoch": 3891} {"train_loss": -26.211963653564453, "global_step": 322983, "epoch": 3891} {"train_loss": -25.99726676940918, "global_step": 322984, "epoch": 3891} {"train_loss": -25.85346794128418, "global_step": 322985, "epoch": 3891} {"train_loss": -25.902814865112305, "global_step": 322986, "epoch": 3891} {"train_loss": -25.904626846313477, "global_step": 322987, "epoch": 3891} {"train_loss": -26.245166778564453, "global_step": 322988, "epoch": 3891} {"train_loss": -26.31048011779785, "global_step": 322989, "epoch": 3891} {"train_loss": -25.7568302154541, "global_step": 322990, "epoch": 3891} {"train_loss": -26.347244262695312, "global_step": 322991, "epoch": 3891} {"train_loss": -25.975637435913086, "global_step": 322992, "epoch": 3891} {"train_loss": -26.192304611206055, "global_step": 322993, "epoch": 3891} {"train_loss": -25.58738899230957, "global_step": 322994, "epoch": 3891} {"train_loss": -25.636764526367188, "global_step": 322995, "epoch": 3891} {"train_loss": -26.110925674438477, "global_step": 322996, "epoch": 3891} {"train_loss": -25.9603214263916, "global_step": 322997, "epoch": 3891} {"train_loss": -25.745502471923828, "global_step": 322998, "epoch": 3891} {"train_loss": -25.521446228027344, "global_step": 322999, "epoch": 3891} {"train_loss": -25.850736618041992, "global_step": 323000, "epoch": 3891} {"train_loss": -25.811756134033203, "global_step": 323001, "epoch": 3891} {"train_loss": -25.965957641601562, "global_step": 323002, "epoch": 3891} {"train_loss": -26.098724365234375, "global_step": 323003, "epoch": 3891} {"train_loss": -25.460458755493164, "global_step": 323004, "epoch": 3891} {"train_loss": -26.101318359375, "global_step": 323005, "epoch": 3891} {"train_loss": -26.053470611572266, "global_step": 323006, "epoch": 3891} {"train_loss": -25.48491668701172, "global_step": 323007, "epoch": 3891} {"train_loss": -25.586427688598633, "global_step": 323008, "epoch": 3891} {"train_loss": -25.984760284423828, "global_step": 323009, "epoch": 3891} {"train_loss": -26.024200439453125, "global_step": 323010, "epoch": 3891} {"train_loss": -25.697986602783203, "global_step": 323011, "epoch": 3891} {"train_loss": -25.555295944213867, "global_step": 323012, "epoch": 3891} {"train_loss": -25.71478843688965, "global_step": 323013, "epoch": 3891} {"train_loss": -25.96095848083496, "global_step": 323014, "epoch": 3891} {"train_loss": -25.858978271484375, "global_step": 323015, "epoch": 3891} {"train_loss": -25.64764976501465, "global_step": 323016, "epoch": 3891} {"train_loss": -25.124116897583008, "global_step": 323017, "epoch": 3891} {"train_loss": -25.808942794799805, "global_step": 323018, "epoch": 3891} {"train_loss": -25.7052059173584, "global_step": 323019, "epoch": 3891} {"train_loss": -25.526309967041016, "global_step": 323020, "epoch": 3891} {"train_loss": -25.953052520751953, "global_step": 323021, "epoch": 3891} {"train_loss": -25.898788452148438, "global_step": 323022, "epoch": 3891} {"train_loss": -25.685407638549805, "global_step": 323023, "epoch": 3891} {"train_loss": -25.636764526367188, "global_step": 323024, "epoch": 3891} {"train_loss": -25.37984275817871, "global_step": 323025, "epoch": 3891} {"train_loss": -25.903705596923828, "global_step": 323026, "epoch": 3891} {"train_loss": -25.9628849029541, "global_step": 323027, "epoch": 3891} {"train_loss": -26.072040557861328, "global_step": 323028, "epoch": 3891} {"train_loss": -25.867111206054688, "global_step": 323029, "epoch": 3891} {"train_loss": -25.565631866455078, "global_step": 323030, "epoch": 3891} {"train_loss": -25.940643310546875, "global_step": 323031, "epoch": 3891} {"train_loss": -25.951807022094727, "global_step": 323032, "epoch": 3891} {"train_loss": -25.807331085205078, "global_step": 323033, "epoch": 3891} {"train_loss": -25.931568145751953, "global_step": 323034, "epoch": 3891} {"train_loss": -25.79763826117458, "global_step": 323035, "epoch": 3891, "val_loss": 7121212.0} {"train_loss": -25.953399658203125, "global_step": 323036, "epoch": 3892} {"train_loss": -25.352949142456055, "global_step": 323037, "epoch": 3892} {"train_loss": -25.226665496826172, "global_step": 323038, "epoch": 3892} {"train_loss": -25.8826961517334, "global_step": 323039, "epoch": 3892} {"train_loss": -24.910627365112305, "global_step": 323040, "epoch": 3892} {"train_loss": -25.7291316986084, "global_step": 323041, "epoch": 3892} {"train_loss": -25.600431442260742, "global_step": 323042, "epoch": 3892} {"train_loss": -25.213916778564453, "global_step": 323043, "epoch": 3892} {"train_loss": -25.646881103515625, "global_step": 323044, "epoch": 3892} {"train_loss": -25.22176170349121, "global_step": 323045, "epoch": 3892} {"train_loss": -25.877243041992188, "global_step": 323046, "epoch": 3892} {"train_loss": -25.603595733642578, "global_step": 323047, "epoch": 3892} {"train_loss": -25.77058219909668, "global_step": 323048, "epoch": 3892} {"train_loss": -25.699193954467773, "global_step": 323049, "epoch": 3892} {"train_loss": -25.86024284362793, "global_step": 323050, "epoch": 3892} {"train_loss": -25.641382217407227, "global_step": 323051, "epoch": 3892} {"train_loss": -25.770633697509766, "global_step": 323052, "epoch": 3892} {"train_loss": -26.20281410217285, "global_step": 323053, "epoch": 3892} {"train_loss": -25.856122970581055, "global_step": 323054, "epoch": 3892} {"train_loss": -25.9829044342041, "global_step": 323055, "epoch": 3892} {"train_loss": -25.777402877807617, "global_step": 323056, "epoch": 3892} {"train_loss": -25.998737335205078, "global_step": 323057, "epoch": 3892} {"train_loss": -26.162412643432617, "global_step": 323058, "epoch": 3892} {"train_loss": -25.950254440307617, "global_step": 323059, "epoch": 3892} {"train_loss": -25.674097061157227, "global_step": 323060, "epoch": 3892} {"train_loss": -25.714200973510742, "global_step": 323061, "epoch": 3892} {"train_loss": -26.062902450561523, "global_step": 323062, "epoch": 3892} {"train_loss": -25.843107223510742, "global_step": 323063, "epoch": 3892} {"train_loss": -25.7816104888916, "global_step": 323064, "epoch": 3892} {"train_loss": -25.9509334564209, "global_step": 323065, "epoch": 3892} {"train_loss": -25.83734703063965, "global_step": 323066, "epoch": 3892} {"train_loss": -26.101816177368164, "global_step": 323067, "epoch": 3892} {"train_loss": -25.68538475036621, "global_step": 323068, "epoch": 3892} {"train_loss": -25.71535301208496, "global_step": 323069, "epoch": 3892} {"train_loss": -25.8024845123291, "global_step": 323070, "epoch": 3892} {"train_loss": -25.642547607421875, "global_step": 323071, "epoch": 3892} {"train_loss": -25.742162704467773, "global_step": 323072, "epoch": 3892} {"train_loss": -25.328311920166016, "global_step": 323073, "epoch": 3892} {"train_loss": -25.65340232849121, "global_step": 323074, "epoch": 3892} {"train_loss": -25.916162490844727, "global_step": 323075, "epoch": 3892} {"train_loss": -25.637653350830078, "global_step": 323076, "epoch": 3892} {"train_loss": -25.546775817871094, "global_step": 323077, "epoch": 3892} {"train_loss": -25.770889282226562, "global_step": 323078, "epoch": 3892} {"train_loss": -25.88959312438965, "global_step": 323079, "epoch": 3892} {"train_loss": -26.21132469177246, "global_step": 323080, "epoch": 3892} {"train_loss": -25.427921295166016, "global_step": 323081, "epoch": 3892} {"train_loss": -25.829456329345703, "global_step": 323082, "epoch": 3892} {"train_loss": -26.059253692626953, "global_step": 323083, "epoch": 3892} {"train_loss": -26.00203514099121, "global_step": 323084, "epoch": 3892} {"train_loss": -25.964269638061523, "global_step": 323085, "epoch": 3892} {"train_loss": -25.949665069580078, "global_step": 323086, "epoch": 3892} {"train_loss": -25.452211380004883, "global_step": 323087, "epoch": 3892} {"train_loss": -25.758731842041016, "global_step": 323088, "epoch": 3892} {"train_loss": -25.92391014099121, "global_step": 323089, "epoch": 3892} {"train_loss": -25.543964385986328, "global_step": 323090, "epoch": 3892} {"train_loss": -25.916446685791016, "global_step": 323091, "epoch": 3892} {"train_loss": -25.245162963867188, "global_step": 323092, "epoch": 3892} {"train_loss": -26.00152015686035, "global_step": 323093, "epoch": 3892} {"train_loss": -25.990680694580078, "global_step": 323094, "epoch": 3892} {"train_loss": -26.157733917236328, "global_step": 323095, "epoch": 3892} {"train_loss": -25.800764083862305, "global_step": 323096, "epoch": 3892} {"train_loss": -26.06483268737793, "global_step": 323097, "epoch": 3892} {"train_loss": -25.848291397094727, "global_step": 323098, "epoch": 3892} {"train_loss": -26.28205680847168, "global_step": 323099, "epoch": 3892} {"train_loss": -25.94137954711914, "global_step": 323100, "epoch": 3892} {"train_loss": -26.095111846923828, "global_step": 323101, "epoch": 3892} {"train_loss": -25.5721492767334, "global_step": 323102, "epoch": 3892} {"train_loss": -26.1601505279541, "global_step": 323103, "epoch": 3892} {"train_loss": -26.20814323425293, "global_step": 323104, "epoch": 3892} {"train_loss": -25.954498291015625, "global_step": 323105, "epoch": 3892} {"train_loss": -26.390073776245117, "global_step": 323106, "epoch": 3892} {"train_loss": -26.21968650817871, "global_step": 323107, "epoch": 3892} {"train_loss": -26.1751708984375, "global_step": 323108, "epoch": 3892} {"train_loss": -26.13433265686035, "global_step": 323109, "epoch": 3892} {"train_loss": -26.088397979736328, "global_step": 323110, "epoch": 3892} {"train_loss": -25.802204132080078, "global_step": 323111, "epoch": 3892} {"train_loss": -25.8736515045166, "global_step": 323112, "epoch": 3892} {"train_loss": -26.404062271118164, "global_step": 323113, "epoch": 3892} {"train_loss": -26.21217155456543, "global_step": 323114, "epoch": 3892} {"train_loss": -26.19053077697754, "global_step": 323115, "epoch": 3892} {"train_loss": -25.739500045776367, "global_step": 323116, "epoch": 3892} {"train_loss": -26.00518798828125, "global_step": 323117, "epoch": 3892} {"train_loss": -25.855543228517096, "global_step": 323118, "epoch": 3892, "val_loss": 7129549.0} {"train_loss": -25.625091552734375, "global_step": 323119, "epoch": 3893} {"train_loss": -24.459489822387695, "global_step": 323120, "epoch": 3893} {"train_loss": -24.32520866394043, "global_step": 323121, "epoch": 3893} {"train_loss": -24.541234970092773, "global_step": 323122, "epoch": 3893} {"train_loss": -24.541440963745117, "global_step": 323123, "epoch": 3893} {"train_loss": -24.784147262573242, "global_step": 323124, "epoch": 3893} {"train_loss": -25.057952880859375, "global_step": 323125, "epoch": 3893} {"train_loss": -25.068429946899414, "global_step": 323126, "epoch": 3893} {"train_loss": -25.57143211364746, "global_step": 323127, "epoch": 3893} {"train_loss": -25.396034240722656, "global_step": 323128, "epoch": 3893} {"train_loss": -25.505231857299805, "global_step": 323129, "epoch": 3893} {"train_loss": -25.69148063659668, "global_step": 323130, "epoch": 3893} {"train_loss": -25.456584930419922, "global_step": 323131, "epoch": 3893} {"train_loss": -25.60035514831543, "global_step": 323132, "epoch": 3893} {"train_loss": -25.398595809936523, "global_step": 323133, "epoch": 3893} {"train_loss": -25.421716690063477, "global_step": 323134, "epoch": 3893} {"train_loss": -25.45265007019043, "global_step": 323135, "epoch": 3893} {"train_loss": -25.7080078125, "global_step": 323136, "epoch": 3893} {"train_loss": -25.749765396118164, "global_step": 323137, "epoch": 3893} {"train_loss": -25.493040084838867, "global_step": 323138, "epoch": 3893} {"train_loss": -25.855932235717773, "global_step": 323139, "epoch": 3893} {"train_loss": -25.79463005065918, "global_step": 323140, "epoch": 3893} {"train_loss": -25.893945693969727, "global_step": 323141, "epoch": 3893} {"train_loss": -25.57889175415039, "global_step": 323142, "epoch": 3893} {"train_loss": -25.82636070251465, "global_step": 323143, "epoch": 3893} {"train_loss": -25.597074508666992, "global_step": 323144, "epoch": 3893} {"train_loss": -25.945348739624023, "global_step": 323145, "epoch": 3893} {"train_loss": -25.482223510742188, "global_step": 323146, "epoch": 3893} {"train_loss": -25.90264892578125, "global_step": 323147, "epoch": 3893} {"train_loss": -25.45416831970215, "global_step": 323148, "epoch": 3893} {"train_loss": -25.847747802734375, "global_step": 323149, "epoch": 3893} {"train_loss": -25.91940689086914, "global_step": 323150, "epoch": 3893} {"train_loss": -25.761709213256836, "global_step": 323151, "epoch": 3893} {"train_loss": -25.900543212890625, "global_step": 323152, "epoch": 3893} {"train_loss": -25.671056747436523, "global_step": 323153, "epoch": 3893} {"train_loss": -25.473901748657227, "global_step": 323154, "epoch": 3893} {"train_loss": -25.812271118164062, "global_step": 323155, "epoch": 3893} {"train_loss": -25.81439208984375, "global_step": 323156, "epoch": 3893} {"train_loss": -25.9747314453125, "global_step": 323157, "epoch": 3893} {"train_loss": -25.940704345703125, "global_step": 323158, "epoch": 3893} {"train_loss": -26.18001365661621, "global_step": 323159, "epoch": 3893} {"train_loss": -25.752134323120117, "global_step": 323160, "epoch": 3893} {"train_loss": -25.79911231994629, "global_step": 323161, "epoch": 3893} {"train_loss": -26.10959815979004, "global_step": 323162, "epoch": 3893} {"train_loss": -25.704120635986328, "global_step": 323163, "epoch": 3893} {"train_loss": -26.165678024291992, "global_step": 323164, "epoch": 3893} {"train_loss": -26.02704429626465, "global_step": 323165, "epoch": 3893} {"train_loss": -25.872028350830078, "global_step": 323166, "epoch": 3893} {"train_loss": -26.256500244140625, "global_step": 323167, "epoch": 3893} {"train_loss": -25.884674072265625, "global_step": 323168, "epoch": 3893} {"train_loss": -25.920766830444336, "global_step": 323169, "epoch": 3893} {"train_loss": -26.033655166625977, "global_step": 323170, "epoch": 3893} {"train_loss": -25.85316276550293, "global_step": 323171, "epoch": 3893} {"train_loss": -25.267427444458008, "global_step": 323172, "epoch": 3893} {"train_loss": -25.835346221923828, "global_step": 323173, "epoch": 3893} {"train_loss": -26.005517959594727, "global_step": 323174, "epoch": 3893} {"train_loss": -26.161972045898438, "global_step": 323175, "epoch": 3893} {"train_loss": -25.9200382232666, "global_step": 323176, "epoch": 3893} {"train_loss": -25.799915313720703, "global_step": 323177, "epoch": 3893} {"train_loss": -25.920385360717773, "global_step": 323178, "epoch": 3893} {"train_loss": -26.072355270385742, "global_step": 323179, "epoch": 3893} {"train_loss": -25.957056045532227, "global_step": 323180, "epoch": 3893} {"train_loss": -25.615020751953125, "global_step": 323181, "epoch": 3893} {"train_loss": -26.20680046081543, "global_step": 323182, "epoch": 3893} {"train_loss": -25.943883895874023, "global_step": 323183, "epoch": 3893} {"train_loss": -25.849090576171875, "global_step": 323184, "epoch": 3893} {"train_loss": -25.879003524780273, "global_step": 323185, "epoch": 3893} {"train_loss": -26.19589614868164, "global_step": 323186, "epoch": 3893} {"train_loss": -26.02638053894043, "global_step": 323187, "epoch": 3893} {"train_loss": -26.267852783203125, "global_step": 323188, "epoch": 3893} {"train_loss": -25.931821823120117, "global_step": 323189, "epoch": 3893} {"train_loss": -25.995227813720703, "global_step": 323190, "epoch": 3893} {"train_loss": -25.621109008789062, "global_step": 323191, "epoch": 3893} {"train_loss": -26.18416404724121, "global_step": 323192, "epoch": 3893} {"train_loss": -26.051273345947266, "global_step": 323193, "epoch": 3893} {"train_loss": -26.074752807617188, "global_step": 323194, "epoch": 3893} {"train_loss": -25.958969116210938, "global_step": 323195, "epoch": 3893} {"train_loss": -26.351318359375, "global_step": 323196, "epoch": 3893} {"train_loss": -25.995458602905273, "global_step": 323197, "epoch": 3893} {"train_loss": -25.977331161499023, "global_step": 323198, "epoch": 3893} {"train_loss": -26.048694610595703, "global_step": 323199, "epoch": 3893} {"train_loss": -26.030014038085938, "global_step": 323200, "epoch": 3893} {"train_loss": -25.739968357315984, "global_step": 323201, "epoch": 3893, "val_loss": 7228769.0} {"train_loss": -25.946353912353516, "global_step": 323202, "epoch": 3894} {"train_loss": -25.07419204711914, "global_step": 323203, "epoch": 3894} {"train_loss": -26.04707145690918, "global_step": 323204, "epoch": 3894} {"train_loss": -25.810773849487305, "global_step": 323205, "epoch": 3894} {"train_loss": -25.591140747070312, "global_step": 323206, "epoch": 3894} {"train_loss": -25.611684799194336, "global_step": 323207, "epoch": 3894} {"train_loss": -25.393320083618164, "global_step": 323208, "epoch": 3894} {"train_loss": -25.217817306518555, "global_step": 323209, "epoch": 3894} {"train_loss": -25.466503143310547, "global_step": 323210, "epoch": 3894} {"train_loss": -25.431623458862305, "global_step": 323211, "epoch": 3894} {"train_loss": -25.46724510192871, "global_step": 323212, "epoch": 3894} {"train_loss": -25.518169403076172, "global_step": 323213, "epoch": 3894} {"train_loss": -25.556005477905273, "global_step": 323214, "epoch": 3894} {"train_loss": -25.196624755859375, "global_step": 323215, "epoch": 3894} {"train_loss": -25.763376235961914, "global_step": 323216, "epoch": 3894} {"train_loss": -25.886505126953125, "global_step": 323217, "epoch": 3894} {"train_loss": -25.654020309448242, "global_step": 323218, "epoch": 3894} {"train_loss": -25.941272735595703, "global_step": 323219, "epoch": 3894} {"train_loss": -25.682178497314453, "global_step": 323220, "epoch": 3894} {"train_loss": -25.709497451782227, "global_step": 323221, "epoch": 3894} {"train_loss": -25.699811935424805, "global_step": 323222, "epoch": 3894} {"train_loss": -25.399118423461914, "global_step": 323223, "epoch": 3894} {"train_loss": -25.861835479736328, "global_step": 323224, "epoch": 3894} {"train_loss": -25.85457420349121, "global_step": 323225, "epoch": 3894} {"train_loss": -26.04827308654785, "global_step": 323226, "epoch": 3894} {"train_loss": -25.66438102722168, "global_step": 323227, "epoch": 3894} {"train_loss": -25.915597915649414, "global_step": 323228, "epoch": 3894} {"train_loss": -25.831390380859375, "global_step": 323229, "epoch": 3894} {"train_loss": -26.1154727935791, "global_step": 323230, "epoch": 3894} {"train_loss": -25.891376495361328, "global_step": 323231, "epoch": 3894} {"train_loss": -26.290082931518555, "global_step": 323232, "epoch": 3894} {"train_loss": -26.38868522644043, "global_step": 323233, "epoch": 3894} {"train_loss": -26.00166130065918, "global_step": 323234, "epoch": 3894} {"train_loss": -25.960126876831055, "global_step": 323235, "epoch": 3894} {"train_loss": -25.8353271484375, "global_step": 323236, "epoch": 3894} {"train_loss": -25.815759658813477, "global_step": 323237, "epoch": 3894} {"train_loss": -25.9752254486084, "global_step": 323238, "epoch": 3894} {"train_loss": -26.3106632232666, "global_step": 323239, "epoch": 3894} {"train_loss": -26.225202560424805, "global_step": 323240, "epoch": 3894} {"train_loss": -25.612939834594727, "global_step": 323241, "epoch": 3894} {"train_loss": -25.41653823852539, "global_step": 323242, "epoch": 3894} {"train_loss": -25.50074577331543, "global_step": 323243, "epoch": 3894} {"train_loss": -26.215742111206055, "global_step": 323244, "epoch": 3894} {"train_loss": -25.90262794494629, "global_step": 323245, "epoch": 3894} {"train_loss": -25.653051376342773, "global_step": 323246, "epoch": 3894} {"train_loss": -26.1163330078125, "global_step": 323247, "epoch": 3894} {"train_loss": -26.07499122619629, "global_step": 323248, "epoch": 3894} {"train_loss": -25.567800521850586, "global_step": 323249, "epoch": 3894} {"train_loss": -26.044336318969727, "global_step": 323250, "epoch": 3894} {"train_loss": -25.912765502929688, "global_step": 323251, "epoch": 3894} {"train_loss": -25.867490768432617, "global_step": 323252, "epoch": 3894} {"train_loss": -25.960920333862305, "global_step": 323253, "epoch": 3894} {"train_loss": -26.08928871154785, "global_step": 323254, "epoch": 3894} {"train_loss": -25.97040367126465, "global_step": 323255, "epoch": 3894} {"train_loss": -25.9332218170166, "global_step": 323256, "epoch": 3894} {"train_loss": -25.7980899810791, "global_step": 323257, "epoch": 3894} {"train_loss": -26.237462997436523, "global_step": 323258, "epoch": 3894} {"train_loss": -25.851484298706055, "global_step": 323259, "epoch": 3894} {"train_loss": -25.521461486816406, "global_step": 323260, "epoch": 3894} {"train_loss": -25.655759811401367, "global_step": 323261, "epoch": 3894} {"train_loss": -25.669754028320312, "global_step": 323262, "epoch": 3894} {"train_loss": -25.775739669799805, "global_step": 323263, "epoch": 3894} {"train_loss": -25.646692276000977, "global_step": 323264, "epoch": 3894} {"train_loss": -25.687719345092773, "global_step": 323265, "epoch": 3894} {"train_loss": -25.919031143188477, "global_step": 323266, "epoch": 3894} {"train_loss": -25.810626983642578, "global_step": 323267, "epoch": 3894} {"train_loss": -26.207120895385742, "global_step": 323268, "epoch": 3894} {"train_loss": -25.812597274780273, "global_step": 323269, "epoch": 3894} {"train_loss": -26.14703369140625, "global_step": 323270, "epoch": 3894} {"train_loss": -25.71866226196289, "global_step": 323271, "epoch": 3894} {"train_loss": -26.481088638305664, "global_step": 323272, "epoch": 3894} {"train_loss": -26.0360107421875, "global_step": 323273, "epoch": 3894} {"train_loss": -26.13154411315918, "global_step": 323274, "epoch": 3894} {"train_loss": -26.03132438659668, "global_step": 323275, "epoch": 3894} {"train_loss": -25.877172470092773, "global_step": 323276, "epoch": 3894} {"train_loss": -26.050994873046875, "global_step": 323277, "epoch": 3894} {"train_loss": -25.776630401611328, "global_step": 323278, "epoch": 3894} {"train_loss": -25.757627487182617, "global_step": 323279, "epoch": 3894} {"train_loss": -26.094823837280273, "global_step": 323280, "epoch": 3894} {"train_loss": -25.872802734375, "global_step": 323281, "epoch": 3894} {"train_loss": -25.955718994140625, "global_step": 323282, "epoch": 3894} {"train_loss": -25.952070236206055, "global_step": 323283, "epoch": 3894} {"train_loss": -25.839103859591198, "global_step": 323284, "epoch": 3894, "val_loss": 7156087.0} {"train_loss": -26.131591796875, "global_step": 323285, "epoch": 3895} {"train_loss": -25.75347328186035, "global_step": 323286, "epoch": 3895} {"train_loss": -25.40280532836914, "global_step": 323287, "epoch": 3895} {"train_loss": -25.705768585205078, "global_step": 323288, "epoch": 3895} {"train_loss": -25.79563331604004, "global_step": 323289, "epoch": 3895} {"train_loss": -25.426523208618164, "global_step": 323290, "epoch": 3895} {"train_loss": -25.626209259033203, "global_step": 323291, "epoch": 3895} {"train_loss": -25.549654006958008, "global_step": 323292, "epoch": 3895} {"train_loss": -25.1702823638916, "global_step": 323293, "epoch": 3895} {"train_loss": -25.420673370361328, "global_step": 323294, "epoch": 3895} {"train_loss": -25.778528213500977, "global_step": 323295, "epoch": 3895} {"train_loss": -25.443069458007812, "global_step": 323296, "epoch": 3895} {"train_loss": -25.658491134643555, "global_step": 323297, "epoch": 3895} {"train_loss": -25.603246688842773, "global_step": 323298, "epoch": 3895} {"train_loss": -25.282073974609375, "global_step": 323299, "epoch": 3895} {"train_loss": -25.724109649658203, "global_step": 323300, "epoch": 3895} {"train_loss": -25.903127670288086, "global_step": 323301, "epoch": 3895} {"train_loss": -25.866357803344727, "global_step": 323302, "epoch": 3895} {"train_loss": -25.38472557067871, "global_step": 323303, "epoch": 3895} {"train_loss": -25.607107162475586, "global_step": 323304, "epoch": 3895} {"train_loss": -25.485105514526367, "global_step": 323305, "epoch": 3895} {"train_loss": -25.885974884033203, "global_step": 323306, "epoch": 3895} {"train_loss": -25.587997436523438, "global_step": 323307, "epoch": 3895} {"train_loss": -25.888797760009766, "global_step": 323308, "epoch": 3895} {"train_loss": -26.092041015625, "global_step": 323309, "epoch": 3895} {"train_loss": -25.746442794799805, "global_step": 323310, "epoch": 3895} {"train_loss": -25.435855865478516, "global_step": 323311, "epoch": 3895} {"train_loss": -25.865583419799805, "global_step": 323312, "epoch": 3895} {"train_loss": -25.7926082611084, "global_step": 323313, "epoch": 3895} {"train_loss": -25.635339736938477, "global_step": 323314, "epoch": 3895} {"train_loss": -25.8505859375, "global_step": 323315, "epoch": 3895} {"train_loss": -25.299823760986328, "global_step": 323316, "epoch": 3895} {"train_loss": -25.734479904174805, "global_step": 323317, "epoch": 3895} {"train_loss": -25.793170928955078, "global_step": 323318, "epoch": 3895} {"train_loss": -26.053552627563477, "global_step": 323319, "epoch": 3895} {"train_loss": -25.642568588256836, "global_step": 323320, "epoch": 3895} {"train_loss": -25.86049461364746, "global_step": 323321, "epoch": 3895} {"train_loss": -26.045942306518555, "global_step": 323322, "epoch": 3895} {"train_loss": -26.162389755249023, "global_step": 323323, "epoch": 3895} {"train_loss": -25.74127197265625, "global_step": 323324, "epoch": 3895} {"train_loss": -25.627607345581055, "global_step": 323325, "epoch": 3895} {"train_loss": -25.895612716674805, "global_step": 323326, "epoch": 3895} {"train_loss": -25.862201690673828, "global_step": 323327, "epoch": 3895} {"train_loss": -25.8369197845459, "global_step": 323328, "epoch": 3895} {"train_loss": -25.644092559814453, "global_step": 323329, "epoch": 3895} {"train_loss": -25.829360961914062, "global_step": 323330, "epoch": 3895} {"train_loss": -25.82569694519043, "global_step": 323331, "epoch": 3895} {"train_loss": -25.559326171875, "global_step": 323332, "epoch": 3895} {"train_loss": -25.574756622314453, "global_step": 323333, "epoch": 3895} {"train_loss": -25.462671279907227, "global_step": 323334, "epoch": 3895} {"train_loss": -25.470956802368164, "global_step": 323335, "epoch": 3895} {"train_loss": -25.610919952392578, "global_step": 323336, "epoch": 3895} {"train_loss": -25.835113525390625, "global_step": 323337, "epoch": 3895} {"train_loss": -25.93471336364746, "global_step": 323338, "epoch": 3895} {"train_loss": -25.99722671508789, "global_step": 323339, "epoch": 3895} {"train_loss": -25.86435317993164, "global_step": 323340, "epoch": 3895} {"train_loss": -25.719879150390625, "global_step": 323341, "epoch": 3895} {"train_loss": -25.769651412963867, "global_step": 323342, "epoch": 3895} {"train_loss": -25.8697509765625, "global_step": 323343, "epoch": 3895} {"train_loss": -25.886215209960938, "global_step": 323344, "epoch": 3895} {"train_loss": -26.01291847229004, "global_step": 323345, "epoch": 3895} {"train_loss": -25.644529342651367, "global_step": 323346, "epoch": 3895} {"train_loss": -25.779211044311523, "global_step": 323347, "epoch": 3895} {"train_loss": -26.177825927734375, "global_step": 323348, "epoch": 3895} {"train_loss": -25.899871826171875, "global_step": 323349, "epoch": 3895} {"train_loss": -25.970685958862305, "global_step": 323350, "epoch": 3895} {"train_loss": -25.695520401000977, "global_step": 323351, "epoch": 3895} {"train_loss": -26.08747673034668, "global_step": 323352, "epoch": 3895} {"train_loss": -26.02849769592285, "global_step": 323353, "epoch": 3895} {"train_loss": -25.9011287689209, "global_step": 323354, "epoch": 3895} {"train_loss": -25.54592514038086, "global_step": 323355, "epoch": 3895} {"train_loss": -25.832122802734375, "global_step": 323356, "epoch": 3895} {"train_loss": -25.734968185424805, "global_step": 323357, "epoch": 3895} {"train_loss": -25.978641510009766, "global_step": 323358, "epoch": 3895} {"train_loss": -25.479476928710938, "global_step": 323359, "epoch": 3895} {"train_loss": -25.76905632019043, "global_step": 323360, "epoch": 3895} {"train_loss": -25.975605010986328, "global_step": 323361, "epoch": 3895} {"train_loss": -25.739389419555664, "global_step": 323362, "epoch": 3895} {"train_loss": -25.9204158782959, "global_step": 323363, "epoch": 3895} {"train_loss": -26.250951766967773, "global_step": 323364, "epoch": 3895} {"train_loss": -25.928953170776367, "global_step": 323365, "epoch": 3895} {"train_loss": -26.283374786376953, "global_step": 323366, "epoch": 3895} {"train_loss": -25.772418723048933, "global_step": 323367, "epoch": 3895, "val_loss": 7247887.0} {"train_loss": -25.282392501831055, "global_step": 323368, "epoch": 3896} {"train_loss": -25.554954528808594, "global_step": 323369, "epoch": 3896} {"train_loss": -25.405506134033203, "global_step": 323370, "epoch": 3896} {"train_loss": -25.55732536315918, "global_step": 323371, "epoch": 3896} {"train_loss": -25.501928329467773, "global_step": 323372, "epoch": 3896} {"train_loss": -25.898141860961914, "global_step": 323373, "epoch": 3896} {"train_loss": -25.490615844726562, "global_step": 323374, "epoch": 3896} {"train_loss": -26.087121963500977, "global_step": 323375, "epoch": 3896} {"train_loss": -25.43332290649414, "global_step": 323376, "epoch": 3896} {"train_loss": -25.599586486816406, "global_step": 323377, "epoch": 3896} {"train_loss": -25.85048484802246, "global_step": 323378, "epoch": 3896} {"train_loss": -25.840269088745117, "global_step": 323379, "epoch": 3896} {"train_loss": -25.653034210205078, "global_step": 323380, "epoch": 3896} {"train_loss": -25.85651206970215, "global_step": 323381, "epoch": 3896} {"train_loss": -25.962848663330078, "global_step": 323382, "epoch": 3896} {"train_loss": -25.99678611755371, "global_step": 323383, "epoch": 3896} {"train_loss": -25.563858032226562, "global_step": 323384, "epoch": 3896} {"train_loss": -25.862829208374023, "global_step": 323385, "epoch": 3896} {"train_loss": -25.677326202392578, "global_step": 323386, "epoch": 3896} {"train_loss": -25.94830894470215, "global_step": 323387, "epoch": 3896} {"train_loss": -26.044296264648438, "global_step": 323388, "epoch": 3896} {"train_loss": -25.6394100189209, "global_step": 323389, "epoch": 3896} {"train_loss": -25.95782470703125, "global_step": 323390, "epoch": 3896} {"train_loss": -26.093765258789062, "global_step": 323391, "epoch": 3896} {"train_loss": -25.804052352905273, "global_step": 323392, "epoch": 3896} {"train_loss": -26.143024444580078, "global_step": 323393, "epoch": 3896} {"train_loss": -25.794708251953125, "global_step": 323394, "epoch": 3896} {"train_loss": -26.03547477722168, "global_step": 323395, "epoch": 3896} {"train_loss": -26.190549850463867, "global_step": 323396, "epoch": 3896} {"train_loss": -25.85178565979004, "global_step": 323397, "epoch": 3896} {"train_loss": -25.720264434814453, "global_step": 323398, "epoch": 3896} {"train_loss": -26.124433517456055, "global_step": 323399, "epoch": 3896} {"train_loss": -26.047956466674805, "global_step": 323400, "epoch": 3896} {"train_loss": -25.8974609375, "global_step": 323401, "epoch": 3896} {"train_loss": -25.617273330688477, "global_step": 323402, "epoch": 3896} {"train_loss": -25.73090171813965, "global_step": 323403, "epoch": 3896} {"train_loss": -25.88092041015625, "global_step": 323404, "epoch": 3896} {"train_loss": -25.5866756439209, "global_step": 323405, "epoch": 3896} {"train_loss": -25.638620376586914, "global_step": 323406, "epoch": 3896} {"train_loss": -25.842273712158203, "global_step": 323407, "epoch": 3896} {"train_loss": -25.69890785217285, "global_step": 323408, "epoch": 3896} {"train_loss": -25.840606689453125, "global_step": 323409, "epoch": 3896} {"train_loss": -25.405567169189453, "global_step": 323410, "epoch": 3896} {"train_loss": -26.204376220703125, "global_step": 323411, "epoch": 3896} {"train_loss": -25.636030197143555, "global_step": 323412, "epoch": 3896} {"train_loss": -25.9091854095459, "global_step": 323413, "epoch": 3896} {"train_loss": -25.767637252807617, "global_step": 323414, "epoch": 3896} {"train_loss": -25.364471435546875, "global_step": 323415, "epoch": 3896} {"train_loss": -26.083906173706055, "global_step": 323416, "epoch": 3896} {"train_loss": -26.23443603515625, "global_step": 323417, "epoch": 3896} {"train_loss": -25.912939071655273, "global_step": 323418, "epoch": 3896} {"train_loss": -25.689233779907227, "global_step": 323419, "epoch": 3896} {"train_loss": -26.259845733642578, "global_step": 323420, "epoch": 3896} {"train_loss": -26.000076293945312, "global_step": 323421, "epoch": 3896} {"train_loss": -25.87855339050293, "global_step": 323422, "epoch": 3896} {"train_loss": -25.58155632019043, "global_step": 323423, "epoch": 3896} {"train_loss": -25.741296768188477, "global_step": 323424, "epoch": 3896} {"train_loss": -25.729150772094727, "global_step": 323425, "epoch": 3896} {"train_loss": -25.887609481811523, "global_step": 323426, "epoch": 3896} {"train_loss": -26.070642471313477, "global_step": 323427, "epoch": 3896} {"train_loss": -26.014896392822266, "global_step": 323428, "epoch": 3896} {"train_loss": -26.39876365661621, "global_step": 323429, "epoch": 3896} {"train_loss": -25.80917739868164, "global_step": 323430, "epoch": 3896} {"train_loss": -26.119766235351562, "global_step": 323431, "epoch": 3896} {"train_loss": -26.441518783569336, "global_step": 323432, "epoch": 3896} {"train_loss": -25.60536003112793, "global_step": 323433, "epoch": 3896} {"train_loss": -25.587392807006836, "global_step": 323434, "epoch": 3896} {"train_loss": -25.51531410217285, "global_step": 323435, "epoch": 3896} {"train_loss": -25.913854598999023, "global_step": 323436, "epoch": 3896} {"train_loss": -26.37055015563965, "global_step": 323437, "epoch": 3896} {"train_loss": -25.98111915588379, "global_step": 323438, "epoch": 3896} {"train_loss": -25.580760955810547, "global_step": 323439, "epoch": 3896} {"train_loss": -25.90986442565918, "global_step": 323440, "epoch": 3896} {"train_loss": -26.002948760986328, "global_step": 323441, "epoch": 3896} {"train_loss": -25.88857078552246, "global_step": 323442, "epoch": 3896} {"train_loss": -25.892004013061523, "global_step": 323443, "epoch": 3896} {"train_loss": -26.050384521484375, "global_step": 323444, "epoch": 3896} {"train_loss": -26.264509201049805, "global_step": 323445, "epoch": 3896} {"train_loss": -25.822675704956055, "global_step": 323446, "epoch": 3896} {"train_loss": -26.171131134033203, "global_step": 323447, "epoch": 3896} {"train_loss": -26.204336166381836, "global_step": 323448, "epoch": 3896} {"train_loss": -26.205276489257812, "global_step": 323449, "epoch": 3896} {"train_loss": -25.860460924814983, "global_step": 323450, "epoch": 3896, "val_loss": 7116998.0} {"train_loss": -25.330608367919922, "global_step": 323451, "epoch": 3897} {"train_loss": -25.814788818359375, "global_step": 323452, "epoch": 3897} {"train_loss": -25.54355239868164, "global_step": 323453, "epoch": 3897} {"train_loss": -25.80024528503418, "global_step": 323454, "epoch": 3897} {"train_loss": -25.429174423217773, "global_step": 323455, "epoch": 3897} {"train_loss": -25.129751205444336, "global_step": 323456, "epoch": 3897} {"train_loss": -25.68646240234375, "global_step": 323457, "epoch": 3897} {"train_loss": -25.183313369750977, "global_step": 323458, "epoch": 3897} {"train_loss": -25.614988327026367, "global_step": 323459, "epoch": 3897} {"train_loss": -25.643125534057617, "global_step": 323460, "epoch": 3897} {"train_loss": -25.778440475463867, "global_step": 323461, "epoch": 3897} {"train_loss": -25.86948013305664, "global_step": 323462, "epoch": 3897} {"train_loss": -26.0988712310791, "global_step": 323463, "epoch": 3897} {"train_loss": -25.726247787475586, "global_step": 323464, "epoch": 3897} {"train_loss": -25.619924545288086, "global_step": 323465, "epoch": 3897} {"train_loss": -25.826108932495117, "global_step": 323466, "epoch": 3897} {"train_loss": -25.92854118347168, "global_step": 323467, "epoch": 3897} {"train_loss": -25.515167236328125, "global_step": 323468, "epoch": 3897} {"train_loss": -25.698257446289062, "global_step": 323469, "epoch": 3897} {"train_loss": -25.66094970703125, "global_step": 323470, "epoch": 3897} {"train_loss": -25.75031089782715, "global_step": 323471, "epoch": 3897} {"train_loss": -25.731714248657227, "global_step": 323472, "epoch": 3897} {"train_loss": -25.85967445373535, "global_step": 323473, "epoch": 3897} {"train_loss": -26.19895362854004, "global_step": 323474, "epoch": 3897} {"train_loss": -25.728424072265625, "global_step": 323475, "epoch": 3897} {"train_loss": -25.96016502380371, "global_step": 323476, "epoch": 3897} {"train_loss": -25.942676544189453, "global_step": 323477, "epoch": 3897} {"train_loss": -25.61783790588379, "global_step": 323478, "epoch": 3897} {"train_loss": -26.0767879486084, "global_step": 323479, "epoch": 3897} {"train_loss": -26.149747848510742, "global_step": 323480, "epoch": 3897} {"train_loss": -25.751317977905273, "global_step": 323481, "epoch": 3897} {"train_loss": -25.322629928588867, "global_step": 323482, "epoch": 3897} {"train_loss": -25.651081085205078, "global_step": 323483, "epoch": 3897} {"train_loss": -26.133588790893555, "global_step": 323484, "epoch": 3897} {"train_loss": -25.782861709594727, "global_step": 323485, "epoch": 3897} {"train_loss": -25.999784469604492, "global_step": 323486, "epoch": 3897} {"train_loss": -25.97210693359375, "global_step": 323487, "epoch": 3897} {"train_loss": -26.056289672851562, "global_step": 323488, "epoch": 3897} {"train_loss": -25.445945739746094, "global_step": 323489, "epoch": 3897} {"train_loss": -25.79998207092285, "global_step": 323490, "epoch": 3897} {"train_loss": -26.001346588134766, "global_step": 323491, "epoch": 3897} {"train_loss": -25.683507919311523, "global_step": 323492, "epoch": 3897} {"train_loss": -25.681116104125977, "global_step": 323493, "epoch": 3897} {"train_loss": -26.104806900024414, "global_step": 323494, "epoch": 3897} {"train_loss": -26.05579948425293, "global_step": 323495, "epoch": 3897} {"train_loss": -25.81292724609375, "global_step": 323496, "epoch": 3897} {"train_loss": -26.034021377563477, "global_step": 323497, "epoch": 3897} {"train_loss": -25.907428741455078, "global_step": 323498, "epoch": 3897} {"train_loss": -25.736257553100586, "global_step": 323499, "epoch": 3897} {"train_loss": -26.19636344909668, "global_step": 323500, "epoch": 3897} {"train_loss": -25.657154083251953, "global_step": 323501, "epoch": 3897} {"train_loss": -26.042280197143555, "global_step": 323502, "epoch": 3897} {"train_loss": -26.110456466674805, "global_step": 323503, "epoch": 3897} {"train_loss": -26.1180362701416, "global_step": 323504, "epoch": 3897} {"train_loss": -25.494253158569336, "global_step": 323505, "epoch": 3897} {"train_loss": -26.028799057006836, "global_step": 323506, "epoch": 3897} {"train_loss": -25.698535919189453, "global_step": 323507, "epoch": 3897} {"train_loss": -25.645111083984375, "global_step": 323508, "epoch": 3897} {"train_loss": -25.71978187561035, "global_step": 323509, "epoch": 3897} {"train_loss": -26.156625747680664, "global_step": 323510, "epoch": 3897} {"train_loss": -26.063459396362305, "global_step": 323511, "epoch": 3897} {"train_loss": -26.21380615234375, "global_step": 323512, "epoch": 3897} {"train_loss": -26.508941650390625, "global_step": 323513, "epoch": 3897} {"train_loss": -25.5009765625, "global_step": 323514, "epoch": 3897} {"train_loss": -25.714954376220703, "global_step": 323515, "epoch": 3897} {"train_loss": -25.680856704711914, "global_step": 323516, "epoch": 3897} {"train_loss": -25.28607749938965, "global_step": 323517, "epoch": 3897} {"train_loss": -26.16187858581543, "global_step": 323518, "epoch": 3897} {"train_loss": -25.46894645690918, "global_step": 323519, "epoch": 3897} {"train_loss": -25.65395164489746, "global_step": 323520, "epoch": 3897} {"train_loss": -25.7108097076416, "global_step": 323521, "epoch": 3897} {"train_loss": -25.848379135131836, "global_step": 323522, "epoch": 3897} {"train_loss": -25.649023056030273, "global_step": 323523, "epoch": 3897} {"train_loss": -25.71185302734375, "global_step": 323524, "epoch": 3897} {"train_loss": -26.252826690673828, "global_step": 323525, "epoch": 3897} {"train_loss": -26.07569694519043, "global_step": 323526, "epoch": 3897} {"train_loss": -25.35799217224121, "global_step": 323527, "epoch": 3897} {"train_loss": -25.900217056274414, "global_step": 323528, "epoch": 3897} {"train_loss": -25.791982650756836, "global_step": 323529, "epoch": 3897} {"train_loss": -25.734411239624023, "global_step": 323530, "epoch": 3897} {"train_loss": -25.9453067779541, "global_step": 323531, "epoch": 3897} {"train_loss": -25.97125244140625, "global_step": 323532, "epoch": 3897} {"train_loss": -25.814118465745306, "global_step": 323533, "epoch": 3897, "val_loss": 7131739.5} {"train_loss": -25.834409713745117, "global_step": 323534, "epoch": 3898} {"train_loss": -25.308544158935547, "global_step": 323535, "epoch": 3898} {"train_loss": -25.330589294433594, "global_step": 323536, "epoch": 3898} {"train_loss": -24.707263946533203, "global_step": 323537, "epoch": 3898} {"train_loss": -24.53816032409668, "global_step": 323538, "epoch": 3898} {"train_loss": -25.051591873168945, "global_step": 323539, "epoch": 3898} {"train_loss": -24.70760154724121, "global_step": 323540, "epoch": 3898} {"train_loss": -24.89057731628418, "global_step": 323541, "epoch": 3898} {"train_loss": -25.404722213745117, "global_step": 323542, "epoch": 3898} {"train_loss": -25.01897621154785, "global_step": 323543, "epoch": 3898} {"train_loss": -25.534696578979492, "global_step": 323544, "epoch": 3898} {"train_loss": -25.16734504699707, "global_step": 323545, "epoch": 3898} {"train_loss": -25.806344985961914, "global_step": 323546, "epoch": 3898} {"train_loss": -25.42295265197754, "global_step": 323547, "epoch": 3898} {"train_loss": -25.148479461669922, "global_step": 323548, "epoch": 3898} {"train_loss": -25.364959716796875, "global_step": 323549, "epoch": 3898} {"train_loss": -25.777286529541016, "global_step": 323550, "epoch": 3898} {"train_loss": -25.366504669189453, "global_step": 323551, "epoch": 3898} {"train_loss": -25.409509658813477, "global_step": 323552, "epoch": 3898} {"train_loss": -25.574661254882812, "global_step": 323553, "epoch": 3898} {"train_loss": -25.41837501525879, "global_step": 323554, "epoch": 3898} {"train_loss": -25.683826446533203, "global_step": 323555, "epoch": 3898} {"train_loss": -25.897993087768555, "global_step": 323556, "epoch": 3898} {"train_loss": -25.553194046020508, "global_step": 323557, "epoch": 3898} {"train_loss": -25.914825439453125, "global_step": 323558, "epoch": 3898} {"train_loss": -25.864093780517578, "global_step": 323559, "epoch": 3898} {"train_loss": -25.625913619995117, "global_step": 323560, "epoch": 3898} {"train_loss": -25.29791831970215, "global_step": 323561, "epoch": 3898} {"train_loss": -25.633634567260742, "global_step": 323562, "epoch": 3898} {"train_loss": -25.86077308654785, "global_step": 323563, "epoch": 3898} {"train_loss": -25.884275436401367, "global_step": 323564, "epoch": 3898} {"train_loss": -25.917224884033203, "global_step": 323565, "epoch": 3898} {"train_loss": -25.992887496948242, "global_step": 323566, "epoch": 3898} {"train_loss": -25.79192543029785, "global_step": 323567, "epoch": 3898} {"train_loss": -25.94113540649414, "global_step": 323568, "epoch": 3898} {"train_loss": -26.112634658813477, "global_step": 323569, "epoch": 3898} {"train_loss": -25.46638298034668, "global_step": 323570, "epoch": 3898} {"train_loss": -25.926055908203125, "global_step": 323571, "epoch": 3898} {"train_loss": -25.926971435546875, "global_step": 323572, "epoch": 3898} {"train_loss": -26.180707931518555, "global_step": 323573, "epoch": 3898} {"train_loss": -25.919818878173828, "global_step": 323574, "epoch": 3898} {"train_loss": -25.668750762939453, "global_step": 323575, "epoch": 3898} {"train_loss": -25.79877281188965, "global_step": 323576, "epoch": 3898} {"train_loss": -26.042448043823242, "global_step": 323577, "epoch": 3898} {"train_loss": -25.9213924407959, "global_step": 323578, "epoch": 3898} {"train_loss": -26.04517936706543, "global_step": 323579, "epoch": 3898} {"train_loss": -25.925678253173828, "global_step": 323580, "epoch": 3898} {"train_loss": -25.740467071533203, "global_step": 323581, "epoch": 3898} {"train_loss": -25.8065128326416, "global_step": 323582, "epoch": 3898} {"train_loss": -25.736066818237305, "global_step": 323583, "epoch": 3898} {"train_loss": -25.860538482666016, "global_step": 323584, "epoch": 3898} {"train_loss": -25.56077766418457, "global_step": 323585, "epoch": 3898} {"train_loss": -25.936288833618164, "global_step": 323586, "epoch": 3898} {"train_loss": -25.534948348999023, "global_step": 323587, "epoch": 3898} {"train_loss": -25.72163200378418, "global_step": 323588, "epoch": 3898} {"train_loss": -25.90315818786621, "global_step": 323589, "epoch": 3898} {"train_loss": -26.07114028930664, "global_step": 323590, "epoch": 3898} {"train_loss": -25.602262496948242, "global_step": 323591, "epoch": 3898} {"train_loss": -25.62627601623535, "global_step": 323592, "epoch": 3898} {"train_loss": -25.82806396484375, "global_step": 323593, "epoch": 3898} {"train_loss": -25.743101119995117, "global_step": 323594, "epoch": 3898} {"train_loss": -25.83253288269043, "global_step": 323595, "epoch": 3898} {"train_loss": -25.896711349487305, "global_step": 323596, "epoch": 3898} {"train_loss": -26.036603927612305, "global_step": 323597, "epoch": 3898} {"train_loss": -26.065404891967773, "global_step": 323598, "epoch": 3898} {"train_loss": -25.996265411376953, "global_step": 323599, "epoch": 3898} {"train_loss": -25.993505477905273, "global_step": 323600, "epoch": 3898} {"train_loss": -25.960668563842773, "global_step": 323601, "epoch": 3898} {"train_loss": -25.794355392456055, "global_step": 323602, "epoch": 3898} {"train_loss": -25.61724281311035, "global_step": 323603, "epoch": 3898} {"train_loss": -26.109848022460938, "global_step": 323604, "epoch": 3898} {"train_loss": -25.921478271484375, "global_step": 323605, "epoch": 3898} {"train_loss": -26.414621353149414, "global_step": 323606, "epoch": 3898} {"train_loss": -25.714324951171875, "global_step": 323607, "epoch": 3898} {"train_loss": -26.46044921875, "global_step": 323608, "epoch": 3898} {"train_loss": -26.271081924438477, "global_step": 323609, "epoch": 3898} {"train_loss": -26.194910049438477, "global_step": 323610, "epoch": 3898} {"train_loss": -26.089679718017578, "global_step": 323611, "epoch": 3898} {"train_loss": -26.11543083190918, "global_step": 323612, "epoch": 3898} {"train_loss": -25.6466121673584, "global_step": 323613, "epoch": 3898} {"train_loss": -25.813135147094727, "global_step": 323614, "epoch": 3898} {"train_loss": -25.839651107788086, "global_step": 323615, "epoch": 3898} {"train_loss": -25.73087363645255, "global_step": 323616, "epoch": 3898, "val_loss": 7235690.0} {"train_loss": -25.1657772064209, "global_step": 323617, "epoch": 3899} {"train_loss": -25.406326293945312, "global_step": 323618, "epoch": 3899} {"train_loss": -25.46201515197754, "global_step": 323619, "epoch": 3899} {"train_loss": -25.883848190307617, "global_step": 323620, "epoch": 3899} {"train_loss": -24.956674575805664, "global_step": 323621, "epoch": 3899} {"train_loss": -25.172260284423828, "global_step": 323622, "epoch": 3899} {"train_loss": -25.9815616607666, "global_step": 323623, "epoch": 3899} {"train_loss": -25.012897491455078, "global_step": 323624, "epoch": 3899} {"train_loss": -25.788373947143555, "global_step": 323625, "epoch": 3899} {"train_loss": -25.827075958251953, "global_step": 323626, "epoch": 3899} {"train_loss": -25.46319580078125, "global_step": 323627, "epoch": 3899} {"train_loss": -25.687650680541992, "global_step": 323628, "epoch": 3899} {"train_loss": -25.89950942993164, "global_step": 323629, "epoch": 3899} {"train_loss": -25.804248809814453, "global_step": 323630, "epoch": 3899} {"train_loss": -26.105295181274414, "global_step": 323631, "epoch": 3899} {"train_loss": -25.663192749023438, "global_step": 323632, "epoch": 3899} {"train_loss": -25.823572158813477, "global_step": 323633, "epoch": 3899} {"train_loss": -25.692066192626953, "global_step": 323634, "epoch": 3899} {"train_loss": -25.543161392211914, "global_step": 323635, "epoch": 3899} {"train_loss": -25.59962272644043, "global_step": 323636, "epoch": 3899} {"train_loss": -25.33700942993164, "global_step": 323637, "epoch": 3899} {"train_loss": -25.641164779663086, "global_step": 323638, "epoch": 3899} {"train_loss": -25.558856964111328, "global_step": 323639, "epoch": 3899} {"train_loss": -25.785184860229492, "global_step": 323640, "epoch": 3899} {"train_loss": -25.639867782592773, "global_step": 323641, "epoch": 3899} {"train_loss": -26.057714462280273, "global_step": 323642, "epoch": 3899} {"train_loss": -25.43562126159668, "global_step": 323643, "epoch": 3899} {"train_loss": -25.596776962280273, "global_step": 323644, "epoch": 3899} {"train_loss": -26.070770263671875, "global_step": 323645, "epoch": 3899} {"train_loss": -25.707763671875, "global_step": 323646, "epoch": 3899} {"train_loss": -25.770963668823242, "global_step": 323647, "epoch": 3899} {"train_loss": -25.827550888061523, "global_step": 323648, "epoch": 3899} {"train_loss": -25.935422897338867, "global_step": 323649, "epoch": 3899} {"train_loss": -26.042755126953125, "global_step": 323650, "epoch": 3899} {"train_loss": -26.38016700744629, "global_step": 323651, "epoch": 3899} {"train_loss": -26.29517936706543, "global_step": 323652, "epoch": 3899} {"train_loss": -25.965429306030273, "global_step": 323653, "epoch": 3899} {"train_loss": -25.83660888671875, "global_step": 323654, "epoch": 3899} {"train_loss": -25.725311279296875, "global_step": 323655, "epoch": 3899} {"train_loss": -25.915220260620117, "global_step": 323656, "epoch": 3899} {"train_loss": -25.95122718811035, "global_step": 323657, "epoch": 3899} {"train_loss": -26.37686538696289, "global_step": 323658, "epoch": 3899} {"train_loss": -25.933307647705078, "global_step": 323659, "epoch": 3899} {"train_loss": -25.832910537719727, "global_step": 323660, "epoch": 3899} {"train_loss": -25.719501495361328, "global_step": 323661, "epoch": 3899} {"train_loss": -25.815210342407227, "global_step": 323662, "epoch": 3899} {"train_loss": -25.779218673706055, "global_step": 323663, "epoch": 3899} {"train_loss": -25.980121612548828, "global_step": 323664, "epoch": 3899} {"train_loss": -25.715381622314453, "global_step": 323665, "epoch": 3899} {"train_loss": -25.700851440429688, "global_step": 323666, "epoch": 3899} {"train_loss": -25.76454734802246, "global_step": 323667, "epoch": 3899} {"train_loss": -25.97755241394043, "global_step": 323668, "epoch": 3899} {"train_loss": -26.21563720703125, "global_step": 323669, "epoch": 3899} {"train_loss": -25.925296783447266, "global_step": 323670, "epoch": 3899} {"train_loss": -26.162073135375977, "global_step": 323671, "epoch": 3899} {"train_loss": -26.0673885345459, "global_step": 323672, "epoch": 3899} {"train_loss": -25.552419662475586, "global_step": 323673, "epoch": 3899} {"train_loss": -25.46278190612793, "global_step": 323674, "epoch": 3899} {"train_loss": -26.085901260375977, "global_step": 323675, "epoch": 3899} {"train_loss": -25.672592163085938, "global_step": 323676, "epoch": 3899} {"train_loss": -25.744504928588867, "global_step": 323677, "epoch": 3899} {"train_loss": -26.11075210571289, "global_step": 323678, "epoch": 3899} {"train_loss": -25.955228805541992, "global_step": 323679, "epoch": 3899} {"train_loss": -25.922719955444336, "global_step": 323680, "epoch": 3899} {"train_loss": -25.904132843017578, "global_step": 323681, "epoch": 3899} {"train_loss": -25.975004196166992, "global_step": 323682, "epoch": 3899} {"train_loss": -25.73383903503418, "global_step": 323683, "epoch": 3899} {"train_loss": -26.013288497924805, "global_step": 323684, "epoch": 3899} {"train_loss": -26.233997344970703, "global_step": 323685, "epoch": 3899} {"train_loss": -25.921070098876953, "global_step": 323686, "epoch": 3899} {"train_loss": -26.04705238342285, "global_step": 323687, "epoch": 3899} {"train_loss": -26.037220001220703, "global_step": 323688, "epoch": 3899} {"train_loss": -25.807682037353516, "global_step": 323689, "epoch": 3899} {"train_loss": -25.815961837768555, "global_step": 323690, "epoch": 3899} {"train_loss": -25.891809463500977, "global_step": 323691, "epoch": 3899} {"train_loss": -25.880685806274414, "global_step": 323692, "epoch": 3899} {"train_loss": -25.99509048461914, "global_step": 323693, "epoch": 3899} {"train_loss": -26.03731346130371, "global_step": 323694, "epoch": 3899} {"train_loss": -26.17348289489746, "global_step": 323695, "epoch": 3899} {"train_loss": -25.885208129882812, "global_step": 323696, "epoch": 3899} {"train_loss": -26.01190185546875, "global_step": 323697, "epoch": 3899} {"train_loss": -25.920032501220703, "global_step": 323698, "epoch": 3899} {"train_loss": -25.81734029930758, "global_step": 323699, "epoch": 3899, "val_loss": 7155078.0} {"train_loss": -25.35333824157715, "global_step": 323700, "epoch": 3900} {"train_loss": -25.64875602722168, "global_step": 323701, "epoch": 3900} {"train_loss": -25.274446487426758, "global_step": 323702, "epoch": 3900} {"train_loss": -25.06601905822754, "global_step": 323703, "epoch": 3900} {"train_loss": -24.913949966430664, "global_step": 323704, "epoch": 3900} {"train_loss": -25.57327651977539, "global_step": 323705, "epoch": 3900} {"train_loss": -25.488693237304688, "global_step": 323706, "epoch": 3900} {"train_loss": -25.369091033935547, "global_step": 323707, "epoch": 3900} {"train_loss": -25.500242233276367, "global_step": 323708, "epoch": 3900} {"train_loss": -25.508188247680664, "global_step": 323709, "epoch": 3900} {"train_loss": -25.32575225830078, "global_step": 323710, "epoch": 3900} {"train_loss": -25.528120040893555, "global_step": 323711, "epoch": 3900} {"train_loss": -25.26167869567871, "global_step": 323712, "epoch": 3900} {"train_loss": -25.758014678955078, "global_step": 323713, "epoch": 3900} {"train_loss": -25.815357208251953, "global_step": 323714, "epoch": 3900} {"train_loss": -25.53444480895996, "global_step": 323715, "epoch": 3900} {"train_loss": -25.67203140258789, "global_step": 323716, "epoch": 3900} {"train_loss": -25.572053909301758, "global_step": 323717, "epoch": 3900} {"train_loss": -25.763647079467773, "global_step": 323718, "epoch": 3900} {"train_loss": -25.773740768432617, "global_step": 323719, "epoch": 3900} {"train_loss": -25.84049415588379, "global_step": 323720, "epoch": 3900} {"train_loss": -25.722064971923828, "global_step": 323721, "epoch": 3900} {"train_loss": -25.792957305908203, "global_step": 323722, "epoch": 3900} {"train_loss": -25.805173873901367, "global_step": 323723, "epoch": 3900} {"train_loss": -26.203527450561523, "global_step": 323724, "epoch": 3900} {"train_loss": -26.274845123291016, "global_step": 323725, "epoch": 3900} {"train_loss": -26.190576553344727, "global_step": 323726, "epoch": 3900} {"train_loss": -25.92774772644043, "global_step": 323727, "epoch": 3900} {"train_loss": -25.910337448120117, "global_step": 323728, "epoch": 3900} {"train_loss": -25.98396110534668, "global_step": 323729, "epoch": 3900} {"train_loss": -25.902830123901367, "global_step": 323730, "epoch": 3900} {"train_loss": -25.979650497436523, "global_step": 323731, "epoch": 3900} {"train_loss": -26.02799415588379, "global_step": 323732, "epoch": 3900} {"train_loss": -25.866483688354492, "global_step": 323733, "epoch": 3900} {"train_loss": -25.718774795532227, "global_step": 323734, "epoch": 3900} {"train_loss": -25.97794532775879, "global_step": 323735, "epoch": 3900} {"train_loss": -26.167682647705078, "global_step": 323736, "epoch": 3900} {"train_loss": -25.811355590820312, "global_step": 323737, "epoch": 3900} {"train_loss": -25.92522621154785, "global_step": 323738, "epoch": 3900} {"train_loss": -26.233396530151367, "global_step": 323739, "epoch": 3900} {"train_loss": -25.864667892456055, "global_step": 323740, "epoch": 3900} {"train_loss": -26.20173454284668, "global_step": 323741, "epoch": 3900} {"train_loss": -25.706546783447266, "global_step": 323742, "epoch": 3900} {"train_loss": -26.02178382873535, "global_step": 323743, "epoch": 3900} {"train_loss": -25.686630249023438, "global_step": 323744, "epoch": 3900} {"train_loss": -25.83978843688965, "global_step": 323745, "epoch": 3900} {"train_loss": -26.129501342773438, "global_step": 323746, "epoch": 3900} {"train_loss": -26.25409507751465, "global_step": 323747, "epoch": 3900} {"train_loss": -25.849811553955078, "global_step": 323748, "epoch": 3900} {"train_loss": -26.03717041015625, "global_step": 323749, "epoch": 3900} {"train_loss": -25.8411865234375, "global_step": 323750, "epoch": 3900} {"train_loss": -25.458724975585938, "global_step": 323751, "epoch": 3900} {"train_loss": -25.728504180908203, "global_step": 323752, "epoch": 3900} {"train_loss": -25.594675064086914, "global_step": 323753, "epoch": 3900} {"train_loss": -25.855121612548828, "global_step": 323754, "epoch": 3900} {"train_loss": -25.823883056640625, "global_step": 323755, "epoch": 3900} {"train_loss": -25.769460678100586, "global_step": 323756, "epoch": 3900} {"train_loss": -26.0787353515625, "global_step": 323757, "epoch": 3900} {"train_loss": -25.667776107788086, "global_step": 323758, "epoch": 3900} {"train_loss": -25.759952545166016, "global_step": 323759, "epoch": 3900} {"train_loss": -25.526273727416992, "global_step": 323760, "epoch": 3900} {"train_loss": -25.83984375, "global_step": 323761, "epoch": 3900} {"train_loss": -26.028100967407227, "global_step": 323762, "epoch": 3900} {"train_loss": -25.521533966064453, "global_step": 323763, "epoch": 3900} {"train_loss": -26.017292022705078, "global_step": 323764, "epoch": 3900} {"train_loss": -25.89576530456543, "global_step": 323765, "epoch": 3900} {"train_loss": -25.694238662719727, "global_step": 323766, "epoch": 3900} {"train_loss": -25.916915893554688, "global_step": 323767, "epoch": 3900} {"train_loss": -25.67669677734375, "global_step": 323768, "epoch": 3900} {"train_loss": -25.592716217041016, "global_step": 323769, "epoch": 3900} {"train_loss": -26.026615142822266, "global_step": 323770, "epoch": 3900} {"train_loss": -26.033554077148438, "global_step": 323771, "epoch": 3900} {"train_loss": -25.66242790222168, "global_step": 323772, "epoch": 3900} {"train_loss": -26.125646591186523, "global_step": 323773, "epoch": 3900} {"train_loss": -25.92767906188965, "global_step": 323774, "epoch": 3900} {"train_loss": -25.527942657470703, "global_step": 323775, "epoch": 3900} {"train_loss": -25.98701286315918, "global_step": 323776, "epoch": 3900} {"train_loss": -26.03950309753418, "global_step": 323777, "epoch": 3900} {"train_loss": -25.514944076538086, "global_step": 323778, "epoch": 3900} {"train_loss": -25.811269760131836, "global_step": 323779, "epoch": 3900} {"train_loss": -26.034284591674805, "global_step": 323780, "epoch": 3900} {"train_loss": -25.58775520324707, "global_step": 323781, "epoch": 3900} {"train_loss": -25.776511272752142, "global_step": 323782, "epoch": 3900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 7167649.0} {"train_loss": -24.895511627197266, "global_step": 323783, "epoch": 3901} {"train_loss": -25.288013458251953, "global_step": 323784, "epoch": 3901} {"train_loss": -25.68910789489746, "global_step": 323785, "epoch": 3901} {"train_loss": -25.120161056518555, "global_step": 323786, "epoch": 3901} {"train_loss": -25.675573348999023, "global_step": 323787, "epoch": 3901} {"train_loss": -25.097822189331055, "global_step": 323788, "epoch": 3901} {"train_loss": -25.32051658630371, "global_step": 323789, "epoch": 3901} {"train_loss": -25.565515518188477, "global_step": 323790, "epoch": 3901} {"train_loss": -25.586408615112305, "global_step": 323791, "epoch": 3901} {"train_loss": -25.251157760620117, "global_step": 323792, "epoch": 3901} {"train_loss": -25.620380401611328, "global_step": 323793, "epoch": 3901} {"train_loss": -25.040571212768555, "global_step": 323794, "epoch": 3901} {"train_loss": -25.555421829223633, "global_step": 323795, "epoch": 3901} {"train_loss": -25.5006160736084, "global_step": 323796, "epoch": 3901} {"train_loss": -25.417577743530273, "global_step": 323797, "epoch": 3901} {"train_loss": -25.70536231994629, "global_step": 323798, "epoch": 3901} {"train_loss": -26.183141708374023, "global_step": 323799, "epoch": 3901} {"train_loss": -25.70548439025879, "global_step": 323800, "epoch": 3901} {"train_loss": -25.346765518188477, "global_step": 323801, "epoch": 3901} {"train_loss": -25.72940444946289, "global_step": 323802, "epoch": 3901} {"train_loss": -25.88838768005371, "global_step": 323803, "epoch": 3901} {"train_loss": -25.610639572143555, "global_step": 323804, "epoch": 3901} {"train_loss": -25.618284225463867, "global_step": 323805, "epoch": 3901} {"train_loss": -25.939865112304688, "global_step": 323806, "epoch": 3901} {"train_loss": -25.9636287689209, "global_step": 323807, "epoch": 3901} {"train_loss": -25.7372989654541, "global_step": 323808, "epoch": 3901} {"train_loss": -26.109344482421875, "global_step": 323809, "epoch": 3901} {"train_loss": -25.6917667388916, "global_step": 323810, "epoch": 3901} {"train_loss": -25.892385482788086, "global_step": 323811, "epoch": 3901} {"train_loss": -25.895538330078125, "global_step": 323812, "epoch": 3901} {"train_loss": -25.93305778503418, "global_step": 323813, "epoch": 3901} {"train_loss": -26.05810546875, "global_step": 323814, "epoch": 3901} {"train_loss": -25.94178581237793, "global_step": 323815, "epoch": 3901} {"train_loss": -25.84946632385254, "global_step": 323816, "epoch": 3901} {"train_loss": -25.815820693969727, "global_step": 323817, "epoch": 3901} {"train_loss": -25.676654815673828, "global_step": 323818, "epoch": 3901} {"train_loss": -26.2370548248291, "global_step": 323819, "epoch": 3901} {"train_loss": -26.33098793029785, "global_step": 323820, "epoch": 3901} {"train_loss": -25.921527862548828, "global_step": 323821, "epoch": 3901} {"train_loss": -26.05303382873535, "global_step": 323822, "epoch": 3901} {"train_loss": -26.069299697875977, "global_step": 323823, "epoch": 3901} {"train_loss": -25.981740951538086, "global_step": 323824, "epoch": 3901} {"train_loss": -26.204870223999023, "global_step": 323825, "epoch": 3901} {"train_loss": -26.046064376831055, "global_step": 323826, "epoch": 3901} {"train_loss": -26.03407096862793, "global_step": 323827, "epoch": 3901} {"train_loss": -26.147735595703125, "global_step": 323828, "epoch": 3901} {"train_loss": -25.695627212524414, "global_step": 323829, "epoch": 3901} {"train_loss": -25.987546920776367, "global_step": 323830, "epoch": 3901} {"train_loss": -25.65433692932129, "global_step": 323831, "epoch": 3901} {"train_loss": -25.5965576171875, "global_step": 323832, "epoch": 3901} {"train_loss": -25.757001876831055, "global_step": 323833, "epoch": 3901} {"train_loss": -25.43613624572754, "global_step": 323834, "epoch": 3901} {"train_loss": -24.844985961914062, "global_step": 323835, "epoch": 3901} {"train_loss": -24.74520492553711, "global_step": 323836, "epoch": 3901} {"train_loss": -25.31288719177246, "global_step": 323837, "epoch": 3901} {"train_loss": -25.80120849609375, "global_step": 323838, "epoch": 3901} {"train_loss": -25.40122413635254, "global_step": 323839, "epoch": 3901} {"train_loss": -25.123733520507812, "global_step": 323840, "epoch": 3901} {"train_loss": -25.53797149658203, "global_step": 323841, "epoch": 3901} {"train_loss": -25.454565048217773, "global_step": 323842, "epoch": 3901} {"train_loss": -25.25408363342285, "global_step": 323843, "epoch": 3901} {"train_loss": -25.707223892211914, "global_step": 323844, "epoch": 3901} {"train_loss": -25.602462768554688, "global_step": 323845, "epoch": 3901} {"train_loss": -25.533781051635742, "global_step": 323846, "epoch": 3901} {"train_loss": -25.8193416595459, "global_step": 323847, "epoch": 3901} {"train_loss": -25.716266632080078, "global_step": 323848, "epoch": 3901} {"train_loss": -26.043359756469727, "global_step": 323849, "epoch": 3901} {"train_loss": -25.27477264404297, "global_step": 323850, "epoch": 3901} {"train_loss": -25.74346351623535, "global_step": 323851, "epoch": 3901} {"train_loss": -25.22968101501465, "global_step": 323852, "epoch": 3901} {"train_loss": -25.641437530517578, "global_step": 323853, "epoch": 3901} {"train_loss": -25.536304473876953, "global_step": 323854, "epoch": 3901} {"train_loss": -25.791486740112305, "global_step": 323855, "epoch": 3901} {"train_loss": -25.7861270904541, "global_step": 323856, "epoch": 3901} {"train_loss": -25.5852108001709, "global_step": 323857, "epoch": 3901} {"train_loss": -25.449899673461914, "global_step": 323858, "epoch": 3901} {"train_loss": -25.759872436523438, "global_step": 323859, "epoch": 3901} {"train_loss": -25.852985382080078, "global_step": 323860, "epoch": 3901} {"train_loss": -25.44498634338379, "global_step": 323861, "epoch": 3901} {"train_loss": -25.981250762939453, "global_step": 323862, "epoch": 3901} {"train_loss": -25.864709854125977, "global_step": 323863, "epoch": 3901} {"train_loss": -25.985095977783203, "global_step": 323864, "epoch": 3901} {"train_loss": -25.668143123029225, "global_step": 323865, "epoch": 3901, "val_loss": 7223330.0} {"train_loss": -25.099748611450195, "global_step": 323866, "epoch": 3902} {"train_loss": -25.881336212158203, "global_step": 323867, "epoch": 3902} {"train_loss": -25.60271644592285, "global_step": 323868, "epoch": 3902} {"train_loss": -25.01358985900879, "global_step": 323869, "epoch": 3902} {"train_loss": -25.8172550201416, "global_step": 323870, "epoch": 3902} {"train_loss": -25.300676345825195, "global_step": 323871, "epoch": 3902} {"train_loss": -25.448110580444336, "global_step": 323872, "epoch": 3902} {"train_loss": -25.638402938842773, "global_step": 323873, "epoch": 3902} {"train_loss": -25.238555908203125, "global_step": 323874, "epoch": 3902} {"train_loss": -25.560148239135742, "global_step": 323875, "epoch": 3902} {"train_loss": -25.521757125854492, "global_step": 323876, "epoch": 3902} {"train_loss": -25.912342071533203, "global_step": 323877, "epoch": 3902} {"train_loss": -25.44643783569336, "global_step": 323878, "epoch": 3902} {"train_loss": -25.480329513549805, "global_step": 323879, "epoch": 3902} {"train_loss": -25.944299697875977, "global_step": 323880, "epoch": 3902} {"train_loss": -25.430173873901367, "global_step": 323881, "epoch": 3902} {"train_loss": -25.7929744720459, "global_step": 323882, "epoch": 3902} {"train_loss": -25.499713897705078, "global_step": 323883, "epoch": 3902} {"train_loss": -25.921310424804688, "global_step": 323884, "epoch": 3902} {"train_loss": -25.222320556640625, "global_step": 323885, "epoch": 3902} {"train_loss": -25.924467086791992, "global_step": 323886, "epoch": 3902} {"train_loss": -25.906967163085938, "global_step": 323887, "epoch": 3902} {"train_loss": -26.0125675201416, "global_step": 323888, "epoch": 3902} {"train_loss": -25.725366592407227, "global_step": 323889, "epoch": 3902} {"train_loss": -26.023624420166016, "global_step": 323890, "epoch": 3902} {"train_loss": -25.851043701171875, "global_step": 323891, "epoch": 3902} {"train_loss": -25.99444007873535, "global_step": 323892, "epoch": 3902} {"train_loss": -26.341064453125, "global_step": 323893, "epoch": 3902} {"train_loss": -25.595199584960938, "global_step": 323894, "epoch": 3902} {"train_loss": -25.75263786315918, "global_step": 323895, "epoch": 3902} {"train_loss": -25.488832473754883, "global_step": 323896, "epoch": 3902} {"train_loss": -26.157257080078125, "global_step": 323897, "epoch": 3902} {"train_loss": -26.04931640625, "global_step": 323898, "epoch": 3902} {"train_loss": -26.171966552734375, "global_step": 323899, "epoch": 3902} {"train_loss": -25.8170166015625, "global_step": 323900, "epoch": 3902} {"train_loss": -26.011999130249023, "global_step": 323901, "epoch": 3902} {"train_loss": -25.873319625854492, "global_step": 323902, "epoch": 3902} {"train_loss": -26.237279891967773, "global_step": 323903, "epoch": 3902} {"train_loss": -25.935693740844727, "global_step": 323904, "epoch": 3902} {"train_loss": -26.28890037536621, "global_step": 323905, "epoch": 3902} {"train_loss": -25.976537704467773, "global_step": 323906, "epoch": 3902} {"train_loss": -26.154531478881836, "global_step": 323907, "epoch": 3902} {"train_loss": -26.08733558654785, "global_step": 323908, "epoch": 3902} {"train_loss": -25.9160099029541, "global_step": 323909, "epoch": 3902} {"train_loss": -26.12322425842285, "global_step": 323910, "epoch": 3902} {"train_loss": -25.951887130737305, "global_step": 323911, "epoch": 3902} {"train_loss": -25.856245040893555, "global_step": 323912, "epoch": 3902} {"train_loss": -25.87776756286621, "global_step": 323913, "epoch": 3902} {"train_loss": -25.90935707092285, "global_step": 323914, "epoch": 3902} {"train_loss": -25.921899795532227, "global_step": 323915, "epoch": 3902} {"train_loss": -26.300565719604492, "global_step": 323916, "epoch": 3902} {"train_loss": -26.020490646362305, "global_step": 323917, "epoch": 3902} {"train_loss": -26.34840202331543, "global_step": 323918, "epoch": 3902} {"train_loss": -25.562789916992188, "global_step": 323919, "epoch": 3902} {"train_loss": -25.81007957458496, "global_step": 323920, "epoch": 3902} {"train_loss": -25.956375122070312, "global_step": 323921, "epoch": 3902} {"train_loss": -26.18792152404785, "global_step": 323922, "epoch": 3902} {"train_loss": -26.091175079345703, "global_step": 323923, "epoch": 3902} {"train_loss": -25.838455200195312, "global_step": 323924, "epoch": 3902} {"train_loss": -26.253498077392578, "global_step": 323925, "epoch": 3902} {"train_loss": -25.654874801635742, "global_step": 323926, "epoch": 3902} {"train_loss": -26.011377334594727, "global_step": 323927, "epoch": 3902} {"train_loss": -25.933364868164062, "global_step": 323928, "epoch": 3902} {"train_loss": -25.76850700378418, "global_step": 323929, "epoch": 3902} {"train_loss": -25.612096786499023, "global_step": 323930, "epoch": 3902} {"train_loss": -25.632116317749023, "global_step": 323931, "epoch": 3902} {"train_loss": -25.853973388671875, "global_step": 323932, "epoch": 3902} {"train_loss": -26.091827392578125, "global_step": 323933, "epoch": 3902} {"train_loss": -25.526472091674805, "global_step": 323934, "epoch": 3902} {"train_loss": -25.60333251953125, "global_step": 323935, "epoch": 3902} {"train_loss": -26.0972900390625, "global_step": 323936, "epoch": 3902} {"train_loss": -25.898603439331055, "global_step": 323937, "epoch": 3902} {"train_loss": -25.94843101501465, "global_step": 323938, "epoch": 3902} {"train_loss": -26.040058135986328, "global_step": 323939, "epoch": 3902} {"train_loss": -25.548995971679688, "global_step": 323940, "epoch": 3902} {"train_loss": -25.973712921142578, "global_step": 323941, "epoch": 3902} {"train_loss": -26.275787353515625, "global_step": 323942, "epoch": 3902} {"train_loss": -25.740278244018555, "global_step": 323943, "epoch": 3902} {"train_loss": -25.84882164001465, "global_step": 323944, "epoch": 3902} {"train_loss": -25.720205307006836, "global_step": 323945, "epoch": 3902} {"train_loss": -25.936527252197266, "global_step": 323946, "epoch": 3902} {"train_loss": -25.69898796081543, "global_step": 323947, "epoch": 3902} {"train_loss": -25.824159415371447, "global_step": 323948, "epoch": 3902, "val_loss": 7217506.5} {"train_loss": -25.531469345092773, "global_step": 323949, "epoch": 3903} {"train_loss": -25.065046310424805, "global_step": 323950, "epoch": 3903} {"train_loss": -24.475263595581055, "global_step": 323951, "epoch": 3903} {"train_loss": -24.8343448638916, "global_step": 323952, "epoch": 3903} {"train_loss": -25.299306869506836, "global_step": 323953, "epoch": 3903} {"train_loss": -24.747961044311523, "global_step": 323954, "epoch": 3903} {"train_loss": -25.257776260375977, "global_step": 323955, "epoch": 3903} {"train_loss": -25.339574813842773, "global_step": 323956, "epoch": 3903} {"train_loss": -25.61610984802246, "global_step": 323957, "epoch": 3903} {"train_loss": -25.50950050354004, "global_step": 323958, "epoch": 3903} {"train_loss": -25.602460861206055, "global_step": 323959, "epoch": 3903} {"train_loss": -25.70017433166504, "global_step": 323960, "epoch": 3903} {"train_loss": -25.545536041259766, "global_step": 323961, "epoch": 3903} {"train_loss": -25.178640365600586, "global_step": 323962, "epoch": 3903} {"train_loss": -25.482162475585938, "global_step": 323963, "epoch": 3903} {"train_loss": -25.273147583007812, "global_step": 323964, "epoch": 3903} {"train_loss": -25.143423080444336, "global_step": 323965, "epoch": 3903} {"train_loss": -25.55238151550293, "global_step": 323966, "epoch": 3903} {"train_loss": -25.582265853881836, "global_step": 323967, "epoch": 3903} {"train_loss": -25.340391159057617, "global_step": 323968, "epoch": 3903} {"train_loss": -25.99843406677246, "global_step": 323969, "epoch": 3903} {"train_loss": -25.699853897094727, "global_step": 323970, "epoch": 3903} {"train_loss": -25.6312198638916, "global_step": 323971, "epoch": 3903} {"train_loss": -25.840606689453125, "global_step": 323972, "epoch": 3903} {"train_loss": -25.928241729736328, "global_step": 323973, "epoch": 3903} {"train_loss": -25.756296157836914, "global_step": 323974, "epoch": 3903} {"train_loss": -25.96856689453125, "global_step": 323975, "epoch": 3903} {"train_loss": -25.656187057495117, "global_step": 323976, "epoch": 3903} {"train_loss": -25.733301162719727, "global_step": 323977, "epoch": 3903} {"train_loss": -25.606342315673828, "global_step": 323978, "epoch": 3903} {"train_loss": -25.967147827148438, "global_step": 323979, "epoch": 3903} {"train_loss": -25.749759674072266, "global_step": 323980, "epoch": 3903} {"train_loss": -25.7125244140625, "global_step": 323981, "epoch": 3903} {"train_loss": -26.174612045288086, "global_step": 323982, "epoch": 3903} {"train_loss": -25.932950973510742, "global_step": 323983, "epoch": 3903} {"train_loss": -26.233707427978516, "global_step": 323984, "epoch": 3903} {"train_loss": -26.19501304626465, "global_step": 323985, "epoch": 3903} {"train_loss": -26.29241371154785, "global_step": 323986, "epoch": 3903} {"train_loss": -25.96282958984375, "global_step": 323987, "epoch": 3903} {"train_loss": -25.74994468688965, "global_step": 323988, "epoch": 3903} {"train_loss": -25.830734252929688, "global_step": 323989, "epoch": 3903} {"train_loss": -25.845434188842773, "global_step": 323990, "epoch": 3903} {"train_loss": -25.711334228515625, "global_step": 323991, "epoch": 3903} {"train_loss": -26.246564865112305, "global_step": 323992, "epoch": 3903} {"train_loss": -25.798131942749023, "global_step": 323993, "epoch": 3903} {"train_loss": -26.37137794494629, "global_step": 323994, "epoch": 3903} {"train_loss": -26.019733428955078, "global_step": 323995, "epoch": 3903} {"train_loss": -25.833038330078125, "global_step": 323996, "epoch": 3903} {"train_loss": -26.110828399658203, "global_step": 323997, "epoch": 3903} {"train_loss": -26.02052116394043, "global_step": 323998, "epoch": 3903} {"train_loss": -26.013193130493164, "global_step": 323999, "epoch": 3903} {"train_loss": -25.989215850830078, "global_step": 324000, "epoch": 3903} {"train_loss": -26.080839157104492, "global_step": 324001, "epoch": 3903} {"train_loss": -25.580739974975586, "global_step": 324002, "epoch": 3903} {"train_loss": -25.85919189453125, "global_step": 324003, "epoch": 3903} {"train_loss": -25.276960372924805, "global_step": 324004, "epoch": 3903} {"train_loss": -25.71955680847168, "global_step": 324005, "epoch": 3903} {"train_loss": -26.151945114135742, "global_step": 324006, "epoch": 3903} {"train_loss": -25.922155380249023, "global_step": 324007, "epoch": 3903} {"train_loss": -25.837116241455078, "global_step": 324008, "epoch": 3903} {"train_loss": -26.250473022460938, "global_step": 324009, "epoch": 3903} {"train_loss": -25.615705490112305, "global_step": 324010, "epoch": 3903} {"train_loss": -25.891845703125, "global_step": 324011, "epoch": 3903} {"train_loss": -25.517560958862305, "global_step": 324012, "epoch": 3903} {"train_loss": -25.365354537963867, "global_step": 324013, "epoch": 3903} {"train_loss": -25.697874069213867, "global_step": 324014, "epoch": 3903} {"train_loss": -25.6981258392334, "global_step": 324015, "epoch": 3903} {"train_loss": -26.25921630859375, "global_step": 324016, "epoch": 3903} {"train_loss": -25.844892501831055, "global_step": 324017, "epoch": 3903} {"train_loss": -25.888105392456055, "global_step": 324018, "epoch": 3903} {"train_loss": -25.829797744750977, "global_step": 324019, "epoch": 3903} {"train_loss": -26.083282470703125, "global_step": 324020, "epoch": 3903} {"train_loss": -25.6607666015625, "global_step": 324021, "epoch": 3903} {"train_loss": -25.72024917602539, "global_step": 324022, "epoch": 3903} {"train_loss": -25.746389389038086, "global_step": 324023, "epoch": 3903} {"train_loss": -26.060657501220703, "global_step": 324024, "epoch": 3903} {"train_loss": -26.687482833862305, "global_step": 324025, "epoch": 3903} {"train_loss": -26.0667667388916, "global_step": 324026, "epoch": 3903} {"train_loss": -25.510156631469727, "global_step": 324027, "epoch": 3903} {"train_loss": -25.66509437561035, "global_step": 324028, "epoch": 3903} {"train_loss": -26.15388298034668, "global_step": 324029, "epoch": 3903} {"train_loss": -26.211750030517578, "global_step": 324030, "epoch": 3903} {"train_loss": -25.752838295626354, "global_step": 324031, "epoch": 3903, "val_loss": 7279419.0} {"train_loss": -25.512929916381836, "global_step": 324032, "epoch": 3904} {"train_loss": -25.865798950195312, "global_step": 324033, "epoch": 3904} {"train_loss": -25.404836654663086, "global_step": 324034, "epoch": 3904} {"train_loss": -25.374990463256836, "global_step": 324035, "epoch": 3904} {"train_loss": -25.927087783813477, "global_step": 324036, "epoch": 3904} {"train_loss": -25.4867000579834, "global_step": 324037, "epoch": 3904} {"train_loss": -25.77300453186035, "global_step": 324038, "epoch": 3904} {"train_loss": -26.253936767578125, "global_step": 324039, "epoch": 3904} {"train_loss": -25.50750732421875, "global_step": 324040, "epoch": 3904} {"train_loss": -25.668365478515625, "global_step": 324041, "epoch": 3904} {"train_loss": -25.59498405456543, "global_step": 324042, "epoch": 3904} {"train_loss": -25.681604385375977, "global_step": 324043, "epoch": 3904} {"train_loss": -25.95110511779785, "global_step": 324044, "epoch": 3904} {"train_loss": -25.881351470947266, "global_step": 324045, "epoch": 3904} {"train_loss": -25.598979949951172, "global_step": 324046, "epoch": 3904} {"train_loss": -26.009138107299805, "global_step": 324047, "epoch": 3904} {"train_loss": -25.625030517578125, "global_step": 324048, "epoch": 3904} {"train_loss": -25.909032821655273, "global_step": 324049, "epoch": 3904} {"train_loss": -25.68511962890625, "global_step": 324050, "epoch": 3904} {"train_loss": -25.9417781829834, "global_step": 324051, "epoch": 3904} {"train_loss": -25.51152229309082, "global_step": 324052, "epoch": 3904} {"train_loss": -26.181955337524414, "global_step": 324053, "epoch": 3904} {"train_loss": -25.74551773071289, "global_step": 324054, "epoch": 3904} {"train_loss": -26.24321937561035, "global_step": 324055, "epoch": 3904} {"train_loss": -26.005590438842773, "global_step": 324056, "epoch": 3904} {"train_loss": -25.884485244750977, "global_step": 324057, "epoch": 3904} {"train_loss": -25.76886558532715, "global_step": 324058, "epoch": 3904} {"train_loss": -26.13128662109375, "global_step": 324059, "epoch": 3904} {"train_loss": -25.88642692565918, "global_step": 324060, "epoch": 3904} {"train_loss": -25.9362735748291, "global_step": 324061, "epoch": 3904} {"train_loss": -26.097204208374023, "global_step": 324062, "epoch": 3904} {"train_loss": -25.945417404174805, "global_step": 324063, "epoch": 3904} {"train_loss": -26.089696884155273, "global_step": 324064, "epoch": 3904} {"train_loss": -25.46107292175293, "global_step": 324065, "epoch": 3904} {"train_loss": -26.113727569580078, "global_step": 324066, "epoch": 3904} {"train_loss": -25.802764892578125, "global_step": 324067, "epoch": 3904} {"train_loss": -26.15828514099121, "global_step": 324068, "epoch": 3904} {"train_loss": -25.719863891601562, "global_step": 324069, "epoch": 3904} {"train_loss": -25.835132598876953, "global_step": 324070, "epoch": 3904} {"train_loss": -26.041776657104492, "global_step": 324071, "epoch": 3904} {"train_loss": -26.168014526367188, "global_step": 324072, "epoch": 3904} {"train_loss": -25.98868179321289, "global_step": 324073, "epoch": 3904} {"train_loss": -26.20939064025879, "global_step": 324074, "epoch": 3904} {"train_loss": -25.971588134765625, "global_step": 324075, "epoch": 3904} {"train_loss": -25.360700607299805, "global_step": 324076, "epoch": 3904} {"train_loss": -25.20284080505371, "global_step": 324077, "epoch": 3904} {"train_loss": -25.957000732421875, "global_step": 324078, "epoch": 3904} {"train_loss": -26.08209800720215, "global_step": 324079, "epoch": 3904} {"train_loss": -26.182180404663086, "global_step": 324080, "epoch": 3904} {"train_loss": -25.826696395874023, "global_step": 324081, "epoch": 3904} {"train_loss": -25.8764591217041, "global_step": 324082, "epoch": 3904} {"train_loss": -25.770404815673828, "global_step": 324083, "epoch": 3904} {"train_loss": -26.161651611328125, "global_step": 324084, "epoch": 3904} {"train_loss": -26.055280685424805, "global_step": 324085, "epoch": 3904} {"train_loss": -25.7507266998291, "global_step": 324086, "epoch": 3904} {"train_loss": -25.919052124023438, "global_step": 324087, "epoch": 3904} {"train_loss": -26.034597396850586, "global_step": 324088, "epoch": 3904} {"train_loss": -25.880582809448242, "global_step": 324089, "epoch": 3904} {"train_loss": -25.9798583984375, "global_step": 324090, "epoch": 3904} {"train_loss": -26.165302276611328, "global_step": 324091, "epoch": 3904} {"train_loss": -26.14546012878418, "global_step": 324092, "epoch": 3904} {"train_loss": -26.03086280822754, "global_step": 324093, "epoch": 3904} {"train_loss": -25.84343910217285, "global_step": 324094, "epoch": 3904} {"train_loss": -26.039758682250977, "global_step": 324095, "epoch": 3904} {"train_loss": -26.120304107666016, "global_step": 324096, "epoch": 3904} {"train_loss": -25.953887939453125, "global_step": 324097, "epoch": 3904} {"train_loss": -25.73980140686035, "global_step": 324098, "epoch": 3904} {"train_loss": -25.74155044555664, "global_step": 324099, "epoch": 3904} {"train_loss": -25.92425537109375, "global_step": 324100, "epoch": 3904} {"train_loss": -25.805997848510742, "global_step": 324101, "epoch": 3904} {"train_loss": -25.996179580688477, "global_step": 324102, "epoch": 3904} {"train_loss": -26.009815216064453, "global_step": 324103, "epoch": 3904} {"train_loss": -25.839923858642578, "global_step": 324104, "epoch": 3904} {"train_loss": -25.765613555908203, "global_step": 324105, "epoch": 3904} {"train_loss": -25.859394073486328, "global_step": 324106, "epoch": 3904} {"train_loss": -25.59746551513672, "global_step": 324107, "epoch": 3904} {"train_loss": -26.020532608032227, "global_step": 324108, "epoch": 3904} {"train_loss": -25.989858627319336, "global_step": 324109, "epoch": 3904} {"train_loss": -26.223804473876953, "global_step": 324110, "epoch": 3904} {"train_loss": -25.690906524658203, "global_step": 324111, "epoch": 3904} {"train_loss": -25.79456901550293, "global_step": 324112, "epoch": 3904} {"train_loss": -25.7080020904541, "global_step": 324113, "epoch": 3904} {"train_loss": -25.873919245708418, "global_step": 324114, "epoch": 3904, "val_loss": 7278122.0} {"train_loss": -24.578168869018555, "global_step": 324115, "epoch": 3905} {"train_loss": -24.333059310913086, "global_step": 324116, "epoch": 3905} {"train_loss": -24.359159469604492, "global_step": 324117, "epoch": 3905} {"train_loss": -25.46192169189453, "global_step": 324118, "epoch": 3905} {"train_loss": -25.545270919799805, "global_step": 324119, "epoch": 3905} {"train_loss": -25.535987854003906, "global_step": 324120, "epoch": 3905} {"train_loss": -25.3572998046875, "global_step": 324121, "epoch": 3905} {"train_loss": -25.730865478515625, "global_step": 324122, "epoch": 3905} {"train_loss": -25.368242263793945, "global_step": 324123, "epoch": 3905} {"train_loss": -25.536405563354492, "global_step": 324124, "epoch": 3905} {"train_loss": -25.456403732299805, "global_step": 324125, "epoch": 3905} {"train_loss": -25.652475357055664, "global_step": 324126, "epoch": 3905} {"train_loss": -25.663360595703125, "global_step": 324127, "epoch": 3905} {"train_loss": -25.917505264282227, "global_step": 324128, "epoch": 3905} {"train_loss": -25.874134063720703, "global_step": 324129, "epoch": 3905} {"train_loss": -25.7767391204834, "global_step": 324130, "epoch": 3905} {"train_loss": -25.758188247680664, "global_step": 324131, "epoch": 3905} {"train_loss": -25.730100631713867, "global_step": 324132, "epoch": 3905} {"train_loss": -26.148178100585938, "global_step": 324133, "epoch": 3905} {"train_loss": -26.194355010986328, "global_step": 324134, "epoch": 3905} {"train_loss": -25.996902465820312, "global_step": 324135, "epoch": 3905} {"train_loss": -25.6618595123291, "global_step": 324136, "epoch": 3905} {"train_loss": -25.9465389251709, "global_step": 324137, "epoch": 3905} {"train_loss": -26.052658081054688, "global_step": 324138, "epoch": 3905} {"train_loss": -25.923038482666016, "global_step": 324139, "epoch": 3905} {"train_loss": -25.8610897064209, "global_step": 324140, "epoch": 3905} {"train_loss": -25.897552490234375, "global_step": 324141, "epoch": 3905} {"train_loss": -25.699682235717773, "global_step": 324142, "epoch": 3905} {"train_loss": -25.632659912109375, "global_step": 324143, "epoch": 3905} {"train_loss": -25.456741333007812, "global_step": 324144, "epoch": 3905} {"train_loss": -26.346643447875977, "global_step": 324145, "epoch": 3905} {"train_loss": -25.5805721282959, "global_step": 324146, "epoch": 3905} {"train_loss": -26.04062271118164, "global_step": 324147, "epoch": 3905} {"train_loss": -25.912256240844727, "global_step": 324148, "epoch": 3905} {"train_loss": -25.890125274658203, "global_step": 324149, "epoch": 3905} {"train_loss": -25.866718292236328, "global_step": 324150, "epoch": 3905} {"train_loss": -26.139692306518555, "global_step": 324151, "epoch": 3905} {"train_loss": -25.78215980529785, "global_step": 324152, "epoch": 3905} {"train_loss": -25.489410400390625, "global_step": 324153, "epoch": 3905} {"train_loss": -26.041650772094727, "global_step": 324154, "epoch": 3905} {"train_loss": -26.162811279296875, "global_step": 324155, "epoch": 3905} {"train_loss": -26.07648277282715, "global_step": 324156, "epoch": 3905} {"train_loss": -25.8040771484375, "global_step": 324157, "epoch": 3905} {"train_loss": -26.082056045532227, "global_step": 324158, "epoch": 3905} {"train_loss": -25.838306427001953, "global_step": 324159, "epoch": 3905} {"train_loss": -25.689905166625977, "global_step": 324160, "epoch": 3905} {"train_loss": -25.84840202331543, "global_step": 324161, "epoch": 3905} {"train_loss": -25.78362464904785, "global_step": 324162, "epoch": 3905} {"train_loss": -25.77402687072754, "global_step": 324163, "epoch": 3905} {"train_loss": -25.84034538269043, "global_step": 324164, "epoch": 3905} {"train_loss": -25.86836814880371, "global_step": 324165, "epoch": 3905} {"train_loss": -25.49043846130371, "global_step": 324166, "epoch": 3905} {"train_loss": -26.1212215423584, "global_step": 324167, "epoch": 3905} {"train_loss": -25.968494415283203, "global_step": 324168, "epoch": 3905} {"train_loss": -25.874114990234375, "global_step": 324169, "epoch": 3905} {"train_loss": -25.8728084564209, "global_step": 324170, "epoch": 3905} {"train_loss": -25.953420639038086, "global_step": 324171, "epoch": 3905} {"train_loss": -25.887479782104492, "global_step": 324172, "epoch": 3905} {"train_loss": -25.68971061706543, "global_step": 324173, "epoch": 3905} {"train_loss": -25.6806583404541, "global_step": 324174, "epoch": 3905} {"train_loss": -25.505197525024414, "global_step": 324175, "epoch": 3905} {"train_loss": -25.3284912109375, "global_step": 324176, "epoch": 3905} {"train_loss": -25.814685821533203, "global_step": 324177, "epoch": 3905} {"train_loss": -25.982532501220703, "global_step": 324178, "epoch": 3905} {"train_loss": -25.785612106323242, "global_step": 324179, "epoch": 3905} {"train_loss": -25.399932861328125, "global_step": 324180, "epoch": 3905} {"train_loss": -26.277647018432617, "global_step": 324181, "epoch": 3905} {"train_loss": -25.781503677368164, "global_step": 324182, "epoch": 3905} {"train_loss": -26.0548095703125, "global_step": 324183, "epoch": 3905} {"train_loss": -25.82931900024414, "global_step": 324184, "epoch": 3905} {"train_loss": -25.496755599975586, "global_step": 324185, "epoch": 3905} {"train_loss": -25.83436393737793, "global_step": 324186, "epoch": 3905} {"train_loss": -25.538619995117188, "global_step": 324187, "epoch": 3905} {"train_loss": -25.89072608947754, "global_step": 324188, "epoch": 3905} {"train_loss": -25.83893394470215, "global_step": 324189, "epoch": 3905} {"train_loss": -25.605255126953125, "global_step": 324190, "epoch": 3905} {"train_loss": -25.696645736694336, "global_step": 324191, "epoch": 3905} {"train_loss": -26.2180233001709, "global_step": 324192, "epoch": 3905} {"train_loss": -25.5057430267334, "global_step": 324193, "epoch": 3905} {"train_loss": -25.973419189453125, "global_step": 324194, "epoch": 3905} {"train_loss": -26.057113647460938, "global_step": 324195, "epoch": 3905} {"train_loss": -25.36696434020996, "global_step": 324196, "epoch": 3905} {"train_loss": -25.751004207565124, "global_step": 324197, "epoch": 3905, "val_loss": 7260736.0} {"train_loss": -25.401044845581055, "global_step": 324198, "epoch": 3906} {"train_loss": -25.180463790893555, "global_step": 324199, "epoch": 3906} {"train_loss": -25.427146911621094, "global_step": 324200, "epoch": 3906} {"train_loss": -25.46152114868164, "global_step": 324201, "epoch": 3906} {"train_loss": -25.255109786987305, "global_step": 324202, "epoch": 3906} {"train_loss": -25.535388946533203, "global_step": 324203, "epoch": 3906} {"train_loss": -25.779621124267578, "global_step": 324204, "epoch": 3906} {"train_loss": -25.283447265625, "global_step": 324205, "epoch": 3906} {"train_loss": -25.801340103149414, "global_step": 324206, "epoch": 3906} {"train_loss": -25.625675201416016, "global_step": 324207, "epoch": 3906} {"train_loss": -25.919219970703125, "global_step": 324208, "epoch": 3906} {"train_loss": -25.869794845581055, "global_step": 324209, "epoch": 3906} {"train_loss": -25.6960391998291, "global_step": 324210, "epoch": 3906} {"train_loss": -25.73822593688965, "global_step": 324211, "epoch": 3906} {"train_loss": -25.16992950439453, "global_step": 324212, "epoch": 3906} {"train_loss": -25.68037223815918, "global_step": 324213, "epoch": 3906} {"train_loss": -25.72684669494629, "global_step": 324214, "epoch": 3906} {"train_loss": -25.516647338867188, "global_step": 324215, "epoch": 3906} {"train_loss": -25.737863540649414, "global_step": 324216, "epoch": 3906} {"train_loss": -25.811908721923828, "global_step": 324217, "epoch": 3906} {"train_loss": -25.7707462310791, "global_step": 324218, "epoch": 3906} {"train_loss": -25.871341705322266, "global_step": 324219, "epoch": 3906} {"train_loss": -25.723974227905273, "global_step": 324220, "epoch": 3906} {"train_loss": -25.902875900268555, "global_step": 324221, "epoch": 3906} {"train_loss": -25.884103775024414, "global_step": 324222, "epoch": 3906} {"train_loss": -25.782638549804688, "global_step": 324223, "epoch": 3906} {"train_loss": -25.648645401000977, "global_step": 324224, "epoch": 3906} {"train_loss": -26.37546730041504, "global_step": 324225, "epoch": 3906} {"train_loss": -26.042926788330078, "global_step": 324226, "epoch": 3906} {"train_loss": -26.168569564819336, "global_step": 324227, "epoch": 3906} {"train_loss": -25.88409996032715, "global_step": 324228, "epoch": 3906} {"train_loss": -26.134552001953125, "global_step": 324229, "epoch": 3906} {"train_loss": -25.710437774658203, "global_step": 324230, "epoch": 3906} {"train_loss": -26.059457778930664, "global_step": 324231, "epoch": 3906} {"train_loss": -26.11838150024414, "global_step": 324232, "epoch": 3906} {"train_loss": -25.9251651763916, "global_step": 324233, "epoch": 3906} {"train_loss": -26.325742721557617, "global_step": 324234, "epoch": 3906} {"train_loss": -26.288537979125977, "global_step": 324235, "epoch": 3906} {"train_loss": -26.112125396728516, "global_step": 324236, "epoch": 3906} {"train_loss": -26.204849243164062, "global_step": 324237, "epoch": 3906} {"train_loss": -26.005786895751953, "global_step": 324238, "epoch": 3906} {"train_loss": -26.24102783203125, "global_step": 324239, "epoch": 3906} {"train_loss": -26.005741119384766, "global_step": 324240, "epoch": 3906} {"train_loss": -26.31717300415039, "global_step": 324241, "epoch": 3906} {"train_loss": -26.036046981811523, "global_step": 324242, "epoch": 3906} {"train_loss": -26.23371696472168, "global_step": 324243, "epoch": 3906} {"train_loss": -26.207416534423828, "global_step": 324244, "epoch": 3906} {"train_loss": -26.12749671936035, "global_step": 324245, "epoch": 3906} {"train_loss": -25.701385498046875, "global_step": 324246, "epoch": 3906} {"train_loss": -25.80126953125, "global_step": 324247, "epoch": 3906} {"train_loss": -25.662817001342773, "global_step": 324248, "epoch": 3906} {"train_loss": -26.082508087158203, "global_step": 324249, "epoch": 3906} {"train_loss": -25.555883407592773, "global_step": 324250, "epoch": 3906} {"train_loss": -25.6939697265625, "global_step": 324251, "epoch": 3906} {"train_loss": -25.905078887939453, "global_step": 324252, "epoch": 3906} {"train_loss": -25.75748634338379, "global_step": 324253, "epoch": 3906} {"train_loss": -24.745708465576172, "global_step": 324254, "epoch": 3906} {"train_loss": -24.896860122680664, "global_step": 324255, "epoch": 3906} {"train_loss": -24.46704864501953, "global_step": 324256, "epoch": 3906} {"train_loss": -24.521059036254883, "global_step": 324257, "epoch": 3906} {"train_loss": -24.790573120117188, "global_step": 324258, "epoch": 3906} {"train_loss": -25.50076675415039, "global_step": 324259, "epoch": 3906} {"train_loss": -25.288433074951172, "global_step": 324260, "epoch": 3906} {"train_loss": -26.025060653686523, "global_step": 324261, "epoch": 3906} {"train_loss": -25.38608741760254, "global_step": 324262, "epoch": 3906} {"train_loss": -25.60593032836914, "global_step": 324263, "epoch": 3906} {"train_loss": -25.05567741394043, "global_step": 324264, "epoch": 3906} {"train_loss": -25.482318878173828, "global_step": 324265, "epoch": 3906} {"train_loss": -25.19605827331543, "global_step": 324266, "epoch": 3906} {"train_loss": -25.743152618408203, "global_step": 324267, "epoch": 3906} {"train_loss": -25.631412506103516, "global_step": 324268, "epoch": 3906} {"train_loss": -25.505765914916992, "global_step": 324269, "epoch": 3906} {"train_loss": -25.61529541015625, "global_step": 324270, "epoch": 3906} {"train_loss": -25.949670791625977, "global_step": 324271, "epoch": 3906} {"train_loss": -25.65032386779785, "global_step": 324272, "epoch": 3906} {"train_loss": -25.547639846801758, "global_step": 324273, "epoch": 3906} {"train_loss": -25.576068878173828, "global_step": 324274, "epoch": 3906} {"train_loss": -25.85813331604004, "global_step": 324275, "epoch": 3906} {"train_loss": -25.91463279724121, "global_step": 324276, "epoch": 3906} {"train_loss": -25.820276260375977, "global_step": 324277, "epoch": 3906} {"train_loss": -25.84963035583496, "global_step": 324278, "epoch": 3906} {"train_loss": -25.97974967956543, "global_step": 324279, "epoch": 3906} {"train_loss": -25.71184270927705, "global_step": 324280, "epoch": 3906, "val_loss": 7233395.0} {"train_loss": -25.513107299804688, "global_step": 324281, "epoch": 3907} {"train_loss": -25.71381187438965, "global_step": 324282, "epoch": 3907} {"train_loss": -25.552719116210938, "global_step": 324283, "epoch": 3907} {"train_loss": -25.338964462280273, "global_step": 324284, "epoch": 3907} {"train_loss": -25.57777976989746, "global_step": 324285, "epoch": 3907} {"train_loss": -25.296384811401367, "global_step": 324286, "epoch": 3907} {"train_loss": -25.24110984802246, "global_step": 324287, "epoch": 3907} {"train_loss": -25.3655948638916, "global_step": 324288, "epoch": 3907} {"train_loss": -25.8975830078125, "global_step": 324289, "epoch": 3907} {"train_loss": -25.458938598632812, "global_step": 324290, "epoch": 3907} {"train_loss": -25.62406349182129, "global_step": 324291, "epoch": 3907} {"train_loss": -25.7257022857666, "global_step": 324292, "epoch": 3907} {"train_loss": -25.68194580078125, "global_step": 324293, "epoch": 3907} {"train_loss": -25.706348419189453, "global_step": 324294, "epoch": 3907} {"train_loss": -25.771854400634766, "global_step": 324295, "epoch": 3907} {"train_loss": -25.865766525268555, "global_step": 324296, "epoch": 3907} {"train_loss": -25.910001754760742, "global_step": 324297, "epoch": 3907} {"train_loss": -26.259708404541016, "global_step": 324298, "epoch": 3907} {"train_loss": -25.441186904907227, "global_step": 324299, "epoch": 3907} {"train_loss": -25.951208114624023, "global_step": 324300, "epoch": 3907} {"train_loss": -26.13596534729004, "global_step": 324301, "epoch": 3907} {"train_loss": -25.89845085144043, "global_step": 324302, "epoch": 3907} {"train_loss": -26.05328369140625, "global_step": 324303, "epoch": 3907} {"train_loss": -25.93057632446289, "global_step": 324304, "epoch": 3907} {"train_loss": -25.9732723236084, "global_step": 324305, "epoch": 3907} {"train_loss": -25.889759063720703, "global_step": 324306, "epoch": 3907} {"train_loss": -25.81989097595215, "global_step": 324307, "epoch": 3907} {"train_loss": -26.343618392944336, "global_step": 324308, "epoch": 3907} {"train_loss": -25.86475944519043, "global_step": 324309, "epoch": 3907} {"train_loss": -26.14264488220215, "global_step": 324310, "epoch": 3907} {"train_loss": -26.143735885620117, "global_step": 324311, "epoch": 3907} {"train_loss": -25.985132217407227, "global_step": 324312, "epoch": 3907} {"train_loss": -25.78180503845215, "global_step": 324313, "epoch": 3907} {"train_loss": -26.127893447875977, "global_step": 324314, "epoch": 3907} {"train_loss": -26.025161743164062, "global_step": 324315, "epoch": 3907} {"train_loss": -26.2613582611084, "global_step": 324316, "epoch": 3907} {"train_loss": -25.812543869018555, "global_step": 324317, "epoch": 3907} {"train_loss": -25.831098556518555, "global_step": 324318, "epoch": 3907} {"train_loss": -25.953414916992188, "global_step": 324319, "epoch": 3907} {"train_loss": -26.356740951538086, "global_step": 324320, "epoch": 3907} {"train_loss": -25.986572265625, "global_step": 324321, "epoch": 3907} {"train_loss": -26.062658309936523, "global_step": 324322, "epoch": 3907} {"train_loss": -25.956571578979492, "global_step": 324323, "epoch": 3907} {"train_loss": -25.745203018188477, "global_step": 324324, "epoch": 3907} {"train_loss": -25.660430908203125, "global_step": 324325, "epoch": 3907} {"train_loss": -25.542926788330078, "global_step": 324326, "epoch": 3907} {"train_loss": -25.396337509155273, "global_step": 324327, "epoch": 3907} {"train_loss": -25.217222213745117, "global_step": 324328, "epoch": 3907} {"train_loss": -25.60337257385254, "global_step": 324329, "epoch": 3907} {"train_loss": -25.686864852905273, "global_step": 324330, "epoch": 3907} {"train_loss": -25.7946834564209, "global_step": 324331, "epoch": 3907} {"train_loss": -25.801971435546875, "global_step": 324332, "epoch": 3907} {"train_loss": -25.7902889251709, "global_step": 324333, "epoch": 3907} {"train_loss": -25.923980712890625, "global_step": 324334, "epoch": 3907} {"train_loss": -26.07978630065918, "global_step": 324335, "epoch": 3907} {"train_loss": -26.205310821533203, "global_step": 324336, "epoch": 3907} {"train_loss": -25.731048583984375, "global_step": 324337, "epoch": 3907} {"train_loss": -25.800983428955078, "global_step": 324338, "epoch": 3907} {"train_loss": -25.93271827697754, "global_step": 324339, "epoch": 3907} {"train_loss": -26.148242950439453, "global_step": 324340, "epoch": 3907} {"train_loss": -25.74867820739746, "global_step": 324341, "epoch": 3907} {"train_loss": -25.90225601196289, "global_step": 324342, "epoch": 3907} {"train_loss": -25.93074607849121, "global_step": 324343, "epoch": 3907} {"train_loss": -25.516347885131836, "global_step": 324344, "epoch": 3907} {"train_loss": -26.141149520874023, "global_step": 324345, "epoch": 3907} {"train_loss": -26.135822296142578, "global_step": 324346, "epoch": 3907} {"train_loss": -26.125120162963867, "global_step": 324347, "epoch": 3907} {"train_loss": -26.17823600769043, "global_step": 324348, "epoch": 3907} {"train_loss": -25.887720108032227, "global_step": 324349, "epoch": 3907} {"train_loss": -25.86630630493164, "global_step": 324350, "epoch": 3907} {"train_loss": -26.3143367767334, "global_step": 324351, "epoch": 3907} {"train_loss": -26.04091453552246, "global_step": 324352, "epoch": 3907} {"train_loss": -26.10504722595215, "global_step": 324353, "epoch": 3907} {"train_loss": -25.879840850830078, "global_step": 324354, "epoch": 3907} {"train_loss": -26.164600372314453, "global_step": 324355, "epoch": 3907} {"train_loss": -25.893335342407227, "global_step": 324356, "epoch": 3907} {"train_loss": -26.361318588256836, "global_step": 324357, "epoch": 3907} {"train_loss": -26.164636611938477, "global_step": 324358, "epoch": 3907} {"train_loss": -25.54438591003418, "global_step": 324359, "epoch": 3907} {"train_loss": -25.829992294311523, "global_step": 324360, "epoch": 3907} {"train_loss": -26.000513076782227, "global_step": 324361, "epoch": 3907} {"train_loss": -25.57197380065918, "global_step": 324362, "epoch": 3907} {"train_loss": -25.871837868747942, "global_step": 324363, "epoch": 3907, "val_loss": 7234526.0} {"train_loss": -25.12166976928711, "global_step": 324364, "epoch": 3908} {"train_loss": -23.680953979492188, "global_step": 324365, "epoch": 3908} {"train_loss": -25.23076820373535, "global_step": 324366, "epoch": 3908} {"train_loss": -24.512537002563477, "global_step": 324367, "epoch": 3908} {"train_loss": -24.834157943725586, "global_step": 324368, "epoch": 3908} {"train_loss": -24.64934730529785, "global_step": 324369, "epoch": 3908} {"train_loss": -25.42323112487793, "global_step": 324370, "epoch": 3908} {"train_loss": -25.60115623474121, "global_step": 324371, "epoch": 3908} {"train_loss": -25.165924072265625, "global_step": 324372, "epoch": 3908} {"train_loss": -25.27306365966797, "global_step": 324373, "epoch": 3908} {"train_loss": -25.095991134643555, "global_step": 324374, "epoch": 3908} {"train_loss": -25.259174346923828, "global_step": 324375, "epoch": 3908} {"train_loss": -25.488645553588867, "global_step": 324376, "epoch": 3908} {"train_loss": -25.79754066467285, "global_step": 324377, "epoch": 3908} {"train_loss": -25.653247833251953, "global_step": 324378, "epoch": 3908} {"train_loss": -25.444766998291016, "global_step": 324379, "epoch": 3908} {"train_loss": -25.3181209564209, "global_step": 324380, "epoch": 3908} {"train_loss": -25.50273895263672, "global_step": 324381, "epoch": 3908} {"train_loss": -25.859357833862305, "global_step": 324382, "epoch": 3908} {"train_loss": -25.8365535736084, "global_step": 324383, "epoch": 3908} {"train_loss": -25.44321632385254, "global_step": 324384, "epoch": 3908} {"train_loss": -25.540056228637695, "global_step": 324385, "epoch": 3908} {"train_loss": -25.860553741455078, "global_step": 324386, "epoch": 3908} {"train_loss": -25.67643165588379, "global_step": 324387, "epoch": 3908} {"train_loss": -25.771595001220703, "global_step": 324388, "epoch": 3908} {"train_loss": -25.54823112487793, "global_step": 324389, "epoch": 3908} {"train_loss": -25.862192153930664, "global_step": 324390, "epoch": 3908} {"train_loss": -25.854780197143555, "global_step": 324391, "epoch": 3908} {"train_loss": -26.429431915283203, "global_step": 324392, "epoch": 3908} {"train_loss": -25.81660270690918, "global_step": 324393, "epoch": 3908} {"train_loss": -25.925989151000977, "global_step": 324394, "epoch": 3908} {"train_loss": -26.222402572631836, "global_step": 324395, "epoch": 3908} {"train_loss": -25.952224731445312, "global_step": 324396, "epoch": 3908} {"train_loss": -26.001422882080078, "global_step": 324397, "epoch": 3908} {"train_loss": -25.85262107849121, "global_step": 324398, "epoch": 3908} {"train_loss": -25.905506134033203, "global_step": 324399, "epoch": 3908} {"train_loss": -25.92769432067871, "global_step": 324400, "epoch": 3908} {"train_loss": -25.98966407775879, "global_step": 324401, "epoch": 3908} {"train_loss": -25.947647094726562, "global_step": 324402, "epoch": 3908} {"train_loss": -26.18572425842285, "global_step": 324403, "epoch": 3908} {"train_loss": -26.249530792236328, "global_step": 324404, "epoch": 3908} {"train_loss": -25.7888240814209, "global_step": 324405, "epoch": 3908} {"train_loss": -26.269699096679688, "global_step": 324406, "epoch": 3908} {"train_loss": -26.0195369720459, "global_step": 324407, "epoch": 3908} {"train_loss": -25.85550308227539, "global_step": 324408, "epoch": 3908} {"train_loss": -25.998254776000977, "global_step": 324409, "epoch": 3908} {"train_loss": -26.07847023010254, "global_step": 324410, "epoch": 3908} {"train_loss": -25.721731185913086, "global_step": 324411, "epoch": 3908} {"train_loss": -25.475624084472656, "global_step": 324412, "epoch": 3908} {"train_loss": -25.62030029296875, "global_step": 324413, "epoch": 3908} {"train_loss": -25.774993896484375, "global_step": 324414, "epoch": 3908} {"train_loss": -26.05350685119629, "global_step": 324415, "epoch": 3908} {"train_loss": -25.742826461791992, "global_step": 324416, "epoch": 3908} {"train_loss": -26.00333595275879, "global_step": 324417, "epoch": 3908} {"train_loss": -26.06451988220215, "global_step": 324418, "epoch": 3908} {"train_loss": -26.145959854125977, "global_step": 324419, "epoch": 3908} {"train_loss": -26.08064079284668, "global_step": 324420, "epoch": 3908} {"train_loss": -26.0142879486084, "global_step": 324421, "epoch": 3908} {"train_loss": -26.138837814331055, "global_step": 324422, "epoch": 3908} {"train_loss": -25.9068660736084, "global_step": 324423, "epoch": 3908} {"train_loss": -26.016855239868164, "global_step": 324424, "epoch": 3908} {"train_loss": -25.963119506835938, "global_step": 324425, "epoch": 3908} {"train_loss": -25.800451278686523, "global_step": 324426, "epoch": 3908} {"train_loss": -25.59152603149414, "global_step": 324427, "epoch": 3908} {"train_loss": -26.182403564453125, "global_step": 324428, "epoch": 3908} {"train_loss": -25.78569984436035, "global_step": 324429, "epoch": 3908} {"train_loss": -25.879535675048828, "global_step": 324430, "epoch": 3908} {"train_loss": -25.8282527923584, "global_step": 324431, "epoch": 3908} {"train_loss": -26.179977416992188, "global_step": 324432, "epoch": 3908} {"train_loss": -25.695068359375, "global_step": 324433, "epoch": 3908} {"train_loss": -25.76206398010254, "global_step": 324434, "epoch": 3908} {"train_loss": -26.02674674987793, "global_step": 324435, "epoch": 3908} {"train_loss": -26.16596031188965, "global_step": 324436, "epoch": 3908} {"train_loss": -26.112518310546875, "global_step": 324437, "epoch": 3908} {"train_loss": -26.206823348999023, "global_step": 324438, "epoch": 3908} {"train_loss": -26.32856559753418, "global_step": 324439, "epoch": 3908} {"train_loss": -26.074249267578125, "global_step": 324440, "epoch": 3908} {"train_loss": -25.923095703125, "global_step": 324441, "epoch": 3908} {"train_loss": -26.083118438720703, "global_step": 324442, "epoch": 3908} {"train_loss": -26.191986083984375, "global_step": 324443, "epoch": 3908} {"train_loss": -25.823766708374023, "global_step": 324444, "epoch": 3908} {"train_loss": -26.0054931640625, "global_step": 324445, "epoch": 3908} {"train_loss": -25.778730507356574, "global_step": 324446, "epoch": 3908, "val_loss": 7178935.5} {"train_loss": -25.6038818359375, "global_step": 324447, "epoch": 3909} {"train_loss": -25.699127197265625, "global_step": 324448, "epoch": 3909} {"train_loss": -25.214994430541992, "global_step": 324449, "epoch": 3909} {"train_loss": -25.52457046508789, "global_step": 324450, "epoch": 3909} {"train_loss": -25.501171112060547, "global_step": 324451, "epoch": 3909} {"train_loss": -25.549381256103516, "global_step": 324452, "epoch": 3909} {"train_loss": -25.692291259765625, "global_step": 324453, "epoch": 3909} {"train_loss": -26.14017677307129, "global_step": 324454, "epoch": 3909} {"train_loss": -26.220991134643555, "global_step": 324455, "epoch": 3909} {"train_loss": -25.672576904296875, "global_step": 324456, "epoch": 3909} {"train_loss": -26.250600814819336, "global_step": 324457, "epoch": 3909} {"train_loss": -25.59529685974121, "global_step": 324458, "epoch": 3909} {"train_loss": -26.06532859802246, "global_step": 324459, "epoch": 3909} {"train_loss": -26.07069206237793, "global_step": 324460, "epoch": 3909} {"train_loss": -25.964462280273438, "global_step": 324461, "epoch": 3909} {"train_loss": -25.80936622619629, "global_step": 324462, "epoch": 3909} {"train_loss": -25.861196517944336, "global_step": 324463, "epoch": 3909} {"train_loss": -26.15540885925293, "global_step": 324464, "epoch": 3909} {"train_loss": -25.989456176757812, "global_step": 324465, "epoch": 3909} {"train_loss": -25.838134765625, "global_step": 324466, "epoch": 3909} {"train_loss": -26.029382705688477, "global_step": 324467, "epoch": 3909} {"train_loss": -25.856714248657227, "global_step": 324468, "epoch": 3909} {"train_loss": -25.771503448486328, "global_step": 324469, "epoch": 3909} {"train_loss": -26.191064834594727, "global_step": 324470, "epoch": 3909} {"train_loss": -26.189411163330078, "global_step": 324471, "epoch": 3909} {"train_loss": -25.75703239440918, "global_step": 324472, "epoch": 3909} {"train_loss": -25.81975746154785, "global_step": 324473, "epoch": 3909} {"train_loss": -26.1205997467041, "global_step": 324474, "epoch": 3909} {"train_loss": -26.247909545898438, "global_step": 324475, "epoch": 3909} {"train_loss": -25.944629669189453, "global_step": 324476, "epoch": 3909} {"train_loss": -26.174468994140625, "global_step": 324477, "epoch": 3909} {"train_loss": -25.7772159576416, "global_step": 324478, "epoch": 3909} {"train_loss": -25.818140029907227, "global_step": 324479, "epoch": 3909} {"train_loss": -25.71921730041504, "global_step": 324480, "epoch": 3909} {"train_loss": -25.93556022644043, "global_step": 324481, "epoch": 3909} {"train_loss": -26.09037208557129, "global_step": 324482, "epoch": 3909} {"train_loss": -25.918746948242188, "global_step": 324483, "epoch": 3909} {"train_loss": -25.92951774597168, "global_step": 324484, "epoch": 3909} {"train_loss": -26.06549644470215, "global_step": 324485, "epoch": 3909} {"train_loss": -25.980335235595703, "global_step": 324486, "epoch": 3909} {"train_loss": -25.99811363220215, "global_step": 324487, "epoch": 3909} {"train_loss": -25.75795555114746, "global_step": 324488, "epoch": 3909} {"train_loss": -25.939863204956055, "global_step": 324489, "epoch": 3909} {"train_loss": -25.907093048095703, "global_step": 324490, "epoch": 3909} {"train_loss": -25.898849487304688, "global_step": 324491, "epoch": 3909} {"train_loss": -26.27469253540039, "global_step": 324492, "epoch": 3909} {"train_loss": -26.077783584594727, "global_step": 324493, "epoch": 3909} {"train_loss": -26.014394760131836, "global_step": 324494, "epoch": 3909} {"train_loss": -25.80099868774414, "global_step": 324495, "epoch": 3909} {"train_loss": -25.541908264160156, "global_step": 324496, "epoch": 3909} {"train_loss": -25.702518463134766, "global_step": 324497, "epoch": 3909} {"train_loss": -25.76661491394043, "global_step": 324498, "epoch": 3909} {"train_loss": -25.974628448486328, "global_step": 324499, "epoch": 3909} {"train_loss": -25.709259033203125, "global_step": 324500, "epoch": 3909} {"train_loss": -25.59794807434082, "global_step": 324501, "epoch": 3909} {"train_loss": -25.949695587158203, "global_step": 324502, "epoch": 3909} {"train_loss": -26.0737247467041, "global_step": 324503, "epoch": 3909} {"train_loss": -25.75372886657715, "global_step": 324504, "epoch": 3909} {"train_loss": -26.0293025970459, "global_step": 324505, "epoch": 3909} {"train_loss": -25.595014572143555, "global_step": 324506, "epoch": 3909} {"train_loss": -25.482707977294922, "global_step": 324507, "epoch": 3909} {"train_loss": -25.91131019592285, "global_step": 324508, "epoch": 3909} {"train_loss": -26.11795425415039, "global_step": 324509, "epoch": 3909} {"train_loss": -25.989877700805664, "global_step": 324510, "epoch": 3909} {"train_loss": -25.823352813720703, "global_step": 324511, "epoch": 3909} {"train_loss": -25.9779052734375, "global_step": 324512, "epoch": 3909} {"train_loss": -25.927764892578125, "global_step": 324513, "epoch": 3909} {"train_loss": -25.894201278686523, "global_step": 324514, "epoch": 3909} {"train_loss": -25.86993408203125, "global_step": 324515, "epoch": 3909} {"train_loss": -26.135101318359375, "global_step": 324516, "epoch": 3909} {"train_loss": -25.93269920349121, "global_step": 324517, "epoch": 3909} {"train_loss": -26.08054542541504, "global_step": 324518, "epoch": 3909} {"train_loss": -25.996219635009766, "global_step": 324519, "epoch": 3909} {"train_loss": -25.908954620361328, "global_step": 324520, "epoch": 3909} {"train_loss": -26.097997665405273, "global_step": 324521, "epoch": 3909} {"train_loss": -26.40546226501465, "global_step": 324522, "epoch": 3909} {"train_loss": -25.877408981323242, "global_step": 324523, "epoch": 3909} {"train_loss": -26.091053009033203, "global_step": 324524, "epoch": 3909} {"train_loss": -25.984399795532227, "global_step": 324525, "epoch": 3909} {"train_loss": -25.842191696166992, "global_step": 324526, "epoch": 3909} {"train_loss": -26.006940841674805, "global_step": 324527, "epoch": 3909} {"train_loss": -25.88762855529785, "global_step": 324528, "epoch": 3909} {"train_loss": -25.909140230661414, "global_step": 324529, "epoch": 3909, "val_loss": 7254931.0} {"train_loss": -25.74041175842285, "global_step": 324530, "epoch": 3910} {"train_loss": -25.275644302368164, "global_step": 324531, "epoch": 3910} {"train_loss": -25.520994186401367, "global_step": 324532, "epoch": 3910} {"train_loss": -25.789169311523438, "global_step": 324533, "epoch": 3910} {"train_loss": -25.273178100585938, "global_step": 324534, "epoch": 3910} {"train_loss": -25.56134796142578, "global_step": 324535, "epoch": 3910} {"train_loss": -25.108219146728516, "global_step": 324536, "epoch": 3910} {"train_loss": -25.050148010253906, "global_step": 324537, "epoch": 3910} {"train_loss": -25.561382293701172, "global_step": 324538, "epoch": 3910} {"train_loss": -25.781156539916992, "global_step": 324539, "epoch": 3910} {"train_loss": -25.51021385192871, "global_step": 324540, "epoch": 3910} {"train_loss": -25.3538761138916, "global_step": 324541, "epoch": 3910} {"train_loss": -25.670928955078125, "global_step": 324542, "epoch": 3910} {"train_loss": -25.5748348236084, "global_step": 324543, "epoch": 3910} {"train_loss": -25.9293212890625, "global_step": 324544, "epoch": 3910} {"train_loss": -25.270601272583008, "global_step": 324545, "epoch": 3910} {"train_loss": -25.436548233032227, "global_step": 324546, "epoch": 3910} {"train_loss": -25.86075782775879, "global_step": 324547, "epoch": 3910} {"train_loss": -25.673187255859375, "global_step": 324548, "epoch": 3910} {"train_loss": -26.187026977539062, "global_step": 324549, "epoch": 3910} {"train_loss": -25.59783172607422, "global_step": 324550, "epoch": 3910} {"train_loss": -25.82021141052246, "global_step": 324551, "epoch": 3910} {"train_loss": -25.466794967651367, "global_step": 324552, "epoch": 3910} {"train_loss": -25.650659561157227, "global_step": 324553, "epoch": 3910} {"train_loss": -25.57826042175293, "global_step": 324554, "epoch": 3910} {"train_loss": -26.007322311401367, "global_step": 324555, "epoch": 3910} {"train_loss": -25.812820434570312, "global_step": 324556, "epoch": 3910} {"train_loss": -25.87357521057129, "global_step": 324557, "epoch": 3910} {"train_loss": -25.8663387298584, "global_step": 324558, "epoch": 3910} {"train_loss": -25.941516876220703, "global_step": 324559, "epoch": 3910} {"train_loss": -25.75533103942871, "global_step": 324560, "epoch": 3910} {"train_loss": -25.661401748657227, "global_step": 324561, "epoch": 3910} {"train_loss": -25.956619262695312, "global_step": 324562, "epoch": 3910} {"train_loss": -25.74567222595215, "global_step": 324563, "epoch": 3910} {"train_loss": -25.7905330657959, "global_step": 324564, "epoch": 3910} {"train_loss": -26.1595401763916, "global_step": 324565, "epoch": 3910} {"train_loss": -25.831220626831055, "global_step": 324566, "epoch": 3910} {"train_loss": -26.178543090820312, "global_step": 324567, "epoch": 3910} {"train_loss": -25.992938995361328, "global_step": 324568, "epoch": 3910} {"train_loss": -26.23621940612793, "global_step": 324569, "epoch": 3910} {"train_loss": -26.357864379882812, "global_step": 324570, "epoch": 3910} {"train_loss": -25.8083553314209, "global_step": 324571, "epoch": 3910} {"train_loss": -26.228830337524414, "global_step": 324572, "epoch": 3910} {"train_loss": -26.227432250976562, "global_step": 324573, "epoch": 3910} {"train_loss": -25.857269287109375, "global_step": 324574, "epoch": 3910} {"train_loss": -25.913602828979492, "global_step": 324575, "epoch": 3910} {"train_loss": -25.878631591796875, "global_step": 324576, "epoch": 3910} {"train_loss": -25.967010498046875, "global_step": 324577, "epoch": 3910} {"train_loss": -25.864713668823242, "global_step": 324578, "epoch": 3910} {"train_loss": -25.857431411743164, "global_step": 324579, "epoch": 3910} {"train_loss": -25.8245849609375, "global_step": 324580, "epoch": 3910} {"train_loss": -25.625980377197266, "global_step": 324581, "epoch": 3910} {"train_loss": -25.53875160217285, "global_step": 324582, "epoch": 3910} {"train_loss": -25.471227645874023, "global_step": 324583, "epoch": 3910} {"train_loss": -25.562227249145508, "global_step": 324584, "epoch": 3910} {"train_loss": -25.9489688873291, "global_step": 324585, "epoch": 3910} {"train_loss": -25.924001693725586, "global_step": 324586, "epoch": 3910} {"train_loss": -24.9160099029541, "global_step": 324587, "epoch": 3910} {"train_loss": -25.29268455505371, "global_step": 324588, "epoch": 3910} {"train_loss": -26.068403244018555, "global_step": 324589, "epoch": 3910} {"train_loss": -25.79446792602539, "global_step": 324590, "epoch": 3910} {"train_loss": -25.860462188720703, "global_step": 324591, "epoch": 3910} {"train_loss": -25.70762062072754, "global_step": 324592, "epoch": 3910} {"train_loss": -26.01527214050293, "global_step": 324593, "epoch": 3910} {"train_loss": -25.857685089111328, "global_step": 324594, "epoch": 3910} {"train_loss": -25.888463973999023, "global_step": 324595, "epoch": 3910} {"train_loss": -26.252471923828125, "global_step": 324596, "epoch": 3910} {"train_loss": -25.766376495361328, "global_step": 324597, "epoch": 3910} {"train_loss": -25.83011245727539, "global_step": 324598, "epoch": 3910} {"train_loss": -26.1947078704834, "global_step": 324599, "epoch": 3910} {"train_loss": -25.851825714111328, "global_step": 324600, "epoch": 3910} {"train_loss": -26.202728271484375, "global_step": 324601, "epoch": 3910} {"train_loss": -25.97401237487793, "global_step": 324602, "epoch": 3910} {"train_loss": -26.182600021362305, "global_step": 324603, "epoch": 3910} {"train_loss": -25.587955474853516, "global_step": 324604, "epoch": 3910} {"train_loss": -26.0762939453125, "global_step": 324605, "epoch": 3910} {"train_loss": -26.542158126831055, "global_step": 324606, "epoch": 3910} {"train_loss": -25.98963737487793, "global_step": 324607, "epoch": 3910} {"train_loss": -26.181791305541992, "global_step": 324608, "epoch": 3910} {"train_loss": -26.0823917388916, "global_step": 324609, "epoch": 3910} {"train_loss": -25.92302894592285, "global_step": 324610, "epoch": 3910} {"train_loss": -25.897708892822266, "global_step": 324611, "epoch": 3910} {"train_loss": -25.810680596225232, "global_step": 324612, "epoch": 3910, "val_loss": 7218636.0} {"train_loss": -25.481840133666992, "global_step": 324613, "epoch": 3911} {"train_loss": -25.818668365478516, "global_step": 324614, "epoch": 3911} {"train_loss": -25.64411735534668, "global_step": 324615, "epoch": 3911} {"train_loss": -25.860919952392578, "global_step": 324616, "epoch": 3911} {"train_loss": -26.308271408081055, "global_step": 324617, "epoch": 3911} {"train_loss": -25.7535457611084, "global_step": 324618, "epoch": 3911} {"train_loss": -26.357715606689453, "global_step": 324619, "epoch": 3911} {"train_loss": -26.260452270507812, "global_step": 324620, "epoch": 3911} {"train_loss": -25.77359962463379, "global_step": 324621, "epoch": 3911} {"train_loss": -25.701322555541992, "global_step": 324622, "epoch": 3911} {"train_loss": -25.968460083007812, "global_step": 324623, "epoch": 3911} {"train_loss": -25.92902183532715, "global_step": 324624, "epoch": 3911} {"train_loss": -25.924890518188477, "global_step": 324625, "epoch": 3911} {"train_loss": -25.513639450073242, "global_step": 324626, "epoch": 3911} {"train_loss": -26.037525177001953, "global_step": 324627, "epoch": 3911} {"train_loss": -25.97926902770996, "global_step": 324628, "epoch": 3911} {"train_loss": -26.107666015625, "global_step": 324629, "epoch": 3911} {"train_loss": -25.922422409057617, "global_step": 324630, "epoch": 3911} {"train_loss": -25.94943618774414, "global_step": 324631, "epoch": 3911} {"train_loss": -25.79595375061035, "global_step": 324632, "epoch": 3911} {"train_loss": -25.48164939880371, "global_step": 324633, "epoch": 3911} {"train_loss": -25.35774040222168, "global_step": 324634, "epoch": 3911} {"train_loss": -25.01935386657715, "global_step": 324635, "epoch": 3911} {"train_loss": -25.59927749633789, "global_step": 324636, "epoch": 3911} {"train_loss": -25.284366607666016, "global_step": 324637, "epoch": 3911} {"train_loss": -25.325397491455078, "global_step": 324638, "epoch": 3911} {"train_loss": -25.497007369995117, "global_step": 324639, "epoch": 3911} {"train_loss": -25.6309871673584, "global_step": 324640, "epoch": 3911} {"train_loss": -26.017309188842773, "global_step": 324641, "epoch": 3911} {"train_loss": -25.926008224487305, "global_step": 324642, "epoch": 3911} {"train_loss": -25.9312801361084, "global_step": 324643, "epoch": 3911} {"train_loss": -26.251279830932617, "global_step": 324644, "epoch": 3911} {"train_loss": -25.93471336364746, "global_step": 324645, "epoch": 3911} {"train_loss": -25.44205093383789, "global_step": 324646, "epoch": 3911} {"train_loss": -26.242475509643555, "global_step": 324647, "epoch": 3911} {"train_loss": -26.043262481689453, "global_step": 324648, "epoch": 3911} {"train_loss": -25.79981803894043, "global_step": 324649, "epoch": 3911} {"train_loss": -25.563589096069336, "global_step": 324650, "epoch": 3911} {"train_loss": -25.636011123657227, "global_step": 324651, "epoch": 3911} {"train_loss": -25.598249435424805, "global_step": 324652, "epoch": 3911} {"train_loss": -25.82720375061035, "global_step": 324653, "epoch": 3911} {"train_loss": -25.932544708251953, "global_step": 324654, "epoch": 3911} {"train_loss": -26.011829376220703, "global_step": 324655, "epoch": 3911} {"train_loss": -26.036352157592773, "global_step": 324656, "epoch": 3911} {"train_loss": -25.889963150024414, "global_step": 324657, "epoch": 3911} {"train_loss": -25.884077072143555, "global_step": 324658, "epoch": 3911} {"train_loss": -26.03449821472168, "global_step": 324659, "epoch": 3911} {"train_loss": -25.862659454345703, "global_step": 324660, "epoch": 3911} {"train_loss": -25.965625762939453, "global_step": 324661, "epoch": 3911} {"train_loss": -25.782007217407227, "global_step": 324662, "epoch": 3911} {"train_loss": -26.0745849609375, "global_step": 324663, "epoch": 3911} {"train_loss": -26.16950798034668, "global_step": 324664, "epoch": 3911} {"train_loss": -26.014205932617188, "global_step": 324665, "epoch": 3911} {"train_loss": -26.17386817932129, "global_step": 324666, "epoch": 3911} {"train_loss": -25.9343318939209, "global_step": 324667, "epoch": 3911} {"train_loss": -26.2614688873291, "global_step": 324668, "epoch": 3911} {"train_loss": -26.097885131835938, "global_step": 324669, "epoch": 3911} {"train_loss": -26.399124145507812, "global_step": 324670, "epoch": 3911} {"train_loss": -25.736310958862305, "global_step": 324671, "epoch": 3911} {"train_loss": -26.3061580657959, "global_step": 324672, "epoch": 3911} {"train_loss": -26.406339645385742, "global_step": 324673, "epoch": 3911} {"train_loss": -26.356250762939453, "global_step": 324674, "epoch": 3911} {"train_loss": -25.953479766845703, "global_step": 324675, "epoch": 3911} {"train_loss": -26.440542221069336, "global_step": 324676, "epoch": 3911} {"train_loss": -25.96360206604004, "global_step": 324677, "epoch": 3911} {"train_loss": -25.74410057067871, "global_step": 324678, "epoch": 3911} {"train_loss": -26.09844398498535, "global_step": 324679, "epoch": 3911} {"train_loss": -26.14773941040039, "global_step": 324680, "epoch": 3911} {"train_loss": -25.748859405517578, "global_step": 324681, "epoch": 3911} {"train_loss": -25.762365341186523, "global_step": 324682, "epoch": 3911} {"train_loss": -25.644514083862305, "global_step": 324683, "epoch": 3911} {"train_loss": -25.624866485595703, "global_step": 324684, "epoch": 3911} {"train_loss": -26.290924072265625, "global_step": 324685, "epoch": 3911} {"train_loss": -25.63651466369629, "global_step": 324686, "epoch": 3911} {"train_loss": -25.959745407104492, "global_step": 324687, "epoch": 3911} {"train_loss": -26.074514389038086, "global_step": 324688, "epoch": 3911} {"train_loss": -25.464445114135742, "global_step": 324689, "epoch": 3911} {"train_loss": -25.915618896484375, "global_step": 324690, "epoch": 3911} {"train_loss": -26.0311336517334, "global_step": 324691, "epoch": 3911} {"train_loss": -25.472631454467773, "global_step": 324692, "epoch": 3911} {"train_loss": -25.995044708251953, "global_step": 324693, "epoch": 3911} {"train_loss": -25.822763442993164, "global_step": 324694, "epoch": 3911} {"train_loss": -25.869717609451477, "global_step": 324695, "epoch": 3911, "val_loss": 7202913.0} {"train_loss": -25.842084884643555, "global_step": 324696, "epoch": 3912} {"train_loss": -25.15569496154785, "global_step": 324697, "epoch": 3912} {"train_loss": -25.511537551879883, "global_step": 324698, "epoch": 3912} {"train_loss": -24.417016983032227, "global_step": 324699, "epoch": 3912} {"train_loss": -24.98872947692871, "global_step": 324700, "epoch": 3912} {"train_loss": -25.145902633666992, "global_step": 324701, "epoch": 3912} {"train_loss": -25.717443466186523, "global_step": 324702, "epoch": 3912} {"train_loss": -25.387527465820312, "global_step": 324703, "epoch": 3912} {"train_loss": -25.522031784057617, "global_step": 324704, "epoch": 3912} {"train_loss": -25.409137725830078, "global_step": 324705, "epoch": 3912} {"train_loss": -25.48837661743164, "global_step": 324706, "epoch": 3912} {"train_loss": -25.366016387939453, "global_step": 324707, "epoch": 3912} {"train_loss": -25.445539474487305, "global_step": 324708, "epoch": 3912} {"train_loss": -25.21664810180664, "global_step": 324709, "epoch": 3912} {"train_loss": -25.44830322265625, "global_step": 324710, "epoch": 3912} {"train_loss": -25.846654891967773, "global_step": 324711, "epoch": 3912} {"train_loss": -25.55409049987793, "global_step": 324712, "epoch": 3912} {"train_loss": -25.63312339782715, "global_step": 324713, "epoch": 3912} {"train_loss": -25.646656036376953, "global_step": 324714, "epoch": 3912} {"train_loss": -25.499340057373047, "global_step": 324715, "epoch": 3912} {"train_loss": -26.03744888305664, "global_step": 324716, "epoch": 3912} {"train_loss": -25.945220947265625, "global_step": 324717, "epoch": 3912} {"train_loss": -25.67390251159668, "global_step": 324718, "epoch": 3912} {"train_loss": -25.797760009765625, "global_step": 324719, "epoch": 3912} {"train_loss": -25.60939598083496, "global_step": 324720, "epoch": 3912} {"train_loss": -25.81673240661621, "global_step": 324721, "epoch": 3912} {"train_loss": -26.01405143737793, "global_step": 324722, "epoch": 3912} {"train_loss": -26.077951431274414, "global_step": 324723, "epoch": 3912} {"train_loss": -25.729536056518555, "global_step": 324724, "epoch": 3912} {"train_loss": -26.134170532226562, "global_step": 324725, "epoch": 3912} {"train_loss": -25.614404678344727, "global_step": 324726, "epoch": 3912} {"train_loss": -25.53641700744629, "global_step": 324727, "epoch": 3912} {"train_loss": -26.100217819213867, "global_step": 324728, "epoch": 3912} {"train_loss": -26.193044662475586, "global_step": 324729, "epoch": 3912} {"train_loss": -26.1304988861084, "global_step": 324730, "epoch": 3912} {"train_loss": -25.83694839477539, "global_step": 324731, "epoch": 3912} {"train_loss": -25.934972763061523, "global_step": 324732, "epoch": 3912} {"train_loss": -26.081510543823242, "global_step": 324733, "epoch": 3912} {"train_loss": -26.05023193359375, "global_step": 324734, "epoch": 3912} {"train_loss": -26.28314208984375, "global_step": 324735, "epoch": 3912} {"train_loss": -25.89215087890625, "global_step": 324736, "epoch": 3912} {"train_loss": -25.930816650390625, "global_step": 324737, "epoch": 3912} {"train_loss": -25.72348403930664, "global_step": 324738, "epoch": 3912} {"train_loss": -25.81534767150879, "global_step": 324739, "epoch": 3912} {"train_loss": -25.758947372436523, "global_step": 324740, "epoch": 3912} {"train_loss": -26.40949058532715, "global_step": 324741, "epoch": 3912} {"train_loss": -26.386493682861328, "global_step": 324742, "epoch": 3912} {"train_loss": -25.759206771850586, "global_step": 324743, "epoch": 3912} {"train_loss": -25.84111976623535, "global_step": 324744, "epoch": 3912} {"train_loss": -25.638477325439453, "global_step": 324745, "epoch": 3912} {"train_loss": -26.25591468811035, "global_step": 324746, "epoch": 3912} {"train_loss": -25.8817081451416, "global_step": 324747, "epoch": 3912} {"train_loss": -25.793222427368164, "global_step": 324748, "epoch": 3912} {"train_loss": -24.930612564086914, "global_step": 324749, "epoch": 3912} {"train_loss": -25.743513107299805, "global_step": 324750, "epoch": 3912} {"train_loss": -25.916095733642578, "global_step": 324751, "epoch": 3912} {"train_loss": -25.914594650268555, "global_step": 324752, "epoch": 3912} {"train_loss": -25.64240837097168, "global_step": 324753, "epoch": 3912} {"train_loss": -25.835601806640625, "global_step": 324754, "epoch": 3912} {"train_loss": -25.900421142578125, "global_step": 324755, "epoch": 3912} {"train_loss": -25.69072914123535, "global_step": 324756, "epoch": 3912} {"train_loss": -26.10787010192871, "global_step": 324757, "epoch": 3912} {"train_loss": -25.74664878845215, "global_step": 324758, "epoch": 3912} {"train_loss": -25.875288009643555, "global_step": 324759, "epoch": 3912} {"train_loss": -25.51544761657715, "global_step": 324760, "epoch": 3912} {"train_loss": -25.623172760009766, "global_step": 324761, "epoch": 3912} {"train_loss": -25.66843032836914, "global_step": 324762, "epoch": 3912} {"train_loss": -25.602176666259766, "global_step": 324763, "epoch": 3912} {"train_loss": -25.832799911499023, "global_step": 324764, "epoch": 3912} {"train_loss": -25.34712028503418, "global_step": 324765, "epoch": 3912} {"train_loss": -25.493383407592773, "global_step": 324766, "epoch": 3912} {"train_loss": -25.964908599853516, "global_step": 324767, "epoch": 3912} {"train_loss": -25.617889404296875, "global_step": 324768, "epoch": 3912} {"train_loss": -25.528562545776367, "global_step": 324769, "epoch": 3912} {"train_loss": -25.723901748657227, "global_step": 324770, "epoch": 3912} {"train_loss": -25.377887725830078, "global_step": 324771, "epoch": 3912} {"train_loss": -25.652801513671875, "global_step": 324772, "epoch": 3912} {"train_loss": -25.820844650268555, "global_step": 324773, "epoch": 3912} {"train_loss": -25.72859001159668, "global_step": 324774, "epoch": 3912} {"train_loss": -25.929641723632812, "global_step": 324775, "epoch": 3912} {"train_loss": -25.730478286743164, "global_step": 324776, "epoch": 3912} {"train_loss": -25.791645050048828, "global_step": 324777, "epoch": 3912} {"train_loss": -25.714637572506824, "global_step": 324778, "epoch": 3912, "val_loss": 7293873.0} {"train_loss": -25.62041664123535, "global_step": 324779, "epoch": 3913} {"train_loss": -25.584508895874023, "global_step": 324780, "epoch": 3913} {"train_loss": -25.742874145507812, "global_step": 324781, "epoch": 3913} {"train_loss": -25.7402400970459, "global_step": 324782, "epoch": 3913} {"train_loss": -26.1473445892334, "global_step": 324783, "epoch": 3913} {"train_loss": -25.918659210205078, "global_step": 324784, "epoch": 3913} {"train_loss": -25.998044967651367, "global_step": 324785, "epoch": 3913} {"train_loss": -25.7346248626709, "global_step": 324786, "epoch": 3913} {"train_loss": -26.026548385620117, "global_step": 324787, "epoch": 3913} {"train_loss": -25.840063095092773, "global_step": 324788, "epoch": 3913} {"train_loss": -26.092742919921875, "global_step": 324789, "epoch": 3913} {"train_loss": -26.328027725219727, "global_step": 324790, "epoch": 3913} {"train_loss": -25.70928382873535, "global_step": 324791, "epoch": 3913} {"train_loss": -25.797199249267578, "global_step": 324792, "epoch": 3913} {"train_loss": -25.897994995117188, "global_step": 324793, "epoch": 3913} {"train_loss": -25.86175537109375, "global_step": 324794, "epoch": 3913} {"train_loss": -26.135589599609375, "global_step": 324795, "epoch": 3913} {"train_loss": -25.81119155883789, "global_step": 324796, "epoch": 3913} {"train_loss": -25.638349533081055, "global_step": 324797, "epoch": 3913} {"train_loss": -26.028730392456055, "global_step": 324798, "epoch": 3913} {"train_loss": -26.222803115844727, "global_step": 324799, "epoch": 3913} {"train_loss": -25.8862247467041, "global_step": 324800, "epoch": 3913} {"train_loss": -25.857580184936523, "global_step": 324801, "epoch": 3913} {"train_loss": -25.66162109375, "global_step": 324802, "epoch": 3913} {"train_loss": -25.720800399780273, "global_step": 324803, "epoch": 3913} {"train_loss": -25.888574600219727, "global_step": 324804, "epoch": 3913} {"train_loss": -26.065763473510742, "global_step": 324805, "epoch": 3913} {"train_loss": -26.023950576782227, "global_step": 324806, "epoch": 3913} {"train_loss": -25.4880313873291, "global_step": 324807, "epoch": 3913} {"train_loss": -25.23495864868164, "global_step": 324808, "epoch": 3913} {"train_loss": -25.902530670166016, "global_step": 324809, "epoch": 3913} {"train_loss": -25.961645126342773, "global_step": 324810, "epoch": 3913} {"train_loss": -25.886545181274414, "global_step": 324811, "epoch": 3913} {"train_loss": -26.2820987701416, "global_step": 324812, "epoch": 3913} {"train_loss": -26.14393424987793, "global_step": 324813, "epoch": 3913} {"train_loss": -26.24835205078125, "global_step": 324814, "epoch": 3913} {"train_loss": -25.97895622253418, "global_step": 324815, "epoch": 3913} {"train_loss": -25.69403076171875, "global_step": 324816, "epoch": 3913} {"train_loss": -25.98748207092285, "global_step": 324817, "epoch": 3913} {"train_loss": -26.608869552612305, "global_step": 324818, "epoch": 3913} {"train_loss": -25.839792251586914, "global_step": 324819, "epoch": 3913} {"train_loss": -25.74722671508789, "global_step": 324820, "epoch": 3913} {"train_loss": -25.637113571166992, "global_step": 324821, "epoch": 3913} {"train_loss": -25.869800567626953, "global_step": 324822, "epoch": 3913} {"train_loss": -25.854598999023438, "global_step": 324823, "epoch": 3913} {"train_loss": -26.09295082092285, "global_step": 324824, "epoch": 3913} {"train_loss": -26.492279052734375, "global_step": 324825, "epoch": 3913} {"train_loss": -25.91352653503418, "global_step": 324826, "epoch": 3913} {"train_loss": -25.8433837890625, "global_step": 324827, "epoch": 3913} {"train_loss": -25.896997451782227, "global_step": 324828, "epoch": 3913} {"train_loss": -25.94189453125, "global_step": 324829, "epoch": 3913} {"train_loss": -25.932708740234375, "global_step": 324830, "epoch": 3913} {"train_loss": -26.015989303588867, "global_step": 324831, "epoch": 3913} {"train_loss": -25.844152450561523, "global_step": 324832, "epoch": 3913} {"train_loss": -25.90730094909668, "global_step": 324833, "epoch": 3913} {"train_loss": -26.49238395690918, "global_step": 324834, "epoch": 3913} {"train_loss": -26.157135009765625, "global_step": 324835, "epoch": 3913} {"train_loss": -25.99810218811035, "global_step": 324836, "epoch": 3913} {"train_loss": -25.76541519165039, "global_step": 324837, "epoch": 3913} {"train_loss": -25.563512802124023, "global_step": 324838, "epoch": 3913} {"train_loss": -26.05759620666504, "global_step": 324839, "epoch": 3913} {"train_loss": -26.126352310180664, "global_step": 324840, "epoch": 3913} {"train_loss": -25.6961727142334, "global_step": 324841, "epoch": 3913} {"train_loss": -26.066526412963867, "global_step": 324842, "epoch": 3913} {"train_loss": -25.774091720581055, "global_step": 324843, "epoch": 3913} {"train_loss": -25.821136474609375, "global_step": 324844, "epoch": 3913} {"train_loss": -25.45154571533203, "global_step": 324845, "epoch": 3913} {"train_loss": -25.645004272460938, "global_step": 324846, "epoch": 3913} {"train_loss": -25.770883560180664, "global_step": 324847, "epoch": 3913} {"train_loss": -25.319660186767578, "global_step": 324848, "epoch": 3913} {"train_loss": -25.606048583984375, "global_step": 324849, "epoch": 3913} {"train_loss": -25.80661392211914, "global_step": 324850, "epoch": 3913} {"train_loss": -25.675260543823242, "global_step": 324851, "epoch": 3913} {"train_loss": -25.656274795532227, "global_step": 324852, "epoch": 3913} {"train_loss": -25.498159408569336, "global_step": 324853, "epoch": 3913} {"train_loss": -26.025659561157227, "global_step": 324854, "epoch": 3913} {"train_loss": -25.591228485107422, "global_step": 324855, "epoch": 3913} {"train_loss": -25.522184371948242, "global_step": 324856, "epoch": 3913} {"train_loss": -25.809375762939453, "global_step": 324857, "epoch": 3913} {"train_loss": -25.369829177856445, "global_step": 324858, "epoch": 3913} {"train_loss": -25.96222496032715, "global_step": 324859, "epoch": 3913} {"train_loss": -25.70868492126465, "global_step": 324860, "epoch": 3913} {"train_loss": -25.859449570437512, "global_step": 324861, "epoch": 3913, "val_loss": 7174543.0} {"train_loss": -25.350345611572266, "global_step": 324862, "epoch": 3914} {"train_loss": -25.6849308013916, "global_step": 324863, "epoch": 3914} {"train_loss": -25.18697166442871, "global_step": 324864, "epoch": 3914} {"train_loss": -24.603469848632812, "global_step": 324865, "epoch": 3914} {"train_loss": -24.837350845336914, "global_step": 324866, "epoch": 3914} {"train_loss": -25.532793045043945, "global_step": 324867, "epoch": 3914} {"train_loss": -25.40266227722168, "global_step": 324868, "epoch": 3914} {"train_loss": -25.38855743408203, "global_step": 324869, "epoch": 3914} {"train_loss": -25.329090118408203, "global_step": 324870, "epoch": 3914} {"train_loss": -25.203275680541992, "global_step": 324871, "epoch": 3914} {"train_loss": -25.185760498046875, "global_step": 324872, "epoch": 3914} {"train_loss": -25.806461334228516, "global_step": 324873, "epoch": 3914} {"train_loss": -25.64657974243164, "global_step": 324874, "epoch": 3914} {"train_loss": -25.640399932861328, "global_step": 324875, "epoch": 3914} {"train_loss": -25.508752822875977, "global_step": 324876, "epoch": 3914} {"train_loss": -25.54859733581543, "global_step": 324877, "epoch": 3914} {"train_loss": -25.892541885375977, "global_step": 324878, "epoch": 3914} {"train_loss": -25.660558700561523, "global_step": 324879, "epoch": 3914} {"train_loss": -25.942235946655273, "global_step": 324880, "epoch": 3914} {"train_loss": -25.518863677978516, "global_step": 324881, "epoch": 3914} {"train_loss": -25.641965866088867, "global_step": 324882, "epoch": 3914} {"train_loss": -25.966169357299805, "global_step": 324883, "epoch": 3914} {"train_loss": -25.763107299804688, "global_step": 324884, "epoch": 3914} {"train_loss": -25.76698875427246, "global_step": 324885, "epoch": 3914} {"train_loss": -26.042861938476562, "global_step": 324886, "epoch": 3914} {"train_loss": -25.828161239624023, "global_step": 324887, "epoch": 3914} {"train_loss": -25.86382484436035, "global_step": 324888, "epoch": 3914} {"train_loss": -25.908374786376953, "global_step": 324889, "epoch": 3914} {"train_loss": -25.974517822265625, "global_step": 324890, "epoch": 3914} {"train_loss": -26.143091201782227, "global_step": 324891, "epoch": 3914} {"train_loss": -25.7659854888916, "global_step": 324892, "epoch": 3914} {"train_loss": -26.300642013549805, "global_step": 324893, "epoch": 3914} {"train_loss": -26.07679557800293, "global_step": 324894, "epoch": 3914} {"train_loss": -26.049081802368164, "global_step": 324895, "epoch": 3914} {"train_loss": -26.300718307495117, "global_step": 324896, "epoch": 3914} {"train_loss": -25.990875244140625, "global_step": 324897, "epoch": 3914} {"train_loss": -26.124393463134766, "global_step": 324898, "epoch": 3914} {"train_loss": -25.997634887695312, "global_step": 324899, "epoch": 3914} {"train_loss": -25.782018661499023, "global_step": 324900, "epoch": 3914} {"train_loss": -25.981098175048828, "global_step": 324901, "epoch": 3914} {"train_loss": -25.9703369140625, "global_step": 324902, "epoch": 3914} {"train_loss": -26.32370948791504, "global_step": 324903, "epoch": 3914} {"train_loss": -26.1420841217041, "global_step": 324904, "epoch": 3914} {"train_loss": -26.376144409179688, "global_step": 324905, "epoch": 3914} {"train_loss": -25.935728073120117, "global_step": 324906, "epoch": 3914} {"train_loss": -25.947952270507812, "global_step": 324907, "epoch": 3914} {"train_loss": -25.977991104125977, "global_step": 324908, "epoch": 3914} {"train_loss": -25.88165855407715, "global_step": 324909, "epoch": 3914} {"train_loss": -25.933393478393555, "global_step": 324910, "epoch": 3914} {"train_loss": -25.740753173828125, "global_step": 324911, "epoch": 3914} {"train_loss": -25.963422775268555, "global_step": 324912, "epoch": 3914} {"train_loss": -25.907590866088867, "global_step": 324913, "epoch": 3914} {"train_loss": -26.421743392944336, "global_step": 324914, "epoch": 3914} {"train_loss": -26.018604278564453, "global_step": 324915, "epoch": 3914} {"train_loss": -26.000768661499023, "global_step": 324916, "epoch": 3914} {"train_loss": -25.96735954284668, "global_step": 324917, "epoch": 3914} {"train_loss": -25.674304962158203, "global_step": 324918, "epoch": 3914} {"train_loss": -25.823022842407227, "global_step": 324919, "epoch": 3914} {"train_loss": -25.959970474243164, "global_step": 324920, "epoch": 3914} {"train_loss": -25.979522705078125, "global_step": 324921, "epoch": 3914} {"train_loss": -25.83794593811035, "global_step": 324922, "epoch": 3914} {"train_loss": -26.099950790405273, "global_step": 324923, "epoch": 3914} {"train_loss": -26.059432983398438, "global_step": 324924, "epoch": 3914} {"train_loss": -25.7641544342041, "global_step": 324925, "epoch": 3914} {"train_loss": -26.0939884185791, "global_step": 324926, "epoch": 3914} {"train_loss": -25.827367782592773, "global_step": 324927, "epoch": 3914} {"train_loss": -26.229150772094727, "global_step": 324928, "epoch": 3914} {"train_loss": -26.193008422851562, "global_step": 324929, "epoch": 3914} {"train_loss": -26.360916137695312, "global_step": 324930, "epoch": 3914} {"train_loss": -26.17535972595215, "global_step": 324931, "epoch": 3914} {"train_loss": -25.95159339904785, "global_step": 324932, "epoch": 3914} {"train_loss": -25.83338737487793, "global_step": 324933, "epoch": 3914} {"train_loss": -26.319915771484375, "global_step": 324934, "epoch": 3914} {"train_loss": -25.9815616607666, "global_step": 324935, "epoch": 3914} {"train_loss": -25.91650390625, "global_step": 324936, "epoch": 3914} {"train_loss": -25.866748809814453, "global_step": 324937, "epoch": 3914} {"train_loss": -26.038055419921875, "global_step": 324938, "epoch": 3914} {"train_loss": -26.15583610534668, "global_step": 324939, "epoch": 3914} {"train_loss": -26.128149032592773, "global_step": 324940, "epoch": 3914} {"train_loss": -25.98081398010254, "global_step": 324941, "epoch": 3914} {"train_loss": -25.950986862182617, "global_step": 324942, "epoch": 3914} {"train_loss": -26.129779815673828, "global_step": 324943, "epoch": 3914} {"train_loss": -25.8662275521152, "global_step": 324944, "epoch": 3914, "val_loss": 7215607.0} {"train_loss": -25.77056884765625, "global_step": 324945, "epoch": 3915} {"train_loss": -25.484920501708984, "global_step": 324946, "epoch": 3915} {"train_loss": -25.536725997924805, "global_step": 324947, "epoch": 3915} {"train_loss": -25.261030197143555, "global_step": 324948, "epoch": 3915} {"train_loss": -25.320354461669922, "global_step": 324949, "epoch": 3915} {"train_loss": -25.99518394470215, "global_step": 324950, "epoch": 3915} {"train_loss": -25.31681251525879, "global_step": 324951, "epoch": 3915} {"train_loss": -25.607654571533203, "global_step": 324952, "epoch": 3915} {"train_loss": -25.612506866455078, "global_step": 324953, "epoch": 3915} {"train_loss": -25.581554412841797, "global_step": 324954, "epoch": 3915} {"train_loss": -25.884784698486328, "global_step": 324955, "epoch": 3915} {"train_loss": -25.746143341064453, "global_step": 324956, "epoch": 3915} {"train_loss": -25.55714225769043, "global_step": 324957, "epoch": 3915} {"train_loss": -25.545957565307617, "global_step": 324958, "epoch": 3915} {"train_loss": -25.76899528503418, "global_step": 324959, "epoch": 3915} {"train_loss": -25.872446060180664, "global_step": 324960, "epoch": 3915} {"train_loss": -25.573368072509766, "global_step": 324961, "epoch": 3915} {"train_loss": -25.755964279174805, "global_step": 324962, "epoch": 3915} {"train_loss": -25.795562744140625, "global_step": 324963, "epoch": 3915} {"train_loss": -26.034692764282227, "global_step": 324964, "epoch": 3915} {"train_loss": -25.423786163330078, "global_step": 324965, "epoch": 3915} {"train_loss": -25.913557052612305, "global_step": 324966, "epoch": 3915} {"train_loss": -25.73200035095215, "global_step": 324967, "epoch": 3915} {"train_loss": -25.93171501159668, "global_step": 324968, "epoch": 3915} {"train_loss": -25.83497428894043, "global_step": 324969, "epoch": 3915} {"train_loss": -26.078458786010742, "global_step": 324970, "epoch": 3915} {"train_loss": -26.058765411376953, "global_step": 324971, "epoch": 3915} {"train_loss": -25.91717529296875, "global_step": 324972, "epoch": 3915} {"train_loss": -26.024423599243164, "global_step": 324973, "epoch": 3915} {"train_loss": -25.826208114624023, "global_step": 324974, "epoch": 3915} {"train_loss": -26.21978187561035, "global_step": 324975, "epoch": 3915} {"train_loss": -25.74873161315918, "global_step": 324976, "epoch": 3915} {"train_loss": -25.7974910736084, "global_step": 324977, "epoch": 3915} {"train_loss": -25.99015235900879, "global_step": 324978, "epoch": 3915} {"train_loss": -25.961322784423828, "global_step": 324979, "epoch": 3915} {"train_loss": -26.393390655517578, "global_step": 324980, "epoch": 3915} {"train_loss": -26.098684310913086, "global_step": 324981, "epoch": 3915} {"train_loss": -26.2393856048584, "global_step": 324982, "epoch": 3915} {"train_loss": -26.297998428344727, "global_step": 324983, "epoch": 3915} {"train_loss": -26.182422637939453, "global_step": 324984, "epoch": 3915} {"train_loss": -25.965559005737305, "global_step": 324985, "epoch": 3915} {"train_loss": -25.761396408081055, "global_step": 324986, "epoch": 3915} {"train_loss": -26.00372314453125, "global_step": 324987, "epoch": 3915} {"train_loss": -26.169391632080078, "global_step": 324988, "epoch": 3915} {"train_loss": -25.97743034362793, "global_step": 324989, "epoch": 3915} {"train_loss": -25.957355499267578, "global_step": 324990, "epoch": 3915} {"train_loss": -26.38373374938965, "global_step": 324991, "epoch": 3915} {"train_loss": -25.645105361938477, "global_step": 324992, "epoch": 3915} {"train_loss": -24.680402755737305, "global_step": 324993, "epoch": 3915} {"train_loss": -24.587974548339844, "global_step": 324994, "epoch": 3915} {"train_loss": -24.22867202758789, "global_step": 324995, "epoch": 3915} {"train_loss": -24.85931968688965, "global_step": 324996, "epoch": 3915} {"train_loss": -25.583444595336914, "global_step": 324997, "epoch": 3915} {"train_loss": -25.07672882080078, "global_step": 324998, "epoch": 3915} {"train_loss": -25.439125061035156, "global_step": 324999, "epoch": 3915} {"train_loss": -25.029687881469727, "global_step": 325000, "epoch": 3915} {"train_loss": -25.459308624267578, "global_step": 325001, "epoch": 3915} {"train_loss": -25.371726989746094, "global_step": 325002, "epoch": 3915} {"train_loss": -25.765323638916016, "global_step": 325003, "epoch": 3915} {"train_loss": -25.162485122680664, "global_step": 325004, "epoch": 3915} {"train_loss": -25.309341430664062, "global_step": 325005, "epoch": 3915} {"train_loss": -25.64851951599121, "global_step": 325006, "epoch": 3915} {"train_loss": -25.42415428161621, "global_step": 325007, "epoch": 3915} {"train_loss": -25.41517448425293, "global_step": 325008, "epoch": 3915} {"train_loss": -25.758352279663086, "global_step": 325009, "epoch": 3915} {"train_loss": -25.901899337768555, "global_step": 325010, "epoch": 3915} {"train_loss": -26.11675453186035, "global_step": 325011, "epoch": 3915} {"train_loss": -25.953779220581055, "global_step": 325012, "epoch": 3915} {"train_loss": -25.329519271850586, "global_step": 325013, "epoch": 3915} {"train_loss": -25.800277709960938, "global_step": 325014, "epoch": 3915} {"train_loss": -25.47748565673828, "global_step": 325015, "epoch": 3915} {"train_loss": -25.95552635192871, "global_step": 325016, "epoch": 3915} {"train_loss": -25.78676414489746, "global_step": 325017, "epoch": 3915} {"train_loss": -25.90283203125, "global_step": 325018, "epoch": 3915} {"train_loss": -25.92302894592285, "global_step": 325019, "epoch": 3915} {"train_loss": -25.667465209960938, "global_step": 325020, "epoch": 3915} {"train_loss": -25.83038330078125, "global_step": 325021, "epoch": 3915} {"train_loss": -25.707380294799805, "global_step": 325022, "epoch": 3915} {"train_loss": -25.97535514831543, "global_step": 325023, "epoch": 3915} {"train_loss": -26.213748931884766, "global_step": 325024, "epoch": 3915} {"train_loss": -25.601043701171875, "global_step": 325025, "epoch": 3915} {"train_loss": -25.681324005126953, "global_step": 325026, "epoch": 3915} {"train_loss": -25.71152464165745, "global_step": 325027, "epoch": 3915, "val_loss": 7232471.0} {"train_loss": -25.408626556396484, "global_step": 325028, "epoch": 3916} {"train_loss": -25.48299217224121, "global_step": 325029, "epoch": 3916} {"train_loss": -25.416152954101562, "global_step": 325030, "epoch": 3916} {"train_loss": -26.014068603515625, "global_step": 325031, "epoch": 3916} {"train_loss": -25.849201202392578, "global_step": 325032, "epoch": 3916} {"train_loss": -25.540842056274414, "global_step": 325033, "epoch": 3916} {"train_loss": -25.7962703704834, "global_step": 325034, "epoch": 3916} {"train_loss": -25.680143356323242, "global_step": 325035, "epoch": 3916} {"train_loss": -25.6053409576416, "global_step": 325036, "epoch": 3916} {"train_loss": -25.72189712524414, "global_step": 325037, "epoch": 3916} {"train_loss": -25.787540435791016, "global_step": 325038, "epoch": 3916} {"train_loss": -25.54096221923828, "global_step": 325039, "epoch": 3916} {"train_loss": -25.861438751220703, "global_step": 325040, "epoch": 3916} {"train_loss": -25.506881713867188, "global_step": 325041, "epoch": 3916} {"train_loss": -25.699447631835938, "global_step": 325042, "epoch": 3916} {"train_loss": -25.787439346313477, "global_step": 325043, "epoch": 3916} {"train_loss": -26.281997680664062, "global_step": 325044, "epoch": 3916} {"train_loss": -25.831226348876953, "global_step": 325045, "epoch": 3916} {"train_loss": -26.12531852722168, "global_step": 325046, "epoch": 3916} {"train_loss": -25.843143463134766, "global_step": 325047, "epoch": 3916} {"train_loss": -25.60055923461914, "global_step": 325048, "epoch": 3916} {"train_loss": -25.812299728393555, "global_step": 325049, "epoch": 3916} {"train_loss": -26.125680923461914, "global_step": 325050, "epoch": 3916} {"train_loss": -25.543012619018555, "global_step": 325051, "epoch": 3916} {"train_loss": -26.104421615600586, "global_step": 325052, "epoch": 3916} {"train_loss": -25.648035049438477, "global_step": 325053, "epoch": 3916} {"train_loss": -25.83355712890625, "global_step": 325054, "epoch": 3916} {"train_loss": -25.77959632873535, "global_step": 325055, "epoch": 3916} {"train_loss": -25.55793571472168, "global_step": 325056, "epoch": 3916} {"train_loss": -25.839223861694336, "global_step": 325057, "epoch": 3916} {"train_loss": -26.001056671142578, "global_step": 325058, "epoch": 3916} {"train_loss": -25.84885025024414, "global_step": 325059, "epoch": 3916} {"train_loss": -26.090612411499023, "global_step": 325060, "epoch": 3916} {"train_loss": -26.00080680847168, "global_step": 325061, "epoch": 3916} {"train_loss": -26.077777862548828, "global_step": 325062, "epoch": 3916} {"train_loss": -25.419788360595703, "global_step": 325063, "epoch": 3916} {"train_loss": -25.39361000061035, "global_step": 325064, "epoch": 3916} {"train_loss": -25.528690338134766, "global_step": 325065, "epoch": 3916} {"train_loss": -25.813751220703125, "global_step": 325066, "epoch": 3916} {"train_loss": -25.621244430541992, "global_step": 325067, "epoch": 3916} {"train_loss": -25.249393463134766, "global_step": 325068, "epoch": 3916} {"train_loss": -25.90802574157715, "global_step": 325069, "epoch": 3916} {"train_loss": -25.886707305908203, "global_step": 325070, "epoch": 3916} {"train_loss": -25.8439884185791, "global_step": 325071, "epoch": 3916} {"train_loss": -25.847585678100586, "global_step": 325072, "epoch": 3916} {"train_loss": -25.915119171142578, "global_step": 325073, "epoch": 3916} {"train_loss": -26.319211959838867, "global_step": 325074, "epoch": 3916} {"train_loss": -26.113401412963867, "global_step": 325075, "epoch": 3916} {"train_loss": -25.861648559570312, "global_step": 325076, "epoch": 3916} {"train_loss": -26.018163681030273, "global_step": 325077, "epoch": 3916} {"train_loss": -25.91937828063965, "global_step": 325078, "epoch": 3916} {"train_loss": -25.66651725769043, "global_step": 325079, "epoch": 3916} {"train_loss": -26.18265151977539, "global_step": 325080, "epoch": 3916} {"train_loss": -25.816816329956055, "global_step": 325081, "epoch": 3916} {"train_loss": -25.577686309814453, "global_step": 325082, "epoch": 3916} {"train_loss": -25.971776962280273, "global_step": 325083, "epoch": 3916} {"train_loss": -25.825000762939453, "global_step": 325084, "epoch": 3916} {"train_loss": -26.102270126342773, "global_step": 325085, "epoch": 3916} {"train_loss": -25.956541061401367, "global_step": 325086, "epoch": 3916} {"train_loss": -26.0151309967041, "global_step": 325087, "epoch": 3916} {"train_loss": -26.15766716003418, "global_step": 325088, "epoch": 3916} {"train_loss": -26.41693115234375, "global_step": 325089, "epoch": 3916} {"train_loss": -26.195886611938477, "global_step": 325090, "epoch": 3916} {"train_loss": -26.090396881103516, "global_step": 325091, "epoch": 3916} {"train_loss": -26.202091217041016, "global_step": 325092, "epoch": 3916} {"train_loss": -26.043476104736328, "global_step": 325093, "epoch": 3916} {"train_loss": -25.964487075805664, "global_step": 325094, "epoch": 3916} {"train_loss": -26.122243881225586, "global_step": 325095, "epoch": 3916} {"train_loss": -25.990772247314453, "global_step": 325096, "epoch": 3916} {"train_loss": -26.278268814086914, "global_step": 325097, "epoch": 3916} {"train_loss": -26.050031661987305, "global_step": 325098, "epoch": 3916} {"train_loss": -26.233917236328125, "global_step": 325099, "epoch": 3916} {"train_loss": -25.460342407226562, "global_step": 325100, "epoch": 3916} {"train_loss": -25.640111923217773, "global_step": 325101, "epoch": 3916} {"train_loss": -25.489500045776367, "global_step": 325102, "epoch": 3916} {"train_loss": -25.507596969604492, "global_step": 325103, "epoch": 3916} {"train_loss": -25.902908325195312, "global_step": 325104, "epoch": 3916} {"train_loss": -26.047468185424805, "global_step": 325105, "epoch": 3916} {"train_loss": -25.8040828704834, "global_step": 325106, "epoch": 3916} {"train_loss": -25.62031364440918, "global_step": 325107, "epoch": 3916} {"train_loss": -26.003644943237305, "global_step": 325108, "epoch": 3916} {"train_loss": -26.44837760925293, "global_step": 325109, "epoch": 3916} {"train_loss": -25.862332930047828, "global_step": 325110, "epoch": 3916, "val_loss": 7245548.0} {"train_loss": -25.681079864501953, "global_step": 325111, "epoch": 3917} {"train_loss": -25.529172897338867, "global_step": 325112, "epoch": 3917} {"train_loss": -25.635839462280273, "global_step": 325113, "epoch": 3917} {"train_loss": -25.4162654876709, "global_step": 325114, "epoch": 3917} {"train_loss": -25.674392700195312, "global_step": 325115, "epoch": 3917} {"train_loss": -25.663129806518555, "global_step": 325116, "epoch": 3917} {"train_loss": -25.59377670288086, "global_step": 325117, "epoch": 3917} {"train_loss": -25.611560821533203, "global_step": 325118, "epoch": 3917} {"train_loss": -25.576580047607422, "global_step": 325119, "epoch": 3917} {"train_loss": -25.89568519592285, "global_step": 325120, "epoch": 3917} {"train_loss": -25.965978622436523, "global_step": 325121, "epoch": 3917} {"train_loss": -25.680429458618164, "global_step": 325122, "epoch": 3917} {"train_loss": -25.841222763061523, "global_step": 325123, "epoch": 3917} {"train_loss": -25.70672035217285, "global_step": 325124, "epoch": 3917} {"train_loss": -25.36622428894043, "global_step": 325125, "epoch": 3917} {"train_loss": -25.570253372192383, "global_step": 325126, "epoch": 3917} {"train_loss": -25.56403160095215, "global_step": 325127, "epoch": 3917} {"train_loss": -25.999021530151367, "global_step": 325128, "epoch": 3917} {"train_loss": -25.622968673706055, "global_step": 325129, "epoch": 3917} {"train_loss": -25.322599411010742, "global_step": 325130, "epoch": 3917} {"train_loss": -26.058080673217773, "global_step": 325131, "epoch": 3917} {"train_loss": -25.598663330078125, "global_step": 325132, "epoch": 3917} {"train_loss": -25.812742233276367, "global_step": 325133, "epoch": 3917} {"train_loss": -25.6446475982666, "global_step": 325134, "epoch": 3917} {"train_loss": -25.945714950561523, "global_step": 325135, "epoch": 3917} {"train_loss": -25.647052764892578, "global_step": 325136, "epoch": 3917} {"train_loss": -25.580747604370117, "global_step": 325137, "epoch": 3917} {"train_loss": -25.719785690307617, "global_step": 325138, "epoch": 3917} {"train_loss": -25.57065200805664, "global_step": 325139, "epoch": 3917} {"train_loss": -25.533281326293945, "global_step": 325140, "epoch": 3917} {"train_loss": -25.996814727783203, "global_step": 325141, "epoch": 3917} {"train_loss": -25.71956443786621, "global_step": 325142, "epoch": 3917} {"train_loss": -25.69623374938965, "global_step": 325143, "epoch": 3917} {"train_loss": -26.023151397705078, "global_step": 325144, "epoch": 3917} {"train_loss": -25.75362205505371, "global_step": 325145, "epoch": 3917} {"train_loss": -26.143171310424805, "global_step": 325146, "epoch": 3917} {"train_loss": -25.941659927368164, "global_step": 325147, "epoch": 3917} {"train_loss": -25.875070571899414, "global_step": 325148, "epoch": 3917} {"train_loss": -25.55451011657715, "global_step": 325149, "epoch": 3917} {"train_loss": -25.777957916259766, "global_step": 325150, "epoch": 3917} {"train_loss": -25.51540184020996, "global_step": 325151, "epoch": 3917} {"train_loss": -26.000629425048828, "global_step": 325152, "epoch": 3917} {"train_loss": -25.91314697265625, "global_step": 325153, "epoch": 3917} {"train_loss": -26.09685707092285, "global_step": 325154, "epoch": 3917} {"train_loss": -25.97797203063965, "global_step": 325155, "epoch": 3917} {"train_loss": -25.8840389251709, "global_step": 325156, "epoch": 3917} {"train_loss": -25.536643981933594, "global_step": 325157, "epoch": 3917} {"train_loss": -25.749460220336914, "global_step": 325158, "epoch": 3917} {"train_loss": -25.642566680908203, "global_step": 325159, "epoch": 3917} {"train_loss": -25.695941925048828, "global_step": 325160, "epoch": 3917} {"train_loss": -25.9351806640625, "global_step": 325161, "epoch": 3917} {"train_loss": -25.721342086791992, "global_step": 325162, "epoch": 3917} {"train_loss": -25.82074546813965, "global_step": 325163, "epoch": 3917} {"train_loss": -25.468982696533203, "global_step": 325164, "epoch": 3917} {"train_loss": -25.825653076171875, "global_step": 325165, "epoch": 3917} {"train_loss": -25.9985294342041, "global_step": 325166, "epoch": 3917} {"train_loss": -26.09394645690918, "global_step": 325167, "epoch": 3917} {"train_loss": -25.972387313842773, "global_step": 325168, "epoch": 3917} {"train_loss": -26.16277503967285, "global_step": 325169, "epoch": 3917} {"train_loss": -25.937524795532227, "global_step": 325170, "epoch": 3917} {"train_loss": -26.100317001342773, "global_step": 325171, "epoch": 3917} {"train_loss": -26.064468383789062, "global_step": 325172, "epoch": 3917} {"train_loss": -25.914941787719727, "global_step": 325173, "epoch": 3917} {"train_loss": -26.252370834350586, "global_step": 325174, "epoch": 3917} {"train_loss": -26.232131958007812, "global_step": 325175, "epoch": 3917} {"train_loss": -25.96132469177246, "global_step": 325176, "epoch": 3917} {"train_loss": -26.104047775268555, "global_step": 325177, "epoch": 3917} {"train_loss": -25.983753204345703, "global_step": 325178, "epoch": 3917} {"train_loss": -25.90595817565918, "global_step": 325179, "epoch": 3917} {"train_loss": -26.51190185546875, "global_step": 325180, "epoch": 3917} {"train_loss": -25.91288185119629, "global_step": 325181, "epoch": 3917} {"train_loss": -25.48031997680664, "global_step": 325182, "epoch": 3917} {"train_loss": -25.628904342651367, "global_step": 325183, "epoch": 3917} {"train_loss": -25.357755661010742, "global_step": 325184, "epoch": 3917} {"train_loss": -24.99111557006836, "global_step": 325185, "epoch": 3917} {"train_loss": -25.6654052734375, "global_step": 325186, "epoch": 3917} {"train_loss": -25.689361572265625, "global_step": 325187, "epoch": 3917} {"train_loss": -25.855554580688477, "global_step": 325188, "epoch": 3917} {"train_loss": -25.87367057800293, "global_step": 325189, "epoch": 3917} {"train_loss": -25.43085289001465, "global_step": 325190, "epoch": 3917} {"train_loss": -25.554067611694336, "global_step": 325191, "epoch": 3917} {"train_loss": -25.477394104003906, "global_step": 325192, "epoch": 3917} {"train_loss": -25.793862469225044, "global_step": 325193, "epoch": 3917, "val_loss": 7333672.0} {"train_loss": -25.58510398864746, "global_step": 325194, "epoch": 3918} {"train_loss": -25.78021812438965, "global_step": 325195, "epoch": 3918} {"train_loss": -25.81721305847168, "global_step": 325196, "epoch": 3918} {"train_loss": -25.258441925048828, "global_step": 325197, "epoch": 3918} {"train_loss": -26.036041259765625, "global_step": 325198, "epoch": 3918} {"train_loss": -25.68768310546875, "global_step": 325199, "epoch": 3918} {"train_loss": -25.631561279296875, "global_step": 325200, "epoch": 3918} {"train_loss": -25.47342300415039, "global_step": 325201, "epoch": 3918} {"train_loss": -25.7764892578125, "global_step": 325202, "epoch": 3918} {"train_loss": -25.550399780273438, "global_step": 325203, "epoch": 3918} {"train_loss": -25.577741622924805, "global_step": 325204, "epoch": 3918} {"train_loss": -25.49043846130371, "global_step": 325205, "epoch": 3918} {"train_loss": -25.530630111694336, "global_step": 325206, "epoch": 3918} {"train_loss": -25.57888412475586, "global_step": 325207, "epoch": 3918} {"train_loss": -25.64471435546875, "global_step": 325208, "epoch": 3918} {"train_loss": -25.722854614257812, "global_step": 325209, "epoch": 3918} {"train_loss": -25.826135635375977, "global_step": 325210, "epoch": 3918} {"train_loss": -25.605823516845703, "global_step": 325211, "epoch": 3918} {"train_loss": -25.794845581054688, "global_step": 325212, "epoch": 3918} {"train_loss": -25.975202560424805, "global_step": 325213, "epoch": 3918} {"train_loss": -26.12174415588379, "global_step": 325214, "epoch": 3918} {"train_loss": -26.14179039001465, "global_step": 325215, "epoch": 3918} {"train_loss": -25.768171310424805, "global_step": 325216, "epoch": 3918} {"train_loss": -25.77190589904785, "global_step": 325217, "epoch": 3918} {"train_loss": -26.168745040893555, "global_step": 325218, "epoch": 3918} {"train_loss": -25.636159896850586, "global_step": 325219, "epoch": 3918} {"train_loss": -25.729238510131836, "global_step": 325220, "epoch": 3918} {"train_loss": -25.592063903808594, "global_step": 325221, "epoch": 3918} {"train_loss": -25.76800537109375, "global_step": 325222, "epoch": 3918} {"train_loss": -25.97593116760254, "global_step": 325223, "epoch": 3918} {"train_loss": -25.914819717407227, "global_step": 325224, "epoch": 3918} {"train_loss": -26.165069580078125, "global_step": 325225, "epoch": 3918} {"train_loss": -26.05034828186035, "global_step": 325226, "epoch": 3918} {"train_loss": -26.0541934967041, "global_step": 325227, "epoch": 3918} {"train_loss": -25.713163375854492, "global_step": 325228, "epoch": 3918} {"train_loss": -25.662887573242188, "global_step": 325229, "epoch": 3918} {"train_loss": -25.850757598876953, "global_step": 325230, "epoch": 3918} {"train_loss": -26.223846435546875, "global_step": 325231, "epoch": 3918} {"train_loss": -25.51654624938965, "global_step": 325232, "epoch": 3918} {"train_loss": -26.34613609313965, "global_step": 325233, "epoch": 3918} {"train_loss": -25.979154586791992, "global_step": 325234, "epoch": 3918} {"train_loss": -25.800451278686523, "global_step": 325235, "epoch": 3918} {"train_loss": -26.0775203704834, "global_step": 325236, "epoch": 3918} {"train_loss": -26.297290802001953, "global_step": 325237, "epoch": 3918} {"train_loss": -26.15601921081543, "global_step": 325238, "epoch": 3918} {"train_loss": -25.973804473876953, "global_step": 325239, "epoch": 3918} {"train_loss": -26.03561782836914, "global_step": 325240, "epoch": 3918} {"train_loss": -26.019758224487305, "global_step": 325241, "epoch": 3918} {"train_loss": -25.980859756469727, "global_step": 325242, "epoch": 3918} {"train_loss": -26.171985626220703, "global_step": 325243, "epoch": 3918} {"train_loss": -25.969562530517578, "global_step": 325244, "epoch": 3918} {"train_loss": -26.02118492126465, "global_step": 325245, "epoch": 3918} {"train_loss": -25.70066261291504, "global_step": 325246, "epoch": 3918} {"train_loss": -26.164514541625977, "global_step": 325247, "epoch": 3918} {"train_loss": -26.165058135986328, "global_step": 325248, "epoch": 3918} {"train_loss": -25.826858520507812, "global_step": 325249, "epoch": 3918} {"train_loss": -26.165380477905273, "global_step": 325250, "epoch": 3918} {"train_loss": -26.08021354675293, "global_step": 325251, "epoch": 3918} {"train_loss": -25.532094955444336, "global_step": 325252, "epoch": 3918} {"train_loss": -26.272382736206055, "global_step": 325253, "epoch": 3918} {"train_loss": -25.962854385375977, "global_step": 325254, "epoch": 3918} {"train_loss": -25.575651168823242, "global_step": 325255, "epoch": 3918} {"train_loss": -25.9130916595459, "global_step": 325256, "epoch": 3918} {"train_loss": -25.65838050842285, "global_step": 325257, "epoch": 3918} {"train_loss": -26.049108505249023, "global_step": 325258, "epoch": 3918} {"train_loss": -25.99442481994629, "global_step": 325259, "epoch": 3918} {"train_loss": -26.298492431640625, "global_step": 325260, "epoch": 3918} {"train_loss": -26.129377365112305, "global_step": 325261, "epoch": 3918} {"train_loss": -25.718109130859375, "global_step": 325262, "epoch": 3918} {"train_loss": -25.852575302124023, "global_step": 325263, "epoch": 3918} {"train_loss": -25.898752212524414, "global_step": 325264, "epoch": 3918} {"train_loss": -25.70667839050293, "global_step": 325265, "epoch": 3918} {"train_loss": -25.8270263671875, "global_step": 325266, "epoch": 3918} {"train_loss": -26.219329833984375, "global_step": 325267, "epoch": 3918} {"train_loss": -26.220184326171875, "global_step": 325268, "epoch": 3918} {"train_loss": -25.865636825561523, "global_step": 325269, "epoch": 3918} {"train_loss": -25.997058868408203, "global_step": 325270, "epoch": 3918} {"train_loss": -25.89582633972168, "global_step": 325271, "epoch": 3918} {"train_loss": -26.269174575805664, "global_step": 325272, "epoch": 3918} {"train_loss": -26.048070907592773, "global_step": 325273, "epoch": 3918} {"train_loss": -25.8616943359375, "global_step": 325274, "epoch": 3918} {"train_loss": -25.714435577392578, "global_step": 325275, "epoch": 3918} {"train_loss": -25.89509511281209, "global_step": 325276, "epoch": 3918, "val_loss": 7258821.0} {"train_loss": -25.733007431030273, "global_step": 325277, "epoch": 3919} {"train_loss": -24.940195083618164, "global_step": 325278, "epoch": 3919} {"train_loss": -25.696699142456055, "global_step": 325279, "epoch": 3919} {"train_loss": -25.922199249267578, "global_step": 325280, "epoch": 3919} {"train_loss": -25.07294273376465, "global_step": 325281, "epoch": 3919} {"train_loss": -25.707843780517578, "global_step": 325282, "epoch": 3919} {"train_loss": -25.484111785888672, "global_step": 325283, "epoch": 3919} {"train_loss": -25.477584838867188, "global_step": 325284, "epoch": 3919} {"train_loss": -25.343608856201172, "global_step": 325285, "epoch": 3919} {"train_loss": -25.56499671936035, "global_step": 325286, "epoch": 3919} {"train_loss": -25.657180786132812, "global_step": 325287, "epoch": 3919} {"train_loss": -25.9114933013916, "global_step": 325288, "epoch": 3919} {"train_loss": -25.509538650512695, "global_step": 325289, "epoch": 3919} {"train_loss": -25.5929012298584, "global_step": 325290, "epoch": 3919} {"train_loss": -25.514028549194336, "global_step": 325291, "epoch": 3919} {"train_loss": -26.08198356628418, "global_step": 325292, "epoch": 3919} {"train_loss": -25.84111976623535, "global_step": 325293, "epoch": 3919} {"train_loss": -25.95582389831543, "global_step": 325294, "epoch": 3919} {"train_loss": -25.880163192749023, "global_step": 325295, "epoch": 3919} {"train_loss": -26.137115478515625, "global_step": 325296, "epoch": 3919} {"train_loss": -25.852079391479492, "global_step": 325297, "epoch": 3919} {"train_loss": -26.118030548095703, "global_step": 325298, "epoch": 3919} {"train_loss": -25.80584716796875, "global_step": 325299, "epoch": 3919} {"train_loss": -25.82322120666504, "global_step": 325300, "epoch": 3919} {"train_loss": -25.983823776245117, "global_step": 325301, "epoch": 3919} {"train_loss": -26.186237335205078, "global_step": 325302, "epoch": 3919} {"train_loss": -26.093677520751953, "global_step": 325303, "epoch": 3919} {"train_loss": -26.021438598632812, "global_step": 325304, "epoch": 3919} {"train_loss": -25.82147216796875, "global_step": 325305, "epoch": 3919} {"train_loss": -26.087142944335938, "global_step": 325306, "epoch": 3919} {"train_loss": -26.12091636657715, "global_step": 325307, "epoch": 3919} {"train_loss": -26.055105209350586, "global_step": 325308, "epoch": 3919} {"train_loss": -26.23603630065918, "global_step": 325309, "epoch": 3919} {"train_loss": -25.775726318359375, "global_step": 325310, "epoch": 3919} {"train_loss": -26.069263458251953, "global_step": 325311, "epoch": 3919} {"train_loss": -25.916242599487305, "global_step": 325312, "epoch": 3919} {"train_loss": -26.521713256835938, "global_step": 325313, "epoch": 3919} {"train_loss": -26.235260009765625, "global_step": 325314, "epoch": 3919} {"train_loss": -25.757654190063477, "global_step": 325315, "epoch": 3919} {"train_loss": -26.55356216430664, "global_step": 325316, "epoch": 3919} {"train_loss": -25.9055118560791, "global_step": 325317, "epoch": 3919} {"train_loss": -25.959264755249023, "global_step": 325318, "epoch": 3919} {"train_loss": -25.705856323242188, "global_step": 325319, "epoch": 3919} {"train_loss": -25.798730850219727, "global_step": 325320, "epoch": 3919} {"train_loss": -26.291675567626953, "global_step": 325321, "epoch": 3919} {"train_loss": -25.942890167236328, "global_step": 325322, "epoch": 3919} {"train_loss": -25.60577392578125, "global_step": 325323, "epoch": 3919} {"train_loss": -25.463363647460938, "global_step": 325324, "epoch": 3919} {"train_loss": -25.586502075195312, "global_step": 325325, "epoch": 3919} {"train_loss": -25.587305068969727, "global_step": 325326, "epoch": 3919} {"train_loss": -25.76775550842285, "global_step": 325327, "epoch": 3919} {"train_loss": -25.89405632019043, "global_step": 325328, "epoch": 3919} {"train_loss": -25.225412368774414, "global_step": 325329, "epoch": 3919} {"train_loss": -25.995655059814453, "global_step": 325330, "epoch": 3919} {"train_loss": -26.035449981689453, "global_step": 325331, "epoch": 3919} {"train_loss": -25.868122100830078, "global_step": 325332, "epoch": 3919} {"train_loss": -25.808185577392578, "global_step": 325333, "epoch": 3919} {"train_loss": -26.167041778564453, "global_step": 325334, "epoch": 3919} {"train_loss": -25.833698272705078, "global_step": 325335, "epoch": 3919} {"train_loss": -26.000654220581055, "global_step": 325336, "epoch": 3919} {"train_loss": -25.777698516845703, "global_step": 325337, "epoch": 3919} {"train_loss": -25.707441329956055, "global_step": 325338, "epoch": 3919} {"train_loss": -25.76155662536621, "global_step": 325339, "epoch": 3919} {"train_loss": -26.05853271484375, "global_step": 325340, "epoch": 3919} {"train_loss": -25.823694229125977, "global_step": 325341, "epoch": 3919} {"train_loss": -25.86773109436035, "global_step": 325342, "epoch": 3919} {"train_loss": -25.996023178100586, "global_step": 325343, "epoch": 3919} {"train_loss": -25.90647315979004, "global_step": 325344, "epoch": 3919} {"train_loss": -26.125051498413086, "global_step": 325345, "epoch": 3919} {"train_loss": -25.899877548217773, "global_step": 325346, "epoch": 3919} {"train_loss": -25.981719970703125, "global_step": 325347, "epoch": 3919} {"train_loss": -26.147192001342773, "global_step": 325348, "epoch": 3919} {"train_loss": -26.024023056030273, "global_step": 325349, "epoch": 3919} {"train_loss": -25.793729782104492, "global_step": 325350, "epoch": 3919} {"train_loss": -26.384231567382812, "global_step": 325351, "epoch": 3919} {"train_loss": -26.107824325561523, "global_step": 325352, "epoch": 3919} {"train_loss": -25.870468139648438, "global_step": 325353, "epoch": 3919} {"train_loss": -25.869720458984375, "global_step": 325354, "epoch": 3919} {"train_loss": -25.952564239501953, "global_step": 325355, "epoch": 3919} {"train_loss": -26.131704330444336, "global_step": 325356, "epoch": 3919} {"train_loss": -26.300983428955078, "global_step": 325357, "epoch": 3919} {"train_loss": -26.351499557495117, "global_step": 325358, "epoch": 3919} {"train_loss": -25.884805265679418, "global_step": 325359, "epoch": 3919, "val_loss": 7315002.0} {"train_loss": -25.86310386657715, "global_step": 325360, "epoch": 3920} {"train_loss": -25.260112762451172, "global_step": 325361, "epoch": 3920} {"train_loss": -25.310306549072266, "global_step": 325362, "epoch": 3920} {"train_loss": -25.795246124267578, "global_step": 325363, "epoch": 3920} {"train_loss": -25.611591339111328, "global_step": 325364, "epoch": 3920} {"train_loss": -25.8515682220459, "global_step": 325365, "epoch": 3920} {"train_loss": -25.49335289001465, "global_step": 325366, "epoch": 3920} {"train_loss": -25.7800235748291, "global_step": 325367, "epoch": 3920} {"train_loss": -25.582473754882812, "global_step": 325368, "epoch": 3920} {"train_loss": -25.9053897857666, "global_step": 325369, "epoch": 3920} {"train_loss": -25.965124130249023, "global_step": 325370, "epoch": 3920} {"train_loss": -26.147480010986328, "global_step": 325371, "epoch": 3920} {"train_loss": -25.385412216186523, "global_step": 325372, "epoch": 3920} {"train_loss": -25.663549423217773, "global_step": 325373, "epoch": 3920} {"train_loss": -25.531503677368164, "global_step": 325374, "epoch": 3920} {"train_loss": -25.740386962890625, "global_step": 325375, "epoch": 3920} {"train_loss": -26.000268936157227, "global_step": 325376, "epoch": 3920} {"train_loss": -26.072797775268555, "global_step": 325377, "epoch": 3920} {"train_loss": -26.161710739135742, "global_step": 325378, "epoch": 3920} {"train_loss": -25.91814613342285, "global_step": 325379, "epoch": 3920} {"train_loss": -25.92560386657715, "global_step": 325380, "epoch": 3920} {"train_loss": -26.195425033569336, "global_step": 325381, "epoch": 3920} {"train_loss": -26.110370635986328, "global_step": 325382, "epoch": 3920} {"train_loss": -26.030370712280273, "global_step": 325383, "epoch": 3920} {"train_loss": -25.996967315673828, "global_step": 325384, "epoch": 3920} {"train_loss": -25.720611572265625, "global_step": 325385, "epoch": 3920} {"train_loss": -25.81319236755371, "global_step": 325386, "epoch": 3920} {"train_loss": -25.619495391845703, "global_step": 325387, "epoch": 3920} {"train_loss": -26.01507568359375, "global_step": 325388, "epoch": 3920} {"train_loss": -25.852527618408203, "global_step": 325389, "epoch": 3920} {"train_loss": -25.705951690673828, "global_step": 325390, "epoch": 3920} {"train_loss": -25.690759658813477, "global_step": 325391, "epoch": 3920} {"train_loss": -25.829315185546875, "global_step": 325392, "epoch": 3920} {"train_loss": -25.894208908081055, "global_step": 325393, "epoch": 3920} {"train_loss": -25.542356491088867, "global_step": 325394, "epoch": 3920} {"train_loss": -26.198474884033203, "global_step": 325395, "epoch": 3920} {"train_loss": -25.76670265197754, "global_step": 325396, "epoch": 3920} {"train_loss": -25.7509708404541, "global_step": 325397, "epoch": 3920} {"train_loss": -26.133777618408203, "global_step": 325398, "epoch": 3920} {"train_loss": -26.144330978393555, "global_step": 325399, "epoch": 3920} {"train_loss": -25.74202537536621, "global_step": 325400, "epoch": 3920} {"train_loss": -26.14007568359375, "global_step": 325401, "epoch": 3920} {"train_loss": -25.847660064697266, "global_step": 325402, "epoch": 3920} {"train_loss": -25.973546981811523, "global_step": 325403, "epoch": 3920} {"train_loss": -25.826419830322266, "global_step": 325404, "epoch": 3920} {"train_loss": -25.750959396362305, "global_step": 325405, "epoch": 3920} {"train_loss": -25.681640625, "global_step": 325406, "epoch": 3920} {"train_loss": -25.988691329956055, "global_step": 325407, "epoch": 3920} {"train_loss": -25.727426528930664, "global_step": 325408, "epoch": 3920} {"train_loss": -25.85529899597168, "global_step": 325409, "epoch": 3920} {"train_loss": -26.26395034790039, "global_step": 325410, "epoch": 3920} {"train_loss": -25.877975463867188, "global_step": 325411, "epoch": 3920} {"train_loss": -26.102893829345703, "global_step": 325412, "epoch": 3920} {"train_loss": -26.011472702026367, "global_step": 325413, "epoch": 3920} {"train_loss": -25.759601593017578, "global_step": 325414, "epoch": 3920} {"train_loss": -25.98858070373535, "global_step": 325415, "epoch": 3920} {"train_loss": -25.747262954711914, "global_step": 325416, "epoch": 3920} {"train_loss": -25.532819747924805, "global_step": 325417, "epoch": 3920} {"train_loss": -25.993383407592773, "global_step": 325418, "epoch": 3920} {"train_loss": -25.676071166992188, "global_step": 325419, "epoch": 3920} {"train_loss": -25.919294357299805, "global_step": 325420, "epoch": 3920} {"train_loss": -25.78455924987793, "global_step": 325421, "epoch": 3920} {"train_loss": -25.995458602905273, "global_step": 325422, "epoch": 3920} {"train_loss": -25.995410919189453, "global_step": 325423, "epoch": 3920} {"train_loss": -25.83172035217285, "global_step": 325424, "epoch": 3920} {"train_loss": -25.76728630065918, "global_step": 325425, "epoch": 3920} {"train_loss": -26.216028213500977, "global_step": 325426, "epoch": 3920} {"train_loss": -25.971878051757812, "global_step": 325427, "epoch": 3920} {"train_loss": -25.772354125976562, "global_step": 325428, "epoch": 3920} {"train_loss": -25.875629425048828, "global_step": 325429, "epoch": 3920} {"train_loss": -26.218048095703125, "global_step": 325430, "epoch": 3920} {"train_loss": -25.9434814453125, "global_step": 325431, "epoch": 3920} {"train_loss": -25.794958114624023, "global_step": 325432, "epoch": 3920} {"train_loss": -26.089460372924805, "global_step": 325433, "epoch": 3920} {"train_loss": -25.896474838256836, "global_step": 325434, "epoch": 3920} {"train_loss": -25.776214599609375, "global_step": 325435, "epoch": 3920} {"train_loss": -26.086835861206055, "global_step": 325436, "epoch": 3920} {"train_loss": -26.001169204711914, "global_step": 325437, "epoch": 3920} {"train_loss": -26.6043701171875, "global_step": 325438, "epoch": 3920} {"train_loss": -26.448200225830078, "global_step": 325439, "epoch": 3920} {"train_loss": -26.246021270751953, "global_step": 325440, "epoch": 3920} {"train_loss": -26.23688316345215, "global_step": 325441, "epoch": 3920} {"train_loss": -25.88927701007889, "global_step": 325442, "epoch": 3920, "val_loss": 7224828.0} {"train_loss": -24.8007755279541, "global_step": 325443, "epoch": 3921} {"train_loss": -24.455121994018555, "global_step": 325444, "epoch": 3921} {"train_loss": -24.26819610595703, "global_step": 325445, "epoch": 3921} {"train_loss": -25.165658950805664, "global_step": 325446, "epoch": 3921} {"train_loss": -24.199874877929688, "global_step": 325447, "epoch": 3921} {"train_loss": -25.181537628173828, "global_step": 325448, "epoch": 3921} {"train_loss": -24.99336814880371, "global_step": 325449, "epoch": 3921} {"train_loss": -25.247556686401367, "global_step": 325450, "epoch": 3921} {"train_loss": -24.510787963867188, "global_step": 325451, "epoch": 3921} {"train_loss": -24.712434768676758, "global_step": 325452, "epoch": 3921} {"train_loss": -25.346357345581055, "global_step": 325453, "epoch": 3921} {"train_loss": -24.74161148071289, "global_step": 325454, "epoch": 3921} {"train_loss": -25.128530502319336, "global_step": 325455, "epoch": 3921} {"train_loss": -25.52939796447754, "global_step": 325456, "epoch": 3921} {"train_loss": -24.853778839111328, "global_step": 325457, "epoch": 3921} {"train_loss": -25.763763427734375, "global_step": 325458, "epoch": 3921} {"train_loss": -24.713163375854492, "global_step": 325459, "epoch": 3921} {"train_loss": -25.559955596923828, "global_step": 325460, "epoch": 3921} {"train_loss": -25.326993942260742, "global_step": 325461, "epoch": 3921} {"train_loss": -25.242908477783203, "global_step": 325462, "epoch": 3921} {"train_loss": -25.302127838134766, "global_step": 325463, "epoch": 3921} {"train_loss": -25.308759689331055, "global_step": 325464, "epoch": 3921} {"train_loss": -25.289051055908203, "global_step": 325465, "epoch": 3921} {"train_loss": -25.348791122436523, "global_step": 325466, "epoch": 3921} {"train_loss": -25.571805953979492, "global_step": 325467, "epoch": 3921} {"train_loss": -25.715320587158203, "global_step": 325468, "epoch": 3921} {"train_loss": -25.69622802734375, "global_step": 325469, "epoch": 3921} {"train_loss": -25.726795196533203, "global_step": 325470, "epoch": 3921} {"train_loss": -25.78228187561035, "global_step": 325471, "epoch": 3921} {"train_loss": -25.560441970825195, "global_step": 325472, "epoch": 3921} {"train_loss": -25.61582374572754, "global_step": 325473, "epoch": 3921} {"train_loss": -25.829376220703125, "global_step": 325474, "epoch": 3921} {"train_loss": -26.011255264282227, "global_step": 325475, "epoch": 3921} {"train_loss": -25.548246383666992, "global_step": 325476, "epoch": 3921} {"train_loss": -25.666446685791016, "global_step": 325477, "epoch": 3921} {"train_loss": -25.753461837768555, "global_step": 325478, "epoch": 3921} {"train_loss": -25.660669326782227, "global_step": 325479, "epoch": 3921} {"train_loss": -25.45250129699707, "global_step": 325480, "epoch": 3921} {"train_loss": -25.8881893157959, "global_step": 325481, "epoch": 3921} {"train_loss": -26.269079208374023, "global_step": 325482, "epoch": 3921} {"train_loss": -26.4775447845459, "global_step": 325483, "epoch": 3921} {"train_loss": -25.809131622314453, "global_step": 325484, "epoch": 3921} {"train_loss": -25.799942016601562, "global_step": 325485, "epoch": 3921} {"train_loss": -26.164770126342773, "global_step": 325486, "epoch": 3921} {"train_loss": -26.043060302734375, "global_step": 325487, "epoch": 3921} {"train_loss": -26.008935928344727, "global_step": 325488, "epoch": 3921} {"train_loss": -25.788135528564453, "global_step": 325489, "epoch": 3921} {"train_loss": -25.906293869018555, "global_step": 325490, "epoch": 3921} {"train_loss": -25.90140151977539, "global_step": 325491, "epoch": 3921} {"train_loss": -26.125288009643555, "global_step": 325492, "epoch": 3921} {"train_loss": -25.92535972595215, "global_step": 325493, "epoch": 3921} {"train_loss": -26.14826011657715, "global_step": 325494, "epoch": 3921} {"train_loss": -25.994367599487305, "global_step": 325495, "epoch": 3921} {"train_loss": -25.89835548400879, "global_step": 325496, "epoch": 3921} {"train_loss": -26.092884063720703, "global_step": 325497, "epoch": 3921} {"train_loss": -25.320859909057617, "global_step": 325498, "epoch": 3921} {"train_loss": -25.90532875061035, "global_step": 325499, "epoch": 3921} {"train_loss": -25.27686309814453, "global_step": 325500, "epoch": 3921} {"train_loss": -25.540861129760742, "global_step": 325501, "epoch": 3921} {"train_loss": -25.53263282775879, "global_step": 325502, "epoch": 3921} {"train_loss": -25.66153907775879, "global_step": 325503, "epoch": 3921} {"train_loss": -25.634668350219727, "global_step": 325504, "epoch": 3921} {"train_loss": -25.63165855407715, "global_step": 325505, "epoch": 3921} {"train_loss": -25.808887481689453, "global_step": 325506, "epoch": 3921} {"train_loss": -25.49458885192871, "global_step": 325507, "epoch": 3921} {"train_loss": -26.060943603515625, "global_step": 325508, "epoch": 3921} {"train_loss": -26.0069522857666, "global_step": 325509, "epoch": 3921} {"train_loss": -25.462961196899414, "global_step": 325510, "epoch": 3921} {"train_loss": -25.9051456451416, "global_step": 325511, "epoch": 3921} {"train_loss": -25.77503776550293, "global_step": 325512, "epoch": 3921} {"train_loss": -26.039525985717773, "global_step": 325513, "epoch": 3921} {"train_loss": -25.529943466186523, "global_step": 325514, "epoch": 3921} {"train_loss": -25.97906494140625, "global_step": 325515, "epoch": 3921} {"train_loss": -25.9240665435791, "global_step": 325516, "epoch": 3921} {"train_loss": -25.641666412353516, "global_step": 325517, "epoch": 3921} {"train_loss": -26.276601791381836, "global_step": 325518, "epoch": 3921} {"train_loss": -25.64204978942871, "global_step": 325519, "epoch": 3921} {"train_loss": -25.999759674072266, "global_step": 325520, "epoch": 3921} {"train_loss": -26.147260665893555, "global_step": 325521, "epoch": 3921} {"train_loss": -25.703887939453125, "global_step": 325522, "epoch": 3921} {"train_loss": -25.708332061767578, "global_step": 325523, "epoch": 3921} {"train_loss": -25.670934677124023, "global_step": 325524, "epoch": 3921} {"train_loss": -25.59926127238446, "global_step": 325525, "epoch": 3921, "val_loss": 7138480.0} {"train_loss": -25.36049461364746, "global_step": 325526, "epoch": 3922} {"train_loss": -25.277456283569336, "global_step": 325527, "epoch": 3922} {"train_loss": -25.674057006835938, "global_step": 325528, "epoch": 3922} {"train_loss": -25.512331008911133, "global_step": 325529, "epoch": 3922} {"train_loss": -25.79005241394043, "global_step": 325530, "epoch": 3922} {"train_loss": -25.345947265625, "global_step": 325531, "epoch": 3922} {"train_loss": -25.582059860229492, "global_step": 325532, "epoch": 3922} {"train_loss": -25.68424415588379, "global_step": 325533, "epoch": 3922} {"train_loss": -25.464624404907227, "global_step": 325534, "epoch": 3922} {"train_loss": -25.720016479492188, "global_step": 325535, "epoch": 3922} {"train_loss": -25.33866310119629, "global_step": 325536, "epoch": 3922} {"train_loss": -26.268163681030273, "global_step": 325537, "epoch": 3922} {"train_loss": -25.447383880615234, "global_step": 325538, "epoch": 3922} {"train_loss": -25.833328247070312, "global_step": 325539, "epoch": 3922} {"train_loss": -25.817996978759766, "global_step": 325540, "epoch": 3922} {"train_loss": -25.7738094329834, "global_step": 325541, "epoch": 3922} {"train_loss": -25.747100830078125, "global_step": 325542, "epoch": 3922} {"train_loss": -26.019163131713867, "global_step": 325543, "epoch": 3922} {"train_loss": -25.531156539916992, "global_step": 325544, "epoch": 3922} {"train_loss": -25.89375877380371, "global_step": 325545, "epoch": 3922} {"train_loss": -26.05964469909668, "global_step": 325546, "epoch": 3922} {"train_loss": -25.710073471069336, "global_step": 325547, "epoch": 3922} {"train_loss": -25.961400985717773, "global_step": 325548, "epoch": 3922} {"train_loss": -26.07559585571289, "global_step": 325549, "epoch": 3922} {"train_loss": -25.698209762573242, "global_step": 325550, "epoch": 3922} {"train_loss": -26.31612205505371, "global_step": 325551, "epoch": 3922} {"train_loss": -26.4263973236084, "global_step": 325552, "epoch": 3922} {"train_loss": -26.041723251342773, "global_step": 325553, "epoch": 3922} {"train_loss": -25.877838134765625, "global_step": 325554, "epoch": 3922} {"train_loss": -25.945362091064453, "global_step": 325555, "epoch": 3922} {"train_loss": -25.75177574157715, "global_step": 325556, "epoch": 3922} {"train_loss": -26.075971603393555, "global_step": 325557, "epoch": 3922} {"train_loss": -26.151086807250977, "global_step": 325558, "epoch": 3922} {"train_loss": -26.216293334960938, "global_step": 325559, "epoch": 3922} {"train_loss": -25.958852767944336, "global_step": 325560, "epoch": 3922} {"train_loss": -26.365570068359375, "global_step": 325561, "epoch": 3922} {"train_loss": -25.52321434020996, "global_step": 325562, "epoch": 3922} {"train_loss": -25.77656364440918, "global_step": 325563, "epoch": 3922} {"train_loss": -25.83710289001465, "global_step": 325564, "epoch": 3922} {"train_loss": -26.010726928710938, "global_step": 325565, "epoch": 3922} {"train_loss": -25.825193405151367, "global_step": 325566, "epoch": 3922} {"train_loss": -25.7797908782959, "global_step": 325567, "epoch": 3922} {"train_loss": -25.830625534057617, "global_step": 325568, "epoch": 3922} {"train_loss": -25.33487892150879, "global_step": 325569, "epoch": 3922} {"train_loss": -25.80988121032715, "global_step": 325570, "epoch": 3922} {"train_loss": -25.64686393737793, "global_step": 325571, "epoch": 3922} {"train_loss": -26.26700782775879, "global_step": 325572, "epoch": 3922} {"train_loss": -25.59848976135254, "global_step": 325573, "epoch": 3922} {"train_loss": -25.47183609008789, "global_step": 325574, "epoch": 3922} {"train_loss": -25.788358688354492, "global_step": 325575, "epoch": 3922} {"train_loss": -25.75412940979004, "global_step": 325576, "epoch": 3922} {"train_loss": -25.68760108947754, "global_step": 325577, "epoch": 3922} {"train_loss": -25.489633560180664, "global_step": 325578, "epoch": 3922} {"train_loss": -25.946847915649414, "global_step": 325579, "epoch": 3922} {"train_loss": -26.027420043945312, "global_step": 325580, "epoch": 3922} {"train_loss": -25.784467697143555, "global_step": 325581, "epoch": 3922} {"train_loss": -25.887271881103516, "global_step": 325582, "epoch": 3922} {"train_loss": -25.927886962890625, "global_step": 325583, "epoch": 3922} {"train_loss": -26.042083740234375, "global_step": 325584, "epoch": 3922} {"train_loss": -25.78814697265625, "global_step": 325585, "epoch": 3922} {"train_loss": -26.025487899780273, "global_step": 325586, "epoch": 3922} {"train_loss": -25.469038009643555, "global_step": 325587, "epoch": 3922} {"train_loss": -25.891178131103516, "global_step": 325588, "epoch": 3922} {"train_loss": -25.836090087890625, "global_step": 325589, "epoch": 3922} {"train_loss": -25.703109741210938, "global_step": 325590, "epoch": 3922} {"train_loss": -25.64271354675293, "global_step": 325591, "epoch": 3922} {"train_loss": -26.06941032409668, "global_step": 325592, "epoch": 3922} {"train_loss": -25.676496505737305, "global_step": 325593, "epoch": 3922} {"train_loss": -26.148584365844727, "global_step": 325594, "epoch": 3922} {"train_loss": -26.116567611694336, "global_step": 325595, "epoch": 3922} {"train_loss": -25.53406524658203, "global_step": 325596, "epoch": 3922} {"train_loss": -25.810047149658203, "global_step": 325597, "epoch": 3922} {"train_loss": -26.0113582611084, "global_step": 325598, "epoch": 3922} {"train_loss": -26.0017032623291, "global_step": 325599, "epoch": 3922} {"train_loss": -26.035568237304688, "global_step": 325600, "epoch": 3922} {"train_loss": -25.766035079956055, "global_step": 325601, "epoch": 3922} {"train_loss": -26.079370498657227, "global_step": 325602, "epoch": 3922} {"train_loss": -26.192996978759766, "global_step": 325603, "epoch": 3922} {"train_loss": -26.067218780517578, "global_step": 325604, "epoch": 3922} {"train_loss": -26.353729248046875, "global_step": 325605, "epoch": 3922} {"train_loss": -26.15726089477539, "global_step": 325606, "epoch": 3922} {"train_loss": -25.602066040039062, "global_step": 325607, "epoch": 3922} {"train_loss": -25.847313271947655, "global_step": 325608, "epoch": 3922, "val_loss": 7153964.5} {"train_loss": -25.65764808654785, "global_step": 325609, "epoch": 3923} {"train_loss": -25.46559715270996, "global_step": 325610, "epoch": 3923} {"train_loss": -25.850967407226562, "global_step": 325611, "epoch": 3923} {"train_loss": -25.728199005126953, "global_step": 325612, "epoch": 3923} {"train_loss": -24.791183471679688, "global_step": 325613, "epoch": 3923} {"train_loss": -25.540363311767578, "global_step": 325614, "epoch": 3923} {"train_loss": -25.58445167541504, "global_step": 325615, "epoch": 3923} {"train_loss": -25.329578399658203, "global_step": 325616, "epoch": 3923} {"train_loss": -25.6406192779541, "global_step": 325617, "epoch": 3923} {"train_loss": -25.609861373901367, "global_step": 325618, "epoch": 3923} {"train_loss": -25.263914108276367, "global_step": 325619, "epoch": 3923} {"train_loss": -26.028772354125977, "global_step": 325620, "epoch": 3923} {"train_loss": -25.729415893554688, "global_step": 325621, "epoch": 3923} {"train_loss": -25.197956085205078, "global_step": 325622, "epoch": 3923} {"train_loss": -25.436994552612305, "global_step": 325623, "epoch": 3923} {"train_loss": -25.38825798034668, "global_step": 325624, "epoch": 3923} {"train_loss": -25.756677627563477, "global_step": 325625, "epoch": 3923} {"train_loss": -25.657087326049805, "global_step": 325626, "epoch": 3923} {"train_loss": -25.962615966796875, "global_step": 325627, "epoch": 3923} {"train_loss": -25.516746520996094, "global_step": 325628, "epoch": 3923} {"train_loss": -26.07915687561035, "global_step": 325629, "epoch": 3923} {"train_loss": -25.682035446166992, "global_step": 325630, "epoch": 3923} {"train_loss": -26.04938316345215, "global_step": 325631, "epoch": 3923} {"train_loss": -25.934356689453125, "global_step": 325632, "epoch": 3923} {"train_loss": -25.730894088745117, "global_step": 325633, "epoch": 3923} {"train_loss": -26.094058990478516, "global_step": 325634, "epoch": 3923} {"train_loss": -25.8118839263916, "global_step": 325635, "epoch": 3923} {"train_loss": -25.6276912689209, "global_step": 325636, "epoch": 3923} {"train_loss": -25.865936279296875, "global_step": 325637, "epoch": 3923} {"train_loss": -25.958189010620117, "global_step": 325638, "epoch": 3923} {"train_loss": -25.755033493041992, "global_step": 325639, "epoch": 3923} {"train_loss": -25.651601791381836, "global_step": 325640, "epoch": 3923} {"train_loss": -25.9737491607666, "global_step": 325641, "epoch": 3923} {"train_loss": -25.77353858947754, "global_step": 325642, "epoch": 3923} {"train_loss": -26.05517578125, "global_step": 325643, "epoch": 3923} {"train_loss": -25.941442489624023, "global_step": 325644, "epoch": 3923} {"train_loss": -26.0191707611084, "global_step": 325645, "epoch": 3923} {"train_loss": -25.88128662109375, "global_step": 325646, "epoch": 3923} {"train_loss": -26.021753311157227, "global_step": 325647, "epoch": 3923} {"train_loss": -25.813501358032227, "global_step": 325648, "epoch": 3923} {"train_loss": -25.985559463500977, "global_step": 325649, "epoch": 3923} {"train_loss": -26.074268341064453, "global_step": 325650, "epoch": 3923} {"train_loss": -25.94245719909668, "global_step": 325651, "epoch": 3923} {"train_loss": -26.102567672729492, "global_step": 325652, "epoch": 3923} {"train_loss": -25.92987060546875, "global_step": 325653, "epoch": 3923} {"train_loss": -25.88972282409668, "global_step": 325654, "epoch": 3923} {"train_loss": -26.04066276550293, "global_step": 325655, "epoch": 3923} {"train_loss": -25.75470542907715, "global_step": 325656, "epoch": 3923} {"train_loss": -26.264022827148438, "global_step": 325657, "epoch": 3923} {"train_loss": -25.822187423706055, "global_step": 325658, "epoch": 3923} {"train_loss": -25.89841651916504, "global_step": 325659, "epoch": 3923} {"train_loss": -25.94622230529785, "global_step": 325660, "epoch": 3923} {"train_loss": -26.008249282836914, "global_step": 325661, "epoch": 3923} {"train_loss": -26.324934005737305, "global_step": 325662, "epoch": 3923} {"train_loss": -25.778837203979492, "global_step": 325663, "epoch": 3923} {"train_loss": -25.76456642150879, "global_step": 325664, "epoch": 3923} {"train_loss": -25.990758895874023, "global_step": 325665, "epoch": 3923} {"train_loss": -25.931949615478516, "global_step": 325666, "epoch": 3923} {"train_loss": -25.58072853088379, "global_step": 325667, "epoch": 3923} {"train_loss": -25.886091232299805, "global_step": 325668, "epoch": 3923} {"train_loss": -26.05112075805664, "global_step": 325669, "epoch": 3923} {"train_loss": -26.091527938842773, "global_step": 325670, "epoch": 3923} {"train_loss": -26.011493682861328, "global_step": 325671, "epoch": 3923} {"train_loss": -26.137104034423828, "global_step": 325672, "epoch": 3923} {"train_loss": -25.964420318603516, "global_step": 325673, "epoch": 3923} {"train_loss": -26.171850204467773, "global_step": 325674, "epoch": 3923} {"train_loss": -25.896930694580078, "global_step": 325675, "epoch": 3923} {"train_loss": -26.327070236206055, "global_step": 325676, "epoch": 3923} {"train_loss": -25.90260124206543, "global_step": 325677, "epoch": 3923} {"train_loss": -26.259017944335938, "global_step": 325678, "epoch": 3923} {"train_loss": -26.238920211791992, "global_step": 325679, "epoch": 3923} {"train_loss": -26.2027645111084, "global_step": 325680, "epoch": 3923} {"train_loss": -25.78190040588379, "global_step": 325681, "epoch": 3923} {"train_loss": -25.84576416015625, "global_step": 325682, "epoch": 3923} {"train_loss": -25.994049072265625, "global_step": 325683, "epoch": 3923} {"train_loss": -26.47537612915039, "global_step": 325684, "epoch": 3923} {"train_loss": -26.042749404907227, "global_step": 325685, "epoch": 3923} {"train_loss": -25.96073341369629, "global_step": 325686, "epoch": 3923} {"train_loss": -25.942138671875, "global_step": 325687, "epoch": 3923} {"train_loss": -26.010852813720703, "global_step": 325688, "epoch": 3923} {"train_loss": -26.0909366607666, "global_step": 325689, "epoch": 3923} {"train_loss": -26.196548461914062, "global_step": 325690, "epoch": 3923} {"train_loss": -25.863201095397216, "global_step": 325691, "epoch": 3923, "val_loss": 7237989.5} {"train_loss": -25.010120391845703, "global_step": 325692, "epoch": 3924} {"train_loss": -25.54746437072754, "global_step": 325693, "epoch": 3924} {"train_loss": -25.573530197143555, "global_step": 325694, "epoch": 3924} {"train_loss": -25.116165161132812, "global_step": 325695, "epoch": 3924} {"train_loss": -25.102367401123047, "global_step": 325696, "epoch": 3924} {"train_loss": -25.57541847229004, "global_step": 325697, "epoch": 3924} {"train_loss": -25.291893005371094, "global_step": 325698, "epoch": 3924} {"train_loss": -25.164514541625977, "global_step": 325699, "epoch": 3924} {"train_loss": -25.441938400268555, "global_step": 325700, "epoch": 3924} {"train_loss": -25.464506149291992, "global_step": 325701, "epoch": 3924} {"train_loss": -25.44367790222168, "global_step": 325702, "epoch": 3924} {"train_loss": -25.72075843811035, "global_step": 325703, "epoch": 3924} {"train_loss": -25.631025314331055, "global_step": 325704, "epoch": 3924} {"train_loss": -25.54766082763672, "global_step": 325705, "epoch": 3924} {"train_loss": -25.035226821899414, "global_step": 325706, "epoch": 3924} {"train_loss": -25.749271392822266, "global_step": 325707, "epoch": 3924} {"train_loss": -25.71603775024414, "global_step": 325708, "epoch": 3924} {"train_loss": -25.551849365234375, "global_step": 325709, "epoch": 3924} {"train_loss": -25.452817916870117, "global_step": 325710, "epoch": 3924} {"train_loss": -25.710718154907227, "global_step": 325711, "epoch": 3924} {"train_loss": -25.87013816833496, "global_step": 325712, "epoch": 3924} {"train_loss": -25.752973556518555, "global_step": 325713, "epoch": 3924} {"train_loss": -25.840368270874023, "global_step": 325714, "epoch": 3924} {"train_loss": -25.89226722717285, "global_step": 325715, "epoch": 3924} {"train_loss": -25.71821403503418, "global_step": 325716, "epoch": 3924} {"train_loss": -25.616790771484375, "global_step": 325717, "epoch": 3924} {"train_loss": -25.90406608581543, "global_step": 325718, "epoch": 3924} {"train_loss": -25.6978702545166, "global_step": 325719, "epoch": 3924} {"train_loss": -25.449277877807617, "global_step": 325720, "epoch": 3924} {"train_loss": -25.790822982788086, "global_step": 325721, "epoch": 3924} {"train_loss": -25.994077682495117, "global_step": 325722, "epoch": 3924} {"train_loss": -26.13657569885254, "global_step": 325723, "epoch": 3924} {"train_loss": -25.808013916015625, "global_step": 325724, "epoch": 3924} {"train_loss": -25.796926498413086, "global_step": 325725, "epoch": 3924} {"train_loss": -26.04557228088379, "global_step": 325726, "epoch": 3924} {"train_loss": -25.897436141967773, "global_step": 325727, "epoch": 3924} {"train_loss": -25.71718406677246, "global_step": 325728, "epoch": 3924} {"train_loss": -26.350500106811523, "global_step": 325729, "epoch": 3924} {"train_loss": -26.467914581298828, "global_step": 325730, "epoch": 3924} {"train_loss": -26.142974853515625, "global_step": 325731, "epoch": 3924} {"train_loss": -26.199689865112305, "global_step": 325732, "epoch": 3924} {"train_loss": -26.139440536499023, "global_step": 325733, "epoch": 3924} {"train_loss": -25.656278610229492, "global_step": 325734, "epoch": 3924} {"train_loss": -26.20208740234375, "global_step": 325735, "epoch": 3924} {"train_loss": -25.78309440612793, "global_step": 325736, "epoch": 3924} {"train_loss": -26.15888786315918, "global_step": 325737, "epoch": 3924} {"train_loss": -25.6354923248291, "global_step": 325738, "epoch": 3924} {"train_loss": -25.896894454956055, "global_step": 325739, "epoch": 3924} {"train_loss": -25.92009925842285, "global_step": 325740, "epoch": 3924} {"train_loss": -26.375654220581055, "global_step": 325741, "epoch": 3924} {"train_loss": -25.741117477416992, "global_step": 325742, "epoch": 3924} {"train_loss": -25.929168701171875, "global_step": 325743, "epoch": 3924} {"train_loss": -26.163949966430664, "global_step": 325744, "epoch": 3924} {"train_loss": -26.17738151550293, "global_step": 325745, "epoch": 3924} {"train_loss": -26.356128692626953, "global_step": 325746, "epoch": 3924} {"train_loss": -25.882810592651367, "global_step": 325747, "epoch": 3924} {"train_loss": -26.391983032226562, "global_step": 325748, "epoch": 3924} {"train_loss": -25.87925148010254, "global_step": 325749, "epoch": 3924} {"train_loss": -26.012954711914062, "global_step": 325750, "epoch": 3924} {"train_loss": -25.760391235351562, "global_step": 325751, "epoch": 3924} {"train_loss": -25.52369499206543, "global_step": 325752, "epoch": 3924} {"train_loss": -25.279794692993164, "global_step": 325753, "epoch": 3924} {"train_loss": -25.05817222595215, "global_step": 325754, "epoch": 3924} {"train_loss": -25.58639907836914, "global_step": 325755, "epoch": 3924} {"train_loss": -25.499975204467773, "global_step": 325756, "epoch": 3924} {"train_loss": -25.80682945251465, "global_step": 325757, "epoch": 3924} {"train_loss": -25.5314884185791, "global_step": 325758, "epoch": 3924} {"train_loss": -25.498952865600586, "global_step": 325759, "epoch": 3924} {"train_loss": -25.49461555480957, "global_step": 325760, "epoch": 3924} {"train_loss": -25.434585571289062, "global_step": 325761, "epoch": 3924} {"train_loss": -25.92286491394043, "global_step": 325762, "epoch": 3924} {"train_loss": -25.708219528198242, "global_step": 325763, "epoch": 3924} {"train_loss": -25.5402889251709, "global_step": 325764, "epoch": 3924} {"train_loss": -25.508495330810547, "global_step": 325765, "epoch": 3924} {"train_loss": -26.024539947509766, "global_step": 325766, "epoch": 3924} {"train_loss": -25.21341896057129, "global_step": 325767, "epoch": 3924} {"train_loss": -25.372791290283203, "global_step": 325768, "epoch": 3924} {"train_loss": -25.56505584716797, "global_step": 325769, "epoch": 3924} {"train_loss": -25.38789176940918, "global_step": 325770, "epoch": 3924} {"train_loss": -25.23938751220703, "global_step": 325771, "epoch": 3924} {"train_loss": -25.697397232055664, "global_step": 325772, "epoch": 3924} {"train_loss": -25.549205780029297, "global_step": 325773, "epoch": 3924} {"train_loss": -25.696135095803136, "global_step": 325774, "epoch": 3924, "val_loss": 7288424.0} {"train_loss": -24.634126663208008, "global_step": 325775, "epoch": 3925} {"train_loss": -24.686742782592773, "global_step": 325776, "epoch": 3925} {"train_loss": -24.791940689086914, "global_step": 325777, "epoch": 3925} {"train_loss": -24.9653263092041, "global_step": 325778, "epoch": 3925} {"train_loss": -24.6239013671875, "global_step": 325779, "epoch": 3925} {"train_loss": -24.773027420043945, "global_step": 325780, "epoch": 3925} {"train_loss": -25.578468322753906, "global_step": 325781, "epoch": 3925} {"train_loss": -25.0965518951416, "global_step": 325782, "epoch": 3925} {"train_loss": -25.326635360717773, "global_step": 325783, "epoch": 3925} {"train_loss": -25.182615280151367, "global_step": 325784, "epoch": 3925} {"train_loss": -25.700260162353516, "global_step": 325785, "epoch": 3925} {"train_loss": -25.1155948638916, "global_step": 325786, "epoch": 3925} {"train_loss": -25.62735939025879, "global_step": 325787, "epoch": 3925} {"train_loss": -25.862518310546875, "global_step": 325788, "epoch": 3925} {"train_loss": -25.311702728271484, "global_step": 325789, "epoch": 3925} {"train_loss": -25.566402435302734, "global_step": 325790, "epoch": 3925} {"train_loss": -25.277969360351562, "global_step": 325791, "epoch": 3925} {"train_loss": -25.519773483276367, "global_step": 325792, "epoch": 3925} {"train_loss": -25.706653594970703, "global_step": 325793, "epoch": 3925} {"train_loss": -25.847013473510742, "global_step": 325794, "epoch": 3925} {"train_loss": -25.815311431884766, "global_step": 325795, "epoch": 3925} {"train_loss": -25.60822105407715, "global_step": 325796, "epoch": 3925} {"train_loss": -25.526992797851562, "global_step": 325797, "epoch": 3925} {"train_loss": -25.778478622436523, "global_step": 325798, "epoch": 3925} {"train_loss": -25.770532608032227, "global_step": 325799, "epoch": 3925} {"train_loss": -26.019275665283203, "global_step": 325800, "epoch": 3925} {"train_loss": -26.170331954956055, "global_step": 325801, "epoch": 3925} {"train_loss": -25.9534969329834, "global_step": 325802, "epoch": 3925} {"train_loss": -25.726318359375, "global_step": 325803, "epoch": 3925} {"train_loss": -25.846113204956055, "global_step": 325804, "epoch": 3925} {"train_loss": -26.070758819580078, "global_step": 325805, "epoch": 3925} {"train_loss": -26.126434326171875, "global_step": 325806, "epoch": 3925} {"train_loss": -25.808929443359375, "global_step": 325807, "epoch": 3925} {"train_loss": -26.17228126525879, "global_step": 325808, "epoch": 3925} {"train_loss": -26.14240837097168, "global_step": 325809, "epoch": 3925} {"train_loss": -26.13330078125, "global_step": 325810, "epoch": 3925} {"train_loss": -26.083789825439453, "global_step": 325811, "epoch": 3925} {"train_loss": -25.87688636779785, "global_step": 325812, "epoch": 3925} {"train_loss": -25.81121253967285, "global_step": 325813, "epoch": 3925} {"train_loss": -25.907678604125977, "global_step": 325814, "epoch": 3925} {"train_loss": -26.076282501220703, "global_step": 325815, "epoch": 3925} {"train_loss": -25.831436157226562, "global_step": 325816, "epoch": 3925} {"train_loss": -25.934162139892578, "global_step": 325817, "epoch": 3925} {"train_loss": -25.765609741210938, "global_step": 325818, "epoch": 3925} {"train_loss": -26.2017879486084, "global_step": 325819, "epoch": 3925} {"train_loss": -26.181644439697266, "global_step": 325820, "epoch": 3925} {"train_loss": -25.969152450561523, "global_step": 325821, "epoch": 3925} {"train_loss": -26.020551681518555, "global_step": 325822, "epoch": 3925} {"train_loss": -26.1146183013916, "global_step": 325823, "epoch": 3925} {"train_loss": -25.80414390563965, "global_step": 325824, "epoch": 3925} {"train_loss": -25.45859146118164, "global_step": 325825, "epoch": 3925} {"train_loss": -26.27507972717285, "global_step": 325826, "epoch": 3925} {"train_loss": -25.713964462280273, "global_step": 325827, "epoch": 3925} {"train_loss": -26.323123931884766, "global_step": 325828, "epoch": 3925} {"train_loss": -25.834125518798828, "global_step": 325829, "epoch": 3925} {"train_loss": -25.446630477905273, "global_step": 325830, "epoch": 3925} {"train_loss": -25.800552368164062, "global_step": 325831, "epoch": 3925} {"train_loss": -25.592315673828125, "global_step": 325832, "epoch": 3925} {"train_loss": -25.551227569580078, "global_step": 325833, "epoch": 3925} {"train_loss": -25.827917098999023, "global_step": 325834, "epoch": 3925} {"train_loss": -25.8022403717041, "global_step": 325835, "epoch": 3925} {"train_loss": -25.52691650390625, "global_step": 325836, "epoch": 3925} {"train_loss": -25.910999298095703, "global_step": 325837, "epoch": 3925} {"train_loss": -26.065561294555664, "global_step": 325838, "epoch": 3925} {"train_loss": -26.07044792175293, "global_step": 325839, "epoch": 3925} {"train_loss": -26.020496368408203, "global_step": 325840, "epoch": 3925} {"train_loss": -26.119298934936523, "global_step": 325841, "epoch": 3925} {"train_loss": -26.04072380065918, "global_step": 325842, "epoch": 3925} {"train_loss": -25.61676597595215, "global_step": 325843, "epoch": 3925} {"train_loss": -26.07057762145996, "global_step": 325844, "epoch": 3925} {"train_loss": -26.06001091003418, "global_step": 325845, "epoch": 3925} {"train_loss": -25.859350204467773, "global_step": 325846, "epoch": 3925} {"train_loss": -26.1192684173584, "global_step": 325847, "epoch": 3925} {"train_loss": -26.25245475769043, "global_step": 325848, "epoch": 3925} {"train_loss": -25.9487247467041, "global_step": 325849, "epoch": 3925} {"train_loss": -26.31196403503418, "global_step": 325850, "epoch": 3925} {"train_loss": -26.1124267578125, "global_step": 325851, "epoch": 3925} {"train_loss": -26.257726669311523, "global_step": 325852, "epoch": 3925} {"train_loss": -26.037372589111328, "global_step": 325853, "epoch": 3925} {"train_loss": -25.8825740814209, "global_step": 325854, "epoch": 3925} {"train_loss": -25.907806396484375, "global_step": 325855, "epoch": 3925} {"train_loss": -26.06807518005371, "global_step": 325856, "epoch": 3925} {"train_loss": -25.761394133050757, "global_step": 325857, "epoch": 3925, "val_loss": 7288486.0} {"train_loss": -25.77596092224121, "global_step": 325858, "epoch": 3926} {"train_loss": -25.939207077026367, "global_step": 325859, "epoch": 3926} {"train_loss": -25.638044357299805, "global_step": 325860, "epoch": 3926} {"train_loss": -25.896406173706055, "global_step": 325861, "epoch": 3926} {"train_loss": -25.611886978149414, "global_step": 325862, "epoch": 3926} {"train_loss": -25.916259765625, "global_step": 325863, "epoch": 3926} {"train_loss": -25.41310691833496, "global_step": 325864, "epoch": 3926} {"train_loss": -25.606748580932617, "global_step": 325865, "epoch": 3926} {"train_loss": -26.101337432861328, "global_step": 325866, "epoch": 3926} {"train_loss": -25.693201065063477, "global_step": 325867, "epoch": 3926} {"train_loss": -25.366607666015625, "global_step": 325868, "epoch": 3926} {"train_loss": -25.88483238220215, "global_step": 325869, "epoch": 3926} {"train_loss": -25.621057510375977, "global_step": 325870, "epoch": 3926} {"train_loss": -25.65711784362793, "global_step": 325871, "epoch": 3926} {"train_loss": -25.63710594177246, "global_step": 325872, "epoch": 3926} {"train_loss": -25.625152587890625, "global_step": 325873, "epoch": 3926} {"train_loss": -25.613422393798828, "global_step": 325874, "epoch": 3926} {"train_loss": -25.756488800048828, "global_step": 325875, "epoch": 3926} {"train_loss": -25.946807861328125, "global_step": 325876, "epoch": 3926} {"train_loss": -25.848953247070312, "global_step": 325877, "epoch": 3926} {"train_loss": -25.57858657836914, "global_step": 325878, "epoch": 3926} {"train_loss": -25.289432525634766, "global_step": 325879, "epoch": 3926} {"train_loss": -25.904035568237305, "global_step": 325880, "epoch": 3926} {"train_loss": -25.790098190307617, "global_step": 325881, "epoch": 3926} {"train_loss": -25.741897583007812, "global_step": 325882, "epoch": 3926} {"train_loss": -25.665454864501953, "global_step": 325883, "epoch": 3926} {"train_loss": -25.767236709594727, "global_step": 325884, "epoch": 3926} {"train_loss": -25.925739288330078, "global_step": 325885, "epoch": 3926} {"train_loss": -25.758649826049805, "global_step": 325886, "epoch": 3926} {"train_loss": -25.85455322265625, "global_step": 325887, "epoch": 3926} {"train_loss": -26.001996994018555, "global_step": 325888, "epoch": 3926} {"train_loss": -26.009048461914062, "global_step": 325889, "epoch": 3926} {"train_loss": -25.965229034423828, "global_step": 325890, "epoch": 3926} {"train_loss": -25.949644088745117, "global_step": 325891, "epoch": 3926} {"train_loss": -25.779773712158203, "global_step": 325892, "epoch": 3926} {"train_loss": -26.215295791625977, "global_step": 325893, "epoch": 3926} {"train_loss": -26.011642456054688, "global_step": 325894, "epoch": 3926} {"train_loss": -26.0636043548584, "global_step": 325895, "epoch": 3926} {"train_loss": -26.20078468322754, "global_step": 325896, "epoch": 3926} {"train_loss": -26.09003257751465, "global_step": 325897, "epoch": 3926} {"train_loss": -25.674163818359375, "global_step": 325898, "epoch": 3926} {"train_loss": -26.095380783081055, "global_step": 325899, "epoch": 3926} {"train_loss": -25.725605010986328, "global_step": 325900, "epoch": 3926} {"train_loss": -25.636077880859375, "global_step": 325901, "epoch": 3926} {"train_loss": -26.006078720092773, "global_step": 325902, "epoch": 3926} {"train_loss": -25.950897216796875, "global_step": 325903, "epoch": 3926} {"train_loss": -25.97007179260254, "global_step": 325904, "epoch": 3926} {"train_loss": -25.837188720703125, "global_step": 325905, "epoch": 3926} {"train_loss": -25.7972354888916, "global_step": 325906, "epoch": 3926} {"train_loss": -25.822484970092773, "global_step": 325907, "epoch": 3926} {"train_loss": -26.24851417541504, "global_step": 325908, "epoch": 3926} {"train_loss": -25.78656578063965, "global_step": 325909, "epoch": 3926} {"train_loss": -26.309362411499023, "global_step": 325910, "epoch": 3926} {"train_loss": -26.1844482421875, "global_step": 325911, "epoch": 3926} {"train_loss": -26.0616512298584, "global_step": 325912, "epoch": 3926} {"train_loss": -25.79380226135254, "global_step": 325913, "epoch": 3926} {"train_loss": -26.162580490112305, "global_step": 325914, "epoch": 3926} {"train_loss": -25.890766143798828, "global_step": 325915, "epoch": 3926} {"train_loss": -25.9527530670166, "global_step": 325916, "epoch": 3926} {"train_loss": -25.82305908203125, "global_step": 325917, "epoch": 3926} {"train_loss": -26.201507568359375, "global_step": 325918, "epoch": 3926} {"train_loss": -25.767263412475586, "global_step": 325919, "epoch": 3926} {"train_loss": -25.80732536315918, "global_step": 325920, "epoch": 3926} {"train_loss": -25.679431915283203, "global_step": 325921, "epoch": 3926} {"train_loss": -25.689117431640625, "global_step": 325922, "epoch": 3926} {"train_loss": -25.951318740844727, "global_step": 325923, "epoch": 3926} {"train_loss": -25.8411865234375, "global_step": 325924, "epoch": 3926} {"train_loss": -25.75459098815918, "global_step": 325925, "epoch": 3926} {"train_loss": -25.822650909423828, "global_step": 325926, "epoch": 3926} {"train_loss": -25.944555282592773, "global_step": 325927, "epoch": 3926} {"train_loss": -25.93256950378418, "global_step": 325928, "epoch": 3926} {"train_loss": -25.774005889892578, "global_step": 325929, "epoch": 3926} {"train_loss": -26.030210494995117, "global_step": 325930, "epoch": 3926} {"train_loss": -25.7971134185791, "global_step": 325931, "epoch": 3926} {"train_loss": -25.994293212890625, "global_step": 325932, "epoch": 3926} {"train_loss": -26.01025390625, "global_step": 325933, "epoch": 3926} {"train_loss": -26.395368576049805, "global_step": 325934, "epoch": 3926} {"train_loss": -25.78739356994629, "global_step": 325935, "epoch": 3926} {"train_loss": -26.05169677734375, "global_step": 325936, "epoch": 3926} {"train_loss": -25.9088077545166, "global_step": 325937, "epoch": 3926} {"train_loss": -25.96185874938965, "global_step": 325938, "epoch": 3926} {"train_loss": -26.023681640625, "global_step": 325939, "epoch": 3926} {"train_loss": -25.85761323032609, "global_step": 325940, "epoch": 3926, "val_loss": 7238027.0} {"train_loss": -24.787796020507812, "global_step": 325941, "epoch": 3927} {"train_loss": -24.342844009399414, "global_step": 325942, "epoch": 3927} {"train_loss": -25.322580337524414, "global_step": 325943, "epoch": 3927} {"train_loss": -24.937612533569336, "global_step": 325944, "epoch": 3927} {"train_loss": -25.19451332092285, "global_step": 325945, "epoch": 3927} {"train_loss": -25.318620681762695, "global_step": 325946, "epoch": 3927} {"train_loss": -25.31983757019043, "global_step": 325947, "epoch": 3927} {"train_loss": -24.616254806518555, "global_step": 325948, "epoch": 3927} {"train_loss": -25.488759994506836, "global_step": 325949, "epoch": 3927} {"train_loss": -25.34817123413086, "global_step": 325950, "epoch": 3927} {"train_loss": -25.523662567138672, "global_step": 325951, "epoch": 3927} {"train_loss": -25.2322940826416, "global_step": 325952, "epoch": 3927} {"train_loss": -25.280691146850586, "global_step": 325953, "epoch": 3927} {"train_loss": -25.00939178466797, "global_step": 325954, "epoch": 3927} {"train_loss": -25.299711227416992, "global_step": 325955, "epoch": 3927} {"train_loss": -24.928611755371094, "global_step": 325956, "epoch": 3927} {"train_loss": -25.144689559936523, "global_step": 325957, "epoch": 3927} {"train_loss": -25.128555297851562, "global_step": 325958, "epoch": 3927} {"train_loss": -25.33375358581543, "global_step": 325959, "epoch": 3927} {"train_loss": -25.720319747924805, "global_step": 325960, "epoch": 3927} {"train_loss": -25.295881271362305, "global_step": 325961, "epoch": 3927} {"train_loss": -25.968276977539062, "global_step": 325962, "epoch": 3927} {"train_loss": -25.67604637145996, "global_step": 325963, "epoch": 3927} {"train_loss": -25.792951583862305, "global_step": 325964, "epoch": 3927} {"train_loss": -25.834882736206055, "global_step": 325965, "epoch": 3927} {"train_loss": -25.74238395690918, "global_step": 325966, "epoch": 3927} {"train_loss": -25.715185165405273, "global_step": 325967, "epoch": 3927} {"train_loss": -25.748462677001953, "global_step": 325968, "epoch": 3927} {"train_loss": -25.59363555908203, "global_step": 325969, "epoch": 3927} {"train_loss": -25.865060806274414, "global_step": 325970, "epoch": 3927} {"train_loss": -25.631444931030273, "global_step": 325971, "epoch": 3927} {"train_loss": -26.06005859375, "global_step": 325972, "epoch": 3927} {"train_loss": -25.75874137878418, "global_step": 325973, "epoch": 3927} {"train_loss": -26.07037353515625, "global_step": 325974, "epoch": 3927} {"train_loss": -25.914159774780273, "global_step": 325975, "epoch": 3927} {"train_loss": -25.802194595336914, "global_step": 325976, "epoch": 3927} {"train_loss": -25.939777374267578, "global_step": 325977, "epoch": 3927} {"train_loss": -25.879423141479492, "global_step": 325978, "epoch": 3927} {"train_loss": -26.139423370361328, "global_step": 325979, "epoch": 3927} {"train_loss": -26.09649658203125, "global_step": 325980, "epoch": 3927} {"train_loss": -25.925500869750977, "global_step": 325981, "epoch": 3927} {"train_loss": -25.97391700744629, "global_step": 325982, "epoch": 3927} {"train_loss": -26.17667579650879, "global_step": 325983, "epoch": 3927} {"train_loss": -25.8226261138916, "global_step": 325984, "epoch": 3927} {"train_loss": -26.061193466186523, "global_step": 325985, "epoch": 3927} {"train_loss": -25.86565589904785, "global_step": 325986, "epoch": 3927} {"train_loss": -25.70953369140625, "global_step": 325987, "epoch": 3927} {"train_loss": -26.365447998046875, "global_step": 325988, "epoch": 3927} {"train_loss": -25.98430824279785, "global_step": 325989, "epoch": 3927} {"train_loss": -26.246479034423828, "global_step": 325990, "epoch": 3927} {"train_loss": -26.24383544921875, "global_step": 325991, "epoch": 3927} {"train_loss": -26.107013702392578, "global_step": 325992, "epoch": 3927} {"train_loss": -26.076324462890625, "global_step": 325993, "epoch": 3927} {"train_loss": -26.22882652282715, "global_step": 325994, "epoch": 3927} {"train_loss": -26.08169937133789, "global_step": 325995, "epoch": 3927} {"train_loss": -26.244104385375977, "global_step": 325996, "epoch": 3927} {"train_loss": -26.205036163330078, "global_step": 325997, "epoch": 3927} {"train_loss": -26.022918701171875, "global_step": 325998, "epoch": 3927} {"train_loss": -25.725915908813477, "global_step": 325999, "epoch": 3927} {"train_loss": -25.86749267578125, "global_step": 326000, "epoch": 3927} {"train_loss": -26.410064697265625, "global_step": 326001, "epoch": 3927} {"train_loss": -25.928625106811523, "global_step": 326002, "epoch": 3927} {"train_loss": -25.878843307495117, "global_step": 326003, "epoch": 3927} {"train_loss": -25.913009643554688, "global_step": 326004, "epoch": 3927} {"train_loss": -26.344970703125, "global_step": 326005, "epoch": 3927} {"train_loss": -25.863309860229492, "global_step": 326006, "epoch": 3927} {"train_loss": -25.532047271728516, "global_step": 326007, "epoch": 3927} {"train_loss": -25.293079376220703, "global_step": 326008, "epoch": 3927} {"train_loss": -25.186635971069336, "global_step": 326009, "epoch": 3927} {"train_loss": -24.99399185180664, "global_step": 326010, "epoch": 3927} {"train_loss": -25.242843627929688, "global_step": 326011, "epoch": 3927} {"train_loss": -25.417417526245117, "global_step": 326012, "epoch": 3927} {"train_loss": -26.101892471313477, "global_step": 326013, "epoch": 3927} {"train_loss": -25.334697723388672, "global_step": 326014, "epoch": 3927} {"train_loss": -25.8172664642334, "global_step": 326015, "epoch": 3927} {"train_loss": -25.732437133789062, "global_step": 326016, "epoch": 3927} {"train_loss": -25.525800704956055, "global_step": 326017, "epoch": 3927} {"train_loss": -25.530744552612305, "global_step": 326018, "epoch": 3927} {"train_loss": -25.542333602905273, "global_step": 326019, "epoch": 3927} {"train_loss": -25.474138259887695, "global_step": 326020, "epoch": 3927} {"train_loss": -25.81953239440918, "global_step": 326021, "epoch": 3927} {"train_loss": -25.88003921508789, "global_step": 326022, "epoch": 3927} {"train_loss": -25.676023230495222, "global_step": 326023, "epoch": 3927, "val_loss": 7211379.0} {"train_loss": -25.39253044128418, "global_step": 326024, "epoch": 3928} {"train_loss": -25.075674057006836, "global_step": 326025, "epoch": 3928} {"train_loss": -25.54610252380371, "global_step": 326026, "epoch": 3928} {"train_loss": -24.996997833251953, "global_step": 326027, "epoch": 3928} {"train_loss": -24.8786678314209, "global_step": 326028, "epoch": 3928} {"train_loss": -25.292036056518555, "global_step": 326029, "epoch": 3928} {"train_loss": -25.277318954467773, "global_step": 326030, "epoch": 3928} {"train_loss": -25.16542625427246, "global_step": 326031, "epoch": 3928} {"train_loss": -25.684289932250977, "global_step": 326032, "epoch": 3928} {"train_loss": -25.301631927490234, "global_step": 326033, "epoch": 3928} {"train_loss": -25.874143600463867, "global_step": 326034, "epoch": 3928} {"train_loss": -25.394039154052734, "global_step": 326035, "epoch": 3928} {"train_loss": -25.115249633789062, "global_step": 326036, "epoch": 3928} {"train_loss": -25.50758934020996, "global_step": 326037, "epoch": 3928} {"train_loss": -25.830707550048828, "global_step": 326038, "epoch": 3928} {"train_loss": -25.27297019958496, "global_step": 326039, "epoch": 3928} {"train_loss": -25.819005966186523, "global_step": 326040, "epoch": 3928} {"train_loss": -25.549957275390625, "global_step": 326041, "epoch": 3928} {"train_loss": -25.764856338500977, "global_step": 326042, "epoch": 3928} {"train_loss": -25.551395416259766, "global_step": 326043, "epoch": 3928} {"train_loss": -25.55000877380371, "global_step": 326044, "epoch": 3928} {"train_loss": -25.662389755249023, "global_step": 326045, "epoch": 3928} {"train_loss": -25.91107177734375, "global_step": 326046, "epoch": 3928} {"train_loss": -26.28692054748535, "global_step": 326047, "epoch": 3928} {"train_loss": -25.59585189819336, "global_step": 326048, "epoch": 3928} {"train_loss": -25.745046615600586, "global_step": 326049, "epoch": 3928} {"train_loss": -25.93230628967285, "global_step": 326050, "epoch": 3928} {"train_loss": -25.819416046142578, "global_step": 326051, "epoch": 3928} {"train_loss": -25.97492027282715, "global_step": 326052, "epoch": 3928} {"train_loss": -26.204614639282227, "global_step": 326053, "epoch": 3928} {"train_loss": -26.10169792175293, "global_step": 326054, "epoch": 3928} {"train_loss": -26.2237606048584, "global_step": 326055, "epoch": 3928} {"train_loss": -26.013397216796875, "global_step": 326056, "epoch": 3928} {"train_loss": -25.554304122924805, "global_step": 326057, "epoch": 3928} {"train_loss": -26.071369171142578, "global_step": 326058, "epoch": 3928} {"train_loss": -26.039899826049805, "global_step": 326059, "epoch": 3928} {"train_loss": -26.085412979125977, "global_step": 326060, "epoch": 3928} {"train_loss": -26.403411865234375, "global_step": 326061, "epoch": 3928} {"train_loss": -25.609634399414062, "global_step": 326062, "epoch": 3928} {"train_loss": -26.130277633666992, "global_step": 326063, "epoch": 3928} {"train_loss": -25.83827781677246, "global_step": 326064, "epoch": 3928} {"train_loss": -26.187341690063477, "global_step": 326065, "epoch": 3928} {"train_loss": -26.060306549072266, "global_step": 326066, "epoch": 3928} {"train_loss": -25.800739288330078, "global_step": 326067, "epoch": 3928} {"train_loss": -25.96221923828125, "global_step": 326068, "epoch": 3928} {"train_loss": -26.094940185546875, "global_step": 326069, "epoch": 3928} {"train_loss": -26.271032333374023, "global_step": 326070, "epoch": 3928} {"train_loss": -26.210599899291992, "global_step": 326071, "epoch": 3928} {"train_loss": -26.00798988342285, "global_step": 326072, "epoch": 3928} {"train_loss": -25.835052490234375, "global_step": 326073, "epoch": 3928} {"train_loss": -25.858869552612305, "global_step": 326074, "epoch": 3928} {"train_loss": -26.050352096557617, "global_step": 326075, "epoch": 3928} {"train_loss": -25.908863067626953, "global_step": 326076, "epoch": 3928} {"train_loss": -25.707212448120117, "global_step": 326077, "epoch": 3928} {"train_loss": -25.982410430908203, "global_step": 326078, "epoch": 3928} {"train_loss": -26.2435245513916, "global_step": 326079, "epoch": 3928} {"train_loss": -26.357763290405273, "global_step": 326080, "epoch": 3928} {"train_loss": -25.74969482421875, "global_step": 326081, "epoch": 3928} {"train_loss": -25.816619873046875, "global_step": 326082, "epoch": 3928} {"train_loss": -25.59003448486328, "global_step": 326083, "epoch": 3928} {"train_loss": -26.1746768951416, "global_step": 326084, "epoch": 3928} {"train_loss": -25.896926879882812, "global_step": 326085, "epoch": 3928} {"train_loss": -25.745386123657227, "global_step": 326086, "epoch": 3928} {"train_loss": -25.381162643432617, "global_step": 326087, "epoch": 3928} {"train_loss": -25.883764266967773, "global_step": 326088, "epoch": 3928} {"train_loss": -25.765064239501953, "global_step": 326089, "epoch": 3928} {"train_loss": -25.862567901611328, "global_step": 326090, "epoch": 3928} {"train_loss": -25.779071807861328, "global_step": 326091, "epoch": 3928} {"train_loss": -25.94732666015625, "global_step": 326092, "epoch": 3928} {"train_loss": -25.552082061767578, "global_step": 326093, "epoch": 3928} {"train_loss": -25.923978805541992, "global_step": 326094, "epoch": 3928} {"train_loss": -25.63556480407715, "global_step": 326095, "epoch": 3928} {"train_loss": -25.745410919189453, "global_step": 326096, "epoch": 3928} {"train_loss": -25.647729873657227, "global_step": 326097, "epoch": 3928} {"train_loss": -25.949604034423828, "global_step": 326098, "epoch": 3928} {"train_loss": -25.50719451904297, "global_step": 326099, "epoch": 3928} {"train_loss": -25.795761108398438, "global_step": 326100, "epoch": 3928} {"train_loss": -25.990432739257812, "global_step": 326101, "epoch": 3928} {"train_loss": -25.604633331298828, "global_step": 326102, "epoch": 3928} {"train_loss": -25.7642765045166, "global_step": 326103, "epoch": 3928} {"train_loss": -25.464502334594727, "global_step": 326104, "epoch": 3928} {"train_loss": -25.84186363220215, "global_step": 326105, "epoch": 3928} {"train_loss": -25.775642119258283, "global_step": 326106, "epoch": 3928, "val_loss": 7197513.0} {"train_loss": -25.187294006347656, "global_step": 326107, "epoch": 3929} {"train_loss": -24.727758407592773, "global_step": 326108, "epoch": 3929} {"train_loss": -25.479276657104492, "global_step": 326109, "epoch": 3929} {"train_loss": -25.365644454956055, "global_step": 326110, "epoch": 3929} {"train_loss": -25.28704833984375, "global_step": 326111, "epoch": 3929} {"train_loss": -25.772968292236328, "global_step": 326112, "epoch": 3929} {"train_loss": -25.097209930419922, "global_step": 326113, "epoch": 3929} {"train_loss": -25.806304931640625, "global_step": 326114, "epoch": 3929} {"train_loss": -25.367475509643555, "global_step": 326115, "epoch": 3929} {"train_loss": -24.990463256835938, "global_step": 326116, "epoch": 3929} {"train_loss": -25.28365707397461, "global_step": 326117, "epoch": 3929} {"train_loss": -25.335098266601562, "global_step": 326118, "epoch": 3929} {"train_loss": -25.739837646484375, "global_step": 326119, "epoch": 3929} {"train_loss": -25.33574867248535, "global_step": 326120, "epoch": 3929} {"train_loss": -25.496931076049805, "global_step": 326121, "epoch": 3929} {"train_loss": -25.553394317626953, "global_step": 326122, "epoch": 3929} {"train_loss": -25.191003799438477, "global_step": 326123, "epoch": 3929} {"train_loss": -25.503995895385742, "global_step": 326124, "epoch": 3929} {"train_loss": -25.763671875, "global_step": 326125, "epoch": 3929} {"train_loss": -25.443525314331055, "global_step": 326126, "epoch": 3929} {"train_loss": -25.401317596435547, "global_step": 326127, "epoch": 3929} {"train_loss": -25.428499221801758, "global_step": 326128, "epoch": 3929} {"train_loss": -25.44209861755371, "global_step": 326129, "epoch": 3929} {"train_loss": -25.473766326904297, "global_step": 326130, "epoch": 3929} {"train_loss": -25.382007598876953, "global_step": 326131, "epoch": 3929} {"train_loss": -25.624237060546875, "global_step": 326132, "epoch": 3929} {"train_loss": -25.56990623474121, "global_step": 326133, "epoch": 3929} {"train_loss": -25.898956298828125, "global_step": 326134, "epoch": 3929} {"train_loss": -25.794952392578125, "global_step": 326135, "epoch": 3929} {"train_loss": -25.704105377197266, "global_step": 326136, "epoch": 3929} {"train_loss": -25.873687744140625, "global_step": 326137, "epoch": 3929} {"train_loss": -25.809778213500977, "global_step": 326138, "epoch": 3929} {"train_loss": -25.534326553344727, "global_step": 326139, "epoch": 3929} {"train_loss": -25.903467178344727, "global_step": 326140, "epoch": 3929} {"train_loss": -25.894113540649414, "global_step": 326141, "epoch": 3929} {"train_loss": -25.70233154296875, "global_step": 326142, "epoch": 3929} {"train_loss": -25.75111198425293, "global_step": 326143, "epoch": 3929} {"train_loss": -25.980224609375, "global_step": 326144, "epoch": 3929} {"train_loss": -26.14739418029785, "global_step": 326145, "epoch": 3929} {"train_loss": -26.12074851989746, "global_step": 326146, "epoch": 3929} {"train_loss": -26.0274658203125, "global_step": 326147, "epoch": 3929} {"train_loss": -25.747577667236328, "global_step": 326148, "epoch": 3929} {"train_loss": -25.925674438476562, "global_step": 326149, "epoch": 3929} {"train_loss": -25.896432876586914, "global_step": 326150, "epoch": 3929} {"train_loss": -25.7676944732666, "global_step": 326151, "epoch": 3929} {"train_loss": -26.176599502563477, "global_step": 326152, "epoch": 3929} {"train_loss": -26.250919342041016, "global_step": 326153, "epoch": 3929} {"train_loss": -26.29312515258789, "global_step": 326154, "epoch": 3929} {"train_loss": -25.738428115844727, "global_step": 326155, "epoch": 3929} {"train_loss": -25.916959762573242, "global_step": 326156, "epoch": 3929} {"train_loss": -25.935373306274414, "global_step": 326157, "epoch": 3929} {"train_loss": -25.857709884643555, "global_step": 326158, "epoch": 3929} {"train_loss": -26.29732322692871, "global_step": 326159, "epoch": 3929} {"train_loss": -25.706024169921875, "global_step": 326160, "epoch": 3929} {"train_loss": -26.147241592407227, "global_step": 326161, "epoch": 3929} {"train_loss": -26.225858688354492, "global_step": 326162, "epoch": 3929} {"train_loss": -26.07793617248535, "global_step": 326163, "epoch": 3929} {"train_loss": -26.257917404174805, "global_step": 326164, "epoch": 3929} {"train_loss": -25.958038330078125, "global_step": 326165, "epoch": 3929} {"train_loss": -25.95167350769043, "global_step": 326166, "epoch": 3929} {"train_loss": -26.260009765625, "global_step": 326167, "epoch": 3929} {"train_loss": -25.917749404907227, "global_step": 326168, "epoch": 3929} {"train_loss": -25.78220558166504, "global_step": 326169, "epoch": 3929} {"train_loss": -26.327863693237305, "global_step": 326170, "epoch": 3929} {"train_loss": -25.78826904296875, "global_step": 326171, "epoch": 3929} {"train_loss": -26.204099655151367, "global_step": 326172, "epoch": 3929} {"train_loss": -26.1738338470459, "global_step": 326173, "epoch": 3929} {"train_loss": -26.02618980407715, "global_step": 326174, "epoch": 3929} {"train_loss": -26.179981231689453, "global_step": 326175, "epoch": 3929} {"train_loss": -26.002490997314453, "global_step": 326176, "epoch": 3929} {"train_loss": -25.93601417541504, "global_step": 326177, "epoch": 3929} {"train_loss": -25.580209732055664, "global_step": 326178, "epoch": 3929} {"train_loss": -25.626575469970703, "global_step": 326179, "epoch": 3929} {"train_loss": -25.289533615112305, "global_step": 326180, "epoch": 3929} {"train_loss": -25.66261100769043, "global_step": 326181, "epoch": 3929} {"train_loss": -26.073816299438477, "global_step": 326182, "epoch": 3929} {"train_loss": -25.677845001220703, "global_step": 326183, "epoch": 3929} {"train_loss": -26.03877067565918, "global_step": 326184, "epoch": 3929} {"train_loss": -25.96687126159668, "global_step": 326185, "epoch": 3929} {"train_loss": -25.629505157470703, "global_step": 326186, "epoch": 3929} {"train_loss": -26.111433029174805, "global_step": 326187, "epoch": 3929} {"train_loss": -25.64817237854004, "global_step": 326188, "epoch": 3929} {"train_loss": -25.76754765338208, "global_step": 326189, "epoch": 3929, "val_loss": 7160012.0} {"train_loss": -25.771240234375, "global_step": 326190, "epoch": 3930} {"train_loss": -25.446327209472656, "global_step": 326191, "epoch": 3930} {"train_loss": -25.132062911987305, "global_step": 326192, "epoch": 3930} {"train_loss": -25.39277458190918, "global_step": 326193, "epoch": 3930} {"train_loss": -25.457609176635742, "global_step": 326194, "epoch": 3930} {"train_loss": -25.59803581237793, "global_step": 326195, "epoch": 3930} {"train_loss": -25.21518325805664, "global_step": 326196, "epoch": 3930} {"train_loss": -25.489633560180664, "global_step": 326197, "epoch": 3930} {"train_loss": -25.50074577331543, "global_step": 326198, "epoch": 3930} {"train_loss": -25.83893394470215, "global_step": 326199, "epoch": 3930} {"train_loss": -25.472639083862305, "global_step": 326200, "epoch": 3930} {"train_loss": -25.306570053100586, "global_step": 326201, "epoch": 3930} {"train_loss": -25.754562377929688, "global_step": 326202, "epoch": 3930} {"train_loss": -25.944278717041016, "global_step": 326203, "epoch": 3930} {"train_loss": -25.592679977416992, "global_step": 326204, "epoch": 3930} {"train_loss": -25.714664459228516, "global_step": 326205, "epoch": 3930} {"train_loss": -25.658126831054688, "global_step": 326206, "epoch": 3930} {"train_loss": -25.463300704956055, "global_step": 326207, "epoch": 3930} {"train_loss": -25.72060203552246, "global_step": 326208, "epoch": 3930} {"train_loss": -25.512432098388672, "global_step": 326209, "epoch": 3930} {"train_loss": -25.713916778564453, "global_step": 326210, "epoch": 3930} {"train_loss": -25.78778648376465, "global_step": 326211, "epoch": 3930} {"train_loss": -25.766437530517578, "global_step": 326212, "epoch": 3930} {"train_loss": -25.64263343811035, "global_step": 326213, "epoch": 3930} {"train_loss": -25.583499908447266, "global_step": 326214, "epoch": 3930} {"train_loss": -25.787006378173828, "global_step": 326215, "epoch": 3930} {"train_loss": -25.62116050720215, "global_step": 326216, "epoch": 3930} {"train_loss": -25.56707763671875, "global_step": 326217, "epoch": 3930} {"train_loss": -26.008386611938477, "global_step": 326218, "epoch": 3930} {"train_loss": -25.750152587890625, "global_step": 326219, "epoch": 3930} {"train_loss": -26.065671920776367, "global_step": 326220, "epoch": 3930} {"train_loss": -25.853544235229492, "global_step": 326221, "epoch": 3930} {"train_loss": -25.72358512878418, "global_step": 326222, "epoch": 3930} {"train_loss": -26.148523330688477, "global_step": 326223, "epoch": 3930} {"train_loss": -25.9509220123291, "global_step": 326224, "epoch": 3930} {"train_loss": -26.115802764892578, "global_step": 326225, "epoch": 3930} {"train_loss": -25.635107040405273, "global_step": 326226, "epoch": 3930} {"train_loss": -26.121084213256836, "global_step": 326227, "epoch": 3930} {"train_loss": -25.701831817626953, "global_step": 326228, "epoch": 3930} {"train_loss": -25.864110946655273, "global_step": 326229, "epoch": 3930} {"train_loss": -26.132965087890625, "global_step": 326230, "epoch": 3930} {"train_loss": -26.047760009765625, "global_step": 326231, "epoch": 3930} {"train_loss": -25.939960479736328, "global_step": 326232, "epoch": 3930} {"train_loss": -25.799467086791992, "global_step": 326233, "epoch": 3930} {"train_loss": -26.21015739440918, "global_step": 326234, "epoch": 3930} {"train_loss": -26.008426666259766, "global_step": 326235, "epoch": 3930} {"train_loss": -26.091073989868164, "global_step": 326236, "epoch": 3930} {"train_loss": -26.157506942749023, "global_step": 326237, "epoch": 3930} {"train_loss": -26.05768394470215, "global_step": 326238, "epoch": 3930} {"train_loss": -26.076574325561523, "global_step": 326239, "epoch": 3930} {"train_loss": -25.876758575439453, "global_step": 326240, "epoch": 3930} {"train_loss": -26.37432861328125, "global_step": 326241, "epoch": 3930} {"train_loss": -26.01161003112793, "global_step": 326242, "epoch": 3930} {"train_loss": -26.223590850830078, "global_step": 326243, "epoch": 3930} {"train_loss": -26.11753273010254, "global_step": 326244, "epoch": 3930} {"train_loss": -25.8980655670166, "global_step": 326245, "epoch": 3930} {"train_loss": -26.16016960144043, "global_step": 326246, "epoch": 3930} {"train_loss": -26.4799747467041, "global_step": 326247, "epoch": 3930} {"train_loss": -26.10159683227539, "global_step": 326248, "epoch": 3930} {"train_loss": -25.778913497924805, "global_step": 326249, "epoch": 3930} {"train_loss": -26.04860496520996, "global_step": 326250, "epoch": 3930} {"train_loss": -25.923974990844727, "global_step": 326251, "epoch": 3930} {"train_loss": -25.24631118774414, "global_step": 326252, "epoch": 3930} {"train_loss": -24.736614227294922, "global_step": 326253, "epoch": 3930} {"train_loss": -24.38636016845703, "global_step": 326254, "epoch": 3930} {"train_loss": -24.744470596313477, "global_step": 326255, "epoch": 3930} {"train_loss": -25.920202255249023, "global_step": 326256, "epoch": 3930} {"train_loss": -25.659381866455078, "global_step": 326257, "epoch": 3930} {"train_loss": -25.804779052734375, "global_step": 326258, "epoch": 3930} {"train_loss": -25.462024688720703, "global_step": 326259, "epoch": 3930} {"train_loss": -25.51607322692871, "global_step": 326260, "epoch": 3930} {"train_loss": -25.703168869018555, "global_step": 326261, "epoch": 3930} {"train_loss": -25.726428985595703, "global_step": 326262, "epoch": 3930} {"train_loss": -25.752593994140625, "global_step": 326263, "epoch": 3930} {"train_loss": -25.57119369506836, "global_step": 326264, "epoch": 3930} {"train_loss": -25.944494247436523, "global_step": 326265, "epoch": 3930} {"train_loss": -25.6621150970459, "global_step": 326266, "epoch": 3930} {"train_loss": -26.089208602905273, "global_step": 326267, "epoch": 3930} {"train_loss": -25.503128051757812, "global_step": 326268, "epoch": 3930} {"train_loss": -25.832433700561523, "global_step": 326269, "epoch": 3930} {"train_loss": -26.077774047851562, "global_step": 326270, "epoch": 3930} {"train_loss": -25.809858322143555, "global_step": 326271, "epoch": 3930} {"train_loss": -25.761427247380634, "global_step": 326272, "epoch": 3930, "val_loss": 7335020.0} {"train_loss": -25.77322769165039, "global_step": 326273, "epoch": 3931} {"train_loss": -25.6005916595459, "global_step": 326274, "epoch": 3931} {"train_loss": -26.0582275390625, "global_step": 326275, "epoch": 3931} {"train_loss": -25.45182991027832, "global_step": 326276, "epoch": 3931} {"train_loss": -25.9591007232666, "global_step": 326277, "epoch": 3931} {"train_loss": -25.804540634155273, "global_step": 326278, "epoch": 3931} {"train_loss": -26.044677734375, "global_step": 326279, "epoch": 3931} {"train_loss": -25.817869186401367, "global_step": 326280, "epoch": 3931} {"train_loss": -25.67579460144043, "global_step": 326281, "epoch": 3931} {"train_loss": -25.9487361907959, "global_step": 326282, "epoch": 3931} {"train_loss": -26.108966827392578, "global_step": 326283, "epoch": 3931} {"train_loss": -26.178943634033203, "global_step": 326284, "epoch": 3931} {"train_loss": -26.169116973876953, "global_step": 326285, "epoch": 3931} {"train_loss": -25.90167236328125, "global_step": 326286, "epoch": 3931} {"train_loss": -26.226362228393555, "global_step": 326287, "epoch": 3931} {"train_loss": -26.082128524780273, "global_step": 326288, "epoch": 3931} {"train_loss": -25.897323608398438, "global_step": 326289, "epoch": 3931} {"train_loss": -25.529722213745117, "global_step": 326290, "epoch": 3931} {"train_loss": -26.065702438354492, "global_step": 326291, "epoch": 3931} {"train_loss": -26.0462646484375, "global_step": 326292, "epoch": 3931} {"train_loss": -26.24930763244629, "global_step": 326293, "epoch": 3931} {"train_loss": -26.029691696166992, "global_step": 326294, "epoch": 3931} {"train_loss": -26.356420516967773, "global_step": 326295, "epoch": 3931} {"train_loss": -25.9705810546875, "global_step": 326296, "epoch": 3931} {"train_loss": -26.318897247314453, "global_step": 326297, "epoch": 3931} {"train_loss": -26.187753677368164, "global_step": 326298, "epoch": 3931} {"train_loss": -26.06345558166504, "global_step": 326299, "epoch": 3931} {"train_loss": -25.885284423828125, "global_step": 326300, "epoch": 3931} {"train_loss": -26.049097061157227, "global_step": 326301, "epoch": 3931} {"train_loss": -26.181501388549805, "global_step": 326302, "epoch": 3931} {"train_loss": -25.90997314453125, "global_step": 326303, "epoch": 3931} {"train_loss": -25.855899810791016, "global_step": 326304, "epoch": 3931} {"train_loss": -25.74482536315918, "global_step": 326305, "epoch": 3931} {"train_loss": -26.137388229370117, "global_step": 326306, "epoch": 3931} {"train_loss": -25.89694595336914, "global_step": 326307, "epoch": 3931} {"train_loss": -25.649892807006836, "global_step": 326308, "epoch": 3931} {"train_loss": -25.633710861206055, "global_step": 326309, "epoch": 3931} {"train_loss": -26.075185775756836, "global_step": 326310, "epoch": 3931} {"train_loss": -26.200525283813477, "global_step": 326311, "epoch": 3931} {"train_loss": -26.214635848999023, "global_step": 326312, "epoch": 3931} {"train_loss": -25.83148765563965, "global_step": 326313, "epoch": 3931} {"train_loss": -26.089160919189453, "global_step": 326314, "epoch": 3931} {"train_loss": -26.341785430908203, "global_step": 326315, "epoch": 3931} {"train_loss": -26.041141510009766, "global_step": 326316, "epoch": 3931} {"train_loss": -25.933095932006836, "global_step": 326317, "epoch": 3931} {"train_loss": -25.656005859375, "global_step": 326318, "epoch": 3931} {"train_loss": -25.964075088500977, "global_step": 326319, "epoch": 3931} {"train_loss": -25.9362850189209, "global_step": 326320, "epoch": 3931} {"train_loss": -25.628467559814453, "global_step": 326321, "epoch": 3931} {"train_loss": -25.641149520874023, "global_step": 326322, "epoch": 3931} {"train_loss": -26.218494415283203, "global_step": 326323, "epoch": 3931} {"train_loss": -25.81342124938965, "global_step": 326324, "epoch": 3931} {"train_loss": -25.898574829101562, "global_step": 326325, "epoch": 3931} {"train_loss": -25.96265983581543, "global_step": 326326, "epoch": 3931} {"train_loss": -26.208765029907227, "global_step": 326327, "epoch": 3931} {"train_loss": -26.205846786499023, "global_step": 326328, "epoch": 3931} {"train_loss": -25.39061164855957, "global_step": 326329, "epoch": 3931} {"train_loss": -26.00958824157715, "global_step": 326330, "epoch": 3931} {"train_loss": -25.661884307861328, "global_step": 326331, "epoch": 3931} {"train_loss": -25.791187286376953, "global_step": 326332, "epoch": 3931} {"train_loss": -25.991575241088867, "global_step": 326333, "epoch": 3931} {"train_loss": -26.0252685546875, "global_step": 326334, "epoch": 3931} {"train_loss": -26.120695114135742, "global_step": 326335, "epoch": 3931} {"train_loss": -26.20371437072754, "global_step": 326336, "epoch": 3931} {"train_loss": -25.922016143798828, "global_step": 326337, "epoch": 3931} {"train_loss": -25.78374671936035, "global_step": 326338, "epoch": 3931} {"train_loss": -25.94135856628418, "global_step": 326339, "epoch": 3931} {"train_loss": -25.471269607543945, "global_step": 326340, "epoch": 3931} {"train_loss": -25.97222328186035, "global_step": 326341, "epoch": 3931} {"train_loss": -25.75666618347168, "global_step": 326342, "epoch": 3931} {"train_loss": -25.80879020690918, "global_step": 326343, "epoch": 3931} {"train_loss": -25.80377769470215, "global_step": 326344, "epoch": 3931} {"train_loss": -25.62863540649414, "global_step": 326345, "epoch": 3931} {"train_loss": -25.815587997436523, "global_step": 326346, "epoch": 3931} {"train_loss": -25.636335372924805, "global_step": 326347, "epoch": 3931} {"train_loss": -26.0018253326416, "global_step": 326348, "epoch": 3931} {"train_loss": -26.089981079101562, "global_step": 326349, "epoch": 3931} {"train_loss": -26.071075439453125, "global_step": 326350, "epoch": 3931} {"train_loss": -25.867218017578125, "global_step": 326351, "epoch": 3931} {"train_loss": -26.116546630859375, "global_step": 326352, "epoch": 3931} {"train_loss": -26.111597061157227, "global_step": 326353, "epoch": 3931} {"train_loss": -25.843557357788086, "global_step": 326354, "epoch": 3931} {"train_loss": -25.954102619584784, "global_step": 326355, "epoch": 3931, "val_loss": 7195584.0} {"train_loss": -25.73779296875, "global_step": 326356, "epoch": 3932} {"train_loss": -25.538217544555664, "global_step": 326357, "epoch": 3932} {"train_loss": -25.593204498291016, "global_step": 326358, "epoch": 3932} {"train_loss": -25.511106491088867, "global_step": 326359, "epoch": 3932} {"train_loss": -25.244998931884766, "global_step": 326360, "epoch": 3932} {"train_loss": -25.818317413330078, "global_step": 326361, "epoch": 3932} {"train_loss": -25.934919357299805, "global_step": 326362, "epoch": 3932} {"train_loss": -25.490478515625, "global_step": 326363, "epoch": 3932} {"train_loss": -25.6330623626709, "global_step": 326364, "epoch": 3932} {"train_loss": -25.660694122314453, "global_step": 326365, "epoch": 3932} {"train_loss": -25.569032669067383, "global_step": 326366, "epoch": 3932} {"train_loss": -25.952930450439453, "global_step": 326367, "epoch": 3932} {"train_loss": -25.7186336517334, "global_step": 326368, "epoch": 3932} {"train_loss": -26.18244743347168, "global_step": 326369, "epoch": 3932} {"train_loss": -25.90354347229004, "global_step": 326370, "epoch": 3932} {"train_loss": -25.956409454345703, "global_step": 326371, "epoch": 3932} {"train_loss": -25.928136825561523, "global_step": 326372, "epoch": 3932} {"train_loss": -26.078222274780273, "global_step": 326373, "epoch": 3932} {"train_loss": -25.715045928955078, "global_step": 326374, "epoch": 3932} {"train_loss": -26.01215171813965, "global_step": 326375, "epoch": 3932} {"train_loss": -25.779523849487305, "global_step": 326376, "epoch": 3932} {"train_loss": -26.033401489257812, "global_step": 326377, "epoch": 3932} {"train_loss": -25.781156539916992, "global_step": 326378, "epoch": 3932} {"train_loss": -25.895658493041992, "global_step": 326379, "epoch": 3932} {"train_loss": -25.693273544311523, "global_step": 326380, "epoch": 3932} {"train_loss": -25.61775016784668, "global_step": 326381, "epoch": 3932} {"train_loss": -25.783700942993164, "global_step": 326382, "epoch": 3932} {"train_loss": -25.700408935546875, "global_step": 326383, "epoch": 3932} {"train_loss": -25.522968292236328, "global_step": 326384, "epoch": 3932} {"train_loss": -25.879852294921875, "global_step": 326385, "epoch": 3932} {"train_loss": -25.644582748413086, "global_step": 326386, "epoch": 3932} {"train_loss": -25.632354736328125, "global_step": 326387, "epoch": 3932} {"train_loss": -25.87236976623535, "global_step": 326388, "epoch": 3932} {"train_loss": -25.295461654663086, "global_step": 326389, "epoch": 3932} {"train_loss": -26.101537704467773, "global_step": 326390, "epoch": 3932} {"train_loss": -25.701440811157227, "global_step": 326391, "epoch": 3932} {"train_loss": -25.714141845703125, "global_step": 326392, "epoch": 3932} {"train_loss": -26.286911010742188, "global_step": 326393, "epoch": 3932} {"train_loss": -25.720020294189453, "global_step": 326394, "epoch": 3932} {"train_loss": -25.60112953186035, "global_step": 326395, "epoch": 3932} {"train_loss": -26.029983520507812, "global_step": 326396, "epoch": 3932} {"train_loss": -26.105695724487305, "global_step": 326397, "epoch": 3932} {"train_loss": -25.56182861328125, "global_step": 326398, "epoch": 3932} {"train_loss": -25.822622299194336, "global_step": 326399, "epoch": 3932} {"train_loss": -25.73914909362793, "global_step": 326400, "epoch": 3932} {"train_loss": -25.83302116394043, "global_step": 326401, "epoch": 3932} {"train_loss": -26.0112361907959, "global_step": 326402, "epoch": 3932} {"train_loss": -26.011655807495117, "global_step": 326403, "epoch": 3932} {"train_loss": -25.821613311767578, "global_step": 326404, "epoch": 3932} {"train_loss": -25.861169815063477, "global_step": 326405, "epoch": 3932} {"train_loss": -25.922170639038086, "global_step": 326406, "epoch": 3932} {"train_loss": -25.894500732421875, "global_step": 326407, "epoch": 3932} {"train_loss": -25.9625244140625, "global_step": 326408, "epoch": 3932} {"train_loss": -25.750959396362305, "global_step": 326409, "epoch": 3932} {"train_loss": -25.850549697875977, "global_step": 326410, "epoch": 3932} {"train_loss": -26.147993087768555, "global_step": 326411, "epoch": 3932} {"train_loss": -25.983154296875, "global_step": 326412, "epoch": 3932} {"train_loss": -26.269758224487305, "global_step": 326413, "epoch": 3932} {"train_loss": -26.054601669311523, "global_step": 326414, "epoch": 3932} {"train_loss": -26.208419799804688, "global_step": 326415, "epoch": 3932} {"train_loss": -25.618759155273438, "global_step": 326416, "epoch": 3932} {"train_loss": -26.1605167388916, "global_step": 326417, "epoch": 3932} {"train_loss": -25.90093421936035, "global_step": 326418, "epoch": 3932} {"train_loss": -26.068252563476562, "global_step": 326419, "epoch": 3932} {"train_loss": -26.20148277282715, "global_step": 326420, "epoch": 3932} {"train_loss": -25.526884078979492, "global_step": 326421, "epoch": 3932} {"train_loss": -26.175445556640625, "global_step": 326422, "epoch": 3932} {"train_loss": -26.390655517578125, "global_step": 326423, "epoch": 3932} {"train_loss": -26.228607177734375, "global_step": 326424, "epoch": 3932} {"train_loss": -26.3280029296875, "global_step": 326425, "epoch": 3932} {"train_loss": -26.010242462158203, "global_step": 326426, "epoch": 3932} {"train_loss": -25.932861328125, "global_step": 326427, "epoch": 3932} {"train_loss": -25.92840576171875, "global_step": 326428, "epoch": 3932} {"train_loss": -26.2093563079834, "global_step": 326429, "epoch": 3932} {"train_loss": -26.408283233642578, "global_step": 326430, "epoch": 3932} {"train_loss": -26.085546493530273, "global_step": 326431, "epoch": 3932} {"train_loss": -25.80598258972168, "global_step": 326432, "epoch": 3932} {"train_loss": -25.57195472717285, "global_step": 326433, "epoch": 3932} {"train_loss": -25.487890243530273, "global_step": 326434, "epoch": 3932} {"train_loss": -25.71766471862793, "global_step": 326435, "epoch": 3932} {"train_loss": -25.587249755859375, "global_step": 326436, "epoch": 3932} {"train_loss": -25.888036727905273, "global_step": 326437, "epoch": 3932} {"train_loss": -25.849711245801075, "global_step": 326438, "epoch": 3932, "val_loss": 7201199.0} {"train_loss": -24.890384674072266, "global_step": 326439, "epoch": 3933} {"train_loss": -25.356643676757812, "global_step": 326440, "epoch": 3933} {"train_loss": -25.116811752319336, "global_step": 326441, "epoch": 3933} {"train_loss": -25.395071029663086, "global_step": 326442, "epoch": 3933} {"train_loss": -25.26698112487793, "global_step": 326443, "epoch": 3933} {"train_loss": -25.259883880615234, "global_step": 326444, "epoch": 3933} {"train_loss": -25.77783203125, "global_step": 326445, "epoch": 3933} {"train_loss": -25.694849014282227, "global_step": 326446, "epoch": 3933} {"train_loss": -25.631671905517578, "global_step": 326447, "epoch": 3933} {"train_loss": -25.394094467163086, "global_step": 326448, "epoch": 3933} {"train_loss": -26.007343292236328, "global_step": 326449, "epoch": 3933} {"train_loss": -25.72119140625, "global_step": 326450, "epoch": 3933} {"train_loss": -25.66928482055664, "global_step": 326451, "epoch": 3933} {"train_loss": -25.470617294311523, "global_step": 326452, "epoch": 3933} {"train_loss": -26.090253829956055, "global_step": 326453, "epoch": 3933} {"train_loss": -25.896692276000977, "global_step": 326454, "epoch": 3933} {"train_loss": -25.734495162963867, "global_step": 326455, "epoch": 3933} {"train_loss": -26.006921768188477, "global_step": 326456, "epoch": 3933} {"train_loss": -25.735212326049805, "global_step": 326457, "epoch": 3933} {"train_loss": -25.619924545288086, "global_step": 326458, "epoch": 3933} {"train_loss": -25.875900268554688, "global_step": 326459, "epoch": 3933} {"train_loss": -25.512527465820312, "global_step": 326460, "epoch": 3933} {"train_loss": -25.8763370513916, "global_step": 326461, "epoch": 3933} {"train_loss": -25.8668270111084, "global_step": 326462, "epoch": 3933} {"train_loss": -26.035364151000977, "global_step": 326463, "epoch": 3933} {"train_loss": -25.900766372680664, "global_step": 326464, "epoch": 3933} {"train_loss": -25.963239669799805, "global_step": 326465, "epoch": 3933} {"train_loss": -26.23908042907715, "global_step": 326466, "epoch": 3933} {"train_loss": -25.842365264892578, "global_step": 326467, "epoch": 3933} {"train_loss": -26.204355239868164, "global_step": 326468, "epoch": 3933} {"train_loss": -26.105911254882812, "global_step": 326469, "epoch": 3933} {"train_loss": -25.72751808166504, "global_step": 326470, "epoch": 3933} {"train_loss": -25.93059730529785, "global_step": 326471, "epoch": 3933} {"train_loss": -26.381948471069336, "global_step": 326472, "epoch": 3933} {"train_loss": -25.97629165649414, "global_step": 326473, "epoch": 3933} {"train_loss": -26.114286422729492, "global_step": 326474, "epoch": 3933} {"train_loss": -25.63034439086914, "global_step": 326475, "epoch": 3933} {"train_loss": -25.57463264465332, "global_step": 326476, "epoch": 3933} {"train_loss": -25.7536678314209, "global_step": 326477, "epoch": 3933} {"train_loss": -25.8864688873291, "global_step": 326478, "epoch": 3933} {"train_loss": -26.269262313842773, "global_step": 326479, "epoch": 3933} {"train_loss": -26.448583602905273, "global_step": 326480, "epoch": 3933} {"train_loss": -26.326704025268555, "global_step": 326481, "epoch": 3933} {"train_loss": -26.374494552612305, "global_step": 326482, "epoch": 3933} {"train_loss": -25.81916618347168, "global_step": 326483, "epoch": 3933} {"train_loss": -26.038867950439453, "global_step": 326484, "epoch": 3933} {"train_loss": -26.185958862304688, "global_step": 326485, "epoch": 3933} {"train_loss": -25.85208511352539, "global_step": 326486, "epoch": 3933} {"train_loss": -25.650897979736328, "global_step": 326487, "epoch": 3933} {"train_loss": -25.734058380126953, "global_step": 326488, "epoch": 3933} {"train_loss": -26.07869529724121, "global_step": 326489, "epoch": 3933} {"train_loss": -25.989154815673828, "global_step": 326490, "epoch": 3933} {"train_loss": -25.98103904724121, "global_step": 326491, "epoch": 3933} {"train_loss": -25.905521392822266, "global_step": 326492, "epoch": 3933} {"train_loss": -25.76556396484375, "global_step": 326493, "epoch": 3933} {"train_loss": -25.675519943237305, "global_step": 326494, "epoch": 3933} {"train_loss": -25.77581787109375, "global_step": 326495, "epoch": 3933} {"train_loss": -25.486560821533203, "global_step": 326496, "epoch": 3933} {"train_loss": -25.638080596923828, "global_step": 326497, "epoch": 3933} {"train_loss": -25.6199951171875, "global_step": 326498, "epoch": 3933} {"train_loss": -25.597257614135742, "global_step": 326499, "epoch": 3933} {"train_loss": -26.10784912109375, "global_step": 326500, "epoch": 3933} {"train_loss": -25.980854034423828, "global_step": 326501, "epoch": 3933} {"train_loss": -26.002782821655273, "global_step": 326502, "epoch": 3933} {"train_loss": -25.702594757080078, "global_step": 326503, "epoch": 3933} {"train_loss": -26.037805557250977, "global_step": 326504, "epoch": 3933} {"train_loss": -25.8050594329834, "global_step": 326505, "epoch": 3933} {"train_loss": -26.18501091003418, "global_step": 326506, "epoch": 3933} {"train_loss": -25.92389488220215, "global_step": 326507, "epoch": 3933} {"train_loss": -26.098342895507812, "global_step": 326508, "epoch": 3933} {"train_loss": -25.869115829467773, "global_step": 326509, "epoch": 3933} {"train_loss": -25.947097778320312, "global_step": 326510, "epoch": 3933} {"train_loss": -25.461170196533203, "global_step": 326511, "epoch": 3933} {"train_loss": -25.79568862915039, "global_step": 326512, "epoch": 3933} {"train_loss": -26.265064239501953, "global_step": 326513, "epoch": 3933} {"train_loss": -25.844684600830078, "global_step": 326514, "epoch": 3933} {"train_loss": -25.683670043945312, "global_step": 326515, "epoch": 3933} {"train_loss": -26.39557456970215, "global_step": 326516, "epoch": 3933} {"train_loss": -25.945898056030273, "global_step": 326517, "epoch": 3933} {"train_loss": -26.026386260986328, "global_step": 326518, "epoch": 3933} {"train_loss": -26.297195434570312, "global_step": 326519, "epoch": 3933} {"train_loss": -26.210119247436523, "global_step": 326520, "epoch": 3933} {"train_loss": -25.83821099063, "global_step": 326521, "epoch": 3933, "val_loss": 7275187.5} {"train_loss": -24.659748077392578, "global_step": 326522, "epoch": 3934} {"train_loss": -23.01679801940918, "global_step": 326523, "epoch": 3934} {"train_loss": -22.377805709838867, "global_step": 326524, "epoch": 3934} {"train_loss": -23.756940841674805, "global_step": 326525, "epoch": 3934} {"train_loss": -24.743038177490234, "global_step": 326526, "epoch": 3934} {"train_loss": -24.77536964416504, "global_step": 326527, "epoch": 3934} {"train_loss": -24.931833267211914, "global_step": 326528, "epoch": 3934} {"train_loss": -25.14957046508789, "global_step": 326529, "epoch": 3934} {"train_loss": -24.636550903320312, "global_step": 326530, "epoch": 3934} {"train_loss": -25.287826538085938, "global_step": 326531, "epoch": 3934} {"train_loss": -25.20161247253418, "global_step": 326532, "epoch": 3934} {"train_loss": -24.994253158569336, "global_step": 326533, "epoch": 3934} {"train_loss": -24.999013900756836, "global_step": 326534, "epoch": 3934} {"train_loss": -25.46759796142578, "global_step": 326535, "epoch": 3934} {"train_loss": -25.347131729125977, "global_step": 326536, "epoch": 3934} {"train_loss": -25.28689956665039, "global_step": 326537, "epoch": 3934} {"train_loss": -25.315814971923828, "global_step": 326538, "epoch": 3934} {"train_loss": -25.201984405517578, "global_step": 326539, "epoch": 3934} {"train_loss": -25.723535537719727, "global_step": 326540, "epoch": 3934} {"train_loss": -25.841291427612305, "global_step": 326541, "epoch": 3934} {"train_loss": -25.197507858276367, "global_step": 326542, "epoch": 3934} {"train_loss": -25.557538986206055, "global_step": 326543, "epoch": 3934} {"train_loss": -25.84955406188965, "global_step": 326544, "epoch": 3934} {"train_loss": -25.749887466430664, "global_step": 326545, "epoch": 3934} {"train_loss": -25.248117446899414, "global_step": 326546, "epoch": 3934} {"train_loss": -25.826990127563477, "global_step": 326547, "epoch": 3934} {"train_loss": -25.78557777404785, "global_step": 326548, "epoch": 3934} {"train_loss": -25.805831909179688, "global_step": 326549, "epoch": 3934} {"train_loss": -25.870019912719727, "global_step": 326550, "epoch": 3934} {"train_loss": -25.80824089050293, "global_step": 326551, "epoch": 3934} {"train_loss": -25.867828369140625, "global_step": 326552, "epoch": 3934} {"train_loss": -25.59775161743164, "global_step": 326553, "epoch": 3934} {"train_loss": -25.61673355102539, "global_step": 326554, "epoch": 3934} {"train_loss": -25.98988151550293, "global_step": 326555, "epoch": 3934} {"train_loss": -26.087890625, "global_step": 326556, "epoch": 3934} {"train_loss": -25.90717124938965, "global_step": 326557, "epoch": 3934} {"train_loss": -25.7884578704834, "global_step": 326558, "epoch": 3934} {"train_loss": -25.797687530517578, "global_step": 326559, "epoch": 3934} {"train_loss": -25.84929847717285, "global_step": 326560, "epoch": 3934} {"train_loss": -25.966012954711914, "global_step": 326561, "epoch": 3934} {"train_loss": -26.087055206298828, "global_step": 326562, "epoch": 3934} {"train_loss": -26.119237899780273, "global_step": 326563, "epoch": 3934} {"train_loss": -25.9466552734375, "global_step": 326564, "epoch": 3934} {"train_loss": -25.790821075439453, "global_step": 326565, "epoch": 3934} {"train_loss": -26.124786376953125, "global_step": 326566, "epoch": 3934} {"train_loss": -26.060474395751953, "global_step": 326567, "epoch": 3934} {"train_loss": -25.9217472076416, "global_step": 326568, "epoch": 3934} {"train_loss": -26.103469848632812, "global_step": 326569, "epoch": 3934} {"train_loss": -25.993494033813477, "global_step": 326570, "epoch": 3934} {"train_loss": -25.595218658447266, "global_step": 326571, "epoch": 3934} {"train_loss": -25.604206085205078, "global_step": 326572, "epoch": 3934} {"train_loss": -26.138944625854492, "global_step": 326573, "epoch": 3934} {"train_loss": -25.771804809570312, "global_step": 326574, "epoch": 3934} {"train_loss": -26.208740234375, "global_step": 326575, "epoch": 3934} {"train_loss": -26.003538131713867, "global_step": 326576, "epoch": 3934} {"train_loss": -25.713525772094727, "global_step": 326577, "epoch": 3934} {"train_loss": -25.94807243347168, "global_step": 326578, "epoch": 3934} {"train_loss": -26.176563262939453, "global_step": 326579, "epoch": 3934} {"train_loss": -25.733539581298828, "global_step": 326580, "epoch": 3934} {"train_loss": -25.517988204956055, "global_step": 326581, "epoch": 3934} {"train_loss": -25.517005920410156, "global_step": 326582, "epoch": 3934} {"train_loss": -26.297277450561523, "global_step": 326583, "epoch": 3934} {"train_loss": -26.1624755859375, "global_step": 326584, "epoch": 3934} {"train_loss": -25.88351821899414, "global_step": 326585, "epoch": 3934} {"train_loss": -25.707239151000977, "global_step": 326586, "epoch": 3934} {"train_loss": -25.87049674987793, "global_step": 326587, "epoch": 3934} {"train_loss": -25.725128173828125, "global_step": 326588, "epoch": 3934} {"train_loss": -25.944915771484375, "global_step": 326589, "epoch": 3934} {"train_loss": -25.984006881713867, "global_step": 326590, "epoch": 3934} {"train_loss": -25.980504989624023, "global_step": 326591, "epoch": 3934} {"train_loss": -25.93971061706543, "global_step": 326592, "epoch": 3934} {"train_loss": -25.76787757873535, "global_step": 326593, "epoch": 3934} {"train_loss": -26.1980037689209, "global_step": 326594, "epoch": 3934} {"train_loss": -25.59791374206543, "global_step": 326595, "epoch": 3934} {"train_loss": -26.216217041015625, "global_step": 326596, "epoch": 3934} {"train_loss": -26.169111251831055, "global_step": 326597, "epoch": 3934} {"train_loss": -26.16985511779785, "global_step": 326598, "epoch": 3934} {"train_loss": -25.95891761779785, "global_step": 326599, "epoch": 3934} {"train_loss": -25.986356735229492, "global_step": 326600, "epoch": 3934} {"train_loss": -26.31672477722168, "global_step": 326601, "epoch": 3934} {"train_loss": -25.784595489501953, "global_step": 326602, "epoch": 3934} {"train_loss": -26.403461456298828, "global_step": 326603, "epoch": 3934} {"train_loss": -25.649910869368586, "global_step": 326604, "epoch": 3934, "val_loss": 7264387.0} {"train_loss": -24.947786331176758, "global_step": 326605, "epoch": 3935} {"train_loss": -25.732580184936523, "global_step": 326606, "epoch": 3935} {"train_loss": -25.693145751953125, "global_step": 326607, "epoch": 3935} {"train_loss": -25.72503662109375, "global_step": 326608, "epoch": 3935} {"train_loss": -25.764074325561523, "global_step": 326609, "epoch": 3935} {"train_loss": -25.845794677734375, "global_step": 326610, "epoch": 3935} {"train_loss": -25.599130630493164, "global_step": 326611, "epoch": 3935} {"train_loss": -25.68832778930664, "global_step": 326612, "epoch": 3935} {"train_loss": -25.266937255859375, "global_step": 326613, "epoch": 3935} {"train_loss": -25.790616989135742, "global_step": 326614, "epoch": 3935} {"train_loss": -25.55242919921875, "global_step": 326615, "epoch": 3935} {"train_loss": -25.320575714111328, "global_step": 326616, "epoch": 3935} {"train_loss": -25.810171127319336, "global_step": 326617, "epoch": 3935} {"train_loss": -25.566177368164062, "global_step": 326618, "epoch": 3935} {"train_loss": -25.41627311706543, "global_step": 326619, "epoch": 3935} {"train_loss": -25.6613712310791, "global_step": 326620, "epoch": 3935} {"train_loss": -25.66712760925293, "global_step": 326621, "epoch": 3935} {"train_loss": -25.60821533203125, "global_step": 326622, "epoch": 3935} {"train_loss": -25.376813888549805, "global_step": 326623, "epoch": 3935} {"train_loss": -25.82916259765625, "global_step": 326624, "epoch": 3935} {"train_loss": -25.534366607666016, "global_step": 326625, "epoch": 3935} {"train_loss": -25.751501083374023, "global_step": 326626, "epoch": 3935} {"train_loss": -25.863264083862305, "global_step": 326627, "epoch": 3935} {"train_loss": -25.66640281677246, "global_step": 326628, "epoch": 3935} {"train_loss": -25.92535972595215, "global_step": 326629, "epoch": 3935} {"train_loss": -26.150182723999023, "global_step": 326630, "epoch": 3935} {"train_loss": -25.894495010375977, "global_step": 326631, "epoch": 3935} {"train_loss": -25.924901962280273, "global_step": 326632, "epoch": 3935} {"train_loss": -26.095691680908203, "global_step": 326633, "epoch": 3935} {"train_loss": -25.707956314086914, "global_step": 326634, "epoch": 3935} {"train_loss": -25.87494468688965, "global_step": 326635, "epoch": 3935} {"train_loss": -25.760852813720703, "global_step": 326636, "epoch": 3935} {"train_loss": -26.070749282836914, "global_step": 326637, "epoch": 3935} {"train_loss": -25.8896541595459, "global_step": 326638, "epoch": 3935} {"train_loss": -25.723779678344727, "global_step": 326639, "epoch": 3935} {"train_loss": -25.85479736328125, "global_step": 326640, "epoch": 3935} {"train_loss": -25.93132972717285, "global_step": 326641, "epoch": 3935} {"train_loss": -25.986042022705078, "global_step": 326642, "epoch": 3935} {"train_loss": -26.168710708618164, "global_step": 326643, "epoch": 3935} {"train_loss": -26.17547607421875, "global_step": 326644, "epoch": 3935} {"train_loss": -25.832996368408203, "global_step": 326645, "epoch": 3935} {"train_loss": -26.159900665283203, "global_step": 326646, "epoch": 3935} {"train_loss": -26.0401668548584, "global_step": 326647, "epoch": 3935} {"train_loss": -25.830408096313477, "global_step": 326648, "epoch": 3935} {"train_loss": -26.259084701538086, "global_step": 326649, "epoch": 3935} {"train_loss": -25.885290145874023, "global_step": 326650, "epoch": 3935} {"train_loss": -26.06939125061035, "global_step": 326651, "epoch": 3935} {"train_loss": -26.094308853149414, "global_step": 326652, "epoch": 3935} {"train_loss": -26.153507232666016, "global_step": 326653, "epoch": 3935} {"train_loss": -26.29018211364746, "global_step": 326654, "epoch": 3935} {"train_loss": -25.981857299804688, "global_step": 326655, "epoch": 3935} {"train_loss": -25.9158935546875, "global_step": 326656, "epoch": 3935} {"train_loss": -26.20461082458496, "global_step": 326657, "epoch": 3935} {"train_loss": -26.225635528564453, "global_step": 326658, "epoch": 3935} {"train_loss": -25.8189754486084, "global_step": 326659, "epoch": 3935} {"train_loss": -26.304275512695312, "global_step": 326660, "epoch": 3935} {"train_loss": -26.07057762145996, "global_step": 326661, "epoch": 3935} {"train_loss": -26.07769775390625, "global_step": 326662, "epoch": 3935} {"train_loss": -26.091150283813477, "global_step": 326663, "epoch": 3935} {"train_loss": -26.4019832611084, "global_step": 326664, "epoch": 3935} {"train_loss": -26.206668853759766, "global_step": 326665, "epoch": 3935} {"train_loss": -25.853057861328125, "global_step": 326666, "epoch": 3935} {"train_loss": -25.878711700439453, "global_step": 326667, "epoch": 3935} {"train_loss": -26.100849151611328, "global_step": 326668, "epoch": 3935} {"train_loss": -25.98420524597168, "global_step": 326669, "epoch": 3935} {"train_loss": -25.7567195892334, "global_step": 326670, "epoch": 3935} {"train_loss": -26.017480850219727, "global_step": 326671, "epoch": 3935} {"train_loss": -25.679052352905273, "global_step": 326672, "epoch": 3935} {"train_loss": -26.120641708374023, "global_step": 326673, "epoch": 3935} {"train_loss": -25.759735107421875, "global_step": 326674, "epoch": 3935} {"train_loss": -26.013769149780273, "global_step": 326675, "epoch": 3935} {"train_loss": -26.09370231628418, "global_step": 326676, "epoch": 3935} {"train_loss": -26.048511505126953, "global_step": 326677, "epoch": 3935} {"train_loss": -25.860584259033203, "global_step": 326678, "epoch": 3935} {"train_loss": -25.862577438354492, "global_step": 326679, "epoch": 3935} {"train_loss": -26.238012313842773, "global_step": 326680, "epoch": 3935} {"train_loss": -25.954303741455078, "global_step": 326681, "epoch": 3935} {"train_loss": -25.821069717407227, "global_step": 326682, "epoch": 3935} {"train_loss": -25.87455177307129, "global_step": 326683, "epoch": 3935} {"train_loss": -25.52680015563965, "global_step": 326684, "epoch": 3935} {"train_loss": -24.919645309448242, "global_step": 326685, "epoch": 3935} {"train_loss": -24.98773765563965, "global_step": 326686, "epoch": 3935} {"train_loss": -25.826537718255835, "global_step": 326687, "epoch": 3935, "val_loss": 7159314.5} {"train_loss": -25.71821403503418, "global_step": 326688, "epoch": 3936} {"train_loss": -25.13356590270996, "global_step": 326689, "epoch": 3936} {"train_loss": -25.46432876586914, "global_step": 326690, "epoch": 3936} {"train_loss": -25.477628707885742, "global_step": 326691, "epoch": 3936} {"train_loss": -25.2320556640625, "global_step": 326692, "epoch": 3936} {"train_loss": -25.48858070373535, "global_step": 326693, "epoch": 3936} {"train_loss": -25.56586265563965, "global_step": 326694, "epoch": 3936} {"train_loss": -25.28844451904297, "global_step": 326695, "epoch": 3936} {"train_loss": -25.046798706054688, "global_step": 326696, "epoch": 3936} {"train_loss": -25.749683380126953, "global_step": 326697, "epoch": 3936} {"train_loss": -25.514667510986328, "global_step": 326698, "epoch": 3936} {"train_loss": -25.732343673706055, "global_step": 326699, "epoch": 3936} {"train_loss": -26.043720245361328, "global_step": 326700, "epoch": 3936} {"train_loss": -25.380184173583984, "global_step": 326701, "epoch": 3936} {"train_loss": -25.708419799804688, "global_step": 326702, "epoch": 3936} {"train_loss": -25.77956199645996, "global_step": 326703, "epoch": 3936} {"train_loss": -25.701955795288086, "global_step": 326704, "epoch": 3936} {"train_loss": -25.72903823852539, "global_step": 326705, "epoch": 3936} {"train_loss": -25.937841415405273, "global_step": 326706, "epoch": 3936} {"train_loss": -26.317474365234375, "global_step": 326707, "epoch": 3936} {"train_loss": -25.759353637695312, "global_step": 326708, "epoch": 3936} {"train_loss": -25.79596519470215, "global_step": 326709, "epoch": 3936} {"train_loss": -25.665517807006836, "global_step": 326710, "epoch": 3936} {"train_loss": -25.958545684814453, "global_step": 326711, "epoch": 3936} {"train_loss": -25.860708236694336, "global_step": 326712, "epoch": 3936} {"train_loss": -25.614179611206055, "global_step": 326713, "epoch": 3936} {"train_loss": -25.752798080444336, "global_step": 326714, "epoch": 3936} {"train_loss": -25.539758682250977, "global_step": 326715, "epoch": 3936} {"train_loss": -25.857709884643555, "global_step": 326716, "epoch": 3936} {"train_loss": -25.947406768798828, "global_step": 326717, "epoch": 3936} {"train_loss": -26.1671142578125, "global_step": 326718, "epoch": 3936} {"train_loss": -25.94989585876465, "global_step": 326719, "epoch": 3936} {"train_loss": -26.163375854492188, "global_step": 326720, "epoch": 3936} {"train_loss": -25.861557006835938, "global_step": 326721, "epoch": 3936} {"train_loss": -25.77686882019043, "global_step": 326722, "epoch": 3936} {"train_loss": -26.01619529724121, "global_step": 326723, "epoch": 3936} {"train_loss": -26.055585861206055, "global_step": 326724, "epoch": 3936} {"train_loss": -25.647369384765625, "global_step": 326725, "epoch": 3936} {"train_loss": -25.80378532409668, "global_step": 326726, "epoch": 3936} {"train_loss": -25.91218376159668, "global_step": 326727, "epoch": 3936} {"train_loss": -26.121091842651367, "global_step": 326728, "epoch": 3936} {"train_loss": -25.853845596313477, "global_step": 326729, "epoch": 3936} {"train_loss": -26.5736083984375, "global_step": 326730, "epoch": 3936} {"train_loss": -26.230194091796875, "global_step": 326731, "epoch": 3936} {"train_loss": -26.167301177978516, "global_step": 326732, "epoch": 3936} {"train_loss": -25.865530014038086, "global_step": 326733, "epoch": 3936} {"train_loss": -25.708288192749023, "global_step": 326734, "epoch": 3936} {"train_loss": -25.986921310424805, "global_step": 326735, "epoch": 3936} {"train_loss": -25.9960994720459, "global_step": 326736, "epoch": 3936} {"train_loss": -26.0947322845459, "global_step": 326737, "epoch": 3936} {"train_loss": -25.73249626159668, "global_step": 326738, "epoch": 3936} {"train_loss": -25.98297119140625, "global_step": 326739, "epoch": 3936} {"train_loss": -25.586395263671875, "global_step": 326740, "epoch": 3936} {"train_loss": -25.65252685546875, "global_step": 326741, "epoch": 3936} {"train_loss": -25.400909423828125, "global_step": 326742, "epoch": 3936} {"train_loss": -25.7205753326416, "global_step": 326743, "epoch": 3936} {"train_loss": -26.24224281311035, "global_step": 326744, "epoch": 3936} {"train_loss": -25.717060089111328, "global_step": 326745, "epoch": 3936} {"train_loss": -26.310821533203125, "global_step": 326746, "epoch": 3936} {"train_loss": -25.916234970092773, "global_step": 326747, "epoch": 3936} {"train_loss": -25.866275787353516, "global_step": 326748, "epoch": 3936} {"train_loss": -25.91668701171875, "global_step": 326749, "epoch": 3936} {"train_loss": -26.132282257080078, "global_step": 326750, "epoch": 3936} {"train_loss": -25.786787033081055, "global_step": 326751, "epoch": 3936} {"train_loss": -25.724029541015625, "global_step": 326752, "epoch": 3936} {"train_loss": -25.795019149780273, "global_step": 326753, "epoch": 3936} {"train_loss": -26.117767333984375, "global_step": 326754, "epoch": 3936} {"train_loss": -25.713897705078125, "global_step": 326755, "epoch": 3936} {"train_loss": -25.941333770751953, "global_step": 326756, "epoch": 3936} {"train_loss": -25.620513916015625, "global_step": 326757, "epoch": 3936} {"train_loss": -26.174482345581055, "global_step": 326758, "epoch": 3936} {"train_loss": -25.950408935546875, "global_step": 326759, "epoch": 3936} {"train_loss": -26.324201583862305, "global_step": 326760, "epoch": 3936} {"train_loss": -26.05332374572754, "global_step": 326761, "epoch": 3936} {"train_loss": -26.035242080688477, "global_step": 326762, "epoch": 3936} {"train_loss": -26.28635025024414, "global_step": 326763, "epoch": 3936} {"train_loss": -25.657739639282227, "global_step": 326764, "epoch": 3936} {"train_loss": -25.977951049804688, "global_step": 326765, "epoch": 3936} {"train_loss": -25.720006942749023, "global_step": 326766, "epoch": 3936} {"train_loss": -25.530405044555664, "global_step": 326767, "epoch": 3936} {"train_loss": -25.927579879760742, "global_step": 326768, "epoch": 3936} {"train_loss": -26.024648666381836, "global_step": 326769, "epoch": 3936} {"train_loss": -25.831307169902754, "global_step": 326770, "epoch": 3936, "val_loss": 7351568.0} {"train_loss": -24.82373046875, "global_step": 326771, "epoch": 3937} {"train_loss": -24.482816696166992, "global_step": 326772, "epoch": 3937} {"train_loss": -25.132339477539062, "global_step": 326773, "epoch": 3937} {"train_loss": -24.89339256286621, "global_step": 326774, "epoch": 3937} {"train_loss": -24.931949615478516, "global_step": 326775, "epoch": 3937} {"train_loss": -24.657447814941406, "global_step": 326776, "epoch": 3937} {"train_loss": -25.408361434936523, "global_step": 326777, "epoch": 3937} {"train_loss": -25.35822105407715, "global_step": 326778, "epoch": 3937} {"train_loss": -24.948253631591797, "global_step": 326779, "epoch": 3937} {"train_loss": -25.398597717285156, "global_step": 326780, "epoch": 3937} {"train_loss": -25.329328536987305, "global_step": 326781, "epoch": 3937} {"train_loss": -25.611562728881836, "global_step": 326782, "epoch": 3937} {"train_loss": -24.890592575073242, "global_step": 326783, "epoch": 3937} {"train_loss": -25.34748649597168, "global_step": 326784, "epoch": 3937} {"train_loss": -25.13678550720215, "global_step": 326785, "epoch": 3937} {"train_loss": -25.557687759399414, "global_step": 326786, "epoch": 3937} {"train_loss": -25.213207244873047, "global_step": 326787, "epoch": 3937} {"train_loss": -25.45891761779785, "global_step": 326788, "epoch": 3937} {"train_loss": -25.153539657592773, "global_step": 326789, "epoch": 3937} {"train_loss": -25.367231369018555, "global_step": 326790, "epoch": 3937} {"train_loss": -25.16060447692871, "global_step": 326791, "epoch": 3937} {"train_loss": -25.255979537963867, "global_step": 326792, "epoch": 3937} {"train_loss": -25.612567901611328, "global_step": 326793, "epoch": 3937} {"train_loss": -25.403766632080078, "global_step": 326794, "epoch": 3937} {"train_loss": -25.862592697143555, "global_step": 326795, "epoch": 3937} {"train_loss": -25.31937599182129, "global_step": 326796, "epoch": 3937} {"train_loss": -25.39615249633789, "global_step": 326797, "epoch": 3937} {"train_loss": -25.578100204467773, "global_step": 326798, "epoch": 3937} {"train_loss": -25.879247665405273, "global_step": 326799, "epoch": 3937} {"train_loss": -25.51906967163086, "global_step": 326800, "epoch": 3937} {"train_loss": -25.60524559020996, "global_step": 326801, "epoch": 3937} {"train_loss": -25.69648551940918, "global_step": 326802, "epoch": 3937} {"train_loss": -25.635833740234375, "global_step": 326803, "epoch": 3937} {"train_loss": -25.764169692993164, "global_step": 326804, "epoch": 3937} {"train_loss": -25.726943969726562, "global_step": 326805, "epoch": 3937} {"train_loss": -25.818876266479492, "global_step": 326806, "epoch": 3937} {"train_loss": -25.784860610961914, "global_step": 326807, "epoch": 3937} {"train_loss": -26.080556869506836, "global_step": 326808, "epoch": 3937} {"train_loss": -25.857770919799805, "global_step": 326809, "epoch": 3937} {"train_loss": -25.641748428344727, "global_step": 326810, "epoch": 3937} {"train_loss": -26.021162033081055, "global_step": 326811, "epoch": 3937} {"train_loss": -26.003503799438477, "global_step": 326812, "epoch": 3937} {"train_loss": -25.801664352416992, "global_step": 326813, "epoch": 3937} {"train_loss": -26.032962799072266, "global_step": 326814, "epoch": 3937} {"train_loss": -25.621601104736328, "global_step": 326815, "epoch": 3937} {"train_loss": -26.319583892822266, "global_step": 326816, "epoch": 3937} {"train_loss": -26.122705459594727, "global_step": 326817, "epoch": 3937} {"train_loss": -26.069791793823242, "global_step": 326818, "epoch": 3937} {"train_loss": -26.286664962768555, "global_step": 326819, "epoch": 3937} {"train_loss": -25.986942291259766, "global_step": 326820, "epoch": 3937} {"train_loss": -26.238849639892578, "global_step": 326821, "epoch": 3937} {"train_loss": -26.239532470703125, "global_step": 326822, "epoch": 3937} {"train_loss": -25.887845993041992, "global_step": 326823, "epoch": 3937} {"train_loss": -26.10357093811035, "global_step": 326824, "epoch": 3937} {"train_loss": -26.116743087768555, "global_step": 326825, "epoch": 3937} {"train_loss": -25.888961791992188, "global_step": 326826, "epoch": 3937} {"train_loss": -26.008874893188477, "global_step": 326827, "epoch": 3937} {"train_loss": -25.603607177734375, "global_step": 326828, "epoch": 3937} {"train_loss": -26.3304443359375, "global_step": 326829, "epoch": 3937} {"train_loss": -26.119739532470703, "global_step": 326830, "epoch": 3937} {"train_loss": -26.05368995666504, "global_step": 326831, "epoch": 3937} {"train_loss": -25.76716423034668, "global_step": 326832, "epoch": 3937} {"train_loss": -25.866943359375, "global_step": 326833, "epoch": 3937} {"train_loss": -25.85739517211914, "global_step": 326834, "epoch": 3937} {"train_loss": -26.246671676635742, "global_step": 326835, "epoch": 3937} {"train_loss": -25.614194869995117, "global_step": 326836, "epoch": 3937} {"train_loss": -25.65576171875, "global_step": 326837, "epoch": 3937} {"train_loss": -25.995534896850586, "global_step": 326838, "epoch": 3937} {"train_loss": -26.0323486328125, "global_step": 326839, "epoch": 3937} {"train_loss": -25.595701217651367, "global_step": 326840, "epoch": 3937} {"train_loss": -25.58603858947754, "global_step": 326841, "epoch": 3937} {"train_loss": -25.804218292236328, "global_step": 326842, "epoch": 3937} {"train_loss": -25.788122177124023, "global_step": 326843, "epoch": 3937} {"train_loss": -25.4998836517334, "global_step": 326844, "epoch": 3937} {"train_loss": -26.29365348815918, "global_step": 326845, "epoch": 3937} {"train_loss": -25.8524169921875, "global_step": 326846, "epoch": 3937} {"train_loss": -25.76498794555664, "global_step": 326847, "epoch": 3937} {"train_loss": -26.047504425048828, "global_step": 326848, "epoch": 3937} {"train_loss": -25.864404678344727, "global_step": 326849, "epoch": 3937} {"train_loss": -25.63739013671875, "global_step": 326850, "epoch": 3937} {"train_loss": -26.037946701049805, "global_step": 326851, "epoch": 3937} {"train_loss": -25.977643966674805, "global_step": 326852, "epoch": 3937} {"train_loss": -25.65736605173134, "global_step": 326853, "epoch": 3937, "val_loss": 7226330.0} {"train_loss": -25.36202049255371, "global_step": 326854, "epoch": 3938} {"train_loss": -25.43413734436035, "global_step": 326855, "epoch": 3938} {"train_loss": -24.651182174682617, "global_step": 326856, "epoch": 3938} {"train_loss": -24.97857666015625, "global_step": 326857, "epoch": 3938} {"train_loss": -25.01278305053711, "global_step": 326858, "epoch": 3938} {"train_loss": -24.887868881225586, "global_step": 326859, "epoch": 3938} {"train_loss": -24.907367706298828, "global_step": 326860, "epoch": 3938} {"train_loss": -24.93316650390625, "global_step": 326861, "epoch": 3938} {"train_loss": -25.178220748901367, "global_step": 326862, "epoch": 3938} {"train_loss": -24.940889358520508, "global_step": 326863, "epoch": 3938} {"train_loss": -25.08463478088379, "global_step": 326864, "epoch": 3938} {"train_loss": -25.315052032470703, "global_step": 326865, "epoch": 3938} {"train_loss": -25.439924240112305, "global_step": 326866, "epoch": 3938} {"train_loss": -25.37103843688965, "global_step": 326867, "epoch": 3938} {"train_loss": -25.19007682800293, "global_step": 326868, "epoch": 3938} {"train_loss": -25.51764488220215, "global_step": 326869, "epoch": 3938} {"train_loss": -25.197147369384766, "global_step": 326870, "epoch": 3938} {"train_loss": -25.563581466674805, "global_step": 326871, "epoch": 3938} {"train_loss": -25.22747802734375, "global_step": 326872, "epoch": 3938} {"train_loss": -25.659399032592773, "global_step": 326873, "epoch": 3938} {"train_loss": -25.62666130065918, "global_step": 326874, "epoch": 3938} {"train_loss": -25.55219268798828, "global_step": 326875, "epoch": 3938} {"train_loss": -25.60450553894043, "global_step": 326876, "epoch": 3938} {"train_loss": -25.7299861907959, "global_step": 326877, "epoch": 3938} {"train_loss": -25.866043090820312, "global_step": 326878, "epoch": 3938} {"train_loss": -25.614500045776367, "global_step": 326879, "epoch": 3938} {"train_loss": -25.684316635131836, "global_step": 326880, "epoch": 3938} {"train_loss": -25.59059715270996, "global_step": 326881, "epoch": 3938} {"train_loss": -25.79334831237793, "global_step": 326882, "epoch": 3938} {"train_loss": -25.95627784729004, "global_step": 326883, "epoch": 3938} {"train_loss": -26.18694496154785, "global_step": 326884, "epoch": 3938} {"train_loss": -26.2119197845459, "global_step": 326885, "epoch": 3938} {"train_loss": -25.765771865844727, "global_step": 326886, "epoch": 3938} {"train_loss": -25.997678756713867, "global_step": 326887, "epoch": 3938} {"train_loss": -26.0657958984375, "global_step": 326888, "epoch": 3938} {"train_loss": -26.10089683532715, "global_step": 326889, "epoch": 3938} {"train_loss": -26.06271743774414, "global_step": 326890, "epoch": 3938} {"train_loss": -25.903104782104492, "global_step": 326891, "epoch": 3938} {"train_loss": -25.744359970092773, "global_step": 326892, "epoch": 3938} {"train_loss": -26.0030574798584, "global_step": 326893, "epoch": 3938} {"train_loss": -26.077680587768555, "global_step": 326894, "epoch": 3938} {"train_loss": -26.16462516784668, "global_step": 326895, "epoch": 3938} {"train_loss": -25.775497436523438, "global_step": 326896, "epoch": 3938} {"train_loss": -26.26816749572754, "global_step": 326897, "epoch": 3938} {"train_loss": -25.77583122253418, "global_step": 326898, "epoch": 3938} {"train_loss": -25.644529342651367, "global_step": 326899, "epoch": 3938} {"train_loss": -25.601266860961914, "global_step": 326900, "epoch": 3938} {"train_loss": -25.658594131469727, "global_step": 326901, "epoch": 3938} {"train_loss": -26.0513973236084, "global_step": 326902, "epoch": 3938} {"train_loss": -26.211502075195312, "global_step": 326903, "epoch": 3938} {"train_loss": -25.544706344604492, "global_step": 326904, "epoch": 3938} {"train_loss": -25.86366081237793, "global_step": 326905, "epoch": 3938} {"train_loss": -26.127094268798828, "global_step": 326906, "epoch": 3938} {"train_loss": -25.94817543029785, "global_step": 326907, "epoch": 3938} {"train_loss": -26.00373649597168, "global_step": 326908, "epoch": 3938} {"train_loss": -26.07313346862793, "global_step": 326909, "epoch": 3938} {"train_loss": -26.071008682250977, "global_step": 326910, "epoch": 3938} {"train_loss": -25.709653854370117, "global_step": 326911, "epoch": 3938} {"train_loss": -25.952863693237305, "global_step": 326912, "epoch": 3938} {"train_loss": -25.871976852416992, "global_step": 326913, "epoch": 3938} {"train_loss": -25.9298038482666, "global_step": 326914, "epoch": 3938} {"train_loss": -25.78607749938965, "global_step": 326915, "epoch": 3938} {"train_loss": -25.687149047851562, "global_step": 326916, "epoch": 3938} {"train_loss": -25.828672409057617, "global_step": 326917, "epoch": 3938} {"train_loss": -26.117334365844727, "global_step": 326918, "epoch": 3938} {"train_loss": -26.00565528869629, "global_step": 326919, "epoch": 3938} {"train_loss": -25.886341094970703, "global_step": 326920, "epoch": 3938} {"train_loss": -25.9594783782959, "global_step": 326921, "epoch": 3938} {"train_loss": -25.698888778686523, "global_step": 326922, "epoch": 3938} {"train_loss": -25.832305908203125, "global_step": 326923, "epoch": 3938} {"train_loss": -25.95026969909668, "global_step": 326924, "epoch": 3938} {"train_loss": -26.054960250854492, "global_step": 326925, "epoch": 3938} {"train_loss": -26.038183212280273, "global_step": 326926, "epoch": 3938} {"train_loss": -26.082563400268555, "global_step": 326927, "epoch": 3938} {"train_loss": -25.722003936767578, "global_step": 326928, "epoch": 3938} {"train_loss": -25.760656356811523, "global_step": 326929, "epoch": 3938} {"train_loss": -26.096149444580078, "global_step": 326930, "epoch": 3938} {"train_loss": -25.770889282226562, "global_step": 326931, "epoch": 3938} {"train_loss": -25.6944637298584, "global_step": 326932, "epoch": 3938} {"train_loss": -25.92555046081543, "global_step": 326933, "epoch": 3938} {"train_loss": -26.1364688873291, "global_step": 326934, "epoch": 3938} {"train_loss": -26.115392684936523, "global_step": 326935, "epoch": 3938} {"train_loss": -25.73641885045063, "global_step": 326936, "epoch": 3938, "val_loss": 7262844.0} {"train_loss": -24.107572555541992, "global_step": 326937, "epoch": 3939} {"train_loss": -24.930700302124023, "global_step": 326938, "epoch": 3939} {"train_loss": -25.154874801635742, "global_step": 326939, "epoch": 3939} {"train_loss": -24.638824462890625, "global_step": 326940, "epoch": 3939} {"train_loss": -25.386987686157227, "global_step": 326941, "epoch": 3939} {"train_loss": -24.974924087524414, "global_step": 326942, "epoch": 3939} {"train_loss": -25.212278366088867, "global_step": 326943, "epoch": 3939} {"train_loss": -24.988142013549805, "global_step": 326944, "epoch": 3939} {"train_loss": -25.469390869140625, "global_step": 326945, "epoch": 3939} {"train_loss": -25.1303768157959, "global_step": 326946, "epoch": 3939} {"train_loss": -25.153472900390625, "global_step": 326947, "epoch": 3939} {"train_loss": -25.513931274414062, "global_step": 326948, "epoch": 3939} {"train_loss": -25.073347091674805, "global_step": 326949, "epoch": 3939} {"train_loss": -25.302154541015625, "global_step": 326950, "epoch": 3939} {"train_loss": -25.068471908569336, "global_step": 326951, "epoch": 3939} {"train_loss": -25.65654945373535, "global_step": 326952, "epoch": 3939} {"train_loss": -25.176645278930664, "global_step": 326953, "epoch": 3939} {"train_loss": -25.621662139892578, "global_step": 326954, "epoch": 3939} {"train_loss": -25.514375686645508, "global_step": 326955, "epoch": 3939} {"train_loss": -25.47909927368164, "global_step": 326956, "epoch": 3939} {"train_loss": -25.3525333404541, "global_step": 326957, "epoch": 3939} {"train_loss": -25.848596572875977, "global_step": 326958, "epoch": 3939} {"train_loss": -25.274850845336914, "global_step": 326959, "epoch": 3939} {"train_loss": -25.25857162475586, "global_step": 326960, "epoch": 3939} {"train_loss": -25.90888023376465, "global_step": 326961, "epoch": 3939} {"train_loss": -25.97852897644043, "global_step": 326962, "epoch": 3939} {"train_loss": -25.68898582458496, "global_step": 326963, "epoch": 3939} {"train_loss": -25.753360748291016, "global_step": 326964, "epoch": 3939} {"train_loss": -25.743091583251953, "global_step": 326965, "epoch": 3939} {"train_loss": -26.030139923095703, "global_step": 326966, "epoch": 3939} {"train_loss": -25.614831924438477, "global_step": 326967, "epoch": 3939} {"train_loss": -25.633560180664062, "global_step": 326968, "epoch": 3939} {"train_loss": -25.823261260986328, "global_step": 326969, "epoch": 3939} {"train_loss": -25.792007446289062, "global_step": 326970, "epoch": 3939} {"train_loss": -25.756391525268555, "global_step": 326971, "epoch": 3939} {"train_loss": -25.863574981689453, "global_step": 326972, "epoch": 3939} {"train_loss": -25.917768478393555, "global_step": 326973, "epoch": 3939} {"train_loss": -25.88300895690918, "global_step": 326974, "epoch": 3939} {"train_loss": -26.124725341796875, "global_step": 326975, "epoch": 3939} {"train_loss": -25.724252700805664, "global_step": 326976, "epoch": 3939} {"train_loss": -26.004165649414062, "global_step": 326977, "epoch": 3939} {"train_loss": -25.839635848999023, "global_step": 326978, "epoch": 3939} {"train_loss": -25.833450317382812, "global_step": 326979, "epoch": 3939} {"train_loss": -26.251874923706055, "global_step": 326980, "epoch": 3939} {"train_loss": -26.0942440032959, "global_step": 326981, "epoch": 3939} {"train_loss": -26.14373779296875, "global_step": 326982, "epoch": 3939} {"train_loss": -25.883270263671875, "global_step": 326983, "epoch": 3939} {"train_loss": -26.192520141601562, "global_step": 326984, "epoch": 3939} {"train_loss": -26.122121810913086, "global_step": 326985, "epoch": 3939} {"train_loss": -26.483556747436523, "global_step": 326986, "epoch": 3939} {"train_loss": -26.13394546508789, "global_step": 326987, "epoch": 3939} {"train_loss": -26.15191650390625, "global_step": 326988, "epoch": 3939} {"train_loss": -26.031681060791016, "global_step": 326989, "epoch": 3939} {"train_loss": -25.790771484375, "global_step": 326990, "epoch": 3939} {"train_loss": -25.925024032592773, "global_step": 326991, "epoch": 3939} {"train_loss": -25.637571334838867, "global_step": 326992, "epoch": 3939} {"train_loss": -26.437108993530273, "global_step": 326993, "epoch": 3939} {"train_loss": -26.058990478515625, "global_step": 326994, "epoch": 3939} {"train_loss": -26.375394821166992, "global_step": 326995, "epoch": 3939} {"train_loss": -25.649805068969727, "global_step": 326996, "epoch": 3939} {"train_loss": -26.035282135009766, "global_step": 326997, "epoch": 3939} {"train_loss": -25.539958953857422, "global_step": 326998, "epoch": 3939} {"train_loss": -25.737781524658203, "global_step": 326999, "epoch": 3939} {"train_loss": -26.28489112854004, "global_step": 327000, "epoch": 3939} {"train_loss": -26.14594841003418, "global_step": 327001, "epoch": 3939} {"train_loss": -25.694787979125977, "global_step": 327002, "epoch": 3939} {"train_loss": -26.049945831298828, "global_step": 327003, "epoch": 3939} {"train_loss": -25.8209228515625, "global_step": 327004, "epoch": 3939} {"train_loss": -25.66412925720215, "global_step": 327005, "epoch": 3939} {"train_loss": -25.680164337158203, "global_step": 327006, "epoch": 3939} {"train_loss": -25.78194236755371, "global_step": 327007, "epoch": 3939} {"train_loss": -25.688079833984375, "global_step": 327008, "epoch": 3939} {"train_loss": -25.664052963256836, "global_step": 327009, "epoch": 3939} {"train_loss": -25.533140182495117, "global_step": 327010, "epoch": 3939} {"train_loss": -25.923192977905273, "global_step": 327011, "epoch": 3939} {"train_loss": -25.601285934448242, "global_step": 327012, "epoch": 3939} {"train_loss": -26.02431297302246, "global_step": 327013, "epoch": 3939} {"train_loss": -26.231281280517578, "global_step": 327014, "epoch": 3939} {"train_loss": -26.028234481811523, "global_step": 327015, "epoch": 3939} {"train_loss": -26.225576400756836, "global_step": 327016, "epoch": 3939} {"train_loss": -26.031421661376953, "global_step": 327017, "epoch": 3939} {"train_loss": -25.640914916992188, "global_step": 327018, "epoch": 3939} {"train_loss": -25.712490035826903, "global_step": 327019, "epoch": 3939, "val_loss": 7189313.0} {"train_loss": -25.141611099243164, "global_step": 327020, "epoch": 3940} {"train_loss": -24.64654541015625, "global_step": 327021, "epoch": 3940} {"train_loss": -25.68703269958496, "global_step": 327022, "epoch": 3940} {"train_loss": -25.413532257080078, "global_step": 327023, "epoch": 3940} {"train_loss": -24.49721336364746, "global_step": 327024, "epoch": 3940} {"train_loss": -24.99372673034668, "global_step": 327025, "epoch": 3940} {"train_loss": -25.36754608154297, "global_step": 327026, "epoch": 3940} {"train_loss": -24.829221725463867, "global_step": 327027, "epoch": 3940} {"train_loss": -25.234262466430664, "global_step": 327028, "epoch": 3940} {"train_loss": -25.335491180419922, "global_step": 327029, "epoch": 3940} {"train_loss": -25.712427139282227, "global_step": 327030, "epoch": 3940} {"train_loss": -25.257373809814453, "global_step": 327031, "epoch": 3940} {"train_loss": -25.25369644165039, "global_step": 327032, "epoch": 3940} {"train_loss": -25.3822078704834, "global_step": 327033, "epoch": 3940} {"train_loss": -25.674352645874023, "global_step": 327034, "epoch": 3940} {"train_loss": -25.33024024963379, "global_step": 327035, "epoch": 3940} {"train_loss": -25.463851928710938, "global_step": 327036, "epoch": 3940} {"train_loss": -25.81913185119629, "global_step": 327037, "epoch": 3940} {"train_loss": -25.42548942565918, "global_step": 327038, "epoch": 3940} {"train_loss": -25.83003807067871, "global_step": 327039, "epoch": 3940} {"train_loss": -25.81756591796875, "global_step": 327040, "epoch": 3940} {"train_loss": -25.69365882873535, "global_step": 327041, "epoch": 3940} {"train_loss": -25.521108627319336, "global_step": 327042, "epoch": 3940} {"train_loss": -25.864944458007812, "global_step": 327043, "epoch": 3940} {"train_loss": -25.87225341796875, "global_step": 327044, "epoch": 3940} {"train_loss": -25.626577377319336, "global_step": 327045, "epoch": 3940} {"train_loss": -25.960336685180664, "global_step": 327046, "epoch": 3940} {"train_loss": -25.771780014038086, "global_step": 327047, "epoch": 3940} {"train_loss": -25.612289428710938, "global_step": 327048, "epoch": 3940} {"train_loss": -25.647802352905273, "global_step": 327049, "epoch": 3940} {"train_loss": -25.929407119750977, "global_step": 327050, "epoch": 3940} {"train_loss": -26.03460693359375, "global_step": 327051, "epoch": 3940} {"train_loss": -25.778568267822266, "global_step": 327052, "epoch": 3940} {"train_loss": -25.89453125, "global_step": 327053, "epoch": 3940} {"train_loss": -26.170507431030273, "global_step": 327054, "epoch": 3940} {"train_loss": -26.076032638549805, "global_step": 327055, "epoch": 3940} {"train_loss": -26.26642417907715, "global_step": 327056, "epoch": 3940} {"train_loss": -26.00321388244629, "global_step": 327057, "epoch": 3940} {"train_loss": -25.7252197265625, "global_step": 327058, "epoch": 3940} {"train_loss": -26.2198486328125, "global_step": 327059, "epoch": 3940} {"train_loss": -26.018543243408203, "global_step": 327060, "epoch": 3940} {"train_loss": -25.676488876342773, "global_step": 327061, "epoch": 3940} {"train_loss": -25.814573287963867, "global_step": 327062, "epoch": 3940} {"train_loss": -26.04534339904785, "global_step": 327063, "epoch": 3940} {"train_loss": -25.975448608398438, "global_step": 327064, "epoch": 3940} {"train_loss": -25.935546875, "global_step": 327065, "epoch": 3940} {"train_loss": -25.915210723876953, "global_step": 327066, "epoch": 3940} {"train_loss": -25.948766708374023, "global_step": 327067, "epoch": 3940} {"train_loss": -26.307519912719727, "global_step": 327068, "epoch": 3940} {"train_loss": -26.01727294921875, "global_step": 327069, "epoch": 3940} {"train_loss": -26.17266273498535, "global_step": 327070, "epoch": 3940} {"train_loss": -26.03238296508789, "global_step": 327071, "epoch": 3940} {"train_loss": -26.514450073242188, "global_step": 327072, "epoch": 3940} {"train_loss": -26.118911743164062, "global_step": 327073, "epoch": 3940} {"train_loss": -25.88001823425293, "global_step": 327074, "epoch": 3940} {"train_loss": -26.099365234375, "global_step": 327075, "epoch": 3940} {"train_loss": -26.001367568969727, "global_step": 327076, "epoch": 3940} {"train_loss": -26.263784408569336, "global_step": 327077, "epoch": 3940} {"train_loss": -26.153348922729492, "global_step": 327078, "epoch": 3940} {"train_loss": -25.888565063476562, "global_step": 327079, "epoch": 3940} {"train_loss": -25.290645599365234, "global_step": 327080, "epoch": 3940} {"train_loss": -25.912036895751953, "global_step": 327081, "epoch": 3940} {"train_loss": -26.339298248291016, "global_step": 327082, "epoch": 3940} {"train_loss": -25.716848373413086, "global_step": 327083, "epoch": 3940} {"train_loss": -25.896869659423828, "global_step": 327084, "epoch": 3940} {"train_loss": -26.343658447265625, "global_step": 327085, "epoch": 3940} {"train_loss": -26.11622428894043, "global_step": 327086, "epoch": 3940} {"train_loss": -26.13433837890625, "global_step": 327087, "epoch": 3940} {"train_loss": -25.838953018188477, "global_step": 327088, "epoch": 3940} {"train_loss": -25.56458854675293, "global_step": 327089, "epoch": 3940} {"train_loss": -26.13441276550293, "global_step": 327090, "epoch": 3940} {"train_loss": -26.0563907623291, "global_step": 327091, "epoch": 3940} {"train_loss": -25.627548217773438, "global_step": 327092, "epoch": 3940} {"train_loss": -25.718536376953125, "global_step": 327093, "epoch": 3940} {"train_loss": -25.47100257873535, "global_step": 327094, "epoch": 3940} {"train_loss": -26.10664939880371, "global_step": 327095, "epoch": 3940} {"train_loss": -25.971670150756836, "global_step": 327096, "epoch": 3940} {"train_loss": -25.77399253845215, "global_step": 327097, "epoch": 3940} {"train_loss": -25.81502342224121, "global_step": 327098, "epoch": 3940} {"train_loss": -26.042036056518555, "global_step": 327099, "epoch": 3940} {"train_loss": -25.6491641998291, "global_step": 327100, "epoch": 3940} {"train_loss": -26.410200119018555, "global_step": 327101, "epoch": 3940} {"train_loss": -25.775492771562323, "global_step": 327102, "epoch": 3940, "val_loss": 7161631.0} {"train_loss": -25.51447868347168, "global_step": 327103, "epoch": 3941} {"train_loss": -25.510404586791992, "global_step": 327104, "epoch": 3941} {"train_loss": -25.3643856048584, "global_step": 327105, "epoch": 3941} {"train_loss": -25.48902130126953, "global_step": 327106, "epoch": 3941} {"train_loss": -25.359180450439453, "global_step": 327107, "epoch": 3941} {"train_loss": -25.562286376953125, "global_step": 327108, "epoch": 3941} {"train_loss": -25.828144073486328, "global_step": 327109, "epoch": 3941} {"train_loss": -25.309024810791016, "global_step": 327110, "epoch": 3941} {"train_loss": -25.834985733032227, "global_step": 327111, "epoch": 3941} {"train_loss": -25.62944984436035, "global_step": 327112, "epoch": 3941} {"train_loss": -26.285369873046875, "global_step": 327113, "epoch": 3941} {"train_loss": -25.589311599731445, "global_step": 327114, "epoch": 3941} {"train_loss": -25.75351905822754, "global_step": 327115, "epoch": 3941} {"train_loss": -25.58487319946289, "global_step": 327116, "epoch": 3941} {"train_loss": -25.712400436401367, "global_step": 327117, "epoch": 3941} {"train_loss": -26.018604278564453, "global_step": 327118, "epoch": 3941} {"train_loss": -25.478809356689453, "global_step": 327119, "epoch": 3941} {"train_loss": -25.95308494567871, "global_step": 327120, "epoch": 3941} {"train_loss": -25.687955856323242, "global_step": 327121, "epoch": 3941} {"train_loss": -25.451908111572266, "global_step": 327122, "epoch": 3941} {"train_loss": -25.975223541259766, "global_step": 327123, "epoch": 3941} {"train_loss": -26.064218521118164, "global_step": 327124, "epoch": 3941} {"train_loss": -25.85052490234375, "global_step": 327125, "epoch": 3941} {"train_loss": -25.933826446533203, "global_step": 327126, "epoch": 3941} {"train_loss": -26.017282485961914, "global_step": 327127, "epoch": 3941} {"train_loss": -26.22627830505371, "global_step": 327128, "epoch": 3941} {"train_loss": -26.019399642944336, "global_step": 327129, "epoch": 3941} {"train_loss": -25.824621200561523, "global_step": 327130, "epoch": 3941} {"train_loss": -26.04022789001465, "global_step": 327131, "epoch": 3941} {"train_loss": -26.047941207885742, "global_step": 327132, "epoch": 3941} {"train_loss": -25.98556900024414, "global_step": 327133, "epoch": 3941} {"train_loss": -26.28669548034668, "global_step": 327134, "epoch": 3941} {"train_loss": -26.138275146484375, "global_step": 327135, "epoch": 3941} {"train_loss": -26.200902938842773, "global_step": 327136, "epoch": 3941} {"train_loss": -26.16659927368164, "global_step": 327137, "epoch": 3941} {"train_loss": -25.667875289916992, "global_step": 327138, "epoch": 3941} {"train_loss": -25.930191040039062, "global_step": 327139, "epoch": 3941} {"train_loss": -25.997838973999023, "global_step": 327140, "epoch": 3941} {"train_loss": -25.56451988220215, "global_step": 327141, "epoch": 3941} {"train_loss": -25.553438186645508, "global_step": 327142, "epoch": 3941} {"train_loss": -25.306692123413086, "global_step": 327143, "epoch": 3941} {"train_loss": -25.99041175842285, "global_step": 327144, "epoch": 3941} {"train_loss": -25.944915771484375, "global_step": 327145, "epoch": 3941} {"train_loss": -25.897235870361328, "global_step": 327146, "epoch": 3941} {"train_loss": -26.02109146118164, "global_step": 327147, "epoch": 3941} {"train_loss": -25.8524112701416, "global_step": 327148, "epoch": 3941} {"train_loss": -26.056066513061523, "global_step": 327149, "epoch": 3941} {"train_loss": -26.150588989257812, "global_step": 327150, "epoch": 3941} {"train_loss": -26.06560707092285, "global_step": 327151, "epoch": 3941} {"train_loss": -25.88522720336914, "global_step": 327152, "epoch": 3941} {"train_loss": -26.272748947143555, "global_step": 327153, "epoch": 3941} {"train_loss": -26.260053634643555, "global_step": 327154, "epoch": 3941} {"train_loss": -26.10443687438965, "global_step": 327155, "epoch": 3941} {"train_loss": -26.09814453125, "global_step": 327156, "epoch": 3941} {"train_loss": -26.506973266601562, "global_step": 327157, "epoch": 3941} {"train_loss": -26.161649703979492, "global_step": 327158, "epoch": 3941} {"train_loss": -25.636981964111328, "global_step": 327159, "epoch": 3941} {"train_loss": -26.053083419799805, "global_step": 327160, "epoch": 3941} {"train_loss": -26.05022621154785, "global_step": 327161, "epoch": 3941} {"train_loss": -26.245630264282227, "global_step": 327162, "epoch": 3941} {"train_loss": -26.277170181274414, "global_step": 327163, "epoch": 3941} {"train_loss": -25.59479331970215, "global_step": 327164, "epoch": 3941} {"train_loss": -25.127647399902344, "global_step": 327165, "epoch": 3941} {"train_loss": -25.36800193786621, "global_step": 327166, "epoch": 3941} {"train_loss": -25.79388427734375, "global_step": 327167, "epoch": 3941} {"train_loss": -25.63555908203125, "global_step": 327168, "epoch": 3941} {"train_loss": -25.030166625976562, "global_step": 327169, "epoch": 3941} {"train_loss": -25.73636817932129, "global_step": 327170, "epoch": 3941} {"train_loss": -25.782445907592773, "global_step": 327171, "epoch": 3941} {"train_loss": -25.796796798706055, "global_step": 327172, "epoch": 3941} {"train_loss": -25.527637481689453, "global_step": 327173, "epoch": 3941} {"train_loss": -25.7717227935791, "global_step": 327174, "epoch": 3941} {"train_loss": -25.934844970703125, "global_step": 327175, "epoch": 3941} {"train_loss": -25.734460830688477, "global_step": 327176, "epoch": 3941} {"train_loss": -25.545578002929688, "global_step": 327177, "epoch": 3941} {"train_loss": -25.81717872619629, "global_step": 327178, "epoch": 3941} {"train_loss": -25.531641006469727, "global_step": 327179, "epoch": 3941} {"train_loss": -25.820575714111328, "global_step": 327180, "epoch": 3941} {"train_loss": -25.600738525390625, "global_step": 327181, "epoch": 3941} {"train_loss": -25.802539825439453, "global_step": 327182, "epoch": 3941} {"train_loss": -25.493579864501953, "global_step": 327183, "epoch": 3941} {"train_loss": -25.862186431884766, "global_step": 327184, "epoch": 3941} {"train_loss": -25.83528038392584, "global_step": 327185, "epoch": 3941, "val_loss": 7250140.0} {"train_loss": -24.985876083374023, "global_step": 327186, "epoch": 3942} {"train_loss": -25.043306350708008, "global_step": 327187, "epoch": 3942} {"train_loss": -25.28407096862793, "global_step": 327188, "epoch": 3942} {"train_loss": -24.959440231323242, "global_step": 327189, "epoch": 3942} {"train_loss": -25.33051872253418, "global_step": 327190, "epoch": 3942} {"train_loss": -25.275787353515625, "global_step": 327191, "epoch": 3942} {"train_loss": -25.340103149414062, "global_step": 327192, "epoch": 3942} {"train_loss": -25.316978454589844, "global_step": 327193, "epoch": 3942} {"train_loss": -24.994508743286133, "global_step": 327194, "epoch": 3942} {"train_loss": -25.3848934173584, "global_step": 327195, "epoch": 3942} {"train_loss": -25.78464126586914, "global_step": 327196, "epoch": 3942} {"train_loss": -25.337385177612305, "global_step": 327197, "epoch": 3942} {"train_loss": -25.36603355407715, "global_step": 327198, "epoch": 3942} {"train_loss": -25.64522361755371, "global_step": 327199, "epoch": 3942} {"train_loss": -25.429052352905273, "global_step": 327200, "epoch": 3942} {"train_loss": -25.421472549438477, "global_step": 327201, "epoch": 3942} {"train_loss": -25.560617446899414, "global_step": 327202, "epoch": 3942} {"train_loss": -25.276168823242188, "global_step": 327203, "epoch": 3942} {"train_loss": -25.76865577697754, "global_step": 327204, "epoch": 3942} {"train_loss": -25.57406997680664, "global_step": 327205, "epoch": 3942} {"train_loss": -25.811756134033203, "global_step": 327206, "epoch": 3942} {"train_loss": -25.682886123657227, "global_step": 327207, "epoch": 3942} {"train_loss": -25.82203483581543, "global_step": 327208, "epoch": 3942} {"train_loss": -25.67205810546875, "global_step": 327209, "epoch": 3942} {"train_loss": -25.70782470703125, "global_step": 327210, "epoch": 3942} {"train_loss": -25.767065048217773, "global_step": 327211, "epoch": 3942} {"train_loss": -25.7613582611084, "global_step": 327212, "epoch": 3942} {"train_loss": -25.795032501220703, "global_step": 327213, "epoch": 3942} {"train_loss": -25.916889190673828, "global_step": 327214, "epoch": 3942} {"train_loss": -25.744836807250977, "global_step": 327215, "epoch": 3942} {"train_loss": -25.80881118774414, "global_step": 327216, "epoch": 3942} {"train_loss": -26.192968368530273, "global_step": 327217, "epoch": 3942} {"train_loss": -25.884235382080078, "global_step": 327218, "epoch": 3942} {"train_loss": -25.87091636657715, "global_step": 327219, "epoch": 3942} {"train_loss": -26.225433349609375, "global_step": 327220, "epoch": 3942} {"train_loss": -25.968250274658203, "global_step": 327221, "epoch": 3942} {"train_loss": -26.233600616455078, "global_step": 327222, "epoch": 3942} {"train_loss": -25.957834243774414, "global_step": 327223, "epoch": 3942} {"train_loss": -26.060321807861328, "global_step": 327224, "epoch": 3942} {"train_loss": -26.06715202331543, "global_step": 327225, "epoch": 3942} {"train_loss": -26.189538955688477, "global_step": 327226, "epoch": 3942} {"train_loss": -25.7630558013916, "global_step": 327227, "epoch": 3942} {"train_loss": -26.402875900268555, "global_step": 327228, "epoch": 3942} {"train_loss": -26.026227951049805, "global_step": 327229, "epoch": 3942} {"train_loss": -25.995466232299805, "global_step": 327230, "epoch": 3942} {"train_loss": -25.72003173828125, "global_step": 327231, "epoch": 3942} {"train_loss": -26.210723876953125, "global_step": 327232, "epoch": 3942} {"train_loss": -25.749420166015625, "global_step": 327233, "epoch": 3942} {"train_loss": -26.03645133972168, "global_step": 327234, "epoch": 3942} {"train_loss": -26.012683868408203, "global_step": 327235, "epoch": 3942} {"train_loss": -26.110544204711914, "global_step": 327236, "epoch": 3942} {"train_loss": -25.832427978515625, "global_step": 327237, "epoch": 3942} {"train_loss": -25.999176025390625, "global_step": 327238, "epoch": 3942} {"train_loss": -25.942533493041992, "global_step": 327239, "epoch": 3942} {"train_loss": -25.933542251586914, "global_step": 327240, "epoch": 3942} {"train_loss": -26.061370849609375, "global_step": 327241, "epoch": 3942} {"train_loss": -26.098896026611328, "global_step": 327242, "epoch": 3942} {"train_loss": -26.385740280151367, "global_step": 327243, "epoch": 3942} {"train_loss": -26.144229888916016, "global_step": 327244, "epoch": 3942} {"train_loss": -26.125171661376953, "global_step": 327245, "epoch": 3942} {"train_loss": -26.040014266967773, "global_step": 327246, "epoch": 3942} {"train_loss": -25.878896713256836, "global_step": 327247, "epoch": 3942} {"train_loss": -25.941259384155273, "global_step": 327248, "epoch": 3942} {"train_loss": -25.726205825805664, "global_step": 327249, "epoch": 3942} {"train_loss": -25.823211669921875, "global_step": 327250, "epoch": 3942} {"train_loss": -26.158451080322266, "global_step": 327251, "epoch": 3942} {"train_loss": -25.65947914123535, "global_step": 327252, "epoch": 3942} {"train_loss": -25.507360458374023, "global_step": 327253, "epoch": 3942} {"train_loss": -25.969013214111328, "global_step": 327254, "epoch": 3942} {"train_loss": -26.02362060546875, "global_step": 327255, "epoch": 3942} {"train_loss": -26.065784454345703, "global_step": 327256, "epoch": 3942} {"train_loss": -26.04485511779785, "global_step": 327257, "epoch": 3942} {"train_loss": -26.142126083374023, "global_step": 327258, "epoch": 3942} {"train_loss": -26.144317626953125, "global_step": 327259, "epoch": 3942} {"train_loss": -25.87916374206543, "global_step": 327260, "epoch": 3942} {"train_loss": -25.968652725219727, "global_step": 327261, "epoch": 3942} {"train_loss": -25.970380783081055, "global_step": 327262, "epoch": 3942} {"train_loss": -26.48894691467285, "global_step": 327263, "epoch": 3942} {"train_loss": -26.094043731689453, "global_step": 327264, "epoch": 3942} {"train_loss": -26.07822608947754, "global_step": 327265, "epoch": 3942} {"train_loss": -25.8643798828125, "global_step": 327266, "epoch": 3942} {"train_loss": -26.321821212768555, "global_step": 327267, "epoch": 3942} {"train_loss": -25.8219126046422, "global_step": 327268, "epoch": 3942, "val_loss": 7110353.0} {"train_loss": -24.503507614135742, "global_step": 327269, "epoch": 3943} {"train_loss": -24.22048568725586, "global_step": 327270, "epoch": 3943} {"train_loss": -24.735254287719727, "global_step": 327271, "epoch": 3943} {"train_loss": -25.747594833374023, "global_step": 327272, "epoch": 3943} {"train_loss": -24.583158493041992, "global_step": 327273, "epoch": 3943} {"train_loss": -25.147512435913086, "global_step": 327274, "epoch": 3943} {"train_loss": -25.301742553710938, "global_step": 327275, "epoch": 3943} {"train_loss": -25.030963897705078, "global_step": 327276, "epoch": 3943} {"train_loss": -25.1939640045166, "global_step": 327277, "epoch": 3943} {"train_loss": -25.313129425048828, "global_step": 327278, "epoch": 3943} {"train_loss": -24.898712158203125, "global_step": 327279, "epoch": 3943} {"train_loss": -25.407751083374023, "global_step": 327280, "epoch": 3943} {"train_loss": -25.321046829223633, "global_step": 327281, "epoch": 3943} {"train_loss": -25.023916244506836, "global_step": 327282, "epoch": 3943} {"train_loss": -25.499887466430664, "global_step": 327283, "epoch": 3943} {"train_loss": -25.010955810546875, "global_step": 327284, "epoch": 3943} {"train_loss": -25.48064422607422, "global_step": 327285, "epoch": 3943} {"train_loss": -25.954620361328125, "global_step": 327286, "epoch": 3943} {"train_loss": -25.94736671447754, "global_step": 327287, "epoch": 3943} {"train_loss": -25.365201950073242, "global_step": 327288, "epoch": 3943} {"train_loss": -25.544570922851562, "global_step": 327289, "epoch": 3943} {"train_loss": -25.672199249267578, "global_step": 327290, "epoch": 3943} {"train_loss": -25.795629501342773, "global_step": 327291, "epoch": 3943} {"train_loss": -25.467296600341797, "global_step": 327292, "epoch": 3943} {"train_loss": -25.826379776000977, "global_step": 327293, "epoch": 3943} {"train_loss": -25.669830322265625, "global_step": 327294, "epoch": 3943} {"train_loss": -26.04279136657715, "global_step": 327295, "epoch": 3943} {"train_loss": -26.19460105895996, "global_step": 327296, "epoch": 3943} {"train_loss": -26.072431564331055, "global_step": 327297, "epoch": 3943} {"train_loss": -26.09580421447754, "global_step": 327298, "epoch": 3943} {"train_loss": -26.150409698486328, "global_step": 327299, "epoch": 3943} {"train_loss": -25.627614974975586, "global_step": 327300, "epoch": 3943} {"train_loss": -25.932418823242188, "global_step": 327301, "epoch": 3943} {"train_loss": -26.124540328979492, "global_step": 327302, "epoch": 3943} {"train_loss": -25.9691219329834, "global_step": 327303, "epoch": 3943} {"train_loss": -26.16767692565918, "global_step": 327304, "epoch": 3943} {"train_loss": -25.75349998474121, "global_step": 327305, "epoch": 3943} {"train_loss": -26.13579750061035, "global_step": 327306, "epoch": 3943} {"train_loss": -26.08626365661621, "global_step": 327307, "epoch": 3943} {"train_loss": -26.0302734375, "global_step": 327308, "epoch": 3943} {"train_loss": -26.381128311157227, "global_step": 327309, "epoch": 3943} {"train_loss": -26.022619247436523, "global_step": 327310, "epoch": 3943} {"train_loss": -26.10577392578125, "global_step": 327311, "epoch": 3943} {"train_loss": -25.9172420501709, "global_step": 327312, "epoch": 3943} {"train_loss": -26.264606475830078, "global_step": 327313, "epoch": 3943} {"train_loss": -26.24945640563965, "global_step": 327314, "epoch": 3943} {"train_loss": -26.024282455444336, "global_step": 327315, "epoch": 3943} {"train_loss": -26.32411003112793, "global_step": 327316, "epoch": 3943} {"train_loss": -25.985610961914062, "global_step": 327317, "epoch": 3943} {"train_loss": -25.98042869567871, "global_step": 327318, "epoch": 3943} {"train_loss": -26.31427574157715, "global_step": 327319, "epoch": 3943} {"train_loss": -26.32095718383789, "global_step": 327320, "epoch": 3943} {"train_loss": -25.722436904907227, "global_step": 327321, "epoch": 3943} {"train_loss": -26.106470108032227, "global_step": 327322, "epoch": 3943} {"train_loss": -26.03156089782715, "global_step": 327323, "epoch": 3943} {"train_loss": -26.056180953979492, "global_step": 327324, "epoch": 3943} {"train_loss": -25.79549217224121, "global_step": 327325, "epoch": 3943} {"train_loss": -26.18682289123535, "global_step": 327326, "epoch": 3943} {"train_loss": -25.71551513671875, "global_step": 327327, "epoch": 3943} {"train_loss": -25.670988082885742, "global_step": 327328, "epoch": 3943} {"train_loss": -26.098169326782227, "global_step": 327329, "epoch": 3943} {"train_loss": -26.144845962524414, "global_step": 327330, "epoch": 3943} {"train_loss": -26.040449142456055, "global_step": 327331, "epoch": 3943} {"train_loss": -26.187292098999023, "global_step": 327332, "epoch": 3943} {"train_loss": -25.903451919555664, "global_step": 327333, "epoch": 3943} {"train_loss": -26.107254028320312, "global_step": 327334, "epoch": 3943} {"train_loss": -25.98258399963379, "global_step": 327335, "epoch": 3943} {"train_loss": -26.052045822143555, "global_step": 327336, "epoch": 3943} {"train_loss": -25.779159545898438, "global_step": 327337, "epoch": 3943} {"train_loss": -25.4892578125, "global_step": 327338, "epoch": 3943} {"train_loss": -25.254817962646484, "global_step": 327339, "epoch": 3943} {"train_loss": -24.86515998840332, "global_step": 327340, "epoch": 3943} {"train_loss": -24.767614364624023, "global_step": 327341, "epoch": 3943} {"train_loss": -25.822431564331055, "global_step": 327342, "epoch": 3943} {"train_loss": -25.596593856811523, "global_step": 327343, "epoch": 3943} {"train_loss": -25.0167236328125, "global_step": 327344, "epoch": 3943} {"train_loss": -25.592069625854492, "global_step": 327345, "epoch": 3943} {"train_loss": -25.28672981262207, "global_step": 327346, "epoch": 3943} {"train_loss": -25.63418960571289, "global_step": 327347, "epoch": 3943} {"train_loss": -25.69877052307129, "global_step": 327348, "epoch": 3943} {"train_loss": -25.536096572875977, "global_step": 327349, "epoch": 3943} {"train_loss": -25.446151733398438, "global_step": 327350, "epoch": 3943} {"train_loss": -25.68752481851233, "global_step": 327351, "epoch": 3943, "val_loss": 7250298.0} {"train_loss": -24.06922721862793, "global_step": 327352, "epoch": 3944} {"train_loss": -24.664775848388672, "global_step": 327353, "epoch": 3944} {"train_loss": -25.18708610534668, "global_step": 327354, "epoch": 3944} {"train_loss": -24.351394653320312, "global_step": 327355, "epoch": 3944} {"train_loss": -25.075698852539062, "global_step": 327356, "epoch": 3944} {"train_loss": -24.666522979736328, "global_step": 327357, "epoch": 3944} {"train_loss": -25.04140281677246, "global_step": 327358, "epoch": 3944} {"train_loss": -25.044662475585938, "global_step": 327359, "epoch": 3944} {"train_loss": -24.880401611328125, "global_step": 327360, "epoch": 3944} {"train_loss": -25.04348373413086, "global_step": 327361, "epoch": 3944} {"train_loss": -25.14387321472168, "global_step": 327362, "epoch": 3944} {"train_loss": -24.932586669921875, "global_step": 327363, "epoch": 3944} {"train_loss": -25.204500198364258, "global_step": 327364, "epoch": 3944} {"train_loss": -25.204267501831055, "global_step": 327365, "epoch": 3944} {"train_loss": -25.18743896484375, "global_step": 327366, "epoch": 3944} {"train_loss": -25.258695602416992, "global_step": 327367, "epoch": 3944} {"train_loss": -25.22450065612793, "global_step": 327368, "epoch": 3944} {"train_loss": -24.9722843170166, "global_step": 327369, "epoch": 3944} {"train_loss": -25.26863670349121, "global_step": 327370, "epoch": 3944} {"train_loss": -25.1802978515625, "global_step": 327371, "epoch": 3944} {"train_loss": -25.655038833618164, "global_step": 327372, "epoch": 3944} {"train_loss": -25.130918502807617, "global_step": 327373, "epoch": 3944} {"train_loss": -25.21428871154785, "global_step": 327374, "epoch": 3944} {"train_loss": -25.475833892822266, "global_step": 327375, "epoch": 3944} {"train_loss": -25.34627342224121, "global_step": 327376, "epoch": 3944} {"train_loss": -25.498620986938477, "global_step": 327377, "epoch": 3944} {"train_loss": -25.779356002807617, "global_step": 327378, "epoch": 3944} {"train_loss": -25.637714385986328, "global_step": 327379, "epoch": 3944} {"train_loss": -25.63435173034668, "global_step": 327380, "epoch": 3944} {"train_loss": -25.640100479125977, "global_step": 327381, "epoch": 3944} {"train_loss": -25.02610969543457, "global_step": 327382, "epoch": 3944} {"train_loss": -26.28851318359375, "global_step": 327383, "epoch": 3944} {"train_loss": -26.0322208404541, "global_step": 327384, "epoch": 3944} {"train_loss": -25.843555450439453, "global_step": 327385, "epoch": 3944} {"train_loss": -25.61146354675293, "global_step": 327386, "epoch": 3944} {"train_loss": -25.37552833557129, "global_step": 327387, "epoch": 3944} {"train_loss": -26.02924156188965, "global_step": 327388, "epoch": 3944} {"train_loss": -25.65386962890625, "global_step": 327389, "epoch": 3944} {"train_loss": -25.9754581451416, "global_step": 327390, "epoch": 3944} {"train_loss": -25.912824630737305, "global_step": 327391, "epoch": 3944} {"train_loss": -26.0318546295166, "global_step": 327392, "epoch": 3944} {"train_loss": -25.65939712524414, "global_step": 327393, "epoch": 3944} {"train_loss": -25.88496208190918, "global_step": 327394, "epoch": 3944} {"train_loss": -25.849573135375977, "global_step": 327395, "epoch": 3944} {"train_loss": -26.21063232421875, "global_step": 327396, "epoch": 3944} {"train_loss": -26.2169246673584, "global_step": 327397, "epoch": 3944} {"train_loss": -25.853906631469727, "global_step": 327398, "epoch": 3944} {"train_loss": -26.09649085998535, "global_step": 327399, "epoch": 3944} {"train_loss": -26.23500633239746, "global_step": 327400, "epoch": 3944} {"train_loss": -25.887720108032227, "global_step": 327401, "epoch": 3944} {"train_loss": -25.81728172302246, "global_step": 327402, "epoch": 3944} {"train_loss": -25.786542892456055, "global_step": 327403, "epoch": 3944} {"train_loss": -26.47943687438965, "global_step": 327404, "epoch": 3944} {"train_loss": -25.874469757080078, "global_step": 327405, "epoch": 3944} {"train_loss": -26.250585556030273, "global_step": 327406, "epoch": 3944} {"train_loss": -25.726062774658203, "global_step": 327407, "epoch": 3944} {"train_loss": -26.172107696533203, "global_step": 327408, "epoch": 3944} {"train_loss": -26.090478897094727, "global_step": 327409, "epoch": 3944} {"train_loss": -26.04229736328125, "global_step": 327410, "epoch": 3944} {"train_loss": -25.875137329101562, "global_step": 327411, "epoch": 3944} {"train_loss": -25.745630264282227, "global_step": 327412, "epoch": 3944} {"train_loss": -26.029077529907227, "global_step": 327413, "epoch": 3944} {"train_loss": -25.83024024963379, "global_step": 327414, "epoch": 3944} {"train_loss": -26.0587158203125, "global_step": 327415, "epoch": 3944} {"train_loss": -26.111886978149414, "global_step": 327416, "epoch": 3944} {"train_loss": -26.156370162963867, "global_step": 327417, "epoch": 3944} {"train_loss": -26.058948516845703, "global_step": 327418, "epoch": 3944} {"train_loss": -25.99897575378418, "global_step": 327419, "epoch": 3944} {"train_loss": -25.79684829711914, "global_step": 327420, "epoch": 3944} {"train_loss": -26.128707885742188, "global_step": 327421, "epoch": 3944} {"train_loss": -25.97340202331543, "global_step": 327422, "epoch": 3944} {"train_loss": -26.1865234375, "global_step": 327423, "epoch": 3944} {"train_loss": -25.969762802124023, "global_step": 327424, "epoch": 3944} {"train_loss": -26.170978546142578, "global_step": 327425, "epoch": 3944} {"train_loss": -26.113431930541992, "global_step": 327426, "epoch": 3944} {"train_loss": -25.98602867126465, "global_step": 327427, "epoch": 3944} {"train_loss": -26.39483070373535, "global_step": 327428, "epoch": 3944} {"train_loss": -26.386938095092773, "global_step": 327429, "epoch": 3944} {"train_loss": -25.744367599487305, "global_step": 327430, "epoch": 3944} {"train_loss": -26.377857208251953, "global_step": 327431, "epoch": 3944} {"train_loss": -26.094533920288086, "global_step": 327432, "epoch": 3944} {"train_loss": -25.90498161315918, "global_step": 327433, "epoch": 3944} {"train_loss": -25.674025363232715, "global_step": 327434, "epoch": 3944, "val_loss": 7228460.5} {"train_loss": -24.866561889648438, "global_step": 327435, "epoch": 3945} {"train_loss": -24.612051010131836, "global_step": 327436, "epoch": 3945} {"train_loss": -24.85983657836914, "global_step": 327437, "epoch": 3945} {"train_loss": -25.034826278686523, "global_step": 327438, "epoch": 3945} {"train_loss": -25.019527435302734, "global_step": 327439, "epoch": 3945} {"train_loss": -25.027191162109375, "global_step": 327440, "epoch": 3945} {"train_loss": -25.546859741210938, "global_step": 327441, "epoch": 3945} {"train_loss": -25.061437606811523, "global_step": 327442, "epoch": 3945} {"train_loss": -25.32208251953125, "global_step": 327443, "epoch": 3945} {"train_loss": -25.412628173828125, "global_step": 327444, "epoch": 3945} {"train_loss": -25.188621520996094, "global_step": 327445, "epoch": 3945} {"train_loss": -25.5659122467041, "global_step": 327446, "epoch": 3945} {"train_loss": -25.082731246948242, "global_step": 327447, "epoch": 3945} {"train_loss": -25.519285202026367, "global_step": 327448, "epoch": 3945} {"train_loss": -25.6004638671875, "global_step": 327449, "epoch": 3945} {"train_loss": -25.19978141784668, "global_step": 327450, "epoch": 3945} {"train_loss": -25.53512954711914, "global_step": 327451, "epoch": 3945} {"train_loss": -25.56011390686035, "global_step": 327452, "epoch": 3945} {"train_loss": -25.747949600219727, "global_step": 327453, "epoch": 3945} {"train_loss": -25.6114559173584, "global_step": 327454, "epoch": 3945} {"train_loss": -25.547025680541992, "global_step": 327455, "epoch": 3945} {"train_loss": -25.670215606689453, "global_step": 327456, "epoch": 3945} {"train_loss": -25.708328247070312, "global_step": 327457, "epoch": 3945} {"train_loss": -26.043405532836914, "global_step": 327458, "epoch": 3945} {"train_loss": -25.67242431640625, "global_step": 327459, "epoch": 3945} {"train_loss": -25.742435455322266, "global_step": 327460, "epoch": 3945} {"train_loss": -25.99602699279785, "global_step": 327461, "epoch": 3945} {"train_loss": -25.984344482421875, "global_step": 327462, "epoch": 3945} {"train_loss": -26.104963302612305, "global_step": 327463, "epoch": 3945} {"train_loss": -25.546173095703125, "global_step": 327464, "epoch": 3945} {"train_loss": -25.842514038085938, "global_step": 327465, "epoch": 3945} {"train_loss": -25.735456466674805, "global_step": 327466, "epoch": 3945} {"train_loss": -26.21778678894043, "global_step": 327467, "epoch": 3945} {"train_loss": -25.93830680847168, "global_step": 327468, "epoch": 3945} {"train_loss": -25.817291259765625, "global_step": 327469, "epoch": 3945} {"train_loss": -25.863943099975586, "global_step": 327470, "epoch": 3945} {"train_loss": -25.966796875, "global_step": 327471, "epoch": 3945} {"train_loss": -26.394163131713867, "global_step": 327472, "epoch": 3945} {"train_loss": -25.969776153564453, "global_step": 327473, "epoch": 3945} {"train_loss": -26.2402400970459, "global_step": 327474, "epoch": 3945} {"train_loss": -25.604703903198242, "global_step": 327475, "epoch": 3945} {"train_loss": -26.269866943359375, "global_step": 327476, "epoch": 3945} {"train_loss": -26.3049373626709, "global_step": 327477, "epoch": 3945} {"train_loss": -25.803028106689453, "global_step": 327478, "epoch": 3945} {"train_loss": -26.0167236328125, "global_step": 327479, "epoch": 3945} {"train_loss": -26.25287437438965, "global_step": 327480, "epoch": 3945} {"train_loss": -25.954565048217773, "global_step": 327481, "epoch": 3945} {"train_loss": -26.3275203704834, "global_step": 327482, "epoch": 3945} {"train_loss": -26.129907608032227, "global_step": 327483, "epoch": 3945} {"train_loss": -26.000699996948242, "global_step": 327484, "epoch": 3945} {"train_loss": -26.12457275390625, "global_step": 327485, "epoch": 3945} {"train_loss": -25.94049644470215, "global_step": 327486, "epoch": 3945} {"train_loss": -25.99361228942871, "global_step": 327487, "epoch": 3945} {"train_loss": -26.2261905670166, "global_step": 327488, "epoch": 3945} {"train_loss": -26.105274200439453, "global_step": 327489, "epoch": 3945} {"train_loss": -26.141510009765625, "global_step": 327490, "epoch": 3945} {"train_loss": -25.674610137939453, "global_step": 327491, "epoch": 3945} {"train_loss": -25.738758087158203, "global_step": 327492, "epoch": 3945} {"train_loss": -25.985570907592773, "global_step": 327493, "epoch": 3945} {"train_loss": -26.327733993530273, "global_step": 327494, "epoch": 3945} {"train_loss": -26.27974510192871, "global_step": 327495, "epoch": 3945} {"train_loss": -25.712299346923828, "global_step": 327496, "epoch": 3945} {"train_loss": -25.595552444458008, "global_step": 327497, "epoch": 3945} {"train_loss": -26.141071319580078, "global_step": 327498, "epoch": 3945} {"train_loss": -25.803943634033203, "global_step": 327499, "epoch": 3945} {"train_loss": -25.416013717651367, "global_step": 327500, "epoch": 3945} {"train_loss": -25.781904220581055, "global_step": 327501, "epoch": 3945} {"train_loss": -25.69698143005371, "global_step": 327502, "epoch": 3945} {"train_loss": -25.42189598083496, "global_step": 327503, "epoch": 3945} {"train_loss": -26.237319946289062, "global_step": 327504, "epoch": 3945} {"train_loss": -26.12100601196289, "global_step": 327505, "epoch": 3945} {"train_loss": -26.4144287109375, "global_step": 327506, "epoch": 3945} {"train_loss": -25.732763290405273, "global_step": 327507, "epoch": 3945} {"train_loss": -26.12433433532715, "global_step": 327508, "epoch": 3945} {"train_loss": -25.919065475463867, "global_step": 327509, "epoch": 3945} {"train_loss": -25.752704620361328, "global_step": 327510, "epoch": 3945} {"train_loss": -25.9951171875, "global_step": 327511, "epoch": 3945} {"train_loss": -26.14788246154785, "global_step": 327512, "epoch": 3945} {"train_loss": -25.540481567382812, "global_step": 327513, "epoch": 3945} {"train_loss": -25.85909080505371, "global_step": 327514, "epoch": 3945} {"train_loss": -25.906864166259766, "global_step": 327515, "epoch": 3945} {"train_loss": -26.14409828186035, "global_step": 327516, "epoch": 3945} {"train_loss": -25.786453040249377, "global_step": 327517, "epoch": 3945, "val_loss": 7241304.0} {"train_loss": -24.502302169799805, "global_step": 327518, "epoch": 3946} {"train_loss": -24.856571197509766, "global_step": 327519, "epoch": 3946} {"train_loss": -25.56211280822754, "global_step": 327520, "epoch": 3946} {"train_loss": -25.27956199645996, "global_step": 327521, "epoch": 3946} {"train_loss": -25.017398834228516, "global_step": 327522, "epoch": 3946} {"train_loss": -25.397438049316406, "global_step": 327523, "epoch": 3946} {"train_loss": -25.44991683959961, "global_step": 327524, "epoch": 3946} {"train_loss": -25.442243576049805, "global_step": 327525, "epoch": 3946} {"train_loss": -25.584331512451172, "global_step": 327526, "epoch": 3946} {"train_loss": -25.44664764404297, "global_step": 327527, "epoch": 3946} {"train_loss": -25.43880271911621, "global_step": 327528, "epoch": 3946} {"train_loss": -25.544754028320312, "global_step": 327529, "epoch": 3946} {"train_loss": -25.618494033813477, "global_step": 327530, "epoch": 3946} {"train_loss": -25.601703643798828, "global_step": 327531, "epoch": 3946} {"train_loss": -25.664566040039062, "global_step": 327532, "epoch": 3946} {"train_loss": -25.362548828125, "global_step": 327533, "epoch": 3946} {"train_loss": -25.83945083618164, "global_step": 327534, "epoch": 3946} {"train_loss": -25.662601470947266, "global_step": 327535, "epoch": 3946} {"train_loss": -25.765531539916992, "global_step": 327536, "epoch": 3946} {"train_loss": -25.686487197875977, "global_step": 327537, "epoch": 3946} {"train_loss": -26.03667640686035, "global_step": 327538, "epoch": 3946} {"train_loss": -25.58393669128418, "global_step": 327539, "epoch": 3946} {"train_loss": -25.9435977935791, "global_step": 327540, "epoch": 3946} {"train_loss": -25.835187911987305, "global_step": 327541, "epoch": 3946} {"train_loss": -26.213464736938477, "global_step": 327542, "epoch": 3946} {"train_loss": -25.818750381469727, "global_step": 327543, "epoch": 3946} {"train_loss": -25.809553146362305, "global_step": 327544, "epoch": 3946} {"train_loss": -25.840219497680664, "global_step": 327545, "epoch": 3946} {"train_loss": -26.10458755493164, "global_step": 327546, "epoch": 3946} {"train_loss": -26.148651123046875, "global_step": 327547, "epoch": 3946} {"train_loss": -25.810224533081055, "global_step": 327548, "epoch": 3946} {"train_loss": -25.937305450439453, "global_step": 327549, "epoch": 3946} {"train_loss": -26.001684188842773, "global_step": 327550, "epoch": 3946} {"train_loss": -25.695302963256836, "global_step": 327551, "epoch": 3946} {"train_loss": -26.08962059020996, "global_step": 327552, "epoch": 3946} {"train_loss": -25.978071212768555, "global_step": 327553, "epoch": 3946} {"train_loss": -26.324920654296875, "global_step": 327554, "epoch": 3946} {"train_loss": -26.23919105529785, "global_step": 327555, "epoch": 3946} {"train_loss": -26.061803817749023, "global_step": 327556, "epoch": 3946} {"train_loss": -25.949848175048828, "global_step": 327557, "epoch": 3946} {"train_loss": -26.19573402404785, "global_step": 327558, "epoch": 3946} {"train_loss": -25.746692657470703, "global_step": 327559, "epoch": 3946} {"train_loss": -25.93808937072754, "global_step": 327560, "epoch": 3946} {"train_loss": -25.59063720703125, "global_step": 327561, "epoch": 3946} {"train_loss": -25.778583526611328, "global_step": 327562, "epoch": 3946} {"train_loss": -25.442171096801758, "global_step": 327563, "epoch": 3946} {"train_loss": -25.89837074279785, "global_step": 327564, "epoch": 3946} {"train_loss": -25.826297760009766, "global_step": 327565, "epoch": 3946} {"train_loss": -25.93842124938965, "global_step": 327566, "epoch": 3946} {"train_loss": -25.629053115844727, "global_step": 327567, "epoch": 3946} {"train_loss": -25.872766494750977, "global_step": 327568, "epoch": 3946} {"train_loss": -25.921430587768555, "global_step": 327569, "epoch": 3946} {"train_loss": -26.061246871948242, "global_step": 327570, "epoch": 3946} {"train_loss": -26.089731216430664, "global_step": 327571, "epoch": 3946} {"train_loss": -26.046594619750977, "global_step": 327572, "epoch": 3946} {"train_loss": -25.5328426361084, "global_step": 327573, "epoch": 3946} {"train_loss": -25.66346549987793, "global_step": 327574, "epoch": 3946} {"train_loss": -25.981067657470703, "global_step": 327575, "epoch": 3946} {"train_loss": -25.8641414642334, "global_step": 327576, "epoch": 3946} {"train_loss": -26.057966232299805, "global_step": 327577, "epoch": 3946} {"train_loss": -26.15924644470215, "global_step": 327578, "epoch": 3946} {"train_loss": -26.1083984375, "global_step": 327579, "epoch": 3946} {"train_loss": -26.0736083984375, "global_step": 327580, "epoch": 3946} {"train_loss": -25.86163902282715, "global_step": 327581, "epoch": 3946} {"train_loss": -26.08033561706543, "global_step": 327582, "epoch": 3946} {"train_loss": -25.709228515625, "global_step": 327583, "epoch": 3946} {"train_loss": -26.169775009155273, "global_step": 327584, "epoch": 3946} {"train_loss": -26.195846557617188, "global_step": 327585, "epoch": 3946} {"train_loss": -25.70356559753418, "global_step": 327586, "epoch": 3946} {"train_loss": -25.602148056030273, "global_step": 327587, "epoch": 3946} {"train_loss": -26.013525009155273, "global_step": 327588, "epoch": 3946} {"train_loss": -25.980146408081055, "global_step": 327589, "epoch": 3946} {"train_loss": -25.873071670532227, "global_step": 327590, "epoch": 3946} {"train_loss": -26.133533477783203, "global_step": 327591, "epoch": 3946} {"train_loss": -25.89228630065918, "global_step": 327592, "epoch": 3946} {"train_loss": -25.861303329467773, "global_step": 327593, "epoch": 3946} {"train_loss": -25.804615020751953, "global_step": 327594, "epoch": 3946} {"train_loss": -25.817462921142578, "global_step": 327595, "epoch": 3946} {"train_loss": -25.933277130126953, "global_step": 327596, "epoch": 3946} {"train_loss": -25.53388214111328, "global_step": 327597, "epoch": 3946} {"train_loss": -25.691186904907227, "global_step": 327598, "epoch": 3946} {"train_loss": -26.024866104125977, "global_step": 327599, "epoch": 3946} {"train_loss": -25.800348327820558, "global_step": 327600, "epoch": 3946, "val_loss": 7310207.0} {"train_loss": -25.498281478881836, "global_step": 327601, "epoch": 3947} {"train_loss": -24.880970001220703, "global_step": 327602, "epoch": 3947} {"train_loss": -25.391437530517578, "global_step": 327603, "epoch": 3947} {"train_loss": -25.991544723510742, "global_step": 327604, "epoch": 3947} {"train_loss": -25.53673553466797, "global_step": 327605, "epoch": 3947} {"train_loss": -25.382495880126953, "global_step": 327606, "epoch": 3947} {"train_loss": -25.6605224609375, "global_step": 327607, "epoch": 3947} {"train_loss": -25.566736221313477, "global_step": 327608, "epoch": 3947} {"train_loss": -25.899255752563477, "global_step": 327609, "epoch": 3947} {"train_loss": -25.652435302734375, "global_step": 327610, "epoch": 3947} {"train_loss": -25.8563232421875, "global_step": 327611, "epoch": 3947} {"train_loss": -25.47020149230957, "global_step": 327612, "epoch": 3947} {"train_loss": -25.51980972290039, "global_step": 327613, "epoch": 3947} {"train_loss": -25.939802169799805, "global_step": 327614, "epoch": 3947} {"train_loss": -25.425138473510742, "global_step": 327615, "epoch": 3947} {"train_loss": -25.893360137939453, "global_step": 327616, "epoch": 3947} {"train_loss": -26.032079696655273, "global_step": 327617, "epoch": 3947} {"train_loss": -25.9418888092041, "global_step": 327618, "epoch": 3947} {"train_loss": -25.906635284423828, "global_step": 327619, "epoch": 3947} {"train_loss": -25.9160213470459, "global_step": 327620, "epoch": 3947} {"train_loss": -26.274805068969727, "global_step": 327621, "epoch": 3947} {"train_loss": -25.7545108795166, "global_step": 327622, "epoch": 3947} {"train_loss": -25.521081924438477, "global_step": 327623, "epoch": 3947} {"train_loss": -25.617990493774414, "global_step": 327624, "epoch": 3947} {"train_loss": -25.959430694580078, "global_step": 327625, "epoch": 3947} {"train_loss": -25.83835792541504, "global_step": 327626, "epoch": 3947} {"train_loss": -25.798492431640625, "global_step": 327627, "epoch": 3947} {"train_loss": -25.855554580688477, "global_step": 327628, "epoch": 3947} {"train_loss": -25.332298278808594, "global_step": 327629, "epoch": 3947} {"train_loss": -25.96634292602539, "global_step": 327630, "epoch": 3947} {"train_loss": -25.897815704345703, "global_step": 327631, "epoch": 3947} {"train_loss": -25.98670768737793, "global_step": 327632, "epoch": 3947} {"train_loss": -26.201696395874023, "global_step": 327633, "epoch": 3947} {"train_loss": -25.98233413696289, "global_step": 327634, "epoch": 3947} {"train_loss": -25.6037540435791, "global_step": 327635, "epoch": 3947} {"train_loss": -25.931854248046875, "global_step": 327636, "epoch": 3947} {"train_loss": -26.324899673461914, "global_step": 327637, "epoch": 3947} {"train_loss": -26.147348403930664, "global_step": 327638, "epoch": 3947} {"train_loss": -26.37476921081543, "global_step": 327639, "epoch": 3947} {"train_loss": -26.1082763671875, "global_step": 327640, "epoch": 3947} {"train_loss": -26.07984733581543, "global_step": 327641, "epoch": 3947} {"train_loss": -26.16196632385254, "global_step": 327642, "epoch": 3947} {"train_loss": -26.090368270874023, "global_step": 327643, "epoch": 3947} {"train_loss": -25.988468170166016, "global_step": 327644, "epoch": 3947} {"train_loss": -25.986570358276367, "global_step": 327645, "epoch": 3947} {"train_loss": -25.861440658569336, "global_step": 327646, "epoch": 3947} {"train_loss": -26.152008056640625, "global_step": 327647, "epoch": 3947} {"train_loss": -26.397449493408203, "global_step": 327648, "epoch": 3947} {"train_loss": -26.225305557250977, "global_step": 327649, "epoch": 3947} {"train_loss": -26.12615394592285, "global_step": 327650, "epoch": 3947} {"train_loss": -25.70203971862793, "global_step": 327651, "epoch": 3947} {"train_loss": -25.851736068725586, "global_step": 327652, "epoch": 3947} {"train_loss": -25.935636520385742, "global_step": 327653, "epoch": 3947} {"train_loss": -25.813419342041016, "global_step": 327654, "epoch": 3947} {"train_loss": -25.925113677978516, "global_step": 327655, "epoch": 3947} {"train_loss": -25.52842140197754, "global_step": 327656, "epoch": 3947} {"train_loss": -26.194440841674805, "global_step": 327657, "epoch": 3947} {"train_loss": -25.766733169555664, "global_step": 327658, "epoch": 3947} {"train_loss": -25.770048141479492, "global_step": 327659, "epoch": 3947} {"train_loss": -25.978302001953125, "global_step": 327660, "epoch": 3947} {"train_loss": -26.090972900390625, "global_step": 327661, "epoch": 3947} {"train_loss": -26.095447540283203, "global_step": 327662, "epoch": 3947} {"train_loss": -25.853601455688477, "global_step": 327663, "epoch": 3947} {"train_loss": -25.7415714263916, "global_step": 327664, "epoch": 3947} {"train_loss": -25.890460968017578, "global_step": 327665, "epoch": 3947} {"train_loss": -26.010900497436523, "global_step": 327666, "epoch": 3947} {"train_loss": -25.609256744384766, "global_step": 327667, "epoch": 3947} {"train_loss": -25.86675453186035, "global_step": 327668, "epoch": 3947} {"train_loss": -26.335119247436523, "global_step": 327669, "epoch": 3947} {"train_loss": -25.806106567382812, "global_step": 327670, "epoch": 3947} {"train_loss": -25.80377769470215, "global_step": 327671, "epoch": 3947} {"train_loss": -25.99042320251465, "global_step": 327672, "epoch": 3947} {"train_loss": -26.097305297851562, "global_step": 327673, "epoch": 3947} {"train_loss": -25.91086196899414, "global_step": 327674, "epoch": 3947} {"train_loss": -26.002283096313477, "global_step": 327675, "epoch": 3947} {"train_loss": -26.00019645690918, "global_step": 327676, "epoch": 3947} {"train_loss": -25.641565322875977, "global_step": 327677, "epoch": 3947} {"train_loss": -26.0537052154541, "global_step": 327678, "epoch": 3947} {"train_loss": -26.310028076171875, "global_step": 327679, "epoch": 3947} {"train_loss": -25.86639976501465, "global_step": 327680, "epoch": 3947} {"train_loss": -25.986982345581055, "global_step": 327681, "epoch": 3947} {"train_loss": -25.621429443359375, "global_step": 327682, "epoch": 3947} {"train_loss": -25.8864390821342, "global_step": 327683, "epoch": 3947, "val_loss": 7247509.0} {"train_loss": -25.44948387145996, "global_step": 327684, "epoch": 3948} {"train_loss": -25.079866409301758, "global_step": 327685, "epoch": 3948} {"train_loss": -25.940155029296875, "global_step": 327686, "epoch": 3948} {"train_loss": -25.36191177368164, "global_step": 327687, "epoch": 3948} {"train_loss": -25.328351974487305, "global_step": 327688, "epoch": 3948} {"train_loss": -25.48062515258789, "global_step": 327689, "epoch": 3948} {"train_loss": -25.676084518432617, "global_step": 327690, "epoch": 3948} {"train_loss": -25.804025650024414, "global_step": 327691, "epoch": 3948} {"train_loss": -25.840839385986328, "global_step": 327692, "epoch": 3948} {"train_loss": -25.83513832092285, "global_step": 327693, "epoch": 3948} {"train_loss": -26.048200607299805, "global_step": 327694, "epoch": 3948} {"train_loss": -25.417234420776367, "global_step": 327695, "epoch": 3948} {"train_loss": -25.770837783813477, "global_step": 327696, "epoch": 3948} {"train_loss": -25.4735164642334, "global_step": 327697, "epoch": 3948} {"train_loss": -25.71173667907715, "global_step": 327698, "epoch": 3948} {"train_loss": -26.16227149963379, "global_step": 327699, "epoch": 3948} {"train_loss": -25.84089469909668, "global_step": 327700, "epoch": 3948} {"train_loss": -25.856042861938477, "global_step": 327701, "epoch": 3948} {"train_loss": -25.720977783203125, "global_step": 327702, "epoch": 3948} {"train_loss": -26.047840118408203, "global_step": 327703, "epoch": 3948} {"train_loss": -26.009265899658203, "global_step": 327704, "epoch": 3948} {"train_loss": -26.074209213256836, "global_step": 327705, "epoch": 3948} {"train_loss": -25.844934463500977, "global_step": 327706, "epoch": 3948} {"train_loss": -25.82349967956543, "global_step": 327707, "epoch": 3948} {"train_loss": -26.201019287109375, "global_step": 327708, "epoch": 3948} {"train_loss": -25.852705001831055, "global_step": 327709, "epoch": 3948} {"train_loss": -25.99140739440918, "global_step": 327710, "epoch": 3948} {"train_loss": -25.521514892578125, "global_step": 327711, "epoch": 3948} {"train_loss": -26.065332412719727, "global_step": 327712, "epoch": 3948} {"train_loss": -26.109594345092773, "global_step": 327713, "epoch": 3948} {"train_loss": -26.022113800048828, "global_step": 327714, "epoch": 3948} {"train_loss": -26.52186393737793, "global_step": 327715, "epoch": 3948} {"train_loss": -26.08963966369629, "global_step": 327716, "epoch": 3948} {"train_loss": -25.843067169189453, "global_step": 327717, "epoch": 3948} {"train_loss": -26.003620147705078, "global_step": 327718, "epoch": 3948} {"train_loss": -25.832263946533203, "global_step": 327719, "epoch": 3948} {"train_loss": -25.816030502319336, "global_step": 327720, "epoch": 3948} {"train_loss": -26.01972770690918, "global_step": 327721, "epoch": 3948} {"train_loss": -25.972274780273438, "global_step": 327722, "epoch": 3948} {"train_loss": -25.862262725830078, "global_step": 327723, "epoch": 3948} {"train_loss": -26.06451988220215, "global_step": 327724, "epoch": 3948} {"train_loss": -25.833860397338867, "global_step": 327725, "epoch": 3948} {"train_loss": -25.948938369750977, "global_step": 327726, "epoch": 3948} {"train_loss": -25.92331886291504, "global_step": 327727, "epoch": 3948} {"train_loss": -26.219823837280273, "global_step": 327728, "epoch": 3948} {"train_loss": -26.025259017944336, "global_step": 327729, "epoch": 3948} {"train_loss": -25.953393936157227, "global_step": 327730, "epoch": 3948} {"train_loss": -25.80352783203125, "global_step": 327731, "epoch": 3948} {"train_loss": -25.9638729095459, "global_step": 327732, "epoch": 3948} {"train_loss": -26.39845085144043, "global_step": 327733, "epoch": 3948} {"train_loss": -25.86130142211914, "global_step": 327734, "epoch": 3948} {"train_loss": -25.918912887573242, "global_step": 327735, "epoch": 3948} {"train_loss": -26.18482780456543, "global_step": 327736, "epoch": 3948} {"train_loss": -25.310327529907227, "global_step": 327737, "epoch": 3948} {"train_loss": -25.07404899597168, "global_step": 327738, "epoch": 3948} {"train_loss": -25.39829444885254, "global_step": 327739, "epoch": 3948} {"train_loss": -25.593311309814453, "global_step": 327740, "epoch": 3948} {"train_loss": -26.03969383239746, "global_step": 327741, "epoch": 3948} {"train_loss": -25.85297203063965, "global_step": 327742, "epoch": 3948} {"train_loss": -25.494741439819336, "global_step": 327743, "epoch": 3948} {"train_loss": -25.510875701904297, "global_step": 327744, "epoch": 3948} {"train_loss": -25.95254898071289, "global_step": 327745, "epoch": 3948} {"train_loss": -25.629913330078125, "global_step": 327746, "epoch": 3948} {"train_loss": -25.889062881469727, "global_step": 327747, "epoch": 3948} {"train_loss": -25.62344741821289, "global_step": 327748, "epoch": 3948} {"train_loss": -26.10841178894043, "global_step": 327749, "epoch": 3948} {"train_loss": -25.826047897338867, "global_step": 327750, "epoch": 3948} {"train_loss": -25.87407875061035, "global_step": 327751, "epoch": 3948} {"train_loss": -25.883230209350586, "global_step": 327752, "epoch": 3948} {"train_loss": -25.678674697875977, "global_step": 327753, "epoch": 3948} {"train_loss": -25.869098663330078, "global_step": 327754, "epoch": 3948} {"train_loss": -25.995681762695312, "global_step": 327755, "epoch": 3948} {"train_loss": -25.797718048095703, "global_step": 327756, "epoch": 3948} {"train_loss": -25.645572662353516, "global_step": 327757, "epoch": 3948} {"train_loss": -25.9464168548584, "global_step": 327758, "epoch": 3948} {"train_loss": -25.624902725219727, "global_step": 327759, "epoch": 3948} {"train_loss": -26.61895179748535, "global_step": 327760, "epoch": 3948} {"train_loss": -25.697174072265625, "global_step": 327761, "epoch": 3948} {"train_loss": -25.780105590820312, "global_step": 327762, "epoch": 3948} {"train_loss": -25.939294815063477, "global_step": 327763, "epoch": 3948} {"train_loss": -26.117828369140625, "global_step": 327764, "epoch": 3948} {"train_loss": -25.95643424987793, "global_step": 327765, "epoch": 3948} {"train_loss": -25.832824339349585, "global_step": 327766, "epoch": 3948, "val_loss": 7158358.5} {"train_loss": -25.034345626831055, "global_step": 327767, "epoch": 3949} {"train_loss": -25.0191593170166, "global_step": 327768, "epoch": 3949} {"train_loss": -25.3643741607666, "global_step": 327769, "epoch": 3949} {"train_loss": -25.358434677124023, "global_step": 327770, "epoch": 3949} {"train_loss": -25.095552444458008, "global_step": 327771, "epoch": 3949} {"train_loss": -25.778676986694336, "global_step": 327772, "epoch": 3949} {"train_loss": -25.523683547973633, "global_step": 327773, "epoch": 3949} {"train_loss": -25.852924346923828, "global_step": 327774, "epoch": 3949} {"train_loss": -25.488832473754883, "global_step": 327775, "epoch": 3949} {"train_loss": -25.887434005737305, "global_step": 327776, "epoch": 3949} {"train_loss": -25.66401481628418, "global_step": 327777, "epoch": 3949} {"train_loss": -25.571735382080078, "global_step": 327778, "epoch": 3949} {"train_loss": -25.429677963256836, "global_step": 327779, "epoch": 3949} {"train_loss": -26.123291015625, "global_step": 327780, "epoch": 3949} {"train_loss": -26.13865089416504, "global_step": 327781, "epoch": 3949} {"train_loss": -25.600019454956055, "global_step": 327782, "epoch": 3949} {"train_loss": -25.70802879333496, "global_step": 327783, "epoch": 3949} {"train_loss": -25.81394386291504, "global_step": 327784, "epoch": 3949} {"train_loss": -26.033910751342773, "global_step": 327785, "epoch": 3949} {"train_loss": -25.925634384155273, "global_step": 327786, "epoch": 3949} {"train_loss": -25.697568893432617, "global_step": 327787, "epoch": 3949} {"train_loss": -25.824148178100586, "global_step": 327788, "epoch": 3949} {"train_loss": -25.757482528686523, "global_step": 327789, "epoch": 3949} {"train_loss": -25.8065185546875, "global_step": 327790, "epoch": 3949} {"train_loss": -25.757535934448242, "global_step": 327791, "epoch": 3949} {"train_loss": -26.203323364257812, "global_step": 327792, "epoch": 3949} {"train_loss": -25.624942779541016, "global_step": 327793, "epoch": 3949} {"train_loss": -25.887332916259766, "global_step": 327794, "epoch": 3949} {"train_loss": -25.852025985717773, "global_step": 327795, "epoch": 3949} {"train_loss": -25.674213409423828, "global_step": 327796, "epoch": 3949} {"train_loss": -25.7722110748291, "global_step": 327797, "epoch": 3949} {"train_loss": -25.846811294555664, "global_step": 327798, "epoch": 3949} {"train_loss": -26.394418716430664, "global_step": 327799, "epoch": 3949} {"train_loss": -25.936614990234375, "global_step": 327800, "epoch": 3949} {"train_loss": -25.442842483520508, "global_step": 327801, "epoch": 3949} {"train_loss": -25.99860954284668, "global_step": 327802, "epoch": 3949} {"train_loss": -26.018085479736328, "global_step": 327803, "epoch": 3949} {"train_loss": -26.385101318359375, "global_step": 327804, "epoch": 3949} {"train_loss": -25.983020782470703, "global_step": 327805, "epoch": 3949} {"train_loss": -26.179433822631836, "global_step": 327806, "epoch": 3949} {"train_loss": -25.854360580444336, "global_step": 327807, "epoch": 3949} {"train_loss": -26.03900146484375, "global_step": 327808, "epoch": 3949} {"train_loss": -26.007604598999023, "global_step": 327809, "epoch": 3949} {"train_loss": -25.999588012695312, "global_step": 327810, "epoch": 3949} {"train_loss": -26.06910514831543, "global_step": 327811, "epoch": 3949} {"train_loss": -25.770994186401367, "global_step": 327812, "epoch": 3949} {"train_loss": -25.868947982788086, "global_step": 327813, "epoch": 3949} {"train_loss": -26.18683433532715, "global_step": 327814, "epoch": 3949} {"train_loss": -26.21857261657715, "global_step": 327815, "epoch": 3949} {"train_loss": -26.48305320739746, "global_step": 327816, "epoch": 3949} {"train_loss": -26.113672256469727, "global_step": 327817, "epoch": 3949} {"train_loss": -25.77131462097168, "global_step": 327818, "epoch": 3949} {"train_loss": -26.022602081298828, "global_step": 327819, "epoch": 3949} {"train_loss": -25.639389038085938, "global_step": 327820, "epoch": 3949} {"train_loss": -25.628768920898438, "global_step": 327821, "epoch": 3949} {"train_loss": -25.124601364135742, "global_step": 327822, "epoch": 3949} {"train_loss": -25.284835815429688, "global_step": 327823, "epoch": 3949} {"train_loss": -26.3425350189209, "global_step": 327824, "epoch": 3949} {"train_loss": -25.709375381469727, "global_step": 327825, "epoch": 3949} {"train_loss": -26.22785758972168, "global_step": 327826, "epoch": 3949} {"train_loss": -25.484577178955078, "global_step": 327827, "epoch": 3949} {"train_loss": -25.894262313842773, "global_step": 327828, "epoch": 3949} {"train_loss": -25.706823348999023, "global_step": 327829, "epoch": 3949} {"train_loss": -25.40524673461914, "global_step": 327830, "epoch": 3949} {"train_loss": -26.159488677978516, "global_step": 327831, "epoch": 3949} {"train_loss": -25.85626220703125, "global_step": 327832, "epoch": 3949} {"train_loss": -25.92274284362793, "global_step": 327833, "epoch": 3949} {"train_loss": -25.60674476623535, "global_step": 327834, "epoch": 3949} {"train_loss": -25.60706901550293, "global_step": 327835, "epoch": 3949} {"train_loss": -25.44610023498535, "global_step": 327836, "epoch": 3949} {"train_loss": -25.966154098510742, "global_step": 327837, "epoch": 3949} {"train_loss": -25.518095016479492, "global_step": 327838, "epoch": 3949} {"train_loss": -25.44045066833496, "global_step": 327839, "epoch": 3949} {"train_loss": -26.074934005737305, "global_step": 327840, "epoch": 3949} {"train_loss": -26.245141983032227, "global_step": 327841, "epoch": 3949} {"train_loss": -25.702909469604492, "global_step": 327842, "epoch": 3949} {"train_loss": -25.795089721679688, "global_step": 327843, "epoch": 3949} {"train_loss": -25.58564567565918, "global_step": 327844, "epoch": 3949} {"train_loss": -25.6411190032959, "global_step": 327845, "epoch": 3949} {"train_loss": -25.949649810791016, "global_step": 327846, "epoch": 3949} {"train_loss": -26.10873794555664, "global_step": 327847, "epoch": 3949} {"train_loss": -26.00299644470215, "global_step": 327848, "epoch": 3949} {"train_loss": -25.8041269922831, "global_step": 327849, "epoch": 3949, "val_loss": 7255450.5} {"train_loss": -25.634214401245117, "global_step": 327850, "epoch": 3950} {"train_loss": -25.517627716064453, "global_step": 327851, "epoch": 3950} {"train_loss": -25.981420516967773, "global_step": 327852, "epoch": 3950} {"train_loss": -25.220632553100586, "global_step": 327853, "epoch": 3950} {"train_loss": -25.49306297302246, "global_step": 327854, "epoch": 3950} {"train_loss": -25.689212799072266, "global_step": 327855, "epoch": 3950} {"train_loss": -25.5465030670166, "global_step": 327856, "epoch": 3950} {"train_loss": -25.57978630065918, "global_step": 327857, "epoch": 3950} {"train_loss": -25.52803611755371, "global_step": 327858, "epoch": 3950} {"train_loss": -25.899494171142578, "global_step": 327859, "epoch": 3950} {"train_loss": -25.889434814453125, "global_step": 327860, "epoch": 3950} {"train_loss": -25.486913681030273, "global_step": 327861, "epoch": 3950} {"train_loss": -25.62518882751465, "global_step": 327862, "epoch": 3950} {"train_loss": -25.585962295532227, "global_step": 327863, "epoch": 3950} {"train_loss": -25.709630966186523, "global_step": 327864, "epoch": 3950} {"train_loss": -26.181549072265625, "global_step": 327865, "epoch": 3950} {"train_loss": -25.856576919555664, "global_step": 327866, "epoch": 3950} {"train_loss": -25.8814697265625, "global_step": 327867, "epoch": 3950} {"train_loss": -26.140588760375977, "global_step": 327868, "epoch": 3950} {"train_loss": -25.787832260131836, "global_step": 327869, "epoch": 3950} {"train_loss": -26.0322322845459, "global_step": 327870, "epoch": 3950} {"train_loss": -26.202911376953125, "global_step": 327871, "epoch": 3950} {"train_loss": -25.840167999267578, "global_step": 327872, "epoch": 3950} {"train_loss": -26.05341911315918, "global_step": 327873, "epoch": 3950} {"train_loss": -25.816537857055664, "global_step": 327874, "epoch": 3950} {"train_loss": -26.06056785583496, "global_step": 327875, "epoch": 3950} {"train_loss": -25.8604736328125, "global_step": 327876, "epoch": 3950} {"train_loss": -25.755956649780273, "global_step": 327877, "epoch": 3950} {"train_loss": -26.01453971862793, "global_step": 327878, "epoch": 3950} {"train_loss": -25.923269271850586, "global_step": 327879, "epoch": 3950} {"train_loss": -26.104307174682617, "global_step": 327880, "epoch": 3950} {"train_loss": -25.89363670349121, "global_step": 327881, "epoch": 3950} {"train_loss": -25.91212272644043, "global_step": 327882, "epoch": 3950} {"train_loss": -26.169174194335938, "global_step": 327883, "epoch": 3950} {"train_loss": -25.892688751220703, "global_step": 327884, "epoch": 3950} {"train_loss": -26.066007614135742, "global_step": 327885, "epoch": 3950} {"train_loss": -25.98050308227539, "global_step": 327886, "epoch": 3950} {"train_loss": -26.3503475189209, "global_step": 327887, "epoch": 3950} {"train_loss": -25.948379516601562, "global_step": 327888, "epoch": 3950} {"train_loss": -26.090620040893555, "global_step": 327889, "epoch": 3950} {"train_loss": -26.233251571655273, "global_step": 327890, "epoch": 3950} {"train_loss": -25.93994140625, "global_step": 327891, "epoch": 3950} {"train_loss": -26.324249267578125, "global_step": 327892, "epoch": 3950} {"train_loss": -25.858722686767578, "global_step": 327893, "epoch": 3950} {"train_loss": -26.148517608642578, "global_step": 327894, "epoch": 3950} {"train_loss": -25.710432052612305, "global_step": 327895, "epoch": 3950} {"train_loss": -26.251821517944336, "global_step": 327896, "epoch": 3950} {"train_loss": -26.150049209594727, "global_step": 327897, "epoch": 3950} {"train_loss": -26.140188217163086, "global_step": 327898, "epoch": 3950} {"train_loss": -26.32853126525879, "global_step": 327899, "epoch": 3950} {"train_loss": -25.6519832611084, "global_step": 327900, "epoch": 3950} {"train_loss": -26.02187156677246, "global_step": 327901, "epoch": 3950} {"train_loss": -25.76715087890625, "global_step": 327902, "epoch": 3950} {"train_loss": -25.853452682495117, "global_step": 327903, "epoch": 3950} {"train_loss": -26.25664710998535, "global_step": 327904, "epoch": 3950} {"train_loss": -26.25409507751465, "global_step": 327905, "epoch": 3950} {"train_loss": -25.84796142578125, "global_step": 327906, "epoch": 3950} {"train_loss": -26.2220458984375, "global_step": 327907, "epoch": 3950} {"train_loss": -26.401142120361328, "global_step": 327908, "epoch": 3950} {"train_loss": -26.13704490661621, "global_step": 327909, "epoch": 3950} {"train_loss": -25.954381942749023, "global_step": 327910, "epoch": 3950} {"train_loss": -26.02952003479004, "global_step": 327911, "epoch": 3950} {"train_loss": -26.10976219177246, "global_step": 327912, "epoch": 3950} {"train_loss": -25.487627029418945, "global_step": 327913, "epoch": 3950} {"train_loss": -25.703937530517578, "global_step": 327914, "epoch": 3950} {"train_loss": -25.72572135925293, "global_step": 327915, "epoch": 3950} {"train_loss": -25.12948989868164, "global_step": 327916, "epoch": 3950} {"train_loss": -25.381620407104492, "global_step": 327917, "epoch": 3950} {"train_loss": -25.579622268676758, "global_step": 327918, "epoch": 3950} {"train_loss": -25.709821701049805, "global_step": 327919, "epoch": 3950} {"train_loss": -25.982099533081055, "global_step": 327920, "epoch": 3950} {"train_loss": -24.78348159790039, "global_step": 327921, "epoch": 3950} {"train_loss": -25.39201545715332, "global_step": 327922, "epoch": 3950} {"train_loss": -25.81720542907715, "global_step": 327923, "epoch": 3950} {"train_loss": -25.64700698852539, "global_step": 327924, "epoch": 3950} {"train_loss": -25.379743576049805, "global_step": 327925, "epoch": 3950} {"train_loss": -25.45590591430664, "global_step": 327926, "epoch": 3950} {"train_loss": -25.302709579467773, "global_step": 327927, "epoch": 3950} {"train_loss": -25.655029296875, "global_step": 327928, "epoch": 3950} {"train_loss": -25.61090660095215, "global_step": 327929, "epoch": 3950} {"train_loss": -25.64246940612793, "global_step": 327930, "epoch": 3950} {"train_loss": -25.815107345581055, "global_step": 327931, "epoch": 3950} {"train_loss": -25.829618591860115, "global_step": 327932, "epoch": 3950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 7311591.5} {"train_loss": -25.020904541015625, "global_step": 327933, "epoch": 3951} {"train_loss": -25.58506202697754, "global_step": 327934, "epoch": 3951} {"train_loss": -24.704214096069336, "global_step": 327935, "epoch": 3951} {"train_loss": -25.443546295166016, "global_step": 327936, "epoch": 3951} {"train_loss": -25.237157821655273, "global_step": 327937, "epoch": 3951} {"train_loss": -25.417268753051758, "global_step": 327938, "epoch": 3951} {"train_loss": -25.24787712097168, "global_step": 327939, "epoch": 3951} {"train_loss": -24.923852920532227, "global_step": 327940, "epoch": 3951} {"train_loss": -25.097320556640625, "global_step": 327941, "epoch": 3951} {"train_loss": -25.26661491394043, "global_step": 327942, "epoch": 3951} {"train_loss": -25.305908203125, "global_step": 327943, "epoch": 3951} {"train_loss": -25.6883487701416, "global_step": 327944, "epoch": 3951} {"train_loss": -25.50029182434082, "global_step": 327945, "epoch": 3951} {"train_loss": -25.69508171081543, "global_step": 327946, "epoch": 3951} {"train_loss": -25.199310302734375, "global_step": 327947, "epoch": 3951} {"train_loss": -25.723712921142578, "global_step": 327948, "epoch": 3951} {"train_loss": -25.617420196533203, "global_step": 327949, "epoch": 3951} {"train_loss": -25.7409610748291, "global_step": 327950, "epoch": 3951} {"train_loss": -25.72747802734375, "global_step": 327951, "epoch": 3951} {"train_loss": -25.651273727416992, "global_step": 327952, "epoch": 3951} {"train_loss": -25.55974769592285, "global_step": 327953, "epoch": 3951} {"train_loss": -25.276823043823242, "global_step": 327954, "epoch": 3951} {"train_loss": -26.027685165405273, "global_step": 327955, "epoch": 3951} {"train_loss": -25.656301498413086, "global_step": 327956, "epoch": 3951} {"train_loss": -25.922042846679688, "global_step": 327957, "epoch": 3951} {"train_loss": -25.93798828125, "global_step": 327958, "epoch": 3951} {"train_loss": -25.546903610229492, "global_step": 327959, "epoch": 3951} {"train_loss": -25.93924331665039, "global_step": 327960, "epoch": 3951} {"train_loss": -25.62861442565918, "global_step": 327961, "epoch": 3951} {"train_loss": -26.035968780517578, "global_step": 327962, "epoch": 3951} {"train_loss": -26.03851318359375, "global_step": 327963, "epoch": 3951} {"train_loss": -25.844837188720703, "global_step": 327964, "epoch": 3951} {"train_loss": -25.82442283630371, "global_step": 327965, "epoch": 3951} {"train_loss": -25.785663604736328, "global_step": 327966, "epoch": 3951} {"train_loss": -25.8474178314209, "global_step": 327967, "epoch": 3951} {"train_loss": -26.252792358398438, "global_step": 327968, "epoch": 3951} {"train_loss": -26.0699520111084, "global_step": 327969, "epoch": 3951} {"train_loss": -26.216318130493164, "global_step": 327970, "epoch": 3951} {"train_loss": -25.628049850463867, "global_step": 327971, "epoch": 3951} {"train_loss": -26.066930770874023, "global_step": 327972, "epoch": 3951} {"train_loss": -26.296377182006836, "global_step": 327973, "epoch": 3951} {"train_loss": -26.05156898498535, "global_step": 327974, "epoch": 3951} {"train_loss": -26.2529239654541, "global_step": 327975, "epoch": 3951} {"train_loss": -25.989227294921875, "global_step": 327976, "epoch": 3951} {"train_loss": -25.823022842407227, "global_step": 327977, "epoch": 3951} {"train_loss": -26.233596801757812, "global_step": 327978, "epoch": 3951} {"train_loss": -26.153003692626953, "global_step": 327979, "epoch": 3951} {"train_loss": -26.01490592956543, "global_step": 327980, "epoch": 3951} {"train_loss": -25.990331649780273, "global_step": 327981, "epoch": 3951} {"train_loss": -26.258886337280273, "global_step": 327982, "epoch": 3951} {"train_loss": -26.04501724243164, "global_step": 327983, "epoch": 3951} {"train_loss": -26.01775550842285, "global_step": 327984, "epoch": 3951} {"train_loss": -26.082080841064453, "global_step": 327985, "epoch": 3951} {"train_loss": -25.990890502929688, "global_step": 327986, "epoch": 3951} {"train_loss": -25.68007469177246, "global_step": 327987, "epoch": 3951} {"train_loss": -26.026838302612305, "global_step": 327988, "epoch": 3951} {"train_loss": -26.022138595581055, "global_step": 327989, "epoch": 3951} {"train_loss": -25.81146812438965, "global_step": 327990, "epoch": 3951} {"train_loss": -25.950702667236328, "global_step": 327991, "epoch": 3951} {"train_loss": -26.081811904907227, "global_step": 327992, "epoch": 3951} {"train_loss": -26.24757194519043, "global_step": 327993, "epoch": 3951} {"train_loss": -25.795978546142578, "global_step": 327994, "epoch": 3951} {"train_loss": -26.330951690673828, "global_step": 327995, "epoch": 3951} {"train_loss": -25.99065589904785, "global_step": 327996, "epoch": 3951} {"train_loss": -26.142566680908203, "global_step": 327997, "epoch": 3951} {"train_loss": -25.834028244018555, "global_step": 327998, "epoch": 3951} {"train_loss": -26.012983322143555, "global_step": 327999, "epoch": 3951} {"train_loss": -25.701852798461914, "global_step": 328000, "epoch": 3951} {"train_loss": -25.912343978881836, "global_step": 328001, "epoch": 3951} {"train_loss": -25.969573974609375, "global_step": 328002, "epoch": 3951} {"train_loss": -25.143234252929688, "global_step": 328003, "epoch": 3951} {"train_loss": -25.686574935913086, "global_step": 328004, "epoch": 3951} {"train_loss": -25.783666610717773, "global_step": 328005, "epoch": 3951} {"train_loss": -25.627471923828125, "global_step": 328006, "epoch": 3951} {"train_loss": -25.43886947631836, "global_step": 328007, "epoch": 3951} {"train_loss": -26.199121475219727, "global_step": 328008, "epoch": 3951} {"train_loss": -26.09378433227539, "global_step": 328009, "epoch": 3951} {"train_loss": -26.0664119720459, "global_step": 328010, "epoch": 3951} {"train_loss": -25.762556076049805, "global_step": 328011, "epoch": 3951} {"train_loss": -25.960824966430664, "global_step": 328012, "epoch": 3951} {"train_loss": -25.73377799987793, "global_step": 328013, "epoch": 3951} {"train_loss": -25.738006591796875, "global_step": 328014, "epoch": 3951} {"train_loss": -25.786937529782215, "global_step": 328015, "epoch": 3951, "val_loss": 7258595.0} {"train_loss": -25.547056198120117, "global_step": 328016, "epoch": 3952} {"train_loss": -25.379377365112305, "global_step": 328017, "epoch": 3952} {"train_loss": -25.75884437561035, "global_step": 328018, "epoch": 3952} {"train_loss": -25.23246192932129, "global_step": 328019, "epoch": 3952} {"train_loss": -25.320219039916992, "global_step": 328020, "epoch": 3952} {"train_loss": -25.78388023376465, "global_step": 328021, "epoch": 3952} {"train_loss": -25.569303512573242, "global_step": 328022, "epoch": 3952} {"train_loss": -25.60028648376465, "global_step": 328023, "epoch": 3952} {"train_loss": -25.691577911376953, "global_step": 328024, "epoch": 3952} {"train_loss": -25.717992782592773, "global_step": 328025, "epoch": 3952} {"train_loss": -25.77167320251465, "global_step": 328026, "epoch": 3952} {"train_loss": -25.854904174804688, "global_step": 328027, "epoch": 3952} {"train_loss": -25.88657569885254, "global_step": 328028, "epoch": 3952} {"train_loss": -25.52327537536621, "global_step": 328029, "epoch": 3952} {"train_loss": -25.782669067382812, "global_step": 328030, "epoch": 3952} {"train_loss": -25.726165771484375, "global_step": 328031, "epoch": 3952} {"train_loss": -25.84442138671875, "global_step": 328032, "epoch": 3952} {"train_loss": -25.782922744750977, "global_step": 328033, "epoch": 3952} {"train_loss": -26.145246505737305, "global_step": 328034, "epoch": 3952} {"train_loss": -25.681547164916992, "global_step": 328035, "epoch": 3952} {"train_loss": -26.11575698852539, "global_step": 328036, "epoch": 3952} {"train_loss": -25.804712295532227, "global_step": 328037, "epoch": 3952} {"train_loss": -25.957687377929688, "global_step": 328038, "epoch": 3952} {"train_loss": -25.581892013549805, "global_step": 328039, "epoch": 3952} {"train_loss": -25.493276596069336, "global_step": 328040, "epoch": 3952} {"train_loss": -25.919300079345703, "global_step": 328041, "epoch": 3952} {"train_loss": -26.18076515197754, "global_step": 328042, "epoch": 3952} {"train_loss": -25.583343505859375, "global_step": 328043, "epoch": 3952} {"train_loss": -26.06708335876465, "global_step": 328044, "epoch": 3952} {"train_loss": -25.821054458618164, "global_step": 328045, "epoch": 3952} {"train_loss": -25.854589462280273, "global_step": 328046, "epoch": 3952} {"train_loss": -25.56806755065918, "global_step": 328047, "epoch": 3952} {"train_loss": -25.686664581298828, "global_step": 328048, "epoch": 3952} {"train_loss": -25.8118953704834, "global_step": 328049, "epoch": 3952} {"train_loss": -25.978961944580078, "global_step": 328050, "epoch": 3952} {"train_loss": -25.746652603149414, "global_step": 328051, "epoch": 3952} {"train_loss": -25.7430362701416, "global_step": 328052, "epoch": 3952} {"train_loss": -25.815872192382812, "global_step": 328053, "epoch": 3952} {"train_loss": -26.13970375061035, "global_step": 328054, "epoch": 3952} {"train_loss": -26.075408935546875, "global_step": 328055, "epoch": 3952} {"train_loss": -26.2381591796875, "global_step": 328056, "epoch": 3952} {"train_loss": -25.98650550842285, "global_step": 328057, "epoch": 3952} {"train_loss": -26.080718994140625, "global_step": 328058, "epoch": 3952} {"train_loss": -25.79703140258789, "global_step": 328059, "epoch": 3952} {"train_loss": -26.041671752929688, "global_step": 328060, "epoch": 3952} {"train_loss": -25.7999210357666, "global_step": 328061, "epoch": 3952} {"train_loss": -26.065092086791992, "global_step": 328062, "epoch": 3952} {"train_loss": -26.045019149780273, "global_step": 328063, "epoch": 3952} {"train_loss": -25.87447166442871, "global_step": 328064, "epoch": 3952} {"train_loss": -26.02777099609375, "global_step": 328065, "epoch": 3952} {"train_loss": -26.119800567626953, "global_step": 328066, "epoch": 3952} {"train_loss": -25.880603790283203, "global_step": 328067, "epoch": 3952} {"train_loss": -25.521099090576172, "global_step": 328068, "epoch": 3952} {"train_loss": -25.810871124267578, "global_step": 328069, "epoch": 3952} {"train_loss": -26.034299850463867, "global_step": 328070, "epoch": 3952} {"train_loss": -26.19677734375, "global_step": 328071, "epoch": 3952} {"train_loss": -26.40875244140625, "global_step": 328072, "epoch": 3952} {"train_loss": -26.002429962158203, "global_step": 328073, "epoch": 3952} {"train_loss": -26.14045524597168, "global_step": 328074, "epoch": 3952} {"train_loss": -25.900808334350586, "global_step": 328075, "epoch": 3952} {"train_loss": -26.24237060546875, "global_step": 328076, "epoch": 3952} {"train_loss": -26.180814743041992, "global_step": 328077, "epoch": 3952} {"train_loss": -25.863956451416016, "global_step": 328078, "epoch": 3952} {"train_loss": -25.797513961791992, "global_step": 328079, "epoch": 3952} {"train_loss": -26.08101463317871, "global_step": 328080, "epoch": 3952} {"train_loss": -25.96516227722168, "global_step": 328081, "epoch": 3952} {"train_loss": -25.81610679626465, "global_step": 328082, "epoch": 3952} {"train_loss": -26.327238082885742, "global_step": 328083, "epoch": 3952} {"train_loss": -25.987821578979492, "global_step": 328084, "epoch": 3952} {"train_loss": -26.281375885009766, "global_step": 328085, "epoch": 3952} {"train_loss": -26.187225341796875, "global_step": 328086, "epoch": 3952} {"train_loss": -26.124963760375977, "global_step": 328087, "epoch": 3952} {"train_loss": -26.1740665435791, "global_step": 328088, "epoch": 3952} {"train_loss": -25.6688175201416, "global_step": 328089, "epoch": 3952} {"train_loss": -25.836828231811523, "global_step": 328090, "epoch": 3952} {"train_loss": -25.632770538330078, "global_step": 328091, "epoch": 3952} {"train_loss": -25.61372184753418, "global_step": 328092, "epoch": 3952} {"train_loss": -25.78826904296875, "global_step": 328093, "epoch": 3952} {"train_loss": -25.7384033203125, "global_step": 328094, "epoch": 3952} {"train_loss": -25.6788387298584, "global_step": 328095, "epoch": 3952} {"train_loss": -25.83660888671875, "global_step": 328096, "epoch": 3952} {"train_loss": -25.940338134765625, "global_step": 328097, "epoch": 3952} {"train_loss": -25.87796732891037, "global_step": 328098, "epoch": 3952, "val_loss": 7176110.0} {"train_loss": -23.74688720703125, "global_step": 328099, "epoch": 3953} {"train_loss": -23.720151901245117, "global_step": 328100, "epoch": 3953} {"train_loss": -24.77192497253418, "global_step": 328101, "epoch": 3953} {"train_loss": -24.895055770874023, "global_step": 328102, "epoch": 3953} {"train_loss": -24.19449234008789, "global_step": 328103, "epoch": 3953} {"train_loss": -25.249385833740234, "global_step": 328104, "epoch": 3953} {"train_loss": -24.989728927612305, "global_step": 328105, "epoch": 3953} {"train_loss": -24.37281036376953, "global_step": 328106, "epoch": 3953} {"train_loss": -25.231101989746094, "global_step": 328107, "epoch": 3953} {"train_loss": -24.763721466064453, "global_step": 328108, "epoch": 3953} {"train_loss": -25.4680118560791, "global_step": 328109, "epoch": 3953} {"train_loss": -25.17628288269043, "global_step": 328110, "epoch": 3953} {"train_loss": -25.218276977539062, "global_step": 328111, "epoch": 3953} {"train_loss": -25.043411254882812, "global_step": 328112, "epoch": 3953} {"train_loss": -24.998071670532227, "global_step": 328113, "epoch": 3953} {"train_loss": -25.3996639251709, "global_step": 328114, "epoch": 3953} {"train_loss": -25.370595932006836, "global_step": 328115, "epoch": 3953} {"train_loss": -25.420318603515625, "global_step": 328116, "epoch": 3953} {"train_loss": -25.353811264038086, "global_step": 328117, "epoch": 3953} {"train_loss": -25.283353805541992, "global_step": 328118, "epoch": 3953} {"train_loss": -25.62578773498535, "global_step": 328119, "epoch": 3953} {"train_loss": -25.520549774169922, "global_step": 328120, "epoch": 3953} {"train_loss": -25.443748474121094, "global_step": 328121, "epoch": 3953} {"train_loss": -25.392786026000977, "global_step": 328122, "epoch": 3953} {"train_loss": -25.63852882385254, "global_step": 328123, "epoch": 3953} {"train_loss": -25.435155868530273, "global_step": 328124, "epoch": 3953} {"train_loss": -25.377431869506836, "global_step": 328125, "epoch": 3953} {"train_loss": -25.815122604370117, "global_step": 328126, "epoch": 3953} {"train_loss": -25.512413024902344, "global_step": 328127, "epoch": 3953} {"train_loss": -25.727447509765625, "global_step": 328128, "epoch": 3953} {"train_loss": -25.893030166625977, "global_step": 328129, "epoch": 3953} {"train_loss": -25.940683364868164, "global_step": 328130, "epoch": 3953} {"train_loss": -25.48905372619629, "global_step": 328131, "epoch": 3953} {"train_loss": -26.1506290435791, "global_step": 328132, "epoch": 3953} {"train_loss": -25.769697189331055, "global_step": 328133, "epoch": 3953} {"train_loss": -25.6892147064209, "global_step": 328134, "epoch": 3953} {"train_loss": -25.887969970703125, "global_step": 328135, "epoch": 3953} {"train_loss": -25.56866455078125, "global_step": 328136, "epoch": 3953} {"train_loss": -25.481748580932617, "global_step": 328137, "epoch": 3953} {"train_loss": -26.235992431640625, "global_step": 328138, "epoch": 3953} {"train_loss": -25.676679611206055, "global_step": 328139, "epoch": 3953} {"train_loss": -26.09076499938965, "global_step": 328140, "epoch": 3953} {"train_loss": -26.044321060180664, "global_step": 328141, "epoch": 3953} {"train_loss": -25.978979110717773, "global_step": 328142, "epoch": 3953} {"train_loss": -25.969318389892578, "global_step": 328143, "epoch": 3953} {"train_loss": -26.08041763305664, "global_step": 328144, "epoch": 3953} {"train_loss": -26.278717041015625, "global_step": 328145, "epoch": 3953} {"train_loss": -26.191375732421875, "global_step": 328146, "epoch": 3953} {"train_loss": -25.95692253112793, "global_step": 328147, "epoch": 3953} {"train_loss": -25.831012725830078, "global_step": 328148, "epoch": 3953} {"train_loss": -26.3868408203125, "global_step": 328149, "epoch": 3953} {"train_loss": -26.345245361328125, "global_step": 328150, "epoch": 3953} {"train_loss": -26.13837242126465, "global_step": 328151, "epoch": 3953} {"train_loss": -26.00957679748535, "global_step": 328152, "epoch": 3953} {"train_loss": -26.152578353881836, "global_step": 328153, "epoch": 3953} {"train_loss": -26.06141471862793, "global_step": 328154, "epoch": 3953} {"train_loss": -25.888151168823242, "global_step": 328155, "epoch": 3953} {"train_loss": -25.97877311706543, "global_step": 328156, "epoch": 3953} {"train_loss": -26.188568115234375, "global_step": 328157, "epoch": 3953} {"train_loss": -26.0393009185791, "global_step": 328158, "epoch": 3953} {"train_loss": -25.929767608642578, "global_step": 328159, "epoch": 3953} {"train_loss": -26.14143180847168, "global_step": 328160, "epoch": 3953} {"train_loss": -26.092390060424805, "global_step": 328161, "epoch": 3953} {"train_loss": -26.283552169799805, "global_step": 328162, "epoch": 3953} {"train_loss": -26.118993759155273, "global_step": 328163, "epoch": 3953} {"train_loss": -26.180585861206055, "global_step": 328164, "epoch": 3953} {"train_loss": -26.236005783081055, "global_step": 328165, "epoch": 3953} {"train_loss": -25.780935287475586, "global_step": 328166, "epoch": 3953} {"train_loss": -26.3011474609375, "global_step": 328167, "epoch": 3953} {"train_loss": -25.830472946166992, "global_step": 328168, "epoch": 3953} {"train_loss": -26.133386611938477, "global_step": 328169, "epoch": 3953} {"train_loss": -26.35613441467285, "global_step": 328170, "epoch": 3953} {"train_loss": -26.34830665588379, "global_step": 328171, "epoch": 3953} {"train_loss": -25.83131217956543, "global_step": 328172, "epoch": 3953} {"train_loss": -25.646032333374023, "global_step": 328173, "epoch": 3953} {"train_loss": -26.087621688842773, "global_step": 328174, "epoch": 3953} {"train_loss": -25.88422203063965, "global_step": 328175, "epoch": 3953} {"train_loss": -26.25174903869629, "global_step": 328176, "epoch": 3953} {"train_loss": -25.939895629882812, "global_step": 328177, "epoch": 3953} {"train_loss": -26.127058029174805, "global_step": 328178, "epoch": 3953} {"train_loss": -25.85333251953125, "global_step": 328179, "epoch": 3953} {"train_loss": -25.606861114501953, "global_step": 328180, "epoch": 3953} {"train_loss": -25.676891579685442, "global_step": 328181, "epoch": 3953, "val_loss": 7241519.5} {"train_loss": -25.571985244750977, "global_step": 328182, "epoch": 3954} {"train_loss": -25.042156219482422, "global_step": 328183, "epoch": 3954} {"train_loss": -25.749210357666016, "global_step": 328184, "epoch": 3954} {"train_loss": -25.278779983520508, "global_step": 328185, "epoch": 3954} {"train_loss": -25.9559326171875, "global_step": 328186, "epoch": 3954} {"train_loss": -24.864486694335938, "global_step": 328187, "epoch": 3954} {"train_loss": -25.5045223236084, "global_step": 328188, "epoch": 3954} {"train_loss": -25.633935928344727, "global_step": 328189, "epoch": 3954} {"train_loss": -25.926420211791992, "global_step": 328190, "epoch": 3954} {"train_loss": -25.469690322875977, "global_step": 328191, "epoch": 3954} {"train_loss": -25.814970016479492, "global_step": 328192, "epoch": 3954} {"train_loss": -25.727020263671875, "global_step": 328193, "epoch": 3954} {"train_loss": -25.666549682617188, "global_step": 328194, "epoch": 3954} {"train_loss": -25.81682777404785, "global_step": 328195, "epoch": 3954} {"train_loss": -25.988143920898438, "global_step": 328196, "epoch": 3954} {"train_loss": -26.10609245300293, "global_step": 328197, "epoch": 3954} {"train_loss": -26.03139305114746, "global_step": 328198, "epoch": 3954} {"train_loss": -25.66357421875, "global_step": 328199, "epoch": 3954} {"train_loss": -25.554908752441406, "global_step": 328200, "epoch": 3954} {"train_loss": -25.924209594726562, "global_step": 328201, "epoch": 3954} {"train_loss": -25.838438034057617, "global_step": 328202, "epoch": 3954} {"train_loss": -26.086355209350586, "global_step": 328203, "epoch": 3954} {"train_loss": -25.925750732421875, "global_step": 328204, "epoch": 3954} {"train_loss": -25.94016456604004, "global_step": 328205, "epoch": 3954} {"train_loss": -25.776885986328125, "global_step": 328206, "epoch": 3954} {"train_loss": -26.064950942993164, "global_step": 328207, "epoch": 3954} {"train_loss": -26.046045303344727, "global_step": 328208, "epoch": 3954} {"train_loss": -25.772186279296875, "global_step": 328209, "epoch": 3954} {"train_loss": -25.474632263183594, "global_step": 328210, "epoch": 3954} {"train_loss": -25.821258544921875, "global_step": 328211, "epoch": 3954} {"train_loss": -25.794492721557617, "global_step": 328212, "epoch": 3954} {"train_loss": -26.143817901611328, "global_step": 328213, "epoch": 3954} {"train_loss": -25.84442710876465, "global_step": 328214, "epoch": 3954} {"train_loss": -25.75225257873535, "global_step": 328215, "epoch": 3954} {"train_loss": -26.18549156188965, "global_step": 328216, "epoch": 3954} {"train_loss": -25.9237060546875, "global_step": 328217, "epoch": 3954} {"train_loss": -25.615524291992188, "global_step": 328218, "epoch": 3954} {"train_loss": -26.01165199279785, "global_step": 328219, "epoch": 3954} {"train_loss": -25.868011474609375, "global_step": 328220, "epoch": 3954} {"train_loss": -25.842870712280273, "global_step": 328221, "epoch": 3954} {"train_loss": -25.43086051940918, "global_step": 328222, "epoch": 3954} {"train_loss": -26.022363662719727, "global_step": 328223, "epoch": 3954} {"train_loss": -26.40577507019043, "global_step": 328224, "epoch": 3954} {"train_loss": -25.994043350219727, "global_step": 328225, "epoch": 3954} {"train_loss": -25.36874008178711, "global_step": 328226, "epoch": 3954} {"train_loss": -25.954254150390625, "global_step": 328227, "epoch": 3954} {"train_loss": -26.1806697845459, "global_step": 328228, "epoch": 3954} {"train_loss": -25.759979248046875, "global_step": 328229, "epoch": 3954} {"train_loss": -25.264511108398438, "global_step": 328230, "epoch": 3954} {"train_loss": -25.942413330078125, "global_step": 328231, "epoch": 3954} {"train_loss": -25.887990951538086, "global_step": 328232, "epoch": 3954} {"train_loss": -25.703027725219727, "global_step": 328233, "epoch": 3954} {"train_loss": -25.6656551361084, "global_step": 328234, "epoch": 3954} {"train_loss": -25.70038414001465, "global_step": 328235, "epoch": 3954} {"train_loss": -26.032123565673828, "global_step": 328236, "epoch": 3954} {"train_loss": -25.3131046295166, "global_step": 328237, "epoch": 3954} {"train_loss": -25.346508026123047, "global_step": 328238, "epoch": 3954} {"train_loss": -25.63916015625, "global_step": 328239, "epoch": 3954} {"train_loss": -25.49770736694336, "global_step": 328240, "epoch": 3954} {"train_loss": -25.748289108276367, "global_step": 328241, "epoch": 3954} {"train_loss": -25.62900733947754, "global_step": 328242, "epoch": 3954} {"train_loss": -26.3038272857666, "global_step": 328243, "epoch": 3954} {"train_loss": -25.8716983795166, "global_step": 328244, "epoch": 3954} {"train_loss": -26.048450469970703, "global_step": 328245, "epoch": 3954} {"train_loss": -25.857410430908203, "global_step": 328246, "epoch": 3954} {"train_loss": -25.935016632080078, "global_step": 328247, "epoch": 3954} {"train_loss": -26.179412841796875, "global_step": 328248, "epoch": 3954} {"train_loss": -26.053730010986328, "global_step": 328249, "epoch": 3954} {"train_loss": -25.90105628967285, "global_step": 328250, "epoch": 3954} {"train_loss": -26.268415451049805, "global_step": 328251, "epoch": 3954} {"train_loss": -26.137243270874023, "global_step": 328252, "epoch": 3954} {"train_loss": -26.396697998046875, "global_step": 328253, "epoch": 3954} {"train_loss": -25.700824737548828, "global_step": 328254, "epoch": 3954} {"train_loss": -26.17401695251465, "global_step": 328255, "epoch": 3954} {"train_loss": -26.06609535217285, "global_step": 328256, "epoch": 3954} {"train_loss": -25.91682243347168, "global_step": 328257, "epoch": 3954} {"train_loss": -25.7821102142334, "global_step": 328258, "epoch": 3954} {"train_loss": -25.859617233276367, "global_step": 328259, "epoch": 3954} {"train_loss": -26.089773178100586, "global_step": 328260, "epoch": 3954} {"train_loss": -25.910358428955078, "global_step": 328261, "epoch": 3954} {"train_loss": -25.99212074279785, "global_step": 328262, "epoch": 3954} {"train_loss": -26.29975700378418, "global_step": 328263, "epoch": 3954} {"train_loss": -25.84638843766178, "global_step": 328264, "epoch": 3954, "val_loss": 7222962.5} {"train_loss": -25.348299026489258, "global_step": 328265, "epoch": 3955} {"train_loss": -25.45977020263672, "global_step": 328266, "epoch": 3955} {"train_loss": -25.563840866088867, "global_step": 328267, "epoch": 3955} {"train_loss": -25.934656143188477, "global_step": 328268, "epoch": 3955} {"train_loss": -25.968551635742188, "global_step": 328269, "epoch": 3955} {"train_loss": -25.913806915283203, "global_step": 328270, "epoch": 3955} {"train_loss": -25.818073272705078, "global_step": 328271, "epoch": 3955} {"train_loss": -25.53510093688965, "global_step": 328272, "epoch": 3955} {"train_loss": -25.618473052978516, "global_step": 328273, "epoch": 3955} {"train_loss": -26.00442886352539, "global_step": 328274, "epoch": 3955} {"train_loss": -25.612628936767578, "global_step": 328275, "epoch": 3955} {"train_loss": -26.03023338317871, "global_step": 328276, "epoch": 3955} {"train_loss": -26.412235260009766, "global_step": 328277, "epoch": 3955} {"train_loss": -25.558977127075195, "global_step": 328278, "epoch": 3955} {"train_loss": -25.981504440307617, "global_step": 328279, "epoch": 3955} {"train_loss": -25.684858322143555, "global_step": 328280, "epoch": 3955} {"train_loss": -25.912872314453125, "global_step": 328281, "epoch": 3955} {"train_loss": -25.784448623657227, "global_step": 328282, "epoch": 3955} {"train_loss": -25.944067001342773, "global_step": 328283, "epoch": 3955} {"train_loss": -25.95609474182129, "global_step": 328284, "epoch": 3955} {"train_loss": -25.854055404663086, "global_step": 328285, "epoch": 3955} {"train_loss": -25.744016647338867, "global_step": 328286, "epoch": 3955} {"train_loss": -25.866540908813477, "global_step": 328287, "epoch": 3955} {"train_loss": -25.90180015563965, "global_step": 328288, "epoch": 3955} {"train_loss": -26.04026222229004, "global_step": 328289, "epoch": 3955} {"train_loss": -26.01896095275879, "global_step": 328290, "epoch": 3955} {"train_loss": -26.2503604888916, "global_step": 328291, "epoch": 3955} {"train_loss": -26.03059196472168, "global_step": 328292, "epoch": 3955} {"train_loss": -25.919620513916016, "global_step": 328293, "epoch": 3955} {"train_loss": -25.959320068359375, "global_step": 328294, "epoch": 3955} {"train_loss": -26.08721351623535, "global_step": 328295, "epoch": 3955} {"train_loss": -25.889066696166992, "global_step": 328296, "epoch": 3955} {"train_loss": -26.146900177001953, "global_step": 328297, "epoch": 3955} {"train_loss": -25.954328536987305, "global_step": 328298, "epoch": 3955} {"train_loss": -25.633413314819336, "global_step": 328299, "epoch": 3955} {"train_loss": -25.894378662109375, "global_step": 328300, "epoch": 3955} {"train_loss": -26.357419967651367, "global_step": 328301, "epoch": 3955} {"train_loss": -25.779617309570312, "global_step": 328302, "epoch": 3955} {"train_loss": -26.023324966430664, "global_step": 328303, "epoch": 3955} {"train_loss": -25.846994400024414, "global_step": 328304, "epoch": 3955} {"train_loss": -25.663089752197266, "global_step": 328305, "epoch": 3955} {"train_loss": -26.222726821899414, "global_step": 328306, "epoch": 3955} {"train_loss": -25.805831909179688, "global_step": 328307, "epoch": 3955} {"train_loss": -25.973575592041016, "global_step": 328308, "epoch": 3955} {"train_loss": -26.26045036315918, "global_step": 328309, "epoch": 3955} {"train_loss": -26.063318252563477, "global_step": 328310, "epoch": 3955} {"train_loss": -26.07147216796875, "global_step": 328311, "epoch": 3955} {"train_loss": -25.918289184570312, "global_step": 328312, "epoch": 3955} {"train_loss": -26.123937606811523, "global_step": 328313, "epoch": 3955} {"train_loss": -25.944244384765625, "global_step": 328314, "epoch": 3955} {"train_loss": -26.084457397460938, "global_step": 328315, "epoch": 3955} {"train_loss": -26.23154067993164, "global_step": 328316, "epoch": 3955} {"train_loss": -26.10272216796875, "global_step": 328317, "epoch": 3955} {"train_loss": -26.320270538330078, "global_step": 328318, "epoch": 3955} {"train_loss": -25.912342071533203, "global_step": 328319, "epoch": 3955} {"train_loss": -25.854299545288086, "global_step": 328320, "epoch": 3955} {"train_loss": -25.846464157104492, "global_step": 328321, "epoch": 3955} {"train_loss": -26.035581588745117, "global_step": 328322, "epoch": 3955} {"train_loss": -25.866840362548828, "global_step": 328323, "epoch": 3955} {"train_loss": -26.19655418395996, "global_step": 328324, "epoch": 3955} {"train_loss": -26.039716720581055, "global_step": 328325, "epoch": 3955} {"train_loss": -25.53886604309082, "global_step": 328326, "epoch": 3955} {"train_loss": -25.17693328857422, "global_step": 328327, "epoch": 3955} {"train_loss": -25.13132095336914, "global_step": 328328, "epoch": 3955} {"train_loss": -25.502302169799805, "global_step": 328329, "epoch": 3955} {"train_loss": -26.25855827331543, "global_step": 328330, "epoch": 3955} {"train_loss": -25.60285758972168, "global_step": 328331, "epoch": 3955} {"train_loss": -25.355867385864258, "global_step": 328332, "epoch": 3955} {"train_loss": -25.49518394470215, "global_step": 328333, "epoch": 3955} {"train_loss": -25.782819747924805, "global_step": 328334, "epoch": 3955} {"train_loss": -25.493993759155273, "global_step": 328335, "epoch": 3955} {"train_loss": -25.597148895263672, "global_step": 328336, "epoch": 3955} {"train_loss": -25.78411293029785, "global_step": 328337, "epoch": 3955} {"train_loss": -25.89934730529785, "global_step": 328338, "epoch": 3955} {"train_loss": -25.54306411743164, "global_step": 328339, "epoch": 3955} {"train_loss": -26.049386978149414, "global_step": 328340, "epoch": 3955} {"train_loss": -25.678409576416016, "global_step": 328341, "epoch": 3955} {"train_loss": -25.8789119720459, "global_step": 328342, "epoch": 3955} {"train_loss": -26.179962158203125, "global_step": 328343, "epoch": 3955} {"train_loss": -26.02475357055664, "global_step": 328344, "epoch": 3955} {"train_loss": -25.806570053100586, "global_step": 328345, "epoch": 3955} {"train_loss": -26.080549240112305, "global_step": 328346, "epoch": 3955} {"train_loss": -25.874357062650013, "global_step": 328347, "epoch": 3955, "val_loss": 7290616.5} {"train_loss": -25.63825035095215, "global_step": 328348, "epoch": 3956} {"train_loss": -25.809118270874023, "global_step": 328349, "epoch": 3956} {"train_loss": -25.58753204345703, "global_step": 328350, "epoch": 3956} {"train_loss": -25.791147232055664, "global_step": 328351, "epoch": 3956} {"train_loss": -25.78464126586914, "global_step": 328352, "epoch": 3956} {"train_loss": -25.650266647338867, "global_step": 328353, "epoch": 3956} {"train_loss": -25.686368942260742, "global_step": 328354, "epoch": 3956} {"train_loss": -25.491352081298828, "global_step": 328355, "epoch": 3956} {"train_loss": -25.22679901123047, "global_step": 328356, "epoch": 3956} {"train_loss": -25.691486358642578, "global_step": 328357, "epoch": 3956} {"train_loss": -25.746835708618164, "global_step": 328358, "epoch": 3956} {"train_loss": -26.067594528198242, "global_step": 328359, "epoch": 3956} {"train_loss": -25.575082778930664, "global_step": 328360, "epoch": 3956} {"train_loss": -25.720458984375, "global_step": 328361, "epoch": 3956} {"train_loss": -25.47011375427246, "global_step": 328362, "epoch": 3956} {"train_loss": -25.685373306274414, "global_step": 328363, "epoch": 3956} {"train_loss": -25.901838302612305, "global_step": 328364, "epoch": 3956} {"train_loss": -25.549985885620117, "global_step": 328365, "epoch": 3956} {"train_loss": -26.028676986694336, "global_step": 328366, "epoch": 3956} {"train_loss": -25.659494400024414, "global_step": 328367, "epoch": 3956} {"train_loss": -25.958898544311523, "global_step": 328368, "epoch": 3956} {"train_loss": -25.505216598510742, "global_step": 328369, "epoch": 3956} {"train_loss": -25.96698570251465, "global_step": 328370, "epoch": 3956} {"train_loss": -25.881580352783203, "global_step": 328371, "epoch": 3956} {"train_loss": -26.211530685424805, "global_step": 328372, "epoch": 3956} {"train_loss": -25.87611198425293, "global_step": 328373, "epoch": 3956} {"train_loss": -26.116491317749023, "global_step": 328374, "epoch": 3956} {"train_loss": -25.903244018554688, "global_step": 328375, "epoch": 3956} {"train_loss": -26.064123153686523, "global_step": 328376, "epoch": 3956} {"train_loss": -26.07318687438965, "global_step": 328377, "epoch": 3956} {"train_loss": -25.685937881469727, "global_step": 328378, "epoch": 3956} {"train_loss": -26.139429092407227, "global_step": 328379, "epoch": 3956} {"train_loss": -26.0458984375, "global_step": 328380, "epoch": 3956} {"train_loss": -26.29412269592285, "global_step": 328381, "epoch": 3956} {"train_loss": -26.217487335205078, "global_step": 328382, "epoch": 3956} {"train_loss": -26.244943618774414, "global_step": 328383, "epoch": 3956} {"train_loss": -26.034656524658203, "global_step": 328384, "epoch": 3956} {"train_loss": -26.232669830322266, "global_step": 328385, "epoch": 3956} {"train_loss": -26.275068283081055, "global_step": 328386, "epoch": 3956} {"train_loss": -26.28215980529785, "global_step": 328387, "epoch": 3956} {"train_loss": -25.74005126953125, "global_step": 328388, "epoch": 3956} {"train_loss": -26.22956657409668, "global_step": 328389, "epoch": 3956} {"train_loss": -26.1436710357666, "global_step": 328390, "epoch": 3956} {"train_loss": -25.8045654296875, "global_step": 328391, "epoch": 3956} {"train_loss": -26.07215690612793, "global_step": 328392, "epoch": 3956} {"train_loss": -25.794803619384766, "global_step": 328393, "epoch": 3956} {"train_loss": -26.061391830444336, "global_step": 328394, "epoch": 3956} {"train_loss": -25.586339950561523, "global_step": 328395, "epoch": 3956} {"train_loss": -25.9688777923584, "global_step": 328396, "epoch": 3956} {"train_loss": -26.09754753112793, "global_step": 328397, "epoch": 3956} {"train_loss": -26.461339950561523, "global_step": 328398, "epoch": 3956} {"train_loss": -26.160568237304688, "global_step": 328399, "epoch": 3956} {"train_loss": -25.831317901611328, "global_step": 328400, "epoch": 3956} {"train_loss": -26.069822311401367, "global_step": 328401, "epoch": 3956} {"train_loss": -26.266584396362305, "global_step": 328402, "epoch": 3956} {"train_loss": -26.321569442749023, "global_step": 328403, "epoch": 3956} {"train_loss": -25.595714569091797, "global_step": 328404, "epoch": 3956} {"train_loss": -24.992733001708984, "global_step": 328405, "epoch": 3956} {"train_loss": -25.130292892456055, "global_step": 328406, "epoch": 3956} {"train_loss": -25.26716423034668, "global_step": 328407, "epoch": 3956} {"train_loss": -25.763540267944336, "global_step": 328408, "epoch": 3956} {"train_loss": -26.060134887695312, "global_step": 328409, "epoch": 3956} {"train_loss": -25.814056396484375, "global_step": 328410, "epoch": 3956} {"train_loss": -25.691486358642578, "global_step": 328411, "epoch": 3956} {"train_loss": -25.582355499267578, "global_step": 328412, "epoch": 3956} {"train_loss": -26.236663818359375, "global_step": 328413, "epoch": 3956} {"train_loss": -25.900922775268555, "global_step": 328414, "epoch": 3956} {"train_loss": -25.519237518310547, "global_step": 328415, "epoch": 3956} {"train_loss": -26.015615463256836, "global_step": 328416, "epoch": 3956} {"train_loss": -25.999744415283203, "global_step": 328417, "epoch": 3956} {"train_loss": -25.84076499938965, "global_step": 328418, "epoch": 3956} {"train_loss": -26.18794059753418, "global_step": 328419, "epoch": 3956} {"train_loss": -25.895328521728516, "global_step": 328420, "epoch": 3956} {"train_loss": -25.8542423248291, "global_step": 328421, "epoch": 3956} {"train_loss": -25.711355209350586, "global_step": 328422, "epoch": 3956} {"train_loss": -25.44025421142578, "global_step": 328423, "epoch": 3956} {"train_loss": -26.17633628845215, "global_step": 328424, "epoch": 3956} {"train_loss": -26.02546501159668, "global_step": 328425, "epoch": 3956} {"train_loss": -26.042753219604492, "global_step": 328426, "epoch": 3956} {"train_loss": -26.209491729736328, "global_step": 328427, "epoch": 3956} {"train_loss": -25.939706802368164, "global_step": 328428, "epoch": 3956} {"train_loss": -25.899686813354492, "global_step": 328429, "epoch": 3956} {"train_loss": -25.88818444401385, "global_step": 328430, "epoch": 3956, "val_loss": 7187212.0} {"train_loss": -25.505685806274414, "global_step": 328431, "epoch": 3957} {"train_loss": -25.7796688079834, "global_step": 328432, "epoch": 3957} {"train_loss": -25.920331954956055, "global_step": 328433, "epoch": 3957} {"train_loss": -25.6610107421875, "global_step": 328434, "epoch": 3957} {"train_loss": -26.22002601623535, "global_step": 328435, "epoch": 3957} {"train_loss": -25.828439712524414, "global_step": 328436, "epoch": 3957} {"train_loss": -25.99985122680664, "global_step": 328437, "epoch": 3957} {"train_loss": -25.607492446899414, "global_step": 328438, "epoch": 3957} {"train_loss": -25.72162437438965, "global_step": 328439, "epoch": 3957} {"train_loss": -25.908594131469727, "global_step": 328440, "epoch": 3957} {"train_loss": -25.923994064331055, "global_step": 328441, "epoch": 3957} {"train_loss": -25.603534698486328, "global_step": 328442, "epoch": 3957} {"train_loss": -25.574525833129883, "global_step": 328443, "epoch": 3957} {"train_loss": -25.430173873901367, "global_step": 328444, "epoch": 3957} {"train_loss": -26.059955596923828, "global_step": 328445, "epoch": 3957} {"train_loss": -25.694232940673828, "global_step": 328446, "epoch": 3957} {"train_loss": -25.603174209594727, "global_step": 328447, "epoch": 3957} {"train_loss": -26.00977897644043, "global_step": 328448, "epoch": 3957} {"train_loss": -25.695484161376953, "global_step": 328449, "epoch": 3957} {"train_loss": -26.141271591186523, "global_step": 328450, "epoch": 3957} {"train_loss": -26.004745483398438, "global_step": 328451, "epoch": 3957} {"train_loss": -25.757266998291016, "global_step": 328452, "epoch": 3957} {"train_loss": -26.0033016204834, "global_step": 328453, "epoch": 3957} {"train_loss": -25.85210609436035, "global_step": 328454, "epoch": 3957} {"train_loss": -25.90131950378418, "global_step": 328455, "epoch": 3957} {"train_loss": -26.13750648498535, "global_step": 328456, "epoch": 3957} {"train_loss": -25.707782745361328, "global_step": 328457, "epoch": 3957} {"train_loss": -26.200780868530273, "global_step": 328458, "epoch": 3957} {"train_loss": -25.97263526916504, "global_step": 328459, "epoch": 3957} {"train_loss": -25.792179107666016, "global_step": 328460, "epoch": 3957} {"train_loss": -26.12598991394043, "global_step": 328461, "epoch": 3957} {"train_loss": -26.116622924804688, "global_step": 328462, "epoch": 3957} {"train_loss": -25.873992919921875, "global_step": 328463, "epoch": 3957} {"train_loss": -25.804901123046875, "global_step": 328464, "epoch": 3957} {"train_loss": -25.33141326904297, "global_step": 328465, "epoch": 3957} {"train_loss": -25.590839385986328, "global_step": 328466, "epoch": 3957} {"train_loss": -26.00002098083496, "global_step": 328467, "epoch": 3957} {"train_loss": -26.155141830444336, "global_step": 328468, "epoch": 3957} {"train_loss": -26.358596801757812, "global_step": 328469, "epoch": 3957} {"train_loss": -26.091846466064453, "global_step": 328470, "epoch": 3957} {"train_loss": -26.109411239624023, "global_step": 328471, "epoch": 3957} {"train_loss": -26.172943115234375, "global_step": 328472, "epoch": 3957} {"train_loss": -26.2266788482666, "global_step": 328473, "epoch": 3957} {"train_loss": -25.67310905456543, "global_step": 328474, "epoch": 3957} {"train_loss": -25.588523864746094, "global_step": 328475, "epoch": 3957} {"train_loss": -25.76642417907715, "global_step": 328476, "epoch": 3957} {"train_loss": -26.017990112304688, "global_step": 328477, "epoch": 3957} {"train_loss": -25.719181060791016, "global_step": 328478, "epoch": 3957} {"train_loss": -25.909147262573242, "global_step": 328479, "epoch": 3957} {"train_loss": -25.921491622924805, "global_step": 328480, "epoch": 3957} {"train_loss": -26.1592960357666, "global_step": 328481, "epoch": 3957} {"train_loss": -25.810699462890625, "global_step": 328482, "epoch": 3957} {"train_loss": -26.12152671813965, "global_step": 328483, "epoch": 3957} {"train_loss": -25.720006942749023, "global_step": 328484, "epoch": 3957} {"train_loss": -25.9724063873291, "global_step": 328485, "epoch": 3957} {"train_loss": -26.288288116455078, "global_step": 328486, "epoch": 3957} {"train_loss": -26.377172470092773, "global_step": 328487, "epoch": 3957} {"train_loss": -26.13880729675293, "global_step": 328488, "epoch": 3957} {"train_loss": -25.96792984008789, "global_step": 328489, "epoch": 3957} {"train_loss": -26.276493072509766, "global_step": 328490, "epoch": 3957} {"train_loss": -25.854572296142578, "global_step": 328491, "epoch": 3957} {"train_loss": -26.3542537689209, "global_step": 328492, "epoch": 3957} {"train_loss": -25.890003204345703, "global_step": 328493, "epoch": 3957} {"train_loss": -25.57598876953125, "global_step": 328494, "epoch": 3957} {"train_loss": -26.14702796936035, "global_step": 328495, "epoch": 3957} {"train_loss": -26.199411392211914, "global_step": 328496, "epoch": 3957} {"train_loss": -25.811391830444336, "global_step": 328497, "epoch": 3957} {"train_loss": -25.584287643432617, "global_step": 328498, "epoch": 3957} {"train_loss": -25.733535766601562, "global_step": 328499, "epoch": 3957} {"train_loss": -26.396799087524414, "global_step": 328500, "epoch": 3957} {"train_loss": -25.939905166625977, "global_step": 328501, "epoch": 3957} {"train_loss": -25.48483657836914, "global_step": 328502, "epoch": 3957} {"train_loss": -25.903364181518555, "global_step": 328503, "epoch": 3957} {"train_loss": -26.206823348999023, "global_step": 328504, "epoch": 3957} {"train_loss": -26.08353042602539, "global_step": 328505, "epoch": 3957} {"train_loss": -26.201513290405273, "global_step": 328506, "epoch": 3957} {"train_loss": -25.533172607421875, "global_step": 328507, "epoch": 3957} {"train_loss": -26.127593994140625, "global_step": 328508, "epoch": 3957} {"train_loss": -25.699880599975586, "global_step": 328509, "epoch": 3957} {"train_loss": -26.157629013061523, "global_step": 328510, "epoch": 3957} {"train_loss": -25.984710693359375, "global_step": 328511, "epoch": 3957} {"train_loss": -25.71877098083496, "global_step": 328512, "epoch": 3957} {"train_loss": -25.905582519898932, "global_step": 328513, "epoch": 3957, "val_loss": 7297910.0} {"train_loss": -25.7784481048584, "global_step": 328514, "epoch": 3958} {"train_loss": -25.756763458251953, "global_step": 328515, "epoch": 3958} {"train_loss": -25.3875789642334, "global_step": 328516, "epoch": 3958} {"train_loss": -25.9228572845459, "global_step": 328517, "epoch": 3958} {"train_loss": -25.500333786010742, "global_step": 328518, "epoch": 3958} {"train_loss": -25.892560958862305, "global_step": 328519, "epoch": 3958} {"train_loss": -25.540956497192383, "global_step": 328520, "epoch": 3958} {"train_loss": -25.827606201171875, "global_step": 328521, "epoch": 3958} {"train_loss": -25.8070011138916, "global_step": 328522, "epoch": 3958} {"train_loss": -25.65155029296875, "global_step": 328523, "epoch": 3958} {"train_loss": -25.690099716186523, "global_step": 328524, "epoch": 3958} {"train_loss": -25.81806755065918, "global_step": 328525, "epoch": 3958} {"train_loss": -25.551868438720703, "global_step": 328526, "epoch": 3958} {"train_loss": -25.66843605041504, "global_step": 328527, "epoch": 3958} {"train_loss": -25.802978515625, "global_step": 328528, "epoch": 3958} {"train_loss": -25.689838409423828, "global_step": 328529, "epoch": 3958} {"train_loss": -25.762250900268555, "global_step": 328530, "epoch": 3958} {"train_loss": -25.7755184173584, "global_step": 328531, "epoch": 3958} {"train_loss": -25.9296817779541, "global_step": 328532, "epoch": 3958} {"train_loss": -25.510778427124023, "global_step": 328533, "epoch": 3958} {"train_loss": -25.681081771850586, "global_step": 328534, "epoch": 3958} {"train_loss": -25.841693878173828, "global_step": 328535, "epoch": 3958} {"train_loss": -25.829862594604492, "global_step": 328536, "epoch": 3958} {"train_loss": -25.654111862182617, "global_step": 328537, "epoch": 3958} {"train_loss": -25.667097091674805, "global_step": 328538, "epoch": 3958} {"train_loss": -25.68548583984375, "global_step": 328539, "epoch": 3958} {"train_loss": -25.732648849487305, "global_step": 328540, "epoch": 3958} {"train_loss": -26.03145408630371, "global_step": 328541, "epoch": 3958} {"train_loss": -26.061756134033203, "global_step": 328542, "epoch": 3958} {"train_loss": -25.847339630126953, "global_step": 328543, "epoch": 3958} {"train_loss": -25.933130264282227, "global_step": 328544, "epoch": 3958} {"train_loss": -25.912893295288086, "global_step": 328545, "epoch": 3958} {"train_loss": -25.508037567138672, "global_step": 328546, "epoch": 3958} {"train_loss": -26.140522003173828, "global_step": 328547, "epoch": 3958} {"train_loss": -25.92307472229004, "global_step": 328548, "epoch": 3958} {"train_loss": -25.96296501159668, "global_step": 328549, "epoch": 3958} {"train_loss": -26.061767578125, "global_step": 328550, "epoch": 3958} {"train_loss": -25.74005126953125, "global_step": 328551, "epoch": 3958} {"train_loss": -25.834949493408203, "global_step": 328552, "epoch": 3958} {"train_loss": -26.0350341796875, "global_step": 328553, "epoch": 3958} {"train_loss": -26.02247428894043, "global_step": 328554, "epoch": 3958} {"train_loss": -25.937116622924805, "global_step": 328555, "epoch": 3958} {"train_loss": -26.581283569335938, "global_step": 328556, "epoch": 3958} {"train_loss": -26.395055770874023, "global_step": 328557, "epoch": 3958} {"train_loss": -25.800800323486328, "global_step": 328558, "epoch": 3958} {"train_loss": -25.93816566467285, "global_step": 328559, "epoch": 3958} {"train_loss": -26.34303855895996, "global_step": 328560, "epoch": 3958} {"train_loss": -25.842884063720703, "global_step": 328561, "epoch": 3958} {"train_loss": -26.197284698486328, "global_step": 328562, "epoch": 3958} {"train_loss": -26.180707931518555, "global_step": 328563, "epoch": 3958} {"train_loss": -26.481128692626953, "global_step": 328564, "epoch": 3958} {"train_loss": -25.87744140625, "global_step": 328565, "epoch": 3958} {"train_loss": -25.703466415405273, "global_step": 328566, "epoch": 3958} {"train_loss": -26.076812744140625, "global_step": 328567, "epoch": 3958} {"train_loss": -25.995956420898438, "global_step": 328568, "epoch": 3958} {"train_loss": -25.40423011779785, "global_step": 328569, "epoch": 3958} {"train_loss": -25.695114135742188, "global_step": 328570, "epoch": 3958} {"train_loss": -24.912141799926758, "global_step": 328571, "epoch": 3958} {"train_loss": -25.619556427001953, "global_step": 328572, "epoch": 3958} {"train_loss": -26.195148468017578, "global_step": 328573, "epoch": 3958} {"train_loss": -25.607465744018555, "global_step": 328574, "epoch": 3958} {"train_loss": -25.93598747253418, "global_step": 328575, "epoch": 3958} {"train_loss": -25.8852596282959, "global_step": 328576, "epoch": 3958} {"train_loss": -25.997465133666992, "global_step": 328577, "epoch": 3958} {"train_loss": -25.953229904174805, "global_step": 328578, "epoch": 3958} {"train_loss": -26.085779190063477, "global_step": 328579, "epoch": 3958} {"train_loss": -26.03420066833496, "global_step": 328580, "epoch": 3958} {"train_loss": -26.00678062438965, "global_step": 328581, "epoch": 3958} {"train_loss": -26.040576934814453, "global_step": 328582, "epoch": 3958} {"train_loss": -26.0230712890625, "global_step": 328583, "epoch": 3958} {"train_loss": -25.931211471557617, "global_step": 328584, "epoch": 3958} {"train_loss": -25.57572364807129, "global_step": 328585, "epoch": 3958} {"train_loss": -26.266510009765625, "global_step": 328586, "epoch": 3958} {"train_loss": -26.181549072265625, "global_step": 328587, "epoch": 3958} {"train_loss": -25.73817253112793, "global_step": 328588, "epoch": 3958} {"train_loss": -26.302637100219727, "global_step": 328589, "epoch": 3958} {"train_loss": -25.85560417175293, "global_step": 328590, "epoch": 3958} {"train_loss": -25.615171432495117, "global_step": 328591, "epoch": 3958} {"train_loss": -25.961750030517578, "global_step": 328592, "epoch": 3958} {"train_loss": -25.88226318359375, "global_step": 328593, "epoch": 3958} {"train_loss": -25.919702529907227, "global_step": 328594, "epoch": 3958} {"train_loss": -25.7745304107666, "global_step": 328595, "epoch": 3958} {"train_loss": -25.866625958178417, "global_step": 328596, "epoch": 3958, "val_loss": 7227814.0} {"train_loss": -24.954984664916992, "global_step": 328597, "epoch": 3959} {"train_loss": -25.58547592163086, "global_step": 328598, "epoch": 3959} {"train_loss": -25.414316177368164, "global_step": 328599, "epoch": 3959} {"train_loss": -25.384187698364258, "global_step": 328600, "epoch": 3959} {"train_loss": -25.74574089050293, "global_step": 328601, "epoch": 3959} {"train_loss": -25.56833267211914, "global_step": 328602, "epoch": 3959} {"train_loss": -25.487226486206055, "global_step": 328603, "epoch": 3959} {"train_loss": -25.543437957763672, "global_step": 328604, "epoch": 3959} {"train_loss": -25.879638671875, "global_step": 328605, "epoch": 3959} {"train_loss": -25.825448989868164, "global_step": 328606, "epoch": 3959} {"train_loss": -25.632831573486328, "global_step": 328607, "epoch": 3959} {"train_loss": -25.586774826049805, "global_step": 328608, "epoch": 3959} {"train_loss": -26.038848876953125, "global_step": 328609, "epoch": 3959} {"train_loss": -25.388286590576172, "global_step": 328610, "epoch": 3959} {"train_loss": -25.83318519592285, "global_step": 328611, "epoch": 3959} {"train_loss": -26.242374420166016, "global_step": 328612, "epoch": 3959} {"train_loss": -25.986536026000977, "global_step": 328613, "epoch": 3959} {"train_loss": -25.980173110961914, "global_step": 328614, "epoch": 3959} {"train_loss": -26.136234283447266, "global_step": 328615, "epoch": 3959} {"train_loss": -25.832258224487305, "global_step": 328616, "epoch": 3959} {"train_loss": -25.91651725769043, "global_step": 328617, "epoch": 3959} {"train_loss": -25.984012603759766, "global_step": 328618, "epoch": 3959} {"train_loss": -26.107152938842773, "global_step": 328619, "epoch": 3959} {"train_loss": -26.0393123626709, "global_step": 328620, "epoch": 3959} {"train_loss": -25.820398330688477, "global_step": 328621, "epoch": 3959} {"train_loss": -25.780975341796875, "global_step": 328622, "epoch": 3959} {"train_loss": -26.1162109375, "global_step": 328623, "epoch": 3959} {"train_loss": -25.745731353759766, "global_step": 328624, "epoch": 3959} {"train_loss": -25.915685653686523, "global_step": 328625, "epoch": 3959} {"train_loss": -25.445484161376953, "global_step": 328626, "epoch": 3959} {"train_loss": -26.169355392456055, "global_step": 328627, "epoch": 3959} {"train_loss": -25.791370391845703, "global_step": 328628, "epoch": 3959} {"train_loss": -25.611103057861328, "global_step": 328629, "epoch": 3959} {"train_loss": -25.664321899414062, "global_step": 328630, "epoch": 3959} {"train_loss": -25.90179443359375, "global_step": 328631, "epoch": 3959} {"train_loss": -25.84659194946289, "global_step": 328632, "epoch": 3959} {"train_loss": -25.693470001220703, "global_step": 328633, "epoch": 3959} {"train_loss": -25.8885440826416, "global_step": 328634, "epoch": 3959} {"train_loss": -25.660696029663086, "global_step": 328635, "epoch": 3959} {"train_loss": -25.9984188079834, "global_step": 328636, "epoch": 3959} {"train_loss": -26.194873809814453, "global_step": 328637, "epoch": 3959} {"train_loss": -25.793729782104492, "global_step": 328638, "epoch": 3959} {"train_loss": -25.8718204498291, "global_step": 328639, "epoch": 3959} {"train_loss": -25.885883331298828, "global_step": 328640, "epoch": 3959} {"train_loss": -25.564594268798828, "global_step": 328641, "epoch": 3959} {"train_loss": -26.137348175048828, "global_step": 328642, "epoch": 3959} {"train_loss": -25.856800079345703, "global_step": 328643, "epoch": 3959} {"train_loss": -25.941186904907227, "global_step": 328644, "epoch": 3959} {"train_loss": -26.02314567565918, "global_step": 328645, "epoch": 3959} {"train_loss": -25.882360458374023, "global_step": 328646, "epoch": 3959} {"train_loss": -26.202255249023438, "global_step": 328647, "epoch": 3959} {"train_loss": -26.35347557067871, "global_step": 328648, "epoch": 3959} {"train_loss": -25.878559112548828, "global_step": 328649, "epoch": 3959} {"train_loss": -26.243383407592773, "global_step": 328650, "epoch": 3959} {"train_loss": -26.147546768188477, "global_step": 328651, "epoch": 3959} {"train_loss": -25.718366622924805, "global_step": 328652, "epoch": 3959} {"train_loss": -25.939453125, "global_step": 328653, "epoch": 3959} {"train_loss": -25.818344116210938, "global_step": 328654, "epoch": 3959} {"train_loss": -25.88995933532715, "global_step": 328655, "epoch": 3959} {"train_loss": -25.9844913482666, "global_step": 328656, "epoch": 3959} {"train_loss": -26.02921485900879, "global_step": 328657, "epoch": 3959} {"train_loss": -26.16480827331543, "global_step": 328658, "epoch": 3959} {"train_loss": -26.019275665283203, "global_step": 328659, "epoch": 3959} {"train_loss": -25.872955322265625, "global_step": 328660, "epoch": 3959} {"train_loss": -26.055435180664062, "global_step": 328661, "epoch": 3959} {"train_loss": -26.065954208374023, "global_step": 328662, "epoch": 3959} {"train_loss": -26.430377960205078, "global_step": 328663, "epoch": 3959} {"train_loss": -26.053577423095703, "global_step": 328664, "epoch": 3959} {"train_loss": -25.891559600830078, "global_step": 328665, "epoch": 3959} {"train_loss": -26.234745025634766, "global_step": 328666, "epoch": 3959} {"train_loss": -26.112598419189453, "global_step": 328667, "epoch": 3959} {"train_loss": -26.029754638671875, "global_step": 328668, "epoch": 3959} {"train_loss": -25.971616744995117, "global_step": 328669, "epoch": 3959} {"train_loss": -26.13104248046875, "global_step": 328670, "epoch": 3959} {"train_loss": -25.6370849609375, "global_step": 328671, "epoch": 3959} {"train_loss": -25.775426864624023, "global_step": 328672, "epoch": 3959} {"train_loss": -26.326343536376953, "global_step": 328673, "epoch": 3959} {"train_loss": -26.073789596557617, "global_step": 328674, "epoch": 3959} {"train_loss": -25.920272827148438, "global_step": 328675, "epoch": 3959} {"train_loss": -25.954259872436523, "global_step": 328676, "epoch": 3959} {"train_loss": -25.976247787475586, "global_step": 328677, "epoch": 3959} {"train_loss": -25.539140701293945, "global_step": 328678, "epoch": 3959} {"train_loss": -25.877449334385883, "global_step": 328679, "epoch": 3959, "val_loss": 7206394.5} {"train_loss": -25.427640914916992, "global_step": 328680, "epoch": 3960} {"train_loss": -25.061038970947266, "global_step": 328681, "epoch": 3960} {"train_loss": -24.781949996948242, "global_step": 328682, "epoch": 3960} {"train_loss": -25.21454429626465, "global_step": 328683, "epoch": 3960} {"train_loss": -24.787796020507812, "global_step": 328684, "epoch": 3960} {"train_loss": -25.357641220092773, "global_step": 328685, "epoch": 3960} {"train_loss": -24.8316593170166, "global_step": 328686, "epoch": 3960} {"train_loss": -24.876781463623047, "global_step": 328687, "epoch": 3960} {"train_loss": -25.80183219909668, "global_step": 328688, "epoch": 3960} {"train_loss": -25.4285831451416, "global_step": 328689, "epoch": 3960} {"train_loss": -25.11244010925293, "global_step": 328690, "epoch": 3960} {"train_loss": -25.368885040283203, "global_step": 328691, "epoch": 3960} {"train_loss": -25.765411376953125, "global_step": 328692, "epoch": 3960} {"train_loss": -25.62247657775879, "global_step": 328693, "epoch": 3960} {"train_loss": -25.573537826538086, "global_step": 328694, "epoch": 3960} {"train_loss": -25.26413917541504, "global_step": 328695, "epoch": 3960} {"train_loss": -25.889240264892578, "global_step": 328696, "epoch": 3960} {"train_loss": -25.84527015686035, "global_step": 328697, "epoch": 3960} {"train_loss": -25.66431999206543, "global_step": 328698, "epoch": 3960} {"train_loss": -25.313613891601562, "global_step": 328699, "epoch": 3960} {"train_loss": -25.47261619567871, "global_step": 328700, "epoch": 3960} {"train_loss": -25.519775390625, "global_step": 328701, "epoch": 3960} {"train_loss": -25.793806076049805, "global_step": 328702, "epoch": 3960} {"train_loss": -25.634485244750977, "global_step": 328703, "epoch": 3960} {"train_loss": -26.090635299682617, "global_step": 328704, "epoch": 3960} {"train_loss": -25.874835968017578, "global_step": 328705, "epoch": 3960} {"train_loss": -25.435144424438477, "global_step": 328706, "epoch": 3960} {"train_loss": -25.958662033081055, "global_step": 328707, "epoch": 3960} {"train_loss": -25.5046329498291, "global_step": 328708, "epoch": 3960} {"train_loss": -25.8436336517334, "global_step": 328709, "epoch": 3960} {"train_loss": -25.628936767578125, "global_step": 328710, "epoch": 3960} {"train_loss": -25.679651260375977, "global_step": 328711, "epoch": 3960} {"train_loss": -25.888227462768555, "global_step": 328712, "epoch": 3960} {"train_loss": -26.178730010986328, "global_step": 328713, "epoch": 3960} {"train_loss": -25.68814468383789, "global_step": 328714, "epoch": 3960} {"train_loss": -25.798322677612305, "global_step": 328715, "epoch": 3960} {"train_loss": -25.654340744018555, "global_step": 328716, "epoch": 3960} {"train_loss": -25.785242080688477, "global_step": 328717, "epoch": 3960} {"train_loss": -26.189472198486328, "global_step": 328718, "epoch": 3960} {"train_loss": -26.03531265258789, "global_step": 328719, "epoch": 3960} {"train_loss": -25.643035888671875, "global_step": 328720, "epoch": 3960} {"train_loss": -25.766529083251953, "global_step": 328721, "epoch": 3960} {"train_loss": -25.992816925048828, "global_step": 328722, "epoch": 3960} {"train_loss": -25.9880428314209, "global_step": 328723, "epoch": 3960} {"train_loss": -26.048437118530273, "global_step": 328724, "epoch": 3960} {"train_loss": -26.083471298217773, "global_step": 328725, "epoch": 3960} {"train_loss": -26.192590713500977, "global_step": 328726, "epoch": 3960} {"train_loss": -26.069936752319336, "global_step": 328727, "epoch": 3960} {"train_loss": -25.945837020874023, "global_step": 328728, "epoch": 3960} {"train_loss": -25.856204986572266, "global_step": 328729, "epoch": 3960} {"train_loss": -25.887121200561523, "global_step": 328730, "epoch": 3960} {"train_loss": -26.2227725982666, "global_step": 328731, "epoch": 3960} {"train_loss": -25.54732322692871, "global_step": 328732, "epoch": 3960} {"train_loss": -26.098546981811523, "global_step": 328733, "epoch": 3960} {"train_loss": -25.805097579956055, "global_step": 328734, "epoch": 3960} {"train_loss": -26.158124923706055, "global_step": 328735, "epoch": 3960} {"train_loss": -26.0117244720459, "global_step": 328736, "epoch": 3960} {"train_loss": -25.912994384765625, "global_step": 328737, "epoch": 3960} {"train_loss": -25.953784942626953, "global_step": 328738, "epoch": 3960} {"train_loss": -26.07793617248535, "global_step": 328739, "epoch": 3960} {"train_loss": -25.68543815612793, "global_step": 328740, "epoch": 3960} {"train_loss": -25.980255126953125, "global_step": 328741, "epoch": 3960} {"train_loss": -25.926523208618164, "global_step": 328742, "epoch": 3960} {"train_loss": -25.894758224487305, "global_step": 328743, "epoch": 3960} {"train_loss": -26.138242721557617, "global_step": 328744, "epoch": 3960} {"train_loss": -25.78018569946289, "global_step": 328745, "epoch": 3960} {"train_loss": -25.898334503173828, "global_step": 328746, "epoch": 3960} {"train_loss": -25.913257598876953, "global_step": 328747, "epoch": 3960} {"train_loss": -25.955869674682617, "global_step": 328748, "epoch": 3960} {"train_loss": -25.816503524780273, "global_step": 328749, "epoch": 3960} {"train_loss": -25.716718673706055, "global_step": 328750, "epoch": 3960} {"train_loss": -26.524234771728516, "global_step": 328751, "epoch": 3960} {"train_loss": -26.018980026245117, "global_step": 328752, "epoch": 3960} {"train_loss": -25.735931396484375, "global_step": 328753, "epoch": 3960} {"train_loss": -25.50696563720703, "global_step": 328754, "epoch": 3960} {"train_loss": -25.58797264099121, "global_step": 328755, "epoch": 3960} {"train_loss": -25.808927536010742, "global_step": 328756, "epoch": 3960} {"train_loss": -25.831085205078125, "global_step": 328757, "epoch": 3960} {"train_loss": -25.713659286499023, "global_step": 328758, "epoch": 3960} {"train_loss": -25.86594581604004, "global_step": 328759, "epoch": 3960} {"train_loss": -25.473365783691406, "global_step": 328760, "epoch": 3960} {"train_loss": -25.64715576171875, "global_step": 328761, "epoch": 3960} {"train_loss": -25.737059443830006, "global_step": 328762, "epoch": 3960, "val_loss": 7201543.5} {"train_loss": -24.138187408447266, "global_step": 328763, "epoch": 3961} {"train_loss": -25.085920333862305, "global_step": 328764, "epoch": 3961} {"train_loss": -24.84322166442871, "global_step": 328765, "epoch": 3961} {"train_loss": -24.65119171142578, "global_step": 328766, "epoch": 3961} {"train_loss": -24.523822784423828, "global_step": 328767, "epoch": 3961} {"train_loss": -24.798486709594727, "global_step": 328768, "epoch": 3961} {"train_loss": -25.58730125427246, "global_step": 328769, "epoch": 3961} {"train_loss": -24.8807430267334, "global_step": 328770, "epoch": 3961} {"train_loss": -25.00616455078125, "global_step": 328771, "epoch": 3961} {"train_loss": -25.070369720458984, "global_step": 328772, "epoch": 3961} {"train_loss": -25.25038719177246, "global_step": 328773, "epoch": 3961} {"train_loss": -25.52146339416504, "global_step": 328774, "epoch": 3961} {"train_loss": -24.989749908447266, "global_step": 328775, "epoch": 3961} {"train_loss": -25.105079650878906, "global_step": 328776, "epoch": 3961} {"train_loss": -25.241928100585938, "global_step": 328777, "epoch": 3961} {"train_loss": -25.269445419311523, "global_step": 328778, "epoch": 3961} {"train_loss": -25.316152572631836, "global_step": 328779, "epoch": 3961} {"train_loss": -25.305784225463867, "global_step": 328780, "epoch": 3961} {"train_loss": -25.73744010925293, "global_step": 328781, "epoch": 3961} {"train_loss": -25.23335075378418, "global_step": 328782, "epoch": 3961} {"train_loss": -25.39920425415039, "global_step": 328783, "epoch": 3961} {"train_loss": -25.820051193237305, "global_step": 328784, "epoch": 3961} {"train_loss": -25.54380226135254, "global_step": 328785, "epoch": 3961} {"train_loss": -25.392587661743164, "global_step": 328786, "epoch": 3961} {"train_loss": -25.54521942138672, "global_step": 328787, "epoch": 3961} {"train_loss": -25.79461669921875, "global_step": 328788, "epoch": 3961} {"train_loss": -25.175132751464844, "global_step": 328789, "epoch": 3961} {"train_loss": -25.530529022216797, "global_step": 328790, "epoch": 3961} {"train_loss": -25.53436279296875, "global_step": 328791, "epoch": 3961} {"train_loss": -25.949111938476562, "global_step": 328792, "epoch": 3961} {"train_loss": -25.689237594604492, "global_step": 328793, "epoch": 3961} {"train_loss": -25.72700309753418, "global_step": 328794, "epoch": 3961} {"train_loss": -26.1435489654541, "global_step": 328795, "epoch": 3961} {"train_loss": -26.130264282226562, "global_step": 328796, "epoch": 3961} {"train_loss": -26.205175399780273, "global_step": 328797, "epoch": 3961} {"train_loss": -25.823272705078125, "global_step": 328798, "epoch": 3961} {"train_loss": -25.933347702026367, "global_step": 328799, "epoch": 3961} {"train_loss": -25.84210777282715, "global_step": 328800, "epoch": 3961} {"train_loss": -25.770105361938477, "global_step": 328801, "epoch": 3961} {"train_loss": -25.752004623413086, "global_step": 328802, "epoch": 3961} {"train_loss": -26.07810401916504, "global_step": 328803, "epoch": 3961} {"train_loss": -25.600006103515625, "global_step": 328804, "epoch": 3961} {"train_loss": -25.928979873657227, "global_step": 328805, "epoch": 3961} {"train_loss": -26.4278507232666, "global_step": 328806, "epoch": 3961} {"train_loss": -25.902013778686523, "global_step": 328807, "epoch": 3961} {"train_loss": -25.816455841064453, "global_step": 328808, "epoch": 3961} {"train_loss": -26.025171279907227, "global_step": 328809, "epoch": 3961} {"train_loss": -26.270435333251953, "global_step": 328810, "epoch": 3961} {"train_loss": -25.3850154876709, "global_step": 328811, "epoch": 3961} {"train_loss": -26.2281494140625, "global_step": 328812, "epoch": 3961} {"train_loss": -25.876602172851562, "global_step": 328813, "epoch": 3961} {"train_loss": -25.75728416442871, "global_step": 328814, "epoch": 3961} {"train_loss": -25.766529083251953, "global_step": 328815, "epoch": 3961} {"train_loss": -26.07819175720215, "global_step": 328816, "epoch": 3961} {"train_loss": -25.706064224243164, "global_step": 328817, "epoch": 3961} {"train_loss": -25.75931739807129, "global_step": 328818, "epoch": 3961} {"train_loss": -26.187835693359375, "global_step": 328819, "epoch": 3961} {"train_loss": -26.023473739624023, "global_step": 328820, "epoch": 3961} {"train_loss": -26.113433837890625, "global_step": 328821, "epoch": 3961} {"train_loss": -25.980365753173828, "global_step": 328822, "epoch": 3961} {"train_loss": -25.949756622314453, "global_step": 328823, "epoch": 3961} {"train_loss": -26.067508697509766, "global_step": 328824, "epoch": 3961} {"train_loss": -25.735986709594727, "global_step": 328825, "epoch": 3961} {"train_loss": -25.970006942749023, "global_step": 328826, "epoch": 3961} {"train_loss": -25.692991256713867, "global_step": 328827, "epoch": 3961} {"train_loss": -25.665449142456055, "global_step": 328828, "epoch": 3961} {"train_loss": -25.601459503173828, "global_step": 328829, "epoch": 3961} {"train_loss": -26.240676879882812, "global_step": 328830, "epoch": 3961} {"train_loss": -25.960983276367188, "global_step": 328831, "epoch": 3961} {"train_loss": -26.066965103149414, "global_step": 328832, "epoch": 3961} {"train_loss": -25.923120498657227, "global_step": 328833, "epoch": 3961} {"train_loss": -25.60138511657715, "global_step": 328834, "epoch": 3961} {"train_loss": -25.31199073791504, "global_step": 328835, "epoch": 3961} {"train_loss": -25.088523864746094, "global_step": 328836, "epoch": 3961} {"train_loss": -24.92708396911621, "global_step": 328837, "epoch": 3961} {"train_loss": -25.2285099029541, "global_step": 328838, "epoch": 3961} {"train_loss": -25.740829467773438, "global_step": 328839, "epoch": 3961} {"train_loss": -25.793649673461914, "global_step": 328840, "epoch": 3961} {"train_loss": -25.459230422973633, "global_step": 328841, "epoch": 3961} {"train_loss": -25.474185943603516, "global_step": 328842, "epoch": 3961} {"train_loss": -25.472190856933594, "global_step": 328843, "epoch": 3961} {"train_loss": -25.66719627380371, "global_step": 328844, "epoch": 3961} {"train_loss": -25.619620288710998, "global_step": 328845, "epoch": 3961, "val_loss": 7350955.0} {"train_loss": -25.21708869934082, "global_step": 328846, "epoch": 3962} {"train_loss": -25.128419876098633, "global_step": 328847, "epoch": 3962} {"train_loss": -25.01569175720215, "global_step": 328848, "epoch": 3962} {"train_loss": -25.3093204498291, "global_step": 328849, "epoch": 3962} {"train_loss": -25.28629493713379, "global_step": 328850, "epoch": 3962} {"train_loss": -25.073596954345703, "global_step": 328851, "epoch": 3962} {"train_loss": -25.461822509765625, "global_step": 328852, "epoch": 3962} {"train_loss": -25.48016929626465, "global_step": 328853, "epoch": 3962} {"train_loss": -25.489580154418945, "global_step": 328854, "epoch": 3962} {"train_loss": -25.470502853393555, "global_step": 328855, "epoch": 3962} {"train_loss": -25.437240600585938, "global_step": 328856, "epoch": 3962} {"train_loss": -25.041296005249023, "global_step": 328857, "epoch": 3962} {"train_loss": -25.299474716186523, "global_step": 328858, "epoch": 3962} {"train_loss": -25.47408103942871, "global_step": 328859, "epoch": 3962} {"train_loss": -25.504133224487305, "global_step": 328860, "epoch": 3962} {"train_loss": -26.040674209594727, "global_step": 328861, "epoch": 3962} {"train_loss": -25.87528419494629, "global_step": 328862, "epoch": 3962} {"train_loss": -25.73355484008789, "global_step": 328863, "epoch": 3962} {"train_loss": -25.774682998657227, "global_step": 328864, "epoch": 3962} {"train_loss": -25.441238403320312, "global_step": 328865, "epoch": 3962} {"train_loss": -25.642099380493164, "global_step": 328866, "epoch": 3962} {"train_loss": -25.423254013061523, "global_step": 328867, "epoch": 3962} {"train_loss": -25.670578002929688, "global_step": 328868, "epoch": 3962} {"train_loss": -25.68674087524414, "global_step": 328869, "epoch": 3962} {"train_loss": -25.851720809936523, "global_step": 328870, "epoch": 3962} {"train_loss": -25.73821449279785, "global_step": 328871, "epoch": 3962} {"train_loss": -25.886133193969727, "global_step": 328872, "epoch": 3962} {"train_loss": -25.70746421813965, "global_step": 328873, "epoch": 3962} {"train_loss": -25.87723159790039, "global_step": 328874, "epoch": 3962} {"train_loss": -26.137405395507812, "global_step": 328875, "epoch": 3962} {"train_loss": -26.122268676757812, "global_step": 328876, "epoch": 3962} {"train_loss": -25.646692276000977, "global_step": 328877, "epoch": 3962} {"train_loss": -26.124719619750977, "global_step": 328878, "epoch": 3962} {"train_loss": -25.653202056884766, "global_step": 328879, "epoch": 3962} {"train_loss": -26.111740112304688, "global_step": 328880, "epoch": 3962} {"train_loss": -25.9097900390625, "global_step": 328881, "epoch": 3962} {"train_loss": -25.965579986572266, "global_step": 328882, "epoch": 3962} {"train_loss": -26.213159561157227, "global_step": 328883, "epoch": 3962} {"train_loss": -26.166532516479492, "global_step": 328884, "epoch": 3962} {"train_loss": -25.947423934936523, "global_step": 328885, "epoch": 3962} {"train_loss": -26.114057540893555, "global_step": 328886, "epoch": 3962} {"train_loss": -26.32257080078125, "global_step": 328887, "epoch": 3962} {"train_loss": -25.984546661376953, "global_step": 328888, "epoch": 3962} {"train_loss": -26.090497970581055, "global_step": 328889, "epoch": 3962} {"train_loss": -26.15484046936035, "global_step": 328890, "epoch": 3962} {"train_loss": -26.185941696166992, "global_step": 328891, "epoch": 3962} {"train_loss": -26.020212173461914, "global_step": 328892, "epoch": 3962} {"train_loss": -25.607290267944336, "global_step": 328893, "epoch": 3962} {"train_loss": -26.33155632019043, "global_step": 328894, "epoch": 3962} {"train_loss": -25.989974975585938, "global_step": 328895, "epoch": 3962} {"train_loss": -26.238269805908203, "global_step": 328896, "epoch": 3962} {"train_loss": -25.58693504333496, "global_step": 328897, "epoch": 3962} {"train_loss": -25.948551177978516, "global_step": 328898, "epoch": 3962} {"train_loss": -25.87286376953125, "global_step": 328899, "epoch": 3962} {"train_loss": -26.00982093811035, "global_step": 328900, "epoch": 3962} {"train_loss": -26.349552154541016, "global_step": 328901, "epoch": 3962} {"train_loss": -26.22608757019043, "global_step": 328902, "epoch": 3962} {"train_loss": -25.289886474609375, "global_step": 328903, "epoch": 3962} {"train_loss": -25.282838821411133, "global_step": 328904, "epoch": 3962} {"train_loss": -25.110300064086914, "global_step": 328905, "epoch": 3962} {"train_loss": -25.425846099853516, "global_step": 328906, "epoch": 3962} {"train_loss": -25.7806396484375, "global_step": 328907, "epoch": 3962} {"train_loss": -25.765060424804688, "global_step": 328908, "epoch": 3962} {"train_loss": -25.805328369140625, "global_step": 328909, "epoch": 3962} {"train_loss": -26.089069366455078, "global_step": 328910, "epoch": 3962} {"train_loss": -25.95867919921875, "global_step": 328911, "epoch": 3962} {"train_loss": -25.928070068359375, "global_step": 328912, "epoch": 3962} {"train_loss": -25.788488388061523, "global_step": 328913, "epoch": 3962} {"train_loss": -26.03668785095215, "global_step": 328914, "epoch": 3962} {"train_loss": -25.646530151367188, "global_step": 328915, "epoch": 3962} {"train_loss": -25.710235595703125, "global_step": 328916, "epoch": 3962} {"train_loss": -26.128507614135742, "global_step": 328917, "epoch": 3962} {"train_loss": -25.539731979370117, "global_step": 328918, "epoch": 3962} {"train_loss": -26.041736602783203, "global_step": 328919, "epoch": 3962} {"train_loss": -25.9420108795166, "global_step": 328920, "epoch": 3962} {"train_loss": -25.84731101989746, "global_step": 328921, "epoch": 3962} {"train_loss": -25.705432891845703, "global_step": 328922, "epoch": 3962} {"train_loss": -25.87216567993164, "global_step": 328923, "epoch": 3962} {"train_loss": -25.498626708984375, "global_step": 328924, "epoch": 3962} {"train_loss": -25.51167869567871, "global_step": 328925, "epoch": 3962} {"train_loss": -25.723230361938477, "global_step": 328926, "epoch": 3962} {"train_loss": -26.091022491455078, "global_step": 328927, "epoch": 3962} {"train_loss": -25.763731577310217, "global_step": 328928, "epoch": 3962, "val_loss": 7248831.0} {"train_loss": -25.491931915283203, "global_step": 328929, "epoch": 3963} {"train_loss": -24.989477157592773, "global_step": 328930, "epoch": 3963} {"train_loss": -25.462642669677734, "global_step": 328931, "epoch": 3963} {"train_loss": -25.21077537536621, "global_step": 328932, "epoch": 3963} {"train_loss": -25.537206649780273, "global_step": 328933, "epoch": 3963} {"train_loss": -25.349441528320312, "global_step": 328934, "epoch": 3963} {"train_loss": -25.542190551757812, "global_step": 328935, "epoch": 3963} {"train_loss": -25.611221313476562, "global_step": 328936, "epoch": 3963} {"train_loss": -25.26832389831543, "global_step": 328937, "epoch": 3963} {"train_loss": -25.97284507751465, "global_step": 328938, "epoch": 3963} {"train_loss": -25.547870635986328, "global_step": 328939, "epoch": 3963} {"train_loss": -25.853681564331055, "global_step": 328940, "epoch": 3963} {"train_loss": -25.743310928344727, "global_step": 328941, "epoch": 3963} {"train_loss": -25.685489654541016, "global_step": 328942, "epoch": 3963} {"train_loss": -25.3894100189209, "global_step": 328943, "epoch": 3963} {"train_loss": -25.430500030517578, "global_step": 328944, "epoch": 3963} {"train_loss": -25.48738670349121, "global_step": 328945, "epoch": 3963} {"train_loss": -25.894811630249023, "global_step": 328946, "epoch": 3963} {"train_loss": -25.733762741088867, "global_step": 328947, "epoch": 3963} {"train_loss": -25.60407066345215, "global_step": 328948, "epoch": 3963} {"train_loss": -25.58218002319336, "global_step": 328949, "epoch": 3963} {"train_loss": -25.987512588500977, "global_step": 328950, "epoch": 3963} {"train_loss": -25.937606811523438, "global_step": 328951, "epoch": 3963} {"train_loss": -26.162052154541016, "global_step": 328952, "epoch": 3963} {"train_loss": -25.87733268737793, "global_step": 328953, "epoch": 3963} {"train_loss": -25.942123413085938, "global_step": 328954, "epoch": 3963} {"train_loss": -25.86669921875, "global_step": 328955, "epoch": 3963} {"train_loss": -26.109861373901367, "global_step": 328956, "epoch": 3963} {"train_loss": -25.731586456298828, "global_step": 328957, "epoch": 3963} {"train_loss": -26.102231979370117, "global_step": 328958, "epoch": 3963} {"train_loss": -25.722522735595703, "global_step": 328959, "epoch": 3963} {"train_loss": -26.141666412353516, "global_step": 328960, "epoch": 3963} {"train_loss": -26.115705490112305, "global_step": 328961, "epoch": 3963} {"train_loss": -26.105213165283203, "global_step": 328962, "epoch": 3963} {"train_loss": -25.886438369750977, "global_step": 328963, "epoch": 3963} {"train_loss": -25.86195945739746, "global_step": 328964, "epoch": 3963} {"train_loss": -25.833282470703125, "global_step": 328965, "epoch": 3963} {"train_loss": -26.029279708862305, "global_step": 328966, "epoch": 3963} {"train_loss": -26.084753036499023, "global_step": 328967, "epoch": 3963} {"train_loss": -26.010480880737305, "global_step": 328968, "epoch": 3963} {"train_loss": -26.026330947875977, "global_step": 328969, "epoch": 3963} {"train_loss": -26.071996688842773, "global_step": 328970, "epoch": 3963} {"train_loss": -25.882841110229492, "global_step": 328971, "epoch": 3963} {"train_loss": -25.903913497924805, "global_step": 328972, "epoch": 3963} {"train_loss": -25.969526290893555, "global_step": 328973, "epoch": 3963} {"train_loss": -25.913070678710938, "global_step": 328974, "epoch": 3963} {"train_loss": -26.39911460876465, "global_step": 328975, "epoch": 3963} {"train_loss": -26.290876388549805, "global_step": 328976, "epoch": 3963} {"train_loss": -25.895788192749023, "global_step": 328977, "epoch": 3963} {"train_loss": -26.460693359375, "global_step": 328978, "epoch": 3963} {"train_loss": -26.34263038635254, "global_step": 328979, "epoch": 3963} {"train_loss": -25.93131446838379, "global_step": 328980, "epoch": 3963} {"train_loss": -26.04697036743164, "global_step": 328981, "epoch": 3963} {"train_loss": -25.940210342407227, "global_step": 328982, "epoch": 3963} {"train_loss": -25.945032119750977, "global_step": 328983, "epoch": 3963} {"train_loss": -25.779495239257812, "global_step": 328984, "epoch": 3963} {"train_loss": -25.667638778686523, "global_step": 328985, "epoch": 3963} {"train_loss": -25.95806312561035, "global_step": 328986, "epoch": 3963} {"train_loss": -26.309524536132812, "global_step": 328987, "epoch": 3963} {"train_loss": -26.1270694732666, "global_step": 328988, "epoch": 3963} {"train_loss": -25.76163673400879, "global_step": 328989, "epoch": 3963} {"train_loss": -25.814910888671875, "global_step": 328990, "epoch": 3963} {"train_loss": -26.034650802612305, "global_step": 328991, "epoch": 3963} {"train_loss": -26.13413429260254, "global_step": 328992, "epoch": 3963} {"train_loss": -26.047250747680664, "global_step": 328993, "epoch": 3963} {"train_loss": -25.923181533813477, "global_step": 328994, "epoch": 3963} {"train_loss": -26.12824821472168, "global_step": 328995, "epoch": 3963} {"train_loss": -26.07391357421875, "global_step": 328996, "epoch": 3963} {"train_loss": -25.928144454956055, "global_step": 328997, "epoch": 3963} {"train_loss": -26.133771896362305, "global_step": 328998, "epoch": 3963} {"train_loss": -26.040857315063477, "global_step": 328999, "epoch": 3963} {"train_loss": -26.25079917907715, "global_step": 329000, "epoch": 3963} {"train_loss": -25.93595314025879, "global_step": 329001, "epoch": 3963} {"train_loss": -26.201547622680664, "global_step": 329002, "epoch": 3963} {"train_loss": -26.028594970703125, "global_step": 329003, "epoch": 3963} {"train_loss": -25.8518009185791, "global_step": 329004, "epoch": 3963} {"train_loss": -26.063657760620117, "global_step": 329005, "epoch": 3963} {"train_loss": -26.0892276763916, "global_step": 329006, "epoch": 3963} {"train_loss": -25.99452781677246, "global_step": 329007, "epoch": 3963} {"train_loss": -25.909521102905273, "global_step": 329008, "epoch": 3963} {"train_loss": -26.088592529296875, "global_step": 329009, "epoch": 3963} {"train_loss": -26.211774826049805, "global_step": 329010, "epoch": 3963} {"train_loss": -25.870327777173145, "global_step": 329011, "epoch": 3963, "val_loss": 7120394.0} {"train_loss": -24.351181030273438, "global_step": 329012, "epoch": 3964} {"train_loss": -24.378616333007812, "global_step": 329013, "epoch": 3964} {"train_loss": -25.173887252807617, "global_step": 329014, "epoch": 3964} {"train_loss": -24.976572036743164, "global_step": 329015, "epoch": 3964} {"train_loss": -24.924171447753906, "global_step": 329016, "epoch": 3964} {"train_loss": -25.017431259155273, "global_step": 329017, "epoch": 3964} {"train_loss": -25.484437942504883, "global_step": 329018, "epoch": 3964} {"train_loss": -24.791635513305664, "global_step": 329019, "epoch": 3964} {"train_loss": -25.578800201416016, "global_step": 329020, "epoch": 3964} {"train_loss": -25.014408111572266, "global_step": 329021, "epoch": 3964} {"train_loss": -25.312273025512695, "global_step": 329022, "epoch": 3964} {"train_loss": -25.066280364990234, "global_step": 329023, "epoch": 3964} {"train_loss": -25.38393783569336, "global_step": 329024, "epoch": 3964} {"train_loss": -25.612293243408203, "global_step": 329025, "epoch": 3964} {"train_loss": -25.54849624633789, "global_step": 329026, "epoch": 3964} {"train_loss": -25.631103515625, "global_step": 329027, "epoch": 3964} {"train_loss": -25.51997947692871, "global_step": 329028, "epoch": 3964} {"train_loss": -25.78753089904785, "global_step": 329029, "epoch": 3964} {"train_loss": -25.6215763092041, "global_step": 329030, "epoch": 3964} {"train_loss": -25.48611831665039, "global_step": 329031, "epoch": 3964} {"train_loss": -26.037939071655273, "global_step": 329032, "epoch": 3964} {"train_loss": -25.26972770690918, "global_step": 329033, "epoch": 3964} {"train_loss": -25.487051010131836, "global_step": 329034, "epoch": 3964} {"train_loss": -25.4901065826416, "global_step": 329035, "epoch": 3964} {"train_loss": -25.673690795898438, "global_step": 329036, "epoch": 3964} {"train_loss": -25.43783187866211, "global_step": 329037, "epoch": 3964} {"train_loss": -25.6698055267334, "global_step": 329038, "epoch": 3964} {"train_loss": -25.736448287963867, "global_step": 329039, "epoch": 3964} {"train_loss": -25.707305908203125, "global_step": 329040, "epoch": 3964} {"train_loss": -25.758533477783203, "global_step": 329041, "epoch": 3964} {"train_loss": -25.668521881103516, "global_step": 329042, "epoch": 3964} {"train_loss": -25.749860763549805, "global_step": 329043, "epoch": 3964} {"train_loss": -26.050537109375, "global_step": 329044, "epoch": 3964} {"train_loss": -26.1782169342041, "global_step": 329045, "epoch": 3964} {"train_loss": -26.083541870117188, "global_step": 329046, "epoch": 3964} {"train_loss": -26.009021759033203, "global_step": 329047, "epoch": 3964} {"train_loss": -25.807880401611328, "global_step": 329048, "epoch": 3964} {"train_loss": -25.689298629760742, "global_step": 329049, "epoch": 3964} {"train_loss": -26.051300048828125, "global_step": 329050, "epoch": 3964} {"train_loss": -26.147924423217773, "global_step": 329051, "epoch": 3964} {"train_loss": -25.91999626159668, "global_step": 329052, "epoch": 3964} {"train_loss": -26.16145133972168, "global_step": 329053, "epoch": 3964} {"train_loss": -26.077392578125, "global_step": 329054, "epoch": 3964} {"train_loss": -26.26420021057129, "global_step": 329055, "epoch": 3964} {"train_loss": -26.134765625, "global_step": 329056, "epoch": 3964} {"train_loss": -26.0682430267334, "global_step": 329057, "epoch": 3964} {"train_loss": -26.155044555664062, "global_step": 329058, "epoch": 3964} {"train_loss": -25.84124755859375, "global_step": 329059, "epoch": 3964} {"train_loss": -25.931751251220703, "global_step": 329060, "epoch": 3964} {"train_loss": -25.937576293945312, "global_step": 329061, "epoch": 3964} {"train_loss": -25.976465225219727, "global_step": 329062, "epoch": 3964} {"train_loss": -25.83051109313965, "global_step": 329063, "epoch": 3964} {"train_loss": -25.88691520690918, "global_step": 329064, "epoch": 3964} {"train_loss": -25.8925838470459, "global_step": 329065, "epoch": 3964} {"train_loss": -25.960248947143555, "global_step": 329066, "epoch": 3964} {"train_loss": -25.6641845703125, "global_step": 329067, "epoch": 3964} {"train_loss": -26.089492797851562, "global_step": 329068, "epoch": 3964} {"train_loss": -25.954456329345703, "global_step": 329069, "epoch": 3964} {"train_loss": -25.860427856445312, "global_step": 329070, "epoch": 3964} {"train_loss": -26.226999282836914, "global_step": 329071, "epoch": 3964} {"train_loss": -26.180845260620117, "global_step": 329072, "epoch": 3964} {"train_loss": -26.205793380737305, "global_step": 329073, "epoch": 3964} {"train_loss": -25.945905685424805, "global_step": 329074, "epoch": 3964} {"train_loss": -25.69928550720215, "global_step": 329075, "epoch": 3964} {"train_loss": -26.1579532623291, "global_step": 329076, "epoch": 3964} {"train_loss": -26.050146102905273, "global_step": 329077, "epoch": 3964} {"train_loss": -26.351613998413086, "global_step": 329078, "epoch": 3964} {"train_loss": -25.952138900756836, "global_step": 329079, "epoch": 3964} {"train_loss": -26.2945499420166, "global_step": 329080, "epoch": 3964} {"train_loss": -25.992462158203125, "global_step": 329081, "epoch": 3964} {"train_loss": -25.90388298034668, "global_step": 329082, "epoch": 3964} {"train_loss": -25.7121524810791, "global_step": 329083, "epoch": 3964} {"train_loss": -26.083972930908203, "global_step": 329084, "epoch": 3964} {"train_loss": -26.372360229492188, "global_step": 329085, "epoch": 3964} {"train_loss": -26.07184410095215, "global_step": 329086, "epoch": 3964} {"train_loss": -26.316638946533203, "global_step": 329087, "epoch": 3964} {"train_loss": -26.21436882019043, "global_step": 329088, "epoch": 3964} {"train_loss": -26.5892391204834, "global_step": 329089, "epoch": 3964} {"train_loss": -25.874292373657227, "global_step": 329090, "epoch": 3964} {"train_loss": -26.0115909576416, "global_step": 329091, "epoch": 3964} {"train_loss": -26.358325958251953, "global_step": 329092, "epoch": 3964} {"train_loss": -26.18947410583496, "global_step": 329093, "epoch": 3964} {"train_loss": -25.793268387576184, "global_step": 329094, "epoch": 3964, "val_loss": 7270494.5} {"train_loss": -24.728456497192383, "global_step": 329095, "epoch": 3965} {"train_loss": -24.83424186706543, "global_step": 329096, "epoch": 3965} {"train_loss": -25.432058334350586, "global_step": 329097, "epoch": 3965} {"train_loss": -25.051605224609375, "global_step": 329098, "epoch": 3965} {"train_loss": -25.21234130859375, "global_step": 329099, "epoch": 3965} {"train_loss": -25.368947982788086, "global_step": 329100, "epoch": 3965} {"train_loss": -25.270231246948242, "global_step": 329101, "epoch": 3965} {"train_loss": -25.29373550415039, "global_step": 329102, "epoch": 3965} {"train_loss": -25.52920913696289, "global_step": 329103, "epoch": 3965} {"train_loss": -25.26862335205078, "global_step": 329104, "epoch": 3965} {"train_loss": -25.28840446472168, "global_step": 329105, "epoch": 3965} {"train_loss": -25.26078224182129, "global_step": 329106, "epoch": 3965} {"train_loss": -25.330738067626953, "global_step": 329107, "epoch": 3965} {"train_loss": -25.842529296875, "global_step": 329108, "epoch": 3965} {"train_loss": -25.9443416595459, "global_step": 329109, "epoch": 3965} {"train_loss": -25.137723922729492, "global_step": 329110, "epoch": 3965} {"train_loss": -26.0319881439209, "global_step": 329111, "epoch": 3965} {"train_loss": -26.007566452026367, "global_step": 329112, "epoch": 3965} {"train_loss": -25.801122665405273, "global_step": 329113, "epoch": 3965} {"train_loss": -25.549476623535156, "global_step": 329114, "epoch": 3965} {"train_loss": -25.875717163085938, "global_step": 329115, "epoch": 3965} {"train_loss": -25.53720474243164, "global_step": 329116, "epoch": 3965} {"train_loss": -25.628448486328125, "global_step": 329117, "epoch": 3965} {"train_loss": -25.7247314453125, "global_step": 329118, "epoch": 3965} {"train_loss": -25.731470108032227, "global_step": 329119, "epoch": 3965} {"train_loss": -25.659372329711914, "global_step": 329120, "epoch": 3965} {"train_loss": -25.96365737915039, "global_step": 329121, "epoch": 3965} {"train_loss": -25.540855407714844, "global_step": 329122, "epoch": 3965} {"train_loss": -26.08416175842285, "global_step": 329123, "epoch": 3965} {"train_loss": -25.9890079498291, "global_step": 329124, "epoch": 3965} {"train_loss": -25.628494262695312, "global_step": 329125, "epoch": 3965} {"train_loss": -26.152759552001953, "global_step": 329126, "epoch": 3965} {"train_loss": -25.861722946166992, "global_step": 329127, "epoch": 3965} {"train_loss": -25.946155548095703, "global_step": 329128, "epoch": 3965} {"train_loss": -26.03705406188965, "global_step": 329129, "epoch": 3965} {"train_loss": -25.886844635009766, "global_step": 329130, "epoch": 3965} {"train_loss": -26.039432525634766, "global_step": 329131, "epoch": 3965} {"train_loss": -26.327823638916016, "global_step": 329132, "epoch": 3965} {"train_loss": -26.052509307861328, "global_step": 329133, "epoch": 3965} {"train_loss": -26.23185157775879, "global_step": 329134, "epoch": 3965} {"train_loss": -25.91529655456543, "global_step": 329135, "epoch": 3965} {"train_loss": -26.198474884033203, "global_step": 329136, "epoch": 3965} {"train_loss": -25.43118667602539, "global_step": 329137, "epoch": 3965} {"train_loss": -25.91743278503418, "global_step": 329138, "epoch": 3965} {"train_loss": -26.081762313842773, "global_step": 329139, "epoch": 3965} {"train_loss": -26.24065589904785, "global_step": 329140, "epoch": 3965} {"train_loss": -25.9294490814209, "global_step": 329141, "epoch": 3965} {"train_loss": -26.086444854736328, "global_step": 329142, "epoch": 3965} {"train_loss": -25.764984130859375, "global_step": 329143, "epoch": 3965} {"train_loss": -26.317991256713867, "global_step": 329144, "epoch": 3965} {"train_loss": -25.665807723999023, "global_step": 329145, "epoch": 3965} {"train_loss": -26.122955322265625, "global_step": 329146, "epoch": 3965} {"train_loss": -25.981977462768555, "global_step": 329147, "epoch": 3965} {"train_loss": -25.6072998046875, "global_step": 329148, "epoch": 3965} {"train_loss": -25.90643882751465, "global_step": 329149, "epoch": 3965} {"train_loss": -26.414779663085938, "global_step": 329150, "epoch": 3965} {"train_loss": -25.885435104370117, "global_step": 329151, "epoch": 3965} {"train_loss": -26.266454696655273, "global_step": 329152, "epoch": 3965} {"train_loss": -25.657001495361328, "global_step": 329153, "epoch": 3965} {"train_loss": -26.060510635375977, "global_step": 329154, "epoch": 3965} {"train_loss": -26.08469581604004, "global_step": 329155, "epoch": 3965} {"train_loss": -25.8570499420166, "global_step": 329156, "epoch": 3965} {"train_loss": -26.118560791015625, "global_step": 329157, "epoch": 3965} {"train_loss": -25.7883243560791, "global_step": 329158, "epoch": 3965} {"train_loss": -26.107709884643555, "global_step": 329159, "epoch": 3965} {"train_loss": -25.993986129760742, "global_step": 329160, "epoch": 3965} {"train_loss": -26.186527252197266, "global_step": 329161, "epoch": 3965} {"train_loss": -26.031967163085938, "global_step": 329162, "epoch": 3965} {"train_loss": -26.023019790649414, "global_step": 329163, "epoch": 3965} {"train_loss": -26.011030197143555, "global_step": 329164, "epoch": 3965} {"train_loss": -26.030303955078125, "global_step": 329165, "epoch": 3965} {"train_loss": -25.6562557220459, "global_step": 329166, "epoch": 3965} {"train_loss": -25.99308204650879, "global_step": 329167, "epoch": 3965} {"train_loss": -25.699926376342773, "global_step": 329168, "epoch": 3965} {"train_loss": -25.64434242248535, "global_step": 329169, "epoch": 3965} {"train_loss": -26.338586807250977, "global_step": 329170, "epoch": 3965} {"train_loss": -26.07736587524414, "global_step": 329171, "epoch": 3965} {"train_loss": -26.432926177978516, "global_step": 329172, "epoch": 3965} {"train_loss": -25.95911979675293, "global_step": 329173, "epoch": 3965} {"train_loss": -26.048004150390625, "global_step": 329174, "epoch": 3965} {"train_loss": -26.327356338500977, "global_step": 329175, "epoch": 3965} {"train_loss": -26.392108917236328, "global_step": 329176, "epoch": 3965} {"train_loss": -25.834190391632447, "global_step": 329177, "epoch": 3965, "val_loss": 7170912.0} {"train_loss": -24.51734161376953, "global_step": 329178, "epoch": 3966} {"train_loss": -25.62891960144043, "global_step": 329179, "epoch": 3966} {"train_loss": -25.213815689086914, "global_step": 329180, "epoch": 3966} {"train_loss": -24.77147102355957, "global_step": 329181, "epoch": 3966} {"train_loss": -25.40281105041504, "global_step": 329182, "epoch": 3966} {"train_loss": -25.446720123291016, "global_step": 329183, "epoch": 3966} {"train_loss": -25.185260772705078, "global_step": 329184, "epoch": 3966} {"train_loss": -25.48430824279785, "global_step": 329185, "epoch": 3966} {"train_loss": -25.250457763671875, "global_step": 329186, "epoch": 3966} {"train_loss": -25.385574340820312, "global_step": 329187, "epoch": 3966} {"train_loss": -25.52150535583496, "global_step": 329188, "epoch": 3966} {"train_loss": -25.624425888061523, "global_step": 329189, "epoch": 3966} {"train_loss": -25.53922462463379, "global_step": 329190, "epoch": 3966} {"train_loss": -25.5489559173584, "global_step": 329191, "epoch": 3966} {"train_loss": -25.4200496673584, "global_step": 329192, "epoch": 3966} {"train_loss": -25.7578182220459, "global_step": 329193, "epoch": 3966} {"train_loss": -25.546573638916016, "global_step": 329194, "epoch": 3966} {"train_loss": -25.879953384399414, "global_step": 329195, "epoch": 3966} {"train_loss": -25.9935359954834, "global_step": 329196, "epoch": 3966} {"train_loss": -25.23528480529785, "global_step": 329197, "epoch": 3966} {"train_loss": -25.53822135925293, "global_step": 329198, "epoch": 3966} {"train_loss": -25.71597671508789, "global_step": 329199, "epoch": 3966} {"train_loss": -25.926837921142578, "global_step": 329200, "epoch": 3966} {"train_loss": -25.712604522705078, "global_step": 329201, "epoch": 3966} {"train_loss": -25.845670700073242, "global_step": 329202, "epoch": 3966} {"train_loss": -25.903247833251953, "global_step": 329203, "epoch": 3966} {"train_loss": -25.8963680267334, "global_step": 329204, "epoch": 3966} {"train_loss": -26.246007919311523, "global_step": 329205, "epoch": 3966} {"train_loss": -25.68169593811035, "global_step": 329206, "epoch": 3966} {"train_loss": -25.747114181518555, "global_step": 329207, "epoch": 3966} {"train_loss": -25.983449935913086, "global_step": 329208, "epoch": 3966} {"train_loss": -25.9444580078125, "global_step": 329209, "epoch": 3966} {"train_loss": -25.754568099975586, "global_step": 329210, "epoch": 3966} {"train_loss": -26.085437774658203, "global_step": 329211, "epoch": 3966} {"train_loss": -26.076948165893555, "global_step": 329212, "epoch": 3966} {"train_loss": -25.989776611328125, "global_step": 329213, "epoch": 3966} {"train_loss": -26.004064559936523, "global_step": 329214, "epoch": 3966} {"train_loss": -25.960981369018555, "global_step": 329215, "epoch": 3966} {"train_loss": -25.813068389892578, "global_step": 329216, "epoch": 3966} {"train_loss": -26.18293571472168, "global_step": 329217, "epoch": 3966} {"train_loss": -26.304595947265625, "global_step": 329218, "epoch": 3966} {"train_loss": -26.33169937133789, "global_step": 329219, "epoch": 3966} {"train_loss": -26.007843017578125, "global_step": 329220, "epoch": 3966} {"train_loss": -26.021337509155273, "global_step": 329221, "epoch": 3966} {"train_loss": -26.272796630859375, "global_step": 329222, "epoch": 3966} {"train_loss": -25.8580265045166, "global_step": 329223, "epoch": 3966} {"train_loss": -26.374988555908203, "global_step": 329224, "epoch": 3966} {"train_loss": -25.930139541625977, "global_step": 329225, "epoch": 3966} {"train_loss": -26.067651748657227, "global_step": 329226, "epoch": 3966} {"train_loss": -25.752134323120117, "global_step": 329227, "epoch": 3966} {"train_loss": -26.03130531311035, "global_step": 329228, "epoch": 3966} {"train_loss": -26.077468872070312, "global_step": 329229, "epoch": 3966} {"train_loss": -26.08205223083496, "global_step": 329230, "epoch": 3966} {"train_loss": -25.73223876953125, "global_step": 329231, "epoch": 3966} {"train_loss": -26.166242599487305, "global_step": 329232, "epoch": 3966} {"train_loss": -25.51187515258789, "global_step": 329233, "epoch": 3966} {"train_loss": -25.420392990112305, "global_step": 329234, "epoch": 3966} {"train_loss": -25.979339599609375, "global_step": 329235, "epoch": 3966} {"train_loss": -26.094167709350586, "global_step": 329236, "epoch": 3966} {"train_loss": -25.851926803588867, "global_step": 329237, "epoch": 3966} {"train_loss": -25.985074996948242, "global_step": 329238, "epoch": 3966} {"train_loss": -26.02589225769043, "global_step": 329239, "epoch": 3966} {"train_loss": -25.909082412719727, "global_step": 329240, "epoch": 3966} {"train_loss": -25.974090576171875, "global_step": 329241, "epoch": 3966} {"train_loss": -26.021345138549805, "global_step": 329242, "epoch": 3966} {"train_loss": -26.1453857421875, "global_step": 329243, "epoch": 3966} {"train_loss": -25.991846084594727, "global_step": 329244, "epoch": 3966} {"train_loss": -25.865646362304688, "global_step": 329245, "epoch": 3966} {"train_loss": -25.911853790283203, "global_step": 329246, "epoch": 3966} {"train_loss": -26.068761825561523, "global_step": 329247, "epoch": 3966} {"train_loss": -25.944263458251953, "global_step": 329248, "epoch": 3966} {"train_loss": -25.731733322143555, "global_step": 329249, "epoch": 3966} {"train_loss": -26.1839599609375, "global_step": 329250, "epoch": 3966} {"train_loss": -25.66864585876465, "global_step": 329251, "epoch": 3966} {"train_loss": -26.041669845581055, "global_step": 329252, "epoch": 3966} {"train_loss": -26.116565704345703, "global_step": 329253, "epoch": 3966} {"train_loss": -25.825641632080078, "global_step": 329254, "epoch": 3966} {"train_loss": -26.32122230529785, "global_step": 329255, "epoch": 3966} {"train_loss": -25.649423599243164, "global_step": 329256, "epoch": 3966} {"train_loss": -26.463537216186523, "global_step": 329257, "epoch": 3966} {"train_loss": -25.981983184814453, "global_step": 329258, "epoch": 3966} {"train_loss": -25.912403106689453, "global_step": 329259, "epoch": 3966} {"train_loss": -25.83436182320836, "global_step": 329260, "epoch": 3966, "val_loss": 7152334.5} {"train_loss": -25.864316940307617, "global_step": 329261, "epoch": 3967} {"train_loss": -25.94862174987793, "global_step": 329262, "epoch": 3967} {"train_loss": -25.477670669555664, "global_step": 329263, "epoch": 3967} {"train_loss": -25.522016525268555, "global_step": 329264, "epoch": 3967} {"train_loss": -25.63566017150879, "global_step": 329265, "epoch": 3967} {"train_loss": -25.720388412475586, "global_step": 329266, "epoch": 3967} {"train_loss": -25.732481002807617, "global_step": 329267, "epoch": 3967} {"train_loss": -25.698654174804688, "global_step": 329268, "epoch": 3967} {"train_loss": -25.963041305541992, "global_step": 329269, "epoch": 3967} {"train_loss": -25.75044822692871, "global_step": 329270, "epoch": 3967} {"train_loss": -25.774478912353516, "global_step": 329271, "epoch": 3967} {"train_loss": -25.602991104125977, "global_step": 329272, "epoch": 3967} {"train_loss": -25.97456169128418, "global_step": 329273, "epoch": 3967} {"train_loss": -25.55122947692871, "global_step": 329274, "epoch": 3967} {"train_loss": -25.903547286987305, "global_step": 329275, "epoch": 3967} {"train_loss": -25.54952049255371, "global_step": 329276, "epoch": 3967} {"train_loss": -26.011499404907227, "global_step": 329277, "epoch": 3967} {"train_loss": -25.937549591064453, "global_step": 329278, "epoch": 3967} {"train_loss": -26.242862701416016, "global_step": 329279, "epoch": 3967} {"train_loss": -25.759784698486328, "global_step": 329280, "epoch": 3967} {"train_loss": -25.927343368530273, "global_step": 329281, "epoch": 3967} {"train_loss": -26.083520889282227, "global_step": 329282, "epoch": 3967} {"train_loss": -26.033002853393555, "global_step": 329283, "epoch": 3967} {"train_loss": -26.205121994018555, "global_step": 329284, "epoch": 3967} {"train_loss": -26.2591495513916, "global_step": 329285, "epoch": 3967} {"train_loss": -25.867338180541992, "global_step": 329286, "epoch": 3967} {"train_loss": -25.81293296813965, "global_step": 329287, "epoch": 3967} {"train_loss": -25.846887588500977, "global_step": 329288, "epoch": 3967} {"train_loss": -25.96478843688965, "global_step": 329289, "epoch": 3967} {"train_loss": -26.065387725830078, "global_step": 329290, "epoch": 3967} {"train_loss": -26.047697067260742, "global_step": 329291, "epoch": 3967} {"train_loss": -26.097244262695312, "global_step": 329292, "epoch": 3967} {"train_loss": -26.05780029296875, "global_step": 329293, "epoch": 3967} {"train_loss": -25.96533203125, "global_step": 329294, "epoch": 3967} {"train_loss": -25.774301528930664, "global_step": 329295, "epoch": 3967} {"train_loss": -25.849912643432617, "global_step": 329296, "epoch": 3967} {"train_loss": -26.12257194519043, "global_step": 329297, "epoch": 3967} {"train_loss": -25.918928146362305, "global_step": 329298, "epoch": 3967} {"train_loss": -26.075666427612305, "global_step": 329299, "epoch": 3967} {"train_loss": -26.290164947509766, "global_step": 329300, "epoch": 3967} {"train_loss": -25.803205490112305, "global_step": 329301, "epoch": 3967} {"train_loss": -25.922155380249023, "global_step": 329302, "epoch": 3967} {"train_loss": -25.32498550415039, "global_step": 329303, "epoch": 3967} {"train_loss": -25.749006271362305, "global_step": 329304, "epoch": 3967} {"train_loss": -26.057260513305664, "global_step": 329305, "epoch": 3967} {"train_loss": -25.841827392578125, "global_step": 329306, "epoch": 3967} {"train_loss": -25.641788482666016, "global_step": 329307, "epoch": 3967} {"train_loss": -25.739622116088867, "global_step": 329308, "epoch": 3967} {"train_loss": -25.7686767578125, "global_step": 329309, "epoch": 3967} {"train_loss": -26.158090591430664, "global_step": 329310, "epoch": 3967} {"train_loss": -26.144628524780273, "global_step": 329311, "epoch": 3967} {"train_loss": -25.958789825439453, "global_step": 329312, "epoch": 3967} {"train_loss": -25.732763290405273, "global_step": 329313, "epoch": 3967} {"train_loss": -25.908283233642578, "global_step": 329314, "epoch": 3967} {"train_loss": -26.0836181640625, "global_step": 329315, "epoch": 3967} {"train_loss": -26.227264404296875, "global_step": 329316, "epoch": 3967} {"train_loss": -25.628768920898438, "global_step": 329317, "epoch": 3967} {"train_loss": -25.71844482421875, "global_step": 329318, "epoch": 3967} {"train_loss": -26.05866050720215, "global_step": 329319, "epoch": 3967} {"train_loss": -25.905832290649414, "global_step": 329320, "epoch": 3967} {"train_loss": -26.29937744140625, "global_step": 329321, "epoch": 3967} {"train_loss": -25.95234489440918, "global_step": 329322, "epoch": 3967} {"train_loss": -26.177839279174805, "global_step": 329323, "epoch": 3967} {"train_loss": -26.117395401000977, "global_step": 329324, "epoch": 3967} {"train_loss": -25.886999130249023, "global_step": 329325, "epoch": 3967} {"train_loss": -25.85791015625, "global_step": 329326, "epoch": 3967} {"train_loss": -26.21429443359375, "global_step": 329327, "epoch": 3967} {"train_loss": -26.0321044921875, "global_step": 329328, "epoch": 3967} {"train_loss": -25.989322662353516, "global_step": 329329, "epoch": 3967} {"train_loss": -26.0811824798584, "global_step": 329330, "epoch": 3967} {"train_loss": -26.133895874023438, "global_step": 329331, "epoch": 3967} {"train_loss": -26.194860458374023, "global_step": 329332, "epoch": 3967} {"train_loss": -26.026248931884766, "global_step": 329333, "epoch": 3967} {"train_loss": -25.851659774780273, "global_step": 329334, "epoch": 3967} {"train_loss": -25.948453903198242, "global_step": 329335, "epoch": 3967} {"train_loss": -26.244226455688477, "global_step": 329336, "epoch": 3967} {"train_loss": -26.379663467407227, "global_step": 329337, "epoch": 3967} {"train_loss": -25.574369430541992, "global_step": 329338, "epoch": 3967} {"train_loss": -25.717267990112305, "global_step": 329339, "epoch": 3967} {"train_loss": -26.16151237487793, "global_step": 329340, "epoch": 3967} {"train_loss": -26.006200790405273, "global_step": 329341, "epoch": 3967} {"train_loss": -26.10494041442871, "global_step": 329342, "epoch": 3967} {"train_loss": -25.93031000803752, "global_step": 329343, "epoch": 3967, "val_loss": 7304551.0} {"train_loss": -26.008380889892578, "global_step": 329344, "epoch": 3968} {"train_loss": -25.353561401367188, "global_step": 329345, "epoch": 3968} {"train_loss": -25.060686111450195, "global_step": 329346, "epoch": 3968} {"train_loss": -25.553205490112305, "global_step": 329347, "epoch": 3968} {"train_loss": -24.66257095336914, "global_step": 329348, "epoch": 3968} {"train_loss": -25.186166763305664, "global_step": 329349, "epoch": 3968} {"train_loss": -24.709089279174805, "global_step": 329350, "epoch": 3968} {"train_loss": -25.2359561920166, "global_step": 329351, "epoch": 3968} {"train_loss": -24.924152374267578, "global_step": 329352, "epoch": 3968} {"train_loss": -25.03240966796875, "global_step": 329353, "epoch": 3968} {"train_loss": -25.672449111938477, "global_step": 329354, "epoch": 3968} {"train_loss": -25.380252838134766, "global_step": 329355, "epoch": 3968} {"train_loss": -25.469623565673828, "global_step": 329356, "epoch": 3968} {"train_loss": -25.4913272857666, "global_step": 329357, "epoch": 3968} {"train_loss": -25.401233673095703, "global_step": 329358, "epoch": 3968} {"train_loss": -25.36455535888672, "global_step": 329359, "epoch": 3968} {"train_loss": -25.460418701171875, "global_step": 329360, "epoch": 3968} {"train_loss": -25.210378646850586, "global_step": 329361, "epoch": 3968} {"train_loss": -25.462430953979492, "global_step": 329362, "epoch": 3968} {"train_loss": -25.567901611328125, "global_step": 329363, "epoch": 3968} {"train_loss": -25.76007652282715, "global_step": 329364, "epoch": 3968} {"train_loss": -25.2304744720459, "global_step": 329365, "epoch": 3968} {"train_loss": -25.715539932250977, "global_step": 329366, "epoch": 3968} {"train_loss": -25.40117835998535, "global_step": 329367, "epoch": 3968} {"train_loss": -25.13681411743164, "global_step": 329368, "epoch": 3968} {"train_loss": -25.663610458374023, "global_step": 329369, "epoch": 3968} {"train_loss": -25.38481330871582, "global_step": 329370, "epoch": 3968} {"train_loss": -25.391016006469727, "global_step": 329371, "epoch": 3968} {"train_loss": -25.818933486938477, "global_step": 329372, "epoch": 3968} {"train_loss": -25.590787887573242, "global_step": 329373, "epoch": 3968} {"train_loss": -25.729206085205078, "global_step": 329374, "epoch": 3968} {"train_loss": -25.78925895690918, "global_step": 329375, "epoch": 3968} {"train_loss": -25.996366500854492, "global_step": 329376, "epoch": 3968} {"train_loss": -25.48093605041504, "global_step": 329377, "epoch": 3968} {"train_loss": -25.92792320251465, "global_step": 329378, "epoch": 3968} {"train_loss": -25.99835777282715, "global_step": 329379, "epoch": 3968} {"train_loss": -25.709503173828125, "global_step": 329380, "epoch": 3968} {"train_loss": -25.856903076171875, "global_step": 329381, "epoch": 3968} {"train_loss": -26.10652732849121, "global_step": 329382, "epoch": 3968} {"train_loss": -26.09742546081543, "global_step": 329383, "epoch": 3968} {"train_loss": -26.154199600219727, "global_step": 329384, "epoch": 3968} {"train_loss": -25.848987579345703, "global_step": 329385, "epoch": 3968} {"train_loss": -25.879484176635742, "global_step": 329386, "epoch": 3968} {"train_loss": -26.017499923706055, "global_step": 329387, "epoch": 3968} {"train_loss": -26.34796142578125, "global_step": 329388, "epoch": 3968} {"train_loss": -26.41639518737793, "global_step": 329389, "epoch": 3968} {"train_loss": -26.107091903686523, "global_step": 329390, "epoch": 3968} {"train_loss": -26.001779556274414, "global_step": 329391, "epoch": 3968} {"train_loss": -25.759876251220703, "global_step": 329392, "epoch": 3968} {"train_loss": -26.060333251953125, "global_step": 329393, "epoch": 3968} {"train_loss": -26.061655044555664, "global_step": 329394, "epoch": 3968} {"train_loss": -25.88532066345215, "global_step": 329395, "epoch": 3968} {"train_loss": -26.214765548706055, "global_step": 329396, "epoch": 3968} {"train_loss": -26.029571533203125, "global_step": 329397, "epoch": 3968} {"train_loss": -26.042285919189453, "global_step": 329398, "epoch": 3968} {"train_loss": -25.812768936157227, "global_step": 329399, "epoch": 3968} {"train_loss": -26.027374267578125, "global_step": 329400, "epoch": 3968} {"train_loss": -26.133893966674805, "global_step": 329401, "epoch": 3968} {"train_loss": -25.789859771728516, "global_step": 329402, "epoch": 3968} {"train_loss": -26.472095489501953, "global_step": 329403, "epoch": 3968} {"train_loss": -25.93770408630371, "global_step": 329404, "epoch": 3968} {"train_loss": -25.9366397857666, "global_step": 329405, "epoch": 3968} {"train_loss": -26.058969497680664, "global_step": 329406, "epoch": 3968} {"train_loss": -25.883472442626953, "global_step": 329407, "epoch": 3968} {"train_loss": -26.0084285736084, "global_step": 329408, "epoch": 3968} {"train_loss": -25.993274688720703, "global_step": 329409, "epoch": 3968} {"train_loss": -25.947797775268555, "global_step": 329410, "epoch": 3968} {"train_loss": -25.97222900390625, "global_step": 329411, "epoch": 3968} {"train_loss": -25.567073822021484, "global_step": 329412, "epoch": 3968} {"train_loss": -25.983993530273438, "global_step": 329413, "epoch": 3968} {"train_loss": -26.03977394104004, "global_step": 329414, "epoch": 3968} {"train_loss": -26.23211097717285, "global_step": 329415, "epoch": 3968} {"train_loss": -26.154541015625, "global_step": 329416, "epoch": 3968} {"train_loss": -26.270404815673828, "global_step": 329417, "epoch": 3968} {"train_loss": -25.8837833404541, "global_step": 329418, "epoch": 3968} {"train_loss": -25.94293212890625, "global_step": 329419, "epoch": 3968} {"train_loss": -25.75714683532715, "global_step": 329420, "epoch": 3968} {"train_loss": -25.654937744140625, "global_step": 329421, "epoch": 3968} {"train_loss": -25.754728317260742, "global_step": 329422, "epoch": 3968} {"train_loss": -26.007205963134766, "global_step": 329423, "epoch": 3968} {"train_loss": -25.627344131469727, "global_step": 329424, "epoch": 3968} {"train_loss": -26.025970458984375, "global_step": 329425, "epoch": 3968} {"train_loss": -25.758078035101832, "global_step": 329426, "epoch": 3968, "val_loss": 7218669.0} {"train_loss": -25.392478942871094, "global_step": 329427, "epoch": 3969} {"train_loss": -25.256515502929688, "global_step": 329428, "epoch": 3969} {"train_loss": -25.3372859954834, "global_step": 329429, "epoch": 3969} {"train_loss": -25.48848533630371, "global_step": 329430, "epoch": 3969} {"train_loss": -25.614782333374023, "global_step": 329431, "epoch": 3969} {"train_loss": -25.243371963500977, "global_step": 329432, "epoch": 3969} {"train_loss": -25.1057071685791, "global_step": 329433, "epoch": 3969} {"train_loss": -25.698835372924805, "global_step": 329434, "epoch": 3969} {"train_loss": -25.576866149902344, "global_step": 329435, "epoch": 3969} {"train_loss": -25.346017837524414, "global_step": 329436, "epoch": 3969} {"train_loss": -25.63372802734375, "global_step": 329437, "epoch": 3969} {"train_loss": -25.73382568359375, "global_step": 329438, "epoch": 3969} {"train_loss": -26.115407943725586, "global_step": 329439, "epoch": 3969} {"train_loss": -25.96649742126465, "global_step": 329440, "epoch": 3969} {"train_loss": -25.707416534423828, "global_step": 329441, "epoch": 3969} {"train_loss": -25.80109977722168, "global_step": 329442, "epoch": 3969} {"train_loss": -25.764759063720703, "global_step": 329443, "epoch": 3969} {"train_loss": -26.190353393554688, "global_step": 329444, "epoch": 3969} {"train_loss": -26.0517635345459, "global_step": 329445, "epoch": 3969} {"train_loss": -25.764423370361328, "global_step": 329446, "epoch": 3969} {"train_loss": -25.749164581298828, "global_step": 329447, "epoch": 3969} {"train_loss": -26.126882553100586, "global_step": 329448, "epoch": 3969} {"train_loss": -25.654035568237305, "global_step": 329449, "epoch": 3969} {"train_loss": -25.942167282104492, "global_step": 329450, "epoch": 3969} {"train_loss": -25.95020866394043, "global_step": 329451, "epoch": 3969} {"train_loss": -26.048460006713867, "global_step": 329452, "epoch": 3969} {"train_loss": -26.016300201416016, "global_step": 329453, "epoch": 3969} {"train_loss": -25.79737663269043, "global_step": 329454, "epoch": 3969} {"train_loss": -25.630781173706055, "global_step": 329455, "epoch": 3969} {"train_loss": -25.700891494750977, "global_step": 329456, "epoch": 3969} {"train_loss": -25.903644561767578, "global_step": 329457, "epoch": 3969} {"train_loss": -26.267724990844727, "global_step": 329458, "epoch": 3969} {"train_loss": -26.19308853149414, "global_step": 329459, "epoch": 3969} {"train_loss": -25.894804000854492, "global_step": 329460, "epoch": 3969} {"train_loss": -25.734289169311523, "global_step": 329461, "epoch": 3969} {"train_loss": -26.00507926940918, "global_step": 329462, "epoch": 3969} {"train_loss": -25.79432487487793, "global_step": 329463, "epoch": 3969} {"train_loss": -26.30462074279785, "global_step": 329464, "epoch": 3969} {"train_loss": -25.7567081451416, "global_step": 329465, "epoch": 3969} {"train_loss": -26.128034591674805, "global_step": 329466, "epoch": 3969} {"train_loss": -26.095239639282227, "global_step": 329467, "epoch": 3969} {"train_loss": -26.320728302001953, "global_step": 329468, "epoch": 3969} {"train_loss": -26.090499877929688, "global_step": 329469, "epoch": 3969} {"train_loss": -26.200061798095703, "global_step": 329470, "epoch": 3969} {"train_loss": -26.567916870117188, "global_step": 329471, "epoch": 3969} {"train_loss": -25.720373153686523, "global_step": 329472, "epoch": 3969} {"train_loss": -26.4046630859375, "global_step": 329473, "epoch": 3969} {"train_loss": -26.001718521118164, "global_step": 329474, "epoch": 3969} {"train_loss": -25.596195220947266, "global_step": 329475, "epoch": 3969} {"train_loss": -26.187219619750977, "global_step": 329476, "epoch": 3969} {"train_loss": -26.332141876220703, "global_step": 329477, "epoch": 3969} {"train_loss": -25.907611846923828, "global_step": 329478, "epoch": 3969} {"train_loss": -25.648168563842773, "global_step": 329479, "epoch": 3969} {"train_loss": -25.501708984375, "global_step": 329480, "epoch": 3969} {"train_loss": -25.898971557617188, "global_step": 329481, "epoch": 3969} {"train_loss": -26.142871856689453, "global_step": 329482, "epoch": 3969} {"train_loss": -26.080081939697266, "global_step": 329483, "epoch": 3969} {"train_loss": -26.2526798248291, "global_step": 329484, "epoch": 3969} {"train_loss": -25.742639541625977, "global_step": 329485, "epoch": 3969} {"train_loss": -25.797992706298828, "global_step": 329486, "epoch": 3969} {"train_loss": -25.7528018951416, "global_step": 329487, "epoch": 3969} {"train_loss": -26.109052658081055, "global_step": 329488, "epoch": 3969} {"train_loss": -25.81577491760254, "global_step": 329489, "epoch": 3969} {"train_loss": -26.176776885986328, "global_step": 329490, "epoch": 3969} {"train_loss": -25.944272994995117, "global_step": 329491, "epoch": 3969} {"train_loss": -26.261768341064453, "global_step": 329492, "epoch": 3969} {"train_loss": -26.1005859375, "global_step": 329493, "epoch": 3969} {"train_loss": -26.059741973876953, "global_step": 329494, "epoch": 3969} {"train_loss": -26.11836814880371, "global_step": 329495, "epoch": 3969} {"train_loss": -26.016162872314453, "global_step": 329496, "epoch": 3969} {"train_loss": -25.91302490234375, "global_step": 329497, "epoch": 3969} {"train_loss": -26.248605728149414, "global_step": 329498, "epoch": 3969} {"train_loss": -25.986196517944336, "global_step": 329499, "epoch": 3969} {"train_loss": -26.163251876831055, "global_step": 329500, "epoch": 3969} {"train_loss": -25.74518394470215, "global_step": 329501, "epoch": 3969} {"train_loss": -25.93295669555664, "global_step": 329502, "epoch": 3969} {"train_loss": -26.06906509399414, "global_step": 329503, "epoch": 3969} {"train_loss": -26.129058837890625, "global_step": 329504, "epoch": 3969} {"train_loss": -25.931982040405273, "global_step": 329505, "epoch": 3969} {"train_loss": -25.927398681640625, "global_step": 329506, "epoch": 3969} {"train_loss": -26.100799560546875, "global_step": 329507, "epoch": 3969} {"train_loss": -26.171411514282227, "global_step": 329508, "epoch": 3969} {"train_loss": -25.897117178124116, "global_step": 329509, "epoch": 3969, "val_loss": 7295721.0} {"train_loss": -25.107528686523438, "global_step": 329510, "epoch": 3970} {"train_loss": -23.63045310974121, "global_step": 329511, "epoch": 3970} {"train_loss": -24.99717140197754, "global_step": 329512, "epoch": 3970} {"train_loss": -25.638370513916016, "global_step": 329513, "epoch": 3970} {"train_loss": -25.249481201171875, "global_step": 329514, "epoch": 3970} {"train_loss": -25.50731086730957, "global_step": 329515, "epoch": 3970} {"train_loss": -24.874414443969727, "global_step": 329516, "epoch": 3970} {"train_loss": -25.67408561706543, "global_step": 329517, "epoch": 3970} {"train_loss": -25.37230682373047, "global_step": 329518, "epoch": 3970} {"train_loss": -25.046276092529297, "global_step": 329519, "epoch": 3970} {"train_loss": -25.491544723510742, "global_step": 329520, "epoch": 3970} {"train_loss": -25.726470947265625, "global_step": 329521, "epoch": 3970} {"train_loss": -25.70228385925293, "global_step": 329522, "epoch": 3970} {"train_loss": -25.71723747253418, "global_step": 329523, "epoch": 3970} {"train_loss": -25.4720516204834, "global_step": 329524, "epoch": 3970} {"train_loss": -25.566043853759766, "global_step": 329525, "epoch": 3970} {"train_loss": -25.615161895751953, "global_step": 329526, "epoch": 3970} {"train_loss": -25.59838104248047, "global_step": 329527, "epoch": 3970} {"train_loss": -25.66607666015625, "global_step": 329528, "epoch": 3970} {"train_loss": -25.611541748046875, "global_step": 329529, "epoch": 3970} {"train_loss": -25.972564697265625, "global_step": 329530, "epoch": 3970} {"train_loss": -25.31156349182129, "global_step": 329531, "epoch": 3970} {"train_loss": -26.0434513092041, "global_step": 329532, "epoch": 3970} {"train_loss": -25.479644775390625, "global_step": 329533, "epoch": 3970} {"train_loss": -25.748090744018555, "global_step": 329534, "epoch": 3970} {"train_loss": -25.688444137573242, "global_step": 329535, "epoch": 3970} {"train_loss": -25.838571548461914, "global_step": 329536, "epoch": 3970} {"train_loss": -25.550491333007812, "global_step": 329537, "epoch": 3970} {"train_loss": -26.120624542236328, "global_step": 329538, "epoch": 3970} {"train_loss": -25.91666603088379, "global_step": 329539, "epoch": 3970} {"train_loss": -25.625654220581055, "global_step": 329540, "epoch": 3970} {"train_loss": -26.009021759033203, "global_step": 329541, "epoch": 3970} {"train_loss": -25.8800048828125, "global_step": 329542, "epoch": 3970} {"train_loss": -25.814502716064453, "global_step": 329543, "epoch": 3970} {"train_loss": -25.75592041015625, "global_step": 329544, "epoch": 3970} {"train_loss": -26.11846923828125, "global_step": 329545, "epoch": 3970} {"train_loss": -26.10418128967285, "global_step": 329546, "epoch": 3970} {"train_loss": -25.814899444580078, "global_step": 329547, "epoch": 3970} {"train_loss": -25.84418296813965, "global_step": 329548, "epoch": 3970} {"train_loss": -25.331647872924805, "global_step": 329549, "epoch": 3970} {"train_loss": -25.831876754760742, "global_step": 329550, "epoch": 3970} {"train_loss": -26.122791290283203, "global_step": 329551, "epoch": 3970} {"train_loss": -26.029327392578125, "global_step": 329552, "epoch": 3970} {"train_loss": -25.8098087310791, "global_step": 329553, "epoch": 3970} {"train_loss": -26.161273956298828, "global_step": 329554, "epoch": 3970} {"train_loss": -26.048999786376953, "global_step": 329555, "epoch": 3970} {"train_loss": -26.151081085205078, "global_step": 329556, "epoch": 3970} {"train_loss": -25.882490158081055, "global_step": 329557, "epoch": 3970} {"train_loss": -25.860326766967773, "global_step": 329558, "epoch": 3970} {"train_loss": -26.195144653320312, "global_step": 329559, "epoch": 3970} {"train_loss": -26.19605827331543, "global_step": 329560, "epoch": 3970} {"train_loss": -26.250137329101562, "global_step": 329561, "epoch": 3970} {"train_loss": -26.24957847595215, "global_step": 329562, "epoch": 3970} {"train_loss": -26.06751823425293, "global_step": 329563, "epoch": 3970} {"train_loss": -26.14756202697754, "global_step": 329564, "epoch": 3970} {"train_loss": -26.30340576171875, "global_step": 329565, "epoch": 3970} {"train_loss": -26.057392120361328, "global_step": 329566, "epoch": 3970} {"train_loss": -25.806976318359375, "global_step": 329567, "epoch": 3970} {"train_loss": -26.1885986328125, "global_step": 329568, "epoch": 3970} {"train_loss": -26.04465103149414, "global_step": 329569, "epoch": 3970} {"train_loss": -25.749195098876953, "global_step": 329570, "epoch": 3970} {"train_loss": -26.208593368530273, "global_step": 329571, "epoch": 3970} {"train_loss": -25.95208740234375, "global_step": 329572, "epoch": 3970} {"train_loss": -26.01557731628418, "global_step": 329573, "epoch": 3970} {"train_loss": -26.386091232299805, "global_step": 329574, "epoch": 3970} {"train_loss": -26.246992111206055, "global_step": 329575, "epoch": 3970} {"train_loss": -26.10480308532715, "global_step": 329576, "epoch": 3970} {"train_loss": -26.281208038330078, "global_step": 329577, "epoch": 3970} {"train_loss": -26.183353424072266, "global_step": 329578, "epoch": 3970} {"train_loss": -25.574682235717773, "global_step": 329579, "epoch": 3970} {"train_loss": -25.872848510742188, "global_step": 329580, "epoch": 3970} {"train_loss": -26.065176010131836, "global_step": 329581, "epoch": 3970} {"train_loss": -26.22653579711914, "global_step": 329582, "epoch": 3970} {"train_loss": -26.004907608032227, "global_step": 329583, "epoch": 3970} {"train_loss": -25.533132553100586, "global_step": 329584, "epoch": 3970} {"train_loss": -26.140308380126953, "global_step": 329585, "epoch": 3970} {"train_loss": -25.79676628112793, "global_step": 329586, "epoch": 3970} {"train_loss": -26.1948299407959, "global_step": 329587, "epoch": 3970} {"train_loss": -25.693073272705078, "global_step": 329588, "epoch": 3970} {"train_loss": -25.695301055908203, "global_step": 329589, "epoch": 3970} {"train_loss": -25.863494873046875, "global_step": 329590, "epoch": 3970} {"train_loss": -25.904462814331055, "global_step": 329591, "epoch": 3970} {"train_loss": -25.816696488713642, "global_step": 329592, "epoch": 3970, "val_loss": 7087622.0} {"train_loss": -25.7878475189209, "global_step": 329593, "epoch": 3971} {"train_loss": -25.431598663330078, "global_step": 329594, "epoch": 3971} {"train_loss": -25.762802124023438, "global_step": 329595, "epoch": 3971} {"train_loss": -26.042097091674805, "global_step": 329596, "epoch": 3971} {"train_loss": -25.870803833007812, "global_step": 329597, "epoch": 3971} {"train_loss": -25.602252960205078, "global_step": 329598, "epoch": 3971} {"train_loss": -25.551313400268555, "global_step": 329599, "epoch": 3971} {"train_loss": -25.93930435180664, "global_step": 329600, "epoch": 3971} {"train_loss": -25.8697566986084, "global_step": 329601, "epoch": 3971} {"train_loss": -25.991867065429688, "global_step": 329602, "epoch": 3971} {"train_loss": -25.649682998657227, "global_step": 329603, "epoch": 3971} {"train_loss": -26.13327980041504, "global_step": 329604, "epoch": 3971} {"train_loss": -25.703739166259766, "global_step": 329605, "epoch": 3971} {"train_loss": -25.632863998413086, "global_step": 329606, "epoch": 3971} {"train_loss": -25.565793991088867, "global_step": 329607, "epoch": 3971} {"train_loss": -25.738229751586914, "global_step": 329608, "epoch": 3971} {"train_loss": -25.892475128173828, "global_step": 329609, "epoch": 3971} {"train_loss": -26.109766006469727, "global_step": 329610, "epoch": 3971} {"train_loss": -26.37432861328125, "global_step": 329611, "epoch": 3971} {"train_loss": -26.042510986328125, "global_step": 329612, "epoch": 3971} {"train_loss": -26.19135093688965, "global_step": 329613, "epoch": 3971} {"train_loss": -26.067724227905273, "global_step": 329614, "epoch": 3971} {"train_loss": -26.101343154907227, "global_step": 329615, "epoch": 3971} {"train_loss": -25.855371475219727, "global_step": 329616, "epoch": 3971} {"train_loss": -25.85206413269043, "global_step": 329617, "epoch": 3971} {"train_loss": -25.802539825439453, "global_step": 329618, "epoch": 3971} {"train_loss": -25.820852279663086, "global_step": 329619, "epoch": 3971} {"train_loss": -25.787372589111328, "global_step": 329620, "epoch": 3971} {"train_loss": -26.252222061157227, "global_step": 329621, "epoch": 3971} {"train_loss": -25.359630584716797, "global_step": 329622, "epoch": 3971} {"train_loss": -25.936925888061523, "global_step": 329623, "epoch": 3971} {"train_loss": -26.2413272857666, "global_step": 329624, "epoch": 3971} {"train_loss": -25.461212158203125, "global_step": 329625, "epoch": 3971} {"train_loss": -24.971759796142578, "global_step": 329626, "epoch": 3971} {"train_loss": -25.74932289123535, "global_step": 329627, "epoch": 3971} {"train_loss": -25.94233512878418, "global_step": 329628, "epoch": 3971} {"train_loss": -25.281600952148438, "global_step": 329629, "epoch": 3971} {"train_loss": -25.235000610351562, "global_step": 329630, "epoch": 3971} {"train_loss": -25.832117080688477, "global_step": 329631, "epoch": 3971} {"train_loss": -24.549222946166992, "global_step": 329632, "epoch": 3971} {"train_loss": -25.5860652923584, "global_step": 329633, "epoch": 3971} {"train_loss": -25.61505126953125, "global_step": 329634, "epoch": 3971} {"train_loss": -25.310550689697266, "global_step": 329635, "epoch": 3971} {"train_loss": -25.61553382873535, "global_step": 329636, "epoch": 3971} {"train_loss": -25.837244033813477, "global_step": 329637, "epoch": 3971} {"train_loss": -25.80209732055664, "global_step": 329638, "epoch": 3971} {"train_loss": -25.865310668945312, "global_step": 329639, "epoch": 3971} {"train_loss": -25.64900016784668, "global_step": 329640, "epoch": 3971} {"train_loss": -25.744394302368164, "global_step": 329641, "epoch": 3971} {"train_loss": -25.847166061401367, "global_step": 329642, "epoch": 3971} {"train_loss": -25.72059440612793, "global_step": 329643, "epoch": 3971} {"train_loss": -25.970951080322266, "global_step": 329644, "epoch": 3971} {"train_loss": -26.129358291625977, "global_step": 329645, "epoch": 3971} {"train_loss": -26.027429580688477, "global_step": 329646, "epoch": 3971} {"train_loss": -25.574119567871094, "global_step": 329647, "epoch": 3971} {"train_loss": -25.8869686126709, "global_step": 329648, "epoch": 3971} {"train_loss": -25.9035701751709, "global_step": 329649, "epoch": 3971} {"train_loss": -25.933828353881836, "global_step": 329650, "epoch": 3971} {"train_loss": -26.013410568237305, "global_step": 329651, "epoch": 3971} {"train_loss": -25.770156860351562, "global_step": 329652, "epoch": 3971} {"train_loss": -25.804147720336914, "global_step": 329653, "epoch": 3971} {"train_loss": -26.1044921875, "global_step": 329654, "epoch": 3971} {"train_loss": -25.904706954956055, "global_step": 329655, "epoch": 3971} {"train_loss": -25.946807861328125, "global_step": 329656, "epoch": 3971} {"train_loss": -25.990966796875, "global_step": 329657, "epoch": 3971} {"train_loss": -26.029788970947266, "global_step": 329658, "epoch": 3971} {"train_loss": -25.894062042236328, "global_step": 329659, "epoch": 3971} {"train_loss": -26.24079704284668, "global_step": 329660, "epoch": 3971} {"train_loss": -25.961227416992188, "global_step": 329661, "epoch": 3971} {"train_loss": -25.8468074798584, "global_step": 329662, "epoch": 3971} {"train_loss": -26.113325119018555, "global_step": 329663, "epoch": 3971} {"train_loss": -26.022098541259766, "global_step": 329664, "epoch": 3971} {"train_loss": -25.6888427734375, "global_step": 329665, "epoch": 3971} {"train_loss": -26.2008113861084, "global_step": 329666, "epoch": 3971} {"train_loss": -25.839216232299805, "global_step": 329667, "epoch": 3971} {"train_loss": -25.677824020385742, "global_step": 329668, "epoch": 3971} {"train_loss": -25.688709259033203, "global_step": 329669, "epoch": 3971} {"train_loss": -25.97913932800293, "global_step": 329670, "epoch": 3971} {"train_loss": -25.690784454345703, "global_step": 329671, "epoch": 3971} {"train_loss": -26.146087646484375, "global_step": 329672, "epoch": 3971} {"train_loss": -25.26434326171875, "global_step": 329673, "epoch": 3971} {"train_loss": -25.80861473083496, "global_step": 329674, "epoch": 3971} {"train_loss": -25.798866363893072, "global_step": 329675, "epoch": 3971, "val_loss": 7155985.0} {"train_loss": -25.683521270751953, "global_step": 329676, "epoch": 3972} {"train_loss": -25.016437530517578, "global_step": 329677, "epoch": 3972} {"train_loss": -26.044891357421875, "global_step": 329678, "epoch": 3972} {"train_loss": -25.33441162109375, "global_step": 329679, "epoch": 3972} {"train_loss": -25.423349380493164, "global_step": 329680, "epoch": 3972} {"train_loss": -25.69361686706543, "global_step": 329681, "epoch": 3972} {"train_loss": -25.36786651611328, "global_step": 329682, "epoch": 3972} {"train_loss": -25.560317993164062, "global_step": 329683, "epoch": 3972} {"train_loss": -25.64508056640625, "global_step": 329684, "epoch": 3972} {"train_loss": -25.31293296813965, "global_step": 329685, "epoch": 3972} {"train_loss": -25.577306747436523, "global_step": 329686, "epoch": 3972} {"train_loss": -25.947378158569336, "global_step": 329687, "epoch": 3972} {"train_loss": -25.81263542175293, "global_step": 329688, "epoch": 3972} {"train_loss": -25.574556350708008, "global_step": 329689, "epoch": 3972} {"train_loss": -25.708972930908203, "global_step": 329690, "epoch": 3972} {"train_loss": -25.893896102905273, "global_step": 329691, "epoch": 3972} {"train_loss": -25.731876373291016, "global_step": 329692, "epoch": 3972} {"train_loss": -25.973495483398438, "global_step": 329693, "epoch": 3972} {"train_loss": -25.67600440979004, "global_step": 329694, "epoch": 3972} {"train_loss": -25.319868087768555, "global_step": 329695, "epoch": 3972} {"train_loss": -25.732192993164062, "global_step": 329696, "epoch": 3972} {"train_loss": -25.914220809936523, "global_step": 329697, "epoch": 3972} {"train_loss": -25.571447372436523, "global_step": 329698, "epoch": 3972} {"train_loss": -25.455862045288086, "global_step": 329699, "epoch": 3972} {"train_loss": -25.830066680908203, "global_step": 329700, "epoch": 3972} {"train_loss": -25.45391845703125, "global_step": 329701, "epoch": 3972} {"train_loss": -25.8045711517334, "global_step": 329702, "epoch": 3972} {"train_loss": -25.782440185546875, "global_step": 329703, "epoch": 3972} {"train_loss": -26.11575698852539, "global_step": 329704, "epoch": 3972} {"train_loss": -26.034692764282227, "global_step": 329705, "epoch": 3972} {"train_loss": -25.659284591674805, "global_step": 329706, "epoch": 3972} {"train_loss": -26.344358444213867, "global_step": 329707, "epoch": 3972} {"train_loss": -26.004505157470703, "global_step": 329708, "epoch": 3972} {"train_loss": -25.71634864807129, "global_step": 329709, "epoch": 3972} {"train_loss": -25.758880615234375, "global_step": 329710, "epoch": 3972} {"train_loss": -25.624591827392578, "global_step": 329711, "epoch": 3972} {"train_loss": -26.15070915222168, "global_step": 329712, "epoch": 3972} {"train_loss": -25.80158042907715, "global_step": 329713, "epoch": 3972} {"train_loss": -26.404010772705078, "global_step": 329714, "epoch": 3972} {"train_loss": -26.30217933654785, "global_step": 329715, "epoch": 3972} {"train_loss": -25.950881958007812, "global_step": 329716, "epoch": 3972} {"train_loss": -25.983734130859375, "global_step": 329717, "epoch": 3972} {"train_loss": -25.85298728942871, "global_step": 329718, "epoch": 3972} {"train_loss": -25.479089736938477, "global_step": 329719, "epoch": 3972} {"train_loss": -25.95342445373535, "global_step": 329720, "epoch": 3972} {"train_loss": -26.144407272338867, "global_step": 329721, "epoch": 3972} {"train_loss": -25.774768829345703, "global_step": 329722, "epoch": 3972} {"train_loss": -25.703588485717773, "global_step": 329723, "epoch": 3972} {"train_loss": -26.27811622619629, "global_step": 329724, "epoch": 3972} {"train_loss": -26.03641700744629, "global_step": 329725, "epoch": 3972} {"train_loss": -25.77997398376465, "global_step": 329726, "epoch": 3972} {"train_loss": -26.115400314331055, "global_step": 329727, "epoch": 3972} {"train_loss": -26.26776123046875, "global_step": 329728, "epoch": 3972} {"train_loss": -26.081329345703125, "global_step": 329729, "epoch": 3972} {"train_loss": -25.895721435546875, "global_step": 329730, "epoch": 3972} {"train_loss": -26.31208610534668, "global_step": 329731, "epoch": 3972} {"train_loss": -26.003986358642578, "global_step": 329732, "epoch": 3972} {"train_loss": -25.836145401000977, "global_step": 329733, "epoch": 3972} {"train_loss": -26.067169189453125, "global_step": 329734, "epoch": 3972} {"train_loss": -26.174219131469727, "global_step": 329735, "epoch": 3972} {"train_loss": -26.114500045776367, "global_step": 329736, "epoch": 3972} {"train_loss": -25.758371353149414, "global_step": 329737, "epoch": 3972} {"train_loss": -25.7772159576416, "global_step": 329738, "epoch": 3972} {"train_loss": -25.7473087310791, "global_step": 329739, "epoch": 3972} {"train_loss": -26.0568790435791, "global_step": 329740, "epoch": 3972} {"train_loss": -26.18524169921875, "global_step": 329741, "epoch": 3972} {"train_loss": -26.112592697143555, "global_step": 329742, "epoch": 3972} {"train_loss": -26.004444122314453, "global_step": 329743, "epoch": 3972} {"train_loss": -26.20716667175293, "global_step": 329744, "epoch": 3972} {"train_loss": -25.836181640625, "global_step": 329745, "epoch": 3972} {"train_loss": -26.615549087524414, "global_step": 329746, "epoch": 3972} {"train_loss": -26.25031852722168, "global_step": 329747, "epoch": 3972} {"train_loss": -25.98628044128418, "global_step": 329748, "epoch": 3972} {"train_loss": -26.5943660736084, "global_step": 329749, "epoch": 3972} {"train_loss": -25.792102813720703, "global_step": 329750, "epoch": 3972} {"train_loss": -25.94940757751465, "global_step": 329751, "epoch": 3972} {"train_loss": -25.982879638671875, "global_step": 329752, "epoch": 3972} {"train_loss": -26.10597038269043, "global_step": 329753, "epoch": 3972} {"train_loss": -25.977970123291016, "global_step": 329754, "epoch": 3972} {"train_loss": -25.938983917236328, "global_step": 329755, "epoch": 3972} {"train_loss": -25.651304244995117, "global_step": 329756, "epoch": 3972} {"train_loss": -25.88051414489746, "global_step": 329757, "epoch": 3972} {"train_loss": -25.893303354102446, "global_step": 329758, "epoch": 3972, "val_loss": 7125894.0} {"train_loss": -25.2955322265625, "global_step": 329759, "epoch": 3973} {"train_loss": -25.322092056274414, "global_step": 329760, "epoch": 3973} {"train_loss": -24.817447662353516, "global_step": 329761, "epoch": 3973} {"train_loss": -25.360069274902344, "global_step": 329762, "epoch": 3973} {"train_loss": -25.596845626831055, "global_step": 329763, "epoch": 3973} {"train_loss": -25.69049644470215, "global_step": 329764, "epoch": 3973} {"train_loss": -25.64154624938965, "global_step": 329765, "epoch": 3973} {"train_loss": -25.442310333251953, "global_step": 329766, "epoch": 3973} {"train_loss": -25.483327865600586, "global_step": 329767, "epoch": 3973} {"train_loss": -25.294736862182617, "global_step": 329768, "epoch": 3973} {"train_loss": -25.79865074157715, "global_step": 329769, "epoch": 3973} {"train_loss": -26.02679443359375, "global_step": 329770, "epoch": 3973} {"train_loss": -25.855396270751953, "global_step": 329771, "epoch": 3973} {"train_loss": -25.778656005859375, "global_step": 329772, "epoch": 3973} {"train_loss": -25.469091415405273, "global_step": 329773, "epoch": 3973} {"train_loss": -25.995941162109375, "global_step": 329774, "epoch": 3973} {"train_loss": -25.64979362487793, "global_step": 329775, "epoch": 3973} {"train_loss": -25.732501983642578, "global_step": 329776, "epoch": 3973} {"train_loss": -25.76984977722168, "global_step": 329777, "epoch": 3973} {"train_loss": -25.94577980041504, "global_step": 329778, "epoch": 3973} {"train_loss": -26.12007713317871, "global_step": 329779, "epoch": 3973} {"train_loss": -25.797622680664062, "global_step": 329780, "epoch": 3973} {"train_loss": -26.1503963470459, "global_step": 329781, "epoch": 3973} {"train_loss": -25.904943466186523, "global_step": 329782, "epoch": 3973} {"train_loss": -25.948453903198242, "global_step": 329783, "epoch": 3973} {"train_loss": -26.17703628540039, "global_step": 329784, "epoch": 3973} {"train_loss": -25.860614776611328, "global_step": 329785, "epoch": 3973} {"train_loss": -25.842926025390625, "global_step": 329786, "epoch": 3973} {"train_loss": -25.972396850585938, "global_step": 329787, "epoch": 3973} {"train_loss": -25.448270797729492, "global_step": 329788, "epoch": 3973} {"train_loss": -26.144729614257812, "global_step": 329789, "epoch": 3973} {"train_loss": -25.8320369720459, "global_step": 329790, "epoch": 3973} {"train_loss": -25.785181045532227, "global_step": 329791, "epoch": 3973} {"train_loss": -25.867568969726562, "global_step": 329792, "epoch": 3973} {"train_loss": -26.128515243530273, "global_step": 329793, "epoch": 3973} {"train_loss": -25.96268081665039, "global_step": 329794, "epoch": 3973} {"train_loss": -26.216339111328125, "global_step": 329795, "epoch": 3973} {"train_loss": -26.181182861328125, "global_step": 329796, "epoch": 3973} {"train_loss": -25.80732536315918, "global_step": 329797, "epoch": 3973} {"train_loss": -26.431549072265625, "global_step": 329798, "epoch": 3973} {"train_loss": -25.84881591796875, "global_step": 329799, "epoch": 3973} {"train_loss": -26.2873592376709, "global_step": 329800, "epoch": 3973} {"train_loss": -25.949304580688477, "global_step": 329801, "epoch": 3973} {"train_loss": -25.80409049987793, "global_step": 329802, "epoch": 3973} {"train_loss": -26.124937057495117, "global_step": 329803, "epoch": 3973} {"train_loss": -25.82398796081543, "global_step": 329804, "epoch": 3973} {"train_loss": -26.066349029541016, "global_step": 329805, "epoch": 3973} {"train_loss": -25.85273551940918, "global_step": 329806, "epoch": 3973} {"train_loss": -26.135406494140625, "global_step": 329807, "epoch": 3973} {"train_loss": -26.134145736694336, "global_step": 329808, "epoch": 3973} {"train_loss": -25.749530792236328, "global_step": 329809, "epoch": 3973} {"train_loss": -26.154022216796875, "global_step": 329810, "epoch": 3973} {"train_loss": -26.077411651611328, "global_step": 329811, "epoch": 3973} {"train_loss": -26.144683837890625, "global_step": 329812, "epoch": 3973} {"train_loss": -26.36627769470215, "global_step": 329813, "epoch": 3973} {"train_loss": -25.769861221313477, "global_step": 329814, "epoch": 3973} {"train_loss": -25.87485122680664, "global_step": 329815, "epoch": 3973} {"train_loss": -25.946691513061523, "global_step": 329816, "epoch": 3973} {"train_loss": -26.146780014038086, "global_step": 329817, "epoch": 3973} {"train_loss": -25.83251953125, "global_step": 329818, "epoch": 3973} {"train_loss": -26.274707794189453, "global_step": 329819, "epoch": 3973} {"train_loss": -26.29432487487793, "global_step": 329820, "epoch": 3973} {"train_loss": -25.968017578125, "global_step": 329821, "epoch": 3973} {"train_loss": -25.915882110595703, "global_step": 329822, "epoch": 3973} {"train_loss": -25.501005172729492, "global_step": 329823, "epoch": 3973} {"train_loss": -25.22165870666504, "global_step": 329824, "epoch": 3973} {"train_loss": -25.633657455444336, "global_step": 329825, "epoch": 3973} {"train_loss": -25.774381637573242, "global_step": 329826, "epoch": 3973} {"train_loss": -25.749067306518555, "global_step": 329827, "epoch": 3973} {"train_loss": -25.53375244140625, "global_step": 329828, "epoch": 3973} {"train_loss": -25.37434196472168, "global_step": 329829, "epoch": 3973} {"train_loss": -26.120389938354492, "global_step": 329830, "epoch": 3973} {"train_loss": -25.785120010375977, "global_step": 329831, "epoch": 3973} {"train_loss": -25.4703311920166, "global_step": 329832, "epoch": 3973} {"train_loss": -25.689374923706055, "global_step": 329833, "epoch": 3973} {"train_loss": -26.044973373413086, "global_step": 329834, "epoch": 3973} {"train_loss": -25.929412841796875, "global_step": 329835, "epoch": 3973} {"train_loss": -25.95379638671875, "global_step": 329836, "epoch": 3973} {"train_loss": -25.72053337097168, "global_step": 329837, "epoch": 3973} {"train_loss": -26.03931999206543, "global_step": 329838, "epoch": 3973} {"train_loss": -25.951322555541992, "global_step": 329839, "epoch": 3973} {"train_loss": -25.958890914916992, "global_step": 329840, "epoch": 3973} {"train_loss": -25.855334339371648, "global_step": 329841, "epoch": 3973, "val_loss": 7098868.0} {"train_loss": -25.883962631225586, "global_step": 329842, "epoch": 3974} {"train_loss": -25.84124183654785, "global_step": 329843, "epoch": 3974} {"train_loss": -25.85822868347168, "global_step": 329844, "epoch": 3974} {"train_loss": -25.72321128845215, "global_step": 329845, "epoch": 3974} {"train_loss": -25.724853515625, "global_step": 329846, "epoch": 3974} {"train_loss": -25.45370864868164, "global_step": 329847, "epoch": 3974} {"train_loss": -26.018646240234375, "global_step": 329848, "epoch": 3974} {"train_loss": -25.638898849487305, "global_step": 329849, "epoch": 3974} {"train_loss": -25.504718780517578, "global_step": 329850, "epoch": 3974} {"train_loss": -25.752700805664062, "global_step": 329851, "epoch": 3974} {"train_loss": -25.86028480529785, "global_step": 329852, "epoch": 3974} {"train_loss": -25.6470890045166, "global_step": 329853, "epoch": 3974} {"train_loss": -25.6202392578125, "global_step": 329854, "epoch": 3974} {"train_loss": -26.013031005859375, "global_step": 329855, "epoch": 3974} {"train_loss": -25.885648727416992, "global_step": 329856, "epoch": 3974} {"train_loss": -25.974822998046875, "global_step": 329857, "epoch": 3974} {"train_loss": -26.046710968017578, "global_step": 329858, "epoch": 3974} {"train_loss": -26.001699447631836, "global_step": 329859, "epoch": 3974} {"train_loss": -25.957189559936523, "global_step": 329860, "epoch": 3974} {"train_loss": -26.096927642822266, "global_step": 329861, "epoch": 3974} {"train_loss": -26.061996459960938, "global_step": 329862, "epoch": 3974} {"train_loss": -26.05222511291504, "global_step": 329863, "epoch": 3974} {"train_loss": -25.876697540283203, "global_step": 329864, "epoch": 3974} {"train_loss": -26.05958366394043, "global_step": 329865, "epoch": 3974} {"train_loss": -26.16424560546875, "global_step": 329866, "epoch": 3974} {"train_loss": -25.732481002807617, "global_step": 329867, "epoch": 3974} {"train_loss": -25.773773193359375, "global_step": 329868, "epoch": 3974} {"train_loss": -25.5042724609375, "global_step": 329869, "epoch": 3974} {"train_loss": -26.294233322143555, "global_step": 329870, "epoch": 3974} {"train_loss": -25.682416915893555, "global_step": 329871, "epoch": 3974} {"train_loss": -25.843658447265625, "global_step": 329872, "epoch": 3974} {"train_loss": -26.170988082885742, "global_step": 329873, "epoch": 3974} {"train_loss": -25.765249252319336, "global_step": 329874, "epoch": 3974} {"train_loss": -25.9549617767334, "global_step": 329875, "epoch": 3974} {"train_loss": -25.75847816467285, "global_step": 329876, "epoch": 3974} {"train_loss": -25.99008560180664, "global_step": 329877, "epoch": 3974} {"train_loss": -26.01288414001465, "global_step": 329878, "epoch": 3974} {"train_loss": -26.402271270751953, "global_step": 329879, "epoch": 3974} {"train_loss": -25.697301864624023, "global_step": 329880, "epoch": 3974} {"train_loss": -25.864521026611328, "global_step": 329881, "epoch": 3974} {"train_loss": -25.476560592651367, "global_step": 329882, "epoch": 3974} {"train_loss": -25.94789695739746, "global_step": 329883, "epoch": 3974} {"train_loss": -26.014148712158203, "global_step": 329884, "epoch": 3974} {"train_loss": -26.181781768798828, "global_step": 329885, "epoch": 3974} {"train_loss": -26.28020668029785, "global_step": 329886, "epoch": 3974} {"train_loss": -25.562658309936523, "global_step": 329887, "epoch": 3974} {"train_loss": -26.696002960205078, "global_step": 329888, "epoch": 3974} {"train_loss": -26.033422470092773, "global_step": 329889, "epoch": 3974} {"train_loss": -25.910934448242188, "global_step": 329890, "epoch": 3974} {"train_loss": -25.831350326538086, "global_step": 329891, "epoch": 3974} {"train_loss": -25.977710723876953, "global_step": 329892, "epoch": 3974} {"train_loss": -25.872394561767578, "global_step": 329893, "epoch": 3974} {"train_loss": -26.106582641601562, "global_step": 329894, "epoch": 3974} {"train_loss": -26.119001388549805, "global_step": 329895, "epoch": 3974} {"train_loss": -26.4023494720459, "global_step": 329896, "epoch": 3974} {"train_loss": -26.2268009185791, "global_step": 329897, "epoch": 3974} {"train_loss": -26.103315353393555, "global_step": 329898, "epoch": 3974} {"train_loss": -26.3132266998291, "global_step": 329899, "epoch": 3974} {"train_loss": -25.993881225585938, "global_step": 329900, "epoch": 3974} {"train_loss": -25.761478424072266, "global_step": 329901, "epoch": 3974} {"train_loss": -26.057348251342773, "global_step": 329902, "epoch": 3974} {"train_loss": -26.19296646118164, "global_step": 329903, "epoch": 3974} {"train_loss": -26.0718936920166, "global_step": 329904, "epoch": 3974} {"train_loss": -25.94189453125, "global_step": 329905, "epoch": 3974} {"train_loss": -25.758825302124023, "global_step": 329906, "epoch": 3974} {"train_loss": -25.644697189331055, "global_step": 329907, "epoch": 3974} {"train_loss": -25.768146514892578, "global_step": 329908, "epoch": 3974} {"train_loss": -26.069082260131836, "global_step": 329909, "epoch": 3974} {"train_loss": -26.009878158569336, "global_step": 329910, "epoch": 3974} {"train_loss": -25.877981185913086, "global_step": 329911, "epoch": 3974} {"train_loss": -26.073110580444336, "global_step": 329912, "epoch": 3974} {"train_loss": -25.930194854736328, "global_step": 329913, "epoch": 3974} {"train_loss": -25.8054256439209, "global_step": 329914, "epoch": 3974} {"train_loss": -25.717853546142578, "global_step": 329915, "epoch": 3974} {"train_loss": -26.068603515625, "global_step": 329916, "epoch": 3974} {"train_loss": -25.68889808654785, "global_step": 329917, "epoch": 3974} {"train_loss": -25.926300048828125, "global_step": 329918, "epoch": 3974} {"train_loss": -26.373279571533203, "global_step": 329919, "epoch": 3974} {"train_loss": -25.563621520996094, "global_step": 329920, "epoch": 3974} {"train_loss": -26.1582088470459, "global_step": 329921, "epoch": 3974} {"train_loss": -25.860107421875, "global_step": 329922, "epoch": 3974} {"train_loss": -25.834259033203125, "global_step": 329923, "epoch": 3974} {"train_loss": -25.939476610666297, "global_step": 329924, "epoch": 3974, "val_loss": 7214199.5} {"train_loss": -24.895631790161133, "global_step": 329925, "epoch": 3975} {"train_loss": -25.322553634643555, "global_step": 329926, "epoch": 3975} {"train_loss": -24.97934913635254, "global_step": 329927, "epoch": 3975} {"train_loss": -24.90241813659668, "global_step": 329928, "epoch": 3975} {"train_loss": -25.88763427734375, "global_step": 329929, "epoch": 3975} {"train_loss": -25.19917106628418, "global_step": 329930, "epoch": 3975} {"train_loss": -25.035566329956055, "global_step": 329931, "epoch": 3975} {"train_loss": -26.07350730895996, "global_step": 329932, "epoch": 3975} {"train_loss": -25.264562606811523, "global_step": 329933, "epoch": 3975} {"train_loss": -25.10575294494629, "global_step": 329934, "epoch": 3975} {"train_loss": -25.903614044189453, "global_step": 329935, "epoch": 3975} {"train_loss": -24.98325538635254, "global_step": 329936, "epoch": 3975} {"train_loss": -25.809844970703125, "global_step": 329937, "epoch": 3975} {"train_loss": -25.887985229492188, "global_step": 329938, "epoch": 3975} {"train_loss": -25.2817325592041, "global_step": 329939, "epoch": 3975} {"train_loss": -25.416797637939453, "global_step": 329940, "epoch": 3975} {"train_loss": -25.60587501525879, "global_step": 329941, "epoch": 3975} {"train_loss": -25.84267234802246, "global_step": 329942, "epoch": 3975} {"train_loss": -25.841928482055664, "global_step": 329943, "epoch": 3975} {"train_loss": -26.00884437561035, "global_step": 329944, "epoch": 3975} {"train_loss": -25.249956130981445, "global_step": 329945, "epoch": 3975} {"train_loss": -25.994787216186523, "global_step": 329946, "epoch": 3975} {"train_loss": -25.486408233642578, "global_step": 329947, "epoch": 3975} {"train_loss": -25.744983673095703, "global_step": 329948, "epoch": 3975} {"train_loss": -25.458118438720703, "global_step": 329949, "epoch": 3975} {"train_loss": -26.078290939331055, "global_step": 329950, "epoch": 3975} {"train_loss": -25.614530563354492, "global_step": 329951, "epoch": 3975} {"train_loss": -26.01387596130371, "global_step": 329952, "epoch": 3975} {"train_loss": -26.074573516845703, "global_step": 329953, "epoch": 3975} {"train_loss": -25.642709732055664, "global_step": 329954, "epoch": 3975} {"train_loss": -25.723657608032227, "global_step": 329955, "epoch": 3975} {"train_loss": -25.556657791137695, "global_step": 329956, "epoch": 3975} {"train_loss": -26.102746963500977, "global_step": 329957, "epoch": 3975} {"train_loss": -25.699506759643555, "global_step": 329958, "epoch": 3975} {"train_loss": -25.651952743530273, "global_step": 329959, "epoch": 3975} {"train_loss": -26.508344650268555, "global_step": 329960, "epoch": 3975} {"train_loss": -26.269245147705078, "global_step": 329961, "epoch": 3975} {"train_loss": -25.9737491607666, "global_step": 329962, "epoch": 3975} {"train_loss": -25.840789794921875, "global_step": 329963, "epoch": 3975} {"train_loss": -26.10028076171875, "global_step": 329964, "epoch": 3975} {"train_loss": -26.062353134155273, "global_step": 329965, "epoch": 3975} {"train_loss": -26.028528213500977, "global_step": 329966, "epoch": 3975} {"train_loss": -25.876708984375, "global_step": 329967, "epoch": 3975} {"train_loss": -26.34610366821289, "global_step": 329968, "epoch": 3975} {"train_loss": -26.05634117126465, "global_step": 329969, "epoch": 3975} {"train_loss": -25.925687789916992, "global_step": 329970, "epoch": 3975} {"train_loss": -26.05207633972168, "global_step": 329971, "epoch": 3975} {"train_loss": -25.780115127563477, "global_step": 329972, "epoch": 3975} {"train_loss": -26.038854598999023, "global_step": 329973, "epoch": 3975} {"train_loss": -26.335432052612305, "global_step": 329974, "epoch": 3975} {"train_loss": -26.104690551757812, "global_step": 329975, "epoch": 3975} {"train_loss": -26.34527587890625, "global_step": 329976, "epoch": 3975} {"train_loss": -26.283191680908203, "global_step": 329977, "epoch": 3975} {"train_loss": -26.2828426361084, "global_step": 329978, "epoch": 3975} {"train_loss": -25.89484977722168, "global_step": 329979, "epoch": 3975} {"train_loss": -25.645038604736328, "global_step": 329980, "epoch": 3975} {"train_loss": -25.750900268554688, "global_step": 329981, "epoch": 3975} {"train_loss": -26.207019805908203, "global_step": 329982, "epoch": 3975} {"train_loss": -26.03986930847168, "global_step": 329983, "epoch": 3975} {"train_loss": -25.780073165893555, "global_step": 329984, "epoch": 3975} {"train_loss": -25.990758895874023, "global_step": 329985, "epoch": 3975} {"train_loss": -26.52680015563965, "global_step": 329986, "epoch": 3975} {"train_loss": -25.912750244140625, "global_step": 329987, "epoch": 3975} {"train_loss": -25.922704696655273, "global_step": 329988, "epoch": 3975} {"train_loss": -25.89069938659668, "global_step": 329989, "epoch": 3975} {"train_loss": -25.6529483795166, "global_step": 329990, "epoch": 3975} {"train_loss": -25.877119064331055, "global_step": 329991, "epoch": 3975} {"train_loss": -25.716171264648438, "global_step": 329992, "epoch": 3975} {"train_loss": -25.38337516784668, "global_step": 329993, "epoch": 3975} {"train_loss": -25.9908504486084, "global_step": 329994, "epoch": 3975} {"train_loss": -26.07575035095215, "global_step": 329995, "epoch": 3975} {"train_loss": -25.524295806884766, "global_step": 329996, "epoch": 3975} {"train_loss": -25.91705322265625, "global_step": 329997, "epoch": 3975} {"train_loss": -25.452911376953125, "global_step": 329998, "epoch": 3975} {"train_loss": -25.52973747253418, "global_step": 329999, "epoch": 3975} {"train_loss": -26.21311378479004, "global_step": 330000, "epoch": 3975} {"train_loss": -25.88629150390625, "global_step": 330001, "epoch": 3975} {"train_loss": -25.54361343383789, "global_step": 330002, "epoch": 3975} {"train_loss": -26.041351318359375, "global_step": 330003, "epoch": 3975} {"train_loss": -26.21919822692871, "global_step": 330004, "epoch": 3975} {"train_loss": -25.912866592407227, "global_step": 330005, "epoch": 3975} {"train_loss": -25.794788360595703, "global_step": 330006, "epoch": 3975} {"train_loss": -25.788807237004658, "global_step": 330007, "epoch": 3975, "val_loss": 7108226.0} {"train_loss": -25.231801986694336, "global_step": 330008, "epoch": 3976} {"train_loss": -25.07906150817871, "global_step": 330009, "epoch": 3976} {"train_loss": -25.388059616088867, "global_step": 330010, "epoch": 3976} {"train_loss": -25.221399307250977, "global_step": 330011, "epoch": 3976} {"train_loss": -25.931562423706055, "global_step": 330012, "epoch": 3976} {"train_loss": -25.40458106994629, "global_step": 330013, "epoch": 3976} {"train_loss": -25.8283748626709, "global_step": 330014, "epoch": 3976} {"train_loss": -25.39206886291504, "global_step": 330015, "epoch": 3976} {"train_loss": -25.377613067626953, "global_step": 330016, "epoch": 3976} {"train_loss": -25.6630859375, "global_step": 330017, "epoch": 3976} {"train_loss": -25.7060546875, "global_step": 330018, "epoch": 3976} {"train_loss": -25.76181983947754, "global_step": 330019, "epoch": 3976} {"train_loss": -25.488309860229492, "global_step": 330020, "epoch": 3976} {"train_loss": -25.579761505126953, "global_step": 330021, "epoch": 3976} {"train_loss": -25.814157485961914, "global_step": 330022, "epoch": 3976} {"train_loss": -25.514047622680664, "global_step": 330023, "epoch": 3976} {"train_loss": -25.90520668029785, "global_step": 330024, "epoch": 3976} {"train_loss": -25.95200538635254, "global_step": 330025, "epoch": 3976} {"train_loss": -25.96600341796875, "global_step": 330026, "epoch": 3976} {"train_loss": -26.023832321166992, "global_step": 330027, "epoch": 3976} {"train_loss": -26.205976486206055, "global_step": 330028, "epoch": 3976} {"train_loss": -26.173986434936523, "global_step": 330029, "epoch": 3976} {"train_loss": -26.096155166625977, "global_step": 330030, "epoch": 3976} {"train_loss": -26.094160079956055, "global_step": 330031, "epoch": 3976} {"train_loss": -25.89668083190918, "global_step": 330032, "epoch": 3976} {"train_loss": -26.174869537353516, "global_step": 330033, "epoch": 3976} {"train_loss": -26.443490982055664, "global_step": 330034, "epoch": 3976} {"train_loss": -25.951990127563477, "global_step": 330035, "epoch": 3976} {"train_loss": -26.042993545532227, "global_step": 330036, "epoch": 3976} {"train_loss": -25.877731323242188, "global_step": 330037, "epoch": 3976} {"train_loss": -26.34522819519043, "global_step": 330038, "epoch": 3976} {"train_loss": -25.84077262878418, "global_step": 330039, "epoch": 3976} {"train_loss": -26.133087158203125, "global_step": 330040, "epoch": 3976} {"train_loss": -25.585996627807617, "global_step": 330041, "epoch": 3976} {"train_loss": -25.476444244384766, "global_step": 330042, "epoch": 3976} {"train_loss": -24.891769409179688, "global_step": 330043, "epoch": 3976} {"train_loss": -25.862939834594727, "global_step": 330044, "epoch": 3976} {"train_loss": -26.41351318359375, "global_step": 330045, "epoch": 3976} {"train_loss": -25.697668075561523, "global_step": 330046, "epoch": 3976} {"train_loss": -25.679258346557617, "global_step": 330047, "epoch": 3976} {"train_loss": -26.053831100463867, "global_step": 330048, "epoch": 3976} {"train_loss": -25.855417251586914, "global_step": 330049, "epoch": 3976} {"train_loss": -26.0584716796875, "global_step": 330050, "epoch": 3976} {"train_loss": -25.670385360717773, "global_step": 330051, "epoch": 3976} {"train_loss": -25.851303100585938, "global_step": 330052, "epoch": 3976} {"train_loss": -25.890485763549805, "global_step": 330053, "epoch": 3976} {"train_loss": -25.830307006835938, "global_step": 330054, "epoch": 3976} {"train_loss": -25.754804611206055, "global_step": 330055, "epoch": 3976} {"train_loss": -25.95814323425293, "global_step": 330056, "epoch": 3976} {"train_loss": -25.7824764251709, "global_step": 330057, "epoch": 3976} {"train_loss": -25.996490478515625, "global_step": 330058, "epoch": 3976} {"train_loss": -25.527421951293945, "global_step": 330059, "epoch": 3976} {"train_loss": -25.740385055541992, "global_step": 330060, "epoch": 3976} {"train_loss": -25.52772331237793, "global_step": 330061, "epoch": 3976} {"train_loss": -25.82733726501465, "global_step": 330062, "epoch": 3976} {"train_loss": -26.16387939453125, "global_step": 330063, "epoch": 3976} {"train_loss": -25.518430709838867, "global_step": 330064, "epoch": 3976} {"train_loss": -26.128232955932617, "global_step": 330065, "epoch": 3976} {"train_loss": -25.91826820373535, "global_step": 330066, "epoch": 3976} {"train_loss": -26.107778549194336, "global_step": 330067, "epoch": 3976} {"train_loss": -25.42404556274414, "global_step": 330068, "epoch": 3976} {"train_loss": -24.83336639404297, "global_step": 330069, "epoch": 3976} {"train_loss": -25.3607177734375, "global_step": 330070, "epoch": 3976} {"train_loss": -25.873083114624023, "global_step": 330071, "epoch": 3976} {"train_loss": -25.40671730041504, "global_step": 330072, "epoch": 3976} {"train_loss": -26.005075454711914, "global_step": 330073, "epoch": 3976} {"train_loss": -25.203847885131836, "global_step": 330074, "epoch": 3976} {"train_loss": -25.89021873474121, "global_step": 330075, "epoch": 3976} {"train_loss": -25.944965362548828, "global_step": 330076, "epoch": 3976} {"train_loss": -26.097402572631836, "global_step": 330077, "epoch": 3976} {"train_loss": -25.85748863220215, "global_step": 330078, "epoch": 3976} {"train_loss": -26.006946563720703, "global_step": 330079, "epoch": 3976} {"train_loss": -25.984039306640625, "global_step": 330080, "epoch": 3976} {"train_loss": -26.1640682220459, "global_step": 330081, "epoch": 3976} {"train_loss": -26.135971069335938, "global_step": 330082, "epoch": 3976} {"train_loss": -25.91619873046875, "global_step": 330083, "epoch": 3976} {"train_loss": -25.876794815063477, "global_step": 330084, "epoch": 3976} {"train_loss": -26.196552276611328, "global_step": 330085, "epoch": 3976} {"train_loss": -26.010534286499023, "global_step": 330086, "epoch": 3976} {"train_loss": -26.213552474975586, "global_step": 330087, "epoch": 3976} {"train_loss": -26.012542724609375, "global_step": 330088, "epoch": 3976} {"train_loss": -25.827167510986328, "global_step": 330089, "epoch": 3976} {"train_loss": -25.813733617943452, "global_step": 330090, "epoch": 3976, "val_loss": 7153461.0} {"train_loss": -25.684370040893555, "global_step": 330091, "epoch": 3977} {"train_loss": -25.356952667236328, "global_step": 330092, "epoch": 3977} {"train_loss": -25.063108444213867, "global_step": 330093, "epoch": 3977} {"train_loss": -24.156335830688477, "global_step": 330094, "epoch": 3977} {"train_loss": -24.2044677734375, "global_step": 330095, "epoch": 3977} {"train_loss": -24.99281883239746, "global_step": 330096, "epoch": 3977} {"train_loss": -25.208730697631836, "global_step": 330097, "epoch": 3977} {"train_loss": -24.86978530883789, "global_step": 330098, "epoch": 3977} {"train_loss": -25.308195114135742, "global_step": 330099, "epoch": 3977} {"train_loss": -25.624608993530273, "global_step": 330100, "epoch": 3977} {"train_loss": -25.36591148376465, "global_step": 330101, "epoch": 3977} {"train_loss": -25.266714096069336, "global_step": 330102, "epoch": 3977} {"train_loss": -25.799604415893555, "global_step": 330103, "epoch": 3977} {"train_loss": -25.697702407836914, "global_step": 330104, "epoch": 3977} {"train_loss": -25.43423843383789, "global_step": 330105, "epoch": 3977} {"train_loss": -25.58357048034668, "global_step": 330106, "epoch": 3977} {"train_loss": -25.723852157592773, "global_step": 330107, "epoch": 3977} {"train_loss": -25.574399948120117, "global_step": 330108, "epoch": 3977} {"train_loss": -25.664457321166992, "global_step": 330109, "epoch": 3977} {"train_loss": -25.775747299194336, "global_step": 330110, "epoch": 3977} {"train_loss": -25.543302536010742, "global_step": 330111, "epoch": 3977} {"train_loss": -25.735645294189453, "global_step": 330112, "epoch": 3977} {"train_loss": -25.532758712768555, "global_step": 330113, "epoch": 3977} {"train_loss": -25.90384864807129, "global_step": 330114, "epoch": 3977} {"train_loss": -25.28360939025879, "global_step": 330115, "epoch": 3977} {"train_loss": -25.76885414123535, "global_step": 330116, "epoch": 3977} {"train_loss": -25.872114181518555, "global_step": 330117, "epoch": 3977} {"train_loss": -25.66131019592285, "global_step": 330118, "epoch": 3977} {"train_loss": -25.915151596069336, "global_step": 330119, "epoch": 3977} {"train_loss": -25.834644317626953, "global_step": 330120, "epoch": 3977} {"train_loss": -26.15036964416504, "global_step": 330121, "epoch": 3977} {"train_loss": -25.700693130493164, "global_step": 330122, "epoch": 3977} {"train_loss": -26.12629508972168, "global_step": 330123, "epoch": 3977} {"train_loss": -25.804784774780273, "global_step": 330124, "epoch": 3977} {"train_loss": -25.89960289001465, "global_step": 330125, "epoch": 3977} {"train_loss": -26.06817626953125, "global_step": 330126, "epoch": 3977} {"train_loss": -25.986072540283203, "global_step": 330127, "epoch": 3977} {"train_loss": -26.164936065673828, "global_step": 330128, "epoch": 3977} {"train_loss": -25.992944717407227, "global_step": 330129, "epoch": 3977} {"train_loss": -25.897497177124023, "global_step": 330130, "epoch": 3977} {"train_loss": -25.829572677612305, "global_step": 330131, "epoch": 3977} {"train_loss": -26.010766983032227, "global_step": 330132, "epoch": 3977} {"train_loss": -25.635908126831055, "global_step": 330133, "epoch": 3977} {"train_loss": -25.963708877563477, "global_step": 330134, "epoch": 3977} {"train_loss": -25.87543296813965, "global_step": 330135, "epoch": 3977} {"train_loss": -26.540176391601562, "global_step": 330136, "epoch": 3977} {"train_loss": -25.926483154296875, "global_step": 330137, "epoch": 3977} {"train_loss": -25.889455795288086, "global_step": 330138, "epoch": 3977} {"train_loss": -26.159208297729492, "global_step": 330139, "epoch": 3977} {"train_loss": -26.23682975769043, "global_step": 330140, "epoch": 3977} {"train_loss": -25.654163360595703, "global_step": 330141, "epoch": 3977} {"train_loss": -26.22440528869629, "global_step": 330142, "epoch": 3977} {"train_loss": -25.761510848999023, "global_step": 330143, "epoch": 3977} {"train_loss": -26.34610939025879, "global_step": 330144, "epoch": 3977} {"train_loss": -26.135854721069336, "global_step": 330145, "epoch": 3977} {"train_loss": -26.145313262939453, "global_step": 330146, "epoch": 3977} {"train_loss": -26.277143478393555, "global_step": 330147, "epoch": 3977} {"train_loss": -26.117294311523438, "global_step": 330148, "epoch": 3977} {"train_loss": -26.16750144958496, "global_step": 330149, "epoch": 3977} {"train_loss": -25.968122482299805, "global_step": 330150, "epoch": 3977} {"train_loss": -25.8940372467041, "global_step": 330151, "epoch": 3977} {"train_loss": -25.850067138671875, "global_step": 330152, "epoch": 3977} {"train_loss": -25.83148193359375, "global_step": 330153, "epoch": 3977} {"train_loss": -25.928253173828125, "global_step": 330154, "epoch": 3977} {"train_loss": -26.14637565612793, "global_step": 330155, "epoch": 3977} {"train_loss": -26.034574508666992, "global_step": 330156, "epoch": 3977} {"train_loss": -26.118932723999023, "global_step": 330157, "epoch": 3977} {"train_loss": -26.053144454956055, "global_step": 330158, "epoch": 3977} {"train_loss": -25.345067977905273, "global_step": 330159, "epoch": 3977} {"train_loss": -26.216764450073242, "global_step": 330160, "epoch": 3977} {"train_loss": -25.849424362182617, "global_step": 330161, "epoch": 3977} {"train_loss": -25.537153244018555, "global_step": 330162, "epoch": 3977} {"train_loss": -26.162012100219727, "global_step": 330163, "epoch": 3977} {"train_loss": -26.083242416381836, "global_step": 330164, "epoch": 3977} {"train_loss": -26.11762046813965, "global_step": 330165, "epoch": 3977} {"train_loss": -25.901426315307617, "global_step": 330166, "epoch": 3977} {"train_loss": -26.110456466674805, "global_step": 330167, "epoch": 3977} {"train_loss": -26.342300415039062, "global_step": 330168, "epoch": 3977} {"train_loss": -26.21624183654785, "global_step": 330169, "epoch": 3977} {"train_loss": -26.151411056518555, "global_step": 330170, "epoch": 3977} {"train_loss": -26.3896484375, "global_step": 330171, "epoch": 3977} {"train_loss": -26.04086685180664, "global_step": 330172, "epoch": 3977} {"train_loss": -25.807376562830914, "global_step": 330173, "epoch": 3977, "val_loss": 7171333.5} {"train_loss": -25.295564651489258, "global_step": 330174, "epoch": 3978} {"train_loss": -25.376855850219727, "global_step": 330175, "epoch": 3978} {"train_loss": -25.53069496154785, "global_step": 330176, "epoch": 3978} {"train_loss": -25.66280174255371, "global_step": 330177, "epoch": 3978} {"train_loss": -25.80683708190918, "global_step": 330178, "epoch": 3978} {"train_loss": -25.836706161499023, "global_step": 330179, "epoch": 3978} {"train_loss": -25.549280166625977, "global_step": 330180, "epoch": 3978} {"train_loss": -25.7067928314209, "global_step": 330181, "epoch": 3978} {"train_loss": -26.006078720092773, "global_step": 330182, "epoch": 3978} {"train_loss": -25.419387817382812, "global_step": 330183, "epoch": 3978} {"train_loss": -25.710895538330078, "global_step": 330184, "epoch": 3978} {"train_loss": -25.982648849487305, "global_step": 330185, "epoch": 3978} {"train_loss": -25.931283950805664, "global_step": 330186, "epoch": 3978} {"train_loss": -25.7872371673584, "global_step": 330187, "epoch": 3978} {"train_loss": -25.924957275390625, "global_step": 330188, "epoch": 3978} {"train_loss": -25.846435546875, "global_step": 330189, "epoch": 3978} {"train_loss": -25.68243408203125, "global_step": 330190, "epoch": 3978} {"train_loss": -26.16437339782715, "global_step": 330191, "epoch": 3978} {"train_loss": -26.005170822143555, "global_step": 330192, "epoch": 3978} {"train_loss": -25.964160919189453, "global_step": 330193, "epoch": 3978} {"train_loss": -25.7912654876709, "global_step": 330194, "epoch": 3978} {"train_loss": -25.8624324798584, "global_step": 330195, "epoch": 3978} {"train_loss": -26.1019344329834, "global_step": 330196, "epoch": 3978} {"train_loss": -25.909936904907227, "global_step": 330197, "epoch": 3978} {"train_loss": -25.86155128479004, "global_step": 330198, "epoch": 3978} {"train_loss": -26.005746841430664, "global_step": 330199, "epoch": 3978} {"train_loss": -26.006072998046875, "global_step": 330200, "epoch": 3978} {"train_loss": -26.237234115600586, "global_step": 330201, "epoch": 3978} {"train_loss": -26.11984634399414, "global_step": 330202, "epoch": 3978} {"train_loss": -25.77704429626465, "global_step": 330203, "epoch": 3978} {"train_loss": -26.11944007873535, "global_step": 330204, "epoch": 3978} {"train_loss": -25.89771842956543, "global_step": 330205, "epoch": 3978} {"train_loss": -26.206396102905273, "global_step": 330206, "epoch": 3978} {"train_loss": -25.954496383666992, "global_step": 330207, "epoch": 3978} {"train_loss": -26.024890899658203, "global_step": 330208, "epoch": 3978} {"train_loss": -26.27894401550293, "global_step": 330209, "epoch": 3978} {"train_loss": -26.1361083984375, "global_step": 330210, "epoch": 3978} {"train_loss": -26.1634578704834, "global_step": 330211, "epoch": 3978} {"train_loss": -26.255985260009766, "global_step": 330212, "epoch": 3978} {"train_loss": -26.30000877380371, "global_step": 330213, "epoch": 3978} {"train_loss": -26.135116577148438, "global_step": 330214, "epoch": 3978} {"train_loss": -26.00742530822754, "global_step": 330215, "epoch": 3978} {"train_loss": -26.539905548095703, "global_step": 330216, "epoch": 3978} {"train_loss": -26.24546241760254, "global_step": 330217, "epoch": 3978} {"train_loss": -25.748117446899414, "global_step": 330218, "epoch": 3978} {"train_loss": -26.083988189697266, "global_step": 330219, "epoch": 3978} {"train_loss": -26.096424102783203, "global_step": 330220, "epoch": 3978} {"train_loss": -26.273807525634766, "global_step": 330221, "epoch": 3978} {"train_loss": -25.90854263305664, "global_step": 330222, "epoch": 3978} {"train_loss": -26.509836196899414, "global_step": 330223, "epoch": 3978} {"train_loss": -26.14838218688965, "global_step": 330224, "epoch": 3978} {"train_loss": -25.757001876831055, "global_step": 330225, "epoch": 3978} {"train_loss": -26.287153244018555, "global_step": 330226, "epoch": 3978} {"train_loss": -26.066884994506836, "global_step": 330227, "epoch": 3978} {"train_loss": -25.96416664123535, "global_step": 330228, "epoch": 3978} {"train_loss": -25.985980987548828, "global_step": 330229, "epoch": 3978} {"train_loss": -26.219913482666016, "global_step": 330230, "epoch": 3978} {"train_loss": -25.89731788635254, "global_step": 330231, "epoch": 3978} {"train_loss": -26.234622955322266, "global_step": 330232, "epoch": 3978} {"train_loss": -26.181594848632812, "global_step": 330233, "epoch": 3978} {"train_loss": -25.929473876953125, "global_step": 330234, "epoch": 3978} {"train_loss": -26.441091537475586, "global_step": 330235, "epoch": 3978} {"train_loss": -26.223684310913086, "global_step": 330236, "epoch": 3978} {"train_loss": -26.529783248901367, "global_step": 330237, "epoch": 3978} {"train_loss": -26.12983512878418, "global_step": 330238, "epoch": 3978} {"train_loss": -26.369709014892578, "global_step": 330239, "epoch": 3978} {"train_loss": -26.166141510009766, "global_step": 330240, "epoch": 3978} {"train_loss": -26.1646728515625, "global_step": 330241, "epoch": 3978} {"train_loss": -26.077116012573242, "global_step": 330242, "epoch": 3978} {"train_loss": -26.3774356842041, "global_step": 330243, "epoch": 3978} {"train_loss": -26.24458885192871, "global_step": 330244, "epoch": 3978} {"train_loss": -25.824777603149414, "global_step": 330245, "epoch": 3978} {"train_loss": -25.818246841430664, "global_step": 330246, "epoch": 3978} {"train_loss": -26.077869415283203, "global_step": 330247, "epoch": 3978} {"train_loss": -25.931106567382812, "global_step": 330248, "epoch": 3978} {"train_loss": -25.669050216674805, "global_step": 330249, "epoch": 3978} {"train_loss": -25.128660202026367, "global_step": 330250, "epoch": 3978} {"train_loss": -25.674779891967773, "global_step": 330251, "epoch": 3978} {"train_loss": -25.779932022094727, "global_step": 330252, "epoch": 3978} {"train_loss": -25.810962677001953, "global_step": 330253, "epoch": 3978} {"train_loss": -25.86604881286621, "global_step": 330254, "epoch": 3978} {"train_loss": -25.83888816833496, "global_step": 330255, "epoch": 3978} {"train_loss": -25.95238311032215, "global_step": 330256, "epoch": 3978, "val_loss": 7146596.0} {"train_loss": -24.767229080200195, "global_step": 330257, "epoch": 3979} {"train_loss": -24.74310874938965, "global_step": 330258, "epoch": 3979} {"train_loss": -25.104877471923828, "global_step": 330259, "epoch": 3979} {"train_loss": -24.67963218688965, "global_step": 330260, "epoch": 3979} {"train_loss": -25.26099967956543, "global_step": 330261, "epoch": 3979} {"train_loss": -24.8188419342041, "global_step": 330262, "epoch": 3979} {"train_loss": -25.182363510131836, "global_step": 330263, "epoch": 3979} {"train_loss": -24.608556747436523, "global_step": 330264, "epoch": 3979} {"train_loss": -24.775907516479492, "global_step": 330265, "epoch": 3979} {"train_loss": -25.355493545532227, "global_step": 330266, "epoch": 3979} {"train_loss": -25.179147720336914, "global_step": 330267, "epoch": 3979} {"train_loss": -25.11880874633789, "global_step": 330268, "epoch": 3979} {"train_loss": -25.36195945739746, "global_step": 330269, "epoch": 3979} {"train_loss": -25.242055892944336, "global_step": 330270, "epoch": 3979} {"train_loss": -25.179141998291016, "global_step": 330271, "epoch": 3979} {"train_loss": -25.51728630065918, "global_step": 330272, "epoch": 3979} {"train_loss": -25.422496795654297, "global_step": 330273, "epoch": 3979} {"train_loss": -25.521831512451172, "global_step": 330274, "epoch": 3979} {"train_loss": -25.1547908782959, "global_step": 330275, "epoch": 3979} {"train_loss": -25.424592971801758, "global_step": 330276, "epoch": 3979} {"train_loss": -25.691131591796875, "global_step": 330277, "epoch": 3979} {"train_loss": -25.54500389099121, "global_step": 330278, "epoch": 3979} {"train_loss": -25.808507919311523, "global_step": 330279, "epoch": 3979} {"train_loss": -25.569883346557617, "global_step": 330280, "epoch": 3979} {"train_loss": -25.851362228393555, "global_step": 330281, "epoch": 3979} {"train_loss": -25.859704971313477, "global_step": 330282, "epoch": 3979} {"train_loss": -25.62226676940918, "global_step": 330283, "epoch": 3979} {"train_loss": -25.6690731048584, "global_step": 330284, "epoch": 3979} {"train_loss": -25.675024032592773, "global_step": 330285, "epoch": 3979} {"train_loss": -25.955825805664062, "global_step": 330286, "epoch": 3979} {"train_loss": -25.806921005249023, "global_step": 330287, "epoch": 3979} {"train_loss": -25.91937828063965, "global_step": 330288, "epoch": 3979} {"train_loss": -25.954620361328125, "global_step": 330289, "epoch": 3979} {"train_loss": -25.955322265625, "global_step": 330290, "epoch": 3979} {"train_loss": -25.994861602783203, "global_step": 330291, "epoch": 3979} {"train_loss": -26.323410034179688, "global_step": 330292, "epoch": 3979} {"train_loss": -25.832334518432617, "global_step": 330293, "epoch": 3979} {"train_loss": -25.93069839477539, "global_step": 330294, "epoch": 3979} {"train_loss": -26.215656280517578, "global_step": 330295, "epoch": 3979} {"train_loss": -25.890790939331055, "global_step": 330296, "epoch": 3979} {"train_loss": -26.437162399291992, "global_step": 330297, "epoch": 3979} {"train_loss": -26.2047176361084, "global_step": 330298, "epoch": 3979} {"train_loss": -26.233936309814453, "global_step": 330299, "epoch": 3979} {"train_loss": -26.144433975219727, "global_step": 330300, "epoch": 3979} {"train_loss": -25.810155868530273, "global_step": 330301, "epoch": 3979} {"train_loss": -26.037317276000977, "global_step": 330302, "epoch": 3979} {"train_loss": -26.07459831237793, "global_step": 330303, "epoch": 3979} {"train_loss": -26.107654571533203, "global_step": 330304, "epoch": 3979} {"train_loss": -26.852094650268555, "global_step": 330305, "epoch": 3979} {"train_loss": -26.141510009765625, "global_step": 330306, "epoch": 3979} {"train_loss": -26.066171646118164, "global_step": 330307, "epoch": 3979} {"train_loss": -25.815893173217773, "global_step": 330308, "epoch": 3979} {"train_loss": -26.105375289916992, "global_step": 330309, "epoch": 3979} {"train_loss": -25.828784942626953, "global_step": 330310, "epoch": 3979} {"train_loss": -25.8173770904541, "global_step": 330311, "epoch": 3979} {"train_loss": -26.001422882080078, "global_step": 330312, "epoch": 3979} {"train_loss": -26.150466918945312, "global_step": 330313, "epoch": 3979} {"train_loss": -25.80584716796875, "global_step": 330314, "epoch": 3979} {"train_loss": -26.3558349609375, "global_step": 330315, "epoch": 3979} {"train_loss": -26.284748077392578, "global_step": 330316, "epoch": 3979} {"train_loss": -25.849597930908203, "global_step": 330317, "epoch": 3979} {"train_loss": -26.363513946533203, "global_step": 330318, "epoch": 3979} {"train_loss": -26.0362548828125, "global_step": 330319, "epoch": 3979} {"train_loss": -25.91874122619629, "global_step": 330320, "epoch": 3979} {"train_loss": -26.062976837158203, "global_step": 330321, "epoch": 3979} {"train_loss": -26.0059871673584, "global_step": 330322, "epoch": 3979} {"train_loss": -26.141983032226562, "global_step": 330323, "epoch": 3979} {"train_loss": -26.0805606842041, "global_step": 330324, "epoch": 3979} {"train_loss": -25.724084854125977, "global_step": 330325, "epoch": 3979} {"train_loss": -25.6260929107666, "global_step": 330326, "epoch": 3979} {"train_loss": -25.68427085876465, "global_step": 330327, "epoch": 3979} {"train_loss": -26.070892333984375, "global_step": 330328, "epoch": 3979} {"train_loss": -25.903600692749023, "global_step": 330329, "epoch": 3979} {"train_loss": -26.335981369018555, "global_step": 330330, "epoch": 3979} {"train_loss": -25.822834014892578, "global_step": 330331, "epoch": 3979} {"train_loss": -25.647918701171875, "global_step": 330332, "epoch": 3979} {"train_loss": -26.319599151611328, "global_step": 330333, "epoch": 3979} {"train_loss": -26.09736442565918, "global_step": 330334, "epoch": 3979} {"train_loss": -26.146331787109375, "global_step": 330335, "epoch": 3979} {"train_loss": -26.298343658447266, "global_step": 330336, "epoch": 3979} {"train_loss": -26.234949111938477, "global_step": 330337, "epoch": 3979} {"train_loss": -25.99159049987793, "global_step": 330338, "epoch": 3979} {"train_loss": -25.787797766995716, "global_step": 330339, "epoch": 3979, "val_loss": 7047298.0} {"train_loss": -25.54207420349121, "global_step": 330340, "epoch": 3980} {"train_loss": -25.049753189086914, "global_step": 330341, "epoch": 3980} {"train_loss": -24.662015914916992, "global_step": 330342, "epoch": 3980} {"train_loss": -25.281944274902344, "global_step": 330343, "epoch": 3980} {"train_loss": -25.938512802124023, "global_step": 330344, "epoch": 3980} {"train_loss": -26.025135040283203, "global_step": 330345, "epoch": 3980} {"train_loss": -25.696191787719727, "global_step": 330346, "epoch": 3980} {"train_loss": -25.8658504486084, "global_step": 330347, "epoch": 3980} {"train_loss": -25.603412628173828, "global_step": 330348, "epoch": 3980} {"train_loss": -26.035114288330078, "global_step": 330349, "epoch": 3980} {"train_loss": -25.9231014251709, "global_step": 330350, "epoch": 3980} {"train_loss": -25.909759521484375, "global_step": 330351, "epoch": 3980} {"train_loss": -25.489456176757812, "global_step": 330352, "epoch": 3980} {"train_loss": -25.99077796936035, "global_step": 330353, "epoch": 3980} {"train_loss": -26.149215698242188, "global_step": 330354, "epoch": 3980} {"train_loss": -26.35283851623535, "global_step": 330355, "epoch": 3980} {"train_loss": -26.11543083190918, "global_step": 330356, "epoch": 3980} {"train_loss": -25.900470733642578, "global_step": 330357, "epoch": 3980} {"train_loss": -26.14008903503418, "global_step": 330358, "epoch": 3980} {"train_loss": -26.137622833251953, "global_step": 330359, "epoch": 3980} {"train_loss": -26.067367553710938, "global_step": 330360, "epoch": 3980} {"train_loss": -25.917407989501953, "global_step": 330361, "epoch": 3980} {"train_loss": -25.80647087097168, "global_step": 330362, "epoch": 3980} {"train_loss": -25.873432159423828, "global_step": 330363, "epoch": 3980} {"train_loss": -25.8212947845459, "global_step": 330364, "epoch": 3980} {"train_loss": -26.12139892578125, "global_step": 330365, "epoch": 3980} {"train_loss": -26.117401123046875, "global_step": 330366, "epoch": 3980} {"train_loss": -25.959211349487305, "global_step": 330367, "epoch": 3980} {"train_loss": -26.140878677368164, "global_step": 330368, "epoch": 3980} {"train_loss": -26.090442657470703, "global_step": 330369, "epoch": 3980} {"train_loss": -25.89312744140625, "global_step": 330370, "epoch": 3980} {"train_loss": -26.053205490112305, "global_step": 330371, "epoch": 3980} {"train_loss": -25.900278091430664, "global_step": 330372, "epoch": 3980} {"train_loss": -25.839923858642578, "global_step": 330373, "epoch": 3980} {"train_loss": -25.534563064575195, "global_step": 330374, "epoch": 3980} {"train_loss": -25.767667770385742, "global_step": 330375, "epoch": 3980} {"train_loss": -26.23455810546875, "global_step": 330376, "epoch": 3980} {"train_loss": -25.830686569213867, "global_step": 330377, "epoch": 3980} {"train_loss": -25.52342987060547, "global_step": 330378, "epoch": 3980} {"train_loss": -25.792724609375, "global_step": 330379, "epoch": 3980} {"train_loss": -25.92853355407715, "global_step": 330380, "epoch": 3980} {"train_loss": -25.9145450592041, "global_step": 330381, "epoch": 3980} {"train_loss": -26.035940170288086, "global_step": 330382, "epoch": 3980} {"train_loss": -26.23640251159668, "global_step": 330383, "epoch": 3980} {"train_loss": -26.050098419189453, "global_step": 330384, "epoch": 3980} {"train_loss": -26.016077041625977, "global_step": 330385, "epoch": 3980} {"train_loss": -25.88665199279785, "global_step": 330386, "epoch": 3980} {"train_loss": -26.177350997924805, "global_step": 330387, "epoch": 3980} {"train_loss": -25.731430053710938, "global_step": 330388, "epoch": 3980} {"train_loss": -25.798263549804688, "global_step": 330389, "epoch": 3980} {"train_loss": -26.22865867614746, "global_step": 330390, "epoch": 3980} {"train_loss": -25.900602340698242, "global_step": 330391, "epoch": 3980} {"train_loss": -25.900348663330078, "global_step": 330392, "epoch": 3980} {"train_loss": -26.203161239624023, "global_step": 330393, "epoch": 3980} {"train_loss": -26.206594467163086, "global_step": 330394, "epoch": 3980} {"train_loss": -26.076187133789062, "global_step": 330395, "epoch": 3980} {"train_loss": -26.071674346923828, "global_step": 330396, "epoch": 3980} {"train_loss": -25.98016929626465, "global_step": 330397, "epoch": 3980} {"train_loss": -26.0020751953125, "global_step": 330398, "epoch": 3980} {"train_loss": -25.759069442749023, "global_step": 330399, "epoch": 3980} {"train_loss": -25.5260066986084, "global_step": 330400, "epoch": 3980} {"train_loss": -25.958393096923828, "global_step": 330401, "epoch": 3980} {"train_loss": -26.119150161743164, "global_step": 330402, "epoch": 3980} {"train_loss": -25.73287010192871, "global_step": 330403, "epoch": 3980} {"train_loss": -25.647464752197266, "global_step": 330404, "epoch": 3980} {"train_loss": -26.261754989624023, "global_step": 330405, "epoch": 3980} {"train_loss": -25.982324600219727, "global_step": 330406, "epoch": 3980} {"train_loss": -26.0505428314209, "global_step": 330407, "epoch": 3980} {"train_loss": -25.906442642211914, "global_step": 330408, "epoch": 3980} {"train_loss": -25.9100284576416, "global_step": 330409, "epoch": 3980} {"train_loss": -25.849546432495117, "global_step": 330410, "epoch": 3980} {"train_loss": -26.39214515686035, "global_step": 330411, "epoch": 3980} {"train_loss": -25.662189483642578, "global_step": 330412, "epoch": 3980} {"train_loss": -25.832983016967773, "global_step": 330413, "epoch": 3980} {"train_loss": -25.862049102783203, "global_step": 330414, "epoch": 3980} {"train_loss": -25.440027236938477, "global_step": 330415, "epoch": 3980} {"train_loss": -25.067960739135742, "global_step": 330416, "epoch": 3980} {"train_loss": -25.27335548400879, "global_step": 330417, "epoch": 3980} {"train_loss": -26.117040634155273, "global_step": 330418, "epoch": 3980} {"train_loss": -25.93012046813965, "global_step": 330419, "epoch": 3980} {"train_loss": -25.712005615234375, "global_step": 330420, "epoch": 3980} {"train_loss": -26.037128448486328, "global_step": 330421, "epoch": 3980} {"train_loss": -25.891315253384143, "global_step": 330422, "epoch": 3980, "val_loss": 7113964.5} {"train_loss": -25.770227432250977, "global_step": 330423, "epoch": 3981} {"train_loss": -25.449438095092773, "global_step": 330424, "epoch": 3981} {"train_loss": -25.62896728515625, "global_step": 330425, "epoch": 3981} {"train_loss": -25.103851318359375, "global_step": 330426, "epoch": 3981} {"train_loss": -25.59047508239746, "global_step": 330427, "epoch": 3981} {"train_loss": -25.380847930908203, "global_step": 330428, "epoch": 3981} {"train_loss": -25.64325523376465, "global_step": 330429, "epoch": 3981} {"train_loss": -25.1997013092041, "global_step": 330430, "epoch": 3981} {"train_loss": -25.58798599243164, "global_step": 330431, "epoch": 3981} {"train_loss": -25.19063949584961, "global_step": 330432, "epoch": 3981} {"train_loss": -25.62656593322754, "global_step": 330433, "epoch": 3981} {"train_loss": -25.643884658813477, "global_step": 330434, "epoch": 3981} {"train_loss": -25.8626766204834, "global_step": 330435, "epoch": 3981} {"train_loss": -25.731952667236328, "global_step": 330436, "epoch": 3981} {"train_loss": -26.39027214050293, "global_step": 330437, "epoch": 3981} {"train_loss": -25.874670028686523, "global_step": 330438, "epoch": 3981} {"train_loss": -25.558713912963867, "global_step": 330439, "epoch": 3981} {"train_loss": -25.61106300354004, "global_step": 330440, "epoch": 3981} {"train_loss": -25.8380069732666, "global_step": 330441, "epoch": 3981} {"train_loss": -25.559833526611328, "global_step": 330442, "epoch": 3981} {"train_loss": -25.9664306640625, "global_step": 330443, "epoch": 3981} {"train_loss": -25.709793090820312, "global_step": 330444, "epoch": 3981} {"train_loss": -25.71809959411621, "global_step": 330445, "epoch": 3981} {"train_loss": -25.774499893188477, "global_step": 330446, "epoch": 3981} {"train_loss": -26.129438400268555, "global_step": 330447, "epoch": 3981} {"train_loss": -26.011335372924805, "global_step": 330448, "epoch": 3981} {"train_loss": -25.800251007080078, "global_step": 330449, "epoch": 3981} {"train_loss": -25.574878692626953, "global_step": 330450, "epoch": 3981} {"train_loss": -25.916868209838867, "global_step": 330451, "epoch": 3981} {"train_loss": -25.919397354125977, "global_step": 330452, "epoch": 3981} {"train_loss": -25.623456954956055, "global_step": 330453, "epoch": 3981} {"train_loss": -25.849145889282227, "global_step": 330454, "epoch": 3981} {"train_loss": -26.15144157409668, "global_step": 330455, "epoch": 3981} {"train_loss": -26.278852462768555, "global_step": 330456, "epoch": 3981} {"train_loss": -25.959671020507812, "global_step": 330457, "epoch": 3981} {"train_loss": -25.821863174438477, "global_step": 330458, "epoch": 3981} {"train_loss": -26.087392807006836, "global_step": 330459, "epoch": 3981} {"train_loss": -26.04302978515625, "global_step": 330460, "epoch": 3981} {"train_loss": -25.66834831237793, "global_step": 330461, "epoch": 3981} {"train_loss": -25.955915451049805, "global_step": 330462, "epoch": 3981} {"train_loss": -25.83172607421875, "global_step": 330463, "epoch": 3981} {"train_loss": -26.116580963134766, "global_step": 330464, "epoch": 3981} {"train_loss": -26.18903923034668, "global_step": 330465, "epoch": 3981} {"train_loss": -25.94854164123535, "global_step": 330466, "epoch": 3981} {"train_loss": -26.0813045501709, "global_step": 330467, "epoch": 3981} {"train_loss": -26.23915672302246, "global_step": 330468, "epoch": 3981} {"train_loss": -26.00942039489746, "global_step": 330469, "epoch": 3981} {"train_loss": -26.59962272644043, "global_step": 330470, "epoch": 3981} {"train_loss": -26.09451675415039, "global_step": 330471, "epoch": 3981} {"train_loss": -25.610700607299805, "global_step": 330472, "epoch": 3981} {"train_loss": -25.644399642944336, "global_step": 330473, "epoch": 3981} {"train_loss": -25.232160568237305, "global_step": 330474, "epoch": 3981} {"train_loss": -25.708423614501953, "global_step": 330475, "epoch": 3981} {"train_loss": -25.841358184814453, "global_step": 330476, "epoch": 3981} {"train_loss": -25.313474655151367, "global_step": 330477, "epoch": 3981} {"train_loss": -25.7169246673584, "global_step": 330478, "epoch": 3981} {"train_loss": -25.64234733581543, "global_step": 330479, "epoch": 3981} {"train_loss": -25.84126091003418, "global_step": 330480, "epoch": 3981} {"train_loss": -25.976886749267578, "global_step": 330481, "epoch": 3981} {"train_loss": -25.61859703063965, "global_step": 330482, "epoch": 3981} {"train_loss": -25.85235595703125, "global_step": 330483, "epoch": 3981} {"train_loss": -25.920337677001953, "global_step": 330484, "epoch": 3981} {"train_loss": -26.160924911499023, "global_step": 330485, "epoch": 3981} {"train_loss": -26.113269805908203, "global_step": 330486, "epoch": 3981} {"train_loss": -25.721776962280273, "global_step": 330487, "epoch": 3981} {"train_loss": -25.1639347076416, "global_step": 330488, "epoch": 3981} {"train_loss": -26.278507232666016, "global_step": 330489, "epoch": 3981} {"train_loss": -25.30521011352539, "global_step": 330490, "epoch": 3981} {"train_loss": -25.36530113220215, "global_step": 330491, "epoch": 3981} {"train_loss": -25.3560791015625, "global_step": 330492, "epoch": 3981} {"train_loss": -25.471288681030273, "global_step": 330493, "epoch": 3981} {"train_loss": -25.871374130249023, "global_step": 330494, "epoch": 3981} {"train_loss": -25.350271224975586, "global_step": 330495, "epoch": 3981} {"train_loss": -25.437131881713867, "global_step": 330496, "epoch": 3981} {"train_loss": -25.916173934936523, "global_step": 330497, "epoch": 3981} {"train_loss": -25.966739654541016, "global_step": 330498, "epoch": 3981} {"train_loss": -25.969009399414062, "global_step": 330499, "epoch": 3981} {"train_loss": -25.599895477294922, "global_step": 330500, "epoch": 3981} {"train_loss": -26.06658935546875, "global_step": 330501, "epoch": 3981} {"train_loss": -25.91004753112793, "global_step": 330502, "epoch": 3981} {"train_loss": -26.34259033203125, "global_step": 330503, "epoch": 3981} {"train_loss": -25.854806900024414, "global_step": 330504, "epoch": 3981} {"train_loss": -25.771289618618518, "global_step": 330505, "epoch": 3981, "val_loss": 7203327.0} {"train_loss": -25.38416862487793, "global_step": 330506, "epoch": 3982} {"train_loss": -25.633563995361328, "global_step": 330507, "epoch": 3982} {"train_loss": -25.57736587524414, "global_step": 330508, "epoch": 3982} {"train_loss": -25.922815322875977, "global_step": 330509, "epoch": 3982} {"train_loss": -25.54310417175293, "global_step": 330510, "epoch": 3982} {"train_loss": -25.77521324157715, "global_step": 330511, "epoch": 3982} {"train_loss": -25.68708610534668, "global_step": 330512, "epoch": 3982} {"train_loss": -25.52589988708496, "global_step": 330513, "epoch": 3982} {"train_loss": -25.70550537109375, "global_step": 330514, "epoch": 3982} {"train_loss": -25.638702392578125, "global_step": 330515, "epoch": 3982} {"train_loss": -25.83292579650879, "global_step": 330516, "epoch": 3982} {"train_loss": -25.802719116210938, "global_step": 330517, "epoch": 3982} {"train_loss": -25.546297073364258, "global_step": 330518, "epoch": 3982} {"train_loss": -25.630584716796875, "global_step": 330519, "epoch": 3982} {"train_loss": -25.582256317138672, "global_step": 330520, "epoch": 3982} {"train_loss": -25.65852165222168, "global_step": 330521, "epoch": 3982} {"train_loss": -25.967742919921875, "global_step": 330522, "epoch": 3982} {"train_loss": -25.601898193359375, "global_step": 330523, "epoch": 3982} {"train_loss": -25.747943878173828, "global_step": 330524, "epoch": 3982} {"train_loss": -25.959836959838867, "global_step": 330525, "epoch": 3982} {"train_loss": -25.61097526550293, "global_step": 330526, "epoch": 3982} {"train_loss": -26.0673828125, "global_step": 330527, "epoch": 3982} {"train_loss": -25.64375877380371, "global_step": 330528, "epoch": 3982} {"train_loss": -26.12984275817871, "global_step": 330529, "epoch": 3982} {"train_loss": -26.100650787353516, "global_step": 330530, "epoch": 3982} {"train_loss": -26.0539493560791, "global_step": 330531, "epoch": 3982} {"train_loss": -26.192432403564453, "global_step": 330532, "epoch": 3982} {"train_loss": -26.110919952392578, "global_step": 330533, "epoch": 3982} {"train_loss": -26.0057315826416, "global_step": 330534, "epoch": 3982} {"train_loss": -25.805830001831055, "global_step": 330535, "epoch": 3982} {"train_loss": -25.956247329711914, "global_step": 330536, "epoch": 3982} {"train_loss": -25.787445068359375, "global_step": 330537, "epoch": 3982} {"train_loss": -26.17461585998535, "global_step": 330538, "epoch": 3982} {"train_loss": -25.62284278869629, "global_step": 330539, "epoch": 3982} {"train_loss": -25.799341201782227, "global_step": 330540, "epoch": 3982} {"train_loss": -26.1212158203125, "global_step": 330541, "epoch": 3982} {"train_loss": -25.809040069580078, "global_step": 330542, "epoch": 3982} {"train_loss": -25.944406509399414, "global_step": 330543, "epoch": 3982} {"train_loss": -26.24515151977539, "global_step": 330544, "epoch": 3982} {"train_loss": -26.088186264038086, "global_step": 330545, "epoch": 3982} {"train_loss": -26.125097274780273, "global_step": 330546, "epoch": 3982} {"train_loss": -26.011001586914062, "global_step": 330547, "epoch": 3982} {"train_loss": -26.529041290283203, "global_step": 330548, "epoch": 3982} {"train_loss": -26.113525390625, "global_step": 330549, "epoch": 3982} {"train_loss": -26.0047607421875, "global_step": 330550, "epoch": 3982} {"train_loss": -26.328474044799805, "global_step": 330551, "epoch": 3982} {"train_loss": -25.977497100830078, "global_step": 330552, "epoch": 3982} {"train_loss": -25.91741371154785, "global_step": 330553, "epoch": 3982} {"train_loss": -26.1781005859375, "global_step": 330554, "epoch": 3982} {"train_loss": -26.378522872924805, "global_step": 330555, "epoch": 3982} {"train_loss": -26.081937789916992, "global_step": 330556, "epoch": 3982} {"train_loss": -25.665430068969727, "global_step": 330557, "epoch": 3982} {"train_loss": -26.054052352905273, "global_step": 330558, "epoch": 3982} {"train_loss": -26.35944938659668, "global_step": 330559, "epoch": 3982} {"train_loss": -26.049468994140625, "global_step": 330560, "epoch": 3982} {"train_loss": -26.049345016479492, "global_step": 330561, "epoch": 3982} {"train_loss": -26.072818756103516, "global_step": 330562, "epoch": 3982} {"train_loss": -26.059009552001953, "global_step": 330563, "epoch": 3982} {"train_loss": -26.030935287475586, "global_step": 330564, "epoch": 3982} {"train_loss": -26.275861740112305, "global_step": 330565, "epoch": 3982} {"train_loss": -26.435943603515625, "global_step": 330566, "epoch": 3982} {"train_loss": -26.093017578125, "global_step": 330567, "epoch": 3982} {"train_loss": -26.34137535095215, "global_step": 330568, "epoch": 3982} {"train_loss": -26.25612449645996, "global_step": 330569, "epoch": 3982} {"train_loss": -26.015127182006836, "global_step": 330570, "epoch": 3982} {"train_loss": -25.729511260986328, "global_step": 330571, "epoch": 3982} {"train_loss": -26.29109001159668, "global_step": 330572, "epoch": 3982} {"train_loss": -26.335126876831055, "global_step": 330573, "epoch": 3982} {"train_loss": -26.260114669799805, "global_step": 330574, "epoch": 3982} {"train_loss": -25.885623931884766, "global_step": 330575, "epoch": 3982} {"train_loss": -24.936723709106445, "global_step": 330576, "epoch": 3982} {"train_loss": -25.233076095581055, "global_step": 330577, "epoch": 3982} {"train_loss": -24.70740509033203, "global_step": 330578, "epoch": 3982} {"train_loss": -23.42270278930664, "global_step": 330579, "epoch": 3982} {"train_loss": -24.98341178894043, "global_step": 330580, "epoch": 3982} {"train_loss": -25.186851501464844, "global_step": 330581, "epoch": 3982} {"train_loss": -24.75851821899414, "global_step": 330582, "epoch": 3982} {"train_loss": -25.046056747436523, "global_step": 330583, "epoch": 3982} {"train_loss": -24.967517852783203, "global_step": 330584, "epoch": 3982} {"train_loss": -25.082242965698242, "global_step": 330585, "epoch": 3982} {"train_loss": -25.553707122802734, "global_step": 330586, "epoch": 3982} {"train_loss": -24.9207763671875, "global_step": 330587, "epoch": 3982} {"train_loss": -25.79251507678664, "global_step": 330588, "epoch": 3982, "val_loss": 7292680.5} {"train_loss": -25.179059982299805, "global_step": 330589, "epoch": 3983} {"train_loss": -24.73593521118164, "global_step": 330590, "epoch": 3983} {"train_loss": -24.855369567871094, "global_step": 330591, "epoch": 3983} {"train_loss": -25.116809844970703, "global_step": 330592, "epoch": 3983} {"train_loss": -25.10822868347168, "global_step": 330593, "epoch": 3983} {"train_loss": -25.017776489257812, "global_step": 330594, "epoch": 3983} {"train_loss": -25.25104331970215, "global_step": 330595, "epoch": 3983} {"train_loss": -24.681272506713867, "global_step": 330596, "epoch": 3983} {"train_loss": -24.961288452148438, "global_step": 330597, "epoch": 3983} {"train_loss": -25.109485626220703, "global_step": 330598, "epoch": 3983} {"train_loss": -25.363487243652344, "global_step": 330599, "epoch": 3983} {"train_loss": -25.333528518676758, "global_step": 330600, "epoch": 3983} {"train_loss": -25.42941665649414, "global_step": 330601, "epoch": 3983} {"train_loss": -25.505268096923828, "global_step": 330602, "epoch": 3983} {"train_loss": -25.419998168945312, "global_step": 330603, "epoch": 3983} {"train_loss": -25.522192001342773, "global_step": 330604, "epoch": 3983} {"train_loss": -25.569244384765625, "global_step": 330605, "epoch": 3983} {"train_loss": -25.499113082885742, "global_step": 330606, "epoch": 3983} {"train_loss": -25.27020263671875, "global_step": 330607, "epoch": 3983} {"train_loss": -25.401874542236328, "global_step": 330608, "epoch": 3983} {"train_loss": -25.82758140563965, "global_step": 330609, "epoch": 3983} {"train_loss": -25.585256576538086, "global_step": 330610, "epoch": 3983} {"train_loss": -25.709012985229492, "global_step": 330611, "epoch": 3983} {"train_loss": -25.688627243041992, "global_step": 330612, "epoch": 3983} {"train_loss": -26.127429962158203, "global_step": 330613, "epoch": 3983} {"train_loss": -25.612869262695312, "global_step": 330614, "epoch": 3983} {"train_loss": -25.63477897644043, "global_step": 330615, "epoch": 3983} {"train_loss": -25.783788681030273, "global_step": 330616, "epoch": 3983} {"train_loss": -25.9685001373291, "global_step": 330617, "epoch": 3983} {"train_loss": -25.807880401611328, "global_step": 330618, "epoch": 3983} {"train_loss": -26.18170738220215, "global_step": 330619, "epoch": 3983} {"train_loss": -25.967792510986328, "global_step": 330620, "epoch": 3983} {"train_loss": -25.923858642578125, "global_step": 330621, "epoch": 3983} {"train_loss": -25.606054306030273, "global_step": 330622, "epoch": 3983} {"train_loss": -26.21463966369629, "global_step": 330623, "epoch": 3983} {"train_loss": -25.949670791625977, "global_step": 330624, "epoch": 3983} {"train_loss": -26.0372257232666, "global_step": 330625, "epoch": 3983} {"train_loss": -26.212732315063477, "global_step": 330626, "epoch": 3983} {"train_loss": -26.05219078063965, "global_step": 330627, "epoch": 3983} {"train_loss": -26.22014808654785, "global_step": 330628, "epoch": 3983} {"train_loss": -25.951919555664062, "global_step": 330629, "epoch": 3983} {"train_loss": -26.016706466674805, "global_step": 330630, "epoch": 3983} {"train_loss": -26.058246612548828, "global_step": 330631, "epoch": 3983} {"train_loss": -25.727252960205078, "global_step": 330632, "epoch": 3983} {"train_loss": -26.2584285736084, "global_step": 330633, "epoch": 3983} {"train_loss": -26.214771270751953, "global_step": 330634, "epoch": 3983} {"train_loss": -26.101806640625, "global_step": 330635, "epoch": 3983} {"train_loss": -25.744428634643555, "global_step": 330636, "epoch": 3983} {"train_loss": -25.867542266845703, "global_step": 330637, "epoch": 3983} {"train_loss": -25.940683364868164, "global_step": 330638, "epoch": 3983} {"train_loss": -26.192697525024414, "global_step": 330639, "epoch": 3983} {"train_loss": -25.727880477905273, "global_step": 330640, "epoch": 3983} {"train_loss": -26.178380966186523, "global_step": 330641, "epoch": 3983} {"train_loss": -26.06776237487793, "global_step": 330642, "epoch": 3983} {"train_loss": -25.6890869140625, "global_step": 330643, "epoch": 3983} {"train_loss": -26.231908798217773, "global_step": 330644, "epoch": 3983} {"train_loss": -26.08049964904785, "global_step": 330645, "epoch": 3983} {"train_loss": -25.72305679321289, "global_step": 330646, "epoch": 3983} {"train_loss": -26.011615753173828, "global_step": 330647, "epoch": 3983} {"train_loss": -25.85104751586914, "global_step": 330648, "epoch": 3983} {"train_loss": -26.329681396484375, "global_step": 330649, "epoch": 3983} {"train_loss": -25.773550033569336, "global_step": 330650, "epoch": 3983} {"train_loss": -26.11337661743164, "global_step": 330651, "epoch": 3983} {"train_loss": -25.797163009643555, "global_step": 330652, "epoch": 3983} {"train_loss": -25.913990020751953, "global_step": 330653, "epoch": 3983} {"train_loss": -25.91106605529785, "global_step": 330654, "epoch": 3983} {"train_loss": -26.140975952148438, "global_step": 330655, "epoch": 3983} {"train_loss": -25.953699111938477, "global_step": 330656, "epoch": 3983} {"train_loss": -26.284637451171875, "global_step": 330657, "epoch": 3983} {"train_loss": -26.038232803344727, "global_step": 330658, "epoch": 3983} {"train_loss": -26.165454864501953, "global_step": 330659, "epoch": 3983} {"train_loss": -26.1647891998291, "global_step": 330660, "epoch": 3983} {"train_loss": -25.854278564453125, "global_step": 330661, "epoch": 3983} {"train_loss": -26.184507369995117, "global_step": 330662, "epoch": 3983} {"train_loss": -26.145856857299805, "global_step": 330663, "epoch": 3983} {"train_loss": -26.260095596313477, "global_step": 330664, "epoch": 3983} {"train_loss": -25.9160213470459, "global_step": 330665, "epoch": 3983} {"train_loss": -25.83308219909668, "global_step": 330666, "epoch": 3983} {"train_loss": -25.8985652923584, "global_step": 330667, "epoch": 3983} {"train_loss": -26.140100479125977, "global_step": 330668, "epoch": 3983} {"train_loss": -25.7655029296875, "global_step": 330669, "epoch": 3983} {"train_loss": -25.931610107421875, "global_step": 330670, "epoch": 3983} {"train_loss": -25.784963722688605, "global_step": 330671, "epoch": 3983, "val_loss": 7225946.5} {"train_loss": -25.200220108032227, "global_step": 330672, "epoch": 3984} {"train_loss": -25.005826950073242, "global_step": 330673, "epoch": 3984} {"train_loss": -25.631250381469727, "global_step": 330674, "epoch": 3984} {"train_loss": -24.71822738647461, "global_step": 330675, "epoch": 3984} {"train_loss": -24.519372940063477, "global_step": 330676, "epoch": 3984} {"train_loss": -24.971355438232422, "global_step": 330677, "epoch": 3984} {"train_loss": -25.57794189453125, "global_step": 330678, "epoch": 3984} {"train_loss": -25.777429580688477, "global_step": 330679, "epoch": 3984} {"train_loss": -25.162002563476562, "global_step": 330680, "epoch": 3984} {"train_loss": -25.540128707885742, "global_step": 330681, "epoch": 3984} {"train_loss": -25.28724479675293, "global_step": 330682, "epoch": 3984} {"train_loss": -25.667566299438477, "global_step": 330683, "epoch": 3984} {"train_loss": -25.356958389282227, "global_step": 330684, "epoch": 3984} {"train_loss": -24.904672622680664, "global_step": 330685, "epoch": 3984} {"train_loss": -26.000110626220703, "global_step": 330686, "epoch": 3984} {"train_loss": -25.382919311523438, "global_step": 330687, "epoch": 3984} {"train_loss": -25.609821319580078, "global_step": 330688, "epoch": 3984} {"train_loss": -25.6346492767334, "global_step": 330689, "epoch": 3984} {"train_loss": -25.091379165649414, "global_step": 330690, "epoch": 3984} {"train_loss": -25.65157127380371, "global_step": 330691, "epoch": 3984} {"train_loss": -25.642215728759766, "global_step": 330692, "epoch": 3984} {"train_loss": -25.561574935913086, "global_step": 330693, "epoch": 3984} {"train_loss": -25.692426681518555, "global_step": 330694, "epoch": 3984} {"train_loss": -25.523279190063477, "global_step": 330695, "epoch": 3984} {"train_loss": -25.752363204956055, "global_step": 330696, "epoch": 3984} {"train_loss": -25.558502197265625, "global_step": 330697, "epoch": 3984} {"train_loss": -25.873493194580078, "global_step": 330698, "epoch": 3984} {"train_loss": -25.829492568969727, "global_step": 330699, "epoch": 3984} {"train_loss": -25.8819522857666, "global_step": 330700, "epoch": 3984} {"train_loss": -25.693464279174805, "global_step": 330701, "epoch": 3984} {"train_loss": -26.10003662109375, "global_step": 330702, "epoch": 3984} {"train_loss": -25.879316329956055, "global_step": 330703, "epoch": 3984} {"train_loss": -25.830785751342773, "global_step": 330704, "epoch": 3984} {"train_loss": -25.928503036499023, "global_step": 330705, "epoch": 3984} {"train_loss": -25.741046905517578, "global_step": 330706, "epoch": 3984} {"train_loss": -25.768701553344727, "global_step": 330707, "epoch": 3984} {"train_loss": -26.160070419311523, "global_step": 330708, "epoch": 3984} {"train_loss": -25.815176010131836, "global_step": 330709, "epoch": 3984} {"train_loss": -26.20453453063965, "global_step": 330710, "epoch": 3984} {"train_loss": -25.742050170898438, "global_step": 330711, "epoch": 3984} {"train_loss": -26.097747802734375, "global_step": 330712, "epoch": 3984} {"train_loss": -25.943557739257812, "global_step": 330713, "epoch": 3984} {"train_loss": -26.084726333618164, "global_step": 330714, "epoch": 3984} {"train_loss": -25.700214385986328, "global_step": 330715, "epoch": 3984} {"train_loss": -26.170394897460938, "global_step": 330716, "epoch": 3984} {"train_loss": -25.587257385253906, "global_step": 330717, "epoch": 3984} {"train_loss": -26.0484561920166, "global_step": 330718, "epoch": 3984} {"train_loss": -26.008508682250977, "global_step": 330719, "epoch": 3984} {"train_loss": -26.1427001953125, "global_step": 330720, "epoch": 3984} {"train_loss": -25.933820724487305, "global_step": 330721, "epoch": 3984} {"train_loss": -25.942428588867188, "global_step": 330722, "epoch": 3984} {"train_loss": -25.820653915405273, "global_step": 330723, "epoch": 3984} {"train_loss": -26.106054306030273, "global_step": 330724, "epoch": 3984} {"train_loss": -26.155323028564453, "global_step": 330725, "epoch": 3984} {"train_loss": -26.078413009643555, "global_step": 330726, "epoch": 3984} {"train_loss": -26.304471969604492, "global_step": 330727, "epoch": 3984} {"train_loss": -25.976587295532227, "global_step": 330728, "epoch": 3984} {"train_loss": -26.511371612548828, "global_step": 330729, "epoch": 3984} {"train_loss": -26.236841201782227, "global_step": 330730, "epoch": 3984} {"train_loss": -26.241214752197266, "global_step": 330731, "epoch": 3984} {"train_loss": -25.880542755126953, "global_step": 330732, "epoch": 3984} {"train_loss": -25.94134521484375, "global_step": 330733, "epoch": 3984} {"train_loss": -26.28546142578125, "global_step": 330734, "epoch": 3984} {"train_loss": -26.213184356689453, "global_step": 330735, "epoch": 3984} {"train_loss": -25.982975006103516, "global_step": 330736, "epoch": 3984} {"train_loss": -26.145963668823242, "global_step": 330737, "epoch": 3984} {"train_loss": -25.983606338500977, "global_step": 330738, "epoch": 3984} {"train_loss": -25.903167724609375, "global_step": 330739, "epoch": 3984} {"train_loss": -26.1290340423584, "global_step": 330740, "epoch": 3984} {"train_loss": -25.888227462768555, "global_step": 330741, "epoch": 3984} {"train_loss": -26.15546226501465, "global_step": 330742, "epoch": 3984} {"train_loss": -26.2111873626709, "global_step": 330743, "epoch": 3984} {"train_loss": -25.834400177001953, "global_step": 330744, "epoch": 3984} {"train_loss": -25.712072372436523, "global_step": 330745, "epoch": 3984} {"train_loss": -25.820493698120117, "global_step": 330746, "epoch": 3984} {"train_loss": -26.3612060546875, "global_step": 330747, "epoch": 3984} {"train_loss": -25.81884765625, "global_step": 330748, "epoch": 3984} {"train_loss": -26.08772087097168, "global_step": 330749, "epoch": 3984} {"train_loss": -25.688812255859375, "global_step": 330750, "epoch": 3984} {"train_loss": -25.26109504699707, "global_step": 330751, "epoch": 3984} {"train_loss": -25.092235565185547, "global_step": 330752, "epoch": 3984} {"train_loss": -25.077945709228516, "global_step": 330753, "epoch": 3984} {"train_loss": -25.77593518452472, "global_step": 330754, "epoch": 3984, "val_loss": 7228260.0} {"train_loss": -24.06402587890625, "global_step": 330755, "epoch": 3985} {"train_loss": -24.16701316833496, "global_step": 330756, "epoch": 3985} {"train_loss": -23.937461853027344, "global_step": 330757, "epoch": 3985} {"train_loss": -24.76325798034668, "global_step": 330758, "epoch": 3985} {"train_loss": -24.136558532714844, "global_step": 330759, "epoch": 3985} {"train_loss": -24.758678436279297, "global_step": 330760, "epoch": 3985} {"train_loss": -24.712495803833008, "global_step": 330761, "epoch": 3985} {"train_loss": -24.358983993530273, "global_step": 330762, "epoch": 3985} {"train_loss": -25.116836547851562, "global_step": 330763, "epoch": 3985} {"train_loss": -24.67490005493164, "global_step": 330764, "epoch": 3985} {"train_loss": -24.863859176635742, "global_step": 330765, "epoch": 3985} {"train_loss": -25.002859115600586, "global_step": 330766, "epoch": 3985} {"train_loss": -25.326374053955078, "global_step": 330767, "epoch": 3985} {"train_loss": -24.854345321655273, "global_step": 330768, "epoch": 3985} {"train_loss": -25.144689559936523, "global_step": 330769, "epoch": 3985} {"train_loss": -25.29602813720703, "global_step": 330770, "epoch": 3985} {"train_loss": -24.755422592163086, "global_step": 330771, "epoch": 3985} {"train_loss": -25.483198165893555, "global_step": 330772, "epoch": 3985} {"train_loss": -25.46522331237793, "global_step": 330773, "epoch": 3985} {"train_loss": -25.110580444335938, "global_step": 330774, "epoch": 3985} {"train_loss": -25.330768585205078, "global_step": 330775, "epoch": 3985} {"train_loss": -25.553516387939453, "global_step": 330776, "epoch": 3985} {"train_loss": -25.824661254882812, "global_step": 330777, "epoch": 3985} {"train_loss": -25.77863883972168, "global_step": 330778, "epoch": 3985} {"train_loss": -25.361783981323242, "global_step": 330779, "epoch": 3985} {"train_loss": -25.87457847595215, "global_step": 330780, "epoch": 3985} {"train_loss": -25.465925216674805, "global_step": 330781, "epoch": 3985} {"train_loss": -25.285802841186523, "global_step": 330782, "epoch": 3985} {"train_loss": -25.274892807006836, "global_step": 330783, "epoch": 3985} {"train_loss": -25.816497802734375, "global_step": 330784, "epoch": 3985} {"train_loss": -25.4746150970459, "global_step": 330785, "epoch": 3985} {"train_loss": -25.689496994018555, "global_step": 330786, "epoch": 3985} {"train_loss": -25.808393478393555, "global_step": 330787, "epoch": 3985} {"train_loss": -25.95088005065918, "global_step": 330788, "epoch": 3985} {"train_loss": -26.06829833984375, "global_step": 330789, "epoch": 3985} {"train_loss": -25.557342529296875, "global_step": 330790, "epoch": 3985} {"train_loss": -25.778223037719727, "global_step": 330791, "epoch": 3985} {"train_loss": -25.988325119018555, "global_step": 330792, "epoch": 3985} {"train_loss": -25.771106719970703, "global_step": 330793, "epoch": 3985} {"train_loss": -26.014612197875977, "global_step": 330794, "epoch": 3985} {"train_loss": -26.04070472717285, "global_step": 330795, "epoch": 3985} {"train_loss": -25.88726234436035, "global_step": 330796, "epoch": 3985} {"train_loss": -25.808874130249023, "global_step": 330797, "epoch": 3985} {"train_loss": -25.939416885375977, "global_step": 330798, "epoch": 3985} {"train_loss": -26.054615020751953, "global_step": 330799, "epoch": 3985} {"train_loss": -25.762781143188477, "global_step": 330800, "epoch": 3985} {"train_loss": -26.230838775634766, "global_step": 330801, "epoch": 3985} {"train_loss": -26.190353393554688, "global_step": 330802, "epoch": 3985} {"train_loss": -25.884546279907227, "global_step": 330803, "epoch": 3985} {"train_loss": -26.420795440673828, "global_step": 330804, "epoch": 3985} {"train_loss": -26.247785568237305, "global_step": 330805, "epoch": 3985} {"train_loss": -26.02545738220215, "global_step": 330806, "epoch": 3985} {"train_loss": -25.897476196289062, "global_step": 330807, "epoch": 3985} {"train_loss": -26.10060691833496, "global_step": 330808, "epoch": 3985} {"train_loss": -26.124441146850586, "global_step": 330809, "epoch": 3985} {"train_loss": -25.98542594909668, "global_step": 330810, "epoch": 3985} {"train_loss": -26.157440185546875, "global_step": 330811, "epoch": 3985} {"train_loss": -26.569318771362305, "global_step": 330812, "epoch": 3985} {"train_loss": -25.912057876586914, "global_step": 330813, "epoch": 3985} {"train_loss": -26.225492477416992, "global_step": 330814, "epoch": 3985} {"train_loss": -26.021442413330078, "global_step": 330815, "epoch": 3985} {"train_loss": -26.042098999023438, "global_step": 330816, "epoch": 3985} {"train_loss": -26.66301918029785, "global_step": 330817, "epoch": 3985} {"train_loss": -26.265796661376953, "global_step": 330818, "epoch": 3985} {"train_loss": -25.95172119140625, "global_step": 330819, "epoch": 3985} {"train_loss": -26.00022315979004, "global_step": 330820, "epoch": 3985} {"train_loss": -26.361234664916992, "global_step": 330821, "epoch": 3985} {"train_loss": -26.242908477783203, "global_step": 330822, "epoch": 3985} {"train_loss": -25.973974227905273, "global_step": 330823, "epoch": 3985} {"train_loss": -26.247594833374023, "global_step": 330824, "epoch": 3985} {"train_loss": -25.976842880249023, "global_step": 330825, "epoch": 3985} {"train_loss": -26.234899520874023, "global_step": 330826, "epoch": 3985} {"train_loss": -26.136905670166016, "global_step": 330827, "epoch": 3985} {"train_loss": -26.310409545898438, "global_step": 330828, "epoch": 3985} {"train_loss": -26.106109619140625, "global_step": 330829, "epoch": 3985} {"train_loss": -26.033023834228516, "global_step": 330830, "epoch": 3985} {"train_loss": -25.844451904296875, "global_step": 330831, "epoch": 3985} {"train_loss": -25.385425567626953, "global_step": 330832, "epoch": 3985} {"train_loss": -24.74030876159668, "global_step": 330833, "epoch": 3985} {"train_loss": -24.551523208618164, "global_step": 330834, "epoch": 3985} {"train_loss": -24.215503692626953, "global_step": 330835, "epoch": 3985} {"train_loss": -25.678943634033203, "global_step": 330836, "epoch": 3985} {"train_loss": -25.610965452998517, "global_step": 330837, "epoch": 3985, "val_loss": 7124744.0} {"train_loss": -23.88675880432129, "global_step": 330838, "epoch": 3986} {"train_loss": -23.565397262573242, "global_step": 330839, "epoch": 3986} {"train_loss": -24.065101623535156, "global_step": 330840, "epoch": 3986} {"train_loss": -23.838125228881836, "global_step": 330841, "epoch": 3986} {"train_loss": -24.566696166992188, "global_step": 330842, "epoch": 3986} {"train_loss": -24.591449737548828, "global_step": 330843, "epoch": 3986} {"train_loss": -24.30660057067871, "global_step": 330844, "epoch": 3986} {"train_loss": -24.93791389465332, "global_step": 330845, "epoch": 3986} {"train_loss": -24.09657096862793, "global_step": 330846, "epoch": 3986} {"train_loss": -24.752134323120117, "global_step": 330847, "epoch": 3986} {"train_loss": -25.04886817932129, "global_step": 330848, "epoch": 3986} {"train_loss": -24.904394149780273, "global_step": 330849, "epoch": 3986} {"train_loss": -24.7065372467041, "global_step": 330850, "epoch": 3986} {"train_loss": -24.824277877807617, "global_step": 330851, "epoch": 3986} {"train_loss": -24.799802780151367, "global_step": 330852, "epoch": 3986} {"train_loss": -24.7670841217041, "global_step": 330853, "epoch": 3986} {"train_loss": -25.306621551513672, "global_step": 330854, "epoch": 3986} {"train_loss": -25.160451889038086, "global_step": 330855, "epoch": 3986} {"train_loss": -25.03707504272461, "global_step": 330856, "epoch": 3986} {"train_loss": -25.045257568359375, "global_step": 330857, "epoch": 3986} {"train_loss": -24.84922218322754, "global_step": 330858, "epoch": 3986} {"train_loss": -25.328393936157227, "global_step": 330859, "epoch": 3986} {"train_loss": -25.348569869995117, "global_step": 330860, "epoch": 3986} {"train_loss": -25.2445068359375, "global_step": 330861, "epoch": 3986} {"train_loss": -25.678308486938477, "global_step": 330862, "epoch": 3986} {"train_loss": -25.737173080444336, "global_step": 330863, "epoch": 3986} {"train_loss": -24.92127799987793, "global_step": 330864, "epoch": 3986} {"train_loss": -25.742658615112305, "global_step": 330865, "epoch": 3986} {"train_loss": -25.868295669555664, "global_step": 330866, "epoch": 3986} {"train_loss": -25.484132766723633, "global_step": 330867, "epoch": 3986} {"train_loss": -25.56879997253418, "global_step": 330868, "epoch": 3986} {"train_loss": -25.61882972717285, "global_step": 330869, "epoch": 3986} {"train_loss": -25.569683074951172, "global_step": 330870, "epoch": 3986} {"train_loss": -25.587738037109375, "global_step": 330871, "epoch": 3986} {"train_loss": -25.606109619140625, "global_step": 330872, "epoch": 3986} {"train_loss": -25.47344398498535, "global_step": 330873, "epoch": 3986} {"train_loss": -25.256912231445312, "global_step": 330874, "epoch": 3986} {"train_loss": -25.493528366088867, "global_step": 330875, "epoch": 3986} {"train_loss": -26.090579986572266, "global_step": 330876, "epoch": 3986} {"train_loss": -25.910261154174805, "global_step": 330877, "epoch": 3986} {"train_loss": -25.610645294189453, "global_step": 330878, "epoch": 3986} {"train_loss": -25.784210205078125, "global_step": 330879, "epoch": 3986} {"train_loss": -25.524160385131836, "global_step": 330880, "epoch": 3986} {"train_loss": -25.795547485351562, "global_step": 330881, "epoch": 3986} {"train_loss": -25.971323013305664, "global_step": 330882, "epoch": 3986} {"train_loss": -26.25015640258789, "global_step": 330883, "epoch": 3986} {"train_loss": -25.906116485595703, "global_step": 330884, "epoch": 3986} {"train_loss": -25.450666427612305, "global_step": 330885, "epoch": 3986} {"train_loss": -25.996204376220703, "global_step": 330886, "epoch": 3986} {"train_loss": -25.812774658203125, "global_step": 330887, "epoch": 3986} {"train_loss": -25.500595092773438, "global_step": 330888, "epoch": 3986} {"train_loss": -26.07806396484375, "global_step": 330889, "epoch": 3986} {"train_loss": -26.204931259155273, "global_step": 330890, "epoch": 3986} {"train_loss": -25.821247100830078, "global_step": 330891, "epoch": 3986} {"train_loss": -25.717620849609375, "global_step": 330892, "epoch": 3986} {"train_loss": -25.69461441040039, "global_step": 330893, "epoch": 3986} {"train_loss": -25.98821449279785, "global_step": 330894, "epoch": 3986} {"train_loss": -25.922292709350586, "global_step": 330895, "epoch": 3986} {"train_loss": -25.873580932617188, "global_step": 330896, "epoch": 3986} {"train_loss": -25.940893173217773, "global_step": 330897, "epoch": 3986} {"train_loss": -25.91639518737793, "global_step": 330898, "epoch": 3986} {"train_loss": -25.92890739440918, "global_step": 330899, "epoch": 3986} {"train_loss": -26.19830894470215, "global_step": 330900, "epoch": 3986} {"train_loss": -26.029260635375977, "global_step": 330901, "epoch": 3986} {"train_loss": -25.762632369995117, "global_step": 330902, "epoch": 3986} {"train_loss": -26.301227569580078, "global_step": 330903, "epoch": 3986} {"train_loss": -25.657175064086914, "global_step": 330904, "epoch": 3986} {"train_loss": -25.770490646362305, "global_step": 330905, "epoch": 3986} {"train_loss": -25.834314346313477, "global_step": 330906, "epoch": 3986} {"train_loss": -26.13605308532715, "global_step": 330907, "epoch": 3986} {"train_loss": -25.91092300415039, "global_step": 330908, "epoch": 3986} {"train_loss": -25.827350616455078, "global_step": 330909, "epoch": 3986} {"train_loss": -25.91438102722168, "global_step": 330910, "epoch": 3986} {"train_loss": -26.19815444946289, "global_step": 330911, "epoch": 3986} {"train_loss": -25.979446411132812, "global_step": 330912, "epoch": 3986} {"train_loss": -25.896921157836914, "global_step": 330913, "epoch": 3986} {"train_loss": -25.978534698486328, "global_step": 330914, "epoch": 3986} {"train_loss": -25.586912155151367, "global_step": 330915, "epoch": 3986} {"train_loss": -26.471357345581055, "global_step": 330916, "epoch": 3986} {"train_loss": -25.921920776367188, "global_step": 330917, "epoch": 3986} {"train_loss": -26.07673454284668, "global_step": 330918, "epoch": 3986} {"train_loss": -26.041400909423828, "global_step": 330919, "epoch": 3986} {"train_loss": -25.500227204288343, "global_step": 330920, "epoch": 3986, "val_loss": 7142153.0} {"train_loss": -25.441076278686523, "global_step": 330921, "epoch": 3987} {"train_loss": -25.57708740234375, "global_step": 330922, "epoch": 3987} {"train_loss": -25.662458419799805, "global_step": 330923, "epoch": 3987} {"train_loss": -25.383739471435547, "global_step": 330924, "epoch": 3987} {"train_loss": -25.38374900817871, "global_step": 330925, "epoch": 3987} {"train_loss": -25.424589157104492, "global_step": 330926, "epoch": 3987} {"train_loss": -25.572980880737305, "global_step": 330927, "epoch": 3987} {"train_loss": -26.365854263305664, "global_step": 330928, "epoch": 3987} {"train_loss": -25.8124942779541, "global_step": 330929, "epoch": 3987} {"train_loss": -25.706701278686523, "global_step": 330930, "epoch": 3987} {"train_loss": -25.893178939819336, "global_step": 330931, "epoch": 3987} {"train_loss": -25.715076446533203, "global_step": 330932, "epoch": 3987} {"train_loss": -25.388944625854492, "global_step": 330933, "epoch": 3987} {"train_loss": -25.80840492248535, "global_step": 330934, "epoch": 3987} {"train_loss": -25.68373680114746, "global_step": 330935, "epoch": 3987} {"train_loss": -25.724716186523438, "global_step": 330936, "epoch": 3987} {"train_loss": -25.643096923828125, "global_step": 330937, "epoch": 3987} {"train_loss": -25.762704849243164, "global_step": 330938, "epoch": 3987} {"train_loss": -25.90885353088379, "global_step": 330939, "epoch": 3987} {"train_loss": -25.7646427154541, "global_step": 330940, "epoch": 3987} {"train_loss": -26.116540908813477, "global_step": 330941, "epoch": 3987} {"train_loss": -26.088623046875, "global_step": 330942, "epoch": 3987} {"train_loss": -25.773664474487305, "global_step": 330943, "epoch": 3987} {"train_loss": -26.041547775268555, "global_step": 330944, "epoch": 3987} {"train_loss": -25.978286743164062, "global_step": 330945, "epoch": 3987} {"train_loss": -25.549673080444336, "global_step": 330946, "epoch": 3987} {"train_loss": -25.673980712890625, "global_step": 330947, "epoch": 3987} {"train_loss": -25.70453453063965, "global_step": 330948, "epoch": 3987} {"train_loss": -26.013635635375977, "global_step": 330949, "epoch": 3987} {"train_loss": -26.158517837524414, "global_step": 330950, "epoch": 3987} {"train_loss": -26.12972068786621, "global_step": 330951, "epoch": 3987} {"train_loss": -26.237720489501953, "global_step": 330952, "epoch": 3987} {"train_loss": -26.1340389251709, "global_step": 330953, "epoch": 3987} {"train_loss": -26.09084129333496, "global_step": 330954, "epoch": 3987} {"train_loss": -25.940317153930664, "global_step": 330955, "epoch": 3987} {"train_loss": -26.165210723876953, "global_step": 330956, "epoch": 3987} {"train_loss": -25.989459991455078, "global_step": 330957, "epoch": 3987} {"train_loss": -25.734582901000977, "global_step": 330958, "epoch": 3987} {"train_loss": -25.887781143188477, "global_step": 330959, "epoch": 3987} {"train_loss": -26.432477951049805, "global_step": 330960, "epoch": 3987} {"train_loss": -26.09343910217285, "global_step": 330961, "epoch": 3987} {"train_loss": -26.25824546813965, "global_step": 330962, "epoch": 3987} {"train_loss": -26.054243087768555, "global_step": 330963, "epoch": 3987} {"train_loss": -25.981786727905273, "global_step": 330964, "epoch": 3987} {"train_loss": -25.83017349243164, "global_step": 330965, "epoch": 3987} {"train_loss": -25.9942626953125, "global_step": 330966, "epoch": 3987} {"train_loss": -25.93353843688965, "global_step": 330967, "epoch": 3987} {"train_loss": -26.374805450439453, "global_step": 330968, "epoch": 3987} {"train_loss": -26.1043643951416, "global_step": 330969, "epoch": 3987} {"train_loss": -26.182315826416016, "global_step": 330970, "epoch": 3987} {"train_loss": -26.496557235717773, "global_step": 330971, "epoch": 3987} {"train_loss": -26.20436668395996, "global_step": 330972, "epoch": 3987} {"train_loss": -26.11311912536621, "global_step": 330973, "epoch": 3987} {"train_loss": -26.07718276977539, "global_step": 330974, "epoch": 3987} {"train_loss": -26.1070499420166, "global_step": 330975, "epoch": 3987} {"train_loss": -26.393341064453125, "global_step": 330976, "epoch": 3987} {"train_loss": -26.09944725036621, "global_step": 330977, "epoch": 3987} {"train_loss": -26.105443954467773, "global_step": 330978, "epoch": 3987} {"train_loss": -26.135385513305664, "global_step": 330979, "epoch": 3987} {"train_loss": -26.183149337768555, "global_step": 330980, "epoch": 3987} {"train_loss": -25.930219650268555, "global_step": 330981, "epoch": 3987} {"train_loss": -25.83156394958496, "global_step": 330982, "epoch": 3987} {"train_loss": -25.89668083190918, "global_step": 330983, "epoch": 3987} {"train_loss": -25.74141502380371, "global_step": 330984, "epoch": 3987} {"train_loss": -25.970062255859375, "global_step": 330985, "epoch": 3987} {"train_loss": -26.46055030822754, "global_step": 330986, "epoch": 3987} {"train_loss": -25.87529945373535, "global_step": 330987, "epoch": 3987} {"train_loss": -25.83077049255371, "global_step": 330988, "epoch": 3987} {"train_loss": -26.187625885009766, "global_step": 330989, "epoch": 3987} {"train_loss": -26.054431915283203, "global_step": 330990, "epoch": 3987} {"train_loss": -25.9320068359375, "global_step": 330991, "epoch": 3987} {"train_loss": -26.139057159423828, "global_step": 330992, "epoch": 3987} {"train_loss": -26.302886962890625, "global_step": 330993, "epoch": 3987} {"train_loss": -26.187335968017578, "global_step": 330994, "epoch": 3987} {"train_loss": -26.094863891601562, "global_step": 330995, "epoch": 3987} {"train_loss": -26.453638076782227, "global_step": 330996, "epoch": 3987} {"train_loss": -26.333173751831055, "global_step": 330997, "epoch": 3987} {"train_loss": -26.203779220581055, "global_step": 330998, "epoch": 3987} {"train_loss": -25.916263580322266, "global_step": 330999, "epoch": 3987} {"train_loss": -26.296178817749023, "global_step": 331000, "epoch": 3987} {"train_loss": -26.078998565673828, "global_step": 331001, "epoch": 3987} {"train_loss": -25.942712783813477, "global_step": 331002, "epoch": 3987} {"train_loss": -25.985520305403742, "global_step": 331003, "epoch": 3987, "val_loss": 7248612.0} {"train_loss": -24.19708824157715, "global_step": 331004, "epoch": 3988} {"train_loss": -23.278228759765625, "global_step": 331005, "epoch": 3988} {"train_loss": -23.034549713134766, "global_step": 331006, "epoch": 3988} {"train_loss": -24.085193634033203, "global_step": 331007, "epoch": 3988} {"train_loss": -24.94771385192871, "global_step": 331008, "epoch": 3988} {"train_loss": -24.341337203979492, "global_step": 331009, "epoch": 3988} {"train_loss": -24.82078742980957, "global_step": 331010, "epoch": 3988} {"train_loss": -24.886669158935547, "global_step": 331011, "epoch": 3988} {"train_loss": -24.80402946472168, "global_step": 331012, "epoch": 3988} {"train_loss": -25.07649803161621, "global_step": 331013, "epoch": 3988} {"train_loss": -25.206953048706055, "global_step": 331014, "epoch": 3988} {"train_loss": -24.737226486206055, "global_step": 331015, "epoch": 3988} {"train_loss": -25.056100845336914, "global_step": 331016, "epoch": 3988} {"train_loss": -25.45128059387207, "global_step": 331017, "epoch": 3988} {"train_loss": -25.057065963745117, "global_step": 331018, "epoch": 3988} {"train_loss": -24.93561363220215, "global_step": 331019, "epoch": 3988} {"train_loss": -25.437419891357422, "global_step": 331020, "epoch": 3988} {"train_loss": -24.916433334350586, "global_step": 331021, "epoch": 3988} {"train_loss": -25.08037757873535, "global_step": 331022, "epoch": 3988} {"train_loss": -25.6391544342041, "global_step": 331023, "epoch": 3988} {"train_loss": -25.294586181640625, "global_step": 331024, "epoch": 3988} {"train_loss": -25.558740615844727, "global_step": 331025, "epoch": 3988} {"train_loss": -25.280759811401367, "global_step": 331026, "epoch": 3988} {"train_loss": -25.568986892700195, "global_step": 331027, "epoch": 3988} {"train_loss": -25.63689613342285, "global_step": 331028, "epoch": 3988} {"train_loss": -25.876306533813477, "global_step": 331029, "epoch": 3988} {"train_loss": -25.650238037109375, "global_step": 331030, "epoch": 3988} {"train_loss": -25.708967208862305, "global_step": 331031, "epoch": 3988} {"train_loss": -25.6640682220459, "global_step": 331032, "epoch": 3988} {"train_loss": -25.88551139831543, "global_step": 331033, "epoch": 3988} {"train_loss": -25.554771423339844, "global_step": 331034, "epoch": 3988} {"train_loss": -26.084325790405273, "global_step": 331035, "epoch": 3988} {"train_loss": -25.800378799438477, "global_step": 331036, "epoch": 3988} {"train_loss": -25.8061580657959, "global_step": 331037, "epoch": 3988} {"train_loss": -25.87794303894043, "global_step": 331038, "epoch": 3988} {"train_loss": -25.793170928955078, "global_step": 331039, "epoch": 3988} {"train_loss": -25.757558822631836, "global_step": 331040, "epoch": 3988} {"train_loss": -25.689069747924805, "global_step": 331041, "epoch": 3988} {"train_loss": -25.8472843170166, "global_step": 331042, "epoch": 3988} {"train_loss": -25.811792373657227, "global_step": 331043, "epoch": 3988} {"train_loss": -25.959217071533203, "global_step": 331044, "epoch": 3988} {"train_loss": -25.95515251159668, "global_step": 331045, "epoch": 3988} {"train_loss": -26.311010360717773, "global_step": 331046, "epoch": 3988} {"train_loss": -25.874801635742188, "global_step": 331047, "epoch": 3988} {"train_loss": -26.292373657226562, "global_step": 331048, "epoch": 3988} {"train_loss": -25.927839279174805, "global_step": 331049, "epoch": 3988} {"train_loss": -26.074426651000977, "global_step": 331050, "epoch": 3988} {"train_loss": -25.98883628845215, "global_step": 331051, "epoch": 3988} {"train_loss": -26.270471572875977, "global_step": 331052, "epoch": 3988} {"train_loss": -26.13661003112793, "global_step": 331053, "epoch": 3988} {"train_loss": -26.28998374938965, "global_step": 331054, "epoch": 3988} {"train_loss": -26.18482780456543, "global_step": 331055, "epoch": 3988} {"train_loss": -25.88483238220215, "global_step": 331056, "epoch": 3988} {"train_loss": -25.822021484375, "global_step": 331057, "epoch": 3988} {"train_loss": -25.719058990478516, "global_step": 331058, "epoch": 3988} {"train_loss": -25.91077995300293, "global_step": 331059, "epoch": 3988} {"train_loss": -26.06640625, "global_step": 331060, "epoch": 3988} {"train_loss": -25.70330238342285, "global_step": 331061, "epoch": 3988} {"train_loss": -25.53779411315918, "global_step": 331062, "epoch": 3988} {"train_loss": -25.81439208984375, "global_step": 331063, "epoch": 3988} {"train_loss": -26.048364639282227, "global_step": 331064, "epoch": 3988} {"train_loss": -25.909143447875977, "global_step": 331065, "epoch": 3988} {"train_loss": -25.8494873046875, "global_step": 331066, "epoch": 3988} {"train_loss": -25.82305335998535, "global_step": 331067, "epoch": 3988} {"train_loss": -25.906681060791016, "global_step": 331068, "epoch": 3988} {"train_loss": -26.028461456298828, "global_step": 331069, "epoch": 3988} {"train_loss": -26.161447525024414, "global_step": 331070, "epoch": 3988} {"train_loss": -25.8023681640625, "global_step": 331071, "epoch": 3988} {"train_loss": -26.04679298400879, "global_step": 331072, "epoch": 3988} {"train_loss": -26.175649642944336, "global_step": 331073, "epoch": 3988} {"train_loss": -25.67020034790039, "global_step": 331074, "epoch": 3988} {"train_loss": -26.316059112548828, "global_step": 331075, "epoch": 3988} {"train_loss": -26.140094757080078, "global_step": 331076, "epoch": 3988} {"train_loss": -25.933263778686523, "global_step": 331077, "epoch": 3988} {"train_loss": -25.63165855407715, "global_step": 331078, "epoch": 3988} {"train_loss": -25.90235710144043, "global_step": 331079, "epoch": 3988} {"train_loss": -26.07667350769043, "global_step": 331080, "epoch": 3988} {"train_loss": -26.234540939331055, "global_step": 331081, "epoch": 3988} {"train_loss": -26.294647216796875, "global_step": 331082, "epoch": 3988} {"train_loss": -26.364072799682617, "global_step": 331083, "epoch": 3988} {"train_loss": -26.247777938842773, "global_step": 331084, "epoch": 3988} {"train_loss": -26.072290420532227, "global_step": 331085, "epoch": 3988} {"train_loss": -25.629939757197736, "global_step": 331086, "epoch": 3988, "val_loss": 7250106.5} {"train_loss": -25.134862899780273, "global_step": 331087, "epoch": 3989} {"train_loss": -25.2607364654541, "global_step": 331088, "epoch": 3989} {"train_loss": -25.402414321899414, "global_step": 331089, "epoch": 3989} {"train_loss": -25.027496337890625, "global_step": 331090, "epoch": 3989} {"train_loss": -24.786579132080078, "global_step": 331091, "epoch": 3989} {"train_loss": -25.4910888671875, "global_step": 331092, "epoch": 3989} {"train_loss": -25.4228458404541, "global_step": 331093, "epoch": 3989} {"train_loss": -25.227638244628906, "global_step": 331094, "epoch": 3989} {"train_loss": -25.496891021728516, "global_step": 331095, "epoch": 3989} {"train_loss": -25.3100528717041, "global_step": 331096, "epoch": 3989} {"train_loss": -25.76369285583496, "global_step": 331097, "epoch": 3989} {"train_loss": -25.391538619995117, "global_step": 331098, "epoch": 3989} {"train_loss": -25.796300888061523, "global_step": 331099, "epoch": 3989} {"train_loss": -25.42407989501953, "global_step": 331100, "epoch": 3989} {"train_loss": -25.485450744628906, "global_step": 331101, "epoch": 3989} {"train_loss": -25.248857498168945, "global_step": 331102, "epoch": 3989} {"train_loss": -25.78336524963379, "global_step": 331103, "epoch": 3989} {"train_loss": -25.785938262939453, "global_step": 331104, "epoch": 3989} {"train_loss": -26.040512084960938, "global_step": 331105, "epoch": 3989} {"train_loss": -25.668598175048828, "global_step": 331106, "epoch": 3989} {"train_loss": -25.705322265625, "global_step": 331107, "epoch": 3989} {"train_loss": -25.477346420288086, "global_step": 331108, "epoch": 3989} {"train_loss": -25.856983184814453, "global_step": 331109, "epoch": 3989} {"train_loss": -25.81149673461914, "global_step": 331110, "epoch": 3989} {"train_loss": -25.649133682250977, "global_step": 331111, "epoch": 3989} {"train_loss": -25.931232452392578, "global_step": 331112, "epoch": 3989} {"train_loss": -26.19523048400879, "global_step": 331113, "epoch": 3989} {"train_loss": -26.00831413269043, "global_step": 331114, "epoch": 3989} {"train_loss": -25.645278930664062, "global_step": 331115, "epoch": 3989} {"train_loss": -25.665563583374023, "global_step": 331116, "epoch": 3989} {"train_loss": -25.997791290283203, "global_step": 331117, "epoch": 3989} {"train_loss": -26.28889274597168, "global_step": 331118, "epoch": 3989} {"train_loss": -25.72224235534668, "global_step": 331119, "epoch": 3989} {"train_loss": -26.12005615234375, "global_step": 331120, "epoch": 3989} {"train_loss": -25.860517501831055, "global_step": 331121, "epoch": 3989} {"train_loss": -26.056970596313477, "global_step": 331122, "epoch": 3989} {"train_loss": -26.096466064453125, "global_step": 331123, "epoch": 3989} {"train_loss": -25.9537296295166, "global_step": 331124, "epoch": 3989} {"train_loss": -25.57422637939453, "global_step": 331125, "epoch": 3989} {"train_loss": -25.668561935424805, "global_step": 331126, "epoch": 3989} {"train_loss": -26.263158798217773, "global_step": 331127, "epoch": 3989} {"train_loss": -25.73091697692871, "global_step": 331128, "epoch": 3989} {"train_loss": -26.400653839111328, "global_step": 331129, "epoch": 3989} {"train_loss": -26.39057731628418, "global_step": 331130, "epoch": 3989} {"train_loss": -25.89747428894043, "global_step": 331131, "epoch": 3989} {"train_loss": -26.0854434967041, "global_step": 331132, "epoch": 3989} {"train_loss": -26.09980583190918, "global_step": 331133, "epoch": 3989} {"train_loss": -26.267963409423828, "global_step": 331134, "epoch": 3989} {"train_loss": -26.347187042236328, "global_step": 331135, "epoch": 3989} {"train_loss": -25.979618072509766, "global_step": 331136, "epoch": 3989} {"train_loss": -26.03565788269043, "global_step": 331137, "epoch": 3989} {"train_loss": -26.217138290405273, "global_step": 331138, "epoch": 3989} {"train_loss": -25.82940101623535, "global_step": 331139, "epoch": 3989} {"train_loss": -26.416431427001953, "global_step": 331140, "epoch": 3989} {"train_loss": -26.1208438873291, "global_step": 331141, "epoch": 3989} {"train_loss": -26.449859619140625, "global_step": 331142, "epoch": 3989} {"train_loss": -25.96302604675293, "global_step": 331143, "epoch": 3989} {"train_loss": -25.9963321685791, "global_step": 331144, "epoch": 3989} {"train_loss": -25.98798179626465, "global_step": 331145, "epoch": 3989} {"train_loss": -26.037939071655273, "global_step": 331146, "epoch": 3989} {"train_loss": -26.107961654663086, "global_step": 331147, "epoch": 3989} {"train_loss": -25.958377838134766, "global_step": 331148, "epoch": 3989} {"train_loss": -25.9482421875, "global_step": 331149, "epoch": 3989} {"train_loss": -25.641088485717773, "global_step": 331150, "epoch": 3989} {"train_loss": -25.39775276184082, "global_step": 331151, "epoch": 3989} {"train_loss": -25.93348503112793, "global_step": 331152, "epoch": 3989} {"train_loss": -26.256256103515625, "global_step": 331153, "epoch": 3989} {"train_loss": -25.93397331237793, "global_step": 331154, "epoch": 3989} {"train_loss": -25.761688232421875, "global_step": 331155, "epoch": 3989} {"train_loss": -25.786176681518555, "global_step": 331156, "epoch": 3989} {"train_loss": -26.124897003173828, "global_step": 331157, "epoch": 3989} {"train_loss": -25.897207260131836, "global_step": 331158, "epoch": 3989} {"train_loss": -25.798765182495117, "global_step": 331159, "epoch": 3989} {"train_loss": -25.870695114135742, "global_step": 331160, "epoch": 3989} {"train_loss": -25.837446212768555, "global_step": 331161, "epoch": 3989} {"train_loss": -25.784887313842773, "global_step": 331162, "epoch": 3989} {"train_loss": -26.161136627197266, "global_step": 331163, "epoch": 3989} {"train_loss": -25.932525634765625, "global_step": 331164, "epoch": 3989} {"train_loss": -26.046817779541016, "global_step": 331165, "epoch": 3989} {"train_loss": -25.94705581665039, "global_step": 331166, "epoch": 3989} {"train_loss": -26.026960372924805, "global_step": 331167, "epoch": 3989} {"train_loss": -26.08673667907715, "global_step": 331168, "epoch": 3989} {"train_loss": -25.858699798583984, "global_step": 331169, "epoch": 3989, "val_loss": 7231748.0} {"train_loss": -25.521015167236328, "global_step": 331170, "epoch": 3990} {"train_loss": -25.56182289123535, "global_step": 331171, "epoch": 3990} {"train_loss": -25.9001407623291, "global_step": 331172, "epoch": 3990} {"train_loss": -25.781583786010742, "global_step": 331173, "epoch": 3990} {"train_loss": -25.718326568603516, "global_step": 331174, "epoch": 3990} {"train_loss": -25.782150268554688, "global_step": 331175, "epoch": 3990} {"train_loss": -25.600683212280273, "global_step": 331176, "epoch": 3990} {"train_loss": -25.982080459594727, "global_step": 331177, "epoch": 3990} {"train_loss": -25.843311309814453, "global_step": 331178, "epoch": 3990} {"train_loss": -25.857208251953125, "global_step": 331179, "epoch": 3990} {"train_loss": -25.690185546875, "global_step": 331180, "epoch": 3990} {"train_loss": -26.028310775756836, "global_step": 331181, "epoch": 3990} {"train_loss": -26.28570556640625, "global_step": 331182, "epoch": 3990} {"train_loss": -26.503097534179688, "global_step": 331183, "epoch": 3990} {"train_loss": -25.708209991455078, "global_step": 331184, "epoch": 3990} {"train_loss": -25.680917739868164, "global_step": 331185, "epoch": 3990} {"train_loss": -25.85047721862793, "global_step": 331186, "epoch": 3990} {"train_loss": -26.041839599609375, "global_step": 331187, "epoch": 3990} {"train_loss": -25.880712509155273, "global_step": 331188, "epoch": 3990} {"train_loss": -25.844324111938477, "global_step": 331189, "epoch": 3990} {"train_loss": -25.93531608581543, "global_step": 331190, "epoch": 3990} {"train_loss": -25.638471603393555, "global_step": 331191, "epoch": 3990} {"train_loss": -25.91932487487793, "global_step": 331192, "epoch": 3990} {"train_loss": -25.84956932067871, "global_step": 331193, "epoch": 3990} {"train_loss": -25.8782901763916, "global_step": 331194, "epoch": 3990} {"train_loss": -25.7562198638916, "global_step": 331195, "epoch": 3990} {"train_loss": -25.661376953125, "global_step": 331196, "epoch": 3990} {"train_loss": -26.099700927734375, "global_step": 331197, "epoch": 3990} {"train_loss": -25.812854766845703, "global_step": 331198, "epoch": 3990} {"train_loss": -25.939374923706055, "global_step": 331199, "epoch": 3990} {"train_loss": -26.09109878540039, "global_step": 331200, "epoch": 3990} {"train_loss": -26.08941650390625, "global_step": 331201, "epoch": 3990} {"train_loss": -25.597545623779297, "global_step": 331202, "epoch": 3990} {"train_loss": -25.976224899291992, "global_step": 331203, "epoch": 3990} {"train_loss": -26.163467407226562, "global_step": 331204, "epoch": 3990} {"train_loss": -25.707233428955078, "global_step": 331205, "epoch": 3990} {"train_loss": -26.470428466796875, "global_step": 331206, "epoch": 3990} {"train_loss": -26.090377807617188, "global_step": 331207, "epoch": 3990} {"train_loss": -26.111120223999023, "global_step": 331208, "epoch": 3990} {"train_loss": -25.477920532226562, "global_step": 331209, "epoch": 3990} {"train_loss": -26.086414337158203, "global_step": 331210, "epoch": 3990} {"train_loss": -25.77779197692871, "global_step": 331211, "epoch": 3990} {"train_loss": -25.866003036499023, "global_step": 331212, "epoch": 3990} {"train_loss": -25.756711959838867, "global_step": 331213, "epoch": 3990} {"train_loss": -26.118101119995117, "global_step": 331214, "epoch": 3990} {"train_loss": -25.735137939453125, "global_step": 331215, "epoch": 3990} {"train_loss": -25.950794219970703, "global_step": 331216, "epoch": 3990} {"train_loss": -25.925092697143555, "global_step": 331217, "epoch": 3990} {"train_loss": -26.2070255279541, "global_step": 331218, "epoch": 3990} {"train_loss": -26.201175689697266, "global_step": 331219, "epoch": 3990} {"train_loss": -25.97947120666504, "global_step": 331220, "epoch": 3990} {"train_loss": -26.078643798828125, "global_step": 331221, "epoch": 3990} {"train_loss": -26.11756706237793, "global_step": 331222, "epoch": 3990} {"train_loss": -26.26717185974121, "global_step": 331223, "epoch": 3990} {"train_loss": -26.040014266967773, "global_step": 331224, "epoch": 3990} {"train_loss": -26.105335235595703, "global_step": 331225, "epoch": 3990} {"train_loss": -25.73322105407715, "global_step": 331226, "epoch": 3990} {"train_loss": -26.45290184020996, "global_step": 331227, "epoch": 3990} {"train_loss": -26.13435935974121, "global_step": 331228, "epoch": 3990} {"train_loss": -26.1218318939209, "global_step": 331229, "epoch": 3990} {"train_loss": -26.13343620300293, "global_step": 331230, "epoch": 3990} {"train_loss": -26.324665069580078, "global_step": 331231, "epoch": 3990} {"train_loss": -26.168970108032227, "global_step": 331232, "epoch": 3990} {"train_loss": -26.14533805847168, "global_step": 331233, "epoch": 3990} {"train_loss": -26.13227653503418, "global_step": 331234, "epoch": 3990} {"train_loss": -26.18665885925293, "global_step": 331235, "epoch": 3990} {"train_loss": -26.09552574157715, "global_step": 331236, "epoch": 3990} {"train_loss": -25.917470932006836, "global_step": 331237, "epoch": 3990} {"train_loss": -25.817785263061523, "global_step": 331238, "epoch": 3990} {"train_loss": -26.2282772064209, "global_step": 331239, "epoch": 3990} {"train_loss": -25.820215225219727, "global_step": 331240, "epoch": 3990} {"train_loss": -25.67963218688965, "global_step": 331241, "epoch": 3990} {"train_loss": -26.2366886138916, "global_step": 331242, "epoch": 3990} {"train_loss": -25.471179962158203, "global_step": 331243, "epoch": 3990} {"train_loss": -25.418167114257812, "global_step": 331244, "epoch": 3990} {"train_loss": -25.918975830078125, "global_step": 331245, "epoch": 3990} {"train_loss": -25.4508056640625, "global_step": 331246, "epoch": 3990} {"train_loss": -25.103199005126953, "global_step": 331247, "epoch": 3990} {"train_loss": -25.40742301940918, "global_step": 331248, "epoch": 3990} {"train_loss": -26.144378662109375, "global_step": 331249, "epoch": 3990} {"train_loss": -25.098230361938477, "global_step": 331250, "epoch": 3990} {"train_loss": -25.07660675048828, "global_step": 331251, "epoch": 3990} {"train_loss": -25.908530890223492, "global_step": 331252, "epoch": 3990, "val_loss": 7076226.0} {"train_loss": -25.100095748901367, "global_step": 331253, "epoch": 3991} {"train_loss": -25.4888916015625, "global_step": 331254, "epoch": 3991} {"train_loss": -25.10898780822754, "global_step": 331255, "epoch": 3991} {"train_loss": -25.76824951171875, "global_step": 331256, "epoch": 3991} {"train_loss": -25.33660888671875, "global_step": 331257, "epoch": 3991} {"train_loss": -25.504743576049805, "global_step": 331258, "epoch": 3991} {"train_loss": -25.624860763549805, "global_step": 331259, "epoch": 3991} {"train_loss": -25.27923011779785, "global_step": 331260, "epoch": 3991} {"train_loss": -25.34706687927246, "global_step": 331261, "epoch": 3991} {"train_loss": -25.120197296142578, "global_step": 331262, "epoch": 3991} {"train_loss": -25.736825942993164, "global_step": 331263, "epoch": 3991} {"train_loss": -25.43089485168457, "global_step": 331264, "epoch": 3991} {"train_loss": -25.478239059448242, "global_step": 331265, "epoch": 3991} {"train_loss": -25.324996948242188, "global_step": 331266, "epoch": 3991} {"train_loss": -25.6280517578125, "global_step": 331267, "epoch": 3991} {"train_loss": -25.453813552856445, "global_step": 331268, "epoch": 3991} {"train_loss": -25.91693687438965, "global_step": 331269, "epoch": 3991} {"train_loss": -25.330678939819336, "global_step": 331270, "epoch": 3991} {"train_loss": -25.908349990844727, "global_step": 331271, "epoch": 3991} {"train_loss": -25.612228393554688, "global_step": 331272, "epoch": 3991} {"train_loss": -25.743305206298828, "global_step": 331273, "epoch": 3991} {"train_loss": -25.875104904174805, "global_step": 331274, "epoch": 3991} {"train_loss": -25.76154899597168, "global_step": 331275, "epoch": 3991} {"train_loss": -25.503501892089844, "global_step": 331276, "epoch": 3991} {"train_loss": -25.95070457458496, "global_step": 331277, "epoch": 3991} {"train_loss": -25.725635528564453, "global_step": 331278, "epoch": 3991} {"train_loss": -25.5384521484375, "global_step": 331279, "epoch": 3991} {"train_loss": -25.655553817749023, "global_step": 331280, "epoch": 3991} {"train_loss": -26.17205810546875, "global_step": 331281, "epoch": 3991} {"train_loss": -26.20722007751465, "global_step": 331282, "epoch": 3991} {"train_loss": -25.549774169921875, "global_step": 331283, "epoch": 3991} {"train_loss": -25.808746337890625, "global_step": 331284, "epoch": 3991} {"train_loss": -25.79762077331543, "global_step": 331285, "epoch": 3991} {"train_loss": -25.792646408081055, "global_step": 331286, "epoch": 3991} {"train_loss": -26.056875228881836, "global_step": 331287, "epoch": 3991} {"train_loss": -26.276647567749023, "global_step": 331288, "epoch": 3991} {"train_loss": -26.19888687133789, "global_step": 331289, "epoch": 3991} {"train_loss": -25.743314743041992, "global_step": 331290, "epoch": 3991} {"train_loss": -25.945478439331055, "global_step": 331291, "epoch": 3991} {"train_loss": -26.28712272644043, "global_step": 331292, "epoch": 3991} {"train_loss": -26.164331436157227, "global_step": 331293, "epoch": 3991} {"train_loss": -25.735132217407227, "global_step": 331294, "epoch": 3991} {"train_loss": -26.279077529907227, "global_step": 331295, "epoch": 3991} {"train_loss": -26.25884437561035, "global_step": 331296, "epoch": 3991} {"train_loss": -25.815082550048828, "global_step": 331297, "epoch": 3991} {"train_loss": -25.934179306030273, "global_step": 331298, "epoch": 3991} {"train_loss": -26.1751766204834, "global_step": 331299, "epoch": 3991} {"train_loss": -26.153684616088867, "global_step": 331300, "epoch": 3991} {"train_loss": -26.275304794311523, "global_step": 331301, "epoch": 3991} {"train_loss": -26.134979248046875, "global_step": 331302, "epoch": 3991} {"train_loss": -25.788360595703125, "global_step": 331303, "epoch": 3991} {"train_loss": -26.728239059448242, "global_step": 331304, "epoch": 3991} {"train_loss": -26.298871994018555, "global_step": 331305, "epoch": 3991} {"train_loss": -26.024038314819336, "global_step": 331306, "epoch": 3991} {"train_loss": -26.354413986206055, "global_step": 331307, "epoch": 3991} {"train_loss": -25.937498092651367, "global_step": 331308, "epoch": 3991} {"train_loss": -26.175851821899414, "global_step": 331309, "epoch": 3991} {"train_loss": -26.16449546813965, "global_step": 331310, "epoch": 3991} {"train_loss": -26.0029354095459, "global_step": 331311, "epoch": 3991} {"train_loss": -26.296707153320312, "global_step": 331312, "epoch": 3991} {"train_loss": -26.27920913696289, "global_step": 331313, "epoch": 3991} {"train_loss": -26.4814395904541, "global_step": 331314, "epoch": 3991} {"train_loss": -26.2501163482666, "global_step": 331315, "epoch": 3991} {"train_loss": -25.907270431518555, "global_step": 331316, "epoch": 3991} {"train_loss": -25.98479652404785, "global_step": 331317, "epoch": 3991} {"train_loss": -26.122888565063477, "global_step": 331318, "epoch": 3991} {"train_loss": -26.134723663330078, "global_step": 331319, "epoch": 3991} {"train_loss": -26.08982276916504, "global_step": 331320, "epoch": 3991} {"train_loss": -25.80034828186035, "global_step": 331321, "epoch": 3991} {"train_loss": -25.714344024658203, "global_step": 331322, "epoch": 3991} {"train_loss": -25.67689323425293, "global_step": 331323, "epoch": 3991} {"train_loss": -25.399377822875977, "global_step": 331324, "epoch": 3991} {"train_loss": -26.06369400024414, "global_step": 331325, "epoch": 3991} {"train_loss": -26.355640411376953, "global_step": 331326, "epoch": 3991} {"train_loss": -25.970657348632812, "global_step": 331327, "epoch": 3991} {"train_loss": -26.08167839050293, "global_step": 331328, "epoch": 3991} {"train_loss": -26.48583984375, "global_step": 331329, "epoch": 3991} {"train_loss": -26.212244033813477, "global_step": 331330, "epoch": 3991} {"train_loss": -25.5867977142334, "global_step": 331331, "epoch": 3991} {"train_loss": -25.876752853393555, "global_step": 331332, "epoch": 3991} {"train_loss": -26.33237075805664, "global_step": 331333, "epoch": 3991} {"train_loss": -26.0737361907959, "global_step": 331334, "epoch": 3991} {"train_loss": -25.881158507013897, "global_step": 331335, "epoch": 3991, "val_loss": 7175403.0} {"train_loss": -25.622913360595703, "global_step": 331336, "epoch": 3992} {"train_loss": -25.553882598876953, "global_step": 331337, "epoch": 3992} {"train_loss": -25.721723556518555, "global_step": 331338, "epoch": 3992} {"train_loss": -25.633441925048828, "global_step": 331339, "epoch": 3992} {"train_loss": -25.82146644592285, "global_step": 331340, "epoch": 3992} {"train_loss": -25.6389102935791, "global_step": 331341, "epoch": 3992} {"train_loss": -25.897933959960938, "global_step": 331342, "epoch": 3992} {"train_loss": -25.707563400268555, "global_step": 331343, "epoch": 3992} {"train_loss": -25.8050594329834, "global_step": 331344, "epoch": 3992} {"train_loss": -25.339862823486328, "global_step": 331345, "epoch": 3992} {"train_loss": -25.841291427612305, "global_step": 331346, "epoch": 3992} {"train_loss": -25.818220138549805, "global_step": 331347, "epoch": 3992} {"train_loss": -25.999347686767578, "global_step": 331348, "epoch": 3992} {"train_loss": -25.843658447265625, "global_step": 331349, "epoch": 3992} {"train_loss": -25.439794540405273, "global_step": 331350, "epoch": 3992} {"train_loss": -25.916580200195312, "global_step": 331351, "epoch": 3992} {"train_loss": -25.59092903137207, "global_step": 331352, "epoch": 3992} {"train_loss": -25.72531509399414, "global_step": 331353, "epoch": 3992} {"train_loss": -25.8310489654541, "global_step": 331354, "epoch": 3992} {"train_loss": -25.68927001953125, "global_step": 331355, "epoch": 3992} {"train_loss": -26.01763343811035, "global_step": 331356, "epoch": 3992} {"train_loss": -26.089879989624023, "global_step": 331357, "epoch": 3992} {"train_loss": -25.80632972717285, "global_step": 331358, "epoch": 3992} {"train_loss": -25.67683219909668, "global_step": 331359, "epoch": 3992} {"train_loss": -26.03631019592285, "global_step": 331360, "epoch": 3992} {"train_loss": -26.11673355102539, "global_step": 331361, "epoch": 3992} {"train_loss": -26.1712703704834, "global_step": 331362, "epoch": 3992} {"train_loss": -25.9342041015625, "global_step": 331363, "epoch": 3992} {"train_loss": -25.78131103515625, "global_step": 331364, "epoch": 3992} {"train_loss": -26.188074111938477, "global_step": 331365, "epoch": 3992} {"train_loss": -26.37952995300293, "global_step": 331366, "epoch": 3992} {"train_loss": -25.957868576049805, "global_step": 331367, "epoch": 3992} {"train_loss": -26.323883056640625, "global_step": 331368, "epoch": 3992} {"train_loss": -26.07391929626465, "global_step": 331369, "epoch": 3992} {"train_loss": -26.374052047729492, "global_step": 331370, "epoch": 3992} {"train_loss": -26.07392692565918, "global_step": 331371, "epoch": 3992} {"train_loss": -26.07398796081543, "global_step": 331372, "epoch": 3992} {"train_loss": -26.1922607421875, "global_step": 331373, "epoch": 3992} {"train_loss": -25.9699649810791, "global_step": 331374, "epoch": 3992} {"train_loss": -25.942138671875, "global_step": 331375, "epoch": 3992} {"train_loss": -26.3657283782959, "global_step": 331376, "epoch": 3992} {"train_loss": -26.12347412109375, "global_step": 331377, "epoch": 3992} {"train_loss": -25.889373779296875, "global_step": 331378, "epoch": 3992} {"train_loss": -26.02411460876465, "global_step": 331379, "epoch": 3992} {"train_loss": -25.992176055908203, "global_step": 331380, "epoch": 3992} {"train_loss": -26.576711654663086, "global_step": 331381, "epoch": 3992} {"train_loss": -26.001983642578125, "global_step": 331382, "epoch": 3992} {"train_loss": -26.070188522338867, "global_step": 331383, "epoch": 3992} {"train_loss": -25.294391632080078, "global_step": 331384, "epoch": 3992} {"train_loss": -25.954669952392578, "global_step": 331385, "epoch": 3992} {"train_loss": -25.743314743041992, "global_step": 331386, "epoch": 3992} {"train_loss": -26.298791885375977, "global_step": 331387, "epoch": 3992} {"train_loss": -25.6687068939209, "global_step": 331388, "epoch": 3992} {"train_loss": -25.753116607666016, "global_step": 331389, "epoch": 3992} {"train_loss": -25.806543350219727, "global_step": 331390, "epoch": 3992} {"train_loss": -25.9134521484375, "global_step": 331391, "epoch": 3992} {"train_loss": -25.91193962097168, "global_step": 331392, "epoch": 3992} {"train_loss": -25.942581176757812, "global_step": 331393, "epoch": 3992} {"train_loss": -26.254425048828125, "global_step": 331394, "epoch": 3992} {"train_loss": -25.829681396484375, "global_step": 331395, "epoch": 3992} {"train_loss": -25.73752784729004, "global_step": 331396, "epoch": 3992} {"train_loss": -26.23076820373535, "global_step": 331397, "epoch": 3992} {"train_loss": -25.506162643432617, "global_step": 331398, "epoch": 3992} {"train_loss": -25.868513107299805, "global_step": 331399, "epoch": 3992} {"train_loss": -25.86286735534668, "global_step": 331400, "epoch": 3992} {"train_loss": -25.7430419921875, "global_step": 331401, "epoch": 3992} {"train_loss": -25.817224502563477, "global_step": 331402, "epoch": 3992} {"train_loss": -26.202665328979492, "global_step": 331403, "epoch": 3992} {"train_loss": -25.948104858398438, "global_step": 331404, "epoch": 3992} {"train_loss": -25.982114791870117, "global_step": 331405, "epoch": 3992} {"train_loss": -26.1197452545166, "global_step": 331406, "epoch": 3992} {"train_loss": -26.132360458374023, "global_step": 331407, "epoch": 3992} {"train_loss": -26.025470733642578, "global_step": 331408, "epoch": 3992} {"train_loss": -26.11676025390625, "global_step": 331409, "epoch": 3992} {"train_loss": -25.80799674987793, "global_step": 331410, "epoch": 3992} {"train_loss": -26.448715209960938, "global_step": 331411, "epoch": 3992} {"train_loss": -26.23785972595215, "global_step": 331412, "epoch": 3992} {"train_loss": -25.80838394165039, "global_step": 331413, "epoch": 3992} {"train_loss": -25.976547241210938, "global_step": 331414, "epoch": 3992} {"train_loss": -26.049406051635742, "global_step": 331415, "epoch": 3992} {"train_loss": -25.7929630279541, "global_step": 331416, "epoch": 3992} {"train_loss": -25.821802139282227, "global_step": 331417, "epoch": 3992} {"train_loss": -25.936963736292828, "global_step": 331418, "epoch": 3992, "val_loss": 7161832.0} {"train_loss": -24.48797035217285, "global_step": 331419, "epoch": 3993} {"train_loss": -25.250600814819336, "global_step": 331420, "epoch": 3993} {"train_loss": -25.72340202331543, "global_step": 331421, "epoch": 3993} {"train_loss": -25.20467185974121, "global_step": 331422, "epoch": 3993} {"train_loss": -25.869943618774414, "global_step": 331423, "epoch": 3993} {"train_loss": -25.645965576171875, "global_step": 331424, "epoch": 3993} {"train_loss": -26.189685821533203, "global_step": 331425, "epoch": 3993} {"train_loss": -25.68729019165039, "global_step": 331426, "epoch": 3993} {"train_loss": -26.01016616821289, "global_step": 331427, "epoch": 3993} {"train_loss": -25.655792236328125, "global_step": 331428, "epoch": 3993} {"train_loss": -25.828414916992188, "global_step": 331429, "epoch": 3993} {"train_loss": -25.5327205657959, "global_step": 331430, "epoch": 3993} {"train_loss": -25.68558692932129, "global_step": 331431, "epoch": 3993} {"train_loss": -25.6892147064209, "global_step": 331432, "epoch": 3993} {"train_loss": -25.994237899780273, "global_step": 331433, "epoch": 3993} {"train_loss": -25.96466636657715, "global_step": 331434, "epoch": 3993} {"train_loss": -25.671405792236328, "global_step": 331435, "epoch": 3993} {"train_loss": -25.70576286315918, "global_step": 331436, "epoch": 3993} {"train_loss": -26.0152645111084, "global_step": 331437, "epoch": 3993} {"train_loss": -25.648740768432617, "global_step": 331438, "epoch": 3993} {"train_loss": -26.055912017822266, "global_step": 331439, "epoch": 3993} {"train_loss": -25.610010147094727, "global_step": 331440, "epoch": 3993} {"train_loss": -26.039871215820312, "global_step": 331441, "epoch": 3993} {"train_loss": -25.567216873168945, "global_step": 331442, "epoch": 3993} {"train_loss": -26.155929565429688, "global_step": 331443, "epoch": 3993} {"train_loss": -26.120100021362305, "global_step": 331444, "epoch": 3993} {"train_loss": -26.06741714477539, "global_step": 331445, "epoch": 3993} {"train_loss": -26.035079956054688, "global_step": 331446, "epoch": 3993} {"train_loss": -25.707305908203125, "global_step": 331447, "epoch": 3993} {"train_loss": -25.765058517456055, "global_step": 331448, "epoch": 3993} {"train_loss": -26.122106552124023, "global_step": 331449, "epoch": 3993} {"train_loss": -25.971094131469727, "global_step": 331450, "epoch": 3993} {"train_loss": -25.961210250854492, "global_step": 331451, "epoch": 3993} {"train_loss": -25.764577865600586, "global_step": 331452, "epoch": 3993} {"train_loss": -25.8966007232666, "global_step": 331453, "epoch": 3993} {"train_loss": -25.985000610351562, "global_step": 331454, "epoch": 3993} {"train_loss": -25.7490234375, "global_step": 331455, "epoch": 3993} {"train_loss": -26.057668685913086, "global_step": 331456, "epoch": 3993} {"train_loss": -26.160938262939453, "global_step": 331457, "epoch": 3993} {"train_loss": -26.30549430847168, "global_step": 331458, "epoch": 3993} {"train_loss": -25.820138931274414, "global_step": 331459, "epoch": 3993} {"train_loss": -26.072452545166016, "global_step": 331460, "epoch": 3993} {"train_loss": -26.133893966674805, "global_step": 331461, "epoch": 3993} {"train_loss": -26.359546661376953, "global_step": 331462, "epoch": 3993} {"train_loss": -26.045684814453125, "global_step": 331463, "epoch": 3993} {"train_loss": -26.068017959594727, "global_step": 331464, "epoch": 3993} {"train_loss": -26.004377365112305, "global_step": 331465, "epoch": 3993} {"train_loss": -25.82631492614746, "global_step": 331466, "epoch": 3993} {"train_loss": -26.04339027404785, "global_step": 331467, "epoch": 3993} {"train_loss": -26.034902572631836, "global_step": 331468, "epoch": 3993} {"train_loss": -25.93402099609375, "global_step": 331469, "epoch": 3993} {"train_loss": -26.22344398498535, "global_step": 331470, "epoch": 3993} {"train_loss": -26.02924156188965, "global_step": 331471, "epoch": 3993} {"train_loss": -26.194849014282227, "global_step": 331472, "epoch": 3993} {"train_loss": -26.0034236907959, "global_step": 331473, "epoch": 3993} {"train_loss": -26.05804443359375, "global_step": 331474, "epoch": 3993} {"train_loss": -25.88736915588379, "global_step": 331475, "epoch": 3993} {"train_loss": -26.19657325744629, "global_step": 331476, "epoch": 3993} {"train_loss": -25.92742347717285, "global_step": 331477, "epoch": 3993} {"train_loss": -26.09339714050293, "global_step": 331478, "epoch": 3993} {"train_loss": -25.9177303314209, "global_step": 331479, "epoch": 3993} {"train_loss": -25.75345802307129, "global_step": 331480, "epoch": 3993} {"train_loss": -25.76747703552246, "global_step": 331481, "epoch": 3993} {"train_loss": -26.0336856842041, "global_step": 331482, "epoch": 3993} {"train_loss": -25.7908878326416, "global_step": 331483, "epoch": 3993} {"train_loss": -25.674789428710938, "global_step": 331484, "epoch": 3993} {"train_loss": -26.20001220703125, "global_step": 331485, "epoch": 3993} {"train_loss": -26.007802963256836, "global_step": 331486, "epoch": 3993} {"train_loss": -25.934711456298828, "global_step": 331487, "epoch": 3993} {"train_loss": -25.989561080932617, "global_step": 331488, "epoch": 3993} {"train_loss": -26.198896408081055, "global_step": 331489, "epoch": 3993} {"train_loss": -26.3063907623291, "global_step": 331490, "epoch": 3993} {"train_loss": -26.078643798828125, "global_step": 331491, "epoch": 3993} {"train_loss": -26.034259796142578, "global_step": 331492, "epoch": 3993} {"train_loss": -26.077184677124023, "global_step": 331493, "epoch": 3993} {"train_loss": -25.791486740112305, "global_step": 331494, "epoch": 3993} {"train_loss": -26.56159782409668, "global_step": 331495, "epoch": 3993} {"train_loss": -25.776891708374023, "global_step": 331496, "epoch": 3993} {"train_loss": -25.63602638244629, "global_step": 331497, "epoch": 3993} {"train_loss": -25.317262649536133, "global_step": 331498, "epoch": 3993} {"train_loss": -26.284610748291016, "global_step": 331499, "epoch": 3993} {"train_loss": -25.552751541137695, "global_step": 331500, "epoch": 3993} {"train_loss": -25.91281755286527, "global_step": 331501, "epoch": 3993, "val_loss": 7083037.0} {"train_loss": -25.123748779296875, "global_step": 331502, "epoch": 3994} {"train_loss": -24.87598419189453, "global_step": 331503, "epoch": 3994} {"train_loss": -24.672794342041016, "global_step": 331504, "epoch": 3994} {"train_loss": -24.6727352142334, "global_step": 331505, "epoch": 3994} {"train_loss": -25.211620330810547, "global_step": 331506, "epoch": 3994} {"train_loss": -25.1654052734375, "global_step": 331507, "epoch": 3994} {"train_loss": -25.331985473632812, "global_step": 331508, "epoch": 3994} {"train_loss": -25.4935245513916, "global_step": 331509, "epoch": 3994} {"train_loss": -25.560876846313477, "global_step": 331510, "epoch": 3994} {"train_loss": -25.03659439086914, "global_step": 331511, "epoch": 3994} {"train_loss": -25.416101455688477, "global_step": 331512, "epoch": 3994} {"train_loss": -25.321430206298828, "global_step": 331513, "epoch": 3994} {"train_loss": -25.438251495361328, "global_step": 331514, "epoch": 3994} {"train_loss": -25.7088623046875, "global_step": 331515, "epoch": 3994} {"train_loss": -25.659320831298828, "global_step": 331516, "epoch": 3994} {"train_loss": -25.307973861694336, "global_step": 331517, "epoch": 3994} {"train_loss": -25.355398178100586, "global_step": 331518, "epoch": 3994} {"train_loss": -25.64272117614746, "global_step": 331519, "epoch": 3994} {"train_loss": -25.4066162109375, "global_step": 331520, "epoch": 3994} {"train_loss": -25.3817195892334, "global_step": 331521, "epoch": 3994} {"train_loss": -25.44931411743164, "global_step": 331522, "epoch": 3994} {"train_loss": -26.029199600219727, "global_step": 331523, "epoch": 3994} {"train_loss": -25.804553985595703, "global_step": 331524, "epoch": 3994} {"train_loss": -25.598787307739258, "global_step": 331525, "epoch": 3994} {"train_loss": -26.13714027404785, "global_step": 331526, "epoch": 3994} {"train_loss": -25.673599243164062, "global_step": 331527, "epoch": 3994} {"train_loss": -25.921661376953125, "global_step": 331528, "epoch": 3994} {"train_loss": -26.027236938476562, "global_step": 331529, "epoch": 3994} {"train_loss": -25.8917293548584, "global_step": 331530, "epoch": 3994} {"train_loss": -25.724899291992188, "global_step": 331531, "epoch": 3994} {"train_loss": -25.7576847076416, "global_step": 331532, "epoch": 3994} {"train_loss": -25.785444259643555, "global_step": 331533, "epoch": 3994} {"train_loss": -25.608001708984375, "global_step": 331534, "epoch": 3994} {"train_loss": -26.201635360717773, "global_step": 331535, "epoch": 3994} {"train_loss": -25.940933227539062, "global_step": 331536, "epoch": 3994} {"train_loss": -26.053876876831055, "global_step": 331537, "epoch": 3994} {"train_loss": -25.97832679748535, "global_step": 331538, "epoch": 3994} {"train_loss": -25.992618560791016, "global_step": 331539, "epoch": 3994} {"train_loss": -25.991891860961914, "global_step": 331540, "epoch": 3994} {"train_loss": -26.11895179748535, "global_step": 331541, "epoch": 3994} {"train_loss": -26.077823638916016, "global_step": 331542, "epoch": 3994} {"train_loss": -25.54120445251465, "global_step": 331543, "epoch": 3994} {"train_loss": -25.7882022857666, "global_step": 331544, "epoch": 3994} {"train_loss": -25.789152145385742, "global_step": 331545, "epoch": 3994} {"train_loss": -25.72053337097168, "global_step": 331546, "epoch": 3994} {"train_loss": -25.621891021728516, "global_step": 331547, "epoch": 3994} {"train_loss": -26.00660514831543, "global_step": 331548, "epoch": 3994} {"train_loss": -25.9235782623291, "global_step": 331549, "epoch": 3994} {"train_loss": -25.959264755249023, "global_step": 331550, "epoch": 3994} {"train_loss": -25.8582820892334, "global_step": 331551, "epoch": 3994} {"train_loss": -25.87863540649414, "global_step": 331552, "epoch": 3994} {"train_loss": -26.0900936126709, "global_step": 331553, "epoch": 3994} {"train_loss": -26.02713394165039, "global_step": 331554, "epoch": 3994} {"train_loss": -26.381006240844727, "global_step": 331555, "epoch": 3994} {"train_loss": -25.892868041992188, "global_step": 331556, "epoch": 3994} {"train_loss": -25.8868465423584, "global_step": 331557, "epoch": 3994} {"train_loss": -26.1336727142334, "global_step": 331558, "epoch": 3994} {"train_loss": -26.306320190429688, "global_step": 331559, "epoch": 3994} {"train_loss": -26.080291748046875, "global_step": 331560, "epoch": 3994} {"train_loss": -26.019641876220703, "global_step": 331561, "epoch": 3994} {"train_loss": -25.332918167114258, "global_step": 331562, "epoch": 3994} {"train_loss": -25.689651489257812, "global_step": 331563, "epoch": 3994} {"train_loss": -25.83538246154785, "global_step": 331564, "epoch": 3994} {"train_loss": -26.35528564453125, "global_step": 331565, "epoch": 3994} {"train_loss": -26.066904067993164, "global_step": 331566, "epoch": 3994} {"train_loss": -25.79108238220215, "global_step": 331567, "epoch": 3994} {"train_loss": -25.389535903930664, "global_step": 331568, "epoch": 3994} {"train_loss": -25.6273136138916, "global_step": 331569, "epoch": 3994} {"train_loss": -25.784870147705078, "global_step": 331570, "epoch": 3994} {"train_loss": -26.07744789123535, "global_step": 331571, "epoch": 3994} {"train_loss": -25.911535263061523, "global_step": 331572, "epoch": 3994} {"train_loss": -26.15423583984375, "global_step": 331573, "epoch": 3994} {"train_loss": -25.80561637878418, "global_step": 331574, "epoch": 3994} {"train_loss": -26.02534294128418, "global_step": 331575, "epoch": 3994} {"train_loss": -26.117218017578125, "global_step": 331576, "epoch": 3994} {"train_loss": -25.77628517150879, "global_step": 331577, "epoch": 3994} {"train_loss": -25.88431167602539, "global_step": 331578, "epoch": 3994} {"train_loss": -25.656070709228516, "global_step": 331579, "epoch": 3994} {"train_loss": -26.35176658630371, "global_step": 331580, "epoch": 3994} {"train_loss": -25.983978271484375, "global_step": 331581, "epoch": 3994} {"train_loss": -26.565290451049805, "global_step": 331582, "epoch": 3994} {"train_loss": -25.920673370361328, "global_step": 331583, "epoch": 3994} {"train_loss": -25.76408514919051, "global_step": 331584, "epoch": 3994, "val_loss": 7074967.0} {"train_loss": -25.153736114501953, "global_step": 331585, "epoch": 3995} {"train_loss": -25.5792293548584, "global_step": 331586, "epoch": 3995} {"train_loss": -25.70496940612793, "global_step": 331587, "epoch": 3995} {"train_loss": -25.588972091674805, "global_step": 331588, "epoch": 3995} {"train_loss": -25.516794204711914, "global_step": 331589, "epoch": 3995} {"train_loss": -25.618406295776367, "global_step": 331590, "epoch": 3995} {"train_loss": -25.552331924438477, "global_step": 331591, "epoch": 3995} {"train_loss": -26.111907958984375, "global_step": 331592, "epoch": 3995} {"train_loss": -26.000629425048828, "global_step": 331593, "epoch": 3995} {"train_loss": -26.08234977722168, "global_step": 331594, "epoch": 3995} {"train_loss": -25.79951286315918, "global_step": 331595, "epoch": 3995} {"train_loss": -25.809518814086914, "global_step": 331596, "epoch": 3995} {"train_loss": -25.814680099487305, "global_step": 331597, "epoch": 3995} {"train_loss": -25.91249656677246, "global_step": 331598, "epoch": 3995} {"train_loss": -26.167795181274414, "global_step": 331599, "epoch": 3995} {"train_loss": -25.77836036682129, "global_step": 331600, "epoch": 3995} {"train_loss": -25.68379020690918, "global_step": 331601, "epoch": 3995} {"train_loss": -25.825454711914062, "global_step": 331602, "epoch": 3995} {"train_loss": -26.154052734375, "global_step": 331603, "epoch": 3995} {"train_loss": -25.927465438842773, "global_step": 331604, "epoch": 3995} {"train_loss": -25.989587783813477, "global_step": 331605, "epoch": 3995} {"train_loss": -25.915319442749023, "global_step": 331606, "epoch": 3995} {"train_loss": -26.2769832611084, "global_step": 331607, "epoch": 3995} {"train_loss": -26.071521759033203, "global_step": 331608, "epoch": 3995} {"train_loss": -25.744796752929688, "global_step": 331609, "epoch": 3995} {"train_loss": -26.05067253112793, "global_step": 331610, "epoch": 3995} {"train_loss": -25.879364013671875, "global_step": 331611, "epoch": 3995} {"train_loss": -25.73261833190918, "global_step": 331612, "epoch": 3995} {"train_loss": -26.215290069580078, "global_step": 331613, "epoch": 3995} {"train_loss": -25.704553604125977, "global_step": 331614, "epoch": 3995} {"train_loss": -26.427276611328125, "global_step": 331615, "epoch": 3995} {"train_loss": -25.954137802124023, "global_step": 331616, "epoch": 3995} {"train_loss": -25.894012451171875, "global_step": 331617, "epoch": 3995} {"train_loss": -25.810834884643555, "global_step": 331618, "epoch": 3995} {"train_loss": -26.03046226501465, "global_step": 331619, "epoch": 3995} {"train_loss": -25.783588409423828, "global_step": 331620, "epoch": 3995} {"train_loss": -25.942243576049805, "global_step": 331621, "epoch": 3995} {"train_loss": -26.075550079345703, "global_step": 331622, "epoch": 3995} {"train_loss": -26.199176788330078, "global_step": 331623, "epoch": 3995} {"train_loss": -25.857925415039062, "global_step": 331624, "epoch": 3995} {"train_loss": -26.169214248657227, "global_step": 331625, "epoch": 3995} {"train_loss": -26.08269691467285, "global_step": 331626, "epoch": 3995} {"train_loss": -26.05607032775879, "global_step": 331627, "epoch": 3995} {"train_loss": -25.927946090698242, "global_step": 331628, "epoch": 3995} {"train_loss": -26.183624267578125, "global_step": 331629, "epoch": 3995} {"train_loss": -26.594135284423828, "global_step": 331630, "epoch": 3995} {"train_loss": -26.098621368408203, "global_step": 331631, "epoch": 3995} {"train_loss": -26.118375778198242, "global_step": 331632, "epoch": 3995} {"train_loss": -26.045095443725586, "global_step": 331633, "epoch": 3995} {"train_loss": -25.70193862915039, "global_step": 331634, "epoch": 3995} {"train_loss": -25.855859756469727, "global_step": 331635, "epoch": 3995} {"train_loss": -25.9384822845459, "global_step": 331636, "epoch": 3995} {"train_loss": -25.94744300842285, "global_step": 331637, "epoch": 3995} {"train_loss": -25.79843521118164, "global_step": 331638, "epoch": 3995} {"train_loss": -26.172027587890625, "global_step": 331639, "epoch": 3995} {"train_loss": -25.8580265045166, "global_step": 331640, "epoch": 3995} {"train_loss": -25.50491714477539, "global_step": 331641, "epoch": 3995} {"train_loss": -25.604312896728516, "global_step": 331642, "epoch": 3995} {"train_loss": -25.530263900756836, "global_step": 331643, "epoch": 3995} {"train_loss": -25.853519439697266, "global_step": 331644, "epoch": 3995} {"train_loss": -25.984729766845703, "global_step": 331645, "epoch": 3995} {"train_loss": -25.306631088256836, "global_step": 331646, "epoch": 3995} {"train_loss": -26.110937118530273, "global_step": 331647, "epoch": 3995} {"train_loss": -25.524152755737305, "global_step": 331648, "epoch": 3995} {"train_loss": -25.7498722076416, "global_step": 331649, "epoch": 3995} {"train_loss": -25.469629287719727, "global_step": 331650, "epoch": 3995} {"train_loss": -25.964990615844727, "global_step": 331651, "epoch": 3995} {"train_loss": -25.859426498413086, "global_step": 331652, "epoch": 3995} {"train_loss": -26.217573165893555, "global_step": 331653, "epoch": 3995} {"train_loss": -25.752918243408203, "global_step": 331654, "epoch": 3995} {"train_loss": -26.114248275756836, "global_step": 331655, "epoch": 3995} {"train_loss": -25.688013076782227, "global_step": 331656, "epoch": 3995} {"train_loss": -25.690290451049805, "global_step": 331657, "epoch": 3995} {"train_loss": -25.68745231628418, "global_step": 331658, "epoch": 3995} {"train_loss": -25.401731491088867, "global_step": 331659, "epoch": 3995} {"train_loss": -25.811887741088867, "global_step": 331660, "epoch": 3995} {"train_loss": -26.066808700561523, "global_step": 331661, "epoch": 3995} {"train_loss": -25.54729461669922, "global_step": 331662, "epoch": 3995} {"train_loss": -26.038175582885742, "global_step": 331663, "epoch": 3995} {"train_loss": -25.83487892150879, "global_step": 331664, "epoch": 3995} {"train_loss": -26.12721061706543, "global_step": 331665, "epoch": 3995} {"train_loss": -26.46730613708496, "global_step": 331666, "epoch": 3995} {"train_loss": -25.902035678725646, "global_step": 331667, "epoch": 3995, "val_loss": 7074438.0} {"train_loss": -25.8756103515625, "global_step": 331668, "epoch": 3996} {"train_loss": -25.51997947692871, "global_step": 331669, "epoch": 3996} {"train_loss": -25.454862594604492, "global_step": 331670, "epoch": 3996} {"train_loss": -25.97354507446289, "global_step": 331671, "epoch": 3996} {"train_loss": -25.204727172851562, "global_step": 331672, "epoch": 3996} {"train_loss": -25.883115768432617, "global_step": 331673, "epoch": 3996} {"train_loss": -25.61968421936035, "global_step": 331674, "epoch": 3996} {"train_loss": -25.501325607299805, "global_step": 331675, "epoch": 3996} {"train_loss": -25.66961669921875, "global_step": 331676, "epoch": 3996} {"train_loss": -26.04146385192871, "global_step": 331677, "epoch": 3996} {"train_loss": -25.779953002929688, "global_step": 331678, "epoch": 3996} {"train_loss": -25.8359317779541, "global_step": 331679, "epoch": 3996} {"train_loss": -25.791452407836914, "global_step": 331680, "epoch": 3996} {"train_loss": -26.09076499938965, "global_step": 331681, "epoch": 3996} {"train_loss": -26.255142211914062, "global_step": 331682, "epoch": 3996} {"train_loss": -25.849945068359375, "global_step": 331683, "epoch": 3996} {"train_loss": -25.78702735900879, "global_step": 331684, "epoch": 3996} {"train_loss": -25.701284408569336, "global_step": 331685, "epoch": 3996} {"train_loss": -26.089929580688477, "global_step": 331686, "epoch": 3996} {"train_loss": -25.547208786010742, "global_step": 331687, "epoch": 3996} {"train_loss": -25.76226234436035, "global_step": 331688, "epoch": 3996} {"train_loss": -25.97552490234375, "global_step": 331689, "epoch": 3996} {"train_loss": -25.9174747467041, "global_step": 331690, "epoch": 3996} {"train_loss": -25.933080673217773, "global_step": 331691, "epoch": 3996} {"train_loss": -25.80963134765625, "global_step": 331692, "epoch": 3996} {"train_loss": -25.660186767578125, "global_step": 331693, "epoch": 3996} {"train_loss": -25.885709762573242, "global_step": 331694, "epoch": 3996} {"train_loss": -26.163854598999023, "global_step": 331695, "epoch": 3996} {"train_loss": -25.93989372253418, "global_step": 331696, "epoch": 3996} {"train_loss": -25.920324325561523, "global_step": 331697, "epoch": 3996} {"train_loss": -25.91224479675293, "global_step": 331698, "epoch": 3996} {"train_loss": -26.36532974243164, "global_step": 331699, "epoch": 3996} {"train_loss": -25.67176628112793, "global_step": 331700, "epoch": 3996} {"train_loss": -26.01100730895996, "global_step": 331701, "epoch": 3996} {"train_loss": -25.901105880737305, "global_step": 331702, "epoch": 3996} {"train_loss": -25.836872100830078, "global_step": 331703, "epoch": 3996} {"train_loss": -25.789764404296875, "global_step": 331704, "epoch": 3996} {"train_loss": -26.13504981994629, "global_step": 331705, "epoch": 3996} {"train_loss": -26.17777442932129, "global_step": 331706, "epoch": 3996} {"train_loss": -26.044708251953125, "global_step": 331707, "epoch": 3996} {"train_loss": -25.983325958251953, "global_step": 331708, "epoch": 3996} {"train_loss": -25.909826278686523, "global_step": 331709, "epoch": 3996} {"train_loss": -25.989166259765625, "global_step": 331710, "epoch": 3996} {"train_loss": -26.021240234375, "global_step": 331711, "epoch": 3996} {"train_loss": -26.303415298461914, "global_step": 331712, "epoch": 3996} {"train_loss": -25.926502227783203, "global_step": 331713, "epoch": 3996} {"train_loss": -26.223346710205078, "global_step": 331714, "epoch": 3996} {"train_loss": -26.236530303955078, "global_step": 331715, "epoch": 3996} {"train_loss": -26.054157257080078, "global_step": 331716, "epoch": 3996} {"train_loss": -26.14170265197754, "global_step": 331717, "epoch": 3996} {"train_loss": -26.048063278198242, "global_step": 331718, "epoch": 3996} {"train_loss": -25.88347816467285, "global_step": 331719, "epoch": 3996} {"train_loss": -26.159284591674805, "global_step": 331720, "epoch": 3996} {"train_loss": -26.10076904296875, "global_step": 331721, "epoch": 3996} {"train_loss": -26.102523803710938, "global_step": 331722, "epoch": 3996} {"train_loss": -26.138931274414062, "global_step": 331723, "epoch": 3996} {"train_loss": -26.250837326049805, "global_step": 331724, "epoch": 3996} {"train_loss": -26.26325035095215, "global_step": 331725, "epoch": 3996} {"train_loss": -26.232885360717773, "global_step": 331726, "epoch": 3996} {"train_loss": -25.93635368347168, "global_step": 331727, "epoch": 3996} {"train_loss": -26.436187744140625, "global_step": 331728, "epoch": 3996} {"train_loss": -25.99714469909668, "global_step": 331729, "epoch": 3996} {"train_loss": -26.056909561157227, "global_step": 331730, "epoch": 3996} {"train_loss": -25.9521484375, "global_step": 331731, "epoch": 3996} {"train_loss": -26.161352157592773, "global_step": 331732, "epoch": 3996} {"train_loss": -26.04558753967285, "global_step": 331733, "epoch": 3996} {"train_loss": -25.906158447265625, "global_step": 331734, "epoch": 3996} {"train_loss": -26.37420654296875, "global_step": 331735, "epoch": 3996} {"train_loss": -25.975727081298828, "global_step": 331736, "epoch": 3996} {"train_loss": -26.417510986328125, "global_step": 331737, "epoch": 3996} {"train_loss": -26.33294677734375, "global_step": 331738, "epoch": 3996} {"train_loss": -26.325178146362305, "global_step": 331739, "epoch": 3996} {"train_loss": -26.186185836791992, "global_step": 331740, "epoch": 3996} {"train_loss": -25.83316421508789, "global_step": 331741, "epoch": 3996} {"train_loss": -25.682153701782227, "global_step": 331742, "epoch": 3996} {"train_loss": -24.631223678588867, "global_step": 331743, "epoch": 3996} {"train_loss": -24.673974990844727, "global_step": 331744, "epoch": 3996} {"train_loss": -23.817190170288086, "global_step": 331745, "epoch": 3996} {"train_loss": -24.556720733642578, "global_step": 331746, "epoch": 3996} {"train_loss": -25.4476261138916, "global_step": 331747, "epoch": 3996} {"train_loss": -24.764713287353516, "global_step": 331748, "epoch": 3996} {"train_loss": -25.369510650634766, "global_step": 331749, "epoch": 3996} {"train_loss": -25.871260401714277, "global_step": 331750, "epoch": 3996, "val_loss": 7091944.5} {"train_loss": -24.20404624938965, "global_step": 331751, "epoch": 3997} {"train_loss": -25.14902114868164, "global_step": 331752, "epoch": 3997} {"train_loss": -24.51641273498535, "global_step": 331753, "epoch": 3997} {"train_loss": -25.25593376159668, "global_step": 331754, "epoch": 3997} {"train_loss": -24.96591567993164, "global_step": 331755, "epoch": 3997} {"train_loss": -24.958301544189453, "global_step": 331756, "epoch": 3997} {"train_loss": -24.99537467956543, "global_step": 331757, "epoch": 3997} {"train_loss": -25.23355484008789, "global_step": 331758, "epoch": 3997} {"train_loss": -24.68277931213379, "global_step": 331759, "epoch": 3997} {"train_loss": -25.23065185546875, "global_step": 331760, "epoch": 3997} {"train_loss": -25.365400314331055, "global_step": 331761, "epoch": 3997} {"train_loss": -25.157930374145508, "global_step": 331762, "epoch": 3997} {"train_loss": -25.52062225341797, "global_step": 331763, "epoch": 3997} {"train_loss": -25.694095611572266, "global_step": 331764, "epoch": 3997} {"train_loss": -25.777429580688477, "global_step": 331765, "epoch": 3997} {"train_loss": -25.5341854095459, "global_step": 331766, "epoch": 3997} {"train_loss": -25.688520431518555, "global_step": 331767, "epoch": 3997} {"train_loss": -25.779804229736328, "global_step": 331768, "epoch": 3997} {"train_loss": -25.932260513305664, "global_step": 331769, "epoch": 3997} {"train_loss": -26.067584991455078, "global_step": 331770, "epoch": 3997} {"train_loss": -25.591657638549805, "global_step": 331771, "epoch": 3997} {"train_loss": -25.7026309967041, "global_step": 331772, "epoch": 3997} {"train_loss": -25.606414794921875, "global_step": 331773, "epoch": 3997} {"train_loss": -25.83078384399414, "global_step": 331774, "epoch": 3997} {"train_loss": -25.565675735473633, "global_step": 331775, "epoch": 3997} {"train_loss": -25.9139347076416, "global_step": 331776, "epoch": 3997} {"train_loss": -26.057302474975586, "global_step": 331777, "epoch": 3997} {"train_loss": -25.903461456298828, "global_step": 331778, "epoch": 3997} {"train_loss": -26.115583419799805, "global_step": 331779, "epoch": 3997} {"train_loss": -25.782018661499023, "global_step": 331780, "epoch": 3997} {"train_loss": -26.0773983001709, "global_step": 331781, "epoch": 3997} {"train_loss": -26.18092918395996, "global_step": 331782, "epoch": 3997} {"train_loss": -25.654760360717773, "global_step": 331783, "epoch": 3997} {"train_loss": -25.981237411499023, "global_step": 331784, "epoch": 3997} {"train_loss": -25.757339477539062, "global_step": 331785, "epoch": 3997} {"train_loss": -26.082645416259766, "global_step": 331786, "epoch": 3997} {"train_loss": -26.137235641479492, "global_step": 331787, "epoch": 3997} {"train_loss": -26.14503288269043, "global_step": 331788, "epoch": 3997} {"train_loss": -26.077972412109375, "global_step": 331789, "epoch": 3997} {"train_loss": -25.899200439453125, "global_step": 331790, "epoch": 3997} {"train_loss": -25.75665283203125, "global_step": 331791, "epoch": 3997} {"train_loss": -25.839862823486328, "global_step": 331792, "epoch": 3997} {"train_loss": -25.74468994140625, "global_step": 331793, "epoch": 3997} {"train_loss": -26.354917526245117, "global_step": 331794, "epoch": 3997} {"train_loss": -26.04425048828125, "global_step": 331795, "epoch": 3997} {"train_loss": -26.33208656311035, "global_step": 331796, "epoch": 3997} {"train_loss": -25.984888076782227, "global_step": 331797, "epoch": 3997} {"train_loss": -26.25165367126465, "global_step": 331798, "epoch": 3997} {"train_loss": -26.2193603515625, "global_step": 331799, "epoch": 3997} {"train_loss": -26.426776885986328, "global_step": 331800, "epoch": 3997} {"train_loss": -26.126062393188477, "global_step": 331801, "epoch": 3997} {"train_loss": -26.249536514282227, "global_step": 331802, "epoch": 3997} {"train_loss": -26.121191024780273, "global_step": 331803, "epoch": 3997} {"train_loss": -26.00315284729004, "global_step": 331804, "epoch": 3997} {"train_loss": -25.9233341217041, "global_step": 331805, "epoch": 3997} {"train_loss": -26.13934898376465, "global_step": 331806, "epoch": 3997} {"train_loss": -26.199094772338867, "global_step": 331807, "epoch": 3997} {"train_loss": -25.665616989135742, "global_step": 331808, "epoch": 3997} {"train_loss": -25.6170654296875, "global_step": 331809, "epoch": 3997} {"train_loss": -25.38953971862793, "global_step": 331810, "epoch": 3997} {"train_loss": -25.733139038085938, "global_step": 331811, "epoch": 3997} {"train_loss": -25.639753341674805, "global_step": 331812, "epoch": 3997} {"train_loss": -25.8552303314209, "global_step": 331813, "epoch": 3997} {"train_loss": -26.048044204711914, "global_step": 331814, "epoch": 3997} {"train_loss": -25.739957809448242, "global_step": 331815, "epoch": 3997} {"train_loss": -25.968664169311523, "global_step": 331816, "epoch": 3997} {"train_loss": -25.897802352905273, "global_step": 331817, "epoch": 3997} {"train_loss": -25.66425895690918, "global_step": 331818, "epoch": 3997} {"train_loss": -26.045124053955078, "global_step": 331819, "epoch": 3997} {"train_loss": -25.896270751953125, "global_step": 331820, "epoch": 3997} {"train_loss": -26.25494956970215, "global_step": 331821, "epoch": 3997} {"train_loss": -25.852746963500977, "global_step": 331822, "epoch": 3997} {"train_loss": -25.9094295501709, "global_step": 331823, "epoch": 3997} {"train_loss": -25.7156925201416, "global_step": 331824, "epoch": 3997} {"train_loss": -25.843961715698242, "global_step": 331825, "epoch": 3997} {"train_loss": -25.776065826416016, "global_step": 331826, "epoch": 3997} {"train_loss": -25.978300094604492, "global_step": 331827, "epoch": 3997} {"train_loss": -26.1043758392334, "global_step": 331828, "epoch": 3997} {"train_loss": -26.2018985748291, "global_step": 331829, "epoch": 3997} {"train_loss": -26.18104362487793, "global_step": 331830, "epoch": 3997} {"train_loss": -25.907032012939453, "global_step": 331831, "epoch": 3997} {"train_loss": -26.4697208404541, "global_step": 331832, "epoch": 3997} {"train_loss": -25.789894333804945, "global_step": 331833, "epoch": 3997, "val_loss": 7078514.0} {"train_loss": -25.606739044189453, "global_step": 331834, "epoch": 3998} {"train_loss": -25.796674728393555, "global_step": 331835, "epoch": 3998} {"train_loss": -26.004425048828125, "global_step": 331836, "epoch": 3998} {"train_loss": -25.348628997802734, "global_step": 331837, "epoch": 3998} {"train_loss": -25.731958389282227, "global_step": 331838, "epoch": 3998} {"train_loss": -26.020191192626953, "global_step": 331839, "epoch": 3998} {"train_loss": -25.41048240661621, "global_step": 331840, "epoch": 3998} {"train_loss": -25.615924835205078, "global_step": 331841, "epoch": 3998} {"train_loss": -25.617385864257812, "global_step": 331842, "epoch": 3998} {"train_loss": -25.866504669189453, "global_step": 331843, "epoch": 3998} {"train_loss": -25.42132568359375, "global_step": 331844, "epoch": 3998} {"train_loss": -25.892593383789062, "global_step": 331845, "epoch": 3998} {"train_loss": -25.662994384765625, "global_step": 331846, "epoch": 3998} {"train_loss": -26.26984214782715, "global_step": 331847, "epoch": 3998} {"train_loss": -25.27092742919922, "global_step": 331848, "epoch": 3998} {"train_loss": -25.703336715698242, "global_step": 331849, "epoch": 3998} {"train_loss": -25.762598037719727, "global_step": 331850, "epoch": 3998} {"train_loss": -25.666675567626953, "global_step": 331851, "epoch": 3998} {"train_loss": -25.740814208984375, "global_step": 331852, "epoch": 3998} {"train_loss": -26.055219650268555, "global_step": 331853, "epoch": 3998} {"train_loss": -25.99942970275879, "global_step": 331854, "epoch": 3998} {"train_loss": -25.905500411987305, "global_step": 331855, "epoch": 3998} {"train_loss": -26.100385665893555, "global_step": 331856, "epoch": 3998} {"train_loss": -25.958459854125977, "global_step": 331857, "epoch": 3998} {"train_loss": -26.06892967224121, "global_step": 331858, "epoch": 3998} {"train_loss": -26.13861083984375, "global_step": 331859, "epoch": 3998} {"train_loss": -26.342254638671875, "global_step": 331860, "epoch": 3998} {"train_loss": -26.208240509033203, "global_step": 331861, "epoch": 3998} {"train_loss": -25.974212646484375, "global_step": 331862, "epoch": 3998} {"train_loss": -26.309171676635742, "global_step": 331863, "epoch": 3998} {"train_loss": -26.224584579467773, "global_step": 331864, "epoch": 3998} {"train_loss": -25.816986083984375, "global_step": 331865, "epoch": 3998} {"train_loss": -26.0139102935791, "global_step": 331866, "epoch": 3998} {"train_loss": -26.0543155670166, "global_step": 331867, "epoch": 3998} {"train_loss": -26.1225528717041, "global_step": 331868, "epoch": 3998} {"train_loss": -26.001605987548828, "global_step": 331869, "epoch": 3998} {"train_loss": -26.139184951782227, "global_step": 331870, "epoch": 3998} {"train_loss": -25.893997192382812, "global_step": 331871, "epoch": 3998} {"train_loss": -25.78255271911621, "global_step": 331872, "epoch": 3998} {"train_loss": -26.374231338500977, "global_step": 331873, "epoch": 3998} {"train_loss": -26.17327880859375, "global_step": 331874, "epoch": 3998} {"train_loss": -25.820575714111328, "global_step": 331875, "epoch": 3998} {"train_loss": -25.728729248046875, "global_step": 331876, "epoch": 3998} {"train_loss": -26.270599365234375, "global_step": 331877, "epoch": 3998} {"train_loss": -25.96895408630371, "global_step": 331878, "epoch": 3998} {"train_loss": -26.18583106994629, "global_step": 331879, "epoch": 3998} {"train_loss": -26.075490951538086, "global_step": 331880, "epoch": 3998} {"train_loss": -26.146093368530273, "global_step": 331881, "epoch": 3998} {"train_loss": -26.055524826049805, "global_step": 331882, "epoch": 3998} {"train_loss": -25.907684326171875, "global_step": 331883, "epoch": 3998} {"train_loss": -25.820947647094727, "global_step": 331884, "epoch": 3998} {"train_loss": -25.8969669342041, "global_step": 331885, "epoch": 3998} {"train_loss": -25.819293975830078, "global_step": 331886, "epoch": 3998} {"train_loss": -26.057754516601562, "global_step": 331887, "epoch": 3998} {"train_loss": -25.823394775390625, "global_step": 331888, "epoch": 3998} {"train_loss": -25.799835205078125, "global_step": 331889, "epoch": 3998} {"train_loss": -26.090717315673828, "global_step": 331890, "epoch": 3998} {"train_loss": -26.2606258392334, "global_step": 331891, "epoch": 3998} {"train_loss": -26.112207412719727, "global_step": 331892, "epoch": 3998} {"train_loss": -26.049880981445312, "global_step": 331893, "epoch": 3998} {"train_loss": -26.175174713134766, "global_step": 331894, "epoch": 3998} {"train_loss": -25.75367546081543, "global_step": 331895, "epoch": 3998} {"train_loss": -25.87754249572754, "global_step": 331896, "epoch": 3998} {"train_loss": -26.231470108032227, "global_step": 331897, "epoch": 3998} {"train_loss": -25.733081817626953, "global_step": 331898, "epoch": 3998} {"train_loss": -26.297077178955078, "global_step": 331899, "epoch": 3998} {"train_loss": -26.042194366455078, "global_step": 331900, "epoch": 3998} {"train_loss": -26.033811569213867, "global_step": 331901, "epoch": 3998} {"train_loss": -26.048980712890625, "global_step": 331902, "epoch": 3998} {"train_loss": -26.40870475769043, "global_step": 331903, "epoch": 3998} {"train_loss": -26.074804306030273, "global_step": 331904, "epoch": 3998} {"train_loss": -26.07685661315918, "global_step": 331905, "epoch": 3998} {"train_loss": -25.97523307800293, "global_step": 331906, "epoch": 3998} {"train_loss": -25.7495059967041, "global_step": 331907, "epoch": 3998} {"train_loss": -26.189868927001953, "global_step": 331908, "epoch": 3998} {"train_loss": -26.0132999420166, "global_step": 331909, "epoch": 3998} {"train_loss": -26.405197143554688, "global_step": 331910, "epoch": 3998} {"train_loss": -26.262042999267578, "global_step": 331911, "epoch": 3998} {"train_loss": -26.14803123474121, "global_step": 331912, "epoch": 3998} {"train_loss": -25.565786361694336, "global_step": 331913, "epoch": 3998} {"train_loss": -25.644428253173828, "global_step": 331914, "epoch": 3998} {"train_loss": -25.609329223632812, "global_step": 331915, "epoch": 3998} {"train_loss": -25.961295093398498, "global_step": 331916, "epoch": 3998, "val_loss": 7077736.0} {"train_loss": -24.976633071899414, "global_step": 331917, "epoch": 3999} {"train_loss": -24.539796829223633, "global_step": 331918, "epoch": 3999} {"train_loss": -24.963254928588867, "global_step": 331919, "epoch": 3999} {"train_loss": -25.193437576293945, "global_step": 331920, "epoch": 3999} {"train_loss": -25.798620223999023, "global_step": 331921, "epoch": 3999} {"train_loss": -25.404508590698242, "global_step": 331922, "epoch": 3999} {"train_loss": -25.35458755493164, "global_step": 331923, "epoch": 3999} {"train_loss": -25.68779945373535, "global_step": 331924, "epoch": 3999} {"train_loss": -25.5606632232666, "global_step": 331925, "epoch": 3999} {"train_loss": -25.74873161315918, "global_step": 331926, "epoch": 3999} {"train_loss": -25.6280574798584, "global_step": 331927, "epoch": 3999} {"train_loss": -25.50429344177246, "global_step": 331928, "epoch": 3999} {"train_loss": -25.880659103393555, "global_step": 331929, "epoch": 3999} {"train_loss": -25.78354263305664, "global_step": 331930, "epoch": 3999} {"train_loss": -26.213043212890625, "global_step": 331931, "epoch": 3999} {"train_loss": -25.980518341064453, "global_step": 331932, "epoch": 3999} {"train_loss": -26.22878074645996, "global_step": 331933, "epoch": 3999} {"train_loss": -25.8533878326416, "global_step": 331934, "epoch": 3999} {"train_loss": -25.712604522705078, "global_step": 331935, "epoch": 3999} {"train_loss": -25.96588134765625, "global_step": 331936, "epoch": 3999} {"train_loss": -26.034835815429688, "global_step": 331937, "epoch": 3999} {"train_loss": -26.0130615234375, "global_step": 331938, "epoch": 3999} {"train_loss": -25.74954605102539, "global_step": 331939, "epoch": 3999} {"train_loss": -26.244464874267578, "global_step": 331940, "epoch": 3999} {"train_loss": -26.0816650390625, "global_step": 331941, "epoch": 3999} {"train_loss": -25.7042179107666, "global_step": 331942, "epoch": 3999} {"train_loss": -26.031843185424805, "global_step": 331943, "epoch": 3999} {"train_loss": -26.142419815063477, "global_step": 331944, "epoch": 3999} {"train_loss": -26.36332130432129, "global_step": 331945, "epoch": 3999} {"train_loss": -26.0688419342041, "global_step": 331946, "epoch": 3999} {"train_loss": -26.200336456298828, "global_step": 331947, "epoch": 3999} {"train_loss": -26.16408348083496, "global_step": 331948, "epoch": 3999} {"train_loss": -26.141706466674805, "global_step": 331949, "epoch": 3999} {"train_loss": -26.717731475830078, "global_step": 331950, "epoch": 3999} {"train_loss": -26.318099975585938, "global_step": 331951, "epoch": 3999} {"train_loss": -26.232397079467773, "global_step": 331952, "epoch": 3999} {"train_loss": -25.999555587768555, "global_step": 331953, "epoch": 3999} {"train_loss": -26.2007999420166, "global_step": 331954, "epoch": 3999} {"train_loss": -25.92437744140625, "global_step": 331955, "epoch": 3999} {"train_loss": -25.855289459228516, "global_step": 331956, "epoch": 3999} {"train_loss": -26.1262264251709, "global_step": 331957, "epoch": 3999} {"train_loss": -26.010242462158203, "global_step": 331958, "epoch": 3999} {"train_loss": -25.627668380737305, "global_step": 331959, "epoch": 3999} {"train_loss": -25.934751510620117, "global_step": 331960, "epoch": 3999} {"train_loss": -25.84266471862793, "global_step": 331961, "epoch": 3999} {"train_loss": -25.734954833984375, "global_step": 331962, "epoch": 3999} {"train_loss": -25.687795639038086, "global_step": 331963, "epoch": 3999} {"train_loss": -25.795194625854492, "global_step": 331964, "epoch": 3999} {"train_loss": -25.832746505737305, "global_step": 331965, "epoch": 3999} {"train_loss": -25.781408309936523, "global_step": 331966, "epoch": 3999} {"train_loss": -25.45904541015625, "global_step": 331967, "epoch": 3999} {"train_loss": -26.09119987487793, "global_step": 331968, "epoch": 3999} {"train_loss": -25.93709373474121, "global_step": 331969, "epoch": 3999} {"train_loss": -26.186559677124023, "global_step": 331970, "epoch": 3999} {"train_loss": -25.957788467407227, "global_step": 331971, "epoch": 3999} {"train_loss": -26.06109619140625, "global_step": 331972, "epoch": 3999} {"train_loss": -25.835065841674805, "global_step": 331973, "epoch": 3999} {"train_loss": -25.844482421875, "global_step": 331974, "epoch": 3999} {"train_loss": -26.393482208251953, "global_step": 331975, "epoch": 3999} {"train_loss": -25.45943260192871, "global_step": 331976, "epoch": 3999} {"train_loss": -26.141645431518555, "global_step": 331977, "epoch": 3999} {"train_loss": -25.74933433532715, "global_step": 331978, "epoch": 3999} {"train_loss": -26.15095329284668, "global_step": 331979, "epoch": 3999} {"train_loss": -25.540878295898438, "global_step": 331980, "epoch": 3999} {"train_loss": -26.086090087890625, "global_step": 331981, "epoch": 3999} {"train_loss": -25.8630428314209, "global_step": 331982, "epoch": 3999} {"train_loss": -25.745569229125977, "global_step": 331983, "epoch": 3999} {"train_loss": -25.761377334594727, "global_step": 331984, "epoch": 3999} {"train_loss": -25.905380249023438, "global_step": 331985, "epoch": 3999} {"train_loss": -25.84955406188965, "global_step": 331986, "epoch": 3999} {"train_loss": -25.9365234375, "global_step": 331987, "epoch": 3999} {"train_loss": -25.959518432617188, "global_step": 331988, "epoch": 3999} {"train_loss": -26.219852447509766, "global_step": 331989, "epoch": 3999} {"train_loss": -25.91337013244629, "global_step": 331990, "epoch": 3999} {"train_loss": -26.082529067993164, "global_step": 331991, "epoch": 3999} {"train_loss": -26.03937339782715, "global_step": 331992, "epoch": 3999} {"train_loss": -25.906835556030273, "global_step": 331993, "epoch": 3999} {"train_loss": -26.165145874023438, "global_step": 331994, "epoch": 3999} {"train_loss": -25.83107566833496, "global_step": 331995, "epoch": 3999} {"train_loss": -26.04379653930664, "global_step": 331996, "epoch": 3999} {"train_loss": -26.277713775634766, "global_step": 331997, "epoch": 3999} {"train_loss": -26.48908042907715, "global_step": 331998, "epoch": 3999} {"train_loss": -25.922493624399944, "global_step": 331999, "epoch": 3999, "val_loss": 7188908.5} {"train_loss": -23.87395477294922, "global_step": 332000, "epoch": 4000} {"train_loss": -24.02665138244629, "global_step": 332001, "epoch": 4000} {"train_loss": -23.78501319885254, "global_step": 332002, "epoch": 4000} {"train_loss": -24.209470748901367, "global_step": 332003, "epoch": 4000} {"train_loss": -25.23457908630371, "global_step": 332004, "epoch": 4000} {"train_loss": -24.304107666015625, "global_step": 332005, "epoch": 4000} {"train_loss": -25.23634910583496, "global_step": 332006, "epoch": 4000} {"train_loss": -24.450345993041992, "global_step": 332007, "epoch": 4000} {"train_loss": -25.00909423828125, "global_step": 332008, "epoch": 4000} {"train_loss": -24.660572052001953, "global_step": 332009, "epoch": 4000} {"train_loss": -25.08107566833496, "global_step": 332010, "epoch": 4000} {"train_loss": -24.67807388305664, "global_step": 332011, "epoch": 4000} {"train_loss": -25.2011775970459, "global_step": 332012, "epoch": 4000} {"train_loss": -25.27311134338379, "global_step": 332013, "epoch": 4000} {"train_loss": -25.241371154785156, "global_step": 332014, "epoch": 4000} {"train_loss": -25.47492027282715, "global_step": 332015, "epoch": 4000} {"train_loss": -25.03376579284668, "global_step": 332016, "epoch": 4000} {"train_loss": -25.112632751464844, "global_step": 332017, "epoch": 4000} {"train_loss": -25.2469539642334, "global_step": 332018, "epoch": 4000} {"train_loss": -25.177818298339844, "global_step": 332019, "epoch": 4000} {"train_loss": -25.599651336669922, "global_step": 332020, "epoch": 4000} {"train_loss": -25.3499698638916, "global_step": 332021, "epoch": 4000} {"train_loss": -25.495010375976562, "global_step": 332022, "epoch": 4000} {"train_loss": -25.007177352905273, "global_step": 332023, "epoch": 4000} {"train_loss": -25.57772445678711, "global_step": 332024, "epoch": 4000} {"train_loss": -25.430089950561523, "global_step": 332025, "epoch": 4000} {"train_loss": -25.76123046875, "global_step": 332026, "epoch": 4000} {"train_loss": -25.719099044799805, "global_step": 332027, "epoch": 4000} {"train_loss": -26.06989097595215, "global_step": 332028, "epoch": 4000} {"train_loss": -25.5384464263916, "global_step": 332029, "epoch": 4000} {"train_loss": -25.41155433654785, "global_step": 332030, "epoch": 4000} {"train_loss": -25.910856246948242, "global_step": 332031, "epoch": 4000} {"train_loss": -25.82415771484375, "global_step": 332032, "epoch": 4000} {"train_loss": -25.59297752380371, "global_step": 332033, "epoch": 4000} {"train_loss": -25.832183837890625, "global_step": 332034, "epoch": 4000} {"train_loss": -25.904321670532227, "global_step": 332035, "epoch": 4000} {"train_loss": -25.73601722717285, "global_step": 332036, "epoch": 4000} {"train_loss": -26.21282958984375, "global_step": 332037, "epoch": 4000} {"train_loss": -25.950794219970703, "global_step": 332038, "epoch": 4000} {"train_loss": -25.66371726989746, "global_step": 332039, "epoch": 4000} {"train_loss": -25.716278076171875, "global_step": 332040, "epoch": 4000} {"train_loss": -26.005084991455078, "global_step": 332041, "epoch": 4000} {"train_loss": -26.2253360748291, "global_step": 332042, "epoch": 4000} {"train_loss": -26.11118507385254, "global_step": 332043, "epoch": 4000} {"train_loss": -26.07596778869629, "global_step": 332044, "epoch": 4000} {"train_loss": -25.957868576049805, "global_step": 332045, "epoch": 4000} {"train_loss": -25.777257919311523, "global_step": 332046, "epoch": 4000} {"train_loss": -26.155866622924805, "global_step": 332047, "epoch": 4000} {"train_loss": -26.175527572631836, "global_step": 332048, "epoch": 4000} {"train_loss": -25.910358428955078, "global_step": 332049, "epoch": 4000} {"train_loss": -26.157636642456055, "global_step": 332050, "epoch": 4000} {"train_loss": -26.031787872314453, "global_step": 332051, "epoch": 4000} {"train_loss": -26.511417388916016, "global_step": 332052, "epoch": 4000} {"train_loss": -26.00312614440918, "global_step": 332053, "epoch": 4000} {"train_loss": -26.27552604675293, "global_step": 332054, "epoch": 4000} {"train_loss": -26.359994888305664, "global_step": 332055, "epoch": 4000} {"train_loss": -26.458541870117188, "global_step": 332056, "epoch": 4000} {"train_loss": -26.045663833618164, "global_step": 332057, "epoch": 4000} {"train_loss": -26.06342124938965, "global_step": 332058, "epoch": 4000} {"train_loss": -26.360584259033203, "global_step": 332059, "epoch": 4000} {"train_loss": -26.5059757232666, "global_step": 332060, "epoch": 4000} {"train_loss": -26.311079025268555, "global_step": 332061, "epoch": 4000} {"train_loss": -26.138635635375977, "global_step": 332062, "epoch": 4000} {"train_loss": -26.216779708862305, "global_step": 332063, "epoch": 4000} {"train_loss": -26.166662216186523, "global_step": 332064, "epoch": 4000} {"train_loss": -26.45903968811035, "global_step": 332065, "epoch": 4000} {"train_loss": -26.138757705688477, "global_step": 332066, "epoch": 4000} {"train_loss": -26.097991943359375, "global_step": 332067, "epoch": 4000} {"train_loss": -26.0897274017334, "global_step": 332068, "epoch": 4000} {"train_loss": -26.37202262878418, "global_step": 332069, "epoch": 4000} {"train_loss": -26.02911376953125, "global_step": 332070, "epoch": 4000} {"train_loss": -25.65846061706543, "global_step": 332071, "epoch": 4000} {"train_loss": -26.118932723999023, "global_step": 332072, "epoch": 4000} {"train_loss": -25.837833404541016, "global_step": 332073, "epoch": 4000} {"train_loss": -26.164106369018555, "global_step": 332074, "epoch": 4000} {"train_loss": -25.529783248901367, "global_step": 332075, "epoch": 4000} {"train_loss": -25.81878089904785, "global_step": 332076, "epoch": 4000} {"train_loss": -24.755308151245117, "global_step": 332077, "epoch": 4000} {"train_loss": -25.664472579956055, "global_step": 332078, "epoch": 4000} {"train_loss": -25.767383575439453, "global_step": 332079, "epoch": 4000} {"train_loss": -25.365131378173828, "global_step": 332080, "epoch": 4000} {"train_loss": -25.666706085205078, "global_step": 332081, "epoch": 4000} {"train_loss": -25.643390517636956, "global_step": 332082, "epoch": 4000, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 7131373.0} {"train_loss": -21.864973068237305, "global_step": 332083, "epoch": 4001} {"train_loss": -23.44888687133789, "global_step": 332084, "epoch": 4001} {"train_loss": -23.836368560791016, "global_step": 332085, "epoch": 4001} {"train_loss": -24.825851440429688, "global_step": 332086, "epoch": 4001} {"train_loss": -24.525588989257812, "global_step": 332087, "epoch": 4001} {"train_loss": -24.982351303100586, "global_step": 332088, "epoch": 4001} {"train_loss": -24.931934356689453, "global_step": 332089, "epoch": 4001} {"train_loss": -24.783069610595703, "global_step": 332090, "epoch": 4001} {"train_loss": -24.714752197265625, "global_step": 332091, "epoch": 4001} {"train_loss": -25.101110458374023, "global_step": 332092, "epoch": 4001} {"train_loss": -24.893064498901367, "global_step": 332093, "epoch": 4001} {"train_loss": -25.265026092529297, "global_step": 332094, "epoch": 4001} {"train_loss": -25.27508544921875, "global_step": 332095, "epoch": 4001} {"train_loss": -25.166208267211914, "global_step": 332096, "epoch": 4001} {"train_loss": -25.448928833007812, "global_step": 332097, "epoch": 4001} {"train_loss": -25.380029678344727, "global_step": 332098, "epoch": 4001} {"train_loss": -25.37217140197754, "global_step": 332099, "epoch": 4001} {"train_loss": -25.327375411987305, "global_step": 332100, "epoch": 4001} {"train_loss": -25.574787139892578, "global_step": 332101, "epoch": 4001} {"train_loss": -25.487308502197266, "global_step": 332102, "epoch": 4001} {"train_loss": -25.328981399536133, "global_step": 332103, "epoch": 4001} {"train_loss": -25.42176055908203, "global_step": 332104, "epoch": 4001} {"train_loss": -25.48874855041504, "global_step": 332105, "epoch": 4001} {"train_loss": -25.53452491760254, "global_step": 332106, "epoch": 4001} {"train_loss": -25.756330490112305, "global_step": 332107, "epoch": 4001} {"train_loss": -25.55534553527832, "global_step": 332108, "epoch": 4001} {"train_loss": -25.465635299682617, "global_step": 332109, "epoch": 4001} {"train_loss": -25.498891830444336, "global_step": 332110, "epoch": 4001} {"train_loss": -25.540084838867188, "global_step": 332111, "epoch": 4001} {"train_loss": -25.549638748168945, "global_step": 332112, "epoch": 4001} {"train_loss": -25.598791122436523, "global_step": 332113, "epoch": 4001} {"train_loss": -25.741806030273438, "global_step": 332114, "epoch": 4001} {"train_loss": -25.719024658203125, "global_step": 332115, "epoch": 4001} {"train_loss": -25.765674591064453, "global_step": 332116, "epoch": 4001} {"train_loss": -25.73072624206543, "global_step": 332117, "epoch": 4001} {"train_loss": -25.747882843017578, "global_step": 332118, "epoch": 4001} {"train_loss": -26.031652450561523, "global_step": 332119, "epoch": 4001} {"train_loss": -25.82564353942871, "global_step": 332120, "epoch": 4001} {"train_loss": -25.873981475830078, "global_step": 332121, "epoch": 4001} {"train_loss": -26.410924911499023, "global_step": 332122, "epoch": 4001} {"train_loss": -26.240026473999023, "global_step": 332123, "epoch": 4001} {"train_loss": -25.916492462158203, "global_step": 332124, "epoch": 4001} {"train_loss": -25.5001277923584, "global_step": 332125, "epoch": 4001} {"train_loss": -26.16016960144043, "global_step": 332126, "epoch": 4001} {"train_loss": -26.31787109375, "global_step": 332127, "epoch": 4001} {"train_loss": -25.735177993774414, "global_step": 332128, "epoch": 4001} {"train_loss": -26.134618759155273, "global_step": 332129, "epoch": 4001} {"train_loss": -25.58249282836914, "global_step": 332130, "epoch": 4001} {"train_loss": -26.132583618164062, "global_step": 332131, "epoch": 4001} {"train_loss": -26.1637020111084, "global_step": 332132, "epoch": 4001} {"train_loss": -26.27322769165039, "global_step": 332133, "epoch": 4001} {"train_loss": -25.959487915039062, "global_step": 332134, "epoch": 4001} {"train_loss": -26.093994140625, "global_step": 332135, "epoch": 4001} {"train_loss": -26.126550674438477, "global_step": 332136, "epoch": 4001} {"train_loss": -26.236398696899414, "global_step": 332137, "epoch": 4001} {"train_loss": -25.956708908081055, "global_step": 332138, "epoch": 4001} {"train_loss": -26.138477325439453, "global_step": 332139, "epoch": 4001} {"train_loss": -26.122228622436523, "global_step": 332140, "epoch": 4001} {"train_loss": -26.239282608032227, "global_step": 332141, "epoch": 4001} {"train_loss": -26.033649444580078, "global_step": 332142, "epoch": 4001} {"train_loss": -26.14154624938965, "global_step": 332143, "epoch": 4001} {"train_loss": -26.195877075195312, "global_step": 332144, "epoch": 4001} {"train_loss": -25.903213500976562, "global_step": 332145, "epoch": 4001} {"train_loss": -26.14259147644043, "global_step": 332146, "epoch": 4001} {"train_loss": -26.304935455322266, "global_step": 332147, "epoch": 4001} {"train_loss": -26.303823471069336, "global_step": 332148, "epoch": 4001} {"train_loss": -25.74602699279785, "global_step": 332149, "epoch": 4001} {"train_loss": -26.143945693969727, "global_step": 332150, "epoch": 4001} {"train_loss": -26.450193405151367, "global_step": 332151, "epoch": 4001} {"train_loss": -25.83363151550293, "global_step": 332152, "epoch": 4001} {"train_loss": -25.915695190429688, "global_step": 332153, "epoch": 4001} {"train_loss": -26.048242568969727, "global_step": 332154, "epoch": 4001} {"train_loss": -26.2929630279541, "global_step": 332155, "epoch": 4001} {"train_loss": -26.35626220703125, "global_step": 332156, "epoch": 4001} {"train_loss": -26.0183048248291, "global_step": 332157, "epoch": 4001} {"train_loss": -26.040266036987305, "global_step": 332158, "epoch": 4001} {"train_loss": -26.015979766845703, "global_step": 332159, "epoch": 4001} {"train_loss": -26.235578536987305, "global_step": 332160, "epoch": 4001} {"train_loss": -26.098255157470703, "global_step": 332161, "epoch": 4001} {"train_loss": -26.43770408630371, "global_step": 332162, "epoch": 4001} {"train_loss": -26.55865478515625, "global_step": 332163, "epoch": 4001} {"train_loss": -26.125152587890625, "global_step": 332164, "epoch": 4001} {"train_loss": -25.69132407314806, "global_step": 332165, "epoch": 4001, "val_loss": 7142305.0} {"train_loss": -24.361602783203125, "global_step": 332166, "epoch": 4002} {"train_loss": -24.28289222717285, "global_step": 332167, "epoch": 4002} {"train_loss": -24.81734275817871, "global_step": 332168, "epoch": 4002} {"train_loss": -24.66253089904785, "global_step": 332169, "epoch": 4002} {"train_loss": -25.412771224975586, "global_step": 332170, "epoch": 4002} {"train_loss": -25.0072021484375, "global_step": 332171, "epoch": 4002} {"train_loss": -24.906291961669922, "global_step": 332172, "epoch": 4002} {"train_loss": -25.511600494384766, "global_step": 332173, "epoch": 4002} {"train_loss": -24.963092803955078, "global_step": 332174, "epoch": 4002} {"train_loss": -25.779035568237305, "global_step": 332175, "epoch": 4002} {"train_loss": -25.144763946533203, "global_step": 332176, "epoch": 4002} {"train_loss": -25.629486083984375, "global_step": 332177, "epoch": 4002} {"train_loss": -25.764404296875, "global_step": 332178, "epoch": 4002} {"train_loss": -25.358976364135742, "global_step": 332179, "epoch": 4002} {"train_loss": -25.46565055847168, "global_step": 332180, "epoch": 4002} {"train_loss": -25.456127166748047, "global_step": 332181, "epoch": 4002} {"train_loss": -25.550352096557617, "global_step": 332182, "epoch": 4002} {"train_loss": -25.585193634033203, "global_step": 332183, "epoch": 4002} {"train_loss": -25.783376693725586, "global_step": 332184, "epoch": 4002} {"train_loss": -25.612808227539062, "global_step": 332185, "epoch": 4002} {"train_loss": -25.46754264831543, "global_step": 332186, "epoch": 4002} {"train_loss": -25.56875991821289, "global_step": 332187, "epoch": 4002} {"train_loss": -25.70392417907715, "global_step": 332188, "epoch": 4002} {"train_loss": -26.011890411376953, "global_step": 332189, "epoch": 4002} {"train_loss": -25.419525146484375, "global_step": 332190, "epoch": 4002} {"train_loss": -25.67852210998535, "global_step": 332191, "epoch": 4002} {"train_loss": -25.862409591674805, "global_step": 332192, "epoch": 4002} {"train_loss": -26.02535057067871, "global_step": 332193, "epoch": 4002} {"train_loss": -25.8460636138916, "global_step": 332194, "epoch": 4002} {"train_loss": -25.703125, "global_step": 332195, "epoch": 4002} {"train_loss": -25.669647216796875, "global_step": 332196, "epoch": 4002} {"train_loss": -25.69379234313965, "global_step": 332197, "epoch": 4002} {"train_loss": -25.908283233642578, "global_step": 332198, "epoch": 4002} {"train_loss": -25.770832061767578, "global_step": 332199, "epoch": 4002} {"train_loss": -25.74604606628418, "global_step": 332200, "epoch": 4002} {"train_loss": -25.98970603942871, "global_step": 332201, "epoch": 4002} {"train_loss": -25.696002960205078, "global_step": 332202, "epoch": 4002} {"train_loss": -26.00446891784668, "global_step": 332203, "epoch": 4002} {"train_loss": -25.780710220336914, "global_step": 332204, "epoch": 4002} {"train_loss": -25.86391258239746, "global_step": 332205, "epoch": 4002} {"train_loss": -26.055429458618164, "global_step": 332206, "epoch": 4002} {"train_loss": -25.917882919311523, "global_step": 332207, "epoch": 4002} {"train_loss": -25.944232940673828, "global_step": 332208, "epoch": 4002} {"train_loss": -25.874231338500977, "global_step": 332209, "epoch": 4002} {"train_loss": -26.38960075378418, "global_step": 332210, "epoch": 4002} {"train_loss": -26.422521591186523, "global_step": 332211, "epoch": 4002} {"train_loss": -25.95361328125, "global_step": 332212, "epoch": 4002} {"train_loss": -26.318872451782227, "global_step": 332213, "epoch": 4002} {"train_loss": -26.088703155517578, "global_step": 332214, "epoch": 4002} {"train_loss": -25.634750366210938, "global_step": 332215, "epoch": 4002} {"train_loss": -25.891706466674805, "global_step": 332216, "epoch": 4002} {"train_loss": -25.845754623413086, "global_step": 332217, "epoch": 4002} {"train_loss": -26.1734619140625, "global_step": 332218, "epoch": 4002} {"train_loss": -26.37298583984375, "global_step": 332219, "epoch": 4002} {"train_loss": -25.859943389892578, "global_step": 332220, "epoch": 4002} {"train_loss": -26.345762252807617, "global_step": 332221, "epoch": 4002} {"train_loss": -26.20454216003418, "global_step": 332222, "epoch": 4002} {"train_loss": -26.441333770751953, "global_step": 332223, "epoch": 4002} {"train_loss": -25.985315322875977, "global_step": 332224, "epoch": 4002} {"train_loss": -26.1468563079834, "global_step": 332225, "epoch": 4002} {"train_loss": -26.197050094604492, "global_step": 332226, "epoch": 4002} {"train_loss": -26.2260684967041, "global_step": 332227, "epoch": 4002} {"train_loss": -25.81744956970215, "global_step": 332228, "epoch": 4002} {"train_loss": -26.3657283782959, "global_step": 332229, "epoch": 4002} {"train_loss": -25.988574981689453, "global_step": 332230, "epoch": 4002} {"train_loss": -26.345306396484375, "global_step": 332231, "epoch": 4002} {"train_loss": -26.110309600830078, "global_step": 332232, "epoch": 4002} {"train_loss": -25.722702026367188, "global_step": 332233, "epoch": 4002} {"train_loss": -25.85590934753418, "global_step": 332234, "epoch": 4002} {"train_loss": -25.905963897705078, "global_step": 332235, "epoch": 4002} {"train_loss": -26.152021408081055, "global_step": 332236, "epoch": 4002} {"train_loss": -26.077987670898438, "global_step": 332237, "epoch": 4002} {"train_loss": -26.084457397460938, "global_step": 332238, "epoch": 4002} {"train_loss": -25.867368698120117, "global_step": 332239, "epoch": 4002} {"train_loss": -25.785573959350586, "global_step": 332240, "epoch": 4002} {"train_loss": -25.989526748657227, "global_step": 332241, "epoch": 4002} {"train_loss": -25.619709014892578, "global_step": 332242, "epoch": 4002} {"train_loss": -25.766881942749023, "global_step": 332243, "epoch": 4002} {"train_loss": -25.531240463256836, "global_step": 332244, "epoch": 4002} {"train_loss": -25.69093894958496, "global_step": 332245, "epoch": 4002} {"train_loss": -26.100400924682617, "global_step": 332246, "epoch": 4002} {"train_loss": -25.546873092651367, "global_step": 332247, "epoch": 4002} {"train_loss": -25.76785774690559, "global_step": 332248, "epoch": 4002, "val_loss": 7198506.0} {"train_loss": -24.12433433532715, "global_step": 332249, "epoch": 4003} {"train_loss": -24.250743865966797, "global_step": 332250, "epoch": 4003} {"train_loss": -25.05946159362793, "global_step": 332251, "epoch": 4003} {"train_loss": -25.150278091430664, "global_step": 332252, "epoch": 4003} {"train_loss": -24.859272003173828, "global_step": 332253, "epoch": 4003} {"train_loss": -25.281925201416016, "global_step": 332254, "epoch": 4003} {"train_loss": -25.543737411499023, "global_step": 332255, "epoch": 4003} {"train_loss": -25.28114128112793, "global_step": 332256, "epoch": 4003} {"train_loss": -25.098302841186523, "global_step": 332257, "epoch": 4003} {"train_loss": -25.5128116607666, "global_step": 332258, "epoch": 4003} {"train_loss": -25.546377182006836, "global_step": 332259, "epoch": 4003} {"train_loss": -25.494789123535156, "global_step": 332260, "epoch": 4003} {"train_loss": -25.40317153930664, "global_step": 332261, "epoch": 4003} {"train_loss": -25.773681640625, "global_step": 332262, "epoch": 4003} {"train_loss": -25.549352645874023, "global_step": 332263, "epoch": 4003} {"train_loss": -25.163387298583984, "global_step": 332264, "epoch": 4003} {"train_loss": -25.718387603759766, "global_step": 332265, "epoch": 4003} {"train_loss": -25.578943252563477, "global_step": 332266, "epoch": 4003} {"train_loss": -25.751256942749023, "global_step": 332267, "epoch": 4003} {"train_loss": -25.578794479370117, "global_step": 332268, "epoch": 4003} {"train_loss": -25.918811798095703, "global_step": 332269, "epoch": 4003} {"train_loss": -25.612796783447266, "global_step": 332270, "epoch": 4003} {"train_loss": -25.685062408447266, "global_step": 332271, "epoch": 4003} {"train_loss": -25.82541847229004, "global_step": 332272, "epoch": 4003} {"train_loss": -25.759021759033203, "global_step": 332273, "epoch": 4003} {"train_loss": -25.58966636657715, "global_step": 332274, "epoch": 4003} {"train_loss": -26.18755531311035, "global_step": 332275, "epoch": 4003} {"train_loss": -25.977075576782227, "global_step": 332276, "epoch": 4003} {"train_loss": -25.9243221282959, "global_step": 332277, "epoch": 4003} {"train_loss": -26.22516441345215, "global_step": 332278, "epoch": 4003} {"train_loss": -25.967336654663086, "global_step": 332279, "epoch": 4003} {"train_loss": -25.860700607299805, "global_step": 332280, "epoch": 4003} {"train_loss": -26.015735626220703, "global_step": 332281, "epoch": 4003} {"train_loss": -25.966581344604492, "global_step": 332282, "epoch": 4003} {"train_loss": -26.0168399810791, "global_step": 332283, "epoch": 4003} {"train_loss": -25.698102951049805, "global_step": 332284, "epoch": 4003} {"train_loss": -26.264938354492188, "global_step": 332285, "epoch": 4003} {"train_loss": -26.058258056640625, "global_step": 332286, "epoch": 4003} {"train_loss": -25.93280601501465, "global_step": 332287, "epoch": 4003} {"train_loss": -26.064428329467773, "global_step": 332288, "epoch": 4003} {"train_loss": -25.9719295501709, "global_step": 332289, "epoch": 4003} {"train_loss": -26.129308700561523, "global_step": 332290, "epoch": 4003} {"train_loss": -26.395267486572266, "global_step": 332291, "epoch": 4003} {"train_loss": -26.16421890258789, "global_step": 332292, "epoch": 4003} {"train_loss": -26.16280174255371, "global_step": 332293, "epoch": 4003} {"train_loss": -25.987802505493164, "global_step": 332294, "epoch": 4003} {"train_loss": -26.11768913269043, "global_step": 332295, "epoch": 4003} {"train_loss": -26.00641441345215, "global_step": 332296, "epoch": 4003} {"train_loss": -26.059589385986328, "global_step": 332297, "epoch": 4003} {"train_loss": -26.143070220947266, "global_step": 332298, "epoch": 4003} {"train_loss": -25.838830947875977, "global_step": 332299, "epoch": 4003} {"train_loss": -26.019702911376953, "global_step": 332300, "epoch": 4003} {"train_loss": -25.78021240234375, "global_step": 332301, "epoch": 4003} {"train_loss": -26.39751625061035, "global_step": 332302, "epoch": 4003} {"train_loss": -26.026412963867188, "global_step": 332303, "epoch": 4003} {"train_loss": -26.19537353515625, "global_step": 332304, "epoch": 4003} {"train_loss": -25.710956573486328, "global_step": 332305, "epoch": 4003} {"train_loss": -25.703948974609375, "global_step": 332306, "epoch": 4003} {"train_loss": -25.79310417175293, "global_step": 332307, "epoch": 4003} {"train_loss": -25.91383171081543, "global_step": 332308, "epoch": 4003} {"train_loss": -25.872472763061523, "global_step": 332309, "epoch": 4003} {"train_loss": -25.813451766967773, "global_step": 332310, "epoch": 4003} {"train_loss": -25.877029418945312, "global_step": 332311, "epoch": 4003} {"train_loss": -26.151681900024414, "global_step": 332312, "epoch": 4003} {"train_loss": -25.857885360717773, "global_step": 332313, "epoch": 4003} {"train_loss": -25.903715133666992, "global_step": 332314, "epoch": 4003} {"train_loss": -26.051715850830078, "global_step": 332315, "epoch": 4003} {"train_loss": -25.948627471923828, "global_step": 332316, "epoch": 4003} {"train_loss": -26.07525634765625, "global_step": 332317, "epoch": 4003} {"train_loss": -26.203144073486328, "global_step": 332318, "epoch": 4003} {"train_loss": -25.964075088500977, "global_step": 332319, "epoch": 4003} {"train_loss": -26.13665199279785, "global_step": 332320, "epoch": 4003} {"train_loss": -26.016284942626953, "global_step": 332321, "epoch": 4003} {"train_loss": -26.276092529296875, "global_step": 332322, "epoch": 4003} {"train_loss": -25.9665470123291, "global_step": 332323, "epoch": 4003} {"train_loss": -26.098478317260742, "global_step": 332324, "epoch": 4003} {"train_loss": -26.126331329345703, "global_step": 332325, "epoch": 4003} {"train_loss": -26.116241455078125, "global_step": 332326, "epoch": 4003} {"train_loss": -26.082401275634766, "global_step": 332327, "epoch": 4003} {"train_loss": -26.157907485961914, "global_step": 332328, "epoch": 4003} {"train_loss": -26.064865112304688, "global_step": 332329, "epoch": 4003} {"train_loss": -26.180830001831055, "global_step": 332330, "epoch": 4003} {"train_loss": -25.826051551175404, "global_step": 332331, "epoch": 4003, "val_loss": 7150818.0} {"train_loss": -25.760595321655273, "global_step": 332332, "epoch": 4004} {"train_loss": -26.00648307800293, "global_step": 332333, "epoch": 4004} {"train_loss": -26.08414077758789, "global_step": 332334, "epoch": 4004} {"train_loss": -26.053268432617188, "global_step": 332335, "epoch": 4004} {"train_loss": -25.67854118347168, "global_step": 332336, "epoch": 4004} {"train_loss": -25.993810653686523, "global_step": 332337, "epoch": 4004} {"train_loss": -25.959716796875, "global_step": 332338, "epoch": 4004} {"train_loss": -26.052392959594727, "global_step": 332339, "epoch": 4004} {"train_loss": -25.68143081665039, "global_step": 332340, "epoch": 4004} {"train_loss": -26.232929229736328, "global_step": 332341, "epoch": 4004} {"train_loss": -25.81231117248535, "global_step": 332342, "epoch": 4004} {"train_loss": -26.064075469970703, "global_step": 332343, "epoch": 4004} {"train_loss": -25.6098690032959, "global_step": 332344, "epoch": 4004} {"train_loss": -26.06329917907715, "global_step": 332345, "epoch": 4004} {"train_loss": -25.902923583984375, "global_step": 332346, "epoch": 4004} {"train_loss": -26.06990623474121, "global_step": 332347, "epoch": 4004} {"train_loss": -25.921655654907227, "global_step": 332348, "epoch": 4004} {"train_loss": -26.083332061767578, "global_step": 332349, "epoch": 4004} {"train_loss": -25.971027374267578, "global_step": 332350, "epoch": 4004} {"train_loss": -25.871875762939453, "global_step": 332351, "epoch": 4004} {"train_loss": -26.027313232421875, "global_step": 332352, "epoch": 4004} {"train_loss": -25.865325927734375, "global_step": 332353, "epoch": 4004} {"train_loss": -26.24395179748535, "global_step": 332354, "epoch": 4004} {"train_loss": -25.97334098815918, "global_step": 332355, "epoch": 4004} {"train_loss": -25.994159698486328, "global_step": 332356, "epoch": 4004} {"train_loss": -26.331579208374023, "global_step": 332357, "epoch": 4004} {"train_loss": -26.162662506103516, "global_step": 332358, "epoch": 4004} {"train_loss": -25.747283935546875, "global_step": 332359, "epoch": 4004} {"train_loss": -26.299518585205078, "global_step": 332360, "epoch": 4004} {"train_loss": -26.23621940612793, "global_step": 332361, "epoch": 4004} {"train_loss": -25.891748428344727, "global_step": 332362, "epoch": 4004} {"train_loss": -26.115888595581055, "global_step": 332363, "epoch": 4004} {"train_loss": -25.914630889892578, "global_step": 332364, "epoch": 4004} {"train_loss": -25.958271026611328, "global_step": 332365, "epoch": 4004} {"train_loss": -25.929128646850586, "global_step": 332366, "epoch": 4004} {"train_loss": -25.942434310913086, "global_step": 332367, "epoch": 4004} {"train_loss": -25.352949142456055, "global_step": 332368, "epoch": 4004} {"train_loss": -25.590839385986328, "global_step": 332369, "epoch": 4004} {"train_loss": -25.302616119384766, "global_step": 332370, "epoch": 4004} {"train_loss": -26.08721351623535, "global_step": 332371, "epoch": 4004} {"train_loss": -25.205142974853516, "global_step": 332372, "epoch": 4004} {"train_loss": -25.800281524658203, "global_step": 332373, "epoch": 4004} {"train_loss": -25.533288955688477, "global_step": 332374, "epoch": 4004} {"train_loss": -25.541372299194336, "global_step": 332375, "epoch": 4004} {"train_loss": -25.612030029296875, "global_step": 332376, "epoch": 4004} {"train_loss": -25.83967399597168, "global_step": 332377, "epoch": 4004} {"train_loss": -25.79129409790039, "global_step": 332378, "epoch": 4004} {"train_loss": -26.011341094970703, "global_step": 332379, "epoch": 4004} {"train_loss": -25.963098526000977, "global_step": 332380, "epoch": 4004} {"train_loss": -25.700651168823242, "global_step": 332381, "epoch": 4004} {"train_loss": -25.9375057220459, "global_step": 332382, "epoch": 4004} {"train_loss": -26.129941940307617, "global_step": 332383, "epoch": 4004} {"train_loss": -25.876203536987305, "global_step": 332384, "epoch": 4004} {"train_loss": -26.29365348815918, "global_step": 332385, "epoch": 4004} {"train_loss": -25.545495986938477, "global_step": 332386, "epoch": 4004} {"train_loss": -26.017688751220703, "global_step": 332387, "epoch": 4004} {"train_loss": -26.19624137878418, "global_step": 332388, "epoch": 4004} {"train_loss": -25.896284103393555, "global_step": 332389, "epoch": 4004} {"train_loss": -26.02292251586914, "global_step": 332390, "epoch": 4004} {"train_loss": -25.651046752929688, "global_step": 332391, "epoch": 4004} {"train_loss": -25.940271377563477, "global_step": 332392, "epoch": 4004} {"train_loss": -25.869596481323242, "global_step": 332393, "epoch": 4004} {"train_loss": -25.952899932861328, "global_step": 332394, "epoch": 4004} {"train_loss": -26.215742111206055, "global_step": 332395, "epoch": 4004} {"train_loss": -25.88750648498535, "global_step": 332396, "epoch": 4004} {"train_loss": -25.780170440673828, "global_step": 332397, "epoch": 4004} {"train_loss": -25.9304256439209, "global_step": 332398, "epoch": 4004} {"train_loss": -26.235198974609375, "global_step": 332399, "epoch": 4004} {"train_loss": -26.188119888305664, "global_step": 332400, "epoch": 4004} {"train_loss": -25.960973739624023, "global_step": 332401, "epoch": 4004} {"train_loss": -26.276142120361328, "global_step": 332402, "epoch": 4004} {"train_loss": -26.23602867126465, "global_step": 332403, "epoch": 4004} {"train_loss": -26.056772232055664, "global_step": 332404, "epoch": 4004} {"train_loss": -26.25927734375, "global_step": 332405, "epoch": 4004} {"train_loss": -26.050933837890625, "global_step": 332406, "epoch": 4004} {"train_loss": -26.327285766601562, "global_step": 332407, "epoch": 4004} {"train_loss": -26.162311553955078, "global_step": 332408, "epoch": 4004} {"train_loss": -26.1005916595459, "global_step": 332409, "epoch": 4004} {"train_loss": -25.906787872314453, "global_step": 332410, "epoch": 4004} {"train_loss": -25.91657066345215, "global_step": 332411, "epoch": 4004} {"train_loss": -26.18572425842285, "global_step": 332412, "epoch": 4004} {"train_loss": -26.272497177124023, "global_step": 332413, "epoch": 4004} {"train_loss": -25.938107295208667, "global_step": 332414, "epoch": 4004, "val_loss": 7014841.0} {"train_loss": -25.45777130126953, "global_step": 332415, "epoch": 4005} {"train_loss": -24.052677154541016, "global_step": 332416, "epoch": 4005} {"train_loss": -23.97197151184082, "global_step": 332417, "epoch": 4005} {"train_loss": -24.200435638427734, "global_step": 332418, "epoch": 4005} {"train_loss": -24.508371353149414, "global_step": 332419, "epoch": 4005} {"train_loss": -24.903974533081055, "global_step": 332420, "epoch": 4005} {"train_loss": -25.11158561706543, "global_step": 332421, "epoch": 4005} {"train_loss": -24.760766983032227, "global_step": 332422, "epoch": 4005} {"train_loss": -25.06498146057129, "global_step": 332423, "epoch": 4005} {"train_loss": -25.23493766784668, "global_step": 332424, "epoch": 4005} {"train_loss": -24.78131675720215, "global_step": 332425, "epoch": 4005} {"train_loss": -25.60809326171875, "global_step": 332426, "epoch": 4005} {"train_loss": -25.04239845275879, "global_step": 332427, "epoch": 4005} {"train_loss": -25.789234161376953, "global_step": 332428, "epoch": 4005} {"train_loss": -24.537954330444336, "global_step": 332429, "epoch": 4005} {"train_loss": -25.418901443481445, "global_step": 332430, "epoch": 4005} {"train_loss": -25.442041397094727, "global_step": 332431, "epoch": 4005} {"train_loss": -25.068288803100586, "global_step": 332432, "epoch": 4005} {"train_loss": -25.364561080932617, "global_step": 332433, "epoch": 4005} {"train_loss": -25.322660446166992, "global_step": 332434, "epoch": 4005} {"train_loss": -25.4462833404541, "global_step": 332435, "epoch": 4005} {"train_loss": -25.175870895385742, "global_step": 332436, "epoch": 4005} {"train_loss": -25.536462783813477, "global_step": 332437, "epoch": 4005} {"train_loss": -25.829755783081055, "global_step": 332438, "epoch": 4005} {"train_loss": -25.90399169921875, "global_step": 332439, "epoch": 4005} {"train_loss": -25.73746681213379, "global_step": 332440, "epoch": 4005} {"train_loss": -25.456388473510742, "global_step": 332441, "epoch": 4005} {"train_loss": -25.84393882751465, "global_step": 332442, "epoch": 4005} {"train_loss": -25.664636611938477, "global_step": 332443, "epoch": 4005} {"train_loss": -25.73902702331543, "global_step": 332444, "epoch": 4005} {"train_loss": -25.71547508239746, "global_step": 332445, "epoch": 4005} {"train_loss": -25.795522689819336, "global_step": 332446, "epoch": 4005} {"train_loss": -25.793787002563477, "global_step": 332447, "epoch": 4005} {"train_loss": -25.68475341796875, "global_step": 332448, "epoch": 4005} {"train_loss": -25.7420654296875, "global_step": 332449, "epoch": 4005} {"train_loss": -26.081518173217773, "global_step": 332450, "epoch": 4005} {"train_loss": -25.72733497619629, "global_step": 332451, "epoch": 4005} {"train_loss": -25.77326011657715, "global_step": 332452, "epoch": 4005} {"train_loss": -25.98674964904785, "global_step": 332453, "epoch": 4005} {"train_loss": -25.903715133666992, "global_step": 332454, "epoch": 4005} {"train_loss": -25.992597579956055, "global_step": 332455, "epoch": 4005} {"train_loss": -25.937255859375, "global_step": 332456, "epoch": 4005} {"train_loss": -26.384138107299805, "global_step": 332457, "epoch": 4005} {"train_loss": -26.10725212097168, "global_step": 332458, "epoch": 4005} {"train_loss": -26.062427520751953, "global_step": 332459, "epoch": 4005} {"train_loss": -25.968908309936523, "global_step": 332460, "epoch": 4005} {"train_loss": -25.902542114257812, "global_step": 332461, "epoch": 4005} {"train_loss": -25.876953125, "global_step": 332462, "epoch": 4005} {"train_loss": -26.18826675415039, "global_step": 332463, "epoch": 4005} {"train_loss": -26.42608642578125, "global_step": 332464, "epoch": 4005} {"train_loss": -26.3504581451416, "global_step": 332465, "epoch": 4005} {"train_loss": -26.076374053955078, "global_step": 332466, "epoch": 4005} {"train_loss": -25.94512939453125, "global_step": 332467, "epoch": 4005} {"train_loss": -26.220197677612305, "global_step": 332468, "epoch": 4005} {"train_loss": -25.948816299438477, "global_step": 332469, "epoch": 4005} {"train_loss": -26.29422378540039, "global_step": 332470, "epoch": 4005} {"train_loss": -26.010940551757812, "global_step": 332471, "epoch": 4005} {"train_loss": -26.065149307250977, "global_step": 332472, "epoch": 4005} {"train_loss": -25.991046905517578, "global_step": 332473, "epoch": 4005} {"train_loss": -26.083927154541016, "global_step": 332474, "epoch": 4005} {"train_loss": -25.96786880493164, "global_step": 332475, "epoch": 4005} {"train_loss": -25.98951530456543, "global_step": 332476, "epoch": 4005} {"train_loss": -25.750507354736328, "global_step": 332477, "epoch": 4005} {"train_loss": -25.589582443237305, "global_step": 332478, "epoch": 4005} {"train_loss": -25.667591094970703, "global_step": 332479, "epoch": 4005} {"train_loss": -25.966552734375, "global_step": 332480, "epoch": 4005} {"train_loss": -25.873945236206055, "global_step": 332481, "epoch": 4005} {"train_loss": -26.23451805114746, "global_step": 332482, "epoch": 4005} {"train_loss": -26.186176300048828, "global_step": 332483, "epoch": 4005} {"train_loss": -25.774402618408203, "global_step": 332484, "epoch": 4005} {"train_loss": -25.71040916442871, "global_step": 332485, "epoch": 4005} {"train_loss": -25.72446060180664, "global_step": 332486, "epoch": 4005} {"train_loss": -25.253469467163086, "global_step": 332487, "epoch": 4005} {"train_loss": -25.48334312438965, "global_step": 332488, "epoch": 4005} {"train_loss": -25.970006942749023, "global_step": 332489, "epoch": 4005} {"train_loss": -25.592126846313477, "global_step": 332490, "epoch": 4005} {"train_loss": -25.863178253173828, "global_step": 332491, "epoch": 4005} {"train_loss": -25.552169799804688, "global_step": 332492, "epoch": 4005} {"train_loss": -26.08295249938965, "global_step": 332493, "epoch": 4005} {"train_loss": -25.592191696166992, "global_step": 332494, "epoch": 4005} {"train_loss": -26.098922729492188, "global_step": 332495, "epoch": 4005} {"train_loss": -25.310977935791016, "global_step": 332496, "epoch": 4005} {"train_loss": -25.64608585403626, "global_step": 332497, "epoch": 4005, "val_loss": 7124405.0} {"train_loss": -25.171241760253906, "global_step": 332498, "epoch": 4006} {"train_loss": -25.16397476196289, "global_step": 332499, "epoch": 4006} {"train_loss": -24.9621639251709, "global_step": 332500, "epoch": 4006} {"train_loss": -25.34415626525879, "global_step": 332501, "epoch": 4006} {"train_loss": -25.193389892578125, "global_step": 332502, "epoch": 4006} {"train_loss": -25.396509170532227, "global_step": 332503, "epoch": 4006} {"train_loss": -25.44370460510254, "global_step": 332504, "epoch": 4006} {"train_loss": -25.276947021484375, "global_step": 332505, "epoch": 4006} {"train_loss": -25.411483764648438, "global_step": 332506, "epoch": 4006} {"train_loss": -24.896060943603516, "global_step": 332507, "epoch": 4006} {"train_loss": -25.33130645751953, "global_step": 332508, "epoch": 4006} {"train_loss": -24.62723731994629, "global_step": 332509, "epoch": 4006} {"train_loss": -25.679121017456055, "global_step": 332510, "epoch": 4006} {"train_loss": -25.514774322509766, "global_step": 332511, "epoch": 4006} {"train_loss": -25.54920196533203, "global_step": 332512, "epoch": 4006} {"train_loss": -25.46726417541504, "global_step": 332513, "epoch": 4006} {"train_loss": -25.430137634277344, "global_step": 332514, "epoch": 4006} {"train_loss": -25.543716430664062, "global_step": 332515, "epoch": 4006} {"train_loss": -25.57114028930664, "global_step": 332516, "epoch": 4006} {"train_loss": -25.628238677978516, "global_step": 332517, "epoch": 4006} {"train_loss": -25.74098777770996, "global_step": 332518, "epoch": 4006} {"train_loss": -25.8325138092041, "global_step": 332519, "epoch": 4006} {"train_loss": -25.6650390625, "global_step": 332520, "epoch": 4006} {"train_loss": -25.496200561523438, "global_step": 332521, "epoch": 4006} {"train_loss": -25.8225040435791, "global_step": 332522, "epoch": 4006} {"train_loss": -25.634140014648438, "global_step": 332523, "epoch": 4006} {"train_loss": -26.028303146362305, "global_step": 332524, "epoch": 4006} {"train_loss": -25.651174545288086, "global_step": 332525, "epoch": 4006} {"train_loss": -25.57394790649414, "global_step": 332526, "epoch": 4006} {"train_loss": -25.537094116210938, "global_step": 332527, "epoch": 4006} {"train_loss": -25.945892333984375, "global_step": 332528, "epoch": 4006} {"train_loss": -25.65534019470215, "global_step": 332529, "epoch": 4006} {"train_loss": -25.774763107299805, "global_step": 332530, "epoch": 4006} {"train_loss": -25.663253784179688, "global_step": 332531, "epoch": 4006} {"train_loss": -25.747089385986328, "global_step": 332532, "epoch": 4006} {"train_loss": -26.072275161743164, "global_step": 332533, "epoch": 4006} {"train_loss": -26.3138370513916, "global_step": 332534, "epoch": 4006} {"train_loss": -25.623416900634766, "global_step": 332535, "epoch": 4006} {"train_loss": -25.842004776000977, "global_step": 332536, "epoch": 4006} {"train_loss": -26.20454216003418, "global_step": 332537, "epoch": 4006} {"train_loss": -25.80567741394043, "global_step": 332538, "epoch": 4006} {"train_loss": -25.690021514892578, "global_step": 332539, "epoch": 4006} {"train_loss": -26.15594482421875, "global_step": 332540, "epoch": 4006} {"train_loss": -26.269678115844727, "global_step": 332541, "epoch": 4006} {"train_loss": -26.0671443939209, "global_step": 332542, "epoch": 4006} {"train_loss": -26.414159774780273, "global_step": 332543, "epoch": 4006} {"train_loss": -26.151777267456055, "global_step": 332544, "epoch": 4006} {"train_loss": -26.365985870361328, "global_step": 332545, "epoch": 4006} {"train_loss": -26.36038589477539, "global_step": 332546, "epoch": 4006} {"train_loss": -25.857275009155273, "global_step": 332547, "epoch": 4006} {"train_loss": -26.476215362548828, "global_step": 332548, "epoch": 4006} {"train_loss": -26.04261589050293, "global_step": 332549, "epoch": 4006} {"train_loss": -26.105762481689453, "global_step": 332550, "epoch": 4006} {"train_loss": -25.92872428894043, "global_step": 332551, "epoch": 4006} {"train_loss": -26.42121696472168, "global_step": 332552, "epoch": 4006} {"train_loss": -26.024057388305664, "global_step": 332553, "epoch": 4006} {"train_loss": -26.47248649597168, "global_step": 332554, "epoch": 4006} {"train_loss": -26.056446075439453, "global_step": 332555, "epoch": 4006} {"train_loss": -26.090177536010742, "global_step": 332556, "epoch": 4006} {"train_loss": -25.84042739868164, "global_step": 332557, "epoch": 4006} {"train_loss": -26.445419311523438, "global_step": 332558, "epoch": 4006} {"train_loss": -26.2517032623291, "global_step": 332559, "epoch": 4006} {"train_loss": -25.95619773864746, "global_step": 332560, "epoch": 4006} {"train_loss": -25.924360275268555, "global_step": 332561, "epoch": 4006} {"train_loss": -25.66482925415039, "global_step": 332562, "epoch": 4006} {"train_loss": -26.0104923248291, "global_step": 332563, "epoch": 4006} {"train_loss": -25.42342185974121, "global_step": 332564, "epoch": 4006} {"train_loss": -25.409814834594727, "global_step": 332565, "epoch": 4006} {"train_loss": -26.211429595947266, "global_step": 332566, "epoch": 4006} {"train_loss": -25.891529083251953, "global_step": 332567, "epoch": 4006} {"train_loss": -25.864227294921875, "global_step": 332568, "epoch": 4006} {"train_loss": -25.747777938842773, "global_step": 332569, "epoch": 4006} {"train_loss": -26.350088119506836, "global_step": 332570, "epoch": 4006} {"train_loss": -25.840566635131836, "global_step": 332571, "epoch": 4006} {"train_loss": -25.983015060424805, "global_step": 332572, "epoch": 4006} {"train_loss": -25.768951416015625, "global_step": 332573, "epoch": 4006} {"train_loss": -25.710229873657227, "global_step": 332574, "epoch": 4006} {"train_loss": -25.945714950561523, "global_step": 332575, "epoch": 4006} {"train_loss": -26.124927520751953, "global_step": 332576, "epoch": 4006} {"train_loss": -25.555654525756836, "global_step": 332577, "epoch": 4006} {"train_loss": -25.848052978515625, "global_step": 332578, "epoch": 4006} {"train_loss": -26.075101852416992, "global_step": 332579, "epoch": 4006} {"train_loss": -25.793211029236573, "global_step": 332580, "epoch": 4006, "val_loss": 7251560.5} {"train_loss": -25.592933654785156, "global_step": 332581, "epoch": 4007} {"train_loss": -25.915918350219727, "global_step": 332582, "epoch": 4007} {"train_loss": -25.562992095947266, "global_step": 332583, "epoch": 4007} {"train_loss": -25.576396942138672, "global_step": 332584, "epoch": 4007} {"train_loss": -25.356090545654297, "global_step": 332585, "epoch": 4007} {"train_loss": -25.633838653564453, "global_step": 332586, "epoch": 4007} {"train_loss": -25.910303115844727, "global_step": 332587, "epoch": 4007} {"train_loss": -25.859130859375, "global_step": 332588, "epoch": 4007} {"train_loss": -25.565900802612305, "global_step": 332589, "epoch": 4007} {"train_loss": -25.598594665527344, "global_step": 332590, "epoch": 4007} {"train_loss": -26.01502799987793, "global_step": 332591, "epoch": 4007} {"train_loss": -25.822647094726562, "global_step": 332592, "epoch": 4007} {"train_loss": -25.815540313720703, "global_step": 332593, "epoch": 4007} {"train_loss": -25.642932891845703, "global_step": 332594, "epoch": 4007} {"train_loss": -25.883817672729492, "global_step": 332595, "epoch": 4007} {"train_loss": -26.0317440032959, "global_step": 332596, "epoch": 4007} {"train_loss": -25.934309005737305, "global_step": 332597, "epoch": 4007} {"train_loss": -26.061796188354492, "global_step": 332598, "epoch": 4007} {"train_loss": -25.642892837524414, "global_step": 332599, "epoch": 4007} {"train_loss": -26.08961296081543, "global_step": 332600, "epoch": 4007} {"train_loss": -26.00029945373535, "global_step": 332601, "epoch": 4007} {"train_loss": -26.24724769592285, "global_step": 332602, "epoch": 4007} {"train_loss": -26.148645401000977, "global_step": 332603, "epoch": 4007} {"train_loss": -25.710126876831055, "global_step": 332604, "epoch": 4007} {"train_loss": -26.201099395751953, "global_step": 332605, "epoch": 4007} {"train_loss": -25.766849517822266, "global_step": 332606, "epoch": 4007} {"train_loss": -25.811365127563477, "global_step": 332607, "epoch": 4007} {"train_loss": -25.800756454467773, "global_step": 332608, "epoch": 4007} {"train_loss": -25.88950538635254, "global_step": 332609, "epoch": 4007} {"train_loss": -25.840726852416992, "global_step": 332610, "epoch": 4007} {"train_loss": -25.994476318359375, "global_step": 332611, "epoch": 4007} {"train_loss": -25.90191078186035, "global_step": 332612, "epoch": 4007} {"train_loss": -25.903385162353516, "global_step": 332613, "epoch": 4007} {"train_loss": -26.420934677124023, "global_step": 332614, "epoch": 4007} {"train_loss": -26.020116806030273, "global_step": 332615, "epoch": 4007} {"train_loss": -26.074310302734375, "global_step": 332616, "epoch": 4007} {"train_loss": -26.000625610351562, "global_step": 332617, "epoch": 4007} {"train_loss": -25.949995040893555, "global_step": 332618, "epoch": 4007} {"train_loss": -25.798974990844727, "global_step": 332619, "epoch": 4007} {"train_loss": -25.71980094909668, "global_step": 332620, "epoch": 4007} {"train_loss": -25.855695724487305, "global_step": 332621, "epoch": 4007} {"train_loss": -26.12495994567871, "global_step": 332622, "epoch": 4007} {"train_loss": -26.192609786987305, "global_step": 332623, "epoch": 4007} {"train_loss": -26.049835205078125, "global_step": 332624, "epoch": 4007} {"train_loss": -26.04551124572754, "global_step": 332625, "epoch": 4007} {"train_loss": -26.263086318969727, "global_step": 332626, "epoch": 4007} {"train_loss": -26.172739028930664, "global_step": 332627, "epoch": 4007} {"train_loss": -26.070581436157227, "global_step": 332628, "epoch": 4007} {"train_loss": -26.030607223510742, "global_step": 332629, "epoch": 4007} {"train_loss": -25.94272232055664, "global_step": 332630, "epoch": 4007} {"train_loss": -25.829029083251953, "global_step": 332631, "epoch": 4007} {"train_loss": -26.033010482788086, "global_step": 332632, "epoch": 4007} {"train_loss": -25.8763484954834, "global_step": 332633, "epoch": 4007} {"train_loss": -25.338550567626953, "global_step": 332634, "epoch": 4007} {"train_loss": -25.365732192993164, "global_step": 332635, "epoch": 4007} {"train_loss": -26.234785079956055, "global_step": 332636, "epoch": 4007} {"train_loss": -25.6852970123291, "global_step": 332637, "epoch": 4007} {"train_loss": -25.928394317626953, "global_step": 332638, "epoch": 4007} {"train_loss": -25.479705810546875, "global_step": 332639, "epoch": 4007} {"train_loss": -25.378190994262695, "global_step": 332640, "epoch": 4007} {"train_loss": -26.060321807861328, "global_step": 332641, "epoch": 4007} {"train_loss": -25.742431640625, "global_step": 332642, "epoch": 4007} {"train_loss": -25.796127319335938, "global_step": 332643, "epoch": 4007} {"train_loss": -25.75929069519043, "global_step": 332644, "epoch": 4007} {"train_loss": -25.89344596862793, "global_step": 332645, "epoch": 4007} {"train_loss": -25.742496490478516, "global_step": 332646, "epoch": 4007} {"train_loss": -26.206958770751953, "global_step": 332647, "epoch": 4007} {"train_loss": -25.51307487487793, "global_step": 332648, "epoch": 4007} {"train_loss": -25.54903793334961, "global_step": 332649, "epoch": 4007} {"train_loss": -25.830320358276367, "global_step": 332650, "epoch": 4007} {"train_loss": -25.905654907226562, "global_step": 332651, "epoch": 4007} {"train_loss": -25.939443588256836, "global_step": 332652, "epoch": 4007} {"train_loss": -26.186573028564453, "global_step": 332653, "epoch": 4007} {"train_loss": -25.80517578125, "global_step": 332654, "epoch": 4007} {"train_loss": -26.072423934936523, "global_step": 332655, "epoch": 4007} {"train_loss": -25.794424057006836, "global_step": 332656, "epoch": 4007} {"train_loss": -26.0793514251709, "global_step": 332657, "epoch": 4007} {"train_loss": -25.7846736907959, "global_step": 332658, "epoch": 4007} {"train_loss": -25.552736282348633, "global_step": 332659, "epoch": 4007} {"train_loss": -25.921417236328125, "global_step": 332660, "epoch": 4007} {"train_loss": -26.17167091369629, "global_step": 332661, "epoch": 4007} {"train_loss": -25.552534103393555, "global_step": 332662, "epoch": 4007} {"train_loss": -25.865727275250904, "global_step": 332663, "epoch": 4007, "val_loss": 7137916.0} {"train_loss": -25.2384033203125, "global_step": 332664, "epoch": 4008} {"train_loss": -25.234424591064453, "global_step": 332665, "epoch": 4008} {"train_loss": -25.70307731628418, "global_step": 332666, "epoch": 4008} {"train_loss": -25.498401641845703, "global_step": 332667, "epoch": 4008} {"train_loss": -25.611108779907227, "global_step": 332668, "epoch": 4008} {"train_loss": -25.958288192749023, "global_step": 332669, "epoch": 4008} {"train_loss": -25.406335830688477, "global_step": 332670, "epoch": 4008} {"train_loss": -25.698774337768555, "global_step": 332671, "epoch": 4008} {"train_loss": -25.873315811157227, "global_step": 332672, "epoch": 4008} {"train_loss": -25.582279205322266, "global_step": 332673, "epoch": 4008} {"train_loss": -25.662811279296875, "global_step": 332674, "epoch": 4008} {"train_loss": -25.824377059936523, "global_step": 332675, "epoch": 4008} {"train_loss": -25.61231803894043, "global_step": 332676, "epoch": 4008} {"train_loss": -25.62939453125, "global_step": 332677, "epoch": 4008} {"train_loss": -26.068212509155273, "global_step": 332678, "epoch": 4008} {"train_loss": -26.014163970947266, "global_step": 332679, "epoch": 4008} {"train_loss": -26.184324264526367, "global_step": 332680, "epoch": 4008} {"train_loss": -25.652982711791992, "global_step": 332681, "epoch": 4008} {"train_loss": -25.7866268157959, "global_step": 332682, "epoch": 4008} {"train_loss": -25.850067138671875, "global_step": 332683, "epoch": 4008} {"train_loss": -26.017093658447266, "global_step": 332684, "epoch": 4008} {"train_loss": -25.778217315673828, "global_step": 332685, "epoch": 4008} {"train_loss": -25.679889678955078, "global_step": 332686, "epoch": 4008} {"train_loss": -25.90476417541504, "global_step": 332687, "epoch": 4008} {"train_loss": -26.0274600982666, "global_step": 332688, "epoch": 4008} {"train_loss": -25.77833366394043, "global_step": 332689, "epoch": 4008} {"train_loss": -26.4620361328125, "global_step": 332690, "epoch": 4008} {"train_loss": -25.672433853149414, "global_step": 332691, "epoch": 4008} {"train_loss": -26.275562286376953, "global_step": 332692, "epoch": 4008} {"train_loss": -25.679428100585938, "global_step": 332693, "epoch": 4008} {"train_loss": -25.973554611206055, "global_step": 332694, "epoch": 4008} {"train_loss": -26.035266876220703, "global_step": 332695, "epoch": 4008} {"train_loss": -25.889495849609375, "global_step": 332696, "epoch": 4008} {"train_loss": -25.797657012939453, "global_step": 332697, "epoch": 4008} {"train_loss": -26.01741600036621, "global_step": 332698, "epoch": 4008} {"train_loss": -25.982770919799805, "global_step": 332699, "epoch": 4008} {"train_loss": -26.274707794189453, "global_step": 332700, "epoch": 4008} {"train_loss": -26.200342178344727, "global_step": 332701, "epoch": 4008} {"train_loss": -26.299657821655273, "global_step": 332702, "epoch": 4008} {"train_loss": -26.099328994750977, "global_step": 332703, "epoch": 4008} {"train_loss": -26.290739059448242, "global_step": 332704, "epoch": 4008} {"train_loss": -26.124082565307617, "global_step": 332705, "epoch": 4008} {"train_loss": -26.007471084594727, "global_step": 332706, "epoch": 4008} {"train_loss": -25.997364044189453, "global_step": 332707, "epoch": 4008} {"train_loss": -25.7883358001709, "global_step": 332708, "epoch": 4008} {"train_loss": -25.9709529876709, "global_step": 332709, "epoch": 4008} {"train_loss": -26.323705673217773, "global_step": 332710, "epoch": 4008} {"train_loss": -26.454559326171875, "global_step": 332711, "epoch": 4008} {"train_loss": -26.02569007873535, "global_step": 332712, "epoch": 4008} {"train_loss": -26.077619552612305, "global_step": 332713, "epoch": 4008} {"train_loss": -26.198530197143555, "global_step": 332714, "epoch": 4008} {"train_loss": -25.860483169555664, "global_step": 332715, "epoch": 4008} {"train_loss": -26.006423950195312, "global_step": 332716, "epoch": 4008} {"train_loss": -26.114953994750977, "global_step": 332717, "epoch": 4008} {"train_loss": -26.111722946166992, "global_step": 332718, "epoch": 4008} {"train_loss": -26.12529945373535, "global_step": 332719, "epoch": 4008} {"train_loss": -26.255762100219727, "global_step": 332720, "epoch": 4008} {"train_loss": -26.168136596679688, "global_step": 332721, "epoch": 4008} {"train_loss": -25.921863555908203, "global_step": 332722, "epoch": 4008} {"train_loss": -25.84518814086914, "global_step": 332723, "epoch": 4008} {"train_loss": -26.168004989624023, "global_step": 332724, "epoch": 4008} {"train_loss": -25.7830810546875, "global_step": 332725, "epoch": 4008} {"train_loss": -26.15003776550293, "global_step": 332726, "epoch": 4008} {"train_loss": -26.1690673828125, "global_step": 332727, "epoch": 4008} {"train_loss": -25.924671173095703, "global_step": 332728, "epoch": 4008} {"train_loss": -25.53420639038086, "global_step": 332729, "epoch": 4008} {"train_loss": -25.964704513549805, "global_step": 332730, "epoch": 4008} {"train_loss": -26.0893611907959, "global_step": 332731, "epoch": 4008} {"train_loss": -25.977313995361328, "global_step": 332732, "epoch": 4008} {"train_loss": -25.702041625976562, "global_step": 332733, "epoch": 4008} {"train_loss": -26.104093551635742, "global_step": 332734, "epoch": 4008} {"train_loss": -26.284564971923828, "global_step": 332735, "epoch": 4008} {"train_loss": -26.101001739501953, "global_step": 332736, "epoch": 4008} {"train_loss": -25.935169219970703, "global_step": 332737, "epoch": 4008} {"train_loss": -25.817386627197266, "global_step": 332738, "epoch": 4008} {"train_loss": -25.851764678955078, "global_step": 332739, "epoch": 4008} {"train_loss": -26.034393310546875, "global_step": 332740, "epoch": 4008} {"train_loss": -25.879535675048828, "global_step": 332741, "epoch": 4008} {"train_loss": -25.930953979492188, "global_step": 332742, "epoch": 4008} {"train_loss": -25.557767868041992, "global_step": 332743, "epoch": 4008} {"train_loss": -26.509586334228516, "global_step": 332744, "epoch": 4008} {"train_loss": -25.942413330078125, "global_step": 332745, "epoch": 4008} {"train_loss": -25.936925727200794, "global_step": 332746, "epoch": 4008, "val_loss": 7129133.0} {"train_loss": -25.408369064331055, "global_step": 332747, "epoch": 4009} {"train_loss": -23.846878051757812, "global_step": 332748, "epoch": 4009} {"train_loss": -25.32355308532715, "global_step": 332749, "epoch": 4009} {"train_loss": -25.697412490844727, "global_step": 332750, "epoch": 4009} {"train_loss": -25.140945434570312, "global_step": 332751, "epoch": 4009} {"train_loss": -24.230512619018555, "global_step": 332752, "epoch": 4009} {"train_loss": -25.259109497070312, "global_step": 332753, "epoch": 4009} {"train_loss": -25.562992095947266, "global_step": 332754, "epoch": 4009} {"train_loss": -25.59174919128418, "global_step": 332755, "epoch": 4009} {"train_loss": -25.36779022216797, "global_step": 332756, "epoch": 4009} {"train_loss": -25.57206916809082, "global_step": 332757, "epoch": 4009} {"train_loss": -25.287944793701172, "global_step": 332758, "epoch": 4009} {"train_loss": -25.612573623657227, "global_step": 332759, "epoch": 4009} {"train_loss": -25.741790771484375, "global_step": 332760, "epoch": 4009} {"train_loss": -25.819488525390625, "global_step": 332761, "epoch": 4009} {"train_loss": -25.673818588256836, "global_step": 332762, "epoch": 4009} {"train_loss": -25.556421279907227, "global_step": 332763, "epoch": 4009} {"train_loss": -25.670867919921875, "global_step": 332764, "epoch": 4009} {"train_loss": -25.925302505493164, "global_step": 332765, "epoch": 4009} {"train_loss": -25.712732315063477, "global_step": 332766, "epoch": 4009} {"train_loss": -25.73296546936035, "global_step": 332767, "epoch": 4009} {"train_loss": -26.03547477722168, "global_step": 332768, "epoch": 4009} {"train_loss": -25.670230865478516, "global_step": 332769, "epoch": 4009} {"train_loss": -25.837736129760742, "global_step": 332770, "epoch": 4009} {"train_loss": -25.925344467163086, "global_step": 332771, "epoch": 4009} {"train_loss": -25.85454750061035, "global_step": 332772, "epoch": 4009} {"train_loss": -25.8317928314209, "global_step": 332773, "epoch": 4009} {"train_loss": -25.701648712158203, "global_step": 332774, "epoch": 4009} {"train_loss": -25.859073638916016, "global_step": 332775, "epoch": 4009} {"train_loss": -26.22749137878418, "global_step": 332776, "epoch": 4009} {"train_loss": -25.911502838134766, "global_step": 332777, "epoch": 4009} {"train_loss": -25.21311378479004, "global_step": 332778, "epoch": 4009} {"train_loss": -26.320850372314453, "global_step": 332779, "epoch": 4009} {"train_loss": -25.787586212158203, "global_step": 332780, "epoch": 4009} {"train_loss": -25.994495391845703, "global_step": 332781, "epoch": 4009} {"train_loss": -25.814313888549805, "global_step": 332782, "epoch": 4009} {"train_loss": -26.099506378173828, "global_step": 332783, "epoch": 4009} {"train_loss": -26.19211769104004, "global_step": 332784, "epoch": 4009} {"train_loss": -25.96303367614746, "global_step": 332785, "epoch": 4009} {"train_loss": -25.838056564331055, "global_step": 332786, "epoch": 4009} {"train_loss": -25.9024600982666, "global_step": 332787, "epoch": 4009} {"train_loss": -26.288639068603516, "global_step": 332788, "epoch": 4009} {"train_loss": -26.225650787353516, "global_step": 332789, "epoch": 4009} {"train_loss": -26.070148468017578, "global_step": 332790, "epoch": 4009} {"train_loss": -26.046178817749023, "global_step": 332791, "epoch": 4009} {"train_loss": -25.979230880737305, "global_step": 332792, "epoch": 4009} {"train_loss": -26.37796974182129, "global_step": 332793, "epoch": 4009} {"train_loss": -26.358701705932617, "global_step": 332794, "epoch": 4009} {"train_loss": -26.08583641052246, "global_step": 332795, "epoch": 4009} {"train_loss": -26.073942184448242, "global_step": 332796, "epoch": 4009} {"train_loss": -25.839704513549805, "global_step": 332797, "epoch": 4009} {"train_loss": -26.150476455688477, "global_step": 332798, "epoch": 4009} {"train_loss": -25.675649642944336, "global_step": 332799, "epoch": 4009} {"train_loss": -26.08033561706543, "global_step": 332800, "epoch": 4009} {"train_loss": -26.1326847076416, "global_step": 332801, "epoch": 4009} {"train_loss": -26.157596588134766, "global_step": 332802, "epoch": 4009} {"train_loss": -26.163602828979492, "global_step": 332803, "epoch": 4009} {"train_loss": -25.946537017822266, "global_step": 332804, "epoch": 4009} {"train_loss": -26.141454696655273, "global_step": 332805, "epoch": 4009} {"train_loss": -26.11799430847168, "global_step": 332806, "epoch": 4009} {"train_loss": -26.3342342376709, "global_step": 332807, "epoch": 4009} {"train_loss": -26.395618438720703, "global_step": 332808, "epoch": 4009} {"train_loss": -25.96609878540039, "global_step": 332809, "epoch": 4009} {"train_loss": -26.296894073486328, "global_step": 332810, "epoch": 4009} {"train_loss": -25.87836265563965, "global_step": 332811, "epoch": 4009} {"train_loss": -25.87587547302246, "global_step": 332812, "epoch": 4009} {"train_loss": -25.74329948425293, "global_step": 332813, "epoch": 4009} {"train_loss": -26.301801681518555, "global_step": 332814, "epoch": 4009} {"train_loss": -26.27229118347168, "global_step": 332815, "epoch": 4009} {"train_loss": -25.912744522094727, "global_step": 332816, "epoch": 4009} {"train_loss": -25.75132179260254, "global_step": 332817, "epoch": 4009} {"train_loss": -25.352306365966797, "global_step": 332818, "epoch": 4009} {"train_loss": -25.516586303710938, "global_step": 332819, "epoch": 4009} {"train_loss": -25.5880126953125, "global_step": 332820, "epoch": 4009} {"train_loss": -26.0699405670166, "global_step": 332821, "epoch": 4009} {"train_loss": -26.042449951171875, "global_step": 332822, "epoch": 4009} {"train_loss": -26.13958740234375, "global_step": 332823, "epoch": 4009} {"train_loss": -25.753345489501953, "global_step": 332824, "epoch": 4009} {"train_loss": -25.661855697631836, "global_step": 332825, "epoch": 4009} {"train_loss": -25.769927978515625, "global_step": 332826, "epoch": 4009} {"train_loss": -26.094196319580078, "global_step": 332827, "epoch": 4009} {"train_loss": -26.0369873046875, "global_step": 332828, "epoch": 4009} {"train_loss": -25.82006624520543, "global_step": 332829, "epoch": 4009, "val_loss": 7150728.0} {"train_loss": -24.768522262573242, "global_step": 332830, "epoch": 4010} {"train_loss": -24.970256805419922, "global_step": 332831, "epoch": 4010} {"train_loss": -25.818817138671875, "global_step": 332832, "epoch": 4010} {"train_loss": -25.246145248413086, "global_step": 332833, "epoch": 4010} {"train_loss": -25.79767417907715, "global_step": 332834, "epoch": 4010} {"train_loss": -25.52652931213379, "global_step": 332835, "epoch": 4010} {"train_loss": -25.813190460205078, "global_step": 332836, "epoch": 4010} {"train_loss": -25.180681228637695, "global_step": 332837, "epoch": 4010} {"train_loss": -25.69028091430664, "global_step": 332838, "epoch": 4010} {"train_loss": -25.758249282836914, "global_step": 332839, "epoch": 4010} {"train_loss": -26.05324363708496, "global_step": 332840, "epoch": 4010} {"train_loss": -25.670812606811523, "global_step": 332841, "epoch": 4010} {"train_loss": -25.392850875854492, "global_step": 332842, "epoch": 4010} {"train_loss": -26.138137817382812, "global_step": 332843, "epoch": 4010} {"train_loss": -25.334693908691406, "global_step": 332844, "epoch": 4010} {"train_loss": -25.863683700561523, "global_step": 332845, "epoch": 4010} {"train_loss": -25.888647079467773, "global_step": 332846, "epoch": 4010} {"train_loss": -25.968664169311523, "global_step": 332847, "epoch": 4010} {"train_loss": -26.30632972717285, "global_step": 332848, "epoch": 4010} {"train_loss": -25.66986083984375, "global_step": 332849, "epoch": 4010} {"train_loss": -25.89495277404785, "global_step": 332850, "epoch": 4010} {"train_loss": -25.400150299072266, "global_step": 332851, "epoch": 4010} {"train_loss": -25.713315963745117, "global_step": 332852, "epoch": 4010} {"train_loss": -25.749042510986328, "global_step": 332853, "epoch": 4010} {"train_loss": -26.012598037719727, "global_step": 332854, "epoch": 4010} {"train_loss": -25.798288345336914, "global_step": 332855, "epoch": 4010} {"train_loss": -26.188709259033203, "global_step": 332856, "epoch": 4010} {"train_loss": -26.16179847717285, "global_step": 332857, "epoch": 4010} {"train_loss": -25.952594757080078, "global_step": 332858, "epoch": 4010} {"train_loss": -25.653440475463867, "global_step": 332859, "epoch": 4010} {"train_loss": -25.987592697143555, "global_step": 332860, "epoch": 4010} {"train_loss": -25.9327392578125, "global_step": 332861, "epoch": 4010} {"train_loss": -26.18177604675293, "global_step": 332862, "epoch": 4010} {"train_loss": -26.056396484375, "global_step": 332863, "epoch": 4010} {"train_loss": -26.038360595703125, "global_step": 332864, "epoch": 4010} {"train_loss": -26.269412994384766, "global_step": 332865, "epoch": 4010} {"train_loss": -25.889982223510742, "global_step": 332866, "epoch": 4010} {"train_loss": -25.95979118347168, "global_step": 332867, "epoch": 4010} {"train_loss": -25.836393356323242, "global_step": 332868, "epoch": 4010} {"train_loss": -26.04108238220215, "global_step": 332869, "epoch": 4010} {"train_loss": -25.9139461517334, "global_step": 332870, "epoch": 4010} {"train_loss": -26.13038444519043, "global_step": 332871, "epoch": 4010} {"train_loss": -25.90961265563965, "global_step": 332872, "epoch": 4010} {"train_loss": -26.383214950561523, "global_step": 332873, "epoch": 4010} {"train_loss": -26.18790626525879, "global_step": 332874, "epoch": 4010} {"train_loss": -26.118207931518555, "global_step": 332875, "epoch": 4010} {"train_loss": -26.036096572875977, "global_step": 332876, "epoch": 4010} {"train_loss": -26.185510635375977, "global_step": 332877, "epoch": 4010} {"train_loss": -26.510156631469727, "global_step": 332878, "epoch": 4010} {"train_loss": -25.88150405883789, "global_step": 332879, "epoch": 4010} {"train_loss": -26.03202247619629, "global_step": 332880, "epoch": 4010} {"train_loss": -25.83656883239746, "global_step": 332881, "epoch": 4010} {"train_loss": -26.16701316833496, "global_step": 332882, "epoch": 4010} {"train_loss": -26.005142211914062, "global_step": 332883, "epoch": 4010} {"train_loss": -26.106149673461914, "global_step": 332884, "epoch": 4010} {"train_loss": -26.243865966796875, "global_step": 332885, "epoch": 4010} {"train_loss": -25.869583129882812, "global_step": 332886, "epoch": 4010} {"train_loss": -25.988189697265625, "global_step": 332887, "epoch": 4010} {"train_loss": -26.3110294342041, "global_step": 332888, "epoch": 4010} {"train_loss": -26.05103874206543, "global_step": 332889, "epoch": 4010} {"train_loss": -26.20985221862793, "global_step": 332890, "epoch": 4010} {"train_loss": -25.93719482421875, "global_step": 332891, "epoch": 4010} {"train_loss": -26.494781494140625, "global_step": 332892, "epoch": 4010} {"train_loss": -25.9570255279541, "global_step": 332893, "epoch": 4010} {"train_loss": -26.229156494140625, "global_step": 332894, "epoch": 4010} {"train_loss": -26.194250106811523, "global_step": 332895, "epoch": 4010} {"train_loss": -26.20060157775879, "global_step": 332896, "epoch": 4010} {"train_loss": -26.68745231628418, "global_step": 332897, "epoch": 4010} {"train_loss": -26.38699722290039, "global_step": 332898, "epoch": 4010} {"train_loss": -26.1910343170166, "global_step": 332899, "epoch": 4010} {"train_loss": -25.885465621948242, "global_step": 332900, "epoch": 4010} {"train_loss": -26.05517578125, "global_step": 332901, "epoch": 4010} {"train_loss": -26.151636123657227, "global_step": 332902, "epoch": 4010} {"train_loss": -25.994537353515625, "global_step": 332903, "epoch": 4010} {"train_loss": -26.0302677154541, "global_step": 332904, "epoch": 4010} {"train_loss": -26.080148696899414, "global_step": 332905, "epoch": 4010} {"train_loss": -25.96259117126465, "global_step": 332906, "epoch": 4010} {"train_loss": -25.767744064331055, "global_step": 332907, "epoch": 4010} {"train_loss": -26.127660751342773, "global_step": 332908, "epoch": 4010} {"train_loss": -26.09515953063965, "global_step": 332909, "epoch": 4010} {"train_loss": -25.83631706237793, "global_step": 332910, "epoch": 4010} {"train_loss": -26.05938148498535, "global_step": 332911, "epoch": 4010} {"train_loss": -25.955526099147566, "global_step": 332912, "epoch": 4010, "val_loss": 7169747.0} {"train_loss": -24.295459747314453, "global_step": 332913, "epoch": 4011} {"train_loss": -24.06649398803711, "global_step": 332914, "epoch": 4011} {"train_loss": -25.37135887145996, "global_step": 332915, "epoch": 4011} {"train_loss": -25.140432357788086, "global_step": 332916, "epoch": 4011} {"train_loss": -24.840713500976562, "global_step": 332917, "epoch": 4011} {"train_loss": -24.45576286315918, "global_step": 332918, "epoch": 4011} {"train_loss": -25.271577835083008, "global_step": 332919, "epoch": 4011} {"train_loss": -25.05426597595215, "global_step": 332920, "epoch": 4011} {"train_loss": -25.346139907836914, "global_step": 332921, "epoch": 4011} {"train_loss": -25.08919334411621, "global_step": 332922, "epoch": 4011} {"train_loss": -25.274280548095703, "global_step": 332923, "epoch": 4011} {"train_loss": -25.311079025268555, "global_step": 332924, "epoch": 4011} {"train_loss": -25.485692977905273, "global_step": 332925, "epoch": 4011} {"train_loss": -25.66176414489746, "global_step": 332926, "epoch": 4011} {"train_loss": -25.451555252075195, "global_step": 332927, "epoch": 4011} {"train_loss": -25.317523956298828, "global_step": 332928, "epoch": 4011} {"train_loss": -25.530973434448242, "global_step": 332929, "epoch": 4011} {"train_loss": -25.263412475585938, "global_step": 332930, "epoch": 4011} {"train_loss": -25.7852783203125, "global_step": 332931, "epoch": 4011} {"train_loss": -25.14479637145996, "global_step": 332932, "epoch": 4011} {"train_loss": -25.952306747436523, "global_step": 332933, "epoch": 4011} {"train_loss": -25.58272361755371, "global_step": 332934, "epoch": 4011} {"train_loss": -25.612491607666016, "global_step": 332935, "epoch": 4011} {"train_loss": -25.846851348876953, "global_step": 332936, "epoch": 4011} {"train_loss": -25.78168296813965, "global_step": 332937, "epoch": 4011} {"train_loss": -26.047042846679688, "global_step": 332938, "epoch": 4011} {"train_loss": -25.956531524658203, "global_step": 332939, "epoch": 4011} {"train_loss": -25.500106811523438, "global_step": 332940, "epoch": 4011} {"train_loss": -25.768163681030273, "global_step": 332941, "epoch": 4011} {"train_loss": -25.884754180908203, "global_step": 332942, "epoch": 4011} {"train_loss": -25.824777603149414, "global_step": 332943, "epoch": 4011} {"train_loss": -25.75115394592285, "global_step": 332944, "epoch": 4011} {"train_loss": -25.870893478393555, "global_step": 332945, "epoch": 4011} {"train_loss": -25.951135635375977, "global_step": 332946, "epoch": 4011} {"train_loss": -25.797779083251953, "global_step": 332947, "epoch": 4011} {"train_loss": -26.129714965820312, "global_step": 332948, "epoch": 4011} {"train_loss": -25.638477325439453, "global_step": 332949, "epoch": 4011} {"train_loss": -25.726892471313477, "global_step": 332950, "epoch": 4011} {"train_loss": -25.986169815063477, "global_step": 332951, "epoch": 4011} {"train_loss": -26.008508682250977, "global_step": 332952, "epoch": 4011} {"train_loss": -26.0226993560791, "global_step": 332953, "epoch": 4011} {"train_loss": -25.742612838745117, "global_step": 332954, "epoch": 4011} {"train_loss": -25.94697380065918, "global_step": 332955, "epoch": 4011} {"train_loss": -25.93561363220215, "global_step": 332956, "epoch": 4011} {"train_loss": -26.37604331970215, "global_step": 332957, "epoch": 4011} {"train_loss": -26.141284942626953, "global_step": 332958, "epoch": 4011} {"train_loss": -25.920007705688477, "global_step": 332959, "epoch": 4011} {"train_loss": -25.857929229736328, "global_step": 332960, "epoch": 4011} {"train_loss": -25.70722770690918, "global_step": 332961, "epoch": 4011} {"train_loss": -26.218341827392578, "global_step": 332962, "epoch": 4011} {"train_loss": -26.103357315063477, "global_step": 332963, "epoch": 4011} {"train_loss": -25.88030433654785, "global_step": 332964, "epoch": 4011} {"train_loss": -26.435653686523438, "global_step": 332965, "epoch": 4011} {"train_loss": -25.786893844604492, "global_step": 332966, "epoch": 4011} {"train_loss": -25.72625160217285, "global_step": 332967, "epoch": 4011} {"train_loss": -26.173063278198242, "global_step": 332968, "epoch": 4011} {"train_loss": -26.009994506835938, "global_step": 332969, "epoch": 4011} {"train_loss": -26.074920654296875, "global_step": 332970, "epoch": 4011} {"train_loss": -26.36557960510254, "global_step": 332971, "epoch": 4011} {"train_loss": -26.12363052368164, "global_step": 332972, "epoch": 4011} {"train_loss": -26.088245391845703, "global_step": 332973, "epoch": 4011} {"train_loss": -25.618688583374023, "global_step": 332974, "epoch": 4011} {"train_loss": -26.226226806640625, "global_step": 332975, "epoch": 4011} {"train_loss": -25.94142723083496, "global_step": 332976, "epoch": 4011} {"train_loss": -26.459314346313477, "global_step": 332977, "epoch": 4011} {"train_loss": -25.740522384643555, "global_step": 332978, "epoch": 4011} {"train_loss": -25.8719482421875, "global_step": 332979, "epoch": 4011} {"train_loss": -25.56105613708496, "global_step": 332980, "epoch": 4011} {"train_loss": -25.858539581298828, "global_step": 332981, "epoch": 4011} {"train_loss": -26.234067916870117, "global_step": 332982, "epoch": 4011} {"train_loss": -26.1240234375, "global_step": 332983, "epoch": 4011} {"train_loss": -25.786542892456055, "global_step": 332984, "epoch": 4011} {"train_loss": -26.07520866394043, "global_step": 332985, "epoch": 4011} {"train_loss": -25.962087631225586, "global_step": 332986, "epoch": 4011} {"train_loss": -25.702030181884766, "global_step": 332987, "epoch": 4011} {"train_loss": -25.790552139282227, "global_step": 332988, "epoch": 4011} {"train_loss": -26.18360710144043, "global_step": 332989, "epoch": 4011} {"train_loss": -26.17417335510254, "global_step": 332990, "epoch": 4011} {"train_loss": -26.116260528564453, "global_step": 332991, "epoch": 4011} {"train_loss": -25.844594955444336, "global_step": 332992, "epoch": 4011} {"train_loss": -25.9128475189209, "global_step": 332993, "epoch": 4011} {"train_loss": -26.061065673828125, "global_step": 332994, "epoch": 4011} {"train_loss": -25.762490743614105, "global_step": 332995, "epoch": 4011, "val_loss": 7151439.0} {"train_loss": -25.612585067749023, "global_step": 332996, "epoch": 4012} {"train_loss": -25.801721572875977, "global_step": 332997, "epoch": 4012} {"train_loss": -25.689191818237305, "global_step": 332998, "epoch": 4012} {"train_loss": -25.4257869720459, "global_step": 332999, "epoch": 4012} {"train_loss": -25.7134952545166, "global_step": 333000, "epoch": 4012} {"train_loss": -25.05897331237793, "global_step": 333001, "epoch": 4012} {"train_loss": -25.823455810546875, "global_step": 333002, "epoch": 4012} {"train_loss": -25.511323928833008, "global_step": 333003, "epoch": 4012} {"train_loss": -25.184965133666992, "global_step": 333004, "epoch": 4012} {"train_loss": -25.8880672454834, "global_step": 333005, "epoch": 4012} {"train_loss": -25.62652015686035, "global_step": 333006, "epoch": 4012} {"train_loss": -25.73357582092285, "global_step": 333007, "epoch": 4012} {"train_loss": -26.022031784057617, "global_step": 333008, "epoch": 4012} {"train_loss": -25.493778228759766, "global_step": 333009, "epoch": 4012} {"train_loss": -25.603281021118164, "global_step": 333010, "epoch": 4012} {"train_loss": -25.9342041015625, "global_step": 333011, "epoch": 4012} {"train_loss": -26.094465255737305, "global_step": 333012, "epoch": 4012} {"train_loss": -25.609495162963867, "global_step": 333013, "epoch": 4012} {"train_loss": -25.9392032623291, "global_step": 333014, "epoch": 4012} {"train_loss": -25.917688369750977, "global_step": 333015, "epoch": 4012} {"train_loss": -25.681100845336914, "global_step": 333016, "epoch": 4012} {"train_loss": -26.395681381225586, "global_step": 333017, "epoch": 4012} {"train_loss": -25.825927734375, "global_step": 333018, "epoch": 4012} {"train_loss": -26.448205947875977, "global_step": 333019, "epoch": 4012} {"train_loss": -25.799192428588867, "global_step": 333020, "epoch": 4012} {"train_loss": -26.14697265625, "global_step": 333021, "epoch": 4012} {"train_loss": -26.300256729125977, "global_step": 333022, "epoch": 4012} {"train_loss": -25.8325138092041, "global_step": 333023, "epoch": 4012} {"train_loss": -25.964941024780273, "global_step": 333024, "epoch": 4012} {"train_loss": -26.46156120300293, "global_step": 333025, "epoch": 4012} {"train_loss": -26.024316787719727, "global_step": 333026, "epoch": 4012} {"train_loss": -26.13986587524414, "global_step": 333027, "epoch": 4012} {"train_loss": -26.16865348815918, "global_step": 333028, "epoch": 4012} {"train_loss": -26.0600643157959, "global_step": 333029, "epoch": 4012} {"train_loss": -26.2587833404541, "global_step": 333030, "epoch": 4012} {"train_loss": -26.213727951049805, "global_step": 333031, "epoch": 4012} {"train_loss": -26.339956283569336, "global_step": 333032, "epoch": 4012} {"train_loss": -26.406158447265625, "global_step": 333033, "epoch": 4012} {"train_loss": -26.02740478515625, "global_step": 333034, "epoch": 4012} {"train_loss": -26.339065551757812, "global_step": 333035, "epoch": 4012} {"train_loss": -26.0417537689209, "global_step": 333036, "epoch": 4012} {"train_loss": -26.155975341796875, "global_step": 333037, "epoch": 4012} {"train_loss": -26.129926681518555, "global_step": 333038, "epoch": 4012} {"train_loss": -26.23189353942871, "global_step": 333039, "epoch": 4012} {"train_loss": -26.2872371673584, "global_step": 333040, "epoch": 4012} {"train_loss": -26.21624755859375, "global_step": 333041, "epoch": 4012} {"train_loss": -26.209165573120117, "global_step": 333042, "epoch": 4012} {"train_loss": -25.64435386657715, "global_step": 333043, "epoch": 4012} {"train_loss": -25.935413360595703, "global_step": 333044, "epoch": 4012} {"train_loss": -25.907806396484375, "global_step": 333045, "epoch": 4012} {"train_loss": -26.085941314697266, "global_step": 333046, "epoch": 4012} {"train_loss": -26.092798233032227, "global_step": 333047, "epoch": 4012} {"train_loss": -26.160490036010742, "global_step": 333048, "epoch": 4012} {"train_loss": -26.084732055664062, "global_step": 333049, "epoch": 4012} {"train_loss": -25.939252853393555, "global_step": 333050, "epoch": 4012} {"train_loss": -26.27518653869629, "global_step": 333051, "epoch": 4012} {"train_loss": -26.207141876220703, "global_step": 333052, "epoch": 4012} {"train_loss": -26.417510986328125, "global_step": 333053, "epoch": 4012} {"train_loss": -25.95319175720215, "global_step": 333054, "epoch": 4012} {"train_loss": -25.668060302734375, "global_step": 333055, "epoch": 4012} {"train_loss": -25.879858016967773, "global_step": 333056, "epoch": 4012} {"train_loss": -26.32511329650879, "global_step": 333057, "epoch": 4012} {"train_loss": -26.134403228759766, "global_step": 333058, "epoch": 4012} {"train_loss": -26.30584716796875, "global_step": 333059, "epoch": 4012} {"train_loss": -26.182958602905273, "global_step": 333060, "epoch": 4012} {"train_loss": -25.913679122924805, "global_step": 333061, "epoch": 4012} {"train_loss": -25.76173210144043, "global_step": 333062, "epoch": 4012} {"train_loss": -25.9668025970459, "global_step": 333063, "epoch": 4012} {"train_loss": -26.03887367248535, "global_step": 333064, "epoch": 4012} {"train_loss": -26.090742111206055, "global_step": 333065, "epoch": 4012} {"train_loss": -26.3975887298584, "global_step": 333066, "epoch": 4012} {"train_loss": -26.058734893798828, "global_step": 333067, "epoch": 4012} {"train_loss": -26.1552677154541, "global_step": 333068, "epoch": 4012} {"train_loss": -25.894824981689453, "global_step": 333069, "epoch": 4012} {"train_loss": -25.923419952392578, "global_step": 333070, "epoch": 4012} {"train_loss": -26.199323654174805, "global_step": 333071, "epoch": 4012} {"train_loss": -25.909610748291016, "global_step": 333072, "epoch": 4012} {"train_loss": -25.93657875061035, "global_step": 333073, "epoch": 4012} {"train_loss": -26.245275497436523, "global_step": 333074, "epoch": 4012} {"train_loss": -26.125946044921875, "global_step": 333075, "epoch": 4012} {"train_loss": -26.111963272094727, "global_step": 333076, "epoch": 4012} {"train_loss": -26.17109489440918, "global_step": 333077, "epoch": 4012} {"train_loss": -25.99537943644696, "global_step": 333078, "epoch": 4012, "val_loss": 7177657.0} {"train_loss": -23.332916259765625, "global_step": 333079, "epoch": 4013} {"train_loss": -20.966520309448242, "global_step": 333080, "epoch": 4013} {"train_loss": -23.602542877197266, "global_step": 333081, "epoch": 4013} {"train_loss": -24.443178176879883, "global_step": 333082, "epoch": 4013} {"train_loss": -24.399463653564453, "global_step": 333083, "epoch": 4013} {"train_loss": -25.02315330505371, "global_step": 333084, "epoch": 4013} {"train_loss": -24.677906036376953, "global_step": 333085, "epoch": 4013} {"train_loss": -24.739185333251953, "global_step": 333086, "epoch": 4013} {"train_loss": -24.952625274658203, "global_step": 333087, "epoch": 4013} {"train_loss": -25.2265567779541, "global_step": 333088, "epoch": 4013} {"train_loss": -24.81000518798828, "global_step": 333089, "epoch": 4013} {"train_loss": -25.34502601623535, "global_step": 333090, "epoch": 4013} {"train_loss": -25.251577377319336, "global_step": 333091, "epoch": 4013} {"train_loss": -24.83942413330078, "global_step": 333092, "epoch": 4013} {"train_loss": -25.411426544189453, "global_step": 333093, "epoch": 4013} {"train_loss": -25.384065628051758, "global_step": 333094, "epoch": 4013} {"train_loss": -25.31796646118164, "global_step": 333095, "epoch": 4013} {"train_loss": -25.17563819885254, "global_step": 333096, "epoch": 4013} {"train_loss": -25.28925895690918, "global_step": 333097, "epoch": 4013} {"train_loss": -25.355371475219727, "global_step": 333098, "epoch": 4013} {"train_loss": -25.256324768066406, "global_step": 333099, "epoch": 4013} {"train_loss": -25.5002498626709, "global_step": 333100, "epoch": 4013} {"train_loss": -25.166431427001953, "global_step": 333101, "epoch": 4013} {"train_loss": -25.71137046813965, "global_step": 333102, "epoch": 4013} {"train_loss": -25.544475555419922, "global_step": 333103, "epoch": 4013} {"train_loss": -25.2789363861084, "global_step": 333104, "epoch": 4013} {"train_loss": -25.413816452026367, "global_step": 333105, "epoch": 4013} {"train_loss": -25.78767204284668, "global_step": 333106, "epoch": 4013} {"train_loss": -25.556814193725586, "global_step": 333107, "epoch": 4013} {"train_loss": -25.547739028930664, "global_step": 333108, "epoch": 4013} {"train_loss": -25.500879287719727, "global_step": 333109, "epoch": 4013} {"train_loss": -25.897974014282227, "global_step": 333110, "epoch": 4013} {"train_loss": -25.514636993408203, "global_step": 333111, "epoch": 4013} {"train_loss": -25.992700576782227, "global_step": 333112, "epoch": 4013} {"train_loss": -25.91654396057129, "global_step": 333113, "epoch": 4013} {"train_loss": -25.991113662719727, "global_step": 333114, "epoch": 4013} {"train_loss": -26.05592155456543, "global_step": 333115, "epoch": 4013} {"train_loss": -25.61490249633789, "global_step": 333116, "epoch": 4013} {"train_loss": -25.64969825744629, "global_step": 333117, "epoch": 4013} {"train_loss": -26.02875328063965, "global_step": 333118, "epoch": 4013} {"train_loss": -25.453330993652344, "global_step": 333119, "epoch": 4013} {"train_loss": -26.26886558532715, "global_step": 333120, "epoch": 4013} {"train_loss": -25.962793350219727, "global_step": 333121, "epoch": 4013} {"train_loss": -26.166955947875977, "global_step": 333122, "epoch": 4013} {"train_loss": -26.133411407470703, "global_step": 333123, "epoch": 4013} {"train_loss": -25.946258544921875, "global_step": 333124, "epoch": 4013} {"train_loss": -25.69459342956543, "global_step": 333125, "epoch": 4013} {"train_loss": -25.946706771850586, "global_step": 333126, "epoch": 4013} {"train_loss": -25.82016372680664, "global_step": 333127, "epoch": 4013} {"train_loss": -25.60381507873535, "global_step": 333128, "epoch": 4013} {"train_loss": -26.088850021362305, "global_step": 333129, "epoch": 4013} {"train_loss": -25.884841918945312, "global_step": 333130, "epoch": 4013} {"train_loss": -26.141138076782227, "global_step": 333131, "epoch": 4013} {"train_loss": -25.957508087158203, "global_step": 333132, "epoch": 4013} {"train_loss": -26.210041046142578, "global_step": 333133, "epoch": 4013} {"train_loss": -26.180740356445312, "global_step": 333134, "epoch": 4013} {"train_loss": -26.064252853393555, "global_step": 333135, "epoch": 4013} {"train_loss": -26.099557876586914, "global_step": 333136, "epoch": 4013} {"train_loss": -25.91506004333496, "global_step": 333137, "epoch": 4013} {"train_loss": -26.158308029174805, "global_step": 333138, "epoch": 4013} {"train_loss": -26.206098556518555, "global_step": 333139, "epoch": 4013} {"train_loss": -26.334054946899414, "global_step": 333140, "epoch": 4013} {"train_loss": -25.67913818359375, "global_step": 333141, "epoch": 4013} {"train_loss": -26.396162033081055, "global_step": 333142, "epoch": 4013} {"train_loss": -25.87232780456543, "global_step": 333143, "epoch": 4013} {"train_loss": -26.199310302734375, "global_step": 333144, "epoch": 4013} {"train_loss": -25.679107666015625, "global_step": 333145, "epoch": 4013} {"train_loss": -25.87172508239746, "global_step": 333146, "epoch": 4013} {"train_loss": -25.735401153564453, "global_step": 333147, "epoch": 4013} {"train_loss": -25.9931697845459, "global_step": 333148, "epoch": 4013} {"train_loss": -26.07569694519043, "global_step": 333149, "epoch": 4013} {"train_loss": -25.928802490234375, "global_step": 333150, "epoch": 4013} {"train_loss": -25.715368270874023, "global_step": 333151, "epoch": 4013} {"train_loss": -25.99915885925293, "global_step": 333152, "epoch": 4013} {"train_loss": -25.97116470336914, "global_step": 333153, "epoch": 4013} {"train_loss": -26.193811416625977, "global_step": 333154, "epoch": 4013} {"train_loss": -26.246875762939453, "global_step": 333155, "epoch": 4013} {"train_loss": -25.932119369506836, "global_step": 333156, "epoch": 4013} {"train_loss": -26.10101890563965, "global_step": 333157, "epoch": 4013} {"train_loss": -26.370824813842773, "global_step": 333158, "epoch": 4013} {"train_loss": -26.23227310180664, "global_step": 333159, "epoch": 4013} {"train_loss": -26.144514083862305, "global_step": 333160, "epoch": 4013} {"train_loss": -25.604230329214808, "global_step": 333161, "epoch": 4013, "val_loss": 7187690.0} {"train_loss": -26.11578369140625, "global_step": 333162, "epoch": 4014} {"train_loss": -25.72440528869629, "global_step": 333163, "epoch": 4014} {"train_loss": -25.3404598236084, "global_step": 333164, "epoch": 4014} {"train_loss": -25.8708553314209, "global_step": 333165, "epoch": 4014} {"train_loss": -25.410886764526367, "global_step": 333166, "epoch": 4014} {"train_loss": -25.868072509765625, "global_step": 333167, "epoch": 4014} {"train_loss": -25.874914169311523, "global_step": 333168, "epoch": 4014} {"train_loss": -25.68231773376465, "global_step": 333169, "epoch": 4014} {"train_loss": -25.822834014892578, "global_step": 333170, "epoch": 4014} {"train_loss": -25.970117568969727, "global_step": 333171, "epoch": 4014} {"train_loss": -26.23479652404785, "global_step": 333172, "epoch": 4014} {"train_loss": -26.181238174438477, "global_step": 333173, "epoch": 4014} {"train_loss": -26.1487979888916, "global_step": 333174, "epoch": 4014} {"train_loss": -25.913740158081055, "global_step": 333175, "epoch": 4014} {"train_loss": -25.944055557250977, "global_step": 333176, "epoch": 4014} {"train_loss": -26.309179306030273, "global_step": 333177, "epoch": 4014} {"train_loss": -26.342090606689453, "global_step": 333178, "epoch": 4014} {"train_loss": -26.024255752563477, "global_step": 333179, "epoch": 4014} {"train_loss": -25.88876724243164, "global_step": 333180, "epoch": 4014} {"train_loss": -26.434803009033203, "global_step": 333181, "epoch": 4014} {"train_loss": -25.953384399414062, "global_step": 333182, "epoch": 4014} {"train_loss": -25.954736709594727, "global_step": 333183, "epoch": 4014} {"train_loss": -26.036237716674805, "global_step": 333184, "epoch": 4014} {"train_loss": -26.24002456665039, "global_step": 333185, "epoch": 4014} {"train_loss": -26.031164169311523, "global_step": 333186, "epoch": 4014} {"train_loss": -26.13568115234375, "global_step": 333187, "epoch": 4014} {"train_loss": -26.0082950592041, "global_step": 333188, "epoch": 4014} {"train_loss": -26.376941680908203, "global_step": 333189, "epoch": 4014} {"train_loss": -25.677600860595703, "global_step": 333190, "epoch": 4014} {"train_loss": -26.241016387939453, "global_step": 333191, "epoch": 4014} {"train_loss": -26.153003692626953, "global_step": 333192, "epoch": 4014} {"train_loss": -25.601469039916992, "global_step": 333193, "epoch": 4014} {"train_loss": -26.05645751953125, "global_step": 333194, "epoch": 4014} {"train_loss": -26.423376083374023, "global_step": 333195, "epoch": 4014} {"train_loss": -26.068140029907227, "global_step": 333196, "epoch": 4014} {"train_loss": -26.254108428955078, "global_step": 333197, "epoch": 4014} {"train_loss": -26.018888473510742, "global_step": 333198, "epoch": 4014} {"train_loss": -25.657367706298828, "global_step": 333199, "epoch": 4014} {"train_loss": -26.124792098999023, "global_step": 333200, "epoch": 4014} {"train_loss": -26.0024471282959, "global_step": 333201, "epoch": 4014} {"train_loss": -26.078125, "global_step": 333202, "epoch": 4014} {"train_loss": -25.860828399658203, "global_step": 333203, "epoch": 4014} {"train_loss": -25.952783584594727, "global_step": 333204, "epoch": 4014} {"train_loss": -25.76629066467285, "global_step": 333205, "epoch": 4014} {"train_loss": -25.98455810546875, "global_step": 333206, "epoch": 4014} {"train_loss": -25.643634796142578, "global_step": 333207, "epoch": 4014} {"train_loss": -26.128849029541016, "global_step": 333208, "epoch": 4014} {"train_loss": -25.521947860717773, "global_step": 333209, "epoch": 4014} {"train_loss": -25.644437789916992, "global_step": 333210, "epoch": 4014} {"train_loss": -25.333688735961914, "global_step": 333211, "epoch": 4014} {"train_loss": -26.05803871154785, "global_step": 333212, "epoch": 4014} {"train_loss": -25.578041076660156, "global_step": 333213, "epoch": 4014} {"train_loss": -25.48311424255371, "global_step": 333214, "epoch": 4014} {"train_loss": -26.19856834411621, "global_step": 333215, "epoch": 4014} {"train_loss": -25.71626091003418, "global_step": 333216, "epoch": 4014} {"train_loss": -25.809864044189453, "global_step": 333217, "epoch": 4014} {"train_loss": -25.652313232421875, "global_step": 333218, "epoch": 4014} {"train_loss": -25.8676700592041, "global_step": 333219, "epoch": 4014} {"train_loss": -25.780561447143555, "global_step": 333220, "epoch": 4014} {"train_loss": -25.760211944580078, "global_step": 333221, "epoch": 4014} {"train_loss": -25.794097900390625, "global_step": 333222, "epoch": 4014} {"train_loss": -26.33355712890625, "global_step": 333223, "epoch": 4014} {"train_loss": -25.825363159179688, "global_step": 333224, "epoch": 4014} {"train_loss": -26.24740982055664, "global_step": 333225, "epoch": 4014} {"train_loss": -25.845794677734375, "global_step": 333226, "epoch": 4014} {"train_loss": -25.9630126953125, "global_step": 333227, "epoch": 4014} {"train_loss": -26.066162109375, "global_step": 333228, "epoch": 4014} {"train_loss": -25.58241844177246, "global_step": 333229, "epoch": 4014} {"train_loss": -25.834447860717773, "global_step": 333230, "epoch": 4014} {"train_loss": -25.777196884155273, "global_step": 333231, "epoch": 4014} {"train_loss": -26.251707077026367, "global_step": 333232, "epoch": 4014} {"train_loss": -26.050344467163086, "global_step": 333233, "epoch": 4014} {"train_loss": -26.0563907623291, "global_step": 333234, "epoch": 4014} {"train_loss": -25.964740753173828, "global_step": 333235, "epoch": 4014} {"train_loss": -25.95429801940918, "global_step": 333236, "epoch": 4014} {"train_loss": -25.681787490844727, "global_step": 333237, "epoch": 4014} {"train_loss": -25.93665885925293, "global_step": 333238, "epoch": 4014} {"train_loss": -26.15437889099121, "global_step": 333239, "epoch": 4014} {"train_loss": -26.198633193969727, "global_step": 333240, "epoch": 4014} {"train_loss": -26.23682975769043, "global_step": 333241, "epoch": 4014} {"train_loss": -26.08237075805664, "global_step": 333242, "epoch": 4014} {"train_loss": -26.1180419921875, "global_step": 333243, "epoch": 4014} {"train_loss": -25.949288885277436, "global_step": 333244, "epoch": 4014, "val_loss": 6933300.0} {"train_loss": -25.469940185546875, "global_step": 333245, "epoch": 4015} {"train_loss": -25.51934814453125, "global_step": 333246, "epoch": 4015} {"train_loss": -26.213346481323242, "global_step": 333247, "epoch": 4015} {"train_loss": -25.87664222717285, "global_step": 333248, "epoch": 4015} {"train_loss": -25.7051944732666, "global_step": 333249, "epoch": 4015} {"train_loss": -25.974512100219727, "global_step": 333250, "epoch": 4015} {"train_loss": -26.368484497070312, "global_step": 333251, "epoch": 4015} {"train_loss": -25.909780502319336, "global_step": 333252, "epoch": 4015} {"train_loss": -25.53657341003418, "global_step": 333253, "epoch": 4015} {"train_loss": -25.793994903564453, "global_step": 333254, "epoch": 4015} {"train_loss": -26.04632568359375, "global_step": 333255, "epoch": 4015} {"train_loss": -26.102310180664062, "global_step": 333256, "epoch": 4015} {"train_loss": -25.971343994140625, "global_step": 333257, "epoch": 4015} {"train_loss": -26.285266876220703, "global_step": 333258, "epoch": 4015} {"train_loss": -25.89861488342285, "global_step": 333259, "epoch": 4015} {"train_loss": -25.94327735900879, "global_step": 333260, "epoch": 4015} {"train_loss": -25.88153648376465, "global_step": 333261, "epoch": 4015} {"train_loss": -26.176361083984375, "global_step": 333262, "epoch": 4015} {"train_loss": -26.2066593170166, "global_step": 333263, "epoch": 4015} {"train_loss": -25.64430046081543, "global_step": 333264, "epoch": 4015} {"train_loss": -25.991647720336914, "global_step": 333265, "epoch": 4015} {"train_loss": -25.91765785217285, "global_step": 333266, "epoch": 4015} {"train_loss": -25.94521141052246, "global_step": 333267, "epoch": 4015} {"train_loss": -25.655460357666016, "global_step": 333268, "epoch": 4015} {"train_loss": -25.9219970703125, "global_step": 333269, "epoch": 4015} {"train_loss": -25.500404357910156, "global_step": 333270, "epoch": 4015} {"train_loss": -26.07673454284668, "global_step": 333271, "epoch": 4015} {"train_loss": -25.891469955444336, "global_step": 333272, "epoch": 4015} {"train_loss": -26.140905380249023, "global_step": 333273, "epoch": 4015} {"train_loss": -26.14423179626465, "global_step": 333274, "epoch": 4015} {"train_loss": -26.138681411743164, "global_step": 333275, "epoch": 4015} {"train_loss": -26.004384994506836, "global_step": 333276, "epoch": 4015} {"train_loss": -26.161527633666992, "global_step": 333277, "epoch": 4015} {"train_loss": -26.131093978881836, "global_step": 333278, "epoch": 4015} {"train_loss": -26.278696060180664, "global_step": 333279, "epoch": 4015} {"train_loss": -25.82318687438965, "global_step": 333280, "epoch": 4015} {"train_loss": -26.18682289123535, "global_step": 333281, "epoch": 4015} {"train_loss": -25.663049697875977, "global_step": 333282, "epoch": 4015} {"train_loss": -26.247785568237305, "global_step": 333283, "epoch": 4015} {"train_loss": -26.193073272705078, "global_step": 333284, "epoch": 4015} {"train_loss": -26.065372467041016, "global_step": 333285, "epoch": 4015} {"train_loss": -26.049829483032227, "global_step": 333286, "epoch": 4015} {"train_loss": -26.302032470703125, "global_step": 333287, "epoch": 4015} {"train_loss": -26.209247589111328, "global_step": 333288, "epoch": 4015} {"train_loss": -25.953901290893555, "global_step": 333289, "epoch": 4015} {"train_loss": -26.127918243408203, "global_step": 333290, "epoch": 4015} {"train_loss": -26.046768188476562, "global_step": 333291, "epoch": 4015} {"train_loss": -26.15447425842285, "global_step": 333292, "epoch": 4015} {"train_loss": -26.3353214263916, "global_step": 333293, "epoch": 4015} {"train_loss": -26.17034912109375, "global_step": 333294, "epoch": 4015} {"train_loss": -26.4317569732666, "global_step": 333295, "epoch": 4015} {"train_loss": -25.8148193359375, "global_step": 333296, "epoch": 4015} {"train_loss": -26.104095458984375, "global_step": 333297, "epoch": 4015} {"train_loss": -25.89640235900879, "global_step": 333298, "epoch": 4015} {"train_loss": -25.518741607666016, "global_step": 333299, "epoch": 4015} {"train_loss": -24.83368492126465, "global_step": 333300, "epoch": 4015} {"train_loss": -24.59756851196289, "global_step": 333301, "epoch": 4015} {"train_loss": -25.638538360595703, "global_step": 333302, "epoch": 4015} {"train_loss": -25.77594566345215, "global_step": 333303, "epoch": 4015} {"train_loss": -25.70587158203125, "global_step": 333304, "epoch": 4015} {"train_loss": -26.059146881103516, "global_step": 333305, "epoch": 4015} {"train_loss": -25.90118980407715, "global_step": 333306, "epoch": 4015} {"train_loss": -25.319557189941406, "global_step": 333307, "epoch": 4015} {"train_loss": -25.932086944580078, "global_step": 333308, "epoch": 4015} {"train_loss": -25.720874786376953, "global_step": 333309, "epoch": 4015} {"train_loss": -25.418668746948242, "global_step": 333310, "epoch": 4015} {"train_loss": -25.870641708374023, "global_step": 333311, "epoch": 4015} {"train_loss": -25.532522201538086, "global_step": 333312, "epoch": 4015} {"train_loss": -26.3487548828125, "global_step": 333313, "epoch": 4015} {"train_loss": -25.2965145111084, "global_step": 333314, "epoch": 4015} {"train_loss": -25.720142364501953, "global_step": 333315, "epoch": 4015} {"train_loss": -25.598480224609375, "global_step": 333316, "epoch": 4015} {"train_loss": -25.841079711914062, "global_step": 333317, "epoch": 4015} {"train_loss": -25.738727569580078, "global_step": 333318, "epoch": 4015} {"train_loss": -25.928674697875977, "global_step": 333319, "epoch": 4015} {"train_loss": -25.987401962280273, "global_step": 333320, "epoch": 4015} {"train_loss": -25.855594635009766, "global_step": 333321, "epoch": 4015} {"train_loss": -25.92805290222168, "global_step": 333322, "epoch": 4015} {"train_loss": -25.554767608642578, "global_step": 333323, "epoch": 4015} {"train_loss": -25.994186401367188, "global_step": 333324, "epoch": 4015} {"train_loss": -25.842905044555664, "global_step": 333325, "epoch": 4015} {"train_loss": -26.267908096313477, "global_step": 333326, "epoch": 4015} {"train_loss": -25.91111298067024, "global_step": 333327, "epoch": 4015, "val_loss": 6842360.0} {"train_loss": -24.55143165588379, "global_step": 333328, "epoch": 4016} {"train_loss": -23.516740798950195, "global_step": 333329, "epoch": 4016} {"train_loss": -25.0994930267334, "global_step": 333330, "epoch": 4016} {"train_loss": -24.565311431884766, "global_step": 333331, "epoch": 4016} {"train_loss": -25.47559928894043, "global_step": 333332, "epoch": 4016} {"train_loss": -24.90522575378418, "global_step": 333333, "epoch": 4016} {"train_loss": -25.329833984375, "global_step": 333334, "epoch": 4016} {"train_loss": -24.962940216064453, "global_step": 333335, "epoch": 4016} {"train_loss": -25.159048080444336, "global_step": 333336, "epoch": 4016} {"train_loss": -25.120771408081055, "global_step": 333337, "epoch": 4016} {"train_loss": -24.86213493347168, "global_step": 333338, "epoch": 4016} {"train_loss": -25.581298828125, "global_step": 333339, "epoch": 4016} {"train_loss": -25.240802764892578, "global_step": 333340, "epoch": 4016} {"train_loss": -25.242780685424805, "global_step": 333341, "epoch": 4016} {"train_loss": -25.295957565307617, "global_step": 333342, "epoch": 4016} {"train_loss": -25.70807456970215, "global_step": 333343, "epoch": 4016} {"train_loss": -25.436811447143555, "global_step": 333344, "epoch": 4016} {"train_loss": -25.657941818237305, "global_step": 333345, "epoch": 4016} {"train_loss": -25.645849227905273, "global_step": 333346, "epoch": 4016} {"train_loss": -25.920291900634766, "global_step": 333347, "epoch": 4016} {"train_loss": -25.6976375579834, "global_step": 333348, "epoch": 4016} {"train_loss": -25.631269454956055, "global_step": 333349, "epoch": 4016} {"train_loss": -25.4432315826416, "global_step": 333350, "epoch": 4016} {"train_loss": -26.052581787109375, "global_step": 333351, "epoch": 4016} {"train_loss": -25.88649559020996, "global_step": 333352, "epoch": 4016} {"train_loss": -25.798664093017578, "global_step": 333353, "epoch": 4016} {"train_loss": -25.638004302978516, "global_step": 333354, "epoch": 4016} {"train_loss": -25.9689884185791, "global_step": 333355, "epoch": 4016} {"train_loss": -26.02241325378418, "global_step": 333356, "epoch": 4016} {"train_loss": -25.979480743408203, "global_step": 333357, "epoch": 4016} {"train_loss": -25.67523193359375, "global_step": 333358, "epoch": 4016} {"train_loss": -25.61256217956543, "global_step": 333359, "epoch": 4016} {"train_loss": -25.761194229125977, "global_step": 333360, "epoch": 4016} {"train_loss": -26.033124923706055, "global_step": 333361, "epoch": 4016} {"train_loss": -26.177631378173828, "global_step": 333362, "epoch": 4016} {"train_loss": -25.727392196655273, "global_step": 333363, "epoch": 4016} {"train_loss": -26.4333553314209, "global_step": 333364, "epoch": 4016} {"train_loss": -25.740859985351562, "global_step": 333365, "epoch": 4016} {"train_loss": -26.317651748657227, "global_step": 333366, "epoch": 4016} {"train_loss": -26.29810905456543, "global_step": 333367, "epoch": 4016} {"train_loss": -25.903223037719727, "global_step": 333368, "epoch": 4016} {"train_loss": -26.072864532470703, "global_step": 333369, "epoch": 4016} {"train_loss": -26.026416778564453, "global_step": 333370, "epoch": 4016} {"train_loss": -26.102502822875977, "global_step": 333371, "epoch": 4016} {"train_loss": -26.102142333984375, "global_step": 333372, "epoch": 4016} {"train_loss": -25.931432723999023, "global_step": 333373, "epoch": 4016} {"train_loss": -26.1746883392334, "global_step": 333374, "epoch": 4016} {"train_loss": -25.900043487548828, "global_step": 333375, "epoch": 4016} {"train_loss": -25.87041664123535, "global_step": 333376, "epoch": 4016} {"train_loss": -25.96011734008789, "global_step": 333377, "epoch": 4016} {"train_loss": -26.331724166870117, "global_step": 333378, "epoch": 4016} {"train_loss": -25.992420196533203, "global_step": 333379, "epoch": 4016} {"train_loss": -26.170806884765625, "global_step": 333380, "epoch": 4016} {"train_loss": -25.825092315673828, "global_step": 333381, "epoch": 4016} {"train_loss": -26.451587677001953, "global_step": 333382, "epoch": 4016} {"train_loss": -25.932748794555664, "global_step": 333383, "epoch": 4016} {"train_loss": -26.031864166259766, "global_step": 333384, "epoch": 4016} {"train_loss": -26.164798736572266, "global_step": 333385, "epoch": 4016} {"train_loss": -26.050464630126953, "global_step": 333386, "epoch": 4016} {"train_loss": -26.098310470581055, "global_step": 333387, "epoch": 4016} {"train_loss": -25.996902465820312, "global_step": 333388, "epoch": 4016} {"train_loss": -26.063135147094727, "global_step": 333389, "epoch": 4016} {"train_loss": -25.723480224609375, "global_step": 333390, "epoch": 4016} {"train_loss": -25.73501968383789, "global_step": 333391, "epoch": 4016} {"train_loss": -25.55244255065918, "global_step": 333392, "epoch": 4016} {"train_loss": -26.297637939453125, "global_step": 333393, "epoch": 4016} {"train_loss": -26.246173858642578, "global_step": 333394, "epoch": 4016} {"train_loss": -25.97833251953125, "global_step": 333395, "epoch": 4016} {"train_loss": -25.77621841430664, "global_step": 333396, "epoch": 4016} {"train_loss": -26.144424438476562, "global_step": 333397, "epoch": 4016} {"train_loss": -25.96528434753418, "global_step": 333398, "epoch": 4016} {"train_loss": -25.64047622680664, "global_step": 333399, "epoch": 4016} {"train_loss": -25.8951358795166, "global_step": 333400, "epoch": 4016} {"train_loss": -25.487516403198242, "global_step": 333401, "epoch": 4016} {"train_loss": -26.459577560424805, "global_step": 333402, "epoch": 4016} {"train_loss": -26.059772491455078, "global_step": 333403, "epoch": 4016} {"train_loss": -25.78412437438965, "global_step": 333404, "epoch": 4016} {"train_loss": -25.900409698486328, "global_step": 333405, "epoch": 4016} {"train_loss": -25.98053550720215, "global_step": 333406, "epoch": 4016} {"train_loss": -25.90009117126465, "global_step": 333407, "epoch": 4016} {"train_loss": -26.2738037109375, "global_step": 333408, "epoch": 4016} {"train_loss": -25.48178482055664, "global_step": 333409, "epoch": 4016} {"train_loss": -25.749245149543487, "global_step": 333410, "epoch": 4016, "val_loss": 6870211.0} {"train_loss": -25.518613815307617, "global_step": 333411, "epoch": 4017} {"train_loss": -25.430692672729492, "global_step": 333412, "epoch": 4017} {"train_loss": -25.33684539794922, "global_step": 333413, "epoch": 4017} {"train_loss": -25.131376266479492, "global_step": 333414, "epoch": 4017} {"train_loss": -25.23493003845215, "global_step": 333415, "epoch": 4017} {"train_loss": -25.136795043945312, "global_step": 333416, "epoch": 4017} {"train_loss": -25.183792114257812, "global_step": 333417, "epoch": 4017} {"train_loss": -25.775592803955078, "global_step": 333418, "epoch": 4017} {"train_loss": -25.6457462310791, "global_step": 333419, "epoch": 4017} {"train_loss": -25.073095321655273, "global_step": 333420, "epoch": 4017} {"train_loss": -24.728870391845703, "global_step": 333421, "epoch": 4017} {"train_loss": -25.47264862060547, "global_step": 333422, "epoch": 4017} {"train_loss": -25.604673385620117, "global_step": 333423, "epoch": 4017} {"train_loss": -25.70452308654785, "global_step": 333424, "epoch": 4017} {"train_loss": -25.747037887573242, "global_step": 333425, "epoch": 4017} {"train_loss": -25.661245346069336, "global_step": 333426, "epoch": 4017} {"train_loss": -25.75221824645996, "global_step": 333427, "epoch": 4017} {"train_loss": -25.585302352905273, "global_step": 333428, "epoch": 4017} {"train_loss": -25.56601333618164, "global_step": 333429, "epoch": 4017} {"train_loss": -25.843021392822266, "global_step": 333430, "epoch": 4017} {"train_loss": -25.802539825439453, "global_step": 333431, "epoch": 4017} {"train_loss": -25.893396377563477, "global_step": 333432, "epoch": 4017} {"train_loss": -25.58879280090332, "global_step": 333433, "epoch": 4017} {"train_loss": -25.629602432250977, "global_step": 333434, "epoch": 4017} {"train_loss": -25.830963134765625, "global_step": 333435, "epoch": 4017} {"train_loss": -25.76032829284668, "global_step": 333436, "epoch": 4017} {"train_loss": -25.89838981628418, "global_step": 333437, "epoch": 4017} {"train_loss": -26.259979248046875, "global_step": 333438, "epoch": 4017} {"train_loss": -25.830677032470703, "global_step": 333439, "epoch": 4017} {"train_loss": -25.89041519165039, "global_step": 333440, "epoch": 4017} {"train_loss": -25.786176681518555, "global_step": 333441, "epoch": 4017} {"train_loss": -25.904870986938477, "global_step": 333442, "epoch": 4017} {"train_loss": -25.897932052612305, "global_step": 333443, "epoch": 4017} {"train_loss": -26.1082763671875, "global_step": 333444, "epoch": 4017} {"train_loss": -25.85906982421875, "global_step": 333445, "epoch": 4017} {"train_loss": -26.0739803314209, "global_step": 333446, "epoch": 4017} {"train_loss": -26.027633666992188, "global_step": 333447, "epoch": 4017} {"train_loss": -26.121374130249023, "global_step": 333448, "epoch": 4017} {"train_loss": -26.108945846557617, "global_step": 333449, "epoch": 4017} {"train_loss": -25.88791275024414, "global_step": 333450, "epoch": 4017} {"train_loss": -26.238204956054688, "global_step": 333451, "epoch": 4017} {"train_loss": -25.79364585876465, "global_step": 333452, "epoch": 4017} {"train_loss": -26.284963607788086, "global_step": 333453, "epoch": 4017} {"train_loss": -26.225061416625977, "global_step": 333454, "epoch": 4017} {"train_loss": -26.135847091674805, "global_step": 333455, "epoch": 4017} {"train_loss": -26.217336654663086, "global_step": 333456, "epoch": 4017} {"train_loss": -25.8560733795166, "global_step": 333457, "epoch": 4017} {"train_loss": -26.2229061126709, "global_step": 333458, "epoch": 4017} {"train_loss": -26.145475387573242, "global_step": 333459, "epoch": 4017} {"train_loss": -26.18474769592285, "global_step": 333460, "epoch": 4017} {"train_loss": -25.852277755737305, "global_step": 333461, "epoch": 4017} {"train_loss": -26.316980361938477, "global_step": 333462, "epoch": 4017} {"train_loss": -26.183734893798828, "global_step": 333463, "epoch": 4017} {"train_loss": -26.109785079956055, "global_step": 333464, "epoch": 4017} {"train_loss": -25.941761016845703, "global_step": 333465, "epoch": 4017} {"train_loss": -26.284460067749023, "global_step": 333466, "epoch": 4017} {"train_loss": -26.21649742126465, "global_step": 333467, "epoch": 4017} {"train_loss": -26.102685928344727, "global_step": 333468, "epoch": 4017} {"train_loss": -25.945907592773438, "global_step": 333469, "epoch": 4017} {"train_loss": -25.77496910095215, "global_step": 333470, "epoch": 4017} {"train_loss": -25.981372833251953, "global_step": 333471, "epoch": 4017} {"train_loss": -26.01303482055664, "global_step": 333472, "epoch": 4017} {"train_loss": -26.06954002380371, "global_step": 333473, "epoch": 4017} {"train_loss": -26.378192901611328, "global_step": 333474, "epoch": 4017} {"train_loss": -26.071836471557617, "global_step": 333475, "epoch": 4017} {"train_loss": -26.222883224487305, "global_step": 333476, "epoch": 4017} {"train_loss": -25.830808639526367, "global_step": 333477, "epoch": 4017} {"train_loss": -26.118432998657227, "global_step": 333478, "epoch": 4017} {"train_loss": -25.796070098876953, "global_step": 333479, "epoch": 4017} {"train_loss": -25.60662841796875, "global_step": 333480, "epoch": 4017} {"train_loss": -25.823999404907227, "global_step": 333481, "epoch": 4017} {"train_loss": -25.93243980407715, "global_step": 333482, "epoch": 4017} {"train_loss": -25.7545108795166, "global_step": 333483, "epoch": 4017} {"train_loss": -26.332006454467773, "global_step": 333484, "epoch": 4017} {"train_loss": -25.73914909362793, "global_step": 333485, "epoch": 4017} {"train_loss": -25.96221351623535, "global_step": 333486, "epoch": 4017} {"train_loss": -26.367895126342773, "global_step": 333487, "epoch": 4017} {"train_loss": -26.35013198852539, "global_step": 333488, "epoch": 4017} {"train_loss": -26.114572525024414, "global_step": 333489, "epoch": 4017} {"train_loss": -25.861005783081055, "global_step": 333490, "epoch": 4017} {"train_loss": -26.023340225219727, "global_step": 333491, "epoch": 4017} {"train_loss": -26.1014404296875, "global_step": 333492, "epoch": 4017} {"train_loss": -25.89550512382783, "global_step": 333493, "epoch": 4017, "val_loss": 6906441.5} {"train_loss": -26.194019317626953, "global_step": 333494, "epoch": 4018} {"train_loss": -25.73590087890625, "global_step": 333495, "epoch": 4018} {"train_loss": -25.8061466217041, "global_step": 333496, "epoch": 4018} {"train_loss": -25.849496841430664, "global_step": 333497, "epoch": 4018} {"train_loss": -25.947406768798828, "global_step": 333498, "epoch": 4018} {"train_loss": -25.9532413482666, "global_step": 333499, "epoch": 4018} {"train_loss": -26.009057998657227, "global_step": 333500, "epoch": 4018} {"train_loss": -25.91725730895996, "global_step": 333501, "epoch": 4018} {"train_loss": -25.569656372070312, "global_step": 333502, "epoch": 4018} {"train_loss": -25.846670150756836, "global_step": 333503, "epoch": 4018} {"train_loss": -26.079269409179688, "global_step": 333504, "epoch": 4018} {"train_loss": -25.82305335998535, "global_step": 333505, "epoch": 4018} {"train_loss": -25.506887435913086, "global_step": 333506, "epoch": 4018} {"train_loss": -26.037744522094727, "global_step": 333507, "epoch": 4018} {"train_loss": -25.86475944519043, "global_step": 333508, "epoch": 4018} {"train_loss": -25.9112491607666, "global_step": 333509, "epoch": 4018} {"train_loss": -25.935033798217773, "global_step": 333510, "epoch": 4018} {"train_loss": -26.196569442749023, "global_step": 333511, "epoch": 4018} {"train_loss": -25.870107650756836, "global_step": 333512, "epoch": 4018} {"train_loss": -25.847082138061523, "global_step": 333513, "epoch": 4018} {"train_loss": -25.413623809814453, "global_step": 333514, "epoch": 4018} {"train_loss": -26.161848068237305, "global_step": 333515, "epoch": 4018} {"train_loss": -26.00082778930664, "global_step": 333516, "epoch": 4018} {"train_loss": -25.687406539916992, "global_step": 333517, "epoch": 4018} {"train_loss": -25.85040283203125, "global_step": 333518, "epoch": 4018} {"train_loss": -25.868383407592773, "global_step": 333519, "epoch": 4018} {"train_loss": -26.169906616210938, "global_step": 333520, "epoch": 4018} {"train_loss": -26.045703887939453, "global_step": 333521, "epoch": 4018} {"train_loss": -26.096221923828125, "global_step": 333522, "epoch": 4018} {"train_loss": -25.985944747924805, "global_step": 333523, "epoch": 4018} {"train_loss": -26.129175186157227, "global_step": 333524, "epoch": 4018} {"train_loss": -25.767475128173828, "global_step": 333525, "epoch": 4018} {"train_loss": -26.17268180847168, "global_step": 333526, "epoch": 4018} {"train_loss": -26.40504264831543, "global_step": 333527, "epoch": 4018} {"train_loss": -26.003934860229492, "global_step": 333528, "epoch": 4018} {"train_loss": -26.1202335357666, "global_step": 333529, "epoch": 4018} {"train_loss": -26.271697998046875, "global_step": 333530, "epoch": 4018} {"train_loss": -26.223236083984375, "global_step": 333531, "epoch": 4018} {"train_loss": -26.130712509155273, "global_step": 333532, "epoch": 4018} {"train_loss": -25.901092529296875, "global_step": 333533, "epoch": 4018} {"train_loss": -26.0416316986084, "global_step": 333534, "epoch": 4018} {"train_loss": -26.21864891052246, "global_step": 333535, "epoch": 4018} {"train_loss": -26.101795196533203, "global_step": 333536, "epoch": 4018} {"train_loss": -25.898252487182617, "global_step": 333537, "epoch": 4018} {"train_loss": -25.828882217407227, "global_step": 333538, "epoch": 4018} {"train_loss": -26.15797996520996, "global_step": 333539, "epoch": 4018} {"train_loss": -25.925785064697266, "global_step": 333540, "epoch": 4018} {"train_loss": -25.983753204345703, "global_step": 333541, "epoch": 4018} {"train_loss": -26.235549926757812, "global_step": 333542, "epoch": 4018} {"train_loss": -25.895715713500977, "global_step": 333543, "epoch": 4018} {"train_loss": -26.231653213500977, "global_step": 333544, "epoch": 4018} {"train_loss": -26.19753074645996, "global_step": 333545, "epoch": 4018} {"train_loss": -25.9174747467041, "global_step": 333546, "epoch": 4018} {"train_loss": -26.164356231689453, "global_step": 333547, "epoch": 4018} {"train_loss": -26.166296005249023, "global_step": 333548, "epoch": 4018} {"train_loss": -26.3614444732666, "global_step": 333549, "epoch": 4018} {"train_loss": -26.02374839782715, "global_step": 333550, "epoch": 4018} {"train_loss": -25.91242027282715, "global_step": 333551, "epoch": 4018} {"train_loss": -26.067331314086914, "global_step": 333552, "epoch": 4018} {"train_loss": -26.04374122619629, "global_step": 333553, "epoch": 4018} {"train_loss": -25.9411563873291, "global_step": 333554, "epoch": 4018} {"train_loss": -25.97471046447754, "global_step": 333555, "epoch": 4018} {"train_loss": -25.771482467651367, "global_step": 333556, "epoch": 4018} {"train_loss": -25.748676300048828, "global_step": 333557, "epoch": 4018} {"train_loss": -26.058441162109375, "global_step": 333558, "epoch": 4018} {"train_loss": -26.052900314331055, "global_step": 333559, "epoch": 4018} {"train_loss": -25.88702392578125, "global_step": 333560, "epoch": 4018} {"train_loss": -26.16791343688965, "global_step": 333561, "epoch": 4018} {"train_loss": -25.836088180541992, "global_step": 333562, "epoch": 4018} {"train_loss": -25.179027557373047, "global_step": 333563, "epoch": 4018} {"train_loss": -25.85236930847168, "global_step": 333564, "epoch": 4018} {"train_loss": -25.814533233642578, "global_step": 333565, "epoch": 4018} {"train_loss": -25.75153923034668, "global_step": 333566, "epoch": 4018} {"train_loss": -25.75704002380371, "global_step": 333567, "epoch": 4018} {"train_loss": -26.036285400390625, "global_step": 333568, "epoch": 4018} {"train_loss": -26.135351181030273, "global_step": 333569, "epoch": 4018} {"train_loss": -25.993146896362305, "global_step": 333570, "epoch": 4018} {"train_loss": -25.969602584838867, "global_step": 333571, "epoch": 4018} {"train_loss": -26.150135040283203, "global_step": 333572, "epoch": 4018} {"train_loss": -26.247211456298828, "global_step": 333573, "epoch": 4018} {"train_loss": -26.26007080078125, "global_step": 333574, "epoch": 4018} {"train_loss": -26.083480834960938, "global_step": 333575, "epoch": 4018} {"train_loss": -25.976809007575714, "global_step": 333576, "epoch": 4018, "val_loss": 6871705.0} {"train_loss": -23.658954620361328, "global_step": 333577, "epoch": 4019} {"train_loss": -24.79132652282715, "global_step": 333578, "epoch": 4019} {"train_loss": -25.288633346557617, "global_step": 333579, "epoch": 4019} {"train_loss": -24.172292709350586, "global_step": 333580, "epoch": 4019} {"train_loss": -24.987686157226562, "global_step": 333581, "epoch": 4019} {"train_loss": -25.30588150024414, "global_step": 333582, "epoch": 4019} {"train_loss": -24.8745174407959, "global_step": 333583, "epoch": 4019} {"train_loss": -24.9763240814209, "global_step": 333584, "epoch": 4019} {"train_loss": -24.949003219604492, "global_step": 333585, "epoch": 4019} {"train_loss": -25.33379364013672, "global_step": 333586, "epoch": 4019} {"train_loss": -25.8100528717041, "global_step": 333587, "epoch": 4019} {"train_loss": -25.414392471313477, "global_step": 333588, "epoch": 4019} {"train_loss": -25.54911231994629, "global_step": 333589, "epoch": 4019} {"train_loss": -25.576480865478516, "global_step": 333590, "epoch": 4019} {"train_loss": -25.072553634643555, "global_step": 333591, "epoch": 4019} {"train_loss": -25.73369789123535, "global_step": 333592, "epoch": 4019} {"train_loss": -25.5970516204834, "global_step": 333593, "epoch": 4019} {"train_loss": -25.87189292907715, "global_step": 333594, "epoch": 4019} {"train_loss": -25.885944366455078, "global_step": 333595, "epoch": 4019} {"train_loss": -25.86822509765625, "global_step": 333596, "epoch": 4019} {"train_loss": -25.532644271850586, "global_step": 333597, "epoch": 4019} {"train_loss": -25.851179122924805, "global_step": 333598, "epoch": 4019} {"train_loss": -26.028564453125, "global_step": 333599, "epoch": 4019} {"train_loss": -25.44903564453125, "global_step": 333600, "epoch": 4019} {"train_loss": -25.305011749267578, "global_step": 333601, "epoch": 4019} {"train_loss": -25.646259307861328, "global_step": 333602, "epoch": 4019} {"train_loss": -25.381900787353516, "global_step": 333603, "epoch": 4019} {"train_loss": -25.976648330688477, "global_step": 333604, "epoch": 4019} {"train_loss": -25.452253341674805, "global_step": 333605, "epoch": 4019} {"train_loss": -25.60146141052246, "global_step": 333606, "epoch": 4019} {"train_loss": -25.852705001831055, "global_step": 333607, "epoch": 4019} {"train_loss": -25.791894912719727, "global_step": 333608, "epoch": 4019} {"train_loss": -26.060565948486328, "global_step": 333609, "epoch": 4019} {"train_loss": -25.9141788482666, "global_step": 333610, "epoch": 4019} {"train_loss": -25.826995849609375, "global_step": 333611, "epoch": 4019} {"train_loss": -25.660776138305664, "global_step": 333612, "epoch": 4019} {"train_loss": -25.5495548248291, "global_step": 333613, "epoch": 4019} {"train_loss": -25.251441955566406, "global_step": 333614, "epoch": 4019} {"train_loss": -25.459922790527344, "global_step": 333615, "epoch": 4019} {"train_loss": -26.132665634155273, "global_step": 333616, "epoch": 4019} {"train_loss": -25.6650390625, "global_step": 333617, "epoch": 4019} {"train_loss": -25.903610229492188, "global_step": 333618, "epoch": 4019} {"train_loss": -25.809879302978516, "global_step": 333619, "epoch": 4019} {"train_loss": -25.70843505859375, "global_step": 333620, "epoch": 4019} {"train_loss": -25.887441635131836, "global_step": 333621, "epoch": 4019} {"train_loss": -25.852466583251953, "global_step": 333622, "epoch": 4019} {"train_loss": -25.860227584838867, "global_step": 333623, "epoch": 4019} {"train_loss": -25.572416305541992, "global_step": 333624, "epoch": 4019} {"train_loss": -26.019800186157227, "global_step": 333625, "epoch": 4019} {"train_loss": -25.82911491394043, "global_step": 333626, "epoch": 4019} {"train_loss": -25.783634185791016, "global_step": 333627, "epoch": 4019} {"train_loss": -25.85951042175293, "global_step": 333628, "epoch": 4019} {"train_loss": -25.76083755493164, "global_step": 333629, "epoch": 4019} {"train_loss": -25.993066787719727, "global_step": 333630, "epoch": 4019} {"train_loss": -26.19550895690918, "global_step": 333631, "epoch": 4019} {"train_loss": -25.980005264282227, "global_step": 333632, "epoch": 4019} {"train_loss": -25.761571884155273, "global_step": 333633, "epoch": 4019} {"train_loss": -25.916528701782227, "global_step": 333634, "epoch": 4019} {"train_loss": -26.339475631713867, "global_step": 333635, "epoch": 4019} {"train_loss": -25.977630615234375, "global_step": 333636, "epoch": 4019} {"train_loss": -25.784378051757812, "global_step": 333637, "epoch": 4019} {"train_loss": -26.114322662353516, "global_step": 333638, "epoch": 4019} {"train_loss": -25.762548446655273, "global_step": 333639, "epoch": 4019} {"train_loss": -26.14130210876465, "global_step": 333640, "epoch": 4019} {"train_loss": -26.039602279663086, "global_step": 333641, "epoch": 4019} {"train_loss": -25.97283935546875, "global_step": 333642, "epoch": 4019} {"train_loss": -25.619653701782227, "global_step": 333643, "epoch": 4019} {"train_loss": -25.632266998291016, "global_step": 333644, "epoch": 4019} {"train_loss": -25.51644515991211, "global_step": 333645, "epoch": 4019} {"train_loss": -25.772130966186523, "global_step": 333646, "epoch": 4019} {"train_loss": -25.84663200378418, "global_step": 333647, "epoch": 4019} {"train_loss": -25.82259178161621, "global_step": 333648, "epoch": 4019} {"train_loss": -25.611923217773438, "global_step": 333649, "epoch": 4019} {"train_loss": -25.579687118530273, "global_step": 333650, "epoch": 4019} {"train_loss": -25.564077377319336, "global_step": 333651, "epoch": 4019} {"train_loss": -25.79443359375, "global_step": 333652, "epoch": 4019} {"train_loss": -26.031940460205078, "global_step": 333653, "epoch": 4019} {"train_loss": -26.216840744018555, "global_step": 333654, "epoch": 4019} {"train_loss": -25.49544334411621, "global_step": 333655, "epoch": 4019} {"train_loss": -25.8499755859375, "global_step": 333656, "epoch": 4019} {"train_loss": -25.94195556640625, "global_step": 333657, "epoch": 4019} {"train_loss": -26.361230850219727, "global_step": 333658, "epoch": 4019} {"train_loss": -25.671826557940747, "global_step": 333659, "epoch": 4019, "val_loss": 6830022.0} {"train_loss": -25.685516357421875, "global_step": 333660, "epoch": 4020} {"train_loss": -25.340906143188477, "global_step": 333661, "epoch": 4020} {"train_loss": -25.116857528686523, "global_step": 333662, "epoch": 4020} {"train_loss": -25.43081283569336, "global_step": 333663, "epoch": 4020} {"train_loss": -25.273561477661133, "global_step": 333664, "epoch": 4020} {"train_loss": -25.7664794921875, "global_step": 333665, "epoch": 4020} {"train_loss": -25.51527214050293, "global_step": 333666, "epoch": 4020} {"train_loss": -25.61579704284668, "global_step": 333667, "epoch": 4020} {"train_loss": -25.92926025390625, "global_step": 333668, "epoch": 4020} {"train_loss": -25.4770565032959, "global_step": 333669, "epoch": 4020} {"train_loss": -25.91644859313965, "global_step": 333670, "epoch": 4020} {"train_loss": -25.665430068969727, "global_step": 333671, "epoch": 4020} {"train_loss": -25.7443904876709, "global_step": 333672, "epoch": 4020} {"train_loss": -25.736989974975586, "global_step": 333673, "epoch": 4020} {"train_loss": -25.547931671142578, "global_step": 333674, "epoch": 4020} {"train_loss": -25.70468521118164, "global_step": 333675, "epoch": 4020} {"train_loss": -25.57880210876465, "global_step": 333676, "epoch": 4020} {"train_loss": -25.827146530151367, "global_step": 333677, "epoch": 4020} {"train_loss": -25.4654483795166, "global_step": 333678, "epoch": 4020} {"train_loss": -25.53622055053711, "global_step": 333679, "epoch": 4020} {"train_loss": -25.910537719726562, "global_step": 333680, "epoch": 4020} {"train_loss": -25.921295166015625, "global_step": 333681, "epoch": 4020} {"train_loss": -25.7413272857666, "global_step": 333682, "epoch": 4020} {"train_loss": -26.267431259155273, "global_step": 333683, "epoch": 4020} {"train_loss": -25.92013931274414, "global_step": 333684, "epoch": 4020} {"train_loss": -25.931562423706055, "global_step": 333685, "epoch": 4020} {"train_loss": -25.97373390197754, "global_step": 333686, "epoch": 4020} {"train_loss": -25.913318634033203, "global_step": 333687, "epoch": 4020} {"train_loss": -25.730560302734375, "global_step": 333688, "epoch": 4020} {"train_loss": -25.740964889526367, "global_step": 333689, "epoch": 4020} {"train_loss": -26.13465690612793, "global_step": 333690, "epoch": 4020} {"train_loss": -25.99491310119629, "global_step": 333691, "epoch": 4020} {"train_loss": -26.31560707092285, "global_step": 333692, "epoch": 4020} {"train_loss": -25.975982666015625, "global_step": 333693, "epoch": 4020} {"train_loss": -25.649005889892578, "global_step": 333694, "epoch": 4020} {"train_loss": -25.88455581665039, "global_step": 333695, "epoch": 4020} {"train_loss": -26.397043228149414, "global_step": 333696, "epoch": 4020} {"train_loss": -26.408130645751953, "global_step": 333697, "epoch": 4020} {"train_loss": -26.027097702026367, "global_step": 333698, "epoch": 4020} {"train_loss": -26.308246612548828, "global_step": 333699, "epoch": 4020} {"train_loss": -25.9677677154541, "global_step": 333700, "epoch": 4020} {"train_loss": -26.15705680847168, "global_step": 333701, "epoch": 4020} {"train_loss": -25.964038848876953, "global_step": 333702, "epoch": 4020} {"train_loss": -26.0892391204834, "global_step": 333703, "epoch": 4020} {"train_loss": -26.136520385742188, "global_step": 333704, "epoch": 4020} {"train_loss": -26.208417892456055, "global_step": 333705, "epoch": 4020} {"train_loss": -26.23025894165039, "global_step": 333706, "epoch": 4020} {"train_loss": -25.90970230102539, "global_step": 333707, "epoch": 4020} {"train_loss": -25.423152923583984, "global_step": 333708, "epoch": 4020} {"train_loss": -26.174970626831055, "global_step": 333709, "epoch": 4020} {"train_loss": -25.91157341003418, "global_step": 333710, "epoch": 4020} {"train_loss": -25.81416130065918, "global_step": 333711, "epoch": 4020} {"train_loss": -26.00908851623535, "global_step": 333712, "epoch": 4020} {"train_loss": -25.759733200073242, "global_step": 333713, "epoch": 4020} {"train_loss": -25.828893661499023, "global_step": 333714, "epoch": 4020} {"train_loss": -25.815998077392578, "global_step": 333715, "epoch": 4020} {"train_loss": -25.792810440063477, "global_step": 333716, "epoch": 4020} {"train_loss": -25.850645065307617, "global_step": 333717, "epoch": 4020} {"train_loss": -25.963775634765625, "global_step": 333718, "epoch": 4020} {"train_loss": -26.113218307495117, "global_step": 333719, "epoch": 4020} {"train_loss": -25.639184951782227, "global_step": 333720, "epoch": 4020} {"train_loss": -25.808408737182617, "global_step": 333721, "epoch": 4020} {"train_loss": -26.036624908447266, "global_step": 333722, "epoch": 4020} {"train_loss": -25.604537963867188, "global_step": 333723, "epoch": 4020} {"train_loss": -25.50528907775879, "global_step": 333724, "epoch": 4020} {"train_loss": -25.980981826782227, "global_step": 333725, "epoch": 4020} {"train_loss": -26.112518310546875, "global_step": 333726, "epoch": 4020} {"train_loss": -25.837921142578125, "global_step": 333727, "epoch": 4020} {"train_loss": -25.74951171875, "global_step": 333728, "epoch": 4020} {"train_loss": -25.7139892578125, "global_step": 333729, "epoch": 4020} {"train_loss": -25.707199096679688, "global_step": 333730, "epoch": 4020} {"train_loss": -25.99549674987793, "global_step": 333731, "epoch": 4020} {"train_loss": -25.94635581970215, "global_step": 333732, "epoch": 4020} {"train_loss": -26.331205368041992, "global_step": 333733, "epoch": 4020} {"train_loss": -25.714004516601562, "global_step": 333734, "epoch": 4020} {"train_loss": -25.915454864501953, "global_step": 333735, "epoch": 4020} {"train_loss": -26.395709991455078, "global_step": 333736, "epoch": 4020} {"train_loss": -26.08302116394043, "global_step": 333737, "epoch": 4020} {"train_loss": -25.990095138549805, "global_step": 333738, "epoch": 4020} {"train_loss": -26.047834396362305, "global_step": 333739, "epoch": 4020} {"train_loss": -25.646106719970703, "global_step": 333740, "epoch": 4020} {"train_loss": -26.011981964111328, "global_step": 333741, "epoch": 4020} {"train_loss": -25.85024856659303, "global_step": 333742, "epoch": 4020, "val_loss": 6746893.0} {"train_loss": -25.44498634338379, "global_step": 333743, "epoch": 4021} {"train_loss": -25.477453231811523, "global_step": 333744, "epoch": 4021} {"train_loss": -25.140920639038086, "global_step": 333745, "epoch": 4021} {"train_loss": -25.11305046081543, "global_step": 333746, "epoch": 4021} {"train_loss": -25.040281295776367, "global_step": 333747, "epoch": 4021} {"train_loss": -25.26929473876953, "global_step": 333748, "epoch": 4021} {"train_loss": -25.686279296875, "global_step": 333749, "epoch": 4021} {"train_loss": -25.778018951416016, "global_step": 333750, "epoch": 4021} {"train_loss": -25.930999755859375, "global_step": 333751, "epoch": 4021} {"train_loss": -25.78603172302246, "global_step": 333752, "epoch": 4021} {"train_loss": -26.186355590820312, "global_step": 333753, "epoch": 4021} {"train_loss": -25.937152862548828, "global_step": 333754, "epoch": 4021} {"train_loss": -25.890710830688477, "global_step": 333755, "epoch": 4021} {"train_loss": -25.405691146850586, "global_step": 333756, "epoch": 4021} {"train_loss": -25.714797973632812, "global_step": 333757, "epoch": 4021} {"train_loss": -25.78400993347168, "global_step": 333758, "epoch": 4021} {"train_loss": -25.7423038482666, "global_step": 333759, "epoch": 4021} {"train_loss": -25.672353744506836, "global_step": 333760, "epoch": 4021} {"train_loss": -25.61279296875, "global_step": 333761, "epoch": 4021} {"train_loss": -26.277557373046875, "global_step": 333762, "epoch": 4021} {"train_loss": -25.737476348876953, "global_step": 333763, "epoch": 4021} {"train_loss": -26.093875885009766, "global_step": 333764, "epoch": 4021} {"train_loss": -26.136005401611328, "global_step": 333765, "epoch": 4021} {"train_loss": -25.978656768798828, "global_step": 333766, "epoch": 4021} {"train_loss": -26.114364624023438, "global_step": 333767, "epoch": 4021} {"train_loss": -25.7905216217041, "global_step": 333768, "epoch": 4021} {"train_loss": -25.927417755126953, "global_step": 333769, "epoch": 4021} {"train_loss": -25.920562744140625, "global_step": 333770, "epoch": 4021} {"train_loss": -26.094345092773438, "global_step": 333771, "epoch": 4021} {"train_loss": -26.066823959350586, "global_step": 333772, "epoch": 4021} {"train_loss": -26.19318962097168, "global_step": 333773, "epoch": 4021} {"train_loss": -26.501541137695312, "global_step": 333774, "epoch": 4021} {"train_loss": -25.918537139892578, "global_step": 333775, "epoch": 4021} {"train_loss": -25.961917877197266, "global_step": 333776, "epoch": 4021} {"train_loss": -25.841999053955078, "global_step": 333777, "epoch": 4021} {"train_loss": -26.225086212158203, "global_step": 333778, "epoch": 4021} {"train_loss": -25.800012588500977, "global_step": 333779, "epoch": 4021} {"train_loss": -25.916168212890625, "global_step": 333780, "epoch": 4021} {"train_loss": -26.127302169799805, "global_step": 333781, "epoch": 4021} {"train_loss": -26.210622787475586, "global_step": 333782, "epoch": 4021} {"train_loss": -26.161029815673828, "global_step": 333783, "epoch": 4021} {"train_loss": -26.0714111328125, "global_step": 333784, "epoch": 4021} {"train_loss": -26.125106811523438, "global_step": 333785, "epoch": 4021} {"train_loss": -26.339324951171875, "global_step": 333786, "epoch": 4021} {"train_loss": -26.21351432800293, "global_step": 333787, "epoch": 4021} {"train_loss": -25.949609756469727, "global_step": 333788, "epoch": 4021} {"train_loss": -26.047361373901367, "global_step": 333789, "epoch": 4021} {"train_loss": -26.266576766967773, "global_step": 333790, "epoch": 4021} {"train_loss": -26.080305099487305, "global_step": 333791, "epoch": 4021} {"train_loss": -26.373823165893555, "global_step": 333792, "epoch": 4021} {"train_loss": -26.035566329956055, "global_step": 333793, "epoch": 4021} {"train_loss": -25.772680282592773, "global_step": 333794, "epoch": 4021} {"train_loss": -25.985092163085938, "global_step": 333795, "epoch": 4021} {"train_loss": -25.80743980407715, "global_step": 333796, "epoch": 4021} {"train_loss": -25.53388786315918, "global_step": 333797, "epoch": 4021} {"train_loss": -26.053592681884766, "global_step": 333798, "epoch": 4021} {"train_loss": -26.50714683532715, "global_step": 333799, "epoch": 4021} {"train_loss": -26.057653427124023, "global_step": 333800, "epoch": 4021} {"train_loss": -25.758886337280273, "global_step": 333801, "epoch": 4021} {"train_loss": -26.079614639282227, "global_step": 333802, "epoch": 4021} {"train_loss": -26.118179321289062, "global_step": 333803, "epoch": 4021} {"train_loss": -26.149709701538086, "global_step": 333804, "epoch": 4021} {"train_loss": -25.75501823425293, "global_step": 333805, "epoch": 4021} {"train_loss": -25.922409057617188, "global_step": 333806, "epoch": 4021} {"train_loss": -25.07571792602539, "global_step": 333807, "epoch": 4021} {"train_loss": -25.470996856689453, "global_step": 333808, "epoch": 4021} {"train_loss": -25.9268798828125, "global_step": 333809, "epoch": 4021} {"train_loss": -25.57097816467285, "global_step": 333810, "epoch": 4021} {"train_loss": -25.889463424682617, "global_step": 333811, "epoch": 4021} {"train_loss": -25.77392578125, "global_step": 333812, "epoch": 4021} {"train_loss": -25.601957321166992, "global_step": 333813, "epoch": 4021} {"train_loss": -25.6351261138916, "global_step": 333814, "epoch": 4021} {"train_loss": -26.003381729125977, "global_step": 333815, "epoch": 4021} {"train_loss": -26.12161636352539, "global_step": 333816, "epoch": 4021} {"train_loss": -25.7821044921875, "global_step": 333817, "epoch": 4021} {"train_loss": -25.986343383789062, "global_step": 333818, "epoch": 4021} {"train_loss": -25.871755599975586, "global_step": 333819, "epoch": 4021} {"train_loss": -25.96734046936035, "global_step": 333820, "epoch": 4021} {"train_loss": -25.83601951599121, "global_step": 333821, "epoch": 4021} {"train_loss": -25.931272506713867, "global_step": 333822, "epoch": 4021} {"train_loss": -25.900989532470703, "global_step": 333823, "epoch": 4021} {"train_loss": -26.013080596923828, "global_step": 333824, "epoch": 4021} {"train_loss": -25.89699437244829, "global_step": 333825, "epoch": 4021, "val_loss": 6846319.0} {"train_loss": -25.162601470947266, "global_step": 333826, "epoch": 4022} {"train_loss": -25.811941146850586, "global_step": 333827, "epoch": 4022} {"train_loss": -25.570789337158203, "global_step": 333828, "epoch": 4022} {"train_loss": -25.61256217956543, "global_step": 333829, "epoch": 4022} {"train_loss": -25.768020629882812, "global_step": 333830, "epoch": 4022} {"train_loss": -25.980960845947266, "global_step": 333831, "epoch": 4022} {"train_loss": -26.094762802124023, "global_step": 333832, "epoch": 4022} {"train_loss": -25.81199073791504, "global_step": 333833, "epoch": 4022} {"train_loss": -25.821929931640625, "global_step": 333834, "epoch": 4022} {"train_loss": -25.62200927734375, "global_step": 333835, "epoch": 4022} {"train_loss": -25.126983642578125, "global_step": 333836, "epoch": 4022} {"train_loss": -25.856897354125977, "global_step": 333837, "epoch": 4022} {"train_loss": -25.788619995117188, "global_step": 333838, "epoch": 4022} {"train_loss": -25.809858322143555, "global_step": 333839, "epoch": 4022} {"train_loss": -25.692626953125, "global_step": 333840, "epoch": 4022} {"train_loss": -26.041418075561523, "global_step": 333841, "epoch": 4022} {"train_loss": -25.8554744720459, "global_step": 333842, "epoch": 4022} {"train_loss": -26.15167236328125, "global_step": 333843, "epoch": 4022} {"train_loss": -26.173816680908203, "global_step": 333844, "epoch": 4022} {"train_loss": -25.83038902282715, "global_step": 333845, "epoch": 4022} {"train_loss": -25.930103302001953, "global_step": 333846, "epoch": 4022} {"train_loss": -25.907012939453125, "global_step": 333847, "epoch": 4022} {"train_loss": -25.523605346679688, "global_step": 333848, "epoch": 4022} {"train_loss": -25.95168113708496, "global_step": 333849, "epoch": 4022} {"train_loss": -26.102521896362305, "global_step": 333850, "epoch": 4022} {"train_loss": -26.218952178955078, "global_step": 333851, "epoch": 4022} {"train_loss": -26.040185928344727, "global_step": 333852, "epoch": 4022} {"train_loss": -26.0500545501709, "global_step": 333853, "epoch": 4022} {"train_loss": -25.811254501342773, "global_step": 333854, "epoch": 4022} {"train_loss": -25.98396110534668, "global_step": 333855, "epoch": 4022} {"train_loss": -25.967853546142578, "global_step": 333856, "epoch": 4022} {"train_loss": -26.20435905456543, "global_step": 333857, "epoch": 4022} {"train_loss": -25.705982208251953, "global_step": 333858, "epoch": 4022} {"train_loss": -25.62685203552246, "global_step": 333859, "epoch": 4022} {"train_loss": -25.438419342041016, "global_step": 333860, "epoch": 4022} {"train_loss": -25.74053955078125, "global_step": 333861, "epoch": 4022} {"train_loss": -26.326873779296875, "global_step": 333862, "epoch": 4022} {"train_loss": -25.7635440826416, "global_step": 333863, "epoch": 4022} {"train_loss": -25.975162506103516, "global_step": 333864, "epoch": 4022} {"train_loss": -26.166189193725586, "global_step": 333865, "epoch": 4022} {"train_loss": -25.459875106811523, "global_step": 333866, "epoch": 4022} {"train_loss": -25.998504638671875, "global_step": 333867, "epoch": 4022} {"train_loss": -25.84278678894043, "global_step": 333868, "epoch": 4022} {"train_loss": -26.038618087768555, "global_step": 333869, "epoch": 4022} {"train_loss": -25.981159210205078, "global_step": 333870, "epoch": 4022} {"train_loss": -25.969898223876953, "global_step": 333871, "epoch": 4022} {"train_loss": -26.276336669921875, "global_step": 333872, "epoch": 4022} {"train_loss": -25.955575942993164, "global_step": 333873, "epoch": 4022} {"train_loss": -25.774877548217773, "global_step": 333874, "epoch": 4022} {"train_loss": -25.83338737487793, "global_step": 333875, "epoch": 4022} {"train_loss": -25.53569793701172, "global_step": 333876, "epoch": 4022} {"train_loss": -25.761920928955078, "global_step": 333877, "epoch": 4022} {"train_loss": -25.79913330078125, "global_step": 333878, "epoch": 4022} {"train_loss": -25.967498779296875, "global_step": 333879, "epoch": 4022} {"train_loss": -26.231048583984375, "global_step": 333880, "epoch": 4022} {"train_loss": -25.9946231842041, "global_step": 333881, "epoch": 4022} {"train_loss": -25.940244674682617, "global_step": 333882, "epoch": 4022} {"train_loss": -25.75784683227539, "global_step": 333883, "epoch": 4022} {"train_loss": -26.338333129882812, "global_step": 333884, "epoch": 4022} {"train_loss": -26.394638061523438, "global_step": 333885, "epoch": 4022} {"train_loss": -25.838071823120117, "global_step": 333886, "epoch": 4022} {"train_loss": -25.846776962280273, "global_step": 333887, "epoch": 4022} {"train_loss": -25.9367618560791, "global_step": 333888, "epoch": 4022} {"train_loss": -26.106786727905273, "global_step": 333889, "epoch": 4022} {"train_loss": -25.64950942993164, "global_step": 333890, "epoch": 4022} {"train_loss": -26.082828521728516, "global_step": 333891, "epoch": 4022} {"train_loss": -26.158918380737305, "global_step": 333892, "epoch": 4022} {"train_loss": -26.037153244018555, "global_step": 333893, "epoch": 4022} {"train_loss": -26.1457576751709, "global_step": 333894, "epoch": 4022} {"train_loss": -25.819366455078125, "global_step": 333895, "epoch": 4022} {"train_loss": -26.566375732421875, "global_step": 333896, "epoch": 4022} {"train_loss": -26.093658447265625, "global_step": 333897, "epoch": 4022} {"train_loss": -25.909719467163086, "global_step": 333898, "epoch": 4022} {"train_loss": -26.00321388244629, "global_step": 333899, "epoch": 4022} {"train_loss": -26.1782283782959, "global_step": 333900, "epoch": 4022} {"train_loss": -26.0728816986084, "global_step": 333901, "epoch": 4022} {"train_loss": -25.9248104095459, "global_step": 333902, "epoch": 4022} {"train_loss": -25.468564987182617, "global_step": 333903, "epoch": 4022} {"train_loss": -25.796056747436523, "global_step": 333904, "epoch": 4022} {"train_loss": -25.729429244995117, "global_step": 333905, "epoch": 4022} {"train_loss": -26.089231491088867, "global_step": 333906, "epoch": 4022} {"train_loss": -25.9219913482666, "global_step": 333907, "epoch": 4022} {"train_loss": -25.903115306992127, "global_step": 333908, "epoch": 4022, "val_loss": 6778622.0} {"train_loss": -25.682727813720703, "global_step": 333909, "epoch": 4023} {"train_loss": -25.674100875854492, "global_step": 333910, "epoch": 4023} {"train_loss": -25.478713989257812, "global_step": 333911, "epoch": 4023} {"train_loss": -26.171274185180664, "global_step": 333912, "epoch": 4023} {"train_loss": -25.953399658203125, "global_step": 333913, "epoch": 4023} {"train_loss": -25.731287002563477, "global_step": 333914, "epoch": 4023} {"train_loss": -25.888071060180664, "global_step": 333915, "epoch": 4023} {"train_loss": -25.907705307006836, "global_step": 333916, "epoch": 4023} {"train_loss": -25.97756004333496, "global_step": 333917, "epoch": 4023} {"train_loss": -25.8893985748291, "global_step": 333918, "epoch": 4023} {"train_loss": -26.167621612548828, "global_step": 333919, "epoch": 4023} {"train_loss": -25.701574325561523, "global_step": 333920, "epoch": 4023} {"train_loss": -26.076078414916992, "global_step": 333921, "epoch": 4023} {"train_loss": -25.90869140625, "global_step": 333922, "epoch": 4023} {"train_loss": -26.128625869750977, "global_step": 333923, "epoch": 4023} {"train_loss": -25.873579025268555, "global_step": 333924, "epoch": 4023} {"train_loss": -26.132612228393555, "global_step": 333925, "epoch": 4023} {"train_loss": -25.937469482421875, "global_step": 333926, "epoch": 4023} {"train_loss": -26.202951431274414, "global_step": 333927, "epoch": 4023} {"train_loss": -25.7152099609375, "global_step": 333928, "epoch": 4023} {"train_loss": -26.165775299072266, "global_step": 333929, "epoch": 4023} {"train_loss": -26.249967575073242, "global_step": 333930, "epoch": 4023} {"train_loss": -25.817672729492188, "global_step": 333931, "epoch": 4023} {"train_loss": -25.81551170349121, "global_step": 333932, "epoch": 4023} {"train_loss": -26.178882598876953, "global_step": 333933, "epoch": 4023} {"train_loss": -25.942001342773438, "global_step": 333934, "epoch": 4023} {"train_loss": -26.121896743774414, "global_step": 333935, "epoch": 4023} {"train_loss": -25.975183486938477, "global_step": 333936, "epoch": 4023} {"train_loss": -25.85332679748535, "global_step": 333937, "epoch": 4023} {"train_loss": -25.71310806274414, "global_step": 333938, "epoch": 4023} {"train_loss": -26.12457275390625, "global_step": 333939, "epoch": 4023} {"train_loss": -26.15716552734375, "global_step": 333940, "epoch": 4023} {"train_loss": -25.9727840423584, "global_step": 333941, "epoch": 4023} {"train_loss": -26.1550235748291, "global_step": 333942, "epoch": 4023} {"train_loss": -26.52720069885254, "global_step": 333943, "epoch": 4023} {"train_loss": -26.07527732849121, "global_step": 333944, "epoch": 4023} {"train_loss": -26.49991226196289, "global_step": 333945, "epoch": 4023} {"train_loss": -26.185810089111328, "global_step": 333946, "epoch": 4023} {"train_loss": -26.31348991394043, "global_step": 333947, "epoch": 4023} {"train_loss": -26.245935440063477, "global_step": 333948, "epoch": 4023} {"train_loss": -26.52471351623535, "global_step": 333949, "epoch": 4023} {"train_loss": -25.848005294799805, "global_step": 333950, "epoch": 4023} {"train_loss": -26.193069458007812, "global_step": 333951, "epoch": 4023} {"train_loss": -26.246185302734375, "global_step": 333952, "epoch": 4023} {"train_loss": -26.151601791381836, "global_step": 333953, "epoch": 4023} {"train_loss": -26.189544677734375, "global_step": 333954, "epoch": 4023} {"train_loss": -26.0872859954834, "global_step": 333955, "epoch": 4023} {"train_loss": -26.05975914001465, "global_step": 333956, "epoch": 4023} {"train_loss": -26.336530685424805, "global_step": 333957, "epoch": 4023} {"train_loss": -25.772235870361328, "global_step": 333958, "epoch": 4023} {"train_loss": -25.915363311767578, "global_step": 333959, "epoch": 4023} {"train_loss": -25.981510162353516, "global_step": 333960, "epoch": 4023} {"train_loss": -26.260181427001953, "global_step": 333961, "epoch": 4023} {"train_loss": -26.23064613342285, "global_step": 333962, "epoch": 4023} {"train_loss": -26.28632164001465, "global_step": 333963, "epoch": 4023} {"train_loss": -25.874195098876953, "global_step": 333964, "epoch": 4023} {"train_loss": -26.6307373046875, "global_step": 333965, "epoch": 4023} {"train_loss": -26.006317138671875, "global_step": 333966, "epoch": 4023} {"train_loss": -26.400564193725586, "global_step": 333967, "epoch": 4023} {"train_loss": -26.279071807861328, "global_step": 333968, "epoch": 4023} {"train_loss": -25.8353328704834, "global_step": 333969, "epoch": 4023} {"train_loss": -26.122486114501953, "global_step": 333970, "epoch": 4023} {"train_loss": -25.6910400390625, "global_step": 333971, "epoch": 4023} {"train_loss": -26.055694580078125, "global_step": 333972, "epoch": 4023} {"train_loss": -25.921844482421875, "global_step": 333973, "epoch": 4023} {"train_loss": -26.340728759765625, "global_step": 333974, "epoch": 4023} {"train_loss": -25.817279815673828, "global_step": 333975, "epoch": 4023} {"train_loss": -25.824146270751953, "global_step": 333976, "epoch": 4023} {"train_loss": -25.704132080078125, "global_step": 333977, "epoch": 4023} {"train_loss": -25.8012752532959, "global_step": 333978, "epoch": 4023} {"train_loss": -25.726465225219727, "global_step": 333979, "epoch": 4023} {"train_loss": -26.010297775268555, "global_step": 333980, "epoch": 4023} {"train_loss": -25.589509963989258, "global_step": 333981, "epoch": 4023} {"train_loss": -25.96380615234375, "global_step": 333982, "epoch": 4023} {"train_loss": -26.028888702392578, "global_step": 333983, "epoch": 4023} {"train_loss": -25.7122745513916, "global_step": 333984, "epoch": 4023} {"train_loss": -25.901031494140625, "global_step": 333985, "epoch": 4023} {"train_loss": -25.589277267456055, "global_step": 333986, "epoch": 4023} {"train_loss": -25.66200065612793, "global_step": 333987, "epoch": 4023} {"train_loss": -26.029088973999023, "global_step": 333988, "epoch": 4023} {"train_loss": -25.70429039001465, "global_step": 333989, "epoch": 4023} {"train_loss": -25.460378646850586, "global_step": 333990, "epoch": 4023} {"train_loss": -25.99948271785874, "global_step": 333991, "epoch": 4023, "val_loss": 6785430.0} {"train_loss": -25.594533920288086, "global_step": 333992, "epoch": 4024} {"train_loss": -25.782201766967773, "global_step": 333993, "epoch": 4024} {"train_loss": -25.328304290771484, "global_step": 333994, "epoch": 4024} {"train_loss": -25.480955123901367, "global_step": 333995, "epoch": 4024} {"train_loss": -25.478729248046875, "global_step": 333996, "epoch": 4024} {"train_loss": -25.559284210205078, "global_step": 333997, "epoch": 4024} {"train_loss": -25.259567260742188, "global_step": 333998, "epoch": 4024} {"train_loss": -25.866682052612305, "global_step": 333999, "epoch": 4024} {"train_loss": -25.694995880126953, "global_step": 334000, "epoch": 4024} {"train_loss": -25.691328048706055, "global_step": 334001, "epoch": 4024} {"train_loss": -25.72979736328125, "global_step": 334002, "epoch": 4024} {"train_loss": -26.002058029174805, "global_step": 334003, "epoch": 4024} {"train_loss": -25.624975204467773, "global_step": 334004, "epoch": 4024} {"train_loss": -25.643238067626953, "global_step": 334005, "epoch": 4024} {"train_loss": -25.866413116455078, "global_step": 334006, "epoch": 4024} {"train_loss": -25.778125762939453, "global_step": 334007, "epoch": 4024} {"train_loss": -25.541669845581055, "global_step": 334008, "epoch": 4024} {"train_loss": -25.743228912353516, "global_step": 334009, "epoch": 4024} {"train_loss": -25.860157012939453, "global_step": 334010, "epoch": 4024} {"train_loss": -25.901052474975586, "global_step": 334011, "epoch": 4024} {"train_loss": -25.888751983642578, "global_step": 334012, "epoch": 4024} {"train_loss": -26.019071578979492, "global_step": 334013, "epoch": 4024} {"train_loss": -26.115148544311523, "global_step": 334014, "epoch": 4024} {"train_loss": -26.1107177734375, "global_step": 334015, "epoch": 4024} {"train_loss": -26.33026123046875, "global_step": 334016, "epoch": 4024} {"train_loss": -26.075719833374023, "global_step": 334017, "epoch": 4024} {"train_loss": -25.780298233032227, "global_step": 334018, "epoch": 4024} {"train_loss": -25.963275909423828, "global_step": 334019, "epoch": 4024} {"train_loss": -26.086856842041016, "global_step": 334020, "epoch": 4024} {"train_loss": -26.249221801757812, "global_step": 334021, "epoch": 4024} {"train_loss": -26.0427303314209, "global_step": 334022, "epoch": 4024} {"train_loss": -25.965911865234375, "global_step": 334023, "epoch": 4024} {"train_loss": -26.4554443359375, "global_step": 334024, "epoch": 4024} {"train_loss": -25.809045791625977, "global_step": 334025, "epoch": 4024} {"train_loss": -26.192617416381836, "global_step": 334026, "epoch": 4024} {"train_loss": -26.27141761779785, "global_step": 334027, "epoch": 4024} {"train_loss": -26.301233291625977, "global_step": 334028, "epoch": 4024} {"train_loss": -26.290063858032227, "global_step": 334029, "epoch": 4024} {"train_loss": -25.7479248046875, "global_step": 334030, "epoch": 4024} {"train_loss": -25.900470733642578, "global_step": 334031, "epoch": 4024} {"train_loss": -25.950305938720703, "global_step": 334032, "epoch": 4024} {"train_loss": -26.195556640625, "global_step": 334033, "epoch": 4024} {"train_loss": -26.218244552612305, "global_step": 334034, "epoch": 4024} {"train_loss": -26.0430850982666, "global_step": 334035, "epoch": 4024} {"train_loss": -25.809431076049805, "global_step": 334036, "epoch": 4024} {"train_loss": -25.91061782836914, "global_step": 334037, "epoch": 4024} {"train_loss": -26.04052734375, "global_step": 334038, "epoch": 4024} {"train_loss": -26.063867568969727, "global_step": 334039, "epoch": 4024} {"train_loss": -26.117584228515625, "global_step": 334040, "epoch": 4024} {"train_loss": -26.0599308013916, "global_step": 334041, "epoch": 4024} {"train_loss": -26.199832916259766, "global_step": 334042, "epoch": 4024} {"train_loss": -26.01715660095215, "global_step": 334043, "epoch": 4024} {"train_loss": -26.127302169799805, "global_step": 334044, "epoch": 4024} {"train_loss": -26.010181427001953, "global_step": 334045, "epoch": 4024} {"train_loss": -25.9436092376709, "global_step": 334046, "epoch": 4024} {"train_loss": -26.162872314453125, "global_step": 334047, "epoch": 4024} {"train_loss": -26.273054122924805, "global_step": 334048, "epoch": 4024} {"train_loss": -26.23236656188965, "global_step": 334049, "epoch": 4024} {"train_loss": -25.879175186157227, "global_step": 334050, "epoch": 4024} {"train_loss": -26.237884521484375, "global_step": 334051, "epoch": 4024} {"train_loss": -26.0606746673584, "global_step": 334052, "epoch": 4024} {"train_loss": -26.096445083618164, "global_step": 334053, "epoch": 4024} {"train_loss": -26.48787498474121, "global_step": 334054, "epoch": 4024} {"train_loss": -25.724781036376953, "global_step": 334055, "epoch": 4024} {"train_loss": -25.84453773498535, "global_step": 334056, "epoch": 4024} {"train_loss": -25.85721206665039, "global_step": 334057, "epoch": 4024} {"train_loss": -25.655981063842773, "global_step": 334058, "epoch": 4024} {"train_loss": -25.992477416992188, "global_step": 334059, "epoch": 4024} {"train_loss": -26.007511138916016, "global_step": 334060, "epoch": 4024} {"train_loss": -25.813398361206055, "global_step": 334061, "epoch": 4024} {"train_loss": -26.35523796081543, "global_step": 334062, "epoch": 4024} {"train_loss": -25.589618682861328, "global_step": 334063, "epoch": 4024} {"train_loss": -25.928821563720703, "global_step": 334064, "epoch": 4024} {"train_loss": -25.79317283630371, "global_step": 334065, "epoch": 4024} {"train_loss": -25.96502113342285, "global_step": 334066, "epoch": 4024} {"train_loss": -26.212270736694336, "global_step": 334067, "epoch": 4024} {"train_loss": -25.59554672241211, "global_step": 334068, "epoch": 4024} {"train_loss": -25.522144317626953, "global_step": 334069, "epoch": 4024} {"train_loss": -25.545093536376953, "global_step": 334070, "epoch": 4024} {"train_loss": -26.002490997314453, "global_step": 334071, "epoch": 4024} {"train_loss": -26.0427303314209, "global_step": 334072, "epoch": 4024} {"train_loss": -25.391616821289062, "global_step": 334073, "epoch": 4024} {"train_loss": -25.923840993858246, "global_step": 334074, "epoch": 4024, "val_loss": 6915364.0} {"train_loss": -24.045576095581055, "global_step": 334075, "epoch": 4025} {"train_loss": -24.542213439941406, "global_step": 334076, "epoch": 4025} {"train_loss": -25.51227378845215, "global_step": 334077, "epoch": 4025} {"train_loss": -24.640104293823242, "global_step": 334078, "epoch": 4025} {"train_loss": -25.076034545898438, "global_step": 334079, "epoch": 4025} {"train_loss": -25.34810447692871, "global_step": 334080, "epoch": 4025} {"train_loss": -25.2012939453125, "global_step": 334081, "epoch": 4025} {"train_loss": -25.35670280456543, "global_step": 334082, "epoch": 4025} {"train_loss": -25.543092727661133, "global_step": 334083, "epoch": 4025} {"train_loss": -25.794458389282227, "global_step": 334084, "epoch": 4025} {"train_loss": -25.24024772644043, "global_step": 334085, "epoch": 4025} {"train_loss": -25.466472625732422, "global_step": 334086, "epoch": 4025} {"train_loss": -25.3455867767334, "global_step": 334087, "epoch": 4025} {"train_loss": -25.441450119018555, "global_step": 334088, "epoch": 4025} {"train_loss": -25.7426815032959, "global_step": 334089, "epoch": 4025} {"train_loss": -25.468069076538086, "global_step": 334090, "epoch": 4025} {"train_loss": -25.337980270385742, "global_step": 334091, "epoch": 4025} {"train_loss": -25.403989791870117, "global_step": 334092, "epoch": 4025} {"train_loss": -25.4530086517334, "global_step": 334093, "epoch": 4025} {"train_loss": -25.82539939880371, "global_step": 334094, "epoch": 4025} {"train_loss": -25.705982208251953, "global_step": 334095, "epoch": 4025} {"train_loss": -25.71242332458496, "global_step": 334096, "epoch": 4025} {"train_loss": -25.97364616394043, "global_step": 334097, "epoch": 4025} {"train_loss": -25.797651290893555, "global_step": 334098, "epoch": 4025} {"train_loss": -25.850204467773438, "global_step": 334099, "epoch": 4025} {"train_loss": -25.688501358032227, "global_step": 334100, "epoch": 4025} {"train_loss": -26.154556274414062, "global_step": 334101, "epoch": 4025} {"train_loss": -25.649677276611328, "global_step": 334102, "epoch": 4025} {"train_loss": -25.367002487182617, "global_step": 334103, "epoch": 4025} {"train_loss": -25.581539154052734, "global_step": 334104, "epoch": 4025} {"train_loss": -25.803632736206055, "global_step": 334105, "epoch": 4025} {"train_loss": -25.361684799194336, "global_step": 334106, "epoch": 4025} {"train_loss": -25.835742950439453, "global_step": 334107, "epoch": 4025} {"train_loss": -25.39999771118164, "global_step": 334108, "epoch": 4025} {"train_loss": -26.293710708618164, "global_step": 334109, "epoch": 4025} {"train_loss": -25.91376304626465, "global_step": 334110, "epoch": 4025} {"train_loss": -25.9493350982666, "global_step": 334111, "epoch": 4025} {"train_loss": -25.9625244140625, "global_step": 334112, "epoch": 4025} {"train_loss": -26.15032386779785, "global_step": 334113, "epoch": 4025} {"train_loss": -26.18951988220215, "global_step": 334114, "epoch": 4025} {"train_loss": -26.431018829345703, "global_step": 334115, "epoch": 4025} {"train_loss": -25.996912002563477, "global_step": 334116, "epoch": 4025} {"train_loss": -26.074438095092773, "global_step": 334117, "epoch": 4025} {"train_loss": -26.182937622070312, "global_step": 334118, "epoch": 4025} {"train_loss": -26.13266372680664, "global_step": 334119, "epoch": 4025} {"train_loss": -26.001256942749023, "global_step": 334120, "epoch": 4025} {"train_loss": -26.117279052734375, "global_step": 334121, "epoch": 4025} {"train_loss": -26.20802116394043, "global_step": 334122, "epoch": 4025} {"train_loss": -26.228626251220703, "global_step": 334123, "epoch": 4025} {"train_loss": -25.921676635742188, "global_step": 334124, "epoch": 4025} {"train_loss": -26.412921905517578, "global_step": 334125, "epoch": 4025} {"train_loss": -26.276641845703125, "global_step": 334126, "epoch": 4025} {"train_loss": -26.301624298095703, "global_step": 334127, "epoch": 4025} {"train_loss": -26.04924964904785, "global_step": 334128, "epoch": 4025} {"train_loss": -26.032611846923828, "global_step": 334129, "epoch": 4025} {"train_loss": -25.935226440429688, "global_step": 334130, "epoch": 4025} {"train_loss": -25.99690055847168, "global_step": 334131, "epoch": 4025} {"train_loss": -26.107725143432617, "global_step": 334132, "epoch": 4025} {"train_loss": -26.0518741607666, "global_step": 334133, "epoch": 4025} {"train_loss": -26.13714599609375, "global_step": 334134, "epoch": 4025} {"train_loss": -25.919818878173828, "global_step": 334135, "epoch": 4025} {"train_loss": -25.9394474029541, "global_step": 334136, "epoch": 4025} {"train_loss": -25.901647567749023, "global_step": 334137, "epoch": 4025} {"train_loss": -26.09869956970215, "global_step": 334138, "epoch": 4025} {"train_loss": -26.128347396850586, "global_step": 334139, "epoch": 4025} {"train_loss": -25.873218536376953, "global_step": 334140, "epoch": 4025} {"train_loss": -25.925262451171875, "global_step": 334141, "epoch": 4025} {"train_loss": -25.731603622436523, "global_step": 334142, "epoch": 4025} {"train_loss": -26.076587677001953, "global_step": 334143, "epoch": 4025} {"train_loss": -25.583694458007812, "global_step": 334144, "epoch": 4025} {"train_loss": -25.925689697265625, "global_step": 334145, "epoch": 4025} {"train_loss": -25.70582389831543, "global_step": 334146, "epoch": 4025} {"train_loss": -25.922534942626953, "global_step": 334147, "epoch": 4025} {"train_loss": -26.18592643737793, "global_step": 334148, "epoch": 4025} {"train_loss": -26.227834701538086, "global_step": 334149, "epoch": 4025} {"train_loss": -25.990087509155273, "global_step": 334150, "epoch": 4025} {"train_loss": -26.047760009765625, "global_step": 334151, "epoch": 4025} {"train_loss": -26.128250122070312, "global_step": 334152, "epoch": 4025} {"train_loss": -26.357999801635742, "global_step": 334153, "epoch": 4025} {"train_loss": -25.8984375, "global_step": 334154, "epoch": 4025} {"train_loss": -26.17439079284668, "global_step": 334155, "epoch": 4025} {"train_loss": -26.120529174804688, "global_step": 334156, "epoch": 4025} {"train_loss": -25.814255335244788, "global_step": 334157, "epoch": 4025, "val_loss": 6791303.5} {"train_loss": -25.439985275268555, "global_step": 334158, "epoch": 4026} {"train_loss": -25.414348602294922, "global_step": 334159, "epoch": 4026} {"train_loss": -25.282072067260742, "global_step": 334160, "epoch": 4026} {"train_loss": -25.946741104125977, "global_step": 334161, "epoch": 4026} {"train_loss": -25.445335388183594, "global_step": 334162, "epoch": 4026} {"train_loss": -25.521108627319336, "global_step": 334163, "epoch": 4026} {"train_loss": -25.680402755737305, "global_step": 334164, "epoch": 4026} {"train_loss": -24.7479305267334, "global_step": 334165, "epoch": 4026} {"train_loss": -25.628402709960938, "global_step": 334166, "epoch": 4026} {"train_loss": -25.05853271484375, "global_step": 334167, "epoch": 4026} {"train_loss": -25.317768096923828, "global_step": 334168, "epoch": 4026} {"train_loss": -25.375308990478516, "global_step": 334169, "epoch": 4026} {"train_loss": -26.232221603393555, "global_step": 334170, "epoch": 4026} {"train_loss": -25.5645751953125, "global_step": 334171, "epoch": 4026} {"train_loss": -25.802366256713867, "global_step": 334172, "epoch": 4026} {"train_loss": -25.821186065673828, "global_step": 334173, "epoch": 4026} {"train_loss": -25.447202682495117, "global_step": 334174, "epoch": 4026} {"train_loss": -25.51045036315918, "global_step": 334175, "epoch": 4026} {"train_loss": -25.735937118530273, "global_step": 334176, "epoch": 4026} {"train_loss": -25.53617286682129, "global_step": 334177, "epoch": 4026} {"train_loss": -25.822973251342773, "global_step": 334178, "epoch": 4026} {"train_loss": -26.1224308013916, "global_step": 334179, "epoch": 4026} {"train_loss": -26.003223419189453, "global_step": 334180, "epoch": 4026} {"train_loss": -25.6706485748291, "global_step": 334181, "epoch": 4026} {"train_loss": -26.082502365112305, "global_step": 334182, "epoch": 4026} {"train_loss": -26.04900550842285, "global_step": 334183, "epoch": 4026} {"train_loss": -26.1180419921875, "global_step": 334184, "epoch": 4026} {"train_loss": -25.84173011779785, "global_step": 334185, "epoch": 4026} {"train_loss": -25.83916664123535, "global_step": 334186, "epoch": 4026} {"train_loss": -25.801136016845703, "global_step": 334187, "epoch": 4026} {"train_loss": -25.975696563720703, "global_step": 334188, "epoch": 4026} {"train_loss": -26.014429092407227, "global_step": 334189, "epoch": 4026} {"train_loss": -26.164525985717773, "global_step": 334190, "epoch": 4026} {"train_loss": -26.274213790893555, "global_step": 334191, "epoch": 4026} {"train_loss": -25.869949340820312, "global_step": 334192, "epoch": 4026} {"train_loss": -25.948841094970703, "global_step": 334193, "epoch": 4026} {"train_loss": -26.075885772705078, "global_step": 334194, "epoch": 4026} {"train_loss": -26.17848014831543, "global_step": 334195, "epoch": 4026} {"train_loss": -26.05377197265625, "global_step": 334196, "epoch": 4026} {"train_loss": -26.2858943939209, "global_step": 334197, "epoch": 4026} {"train_loss": -26.161090850830078, "global_step": 334198, "epoch": 4026} {"train_loss": -26.145063400268555, "global_step": 334199, "epoch": 4026} {"train_loss": -26.04556655883789, "global_step": 334200, "epoch": 4026} {"train_loss": -26.16936683654785, "global_step": 334201, "epoch": 4026} {"train_loss": -25.885589599609375, "global_step": 334202, "epoch": 4026} {"train_loss": -26.257822036743164, "global_step": 334203, "epoch": 4026} {"train_loss": -26.337568283081055, "global_step": 334204, "epoch": 4026} {"train_loss": -26.24566078186035, "global_step": 334205, "epoch": 4026} {"train_loss": -25.811691284179688, "global_step": 334206, "epoch": 4026} {"train_loss": -26.04375648498535, "global_step": 334207, "epoch": 4026} {"train_loss": -26.39479637145996, "global_step": 334208, "epoch": 4026} {"train_loss": -25.913562774658203, "global_step": 334209, "epoch": 4026} {"train_loss": -25.828893661499023, "global_step": 334210, "epoch": 4026} {"train_loss": -26.522809982299805, "global_step": 334211, "epoch": 4026} {"train_loss": -25.72802734375, "global_step": 334212, "epoch": 4026} {"train_loss": -25.96755027770996, "global_step": 334213, "epoch": 4026} {"train_loss": -26.1380558013916, "global_step": 334214, "epoch": 4026} {"train_loss": -25.94593620300293, "global_step": 334215, "epoch": 4026} {"train_loss": -26.480222702026367, "global_step": 334216, "epoch": 4026} {"train_loss": -26.27300453186035, "global_step": 334217, "epoch": 4026} {"train_loss": -26.032608032226562, "global_step": 334218, "epoch": 4026} {"train_loss": -26.064977645874023, "global_step": 334219, "epoch": 4026} {"train_loss": -25.818557739257812, "global_step": 334220, "epoch": 4026} {"train_loss": -25.983068466186523, "global_step": 334221, "epoch": 4026} {"train_loss": -26.17034339904785, "global_step": 334222, "epoch": 4026} {"train_loss": -26.33491325378418, "global_step": 334223, "epoch": 4026} {"train_loss": -25.964731216430664, "global_step": 334224, "epoch": 4026} {"train_loss": -26.180667877197266, "global_step": 334225, "epoch": 4026} {"train_loss": -25.9780216217041, "global_step": 334226, "epoch": 4026} {"train_loss": -26.139328002929688, "global_step": 334227, "epoch": 4026} {"train_loss": -26.2080020904541, "global_step": 334228, "epoch": 4026} {"train_loss": -26.368927001953125, "global_step": 334229, "epoch": 4026} {"train_loss": -26.37078857421875, "global_step": 334230, "epoch": 4026} {"train_loss": -26.418493270874023, "global_step": 334231, "epoch": 4026} {"train_loss": -25.9610595703125, "global_step": 334232, "epoch": 4026} {"train_loss": -25.97699546813965, "global_step": 334233, "epoch": 4026} {"train_loss": -26.10273551940918, "global_step": 334234, "epoch": 4026} {"train_loss": -26.159162521362305, "global_step": 334235, "epoch": 4026} {"train_loss": -26.282093048095703, "global_step": 334236, "epoch": 4026} {"train_loss": -25.84284019470215, "global_step": 334237, "epoch": 4026} {"train_loss": -25.618213653564453, "global_step": 334238, "epoch": 4026} {"train_loss": -25.565725326538086, "global_step": 334239, "epoch": 4026} {"train_loss": -25.915967803403557, "global_step": 334240, "epoch": 4026, "val_loss": 6741861.0} {"train_loss": -23.044889450073242, "global_step": 334241, "epoch": 4027} {"train_loss": -23.612911224365234, "global_step": 334242, "epoch": 4027} {"train_loss": -25.033140182495117, "global_step": 334243, "epoch": 4027} {"train_loss": -23.297929763793945, "global_step": 334244, "epoch": 4027} {"train_loss": -23.872373580932617, "global_step": 334245, "epoch": 4027} {"train_loss": -24.69061279296875, "global_step": 334246, "epoch": 4027} {"train_loss": -24.43337631225586, "global_step": 334247, "epoch": 4027} {"train_loss": -24.86614418029785, "global_step": 334248, "epoch": 4027} {"train_loss": -24.956802368164062, "global_step": 334249, "epoch": 4027} {"train_loss": -24.9115047454834, "global_step": 334250, "epoch": 4027} {"train_loss": -24.96405601501465, "global_step": 334251, "epoch": 4027} {"train_loss": -25.138927459716797, "global_step": 334252, "epoch": 4027} {"train_loss": -25.22553062438965, "global_step": 334253, "epoch": 4027} {"train_loss": -25.449979782104492, "global_step": 334254, "epoch": 4027} {"train_loss": -25.09498405456543, "global_step": 334255, "epoch": 4027} {"train_loss": -25.240283966064453, "global_step": 334256, "epoch": 4027} {"train_loss": -24.966594696044922, "global_step": 334257, "epoch": 4027} {"train_loss": -25.10491371154785, "global_step": 334258, "epoch": 4027} {"train_loss": -25.12377166748047, "global_step": 334259, "epoch": 4027} {"train_loss": -25.291147232055664, "global_step": 334260, "epoch": 4027} {"train_loss": -25.28682518005371, "global_step": 334261, "epoch": 4027} {"train_loss": -25.229801177978516, "global_step": 334262, "epoch": 4027} {"train_loss": -25.23064613342285, "global_step": 334263, "epoch": 4027} {"train_loss": -25.35125732421875, "global_step": 334264, "epoch": 4027} {"train_loss": -25.710020065307617, "global_step": 334265, "epoch": 4027} {"train_loss": -25.386520385742188, "global_step": 334266, "epoch": 4027} {"train_loss": -25.59276008605957, "global_step": 334267, "epoch": 4027} {"train_loss": -26.101917266845703, "global_step": 334268, "epoch": 4027} {"train_loss": -25.671728134155273, "global_step": 334269, "epoch": 4027} {"train_loss": -25.689130783081055, "global_step": 334270, "epoch": 4027} {"train_loss": -25.405614852905273, "global_step": 334271, "epoch": 4027} {"train_loss": -25.6015682220459, "global_step": 334272, "epoch": 4027} {"train_loss": -25.666717529296875, "global_step": 334273, "epoch": 4027} {"train_loss": -25.774246215820312, "global_step": 334274, "epoch": 4027} {"train_loss": -25.966989517211914, "global_step": 334275, "epoch": 4027} {"train_loss": -25.658233642578125, "global_step": 334276, "epoch": 4027} {"train_loss": -25.774799346923828, "global_step": 334277, "epoch": 4027} {"train_loss": -25.931228637695312, "global_step": 334278, "epoch": 4027} {"train_loss": -25.93739891052246, "global_step": 334279, "epoch": 4027} {"train_loss": -26.02157974243164, "global_step": 334280, "epoch": 4027} {"train_loss": -25.9935359954834, "global_step": 334281, "epoch": 4027} {"train_loss": -26.335493087768555, "global_step": 334282, "epoch": 4027} {"train_loss": -25.915815353393555, "global_step": 334283, "epoch": 4027} {"train_loss": -26.143014907836914, "global_step": 334284, "epoch": 4027} {"train_loss": -25.688180923461914, "global_step": 334285, "epoch": 4027} {"train_loss": -25.938751220703125, "global_step": 334286, "epoch": 4027} {"train_loss": -25.751184463500977, "global_step": 334287, "epoch": 4027} {"train_loss": -26.165912628173828, "global_step": 334288, "epoch": 4027} {"train_loss": -25.97907066345215, "global_step": 334289, "epoch": 4027} {"train_loss": -25.965036392211914, "global_step": 334290, "epoch": 4027} {"train_loss": -26.006580352783203, "global_step": 334291, "epoch": 4027} {"train_loss": -26.0654296875, "global_step": 334292, "epoch": 4027} {"train_loss": -26.0833740234375, "global_step": 334293, "epoch": 4027} {"train_loss": -25.910749435424805, "global_step": 334294, "epoch": 4027} {"train_loss": -26.254114151000977, "global_step": 334295, "epoch": 4027} {"train_loss": -25.842529296875, "global_step": 334296, "epoch": 4027} {"train_loss": -25.8059139251709, "global_step": 334297, "epoch": 4027} {"train_loss": -26.166547775268555, "global_step": 334298, "epoch": 4027} {"train_loss": -26.099628448486328, "global_step": 334299, "epoch": 4027} {"train_loss": -25.74458122253418, "global_step": 334300, "epoch": 4027} {"train_loss": -26.038419723510742, "global_step": 334301, "epoch": 4027} {"train_loss": -25.89324951171875, "global_step": 334302, "epoch": 4027} {"train_loss": -26.466161727905273, "global_step": 334303, "epoch": 4027} {"train_loss": -25.691198348999023, "global_step": 334304, "epoch": 4027} {"train_loss": -26.008316040039062, "global_step": 334305, "epoch": 4027} {"train_loss": -26.175811767578125, "global_step": 334306, "epoch": 4027} {"train_loss": -25.958099365234375, "global_step": 334307, "epoch": 4027} {"train_loss": -25.822362899780273, "global_step": 334308, "epoch": 4027} {"train_loss": -26.029682159423828, "global_step": 334309, "epoch": 4027} {"train_loss": -26.038984298706055, "global_step": 334310, "epoch": 4027} {"train_loss": -26.164148330688477, "global_step": 334311, "epoch": 4027} {"train_loss": -25.89923667907715, "global_step": 334312, "epoch": 4027} {"train_loss": -26.0228271484375, "global_step": 334313, "epoch": 4027} {"train_loss": -26.11641502380371, "global_step": 334314, "epoch": 4027} {"train_loss": -25.94697380065918, "global_step": 334315, "epoch": 4027} {"train_loss": -25.643808364868164, "global_step": 334316, "epoch": 4027} {"train_loss": -25.99579429626465, "global_step": 334317, "epoch": 4027} {"train_loss": -26.123340606689453, "global_step": 334318, "epoch": 4027} {"train_loss": -26.184223175048828, "global_step": 334319, "epoch": 4027} {"train_loss": -26.227737426757812, "global_step": 334320, "epoch": 4027} {"train_loss": -26.157773971557617, "global_step": 334321, "epoch": 4027} {"train_loss": -26.056995391845703, "global_step": 334322, "epoch": 4027} {"train_loss": -25.620133917015718, "global_step": 334323, "epoch": 4027, "val_loss": 6736109.0} {"train_loss": -24.706195831298828, "global_step": 334324, "epoch": 4028} {"train_loss": -25.593250274658203, "global_step": 334325, "epoch": 4028} {"train_loss": -25.678680419921875, "global_step": 334326, "epoch": 4028} {"train_loss": -25.491605758666992, "global_step": 334327, "epoch": 4028} {"train_loss": -26.109588623046875, "global_step": 334328, "epoch": 4028} {"train_loss": -25.317415237426758, "global_step": 334329, "epoch": 4028} {"train_loss": -25.857141494750977, "global_step": 334330, "epoch": 4028} {"train_loss": -25.391143798828125, "global_step": 334331, "epoch": 4028} {"train_loss": -25.685043334960938, "global_step": 334332, "epoch": 4028} {"train_loss": -25.886655807495117, "global_step": 334333, "epoch": 4028} {"train_loss": -25.92458152770996, "global_step": 334334, "epoch": 4028} {"train_loss": -25.5434513092041, "global_step": 334335, "epoch": 4028} {"train_loss": -25.649932861328125, "global_step": 334336, "epoch": 4028} {"train_loss": -25.960668563842773, "global_step": 334337, "epoch": 4028} {"train_loss": -26.0244083404541, "global_step": 334338, "epoch": 4028} {"train_loss": -26.00446128845215, "global_step": 334339, "epoch": 4028} {"train_loss": -25.733304977416992, "global_step": 334340, "epoch": 4028} {"train_loss": -25.76641845703125, "global_step": 334341, "epoch": 4028} {"train_loss": -25.9549560546875, "global_step": 334342, "epoch": 4028} {"train_loss": -25.77559471130371, "global_step": 334343, "epoch": 4028} {"train_loss": -25.951791763305664, "global_step": 334344, "epoch": 4028} {"train_loss": -25.950000762939453, "global_step": 334345, "epoch": 4028} {"train_loss": -25.93145751953125, "global_step": 334346, "epoch": 4028} {"train_loss": -25.774337768554688, "global_step": 334347, "epoch": 4028} {"train_loss": -25.836200714111328, "global_step": 334348, "epoch": 4028} {"train_loss": -25.93232536315918, "global_step": 334349, "epoch": 4028} {"train_loss": -25.96209144592285, "global_step": 334350, "epoch": 4028} {"train_loss": -25.703327178955078, "global_step": 334351, "epoch": 4028} {"train_loss": -26.0213565826416, "global_step": 334352, "epoch": 4028} {"train_loss": -26.02853775024414, "global_step": 334353, "epoch": 4028} {"train_loss": -25.96746826171875, "global_step": 334354, "epoch": 4028} {"train_loss": -26.109928131103516, "global_step": 334355, "epoch": 4028} {"train_loss": -26.365921020507812, "global_step": 334356, "epoch": 4028} {"train_loss": -26.235504150390625, "global_step": 334357, "epoch": 4028} {"train_loss": -26.10349464416504, "global_step": 334358, "epoch": 4028} {"train_loss": -26.26007080078125, "global_step": 334359, "epoch": 4028} {"train_loss": -25.94491958618164, "global_step": 334360, "epoch": 4028} {"train_loss": -26.15470314025879, "global_step": 334361, "epoch": 4028} {"train_loss": -25.977102279663086, "global_step": 334362, "epoch": 4028} {"train_loss": -26.086889266967773, "global_step": 334363, "epoch": 4028} {"train_loss": -26.256118774414062, "global_step": 334364, "epoch": 4028} {"train_loss": -26.064640045166016, "global_step": 334365, "epoch": 4028} {"train_loss": -26.28790283203125, "global_step": 334366, "epoch": 4028} {"train_loss": -26.410131454467773, "global_step": 334367, "epoch": 4028} {"train_loss": -26.158004760742188, "global_step": 334368, "epoch": 4028} {"train_loss": -25.964385986328125, "global_step": 334369, "epoch": 4028} {"train_loss": -26.086627960205078, "global_step": 334370, "epoch": 4028} {"train_loss": -26.144926071166992, "global_step": 334371, "epoch": 4028} {"train_loss": -26.23016357421875, "global_step": 334372, "epoch": 4028} {"train_loss": -26.516477584838867, "global_step": 334373, "epoch": 4028} {"train_loss": -26.139450073242188, "global_step": 334374, "epoch": 4028} {"train_loss": -26.179046630859375, "global_step": 334375, "epoch": 4028} {"train_loss": -26.26932144165039, "global_step": 334376, "epoch": 4028} {"train_loss": -25.98328971862793, "global_step": 334377, "epoch": 4028} {"train_loss": -26.0941104888916, "global_step": 334378, "epoch": 4028} {"train_loss": -25.20241928100586, "global_step": 334379, "epoch": 4028} {"train_loss": -25.128372192382812, "global_step": 334380, "epoch": 4028} {"train_loss": -25.916244506835938, "global_step": 334381, "epoch": 4028} {"train_loss": -25.75896644592285, "global_step": 334382, "epoch": 4028} {"train_loss": -25.584095001220703, "global_step": 334383, "epoch": 4028} {"train_loss": -25.458538055419922, "global_step": 334384, "epoch": 4028} {"train_loss": -25.750717163085938, "global_step": 334385, "epoch": 4028} {"train_loss": -25.745981216430664, "global_step": 334386, "epoch": 4028} {"train_loss": -25.297805786132812, "global_step": 334387, "epoch": 4028} {"train_loss": -25.496719360351562, "global_step": 334388, "epoch": 4028} {"train_loss": -25.464181900024414, "global_step": 334389, "epoch": 4028} {"train_loss": -25.510128021240234, "global_step": 334390, "epoch": 4028} {"train_loss": -25.66645622253418, "global_step": 334391, "epoch": 4028} {"train_loss": -26.326160430908203, "global_step": 334392, "epoch": 4028} {"train_loss": -25.82478904724121, "global_step": 334393, "epoch": 4028} {"train_loss": -26.19471549987793, "global_step": 334394, "epoch": 4028} {"train_loss": -25.60365867614746, "global_step": 334395, "epoch": 4028} {"train_loss": -25.73261833190918, "global_step": 334396, "epoch": 4028} {"train_loss": -25.660009384155273, "global_step": 334397, "epoch": 4028} {"train_loss": -25.869384765625, "global_step": 334398, "epoch": 4028} {"train_loss": -25.87733268737793, "global_step": 334399, "epoch": 4028} {"train_loss": -25.671918869018555, "global_step": 334400, "epoch": 4028} {"train_loss": -26.138830184936523, "global_step": 334401, "epoch": 4028} {"train_loss": -26.05402183532715, "global_step": 334402, "epoch": 4028} {"train_loss": -26.16586685180664, "global_step": 334403, "epoch": 4028} {"train_loss": -26.18509864807129, "global_step": 334404, "epoch": 4028} {"train_loss": -25.9095516204834, "global_step": 334405, "epoch": 4028} {"train_loss": -25.894380362637072, "global_step": 334406, "epoch": 4028, "val_loss": 6762484.5} {"train_loss": -26.042463302612305, "global_step": 334407, "epoch": 4029} {"train_loss": -26.08322525024414, "global_step": 334408, "epoch": 4029} {"train_loss": -25.93939208984375, "global_step": 334409, "epoch": 4029} {"train_loss": -26.05521583557129, "global_step": 334410, "epoch": 4029} {"train_loss": -25.62726402282715, "global_step": 334411, "epoch": 4029} {"train_loss": -25.964141845703125, "global_step": 334412, "epoch": 4029} {"train_loss": -25.672300338745117, "global_step": 334413, "epoch": 4029} {"train_loss": -25.882965087890625, "global_step": 334414, "epoch": 4029} {"train_loss": -26.075580596923828, "global_step": 334415, "epoch": 4029} {"train_loss": -26.212039947509766, "global_step": 334416, "epoch": 4029} {"train_loss": -26.13007926940918, "global_step": 334417, "epoch": 4029} {"train_loss": -25.97250747680664, "global_step": 334418, "epoch": 4029} {"train_loss": -25.873291015625, "global_step": 334419, "epoch": 4029} {"train_loss": -26.00925636291504, "global_step": 334420, "epoch": 4029} {"train_loss": -26.62225341796875, "global_step": 334421, "epoch": 4029} {"train_loss": -25.767333984375, "global_step": 334422, "epoch": 4029} {"train_loss": -25.561752319335938, "global_step": 334423, "epoch": 4029} {"train_loss": -25.947370529174805, "global_step": 334424, "epoch": 4029} {"train_loss": -26.173959732055664, "global_step": 334425, "epoch": 4029} {"train_loss": -25.7440128326416, "global_step": 334426, "epoch": 4029} {"train_loss": -26.04239845275879, "global_step": 334427, "epoch": 4029} {"train_loss": -26.102890014648438, "global_step": 334428, "epoch": 4029} {"train_loss": -26.180021286010742, "global_step": 334429, "epoch": 4029} {"train_loss": -26.322235107421875, "global_step": 334430, "epoch": 4029} {"train_loss": -26.089508056640625, "global_step": 334431, "epoch": 4029} {"train_loss": -25.965513229370117, "global_step": 334432, "epoch": 4029} {"train_loss": -25.431339263916016, "global_step": 334433, "epoch": 4029} {"train_loss": -25.897058486938477, "global_step": 334434, "epoch": 4029} {"train_loss": -25.697172164916992, "global_step": 334435, "epoch": 4029} {"train_loss": -26.211109161376953, "global_step": 334436, "epoch": 4029} {"train_loss": -26.000965118408203, "global_step": 334437, "epoch": 4029} {"train_loss": -25.47820281982422, "global_step": 334438, "epoch": 4029} {"train_loss": -25.549142837524414, "global_step": 334439, "epoch": 4029} {"train_loss": -25.947118759155273, "global_step": 334440, "epoch": 4029} {"train_loss": -25.882404327392578, "global_step": 334441, "epoch": 4029} {"train_loss": -25.73896598815918, "global_step": 334442, "epoch": 4029} {"train_loss": -25.529144287109375, "global_step": 334443, "epoch": 4029} {"train_loss": -25.836395263671875, "global_step": 334444, "epoch": 4029} {"train_loss": -26.11688232421875, "global_step": 334445, "epoch": 4029} {"train_loss": -26.001073837280273, "global_step": 334446, "epoch": 4029} {"train_loss": -25.9155330657959, "global_step": 334447, "epoch": 4029} {"train_loss": -25.842365264892578, "global_step": 334448, "epoch": 4029} {"train_loss": -25.925321578979492, "global_step": 334449, "epoch": 4029} {"train_loss": -25.902450561523438, "global_step": 334450, "epoch": 4029} {"train_loss": -25.718063354492188, "global_step": 334451, "epoch": 4029} {"train_loss": -26.030969619750977, "global_step": 334452, "epoch": 4029} {"train_loss": -26.07673454284668, "global_step": 334453, "epoch": 4029} {"train_loss": -25.810531616210938, "global_step": 334454, "epoch": 4029} {"train_loss": -25.90872573852539, "global_step": 334455, "epoch": 4029} {"train_loss": -25.993810653686523, "global_step": 334456, "epoch": 4029} {"train_loss": -26.376012802124023, "global_step": 334457, "epoch": 4029} {"train_loss": -26.084640502929688, "global_step": 334458, "epoch": 4029} {"train_loss": -26.040876388549805, "global_step": 334459, "epoch": 4029} {"train_loss": -26.044361114501953, "global_step": 334460, "epoch": 4029} {"train_loss": -26.153888702392578, "global_step": 334461, "epoch": 4029} {"train_loss": -26.38427734375, "global_step": 334462, "epoch": 4029} {"train_loss": -26.155847549438477, "global_step": 334463, "epoch": 4029} {"train_loss": -26.013425827026367, "global_step": 334464, "epoch": 4029} {"train_loss": -26.0867862701416, "global_step": 334465, "epoch": 4029} {"train_loss": -26.215478897094727, "global_step": 334466, "epoch": 4029} {"train_loss": -26.151906967163086, "global_step": 334467, "epoch": 4029} {"train_loss": -26.03306007385254, "global_step": 334468, "epoch": 4029} {"train_loss": -26.289880752563477, "global_step": 334469, "epoch": 4029} {"train_loss": -25.810394287109375, "global_step": 334470, "epoch": 4029} {"train_loss": -26.083480834960938, "global_step": 334471, "epoch": 4029} {"train_loss": -25.548343658447266, "global_step": 334472, "epoch": 4029} {"train_loss": -26.3809814453125, "global_step": 334473, "epoch": 4029} {"train_loss": -26.277297973632812, "global_step": 334474, "epoch": 4029} {"train_loss": -26.620208740234375, "global_step": 334475, "epoch": 4029} {"train_loss": -26.2241153717041, "global_step": 334476, "epoch": 4029} {"train_loss": -25.73713493347168, "global_step": 334477, "epoch": 4029} {"train_loss": -25.66131591796875, "global_step": 334478, "epoch": 4029} {"train_loss": -25.892934799194336, "global_step": 334479, "epoch": 4029} {"train_loss": -26.13880729675293, "global_step": 334480, "epoch": 4029} {"train_loss": -25.88641357421875, "global_step": 334481, "epoch": 4029} {"train_loss": -25.83295249938965, "global_step": 334482, "epoch": 4029} {"train_loss": -26.254358291625977, "global_step": 334483, "epoch": 4029} {"train_loss": -25.689977645874023, "global_step": 334484, "epoch": 4029} {"train_loss": -26.15171241760254, "global_step": 334485, "epoch": 4029} {"train_loss": -25.759017944335938, "global_step": 334486, "epoch": 4029} {"train_loss": -26.115619659423828, "global_step": 334487, "epoch": 4029} {"train_loss": -25.751068115234375, "global_step": 334488, "epoch": 4029} {"train_loss": -25.966265161353423, "global_step": 334489, "epoch": 4029, "val_loss": 6783029.0} {"train_loss": -25.10980796813965, "global_step": 334490, "epoch": 4030} {"train_loss": -24.55939292907715, "global_step": 334491, "epoch": 4030} {"train_loss": -25.39818572998047, "global_step": 334492, "epoch": 4030} {"train_loss": -24.71707534790039, "global_step": 334493, "epoch": 4030} {"train_loss": -25.025407791137695, "global_step": 334494, "epoch": 4030} {"train_loss": -25.09250831604004, "global_step": 334495, "epoch": 4030} {"train_loss": -25.25861930847168, "global_step": 334496, "epoch": 4030} {"train_loss": -25.03859519958496, "global_step": 334497, "epoch": 4030} {"train_loss": -25.49615478515625, "global_step": 334498, "epoch": 4030} {"train_loss": -25.25747299194336, "global_step": 334499, "epoch": 4030} {"train_loss": -25.169248580932617, "global_step": 334500, "epoch": 4030} {"train_loss": -24.813291549682617, "global_step": 334501, "epoch": 4030} {"train_loss": -25.116931915283203, "global_step": 334502, "epoch": 4030} {"train_loss": -25.20704460144043, "global_step": 334503, "epoch": 4030} {"train_loss": -25.551416397094727, "global_step": 334504, "epoch": 4030} {"train_loss": -25.653356552124023, "global_step": 334505, "epoch": 4030} {"train_loss": -25.620849609375, "global_step": 334506, "epoch": 4030} {"train_loss": -26.010046005249023, "global_step": 334507, "epoch": 4030} {"train_loss": -25.526273727416992, "global_step": 334508, "epoch": 4030} {"train_loss": -25.595779418945312, "global_step": 334509, "epoch": 4030} {"train_loss": -25.59193229675293, "global_step": 334510, "epoch": 4030} {"train_loss": -25.787073135375977, "global_step": 334511, "epoch": 4030} {"train_loss": -25.699920654296875, "global_step": 334512, "epoch": 4030} {"train_loss": -25.70709800720215, "global_step": 334513, "epoch": 4030} {"train_loss": -25.60650634765625, "global_step": 334514, "epoch": 4030} {"train_loss": -25.492633819580078, "global_step": 334515, "epoch": 4030} {"train_loss": -26.240589141845703, "global_step": 334516, "epoch": 4030} {"train_loss": -26.022327423095703, "global_step": 334517, "epoch": 4030} {"train_loss": -26.120588302612305, "global_step": 334518, "epoch": 4030} {"train_loss": -25.567846298217773, "global_step": 334519, "epoch": 4030} {"train_loss": -25.910612106323242, "global_step": 334520, "epoch": 4030} {"train_loss": -25.851943969726562, "global_step": 334521, "epoch": 4030} {"train_loss": -26.12018394470215, "global_step": 334522, "epoch": 4030} {"train_loss": -25.94513511657715, "global_step": 334523, "epoch": 4030} {"train_loss": -25.9343204498291, "global_step": 334524, "epoch": 4030} {"train_loss": -26.251605987548828, "global_step": 334525, "epoch": 4030} {"train_loss": -26.156600952148438, "global_step": 334526, "epoch": 4030} {"train_loss": -26.274206161499023, "global_step": 334527, "epoch": 4030} {"train_loss": -26.216602325439453, "global_step": 334528, "epoch": 4030} {"train_loss": -26.0358829498291, "global_step": 334529, "epoch": 4030} {"train_loss": -26.391569137573242, "global_step": 334530, "epoch": 4030} {"train_loss": -25.916217803955078, "global_step": 334531, "epoch": 4030} {"train_loss": -25.905292510986328, "global_step": 334532, "epoch": 4030} {"train_loss": -25.769636154174805, "global_step": 334533, "epoch": 4030} {"train_loss": -26.306921005249023, "global_step": 334534, "epoch": 4030} {"train_loss": -25.988544464111328, "global_step": 334535, "epoch": 4030} {"train_loss": -26.24365234375, "global_step": 334536, "epoch": 4030} {"train_loss": -25.749698638916016, "global_step": 334537, "epoch": 4030} {"train_loss": -25.98818016052246, "global_step": 334538, "epoch": 4030} {"train_loss": -25.970077514648438, "global_step": 334539, "epoch": 4030} {"train_loss": -25.734878540039062, "global_step": 334540, "epoch": 4030} {"train_loss": -25.956634521484375, "global_step": 334541, "epoch": 4030} {"train_loss": -25.574573516845703, "global_step": 334542, "epoch": 4030} {"train_loss": -26.048370361328125, "global_step": 334543, "epoch": 4030} {"train_loss": -26.25044059753418, "global_step": 334544, "epoch": 4030} {"train_loss": -26.34197425842285, "global_step": 334545, "epoch": 4030} {"train_loss": -26.045175552368164, "global_step": 334546, "epoch": 4030} {"train_loss": -25.789709091186523, "global_step": 334547, "epoch": 4030} {"train_loss": -25.689167022705078, "global_step": 334548, "epoch": 4030} {"train_loss": -25.935550689697266, "global_step": 334549, "epoch": 4030} {"train_loss": -25.57048225402832, "global_step": 334550, "epoch": 4030} {"train_loss": -26.266462326049805, "global_step": 334551, "epoch": 4030} {"train_loss": -26.025415420532227, "global_step": 334552, "epoch": 4030} {"train_loss": -25.94123649597168, "global_step": 334553, "epoch": 4030} {"train_loss": -26.25678062438965, "global_step": 334554, "epoch": 4030} {"train_loss": -26.469552993774414, "global_step": 334555, "epoch": 4030} {"train_loss": -25.813573837280273, "global_step": 334556, "epoch": 4030} {"train_loss": -26.209081649780273, "global_step": 334557, "epoch": 4030} {"train_loss": -26.202001571655273, "global_step": 334558, "epoch": 4030} {"train_loss": -26.08497428894043, "global_step": 334559, "epoch": 4030} {"train_loss": -25.922719955444336, "global_step": 334560, "epoch": 4030} {"train_loss": -26.35504150390625, "global_step": 334561, "epoch": 4030} {"train_loss": -25.707977294921875, "global_step": 334562, "epoch": 4030} {"train_loss": -26.074909210205078, "global_step": 334563, "epoch": 4030} {"train_loss": -25.702411651611328, "global_step": 334564, "epoch": 4030} {"train_loss": -26.0826416015625, "global_step": 334565, "epoch": 4030} {"train_loss": -25.694549560546875, "global_step": 334566, "epoch": 4030} {"train_loss": -25.843900680541992, "global_step": 334567, "epoch": 4030} {"train_loss": -26.065942764282227, "global_step": 334568, "epoch": 4030} {"train_loss": -25.993993759155273, "global_step": 334569, "epoch": 4030} {"train_loss": -25.995283126831055, "global_step": 334570, "epoch": 4030} {"train_loss": -25.908599853515625, "global_step": 334571, "epoch": 4030} {"train_loss": -25.81419425412833, "global_step": 334572, "epoch": 4030, "val_loss": 6739960.0} {"train_loss": -22.607982635498047, "global_step": 334573, "epoch": 4031} {"train_loss": -22.170507431030273, "global_step": 334574, "epoch": 4031} {"train_loss": -24.319904327392578, "global_step": 334575, "epoch": 4031} {"train_loss": -24.594690322875977, "global_step": 334576, "epoch": 4031} {"train_loss": -24.154523849487305, "global_step": 334577, "epoch": 4031} {"train_loss": -24.97723388671875, "global_step": 334578, "epoch": 4031} {"train_loss": -24.56903076171875, "global_step": 334579, "epoch": 4031} {"train_loss": -24.224645614624023, "global_step": 334580, "epoch": 4031} {"train_loss": -24.922727584838867, "global_step": 334581, "epoch": 4031} {"train_loss": -25.2665958404541, "global_step": 334582, "epoch": 4031} {"train_loss": -25.027881622314453, "global_step": 334583, "epoch": 4031} {"train_loss": -25.04719352722168, "global_step": 334584, "epoch": 4031} {"train_loss": -24.938695907592773, "global_step": 334585, "epoch": 4031} {"train_loss": -25.448925018310547, "global_step": 334586, "epoch": 4031} {"train_loss": -25.076364517211914, "global_step": 334587, "epoch": 4031} {"train_loss": -25.018566131591797, "global_step": 334588, "epoch": 4031} {"train_loss": -25.08180809020996, "global_step": 334589, "epoch": 4031} {"train_loss": -25.090789794921875, "global_step": 334590, "epoch": 4031} {"train_loss": -25.02278709411621, "global_step": 334591, "epoch": 4031} {"train_loss": -25.743677139282227, "global_step": 334592, "epoch": 4031} {"train_loss": -25.40569496154785, "global_step": 334593, "epoch": 4031} {"train_loss": -25.20564842224121, "global_step": 334594, "epoch": 4031} {"train_loss": -25.31157112121582, "global_step": 334595, "epoch": 4031} {"train_loss": -25.490692138671875, "global_step": 334596, "epoch": 4031} {"train_loss": -25.308774948120117, "global_step": 334597, "epoch": 4031} {"train_loss": -25.746442794799805, "global_step": 334598, "epoch": 4031} {"train_loss": -25.343040466308594, "global_step": 334599, "epoch": 4031} {"train_loss": -25.536151885986328, "global_step": 334600, "epoch": 4031} {"train_loss": -25.518678665161133, "global_step": 334601, "epoch": 4031} {"train_loss": -25.55017852783203, "global_step": 334602, "epoch": 4031} {"train_loss": -25.366352081298828, "global_step": 334603, "epoch": 4031} {"train_loss": -25.804096221923828, "global_step": 334604, "epoch": 4031} {"train_loss": -25.34864616394043, "global_step": 334605, "epoch": 4031} {"train_loss": -25.64680290222168, "global_step": 334606, "epoch": 4031} {"train_loss": -25.632221221923828, "global_step": 334607, "epoch": 4031} {"train_loss": -25.906543731689453, "global_step": 334608, "epoch": 4031} {"train_loss": -25.799091339111328, "global_step": 334609, "epoch": 4031} {"train_loss": -25.772979736328125, "global_step": 334610, "epoch": 4031} {"train_loss": -25.9039249420166, "global_step": 334611, "epoch": 4031} {"train_loss": -26.033349990844727, "global_step": 334612, "epoch": 4031} {"train_loss": -25.756479263305664, "global_step": 334613, "epoch": 4031} {"train_loss": -26.045995712280273, "global_step": 334614, "epoch": 4031} {"train_loss": -25.72368812561035, "global_step": 334615, "epoch": 4031} {"train_loss": -25.956445693969727, "global_step": 334616, "epoch": 4031} {"train_loss": -25.998350143432617, "global_step": 334617, "epoch": 4031} {"train_loss": -26.391550064086914, "global_step": 334618, "epoch": 4031} {"train_loss": -25.861501693725586, "global_step": 334619, "epoch": 4031} {"train_loss": -25.987218856811523, "global_step": 334620, "epoch": 4031} {"train_loss": -25.827987670898438, "global_step": 334621, "epoch": 4031} {"train_loss": -26.037378311157227, "global_step": 334622, "epoch": 4031} {"train_loss": -25.990137100219727, "global_step": 334623, "epoch": 4031} {"train_loss": -26.108642578125, "global_step": 334624, "epoch": 4031} {"train_loss": -26.036239624023438, "global_step": 334625, "epoch": 4031} {"train_loss": -26.14470863342285, "global_step": 334626, "epoch": 4031} {"train_loss": -26.557165145874023, "global_step": 334627, "epoch": 4031} {"train_loss": -25.88160514831543, "global_step": 334628, "epoch": 4031} {"train_loss": -26.065723419189453, "global_step": 334629, "epoch": 4031} {"train_loss": -26.277374267578125, "global_step": 334630, "epoch": 4031} {"train_loss": -26.104480743408203, "global_step": 334631, "epoch": 4031} {"train_loss": -26.51386833190918, "global_step": 334632, "epoch": 4031} {"train_loss": -26.0307559967041, "global_step": 334633, "epoch": 4031} {"train_loss": -26.252302169799805, "global_step": 334634, "epoch": 4031} {"train_loss": -26.16519546508789, "global_step": 334635, "epoch": 4031} {"train_loss": -26.377918243408203, "global_step": 334636, "epoch": 4031} {"train_loss": -26.058637619018555, "global_step": 334637, "epoch": 4031} {"train_loss": -26.230854034423828, "global_step": 334638, "epoch": 4031} {"train_loss": -26.74590492248535, "global_step": 334639, "epoch": 4031} {"train_loss": -26.019428253173828, "global_step": 334640, "epoch": 4031} {"train_loss": -25.928104400634766, "global_step": 334641, "epoch": 4031} {"train_loss": -25.92148780822754, "global_step": 334642, "epoch": 4031} {"train_loss": -26.183490753173828, "global_step": 334643, "epoch": 4031} {"train_loss": -26.14068603515625, "global_step": 334644, "epoch": 4031} {"train_loss": -25.87946128845215, "global_step": 334645, "epoch": 4031} {"train_loss": -25.890005111694336, "global_step": 334646, "epoch": 4031} {"train_loss": -25.957199096679688, "global_step": 334647, "epoch": 4031} {"train_loss": -26.376203536987305, "global_step": 334648, "epoch": 4031} {"train_loss": -25.99989128112793, "global_step": 334649, "epoch": 4031} {"train_loss": -25.51909828186035, "global_step": 334650, "epoch": 4031} {"train_loss": -24.686498641967773, "global_step": 334651, "epoch": 4031} {"train_loss": -25.233036041259766, "global_step": 334652, "epoch": 4031} {"train_loss": -25.80860710144043, "global_step": 334653, "epoch": 4031} {"train_loss": -25.348798751831055, "global_step": 334654, "epoch": 4031} {"train_loss": -25.594780749585254, "global_step": 334655, "epoch": 4031, "val_loss": 6747677.5} {"train_loss": -21.760494232177734, "global_step": 334656, "epoch": 4032} {"train_loss": -25.120412826538086, "global_step": 334657, "epoch": 4032} {"train_loss": -22.80621910095215, "global_step": 334658, "epoch": 4032} {"train_loss": -24.83945655822754, "global_step": 334659, "epoch": 4032} {"train_loss": -24.171873092651367, "global_step": 334660, "epoch": 4032} {"train_loss": -24.5960636138916, "global_step": 334661, "epoch": 4032} {"train_loss": -24.78578758239746, "global_step": 334662, "epoch": 4032} {"train_loss": -24.429372787475586, "global_step": 334663, "epoch": 4032} {"train_loss": -25.34149932861328, "global_step": 334664, "epoch": 4032} {"train_loss": -24.964872360229492, "global_step": 334665, "epoch": 4032} {"train_loss": -25.023847579956055, "global_step": 334666, "epoch": 4032} {"train_loss": -24.357297897338867, "global_step": 334667, "epoch": 4032} {"train_loss": -24.877944946289062, "global_step": 334668, "epoch": 4032} {"train_loss": -25.087501525878906, "global_step": 334669, "epoch": 4032} {"train_loss": -25.24502944946289, "global_step": 334670, "epoch": 4032} {"train_loss": -25.499805450439453, "global_step": 334671, "epoch": 4032} {"train_loss": -25.165634155273438, "global_step": 334672, "epoch": 4032} {"train_loss": -25.252866744995117, "global_step": 334673, "epoch": 4032} {"train_loss": -25.26355743408203, "global_step": 334674, "epoch": 4032} {"train_loss": -24.907758712768555, "global_step": 334675, "epoch": 4032} {"train_loss": -25.417572021484375, "global_step": 334676, "epoch": 4032} {"train_loss": -25.390729904174805, "global_step": 334677, "epoch": 4032} {"train_loss": -25.600000381469727, "global_step": 334678, "epoch": 4032} {"train_loss": -25.376760482788086, "global_step": 334679, "epoch": 4032} {"train_loss": -25.50998878479004, "global_step": 334680, "epoch": 4032} {"train_loss": -25.369611740112305, "global_step": 334681, "epoch": 4032} {"train_loss": -25.391712188720703, "global_step": 334682, "epoch": 4032} {"train_loss": -25.70623779296875, "global_step": 334683, "epoch": 4032} {"train_loss": -25.38599395751953, "global_step": 334684, "epoch": 4032} {"train_loss": -25.313711166381836, "global_step": 334685, "epoch": 4032} {"train_loss": -25.586790084838867, "global_step": 334686, "epoch": 4032} {"train_loss": -25.77338218688965, "global_step": 334687, "epoch": 4032} {"train_loss": -25.579145431518555, "global_step": 334688, "epoch": 4032} {"train_loss": -25.7751407623291, "global_step": 334689, "epoch": 4032} {"train_loss": -25.591218948364258, "global_step": 334690, "epoch": 4032} {"train_loss": -25.75234031677246, "global_step": 334691, "epoch": 4032} {"train_loss": -25.9129695892334, "global_step": 334692, "epoch": 4032} {"train_loss": -25.421493530273438, "global_step": 334693, "epoch": 4032} {"train_loss": -25.644445419311523, "global_step": 334694, "epoch": 4032} {"train_loss": -25.671533584594727, "global_step": 334695, "epoch": 4032} {"train_loss": -26.02711296081543, "global_step": 334696, "epoch": 4032} {"train_loss": -25.5018253326416, "global_step": 334697, "epoch": 4032} {"train_loss": -26.20789909362793, "global_step": 334698, "epoch": 4032} {"train_loss": -26.096500396728516, "global_step": 334699, "epoch": 4032} {"train_loss": -25.68840980529785, "global_step": 334700, "epoch": 4032} {"train_loss": -26.2724609375, "global_step": 334701, "epoch": 4032} {"train_loss": -25.85175132751465, "global_step": 334702, "epoch": 4032} {"train_loss": -26.017684936523438, "global_step": 334703, "epoch": 4032} {"train_loss": -25.988698959350586, "global_step": 334704, "epoch": 4032} {"train_loss": -25.790668487548828, "global_step": 334705, "epoch": 4032} {"train_loss": -26.035675048828125, "global_step": 334706, "epoch": 4032} {"train_loss": -26.222158432006836, "global_step": 334707, "epoch": 4032} {"train_loss": -25.919416427612305, "global_step": 334708, "epoch": 4032} {"train_loss": -26.325458526611328, "global_step": 334709, "epoch": 4032} {"train_loss": -25.87409782409668, "global_step": 334710, "epoch": 4032} {"train_loss": -26.256261825561523, "global_step": 334711, "epoch": 4032} {"train_loss": -26.2293643951416, "global_step": 334712, "epoch": 4032} {"train_loss": -26.244709014892578, "global_step": 334713, "epoch": 4032} {"train_loss": -26.226795196533203, "global_step": 334714, "epoch": 4032} {"train_loss": -26.105527877807617, "global_step": 334715, "epoch": 4032} {"train_loss": -26.10088539123535, "global_step": 334716, "epoch": 4032} {"train_loss": -26.311887741088867, "global_step": 334717, "epoch": 4032} {"train_loss": -26.3073787689209, "global_step": 334718, "epoch": 4032} {"train_loss": -25.8560848236084, "global_step": 334719, "epoch": 4032} {"train_loss": -26.045841217041016, "global_step": 334720, "epoch": 4032} {"train_loss": -25.702823638916016, "global_step": 334721, "epoch": 4032} {"train_loss": -26.30146598815918, "global_step": 334722, "epoch": 4032} {"train_loss": -25.575149536132812, "global_step": 334723, "epoch": 4032} {"train_loss": -25.834508895874023, "global_step": 334724, "epoch": 4032} {"train_loss": -26.163549423217773, "global_step": 334725, "epoch": 4032} {"train_loss": -26.1420955657959, "global_step": 334726, "epoch": 4032} {"train_loss": -26.642019271850586, "global_step": 334727, "epoch": 4032} {"train_loss": -25.9807071685791, "global_step": 334728, "epoch": 4032} {"train_loss": -26.23328971862793, "global_step": 334729, "epoch": 4032} {"train_loss": -26.185749053955078, "global_step": 334730, "epoch": 4032} {"train_loss": -26.399738311767578, "global_step": 334731, "epoch": 4032} {"train_loss": -26.029224395751953, "global_step": 334732, "epoch": 4032} {"train_loss": -26.24720573425293, "global_step": 334733, "epoch": 4032} {"train_loss": -26.2027587890625, "global_step": 334734, "epoch": 4032} {"train_loss": -25.766647338867188, "global_step": 334735, "epoch": 4032} {"train_loss": -26.42667007446289, "global_step": 334736, "epoch": 4032} {"train_loss": -26.227140426635742, "global_step": 334737, "epoch": 4032} {"train_loss": -25.626189174422297, "global_step": 334738, "epoch": 4032, "val_loss": 6726518.0} {"train_loss": -25.35657501220703, "global_step": 334739, "epoch": 4033} {"train_loss": -25.6469669342041, "global_step": 334740, "epoch": 4033} {"train_loss": -25.94256591796875, "global_step": 334741, "epoch": 4033} {"train_loss": -25.288423538208008, "global_step": 334742, "epoch": 4033} {"train_loss": -25.323667526245117, "global_step": 334743, "epoch": 4033} {"train_loss": -25.941864013671875, "global_step": 334744, "epoch": 4033} {"train_loss": -25.938268661499023, "global_step": 334745, "epoch": 4033} {"train_loss": -25.766620635986328, "global_step": 334746, "epoch": 4033} {"train_loss": -25.7206974029541, "global_step": 334747, "epoch": 4033} {"train_loss": -25.688220977783203, "global_step": 334748, "epoch": 4033} {"train_loss": -25.814746856689453, "global_step": 334749, "epoch": 4033} {"train_loss": -25.479145050048828, "global_step": 334750, "epoch": 4033} {"train_loss": -26.000253677368164, "global_step": 334751, "epoch": 4033} {"train_loss": -25.59006118774414, "global_step": 334752, "epoch": 4033} {"train_loss": -25.625110626220703, "global_step": 334753, "epoch": 4033} {"train_loss": -25.956378936767578, "global_step": 334754, "epoch": 4033} {"train_loss": -25.92496681213379, "global_step": 334755, "epoch": 4033} {"train_loss": -25.76883888244629, "global_step": 334756, "epoch": 4033} {"train_loss": -25.832443237304688, "global_step": 334757, "epoch": 4033} {"train_loss": -26.114004135131836, "global_step": 334758, "epoch": 4033} {"train_loss": -25.574195861816406, "global_step": 334759, "epoch": 4033} {"train_loss": -25.883316040039062, "global_step": 334760, "epoch": 4033} {"train_loss": -25.80927848815918, "global_step": 334761, "epoch": 4033} {"train_loss": -26.02713394165039, "global_step": 334762, "epoch": 4033} {"train_loss": -25.945968627929688, "global_step": 334763, "epoch": 4033} {"train_loss": -26.16851806640625, "global_step": 334764, "epoch": 4033} {"train_loss": -26.1058292388916, "global_step": 334765, "epoch": 4033} {"train_loss": -26.120473861694336, "global_step": 334766, "epoch": 4033} {"train_loss": -26.365650177001953, "global_step": 334767, "epoch": 4033} {"train_loss": -26.38868522644043, "global_step": 334768, "epoch": 4033} {"train_loss": -26.08856201171875, "global_step": 334769, "epoch": 4033} {"train_loss": -25.8128604888916, "global_step": 334770, "epoch": 4033} {"train_loss": -26.257339477539062, "global_step": 334771, "epoch": 4033} {"train_loss": -25.719425201416016, "global_step": 334772, "epoch": 4033} {"train_loss": -25.787628173828125, "global_step": 334773, "epoch": 4033} {"train_loss": -26.24673843383789, "global_step": 334774, "epoch": 4033} {"train_loss": -26.08953285217285, "global_step": 334775, "epoch": 4033} {"train_loss": -25.936044692993164, "global_step": 334776, "epoch": 4033} {"train_loss": -26.508787155151367, "global_step": 334777, "epoch": 4033} {"train_loss": -25.956884384155273, "global_step": 334778, "epoch": 4033} {"train_loss": -26.015405654907227, "global_step": 334779, "epoch": 4033} {"train_loss": -25.551389694213867, "global_step": 334780, "epoch": 4033} {"train_loss": -26.211149215698242, "global_step": 334781, "epoch": 4033} {"train_loss": -26.036951065063477, "global_step": 334782, "epoch": 4033} {"train_loss": -26.3283634185791, "global_step": 334783, "epoch": 4033} {"train_loss": -26.057653427124023, "global_step": 334784, "epoch": 4033} {"train_loss": -26.098876953125, "global_step": 334785, "epoch": 4033} {"train_loss": -25.89474868774414, "global_step": 334786, "epoch": 4033} {"train_loss": -26.048187255859375, "global_step": 334787, "epoch": 4033} {"train_loss": -25.8109188079834, "global_step": 334788, "epoch": 4033} {"train_loss": -25.86382484436035, "global_step": 334789, "epoch": 4033} {"train_loss": -25.9576358795166, "global_step": 334790, "epoch": 4033} {"train_loss": -25.755773544311523, "global_step": 334791, "epoch": 4033} {"train_loss": -26.10028648376465, "global_step": 334792, "epoch": 4033} {"train_loss": -25.773141860961914, "global_step": 334793, "epoch": 4033} {"train_loss": -25.973020553588867, "global_step": 334794, "epoch": 4033} {"train_loss": -26.316381454467773, "global_step": 334795, "epoch": 4033} {"train_loss": -26.011905670166016, "global_step": 334796, "epoch": 4033} {"train_loss": -25.973773956298828, "global_step": 334797, "epoch": 4033} {"train_loss": -26.157913208007812, "global_step": 334798, "epoch": 4033} {"train_loss": -25.953994750976562, "global_step": 334799, "epoch": 4033} {"train_loss": -25.918363571166992, "global_step": 334800, "epoch": 4033} {"train_loss": -25.969236373901367, "global_step": 334801, "epoch": 4033} {"train_loss": -26.036855697631836, "global_step": 334802, "epoch": 4033} {"train_loss": -26.218225479125977, "global_step": 334803, "epoch": 4033} {"train_loss": -26.159229278564453, "global_step": 334804, "epoch": 4033} {"train_loss": -26.196691513061523, "global_step": 334805, "epoch": 4033} {"train_loss": -25.957258224487305, "global_step": 334806, "epoch": 4033} {"train_loss": -25.753997802734375, "global_step": 334807, "epoch": 4033} {"train_loss": -26.14436149597168, "global_step": 334808, "epoch": 4033} {"train_loss": -26.329334259033203, "global_step": 334809, "epoch": 4033} {"train_loss": -26.049428939819336, "global_step": 334810, "epoch": 4033} {"train_loss": -26.292036056518555, "global_step": 334811, "epoch": 4033} {"train_loss": -26.143583297729492, "global_step": 334812, "epoch": 4033} {"train_loss": -26.033954620361328, "global_step": 334813, "epoch": 4033} {"train_loss": -26.050033569335938, "global_step": 334814, "epoch": 4033} {"train_loss": -25.739545822143555, "global_step": 334815, "epoch": 4033} {"train_loss": -26.289783477783203, "global_step": 334816, "epoch": 4033} {"train_loss": -26.489593505859375, "global_step": 334817, "epoch": 4033} {"train_loss": -26.08335304260254, "global_step": 334818, "epoch": 4033} {"train_loss": -25.943603515625, "global_step": 334819, "epoch": 4033} {"train_loss": -25.740201950073242, "global_step": 334820, "epoch": 4033} {"train_loss": -25.949155095111895, "global_step": 334821, "epoch": 4033, "val_loss": 6783201.0} {"train_loss": -24.102636337280273, "global_step": 334822, "epoch": 4034} {"train_loss": -24.83639907836914, "global_step": 334823, "epoch": 4034} {"train_loss": -25.28973960876465, "global_step": 334824, "epoch": 4034} {"train_loss": -24.803138732910156, "global_step": 334825, "epoch": 4034} {"train_loss": -25.670093536376953, "global_step": 334826, "epoch": 4034} {"train_loss": -25.121580123901367, "global_step": 334827, "epoch": 4034} {"train_loss": -24.822275161743164, "global_step": 334828, "epoch": 4034} {"train_loss": -25.621124267578125, "global_step": 334829, "epoch": 4034} {"train_loss": -25.60407829284668, "global_step": 334830, "epoch": 4034} {"train_loss": -24.854446411132812, "global_step": 334831, "epoch": 4034} {"train_loss": -25.111156463623047, "global_step": 334832, "epoch": 4034} {"train_loss": -24.784454345703125, "global_step": 334833, "epoch": 4034} {"train_loss": -25.053279876708984, "global_step": 334834, "epoch": 4034} {"train_loss": -25.09917640686035, "global_step": 334835, "epoch": 4034} {"train_loss": -25.5120906829834, "global_step": 334836, "epoch": 4034} {"train_loss": -25.286279678344727, "global_step": 334837, "epoch": 4034} {"train_loss": -25.687728881835938, "global_step": 334838, "epoch": 4034} {"train_loss": -25.755828857421875, "global_step": 334839, "epoch": 4034} {"train_loss": -25.345561981201172, "global_step": 334840, "epoch": 4034} {"train_loss": -25.601505279541016, "global_step": 334841, "epoch": 4034} {"train_loss": -25.305418014526367, "global_step": 334842, "epoch": 4034} {"train_loss": -25.46786880493164, "global_step": 334843, "epoch": 4034} {"train_loss": -25.61484146118164, "global_step": 334844, "epoch": 4034} {"train_loss": -25.390920639038086, "global_step": 334845, "epoch": 4034} {"train_loss": -25.863080978393555, "global_step": 334846, "epoch": 4034} {"train_loss": -25.37476921081543, "global_step": 334847, "epoch": 4034} {"train_loss": -25.85896873474121, "global_step": 334848, "epoch": 4034} {"train_loss": -26.086994171142578, "global_step": 334849, "epoch": 4034} {"train_loss": -25.675537109375, "global_step": 334850, "epoch": 4034} {"train_loss": -25.7347412109375, "global_step": 334851, "epoch": 4034} {"train_loss": -25.571828842163086, "global_step": 334852, "epoch": 4034} {"train_loss": -25.781204223632812, "global_step": 334853, "epoch": 4034} {"train_loss": -26.171422958374023, "global_step": 334854, "epoch": 4034} {"train_loss": -25.95676040649414, "global_step": 334855, "epoch": 4034} {"train_loss": -26.002832412719727, "global_step": 334856, "epoch": 4034} {"train_loss": -25.9980525970459, "global_step": 334857, "epoch": 4034} {"train_loss": -25.926471710205078, "global_step": 334858, "epoch": 4034} {"train_loss": -26.2259464263916, "global_step": 334859, "epoch": 4034} {"train_loss": -26.070947647094727, "global_step": 334860, "epoch": 4034} {"train_loss": -26.391504287719727, "global_step": 334861, "epoch": 4034} {"train_loss": -26.26983070373535, "global_step": 334862, "epoch": 4034} {"train_loss": -26.191577911376953, "global_step": 334863, "epoch": 4034} {"train_loss": -26.20075035095215, "global_step": 334864, "epoch": 4034} {"train_loss": -25.84519386291504, "global_step": 334865, "epoch": 4034} {"train_loss": -26.031036376953125, "global_step": 334866, "epoch": 4034} {"train_loss": -26.486480712890625, "global_step": 334867, "epoch": 4034} {"train_loss": -26.268049240112305, "global_step": 334868, "epoch": 4034} {"train_loss": -26.19476890563965, "global_step": 334869, "epoch": 4034} {"train_loss": -26.15338134765625, "global_step": 334870, "epoch": 4034} {"train_loss": -26.26871109008789, "global_step": 334871, "epoch": 4034} {"train_loss": -26.426000595092773, "global_step": 334872, "epoch": 4034} {"train_loss": -26.242963790893555, "global_step": 334873, "epoch": 4034} {"train_loss": -26.249755859375, "global_step": 334874, "epoch": 4034} {"train_loss": -25.921146392822266, "global_step": 334875, "epoch": 4034} {"train_loss": -26.125608444213867, "global_step": 334876, "epoch": 4034} {"train_loss": -25.7509822845459, "global_step": 334877, "epoch": 4034} {"train_loss": -26.1612491607666, "global_step": 334878, "epoch": 4034} {"train_loss": -26.530527114868164, "global_step": 334879, "epoch": 4034} {"train_loss": -25.981842041015625, "global_step": 334880, "epoch": 4034} {"train_loss": -26.205530166625977, "global_step": 334881, "epoch": 4034} {"train_loss": -25.946399688720703, "global_step": 334882, "epoch": 4034} {"train_loss": -26.14129638671875, "global_step": 334883, "epoch": 4034} {"train_loss": -26.04257583618164, "global_step": 334884, "epoch": 4034} {"train_loss": -26.049413681030273, "global_step": 334885, "epoch": 4034} {"train_loss": -25.619953155517578, "global_step": 334886, "epoch": 4034} {"train_loss": -25.98011589050293, "global_step": 334887, "epoch": 4034} {"train_loss": -25.515501022338867, "global_step": 334888, "epoch": 4034} {"train_loss": -26.044492721557617, "global_step": 334889, "epoch": 4034} {"train_loss": -26.127511978149414, "global_step": 334890, "epoch": 4034} {"train_loss": -25.998920440673828, "global_step": 334891, "epoch": 4034} {"train_loss": -25.48835563659668, "global_step": 334892, "epoch": 4034} {"train_loss": -24.90978240966797, "global_step": 334893, "epoch": 4034} {"train_loss": -25.165815353393555, "global_step": 334894, "epoch": 4034} {"train_loss": -25.714385986328125, "global_step": 334895, "epoch": 4034} {"train_loss": -25.847360610961914, "global_step": 334896, "epoch": 4034} {"train_loss": -25.525775909423828, "global_step": 334897, "epoch": 4034} {"train_loss": -25.491174697875977, "global_step": 334898, "epoch": 4034} {"train_loss": -25.709070205688477, "global_step": 334899, "epoch": 4034} {"train_loss": -25.551300048828125, "global_step": 334900, "epoch": 4034} {"train_loss": -25.95060157775879, "global_step": 334901, "epoch": 4034} {"train_loss": -25.93585777282715, "global_step": 334902, "epoch": 4034} {"train_loss": -26.003189086914062, "global_step": 334903, "epoch": 4034} {"train_loss": -25.719507562108788, "global_step": 334904, "epoch": 4034, "val_loss": 6687464.0} {"train_loss": -25.715839385986328, "global_step": 334905, "epoch": 4035} {"train_loss": -25.8179931640625, "global_step": 334906, "epoch": 4035} {"train_loss": -25.64313316345215, "global_step": 334907, "epoch": 4035} {"train_loss": -26.03534507751465, "global_step": 334908, "epoch": 4035} {"train_loss": -25.812429428100586, "global_step": 334909, "epoch": 4035} {"train_loss": -25.577678680419922, "global_step": 334910, "epoch": 4035} {"train_loss": -25.703271865844727, "global_step": 334911, "epoch": 4035} {"train_loss": -25.637304306030273, "global_step": 334912, "epoch": 4035} {"train_loss": -25.937671661376953, "global_step": 334913, "epoch": 4035} {"train_loss": -25.812088012695312, "global_step": 334914, "epoch": 4035} {"train_loss": -25.813922882080078, "global_step": 334915, "epoch": 4035} {"train_loss": -25.7540283203125, "global_step": 334916, "epoch": 4035} {"train_loss": -25.791711807250977, "global_step": 334917, "epoch": 4035} {"train_loss": -26.014484405517578, "global_step": 334918, "epoch": 4035} {"train_loss": -25.83515739440918, "global_step": 334919, "epoch": 4035} {"train_loss": -26.119293212890625, "global_step": 334920, "epoch": 4035} {"train_loss": -25.923389434814453, "global_step": 334921, "epoch": 4035} {"train_loss": -26.018091201782227, "global_step": 334922, "epoch": 4035} {"train_loss": -26.341232299804688, "global_step": 334923, "epoch": 4035} {"train_loss": -25.973779678344727, "global_step": 334924, "epoch": 4035} {"train_loss": -25.933364868164062, "global_step": 334925, "epoch": 4035} {"train_loss": -26.040807723999023, "global_step": 334926, "epoch": 4035} {"train_loss": -25.868345260620117, "global_step": 334927, "epoch": 4035} {"train_loss": -25.932891845703125, "global_step": 334928, "epoch": 4035} {"train_loss": -25.937454223632812, "global_step": 334929, "epoch": 4035} {"train_loss": -26.302343368530273, "global_step": 334930, "epoch": 4035} {"train_loss": -25.84673500061035, "global_step": 334931, "epoch": 4035} {"train_loss": -26.01481056213379, "global_step": 334932, "epoch": 4035} {"train_loss": -25.9200439453125, "global_step": 334933, "epoch": 4035} {"train_loss": -26.31098747253418, "global_step": 334934, "epoch": 4035} {"train_loss": -26.32293128967285, "global_step": 334935, "epoch": 4035} {"train_loss": -25.93107032775879, "global_step": 334936, "epoch": 4035} {"train_loss": -26.020862579345703, "global_step": 334937, "epoch": 4035} {"train_loss": -25.9046630859375, "global_step": 334938, "epoch": 4035} {"train_loss": -26.113046646118164, "global_step": 334939, "epoch": 4035} {"train_loss": -26.018030166625977, "global_step": 334940, "epoch": 4035} {"train_loss": -26.168729782104492, "global_step": 334941, "epoch": 4035} {"train_loss": -26.236799240112305, "global_step": 334942, "epoch": 4035} {"train_loss": -26.144062042236328, "global_step": 334943, "epoch": 4035} {"train_loss": -26.16449546813965, "global_step": 334944, "epoch": 4035} {"train_loss": -25.704755783081055, "global_step": 334945, "epoch": 4035} {"train_loss": -25.780858993530273, "global_step": 334946, "epoch": 4035} {"train_loss": -25.810453414916992, "global_step": 334947, "epoch": 4035} {"train_loss": -25.689062118530273, "global_step": 334948, "epoch": 4035} {"train_loss": -25.918256759643555, "global_step": 334949, "epoch": 4035} {"train_loss": -26.12275505065918, "global_step": 334950, "epoch": 4035} {"train_loss": -26.185443878173828, "global_step": 334951, "epoch": 4035} {"train_loss": -26.304290771484375, "global_step": 334952, "epoch": 4035} {"train_loss": -26.01179313659668, "global_step": 334953, "epoch": 4035} {"train_loss": -25.741952896118164, "global_step": 334954, "epoch": 4035} {"train_loss": -26.2746639251709, "global_step": 334955, "epoch": 4035} {"train_loss": -26.088693618774414, "global_step": 334956, "epoch": 4035} {"train_loss": -26.400793075561523, "global_step": 334957, "epoch": 4035} {"train_loss": -26.05632972717285, "global_step": 334958, "epoch": 4035} {"train_loss": -25.6927490234375, "global_step": 334959, "epoch": 4035} {"train_loss": -26.14235496520996, "global_step": 334960, "epoch": 4035} {"train_loss": -26.450525283813477, "global_step": 334961, "epoch": 4035} {"train_loss": -26.2999324798584, "global_step": 334962, "epoch": 4035} {"train_loss": -26.05267906188965, "global_step": 334963, "epoch": 4035} {"train_loss": -26.0596923828125, "global_step": 334964, "epoch": 4035} {"train_loss": -26.008962631225586, "global_step": 334965, "epoch": 4035} {"train_loss": -26.11323356628418, "global_step": 334966, "epoch": 4035} {"train_loss": -26.457651138305664, "global_step": 334967, "epoch": 4035} {"train_loss": -26.03681755065918, "global_step": 334968, "epoch": 4035} {"train_loss": -25.96514320373535, "global_step": 334969, "epoch": 4035} {"train_loss": -26.271743774414062, "global_step": 334970, "epoch": 4035} {"train_loss": -26.263797760009766, "global_step": 334971, "epoch": 4035} {"train_loss": -26.292633056640625, "global_step": 334972, "epoch": 4035} {"train_loss": -26.216922760009766, "global_step": 334973, "epoch": 4035} {"train_loss": -25.5328426361084, "global_step": 334974, "epoch": 4035} {"train_loss": -26.4967098236084, "global_step": 334975, "epoch": 4035} {"train_loss": -26.262353897094727, "global_step": 334976, "epoch": 4035} {"train_loss": -25.999967575073242, "global_step": 334977, "epoch": 4035} {"train_loss": -25.554624557495117, "global_step": 334978, "epoch": 4035} {"train_loss": -25.85190773010254, "global_step": 334979, "epoch": 4035} {"train_loss": -26.31446647644043, "global_step": 334980, "epoch": 4035} {"train_loss": -25.91525650024414, "global_step": 334981, "epoch": 4035} {"train_loss": -25.594030380249023, "global_step": 334982, "epoch": 4035} {"train_loss": -25.44464111328125, "global_step": 334983, "epoch": 4035} {"train_loss": -25.033761978149414, "global_step": 334984, "epoch": 4035} {"train_loss": -25.70283317565918, "global_step": 334985, "epoch": 4035} {"train_loss": -25.678241729736328, "global_step": 334986, "epoch": 4035} {"train_loss": -25.972041578177947, "global_step": 334987, "epoch": 4035, "val_loss": 6713586.0} {"train_loss": -24.49455451965332, "global_step": 334988, "epoch": 4036} {"train_loss": -24.908843994140625, "global_step": 334989, "epoch": 4036} {"train_loss": -25.445518493652344, "global_step": 334990, "epoch": 4036} {"train_loss": -24.46343421936035, "global_step": 334991, "epoch": 4036} {"train_loss": -25.02970314025879, "global_step": 334992, "epoch": 4036} {"train_loss": -24.82588005065918, "global_step": 334993, "epoch": 4036} {"train_loss": -25.156230926513672, "global_step": 334994, "epoch": 4036} {"train_loss": -24.692907333374023, "global_step": 334995, "epoch": 4036} {"train_loss": -24.96908187866211, "global_step": 334996, "epoch": 4036} {"train_loss": -25.042848587036133, "global_step": 334997, "epoch": 4036} {"train_loss": -25.126020431518555, "global_step": 334998, "epoch": 4036} {"train_loss": -25.21192741394043, "global_step": 334999, "epoch": 4036} {"train_loss": -25.067258834838867, "global_step": 335000, "epoch": 4036} {"train_loss": -25.18907356262207, "global_step": 335001, "epoch": 4036} {"train_loss": -25.246000289916992, "global_step": 335002, "epoch": 4036} {"train_loss": -25.32315444946289, "global_step": 335003, "epoch": 4036} {"train_loss": -25.409086227416992, "global_step": 335004, "epoch": 4036} {"train_loss": -25.546598434448242, "global_step": 335005, "epoch": 4036} {"train_loss": -25.46832847595215, "global_step": 335006, "epoch": 4036} {"train_loss": -25.590559005737305, "global_step": 335007, "epoch": 4036} {"train_loss": -25.602060317993164, "global_step": 335008, "epoch": 4036} {"train_loss": -25.528165817260742, "global_step": 335009, "epoch": 4036} {"train_loss": -25.471389770507812, "global_step": 335010, "epoch": 4036} {"train_loss": -25.610950469970703, "global_step": 335011, "epoch": 4036} {"train_loss": -25.687673568725586, "global_step": 335012, "epoch": 4036} {"train_loss": -25.73763084411621, "global_step": 335013, "epoch": 4036} {"train_loss": -25.581262588500977, "global_step": 335014, "epoch": 4036} {"train_loss": -25.795578002929688, "global_step": 335015, "epoch": 4036} {"train_loss": -25.620969772338867, "global_step": 335016, "epoch": 4036} {"train_loss": -25.94247817993164, "global_step": 335017, "epoch": 4036} {"train_loss": -25.60801124572754, "global_step": 335018, "epoch": 4036} {"train_loss": -26.007062911987305, "global_step": 335019, "epoch": 4036} {"train_loss": -25.708005905151367, "global_step": 335020, "epoch": 4036} {"train_loss": -25.8891544342041, "global_step": 335021, "epoch": 4036} {"train_loss": -25.906396865844727, "global_step": 335022, "epoch": 4036} {"train_loss": -26.00471305847168, "global_step": 335023, "epoch": 4036} {"train_loss": -25.993778228759766, "global_step": 335024, "epoch": 4036} {"train_loss": -26.20294761657715, "global_step": 335025, "epoch": 4036} {"train_loss": -26.305118560791016, "global_step": 335026, "epoch": 4036} {"train_loss": -26.087116241455078, "global_step": 335027, "epoch": 4036} {"train_loss": -26.028493881225586, "global_step": 335028, "epoch": 4036} {"train_loss": -26.081396102905273, "global_step": 335029, "epoch": 4036} {"train_loss": -25.9777889251709, "global_step": 335030, "epoch": 4036} {"train_loss": -26.412954330444336, "global_step": 335031, "epoch": 4036} {"train_loss": -26.233083724975586, "global_step": 335032, "epoch": 4036} {"train_loss": -25.780542373657227, "global_step": 335033, "epoch": 4036} {"train_loss": -26.10125732421875, "global_step": 335034, "epoch": 4036} {"train_loss": -26.202423095703125, "global_step": 335035, "epoch": 4036} {"train_loss": -25.73345375061035, "global_step": 335036, "epoch": 4036} {"train_loss": -26.040802001953125, "global_step": 335037, "epoch": 4036} {"train_loss": -26.265233993530273, "global_step": 335038, "epoch": 4036} {"train_loss": -26.0465145111084, "global_step": 335039, "epoch": 4036} {"train_loss": -26.38616371154785, "global_step": 335040, "epoch": 4036} {"train_loss": -26.184982299804688, "global_step": 335041, "epoch": 4036} {"train_loss": -26.419483184814453, "global_step": 335042, "epoch": 4036} {"train_loss": -26.27125358581543, "global_step": 335043, "epoch": 4036} {"train_loss": -25.975271224975586, "global_step": 335044, "epoch": 4036} {"train_loss": -25.870269775390625, "global_step": 335045, "epoch": 4036} {"train_loss": -26.083234786987305, "global_step": 335046, "epoch": 4036} {"train_loss": -25.88116455078125, "global_step": 335047, "epoch": 4036} {"train_loss": -26.33930015563965, "global_step": 335048, "epoch": 4036} {"train_loss": -26.202478408813477, "global_step": 335049, "epoch": 4036} {"train_loss": -26.278701782226562, "global_step": 335050, "epoch": 4036} {"train_loss": -26.289438247680664, "global_step": 335051, "epoch": 4036} {"train_loss": -26.06831932067871, "global_step": 335052, "epoch": 4036} {"train_loss": -26.32208824157715, "global_step": 335053, "epoch": 4036} {"train_loss": -26.433917999267578, "global_step": 335054, "epoch": 4036} {"train_loss": -26.073322296142578, "global_step": 335055, "epoch": 4036} {"train_loss": -26.309844970703125, "global_step": 335056, "epoch": 4036} {"train_loss": -26.22568130493164, "global_step": 335057, "epoch": 4036} {"train_loss": -26.323347091674805, "global_step": 335058, "epoch": 4036} {"train_loss": -26.01051139831543, "global_step": 335059, "epoch": 4036} {"train_loss": -25.737943649291992, "global_step": 335060, "epoch": 4036} {"train_loss": -25.35466766357422, "global_step": 335061, "epoch": 4036} {"train_loss": -24.967390060424805, "global_step": 335062, "epoch": 4036} {"train_loss": -25.625171661376953, "global_step": 335063, "epoch": 4036} {"train_loss": -26.069189071655273, "global_step": 335064, "epoch": 4036} {"train_loss": -25.68218994140625, "global_step": 335065, "epoch": 4036} {"train_loss": -25.8437557220459, "global_step": 335066, "epoch": 4036} {"train_loss": -25.759052276611328, "global_step": 335067, "epoch": 4036} {"train_loss": -25.618616104125977, "global_step": 335068, "epoch": 4036} {"train_loss": -25.880407333374023, "global_step": 335069, "epoch": 4036} {"train_loss": -25.757829804018318, "global_step": 335070, "epoch": 4036, "val_loss": 6760088.0} {"train_loss": -25.229455947875977, "global_step": 335071, "epoch": 4037} {"train_loss": -25.278156280517578, "global_step": 335072, "epoch": 4037} {"train_loss": -25.46388816833496, "global_step": 335073, "epoch": 4037} {"train_loss": -25.768537521362305, "global_step": 335074, "epoch": 4037} {"train_loss": -25.37757682800293, "global_step": 335075, "epoch": 4037} {"train_loss": -25.298696517944336, "global_step": 335076, "epoch": 4037} {"train_loss": -25.982282638549805, "global_step": 335077, "epoch": 4037} {"train_loss": -25.40526008605957, "global_step": 335078, "epoch": 4037} {"train_loss": -25.58454132080078, "global_step": 335079, "epoch": 4037} {"train_loss": -24.99163246154785, "global_step": 335080, "epoch": 4037} {"train_loss": -25.446699142456055, "global_step": 335081, "epoch": 4037} {"train_loss": -25.714385986328125, "global_step": 335082, "epoch": 4037} {"train_loss": -25.57282829284668, "global_step": 335083, "epoch": 4037} {"train_loss": -25.800764083862305, "global_step": 335084, "epoch": 4037} {"train_loss": -25.493860244750977, "global_step": 335085, "epoch": 4037} {"train_loss": -26.10273551940918, "global_step": 335086, "epoch": 4037} {"train_loss": -25.716999053955078, "global_step": 335087, "epoch": 4037} {"train_loss": -25.76300621032715, "global_step": 335088, "epoch": 4037} {"train_loss": -25.873291015625, "global_step": 335089, "epoch": 4037} {"train_loss": -26.008569717407227, "global_step": 335090, "epoch": 4037} {"train_loss": -25.874725341796875, "global_step": 335091, "epoch": 4037} {"train_loss": -25.746915817260742, "global_step": 335092, "epoch": 4037} {"train_loss": -25.830915451049805, "global_step": 335093, "epoch": 4037} {"train_loss": -25.861509323120117, "global_step": 335094, "epoch": 4037} {"train_loss": -25.997547149658203, "global_step": 335095, "epoch": 4037} {"train_loss": -26.023883819580078, "global_step": 335096, "epoch": 4037} {"train_loss": -26.0073299407959, "global_step": 335097, "epoch": 4037} {"train_loss": -26.037311553955078, "global_step": 335098, "epoch": 4037} {"train_loss": -26.1530818939209, "global_step": 335099, "epoch": 4037} {"train_loss": -25.845388412475586, "global_step": 335100, "epoch": 4037} {"train_loss": -25.780654907226562, "global_step": 335101, "epoch": 4037} {"train_loss": -26.1263370513916, "global_step": 335102, "epoch": 4037} {"train_loss": -26.173688888549805, "global_step": 335103, "epoch": 4037} {"train_loss": -26.02743911743164, "global_step": 335104, "epoch": 4037} {"train_loss": -25.942829132080078, "global_step": 335105, "epoch": 4037} {"train_loss": -25.834915161132812, "global_step": 335106, "epoch": 4037} {"train_loss": -25.8564395904541, "global_step": 335107, "epoch": 4037} {"train_loss": -26.3232479095459, "global_step": 335108, "epoch": 4037} {"train_loss": -26.304040908813477, "global_step": 335109, "epoch": 4037} {"train_loss": -26.19464111328125, "global_step": 335110, "epoch": 4037} {"train_loss": -26.242889404296875, "global_step": 335111, "epoch": 4037} {"train_loss": -26.47430419921875, "global_step": 335112, "epoch": 4037} {"train_loss": -25.804794311523438, "global_step": 335113, "epoch": 4037} {"train_loss": -25.9488525390625, "global_step": 335114, "epoch": 4037} {"train_loss": -26.12908363342285, "global_step": 335115, "epoch": 4037} {"train_loss": -26.373260498046875, "global_step": 335116, "epoch": 4037} {"train_loss": -26.22076988220215, "global_step": 335117, "epoch": 4037} {"train_loss": -26.346078872680664, "global_step": 335118, "epoch": 4037} {"train_loss": -26.291257858276367, "global_step": 335119, "epoch": 4037} {"train_loss": -26.080520629882812, "global_step": 335120, "epoch": 4037} {"train_loss": -26.360193252563477, "global_step": 335121, "epoch": 4037} {"train_loss": -26.180908203125, "global_step": 335122, "epoch": 4037} {"train_loss": -26.24837303161621, "global_step": 335123, "epoch": 4037} {"train_loss": -26.410736083984375, "global_step": 335124, "epoch": 4037} {"train_loss": -26.318790435791016, "global_step": 335125, "epoch": 4037} {"train_loss": -26.395517349243164, "global_step": 335126, "epoch": 4037} {"train_loss": -26.20940589904785, "global_step": 335127, "epoch": 4037} {"train_loss": -25.989294052124023, "global_step": 335128, "epoch": 4037} {"train_loss": -26.24433708190918, "global_step": 335129, "epoch": 4037} {"train_loss": -25.578935623168945, "global_step": 335130, "epoch": 4037} {"train_loss": -26.084609985351562, "global_step": 335131, "epoch": 4037} {"train_loss": -26.3676815032959, "global_step": 335132, "epoch": 4037} {"train_loss": -25.84450340270996, "global_step": 335133, "epoch": 4037} {"train_loss": -25.733610153198242, "global_step": 335134, "epoch": 4037} {"train_loss": -25.702423095703125, "global_step": 335135, "epoch": 4037} {"train_loss": -25.8029842376709, "global_step": 335136, "epoch": 4037} {"train_loss": -25.917577743530273, "global_step": 335137, "epoch": 4037} {"train_loss": -25.79099464416504, "global_step": 335138, "epoch": 4037} {"train_loss": -26.108346939086914, "global_step": 335139, "epoch": 4037} {"train_loss": -26.025121688842773, "global_step": 335140, "epoch": 4037} {"train_loss": -26.23428726196289, "global_step": 335141, "epoch": 4037} {"train_loss": -26.13185691833496, "global_step": 335142, "epoch": 4037} {"train_loss": -25.96851921081543, "global_step": 335143, "epoch": 4037} {"train_loss": -26.068063735961914, "global_step": 335144, "epoch": 4037} {"train_loss": -26.155597686767578, "global_step": 335145, "epoch": 4037} {"train_loss": -25.9398193359375, "global_step": 335146, "epoch": 4037} {"train_loss": -25.708053588867188, "global_step": 335147, "epoch": 4037} {"train_loss": -25.21608543395996, "global_step": 335148, "epoch": 4037} {"train_loss": -24.960304260253906, "global_step": 335149, "epoch": 4037} {"train_loss": -24.19849967956543, "global_step": 335150, "epoch": 4037} {"train_loss": -25.00361442565918, "global_step": 335151, "epoch": 4037} {"train_loss": -25.640182495117188, "global_step": 335152, "epoch": 4037} {"train_loss": -25.86951285672475, "global_step": 335153, "epoch": 4037, "val_loss": 6813486.0} {"train_loss": -22.621408462524414, "global_step": 335154, "epoch": 4038} {"train_loss": -24.140514373779297, "global_step": 335155, "epoch": 4038} {"train_loss": -23.631206512451172, "global_step": 335156, "epoch": 4038} {"train_loss": -23.97458267211914, "global_step": 335157, "epoch": 4038} {"train_loss": -24.232511520385742, "global_step": 335158, "epoch": 4038} {"train_loss": -23.34866714477539, "global_step": 335159, "epoch": 4038} {"train_loss": -24.579029083251953, "global_step": 335160, "epoch": 4038} {"train_loss": -24.69489288330078, "global_step": 335161, "epoch": 4038} {"train_loss": -24.071216583251953, "global_step": 335162, "epoch": 4038} {"train_loss": -24.49519157409668, "global_step": 335163, "epoch": 4038} {"train_loss": -24.757787704467773, "global_step": 335164, "epoch": 4038} {"train_loss": -24.81412124633789, "global_step": 335165, "epoch": 4038} {"train_loss": -25.0259952545166, "global_step": 335166, "epoch": 4038} {"train_loss": -24.870010375976562, "global_step": 335167, "epoch": 4038} {"train_loss": -25.11259651184082, "global_step": 335168, "epoch": 4038} {"train_loss": -25.25928497314453, "global_step": 335169, "epoch": 4038} {"train_loss": -25.13193130493164, "global_step": 335170, "epoch": 4038} {"train_loss": -25.180191040039062, "global_step": 335171, "epoch": 4038} {"train_loss": -24.91213607788086, "global_step": 335172, "epoch": 4038} {"train_loss": -25.041244506835938, "global_step": 335173, "epoch": 4038} {"train_loss": -25.11474609375, "global_step": 335174, "epoch": 4038} {"train_loss": -25.010589599609375, "global_step": 335175, "epoch": 4038} {"train_loss": -25.294008255004883, "global_step": 335176, "epoch": 4038} {"train_loss": -25.407459259033203, "global_step": 335177, "epoch": 4038} {"train_loss": -25.303525924682617, "global_step": 335178, "epoch": 4038} {"train_loss": -25.68033790588379, "global_step": 335179, "epoch": 4038} {"train_loss": -25.18842887878418, "global_step": 335180, "epoch": 4038} {"train_loss": -25.483434677124023, "global_step": 335181, "epoch": 4038} {"train_loss": -25.52591323852539, "global_step": 335182, "epoch": 4038} {"train_loss": -25.418787002563477, "global_step": 335183, "epoch": 4038} {"train_loss": -25.6646671295166, "global_step": 335184, "epoch": 4038} {"train_loss": -25.623004913330078, "global_step": 335185, "epoch": 4038} {"train_loss": -25.682056427001953, "global_step": 335186, "epoch": 4038} {"train_loss": -25.46964454650879, "global_step": 335187, "epoch": 4038} {"train_loss": -25.940664291381836, "global_step": 335188, "epoch": 4038} {"train_loss": -25.766733169555664, "global_step": 335189, "epoch": 4038} {"train_loss": -25.602563858032227, "global_step": 335190, "epoch": 4038} {"train_loss": -25.485509872436523, "global_step": 335191, "epoch": 4038} {"train_loss": -25.8035945892334, "global_step": 335192, "epoch": 4038} {"train_loss": -25.66310691833496, "global_step": 335193, "epoch": 4038} {"train_loss": -25.90481948852539, "global_step": 335194, "epoch": 4038} {"train_loss": -25.86164665222168, "global_step": 335195, "epoch": 4038} {"train_loss": -25.772817611694336, "global_step": 335196, "epoch": 4038} {"train_loss": -25.71744155883789, "global_step": 335197, "epoch": 4038} {"train_loss": -25.844207763671875, "global_step": 335198, "epoch": 4038} {"train_loss": -25.86530113220215, "global_step": 335199, "epoch": 4038} {"train_loss": -25.95496940612793, "global_step": 335200, "epoch": 4038} {"train_loss": -25.85274314880371, "global_step": 335201, "epoch": 4038} {"train_loss": -26.058210372924805, "global_step": 335202, "epoch": 4038} {"train_loss": -25.969608306884766, "global_step": 335203, "epoch": 4038} {"train_loss": -26.2646484375, "global_step": 335204, "epoch": 4038} {"train_loss": -26.268232345581055, "global_step": 335205, "epoch": 4038} {"train_loss": -25.763051986694336, "global_step": 335206, "epoch": 4038} {"train_loss": -25.99076271057129, "global_step": 335207, "epoch": 4038} {"train_loss": -25.895553588867188, "global_step": 335208, "epoch": 4038} {"train_loss": -26.13629150390625, "global_step": 335209, "epoch": 4038} {"train_loss": -25.469205856323242, "global_step": 335210, "epoch": 4038} {"train_loss": -25.51827049255371, "global_step": 335211, "epoch": 4038} {"train_loss": -25.552907943725586, "global_step": 335212, "epoch": 4038} {"train_loss": -26.0140323638916, "global_step": 335213, "epoch": 4038} {"train_loss": -25.8154239654541, "global_step": 335214, "epoch": 4038} {"train_loss": -25.832956314086914, "global_step": 335215, "epoch": 4038} {"train_loss": -26.00048828125, "global_step": 335216, "epoch": 4038} {"train_loss": -26.041730880737305, "global_step": 335217, "epoch": 4038} {"train_loss": -26.268407821655273, "global_step": 335218, "epoch": 4038} {"train_loss": -26.0853271484375, "global_step": 335219, "epoch": 4038} {"train_loss": -26.04029655456543, "global_step": 335220, "epoch": 4038} {"train_loss": -26.100311279296875, "global_step": 335221, "epoch": 4038} {"train_loss": -26.301593780517578, "global_step": 335222, "epoch": 4038} {"train_loss": -25.816925048828125, "global_step": 335223, "epoch": 4038} {"train_loss": -25.826141357421875, "global_step": 335224, "epoch": 4038} {"train_loss": -26.003732681274414, "global_step": 335225, "epoch": 4038} {"train_loss": -26.019269943237305, "global_step": 335226, "epoch": 4038} {"train_loss": -26.080596923828125, "global_step": 335227, "epoch": 4038} {"train_loss": -26.278305053710938, "global_step": 335228, "epoch": 4038} {"train_loss": -25.886743545532227, "global_step": 335229, "epoch": 4038} {"train_loss": -26.090972900390625, "global_step": 335230, "epoch": 4038} {"train_loss": -26.07254409790039, "global_step": 335231, "epoch": 4038} {"train_loss": -25.872251510620117, "global_step": 335232, "epoch": 4038} {"train_loss": -26.104887008666992, "global_step": 335233, "epoch": 4038} {"train_loss": -26.00968360900879, "global_step": 335234, "epoch": 4038} {"train_loss": -26.355215072631836, "global_step": 335235, "epoch": 4038} {"train_loss": -25.516918113432734, "global_step": 335236, "epoch": 4038, "val_loss": 6730474.0} {"train_loss": -25.841617584228516, "global_step": 335237, "epoch": 4039} {"train_loss": -25.771772384643555, "global_step": 335238, "epoch": 4039} {"train_loss": -25.947986602783203, "global_step": 335239, "epoch": 4039} {"train_loss": -25.715042114257812, "global_step": 335240, "epoch": 4039} {"train_loss": -26.170373916625977, "global_step": 335241, "epoch": 4039} {"train_loss": -26.00882911682129, "global_step": 335242, "epoch": 4039} {"train_loss": -25.824987411499023, "global_step": 335243, "epoch": 4039} {"train_loss": -25.87064552307129, "global_step": 335244, "epoch": 4039} {"train_loss": -25.6337890625, "global_step": 335245, "epoch": 4039} {"train_loss": -25.952381134033203, "global_step": 335246, "epoch": 4039} {"train_loss": -25.9475154876709, "global_step": 335247, "epoch": 4039} {"train_loss": -25.87774658203125, "global_step": 335248, "epoch": 4039} {"train_loss": -26.410327911376953, "global_step": 335249, "epoch": 4039} {"train_loss": -25.9274959564209, "global_step": 335250, "epoch": 4039} {"train_loss": -26.098052978515625, "global_step": 335251, "epoch": 4039} {"train_loss": -26.085729598999023, "global_step": 335252, "epoch": 4039} {"train_loss": -26.26255226135254, "global_step": 335253, "epoch": 4039} {"train_loss": -25.711774826049805, "global_step": 335254, "epoch": 4039} {"train_loss": -25.936506271362305, "global_step": 335255, "epoch": 4039} {"train_loss": -25.831125259399414, "global_step": 335256, "epoch": 4039} {"train_loss": -26.266422271728516, "global_step": 335257, "epoch": 4039} {"train_loss": -25.344205856323242, "global_step": 335258, "epoch": 4039} {"train_loss": -25.011474609375, "global_step": 335259, "epoch": 4039} {"train_loss": -25.84929847717285, "global_step": 335260, "epoch": 4039} {"train_loss": -26.03592300415039, "global_step": 335261, "epoch": 4039} {"train_loss": -26.573688507080078, "global_step": 335262, "epoch": 4039} {"train_loss": -25.599668502807617, "global_step": 335263, "epoch": 4039} {"train_loss": -25.930072784423828, "global_step": 335264, "epoch": 4039} {"train_loss": -25.679731369018555, "global_step": 335265, "epoch": 4039} {"train_loss": -25.937610626220703, "global_step": 335266, "epoch": 4039} {"train_loss": -25.90374183654785, "global_step": 335267, "epoch": 4039} {"train_loss": -26.063589096069336, "global_step": 335268, "epoch": 4039} {"train_loss": -25.728775024414062, "global_step": 335269, "epoch": 4039} {"train_loss": -25.678632736206055, "global_step": 335270, "epoch": 4039} {"train_loss": -26.19085121154785, "global_step": 335271, "epoch": 4039} {"train_loss": -25.80743408203125, "global_step": 335272, "epoch": 4039} {"train_loss": -26.02949333190918, "global_step": 335273, "epoch": 4039} {"train_loss": -25.95168113708496, "global_step": 335274, "epoch": 4039} {"train_loss": -25.793060302734375, "global_step": 335275, "epoch": 4039} {"train_loss": -26.18659782409668, "global_step": 335276, "epoch": 4039} {"train_loss": -25.954410552978516, "global_step": 335277, "epoch": 4039} {"train_loss": -26.21261978149414, "global_step": 335278, "epoch": 4039} {"train_loss": -25.88617515563965, "global_step": 335279, "epoch": 4039} {"train_loss": -26.335147857666016, "global_step": 335280, "epoch": 4039} {"train_loss": -25.84513282775879, "global_step": 335281, "epoch": 4039} {"train_loss": -26.097492218017578, "global_step": 335282, "epoch": 4039} {"train_loss": -26.21319580078125, "global_step": 335283, "epoch": 4039} {"train_loss": -26.218524932861328, "global_step": 335284, "epoch": 4039} {"train_loss": -26.192535400390625, "global_step": 335285, "epoch": 4039} {"train_loss": -25.8293514251709, "global_step": 335286, "epoch": 4039} {"train_loss": -26.19217872619629, "global_step": 335287, "epoch": 4039} {"train_loss": -25.731735229492188, "global_step": 335288, "epoch": 4039} {"train_loss": -26.35706901550293, "global_step": 335289, "epoch": 4039} {"train_loss": -26.346988677978516, "global_step": 335290, "epoch": 4039} {"train_loss": -25.81001853942871, "global_step": 335291, "epoch": 4039} {"train_loss": -26.03241539001465, "global_step": 335292, "epoch": 4039} {"train_loss": -25.896997451782227, "global_step": 335293, "epoch": 4039} {"train_loss": -25.835142135620117, "global_step": 335294, "epoch": 4039} {"train_loss": -26.356138229370117, "global_step": 335295, "epoch": 4039} {"train_loss": -26.263341903686523, "global_step": 335296, "epoch": 4039} {"train_loss": -26.540510177612305, "global_step": 335297, "epoch": 4039} {"train_loss": -26.019575119018555, "global_step": 335298, "epoch": 4039} {"train_loss": -26.09807777404785, "global_step": 335299, "epoch": 4039} {"train_loss": -25.85761070251465, "global_step": 335300, "epoch": 4039} {"train_loss": -25.79889488220215, "global_step": 335301, "epoch": 4039} {"train_loss": -25.498563766479492, "global_step": 335302, "epoch": 4039} {"train_loss": -25.7117977142334, "global_step": 335303, "epoch": 4039} {"train_loss": -26.020679473876953, "global_step": 335304, "epoch": 4039} {"train_loss": -26.270612716674805, "global_step": 335305, "epoch": 4039} {"train_loss": -26.020694732666016, "global_step": 335306, "epoch": 4039} {"train_loss": -26.15177345275879, "global_step": 335307, "epoch": 4039} {"train_loss": -26.422428131103516, "global_step": 335308, "epoch": 4039} {"train_loss": -26.086536407470703, "global_step": 335309, "epoch": 4039} {"train_loss": -26.086042404174805, "global_step": 335310, "epoch": 4039} {"train_loss": -25.97503089904785, "global_step": 335311, "epoch": 4039} {"train_loss": -26.2120304107666, "global_step": 335312, "epoch": 4039} {"train_loss": -25.98992347717285, "global_step": 335313, "epoch": 4039} {"train_loss": -25.825098037719727, "global_step": 335314, "epoch": 4039} {"train_loss": -26.16425132751465, "global_step": 335315, "epoch": 4039} {"train_loss": -26.49175453186035, "global_step": 335316, "epoch": 4039} {"train_loss": -26.33966064453125, "global_step": 335317, "epoch": 4039} {"train_loss": -26.14862632751465, "global_step": 335318, "epoch": 4039} {"train_loss": -25.99587385338473, "global_step": 335319, "epoch": 4039, "val_loss": 6696782.0} {"train_loss": -26.099279403686523, "global_step": 335320, "epoch": 4040} {"train_loss": -25.818878173828125, "global_step": 335321, "epoch": 4040} {"train_loss": -25.321447372436523, "global_step": 335322, "epoch": 4040} {"train_loss": -25.478530883789062, "global_step": 335323, "epoch": 4040} {"train_loss": -25.949146270751953, "global_step": 335324, "epoch": 4040} {"train_loss": -25.375261306762695, "global_step": 335325, "epoch": 4040} {"train_loss": -25.656042098999023, "global_step": 335326, "epoch": 4040} {"train_loss": -25.87042236328125, "global_step": 335327, "epoch": 4040} {"train_loss": -25.744245529174805, "global_step": 335328, "epoch": 4040} {"train_loss": -25.83277702331543, "global_step": 335329, "epoch": 4040} {"train_loss": -26.10474967956543, "global_step": 335330, "epoch": 4040} {"train_loss": -25.79559326171875, "global_step": 335331, "epoch": 4040} {"train_loss": -26.044677734375, "global_step": 335332, "epoch": 4040} {"train_loss": -25.623266220092773, "global_step": 335333, "epoch": 4040} {"train_loss": -25.603260040283203, "global_step": 335334, "epoch": 4040} {"train_loss": -26.22014808654785, "global_step": 335335, "epoch": 4040} {"train_loss": -25.89813804626465, "global_step": 335336, "epoch": 4040} {"train_loss": -25.799407958984375, "global_step": 335337, "epoch": 4040} {"train_loss": -25.952381134033203, "global_step": 335338, "epoch": 4040} {"train_loss": -26.04705810546875, "global_step": 335339, "epoch": 4040} {"train_loss": -25.891376495361328, "global_step": 335340, "epoch": 4040} {"train_loss": -25.966053009033203, "global_step": 335341, "epoch": 4040} {"train_loss": -26.139759063720703, "global_step": 335342, "epoch": 4040} {"train_loss": -25.8865909576416, "global_step": 335343, "epoch": 4040} {"train_loss": -26.048215866088867, "global_step": 335344, "epoch": 4040} {"train_loss": -26.1298770904541, "global_step": 335345, "epoch": 4040} {"train_loss": -26.179306030273438, "global_step": 335346, "epoch": 4040} {"train_loss": -26.183032989501953, "global_step": 335347, "epoch": 4040} {"train_loss": -26.131488800048828, "global_step": 335348, "epoch": 4040} {"train_loss": -25.8321533203125, "global_step": 335349, "epoch": 4040} {"train_loss": -26.24100685119629, "global_step": 335350, "epoch": 4040} {"train_loss": -26.18409538269043, "global_step": 335351, "epoch": 4040} {"train_loss": -26.36712074279785, "global_step": 335352, "epoch": 4040} {"train_loss": -26.363950729370117, "global_step": 335353, "epoch": 4040} {"train_loss": -26.35321044921875, "global_step": 335354, "epoch": 4040} {"train_loss": -26.330463409423828, "global_step": 335355, "epoch": 4040} {"train_loss": -26.586933135986328, "global_step": 335356, "epoch": 4040} {"train_loss": -26.216266632080078, "global_step": 335357, "epoch": 4040} {"train_loss": -26.458322525024414, "global_step": 335358, "epoch": 4040} {"train_loss": -26.148086547851562, "global_step": 335359, "epoch": 4040} {"train_loss": -26.15403175354004, "global_step": 335360, "epoch": 4040} {"train_loss": -26.183332443237305, "global_step": 335361, "epoch": 4040} {"train_loss": -26.210256576538086, "global_step": 335362, "epoch": 4040} {"train_loss": -25.94308853149414, "global_step": 335363, "epoch": 4040} {"train_loss": -25.855321884155273, "global_step": 335364, "epoch": 4040} {"train_loss": -26.028268814086914, "global_step": 335365, "epoch": 4040} {"train_loss": -26.009496688842773, "global_step": 335366, "epoch": 4040} {"train_loss": -26.07879066467285, "global_step": 335367, "epoch": 4040} {"train_loss": -26.13886833190918, "global_step": 335368, "epoch": 4040} {"train_loss": -25.9197998046875, "global_step": 335369, "epoch": 4040} {"train_loss": -26.25588035583496, "global_step": 335370, "epoch": 4040} {"train_loss": -25.949661254882812, "global_step": 335371, "epoch": 4040} {"train_loss": -25.937591552734375, "global_step": 335372, "epoch": 4040} {"train_loss": -26.286731719970703, "global_step": 335373, "epoch": 4040} {"train_loss": -25.955249786376953, "global_step": 335374, "epoch": 4040} {"train_loss": -26.537988662719727, "global_step": 335375, "epoch": 4040} {"train_loss": -26.113544464111328, "global_step": 335376, "epoch": 4040} {"train_loss": -25.8619441986084, "global_step": 335377, "epoch": 4040} {"train_loss": -26.202844619750977, "global_step": 335378, "epoch": 4040} {"train_loss": -26.1053524017334, "global_step": 335379, "epoch": 4040} {"train_loss": -26.119384765625, "global_step": 335380, "epoch": 4040} {"train_loss": -25.95256996154785, "global_step": 335381, "epoch": 4040} {"train_loss": -25.99814224243164, "global_step": 335382, "epoch": 4040} {"train_loss": -25.725961685180664, "global_step": 335383, "epoch": 4040} {"train_loss": -25.560142517089844, "global_step": 335384, "epoch": 4040} {"train_loss": -26.25946617126465, "global_step": 335385, "epoch": 4040} {"train_loss": -26.051639556884766, "global_step": 335386, "epoch": 4040} {"train_loss": -25.74141502380371, "global_step": 335387, "epoch": 4040} {"train_loss": -25.884366989135742, "global_step": 335388, "epoch": 4040} {"train_loss": -25.869937896728516, "global_step": 335389, "epoch": 4040} {"train_loss": -25.95454978942871, "global_step": 335390, "epoch": 4040} {"train_loss": -25.603235244750977, "global_step": 335391, "epoch": 4040} {"train_loss": -25.88115882873535, "global_step": 335392, "epoch": 4040} {"train_loss": -25.82332420349121, "global_step": 335393, "epoch": 4040} {"train_loss": -26.07293701171875, "global_step": 335394, "epoch": 4040} {"train_loss": -25.909961700439453, "global_step": 335395, "epoch": 4040} {"train_loss": -25.849706649780273, "global_step": 335396, "epoch": 4040} {"train_loss": -25.761228561401367, "global_step": 335397, "epoch": 4040} {"train_loss": -26.134063720703125, "global_step": 335398, "epoch": 4040} {"train_loss": -26.194137573242188, "global_step": 335399, "epoch": 4040} {"train_loss": -26.169208526611328, "global_step": 335400, "epoch": 4040} {"train_loss": -25.716552734375, "global_step": 335401, "epoch": 4040} {"train_loss": -26.0074073148061, "global_step": 335402, "epoch": 4040, "val_loss": 6639511.0} {"train_loss": -25.56098747253418, "global_step": 335403, "epoch": 4041} {"train_loss": -25.600934982299805, "global_step": 335404, "epoch": 4041} {"train_loss": -25.936298370361328, "global_step": 335405, "epoch": 4041} {"train_loss": -25.65690040588379, "global_step": 335406, "epoch": 4041} {"train_loss": -25.464323043823242, "global_step": 335407, "epoch": 4041} {"train_loss": -25.785858154296875, "global_step": 335408, "epoch": 4041} {"train_loss": -25.6911563873291, "global_step": 335409, "epoch": 4041} {"train_loss": -25.708023071289062, "global_step": 335410, "epoch": 4041} {"train_loss": -25.56679344177246, "global_step": 335411, "epoch": 4041} {"train_loss": -25.79416847229004, "global_step": 335412, "epoch": 4041} {"train_loss": -25.969640731811523, "global_step": 335413, "epoch": 4041} {"train_loss": -25.845727920532227, "global_step": 335414, "epoch": 4041} {"train_loss": -25.700592041015625, "global_step": 335415, "epoch": 4041} {"train_loss": -26.042383193969727, "global_step": 335416, "epoch": 4041} {"train_loss": -25.900121688842773, "global_step": 335417, "epoch": 4041} {"train_loss": -25.971540451049805, "global_step": 335418, "epoch": 4041} {"train_loss": -26.284168243408203, "global_step": 335419, "epoch": 4041} {"train_loss": -26.052783966064453, "global_step": 335420, "epoch": 4041} {"train_loss": -26.197187423706055, "global_step": 335421, "epoch": 4041} {"train_loss": -26.193588256835938, "global_step": 335422, "epoch": 4041} {"train_loss": -26.116870880126953, "global_step": 335423, "epoch": 4041} {"train_loss": -25.869775772094727, "global_step": 335424, "epoch": 4041} {"train_loss": -25.622894287109375, "global_step": 335425, "epoch": 4041} {"train_loss": -25.705142974853516, "global_step": 335426, "epoch": 4041} {"train_loss": -26.062347412109375, "global_step": 335427, "epoch": 4041} {"train_loss": -26.064167022705078, "global_step": 335428, "epoch": 4041} {"train_loss": -26.01076316833496, "global_step": 335429, "epoch": 4041} {"train_loss": -26.1348819732666, "global_step": 335430, "epoch": 4041} {"train_loss": -26.07801628112793, "global_step": 335431, "epoch": 4041} {"train_loss": -25.865339279174805, "global_step": 335432, "epoch": 4041} {"train_loss": -26.005430221557617, "global_step": 335433, "epoch": 4041} {"train_loss": -26.18900489807129, "global_step": 335434, "epoch": 4041} {"train_loss": -26.332263946533203, "global_step": 335435, "epoch": 4041} {"train_loss": -26.077356338500977, "global_step": 335436, "epoch": 4041} {"train_loss": -26.282373428344727, "global_step": 335437, "epoch": 4041} {"train_loss": -26.149396896362305, "global_step": 335438, "epoch": 4041} {"train_loss": -25.98577880859375, "global_step": 335439, "epoch": 4041} {"train_loss": -26.032697677612305, "global_step": 335440, "epoch": 4041} {"train_loss": -25.779993057250977, "global_step": 335441, "epoch": 4041} {"train_loss": -25.710357666015625, "global_step": 335442, "epoch": 4041} {"train_loss": -25.727848052978516, "global_step": 335443, "epoch": 4041} {"train_loss": -26.348133087158203, "global_step": 335444, "epoch": 4041} {"train_loss": -25.716955184936523, "global_step": 335445, "epoch": 4041} {"train_loss": -25.7043514251709, "global_step": 335446, "epoch": 4041} {"train_loss": -25.19703483581543, "global_step": 335447, "epoch": 4041} {"train_loss": -25.387283325195312, "global_step": 335448, "epoch": 4041} {"train_loss": -25.618274688720703, "global_step": 335449, "epoch": 4041} {"train_loss": -25.858417510986328, "global_step": 335450, "epoch": 4041} {"train_loss": -25.543418884277344, "global_step": 335451, "epoch": 4041} {"train_loss": -26.0413875579834, "global_step": 335452, "epoch": 4041} {"train_loss": -26.032861709594727, "global_step": 335453, "epoch": 4041} {"train_loss": -25.203617095947266, "global_step": 335454, "epoch": 4041} {"train_loss": -25.46877098083496, "global_step": 335455, "epoch": 4041} {"train_loss": -25.900070190429688, "global_step": 335456, "epoch": 4041} {"train_loss": -25.979528427124023, "global_step": 335457, "epoch": 4041} {"train_loss": -25.819639205932617, "global_step": 335458, "epoch": 4041} {"train_loss": -26.10980224609375, "global_step": 335459, "epoch": 4041} {"train_loss": -25.96004295349121, "global_step": 335460, "epoch": 4041} {"train_loss": -25.904895782470703, "global_step": 335461, "epoch": 4041} {"train_loss": -26.0257568359375, "global_step": 335462, "epoch": 4041} {"train_loss": -25.94365882873535, "global_step": 335463, "epoch": 4041} {"train_loss": -26.0889892578125, "global_step": 335464, "epoch": 4041} {"train_loss": -25.994354248046875, "global_step": 335465, "epoch": 4041} {"train_loss": -25.913227081298828, "global_step": 335466, "epoch": 4041} {"train_loss": -26.511133193969727, "global_step": 335467, "epoch": 4041} {"train_loss": -25.925073623657227, "global_step": 335468, "epoch": 4041} {"train_loss": -26.124256134033203, "global_step": 335469, "epoch": 4041} {"train_loss": -25.73455810546875, "global_step": 335470, "epoch": 4041} {"train_loss": -25.95734977722168, "global_step": 335471, "epoch": 4041} {"train_loss": -26.23990821838379, "global_step": 335472, "epoch": 4041} {"train_loss": -25.938507080078125, "global_step": 335473, "epoch": 4041} {"train_loss": -25.909391403198242, "global_step": 335474, "epoch": 4041} {"train_loss": -25.942996978759766, "global_step": 335475, "epoch": 4041} {"train_loss": -25.92072868347168, "global_step": 335476, "epoch": 4041} {"train_loss": -26.2750186920166, "global_step": 335477, "epoch": 4041} {"train_loss": -26.093290328979492, "global_step": 335478, "epoch": 4041} {"train_loss": -26.19282341003418, "global_step": 335479, "epoch": 4041} {"train_loss": -25.96026039123535, "global_step": 335480, "epoch": 4041} {"train_loss": -26.477731704711914, "global_step": 335481, "epoch": 4041} {"train_loss": -26.16177749633789, "global_step": 335482, "epoch": 4041} {"train_loss": -26.140247344970703, "global_step": 335483, "epoch": 4041} {"train_loss": -25.7686710357666, "global_step": 335484, "epoch": 4041} {"train_loss": -25.93056968321283, "global_step": 335485, "epoch": 4041, "val_loss": 6694882.0} {"train_loss": -25.330459594726562, "global_step": 335486, "epoch": 4042} {"train_loss": -25.36187744140625, "global_step": 335487, "epoch": 4042} {"train_loss": -25.173017501831055, "global_step": 335488, "epoch": 4042} {"train_loss": -24.736059188842773, "global_step": 335489, "epoch": 4042} {"train_loss": -25.025693893432617, "global_step": 335490, "epoch": 4042} {"train_loss": -25.5062313079834, "global_step": 335491, "epoch": 4042} {"train_loss": -25.417591094970703, "global_step": 335492, "epoch": 4042} {"train_loss": -25.03009796142578, "global_step": 335493, "epoch": 4042} {"train_loss": -25.010120391845703, "global_step": 335494, "epoch": 4042} {"train_loss": -25.75693130493164, "global_step": 335495, "epoch": 4042} {"train_loss": -25.27176284790039, "global_step": 335496, "epoch": 4042} {"train_loss": -25.317190170288086, "global_step": 335497, "epoch": 4042} {"train_loss": -25.436798095703125, "global_step": 335498, "epoch": 4042} {"train_loss": -25.7093563079834, "global_step": 335499, "epoch": 4042} {"train_loss": -25.58588218688965, "global_step": 335500, "epoch": 4042} {"train_loss": -25.58699607849121, "global_step": 335501, "epoch": 4042} {"train_loss": -25.25198745727539, "global_step": 335502, "epoch": 4042} {"train_loss": -25.60438346862793, "global_step": 335503, "epoch": 4042} {"train_loss": -25.57770347595215, "global_step": 335504, "epoch": 4042} {"train_loss": -25.874597549438477, "global_step": 335505, "epoch": 4042} {"train_loss": -25.771499633789062, "global_step": 335506, "epoch": 4042} {"train_loss": -26.01771354675293, "global_step": 335507, "epoch": 4042} {"train_loss": -25.851123809814453, "global_step": 335508, "epoch": 4042} {"train_loss": -25.68204116821289, "global_step": 335509, "epoch": 4042} {"train_loss": -26.013525009155273, "global_step": 335510, "epoch": 4042} {"train_loss": -25.733154296875, "global_step": 335511, "epoch": 4042} {"train_loss": -25.963886260986328, "global_step": 335512, "epoch": 4042} {"train_loss": -26.3946533203125, "global_step": 335513, "epoch": 4042} {"train_loss": -25.6815128326416, "global_step": 335514, "epoch": 4042} {"train_loss": -26.001928329467773, "global_step": 335515, "epoch": 4042} {"train_loss": -25.92506980895996, "global_step": 335516, "epoch": 4042} {"train_loss": -25.75135612487793, "global_step": 335517, "epoch": 4042} {"train_loss": -25.981372833251953, "global_step": 335518, "epoch": 4042} {"train_loss": -25.89216423034668, "global_step": 335519, "epoch": 4042} {"train_loss": -26.105436325073242, "global_step": 335520, "epoch": 4042} {"train_loss": -25.634464263916016, "global_step": 335521, "epoch": 4042} {"train_loss": -26.22134780883789, "global_step": 335522, "epoch": 4042} {"train_loss": -25.94685173034668, "global_step": 335523, "epoch": 4042} {"train_loss": -26.174102783203125, "global_step": 335524, "epoch": 4042} {"train_loss": -25.818063735961914, "global_step": 335525, "epoch": 4042} {"train_loss": -26.098169326782227, "global_step": 335526, "epoch": 4042} {"train_loss": -26.032611846923828, "global_step": 335527, "epoch": 4042} {"train_loss": -26.410388946533203, "global_step": 335528, "epoch": 4042} {"train_loss": -26.14812660217285, "global_step": 335529, "epoch": 4042} {"train_loss": -26.2657413482666, "global_step": 335530, "epoch": 4042} {"train_loss": -26.256988525390625, "global_step": 335531, "epoch": 4042} {"train_loss": -26.14666748046875, "global_step": 335532, "epoch": 4042} {"train_loss": -25.62099266052246, "global_step": 335533, "epoch": 4042} {"train_loss": -26.244998931884766, "global_step": 335534, "epoch": 4042} {"train_loss": -25.9538516998291, "global_step": 335535, "epoch": 4042} {"train_loss": -25.656824111938477, "global_step": 335536, "epoch": 4042} {"train_loss": -25.979450225830078, "global_step": 335537, "epoch": 4042} {"train_loss": -25.854944229125977, "global_step": 335538, "epoch": 4042} {"train_loss": -25.844898223876953, "global_step": 335539, "epoch": 4042} {"train_loss": -25.6683406829834, "global_step": 335540, "epoch": 4042} {"train_loss": -25.9779052734375, "global_step": 335541, "epoch": 4042} {"train_loss": -25.7617130279541, "global_step": 335542, "epoch": 4042} {"train_loss": -25.984731674194336, "global_step": 335543, "epoch": 4042} {"train_loss": -26.34998893737793, "global_step": 335544, "epoch": 4042} {"train_loss": -26.084325790405273, "global_step": 335545, "epoch": 4042} {"train_loss": -25.977888107299805, "global_step": 335546, "epoch": 4042} {"train_loss": -26.36274528503418, "global_step": 335547, "epoch": 4042} {"train_loss": -26.123579025268555, "global_step": 335548, "epoch": 4042} {"train_loss": -26.182226181030273, "global_step": 335549, "epoch": 4042} {"train_loss": -26.200031280517578, "global_step": 335550, "epoch": 4042} {"train_loss": -26.1129207611084, "global_step": 335551, "epoch": 4042} {"train_loss": -25.998584747314453, "global_step": 335552, "epoch": 4042} {"train_loss": -25.92841148376465, "global_step": 335553, "epoch": 4042} {"train_loss": -26.00811195373535, "global_step": 335554, "epoch": 4042} {"train_loss": -26.08125877380371, "global_step": 335555, "epoch": 4042} {"train_loss": -26.34929847717285, "global_step": 335556, "epoch": 4042} {"train_loss": -26.60162353515625, "global_step": 335557, "epoch": 4042} {"train_loss": -26.333709716796875, "global_step": 335558, "epoch": 4042} {"train_loss": -26.132965087890625, "global_step": 335559, "epoch": 4042} {"train_loss": -25.779356002807617, "global_step": 335560, "epoch": 4042} {"train_loss": -26.395246505737305, "global_step": 335561, "epoch": 4042} {"train_loss": -26.256811141967773, "global_step": 335562, "epoch": 4042} {"train_loss": -26.579938888549805, "global_step": 335563, "epoch": 4042} {"train_loss": -26.5756893157959, "global_step": 335564, "epoch": 4042} {"train_loss": -25.615650177001953, "global_step": 335565, "epoch": 4042} {"train_loss": -25.574087142944336, "global_step": 335566, "epoch": 4042} {"train_loss": -26.20111656188965, "global_step": 335567, "epoch": 4042} {"train_loss": -25.877925826842528, "global_step": 335568, "epoch": 4042, "val_loss": 6717057.5} {"train_loss": -24.635990142822266, "global_step": 335569, "epoch": 4043} {"train_loss": -23.048892974853516, "global_step": 335570, "epoch": 4043} {"train_loss": -24.18234634399414, "global_step": 335571, "epoch": 4043} {"train_loss": -24.205562591552734, "global_step": 335572, "epoch": 4043} {"train_loss": -24.948205947875977, "global_step": 335573, "epoch": 4043} {"train_loss": -24.071741104125977, "global_step": 335574, "epoch": 4043} {"train_loss": -24.836023330688477, "global_step": 335575, "epoch": 4043} {"train_loss": -25.062158584594727, "global_step": 335576, "epoch": 4043} {"train_loss": -24.927860260009766, "global_step": 335577, "epoch": 4043} {"train_loss": -25.249897003173828, "global_step": 335578, "epoch": 4043} {"train_loss": -25.300048828125, "global_step": 335579, "epoch": 4043} {"train_loss": -25.2395076751709, "global_step": 335580, "epoch": 4043} {"train_loss": -25.516504287719727, "global_step": 335581, "epoch": 4043} {"train_loss": -25.316572189331055, "global_step": 335582, "epoch": 4043} {"train_loss": -24.834348678588867, "global_step": 335583, "epoch": 4043} {"train_loss": -25.36895751953125, "global_step": 335584, "epoch": 4043} {"train_loss": -24.931333541870117, "global_step": 335585, "epoch": 4043} {"train_loss": -25.62324333190918, "global_step": 335586, "epoch": 4043} {"train_loss": -25.102354049682617, "global_step": 335587, "epoch": 4043} {"train_loss": -25.75880241394043, "global_step": 335588, "epoch": 4043} {"train_loss": -25.594057083129883, "global_step": 335589, "epoch": 4043} {"train_loss": -25.293987274169922, "global_step": 335590, "epoch": 4043} {"train_loss": -25.572559356689453, "global_step": 335591, "epoch": 4043} {"train_loss": -25.313920974731445, "global_step": 335592, "epoch": 4043} {"train_loss": -25.955642700195312, "global_step": 335593, "epoch": 4043} {"train_loss": -25.44021987915039, "global_step": 335594, "epoch": 4043} {"train_loss": -25.429140090942383, "global_step": 335595, "epoch": 4043} {"train_loss": -25.39145278930664, "global_step": 335596, "epoch": 4043} {"train_loss": -26.099411010742188, "global_step": 335597, "epoch": 4043} {"train_loss": -25.765979766845703, "global_step": 335598, "epoch": 4043} {"train_loss": -26.001691818237305, "global_step": 335599, "epoch": 4043} {"train_loss": -26.1074275970459, "global_step": 335600, "epoch": 4043} {"train_loss": -25.785741806030273, "global_step": 335601, "epoch": 4043} {"train_loss": -25.79575538635254, "global_step": 335602, "epoch": 4043} {"train_loss": -25.677221298217773, "global_step": 335603, "epoch": 4043} {"train_loss": -25.52315330505371, "global_step": 335604, "epoch": 4043} {"train_loss": -26.261005401611328, "global_step": 335605, "epoch": 4043} {"train_loss": -25.883207321166992, "global_step": 335606, "epoch": 4043} {"train_loss": -25.681726455688477, "global_step": 335607, "epoch": 4043} {"train_loss": -26.04597282409668, "global_step": 335608, "epoch": 4043} {"train_loss": -26.015689849853516, "global_step": 335609, "epoch": 4043} {"train_loss": -26.014074325561523, "global_step": 335610, "epoch": 4043} {"train_loss": -26.183517456054688, "global_step": 335611, "epoch": 4043} {"train_loss": -25.937854766845703, "global_step": 335612, "epoch": 4043} {"train_loss": -26.255483627319336, "global_step": 335613, "epoch": 4043} {"train_loss": -26.535552978515625, "global_step": 335614, "epoch": 4043} {"train_loss": -25.744718551635742, "global_step": 335615, "epoch": 4043} {"train_loss": -26.254194259643555, "global_step": 335616, "epoch": 4043} {"train_loss": -26.3409366607666, "global_step": 335617, "epoch": 4043} {"train_loss": -26.09124755859375, "global_step": 335618, "epoch": 4043} {"train_loss": -25.91033935546875, "global_step": 335619, "epoch": 4043} {"train_loss": -26.1517391204834, "global_step": 335620, "epoch": 4043} {"train_loss": -25.934141159057617, "global_step": 335621, "epoch": 4043} {"train_loss": -25.6307430267334, "global_step": 335622, "epoch": 4043} {"train_loss": -25.63812828063965, "global_step": 335623, "epoch": 4043} {"train_loss": -26.00873374938965, "global_step": 335624, "epoch": 4043} {"train_loss": -25.934843063354492, "global_step": 335625, "epoch": 4043} {"train_loss": -25.8485050201416, "global_step": 335626, "epoch": 4043} {"train_loss": -26.027257919311523, "global_step": 335627, "epoch": 4043} {"train_loss": -26.2473087310791, "global_step": 335628, "epoch": 4043} {"train_loss": -25.899372100830078, "global_step": 335629, "epoch": 4043} {"train_loss": -26.01362419128418, "global_step": 335630, "epoch": 4043} {"train_loss": -26.085004806518555, "global_step": 335631, "epoch": 4043} {"train_loss": -26.130640029907227, "global_step": 335632, "epoch": 4043} {"train_loss": -26.4918155670166, "global_step": 335633, "epoch": 4043} {"train_loss": -26.143497467041016, "global_step": 335634, "epoch": 4043} {"train_loss": -26.1686954498291, "global_step": 335635, "epoch": 4043} {"train_loss": -26.293975830078125, "global_step": 335636, "epoch": 4043} {"train_loss": -26.08623695373535, "global_step": 335637, "epoch": 4043} {"train_loss": -26.18813133239746, "global_step": 335638, "epoch": 4043} {"train_loss": -25.845117568969727, "global_step": 335639, "epoch": 4043} {"train_loss": -25.987768173217773, "global_step": 335640, "epoch": 4043} {"train_loss": -26.223346710205078, "global_step": 335641, "epoch": 4043} {"train_loss": -26.348983764648438, "global_step": 335642, "epoch": 4043} {"train_loss": -25.96880531311035, "global_step": 335643, "epoch": 4043} {"train_loss": -26.16888427734375, "global_step": 335644, "epoch": 4043} {"train_loss": -26.415552139282227, "global_step": 335645, "epoch": 4043} {"train_loss": -26.08711814880371, "global_step": 335646, "epoch": 4043} {"train_loss": -26.116291046142578, "global_step": 335647, "epoch": 4043} {"train_loss": -26.1179256439209, "global_step": 335648, "epoch": 4043} {"train_loss": -25.883981704711914, "global_step": 335649, "epoch": 4043} {"train_loss": -26.29180908203125, "global_step": 335650, "epoch": 4043} {"train_loss": -25.72540747401226, "global_step": 335651, "epoch": 4043, "val_loss": 6775845.5} {"train_loss": -26.388874053955078, "global_step": 335652, "epoch": 4044} {"train_loss": -25.846851348876953, "global_step": 335653, "epoch": 4044} {"train_loss": -25.85684585571289, "global_step": 335654, "epoch": 4044} {"train_loss": -25.708837509155273, "global_step": 335655, "epoch": 4044} {"train_loss": -26.059667587280273, "global_step": 335656, "epoch": 4044} {"train_loss": -25.9517822265625, "global_step": 335657, "epoch": 4044} {"train_loss": -25.708539962768555, "global_step": 335658, "epoch": 4044} {"train_loss": -26.059619903564453, "global_step": 335659, "epoch": 4044} {"train_loss": -26.07378578186035, "global_step": 335660, "epoch": 4044} {"train_loss": -25.956518173217773, "global_step": 335661, "epoch": 4044} {"train_loss": -26.061368942260742, "global_step": 335662, "epoch": 4044} {"train_loss": -25.87875747680664, "global_step": 335663, "epoch": 4044} {"train_loss": -25.75729751586914, "global_step": 335664, "epoch": 4044} {"train_loss": -25.952451705932617, "global_step": 335665, "epoch": 4044} {"train_loss": -25.886640548706055, "global_step": 335666, "epoch": 4044} {"train_loss": -25.7082576751709, "global_step": 335667, "epoch": 4044} {"train_loss": -25.997909545898438, "global_step": 335668, "epoch": 4044} {"train_loss": -26.003223419189453, "global_step": 335669, "epoch": 4044} {"train_loss": -26.379247665405273, "global_step": 335670, "epoch": 4044} {"train_loss": -25.779296875, "global_step": 335671, "epoch": 4044} {"train_loss": -26.11113929748535, "global_step": 335672, "epoch": 4044} {"train_loss": -25.956769943237305, "global_step": 335673, "epoch": 4044} {"train_loss": -26.08429527282715, "global_step": 335674, "epoch": 4044} {"train_loss": -26.005390167236328, "global_step": 335675, "epoch": 4044} {"train_loss": -26.260847091674805, "global_step": 335676, "epoch": 4044} {"train_loss": -25.86368179321289, "global_step": 335677, "epoch": 4044} {"train_loss": -25.764419555664062, "global_step": 335678, "epoch": 4044} {"train_loss": -26.17780113220215, "global_step": 335679, "epoch": 4044} {"train_loss": -25.753345489501953, "global_step": 335680, "epoch": 4044} {"train_loss": -26.025739669799805, "global_step": 335681, "epoch": 4044} {"train_loss": -26.34279441833496, "global_step": 335682, "epoch": 4044} {"train_loss": -25.96587562561035, "global_step": 335683, "epoch": 4044} {"train_loss": -26.451324462890625, "global_step": 335684, "epoch": 4044} {"train_loss": -26.049606323242188, "global_step": 335685, "epoch": 4044} {"train_loss": -26.311140060424805, "global_step": 335686, "epoch": 4044} {"train_loss": -25.891523361206055, "global_step": 335687, "epoch": 4044} {"train_loss": -26.299230575561523, "global_step": 335688, "epoch": 4044} {"train_loss": -26.213424682617188, "global_step": 335689, "epoch": 4044} {"train_loss": -26.215070724487305, "global_step": 335690, "epoch": 4044} {"train_loss": -26.211292266845703, "global_step": 335691, "epoch": 4044} {"train_loss": -26.574979782104492, "global_step": 335692, "epoch": 4044} {"train_loss": -26.354049682617188, "global_step": 335693, "epoch": 4044} {"train_loss": -25.996204376220703, "global_step": 335694, "epoch": 4044} {"train_loss": -26.19862937927246, "global_step": 335695, "epoch": 4044} {"train_loss": -26.099103927612305, "global_step": 335696, "epoch": 4044} {"train_loss": -26.23597526550293, "global_step": 335697, "epoch": 4044} {"train_loss": -25.793399810791016, "global_step": 335698, "epoch": 4044} {"train_loss": -25.648651123046875, "global_step": 335699, "epoch": 4044} {"train_loss": -25.32270050048828, "global_step": 335700, "epoch": 4044} {"train_loss": -25.232746124267578, "global_step": 335701, "epoch": 4044} {"train_loss": -24.881052017211914, "global_step": 335702, "epoch": 4044} {"train_loss": -25.56570053100586, "global_step": 335703, "epoch": 4044} {"train_loss": -26.209386825561523, "global_step": 335704, "epoch": 4044} {"train_loss": -25.86493492126465, "global_step": 335705, "epoch": 4044} {"train_loss": -25.6903018951416, "global_step": 335706, "epoch": 4044} {"train_loss": -25.84464454650879, "global_step": 335707, "epoch": 4044} {"train_loss": -25.91162109375, "global_step": 335708, "epoch": 4044} {"train_loss": -25.66175651550293, "global_step": 335709, "epoch": 4044} {"train_loss": -25.9722843170166, "global_step": 335710, "epoch": 4044} {"train_loss": -25.941822052001953, "global_step": 335711, "epoch": 4044} {"train_loss": -26.154743194580078, "global_step": 335712, "epoch": 4044} {"train_loss": -26.07721519470215, "global_step": 335713, "epoch": 4044} {"train_loss": -26.041162490844727, "global_step": 335714, "epoch": 4044} {"train_loss": -25.608386993408203, "global_step": 335715, "epoch": 4044} {"train_loss": -25.925220489501953, "global_step": 335716, "epoch": 4044} {"train_loss": -25.929712295532227, "global_step": 335717, "epoch": 4044} {"train_loss": -26.32703971862793, "global_step": 335718, "epoch": 4044} {"train_loss": -25.70624351501465, "global_step": 335719, "epoch": 4044} {"train_loss": -25.484779357910156, "global_step": 335720, "epoch": 4044} {"train_loss": -25.841434478759766, "global_step": 335721, "epoch": 4044} {"train_loss": -26.14850425720215, "global_step": 335722, "epoch": 4044} {"train_loss": -26.432538986206055, "global_step": 335723, "epoch": 4044} {"train_loss": -26.24909019470215, "global_step": 335724, "epoch": 4044} {"train_loss": -25.699207305908203, "global_step": 335725, "epoch": 4044} {"train_loss": -26.2416934967041, "global_step": 335726, "epoch": 4044} {"train_loss": -26.04886245727539, "global_step": 335727, "epoch": 4044} {"train_loss": -26.108789443969727, "global_step": 335728, "epoch": 4044} {"train_loss": -26.158918380737305, "global_step": 335729, "epoch": 4044} {"train_loss": -26.11353874206543, "global_step": 335730, "epoch": 4044} {"train_loss": -25.82831382751465, "global_step": 335731, "epoch": 4044} {"train_loss": -25.790781021118164, "global_step": 335732, "epoch": 4044} {"train_loss": -25.950529098510742, "global_step": 335733, "epoch": 4044} {"train_loss": -25.98463897245476, "global_step": 335734, "epoch": 4044, "val_loss": 6671577.5} {"train_loss": -25.57010269165039, "global_step": 335735, "epoch": 4045} {"train_loss": -25.167865753173828, "global_step": 335736, "epoch": 4045} {"train_loss": -25.723663330078125, "global_step": 335737, "epoch": 4045} {"train_loss": -25.73075294494629, "global_step": 335738, "epoch": 4045} {"train_loss": -25.336139678955078, "global_step": 335739, "epoch": 4045} {"train_loss": -25.847763061523438, "global_step": 335740, "epoch": 4045} {"train_loss": -25.426700592041016, "global_step": 335741, "epoch": 4045} {"train_loss": -26.0064640045166, "global_step": 335742, "epoch": 4045} {"train_loss": -25.405410766601562, "global_step": 335743, "epoch": 4045} {"train_loss": -25.411117553710938, "global_step": 335744, "epoch": 4045} {"train_loss": -25.748579025268555, "global_step": 335745, "epoch": 4045} {"train_loss": -26.103271484375, "global_step": 335746, "epoch": 4045} {"train_loss": -25.837787628173828, "global_step": 335747, "epoch": 4045} {"train_loss": -25.739307403564453, "global_step": 335748, "epoch": 4045} {"train_loss": -26.098072052001953, "global_step": 335749, "epoch": 4045} {"train_loss": -25.86677360534668, "global_step": 335750, "epoch": 4045} {"train_loss": -25.837738037109375, "global_step": 335751, "epoch": 4045} {"train_loss": -25.953405380249023, "global_step": 335752, "epoch": 4045} {"train_loss": -25.841785430908203, "global_step": 335753, "epoch": 4045} {"train_loss": -25.963993072509766, "global_step": 335754, "epoch": 4045} {"train_loss": -25.823139190673828, "global_step": 335755, "epoch": 4045} {"train_loss": -26.02084732055664, "global_step": 335756, "epoch": 4045} {"train_loss": -26.236896514892578, "global_step": 335757, "epoch": 4045} {"train_loss": -26.12076759338379, "global_step": 335758, "epoch": 4045} {"train_loss": -26.117847442626953, "global_step": 335759, "epoch": 4045} {"train_loss": -25.91389274597168, "global_step": 335760, "epoch": 4045} {"train_loss": -26.130640029907227, "global_step": 335761, "epoch": 4045} {"train_loss": -25.952260971069336, "global_step": 335762, "epoch": 4045} {"train_loss": -26.022653579711914, "global_step": 335763, "epoch": 4045} {"train_loss": -25.915740966796875, "global_step": 335764, "epoch": 4045} {"train_loss": -26.0357666015625, "global_step": 335765, "epoch": 4045} {"train_loss": -26.183929443359375, "global_step": 335766, "epoch": 4045} {"train_loss": -26.192291259765625, "global_step": 335767, "epoch": 4045} {"train_loss": -26.418354034423828, "global_step": 335768, "epoch": 4045} {"train_loss": -26.274168014526367, "global_step": 335769, "epoch": 4045} {"train_loss": -26.372039794921875, "global_step": 335770, "epoch": 4045} {"train_loss": -26.08330726623535, "global_step": 335771, "epoch": 4045} {"train_loss": -26.16383171081543, "global_step": 335772, "epoch": 4045} {"train_loss": -26.007293701171875, "global_step": 335773, "epoch": 4045} {"train_loss": -26.119159698486328, "global_step": 335774, "epoch": 4045} {"train_loss": -26.32413673400879, "global_step": 335775, "epoch": 4045} {"train_loss": -26.47287368774414, "global_step": 335776, "epoch": 4045} {"train_loss": -25.85951042175293, "global_step": 335777, "epoch": 4045} {"train_loss": -26.224416732788086, "global_step": 335778, "epoch": 4045} {"train_loss": -26.4356632232666, "global_step": 335779, "epoch": 4045} {"train_loss": -25.81195640563965, "global_step": 335780, "epoch": 4045} {"train_loss": -26.53946876525879, "global_step": 335781, "epoch": 4045} {"train_loss": -26.256032943725586, "global_step": 335782, "epoch": 4045} {"train_loss": -26.028305053710938, "global_step": 335783, "epoch": 4045} {"train_loss": -26.206562042236328, "global_step": 335784, "epoch": 4045} {"train_loss": -26.29534912109375, "global_step": 335785, "epoch": 4045} {"train_loss": -26.298749923706055, "global_step": 335786, "epoch": 4045} {"train_loss": -26.09686851501465, "global_step": 335787, "epoch": 4045} {"train_loss": -25.65787696838379, "global_step": 335788, "epoch": 4045} {"train_loss": -26.219457626342773, "global_step": 335789, "epoch": 4045} {"train_loss": -25.206701278686523, "global_step": 335790, "epoch": 4045} {"train_loss": -26.249582290649414, "global_step": 335791, "epoch": 4045} {"train_loss": -25.755407333374023, "global_step": 335792, "epoch": 4045} {"train_loss": -25.76325035095215, "global_step": 335793, "epoch": 4045} {"train_loss": -25.51891326904297, "global_step": 335794, "epoch": 4045} {"train_loss": -25.667449951171875, "global_step": 335795, "epoch": 4045} {"train_loss": -25.623823165893555, "global_step": 335796, "epoch": 4045} {"train_loss": -26.289276123046875, "global_step": 335797, "epoch": 4045} {"train_loss": -25.797637939453125, "global_step": 335798, "epoch": 4045} {"train_loss": -26.09111976623535, "global_step": 335799, "epoch": 4045} {"train_loss": -25.705005645751953, "global_step": 335800, "epoch": 4045} {"train_loss": -26.16485595703125, "global_step": 335801, "epoch": 4045} {"train_loss": -26.209217071533203, "global_step": 335802, "epoch": 4045} {"train_loss": -25.969390869140625, "global_step": 335803, "epoch": 4045} {"train_loss": -25.873279571533203, "global_step": 335804, "epoch": 4045} {"train_loss": -26.072174072265625, "global_step": 335805, "epoch": 4045} {"train_loss": -26.157855987548828, "global_step": 335806, "epoch": 4045} {"train_loss": -26.407073974609375, "global_step": 335807, "epoch": 4045} {"train_loss": -26.0494384765625, "global_step": 335808, "epoch": 4045} {"train_loss": -25.904911041259766, "global_step": 335809, "epoch": 4045} {"train_loss": -26.209671020507812, "global_step": 335810, "epoch": 4045} {"train_loss": -25.91357421875, "global_step": 335811, "epoch": 4045} {"train_loss": -26.09504508972168, "global_step": 335812, "epoch": 4045} {"train_loss": -26.2785587310791, "global_step": 335813, "epoch": 4045} {"train_loss": -26.180850982666016, "global_step": 335814, "epoch": 4045} {"train_loss": -26.086698532104492, "global_step": 335815, "epoch": 4045} {"train_loss": -26.084640502929688, "global_step": 335816, "epoch": 4045} {"train_loss": -25.996834467692548, "global_step": 335817, "epoch": 4045, "val_loss": 6685389.0} {"train_loss": -25.85316276550293, "global_step": 335818, "epoch": 4046} {"train_loss": -25.23060417175293, "global_step": 335819, "epoch": 4046} {"train_loss": -25.384723663330078, "global_step": 335820, "epoch": 4046} {"train_loss": -25.563892364501953, "global_step": 335821, "epoch": 4046} {"train_loss": -25.603979110717773, "global_step": 335822, "epoch": 4046} {"train_loss": -24.83623504638672, "global_step": 335823, "epoch": 4046} {"train_loss": -25.279804229736328, "global_step": 335824, "epoch": 4046} {"train_loss": -25.422941207885742, "global_step": 335825, "epoch": 4046} {"train_loss": -25.476337432861328, "global_step": 335826, "epoch": 4046} {"train_loss": -25.39818572998047, "global_step": 335827, "epoch": 4046} {"train_loss": -26.137353897094727, "global_step": 335828, "epoch": 4046} {"train_loss": -25.804548263549805, "global_step": 335829, "epoch": 4046} {"train_loss": -26.028182983398438, "global_step": 335830, "epoch": 4046} {"train_loss": -25.932706832885742, "global_step": 335831, "epoch": 4046} {"train_loss": -25.81178092956543, "global_step": 335832, "epoch": 4046} {"train_loss": -25.534198760986328, "global_step": 335833, "epoch": 4046} {"train_loss": -26.03303337097168, "global_step": 335834, "epoch": 4046} {"train_loss": -25.931842803955078, "global_step": 335835, "epoch": 4046} {"train_loss": -25.815643310546875, "global_step": 335836, "epoch": 4046} {"train_loss": -26.068700790405273, "global_step": 335837, "epoch": 4046} {"train_loss": -25.993488311767578, "global_step": 335838, "epoch": 4046} {"train_loss": -25.930540084838867, "global_step": 335839, "epoch": 4046} {"train_loss": -26.228179931640625, "global_step": 335840, "epoch": 4046} {"train_loss": -26.104446411132812, "global_step": 335841, "epoch": 4046} {"train_loss": -26.217939376831055, "global_step": 335842, "epoch": 4046} {"train_loss": -26.078062057495117, "global_step": 335843, "epoch": 4046} {"train_loss": -25.976531982421875, "global_step": 335844, "epoch": 4046} {"train_loss": -26.39381217956543, "global_step": 335845, "epoch": 4046} {"train_loss": -25.961994171142578, "global_step": 335846, "epoch": 4046} {"train_loss": -25.938323974609375, "global_step": 335847, "epoch": 4046} {"train_loss": -25.968433380126953, "global_step": 335848, "epoch": 4046} {"train_loss": -26.09461784362793, "global_step": 335849, "epoch": 4046} {"train_loss": -26.221607208251953, "global_step": 335850, "epoch": 4046} {"train_loss": -26.21551513671875, "global_step": 335851, "epoch": 4046} {"train_loss": -25.9700984954834, "global_step": 335852, "epoch": 4046} {"train_loss": -26.19834327697754, "global_step": 335853, "epoch": 4046} {"train_loss": -26.45556640625, "global_step": 335854, "epoch": 4046} {"train_loss": -26.237781524658203, "global_step": 335855, "epoch": 4046} {"train_loss": -26.454755783081055, "global_step": 335856, "epoch": 4046} {"train_loss": -25.978551864624023, "global_step": 335857, "epoch": 4046} {"train_loss": -25.82549476623535, "global_step": 335858, "epoch": 4046} {"train_loss": -26.190444946289062, "global_step": 335859, "epoch": 4046} {"train_loss": -26.130542755126953, "global_step": 335860, "epoch": 4046} {"train_loss": -26.23133659362793, "global_step": 335861, "epoch": 4046} {"train_loss": -26.181903839111328, "global_step": 335862, "epoch": 4046} {"train_loss": -26.005910873413086, "global_step": 335863, "epoch": 4046} {"train_loss": -26.436634063720703, "global_step": 335864, "epoch": 4046} {"train_loss": -26.180988311767578, "global_step": 335865, "epoch": 4046} {"train_loss": -25.90883445739746, "global_step": 335866, "epoch": 4046} {"train_loss": -25.9405517578125, "global_step": 335867, "epoch": 4046} {"train_loss": -26.029150009155273, "global_step": 335868, "epoch": 4046} {"train_loss": -26.064640045166016, "global_step": 335869, "epoch": 4046} {"train_loss": -25.907751083374023, "global_step": 335870, "epoch": 4046} {"train_loss": -26.180999755859375, "global_step": 335871, "epoch": 4046} {"train_loss": -26.2690372467041, "global_step": 335872, "epoch": 4046} {"train_loss": -25.751432418823242, "global_step": 335873, "epoch": 4046} {"train_loss": -25.875219345092773, "global_step": 335874, "epoch": 4046} {"train_loss": -25.97930335998535, "global_step": 335875, "epoch": 4046} {"train_loss": -26.25115394592285, "global_step": 335876, "epoch": 4046} {"train_loss": -26.09515953063965, "global_step": 335877, "epoch": 4046} {"train_loss": -26.316436767578125, "global_step": 335878, "epoch": 4046} {"train_loss": -26.494409561157227, "global_step": 335879, "epoch": 4046} {"train_loss": -25.988723754882812, "global_step": 335880, "epoch": 4046} {"train_loss": -25.975006103515625, "global_step": 335881, "epoch": 4046} {"train_loss": -26.228830337524414, "global_step": 335882, "epoch": 4046} {"train_loss": -26.179834365844727, "global_step": 335883, "epoch": 4046} {"train_loss": -26.10541343688965, "global_step": 335884, "epoch": 4046} {"train_loss": -26.12744140625, "global_step": 335885, "epoch": 4046} {"train_loss": -26.123605728149414, "global_step": 335886, "epoch": 4046} {"train_loss": -26.111438751220703, "global_step": 335887, "epoch": 4046} {"train_loss": -25.57880973815918, "global_step": 335888, "epoch": 4046} {"train_loss": -25.91029930114746, "global_step": 335889, "epoch": 4046} {"train_loss": -26.104337692260742, "global_step": 335890, "epoch": 4046} {"train_loss": -26.001001358032227, "global_step": 335891, "epoch": 4046} {"train_loss": -25.816720962524414, "global_step": 335892, "epoch": 4046} {"train_loss": -25.685688018798828, "global_step": 335893, "epoch": 4046} {"train_loss": -25.9986515045166, "global_step": 335894, "epoch": 4046} {"train_loss": -26.219877243041992, "global_step": 335895, "epoch": 4046} {"train_loss": -26.230321884155273, "global_step": 335896, "epoch": 4046} {"train_loss": -26.013288497924805, "global_step": 335897, "epoch": 4046} {"train_loss": -25.359365463256836, "global_step": 335898, "epoch": 4046} {"train_loss": -25.809720993041992, "global_step": 335899, "epoch": 4046} {"train_loss": -25.963435827967633, "global_step": 335900, "epoch": 4046, "val_loss": 6679619.0} {"train_loss": -25.601715087890625, "global_step": 335901, "epoch": 4047} {"train_loss": -25.607654571533203, "global_step": 335902, "epoch": 4047} {"train_loss": -25.500328063964844, "global_step": 335903, "epoch": 4047} {"train_loss": -25.447113037109375, "global_step": 335904, "epoch": 4047} {"train_loss": -25.980222702026367, "global_step": 335905, "epoch": 4047} {"train_loss": -25.50493049621582, "global_step": 335906, "epoch": 4047} {"train_loss": -25.735620498657227, "global_step": 335907, "epoch": 4047} {"train_loss": -25.069196701049805, "global_step": 335908, "epoch": 4047} {"train_loss": -26.067514419555664, "global_step": 335909, "epoch": 4047} {"train_loss": -25.606916427612305, "global_step": 335910, "epoch": 4047} {"train_loss": -26.044727325439453, "global_step": 335911, "epoch": 4047} {"train_loss": -25.656051635742188, "global_step": 335912, "epoch": 4047} {"train_loss": -26.053808212280273, "global_step": 335913, "epoch": 4047} {"train_loss": -25.715301513671875, "global_step": 335914, "epoch": 4047} {"train_loss": -25.456504821777344, "global_step": 335915, "epoch": 4047} {"train_loss": -26.051660537719727, "global_step": 335916, "epoch": 4047} {"train_loss": -25.886627197265625, "global_step": 335917, "epoch": 4047} {"train_loss": -25.978586196899414, "global_step": 335918, "epoch": 4047} {"train_loss": -25.867040634155273, "global_step": 335919, "epoch": 4047} {"train_loss": -26.21331214904785, "global_step": 335920, "epoch": 4047} {"train_loss": -25.955493927001953, "global_step": 335921, "epoch": 4047} {"train_loss": -26.16326904296875, "global_step": 335922, "epoch": 4047} {"train_loss": -25.67072105407715, "global_step": 335923, "epoch": 4047} {"train_loss": -25.8662052154541, "global_step": 335924, "epoch": 4047} {"train_loss": -26.495742797851562, "global_step": 335925, "epoch": 4047} {"train_loss": -25.90869140625, "global_step": 335926, "epoch": 4047} {"train_loss": -26.113056182861328, "global_step": 335927, "epoch": 4047} {"train_loss": -25.953216552734375, "global_step": 335928, "epoch": 4047} {"train_loss": -25.993940353393555, "global_step": 335929, "epoch": 4047} {"train_loss": -25.745243072509766, "global_step": 335930, "epoch": 4047} {"train_loss": -26.267759323120117, "global_step": 335931, "epoch": 4047} {"train_loss": -26.006383895874023, "global_step": 335932, "epoch": 4047} {"train_loss": -25.932641983032227, "global_step": 335933, "epoch": 4047} {"train_loss": -26.257978439331055, "global_step": 335934, "epoch": 4047} {"train_loss": -25.921960830688477, "global_step": 335935, "epoch": 4047} {"train_loss": -26.05414390563965, "global_step": 335936, "epoch": 4047} {"train_loss": -25.76275634765625, "global_step": 335937, "epoch": 4047} {"train_loss": -25.59478187561035, "global_step": 335938, "epoch": 4047} {"train_loss": -25.787540435791016, "global_step": 335939, "epoch": 4047} {"train_loss": -26.083707809448242, "global_step": 335940, "epoch": 4047} {"train_loss": -26.049081802368164, "global_step": 335941, "epoch": 4047} {"train_loss": -26.134504318237305, "global_step": 335942, "epoch": 4047} {"train_loss": -25.957569122314453, "global_step": 335943, "epoch": 4047} {"train_loss": -25.974512100219727, "global_step": 335944, "epoch": 4047} {"train_loss": -26.103973388671875, "global_step": 335945, "epoch": 4047} {"train_loss": -25.84492301940918, "global_step": 335946, "epoch": 4047} {"train_loss": -25.8009090423584, "global_step": 335947, "epoch": 4047} {"train_loss": -25.99407958984375, "global_step": 335948, "epoch": 4047} {"train_loss": -25.938251495361328, "global_step": 335949, "epoch": 4047} {"train_loss": -26.292402267456055, "global_step": 335950, "epoch": 4047} {"train_loss": -26.245468139648438, "global_step": 335951, "epoch": 4047} {"train_loss": -25.799161911010742, "global_step": 335952, "epoch": 4047} {"train_loss": -26.16592788696289, "global_step": 335953, "epoch": 4047} {"train_loss": -25.9350643157959, "global_step": 335954, "epoch": 4047} {"train_loss": -26.091949462890625, "global_step": 335955, "epoch": 4047} {"train_loss": -25.967914581298828, "global_step": 335956, "epoch": 4047} {"train_loss": -26.494565963745117, "global_step": 335957, "epoch": 4047} {"train_loss": -25.975692749023438, "global_step": 335958, "epoch": 4047} {"train_loss": -26.16659927368164, "global_step": 335959, "epoch": 4047} {"train_loss": -26.12030601501465, "global_step": 335960, "epoch": 4047} {"train_loss": -26.061254501342773, "global_step": 335961, "epoch": 4047} {"train_loss": -25.718168258666992, "global_step": 335962, "epoch": 4047} {"train_loss": -26.253772735595703, "global_step": 335963, "epoch": 4047} {"train_loss": -26.052717208862305, "global_step": 335964, "epoch": 4047} {"train_loss": -26.467823028564453, "global_step": 335965, "epoch": 4047} {"train_loss": -25.87250328063965, "global_step": 335966, "epoch": 4047} {"train_loss": -26.278722763061523, "global_step": 335967, "epoch": 4047} {"train_loss": -25.994781494140625, "global_step": 335968, "epoch": 4047} {"train_loss": -26.28089714050293, "global_step": 335969, "epoch": 4047} {"train_loss": -25.66078758239746, "global_step": 335970, "epoch": 4047} {"train_loss": -26.305561065673828, "global_step": 335971, "epoch": 4047} {"train_loss": -25.848676681518555, "global_step": 335972, "epoch": 4047} {"train_loss": -25.502567291259766, "global_step": 335973, "epoch": 4047} {"train_loss": -25.464141845703125, "global_step": 335974, "epoch": 4047} {"train_loss": -25.780088424682617, "global_step": 335975, "epoch": 4047} {"train_loss": -26.07637596130371, "global_step": 335976, "epoch": 4047} {"train_loss": -26.1814022064209, "global_step": 335977, "epoch": 4047} {"train_loss": -26.343210220336914, "global_step": 335978, "epoch": 4047} {"train_loss": -26.088361740112305, "global_step": 335979, "epoch": 4047} {"train_loss": -25.98408317565918, "global_step": 335980, "epoch": 4047} {"train_loss": -25.779211044311523, "global_step": 335981, "epoch": 4047} {"train_loss": -25.789663314819336, "global_step": 335982, "epoch": 4047} {"train_loss": -25.940848821617035, "global_step": 335983, "epoch": 4047, "val_loss": 6681664.5} {"train_loss": -25.63606834411621, "global_step": 335984, "epoch": 4048} {"train_loss": -25.273569107055664, "global_step": 335985, "epoch": 4048} {"train_loss": -25.873828887939453, "global_step": 335986, "epoch": 4048} {"train_loss": -25.71368980407715, "global_step": 335987, "epoch": 4048} {"train_loss": -25.501785278320312, "global_step": 335988, "epoch": 4048} {"train_loss": -25.978246688842773, "global_step": 335989, "epoch": 4048} {"train_loss": -25.959735870361328, "global_step": 335990, "epoch": 4048} {"train_loss": -25.4863224029541, "global_step": 335991, "epoch": 4048} {"train_loss": -26.0080509185791, "global_step": 335992, "epoch": 4048} {"train_loss": -25.698095321655273, "global_step": 335993, "epoch": 4048} {"train_loss": -25.716949462890625, "global_step": 335994, "epoch": 4048} {"train_loss": -25.8527889251709, "global_step": 335995, "epoch": 4048} {"train_loss": -26.148639678955078, "global_step": 335996, "epoch": 4048} {"train_loss": -26.10243034362793, "global_step": 335997, "epoch": 4048} {"train_loss": -25.743408203125, "global_step": 335998, "epoch": 4048} {"train_loss": -25.69185447692871, "global_step": 335999, "epoch": 4048} {"train_loss": -26.03369140625, "global_step": 336000, "epoch": 4048} {"train_loss": -25.951704025268555, "global_step": 336001, "epoch": 4048} {"train_loss": -26.09552574157715, "global_step": 336002, "epoch": 4048} {"train_loss": -26.016225814819336, "global_step": 336003, "epoch": 4048} {"train_loss": -26.060510635375977, "global_step": 336004, "epoch": 4048} {"train_loss": -26.0599365234375, "global_step": 336005, "epoch": 4048} {"train_loss": -26.204742431640625, "global_step": 336006, "epoch": 4048} {"train_loss": -26.024036407470703, "global_step": 336007, "epoch": 4048} {"train_loss": -25.818098068237305, "global_step": 336008, "epoch": 4048} {"train_loss": -25.8671875, "global_step": 336009, "epoch": 4048} {"train_loss": -25.92715835571289, "global_step": 336010, "epoch": 4048} {"train_loss": -26.10796546936035, "global_step": 336011, "epoch": 4048} {"train_loss": -25.668701171875, "global_step": 336012, "epoch": 4048} {"train_loss": -25.5968017578125, "global_step": 336013, "epoch": 4048} {"train_loss": -26.111547470092773, "global_step": 336014, "epoch": 4048} {"train_loss": -25.9589900970459, "global_step": 336015, "epoch": 4048} {"train_loss": -25.911046981811523, "global_step": 336016, "epoch": 4048} {"train_loss": -25.97784423828125, "global_step": 336017, "epoch": 4048} {"train_loss": -26.185230255126953, "global_step": 336018, "epoch": 4048} {"train_loss": -25.877599716186523, "global_step": 336019, "epoch": 4048} {"train_loss": -26.03742790222168, "global_step": 336020, "epoch": 4048} {"train_loss": -26.024921417236328, "global_step": 336021, "epoch": 4048} {"train_loss": -26.083770751953125, "global_step": 336022, "epoch": 4048} {"train_loss": -26.02154541015625, "global_step": 336023, "epoch": 4048} {"train_loss": -26.329694747924805, "global_step": 336024, "epoch": 4048} {"train_loss": -25.97955894470215, "global_step": 336025, "epoch": 4048} {"train_loss": -26.19939613342285, "global_step": 336026, "epoch": 4048} {"train_loss": -25.9979305267334, "global_step": 336027, "epoch": 4048} {"train_loss": -26.102981567382812, "global_step": 336028, "epoch": 4048} {"train_loss": -25.846771240234375, "global_step": 336029, "epoch": 4048} {"train_loss": -26.237512588500977, "global_step": 336030, "epoch": 4048} {"train_loss": -26.041669845581055, "global_step": 336031, "epoch": 4048} {"train_loss": -25.9476318359375, "global_step": 336032, "epoch": 4048} {"train_loss": -25.887399673461914, "global_step": 336033, "epoch": 4048} {"train_loss": -26.291030883789062, "global_step": 336034, "epoch": 4048} {"train_loss": -25.89483070373535, "global_step": 336035, "epoch": 4048} {"train_loss": -25.750457763671875, "global_step": 336036, "epoch": 4048} {"train_loss": -25.931379318237305, "global_step": 336037, "epoch": 4048} {"train_loss": -26.279006958007812, "global_step": 336038, "epoch": 4048} {"train_loss": -26.327224731445312, "global_step": 336039, "epoch": 4048} {"train_loss": -26.186304092407227, "global_step": 336040, "epoch": 4048} {"train_loss": -26.306812286376953, "global_step": 336041, "epoch": 4048} {"train_loss": -26.013608932495117, "global_step": 336042, "epoch": 4048} {"train_loss": -25.962371826171875, "global_step": 336043, "epoch": 4048} {"train_loss": -26.3823184967041, "global_step": 336044, "epoch": 4048} {"train_loss": -26.06027603149414, "global_step": 336045, "epoch": 4048} {"train_loss": -26.067279815673828, "global_step": 336046, "epoch": 4048} {"train_loss": -25.828596115112305, "global_step": 336047, "epoch": 4048} {"train_loss": -26.006994247436523, "global_step": 336048, "epoch": 4048} {"train_loss": -26.020727157592773, "global_step": 336049, "epoch": 4048} {"train_loss": -25.96490478515625, "global_step": 336050, "epoch": 4048} {"train_loss": -26.497989654541016, "global_step": 336051, "epoch": 4048} {"train_loss": -26.29852294921875, "global_step": 336052, "epoch": 4048} {"train_loss": -25.9695987701416, "global_step": 336053, "epoch": 4048} {"train_loss": -26.313947677612305, "global_step": 336054, "epoch": 4048} {"train_loss": -26.2665958404541, "global_step": 336055, "epoch": 4048} {"train_loss": -25.886056900024414, "global_step": 336056, "epoch": 4048} {"train_loss": -26.11298179626465, "global_step": 336057, "epoch": 4048} {"train_loss": -26.180618286132812, "global_step": 336058, "epoch": 4048} {"train_loss": -25.655532836914062, "global_step": 336059, "epoch": 4048} {"train_loss": -26.159143447875977, "global_step": 336060, "epoch": 4048} {"train_loss": -26.21173095703125, "global_step": 336061, "epoch": 4048} {"train_loss": -26.09735679626465, "global_step": 336062, "epoch": 4048} {"train_loss": -26.09258460998535, "global_step": 336063, "epoch": 4048} {"train_loss": -26.201627731323242, "global_step": 336064, "epoch": 4048} {"train_loss": -25.945829391479492, "global_step": 336065, "epoch": 4048} {"train_loss": -25.982025996748224, "global_step": 336066, "epoch": 4048, "val_loss": 6655703.0} {"train_loss": -25.35120964050293, "global_step": 336067, "epoch": 4049} {"train_loss": -25.15105628967285, "global_step": 336068, "epoch": 4049} {"train_loss": -25.82703971862793, "global_step": 336069, "epoch": 4049} {"train_loss": -25.46487045288086, "global_step": 336070, "epoch": 4049} {"train_loss": -25.524972915649414, "global_step": 336071, "epoch": 4049} {"train_loss": -25.261943817138672, "global_step": 336072, "epoch": 4049} {"train_loss": -25.174358367919922, "global_step": 336073, "epoch": 4049} {"train_loss": -24.88507652282715, "global_step": 336074, "epoch": 4049} {"train_loss": -25.419784545898438, "global_step": 336075, "epoch": 4049} {"train_loss": -25.8438663482666, "global_step": 336076, "epoch": 4049} {"train_loss": -25.654560089111328, "global_step": 336077, "epoch": 4049} {"train_loss": -25.58719825744629, "global_step": 336078, "epoch": 4049} {"train_loss": -25.63427734375, "global_step": 336079, "epoch": 4049} {"train_loss": -25.651498794555664, "global_step": 336080, "epoch": 4049} {"train_loss": -25.913305282592773, "global_step": 336081, "epoch": 4049} {"train_loss": -25.780324935913086, "global_step": 336082, "epoch": 4049} {"train_loss": -25.694549560546875, "global_step": 336083, "epoch": 4049} {"train_loss": -26.15057945251465, "global_step": 336084, "epoch": 4049} {"train_loss": -25.928457260131836, "global_step": 336085, "epoch": 4049} {"train_loss": -25.979894638061523, "global_step": 336086, "epoch": 4049} {"train_loss": -25.913183212280273, "global_step": 336087, "epoch": 4049} {"train_loss": -26.283130645751953, "global_step": 336088, "epoch": 4049} {"train_loss": -26.090423583984375, "global_step": 336089, "epoch": 4049} {"train_loss": -25.7652530670166, "global_step": 336090, "epoch": 4049} {"train_loss": -25.6307373046875, "global_step": 336091, "epoch": 4049} {"train_loss": -26.010297775268555, "global_step": 336092, "epoch": 4049} {"train_loss": -26.058923721313477, "global_step": 336093, "epoch": 4049} {"train_loss": -26.09248924255371, "global_step": 336094, "epoch": 4049} {"train_loss": -26.336252212524414, "global_step": 336095, "epoch": 4049} {"train_loss": -25.726947784423828, "global_step": 336096, "epoch": 4049} {"train_loss": -26.11040687561035, "global_step": 336097, "epoch": 4049} {"train_loss": -25.820789337158203, "global_step": 336098, "epoch": 4049} {"train_loss": -25.895557403564453, "global_step": 336099, "epoch": 4049} {"train_loss": -26.413007736206055, "global_step": 336100, "epoch": 4049} {"train_loss": -26.265623092651367, "global_step": 336101, "epoch": 4049} {"train_loss": -26.06808853149414, "global_step": 336102, "epoch": 4049} {"train_loss": -26.049375534057617, "global_step": 336103, "epoch": 4049} {"train_loss": -26.055089950561523, "global_step": 336104, "epoch": 4049} {"train_loss": -26.250288009643555, "global_step": 336105, "epoch": 4049} {"train_loss": -26.4217529296875, "global_step": 336106, "epoch": 4049} {"train_loss": -25.967182159423828, "global_step": 336107, "epoch": 4049} {"train_loss": -26.289764404296875, "global_step": 336108, "epoch": 4049} {"train_loss": -26.36374855041504, "global_step": 336109, "epoch": 4049} {"train_loss": -26.324445724487305, "global_step": 336110, "epoch": 4049} {"train_loss": -26.12212562561035, "global_step": 336111, "epoch": 4049} {"train_loss": -26.108978271484375, "global_step": 336112, "epoch": 4049} {"train_loss": -26.337228775024414, "global_step": 336113, "epoch": 4049} {"train_loss": -26.202917098999023, "global_step": 336114, "epoch": 4049} {"train_loss": -25.951934814453125, "global_step": 336115, "epoch": 4049} {"train_loss": -26.375106811523438, "global_step": 336116, "epoch": 4049} {"train_loss": -26.19696044921875, "global_step": 336117, "epoch": 4049} {"train_loss": -26.184797286987305, "global_step": 336118, "epoch": 4049} {"train_loss": -26.18048667907715, "global_step": 336119, "epoch": 4049} {"train_loss": -26.02850914001465, "global_step": 336120, "epoch": 4049} {"train_loss": -26.078088760375977, "global_step": 336121, "epoch": 4049} {"train_loss": -25.952838897705078, "global_step": 336122, "epoch": 4049} {"train_loss": -25.918912887573242, "global_step": 336123, "epoch": 4049} {"train_loss": -25.961416244506836, "global_step": 336124, "epoch": 4049} {"train_loss": -25.8839168548584, "global_step": 336125, "epoch": 4049} {"train_loss": -25.750600814819336, "global_step": 336126, "epoch": 4049} {"train_loss": -25.31804084777832, "global_step": 336127, "epoch": 4049} {"train_loss": -25.38524055480957, "global_step": 336128, "epoch": 4049} {"train_loss": -25.919408798217773, "global_step": 336129, "epoch": 4049} {"train_loss": -25.979907989501953, "global_step": 336130, "epoch": 4049} {"train_loss": -25.68281364440918, "global_step": 336131, "epoch": 4049} {"train_loss": -26.11240577697754, "global_step": 336132, "epoch": 4049} {"train_loss": -25.7648868560791, "global_step": 336133, "epoch": 4049} {"train_loss": -25.94109535217285, "global_step": 336134, "epoch": 4049} {"train_loss": -25.998046875, "global_step": 336135, "epoch": 4049} {"train_loss": -25.439823150634766, "global_step": 336136, "epoch": 4049} {"train_loss": -25.972333908081055, "global_step": 336137, "epoch": 4049} {"train_loss": -26.175703048706055, "global_step": 336138, "epoch": 4049} {"train_loss": -25.8796443939209, "global_step": 336139, "epoch": 4049} {"train_loss": -26.0490779876709, "global_step": 336140, "epoch": 4049} {"train_loss": -25.721036911010742, "global_step": 336141, "epoch": 4049} {"train_loss": -25.91437339782715, "global_step": 336142, "epoch": 4049} {"train_loss": -26.2893123626709, "global_step": 336143, "epoch": 4049} {"train_loss": -25.858631134033203, "global_step": 336144, "epoch": 4049} {"train_loss": -26.185626983642578, "global_step": 336145, "epoch": 4049} {"train_loss": -25.591209411621094, "global_step": 336146, "epoch": 4049} {"train_loss": -25.9865665435791, "global_step": 336147, "epoch": 4049} {"train_loss": -25.719501495361328, "global_step": 336148, "epoch": 4049} {"train_loss": -25.91561450728451, "global_step": 336149, "epoch": 4049, "val_loss": 6727006.0} {"train_loss": -25.695419311523438, "global_step": 336150, "epoch": 4050} {"train_loss": -25.954206466674805, "global_step": 336151, "epoch": 4050} {"train_loss": -25.810617446899414, "global_step": 336152, "epoch": 4050} {"train_loss": -25.7058162689209, "global_step": 336153, "epoch": 4050} {"train_loss": -25.939544677734375, "global_step": 336154, "epoch": 4050} {"train_loss": -25.801977157592773, "global_step": 336155, "epoch": 4050} {"train_loss": -25.8167667388916, "global_step": 336156, "epoch": 4050} {"train_loss": -26.27931785583496, "global_step": 336157, "epoch": 4050} {"train_loss": -26.16946792602539, "global_step": 336158, "epoch": 4050} {"train_loss": -25.772558212280273, "global_step": 336159, "epoch": 4050} {"train_loss": -26.07387351989746, "global_step": 336160, "epoch": 4050} {"train_loss": -25.85170555114746, "global_step": 336161, "epoch": 4050} {"train_loss": -26.11842155456543, "global_step": 336162, "epoch": 4050} {"train_loss": -26.47113609313965, "global_step": 336163, "epoch": 4050} {"train_loss": -26.002883911132812, "global_step": 336164, "epoch": 4050} {"train_loss": -26.022836685180664, "global_step": 336165, "epoch": 4050} {"train_loss": -26.156274795532227, "global_step": 336166, "epoch": 4050} {"train_loss": -26.045251846313477, "global_step": 336167, "epoch": 4050} {"train_loss": -25.809675216674805, "global_step": 336168, "epoch": 4050} {"train_loss": -25.53643226623535, "global_step": 336169, "epoch": 4050} {"train_loss": -25.3105411529541, "global_step": 336170, "epoch": 4050} {"train_loss": -25.975778579711914, "global_step": 336171, "epoch": 4050} {"train_loss": -25.88813591003418, "global_step": 336172, "epoch": 4050} {"train_loss": -25.792749404907227, "global_step": 336173, "epoch": 4050} {"train_loss": -26.089811325073242, "global_step": 336174, "epoch": 4050} {"train_loss": -26.201007843017578, "global_step": 336175, "epoch": 4050} {"train_loss": -25.98345375061035, "global_step": 336176, "epoch": 4050} {"train_loss": -25.960607528686523, "global_step": 336177, "epoch": 4050} {"train_loss": -26.003820419311523, "global_step": 336178, "epoch": 4050} {"train_loss": -26.149200439453125, "global_step": 336179, "epoch": 4050} {"train_loss": -25.860919952392578, "global_step": 336180, "epoch": 4050} {"train_loss": -25.92487144470215, "global_step": 336181, "epoch": 4050} {"train_loss": -25.980749130249023, "global_step": 336182, "epoch": 4050} {"train_loss": -26.10096549987793, "global_step": 336183, "epoch": 4050} {"train_loss": -26.086400985717773, "global_step": 336184, "epoch": 4050} {"train_loss": -26.22346305847168, "global_step": 336185, "epoch": 4050} {"train_loss": -26.033679962158203, "global_step": 336186, "epoch": 4050} {"train_loss": -26.060277938842773, "global_step": 336187, "epoch": 4050} {"train_loss": -25.643301010131836, "global_step": 336188, "epoch": 4050} {"train_loss": -25.911157608032227, "global_step": 336189, "epoch": 4050} {"train_loss": -26.064924240112305, "global_step": 336190, "epoch": 4050} {"train_loss": -26.14272117614746, "global_step": 336191, "epoch": 4050} {"train_loss": -25.484716415405273, "global_step": 336192, "epoch": 4050} {"train_loss": -25.915395736694336, "global_step": 336193, "epoch": 4050} {"train_loss": -26.112232208251953, "global_step": 336194, "epoch": 4050} {"train_loss": -26.186609268188477, "global_step": 336195, "epoch": 4050} {"train_loss": -26.257551193237305, "global_step": 336196, "epoch": 4050} {"train_loss": -26.056522369384766, "global_step": 336197, "epoch": 4050} {"train_loss": -26.102222442626953, "global_step": 336198, "epoch": 4050} {"train_loss": -26.1711483001709, "global_step": 336199, "epoch": 4050} {"train_loss": -26.693716049194336, "global_step": 336200, "epoch": 4050} {"train_loss": -26.333032608032227, "global_step": 336201, "epoch": 4050} {"train_loss": -26.109699249267578, "global_step": 336202, "epoch": 4050} {"train_loss": -26.344974517822266, "global_step": 336203, "epoch": 4050} {"train_loss": -26.22157096862793, "global_step": 336204, "epoch": 4050} {"train_loss": -25.97651481628418, "global_step": 336205, "epoch": 4050} {"train_loss": -26.31458854675293, "global_step": 336206, "epoch": 4050} {"train_loss": -26.200286865234375, "global_step": 336207, "epoch": 4050} {"train_loss": -26.03546142578125, "global_step": 336208, "epoch": 4050} {"train_loss": -26.101720809936523, "global_step": 336209, "epoch": 4050} {"train_loss": -26.1938419342041, "global_step": 336210, "epoch": 4050} {"train_loss": -26.255651473999023, "global_step": 336211, "epoch": 4050} {"train_loss": -26.39664649963379, "global_step": 336212, "epoch": 4050} {"train_loss": -26.548480987548828, "global_step": 336213, "epoch": 4050} {"train_loss": -26.246381759643555, "global_step": 336214, "epoch": 4050} {"train_loss": -25.940988540649414, "global_step": 336215, "epoch": 4050} {"train_loss": -25.8059024810791, "global_step": 336216, "epoch": 4050} {"train_loss": -25.872507095336914, "global_step": 336217, "epoch": 4050} {"train_loss": -25.557802200317383, "global_step": 336218, "epoch": 4050} {"train_loss": -26.339111328125, "global_step": 336219, "epoch": 4050} {"train_loss": -25.883625030517578, "global_step": 336220, "epoch": 4050} {"train_loss": -25.79910659790039, "global_step": 336221, "epoch": 4050} {"train_loss": -25.882444381713867, "global_step": 336222, "epoch": 4050} {"train_loss": -26.3494815826416, "global_step": 336223, "epoch": 4050} {"train_loss": -26.22340202331543, "global_step": 336224, "epoch": 4050} {"train_loss": -26.199514389038086, "global_step": 336225, "epoch": 4050} {"train_loss": -26.1677303314209, "global_step": 336226, "epoch": 4050} {"train_loss": -25.539670944213867, "global_step": 336227, "epoch": 4050} {"train_loss": -26.470996856689453, "global_step": 336228, "epoch": 4050} {"train_loss": -26.423187255859375, "global_step": 336229, "epoch": 4050} {"train_loss": -25.665496826171875, "global_step": 336230, "epoch": 4050} {"train_loss": -25.65923500061035, "global_step": 336231, "epoch": 4050} {"train_loss": -26.03120695826519, "global_step": 336232, "epoch": 4050, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6696719.0} {"train_loss": -25.624128341674805, "global_step": 336233, "epoch": 4051} {"train_loss": -24.874753952026367, "global_step": 336234, "epoch": 4051} {"train_loss": -25.33746337890625, "global_step": 336235, "epoch": 4051} {"train_loss": -25.555692672729492, "global_step": 336236, "epoch": 4051} {"train_loss": -25.633153915405273, "global_step": 336237, "epoch": 4051} {"train_loss": -25.415056228637695, "global_step": 336238, "epoch": 4051} {"train_loss": -25.5814266204834, "global_step": 336239, "epoch": 4051} {"train_loss": -25.237924575805664, "global_step": 336240, "epoch": 4051} {"train_loss": -25.5690975189209, "global_step": 336241, "epoch": 4051} {"train_loss": -25.544118881225586, "global_step": 336242, "epoch": 4051} {"train_loss": -25.590946197509766, "global_step": 336243, "epoch": 4051} {"train_loss": -25.943897247314453, "global_step": 336244, "epoch": 4051} {"train_loss": -25.67563819885254, "global_step": 336245, "epoch": 4051} {"train_loss": -25.918872833251953, "global_step": 336246, "epoch": 4051} {"train_loss": -25.65333366394043, "global_step": 336247, "epoch": 4051} {"train_loss": -25.713205337524414, "global_step": 336248, "epoch": 4051} {"train_loss": -26.02153968811035, "global_step": 336249, "epoch": 4051} {"train_loss": -25.779056549072266, "global_step": 336250, "epoch": 4051} {"train_loss": -25.788022994995117, "global_step": 336251, "epoch": 4051} {"train_loss": -25.973119735717773, "global_step": 336252, "epoch": 4051} {"train_loss": -25.813831329345703, "global_step": 336253, "epoch": 4051} {"train_loss": -26.01478385925293, "global_step": 336254, "epoch": 4051} {"train_loss": -25.8028621673584, "global_step": 336255, "epoch": 4051} {"train_loss": -25.934057235717773, "global_step": 336256, "epoch": 4051} {"train_loss": -26.15131950378418, "global_step": 336257, "epoch": 4051} {"train_loss": -25.872360229492188, "global_step": 336258, "epoch": 4051} {"train_loss": -25.82529067993164, "global_step": 336259, "epoch": 4051} {"train_loss": -25.716562271118164, "global_step": 336260, "epoch": 4051} {"train_loss": -25.71185874938965, "global_step": 336261, "epoch": 4051} {"train_loss": -25.846105575561523, "global_step": 336262, "epoch": 4051} {"train_loss": -26.04402732849121, "global_step": 336263, "epoch": 4051} {"train_loss": -25.7259521484375, "global_step": 336264, "epoch": 4051} {"train_loss": -26.17219352722168, "global_step": 336265, "epoch": 4051} {"train_loss": -25.836713790893555, "global_step": 336266, "epoch": 4051} {"train_loss": -26.18906593322754, "global_step": 336267, "epoch": 4051} {"train_loss": -26.459028244018555, "global_step": 336268, "epoch": 4051} {"train_loss": -26.14902687072754, "global_step": 336269, "epoch": 4051} {"train_loss": -25.746667861938477, "global_step": 336270, "epoch": 4051} {"train_loss": -26.093708038330078, "global_step": 336271, "epoch": 4051} {"train_loss": -26.133710861206055, "global_step": 336272, "epoch": 4051} {"train_loss": -26.204862594604492, "global_step": 336273, "epoch": 4051} {"train_loss": -25.977582931518555, "global_step": 336274, "epoch": 4051} {"train_loss": -25.82813835144043, "global_step": 336275, "epoch": 4051} {"train_loss": -25.7181396484375, "global_step": 336276, "epoch": 4051} {"train_loss": -26.094587326049805, "global_step": 336277, "epoch": 4051} {"train_loss": -26.08646583557129, "global_step": 336278, "epoch": 4051} {"train_loss": -25.68256187438965, "global_step": 336279, "epoch": 4051} {"train_loss": -26.0882511138916, "global_step": 336280, "epoch": 4051} {"train_loss": -26.00526237487793, "global_step": 336281, "epoch": 4051} {"train_loss": -25.96074867248535, "global_step": 336282, "epoch": 4051} {"train_loss": -25.676910400390625, "global_step": 336283, "epoch": 4051} {"train_loss": -25.965925216674805, "global_step": 336284, "epoch": 4051} {"train_loss": -25.98805046081543, "global_step": 336285, "epoch": 4051} {"train_loss": -26.02482032775879, "global_step": 336286, "epoch": 4051} {"train_loss": -26.14009666442871, "global_step": 336287, "epoch": 4051} {"train_loss": -26.24471092224121, "global_step": 336288, "epoch": 4051} {"train_loss": -26.10749626159668, "global_step": 336289, "epoch": 4051} {"train_loss": -25.97853660583496, "global_step": 336290, "epoch": 4051} {"train_loss": -25.809253692626953, "global_step": 336291, "epoch": 4051} {"train_loss": -25.988357543945312, "global_step": 336292, "epoch": 4051} {"train_loss": -26.383834838867188, "global_step": 336293, "epoch": 4051} {"train_loss": -25.87476921081543, "global_step": 336294, "epoch": 4051} {"train_loss": -25.76407814025879, "global_step": 336295, "epoch": 4051} {"train_loss": -26.176549911499023, "global_step": 336296, "epoch": 4051} {"train_loss": -26.030179977416992, "global_step": 336297, "epoch": 4051} {"train_loss": -25.7260684967041, "global_step": 336298, "epoch": 4051} {"train_loss": -26.227659225463867, "global_step": 336299, "epoch": 4051} {"train_loss": -26.039936065673828, "global_step": 336300, "epoch": 4051} {"train_loss": -26.034900665283203, "global_step": 336301, "epoch": 4051} {"train_loss": -26.124414443969727, "global_step": 336302, "epoch": 4051} {"train_loss": -26.172657012939453, "global_step": 336303, "epoch": 4051} {"train_loss": -26.165512084960938, "global_step": 336304, "epoch": 4051} {"train_loss": -26.25531005859375, "global_step": 336305, "epoch": 4051} {"train_loss": -26.17551612854004, "global_step": 336306, "epoch": 4051} {"train_loss": -26.243207931518555, "global_step": 336307, "epoch": 4051} {"train_loss": -26.316638946533203, "global_step": 336308, "epoch": 4051} {"train_loss": -25.93365478515625, "global_step": 336309, "epoch": 4051} {"train_loss": -26.213712692260742, "global_step": 336310, "epoch": 4051} {"train_loss": -26.210525512695312, "global_step": 336311, "epoch": 4051} {"train_loss": -26.203617095947266, "global_step": 336312, "epoch": 4051} {"train_loss": -26.04962730407715, "global_step": 336313, "epoch": 4051} {"train_loss": -26.135852813720703, "global_step": 336314, "epoch": 4051} {"train_loss": -25.92720849829984, "global_step": 336315, "epoch": 4051, "val_loss": 6784576.5} {"train_loss": -25.661117553710938, "global_step": 336316, "epoch": 4052} {"train_loss": -24.69696044921875, "global_step": 336317, "epoch": 4052} {"train_loss": -25.01926040649414, "global_step": 336318, "epoch": 4052} {"train_loss": -25.8726806640625, "global_step": 336319, "epoch": 4052} {"train_loss": -25.12662696838379, "global_step": 336320, "epoch": 4052} {"train_loss": -25.03916358947754, "global_step": 336321, "epoch": 4052} {"train_loss": -24.820772171020508, "global_step": 336322, "epoch": 4052} {"train_loss": -25.694263458251953, "global_step": 336323, "epoch": 4052} {"train_loss": -24.930940628051758, "global_step": 336324, "epoch": 4052} {"train_loss": -24.667707443237305, "global_step": 336325, "epoch": 4052} {"train_loss": -25.44049072265625, "global_step": 336326, "epoch": 4052} {"train_loss": -25.303359985351562, "global_step": 336327, "epoch": 4052} {"train_loss": -25.293209075927734, "global_step": 336328, "epoch": 4052} {"train_loss": -25.32268714904785, "global_step": 336329, "epoch": 4052} {"train_loss": -25.092697143554688, "global_step": 336330, "epoch": 4052} {"train_loss": -25.384920120239258, "global_step": 336331, "epoch": 4052} {"train_loss": -25.338546752929688, "global_step": 336332, "epoch": 4052} {"train_loss": -25.265493392944336, "global_step": 336333, "epoch": 4052} {"train_loss": -25.773456573486328, "global_step": 336334, "epoch": 4052} {"train_loss": -25.32770538330078, "global_step": 336335, "epoch": 4052} {"train_loss": -25.53809928894043, "global_step": 336336, "epoch": 4052} {"train_loss": -25.538679122924805, "global_step": 336337, "epoch": 4052} {"train_loss": -26.200056076049805, "global_step": 336338, "epoch": 4052} {"train_loss": -25.721546173095703, "global_step": 336339, "epoch": 4052} {"train_loss": -26.09454345703125, "global_step": 336340, "epoch": 4052} {"train_loss": -25.648971557617188, "global_step": 336341, "epoch": 4052} {"train_loss": -25.628894805908203, "global_step": 336342, "epoch": 4052} {"train_loss": -26.2313289642334, "global_step": 336343, "epoch": 4052} {"train_loss": -25.652936935424805, "global_step": 336344, "epoch": 4052} {"train_loss": -25.85572624206543, "global_step": 336345, "epoch": 4052} {"train_loss": -25.67156410217285, "global_step": 336346, "epoch": 4052} {"train_loss": -25.7675838470459, "global_step": 336347, "epoch": 4052} {"train_loss": -25.779626846313477, "global_step": 336348, "epoch": 4052} {"train_loss": -25.99787712097168, "global_step": 336349, "epoch": 4052} {"train_loss": -25.960660934448242, "global_step": 336350, "epoch": 4052} {"train_loss": -25.72603416442871, "global_step": 336351, "epoch": 4052} {"train_loss": -26.003515243530273, "global_step": 336352, "epoch": 4052} {"train_loss": -25.772607803344727, "global_step": 336353, "epoch": 4052} {"train_loss": -26.133779525756836, "global_step": 336354, "epoch": 4052} {"train_loss": -26.089038848876953, "global_step": 336355, "epoch": 4052} {"train_loss": -25.87312126159668, "global_step": 336356, "epoch": 4052} {"train_loss": -25.727231979370117, "global_step": 336357, "epoch": 4052} {"train_loss": -26.129362106323242, "global_step": 336358, "epoch": 4052} {"train_loss": -25.802724838256836, "global_step": 336359, "epoch": 4052} {"train_loss": -26.097110748291016, "global_step": 336360, "epoch": 4052} {"train_loss": -25.8247013092041, "global_step": 336361, "epoch": 4052} {"train_loss": -26.355880737304688, "global_step": 336362, "epoch": 4052} {"train_loss": -26.026596069335938, "global_step": 336363, "epoch": 4052} {"train_loss": -25.965137481689453, "global_step": 336364, "epoch": 4052} {"train_loss": -25.804677963256836, "global_step": 336365, "epoch": 4052} {"train_loss": -25.572114944458008, "global_step": 336366, "epoch": 4052} {"train_loss": -26.226850509643555, "global_step": 336367, "epoch": 4052} {"train_loss": -25.928741455078125, "global_step": 336368, "epoch": 4052} {"train_loss": -26.040924072265625, "global_step": 336369, "epoch": 4052} {"train_loss": -25.717023849487305, "global_step": 336370, "epoch": 4052} {"train_loss": -26.30628776550293, "global_step": 336371, "epoch": 4052} {"train_loss": -26.038406372070312, "global_step": 336372, "epoch": 4052} {"train_loss": -25.920303344726562, "global_step": 336373, "epoch": 4052} {"train_loss": -25.92120361328125, "global_step": 336374, "epoch": 4052} {"train_loss": -26.283044815063477, "global_step": 336375, "epoch": 4052} {"train_loss": -26.238737106323242, "global_step": 336376, "epoch": 4052} {"train_loss": -26.12298011779785, "global_step": 336377, "epoch": 4052} {"train_loss": -25.965972900390625, "global_step": 336378, "epoch": 4052} {"train_loss": -25.663898468017578, "global_step": 336379, "epoch": 4052} {"train_loss": -25.989166259765625, "global_step": 336380, "epoch": 4052} {"train_loss": -26.080718994140625, "global_step": 336381, "epoch": 4052} {"train_loss": -26.212909698486328, "global_step": 336382, "epoch": 4052} {"train_loss": -26.284072875976562, "global_step": 336383, "epoch": 4052} {"train_loss": -25.801660537719727, "global_step": 336384, "epoch": 4052} {"train_loss": -25.992267608642578, "global_step": 336385, "epoch": 4052} {"train_loss": -26.0731201171875, "global_step": 336386, "epoch": 4052} {"train_loss": -25.851545333862305, "global_step": 336387, "epoch": 4052} {"train_loss": -26.025054931640625, "global_step": 336388, "epoch": 4052} {"train_loss": -26.698156356811523, "global_step": 336389, "epoch": 4052} {"train_loss": -25.808979034423828, "global_step": 336390, "epoch": 4052} {"train_loss": -26.34636878967285, "global_step": 336391, "epoch": 4052} {"train_loss": -26.2752742767334, "global_step": 336392, "epoch": 4052} {"train_loss": -26.035566329956055, "global_step": 336393, "epoch": 4052} {"train_loss": -26.3057861328125, "global_step": 336394, "epoch": 4052} {"train_loss": -25.972326278686523, "global_step": 336395, "epoch": 4052} {"train_loss": -26.040302276611328, "global_step": 336396, "epoch": 4052} {"train_loss": -26.14719581604004, "global_step": 336397, "epoch": 4052} {"train_loss": -25.828604364969646, "global_step": 336398, "epoch": 4052, "val_loss": 6799712.0} {"train_loss": -23.951684951782227, "global_step": 336399, "epoch": 4053} {"train_loss": -25.092212677001953, "global_step": 336400, "epoch": 4053} {"train_loss": -25.0308895111084, "global_step": 336401, "epoch": 4053} {"train_loss": -25.000673294067383, "global_step": 336402, "epoch": 4053} {"train_loss": -24.790220260620117, "global_step": 336403, "epoch": 4053} {"train_loss": -25.550146102905273, "global_step": 336404, "epoch": 4053} {"train_loss": -24.996435165405273, "global_step": 336405, "epoch": 4053} {"train_loss": -25.439237594604492, "global_step": 336406, "epoch": 4053} {"train_loss": -25.303964614868164, "global_step": 336407, "epoch": 4053} {"train_loss": -25.08062171936035, "global_step": 336408, "epoch": 4053} {"train_loss": -25.462358474731445, "global_step": 336409, "epoch": 4053} {"train_loss": -25.251007080078125, "global_step": 336410, "epoch": 4053} {"train_loss": -25.478147506713867, "global_step": 336411, "epoch": 4053} {"train_loss": -25.22430992126465, "global_step": 336412, "epoch": 4053} {"train_loss": -25.22535514831543, "global_step": 336413, "epoch": 4053} {"train_loss": -25.204544067382812, "global_step": 336414, "epoch": 4053} {"train_loss": -25.700458526611328, "global_step": 336415, "epoch": 4053} {"train_loss": -25.190858840942383, "global_step": 336416, "epoch": 4053} {"train_loss": -25.673246383666992, "global_step": 336417, "epoch": 4053} {"train_loss": -25.5322265625, "global_step": 336418, "epoch": 4053} {"train_loss": -25.538244247436523, "global_step": 336419, "epoch": 4053} {"train_loss": -25.246023178100586, "global_step": 336420, "epoch": 4053} {"train_loss": -25.4853572845459, "global_step": 336421, "epoch": 4053} {"train_loss": -25.723419189453125, "global_step": 336422, "epoch": 4053} {"train_loss": -25.6104793548584, "global_step": 336423, "epoch": 4053} {"train_loss": -25.94239616394043, "global_step": 336424, "epoch": 4053} {"train_loss": -25.75315284729004, "global_step": 336425, "epoch": 4053} {"train_loss": -25.93511390686035, "global_step": 336426, "epoch": 4053} {"train_loss": -25.79157829284668, "global_step": 336427, "epoch": 4053} {"train_loss": -25.700891494750977, "global_step": 336428, "epoch": 4053} {"train_loss": -25.61542320251465, "global_step": 336429, "epoch": 4053} {"train_loss": -25.655017852783203, "global_step": 336430, "epoch": 4053} {"train_loss": -25.841657638549805, "global_step": 336431, "epoch": 4053} {"train_loss": -26.213171005249023, "global_step": 336432, "epoch": 4053} {"train_loss": -25.944726943969727, "global_step": 336433, "epoch": 4053} {"train_loss": -25.840436935424805, "global_step": 336434, "epoch": 4053} {"train_loss": -26.02137565612793, "global_step": 336435, "epoch": 4053} {"train_loss": -25.855009078979492, "global_step": 336436, "epoch": 4053} {"train_loss": -25.999658584594727, "global_step": 336437, "epoch": 4053} {"train_loss": -25.927152633666992, "global_step": 336438, "epoch": 4053} {"train_loss": -26.03500747680664, "global_step": 336439, "epoch": 4053} {"train_loss": -26.004928588867188, "global_step": 336440, "epoch": 4053} {"train_loss": -26.18415641784668, "global_step": 336441, "epoch": 4053} {"train_loss": -26.099384307861328, "global_step": 336442, "epoch": 4053} {"train_loss": -25.94976234436035, "global_step": 336443, "epoch": 4053} {"train_loss": -26.244260787963867, "global_step": 336444, "epoch": 4053} {"train_loss": -26.108261108398438, "global_step": 336445, "epoch": 4053} {"train_loss": -25.895315170288086, "global_step": 336446, "epoch": 4053} {"train_loss": -25.728734970092773, "global_step": 336447, "epoch": 4053} {"train_loss": -26.173871994018555, "global_step": 336448, "epoch": 4053} {"train_loss": -25.84158706665039, "global_step": 336449, "epoch": 4053} {"train_loss": -25.64678382873535, "global_step": 336450, "epoch": 4053} {"train_loss": -26.007673263549805, "global_step": 336451, "epoch": 4053} {"train_loss": -26.29543113708496, "global_step": 336452, "epoch": 4053} {"train_loss": -25.634992599487305, "global_step": 336453, "epoch": 4053} {"train_loss": -25.756671905517578, "global_step": 336454, "epoch": 4053} {"train_loss": -26.18109130859375, "global_step": 336455, "epoch": 4053} {"train_loss": -26.173009872436523, "global_step": 336456, "epoch": 4053} {"train_loss": -25.952056884765625, "global_step": 336457, "epoch": 4053} {"train_loss": -25.82988929748535, "global_step": 336458, "epoch": 4053} {"train_loss": -26.10993766784668, "global_step": 336459, "epoch": 4053} {"train_loss": -26.11079216003418, "global_step": 336460, "epoch": 4053} {"train_loss": -25.989789962768555, "global_step": 336461, "epoch": 4053} {"train_loss": -25.777297973632812, "global_step": 336462, "epoch": 4053} {"train_loss": -26.295312881469727, "global_step": 336463, "epoch": 4053} {"train_loss": -26.33552360534668, "global_step": 336464, "epoch": 4053} {"train_loss": -26.04205894470215, "global_step": 336465, "epoch": 4053} {"train_loss": -26.173940658569336, "global_step": 336466, "epoch": 4053} {"train_loss": -25.938467025756836, "global_step": 336467, "epoch": 4053} {"train_loss": -25.80088233947754, "global_step": 336468, "epoch": 4053} {"train_loss": -26.019262313842773, "global_step": 336469, "epoch": 4053} {"train_loss": -25.9268856048584, "global_step": 336470, "epoch": 4053} {"train_loss": -25.891300201416016, "global_step": 336471, "epoch": 4053} {"train_loss": -25.781585693359375, "global_step": 336472, "epoch": 4053} {"train_loss": -26.269926071166992, "global_step": 336473, "epoch": 4053} {"train_loss": -26.05816650390625, "global_step": 336474, "epoch": 4053} {"train_loss": -26.44185447692871, "global_step": 336475, "epoch": 4053} {"train_loss": -26.082401275634766, "global_step": 336476, "epoch": 4053} {"train_loss": -25.9761905670166, "global_step": 336477, "epoch": 4053} {"train_loss": -26.115636825561523, "global_step": 336478, "epoch": 4053} {"train_loss": -26.364782333374023, "global_step": 336479, "epoch": 4053} {"train_loss": -25.68194580078125, "global_step": 336480, "epoch": 4053} {"train_loss": -25.78565558468003, "global_step": 336481, "epoch": 4053, "val_loss": 6764438.5} {"train_loss": -24.91901206970215, "global_step": 336482, "epoch": 4054} {"train_loss": -23.506412506103516, "global_step": 336483, "epoch": 4054} {"train_loss": -23.083908081054688, "global_step": 336484, "epoch": 4054} {"train_loss": -25.1370849609375, "global_step": 336485, "epoch": 4054} {"train_loss": -24.87727165222168, "global_step": 336486, "epoch": 4054} {"train_loss": -25.13558006286621, "global_step": 336487, "epoch": 4054} {"train_loss": -24.956811904907227, "global_step": 336488, "epoch": 4054} {"train_loss": -25.635440826416016, "global_step": 336489, "epoch": 4054} {"train_loss": -24.910276412963867, "global_step": 336490, "epoch": 4054} {"train_loss": -25.076696395874023, "global_step": 336491, "epoch": 4054} {"train_loss": -25.247751235961914, "global_step": 336492, "epoch": 4054} {"train_loss": -25.336002349853516, "global_step": 336493, "epoch": 4054} {"train_loss": -25.58381462097168, "global_step": 336494, "epoch": 4054} {"train_loss": -25.337244033813477, "global_step": 336495, "epoch": 4054} {"train_loss": -25.182058334350586, "global_step": 336496, "epoch": 4054} {"train_loss": -25.479528427124023, "global_step": 336497, "epoch": 4054} {"train_loss": -25.43861198425293, "global_step": 336498, "epoch": 4054} {"train_loss": -25.419179916381836, "global_step": 336499, "epoch": 4054} {"train_loss": -25.60972023010254, "global_step": 336500, "epoch": 4054} {"train_loss": -25.74146842956543, "global_step": 336501, "epoch": 4054} {"train_loss": -25.26614761352539, "global_step": 336502, "epoch": 4054} {"train_loss": -25.544200897216797, "global_step": 336503, "epoch": 4054} {"train_loss": -25.565906524658203, "global_step": 336504, "epoch": 4054} {"train_loss": -25.51388931274414, "global_step": 336505, "epoch": 4054} {"train_loss": -25.69902992248535, "global_step": 336506, "epoch": 4054} {"train_loss": -25.888891220092773, "global_step": 336507, "epoch": 4054} {"train_loss": -25.94292640686035, "global_step": 336508, "epoch": 4054} {"train_loss": -25.964941024780273, "global_step": 336509, "epoch": 4054} {"train_loss": -25.9293270111084, "global_step": 336510, "epoch": 4054} {"train_loss": -25.801374435424805, "global_step": 336511, "epoch": 4054} {"train_loss": -25.99236488342285, "global_step": 336512, "epoch": 4054} {"train_loss": -25.61878776550293, "global_step": 336513, "epoch": 4054} {"train_loss": -25.887531280517578, "global_step": 336514, "epoch": 4054} {"train_loss": -25.993738174438477, "global_step": 336515, "epoch": 4054} {"train_loss": -25.927490234375, "global_step": 336516, "epoch": 4054} {"train_loss": -26.24112892150879, "global_step": 336517, "epoch": 4054} {"train_loss": -26.300561904907227, "global_step": 336518, "epoch": 4054} {"train_loss": -26.013395309448242, "global_step": 336519, "epoch": 4054} {"train_loss": -25.915546417236328, "global_step": 336520, "epoch": 4054} {"train_loss": -25.81764793395996, "global_step": 336521, "epoch": 4054} {"train_loss": -26.174352645874023, "global_step": 336522, "epoch": 4054} {"train_loss": -25.96317481994629, "global_step": 336523, "epoch": 4054} {"train_loss": -25.8631591796875, "global_step": 336524, "epoch": 4054} {"train_loss": -26.034229278564453, "global_step": 336525, "epoch": 4054} {"train_loss": -26.064172744750977, "global_step": 336526, "epoch": 4054} {"train_loss": -25.91328239440918, "global_step": 336527, "epoch": 4054} {"train_loss": -26.03948402404785, "global_step": 336528, "epoch": 4054} {"train_loss": -26.02092933654785, "global_step": 336529, "epoch": 4054} {"train_loss": -26.27853775024414, "global_step": 336530, "epoch": 4054} {"train_loss": -26.008447647094727, "global_step": 336531, "epoch": 4054} {"train_loss": -25.70376968383789, "global_step": 336532, "epoch": 4054} {"train_loss": -25.954736709594727, "global_step": 336533, "epoch": 4054} {"train_loss": -25.813627243041992, "global_step": 336534, "epoch": 4054} {"train_loss": -25.96358299255371, "global_step": 336535, "epoch": 4054} {"train_loss": -25.9857120513916, "global_step": 336536, "epoch": 4054} {"train_loss": -25.655332565307617, "global_step": 336537, "epoch": 4054} {"train_loss": -26.27906608581543, "global_step": 336538, "epoch": 4054} {"train_loss": -26.586872100830078, "global_step": 336539, "epoch": 4054} {"train_loss": -26.176130294799805, "global_step": 336540, "epoch": 4054} {"train_loss": -26.34877586364746, "global_step": 336541, "epoch": 4054} {"train_loss": -26.06892967224121, "global_step": 336542, "epoch": 4054} {"train_loss": -26.338964462280273, "global_step": 336543, "epoch": 4054} {"train_loss": -26.471698760986328, "global_step": 336544, "epoch": 4054} {"train_loss": -26.34869956970215, "global_step": 336545, "epoch": 4054} {"train_loss": -26.36006736755371, "global_step": 336546, "epoch": 4054} {"train_loss": -25.926183700561523, "global_step": 336547, "epoch": 4054} {"train_loss": -26.009374618530273, "global_step": 336548, "epoch": 4054} {"train_loss": -26.774999618530273, "global_step": 336549, "epoch": 4054} {"train_loss": -25.941633224487305, "global_step": 336550, "epoch": 4054} {"train_loss": -26.20332145690918, "global_step": 336551, "epoch": 4054} {"train_loss": -26.133764266967773, "global_step": 336552, "epoch": 4054} {"train_loss": -26.176061630249023, "global_step": 336553, "epoch": 4054} {"train_loss": -25.794065475463867, "global_step": 336554, "epoch": 4054} {"train_loss": -26.0242862701416, "global_step": 336555, "epoch": 4054} {"train_loss": -25.977191925048828, "global_step": 336556, "epoch": 4054} {"train_loss": -25.911725997924805, "global_step": 336557, "epoch": 4054} {"train_loss": -26.259687423706055, "global_step": 336558, "epoch": 4054} {"train_loss": -25.448265075683594, "global_step": 336559, "epoch": 4054} {"train_loss": -25.365102767944336, "global_step": 336560, "epoch": 4054} {"train_loss": -25.696008682250977, "global_step": 336561, "epoch": 4054} {"train_loss": -26.24879264831543, "global_step": 336562, "epoch": 4054} {"train_loss": -25.437044143676758, "global_step": 336563, "epoch": 4054} {"train_loss": -25.74591871054776, "global_step": 336564, "epoch": 4054, "val_loss": 6659116.0} {"train_loss": -24.275983810424805, "global_step": 336565, "epoch": 4055} {"train_loss": -21.28708839416504, "global_step": 336566, "epoch": 4055} {"train_loss": -24.109161376953125, "global_step": 336567, "epoch": 4055} {"train_loss": -23.501798629760742, "global_step": 336568, "epoch": 4055} {"train_loss": -23.26213264465332, "global_step": 336569, "epoch": 4055} {"train_loss": -24.894357681274414, "global_step": 336570, "epoch": 4055} {"train_loss": -24.018795013427734, "global_step": 336571, "epoch": 4055} {"train_loss": -25.017169952392578, "global_step": 336572, "epoch": 4055} {"train_loss": -24.26923942565918, "global_step": 336573, "epoch": 4055} {"train_loss": -24.985578536987305, "global_step": 336574, "epoch": 4055} {"train_loss": -24.689069747924805, "global_step": 336575, "epoch": 4055} {"train_loss": -24.966176986694336, "global_step": 336576, "epoch": 4055} {"train_loss": -24.809350967407227, "global_step": 336577, "epoch": 4055} {"train_loss": -24.874961853027344, "global_step": 336578, "epoch": 4055} {"train_loss": -24.624862670898438, "global_step": 336579, "epoch": 4055} {"train_loss": -25.00495719909668, "global_step": 336580, "epoch": 4055} {"train_loss": -25.249361038208008, "global_step": 336581, "epoch": 4055} {"train_loss": -25.381738662719727, "global_step": 336582, "epoch": 4055} {"train_loss": -25.371763229370117, "global_step": 336583, "epoch": 4055} {"train_loss": -24.96173095703125, "global_step": 336584, "epoch": 4055} {"train_loss": -25.306015014648438, "global_step": 336585, "epoch": 4055} {"train_loss": -25.127798080444336, "global_step": 336586, "epoch": 4055} {"train_loss": -25.687000274658203, "global_step": 336587, "epoch": 4055} {"train_loss": -25.401601791381836, "global_step": 336588, "epoch": 4055} {"train_loss": -25.243717193603516, "global_step": 336589, "epoch": 4055} {"train_loss": -25.805944442749023, "global_step": 336590, "epoch": 4055} {"train_loss": -25.397302627563477, "global_step": 336591, "epoch": 4055} {"train_loss": -25.703577041625977, "global_step": 336592, "epoch": 4055} {"train_loss": -25.569379806518555, "global_step": 336593, "epoch": 4055} {"train_loss": -25.831619262695312, "global_step": 336594, "epoch": 4055} {"train_loss": -25.5133113861084, "global_step": 336595, "epoch": 4055} {"train_loss": -25.599740982055664, "global_step": 336596, "epoch": 4055} {"train_loss": -25.705520629882812, "global_step": 336597, "epoch": 4055} {"train_loss": -25.937936782836914, "global_step": 336598, "epoch": 4055} {"train_loss": -26.341352462768555, "global_step": 336599, "epoch": 4055} {"train_loss": -25.865095138549805, "global_step": 336600, "epoch": 4055} {"train_loss": -25.996051788330078, "global_step": 336601, "epoch": 4055} {"train_loss": -25.8092041015625, "global_step": 336602, "epoch": 4055} {"train_loss": -26.1660213470459, "global_step": 336603, "epoch": 4055} {"train_loss": -25.77972412109375, "global_step": 336604, "epoch": 4055} {"train_loss": -26.12745475769043, "global_step": 336605, "epoch": 4055} {"train_loss": -26.260427474975586, "global_step": 336606, "epoch": 4055} {"train_loss": -25.8269100189209, "global_step": 336607, "epoch": 4055} {"train_loss": -26.146026611328125, "global_step": 336608, "epoch": 4055} {"train_loss": -26.068103790283203, "global_step": 336609, "epoch": 4055} {"train_loss": -26.331872940063477, "global_step": 336610, "epoch": 4055} {"train_loss": -25.981109619140625, "global_step": 336611, "epoch": 4055} {"train_loss": -25.724451065063477, "global_step": 336612, "epoch": 4055} {"train_loss": -25.521032333374023, "global_step": 336613, "epoch": 4055} {"train_loss": -26.050626754760742, "global_step": 336614, "epoch": 4055} {"train_loss": -26.05047035217285, "global_step": 336615, "epoch": 4055} {"train_loss": -25.680526733398438, "global_step": 336616, "epoch": 4055} {"train_loss": -25.63681983947754, "global_step": 336617, "epoch": 4055} {"train_loss": -26.09100914001465, "global_step": 336618, "epoch": 4055} {"train_loss": -25.98933982849121, "global_step": 336619, "epoch": 4055} {"train_loss": -26.02518653869629, "global_step": 336620, "epoch": 4055} {"train_loss": -26.01886558532715, "global_step": 336621, "epoch": 4055} {"train_loss": -26.16263771057129, "global_step": 336622, "epoch": 4055} {"train_loss": -26.40130615234375, "global_step": 336623, "epoch": 4055} {"train_loss": -26.134765625, "global_step": 336624, "epoch": 4055} {"train_loss": -25.981184005737305, "global_step": 336625, "epoch": 4055} {"train_loss": -26.258710861206055, "global_step": 336626, "epoch": 4055} {"train_loss": -25.90565299987793, "global_step": 336627, "epoch": 4055} {"train_loss": -26.298633575439453, "global_step": 336628, "epoch": 4055} {"train_loss": -26.15030288696289, "global_step": 336629, "epoch": 4055} {"train_loss": -26.135395050048828, "global_step": 336630, "epoch": 4055} {"train_loss": -25.9847412109375, "global_step": 336631, "epoch": 4055} {"train_loss": -26.077878952026367, "global_step": 336632, "epoch": 4055} {"train_loss": -26.095849990844727, "global_step": 336633, "epoch": 4055} {"train_loss": -25.935083389282227, "global_step": 336634, "epoch": 4055} {"train_loss": -26.223621368408203, "global_step": 336635, "epoch": 4055} {"train_loss": -26.194604873657227, "global_step": 336636, "epoch": 4055} {"train_loss": -25.879638671875, "global_step": 336637, "epoch": 4055} {"train_loss": -26.485294342041016, "global_step": 336638, "epoch": 4055} {"train_loss": -26.069061279296875, "global_step": 336639, "epoch": 4055} {"train_loss": -26.103412628173828, "global_step": 336640, "epoch": 4055} {"train_loss": -25.8542423248291, "global_step": 336641, "epoch": 4055} {"train_loss": -25.87519645690918, "global_step": 336642, "epoch": 4055} {"train_loss": -26.28668785095215, "global_step": 336643, "epoch": 4055} {"train_loss": -25.76679039001465, "global_step": 336644, "epoch": 4055} {"train_loss": -26.05084228515625, "global_step": 336645, "epoch": 4055} {"train_loss": -25.946752548217773, "global_step": 336646, "epoch": 4055} {"train_loss": -25.584624945399273, "global_step": 336647, "epoch": 4055, "val_loss": 6687018.0} {"train_loss": -25.187725067138672, "global_step": 336648, "epoch": 4056} {"train_loss": -24.345306396484375, "global_step": 336649, "epoch": 4056} {"train_loss": -24.77914810180664, "global_step": 336650, "epoch": 4056} {"train_loss": -25.54543113708496, "global_step": 336651, "epoch": 4056} {"train_loss": -25.28626251220703, "global_step": 336652, "epoch": 4056} {"train_loss": -25.54732322692871, "global_step": 336653, "epoch": 4056} {"train_loss": -25.8338623046875, "global_step": 336654, "epoch": 4056} {"train_loss": -25.19709014892578, "global_step": 336655, "epoch": 4056} {"train_loss": -25.868783950805664, "global_step": 336656, "epoch": 4056} {"train_loss": -25.531185150146484, "global_step": 336657, "epoch": 4056} {"train_loss": -26.0870361328125, "global_step": 336658, "epoch": 4056} {"train_loss": -25.018356323242188, "global_step": 336659, "epoch": 4056} {"train_loss": -25.488330841064453, "global_step": 336660, "epoch": 4056} {"train_loss": -25.48538589477539, "global_step": 336661, "epoch": 4056} {"train_loss": -25.78525733947754, "global_step": 336662, "epoch": 4056} {"train_loss": -25.339757919311523, "global_step": 336663, "epoch": 4056} {"train_loss": -25.328641891479492, "global_step": 336664, "epoch": 4056} {"train_loss": -25.672483444213867, "global_step": 336665, "epoch": 4056} {"train_loss": -25.679946899414062, "global_step": 336666, "epoch": 4056} {"train_loss": -25.664892196655273, "global_step": 336667, "epoch": 4056} {"train_loss": -25.595182418823242, "global_step": 336668, "epoch": 4056} {"train_loss": -25.918447494506836, "global_step": 336669, "epoch": 4056} {"train_loss": -25.917404174804688, "global_step": 336670, "epoch": 4056} {"train_loss": -26.07462501525879, "global_step": 336671, "epoch": 4056} {"train_loss": -25.86700439453125, "global_step": 336672, "epoch": 4056} {"train_loss": -26.079132080078125, "global_step": 336673, "epoch": 4056} {"train_loss": -26.1037540435791, "global_step": 336674, "epoch": 4056} {"train_loss": -25.712873458862305, "global_step": 336675, "epoch": 4056} {"train_loss": -26.070737838745117, "global_step": 336676, "epoch": 4056} {"train_loss": -26.003503799438477, "global_step": 336677, "epoch": 4056} {"train_loss": -25.946455001831055, "global_step": 336678, "epoch": 4056} {"train_loss": -25.960906982421875, "global_step": 336679, "epoch": 4056} {"train_loss": -25.923376083374023, "global_step": 336680, "epoch": 4056} {"train_loss": -26.462493896484375, "global_step": 336681, "epoch": 4056} {"train_loss": -25.92608070373535, "global_step": 336682, "epoch": 4056} {"train_loss": -26.137954711914062, "global_step": 336683, "epoch": 4056} {"train_loss": -26.399036407470703, "global_step": 336684, "epoch": 4056} {"train_loss": -25.84684181213379, "global_step": 336685, "epoch": 4056} {"train_loss": -26.270435333251953, "global_step": 336686, "epoch": 4056} {"train_loss": -26.330698013305664, "global_step": 336687, "epoch": 4056} {"train_loss": -26.302335739135742, "global_step": 336688, "epoch": 4056} {"train_loss": -26.059640884399414, "global_step": 336689, "epoch": 4056} {"train_loss": -26.2740478515625, "global_step": 336690, "epoch": 4056} {"train_loss": -26.120941162109375, "global_step": 336691, "epoch": 4056} {"train_loss": -26.116363525390625, "global_step": 336692, "epoch": 4056} {"train_loss": -26.015363693237305, "global_step": 336693, "epoch": 4056} {"train_loss": -26.000341415405273, "global_step": 336694, "epoch": 4056} {"train_loss": -25.943029403686523, "global_step": 336695, "epoch": 4056} {"train_loss": -26.050573348999023, "global_step": 336696, "epoch": 4056} {"train_loss": -26.004093170166016, "global_step": 336697, "epoch": 4056} {"train_loss": -26.081043243408203, "global_step": 336698, "epoch": 4056} {"train_loss": -26.4763126373291, "global_step": 336699, "epoch": 4056} {"train_loss": -26.33365249633789, "global_step": 336700, "epoch": 4056} {"train_loss": -25.749618530273438, "global_step": 336701, "epoch": 4056} {"train_loss": -25.769153594970703, "global_step": 336702, "epoch": 4056} {"train_loss": -26.210256576538086, "global_step": 336703, "epoch": 4056} {"train_loss": -25.823572158813477, "global_step": 336704, "epoch": 4056} {"train_loss": -26.5065860748291, "global_step": 336705, "epoch": 4056} {"train_loss": -26.366979598999023, "global_step": 336706, "epoch": 4056} {"train_loss": -25.870563507080078, "global_step": 336707, "epoch": 4056} {"train_loss": -26.510923385620117, "global_step": 336708, "epoch": 4056} {"train_loss": -25.98090171813965, "global_step": 336709, "epoch": 4056} {"train_loss": -26.282873153686523, "global_step": 336710, "epoch": 4056} {"train_loss": -25.951684951782227, "global_step": 336711, "epoch": 4056} {"train_loss": -26.568899154663086, "global_step": 336712, "epoch": 4056} {"train_loss": -25.775226593017578, "global_step": 336713, "epoch": 4056} {"train_loss": -25.75306510925293, "global_step": 336714, "epoch": 4056} {"train_loss": -26.045032501220703, "global_step": 336715, "epoch": 4056} {"train_loss": -25.9326171875, "global_step": 336716, "epoch": 4056} {"train_loss": -26.573627471923828, "global_step": 336717, "epoch": 4056} {"train_loss": -25.9991455078125, "global_step": 336718, "epoch": 4056} {"train_loss": -26.199689865112305, "global_step": 336719, "epoch": 4056} {"train_loss": -26.024194717407227, "global_step": 336720, "epoch": 4056} {"train_loss": -25.85524559020996, "global_step": 336721, "epoch": 4056} {"train_loss": -26.260358810424805, "global_step": 336722, "epoch": 4056} {"train_loss": -25.908100128173828, "global_step": 336723, "epoch": 4056} {"train_loss": -26.245298385620117, "global_step": 336724, "epoch": 4056} {"train_loss": -26.26861000061035, "global_step": 336725, "epoch": 4056} {"train_loss": -26.18235206604004, "global_step": 336726, "epoch": 4056} {"train_loss": -26.299036026000977, "global_step": 336727, "epoch": 4056} {"train_loss": -26.34731101989746, "global_step": 336728, "epoch": 4056} {"train_loss": -26.165069580078125, "global_step": 336729, "epoch": 4056} {"train_loss": -25.931540937308807, "global_step": 336730, "epoch": 4056, "val_loss": 6704374.0} {"train_loss": -25.530813217163086, "global_step": 336731, "epoch": 4057} {"train_loss": -25.62282371520996, "global_step": 336732, "epoch": 4057} {"train_loss": -25.576419830322266, "global_step": 336733, "epoch": 4057} {"train_loss": -25.883331298828125, "global_step": 336734, "epoch": 4057} {"train_loss": -25.546274185180664, "global_step": 336735, "epoch": 4057} {"train_loss": -25.85169792175293, "global_step": 336736, "epoch": 4057} {"train_loss": -25.818450927734375, "global_step": 336737, "epoch": 4057} {"train_loss": -25.70184326171875, "global_step": 336738, "epoch": 4057} {"train_loss": -25.88716697692871, "global_step": 336739, "epoch": 4057} {"train_loss": -25.9246768951416, "global_step": 336740, "epoch": 4057} {"train_loss": -25.29229736328125, "global_step": 336741, "epoch": 4057} {"train_loss": -25.867334365844727, "global_step": 336742, "epoch": 4057} {"train_loss": -25.74045181274414, "global_step": 336743, "epoch": 4057} {"train_loss": -26.075307846069336, "global_step": 336744, "epoch": 4057} {"train_loss": -25.825946807861328, "global_step": 336745, "epoch": 4057} {"train_loss": -25.8631534576416, "global_step": 336746, "epoch": 4057} {"train_loss": -26.30908203125, "global_step": 336747, "epoch": 4057} {"train_loss": -25.947757720947266, "global_step": 336748, "epoch": 4057} {"train_loss": -25.836872100830078, "global_step": 336749, "epoch": 4057} {"train_loss": -25.674488067626953, "global_step": 336750, "epoch": 4057} {"train_loss": -25.96294593811035, "global_step": 336751, "epoch": 4057} {"train_loss": -25.927417755126953, "global_step": 336752, "epoch": 4057} {"train_loss": -25.768041610717773, "global_step": 336753, "epoch": 4057} {"train_loss": -25.986957550048828, "global_step": 336754, "epoch": 4057} {"train_loss": -25.92837905883789, "global_step": 336755, "epoch": 4057} {"train_loss": -25.977649688720703, "global_step": 336756, "epoch": 4057} {"train_loss": -25.909452438354492, "global_step": 336757, "epoch": 4057} {"train_loss": -26.12373161315918, "global_step": 336758, "epoch": 4057} {"train_loss": -26.083642959594727, "global_step": 336759, "epoch": 4057} {"train_loss": -26.214618682861328, "global_step": 336760, "epoch": 4057} {"train_loss": -26.20295524597168, "global_step": 336761, "epoch": 4057} {"train_loss": -26.269916534423828, "global_step": 336762, "epoch": 4057} {"train_loss": -25.81013298034668, "global_step": 336763, "epoch": 4057} {"train_loss": -26.26436424255371, "global_step": 336764, "epoch": 4057} {"train_loss": -26.149072647094727, "global_step": 336765, "epoch": 4057} {"train_loss": -25.8284969329834, "global_step": 336766, "epoch": 4057} {"train_loss": -26.39084243774414, "global_step": 336767, "epoch": 4057} {"train_loss": -26.04768180847168, "global_step": 336768, "epoch": 4057} {"train_loss": -26.028390884399414, "global_step": 336769, "epoch": 4057} {"train_loss": -26.191360473632812, "global_step": 336770, "epoch": 4057} {"train_loss": -25.932147979736328, "global_step": 336771, "epoch": 4057} {"train_loss": -25.966506958007812, "global_step": 336772, "epoch": 4057} {"train_loss": -26.237646102905273, "global_step": 336773, "epoch": 4057} {"train_loss": -25.879886627197266, "global_step": 336774, "epoch": 4057} {"train_loss": -26.174530029296875, "global_step": 336775, "epoch": 4057} {"train_loss": -26.07319450378418, "global_step": 336776, "epoch": 4057} {"train_loss": -26.354089736938477, "global_step": 336777, "epoch": 4057} {"train_loss": -25.694360733032227, "global_step": 336778, "epoch": 4057} {"train_loss": -25.7041015625, "global_step": 336779, "epoch": 4057} {"train_loss": -26.27326011657715, "global_step": 336780, "epoch": 4057} {"train_loss": -26.30679702758789, "global_step": 336781, "epoch": 4057} {"train_loss": -26.28449058532715, "global_step": 336782, "epoch": 4057} {"train_loss": -26.275205612182617, "global_step": 336783, "epoch": 4057} {"train_loss": -26.341064453125, "global_step": 336784, "epoch": 4057} {"train_loss": -26.193883895874023, "global_step": 336785, "epoch": 4057} {"train_loss": -26.09016990661621, "global_step": 336786, "epoch": 4057} {"train_loss": -26.34247398376465, "global_step": 336787, "epoch": 4057} {"train_loss": -25.86957359313965, "global_step": 336788, "epoch": 4057} {"train_loss": -26.28586769104004, "global_step": 336789, "epoch": 4057} {"train_loss": -26.294153213500977, "global_step": 336790, "epoch": 4057} {"train_loss": -26.088733673095703, "global_step": 336791, "epoch": 4057} {"train_loss": -26.0601749420166, "global_step": 336792, "epoch": 4057} {"train_loss": -26.058446884155273, "global_step": 336793, "epoch": 4057} {"train_loss": -25.983966827392578, "global_step": 336794, "epoch": 4057} {"train_loss": -25.914093017578125, "global_step": 336795, "epoch": 4057} {"train_loss": -26.203659057617188, "global_step": 336796, "epoch": 4057} {"train_loss": -25.853290557861328, "global_step": 336797, "epoch": 4057} {"train_loss": -26.201797485351562, "global_step": 336798, "epoch": 4057} {"train_loss": -26.290943145751953, "global_step": 336799, "epoch": 4057} {"train_loss": -26.050535202026367, "global_step": 336800, "epoch": 4057} {"train_loss": -26.435705184936523, "global_step": 336801, "epoch": 4057} {"train_loss": -25.90509605407715, "global_step": 336802, "epoch": 4057} {"train_loss": -26.212310791015625, "global_step": 336803, "epoch": 4057} {"train_loss": -25.812402725219727, "global_step": 336804, "epoch": 4057} {"train_loss": -26.16591453552246, "global_step": 336805, "epoch": 4057} {"train_loss": -25.81318473815918, "global_step": 336806, "epoch": 4057} {"train_loss": -26.344928741455078, "global_step": 336807, "epoch": 4057} {"train_loss": -26.13654899597168, "global_step": 336808, "epoch": 4057} {"train_loss": -25.878833770751953, "global_step": 336809, "epoch": 4057} {"train_loss": -26.101449966430664, "global_step": 336810, "epoch": 4057} {"train_loss": -26.351652145385742, "global_step": 336811, "epoch": 4057} {"train_loss": -25.984357833862305, "global_step": 336812, "epoch": 4057} {"train_loss": -26.013380556221467, "global_step": 336813, "epoch": 4057, "val_loss": 6739855.5} {"train_loss": -25.31454849243164, "global_step": 336814, "epoch": 4058} {"train_loss": -22.5911922454834, "global_step": 336815, "epoch": 4058} {"train_loss": -22.69635009765625, "global_step": 336816, "epoch": 4058} {"train_loss": -25.161540985107422, "global_step": 336817, "epoch": 4058} {"train_loss": -24.34734535217285, "global_step": 336818, "epoch": 4058} {"train_loss": -24.809911727905273, "global_step": 336819, "epoch": 4058} {"train_loss": -24.471399307250977, "global_step": 336820, "epoch": 4058} {"train_loss": -24.927473068237305, "global_step": 336821, "epoch": 4058} {"train_loss": -25.409503936767578, "global_step": 336822, "epoch": 4058} {"train_loss": -24.74612808227539, "global_step": 336823, "epoch": 4058} {"train_loss": -25.236160278320312, "global_step": 336824, "epoch": 4058} {"train_loss": -25.20153045654297, "global_step": 336825, "epoch": 4058} {"train_loss": -25.639429092407227, "global_step": 336826, "epoch": 4058} {"train_loss": -24.990419387817383, "global_step": 336827, "epoch": 4058} {"train_loss": -25.32928466796875, "global_step": 336828, "epoch": 4058} {"train_loss": -25.12666130065918, "global_step": 336829, "epoch": 4058} {"train_loss": -25.310102462768555, "global_step": 336830, "epoch": 4058} {"train_loss": -25.15316390991211, "global_step": 336831, "epoch": 4058} {"train_loss": -25.50946617126465, "global_step": 336832, "epoch": 4058} {"train_loss": -25.384801864624023, "global_step": 336833, "epoch": 4058} {"train_loss": -25.148130416870117, "global_step": 336834, "epoch": 4058} {"train_loss": -25.542943954467773, "global_step": 336835, "epoch": 4058} {"train_loss": -25.23761558532715, "global_step": 336836, "epoch": 4058} {"train_loss": -25.189611434936523, "global_step": 336837, "epoch": 4058} {"train_loss": -25.268529891967773, "global_step": 336838, "epoch": 4058} {"train_loss": -25.913488388061523, "global_step": 336839, "epoch": 4058} {"train_loss": -25.5413875579834, "global_step": 336840, "epoch": 4058} {"train_loss": -25.001483917236328, "global_step": 336841, "epoch": 4058} {"train_loss": -25.691450119018555, "global_step": 336842, "epoch": 4058} {"train_loss": -25.625659942626953, "global_step": 336843, "epoch": 4058} {"train_loss": -25.953720092773438, "global_step": 336844, "epoch": 4058} {"train_loss": -25.913532257080078, "global_step": 336845, "epoch": 4058} {"train_loss": -25.70904541015625, "global_step": 336846, "epoch": 4058} {"train_loss": -25.921802520751953, "global_step": 336847, "epoch": 4058} {"train_loss": -25.85355567932129, "global_step": 336848, "epoch": 4058} {"train_loss": -25.735342025756836, "global_step": 336849, "epoch": 4058} {"train_loss": -25.686365127563477, "global_step": 336850, "epoch": 4058} {"train_loss": -25.76372718811035, "global_step": 336851, "epoch": 4058} {"train_loss": -26.068267822265625, "global_step": 336852, "epoch": 4058} {"train_loss": -25.820173263549805, "global_step": 336853, "epoch": 4058} {"train_loss": -25.9023494720459, "global_step": 336854, "epoch": 4058} {"train_loss": -25.926361083984375, "global_step": 336855, "epoch": 4058} {"train_loss": -26.00541114807129, "global_step": 336856, "epoch": 4058} {"train_loss": -25.959131240844727, "global_step": 336857, "epoch": 4058} {"train_loss": -26.320615768432617, "global_step": 336858, "epoch": 4058} {"train_loss": -25.8485107421875, "global_step": 336859, "epoch": 4058} {"train_loss": -26.311201095581055, "global_step": 336860, "epoch": 4058} {"train_loss": -26.064123153686523, "global_step": 336861, "epoch": 4058} {"train_loss": -25.979740142822266, "global_step": 336862, "epoch": 4058} {"train_loss": -26.10442543029785, "global_step": 336863, "epoch": 4058} {"train_loss": -26.190763473510742, "global_step": 336864, "epoch": 4058} {"train_loss": -26.05921745300293, "global_step": 336865, "epoch": 4058} {"train_loss": -26.29729652404785, "global_step": 336866, "epoch": 4058} {"train_loss": -26.099807739257812, "global_step": 336867, "epoch": 4058} {"train_loss": -26.012786865234375, "global_step": 336868, "epoch": 4058} {"train_loss": -26.352527618408203, "global_step": 336869, "epoch": 4058} {"train_loss": -25.938764572143555, "global_step": 336870, "epoch": 4058} {"train_loss": -26.089330673217773, "global_step": 336871, "epoch": 4058} {"train_loss": -26.381412506103516, "global_step": 336872, "epoch": 4058} {"train_loss": -26.052814483642578, "global_step": 336873, "epoch": 4058} {"train_loss": -25.995487213134766, "global_step": 336874, "epoch": 4058} {"train_loss": -26.17098045349121, "global_step": 336875, "epoch": 4058} {"train_loss": -26.40455436706543, "global_step": 336876, "epoch": 4058} {"train_loss": -26.123498916625977, "global_step": 336877, "epoch": 4058} {"train_loss": -25.935871124267578, "global_step": 336878, "epoch": 4058} {"train_loss": -26.3258113861084, "global_step": 336879, "epoch": 4058} {"train_loss": -25.965911865234375, "global_step": 336880, "epoch": 4058} {"train_loss": -26.226078033447266, "global_step": 336881, "epoch": 4058} {"train_loss": -26.320837020874023, "global_step": 336882, "epoch": 4058} {"train_loss": -25.920806884765625, "global_step": 336883, "epoch": 4058} {"train_loss": -26.26923179626465, "global_step": 336884, "epoch": 4058} {"train_loss": -26.362340927124023, "global_step": 336885, "epoch": 4058} {"train_loss": -26.38818359375, "global_step": 336886, "epoch": 4058} {"train_loss": -26.245588302612305, "global_step": 336887, "epoch": 4058} {"train_loss": -26.345386505126953, "global_step": 336888, "epoch": 4058} {"train_loss": -26.653966903686523, "global_step": 336889, "epoch": 4058} {"train_loss": -26.434024810791016, "global_step": 336890, "epoch": 4058} {"train_loss": -26.155786514282227, "global_step": 336891, "epoch": 4058} {"train_loss": -26.1723690032959, "global_step": 336892, "epoch": 4058} {"train_loss": -26.107946395874023, "global_step": 336893, "epoch": 4058} {"train_loss": -26.311731338500977, "global_step": 336894, "epoch": 4058} {"train_loss": -26.51679801940918, "global_step": 336895, "epoch": 4058} {"train_loss": -25.71472076048334, "global_step": 336896, "epoch": 4058, "val_loss": 6746425.0} {"train_loss": -25.849706649780273, "global_step": 336897, "epoch": 4059} {"train_loss": -25.88393211364746, "global_step": 336898, "epoch": 4059} {"train_loss": -25.725317001342773, "global_step": 336899, "epoch": 4059} {"train_loss": -25.337217330932617, "global_step": 336900, "epoch": 4059} {"train_loss": -24.95159339904785, "global_step": 336901, "epoch": 4059} {"train_loss": -23.53363037109375, "global_step": 336902, "epoch": 4059} {"train_loss": -24.566938400268555, "global_step": 336903, "epoch": 4059} {"train_loss": -24.98095703125, "global_step": 336904, "epoch": 4059} {"train_loss": -24.582355499267578, "global_step": 336905, "epoch": 4059} {"train_loss": -24.250045776367188, "global_step": 336906, "epoch": 4059} {"train_loss": -25.392972946166992, "global_step": 336907, "epoch": 4059} {"train_loss": -25.015789031982422, "global_step": 336908, "epoch": 4059} {"train_loss": -24.628950119018555, "global_step": 336909, "epoch": 4059} {"train_loss": -25.213809967041016, "global_step": 336910, "epoch": 4059} {"train_loss": -24.95643424987793, "global_step": 336911, "epoch": 4059} {"train_loss": -25.10797119140625, "global_step": 336912, "epoch": 4059} {"train_loss": -25.573394775390625, "global_step": 336913, "epoch": 4059} {"train_loss": -25.341766357421875, "global_step": 336914, "epoch": 4059} {"train_loss": -25.396852493286133, "global_step": 336915, "epoch": 4059} {"train_loss": -25.616291046142578, "global_step": 336916, "epoch": 4059} {"train_loss": -25.26203727722168, "global_step": 336917, "epoch": 4059} {"train_loss": -25.521686553955078, "global_step": 336918, "epoch": 4059} {"train_loss": -25.496763229370117, "global_step": 336919, "epoch": 4059} {"train_loss": -25.922998428344727, "global_step": 336920, "epoch": 4059} {"train_loss": -25.52800750732422, "global_step": 336921, "epoch": 4059} {"train_loss": -25.77092933654785, "global_step": 336922, "epoch": 4059} {"train_loss": -25.16287612915039, "global_step": 336923, "epoch": 4059} {"train_loss": -25.656116485595703, "global_step": 336924, "epoch": 4059} {"train_loss": -25.789113998413086, "global_step": 336925, "epoch": 4059} {"train_loss": -25.646085739135742, "global_step": 336926, "epoch": 4059} {"train_loss": -26.0587215423584, "global_step": 336927, "epoch": 4059} {"train_loss": -25.7425537109375, "global_step": 336928, "epoch": 4059} {"train_loss": -25.908472061157227, "global_step": 336929, "epoch": 4059} {"train_loss": -25.680133819580078, "global_step": 336930, "epoch": 4059} {"train_loss": -25.761585235595703, "global_step": 336931, "epoch": 4059} {"train_loss": -25.94000816345215, "global_step": 336932, "epoch": 4059} {"train_loss": -25.96498680114746, "global_step": 336933, "epoch": 4059} {"train_loss": -25.546480178833008, "global_step": 336934, "epoch": 4059} {"train_loss": -26.0377197265625, "global_step": 336935, "epoch": 4059} {"train_loss": -26.00725746154785, "global_step": 336936, "epoch": 4059} {"train_loss": -25.89727210998535, "global_step": 336937, "epoch": 4059} {"train_loss": -25.87188148498535, "global_step": 336938, "epoch": 4059} {"train_loss": -26.1134033203125, "global_step": 336939, "epoch": 4059} {"train_loss": -26.03594398498535, "global_step": 336940, "epoch": 4059} {"train_loss": -25.82561683654785, "global_step": 336941, "epoch": 4059} {"train_loss": -26.170917510986328, "global_step": 336942, "epoch": 4059} {"train_loss": -26.130640029907227, "global_step": 336943, "epoch": 4059} {"train_loss": -25.8880615234375, "global_step": 336944, "epoch": 4059} {"train_loss": -26.252334594726562, "global_step": 336945, "epoch": 4059} {"train_loss": -25.993566513061523, "global_step": 336946, "epoch": 4059} {"train_loss": -26.325422286987305, "global_step": 336947, "epoch": 4059} {"train_loss": -26.19976806640625, "global_step": 336948, "epoch": 4059} {"train_loss": -25.763456344604492, "global_step": 336949, "epoch": 4059} {"train_loss": -26.211362838745117, "global_step": 336950, "epoch": 4059} {"train_loss": -26.37891960144043, "global_step": 336951, "epoch": 4059} {"train_loss": -25.906391143798828, "global_step": 336952, "epoch": 4059} {"train_loss": -26.243854522705078, "global_step": 336953, "epoch": 4059} {"train_loss": -26.301969528198242, "global_step": 336954, "epoch": 4059} {"train_loss": -26.07404136657715, "global_step": 336955, "epoch": 4059} {"train_loss": -26.179996490478516, "global_step": 336956, "epoch": 4059} {"train_loss": -25.820337295532227, "global_step": 336957, "epoch": 4059} {"train_loss": -26.19419288635254, "global_step": 336958, "epoch": 4059} {"train_loss": -26.2993221282959, "global_step": 336959, "epoch": 4059} {"train_loss": -26.154682159423828, "global_step": 336960, "epoch": 4059} {"train_loss": -26.263065338134766, "global_step": 336961, "epoch": 4059} {"train_loss": -26.18523597717285, "global_step": 336962, "epoch": 4059} {"train_loss": -26.014368057250977, "global_step": 336963, "epoch": 4059} {"train_loss": -26.17850685119629, "global_step": 336964, "epoch": 4059} {"train_loss": -26.070356369018555, "global_step": 336965, "epoch": 4059} {"train_loss": -26.400915145874023, "global_step": 336966, "epoch": 4059} {"train_loss": -26.163135528564453, "global_step": 336967, "epoch": 4059} {"train_loss": -26.176069259643555, "global_step": 336968, "epoch": 4059} {"train_loss": -26.500534057617188, "global_step": 336969, "epoch": 4059} {"train_loss": -26.133625030517578, "global_step": 336970, "epoch": 4059} {"train_loss": -26.281387329101562, "global_step": 336971, "epoch": 4059} {"train_loss": -26.25984001159668, "global_step": 336972, "epoch": 4059} {"train_loss": -25.97509765625, "global_step": 336973, "epoch": 4059} {"train_loss": -26.427820205688477, "global_step": 336974, "epoch": 4059} {"train_loss": -26.40486717224121, "global_step": 336975, "epoch": 4059} {"train_loss": -26.32600975036621, "global_step": 336976, "epoch": 4059} {"train_loss": -26.23052978515625, "global_step": 336977, "epoch": 4059} {"train_loss": -26.19656753540039, "global_step": 336978, "epoch": 4059} {"train_loss": -25.76701446900885, "global_step": 336979, "epoch": 4059, "val_loss": 6765970.0} {"train_loss": -25.74462890625, "global_step": 336980, "epoch": 4060} {"train_loss": -25.601333618164062, "global_step": 336981, "epoch": 4060} {"train_loss": -26.10991859436035, "global_step": 336982, "epoch": 4060} {"train_loss": -25.556276321411133, "global_step": 336983, "epoch": 4060} {"train_loss": -25.448469161987305, "global_step": 336984, "epoch": 4060} {"train_loss": -26.03729248046875, "global_step": 336985, "epoch": 4060} {"train_loss": -25.656126022338867, "global_step": 336986, "epoch": 4060} {"train_loss": -25.676319122314453, "global_step": 336987, "epoch": 4060} {"train_loss": -26.092641830444336, "global_step": 336988, "epoch": 4060} {"train_loss": -25.488203048706055, "global_step": 336989, "epoch": 4060} {"train_loss": -25.63446044921875, "global_step": 336990, "epoch": 4060} {"train_loss": -25.629718780517578, "global_step": 336991, "epoch": 4060} {"train_loss": -25.855121612548828, "global_step": 336992, "epoch": 4060} {"train_loss": -25.86907386779785, "global_step": 336993, "epoch": 4060} {"train_loss": -25.563756942749023, "global_step": 336994, "epoch": 4060} {"train_loss": -25.970239639282227, "global_step": 336995, "epoch": 4060} {"train_loss": -25.496767044067383, "global_step": 336996, "epoch": 4060} {"train_loss": -25.8818359375, "global_step": 336997, "epoch": 4060} {"train_loss": -25.989917755126953, "global_step": 336998, "epoch": 4060} {"train_loss": -25.86224937438965, "global_step": 336999, "epoch": 4060} {"train_loss": -25.80047607421875, "global_step": 337000, "epoch": 4060} {"train_loss": -25.971485137939453, "global_step": 337001, "epoch": 4060} {"train_loss": -26.090988159179688, "global_step": 337002, "epoch": 4060} {"train_loss": -26.000629425048828, "global_step": 337003, "epoch": 4060} {"train_loss": -26.21512222290039, "global_step": 337004, "epoch": 4060} {"train_loss": -26.162038803100586, "global_step": 337005, "epoch": 4060} {"train_loss": -25.968725204467773, "global_step": 337006, "epoch": 4060} {"train_loss": -25.76714515686035, "global_step": 337007, "epoch": 4060} {"train_loss": -25.9300479888916, "global_step": 337008, "epoch": 4060} {"train_loss": -25.737548828125, "global_step": 337009, "epoch": 4060} {"train_loss": -26.01865005493164, "global_step": 337010, "epoch": 4060} {"train_loss": -25.78973388671875, "global_step": 337011, "epoch": 4060} {"train_loss": -25.855627059936523, "global_step": 337012, "epoch": 4060} {"train_loss": -26.271656036376953, "global_step": 337013, "epoch": 4060} {"train_loss": -26.170551300048828, "global_step": 337014, "epoch": 4060} {"train_loss": -25.9785213470459, "global_step": 337015, "epoch": 4060} {"train_loss": -26.134313583374023, "global_step": 337016, "epoch": 4060} {"train_loss": -25.72979164123535, "global_step": 337017, "epoch": 4060} {"train_loss": -26.216482162475586, "global_step": 337018, "epoch": 4060} {"train_loss": -26.34730339050293, "global_step": 337019, "epoch": 4060} {"train_loss": -25.807287216186523, "global_step": 337020, "epoch": 4060} {"train_loss": -26.368762969970703, "global_step": 337021, "epoch": 4060} {"train_loss": -26.334070205688477, "global_step": 337022, "epoch": 4060} {"train_loss": -25.716367721557617, "global_step": 337023, "epoch": 4060} {"train_loss": -25.958988189697266, "global_step": 337024, "epoch": 4060} {"train_loss": -25.910369873046875, "global_step": 337025, "epoch": 4060} {"train_loss": -25.7551212310791, "global_step": 337026, "epoch": 4060} {"train_loss": -26.16912269592285, "global_step": 337027, "epoch": 4060} {"train_loss": -26.296039581298828, "global_step": 337028, "epoch": 4060} {"train_loss": -26.13591957092285, "global_step": 337029, "epoch": 4060} {"train_loss": -26.305511474609375, "global_step": 337030, "epoch": 4060} {"train_loss": -26.03304100036621, "global_step": 337031, "epoch": 4060} {"train_loss": -25.994842529296875, "global_step": 337032, "epoch": 4060} {"train_loss": -26.228729248046875, "global_step": 337033, "epoch": 4060} {"train_loss": -26.063129425048828, "global_step": 337034, "epoch": 4060} {"train_loss": -26.17148780822754, "global_step": 337035, "epoch": 4060} {"train_loss": -26.53740882873535, "global_step": 337036, "epoch": 4060} {"train_loss": -26.07684898376465, "global_step": 337037, "epoch": 4060} {"train_loss": -26.049955368041992, "global_step": 337038, "epoch": 4060} {"train_loss": -25.63515281677246, "global_step": 337039, "epoch": 4060} {"train_loss": -26.5677433013916, "global_step": 337040, "epoch": 4060} {"train_loss": -26.1514835357666, "global_step": 337041, "epoch": 4060} {"train_loss": -25.91371726989746, "global_step": 337042, "epoch": 4060} {"train_loss": -26.32216453552246, "global_step": 337043, "epoch": 4060} {"train_loss": -26.300100326538086, "global_step": 337044, "epoch": 4060} {"train_loss": -26.258426666259766, "global_step": 337045, "epoch": 4060} {"train_loss": -26.011917114257812, "global_step": 337046, "epoch": 4060} {"train_loss": -26.264148712158203, "global_step": 337047, "epoch": 4060} {"train_loss": -25.934864044189453, "global_step": 337048, "epoch": 4060} {"train_loss": -26.076461791992188, "global_step": 337049, "epoch": 4060} {"train_loss": -26.249481201171875, "global_step": 337050, "epoch": 4060} {"train_loss": -26.30621910095215, "global_step": 337051, "epoch": 4060} {"train_loss": -25.984756469726562, "global_step": 337052, "epoch": 4060} {"train_loss": -25.788837432861328, "global_step": 337053, "epoch": 4060} {"train_loss": -26.12349510192871, "global_step": 337054, "epoch": 4060} {"train_loss": -25.821386337280273, "global_step": 337055, "epoch": 4060} {"train_loss": -26.177082061767578, "global_step": 337056, "epoch": 4060} {"train_loss": -26.33881187438965, "global_step": 337057, "epoch": 4060} {"train_loss": -26.027149200439453, "global_step": 337058, "epoch": 4060} {"train_loss": -26.041534423828125, "global_step": 337059, "epoch": 4060} {"train_loss": -26.3797607421875, "global_step": 337060, "epoch": 4060} {"train_loss": -25.863500595092773, "global_step": 337061, "epoch": 4060} {"train_loss": -25.990693471517908, "global_step": 337062, "epoch": 4060, "val_loss": 6740241.0} {"train_loss": -25.59137535095215, "global_step": 337063, "epoch": 4061} {"train_loss": -25.36075782775879, "global_step": 337064, "epoch": 4061} {"train_loss": -25.607839584350586, "global_step": 337065, "epoch": 4061} {"train_loss": -24.903018951416016, "global_step": 337066, "epoch": 4061} {"train_loss": -25.155555725097656, "global_step": 337067, "epoch": 4061} {"train_loss": -25.925708770751953, "global_step": 337068, "epoch": 4061} {"train_loss": -25.37864112854004, "global_step": 337069, "epoch": 4061} {"train_loss": -25.7728214263916, "global_step": 337070, "epoch": 4061} {"train_loss": -25.7540283203125, "global_step": 337071, "epoch": 4061} {"train_loss": -25.482877731323242, "global_step": 337072, "epoch": 4061} {"train_loss": -25.929494857788086, "global_step": 337073, "epoch": 4061} {"train_loss": -25.5728759765625, "global_step": 337074, "epoch": 4061} {"train_loss": -25.78803825378418, "global_step": 337075, "epoch": 4061} {"train_loss": -25.522687911987305, "global_step": 337076, "epoch": 4061} {"train_loss": -25.814655303955078, "global_step": 337077, "epoch": 4061} {"train_loss": -25.6082706451416, "global_step": 337078, "epoch": 4061} {"train_loss": -25.92389488220215, "global_step": 337079, "epoch": 4061} {"train_loss": -25.667682647705078, "global_step": 337080, "epoch": 4061} {"train_loss": -26.0416259765625, "global_step": 337081, "epoch": 4061} {"train_loss": -26.224231719970703, "global_step": 337082, "epoch": 4061} {"train_loss": -26.119516372680664, "global_step": 337083, "epoch": 4061} {"train_loss": -25.68133544921875, "global_step": 337084, "epoch": 4061} {"train_loss": -25.797163009643555, "global_step": 337085, "epoch": 4061} {"train_loss": -25.83457374572754, "global_step": 337086, "epoch": 4061} {"train_loss": -26.125425338745117, "global_step": 337087, "epoch": 4061} {"train_loss": -25.817279815673828, "global_step": 337088, "epoch": 4061} {"train_loss": -25.8339900970459, "global_step": 337089, "epoch": 4061} {"train_loss": -26.013097763061523, "global_step": 337090, "epoch": 4061} {"train_loss": -26.141971588134766, "global_step": 337091, "epoch": 4061} {"train_loss": -26.183332443237305, "global_step": 337092, "epoch": 4061} {"train_loss": -26.112791061401367, "global_step": 337093, "epoch": 4061} {"train_loss": -26.085132598876953, "global_step": 337094, "epoch": 4061} {"train_loss": -25.9979190826416, "global_step": 337095, "epoch": 4061} {"train_loss": -26.398578643798828, "global_step": 337096, "epoch": 4061} {"train_loss": -26.233732223510742, "global_step": 337097, "epoch": 4061} {"train_loss": -26.1343936920166, "global_step": 337098, "epoch": 4061} {"train_loss": -26.155237197875977, "global_step": 337099, "epoch": 4061} {"train_loss": -26.004871368408203, "global_step": 337100, "epoch": 4061} {"train_loss": -26.490222930908203, "global_step": 337101, "epoch": 4061} {"train_loss": -26.204198837280273, "global_step": 337102, "epoch": 4061} {"train_loss": -26.278152465820312, "global_step": 337103, "epoch": 4061} {"train_loss": -26.39703369140625, "global_step": 337104, "epoch": 4061} {"train_loss": -26.272064208984375, "global_step": 337105, "epoch": 4061} {"train_loss": -26.24716567993164, "global_step": 337106, "epoch": 4061} {"train_loss": -26.170398712158203, "global_step": 337107, "epoch": 4061} {"train_loss": -26.16184425354004, "global_step": 337108, "epoch": 4061} {"train_loss": -25.964147567749023, "global_step": 337109, "epoch": 4061} {"train_loss": -26.253849029541016, "global_step": 337110, "epoch": 4061} {"train_loss": -25.7428035736084, "global_step": 337111, "epoch": 4061} {"train_loss": -26.23590660095215, "global_step": 337112, "epoch": 4061} {"train_loss": -26.05628776550293, "global_step": 337113, "epoch": 4061} {"train_loss": -26.139102935791016, "global_step": 337114, "epoch": 4061} {"train_loss": -26.347631454467773, "global_step": 337115, "epoch": 4061} {"train_loss": -26.43304443359375, "global_step": 337116, "epoch": 4061} {"train_loss": -25.604154586791992, "global_step": 337117, "epoch": 4061} {"train_loss": -25.156225204467773, "global_step": 337118, "epoch": 4061} {"train_loss": -24.20631217956543, "global_step": 337119, "epoch": 4061} {"train_loss": -24.777698516845703, "global_step": 337120, "epoch": 4061} {"train_loss": -25.88848304748535, "global_step": 337121, "epoch": 4061} {"train_loss": -25.8908634185791, "global_step": 337122, "epoch": 4061} {"train_loss": -26.281766891479492, "global_step": 337123, "epoch": 4061} {"train_loss": -25.654321670532227, "global_step": 337124, "epoch": 4061} {"train_loss": -26.040739059448242, "global_step": 337125, "epoch": 4061} {"train_loss": -26.1020565032959, "global_step": 337126, "epoch": 4061} {"train_loss": -25.792219161987305, "global_step": 337127, "epoch": 4061} {"train_loss": -25.374570846557617, "global_step": 337128, "epoch": 4061} {"train_loss": -25.953662872314453, "global_step": 337129, "epoch": 4061} {"train_loss": -25.837888717651367, "global_step": 337130, "epoch": 4061} {"train_loss": -25.68406105041504, "global_step": 337131, "epoch": 4061} {"train_loss": -25.824237823486328, "global_step": 337132, "epoch": 4061} {"train_loss": -25.46135902404785, "global_step": 337133, "epoch": 4061} {"train_loss": -25.746597290039062, "global_step": 337134, "epoch": 4061} {"train_loss": -25.571186065673828, "global_step": 337135, "epoch": 4061} {"train_loss": -26.08637046813965, "global_step": 337136, "epoch": 4061} {"train_loss": -26.184223175048828, "global_step": 337137, "epoch": 4061} {"train_loss": -25.930768966674805, "global_step": 337138, "epoch": 4061} {"train_loss": -26.079877853393555, "global_step": 337139, "epoch": 4061} {"train_loss": -25.652524948120117, "global_step": 337140, "epoch": 4061} {"train_loss": -26.126800537109375, "global_step": 337141, "epoch": 4061} {"train_loss": -26.089405059814453, "global_step": 337142, "epoch": 4061} {"train_loss": -25.90557861328125, "global_step": 337143, "epoch": 4061} {"train_loss": -25.87255859375, "global_step": 337144, "epoch": 4061} {"train_loss": -25.856021421501435, "global_step": 337145, "epoch": 4061, "val_loss": 6764468.0} {"train_loss": -25.64582633972168, "global_step": 337146, "epoch": 4062} {"train_loss": -25.703922271728516, "global_step": 337147, "epoch": 4062} {"train_loss": -26.0533504486084, "global_step": 337148, "epoch": 4062} {"train_loss": -25.288562774658203, "global_step": 337149, "epoch": 4062} {"train_loss": -25.793720245361328, "global_step": 337150, "epoch": 4062} {"train_loss": -25.433677673339844, "global_step": 337151, "epoch": 4062} {"train_loss": -25.548320770263672, "global_step": 337152, "epoch": 4062} {"train_loss": -26.011823654174805, "global_step": 337153, "epoch": 4062} {"train_loss": -26.153533935546875, "global_step": 337154, "epoch": 4062} {"train_loss": -25.790014266967773, "global_step": 337155, "epoch": 4062} {"train_loss": -25.89572525024414, "global_step": 337156, "epoch": 4062} {"train_loss": -25.70877456665039, "global_step": 337157, "epoch": 4062} {"train_loss": -25.875829696655273, "global_step": 337158, "epoch": 4062} {"train_loss": -25.58595085144043, "global_step": 337159, "epoch": 4062} {"train_loss": -25.978025436401367, "global_step": 337160, "epoch": 4062} {"train_loss": -26.090444564819336, "global_step": 337161, "epoch": 4062} {"train_loss": -25.983076095581055, "global_step": 337162, "epoch": 4062} {"train_loss": -25.968366622924805, "global_step": 337163, "epoch": 4062} {"train_loss": -25.84657096862793, "global_step": 337164, "epoch": 4062} {"train_loss": -26.181537628173828, "global_step": 337165, "epoch": 4062} {"train_loss": -25.954885482788086, "global_step": 337166, "epoch": 4062} {"train_loss": -25.774322509765625, "global_step": 337167, "epoch": 4062} {"train_loss": -25.764719009399414, "global_step": 337168, "epoch": 4062} {"train_loss": -26.481891632080078, "global_step": 337169, "epoch": 4062} {"train_loss": -25.96046257019043, "global_step": 337170, "epoch": 4062} {"train_loss": -25.641393661499023, "global_step": 337171, "epoch": 4062} {"train_loss": -26.09210777282715, "global_step": 337172, "epoch": 4062} {"train_loss": -26.191389083862305, "global_step": 337173, "epoch": 4062} {"train_loss": -25.957197189331055, "global_step": 337174, "epoch": 4062} {"train_loss": -26.13726234436035, "global_step": 337175, "epoch": 4062} {"train_loss": -26.37412452697754, "global_step": 337176, "epoch": 4062} {"train_loss": -26.046802520751953, "global_step": 337177, "epoch": 4062} {"train_loss": -26.197132110595703, "global_step": 337178, "epoch": 4062} {"train_loss": -26.280099868774414, "global_step": 337179, "epoch": 4062} {"train_loss": -26.250579833984375, "global_step": 337180, "epoch": 4062} {"train_loss": -26.186487197875977, "global_step": 337181, "epoch": 4062} {"train_loss": -26.00916862487793, "global_step": 337182, "epoch": 4062} {"train_loss": -26.0700626373291, "global_step": 337183, "epoch": 4062} {"train_loss": -26.145078659057617, "global_step": 337184, "epoch": 4062} {"train_loss": -25.953832626342773, "global_step": 337185, "epoch": 4062} {"train_loss": -25.801502227783203, "global_step": 337186, "epoch": 4062} {"train_loss": -25.99371337890625, "global_step": 337187, "epoch": 4062} {"train_loss": -26.16798973083496, "global_step": 337188, "epoch": 4062} {"train_loss": -26.3975772857666, "global_step": 337189, "epoch": 4062} {"train_loss": -26.172550201416016, "global_step": 337190, "epoch": 4062} {"train_loss": -26.276273727416992, "global_step": 337191, "epoch": 4062} {"train_loss": -26.309619903564453, "global_step": 337192, "epoch": 4062} {"train_loss": -25.939746856689453, "global_step": 337193, "epoch": 4062} {"train_loss": -26.395462036132812, "global_step": 337194, "epoch": 4062} {"train_loss": -26.25031852722168, "global_step": 337195, "epoch": 4062} {"train_loss": -26.0356388092041, "global_step": 337196, "epoch": 4062} {"train_loss": -26.141345977783203, "global_step": 337197, "epoch": 4062} {"train_loss": -26.3826904296875, "global_step": 337198, "epoch": 4062} {"train_loss": -25.86701774597168, "global_step": 337199, "epoch": 4062} {"train_loss": -26.614765167236328, "global_step": 337200, "epoch": 4062} {"train_loss": -25.838306427001953, "global_step": 337201, "epoch": 4062} {"train_loss": -26.04400062561035, "global_step": 337202, "epoch": 4062} {"train_loss": -26.306304931640625, "global_step": 337203, "epoch": 4062} {"train_loss": -26.23514747619629, "global_step": 337204, "epoch": 4062} {"train_loss": -26.141721725463867, "global_step": 337205, "epoch": 4062} {"train_loss": -26.25557518005371, "global_step": 337206, "epoch": 4062} {"train_loss": -26.154760360717773, "global_step": 337207, "epoch": 4062} {"train_loss": -26.0377140045166, "global_step": 337208, "epoch": 4062} {"train_loss": -26.3248348236084, "global_step": 337209, "epoch": 4062} {"train_loss": -26.2481746673584, "global_step": 337210, "epoch": 4062} {"train_loss": -26.38931655883789, "global_step": 337211, "epoch": 4062} {"train_loss": -25.974079132080078, "global_step": 337212, "epoch": 4062} {"train_loss": -26.084598541259766, "global_step": 337213, "epoch": 4062} {"train_loss": -26.213031768798828, "global_step": 337214, "epoch": 4062} {"train_loss": -26.0670166015625, "global_step": 337215, "epoch": 4062} {"train_loss": -26.337116241455078, "global_step": 337216, "epoch": 4062} {"train_loss": -26.047353744506836, "global_step": 337217, "epoch": 4062} {"train_loss": -25.55832862854004, "global_step": 337218, "epoch": 4062} {"train_loss": -25.617910385131836, "global_step": 337219, "epoch": 4062} {"train_loss": -25.869384765625, "global_step": 337220, "epoch": 4062} {"train_loss": -25.605924606323242, "global_step": 337221, "epoch": 4062} {"train_loss": -25.51767921447754, "global_step": 337222, "epoch": 4062} {"train_loss": -25.691486358642578, "global_step": 337223, "epoch": 4062} {"train_loss": -26.125486373901367, "global_step": 337224, "epoch": 4062} {"train_loss": -25.769582748413086, "global_step": 337225, "epoch": 4062} {"train_loss": -26.225439071655273, "global_step": 337226, "epoch": 4062} {"train_loss": -25.711181640625, "global_step": 337227, "epoch": 4062} {"train_loss": -26.015355673181006, "global_step": 337228, "epoch": 4062, "val_loss": 6853767.0} {"train_loss": -25.346250534057617, "global_step": 337229, "epoch": 4063} {"train_loss": -24.510421752929688, "global_step": 337230, "epoch": 4063} {"train_loss": -24.929401397705078, "global_step": 337231, "epoch": 4063} {"train_loss": -25.070146560668945, "global_step": 337232, "epoch": 4063} {"train_loss": -25.112293243408203, "global_step": 337233, "epoch": 4063} {"train_loss": -25.59634780883789, "global_step": 337234, "epoch": 4063} {"train_loss": -25.259140014648438, "global_step": 337235, "epoch": 4063} {"train_loss": -25.28582191467285, "global_step": 337236, "epoch": 4063} {"train_loss": -25.63776206970215, "global_step": 337237, "epoch": 4063} {"train_loss": -25.465452194213867, "global_step": 337238, "epoch": 4063} {"train_loss": -25.527265548706055, "global_step": 337239, "epoch": 4063} {"train_loss": -25.76837158203125, "global_step": 337240, "epoch": 4063} {"train_loss": -25.507009506225586, "global_step": 337241, "epoch": 4063} {"train_loss": -25.651113510131836, "global_step": 337242, "epoch": 4063} {"train_loss": -25.67500114440918, "global_step": 337243, "epoch": 4063} {"train_loss": -25.779993057250977, "global_step": 337244, "epoch": 4063} {"train_loss": -25.799482345581055, "global_step": 337245, "epoch": 4063} {"train_loss": -25.656766891479492, "global_step": 337246, "epoch": 4063} {"train_loss": -26.022388458251953, "global_step": 337247, "epoch": 4063} {"train_loss": -25.797657012939453, "global_step": 337248, "epoch": 4063} {"train_loss": -26.153722763061523, "global_step": 337249, "epoch": 4063} {"train_loss": -25.788715362548828, "global_step": 337250, "epoch": 4063} {"train_loss": -26.01157569885254, "global_step": 337251, "epoch": 4063} {"train_loss": -26.498960494995117, "global_step": 337252, "epoch": 4063} {"train_loss": -25.878564834594727, "global_step": 337253, "epoch": 4063} {"train_loss": -26.004968643188477, "global_step": 337254, "epoch": 4063} {"train_loss": -25.630218505859375, "global_step": 337255, "epoch": 4063} {"train_loss": -26.111602783203125, "global_step": 337256, "epoch": 4063} {"train_loss": -25.87271499633789, "global_step": 337257, "epoch": 4063} {"train_loss": -26.059955596923828, "global_step": 337258, "epoch": 4063} {"train_loss": -25.749755859375, "global_step": 337259, "epoch": 4063} {"train_loss": -26.048643112182617, "global_step": 337260, "epoch": 4063} {"train_loss": -26.081485748291016, "global_step": 337261, "epoch": 4063} {"train_loss": -25.98594093322754, "global_step": 337262, "epoch": 4063} {"train_loss": -26.210256576538086, "global_step": 337263, "epoch": 4063} {"train_loss": -26.2507381439209, "global_step": 337264, "epoch": 4063} {"train_loss": -26.190845489501953, "global_step": 337265, "epoch": 4063} {"train_loss": -26.295780181884766, "global_step": 337266, "epoch": 4063} {"train_loss": -26.348962783813477, "global_step": 337267, "epoch": 4063} {"train_loss": -26.628772735595703, "global_step": 337268, "epoch": 4063} {"train_loss": -25.988744735717773, "global_step": 337269, "epoch": 4063} {"train_loss": -26.196950912475586, "global_step": 337270, "epoch": 4063} {"train_loss": -25.963781356811523, "global_step": 337271, "epoch": 4063} {"train_loss": -25.855680465698242, "global_step": 337272, "epoch": 4063} {"train_loss": -25.90948486328125, "global_step": 337273, "epoch": 4063} {"train_loss": -26.217023849487305, "global_step": 337274, "epoch": 4063} {"train_loss": -25.94272232055664, "global_step": 337275, "epoch": 4063} {"train_loss": -26.001733779907227, "global_step": 337276, "epoch": 4063} {"train_loss": -26.281293869018555, "global_step": 337277, "epoch": 4063} {"train_loss": -25.8563232421875, "global_step": 337278, "epoch": 4063} {"train_loss": -26.037763595581055, "global_step": 337279, "epoch": 4063} {"train_loss": -26.44141960144043, "global_step": 337280, "epoch": 4063} {"train_loss": -26.201818466186523, "global_step": 337281, "epoch": 4063} {"train_loss": -25.942468643188477, "global_step": 337282, "epoch": 4063} {"train_loss": -26.171472549438477, "global_step": 337283, "epoch": 4063} {"train_loss": -26.295246124267578, "global_step": 337284, "epoch": 4063} {"train_loss": -26.381759643554688, "global_step": 337285, "epoch": 4063} {"train_loss": -26.4419002532959, "global_step": 337286, "epoch": 4063} {"train_loss": -26.13775634765625, "global_step": 337287, "epoch": 4063} {"train_loss": -26.181623458862305, "global_step": 337288, "epoch": 4063} {"train_loss": -26.52933120727539, "global_step": 337289, "epoch": 4063} {"train_loss": -25.7869930267334, "global_step": 337290, "epoch": 4063} {"train_loss": -25.43043327331543, "global_step": 337291, "epoch": 4063} {"train_loss": -25.254667282104492, "global_step": 337292, "epoch": 4063} {"train_loss": -25.875680923461914, "global_step": 337293, "epoch": 4063} {"train_loss": -26.20489501953125, "global_step": 337294, "epoch": 4063} {"train_loss": -26.080801010131836, "global_step": 337295, "epoch": 4063} {"train_loss": -25.352130889892578, "global_step": 337296, "epoch": 4063} {"train_loss": -25.14906120300293, "global_step": 337297, "epoch": 4063} {"train_loss": -25.831466674804688, "global_step": 337298, "epoch": 4063} {"train_loss": -25.804792404174805, "global_step": 337299, "epoch": 4063} {"train_loss": -25.6616268157959, "global_step": 337300, "epoch": 4063} {"train_loss": -25.74910545349121, "global_step": 337301, "epoch": 4063} {"train_loss": -25.816486358642578, "global_step": 337302, "epoch": 4063} {"train_loss": -24.992298126220703, "global_step": 337303, "epoch": 4063} {"train_loss": -25.354598999023438, "global_step": 337304, "epoch": 4063} {"train_loss": -25.67096519470215, "global_step": 337305, "epoch": 4063} {"train_loss": -25.43019676208496, "global_step": 337306, "epoch": 4063} {"train_loss": -25.86016273498535, "global_step": 337307, "epoch": 4063} {"train_loss": -25.984039306640625, "global_step": 337308, "epoch": 4063} {"train_loss": -25.869159698486328, "global_step": 337309, "epoch": 4063} {"train_loss": -25.894834518432617, "global_step": 337310, "epoch": 4063} {"train_loss": -25.832934873649872, "global_step": 337311, "epoch": 4063, "val_loss": 6759993.0} {"train_loss": -25.551170349121094, "global_step": 337312, "epoch": 4064} {"train_loss": -25.303604125976562, "global_step": 337313, "epoch": 4064} {"train_loss": -25.6813907623291, "global_step": 337314, "epoch": 4064} {"train_loss": -25.463369369506836, "global_step": 337315, "epoch": 4064} {"train_loss": -25.25229263305664, "global_step": 337316, "epoch": 4064} {"train_loss": -25.504470825195312, "global_step": 337317, "epoch": 4064} {"train_loss": -25.41096305847168, "global_step": 337318, "epoch": 4064} {"train_loss": -25.2097110748291, "global_step": 337319, "epoch": 4064} {"train_loss": -25.520721435546875, "global_step": 337320, "epoch": 4064} {"train_loss": -25.500102996826172, "global_step": 337321, "epoch": 4064} {"train_loss": -25.222625732421875, "global_step": 337322, "epoch": 4064} {"train_loss": -25.69331169128418, "global_step": 337323, "epoch": 4064} {"train_loss": -25.495962142944336, "global_step": 337324, "epoch": 4064} {"train_loss": -25.995960235595703, "global_step": 337325, "epoch": 4064} {"train_loss": -25.298242568969727, "global_step": 337326, "epoch": 4064} {"train_loss": -25.44122314453125, "global_step": 337327, "epoch": 4064} {"train_loss": -25.7849063873291, "global_step": 337328, "epoch": 4064} {"train_loss": -25.763263702392578, "global_step": 337329, "epoch": 4064} {"train_loss": -25.87388038635254, "global_step": 337330, "epoch": 4064} {"train_loss": -25.83904457092285, "global_step": 337331, "epoch": 4064} {"train_loss": -25.564592361450195, "global_step": 337332, "epoch": 4064} {"train_loss": -25.963903427124023, "global_step": 337333, "epoch": 4064} {"train_loss": -26.0942325592041, "global_step": 337334, "epoch": 4064} {"train_loss": -25.841794967651367, "global_step": 337335, "epoch": 4064} {"train_loss": -26.158203125, "global_step": 337336, "epoch": 4064} {"train_loss": -25.759674072265625, "global_step": 337337, "epoch": 4064} {"train_loss": -25.937213897705078, "global_step": 337338, "epoch": 4064} {"train_loss": -26.308862686157227, "global_step": 337339, "epoch": 4064} {"train_loss": -25.445283889770508, "global_step": 337340, "epoch": 4064} {"train_loss": -25.91364097595215, "global_step": 337341, "epoch": 4064} {"train_loss": -26.0595645904541, "global_step": 337342, "epoch": 4064} {"train_loss": -25.915807723999023, "global_step": 337343, "epoch": 4064} {"train_loss": -25.740936279296875, "global_step": 337344, "epoch": 4064} {"train_loss": -26.38091468811035, "global_step": 337345, "epoch": 4064} {"train_loss": -26.239273071289062, "global_step": 337346, "epoch": 4064} {"train_loss": -26.173315048217773, "global_step": 337347, "epoch": 4064} {"train_loss": -26.264684677124023, "global_step": 337348, "epoch": 4064} {"train_loss": -26.16438102722168, "global_step": 337349, "epoch": 4064} {"train_loss": -26.007648468017578, "global_step": 337350, "epoch": 4064} {"train_loss": -26.33440589904785, "global_step": 337351, "epoch": 4064} {"train_loss": -26.5213680267334, "global_step": 337352, "epoch": 4064} {"train_loss": -25.948598861694336, "global_step": 337353, "epoch": 4064} {"train_loss": -26.37798500061035, "global_step": 337354, "epoch": 4064} {"train_loss": -26.224218368530273, "global_step": 337355, "epoch": 4064} {"train_loss": -25.7791748046875, "global_step": 337356, "epoch": 4064} {"train_loss": -26.258655548095703, "global_step": 337357, "epoch": 4064} {"train_loss": -25.98894691467285, "global_step": 337358, "epoch": 4064} {"train_loss": -26.290042877197266, "global_step": 337359, "epoch": 4064} {"train_loss": -26.378259658813477, "global_step": 337360, "epoch": 4064} {"train_loss": -26.104169845581055, "global_step": 337361, "epoch": 4064} {"train_loss": -26.316328048706055, "global_step": 337362, "epoch": 4064} {"train_loss": -26.305158615112305, "global_step": 337363, "epoch": 4064} {"train_loss": -26.46592140197754, "global_step": 337364, "epoch": 4064} {"train_loss": -26.43269157409668, "global_step": 337365, "epoch": 4064} {"train_loss": -26.229312896728516, "global_step": 337366, "epoch": 4064} {"train_loss": -26.038806915283203, "global_step": 337367, "epoch": 4064} {"train_loss": -26.0697078704834, "global_step": 337368, "epoch": 4064} {"train_loss": -26.064178466796875, "global_step": 337369, "epoch": 4064} {"train_loss": -26.60206413269043, "global_step": 337370, "epoch": 4064} {"train_loss": -26.261693954467773, "global_step": 337371, "epoch": 4064} {"train_loss": -26.227588653564453, "global_step": 337372, "epoch": 4064} {"train_loss": -26.0568790435791, "global_step": 337373, "epoch": 4064} {"train_loss": -26.005285263061523, "global_step": 337374, "epoch": 4064} {"train_loss": -25.66391944885254, "global_step": 337375, "epoch": 4064} {"train_loss": -25.14131736755371, "global_step": 337376, "epoch": 4064} {"train_loss": -25.135343551635742, "global_step": 337377, "epoch": 4064} {"train_loss": -25.052087783813477, "global_step": 337378, "epoch": 4064} {"train_loss": -25.678735733032227, "global_step": 337379, "epoch": 4064} {"train_loss": -25.84845542907715, "global_step": 337380, "epoch": 4064} {"train_loss": -25.789764404296875, "global_step": 337381, "epoch": 4064} {"train_loss": -25.865705490112305, "global_step": 337382, "epoch": 4064} {"train_loss": -25.834936141967773, "global_step": 337383, "epoch": 4064} {"train_loss": -26.426319122314453, "global_step": 337384, "epoch": 4064} {"train_loss": -25.549949645996094, "global_step": 337385, "epoch": 4064} {"train_loss": -26.2513370513916, "global_step": 337386, "epoch": 4064} {"train_loss": -25.97198486328125, "global_step": 337387, "epoch": 4064} {"train_loss": -25.734228134155273, "global_step": 337388, "epoch": 4064} {"train_loss": -26.075109481811523, "global_step": 337389, "epoch": 4064} {"train_loss": -25.691333770751953, "global_step": 337390, "epoch": 4064} {"train_loss": -25.556121826171875, "global_step": 337391, "epoch": 4064} {"train_loss": -25.71070671081543, "global_step": 337392, "epoch": 4064} {"train_loss": -26.011194229125977, "global_step": 337393, "epoch": 4064} {"train_loss": -25.89584164447095, "global_step": 337394, "epoch": 4064, "val_loss": 6697314.0} {"train_loss": -25.934906005859375, "global_step": 337395, "epoch": 4065} {"train_loss": -25.59966278076172, "global_step": 337396, "epoch": 4065} {"train_loss": -25.683286666870117, "global_step": 337397, "epoch": 4065} {"train_loss": -25.512723922729492, "global_step": 337398, "epoch": 4065} {"train_loss": -25.414609909057617, "global_step": 337399, "epoch": 4065} {"train_loss": -25.406299591064453, "global_step": 337400, "epoch": 4065} {"train_loss": -26.158451080322266, "global_step": 337401, "epoch": 4065} {"train_loss": -25.054168701171875, "global_step": 337402, "epoch": 4065} {"train_loss": -25.829980850219727, "global_step": 337403, "epoch": 4065} {"train_loss": -25.680362701416016, "global_step": 337404, "epoch": 4065} {"train_loss": -25.523128509521484, "global_step": 337405, "epoch": 4065} {"train_loss": -26.27106285095215, "global_step": 337406, "epoch": 4065} {"train_loss": -25.805517196655273, "global_step": 337407, "epoch": 4065} {"train_loss": -25.900144577026367, "global_step": 337408, "epoch": 4065} {"train_loss": -25.805402755737305, "global_step": 337409, "epoch": 4065} {"train_loss": -25.818750381469727, "global_step": 337410, "epoch": 4065} {"train_loss": -25.975616455078125, "global_step": 337411, "epoch": 4065} {"train_loss": -25.87067985534668, "global_step": 337412, "epoch": 4065} {"train_loss": -26.054792404174805, "global_step": 337413, "epoch": 4065} {"train_loss": -25.997180938720703, "global_step": 337414, "epoch": 4065} {"train_loss": -25.42194938659668, "global_step": 337415, "epoch": 4065} {"train_loss": -25.84046745300293, "global_step": 337416, "epoch": 4065} {"train_loss": -26.098285675048828, "global_step": 337417, "epoch": 4065} {"train_loss": -26.21636962890625, "global_step": 337418, "epoch": 4065} {"train_loss": -25.86358642578125, "global_step": 337419, "epoch": 4065} {"train_loss": -26.160572052001953, "global_step": 337420, "epoch": 4065} {"train_loss": -26.100690841674805, "global_step": 337421, "epoch": 4065} {"train_loss": -26.19829750061035, "global_step": 337422, "epoch": 4065} {"train_loss": -25.86530113220215, "global_step": 337423, "epoch": 4065} {"train_loss": -25.978002548217773, "global_step": 337424, "epoch": 4065} {"train_loss": -25.951812744140625, "global_step": 337425, "epoch": 4065} {"train_loss": -26.000070571899414, "global_step": 337426, "epoch": 4065} {"train_loss": -26.323978424072266, "global_step": 337427, "epoch": 4065} {"train_loss": -26.380767822265625, "global_step": 337428, "epoch": 4065} {"train_loss": -25.99506187438965, "global_step": 337429, "epoch": 4065} {"train_loss": -26.22784996032715, "global_step": 337430, "epoch": 4065} {"train_loss": -26.279321670532227, "global_step": 337431, "epoch": 4065} {"train_loss": -25.887353897094727, "global_step": 337432, "epoch": 4065} {"train_loss": -25.663732528686523, "global_step": 337433, "epoch": 4065} {"train_loss": -26.131393432617188, "global_step": 337434, "epoch": 4065} {"train_loss": -26.10316276550293, "global_step": 337435, "epoch": 4065} {"train_loss": -26.01152992248535, "global_step": 337436, "epoch": 4065} {"train_loss": -25.89963722229004, "global_step": 337437, "epoch": 4065} {"train_loss": -26.192533493041992, "global_step": 337438, "epoch": 4065} {"train_loss": -26.4180965423584, "global_step": 337439, "epoch": 4065} {"train_loss": -25.44764518737793, "global_step": 337440, "epoch": 4065} {"train_loss": -25.850561141967773, "global_step": 337441, "epoch": 4065} {"train_loss": -26.400537490844727, "global_step": 337442, "epoch": 4065} {"train_loss": -26.185705184936523, "global_step": 337443, "epoch": 4065} {"train_loss": -25.931676864624023, "global_step": 337444, "epoch": 4065} {"train_loss": -26.107892990112305, "global_step": 337445, "epoch": 4065} {"train_loss": -26.076284408569336, "global_step": 337446, "epoch": 4065} {"train_loss": -26.419111251831055, "global_step": 337447, "epoch": 4065} {"train_loss": -26.477680206298828, "global_step": 337448, "epoch": 4065} {"train_loss": -26.205554962158203, "global_step": 337449, "epoch": 4065} {"train_loss": -26.0329647064209, "global_step": 337450, "epoch": 4065} {"train_loss": -26.493362426757812, "global_step": 337451, "epoch": 4065} {"train_loss": -26.686262130737305, "global_step": 337452, "epoch": 4065} {"train_loss": -26.255157470703125, "global_step": 337453, "epoch": 4065} {"train_loss": -26.33551025390625, "global_step": 337454, "epoch": 4065} {"train_loss": -26.09016227722168, "global_step": 337455, "epoch": 4065} {"train_loss": -26.05751609802246, "global_step": 337456, "epoch": 4065} {"train_loss": -26.66657829284668, "global_step": 337457, "epoch": 4065} {"train_loss": -26.14951515197754, "global_step": 337458, "epoch": 4065} {"train_loss": -26.037052154541016, "global_step": 337459, "epoch": 4065} {"train_loss": -26.442779541015625, "global_step": 337460, "epoch": 4065} {"train_loss": -25.87098503112793, "global_step": 337461, "epoch": 4065} {"train_loss": -26.03034019470215, "global_step": 337462, "epoch": 4065} {"train_loss": -26.2987060546875, "global_step": 337463, "epoch": 4065} {"train_loss": -26.236154556274414, "global_step": 337464, "epoch": 4065} {"train_loss": -26.3133602142334, "global_step": 337465, "epoch": 4065} {"train_loss": -26.376846313476562, "global_step": 337466, "epoch": 4065} {"train_loss": -26.30415153503418, "global_step": 337467, "epoch": 4065} {"train_loss": -26.338041305541992, "global_step": 337468, "epoch": 4065} {"train_loss": -25.98910903930664, "global_step": 337469, "epoch": 4065} {"train_loss": -25.793439865112305, "global_step": 337470, "epoch": 4065} {"train_loss": -25.691242218017578, "global_step": 337471, "epoch": 4065} {"train_loss": -26.183115005493164, "global_step": 337472, "epoch": 4065} {"train_loss": -26.20279884338379, "global_step": 337473, "epoch": 4065} {"train_loss": -25.728551864624023, "global_step": 337474, "epoch": 4065} {"train_loss": -26.010883331298828, "global_step": 337475, "epoch": 4065} {"train_loss": -25.47542953491211, "global_step": 337476, "epoch": 4065} {"train_loss": -26.00907098241599, "global_step": 337477, "epoch": 4065, "val_loss": 6840078.0} {"train_loss": -23.730066299438477, "global_step": 337478, "epoch": 4066} {"train_loss": -22.0854549407959, "global_step": 337479, "epoch": 4066} {"train_loss": -24.343908309936523, "global_step": 337480, "epoch": 4066} {"train_loss": -24.192045211791992, "global_step": 337481, "epoch": 4066} {"train_loss": -24.506383895874023, "global_step": 337482, "epoch": 4066} {"train_loss": -24.502410888671875, "global_step": 337483, "epoch": 4066} {"train_loss": -24.720584869384766, "global_step": 337484, "epoch": 4066} {"train_loss": -24.85100746154785, "global_step": 337485, "epoch": 4066} {"train_loss": -24.972944259643555, "global_step": 337486, "epoch": 4066} {"train_loss": -24.830223083496094, "global_step": 337487, "epoch": 4066} {"train_loss": -25.029630661010742, "global_step": 337488, "epoch": 4066} {"train_loss": -24.813709259033203, "global_step": 337489, "epoch": 4066} {"train_loss": -25.0965518951416, "global_step": 337490, "epoch": 4066} {"train_loss": -25.086811065673828, "global_step": 337491, "epoch": 4066} {"train_loss": -24.726879119873047, "global_step": 337492, "epoch": 4066} {"train_loss": -25.503311157226562, "global_step": 337493, "epoch": 4066} {"train_loss": -25.211761474609375, "global_step": 337494, "epoch": 4066} {"train_loss": -25.54230308532715, "global_step": 337495, "epoch": 4066} {"train_loss": -25.42315673828125, "global_step": 337496, "epoch": 4066} {"train_loss": -25.342443466186523, "global_step": 337497, "epoch": 4066} {"train_loss": -25.041515350341797, "global_step": 337498, "epoch": 4066} {"train_loss": -25.548349380493164, "global_step": 337499, "epoch": 4066} {"train_loss": -25.396291732788086, "global_step": 337500, "epoch": 4066} {"train_loss": -25.402496337890625, "global_step": 337501, "epoch": 4066} {"train_loss": -25.383291244506836, "global_step": 337502, "epoch": 4066} {"train_loss": -25.696630477905273, "global_step": 337503, "epoch": 4066} {"train_loss": -25.5443058013916, "global_step": 337504, "epoch": 4066} {"train_loss": -25.75272560119629, "global_step": 337505, "epoch": 4066} {"train_loss": -25.622350692749023, "global_step": 337506, "epoch": 4066} {"train_loss": -25.558996200561523, "global_step": 337507, "epoch": 4066} {"train_loss": -25.121112823486328, "global_step": 337508, "epoch": 4066} {"train_loss": -25.518177032470703, "global_step": 337509, "epoch": 4066} {"train_loss": -26.072656631469727, "global_step": 337510, "epoch": 4066} {"train_loss": -25.973363876342773, "global_step": 337511, "epoch": 4066} {"train_loss": -25.86524772644043, "global_step": 337512, "epoch": 4066} {"train_loss": -26.126920700073242, "global_step": 337513, "epoch": 4066} {"train_loss": -26.22161293029785, "global_step": 337514, "epoch": 4066} {"train_loss": -25.812841415405273, "global_step": 337515, "epoch": 4066} {"train_loss": -25.522085189819336, "global_step": 337516, "epoch": 4066} {"train_loss": -25.520755767822266, "global_step": 337517, "epoch": 4066} {"train_loss": -26.100934982299805, "global_step": 337518, "epoch": 4066} {"train_loss": -25.688312530517578, "global_step": 337519, "epoch": 4066} {"train_loss": -26.1350154876709, "global_step": 337520, "epoch": 4066} {"train_loss": -26.110706329345703, "global_step": 337521, "epoch": 4066} {"train_loss": -26.42170524597168, "global_step": 337522, "epoch": 4066} {"train_loss": -25.901508331298828, "global_step": 337523, "epoch": 4066} {"train_loss": -26.284631729125977, "global_step": 337524, "epoch": 4066} {"train_loss": -26.239545822143555, "global_step": 337525, "epoch": 4066} {"train_loss": -25.934467315673828, "global_step": 337526, "epoch": 4066} {"train_loss": -26.281713485717773, "global_step": 337527, "epoch": 4066} {"train_loss": -26.121479034423828, "global_step": 337528, "epoch": 4066} {"train_loss": -26.175378799438477, "global_step": 337529, "epoch": 4066} {"train_loss": -26.2652645111084, "global_step": 337530, "epoch": 4066} {"train_loss": -25.948078155517578, "global_step": 337531, "epoch": 4066} {"train_loss": -26.17280387878418, "global_step": 337532, "epoch": 4066} {"train_loss": -26.212665557861328, "global_step": 337533, "epoch": 4066} {"train_loss": -26.361581802368164, "global_step": 337534, "epoch": 4066} {"train_loss": -26.151437759399414, "global_step": 337535, "epoch": 4066} {"train_loss": -26.425373077392578, "global_step": 337536, "epoch": 4066} {"train_loss": -26.0683650970459, "global_step": 337537, "epoch": 4066} {"train_loss": -26.014612197875977, "global_step": 337538, "epoch": 4066} {"train_loss": -26.339675903320312, "global_step": 337539, "epoch": 4066} {"train_loss": -25.972919464111328, "global_step": 337540, "epoch": 4066} {"train_loss": -25.953149795532227, "global_step": 337541, "epoch": 4066} {"train_loss": -26.086851119995117, "global_step": 337542, "epoch": 4066} {"train_loss": -26.173547744750977, "global_step": 337543, "epoch": 4066} {"train_loss": -26.14841079711914, "global_step": 337544, "epoch": 4066} {"train_loss": -25.842737197875977, "global_step": 337545, "epoch": 4066} {"train_loss": -25.534500122070312, "global_step": 337546, "epoch": 4066} {"train_loss": -25.727262496948242, "global_step": 337547, "epoch": 4066} {"train_loss": -25.892560958862305, "global_step": 337548, "epoch": 4066} {"train_loss": -25.67230224609375, "global_step": 337549, "epoch": 4066} {"train_loss": -25.82404899597168, "global_step": 337550, "epoch": 4066} {"train_loss": -26.106882095336914, "global_step": 337551, "epoch": 4066} {"train_loss": -26.08282470703125, "global_step": 337552, "epoch": 4066} {"train_loss": -26.241918563842773, "global_step": 337553, "epoch": 4066} {"train_loss": -26.24726676940918, "global_step": 337554, "epoch": 4066} {"train_loss": -25.936304092407227, "global_step": 337555, "epoch": 4066} {"train_loss": -25.770322799682617, "global_step": 337556, "epoch": 4066} {"train_loss": -26.010725021362305, "global_step": 337557, "epoch": 4066} {"train_loss": -26.08097267150879, "global_step": 337558, "epoch": 4066} {"train_loss": -26.193084716796875, "global_step": 337559, "epoch": 4066} {"train_loss": -25.655720446483198, "global_step": 337560, "epoch": 4066, "val_loss": 6744726.0} {"train_loss": -24.98738670349121, "global_step": 337561, "epoch": 4067} {"train_loss": -24.549203872680664, "global_step": 337562, "epoch": 4067} {"train_loss": -25.31183433532715, "global_step": 337563, "epoch": 4067} {"train_loss": -25.649457931518555, "global_step": 337564, "epoch": 4067} {"train_loss": -24.734800338745117, "global_step": 337565, "epoch": 4067} {"train_loss": -25.801862716674805, "global_step": 337566, "epoch": 4067} {"train_loss": -25.181753158569336, "global_step": 337567, "epoch": 4067} {"train_loss": -25.78055763244629, "global_step": 337568, "epoch": 4067} {"train_loss": -25.225242614746094, "global_step": 337569, "epoch": 4067} {"train_loss": -26.088947296142578, "global_step": 337570, "epoch": 4067} {"train_loss": -25.616443634033203, "global_step": 337571, "epoch": 4067} {"train_loss": -25.397018432617188, "global_step": 337572, "epoch": 4067} {"train_loss": -25.539508819580078, "global_step": 337573, "epoch": 4067} {"train_loss": -25.60976219177246, "global_step": 337574, "epoch": 4067} {"train_loss": -25.298015594482422, "global_step": 337575, "epoch": 4067} {"train_loss": -25.7863712310791, "global_step": 337576, "epoch": 4067} {"train_loss": -25.570653915405273, "global_step": 337577, "epoch": 4067} {"train_loss": -25.757572174072266, "global_step": 337578, "epoch": 4067} {"train_loss": -25.934783935546875, "global_step": 337579, "epoch": 4067} {"train_loss": -25.748855590820312, "global_step": 337580, "epoch": 4067} {"train_loss": -26.339599609375, "global_step": 337581, "epoch": 4067} {"train_loss": -25.802839279174805, "global_step": 337582, "epoch": 4067} {"train_loss": -25.6115779876709, "global_step": 337583, "epoch": 4067} {"train_loss": -26.034717559814453, "global_step": 337584, "epoch": 4067} {"train_loss": -25.6752986907959, "global_step": 337585, "epoch": 4067} {"train_loss": -26.01143455505371, "global_step": 337586, "epoch": 4067} {"train_loss": -25.80573844909668, "global_step": 337587, "epoch": 4067} {"train_loss": -25.93452262878418, "global_step": 337588, "epoch": 4067} {"train_loss": -26.094898223876953, "global_step": 337589, "epoch": 4067} {"train_loss": -25.964101791381836, "global_step": 337590, "epoch": 4067} {"train_loss": -25.97635841369629, "global_step": 337591, "epoch": 4067} {"train_loss": -26.114099502563477, "global_step": 337592, "epoch": 4067} {"train_loss": -26.087921142578125, "global_step": 337593, "epoch": 4067} {"train_loss": -26.128469467163086, "global_step": 337594, "epoch": 4067} {"train_loss": -26.30278968811035, "global_step": 337595, "epoch": 4067} {"train_loss": -26.176593780517578, "global_step": 337596, "epoch": 4067} {"train_loss": -26.106595993041992, "global_step": 337597, "epoch": 4067} {"train_loss": -26.03618812561035, "global_step": 337598, "epoch": 4067} {"train_loss": -26.17231559753418, "global_step": 337599, "epoch": 4067} {"train_loss": -26.1174373626709, "global_step": 337600, "epoch": 4067} {"train_loss": -26.120498657226562, "global_step": 337601, "epoch": 4067} {"train_loss": -26.050739288330078, "global_step": 337602, "epoch": 4067} {"train_loss": -26.249713897705078, "global_step": 337603, "epoch": 4067} {"train_loss": -26.196516036987305, "global_step": 337604, "epoch": 4067} {"train_loss": -25.983978271484375, "global_step": 337605, "epoch": 4067} {"train_loss": -26.1101016998291, "global_step": 337606, "epoch": 4067} {"train_loss": -26.402978897094727, "global_step": 337607, "epoch": 4067} {"train_loss": -26.08648109436035, "global_step": 337608, "epoch": 4067} {"train_loss": -26.300342559814453, "global_step": 337609, "epoch": 4067} {"train_loss": -26.3289794921875, "global_step": 337610, "epoch": 4067} {"train_loss": -25.993606567382812, "global_step": 337611, "epoch": 4067} {"train_loss": -25.747007369995117, "global_step": 337612, "epoch": 4067} {"train_loss": -26.167272567749023, "global_step": 337613, "epoch": 4067} {"train_loss": -26.379913330078125, "global_step": 337614, "epoch": 4067} {"train_loss": -26.121692657470703, "global_step": 337615, "epoch": 4067} {"train_loss": -25.889001846313477, "global_step": 337616, "epoch": 4067} {"train_loss": -26.123559951782227, "global_step": 337617, "epoch": 4067} {"train_loss": -25.732166290283203, "global_step": 337618, "epoch": 4067} {"train_loss": -25.996891021728516, "global_step": 337619, "epoch": 4067} {"train_loss": -26.098005294799805, "global_step": 337620, "epoch": 4067} {"train_loss": -25.616424560546875, "global_step": 337621, "epoch": 4067} {"train_loss": -26.1256046295166, "global_step": 337622, "epoch": 4067} {"train_loss": -26.07667350769043, "global_step": 337623, "epoch": 4067} {"train_loss": -25.909704208374023, "global_step": 337624, "epoch": 4067} {"train_loss": -25.636255264282227, "global_step": 337625, "epoch": 4067} {"train_loss": -25.868682861328125, "global_step": 337626, "epoch": 4067} {"train_loss": -26.198837280273438, "global_step": 337627, "epoch": 4067} {"train_loss": -25.83562660217285, "global_step": 337628, "epoch": 4067} {"train_loss": -25.51422119140625, "global_step": 337629, "epoch": 4067} {"train_loss": -26.130895614624023, "global_step": 337630, "epoch": 4067} {"train_loss": -25.624460220336914, "global_step": 337631, "epoch": 4067} {"train_loss": -25.794042587280273, "global_step": 337632, "epoch": 4067} {"train_loss": -25.96945571899414, "global_step": 337633, "epoch": 4067} {"train_loss": -25.759992599487305, "global_step": 337634, "epoch": 4067} {"train_loss": -26.303083419799805, "global_step": 337635, "epoch": 4067} {"train_loss": -26.2520751953125, "global_step": 337636, "epoch": 4067} {"train_loss": -26.19874382019043, "global_step": 337637, "epoch": 4067} {"train_loss": -25.982038497924805, "global_step": 337638, "epoch": 4067} {"train_loss": -26.12689208984375, "global_step": 337639, "epoch": 4067} {"train_loss": -26.033544540405273, "global_step": 337640, "epoch": 4067} {"train_loss": -26.330963134765625, "global_step": 337641, "epoch": 4067} {"train_loss": -26.31440544128418, "global_step": 337642, "epoch": 4067} {"train_loss": -25.902684751763402, "global_step": 337643, "epoch": 4067, "val_loss": 6757127.5} {"train_loss": -25.811426162719727, "global_step": 337644, "epoch": 4068} {"train_loss": -25.315793991088867, "global_step": 337645, "epoch": 4068} {"train_loss": -26.039037704467773, "global_step": 337646, "epoch": 4068} {"train_loss": -26.001028060913086, "global_step": 337647, "epoch": 4068} {"train_loss": -25.897611618041992, "global_step": 337648, "epoch": 4068} {"train_loss": -25.805028915405273, "global_step": 337649, "epoch": 4068} {"train_loss": -25.78085708618164, "global_step": 337650, "epoch": 4068} {"train_loss": -25.738901138305664, "global_step": 337651, "epoch": 4068} {"train_loss": -25.7171573638916, "global_step": 337652, "epoch": 4068} {"train_loss": -25.935733795166016, "global_step": 337653, "epoch": 4068} {"train_loss": -25.912809371948242, "global_step": 337654, "epoch": 4068} {"train_loss": -25.77288818359375, "global_step": 337655, "epoch": 4068} {"train_loss": -26.155460357666016, "global_step": 337656, "epoch": 4068} {"train_loss": -25.948083877563477, "global_step": 337657, "epoch": 4068} {"train_loss": -25.88547134399414, "global_step": 337658, "epoch": 4068} {"train_loss": -25.987863540649414, "global_step": 337659, "epoch": 4068} {"train_loss": -26.063282012939453, "global_step": 337660, "epoch": 4068} {"train_loss": -25.682920455932617, "global_step": 337661, "epoch": 4068} {"train_loss": -26.180500030517578, "global_step": 337662, "epoch": 4068} {"train_loss": -26.007959365844727, "global_step": 337663, "epoch": 4068} {"train_loss": -25.963132858276367, "global_step": 337664, "epoch": 4068} {"train_loss": -25.8514404296875, "global_step": 337665, "epoch": 4068} {"train_loss": -26.02947998046875, "global_step": 337666, "epoch": 4068} {"train_loss": -26.133901596069336, "global_step": 337667, "epoch": 4068} {"train_loss": -26.116016387939453, "global_step": 337668, "epoch": 4068} {"train_loss": -26.222692489624023, "global_step": 337669, "epoch": 4068} {"train_loss": -26.05999755859375, "global_step": 337670, "epoch": 4068} {"train_loss": -26.050153732299805, "global_step": 337671, "epoch": 4068} {"train_loss": -26.114917755126953, "global_step": 337672, "epoch": 4068} {"train_loss": -25.884174346923828, "global_step": 337673, "epoch": 4068} {"train_loss": -26.28824234008789, "global_step": 337674, "epoch": 4068} {"train_loss": -26.100744247436523, "global_step": 337675, "epoch": 4068} {"train_loss": -25.976316452026367, "global_step": 337676, "epoch": 4068} {"train_loss": -25.80258560180664, "global_step": 337677, "epoch": 4068} {"train_loss": -25.781497955322266, "global_step": 337678, "epoch": 4068} {"train_loss": -26.11014175415039, "global_step": 337679, "epoch": 4068} {"train_loss": -25.716779708862305, "global_step": 337680, "epoch": 4068} {"train_loss": -26.30191421508789, "global_step": 337681, "epoch": 4068} {"train_loss": -26.410566329956055, "global_step": 337682, "epoch": 4068} {"train_loss": -26.24490737915039, "global_step": 337683, "epoch": 4068} {"train_loss": -25.905902862548828, "global_step": 337684, "epoch": 4068} {"train_loss": -26.137983322143555, "global_step": 337685, "epoch": 4068} {"train_loss": -26.08465003967285, "global_step": 337686, "epoch": 4068} {"train_loss": -25.781457901000977, "global_step": 337687, "epoch": 4068} {"train_loss": -25.863922119140625, "global_step": 337688, "epoch": 4068} {"train_loss": -25.689228057861328, "global_step": 337689, "epoch": 4068} {"train_loss": -25.835142135620117, "global_step": 337690, "epoch": 4068} {"train_loss": -25.784570693969727, "global_step": 337691, "epoch": 4068} {"train_loss": -26.091657638549805, "global_step": 337692, "epoch": 4068} {"train_loss": -26.103652954101562, "global_step": 337693, "epoch": 4068} {"train_loss": -25.8026180267334, "global_step": 337694, "epoch": 4068} {"train_loss": -26.00715446472168, "global_step": 337695, "epoch": 4068} {"train_loss": -25.794849395751953, "global_step": 337696, "epoch": 4068} {"train_loss": -25.707136154174805, "global_step": 337697, "epoch": 4068} {"train_loss": -25.9996337890625, "global_step": 337698, "epoch": 4068} {"train_loss": -25.96759033203125, "global_step": 337699, "epoch": 4068} {"train_loss": -25.68105125427246, "global_step": 337700, "epoch": 4068} {"train_loss": -25.86248779296875, "global_step": 337701, "epoch": 4068} {"train_loss": -26.02996253967285, "global_step": 337702, "epoch": 4068} {"train_loss": -25.791259765625, "global_step": 337703, "epoch": 4068} {"train_loss": -25.805831909179688, "global_step": 337704, "epoch": 4068} {"train_loss": -25.183727264404297, "global_step": 337705, "epoch": 4068} {"train_loss": -25.87237548828125, "global_step": 337706, "epoch": 4068} {"train_loss": -25.69950294494629, "global_step": 337707, "epoch": 4068} {"train_loss": -25.781396865844727, "global_step": 337708, "epoch": 4068} {"train_loss": -25.730344772338867, "global_step": 337709, "epoch": 4068} {"train_loss": -26.116857528686523, "global_step": 337710, "epoch": 4068} {"train_loss": -26.06147575378418, "global_step": 337711, "epoch": 4068} {"train_loss": -26.459043502807617, "global_step": 337712, "epoch": 4068} {"train_loss": -25.93202018737793, "global_step": 337713, "epoch": 4068} {"train_loss": -25.971494674682617, "global_step": 337714, "epoch": 4068} {"train_loss": -25.97596549987793, "global_step": 337715, "epoch": 4068} {"train_loss": -26.021413803100586, "global_step": 337716, "epoch": 4068} {"train_loss": -26.030378341674805, "global_step": 337717, "epoch": 4068} {"train_loss": -26.43192481994629, "global_step": 337718, "epoch": 4068} {"train_loss": -25.79172706604004, "global_step": 337719, "epoch": 4068} {"train_loss": -26.192813873291016, "global_step": 337720, "epoch": 4068} {"train_loss": -26.049091339111328, "global_step": 337721, "epoch": 4068} {"train_loss": -26.227420806884766, "global_step": 337722, "epoch": 4068} {"train_loss": -25.892684936523438, "global_step": 337723, "epoch": 4068} {"train_loss": -26.01502799987793, "global_step": 337724, "epoch": 4068} {"train_loss": -25.941381454467773, "global_step": 337725, "epoch": 4068} {"train_loss": -25.945379050381213, "global_step": 337726, "epoch": 4068, "val_loss": 6780629.0} {"train_loss": -26.337100982666016, "global_step": 337727, "epoch": 4069} {"train_loss": -25.26429557800293, "global_step": 337728, "epoch": 4069} {"train_loss": -26.13007926940918, "global_step": 337729, "epoch": 4069} {"train_loss": -25.334379196166992, "global_step": 337730, "epoch": 4069} {"train_loss": -25.429059982299805, "global_step": 337731, "epoch": 4069} {"train_loss": -26.057165145874023, "global_step": 337732, "epoch": 4069} {"train_loss": -25.53604507446289, "global_step": 337733, "epoch": 4069} {"train_loss": -25.55193519592285, "global_step": 337734, "epoch": 4069} {"train_loss": -26.100467681884766, "global_step": 337735, "epoch": 4069} {"train_loss": -25.274076461791992, "global_step": 337736, "epoch": 4069} {"train_loss": -25.682737350463867, "global_step": 337737, "epoch": 4069} {"train_loss": -25.868194580078125, "global_step": 337738, "epoch": 4069} {"train_loss": -26.09113883972168, "global_step": 337739, "epoch": 4069} {"train_loss": -25.649860382080078, "global_step": 337740, "epoch": 4069} {"train_loss": -26.14115333557129, "global_step": 337741, "epoch": 4069} {"train_loss": -25.93035888671875, "global_step": 337742, "epoch": 4069} {"train_loss": -26.088102340698242, "global_step": 337743, "epoch": 4069} {"train_loss": -25.96382713317871, "global_step": 337744, "epoch": 4069} {"train_loss": -25.671186447143555, "global_step": 337745, "epoch": 4069} {"train_loss": -25.640302658081055, "global_step": 337746, "epoch": 4069} {"train_loss": -25.783140182495117, "global_step": 337747, "epoch": 4069} {"train_loss": -26.20490074157715, "global_step": 337748, "epoch": 4069} {"train_loss": -25.497426986694336, "global_step": 337749, "epoch": 4069} {"train_loss": -25.952978134155273, "global_step": 337750, "epoch": 4069} {"train_loss": -25.56266212463379, "global_step": 337751, "epoch": 4069} {"train_loss": -26.498682022094727, "global_step": 337752, "epoch": 4069} {"train_loss": -26.141300201416016, "global_step": 337753, "epoch": 4069} {"train_loss": -26.39166831970215, "global_step": 337754, "epoch": 4069} {"train_loss": -25.984130859375, "global_step": 337755, "epoch": 4069} {"train_loss": -25.854618072509766, "global_step": 337756, "epoch": 4069} {"train_loss": -26.284372329711914, "global_step": 337757, "epoch": 4069} {"train_loss": -25.928577423095703, "global_step": 337758, "epoch": 4069} {"train_loss": -26.12884521484375, "global_step": 337759, "epoch": 4069} {"train_loss": -26.127410888671875, "global_step": 337760, "epoch": 4069} {"train_loss": -26.2215518951416, "global_step": 337761, "epoch": 4069} {"train_loss": -26.0459041595459, "global_step": 337762, "epoch": 4069} {"train_loss": -26.11334800720215, "global_step": 337763, "epoch": 4069} {"train_loss": -25.767118453979492, "global_step": 337764, "epoch": 4069} {"train_loss": -26.068777084350586, "global_step": 337765, "epoch": 4069} {"train_loss": -25.94622230529785, "global_step": 337766, "epoch": 4069} {"train_loss": -25.936935424804688, "global_step": 337767, "epoch": 4069} {"train_loss": -26.154279708862305, "global_step": 337768, "epoch": 4069} {"train_loss": -26.208486557006836, "global_step": 337769, "epoch": 4069} {"train_loss": -25.743162155151367, "global_step": 337770, "epoch": 4069} {"train_loss": -26.169071197509766, "global_step": 337771, "epoch": 4069} {"train_loss": -26.229055404663086, "global_step": 337772, "epoch": 4069} {"train_loss": -26.417816162109375, "global_step": 337773, "epoch": 4069} {"train_loss": -25.55284881591797, "global_step": 337774, "epoch": 4069} {"train_loss": -25.9439697265625, "global_step": 337775, "epoch": 4069} {"train_loss": -25.931549072265625, "global_step": 337776, "epoch": 4069} {"train_loss": -26.04633903503418, "global_step": 337777, "epoch": 4069} {"train_loss": -26.024946212768555, "global_step": 337778, "epoch": 4069} {"train_loss": -26.0493106842041, "global_step": 337779, "epoch": 4069} {"train_loss": -26.185821533203125, "global_step": 337780, "epoch": 4069} {"train_loss": -26.370084762573242, "global_step": 337781, "epoch": 4069} {"train_loss": -26.15854835510254, "global_step": 337782, "epoch": 4069} {"train_loss": -26.171924591064453, "global_step": 337783, "epoch": 4069} {"train_loss": -26.405866622924805, "global_step": 337784, "epoch": 4069} {"train_loss": -25.762022018432617, "global_step": 337785, "epoch": 4069} {"train_loss": -26.14145851135254, "global_step": 337786, "epoch": 4069} {"train_loss": -25.924787521362305, "global_step": 337787, "epoch": 4069} {"train_loss": -26.178308486938477, "global_step": 337788, "epoch": 4069} {"train_loss": -26.433990478515625, "global_step": 337789, "epoch": 4069} {"train_loss": -26.30811882019043, "global_step": 337790, "epoch": 4069} {"train_loss": -26.066354751586914, "global_step": 337791, "epoch": 4069} {"train_loss": -26.1653995513916, "global_step": 337792, "epoch": 4069} {"train_loss": -26.14763832092285, "global_step": 337793, "epoch": 4069} {"train_loss": -26.244735717773438, "global_step": 337794, "epoch": 4069} {"train_loss": -25.954010009765625, "global_step": 337795, "epoch": 4069} {"train_loss": -25.990034103393555, "global_step": 337796, "epoch": 4069} {"train_loss": -26.277450561523438, "global_step": 337797, "epoch": 4069} {"train_loss": -26.02594566345215, "global_step": 337798, "epoch": 4069} {"train_loss": -25.74952507019043, "global_step": 337799, "epoch": 4069} {"train_loss": -26.095630645751953, "global_step": 337800, "epoch": 4069} {"train_loss": -26.031494140625, "global_step": 337801, "epoch": 4069} {"train_loss": -26.005752563476562, "global_step": 337802, "epoch": 4069} {"train_loss": -25.922605514526367, "global_step": 337803, "epoch": 4069} {"train_loss": -25.81565284729004, "global_step": 337804, "epoch": 4069} {"train_loss": -26.1016902923584, "global_step": 337805, "epoch": 4069} {"train_loss": -26.099853515625, "global_step": 337806, "epoch": 4069} {"train_loss": -25.90576171875, "global_step": 337807, "epoch": 4069} {"train_loss": -26.630762100219727, "global_step": 337808, "epoch": 4069} {"train_loss": -26.005206923886956, "global_step": 337809, "epoch": 4069, "val_loss": 6810158.0} {"train_loss": -25.876001358032227, "global_step": 337810, "epoch": 4070} {"train_loss": -25.077646255493164, "global_step": 337811, "epoch": 4070} {"train_loss": -25.18439292907715, "global_step": 337812, "epoch": 4070} {"train_loss": -25.25979995727539, "global_step": 337813, "epoch": 4070} {"train_loss": -25.287342071533203, "global_step": 337814, "epoch": 4070} {"train_loss": -25.553449630737305, "global_step": 337815, "epoch": 4070} {"train_loss": -25.697019577026367, "global_step": 337816, "epoch": 4070} {"train_loss": -25.523405075073242, "global_step": 337817, "epoch": 4070} {"train_loss": -24.626949310302734, "global_step": 337818, "epoch": 4070} {"train_loss": -25.16694450378418, "global_step": 337819, "epoch": 4070} {"train_loss": -25.838300704956055, "global_step": 337820, "epoch": 4070} {"train_loss": -25.527868270874023, "global_step": 337821, "epoch": 4070} {"train_loss": -25.64765739440918, "global_step": 337822, "epoch": 4070} {"train_loss": -25.552505493164062, "global_step": 337823, "epoch": 4070} {"train_loss": -25.765161514282227, "global_step": 337824, "epoch": 4070} {"train_loss": -25.651020050048828, "global_step": 337825, "epoch": 4070} {"train_loss": -25.672266006469727, "global_step": 337826, "epoch": 4070} {"train_loss": -25.54006576538086, "global_step": 337827, "epoch": 4070} {"train_loss": -25.589658737182617, "global_step": 337828, "epoch": 4070} {"train_loss": -25.886585235595703, "global_step": 337829, "epoch": 4070} {"train_loss": -25.563108444213867, "global_step": 337830, "epoch": 4070} {"train_loss": -25.818933486938477, "global_step": 337831, "epoch": 4070} {"train_loss": -26.25152587890625, "global_step": 337832, "epoch": 4070} {"train_loss": -25.63740348815918, "global_step": 337833, "epoch": 4070} {"train_loss": -25.797327041625977, "global_step": 337834, "epoch": 4070} {"train_loss": -25.85652732849121, "global_step": 337835, "epoch": 4070} {"train_loss": -26.03595542907715, "global_step": 337836, "epoch": 4070} {"train_loss": -25.85552406311035, "global_step": 337837, "epoch": 4070} {"train_loss": -26.246612548828125, "global_step": 337838, "epoch": 4070} {"train_loss": -26.299219131469727, "global_step": 337839, "epoch": 4070} {"train_loss": -26.070682525634766, "global_step": 337840, "epoch": 4070} {"train_loss": -25.790985107421875, "global_step": 337841, "epoch": 4070} {"train_loss": -26.56879997253418, "global_step": 337842, "epoch": 4070} {"train_loss": -26.288183212280273, "global_step": 337843, "epoch": 4070} {"train_loss": -25.87325096130371, "global_step": 337844, "epoch": 4070} {"train_loss": -26.360279083251953, "global_step": 337845, "epoch": 4070} {"train_loss": -26.100019454956055, "global_step": 337846, "epoch": 4070} {"train_loss": -26.291473388671875, "global_step": 337847, "epoch": 4070} {"train_loss": -26.15056800842285, "global_step": 337848, "epoch": 4070} {"train_loss": -26.381784439086914, "global_step": 337849, "epoch": 4070} {"train_loss": -26.340627670288086, "global_step": 337850, "epoch": 4070} {"train_loss": -26.014816284179688, "global_step": 337851, "epoch": 4070} {"train_loss": -26.39283561706543, "global_step": 337852, "epoch": 4070} {"train_loss": -26.163877487182617, "global_step": 337853, "epoch": 4070} {"train_loss": -26.377344131469727, "global_step": 337854, "epoch": 4070} {"train_loss": -26.0756778717041, "global_step": 337855, "epoch": 4070} {"train_loss": -26.088809967041016, "global_step": 337856, "epoch": 4070} {"train_loss": -26.00355339050293, "global_step": 337857, "epoch": 4070} {"train_loss": -26.223295211791992, "global_step": 337858, "epoch": 4070} {"train_loss": -26.11960220336914, "global_step": 337859, "epoch": 4070} {"train_loss": -25.81694984436035, "global_step": 337860, "epoch": 4070} {"train_loss": -26.604578018188477, "global_step": 337861, "epoch": 4070} {"train_loss": -26.020898818969727, "global_step": 337862, "epoch": 4070} {"train_loss": -26.282855987548828, "global_step": 337863, "epoch": 4070} {"train_loss": -25.945287704467773, "global_step": 337864, "epoch": 4070} {"train_loss": -26.341663360595703, "global_step": 337865, "epoch": 4070} {"train_loss": -26.369592666625977, "global_step": 337866, "epoch": 4070} {"train_loss": -26.33172607421875, "global_step": 337867, "epoch": 4070} {"train_loss": -26.26912498474121, "global_step": 337868, "epoch": 4070} {"train_loss": -25.568490982055664, "global_step": 337869, "epoch": 4070} {"train_loss": -26.212345123291016, "global_step": 337870, "epoch": 4070} {"train_loss": -25.853260040283203, "global_step": 337871, "epoch": 4070} {"train_loss": -25.646991729736328, "global_step": 337872, "epoch": 4070} {"train_loss": -25.718128204345703, "global_step": 337873, "epoch": 4070} {"train_loss": -25.83064079284668, "global_step": 337874, "epoch": 4070} {"train_loss": -25.899633407592773, "global_step": 337875, "epoch": 4070} {"train_loss": -26.23140525817871, "global_step": 337876, "epoch": 4070} {"train_loss": -25.994598388671875, "global_step": 337877, "epoch": 4070} {"train_loss": -26.02860450744629, "global_step": 337878, "epoch": 4070} {"train_loss": -25.997589111328125, "global_step": 337879, "epoch": 4070} {"train_loss": -25.41897964477539, "global_step": 337880, "epoch": 4070} {"train_loss": -25.989416122436523, "global_step": 337881, "epoch": 4070} {"train_loss": -25.906421661376953, "global_step": 337882, "epoch": 4070} {"train_loss": -25.697290420532227, "global_step": 337883, "epoch": 4070} {"train_loss": -25.91798210144043, "global_step": 337884, "epoch": 4070} {"train_loss": -25.84331703186035, "global_step": 337885, "epoch": 4070} {"train_loss": -26.15289306640625, "global_step": 337886, "epoch": 4070} {"train_loss": -25.826190948486328, "global_step": 337887, "epoch": 4070} {"train_loss": -26.2274227142334, "global_step": 337888, "epoch": 4070} {"train_loss": -25.893829345703125, "global_step": 337889, "epoch": 4070} {"train_loss": -25.905210494995117, "global_step": 337890, "epoch": 4070} {"train_loss": -26.035566329956055, "global_step": 337891, "epoch": 4070} {"train_loss": -25.910519289683148, "global_step": 337892, "epoch": 4070, "val_loss": 6781517.0} {"train_loss": -25.526899337768555, "global_step": 337893, "epoch": 4071} {"train_loss": -25.57037925720215, "global_step": 337894, "epoch": 4071} {"train_loss": -25.729551315307617, "global_step": 337895, "epoch": 4071} {"train_loss": -25.938369750976562, "global_step": 337896, "epoch": 4071} {"train_loss": -25.47707176208496, "global_step": 337897, "epoch": 4071} {"train_loss": -25.664642333984375, "global_step": 337898, "epoch": 4071} {"train_loss": -25.49769401550293, "global_step": 337899, "epoch": 4071} {"train_loss": -25.350942611694336, "global_step": 337900, "epoch": 4071} {"train_loss": -25.76047706604004, "global_step": 337901, "epoch": 4071} {"train_loss": -25.7270450592041, "global_step": 337902, "epoch": 4071} {"train_loss": -25.542800903320312, "global_step": 337903, "epoch": 4071} {"train_loss": -25.90217399597168, "global_step": 337904, "epoch": 4071} {"train_loss": -25.94341468811035, "global_step": 337905, "epoch": 4071} {"train_loss": -25.81940269470215, "global_step": 337906, "epoch": 4071} {"train_loss": -25.94902992248535, "global_step": 337907, "epoch": 4071} {"train_loss": -25.7025203704834, "global_step": 337908, "epoch": 4071} {"train_loss": -26.117889404296875, "global_step": 337909, "epoch": 4071} {"train_loss": -26.033842086791992, "global_step": 337910, "epoch": 4071} {"train_loss": -26.007349014282227, "global_step": 337911, "epoch": 4071} {"train_loss": -26.043167114257812, "global_step": 337912, "epoch": 4071} {"train_loss": -25.81058692932129, "global_step": 337913, "epoch": 4071} {"train_loss": -26.23748207092285, "global_step": 337914, "epoch": 4071} {"train_loss": -26.29290199279785, "global_step": 337915, "epoch": 4071} {"train_loss": -26.147907257080078, "global_step": 337916, "epoch": 4071} {"train_loss": -26.169607162475586, "global_step": 337917, "epoch": 4071} {"train_loss": -25.999088287353516, "global_step": 337918, "epoch": 4071} {"train_loss": -26.129928588867188, "global_step": 337919, "epoch": 4071} {"train_loss": -26.269433975219727, "global_step": 337920, "epoch": 4071} {"train_loss": -26.3859806060791, "global_step": 337921, "epoch": 4071} {"train_loss": -25.91301918029785, "global_step": 337922, "epoch": 4071} {"train_loss": -26.220930099487305, "global_step": 337923, "epoch": 4071} {"train_loss": -26.278295516967773, "global_step": 337924, "epoch": 4071} {"train_loss": -25.97096061706543, "global_step": 337925, "epoch": 4071} {"train_loss": -26.245283126831055, "global_step": 337926, "epoch": 4071} {"train_loss": -26.077478408813477, "global_step": 337927, "epoch": 4071} {"train_loss": -25.912221908569336, "global_step": 337928, "epoch": 4071} {"train_loss": -25.93231773376465, "global_step": 337929, "epoch": 4071} {"train_loss": -26.022809982299805, "global_step": 337930, "epoch": 4071} {"train_loss": -26.018964767456055, "global_step": 337931, "epoch": 4071} {"train_loss": -26.4581241607666, "global_step": 337932, "epoch": 4071} {"train_loss": -26.63861656188965, "global_step": 337933, "epoch": 4071} {"train_loss": -26.060754776000977, "global_step": 337934, "epoch": 4071} {"train_loss": -26.307147979736328, "global_step": 337935, "epoch": 4071} {"train_loss": -26.317148208618164, "global_step": 337936, "epoch": 4071} {"train_loss": -26.027124404907227, "global_step": 337937, "epoch": 4071} {"train_loss": -26.100839614868164, "global_step": 337938, "epoch": 4071} {"train_loss": -26.280176162719727, "global_step": 337939, "epoch": 4071} {"train_loss": -26.130813598632812, "global_step": 337940, "epoch": 4071} {"train_loss": -26.01228904724121, "global_step": 337941, "epoch": 4071} {"train_loss": -25.9398250579834, "global_step": 337942, "epoch": 4071} {"train_loss": -25.436508178710938, "global_step": 337943, "epoch": 4071} {"train_loss": -25.7552490234375, "global_step": 337944, "epoch": 4071} {"train_loss": -25.95008659362793, "global_step": 337945, "epoch": 4071} {"train_loss": -26.424346923828125, "global_step": 337946, "epoch": 4071} {"train_loss": -25.984525680541992, "global_step": 337947, "epoch": 4071} {"train_loss": -26.03980827331543, "global_step": 337948, "epoch": 4071} {"train_loss": -26.341047286987305, "global_step": 337949, "epoch": 4071} {"train_loss": -25.805709838867188, "global_step": 337950, "epoch": 4071} {"train_loss": -25.23410987854004, "global_step": 337951, "epoch": 4071} {"train_loss": -25.44069480895996, "global_step": 337952, "epoch": 4071} {"train_loss": -26.047422409057617, "global_step": 337953, "epoch": 4071} {"train_loss": -25.27569007873535, "global_step": 337954, "epoch": 4071} {"train_loss": -25.905710220336914, "global_step": 337955, "epoch": 4071} {"train_loss": -25.488468170166016, "global_step": 337956, "epoch": 4071} {"train_loss": -25.416885375976562, "global_step": 337957, "epoch": 4071} {"train_loss": -25.359373092651367, "global_step": 337958, "epoch": 4071} {"train_loss": -25.52341079711914, "global_step": 337959, "epoch": 4071} {"train_loss": -25.843286514282227, "global_step": 337960, "epoch": 4071} {"train_loss": -25.707971572875977, "global_step": 337961, "epoch": 4071} {"train_loss": -25.577774047851562, "global_step": 337962, "epoch": 4071} {"train_loss": -25.880664825439453, "global_step": 337963, "epoch": 4071} {"train_loss": -25.8632869720459, "global_step": 337964, "epoch": 4071} {"train_loss": -25.748233795166016, "global_step": 337965, "epoch": 4071} {"train_loss": -26.068185806274414, "global_step": 337966, "epoch": 4071} {"train_loss": -25.629470825195312, "global_step": 337967, "epoch": 4071} {"train_loss": -25.7835750579834, "global_step": 337968, "epoch": 4071} {"train_loss": -25.618921279907227, "global_step": 337969, "epoch": 4071} {"train_loss": -25.366296768188477, "global_step": 337970, "epoch": 4071} {"train_loss": -25.402469635009766, "global_step": 337971, "epoch": 4071} {"train_loss": -26.080036163330078, "global_step": 337972, "epoch": 4071} {"train_loss": -25.537796020507812, "global_step": 337973, "epoch": 4071} {"train_loss": -26.133636474609375, "global_step": 337974, "epoch": 4071} {"train_loss": -25.882457779114503, "global_step": 337975, "epoch": 4071, "val_loss": 6768833.0} {"train_loss": -25.050230026245117, "global_step": 337976, "epoch": 4072} {"train_loss": -25.77931022644043, "global_step": 337977, "epoch": 4072} {"train_loss": -25.170072555541992, "global_step": 337978, "epoch": 4072} {"train_loss": -25.322275161743164, "global_step": 337979, "epoch": 4072} {"train_loss": -25.306806564331055, "global_step": 337980, "epoch": 4072} {"train_loss": -25.22003936767578, "global_step": 337981, "epoch": 4072} {"train_loss": -25.288869857788086, "global_step": 337982, "epoch": 4072} {"train_loss": -25.43160057067871, "global_step": 337983, "epoch": 4072} {"train_loss": -25.51966667175293, "global_step": 337984, "epoch": 4072} {"train_loss": -25.53878402709961, "global_step": 337985, "epoch": 4072} {"train_loss": -25.956205368041992, "global_step": 337986, "epoch": 4072} {"train_loss": -25.641345977783203, "global_step": 337987, "epoch": 4072} {"train_loss": -25.487369537353516, "global_step": 337988, "epoch": 4072} {"train_loss": -25.671100616455078, "global_step": 337989, "epoch": 4072} {"train_loss": -25.779096603393555, "global_step": 337990, "epoch": 4072} {"train_loss": -25.783910751342773, "global_step": 337991, "epoch": 4072} {"train_loss": -25.325326919555664, "global_step": 337992, "epoch": 4072} {"train_loss": -25.657194137573242, "global_step": 337993, "epoch": 4072} {"train_loss": -25.803308486938477, "global_step": 337994, "epoch": 4072} {"train_loss": -26.213987350463867, "global_step": 337995, "epoch": 4072} {"train_loss": -25.659406661987305, "global_step": 337996, "epoch": 4072} {"train_loss": -25.96368980407715, "global_step": 337997, "epoch": 4072} {"train_loss": -25.83342933654785, "global_step": 337998, "epoch": 4072} {"train_loss": -26.06650161743164, "global_step": 337999, "epoch": 4072} {"train_loss": -26.153966903686523, "global_step": 338000, "epoch": 4072} {"train_loss": -26.307449340820312, "global_step": 338001, "epoch": 4072} {"train_loss": -25.95572853088379, "global_step": 338002, "epoch": 4072} {"train_loss": -25.852094650268555, "global_step": 338003, "epoch": 4072} {"train_loss": -26.07700538635254, "global_step": 338004, "epoch": 4072} {"train_loss": -26.086261749267578, "global_step": 338005, "epoch": 4072} {"train_loss": -26.12183952331543, "global_step": 338006, "epoch": 4072} {"train_loss": -26.073118209838867, "global_step": 338007, "epoch": 4072} {"train_loss": -25.9134578704834, "global_step": 338008, "epoch": 4072} {"train_loss": -26.03729248046875, "global_step": 338009, "epoch": 4072} {"train_loss": -26.05112075805664, "global_step": 338010, "epoch": 4072} {"train_loss": -26.171308517456055, "global_step": 338011, "epoch": 4072} {"train_loss": -26.438425064086914, "global_step": 338012, "epoch": 4072} {"train_loss": -26.100799560546875, "global_step": 338013, "epoch": 4072} {"train_loss": -25.95505714416504, "global_step": 338014, "epoch": 4072} {"train_loss": -26.10829734802246, "global_step": 338015, "epoch": 4072} {"train_loss": -26.153446197509766, "global_step": 338016, "epoch": 4072} {"train_loss": -25.987567901611328, "global_step": 338017, "epoch": 4072} {"train_loss": -25.960058212280273, "global_step": 338018, "epoch": 4072} {"train_loss": -26.023151397705078, "global_step": 338019, "epoch": 4072} {"train_loss": -26.304712295532227, "global_step": 338020, "epoch": 4072} {"train_loss": -26.313100814819336, "global_step": 338021, "epoch": 4072} {"train_loss": -26.09505271911621, "global_step": 338022, "epoch": 4072} {"train_loss": -25.994159698486328, "global_step": 338023, "epoch": 4072} {"train_loss": -26.17228126525879, "global_step": 338024, "epoch": 4072} {"train_loss": -26.42927360534668, "global_step": 338025, "epoch": 4072} {"train_loss": -25.970691680908203, "global_step": 338026, "epoch": 4072} {"train_loss": -26.23430824279785, "global_step": 338027, "epoch": 4072} {"train_loss": -25.984670639038086, "global_step": 338028, "epoch": 4072} {"train_loss": -26.254175186157227, "global_step": 338029, "epoch": 4072} {"train_loss": -26.309005737304688, "global_step": 338030, "epoch": 4072} {"train_loss": -26.052154541015625, "global_step": 338031, "epoch": 4072} {"train_loss": -26.394489288330078, "global_step": 338032, "epoch": 4072} {"train_loss": -26.32960319519043, "global_step": 338033, "epoch": 4072} {"train_loss": -25.98151969909668, "global_step": 338034, "epoch": 4072} {"train_loss": -25.771167755126953, "global_step": 338035, "epoch": 4072} {"train_loss": -26.241735458374023, "global_step": 338036, "epoch": 4072} {"train_loss": -25.80133056640625, "global_step": 338037, "epoch": 4072} {"train_loss": -25.82061767578125, "global_step": 338038, "epoch": 4072} {"train_loss": -26.183246612548828, "global_step": 338039, "epoch": 4072} {"train_loss": -25.973743438720703, "global_step": 338040, "epoch": 4072} {"train_loss": -25.622724533081055, "global_step": 338041, "epoch": 4072} {"train_loss": -25.8306827545166, "global_step": 338042, "epoch": 4072} {"train_loss": -26.39725112915039, "global_step": 338043, "epoch": 4072} {"train_loss": -25.871097564697266, "global_step": 338044, "epoch": 4072} {"train_loss": -25.882593154907227, "global_step": 338045, "epoch": 4072} {"train_loss": -26.08961296081543, "global_step": 338046, "epoch": 4072} {"train_loss": -25.919818878173828, "global_step": 338047, "epoch": 4072} {"train_loss": -26.037336349487305, "global_step": 338048, "epoch": 4072} {"train_loss": -26.039813995361328, "global_step": 338049, "epoch": 4072} {"train_loss": -26.483549118041992, "global_step": 338050, "epoch": 4072} {"train_loss": -26.239215850830078, "global_step": 338051, "epoch": 4072} {"train_loss": -26.488189697265625, "global_step": 338052, "epoch": 4072} {"train_loss": -26.127546310424805, "global_step": 338053, "epoch": 4072} {"train_loss": -25.996850967407227, "global_step": 338054, "epoch": 4072} {"train_loss": -26.080530166625977, "global_step": 338055, "epoch": 4072} {"train_loss": -26.19698143005371, "global_step": 338056, "epoch": 4072} {"train_loss": -26.263580322265625, "global_step": 338057, "epoch": 4072} {"train_loss": -25.955552227525825, "global_step": 338058, "epoch": 4072, "val_loss": 6850060.0} {"train_loss": -25.961761474609375, "global_step": 338059, "epoch": 4073} {"train_loss": -25.787694931030273, "global_step": 338060, "epoch": 4073} {"train_loss": -25.448415756225586, "global_step": 338061, "epoch": 4073} {"train_loss": -26.0721492767334, "global_step": 338062, "epoch": 4073} {"train_loss": -25.729827880859375, "global_step": 338063, "epoch": 4073} {"train_loss": -25.599746704101562, "global_step": 338064, "epoch": 4073} {"train_loss": -25.913623809814453, "global_step": 338065, "epoch": 4073} {"train_loss": -25.662353515625, "global_step": 338066, "epoch": 4073} {"train_loss": -25.961475372314453, "global_step": 338067, "epoch": 4073} {"train_loss": -25.9818058013916, "global_step": 338068, "epoch": 4073} {"train_loss": -25.79542350769043, "global_step": 338069, "epoch": 4073} {"train_loss": -26.038808822631836, "global_step": 338070, "epoch": 4073} {"train_loss": -26.03952407836914, "global_step": 338071, "epoch": 4073} {"train_loss": -26.070728302001953, "global_step": 338072, "epoch": 4073} {"train_loss": -25.803974151611328, "global_step": 338073, "epoch": 4073} {"train_loss": -26.17087745666504, "global_step": 338074, "epoch": 4073} {"train_loss": -25.896259307861328, "global_step": 338075, "epoch": 4073} {"train_loss": -26.274169921875, "global_step": 338076, "epoch": 4073} {"train_loss": -26.10763931274414, "global_step": 338077, "epoch": 4073} {"train_loss": -26.103002548217773, "global_step": 338078, "epoch": 4073} {"train_loss": -26.265674591064453, "global_step": 338079, "epoch": 4073} {"train_loss": -25.921859741210938, "global_step": 338080, "epoch": 4073} {"train_loss": -25.8085994720459, "global_step": 338081, "epoch": 4073} {"train_loss": -26.372838973999023, "global_step": 338082, "epoch": 4073} {"train_loss": -26.31194496154785, "global_step": 338083, "epoch": 4073} {"train_loss": -25.883045196533203, "global_step": 338084, "epoch": 4073} {"train_loss": -26.656965255737305, "global_step": 338085, "epoch": 4073} {"train_loss": -25.912954330444336, "global_step": 338086, "epoch": 4073} {"train_loss": -26.077533721923828, "global_step": 338087, "epoch": 4073} {"train_loss": -26.250885009765625, "global_step": 338088, "epoch": 4073} {"train_loss": -26.155317306518555, "global_step": 338089, "epoch": 4073} {"train_loss": -26.072357177734375, "global_step": 338090, "epoch": 4073} {"train_loss": -25.952138900756836, "global_step": 338091, "epoch": 4073} {"train_loss": -26.287139892578125, "global_step": 338092, "epoch": 4073} {"train_loss": -26.18465232849121, "global_step": 338093, "epoch": 4073} {"train_loss": -26.285009384155273, "global_step": 338094, "epoch": 4073} {"train_loss": -26.137720108032227, "global_step": 338095, "epoch": 4073} {"train_loss": -25.83509635925293, "global_step": 338096, "epoch": 4073} {"train_loss": -25.72321891784668, "global_step": 338097, "epoch": 4073} {"train_loss": -25.86590003967285, "global_step": 338098, "epoch": 4073} {"train_loss": -26.04364013671875, "global_step": 338099, "epoch": 4073} {"train_loss": -26.040494918823242, "global_step": 338100, "epoch": 4073} {"train_loss": -26.161640167236328, "global_step": 338101, "epoch": 4073} {"train_loss": -26.017011642456055, "global_step": 338102, "epoch": 4073} {"train_loss": -25.641828536987305, "global_step": 338103, "epoch": 4073} {"train_loss": -25.940628051757812, "global_step": 338104, "epoch": 4073} {"train_loss": -25.828327178955078, "global_step": 338105, "epoch": 4073} {"train_loss": -26.208576202392578, "global_step": 338106, "epoch": 4073} {"train_loss": -25.815465927124023, "global_step": 338107, "epoch": 4073} {"train_loss": -26.179733276367188, "global_step": 338108, "epoch": 4073} {"train_loss": -26.246097564697266, "global_step": 338109, "epoch": 4073} {"train_loss": -25.679468154907227, "global_step": 338110, "epoch": 4073} {"train_loss": -26.175886154174805, "global_step": 338111, "epoch": 4073} {"train_loss": -25.961933135986328, "global_step": 338112, "epoch": 4073} {"train_loss": -26.251794815063477, "global_step": 338113, "epoch": 4073} {"train_loss": -26.097278594970703, "global_step": 338114, "epoch": 4073} {"train_loss": -26.2756290435791, "global_step": 338115, "epoch": 4073} {"train_loss": -25.985815048217773, "global_step": 338116, "epoch": 4073} {"train_loss": -26.042236328125, "global_step": 338117, "epoch": 4073} {"train_loss": -26.210372924804688, "global_step": 338118, "epoch": 4073} {"train_loss": -25.701086044311523, "global_step": 338119, "epoch": 4073} {"train_loss": -26.043256759643555, "global_step": 338120, "epoch": 4073} {"train_loss": -25.82958984375, "global_step": 338121, "epoch": 4073} {"train_loss": -25.64141273498535, "global_step": 338122, "epoch": 4073} {"train_loss": -26.1407470703125, "global_step": 338123, "epoch": 4073} {"train_loss": -25.756860733032227, "global_step": 338124, "epoch": 4073} {"train_loss": -25.59149742126465, "global_step": 338125, "epoch": 4073} {"train_loss": -25.868619918823242, "global_step": 338126, "epoch": 4073} {"train_loss": -25.7418155670166, "global_step": 338127, "epoch": 4073} {"train_loss": -25.9752254486084, "global_step": 338128, "epoch": 4073} {"train_loss": -25.96675682067871, "global_step": 338129, "epoch": 4073} {"train_loss": -25.920291900634766, "global_step": 338130, "epoch": 4073} {"train_loss": -26.100095748901367, "global_step": 338131, "epoch": 4073} {"train_loss": -26.232656478881836, "global_step": 338132, "epoch": 4073} {"train_loss": -26.11665916442871, "global_step": 338133, "epoch": 4073} {"train_loss": -25.862146377563477, "global_step": 338134, "epoch": 4073} {"train_loss": -26.006017684936523, "global_step": 338135, "epoch": 4073} {"train_loss": -25.982105255126953, "global_step": 338136, "epoch": 4073} {"train_loss": -25.869384765625, "global_step": 338137, "epoch": 4073} {"train_loss": -26.049535751342773, "global_step": 338138, "epoch": 4073} {"train_loss": -25.993444442749023, "global_step": 338139, "epoch": 4073} {"train_loss": -25.91485595703125, "global_step": 338140, "epoch": 4073} {"train_loss": -26.01150710324207, "global_step": 338141, "epoch": 4073, "val_loss": 6826328.0} {"train_loss": -24.80945587158203, "global_step": 338142, "epoch": 4074} {"train_loss": -25.265594482421875, "global_step": 338143, "epoch": 4074} {"train_loss": -24.81201171875, "global_step": 338144, "epoch": 4074} {"train_loss": -25.591691970825195, "global_step": 338145, "epoch": 4074} {"train_loss": -25.761310577392578, "global_step": 338146, "epoch": 4074} {"train_loss": -25.26822280883789, "global_step": 338147, "epoch": 4074} {"train_loss": -25.736352920532227, "global_step": 338148, "epoch": 4074} {"train_loss": -25.965539932250977, "global_step": 338149, "epoch": 4074} {"train_loss": -25.505672454833984, "global_step": 338150, "epoch": 4074} {"train_loss": -25.74087905883789, "global_step": 338151, "epoch": 4074} {"train_loss": -25.979175567626953, "global_step": 338152, "epoch": 4074} {"train_loss": -25.596477508544922, "global_step": 338153, "epoch": 4074} {"train_loss": -25.6334228515625, "global_step": 338154, "epoch": 4074} {"train_loss": -25.8541316986084, "global_step": 338155, "epoch": 4074} {"train_loss": -25.736753463745117, "global_step": 338156, "epoch": 4074} {"train_loss": -25.929676055908203, "global_step": 338157, "epoch": 4074} {"train_loss": -26.135175704956055, "global_step": 338158, "epoch": 4074} {"train_loss": -25.905832290649414, "global_step": 338159, "epoch": 4074} {"train_loss": -25.914142608642578, "global_step": 338160, "epoch": 4074} {"train_loss": -25.97190284729004, "global_step": 338161, "epoch": 4074} {"train_loss": -25.939014434814453, "global_step": 338162, "epoch": 4074} {"train_loss": -26.222070693969727, "global_step": 338163, "epoch": 4074} {"train_loss": -25.46958351135254, "global_step": 338164, "epoch": 4074} {"train_loss": -25.727399826049805, "global_step": 338165, "epoch": 4074} {"train_loss": -25.96512794494629, "global_step": 338166, "epoch": 4074} {"train_loss": -26.185577392578125, "global_step": 338167, "epoch": 4074} {"train_loss": -26.243515014648438, "global_step": 338168, "epoch": 4074} {"train_loss": -25.880462646484375, "global_step": 338169, "epoch": 4074} {"train_loss": -26.301504135131836, "global_step": 338170, "epoch": 4074} {"train_loss": -25.880544662475586, "global_step": 338171, "epoch": 4074} {"train_loss": -26.224655151367188, "global_step": 338172, "epoch": 4074} {"train_loss": -25.533092498779297, "global_step": 338173, "epoch": 4074} {"train_loss": -26.046850204467773, "global_step": 338174, "epoch": 4074} {"train_loss": -26.24921989440918, "global_step": 338175, "epoch": 4074} {"train_loss": -26.0960693359375, "global_step": 338176, "epoch": 4074} {"train_loss": -26.54593276977539, "global_step": 338177, "epoch": 4074} {"train_loss": -26.388050079345703, "global_step": 338178, "epoch": 4074} {"train_loss": -26.0399227142334, "global_step": 338179, "epoch": 4074} {"train_loss": -25.75676918029785, "global_step": 338180, "epoch": 4074} {"train_loss": -25.769128799438477, "global_step": 338181, "epoch": 4074} {"train_loss": -26.000518798828125, "global_step": 338182, "epoch": 4074} {"train_loss": -26.050745010375977, "global_step": 338183, "epoch": 4074} {"train_loss": -26.126073837280273, "global_step": 338184, "epoch": 4074} {"train_loss": -26.233612060546875, "global_step": 338185, "epoch": 4074} {"train_loss": -26.050460815429688, "global_step": 338186, "epoch": 4074} {"train_loss": -26.024066925048828, "global_step": 338187, "epoch": 4074} {"train_loss": -26.32916259765625, "global_step": 338188, "epoch": 4074} {"train_loss": -26.071741104125977, "global_step": 338189, "epoch": 4074} {"train_loss": -26.051176071166992, "global_step": 338190, "epoch": 4074} {"train_loss": -26.236225128173828, "global_step": 338191, "epoch": 4074} {"train_loss": -25.982534408569336, "global_step": 338192, "epoch": 4074} {"train_loss": -26.612548828125, "global_step": 338193, "epoch": 4074} {"train_loss": -26.094465255737305, "global_step": 338194, "epoch": 4074} {"train_loss": -26.07110023498535, "global_step": 338195, "epoch": 4074} {"train_loss": -26.447961807250977, "global_step": 338196, "epoch": 4074} {"train_loss": -26.3989200592041, "global_step": 338197, "epoch": 4074} {"train_loss": -26.011762619018555, "global_step": 338198, "epoch": 4074} {"train_loss": -25.942047119140625, "global_step": 338199, "epoch": 4074} {"train_loss": -26.1519775390625, "global_step": 338200, "epoch": 4074} {"train_loss": -26.379735946655273, "global_step": 338201, "epoch": 4074} {"train_loss": -26.173059463500977, "global_step": 338202, "epoch": 4074} {"train_loss": -25.991825103759766, "global_step": 338203, "epoch": 4074} {"train_loss": -26.31025505065918, "global_step": 338204, "epoch": 4074} {"train_loss": -26.368444442749023, "global_step": 338205, "epoch": 4074} {"train_loss": -25.613861083984375, "global_step": 338206, "epoch": 4074} {"train_loss": -25.914758682250977, "global_step": 338207, "epoch": 4074} {"train_loss": -26.482242584228516, "global_step": 338208, "epoch": 4074} {"train_loss": -25.916105270385742, "global_step": 338209, "epoch": 4074} {"train_loss": -25.957441329956055, "global_step": 338210, "epoch": 4074} {"train_loss": -25.974618911743164, "global_step": 338211, "epoch": 4074} {"train_loss": -26.226713180541992, "global_step": 338212, "epoch": 4074} {"train_loss": -26.397974014282227, "global_step": 338213, "epoch": 4074} {"train_loss": -25.913206100463867, "global_step": 338214, "epoch": 4074} {"train_loss": -25.92594337463379, "global_step": 338215, "epoch": 4074} {"train_loss": -26.233535766601562, "global_step": 338216, "epoch": 4074} {"train_loss": -26.266645431518555, "global_step": 338217, "epoch": 4074} {"train_loss": -25.981571197509766, "global_step": 338218, "epoch": 4074} {"train_loss": -26.20302391052246, "global_step": 338219, "epoch": 4074} {"train_loss": -26.006793975830078, "global_step": 338220, "epoch": 4074} {"train_loss": -25.78265380859375, "global_step": 338221, "epoch": 4074} {"train_loss": -25.674118041992188, "global_step": 338222, "epoch": 4074} {"train_loss": -25.998355865478516, "global_step": 338223, "epoch": 4074} {"train_loss": -25.9757114548281, "global_step": 338224, "epoch": 4074, "val_loss": 6731377.0} {"train_loss": -25.458471298217773, "global_step": 338225, "epoch": 4075} {"train_loss": -25.59224510192871, "global_step": 338226, "epoch": 4075} {"train_loss": -25.952381134033203, "global_step": 338227, "epoch": 4075} {"train_loss": -25.515079498291016, "global_step": 338228, "epoch": 4075} {"train_loss": -25.589696884155273, "global_step": 338229, "epoch": 4075} {"train_loss": -25.479568481445312, "global_step": 338230, "epoch": 4075} {"train_loss": -25.782794952392578, "global_step": 338231, "epoch": 4075} {"train_loss": -25.846105575561523, "global_step": 338232, "epoch": 4075} {"train_loss": -25.649450302124023, "global_step": 338233, "epoch": 4075} {"train_loss": -25.481752395629883, "global_step": 338234, "epoch": 4075} {"train_loss": -25.655780792236328, "global_step": 338235, "epoch": 4075} {"train_loss": -25.531021118164062, "global_step": 338236, "epoch": 4075} {"train_loss": -25.57288932800293, "global_step": 338237, "epoch": 4075} {"train_loss": -25.711688995361328, "global_step": 338238, "epoch": 4075} {"train_loss": -25.856159210205078, "global_step": 338239, "epoch": 4075} {"train_loss": -26.034564971923828, "global_step": 338240, "epoch": 4075} {"train_loss": -25.80010986328125, "global_step": 338241, "epoch": 4075} {"train_loss": -26.284305572509766, "global_step": 338242, "epoch": 4075} {"train_loss": -25.58109474182129, "global_step": 338243, "epoch": 4075} {"train_loss": -26.156747817993164, "global_step": 338244, "epoch": 4075} {"train_loss": -25.802947998046875, "global_step": 338245, "epoch": 4075} {"train_loss": -25.94675636291504, "global_step": 338246, "epoch": 4075} {"train_loss": -26.067434310913086, "global_step": 338247, "epoch": 4075} {"train_loss": -26.0638370513916, "global_step": 338248, "epoch": 4075} {"train_loss": -25.84248161315918, "global_step": 338249, "epoch": 4075} {"train_loss": -25.931903839111328, "global_step": 338250, "epoch": 4075} {"train_loss": -25.93190574645996, "global_step": 338251, "epoch": 4075} {"train_loss": -26.38909912109375, "global_step": 338252, "epoch": 4075} {"train_loss": -26.0079288482666, "global_step": 338253, "epoch": 4075} {"train_loss": -26.13290786743164, "global_step": 338254, "epoch": 4075} {"train_loss": -26.157428741455078, "global_step": 338255, "epoch": 4075} {"train_loss": -26.51089859008789, "global_step": 338256, "epoch": 4075} {"train_loss": -26.301345825195312, "global_step": 338257, "epoch": 4075} {"train_loss": -25.989276885986328, "global_step": 338258, "epoch": 4075} {"train_loss": -26.30616569519043, "global_step": 338259, "epoch": 4075} {"train_loss": -26.2803897857666, "global_step": 338260, "epoch": 4075} {"train_loss": -26.3394775390625, "global_step": 338261, "epoch": 4075} {"train_loss": -26.716278076171875, "global_step": 338262, "epoch": 4075} {"train_loss": -26.204883575439453, "global_step": 338263, "epoch": 4075} {"train_loss": -26.35392189025879, "global_step": 338264, "epoch": 4075} {"train_loss": -25.936079025268555, "global_step": 338265, "epoch": 4075} {"train_loss": -26.053272247314453, "global_step": 338266, "epoch": 4075} {"train_loss": -26.42225456237793, "global_step": 338267, "epoch": 4075} {"train_loss": -26.301000595092773, "global_step": 338268, "epoch": 4075} {"train_loss": -25.923730850219727, "global_step": 338269, "epoch": 4075} {"train_loss": -26.19032096862793, "global_step": 338270, "epoch": 4075} {"train_loss": -26.296823501586914, "global_step": 338271, "epoch": 4075} {"train_loss": -26.39277458190918, "global_step": 338272, "epoch": 4075} {"train_loss": -26.455265045166016, "global_step": 338273, "epoch": 4075} {"train_loss": -26.398681640625, "global_step": 338274, "epoch": 4075} {"train_loss": -26.28838539123535, "global_step": 338275, "epoch": 4075} {"train_loss": -26.090579986572266, "global_step": 338276, "epoch": 4075} {"train_loss": -25.722509384155273, "global_step": 338277, "epoch": 4075} {"train_loss": -24.430971145629883, "global_step": 338278, "epoch": 4075} {"train_loss": -24.052051544189453, "global_step": 338279, "epoch": 4075} {"train_loss": -25.00274085998535, "global_step": 338280, "epoch": 4075} {"train_loss": -24.384998321533203, "global_step": 338281, "epoch": 4075} {"train_loss": -25.7604923248291, "global_step": 338282, "epoch": 4075} {"train_loss": -25.70125389099121, "global_step": 338283, "epoch": 4075} {"train_loss": -25.104602813720703, "global_step": 338284, "epoch": 4075} {"train_loss": -25.127721786499023, "global_step": 338285, "epoch": 4075} {"train_loss": -25.70562171936035, "global_step": 338286, "epoch": 4075} {"train_loss": -25.326770782470703, "global_step": 338287, "epoch": 4075} {"train_loss": -25.49704360961914, "global_step": 338288, "epoch": 4075} {"train_loss": -25.860807418823242, "global_step": 338289, "epoch": 4075} {"train_loss": -25.927692413330078, "global_step": 338290, "epoch": 4075} {"train_loss": -25.55109977722168, "global_step": 338291, "epoch": 4075} {"train_loss": -26.133081436157227, "global_step": 338292, "epoch": 4075} {"train_loss": -25.14568519592285, "global_step": 338293, "epoch": 4075} {"train_loss": -25.919492721557617, "global_step": 338294, "epoch": 4075} {"train_loss": -25.623945236206055, "global_step": 338295, "epoch": 4075} {"train_loss": -25.304386138916016, "global_step": 338296, "epoch": 4075} {"train_loss": -25.36166763305664, "global_step": 338297, "epoch": 4075} {"train_loss": -26.06830406188965, "global_step": 338298, "epoch": 4075} {"train_loss": -25.57697105407715, "global_step": 338299, "epoch": 4075} {"train_loss": -25.49268341064453, "global_step": 338300, "epoch": 4075} {"train_loss": -26.07501792907715, "global_step": 338301, "epoch": 4075} {"train_loss": -25.943069458007812, "global_step": 338302, "epoch": 4075} {"train_loss": -26.1830997467041, "global_step": 338303, "epoch": 4075} {"train_loss": -25.95502281188965, "global_step": 338304, "epoch": 4075} {"train_loss": -26.013879776000977, "global_step": 338305, "epoch": 4075} {"train_loss": -25.91878318786621, "global_step": 338306, "epoch": 4075} {"train_loss": -25.839715130357856, "global_step": 338307, "epoch": 4075, "val_loss": 6750607.0} {"train_loss": -25.78870964050293, "global_step": 338308, "epoch": 4076} {"train_loss": -25.643850326538086, "global_step": 338309, "epoch": 4076} {"train_loss": -26.205596923828125, "global_step": 338310, "epoch": 4076} {"train_loss": -25.762720108032227, "global_step": 338311, "epoch": 4076} {"train_loss": -25.488645553588867, "global_step": 338312, "epoch": 4076} {"train_loss": -25.551694869995117, "global_step": 338313, "epoch": 4076} {"train_loss": -25.543821334838867, "global_step": 338314, "epoch": 4076} {"train_loss": -25.518247604370117, "global_step": 338315, "epoch": 4076} {"train_loss": -26.034460067749023, "global_step": 338316, "epoch": 4076} {"train_loss": -25.74871253967285, "global_step": 338317, "epoch": 4076} {"train_loss": -25.987350463867188, "global_step": 338318, "epoch": 4076} {"train_loss": -25.922998428344727, "global_step": 338319, "epoch": 4076} {"train_loss": -25.62116813659668, "global_step": 338320, "epoch": 4076} {"train_loss": -25.905929565429688, "global_step": 338321, "epoch": 4076} {"train_loss": -25.70556640625, "global_step": 338322, "epoch": 4076} {"train_loss": -25.90363121032715, "global_step": 338323, "epoch": 4076} {"train_loss": -25.982030868530273, "global_step": 338324, "epoch": 4076} {"train_loss": -25.755050659179688, "global_step": 338325, "epoch": 4076} {"train_loss": -26.39238929748535, "global_step": 338326, "epoch": 4076} {"train_loss": -25.96137046813965, "global_step": 338327, "epoch": 4076} {"train_loss": -25.810317993164062, "global_step": 338328, "epoch": 4076} {"train_loss": -26.150348663330078, "global_step": 338329, "epoch": 4076} {"train_loss": -26.120466232299805, "global_step": 338330, "epoch": 4076} {"train_loss": -26.126455307006836, "global_step": 338331, "epoch": 4076} {"train_loss": -26.056310653686523, "global_step": 338332, "epoch": 4076} {"train_loss": -26.145889282226562, "global_step": 338333, "epoch": 4076} {"train_loss": -26.306909561157227, "global_step": 338334, "epoch": 4076} {"train_loss": -26.44278335571289, "global_step": 338335, "epoch": 4076} {"train_loss": -26.344324111938477, "global_step": 338336, "epoch": 4076} {"train_loss": -25.845874786376953, "global_step": 338337, "epoch": 4076} {"train_loss": -26.17469596862793, "global_step": 338338, "epoch": 4076} {"train_loss": -26.37384605407715, "global_step": 338339, "epoch": 4076} {"train_loss": -26.172895431518555, "global_step": 338340, "epoch": 4076} {"train_loss": -26.015380859375, "global_step": 338341, "epoch": 4076} {"train_loss": -25.921558380126953, "global_step": 338342, "epoch": 4076} {"train_loss": -26.300771713256836, "global_step": 338343, "epoch": 4076} {"train_loss": -26.313764572143555, "global_step": 338344, "epoch": 4076} {"train_loss": -25.545412063598633, "global_step": 338345, "epoch": 4076} {"train_loss": -26.03875732421875, "global_step": 338346, "epoch": 4076} {"train_loss": -26.2312068939209, "global_step": 338347, "epoch": 4076} {"train_loss": -26.08858299255371, "global_step": 338348, "epoch": 4076} {"train_loss": -26.181798934936523, "global_step": 338349, "epoch": 4076} {"train_loss": -26.383039474487305, "global_step": 338350, "epoch": 4076} {"train_loss": -26.347553253173828, "global_step": 338351, "epoch": 4076} {"train_loss": -26.137479782104492, "global_step": 338352, "epoch": 4076} {"train_loss": -26.155536651611328, "global_step": 338353, "epoch": 4076} {"train_loss": -25.952743530273438, "global_step": 338354, "epoch": 4076} {"train_loss": -25.796340942382812, "global_step": 338355, "epoch": 4076} {"train_loss": -26.569473266601562, "global_step": 338356, "epoch": 4076} {"train_loss": -25.900409698486328, "global_step": 338357, "epoch": 4076} {"train_loss": -25.785871505737305, "global_step": 338358, "epoch": 4076} {"train_loss": -25.833036422729492, "global_step": 338359, "epoch": 4076} {"train_loss": -26.02207374572754, "global_step": 338360, "epoch": 4076} {"train_loss": -26.149078369140625, "global_step": 338361, "epoch": 4076} {"train_loss": -26.025436401367188, "global_step": 338362, "epoch": 4076} {"train_loss": -26.47538185119629, "global_step": 338363, "epoch": 4076} {"train_loss": -26.212305068969727, "global_step": 338364, "epoch": 4076} {"train_loss": -25.999616622924805, "global_step": 338365, "epoch": 4076} {"train_loss": -25.903478622436523, "global_step": 338366, "epoch": 4076} {"train_loss": -26.162399291992188, "global_step": 338367, "epoch": 4076} {"train_loss": -25.904571533203125, "global_step": 338368, "epoch": 4076} {"train_loss": -26.32962417602539, "global_step": 338369, "epoch": 4076} {"train_loss": -25.955291748046875, "global_step": 338370, "epoch": 4076} {"train_loss": -26.1231689453125, "global_step": 338371, "epoch": 4076} {"train_loss": -26.0122127532959, "global_step": 338372, "epoch": 4076} {"train_loss": -26.028827667236328, "global_step": 338373, "epoch": 4076} {"train_loss": -26.276662826538086, "global_step": 338374, "epoch": 4076} {"train_loss": -26.21075439453125, "global_step": 338375, "epoch": 4076} {"train_loss": -26.451068878173828, "global_step": 338376, "epoch": 4076} {"train_loss": -26.353378295898438, "global_step": 338377, "epoch": 4076} {"train_loss": -26.089807510375977, "global_step": 338378, "epoch": 4076} {"train_loss": -26.306385040283203, "global_step": 338379, "epoch": 4076} {"train_loss": -26.109350204467773, "global_step": 338380, "epoch": 4076} {"train_loss": -26.03741455078125, "global_step": 338381, "epoch": 4076} {"train_loss": -26.04509925842285, "global_step": 338382, "epoch": 4076} {"train_loss": -26.218183517456055, "global_step": 338383, "epoch": 4076} {"train_loss": -26.24466323852539, "global_step": 338384, "epoch": 4076} {"train_loss": -26.303552627563477, "global_step": 338385, "epoch": 4076} {"train_loss": -26.147647857666016, "global_step": 338386, "epoch": 4076} {"train_loss": -26.037189483642578, "global_step": 338387, "epoch": 4076} {"train_loss": -26.148895263671875, "global_step": 338388, "epoch": 4076} {"train_loss": -25.990192413330078, "global_step": 338389, "epoch": 4076} {"train_loss": -26.038951414177216, "global_step": 338390, "epoch": 4076, "val_loss": 6843691.0} {"train_loss": -23.6112117767334, "global_step": 338391, "epoch": 4077} {"train_loss": -21.082304000854492, "global_step": 338392, "epoch": 4077} {"train_loss": -25.371891021728516, "global_step": 338393, "epoch": 4077} {"train_loss": -22.723918914794922, "global_step": 338394, "epoch": 4077} {"train_loss": -24.44657325744629, "global_step": 338395, "epoch": 4077} {"train_loss": -24.32197380065918, "global_step": 338396, "epoch": 4077} {"train_loss": -24.378211975097656, "global_step": 338397, "epoch": 4077} {"train_loss": -25.244037628173828, "global_step": 338398, "epoch": 4077} {"train_loss": -24.441755294799805, "global_step": 338399, "epoch": 4077} {"train_loss": -24.811498641967773, "global_step": 338400, "epoch": 4077} {"train_loss": -25.442975997924805, "global_step": 338401, "epoch": 4077} {"train_loss": -25.189085006713867, "global_step": 338402, "epoch": 4077} {"train_loss": -25.358579635620117, "global_step": 338403, "epoch": 4077} {"train_loss": -25.011381149291992, "global_step": 338404, "epoch": 4077} {"train_loss": -25.50161361694336, "global_step": 338405, "epoch": 4077} {"train_loss": -25.049901962280273, "global_step": 338406, "epoch": 4077} {"train_loss": -25.652170181274414, "global_step": 338407, "epoch": 4077} {"train_loss": -24.808330535888672, "global_step": 338408, "epoch": 4077} {"train_loss": -25.300777435302734, "global_step": 338409, "epoch": 4077} {"train_loss": -25.154254913330078, "global_step": 338410, "epoch": 4077} {"train_loss": -25.20792007446289, "global_step": 338411, "epoch": 4077} {"train_loss": -25.420413970947266, "global_step": 338412, "epoch": 4077} {"train_loss": -25.661237716674805, "global_step": 338413, "epoch": 4077} {"train_loss": -25.001598358154297, "global_step": 338414, "epoch": 4077} {"train_loss": -25.777807235717773, "global_step": 338415, "epoch": 4077} {"train_loss": -25.142990112304688, "global_step": 338416, "epoch": 4077} {"train_loss": -25.287343978881836, "global_step": 338417, "epoch": 4077} {"train_loss": -25.681631088256836, "global_step": 338418, "epoch": 4077} {"train_loss": -25.510025024414062, "global_step": 338419, "epoch": 4077} {"train_loss": -25.21491050720215, "global_step": 338420, "epoch": 4077} {"train_loss": -25.449844360351562, "global_step": 338421, "epoch": 4077} {"train_loss": -25.583093643188477, "global_step": 338422, "epoch": 4077} {"train_loss": -25.810598373413086, "global_step": 338423, "epoch": 4077} {"train_loss": -25.586097717285156, "global_step": 338424, "epoch": 4077} {"train_loss": -25.6784610748291, "global_step": 338425, "epoch": 4077} {"train_loss": -25.865827560424805, "global_step": 338426, "epoch": 4077} {"train_loss": -25.733869552612305, "global_step": 338427, "epoch": 4077} {"train_loss": -25.908771514892578, "global_step": 338428, "epoch": 4077} {"train_loss": -25.843341827392578, "global_step": 338429, "epoch": 4077} {"train_loss": -26.011123657226562, "global_step": 338430, "epoch": 4077} {"train_loss": -25.719879150390625, "global_step": 338431, "epoch": 4077} {"train_loss": -25.65876579284668, "global_step": 338432, "epoch": 4077} {"train_loss": -25.598039627075195, "global_step": 338433, "epoch": 4077} {"train_loss": -25.638458251953125, "global_step": 338434, "epoch": 4077} {"train_loss": -25.50398063659668, "global_step": 338435, "epoch": 4077} {"train_loss": -25.89383888244629, "global_step": 338436, "epoch": 4077} {"train_loss": -25.867084503173828, "global_step": 338437, "epoch": 4077} {"train_loss": -26.07185173034668, "global_step": 338438, "epoch": 4077} {"train_loss": -26.059040069580078, "global_step": 338439, "epoch": 4077} {"train_loss": -25.72938346862793, "global_step": 338440, "epoch": 4077} {"train_loss": -25.9780330657959, "global_step": 338441, "epoch": 4077} {"train_loss": -26.204833984375, "global_step": 338442, "epoch": 4077} {"train_loss": -26.02054786682129, "global_step": 338443, "epoch": 4077} {"train_loss": -25.863798141479492, "global_step": 338444, "epoch": 4077} {"train_loss": -26.165685653686523, "global_step": 338445, "epoch": 4077} {"train_loss": -26.244962692260742, "global_step": 338446, "epoch": 4077} {"train_loss": -26.0540828704834, "global_step": 338447, "epoch": 4077} {"train_loss": -26.02431297302246, "global_step": 338448, "epoch": 4077} {"train_loss": -26.212629318237305, "global_step": 338449, "epoch": 4077} {"train_loss": -26.134647369384766, "global_step": 338450, "epoch": 4077} {"train_loss": -26.083982467651367, "global_step": 338451, "epoch": 4077} {"train_loss": -26.447052001953125, "global_step": 338452, "epoch": 4077} {"train_loss": -25.90726661682129, "global_step": 338453, "epoch": 4077} {"train_loss": -26.404809951782227, "global_step": 338454, "epoch": 4077} {"train_loss": -26.229461669921875, "global_step": 338455, "epoch": 4077} {"train_loss": -26.122028350830078, "global_step": 338456, "epoch": 4077} {"train_loss": -26.292688369750977, "global_step": 338457, "epoch": 4077} {"train_loss": -26.1221866607666, "global_step": 338458, "epoch": 4077} {"train_loss": -26.34547233581543, "global_step": 338459, "epoch": 4077} {"train_loss": -26.288639068603516, "global_step": 338460, "epoch": 4077} {"train_loss": -25.926380157470703, "global_step": 338461, "epoch": 4077} {"train_loss": -25.7936954498291, "global_step": 338462, "epoch": 4077} {"train_loss": -25.58424186706543, "global_step": 338463, "epoch": 4077} {"train_loss": -25.393552780151367, "global_step": 338464, "epoch": 4077} {"train_loss": -26.142187118530273, "global_step": 338465, "epoch": 4077} {"train_loss": -25.950519561767578, "global_step": 338466, "epoch": 4077} {"train_loss": -26.160425186157227, "global_step": 338467, "epoch": 4077} {"train_loss": -26.10479736328125, "global_step": 338468, "epoch": 4077} {"train_loss": -26.210102081298828, "global_step": 338469, "epoch": 4077} {"train_loss": -25.7971248626709, "global_step": 338470, "epoch": 4077} {"train_loss": -25.78248405456543, "global_step": 338471, "epoch": 4077} {"train_loss": -25.830835342407227, "global_step": 338472, "epoch": 4077} {"train_loss": -25.554807548063348, "global_step": 338473, "epoch": 4077, "val_loss": 6846103.5} {"train_loss": -23.572261810302734, "global_step": 338474, "epoch": 4078} {"train_loss": -25.046363830566406, "global_step": 338475, "epoch": 4078} {"train_loss": -25.441709518432617, "global_step": 338476, "epoch": 4078} {"train_loss": -25.092239379882812, "global_step": 338477, "epoch": 4078} {"train_loss": -24.963117599487305, "global_step": 338478, "epoch": 4078} {"train_loss": -25.16933250427246, "global_step": 338479, "epoch": 4078} {"train_loss": -24.692304611206055, "global_step": 338480, "epoch": 4078} {"train_loss": -25.574100494384766, "global_step": 338481, "epoch": 4078} {"train_loss": -25.094823837280273, "global_step": 338482, "epoch": 4078} {"train_loss": -25.317405700683594, "global_step": 338483, "epoch": 4078} {"train_loss": -25.299108505249023, "global_step": 338484, "epoch": 4078} {"train_loss": -25.85987663269043, "global_step": 338485, "epoch": 4078} {"train_loss": -25.16242218017578, "global_step": 338486, "epoch": 4078} {"train_loss": -25.865793228149414, "global_step": 338487, "epoch": 4078} {"train_loss": -25.7141170501709, "global_step": 338488, "epoch": 4078} {"train_loss": -25.632221221923828, "global_step": 338489, "epoch": 4078} {"train_loss": -25.399560928344727, "global_step": 338490, "epoch": 4078} {"train_loss": -25.487812042236328, "global_step": 338491, "epoch": 4078} {"train_loss": -25.14850425720215, "global_step": 338492, "epoch": 4078} {"train_loss": -25.390424728393555, "global_step": 338493, "epoch": 4078} {"train_loss": -25.38433265686035, "global_step": 338494, "epoch": 4078} {"train_loss": -25.629608154296875, "global_step": 338495, "epoch": 4078} {"train_loss": -25.575124740600586, "global_step": 338496, "epoch": 4078} {"train_loss": -25.659879684448242, "global_step": 338497, "epoch": 4078} {"train_loss": -25.864606857299805, "global_step": 338498, "epoch": 4078} {"train_loss": -25.87470054626465, "global_step": 338499, "epoch": 4078} {"train_loss": -25.72555923461914, "global_step": 338500, "epoch": 4078} {"train_loss": -26.21890640258789, "global_step": 338501, "epoch": 4078} {"train_loss": -26.069019317626953, "global_step": 338502, "epoch": 4078} {"train_loss": -26.215396881103516, "global_step": 338503, "epoch": 4078} {"train_loss": -26.127716064453125, "global_step": 338504, "epoch": 4078} {"train_loss": -25.961090087890625, "global_step": 338505, "epoch": 4078} {"train_loss": -25.656982421875, "global_step": 338506, "epoch": 4078} {"train_loss": -25.759313583374023, "global_step": 338507, "epoch": 4078} {"train_loss": -25.95484733581543, "global_step": 338508, "epoch": 4078} {"train_loss": -26.020429611206055, "global_step": 338509, "epoch": 4078} {"train_loss": -25.683439254760742, "global_step": 338510, "epoch": 4078} {"train_loss": -26.436689376831055, "global_step": 338511, "epoch": 4078} {"train_loss": -26.150476455688477, "global_step": 338512, "epoch": 4078} {"train_loss": -26.165435791015625, "global_step": 338513, "epoch": 4078} {"train_loss": -26.014013290405273, "global_step": 338514, "epoch": 4078} {"train_loss": -26.28046989440918, "global_step": 338515, "epoch": 4078} {"train_loss": -25.91640281677246, "global_step": 338516, "epoch": 4078} {"train_loss": -26.059717178344727, "global_step": 338517, "epoch": 4078} {"train_loss": -26.141660690307617, "global_step": 338518, "epoch": 4078} {"train_loss": -26.159997940063477, "global_step": 338519, "epoch": 4078} {"train_loss": -25.950851440429688, "global_step": 338520, "epoch": 4078} {"train_loss": -26.52008056640625, "global_step": 338521, "epoch": 4078} {"train_loss": -25.96589469909668, "global_step": 338522, "epoch": 4078} {"train_loss": -26.437885284423828, "global_step": 338523, "epoch": 4078} {"train_loss": -25.937711715698242, "global_step": 338524, "epoch": 4078} {"train_loss": -26.21514892578125, "global_step": 338525, "epoch": 4078} {"train_loss": -26.02314567565918, "global_step": 338526, "epoch": 4078} {"train_loss": -26.18405532836914, "global_step": 338527, "epoch": 4078} {"train_loss": -25.813825607299805, "global_step": 338528, "epoch": 4078} {"train_loss": -26.3121395111084, "global_step": 338529, "epoch": 4078} {"train_loss": -26.141088485717773, "global_step": 338530, "epoch": 4078} {"train_loss": -26.239587783813477, "global_step": 338531, "epoch": 4078} {"train_loss": -26.049697875976562, "global_step": 338532, "epoch": 4078} {"train_loss": -25.95285415649414, "global_step": 338533, "epoch": 4078} {"train_loss": -26.04400634765625, "global_step": 338534, "epoch": 4078} {"train_loss": -26.356830596923828, "global_step": 338535, "epoch": 4078} {"train_loss": -26.240705490112305, "global_step": 338536, "epoch": 4078} {"train_loss": -25.973554611206055, "global_step": 338537, "epoch": 4078} {"train_loss": -26.369140625, "global_step": 338538, "epoch": 4078} {"train_loss": -25.91522216796875, "global_step": 338539, "epoch": 4078} {"train_loss": -25.799238204956055, "global_step": 338540, "epoch": 4078} {"train_loss": -25.456275939941406, "global_step": 338541, "epoch": 4078} {"train_loss": -25.780324935913086, "global_step": 338542, "epoch": 4078} {"train_loss": -26.070117950439453, "global_step": 338543, "epoch": 4078} {"train_loss": -25.720876693725586, "global_step": 338544, "epoch": 4078} {"train_loss": -25.819562911987305, "global_step": 338545, "epoch": 4078} {"train_loss": -25.95098304748535, "global_step": 338546, "epoch": 4078} {"train_loss": -25.85104751586914, "global_step": 338547, "epoch": 4078} {"train_loss": -25.743452072143555, "global_step": 338548, "epoch": 4078} {"train_loss": -25.902099609375, "global_step": 338549, "epoch": 4078} {"train_loss": -26.17341423034668, "global_step": 338550, "epoch": 4078} {"train_loss": -26.257749557495117, "global_step": 338551, "epoch": 4078} {"train_loss": -26.161304473876953, "global_step": 338552, "epoch": 4078} {"train_loss": -26.07984733581543, "global_step": 338553, "epoch": 4078} {"train_loss": -26.00154685974121, "global_step": 338554, "epoch": 4078} {"train_loss": -26.086395263671875, "global_step": 338555, "epoch": 4078} {"train_loss": -25.81787320791957, "global_step": 338556, "epoch": 4078, "val_loss": 6678429.0} {"train_loss": -25.847030639648438, "global_step": 338557, "epoch": 4079} {"train_loss": -25.829294204711914, "global_step": 338558, "epoch": 4079} {"train_loss": -25.886646270751953, "global_step": 338559, "epoch": 4079} {"train_loss": -25.792163848876953, "global_step": 338560, "epoch": 4079} {"train_loss": -25.781604766845703, "global_step": 338561, "epoch": 4079} {"train_loss": -25.8587589263916, "global_step": 338562, "epoch": 4079} {"train_loss": -25.82305908203125, "global_step": 338563, "epoch": 4079} {"train_loss": -25.67487144470215, "global_step": 338564, "epoch": 4079} {"train_loss": -25.497161865234375, "global_step": 338565, "epoch": 4079} {"train_loss": -25.75762939453125, "global_step": 338566, "epoch": 4079} {"train_loss": -26.070661544799805, "global_step": 338567, "epoch": 4079} {"train_loss": -25.526113510131836, "global_step": 338568, "epoch": 4079} {"train_loss": -25.957157135009766, "global_step": 338569, "epoch": 4079} {"train_loss": -26.404138565063477, "global_step": 338570, "epoch": 4079} {"train_loss": -26.192529678344727, "global_step": 338571, "epoch": 4079} {"train_loss": -26.218000411987305, "global_step": 338572, "epoch": 4079} {"train_loss": -25.75575828552246, "global_step": 338573, "epoch": 4079} {"train_loss": -25.827259063720703, "global_step": 338574, "epoch": 4079} {"train_loss": -26.1463565826416, "global_step": 338575, "epoch": 4079} {"train_loss": -26.04736328125, "global_step": 338576, "epoch": 4079} {"train_loss": -26.049468994140625, "global_step": 338577, "epoch": 4079} {"train_loss": -25.97297477722168, "global_step": 338578, "epoch": 4079} {"train_loss": -26.219308853149414, "global_step": 338579, "epoch": 4079} {"train_loss": -26.03736686706543, "global_step": 338580, "epoch": 4079} {"train_loss": -25.92390251159668, "global_step": 338581, "epoch": 4079} {"train_loss": -26.33342933654785, "global_step": 338582, "epoch": 4079} {"train_loss": -26.04951286315918, "global_step": 338583, "epoch": 4079} {"train_loss": -26.374292373657227, "global_step": 338584, "epoch": 4079} {"train_loss": -26.0561580657959, "global_step": 338585, "epoch": 4079} {"train_loss": -26.299362182617188, "global_step": 338586, "epoch": 4079} {"train_loss": -26.518529891967773, "global_step": 338587, "epoch": 4079} {"train_loss": -26.1754207611084, "global_step": 338588, "epoch": 4079} {"train_loss": -26.451261520385742, "global_step": 338589, "epoch": 4079} {"train_loss": -25.988636016845703, "global_step": 338590, "epoch": 4079} {"train_loss": -25.921497344970703, "global_step": 338591, "epoch": 4079} {"train_loss": -25.944433212280273, "global_step": 338592, "epoch": 4079} {"train_loss": -25.720996856689453, "global_step": 338593, "epoch": 4079} {"train_loss": -26.312545776367188, "global_step": 338594, "epoch": 4079} {"train_loss": -26.19410514831543, "global_step": 338595, "epoch": 4079} {"train_loss": -25.8834228515625, "global_step": 338596, "epoch": 4079} {"train_loss": -25.911651611328125, "global_step": 338597, "epoch": 4079} {"train_loss": -26.260461807250977, "global_step": 338598, "epoch": 4079} {"train_loss": -26.174163818359375, "global_step": 338599, "epoch": 4079} {"train_loss": -26.278974533081055, "global_step": 338600, "epoch": 4079} {"train_loss": -26.026575088500977, "global_step": 338601, "epoch": 4079} {"train_loss": -26.2214298248291, "global_step": 338602, "epoch": 4079} {"train_loss": -25.769811630249023, "global_step": 338603, "epoch": 4079} {"train_loss": -26.16206932067871, "global_step": 338604, "epoch": 4079} {"train_loss": -26.367420196533203, "global_step": 338605, "epoch": 4079} {"train_loss": -26.077804565429688, "global_step": 338606, "epoch": 4079} {"train_loss": -26.25935935974121, "global_step": 338607, "epoch": 4079} {"train_loss": -26.039342880249023, "global_step": 338608, "epoch": 4079} {"train_loss": -26.2629337310791, "global_step": 338609, "epoch": 4079} {"train_loss": -26.311737060546875, "global_step": 338610, "epoch": 4079} {"train_loss": -26.114856719970703, "global_step": 338611, "epoch": 4079} {"train_loss": -26.25398063659668, "global_step": 338612, "epoch": 4079} {"train_loss": -26.031606674194336, "global_step": 338613, "epoch": 4079} {"train_loss": -25.873498916625977, "global_step": 338614, "epoch": 4079} {"train_loss": -26.07489013671875, "global_step": 338615, "epoch": 4079} {"train_loss": -25.750873565673828, "global_step": 338616, "epoch": 4079} {"train_loss": -25.9289608001709, "global_step": 338617, "epoch": 4079} {"train_loss": -25.86189079284668, "global_step": 338618, "epoch": 4079} {"train_loss": -26.102893829345703, "global_step": 338619, "epoch": 4079} {"train_loss": -26.32770347595215, "global_step": 338620, "epoch": 4079} {"train_loss": -26.07724952697754, "global_step": 338621, "epoch": 4079} {"train_loss": -25.82447624206543, "global_step": 338622, "epoch": 4079} {"train_loss": -25.45168113708496, "global_step": 338623, "epoch": 4079} {"train_loss": -25.096935272216797, "global_step": 338624, "epoch": 4079} {"train_loss": -25.329221725463867, "global_step": 338625, "epoch": 4079} {"train_loss": -25.864973068237305, "global_step": 338626, "epoch": 4079} {"train_loss": -26.23892593383789, "global_step": 338627, "epoch": 4079} {"train_loss": -25.75750160217285, "global_step": 338628, "epoch": 4079} {"train_loss": -25.65699577331543, "global_step": 338629, "epoch": 4079} {"train_loss": -25.627180099487305, "global_step": 338630, "epoch": 4079} {"train_loss": -25.532861709594727, "global_step": 338631, "epoch": 4079} {"train_loss": -26.148029327392578, "global_step": 338632, "epoch": 4079} {"train_loss": -26.021635055541992, "global_step": 338633, "epoch": 4079} {"train_loss": -26.075977325439453, "global_step": 338634, "epoch": 4079} {"train_loss": -25.78504753112793, "global_step": 338635, "epoch": 4079} {"train_loss": -26.02924156188965, "global_step": 338636, "epoch": 4079} {"train_loss": -25.509687423706055, "global_step": 338637, "epoch": 4079} {"train_loss": -25.6534423828125, "global_step": 338638, "epoch": 4079} {"train_loss": -25.986543931156756, "global_step": 338639, "epoch": 4079, "val_loss": 6746054.0} {"train_loss": -24.16053009033203, "global_step": 338640, "epoch": 4080} {"train_loss": -24.840106964111328, "global_step": 338641, "epoch": 4080} {"train_loss": -24.11215591430664, "global_step": 338642, "epoch": 4080} {"train_loss": -24.60020637512207, "global_step": 338643, "epoch": 4080} {"train_loss": -25.170902252197266, "global_step": 338644, "epoch": 4080} {"train_loss": -24.863296508789062, "global_step": 338645, "epoch": 4080} {"train_loss": -25.130199432373047, "global_step": 338646, "epoch": 4080} {"train_loss": -25.19101333618164, "global_step": 338647, "epoch": 4080} {"train_loss": -24.849809646606445, "global_step": 338648, "epoch": 4080} {"train_loss": -25.255416870117188, "global_step": 338649, "epoch": 4080} {"train_loss": -25.439468383789062, "global_step": 338650, "epoch": 4080} {"train_loss": -25.502290725708008, "global_step": 338651, "epoch": 4080} {"train_loss": -25.18642234802246, "global_step": 338652, "epoch": 4080} {"train_loss": -25.383386611938477, "global_step": 338653, "epoch": 4080} {"train_loss": -25.7442626953125, "global_step": 338654, "epoch": 4080} {"train_loss": -25.08624839782715, "global_step": 338655, "epoch": 4080} {"train_loss": -25.761198043823242, "global_step": 338656, "epoch": 4080} {"train_loss": -25.2653751373291, "global_step": 338657, "epoch": 4080} {"train_loss": -25.39503288269043, "global_step": 338658, "epoch": 4080} {"train_loss": -25.437803268432617, "global_step": 338659, "epoch": 4080} {"train_loss": -25.48719024658203, "global_step": 338660, "epoch": 4080} {"train_loss": -25.971851348876953, "global_step": 338661, "epoch": 4080} {"train_loss": -25.534351348876953, "global_step": 338662, "epoch": 4080} {"train_loss": -25.817890167236328, "global_step": 338663, "epoch": 4080} {"train_loss": -25.438833236694336, "global_step": 338664, "epoch": 4080} {"train_loss": -25.876150131225586, "global_step": 338665, "epoch": 4080} {"train_loss": -25.73793601989746, "global_step": 338666, "epoch": 4080} {"train_loss": -25.8668155670166, "global_step": 338667, "epoch": 4080} {"train_loss": -25.6246395111084, "global_step": 338668, "epoch": 4080} {"train_loss": -26.06159782409668, "global_step": 338669, "epoch": 4080} {"train_loss": -25.828886032104492, "global_step": 338670, "epoch": 4080} {"train_loss": -25.930097579956055, "global_step": 338671, "epoch": 4080} {"train_loss": -25.986902236938477, "global_step": 338672, "epoch": 4080} {"train_loss": -25.94184684753418, "global_step": 338673, "epoch": 4080} {"train_loss": -25.96955680847168, "global_step": 338674, "epoch": 4080} {"train_loss": -26.288711547851562, "global_step": 338675, "epoch": 4080} {"train_loss": -25.8887939453125, "global_step": 338676, "epoch": 4080} {"train_loss": -26.048542022705078, "global_step": 338677, "epoch": 4080} {"train_loss": -26.09112548828125, "global_step": 338678, "epoch": 4080} {"train_loss": -26.03934097290039, "global_step": 338679, "epoch": 4080} {"train_loss": -26.31707191467285, "global_step": 338680, "epoch": 4080} {"train_loss": -26.19114112854004, "global_step": 338681, "epoch": 4080} {"train_loss": -26.187387466430664, "global_step": 338682, "epoch": 4080} {"train_loss": -26.030237197875977, "global_step": 338683, "epoch": 4080} {"train_loss": -26.3308162689209, "global_step": 338684, "epoch": 4080} {"train_loss": -26.058218002319336, "global_step": 338685, "epoch": 4080} {"train_loss": -25.909582138061523, "global_step": 338686, "epoch": 4080} {"train_loss": -26.273330688476562, "global_step": 338687, "epoch": 4080} {"train_loss": -26.235273361206055, "global_step": 338688, "epoch": 4080} {"train_loss": -26.307748794555664, "global_step": 338689, "epoch": 4080} {"train_loss": -26.312057495117188, "global_step": 338690, "epoch": 4080} {"train_loss": -26.459257125854492, "global_step": 338691, "epoch": 4080} {"train_loss": -26.290719985961914, "global_step": 338692, "epoch": 4080} {"train_loss": -25.806411743164062, "global_step": 338693, "epoch": 4080} {"train_loss": -25.909093856811523, "global_step": 338694, "epoch": 4080} {"train_loss": -26.069976806640625, "global_step": 338695, "epoch": 4080} {"train_loss": -26.10894203186035, "global_step": 338696, "epoch": 4080} {"train_loss": -26.003225326538086, "global_step": 338697, "epoch": 4080} {"train_loss": -26.331439971923828, "global_step": 338698, "epoch": 4080} {"train_loss": -26.03487205505371, "global_step": 338699, "epoch": 4080} {"train_loss": -26.34136390686035, "global_step": 338700, "epoch": 4080} {"train_loss": -26.1207218170166, "global_step": 338701, "epoch": 4080} {"train_loss": -25.892019271850586, "global_step": 338702, "epoch": 4080} {"train_loss": -26.277402877807617, "global_step": 338703, "epoch": 4080} {"train_loss": -26.024927139282227, "global_step": 338704, "epoch": 4080} {"train_loss": -26.26194190979004, "global_step": 338705, "epoch": 4080} {"train_loss": -26.564218521118164, "global_step": 338706, "epoch": 4080} {"train_loss": -26.30472755432129, "global_step": 338707, "epoch": 4080} {"train_loss": -26.439788818359375, "global_step": 338708, "epoch": 4080} {"train_loss": -26.25811767578125, "global_step": 338709, "epoch": 4080} {"train_loss": -26.25664710998535, "global_step": 338710, "epoch": 4080} {"train_loss": -26.07242202758789, "global_step": 338711, "epoch": 4080} {"train_loss": -26.464263916015625, "global_step": 338712, "epoch": 4080} {"train_loss": -26.542871475219727, "global_step": 338713, "epoch": 4080} {"train_loss": -26.18159294128418, "global_step": 338714, "epoch": 4080} {"train_loss": -25.521284103393555, "global_step": 338715, "epoch": 4080} {"train_loss": -25.305395126342773, "global_step": 338716, "epoch": 4080} {"train_loss": -25.566082000732422, "global_step": 338717, "epoch": 4080} {"train_loss": -25.29067039489746, "global_step": 338718, "epoch": 4080} {"train_loss": -25.897918701171875, "global_step": 338719, "epoch": 4080} {"train_loss": -25.833602905273438, "global_step": 338720, "epoch": 4080} {"train_loss": -25.998931884765625, "global_step": 338721, "epoch": 4080} {"train_loss": -25.7997450771102, "global_step": 338722, "epoch": 4080, "val_loss": 6673621.0} {"train_loss": -24.706302642822266, "global_step": 338723, "epoch": 4081} {"train_loss": -24.279037475585938, "global_step": 338724, "epoch": 4081} {"train_loss": -25.28582763671875, "global_step": 338725, "epoch": 4081} {"train_loss": -24.761249542236328, "global_step": 338726, "epoch": 4081} {"train_loss": -24.596660614013672, "global_step": 338727, "epoch": 4081} {"train_loss": -25.408672332763672, "global_step": 338728, "epoch": 4081} {"train_loss": -24.792470932006836, "global_step": 338729, "epoch": 4081} {"train_loss": -25.584627151489258, "global_step": 338730, "epoch": 4081} {"train_loss": -24.28729820251465, "global_step": 338731, "epoch": 4081} {"train_loss": -25.614904403686523, "global_step": 338732, "epoch": 4081} {"train_loss": -24.732385635375977, "global_step": 338733, "epoch": 4081} {"train_loss": -25.020801544189453, "global_step": 338734, "epoch": 4081} {"train_loss": -25.4877872467041, "global_step": 338735, "epoch": 4081} {"train_loss": -24.917268753051758, "global_step": 338736, "epoch": 4081} {"train_loss": -24.99102210998535, "global_step": 338737, "epoch": 4081} {"train_loss": -25.26002311706543, "global_step": 338738, "epoch": 4081} {"train_loss": -25.312875747680664, "global_step": 338739, "epoch": 4081} {"train_loss": -25.606491088867188, "global_step": 338740, "epoch": 4081} {"train_loss": -25.470352172851562, "global_step": 338741, "epoch": 4081} {"train_loss": -25.60825538635254, "global_step": 338742, "epoch": 4081} {"train_loss": -25.6137752532959, "global_step": 338743, "epoch": 4081} {"train_loss": -25.34722900390625, "global_step": 338744, "epoch": 4081} {"train_loss": -25.538087844848633, "global_step": 338745, "epoch": 4081} {"train_loss": -25.514951705932617, "global_step": 338746, "epoch": 4081} {"train_loss": -25.798736572265625, "global_step": 338747, "epoch": 4081} {"train_loss": -25.94788932800293, "global_step": 338748, "epoch": 4081} {"train_loss": -25.7395076751709, "global_step": 338749, "epoch": 4081} {"train_loss": -25.448577880859375, "global_step": 338750, "epoch": 4081} {"train_loss": -25.935667037963867, "global_step": 338751, "epoch": 4081} {"train_loss": -25.57354736328125, "global_step": 338752, "epoch": 4081} {"train_loss": -25.949975967407227, "global_step": 338753, "epoch": 4081} {"train_loss": -26.013757705688477, "global_step": 338754, "epoch": 4081} {"train_loss": -26.314172744750977, "global_step": 338755, "epoch": 4081} {"train_loss": -25.844099044799805, "global_step": 338756, "epoch": 4081} {"train_loss": -25.88776206970215, "global_step": 338757, "epoch": 4081} {"train_loss": -25.78168296813965, "global_step": 338758, "epoch": 4081} {"train_loss": -26.157079696655273, "global_step": 338759, "epoch": 4081} {"train_loss": -26.261960983276367, "global_step": 338760, "epoch": 4081} {"train_loss": -26.544397354125977, "global_step": 338761, "epoch": 4081} {"train_loss": -25.785558700561523, "global_step": 338762, "epoch": 4081} {"train_loss": -26.24749755859375, "global_step": 338763, "epoch": 4081} {"train_loss": -26.064762115478516, "global_step": 338764, "epoch": 4081} {"train_loss": -25.596738815307617, "global_step": 338765, "epoch": 4081} {"train_loss": -26.252954483032227, "global_step": 338766, "epoch": 4081} {"train_loss": -26.350494384765625, "global_step": 338767, "epoch": 4081} {"train_loss": -25.861652374267578, "global_step": 338768, "epoch": 4081} {"train_loss": -25.986387252807617, "global_step": 338769, "epoch": 4081} {"train_loss": -26.0449161529541, "global_step": 338770, "epoch": 4081} {"train_loss": -26.168249130249023, "global_step": 338771, "epoch": 4081} {"train_loss": -26.240142822265625, "global_step": 338772, "epoch": 4081} {"train_loss": -26.34613037109375, "global_step": 338773, "epoch": 4081} {"train_loss": -26.114789962768555, "global_step": 338774, "epoch": 4081} {"train_loss": -26.394489288330078, "global_step": 338775, "epoch": 4081} {"train_loss": -26.01869010925293, "global_step": 338776, "epoch": 4081} {"train_loss": -25.882827758789062, "global_step": 338777, "epoch": 4081} {"train_loss": -26.06730079650879, "global_step": 338778, "epoch": 4081} {"train_loss": -26.06171989440918, "global_step": 338779, "epoch": 4081} {"train_loss": -25.92104148864746, "global_step": 338780, "epoch": 4081} {"train_loss": -25.77288246154785, "global_step": 338781, "epoch": 4081} {"train_loss": -26.22824478149414, "global_step": 338782, "epoch": 4081} {"train_loss": -26.233291625976562, "global_step": 338783, "epoch": 4081} {"train_loss": -26.15228271484375, "global_step": 338784, "epoch": 4081} {"train_loss": -25.99555015563965, "global_step": 338785, "epoch": 4081} {"train_loss": -25.746936798095703, "global_step": 338786, "epoch": 4081} {"train_loss": -26.090967178344727, "global_step": 338787, "epoch": 4081} {"train_loss": -25.912689208984375, "global_step": 338788, "epoch": 4081} {"train_loss": -25.777084350585938, "global_step": 338789, "epoch": 4081} {"train_loss": -26.133270263671875, "global_step": 338790, "epoch": 4081} {"train_loss": -26.210012435913086, "global_step": 338791, "epoch": 4081} {"train_loss": -25.851093292236328, "global_step": 338792, "epoch": 4081} {"train_loss": -25.861316680908203, "global_step": 338793, "epoch": 4081} {"train_loss": -26.096036911010742, "global_step": 338794, "epoch": 4081} {"train_loss": -25.924121856689453, "global_step": 338795, "epoch": 4081} {"train_loss": -26.405658721923828, "global_step": 338796, "epoch": 4081} {"train_loss": -26.180856704711914, "global_step": 338797, "epoch": 4081} {"train_loss": -26.212757110595703, "global_step": 338798, "epoch": 4081} {"train_loss": -26.0334415435791, "global_step": 338799, "epoch": 4081} {"train_loss": -25.390958786010742, "global_step": 338800, "epoch": 4081} {"train_loss": -26.277206420898438, "global_step": 338801, "epoch": 4081} {"train_loss": -25.954309463500977, "global_step": 338802, "epoch": 4081} {"train_loss": -26.25235366821289, "global_step": 338803, "epoch": 4081} {"train_loss": -26.35906410217285, "global_step": 338804, "epoch": 4081} {"train_loss": -25.779522677502, "global_step": 338805, "epoch": 4081, "val_loss": 6688933.0} {"train_loss": -25.215036392211914, "global_step": 338806, "epoch": 4082} {"train_loss": -25.028125762939453, "global_step": 338807, "epoch": 4082} {"train_loss": -24.966705322265625, "global_step": 338808, "epoch": 4082} {"train_loss": -25.48883628845215, "global_step": 338809, "epoch": 4082} {"train_loss": -23.718687057495117, "global_step": 338810, "epoch": 4082} {"train_loss": -25.73042106628418, "global_step": 338811, "epoch": 4082} {"train_loss": -23.79449462890625, "global_step": 338812, "epoch": 4082} {"train_loss": -25.136476516723633, "global_step": 338813, "epoch": 4082} {"train_loss": -25.323789596557617, "global_step": 338814, "epoch": 4082} {"train_loss": -25.6647891998291, "global_step": 338815, "epoch": 4082} {"train_loss": -25.37942123413086, "global_step": 338816, "epoch": 4082} {"train_loss": -25.728910446166992, "global_step": 338817, "epoch": 4082} {"train_loss": -25.62624168395996, "global_step": 338818, "epoch": 4082} {"train_loss": -25.458606719970703, "global_step": 338819, "epoch": 4082} {"train_loss": -25.867328643798828, "global_step": 338820, "epoch": 4082} {"train_loss": -25.32056999206543, "global_step": 338821, "epoch": 4082} {"train_loss": -25.459625244140625, "global_step": 338822, "epoch": 4082} {"train_loss": -26.030736923217773, "global_step": 338823, "epoch": 4082} {"train_loss": -25.67862319946289, "global_step": 338824, "epoch": 4082} {"train_loss": -25.45465660095215, "global_step": 338825, "epoch": 4082} {"train_loss": -25.40638542175293, "global_step": 338826, "epoch": 4082} {"train_loss": -25.67376708984375, "global_step": 338827, "epoch": 4082} {"train_loss": -25.498218536376953, "global_step": 338828, "epoch": 4082} {"train_loss": -25.914188385009766, "global_step": 338829, "epoch": 4082} {"train_loss": -25.518796920776367, "global_step": 338830, "epoch": 4082} {"train_loss": -25.69148063659668, "global_step": 338831, "epoch": 4082} {"train_loss": -25.9600772857666, "global_step": 338832, "epoch": 4082} {"train_loss": -25.79703140258789, "global_step": 338833, "epoch": 4082} {"train_loss": -25.98105239868164, "global_step": 338834, "epoch": 4082} {"train_loss": -26.00225830078125, "global_step": 338835, "epoch": 4082} {"train_loss": -25.509946823120117, "global_step": 338836, "epoch": 4082} {"train_loss": -25.923376083374023, "global_step": 338837, "epoch": 4082} {"train_loss": -25.769210815429688, "global_step": 338838, "epoch": 4082} {"train_loss": -25.704343795776367, "global_step": 338839, "epoch": 4082} {"train_loss": -26.171064376831055, "global_step": 338840, "epoch": 4082} {"train_loss": -26.022245407104492, "global_step": 338841, "epoch": 4082} {"train_loss": -25.868452072143555, "global_step": 338842, "epoch": 4082} {"train_loss": -25.981836318969727, "global_step": 338843, "epoch": 4082} {"train_loss": -25.83340835571289, "global_step": 338844, "epoch": 4082} {"train_loss": -26.241596221923828, "global_step": 338845, "epoch": 4082} {"train_loss": -26.018823623657227, "global_step": 338846, "epoch": 4082} {"train_loss": -25.93511962890625, "global_step": 338847, "epoch": 4082} {"train_loss": -25.859119415283203, "global_step": 338848, "epoch": 4082} {"train_loss": -26.06292724609375, "global_step": 338849, "epoch": 4082} {"train_loss": -26.113113403320312, "global_step": 338850, "epoch": 4082} {"train_loss": -26.057287216186523, "global_step": 338851, "epoch": 4082} {"train_loss": -26.17120933532715, "global_step": 338852, "epoch": 4082} {"train_loss": -26.21050453186035, "global_step": 338853, "epoch": 4082} {"train_loss": -26.006351470947266, "global_step": 338854, "epoch": 4082} {"train_loss": -26.23089027404785, "global_step": 338855, "epoch": 4082} {"train_loss": -26.438720703125, "global_step": 338856, "epoch": 4082} {"train_loss": -25.848691940307617, "global_step": 338857, "epoch": 4082} {"train_loss": -26.323013305664062, "global_step": 338858, "epoch": 4082} {"train_loss": -26.23565101623535, "global_step": 338859, "epoch": 4082} {"train_loss": -26.178730010986328, "global_step": 338860, "epoch": 4082} {"train_loss": -26.065587997436523, "global_step": 338861, "epoch": 4082} {"train_loss": -26.03681755065918, "global_step": 338862, "epoch": 4082} {"train_loss": -26.191394805908203, "global_step": 338863, "epoch": 4082} {"train_loss": -25.945077896118164, "global_step": 338864, "epoch": 4082} {"train_loss": -25.705554962158203, "global_step": 338865, "epoch": 4082} {"train_loss": -26.032520294189453, "global_step": 338866, "epoch": 4082} {"train_loss": -25.90723991394043, "global_step": 338867, "epoch": 4082} {"train_loss": -26.15085792541504, "global_step": 338868, "epoch": 4082} {"train_loss": -25.968027114868164, "global_step": 338869, "epoch": 4082} {"train_loss": -26.229129791259766, "global_step": 338870, "epoch": 4082} {"train_loss": -26.338171005249023, "global_step": 338871, "epoch": 4082} {"train_loss": -26.427112579345703, "global_step": 338872, "epoch": 4082} {"train_loss": -26.149005889892578, "global_step": 338873, "epoch": 4082} {"train_loss": -26.118391036987305, "global_step": 338874, "epoch": 4082} {"train_loss": -26.414886474609375, "global_step": 338875, "epoch": 4082} {"train_loss": -26.114538192749023, "global_step": 338876, "epoch": 4082} {"train_loss": -26.15663719177246, "global_step": 338877, "epoch": 4082} {"train_loss": -25.82745361328125, "global_step": 338878, "epoch": 4082} {"train_loss": -25.857282638549805, "global_step": 338879, "epoch": 4082} {"train_loss": -26.2420597076416, "global_step": 338880, "epoch": 4082} {"train_loss": -26.070480346679688, "global_step": 338881, "epoch": 4082} {"train_loss": -26.055591583251953, "global_step": 338882, "epoch": 4082} {"train_loss": -26.705677032470703, "global_step": 338883, "epoch": 4082} {"train_loss": -25.874073028564453, "global_step": 338884, "epoch": 4082} {"train_loss": -26.054901123046875, "global_step": 338885, "epoch": 4082} {"train_loss": -26.082538604736328, "global_step": 338886, "epoch": 4082} {"train_loss": -26.201679229736328, "global_step": 338887, "epoch": 4082} {"train_loss": -25.85582287340279, "global_step": 338888, "epoch": 4082, "val_loss": 6770189.0} {"train_loss": -25.627344131469727, "global_step": 338889, "epoch": 4083} {"train_loss": -24.627336502075195, "global_step": 338890, "epoch": 4083} {"train_loss": -25.719635009765625, "global_step": 338891, "epoch": 4083} {"train_loss": -25.07550621032715, "global_step": 338892, "epoch": 4083} {"train_loss": -25.062978744506836, "global_step": 338893, "epoch": 4083} {"train_loss": -25.44952392578125, "global_step": 338894, "epoch": 4083} {"train_loss": -25.31507682800293, "global_step": 338895, "epoch": 4083} {"train_loss": -25.82269859313965, "global_step": 338896, "epoch": 4083} {"train_loss": -25.190494537353516, "global_step": 338897, "epoch": 4083} {"train_loss": -25.8394718170166, "global_step": 338898, "epoch": 4083} {"train_loss": -25.585979461669922, "global_step": 338899, "epoch": 4083} {"train_loss": -25.831195831298828, "global_step": 338900, "epoch": 4083} {"train_loss": -25.492633819580078, "global_step": 338901, "epoch": 4083} {"train_loss": -26.178747177124023, "global_step": 338902, "epoch": 4083} {"train_loss": -25.498077392578125, "global_step": 338903, "epoch": 4083} {"train_loss": -25.966064453125, "global_step": 338904, "epoch": 4083} {"train_loss": -25.74595069885254, "global_step": 338905, "epoch": 4083} {"train_loss": -25.666112899780273, "global_step": 338906, "epoch": 4083} {"train_loss": -25.932098388671875, "global_step": 338907, "epoch": 4083} {"train_loss": -26.062732696533203, "global_step": 338908, "epoch": 4083} {"train_loss": -25.930694580078125, "global_step": 338909, "epoch": 4083} {"train_loss": -25.64105224609375, "global_step": 338910, "epoch": 4083} {"train_loss": -25.68682289123535, "global_step": 338911, "epoch": 4083} {"train_loss": -26.04730796813965, "global_step": 338912, "epoch": 4083} {"train_loss": -25.869115829467773, "global_step": 338913, "epoch": 4083} {"train_loss": -26.0628719329834, "global_step": 338914, "epoch": 4083} {"train_loss": -25.662261962890625, "global_step": 338915, "epoch": 4083} {"train_loss": -25.796506881713867, "global_step": 338916, "epoch": 4083} {"train_loss": -25.99344253540039, "global_step": 338917, "epoch": 4083} {"train_loss": -25.9141788482666, "global_step": 338918, "epoch": 4083} {"train_loss": -25.906574249267578, "global_step": 338919, "epoch": 4083} {"train_loss": -25.797321319580078, "global_step": 338920, "epoch": 4083} {"train_loss": -25.998615264892578, "global_step": 338921, "epoch": 4083} {"train_loss": -26.245508193969727, "global_step": 338922, "epoch": 4083} {"train_loss": -26.280609130859375, "global_step": 338923, "epoch": 4083} {"train_loss": -26.06807518005371, "global_step": 338924, "epoch": 4083} {"train_loss": -26.187524795532227, "global_step": 338925, "epoch": 4083} {"train_loss": -25.989368438720703, "global_step": 338926, "epoch": 4083} {"train_loss": -26.03508949279785, "global_step": 338927, "epoch": 4083} {"train_loss": -26.362096786499023, "global_step": 338928, "epoch": 4083} {"train_loss": -26.011884689331055, "global_step": 338929, "epoch": 4083} {"train_loss": -26.43416404724121, "global_step": 338930, "epoch": 4083} {"train_loss": -26.3523006439209, "global_step": 338931, "epoch": 4083} {"train_loss": -26.139892578125, "global_step": 338932, "epoch": 4083} {"train_loss": -26.140552520751953, "global_step": 338933, "epoch": 4083} {"train_loss": -25.906408309936523, "global_step": 338934, "epoch": 4083} {"train_loss": -26.24909019470215, "global_step": 338935, "epoch": 4083} {"train_loss": -26.24652671813965, "global_step": 338936, "epoch": 4083} {"train_loss": -26.139806747436523, "global_step": 338937, "epoch": 4083} {"train_loss": -25.974475860595703, "global_step": 338938, "epoch": 4083} {"train_loss": -26.367650985717773, "global_step": 338939, "epoch": 4083} {"train_loss": -26.171728134155273, "global_step": 338940, "epoch": 4083} {"train_loss": -26.171720504760742, "global_step": 338941, "epoch": 4083} {"train_loss": -25.81058692932129, "global_step": 338942, "epoch": 4083} {"train_loss": -26.16143226623535, "global_step": 338943, "epoch": 4083} {"train_loss": -25.979169845581055, "global_step": 338944, "epoch": 4083} {"train_loss": -26.119327545166016, "global_step": 338945, "epoch": 4083} {"train_loss": -26.07284927368164, "global_step": 338946, "epoch": 4083} {"train_loss": -25.554126739501953, "global_step": 338947, "epoch": 4083} {"train_loss": -25.961334228515625, "global_step": 338948, "epoch": 4083} {"train_loss": -26.004236221313477, "global_step": 338949, "epoch": 4083} {"train_loss": -26.316543579101562, "global_step": 338950, "epoch": 4083} {"train_loss": -25.92072105407715, "global_step": 338951, "epoch": 4083} {"train_loss": -25.8226261138916, "global_step": 338952, "epoch": 4083} {"train_loss": -26.04074478149414, "global_step": 338953, "epoch": 4083} {"train_loss": -25.50689125061035, "global_step": 338954, "epoch": 4083} {"train_loss": -25.792133331298828, "global_step": 338955, "epoch": 4083} {"train_loss": -26.249303817749023, "global_step": 338956, "epoch": 4083} {"train_loss": -25.695327758789062, "global_step": 338957, "epoch": 4083} {"train_loss": -26.5327091217041, "global_step": 338958, "epoch": 4083} {"train_loss": -26.05484962463379, "global_step": 338959, "epoch": 4083} {"train_loss": -25.835569381713867, "global_step": 338960, "epoch": 4083} {"train_loss": -25.911645889282227, "global_step": 338961, "epoch": 4083} {"train_loss": -26.011062622070312, "global_step": 338962, "epoch": 4083} {"train_loss": -26.153940200805664, "global_step": 338963, "epoch": 4083} {"train_loss": -25.771249771118164, "global_step": 338964, "epoch": 4083} {"train_loss": -26.052106857299805, "global_step": 338965, "epoch": 4083} {"train_loss": -25.65363883972168, "global_step": 338966, "epoch": 4083} {"train_loss": -26.085693359375, "global_step": 338967, "epoch": 4083} {"train_loss": -26.3272762298584, "global_step": 338968, "epoch": 4083} {"train_loss": -26.352863311767578, "global_step": 338969, "epoch": 4083} {"train_loss": -25.90479850769043, "global_step": 338970, "epoch": 4083} {"train_loss": -25.938086429274225, "global_step": 338971, "epoch": 4083, "val_loss": 6741383.5} {"train_loss": -23.274831771850586, "global_step": 338972, "epoch": 4084} {"train_loss": -24.075525283813477, "global_step": 338973, "epoch": 4084} {"train_loss": -24.366840362548828, "global_step": 338974, "epoch": 4084} {"train_loss": -24.748380661010742, "global_step": 338975, "epoch": 4084} {"train_loss": -24.493860244750977, "global_step": 338976, "epoch": 4084} {"train_loss": -24.973554611206055, "global_step": 338977, "epoch": 4084} {"train_loss": -25.18109703063965, "global_step": 338978, "epoch": 4084} {"train_loss": -24.749608993530273, "global_step": 338979, "epoch": 4084} {"train_loss": -25.230854034423828, "global_step": 338980, "epoch": 4084} {"train_loss": -25.307235717773438, "global_step": 338981, "epoch": 4084} {"train_loss": -24.915647506713867, "global_step": 338982, "epoch": 4084} {"train_loss": -25.20826530456543, "global_step": 338983, "epoch": 4084} {"train_loss": -25.45250129699707, "global_step": 338984, "epoch": 4084} {"train_loss": -24.818143844604492, "global_step": 338985, "epoch": 4084} {"train_loss": -25.295337677001953, "global_step": 338986, "epoch": 4084} {"train_loss": -25.09256362915039, "global_step": 338987, "epoch": 4084} {"train_loss": -25.05326271057129, "global_step": 338988, "epoch": 4084} {"train_loss": -25.219680786132812, "global_step": 338989, "epoch": 4084} {"train_loss": -25.334075927734375, "global_step": 338990, "epoch": 4084} {"train_loss": -25.40095329284668, "global_step": 338991, "epoch": 4084} {"train_loss": -25.234418869018555, "global_step": 338992, "epoch": 4084} {"train_loss": -25.69537353515625, "global_step": 338993, "epoch": 4084} {"train_loss": -25.65966796875, "global_step": 338994, "epoch": 4084} {"train_loss": -25.286787033081055, "global_step": 338995, "epoch": 4084} {"train_loss": -25.72113037109375, "global_step": 338996, "epoch": 4084} {"train_loss": -25.40291404724121, "global_step": 338997, "epoch": 4084} {"train_loss": -25.289974212646484, "global_step": 338998, "epoch": 4084} {"train_loss": -25.582794189453125, "global_step": 338999, "epoch": 4084} {"train_loss": -25.586761474609375, "global_step": 339000, "epoch": 4084} {"train_loss": -25.46112632751465, "global_step": 339001, "epoch": 4084} {"train_loss": -25.774494171142578, "global_step": 339002, "epoch": 4084} {"train_loss": -25.959426879882812, "global_step": 339003, "epoch": 4084} {"train_loss": -25.614194869995117, "global_step": 339004, "epoch": 4084} {"train_loss": -26.02008056640625, "global_step": 339005, "epoch": 4084} {"train_loss": -25.952787399291992, "global_step": 339006, "epoch": 4084} {"train_loss": -25.867528915405273, "global_step": 339007, "epoch": 4084} {"train_loss": -25.631505966186523, "global_step": 339008, "epoch": 4084} {"train_loss": -26.0668888092041, "global_step": 339009, "epoch": 4084} {"train_loss": -25.88584327697754, "global_step": 339010, "epoch": 4084} {"train_loss": -25.710128784179688, "global_step": 339011, "epoch": 4084} {"train_loss": -25.77691650390625, "global_step": 339012, "epoch": 4084} {"train_loss": -26.032079696655273, "global_step": 339013, "epoch": 4084} {"train_loss": -26.10916519165039, "global_step": 339014, "epoch": 4084} {"train_loss": -26.097370147705078, "global_step": 339015, "epoch": 4084} {"train_loss": -26.028600692749023, "global_step": 339016, "epoch": 4084} {"train_loss": -26.043481826782227, "global_step": 339017, "epoch": 4084} {"train_loss": -26.00221061706543, "global_step": 339018, "epoch": 4084} {"train_loss": -26.027612686157227, "global_step": 339019, "epoch": 4084} {"train_loss": -26.43662452697754, "global_step": 339020, "epoch": 4084} {"train_loss": -26.29560661315918, "global_step": 339021, "epoch": 4084} {"train_loss": -26.180261611938477, "global_step": 339022, "epoch": 4084} {"train_loss": -25.995508193969727, "global_step": 339023, "epoch": 4084} {"train_loss": -25.8607234954834, "global_step": 339024, "epoch": 4084} {"train_loss": -25.835739135742188, "global_step": 339025, "epoch": 4084} {"train_loss": -26.55889320373535, "global_step": 339026, "epoch": 4084} {"train_loss": -26.060169219970703, "global_step": 339027, "epoch": 4084} {"train_loss": -26.292505264282227, "global_step": 339028, "epoch": 4084} {"train_loss": -25.765661239624023, "global_step": 339029, "epoch": 4084} {"train_loss": -26.11362075805664, "global_step": 339030, "epoch": 4084} {"train_loss": -26.34014320373535, "global_step": 339031, "epoch": 4084} {"train_loss": -26.03250503540039, "global_step": 339032, "epoch": 4084} {"train_loss": -25.448850631713867, "global_step": 339033, "epoch": 4084} {"train_loss": -26.133075714111328, "global_step": 339034, "epoch": 4084} {"train_loss": -26.196073532104492, "global_step": 339035, "epoch": 4084} {"train_loss": -26.00489616394043, "global_step": 339036, "epoch": 4084} {"train_loss": -25.63123893737793, "global_step": 339037, "epoch": 4084} {"train_loss": -26.218103408813477, "global_step": 339038, "epoch": 4084} {"train_loss": -26.232690811157227, "global_step": 339039, "epoch": 4084} {"train_loss": -26.05616569519043, "global_step": 339040, "epoch": 4084} {"train_loss": -25.841827392578125, "global_step": 339041, "epoch": 4084} {"train_loss": -26.209402084350586, "global_step": 339042, "epoch": 4084} {"train_loss": -26.4515380859375, "global_step": 339043, "epoch": 4084} {"train_loss": -26.213781356811523, "global_step": 339044, "epoch": 4084} {"train_loss": -26.002492904663086, "global_step": 339045, "epoch": 4084} {"train_loss": -25.645200729370117, "global_step": 339046, "epoch": 4084} {"train_loss": -26.509870529174805, "global_step": 339047, "epoch": 4084} {"train_loss": -26.047101974487305, "global_step": 339048, "epoch": 4084} {"train_loss": -25.73211097717285, "global_step": 339049, "epoch": 4084} {"train_loss": -25.960058212280273, "global_step": 339050, "epoch": 4084} {"train_loss": -25.866107940673828, "global_step": 339051, "epoch": 4084} {"train_loss": -26.281864166259766, "global_step": 339052, "epoch": 4084} {"train_loss": -26.375904083251953, "global_step": 339053, "epoch": 4084} {"train_loss": -25.682379021702044, "global_step": 339054, "epoch": 4084, "val_loss": 6549920.5} {"train_loss": -24.28956413269043, "global_step": 339055, "epoch": 4085} {"train_loss": -24.930374145507812, "global_step": 339056, "epoch": 4085} {"train_loss": -25.148313522338867, "global_step": 339057, "epoch": 4085} {"train_loss": -24.910886764526367, "global_step": 339058, "epoch": 4085} {"train_loss": -25.18370819091797, "global_step": 339059, "epoch": 4085} {"train_loss": -24.936681747436523, "global_step": 339060, "epoch": 4085} {"train_loss": -25.362974166870117, "global_step": 339061, "epoch": 4085} {"train_loss": -24.979511260986328, "global_step": 339062, "epoch": 4085} {"train_loss": -25.442676544189453, "global_step": 339063, "epoch": 4085} {"train_loss": -25.50718116760254, "global_step": 339064, "epoch": 4085} {"train_loss": -25.454343795776367, "global_step": 339065, "epoch": 4085} {"train_loss": -25.499902725219727, "global_step": 339066, "epoch": 4085} {"train_loss": -25.363576889038086, "global_step": 339067, "epoch": 4085} {"train_loss": -25.787832260131836, "global_step": 339068, "epoch": 4085} {"train_loss": -25.491262435913086, "global_step": 339069, "epoch": 4085} {"train_loss": -25.497127532958984, "global_step": 339070, "epoch": 4085} {"train_loss": -25.753021240234375, "global_step": 339071, "epoch": 4085} {"train_loss": -25.78645896911621, "global_step": 339072, "epoch": 4085} {"train_loss": -25.771163940429688, "global_step": 339073, "epoch": 4085} {"train_loss": -25.740249633789062, "global_step": 339074, "epoch": 4085} {"train_loss": -26.009647369384766, "global_step": 339075, "epoch": 4085} {"train_loss": -25.881011962890625, "global_step": 339076, "epoch": 4085} {"train_loss": -26.012115478515625, "global_step": 339077, "epoch": 4085} {"train_loss": -25.897878646850586, "global_step": 339078, "epoch": 4085} {"train_loss": -25.697528839111328, "global_step": 339079, "epoch": 4085} {"train_loss": -25.639463424682617, "global_step": 339080, "epoch": 4085} {"train_loss": -26.094287872314453, "global_step": 339081, "epoch": 4085} {"train_loss": -25.8436279296875, "global_step": 339082, "epoch": 4085} {"train_loss": -25.693286895751953, "global_step": 339083, "epoch": 4085} {"train_loss": -25.938461303710938, "global_step": 339084, "epoch": 4085} {"train_loss": -25.9227237701416, "global_step": 339085, "epoch": 4085} {"train_loss": -26.13686180114746, "global_step": 339086, "epoch": 4085} {"train_loss": -26.048810958862305, "global_step": 339087, "epoch": 4085} {"train_loss": -26.332183837890625, "global_step": 339088, "epoch": 4085} {"train_loss": -26.041894912719727, "global_step": 339089, "epoch": 4085} {"train_loss": -26.208972930908203, "global_step": 339090, "epoch": 4085} {"train_loss": -26.201887130737305, "global_step": 339091, "epoch": 4085} {"train_loss": -25.979480743408203, "global_step": 339092, "epoch": 4085} {"train_loss": -25.768035888671875, "global_step": 339093, "epoch": 4085} {"train_loss": -26.25139808654785, "global_step": 339094, "epoch": 4085} {"train_loss": -25.955066680908203, "global_step": 339095, "epoch": 4085} {"train_loss": -26.205692291259766, "global_step": 339096, "epoch": 4085} {"train_loss": -26.12424087524414, "global_step": 339097, "epoch": 4085} {"train_loss": -25.989227294921875, "global_step": 339098, "epoch": 4085} {"train_loss": -26.014951705932617, "global_step": 339099, "epoch": 4085} {"train_loss": -26.361906051635742, "global_step": 339100, "epoch": 4085} {"train_loss": -26.376941680908203, "global_step": 339101, "epoch": 4085} {"train_loss": -25.9725399017334, "global_step": 339102, "epoch": 4085} {"train_loss": -26.42167091369629, "global_step": 339103, "epoch": 4085} {"train_loss": -26.278806686401367, "global_step": 339104, "epoch": 4085} {"train_loss": -26.14873695373535, "global_step": 339105, "epoch": 4085} {"train_loss": -26.163976669311523, "global_step": 339106, "epoch": 4085} {"train_loss": -26.169443130493164, "global_step": 339107, "epoch": 4085} {"train_loss": -26.404834747314453, "global_step": 339108, "epoch": 4085} {"train_loss": -25.986984252929688, "global_step": 339109, "epoch": 4085} {"train_loss": -25.87965202331543, "global_step": 339110, "epoch": 4085} {"train_loss": -26.21527671813965, "global_step": 339111, "epoch": 4085} {"train_loss": -26.100427627563477, "global_step": 339112, "epoch": 4085} {"train_loss": -25.66473388671875, "global_step": 339113, "epoch": 4085} {"train_loss": -26.217559814453125, "global_step": 339114, "epoch": 4085} {"train_loss": -26.266324996948242, "global_step": 339115, "epoch": 4085} {"train_loss": -25.945764541625977, "global_step": 339116, "epoch": 4085} {"train_loss": -26.32264518737793, "global_step": 339117, "epoch": 4085} {"train_loss": -26.18218421936035, "global_step": 339118, "epoch": 4085} {"train_loss": -25.746686935424805, "global_step": 339119, "epoch": 4085} {"train_loss": -26.186044692993164, "global_step": 339120, "epoch": 4085} {"train_loss": -26.118560791015625, "global_step": 339121, "epoch": 4085} {"train_loss": -26.0369815826416, "global_step": 339122, "epoch": 4085} {"train_loss": -26.147266387939453, "global_step": 339123, "epoch": 4085} {"train_loss": -25.8046817779541, "global_step": 339124, "epoch": 4085} {"train_loss": -25.972070693969727, "global_step": 339125, "epoch": 4085} {"train_loss": -25.989246368408203, "global_step": 339126, "epoch": 4085} {"train_loss": -26.115345001220703, "global_step": 339127, "epoch": 4085} {"train_loss": -25.970556259155273, "global_step": 339128, "epoch": 4085} {"train_loss": -26.041553497314453, "global_step": 339129, "epoch": 4085} {"train_loss": -25.91314697265625, "global_step": 339130, "epoch": 4085} {"train_loss": -25.861547470092773, "global_step": 339131, "epoch": 4085} {"train_loss": -26.126220703125, "global_step": 339132, "epoch": 4085} {"train_loss": -26.148914337158203, "global_step": 339133, "epoch": 4085} {"train_loss": -25.885107040405273, "global_step": 339134, "epoch": 4085} {"train_loss": -26.4022274017334, "global_step": 339135, "epoch": 4085} {"train_loss": -26.1007080078125, "global_step": 339136, "epoch": 4085} {"train_loss": -25.878424518079644, "global_step": 339137, "epoch": 4085, "val_loss": 6572624.0} {"train_loss": -26.094465255737305, "global_step": 339138, "epoch": 4086} {"train_loss": -25.74625015258789, "global_step": 339139, "epoch": 4086} {"train_loss": -25.75457763671875, "global_step": 339140, "epoch": 4086} {"train_loss": -25.66034507751465, "global_step": 339141, "epoch": 4086} {"train_loss": -25.751789093017578, "global_step": 339142, "epoch": 4086} {"train_loss": -25.841358184814453, "global_step": 339143, "epoch": 4086} {"train_loss": -26.053913116455078, "global_step": 339144, "epoch": 4086} {"train_loss": -25.900943756103516, "global_step": 339145, "epoch": 4086} {"train_loss": -25.745849609375, "global_step": 339146, "epoch": 4086} {"train_loss": -25.734638214111328, "global_step": 339147, "epoch": 4086} {"train_loss": -25.991886138916016, "global_step": 339148, "epoch": 4086} {"train_loss": -25.704885482788086, "global_step": 339149, "epoch": 4086} {"train_loss": -25.827838897705078, "global_step": 339150, "epoch": 4086} {"train_loss": -26.243377685546875, "global_step": 339151, "epoch": 4086} {"train_loss": -25.979944229125977, "global_step": 339152, "epoch": 4086} {"train_loss": -25.856250762939453, "global_step": 339153, "epoch": 4086} {"train_loss": -25.483417510986328, "global_step": 339154, "epoch": 4086} {"train_loss": -26.01083755493164, "global_step": 339155, "epoch": 4086} {"train_loss": -25.930967330932617, "global_step": 339156, "epoch": 4086} {"train_loss": -25.612897872924805, "global_step": 339157, "epoch": 4086} {"train_loss": -25.490575790405273, "global_step": 339158, "epoch": 4086} {"train_loss": -25.829299926757812, "global_step": 339159, "epoch": 4086} {"train_loss": -26.081335067749023, "global_step": 339160, "epoch": 4086} {"train_loss": -25.925933837890625, "global_step": 339161, "epoch": 4086} {"train_loss": -26.212488174438477, "global_step": 339162, "epoch": 4086} {"train_loss": -26.038818359375, "global_step": 339163, "epoch": 4086} {"train_loss": -26.191909790039062, "global_step": 339164, "epoch": 4086} {"train_loss": -25.878982543945312, "global_step": 339165, "epoch": 4086} {"train_loss": -25.601856231689453, "global_step": 339166, "epoch": 4086} {"train_loss": -25.688871383666992, "global_step": 339167, "epoch": 4086} {"train_loss": -26.40589714050293, "global_step": 339168, "epoch": 4086} {"train_loss": -25.930952072143555, "global_step": 339169, "epoch": 4086} {"train_loss": -26.262060165405273, "global_step": 339170, "epoch": 4086} {"train_loss": -26.05329704284668, "global_step": 339171, "epoch": 4086} {"train_loss": -26.399179458618164, "global_step": 339172, "epoch": 4086} {"train_loss": -26.198715209960938, "global_step": 339173, "epoch": 4086} {"train_loss": -26.341283798217773, "global_step": 339174, "epoch": 4086} {"train_loss": -26.061410903930664, "global_step": 339175, "epoch": 4086} {"train_loss": -26.084863662719727, "global_step": 339176, "epoch": 4086} {"train_loss": -26.33428955078125, "global_step": 339177, "epoch": 4086} {"train_loss": -26.316335678100586, "global_step": 339178, "epoch": 4086} {"train_loss": -26.328088760375977, "global_step": 339179, "epoch": 4086} {"train_loss": -26.44227409362793, "global_step": 339180, "epoch": 4086} {"train_loss": -26.040485382080078, "global_step": 339181, "epoch": 4086} {"train_loss": -26.127750396728516, "global_step": 339182, "epoch": 4086} {"train_loss": -26.509138107299805, "global_step": 339183, "epoch": 4086} {"train_loss": -26.340734481811523, "global_step": 339184, "epoch": 4086} {"train_loss": -26.017126083374023, "global_step": 339185, "epoch": 4086} {"train_loss": -26.584503173828125, "global_step": 339186, "epoch": 4086} {"train_loss": -26.02680015563965, "global_step": 339187, "epoch": 4086} {"train_loss": -26.20977210998535, "global_step": 339188, "epoch": 4086} {"train_loss": -26.24891471862793, "global_step": 339189, "epoch": 4086} {"train_loss": -26.471750259399414, "global_step": 339190, "epoch": 4086} {"train_loss": -26.018787384033203, "global_step": 339191, "epoch": 4086} {"train_loss": -26.14224624633789, "global_step": 339192, "epoch": 4086} {"train_loss": -26.553449630737305, "global_step": 339193, "epoch": 4086} {"train_loss": -25.949771881103516, "global_step": 339194, "epoch": 4086} {"train_loss": -26.331512451171875, "global_step": 339195, "epoch": 4086} {"train_loss": -25.845727920532227, "global_step": 339196, "epoch": 4086} {"train_loss": -25.89039421081543, "global_step": 339197, "epoch": 4086} {"train_loss": -25.75433349609375, "global_step": 339198, "epoch": 4086} {"train_loss": -26.02979850769043, "global_step": 339199, "epoch": 4086} {"train_loss": -25.737668991088867, "global_step": 339200, "epoch": 4086} {"train_loss": -26.135177612304688, "global_step": 339201, "epoch": 4086} {"train_loss": -26.14481544494629, "global_step": 339202, "epoch": 4086} {"train_loss": -25.942052841186523, "global_step": 339203, "epoch": 4086} {"train_loss": -26.601362228393555, "global_step": 339204, "epoch": 4086} {"train_loss": -25.959857940673828, "global_step": 339205, "epoch": 4086} {"train_loss": -26.085424423217773, "global_step": 339206, "epoch": 4086} {"train_loss": -25.71150016784668, "global_step": 339207, "epoch": 4086} {"train_loss": -25.924915313720703, "global_step": 339208, "epoch": 4086} {"train_loss": -26.17531394958496, "global_step": 339209, "epoch": 4086} {"train_loss": -26.10107421875, "global_step": 339210, "epoch": 4086} {"train_loss": -26.20973014831543, "global_step": 339211, "epoch": 4086} {"train_loss": -26.002599716186523, "global_step": 339212, "epoch": 4086} {"train_loss": -25.77914810180664, "global_step": 339213, "epoch": 4086} {"train_loss": -26.039770126342773, "global_step": 339214, "epoch": 4086} {"train_loss": -25.774946212768555, "global_step": 339215, "epoch": 4086} {"train_loss": -26.153182983398438, "global_step": 339216, "epoch": 4086} {"train_loss": -25.957616806030273, "global_step": 339217, "epoch": 4086} {"train_loss": -26.00751304626465, "global_step": 339218, "epoch": 4086} {"train_loss": -26.2868595123291, "global_step": 339219, "epoch": 4086} {"train_loss": -26.019740690667945, "global_step": 339220, "epoch": 4086, "val_loss": 6695181.0} {"train_loss": -26.067428588867188, "global_step": 339221, "epoch": 4087} {"train_loss": -25.685428619384766, "global_step": 339222, "epoch": 4087} {"train_loss": -25.878314971923828, "global_step": 339223, "epoch": 4087} {"train_loss": -25.983524322509766, "global_step": 339224, "epoch": 4087} {"train_loss": -26.086225509643555, "global_step": 339225, "epoch": 4087} {"train_loss": -25.15863609313965, "global_step": 339226, "epoch": 4087} {"train_loss": -25.552278518676758, "global_step": 339227, "epoch": 4087} {"train_loss": -25.56485939025879, "global_step": 339228, "epoch": 4087} {"train_loss": -25.835046768188477, "global_step": 339229, "epoch": 4087} {"train_loss": -25.990385055541992, "global_step": 339230, "epoch": 4087} {"train_loss": -25.361286163330078, "global_step": 339231, "epoch": 4087} {"train_loss": -25.876134872436523, "global_step": 339232, "epoch": 4087} {"train_loss": -26.0059757232666, "global_step": 339233, "epoch": 4087} {"train_loss": -25.99090576171875, "global_step": 339234, "epoch": 4087} {"train_loss": -25.450241088867188, "global_step": 339235, "epoch": 4087} {"train_loss": -25.897048950195312, "global_step": 339236, "epoch": 4087} {"train_loss": -25.348861694335938, "global_step": 339237, "epoch": 4087} {"train_loss": -26.003320693969727, "global_step": 339238, "epoch": 4087} {"train_loss": -25.73170280456543, "global_step": 339239, "epoch": 4087} {"train_loss": -26.33924674987793, "global_step": 339240, "epoch": 4087} {"train_loss": -25.995777130126953, "global_step": 339241, "epoch": 4087} {"train_loss": -25.958847045898438, "global_step": 339242, "epoch": 4087} {"train_loss": -26.072528839111328, "global_step": 339243, "epoch": 4087} {"train_loss": -26.168567657470703, "global_step": 339244, "epoch": 4087} {"train_loss": -26.08600425720215, "global_step": 339245, "epoch": 4087} {"train_loss": -26.26430320739746, "global_step": 339246, "epoch": 4087} {"train_loss": -25.932199478149414, "global_step": 339247, "epoch": 4087} {"train_loss": -26.009185791015625, "global_step": 339248, "epoch": 4087} {"train_loss": -26.159208297729492, "global_step": 339249, "epoch": 4087} {"train_loss": -26.279775619506836, "global_step": 339250, "epoch": 4087} {"train_loss": -26.218719482421875, "global_step": 339251, "epoch": 4087} {"train_loss": -26.432910919189453, "global_step": 339252, "epoch": 4087} {"train_loss": -26.277740478515625, "global_step": 339253, "epoch": 4087} {"train_loss": -25.956689834594727, "global_step": 339254, "epoch": 4087} {"train_loss": -26.165130615234375, "global_step": 339255, "epoch": 4087} {"train_loss": -26.277496337890625, "global_step": 339256, "epoch": 4087} {"train_loss": -25.99818229675293, "global_step": 339257, "epoch": 4087} {"train_loss": -26.55018424987793, "global_step": 339258, "epoch": 4087} {"train_loss": -26.331674575805664, "global_step": 339259, "epoch": 4087} {"train_loss": -26.401838302612305, "global_step": 339260, "epoch": 4087} {"train_loss": -26.179590225219727, "global_step": 339261, "epoch": 4087} {"train_loss": -26.4102840423584, "global_step": 339262, "epoch": 4087} {"train_loss": -26.21296501159668, "global_step": 339263, "epoch": 4087} {"train_loss": -26.334735870361328, "global_step": 339264, "epoch": 4087} {"train_loss": -26.200613021850586, "global_step": 339265, "epoch": 4087} {"train_loss": -26.15244483947754, "global_step": 339266, "epoch": 4087} {"train_loss": -26.306655883789062, "global_step": 339267, "epoch": 4087} {"train_loss": -26.209060668945312, "global_step": 339268, "epoch": 4087} {"train_loss": -26.199432373046875, "global_step": 339269, "epoch": 4087} {"train_loss": -26.267911911010742, "global_step": 339270, "epoch": 4087} {"train_loss": -26.243146896362305, "global_step": 339271, "epoch": 4087} {"train_loss": -26.166553497314453, "global_step": 339272, "epoch": 4087} {"train_loss": -26.3795108795166, "global_step": 339273, "epoch": 4087} {"train_loss": -26.358631134033203, "global_step": 339274, "epoch": 4087} {"train_loss": -25.95123291015625, "global_step": 339275, "epoch": 4087} {"train_loss": -26.27057456970215, "global_step": 339276, "epoch": 4087} {"train_loss": -26.459686279296875, "global_step": 339277, "epoch": 4087} {"train_loss": -25.89887046813965, "global_step": 339278, "epoch": 4087} {"train_loss": -25.982940673828125, "global_step": 339279, "epoch": 4087} {"train_loss": -26.042926788330078, "global_step": 339280, "epoch": 4087} {"train_loss": -26.3898868560791, "global_step": 339281, "epoch": 4087} {"train_loss": -26.203266143798828, "global_step": 339282, "epoch": 4087} {"train_loss": -26.169815063476562, "global_step": 339283, "epoch": 4087} {"train_loss": -26.11273193359375, "global_step": 339284, "epoch": 4087} {"train_loss": -26.146610260009766, "global_step": 339285, "epoch": 4087} {"train_loss": -26.56239128112793, "global_step": 339286, "epoch": 4087} {"train_loss": -26.218189239501953, "global_step": 339287, "epoch": 4087} {"train_loss": -25.85881996154785, "global_step": 339288, "epoch": 4087} {"train_loss": -25.496206283569336, "global_step": 339289, "epoch": 4087} {"train_loss": -25.51871109008789, "global_step": 339290, "epoch": 4087} {"train_loss": -25.276784896850586, "global_step": 339291, "epoch": 4087} {"train_loss": -25.76662254333496, "global_step": 339292, "epoch": 4087} {"train_loss": -25.93816566467285, "global_step": 339293, "epoch": 4087} {"train_loss": -25.7618408203125, "global_step": 339294, "epoch": 4087} {"train_loss": -25.70270347595215, "global_step": 339295, "epoch": 4087} {"train_loss": -26.141653060913086, "global_step": 339296, "epoch": 4087} {"train_loss": -26.11921501159668, "global_step": 339297, "epoch": 4087} {"train_loss": -25.85235023498535, "global_step": 339298, "epoch": 4087} {"train_loss": -25.460783004760742, "global_step": 339299, "epoch": 4087} {"train_loss": -25.942737579345703, "global_step": 339300, "epoch": 4087} {"train_loss": -25.949560165405273, "global_step": 339301, "epoch": 4087} {"train_loss": -25.751001358032227, "global_step": 339302, "epoch": 4087} {"train_loss": -26.019649068993257, "global_step": 339303, "epoch": 4087, "val_loss": 6774503.0} {"train_loss": -25.528369903564453, "global_step": 339304, "epoch": 4088} {"train_loss": -24.938949584960938, "global_step": 339305, "epoch": 4088} {"train_loss": -25.514522552490234, "global_step": 339306, "epoch": 4088} {"train_loss": -25.615833282470703, "global_step": 339307, "epoch": 4088} {"train_loss": -24.87212562561035, "global_step": 339308, "epoch": 4088} {"train_loss": -26.172712326049805, "global_step": 339309, "epoch": 4088} {"train_loss": -25.12013816833496, "global_step": 339310, "epoch": 4088} {"train_loss": -25.297016143798828, "global_step": 339311, "epoch": 4088} {"train_loss": -24.957548141479492, "global_step": 339312, "epoch": 4088} {"train_loss": -25.355022430419922, "global_step": 339313, "epoch": 4088} {"train_loss": -25.44697380065918, "global_step": 339314, "epoch": 4088} {"train_loss": -25.15650749206543, "global_step": 339315, "epoch": 4088} {"train_loss": -25.113039016723633, "global_step": 339316, "epoch": 4088} {"train_loss": -25.75330924987793, "global_step": 339317, "epoch": 4088} {"train_loss": -25.36968421936035, "global_step": 339318, "epoch": 4088} {"train_loss": -25.954303741455078, "global_step": 339319, "epoch": 4088} {"train_loss": -25.222021102905273, "global_step": 339320, "epoch": 4088} {"train_loss": -25.818649291992188, "global_step": 339321, "epoch": 4088} {"train_loss": -25.816715240478516, "global_step": 339322, "epoch": 4088} {"train_loss": -25.603199005126953, "global_step": 339323, "epoch": 4088} {"train_loss": -25.761037826538086, "global_step": 339324, "epoch": 4088} {"train_loss": -25.53156089782715, "global_step": 339325, "epoch": 4088} {"train_loss": -26.163745880126953, "global_step": 339326, "epoch": 4088} {"train_loss": -26.104887008666992, "global_step": 339327, "epoch": 4088} {"train_loss": -25.573068618774414, "global_step": 339328, "epoch": 4088} {"train_loss": -26.012723922729492, "global_step": 339329, "epoch": 4088} {"train_loss": -26.32874870300293, "global_step": 339330, "epoch": 4088} {"train_loss": -25.894933700561523, "global_step": 339331, "epoch": 4088} {"train_loss": -26.11849021911621, "global_step": 339332, "epoch": 4088} {"train_loss": -26.432294845581055, "global_step": 339333, "epoch": 4088} {"train_loss": -25.81402015686035, "global_step": 339334, "epoch": 4088} {"train_loss": -26.00850486755371, "global_step": 339335, "epoch": 4088} {"train_loss": -26.103729248046875, "global_step": 339336, "epoch": 4088} {"train_loss": -26.26944351196289, "global_step": 339337, "epoch": 4088} {"train_loss": -26.449838638305664, "global_step": 339338, "epoch": 4088} {"train_loss": -25.964019775390625, "global_step": 339339, "epoch": 4088} {"train_loss": -26.40895652770996, "global_step": 339340, "epoch": 4088} {"train_loss": -26.1716251373291, "global_step": 339341, "epoch": 4088} {"train_loss": -26.039560317993164, "global_step": 339342, "epoch": 4088} {"train_loss": -26.354806900024414, "global_step": 339343, "epoch": 4088} {"train_loss": -26.01264762878418, "global_step": 339344, "epoch": 4088} {"train_loss": -26.293670654296875, "global_step": 339345, "epoch": 4088} {"train_loss": -26.292999267578125, "global_step": 339346, "epoch": 4088} {"train_loss": -26.117618560791016, "global_step": 339347, "epoch": 4088} {"train_loss": -26.212390899658203, "global_step": 339348, "epoch": 4088} {"train_loss": -26.3359317779541, "global_step": 339349, "epoch": 4088} {"train_loss": -26.680347442626953, "global_step": 339350, "epoch": 4088} {"train_loss": -26.46540641784668, "global_step": 339351, "epoch": 4088} {"train_loss": -26.524585723876953, "global_step": 339352, "epoch": 4088} {"train_loss": -26.306140899658203, "global_step": 339353, "epoch": 4088} {"train_loss": -26.162199020385742, "global_step": 339354, "epoch": 4088} {"train_loss": -26.282705307006836, "global_step": 339355, "epoch": 4088} {"train_loss": -25.960309982299805, "global_step": 339356, "epoch": 4088} {"train_loss": -26.225610733032227, "global_step": 339357, "epoch": 4088} {"train_loss": -25.82362174987793, "global_step": 339358, "epoch": 4088} {"train_loss": -26.10515785217285, "global_step": 339359, "epoch": 4088} {"train_loss": -26.09514808654785, "global_step": 339360, "epoch": 4088} {"train_loss": -26.427892684936523, "global_step": 339361, "epoch": 4088} {"train_loss": -26.361242294311523, "global_step": 339362, "epoch": 4088} {"train_loss": -26.10821533203125, "global_step": 339363, "epoch": 4088} {"train_loss": -26.161962509155273, "global_step": 339364, "epoch": 4088} {"train_loss": -25.9594783782959, "global_step": 339365, "epoch": 4088} {"train_loss": -26.03583335876465, "global_step": 339366, "epoch": 4088} {"train_loss": -25.990217208862305, "global_step": 339367, "epoch": 4088} {"train_loss": -25.966028213500977, "global_step": 339368, "epoch": 4088} {"train_loss": -26.078256607055664, "global_step": 339369, "epoch": 4088} {"train_loss": -25.629180908203125, "global_step": 339370, "epoch": 4088} {"train_loss": -25.51854133605957, "global_step": 339371, "epoch": 4088} {"train_loss": -25.868295669555664, "global_step": 339372, "epoch": 4088} {"train_loss": -26.519575119018555, "global_step": 339373, "epoch": 4088} {"train_loss": -26.07918357849121, "global_step": 339374, "epoch": 4088} {"train_loss": -25.98065757751465, "global_step": 339375, "epoch": 4088} {"train_loss": -25.72174644470215, "global_step": 339376, "epoch": 4088} {"train_loss": -26.231170654296875, "global_step": 339377, "epoch": 4088} {"train_loss": -26.053464889526367, "global_step": 339378, "epoch": 4088} {"train_loss": -26.066802978515625, "global_step": 339379, "epoch": 4088} {"train_loss": -25.910980224609375, "global_step": 339380, "epoch": 4088} {"train_loss": -26.1627140045166, "global_step": 339381, "epoch": 4088} {"train_loss": -25.91767692565918, "global_step": 339382, "epoch": 4088} {"train_loss": -25.805194854736328, "global_step": 339383, "epoch": 4088} {"train_loss": -26.1595458984375, "global_step": 339384, "epoch": 4088} {"train_loss": -25.99947166442871, "global_step": 339385, "epoch": 4088} {"train_loss": -25.958005307668664, "global_step": 339386, "epoch": 4088, "val_loss": 6631405.0} {"train_loss": -25.219913482666016, "global_step": 339387, "epoch": 4089} {"train_loss": -25.01788902282715, "global_step": 339388, "epoch": 4089} {"train_loss": -25.959335327148438, "global_step": 339389, "epoch": 4089} {"train_loss": -25.7811222076416, "global_step": 339390, "epoch": 4089} {"train_loss": -25.618896484375, "global_step": 339391, "epoch": 4089} {"train_loss": -25.689380645751953, "global_step": 339392, "epoch": 4089} {"train_loss": -25.746585845947266, "global_step": 339393, "epoch": 4089} {"train_loss": -26.006271362304688, "global_step": 339394, "epoch": 4089} {"train_loss": -25.957555770874023, "global_step": 339395, "epoch": 4089} {"train_loss": -26.22543716430664, "global_step": 339396, "epoch": 4089} {"train_loss": -25.793582916259766, "global_step": 339397, "epoch": 4089} {"train_loss": -25.990345001220703, "global_step": 339398, "epoch": 4089} {"train_loss": -25.946094512939453, "global_step": 339399, "epoch": 4089} {"train_loss": -26.04839515686035, "global_step": 339400, "epoch": 4089} {"train_loss": -25.697254180908203, "global_step": 339401, "epoch": 4089} {"train_loss": -25.789167404174805, "global_step": 339402, "epoch": 4089} {"train_loss": -25.71321678161621, "global_step": 339403, "epoch": 4089} {"train_loss": -25.677404403686523, "global_step": 339404, "epoch": 4089} {"train_loss": -25.92576026916504, "global_step": 339405, "epoch": 4089} {"train_loss": -26.043140411376953, "global_step": 339406, "epoch": 4089} {"train_loss": -25.940505981445312, "global_step": 339407, "epoch": 4089} {"train_loss": -25.829172134399414, "global_step": 339408, "epoch": 4089} {"train_loss": -25.930450439453125, "global_step": 339409, "epoch": 4089} {"train_loss": -26.2565860748291, "global_step": 339410, "epoch": 4089} {"train_loss": -25.759754180908203, "global_step": 339411, "epoch": 4089} {"train_loss": -25.663434982299805, "global_step": 339412, "epoch": 4089} {"train_loss": -25.6536922454834, "global_step": 339413, "epoch": 4089} {"train_loss": -25.95448112487793, "global_step": 339414, "epoch": 4089} {"train_loss": -26.109420776367188, "global_step": 339415, "epoch": 4089} {"train_loss": -25.911624908447266, "global_step": 339416, "epoch": 4089} {"train_loss": -25.725610733032227, "global_step": 339417, "epoch": 4089} {"train_loss": -26.35332679748535, "global_step": 339418, "epoch": 4089} {"train_loss": -26.171894073486328, "global_step": 339419, "epoch": 4089} {"train_loss": -26.381982803344727, "global_step": 339420, "epoch": 4089} {"train_loss": -26.011545181274414, "global_step": 339421, "epoch": 4089} {"train_loss": -26.102293014526367, "global_step": 339422, "epoch": 4089} {"train_loss": -26.21209716796875, "global_step": 339423, "epoch": 4089} {"train_loss": -26.59515380859375, "global_step": 339424, "epoch": 4089} {"train_loss": -26.315465927124023, "global_step": 339425, "epoch": 4089} {"train_loss": -26.037830352783203, "global_step": 339426, "epoch": 4089} {"train_loss": -26.155481338500977, "global_step": 339427, "epoch": 4089} {"train_loss": -26.351104736328125, "global_step": 339428, "epoch": 4089} {"train_loss": -25.974958419799805, "global_step": 339429, "epoch": 4089} {"train_loss": -26.1051025390625, "global_step": 339430, "epoch": 4089} {"train_loss": -26.27345085144043, "global_step": 339431, "epoch": 4089} {"train_loss": -26.216882705688477, "global_step": 339432, "epoch": 4089} {"train_loss": -26.1682071685791, "global_step": 339433, "epoch": 4089} {"train_loss": -25.78375244140625, "global_step": 339434, "epoch": 4089} {"train_loss": -26.118183135986328, "global_step": 339435, "epoch": 4089} {"train_loss": -26.11333656311035, "global_step": 339436, "epoch": 4089} {"train_loss": -26.63641357421875, "global_step": 339437, "epoch": 4089} {"train_loss": -26.518056869506836, "global_step": 339438, "epoch": 4089} {"train_loss": -26.0512638092041, "global_step": 339439, "epoch": 4089} {"train_loss": -25.907148361206055, "global_step": 339440, "epoch": 4089} {"train_loss": -25.809661865234375, "global_step": 339441, "epoch": 4089} {"train_loss": -26.091251373291016, "global_step": 339442, "epoch": 4089} {"train_loss": -26.141992568969727, "global_step": 339443, "epoch": 4089} {"train_loss": -25.941633224487305, "global_step": 339444, "epoch": 4089} {"train_loss": -26.0780029296875, "global_step": 339445, "epoch": 4089} {"train_loss": -26.125900268554688, "global_step": 339446, "epoch": 4089} {"train_loss": -26.12906265258789, "global_step": 339447, "epoch": 4089} {"train_loss": -25.58576774597168, "global_step": 339448, "epoch": 4089} {"train_loss": -25.941211700439453, "global_step": 339449, "epoch": 4089} {"train_loss": -25.849843978881836, "global_step": 339450, "epoch": 4089} {"train_loss": -26.03420066833496, "global_step": 339451, "epoch": 4089} {"train_loss": -25.597715377807617, "global_step": 339452, "epoch": 4089} {"train_loss": -26.00522232055664, "global_step": 339453, "epoch": 4089} {"train_loss": -25.705249786376953, "global_step": 339454, "epoch": 4089} {"train_loss": -26.14568519592285, "global_step": 339455, "epoch": 4089} {"train_loss": -25.808074951171875, "global_step": 339456, "epoch": 4089} {"train_loss": -25.688232421875, "global_step": 339457, "epoch": 4089} {"train_loss": -25.835468292236328, "global_step": 339458, "epoch": 4089} {"train_loss": -25.72698974609375, "global_step": 339459, "epoch": 4089} {"train_loss": -25.965417861938477, "global_step": 339460, "epoch": 4089} {"train_loss": -25.780750274658203, "global_step": 339461, "epoch": 4089} {"train_loss": -26.517480850219727, "global_step": 339462, "epoch": 4089} {"train_loss": -25.858245849609375, "global_step": 339463, "epoch": 4089} {"train_loss": -25.990991592407227, "global_step": 339464, "epoch": 4089} {"train_loss": -26.132150650024414, "global_step": 339465, "epoch": 4089} {"train_loss": -26.269184112548828, "global_step": 339466, "epoch": 4089} {"train_loss": -26.44167137145996, "global_step": 339467, "epoch": 4089} {"train_loss": -25.887170791625977, "global_step": 339468, "epoch": 4089} {"train_loss": -25.981656982238036, "global_step": 339469, "epoch": 4089, "val_loss": 6647672.0} {"train_loss": -25.18970489501953, "global_step": 339470, "epoch": 4090} {"train_loss": -24.339218139648438, "global_step": 339471, "epoch": 4090} {"train_loss": -24.435720443725586, "global_step": 339472, "epoch": 4090} {"train_loss": -25.05004119873047, "global_step": 339473, "epoch": 4090} {"train_loss": -25.28484344482422, "global_step": 339474, "epoch": 4090} {"train_loss": -25.164234161376953, "global_step": 339475, "epoch": 4090} {"train_loss": -24.977188110351562, "global_step": 339476, "epoch": 4090} {"train_loss": -25.128454208374023, "global_step": 339477, "epoch": 4090} {"train_loss": -25.374876022338867, "global_step": 339478, "epoch": 4090} {"train_loss": -25.157880783081055, "global_step": 339479, "epoch": 4090} {"train_loss": -25.591196060180664, "global_step": 339480, "epoch": 4090} {"train_loss": -25.369796752929688, "global_step": 339481, "epoch": 4090} {"train_loss": -25.42598533630371, "global_step": 339482, "epoch": 4090} {"train_loss": -25.25812339782715, "global_step": 339483, "epoch": 4090} {"train_loss": -25.441326141357422, "global_step": 339484, "epoch": 4090} {"train_loss": -25.386423110961914, "global_step": 339485, "epoch": 4090} {"train_loss": -25.069698333740234, "global_step": 339486, "epoch": 4090} {"train_loss": -25.59893798828125, "global_step": 339487, "epoch": 4090} {"train_loss": -25.7918701171875, "global_step": 339488, "epoch": 4090} {"train_loss": -25.727222442626953, "global_step": 339489, "epoch": 4090} {"train_loss": -25.568025588989258, "global_step": 339490, "epoch": 4090} {"train_loss": -26.037927627563477, "global_step": 339491, "epoch": 4090} {"train_loss": -25.781497955322266, "global_step": 339492, "epoch": 4090} {"train_loss": -25.905298233032227, "global_step": 339493, "epoch": 4090} {"train_loss": -25.90703773498535, "global_step": 339494, "epoch": 4090} {"train_loss": -25.886306762695312, "global_step": 339495, "epoch": 4090} {"train_loss": -26.075780868530273, "global_step": 339496, "epoch": 4090} {"train_loss": -25.866445541381836, "global_step": 339497, "epoch": 4090} {"train_loss": -25.786697387695312, "global_step": 339498, "epoch": 4090} {"train_loss": -25.788715362548828, "global_step": 339499, "epoch": 4090} {"train_loss": -26.05478286743164, "global_step": 339500, "epoch": 4090} {"train_loss": -25.777185440063477, "global_step": 339501, "epoch": 4090} {"train_loss": -26.024377822875977, "global_step": 339502, "epoch": 4090} {"train_loss": -26.3089599609375, "global_step": 339503, "epoch": 4090} {"train_loss": -26.091516494750977, "global_step": 339504, "epoch": 4090} {"train_loss": -26.3536376953125, "global_step": 339505, "epoch": 4090} {"train_loss": -26.037809371948242, "global_step": 339506, "epoch": 4090} {"train_loss": -26.028945922851562, "global_step": 339507, "epoch": 4090} {"train_loss": -26.192373275756836, "global_step": 339508, "epoch": 4090} {"train_loss": -26.298315048217773, "global_step": 339509, "epoch": 4090} {"train_loss": -26.37550163269043, "global_step": 339510, "epoch": 4090} {"train_loss": -26.459156036376953, "global_step": 339511, "epoch": 4090} {"train_loss": -26.16717529296875, "global_step": 339512, "epoch": 4090} {"train_loss": -26.1842041015625, "global_step": 339513, "epoch": 4090} {"train_loss": -26.192686080932617, "global_step": 339514, "epoch": 4090} {"train_loss": -26.38372802734375, "global_step": 339515, "epoch": 4090} {"train_loss": -26.328535079956055, "global_step": 339516, "epoch": 4090} {"train_loss": -26.26654624938965, "global_step": 339517, "epoch": 4090} {"train_loss": -25.950687408447266, "global_step": 339518, "epoch": 4090} {"train_loss": -26.094379425048828, "global_step": 339519, "epoch": 4090} {"train_loss": -25.741323471069336, "global_step": 339520, "epoch": 4090} {"train_loss": -26.268798828125, "global_step": 339521, "epoch": 4090} {"train_loss": -26.201919555664062, "global_step": 339522, "epoch": 4090} {"train_loss": -26.242849349975586, "global_step": 339523, "epoch": 4090} {"train_loss": -25.895200729370117, "global_step": 339524, "epoch": 4090} {"train_loss": -25.885986328125, "global_step": 339525, "epoch": 4090} {"train_loss": -26.196645736694336, "global_step": 339526, "epoch": 4090} {"train_loss": -26.277013778686523, "global_step": 339527, "epoch": 4090} {"train_loss": -26.21109390258789, "global_step": 339528, "epoch": 4090} {"train_loss": -25.820043563842773, "global_step": 339529, "epoch": 4090} {"train_loss": -26.07539176940918, "global_step": 339530, "epoch": 4090} {"train_loss": -26.34168815612793, "global_step": 339531, "epoch": 4090} {"train_loss": -25.682580947875977, "global_step": 339532, "epoch": 4090} {"train_loss": -25.505273818969727, "global_step": 339533, "epoch": 4090} {"train_loss": -25.99616813659668, "global_step": 339534, "epoch": 4090} {"train_loss": -26.23306655883789, "global_step": 339535, "epoch": 4090} {"train_loss": -26.445087432861328, "global_step": 339536, "epoch": 4090} {"train_loss": -25.76261329650879, "global_step": 339537, "epoch": 4090} {"train_loss": -25.882734298706055, "global_step": 339538, "epoch": 4090} {"train_loss": -25.592859268188477, "global_step": 339539, "epoch": 4090} {"train_loss": -26.088048934936523, "global_step": 339540, "epoch": 4090} {"train_loss": -26.00783348083496, "global_step": 339541, "epoch": 4090} {"train_loss": -25.826879501342773, "global_step": 339542, "epoch": 4090} {"train_loss": -26.013208389282227, "global_step": 339543, "epoch": 4090} {"train_loss": -25.38248062133789, "global_step": 339544, "epoch": 4090} {"train_loss": -25.905166625976562, "global_step": 339545, "epoch": 4090} {"train_loss": -25.778247833251953, "global_step": 339546, "epoch": 4090} {"train_loss": -25.88892936706543, "global_step": 339547, "epoch": 4090} {"train_loss": -25.78645896911621, "global_step": 339548, "epoch": 4090} {"train_loss": -25.826343536376953, "global_step": 339549, "epoch": 4090} {"train_loss": -25.951095581054688, "global_step": 339550, "epoch": 4090} {"train_loss": -25.64633560180664, "global_step": 339551, "epoch": 4090} {"train_loss": -25.814581767622247, "global_step": 339552, "epoch": 4090, "val_loss": 6725909.0} {"train_loss": -25.56562614440918, "global_step": 339553, "epoch": 4091} {"train_loss": -24.95619010925293, "global_step": 339554, "epoch": 4091} {"train_loss": -25.66212272644043, "global_step": 339555, "epoch": 4091} {"train_loss": -25.71744155883789, "global_step": 339556, "epoch": 4091} {"train_loss": -25.889780044555664, "global_step": 339557, "epoch": 4091} {"train_loss": -25.69186782836914, "global_step": 339558, "epoch": 4091} {"train_loss": -25.405385971069336, "global_step": 339559, "epoch": 4091} {"train_loss": -25.573057174682617, "global_step": 339560, "epoch": 4091} {"train_loss": -25.724695205688477, "global_step": 339561, "epoch": 4091} {"train_loss": -25.355884552001953, "global_step": 339562, "epoch": 4091} {"train_loss": -25.9183349609375, "global_step": 339563, "epoch": 4091} {"train_loss": -25.83609962463379, "global_step": 339564, "epoch": 4091} {"train_loss": -25.53215980529785, "global_step": 339565, "epoch": 4091} {"train_loss": -26.09405517578125, "global_step": 339566, "epoch": 4091} {"train_loss": -25.57878875732422, "global_step": 339567, "epoch": 4091} {"train_loss": -25.588871002197266, "global_step": 339568, "epoch": 4091} {"train_loss": -25.978254318237305, "global_step": 339569, "epoch": 4091} {"train_loss": -25.525827407836914, "global_step": 339570, "epoch": 4091} {"train_loss": -26.144372940063477, "global_step": 339571, "epoch": 4091} {"train_loss": -25.465591430664062, "global_step": 339572, "epoch": 4091} {"train_loss": -26.105859756469727, "global_step": 339573, "epoch": 4091} {"train_loss": -25.7855281829834, "global_step": 339574, "epoch": 4091} {"train_loss": -25.705907821655273, "global_step": 339575, "epoch": 4091} {"train_loss": -26.097116470336914, "global_step": 339576, "epoch": 4091} {"train_loss": -25.856958389282227, "global_step": 339577, "epoch": 4091} {"train_loss": -25.98358726501465, "global_step": 339578, "epoch": 4091} {"train_loss": -26.046884536743164, "global_step": 339579, "epoch": 4091} {"train_loss": -25.861255645751953, "global_step": 339580, "epoch": 4091} {"train_loss": -26.154916763305664, "global_step": 339581, "epoch": 4091} {"train_loss": -26.344778060913086, "global_step": 339582, "epoch": 4091} {"train_loss": -26.121305465698242, "global_step": 339583, "epoch": 4091} {"train_loss": -25.665342330932617, "global_step": 339584, "epoch": 4091} {"train_loss": -26.014877319335938, "global_step": 339585, "epoch": 4091} {"train_loss": -25.9008731842041, "global_step": 339586, "epoch": 4091} {"train_loss": -26.192014694213867, "global_step": 339587, "epoch": 4091} {"train_loss": -26.43720817565918, "global_step": 339588, "epoch": 4091} {"train_loss": -26.048978805541992, "global_step": 339589, "epoch": 4091} {"train_loss": -26.40870475769043, "global_step": 339590, "epoch": 4091} {"train_loss": -26.35194206237793, "global_step": 339591, "epoch": 4091} {"train_loss": -25.896345138549805, "global_step": 339592, "epoch": 4091} {"train_loss": -25.7806453704834, "global_step": 339593, "epoch": 4091} {"train_loss": -25.743078231811523, "global_step": 339594, "epoch": 4091} {"train_loss": -26.20916175842285, "global_step": 339595, "epoch": 4091} {"train_loss": -26.481271743774414, "global_step": 339596, "epoch": 4091} {"train_loss": -26.023359298706055, "global_step": 339597, "epoch": 4091} {"train_loss": -26.258764266967773, "global_step": 339598, "epoch": 4091} {"train_loss": -25.509185791015625, "global_step": 339599, "epoch": 4091} {"train_loss": -26.126386642456055, "global_step": 339600, "epoch": 4091} {"train_loss": -25.91998863220215, "global_step": 339601, "epoch": 4091} {"train_loss": -26.334272384643555, "global_step": 339602, "epoch": 4091} {"train_loss": -25.8701114654541, "global_step": 339603, "epoch": 4091} {"train_loss": -26.191003799438477, "global_step": 339604, "epoch": 4091} {"train_loss": -25.860864639282227, "global_step": 339605, "epoch": 4091} {"train_loss": -25.8957576751709, "global_step": 339606, "epoch": 4091} {"train_loss": -25.9912166595459, "global_step": 339607, "epoch": 4091} {"train_loss": -26.293848037719727, "global_step": 339608, "epoch": 4091} {"train_loss": -26.00492286682129, "global_step": 339609, "epoch": 4091} {"train_loss": -26.063846588134766, "global_step": 339610, "epoch": 4091} {"train_loss": -26.1716251373291, "global_step": 339611, "epoch": 4091} {"train_loss": -25.803075790405273, "global_step": 339612, "epoch": 4091} {"train_loss": -26.292062759399414, "global_step": 339613, "epoch": 4091} {"train_loss": -25.942602157592773, "global_step": 339614, "epoch": 4091} {"train_loss": -26.31342887878418, "global_step": 339615, "epoch": 4091} {"train_loss": -25.758344650268555, "global_step": 339616, "epoch": 4091} {"train_loss": -26.285551071166992, "global_step": 339617, "epoch": 4091} {"train_loss": -26.313623428344727, "global_step": 339618, "epoch": 4091} {"train_loss": -26.070337295532227, "global_step": 339619, "epoch": 4091} {"train_loss": -26.190893173217773, "global_step": 339620, "epoch": 4091} {"train_loss": -26.130224227905273, "global_step": 339621, "epoch": 4091} {"train_loss": -26.16011619567871, "global_step": 339622, "epoch": 4091} {"train_loss": -25.658905029296875, "global_step": 339623, "epoch": 4091} {"train_loss": -26.200225830078125, "global_step": 339624, "epoch": 4091} {"train_loss": -25.821353912353516, "global_step": 339625, "epoch": 4091} {"train_loss": -25.884296417236328, "global_step": 339626, "epoch": 4091} {"train_loss": -26.06599235534668, "global_step": 339627, "epoch": 4091} {"train_loss": -26.49576187133789, "global_step": 339628, "epoch": 4091} {"train_loss": -25.86102867126465, "global_step": 339629, "epoch": 4091} {"train_loss": -26.11163902282715, "global_step": 339630, "epoch": 4091} {"train_loss": -25.70200538635254, "global_step": 339631, "epoch": 4091} {"train_loss": -26.094091415405273, "global_step": 339632, "epoch": 4091} {"train_loss": -25.82864761352539, "global_step": 339633, "epoch": 4091} {"train_loss": -26.198230743408203, "global_step": 339634, "epoch": 4091} {"train_loss": -25.952986223151886, "global_step": 339635, "epoch": 4091, "val_loss": 6630690.5} {"train_loss": -25.860095977783203, "global_step": 339636, "epoch": 4092} {"train_loss": -25.346115112304688, "global_step": 339637, "epoch": 4092} {"train_loss": -25.904993057250977, "global_step": 339638, "epoch": 4092} {"train_loss": -26.026554107666016, "global_step": 339639, "epoch": 4092} {"train_loss": -25.677597045898438, "global_step": 339640, "epoch": 4092} {"train_loss": -26.03655433654785, "global_step": 339641, "epoch": 4092} {"train_loss": -25.62359046936035, "global_step": 339642, "epoch": 4092} {"train_loss": -26.021503448486328, "global_step": 339643, "epoch": 4092} {"train_loss": -26.360244750976562, "global_step": 339644, "epoch": 4092} {"train_loss": -25.84287452697754, "global_step": 339645, "epoch": 4092} {"train_loss": -25.528242111206055, "global_step": 339646, "epoch": 4092} {"train_loss": -25.884078979492188, "global_step": 339647, "epoch": 4092} {"train_loss": -25.467939376831055, "global_step": 339648, "epoch": 4092} {"train_loss": -26.040830612182617, "global_step": 339649, "epoch": 4092} {"train_loss": -25.93891716003418, "global_step": 339650, "epoch": 4092} {"train_loss": -25.744903564453125, "global_step": 339651, "epoch": 4092} {"train_loss": -26.103017807006836, "global_step": 339652, "epoch": 4092} {"train_loss": -26.082799911499023, "global_step": 339653, "epoch": 4092} {"train_loss": -25.80257225036621, "global_step": 339654, "epoch": 4092} {"train_loss": -26.230712890625, "global_step": 339655, "epoch": 4092} {"train_loss": -26.527379989624023, "global_step": 339656, "epoch": 4092} {"train_loss": -26.17249870300293, "global_step": 339657, "epoch": 4092} {"train_loss": -26.070484161376953, "global_step": 339658, "epoch": 4092} {"train_loss": -26.191055297851562, "global_step": 339659, "epoch": 4092} {"train_loss": -26.053009033203125, "global_step": 339660, "epoch": 4092} {"train_loss": -26.183752059936523, "global_step": 339661, "epoch": 4092} {"train_loss": -26.065509796142578, "global_step": 339662, "epoch": 4092} {"train_loss": -25.883100509643555, "global_step": 339663, "epoch": 4092} {"train_loss": -25.8131046295166, "global_step": 339664, "epoch": 4092} {"train_loss": -25.57608413696289, "global_step": 339665, "epoch": 4092} {"train_loss": -26.198413848876953, "global_step": 339666, "epoch": 4092} {"train_loss": -26.393695831298828, "global_step": 339667, "epoch": 4092} {"train_loss": -25.401052474975586, "global_step": 339668, "epoch": 4092} {"train_loss": -26.304035186767578, "global_step": 339669, "epoch": 4092} {"train_loss": -25.99827003479004, "global_step": 339670, "epoch": 4092} {"train_loss": -26.263280868530273, "global_step": 339671, "epoch": 4092} {"train_loss": -25.724767684936523, "global_step": 339672, "epoch": 4092} {"train_loss": -26.010141372680664, "global_step": 339673, "epoch": 4092} {"train_loss": -25.972524642944336, "global_step": 339674, "epoch": 4092} {"train_loss": -26.172714233398438, "global_step": 339675, "epoch": 4092} {"train_loss": -26.004962921142578, "global_step": 339676, "epoch": 4092} {"train_loss": -26.04083251953125, "global_step": 339677, "epoch": 4092} {"train_loss": -26.3730525970459, "global_step": 339678, "epoch": 4092} {"train_loss": -25.632617950439453, "global_step": 339679, "epoch": 4092} {"train_loss": -25.951635360717773, "global_step": 339680, "epoch": 4092} {"train_loss": -26.226720809936523, "global_step": 339681, "epoch": 4092} {"train_loss": -26.48297119140625, "global_step": 339682, "epoch": 4092} {"train_loss": -26.1568546295166, "global_step": 339683, "epoch": 4092} {"train_loss": -26.1420841217041, "global_step": 339684, "epoch": 4092} {"train_loss": -25.87937355041504, "global_step": 339685, "epoch": 4092} {"train_loss": -26.1595458984375, "global_step": 339686, "epoch": 4092} {"train_loss": -25.881147384643555, "global_step": 339687, "epoch": 4092} {"train_loss": -26.05048179626465, "global_step": 339688, "epoch": 4092} {"train_loss": -26.2568359375, "global_step": 339689, "epoch": 4092} {"train_loss": -26.139699935913086, "global_step": 339690, "epoch": 4092} {"train_loss": -26.234251022338867, "global_step": 339691, "epoch": 4092} {"train_loss": -26.55328941345215, "global_step": 339692, "epoch": 4092} {"train_loss": -26.00543212890625, "global_step": 339693, "epoch": 4092} {"train_loss": -26.286420822143555, "global_step": 339694, "epoch": 4092} {"train_loss": -26.268781661987305, "global_step": 339695, "epoch": 4092} {"train_loss": -26.436817169189453, "global_step": 339696, "epoch": 4092} {"train_loss": -26.345678329467773, "global_step": 339697, "epoch": 4092} {"train_loss": -26.192981719970703, "global_step": 339698, "epoch": 4092} {"train_loss": -26.372222900390625, "global_step": 339699, "epoch": 4092} {"train_loss": -25.89893913269043, "global_step": 339700, "epoch": 4092} {"train_loss": -25.832794189453125, "global_step": 339701, "epoch": 4092} {"train_loss": -25.89349365234375, "global_step": 339702, "epoch": 4092} {"train_loss": -25.899307250976562, "global_step": 339703, "epoch": 4092} {"train_loss": -26.107654571533203, "global_step": 339704, "epoch": 4092} {"train_loss": -26.239721298217773, "global_step": 339705, "epoch": 4092} {"train_loss": -26.2916316986084, "global_step": 339706, "epoch": 4092} {"train_loss": -26.2814998626709, "global_step": 339707, "epoch": 4092} {"train_loss": -25.955427169799805, "global_step": 339708, "epoch": 4092} {"train_loss": -26.073028564453125, "global_step": 339709, "epoch": 4092} {"train_loss": -26.266345977783203, "global_step": 339710, "epoch": 4092} {"train_loss": -26.000341415405273, "global_step": 339711, "epoch": 4092} {"train_loss": -26.298227310180664, "global_step": 339712, "epoch": 4092} {"train_loss": -26.566980361938477, "global_step": 339713, "epoch": 4092} {"train_loss": -26.495519638061523, "global_step": 339714, "epoch": 4092} {"train_loss": -26.458114624023438, "global_step": 339715, "epoch": 4092} {"train_loss": -26.16554832458496, "global_step": 339716, "epoch": 4092} {"train_loss": -26.10419273376465, "global_step": 339717, "epoch": 4092} {"train_loss": -26.071065466087983, "global_step": 339718, "epoch": 4092, "val_loss": 6625621.0} {"train_loss": -25.80457878112793, "global_step": 339719, "epoch": 4093} {"train_loss": -26.16513442993164, "global_step": 339720, "epoch": 4093} {"train_loss": -25.554147720336914, "global_step": 339721, "epoch": 4093} {"train_loss": -25.791662216186523, "global_step": 339722, "epoch": 4093} {"train_loss": -25.4067440032959, "global_step": 339723, "epoch": 4093} {"train_loss": -25.02769660949707, "global_step": 339724, "epoch": 4093} {"train_loss": -24.872873306274414, "global_step": 339725, "epoch": 4093} {"train_loss": -26.02223014831543, "global_step": 339726, "epoch": 4093} {"train_loss": -25.71649742126465, "global_step": 339727, "epoch": 4093} {"train_loss": -25.18470573425293, "global_step": 339728, "epoch": 4093} {"train_loss": -25.60371971130371, "global_step": 339729, "epoch": 4093} {"train_loss": -25.704267501831055, "global_step": 339730, "epoch": 4093} {"train_loss": -25.6716251373291, "global_step": 339731, "epoch": 4093} {"train_loss": -26.078399658203125, "global_step": 339732, "epoch": 4093} {"train_loss": -25.499141693115234, "global_step": 339733, "epoch": 4093} {"train_loss": -25.8439884185791, "global_step": 339734, "epoch": 4093} {"train_loss": -25.487884521484375, "global_step": 339735, "epoch": 4093} {"train_loss": -26.24212646484375, "global_step": 339736, "epoch": 4093} {"train_loss": -25.695669174194336, "global_step": 339737, "epoch": 4093} {"train_loss": -25.756244659423828, "global_step": 339738, "epoch": 4093} {"train_loss": -25.919025421142578, "global_step": 339739, "epoch": 4093} {"train_loss": -26.006879806518555, "global_step": 339740, "epoch": 4093} {"train_loss": -25.82695960998535, "global_step": 339741, "epoch": 4093} {"train_loss": -26.02664566040039, "global_step": 339742, "epoch": 4093} {"train_loss": -26.002639770507812, "global_step": 339743, "epoch": 4093} {"train_loss": -25.93182373046875, "global_step": 339744, "epoch": 4093} {"train_loss": -25.959680557250977, "global_step": 339745, "epoch": 4093} {"train_loss": -25.904882431030273, "global_step": 339746, "epoch": 4093} {"train_loss": -25.9190731048584, "global_step": 339747, "epoch": 4093} {"train_loss": -25.768590927124023, "global_step": 339748, "epoch": 4093} {"train_loss": -26.483957290649414, "global_step": 339749, "epoch": 4093} {"train_loss": -25.63274574279785, "global_step": 339750, "epoch": 4093} {"train_loss": -26.311735153198242, "global_step": 339751, "epoch": 4093} {"train_loss": -26.197986602783203, "global_step": 339752, "epoch": 4093} {"train_loss": -26.142810821533203, "global_step": 339753, "epoch": 4093} {"train_loss": -26.2769718170166, "global_step": 339754, "epoch": 4093} {"train_loss": -26.0999698638916, "global_step": 339755, "epoch": 4093} {"train_loss": -25.944061279296875, "global_step": 339756, "epoch": 4093} {"train_loss": -26.141616821289062, "global_step": 339757, "epoch": 4093} {"train_loss": -26.281879425048828, "global_step": 339758, "epoch": 4093} {"train_loss": -26.12513542175293, "global_step": 339759, "epoch": 4093} {"train_loss": -26.06790542602539, "global_step": 339760, "epoch": 4093} {"train_loss": -25.75394058227539, "global_step": 339761, "epoch": 4093} {"train_loss": -25.801727294921875, "global_step": 339762, "epoch": 4093} {"train_loss": -25.892988204956055, "global_step": 339763, "epoch": 4093} {"train_loss": -25.676288604736328, "global_step": 339764, "epoch": 4093} {"train_loss": -26.026865005493164, "global_step": 339765, "epoch": 4093} {"train_loss": -26.494054794311523, "global_step": 339766, "epoch": 4093} {"train_loss": -25.8352108001709, "global_step": 339767, "epoch": 4093} {"train_loss": -26.165090560913086, "global_step": 339768, "epoch": 4093} {"train_loss": -25.873926162719727, "global_step": 339769, "epoch": 4093} {"train_loss": -26.246540069580078, "global_step": 339770, "epoch": 4093} {"train_loss": -26.01786231994629, "global_step": 339771, "epoch": 4093} {"train_loss": -26.25168800354004, "global_step": 339772, "epoch": 4093} {"train_loss": -26.361616134643555, "global_step": 339773, "epoch": 4093} {"train_loss": -26.02446937561035, "global_step": 339774, "epoch": 4093} {"train_loss": -26.433095932006836, "global_step": 339775, "epoch": 4093} {"train_loss": -25.895536422729492, "global_step": 339776, "epoch": 4093} {"train_loss": -26.11687660217285, "global_step": 339777, "epoch": 4093} {"train_loss": -26.03045654296875, "global_step": 339778, "epoch": 4093} {"train_loss": -26.43372917175293, "global_step": 339779, "epoch": 4093} {"train_loss": -26.132312774658203, "global_step": 339780, "epoch": 4093} {"train_loss": -26.33846092224121, "global_step": 339781, "epoch": 4093} {"train_loss": -25.878238677978516, "global_step": 339782, "epoch": 4093} {"train_loss": -26.202733993530273, "global_step": 339783, "epoch": 4093} {"train_loss": -26.20383071899414, "global_step": 339784, "epoch": 4093} {"train_loss": -25.898508071899414, "global_step": 339785, "epoch": 4093} {"train_loss": -26.430007934570312, "global_step": 339786, "epoch": 4093} {"train_loss": -26.202497482299805, "global_step": 339787, "epoch": 4093} {"train_loss": -26.125761032104492, "global_step": 339788, "epoch": 4093} {"train_loss": -25.834070205688477, "global_step": 339789, "epoch": 4093} {"train_loss": -26.04899024963379, "global_step": 339790, "epoch": 4093} {"train_loss": -26.09077262878418, "global_step": 339791, "epoch": 4093} {"train_loss": -26.238983154296875, "global_step": 339792, "epoch": 4093} {"train_loss": -26.036731719970703, "global_step": 339793, "epoch": 4093} {"train_loss": -26.0706729888916, "global_step": 339794, "epoch": 4093} {"train_loss": -25.975738525390625, "global_step": 339795, "epoch": 4093} {"train_loss": -25.881269454956055, "global_step": 339796, "epoch": 4093} {"train_loss": -25.781848907470703, "global_step": 339797, "epoch": 4093} {"train_loss": -26.037378311157227, "global_step": 339798, "epoch": 4093} {"train_loss": -26.13331413269043, "global_step": 339799, "epoch": 4093} {"train_loss": -25.68094825744629, "global_step": 339800, "epoch": 4093} {"train_loss": -25.961463123919017, "global_step": 339801, "epoch": 4093, "val_loss": 6599015.0} {"train_loss": -25.592052459716797, "global_step": 339802, "epoch": 4094} {"train_loss": -25.482452392578125, "global_step": 339803, "epoch": 4094} {"train_loss": -25.683340072631836, "global_step": 339804, "epoch": 4094} {"train_loss": -25.22187614440918, "global_step": 339805, "epoch": 4094} {"train_loss": -25.648855209350586, "global_step": 339806, "epoch": 4094} {"train_loss": -25.294660568237305, "global_step": 339807, "epoch": 4094} {"train_loss": -25.700841903686523, "global_step": 339808, "epoch": 4094} {"train_loss": -25.31389617919922, "global_step": 339809, "epoch": 4094} {"train_loss": -25.7608699798584, "global_step": 339810, "epoch": 4094} {"train_loss": -25.582826614379883, "global_step": 339811, "epoch": 4094} {"train_loss": -25.874608993530273, "global_step": 339812, "epoch": 4094} {"train_loss": -25.924604415893555, "global_step": 339813, "epoch": 4094} {"train_loss": -25.626806259155273, "global_step": 339814, "epoch": 4094} {"train_loss": -25.704303741455078, "global_step": 339815, "epoch": 4094} {"train_loss": -25.592823028564453, "global_step": 339816, "epoch": 4094} {"train_loss": -25.791305541992188, "global_step": 339817, "epoch": 4094} {"train_loss": -26.0797119140625, "global_step": 339818, "epoch": 4094} {"train_loss": -25.5699520111084, "global_step": 339819, "epoch": 4094} {"train_loss": -25.9965877532959, "global_step": 339820, "epoch": 4094} {"train_loss": -26.29033851623535, "global_step": 339821, "epoch": 4094} {"train_loss": -26.106719970703125, "global_step": 339822, "epoch": 4094} {"train_loss": -25.949987411499023, "global_step": 339823, "epoch": 4094} {"train_loss": -26.233015060424805, "global_step": 339824, "epoch": 4094} {"train_loss": -25.912702560424805, "global_step": 339825, "epoch": 4094} {"train_loss": -25.93288230895996, "global_step": 339826, "epoch": 4094} {"train_loss": -25.763412475585938, "global_step": 339827, "epoch": 4094} {"train_loss": -25.695470809936523, "global_step": 339828, "epoch": 4094} {"train_loss": -25.455224990844727, "global_step": 339829, "epoch": 4094} {"train_loss": -25.859222412109375, "global_step": 339830, "epoch": 4094} {"train_loss": -26.032806396484375, "global_step": 339831, "epoch": 4094} {"train_loss": -26.072193145751953, "global_step": 339832, "epoch": 4094} {"train_loss": -25.653675079345703, "global_step": 339833, "epoch": 4094} {"train_loss": -25.8707275390625, "global_step": 339834, "epoch": 4094} {"train_loss": -26.008075714111328, "global_step": 339835, "epoch": 4094} {"train_loss": -26.259496688842773, "global_step": 339836, "epoch": 4094} {"train_loss": -26.75489616394043, "global_step": 339837, "epoch": 4094} {"train_loss": -25.949512481689453, "global_step": 339838, "epoch": 4094} {"train_loss": -25.751218795776367, "global_step": 339839, "epoch": 4094} {"train_loss": -25.845163345336914, "global_step": 339840, "epoch": 4094} {"train_loss": -25.697513580322266, "global_step": 339841, "epoch": 4094} {"train_loss": -26.309024810791016, "global_step": 339842, "epoch": 4094} {"train_loss": -26.288562774658203, "global_step": 339843, "epoch": 4094} {"train_loss": -26.3416805267334, "global_step": 339844, "epoch": 4094} {"train_loss": -26.00837516784668, "global_step": 339845, "epoch": 4094} {"train_loss": -26.21369743347168, "global_step": 339846, "epoch": 4094} {"train_loss": -26.187576293945312, "global_step": 339847, "epoch": 4094} {"train_loss": -26.410974502563477, "global_step": 339848, "epoch": 4094} {"train_loss": -26.051593780517578, "global_step": 339849, "epoch": 4094} {"train_loss": -26.02168083190918, "global_step": 339850, "epoch": 4094} {"train_loss": -26.063159942626953, "global_step": 339851, "epoch": 4094} {"train_loss": -25.9476375579834, "global_step": 339852, "epoch": 4094} {"train_loss": -26.50674819946289, "global_step": 339853, "epoch": 4094} {"train_loss": -26.51955223083496, "global_step": 339854, "epoch": 4094} {"train_loss": -25.878293991088867, "global_step": 339855, "epoch": 4094} {"train_loss": -26.150497436523438, "global_step": 339856, "epoch": 4094} {"train_loss": -26.018537521362305, "global_step": 339857, "epoch": 4094} {"train_loss": -25.61578369140625, "global_step": 339858, "epoch": 4094} {"train_loss": -25.950178146362305, "global_step": 339859, "epoch": 4094} {"train_loss": -25.853164672851562, "global_step": 339860, "epoch": 4094} {"train_loss": -26.35060691833496, "global_step": 339861, "epoch": 4094} {"train_loss": -26.453771591186523, "global_step": 339862, "epoch": 4094} {"train_loss": -26.0361385345459, "global_step": 339863, "epoch": 4094} {"train_loss": -26.228036880493164, "global_step": 339864, "epoch": 4094} {"train_loss": -25.870344161987305, "global_step": 339865, "epoch": 4094} {"train_loss": -25.773120880126953, "global_step": 339866, "epoch": 4094} {"train_loss": -26.204885482788086, "global_step": 339867, "epoch": 4094} {"train_loss": -26.10597038269043, "global_step": 339868, "epoch": 4094} {"train_loss": -26.010168075561523, "global_step": 339869, "epoch": 4094} {"train_loss": -26.031946182250977, "global_step": 339870, "epoch": 4094} {"train_loss": -25.790756225585938, "global_step": 339871, "epoch": 4094} {"train_loss": -26.119421005249023, "global_step": 339872, "epoch": 4094} {"train_loss": -26.2434139251709, "global_step": 339873, "epoch": 4094} {"train_loss": -26.00668716430664, "global_step": 339874, "epoch": 4094} {"train_loss": -26.115854263305664, "global_step": 339875, "epoch": 4094} {"train_loss": -25.866697311401367, "global_step": 339876, "epoch": 4094} {"train_loss": -26.022878646850586, "global_step": 339877, "epoch": 4094} {"train_loss": -25.674915313720703, "global_step": 339878, "epoch": 4094} {"train_loss": -25.946935653686523, "global_step": 339879, "epoch": 4094} {"train_loss": -26.031646728515625, "global_step": 339880, "epoch": 4094} {"train_loss": -26.182937622070312, "global_step": 339881, "epoch": 4094} {"train_loss": -26.286334991455078, "global_step": 339882, "epoch": 4094} {"train_loss": -26.331979751586914, "global_step": 339883, "epoch": 4094} {"train_loss": -25.967558274786157, "global_step": 339884, "epoch": 4094, "val_loss": 6568811.0} {"train_loss": -24.88813018798828, "global_step": 339885, "epoch": 4095} {"train_loss": -25.723325729370117, "global_step": 339886, "epoch": 4095} {"train_loss": -25.23847770690918, "global_step": 339887, "epoch": 4095} {"train_loss": -25.350879669189453, "global_step": 339888, "epoch": 4095} {"train_loss": -25.339460372924805, "global_step": 339889, "epoch": 4095} {"train_loss": -25.49677085876465, "global_step": 339890, "epoch": 4095} {"train_loss": -25.774677276611328, "global_step": 339891, "epoch": 4095} {"train_loss": -25.62017822265625, "global_step": 339892, "epoch": 4095} {"train_loss": -25.329965591430664, "global_step": 339893, "epoch": 4095} {"train_loss": -25.88651466369629, "global_step": 339894, "epoch": 4095} {"train_loss": -25.69327735900879, "global_step": 339895, "epoch": 4095} {"train_loss": -25.57711410522461, "global_step": 339896, "epoch": 4095} {"train_loss": -25.927886962890625, "global_step": 339897, "epoch": 4095} {"train_loss": -25.477630615234375, "global_step": 339898, "epoch": 4095} {"train_loss": -25.322643280029297, "global_step": 339899, "epoch": 4095} {"train_loss": -25.262985229492188, "global_step": 339900, "epoch": 4095} {"train_loss": -25.546751022338867, "global_step": 339901, "epoch": 4095} {"train_loss": -25.531658172607422, "global_step": 339902, "epoch": 4095} {"train_loss": -25.326017379760742, "global_step": 339903, "epoch": 4095} {"train_loss": -25.50982666015625, "global_step": 339904, "epoch": 4095} {"train_loss": -25.611682891845703, "global_step": 339905, "epoch": 4095} {"train_loss": -25.614105224609375, "global_step": 339906, "epoch": 4095} {"train_loss": -25.5502986907959, "global_step": 339907, "epoch": 4095} {"train_loss": -25.87615966796875, "global_step": 339908, "epoch": 4095} {"train_loss": -25.9257755279541, "global_step": 339909, "epoch": 4095} {"train_loss": -25.699155807495117, "global_step": 339910, "epoch": 4095} {"train_loss": -25.901025772094727, "global_step": 339911, "epoch": 4095} {"train_loss": -26.145984649658203, "global_step": 339912, "epoch": 4095} {"train_loss": -25.87137222290039, "global_step": 339913, "epoch": 4095} {"train_loss": -26.174341201782227, "global_step": 339914, "epoch": 4095} {"train_loss": -26.0953426361084, "global_step": 339915, "epoch": 4095} {"train_loss": -25.770578384399414, "global_step": 339916, "epoch": 4095} {"train_loss": -26.2896785736084, "global_step": 339917, "epoch": 4095} {"train_loss": -25.847803115844727, "global_step": 339918, "epoch": 4095} {"train_loss": -26.175321578979492, "global_step": 339919, "epoch": 4095} {"train_loss": -25.863874435424805, "global_step": 339920, "epoch": 4095} {"train_loss": -26.25543785095215, "global_step": 339921, "epoch": 4095} {"train_loss": -25.94647216796875, "global_step": 339922, "epoch": 4095} {"train_loss": -26.108346939086914, "global_step": 339923, "epoch": 4095} {"train_loss": -26.25302505493164, "global_step": 339924, "epoch": 4095} {"train_loss": -25.992919921875, "global_step": 339925, "epoch": 4095} {"train_loss": -25.859777450561523, "global_step": 339926, "epoch": 4095} {"train_loss": -26.115427017211914, "global_step": 339927, "epoch": 4095} {"train_loss": -26.275527954101562, "global_step": 339928, "epoch": 4095} {"train_loss": -26.450708389282227, "global_step": 339929, "epoch": 4095} {"train_loss": -26.64496421813965, "global_step": 339930, "epoch": 4095} {"train_loss": -26.310922622680664, "global_step": 339931, "epoch": 4095} {"train_loss": -26.31412696838379, "global_step": 339932, "epoch": 4095} {"train_loss": -26.04014015197754, "global_step": 339933, "epoch": 4095} {"train_loss": -26.370956420898438, "global_step": 339934, "epoch": 4095} {"train_loss": -25.494150161743164, "global_step": 339935, "epoch": 4095} {"train_loss": -24.29861831665039, "global_step": 339936, "epoch": 4095} {"train_loss": -23.896013259887695, "global_step": 339937, "epoch": 4095} {"train_loss": -25.04542350769043, "global_step": 339938, "epoch": 4095} {"train_loss": -25.299985885620117, "global_step": 339939, "epoch": 4095} {"train_loss": -25.384180068969727, "global_step": 339940, "epoch": 4095} {"train_loss": -25.360214233398438, "global_step": 339941, "epoch": 4095} {"train_loss": -25.54080581665039, "global_step": 339942, "epoch": 4095} {"train_loss": -25.461761474609375, "global_step": 339943, "epoch": 4095} {"train_loss": -25.7883358001709, "global_step": 339944, "epoch": 4095} {"train_loss": -25.362653732299805, "global_step": 339945, "epoch": 4095} {"train_loss": -25.661142349243164, "global_step": 339946, "epoch": 4095} {"train_loss": -25.62259292602539, "global_step": 339947, "epoch": 4095} {"train_loss": -25.466550827026367, "global_step": 339948, "epoch": 4095} {"train_loss": -25.740558624267578, "global_step": 339949, "epoch": 4095} {"train_loss": -25.806222915649414, "global_step": 339950, "epoch": 4095} {"train_loss": -25.64383888244629, "global_step": 339951, "epoch": 4095} {"train_loss": -26.1519775390625, "global_step": 339952, "epoch": 4095} {"train_loss": -26.020618438720703, "global_step": 339953, "epoch": 4095} {"train_loss": -26.140716552734375, "global_step": 339954, "epoch": 4095} {"train_loss": -25.819446563720703, "global_step": 339955, "epoch": 4095} {"train_loss": -25.993894577026367, "global_step": 339956, "epoch": 4095} {"train_loss": -26.109333038330078, "global_step": 339957, "epoch": 4095} {"train_loss": -25.907331466674805, "global_step": 339958, "epoch": 4095} {"train_loss": -25.817853927612305, "global_step": 339959, "epoch": 4095} {"train_loss": -26.1475887298584, "global_step": 339960, "epoch": 4095} {"train_loss": -25.940155029296875, "global_step": 339961, "epoch": 4095} {"train_loss": -25.747488021850586, "global_step": 339962, "epoch": 4095} {"train_loss": -25.808277130126953, "global_step": 339963, "epoch": 4095} {"train_loss": -25.66632080078125, "global_step": 339964, "epoch": 4095} {"train_loss": -26.179492950439453, "global_step": 339965, "epoch": 4095} {"train_loss": -26.11036491394043, "global_step": 339966, "epoch": 4095} {"train_loss": -25.777055717376342, "global_step": 339967, "epoch": 4095, "val_loss": 6509714.0} {"train_loss": -25.401880264282227, "global_step": 339968, "epoch": 4096} {"train_loss": -26.49628257751465, "global_step": 339969, "epoch": 4096} {"train_loss": -25.538557052612305, "global_step": 339970, "epoch": 4096} {"train_loss": -25.71417808532715, "global_step": 339971, "epoch": 4096} {"train_loss": -25.667926788330078, "global_step": 339972, "epoch": 4096} {"train_loss": -25.76712417602539, "global_step": 339973, "epoch": 4096} {"train_loss": -25.799219131469727, "global_step": 339974, "epoch": 4096} {"train_loss": -25.977996826171875, "global_step": 339975, "epoch": 4096} {"train_loss": -25.512287139892578, "global_step": 339976, "epoch": 4096} {"train_loss": -25.485750198364258, "global_step": 339977, "epoch": 4096} {"train_loss": -25.605741500854492, "global_step": 339978, "epoch": 4096} {"train_loss": -26.251148223876953, "global_step": 339979, "epoch": 4096} {"train_loss": -25.570444107055664, "global_step": 339980, "epoch": 4096} {"train_loss": -25.7448787689209, "global_step": 339981, "epoch": 4096} {"train_loss": -25.899078369140625, "global_step": 339982, "epoch": 4096} {"train_loss": -25.970861434936523, "global_step": 339983, "epoch": 4096} {"train_loss": -25.99228858947754, "global_step": 339984, "epoch": 4096} {"train_loss": -25.941974639892578, "global_step": 339985, "epoch": 4096} {"train_loss": -25.879602432250977, "global_step": 339986, "epoch": 4096} {"train_loss": -26.171222686767578, "global_step": 339987, "epoch": 4096} {"train_loss": -26.444311141967773, "global_step": 339988, "epoch": 4096} {"train_loss": -25.9608211517334, "global_step": 339989, "epoch": 4096} {"train_loss": -26.02286148071289, "global_step": 339990, "epoch": 4096} {"train_loss": -25.941986083984375, "global_step": 339991, "epoch": 4096} {"train_loss": -26.405790328979492, "global_step": 339992, "epoch": 4096} {"train_loss": -25.758075714111328, "global_step": 339993, "epoch": 4096} {"train_loss": -26.05474853515625, "global_step": 339994, "epoch": 4096} {"train_loss": -25.81741714477539, "global_step": 339995, "epoch": 4096} {"train_loss": -26.020212173461914, "global_step": 339996, "epoch": 4096} {"train_loss": -25.98456382751465, "global_step": 339997, "epoch": 4096} {"train_loss": -26.11821937561035, "global_step": 339998, "epoch": 4096} {"train_loss": -25.8138484954834, "global_step": 339999, "epoch": 4096} {"train_loss": -25.703235626220703, "global_step": 340000, "epoch": 4096} {"train_loss": -25.843881607055664, "global_step": 340001, "epoch": 4096} {"train_loss": -25.997028350830078, "global_step": 340002, "epoch": 4096} {"train_loss": -25.715747833251953, "global_step": 340003, "epoch": 4096} {"train_loss": -25.942235946655273, "global_step": 340004, "epoch": 4096} {"train_loss": -25.781890869140625, "global_step": 340005, "epoch": 4096} {"train_loss": -25.9105281829834, "global_step": 340006, "epoch": 4096} {"train_loss": -25.661849975585938, "global_step": 340007, "epoch": 4096} {"train_loss": -26.237390518188477, "global_step": 340008, "epoch": 4096} {"train_loss": -26.18912696838379, "global_step": 340009, "epoch": 4096} {"train_loss": -25.83298683166504, "global_step": 340010, "epoch": 4096} {"train_loss": -26.074914932250977, "global_step": 340011, "epoch": 4096} {"train_loss": -26.111204147338867, "global_step": 340012, "epoch": 4096} {"train_loss": -25.89899253845215, "global_step": 340013, "epoch": 4096} {"train_loss": -26.18623924255371, "global_step": 340014, "epoch": 4096} {"train_loss": -26.01592445373535, "global_step": 340015, "epoch": 4096} {"train_loss": -26.475378036499023, "global_step": 340016, "epoch": 4096} {"train_loss": -26.15869140625, "global_step": 340017, "epoch": 4096} {"train_loss": -26.268274307250977, "global_step": 340018, "epoch": 4096} {"train_loss": -26.346277236938477, "global_step": 340019, "epoch": 4096} {"train_loss": -26.07203483581543, "global_step": 340020, "epoch": 4096} {"train_loss": -26.330785751342773, "global_step": 340021, "epoch": 4096} {"train_loss": -25.978368759155273, "global_step": 340022, "epoch": 4096} {"train_loss": -26.14217185974121, "global_step": 340023, "epoch": 4096} {"train_loss": -26.221515655517578, "global_step": 340024, "epoch": 4096} {"train_loss": -26.3408203125, "global_step": 340025, "epoch": 4096} {"train_loss": -26.03826904296875, "global_step": 340026, "epoch": 4096} {"train_loss": -26.0814151763916, "global_step": 340027, "epoch": 4096} {"train_loss": -26.018217086791992, "global_step": 340028, "epoch": 4096} {"train_loss": -26.47944450378418, "global_step": 340029, "epoch": 4096} {"train_loss": -25.993988037109375, "global_step": 340030, "epoch": 4096} {"train_loss": -26.223840713500977, "global_step": 340031, "epoch": 4096} {"train_loss": -25.776992797851562, "global_step": 340032, "epoch": 4096} {"train_loss": -26.042577743530273, "global_step": 340033, "epoch": 4096} {"train_loss": -26.151752471923828, "global_step": 340034, "epoch": 4096} {"train_loss": -26.097915649414062, "global_step": 340035, "epoch": 4096} {"train_loss": -26.087390899658203, "global_step": 340036, "epoch": 4096} {"train_loss": -26.103918075561523, "global_step": 340037, "epoch": 4096} {"train_loss": -25.821094512939453, "global_step": 340038, "epoch": 4096} {"train_loss": -26.0108642578125, "global_step": 340039, "epoch": 4096} {"train_loss": -25.911649703979492, "global_step": 340040, "epoch": 4096} {"train_loss": -25.640256881713867, "global_step": 340041, "epoch": 4096} {"train_loss": -26.036794662475586, "global_step": 340042, "epoch": 4096} {"train_loss": -26.0175838470459, "global_step": 340043, "epoch": 4096} {"train_loss": -26.382511138916016, "global_step": 340044, "epoch": 4096} {"train_loss": -26.035017013549805, "global_step": 340045, "epoch": 4096} {"train_loss": -26.07806396484375, "global_step": 340046, "epoch": 4096} {"train_loss": -25.9893798828125, "global_step": 340047, "epoch": 4096} {"train_loss": -26.262609481811523, "global_step": 340048, "epoch": 4096} {"train_loss": -25.83392906188965, "global_step": 340049, "epoch": 4096} {"train_loss": -25.98990580547287, "global_step": 340050, "epoch": 4096, "val_loss": 6558298.5} {"train_loss": -21.447513580322266, "global_step": 340051, "epoch": 4097} {"train_loss": -23.841564178466797, "global_step": 340052, "epoch": 4097} {"train_loss": -23.5584716796875, "global_step": 340053, "epoch": 4097} {"train_loss": -22.564868927001953, "global_step": 340054, "epoch": 4097} {"train_loss": -23.740724563598633, "global_step": 340055, "epoch": 4097} {"train_loss": -24.58725357055664, "global_step": 340056, "epoch": 4097} {"train_loss": -23.48149299621582, "global_step": 340057, "epoch": 4097} {"train_loss": -24.16214370727539, "global_step": 340058, "epoch": 4097} {"train_loss": -24.50954818725586, "global_step": 340059, "epoch": 4097} {"train_loss": -24.4948673248291, "global_step": 340060, "epoch": 4097} {"train_loss": -24.62459373474121, "global_step": 340061, "epoch": 4097} {"train_loss": -24.660802841186523, "global_step": 340062, "epoch": 4097} {"train_loss": -24.723201751708984, "global_step": 340063, "epoch": 4097} {"train_loss": -24.874095916748047, "global_step": 340064, "epoch": 4097} {"train_loss": -25.135072708129883, "global_step": 340065, "epoch": 4097} {"train_loss": -25.037479400634766, "global_step": 340066, "epoch": 4097} {"train_loss": -25.02906608581543, "global_step": 340067, "epoch": 4097} {"train_loss": -25.142053604125977, "global_step": 340068, "epoch": 4097} {"train_loss": -25.520349502563477, "global_step": 340069, "epoch": 4097} {"train_loss": -24.681900024414062, "global_step": 340070, "epoch": 4097} {"train_loss": -25.190628051757812, "global_step": 340071, "epoch": 4097} {"train_loss": -25.37974739074707, "global_step": 340072, "epoch": 4097} {"train_loss": -25.483448028564453, "global_step": 340073, "epoch": 4097} {"train_loss": -25.52742576599121, "global_step": 340074, "epoch": 4097} {"train_loss": -25.374113082885742, "global_step": 340075, "epoch": 4097} {"train_loss": -25.42109489440918, "global_step": 340076, "epoch": 4097} {"train_loss": -25.61810874938965, "global_step": 340077, "epoch": 4097} {"train_loss": -25.27427101135254, "global_step": 340078, "epoch": 4097} {"train_loss": -25.659177780151367, "global_step": 340079, "epoch": 4097} {"train_loss": -25.546873092651367, "global_step": 340080, "epoch": 4097} {"train_loss": -25.939453125, "global_step": 340081, "epoch": 4097} {"train_loss": -25.75873374938965, "global_step": 340082, "epoch": 4097} {"train_loss": -25.89076805114746, "global_step": 340083, "epoch": 4097} {"train_loss": -26.047887802124023, "global_step": 340084, "epoch": 4097} {"train_loss": -25.6795654296875, "global_step": 340085, "epoch": 4097} {"train_loss": -25.78205680847168, "global_step": 340086, "epoch": 4097} {"train_loss": -25.92568016052246, "global_step": 340087, "epoch": 4097} {"train_loss": -26.068695068359375, "global_step": 340088, "epoch": 4097} {"train_loss": -25.60506248474121, "global_step": 340089, "epoch": 4097} {"train_loss": -25.707059860229492, "global_step": 340090, "epoch": 4097} {"train_loss": -25.946210861206055, "global_step": 340091, "epoch": 4097} {"train_loss": -25.76727294921875, "global_step": 340092, "epoch": 4097} {"train_loss": -25.66910743713379, "global_step": 340093, "epoch": 4097} {"train_loss": -25.829938888549805, "global_step": 340094, "epoch": 4097} {"train_loss": -26.02825355529785, "global_step": 340095, "epoch": 4097} {"train_loss": -25.997594833374023, "global_step": 340096, "epoch": 4097} {"train_loss": -26.15584373474121, "global_step": 340097, "epoch": 4097} {"train_loss": -26.230804443359375, "global_step": 340098, "epoch": 4097} {"train_loss": -26.0062255859375, "global_step": 340099, "epoch": 4097} {"train_loss": -25.69892692565918, "global_step": 340100, "epoch": 4097} {"train_loss": -26.121252059936523, "global_step": 340101, "epoch": 4097} {"train_loss": -26.288238525390625, "global_step": 340102, "epoch": 4097} {"train_loss": -26.263025283813477, "global_step": 340103, "epoch": 4097} {"train_loss": -25.968198776245117, "global_step": 340104, "epoch": 4097} {"train_loss": -25.991302490234375, "global_step": 340105, "epoch": 4097} {"train_loss": -25.9708251953125, "global_step": 340106, "epoch": 4097} {"train_loss": -25.913965225219727, "global_step": 340107, "epoch": 4097} {"train_loss": -25.742849349975586, "global_step": 340108, "epoch": 4097} {"train_loss": -25.938024520874023, "global_step": 340109, "epoch": 4097} {"train_loss": -26.088232040405273, "global_step": 340110, "epoch": 4097} {"train_loss": -25.941577911376953, "global_step": 340111, "epoch": 4097} {"train_loss": -26.075122833251953, "global_step": 340112, "epoch": 4097} {"train_loss": -26.03696060180664, "global_step": 340113, "epoch": 4097} {"train_loss": -26.1455020904541, "global_step": 340114, "epoch": 4097} {"train_loss": -26.30116081237793, "global_step": 340115, "epoch": 4097} {"train_loss": -25.956714630126953, "global_step": 340116, "epoch": 4097} {"train_loss": -26.279163360595703, "global_step": 340117, "epoch": 4097} {"train_loss": -26.201568603515625, "global_step": 340118, "epoch": 4097} {"train_loss": -26.0976505279541, "global_step": 340119, "epoch": 4097} {"train_loss": -25.872394561767578, "global_step": 340120, "epoch": 4097} {"train_loss": -25.815784454345703, "global_step": 340121, "epoch": 4097} {"train_loss": -26.12190055847168, "global_step": 340122, "epoch": 4097} {"train_loss": -25.877826690673828, "global_step": 340123, "epoch": 4097} {"train_loss": -26.072834014892578, "global_step": 340124, "epoch": 4097} {"train_loss": -25.977294921875, "global_step": 340125, "epoch": 4097} {"train_loss": -26.01002311706543, "global_step": 340126, "epoch": 4097} {"train_loss": -25.887298583984375, "global_step": 340127, "epoch": 4097} {"train_loss": -25.8907413482666, "global_step": 340128, "epoch": 4097} {"train_loss": -26.005334854125977, "global_step": 340129, "epoch": 4097} {"train_loss": -25.832014083862305, "global_step": 340130, "epoch": 4097} {"train_loss": -25.870595932006836, "global_step": 340131, "epoch": 4097} {"train_loss": -26.311254501342773, "global_step": 340132, "epoch": 4097} {"train_loss": -25.50608133982463, "global_step": 340133, "epoch": 4097, "val_loss": 6567964.0} {"train_loss": -25.371381759643555, "global_step": 340134, "epoch": 4098} {"train_loss": -25.273365020751953, "global_step": 340135, "epoch": 4098} {"train_loss": -25.326416015625, "global_step": 340136, "epoch": 4098} {"train_loss": -25.410978317260742, "global_step": 340137, "epoch": 4098} {"train_loss": -25.798620223999023, "global_step": 340138, "epoch": 4098} {"train_loss": -25.293352127075195, "global_step": 340139, "epoch": 4098} {"train_loss": -25.742467880249023, "global_step": 340140, "epoch": 4098} {"train_loss": -25.94883155822754, "global_step": 340141, "epoch": 4098} {"train_loss": -25.694482803344727, "global_step": 340142, "epoch": 4098} {"train_loss": -25.935529708862305, "global_step": 340143, "epoch": 4098} {"train_loss": -25.699493408203125, "global_step": 340144, "epoch": 4098} {"train_loss": -25.686798095703125, "global_step": 340145, "epoch": 4098} {"train_loss": -25.984832763671875, "global_step": 340146, "epoch": 4098} {"train_loss": -25.927038192749023, "global_step": 340147, "epoch": 4098} {"train_loss": -25.695539474487305, "global_step": 340148, "epoch": 4098} {"train_loss": -25.895883560180664, "global_step": 340149, "epoch": 4098} {"train_loss": -25.924535751342773, "global_step": 340150, "epoch": 4098} {"train_loss": -25.82636833190918, "global_step": 340151, "epoch": 4098} {"train_loss": -26.21851921081543, "global_step": 340152, "epoch": 4098} {"train_loss": -25.79316520690918, "global_step": 340153, "epoch": 4098} {"train_loss": -26.155166625976562, "global_step": 340154, "epoch": 4098} {"train_loss": -25.593130111694336, "global_step": 340155, "epoch": 4098} {"train_loss": -25.779266357421875, "global_step": 340156, "epoch": 4098} {"train_loss": -25.997848510742188, "global_step": 340157, "epoch": 4098} {"train_loss": -25.87733268737793, "global_step": 340158, "epoch": 4098} {"train_loss": -26.119586944580078, "global_step": 340159, "epoch": 4098} {"train_loss": -26.209980010986328, "global_step": 340160, "epoch": 4098} {"train_loss": -26.032026290893555, "global_step": 340161, "epoch": 4098} {"train_loss": -25.767745971679688, "global_step": 340162, "epoch": 4098} {"train_loss": -25.80707359313965, "global_step": 340163, "epoch": 4098} {"train_loss": -25.917728424072266, "global_step": 340164, "epoch": 4098} {"train_loss": -26.130599975585938, "global_step": 340165, "epoch": 4098} {"train_loss": -26.07240104675293, "global_step": 340166, "epoch": 4098} {"train_loss": -26.030664443969727, "global_step": 340167, "epoch": 4098} {"train_loss": -25.6286563873291, "global_step": 340168, "epoch": 4098} {"train_loss": -26.328771591186523, "global_step": 340169, "epoch": 4098} {"train_loss": -26.258853912353516, "global_step": 340170, "epoch": 4098} {"train_loss": -25.9148006439209, "global_step": 340171, "epoch": 4098} {"train_loss": -26.199872970581055, "global_step": 340172, "epoch": 4098} {"train_loss": -26.208478927612305, "global_step": 340173, "epoch": 4098} {"train_loss": -26.325489044189453, "global_step": 340174, "epoch": 4098} {"train_loss": -26.21567726135254, "global_step": 340175, "epoch": 4098} {"train_loss": -26.018798828125, "global_step": 340176, "epoch": 4098} {"train_loss": -26.161182403564453, "global_step": 340177, "epoch": 4098} {"train_loss": -26.467741012573242, "global_step": 340178, "epoch": 4098} {"train_loss": -26.236740112304688, "global_step": 340179, "epoch": 4098} {"train_loss": -25.980688095092773, "global_step": 340180, "epoch": 4098} {"train_loss": -26.2204532623291, "global_step": 340181, "epoch": 4098} {"train_loss": -26.343103408813477, "global_step": 340182, "epoch": 4098} {"train_loss": -26.280506134033203, "global_step": 340183, "epoch": 4098} {"train_loss": -25.916656494140625, "global_step": 340184, "epoch": 4098} {"train_loss": -26.037067413330078, "global_step": 340185, "epoch": 4098} {"train_loss": -26.244970321655273, "global_step": 340186, "epoch": 4098} {"train_loss": -26.331205368041992, "global_step": 340187, "epoch": 4098} {"train_loss": -26.627294540405273, "global_step": 340188, "epoch": 4098} {"train_loss": -26.16629981994629, "global_step": 340189, "epoch": 4098} {"train_loss": -25.933862686157227, "global_step": 340190, "epoch": 4098} {"train_loss": -26.025909423828125, "global_step": 340191, "epoch": 4098} {"train_loss": -26.012720108032227, "global_step": 340192, "epoch": 4098} {"train_loss": -26.29425621032715, "global_step": 340193, "epoch": 4098} {"train_loss": -25.921239852905273, "global_step": 340194, "epoch": 4098} {"train_loss": -26.140851974487305, "global_step": 340195, "epoch": 4098} {"train_loss": -26.169347763061523, "global_step": 340196, "epoch": 4098} {"train_loss": -26.201330184936523, "global_step": 340197, "epoch": 4098} {"train_loss": -26.456228256225586, "global_step": 340198, "epoch": 4098} {"train_loss": -25.938562393188477, "global_step": 340199, "epoch": 4098} {"train_loss": -25.887725830078125, "global_step": 340200, "epoch": 4098} {"train_loss": -26.111780166625977, "global_step": 340201, "epoch": 4098} {"train_loss": -25.9732666015625, "global_step": 340202, "epoch": 4098} {"train_loss": -25.96246337890625, "global_step": 340203, "epoch": 4098} {"train_loss": -25.8282413482666, "global_step": 340204, "epoch": 4098} {"train_loss": -26.29642677307129, "global_step": 340205, "epoch": 4098} {"train_loss": -26.39983558654785, "global_step": 340206, "epoch": 4098} {"train_loss": -25.839954376220703, "global_step": 340207, "epoch": 4098} {"train_loss": -26.0264949798584, "global_step": 340208, "epoch": 4098} {"train_loss": -26.32941246032715, "global_step": 340209, "epoch": 4098} {"train_loss": -25.965152740478516, "global_step": 340210, "epoch": 4098} {"train_loss": -26.22022819519043, "global_step": 340211, "epoch": 4098} {"train_loss": -26.49321937561035, "global_step": 340212, "epoch": 4098} {"train_loss": -26.13302993774414, "global_step": 340213, "epoch": 4098} {"train_loss": -25.70728874206543, "global_step": 340214, "epoch": 4098} {"train_loss": -25.329103469848633, "global_step": 340215, "epoch": 4098} {"train_loss": -25.979953168386437, "global_step": 340216, "epoch": 4098, "val_loss": 6457281.0} {"train_loss": -22.416194915771484, "global_step": 340217, "epoch": 4099} {"train_loss": -22.365766525268555, "global_step": 340218, "epoch": 4099} {"train_loss": -24.036466598510742, "global_step": 340219, "epoch": 4099} {"train_loss": -21.652753829956055, "global_step": 340220, "epoch": 4099} {"train_loss": -24.600351333618164, "global_step": 340221, "epoch": 4099} {"train_loss": -23.124860763549805, "global_step": 340222, "epoch": 4099} {"train_loss": -24.62530517578125, "global_step": 340223, "epoch": 4099} {"train_loss": -24.671960830688477, "global_step": 340224, "epoch": 4099} {"train_loss": -24.20201301574707, "global_step": 340225, "epoch": 4099} {"train_loss": -24.650245666503906, "global_step": 340226, "epoch": 4099} {"train_loss": -24.357728958129883, "global_step": 340227, "epoch": 4099} {"train_loss": -24.49668312072754, "global_step": 340228, "epoch": 4099} {"train_loss": -24.67539405822754, "global_step": 340229, "epoch": 4099} {"train_loss": -25.140493392944336, "global_step": 340230, "epoch": 4099} {"train_loss": -24.977079391479492, "global_step": 340231, "epoch": 4099} {"train_loss": -25.0580997467041, "global_step": 340232, "epoch": 4099} {"train_loss": -25.056936264038086, "global_step": 340233, "epoch": 4099} {"train_loss": -25.05175018310547, "global_step": 340234, "epoch": 4099} {"train_loss": -25.136795043945312, "global_step": 340235, "epoch": 4099} {"train_loss": -25.36895751953125, "global_step": 340236, "epoch": 4099} {"train_loss": -25.12393569946289, "global_step": 340237, "epoch": 4099} {"train_loss": -25.12152099609375, "global_step": 340238, "epoch": 4099} {"train_loss": -25.12420082092285, "global_step": 340239, "epoch": 4099} {"train_loss": -25.2275390625, "global_step": 340240, "epoch": 4099} {"train_loss": -25.31748390197754, "global_step": 340241, "epoch": 4099} {"train_loss": -24.974416732788086, "global_step": 340242, "epoch": 4099} {"train_loss": -25.10857582092285, "global_step": 340243, "epoch": 4099} {"train_loss": -24.966941833496094, "global_step": 340244, "epoch": 4099} {"train_loss": -24.967954635620117, "global_step": 340245, "epoch": 4099} {"train_loss": -25.655654907226562, "global_step": 340246, "epoch": 4099} {"train_loss": -25.44139862060547, "global_step": 340247, "epoch": 4099} {"train_loss": -25.555828094482422, "global_step": 340248, "epoch": 4099} {"train_loss": -25.1982364654541, "global_step": 340249, "epoch": 4099} {"train_loss": -25.249357223510742, "global_step": 340250, "epoch": 4099} {"train_loss": -25.854944229125977, "global_step": 340251, "epoch": 4099} {"train_loss": -25.83051872253418, "global_step": 340252, "epoch": 4099} {"train_loss": -25.758630752563477, "global_step": 340253, "epoch": 4099} {"train_loss": -25.648929595947266, "global_step": 340254, "epoch": 4099} {"train_loss": -25.88276481628418, "global_step": 340255, "epoch": 4099} {"train_loss": -25.555681228637695, "global_step": 340256, "epoch": 4099} {"train_loss": -25.718854904174805, "global_step": 340257, "epoch": 4099} {"train_loss": -25.46928596496582, "global_step": 340258, "epoch": 4099} {"train_loss": -25.566354751586914, "global_step": 340259, "epoch": 4099} {"train_loss": -25.6323184967041, "global_step": 340260, "epoch": 4099} {"train_loss": -25.867965698242188, "global_step": 340261, "epoch": 4099} {"train_loss": -25.832883834838867, "global_step": 340262, "epoch": 4099} {"train_loss": -25.62611961364746, "global_step": 340263, "epoch": 4099} {"train_loss": -25.75062370300293, "global_step": 340264, "epoch": 4099} {"train_loss": -25.744953155517578, "global_step": 340265, "epoch": 4099} {"train_loss": -26.161130905151367, "global_step": 340266, "epoch": 4099} {"train_loss": -25.87384605407715, "global_step": 340267, "epoch": 4099} {"train_loss": -26.115747451782227, "global_step": 340268, "epoch": 4099} {"train_loss": -25.40237045288086, "global_step": 340269, "epoch": 4099} {"train_loss": -25.73186683654785, "global_step": 340270, "epoch": 4099} {"train_loss": -25.7650089263916, "global_step": 340271, "epoch": 4099} {"train_loss": -25.965167999267578, "global_step": 340272, "epoch": 4099} {"train_loss": -26.055957794189453, "global_step": 340273, "epoch": 4099} {"train_loss": -25.742944717407227, "global_step": 340274, "epoch": 4099} {"train_loss": -25.476158142089844, "global_step": 340275, "epoch": 4099} {"train_loss": -25.674413681030273, "global_step": 340276, "epoch": 4099} {"train_loss": -25.66688346862793, "global_step": 340277, "epoch": 4099} {"train_loss": -26.169906616210938, "global_step": 340278, "epoch": 4099} {"train_loss": -26.066425323486328, "global_step": 340279, "epoch": 4099} {"train_loss": -25.97785758972168, "global_step": 340280, "epoch": 4099} {"train_loss": -26.096527099609375, "global_step": 340281, "epoch": 4099} {"train_loss": -26.10916519165039, "global_step": 340282, "epoch": 4099} {"train_loss": -25.944976806640625, "global_step": 340283, "epoch": 4099} {"train_loss": -25.4111270904541, "global_step": 340284, "epoch": 4099} {"train_loss": -26.125106811523438, "global_step": 340285, "epoch": 4099} {"train_loss": -26.504993438720703, "global_step": 340286, "epoch": 4099} {"train_loss": -26.264801025390625, "global_step": 340287, "epoch": 4099} {"train_loss": -26.15228843688965, "global_step": 340288, "epoch": 4099} {"train_loss": -26.213825225830078, "global_step": 340289, "epoch": 4099} {"train_loss": -26.406118392944336, "global_step": 340290, "epoch": 4099} {"train_loss": -26.025251388549805, "global_step": 340291, "epoch": 4099} {"train_loss": -26.247907638549805, "global_step": 340292, "epoch": 4099} {"train_loss": -26.151487350463867, "global_step": 340293, "epoch": 4099} {"train_loss": -26.411869049072266, "global_step": 340294, "epoch": 4099} {"train_loss": -26.24127197265625, "global_step": 340295, "epoch": 4099} {"train_loss": -26.047260284423828, "global_step": 340296, "epoch": 4099} {"train_loss": -26.262924194335938, "global_step": 340297, "epoch": 4099} {"train_loss": -26.32551383972168, "global_step": 340298, "epoch": 4099} {"train_loss": -25.419927275324444, "global_step": 340299, "epoch": 4099, "val_loss": 6561834.0} {"train_loss": -25.97467613220215, "global_step": 340300, "epoch": 4100} {"train_loss": -25.787580490112305, "global_step": 340301, "epoch": 4100} {"train_loss": -26.1151065826416, "global_step": 340302, "epoch": 4100} {"train_loss": -25.56938934326172, "global_step": 340303, "epoch": 4100} {"train_loss": -25.996784210205078, "global_step": 340304, "epoch": 4100} {"train_loss": -25.839508056640625, "global_step": 340305, "epoch": 4100} {"train_loss": -26.383535385131836, "global_step": 340306, "epoch": 4100} {"train_loss": -25.488035202026367, "global_step": 340307, "epoch": 4100} {"train_loss": -25.932239532470703, "global_step": 340308, "epoch": 4100} {"train_loss": -26.40882682800293, "global_step": 340309, "epoch": 4100} {"train_loss": -25.93340492248535, "global_step": 340310, "epoch": 4100} {"train_loss": -26.22242546081543, "global_step": 340311, "epoch": 4100} {"train_loss": -26.0089111328125, "global_step": 340312, "epoch": 4100} {"train_loss": -26.181055068969727, "global_step": 340313, "epoch": 4100} {"train_loss": -26.238317489624023, "global_step": 340314, "epoch": 4100} {"train_loss": -25.872196197509766, "global_step": 340315, "epoch": 4100} {"train_loss": -26.291471481323242, "global_step": 340316, "epoch": 4100} {"train_loss": -25.975830078125, "global_step": 340317, "epoch": 4100} {"train_loss": -25.883214950561523, "global_step": 340318, "epoch": 4100} {"train_loss": -26.01096534729004, "global_step": 340319, "epoch": 4100} {"train_loss": -26.003400802612305, "global_step": 340320, "epoch": 4100} {"train_loss": -25.792139053344727, "global_step": 340321, "epoch": 4100} {"train_loss": -25.699905395507812, "global_step": 340322, "epoch": 4100} {"train_loss": -26.308237075805664, "global_step": 340323, "epoch": 4100} {"train_loss": -25.844043731689453, "global_step": 340324, "epoch": 4100} {"train_loss": -26.329792022705078, "global_step": 340325, "epoch": 4100} {"train_loss": -26.151647567749023, "global_step": 340326, "epoch": 4100} {"train_loss": -25.80035400390625, "global_step": 340327, "epoch": 4100} {"train_loss": -26.182266235351562, "global_step": 340328, "epoch": 4100} {"train_loss": -25.923749923706055, "global_step": 340329, "epoch": 4100} {"train_loss": -25.837034225463867, "global_step": 340330, "epoch": 4100} {"train_loss": -26.00458335876465, "global_step": 340331, "epoch": 4100} {"train_loss": -25.91944694519043, "global_step": 340332, "epoch": 4100} {"train_loss": -25.907001495361328, "global_step": 340333, "epoch": 4100} {"train_loss": -26.12531852722168, "global_step": 340334, "epoch": 4100} {"train_loss": -25.45160484313965, "global_step": 340335, "epoch": 4100} {"train_loss": -25.784399032592773, "global_step": 340336, "epoch": 4100} {"train_loss": -25.99469566345215, "global_step": 340337, "epoch": 4100} {"train_loss": -25.799657821655273, "global_step": 340338, "epoch": 4100} {"train_loss": -26.12025260925293, "global_step": 340339, "epoch": 4100} {"train_loss": -25.714231491088867, "global_step": 340340, "epoch": 4100} {"train_loss": -25.873483657836914, "global_step": 340341, "epoch": 4100} {"train_loss": -25.95918846130371, "global_step": 340342, "epoch": 4100} {"train_loss": -26.14381217956543, "global_step": 340343, "epoch": 4100} {"train_loss": -26.423919677734375, "global_step": 340344, "epoch": 4100} {"train_loss": -26.283039093017578, "global_step": 340345, "epoch": 4100} {"train_loss": -26.209848403930664, "global_step": 340346, "epoch": 4100} {"train_loss": -26.32537841796875, "global_step": 340347, "epoch": 4100} {"train_loss": -25.819766998291016, "global_step": 340348, "epoch": 4100} {"train_loss": -26.394485473632812, "global_step": 340349, "epoch": 4100} {"train_loss": -25.839208602905273, "global_step": 340350, "epoch": 4100} {"train_loss": -26.384958267211914, "global_step": 340351, "epoch": 4100} {"train_loss": -26.325708389282227, "global_step": 340352, "epoch": 4100} {"train_loss": -26.21600914001465, "global_step": 340353, "epoch": 4100} {"train_loss": -26.177413940429688, "global_step": 340354, "epoch": 4100} {"train_loss": -26.252872467041016, "global_step": 340355, "epoch": 4100} {"train_loss": -26.120834350585938, "global_step": 340356, "epoch": 4100} {"train_loss": -26.42115592956543, "global_step": 340357, "epoch": 4100} {"train_loss": -26.190876007080078, "global_step": 340358, "epoch": 4100} {"train_loss": -26.357873916625977, "global_step": 340359, "epoch": 4100} {"train_loss": -26.01807975769043, "global_step": 340360, "epoch": 4100} {"train_loss": -26.175506591796875, "global_step": 340361, "epoch": 4100} {"train_loss": -26.404260635375977, "global_step": 340362, "epoch": 4100} {"train_loss": -26.261499404907227, "global_step": 340363, "epoch": 4100} {"train_loss": -26.38102149963379, "global_step": 340364, "epoch": 4100} {"train_loss": -26.1762638092041, "global_step": 340365, "epoch": 4100} {"train_loss": -26.051971435546875, "global_step": 340366, "epoch": 4100} {"train_loss": -25.879657745361328, "global_step": 340367, "epoch": 4100} {"train_loss": -25.940876007080078, "global_step": 340368, "epoch": 4100} {"train_loss": -25.668548583984375, "global_step": 340369, "epoch": 4100} {"train_loss": -26.255773544311523, "global_step": 340370, "epoch": 4100} {"train_loss": -25.911115646362305, "global_step": 340371, "epoch": 4100} {"train_loss": -25.970556259155273, "global_step": 340372, "epoch": 4100} {"train_loss": -26.122791290283203, "global_step": 340373, "epoch": 4100} {"train_loss": -25.776342391967773, "global_step": 340374, "epoch": 4100} {"train_loss": -26.05474853515625, "global_step": 340375, "epoch": 4100} {"train_loss": -26.43955421447754, "global_step": 340376, "epoch": 4100} {"train_loss": -25.827178955078125, "global_step": 340377, "epoch": 4100} {"train_loss": -25.67791175842285, "global_step": 340378, "epoch": 4100} {"train_loss": -26.0985164642334, "global_step": 340379, "epoch": 4100} {"train_loss": -26.1362361907959, "global_step": 340380, "epoch": 4100} {"train_loss": -25.369298934936523, "global_step": 340381, "epoch": 4100} {"train_loss": -26.035655446799403, "global_step": 340382, "epoch": 4100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6572094.0} {"train_loss": -25.93353843688965, "global_step": 340383, "epoch": 4101} {"train_loss": -25.5129337310791, "global_step": 340384, "epoch": 4101} {"train_loss": -25.7608642578125, "global_step": 340385, "epoch": 4101} {"train_loss": -25.65232276916504, "global_step": 340386, "epoch": 4101} {"train_loss": -25.786741256713867, "global_step": 340387, "epoch": 4101} {"train_loss": -25.841886520385742, "global_step": 340388, "epoch": 4101} {"train_loss": -25.549968719482422, "global_step": 340389, "epoch": 4101} {"train_loss": -25.80226707458496, "global_step": 340390, "epoch": 4101} {"train_loss": -25.784265518188477, "global_step": 340391, "epoch": 4101} {"train_loss": -25.821592330932617, "global_step": 340392, "epoch": 4101} {"train_loss": -25.886343002319336, "global_step": 340393, "epoch": 4101} {"train_loss": -25.822097778320312, "global_step": 340394, "epoch": 4101} {"train_loss": -25.570178985595703, "global_step": 340395, "epoch": 4101} {"train_loss": -25.606658935546875, "global_step": 340396, "epoch": 4101} {"train_loss": -25.86110496520996, "global_step": 340397, "epoch": 4101} {"train_loss": -25.979663848876953, "global_step": 340398, "epoch": 4101} {"train_loss": -26.034299850463867, "global_step": 340399, "epoch": 4101} {"train_loss": -25.891782760620117, "global_step": 340400, "epoch": 4101} {"train_loss": -26.1037654876709, "global_step": 340401, "epoch": 4101} {"train_loss": -26.062469482421875, "global_step": 340402, "epoch": 4101} {"train_loss": -26.0831298828125, "global_step": 340403, "epoch": 4101} {"train_loss": -25.770727157592773, "global_step": 340404, "epoch": 4101} {"train_loss": -26.157739639282227, "global_step": 340405, "epoch": 4101} {"train_loss": -26.123228073120117, "global_step": 340406, "epoch": 4101} {"train_loss": -26.14055824279785, "global_step": 340407, "epoch": 4101} {"train_loss": -25.911972045898438, "global_step": 340408, "epoch": 4101} {"train_loss": -26.569242477416992, "global_step": 340409, "epoch": 4101} {"train_loss": -25.994754791259766, "global_step": 340410, "epoch": 4101} {"train_loss": -26.16868019104004, "global_step": 340411, "epoch": 4101} {"train_loss": -26.01666831970215, "global_step": 340412, "epoch": 4101} {"train_loss": -26.45143699645996, "global_step": 340413, "epoch": 4101} {"train_loss": -26.445358276367188, "global_step": 340414, "epoch": 4101} {"train_loss": -26.409177780151367, "global_step": 340415, "epoch": 4101} {"train_loss": -26.46807861328125, "global_step": 340416, "epoch": 4101} {"train_loss": -26.2684383392334, "global_step": 340417, "epoch": 4101} {"train_loss": -26.306547164916992, "global_step": 340418, "epoch": 4101} {"train_loss": -26.56732749938965, "global_step": 340419, "epoch": 4101} {"train_loss": -26.058490753173828, "global_step": 340420, "epoch": 4101} {"train_loss": -26.343597412109375, "global_step": 340421, "epoch": 4101} {"train_loss": -26.19392204284668, "global_step": 340422, "epoch": 4101} {"train_loss": -25.92970085144043, "global_step": 340423, "epoch": 4101} {"train_loss": -26.23316764831543, "global_step": 340424, "epoch": 4101} {"train_loss": -26.28582191467285, "global_step": 340425, "epoch": 4101} {"train_loss": -26.028478622436523, "global_step": 340426, "epoch": 4101} {"train_loss": -26.072265625, "global_step": 340427, "epoch": 4101} {"train_loss": -26.091474533081055, "global_step": 340428, "epoch": 4101} {"train_loss": -25.905750274658203, "global_step": 340429, "epoch": 4101} {"train_loss": -26.2122802734375, "global_step": 340430, "epoch": 4101} {"train_loss": -26.4277286529541, "global_step": 340431, "epoch": 4101} {"train_loss": -26.132028579711914, "global_step": 340432, "epoch": 4101} {"train_loss": -25.976659774780273, "global_step": 340433, "epoch": 4101} {"train_loss": -26.0605411529541, "global_step": 340434, "epoch": 4101} {"train_loss": -26.022916793823242, "global_step": 340435, "epoch": 4101} {"train_loss": -26.327558517456055, "global_step": 340436, "epoch": 4101} {"train_loss": -26.057992935180664, "global_step": 340437, "epoch": 4101} {"train_loss": -26.273584365844727, "global_step": 340438, "epoch": 4101} {"train_loss": -26.17987060546875, "global_step": 340439, "epoch": 4101} {"train_loss": -26.231796264648438, "global_step": 340440, "epoch": 4101} {"train_loss": -25.9045352935791, "global_step": 340441, "epoch": 4101} {"train_loss": -25.98240089416504, "global_step": 340442, "epoch": 4101} {"train_loss": -25.943037033081055, "global_step": 340443, "epoch": 4101} {"train_loss": -25.701129913330078, "global_step": 340444, "epoch": 4101} {"train_loss": -25.86924171447754, "global_step": 340445, "epoch": 4101} {"train_loss": -25.906570434570312, "global_step": 340446, "epoch": 4101} {"train_loss": -26.061132431030273, "global_step": 340447, "epoch": 4101} {"train_loss": -25.882165908813477, "global_step": 340448, "epoch": 4101} {"train_loss": -26.442245483398438, "global_step": 340449, "epoch": 4101} {"train_loss": -26.085058212280273, "global_step": 340450, "epoch": 4101} {"train_loss": -26.502811431884766, "global_step": 340451, "epoch": 4101} {"train_loss": -26.381702423095703, "global_step": 340452, "epoch": 4101} {"train_loss": -25.9808406829834, "global_step": 340453, "epoch": 4101} {"train_loss": -26.54511833190918, "global_step": 340454, "epoch": 4101} {"train_loss": -26.614805221557617, "global_step": 340455, "epoch": 4101} {"train_loss": -25.90728759765625, "global_step": 340456, "epoch": 4101} {"train_loss": -26.239423751831055, "global_step": 340457, "epoch": 4101} {"train_loss": -26.04835319519043, "global_step": 340458, "epoch": 4101} {"train_loss": -26.318689346313477, "global_step": 340459, "epoch": 4101} {"train_loss": -26.11077880859375, "global_step": 340460, "epoch": 4101} {"train_loss": -25.97096824645996, "global_step": 340461, "epoch": 4101} {"train_loss": -26.236974716186523, "global_step": 340462, "epoch": 4101} {"train_loss": -25.961231231689453, "global_step": 340463, "epoch": 4101} {"train_loss": -26.609949111938477, "global_step": 340464, "epoch": 4101} {"train_loss": -26.08687773095556, "global_step": 340465, "epoch": 4101, "val_loss": 6580380.0} {"train_loss": -25.818668365478516, "global_step": 340466, "epoch": 4102} {"train_loss": -25.311386108398438, "global_step": 340467, "epoch": 4102} {"train_loss": -24.932580947875977, "global_step": 340468, "epoch": 4102} {"train_loss": -24.801315307617188, "global_step": 340469, "epoch": 4102} {"train_loss": -25.625497817993164, "global_step": 340470, "epoch": 4102} {"train_loss": -25.940641403198242, "global_step": 340471, "epoch": 4102} {"train_loss": -25.20810317993164, "global_step": 340472, "epoch": 4102} {"train_loss": -25.4354305267334, "global_step": 340473, "epoch": 4102} {"train_loss": -25.40839195251465, "global_step": 340474, "epoch": 4102} {"train_loss": -25.618316650390625, "global_step": 340475, "epoch": 4102} {"train_loss": -25.393218994140625, "global_step": 340476, "epoch": 4102} {"train_loss": -25.626203536987305, "global_step": 340477, "epoch": 4102} {"train_loss": -25.629867553710938, "global_step": 340478, "epoch": 4102} {"train_loss": -25.700815200805664, "global_step": 340479, "epoch": 4102} {"train_loss": -25.603931427001953, "global_step": 340480, "epoch": 4102} {"train_loss": -26.116010665893555, "global_step": 340481, "epoch": 4102} {"train_loss": -25.78229331970215, "global_step": 340482, "epoch": 4102} {"train_loss": -25.781646728515625, "global_step": 340483, "epoch": 4102} {"train_loss": -25.588491439819336, "global_step": 340484, "epoch": 4102} {"train_loss": -25.996936798095703, "global_step": 340485, "epoch": 4102} {"train_loss": -25.608625411987305, "global_step": 340486, "epoch": 4102} {"train_loss": -25.738073348999023, "global_step": 340487, "epoch": 4102} {"train_loss": -25.657318115234375, "global_step": 340488, "epoch": 4102} {"train_loss": -25.746183395385742, "global_step": 340489, "epoch": 4102} {"train_loss": -26.13800048828125, "global_step": 340490, "epoch": 4102} {"train_loss": -25.601125717163086, "global_step": 340491, "epoch": 4102} {"train_loss": -25.8515567779541, "global_step": 340492, "epoch": 4102} {"train_loss": -26.1171875, "global_step": 340493, "epoch": 4102} {"train_loss": -25.96261978149414, "global_step": 340494, "epoch": 4102} {"train_loss": -26.24188804626465, "global_step": 340495, "epoch": 4102} {"train_loss": -25.675556182861328, "global_step": 340496, "epoch": 4102} {"train_loss": -25.56924819946289, "global_step": 340497, "epoch": 4102} {"train_loss": -25.9493350982666, "global_step": 340498, "epoch": 4102} {"train_loss": -26.309772491455078, "global_step": 340499, "epoch": 4102} {"train_loss": -25.87911033630371, "global_step": 340500, "epoch": 4102} {"train_loss": -25.882299423217773, "global_step": 340501, "epoch": 4102} {"train_loss": -26.112396240234375, "global_step": 340502, "epoch": 4102} {"train_loss": -26.480619430541992, "global_step": 340503, "epoch": 4102} {"train_loss": -26.230573654174805, "global_step": 340504, "epoch": 4102} {"train_loss": -26.0264892578125, "global_step": 340505, "epoch": 4102} {"train_loss": -25.93115234375, "global_step": 340506, "epoch": 4102} {"train_loss": -26.39179801940918, "global_step": 340507, "epoch": 4102} {"train_loss": -26.658491134643555, "global_step": 340508, "epoch": 4102} {"train_loss": -26.178211212158203, "global_step": 340509, "epoch": 4102} {"train_loss": -25.967792510986328, "global_step": 340510, "epoch": 4102} {"train_loss": -26.426074981689453, "global_step": 340511, "epoch": 4102} {"train_loss": -26.208770751953125, "global_step": 340512, "epoch": 4102} {"train_loss": -25.61447525024414, "global_step": 340513, "epoch": 4102} {"train_loss": -25.863386154174805, "global_step": 340514, "epoch": 4102} {"train_loss": -26.207870483398438, "global_step": 340515, "epoch": 4102} {"train_loss": -25.859556198120117, "global_step": 340516, "epoch": 4102} {"train_loss": -25.82630729675293, "global_step": 340517, "epoch": 4102} {"train_loss": -26.127429962158203, "global_step": 340518, "epoch": 4102} {"train_loss": -26.18212890625, "global_step": 340519, "epoch": 4102} {"train_loss": -26.054845809936523, "global_step": 340520, "epoch": 4102} {"train_loss": -26.452392578125, "global_step": 340521, "epoch": 4102} {"train_loss": -25.784849166870117, "global_step": 340522, "epoch": 4102} {"train_loss": -26.159210205078125, "global_step": 340523, "epoch": 4102} {"train_loss": -26.117177963256836, "global_step": 340524, "epoch": 4102} {"train_loss": -26.086166381835938, "global_step": 340525, "epoch": 4102} {"train_loss": -26.005191802978516, "global_step": 340526, "epoch": 4102} {"train_loss": -26.24165916442871, "global_step": 340527, "epoch": 4102} {"train_loss": -25.81403160095215, "global_step": 340528, "epoch": 4102} {"train_loss": -26.08075523376465, "global_step": 340529, "epoch": 4102} {"train_loss": -26.222471237182617, "global_step": 340530, "epoch": 4102} {"train_loss": -26.220300674438477, "global_step": 340531, "epoch": 4102} {"train_loss": -26.112091064453125, "global_step": 340532, "epoch": 4102} {"train_loss": -25.90203285217285, "global_step": 340533, "epoch": 4102} {"train_loss": -26.00421714782715, "global_step": 340534, "epoch": 4102} {"train_loss": -26.316980361938477, "global_step": 340535, "epoch": 4102} {"train_loss": -26.06366539001465, "global_step": 340536, "epoch": 4102} {"train_loss": -26.0609188079834, "global_step": 340537, "epoch": 4102} {"train_loss": -26.190404891967773, "global_step": 340538, "epoch": 4102} {"train_loss": -26.039600372314453, "global_step": 340539, "epoch": 4102} {"train_loss": -26.431119918823242, "global_step": 340540, "epoch": 4102} {"train_loss": -26.27203941345215, "global_step": 340541, "epoch": 4102} {"train_loss": -25.9929141998291, "global_step": 340542, "epoch": 4102} {"train_loss": -25.7105712890625, "global_step": 340543, "epoch": 4102} {"train_loss": -25.95762062072754, "global_step": 340544, "epoch": 4102} {"train_loss": -26.440587997436523, "global_step": 340545, "epoch": 4102} {"train_loss": -25.879209518432617, "global_step": 340546, "epoch": 4102} {"train_loss": -25.6977596282959, "global_step": 340547, "epoch": 4102} {"train_loss": -25.930944442749023, "global_step": 340548, "epoch": 4102, "val_loss": 6550758.0} {"train_loss": -25.958221435546875, "global_step": 340549, "epoch": 4103} {"train_loss": -25.305877685546875, "global_step": 340550, "epoch": 4103} {"train_loss": -25.34706687927246, "global_step": 340551, "epoch": 4103} {"train_loss": -26.201520919799805, "global_step": 340552, "epoch": 4103} {"train_loss": -25.64080810546875, "global_step": 340553, "epoch": 4103} {"train_loss": -25.648303985595703, "global_step": 340554, "epoch": 4103} {"train_loss": -25.678253173828125, "global_step": 340555, "epoch": 4103} {"train_loss": -25.938154220581055, "global_step": 340556, "epoch": 4103} {"train_loss": -26.178394317626953, "global_step": 340557, "epoch": 4103} {"train_loss": -26.025739669799805, "global_step": 340558, "epoch": 4103} {"train_loss": -25.85501480102539, "global_step": 340559, "epoch": 4103} {"train_loss": -25.799484252929688, "global_step": 340560, "epoch": 4103} {"train_loss": -26.02322769165039, "global_step": 340561, "epoch": 4103} {"train_loss": -25.554203033447266, "global_step": 340562, "epoch": 4103} {"train_loss": -26.245641708374023, "global_step": 340563, "epoch": 4103} {"train_loss": -26.30959129333496, "global_step": 340564, "epoch": 4103} {"train_loss": -26.325305938720703, "global_step": 340565, "epoch": 4103} {"train_loss": -25.915790557861328, "global_step": 340566, "epoch": 4103} {"train_loss": -26.078886032104492, "global_step": 340567, "epoch": 4103} {"train_loss": -25.92303466796875, "global_step": 340568, "epoch": 4103} {"train_loss": -26.290206909179688, "global_step": 340569, "epoch": 4103} {"train_loss": -26.218534469604492, "global_step": 340570, "epoch": 4103} {"train_loss": -26.243804931640625, "global_step": 340571, "epoch": 4103} {"train_loss": -25.978002548217773, "global_step": 340572, "epoch": 4103} {"train_loss": -26.406335830688477, "global_step": 340573, "epoch": 4103} {"train_loss": -26.122465133666992, "global_step": 340574, "epoch": 4103} {"train_loss": -26.3243350982666, "global_step": 340575, "epoch": 4103} {"train_loss": -26.068527221679688, "global_step": 340576, "epoch": 4103} {"train_loss": -26.072973251342773, "global_step": 340577, "epoch": 4103} {"train_loss": -26.47454261779785, "global_step": 340578, "epoch": 4103} {"train_loss": -25.746686935424805, "global_step": 340579, "epoch": 4103} {"train_loss": -26.10953712463379, "global_step": 340580, "epoch": 4103} {"train_loss": -25.86504554748535, "global_step": 340581, "epoch": 4103} {"train_loss": -25.664081573486328, "global_step": 340582, "epoch": 4103} {"train_loss": -26.042037963867188, "global_step": 340583, "epoch": 4103} {"train_loss": -26.128774642944336, "global_step": 340584, "epoch": 4103} {"train_loss": -25.896265029907227, "global_step": 340585, "epoch": 4103} {"train_loss": -26.147912979125977, "global_step": 340586, "epoch": 4103} {"train_loss": -26.044605255126953, "global_step": 340587, "epoch": 4103} {"train_loss": -26.1332950592041, "global_step": 340588, "epoch": 4103} {"train_loss": -26.391340255737305, "global_step": 340589, "epoch": 4103} {"train_loss": -26.03228187561035, "global_step": 340590, "epoch": 4103} {"train_loss": -26.105438232421875, "global_step": 340591, "epoch": 4103} {"train_loss": -25.868927001953125, "global_step": 340592, "epoch": 4103} {"train_loss": -26.136707305908203, "global_step": 340593, "epoch": 4103} {"train_loss": -26.255456924438477, "global_step": 340594, "epoch": 4103} {"train_loss": -26.050357818603516, "global_step": 340595, "epoch": 4103} {"train_loss": -26.308979034423828, "global_step": 340596, "epoch": 4103} {"train_loss": -26.173322677612305, "global_step": 340597, "epoch": 4103} {"train_loss": -25.800495147705078, "global_step": 340598, "epoch": 4103} {"train_loss": -25.939558029174805, "global_step": 340599, "epoch": 4103} {"train_loss": -25.52998924255371, "global_step": 340600, "epoch": 4103} {"train_loss": -25.601709365844727, "global_step": 340601, "epoch": 4103} {"train_loss": -25.457456588745117, "global_step": 340602, "epoch": 4103} {"train_loss": -25.8226261138916, "global_step": 340603, "epoch": 4103} {"train_loss": -26.092727661132812, "global_step": 340604, "epoch": 4103} {"train_loss": -25.920196533203125, "global_step": 340605, "epoch": 4103} {"train_loss": -25.93995475769043, "global_step": 340606, "epoch": 4103} {"train_loss": -26.07151222229004, "global_step": 340607, "epoch": 4103} {"train_loss": -25.902124404907227, "global_step": 340608, "epoch": 4103} {"train_loss": -25.96811294555664, "global_step": 340609, "epoch": 4103} {"train_loss": -26.265363693237305, "global_step": 340610, "epoch": 4103} {"train_loss": -25.996923446655273, "global_step": 340611, "epoch": 4103} {"train_loss": -25.983896255493164, "global_step": 340612, "epoch": 4103} {"train_loss": -25.876026153564453, "global_step": 340613, "epoch": 4103} {"train_loss": -26.009069442749023, "global_step": 340614, "epoch": 4103} {"train_loss": -25.88372230529785, "global_step": 340615, "epoch": 4103} {"train_loss": -26.43109130859375, "global_step": 340616, "epoch": 4103} {"train_loss": -26.055429458618164, "global_step": 340617, "epoch": 4103} {"train_loss": -25.80484962463379, "global_step": 340618, "epoch": 4103} {"train_loss": -26.243066787719727, "global_step": 340619, "epoch": 4103} {"train_loss": -26.2607364654541, "global_step": 340620, "epoch": 4103} {"train_loss": -26.19061851501465, "global_step": 340621, "epoch": 4103} {"train_loss": -26.164825439453125, "global_step": 340622, "epoch": 4103} {"train_loss": -26.11592674255371, "global_step": 340623, "epoch": 4103} {"train_loss": -26.348026275634766, "global_step": 340624, "epoch": 4103} {"train_loss": -25.934782028198242, "global_step": 340625, "epoch": 4103} {"train_loss": -26.014001846313477, "global_step": 340626, "epoch": 4103} {"train_loss": -26.16482925415039, "global_step": 340627, "epoch": 4103} {"train_loss": -26.471506118774414, "global_step": 340628, "epoch": 4103} {"train_loss": -25.909997940063477, "global_step": 340629, "epoch": 4103} {"train_loss": -25.972497940063477, "global_step": 340630, "epoch": 4103} {"train_loss": -26.026521682739258, "global_step": 340631, "epoch": 4103, "val_loss": 6611712.0} {"train_loss": -26.0107364654541, "global_step": 340632, "epoch": 4104} {"train_loss": -25.67774772644043, "global_step": 340633, "epoch": 4104} {"train_loss": -25.644515991210938, "global_step": 340634, "epoch": 4104} {"train_loss": -25.420263290405273, "global_step": 340635, "epoch": 4104} {"train_loss": -25.666107177734375, "global_step": 340636, "epoch": 4104} {"train_loss": -25.575666427612305, "global_step": 340637, "epoch": 4104} {"train_loss": -25.958703994750977, "global_step": 340638, "epoch": 4104} {"train_loss": -25.955183029174805, "global_step": 340639, "epoch": 4104} {"train_loss": -25.76753807067871, "global_step": 340640, "epoch": 4104} {"train_loss": -25.306442260742188, "global_step": 340641, "epoch": 4104} {"train_loss": -25.84153175354004, "global_step": 340642, "epoch": 4104} {"train_loss": -26.005603790283203, "global_step": 340643, "epoch": 4104} {"train_loss": -25.33066177368164, "global_step": 340644, "epoch": 4104} {"train_loss": -25.855390548706055, "global_step": 340645, "epoch": 4104} {"train_loss": -25.75093650817871, "global_step": 340646, "epoch": 4104} {"train_loss": -26.036209106445312, "global_step": 340647, "epoch": 4104} {"train_loss": -26.005146026611328, "global_step": 340648, "epoch": 4104} {"train_loss": -25.9205322265625, "global_step": 340649, "epoch": 4104} {"train_loss": -26.020124435424805, "global_step": 340650, "epoch": 4104} {"train_loss": -25.63534927368164, "global_step": 340651, "epoch": 4104} {"train_loss": -25.871017456054688, "global_step": 340652, "epoch": 4104} {"train_loss": -26.085351943969727, "global_step": 340653, "epoch": 4104} {"train_loss": -26.00876235961914, "global_step": 340654, "epoch": 4104} {"train_loss": -26.330337524414062, "global_step": 340655, "epoch": 4104} {"train_loss": -26.13844108581543, "global_step": 340656, "epoch": 4104} {"train_loss": -26.03949546813965, "global_step": 340657, "epoch": 4104} {"train_loss": -25.840621948242188, "global_step": 340658, "epoch": 4104} {"train_loss": -26.18361473083496, "global_step": 340659, "epoch": 4104} {"train_loss": -25.990278244018555, "global_step": 340660, "epoch": 4104} {"train_loss": -26.3498592376709, "global_step": 340661, "epoch": 4104} {"train_loss": -26.432722091674805, "global_step": 340662, "epoch": 4104} {"train_loss": -25.72269630432129, "global_step": 340663, "epoch": 4104} {"train_loss": -25.812255859375, "global_step": 340664, "epoch": 4104} {"train_loss": -26.4771785736084, "global_step": 340665, "epoch": 4104} {"train_loss": -26.108503341674805, "global_step": 340666, "epoch": 4104} {"train_loss": -25.800861358642578, "global_step": 340667, "epoch": 4104} {"train_loss": -26.004541397094727, "global_step": 340668, "epoch": 4104} {"train_loss": -25.979293823242188, "global_step": 340669, "epoch": 4104} {"train_loss": -26.319746017456055, "global_step": 340670, "epoch": 4104} {"train_loss": -25.9377384185791, "global_step": 340671, "epoch": 4104} {"train_loss": -26.180532455444336, "global_step": 340672, "epoch": 4104} {"train_loss": -26.094900131225586, "global_step": 340673, "epoch": 4104} {"train_loss": -26.321680068969727, "global_step": 340674, "epoch": 4104} {"train_loss": -26.247974395751953, "global_step": 340675, "epoch": 4104} {"train_loss": -26.17766761779785, "global_step": 340676, "epoch": 4104} {"train_loss": -26.411630630493164, "global_step": 340677, "epoch": 4104} {"train_loss": -26.196277618408203, "global_step": 340678, "epoch": 4104} {"train_loss": -26.182355880737305, "global_step": 340679, "epoch": 4104} {"train_loss": -26.296289443969727, "global_step": 340680, "epoch": 4104} {"train_loss": -26.1555233001709, "global_step": 340681, "epoch": 4104} {"train_loss": -26.387304306030273, "global_step": 340682, "epoch": 4104} {"train_loss": -26.470361709594727, "global_step": 340683, "epoch": 4104} {"train_loss": -26.303253173828125, "global_step": 340684, "epoch": 4104} {"train_loss": -26.43995475769043, "global_step": 340685, "epoch": 4104} {"train_loss": -25.947586059570312, "global_step": 340686, "epoch": 4104} {"train_loss": -26.20757484436035, "global_step": 340687, "epoch": 4104} {"train_loss": -26.030517578125, "global_step": 340688, "epoch": 4104} {"train_loss": -26.233102798461914, "global_step": 340689, "epoch": 4104} {"train_loss": -26.23932456970215, "global_step": 340690, "epoch": 4104} {"train_loss": -25.72237205505371, "global_step": 340691, "epoch": 4104} {"train_loss": -25.808435440063477, "global_step": 340692, "epoch": 4104} {"train_loss": -26.05085563659668, "global_step": 340693, "epoch": 4104} {"train_loss": -25.905073165893555, "global_step": 340694, "epoch": 4104} {"train_loss": -25.926748275756836, "global_step": 340695, "epoch": 4104} {"train_loss": -26.028772354125977, "global_step": 340696, "epoch": 4104} {"train_loss": -26.055469512939453, "global_step": 340697, "epoch": 4104} {"train_loss": -25.740930557250977, "global_step": 340698, "epoch": 4104} {"train_loss": -26.025609970092773, "global_step": 340699, "epoch": 4104} {"train_loss": -25.913776397705078, "global_step": 340700, "epoch": 4104} {"train_loss": -25.678403854370117, "global_step": 340701, "epoch": 4104} {"train_loss": -25.5578670501709, "global_step": 340702, "epoch": 4104} {"train_loss": -26.136884689331055, "global_step": 340703, "epoch": 4104} {"train_loss": -25.752233505249023, "global_step": 340704, "epoch": 4104} {"train_loss": -26.00921058654785, "global_step": 340705, "epoch": 4104} {"train_loss": -26.35675048828125, "global_step": 340706, "epoch": 4104} {"train_loss": -25.707284927368164, "global_step": 340707, "epoch": 4104} {"train_loss": -25.753686904907227, "global_step": 340708, "epoch": 4104} {"train_loss": -25.588804244995117, "global_step": 340709, "epoch": 4104} {"train_loss": -26.168472290039062, "global_step": 340710, "epoch": 4104} {"train_loss": -26.12299919128418, "global_step": 340711, "epoch": 4104} {"train_loss": -25.521127700805664, "global_step": 340712, "epoch": 4104} {"train_loss": -26.137054443359375, "global_step": 340713, "epoch": 4104} {"train_loss": -26.0041045453175, "global_step": 340714, "epoch": 4104, "val_loss": 6644350.0} {"train_loss": -25.701486587524414, "global_step": 340715, "epoch": 4105} {"train_loss": -25.3902645111084, "global_step": 340716, "epoch": 4105} {"train_loss": -25.904296875, "global_step": 340717, "epoch": 4105} {"train_loss": -25.67563247680664, "global_step": 340718, "epoch": 4105} {"train_loss": -25.726099014282227, "global_step": 340719, "epoch": 4105} {"train_loss": -25.025482177734375, "global_step": 340720, "epoch": 4105} {"train_loss": -25.658185958862305, "global_step": 340721, "epoch": 4105} {"train_loss": -25.42388343811035, "global_step": 340722, "epoch": 4105} {"train_loss": -26.035491943359375, "global_step": 340723, "epoch": 4105} {"train_loss": -25.79457664489746, "global_step": 340724, "epoch": 4105} {"train_loss": -26.06707763671875, "global_step": 340725, "epoch": 4105} {"train_loss": -25.97858238220215, "global_step": 340726, "epoch": 4105} {"train_loss": -26.019779205322266, "global_step": 340727, "epoch": 4105} {"train_loss": -25.658004760742188, "global_step": 340728, "epoch": 4105} {"train_loss": -25.576948165893555, "global_step": 340729, "epoch": 4105} {"train_loss": -26.463897705078125, "global_step": 340730, "epoch": 4105} {"train_loss": -25.8865909576416, "global_step": 340731, "epoch": 4105} {"train_loss": -25.859638214111328, "global_step": 340732, "epoch": 4105} {"train_loss": -26.100238800048828, "global_step": 340733, "epoch": 4105} {"train_loss": -26.0955753326416, "global_step": 340734, "epoch": 4105} {"train_loss": -25.864877700805664, "global_step": 340735, "epoch": 4105} {"train_loss": -26.008865356445312, "global_step": 340736, "epoch": 4105} {"train_loss": -25.759021759033203, "global_step": 340737, "epoch": 4105} {"train_loss": -25.755422592163086, "global_step": 340738, "epoch": 4105} {"train_loss": -26.01601219177246, "global_step": 340739, "epoch": 4105} {"train_loss": -26.012075424194336, "global_step": 340740, "epoch": 4105} {"train_loss": -25.72601890563965, "global_step": 340741, "epoch": 4105} {"train_loss": -26.074390411376953, "global_step": 340742, "epoch": 4105} {"train_loss": -26.229095458984375, "global_step": 340743, "epoch": 4105} {"train_loss": -26.02044677734375, "global_step": 340744, "epoch": 4105} {"train_loss": -25.93354606628418, "global_step": 340745, "epoch": 4105} {"train_loss": -25.687742233276367, "global_step": 340746, "epoch": 4105} {"train_loss": -26.27618980407715, "global_step": 340747, "epoch": 4105} {"train_loss": -25.87502098083496, "global_step": 340748, "epoch": 4105} {"train_loss": -26.09928321838379, "global_step": 340749, "epoch": 4105} {"train_loss": -25.89679527282715, "global_step": 340750, "epoch": 4105} {"train_loss": -26.101205825805664, "global_step": 340751, "epoch": 4105} {"train_loss": -26.396533966064453, "global_step": 340752, "epoch": 4105} {"train_loss": -26.078458786010742, "global_step": 340753, "epoch": 4105} {"train_loss": -25.621484756469727, "global_step": 340754, "epoch": 4105} {"train_loss": -26.108449935913086, "global_step": 340755, "epoch": 4105} {"train_loss": -26.47994041442871, "global_step": 340756, "epoch": 4105} {"train_loss": -26.04176902770996, "global_step": 340757, "epoch": 4105} {"train_loss": -26.515033721923828, "global_step": 340758, "epoch": 4105} {"train_loss": -26.131391525268555, "global_step": 340759, "epoch": 4105} {"train_loss": -26.042083740234375, "global_step": 340760, "epoch": 4105} {"train_loss": -25.688568115234375, "global_step": 340761, "epoch": 4105} {"train_loss": -26.121997833251953, "global_step": 340762, "epoch": 4105} {"train_loss": -26.069379806518555, "global_step": 340763, "epoch": 4105} {"train_loss": -25.7542667388916, "global_step": 340764, "epoch": 4105} {"train_loss": -25.881017684936523, "global_step": 340765, "epoch": 4105} {"train_loss": -25.390485763549805, "global_step": 340766, "epoch": 4105} {"train_loss": -26.17009925842285, "global_step": 340767, "epoch": 4105} {"train_loss": -25.75510025024414, "global_step": 340768, "epoch": 4105} {"train_loss": -25.49681854248047, "global_step": 340769, "epoch": 4105} {"train_loss": -26.17919921875, "global_step": 340770, "epoch": 4105} {"train_loss": -26.174530029296875, "global_step": 340771, "epoch": 4105} {"train_loss": -25.79498291015625, "global_step": 340772, "epoch": 4105} {"train_loss": -25.742795944213867, "global_step": 340773, "epoch": 4105} {"train_loss": -25.952077865600586, "global_step": 340774, "epoch": 4105} {"train_loss": -26.0103702545166, "global_step": 340775, "epoch": 4105} {"train_loss": -25.81339454650879, "global_step": 340776, "epoch": 4105} {"train_loss": -25.82386589050293, "global_step": 340777, "epoch": 4105} {"train_loss": -25.806982040405273, "global_step": 340778, "epoch": 4105} {"train_loss": -25.937707901000977, "global_step": 340779, "epoch": 4105} {"train_loss": -25.68882179260254, "global_step": 340780, "epoch": 4105} {"train_loss": -26.037382125854492, "global_step": 340781, "epoch": 4105} {"train_loss": -25.636402130126953, "global_step": 340782, "epoch": 4105} {"train_loss": -26.0943546295166, "global_step": 340783, "epoch": 4105} {"train_loss": -25.93448257446289, "global_step": 340784, "epoch": 4105} {"train_loss": -26.176481246948242, "global_step": 340785, "epoch": 4105} {"train_loss": -26.306659698486328, "global_step": 340786, "epoch": 4105} {"train_loss": -26.184141159057617, "global_step": 340787, "epoch": 4105} {"train_loss": -25.96160316467285, "global_step": 340788, "epoch": 4105} {"train_loss": -26.236419677734375, "global_step": 340789, "epoch": 4105} {"train_loss": -26.3504695892334, "global_step": 340790, "epoch": 4105} {"train_loss": -26.1293888092041, "global_step": 340791, "epoch": 4105} {"train_loss": -26.0579891204834, "global_step": 340792, "epoch": 4105} {"train_loss": -26.29509925842285, "global_step": 340793, "epoch": 4105} {"train_loss": -26.281448364257812, "global_step": 340794, "epoch": 4105} {"train_loss": -25.8727970123291, "global_step": 340795, "epoch": 4105} {"train_loss": -26.09256362915039, "global_step": 340796, "epoch": 4105} {"train_loss": -25.93682838348021, "global_step": 340797, "epoch": 4105, "val_loss": 6606469.0} {"train_loss": -25.386545181274414, "global_step": 340798, "epoch": 4106} {"train_loss": -26.31048011779785, "global_step": 340799, "epoch": 4106} {"train_loss": -25.584228515625, "global_step": 340800, "epoch": 4106} {"train_loss": -25.76653480529785, "global_step": 340801, "epoch": 4106} {"train_loss": -26.048349380493164, "global_step": 340802, "epoch": 4106} {"train_loss": -26.167224884033203, "global_step": 340803, "epoch": 4106} {"train_loss": -25.699695587158203, "global_step": 340804, "epoch": 4106} {"train_loss": -25.63687515258789, "global_step": 340805, "epoch": 4106} {"train_loss": -25.745737075805664, "global_step": 340806, "epoch": 4106} {"train_loss": -25.6152400970459, "global_step": 340807, "epoch": 4106} {"train_loss": -25.845794677734375, "global_step": 340808, "epoch": 4106} {"train_loss": -25.806737899780273, "global_step": 340809, "epoch": 4106} {"train_loss": -26.04266929626465, "global_step": 340810, "epoch": 4106} {"train_loss": -25.46632194519043, "global_step": 340811, "epoch": 4106} {"train_loss": -25.918975830078125, "global_step": 340812, "epoch": 4106} {"train_loss": -26.043970108032227, "global_step": 340813, "epoch": 4106} {"train_loss": -25.787900924682617, "global_step": 340814, "epoch": 4106} {"train_loss": -25.514982223510742, "global_step": 340815, "epoch": 4106} {"train_loss": -25.997852325439453, "global_step": 340816, "epoch": 4106} {"train_loss": -25.991628646850586, "global_step": 340817, "epoch": 4106} {"train_loss": -26.03983497619629, "global_step": 340818, "epoch": 4106} {"train_loss": -25.986774444580078, "global_step": 340819, "epoch": 4106} {"train_loss": -26.14580726623535, "global_step": 340820, "epoch": 4106} {"train_loss": -26.270544052124023, "global_step": 340821, "epoch": 4106} {"train_loss": -25.858325958251953, "global_step": 340822, "epoch": 4106} {"train_loss": -25.860401153564453, "global_step": 340823, "epoch": 4106} {"train_loss": -25.782201766967773, "global_step": 340824, "epoch": 4106} {"train_loss": -26.001920700073242, "global_step": 340825, "epoch": 4106} {"train_loss": -26.095808029174805, "global_step": 340826, "epoch": 4106} {"train_loss": -26.0211124420166, "global_step": 340827, "epoch": 4106} {"train_loss": -25.937875747680664, "global_step": 340828, "epoch": 4106} {"train_loss": -26.494848251342773, "global_step": 340829, "epoch": 4106} {"train_loss": -26.3009033203125, "global_step": 340830, "epoch": 4106} {"train_loss": -26.181034088134766, "global_step": 340831, "epoch": 4106} {"train_loss": -25.968341827392578, "global_step": 340832, "epoch": 4106} {"train_loss": -26.30033302307129, "global_step": 340833, "epoch": 4106} {"train_loss": -25.893157958984375, "global_step": 340834, "epoch": 4106} {"train_loss": -25.88223648071289, "global_step": 340835, "epoch": 4106} {"train_loss": -26.160633087158203, "global_step": 340836, "epoch": 4106} {"train_loss": -26.07612419128418, "global_step": 340837, "epoch": 4106} {"train_loss": -26.174564361572266, "global_step": 340838, "epoch": 4106} {"train_loss": -25.98615074157715, "global_step": 340839, "epoch": 4106} {"train_loss": -26.248504638671875, "global_step": 340840, "epoch": 4106} {"train_loss": -26.42390251159668, "global_step": 340841, "epoch": 4106} {"train_loss": -26.138092041015625, "global_step": 340842, "epoch": 4106} {"train_loss": -26.085254669189453, "global_step": 340843, "epoch": 4106} {"train_loss": -26.537595748901367, "global_step": 340844, "epoch": 4106} {"train_loss": -26.165882110595703, "global_step": 340845, "epoch": 4106} {"train_loss": -26.307052612304688, "global_step": 340846, "epoch": 4106} {"train_loss": -26.032560348510742, "global_step": 340847, "epoch": 4106} {"train_loss": -26.16255760192871, "global_step": 340848, "epoch": 4106} {"train_loss": -26.533926010131836, "global_step": 340849, "epoch": 4106} {"train_loss": -26.66904067993164, "global_step": 340850, "epoch": 4106} {"train_loss": -26.007404327392578, "global_step": 340851, "epoch": 4106} {"train_loss": -25.903345108032227, "global_step": 340852, "epoch": 4106} {"train_loss": -25.943084716796875, "global_step": 340853, "epoch": 4106} {"train_loss": -25.897748947143555, "global_step": 340854, "epoch": 4106} {"train_loss": -25.697839736938477, "global_step": 340855, "epoch": 4106} {"train_loss": -26.11867332458496, "global_step": 340856, "epoch": 4106} {"train_loss": -25.97926902770996, "global_step": 340857, "epoch": 4106} {"train_loss": -26.074705123901367, "global_step": 340858, "epoch": 4106} {"train_loss": -25.954513549804688, "global_step": 340859, "epoch": 4106} {"train_loss": -26.13242530822754, "global_step": 340860, "epoch": 4106} {"train_loss": -26.547122955322266, "global_step": 340861, "epoch": 4106} {"train_loss": -25.948408126831055, "global_step": 340862, "epoch": 4106} {"train_loss": -25.941070556640625, "global_step": 340863, "epoch": 4106} {"train_loss": -26.25594139099121, "global_step": 340864, "epoch": 4106} {"train_loss": -26.1107177734375, "global_step": 340865, "epoch": 4106} {"train_loss": -26.163135528564453, "global_step": 340866, "epoch": 4106} {"train_loss": -26.348480224609375, "global_step": 340867, "epoch": 4106} {"train_loss": -25.653324127197266, "global_step": 340868, "epoch": 4106} {"train_loss": -25.86493492126465, "global_step": 340869, "epoch": 4106} {"train_loss": -26.292673110961914, "global_step": 340870, "epoch": 4106} {"train_loss": -26.363677978515625, "global_step": 340871, "epoch": 4106} {"train_loss": -26.290021896362305, "global_step": 340872, "epoch": 4106} {"train_loss": -26.2520809173584, "global_step": 340873, "epoch": 4106} {"train_loss": -25.888538360595703, "global_step": 340874, "epoch": 4106} {"train_loss": -26.152429580688477, "global_step": 340875, "epoch": 4106} {"train_loss": -25.900014877319336, "global_step": 340876, "epoch": 4106} {"train_loss": -25.99428367614746, "global_step": 340877, "epoch": 4106} {"train_loss": -26.338226318359375, "global_step": 340878, "epoch": 4106} {"train_loss": -26.227888107299805, "global_step": 340879, "epoch": 4106} {"train_loss": -26.038952563182416, "global_step": 340880, "epoch": 4106, "val_loss": 6602718.0} {"train_loss": -24.926441192626953, "global_step": 340881, "epoch": 4107} {"train_loss": -24.979764938354492, "global_step": 340882, "epoch": 4107} {"train_loss": -25.842376708984375, "global_step": 340883, "epoch": 4107} {"train_loss": -25.7474422454834, "global_step": 340884, "epoch": 4107} {"train_loss": -24.931325912475586, "global_step": 340885, "epoch": 4107} {"train_loss": -25.78899574279785, "global_step": 340886, "epoch": 4107} {"train_loss": -25.91944694519043, "global_step": 340887, "epoch": 4107} {"train_loss": -25.35226821899414, "global_step": 340888, "epoch": 4107} {"train_loss": -25.970947265625, "global_step": 340889, "epoch": 4107} {"train_loss": -26.020009994506836, "global_step": 340890, "epoch": 4107} {"train_loss": -25.91806411743164, "global_step": 340891, "epoch": 4107} {"train_loss": -26.236356735229492, "global_step": 340892, "epoch": 4107} {"train_loss": -26.139434814453125, "global_step": 340893, "epoch": 4107} {"train_loss": -25.788034439086914, "global_step": 340894, "epoch": 4107} {"train_loss": -26.168975830078125, "global_step": 340895, "epoch": 4107} {"train_loss": -26.314123153686523, "global_step": 340896, "epoch": 4107} {"train_loss": -26.055713653564453, "global_step": 340897, "epoch": 4107} {"train_loss": -26.216907501220703, "global_step": 340898, "epoch": 4107} {"train_loss": -26.035741806030273, "global_step": 340899, "epoch": 4107} {"train_loss": -26.011932373046875, "global_step": 340900, "epoch": 4107} {"train_loss": -26.015493392944336, "global_step": 340901, "epoch": 4107} {"train_loss": -26.19764518737793, "global_step": 340902, "epoch": 4107} {"train_loss": -26.410247802734375, "global_step": 340903, "epoch": 4107} {"train_loss": -26.024555206298828, "global_step": 340904, "epoch": 4107} {"train_loss": -26.07779312133789, "global_step": 340905, "epoch": 4107} {"train_loss": -26.421783447265625, "global_step": 340906, "epoch": 4107} {"train_loss": -26.037384033203125, "global_step": 340907, "epoch": 4107} {"train_loss": -25.96280288696289, "global_step": 340908, "epoch": 4107} {"train_loss": -26.24567985534668, "global_step": 340909, "epoch": 4107} {"train_loss": -26.279468536376953, "global_step": 340910, "epoch": 4107} {"train_loss": -25.67020034790039, "global_step": 340911, "epoch": 4107} {"train_loss": -25.94724464416504, "global_step": 340912, "epoch": 4107} {"train_loss": -26.366159439086914, "global_step": 340913, "epoch": 4107} {"train_loss": -25.622289657592773, "global_step": 340914, "epoch": 4107} {"train_loss": -26.252288818359375, "global_step": 340915, "epoch": 4107} {"train_loss": -25.900251388549805, "global_step": 340916, "epoch": 4107} {"train_loss": -26.228723526000977, "global_step": 340917, "epoch": 4107} {"train_loss": -26.397171020507812, "global_step": 340918, "epoch": 4107} {"train_loss": -26.033084869384766, "global_step": 340919, "epoch": 4107} {"train_loss": -25.903045654296875, "global_step": 340920, "epoch": 4107} {"train_loss": -26.079833984375, "global_step": 340921, "epoch": 4107} {"train_loss": -26.131681442260742, "global_step": 340922, "epoch": 4107} {"train_loss": -26.040674209594727, "global_step": 340923, "epoch": 4107} {"train_loss": -26.06960105895996, "global_step": 340924, "epoch": 4107} {"train_loss": -25.823530197143555, "global_step": 340925, "epoch": 4107} {"train_loss": -26.245901107788086, "global_step": 340926, "epoch": 4107} {"train_loss": -26.004220962524414, "global_step": 340927, "epoch": 4107} {"train_loss": -25.355792999267578, "global_step": 340928, "epoch": 4107} {"train_loss": -25.883275985717773, "global_step": 340929, "epoch": 4107} {"train_loss": -26.021360397338867, "global_step": 340930, "epoch": 4107} {"train_loss": -26.0726261138916, "global_step": 340931, "epoch": 4107} {"train_loss": -25.947553634643555, "global_step": 340932, "epoch": 4107} {"train_loss": -26.36343765258789, "global_step": 340933, "epoch": 4107} {"train_loss": -26.146284103393555, "global_step": 340934, "epoch": 4107} {"train_loss": -26.415002822875977, "global_step": 340935, "epoch": 4107} {"train_loss": -26.04444694519043, "global_step": 340936, "epoch": 4107} {"train_loss": -25.896726608276367, "global_step": 340937, "epoch": 4107} {"train_loss": -25.993371963500977, "global_step": 340938, "epoch": 4107} {"train_loss": -26.098464965820312, "global_step": 340939, "epoch": 4107} {"train_loss": -26.133514404296875, "global_step": 340940, "epoch": 4107} {"train_loss": -25.695316314697266, "global_step": 340941, "epoch": 4107} {"train_loss": -25.79043960571289, "global_step": 340942, "epoch": 4107} {"train_loss": -25.46699333190918, "global_step": 340943, "epoch": 4107} {"train_loss": -25.995975494384766, "global_step": 340944, "epoch": 4107} {"train_loss": -26.01031494140625, "global_step": 340945, "epoch": 4107} {"train_loss": -25.899688720703125, "global_step": 340946, "epoch": 4107} {"train_loss": -26.28529930114746, "global_step": 340947, "epoch": 4107} {"train_loss": -26.292037963867188, "global_step": 340948, "epoch": 4107} {"train_loss": -26.156452178955078, "global_step": 340949, "epoch": 4107} {"train_loss": -26.168981552124023, "global_step": 340950, "epoch": 4107} {"train_loss": -26.066129684448242, "global_step": 340951, "epoch": 4107} {"train_loss": -25.94306755065918, "global_step": 340952, "epoch": 4107} {"train_loss": -26.205774307250977, "global_step": 340953, "epoch": 4107} {"train_loss": -26.118497848510742, "global_step": 340954, "epoch": 4107} {"train_loss": -26.028213500976562, "global_step": 340955, "epoch": 4107} {"train_loss": -26.357358932495117, "global_step": 340956, "epoch": 4107} {"train_loss": -25.8720703125, "global_step": 340957, "epoch": 4107} {"train_loss": -25.737335205078125, "global_step": 340958, "epoch": 4107} {"train_loss": -26.198957443237305, "global_step": 340959, "epoch": 4107} {"train_loss": -25.898893356323242, "global_step": 340960, "epoch": 4107} {"train_loss": -26.301733016967773, "global_step": 340961, "epoch": 4107} {"train_loss": -25.75058937072754, "global_step": 340962, "epoch": 4107} {"train_loss": -25.99464455570083, "global_step": 340963, "epoch": 4107, "val_loss": 6592015.5} {"train_loss": -25.89015769958496, "global_step": 340964, "epoch": 4108} {"train_loss": -25.735050201416016, "global_step": 340965, "epoch": 4108} {"train_loss": -25.68304443359375, "global_step": 340966, "epoch": 4108} {"train_loss": -25.681156158447266, "global_step": 340967, "epoch": 4108} {"train_loss": -25.760976791381836, "global_step": 340968, "epoch": 4108} {"train_loss": -25.016857147216797, "global_step": 340969, "epoch": 4108} {"train_loss": -25.49764633178711, "global_step": 340970, "epoch": 4108} {"train_loss": -25.731098175048828, "global_step": 340971, "epoch": 4108} {"train_loss": -25.880102157592773, "global_step": 340972, "epoch": 4108} {"train_loss": -25.674625396728516, "global_step": 340973, "epoch": 4108} {"train_loss": -26.07745933532715, "global_step": 340974, "epoch": 4108} {"train_loss": -25.931604385375977, "global_step": 340975, "epoch": 4108} {"train_loss": -25.767963409423828, "global_step": 340976, "epoch": 4108} {"train_loss": -26.125009536743164, "global_step": 340977, "epoch": 4108} {"train_loss": -25.743732452392578, "global_step": 340978, "epoch": 4108} {"train_loss": -25.319684982299805, "global_step": 340979, "epoch": 4108} {"train_loss": -25.79947853088379, "global_step": 340980, "epoch": 4108} {"train_loss": -25.80074119567871, "global_step": 340981, "epoch": 4108} {"train_loss": -26.1673641204834, "global_step": 340982, "epoch": 4108} {"train_loss": -26.26997184753418, "global_step": 340983, "epoch": 4108} {"train_loss": -25.778528213500977, "global_step": 340984, "epoch": 4108} {"train_loss": -26.279972076416016, "global_step": 340985, "epoch": 4108} {"train_loss": -25.790119171142578, "global_step": 340986, "epoch": 4108} {"train_loss": -26.181110382080078, "global_step": 340987, "epoch": 4108} {"train_loss": -26.177297592163086, "global_step": 340988, "epoch": 4108} {"train_loss": -26.0831241607666, "global_step": 340989, "epoch": 4108} {"train_loss": -25.990955352783203, "global_step": 340990, "epoch": 4108} {"train_loss": -26.49683952331543, "global_step": 340991, "epoch": 4108} {"train_loss": -26.043798446655273, "global_step": 340992, "epoch": 4108} {"train_loss": -25.939695358276367, "global_step": 340993, "epoch": 4108} {"train_loss": -26.126733779907227, "global_step": 340994, "epoch": 4108} {"train_loss": -26.205097198486328, "global_step": 340995, "epoch": 4108} {"train_loss": -26.209630966186523, "global_step": 340996, "epoch": 4108} {"train_loss": -26.05415916442871, "global_step": 340997, "epoch": 4108} {"train_loss": -26.179630279541016, "global_step": 340998, "epoch": 4108} {"train_loss": -25.947229385375977, "global_step": 340999, "epoch": 4108} {"train_loss": -26.05122184753418, "global_step": 341000, "epoch": 4108} {"train_loss": -25.991430282592773, "global_step": 341001, "epoch": 4108} {"train_loss": -26.300079345703125, "global_step": 341002, "epoch": 4108} {"train_loss": -26.462726593017578, "global_step": 341003, "epoch": 4108} {"train_loss": -26.41449546813965, "global_step": 341004, "epoch": 4108} {"train_loss": -26.227933883666992, "global_step": 341005, "epoch": 4108} {"train_loss": -26.069995880126953, "global_step": 341006, "epoch": 4108} {"train_loss": -26.234750747680664, "global_step": 341007, "epoch": 4108} {"train_loss": -26.352783203125, "global_step": 341008, "epoch": 4108} {"train_loss": -26.4566593170166, "global_step": 341009, "epoch": 4108} {"train_loss": -25.999433517456055, "global_step": 341010, "epoch": 4108} {"train_loss": -25.818601608276367, "global_step": 341011, "epoch": 4108} {"train_loss": -25.70305824279785, "global_step": 341012, "epoch": 4108} {"train_loss": -25.534391403198242, "global_step": 341013, "epoch": 4108} {"train_loss": -26.04828453063965, "global_step": 341014, "epoch": 4108} {"train_loss": -26.199670791625977, "global_step": 341015, "epoch": 4108} {"train_loss": -26.078968048095703, "global_step": 341016, "epoch": 4108} {"train_loss": -25.66655921936035, "global_step": 341017, "epoch": 4108} {"train_loss": -25.71405601501465, "global_step": 341018, "epoch": 4108} {"train_loss": -26.02686882019043, "global_step": 341019, "epoch": 4108} {"train_loss": -25.83131217956543, "global_step": 341020, "epoch": 4108} {"train_loss": -25.93243980407715, "global_step": 341021, "epoch": 4108} {"train_loss": -26.05132484436035, "global_step": 341022, "epoch": 4108} {"train_loss": -26.038166046142578, "global_step": 341023, "epoch": 4108} {"train_loss": -26.24895668029785, "global_step": 341024, "epoch": 4108} {"train_loss": -26.379724502563477, "global_step": 341025, "epoch": 4108} {"train_loss": -25.954532623291016, "global_step": 341026, "epoch": 4108} {"train_loss": -26.20940589904785, "global_step": 341027, "epoch": 4108} {"train_loss": -26.388858795166016, "global_step": 341028, "epoch": 4108} {"train_loss": -26.466373443603516, "global_step": 341029, "epoch": 4108} {"train_loss": -26.073591232299805, "global_step": 341030, "epoch": 4108} {"train_loss": -25.279584884643555, "global_step": 341031, "epoch": 4108} {"train_loss": -26.4277286529541, "global_step": 341032, "epoch": 4108} {"train_loss": -26.081024169921875, "global_step": 341033, "epoch": 4108} {"train_loss": -25.388280868530273, "global_step": 341034, "epoch": 4108} {"train_loss": -26.3519287109375, "global_step": 341035, "epoch": 4108} {"train_loss": -25.85248374938965, "global_step": 341036, "epoch": 4108} {"train_loss": -26.453113555908203, "global_step": 341037, "epoch": 4108} {"train_loss": -26.20615577697754, "global_step": 341038, "epoch": 4108} {"train_loss": -26.093948364257812, "global_step": 341039, "epoch": 4108} {"train_loss": -25.73408317565918, "global_step": 341040, "epoch": 4108} {"train_loss": -26.185155868530273, "global_step": 341041, "epoch": 4108} {"train_loss": -25.812910079956055, "global_step": 341042, "epoch": 4108} {"train_loss": -25.50406265258789, "global_step": 341043, "epoch": 4108} {"train_loss": -25.742816925048828, "global_step": 341044, "epoch": 4108} {"train_loss": -26.050439834594727, "global_step": 341045, "epoch": 4108} {"train_loss": -25.98126347093697, "global_step": 341046, "epoch": 4108, "val_loss": 6586588.0} {"train_loss": -24.51795196533203, "global_step": 341047, "epoch": 4109} {"train_loss": -24.736270904541016, "global_step": 341048, "epoch": 4109} {"train_loss": -24.93731689453125, "global_step": 341049, "epoch": 4109} {"train_loss": -24.24702262878418, "global_step": 341050, "epoch": 4109} {"train_loss": -25.50856590270996, "global_step": 341051, "epoch": 4109} {"train_loss": -25.068859100341797, "global_step": 341052, "epoch": 4109} {"train_loss": -25.61907386779785, "global_step": 341053, "epoch": 4109} {"train_loss": -25.208078384399414, "global_step": 341054, "epoch": 4109} {"train_loss": -25.219768524169922, "global_step": 341055, "epoch": 4109} {"train_loss": -25.534961700439453, "global_step": 341056, "epoch": 4109} {"train_loss": -25.547283172607422, "global_step": 341057, "epoch": 4109} {"train_loss": -25.56711769104004, "global_step": 341058, "epoch": 4109} {"train_loss": -25.54820442199707, "global_step": 341059, "epoch": 4109} {"train_loss": -25.199432373046875, "global_step": 341060, "epoch": 4109} {"train_loss": -25.6993465423584, "global_step": 341061, "epoch": 4109} {"train_loss": -25.754486083984375, "global_step": 341062, "epoch": 4109} {"train_loss": -25.38197898864746, "global_step": 341063, "epoch": 4109} {"train_loss": -25.70452880859375, "global_step": 341064, "epoch": 4109} {"train_loss": -25.56175422668457, "global_step": 341065, "epoch": 4109} {"train_loss": -25.623441696166992, "global_step": 341066, "epoch": 4109} {"train_loss": -25.494211196899414, "global_step": 341067, "epoch": 4109} {"train_loss": -25.89043617248535, "global_step": 341068, "epoch": 4109} {"train_loss": -25.60384178161621, "global_step": 341069, "epoch": 4109} {"train_loss": -26.2432804107666, "global_step": 341070, "epoch": 4109} {"train_loss": -25.524702072143555, "global_step": 341071, "epoch": 4109} {"train_loss": -25.814191818237305, "global_step": 341072, "epoch": 4109} {"train_loss": -25.967548370361328, "global_step": 341073, "epoch": 4109} {"train_loss": -25.592370986938477, "global_step": 341074, "epoch": 4109} {"train_loss": -25.963682174682617, "global_step": 341075, "epoch": 4109} {"train_loss": -25.81853675842285, "global_step": 341076, "epoch": 4109} {"train_loss": -26.100223541259766, "global_step": 341077, "epoch": 4109} {"train_loss": -25.817798614501953, "global_step": 341078, "epoch": 4109} {"train_loss": -25.672048568725586, "global_step": 341079, "epoch": 4109} {"train_loss": -26.011962890625, "global_step": 341080, "epoch": 4109} {"train_loss": -25.988666534423828, "global_step": 341081, "epoch": 4109} {"train_loss": -25.934356689453125, "global_step": 341082, "epoch": 4109} {"train_loss": -25.864957809448242, "global_step": 341083, "epoch": 4109} {"train_loss": -26.0136775970459, "global_step": 341084, "epoch": 4109} {"train_loss": -26.262409210205078, "global_step": 341085, "epoch": 4109} {"train_loss": -25.911823272705078, "global_step": 341086, "epoch": 4109} {"train_loss": -26.119726181030273, "global_step": 341087, "epoch": 4109} {"train_loss": -26.093286514282227, "global_step": 341088, "epoch": 4109} {"train_loss": -26.161405563354492, "global_step": 341089, "epoch": 4109} {"train_loss": -26.285375595092773, "global_step": 341090, "epoch": 4109} {"train_loss": -26.154748916625977, "global_step": 341091, "epoch": 4109} {"train_loss": -25.8577880859375, "global_step": 341092, "epoch": 4109} {"train_loss": -26.107858657836914, "global_step": 341093, "epoch": 4109} {"train_loss": -25.80415916442871, "global_step": 341094, "epoch": 4109} {"train_loss": -25.811643600463867, "global_step": 341095, "epoch": 4109} {"train_loss": -26.246702194213867, "global_step": 341096, "epoch": 4109} {"train_loss": -26.1571044921875, "global_step": 341097, "epoch": 4109} {"train_loss": -26.162939071655273, "global_step": 341098, "epoch": 4109} {"train_loss": -25.948944091796875, "global_step": 341099, "epoch": 4109} {"train_loss": -26.412799835205078, "global_step": 341100, "epoch": 4109} {"train_loss": -26.070037841796875, "global_step": 341101, "epoch": 4109} {"train_loss": -26.52204704284668, "global_step": 341102, "epoch": 4109} {"train_loss": -26.11075782775879, "global_step": 341103, "epoch": 4109} {"train_loss": -26.178180694580078, "global_step": 341104, "epoch": 4109} {"train_loss": -26.375417709350586, "global_step": 341105, "epoch": 4109} {"train_loss": -26.072607040405273, "global_step": 341106, "epoch": 4109} {"train_loss": -26.347415924072266, "global_step": 341107, "epoch": 4109} {"train_loss": -26.477766036987305, "global_step": 341108, "epoch": 4109} {"train_loss": -26.009790420532227, "global_step": 341109, "epoch": 4109} {"train_loss": -25.60758399963379, "global_step": 341110, "epoch": 4109} {"train_loss": -25.85602378845215, "global_step": 341111, "epoch": 4109} {"train_loss": -25.51424217224121, "global_step": 341112, "epoch": 4109} {"train_loss": -25.599567413330078, "global_step": 341113, "epoch": 4109} {"train_loss": -25.614171981811523, "global_step": 341114, "epoch": 4109} {"train_loss": -26.20035171508789, "global_step": 341115, "epoch": 4109} {"train_loss": -25.93170166015625, "global_step": 341116, "epoch": 4109} {"train_loss": -26.192899703979492, "global_step": 341117, "epoch": 4109} {"train_loss": -26.221166610717773, "global_step": 341118, "epoch": 4109} {"train_loss": -26.016164779663086, "global_step": 341119, "epoch": 4109} {"train_loss": -26.1507511138916, "global_step": 341120, "epoch": 4109} {"train_loss": -26.33637046813965, "global_step": 341121, "epoch": 4109} {"train_loss": -26.171173095703125, "global_step": 341122, "epoch": 4109} {"train_loss": -26.06785011291504, "global_step": 341123, "epoch": 4109} {"train_loss": -26.07421875, "global_step": 341124, "epoch": 4109} {"train_loss": -26.38319206237793, "global_step": 341125, "epoch": 4109} {"train_loss": -26.0978946685791, "global_step": 341126, "epoch": 4109} {"train_loss": -26.139917373657227, "global_step": 341127, "epoch": 4109} {"train_loss": -26.026105880737305, "global_step": 341128, "epoch": 4109} {"train_loss": -25.854969714061323, "global_step": 341129, "epoch": 4109, "val_loss": 6621101.0} {"train_loss": -25.40541648864746, "global_step": 341130, "epoch": 4110} {"train_loss": -25.2288761138916, "global_step": 341131, "epoch": 4110} {"train_loss": -25.119077682495117, "global_step": 341132, "epoch": 4110} {"train_loss": -25.488861083984375, "global_step": 341133, "epoch": 4110} {"train_loss": -26.092041015625, "global_step": 341134, "epoch": 4110} {"train_loss": -25.797653198242188, "global_step": 341135, "epoch": 4110} {"train_loss": -25.53096580505371, "global_step": 341136, "epoch": 4110} {"train_loss": -26.055511474609375, "global_step": 341137, "epoch": 4110} {"train_loss": -25.848709106445312, "global_step": 341138, "epoch": 4110} {"train_loss": -25.640600204467773, "global_step": 341139, "epoch": 4110} {"train_loss": -26.102575302124023, "global_step": 341140, "epoch": 4110} {"train_loss": -25.9083309173584, "global_step": 341141, "epoch": 4110} {"train_loss": -26.080352783203125, "global_step": 341142, "epoch": 4110} {"train_loss": -25.8570556640625, "global_step": 341143, "epoch": 4110} {"train_loss": -25.731672286987305, "global_step": 341144, "epoch": 4110} {"train_loss": -25.94374656677246, "global_step": 341145, "epoch": 4110} {"train_loss": -25.902868270874023, "global_step": 341146, "epoch": 4110} {"train_loss": -26.22376823425293, "global_step": 341147, "epoch": 4110} {"train_loss": -25.779769897460938, "global_step": 341148, "epoch": 4110} {"train_loss": -26.063922882080078, "global_step": 341149, "epoch": 4110} {"train_loss": -25.994848251342773, "global_step": 341150, "epoch": 4110} {"train_loss": -25.962743759155273, "global_step": 341151, "epoch": 4110} {"train_loss": -26.087604522705078, "global_step": 341152, "epoch": 4110} {"train_loss": -26.055255889892578, "global_step": 341153, "epoch": 4110} {"train_loss": -26.21575355529785, "global_step": 341154, "epoch": 4110} {"train_loss": -26.162811279296875, "global_step": 341155, "epoch": 4110} {"train_loss": -26.09991455078125, "global_step": 341156, "epoch": 4110} {"train_loss": -26.115819931030273, "global_step": 341157, "epoch": 4110} {"train_loss": -26.335830688476562, "global_step": 341158, "epoch": 4110} {"train_loss": -26.3311710357666, "global_step": 341159, "epoch": 4110} {"train_loss": -26.03904151916504, "global_step": 341160, "epoch": 4110} {"train_loss": -26.350126266479492, "global_step": 341161, "epoch": 4110} {"train_loss": -26.057449340820312, "global_step": 341162, "epoch": 4110} {"train_loss": -26.19635009765625, "global_step": 341163, "epoch": 4110} {"train_loss": -26.48420524597168, "global_step": 341164, "epoch": 4110} {"train_loss": -26.0058650970459, "global_step": 341165, "epoch": 4110} {"train_loss": -26.42763328552246, "global_step": 341166, "epoch": 4110} {"train_loss": -26.147886276245117, "global_step": 341167, "epoch": 4110} {"train_loss": -25.86760902404785, "global_step": 341168, "epoch": 4110} {"train_loss": -26.46489906311035, "global_step": 341169, "epoch": 4110} {"train_loss": -26.401578903198242, "global_step": 341170, "epoch": 4110} {"train_loss": -26.328632354736328, "global_step": 341171, "epoch": 4110} {"train_loss": -25.962656021118164, "global_step": 341172, "epoch": 4110} {"train_loss": -25.997028350830078, "global_step": 341173, "epoch": 4110} {"train_loss": -25.99566078186035, "global_step": 341174, "epoch": 4110} {"train_loss": -25.93987464904785, "global_step": 341175, "epoch": 4110} {"train_loss": -25.992380142211914, "global_step": 341176, "epoch": 4110} {"train_loss": -26.200239181518555, "global_step": 341177, "epoch": 4110} {"train_loss": -26.19644546508789, "global_step": 341178, "epoch": 4110} {"train_loss": -26.004444122314453, "global_step": 341179, "epoch": 4110} {"train_loss": -25.712799072265625, "global_step": 341180, "epoch": 4110} {"train_loss": -26.214313507080078, "global_step": 341181, "epoch": 4110} {"train_loss": -26.019805908203125, "global_step": 341182, "epoch": 4110} {"train_loss": -26.297393798828125, "global_step": 341183, "epoch": 4110} {"train_loss": -26.367345809936523, "global_step": 341184, "epoch": 4110} {"train_loss": -26.3511905670166, "global_step": 341185, "epoch": 4110} {"train_loss": -25.722400665283203, "global_step": 341186, "epoch": 4110} {"train_loss": -26.01063346862793, "global_step": 341187, "epoch": 4110} {"train_loss": -26.236845016479492, "global_step": 341188, "epoch": 4110} {"train_loss": -26.4144229888916, "global_step": 341189, "epoch": 4110} {"train_loss": -26.233062744140625, "global_step": 341190, "epoch": 4110} {"train_loss": -26.217538833618164, "global_step": 341191, "epoch": 4110} {"train_loss": -26.47342872619629, "global_step": 341192, "epoch": 4110} {"train_loss": -26.1884822845459, "global_step": 341193, "epoch": 4110} {"train_loss": -26.20071792602539, "global_step": 341194, "epoch": 4110} {"train_loss": -26.07257652282715, "global_step": 341195, "epoch": 4110} {"train_loss": -25.860260009765625, "global_step": 341196, "epoch": 4110} {"train_loss": -25.517499923706055, "global_step": 341197, "epoch": 4110} {"train_loss": -25.32910919189453, "global_step": 341198, "epoch": 4110} {"train_loss": -24.86282730102539, "global_step": 341199, "epoch": 4110} {"train_loss": -24.638460159301758, "global_step": 341200, "epoch": 4110} {"train_loss": -25.908878326416016, "global_step": 341201, "epoch": 4110} {"train_loss": -25.917316436767578, "global_step": 341202, "epoch": 4110} {"train_loss": -25.879438400268555, "global_step": 341203, "epoch": 4110} {"train_loss": -25.728376388549805, "global_step": 341204, "epoch": 4110} {"train_loss": -25.404939651489258, "global_step": 341205, "epoch": 4110} {"train_loss": -25.56805419921875, "global_step": 341206, "epoch": 4110} {"train_loss": -25.704944610595703, "global_step": 341207, "epoch": 4110} {"train_loss": -25.981037139892578, "global_step": 341208, "epoch": 4110} {"train_loss": -25.8244686126709, "global_step": 341209, "epoch": 4110} {"train_loss": -25.688846588134766, "global_step": 341210, "epoch": 4110} {"train_loss": -26.12228775024414, "global_step": 341211, "epoch": 4110} {"train_loss": -25.965464350688887, "global_step": 341212, "epoch": 4110, "val_loss": 6562556.5} {"train_loss": -25.648427963256836, "global_step": 341213, "epoch": 4111} {"train_loss": -25.881256103515625, "global_step": 341214, "epoch": 4111} {"train_loss": -25.3106746673584, "global_step": 341215, "epoch": 4111} {"train_loss": -25.620502471923828, "global_step": 341216, "epoch": 4111} {"train_loss": -25.446578979492188, "global_step": 341217, "epoch": 4111} {"train_loss": -25.65699577331543, "global_step": 341218, "epoch": 4111} {"train_loss": -25.780105590820312, "global_step": 341219, "epoch": 4111} {"train_loss": -25.711246490478516, "global_step": 341220, "epoch": 4111} {"train_loss": -25.416732788085938, "global_step": 341221, "epoch": 4111} {"train_loss": -26.030832290649414, "global_step": 341222, "epoch": 4111} {"train_loss": -25.766443252563477, "global_step": 341223, "epoch": 4111} {"train_loss": -26.00931167602539, "global_step": 341224, "epoch": 4111} {"train_loss": -26.03618812561035, "global_step": 341225, "epoch": 4111} {"train_loss": -26.043750762939453, "global_step": 341226, "epoch": 4111} {"train_loss": -25.8780460357666, "global_step": 341227, "epoch": 4111} {"train_loss": -25.687519073486328, "global_step": 341228, "epoch": 4111} {"train_loss": -25.70001220703125, "global_step": 341229, "epoch": 4111} {"train_loss": -25.833892822265625, "global_step": 341230, "epoch": 4111} {"train_loss": -25.751256942749023, "global_step": 341231, "epoch": 4111} {"train_loss": -26.16852378845215, "global_step": 341232, "epoch": 4111} {"train_loss": -26.068439483642578, "global_step": 341233, "epoch": 4111} {"train_loss": -26.036762237548828, "global_step": 341234, "epoch": 4111} {"train_loss": -26.338104248046875, "global_step": 341235, "epoch": 4111} {"train_loss": -26.124616622924805, "global_step": 341236, "epoch": 4111} {"train_loss": -26.08222007751465, "global_step": 341237, "epoch": 4111} {"train_loss": -26.05660057067871, "global_step": 341238, "epoch": 4111} {"train_loss": -26.139984130859375, "global_step": 341239, "epoch": 4111} {"train_loss": -26.234533309936523, "global_step": 341240, "epoch": 4111} {"train_loss": -26.011526107788086, "global_step": 341241, "epoch": 4111} {"train_loss": -26.016149520874023, "global_step": 341242, "epoch": 4111} {"train_loss": -25.929248809814453, "global_step": 341243, "epoch": 4111} {"train_loss": -26.100934982299805, "global_step": 341244, "epoch": 4111} {"train_loss": -26.277271270751953, "global_step": 341245, "epoch": 4111} {"train_loss": -26.19488525390625, "global_step": 341246, "epoch": 4111} {"train_loss": -25.962665557861328, "global_step": 341247, "epoch": 4111} {"train_loss": -26.139257431030273, "global_step": 341248, "epoch": 4111} {"train_loss": -26.2520694732666, "global_step": 341249, "epoch": 4111} {"train_loss": -26.55476951599121, "global_step": 341250, "epoch": 4111} {"train_loss": -25.848098754882812, "global_step": 341251, "epoch": 4111} {"train_loss": -26.22715187072754, "global_step": 341252, "epoch": 4111} {"train_loss": -26.135208129882812, "global_step": 341253, "epoch": 4111} {"train_loss": -26.138654708862305, "global_step": 341254, "epoch": 4111} {"train_loss": -26.09425926208496, "global_step": 341255, "epoch": 4111} {"train_loss": -26.300922393798828, "global_step": 341256, "epoch": 4111} {"train_loss": -26.156034469604492, "global_step": 341257, "epoch": 4111} {"train_loss": -26.004247665405273, "global_step": 341258, "epoch": 4111} {"train_loss": -26.26215934753418, "global_step": 341259, "epoch": 4111} {"train_loss": -26.352758407592773, "global_step": 341260, "epoch": 4111} {"train_loss": -26.12811851501465, "global_step": 341261, "epoch": 4111} {"train_loss": -25.99940299987793, "global_step": 341262, "epoch": 4111} {"train_loss": -25.49799919128418, "global_step": 341263, "epoch": 4111} {"train_loss": -25.88858985900879, "global_step": 341264, "epoch": 4111} {"train_loss": -26.128530502319336, "global_step": 341265, "epoch": 4111} {"train_loss": -26.05510902404785, "global_step": 341266, "epoch": 4111} {"train_loss": -26.09320640563965, "global_step": 341267, "epoch": 4111} {"train_loss": -26.324567794799805, "global_step": 341268, "epoch": 4111} {"train_loss": -26.6002197265625, "global_step": 341269, "epoch": 4111} {"train_loss": -26.341672897338867, "global_step": 341270, "epoch": 4111} {"train_loss": -25.95062828063965, "global_step": 341271, "epoch": 4111} {"train_loss": -26.01336669921875, "global_step": 341272, "epoch": 4111} {"train_loss": -25.533573150634766, "global_step": 341273, "epoch": 4111} {"train_loss": -25.867507934570312, "global_step": 341274, "epoch": 4111} {"train_loss": -26.170867919921875, "global_step": 341275, "epoch": 4111} {"train_loss": -26.144201278686523, "global_step": 341276, "epoch": 4111} {"train_loss": -26.196807861328125, "global_step": 341277, "epoch": 4111} {"train_loss": -25.995092391967773, "global_step": 341278, "epoch": 4111} {"train_loss": -26.034839630126953, "global_step": 341279, "epoch": 4111} {"train_loss": -25.899972915649414, "global_step": 341280, "epoch": 4111} {"train_loss": -26.402875900268555, "global_step": 341281, "epoch": 4111} {"train_loss": -26.257978439331055, "global_step": 341282, "epoch": 4111} {"train_loss": -25.84345817565918, "global_step": 341283, "epoch": 4111} {"train_loss": -26.44972038269043, "global_step": 341284, "epoch": 4111} {"train_loss": -26.088464736938477, "global_step": 341285, "epoch": 4111} {"train_loss": -26.524200439453125, "global_step": 341286, "epoch": 4111} {"train_loss": -26.119298934936523, "global_step": 341287, "epoch": 4111} {"train_loss": -26.10078239440918, "global_step": 341288, "epoch": 4111} {"train_loss": -25.928335189819336, "global_step": 341289, "epoch": 4111} {"train_loss": -26.32429313659668, "global_step": 341290, "epoch": 4111} {"train_loss": -26.16424560546875, "global_step": 341291, "epoch": 4111} {"train_loss": -25.722700119018555, "global_step": 341292, "epoch": 4111} {"train_loss": -26.372655868530273, "global_step": 341293, "epoch": 4111} {"train_loss": -26.60548210144043, "global_step": 341294, "epoch": 4111} {"train_loss": -26.013719995337798, "global_step": 341295, "epoch": 4111, "val_loss": 6632089.0} {"train_loss": -24.817380905151367, "global_step": 341296, "epoch": 4112} {"train_loss": -25.139440536499023, "global_step": 341297, "epoch": 4112} {"train_loss": -25.221542358398438, "global_step": 341298, "epoch": 4112} {"train_loss": -25.56672477722168, "global_step": 341299, "epoch": 4112} {"train_loss": -25.272825241088867, "global_step": 341300, "epoch": 4112} {"train_loss": -24.848264694213867, "global_step": 341301, "epoch": 4112} {"train_loss": -25.38730812072754, "global_step": 341302, "epoch": 4112} {"train_loss": -25.197254180908203, "global_step": 341303, "epoch": 4112} {"train_loss": -25.087148666381836, "global_step": 341304, "epoch": 4112} {"train_loss": -25.48801612854004, "global_step": 341305, "epoch": 4112} {"train_loss": -25.273542404174805, "global_step": 341306, "epoch": 4112} {"train_loss": -24.692031860351562, "global_step": 341307, "epoch": 4112} {"train_loss": -24.618188858032227, "global_step": 341308, "epoch": 4112} {"train_loss": -25.540071487426758, "global_step": 341309, "epoch": 4112} {"train_loss": -24.981664657592773, "global_step": 341310, "epoch": 4112} {"train_loss": -25.056365966796875, "global_step": 341311, "epoch": 4112} {"train_loss": -25.461551666259766, "global_step": 341312, "epoch": 4112} {"train_loss": -25.695343017578125, "global_step": 341313, "epoch": 4112} {"train_loss": -25.68389892578125, "global_step": 341314, "epoch": 4112} {"train_loss": -25.43233871459961, "global_step": 341315, "epoch": 4112} {"train_loss": -25.419025421142578, "global_step": 341316, "epoch": 4112} {"train_loss": -25.835813522338867, "global_step": 341317, "epoch": 4112} {"train_loss": -25.71283531188965, "global_step": 341318, "epoch": 4112} {"train_loss": -25.71870231628418, "global_step": 341319, "epoch": 4112} {"train_loss": -25.739133834838867, "global_step": 341320, "epoch": 4112} {"train_loss": -25.832172393798828, "global_step": 341321, "epoch": 4112} {"train_loss": -25.7857723236084, "global_step": 341322, "epoch": 4112} {"train_loss": -25.74420166015625, "global_step": 341323, "epoch": 4112} {"train_loss": -25.7061824798584, "global_step": 341324, "epoch": 4112} {"train_loss": -25.791492462158203, "global_step": 341325, "epoch": 4112} {"train_loss": -25.716873168945312, "global_step": 341326, "epoch": 4112} {"train_loss": -25.694461822509766, "global_step": 341327, "epoch": 4112} {"train_loss": -26.1282958984375, "global_step": 341328, "epoch": 4112} {"train_loss": -25.99161720275879, "global_step": 341329, "epoch": 4112} {"train_loss": -25.832929611206055, "global_step": 341330, "epoch": 4112} {"train_loss": -25.9660587310791, "global_step": 341331, "epoch": 4112} {"train_loss": -26.072736740112305, "global_step": 341332, "epoch": 4112} {"train_loss": -25.55997657775879, "global_step": 341333, "epoch": 4112} {"train_loss": -26.068344116210938, "global_step": 341334, "epoch": 4112} {"train_loss": -25.677112579345703, "global_step": 341335, "epoch": 4112} {"train_loss": -26.16248893737793, "global_step": 341336, "epoch": 4112} {"train_loss": -26.14472770690918, "global_step": 341337, "epoch": 4112} {"train_loss": -25.984790802001953, "global_step": 341338, "epoch": 4112} {"train_loss": -26.355560302734375, "global_step": 341339, "epoch": 4112} {"train_loss": -26.361221313476562, "global_step": 341340, "epoch": 4112} {"train_loss": -26.100637435913086, "global_step": 341341, "epoch": 4112} {"train_loss": -25.92609214782715, "global_step": 341342, "epoch": 4112} {"train_loss": -26.140106201171875, "global_step": 341343, "epoch": 4112} {"train_loss": -26.446455001831055, "global_step": 341344, "epoch": 4112} {"train_loss": -26.538297653198242, "global_step": 341345, "epoch": 4112} {"train_loss": -25.77139663696289, "global_step": 341346, "epoch": 4112} {"train_loss": -26.110448837280273, "global_step": 341347, "epoch": 4112} {"train_loss": -26.29115104675293, "global_step": 341348, "epoch": 4112} {"train_loss": -26.114282608032227, "global_step": 341349, "epoch": 4112} {"train_loss": -26.53074073791504, "global_step": 341350, "epoch": 4112} {"train_loss": -26.205337524414062, "global_step": 341351, "epoch": 4112} {"train_loss": -26.06743812561035, "global_step": 341352, "epoch": 4112} {"train_loss": -26.289648056030273, "global_step": 341353, "epoch": 4112} {"train_loss": -26.371749877929688, "global_step": 341354, "epoch": 4112} {"train_loss": -25.93476676940918, "global_step": 341355, "epoch": 4112} {"train_loss": -25.99663734436035, "global_step": 341356, "epoch": 4112} {"train_loss": -25.967960357666016, "global_step": 341357, "epoch": 4112} {"train_loss": -26.216318130493164, "global_step": 341358, "epoch": 4112} {"train_loss": -26.125080108642578, "global_step": 341359, "epoch": 4112} {"train_loss": -26.28034019470215, "global_step": 341360, "epoch": 4112} {"train_loss": -25.679838180541992, "global_step": 341361, "epoch": 4112} {"train_loss": -25.98713493347168, "global_step": 341362, "epoch": 4112} {"train_loss": -25.989179611206055, "global_step": 341363, "epoch": 4112} {"train_loss": -26.56962013244629, "global_step": 341364, "epoch": 4112} {"train_loss": -26.22381019592285, "global_step": 341365, "epoch": 4112} {"train_loss": -26.12562370300293, "global_step": 341366, "epoch": 4112} {"train_loss": -26.282794952392578, "global_step": 341367, "epoch": 4112} {"train_loss": -26.1229190826416, "global_step": 341368, "epoch": 4112} {"train_loss": -26.663726806640625, "global_step": 341369, "epoch": 4112} {"train_loss": -26.130502700805664, "global_step": 341370, "epoch": 4112} {"train_loss": -26.089080810546875, "global_step": 341371, "epoch": 4112} {"train_loss": -26.435077667236328, "global_step": 341372, "epoch": 4112} {"train_loss": -25.932065963745117, "global_step": 341373, "epoch": 4112} {"train_loss": -26.18153953552246, "global_step": 341374, "epoch": 4112} {"train_loss": -25.970157623291016, "global_step": 341375, "epoch": 4112} {"train_loss": -26.131591796875, "global_step": 341376, "epoch": 4112} {"train_loss": -26.03516960144043, "global_step": 341377, "epoch": 4112} {"train_loss": -25.859000631125575, "global_step": 341378, "epoch": 4112, "val_loss": 6570738.0} {"train_loss": -25.295501708984375, "global_step": 341379, "epoch": 4113} {"train_loss": -25.323835372924805, "global_step": 341380, "epoch": 4113} {"train_loss": -24.89213752746582, "global_step": 341381, "epoch": 4113} {"train_loss": -25.115575790405273, "global_step": 341382, "epoch": 4113} {"train_loss": -26.188190460205078, "global_step": 341383, "epoch": 4113} {"train_loss": -25.55726432800293, "global_step": 341384, "epoch": 4113} {"train_loss": -25.365087509155273, "global_step": 341385, "epoch": 4113} {"train_loss": -25.884357452392578, "global_step": 341386, "epoch": 4113} {"train_loss": -25.315046310424805, "global_step": 341387, "epoch": 4113} {"train_loss": -25.705469131469727, "global_step": 341388, "epoch": 4113} {"train_loss": -25.372732162475586, "global_step": 341389, "epoch": 4113} {"train_loss": -25.562253952026367, "global_step": 341390, "epoch": 4113} {"train_loss": -25.615936279296875, "global_step": 341391, "epoch": 4113} {"train_loss": -25.58609390258789, "global_step": 341392, "epoch": 4113} {"train_loss": -25.838525772094727, "global_step": 341393, "epoch": 4113} {"train_loss": -25.50307273864746, "global_step": 341394, "epoch": 4113} {"train_loss": -25.728376388549805, "global_step": 341395, "epoch": 4113} {"train_loss": -25.773529052734375, "global_step": 341396, "epoch": 4113} {"train_loss": -25.800827026367188, "global_step": 341397, "epoch": 4113} {"train_loss": -25.942609786987305, "global_step": 341398, "epoch": 4113} {"train_loss": -25.77201271057129, "global_step": 341399, "epoch": 4113} {"train_loss": -25.791913986206055, "global_step": 341400, "epoch": 4113} {"train_loss": -25.961950302124023, "global_step": 341401, "epoch": 4113} {"train_loss": -25.6645450592041, "global_step": 341402, "epoch": 4113} {"train_loss": -26.02543067932129, "global_step": 341403, "epoch": 4113} {"train_loss": -26.0375919342041, "global_step": 341404, "epoch": 4113} {"train_loss": -25.703662872314453, "global_step": 341405, "epoch": 4113} {"train_loss": -25.797163009643555, "global_step": 341406, "epoch": 4113} {"train_loss": -25.79680824279785, "global_step": 341407, "epoch": 4113} {"train_loss": -25.7645206451416, "global_step": 341408, "epoch": 4113} {"train_loss": -26.267807006835938, "global_step": 341409, "epoch": 4113} {"train_loss": -25.699676513671875, "global_step": 341410, "epoch": 4113} {"train_loss": -25.8099365234375, "global_step": 341411, "epoch": 4113} {"train_loss": -25.762741088867188, "global_step": 341412, "epoch": 4113} {"train_loss": -25.9263858795166, "global_step": 341413, "epoch": 4113} {"train_loss": -26.432844161987305, "global_step": 341414, "epoch": 4113} {"train_loss": -26.018117904663086, "global_step": 341415, "epoch": 4113} {"train_loss": -26.14352798461914, "global_step": 341416, "epoch": 4113} {"train_loss": -26.31739616394043, "global_step": 341417, "epoch": 4113} {"train_loss": -26.34279441833496, "global_step": 341418, "epoch": 4113} {"train_loss": -26.06160545349121, "global_step": 341419, "epoch": 4113} {"train_loss": -26.038862228393555, "global_step": 341420, "epoch": 4113} {"train_loss": -26.346078872680664, "global_step": 341421, "epoch": 4113} {"train_loss": -26.492589950561523, "global_step": 341422, "epoch": 4113} {"train_loss": -25.84388542175293, "global_step": 341423, "epoch": 4113} {"train_loss": -26.13441276550293, "global_step": 341424, "epoch": 4113} {"train_loss": -25.99747657775879, "global_step": 341425, "epoch": 4113} {"train_loss": -26.535480499267578, "global_step": 341426, "epoch": 4113} {"train_loss": -25.94734001159668, "global_step": 341427, "epoch": 4113} {"train_loss": -24.987957000732422, "global_step": 341428, "epoch": 4113} {"train_loss": -25.332286834716797, "global_step": 341429, "epoch": 4113} {"train_loss": -25.30462646484375, "global_step": 341430, "epoch": 4113} {"train_loss": -25.628284454345703, "global_step": 341431, "epoch": 4113} {"train_loss": -25.93537712097168, "global_step": 341432, "epoch": 4113} {"train_loss": -25.754718780517578, "global_step": 341433, "epoch": 4113} {"train_loss": -25.56083869934082, "global_step": 341434, "epoch": 4113} {"train_loss": -25.93263053894043, "global_step": 341435, "epoch": 4113} {"train_loss": -25.940942764282227, "global_step": 341436, "epoch": 4113} {"train_loss": -25.490196228027344, "global_step": 341437, "epoch": 4113} {"train_loss": -26.082550048828125, "global_step": 341438, "epoch": 4113} {"train_loss": -25.842914581298828, "global_step": 341439, "epoch": 4113} {"train_loss": -26.266082763671875, "global_step": 341440, "epoch": 4113} {"train_loss": -25.396371841430664, "global_step": 341441, "epoch": 4113} {"train_loss": -26.063791275024414, "global_step": 341442, "epoch": 4113} {"train_loss": -26.25519371032715, "global_step": 341443, "epoch": 4113} {"train_loss": -25.89983558654785, "global_step": 341444, "epoch": 4113} {"train_loss": -26.197498321533203, "global_step": 341445, "epoch": 4113} {"train_loss": -26.502212524414062, "global_step": 341446, "epoch": 4113} {"train_loss": -26.362390518188477, "global_step": 341447, "epoch": 4113} {"train_loss": -25.896484375, "global_step": 341448, "epoch": 4113} {"train_loss": -25.677648544311523, "global_step": 341449, "epoch": 4113} {"train_loss": -26.3072566986084, "global_step": 341450, "epoch": 4113} {"train_loss": -26.00367546081543, "global_step": 341451, "epoch": 4113} {"train_loss": -26.028400421142578, "global_step": 341452, "epoch": 4113} {"train_loss": -26.45806312561035, "global_step": 341453, "epoch": 4113} {"train_loss": -26.379423141479492, "global_step": 341454, "epoch": 4113} {"train_loss": -26.282928466796875, "global_step": 341455, "epoch": 4113} {"train_loss": -26.04648208618164, "global_step": 341456, "epoch": 4113} {"train_loss": -25.956907272338867, "global_step": 341457, "epoch": 4113} {"train_loss": -26.27776527404785, "global_step": 341458, "epoch": 4113} {"train_loss": -26.606603622436523, "global_step": 341459, "epoch": 4113} {"train_loss": -26.35637855529785, "global_step": 341460, "epoch": 4113} {"train_loss": -25.89302812139672, "global_step": 341461, "epoch": 4113, "val_loss": 6545384.5} {"train_loss": -25.726659774780273, "global_step": 341462, "epoch": 4114} {"train_loss": -25.584074020385742, "global_step": 341463, "epoch": 4114} {"train_loss": -25.613065719604492, "global_step": 341464, "epoch": 4114} {"train_loss": -25.73341178894043, "global_step": 341465, "epoch": 4114} {"train_loss": -26.3151798248291, "global_step": 341466, "epoch": 4114} {"train_loss": -25.20743179321289, "global_step": 341467, "epoch": 4114} {"train_loss": -26.2249813079834, "global_step": 341468, "epoch": 4114} {"train_loss": -25.8603458404541, "global_step": 341469, "epoch": 4114} {"train_loss": -25.9803466796875, "global_step": 341470, "epoch": 4114} {"train_loss": -25.29627799987793, "global_step": 341471, "epoch": 4114} {"train_loss": -25.783905029296875, "global_step": 341472, "epoch": 4114} {"train_loss": -25.949573516845703, "global_step": 341473, "epoch": 4114} {"train_loss": -25.7934513092041, "global_step": 341474, "epoch": 4114} {"train_loss": -26.05908203125, "global_step": 341475, "epoch": 4114} {"train_loss": -25.973037719726562, "global_step": 341476, "epoch": 4114} {"train_loss": -25.88960838317871, "global_step": 341477, "epoch": 4114} {"train_loss": -25.603076934814453, "global_step": 341478, "epoch": 4114} {"train_loss": -26.0889949798584, "global_step": 341479, "epoch": 4114} {"train_loss": -26.63459587097168, "global_step": 341480, "epoch": 4114} {"train_loss": -25.86237144470215, "global_step": 341481, "epoch": 4114} {"train_loss": -26.03346824645996, "global_step": 341482, "epoch": 4114} {"train_loss": -25.867252349853516, "global_step": 341483, "epoch": 4114} {"train_loss": -26.18617820739746, "global_step": 341484, "epoch": 4114} {"train_loss": -25.831144332885742, "global_step": 341485, "epoch": 4114} {"train_loss": -26.21998405456543, "global_step": 341486, "epoch": 4114} {"train_loss": -25.692365646362305, "global_step": 341487, "epoch": 4114} {"train_loss": -25.99148941040039, "global_step": 341488, "epoch": 4114} {"train_loss": -26.30116081237793, "global_step": 341489, "epoch": 4114} {"train_loss": -26.232648849487305, "global_step": 341490, "epoch": 4114} {"train_loss": -26.372114181518555, "global_step": 341491, "epoch": 4114} {"train_loss": -26.383758544921875, "global_step": 341492, "epoch": 4114} {"train_loss": -25.899328231811523, "global_step": 341493, "epoch": 4114} {"train_loss": -26.389129638671875, "global_step": 341494, "epoch": 4114} {"train_loss": -26.08566665649414, "global_step": 341495, "epoch": 4114} {"train_loss": -26.125513076782227, "global_step": 341496, "epoch": 4114} {"train_loss": -26.104581832885742, "global_step": 341497, "epoch": 4114} {"train_loss": -26.18354606628418, "global_step": 341498, "epoch": 4114} {"train_loss": -26.2950382232666, "global_step": 341499, "epoch": 4114} {"train_loss": -26.435346603393555, "global_step": 341500, "epoch": 4114} {"train_loss": -26.52695083618164, "global_step": 341501, "epoch": 4114} {"train_loss": -26.07228660583496, "global_step": 341502, "epoch": 4114} {"train_loss": -26.037397384643555, "global_step": 341503, "epoch": 4114} {"train_loss": -26.283355712890625, "global_step": 341504, "epoch": 4114} {"train_loss": -26.342609405517578, "global_step": 341505, "epoch": 4114} {"train_loss": -26.007654190063477, "global_step": 341506, "epoch": 4114} {"train_loss": -26.24871826171875, "global_step": 341507, "epoch": 4114} {"train_loss": -26.192777633666992, "global_step": 341508, "epoch": 4114} {"train_loss": -25.73193359375, "global_step": 341509, "epoch": 4114} {"train_loss": -25.36763572692871, "global_step": 341510, "epoch": 4114} {"train_loss": -25.351770401000977, "global_step": 341511, "epoch": 4114} {"train_loss": -25.89942741394043, "global_step": 341512, "epoch": 4114} {"train_loss": -26.06113052368164, "global_step": 341513, "epoch": 4114} {"train_loss": -26.109073638916016, "global_step": 341514, "epoch": 4114} {"train_loss": -25.96327018737793, "global_step": 341515, "epoch": 4114} {"train_loss": -25.931568145751953, "global_step": 341516, "epoch": 4114} {"train_loss": -25.914215087890625, "global_step": 341517, "epoch": 4114} {"train_loss": -25.92632484436035, "global_step": 341518, "epoch": 4114} {"train_loss": -25.959125518798828, "global_step": 341519, "epoch": 4114} {"train_loss": -26.231796264648438, "global_step": 341520, "epoch": 4114} {"train_loss": -25.99488639831543, "global_step": 341521, "epoch": 4114} {"train_loss": -25.957849502563477, "global_step": 341522, "epoch": 4114} {"train_loss": -26.321115493774414, "global_step": 341523, "epoch": 4114} {"train_loss": -25.926166534423828, "global_step": 341524, "epoch": 4114} {"train_loss": -26.22417640686035, "global_step": 341525, "epoch": 4114} {"train_loss": -25.567848205566406, "global_step": 341526, "epoch": 4114} {"train_loss": -26.053815841674805, "global_step": 341527, "epoch": 4114} {"train_loss": -26.05848503112793, "global_step": 341528, "epoch": 4114} {"train_loss": -26.25421714782715, "global_step": 341529, "epoch": 4114} {"train_loss": -26.278717041015625, "global_step": 341530, "epoch": 4114} {"train_loss": -25.86553382873535, "global_step": 341531, "epoch": 4114} {"train_loss": -26.544042587280273, "global_step": 341532, "epoch": 4114} {"train_loss": -26.087787628173828, "global_step": 341533, "epoch": 4114} {"train_loss": -26.095102310180664, "global_step": 341534, "epoch": 4114} {"train_loss": -26.214614868164062, "global_step": 341535, "epoch": 4114} {"train_loss": -25.993139266967773, "global_step": 341536, "epoch": 4114} {"train_loss": -26.365697860717773, "global_step": 341537, "epoch": 4114} {"train_loss": -26.14417839050293, "global_step": 341538, "epoch": 4114} {"train_loss": -26.200605392456055, "global_step": 341539, "epoch": 4114} {"train_loss": -26.336627960205078, "global_step": 341540, "epoch": 4114} {"train_loss": -26.01836585998535, "global_step": 341541, "epoch": 4114} {"train_loss": -26.35760498046875, "global_step": 341542, "epoch": 4114} {"train_loss": -25.932239532470703, "global_step": 341543, "epoch": 4114} {"train_loss": -26.02908511334155, "global_step": 341544, "epoch": 4114, "val_loss": 6644597.5} {"train_loss": -25.659292221069336, "global_step": 341545, "epoch": 4115} {"train_loss": -25.592632293701172, "global_step": 341546, "epoch": 4115} {"train_loss": -25.823392868041992, "global_step": 341547, "epoch": 4115} {"train_loss": -25.46986198425293, "global_step": 341548, "epoch": 4115} {"train_loss": -26.110639572143555, "global_step": 341549, "epoch": 4115} {"train_loss": -25.784948348999023, "global_step": 341550, "epoch": 4115} {"train_loss": -25.889501571655273, "global_step": 341551, "epoch": 4115} {"train_loss": -25.645145416259766, "global_step": 341552, "epoch": 4115} {"train_loss": -25.66273307800293, "global_step": 341553, "epoch": 4115} {"train_loss": -25.780988693237305, "global_step": 341554, "epoch": 4115} {"train_loss": -25.844573974609375, "global_step": 341555, "epoch": 4115} {"train_loss": -25.293516159057617, "global_step": 341556, "epoch": 4115} {"train_loss": -26.058496475219727, "global_step": 341557, "epoch": 4115} {"train_loss": -25.81197166442871, "global_step": 341558, "epoch": 4115} {"train_loss": -25.721647262573242, "global_step": 341559, "epoch": 4115} {"train_loss": -25.902755737304688, "global_step": 341560, "epoch": 4115} {"train_loss": -25.59285545349121, "global_step": 341561, "epoch": 4115} {"train_loss": -25.868457794189453, "global_step": 341562, "epoch": 4115} {"train_loss": -25.955078125, "global_step": 341563, "epoch": 4115} {"train_loss": -26.062515258789062, "global_step": 341564, "epoch": 4115} {"train_loss": -26.3175048828125, "global_step": 341565, "epoch": 4115} {"train_loss": -25.9202880859375, "global_step": 341566, "epoch": 4115} {"train_loss": -25.70899772644043, "global_step": 341567, "epoch": 4115} {"train_loss": -26.029190063476562, "global_step": 341568, "epoch": 4115} {"train_loss": -26.031402587890625, "global_step": 341569, "epoch": 4115} {"train_loss": -26.0473575592041, "global_step": 341570, "epoch": 4115} {"train_loss": -26.040283203125, "global_step": 341571, "epoch": 4115} {"train_loss": -26.25998878479004, "global_step": 341572, "epoch": 4115} {"train_loss": -25.854238510131836, "global_step": 341573, "epoch": 4115} {"train_loss": -25.88223648071289, "global_step": 341574, "epoch": 4115} {"train_loss": -26.035261154174805, "global_step": 341575, "epoch": 4115} {"train_loss": -25.847497940063477, "global_step": 341576, "epoch": 4115} {"train_loss": -26.22010612487793, "global_step": 341577, "epoch": 4115} {"train_loss": -26.344425201416016, "global_step": 341578, "epoch": 4115} {"train_loss": -26.099145889282227, "global_step": 341579, "epoch": 4115} {"train_loss": -26.3693790435791, "global_step": 341580, "epoch": 4115} {"train_loss": -26.034345626831055, "global_step": 341581, "epoch": 4115} {"train_loss": -26.19921875, "global_step": 341582, "epoch": 4115} {"train_loss": -26.40177345275879, "global_step": 341583, "epoch": 4115} {"train_loss": -26.348615646362305, "global_step": 341584, "epoch": 4115} {"train_loss": -25.958698272705078, "global_step": 341585, "epoch": 4115} {"train_loss": -26.012134552001953, "global_step": 341586, "epoch": 4115} {"train_loss": -26.1135311126709, "global_step": 341587, "epoch": 4115} {"train_loss": -26.2354679107666, "global_step": 341588, "epoch": 4115} {"train_loss": -25.7990779876709, "global_step": 341589, "epoch": 4115} {"train_loss": -25.994043350219727, "global_step": 341590, "epoch": 4115} {"train_loss": -25.935277938842773, "global_step": 341591, "epoch": 4115} {"train_loss": -25.984479904174805, "global_step": 341592, "epoch": 4115} {"train_loss": -25.403051376342773, "global_step": 341593, "epoch": 4115} {"train_loss": -25.612659454345703, "global_step": 341594, "epoch": 4115} {"train_loss": -26.04775047302246, "global_step": 341595, "epoch": 4115} {"train_loss": -25.82439613342285, "global_step": 341596, "epoch": 4115} {"train_loss": -25.77735710144043, "global_step": 341597, "epoch": 4115} {"train_loss": -25.94921875, "global_step": 341598, "epoch": 4115} {"train_loss": -26.24837303161621, "global_step": 341599, "epoch": 4115} {"train_loss": -25.868032455444336, "global_step": 341600, "epoch": 4115} {"train_loss": -26.4002742767334, "global_step": 341601, "epoch": 4115} {"train_loss": -26.151874542236328, "global_step": 341602, "epoch": 4115} {"train_loss": -25.97446632385254, "global_step": 341603, "epoch": 4115} {"train_loss": -25.979162216186523, "global_step": 341604, "epoch": 4115} {"train_loss": -26.19036293029785, "global_step": 341605, "epoch": 4115} {"train_loss": -26.10125732421875, "global_step": 341606, "epoch": 4115} {"train_loss": -26.188568115234375, "global_step": 341607, "epoch": 4115} {"train_loss": -26.317325592041016, "global_step": 341608, "epoch": 4115} {"train_loss": -26.18537712097168, "global_step": 341609, "epoch": 4115} {"train_loss": -25.968814849853516, "global_step": 341610, "epoch": 4115} {"train_loss": -25.686527252197266, "global_step": 341611, "epoch": 4115} {"train_loss": -26.339221954345703, "global_step": 341612, "epoch": 4115} {"train_loss": -26.142597198486328, "global_step": 341613, "epoch": 4115} {"train_loss": -26.2512264251709, "global_step": 341614, "epoch": 4115} {"train_loss": -26.071334838867188, "global_step": 341615, "epoch": 4115} {"train_loss": -26.076251983642578, "global_step": 341616, "epoch": 4115} {"train_loss": -25.885730743408203, "global_step": 341617, "epoch": 4115} {"train_loss": -26.272130966186523, "global_step": 341618, "epoch": 4115} {"train_loss": -26.23390769958496, "global_step": 341619, "epoch": 4115} {"train_loss": -26.28472900390625, "global_step": 341620, "epoch": 4115} {"train_loss": -26.35589599609375, "global_step": 341621, "epoch": 4115} {"train_loss": -26.0064754486084, "global_step": 341622, "epoch": 4115} {"train_loss": -26.20575523376465, "global_step": 341623, "epoch": 4115} {"train_loss": -26.296594619750977, "global_step": 341624, "epoch": 4115} {"train_loss": -26.0034236907959, "global_step": 341625, "epoch": 4115} {"train_loss": -26.28736686706543, "global_step": 341626, "epoch": 4115} {"train_loss": -26.017149752881153, "global_step": 341627, "epoch": 4115, "val_loss": 6564296.0} {"train_loss": -25.27019500732422, "global_step": 341628, "epoch": 4116} {"train_loss": -24.884521484375, "global_step": 341629, "epoch": 4116} {"train_loss": -25.349546432495117, "global_step": 341630, "epoch": 4116} {"train_loss": -24.87507438659668, "global_step": 341631, "epoch": 4116} {"train_loss": -25.39521598815918, "global_step": 341632, "epoch": 4116} {"train_loss": -25.548749923706055, "global_step": 341633, "epoch": 4116} {"train_loss": -25.306203842163086, "global_step": 341634, "epoch": 4116} {"train_loss": -25.23432159423828, "global_step": 341635, "epoch": 4116} {"train_loss": -25.825464248657227, "global_step": 341636, "epoch": 4116} {"train_loss": -25.74664306640625, "global_step": 341637, "epoch": 4116} {"train_loss": -25.288192749023438, "global_step": 341638, "epoch": 4116} {"train_loss": -25.882675170898438, "global_step": 341639, "epoch": 4116} {"train_loss": -25.21200942993164, "global_step": 341640, "epoch": 4116} {"train_loss": -25.868200302124023, "global_step": 341641, "epoch": 4116} {"train_loss": -25.645872116088867, "global_step": 341642, "epoch": 4116} {"train_loss": -25.444730758666992, "global_step": 341643, "epoch": 4116} {"train_loss": -25.582853317260742, "global_step": 341644, "epoch": 4116} {"train_loss": -26.07875633239746, "global_step": 341645, "epoch": 4116} {"train_loss": -25.726409912109375, "global_step": 341646, "epoch": 4116} {"train_loss": -25.832733154296875, "global_step": 341647, "epoch": 4116} {"train_loss": -26.08210563659668, "global_step": 341648, "epoch": 4116} {"train_loss": -25.821996688842773, "global_step": 341649, "epoch": 4116} {"train_loss": -26.235742568969727, "global_step": 341650, "epoch": 4116} {"train_loss": -25.845413208007812, "global_step": 341651, "epoch": 4116} {"train_loss": -25.967748641967773, "global_step": 341652, "epoch": 4116} {"train_loss": -26.10469627380371, "global_step": 341653, "epoch": 4116} {"train_loss": -26.165332794189453, "global_step": 341654, "epoch": 4116} {"train_loss": -26.138891220092773, "global_step": 341655, "epoch": 4116} {"train_loss": -26.1300048828125, "global_step": 341656, "epoch": 4116} {"train_loss": -26.105609893798828, "global_step": 341657, "epoch": 4116} {"train_loss": -25.978534698486328, "global_step": 341658, "epoch": 4116} {"train_loss": -25.73366355895996, "global_step": 341659, "epoch": 4116} {"train_loss": -25.816364288330078, "global_step": 341660, "epoch": 4116} {"train_loss": -25.960376739501953, "global_step": 341661, "epoch": 4116} {"train_loss": -25.813154220581055, "global_step": 341662, "epoch": 4116} {"train_loss": -26.035053253173828, "global_step": 341663, "epoch": 4116} {"train_loss": -26.293182373046875, "global_step": 341664, "epoch": 4116} {"train_loss": -26.13221549987793, "global_step": 341665, "epoch": 4116} {"train_loss": -26.271503448486328, "global_step": 341666, "epoch": 4116} {"train_loss": -26.1181640625, "global_step": 341667, "epoch": 4116} {"train_loss": -26.39362144470215, "global_step": 341668, "epoch": 4116} {"train_loss": -26.036792755126953, "global_step": 341669, "epoch": 4116} {"train_loss": -26.048999786376953, "global_step": 341670, "epoch": 4116} {"train_loss": -25.959609985351562, "global_step": 341671, "epoch": 4116} {"train_loss": -25.97687339782715, "global_step": 341672, "epoch": 4116} {"train_loss": -26.376556396484375, "global_step": 341673, "epoch": 4116} {"train_loss": -25.677642822265625, "global_step": 341674, "epoch": 4116} {"train_loss": -26.191495895385742, "global_step": 341675, "epoch": 4116} {"train_loss": -25.763525009155273, "global_step": 341676, "epoch": 4116} {"train_loss": -25.903661727905273, "global_step": 341677, "epoch": 4116} {"train_loss": -26.10153579711914, "global_step": 341678, "epoch": 4116} {"train_loss": -26.254928588867188, "global_step": 341679, "epoch": 4116} {"train_loss": -26.020816802978516, "global_step": 341680, "epoch": 4116} {"train_loss": -26.13893699645996, "global_step": 341681, "epoch": 4116} {"train_loss": -26.407114028930664, "global_step": 341682, "epoch": 4116} {"train_loss": -25.959497451782227, "global_step": 341683, "epoch": 4116} {"train_loss": -25.934833526611328, "global_step": 341684, "epoch": 4116} {"train_loss": -26.04901695251465, "global_step": 341685, "epoch": 4116} {"train_loss": -25.810895919799805, "global_step": 341686, "epoch": 4116} {"train_loss": -26.196523666381836, "global_step": 341687, "epoch": 4116} {"train_loss": -25.98988151550293, "global_step": 341688, "epoch": 4116} {"train_loss": -25.784582138061523, "global_step": 341689, "epoch": 4116} {"train_loss": -25.737089157104492, "global_step": 341690, "epoch": 4116} {"train_loss": -25.7259578704834, "global_step": 341691, "epoch": 4116} {"train_loss": -25.914560317993164, "global_step": 341692, "epoch": 4116} {"train_loss": -26.217838287353516, "global_step": 341693, "epoch": 4116} {"train_loss": -26.08228874206543, "global_step": 341694, "epoch": 4116} {"train_loss": -26.172998428344727, "global_step": 341695, "epoch": 4116} {"train_loss": -25.66798210144043, "global_step": 341696, "epoch": 4116} {"train_loss": -25.715539932250977, "global_step": 341697, "epoch": 4116} {"train_loss": -25.949085235595703, "global_step": 341698, "epoch": 4116} {"train_loss": -25.655975341796875, "global_step": 341699, "epoch": 4116} {"train_loss": -25.910627365112305, "global_step": 341700, "epoch": 4116} {"train_loss": -26.04524803161621, "global_step": 341701, "epoch": 4116} {"train_loss": -25.931249618530273, "global_step": 341702, "epoch": 4116} {"train_loss": -26.20343017578125, "global_step": 341703, "epoch": 4116} {"train_loss": -26.21662712097168, "global_step": 341704, "epoch": 4116} {"train_loss": -26.046239852905273, "global_step": 341705, "epoch": 4116} {"train_loss": -25.897403717041016, "global_step": 341706, "epoch": 4116} {"train_loss": -26.149341583251953, "global_step": 341707, "epoch": 4116} {"train_loss": -26.13681983947754, "global_step": 341708, "epoch": 4116} {"train_loss": -26.38522720336914, "global_step": 341709, "epoch": 4116} {"train_loss": -25.88321527228298, "global_step": 341710, "epoch": 4116, "val_loss": 6581898.0} {"train_loss": -25.71148109436035, "global_step": 341711, "epoch": 4117} {"train_loss": -25.72016716003418, "global_step": 341712, "epoch": 4117} {"train_loss": -25.61848258972168, "global_step": 341713, "epoch": 4117} {"train_loss": -25.77142333984375, "global_step": 341714, "epoch": 4117} {"train_loss": -26.1270694732666, "global_step": 341715, "epoch": 4117} {"train_loss": -25.623167037963867, "global_step": 341716, "epoch": 4117} {"train_loss": -26.2182674407959, "global_step": 341717, "epoch": 4117} {"train_loss": -26.15488624572754, "global_step": 341718, "epoch": 4117} {"train_loss": -26.275146484375, "global_step": 341719, "epoch": 4117} {"train_loss": -25.813032150268555, "global_step": 341720, "epoch": 4117} {"train_loss": -25.774402618408203, "global_step": 341721, "epoch": 4117} {"train_loss": -25.502685546875, "global_step": 341722, "epoch": 4117} {"train_loss": -26.312652587890625, "global_step": 341723, "epoch": 4117} {"train_loss": -25.87213134765625, "global_step": 341724, "epoch": 4117} {"train_loss": -26.028762817382812, "global_step": 341725, "epoch": 4117} {"train_loss": -25.920093536376953, "global_step": 341726, "epoch": 4117} {"train_loss": -26.036096572875977, "global_step": 341727, "epoch": 4117} {"train_loss": -25.96685218811035, "global_step": 341728, "epoch": 4117} {"train_loss": -26.10919761657715, "global_step": 341729, "epoch": 4117} {"train_loss": -26.051706314086914, "global_step": 341730, "epoch": 4117} {"train_loss": -26.119831085205078, "global_step": 341731, "epoch": 4117} {"train_loss": -26.106332778930664, "global_step": 341732, "epoch": 4117} {"train_loss": -26.160888671875, "global_step": 341733, "epoch": 4117} {"train_loss": -26.29694175720215, "global_step": 341734, "epoch": 4117} {"train_loss": -26.162185668945312, "global_step": 341735, "epoch": 4117} {"train_loss": -26.455184936523438, "global_step": 341736, "epoch": 4117} {"train_loss": -26.0029296875, "global_step": 341737, "epoch": 4117} {"train_loss": -26.059528350830078, "global_step": 341738, "epoch": 4117} {"train_loss": -25.955657958984375, "global_step": 341739, "epoch": 4117} {"train_loss": -26.064987182617188, "global_step": 341740, "epoch": 4117} {"train_loss": -26.337499618530273, "global_step": 341741, "epoch": 4117} {"train_loss": -26.68084144592285, "global_step": 341742, "epoch": 4117} {"train_loss": -26.45806312561035, "global_step": 341743, "epoch": 4117} {"train_loss": -25.963764190673828, "global_step": 341744, "epoch": 4117} {"train_loss": -25.935415267944336, "global_step": 341745, "epoch": 4117} {"train_loss": -25.22602653503418, "global_step": 341746, "epoch": 4117} {"train_loss": -25.136865615844727, "global_step": 341747, "epoch": 4117} {"train_loss": -25.593494415283203, "global_step": 341748, "epoch": 4117} {"train_loss": -25.9904727935791, "global_step": 341749, "epoch": 4117} {"train_loss": -26.4705810546875, "global_step": 341750, "epoch": 4117} {"train_loss": -25.697589874267578, "global_step": 341751, "epoch": 4117} {"train_loss": -25.929061889648438, "global_step": 341752, "epoch": 4117} {"train_loss": -25.904478073120117, "global_step": 341753, "epoch": 4117} {"train_loss": -26.334577560424805, "global_step": 341754, "epoch": 4117} {"train_loss": -25.858524322509766, "global_step": 341755, "epoch": 4117} {"train_loss": -25.875608444213867, "global_step": 341756, "epoch": 4117} {"train_loss": -26.043188095092773, "global_step": 341757, "epoch": 4117} {"train_loss": -25.847009658813477, "global_step": 341758, "epoch": 4117} {"train_loss": -26.20664405822754, "global_step": 341759, "epoch": 4117} {"train_loss": -25.911365509033203, "global_step": 341760, "epoch": 4117} {"train_loss": -26.065214157104492, "global_step": 341761, "epoch": 4117} {"train_loss": -25.960500717163086, "global_step": 341762, "epoch": 4117} {"train_loss": -26.15771484375, "global_step": 341763, "epoch": 4117} {"train_loss": -26.214574813842773, "global_step": 341764, "epoch": 4117} {"train_loss": -25.849740982055664, "global_step": 341765, "epoch": 4117} {"train_loss": -26.11553382873535, "global_step": 341766, "epoch": 4117} {"train_loss": -26.44111442565918, "global_step": 341767, "epoch": 4117} {"train_loss": -26.110187530517578, "global_step": 341768, "epoch": 4117} {"train_loss": -26.3519344329834, "global_step": 341769, "epoch": 4117} {"train_loss": -25.80911636352539, "global_step": 341770, "epoch": 4117} {"train_loss": -26.320526123046875, "global_step": 341771, "epoch": 4117} {"train_loss": -25.90308952331543, "global_step": 341772, "epoch": 4117} {"train_loss": -25.99212074279785, "global_step": 341773, "epoch": 4117} {"train_loss": -26.01227378845215, "global_step": 341774, "epoch": 4117} {"train_loss": -25.645177841186523, "global_step": 341775, "epoch": 4117} {"train_loss": -25.590848922729492, "global_step": 341776, "epoch": 4117} {"train_loss": -25.806838989257812, "global_step": 341777, "epoch": 4117} {"train_loss": -26.221677780151367, "global_step": 341778, "epoch": 4117} {"train_loss": -25.99668312072754, "global_step": 341779, "epoch": 4117} {"train_loss": -25.320592880249023, "global_step": 341780, "epoch": 4117} {"train_loss": -26.165775299072266, "global_step": 341781, "epoch": 4117} {"train_loss": -25.795766830444336, "global_step": 341782, "epoch": 4117} {"train_loss": -25.770050048828125, "global_step": 341783, "epoch": 4117} {"train_loss": -25.957096099853516, "global_step": 341784, "epoch": 4117} {"train_loss": -26.0098876953125, "global_step": 341785, "epoch": 4117} {"train_loss": -26.13311767578125, "global_step": 341786, "epoch": 4117} {"train_loss": -25.793607711791992, "global_step": 341787, "epoch": 4117} {"train_loss": -26.005224227905273, "global_step": 341788, "epoch": 4117} {"train_loss": -26.07733154296875, "global_step": 341789, "epoch": 4117} {"train_loss": -25.924224853515625, "global_step": 341790, "epoch": 4117} {"train_loss": -26.3602352142334, "global_step": 341791, "epoch": 4117} {"train_loss": -26.2486629486084, "global_step": 341792, "epoch": 4117} {"train_loss": -25.97873752088432, "global_step": 341793, "epoch": 4117, "val_loss": 6632665.0} {"train_loss": -25.414905548095703, "global_step": 341794, "epoch": 4118} {"train_loss": -25.56971549987793, "global_step": 341795, "epoch": 4118} {"train_loss": -24.847885131835938, "global_step": 341796, "epoch": 4118} {"train_loss": -25.55207633972168, "global_step": 341797, "epoch": 4118} {"train_loss": -25.0620174407959, "global_step": 341798, "epoch": 4118} {"train_loss": -25.520055770874023, "global_step": 341799, "epoch": 4118} {"train_loss": -25.159902572631836, "global_step": 341800, "epoch": 4118} {"train_loss": -25.9925537109375, "global_step": 341801, "epoch": 4118} {"train_loss": -25.591489791870117, "global_step": 341802, "epoch": 4118} {"train_loss": -25.45695686340332, "global_step": 341803, "epoch": 4118} {"train_loss": -25.67563247680664, "global_step": 341804, "epoch": 4118} {"train_loss": -25.191255569458008, "global_step": 341805, "epoch": 4118} {"train_loss": -25.687713623046875, "global_step": 341806, "epoch": 4118} {"train_loss": -25.40939712524414, "global_step": 341807, "epoch": 4118} {"train_loss": -26.006879806518555, "global_step": 341808, "epoch": 4118} {"train_loss": -25.60999870300293, "global_step": 341809, "epoch": 4118} {"train_loss": -25.55204963684082, "global_step": 341810, "epoch": 4118} {"train_loss": -25.68259620666504, "global_step": 341811, "epoch": 4118} {"train_loss": -25.4981689453125, "global_step": 341812, "epoch": 4118} {"train_loss": -25.628192901611328, "global_step": 341813, "epoch": 4118} {"train_loss": -26.093469619750977, "global_step": 341814, "epoch": 4118} {"train_loss": -26.075931549072266, "global_step": 341815, "epoch": 4118} {"train_loss": -25.608325958251953, "global_step": 341816, "epoch": 4118} {"train_loss": -25.871885299682617, "global_step": 341817, "epoch": 4118} {"train_loss": -25.77522850036621, "global_step": 341818, "epoch": 4118} {"train_loss": -25.987720489501953, "global_step": 341819, "epoch": 4118} {"train_loss": -26.050018310546875, "global_step": 341820, "epoch": 4118} {"train_loss": -26.033554077148438, "global_step": 341821, "epoch": 4118} {"train_loss": -26.27667236328125, "global_step": 341822, "epoch": 4118} {"train_loss": -26.138080596923828, "global_step": 341823, "epoch": 4118} {"train_loss": -26.03106117248535, "global_step": 341824, "epoch": 4118} {"train_loss": -26.004241943359375, "global_step": 341825, "epoch": 4118} {"train_loss": -26.180627822875977, "global_step": 341826, "epoch": 4118} {"train_loss": -26.0881290435791, "global_step": 341827, "epoch": 4118} {"train_loss": -25.8279972076416, "global_step": 341828, "epoch": 4118} {"train_loss": -26.21625328063965, "global_step": 341829, "epoch": 4118} {"train_loss": -26.092742919921875, "global_step": 341830, "epoch": 4118} {"train_loss": -26.20108985900879, "global_step": 341831, "epoch": 4118} {"train_loss": -26.199491500854492, "global_step": 341832, "epoch": 4118} {"train_loss": -25.733978271484375, "global_step": 341833, "epoch": 4118} {"train_loss": -26.079694747924805, "global_step": 341834, "epoch": 4118} {"train_loss": -26.343358993530273, "global_step": 341835, "epoch": 4118} {"train_loss": -26.127805709838867, "global_step": 341836, "epoch": 4118} {"train_loss": -26.541980743408203, "global_step": 341837, "epoch": 4118} {"train_loss": -26.36785316467285, "global_step": 341838, "epoch": 4118} {"train_loss": -26.41802978515625, "global_step": 341839, "epoch": 4118} {"train_loss": -26.2489013671875, "global_step": 341840, "epoch": 4118} {"train_loss": -26.23310661315918, "global_step": 341841, "epoch": 4118} {"train_loss": -26.06764030456543, "global_step": 341842, "epoch": 4118} {"train_loss": -26.23334312438965, "global_step": 341843, "epoch": 4118} {"train_loss": -26.21143913269043, "global_step": 341844, "epoch": 4118} {"train_loss": -26.351215362548828, "global_step": 341845, "epoch": 4118} {"train_loss": -26.261280059814453, "global_step": 341846, "epoch": 4118} {"train_loss": -26.058454513549805, "global_step": 341847, "epoch": 4118} {"train_loss": -26.098926544189453, "global_step": 341848, "epoch": 4118} {"train_loss": -26.002826690673828, "global_step": 341849, "epoch": 4118} {"train_loss": -25.954954147338867, "global_step": 341850, "epoch": 4118} {"train_loss": -25.864669799804688, "global_step": 341851, "epoch": 4118} {"train_loss": -24.884733200073242, "global_step": 341852, "epoch": 4118} {"train_loss": -24.020313262939453, "global_step": 341853, "epoch": 4118} {"train_loss": -25.513723373413086, "global_step": 341854, "epoch": 4118} {"train_loss": -25.687244415283203, "global_step": 341855, "epoch": 4118} {"train_loss": -25.29647445678711, "global_step": 341856, "epoch": 4118} {"train_loss": -25.895618438720703, "global_step": 341857, "epoch": 4118} {"train_loss": -25.586843490600586, "global_step": 341858, "epoch": 4118} {"train_loss": -25.79693031311035, "global_step": 341859, "epoch": 4118} {"train_loss": -25.671335220336914, "global_step": 341860, "epoch": 4118} {"train_loss": -25.787118911743164, "global_step": 341861, "epoch": 4118} {"train_loss": -25.68709373474121, "global_step": 341862, "epoch": 4118} {"train_loss": -25.78192710876465, "global_step": 341863, "epoch": 4118} {"train_loss": -25.856674194335938, "global_step": 341864, "epoch": 4118} {"train_loss": -25.987943649291992, "global_step": 341865, "epoch": 4118} {"train_loss": -25.78753662109375, "global_step": 341866, "epoch": 4118} {"train_loss": -25.821882247924805, "global_step": 341867, "epoch": 4118} {"train_loss": -26.01869010925293, "global_step": 341868, "epoch": 4118} {"train_loss": -26.086191177368164, "global_step": 341869, "epoch": 4118} {"train_loss": -25.80303955078125, "global_step": 341870, "epoch": 4118} {"train_loss": -26.035354614257812, "global_step": 341871, "epoch": 4118} {"train_loss": -26.083173751831055, "global_step": 341872, "epoch": 4118} {"train_loss": -25.731430053710938, "global_step": 341873, "epoch": 4118} {"train_loss": -26.102121353149414, "global_step": 341874, "epoch": 4118} {"train_loss": -25.75090980529785, "global_step": 341875, "epoch": 4118} {"train_loss": -25.843496759253814, "global_step": 341876, "epoch": 4118, "val_loss": 6580383.0} {"train_loss": -24.84426498413086, "global_step": 341877, "epoch": 4119} {"train_loss": -24.91064453125, "global_step": 341878, "epoch": 4119} {"train_loss": -25.090904235839844, "global_step": 341879, "epoch": 4119} {"train_loss": -25.255756378173828, "global_step": 341880, "epoch": 4119} {"train_loss": -25.010053634643555, "global_step": 341881, "epoch": 4119} {"train_loss": -25.710968017578125, "global_step": 341882, "epoch": 4119} {"train_loss": -25.758142471313477, "global_step": 341883, "epoch": 4119} {"train_loss": -25.386669158935547, "global_step": 341884, "epoch": 4119} {"train_loss": -25.539823532104492, "global_step": 341885, "epoch": 4119} {"train_loss": -25.734846115112305, "global_step": 341886, "epoch": 4119} {"train_loss": -25.48520851135254, "global_step": 341887, "epoch": 4119} {"train_loss": -25.23933219909668, "global_step": 341888, "epoch": 4119} {"train_loss": -26.02373695373535, "global_step": 341889, "epoch": 4119} {"train_loss": -25.592069625854492, "global_step": 341890, "epoch": 4119} {"train_loss": -25.85150718688965, "global_step": 341891, "epoch": 4119} {"train_loss": -25.529481887817383, "global_step": 341892, "epoch": 4119} {"train_loss": -25.804920196533203, "global_step": 341893, "epoch": 4119} {"train_loss": -25.991519927978516, "global_step": 341894, "epoch": 4119} {"train_loss": -25.751184463500977, "global_step": 341895, "epoch": 4119} {"train_loss": -25.98200798034668, "global_step": 341896, "epoch": 4119} {"train_loss": -25.88848876953125, "global_step": 341897, "epoch": 4119} {"train_loss": -25.77949333190918, "global_step": 341898, "epoch": 4119} {"train_loss": -26.11480712890625, "global_step": 341899, "epoch": 4119} {"train_loss": -26.145923614501953, "global_step": 341900, "epoch": 4119} {"train_loss": -26.304473876953125, "global_step": 341901, "epoch": 4119} {"train_loss": -26.1285457611084, "global_step": 341902, "epoch": 4119} {"train_loss": -25.766324996948242, "global_step": 341903, "epoch": 4119} {"train_loss": -26.121274948120117, "global_step": 341904, "epoch": 4119} {"train_loss": -26.125837326049805, "global_step": 341905, "epoch": 4119} {"train_loss": -25.9788818359375, "global_step": 341906, "epoch": 4119} {"train_loss": -25.9450626373291, "global_step": 341907, "epoch": 4119} {"train_loss": -26.16672706604004, "global_step": 341908, "epoch": 4119} {"train_loss": -25.8721923828125, "global_step": 341909, "epoch": 4119} {"train_loss": -26.4681453704834, "global_step": 341910, "epoch": 4119} {"train_loss": -26.226470947265625, "global_step": 341911, "epoch": 4119} {"train_loss": -25.813995361328125, "global_step": 341912, "epoch": 4119} {"train_loss": -26.087982177734375, "global_step": 341913, "epoch": 4119} {"train_loss": -26.150558471679688, "global_step": 341914, "epoch": 4119} {"train_loss": -25.809375762939453, "global_step": 341915, "epoch": 4119} {"train_loss": -26.1798152923584, "global_step": 341916, "epoch": 4119} {"train_loss": -26.39200782775879, "global_step": 341917, "epoch": 4119} {"train_loss": -26.003889083862305, "global_step": 341918, "epoch": 4119} {"train_loss": -26.21323013305664, "global_step": 341919, "epoch": 4119} {"train_loss": -26.44071388244629, "global_step": 341920, "epoch": 4119} {"train_loss": -26.195316314697266, "global_step": 341921, "epoch": 4119} {"train_loss": -25.820083618164062, "global_step": 341922, "epoch": 4119} {"train_loss": -26.5709228515625, "global_step": 341923, "epoch": 4119} {"train_loss": -26.06150245666504, "global_step": 341924, "epoch": 4119} {"train_loss": -26.431034088134766, "global_step": 341925, "epoch": 4119} {"train_loss": -25.985279083251953, "global_step": 341926, "epoch": 4119} {"train_loss": -26.14298439025879, "global_step": 341927, "epoch": 4119} {"train_loss": -26.548694610595703, "global_step": 341928, "epoch": 4119} {"train_loss": -26.260181427001953, "global_step": 341929, "epoch": 4119} {"train_loss": -26.288318634033203, "global_step": 341930, "epoch": 4119} {"train_loss": -26.02817153930664, "global_step": 341931, "epoch": 4119} {"train_loss": -26.210498809814453, "global_step": 341932, "epoch": 4119} {"train_loss": -26.374652862548828, "global_step": 341933, "epoch": 4119} {"train_loss": -26.416669845581055, "global_step": 341934, "epoch": 4119} {"train_loss": -26.246747970581055, "global_step": 341935, "epoch": 4119} {"train_loss": -26.439472198486328, "global_step": 341936, "epoch": 4119} {"train_loss": -26.641082763671875, "global_step": 341937, "epoch": 4119} {"train_loss": -26.017017364501953, "global_step": 341938, "epoch": 4119} {"train_loss": -26.44342041015625, "global_step": 341939, "epoch": 4119} {"train_loss": -26.264612197875977, "global_step": 341940, "epoch": 4119} {"train_loss": -26.179800033569336, "global_step": 341941, "epoch": 4119} {"train_loss": -26.08125114440918, "global_step": 341942, "epoch": 4119} {"train_loss": -26.28824806213379, "global_step": 341943, "epoch": 4119} {"train_loss": -25.891637802124023, "global_step": 341944, "epoch": 4119} {"train_loss": -25.92251968383789, "global_step": 341945, "epoch": 4119} {"train_loss": -25.732574462890625, "global_step": 341946, "epoch": 4119} {"train_loss": -26.252033233642578, "global_step": 341947, "epoch": 4119} {"train_loss": -25.99622917175293, "global_step": 341948, "epoch": 4119} {"train_loss": -26.090839385986328, "global_step": 341949, "epoch": 4119} {"train_loss": -26.103429794311523, "global_step": 341950, "epoch": 4119} {"train_loss": -25.992700576782227, "global_step": 341951, "epoch": 4119} {"train_loss": -26.210912704467773, "global_step": 341952, "epoch": 4119} {"train_loss": -26.093341827392578, "global_step": 341953, "epoch": 4119} {"train_loss": -26.204910278320312, "global_step": 341954, "epoch": 4119} {"train_loss": -26.43427848815918, "global_step": 341955, "epoch": 4119} {"train_loss": -26.09766960144043, "global_step": 341956, "epoch": 4119} {"train_loss": -26.289997100830078, "global_step": 341957, "epoch": 4119} {"train_loss": -26.23914909362793, "global_step": 341958, "epoch": 4119} {"train_loss": -25.992373569902167, "global_step": 341959, "epoch": 4119, "val_loss": 6600648.5} {"train_loss": -23.74068260192871, "global_step": 341960, "epoch": 4120} {"train_loss": -22.32281494140625, "global_step": 341961, "epoch": 4120} {"train_loss": -25.56257438659668, "global_step": 341962, "epoch": 4120} {"train_loss": -23.850502014160156, "global_step": 341963, "epoch": 4120} {"train_loss": -24.54416847229004, "global_step": 341964, "epoch": 4120} {"train_loss": -24.413022994995117, "global_step": 341965, "epoch": 4120} {"train_loss": -24.653797149658203, "global_step": 341966, "epoch": 4120} {"train_loss": -24.206592559814453, "global_step": 341967, "epoch": 4120} {"train_loss": -25.007596969604492, "global_step": 341968, "epoch": 4120} {"train_loss": -25.080018997192383, "global_step": 341969, "epoch": 4120} {"train_loss": -24.84644317626953, "global_step": 341970, "epoch": 4120} {"train_loss": -25.124841690063477, "global_step": 341971, "epoch": 4120} {"train_loss": -25.18062400817871, "global_step": 341972, "epoch": 4120} {"train_loss": -25.030317306518555, "global_step": 341973, "epoch": 4120} {"train_loss": -25.033615112304688, "global_step": 341974, "epoch": 4120} {"train_loss": -25.560688018798828, "global_step": 341975, "epoch": 4120} {"train_loss": -25.518686294555664, "global_step": 341976, "epoch": 4120} {"train_loss": -24.96857452392578, "global_step": 341977, "epoch": 4120} {"train_loss": -25.253610610961914, "global_step": 341978, "epoch": 4120} {"train_loss": -25.72537612915039, "global_step": 341979, "epoch": 4120} {"train_loss": -25.231164932250977, "global_step": 341980, "epoch": 4120} {"train_loss": -25.085723876953125, "global_step": 341981, "epoch": 4120} {"train_loss": -25.591506958007812, "global_step": 341982, "epoch": 4120} {"train_loss": -25.515066146850586, "global_step": 341983, "epoch": 4120} {"train_loss": -25.392324447631836, "global_step": 341984, "epoch": 4120} {"train_loss": -25.446870803833008, "global_step": 341985, "epoch": 4120} {"train_loss": -25.878000259399414, "global_step": 341986, "epoch": 4120} {"train_loss": -25.75508689880371, "global_step": 341987, "epoch": 4120} {"train_loss": -25.319665908813477, "global_step": 341988, "epoch": 4120} {"train_loss": -25.5325927734375, "global_step": 341989, "epoch": 4120} {"train_loss": -25.788782119750977, "global_step": 341990, "epoch": 4120} {"train_loss": -25.703460693359375, "global_step": 341991, "epoch": 4120} {"train_loss": -25.888004302978516, "global_step": 341992, "epoch": 4120} {"train_loss": -25.562463760375977, "global_step": 341993, "epoch": 4120} {"train_loss": -25.60614585876465, "global_step": 341994, "epoch": 4120} {"train_loss": -25.7899112701416, "global_step": 341995, "epoch": 4120} {"train_loss": -25.967294692993164, "global_step": 341996, "epoch": 4120} {"train_loss": -25.83210563659668, "global_step": 341997, "epoch": 4120} {"train_loss": -26.066513061523438, "global_step": 341998, "epoch": 4120} {"train_loss": -26.21343421936035, "global_step": 341999, "epoch": 4120} {"train_loss": -26.37062644958496, "global_step": 342000, "epoch": 4120} {"train_loss": -26.19037437438965, "global_step": 342001, "epoch": 4120} {"train_loss": -25.935394287109375, "global_step": 342002, "epoch": 4120} {"train_loss": -26.34665298461914, "global_step": 342003, "epoch": 4120} {"train_loss": -25.994464874267578, "global_step": 342004, "epoch": 4120} {"train_loss": -26.12509536743164, "global_step": 342005, "epoch": 4120} {"train_loss": -26.10308837890625, "global_step": 342006, "epoch": 4120} {"train_loss": -26.100940704345703, "global_step": 342007, "epoch": 4120} {"train_loss": -25.933795928955078, "global_step": 342008, "epoch": 4120} {"train_loss": -25.605005264282227, "global_step": 342009, "epoch": 4120} {"train_loss": -26.283613204956055, "global_step": 342010, "epoch": 4120} {"train_loss": -26.151031494140625, "global_step": 342011, "epoch": 4120} {"train_loss": -26.100568771362305, "global_step": 342012, "epoch": 4120} {"train_loss": -26.600839614868164, "global_step": 342013, "epoch": 4120} {"train_loss": -26.501428604125977, "global_step": 342014, "epoch": 4120} {"train_loss": -26.061227798461914, "global_step": 342015, "epoch": 4120} {"train_loss": -26.100055694580078, "global_step": 342016, "epoch": 4120} {"train_loss": -26.3626708984375, "global_step": 342017, "epoch": 4120} {"train_loss": -25.900732040405273, "global_step": 342018, "epoch": 4120} {"train_loss": -26.197509765625, "global_step": 342019, "epoch": 4120} {"train_loss": -26.21429443359375, "global_step": 342020, "epoch": 4120} {"train_loss": -26.0305118560791, "global_step": 342021, "epoch": 4120} {"train_loss": -26.25372886657715, "global_step": 342022, "epoch": 4120} {"train_loss": -26.22258949279785, "global_step": 342023, "epoch": 4120} {"train_loss": -26.325971603393555, "global_step": 342024, "epoch": 4120} {"train_loss": -25.87948989868164, "global_step": 342025, "epoch": 4120} {"train_loss": -26.145231246948242, "global_step": 342026, "epoch": 4120} {"train_loss": -25.94288444519043, "global_step": 342027, "epoch": 4120} {"train_loss": -26.12839126586914, "global_step": 342028, "epoch": 4120} {"train_loss": -26.02793312072754, "global_step": 342029, "epoch": 4120} {"train_loss": -26.08237648010254, "global_step": 342030, "epoch": 4120} {"train_loss": -25.940814971923828, "global_step": 342031, "epoch": 4120} {"train_loss": -26.374170303344727, "global_step": 342032, "epoch": 4120} {"train_loss": -26.308460235595703, "global_step": 342033, "epoch": 4120} {"train_loss": -26.478118896484375, "global_step": 342034, "epoch": 4120} {"train_loss": -26.247303009033203, "global_step": 342035, "epoch": 4120} {"train_loss": -26.303552627563477, "global_step": 342036, "epoch": 4120} {"train_loss": -26.227279663085938, "global_step": 342037, "epoch": 4120} {"train_loss": -26.201114654541016, "global_step": 342038, "epoch": 4120} {"train_loss": -26.086719512939453, "global_step": 342039, "epoch": 4120} {"train_loss": -26.0226993560791, "global_step": 342040, "epoch": 4120} {"train_loss": -26.111352920532227, "global_step": 342041, "epoch": 4120} {"train_loss": -25.702445271503496, "global_step": 342042, "epoch": 4120, "val_loss": 6563597.0} {"train_loss": -25.118139266967773, "global_step": 342043, "epoch": 4121} {"train_loss": -25.15754508972168, "global_step": 342044, "epoch": 4121} {"train_loss": -25.296903610229492, "global_step": 342045, "epoch": 4121} {"train_loss": -25.068973541259766, "global_step": 342046, "epoch": 4121} {"train_loss": -25.341093063354492, "global_step": 342047, "epoch": 4121} {"train_loss": -25.884241104125977, "global_step": 342048, "epoch": 4121} {"train_loss": -25.73615074157715, "global_step": 342049, "epoch": 4121} {"train_loss": -25.604095458984375, "global_step": 342050, "epoch": 4121} {"train_loss": -25.586572647094727, "global_step": 342051, "epoch": 4121} {"train_loss": -26.0380916595459, "global_step": 342052, "epoch": 4121} {"train_loss": -26.130847930908203, "global_step": 342053, "epoch": 4121} {"train_loss": -25.691043853759766, "global_step": 342054, "epoch": 4121} {"train_loss": -26.003843307495117, "global_step": 342055, "epoch": 4121} {"train_loss": -25.38907814025879, "global_step": 342056, "epoch": 4121} {"train_loss": -25.66615867614746, "global_step": 342057, "epoch": 4121} {"train_loss": -25.343252182006836, "global_step": 342058, "epoch": 4121} {"train_loss": -25.807165145874023, "global_step": 342059, "epoch": 4121} {"train_loss": -25.718280792236328, "global_step": 342060, "epoch": 4121} {"train_loss": -25.8533878326416, "global_step": 342061, "epoch": 4121} {"train_loss": -26.050399780273438, "global_step": 342062, "epoch": 4121} {"train_loss": -25.38446617126465, "global_step": 342063, "epoch": 4121} {"train_loss": -26.067331314086914, "global_step": 342064, "epoch": 4121} {"train_loss": -25.772878646850586, "global_step": 342065, "epoch": 4121} {"train_loss": -26.002317428588867, "global_step": 342066, "epoch": 4121} {"train_loss": -25.60651206970215, "global_step": 342067, "epoch": 4121} {"train_loss": -26.096546173095703, "global_step": 342068, "epoch": 4121} {"train_loss": -26.027231216430664, "global_step": 342069, "epoch": 4121} {"train_loss": -25.632246017456055, "global_step": 342070, "epoch": 4121} {"train_loss": -25.805835723876953, "global_step": 342071, "epoch": 4121} {"train_loss": -26.15496253967285, "global_step": 342072, "epoch": 4121} {"train_loss": -26.199018478393555, "global_step": 342073, "epoch": 4121} {"train_loss": -26.218963623046875, "global_step": 342074, "epoch": 4121} {"train_loss": -26.0006046295166, "global_step": 342075, "epoch": 4121} {"train_loss": -26.081501007080078, "global_step": 342076, "epoch": 4121} {"train_loss": -26.195356369018555, "global_step": 342077, "epoch": 4121} {"train_loss": -26.043542861938477, "global_step": 342078, "epoch": 4121} {"train_loss": -26.046045303344727, "global_step": 342079, "epoch": 4121} {"train_loss": -26.124738693237305, "global_step": 342080, "epoch": 4121} {"train_loss": -25.562673568725586, "global_step": 342081, "epoch": 4121} {"train_loss": -26.190465927124023, "global_step": 342082, "epoch": 4121} {"train_loss": -26.368030548095703, "global_step": 342083, "epoch": 4121} {"train_loss": -25.943700790405273, "global_step": 342084, "epoch": 4121} {"train_loss": -25.91852378845215, "global_step": 342085, "epoch": 4121} {"train_loss": -26.150182723999023, "global_step": 342086, "epoch": 4121} {"train_loss": -26.128820419311523, "global_step": 342087, "epoch": 4121} {"train_loss": -26.018991470336914, "global_step": 342088, "epoch": 4121} {"train_loss": -26.096622467041016, "global_step": 342089, "epoch": 4121} {"train_loss": -26.390960693359375, "global_step": 342090, "epoch": 4121} {"train_loss": -26.491943359375, "global_step": 342091, "epoch": 4121} {"train_loss": -26.3011474609375, "global_step": 342092, "epoch": 4121} {"train_loss": -26.312788009643555, "global_step": 342093, "epoch": 4121} {"train_loss": -26.4685115814209, "global_step": 342094, "epoch": 4121} {"train_loss": -26.158971786499023, "global_step": 342095, "epoch": 4121} {"train_loss": -26.477643966674805, "global_step": 342096, "epoch": 4121} {"train_loss": -26.03717613220215, "global_step": 342097, "epoch": 4121} {"train_loss": -26.043241500854492, "global_step": 342098, "epoch": 4121} {"train_loss": -26.13984489440918, "global_step": 342099, "epoch": 4121} {"train_loss": -26.137243270874023, "global_step": 342100, "epoch": 4121} {"train_loss": -26.444849014282227, "global_step": 342101, "epoch": 4121} {"train_loss": -26.104154586791992, "global_step": 342102, "epoch": 4121} {"train_loss": -25.453962326049805, "global_step": 342103, "epoch": 4121} {"train_loss": -25.88041114807129, "global_step": 342104, "epoch": 4121} {"train_loss": -25.502328872680664, "global_step": 342105, "epoch": 4121} {"train_loss": -25.890701293945312, "global_step": 342106, "epoch": 4121} {"train_loss": -25.824132919311523, "global_step": 342107, "epoch": 4121} {"train_loss": -25.704517364501953, "global_step": 342108, "epoch": 4121} {"train_loss": -25.913593292236328, "global_step": 342109, "epoch": 4121} {"train_loss": -25.853620529174805, "global_step": 342110, "epoch": 4121} {"train_loss": -25.695154190063477, "global_step": 342111, "epoch": 4121} {"train_loss": -25.883359909057617, "global_step": 342112, "epoch": 4121} {"train_loss": -25.8184814453125, "global_step": 342113, "epoch": 4121} {"train_loss": -26.22283363342285, "global_step": 342114, "epoch": 4121} {"train_loss": -25.850072860717773, "global_step": 342115, "epoch": 4121} {"train_loss": -25.920639038085938, "global_step": 342116, "epoch": 4121} {"train_loss": -26.07147789001465, "global_step": 342117, "epoch": 4121} {"train_loss": -25.89154624938965, "global_step": 342118, "epoch": 4121} {"train_loss": -26.233564376831055, "global_step": 342119, "epoch": 4121} {"train_loss": -25.9427547454834, "global_step": 342120, "epoch": 4121} {"train_loss": -26.040267944335938, "global_step": 342121, "epoch": 4121} {"train_loss": -26.221227645874023, "global_step": 342122, "epoch": 4121} {"train_loss": -25.623809814453125, "global_step": 342123, "epoch": 4121} {"train_loss": -25.830183029174805, "global_step": 342124, "epoch": 4121} {"train_loss": -25.92579747395343, "global_step": 342125, "epoch": 4121, "val_loss": 6579997.5} {"train_loss": -25.52704429626465, "global_step": 342126, "epoch": 4122} {"train_loss": -25.743661880493164, "global_step": 342127, "epoch": 4122} {"train_loss": -26.167633056640625, "global_step": 342128, "epoch": 4122} {"train_loss": -24.999441146850586, "global_step": 342129, "epoch": 4122} {"train_loss": -25.074039459228516, "global_step": 342130, "epoch": 4122} {"train_loss": -26.01832389831543, "global_step": 342131, "epoch": 4122} {"train_loss": -25.51495933532715, "global_step": 342132, "epoch": 4122} {"train_loss": -25.631702423095703, "global_step": 342133, "epoch": 4122} {"train_loss": -26.01443862915039, "global_step": 342134, "epoch": 4122} {"train_loss": -25.706714630126953, "global_step": 342135, "epoch": 4122} {"train_loss": -26.0051212310791, "global_step": 342136, "epoch": 4122} {"train_loss": -25.838781356811523, "global_step": 342137, "epoch": 4122} {"train_loss": -26.014142990112305, "global_step": 342138, "epoch": 4122} {"train_loss": -26.4176025390625, "global_step": 342139, "epoch": 4122} {"train_loss": -26.069665908813477, "global_step": 342140, "epoch": 4122} {"train_loss": -25.9935359954834, "global_step": 342141, "epoch": 4122} {"train_loss": -25.917724609375, "global_step": 342142, "epoch": 4122} {"train_loss": -25.921064376831055, "global_step": 342143, "epoch": 4122} {"train_loss": -25.93841552734375, "global_step": 342144, "epoch": 4122} {"train_loss": -25.918554306030273, "global_step": 342145, "epoch": 4122} {"train_loss": -25.828388214111328, "global_step": 342146, "epoch": 4122} {"train_loss": -26.01593589782715, "global_step": 342147, "epoch": 4122} {"train_loss": -25.72528076171875, "global_step": 342148, "epoch": 4122} {"train_loss": -25.968854904174805, "global_step": 342149, "epoch": 4122} {"train_loss": -25.7387752532959, "global_step": 342150, "epoch": 4122} {"train_loss": -26.20613670349121, "global_step": 342151, "epoch": 4122} {"train_loss": -26.38575553894043, "global_step": 342152, "epoch": 4122} {"train_loss": -25.551864624023438, "global_step": 342153, "epoch": 4122} {"train_loss": -26.060400009155273, "global_step": 342154, "epoch": 4122} {"train_loss": -26.36652946472168, "global_step": 342155, "epoch": 4122} {"train_loss": -26.107166290283203, "global_step": 342156, "epoch": 4122} {"train_loss": -25.998889923095703, "global_step": 342157, "epoch": 4122} {"train_loss": -26.144439697265625, "global_step": 342158, "epoch": 4122} {"train_loss": -25.807830810546875, "global_step": 342159, "epoch": 4122} {"train_loss": -26.252765655517578, "global_step": 342160, "epoch": 4122} {"train_loss": -25.9434871673584, "global_step": 342161, "epoch": 4122} {"train_loss": -25.999597549438477, "global_step": 342162, "epoch": 4122} {"train_loss": -26.098783493041992, "global_step": 342163, "epoch": 4122} {"train_loss": -26.234298706054688, "global_step": 342164, "epoch": 4122} {"train_loss": -25.973363876342773, "global_step": 342165, "epoch": 4122} {"train_loss": -25.9969482421875, "global_step": 342166, "epoch": 4122} {"train_loss": -26.0814208984375, "global_step": 342167, "epoch": 4122} {"train_loss": -26.174774169921875, "global_step": 342168, "epoch": 4122} {"train_loss": -25.902008056640625, "global_step": 342169, "epoch": 4122} {"train_loss": -26.08576011657715, "global_step": 342170, "epoch": 4122} {"train_loss": -26.003515243530273, "global_step": 342171, "epoch": 4122} {"train_loss": -26.112096786499023, "global_step": 342172, "epoch": 4122} {"train_loss": -26.08253288269043, "global_step": 342173, "epoch": 4122} {"train_loss": -25.707168579101562, "global_step": 342174, "epoch": 4122} {"train_loss": -26.41766929626465, "global_step": 342175, "epoch": 4122} {"train_loss": -25.85610008239746, "global_step": 342176, "epoch": 4122} {"train_loss": -25.69122886657715, "global_step": 342177, "epoch": 4122} {"train_loss": -25.6814022064209, "global_step": 342178, "epoch": 4122} {"train_loss": -25.820905685424805, "global_step": 342179, "epoch": 4122} {"train_loss": -26.426671981811523, "global_step": 342180, "epoch": 4122} {"train_loss": -26.061859130859375, "global_step": 342181, "epoch": 4122} {"train_loss": -26.287677764892578, "global_step": 342182, "epoch": 4122} {"train_loss": -25.991043090820312, "global_step": 342183, "epoch": 4122} {"train_loss": -26.11993408203125, "global_step": 342184, "epoch": 4122} {"train_loss": -26.0848331451416, "global_step": 342185, "epoch": 4122} {"train_loss": -26.060028076171875, "global_step": 342186, "epoch": 4122} {"train_loss": -26.263397216796875, "global_step": 342187, "epoch": 4122} {"train_loss": -26.239973068237305, "global_step": 342188, "epoch": 4122} {"train_loss": -26.181528091430664, "global_step": 342189, "epoch": 4122} {"train_loss": -26.200942993164062, "global_step": 342190, "epoch": 4122} {"train_loss": -26.179901123046875, "global_step": 342191, "epoch": 4122} {"train_loss": -26.21030616760254, "global_step": 342192, "epoch": 4122} {"train_loss": -26.28509521484375, "global_step": 342193, "epoch": 4122} {"train_loss": -26.316221237182617, "global_step": 342194, "epoch": 4122} {"train_loss": -26.257444381713867, "global_step": 342195, "epoch": 4122} {"train_loss": -26.37592887878418, "global_step": 342196, "epoch": 4122} {"train_loss": -26.42930030822754, "global_step": 342197, "epoch": 4122} {"train_loss": -26.5435848236084, "global_step": 342198, "epoch": 4122} {"train_loss": -25.832839965820312, "global_step": 342199, "epoch": 4122} {"train_loss": -26.5296688079834, "global_step": 342200, "epoch": 4122} {"train_loss": -25.968158721923828, "global_step": 342201, "epoch": 4122} {"train_loss": -26.473363876342773, "global_step": 342202, "epoch": 4122} {"train_loss": -26.413793563842773, "global_step": 342203, "epoch": 4122} {"train_loss": -26.11077880859375, "global_step": 342204, "epoch": 4122} {"train_loss": -26.1712589263916, "global_step": 342205, "epoch": 4122} {"train_loss": -26.604843139648438, "global_step": 342206, "epoch": 4122} {"train_loss": -26.5040283203125, "global_step": 342207, "epoch": 4122} {"train_loss": -26.056275517107494, "global_step": 342208, "epoch": 4122, "val_loss": 6638269.0} {"train_loss": -25.844858169555664, "global_step": 342209, "epoch": 4123} {"train_loss": -24.304380416870117, "global_step": 342210, "epoch": 4123} {"train_loss": -23.15192222595215, "global_step": 342211, "epoch": 4123} {"train_loss": -23.47672462463379, "global_step": 342212, "epoch": 4123} {"train_loss": -25.067270278930664, "global_step": 342213, "epoch": 4123} {"train_loss": -25.24616050720215, "global_step": 342214, "epoch": 4123} {"train_loss": -24.43768882751465, "global_step": 342215, "epoch": 4123} {"train_loss": -25.44200897216797, "global_step": 342216, "epoch": 4123} {"train_loss": -24.952878952026367, "global_step": 342217, "epoch": 4123} {"train_loss": -25.537321090698242, "global_step": 342218, "epoch": 4123} {"train_loss": -25.61420249938965, "global_step": 342219, "epoch": 4123} {"train_loss": -25.043785095214844, "global_step": 342220, "epoch": 4123} {"train_loss": -25.790998458862305, "global_step": 342221, "epoch": 4123} {"train_loss": -25.511329650878906, "global_step": 342222, "epoch": 4123} {"train_loss": -25.65997314453125, "global_step": 342223, "epoch": 4123} {"train_loss": -25.565704345703125, "global_step": 342224, "epoch": 4123} {"train_loss": -25.973154067993164, "global_step": 342225, "epoch": 4123} {"train_loss": -25.9551944732666, "global_step": 342226, "epoch": 4123} {"train_loss": -25.777389526367188, "global_step": 342227, "epoch": 4123} {"train_loss": -26.140470504760742, "global_step": 342228, "epoch": 4123} {"train_loss": -25.60174560546875, "global_step": 342229, "epoch": 4123} {"train_loss": -25.29867935180664, "global_step": 342230, "epoch": 4123} {"train_loss": -25.802448272705078, "global_step": 342231, "epoch": 4123} {"train_loss": -25.7208194732666, "global_step": 342232, "epoch": 4123} {"train_loss": -25.929712295532227, "global_step": 342233, "epoch": 4123} {"train_loss": -25.665136337280273, "global_step": 342234, "epoch": 4123} {"train_loss": -25.922866821289062, "global_step": 342235, "epoch": 4123} {"train_loss": -25.66534423828125, "global_step": 342236, "epoch": 4123} {"train_loss": -25.9533748626709, "global_step": 342237, "epoch": 4123} {"train_loss": -26.05842399597168, "global_step": 342238, "epoch": 4123} {"train_loss": -25.83074951171875, "global_step": 342239, "epoch": 4123} {"train_loss": -25.8492431640625, "global_step": 342240, "epoch": 4123} {"train_loss": -25.912561416625977, "global_step": 342241, "epoch": 4123} {"train_loss": -26.319005966186523, "global_step": 342242, "epoch": 4123} {"train_loss": -26.0074462890625, "global_step": 342243, "epoch": 4123} {"train_loss": -26.18524169921875, "global_step": 342244, "epoch": 4123} {"train_loss": -26.13825798034668, "global_step": 342245, "epoch": 4123} {"train_loss": -26.380834579467773, "global_step": 342246, "epoch": 4123} {"train_loss": -25.904224395751953, "global_step": 342247, "epoch": 4123} {"train_loss": -25.725427627563477, "global_step": 342248, "epoch": 4123} {"train_loss": -26.005477905273438, "global_step": 342249, "epoch": 4123} {"train_loss": -25.857458114624023, "global_step": 342250, "epoch": 4123} {"train_loss": -26.296857833862305, "global_step": 342251, "epoch": 4123} {"train_loss": -26.31450843811035, "global_step": 342252, "epoch": 4123} {"train_loss": -26.014921188354492, "global_step": 342253, "epoch": 4123} {"train_loss": -26.013792037963867, "global_step": 342254, "epoch": 4123} {"train_loss": -25.885961532592773, "global_step": 342255, "epoch": 4123} {"train_loss": -26.2965030670166, "global_step": 342256, "epoch": 4123} {"train_loss": -26.11836051940918, "global_step": 342257, "epoch": 4123} {"train_loss": -26.100513458251953, "global_step": 342258, "epoch": 4123} {"train_loss": -26.087833404541016, "global_step": 342259, "epoch": 4123} {"train_loss": -26.09205436706543, "global_step": 342260, "epoch": 4123} {"train_loss": -26.53131675720215, "global_step": 342261, "epoch": 4123} {"train_loss": -26.0380802154541, "global_step": 342262, "epoch": 4123} {"train_loss": -25.852563858032227, "global_step": 342263, "epoch": 4123} {"train_loss": -26.5994815826416, "global_step": 342264, "epoch": 4123} {"train_loss": -26.3087215423584, "global_step": 342265, "epoch": 4123} {"train_loss": -26.104154586791992, "global_step": 342266, "epoch": 4123} {"train_loss": -26.595319747924805, "global_step": 342267, "epoch": 4123} {"train_loss": -26.179651260375977, "global_step": 342268, "epoch": 4123} {"train_loss": -26.0280704498291, "global_step": 342269, "epoch": 4123} {"train_loss": -26.38075065612793, "global_step": 342270, "epoch": 4123} {"train_loss": -26.087263107299805, "global_step": 342271, "epoch": 4123} {"train_loss": -26.030059814453125, "global_step": 342272, "epoch": 4123} {"train_loss": -26.183090209960938, "global_step": 342273, "epoch": 4123} {"train_loss": -25.895721435546875, "global_step": 342274, "epoch": 4123} {"train_loss": -26.046228408813477, "global_step": 342275, "epoch": 4123} {"train_loss": -25.63264274597168, "global_step": 342276, "epoch": 4123} {"train_loss": -25.997100830078125, "global_step": 342277, "epoch": 4123} {"train_loss": -25.55686378479004, "global_step": 342278, "epoch": 4123} {"train_loss": -25.882673263549805, "global_step": 342279, "epoch": 4123} {"train_loss": -25.955718994140625, "global_step": 342280, "epoch": 4123} {"train_loss": -26.594043731689453, "global_step": 342281, "epoch": 4123} {"train_loss": -26.388181686401367, "global_step": 342282, "epoch": 4123} {"train_loss": -25.954944610595703, "global_step": 342283, "epoch": 4123} {"train_loss": -26.112735748291016, "global_step": 342284, "epoch": 4123} {"train_loss": -25.734161376953125, "global_step": 342285, "epoch": 4123} {"train_loss": -26.1486873626709, "global_step": 342286, "epoch": 4123} {"train_loss": -26.00282096862793, "global_step": 342287, "epoch": 4123} {"train_loss": -26.252365112304688, "global_step": 342288, "epoch": 4123} {"train_loss": -26.11323356628418, "global_step": 342289, "epoch": 4123} {"train_loss": -26.39015769958496, "global_step": 342290, "epoch": 4123} {"train_loss": -25.851911383939076, "global_step": 342291, "epoch": 4123, "val_loss": 6620891.0} {"train_loss": -25.729694366455078, "global_step": 342292, "epoch": 4124} {"train_loss": -25.632980346679688, "global_step": 342293, "epoch": 4124} {"train_loss": -25.580196380615234, "global_step": 342294, "epoch": 4124} {"train_loss": -25.88998794555664, "global_step": 342295, "epoch": 4124} {"train_loss": -25.98862075805664, "global_step": 342296, "epoch": 4124} {"train_loss": -25.977436065673828, "global_step": 342297, "epoch": 4124} {"train_loss": -26.151123046875, "global_step": 342298, "epoch": 4124} {"train_loss": -25.829782485961914, "global_step": 342299, "epoch": 4124} {"train_loss": -25.713117599487305, "global_step": 342300, "epoch": 4124} {"train_loss": -26.073272705078125, "global_step": 342301, "epoch": 4124} {"train_loss": -25.80128288269043, "global_step": 342302, "epoch": 4124} {"train_loss": -26.286283493041992, "global_step": 342303, "epoch": 4124} {"train_loss": -26.029834747314453, "global_step": 342304, "epoch": 4124} {"train_loss": -25.990018844604492, "global_step": 342305, "epoch": 4124} {"train_loss": -26.294296264648438, "global_step": 342306, "epoch": 4124} {"train_loss": -26.07927894592285, "global_step": 342307, "epoch": 4124} {"train_loss": -26.15643310546875, "global_step": 342308, "epoch": 4124} {"train_loss": -26.029775619506836, "global_step": 342309, "epoch": 4124} {"train_loss": -25.916608810424805, "global_step": 342310, "epoch": 4124} {"train_loss": -25.915491104125977, "global_step": 342311, "epoch": 4124} {"train_loss": -25.78143882751465, "global_step": 342312, "epoch": 4124} {"train_loss": -25.965646743774414, "global_step": 342313, "epoch": 4124} {"train_loss": -26.021896362304688, "global_step": 342314, "epoch": 4124} {"train_loss": -26.254133224487305, "global_step": 342315, "epoch": 4124} {"train_loss": -26.180212020874023, "global_step": 342316, "epoch": 4124} {"train_loss": -25.927108764648438, "global_step": 342317, "epoch": 4124} {"train_loss": -26.307538986206055, "global_step": 342318, "epoch": 4124} {"train_loss": -26.232105255126953, "global_step": 342319, "epoch": 4124} {"train_loss": -26.053424835205078, "global_step": 342320, "epoch": 4124} {"train_loss": -26.094247817993164, "global_step": 342321, "epoch": 4124} {"train_loss": -25.94375991821289, "global_step": 342322, "epoch": 4124} {"train_loss": -26.201337814331055, "global_step": 342323, "epoch": 4124} {"train_loss": -25.998046875, "global_step": 342324, "epoch": 4124} {"train_loss": -26.047094345092773, "global_step": 342325, "epoch": 4124} {"train_loss": -25.690881729125977, "global_step": 342326, "epoch": 4124} {"train_loss": -25.9309024810791, "global_step": 342327, "epoch": 4124} {"train_loss": -26.11439323425293, "global_step": 342328, "epoch": 4124} {"train_loss": -26.123462677001953, "global_step": 342329, "epoch": 4124} {"train_loss": -25.620227813720703, "global_step": 342330, "epoch": 4124} {"train_loss": -25.910877227783203, "global_step": 342331, "epoch": 4124} {"train_loss": -26.129837036132812, "global_step": 342332, "epoch": 4124} {"train_loss": -25.969335556030273, "global_step": 342333, "epoch": 4124} {"train_loss": -25.887434005737305, "global_step": 342334, "epoch": 4124} {"train_loss": -26.192245483398438, "global_step": 342335, "epoch": 4124} {"train_loss": -26.030614852905273, "global_step": 342336, "epoch": 4124} {"train_loss": -25.576099395751953, "global_step": 342337, "epoch": 4124} {"train_loss": -26.567502975463867, "global_step": 342338, "epoch": 4124} {"train_loss": -26.03285026550293, "global_step": 342339, "epoch": 4124} {"train_loss": -26.277143478393555, "global_step": 342340, "epoch": 4124} {"train_loss": -25.779470443725586, "global_step": 342341, "epoch": 4124} {"train_loss": -26.211750030517578, "global_step": 342342, "epoch": 4124} {"train_loss": -26.24017333984375, "global_step": 342343, "epoch": 4124} {"train_loss": -25.916976928710938, "global_step": 342344, "epoch": 4124} {"train_loss": -26.1463680267334, "global_step": 342345, "epoch": 4124} {"train_loss": -26.804645538330078, "global_step": 342346, "epoch": 4124} {"train_loss": -26.176416397094727, "global_step": 342347, "epoch": 4124} {"train_loss": -26.425281524658203, "global_step": 342348, "epoch": 4124} {"train_loss": -26.17658805847168, "global_step": 342349, "epoch": 4124} {"train_loss": -26.22822380065918, "global_step": 342350, "epoch": 4124} {"train_loss": -26.292236328125, "global_step": 342351, "epoch": 4124} {"train_loss": -26.26898193359375, "global_step": 342352, "epoch": 4124} {"train_loss": -26.08955955505371, "global_step": 342353, "epoch": 4124} {"train_loss": -26.340436935424805, "global_step": 342354, "epoch": 4124} {"train_loss": -26.3897762298584, "global_step": 342355, "epoch": 4124} {"train_loss": -25.838647842407227, "global_step": 342356, "epoch": 4124} {"train_loss": -26.105365753173828, "global_step": 342357, "epoch": 4124} {"train_loss": -26.096139907836914, "global_step": 342358, "epoch": 4124} {"train_loss": -26.43623161315918, "global_step": 342359, "epoch": 4124} {"train_loss": -26.176298141479492, "global_step": 342360, "epoch": 4124} {"train_loss": -26.25056266784668, "global_step": 342361, "epoch": 4124} {"train_loss": -25.895191192626953, "global_step": 342362, "epoch": 4124} {"train_loss": -26.241872787475586, "global_step": 342363, "epoch": 4124} {"train_loss": -25.854007720947266, "global_step": 342364, "epoch": 4124} {"train_loss": -26.385360717773438, "global_step": 342365, "epoch": 4124} {"train_loss": -26.139755249023438, "global_step": 342366, "epoch": 4124} {"train_loss": -25.795358657836914, "global_step": 342367, "epoch": 4124} {"train_loss": -25.74989128112793, "global_step": 342368, "epoch": 4124} {"train_loss": -26.341903686523438, "global_step": 342369, "epoch": 4124} {"train_loss": -26.318967819213867, "global_step": 342370, "epoch": 4124} {"train_loss": -25.79811668395996, "global_step": 342371, "epoch": 4124} {"train_loss": -25.64313316345215, "global_step": 342372, "epoch": 4124} {"train_loss": -26.025110244750977, "global_step": 342373, "epoch": 4124} {"train_loss": -26.050603958497565, "global_step": 342374, "epoch": 4124, "val_loss": 6565409.0} {"train_loss": -25.51837730407715, "global_step": 342375, "epoch": 4125} {"train_loss": -25.510404586791992, "global_step": 342376, "epoch": 4125} {"train_loss": -25.74526023864746, "global_step": 342377, "epoch": 4125} {"train_loss": -25.532407760620117, "global_step": 342378, "epoch": 4125} {"train_loss": -25.51609230041504, "global_step": 342379, "epoch": 4125} {"train_loss": -25.859394073486328, "global_step": 342380, "epoch": 4125} {"train_loss": -25.487743377685547, "global_step": 342381, "epoch": 4125} {"train_loss": -25.74566078186035, "global_step": 342382, "epoch": 4125} {"train_loss": -25.60740089416504, "global_step": 342383, "epoch": 4125} {"train_loss": -25.855939865112305, "global_step": 342384, "epoch": 4125} {"train_loss": -25.72592544555664, "global_step": 342385, "epoch": 4125} {"train_loss": -25.64590835571289, "global_step": 342386, "epoch": 4125} {"train_loss": -25.850513458251953, "global_step": 342387, "epoch": 4125} {"train_loss": -25.612659454345703, "global_step": 342388, "epoch": 4125} {"train_loss": -26.13922119140625, "global_step": 342389, "epoch": 4125} {"train_loss": -25.64690589904785, "global_step": 342390, "epoch": 4125} {"train_loss": -25.495832443237305, "global_step": 342391, "epoch": 4125} {"train_loss": -25.53509521484375, "global_step": 342392, "epoch": 4125} {"train_loss": -25.892248153686523, "global_step": 342393, "epoch": 4125} {"train_loss": -25.85384178161621, "global_step": 342394, "epoch": 4125} {"train_loss": -25.831159591674805, "global_step": 342395, "epoch": 4125} {"train_loss": -25.914794921875, "global_step": 342396, "epoch": 4125} {"train_loss": -25.65764808654785, "global_step": 342397, "epoch": 4125} {"train_loss": -26.019824981689453, "global_step": 342398, "epoch": 4125} {"train_loss": -25.71113395690918, "global_step": 342399, "epoch": 4125} {"train_loss": -25.567657470703125, "global_step": 342400, "epoch": 4125} {"train_loss": -26.076990127563477, "global_step": 342401, "epoch": 4125} {"train_loss": -25.607410430908203, "global_step": 342402, "epoch": 4125} {"train_loss": -25.810083389282227, "global_step": 342403, "epoch": 4125} {"train_loss": -25.65279197692871, "global_step": 342404, "epoch": 4125} {"train_loss": -25.9626407623291, "global_step": 342405, "epoch": 4125} {"train_loss": -25.83199119567871, "global_step": 342406, "epoch": 4125} {"train_loss": -26.038175582885742, "global_step": 342407, "epoch": 4125} {"train_loss": -26.2567195892334, "global_step": 342408, "epoch": 4125} {"train_loss": -25.995763778686523, "global_step": 342409, "epoch": 4125} {"train_loss": -25.88068962097168, "global_step": 342410, "epoch": 4125} {"train_loss": -25.872404098510742, "global_step": 342411, "epoch": 4125} {"train_loss": -25.880109786987305, "global_step": 342412, "epoch": 4125} {"train_loss": -26.33882713317871, "global_step": 342413, "epoch": 4125} {"train_loss": -26.313812255859375, "global_step": 342414, "epoch": 4125} {"train_loss": -26.10755729675293, "global_step": 342415, "epoch": 4125} {"train_loss": -26.16388511657715, "global_step": 342416, "epoch": 4125} {"train_loss": -26.195234298706055, "global_step": 342417, "epoch": 4125} {"train_loss": -25.7725772857666, "global_step": 342418, "epoch": 4125} {"train_loss": -26.04703140258789, "global_step": 342419, "epoch": 4125} {"train_loss": -26.106733322143555, "global_step": 342420, "epoch": 4125} {"train_loss": -26.154953002929688, "global_step": 342421, "epoch": 4125} {"train_loss": -26.209394454956055, "global_step": 342422, "epoch": 4125} {"train_loss": -25.888885498046875, "global_step": 342423, "epoch": 4125} {"train_loss": -26.104841232299805, "global_step": 342424, "epoch": 4125} {"train_loss": -25.806995391845703, "global_step": 342425, "epoch": 4125} {"train_loss": -26.057605743408203, "global_step": 342426, "epoch": 4125} {"train_loss": -25.816913604736328, "global_step": 342427, "epoch": 4125} {"train_loss": -26.133024215698242, "global_step": 342428, "epoch": 4125} {"train_loss": -26.278512954711914, "global_step": 342429, "epoch": 4125} {"train_loss": -26.229360580444336, "global_step": 342430, "epoch": 4125} {"train_loss": -26.270261764526367, "global_step": 342431, "epoch": 4125} {"train_loss": -26.23969078063965, "global_step": 342432, "epoch": 4125} {"train_loss": -25.931299209594727, "global_step": 342433, "epoch": 4125} {"train_loss": -26.35546875, "global_step": 342434, "epoch": 4125} {"train_loss": -25.86039161682129, "global_step": 342435, "epoch": 4125} {"train_loss": -26.01765251159668, "global_step": 342436, "epoch": 4125} {"train_loss": -26.127710342407227, "global_step": 342437, "epoch": 4125} {"train_loss": -25.882959365844727, "global_step": 342438, "epoch": 4125} {"train_loss": -26.069726943969727, "global_step": 342439, "epoch": 4125} {"train_loss": -25.996667861938477, "global_step": 342440, "epoch": 4125} {"train_loss": -25.95765495300293, "global_step": 342441, "epoch": 4125} {"train_loss": -25.942291259765625, "global_step": 342442, "epoch": 4125} {"train_loss": -26.135883331298828, "global_step": 342443, "epoch": 4125} {"train_loss": -26.145099639892578, "global_step": 342444, "epoch": 4125} {"train_loss": -26.094369888305664, "global_step": 342445, "epoch": 4125} {"train_loss": -26.58951187133789, "global_step": 342446, "epoch": 4125} {"train_loss": -26.715885162353516, "global_step": 342447, "epoch": 4125} {"train_loss": -25.694807052612305, "global_step": 342448, "epoch": 4125} {"train_loss": -26.23615837097168, "global_step": 342449, "epoch": 4125} {"train_loss": -26.403778076171875, "global_step": 342450, "epoch": 4125} {"train_loss": -25.64668083190918, "global_step": 342451, "epoch": 4125} {"train_loss": -25.882177352905273, "global_step": 342452, "epoch": 4125} {"train_loss": -25.734296798706055, "global_step": 342453, "epoch": 4125} {"train_loss": -26.094970703125, "global_step": 342454, "epoch": 4125} {"train_loss": -26.36542320251465, "global_step": 342455, "epoch": 4125} {"train_loss": -26.054601669311523, "global_step": 342456, "epoch": 4125} {"train_loss": -25.953307094344172, "global_step": 342457, "epoch": 4125, "val_loss": 6604502.5} {"train_loss": -25.940526962280273, "global_step": 342458, "epoch": 4126} {"train_loss": -25.655994415283203, "global_step": 342459, "epoch": 4126} {"train_loss": -25.70894432067871, "global_step": 342460, "epoch": 4126} {"train_loss": -26.07343101501465, "global_step": 342461, "epoch": 4126} {"train_loss": -26.379104614257812, "global_step": 342462, "epoch": 4126} {"train_loss": -25.895776748657227, "global_step": 342463, "epoch": 4126} {"train_loss": -25.95713233947754, "global_step": 342464, "epoch": 4126} {"train_loss": -26.40669822692871, "global_step": 342465, "epoch": 4126} {"train_loss": -26.164081573486328, "global_step": 342466, "epoch": 4126} {"train_loss": -25.601476669311523, "global_step": 342467, "epoch": 4126} {"train_loss": -25.912017822265625, "global_step": 342468, "epoch": 4126} {"train_loss": -26.371057510375977, "global_step": 342469, "epoch": 4126} {"train_loss": -25.68393325805664, "global_step": 342470, "epoch": 4126} {"train_loss": -25.76617431640625, "global_step": 342471, "epoch": 4126} {"train_loss": -26.363515853881836, "global_step": 342472, "epoch": 4126} {"train_loss": -26.03158950805664, "global_step": 342473, "epoch": 4126} {"train_loss": -26.27388572692871, "global_step": 342474, "epoch": 4126} {"train_loss": -26.0770320892334, "global_step": 342475, "epoch": 4126} {"train_loss": -26.20839500427246, "global_step": 342476, "epoch": 4126} {"train_loss": -26.378803253173828, "global_step": 342477, "epoch": 4126} {"train_loss": -26.209653854370117, "global_step": 342478, "epoch": 4126} {"train_loss": -25.884916305541992, "global_step": 342479, "epoch": 4126} {"train_loss": -26.07258415222168, "global_step": 342480, "epoch": 4126} {"train_loss": -26.208728790283203, "global_step": 342481, "epoch": 4126} {"train_loss": -26.3773136138916, "global_step": 342482, "epoch": 4126} {"train_loss": -25.664783477783203, "global_step": 342483, "epoch": 4126} {"train_loss": -26.0789794921875, "global_step": 342484, "epoch": 4126} {"train_loss": -26.373157501220703, "global_step": 342485, "epoch": 4126} {"train_loss": -26.214887619018555, "global_step": 342486, "epoch": 4126} {"train_loss": -25.992416381835938, "global_step": 342487, "epoch": 4126} {"train_loss": -25.837665557861328, "global_step": 342488, "epoch": 4126} {"train_loss": -25.961414337158203, "global_step": 342489, "epoch": 4126} {"train_loss": -26.15045166015625, "global_step": 342490, "epoch": 4126} {"train_loss": -26.1237850189209, "global_step": 342491, "epoch": 4126} {"train_loss": -26.278955459594727, "global_step": 342492, "epoch": 4126} {"train_loss": -26.10322380065918, "global_step": 342493, "epoch": 4126} {"train_loss": -26.404632568359375, "global_step": 342494, "epoch": 4126} {"train_loss": -26.1225643157959, "global_step": 342495, "epoch": 4126} {"train_loss": -26.2288818359375, "global_step": 342496, "epoch": 4126} {"train_loss": -26.285018920898438, "global_step": 342497, "epoch": 4126} {"train_loss": -26.498706817626953, "global_step": 342498, "epoch": 4126} {"train_loss": -26.0166072845459, "global_step": 342499, "epoch": 4126} {"train_loss": -26.05712890625, "global_step": 342500, "epoch": 4126} {"train_loss": -26.427906036376953, "global_step": 342501, "epoch": 4126} {"train_loss": -26.254236221313477, "global_step": 342502, "epoch": 4126} {"train_loss": -25.937225341796875, "global_step": 342503, "epoch": 4126} {"train_loss": -25.719268798828125, "global_step": 342504, "epoch": 4126} {"train_loss": -26.126169204711914, "global_step": 342505, "epoch": 4126} {"train_loss": -26.0156307220459, "global_step": 342506, "epoch": 4126} {"train_loss": -26.076736450195312, "global_step": 342507, "epoch": 4126} {"train_loss": -26.048017501831055, "global_step": 342508, "epoch": 4126} {"train_loss": -26.042856216430664, "global_step": 342509, "epoch": 4126} {"train_loss": -25.613677978515625, "global_step": 342510, "epoch": 4126} {"train_loss": -25.991046905517578, "global_step": 342511, "epoch": 4126} {"train_loss": -26.049072265625, "global_step": 342512, "epoch": 4126} {"train_loss": -26.089099884033203, "global_step": 342513, "epoch": 4126} {"train_loss": -26.443464279174805, "global_step": 342514, "epoch": 4126} {"train_loss": -26.432790756225586, "global_step": 342515, "epoch": 4126} {"train_loss": -26.205835342407227, "global_step": 342516, "epoch": 4126} {"train_loss": -26.367679595947266, "global_step": 342517, "epoch": 4126} {"train_loss": -26.20074462890625, "global_step": 342518, "epoch": 4126} {"train_loss": -26.1049747467041, "global_step": 342519, "epoch": 4126} {"train_loss": -26.55427360534668, "global_step": 342520, "epoch": 4126} {"train_loss": -26.11189079284668, "global_step": 342521, "epoch": 4126} {"train_loss": -26.40289878845215, "global_step": 342522, "epoch": 4126} {"train_loss": -26.2447509765625, "global_step": 342523, "epoch": 4126} {"train_loss": -26.181655883789062, "global_step": 342524, "epoch": 4126} {"train_loss": -25.8840274810791, "global_step": 342525, "epoch": 4126} {"train_loss": -25.824771881103516, "global_step": 342526, "epoch": 4126} {"train_loss": -26.11268424987793, "global_step": 342527, "epoch": 4126} {"train_loss": -25.786712646484375, "global_step": 342528, "epoch": 4126} {"train_loss": -26.287199020385742, "global_step": 342529, "epoch": 4126} {"train_loss": -26.470457077026367, "global_step": 342530, "epoch": 4126} {"train_loss": -25.772886276245117, "global_step": 342531, "epoch": 4126} {"train_loss": -26.189722061157227, "global_step": 342532, "epoch": 4126} {"train_loss": -26.042383193969727, "global_step": 342533, "epoch": 4126} {"train_loss": -26.124784469604492, "global_step": 342534, "epoch": 4126} {"train_loss": -26.052371978759766, "global_step": 342535, "epoch": 4126} {"train_loss": -25.910785675048828, "global_step": 342536, "epoch": 4126} {"train_loss": -26.130939483642578, "global_step": 342537, "epoch": 4126} {"train_loss": -26.060041427612305, "global_step": 342538, "epoch": 4126} {"train_loss": -26.501005172729492, "global_step": 342539, "epoch": 4126} {"train_loss": -26.10797594828778, "global_step": 342540, "epoch": 4126, "val_loss": 6639611.0} {"train_loss": -25.431926727294922, "global_step": 342541, "epoch": 4127} {"train_loss": -25.539220809936523, "global_step": 342542, "epoch": 4127} {"train_loss": -25.698444366455078, "global_step": 342543, "epoch": 4127} {"train_loss": -25.752185821533203, "global_step": 342544, "epoch": 4127} {"train_loss": -25.64801025390625, "global_step": 342545, "epoch": 4127} {"train_loss": -25.3016357421875, "global_step": 342546, "epoch": 4127} {"train_loss": -26.013935089111328, "global_step": 342547, "epoch": 4127} {"train_loss": -25.923486709594727, "global_step": 342548, "epoch": 4127} {"train_loss": -25.640689849853516, "global_step": 342549, "epoch": 4127} {"train_loss": -25.83026695251465, "global_step": 342550, "epoch": 4127} {"train_loss": -26.089923858642578, "global_step": 342551, "epoch": 4127} {"train_loss": -26.00440788269043, "global_step": 342552, "epoch": 4127} {"train_loss": -25.673954010009766, "global_step": 342553, "epoch": 4127} {"train_loss": -25.624094009399414, "global_step": 342554, "epoch": 4127} {"train_loss": -26.192724227905273, "global_step": 342555, "epoch": 4127} {"train_loss": -25.665252685546875, "global_step": 342556, "epoch": 4127} {"train_loss": -26.0631046295166, "global_step": 342557, "epoch": 4127} {"train_loss": -26.033615112304688, "global_step": 342558, "epoch": 4127} {"train_loss": -25.934005737304688, "global_step": 342559, "epoch": 4127} {"train_loss": -25.46101188659668, "global_step": 342560, "epoch": 4127} {"train_loss": -26.0172176361084, "global_step": 342561, "epoch": 4127} {"train_loss": -26.02532958984375, "global_step": 342562, "epoch": 4127} {"train_loss": -25.909360885620117, "global_step": 342563, "epoch": 4127} {"train_loss": -25.656503677368164, "global_step": 342564, "epoch": 4127} {"train_loss": -26.09343910217285, "global_step": 342565, "epoch": 4127} {"train_loss": -26.23943519592285, "global_step": 342566, "epoch": 4127} {"train_loss": -26.23493766784668, "global_step": 342567, "epoch": 4127} {"train_loss": -26.069766998291016, "global_step": 342568, "epoch": 4127} {"train_loss": -26.080215454101562, "global_step": 342569, "epoch": 4127} {"train_loss": -26.349172592163086, "global_step": 342570, "epoch": 4127} {"train_loss": -25.813232421875, "global_step": 342571, "epoch": 4127} {"train_loss": -26.0550594329834, "global_step": 342572, "epoch": 4127} {"train_loss": -25.96668815612793, "global_step": 342573, "epoch": 4127} {"train_loss": -26.22898292541504, "global_step": 342574, "epoch": 4127} {"train_loss": -25.96587562561035, "global_step": 342575, "epoch": 4127} {"train_loss": -25.85687828063965, "global_step": 342576, "epoch": 4127} {"train_loss": -25.8652400970459, "global_step": 342577, "epoch": 4127} {"train_loss": -26.0277042388916, "global_step": 342578, "epoch": 4127} {"train_loss": -25.95503044128418, "global_step": 342579, "epoch": 4127} {"train_loss": -26.16803550720215, "global_step": 342580, "epoch": 4127} {"train_loss": -25.776016235351562, "global_step": 342581, "epoch": 4127} {"train_loss": -26.5554141998291, "global_step": 342582, "epoch": 4127} {"train_loss": -26.26167869567871, "global_step": 342583, "epoch": 4127} {"train_loss": -26.02573585510254, "global_step": 342584, "epoch": 4127} {"train_loss": -26.309667587280273, "global_step": 342585, "epoch": 4127} {"train_loss": -25.96064567565918, "global_step": 342586, "epoch": 4127} {"train_loss": -25.9486083984375, "global_step": 342587, "epoch": 4127} {"train_loss": -25.7750244140625, "global_step": 342588, "epoch": 4127} {"train_loss": -25.772586822509766, "global_step": 342589, "epoch": 4127} {"train_loss": -25.979398727416992, "global_step": 342590, "epoch": 4127} {"train_loss": -25.927764892578125, "global_step": 342591, "epoch": 4127} {"train_loss": -25.908681869506836, "global_step": 342592, "epoch": 4127} {"train_loss": -26.09397315979004, "global_step": 342593, "epoch": 4127} {"train_loss": -25.929059982299805, "global_step": 342594, "epoch": 4127} {"train_loss": -26.231287002563477, "global_step": 342595, "epoch": 4127} {"train_loss": -25.664703369140625, "global_step": 342596, "epoch": 4127} {"train_loss": -26.3421630859375, "global_step": 342597, "epoch": 4127} {"train_loss": -26.00390625, "global_step": 342598, "epoch": 4127} {"train_loss": -26.101530075073242, "global_step": 342599, "epoch": 4127} {"train_loss": -25.96952247619629, "global_step": 342600, "epoch": 4127} {"train_loss": -26.096662521362305, "global_step": 342601, "epoch": 4127} {"train_loss": -26.230276107788086, "global_step": 342602, "epoch": 4127} {"train_loss": -26.181814193725586, "global_step": 342603, "epoch": 4127} {"train_loss": -26.21196937561035, "global_step": 342604, "epoch": 4127} {"train_loss": -26.321380615234375, "global_step": 342605, "epoch": 4127} {"train_loss": -26.103778839111328, "global_step": 342606, "epoch": 4127} {"train_loss": -26.138376235961914, "global_step": 342607, "epoch": 4127} {"train_loss": -26.37324333190918, "global_step": 342608, "epoch": 4127} {"train_loss": -25.942670822143555, "global_step": 342609, "epoch": 4127} {"train_loss": -26.151813507080078, "global_step": 342610, "epoch": 4127} {"train_loss": -26.187274932861328, "global_step": 342611, "epoch": 4127} {"train_loss": -26.317182540893555, "global_step": 342612, "epoch": 4127} {"train_loss": -26.04672622680664, "global_step": 342613, "epoch": 4127} {"train_loss": -25.928241729736328, "global_step": 342614, "epoch": 4127} {"train_loss": -26.268146514892578, "global_step": 342615, "epoch": 4127} {"train_loss": -26.321393966674805, "global_step": 342616, "epoch": 4127} {"train_loss": -25.932388305664062, "global_step": 342617, "epoch": 4127} {"train_loss": -26.2022762298584, "global_step": 342618, "epoch": 4127} {"train_loss": -26.35560417175293, "global_step": 342619, "epoch": 4127} {"train_loss": -26.367273330688477, "global_step": 342620, "epoch": 4127} {"train_loss": -26.217798233032227, "global_step": 342621, "epoch": 4127} {"train_loss": -26.33274269104004, "global_step": 342622, "epoch": 4127} {"train_loss": -26.013280477868506, "global_step": 342623, "epoch": 4127, "val_loss": 6610742.0} {"train_loss": -25.871301651000977, "global_step": 342624, "epoch": 4128} {"train_loss": -25.897321701049805, "global_step": 342625, "epoch": 4128} {"train_loss": -25.950393676757812, "global_step": 342626, "epoch": 4128} {"train_loss": -25.511926651000977, "global_step": 342627, "epoch": 4128} {"train_loss": -25.7025203704834, "global_step": 342628, "epoch": 4128} {"train_loss": -25.88263511657715, "global_step": 342629, "epoch": 4128} {"train_loss": -25.606298446655273, "global_step": 342630, "epoch": 4128} {"train_loss": -25.543012619018555, "global_step": 342631, "epoch": 4128} {"train_loss": -25.838117599487305, "global_step": 342632, "epoch": 4128} {"train_loss": -25.878437042236328, "global_step": 342633, "epoch": 4128} {"train_loss": -25.867965698242188, "global_step": 342634, "epoch": 4128} {"train_loss": -25.719696044921875, "global_step": 342635, "epoch": 4128} {"train_loss": -25.910669326782227, "global_step": 342636, "epoch": 4128} {"train_loss": -25.75184440612793, "global_step": 342637, "epoch": 4128} {"train_loss": -26.034244537353516, "global_step": 342638, "epoch": 4128} {"train_loss": -25.92523193359375, "global_step": 342639, "epoch": 4128} {"train_loss": -26.064498901367188, "global_step": 342640, "epoch": 4128} {"train_loss": -26.07659912109375, "global_step": 342641, "epoch": 4128} {"train_loss": -25.97749137878418, "global_step": 342642, "epoch": 4128} {"train_loss": -26.226179122924805, "global_step": 342643, "epoch": 4128} {"train_loss": -26.042713165283203, "global_step": 342644, "epoch": 4128} {"train_loss": -26.00884437561035, "global_step": 342645, "epoch": 4128} {"train_loss": -26.13507652282715, "global_step": 342646, "epoch": 4128} {"train_loss": -26.06368064880371, "global_step": 342647, "epoch": 4128} {"train_loss": -26.09577751159668, "global_step": 342648, "epoch": 4128} {"train_loss": -26.314762115478516, "global_step": 342649, "epoch": 4128} {"train_loss": -26.214139938354492, "global_step": 342650, "epoch": 4128} {"train_loss": -26.448657989501953, "global_step": 342651, "epoch": 4128} {"train_loss": -26.10443115234375, "global_step": 342652, "epoch": 4128} {"train_loss": -26.186216354370117, "global_step": 342653, "epoch": 4128} {"train_loss": -26.103240966796875, "global_step": 342654, "epoch": 4128} {"train_loss": -26.100000381469727, "global_step": 342655, "epoch": 4128} {"train_loss": -25.94708251953125, "global_step": 342656, "epoch": 4128} {"train_loss": -26.099395751953125, "global_step": 342657, "epoch": 4128} {"train_loss": -26.094287872314453, "global_step": 342658, "epoch": 4128} {"train_loss": -26.1718807220459, "global_step": 342659, "epoch": 4128} {"train_loss": -26.245512008666992, "global_step": 342660, "epoch": 4128} {"train_loss": -26.52739906311035, "global_step": 342661, "epoch": 4128} {"train_loss": -26.2240047454834, "global_step": 342662, "epoch": 4128} {"train_loss": -25.74421501159668, "global_step": 342663, "epoch": 4128} {"train_loss": -25.581754684448242, "global_step": 342664, "epoch": 4128} {"train_loss": -25.305814743041992, "global_step": 342665, "epoch": 4128} {"train_loss": -25.551340103149414, "global_step": 342666, "epoch": 4128} {"train_loss": -25.88605308532715, "global_step": 342667, "epoch": 4128} {"train_loss": -26.017017364501953, "global_step": 342668, "epoch": 4128} {"train_loss": -25.83051109313965, "global_step": 342669, "epoch": 4128} {"train_loss": -26.192468643188477, "global_step": 342670, "epoch": 4128} {"train_loss": -26.103168487548828, "global_step": 342671, "epoch": 4128} {"train_loss": -25.678668975830078, "global_step": 342672, "epoch": 4128} {"train_loss": -25.77565574645996, "global_step": 342673, "epoch": 4128} {"train_loss": -25.793354034423828, "global_step": 342674, "epoch": 4128} {"train_loss": -26.10805320739746, "global_step": 342675, "epoch": 4128} {"train_loss": -25.79932975769043, "global_step": 342676, "epoch": 4128} {"train_loss": -26.123401641845703, "global_step": 342677, "epoch": 4128} {"train_loss": -25.773962020874023, "global_step": 342678, "epoch": 4128} {"train_loss": -26.09937858581543, "global_step": 342679, "epoch": 4128} {"train_loss": -26.145490646362305, "global_step": 342680, "epoch": 4128} {"train_loss": -26.067371368408203, "global_step": 342681, "epoch": 4128} {"train_loss": -25.597450256347656, "global_step": 342682, "epoch": 4128} {"train_loss": -25.950021743774414, "global_step": 342683, "epoch": 4128} {"train_loss": -26.254779815673828, "global_step": 342684, "epoch": 4128} {"train_loss": -26.079742431640625, "global_step": 342685, "epoch": 4128} {"train_loss": -25.784208297729492, "global_step": 342686, "epoch": 4128} {"train_loss": -25.97273063659668, "global_step": 342687, "epoch": 4128} {"train_loss": -26.143863677978516, "global_step": 342688, "epoch": 4128} {"train_loss": -25.89803123474121, "global_step": 342689, "epoch": 4128} {"train_loss": -25.554180145263672, "global_step": 342690, "epoch": 4128} {"train_loss": -26.117294311523438, "global_step": 342691, "epoch": 4128} {"train_loss": -26.24427604675293, "global_step": 342692, "epoch": 4128} {"train_loss": -25.992528915405273, "global_step": 342693, "epoch": 4128} {"train_loss": -26.16729736328125, "global_step": 342694, "epoch": 4128} {"train_loss": -26.197187423706055, "global_step": 342695, "epoch": 4128} {"train_loss": -26.2371768951416, "global_step": 342696, "epoch": 4128} {"train_loss": -26.0698184967041, "global_step": 342697, "epoch": 4128} {"train_loss": -26.07636833190918, "global_step": 342698, "epoch": 4128} {"train_loss": -26.700719833374023, "global_step": 342699, "epoch": 4128} {"train_loss": -26.357770919799805, "global_step": 342700, "epoch": 4128} {"train_loss": -26.067005157470703, "global_step": 342701, "epoch": 4128} {"train_loss": -26.108123779296875, "global_step": 342702, "epoch": 4128} {"train_loss": -26.61089515686035, "global_step": 342703, "epoch": 4128} {"train_loss": -26.359699249267578, "global_step": 342704, "epoch": 4128} {"train_loss": -26.145984649658203, "global_step": 342705, "epoch": 4128} {"train_loss": -26.023313637239387, "global_step": 342706, "epoch": 4128, "val_loss": 6635679.0} {"train_loss": -25.23868751525879, "global_step": 342707, "epoch": 4129} {"train_loss": -24.824792861938477, "global_step": 342708, "epoch": 4129} {"train_loss": -25.24703025817871, "global_step": 342709, "epoch": 4129} {"train_loss": -25.885669708251953, "global_step": 342710, "epoch": 4129} {"train_loss": -25.568323135375977, "global_step": 342711, "epoch": 4129} {"train_loss": -25.63704490661621, "global_step": 342712, "epoch": 4129} {"train_loss": -25.81792640686035, "global_step": 342713, "epoch": 4129} {"train_loss": -25.531518936157227, "global_step": 342714, "epoch": 4129} {"train_loss": -25.96649742126465, "global_step": 342715, "epoch": 4129} {"train_loss": -25.772802352905273, "global_step": 342716, "epoch": 4129} {"train_loss": -26.0648136138916, "global_step": 342717, "epoch": 4129} {"train_loss": -25.61665153503418, "global_step": 342718, "epoch": 4129} {"train_loss": -25.565244674682617, "global_step": 342719, "epoch": 4129} {"train_loss": -25.9108829498291, "global_step": 342720, "epoch": 4129} {"train_loss": -25.99802017211914, "global_step": 342721, "epoch": 4129} {"train_loss": -25.820755004882812, "global_step": 342722, "epoch": 4129} {"train_loss": -25.604297637939453, "global_step": 342723, "epoch": 4129} {"train_loss": -25.90644645690918, "global_step": 342724, "epoch": 4129} {"train_loss": -25.7733097076416, "global_step": 342725, "epoch": 4129} {"train_loss": -26.14182472229004, "global_step": 342726, "epoch": 4129} {"train_loss": -26.13289451599121, "global_step": 342727, "epoch": 4129} {"train_loss": -26.082258224487305, "global_step": 342728, "epoch": 4129} {"train_loss": -25.845361709594727, "global_step": 342729, "epoch": 4129} {"train_loss": -26.125446319580078, "global_step": 342730, "epoch": 4129} {"train_loss": -26.1312255859375, "global_step": 342731, "epoch": 4129} {"train_loss": -25.789417266845703, "global_step": 342732, "epoch": 4129} {"train_loss": -26.050067901611328, "global_step": 342733, "epoch": 4129} {"train_loss": -25.9177303314209, "global_step": 342734, "epoch": 4129} {"train_loss": -26.316770553588867, "global_step": 342735, "epoch": 4129} {"train_loss": -26.071874618530273, "global_step": 342736, "epoch": 4129} {"train_loss": -25.964221954345703, "global_step": 342737, "epoch": 4129} {"train_loss": -25.862445831298828, "global_step": 342738, "epoch": 4129} {"train_loss": -26.282825469970703, "global_step": 342739, "epoch": 4129} {"train_loss": -26.275863647460938, "global_step": 342740, "epoch": 4129} {"train_loss": -25.78561782836914, "global_step": 342741, "epoch": 4129} {"train_loss": -26.508596420288086, "global_step": 342742, "epoch": 4129} {"train_loss": -26.38666343688965, "global_step": 342743, "epoch": 4129} {"train_loss": -25.86246109008789, "global_step": 342744, "epoch": 4129} {"train_loss": -25.894033432006836, "global_step": 342745, "epoch": 4129} {"train_loss": -26.32399559020996, "global_step": 342746, "epoch": 4129} {"train_loss": -26.111860275268555, "global_step": 342747, "epoch": 4129} {"train_loss": -26.150196075439453, "global_step": 342748, "epoch": 4129} {"train_loss": -26.19120216369629, "global_step": 342749, "epoch": 4129} {"train_loss": -26.039514541625977, "global_step": 342750, "epoch": 4129} {"train_loss": -25.89826774597168, "global_step": 342751, "epoch": 4129} {"train_loss": -26.434951782226562, "global_step": 342752, "epoch": 4129} {"train_loss": -26.091955184936523, "global_step": 342753, "epoch": 4129} {"train_loss": -26.194171905517578, "global_step": 342754, "epoch": 4129} {"train_loss": -26.26112174987793, "global_step": 342755, "epoch": 4129} {"train_loss": -26.098169326782227, "global_step": 342756, "epoch": 4129} {"train_loss": -26.35647964477539, "global_step": 342757, "epoch": 4129} {"train_loss": -26.316022872924805, "global_step": 342758, "epoch": 4129} {"train_loss": -26.064407348632812, "global_step": 342759, "epoch": 4129} {"train_loss": -26.192373275756836, "global_step": 342760, "epoch": 4129} {"train_loss": -26.27225685119629, "global_step": 342761, "epoch": 4129} {"train_loss": -26.170013427734375, "global_step": 342762, "epoch": 4129} {"train_loss": -25.956205368041992, "global_step": 342763, "epoch": 4129} {"train_loss": -26.097837448120117, "global_step": 342764, "epoch": 4129} {"train_loss": -26.0076847076416, "global_step": 342765, "epoch": 4129} {"train_loss": -26.42213249206543, "global_step": 342766, "epoch": 4129} {"train_loss": -26.118101119995117, "global_step": 342767, "epoch": 4129} {"train_loss": -26.38931655883789, "global_step": 342768, "epoch": 4129} {"train_loss": -26.33796501159668, "global_step": 342769, "epoch": 4129} {"train_loss": -26.010786056518555, "global_step": 342770, "epoch": 4129} {"train_loss": -26.2624454498291, "global_step": 342771, "epoch": 4129} {"train_loss": -25.985553741455078, "global_step": 342772, "epoch": 4129} {"train_loss": -26.520505905151367, "global_step": 342773, "epoch": 4129} {"train_loss": -26.37542152404785, "global_step": 342774, "epoch": 4129} {"train_loss": -26.511682510375977, "global_step": 342775, "epoch": 4129} {"train_loss": -25.959882736206055, "global_step": 342776, "epoch": 4129} {"train_loss": -26.38979148864746, "global_step": 342777, "epoch": 4129} {"train_loss": -26.58204460144043, "global_step": 342778, "epoch": 4129} {"train_loss": -25.847187042236328, "global_step": 342779, "epoch": 4129} {"train_loss": -26.154699325561523, "global_step": 342780, "epoch": 4129} {"train_loss": -26.342670440673828, "global_step": 342781, "epoch": 4129} {"train_loss": -25.8708553314209, "global_step": 342782, "epoch": 4129} {"train_loss": -26.096729278564453, "global_step": 342783, "epoch": 4129} {"train_loss": -26.01776123046875, "global_step": 342784, "epoch": 4129} {"train_loss": -26.191736221313477, "global_step": 342785, "epoch": 4129} {"train_loss": -26.410940170288086, "global_step": 342786, "epoch": 4129} {"train_loss": -26.012205123901367, "global_step": 342787, "epoch": 4129} {"train_loss": -26.194143295288086, "global_step": 342788, "epoch": 4129} {"train_loss": -26.0512156658862, "global_step": 342789, "epoch": 4129, "val_loss": 6695252.0} {"train_loss": -25.501394271850586, "global_step": 342790, "epoch": 4130} {"train_loss": -24.65618324279785, "global_step": 342791, "epoch": 4130} {"train_loss": -25.553821563720703, "global_step": 342792, "epoch": 4130} {"train_loss": -26.078062057495117, "global_step": 342793, "epoch": 4130} {"train_loss": -25.53519058227539, "global_step": 342794, "epoch": 4130} {"train_loss": -25.161762237548828, "global_step": 342795, "epoch": 4130} {"train_loss": -25.97136878967285, "global_step": 342796, "epoch": 4130} {"train_loss": -25.531723022460938, "global_step": 342797, "epoch": 4130} {"train_loss": -25.473073959350586, "global_step": 342798, "epoch": 4130} {"train_loss": -25.78369140625, "global_step": 342799, "epoch": 4130} {"train_loss": -26.067459106445312, "global_step": 342800, "epoch": 4130} {"train_loss": -25.839731216430664, "global_step": 342801, "epoch": 4130} {"train_loss": -26.057294845581055, "global_step": 342802, "epoch": 4130} {"train_loss": -25.376117706298828, "global_step": 342803, "epoch": 4130} {"train_loss": -25.932697296142578, "global_step": 342804, "epoch": 4130} {"train_loss": -25.790517807006836, "global_step": 342805, "epoch": 4130} {"train_loss": -26.030536651611328, "global_step": 342806, "epoch": 4130} {"train_loss": -25.724592208862305, "global_step": 342807, "epoch": 4130} {"train_loss": -26.044042587280273, "global_step": 342808, "epoch": 4130} {"train_loss": -26.00687026977539, "global_step": 342809, "epoch": 4130} {"train_loss": -25.7559814453125, "global_step": 342810, "epoch": 4130} {"train_loss": -26.2470645904541, "global_step": 342811, "epoch": 4130} {"train_loss": -25.707677841186523, "global_step": 342812, "epoch": 4130} {"train_loss": -26.099369049072266, "global_step": 342813, "epoch": 4130} {"train_loss": -25.959558486938477, "global_step": 342814, "epoch": 4130} {"train_loss": -26.03339958190918, "global_step": 342815, "epoch": 4130} {"train_loss": -25.732563018798828, "global_step": 342816, "epoch": 4130} {"train_loss": -26.03948974609375, "global_step": 342817, "epoch": 4130} {"train_loss": -26.196399688720703, "global_step": 342818, "epoch": 4130} {"train_loss": -25.92095947265625, "global_step": 342819, "epoch": 4130} {"train_loss": -26.193689346313477, "global_step": 342820, "epoch": 4130} {"train_loss": -26.0056209564209, "global_step": 342821, "epoch": 4130} {"train_loss": -25.943145751953125, "global_step": 342822, "epoch": 4130} {"train_loss": -26.446487426757812, "global_step": 342823, "epoch": 4130} {"train_loss": -26.289581298828125, "global_step": 342824, "epoch": 4130} {"train_loss": -26.18873405456543, "global_step": 342825, "epoch": 4130} {"train_loss": -26.342634201049805, "global_step": 342826, "epoch": 4130} {"train_loss": -26.108173370361328, "global_step": 342827, "epoch": 4130} {"train_loss": -26.276357650756836, "global_step": 342828, "epoch": 4130} {"train_loss": -26.17938804626465, "global_step": 342829, "epoch": 4130} {"train_loss": -26.32985496520996, "global_step": 342830, "epoch": 4130} {"train_loss": -26.259811401367188, "global_step": 342831, "epoch": 4130} {"train_loss": -26.07826042175293, "global_step": 342832, "epoch": 4130} {"train_loss": -26.13909912109375, "global_step": 342833, "epoch": 4130} {"train_loss": -26.077072143554688, "global_step": 342834, "epoch": 4130} {"train_loss": -26.266271591186523, "global_step": 342835, "epoch": 4130} {"train_loss": -26.399978637695312, "global_step": 342836, "epoch": 4130} {"train_loss": -26.49683952331543, "global_step": 342837, "epoch": 4130} {"train_loss": -25.91934585571289, "global_step": 342838, "epoch": 4130} {"train_loss": -26.10284423828125, "global_step": 342839, "epoch": 4130} {"train_loss": -25.989316940307617, "global_step": 342840, "epoch": 4130} {"train_loss": -25.806415557861328, "global_step": 342841, "epoch": 4130} {"train_loss": -25.597007751464844, "global_step": 342842, "epoch": 4130} {"train_loss": -25.986249923706055, "global_step": 342843, "epoch": 4130} {"train_loss": -26.02898597717285, "global_step": 342844, "epoch": 4130} {"train_loss": -25.657489776611328, "global_step": 342845, "epoch": 4130} {"train_loss": -26.11707878112793, "global_step": 342846, "epoch": 4130} {"train_loss": -26.327329635620117, "global_step": 342847, "epoch": 4130} {"train_loss": -26.56058120727539, "global_step": 342848, "epoch": 4130} {"train_loss": -26.11872673034668, "global_step": 342849, "epoch": 4130} {"train_loss": -26.07295036315918, "global_step": 342850, "epoch": 4130} {"train_loss": -26.339221954345703, "global_step": 342851, "epoch": 4130} {"train_loss": -25.658933639526367, "global_step": 342852, "epoch": 4130} {"train_loss": -26.113632202148438, "global_step": 342853, "epoch": 4130} {"train_loss": -26.468841552734375, "global_step": 342854, "epoch": 4130} {"train_loss": -26.031482696533203, "global_step": 342855, "epoch": 4130} {"train_loss": -26.217432022094727, "global_step": 342856, "epoch": 4130} {"train_loss": -25.685216903686523, "global_step": 342857, "epoch": 4130} {"train_loss": -26.25819969177246, "global_step": 342858, "epoch": 4130} {"train_loss": -25.76972770690918, "global_step": 342859, "epoch": 4130} {"train_loss": -25.909576416015625, "global_step": 342860, "epoch": 4130} {"train_loss": -25.860004425048828, "global_step": 342861, "epoch": 4130} {"train_loss": -26.37200927734375, "global_step": 342862, "epoch": 4130} {"train_loss": -25.831342697143555, "global_step": 342863, "epoch": 4130} {"train_loss": -25.974990844726562, "global_step": 342864, "epoch": 4130} {"train_loss": -26.036657333374023, "global_step": 342865, "epoch": 4130} {"train_loss": -25.868139266967773, "global_step": 342866, "epoch": 4130} {"train_loss": -26.353839874267578, "global_step": 342867, "epoch": 4130} {"train_loss": -25.90415382385254, "global_step": 342868, "epoch": 4130} {"train_loss": -25.374380111694336, "global_step": 342869, "epoch": 4130} {"train_loss": -26.2995662689209, "global_step": 342870, "epoch": 4130} {"train_loss": -25.66547966003418, "global_step": 342871, "epoch": 4130} {"train_loss": -25.96549714329731, "global_step": 342872, "epoch": 4130, "val_loss": 6510694.5} {"train_loss": -25.855854034423828, "global_step": 342873, "epoch": 4131} {"train_loss": -25.633743286132812, "global_step": 342874, "epoch": 4131} {"train_loss": -25.872385025024414, "global_step": 342875, "epoch": 4131} {"train_loss": -25.886194229125977, "global_step": 342876, "epoch": 4131} {"train_loss": -25.927167892456055, "global_step": 342877, "epoch": 4131} {"train_loss": -25.916364669799805, "global_step": 342878, "epoch": 4131} {"train_loss": -25.937585830688477, "global_step": 342879, "epoch": 4131} {"train_loss": -26.121841430664062, "global_step": 342880, "epoch": 4131} {"train_loss": -25.8976993560791, "global_step": 342881, "epoch": 4131} {"train_loss": -26.165985107421875, "global_step": 342882, "epoch": 4131} {"train_loss": -25.516233444213867, "global_step": 342883, "epoch": 4131} {"train_loss": -25.844867706298828, "global_step": 342884, "epoch": 4131} {"train_loss": -25.96013832092285, "global_step": 342885, "epoch": 4131} {"train_loss": -26.029937744140625, "global_step": 342886, "epoch": 4131} {"train_loss": -25.839019775390625, "global_step": 342887, "epoch": 4131} {"train_loss": -26.094640731811523, "global_step": 342888, "epoch": 4131} {"train_loss": -25.81854820251465, "global_step": 342889, "epoch": 4131} {"train_loss": -25.994415283203125, "global_step": 342890, "epoch": 4131} {"train_loss": -26.20576286315918, "global_step": 342891, "epoch": 4131} {"train_loss": -26.2242488861084, "global_step": 342892, "epoch": 4131} {"train_loss": -25.667449951171875, "global_step": 342893, "epoch": 4131} {"train_loss": -26.161123275756836, "global_step": 342894, "epoch": 4131} {"train_loss": -26.26474380493164, "global_step": 342895, "epoch": 4131} {"train_loss": -25.718427658081055, "global_step": 342896, "epoch": 4131} {"train_loss": -26.098392486572266, "global_step": 342897, "epoch": 4131} {"train_loss": -25.882909774780273, "global_step": 342898, "epoch": 4131} {"train_loss": -26.413196563720703, "global_step": 342899, "epoch": 4131} {"train_loss": -26.228839874267578, "global_step": 342900, "epoch": 4131} {"train_loss": -26.050827026367188, "global_step": 342901, "epoch": 4131} {"train_loss": -26.361982345581055, "global_step": 342902, "epoch": 4131} {"train_loss": -26.1643123626709, "global_step": 342903, "epoch": 4131} {"train_loss": -26.14215660095215, "global_step": 342904, "epoch": 4131} {"train_loss": -26.35127067565918, "global_step": 342905, "epoch": 4131} {"train_loss": -25.84210777282715, "global_step": 342906, "epoch": 4131} {"train_loss": -25.962738037109375, "global_step": 342907, "epoch": 4131} {"train_loss": -26.24835205078125, "global_step": 342908, "epoch": 4131} {"train_loss": -26.169601440429688, "global_step": 342909, "epoch": 4131} {"train_loss": -26.314619064331055, "global_step": 342910, "epoch": 4131} {"train_loss": -26.507593154907227, "global_step": 342911, "epoch": 4131} {"train_loss": -26.328149795532227, "global_step": 342912, "epoch": 4131} {"train_loss": -26.128662109375, "global_step": 342913, "epoch": 4131} {"train_loss": -26.371686935424805, "global_step": 342914, "epoch": 4131} {"train_loss": -26.118688583374023, "global_step": 342915, "epoch": 4131} {"train_loss": -26.425155639648438, "global_step": 342916, "epoch": 4131} {"train_loss": -26.049793243408203, "global_step": 342917, "epoch": 4131} {"train_loss": -26.336292266845703, "global_step": 342918, "epoch": 4131} {"train_loss": -25.9783992767334, "global_step": 342919, "epoch": 4131} {"train_loss": -26.0815372467041, "global_step": 342920, "epoch": 4131} {"train_loss": -25.65345573425293, "global_step": 342921, "epoch": 4131} {"train_loss": -25.922971725463867, "global_step": 342922, "epoch": 4131} {"train_loss": -25.91153907775879, "global_step": 342923, "epoch": 4131} {"train_loss": -26.371353149414062, "global_step": 342924, "epoch": 4131} {"train_loss": -26.260534286499023, "global_step": 342925, "epoch": 4131} {"train_loss": -26.18889808654785, "global_step": 342926, "epoch": 4131} {"train_loss": -26.24972915649414, "global_step": 342927, "epoch": 4131} {"train_loss": -25.73874855041504, "global_step": 342928, "epoch": 4131} {"train_loss": -26.068775177001953, "global_step": 342929, "epoch": 4131} {"train_loss": -26.057836532592773, "global_step": 342930, "epoch": 4131} {"train_loss": -26.068387985229492, "global_step": 342931, "epoch": 4131} {"train_loss": -26.412500381469727, "global_step": 342932, "epoch": 4131} {"train_loss": -26.120086669921875, "global_step": 342933, "epoch": 4131} {"train_loss": -25.9816837310791, "global_step": 342934, "epoch": 4131} {"train_loss": -25.817102432250977, "global_step": 342935, "epoch": 4131} {"train_loss": -26.235260009765625, "global_step": 342936, "epoch": 4131} {"train_loss": -26.15394401550293, "global_step": 342937, "epoch": 4131} {"train_loss": -26.027542114257812, "global_step": 342938, "epoch": 4131} {"train_loss": -25.9642333984375, "global_step": 342939, "epoch": 4131} {"train_loss": -25.986234664916992, "global_step": 342940, "epoch": 4131} {"train_loss": -25.9397029876709, "global_step": 342941, "epoch": 4131} {"train_loss": -25.857309341430664, "global_step": 342942, "epoch": 4131} {"train_loss": -26.25998878479004, "global_step": 342943, "epoch": 4131} {"train_loss": -26.393102645874023, "global_step": 342944, "epoch": 4131} {"train_loss": -26.283432006835938, "global_step": 342945, "epoch": 4131} {"train_loss": -26.112640380859375, "global_step": 342946, "epoch": 4131} {"train_loss": -26.37152671813965, "global_step": 342947, "epoch": 4131} {"train_loss": -26.23835563659668, "global_step": 342948, "epoch": 4131} {"train_loss": -26.1411075592041, "global_step": 342949, "epoch": 4131} {"train_loss": -25.866849899291992, "global_step": 342950, "epoch": 4131} {"train_loss": -26.363937377929688, "global_step": 342951, "epoch": 4131} {"train_loss": -26.156641006469727, "global_step": 342952, "epoch": 4131} {"train_loss": -26.395294189453125, "global_step": 342953, "epoch": 4131} {"train_loss": -26.26780128479004, "global_step": 342954, "epoch": 4131} {"train_loss": -26.10105967234416, "global_step": 342955, "epoch": 4131, "val_loss": 6568343.0} {"train_loss": -25.422008514404297, "global_step": 342956, "epoch": 4132} {"train_loss": -26.0262393951416, "global_step": 342957, "epoch": 4132} {"train_loss": -25.78664207458496, "global_step": 342958, "epoch": 4132} {"train_loss": -25.578336715698242, "global_step": 342959, "epoch": 4132} {"train_loss": -25.600568771362305, "global_step": 342960, "epoch": 4132} {"train_loss": -24.727231979370117, "global_step": 342961, "epoch": 4132} {"train_loss": -25.91351890563965, "global_step": 342962, "epoch": 4132} {"train_loss": -25.84758949279785, "global_step": 342963, "epoch": 4132} {"train_loss": -25.380605697631836, "global_step": 342964, "epoch": 4132} {"train_loss": -25.61407470703125, "global_step": 342965, "epoch": 4132} {"train_loss": -25.944198608398438, "global_step": 342966, "epoch": 4132} {"train_loss": -25.741886138916016, "global_step": 342967, "epoch": 4132} {"train_loss": -26.025959014892578, "global_step": 342968, "epoch": 4132} {"train_loss": -25.902698516845703, "global_step": 342969, "epoch": 4132} {"train_loss": -26.012731552124023, "global_step": 342970, "epoch": 4132} {"train_loss": -25.92258071899414, "global_step": 342971, "epoch": 4132} {"train_loss": -25.99468994140625, "global_step": 342972, "epoch": 4132} {"train_loss": -25.789295196533203, "global_step": 342973, "epoch": 4132} {"train_loss": -26.208234786987305, "global_step": 342974, "epoch": 4132} {"train_loss": -25.6802978515625, "global_step": 342975, "epoch": 4132} {"train_loss": -25.6909236907959, "global_step": 342976, "epoch": 4132} {"train_loss": -25.802692413330078, "global_step": 342977, "epoch": 4132} {"train_loss": -25.483335494995117, "global_step": 342978, "epoch": 4132} {"train_loss": -25.894433975219727, "global_step": 342979, "epoch": 4132} {"train_loss": -25.866474151611328, "global_step": 342980, "epoch": 4132} {"train_loss": -26.335193634033203, "global_step": 342981, "epoch": 4132} {"train_loss": -25.82914161682129, "global_step": 342982, "epoch": 4132} {"train_loss": -25.729028701782227, "global_step": 342983, "epoch": 4132} {"train_loss": -26.082910537719727, "global_step": 342984, "epoch": 4132} {"train_loss": -25.943571090698242, "global_step": 342985, "epoch": 4132} {"train_loss": -26.153379440307617, "global_step": 342986, "epoch": 4132} {"train_loss": -26.038421630859375, "global_step": 342987, "epoch": 4132} {"train_loss": -25.931156158447266, "global_step": 342988, "epoch": 4132} {"train_loss": -26.105213165283203, "global_step": 342989, "epoch": 4132} {"train_loss": -25.7828369140625, "global_step": 342990, "epoch": 4132} {"train_loss": -25.9260311126709, "global_step": 342991, "epoch": 4132} {"train_loss": -26.312164306640625, "global_step": 342992, "epoch": 4132} {"train_loss": -25.887786865234375, "global_step": 342993, "epoch": 4132} {"train_loss": -26.08865737915039, "global_step": 342994, "epoch": 4132} {"train_loss": -26.12586784362793, "global_step": 342995, "epoch": 4132} {"train_loss": -25.901071548461914, "global_step": 342996, "epoch": 4132} {"train_loss": -25.94219398498535, "global_step": 342997, "epoch": 4132} {"train_loss": -26.35968589782715, "global_step": 342998, "epoch": 4132} {"train_loss": -26.38631248474121, "global_step": 342999, "epoch": 4132} {"train_loss": -26.13563346862793, "global_step": 343000, "epoch": 4132} {"train_loss": -26.035207748413086, "global_step": 343001, "epoch": 4132} {"train_loss": -26.146360397338867, "global_step": 343002, "epoch": 4132} {"train_loss": -26.335424423217773, "global_step": 343003, "epoch": 4132} {"train_loss": -25.9381160736084, "global_step": 343004, "epoch": 4132} {"train_loss": -26.39409828186035, "global_step": 343005, "epoch": 4132} {"train_loss": -26.135900497436523, "global_step": 343006, "epoch": 4132} {"train_loss": -26.092756271362305, "global_step": 343007, "epoch": 4132} {"train_loss": -26.432300567626953, "global_step": 343008, "epoch": 4132} {"train_loss": -26.057592391967773, "global_step": 343009, "epoch": 4132} {"train_loss": -26.497709274291992, "global_step": 343010, "epoch": 4132} {"train_loss": -26.400129318237305, "global_step": 343011, "epoch": 4132} {"train_loss": -26.300439834594727, "global_step": 343012, "epoch": 4132} {"train_loss": -25.840595245361328, "global_step": 343013, "epoch": 4132} {"train_loss": -26.18104362487793, "global_step": 343014, "epoch": 4132} {"train_loss": -25.979352951049805, "global_step": 343015, "epoch": 4132} {"train_loss": -26.201635360717773, "global_step": 343016, "epoch": 4132} {"train_loss": -26.323410034179688, "global_step": 343017, "epoch": 4132} {"train_loss": -26.402612686157227, "global_step": 343018, "epoch": 4132} {"train_loss": -26.164718627929688, "global_step": 343019, "epoch": 4132} {"train_loss": -26.391263961791992, "global_step": 343020, "epoch": 4132} {"train_loss": -26.236831665039062, "global_step": 343021, "epoch": 4132} {"train_loss": -25.74257469177246, "global_step": 343022, "epoch": 4132} {"train_loss": -26.28423500061035, "global_step": 343023, "epoch": 4132} {"train_loss": -26.00058937072754, "global_step": 343024, "epoch": 4132} {"train_loss": -25.959030151367188, "global_step": 343025, "epoch": 4132} {"train_loss": -26.05476188659668, "global_step": 343026, "epoch": 4132} {"train_loss": -25.65064811706543, "global_step": 343027, "epoch": 4132} {"train_loss": -25.526966094970703, "global_step": 343028, "epoch": 4132} {"train_loss": -25.63929557800293, "global_step": 343029, "epoch": 4132} {"train_loss": -25.365970611572266, "global_step": 343030, "epoch": 4132} {"train_loss": -26.274459838867188, "global_step": 343031, "epoch": 4132} {"train_loss": -26.185779571533203, "global_step": 343032, "epoch": 4132} {"train_loss": -26.066370010375977, "global_step": 343033, "epoch": 4132} {"train_loss": -25.764007568359375, "global_step": 343034, "epoch": 4132} {"train_loss": -25.631383895874023, "global_step": 343035, "epoch": 4132} {"train_loss": -25.85108757019043, "global_step": 343036, "epoch": 4132} {"train_loss": -25.97675132751465, "global_step": 343037, "epoch": 4132} {"train_loss": -25.9573751012963, "global_step": 343038, "epoch": 4132, "val_loss": 6607088.0} {"train_loss": -24.60999870300293, "global_step": 343039, "epoch": 4133} {"train_loss": -25.62796974182129, "global_step": 343040, "epoch": 4133} {"train_loss": -24.557668685913086, "global_step": 343041, "epoch": 4133} {"train_loss": -25.07618522644043, "global_step": 343042, "epoch": 4133} {"train_loss": -24.879148483276367, "global_step": 343043, "epoch": 4133} {"train_loss": -25.24370002746582, "global_step": 343044, "epoch": 4133} {"train_loss": -25.22542953491211, "global_step": 343045, "epoch": 4133} {"train_loss": -25.25157928466797, "global_step": 343046, "epoch": 4133} {"train_loss": -25.49184799194336, "global_step": 343047, "epoch": 4133} {"train_loss": -25.55487823486328, "global_step": 343048, "epoch": 4133} {"train_loss": -25.14923667907715, "global_step": 343049, "epoch": 4133} {"train_loss": -25.6931209564209, "global_step": 343050, "epoch": 4133} {"train_loss": -25.259445190429688, "global_step": 343051, "epoch": 4133} {"train_loss": -25.19032096862793, "global_step": 343052, "epoch": 4133} {"train_loss": -25.756078720092773, "global_step": 343053, "epoch": 4133} {"train_loss": -25.8414249420166, "global_step": 343054, "epoch": 4133} {"train_loss": -25.70757484436035, "global_step": 343055, "epoch": 4133} {"train_loss": -25.58609390258789, "global_step": 343056, "epoch": 4133} {"train_loss": -25.718372344970703, "global_step": 343057, "epoch": 4133} {"train_loss": -25.877328872680664, "global_step": 343058, "epoch": 4133} {"train_loss": -25.853641510009766, "global_step": 343059, "epoch": 4133} {"train_loss": -25.484846115112305, "global_step": 343060, "epoch": 4133} {"train_loss": -25.99344253540039, "global_step": 343061, "epoch": 4133} {"train_loss": -25.92118263244629, "global_step": 343062, "epoch": 4133} {"train_loss": -25.652637481689453, "global_step": 343063, "epoch": 4133} {"train_loss": -25.7529296875, "global_step": 343064, "epoch": 4133} {"train_loss": -26.114887237548828, "global_step": 343065, "epoch": 4133} {"train_loss": -25.518844604492188, "global_step": 343066, "epoch": 4133} {"train_loss": -25.51414680480957, "global_step": 343067, "epoch": 4133} {"train_loss": -26.139867782592773, "global_step": 343068, "epoch": 4133} {"train_loss": -26.038000106811523, "global_step": 343069, "epoch": 4133} {"train_loss": -26.158740997314453, "global_step": 343070, "epoch": 4133} {"train_loss": -25.947509765625, "global_step": 343071, "epoch": 4133} {"train_loss": -26.1534366607666, "global_step": 343072, "epoch": 4133} {"train_loss": -25.998779296875, "global_step": 343073, "epoch": 4133} {"train_loss": -26.088605880737305, "global_step": 343074, "epoch": 4133} {"train_loss": -26.386066436767578, "global_step": 343075, "epoch": 4133} {"train_loss": -26.029279708862305, "global_step": 343076, "epoch": 4133} {"train_loss": -26.281890869140625, "global_step": 343077, "epoch": 4133} {"train_loss": -25.873382568359375, "global_step": 343078, "epoch": 4133} {"train_loss": -26.13942527770996, "global_step": 343079, "epoch": 4133} {"train_loss": -26.220489501953125, "global_step": 343080, "epoch": 4133} {"train_loss": -26.085058212280273, "global_step": 343081, "epoch": 4133} {"train_loss": -26.251386642456055, "global_step": 343082, "epoch": 4133} {"train_loss": -26.122028350830078, "global_step": 343083, "epoch": 4133} {"train_loss": -26.15165138244629, "global_step": 343084, "epoch": 4133} {"train_loss": -26.14617919921875, "global_step": 343085, "epoch": 4133} {"train_loss": -25.966413497924805, "global_step": 343086, "epoch": 4133} {"train_loss": -26.478195190429688, "global_step": 343087, "epoch": 4133} {"train_loss": -25.964941024780273, "global_step": 343088, "epoch": 4133} {"train_loss": -25.56348991394043, "global_step": 343089, "epoch": 4133} {"train_loss": -26.428787231445312, "global_step": 343090, "epoch": 4133} {"train_loss": -26.28839111328125, "global_step": 343091, "epoch": 4133} {"train_loss": -26.045673370361328, "global_step": 343092, "epoch": 4133} {"train_loss": -25.98335075378418, "global_step": 343093, "epoch": 4133} {"train_loss": -25.8289737701416, "global_step": 343094, "epoch": 4133} {"train_loss": -26.067468643188477, "global_step": 343095, "epoch": 4133} {"train_loss": -26.144189834594727, "global_step": 343096, "epoch": 4133} {"train_loss": -26.4488468170166, "global_step": 343097, "epoch": 4133} {"train_loss": -26.389755249023438, "global_step": 343098, "epoch": 4133} {"train_loss": -26.08430290222168, "global_step": 343099, "epoch": 4133} {"train_loss": -26.593448638916016, "global_step": 343100, "epoch": 4133} {"train_loss": -26.059295654296875, "global_step": 343101, "epoch": 4133} {"train_loss": -26.238208770751953, "global_step": 343102, "epoch": 4133} {"train_loss": -26.247034072875977, "global_step": 343103, "epoch": 4133} {"train_loss": -25.671621322631836, "global_step": 343104, "epoch": 4133} {"train_loss": -25.66135025024414, "global_step": 343105, "epoch": 4133} {"train_loss": -26.128263473510742, "global_step": 343106, "epoch": 4133} {"train_loss": -26.378355026245117, "global_step": 343107, "epoch": 4133} {"train_loss": -25.842670440673828, "global_step": 343108, "epoch": 4133} {"train_loss": -25.81949234008789, "global_step": 343109, "epoch": 4133} {"train_loss": -25.8266544342041, "global_step": 343110, "epoch": 4133} {"train_loss": -26.13579750061035, "global_step": 343111, "epoch": 4133} {"train_loss": -26.257556915283203, "global_step": 343112, "epoch": 4133} {"train_loss": -26.5786190032959, "global_step": 343113, "epoch": 4133} {"train_loss": -26.49811363220215, "global_step": 343114, "epoch": 4133} {"train_loss": -26.357213973999023, "global_step": 343115, "epoch": 4133} {"train_loss": -26.442773818969727, "global_step": 343116, "epoch": 4133} {"train_loss": -25.953872680664062, "global_step": 343117, "epoch": 4133} {"train_loss": -26.004377365112305, "global_step": 343118, "epoch": 4133} {"train_loss": -25.991254806518555, "global_step": 343119, "epoch": 4133} {"train_loss": -26.162322998046875, "global_step": 343120, "epoch": 4133} {"train_loss": -25.89663130978504, "global_step": 343121, "epoch": 4133, "val_loss": 6635091.0} {"train_loss": -26.176984786987305, "global_step": 343122, "epoch": 4134} {"train_loss": -25.964941024780273, "global_step": 343123, "epoch": 4134} {"train_loss": -25.008808135986328, "global_step": 343124, "epoch": 4134} {"train_loss": -25.396656036376953, "global_step": 343125, "epoch": 4134} {"train_loss": -26.010190963745117, "global_step": 343126, "epoch": 4134} {"train_loss": -25.146944046020508, "global_step": 343127, "epoch": 4134} {"train_loss": -25.01392936706543, "global_step": 343128, "epoch": 4134} {"train_loss": -26.154541015625, "global_step": 343129, "epoch": 4134} {"train_loss": -25.608978271484375, "global_step": 343130, "epoch": 4134} {"train_loss": -25.87843132019043, "global_step": 343131, "epoch": 4134} {"train_loss": -25.806365966796875, "global_step": 343132, "epoch": 4134} {"train_loss": -26.181079864501953, "global_step": 343133, "epoch": 4134} {"train_loss": -25.888097763061523, "global_step": 343134, "epoch": 4134} {"train_loss": -26.035110473632812, "global_step": 343135, "epoch": 4134} {"train_loss": -25.621728897094727, "global_step": 343136, "epoch": 4134} {"train_loss": -25.858182907104492, "global_step": 343137, "epoch": 4134} {"train_loss": -25.817541122436523, "global_step": 343138, "epoch": 4134} {"train_loss": -26.065778732299805, "global_step": 343139, "epoch": 4134} {"train_loss": -26.000812530517578, "global_step": 343140, "epoch": 4134} {"train_loss": -26.1618595123291, "global_step": 343141, "epoch": 4134} {"train_loss": -25.423254013061523, "global_step": 343142, "epoch": 4134} {"train_loss": -25.95061683654785, "global_step": 343143, "epoch": 4134} {"train_loss": -26.029020309448242, "global_step": 343144, "epoch": 4134} {"train_loss": -25.781469345092773, "global_step": 343145, "epoch": 4134} {"train_loss": -25.9837646484375, "global_step": 343146, "epoch": 4134} {"train_loss": -26.035114288330078, "global_step": 343147, "epoch": 4134} {"train_loss": -26.082595825195312, "global_step": 343148, "epoch": 4134} {"train_loss": -26.42844009399414, "global_step": 343149, "epoch": 4134} {"train_loss": -26.349782943725586, "global_step": 343150, "epoch": 4134} {"train_loss": -26.084394454956055, "global_step": 343151, "epoch": 4134} {"train_loss": -26.252771377563477, "global_step": 343152, "epoch": 4134} {"train_loss": -26.3436222076416, "global_step": 343153, "epoch": 4134} {"train_loss": -25.970813751220703, "global_step": 343154, "epoch": 4134} {"train_loss": -26.296539306640625, "global_step": 343155, "epoch": 4134} {"train_loss": -26.44996452331543, "global_step": 343156, "epoch": 4134} {"train_loss": -26.146549224853516, "global_step": 343157, "epoch": 4134} {"train_loss": -26.457876205444336, "global_step": 343158, "epoch": 4134} {"train_loss": -26.168359756469727, "global_step": 343159, "epoch": 4134} {"train_loss": -25.974042892456055, "global_step": 343160, "epoch": 4134} {"train_loss": -26.441617965698242, "global_step": 343161, "epoch": 4134} {"train_loss": -25.973669052124023, "global_step": 343162, "epoch": 4134} {"train_loss": -26.522724151611328, "global_step": 343163, "epoch": 4134} {"train_loss": -26.173099517822266, "global_step": 343164, "epoch": 4134} {"train_loss": -25.878942489624023, "global_step": 343165, "epoch": 4134} {"train_loss": -26.18610191345215, "global_step": 343166, "epoch": 4134} {"train_loss": -26.375885009765625, "global_step": 343167, "epoch": 4134} {"train_loss": -26.25360107421875, "global_step": 343168, "epoch": 4134} {"train_loss": -25.89519691467285, "global_step": 343169, "epoch": 4134} {"train_loss": -25.5308895111084, "global_step": 343170, "epoch": 4134} {"train_loss": -25.676557540893555, "global_step": 343171, "epoch": 4134} {"train_loss": -25.614221572875977, "global_step": 343172, "epoch": 4134} {"train_loss": -25.477689743041992, "global_step": 343173, "epoch": 4134} {"train_loss": -25.35013771057129, "global_step": 343174, "epoch": 4134} {"train_loss": -25.7490291595459, "global_step": 343175, "epoch": 4134} {"train_loss": -25.969867706298828, "global_step": 343176, "epoch": 4134} {"train_loss": -25.64497947692871, "global_step": 343177, "epoch": 4134} {"train_loss": -25.993085861206055, "global_step": 343178, "epoch": 4134} {"train_loss": -25.577974319458008, "global_step": 343179, "epoch": 4134} {"train_loss": -26.11199951171875, "global_step": 343180, "epoch": 4134} {"train_loss": -25.657455444335938, "global_step": 343181, "epoch": 4134} {"train_loss": -26.027313232421875, "global_step": 343182, "epoch": 4134} {"train_loss": -26.0188045501709, "global_step": 343183, "epoch": 4134} {"train_loss": -26.261245727539062, "global_step": 343184, "epoch": 4134} {"train_loss": -26.042524337768555, "global_step": 343185, "epoch": 4134} {"train_loss": -26.119873046875, "global_step": 343186, "epoch": 4134} {"train_loss": -26.0533447265625, "global_step": 343187, "epoch": 4134} {"train_loss": -26.257461547851562, "global_step": 343188, "epoch": 4134} {"train_loss": -26.0247745513916, "global_step": 343189, "epoch": 4134} {"train_loss": -26.291234970092773, "global_step": 343190, "epoch": 4134} {"train_loss": -26.151090621948242, "global_step": 343191, "epoch": 4134} {"train_loss": -26.24024772644043, "global_step": 343192, "epoch": 4134} {"train_loss": -26.005035400390625, "global_step": 343193, "epoch": 4134} {"train_loss": -26.234663009643555, "global_step": 343194, "epoch": 4134} {"train_loss": -26.1007080078125, "global_step": 343195, "epoch": 4134} {"train_loss": -26.115482330322266, "global_step": 343196, "epoch": 4134} {"train_loss": -26.21100425720215, "global_step": 343197, "epoch": 4134} {"train_loss": -25.978504180908203, "global_step": 343198, "epoch": 4134} {"train_loss": -26.501203536987305, "global_step": 343199, "epoch": 4134} {"train_loss": -26.0223388671875, "global_step": 343200, "epoch": 4134} {"train_loss": -26.133520126342773, "global_step": 343201, "epoch": 4134} {"train_loss": -26.175817489624023, "global_step": 343202, "epoch": 4134} {"train_loss": -26.278915405273438, "global_step": 343203, "epoch": 4134} {"train_loss": -25.997774285006237, "global_step": 343204, "epoch": 4134, "val_loss": 6519392.0} {"train_loss": -26.14411735534668, "global_step": 343205, "epoch": 4135} {"train_loss": -26.330829620361328, "global_step": 343206, "epoch": 4135} {"train_loss": -26.003026962280273, "global_step": 343207, "epoch": 4135} {"train_loss": -26.009458541870117, "global_step": 343208, "epoch": 4135} {"train_loss": -26.043323516845703, "global_step": 343209, "epoch": 4135} {"train_loss": -25.910886764526367, "global_step": 343210, "epoch": 4135} {"train_loss": -25.314809799194336, "global_step": 343211, "epoch": 4135} {"train_loss": -25.81801414489746, "global_step": 343212, "epoch": 4135} {"train_loss": -26.247827529907227, "global_step": 343213, "epoch": 4135} {"train_loss": -25.326419830322266, "global_step": 343214, "epoch": 4135} {"train_loss": -25.6306095123291, "global_step": 343215, "epoch": 4135} {"train_loss": -26.048282623291016, "global_step": 343216, "epoch": 4135} {"train_loss": -26.28837013244629, "global_step": 343217, "epoch": 4135} {"train_loss": -25.95244789123535, "global_step": 343218, "epoch": 4135} {"train_loss": -26.34861183166504, "global_step": 343219, "epoch": 4135} {"train_loss": -25.810026168823242, "global_step": 343220, "epoch": 4135} {"train_loss": -26.150516510009766, "global_step": 343221, "epoch": 4135} {"train_loss": -26.044479370117188, "global_step": 343222, "epoch": 4135} {"train_loss": -25.792875289916992, "global_step": 343223, "epoch": 4135} {"train_loss": -26.049503326416016, "global_step": 343224, "epoch": 4135} {"train_loss": -26.035938262939453, "global_step": 343225, "epoch": 4135} {"train_loss": -26.21341323852539, "global_step": 343226, "epoch": 4135} {"train_loss": -25.70465087890625, "global_step": 343227, "epoch": 4135} {"train_loss": -25.69000816345215, "global_step": 343228, "epoch": 4135} {"train_loss": -26.18145179748535, "global_step": 343229, "epoch": 4135} {"train_loss": -26.2714900970459, "global_step": 343230, "epoch": 4135} {"train_loss": -26.653732299804688, "global_step": 343231, "epoch": 4135} {"train_loss": -26.20368766784668, "global_step": 343232, "epoch": 4135} {"train_loss": -26.274015426635742, "global_step": 343233, "epoch": 4135} {"train_loss": -26.35772705078125, "global_step": 343234, "epoch": 4135} {"train_loss": -26.063812255859375, "global_step": 343235, "epoch": 4135} {"train_loss": -25.92146873474121, "global_step": 343236, "epoch": 4135} {"train_loss": -26.239322662353516, "global_step": 343237, "epoch": 4135} {"train_loss": -26.02107048034668, "global_step": 343238, "epoch": 4135} {"train_loss": -26.065399169921875, "global_step": 343239, "epoch": 4135} {"train_loss": -26.335041046142578, "global_step": 343240, "epoch": 4135} {"train_loss": -26.1018123626709, "global_step": 343241, "epoch": 4135} {"train_loss": -26.28498649597168, "global_step": 343242, "epoch": 4135} {"train_loss": -25.81879234313965, "global_step": 343243, "epoch": 4135} {"train_loss": -26.3426513671875, "global_step": 343244, "epoch": 4135} {"train_loss": -26.30621910095215, "global_step": 343245, "epoch": 4135} {"train_loss": -26.340696334838867, "global_step": 343246, "epoch": 4135} {"train_loss": -26.536758422851562, "global_step": 343247, "epoch": 4135} {"train_loss": -26.26323890686035, "global_step": 343248, "epoch": 4135} {"train_loss": -26.163593292236328, "global_step": 343249, "epoch": 4135} {"train_loss": -26.30030632019043, "global_step": 343250, "epoch": 4135} {"train_loss": -26.34901237487793, "global_step": 343251, "epoch": 4135} {"train_loss": -26.662017822265625, "global_step": 343252, "epoch": 4135} {"train_loss": -26.131397247314453, "global_step": 343253, "epoch": 4135} {"train_loss": -26.11097526550293, "global_step": 343254, "epoch": 4135} {"train_loss": -26.467248916625977, "global_step": 343255, "epoch": 4135} {"train_loss": -26.352136611938477, "global_step": 343256, "epoch": 4135} {"train_loss": -26.440515518188477, "global_step": 343257, "epoch": 4135} {"train_loss": -26.27686882019043, "global_step": 343258, "epoch": 4135} {"train_loss": -26.191537857055664, "global_step": 343259, "epoch": 4135} {"train_loss": -26.352375030517578, "global_step": 343260, "epoch": 4135} {"train_loss": -25.829669952392578, "global_step": 343261, "epoch": 4135} {"train_loss": -26.030868530273438, "global_step": 343262, "epoch": 4135} {"train_loss": -26.29367446899414, "global_step": 343263, "epoch": 4135} {"train_loss": -25.765344619750977, "global_step": 343264, "epoch": 4135} {"train_loss": -26.176681518554688, "global_step": 343265, "epoch": 4135} {"train_loss": -25.547672271728516, "global_step": 343266, "epoch": 4135} {"train_loss": -25.998340606689453, "global_step": 343267, "epoch": 4135} {"train_loss": -26.00832176208496, "global_step": 343268, "epoch": 4135} {"train_loss": -25.889225006103516, "global_step": 343269, "epoch": 4135} {"train_loss": -25.748762130737305, "global_step": 343270, "epoch": 4135} {"train_loss": -25.666288375854492, "global_step": 343271, "epoch": 4135} {"train_loss": -26.542678833007812, "global_step": 343272, "epoch": 4135} {"train_loss": -26.01849937438965, "global_step": 343273, "epoch": 4135} {"train_loss": -26.330947875976562, "global_step": 343274, "epoch": 4135} {"train_loss": -25.751880645751953, "global_step": 343275, "epoch": 4135} {"train_loss": -26.2445068359375, "global_step": 343276, "epoch": 4135} {"train_loss": -26.12410545349121, "global_step": 343277, "epoch": 4135} {"train_loss": -26.38226890563965, "global_step": 343278, "epoch": 4135} {"train_loss": -25.946731567382812, "global_step": 343279, "epoch": 4135} {"train_loss": -26.211278915405273, "global_step": 343280, "epoch": 4135} {"train_loss": -26.2900333404541, "global_step": 343281, "epoch": 4135} {"train_loss": -25.9863224029541, "global_step": 343282, "epoch": 4135} {"train_loss": -26.358911514282227, "global_step": 343283, "epoch": 4135} {"train_loss": -26.231037139892578, "global_step": 343284, "epoch": 4135} {"train_loss": -25.96822166442871, "global_step": 343285, "epoch": 4135} {"train_loss": -26.092655181884766, "global_step": 343286, "epoch": 4135} {"train_loss": -26.114763099026966, "global_step": 343287, "epoch": 4135, "val_loss": 6590802.5} {"train_loss": -23.96830940246582, "global_step": 343288, "epoch": 4136} {"train_loss": -23.215713500976562, "global_step": 343289, "epoch": 4136} {"train_loss": -24.343130111694336, "global_step": 343290, "epoch": 4136} {"train_loss": -25.295019149780273, "global_step": 343291, "epoch": 4136} {"train_loss": -25.004186630249023, "global_step": 343292, "epoch": 4136} {"train_loss": -24.792770385742188, "global_step": 343293, "epoch": 4136} {"train_loss": -24.938919067382812, "global_step": 343294, "epoch": 4136} {"train_loss": -24.73859977722168, "global_step": 343295, "epoch": 4136} {"train_loss": -25.30305290222168, "global_step": 343296, "epoch": 4136} {"train_loss": -24.952417373657227, "global_step": 343297, "epoch": 4136} {"train_loss": -25.372896194458008, "global_step": 343298, "epoch": 4136} {"train_loss": -25.61863136291504, "global_step": 343299, "epoch": 4136} {"train_loss": -25.244213104248047, "global_step": 343300, "epoch": 4136} {"train_loss": -25.19723892211914, "global_step": 343301, "epoch": 4136} {"train_loss": -25.358736038208008, "global_step": 343302, "epoch": 4136} {"train_loss": -25.50215721130371, "global_step": 343303, "epoch": 4136} {"train_loss": -25.139606475830078, "global_step": 343304, "epoch": 4136} {"train_loss": -25.292009353637695, "global_step": 343305, "epoch": 4136} {"train_loss": -25.59344482421875, "global_step": 343306, "epoch": 4136} {"train_loss": -25.501787185668945, "global_step": 343307, "epoch": 4136} {"train_loss": -25.8868465423584, "global_step": 343308, "epoch": 4136} {"train_loss": -25.78969383239746, "global_step": 343309, "epoch": 4136} {"train_loss": -25.492826461791992, "global_step": 343310, "epoch": 4136} {"train_loss": -25.455915451049805, "global_step": 343311, "epoch": 4136} {"train_loss": -25.64798927307129, "global_step": 343312, "epoch": 4136} {"train_loss": -25.525728225708008, "global_step": 343313, "epoch": 4136} {"train_loss": -25.93116569519043, "global_step": 343314, "epoch": 4136} {"train_loss": -25.7634220123291, "global_step": 343315, "epoch": 4136} {"train_loss": -25.995885848999023, "global_step": 343316, "epoch": 4136} {"train_loss": -25.9858341217041, "global_step": 343317, "epoch": 4136} {"train_loss": -25.76043701171875, "global_step": 343318, "epoch": 4136} {"train_loss": -25.940393447875977, "global_step": 343319, "epoch": 4136} {"train_loss": -26.0662899017334, "global_step": 343320, "epoch": 4136} {"train_loss": -26.125690460205078, "global_step": 343321, "epoch": 4136} {"train_loss": -26.32501220703125, "global_step": 343322, "epoch": 4136} {"train_loss": -25.858617782592773, "global_step": 343323, "epoch": 4136} {"train_loss": -25.888809204101562, "global_step": 343324, "epoch": 4136} {"train_loss": -26.1210994720459, "global_step": 343325, "epoch": 4136} {"train_loss": -26.0296688079834, "global_step": 343326, "epoch": 4136} {"train_loss": -26.296924591064453, "global_step": 343327, "epoch": 4136} {"train_loss": -26.1113338470459, "global_step": 343328, "epoch": 4136} {"train_loss": -26.095121383666992, "global_step": 343329, "epoch": 4136} {"train_loss": -26.229248046875, "global_step": 343330, "epoch": 4136} {"train_loss": -26.078571319580078, "global_step": 343331, "epoch": 4136} {"train_loss": -26.10076904296875, "global_step": 343332, "epoch": 4136} {"train_loss": -25.845294952392578, "global_step": 343333, "epoch": 4136} {"train_loss": -26.3747615814209, "global_step": 343334, "epoch": 4136} {"train_loss": -26.311079025268555, "global_step": 343335, "epoch": 4136} {"train_loss": -26.393518447875977, "global_step": 343336, "epoch": 4136} {"train_loss": -26.23432731628418, "global_step": 343337, "epoch": 4136} {"train_loss": -26.72773551940918, "global_step": 343338, "epoch": 4136} {"train_loss": -26.45635414123535, "global_step": 343339, "epoch": 4136} {"train_loss": -26.184097290039062, "global_step": 343340, "epoch": 4136} {"train_loss": -26.470849990844727, "global_step": 343341, "epoch": 4136} {"train_loss": -26.35004997253418, "global_step": 343342, "epoch": 4136} {"train_loss": -26.385059356689453, "global_step": 343343, "epoch": 4136} {"train_loss": -26.12226676940918, "global_step": 343344, "epoch": 4136} {"train_loss": -26.25031089782715, "global_step": 343345, "epoch": 4136} {"train_loss": -26.279287338256836, "global_step": 343346, "epoch": 4136} {"train_loss": -26.359664916992188, "global_step": 343347, "epoch": 4136} {"train_loss": -25.901514053344727, "global_step": 343348, "epoch": 4136} {"train_loss": -25.882226943969727, "global_step": 343349, "epoch": 4136} {"train_loss": -25.806396484375, "global_step": 343350, "epoch": 4136} {"train_loss": -25.79169273376465, "global_step": 343351, "epoch": 4136} {"train_loss": -26.236331939697266, "global_step": 343352, "epoch": 4136} {"train_loss": -26.22283363342285, "global_step": 343353, "epoch": 4136} {"train_loss": -26.00751304626465, "global_step": 343354, "epoch": 4136} {"train_loss": -26.151264190673828, "global_step": 343355, "epoch": 4136} {"train_loss": -26.273406982421875, "global_step": 343356, "epoch": 4136} {"train_loss": -25.964359283447266, "global_step": 343357, "epoch": 4136} {"train_loss": -26.080575942993164, "global_step": 343358, "epoch": 4136} {"train_loss": -25.920825958251953, "global_step": 343359, "epoch": 4136} {"train_loss": -26.15540885925293, "global_step": 343360, "epoch": 4136} {"train_loss": -25.81329917907715, "global_step": 343361, "epoch": 4136} {"train_loss": -26.018415451049805, "global_step": 343362, "epoch": 4136} {"train_loss": -25.869245529174805, "global_step": 343363, "epoch": 4136} {"train_loss": -26.03012466430664, "global_step": 343364, "epoch": 4136} {"train_loss": -25.68597412109375, "global_step": 343365, "epoch": 4136} {"train_loss": -25.391408920288086, "global_step": 343366, "epoch": 4136} {"train_loss": -25.77628517150879, "global_step": 343367, "epoch": 4136} {"train_loss": -26.013395309448242, "global_step": 343368, "epoch": 4136} {"train_loss": -25.686553955078125, "global_step": 343369, "epoch": 4136} {"train_loss": -25.796124285962208, "global_step": 343370, "epoch": 4136, "val_loss": 6609263.5} {"train_loss": -25.510499954223633, "global_step": 343371, "epoch": 4137} {"train_loss": -24.977725982666016, "global_step": 343372, "epoch": 4137} {"train_loss": -25.53354835510254, "global_step": 343373, "epoch": 4137} {"train_loss": -25.81818199157715, "global_step": 343374, "epoch": 4137} {"train_loss": -25.36866569519043, "global_step": 343375, "epoch": 4137} {"train_loss": -25.711523056030273, "global_step": 343376, "epoch": 4137} {"train_loss": -25.455297470092773, "global_step": 343377, "epoch": 4137} {"train_loss": -25.3704891204834, "global_step": 343378, "epoch": 4137} {"train_loss": -25.220626831054688, "global_step": 343379, "epoch": 4137} {"train_loss": -25.456268310546875, "global_step": 343380, "epoch": 4137} {"train_loss": -25.830976486206055, "global_step": 343381, "epoch": 4137} {"train_loss": -25.800800323486328, "global_step": 343382, "epoch": 4137} {"train_loss": -26.264698028564453, "global_step": 343383, "epoch": 4137} {"train_loss": -25.605911254882812, "global_step": 343384, "epoch": 4137} {"train_loss": -25.694482803344727, "global_step": 343385, "epoch": 4137} {"train_loss": -25.581138610839844, "global_step": 343386, "epoch": 4137} {"train_loss": -25.707096099853516, "global_step": 343387, "epoch": 4137} {"train_loss": -25.90266990661621, "global_step": 343388, "epoch": 4137} {"train_loss": -26.217138290405273, "global_step": 343389, "epoch": 4137} {"train_loss": -25.70465660095215, "global_step": 343390, "epoch": 4137} {"train_loss": -25.58576202392578, "global_step": 343391, "epoch": 4137} {"train_loss": -25.699142456054688, "global_step": 343392, "epoch": 4137} {"train_loss": -25.678089141845703, "global_step": 343393, "epoch": 4137} {"train_loss": -26.212488174438477, "global_step": 343394, "epoch": 4137} {"train_loss": -26.02985191345215, "global_step": 343395, "epoch": 4137} {"train_loss": -25.70203971862793, "global_step": 343396, "epoch": 4137} {"train_loss": -25.641218185424805, "global_step": 343397, "epoch": 4137} {"train_loss": -26.344680786132812, "global_step": 343398, "epoch": 4137} {"train_loss": -26.28773307800293, "global_step": 343399, "epoch": 4137} {"train_loss": -25.9377498626709, "global_step": 343400, "epoch": 4137} {"train_loss": -25.97971534729004, "global_step": 343401, "epoch": 4137} {"train_loss": -26.367938995361328, "global_step": 343402, "epoch": 4137} {"train_loss": -26.126611709594727, "global_step": 343403, "epoch": 4137} {"train_loss": -26.241302490234375, "global_step": 343404, "epoch": 4137} {"train_loss": -26.3245906829834, "global_step": 343405, "epoch": 4137} {"train_loss": -26.54046630859375, "global_step": 343406, "epoch": 4137} {"train_loss": -25.748294830322266, "global_step": 343407, "epoch": 4137} {"train_loss": -26.013036727905273, "global_step": 343408, "epoch": 4137} {"train_loss": -26.590457916259766, "global_step": 343409, "epoch": 4137} {"train_loss": -26.25238609313965, "global_step": 343410, "epoch": 4137} {"train_loss": -26.097888946533203, "global_step": 343411, "epoch": 4137} {"train_loss": -26.387130737304688, "global_step": 343412, "epoch": 4137} {"train_loss": -26.14963150024414, "global_step": 343413, "epoch": 4137} {"train_loss": -26.450214385986328, "global_step": 343414, "epoch": 4137} {"train_loss": -26.19195556640625, "global_step": 343415, "epoch": 4137} {"train_loss": -26.22603416442871, "global_step": 343416, "epoch": 4137} {"train_loss": -26.122068405151367, "global_step": 343417, "epoch": 4137} {"train_loss": -26.01951026916504, "global_step": 343418, "epoch": 4137} {"train_loss": -26.172651290893555, "global_step": 343419, "epoch": 4137} {"train_loss": -26.575626373291016, "global_step": 343420, "epoch": 4137} {"train_loss": -26.3818416595459, "global_step": 343421, "epoch": 4137} {"train_loss": -26.812833786010742, "global_step": 343422, "epoch": 4137} {"train_loss": -26.120025634765625, "global_step": 343423, "epoch": 4137} {"train_loss": -26.4537353515625, "global_step": 343424, "epoch": 4137} {"train_loss": -25.900049209594727, "global_step": 343425, "epoch": 4137} {"train_loss": -26.147626876831055, "global_step": 343426, "epoch": 4137} {"train_loss": -25.622272491455078, "global_step": 343427, "epoch": 4137} {"train_loss": -25.266223907470703, "global_step": 343428, "epoch": 4137} {"train_loss": -25.6542911529541, "global_step": 343429, "epoch": 4137} {"train_loss": -25.837491989135742, "global_step": 343430, "epoch": 4137} {"train_loss": -25.810169219970703, "global_step": 343431, "epoch": 4137} {"train_loss": -25.918720245361328, "global_step": 343432, "epoch": 4137} {"train_loss": -25.99347496032715, "global_step": 343433, "epoch": 4137} {"train_loss": -25.898761749267578, "global_step": 343434, "epoch": 4137} {"train_loss": -25.914886474609375, "global_step": 343435, "epoch": 4137} {"train_loss": -26.12098503112793, "global_step": 343436, "epoch": 4137} {"train_loss": -26.2034854888916, "global_step": 343437, "epoch": 4137} {"train_loss": -25.627613067626953, "global_step": 343438, "epoch": 4137} {"train_loss": -26.064756393432617, "global_step": 343439, "epoch": 4137} {"train_loss": -25.979413986206055, "global_step": 343440, "epoch": 4137} {"train_loss": -26.022809982299805, "global_step": 343441, "epoch": 4137} {"train_loss": -26.125476837158203, "global_step": 343442, "epoch": 4137} {"train_loss": -26.168170928955078, "global_step": 343443, "epoch": 4137} {"train_loss": -26.343158721923828, "global_step": 343444, "epoch": 4137} {"train_loss": -26.302825927734375, "global_step": 343445, "epoch": 4137} {"train_loss": -26.019872665405273, "global_step": 343446, "epoch": 4137} {"train_loss": -26.0305233001709, "global_step": 343447, "epoch": 4137} {"train_loss": -26.40860939025879, "global_step": 343448, "epoch": 4137} {"train_loss": -26.249570846557617, "global_step": 343449, "epoch": 4137} {"train_loss": -26.238290786743164, "global_step": 343450, "epoch": 4137} {"train_loss": -26.40635108947754, "global_step": 343451, "epoch": 4137} {"train_loss": -26.298185348510742, "global_step": 343452, "epoch": 4137} {"train_loss": -25.974930292152496, "global_step": 343453, "epoch": 4137, "val_loss": 6572577.5} {"train_loss": -25.358549118041992, "global_step": 343454, "epoch": 4138} {"train_loss": -25.694656372070312, "global_step": 343455, "epoch": 4138} {"train_loss": -25.64267349243164, "global_step": 343456, "epoch": 4138} {"train_loss": -25.818326950073242, "global_step": 343457, "epoch": 4138} {"train_loss": -25.995777130126953, "global_step": 343458, "epoch": 4138} {"train_loss": -25.408933639526367, "global_step": 343459, "epoch": 4138} {"train_loss": -25.567581176757812, "global_step": 343460, "epoch": 4138} {"train_loss": -25.400127410888672, "global_step": 343461, "epoch": 4138} {"train_loss": -25.557336807250977, "global_step": 343462, "epoch": 4138} {"train_loss": -25.947956085205078, "global_step": 343463, "epoch": 4138} {"train_loss": -26.061206817626953, "global_step": 343464, "epoch": 4138} {"train_loss": -25.8072566986084, "global_step": 343465, "epoch": 4138} {"train_loss": -26.051599502563477, "global_step": 343466, "epoch": 4138} {"train_loss": -25.772993087768555, "global_step": 343467, "epoch": 4138} {"train_loss": -25.71376609802246, "global_step": 343468, "epoch": 4138} {"train_loss": -26.002782821655273, "global_step": 343469, "epoch": 4138} {"train_loss": -25.635046005249023, "global_step": 343470, "epoch": 4138} {"train_loss": -26.104755401611328, "global_step": 343471, "epoch": 4138} {"train_loss": -26.002065658569336, "global_step": 343472, "epoch": 4138} {"train_loss": -26.142423629760742, "global_step": 343473, "epoch": 4138} {"train_loss": -25.87359619140625, "global_step": 343474, "epoch": 4138} {"train_loss": -25.89418601989746, "global_step": 343475, "epoch": 4138} {"train_loss": -25.80379295349121, "global_step": 343476, "epoch": 4138} {"train_loss": -25.920703887939453, "global_step": 343477, "epoch": 4138} {"train_loss": -25.985952377319336, "global_step": 343478, "epoch": 4138} {"train_loss": -25.921674728393555, "global_step": 343479, "epoch": 4138} {"train_loss": -26.002195358276367, "global_step": 343480, "epoch": 4138} {"train_loss": -26.060232162475586, "global_step": 343481, "epoch": 4138} {"train_loss": -26.339038848876953, "global_step": 343482, "epoch": 4138} {"train_loss": -26.130329132080078, "global_step": 343483, "epoch": 4138} {"train_loss": -26.139942169189453, "global_step": 343484, "epoch": 4138} {"train_loss": -26.28253746032715, "global_step": 343485, "epoch": 4138} {"train_loss": -26.116743087768555, "global_step": 343486, "epoch": 4138} {"train_loss": -26.149789810180664, "global_step": 343487, "epoch": 4138} {"train_loss": -26.12456703186035, "global_step": 343488, "epoch": 4138} {"train_loss": -26.02617835998535, "global_step": 343489, "epoch": 4138} {"train_loss": -25.996906280517578, "global_step": 343490, "epoch": 4138} {"train_loss": -26.04485511779785, "global_step": 343491, "epoch": 4138} {"train_loss": -25.61516761779785, "global_step": 343492, "epoch": 4138} {"train_loss": -26.033498764038086, "global_step": 343493, "epoch": 4138} {"train_loss": -25.634765625, "global_step": 343494, "epoch": 4138} {"train_loss": -25.862319946289062, "global_step": 343495, "epoch": 4138} {"train_loss": -26.200428009033203, "global_step": 343496, "epoch": 4138} {"train_loss": -26.184131622314453, "global_step": 343497, "epoch": 4138} {"train_loss": -25.63447380065918, "global_step": 343498, "epoch": 4138} {"train_loss": -26.265796661376953, "global_step": 343499, "epoch": 4138} {"train_loss": -26.07781982421875, "global_step": 343500, "epoch": 4138} {"train_loss": -25.752233505249023, "global_step": 343501, "epoch": 4138} {"train_loss": -25.986774444580078, "global_step": 343502, "epoch": 4138} {"train_loss": -26.001697540283203, "global_step": 343503, "epoch": 4138} {"train_loss": -26.074079513549805, "global_step": 343504, "epoch": 4138} {"train_loss": -25.873626708984375, "global_step": 343505, "epoch": 4138} {"train_loss": -25.989477157592773, "global_step": 343506, "epoch": 4138} {"train_loss": -25.960046768188477, "global_step": 343507, "epoch": 4138} {"train_loss": -25.98086929321289, "global_step": 343508, "epoch": 4138} {"train_loss": -26.147064208984375, "global_step": 343509, "epoch": 4138} {"train_loss": -26.129281997680664, "global_step": 343510, "epoch": 4138} {"train_loss": -26.14716911315918, "global_step": 343511, "epoch": 4138} {"train_loss": -25.88422966003418, "global_step": 343512, "epoch": 4138} {"train_loss": -26.368749618530273, "global_step": 343513, "epoch": 4138} {"train_loss": -26.3743839263916, "global_step": 343514, "epoch": 4138} {"train_loss": -26.0494441986084, "global_step": 343515, "epoch": 4138} {"train_loss": -26.086902618408203, "global_step": 343516, "epoch": 4138} {"train_loss": -25.980060577392578, "global_step": 343517, "epoch": 4138} {"train_loss": -25.886449813842773, "global_step": 343518, "epoch": 4138} {"train_loss": -26.3591365814209, "global_step": 343519, "epoch": 4138} {"train_loss": -26.403553009033203, "global_step": 343520, "epoch": 4138} {"train_loss": -26.256261825561523, "global_step": 343521, "epoch": 4138} {"train_loss": -25.86767578125, "global_step": 343522, "epoch": 4138} {"train_loss": -26.1220703125, "global_step": 343523, "epoch": 4138} {"train_loss": -26.178674697875977, "global_step": 343524, "epoch": 4138} {"train_loss": -26.391529083251953, "global_step": 343525, "epoch": 4138} {"train_loss": -26.070077896118164, "global_step": 343526, "epoch": 4138} {"train_loss": -26.465810775756836, "global_step": 343527, "epoch": 4138} {"train_loss": -26.079099655151367, "global_step": 343528, "epoch": 4138} {"train_loss": -26.232177734375, "global_step": 343529, "epoch": 4138} {"train_loss": -25.865509033203125, "global_step": 343530, "epoch": 4138} {"train_loss": -26.180959701538086, "global_step": 343531, "epoch": 4138} {"train_loss": -26.14015007019043, "global_step": 343532, "epoch": 4138} {"train_loss": -26.27400779724121, "global_step": 343533, "epoch": 4138} {"train_loss": -26.480976104736328, "global_step": 343534, "epoch": 4138} {"train_loss": -26.21339988708496, "global_step": 343535, "epoch": 4138} {"train_loss": -26.014465423951666, "global_step": 343536, "epoch": 4138, "val_loss": 6628566.0} {"train_loss": -24.804096221923828, "global_step": 343537, "epoch": 4139} {"train_loss": -24.904647827148438, "global_step": 343538, "epoch": 4139} {"train_loss": -25.3117618560791, "global_step": 343539, "epoch": 4139} {"train_loss": -25.61384391784668, "global_step": 343540, "epoch": 4139} {"train_loss": -25.18756675720215, "global_step": 343541, "epoch": 4139} {"train_loss": -25.371631622314453, "global_step": 343542, "epoch": 4139} {"train_loss": -25.25144386291504, "global_step": 343543, "epoch": 4139} {"train_loss": -25.44740104675293, "global_step": 343544, "epoch": 4139} {"train_loss": -25.60637855529785, "global_step": 343545, "epoch": 4139} {"train_loss": -25.938739776611328, "global_step": 343546, "epoch": 4139} {"train_loss": -25.662109375, "global_step": 343547, "epoch": 4139} {"train_loss": -25.6628475189209, "global_step": 343548, "epoch": 4139} {"train_loss": -25.4783935546875, "global_step": 343549, "epoch": 4139} {"train_loss": -25.405134201049805, "global_step": 343550, "epoch": 4139} {"train_loss": -25.747095108032227, "global_step": 343551, "epoch": 4139} {"train_loss": -25.909894943237305, "global_step": 343552, "epoch": 4139} {"train_loss": -25.995391845703125, "global_step": 343553, "epoch": 4139} {"train_loss": -25.67789077758789, "global_step": 343554, "epoch": 4139} {"train_loss": -25.87238121032715, "global_step": 343555, "epoch": 4139} {"train_loss": -25.722553253173828, "global_step": 343556, "epoch": 4139} {"train_loss": -25.600421905517578, "global_step": 343557, "epoch": 4139} {"train_loss": -26.00018310546875, "global_step": 343558, "epoch": 4139} {"train_loss": -26.100133895874023, "global_step": 343559, "epoch": 4139} {"train_loss": -26.07240104675293, "global_step": 343560, "epoch": 4139} {"train_loss": -26.18048095703125, "global_step": 343561, "epoch": 4139} {"train_loss": -26.1573486328125, "global_step": 343562, "epoch": 4139} {"train_loss": -26.028989791870117, "global_step": 343563, "epoch": 4139} {"train_loss": -26.01718521118164, "global_step": 343564, "epoch": 4139} {"train_loss": -25.705869674682617, "global_step": 343565, "epoch": 4139} {"train_loss": -26.087430953979492, "global_step": 343566, "epoch": 4139} {"train_loss": -26.242507934570312, "global_step": 343567, "epoch": 4139} {"train_loss": -25.89203453063965, "global_step": 343568, "epoch": 4139} {"train_loss": -25.672809600830078, "global_step": 343569, "epoch": 4139} {"train_loss": -26.239355087280273, "global_step": 343570, "epoch": 4139} {"train_loss": -26.1987361907959, "global_step": 343571, "epoch": 4139} {"train_loss": -25.980289459228516, "global_step": 343572, "epoch": 4139} {"train_loss": -25.92404556274414, "global_step": 343573, "epoch": 4139} {"train_loss": -25.975982666015625, "global_step": 343574, "epoch": 4139} {"train_loss": -25.837940216064453, "global_step": 343575, "epoch": 4139} {"train_loss": -26.21673583984375, "global_step": 343576, "epoch": 4139} {"train_loss": -26.01179313659668, "global_step": 343577, "epoch": 4139} {"train_loss": -26.41373062133789, "global_step": 343578, "epoch": 4139} {"train_loss": -25.948307037353516, "global_step": 343579, "epoch": 4139} {"train_loss": -25.9227294921875, "global_step": 343580, "epoch": 4139} {"train_loss": -26.1433162689209, "global_step": 343581, "epoch": 4139} {"train_loss": -26.3253231048584, "global_step": 343582, "epoch": 4139} {"train_loss": -25.9133243560791, "global_step": 343583, "epoch": 4139} {"train_loss": -25.835065841674805, "global_step": 343584, "epoch": 4139} {"train_loss": -26.151275634765625, "global_step": 343585, "epoch": 4139} {"train_loss": -26.191675186157227, "global_step": 343586, "epoch": 4139} {"train_loss": -26.25608253479004, "global_step": 343587, "epoch": 4139} {"train_loss": -26.55457878112793, "global_step": 343588, "epoch": 4139} {"train_loss": -26.120344161987305, "global_step": 343589, "epoch": 4139} {"train_loss": -26.212421417236328, "global_step": 343590, "epoch": 4139} {"train_loss": -26.225234985351562, "global_step": 343591, "epoch": 4139} {"train_loss": -25.99704933166504, "global_step": 343592, "epoch": 4139} {"train_loss": -26.21497917175293, "global_step": 343593, "epoch": 4139} {"train_loss": -26.227874755859375, "global_step": 343594, "epoch": 4139} {"train_loss": -26.009931564331055, "global_step": 343595, "epoch": 4139} {"train_loss": -26.17011833190918, "global_step": 343596, "epoch": 4139} {"train_loss": -26.24064064025879, "global_step": 343597, "epoch": 4139} {"train_loss": -25.854511260986328, "global_step": 343598, "epoch": 4139} {"train_loss": -26.09853172302246, "global_step": 343599, "epoch": 4139} {"train_loss": -26.17148780822754, "global_step": 343600, "epoch": 4139} {"train_loss": -26.180150985717773, "global_step": 343601, "epoch": 4139} {"train_loss": -26.3419132232666, "global_step": 343602, "epoch": 4139} {"train_loss": -26.320226669311523, "global_step": 343603, "epoch": 4139} {"train_loss": -26.207839965820312, "global_step": 343604, "epoch": 4139} {"train_loss": -26.438404083251953, "global_step": 343605, "epoch": 4139} {"train_loss": -26.03895378112793, "global_step": 343606, "epoch": 4139} {"train_loss": -26.201059341430664, "global_step": 343607, "epoch": 4139} {"train_loss": -26.33744239807129, "global_step": 343608, "epoch": 4139} {"train_loss": -26.08747673034668, "global_step": 343609, "epoch": 4139} {"train_loss": -26.12735939025879, "global_step": 343610, "epoch": 4139} {"train_loss": -26.23164176940918, "global_step": 343611, "epoch": 4139} {"train_loss": -26.044116973876953, "global_step": 343612, "epoch": 4139} {"train_loss": -26.509567260742188, "global_step": 343613, "epoch": 4139} {"train_loss": -26.3380126953125, "global_step": 343614, "epoch": 4139} {"train_loss": -26.2751522064209, "global_step": 343615, "epoch": 4139} {"train_loss": -26.124387741088867, "global_step": 343616, "epoch": 4139} {"train_loss": -26.240503311157227, "global_step": 343617, "epoch": 4139} {"train_loss": -26.1795711517334, "global_step": 343618, "epoch": 4139} {"train_loss": -25.980477022837444, "global_step": 343619, "epoch": 4139, "val_loss": 6609867.0} {"train_loss": -25.838855743408203, "global_step": 343620, "epoch": 4140} {"train_loss": -25.79498291015625, "global_step": 343621, "epoch": 4140} {"train_loss": -25.474470138549805, "global_step": 343622, "epoch": 4140} {"train_loss": -25.580053329467773, "global_step": 343623, "epoch": 4140} {"train_loss": -25.426000595092773, "global_step": 343624, "epoch": 4140} {"train_loss": -25.69086265563965, "global_step": 343625, "epoch": 4140} {"train_loss": -26.020849227905273, "global_step": 343626, "epoch": 4140} {"train_loss": -25.642230987548828, "global_step": 343627, "epoch": 4140} {"train_loss": -26.3709659576416, "global_step": 343628, "epoch": 4140} {"train_loss": -25.618345260620117, "global_step": 343629, "epoch": 4140} {"train_loss": -26.03321647644043, "global_step": 343630, "epoch": 4140} {"train_loss": -25.864938735961914, "global_step": 343631, "epoch": 4140} {"train_loss": -25.78903579711914, "global_step": 343632, "epoch": 4140} {"train_loss": -25.98872184753418, "global_step": 343633, "epoch": 4140} {"train_loss": -26.047840118408203, "global_step": 343634, "epoch": 4140} {"train_loss": -26.32220458984375, "global_step": 343635, "epoch": 4140} {"train_loss": -25.897214889526367, "global_step": 343636, "epoch": 4140} {"train_loss": -25.8719539642334, "global_step": 343637, "epoch": 4140} {"train_loss": -26.05439567565918, "global_step": 343638, "epoch": 4140} {"train_loss": -25.8068790435791, "global_step": 343639, "epoch": 4140} {"train_loss": -25.980268478393555, "global_step": 343640, "epoch": 4140} {"train_loss": -26.14056968688965, "global_step": 343641, "epoch": 4140} {"train_loss": -26.206098556518555, "global_step": 343642, "epoch": 4140} {"train_loss": -26.07112693786621, "global_step": 343643, "epoch": 4140} {"train_loss": -26.130496978759766, "global_step": 343644, "epoch": 4140} {"train_loss": -26.347217559814453, "global_step": 343645, "epoch": 4140} {"train_loss": -25.802942276000977, "global_step": 343646, "epoch": 4140} {"train_loss": -25.89375114440918, "global_step": 343647, "epoch": 4140} {"train_loss": -25.810388565063477, "global_step": 343648, "epoch": 4140} {"train_loss": -26.419126510620117, "global_step": 343649, "epoch": 4140} {"train_loss": -26.304792404174805, "global_step": 343650, "epoch": 4140} {"train_loss": -26.148880004882812, "global_step": 343651, "epoch": 4140} {"train_loss": -26.454334259033203, "global_step": 343652, "epoch": 4140} {"train_loss": -26.273767471313477, "global_step": 343653, "epoch": 4140} {"train_loss": -26.34575843811035, "global_step": 343654, "epoch": 4140} {"train_loss": -25.702472686767578, "global_step": 343655, "epoch": 4140} {"train_loss": -26.06043815612793, "global_step": 343656, "epoch": 4140} {"train_loss": -26.315170288085938, "global_step": 343657, "epoch": 4140} {"train_loss": -26.057336807250977, "global_step": 343658, "epoch": 4140} {"train_loss": -25.925809860229492, "global_step": 343659, "epoch": 4140} {"train_loss": -26.575260162353516, "global_step": 343660, "epoch": 4140} {"train_loss": -26.08379554748535, "global_step": 343661, "epoch": 4140} {"train_loss": -25.68195152282715, "global_step": 343662, "epoch": 4140} {"train_loss": -26.07232666015625, "global_step": 343663, "epoch": 4140} {"train_loss": -25.830747604370117, "global_step": 343664, "epoch": 4140} {"train_loss": -25.8653564453125, "global_step": 343665, "epoch": 4140} {"train_loss": -25.857458114624023, "global_step": 343666, "epoch": 4140} {"train_loss": -25.837854385375977, "global_step": 343667, "epoch": 4140} {"train_loss": -26.10298728942871, "global_step": 343668, "epoch": 4140} {"train_loss": -26.04196548461914, "global_step": 343669, "epoch": 4140} {"train_loss": -26.320356369018555, "global_step": 343670, "epoch": 4140} {"train_loss": -26.42630958557129, "global_step": 343671, "epoch": 4140} {"train_loss": -25.986963272094727, "global_step": 343672, "epoch": 4140} {"train_loss": -25.861536026000977, "global_step": 343673, "epoch": 4140} {"train_loss": -26.506711959838867, "global_step": 343674, "epoch": 4140} {"train_loss": -26.225666046142578, "global_step": 343675, "epoch": 4140} {"train_loss": -25.95562171936035, "global_step": 343676, "epoch": 4140} {"train_loss": -25.634632110595703, "global_step": 343677, "epoch": 4140} {"train_loss": -26.154386520385742, "global_step": 343678, "epoch": 4140} {"train_loss": -26.018232345581055, "global_step": 343679, "epoch": 4140} {"train_loss": -25.83481216430664, "global_step": 343680, "epoch": 4140} {"train_loss": -26.16693115234375, "global_step": 343681, "epoch": 4140} {"train_loss": -25.666746139526367, "global_step": 343682, "epoch": 4140} {"train_loss": -26.007551193237305, "global_step": 343683, "epoch": 4140} {"train_loss": -25.67403221130371, "global_step": 343684, "epoch": 4140} {"train_loss": -26.273529052734375, "global_step": 343685, "epoch": 4140} {"train_loss": -26.152769088745117, "global_step": 343686, "epoch": 4140} {"train_loss": -25.975378036499023, "global_step": 343687, "epoch": 4140} {"train_loss": -25.92754554748535, "global_step": 343688, "epoch": 4140} {"train_loss": -26.022314071655273, "global_step": 343689, "epoch": 4140} {"train_loss": -26.29611587524414, "global_step": 343690, "epoch": 4140} {"train_loss": -26.162153244018555, "global_step": 343691, "epoch": 4140} {"train_loss": -25.94434928894043, "global_step": 343692, "epoch": 4140} {"train_loss": -26.11269187927246, "global_step": 343693, "epoch": 4140} {"train_loss": -26.200592041015625, "global_step": 343694, "epoch": 4140} {"train_loss": -26.097089767456055, "global_step": 343695, "epoch": 4140} {"train_loss": -25.664737701416016, "global_step": 343696, "epoch": 4140} {"train_loss": -26.306427001953125, "global_step": 343697, "epoch": 4140} {"train_loss": -26.248401641845703, "global_step": 343698, "epoch": 4140} {"train_loss": -25.886524200439453, "global_step": 343699, "epoch": 4140} {"train_loss": -26.297855377197266, "global_step": 343700, "epoch": 4140} {"train_loss": -26.016164779663086, "global_step": 343701, "epoch": 4140} {"train_loss": -26.002121086580207, "global_step": 343702, "epoch": 4140, "val_loss": 6552194.0} {"train_loss": -24.947906494140625, "global_step": 343703, "epoch": 4141} {"train_loss": -25.09290885925293, "global_step": 343704, "epoch": 4141} {"train_loss": -25.39212417602539, "global_step": 343705, "epoch": 4141} {"train_loss": -25.34532356262207, "global_step": 343706, "epoch": 4141} {"train_loss": -24.841672897338867, "global_step": 343707, "epoch": 4141} {"train_loss": -25.04090690612793, "global_step": 343708, "epoch": 4141} {"train_loss": -25.660205841064453, "global_step": 343709, "epoch": 4141} {"train_loss": -25.718826293945312, "global_step": 343710, "epoch": 4141} {"train_loss": -25.509565353393555, "global_step": 343711, "epoch": 4141} {"train_loss": -25.7415771484375, "global_step": 343712, "epoch": 4141} {"train_loss": -25.869665145874023, "global_step": 343713, "epoch": 4141} {"train_loss": -25.922388076782227, "global_step": 343714, "epoch": 4141} {"train_loss": -25.806180953979492, "global_step": 343715, "epoch": 4141} {"train_loss": -25.394458770751953, "global_step": 343716, "epoch": 4141} {"train_loss": -25.623748779296875, "global_step": 343717, "epoch": 4141} {"train_loss": -25.82782554626465, "global_step": 343718, "epoch": 4141} {"train_loss": -25.78818702697754, "global_step": 343719, "epoch": 4141} {"train_loss": -26.035181045532227, "global_step": 343720, "epoch": 4141} {"train_loss": -25.591306686401367, "global_step": 343721, "epoch": 4141} {"train_loss": -25.886585235595703, "global_step": 343722, "epoch": 4141} {"train_loss": -25.629718780517578, "global_step": 343723, "epoch": 4141} {"train_loss": -25.86420249938965, "global_step": 343724, "epoch": 4141} {"train_loss": -26.005451202392578, "global_step": 343725, "epoch": 4141} {"train_loss": -25.854536056518555, "global_step": 343726, "epoch": 4141} {"train_loss": -25.8892822265625, "global_step": 343727, "epoch": 4141} {"train_loss": -26.215070724487305, "global_step": 343728, "epoch": 4141} {"train_loss": -26.138919830322266, "global_step": 343729, "epoch": 4141} {"train_loss": -25.67121696472168, "global_step": 343730, "epoch": 4141} {"train_loss": -25.774198532104492, "global_step": 343731, "epoch": 4141} {"train_loss": -26.02296257019043, "global_step": 343732, "epoch": 4141} {"train_loss": -26.129220962524414, "global_step": 343733, "epoch": 4141} {"train_loss": -26.49704360961914, "global_step": 343734, "epoch": 4141} {"train_loss": -25.944568634033203, "global_step": 343735, "epoch": 4141} {"train_loss": -26.12872886657715, "global_step": 343736, "epoch": 4141} {"train_loss": -26.05646324157715, "global_step": 343737, "epoch": 4141} {"train_loss": -25.993804931640625, "global_step": 343738, "epoch": 4141} {"train_loss": -26.42888832092285, "global_step": 343739, "epoch": 4141} {"train_loss": -25.995065689086914, "global_step": 343740, "epoch": 4141} {"train_loss": -25.998300552368164, "global_step": 343741, "epoch": 4141} {"train_loss": -25.820432662963867, "global_step": 343742, "epoch": 4141} {"train_loss": -26.46064567565918, "global_step": 343743, "epoch": 4141} {"train_loss": -26.058399200439453, "global_step": 343744, "epoch": 4141} {"train_loss": -25.979583740234375, "global_step": 343745, "epoch": 4141} {"train_loss": -25.8112850189209, "global_step": 343746, "epoch": 4141} {"train_loss": -26.054950714111328, "global_step": 343747, "epoch": 4141} {"train_loss": -26.32318687438965, "global_step": 343748, "epoch": 4141} {"train_loss": -26.210224151611328, "global_step": 343749, "epoch": 4141} {"train_loss": -26.188873291015625, "global_step": 343750, "epoch": 4141} {"train_loss": -26.2531681060791, "global_step": 343751, "epoch": 4141} {"train_loss": -26.144006729125977, "global_step": 343752, "epoch": 4141} {"train_loss": -26.096454620361328, "global_step": 343753, "epoch": 4141} {"train_loss": -25.8184871673584, "global_step": 343754, "epoch": 4141} {"train_loss": -26.446762084960938, "global_step": 343755, "epoch": 4141} {"train_loss": -26.194995880126953, "global_step": 343756, "epoch": 4141} {"train_loss": -26.059707641601562, "global_step": 343757, "epoch": 4141} {"train_loss": -26.119413375854492, "global_step": 343758, "epoch": 4141} {"train_loss": -25.969038009643555, "global_step": 343759, "epoch": 4141} {"train_loss": -26.312604904174805, "global_step": 343760, "epoch": 4141} {"train_loss": -26.01066017150879, "global_step": 343761, "epoch": 4141} {"train_loss": -26.082778930664062, "global_step": 343762, "epoch": 4141} {"train_loss": -26.21628189086914, "global_step": 343763, "epoch": 4141} {"train_loss": -26.367795944213867, "global_step": 343764, "epoch": 4141} {"train_loss": -26.01654624938965, "global_step": 343765, "epoch": 4141} {"train_loss": -26.2349796295166, "global_step": 343766, "epoch": 4141} {"train_loss": -26.150684356689453, "global_step": 343767, "epoch": 4141} {"train_loss": -26.141483306884766, "global_step": 343768, "epoch": 4141} {"train_loss": -26.311975479125977, "global_step": 343769, "epoch": 4141} {"train_loss": -26.102991104125977, "global_step": 343770, "epoch": 4141} {"train_loss": -26.143726348876953, "global_step": 343771, "epoch": 4141} {"train_loss": -26.448474884033203, "global_step": 343772, "epoch": 4141} {"train_loss": -26.159687042236328, "global_step": 343773, "epoch": 4141} {"train_loss": -26.256946563720703, "global_step": 343774, "epoch": 4141} {"train_loss": -26.006698608398438, "global_step": 343775, "epoch": 4141} {"train_loss": -26.467069625854492, "global_step": 343776, "epoch": 4141} {"train_loss": -26.11590576171875, "global_step": 343777, "epoch": 4141} {"train_loss": -26.124893188476562, "global_step": 343778, "epoch": 4141} {"train_loss": -25.932424545288086, "global_step": 343779, "epoch": 4141} {"train_loss": -26.328245162963867, "global_step": 343780, "epoch": 4141} {"train_loss": -26.160520553588867, "global_step": 343781, "epoch": 4141} {"train_loss": -26.362354278564453, "global_step": 343782, "epoch": 4141} {"train_loss": -26.25382423400879, "global_step": 343783, "epoch": 4141} {"train_loss": -26.14112663269043, "global_step": 343784, "epoch": 4141} {"train_loss": -25.976960078779474, "global_step": 343785, "epoch": 4141, "val_loss": 6685241.0} {"train_loss": -25.463905334472656, "global_step": 343786, "epoch": 4142} {"train_loss": -25.15840721130371, "global_step": 343787, "epoch": 4142} {"train_loss": -25.868473052978516, "global_step": 343788, "epoch": 4142} {"train_loss": -26.0313777923584, "global_step": 343789, "epoch": 4142} {"train_loss": -25.502639770507812, "global_step": 343790, "epoch": 4142} {"train_loss": -25.24872398376465, "global_step": 343791, "epoch": 4142} {"train_loss": -25.7496337890625, "global_step": 343792, "epoch": 4142} {"train_loss": -25.556711196899414, "global_step": 343793, "epoch": 4142} {"train_loss": -25.701047897338867, "global_step": 343794, "epoch": 4142} {"train_loss": -25.72439956665039, "global_step": 343795, "epoch": 4142} {"train_loss": -25.928800582885742, "global_step": 343796, "epoch": 4142} {"train_loss": -25.565515518188477, "global_step": 343797, "epoch": 4142} {"train_loss": -25.537111282348633, "global_step": 343798, "epoch": 4142} {"train_loss": -26.128376007080078, "global_step": 343799, "epoch": 4142} {"train_loss": -25.477947235107422, "global_step": 343800, "epoch": 4142} {"train_loss": -25.85210609436035, "global_step": 343801, "epoch": 4142} {"train_loss": -25.565526962280273, "global_step": 343802, "epoch": 4142} {"train_loss": -25.751483917236328, "global_step": 343803, "epoch": 4142} {"train_loss": -25.772367477416992, "global_step": 343804, "epoch": 4142} {"train_loss": -25.825220108032227, "global_step": 343805, "epoch": 4142} {"train_loss": -25.906591415405273, "global_step": 343806, "epoch": 4142} {"train_loss": -25.967681884765625, "global_step": 343807, "epoch": 4142} {"train_loss": -25.61643409729004, "global_step": 343808, "epoch": 4142} {"train_loss": -25.82427406311035, "global_step": 343809, "epoch": 4142} {"train_loss": -25.885278701782227, "global_step": 343810, "epoch": 4142} {"train_loss": -25.806909561157227, "global_step": 343811, "epoch": 4142} {"train_loss": -25.638763427734375, "global_step": 343812, "epoch": 4142} {"train_loss": -26.245773315429688, "global_step": 343813, "epoch": 4142} {"train_loss": -25.891803741455078, "global_step": 343814, "epoch": 4142} {"train_loss": -25.923315048217773, "global_step": 343815, "epoch": 4142} {"train_loss": -26.076562881469727, "global_step": 343816, "epoch": 4142} {"train_loss": -25.7412166595459, "global_step": 343817, "epoch": 4142} {"train_loss": -25.867658615112305, "global_step": 343818, "epoch": 4142} {"train_loss": -26.393390655517578, "global_step": 343819, "epoch": 4142} {"train_loss": -26.095020294189453, "global_step": 343820, "epoch": 4142} {"train_loss": -26.325464248657227, "global_step": 343821, "epoch": 4142} {"train_loss": -26.38344383239746, "global_step": 343822, "epoch": 4142} {"train_loss": -26.45233154296875, "global_step": 343823, "epoch": 4142} {"train_loss": -26.302698135375977, "global_step": 343824, "epoch": 4142} {"train_loss": -26.166492462158203, "global_step": 343825, "epoch": 4142} {"train_loss": -26.264402389526367, "global_step": 343826, "epoch": 4142} {"train_loss": -26.078582763671875, "global_step": 343827, "epoch": 4142} {"train_loss": -26.090112686157227, "global_step": 343828, "epoch": 4142} {"train_loss": -26.1311092376709, "global_step": 343829, "epoch": 4142} {"train_loss": -26.00589370727539, "global_step": 343830, "epoch": 4142} {"train_loss": -26.394119262695312, "global_step": 343831, "epoch": 4142} {"train_loss": -25.97812843322754, "global_step": 343832, "epoch": 4142} {"train_loss": -26.1551570892334, "global_step": 343833, "epoch": 4142} {"train_loss": -26.283111572265625, "global_step": 343834, "epoch": 4142} {"train_loss": -26.294036865234375, "global_step": 343835, "epoch": 4142} {"train_loss": -26.257049560546875, "global_step": 343836, "epoch": 4142} {"train_loss": -26.175861358642578, "global_step": 343837, "epoch": 4142} {"train_loss": -26.314584732055664, "global_step": 343838, "epoch": 4142} {"train_loss": -26.095062255859375, "global_step": 343839, "epoch": 4142} {"train_loss": -25.982746124267578, "global_step": 343840, "epoch": 4142} {"train_loss": -25.784826278686523, "global_step": 343841, "epoch": 4142} {"train_loss": -25.629491806030273, "global_step": 343842, "epoch": 4142} {"train_loss": -25.754032135009766, "global_step": 343843, "epoch": 4142} {"train_loss": -26.499509811401367, "global_step": 343844, "epoch": 4142} {"train_loss": -26.0864200592041, "global_step": 343845, "epoch": 4142} {"train_loss": -26.067890167236328, "global_step": 343846, "epoch": 4142} {"train_loss": -25.8355712890625, "global_step": 343847, "epoch": 4142} {"train_loss": -26.06308364868164, "global_step": 343848, "epoch": 4142} {"train_loss": -25.674076080322266, "global_step": 343849, "epoch": 4142} {"train_loss": -26.203397750854492, "global_step": 343850, "epoch": 4142} {"train_loss": -26.241552352905273, "global_step": 343851, "epoch": 4142} {"train_loss": -26.603322982788086, "global_step": 343852, "epoch": 4142} {"train_loss": -26.3143310546875, "global_step": 343853, "epoch": 4142} {"train_loss": -26.332746505737305, "global_step": 343854, "epoch": 4142} {"train_loss": -26.491352081298828, "global_step": 343855, "epoch": 4142} {"train_loss": -26.391223907470703, "global_step": 343856, "epoch": 4142} {"train_loss": -26.452661514282227, "global_step": 343857, "epoch": 4142} {"train_loss": -26.02496337890625, "global_step": 343858, "epoch": 4142} {"train_loss": -26.133319854736328, "global_step": 343859, "epoch": 4142} {"train_loss": -26.03391456604004, "global_step": 343860, "epoch": 4142} {"train_loss": -26.4939022064209, "global_step": 343861, "epoch": 4142} {"train_loss": -26.374195098876953, "global_step": 343862, "epoch": 4142} {"train_loss": -26.0435848236084, "global_step": 343863, "epoch": 4142} {"train_loss": -26.107568740844727, "global_step": 343864, "epoch": 4142} {"train_loss": -26.59051513671875, "global_step": 343865, "epoch": 4142} {"train_loss": -26.296039581298828, "global_step": 343866, "epoch": 4142} {"train_loss": -26.096532821655273, "global_step": 343867, "epoch": 4142} {"train_loss": -26.004475306315594, "global_step": 343868, "epoch": 4142, "val_loss": 6618789.0} {"train_loss": -25.440101623535156, "global_step": 343869, "epoch": 4143} {"train_loss": -24.904743194580078, "global_step": 343870, "epoch": 4143} {"train_loss": -24.289047241210938, "global_step": 343871, "epoch": 4143} {"train_loss": -24.045469284057617, "global_step": 343872, "epoch": 4143} {"train_loss": -25.364225387573242, "global_step": 343873, "epoch": 4143} {"train_loss": -24.464778900146484, "global_step": 343874, "epoch": 4143} {"train_loss": -24.904621124267578, "global_step": 343875, "epoch": 4143} {"train_loss": -25.06028175354004, "global_step": 343876, "epoch": 4143} {"train_loss": -25.441364288330078, "global_step": 343877, "epoch": 4143} {"train_loss": -25.303632736206055, "global_step": 343878, "epoch": 4143} {"train_loss": -24.928924560546875, "global_step": 343879, "epoch": 4143} {"train_loss": -24.877641677856445, "global_step": 343880, "epoch": 4143} {"train_loss": -25.14832878112793, "global_step": 343881, "epoch": 4143} {"train_loss": -25.222410202026367, "global_step": 343882, "epoch": 4143} {"train_loss": -25.58770751953125, "global_step": 343883, "epoch": 4143} {"train_loss": -25.284343719482422, "global_step": 343884, "epoch": 4143} {"train_loss": -25.47401237487793, "global_step": 343885, "epoch": 4143} {"train_loss": -25.379165649414062, "global_step": 343886, "epoch": 4143} {"train_loss": -25.383365631103516, "global_step": 343887, "epoch": 4143} {"train_loss": -25.560413360595703, "global_step": 343888, "epoch": 4143} {"train_loss": -25.71284294128418, "global_step": 343889, "epoch": 4143} {"train_loss": -25.87509536743164, "global_step": 343890, "epoch": 4143} {"train_loss": -25.664031982421875, "global_step": 343891, "epoch": 4143} {"train_loss": -25.740741729736328, "global_step": 343892, "epoch": 4143} {"train_loss": -25.549314498901367, "global_step": 343893, "epoch": 4143} {"train_loss": -25.589693069458008, "global_step": 343894, "epoch": 4143} {"train_loss": -25.655029296875, "global_step": 343895, "epoch": 4143} {"train_loss": -25.97279167175293, "global_step": 343896, "epoch": 4143} {"train_loss": -26.153461456298828, "global_step": 343897, "epoch": 4143} {"train_loss": -25.663843154907227, "global_step": 343898, "epoch": 4143} {"train_loss": -25.720617294311523, "global_step": 343899, "epoch": 4143} {"train_loss": -26.3093204498291, "global_step": 343900, "epoch": 4143} {"train_loss": -26.13787269592285, "global_step": 343901, "epoch": 4143} {"train_loss": -25.9454402923584, "global_step": 343902, "epoch": 4143} {"train_loss": -26.142118453979492, "global_step": 343903, "epoch": 4143} {"train_loss": -26.027698516845703, "global_step": 343904, "epoch": 4143} {"train_loss": -25.486492156982422, "global_step": 343905, "epoch": 4143} {"train_loss": -25.971399307250977, "global_step": 343906, "epoch": 4143} {"train_loss": -26.104598999023438, "global_step": 343907, "epoch": 4143} {"train_loss": -26.00086784362793, "global_step": 343908, "epoch": 4143} {"train_loss": -26.044193267822266, "global_step": 343909, "epoch": 4143} {"train_loss": -25.8992862701416, "global_step": 343910, "epoch": 4143} {"train_loss": -26.388813018798828, "global_step": 343911, "epoch": 4143} {"train_loss": -25.995275497436523, "global_step": 343912, "epoch": 4143} {"train_loss": -26.070898056030273, "global_step": 343913, "epoch": 4143} {"train_loss": -26.121023178100586, "global_step": 343914, "epoch": 4143} {"train_loss": -26.029321670532227, "global_step": 343915, "epoch": 4143} {"train_loss": -25.97833824157715, "global_step": 343916, "epoch": 4143} {"train_loss": -25.700439453125, "global_step": 343917, "epoch": 4143} {"train_loss": -26.17889976501465, "global_step": 343918, "epoch": 4143} {"train_loss": -26.19352149963379, "global_step": 343919, "epoch": 4143} {"train_loss": -25.962005615234375, "global_step": 343920, "epoch": 4143} {"train_loss": -26.531354904174805, "global_step": 343921, "epoch": 4143} {"train_loss": -26.338428497314453, "global_step": 343922, "epoch": 4143} {"train_loss": -26.446853637695312, "global_step": 343923, "epoch": 4143} {"train_loss": -26.072824478149414, "global_step": 343924, "epoch": 4143} {"train_loss": -26.416412353515625, "global_step": 343925, "epoch": 4143} {"train_loss": -25.993478775024414, "global_step": 343926, "epoch": 4143} {"train_loss": -26.259801864624023, "global_step": 343927, "epoch": 4143} {"train_loss": -26.8321590423584, "global_step": 343928, "epoch": 4143} {"train_loss": -26.1662540435791, "global_step": 343929, "epoch": 4143} {"train_loss": -26.32958984375, "global_step": 343930, "epoch": 4143} {"train_loss": -26.104034423828125, "global_step": 343931, "epoch": 4143} {"train_loss": -26.110355377197266, "global_step": 343932, "epoch": 4143} {"train_loss": -26.4891414642334, "global_step": 343933, "epoch": 4143} {"train_loss": -26.36116600036621, "global_step": 343934, "epoch": 4143} {"train_loss": -26.320566177368164, "global_step": 343935, "epoch": 4143} {"train_loss": -26.24755859375, "global_step": 343936, "epoch": 4143} {"train_loss": -25.92428970336914, "global_step": 343937, "epoch": 4143} {"train_loss": -26.01852798461914, "global_step": 343938, "epoch": 4143} {"train_loss": -25.895984649658203, "global_step": 343939, "epoch": 4143} {"train_loss": -26.294172286987305, "global_step": 343940, "epoch": 4143} {"train_loss": -26.17347526550293, "global_step": 343941, "epoch": 4143} {"train_loss": -26.06671714782715, "global_step": 343942, "epoch": 4143} {"train_loss": -26.336881637573242, "global_step": 343943, "epoch": 4143} {"train_loss": -26.109838485717773, "global_step": 343944, "epoch": 4143} {"train_loss": -26.291492462158203, "global_step": 343945, "epoch": 4143} {"train_loss": -26.258691787719727, "global_step": 343946, "epoch": 4143} {"train_loss": -26.09120750427246, "global_step": 343947, "epoch": 4143} {"train_loss": -26.045312881469727, "global_step": 343948, "epoch": 4143} {"train_loss": -25.896320343017578, "global_step": 343949, "epoch": 4143} {"train_loss": -25.922744750976562, "global_step": 343950, "epoch": 4143} {"train_loss": -25.850000151668688, "global_step": 343951, "epoch": 4143, "val_loss": 6667983.0} {"train_loss": -24.460731506347656, "global_step": 343952, "epoch": 4144} {"train_loss": -24.76165771484375, "global_step": 343953, "epoch": 4144} {"train_loss": -25.33450698852539, "global_step": 343954, "epoch": 4144} {"train_loss": -25.723453521728516, "global_step": 343955, "epoch": 4144} {"train_loss": -25.989028930664062, "global_step": 343956, "epoch": 4144} {"train_loss": -25.5552921295166, "global_step": 343957, "epoch": 4144} {"train_loss": -25.79779624938965, "global_step": 343958, "epoch": 4144} {"train_loss": -26.022253036499023, "global_step": 343959, "epoch": 4144} {"train_loss": -25.81898307800293, "global_step": 343960, "epoch": 4144} {"train_loss": -25.680496215820312, "global_step": 343961, "epoch": 4144} {"train_loss": -25.68934440612793, "global_step": 343962, "epoch": 4144} {"train_loss": -25.8967342376709, "global_step": 343963, "epoch": 4144} {"train_loss": -25.744604110717773, "global_step": 343964, "epoch": 4144} {"train_loss": -26.01568031311035, "global_step": 343965, "epoch": 4144} {"train_loss": -26.111791610717773, "global_step": 343966, "epoch": 4144} {"train_loss": -25.917898178100586, "global_step": 343967, "epoch": 4144} {"train_loss": -25.661462783813477, "global_step": 343968, "epoch": 4144} {"train_loss": -25.40883445739746, "global_step": 343969, "epoch": 4144} {"train_loss": -26.443525314331055, "global_step": 343970, "epoch": 4144} {"train_loss": -25.89069175720215, "global_step": 343971, "epoch": 4144} {"train_loss": -26.322065353393555, "global_step": 343972, "epoch": 4144} {"train_loss": -25.800323486328125, "global_step": 343973, "epoch": 4144} {"train_loss": -26.108484268188477, "global_step": 343974, "epoch": 4144} {"train_loss": -26.13331413269043, "global_step": 343975, "epoch": 4144} {"train_loss": -25.898849487304688, "global_step": 343976, "epoch": 4144} {"train_loss": -26.146713256835938, "global_step": 343977, "epoch": 4144} {"train_loss": -25.956029891967773, "global_step": 343978, "epoch": 4144} {"train_loss": -26.05901527404785, "global_step": 343979, "epoch": 4144} {"train_loss": -26.01348876953125, "global_step": 343980, "epoch": 4144} {"train_loss": -26.248693466186523, "global_step": 343981, "epoch": 4144} {"train_loss": -26.227949142456055, "global_step": 343982, "epoch": 4144} {"train_loss": -26.025390625, "global_step": 343983, "epoch": 4144} {"train_loss": -26.073318481445312, "global_step": 343984, "epoch": 4144} {"train_loss": -25.914093017578125, "global_step": 343985, "epoch": 4144} {"train_loss": -26.253141403198242, "global_step": 343986, "epoch": 4144} {"train_loss": -25.802078247070312, "global_step": 343987, "epoch": 4144} {"train_loss": -26.0898494720459, "global_step": 343988, "epoch": 4144} {"train_loss": -25.9954891204834, "global_step": 343989, "epoch": 4144} {"train_loss": -26.240171432495117, "global_step": 343990, "epoch": 4144} {"train_loss": -25.732023239135742, "global_step": 343991, "epoch": 4144} {"train_loss": -25.84685707092285, "global_step": 343992, "epoch": 4144} {"train_loss": -26.20405387878418, "global_step": 343993, "epoch": 4144} {"train_loss": -26.466833114624023, "global_step": 343994, "epoch": 4144} {"train_loss": -26.00371742248535, "global_step": 343995, "epoch": 4144} {"train_loss": -25.830896377563477, "global_step": 343996, "epoch": 4144} {"train_loss": -26.22120475769043, "global_step": 343997, "epoch": 4144} {"train_loss": -26.411285400390625, "global_step": 343998, "epoch": 4144} {"train_loss": -26.238004684448242, "global_step": 343999, "epoch": 4144} {"train_loss": -26.468835830688477, "global_step": 344000, "epoch": 4144} {"train_loss": -26.18513298034668, "global_step": 344001, "epoch": 4144} {"train_loss": -26.2714786529541, "global_step": 344002, "epoch": 4144} {"train_loss": -26.326019287109375, "global_step": 344003, "epoch": 4144} {"train_loss": -26.005294799804688, "global_step": 344004, "epoch": 4144} {"train_loss": -26.392704010009766, "global_step": 344005, "epoch": 4144} {"train_loss": -26.431838989257812, "global_step": 344006, "epoch": 4144} {"train_loss": -25.7537899017334, "global_step": 344007, "epoch": 4144} {"train_loss": -25.894811630249023, "global_step": 344008, "epoch": 4144} {"train_loss": -25.667240142822266, "global_step": 344009, "epoch": 4144} {"train_loss": -26.386459350585938, "global_step": 344010, "epoch": 4144} {"train_loss": -25.88191795349121, "global_step": 344011, "epoch": 4144} {"train_loss": -26.179141998291016, "global_step": 344012, "epoch": 4144} {"train_loss": -26.030054092407227, "global_step": 344013, "epoch": 4144} {"train_loss": -26.021764755249023, "global_step": 344014, "epoch": 4144} {"train_loss": -25.987218856811523, "global_step": 344015, "epoch": 4144} {"train_loss": -26.3682918548584, "global_step": 344016, "epoch": 4144} {"train_loss": -25.979333877563477, "global_step": 344017, "epoch": 4144} {"train_loss": -25.802465438842773, "global_step": 344018, "epoch": 4144} {"train_loss": -25.7554931640625, "global_step": 344019, "epoch": 4144} {"train_loss": -26.15303611755371, "global_step": 344020, "epoch": 4144} {"train_loss": -26.425689697265625, "global_step": 344021, "epoch": 4144} {"train_loss": -25.92450523376465, "global_step": 344022, "epoch": 4144} {"train_loss": -26.127288818359375, "global_step": 344023, "epoch": 4144} {"train_loss": -25.962848663330078, "global_step": 344024, "epoch": 4144} {"train_loss": -26.2362117767334, "global_step": 344025, "epoch": 4144} {"train_loss": -26.108877182006836, "global_step": 344026, "epoch": 4144} {"train_loss": -25.80548667907715, "global_step": 344027, "epoch": 4144} {"train_loss": -25.869062423706055, "global_step": 344028, "epoch": 4144} {"train_loss": -26.30242347717285, "global_step": 344029, "epoch": 4144} {"train_loss": -26.07330322265625, "global_step": 344030, "epoch": 4144} {"train_loss": -25.662107467651367, "global_step": 344031, "epoch": 4144} {"train_loss": -26.39759635925293, "global_step": 344032, "epoch": 4144} {"train_loss": -26.338760375976562, "global_step": 344033, "epoch": 4144} {"train_loss": -26.01064916403897, "global_step": 344034, "epoch": 4144, "val_loss": 6612776.5} {"train_loss": -25.597427368164062, "global_step": 344035, "epoch": 4145} {"train_loss": -25.0870418548584, "global_step": 344036, "epoch": 4145} {"train_loss": -25.809284210205078, "global_step": 344037, "epoch": 4145} {"train_loss": -25.575658798217773, "global_step": 344038, "epoch": 4145} {"train_loss": -25.50556755065918, "global_step": 344039, "epoch": 4145} {"train_loss": -25.774328231811523, "global_step": 344040, "epoch": 4145} {"train_loss": -25.915735244750977, "global_step": 344041, "epoch": 4145} {"train_loss": -25.626941680908203, "global_step": 344042, "epoch": 4145} {"train_loss": -25.965635299682617, "global_step": 344043, "epoch": 4145} {"train_loss": -25.713422775268555, "global_step": 344044, "epoch": 4145} {"train_loss": -26.149595260620117, "global_step": 344045, "epoch": 4145} {"train_loss": -25.745420455932617, "global_step": 344046, "epoch": 4145} {"train_loss": -25.7410831451416, "global_step": 344047, "epoch": 4145} {"train_loss": -26.067432403564453, "global_step": 344048, "epoch": 4145} {"train_loss": -25.170848846435547, "global_step": 344049, "epoch": 4145} {"train_loss": -25.98444938659668, "global_step": 344050, "epoch": 4145} {"train_loss": -25.942962646484375, "global_step": 344051, "epoch": 4145} {"train_loss": -26.049041748046875, "global_step": 344052, "epoch": 4145} {"train_loss": -25.60700798034668, "global_step": 344053, "epoch": 4145} {"train_loss": -26.021203994750977, "global_step": 344054, "epoch": 4145} {"train_loss": -25.748281478881836, "global_step": 344055, "epoch": 4145} {"train_loss": -25.945968627929688, "global_step": 344056, "epoch": 4145} {"train_loss": -25.897083282470703, "global_step": 344057, "epoch": 4145} {"train_loss": -26.22918701171875, "global_step": 344058, "epoch": 4145} {"train_loss": -26.13764762878418, "global_step": 344059, "epoch": 4145} {"train_loss": -26.1076602935791, "global_step": 344060, "epoch": 4145} {"train_loss": -25.988544464111328, "global_step": 344061, "epoch": 4145} {"train_loss": -26.005218505859375, "global_step": 344062, "epoch": 4145} {"train_loss": -25.97920036315918, "global_step": 344063, "epoch": 4145} {"train_loss": -25.942426681518555, "global_step": 344064, "epoch": 4145} {"train_loss": -26.106271743774414, "global_step": 344065, "epoch": 4145} {"train_loss": -26.068958282470703, "global_step": 344066, "epoch": 4145} {"train_loss": -26.039844512939453, "global_step": 344067, "epoch": 4145} {"train_loss": -26.262710571289062, "global_step": 344068, "epoch": 4145} {"train_loss": -26.242904663085938, "global_step": 344069, "epoch": 4145} {"train_loss": -26.43488883972168, "global_step": 344070, "epoch": 4145} {"train_loss": -26.288537979125977, "global_step": 344071, "epoch": 4145} {"train_loss": -26.271509170532227, "global_step": 344072, "epoch": 4145} {"train_loss": -26.032018661499023, "global_step": 344073, "epoch": 4145} {"train_loss": -26.057538986206055, "global_step": 344074, "epoch": 4145} {"train_loss": -26.593381881713867, "global_step": 344075, "epoch": 4145} {"train_loss": -26.377735137939453, "global_step": 344076, "epoch": 4145} {"train_loss": -26.422521591186523, "global_step": 344077, "epoch": 4145} {"train_loss": -26.102720260620117, "global_step": 344078, "epoch": 4145} {"train_loss": -26.085880279541016, "global_step": 344079, "epoch": 4145} {"train_loss": -26.338293075561523, "global_step": 344080, "epoch": 4145} {"train_loss": -26.058502197265625, "global_step": 344081, "epoch": 4145} {"train_loss": -26.045080184936523, "global_step": 344082, "epoch": 4145} {"train_loss": -26.113550186157227, "global_step": 344083, "epoch": 4145} {"train_loss": -26.591028213500977, "global_step": 344084, "epoch": 4145} {"train_loss": -25.988828659057617, "global_step": 344085, "epoch": 4145} {"train_loss": -26.131505966186523, "global_step": 344086, "epoch": 4145} {"train_loss": -26.240209579467773, "global_step": 344087, "epoch": 4145} {"train_loss": -25.85565185546875, "global_step": 344088, "epoch": 4145} {"train_loss": -26.343124389648438, "global_step": 344089, "epoch": 4145} {"train_loss": -25.803775787353516, "global_step": 344090, "epoch": 4145} {"train_loss": -26.116174697875977, "global_step": 344091, "epoch": 4145} {"train_loss": -26.276508331298828, "global_step": 344092, "epoch": 4145} {"train_loss": -25.916494369506836, "global_step": 344093, "epoch": 4145} {"train_loss": -26.08009147644043, "global_step": 344094, "epoch": 4145} {"train_loss": -25.972705841064453, "global_step": 344095, "epoch": 4145} {"train_loss": -25.794641494750977, "global_step": 344096, "epoch": 4145} {"train_loss": -26.168188095092773, "global_step": 344097, "epoch": 4145} {"train_loss": -26.25628662109375, "global_step": 344098, "epoch": 4145} {"train_loss": -25.91423988342285, "global_step": 344099, "epoch": 4145} {"train_loss": -26.053070068359375, "global_step": 344100, "epoch": 4145} {"train_loss": -26.178632736206055, "global_step": 344101, "epoch": 4145} {"train_loss": -25.97438621520996, "global_step": 344102, "epoch": 4145} {"train_loss": -26.019916534423828, "global_step": 344103, "epoch": 4145} {"train_loss": -26.183759689331055, "global_step": 344104, "epoch": 4145} {"train_loss": -26.06744384765625, "global_step": 344105, "epoch": 4145} {"train_loss": -26.091724395751953, "global_step": 344106, "epoch": 4145} {"train_loss": -26.56024742126465, "global_step": 344107, "epoch": 4145} {"train_loss": -26.082895278930664, "global_step": 344108, "epoch": 4145} {"train_loss": -26.006433486938477, "global_step": 344109, "epoch": 4145} {"train_loss": -26.130334854125977, "global_step": 344110, "epoch": 4145} {"train_loss": -26.448461532592773, "global_step": 344111, "epoch": 4145} {"train_loss": -26.4175968170166, "global_step": 344112, "epoch": 4145} {"train_loss": -26.404510498046875, "global_step": 344113, "epoch": 4145} {"train_loss": -25.814533233642578, "global_step": 344114, "epoch": 4145} {"train_loss": -26.43366050720215, "global_step": 344115, "epoch": 4145} {"train_loss": -25.891571044921875, "global_step": 344116, "epoch": 4145} {"train_loss": -26.06319592946983, "global_step": 344117, "epoch": 4145, "val_loss": 6647702.5} {"train_loss": -25.609149932861328, "global_step": 344118, "epoch": 4146} {"train_loss": -25.8590087890625, "global_step": 344119, "epoch": 4146} {"train_loss": -25.609445571899414, "global_step": 344120, "epoch": 4146} {"train_loss": -25.779104232788086, "global_step": 344121, "epoch": 4146} {"train_loss": -25.211353302001953, "global_step": 344122, "epoch": 4146} {"train_loss": -26.00373649597168, "global_step": 344123, "epoch": 4146} {"train_loss": -25.509389877319336, "global_step": 344124, "epoch": 4146} {"train_loss": -25.771787643432617, "global_step": 344125, "epoch": 4146} {"train_loss": -26.160770416259766, "global_step": 344126, "epoch": 4146} {"train_loss": -25.605728149414062, "global_step": 344127, "epoch": 4146} {"train_loss": -25.708972930908203, "global_step": 344128, "epoch": 4146} {"train_loss": -26.264114379882812, "global_step": 344129, "epoch": 4146} {"train_loss": -25.4104061126709, "global_step": 344130, "epoch": 4146} {"train_loss": -25.404294967651367, "global_step": 344131, "epoch": 4146} {"train_loss": -25.260845184326172, "global_step": 344132, "epoch": 4146} {"train_loss": -26.076705932617188, "global_step": 344133, "epoch": 4146} {"train_loss": -25.48373794555664, "global_step": 344134, "epoch": 4146} {"train_loss": -25.739383697509766, "global_step": 344135, "epoch": 4146} {"train_loss": -26.097837448120117, "global_step": 344136, "epoch": 4146} {"train_loss": -25.907026290893555, "global_step": 344137, "epoch": 4146} {"train_loss": -26.231409072875977, "global_step": 344138, "epoch": 4146} {"train_loss": -26.24567222595215, "global_step": 344139, "epoch": 4146} {"train_loss": -25.947553634643555, "global_step": 344140, "epoch": 4146} {"train_loss": -26.357013702392578, "global_step": 344141, "epoch": 4146} {"train_loss": -26.127954483032227, "global_step": 344142, "epoch": 4146} {"train_loss": -26.120691299438477, "global_step": 344143, "epoch": 4146} {"train_loss": -25.99525260925293, "global_step": 344144, "epoch": 4146} {"train_loss": -26.0474853515625, "global_step": 344145, "epoch": 4146} {"train_loss": -25.679975509643555, "global_step": 344146, "epoch": 4146} {"train_loss": -25.98931884765625, "global_step": 344147, "epoch": 4146} {"train_loss": -26.134382247924805, "global_step": 344148, "epoch": 4146} {"train_loss": -26.091022491455078, "global_step": 344149, "epoch": 4146} {"train_loss": -26.3867130279541, "global_step": 344150, "epoch": 4146} {"train_loss": -26.100683212280273, "global_step": 344151, "epoch": 4146} {"train_loss": -26.235517501831055, "global_step": 344152, "epoch": 4146} {"train_loss": -25.99715232849121, "global_step": 344153, "epoch": 4146} {"train_loss": -26.50390625, "global_step": 344154, "epoch": 4146} {"train_loss": -26.330881118774414, "global_step": 344155, "epoch": 4146} {"train_loss": -26.55387306213379, "global_step": 344156, "epoch": 4146} {"train_loss": -26.082427978515625, "global_step": 344157, "epoch": 4146} {"train_loss": -26.260883331298828, "global_step": 344158, "epoch": 4146} {"train_loss": -26.1159610748291, "global_step": 344159, "epoch": 4146} {"train_loss": -26.513294219970703, "global_step": 344160, "epoch": 4146} {"train_loss": -26.588903427124023, "global_step": 344161, "epoch": 4146} {"train_loss": -26.13990592956543, "global_step": 344162, "epoch": 4146} {"train_loss": -26.56410789489746, "global_step": 344163, "epoch": 4146} {"train_loss": -26.460378646850586, "global_step": 344164, "epoch": 4146} {"train_loss": -25.87091636657715, "global_step": 344165, "epoch": 4146} {"train_loss": -26.418272018432617, "global_step": 344166, "epoch": 4146} {"train_loss": -26.151453018188477, "global_step": 344167, "epoch": 4146} {"train_loss": -26.23929786682129, "global_step": 344168, "epoch": 4146} {"train_loss": -26.637006759643555, "global_step": 344169, "epoch": 4146} {"train_loss": -26.69757080078125, "global_step": 344170, "epoch": 4146} {"train_loss": -25.8159122467041, "global_step": 344171, "epoch": 4146} {"train_loss": -25.357343673706055, "global_step": 344172, "epoch": 4146} {"train_loss": -25.859907150268555, "global_step": 344173, "epoch": 4146} {"train_loss": -25.9329891204834, "global_step": 344174, "epoch": 4146} {"train_loss": -25.843124389648438, "global_step": 344175, "epoch": 4146} {"train_loss": -24.378376007080078, "global_step": 344176, "epoch": 4146} {"train_loss": -23.556928634643555, "global_step": 344177, "epoch": 4146} {"train_loss": -23.561416625976562, "global_step": 344178, "epoch": 4146} {"train_loss": -25.0927677154541, "global_step": 344179, "epoch": 4146} {"train_loss": -24.967979431152344, "global_step": 344180, "epoch": 4146} {"train_loss": -24.60635757446289, "global_step": 344181, "epoch": 4146} {"train_loss": -25.07550811767578, "global_step": 344182, "epoch": 4146} {"train_loss": -24.553197860717773, "global_step": 344183, "epoch": 4146} {"train_loss": -24.566028594970703, "global_step": 344184, "epoch": 4146} {"train_loss": -25.196643829345703, "global_step": 344185, "epoch": 4146} {"train_loss": -25.04562759399414, "global_step": 344186, "epoch": 4146} {"train_loss": -25.083276748657227, "global_step": 344187, "epoch": 4146} {"train_loss": -25.36313819885254, "global_step": 344188, "epoch": 4146} {"train_loss": -25.21630859375, "global_step": 344189, "epoch": 4146} {"train_loss": -25.004859924316406, "global_step": 344190, "epoch": 4146} {"train_loss": -25.29384422302246, "global_step": 344191, "epoch": 4146} {"train_loss": -25.38481903076172, "global_step": 344192, "epoch": 4146} {"train_loss": -25.558298110961914, "global_step": 344193, "epoch": 4146} {"train_loss": -25.356189727783203, "global_step": 344194, "epoch": 4146} {"train_loss": -25.5120906829834, "global_step": 344195, "epoch": 4146} {"train_loss": -25.60919189453125, "global_step": 344196, "epoch": 4146} {"train_loss": -25.627592086791992, "global_step": 344197, "epoch": 4146} {"train_loss": -25.45716667175293, "global_step": 344198, "epoch": 4146} {"train_loss": -25.52851104736328, "global_step": 344199, "epoch": 4146} {"train_loss": -25.731529718422028, "global_step": 344200, "epoch": 4146, "val_loss": 6641978.0} {"train_loss": -25.471532821655273, "global_step": 344201, "epoch": 4147} {"train_loss": -25.481382369995117, "global_step": 344202, "epoch": 4147} {"train_loss": -25.344486236572266, "global_step": 344203, "epoch": 4147} {"train_loss": -25.381650924682617, "global_step": 344204, "epoch": 4147} {"train_loss": -25.277612686157227, "global_step": 344205, "epoch": 4147} {"train_loss": -25.501956939697266, "global_step": 344206, "epoch": 4147} {"train_loss": -25.624786376953125, "global_step": 344207, "epoch": 4147} {"train_loss": -25.447467803955078, "global_step": 344208, "epoch": 4147} {"train_loss": -25.436155319213867, "global_step": 344209, "epoch": 4147} {"train_loss": -25.651437759399414, "global_step": 344210, "epoch": 4147} {"train_loss": -25.78786277770996, "global_step": 344211, "epoch": 4147} {"train_loss": -25.57615089416504, "global_step": 344212, "epoch": 4147} {"train_loss": -25.626935958862305, "global_step": 344213, "epoch": 4147} {"train_loss": -25.92303466796875, "global_step": 344214, "epoch": 4147} {"train_loss": -25.688390731811523, "global_step": 344215, "epoch": 4147} {"train_loss": -26.0803165435791, "global_step": 344216, "epoch": 4147} {"train_loss": -25.614013671875, "global_step": 344217, "epoch": 4147} {"train_loss": -26.243234634399414, "global_step": 344218, "epoch": 4147} {"train_loss": -25.78733253479004, "global_step": 344219, "epoch": 4147} {"train_loss": -26.00587272644043, "global_step": 344220, "epoch": 4147} {"train_loss": -25.79656982421875, "global_step": 344221, "epoch": 4147} {"train_loss": -26.116901397705078, "global_step": 344222, "epoch": 4147} {"train_loss": -26.22173500061035, "global_step": 344223, "epoch": 4147} {"train_loss": -25.9571590423584, "global_step": 344224, "epoch": 4147} {"train_loss": -26.08447265625, "global_step": 344225, "epoch": 4147} {"train_loss": -26.402408599853516, "global_step": 344226, "epoch": 4147} {"train_loss": -26.319223403930664, "global_step": 344227, "epoch": 4147} {"train_loss": -26.340917587280273, "global_step": 344228, "epoch": 4147} {"train_loss": -26.309234619140625, "global_step": 344229, "epoch": 4147} {"train_loss": -25.967681884765625, "global_step": 344230, "epoch": 4147} {"train_loss": -26.389123916625977, "global_step": 344231, "epoch": 4147} {"train_loss": -26.080005645751953, "global_step": 344232, "epoch": 4147} {"train_loss": -26.216388702392578, "global_step": 344233, "epoch": 4147} {"train_loss": -26.24354362487793, "global_step": 344234, "epoch": 4147} {"train_loss": -26.005666732788086, "global_step": 344235, "epoch": 4147} {"train_loss": -26.166645050048828, "global_step": 344236, "epoch": 4147} {"train_loss": -26.3402099609375, "global_step": 344237, "epoch": 4147} {"train_loss": -26.370996475219727, "global_step": 344238, "epoch": 4147} {"train_loss": -26.427352905273438, "global_step": 344239, "epoch": 4147} {"train_loss": -26.393817901611328, "global_step": 344240, "epoch": 4147} {"train_loss": -26.268049240112305, "global_step": 344241, "epoch": 4147} {"train_loss": -26.211029052734375, "global_step": 344242, "epoch": 4147} {"train_loss": -26.240331649780273, "global_step": 344243, "epoch": 4147} {"train_loss": -26.280780792236328, "global_step": 344244, "epoch": 4147} {"train_loss": -26.31110191345215, "global_step": 344245, "epoch": 4147} {"train_loss": -26.36282730102539, "global_step": 344246, "epoch": 4147} {"train_loss": -26.240039825439453, "global_step": 344247, "epoch": 4147} {"train_loss": -26.542194366455078, "global_step": 344248, "epoch": 4147} {"train_loss": -26.137495040893555, "global_step": 344249, "epoch": 4147} {"train_loss": -26.427825927734375, "global_step": 344250, "epoch": 4147} {"train_loss": -25.781055450439453, "global_step": 344251, "epoch": 4147} {"train_loss": -26.17022705078125, "global_step": 344252, "epoch": 4147} {"train_loss": -25.942296981811523, "global_step": 344253, "epoch": 4147} {"train_loss": -26.526657104492188, "global_step": 344254, "epoch": 4147} {"train_loss": -25.98579978942871, "global_step": 344255, "epoch": 4147} {"train_loss": -26.36920166015625, "global_step": 344256, "epoch": 4147} {"train_loss": -26.066009521484375, "global_step": 344257, "epoch": 4147} {"train_loss": -25.910070419311523, "global_step": 344258, "epoch": 4147} {"train_loss": -25.93879508972168, "global_step": 344259, "epoch": 4147} {"train_loss": -26.01523208618164, "global_step": 344260, "epoch": 4147} {"train_loss": -26.557687759399414, "global_step": 344261, "epoch": 4147} {"train_loss": -25.620141983032227, "global_step": 344262, "epoch": 4147} {"train_loss": -25.572296142578125, "global_step": 344263, "epoch": 4147} {"train_loss": -26.22513771057129, "global_step": 344264, "epoch": 4147} {"train_loss": -25.839868545532227, "global_step": 344265, "epoch": 4147} {"train_loss": -25.944013595581055, "global_step": 344266, "epoch": 4147} {"train_loss": -25.780668258666992, "global_step": 344267, "epoch": 4147} {"train_loss": -25.96466064453125, "global_step": 344268, "epoch": 4147} {"train_loss": -26.233121871948242, "global_step": 344269, "epoch": 4147} {"train_loss": -26.5069580078125, "global_step": 344270, "epoch": 4147} {"train_loss": -26.093585968017578, "global_step": 344271, "epoch": 4147} {"train_loss": -26.02021598815918, "global_step": 344272, "epoch": 4147} {"train_loss": -25.919784545898438, "global_step": 344273, "epoch": 4147} {"train_loss": -26.128009796142578, "global_step": 344274, "epoch": 4147} {"train_loss": -26.5526065826416, "global_step": 344275, "epoch": 4147} {"train_loss": -25.68939781188965, "global_step": 344276, "epoch": 4147} {"train_loss": -26.526966094970703, "global_step": 344277, "epoch": 4147} {"train_loss": -25.806259155273438, "global_step": 344278, "epoch": 4147} {"train_loss": -25.895099639892578, "global_step": 344279, "epoch": 4147} {"train_loss": -25.93280029296875, "global_step": 344280, "epoch": 4147} {"train_loss": -26.157398223876953, "global_step": 344281, "epoch": 4147} {"train_loss": -26.126068115234375, "global_step": 344282, "epoch": 4147} {"train_loss": -26.027704951274824, "global_step": 344283, "epoch": 4147, "val_loss": 6648244.0} {"train_loss": -26.139453887939453, "global_step": 344284, "epoch": 4148} {"train_loss": -25.94950294494629, "global_step": 344285, "epoch": 4148} {"train_loss": -25.734619140625, "global_step": 344286, "epoch": 4148} {"train_loss": -26.20526123046875, "global_step": 344287, "epoch": 4148} {"train_loss": -25.876134872436523, "global_step": 344288, "epoch": 4148} {"train_loss": -25.69269371032715, "global_step": 344289, "epoch": 4148} {"train_loss": -26.188873291015625, "global_step": 344290, "epoch": 4148} {"train_loss": -26.019140243530273, "global_step": 344291, "epoch": 4148} {"train_loss": -26.190521240234375, "global_step": 344292, "epoch": 4148} {"train_loss": -26.13225746154785, "global_step": 344293, "epoch": 4148} {"train_loss": -26.362730026245117, "global_step": 344294, "epoch": 4148} {"train_loss": -26.364521026611328, "global_step": 344295, "epoch": 4148} {"train_loss": -26.218488693237305, "global_step": 344296, "epoch": 4148} {"train_loss": -25.86981201171875, "global_step": 344297, "epoch": 4148} {"train_loss": -26.117923736572266, "global_step": 344298, "epoch": 4148} {"train_loss": -25.964969635009766, "global_step": 344299, "epoch": 4148} {"train_loss": -26.439489364624023, "global_step": 344300, "epoch": 4148} {"train_loss": -26.5124454498291, "global_step": 344301, "epoch": 4148} {"train_loss": -25.804279327392578, "global_step": 344302, "epoch": 4148} {"train_loss": -26.073429107666016, "global_step": 344303, "epoch": 4148} {"train_loss": -26.027982711791992, "global_step": 344304, "epoch": 4148} {"train_loss": -25.895893096923828, "global_step": 344305, "epoch": 4148} {"train_loss": -26.23760986328125, "global_step": 344306, "epoch": 4148} {"train_loss": -26.145938873291016, "global_step": 344307, "epoch": 4148} {"train_loss": -25.988040924072266, "global_step": 344308, "epoch": 4148} {"train_loss": -25.7991886138916, "global_step": 344309, "epoch": 4148} {"train_loss": -25.927520751953125, "global_step": 344310, "epoch": 4148} {"train_loss": -25.727201461791992, "global_step": 344311, "epoch": 4148} {"train_loss": -26.00064468383789, "global_step": 344312, "epoch": 4148} {"train_loss": -25.825300216674805, "global_step": 344313, "epoch": 4148} {"train_loss": -25.66511344909668, "global_step": 344314, "epoch": 4148} {"train_loss": -25.920080184936523, "global_step": 344315, "epoch": 4148} {"train_loss": -25.687475204467773, "global_step": 344316, "epoch": 4148} {"train_loss": -26.07391929626465, "global_step": 344317, "epoch": 4148} {"train_loss": -25.907108306884766, "global_step": 344318, "epoch": 4148} {"train_loss": -26.51255226135254, "global_step": 344319, "epoch": 4148} {"train_loss": -26.29713249206543, "global_step": 344320, "epoch": 4148} {"train_loss": -26.130451202392578, "global_step": 344321, "epoch": 4148} {"train_loss": -25.856735229492188, "global_step": 344322, "epoch": 4148} {"train_loss": -26.4365177154541, "global_step": 344323, "epoch": 4148} {"train_loss": -26.28812599182129, "global_step": 344324, "epoch": 4148} {"train_loss": -26.177875518798828, "global_step": 344325, "epoch": 4148} {"train_loss": -26.051010131835938, "global_step": 344326, "epoch": 4148} {"train_loss": -26.023962020874023, "global_step": 344327, "epoch": 4148} {"train_loss": -25.96674919128418, "global_step": 344328, "epoch": 4148} {"train_loss": -25.995819091796875, "global_step": 344329, "epoch": 4148} {"train_loss": -26.22613525390625, "global_step": 344330, "epoch": 4148} {"train_loss": -25.8085880279541, "global_step": 344331, "epoch": 4148} {"train_loss": -26.311710357666016, "global_step": 344332, "epoch": 4148} {"train_loss": -26.133838653564453, "global_step": 344333, "epoch": 4148} {"train_loss": -26.297290802001953, "global_step": 344334, "epoch": 4148} {"train_loss": -26.504444122314453, "global_step": 344335, "epoch": 4148} {"train_loss": -25.9742431640625, "global_step": 344336, "epoch": 4148} {"train_loss": -26.080184936523438, "global_step": 344337, "epoch": 4148} {"train_loss": -25.911588668823242, "global_step": 344338, "epoch": 4148} {"train_loss": -26.11823844909668, "global_step": 344339, "epoch": 4148} {"train_loss": -26.466962814331055, "global_step": 344340, "epoch": 4148} {"train_loss": -26.189565658569336, "global_step": 344341, "epoch": 4148} {"train_loss": -26.49237060546875, "global_step": 344342, "epoch": 4148} {"train_loss": -26.038488388061523, "global_step": 344343, "epoch": 4148} {"train_loss": -26.055496215820312, "global_step": 344344, "epoch": 4148} {"train_loss": -25.80921745300293, "global_step": 344345, "epoch": 4148} {"train_loss": -26.48805046081543, "global_step": 344346, "epoch": 4148} {"train_loss": -26.38300132751465, "global_step": 344347, "epoch": 4148} {"train_loss": -25.916797637939453, "global_step": 344348, "epoch": 4148} {"train_loss": -25.773584365844727, "global_step": 344349, "epoch": 4148} {"train_loss": -26.043277740478516, "global_step": 344350, "epoch": 4148} {"train_loss": -26.178943634033203, "global_step": 344351, "epoch": 4148} {"train_loss": -26.08198356628418, "global_step": 344352, "epoch": 4148} {"train_loss": -26.038421630859375, "global_step": 344353, "epoch": 4148} {"train_loss": -26.08180046081543, "global_step": 344354, "epoch": 4148} {"train_loss": -26.23578453063965, "global_step": 344355, "epoch": 4148} {"train_loss": -26.24928092956543, "global_step": 344356, "epoch": 4148} {"train_loss": -26.336551666259766, "global_step": 344357, "epoch": 4148} {"train_loss": -26.46002197265625, "global_step": 344358, "epoch": 4148} {"train_loss": -26.246601104736328, "global_step": 344359, "epoch": 4148} {"train_loss": -26.285551071166992, "global_step": 344360, "epoch": 4148} {"train_loss": -26.316923141479492, "global_step": 344361, "epoch": 4148} {"train_loss": -26.264026641845703, "global_step": 344362, "epoch": 4148} {"train_loss": -26.1986141204834, "global_step": 344363, "epoch": 4148} {"train_loss": -26.585407257080078, "global_step": 344364, "epoch": 4148} {"train_loss": -25.96310806274414, "global_step": 344365, "epoch": 4148} {"train_loss": -26.122769688985432, "global_step": 344366, "epoch": 4148, "val_loss": 6642918.0} {"train_loss": -25.994455337524414, "global_step": 344367, "epoch": 4149} {"train_loss": -25.283090591430664, "global_step": 344368, "epoch": 4149} {"train_loss": -25.385427474975586, "global_step": 344369, "epoch": 4149} {"train_loss": -24.73076820373535, "global_step": 344370, "epoch": 4149} {"train_loss": -25.407438278198242, "global_step": 344371, "epoch": 4149} {"train_loss": -25.316999435424805, "global_step": 344372, "epoch": 4149} {"train_loss": -25.991973876953125, "global_step": 344373, "epoch": 4149} {"train_loss": -25.490270614624023, "global_step": 344374, "epoch": 4149} {"train_loss": -25.626422882080078, "global_step": 344375, "epoch": 4149} {"train_loss": -25.765233993530273, "global_step": 344376, "epoch": 4149} {"train_loss": -25.532136917114258, "global_step": 344377, "epoch": 4149} {"train_loss": -25.21819496154785, "global_step": 344378, "epoch": 4149} {"train_loss": -25.952829360961914, "global_step": 344379, "epoch": 4149} {"train_loss": -25.635839462280273, "global_step": 344380, "epoch": 4149} {"train_loss": -25.887937545776367, "global_step": 344381, "epoch": 4149} {"train_loss": -25.518470764160156, "global_step": 344382, "epoch": 4149} {"train_loss": -25.683881759643555, "global_step": 344383, "epoch": 4149} {"train_loss": -25.595985412597656, "global_step": 344384, "epoch": 4149} {"train_loss": -25.799331665039062, "global_step": 344385, "epoch": 4149} {"train_loss": -26.351728439331055, "global_step": 344386, "epoch": 4149} {"train_loss": -26.10499382019043, "global_step": 344387, "epoch": 4149} {"train_loss": -26.052570343017578, "global_step": 344388, "epoch": 4149} {"train_loss": -26.197158813476562, "global_step": 344389, "epoch": 4149} {"train_loss": -26.18927001953125, "global_step": 344390, "epoch": 4149} {"train_loss": -25.994070053100586, "global_step": 344391, "epoch": 4149} {"train_loss": -26.10701560974121, "global_step": 344392, "epoch": 4149} {"train_loss": -26.07001304626465, "global_step": 344393, "epoch": 4149} {"train_loss": -26.300983428955078, "global_step": 344394, "epoch": 4149} {"train_loss": -25.930011749267578, "global_step": 344395, "epoch": 4149} {"train_loss": -26.065149307250977, "global_step": 344396, "epoch": 4149} {"train_loss": -26.04986000061035, "global_step": 344397, "epoch": 4149} {"train_loss": -26.17681312561035, "global_step": 344398, "epoch": 4149} {"train_loss": -25.509170532226562, "global_step": 344399, "epoch": 4149} {"train_loss": -26.243635177612305, "global_step": 344400, "epoch": 4149} {"train_loss": -26.182905197143555, "global_step": 344401, "epoch": 4149} {"train_loss": -25.877212524414062, "global_step": 344402, "epoch": 4149} {"train_loss": -26.265592575073242, "global_step": 344403, "epoch": 4149} {"train_loss": -25.96646499633789, "global_step": 344404, "epoch": 4149} {"train_loss": -26.398427963256836, "global_step": 344405, "epoch": 4149} {"train_loss": -26.0391845703125, "global_step": 344406, "epoch": 4149} {"train_loss": -26.409326553344727, "global_step": 344407, "epoch": 4149} {"train_loss": -25.891950607299805, "global_step": 344408, "epoch": 4149} {"train_loss": -25.894474029541016, "global_step": 344409, "epoch": 4149} {"train_loss": -26.20623779296875, "global_step": 344410, "epoch": 4149} {"train_loss": -26.052692413330078, "global_step": 344411, "epoch": 4149} {"train_loss": -25.961530685424805, "global_step": 344412, "epoch": 4149} {"train_loss": -25.895416259765625, "global_step": 344413, "epoch": 4149} {"train_loss": -26.0562801361084, "global_step": 344414, "epoch": 4149} {"train_loss": -26.720382690429688, "global_step": 344415, "epoch": 4149} {"train_loss": -26.271692276000977, "global_step": 344416, "epoch": 4149} {"train_loss": -26.47333335876465, "global_step": 344417, "epoch": 4149} {"train_loss": -26.149560928344727, "global_step": 344418, "epoch": 4149} {"train_loss": -26.008108139038086, "global_step": 344419, "epoch": 4149} {"train_loss": -26.1386661529541, "global_step": 344420, "epoch": 4149} {"train_loss": -25.55959129333496, "global_step": 344421, "epoch": 4149} {"train_loss": -25.765161514282227, "global_step": 344422, "epoch": 4149} {"train_loss": -25.72726821899414, "global_step": 344423, "epoch": 4149} {"train_loss": -25.664148330688477, "global_step": 344424, "epoch": 4149} {"train_loss": -26.245473861694336, "global_step": 344425, "epoch": 4149} {"train_loss": -25.79001808166504, "global_step": 344426, "epoch": 4149} {"train_loss": -25.64388084411621, "global_step": 344427, "epoch": 4149} {"train_loss": -26.065418243408203, "global_step": 344428, "epoch": 4149} {"train_loss": -26.124235153198242, "global_step": 344429, "epoch": 4149} {"train_loss": -26.05531120300293, "global_step": 344430, "epoch": 4149} {"train_loss": -25.762388229370117, "global_step": 344431, "epoch": 4149} {"train_loss": -26.531034469604492, "global_step": 344432, "epoch": 4149} {"train_loss": -25.659473419189453, "global_step": 344433, "epoch": 4149} {"train_loss": -26.121856689453125, "global_step": 344434, "epoch": 4149} {"train_loss": -25.779340744018555, "global_step": 344435, "epoch": 4149} {"train_loss": -25.696182250976562, "global_step": 344436, "epoch": 4149} {"train_loss": -25.989852905273438, "global_step": 344437, "epoch": 4149} {"train_loss": -25.982975006103516, "global_step": 344438, "epoch": 4149} {"train_loss": -25.84564781188965, "global_step": 344439, "epoch": 4149} {"train_loss": -26.046152114868164, "global_step": 344440, "epoch": 4149} {"train_loss": -26.08121681213379, "global_step": 344441, "epoch": 4149} {"train_loss": -26.14115333557129, "global_step": 344442, "epoch": 4149} {"train_loss": -25.668079376220703, "global_step": 344443, "epoch": 4149} {"train_loss": -26.073379516601562, "global_step": 344444, "epoch": 4149} {"train_loss": -26.041025161743164, "global_step": 344445, "epoch": 4149} {"train_loss": -26.460073471069336, "global_step": 344446, "epoch": 4149} {"train_loss": -26.1046142578125, "global_step": 344447, "epoch": 4149} {"train_loss": -26.16556167602539, "global_step": 344448, "epoch": 4149} {"train_loss": -25.941809504865162, "global_step": 344449, "epoch": 4149, "val_loss": 6669064.5} {"train_loss": -25.545902252197266, "global_step": 344450, "epoch": 4150} {"train_loss": -25.78643226623535, "global_step": 344451, "epoch": 4150} {"train_loss": -26.157346725463867, "global_step": 344452, "epoch": 4150} {"train_loss": -25.24155616760254, "global_step": 344453, "epoch": 4150} {"train_loss": -25.746479034423828, "global_step": 344454, "epoch": 4150} {"train_loss": -25.912107467651367, "global_step": 344455, "epoch": 4150} {"train_loss": -25.801483154296875, "global_step": 344456, "epoch": 4150} {"train_loss": -25.522558212280273, "global_step": 344457, "epoch": 4150} {"train_loss": -25.572675704956055, "global_step": 344458, "epoch": 4150} {"train_loss": -25.666778564453125, "global_step": 344459, "epoch": 4150} {"train_loss": -26.10249137878418, "global_step": 344460, "epoch": 4150} {"train_loss": -25.672727584838867, "global_step": 344461, "epoch": 4150} {"train_loss": -25.569093704223633, "global_step": 344462, "epoch": 4150} {"train_loss": -26.115346908569336, "global_step": 344463, "epoch": 4150} {"train_loss": -25.6538028717041, "global_step": 344464, "epoch": 4150} {"train_loss": -25.97779655456543, "global_step": 344465, "epoch": 4150} {"train_loss": -26.059558868408203, "global_step": 344466, "epoch": 4150} {"train_loss": -25.767780303955078, "global_step": 344467, "epoch": 4150} {"train_loss": -25.680246353149414, "global_step": 344468, "epoch": 4150} {"train_loss": -26.270172119140625, "global_step": 344469, "epoch": 4150} {"train_loss": -25.912567138671875, "global_step": 344470, "epoch": 4150} {"train_loss": -26.157562255859375, "global_step": 344471, "epoch": 4150} {"train_loss": -26.002002716064453, "global_step": 344472, "epoch": 4150} {"train_loss": -26.28948402404785, "global_step": 344473, "epoch": 4150} {"train_loss": -25.971044540405273, "global_step": 344474, "epoch": 4150} {"train_loss": -25.86354637145996, "global_step": 344475, "epoch": 4150} {"train_loss": -25.9406681060791, "global_step": 344476, "epoch": 4150} {"train_loss": -26.084318161010742, "global_step": 344477, "epoch": 4150} {"train_loss": -26.341766357421875, "global_step": 344478, "epoch": 4150} {"train_loss": -26.112634658813477, "global_step": 344479, "epoch": 4150} {"train_loss": -25.438114166259766, "global_step": 344480, "epoch": 4150} {"train_loss": -26.46339988708496, "global_step": 344481, "epoch": 4150} {"train_loss": -26.116363525390625, "global_step": 344482, "epoch": 4150} {"train_loss": -25.9429988861084, "global_step": 344483, "epoch": 4150} {"train_loss": -26.208520889282227, "global_step": 344484, "epoch": 4150} {"train_loss": -26.12668800354004, "global_step": 344485, "epoch": 4150} {"train_loss": -26.50969886779785, "global_step": 344486, "epoch": 4150} {"train_loss": -26.163557052612305, "global_step": 344487, "epoch": 4150} {"train_loss": -26.288116455078125, "global_step": 344488, "epoch": 4150} {"train_loss": -26.380170822143555, "global_step": 344489, "epoch": 4150} {"train_loss": -26.215681076049805, "global_step": 344490, "epoch": 4150} {"train_loss": -25.829370498657227, "global_step": 344491, "epoch": 4150} {"train_loss": -26.352874755859375, "global_step": 344492, "epoch": 4150} {"train_loss": -26.07095718383789, "global_step": 344493, "epoch": 4150} {"train_loss": -26.20794105529785, "global_step": 344494, "epoch": 4150} {"train_loss": -26.279821395874023, "global_step": 344495, "epoch": 4150} {"train_loss": -26.37347412109375, "global_step": 344496, "epoch": 4150} {"train_loss": -26.4992733001709, "global_step": 344497, "epoch": 4150} {"train_loss": -26.28586769104004, "global_step": 344498, "epoch": 4150} {"train_loss": -26.210865020751953, "global_step": 344499, "epoch": 4150} {"train_loss": -26.143239974975586, "global_step": 344500, "epoch": 4150} {"train_loss": -26.33550453186035, "global_step": 344501, "epoch": 4150} {"train_loss": -26.282150268554688, "global_step": 344502, "epoch": 4150} {"train_loss": -25.975805282592773, "global_step": 344503, "epoch": 4150} {"train_loss": -25.898283004760742, "global_step": 344504, "epoch": 4150} {"train_loss": -26.285598754882812, "global_step": 344505, "epoch": 4150} {"train_loss": -25.7487735748291, "global_step": 344506, "epoch": 4150} {"train_loss": -25.983112335205078, "global_step": 344507, "epoch": 4150} {"train_loss": -25.65584373474121, "global_step": 344508, "epoch": 4150} {"train_loss": -25.736316680908203, "global_step": 344509, "epoch": 4150} {"train_loss": -26.215499877929688, "global_step": 344510, "epoch": 4150} {"train_loss": -26.086811065673828, "global_step": 344511, "epoch": 4150} {"train_loss": -25.98267936706543, "global_step": 344512, "epoch": 4150} {"train_loss": -26.045459747314453, "global_step": 344513, "epoch": 4150} {"train_loss": -26.25970458984375, "global_step": 344514, "epoch": 4150} {"train_loss": -26.016921997070312, "global_step": 344515, "epoch": 4150} {"train_loss": -25.87105369567871, "global_step": 344516, "epoch": 4150} {"train_loss": -26.137969970703125, "global_step": 344517, "epoch": 4150} {"train_loss": -25.99131202697754, "global_step": 344518, "epoch": 4150} {"train_loss": -25.976211547851562, "global_step": 344519, "epoch": 4150} {"train_loss": -26.258703231811523, "global_step": 344520, "epoch": 4150} {"train_loss": -25.87994384765625, "global_step": 344521, "epoch": 4150} {"train_loss": -25.876325607299805, "global_step": 344522, "epoch": 4150} {"train_loss": -25.974218368530273, "global_step": 344523, "epoch": 4150} {"train_loss": -26.267414093017578, "global_step": 344524, "epoch": 4150} {"train_loss": -26.52918815612793, "global_step": 344525, "epoch": 4150} {"train_loss": -26.40924072265625, "global_step": 344526, "epoch": 4150} {"train_loss": -26.09852409362793, "global_step": 344527, "epoch": 4150} {"train_loss": -25.697107315063477, "global_step": 344528, "epoch": 4150} {"train_loss": -25.9752140045166, "global_step": 344529, "epoch": 4150} {"train_loss": -26.662012100219727, "global_step": 344530, "epoch": 4150} {"train_loss": -26.330053329467773, "global_step": 344531, "epoch": 4150} {"train_loss": -26.02110853539892, "global_step": 344532, "epoch": 4150, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6632287.0} {"train_loss": -25.764230728149414, "global_step": 344533, "epoch": 4151} {"train_loss": -25.34691619873047, "global_step": 344534, "epoch": 4151} {"train_loss": -25.60003089904785, "global_step": 344535, "epoch": 4151} {"train_loss": -25.4913387298584, "global_step": 344536, "epoch": 4151} {"train_loss": -26.043195724487305, "global_step": 344537, "epoch": 4151} {"train_loss": -25.712244033813477, "global_step": 344538, "epoch": 4151} {"train_loss": -25.253618240356445, "global_step": 344539, "epoch": 4151} {"train_loss": -25.773420333862305, "global_step": 344540, "epoch": 4151} {"train_loss": -25.97896385192871, "global_step": 344541, "epoch": 4151} {"train_loss": -25.444862365722656, "global_step": 344542, "epoch": 4151} {"train_loss": -26.16582679748535, "global_step": 344543, "epoch": 4151} {"train_loss": -25.95668601989746, "global_step": 344544, "epoch": 4151} {"train_loss": -26.33991813659668, "global_step": 344545, "epoch": 4151} {"train_loss": -25.9815673828125, "global_step": 344546, "epoch": 4151} {"train_loss": -26.005329132080078, "global_step": 344547, "epoch": 4151} {"train_loss": -26.19708251953125, "global_step": 344548, "epoch": 4151} {"train_loss": -26.0402774810791, "global_step": 344549, "epoch": 4151} {"train_loss": -26.054960250854492, "global_step": 344550, "epoch": 4151} {"train_loss": -26.223377227783203, "global_step": 344551, "epoch": 4151} {"train_loss": -26.368396759033203, "global_step": 344552, "epoch": 4151} {"train_loss": -26.03388786315918, "global_step": 344553, "epoch": 4151} {"train_loss": -26.2862491607666, "global_step": 344554, "epoch": 4151} {"train_loss": -26.301111221313477, "global_step": 344555, "epoch": 4151} {"train_loss": -26.21685791015625, "global_step": 344556, "epoch": 4151} {"train_loss": -26.209909439086914, "global_step": 344557, "epoch": 4151} {"train_loss": -26.055402755737305, "global_step": 344558, "epoch": 4151} {"train_loss": -26.265121459960938, "global_step": 344559, "epoch": 4151} {"train_loss": -26.335071563720703, "global_step": 344560, "epoch": 4151} {"train_loss": -25.834156036376953, "global_step": 344561, "epoch": 4151} {"train_loss": -25.836069107055664, "global_step": 344562, "epoch": 4151} {"train_loss": -25.8494873046875, "global_step": 344563, "epoch": 4151} {"train_loss": -26.207752227783203, "global_step": 344564, "epoch": 4151} {"train_loss": -26.216373443603516, "global_step": 344565, "epoch": 4151} {"train_loss": -26.035375595092773, "global_step": 344566, "epoch": 4151} {"train_loss": -26.158039093017578, "global_step": 344567, "epoch": 4151} {"train_loss": -26.06694984436035, "global_step": 344568, "epoch": 4151} {"train_loss": -26.09760856628418, "global_step": 344569, "epoch": 4151} {"train_loss": -26.248779296875, "global_step": 344570, "epoch": 4151} {"train_loss": -26.130346298217773, "global_step": 344571, "epoch": 4151} {"train_loss": -26.42764663696289, "global_step": 344572, "epoch": 4151} {"train_loss": -26.298608779907227, "global_step": 344573, "epoch": 4151} {"train_loss": -26.268512725830078, "global_step": 344574, "epoch": 4151} {"train_loss": -26.358137130737305, "global_step": 344575, "epoch": 4151} {"train_loss": -25.70682716369629, "global_step": 344576, "epoch": 4151} {"train_loss": -26.13862419128418, "global_step": 344577, "epoch": 4151} {"train_loss": -26.606348037719727, "global_step": 344578, "epoch": 4151} {"train_loss": -25.9895076751709, "global_step": 344579, "epoch": 4151} {"train_loss": -26.017972946166992, "global_step": 344580, "epoch": 4151} {"train_loss": -26.315692901611328, "global_step": 344581, "epoch": 4151} {"train_loss": -25.701175689697266, "global_step": 344582, "epoch": 4151} {"train_loss": -26.034170150756836, "global_step": 344583, "epoch": 4151} {"train_loss": -25.90144920349121, "global_step": 344584, "epoch": 4151} {"train_loss": -26.011566162109375, "global_step": 344585, "epoch": 4151} {"train_loss": -26.316944122314453, "global_step": 344586, "epoch": 4151} {"train_loss": -25.763751983642578, "global_step": 344587, "epoch": 4151} {"train_loss": -26.026782989501953, "global_step": 344588, "epoch": 4151} {"train_loss": -26.104883193969727, "global_step": 344589, "epoch": 4151} {"train_loss": -25.5145206451416, "global_step": 344590, "epoch": 4151} {"train_loss": -25.448171615600586, "global_step": 344591, "epoch": 4151} {"train_loss": -25.55174446105957, "global_step": 344592, "epoch": 4151} {"train_loss": -25.834924697875977, "global_step": 344593, "epoch": 4151} {"train_loss": -25.682601928710938, "global_step": 344594, "epoch": 4151} {"train_loss": -25.849853515625, "global_step": 344595, "epoch": 4151} {"train_loss": -25.860708236694336, "global_step": 344596, "epoch": 4151} {"train_loss": -25.75489616394043, "global_step": 344597, "epoch": 4151} {"train_loss": -25.652536392211914, "global_step": 344598, "epoch": 4151} {"train_loss": -25.508787155151367, "global_step": 344599, "epoch": 4151} {"train_loss": -25.73884391784668, "global_step": 344600, "epoch": 4151} {"train_loss": -26.21990394592285, "global_step": 344601, "epoch": 4151} {"train_loss": -26.069503784179688, "global_step": 344602, "epoch": 4151} {"train_loss": -26.201038360595703, "global_step": 344603, "epoch": 4151} {"train_loss": -25.820178985595703, "global_step": 344604, "epoch": 4151} {"train_loss": -26.056507110595703, "global_step": 344605, "epoch": 4151} {"train_loss": -26.00559425354004, "global_step": 344606, "epoch": 4151} {"train_loss": -25.8229923248291, "global_step": 344607, "epoch": 4151} {"train_loss": -25.530099868774414, "global_step": 344608, "epoch": 4151} {"train_loss": -26.231250762939453, "global_step": 344609, "epoch": 4151} {"train_loss": -25.758085250854492, "global_step": 344610, "epoch": 4151} {"train_loss": -26.29558753967285, "global_step": 344611, "epoch": 4151} {"train_loss": -25.973539352416992, "global_step": 344612, "epoch": 4151} {"train_loss": -26.247283935546875, "global_step": 344613, "epoch": 4151} {"train_loss": -25.91510581970215, "global_step": 344614, "epoch": 4151} {"train_loss": -25.980799732438054, "global_step": 344615, "epoch": 4151, "val_loss": 6703759.0} {"train_loss": -26.085845947265625, "global_step": 344616, "epoch": 4152} {"train_loss": -25.386442184448242, "global_step": 344617, "epoch": 4152} {"train_loss": -25.716794967651367, "global_step": 344618, "epoch": 4152} {"train_loss": -25.630298614501953, "global_step": 344619, "epoch": 4152} {"train_loss": -25.674097061157227, "global_step": 344620, "epoch": 4152} {"train_loss": -25.826684951782227, "global_step": 344621, "epoch": 4152} {"train_loss": -25.633209228515625, "global_step": 344622, "epoch": 4152} {"train_loss": -25.7398738861084, "global_step": 344623, "epoch": 4152} {"train_loss": -25.839452743530273, "global_step": 344624, "epoch": 4152} {"train_loss": -25.80084228515625, "global_step": 344625, "epoch": 4152} {"train_loss": -25.96030044555664, "global_step": 344626, "epoch": 4152} {"train_loss": -26.166828155517578, "global_step": 344627, "epoch": 4152} {"train_loss": -25.84130859375, "global_step": 344628, "epoch": 4152} {"train_loss": -25.47835350036621, "global_step": 344629, "epoch": 4152} {"train_loss": -25.659215927124023, "global_step": 344630, "epoch": 4152} {"train_loss": -25.523208618164062, "global_step": 344631, "epoch": 4152} {"train_loss": -25.862186431884766, "global_step": 344632, "epoch": 4152} {"train_loss": -26.245513916015625, "global_step": 344633, "epoch": 4152} {"train_loss": -25.942646026611328, "global_step": 344634, "epoch": 4152} {"train_loss": -25.617971420288086, "global_step": 344635, "epoch": 4152} {"train_loss": -26.17860984802246, "global_step": 344636, "epoch": 4152} {"train_loss": -26.258609771728516, "global_step": 344637, "epoch": 4152} {"train_loss": -26.27667236328125, "global_step": 344638, "epoch": 4152} {"train_loss": -26.452062606811523, "global_step": 344639, "epoch": 4152} {"train_loss": -26.109821319580078, "global_step": 344640, "epoch": 4152} {"train_loss": -26.05999755859375, "global_step": 344641, "epoch": 4152} {"train_loss": -26.253225326538086, "global_step": 344642, "epoch": 4152} {"train_loss": -25.7122859954834, "global_step": 344643, "epoch": 4152} {"train_loss": -26.046432495117188, "global_step": 344644, "epoch": 4152} {"train_loss": -25.834630966186523, "global_step": 344645, "epoch": 4152} {"train_loss": -26.107309341430664, "global_step": 344646, "epoch": 4152} {"train_loss": -26.19166374206543, "global_step": 344647, "epoch": 4152} {"train_loss": -26.43461036682129, "global_step": 344648, "epoch": 4152} {"train_loss": -26.2885799407959, "global_step": 344649, "epoch": 4152} {"train_loss": -26.207548141479492, "global_step": 344650, "epoch": 4152} {"train_loss": -25.77284812927246, "global_step": 344651, "epoch": 4152} {"train_loss": -25.990020751953125, "global_step": 344652, "epoch": 4152} {"train_loss": -26.321369171142578, "global_step": 344653, "epoch": 4152} {"train_loss": -25.897130966186523, "global_step": 344654, "epoch": 4152} {"train_loss": -26.295734405517578, "global_step": 344655, "epoch": 4152} {"train_loss": -26.183568954467773, "global_step": 344656, "epoch": 4152} {"train_loss": -26.212451934814453, "global_step": 344657, "epoch": 4152} {"train_loss": -26.336475372314453, "global_step": 344658, "epoch": 4152} {"train_loss": -25.840391159057617, "global_step": 344659, "epoch": 4152} {"train_loss": -26.352954864501953, "global_step": 344660, "epoch": 4152} {"train_loss": -26.08527183532715, "global_step": 344661, "epoch": 4152} {"train_loss": -26.56854820251465, "global_step": 344662, "epoch": 4152} {"train_loss": -26.184661865234375, "global_step": 344663, "epoch": 4152} {"train_loss": -25.62006950378418, "global_step": 344664, "epoch": 4152} {"train_loss": -25.643600463867188, "global_step": 344665, "epoch": 4152} {"train_loss": -25.302417755126953, "global_step": 344666, "epoch": 4152} {"train_loss": -25.93976402282715, "global_step": 344667, "epoch": 4152} {"train_loss": -26.255712509155273, "global_step": 344668, "epoch": 4152} {"train_loss": -25.26873016357422, "global_step": 344669, "epoch": 4152} {"train_loss": -25.44856834411621, "global_step": 344670, "epoch": 4152} {"train_loss": -26.274890899658203, "global_step": 344671, "epoch": 4152} {"train_loss": -25.378808975219727, "global_step": 344672, "epoch": 4152} {"train_loss": -25.723981857299805, "global_step": 344673, "epoch": 4152} {"train_loss": -25.711307525634766, "global_step": 344674, "epoch": 4152} {"train_loss": -26.25823402404785, "global_step": 344675, "epoch": 4152} {"train_loss": -25.586898803710938, "global_step": 344676, "epoch": 4152} {"train_loss": -25.982519149780273, "global_step": 344677, "epoch": 4152} {"train_loss": -26.33391761779785, "global_step": 344678, "epoch": 4152} {"train_loss": -25.92134666442871, "global_step": 344679, "epoch": 4152} {"train_loss": -25.8342342376709, "global_step": 344680, "epoch": 4152} {"train_loss": -25.82293128967285, "global_step": 344681, "epoch": 4152} {"train_loss": -26.068891525268555, "global_step": 344682, "epoch": 4152} {"train_loss": -26.401227951049805, "global_step": 344683, "epoch": 4152} {"train_loss": -26.1964111328125, "global_step": 344684, "epoch": 4152} {"train_loss": -25.989904403686523, "global_step": 344685, "epoch": 4152} {"train_loss": -26.261449813842773, "global_step": 344686, "epoch": 4152} {"train_loss": -25.8872127532959, "global_step": 344687, "epoch": 4152} {"train_loss": -26.2503719329834, "global_step": 344688, "epoch": 4152} {"train_loss": -26.06939125061035, "global_step": 344689, "epoch": 4152} {"train_loss": -26.0809268951416, "global_step": 344690, "epoch": 4152} {"train_loss": -25.7687931060791, "global_step": 344691, "epoch": 4152} {"train_loss": -26.483203887939453, "global_step": 344692, "epoch": 4152} {"train_loss": -26.306745529174805, "global_step": 344693, "epoch": 4152} {"train_loss": -26.169713973999023, "global_step": 344694, "epoch": 4152} {"train_loss": -26.057952880859375, "global_step": 344695, "epoch": 4152} {"train_loss": -25.910879135131836, "global_step": 344696, "epoch": 4152} {"train_loss": -26.132184982299805, "global_step": 344697, "epoch": 4152} {"train_loss": -25.97854857846915, "global_step": 344698, "epoch": 4152, "val_loss": 6682579.5} {"train_loss": -25.836416244506836, "global_step": 344699, "epoch": 4153} {"train_loss": -25.960712432861328, "global_step": 344700, "epoch": 4153} {"train_loss": -26.020212173461914, "global_step": 344701, "epoch": 4153} {"train_loss": -25.44144058227539, "global_step": 344702, "epoch": 4153} {"train_loss": -25.8326358795166, "global_step": 344703, "epoch": 4153} {"train_loss": -25.745161056518555, "global_step": 344704, "epoch": 4153} {"train_loss": -25.989164352416992, "global_step": 344705, "epoch": 4153} {"train_loss": -26.083831787109375, "global_step": 344706, "epoch": 4153} {"train_loss": -25.933563232421875, "global_step": 344707, "epoch": 4153} {"train_loss": -25.9343204498291, "global_step": 344708, "epoch": 4153} {"train_loss": -25.771947860717773, "global_step": 344709, "epoch": 4153} {"train_loss": -26.24066162109375, "global_step": 344710, "epoch": 4153} {"train_loss": -25.83342933654785, "global_step": 344711, "epoch": 4153} {"train_loss": -25.582605361938477, "global_step": 344712, "epoch": 4153} {"train_loss": -25.998779296875, "global_step": 344713, "epoch": 4153} {"train_loss": -26.1075382232666, "global_step": 344714, "epoch": 4153} {"train_loss": -25.47986602783203, "global_step": 344715, "epoch": 4153} {"train_loss": -25.784076690673828, "global_step": 344716, "epoch": 4153} {"train_loss": -25.61162757873535, "global_step": 344717, "epoch": 4153} {"train_loss": -25.73665428161621, "global_step": 344718, "epoch": 4153} {"train_loss": -26.114694595336914, "global_step": 344719, "epoch": 4153} {"train_loss": -25.889190673828125, "global_step": 344720, "epoch": 4153} {"train_loss": -25.970869064331055, "global_step": 344721, "epoch": 4153} {"train_loss": -26.0751895904541, "global_step": 344722, "epoch": 4153} {"train_loss": -25.846515655517578, "global_step": 344723, "epoch": 4153} {"train_loss": -25.512025833129883, "global_step": 344724, "epoch": 4153} {"train_loss": -25.603790283203125, "global_step": 344725, "epoch": 4153} {"train_loss": -26.277990341186523, "global_step": 344726, "epoch": 4153} {"train_loss": -25.68671989440918, "global_step": 344727, "epoch": 4153} {"train_loss": -26.317829132080078, "global_step": 344728, "epoch": 4153} {"train_loss": -26.054372787475586, "global_step": 344729, "epoch": 4153} {"train_loss": -26.426456451416016, "global_step": 344730, "epoch": 4153} {"train_loss": -26.20358657836914, "global_step": 344731, "epoch": 4153} {"train_loss": -26.039779663085938, "global_step": 344732, "epoch": 4153} {"train_loss": -26.139692306518555, "global_step": 344733, "epoch": 4153} {"train_loss": -25.883243560791016, "global_step": 344734, "epoch": 4153} {"train_loss": -26.011932373046875, "global_step": 344735, "epoch": 4153} {"train_loss": -26.281879425048828, "global_step": 344736, "epoch": 4153} {"train_loss": -26.366910934448242, "global_step": 344737, "epoch": 4153} {"train_loss": -26.153589248657227, "global_step": 344738, "epoch": 4153} {"train_loss": -26.17889404296875, "global_step": 344739, "epoch": 4153} {"train_loss": -25.840635299682617, "global_step": 344740, "epoch": 4153} {"train_loss": -26.425891876220703, "global_step": 344741, "epoch": 4153} {"train_loss": -26.4984188079834, "global_step": 344742, "epoch": 4153} {"train_loss": -26.25994300842285, "global_step": 344743, "epoch": 4153} {"train_loss": -25.85682487487793, "global_step": 344744, "epoch": 4153} {"train_loss": -26.073938369750977, "global_step": 344745, "epoch": 4153} {"train_loss": -26.017541885375977, "global_step": 344746, "epoch": 4153} {"train_loss": -26.1002140045166, "global_step": 344747, "epoch": 4153} {"train_loss": -25.95503044128418, "global_step": 344748, "epoch": 4153} {"train_loss": -26.126453399658203, "global_step": 344749, "epoch": 4153} {"train_loss": -26.007095336914062, "global_step": 344750, "epoch": 4153} {"train_loss": -26.60751724243164, "global_step": 344751, "epoch": 4153} {"train_loss": -26.511966705322266, "global_step": 344752, "epoch": 4153} {"train_loss": -26.35453224182129, "global_step": 344753, "epoch": 4153} {"train_loss": -26.204483032226562, "global_step": 344754, "epoch": 4153} {"train_loss": -26.3823184967041, "global_step": 344755, "epoch": 4153} {"train_loss": -26.091787338256836, "global_step": 344756, "epoch": 4153} {"train_loss": -26.524784088134766, "global_step": 344757, "epoch": 4153} {"train_loss": -26.322385787963867, "global_step": 344758, "epoch": 4153} {"train_loss": -26.25349235534668, "global_step": 344759, "epoch": 4153} {"train_loss": -26.44769287109375, "global_step": 344760, "epoch": 4153} {"train_loss": -26.373260498046875, "global_step": 344761, "epoch": 4153} {"train_loss": -26.062665939331055, "global_step": 344762, "epoch": 4153} {"train_loss": -26.195287704467773, "global_step": 344763, "epoch": 4153} {"train_loss": -26.417724609375, "global_step": 344764, "epoch": 4153} {"train_loss": -26.255477905273438, "global_step": 344765, "epoch": 4153} {"train_loss": -26.133493423461914, "global_step": 344766, "epoch": 4153} {"train_loss": -26.4527587890625, "global_step": 344767, "epoch": 4153} {"train_loss": -26.301355361938477, "global_step": 344768, "epoch": 4153} {"train_loss": -26.251087188720703, "global_step": 344769, "epoch": 4153} {"train_loss": -26.063003540039062, "global_step": 344770, "epoch": 4153} {"train_loss": -26.259241104125977, "global_step": 344771, "epoch": 4153} {"train_loss": -26.26714515686035, "global_step": 344772, "epoch": 4153} {"train_loss": -26.310760498046875, "global_step": 344773, "epoch": 4153} {"train_loss": -26.216394424438477, "global_step": 344774, "epoch": 4153} {"train_loss": -26.03059196472168, "global_step": 344775, "epoch": 4153} {"train_loss": -26.440465927124023, "global_step": 344776, "epoch": 4153} {"train_loss": -26.143774032592773, "global_step": 344777, "epoch": 4153} {"train_loss": -25.888477325439453, "global_step": 344778, "epoch": 4153} {"train_loss": -25.875003814697266, "global_step": 344779, "epoch": 4153} {"train_loss": -25.695119857788086, "global_step": 344780, "epoch": 4153} {"train_loss": -26.094507768929724, "global_step": 344781, "epoch": 4153, "val_loss": 6723448.0} {"train_loss": -25.015262603759766, "global_step": 344782, "epoch": 4154} {"train_loss": -23.58538818359375, "global_step": 344783, "epoch": 4154} {"train_loss": -23.750642776489258, "global_step": 344784, "epoch": 4154} {"train_loss": -25.17314338684082, "global_step": 344785, "epoch": 4154} {"train_loss": -24.68182945251465, "global_step": 344786, "epoch": 4154} {"train_loss": -24.704866409301758, "global_step": 344787, "epoch": 4154} {"train_loss": -25.349966049194336, "global_step": 344788, "epoch": 4154} {"train_loss": -24.608829498291016, "global_step": 344789, "epoch": 4154} {"train_loss": -25.268102645874023, "global_step": 344790, "epoch": 4154} {"train_loss": -25.014209747314453, "global_step": 344791, "epoch": 4154} {"train_loss": -24.496076583862305, "global_step": 344792, "epoch": 4154} {"train_loss": -25.225631713867188, "global_step": 344793, "epoch": 4154} {"train_loss": -25.081449508666992, "global_step": 344794, "epoch": 4154} {"train_loss": -25.134220123291016, "global_step": 344795, "epoch": 4154} {"train_loss": -25.464859008789062, "global_step": 344796, "epoch": 4154} {"train_loss": -25.17177963256836, "global_step": 344797, "epoch": 4154} {"train_loss": -24.952669143676758, "global_step": 344798, "epoch": 4154} {"train_loss": -25.274219512939453, "global_step": 344799, "epoch": 4154} {"train_loss": -25.713483810424805, "global_step": 344800, "epoch": 4154} {"train_loss": -25.59784507751465, "global_step": 344801, "epoch": 4154} {"train_loss": -25.48287010192871, "global_step": 344802, "epoch": 4154} {"train_loss": -25.711109161376953, "global_step": 344803, "epoch": 4154} {"train_loss": -25.33420753479004, "global_step": 344804, "epoch": 4154} {"train_loss": -25.828907012939453, "global_step": 344805, "epoch": 4154} {"train_loss": -25.55201530456543, "global_step": 344806, "epoch": 4154} {"train_loss": -25.358409881591797, "global_step": 344807, "epoch": 4154} {"train_loss": -25.77423095703125, "global_step": 344808, "epoch": 4154} {"train_loss": -25.458559036254883, "global_step": 344809, "epoch": 4154} {"train_loss": -25.737258911132812, "global_step": 344810, "epoch": 4154} {"train_loss": -25.808862686157227, "global_step": 344811, "epoch": 4154} {"train_loss": -25.674570083618164, "global_step": 344812, "epoch": 4154} {"train_loss": -26.3029842376709, "global_step": 344813, "epoch": 4154} {"train_loss": -26.05726432800293, "global_step": 344814, "epoch": 4154} {"train_loss": -25.754199981689453, "global_step": 344815, "epoch": 4154} {"train_loss": -26.2757625579834, "global_step": 344816, "epoch": 4154} {"train_loss": -26.09449577331543, "global_step": 344817, "epoch": 4154} {"train_loss": -26.11980628967285, "global_step": 344818, "epoch": 4154} {"train_loss": -26.203781127929688, "global_step": 344819, "epoch": 4154} {"train_loss": -25.92597007751465, "global_step": 344820, "epoch": 4154} {"train_loss": -25.88649559020996, "global_step": 344821, "epoch": 4154} {"train_loss": -26.10452651977539, "global_step": 344822, "epoch": 4154} {"train_loss": -25.851882934570312, "global_step": 344823, "epoch": 4154} {"train_loss": -25.891096115112305, "global_step": 344824, "epoch": 4154} {"train_loss": -26.2601375579834, "global_step": 344825, "epoch": 4154} {"train_loss": -25.758325576782227, "global_step": 344826, "epoch": 4154} {"train_loss": -25.929224014282227, "global_step": 344827, "epoch": 4154} {"train_loss": -25.72262954711914, "global_step": 344828, "epoch": 4154} {"train_loss": -26.254194259643555, "global_step": 344829, "epoch": 4154} {"train_loss": -26.202259063720703, "global_step": 344830, "epoch": 4154} {"train_loss": -26.066396713256836, "global_step": 344831, "epoch": 4154} {"train_loss": -25.97244644165039, "global_step": 344832, "epoch": 4154} {"train_loss": -26.321374893188477, "global_step": 344833, "epoch": 4154} {"train_loss": -26.23487663269043, "global_step": 344834, "epoch": 4154} {"train_loss": -26.227888107299805, "global_step": 344835, "epoch": 4154} {"train_loss": -26.268436431884766, "global_step": 344836, "epoch": 4154} {"train_loss": -26.172040939331055, "global_step": 344837, "epoch": 4154} {"train_loss": -26.51934242248535, "global_step": 344838, "epoch": 4154} {"train_loss": -26.633777618408203, "global_step": 344839, "epoch": 4154} {"train_loss": -26.473119735717773, "global_step": 344840, "epoch": 4154} {"train_loss": -26.01789665222168, "global_step": 344841, "epoch": 4154} {"train_loss": -26.40339469909668, "global_step": 344842, "epoch": 4154} {"train_loss": -25.859338760375977, "global_step": 344843, "epoch": 4154} {"train_loss": -26.372201919555664, "global_step": 344844, "epoch": 4154} {"train_loss": -26.089658737182617, "global_step": 344845, "epoch": 4154} {"train_loss": -26.6699275970459, "global_step": 344846, "epoch": 4154} {"train_loss": -26.28696060180664, "global_step": 344847, "epoch": 4154} {"train_loss": -26.256811141967773, "global_step": 344848, "epoch": 4154} {"train_loss": -26.303796768188477, "global_step": 344849, "epoch": 4154} {"train_loss": -26.156543731689453, "global_step": 344850, "epoch": 4154} {"train_loss": -26.208740234375, "global_step": 344851, "epoch": 4154} {"train_loss": -26.601200103759766, "global_step": 344852, "epoch": 4154} {"train_loss": -26.31084632873535, "global_step": 344853, "epoch": 4154} {"train_loss": -26.31328773498535, "global_step": 344854, "epoch": 4154} {"train_loss": -25.90887451171875, "global_step": 344855, "epoch": 4154} {"train_loss": -26.05118179321289, "global_step": 344856, "epoch": 4154} {"train_loss": -26.004575729370117, "global_step": 344857, "epoch": 4154} {"train_loss": -26.07465934753418, "global_step": 344858, "epoch": 4154} {"train_loss": -26.1849308013916, "global_step": 344859, "epoch": 4154} {"train_loss": -25.965839385986328, "global_step": 344860, "epoch": 4154} {"train_loss": -26.24810218811035, "global_step": 344861, "epoch": 4154} {"train_loss": -26.204076766967773, "global_step": 344862, "epoch": 4154} {"train_loss": -26.195302963256836, "global_step": 344863, "epoch": 4154} {"train_loss": -25.770836795669005, "global_step": 344864, "epoch": 4154, "val_loss": 6597093.0} {"train_loss": -24.85174560546875, "global_step": 344865, "epoch": 4155} {"train_loss": -22.370412826538086, "global_step": 344866, "epoch": 4155} {"train_loss": -19.964893341064453, "global_step": 344867, "epoch": 4155} {"train_loss": -20.474756240844727, "global_step": 344868, "epoch": 4155} {"train_loss": -24.276283264160156, "global_step": 344869, "epoch": 4155} {"train_loss": -22.999326705932617, "global_step": 344870, "epoch": 4155} {"train_loss": -24.457921981811523, "global_step": 344871, "epoch": 4155} {"train_loss": -23.843244552612305, "global_step": 344872, "epoch": 4155} {"train_loss": -24.112899780273438, "global_step": 344873, "epoch": 4155} {"train_loss": -24.629526138305664, "global_step": 344874, "epoch": 4155} {"train_loss": -24.026296615600586, "global_step": 344875, "epoch": 4155} {"train_loss": -24.13922691345215, "global_step": 344876, "epoch": 4155} {"train_loss": -24.46590805053711, "global_step": 344877, "epoch": 4155} {"train_loss": -24.9086856842041, "global_step": 344878, "epoch": 4155} {"train_loss": -24.749582290649414, "global_step": 344879, "epoch": 4155} {"train_loss": -24.384986877441406, "global_step": 344880, "epoch": 4155} {"train_loss": -24.517864227294922, "global_step": 344881, "epoch": 4155} {"train_loss": -24.494060516357422, "global_step": 344882, "epoch": 4155} {"train_loss": -24.80007553100586, "global_step": 344883, "epoch": 4155} {"train_loss": -24.366525650024414, "global_step": 344884, "epoch": 4155} {"train_loss": -24.705251693725586, "global_step": 344885, "epoch": 4155} {"train_loss": -24.820144653320312, "global_step": 344886, "epoch": 4155} {"train_loss": -24.570642471313477, "global_step": 344887, "epoch": 4155} {"train_loss": -24.96095848083496, "global_step": 344888, "epoch": 4155} {"train_loss": -25.442684173583984, "global_step": 344889, "epoch": 4155} {"train_loss": -25.08465003967285, "global_step": 344890, "epoch": 4155} {"train_loss": -25.255268096923828, "global_step": 344891, "epoch": 4155} {"train_loss": -25.7269287109375, "global_step": 344892, "epoch": 4155} {"train_loss": -25.296438217163086, "global_step": 344893, "epoch": 4155} {"train_loss": -25.49139976501465, "global_step": 344894, "epoch": 4155} {"train_loss": -24.799577713012695, "global_step": 344895, "epoch": 4155} {"train_loss": -24.481998443603516, "global_step": 344896, "epoch": 4155} {"train_loss": -25.266759872436523, "global_step": 344897, "epoch": 4155} {"train_loss": -25.216543197631836, "global_step": 344898, "epoch": 4155} {"train_loss": -25.547616958618164, "global_step": 344899, "epoch": 4155} {"train_loss": -25.56244468688965, "global_step": 344900, "epoch": 4155} {"train_loss": -25.517301559448242, "global_step": 344901, "epoch": 4155} {"train_loss": -25.435302734375, "global_step": 344902, "epoch": 4155} {"train_loss": -25.530725479125977, "global_step": 344903, "epoch": 4155} {"train_loss": -25.611328125, "global_step": 344904, "epoch": 4155} {"train_loss": -25.49629020690918, "global_step": 344905, "epoch": 4155} {"train_loss": -25.923389434814453, "global_step": 344906, "epoch": 4155} {"train_loss": -25.701587677001953, "global_step": 344907, "epoch": 4155} {"train_loss": -25.807615280151367, "global_step": 344908, "epoch": 4155} {"train_loss": -25.961389541625977, "global_step": 344909, "epoch": 4155} {"train_loss": -25.74750328063965, "global_step": 344910, "epoch": 4155} {"train_loss": -25.703535079956055, "global_step": 344911, "epoch": 4155} {"train_loss": -26.072622299194336, "global_step": 344912, "epoch": 4155} {"train_loss": -26.015653610229492, "global_step": 344913, "epoch": 4155} {"train_loss": -25.863910675048828, "global_step": 344914, "epoch": 4155} {"train_loss": -25.689111709594727, "global_step": 344915, "epoch": 4155} {"train_loss": -25.760297775268555, "global_step": 344916, "epoch": 4155} {"train_loss": -26.157867431640625, "global_step": 344917, "epoch": 4155} {"train_loss": -25.893630981445312, "global_step": 344918, "epoch": 4155} {"train_loss": -25.965452194213867, "global_step": 344919, "epoch": 4155} {"train_loss": -25.710235595703125, "global_step": 344920, "epoch": 4155} {"train_loss": -25.84921646118164, "global_step": 344921, "epoch": 4155} {"train_loss": -25.809310913085938, "global_step": 344922, "epoch": 4155} {"train_loss": -26.00858497619629, "global_step": 344923, "epoch": 4155} {"train_loss": -26.119586944580078, "global_step": 344924, "epoch": 4155} {"train_loss": -26.16644859313965, "global_step": 344925, "epoch": 4155} {"train_loss": -26.06448745727539, "global_step": 344926, "epoch": 4155} {"train_loss": -26.320499420166016, "global_step": 344927, "epoch": 4155} {"train_loss": -25.428808212280273, "global_step": 344928, "epoch": 4155} {"train_loss": -26.343900680541992, "global_step": 344929, "epoch": 4155} {"train_loss": -25.53327751159668, "global_step": 344930, "epoch": 4155} {"train_loss": -25.9773006439209, "global_step": 344931, "epoch": 4155} {"train_loss": -25.75949478149414, "global_step": 344932, "epoch": 4155} {"train_loss": -25.905521392822266, "global_step": 344933, "epoch": 4155} {"train_loss": -25.937061309814453, "global_step": 344934, "epoch": 4155} {"train_loss": -25.706212997436523, "global_step": 344935, "epoch": 4155} {"train_loss": -26.13570213317871, "global_step": 344936, "epoch": 4155} {"train_loss": -26.221372604370117, "global_step": 344937, "epoch": 4155} {"train_loss": -26.21101188659668, "global_step": 344938, "epoch": 4155} {"train_loss": -25.621912002563477, "global_step": 344939, "epoch": 4155} {"train_loss": -25.853046417236328, "global_step": 344940, "epoch": 4155} {"train_loss": -25.8787841796875, "global_step": 344941, "epoch": 4155} {"train_loss": -25.933887481689453, "global_step": 344942, "epoch": 4155} {"train_loss": -26.420812606811523, "global_step": 344943, "epoch": 4155} {"train_loss": -25.81990623474121, "global_step": 344944, "epoch": 4155} {"train_loss": -25.950824737548828, "global_step": 344945, "epoch": 4155} {"train_loss": -26.256193161010742, "global_step": 344946, "epoch": 4155} {"train_loss": -25.252476565809136, "global_step": 344947, "epoch": 4155, "val_loss": 6638298.0} {"train_loss": -25.825483322143555, "global_step": 344948, "epoch": 4156} {"train_loss": -25.86515235900879, "global_step": 344949, "epoch": 4156} {"train_loss": -25.8233699798584, "global_step": 344950, "epoch": 4156} {"train_loss": -25.559370040893555, "global_step": 344951, "epoch": 4156} {"train_loss": -25.867557525634766, "global_step": 344952, "epoch": 4156} {"train_loss": -25.233179092407227, "global_step": 344953, "epoch": 4156} {"train_loss": -25.633649826049805, "global_step": 344954, "epoch": 4156} {"train_loss": -25.93641471862793, "global_step": 344955, "epoch": 4156} {"train_loss": -26.094884872436523, "global_step": 344956, "epoch": 4156} {"train_loss": -25.838953018188477, "global_step": 344957, "epoch": 4156} {"train_loss": -25.61879539489746, "global_step": 344958, "epoch": 4156} {"train_loss": -25.733747482299805, "global_step": 344959, "epoch": 4156} {"train_loss": -25.96259880065918, "global_step": 344960, "epoch": 4156} {"train_loss": -25.965478897094727, "global_step": 344961, "epoch": 4156} {"train_loss": -26.220703125, "global_step": 344962, "epoch": 4156} {"train_loss": -26.04729652404785, "global_step": 344963, "epoch": 4156} {"train_loss": -25.801300048828125, "global_step": 344964, "epoch": 4156} {"train_loss": -25.766645431518555, "global_step": 344965, "epoch": 4156} {"train_loss": -25.9600887298584, "global_step": 344966, "epoch": 4156} {"train_loss": -25.79694938659668, "global_step": 344967, "epoch": 4156} {"train_loss": -25.760324478149414, "global_step": 344968, "epoch": 4156} {"train_loss": -25.946813583374023, "global_step": 344969, "epoch": 4156} {"train_loss": -26.280902862548828, "global_step": 344970, "epoch": 4156} {"train_loss": -26.194091796875, "global_step": 344971, "epoch": 4156} {"train_loss": -26.274160385131836, "global_step": 344972, "epoch": 4156} {"train_loss": -26.049091339111328, "global_step": 344973, "epoch": 4156} {"train_loss": -26.0045166015625, "global_step": 344974, "epoch": 4156} {"train_loss": -26.171436309814453, "global_step": 344975, "epoch": 4156} {"train_loss": -26.289697647094727, "global_step": 344976, "epoch": 4156} {"train_loss": -26.45796012878418, "global_step": 344977, "epoch": 4156} {"train_loss": -25.9417667388916, "global_step": 344978, "epoch": 4156} {"train_loss": -25.984045028686523, "global_step": 344979, "epoch": 4156} {"train_loss": -25.960437774658203, "global_step": 344980, "epoch": 4156} {"train_loss": -25.8817081451416, "global_step": 344981, "epoch": 4156} {"train_loss": -26.007003784179688, "global_step": 344982, "epoch": 4156} {"train_loss": -26.39857292175293, "global_step": 344983, "epoch": 4156} {"train_loss": -25.833744049072266, "global_step": 344984, "epoch": 4156} {"train_loss": -26.27296257019043, "global_step": 344985, "epoch": 4156} {"train_loss": -26.18828773498535, "global_step": 344986, "epoch": 4156} {"train_loss": -26.403278350830078, "global_step": 344987, "epoch": 4156} {"train_loss": -25.9255428314209, "global_step": 344988, "epoch": 4156} {"train_loss": -26.178625106811523, "global_step": 344989, "epoch": 4156} {"train_loss": -26.25421142578125, "global_step": 344990, "epoch": 4156} {"train_loss": -26.403228759765625, "global_step": 344991, "epoch": 4156} {"train_loss": -26.167346954345703, "global_step": 344992, "epoch": 4156} {"train_loss": -26.11090087890625, "global_step": 344993, "epoch": 4156} {"train_loss": -25.941049575805664, "global_step": 344994, "epoch": 4156} {"train_loss": -26.35480308532715, "global_step": 344995, "epoch": 4156} {"train_loss": -26.3392333984375, "global_step": 344996, "epoch": 4156} {"train_loss": -25.799951553344727, "global_step": 344997, "epoch": 4156} {"train_loss": -26.51807975769043, "global_step": 344998, "epoch": 4156} {"train_loss": -26.322656631469727, "global_step": 344999, "epoch": 4156} {"train_loss": -25.98408317565918, "global_step": 345000, "epoch": 4156} {"train_loss": -26.064468383789062, "global_step": 345001, "epoch": 4156} {"train_loss": -26.16111183166504, "global_step": 345002, "epoch": 4156} {"train_loss": -26.10645866394043, "global_step": 345003, "epoch": 4156} {"train_loss": -25.802444458007812, "global_step": 345004, "epoch": 4156} {"train_loss": -26.167606353759766, "global_step": 345005, "epoch": 4156} {"train_loss": -26.116485595703125, "global_step": 345006, "epoch": 4156} {"train_loss": -25.979328155517578, "global_step": 345007, "epoch": 4156} {"train_loss": -26.19207763671875, "global_step": 345008, "epoch": 4156} {"train_loss": -26.364501953125, "global_step": 345009, "epoch": 4156} {"train_loss": -25.80313491821289, "global_step": 345010, "epoch": 4156} {"train_loss": -25.814619064331055, "global_step": 345011, "epoch": 4156} {"train_loss": -26.048263549804688, "global_step": 345012, "epoch": 4156} {"train_loss": -26.0600643157959, "global_step": 345013, "epoch": 4156} {"train_loss": -25.980894088745117, "global_step": 345014, "epoch": 4156} {"train_loss": -26.3056697845459, "global_step": 345015, "epoch": 4156} {"train_loss": -25.828094482421875, "global_step": 345016, "epoch": 4156} {"train_loss": -25.841079711914062, "global_step": 345017, "epoch": 4156} {"train_loss": -26.232633590698242, "global_step": 345018, "epoch": 4156} {"train_loss": -25.892892837524414, "global_step": 345019, "epoch": 4156} {"train_loss": -26.005075454711914, "global_step": 345020, "epoch": 4156} {"train_loss": -26.013166427612305, "global_step": 345021, "epoch": 4156} {"train_loss": -26.203826904296875, "global_step": 345022, "epoch": 4156} {"train_loss": -25.658273696899414, "global_step": 345023, "epoch": 4156} {"train_loss": -26.38126564025879, "global_step": 345024, "epoch": 4156} {"train_loss": -26.207489013671875, "global_step": 345025, "epoch": 4156} {"train_loss": -25.938556671142578, "global_step": 345026, "epoch": 4156} {"train_loss": -26.166107177734375, "global_step": 345027, "epoch": 4156} {"train_loss": -25.886533737182617, "global_step": 345028, "epoch": 4156} {"train_loss": -25.757354736328125, "global_step": 345029, "epoch": 4156} {"train_loss": -26.03532251105251, "global_step": 345030, "epoch": 4156, "val_loss": 6520474.0} {"train_loss": -25.877704620361328, "global_step": 345031, "epoch": 4157} {"train_loss": -24.811527252197266, "global_step": 345032, "epoch": 4157} {"train_loss": -23.779186248779297, "global_step": 345033, "epoch": 4157} {"train_loss": -24.620513916015625, "global_step": 345034, "epoch": 4157} {"train_loss": -25.50495719909668, "global_step": 345035, "epoch": 4157} {"train_loss": -25.082056045532227, "global_step": 345036, "epoch": 4157} {"train_loss": -25.33428192138672, "global_step": 345037, "epoch": 4157} {"train_loss": -25.44893455505371, "global_step": 345038, "epoch": 4157} {"train_loss": -25.207719802856445, "global_step": 345039, "epoch": 4157} {"train_loss": -25.6290225982666, "global_step": 345040, "epoch": 4157} {"train_loss": -25.209209442138672, "global_step": 345041, "epoch": 4157} {"train_loss": -25.66289710998535, "global_step": 345042, "epoch": 4157} {"train_loss": -25.4841365814209, "global_step": 345043, "epoch": 4157} {"train_loss": -25.320425033569336, "global_step": 345044, "epoch": 4157} {"train_loss": -25.812713623046875, "global_step": 345045, "epoch": 4157} {"train_loss": -25.612598419189453, "global_step": 345046, "epoch": 4157} {"train_loss": -26.026294708251953, "global_step": 345047, "epoch": 4157} {"train_loss": -25.71553611755371, "global_step": 345048, "epoch": 4157} {"train_loss": -25.787677764892578, "global_step": 345049, "epoch": 4157} {"train_loss": -25.605871200561523, "global_step": 345050, "epoch": 4157} {"train_loss": -25.666339874267578, "global_step": 345051, "epoch": 4157} {"train_loss": -25.7432918548584, "global_step": 345052, "epoch": 4157} {"train_loss": -26.00510025024414, "global_step": 345053, "epoch": 4157} {"train_loss": -26.16106605529785, "global_step": 345054, "epoch": 4157} {"train_loss": -25.991506576538086, "global_step": 345055, "epoch": 4157} {"train_loss": -25.86964225769043, "global_step": 345056, "epoch": 4157} {"train_loss": -26.0029354095459, "global_step": 345057, "epoch": 4157} {"train_loss": -26.041458129882812, "global_step": 345058, "epoch": 4157} {"train_loss": -25.9183292388916, "global_step": 345059, "epoch": 4157} {"train_loss": -26.175098419189453, "global_step": 345060, "epoch": 4157} {"train_loss": -26.38840675354004, "global_step": 345061, "epoch": 4157} {"train_loss": -25.87912368774414, "global_step": 345062, "epoch": 4157} {"train_loss": -25.924680709838867, "global_step": 345063, "epoch": 4157} {"train_loss": -26.235305786132812, "global_step": 345064, "epoch": 4157} {"train_loss": -26.154071807861328, "global_step": 345065, "epoch": 4157} {"train_loss": -26.5767765045166, "global_step": 345066, "epoch": 4157} {"train_loss": -25.88019371032715, "global_step": 345067, "epoch": 4157} {"train_loss": -26.276609420776367, "global_step": 345068, "epoch": 4157} {"train_loss": -26.172956466674805, "global_step": 345069, "epoch": 4157} {"train_loss": -26.380598068237305, "global_step": 345070, "epoch": 4157} {"train_loss": -26.354755401611328, "global_step": 345071, "epoch": 4157} {"train_loss": -26.256824493408203, "global_step": 345072, "epoch": 4157} {"train_loss": -26.03130531311035, "global_step": 345073, "epoch": 4157} {"train_loss": -26.05254554748535, "global_step": 345074, "epoch": 4157} {"train_loss": -25.675085067749023, "global_step": 345075, "epoch": 4157} {"train_loss": -26.028295516967773, "global_step": 345076, "epoch": 4157} {"train_loss": -26.457000732421875, "global_step": 345077, "epoch": 4157} {"train_loss": -26.200048446655273, "global_step": 345078, "epoch": 4157} {"train_loss": -25.778833389282227, "global_step": 345079, "epoch": 4157} {"train_loss": -26.45061683654785, "global_step": 345080, "epoch": 4157} {"train_loss": -26.682453155517578, "global_step": 345081, "epoch": 4157} {"train_loss": -25.76838493347168, "global_step": 345082, "epoch": 4157} {"train_loss": -26.020292282104492, "global_step": 345083, "epoch": 4157} {"train_loss": -25.57075309753418, "global_step": 345084, "epoch": 4157} {"train_loss": -26.56227684020996, "global_step": 345085, "epoch": 4157} {"train_loss": -25.850906372070312, "global_step": 345086, "epoch": 4157} {"train_loss": -26.013355255126953, "global_step": 345087, "epoch": 4157} {"train_loss": -26.078100204467773, "global_step": 345088, "epoch": 4157} {"train_loss": -25.93994140625, "global_step": 345089, "epoch": 4157} {"train_loss": -26.361509323120117, "global_step": 345090, "epoch": 4157} {"train_loss": -26.191761016845703, "global_step": 345091, "epoch": 4157} {"train_loss": -26.497150421142578, "global_step": 345092, "epoch": 4157} {"train_loss": -26.13750648498535, "global_step": 345093, "epoch": 4157} {"train_loss": -25.60963249206543, "global_step": 345094, "epoch": 4157} {"train_loss": -26.3356990814209, "global_step": 345095, "epoch": 4157} {"train_loss": -26.133886337280273, "global_step": 345096, "epoch": 4157} {"train_loss": -26.50762367248535, "global_step": 345097, "epoch": 4157} {"train_loss": -25.803247451782227, "global_step": 345098, "epoch": 4157} {"train_loss": -26.289642333984375, "global_step": 345099, "epoch": 4157} {"train_loss": -25.996673583984375, "global_step": 345100, "epoch": 4157} {"train_loss": -26.389265060424805, "global_step": 345101, "epoch": 4157} {"train_loss": -25.976667404174805, "global_step": 345102, "epoch": 4157} {"train_loss": -26.004898071289062, "global_step": 345103, "epoch": 4157} {"train_loss": -26.0250244140625, "global_step": 345104, "epoch": 4157} {"train_loss": -26.15997314453125, "global_step": 345105, "epoch": 4157} {"train_loss": -26.4343318939209, "global_step": 345106, "epoch": 4157} {"train_loss": -26.020627975463867, "global_step": 345107, "epoch": 4157} {"train_loss": -25.808835983276367, "global_step": 345108, "epoch": 4157} {"train_loss": -26.38227653503418, "global_step": 345109, "epoch": 4157} {"train_loss": -26.23310661315918, "global_step": 345110, "epoch": 4157} {"train_loss": -26.334692001342773, "global_step": 345111, "epoch": 4157} {"train_loss": -26.026647567749023, "global_step": 345112, "epoch": 4157} {"train_loss": -25.928930926035687, "global_step": 345113, "epoch": 4157, "val_loss": 6601944.0} {"train_loss": -25.244169235229492, "global_step": 345114, "epoch": 4158} {"train_loss": -25.640125274658203, "global_step": 345115, "epoch": 4158} {"train_loss": -25.565031051635742, "global_step": 345116, "epoch": 4158} {"train_loss": -25.471210479736328, "global_step": 345117, "epoch": 4158} {"train_loss": -25.584182739257812, "global_step": 345118, "epoch": 4158} {"train_loss": -25.361989974975586, "global_step": 345119, "epoch": 4158} {"train_loss": -25.8353271484375, "global_step": 345120, "epoch": 4158} {"train_loss": -26.205671310424805, "global_step": 345121, "epoch": 4158} {"train_loss": -25.73670768737793, "global_step": 345122, "epoch": 4158} {"train_loss": -25.893802642822266, "global_step": 345123, "epoch": 4158} {"train_loss": -25.66668128967285, "global_step": 345124, "epoch": 4158} {"train_loss": -25.675342559814453, "global_step": 345125, "epoch": 4158} {"train_loss": -26.070056915283203, "global_step": 345126, "epoch": 4158} {"train_loss": -25.96022605895996, "global_step": 345127, "epoch": 4158} {"train_loss": -25.825937271118164, "global_step": 345128, "epoch": 4158} {"train_loss": -25.881820678710938, "global_step": 345129, "epoch": 4158} {"train_loss": -25.602075576782227, "global_step": 345130, "epoch": 4158} {"train_loss": -25.975921630859375, "global_step": 345131, "epoch": 4158} {"train_loss": -25.568227767944336, "global_step": 345132, "epoch": 4158} {"train_loss": -25.82337760925293, "global_step": 345133, "epoch": 4158} {"train_loss": -25.67036247253418, "global_step": 345134, "epoch": 4158} {"train_loss": -25.91713523864746, "global_step": 345135, "epoch": 4158} {"train_loss": -25.5175838470459, "global_step": 345136, "epoch": 4158} {"train_loss": -25.85210609436035, "global_step": 345137, "epoch": 4158} {"train_loss": -25.964120864868164, "global_step": 345138, "epoch": 4158} {"train_loss": -26.172840118408203, "global_step": 345139, "epoch": 4158} {"train_loss": -26.005615234375, "global_step": 345140, "epoch": 4158} {"train_loss": -25.73691749572754, "global_step": 345141, "epoch": 4158} {"train_loss": -25.389556884765625, "global_step": 345142, "epoch": 4158} {"train_loss": -25.895355224609375, "global_step": 345143, "epoch": 4158} {"train_loss": -26.095478057861328, "global_step": 345144, "epoch": 4158} {"train_loss": -26.075244903564453, "global_step": 345145, "epoch": 4158} {"train_loss": -25.773710250854492, "global_step": 345146, "epoch": 4158} {"train_loss": -26.3812313079834, "global_step": 345147, "epoch": 4158} {"train_loss": -26.03240966796875, "global_step": 345148, "epoch": 4158} {"train_loss": -26.303787231445312, "global_step": 345149, "epoch": 4158} {"train_loss": -25.990930557250977, "global_step": 345150, "epoch": 4158} {"train_loss": -26.46323013305664, "global_step": 345151, "epoch": 4158} {"train_loss": -26.216552734375, "global_step": 345152, "epoch": 4158} {"train_loss": -26.18513298034668, "global_step": 345153, "epoch": 4158} {"train_loss": -26.18134117126465, "global_step": 345154, "epoch": 4158} {"train_loss": -26.492826461791992, "global_step": 345155, "epoch": 4158} {"train_loss": -25.853534698486328, "global_step": 345156, "epoch": 4158} {"train_loss": -26.025121688842773, "global_step": 345157, "epoch": 4158} {"train_loss": -26.62442398071289, "global_step": 345158, "epoch": 4158} {"train_loss": -26.22256851196289, "global_step": 345159, "epoch": 4158} {"train_loss": -26.392969131469727, "global_step": 345160, "epoch": 4158} {"train_loss": -26.196706771850586, "global_step": 345161, "epoch": 4158} {"train_loss": -26.30994987487793, "global_step": 345162, "epoch": 4158} {"train_loss": -25.898193359375, "global_step": 345163, "epoch": 4158} {"train_loss": -26.11882972717285, "global_step": 345164, "epoch": 4158} {"train_loss": -26.271703720092773, "global_step": 345165, "epoch": 4158} {"train_loss": -26.452560424804688, "global_step": 345166, "epoch": 4158} {"train_loss": -26.0484619140625, "global_step": 345167, "epoch": 4158} {"train_loss": -26.121490478515625, "global_step": 345168, "epoch": 4158} {"train_loss": -26.52765464782715, "global_step": 345169, "epoch": 4158} {"train_loss": -26.223424911499023, "global_step": 345170, "epoch": 4158} {"train_loss": -26.13384437561035, "global_step": 345171, "epoch": 4158} {"train_loss": -26.08429527282715, "global_step": 345172, "epoch": 4158} {"train_loss": -25.761432647705078, "global_step": 345173, "epoch": 4158} {"train_loss": -25.967777252197266, "global_step": 345174, "epoch": 4158} {"train_loss": -26.187849044799805, "global_step": 345175, "epoch": 4158} {"train_loss": -25.962858200073242, "global_step": 345176, "epoch": 4158} {"train_loss": -26.016565322875977, "global_step": 345177, "epoch": 4158} {"train_loss": -26.23859214782715, "global_step": 345178, "epoch": 4158} {"train_loss": -26.02882194519043, "global_step": 345179, "epoch": 4158} {"train_loss": -25.6965274810791, "global_step": 345180, "epoch": 4158} {"train_loss": -26.176624298095703, "global_step": 345181, "epoch": 4158} {"train_loss": -26.01956558227539, "global_step": 345182, "epoch": 4158} {"train_loss": -26.203760147094727, "global_step": 345183, "epoch": 4158} {"train_loss": -25.96857261657715, "global_step": 345184, "epoch": 4158} {"train_loss": -26.183948516845703, "global_step": 345185, "epoch": 4158} {"train_loss": -26.126733779907227, "global_step": 345186, "epoch": 4158} {"train_loss": -26.39809226989746, "global_step": 345187, "epoch": 4158} {"train_loss": -26.328882217407227, "global_step": 345188, "epoch": 4158} {"train_loss": -26.18958854675293, "global_step": 345189, "epoch": 4158} {"train_loss": -26.369245529174805, "global_step": 345190, "epoch": 4158} {"train_loss": -25.828018188476562, "global_step": 345191, "epoch": 4158} {"train_loss": -25.95369529724121, "global_step": 345192, "epoch": 4158} {"train_loss": -25.98026466369629, "global_step": 345193, "epoch": 4158} {"train_loss": -26.28472328186035, "global_step": 345194, "epoch": 4158} {"train_loss": -25.794326782226562, "global_step": 345195, "epoch": 4158} {"train_loss": -25.996456605842315, "global_step": 345196, "epoch": 4158, "val_loss": 6603654.0} {"train_loss": -24.42596435546875, "global_step": 345197, "epoch": 4159} {"train_loss": -24.770423889160156, "global_step": 345198, "epoch": 4159} {"train_loss": -24.668989181518555, "global_step": 345199, "epoch": 4159} {"train_loss": -25.103496551513672, "global_step": 345200, "epoch": 4159} {"train_loss": -25.567440032958984, "global_step": 345201, "epoch": 4159} {"train_loss": -25.766752243041992, "global_step": 345202, "epoch": 4159} {"train_loss": -25.467679977416992, "global_step": 345203, "epoch": 4159} {"train_loss": -25.363723754882812, "global_step": 345204, "epoch": 4159} {"train_loss": -25.777851104736328, "global_step": 345205, "epoch": 4159} {"train_loss": -25.54216194152832, "global_step": 345206, "epoch": 4159} {"train_loss": -25.549192428588867, "global_step": 345207, "epoch": 4159} {"train_loss": -25.523330688476562, "global_step": 345208, "epoch": 4159} {"train_loss": -25.714460372924805, "global_step": 345209, "epoch": 4159} {"train_loss": -25.636266708374023, "global_step": 345210, "epoch": 4159} {"train_loss": -25.535654067993164, "global_step": 345211, "epoch": 4159} {"train_loss": -25.64389991760254, "global_step": 345212, "epoch": 4159} {"train_loss": -25.439363479614258, "global_step": 345213, "epoch": 4159} {"train_loss": -25.57966423034668, "global_step": 345214, "epoch": 4159} {"train_loss": -25.72150993347168, "global_step": 345215, "epoch": 4159} {"train_loss": -26.269208908081055, "global_step": 345216, "epoch": 4159} {"train_loss": -25.47666358947754, "global_step": 345217, "epoch": 4159} {"train_loss": -25.38865852355957, "global_step": 345218, "epoch": 4159} {"train_loss": -25.8924617767334, "global_step": 345219, "epoch": 4159} {"train_loss": -25.698810577392578, "global_step": 345220, "epoch": 4159} {"train_loss": -25.599149703979492, "global_step": 345221, "epoch": 4159} {"train_loss": -25.585342407226562, "global_step": 345222, "epoch": 4159} {"train_loss": -25.872949600219727, "global_step": 345223, "epoch": 4159} {"train_loss": -25.667850494384766, "global_step": 345224, "epoch": 4159} {"train_loss": -25.89039421081543, "global_step": 345225, "epoch": 4159} {"train_loss": -25.728376388549805, "global_step": 345226, "epoch": 4159} {"train_loss": -25.738845825195312, "global_step": 345227, "epoch": 4159} {"train_loss": -26.320087432861328, "global_step": 345228, "epoch": 4159} {"train_loss": -25.947446823120117, "global_step": 345229, "epoch": 4159} {"train_loss": -26.065317153930664, "global_step": 345230, "epoch": 4159} {"train_loss": -25.944549560546875, "global_step": 345231, "epoch": 4159} {"train_loss": -25.882749557495117, "global_step": 345232, "epoch": 4159} {"train_loss": -25.824512481689453, "global_step": 345233, "epoch": 4159} {"train_loss": -26.06574821472168, "global_step": 345234, "epoch": 4159} {"train_loss": -26.08192253112793, "global_step": 345235, "epoch": 4159} {"train_loss": -26.191076278686523, "global_step": 345236, "epoch": 4159} {"train_loss": -26.145263671875, "global_step": 345237, "epoch": 4159} {"train_loss": -25.91778564453125, "global_step": 345238, "epoch": 4159} {"train_loss": -26.077863693237305, "global_step": 345239, "epoch": 4159} {"train_loss": -26.084440231323242, "global_step": 345240, "epoch": 4159} {"train_loss": -25.816909790039062, "global_step": 345241, "epoch": 4159} {"train_loss": -25.91350746154785, "global_step": 345242, "epoch": 4159} {"train_loss": -25.956298828125, "global_step": 345243, "epoch": 4159} {"train_loss": -26.20655632019043, "global_step": 345244, "epoch": 4159} {"train_loss": -25.79816246032715, "global_step": 345245, "epoch": 4159} {"train_loss": -25.851318359375, "global_step": 345246, "epoch": 4159} {"train_loss": -25.767105102539062, "global_step": 345247, "epoch": 4159} {"train_loss": -25.557043075561523, "global_step": 345248, "epoch": 4159} {"train_loss": -25.99078941345215, "global_step": 345249, "epoch": 4159} {"train_loss": -25.78983497619629, "global_step": 345250, "epoch": 4159} {"train_loss": -26.1890926361084, "global_step": 345251, "epoch": 4159} {"train_loss": -26.28812599182129, "global_step": 345252, "epoch": 4159} {"train_loss": -25.842893600463867, "global_step": 345253, "epoch": 4159} {"train_loss": -26.035205841064453, "global_step": 345254, "epoch": 4159} {"train_loss": -26.05353355407715, "global_step": 345255, "epoch": 4159} {"train_loss": -26.03622817993164, "global_step": 345256, "epoch": 4159} {"train_loss": -26.2394962310791, "global_step": 345257, "epoch": 4159} {"train_loss": -26.3596134185791, "global_step": 345258, "epoch": 4159} {"train_loss": -26.0722713470459, "global_step": 345259, "epoch": 4159} {"train_loss": -26.328536987304688, "global_step": 345260, "epoch": 4159} {"train_loss": -26.503829956054688, "global_step": 345261, "epoch": 4159} {"train_loss": -26.443899154663086, "global_step": 345262, "epoch": 4159} {"train_loss": -26.09967613220215, "global_step": 345263, "epoch": 4159} {"train_loss": -26.2690372467041, "global_step": 345264, "epoch": 4159} {"train_loss": -26.060556411743164, "global_step": 345265, "epoch": 4159} {"train_loss": -26.381383895874023, "global_step": 345266, "epoch": 4159} {"train_loss": -26.31458854675293, "global_step": 345267, "epoch": 4159} {"train_loss": -26.27264976501465, "global_step": 345268, "epoch": 4159} {"train_loss": -26.241174697875977, "global_step": 345269, "epoch": 4159} {"train_loss": -25.947498321533203, "global_step": 345270, "epoch": 4159} {"train_loss": -26.035541534423828, "global_step": 345271, "epoch": 4159} {"train_loss": -26.555078506469727, "global_step": 345272, "epoch": 4159} {"train_loss": -26.007293701171875, "global_step": 345273, "epoch": 4159} {"train_loss": -26.16151237487793, "global_step": 345274, "epoch": 4159} {"train_loss": -26.40252113342285, "global_step": 345275, "epoch": 4159} {"train_loss": -25.87482261657715, "global_step": 345276, "epoch": 4159} {"train_loss": -26.45448112487793, "global_step": 345277, "epoch": 4159} {"train_loss": -26.40707778930664, "global_step": 345278, "epoch": 4159} {"train_loss": -25.86976494846574, "global_step": 345279, "epoch": 4159, "val_loss": 6593800.0} {"train_loss": -26.06694984436035, "global_step": 345280, "epoch": 4160} {"train_loss": -26.085275650024414, "global_step": 345281, "epoch": 4160} {"train_loss": -25.5185604095459, "global_step": 345282, "epoch": 4160} {"train_loss": -25.844873428344727, "global_step": 345283, "epoch": 4160} {"train_loss": -25.4572811126709, "global_step": 345284, "epoch": 4160} {"train_loss": -25.311687469482422, "global_step": 345285, "epoch": 4160} {"train_loss": -25.60908317565918, "global_step": 345286, "epoch": 4160} {"train_loss": -25.7576847076416, "global_step": 345287, "epoch": 4160} {"train_loss": -25.875864028930664, "global_step": 345288, "epoch": 4160} {"train_loss": -25.641525268554688, "global_step": 345289, "epoch": 4160} {"train_loss": -25.8355655670166, "global_step": 345290, "epoch": 4160} {"train_loss": -26.10500144958496, "global_step": 345291, "epoch": 4160} {"train_loss": -25.187536239624023, "global_step": 345292, "epoch": 4160} {"train_loss": -26.040021896362305, "global_step": 345293, "epoch": 4160} {"train_loss": -25.6716365814209, "global_step": 345294, "epoch": 4160} {"train_loss": -25.87652015686035, "global_step": 345295, "epoch": 4160} {"train_loss": -25.867080688476562, "global_step": 345296, "epoch": 4160} {"train_loss": -25.75623893737793, "global_step": 345297, "epoch": 4160} {"train_loss": -25.661808013916016, "global_step": 345298, "epoch": 4160} {"train_loss": -25.933202743530273, "global_step": 345299, "epoch": 4160} {"train_loss": -25.60915184020996, "global_step": 345300, "epoch": 4160} {"train_loss": -26.153928756713867, "global_step": 345301, "epoch": 4160} {"train_loss": -26.095870971679688, "global_step": 345302, "epoch": 4160} {"train_loss": -25.801593780517578, "global_step": 345303, "epoch": 4160} {"train_loss": -26.133169174194336, "global_step": 345304, "epoch": 4160} {"train_loss": -25.8653564453125, "global_step": 345305, "epoch": 4160} {"train_loss": -25.56203269958496, "global_step": 345306, "epoch": 4160} {"train_loss": -25.819448471069336, "global_step": 345307, "epoch": 4160} {"train_loss": -26.240345001220703, "global_step": 345308, "epoch": 4160} {"train_loss": -25.999319076538086, "global_step": 345309, "epoch": 4160} {"train_loss": -25.77813148498535, "global_step": 345310, "epoch": 4160} {"train_loss": -25.9992733001709, "global_step": 345311, "epoch": 4160} {"train_loss": -26.057159423828125, "global_step": 345312, "epoch": 4160} {"train_loss": -25.97792625427246, "global_step": 345313, "epoch": 4160} {"train_loss": -26.2167911529541, "global_step": 345314, "epoch": 4160} {"train_loss": -26.01772117614746, "global_step": 345315, "epoch": 4160} {"train_loss": -26.255640029907227, "global_step": 345316, "epoch": 4160} {"train_loss": -26.185056686401367, "global_step": 345317, "epoch": 4160} {"train_loss": -26.500213623046875, "global_step": 345318, "epoch": 4160} {"train_loss": -25.95503807067871, "global_step": 345319, "epoch": 4160} {"train_loss": -26.422882080078125, "global_step": 345320, "epoch": 4160} {"train_loss": -26.606542587280273, "global_step": 345321, "epoch": 4160} {"train_loss": -26.110828399658203, "global_step": 345322, "epoch": 4160} {"train_loss": -26.55474281311035, "global_step": 345323, "epoch": 4160} {"train_loss": -26.546356201171875, "global_step": 345324, "epoch": 4160} {"train_loss": -26.081350326538086, "global_step": 345325, "epoch": 4160} {"train_loss": -26.696720123291016, "global_step": 345326, "epoch": 4160} {"train_loss": -26.38214683532715, "global_step": 345327, "epoch": 4160} {"train_loss": -26.376148223876953, "global_step": 345328, "epoch": 4160} {"train_loss": -26.10256004333496, "global_step": 345329, "epoch": 4160} {"train_loss": -26.543874740600586, "global_step": 345330, "epoch": 4160} {"train_loss": -26.389867782592773, "global_step": 345331, "epoch": 4160} {"train_loss": -25.754674911499023, "global_step": 345332, "epoch": 4160} {"train_loss": -25.952163696289062, "global_step": 345333, "epoch": 4160} {"train_loss": -26.2406005859375, "global_step": 345334, "epoch": 4160} {"train_loss": -26.269811630249023, "global_step": 345335, "epoch": 4160} {"train_loss": -26.17805290222168, "global_step": 345336, "epoch": 4160} {"train_loss": -25.945783615112305, "global_step": 345337, "epoch": 4160} {"train_loss": -25.83929443359375, "global_step": 345338, "epoch": 4160} {"train_loss": -25.415674209594727, "global_step": 345339, "epoch": 4160} {"train_loss": -25.856531143188477, "global_step": 345340, "epoch": 4160} {"train_loss": -25.891204833984375, "global_step": 345341, "epoch": 4160} {"train_loss": -25.7225341796875, "global_step": 345342, "epoch": 4160} {"train_loss": -25.59844970703125, "global_step": 345343, "epoch": 4160} {"train_loss": -25.874267578125, "global_step": 345344, "epoch": 4160} {"train_loss": -25.774229049682617, "global_step": 345345, "epoch": 4160} {"train_loss": -25.98676109313965, "global_step": 345346, "epoch": 4160} {"train_loss": -26.18446159362793, "global_step": 345347, "epoch": 4160} {"train_loss": -26.149824142456055, "global_step": 345348, "epoch": 4160} {"train_loss": -26.349578857421875, "global_step": 345349, "epoch": 4160} {"train_loss": -26.10395622253418, "global_step": 345350, "epoch": 4160} {"train_loss": -25.730377197265625, "global_step": 345351, "epoch": 4160} {"train_loss": -26.22576332092285, "global_step": 345352, "epoch": 4160} {"train_loss": -26.199316024780273, "global_step": 345353, "epoch": 4160} {"train_loss": -26.208921432495117, "global_step": 345354, "epoch": 4160} {"train_loss": -26.176105499267578, "global_step": 345355, "epoch": 4160} {"train_loss": -26.1001033782959, "global_step": 345356, "epoch": 4160} {"train_loss": -26.24799919128418, "global_step": 345357, "epoch": 4160} {"train_loss": -26.08514976501465, "global_step": 345358, "epoch": 4160} {"train_loss": -26.14246940612793, "global_step": 345359, "epoch": 4160} {"train_loss": -26.330350875854492, "global_step": 345360, "epoch": 4160} {"train_loss": -25.888879776000977, "global_step": 345361, "epoch": 4160} {"train_loss": -25.99973621138607, "global_step": 345362, "epoch": 4160, "val_loss": 6591534.0} {"train_loss": -25.4869384765625, "global_step": 345363, "epoch": 4161} {"train_loss": -25.76630973815918, "global_step": 345364, "epoch": 4161} {"train_loss": -26.21612548828125, "global_step": 345365, "epoch": 4161} {"train_loss": -25.582420349121094, "global_step": 345366, "epoch": 4161} {"train_loss": -26.1724796295166, "global_step": 345367, "epoch": 4161} {"train_loss": -25.718154907226562, "global_step": 345368, "epoch": 4161} {"train_loss": -25.65290641784668, "global_step": 345369, "epoch": 4161} {"train_loss": -25.563474655151367, "global_step": 345370, "epoch": 4161} {"train_loss": -25.860260009765625, "global_step": 345371, "epoch": 4161} {"train_loss": -25.989521026611328, "global_step": 345372, "epoch": 4161} {"train_loss": -26.192651748657227, "global_step": 345373, "epoch": 4161} {"train_loss": -25.6779727935791, "global_step": 345374, "epoch": 4161} {"train_loss": -25.621173858642578, "global_step": 345375, "epoch": 4161} {"train_loss": -26.08786392211914, "global_step": 345376, "epoch": 4161} {"train_loss": -25.348112106323242, "global_step": 345377, "epoch": 4161} {"train_loss": -25.963550567626953, "global_step": 345378, "epoch": 4161} {"train_loss": -25.453704833984375, "global_step": 345379, "epoch": 4161} {"train_loss": -25.7974853515625, "global_step": 345380, "epoch": 4161} {"train_loss": -26.082382202148438, "global_step": 345381, "epoch": 4161} {"train_loss": -25.719518661499023, "global_step": 345382, "epoch": 4161} {"train_loss": -25.883779525756836, "global_step": 345383, "epoch": 4161} {"train_loss": -26.174015045166016, "global_step": 345384, "epoch": 4161} {"train_loss": -25.788660049438477, "global_step": 345385, "epoch": 4161} {"train_loss": -26.187353134155273, "global_step": 345386, "epoch": 4161} {"train_loss": -26.462873458862305, "global_step": 345387, "epoch": 4161} {"train_loss": -26.165363311767578, "global_step": 345388, "epoch": 4161} {"train_loss": -25.82322120666504, "global_step": 345389, "epoch": 4161} {"train_loss": -26.06418228149414, "global_step": 345390, "epoch": 4161} {"train_loss": -26.06959342956543, "global_step": 345391, "epoch": 4161} {"train_loss": -26.086999893188477, "global_step": 345392, "epoch": 4161} {"train_loss": -26.160232543945312, "global_step": 345393, "epoch": 4161} {"train_loss": -26.102548599243164, "global_step": 345394, "epoch": 4161} {"train_loss": -26.239913940429688, "global_step": 345395, "epoch": 4161} {"train_loss": -26.3635196685791, "global_step": 345396, "epoch": 4161} {"train_loss": -26.141538619995117, "global_step": 345397, "epoch": 4161} {"train_loss": -26.192676544189453, "global_step": 345398, "epoch": 4161} {"train_loss": -25.9942684173584, "global_step": 345399, "epoch": 4161} {"train_loss": -26.192148208618164, "global_step": 345400, "epoch": 4161} {"train_loss": -26.61716651916504, "global_step": 345401, "epoch": 4161} {"train_loss": -25.91729736328125, "global_step": 345402, "epoch": 4161} {"train_loss": -26.03677749633789, "global_step": 345403, "epoch": 4161} {"train_loss": -26.306379318237305, "global_step": 345404, "epoch": 4161} {"train_loss": -26.2205810546875, "global_step": 345405, "epoch": 4161} {"train_loss": -26.49114418029785, "global_step": 345406, "epoch": 4161} {"train_loss": -26.23597526550293, "global_step": 345407, "epoch": 4161} {"train_loss": -26.2238826751709, "global_step": 345408, "epoch": 4161} {"train_loss": -26.224576950073242, "global_step": 345409, "epoch": 4161} {"train_loss": -26.220539093017578, "global_step": 345410, "epoch": 4161} {"train_loss": -26.00308609008789, "global_step": 345411, "epoch": 4161} {"train_loss": -26.142114639282227, "global_step": 345412, "epoch": 4161} {"train_loss": -26.28354263305664, "global_step": 345413, "epoch": 4161} {"train_loss": -26.079980850219727, "global_step": 345414, "epoch": 4161} {"train_loss": -26.17641258239746, "global_step": 345415, "epoch": 4161} {"train_loss": -26.60003089904785, "global_step": 345416, "epoch": 4161} {"train_loss": -26.236597061157227, "global_step": 345417, "epoch": 4161} {"train_loss": -26.475797653198242, "global_step": 345418, "epoch": 4161} {"train_loss": -26.617145538330078, "global_step": 345419, "epoch": 4161} {"train_loss": -26.4845027923584, "global_step": 345420, "epoch": 4161} {"train_loss": -26.526172637939453, "global_step": 345421, "epoch": 4161} {"train_loss": -26.213525772094727, "global_step": 345422, "epoch": 4161} {"train_loss": -26.332311630249023, "global_step": 345423, "epoch": 4161} {"train_loss": -26.425403594970703, "global_step": 345424, "epoch": 4161} {"train_loss": -26.198694229125977, "global_step": 345425, "epoch": 4161} {"train_loss": -26.24382972717285, "global_step": 345426, "epoch": 4161} {"train_loss": -26.26372718811035, "global_step": 345427, "epoch": 4161} {"train_loss": -26.25931739807129, "global_step": 345428, "epoch": 4161} {"train_loss": -26.296106338500977, "global_step": 345429, "epoch": 4161} {"train_loss": -26.112165451049805, "global_step": 345430, "epoch": 4161} {"train_loss": -26.268335342407227, "global_step": 345431, "epoch": 4161} {"train_loss": -26.424060821533203, "global_step": 345432, "epoch": 4161} {"train_loss": -26.335229873657227, "global_step": 345433, "epoch": 4161} {"train_loss": -26.305225372314453, "global_step": 345434, "epoch": 4161} {"train_loss": -25.933820724487305, "global_step": 345435, "epoch": 4161} {"train_loss": -25.829761505126953, "global_step": 345436, "epoch": 4161} {"train_loss": -26.091100692749023, "global_step": 345437, "epoch": 4161} {"train_loss": -25.526479721069336, "global_step": 345438, "epoch": 4161} {"train_loss": -25.81268882751465, "global_step": 345439, "epoch": 4161} {"train_loss": -26.204395294189453, "global_step": 345440, "epoch": 4161} {"train_loss": -26.429859161376953, "global_step": 345441, "epoch": 4161} {"train_loss": -25.91948890686035, "global_step": 345442, "epoch": 4161} {"train_loss": -26.402673721313477, "global_step": 345443, "epoch": 4161} {"train_loss": -26.301227569580078, "global_step": 345444, "epoch": 4161} {"train_loss": -26.110884172370636, "global_step": 345445, "epoch": 4161, "val_loss": 6571023.0} {"train_loss": -24.925296783447266, "global_step": 345446, "epoch": 4162} {"train_loss": -25.093400955200195, "global_step": 345447, "epoch": 4162} {"train_loss": -25.228242874145508, "global_step": 345448, "epoch": 4162} {"train_loss": -25.301740646362305, "global_step": 345449, "epoch": 4162} {"train_loss": -25.756641387939453, "global_step": 345450, "epoch": 4162} {"train_loss": -25.383686065673828, "global_step": 345451, "epoch": 4162} {"train_loss": -25.545812606811523, "global_step": 345452, "epoch": 4162} {"train_loss": -25.642499923706055, "global_step": 345453, "epoch": 4162} {"train_loss": -25.79608154296875, "global_step": 345454, "epoch": 4162} {"train_loss": -25.695016860961914, "global_step": 345455, "epoch": 4162} {"train_loss": -25.518606185913086, "global_step": 345456, "epoch": 4162} {"train_loss": -25.592300415039062, "global_step": 345457, "epoch": 4162} {"train_loss": -25.94422721862793, "global_step": 345458, "epoch": 4162} {"train_loss": -25.46345329284668, "global_step": 345459, "epoch": 4162} {"train_loss": -25.542482376098633, "global_step": 345460, "epoch": 4162} {"train_loss": -25.844465255737305, "global_step": 345461, "epoch": 4162} {"train_loss": -25.598346710205078, "global_step": 345462, "epoch": 4162} {"train_loss": -25.81452751159668, "global_step": 345463, "epoch": 4162} {"train_loss": -25.451337814331055, "global_step": 345464, "epoch": 4162} {"train_loss": -25.60100746154785, "global_step": 345465, "epoch": 4162} {"train_loss": -25.784351348876953, "global_step": 345466, "epoch": 4162} {"train_loss": -25.98707389831543, "global_step": 345467, "epoch": 4162} {"train_loss": -25.810766220092773, "global_step": 345468, "epoch": 4162} {"train_loss": -25.604202270507812, "global_step": 345469, "epoch": 4162} {"train_loss": -25.676559448242188, "global_step": 345470, "epoch": 4162} {"train_loss": -25.717716217041016, "global_step": 345471, "epoch": 4162} {"train_loss": -26.033781051635742, "global_step": 345472, "epoch": 4162} {"train_loss": -26.4665470123291, "global_step": 345473, "epoch": 4162} {"train_loss": -26.064218521118164, "global_step": 345474, "epoch": 4162} {"train_loss": -25.994159698486328, "global_step": 345475, "epoch": 4162} {"train_loss": -25.85627555847168, "global_step": 345476, "epoch": 4162} {"train_loss": -26.053369522094727, "global_step": 345477, "epoch": 4162} {"train_loss": -26.01835060119629, "global_step": 345478, "epoch": 4162} {"train_loss": -26.1608829498291, "global_step": 345479, "epoch": 4162} {"train_loss": -26.424467086791992, "global_step": 345480, "epoch": 4162} {"train_loss": -25.846887588500977, "global_step": 345481, "epoch": 4162} {"train_loss": -25.968616485595703, "global_step": 345482, "epoch": 4162} {"train_loss": -25.924457550048828, "global_step": 345483, "epoch": 4162} {"train_loss": -26.128528594970703, "global_step": 345484, "epoch": 4162} {"train_loss": -26.084009170532227, "global_step": 345485, "epoch": 4162} {"train_loss": -26.3092041015625, "global_step": 345486, "epoch": 4162} {"train_loss": -26.535837173461914, "global_step": 345487, "epoch": 4162} {"train_loss": -25.93623161315918, "global_step": 345488, "epoch": 4162} {"train_loss": -25.95550537109375, "global_step": 345489, "epoch": 4162} {"train_loss": -26.326711654663086, "global_step": 345490, "epoch": 4162} {"train_loss": -26.08807945251465, "global_step": 345491, "epoch": 4162} {"train_loss": -26.241180419921875, "global_step": 345492, "epoch": 4162} {"train_loss": -26.282560348510742, "global_step": 345493, "epoch": 4162} {"train_loss": -26.269983291625977, "global_step": 345494, "epoch": 4162} {"train_loss": -26.40850257873535, "global_step": 345495, "epoch": 4162} {"train_loss": -26.287872314453125, "global_step": 345496, "epoch": 4162} {"train_loss": -26.352949142456055, "global_step": 345497, "epoch": 4162} {"train_loss": -26.18332862854004, "global_step": 345498, "epoch": 4162} {"train_loss": -26.09041404724121, "global_step": 345499, "epoch": 4162} {"train_loss": -26.34661293029785, "global_step": 345500, "epoch": 4162} {"train_loss": -26.38376235961914, "global_step": 345501, "epoch": 4162} {"train_loss": -26.27972984313965, "global_step": 345502, "epoch": 4162} {"train_loss": -25.927810668945312, "global_step": 345503, "epoch": 4162} {"train_loss": -26.34107780456543, "global_step": 345504, "epoch": 4162} {"train_loss": -26.004507064819336, "global_step": 345505, "epoch": 4162} {"train_loss": -26.2960262298584, "global_step": 345506, "epoch": 4162} {"train_loss": -25.935094833374023, "global_step": 345507, "epoch": 4162} {"train_loss": -26.06056022644043, "global_step": 345508, "epoch": 4162} {"train_loss": -26.01544761657715, "global_step": 345509, "epoch": 4162} {"train_loss": -26.2884521484375, "global_step": 345510, "epoch": 4162} {"train_loss": -26.201690673828125, "global_step": 345511, "epoch": 4162} {"train_loss": -26.33561134338379, "global_step": 345512, "epoch": 4162} {"train_loss": -25.458343505859375, "global_step": 345513, "epoch": 4162} {"train_loss": -25.882949829101562, "global_step": 345514, "epoch": 4162} {"train_loss": -25.664630889892578, "global_step": 345515, "epoch": 4162} {"train_loss": -26.250341415405273, "global_step": 345516, "epoch": 4162} {"train_loss": -25.8551082611084, "global_step": 345517, "epoch": 4162} {"train_loss": -26.25730323791504, "global_step": 345518, "epoch": 4162} {"train_loss": -26.3512020111084, "global_step": 345519, "epoch": 4162} {"train_loss": -25.90372085571289, "global_step": 345520, "epoch": 4162} {"train_loss": -25.929494857788086, "global_step": 345521, "epoch": 4162} {"train_loss": -26.140644073486328, "global_step": 345522, "epoch": 4162} {"train_loss": -25.807737350463867, "global_step": 345523, "epoch": 4162} {"train_loss": -25.984298706054688, "global_step": 345524, "epoch": 4162} {"train_loss": -25.777673721313477, "global_step": 345525, "epoch": 4162} {"train_loss": -26.088346481323242, "global_step": 345526, "epoch": 4162} {"train_loss": -25.570837020874023, "global_step": 345527, "epoch": 4162} {"train_loss": -25.90900609579431, "global_step": 345528, "epoch": 4162, "val_loss": 6598561.5} {"train_loss": -24.320646286010742, "global_step": 345529, "epoch": 4163} {"train_loss": -24.619421005249023, "global_step": 345530, "epoch": 4163} {"train_loss": -25.84479331970215, "global_step": 345531, "epoch": 4163} {"train_loss": -24.8968563079834, "global_step": 345532, "epoch": 4163} {"train_loss": -24.91632652282715, "global_step": 345533, "epoch": 4163} {"train_loss": -25.161956787109375, "global_step": 345534, "epoch": 4163} {"train_loss": -24.89575958251953, "global_step": 345535, "epoch": 4163} {"train_loss": -25.627248764038086, "global_step": 345536, "epoch": 4163} {"train_loss": -25.046091079711914, "global_step": 345537, "epoch": 4163} {"train_loss": -25.38081932067871, "global_step": 345538, "epoch": 4163} {"train_loss": -25.685888290405273, "global_step": 345539, "epoch": 4163} {"train_loss": -25.502216339111328, "global_step": 345540, "epoch": 4163} {"train_loss": -24.936105728149414, "global_step": 345541, "epoch": 4163} {"train_loss": -25.363367080688477, "global_step": 345542, "epoch": 4163} {"train_loss": -25.5434513092041, "global_step": 345543, "epoch": 4163} {"train_loss": -25.607065200805664, "global_step": 345544, "epoch": 4163} {"train_loss": -25.482940673828125, "global_step": 345545, "epoch": 4163} {"train_loss": -25.782428741455078, "global_step": 345546, "epoch": 4163} {"train_loss": -25.493528366088867, "global_step": 345547, "epoch": 4163} {"train_loss": -25.48492431640625, "global_step": 345548, "epoch": 4163} {"train_loss": -25.394861221313477, "global_step": 345549, "epoch": 4163} {"train_loss": -25.614721298217773, "global_step": 345550, "epoch": 4163} {"train_loss": -25.739145278930664, "global_step": 345551, "epoch": 4163} {"train_loss": -25.520750045776367, "global_step": 345552, "epoch": 4163} {"train_loss": -25.76716423034668, "global_step": 345553, "epoch": 4163} {"train_loss": -25.834333419799805, "global_step": 345554, "epoch": 4163} {"train_loss": -26.00615882873535, "global_step": 345555, "epoch": 4163} {"train_loss": -25.8631649017334, "global_step": 345556, "epoch": 4163} {"train_loss": -26.064870834350586, "global_step": 345557, "epoch": 4163} {"train_loss": -26.237964630126953, "global_step": 345558, "epoch": 4163} {"train_loss": -25.783979415893555, "global_step": 345559, "epoch": 4163} {"train_loss": -26.118860244750977, "global_step": 345560, "epoch": 4163} {"train_loss": -25.741912841796875, "global_step": 345561, "epoch": 4163} {"train_loss": -25.906330108642578, "global_step": 345562, "epoch": 4163} {"train_loss": -26.341779708862305, "global_step": 345563, "epoch": 4163} {"train_loss": -25.711206436157227, "global_step": 345564, "epoch": 4163} {"train_loss": -26.126550674438477, "global_step": 345565, "epoch": 4163} {"train_loss": -26.14137077331543, "global_step": 345566, "epoch": 4163} {"train_loss": -26.137226104736328, "global_step": 345567, "epoch": 4163} {"train_loss": -26.211416244506836, "global_step": 345568, "epoch": 4163} {"train_loss": -26.70119285583496, "global_step": 345569, "epoch": 4163} {"train_loss": -26.343603134155273, "global_step": 345570, "epoch": 4163} {"train_loss": -26.107202529907227, "global_step": 345571, "epoch": 4163} {"train_loss": -25.934986114501953, "global_step": 345572, "epoch": 4163} {"train_loss": -26.520483016967773, "global_step": 345573, "epoch": 4163} {"train_loss": -26.541595458984375, "global_step": 345574, "epoch": 4163} {"train_loss": -26.2900333404541, "global_step": 345575, "epoch": 4163} {"train_loss": -26.413135528564453, "global_step": 345576, "epoch": 4163} {"train_loss": -26.102746963500977, "global_step": 345577, "epoch": 4163} {"train_loss": -26.06485939025879, "global_step": 345578, "epoch": 4163} {"train_loss": -26.147689819335938, "global_step": 345579, "epoch": 4163} {"train_loss": -26.1462345123291, "global_step": 345580, "epoch": 4163} {"train_loss": -26.501073837280273, "global_step": 345581, "epoch": 4163} {"train_loss": -26.095600128173828, "global_step": 345582, "epoch": 4163} {"train_loss": -26.23345947265625, "global_step": 345583, "epoch": 4163} {"train_loss": -26.331689834594727, "global_step": 345584, "epoch": 4163} {"train_loss": -26.225141525268555, "global_step": 345585, "epoch": 4163} {"train_loss": -25.92482566833496, "global_step": 345586, "epoch": 4163} {"train_loss": -26.28883171081543, "global_step": 345587, "epoch": 4163} {"train_loss": -26.559314727783203, "global_step": 345588, "epoch": 4163} {"train_loss": -26.202184677124023, "global_step": 345589, "epoch": 4163} {"train_loss": -26.360004425048828, "global_step": 345590, "epoch": 4163} {"train_loss": -25.897815704345703, "global_step": 345591, "epoch": 4163} {"train_loss": -26.14613151550293, "global_step": 345592, "epoch": 4163} {"train_loss": -26.056884765625, "global_step": 345593, "epoch": 4163} {"train_loss": -26.336713790893555, "global_step": 345594, "epoch": 4163} {"train_loss": -25.993793487548828, "global_step": 345595, "epoch": 4163} {"train_loss": -26.525653839111328, "global_step": 345596, "epoch": 4163} {"train_loss": -26.40677261352539, "global_step": 345597, "epoch": 4163} {"train_loss": -26.068130493164062, "global_step": 345598, "epoch": 4163} {"train_loss": -26.176467895507812, "global_step": 345599, "epoch": 4163} {"train_loss": -26.167022705078125, "global_step": 345600, "epoch": 4163} {"train_loss": -26.00608253479004, "global_step": 345601, "epoch": 4163} {"train_loss": -26.264074325561523, "global_step": 345602, "epoch": 4163} {"train_loss": -26.448225021362305, "global_step": 345603, "epoch": 4163} {"train_loss": -26.083221435546875, "global_step": 345604, "epoch": 4163} {"train_loss": -26.068252563476562, "global_step": 345605, "epoch": 4163} {"train_loss": -26.260486602783203, "global_step": 345606, "epoch": 4163} {"train_loss": -26.512853622436523, "global_step": 345607, "epoch": 4163} {"train_loss": -26.03672218322754, "global_step": 345608, "epoch": 4163} {"train_loss": -26.1798038482666, "global_step": 345609, "epoch": 4163} {"train_loss": -25.90779685974121, "global_step": 345610, "epoch": 4163} {"train_loss": -25.90738066707749, "global_step": 345611, "epoch": 4163, "val_loss": 6598457.0} {"train_loss": -21.628122329711914, "global_step": 345612, "epoch": 4164} {"train_loss": -20.0191707611084, "global_step": 345613, "epoch": 4164} {"train_loss": -23.26865577697754, "global_step": 345614, "epoch": 4164} {"train_loss": -23.886001586914062, "global_step": 345615, "epoch": 4164} {"train_loss": -23.248762130737305, "global_step": 345616, "epoch": 4164} {"train_loss": -23.90790367126465, "global_step": 345617, "epoch": 4164} {"train_loss": -24.572484970092773, "global_step": 345618, "epoch": 4164} {"train_loss": -24.598737716674805, "global_step": 345619, "epoch": 4164} {"train_loss": -24.775815963745117, "global_step": 345620, "epoch": 4164} {"train_loss": -24.398405075073242, "global_step": 345621, "epoch": 4164} {"train_loss": -24.779897689819336, "global_step": 345622, "epoch": 4164} {"train_loss": -24.231557846069336, "global_step": 345623, "epoch": 4164} {"train_loss": -24.445833206176758, "global_step": 345624, "epoch": 4164} {"train_loss": -24.769062042236328, "global_step": 345625, "epoch": 4164} {"train_loss": -25.053390502929688, "global_step": 345626, "epoch": 4164} {"train_loss": -25.196582794189453, "global_step": 345627, "epoch": 4164} {"train_loss": -24.90437889099121, "global_step": 345628, "epoch": 4164} {"train_loss": -24.9243106842041, "global_step": 345629, "epoch": 4164} {"train_loss": -25.097253799438477, "global_step": 345630, "epoch": 4164} {"train_loss": -24.843982696533203, "global_step": 345631, "epoch": 4164} {"train_loss": -25.25080108642578, "global_step": 345632, "epoch": 4164} {"train_loss": -24.799409866333008, "global_step": 345633, "epoch": 4164} {"train_loss": -24.978376388549805, "global_step": 345634, "epoch": 4164} {"train_loss": -25.31380271911621, "global_step": 345635, "epoch": 4164} {"train_loss": -25.406097412109375, "global_step": 345636, "epoch": 4164} {"train_loss": -25.364484786987305, "global_step": 345637, "epoch": 4164} {"train_loss": -25.199411392211914, "global_step": 345638, "epoch": 4164} {"train_loss": -25.515676498413086, "global_step": 345639, "epoch": 4164} {"train_loss": -25.70428466796875, "global_step": 345640, "epoch": 4164} {"train_loss": -25.423809051513672, "global_step": 345641, "epoch": 4164} {"train_loss": -25.28702163696289, "global_step": 345642, "epoch": 4164} {"train_loss": -25.64170265197754, "global_step": 345643, "epoch": 4164} {"train_loss": -25.279695510864258, "global_step": 345644, "epoch": 4164} {"train_loss": -25.486494064331055, "global_step": 345645, "epoch": 4164} {"train_loss": -25.785593032836914, "global_step": 345646, "epoch": 4164} {"train_loss": -25.45425796508789, "global_step": 345647, "epoch": 4164} {"train_loss": -26.040699005126953, "global_step": 345648, "epoch": 4164} {"train_loss": -25.839405059814453, "global_step": 345649, "epoch": 4164} {"train_loss": -25.728559494018555, "global_step": 345650, "epoch": 4164} {"train_loss": -25.964624404907227, "global_step": 345651, "epoch": 4164} {"train_loss": -25.716455459594727, "global_step": 345652, "epoch": 4164} {"train_loss": -26.018457412719727, "global_step": 345653, "epoch": 4164} {"train_loss": -25.79981803894043, "global_step": 345654, "epoch": 4164} {"train_loss": -25.985767364501953, "global_step": 345655, "epoch": 4164} {"train_loss": -25.828115463256836, "global_step": 345656, "epoch": 4164} {"train_loss": -26.090106964111328, "global_step": 345657, "epoch": 4164} {"train_loss": -26.204526901245117, "global_step": 345658, "epoch": 4164} {"train_loss": -25.84498405456543, "global_step": 345659, "epoch": 4164} {"train_loss": -26.333087921142578, "global_step": 345660, "epoch": 4164} {"train_loss": -25.999242782592773, "global_step": 345661, "epoch": 4164} {"train_loss": -26.183246612548828, "global_step": 345662, "epoch": 4164} {"train_loss": -25.856403350830078, "global_step": 345663, "epoch": 4164} {"train_loss": -25.99240493774414, "global_step": 345664, "epoch": 4164} {"train_loss": -26.53510093688965, "global_step": 345665, "epoch": 4164} {"train_loss": -26.18900489807129, "global_step": 345666, "epoch": 4164} {"train_loss": -26.191421508789062, "global_step": 345667, "epoch": 4164} {"train_loss": -26.12636375427246, "global_step": 345668, "epoch": 4164} {"train_loss": -26.239160537719727, "global_step": 345669, "epoch": 4164} {"train_loss": -25.991674423217773, "global_step": 345670, "epoch": 4164} {"train_loss": -26.1691837310791, "global_step": 345671, "epoch": 4164} {"train_loss": -26.250049591064453, "global_step": 345672, "epoch": 4164} {"train_loss": -26.645544052124023, "global_step": 345673, "epoch": 4164} {"train_loss": -26.116769790649414, "global_step": 345674, "epoch": 4164} {"train_loss": -26.381977081298828, "global_step": 345675, "epoch": 4164} {"train_loss": -26.131277084350586, "global_step": 345676, "epoch": 4164} {"train_loss": -26.164661407470703, "global_step": 345677, "epoch": 4164} {"train_loss": -26.25821304321289, "global_step": 345678, "epoch": 4164} {"train_loss": -26.263486862182617, "global_step": 345679, "epoch": 4164} {"train_loss": -26.350833892822266, "global_step": 345680, "epoch": 4164} {"train_loss": -26.159467697143555, "global_step": 345681, "epoch": 4164} {"train_loss": -26.249235153198242, "global_step": 345682, "epoch": 4164} {"train_loss": -26.237777709960938, "global_step": 345683, "epoch": 4164} {"train_loss": -26.38519287109375, "global_step": 345684, "epoch": 4164} {"train_loss": -26.38775634765625, "global_step": 345685, "epoch": 4164} {"train_loss": -26.3319034576416, "global_step": 345686, "epoch": 4164} {"train_loss": -26.090911865234375, "global_step": 345687, "epoch": 4164} {"train_loss": -26.364898681640625, "global_step": 345688, "epoch": 4164} {"train_loss": -26.13360595703125, "global_step": 345689, "epoch": 4164} {"train_loss": -26.224706649780273, "global_step": 345690, "epoch": 4164} {"train_loss": -26.179235458374023, "global_step": 345691, "epoch": 4164} {"train_loss": -26.0443058013916, "global_step": 345692, "epoch": 4164} {"train_loss": -26.454395294189453, "global_step": 345693, "epoch": 4164} {"train_loss": -25.504061250801545, "global_step": 345694, "epoch": 4164, "val_loss": 6560277.0} {"train_loss": -25.8112850189209, "global_step": 345695, "epoch": 4165} {"train_loss": -25.796438217163086, "global_step": 345696, "epoch": 4165} {"train_loss": -26.0098934173584, "global_step": 345697, "epoch": 4165} {"train_loss": -26.100513458251953, "global_step": 345698, "epoch": 4165} {"train_loss": -25.85944938659668, "global_step": 345699, "epoch": 4165} {"train_loss": -26.364038467407227, "global_step": 345700, "epoch": 4165} {"train_loss": -26.119497299194336, "global_step": 345701, "epoch": 4165} {"train_loss": -26.329492568969727, "global_step": 345702, "epoch": 4165} {"train_loss": -25.578731536865234, "global_step": 345703, "epoch": 4165} {"train_loss": -26.08609390258789, "global_step": 345704, "epoch": 4165} {"train_loss": -25.885313034057617, "global_step": 345705, "epoch": 4165} {"train_loss": -26.093093872070312, "global_step": 345706, "epoch": 4165} {"train_loss": -26.110498428344727, "global_step": 345707, "epoch": 4165} {"train_loss": -26.392353057861328, "global_step": 345708, "epoch": 4165} {"train_loss": -26.19343376159668, "global_step": 345709, "epoch": 4165} {"train_loss": -26.21070671081543, "global_step": 345710, "epoch": 4165} {"train_loss": -26.23200798034668, "global_step": 345711, "epoch": 4165} {"train_loss": -25.81709098815918, "global_step": 345712, "epoch": 4165} {"train_loss": -25.968521118164062, "global_step": 345713, "epoch": 4165} {"train_loss": -25.994903564453125, "global_step": 345714, "epoch": 4165} {"train_loss": -25.6447696685791, "global_step": 345715, "epoch": 4165} {"train_loss": -26.595951080322266, "global_step": 345716, "epoch": 4165} {"train_loss": -26.530073165893555, "global_step": 345717, "epoch": 4165} {"train_loss": -25.91556739807129, "global_step": 345718, "epoch": 4165} {"train_loss": -25.99775505065918, "global_step": 345719, "epoch": 4165} {"train_loss": -26.445831298828125, "global_step": 345720, "epoch": 4165} {"train_loss": -26.197473526000977, "global_step": 345721, "epoch": 4165} {"train_loss": -25.519168853759766, "global_step": 345722, "epoch": 4165} {"train_loss": -25.718175888061523, "global_step": 345723, "epoch": 4165} {"train_loss": -26.393735885620117, "global_step": 345724, "epoch": 4165} {"train_loss": -26.199024200439453, "global_step": 345725, "epoch": 4165} {"train_loss": -26.055402755737305, "global_step": 345726, "epoch": 4165} {"train_loss": -26.318710327148438, "global_step": 345727, "epoch": 4165} {"train_loss": -26.251739501953125, "global_step": 345728, "epoch": 4165} {"train_loss": -26.586057662963867, "global_step": 345729, "epoch": 4165} {"train_loss": -25.8574161529541, "global_step": 345730, "epoch": 4165} {"train_loss": -26.167606353759766, "global_step": 345731, "epoch": 4165} {"train_loss": -26.22047233581543, "global_step": 345732, "epoch": 4165} {"train_loss": -26.03822135925293, "global_step": 345733, "epoch": 4165} {"train_loss": -25.869871139526367, "global_step": 345734, "epoch": 4165} {"train_loss": -26.183380126953125, "global_step": 345735, "epoch": 4165} {"train_loss": -26.2105770111084, "global_step": 345736, "epoch": 4165} {"train_loss": -26.058073043823242, "global_step": 345737, "epoch": 4165} {"train_loss": -26.49579429626465, "global_step": 345738, "epoch": 4165} {"train_loss": -25.824176788330078, "global_step": 345739, "epoch": 4165} {"train_loss": -26.064895629882812, "global_step": 345740, "epoch": 4165} {"train_loss": -26.028173446655273, "global_step": 345741, "epoch": 4165} {"train_loss": -26.07996940612793, "global_step": 345742, "epoch": 4165} {"train_loss": -25.88730239868164, "global_step": 345743, "epoch": 4165} {"train_loss": -26.343765258789062, "global_step": 345744, "epoch": 4165} {"train_loss": -25.992084503173828, "global_step": 345745, "epoch": 4165} {"train_loss": -25.590763092041016, "global_step": 345746, "epoch": 4165} {"train_loss": -26.044998168945312, "global_step": 345747, "epoch": 4165} {"train_loss": -25.99065589904785, "global_step": 345748, "epoch": 4165} {"train_loss": -26.177021026611328, "global_step": 345749, "epoch": 4165} {"train_loss": -26.311267852783203, "global_step": 345750, "epoch": 4165} {"train_loss": -26.085718154907227, "global_step": 345751, "epoch": 4165} {"train_loss": -25.992658615112305, "global_step": 345752, "epoch": 4165} {"train_loss": -25.877185821533203, "global_step": 345753, "epoch": 4165} {"train_loss": -26.280902862548828, "global_step": 345754, "epoch": 4165} {"train_loss": -26.13447380065918, "global_step": 345755, "epoch": 4165} {"train_loss": -26.179733276367188, "global_step": 345756, "epoch": 4165} {"train_loss": -26.114721298217773, "global_step": 345757, "epoch": 4165} {"train_loss": -26.4282283782959, "global_step": 345758, "epoch": 4165} {"train_loss": -26.221715927124023, "global_step": 345759, "epoch": 4165} {"train_loss": -26.29437828063965, "global_step": 345760, "epoch": 4165} {"train_loss": -26.154666900634766, "global_step": 345761, "epoch": 4165} {"train_loss": -26.3259220123291, "global_step": 345762, "epoch": 4165} {"train_loss": -26.219812393188477, "global_step": 345763, "epoch": 4165} {"train_loss": -26.135873794555664, "global_step": 345764, "epoch": 4165} {"train_loss": -26.1833438873291, "global_step": 345765, "epoch": 4165} {"train_loss": -26.208539962768555, "global_step": 345766, "epoch": 4165} {"train_loss": -26.126754760742188, "global_step": 345767, "epoch": 4165} {"train_loss": -25.777286529541016, "global_step": 345768, "epoch": 4165} {"train_loss": -26.1292781829834, "global_step": 345769, "epoch": 4165} {"train_loss": -25.8764705657959, "global_step": 345770, "epoch": 4165} {"train_loss": -26.41591453552246, "global_step": 345771, "epoch": 4165} {"train_loss": -26.287195205688477, "global_step": 345772, "epoch": 4165} {"train_loss": -26.3748836517334, "global_step": 345773, "epoch": 4165} {"train_loss": -26.08942985534668, "global_step": 345774, "epoch": 4165} {"train_loss": -26.463886260986328, "global_step": 345775, "epoch": 4165} {"train_loss": -26.220014572143555, "global_step": 345776, "epoch": 4165} {"train_loss": -26.126346128532685, "global_step": 345777, "epoch": 4165, "val_loss": 6527065.5} {"train_loss": -25.275497436523438, "global_step": 345778, "epoch": 4166} {"train_loss": -25.3005313873291, "global_step": 345779, "epoch": 4166} {"train_loss": -25.701263427734375, "global_step": 345780, "epoch": 4166} {"train_loss": -25.1676082611084, "global_step": 345781, "epoch": 4166} {"train_loss": -25.6984806060791, "global_step": 345782, "epoch": 4166} {"train_loss": -25.959625244140625, "global_step": 345783, "epoch": 4166} {"train_loss": -25.694721221923828, "global_step": 345784, "epoch": 4166} {"train_loss": -25.747961044311523, "global_step": 345785, "epoch": 4166} {"train_loss": -26.028295516967773, "global_step": 345786, "epoch": 4166} {"train_loss": -25.762243270874023, "global_step": 345787, "epoch": 4166} {"train_loss": -26.10438346862793, "global_step": 345788, "epoch": 4166} {"train_loss": -25.84408950805664, "global_step": 345789, "epoch": 4166} {"train_loss": -25.75798988342285, "global_step": 345790, "epoch": 4166} {"train_loss": -26.371597290039062, "global_step": 345791, "epoch": 4166} {"train_loss": -26.059839248657227, "global_step": 345792, "epoch": 4166} {"train_loss": -25.92315673828125, "global_step": 345793, "epoch": 4166} {"train_loss": -25.756582260131836, "global_step": 345794, "epoch": 4166} {"train_loss": -26.102293014526367, "global_step": 345795, "epoch": 4166} {"train_loss": -26.009769439697266, "global_step": 345796, "epoch": 4166} {"train_loss": -25.81233787536621, "global_step": 345797, "epoch": 4166} {"train_loss": -25.727924346923828, "global_step": 345798, "epoch": 4166} {"train_loss": -25.979965209960938, "global_step": 345799, "epoch": 4166} {"train_loss": -26.036909103393555, "global_step": 345800, "epoch": 4166} {"train_loss": -26.06471061706543, "global_step": 345801, "epoch": 4166} {"train_loss": -25.92719078063965, "global_step": 345802, "epoch": 4166} {"train_loss": -25.95867919921875, "global_step": 345803, "epoch": 4166} {"train_loss": -25.96808433532715, "global_step": 345804, "epoch": 4166} {"train_loss": -26.027099609375, "global_step": 345805, "epoch": 4166} {"train_loss": -26.002649307250977, "global_step": 345806, "epoch": 4166} {"train_loss": -25.941028594970703, "global_step": 345807, "epoch": 4166} {"train_loss": -26.627180099487305, "global_step": 345808, "epoch": 4166} {"train_loss": -26.228607177734375, "global_step": 345809, "epoch": 4166} {"train_loss": -26.395471572875977, "global_step": 345810, "epoch": 4166} {"train_loss": -25.93255615234375, "global_step": 345811, "epoch": 4166} {"train_loss": -26.152847290039062, "global_step": 345812, "epoch": 4166} {"train_loss": -25.836612701416016, "global_step": 345813, "epoch": 4166} {"train_loss": -26.388813018798828, "global_step": 345814, "epoch": 4166} {"train_loss": -26.586532592773438, "global_step": 345815, "epoch": 4166} {"train_loss": -26.089557647705078, "global_step": 345816, "epoch": 4166} {"train_loss": -25.871387481689453, "global_step": 345817, "epoch": 4166} {"train_loss": -26.621896743774414, "global_step": 345818, "epoch": 4166} {"train_loss": -26.16143798828125, "global_step": 345819, "epoch": 4166} {"train_loss": -26.082141876220703, "global_step": 345820, "epoch": 4166} {"train_loss": -26.50691032409668, "global_step": 345821, "epoch": 4166} {"train_loss": -26.13767433166504, "global_step": 345822, "epoch": 4166} {"train_loss": -26.122222900390625, "global_step": 345823, "epoch": 4166} {"train_loss": -26.33003807067871, "global_step": 345824, "epoch": 4166} {"train_loss": -25.9981632232666, "global_step": 345825, "epoch": 4166} {"train_loss": -26.206693649291992, "global_step": 345826, "epoch": 4166} {"train_loss": -26.171924591064453, "global_step": 345827, "epoch": 4166} {"train_loss": -26.03492546081543, "global_step": 345828, "epoch": 4166} {"train_loss": -26.040802001953125, "global_step": 345829, "epoch": 4166} {"train_loss": -25.95387077331543, "global_step": 345830, "epoch": 4166} {"train_loss": -25.93052101135254, "global_step": 345831, "epoch": 4166} {"train_loss": -25.406461715698242, "global_step": 345832, "epoch": 4166} {"train_loss": -25.950607299804688, "global_step": 345833, "epoch": 4166} {"train_loss": -26.51953125, "global_step": 345834, "epoch": 4166} {"train_loss": -25.95380973815918, "global_step": 345835, "epoch": 4166} {"train_loss": -26.271764755249023, "global_step": 345836, "epoch": 4166} {"train_loss": -26.20855140686035, "global_step": 345837, "epoch": 4166} {"train_loss": -26.207427978515625, "global_step": 345838, "epoch": 4166} {"train_loss": -26.294797897338867, "global_step": 345839, "epoch": 4166} {"train_loss": -26.412158966064453, "global_step": 345840, "epoch": 4166} {"train_loss": -25.969959259033203, "global_step": 345841, "epoch": 4166} {"train_loss": -25.943988800048828, "global_step": 345842, "epoch": 4166} {"train_loss": -26.34967041015625, "global_step": 345843, "epoch": 4166} {"train_loss": -25.926101684570312, "global_step": 345844, "epoch": 4166} {"train_loss": -26.2841739654541, "global_step": 345845, "epoch": 4166} {"train_loss": -25.878538131713867, "global_step": 345846, "epoch": 4166} {"train_loss": -25.99538230895996, "global_step": 345847, "epoch": 4166} {"train_loss": -26.11846351623535, "global_step": 345848, "epoch": 4166} {"train_loss": -26.08429527282715, "global_step": 345849, "epoch": 4166} {"train_loss": -26.2329158782959, "global_step": 345850, "epoch": 4166} {"train_loss": -26.38804054260254, "global_step": 345851, "epoch": 4166} {"train_loss": -25.97236442565918, "global_step": 345852, "epoch": 4166} {"train_loss": -25.802331924438477, "global_step": 345853, "epoch": 4166} {"train_loss": -26.297775268554688, "global_step": 345854, "epoch": 4166} {"train_loss": -26.29667091369629, "global_step": 345855, "epoch": 4166} {"train_loss": -26.025283813476562, "global_step": 345856, "epoch": 4166} {"train_loss": -25.678747177124023, "global_step": 345857, "epoch": 4166} {"train_loss": -26.218473434448242, "global_step": 345858, "epoch": 4166} {"train_loss": -25.880788803100586, "global_step": 345859, "epoch": 4166} {"train_loss": -26.041000343230834, "global_step": 345860, "epoch": 4166, "val_loss": 6567498.0} {"train_loss": -24.902067184448242, "global_step": 345861, "epoch": 4167} {"train_loss": -23.385637283325195, "global_step": 345862, "epoch": 4167} {"train_loss": -24.169513702392578, "global_step": 345863, "epoch": 4167} {"train_loss": -26.038909912109375, "global_step": 345864, "epoch": 4167} {"train_loss": -25.744033813476562, "global_step": 345865, "epoch": 4167} {"train_loss": -24.96744155883789, "global_step": 345866, "epoch": 4167} {"train_loss": -25.320594787597656, "global_step": 345867, "epoch": 4167} {"train_loss": -25.370222091674805, "global_step": 345868, "epoch": 4167} {"train_loss": -25.37589454650879, "global_step": 345869, "epoch": 4167} {"train_loss": -25.517398834228516, "global_step": 345870, "epoch": 4167} {"train_loss": -25.3103084564209, "global_step": 345871, "epoch": 4167} {"train_loss": -25.542953491210938, "global_step": 345872, "epoch": 4167} {"train_loss": -25.531091690063477, "global_step": 345873, "epoch": 4167} {"train_loss": -25.726612091064453, "global_step": 345874, "epoch": 4167} {"train_loss": -25.692472457885742, "global_step": 345875, "epoch": 4167} {"train_loss": -26.00836753845215, "global_step": 345876, "epoch": 4167} {"train_loss": -25.87955093383789, "global_step": 345877, "epoch": 4167} {"train_loss": -26.039457321166992, "global_step": 345878, "epoch": 4167} {"train_loss": -25.676776885986328, "global_step": 345879, "epoch": 4167} {"train_loss": -25.988073348999023, "global_step": 345880, "epoch": 4167} {"train_loss": -25.75834083557129, "global_step": 345881, "epoch": 4167} {"train_loss": -26.095544815063477, "global_step": 345882, "epoch": 4167} {"train_loss": -26.0191593170166, "global_step": 345883, "epoch": 4167} {"train_loss": -26.149560928344727, "global_step": 345884, "epoch": 4167} {"train_loss": -25.586896896362305, "global_step": 345885, "epoch": 4167} {"train_loss": -25.949939727783203, "global_step": 345886, "epoch": 4167} {"train_loss": -26.05234718322754, "global_step": 345887, "epoch": 4167} {"train_loss": -26.111143112182617, "global_step": 345888, "epoch": 4167} {"train_loss": -25.543659210205078, "global_step": 345889, "epoch": 4167} {"train_loss": -25.92084312438965, "global_step": 345890, "epoch": 4167} {"train_loss": -26.132705688476562, "global_step": 345891, "epoch": 4167} {"train_loss": -26.141021728515625, "global_step": 345892, "epoch": 4167} {"train_loss": -26.069202423095703, "global_step": 345893, "epoch": 4167} {"train_loss": -26.539411544799805, "global_step": 345894, "epoch": 4167} {"train_loss": -25.668760299682617, "global_step": 345895, "epoch": 4167} {"train_loss": -25.87106704711914, "global_step": 345896, "epoch": 4167} {"train_loss": -26.01533317565918, "global_step": 345897, "epoch": 4167} {"train_loss": -25.822046279907227, "global_step": 345898, "epoch": 4167} {"train_loss": -25.881744384765625, "global_step": 345899, "epoch": 4167} {"train_loss": -25.56556510925293, "global_step": 345900, "epoch": 4167} {"train_loss": -25.530805587768555, "global_step": 345901, "epoch": 4167} {"train_loss": -25.867624282836914, "global_step": 345902, "epoch": 4167} {"train_loss": -26.290739059448242, "global_step": 345903, "epoch": 4167} {"train_loss": -26.156620025634766, "global_step": 345904, "epoch": 4167} {"train_loss": -25.965478897094727, "global_step": 345905, "epoch": 4167} {"train_loss": -26.16456413269043, "global_step": 345906, "epoch": 4167} {"train_loss": -25.96701431274414, "global_step": 345907, "epoch": 4167} {"train_loss": -26.27351188659668, "global_step": 345908, "epoch": 4167} {"train_loss": -26.1491641998291, "global_step": 345909, "epoch": 4167} {"train_loss": -26.108749389648438, "global_step": 345910, "epoch": 4167} {"train_loss": -25.98614501953125, "global_step": 345911, "epoch": 4167} {"train_loss": -26.149866104125977, "global_step": 345912, "epoch": 4167} {"train_loss": -26.530893325805664, "global_step": 345913, "epoch": 4167} {"train_loss": -26.435338973999023, "global_step": 345914, "epoch": 4167} {"train_loss": -26.59454917907715, "global_step": 345915, "epoch": 4167} {"train_loss": -26.297870635986328, "global_step": 345916, "epoch": 4167} {"train_loss": -26.236169815063477, "global_step": 345917, "epoch": 4167} {"train_loss": -26.5085506439209, "global_step": 345918, "epoch": 4167} {"train_loss": -26.52678871154785, "global_step": 345919, "epoch": 4167} {"train_loss": -25.99444580078125, "global_step": 345920, "epoch": 4167} {"train_loss": -26.17975425720215, "global_step": 345921, "epoch": 4167} {"train_loss": -26.13685417175293, "global_step": 345922, "epoch": 4167} {"train_loss": -26.52129554748535, "global_step": 345923, "epoch": 4167} {"train_loss": -26.2320499420166, "global_step": 345924, "epoch": 4167} {"train_loss": -26.456090927124023, "global_step": 345925, "epoch": 4167} {"train_loss": -26.13848876953125, "global_step": 345926, "epoch": 4167} {"train_loss": -26.22492027282715, "global_step": 345927, "epoch": 4167} {"train_loss": -26.475454330444336, "global_step": 345928, "epoch": 4167} {"train_loss": -26.2713623046875, "global_step": 345929, "epoch": 4167} {"train_loss": -26.531265258789062, "global_step": 345930, "epoch": 4167} {"train_loss": -26.274478912353516, "global_step": 345931, "epoch": 4167} {"train_loss": -26.234088897705078, "global_step": 345932, "epoch": 4167} {"train_loss": -26.48638916015625, "global_step": 345933, "epoch": 4167} {"train_loss": -26.420995712280273, "global_step": 345934, "epoch": 4167} {"train_loss": -26.488317489624023, "global_step": 345935, "epoch": 4167} {"train_loss": -26.1428279876709, "global_step": 345936, "epoch": 4167} {"train_loss": -26.481098175048828, "global_step": 345937, "epoch": 4167} {"train_loss": -26.584314346313477, "global_step": 345938, "epoch": 4167} {"train_loss": -26.512765884399414, "global_step": 345939, "epoch": 4167} {"train_loss": -25.910322189331055, "global_step": 345940, "epoch": 4167} {"train_loss": -26.568592071533203, "global_step": 345941, "epoch": 4167} {"train_loss": -25.931638717651367, "global_step": 345942, "epoch": 4167} {"train_loss": -25.98594667825354, "global_step": 345943, "epoch": 4167, "val_loss": 6619283.0} {"train_loss": -25.731351852416992, "global_step": 345944, "epoch": 4168} {"train_loss": -25.425827026367188, "global_step": 345945, "epoch": 4168} {"train_loss": -24.865440368652344, "global_step": 345946, "epoch": 4168} {"train_loss": -24.59182357788086, "global_step": 345947, "epoch": 4168} {"train_loss": -25.217517852783203, "global_step": 345948, "epoch": 4168} {"train_loss": -25.498281478881836, "global_step": 345949, "epoch": 4168} {"train_loss": -25.562145233154297, "global_step": 345950, "epoch": 4168} {"train_loss": -25.455286026000977, "global_step": 345951, "epoch": 4168} {"train_loss": -25.703161239624023, "global_step": 345952, "epoch": 4168} {"train_loss": -25.726688385009766, "global_step": 345953, "epoch": 4168} {"train_loss": -25.85865592956543, "global_step": 345954, "epoch": 4168} {"train_loss": -25.81099510192871, "global_step": 345955, "epoch": 4168} {"train_loss": -25.531906127929688, "global_step": 345956, "epoch": 4168} {"train_loss": -26.08955192565918, "global_step": 345957, "epoch": 4168} {"train_loss": -25.627592086791992, "global_step": 345958, "epoch": 4168} {"train_loss": -25.76862144470215, "global_step": 345959, "epoch": 4168} {"train_loss": -26.17401123046875, "global_step": 345960, "epoch": 4168} {"train_loss": -25.924671173095703, "global_step": 345961, "epoch": 4168} {"train_loss": -25.99881362915039, "global_step": 345962, "epoch": 4168} {"train_loss": -25.657312393188477, "global_step": 345963, "epoch": 4168} {"train_loss": -25.781723022460938, "global_step": 345964, "epoch": 4168} {"train_loss": -25.678619384765625, "global_step": 345965, "epoch": 4168} {"train_loss": -26.085107803344727, "global_step": 345966, "epoch": 4168} {"train_loss": -26.318689346313477, "global_step": 345967, "epoch": 4168} {"train_loss": -25.5029239654541, "global_step": 345968, "epoch": 4168} {"train_loss": -25.940881729125977, "global_step": 345969, "epoch": 4168} {"train_loss": -26.16486167907715, "global_step": 345970, "epoch": 4168} {"train_loss": -26.16385269165039, "global_step": 345971, "epoch": 4168} {"train_loss": -25.85186195373535, "global_step": 345972, "epoch": 4168} {"train_loss": -25.824201583862305, "global_step": 345973, "epoch": 4168} {"train_loss": -26.1446475982666, "global_step": 345974, "epoch": 4168} {"train_loss": -26.363056182861328, "global_step": 345975, "epoch": 4168} {"train_loss": -26.2778263092041, "global_step": 345976, "epoch": 4168} {"train_loss": -26.45783805847168, "global_step": 345977, "epoch": 4168} {"train_loss": -26.517837524414062, "global_step": 345978, "epoch": 4168} {"train_loss": -26.10626220703125, "global_step": 345979, "epoch": 4168} {"train_loss": -26.476398468017578, "global_step": 345980, "epoch": 4168} {"train_loss": -25.96042251586914, "global_step": 345981, "epoch": 4168} {"train_loss": -26.34567642211914, "global_step": 345982, "epoch": 4168} {"train_loss": -26.2479248046875, "global_step": 345983, "epoch": 4168} {"train_loss": -26.322751998901367, "global_step": 345984, "epoch": 4168} {"train_loss": -26.433013916015625, "global_step": 345985, "epoch": 4168} {"train_loss": -26.26506996154785, "global_step": 345986, "epoch": 4168} {"train_loss": -26.010610580444336, "global_step": 345987, "epoch": 4168} {"train_loss": -26.389759063720703, "global_step": 345988, "epoch": 4168} {"train_loss": -26.469928741455078, "global_step": 345989, "epoch": 4168} {"train_loss": -26.229724884033203, "global_step": 345990, "epoch": 4168} {"train_loss": -26.13104248046875, "global_step": 345991, "epoch": 4168} {"train_loss": -26.219701766967773, "global_step": 345992, "epoch": 4168} {"train_loss": -26.641035079956055, "global_step": 345993, "epoch": 4168} {"train_loss": -26.145170211791992, "global_step": 345994, "epoch": 4168} {"train_loss": -26.5517520904541, "global_step": 345995, "epoch": 4168} {"train_loss": -26.21222496032715, "global_step": 345996, "epoch": 4168} {"train_loss": -26.1525936126709, "global_step": 345997, "epoch": 4168} {"train_loss": -25.980504989624023, "global_step": 345998, "epoch": 4168} {"train_loss": -26.208770751953125, "global_step": 345999, "epoch": 4168} {"train_loss": -26.21725845336914, "global_step": 346000, "epoch": 4168} {"train_loss": -26.00227165222168, "global_step": 346001, "epoch": 4168} {"train_loss": -26.147756576538086, "global_step": 346002, "epoch": 4168} {"train_loss": -26.12900733947754, "global_step": 346003, "epoch": 4168} {"train_loss": -26.276086807250977, "global_step": 346004, "epoch": 4168} {"train_loss": -25.859277725219727, "global_step": 346005, "epoch": 4168} {"train_loss": -26.369998931884766, "global_step": 346006, "epoch": 4168} {"train_loss": -26.236114501953125, "global_step": 346007, "epoch": 4168} {"train_loss": -26.313642501831055, "global_step": 346008, "epoch": 4168} {"train_loss": -26.108922958374023, "global_step": 346009, "epoch": 4168} {"train_loss": -26.1412353515625, "global_step": 346010, "epoch": 4168} {"train_loss": -26.21126365661621, "global_step": 346011, "epoch": 4168} {"train_loss": -26.132307052612305, "global_step": 346012, "epoch": 4168} {"train_loss": -26.66591453552246, "global_step": 346013, "epoch": 4168} {"train_loss": -26.511627197265625, "global_step": 346014, "epoch": 4168} {"train_loss": -26.546491622924805, "global_step": 346015, "epoch": 4168} {"train_loss": -26.4296932220459, "global_step": 346016, "epoch": 4168} {"train_loss": -26.28230857849121, "global_step": 346017, "epoch": 4168} {"train_loss": -26.2170352935791, "global_step": 346018, "epoch": 4168} {"train_loss": -25.963459014892578, "global_step": 346019, "epoch": 4168} {"train_loss": -26.414356231689453, "global_step": 346020, "epoch": 4168} {"train_loss": -26.113080978393555, "global_step": 346021, "epoch": 4168} {"train_loss": -25.718433380126953, "global_step": 346022, "epoch": 4168} {"train_loss": -26.20587730407715, "global_step": 346023, "epoch": 4168} {"train_loss": -26.445144653320312, "global_step": 346024, "epoch": 4168} {"train_loss": -26.24703025817871, "global_step": 346025, "epoch": 4168} {"train_loss": -26.04189711880971, "global_step": 346026, "epoch": 4168, "val_loss": 6616276.5} {"train_loss": -24.413190841674805, "global_step": 346027, "epoch": 4169} {"train_loss": -23.739587783813477, "global_step": 346028, "epoch": 4169} {"train_loss": -25.00991439819336, "global_step": 346029, "epoch": 4169} {"train_loss": -24.98836326599121, "global_step": 346030, "epoch": 4169} {"train_loss": -24.732603073120117, "global_step": 346031, "epoch": 4169} {"train_loss": -24.088171005249023, "global_step": 346032, "epoch": 4169} {"train_loss": -25.131010055541992, "global_step": 346033, "epoch": 4169} {"train_loss": -24.953855514526367, "global_step": 346034, "epoch": 4169} {"train_loss": -25.18910789489746, "global_step": 346035, "epoch": 4169} {"train_loss": -25.03325843811035, "global_step": 346036, "epoch": 4169} {"train_loss": -24.870121002197266, "global_step": 346037, "epoch": 4169} {"train_loss": -24.796340942382812, "global_step": 346038, "epoch": 4169} {"train_loss": -25.17899513244629, "global_step": 346039, "epoch": 4169} {"train_loss": -25.39959144592285, "global_step": 346040, "epoch": 4169} {"train_loss": -25.41959571838379, "global_step": 346041, "epoch": 4169} {"train_loss": -25.633636474609375, "global_step": 346042, "epoch": 4169} {"train_loss": -25.42720603942871, "global_step": 346043, "epoch": 4169} {"train_loss": -25.190216064453125, "global_step": 346044, "epoch": 4169} {"train_loss": -25.73252296447754, "global_step": 346045, "epoch": 4169} {"train_loss": -25.274555206298828, "global_step": 346046, "epoch": 4169} {"train_loss": -25.40801429748535, "global_step": 346047, "epoch": 4169} {"train_loss": -25.481719970703125, "global_step": 346048, "epoch": 4169} {"train_loss": -25.455549240112305, "global_step": 346049, "epoch": 4169} {"train_loss": -25.617477416992188, "global_step": 346050, "epoch": 4169} {"train_loss": -25.600576400756836, "global_step": 346051, "epoch": 4169} {"train_loss": -25.629541397094727, "global_step": 346052, "epoch": 4169} {"train_loss": -25.444076538085938, "global_step": 346053, "epoch": 4169} {"train_loss": -25.9622859954834, "global_step": 346054, "epoch": 4169} {"train_loss": -25.710494995117188, "global_step": 346055, "epoch": 4169} {"train_loss": -26.175085067749023, "global_step": 346056, "epoch": 4169} {"train_loss": -25.616479873657227, "global_step": 346057, "epoch": 4169} {"train_loss": -25.86402702331543, "global_step": 346058, "epoch": 4169} {"train_loss": -26.141162872314453, "global_step": 346059, "epoch": 4169} {"train_loss": -26.144287109375, "global_step": 346060, "epoch": 4169} {"train_loss": -25.625207901000977, "global_step": 346061, "epoch": 4169} {"train_loss": -25.903467178344727, "global_step": 346062, "epoch": 4169} {"train_loss": -26.059707641601562, "global_step": 346063, "epoch": 4169} {"train_loss": -25.657474517822266, "global_step": 346064, "epoch": 4169} {"train_loss": -26.014081954956055, "global_step": 346065, "epoch": 4169} {"train_loss": -26.214914321899414, "global_step": 346066, "epoch": 4169} {"train_loss": -26.289716720581055, "global_step": 346067, "epoch": 4169} {"train_loss": -26.05967140197754, "global_step": 346068, "epoch": 4169} {"train_loss": -25.866779327392578, "global_step": 346069, "epoch": 4169} {"train_loss": -26.13665199279785, "global_step": 346070, "epoch": 4169} {"train_loss": -26.06623649597168, "global_step": 346071, "epoch": 4169} {"train_loss": -26.103458404541016, "global_step": 346072, "epoch": 4169} {"train_loss": -26.2749080657959, "global_step": 346073, "epoch": 4169} {"train_loss": -26.207616806030273, "global_step": 346074, "epoch": 4169} {"train_loss": -25.71539306640625, "global_step": 346075, "epoch": 4169} {"train_loss": -26.131622314453125, "global_step": 346076, "epoch": 4169} {"train_loss": -26.204849243164062, "global_step": 346077, "epoch": 4169} {"train_loss": -26.378082275390625, "global_step": 346078, "epoch": 4169} {"train_loss": -26.0830020904541, "global_step": 346079, "epoch": 4169} {"train_loss": -26.183347702026367, "global_step": 346080, "epoch": 4169} {"train_loss": -26.427885055541992, "global_step": 346081, "epoch": 4169} {"train_loss": -26.366498947143555, "global_step": 346082, "epoch": 4169} {"train_loss": -26.712865829467773, "global_step": 346083, "epoch": 4169} {"train_loss": -26.484121322631836, "global_step": 346084, "epoch": 4169} {"train_loss": -26.28046989440918, "global_step": 346085, "epoch": 4169} {"train_loss": -26.48701286315918, "global_step": 346086, "epoch": 4169} {"train_loss": -26.256153106689453, "global_step": 346087, "epoch": 4169} {"train_loss": -26.264902114868164, "global_step": 346088, "epoch": 4169} {"train_loss": -26.159841537475586, "global_step": 346089, "epoch": 4169} {"train_loss": -26.359882354736328, "global_step": 346090, "epoch": 4169} {"train_loss": -25.655780792236328, "global_step": 346091, "epoch": 4169} {"train_loss": -26.36701774597168, "global_step": 346092, "epoch": 4169} {"train_loss": -26.111602783203125, "global_step": 346093, "epoch": 4169} {"train_loss": -25.946027755737305, "global_step": 346094, "epoch": 4169} {"train_loss": -26.26466941833496, "global_step": 346095, "epoch": 4169} {"train_loss": -26.024206161499023, "global_step": 346096, "epoch": 4169} {"train_loss": -25.590543746948242, "global_step": 346097, "epoch": 4169} {"train_loss": -25.513599395751953, "global_step": 346098, "epoch": 4169} {"train_loss": -26.549880981445312, "global_step": 346099, "epoch": 4169} {"train_loss": -25.89231300354004, "global_step": 346100, "epoch": 4169} {"train_loss": -25.02497100830078, "global_step": 346101, "epoch": 4169} {"train_loss": -25.821216583251953, "global_step": 346102, "epoch": 4169} {"train_loss": -25.33259391784668, "global_step": 346103, "epoch": 4169} {"train_loss": -25.347034454345703, "global_step": 346104, "epoch": 4169} {"train_loss": -26.074878692626953, "global_step": 346105, "epoch": 4169} {"train_loss": -25.730886459350586, "global_step": 346106, "epoch": 4169} {"train_loss": -25.858118057250977, "global_step": 346107, "epoch": 4169} {"train_loss": -25.803577423095703, "global_step": 346108, "epoch": 4169} {"train_loss": -25.73076252764966, "global_step": 346109, "epoch": 4169, "val_loss": 6647471.0} {"train_loss": -24.241384506225586, "global_step": 346110, "epoch": 4170} {"train_loss": -24.366260528564453, "global_step": 346111, "epoch": 4170} {"train_loss": -25.937271118164062, "global_step": 346112, "epoch": 4170} {"train_loss": -24.956817626953125, "global_step": 346113, "epoch": 4170} {"train_loss": -25.02467918395996, "global_step": 346114, "epoch": 4170} {"train_loss": -25.641576766967773, "global_step": 346115, "epoch": 4170} {"train_loss": -24.994417190551758, "global_step": 346116, "epoch": 4170} {"train_loss": -25.931018829345703, "global_step": 346117, "epoch": 4170} {"train_loss": -25.098526000976562, "global_step": 346118, "epoch": 4170} {"train_loss": -25.50986671447754, "global_step": 346119, "epoch": 4170} {"train_loss": -25.564899444580078, "global_step": 346120, "epoch": 4170} {"train_loss": -25.650121688842773, "global_step": 346121, "epoch": 4170} {"train_loss": -25.604711532592773, "global_step": 346122, "epoch": 4170} {"train_loss": -25.73627281188965, "global_step": 346123, "epoch": 4170} {"train_loss": -25.7113037109375, "global_step": 346124, "epoch": 4170} {"train_loss": -26.101520538330078, "global_step": 346125, "epoch": 4170} {"train_loss": -25.65302848815918, "global_step": 346126, "epoch": 4170} {"train_loss": -26.294208526611328, "global_step": 346127, "epoch": 4170} {"train_loss": -25.763397216796875, "global_step": 346128, "epoch": 4170} {"train_loss": -25.801136016845703, "global_step": 346129, "epoch": 4170} {"train_loss": -25.864831924438477, "global_step": 346130, "epoch": 4170} {"train_loss": -25.800870895385742, "global_step": 346131, "epoch": 4170} {"train_loss": -26.02752113342285, "global_step": 346132, "epoch": 4170} {"train_loss": -25.908859252929688, "global_step": 346133, "epoch": 4170} {"train_loss": -25.90192985534668, "global_step": 346134, "epoch": 4170} {"train_loss": -26.227323532104492, "global_step": 346135, "epoch": 4170} {"train_loss": -26.12653160095215, "global_step": 346136, "epoch": 4170} {"train_loss": -26.007125854492188, "global_step": 346137, "epoch": 4170} {"train_loss": -25.745153427124023, "global_step": 346138, "epoch": 4170} {"train_loss": -25.609277725219727, "global_step": 346139, "epoch": 4170} {"train_loss": -26.269454956054688, "global_step": 346140, "epoch": 4170} {"train_loss": -25.928958892822266, "global_step": 346141, "epoch": 4170} {"train_loss": -25.997522354125977, "global_step": 346142, "epoch": 4170} {"train_loss": -26.230512619018555, "global_step": 346143, "epoch": 4170} {"train_loss": -26.384305953979492, "global_step": 346144, "epoch": 4170} {"train_loss": -25.874988555908203, "global_step": 346145, "epoch": 4170} {"train_loss": -26.1841983795166, "global_step": 346146, "epoch": 4170} {"train_loss": -26.18251609802246, "global_step": 346147, "epoch": 4170} {"train_loss": -26.058988571166992, "global_step": 346148, "epoch": 4170} {"train_loss": -26.443899154663086, "global_step": 346149, "epoch": 4170} {"train_loss": -25.996906280517578, "global_step": 346150, "epoch": 4170} {"train_loss": -26.303760528564453, "global_step": 346151, "epoch": 4170} {"train_loss": -26.394269943237305, "global_step": 346152, "epoch": 4170} {"train_loss": -26.38458824157715, "global_step": 346153, "epoch": 4170} {"train_loss": -26.339242935180664, "global_step": 346154, "epoch": 4170} {"train_loss": -26.320459365844727, "global_step": 346155, "epoch": 4170} {"train_loss": -26.19137954711914, "global_step": 346156, "epoch": 4170} {"train_loss": -26.302932739257812, "global_step": 346157, "epoch": 4170} {"train_loss": -26.470239639282227, "global_step": 346158, "epoch": 4170} {"train_loss": -26.262643814086914, "global_step": 346159, "epoch": 4170} {"train_loss": -26.1363525390625, "global_step": 346160, "epoch": 4170} {"train_loss": -25.821002960205078, "global_step": 346161, "epoch": 4170} {"train_loss": -26.0334415435791, "global_step": 346162, "epoch": 4170} {"train_loss": -26.191320419311523, "global_step": 346163, "epoch": 4170} {"train_loss": -26.266469955444336, "global_step": 346164, "epoch": 4170} {"train_loss": -25.90589714050293, "global_step": 346165, "epoch": 4170} {"train_loss": -26.177600860595703, "global_step": 346166, "epoch": 4170} {"train_loss": -26.54597282409668, "global_step": 346167, "epoch": 4170} {"train_loss": -25.818998336791992, "global_step": 346168, "epoch": 4170} {"train_loss": -26.423095703125, "global_step": 346169, "epoch": 4170} {"train_loss": -26.168655395507812, "global_step": 346170, "epoch": 4170} {"train_loss": -26.31861686706543, "global_step": 346171, "epoch": 4170} {"train_loss": -26.07177734375, "global_step": 346172, "epoch": 4170} {"train_loss": -26.524457931518555, "global_step": 346173, "epoch": 4170} {"train_loss": -26.421905517578125, "global_step": 346174, "epoch": 4170} {"train_loss": -26.230859756469727, "global_step": 346175, "epoch": 4170} {"train_loss": -26.442214965820312, "global_step": 346176, "epoch": 4170} {"train_loss": -26.414264678955078, "global_step": 346177, "epoch": 4170} {"train_loss": -26.20716667175293, "global_step": 346178, "epoch": 4170} {"train_loss": -26.325260162353516, "global_step": 346179, "epoch": 4170} {"train_loss": -26.31207847595215, "global_step": 346180, "epoch": 4170} {"train_loss": -26.513916015625, "global_step": 346181, "epoch": 4170} {"train_loss": -26.307607650756836, "global_step": 346182, "epoch": 4170} {"train_loss": -26.162694931030273, "global_step": 346183, "epoch": 4170} {"train_loss": -26.24619483947754, "global_step": 346184, "epoch": 4170} {"train_loss": -26.155689239501953, "global_step": 346185, "epoch": 4170} {"train_loss": -26.12735939025879, "global_step": 346186, "epoch": 4170} {"train_loss": -26.0425968170166, "global_step": 346187, "epoch": 4170} {"train_loss": -26.263381958007812, "global_step": 346188, "epoch": 4170} {"train_loss": -26.375268936157227, "global_step": 346189, "epoch": 4170} {"train_loss": -26.310766220092773, "global_step": 346190, "epoch": 4170} {"train_loss": -26.182321548461914, "global_step": 346191, "epoch": 4170} {"train_loss": -26.012982770621058, "global_step": 346192, "epoch": 4170, "val_loss": 6562852.0} {"train_loss": -25.8040828704834, "global_step": 346193, "epoch": 4171} {"train_loss": -25.086376190185547, "global_step": 346194, "epoch": 4171} {"train_loss": -26.09389305114746, "global_step": 346195, "epoch": 4171} {"train_loss": -25.724706649780273, "global_step": 346196, "epoch": 4171} {"train_loss": -25.18253517150879, "global_step": 346197, "epoch": 4171} {"train_loss": -24.800731658935547, "global_step": 346198, "epoch": 4171} {"train_loss": -25.88201332092285, "global_step": 346199, "epoch": 4171} {"train_loss": -25.92707633972168, "global_step": 346200, "epoch": 4171} {"train_loss": -25.8525333404541, "global_step": 346201, "epoch": 4171} {"train_loss": -25.75079917907715, "global_step": 346202, "epoch": 4171} {"train_loss": -25.9224796295166, "global_step": 346203, "epoch": 4171} {"train_loss": -25.7071590423584, "global_step": 346204, "epoch": 4171} {"train_loss": -25.884536743164062, "global_step": 346205, "epoch": 4171} {"train_loss": -25.978330612182617, "global_step": 346206, "epoch": 4171} {"train_loss": -26.028736114501953, "global_step": 346207, "epoch": 4171} {"train_loss": -26.231128692626953, "global_step": 346208, "epoch": 4171} {"train_loss": -26.148725509643555, "global_step": 346209, "epoch": 4171} {"train_loss": -26.1597843170166, "global_step": 346210, "epoch": 4171} {"train_loss": -26.37238121032715, "global_step": 346211, "epoch": 4171} {"train_loss": -25.593839645385742, "global_step": 346212, "epoch": 4171} {"train_loss": -26.05610466003418, "global_step": 346213, "epoch": 4171} {"train_loss": -26.038288116455078, "global_step": 346214, "epoch": 4171} {"train_loss": -26.195749282836914, "global_step": 346215, "epoch": 4171} {"train_loss": -25.924650192260742, "global_step": 346216, "epoch": 4171} {"train_loss": -26.196462631225586, "global_step": 346217, "epoch": 4171} {"train_loss": -26.037458419799805, "global_step": 346218, "epoch": 4171} {"train_loss": -25.974451065063477, "global_step": 346219, "epoch": 4171} {"train_loss": -26.16181755065918, "global_step": 346220, "epoch": 4171} {"train_loss": -26.310688018798828, "global_step": 346221, "epoch": 4171} {"train_loss": -26.117944717407227, "global_step": 346222, "epoch": 4171} {"train_loss": -26.03501319885254, "global_step": 346223, "epoch": 4171} {"train_loss": -26.268346786499023, "global_step": 346224, "epoch": 4171} {"train_loss": -26.051435470581055, "global_step": 346225, "epoch": 4171} {"train_loss": -25.986255645751953, "global_step": 346226, "epoch": 4171} {"train_loss": -26.163049697875977, "global_step": 346227, "epoch": 4171} {"train_loss": -26.20318031311035, "global_step": 346228, "epoch": 4171} {"train_loss": -26.39106559753418, "global_step": 346229, "epoch": 4171} {"train_loss": -26.457305908203125, "global_step": 346230, "epoch": 4171} {"train_loss": -26.36171531677246, "global_step": 346231, "epoch": 4171} {"train_loss": -26.1175479888916, "global_step": 346232, "epoch": 4171} {"train_loss": -26.203109741210938, "global_step": 346233, "epoch": 4171} {"train_loss": -26.3386287689209, "global_step": 346234, "epoch": 4171} {"train_loss": -26.345367431640625, "global_step": 346235, "epoch": 4171} {"train_loss": -26.15884780883789, "global_step": 346236, "epoch": 4171} {"train_loss": -26.02814292907715, "global_step": 346237, "epoch": 4171} {"train_loss": -26.246591567993164, "global_step": 346238, "epoch": 4171} {"train_loss": -26.32710075378418, "global_step": 346239, "epoch": 4171} {"train_loss": -26.411224365234375, "global_step": 346240, "epoch": 4171} {"train_loss": -26.049930572509766, "global_step": 346241, "epoch": 4171} {"train_loss": -26.323322296142578, "global_step": 346242, "epoch": 4171} {"train_loss": -25.92963218688965, "global_step": 346243, "epoch": 4171} {"train_loss": -26.28704833984375, "global_step": 346244, "epoch": 4171} {"train_loss": -26.21768569946289, "global_step": 346245, "epoch": 4171} {"train_loss": -26.26316261291504, "global_step": 346246, "epoch": 4171} {"train_loss": -25.850263595581055, "global_step": 346247, "epoch": 4171} {"train_loss": -25.934789657592773, "global_step": 346248, "epoch": 4171} {"train_loss": -25.875452041625977, "global_step": 346249, "epoch": 4171} {"train_loss": -26.14216423034668, "global_step": 346250, "epoch": 4171} {"train_loss": -25.997167587280273, "global_step": 346251, "epoch": 4171} {"train_loss": -26.046960830688477, "global_step": 346252, "epoch": 4171} {"train_loss": -26.112035751342773, "global_step": 346253, "epoch": 4171} {"train_loss": -26.282087326049805, "global_step": 346254, "epoch": 4171} {"train_loss": -26.587072372436523, "global_step": 346255, "epoch": 4171} {"train_loss": -26.44764518737793, "global_step": 346256, "epoch": 4171} {"train_loss": -26.198139190673828, "global_step": 346257, "epoch": 4171} {"train_loss": -26.428516387939453, "global_step": 346258, "epoch": 4171} {"train_loss": -26.353330612182617, "global_step": 346259, "epoch": 4171} {"train_loss": -26.08977699279785, "global_step": 346260, "epoch": 4171} {"train_loss": -25.700876235961914, "global_step": 346261, "epoch": 4171} {"train_loss": -25.000690460205078, "global_step": 346262, "epoch": 4171} {"train_loss": -25.0627384185791, "global_step": 346263, "epoch": 4171} {"train_loss": -25.104833602905273, "global_step": 346264, "epoch": 4171} {"train_loss": -25.583242416381836, "global_step": 346265, "epoch": 4171} {"train_loss": -25.904083251953125, "global_step": 346266, "epoch": 4171} {"train_loss": -25.898456573486328, "global_step": 346267, "epoch": 4171} {"train_loss": -25.6541805267334, "global_step": 346268, "epoch": 4171} {"train_loss": -25.890674591064453, "global_step": 346269, "epoch": 4171} {"train_loss": -25.54963493347168, "global_step": 346270, "epoch": 4171} {"train_loss": -25.920618057250977, "global_step": 346271, "epoch": 4171} {"train_loss": -25.989797592163086, "global_step": 346272, "epoch": 4171} {"train_loss": -25.8774356842041, "global_step": 346273, "epoch": 4171} {"train_loss": -25.646020889282227, "global_step": 346274, "epoch": 4171} {"train_loss": -26.020879837403815, "global_step": 346275, "epoch": 4171, "val_loss": 6608540.0} {"train_loss": -25.234506607055664, "global_step": 346276, "epoch": 4172} {"train_loss": -25.611438751220703, "global_step": 346277, "epoch": 4172} {"train_loss": -25.499155044555664, "global_step": 346278, "epoch": 4172} {"train_loss": -25.686498641967773, "global_step": 346279, "epoch": 4172} {"train_loss": -25.09552001953125, "global_step": 346280, "epoch": 4172} {"train_loss": -25.262983322143555, "global_step": 346281, "epoch": 4172} {"train_loss": -25.804107666015625, "global_step": 346282, "epoch": 4172} {"train_loss": -25.557788848876953, "global_step": 346283, "epoch": 4172} {"train_loss": -25.375490188598633, "global_step": 346284, "epoch": 4172} {"train_loss": -25.749059677124023, "global_step": 346285, "epoch": 4172} {"train_loss": -25.876113891601562, "global_step": 346286, "epoch": 4172} {"train_loss": -25.683454513549805, "global_step": 346287, "epoch": 4172} {"train_loss": -26.035364151000977, "global_step": 346288, "epoch": 4172} {"train_loss": -25.723876953125, "global_step": 346289, "epoch": 4172} {"train_loss": -25.867456436157227, "global_step": 346290, "epoch": 4172} {"train_loss": -25.728673934936523, "global_step": 346291, "epoch": 4172} {"train_loss": -26.079694747924805, "global_step": 346292, "epoch": 4172} {"train_loss": -25.877731323242188, "global_step": 346293, "epoch": 4172} {"train_loss": -25.641265869140625, "global_step": 346294, "epoch": 4172} {"train_loss": -25.901769638061523, "global_step": 346295, "epoch": 4172} {"train_loss": -25.96172523498535, "global_step": 346296, "epoch": 4172} {"train_loss": -26.08942222595215, "global_step": 346297, "epoch": 4172} {"train_loss": -26.054269790649414, "global_step": 346298, "epoch": 4172} {"train_loss": -26.178510665893555, "global_step": 346299, "epoch": 4172} {"train_loss": -26.16513442993164, "global_step": 346300, "epoch": 4172} {"train_loss": -25.790973663330078, "global_step": 346301, "epoch": 4172} {"train_loss": -26.014362335205078, "global_step": 346302, "epoch": 4172} {"train_loss": -26.58893394470215, "global_step": 346303, "epoch": 4172} {"train_loss": -26.178293228149414, "global_step": 346304, "epoch": 4172} {"train_loss": -26.51922607421875, "global_step": 346305, "epoch": 4172} {"train_loss": -26.41756248474121, "global_step": 346306, "epoch": 4172} {"train_loss": -26.35148048400879, "global_step": 346307, "epoch": 4172} {"train_loss": -25.78644371032715, "global_step": 346308, "epoch": 4172} {"train_loss": -26.0284366607666, "global_step": 346309, "epoch": 4172} {"train_loss": -26.255456924438477, "global_step": 346310, "epoch": 4172} {"train_loss": -26.14643669128418, "global_step": 346311, "epoch": 4172} {"train_loss": -26.456750869750977, "global_step": 346312, "epoch": 4172} {"train_loss": -26.092992782592773, "global_step": 346313, "epoch": 4172} {"train_loss": -26.2181396484375, "global_step": 346314, "epoch": 4172} {"train_loss": -26.26201820373535, "global_step": 346315, "epoch": 4172} {"train_loss": -26.249082565307617, "global_step": 346316, "epoch": 4172} {"train_loss": -26.163909912109375, "global_step": 346317, "epoch": 4172} {"train_loss": -26.36223793029785, "global_step": 346318, "epoch": 4172} {"train_loss": -26.299823760986328, "global_step": 346319, "epoch": 4172} {"train_loss": -26.436960220336914, "global_step": 346320, "epoch": 4172} {"train_loss": -26.404306411743164, "global_step": 346321, "epoch": 4172} {"train_loss": -26.44917869567871, "global_step": 346322, "epoch": 4172} {"train_loss": -26.20148277282715, "global_step": 346323, "epoch": 4172} {"train_loss": -26.146442413330078, "global_step": 346324, "epoch": 4172} {"train_loss": -26.614334106445312, "global_step": 346325, "epoch": 4172} {"train_loss": -26.479080200195312, "global_step": 346326, "epoch": 4172} {"train_loss": -26.14592933654785, "global_step": 346327, "epoch": 4172} {"train_loss": -26.620941162109375, "global_step": 346328, "epoch": 4172} {"train_loss": -26.370107650756836, "global_step": 346329, "epoch": 4172} {"train_loss": -26.32623291015625, "global_step": 346330, "epoch": 4172} {"train_loss": -26.74970817565918, "global_step": 346331, "epoch": 4172} {"train_loss": -26.160253524780273, "global_step": 346332, "epoch": 4172} {"train_loss": -25.925390243530273, "global_step": 346333, "epoch": 4172} {"train_loss": -25.894323348999023, "global_step": 346334, "epoch": 4172} {"train_loss": -26.199289321899414, "global_step": 346335, "epoch": 4172} {"train_loss": -26.341922760009766, "global_step": 346336, "epoch": 4172} {"train_loss": -26.49948501586914, "global_step": 346337, "epoch": 4172} {"train_loss": -26.355833053588867, "global_step": 346338, "epoch": 4172} {"train_loss": -26.534637451171875, "global_step": 346339, "epoch": 4172} {"train_loss": -26.322729110717773, "global_step": 346340, "epoch": 4172} {"train_loss": -26.5202693939209, "global_step": 346341, "epoch": 4172} {"train_loss": -26.051776885986328, "global_step": 346342, "epoch": 4172} {"train_loss": -26.319538116455078, "global_step": 346343, "epoch": 4172} {"train_loss": -26.25496482849121, "global_step": 346344, "epoch": 4172} {"train_loss": -26.0604305267334, "global_step": 346345, "epoch": 4172} {"train_loss": -26.1097469329834, "global_step": 346346, "epoch": 4172} {"train_loss": -26.164411544799805, "global_step": 346347, "epoch": 4172} {"train_loss": -26.3270206451416, "global_step": 346348, "epoch": 4172} {"train_loss": -26.013696670532227, "global_step": 346349, "epoch": 4172} {"train_loss": -25.92914390563965, "global_step": 346350, "epoch": 4172} {"train_loss": -26.459394454956055, "global_step": 346351, "epoch": 4172} {"train_loss": -26.129636764526367, "global_step": 346352, "epoch": 4172} {"train_loss": -26.379846572875977, "global_step": 346353, "epoch": 4172} {"train_loss": -25.74069595336914, "global_step": 346354, "epoch": 4172} {"train_loss": -26.110315322875977, "global_step": 346355, "epoch": 4172} {"train_loss": -26.174650192260742, "global_step": 346356, "epoch": 4172} {"train_loss": -26.29835319519043, "global_step": 346357, "epoch": 4172} {"train_loss": -26.096734747829206, "global_step": 346358, "epoch": 4172, "val_loss": 6539556.5} {"train_loss": -25.543546676635742, "global_step": 346359, "epoch": 4173} {"train_loss": -25.797460556030273, "global_step": 346360, "epoch": 4173} {"train_loss": -25.79781150817871, "global_step": 346361, "epoch": 4173} {"train_loss": -26.175764083862305, "global_step": 346362, "epoch": 4173} {"train_loss": -25.540159225463867, "global_step": 346363, "epoch": 4173} {"train_loss": -26.079259872436523, "global_step": 346364, "epoch": 4173} {"train_loss": -25.978132247924805, "global_step": 346365, "epoch": 4173} {"train_loss": -25.85723876953125, "global_step": 346366, "epoch": 4173} {"train_loss": -26.1141357421875, "global_step": 346367, "epoch": 4173} {"train_loss": -25.98542594909668, "global_step": 346368, "epoch": 4173} {"train_loss": -25.974546432495117, "global_step": 346369, "epoch": 4173} {"train_loss": -25.96787452697754, "global_step": 346370, "epoch": 4173} {"train_loss": -25.88185691833496, "global_step": 346371, "epoch": 4173} {"train_loss": -25.868207931518555, "global_step": 346372, "epoch": 4173} {"train_loss": -25.890050888061523, "global_step": 346373, "epoch": 4173} {"train_loss": -25.985675811767578, "global_step": 346374, "epoch": 4173} {"train_loss": -26.12824058532715, "global_step": 346375, "epoch": 4173} {"train_loss": -25.8961238861084, "global_step": 346376, "epoch": 4173} {"train_loss": -26.185211181640625, "global_step": 346377, "epoch": 4173} {"train_loss": -26.005359649658203, "global_step": 346378, "epoch": 4173} {"train_loss": -25.703428268432617, "global_step": 346379, "epoch": 4173} {"train_loss": -25.908523559570312, "global_step": 346380, "epoch": 4173} {"train_loss": -26.1073055267334, "global_step": 346381, "epoch": 4173} {"train_loss": -26.068342208862305, "global_step": 346382, "epoch": 4173} {"train_loss": -26.196409225463867, "global_step": 346383, "epoch": 4173} {"train_loss": -26.358570098876953, "global_step": 346384, "epoch": 4173} {"train_loss": -26.372949600219727, "global_step": 346385, "epoch": 4173} {"train_loss": -26.466054916381836, "global_step": 346386, "epoch": 4173} {"train_loss": -26.05666160583496, "global_step": 346387, "epoch": 4173} {"train_loss": -26.235639572143555, "global_step": 346388, "epoch": 4173} {"train_loss": -26.54937171936035, "global_step": 346389, "epoch": 4173} {"train_loss": -25.92995262145996, "global_step": 346390, "epoch": 4173} {"train_loss": -26.148624420166016, "global_step": 346391, "epoch": 4173} {"train_loss": -26.537076950073242, "global_step": 346392, "epoch": 4173} {"train_loss": -26.473834991455078, "global_step": 346393, "epoch": 4173} {"train_loss": -26.6433048248291, "global_step": 346394, "epoch": 4173} {"train_loss": -26.17616081237793, "global_step": 346395, "epoch": 4173} {"train_loss": -26.470335006713867, "global_step": 346396, "epoch": 4173} {"train_loss": -26.453516006469727, "global_step": 346397, "epoch": 4173} {"train_loss": -26.402389526367188, "global_step": 346398, "epoch": 4173} {"train_loss": -26.3686580657959, "global_step": 346399, "epoch": 4173} {"train_loss": -26.397705078125, "global_step": 346400, "epoch": 4173} {"train_loss": -26.401050567626953, "global_step": 346401, "epoch": 4173} {"train_loss": -26.335987091064453, "global_step": 346402, "epoch": 4173} {"train_loss": -26.363080978393555, "global_step": 346403, "epoch": 4173} {"train_loss": -26.484827041625977, "global_step": 346404, "epoch": 4173} {"train_loss": -26.34067726135254, "global_step": 346405, "epoch": 4173} {"train_loss": -26.23243522644043, "global_step": 346406, "epoch": 4173} {"train_loss": -26.15690040588379, "global_step": 346407, "epoch": 4173} {"train_loss": -26.20487403869629, "global_step": 346408, "epoch": 4173} {"train_loss": -26.11612319946289, "global_step": 346409, "epoch": 4173} {"train_loss": -26.164794921875, "global_step": 346410, "epoch": 4173} {"train_loss": -26.002307891845703, "global_step": 346411, "epoch": 4173} {"train_loss": -26.122156143188477, "global_step": 346412, "epoch": 4173} {"train_loss": -25.88252067565918, "global_step": 346413, "epoch": 4173} {"train_loss": -25.966083526611328, "global_step": 346414, "epoch": 4173} {"train_loss": -26.0181884765625, "global_step": 346415, "epoch": 4173} {"train_loss": -25.897247314453125, "global_step": 346416, "epoch": 4173} {"train_loss": -26.324148178100586, "global_step": 346417, "epoch": 4173} {"train_loss": -26.28240966796875, "global_step": 346418, "epoch": 4173} {"train_loss": -25.84402847290039, "global_step": 346419, "epoch": 4173} {"train_loss": -26.56757926940918, "global_step": 346420, "epoch": 4173} {"train_loss": -26.261795043945312, "global_step": 346421, "epoch": 4173} {"train_loss": -26.134796142578125, "global_step": 346422, "epoch": 4173} {"train_loss": -25.1852970123291, "global_step": 346423, "epoch": 4173} {"train_loss": -25.55933380126953, "global_step": 346424, "epoch": 4173} {"train_loss": -25.51555061340332, "global_step": 346425, "epoch": 4173} {"train_loss": -26.097583770751953, "global_step": 346426, "epoch": 4173} {"train_loss": -25.589313507080078, "global_step": 346427, "epoch": 4173} {"train_loss": -25.642765045166016, "global_step": 346428, "epoch": 4173} {"train_loss": -25.932392120361328, "global_step": 346429, "epoch": 4173} {"train_loss": -26.028345108032227, "global_step": 346430, "epoch": 4173} {"train_loss": -25.944385528564453, "global_step": 346431, "epoch": 4173} {"train_loss": -26.1391658782959, "global_step": 346432, "epoch": 4173} {"train_loss": -25.612314224243164, "global_step": 346433, "epoch": 4173} {"train_loss": -26.11880874633789, "global_step": 346434, "epoch": 4173} {"train_loss": -25.817941665649414, "global_step": 346435, "epoch": 4173} {"train_loss": -25.952301025390625, "global_step": 346436, "epoch": 4173} {"train_loss": -26.184009552001953, "global_step": 346437, "epoch": 4173} {"train_loss": -26.0992488861084, "global_step": 346438, "epoch": 4173} {"train_loss": -26.23139762878418, "global_step": 346439, "epoch": 4173} {"train_loss": -26.2383975982666, "global_step": 346440, "epoch": 4173} {"train_loss": -26.114082750067652, "global_step": 346441, "epoch": 4173, "val_loss": 6545984.5} {"train_loss": -24.1315975189209, "global_step": 346442, "epoch": 4174} {"train_loss": -24.3001766204834, "global_step": 346443, "epoch": 4174} {"train_loss": -24.003110885620117, "global_step": 346444, "epoch": 4174} {"train_loss": -25.565603256225586, "global_step": 346445, "epoch": 4174} {"train_loss": -23.927541732788086, "global_step": 346446, "epoch": 4174} {"train_loss": -25.80446434020996, "global_step": 346447, "epoch": 4174} {"train_loss": -24.701454162597656, "global_step": 346448, "epoch": 4174} {"train_loss": -25.556264877319336, "global_step": 346449, "epoch": 4174} {"train_loss": -25.15789794921875, "global_step": 346450, "epoch": 4174} {"train_loss": -25.516021728515625, "global_step": 346451, "epoch": 4174} {"train_loss": -25.604772567749023, "global_step": 346452, "epoch": 4174} {"train_loss": -25.393346786499023, "global_step": 346453, "epoch": 4174} {"train_loss": -25.53829002380371, "global_step": 346454, "epoch": 4174} {"train_loss": -25.53872299194336, "global_step": 346455, "epoch": 4174} {"train_loss": -25.582420349121094, "global_step": 346456, "epoch": 4174} {"train_loss": -25.345523834228516, "global_step": 346457, "epoch": 4174} {"train_loss": -25.886062622070312, "global_step": 346458, "epoch": 4174} {"train_loss": -25.736364364624023, "global_step": 346459, "epoch": 4174} {"train_loss": -25.481555938720703, "global_step": 346460, "epoch": 4174} {"train_loss": -25.774429321289062, "global_step": 346461, "epoch": 4174} {"train_loss": -25.9226131439209, "global_step": 346462, "epoch": 4174} {"train_loss": -25.744726181030273, "global_step": 346463, "epoch": 4174} {"train_loss": -25.934722900390625, "global_step": 346464, "epoch": 4174} {"train_loss": -25.712751388549805, "global_step": 346465, "epoch": 4174} {"train_loss": -25.671878814697266, "global_step": 346466, "epoch": 4174} {"train_loss": -26.068607330322266, "global_step": 346467, "epoch": 4174} {"train_loss": -25.874536514282227, "global_step": 346468, "epoch": 4174} {"train_loss": -25.911291122436523, "global_step": 346469, "epoch": 4174} {"train_loss": -25.554523468017578, "global_step": 346470, "epoch": 4174} {"train_loss": -26.000293731689453, "global_step": 346471, "epoch": 4174} {"train_loss": -26.209747314453125, "global_step": 346472, "epoch": 4174} {"train_loss": -26.015539169311523, "global_step": 346473, "epoch": 4174} {"train_loss": -25.880863189697266, "global_step": 346474, "epoch": 4174} {"train_loss": -26.0025634765625, "global_step": 346475, "epoch": 4174} {"train_loss": -26.005054473876953, "global_step": 346476, "epoch": 4174} {"train_loss": -25.831501007080078, "global_step": 346477, "epoch": 4174} {"train_loss": -26.28369140625, "global_step": 346478, "epoch": 4174} {"train_loss": -26.109792709350586, "global_step": 346479, "epoch": 4174} {"train_loss": -26.095678329467773, "global_step": 346480, "epoch": 4174} {"train_loss": -26.30364990234375, "global_step": 346481, "epoch": 4174} {"train_loss": -26.005054473876953, "global_step": 346482, "epoch": 4174} {"train_loss": -26.307226181030273, "global_step": 346483, "epoch": 4174} {"train_loss": -26.621618270874023, "global_step": 346484, "epoch": 4174} {"train_loss": -26.36287498474121, "global_step": 346485, "epoch": 4174} {"train_loss": -26.053333282470703, "global_step": 346486, "epoch": 4174} {"train_loss": -26.10089111328125, "global_step": 346487, "epoch": 4174} {"train_loss": -26.21006202697754, "global_step": 346488, "epoch": 4174} {"train_loss": -26.267126083374023, "global_step": 346489, "epoch": 4174} {"train_loss": -26.270166397094727, "global_step": 346490, "epoch": 4174} {"train_loss": -26.330734252929688, "global_step": 346491, "epoch": 4174} {"train_loss": -25.893354415893555, "global_step": 346492, "epoch": 4174} {"train_loss": -26.25904655456543, "global_step": 346493, "epoch": 4174} {"train_loss": -26.332061767578125, "global_step": 346494, "epoch": 4174} {"train_loss": -26.519458770751953, "global_step": 346495, "epoch": 4174} {"train_loss": -25.91400718688965, "global_step": 346496, "epoch": 4174} {"train_loss": -26.06782341003418, "global_step": 346497, "epoch": 4174} {"train_loss": -26.10749626159668, "global_step": 346498, "epoch": 4174} {"train_loss": -26.1217041015625, "global_step": 346499, "epoch": 4174} {"train_loss": -26.418411254882812, "global_step": 346500, "epoch": 4174} {"train_loss": -26.45074462890625, "global_step": 346501, "epoch": 4174} {"train_loss": -26.57484245300293, "global_step": 346502, "epoch": 4174} {"train_loss": -26.158111572265625, "global_step": 346503, "epoch": 4174} {"train_loss": -26.074289321899414, "global_step": 346504, "epoch": 4174} {"train_loss": -25.99091911315918, "global_step": 346505, "epoch": 4174} {"train_loss": -26.428003311157227, "global_step": 346506, "epoch": 4174} {"train_loss": -26.33430290222168, "global_step": 346507, "epoch": 4174} {"train_loss": -25.75634765625, "global_step": 346508, "epoch": 4174} {"train_loss": -26.166532516479492, "global_step": 346509, "epoch": 4174} {"train_loss": -25.837942123413086, "global_step": 346510, "epoch": 4174} {"train_loss": -26.146697998046875, "global_step": 346511, "epoch": 4174} {"train_loss": -26.18418312072754, "global_step": 346512, "epoch": 4174} {"train_loss": -25.746057510375977, "global_step": 346513, "epoch": 4174} {"train_loss": -26.702655792236328, "global_step": 346514, "epoch": 4174} {"train_loss": -26.10125160217285, "global_step": 346515, "epoch": 4174} {"train_loss": -26.376861572265625, "global_step": 346516, "epoch": 4174} {"train_loss": -26.30622673034668, "global_step": 346517, "epoch": 4174} {"train_loss": -26.162002563476562, "global_step": 346518, "epoch": 4174} {"train_loss": -26.293914794921875, "global_step": 346519, "epoch": 4174} {"train_loss": -26.125295639038086, "global_step": 346520, "epoch": 4174} {"train_loss": -26.220035552978516, "global_step": 346521, "epoch": 4174} {"train_loss": -26.325056076049805, "global_step": 346522, "epoch": 4174} {"train_loss": -26.44161033630371, "global_step": 346523, "epoch": 4174} {"train_loss": -25.916881791080336, "global_step": 346524, "epoch": 4174, "val_loss": 6577728.5} {"train_loss": -25.462926864624023, "global_step": 346525, "epoch": 4175} {"train_loss": -25.338254928588867, "global_step": 346526, "epoch": 4175} {"train_loss": -24.781709671020508, "global_step": 346527, "epoch": 4175} {"train_loss": -25.106918334960938, "global_step": 346528, "epoch": 4175} {"train_loss": -25.437692642211914, "global_step": 346529, "epoch": 4175} {"train_loss": -25.47348403930664, "global_step": 346530, "epoch": 4175} {"train_loss": -25.840789794921875, "global_step": 346531, "epoch": 4175} {"train_loss": -25.763874053955078, "global_step": 346532, "epoch": 4175} {"train_loss": -25.243839263916016, "global_step": 346533, "epoch": 4175} {"train_loss": -25.857282638549805, "global_step": 346534, "epoch": 4175} {"train_loss": -25.901081085205078, "global_step": 346535, "epoch": 4175} {"train_loss": -25.751361846923828, "global_step": 346536, "epoch": 4175} {"train_loss": -25.810394287109375, "global_step": 346537, "epoch": 4175} {"train_loss": -25.74384117126465, "global_step": 346538, "epoch": 4175} {"train_loss": -25.989974975585938, "global_step": 346539, "epoch": 4175} {"train_loss": -25.8803653717041, "global_step": 346540, "epoch": 4175} {"train_loss": -25.99018669128418, "global_step": 346541, "epoch": 4175} {"train_loss": -26.477619171142578, "global_step": 346542, "epoch": 4175} {"train_loss": -25.952306747436523, "global_step": 346543, "epoch": 4175} {"train_loss": -25.770889282226562, "global_step": 346544, "epoch": 4175} {"train_loss": -25.854955673217773, "global_step": 346545, "epoch": 4175} {"train_loss": -25.6237735748291, "global_step": 346546, "epoch": 4175} {"train_loss": -25.6581974029541, "global_step": 346547, "epoch": 4175} {"train_loss": -26.358753204345703, "global_step": 346548, "epoch": 4175} {"train_loss": -25.807270050048828, "global_step": 346549, "epoch": 4175} {"train_loss": -25.957056045532227, "global_step": 346550, "epoch": 4175} {"train_loss": -25.70171546936035, "global_step": 346551, "epoch": 4175} {"train_loss": -25.8875732421875, "global_step": 346552, "epoch": 4175} {"train_loss": -25.979394912719727, "global_step": 346553, "epoch": 4175} {"train_loss": -25.797155380249023, "global_step": 346554, "epoch": 4175} {"train_loss": -25.90631675720215, "global_step": 346555, "epoch": 4175} {"train_loss": -26.469879150390625, "global_step": 346556, "epoch": 4175} {"train_loss": -26.038549423217773, "global_step": 346557, "epoch": 4175} {"train_loss": -25.839282989501953, "global_step": 346558, "epoch": 4175} {"train_loss": -25.82546043395996, "global_step": 346559, "epoch": 4175} {"train_loss": -26.147598266601562, "global_step": 346560, "epoch": 4175} {"train_loss": -25.98195457458496, "global_step": 346561, "epoch": 4175} {"train_loss": -25.874908447265625, "global_step": 346562, "epoch": 4175} {"train_loss": -26.01555824279785, "global_step": 346563, "epoch": 4175} {"train_loss": -25.877826690673828, "global_step": 346564, "epoch": 4175} {"train_loss": -26.131784439086914, "global_step": 346565, "epoch": 4175} {"train_loss": -25.72539710998535, "global_step": 346566, "epoch": 4175} {"train_loss": -26.108814239501953, "global_step": 346567, "epoch": 4175} {"train_loss": -26.21335220336914, "global_step": 346568, "epoch": 4175} {"train_loss": -26.01169204711914, "global_step": 346569, "epoch": 4175} {"train_loss": -26.0533447265625, "global_step": 346570, "epoch": 4175} {"train_loss": -26.412214279174805, "global_step": 346571, "epoch": 4175} {"train_loss": -25.916248321533203, "global_step": 346572, "epoch": 4175} {"train_loss": -26.019315719604492, "global_step": 346573, "epoch": 4175} {"train_loss": -25.883045196533203, "global_step": 346574, "epoch": 4175} {"train_loss": -26.12384605407715, "global_step": 346575, "epoch": 4175} {"train_loss": -26.094043731689453, "global_step": 346576, "epoch": 4175} {"train_loss": -26.084869384765625, "global_step": 346577, "epoch": 4175} {"train_loss": -26.313322067260742, "global_step": 346578, "epoch": 4175} {"train_loss": -26.497150421142578, "global_step": 346579, "epoch": 4175} {"train_loss": -25.8691349029541, "global_step": 346580, "epoch": 4175} {"train_loss": -26.203886032104492, "global_step": 346581, "epoch": 4175} {"train_loss": -26.483179092407227, "global_step": 346582, "epoch": 4175} {"train_loss": -26.53139305114746, "global_step": 346583, "epoch": 4175} {"train_loss": -26.06552505493164, "global_step": 346584, "epoch": 4175} {"train_loss": -26.397418975830078, "global_step": 346585, "epoch": 4175} {"train_loss": -26.212528228759766, "global_step": 346586, "epoch": 4175} {"train_loss": -26.3663272857666, "global_step": 346587, "epoch": 4175} {"train_loss": -26.178363800048828, "global_step": 346588, "epoch": 4175} {"train_loss": -26.11452293395996, "global_step": 346589, "epoch": 4175} {"train_loss": -26.09744644165039, "global_step": 346590, "epoch": 4175} {"train_loss": -26.402374267578125, "global_step": 346591, "epoch": 4175} {"train_loss": -26.07105827331543, "global_step": 346592, "epoch": 4175} {"train_loss": -26.13922691345215, "global_step": 346593, "epoch": 4175} {"train_loss": -26.283849716186523, "global_step": 346594, "epoch": 4175} {"train_loss": -26.15435791015625, "global_step": 346595, "epoch": 4175} {"train_loss": -26.290796279907227, "global_step": 346596, "epoch": 4175} {"train_loss": -25.94196128845215, "global_step": 346597, "epoch": 4175} {"train_loss": -26.458951950073242, "global_step": 346598, "epoch": 4175} {"train_loss": -26.212316513061523, "global_step": 346599, "epoch": 4175} {"train_loss": -26.530029296875, "global_step": 346600, "epoch": 4175} {"train_loss": -26.327091217041016, "global_step": 346601, "epoch": 4175} {"train_loss": -26.372608184814453, "global_step": 346602, "epoch": 4175} {"train_loss": -26.6048583984375, "global_step": 346603, "epoch": 4175} {"train_loss": -26.22650718688965, "global_step": 346604, "epoch": 4175} {"train_loss": -26.300146102905273, "global_step": 346605, "epoch": 4175} {"train_loss": -26.567808151245117, "global_step": 346606, "epoch": 4175} {"train_loss": -26.031730743775885, "global_step": 346607, "epoch": 4175, "val_loss": 6553610.0} {"train_loss": -25.404834747314453, "global_step": 346608, "epoch": 4176} {"train_loss": -24.757246017456055, "global_step": 346609, "epoch": 4176} {"train_loss": -24.823776245117188, "global_step": 346610, "epoch": 4176} {"train_loss": -25.187213897705078, "global_step": 346611, "epoch": 4176} {"train_loss": -24.945585250854492, "global_step": 346612, "epoch": 4176} {"train_loss": -25.143985748291016, "global_step": 346613, "epoch": 4176} {"train_loss": -25.670185089111328, "global_step": 346614, "epoch": 4176} {"train_loss": -24.684738159179688, "global_step": 346615, "epoch": 4176} {"train_loss": -25.562040328979492, "global_step": 346616, "epoch": 4176} {"train_loss": -25.382328033447266, "global_step": 346617, "epoch": 4176} {"train_loss": -25.677515029907227, "global_step": 346618, "epoch": 4176} {"train_loss": -25.455860137939453, "global_step": 346619, "epoch": 4176} {"train_loss": -25.714643478393555, "global_step": 346620, "epoch": 4176} {"train_loss": -25.7269229888916, "global_step": 346621, "epoch": 4176} {"train_loss": -25.52267074584961, "global_step": 346622, "epoch": 4176} {"train_loss": -25.340118408203125, "global_step": 346623, "epoch": 4176} {"train_loss": -25.572599411010742, "global_step": 346624, "epoch": 4176} {"train_loss": -26.15738296508789, "global_step": 346625, "epoch": 4176} {"train_loss": -25.917041778564453, "global_step": 346626, "epoch": 4176} {"train_loss": -25.95366859436035, "global_step": 346627, "epoch": 4176} {"train_loss": -25.52100944519043, "global_step": 346628, "epoch": 4176} {"train_loss": -25.726911544799805, "global_step": 346629, "epoch": 4176} {"train_loss": -25.839277267456055, "global_step": 346630, "epoch": 4176} {"train_loss": -26.04825782775879, "global_step": 346631, "epoch": 4176} {"train_loss": -25.8360538482666, "global_step": 346632, "epoch": 4176} {"train_loss": -25.636981964111328, "global_step": 346633, "epoch": 4176} {"train_loss": -25.958173751831055, "global_step": 346634, "epoch": 4176} {"train_loss": -26.308258056640625, "global_step": 346635, "epoch": 4176} {"train_loss": -25.855152130126953, "global_step": 346636, "epoch": 4176} {"train_loss": -26.152902603149414, "global_step": 346637, "epoch": 4176} {"train_loss": -26.1639404296875, "global_step": 346638, "epoch": 4176} {"train_loss": -25.947101593017578, "global_step": 346639, "epoch": 4176} {"train_loss": -25.9617977142334, "global_step": 346640, "epoch": 4176} {"train_loss": -26.14373207092285, "global_step": 346641, "epoch": 4176} {"train_loss": -26.292816162109375, "global_step": 346642, "epoch": 4176} {"train_loss": -26.336668014526367, "global_step": 346643, "epoch": 4176} {"train_loss": -26.110864639282227, "global_step": 346644, "epoch": 4176} {"train_loss": -26.180814743041992, "global_step": 346645, "epoch": 4176} {"train_loss": -26.462507247924805, "global_step": 346646, "epoch": 4176} {"train_loss": -26.344085693359375, "global_step": 346647, "epoch": 4176} {"train_loss": -25.96575927734375, "global_step": 346648, "epoch": 4176} {"train_loss": -26.510517120361328, "global_step": 346649, "epoch": 4176} {"train_loss": -26.290002822875977, "global_step": 346650, "epoch": 4176} {"train_loss": -26.136083602905273, "global_step": 346651, "epoch": 4176} {"train_loss": -26.508865356445312, "global_step": 346652, "epoch": 4176} {"train_loss": -26.227041244506836, "global_step": 346653, "epoch": 4176} {"train_loss": -26.32499122619629, "global_step": 346654, "epoch": 4176} {"train_loss": -26.411224365234375, "global_step": 346655, "epoch": 4176} {"train_loss": -26.4001522064209, "global_step": 346656, "epoch": 4176} {"train_loss": -25.834272384643555, "global_step": 346657, "epoch": 4176} {"train_loss": -25.694232940673828, "global_step": 346658, "epoch": 4176} {"train_loss": -25.957677841186523, "global_step": 346659, "epoch": 4176} {"train_loss": -26.3698673248291, "global_step": 346660, "epoch": 4176} {"train_loss": -26.089923858642578, "global_step": 346661, "epoch": 4176} {"train_loss": -26.17178726196289, "global_step": 346662, "epoch": 4176} {"train_loss": -26.081893920898438, "global_step": 346663, "epoch": 4176} {"train_loss": -26.351892471313477, "global_step": 346664, "epoch": 4176} {"train_loss": -26.463830947875977, "global_step": 346665, "epoch": 4176} {"train_loss": -25.9649600982666, "global_step": 346666, "epoch": 4176} {"train_loss": -25.892099380493164, "global_step": 346667, "epoch": 4176} {"train_loss": -26.07196044921875, "global_step": 346668, "epoch": 4176} {"train_loss": -26.3662109375, "global_step": 346669, "epoch": 4176} {"train_loss": -26.378787994384766, "global_step": 346670, "epoch": 4176} {"train_loss": -26.413105010986328, "global_step": 346671, "epoch": 4176} {"train_loss": -26.132654190063477, "global_step": 346672, "epoch": 4176} {"train_loss": -25.84552001953125, "global_step": 346673, "epoch": 4176} {"train_loss": -25.672138214111328, "global_step": 346674, "epoch": 4176} {"train_loss": -26.103748321533203, "global_step": 346675, "epoch": 4176} {"train_loss": -25.97150993347168, "global_step": 346676, "epoch": 4176} {"train_loss": -25.652185440063477, "global_step": 346677, "epoch": 4176} {"train_loss": -25.85133171081543, "global_step": 346678, "epoch": 4176} {"train_loss": -25.9595947265625, "global_step": 346679, "epoch": 4176} {"train_loss": -26.29668617248535, "global_step": 346680, "epoch": 4176} {"train_loss": -25.568164825439453, "global_step": 346681, "epoch": 4176} {"train_loss": -26.17561912536621, "global_step": 346682, "epoch": 4176} {"train_loss": -26.110916137695312, "global_step": 346683, "epoch": 4176} {"train_loss": -25.825475692749023, "global_step": 346684, "epoch": 4176} {"train_loss": -26.03350830078125, "global_step": 346685, "epoch": 4176} {"train_loss": -26.236799240112305, "global_step": 346686, "epoch": 4176} {"train_loss": -26.214773178100586, "global_step": 346687, "epoch": 4176} {"train_loss": -26.043415069580078, "global_step": 346688, "epoch": 4176} {"train_loss": -26.012975692749023, "global_step": 346689, "epoch": 4176} {"train_loss": -25.934130220528107, "global_step": 346690, "epoch": 4176, "val_loss": 6574842.0} {"train_loss": -25.414838790893555, "global_step": 346691, "epoch": 4177} {"train_loss": -25.48175048828125, "global_step": 346692, "epoch": 4177} {"train_loss": -25.363868713378906, "global_step": 346693, "epoch": 4177} {"train_loss": -25.39982795715332, "global_step": 346694, "epoch": 4177} {"train_loss": -25.759973526000977, "global_step": 346695, "epoch": 4177} {"train_loss": -25.66615104675293, "global_step": 346696, "epoch": 4177} {"train_loss": -25.887609481811523, "global_step": 346697, "epoch": 4177} {"train_loss": -25.633819580078125, "global_step": 346698, "epoch": 4177} {"train_loss": -25.97039222717285, "global_step": 346699, "epoch": 4177} {"train_loss": -26.144943237304688, "global_step": 346700, "epoch": 4177} {"train_loss": -25.681961059570312, "global_step": 346701, "epoch": 4177} {"train_loss": -25.702529907226562, "global_step": 346702, "epoch": 4177} {"train_loss": -25.942901611328125, "global_step": 346703, "epoch": 4177} {"train_loss": -25.98028564453125, "global_step": 346704, "epoch": 4177} {"train_loss": -26.124494552612305, "global_step": 346705, "epoch": 4177} {"train_loss": -25.763748168945312, "global_step": 346706, "epoch": 4177} {"train_loss": -25.740589141845703, "global_step": 346707, "epoch": 4177} {"train_loss": -26.23772621154785, "global_step": 346708, "epoch": 4177} {"train_loss": -26.106048583984375, "global_step": 346709, "epoch": 4177} {"train_loss": -26.190515518188477, "global_step": 346710, "epoch": 4177} {"train_loss": -26.248188018798828, "global_step": 346711, "epoch": 4177} {"train_loss": -26.115034103393555, "global_step": 346712, "epoch": 4177} {"train_loss": -25.921911239624023, "global_step": 346713, "epoch": 4177} {"train_loss": -25.95086097717285, "global_step": 346714, "epoch": 4177} {"train_loss": -26.09317970275879, "global_step": 346715, "epoch": 4177} {"train_loss": -26.036191940307617, "global_step": 346716, "epoch": 4177} {"train_loss": -26.312137603759766, "global_step": 346717, "epoch": 4177} {"train_loss": -26.206912994384766, "global_step": 346718, "epoch": 4177} {"train_loss": -26.390796661376953, "global_step": 346719, "epoch": 4177} {"train_loss": -26.07404136657715, "global_step": 346720, "epoch": 4177} {"train_loss": -26.056867599487305, "global_step": 346721, "epoch": 4177} {"train_loss": -26.26405906677246, "global_step": 346722, "epoch": 4177} {"train_loss": -26.5615291595459, "global_step": 346723, "epoch": 4177} {"train_loss": -25.879621505737305, "global_step": 346724, "epoch": 4177} {"train_loss": -26.31003189086914, "global_step": 346725, "epoch": 4177} {"train_loss": -26.264612197875977, "global_step": 346726, "epoch": 4177} {"train_loss": -26.07098388671875, "global_step": 346727, "epoch": 4177} {"train_loss": -26.221771240234375, "global_step": 346728, "epoch": 4177} {"train_loss": -26.225744247436523, "global_step": 346729, "epoch": 4177} {"train_loss": -26.32672691345215, "global_step": 346730, "epoch": 4177} {"train_loss": -26.285022735595703, "global_step": 346731, "epoch": 4177} {"train_loss": -26.380390167236328, "global_step": 346732, "epoch": 4177} {"train_loss": -26.337186813354492, "global_step": 346733, "epoch": 4177} {"train_loss": -26.347501754760742, "global_step": 346734, "epoch": 4177} {"train_loss": -26.302001953125, "global_step": 346735, "epoch": 4177} {"train_loss": -26.316640853881836, "global_step": 346736, "epoch": 4177} {"train_loss": -26.374500274658203, "global_step": 346737, "epoch": 4177} {"train_loss": -26.081403732299805, "global_step": 346738, "epoch": 4177} {"train_loss": -26.459674835205078, "global_step": 346739, "epoch": 4177} {"train_loss": -26.5808048248291, "global_step": 346740, "epoch": 4177} {"train_loss": -26.19080924987793, "global_step": 346741, "epoch": 4177} {"train_loss": -26.1972713470459, "global_step": 346742, "epoch": 4177} {"train_loss": -26.292478561401367, "global_step": 346743, "epoch": 4177} {"train_loss": -26.383447647094727, "global_step": 346744, "epoch": 4177} {"train_loss": -26.31243896484375, "global_step": 346745, "epoch": 4177} {"train_loss": -26.1350154876709, "global_step": 346746, "epoch": 4177} {"train_loss": -26.175962448120117, "global_step": 346747, "epoch": 4177} {"train_loss": -26.2943115234375, "global_step": 346748, "epoch": 4177} {"train_loss": -26.1142520904541, "global_step": 346749, "epoch": 4177} {"train_loss": -26.247455596923828, "global_step": 346750, "epoch": 4177} {"train_loss": -26.03438377380371, "global_step": 346751, "epoch": 4177} {"train_loss": -26.08640480041504, "global_step": 346752, "epoch": 4177} {"train_loss": -25.777435302734375, "global_step": 346753, "epoch": 4177} {"train_loss": -25.91318130493164, "global_step": 346754, "epoch": 4177} {"train_loss": -25.775915145874023, "global_step": 346755, "epoch": 4177} {"train_loss": -25.380041122436523, "global_step": 346756, "epoch": 4177} {"train_loss": -26.077335357666016, "global_step": 346757, "epoch": 4177} {"train_loss": -26.507211685180664, "global_step": 346758, "epoch": 4177} {"train_loss": -26.0524845123291, "global_step": 346759, "epoch": 4177} {"train_loss": -25.813817977905273, "global_step": 346760, "epoch": 4177} {"train_loss": -25.53228187561035, "global_step": 346761, "epoch": 4177} {"train_loss": -25.682849884033203, "global_step": 346762, "epoch": 4177} {"train_loss": -25.989288330078125, "global_step": 346763, "epoch": 4177} {"train_loss": -26.0696964263916, "global_step": 346764, "epoch": 4177} {"train_loss": -26.16596031188965, "global_step": 346765, "epoch": 4177} {"train_loss": -26.273221969604492, "global_step": 346766, "epoch": 4177} {"train_loss": -25.6136417388916, "global_step": 346767, "epoch": 4177} {"train_loss": -25.915435791015625, "global_step": 346768, "epoch": 4177} {"train_loss": -26.234790802001953, "global_step": 346769, "epoch": 4177} {"train_loss": -26.04788589477539, "global_step": 346770, "epoch": 4177} {"train_loss": -26.5821590423584, "global_step": 346771, "epoch": 4177} {"train_loss": -26.42921257019043, "global_step": 346772, "epoch": 4177} {"train_loss": -26.051861636609917, "global_step": 346773, "epoch": 4177, "val_loss": 6565154.0} {"train_loss": -25.448352813720703, "global_step": 346774, "epoch": 4178} {"train_loss": -25.362985610961914, "global_step": 346775, "epoch": 4178} {"train_loss": -25.976476669311523, "global_step": 346776, "epoch": 4178} {"train_loss": -25.53597068786621, "global_step": 346777, "epoch": 4178} {"train_loss": -25.618234634399414, "global_step": 346778, "epoch": 4178} {"train_loss": -25.733673095703125, "global_step": 346779, "epoch": 4178} {"train_loss": -25.487192153930664, "global_step": 346780, "epoch": 4178} {"train_loss": -25.966787338256836, "global_step": 346781, "epoch": 4178} {"train_loss": -25.997098922729492, "global_step": 346782, "epoch": 4178} {"train_loss": -25.979719161987305, "global_step": 346783, "epoch": 4178} {"train_loss": -25.81342124938965, "global_step": 346784, "epoch": 4178} {"train_loss": -26.232975006103516, "global_step": 346785, "epoch": 4178} {"train_loss": -25.965925216674805, "global_step": 346786, "epoch": 4178} {"train_loss": -25.956073760986328, "global_step": 346787, "epoch": 4178} {"train_loss": -25.963903427124023, "global_step": 346788, "epoch": 4178} {"train_loss": -25.898839950561523, "global_step": 346789, "epoch": 4178} {"train_loss": -26.014944076538086, "global_step": 346790, "epoch": 4178} {"train_loss": -26.07892417907715, "global_step": 346791, "epoch": 4178} {"train_loss": -26.047204971313477, "global_step": 346792, "epoch": 4178} {"train_loss": -26.278369903564453, "global_step": 346793, "epoch": 4178} {"train_loss": -26.203516006469727, "global_step": 346794, "epoch": 4178} {"train_loss": -26.274139404296875, "global_step": 346795, "epoch": 4178} {"train_loss": -26.26226806640625, "global_step": 346796, "epoch": 4178} {"train_loss": -26.165578842163086, "global_step": 346797, "epoch": 4178} {"train_loss": -26.189910888671875, "global_step": 346798, "epoch": 4178} {"train_loss": -26.48321533203125, "global_step": 346799, "epoch": 4178} {"train_loss": -26.147985458374023, "global_step": 346800, "epoch": 4178} {"train_loss": -26.353240966796875, "global_step": 346801, "epoch": 4178} {"train_loss": -26.128677368164062, "global_step": 346802, "epoch": 4178} {"train_loss": -26.1575984954834, "global_step": 346803, "epoch": 4178} {"train_loss": -26.065139770507812, "global_step": 346804, "epoch": 4178} {"train_loss": -26.0804500579834, "global_step": 346805, "epoch": 4178} {"train_loss": -26.183530807495117, "global_step": 346806, "epoch": 4178} {"train_loss": -26.400232315063477, "global_step": 346807, "epoch": 4178} {"train_loss": -26.444334030151367, "global_step": 346808, "epoch": 4178} {"train_loss": -26.201831817626953, "global_step": 346809, "epoch": 4178} {"train_loss": -25.896650314331055, "global_step": 346810, "epoch": 4178} {"train_loss": -26.433130264282227, "global_step": 346811, "epoch": 4178} {"train_loss": -26.46204948425293, "global_step": 346812, "epoch": 4178} {"train_loss": -26.25028419494629, "global_step": 346813, "epoch": 4178} {"train_loss": -26.1359920501709, "global_step": 346814, "epoch": 4178} {"train_loss": -26.440439224243164, "global_step": 346815, "epoch": 4178} {"train_loss": -26.37386131286621, "global_step": 346816, "epoch": 4178} {"train_loss": -26.276792526245117, "global_step": 346817, "epoch": 4178} {"train_loss": -26.40667152404785, "global_step": 346818, "epoch": 4178} {"train_loss": -26.21303367614746, "global_step": 346819, "epoch": 4178} {"train_loss": -26.3615665435791, "global_step": 346820, "epoch": 4178} {"train_loss": -26.296131134033203, "global_step": 346821, "epoch": 4178} {"train_loss": -26.88468360900879, "global_step": 346822, "epoch": 4178} {"train_loss": -26.56125259399414, "global_step": 346823, "epoch": 4178} {"train_loss": -26.159765243530273, "global_step": 346824, "epoch": 4178} {"train_loss": -26.229467391967773, "global_step": 346825, "epoch": 4178} {"train_loss": -26.191299438476562, "global_step": 346826, "epoch": 4178} {"train_loss": -25.8136043548584, "global_step": 346827, "epoch": 4178} {"train_loss": -26.105737686157227, "global_step": 346828, "epoch": 4178} {"train_loss": -26.155323028564453, "global_step": 346829, "epoch": 4178} {"train_loss": -26.199783325195312, "global_step": 346830, "epoch": 4178} {"train_loss": -26.29570960998535, "global_step": 346831, "epoch": 4178} {"train_loss": -26.131000518798828, "global_step": 346832, "epoch": 4178} {"train_loss": -26.402027130126953, "global_step": 346833, "epoch": 4178} {"train_loss": -26.061986923217773, "global_step": 346834, "epoch": 4178} {"train_loss": -26.256549835205078, "global_step": 346835, "epoch": 4178} {"train_loss": -26.44561767578125, "global_step": 346836, "epoch": 4178} {"train_loss": -25.95013427734375, "global_step": 346837, "epoch": 4178} {"train_loss": -26.0079402923584, "global_step": 346838, "epoch": 4178} {"train_loss": -26.646100997924805, "global_step": 346839, "epoch": 4178} {"train_loss": -26.320478439331055, "global_step": 346840, "epoch": 4178} {"train_loss": -26.543476104736328, "global_step": 346841, "epoch": 4178} {"train_loss": -25.9769287109375, "global_step": 346842, "epoch": 4178} {"train_loss": -26.253143310546875, "global_step": 346843, "epoch": 4178} {"train_loss": -26.47825050354004, "global_step": 346844, "epoch": 4178} {"train_loss": -26.309309005737305, "global_step": 346845, "epoch": 4178} {"train_loss": -26.370370864868164, "global_step": 346846, "epoch": 4178} {"train_loss": -25.6630802154541, "global_step": 346847, "epoch": 4178} {"train_loss": -25.916894912719727, "global_step": 346848, "epoch": 4178} {"train_loss": -26.282882690429688, "global_step": 346849, "epoch": 4178} {"train_loss": -26.250211715698242, "global_step": 346850, "epoch": 4178} {"train_loss": -26.244592666625977, "global_step": 346851, "epoch": 4178} {"train_loss": -26.126195907592773, "global_step": 346852, "epoch": 4178} {"train_loss": -25.902929306030273, "global_step": 346853, "epoch": 4178} {"train_loss": -25.998661041259766, "global_step": 346854, "epoch": 4178} {"train_loss": -26.257413864135742, "global_step": 346855, "epoch": 4178} {"train_loss": -26.160539052572595, "global_step": 346856, "epoch": 4178, "val_loss": 6573714.0} {"train_loss": -25.838422775268555, "global_step": 346857, "epoch": 4179} {"train_loss": -25.54795265197754, "global_step": 346858, "epoch": 4179} {"train_loss": -25.72015380859375, "global_step": 346859, "epoch": 4179} {"train_loss": -25.752182006835938, "global_step": 346860, "epoch": 4179} {"train_loss": -25.673276901245117, "global_step": 346861, "epoch": 4179} {"train_loss": -25.956586837768555, "global_step": 346862, "epoch": 4179} {"train_loss": -26.31167984008789, "global_step": 346863, "epoch": 4179} {"train_loss": -25.613683700561523, "global_step": 346864, "epoch": 4179} {"train_loss": -25.5881404876709, "global_step": 346865, "epoch": 4179} {"train_loss": -26.5328369140625, "global_step": 346866, "epoch": 4179} {"train_loss": -26.002573013305664, "global_step": 346867, "epoch": 4179} {"train_loss": -26.02069664001465, "global_step": 346868, "epoch": 4179} {"train_loss": -26.12953758239746, "global_step": 346869, "epoch": 4179} {"train_loss": -25.953083038330078, "global_step": 346870, "epoch": 4179} {"train_loss": -26.0665340423584, "global_step": 346871, "epoch": 4179} {"train_loss": -26.19418716430664, "global_step": 346872, "epoch": 4179} {"train_loss": -26.083972930908203, "global_step": 346873, "epoch": 4179} {"train_loss": -26.305753707885742, "global_step": 346874, "epoch": 4179} {"train_loss": -26.3486385345459, "global_step": 346875, "epoch": 4179} {"train_loss": -26.106882095336914, "global_step": 346876, "epoch": 4179} {"train_loss": -26.100439071655273, "global_step": 346877, "epoch": 4179} {"train_loss": -26.010711669921875, "global_step": 346878, "epoch": 4179} {"train_loss": -26.27170753479004, "global_step": 346879, "epoch": 4179} {"train_loss": -26.423694610595703, "global_step": 346880, "epoch": 4179} {"train_loss": -26.34608268737793, "global_step": 346881, "epoch": 4179} {"train_loss": -26.0245304107666, "global_step": 346882, "epoch": 4179} {"train_loss": -26.131437301635742, "global_step": 346883, "epoch": 4179} {"train_loss": -25.980024337768555, "global_step": 346884, "epoch": 4179} {"train_loss": -26.278945922851562, "global_step": 346885, "epoch": 4179} {"train_loss": -26.023115158081055, "global_step": 346886, "epoch": 4179} {"train_loss": -25.470539093017578, "global_step": 346887, "epoch": 4179} {"train_loss": -26.062957763671875, "global_step": 346888, "epoch": 4179} {"train_loss": -25.751272201538086, "global_step": 346889, "epoch": 4179} {"train_loss": -25.85092544555664, "global_step": 346890, "epoch": 4179} {"train_loss": -26.132593154907227, "global_step": 346891, "epoch": 4179} {"train_loss": -26.03510093688965, "global_step": 346892, "epoch": 4179} {"train_loss": -26.206024169921875, "global_step": 346893, "epoch": 4179} {"train_loss": -25.865116119384766, "global_step": 346894, "epoch": 4179} {"train_loss": -26.379440307617188, "global_step": 346895, "epoch": 4179} {"train_loss": -25.860980987548828, "global_step": 346896, "epoch": 4179} {"train_loss": -26.139936447143555, "global_step": 346897, "epoch": 4179} {"train_loss": -26.055219650268555, "global_step": 346898, "epoch": 4179} {"train_loss": -26.437204360961914, "global_step": 346899, "epoch": 4179} {"train_loss": -25.91775894165039, "global_step": 346900, "epoch": 4179} {"train_loss": -26.25799560546875, "global_step": 346901, "epoch": 4179} {"train_loss": -26.397815704345703, "global_step": 346902, "epoch": 4179} {"train_loss": -25.966276168823242, "global_step": 346903, "epoch": 4179} {"train_loss": -26.64503288269043, "global_step": 346904, "epoch": 4179} {"train_loss": -26.563730239868164, "global_step": 346905, "epoch": 4179} {"train_loss": -26.076801300048828, "global_step": 346906, "epoch": 4179} {"train_loss": -26.0356502532959, "global_step": 346907, "epoch": 4179} {"train_loss": -26.098255157470703, "global_step": 346908, "epoch": 4179} {"train_loss": -26.320703506469727, "global_step": 346909, "epoch": 4179} {"train_loss": -26.220895767211914, "global_step": 346910, "epoch": 4179} {"train_loss": -26.523115158081055, "global_step": 346911, "epoch": 4179} {"train_loss": -26.007083892822266, "global_step": 346912, "epoch": 4179} {"train_loss": -25.81308364868164, "global_step": 346913, "epoch": 4179} {"train_loss": -25.594884872436523, "global_step": 346914, "epoch": 4179} {"train_loss": -26.14180564880371, "global_step": 346915, "epoch": 4179} {"train_loss": -26.078184127807617, "global_step": 346916, "epoch": 4179} {"train_loss": -25.853317260742188, "global_step": 346917, "epoch": 4179} {"train_loss": -26.077733993530273, "global_step": 346918, "epoch": 4179} {"train_loss": -25.74822425842285, "global_step": 346919, "epoch": 4179} {"train_loss": -26.01710319519043, "global_step": 346920, "epoch": 4179} {"train_loss": -26.224225997924805, "global_step": 346921, "epoch": 4179} {"train_loss": -26.098575592041016, "global_step": 346922, "epoch": 4179} {"train_loss": -25.682172775268555, "global_step": 346923, "epoch": 4179} {"train_loss": -26.266952514648438, "global_step": 346924, "epoch": 4179} {"train_loss": -26.297622680664062, "global_step": 346925, "epoch": 4179} {"train_loss": -26.3006534576416, "global_step": 346926, "epoch": 4179} {"train_loss": -25.9835262298584, "global_step": 346927, "epoch": 4179} {"train_loss": -26.326282501220703, "global_step": 346928, "epoch": 4179} {"train_loss": -26.232751846313477, "global_step": 346929, "epoch": 4179} {"train_loss": -26.124774932861328, "global_step": 346930, "epoch": 4179} {"train_loss": -26.181812286376953, "global_step": 346931, "epoch": 4179} {"train_loss": -26.173852920532227, "global_step": 346932, "epoch": 4179} {"train_loss": -26.40791893005371, "global_step": 346933, "epoch": 4179} {"train_loss": -26.048933029174805, "global_step": 346934, "epoch": 4179} {"train_loss": -26.481067657470703, "global_step": 346935, "epoch": 4179} {"train_loss": -26.253604888916016, "global_step": 346936, "epoch": 4179} {"train_loss": -26.267868041992188, "global_step": 346937, "epoch": 4179} {"train_loss": -26.167837142944336, "global_step": 346938, "epoch": 4179} {"train_loss": -26.089959983366082, "global_step": 346939, "epoch": 4179, "val_loss": 6630764.0} {"train_loss": -25.973356246948242, "global_step": 346940, "epoch": 4180} {"train_loss": -26.103137969970703, "global_step": 346941, "epoch": 4180} {"train_loss": -25.662866592407227, "global_step": 346942, "epoch": 4180} {"train_loss": -25.991910934448242, "global_step": 346943, "epoch": 4180} {"train_loss": -26.00152015686035, "global_step": 346944, "epoch": 4180} {"train_loss": -25.38120460510254, "global_step": 346945, "epoch": 4180} {"train_loss": -25.22974967956543, "global_step": 346946, "epoch": 4180} {"train_loss": -25.518400192260742, "global_step": 346947, "epoch": 4180} {"train_loss": -25.823156356811523, "global_step": 346948, "epoch": 4180} {"train_loss": -25.63483238220215, "global_step": 346949, "epoch": 4180} {"train_loss": -25.84528160095215, "global_step": 346950, "epoch": 4180} {"train_loss": -25.94001579284668, "global_step": 346951, "epoch": 4180} {"train_loss": -26.007431030273438, "global_step": 346952, "epoch": 4180} {"train_loss": -25.82489013671875, "global_step": 346953, "epoch": 4180} {"train_loss": -25.738269805908203, "global_step": 346954, "epoch": 4180} {"train_loss": -25.888290405273438, "global_step": 346955, "epoch": 4180} {"train_loss": -26.13579750061035, "global_step": 346956, "epoch": 4180} {"train_loss": -26.476892471313477, "global_step": 346957, "epoch": 4180} {"train_loss": -25.768903732299805, "global_step": 346958, "epoch": 4180} {"train_loss": -25.884368896484375, "global_step": 346959, "epoch": 4180} {"train_loss": -25.985279083251953, "global_step": 346960, "epoch": 4180} {"train_loss": -25.89019203186035, "global_step": 346961, "epoch": 4180} {"train_loss": -26.180280685424805, "global_step": 346962, "epoch": 4180} {"train_loss": -26.226917266845703, "global_step": 346963, "epoch": 4180} {"train_loss": -26.288837432861328, "global_step": 346964, "epoch": 4180} {"train_loss": -26.234638214111328, "global_step": 346965, "epoch": 4180} {"train_loss": -25.912073135375977, "global_step": 346966, "epoch": 4180} {"train_loss": -26.22926902770996, "global_step": 346967, "epoch": 4180} {"train_loss": -26.02083396911621, "global_step": 346968, "epoch": 4180} {"train_loss": -26.25526237487793, "global_step": 346969, "epoch": 4180} {"train_loss": -26.396299362182617, "global_step": 346970, "epoch": 4180} {"train_loss": -26.10573387145996, "global_step": 346971, "epoch": 4180} {"train_loss": -26.122533798217773, "global_step": 346972, "epoch": 4180} {"train_loss": -26.394031524658203, "global_step": 346973, "epoch": 4180} {"train_loss": -26.145633697509766, "global_step": 346974, "epoch": 4180} {"train_loss": -26.303796768188477, "global_step": 346975, "epoch": 4180} {"train_loss": -26.2242374420166, "global_step": 346976, "epoch": 4180} {"train_loss": -26.266326904296875, "global_step": 346977, "epoch": 4180} {"train_loss": -26.37811851501465, "global_step": 346978, "epoch": 4180} {"train_loss": -26.23373794555664, "global_step": 346979, "epoch": 4180} {"train_loss": -26.427152633666992, "global_step": 346980, "epoch": 4180} {"train_loss": -26.364225387573242, "global_step": 346981, "epoch": 4180} {"train_loss": -26.513097763061523, "global_step": 346982, "epoch": 4180} {"train_loss": -26.281784057617188, "global_step": 346983, "epoch": 4180} {"train_loss": -26.33009147644043, "global_step": 346984, "epoch": 4180} {"train_loss": -26.338550567626953, "global_step": 346985, "epoch": 4180} {"train_loss": -26.265851974487305, "global_step": 346986, "epoch": 4180} {"train_loss": -26.428211212158203, "global_step": 346987, "epoch": 4180} {"train_loss": -25.84368896484375, "global_step": 346988, "epoch": 4180} {"train_loss": -25.94679069519043, "global_step": 346989, "epoch": 4180} {"train_loss": -26.45130729675293, "global_step": 346990, "epoch": 4180} {"train_loss": -26.587411880493164, "global_step": 346991, "epoch": 4180} {"train_loss": -26.02223014831543, "global_step": 346992, "epoch": 4180} {"train_loss": -26.03814125061035, "global_step": 346993, "epoch": 4180} {"train_loss": -26.118173599243164, "global_step": 346994, "epoch": 4180} {"train_loss": -26.604007720947266, "global_step": 346995, "epoch": 4180} {"train_loss": -26.15357780456543, "global_step": 346996, "epoch": 4180} {"train_loss": -25.918161392211914, "global_step": 346997, "epoch": 4180} {"train_loss": -25.596158981323242, "global_step": 346998, "epoch": 4180} {"train_loss": -25.930850982666016, "global_step": 346999, "epoch": 4180} {"train_loss": -25.84514808654785, "global_step": 347000, "epoch": 4180} {"train_loss": -26.208648681640625, "global_step": 347001, "epoch": 4180} {"train_loss": -26.265151977539062, "global_step": 347002, "epoch": 4180} {"train_loss": -26.297346115112305, "global_step": 347003, "epoch": 4180} {"train_loss": -26.019399642944336, "global_step": 347004, "epoch": 4180} {"train_loss": -25.82996940612793, "global_step": 347005, "epoch": 4180} {"train_loss": -26.326919555664062, "global_step": 347006, "epoch": 4180} {"train_loss": -26.17975425720215, "global_step": 347007, "epoch": 4180} {"train_loss": -26.358062744140625, "global_step": 347008, "epoch": 4180} {"train_loss": -26.660430908203125, "global_step": 347009, "epoch": 4180} {"train_loss": -25.973636627197266, "global_step": 347010, "epoch": 4180} {"train_loss": -25.87933349609375, "global_step": 347011, "epoch": 4180} {"train_loss": -25.937124252319336, "global_step": 347012, "epoch": 4180} {"train_loss": -26.153635025024414, "global_step": 347013, "epoch": 4180} {"train_loss": -26.193145751953125, "global_step": 347014, "epoch": 4180} {"train_loss": -26.020004272460938, "global_step": 347015, "epoch": 4180} {"train_loss": -25.853490829467773, "global_step": 347016, "epoch": 4180} {"train_loss": -25.907489776611328, "global_step": 347017, "epoch": 4180} {"train_loss": -26.308252334594727, "global_step": 347018, "epoch": 4180} {"train_loss": -26.443044662475586, "global_step": 347019, "epoch": 4180} {"train_loss": -25.728500366210938, "global_step": 347020, "epoch": 4180} {"train_loss": -26.284921646118164, "global_step": 347021, "epoch": 4180} {"train_loss": -26.081437145371034, "global_step": 347022, "epoch": 4180, "val_loss": 6577523.0} {"train_loss": -25.481779098510742, "global_step": 347023, "epoch": 4181} {"train_loss": -25.55849266052246, "global_step": 347024, "epoch": 4181} {"train_loss": -25.742029190063477, "global_step": 347025, "epoch": 4181} {"train_loss": -25.80165672302246, "global_step": 347026, "epoch": 4181} {"train_loss": -25.77387809753418, "global_step": 347027, "epoch": 4181} {"train_loss": -26.079450607299805, "global_step": 347028, "epoch": 4181} {"train_loss": -26.190887451171875, "global_step": 347029, "epoch": 4181} {"train_loss": -26.155475616455078, "global_step": 347030, "epoch": 4181} {"train_loss": -26.43544578552246, "global_step": 347031, "epoch": 4181} {"train_loss": -25.960529327392578, "global_step": 347032, "epoch": 4181} {"train_loss": -26.425750732421875, "global_step": 347033, "epoch": 4181} {"train_loss": -25.780990600585938, "global_step": 347034, "epoch": 4181} {"train_loss": -25.7277774810791, "global_step": 347035, "epoch": 4181} {"train_loss": -26.072711944580078, "global_step": 347036, "epoch": 4181} {"train_loss": -26.122852325439453, "global_step": 347037, "epoch": 4181} {"train_loss": -26.25347328186035, "global_step": 347038, "epoch": 4181} {"train_loss": -25.970361709594727, "global_step": 347039, "epoch": 4181} {"train_loss": -26.11411476135254, "global_step": 347040, "epoch": 4181} {"train_loss": -26.212060928344727, "global_step": 347041, "epoch": 4181} {"train_loss": -26.238195419311523, "global_step": 347042, "epoch": 4181} {"train_loss": -26.120166778564453, "global_step": 347043, "epoch": 4181} {"train_loss": -25.946393966674805, "global_step": 347044, "epoch": 4181} {"train_loss": -26.13285255432129, "global_step": 347045, "epoch": 4181} {"train_loss": -26.2509708404541, "global_step": 347046, "epoch": 4181} {"train_loss": -26.36671257019043, "global_step": 347047, "epoch": 4181} {"train_loss": -26.30208396911621, "global_step": 347048, "epoch": 4181} {"train_loss": -25.77570152282715, "global_step": 347049, "epoch": 4181} {"train_loss": -26.30547523498535, "global_step": 347050, "epoch": 4181} {"train_loss": -26.327360153198242, "global_step": 347051, "epoch": 4181} {"train_loss": -26.601886749267578, "global_step": 347052, "epoch": 4181} {"train_loss": -25.850854873657227, "global_step": 347053, "epoch": 4181} {"train_loss": -26.2697696685791, "global_step": 347054, "epoch": 4181} {"train_loss": -25.723718643188477, "global_step": 347055, "epoch": 4181} {"train_loss": -26.348087310791016, "global_step": 347056, "epoch": 4181} {"train_loss": -26.227811813354492, "global_step": 347057, "epoch": 4181} {"train_loss": -26.368854522705078, "global_step": 347058, "epoch": 4181} {"train_loss": -26.164642333984375, "global_step": 347059, "epoch": 4181} {"train_loss": -26.55620765686035, "global_step": 347060, "epoch": 4181} {"train_loss": -26.22528076171875, "global_step": 347061, "epoch": 4181} {"train_loss": -26.506122589111328, "global_step": 347062, "epoch": 4181} {"train_loss": -25.832763671875, "global_step": 347063, "epoch": 4181} {"train_loss": -25.91839027404785, "global_step": 347064, "epoch": 4181} {"train_loss": -25.586299896240234, "global_step": 347065, "epoch": 4181} {"train_loss": -25.6241512298584, "global_step": 347066, "epoch": 4181} {"train_loss": -26.113758087158203, "global_step": 347067, "epoch": 4181} {"train_loss": -25.736249923706055, "global_step": 347068, "epoch": 4181} {"train_loss": -25.873456954956055, "global_step": 347069, "epoch": 4181} {"train_loss": -25.994070053100586, "global_step": 347070, "epoch": 4181} {"train_loss": -25.468517303466797, "global_step": 347071, "epoch": 4181} {"train_loss": -26.235382080078125, "global_step": 347072, "epoch": 4181} {"train_loss": -25.96881675720215, "global_step": 347073, "epoch": 4181} {"train_loss": -26.277179718017578, "global_step": 347074, "epoch": 4181} {"train_loss": -26.178241729736328, "global_step": 347075, "epoch": 4181} {"train_loss": -25.9440860748291, "global_step": 347076, "epoch": 4181} {"train_loss": -25.72211265563965, "global_step": 347077, "epoch": 4181} {"train_loss": -26.12409782409668, "global_step": 347078, "epoch": 4181} {"train_loss": -26.154870986938477, "global_step": 347079, "epoch": 4181} {"train_loss": -25.961511611938477, "global_step": 347080, "epoch": 4181} {"train_loss": -25.9014835357666, "global_step": 347081, "epoch": 4181} {"train_loss": -25.76066017150879, "global_step": 347082, "epoch": 4181} {"train_loss": -26.12247657775879, "global_step": 347083, "epoch": 4181} {"train_loss": -26.40374183654785, "global_step": 347084, "epoch": 4181} {"train_loss": -25.946380615234375, "global_step": 347085, "epoch": 4181} {"train_loss": -25.904027938842773, "global_step": 347086, "epoch": 4181} {"train_loss": -25.9006290435791, "global_step": 347087, "epoch": 4181} {"train_loss": -26.17815589904785, "global_step": 347088, "epoch": 4181} {"train_loss": -26.102432250976562, "global_step": 347089, "epoch": 4181} {"train_loss": -26.229278564453125, "global_step": 347090, "epoch": 4181} {"train_loss": -26.06689453125, "global_step": 347091, "epoch": 4181} {"train_loss": -26.12342643737793, "global_step": 347092, "epoch": 4181} {"train_loss": -26.351226806640625, "global_step": 347093, "epoch": 4181} {"train_loss": -25.905139923095703, "global_step": 347094, "epoch": 4181} {"train_loss": -26.217105865478516, "global_step": 347095, "epoch": 4181} {"train_loss": -26.025625228881836, "global_step": 347096, "epoch": 4181} {"train_loss": -26.3670711517334, "global_step": 347097, "epoch": 4181} {"train_loss": -25.99380874633789, "global_step": 347098, "epoch": 4181} {"train_loss": -25.9506893157959, "global_step": 347099, "epoch": 4181} {"train_loss": -26.164335250854492, "global_step": 347100, "epoch": 4181} {"train_loss": -26.468338012695312, "global_step": 347101, "epoch": 4181} {"train_loss": -26.420541763305664, "global_step": 347102, "epoch": 4181} {"train_loss": -26.262470245361328, "global_step": 347103, "epoch": 4181} {"train_loss": -26.108753204345703, "global_step": 347104, "epoch": 4181} {"train_loss": -26.060513668749707, "global_step": 347105, "epoch": 4181, "val_loss": 6606992.0} {"train_loss": -25.52615737915039, "global_step": 347106, "epoch": 4182} {"train_loss": -25.074071884155273, "global_step": 347107, "epoch": 4182} {"train_loss": -25.84099769592285, "global_step": 347108, "epoch": 4182} {"train_loss": -25.341833114624023, "global_step": 347109, "epoch": 4182} {"train_loss": -25.598190307617188, "global_step": 347110, "epoch": 4182} {"train_loss": -25.591094970703125, "global_step": 347111, "epoch": 4182} {"train_loss": -25.843732833862305, "global_step": 347112, "epoch": 4182} {"train_loss": -26.227279663085938, "global_step": 347113, "epoch": 4182} {"train_loss": -25.756933212280273, "global_step": 347114, "epoch": 4182} {"train_loss": -25.557947158813477, "global_step": 347115, "epoch": 4182} {"train_loss": -25.91704750061035, "global_step": 347116, "epoch": 4182} {"train_loss": -25.71445083618164, "global_step": 347117, "epoch": 4182} {"train_loss": -26.08149528503418, "global_step": 347118, "epoch": 4182} {"train_loss": -25.67246437072754, "global_step": 347119, "epoch": 4182} {"train_loss": -25.97486686706543, "global_step": 347120, "epoch": 4182} {"train_loss": -26.31028175354004, "global_step": 347121, "epoch": 4182} {"train_loss": -26.031965255737305, "global_step": 347122, "epoch": 4182} {"train_loss": -26.28899574279785, "global_step": 347123, "epoch": 4182} {"train_loss": -25.784255981445312, "global_step": 347124, "epoch": 4182} {"train_loss": -26.069751739501953, "global_step": 347125, "epoch": 4182} {"train_loss": -26.242691040039062, "global_step": 347126, "epoch": 4182} {"train_loss": -26.097522735595703, "global_step": 347127, "epoch": 4182} {"train_loss": -25.6859188079834, "global_step": 347128, "epoch": 4182} {"train_loss": -26.234853744506836, "global_step": 347129, "epoch": 4182} {"train_loss": -25.99811363220215, "global_step": 347130, "epoch": 4182} {"train_loss": -26.124048233032227, "global_step": 347131, "epoch": 4182} {"train_loss": -26.072223663330078, "global_step": 347132, "epoch": 4182} {"train_loss": -26.172149658203125, "global_step": 347133, "epoch": 4182} {"train_loss": -26.319751739501953, "global_step": 347134, "epoch": 4182} {"train_loss": -25.976211547851562, "global_step": 347135, "epoch": 4182} {"train_loss": -26.211233139038086, "global_step": 347136, "epoch": 4182} {"train_loss": -25.801712036132812, "global_step": 347137, "epoch": 4182} {"train_loss": -26.062856674194336, "global_step": 347138, "epoch": 4182} {"train_loss": -26.19965934753418, "global_step": 347139, "epoch": 4182} {"train_loss": -26.276935577392578, "global_step": 347140, "epoch": 4182} {"train_loss": -25.96649742126465, "global_step": 347141, "epoch": 4182} {"train_loss": -26.143842697143555, "global_step": 347142, "epoch": 4182} {"train_loss": -26.3922061920166, "global_step": 347143, "epoch": 4182} {"train_loss": -26.17905616760254, "global_step": 347144, "epoch": 4182} {"train_loss": -26.273656845092773, "global_step": 347145, "epoch": 4182} {"train_loss": -26.3162784576416, "global_step": 347146, "epoch": 4182} {"train_loss": -26.170612335205078, "global_step": 347147, "epoch": 4182} {"train_loss": -26.42755699157715, "global_step": 347148, "epoch": 4182} {"train_loss": -26.31854248046875, "global_step": 347149, "epoch": 4182} {"train_loss": -26.198383331298828, "global_step": 347150, "epoch": 4182} {"train_loss": -26.4357852935791, "global_step": 347151, "epoch": 4182} {"train_loss": -26.32634925842285, "global_step": 347152, "epoch": 4182} {"train_loss": -26.43060302734375, "global_step": 347153, "epoch": 4182} {"train_loss": -26.514236450195312, "global_step": 347154, "epoch": 4182} {"train_loss": -26.172657012939453, "global_step": 347155, "epoch": 4182} {"train_loss": -26.3333683013916, "global_step": 347156, "epoch": 4182} {"train_loss": -26.410877227783203, "global_step": 347157, "epoch": 4182} {"train_loss": -26.358617782592773, "global_step": 347158, "epoch": 4182} {"train_loss": -26.31355094909668, "global_step": 347159, "epoch": 4182} {"train_loss": -26.080249786376953, "global_step": 347160, "epoch": 4182} {"train_loss": -26.38498878479004, "global_step": 347161, "epoch": 4182} {"train_loss": -26.638229370117188, "global_step": 347162, "epoch": 4182} {"train_loss": -26.353561401367188, "global_step": 347163, "epoch": 4182} {"train_loss": -26.02386474609375, "global_step": 347164, "epoch": 4182} {"train_loss": -25.791492462158203, "global_step": 347165, "epoch": 4182} {"train_loss": -25.803186416625977, "global_step": 347166, "epoch": 4182} {"train_loss": -26.045013427734375, "global_step": 347167, "epoch": 4182} {"train_loss": -26.006616592407227, "global_step": 347168, "epoch": 4182} {"train_loss": -25.835208892822266, "global_step": 347169, "epoch": 4182} {"train_loss": -26.294952392578125, "global_step": 347170, "epoch": 4182} {"train_loss": -25.93745231628418, "global_step": 347171, "epoch": 4182} {"train_loss": -26.181238174438477, "global_step": 347172, "epoch": 4182} {"train_loss": -25.975208282470703, "global_step": 347173, "epoch": 4182} {"train_loss": -25.910053253173828, "global_step": 347174, "epoch": 4182} {"train_loss": -25.885181427001953, "global_step": 347175, "epoch": 4182} {"train_loss": -26.407567977905273, "global_step": 347176, "epoch": 4182} {"train_loss": -26.492218017578125, "global_step": 347177, "epoch": 4182} {"train_loss": -26.252573013305664, "global_step": 347178, "epoch": 4182} {"train_loss": -26.259033203125, "global_step": 347179, "epoch": 4182} {"train_loss": -26.1715145111084, "global_step": 347180, "epoch": 4182} {"train_loss": -26.170358657836914, "global_step": 347181, "epoch": 4182} {"train_loss": -26.349523544311523, "global_step": 347182, "epoch": 4182} {"train_loss": -26.054676055908203, "global_step": 347183, "epoch": 4182} {"train_loss": -25.973844528198242, "global_step": 347184, "epoch": 4182} {"train_loss": -26.129261016845703, "global_step": 347185, "epoch": 4182} {"train_loss": -26.355825424194336, "global_step": 347186, "epoch": 4182} {"train_loss": -26.147619247436523, "global_step": 347187, "epoch": 4182} {"train_loss": -26.08700897032956, "global_step": 347188, "epoch": 4182, "val_loss": 6598489.0} {"train_loss": -25.422399520874023, "global_step": 347189, "epoch": 4183} {"train_loss": -25.77703285217285, "global_step": 347190, "epoch": 4183} {"train_loss": -25.038463592529297, "global_step": 347191, "epoch": 4183} {"train_loss": -25.153268814086914, "global_step": 347192, "epoch": 4183} {"train_loss": -25.373422622680664, "global_step": 347193, "epoch": 4183} {"train_loss": -25.533536911010742, "global_step": 347194, "epoch": 4183} {"train_loss": -25.530019760131836, "global_step": 347195, "epoch": 4183} {"train_loss": -25.44296646118164, "global_step": 347196, "epoch": 4183} {"train_loss": -25.748001098632812, "global_step": 347197, "epoch": 4183} {"train_loss": -25.911273956298828, "global_step": 347198, "epoch": 4183} {"train_loss": -25.235321044921875, "global_step": 347199, "epoch": 4183} {"train_loss": -25.74517250061035, "global_step": 347200, "epoch": 4183} {"train_loss": -26.052770614624023, "global_step": 347201, "epoch": 4183} {"train_loss": -25.818119049072266, "global_step": 347202, "epoch": 4183} {"train_loss": -25.688074111938477, "global_step": 347203, "epoch": 4183} {"train_loss": -25.588550567626953, "global_step": 347204, "epoch": 4183} {"train_loss": -25.912851333618164, "global_step": 347205, "epoch": 4183} {"train_loss": -25.665817260742188, "global_step": 347206, "epoch": 4183} {"train_loss": -26.108978271484375, "global_step": 347207, "epoch": 4183} {"train_loss": -25.79298210144043, "global_step": 347208, "epoch": 4183} {"train_loss": -25.956857681274414, "global_step": 347209, "epoch": 4183} {"train_loss": -25.461933135986328, "global_step": 347210, "epoch": 4183} {"train_loss": -25.80027198791504, "global_step": 347211, "epoch": 4183} {"train_loss": -25.977529525756836, "global_step": 347212, "epoch": 4183} {"train_loss": -26.0105037689209, "global_step": 347213, "epoch": 4183} {"train_loss": -25.944843292236328, "global_step": 347214, "epoch": 4183} {"train_loss": -26.23024559020996, "global_step": 347215, "epoch": 4183} {"train_loss": -25.8406982421875, "global_step": 347216, "epoch": 4183} {"train_loss": -25.995038986206055, "global_step": 347217, "epoch": 4183} {"train_loss": -26.11441993713379, "global_step": 347218, "epoch": 4183} {"train_loss": -25.731781005859375, "global_step": 347219, "epoch": 4183} {"train_loss": -26.21314811706543, "global_step": 347220, "epoch": 4183} {"train_loss": -26.622182846069336, "global_step": 347221, "epoch": 4183} {"train_loss": -25.94742202758789, "global_step": 347222, "epoch": 4183} {"train_loss": -26.3305606842041, "global_step": 347223, "epoch": 4183} {"train_loss": -26.5919189453125, "global_step": 347224, "epoch": 4183} {"train_loss": -25.930322647094727, "global_step": 347225, "epoch": 4183} {"train_loss": -26.32895278930664, "global_step": 347226, "epoch": 4183} {"train_loss": -26.072988510131836, "global_step": 347227, "epoch": 4183} {"train_loss": -26.5826358795166, "global_step": 347228, "epoch": 4183} {"train_loss": -26.196731567382812, "global_step": 347229, "epoch": 4183} {"train_loss": -26.05170249938965, "global_step": 347230, "epoch": 4183} {"train_loss": -26.206205368041992, "global_step": 347231, "epoch": 4183} {"train_loss": -26.122116088867188, "global_step": 347232, "epoch": 4183} {"train_loss": -25.80124282836914, "global_step": 347233, "epoch": 4183} {"train_loss": -26.407262802124023, "global_step": 347234, "epoch": 4183} {"train_loss": -26.182180404663086, "global_step": 347235, "epoch": 4183} {"train_loss": -26.07779884338379, "global_step": 347236, "epoch": 4183} {"train_loss": -26.384841918945312, "global_step": 347237, "epoch": 4183} {"train_loss": -26.018911361694336, "global_step": 347238, "epoch": 4183} {"train_loss": -25.970306396484375, "global_step": 347239, "epoch": 4183} {"train_loss": -26.325942993164062, "global_step": 347240, "epoch": 4183} {"train_loss": -26.15186882019043, "global_step": 347241, "epoch": 4183} {"train_loss": -26.369733810424805, "global_step": 347242, "epoch": 4183} {"train_loss": -26.526111602783203, "global_step": 347243, "epoch": 4183} {"train_loss": -26.2076416015625, "global_step": 347244, "epoch": 4183} {"train_loss": -26.67555046081543, "global_step": 347245, "epoch": 4183} {"train_loss": -26.036518096923828, "global_step": 347246, "epoch": 4183} {"train_loss": -26.064538955688477, "global_step": 347247, "epoch": 4183} {"train_loss": -26.476255416870117, "global_step": 347248, "epoch": 4183} {"train_loss": -26.145416259765625, "global_step": 347249, "epoch": 4183} {"train_loss": -26.262903213500977, "global_step": 347250, "epoch": 4183} {"train_loss": -26.153573989868164, "global_step": 347251, "epoch": 4183} {"train_loss": -26.39606285095215, "global_step": 347252, "epoch": 4183} {"train_loss": -26.0933895111084, "global_step": 347253, "epoch": 4183} {"train_loss": -26.05219078063965, "global_step": 347254, "epoch": 4183} {"train_loss": -25.89828872680664, "global_step": 347255, "epoch": 4183} {"train_loss": -26.236413955688477, "global_step": 347256, "epoch": 4183} {"train_loss": -25.694604873657227, "global_step": 347257, "epoch": 4183} {"train_loss": -25.4995174407959, "global_step": 347258, "epoch": 4183} {"train_loss": -25.173757553100586, "global_step": 347259, "epoch": 4183} {"train_loss": -25.83664321899414, "global_step": 347260, "epoch": 4183} {"train_loss": -26.164443969726562, "global_step": 347261, "epoch": 4183} {"train_loss": -26.045856475830078, "global_step": 347262, "epoch": 4183} {"train_loss": -25.932373046875, "global_step": 347263, "epoch": 4183} {"train_loss": -25.75005531311035, "global_step": 347264, "epoch": 4183} {"train_loss": -26.4982967376709, "global_step": 347265, "epoch": 4183} {"train_loss": -26.034473419189453, "global_step": 347266, "epoch": 4183} {"train_loss": -25.799283981323242, "global_step": 347267, "epoch": 4183} {"train_loss": -25.799152374267578, "global_step": 347268, "epoch": 4183} {"train_loss": -26.51020622253418, "global_step": 347269, "epoch": 4183} {"train_loss": -26.382421493530273, "global_step": 347270, "epoch": 4183} {"train_loss": -25.99021162469703, "global_step": 347271, "epoch": 4183, "val_loss": 6618904.0} {"train_loss": -26.067047119140625, "global_step": 347272, "epoch": 4184} {"train_loss": -25.786956787109375, "global_step": 347273, "epoch": 4184} {"train_loss": -25.829730987548828, "global_step": 347274, "epoch": 4184} {"train_loss": -25.993534088134766, "global_step": 347275, "epoch": 4184} {"train_loss": -25.868253707885742, "global_step": 347276, "epoch": 4184} {"train_loss": -26.23404312133789, "global_step": 347277, "epoch": 4184} {"train_loss": -25.96510124206543, "global_step": 347278, "epoch": 4184} {"train_loss": -26.091238021850586, "global_step": 347279, "epoch": 4184} {"train_loss": -25.8697509765625, "global_step": 347280, "epoch": 4184} {"train_loss": -25.830677032470703, "global_step": 347281, "epoch": 4184} {"train_loss": -25.8968448638916, "global_step": 347282, "epoch": 4184} {"train_loss": -25.94056510925293, "global_step": 347283, "epoch": 4184} {"train_loss": -26.278858184814453, "global_step": 347284, "epoch": 4184} {"train_loss": -26.135168075561523, "global_step": 347285, "epoch": 4184} {"train_loss": -25.872161865234375, "global_step": 347286, "epoch": 4184} {"train_loss": -26.387073516845703, "global_step": 347287, "epoch": 4184} {"train_loss": -26.24204444885254, "global_step": 347288, "epoch": 4184} {"train_loss": -25.980300903320312, "global_step": 347289, "epoch": 4184} {"train_loss": -25.968795776367188, "global_step": 347290, "epoch": 4184} {"train_loss": -26.44394874572754, "global_step": 347291, "epoch": 4184} {"train_loss": -26.2557315826416, "global_step": 347292, "epoch": 4184} {"train_loss": -26.19795036315918, "global_step": 347293, "epoch": 4184} {"train_loss": -26.18648338317871, "global_step": 347294, "epoch": 4184} {"train_loss": -26.22774314880371, "global_step": 347295, "epoch": 4184} {"train_loss": -26.509092330932617, "global_step": 347296, "epoch": 4184} {"train_loss": -26.078176498413086, "global_step": 347297, "epoch": 4184} {"train_loss": -26.354928970336914, "global_step": 347298, "epoch": 4184} {"train_loss": -26.328779220581055, "global_step": 347299, "epoch": 4184} {"train_loss": -26.51801109313965, "global_step": 347300, "epoch": 4184} {"train_loss": -26.262338638305664, "global_step": 347301, "epoch": 4184} {"train_loss": -26.027719497680664, "global_step": 347302, "epoch": 4184} {"train_loss": -26.20001792907715, "global_step": 347303, "epoch": 4184} {"train_loss": -26.209949493408203, "global_step": 347304, "epoch": 4184} {"train_loss": -26.549665451049805, "global_step": 347305, "epoch": 4184} {"train_loss": -26.150049209594727, "global_step": 347306, "epoch": 4184} {"train_loss": -26.1296329498291, "global_step": 347307, "epoch": 4184} {"train_loss": -26.456586837768555, "global_step": 347308, "epoch": 4184} {"train_loss": -26.246252059936523, "global_step": 347309, "epoch": 4184} {"train_loss": -26.338764190673828, "global_step": 347310, "epoch": 4184} {"train_loss": -26.275060653686523, "global_step": 347311, "epoch": 4184} {"train_loss": -25.996496200561523, "global_step": 347312, "epoch": 4184} {"train_loss": -26.95966911315918, "global_step": 347313, "epoch": 4184} {"train_loss": -26.41175651550293, "global_step": 347314, "epoch": 4184} {"train_loss": -26.300189971923828, "global_step": 347315, "epoch": 4184} {"train_loss": -26.411184310913086, "global_step": 347316, "epoch": 4184} {"train_loss": -26.2741641998291, "global_step": 347317, "epoch": 4184} {"train_loss": -26.57330322265625, "global_step": 347318, "epoch": 4184} {"train_loss": -26.164859771728516, "global_step": 347319, "epoch": 4184} {"train_loss": -25.97430419921875, "global_step": 347320, "epoch": 4184} {"train_loss": -26.20685386657715, "global_step": 347321, "epoch": 4184} {"train_loss": -26.116607666015625, "global_step": 347322, "epoch": 4184} {"train_loss": -26.283618927001953, "global_step": 347323, "epoch": 4184} {"train_loss": -26.132965087890625, "global_step": 347324, "epoch": 4184} {"train_loss": -25.84662437438965, "global_step": 347325, "epoch": 4184} {"train_loss": -25.592809677124023, "global_step": 347326, "epoch": 4184} {"train_loss": -25.008865356445312, "global_step": 347327, "epoch": 4184} {"train_loss": -25.858600616455078, "global_step": 347328, "epoch": 4184} {"train_loss": -26.194555282592773, "global_step": 347329, "epoch": 4184} {"train_loss": -26.196319580078125, "global_step": 347330, "epoch": 4184} {"train_loss": -26.01806640625, "global_step": 347331, "epoch": 4184} {"train_loss": -26.077177047729492, "global_step": 347332, "epoch": 4184} {"train_loss": -26.227872848510742, "global_step": 347333, "epoch": 4184} {"train_loss": -26.630126953125, "global_step": 347334, "epoch": 4184} {"train_loss": -26.161569595336914, "global_step": 347335, "epoch": 4184} {"train_loss": -26.0505428314209, "global_step": 347336, "epoch": 4184} {"train_loss": -26.299762725830078, "global_step": 347337, "epoch": 4184} {"train_loss": -26.155487060546875, "global_step": 347338, "epoch": 4184} {"train_loss": -26.15669059753418, "global_step": 347339, "epoch": 4184} {"train_loss": -26.434982299804688, "global_step": 347340, "epoch": 4184} {"train_loss": -26.1898250579834, "global_step": 347341, "epoch": 4184} {"train_loss": -26.009693145751953, "global_step": 347342, "epoch": 4184} {"train_loss": -26.275537490844727, "global_step": 347343, "epoch": 4184} {"train_loss": -25.934057235717773, "global_step": 347344, "epoch": 4184} {"train_loss": -26.16326904296875, "global_step": 347345, "epoch": 4184} {"train_loss": -26.19846534729004, "global_step": 347346, "epoch": 4184} {"train_loss": -26.153268814086914, "global_step": 347347, "epoch": 4184} {"train_loss": -26.08730125427246, "global_step": 347348, "epoch": 4184} {"train_loss": -26.140302658081055, "global_step": 347349, "epoch": 4184} {"train_loss": -26.572769165039062, "global_step": 347350, "epoch": 4184} {"train_loss": -26.092802047729492, "global_step": 347351, "epoch": 4184} {"train_loss": -26.300800323486328, "global_step": 347352, "epoch": 4184} {"train_loss": -26.253681182861328, "global_step": 347353, "epoch": 4184} {"train_loss": -26.164407982883684, "global_step": 347354, "epoch": 4184, "val_loss": 6614684.5} {"train_loss": -25.234495162963867, "global_step": 347355, "epoch": 4185} {"train_loss": -25.22355079650879, "global_step": 347356, "epoch": 4185} {"train_loss": -24.809179306030273, "global_step": 347357, "epoch": 4185} {"train_loss": -24.69040298461914, "global_step": 347358, "epoch": 4185} {"train_loss": -25.560300827026367, "global_step": 347359, "epoch": 4185} {"train_loss": -25.60310173034668, "global_step": 347360, "epoch": 4185} {"train_loss": -25.132505416870117, "global_step": 347361, "epoch": 4185} {"train_loss": -24.977174758911133, "global_step": 347362, "epoch": 4185} {"train_loss": -26.111616134643555, "global_step": 347363, "epoch": 4185} {"train_loss": -25.165246963500977, "global_step": 347364, "epoch": 4185} {"train_loss": -25.547443389892578, "global_step": 347365, "epoch": 4185} {"train_loss": -25.37650489807129, "global_step": 347366, "epoch": 4185} {"train_loss": -25.7078914642334, "global_step": 347367, "epoch": 4185} {"train_loss": -25.70025634765625, "global_step": 347368, "epoch": 4185} {"train_loss": -25.9123592376709, "global_step": 347369, "epoch": 4185} {"train_loss": -25.60721778869629, "global_step": 347370, "epoch": 4185} {"train_loss": -25.701562881469727, "global_step": 347371, "epoch": 4185} {"train_loss": -25.785314559936523, "global_step": 347372, "epoch": 4185} {"train_loss": -25.75672721862793, "global_step": 347373, "epoch": 4185} {"train_loss": -26.096357345581055, "global_step": 347374, "epoch": 4185} {"train_loss": -25.95379066467285, "global_step": 347375, "epoch": 4185} {"train_loss": -26.160974502563477, "global_step": 347376, "epoch": 4185} {"train_loss": -25.838165283203125, "global_step": 347377, "epoch": 4185} {"train_loss": -25.66814613342285, "global_step": 347378, "epoch": 4185} {"train_loss": -26.096296310424805, "global_step": 347379, "epoch": 4185} {"train_loss": -25.940643310546875, "global_step": 347380, "epoch": 4185} {"train_loss": -26.231201171875, "global_step": 347381, "epoch": 4185} {"train_loss": -26.4373722076416, "global_step": 347382, "epoch": 4185} {"train_loss": -26.366689682006836, "global_step": 347383, "epoch": 4185} {"train_loss": -26.293537139892578, "global_step": 347384, "epoch": 4185} {"train_loss": -25.963037490844727, "global_step": 347385, "epoch": 4185} {"train_loss": -25.938602447509766, "global_step": 347386, "epoch": 4185} {"train_loss": -25.913854598999023, "global_step": 347387, "epoch": 4185} {"train_loss": -26.1357421875, "global_step": 347388, "epoch": 4185} {"train_loss": -26.04296875, "global_step": 347389, "epoch": 4185} {"train_loss": -26.42660903930664, "global_step": 347390, "epoch": 4185} {"train_loss": -26.227685928344727, "global_step": 347391, "epoch": 4185} {"train_loss": -26.21095085144043, "global_step": 347392, "epoch": 4185} {"train_loss": -26.58086585998535, "global_step": 347393, "epoch": 4185} {"train_loss": -26.49078369140625, "global_step": 347394, "epoch": 4185} {"train_loss": -26.15168571472168, "global_step": 347395, "epoch": 4185} {"train_loss": -26.35150146484375, "global_step": 347396, "epoch": 4185} {"train_loss": -26.21919059753418, "global_step": 347397, "epoch": 4185} {"train_loss": -26.431867599487305, "global_step": 347398, "epoch": 4185} {"train_loss": -26.7236385345459, "global_step": 347399, "epoch": 4185} {"train_loss": -26.218122482299805, "global_step": 347400, "epoch": 4185} {"train_loss": -26.44405174255371, "global_step": 347401, "epoch": 4185} {"train_loss": -26.245893478393555, "global_step": 347402, "epoch": 4185} {"train_loss": -25.91875648498535, "global_step": 347403, "epoch": 4185} {"train_loss": -26.317792892456055, "global_step": 347404, "epoch": 4185} {"train_loss": -26.1590633392334, "global_step": 347405, "epoch": 4185} {"train_loss": -26.432714462280273, "global_step": 347406, "epoch": 4185} {"train_loss": -25.909860610961914, "global_step": 347407, "epoch": 4185} {"train_loss": -25.766523361206055, "global_step": 347408, "epoch": 4185} {"train_loss": -25.22051429748535, "global_step": 347409, "epoch": 4185} {"train_loss": -24.950794219970703, "global_step": 347410, "epoch": 4185} {"train_loss": -25.519744873046875, "global_step": 347411, "epoch": 4185} {"train_loss": -25.65956687927246, "global_step": 347412, "epoch": 4185} {"train_loss": -26.048526763916016, "global_step": 347413, "epoch": 4185} {"train_loss": -25.8270263671875, "global_step": 347414, "epoch": 4185} {"train_loss": -26.1971435546875, "global_step": 347415, "epoch": 4185} {"train_loss": -26.220563888549805, "global_step": 347416, "epoch": 4185} {"train_loss": -26.106042861938477, "global_step": 347417, "epoch": 4185} {"train_loss": -25.844409942626953, "global_step": 347418, "epoch": 4185} {"train_loss": -26.160154342651367, "global_step": 347419, "epoch": 4185} {"train_loss": -26.04323387145996, "global_step": 347420, "epoch": 4185} {"train_loss": -26.18070411682129, "global_step": 347421, "epoch": 4185} {"train_loss": -26.13652992248535, "global_step": 347422, "epoch": 4185} {"train_loss": -26.250385284423828, "global_step": 347423, "epoch": 4185} {"train_loss": -26.180418014526367, "global_step": 347424, "epoch": 4185} {"train_loss": -25.926904678344727, "global_step": 347425, "epoch": 4185} {"train_loss": -26.243818283081055, "global_step": 347426, "epoch": 4185} {"train_loss": -25.757877349853516, "global_step": 347427, "epoch": 4185} {"train_loss": -25.6627140045166, "global_step": 347428, "epoch": 4185} {"train_loss": -25.92571449279785, "global_step": 347429, "epoch": 4185} {"train_loss": -25.693384170532227, "global_step": 347430, "epoch": 4185} {"train_loss": -26.0107421875, "global_step": 347431, "epoch": 4185} {"train_loss": -25.95867347717285, "global_step": 347432, "epoch": 4185} {"train_loss": -26.072834014892578, "global_step": 347433, "epoch": 4185} {"train_loss": -25.838653564453125, "global_step": 347434, "epoch": 4185} {"train_loss": -26.344385147094727, "global_step": 347435, "epoch": 4185} {"train_loss": -26.18050193786621, "global_step": 347436, "epoch": 4185} {"train_loss": -25.94372140355857, "global_step": 347437, "epoch": 4185, "val_loss": 6668166.5} {"train_loss": -25.84130859375, "global_step": 347438, "epoch": 4186} {"train_loss": -25.672956466674805, "global_step": 347439, "epoch": 4186} {"train_loss": -25.140703201293945, "global_step": 347440, "epoch": 4186} {"train_loss": -25.503721237182617, "global_step": 347441, "epoch": 4186} {"train_loss": -25.231054306030273, "global_step": 347442, "epoch": 4186} {"train_loss": -25.525617599487305, "global_step": 347443, "epoch": 4186} {"train_loss": -25.406768798828125, "global_step": 347444, "epoch": 4186} {"train_loss": -25.61118507385254, "global_step": 347445, "epoch": 4186} {"train_loss": -25.630273818969727, "global_step": 347446, "epoch": 4186} {"train_loss": -25.369417190551758, "global_step": 347447, "epoch": 4186} {"train_loss": -25.452287673950195, "global_step": 347448, "epoch": 4186} {"train_loss": -25.85383415222168, "global_step": 347449, "epoch": 4186} {"train_loss": -25.402219772338867, "global_step": 347450, "epoch": 4186} {"train_loss": -25.458322525024414, "global_step": 347451, "epoch": 4186} {"train_loss": -25.943267822265625, "global_step": 347452, "epoch": 4186} {"train_loss": -25.8431339263916, "global_step": 347453, "epoch": 4186} {"train_loss": -25.681232452392578, "global_step": 347454, "epoch": 4186} {"train_loss": -25.76898193359375, "global_step": 347455, "epoch": 4186} {"train_loss": -25.7529354095459, "global_step": 347456, "epoch": 4186} {"train_loss": -26.179452896118164, "global_step": 347457, "epoch": 4186} {"train_loss": -25.715106964111328, "global_step": 347458, "epoch": 4186} {"train_loss": -26.007654190063477, "global_step": 347459, "epoch": 4186} {"train_loss": -25.957090377807617, "global_step": 347460, "epoch": 4186} {"train_loss": -25.956472396850586, "global_step": 347461, "epoch": 4186} {"train_loss": -25.787616729736328, "global_step": 347462, "epoch": 4186} {"train_loss": -26.18635368347168, "global_step": 347463, "epoch": 4186} {"train_loss": -26.175703048706055, "global_step": 347464, "epoch": 4186} {"train_loss": -25.8601131439209, "global_step": 347465, "epoch": 4186} {"train_loss": -26.416015625, "global_step": 347466, "epoch": 4186} {"train_loss": -26.255355834960938, "global_step": 347467, "epoch": 4186} {"train_loss": -26.191614151000977, "global_step": 347468, "epoch": 4186} {"train_loss": -26.024463653564453, "global_step": 347469, "epoch": 4186} {"train_loss": -26.33450698852539, "global_step": 347470, "epoch": 4186} {"train_loss": -26.266260147094727, "global_step": 347471, "epoch": 4186} {"train_loss": -26.354406356811523, "global_step": 347472, "epoch": 4186} {"train_loss": -26.17291259765625, "global_step": 347473, "epoch": 4186} {"train_loss": -26.226318359375, "global_step": 347474, "epoch": 4186} {"train_loss": -26.33717155456543, "global_step": 347475, "epoch": 4186} {"train_loss": -26.51277732849121, "global_step": 347476, "epoch": 4186} {"train_loss": -25.847639083862305, "global_step": 347477, "epoch": 4186} {"train_loss": -26.296466827392578, "global_step": 347478, "epoch": 4186} {"train_loss": -26.183185577392578, "global_step": 347479, "epoch": 4186} {"train_loss": -26.262531280517578, "global_step": 347480, "epoch": 4186} {"train_loss": -26.28468894958496, "global_step": 347481, "epoch": 4186} {"train_loss": -26.22397232055664, "global_step": 347482, "epoch": 4186} {"train_loss": -25.905303955078125, "global_step": 347483, "epoch": 4186} {"train_loss": -26.245588302612305, "global_step": 347484, "epoch": 4186} {"train_loss": -26.1608943939209, "global_step": 347485, "epoch": 4186} {"train_loss": -26.325714111328125, "global_step": 347486, "epoch": 4186} {"train_loss": -25.964675903320312, "global_step": 347487, "epoch": 4186} {"train_loss": -25.94970703125, "global_step": 347488, "epoch": 4186} {"train_loss": -25.44643211364746, "global_step": 347489, "epoch": 4186} {"train_loss": -25.178939819335938, "global_step": 347490, "epoch": 4186} {"train_loss": -25.46795082092285, "global_step": 347491, "epoch": 4186} {"train_loss": -26.079303741455078, "global_step": 347492, "epoch": 4186} {"train_loss": -25.608673095703125, "global_step": 347493, "epoch": 4186} {"train_loss": -26.30256462097168, "global_step": 347494, "epoch": 4186} {"train_loss": -25.862024307250977, "global_step": 347495, "epoch": 4186} {"train_loss": -26.05360221862793, "global_step": 347496, "epoch": 4186} {"train_loss": -26.139236450195312, "global_step": 347497, "epoch": 4186} {"train_loss": -25.91920280456543, "global_step": 347498, "epoch": 4186} {"train_loss": -26.181812286376953, "global_step": 347499, "epoch": 4186} {"train_loss": -25.874740600585938, "global_step": 347500, "epoch": 4186} {"train_loss": -26.009418487548828, "global_step": 347501, "epoch": 4186} {"train_loss": -26.367584228515625, "global_step": 347502, "epoch": 4186} {"train_loss": -26.263946533203125, "global_step": 347503, "epoch": 4186} {"train_loss": -26.18514060974121, "global_step": 347504, "epoch": 4186} {"train_loss": -26.037525177001953, "global_step": 347505, "epoch": 4186} {"train_loss": -26.25343894958496, "global_step": 347506, "epoch": 4186} {"train_loss": -26.150604248046875, "global_step": 347507, "epoch": 4186} {"train_loss": -26.40936279296875, "global_step": 347508, "epoch": 4186} {"train_loss": -26.388608932495117, "global_step": 347509, "epoch": 4186} {"train_loss": -26.189077377319336, "global_step": 347510, "epoch": 4186} {"train_loss": -26.06696891784668, "global_step": 347511, "epoch": 4186} {"train_loss": -26.30055046081543, "global_step": 347512, "epoch": 4186} {"train_loss": -26.308979034423828, "global_step": 347513, "epoch": 4186} {"train_loss": -26.055252075195312, "global_step": 347514, "epoch": 4186} {"train_loss": -26.41944694519043, "global_step": 347515, "epoch": 4186} {"train_loss": -26.336828231811523, "global_step": 347516, "epoch": 4186} {"train_loss": -26.220563888549805, "global_step": 347517, "epoch": 4186} {"train_loss": -26.53736686706543, "global_step": 347518, "epoch": 4186} {"train_loss": -26.6430606842041, "global_step": 347519, "epoch": 4186} {"train_loss": -25.998742919370354, "global_step": 347520, "epoch": 4186, "val_loss": 6729116.0} {"train_loss": -25.694568634033203, "global_step": 347521, "epoch": 4187} {"train_loss": -26.11380958557129, "global_step": 347522, "epoch": 4187} {"train_loss": -26.003686904907227, "global_step": 347523, "epoch": 4187} {"train_loss": -25.784107208251953, "global_step": 347524, "epoch": 4187} {"train_loss": -26.167768478393555, "global_step": 347525, "epoch": 4187} {"train_loss": -25.655353546142578, "global_step": 347526, "epoch": 4187} {"train_loss": -25.852466583251953, "global_step": 347527, "epoch": 4187} {"train_loss": -25.669544219970703, "global_step": 347528, "epoch": 4187} {"train_loss": -25.89423942565918, "global_step": 347529, "epoch": 4187} {"train_loss": -25.915273666381836, "global_step": 347530, "epoch": 4187} {"train_loss": -25.627958297729492, "global_step": 347531, "epoch": 4187} {"train_loss": -25.63008689880371, "global_step": 347532, "epoch": 4187} {"train_loss": -25.7940616607666, "global_step": 347533, "epoch": 4187} {"train_loss": -26.29298210144043, "global_step": 347534, "epoch": 4187} {"train_loss": -26.131549835205078, "global_step": 347535, "epoch": 4187} {"train_loss": -26.20309829711914, "global_step": 347536, "epoch": 4187} {"train_loss": -25.952960968017578, "global_step": 347537, "epoch": 4187} {"train_loss": -25.826261520385742, "global_step": 347538, "epoch": 4187} {"train_loss": -25.840009689331055, "global_step": 347539, "epoch": 4187} {"train_loss": -26.098419189453125, "global_step": 347540, "epoch": 4187} {"train_loss": -26.001190185546875, "global_step": 347541, "epoch": 4187} {"train_loss": -26.157245635986328, "global_step": 347542, "epoch": 4187} {"train_loss": -26.123620986938477, "global_step": 347543, "epoch": 4187} {"train_loss": -26.202136993408203, "global_step": 347544, "epoch": 4187} {"train_loss": -26.257532119750977, "global_step": 347545, "epoch": 4187} {"train_loss": -26.429468154907227, "global_step": 347546, "epoch": 4187} {"train_loss": -26.244037628173828, "global_step": 347547, "epoch": 4187} {"train_loss": -26.1075496673584, "global_step": 347548, "epoch": 4187} {"train_loss": -25.91670036315918, "global_step": 347549, "epoch": 4187} {"train_loss": -26.328033447265625, "global_step": 347550, "epoch": 4187} {"train_loss": -26.32611656188965, "global_step": 347551, "epoch": 4187} {"train_loss": -26.243215560913086, "global_step": 347552, "epoch": 4187} {"train_loss": -26.106372833251953, "global_step": 347553, "epoch": 4187} {"train_loss": -26.499414443969727, "global_step": 347554, "epoch": 4187} {"train_loss": -26.171117782592773, "global_step": 347555, "epoch": 4187} {"train_loss": -26.468719482421875, "global_step": 347556, "epoch": 4187} {"train_loss": -26.442060470581055, "global_step": 347557, "epoch": 4187} {"train_loss": -25.984806060791016, "global_step": 347558, "epoch": 4187} {"train_loss": -25.951690673828125, "global_step": 347559, "epoch": 4187} {"train_loss": -26.2447452545166, "global_step": 347560, "epoch": 4187} {"train_loss": -26.282682418823242, "global_step": 347561, "epoch": 4187} {"train_loss": -26.211767196655273, "global_step": 347562, "epoch": 4187} {"train_loss": -25.98712730407715, "global_step": 347563, "epoch": 4187} {"train_loss": -26.558048248291016, "global_step": 347564, "epoch": 4187} {"train_loss": -26.035505294799805, "global_step": 347565, "epoch": 4187} {"train_loss": -26.132421493530273, "global_step": 347566, "epoch": 4187} {"train_loss": -26.027820587158203, "global_step": 347567, "epoch": 4187} {"train_loss": -26.259307861328125, "global_step": 347568, "epoch": 4187} {"train_loss": -26.357641220092773, "global_step": 347569, "epoch": 4187} {"train_loss": -26.234500885009766, "global_step": 347570, "epoch": 4187} {"train_loss": -26.65817642211914, "global_step": 347571, "epoch": 4187} {"train_loss": -26.65102195739746, "global_step": 347572, "epoch": 4187} {"train_loss": -26.511205673217773, "global_step": 347573, "epoch": 4187} {"train_loss": -26.14275550842285, "global_step": 347574, "epoch": 4187} {"train_loss": -26.344898223876953, "global_step": 347575, "epoch": 4187} {"train_loss": -26.369070053100586, "global_step": 347576, "epoch": 4187} {"train_loss": -26.304819107055664, "global_step": 347577, "epoch": 4187} {"train_loss": -26.3358211517334, "global_step": 347578, "epoch": 4187} {"train_loss": -26.639209747314453, "global_step": 347579, "epoch": 4187} {"train_loss": -26.554956436157227, "global_step": 347580, "epoch": 4187} {"train_loss": -26.3930606842041, "global_step": 347581, "epoch": 4187} {"train_loss": -26.057607650756836, "global_step": 347582, "epoch": 4187} {"train_loss": -25.733922958374023, "global_step": 347583, "epoch": 4187} {"train_loss": -25.664274215698242, "global_step": 347584, "epoch": 4187} {"train_loss": -26.2786808013916, "global_step": 347585, "epoch": 4187} {"train_loss": -25.858179092407227, "global_step": 347586, "epoch": 4187} {"train_loss": -25.83363151550293, "global_step": 347587, "epoch": 4187} {"train_loss": -25.99957847595215, "global_step": 347588, "epoch": 4187} {"train_loss": -25.836095809936523, "global_step": 347589, "epoch": 4187} {"train_loss": -25.9720458984375, "global_step": 347590, "epoch": 4187} {"train_loss": -25.903705596923828, "global_step": 347591, "epoch": 4187} {"train_loss": -26.365827560424805, "global_step": 347592, "epoch": 4187} {"train_loss": -26.112878799438477, "global_step": 347593, "epoch": 4187} {"train_loss": -26.059417724609375, "global_step": 347594, "epoch": 4187} {"train_loss": -26.309717178344727, "global_step": 347595, "epoch": 4187} {"train_loss": -26.2310848236084, "global_step": 347596, "epoch": 4187} {"train_loss": -25.871313095092773, "global_step": 347597, "epoch": 4187} {"train_loss": -25.91521644592285, "global_step": 347598, "epoch": 4187} {"train_loss": -25.744598388671875, "global_step": 347599, "epoch": 4187} {"train_loss": -25.978641510009766, "global_step": 347600, "epoch": 4187} {"train_loss": -26.083953857421875, "global_step": 347601, "epoch": 4187} {"train_loss": -26.551544189453125, "global_step": 347602, "epoch": 4187} {"train_loss": -26.11054843305105, "global_step": 347603, "epoch": 4187, "val_loss": 6651176.0} {"train_loss": -26.16913414001465, "global_step": 347604, "epoch": 4188} {"train_loss": -25.505674362182617, "global_step": 347605, "epoch": 4188} {"train_loss": -25.833642959594727, "global_step": 347606, "epoch": 4188} {"train_loss": -26.08478355407715, "global_step": 347607, "epoch": 4188} {"train_loss": -26.5655517578125, "global_step": 347608, "epoch": 4188} {"train_loss": -25.523195266723633, "global_step": 347609, "epoch": 4188} {"train_loss": -25.484527587890625, "global_step": 347610, "epoch": 4188} {"train_loss": -25.610742568969727, "global_step": 347611, "epoch": 4188} {"train_loss": -25.95232582092285, "global_step": 347612, "epoch": 4188} {"train_loss": -25.969013214111328, "global_step": 347613, "epoch": 4188} {"train_loss": -26.064146041870117, "global_step": 347614, "epoch": 4188} {"train_loss": -26.01886558532715, "global_step": 347615, "epoch": 4188} {"train_loss": -25.67656898498535, "global_step": 347616, "epoch": 4188} {"train_loss": -26.041013717651367, "global_step": 347617, "epoch": 4188} {"train_loss": -26.18708610534668, "global_step": 347618, "epoch": 4188} {"train_loss": -26.350650787353516, "global_step": 347619, "epoch": 4188} {"train_loss": -26.240528106689453, "global_step": 347620, "epoch": 4188} {"train_loss": -25.82843589782715, "global_step": 347621, "epoch": 4188} {"train_loss": -26.2396297454834, "global_step": 347622, "epoch": 4188} {"train_loss": -25.864730834960938, "global_step": 347623, "epoch": 4188} {"train_loss": -26.11866569519043, "global_step": 347624, "epoch": 4188} {"train_loss": -26.47186851501465, "global_step": 347625, "epoch": 4188} {"train_loss": -26.482389450073242, "global_step": 347626, "epoch": 4188} {"train_loss": -25.97161865234375, "global_step": 347627, "epoch": 4188} {"train_loss": -25.86372184753418, "global_step": 347628, "epoch": 4188} {"train_loss": -26.141498565673828, "global_step": 347629, "epoch": 4188} {"train_loss": -25.977148056030273, "global_step": 347630, "epoch": 4188} {"train_loss": -25.84283447265625, "global_step": 347631, "epoch": 4188} {"train_loss": -26.398136138916016, "global_step": 347632, "epoch": 4188} {"train_loss": -26.434741973876953, "global_step": 347633, "epoch": 4188} {"train_loss": -26.235610961914062, "global_step": 347634, "epoch": 4188} {"train_loss": -26.41120719909668, "global_step": 347635, "epoch": 4188} {"train_loss": -26.154193878173828, "global_step": 347636, "epoch": 4188} {"train_loss": -26.400426864624023, "global_step": 347637, "epoch": 4188} {"train_loss": -26.337696075439453, "global_step": 347638, "epoch": 4188} {"train_loss": -26.214380264282227, "global_step": 347639, "epoch": 4188} {"train_loss": -26.10112953186035, "global_step": 347640, "epoch": 4188} {"train_loss": -25.973159790039062, "global_step": 347641, "epoch": 4188} {"train_loss": -26.37447166442871, "global_step": 347642, "epoch": 4188} {"train_loss": -26.296615600585938, "global_step": 347643, "epoch": 4188} {"train_loss": -26.279743194580078, "global_step": 347644, "epoch": 4188} {"train_loss": -26.040760040283203, "global_step": 347645, "epoch": 4188} {"train_loss": -26.417394638061523, "global_step": 347646, "epoch": 4188} {"train_loss": -26.459436416625977, "global_step": 347647, "epoch": 4188} {"train_loss": -26.315998077392578, "global_step": 347648, "epoch": 4188} {"train_loss": -26.76955223083496, "global_step": 347649, "epoch": 4188} {"train_loss": -26.39251136779785, "global_step": 347650, "epoch": 4188} {"train_loss": -26.054433822631836, "global_step": 347651, "epoch": 4188} {"train_loss": -26.447484970092773, "global_step": 347652, "epoch": 4188} {"train_loss": -26.4729061126709, "global_step": 347653, "epoch": 4188} {"train_loss": -26.33990478515625, "global_step": 347654, "epoch": 4188} {"train_loss": -26.40387535095215, "global_step": 347655, "epoch": 4188} {"train_loss": -26.21584129333496, "global_step": 347656, "epoch": 4188} {"train_loss": -26.162668228149414, "global_step": 347657, "epoch": 4188} {"train_loss": -26.508956909179688, "global_step": 347658, "epoch": 4188} {"train_loss": -26.20148277282715, "global_step": 347659, "epoch": 4188} {"train_loss": -26.36665916442871, "global_step": 347660, "epoch": 4188} {"train_loss": -26.163129806518555, "global_step": 347661, "epoch": 4188} {"train_loss": -26.57257652282715, "global_step": 347662, "epoch": 4188} {"train_loss": -26.038883209228516, "global_step": 347663, "epoch": 4188} {"train_loss": -26.342077255249023, "global_step": 347664, "epoch": 4188} {"train_loss": -25.915725708007812, "global_step": 347665, "epoch": 4188} {"train_loss": -26.274381637573242, "global_step": 347666, "epoch": 4188} {"train_loss": -26.043058395385742, "global_step": 347667, "epoch": 4188} {"train_loss": -26.23833656311035, "global_step": 347668, "epoch": 4188} {"train_loss": -25.499664306640625, "global_step": 347669, "epoch": 4188} {"train_loss": -25.270408630371094, "global_step": 347670, "epoch": 4188} {"train_loss": -25.495376586914062, "global_step": 347671, "epoch": 4188} {"train_loss": -25.65778160095215, "global_step": 347672, "epoch": 4188} {"train_loss": -25.6923885345459, "global_step": 347673, "epoch": 4188} {"train_loss": -25.723352432250977, "global_step": 347674, "epoch": 4188} {"train_loss": -26.10676383972168, "global_step": 347675, "epoch": 4188} {"train_loss": -25.68549156188965, "global_step": 347676, "epoch": 4188} {"train_loss": -25.639957427978516, "global_step": 347677, "epoch": 4188} {"train_loss": -25.998432159423828, "global_step": 347678, "epoch": 4188} {"train_loss": -25.721424102783203, "global_step": 347679, "epoch": 4188} {"train_loss": -25.710996627807617, "global_step": 347680, "epoch": 4188} {"train_loss": -25.68044090270996, "global_step": 347681, "epoch": 4188} {"train_loss": -25.870880126953125, "global_step": 347682, "epoch": 4188} {"train_loss": -26.045324325561523, "global_step": 347683, "epoch": 4188} {"train_loss": -25.923513412475586, "global_step": 347684, "epoch": 4188} {"train_loss": -25.716577529907227, "global_step": 347685, "epoch": 4188} {"train_loss": -26.081845593739704, "global_step": 347686, "epoch": 4188, "val_loss": 6568934.0} {"train_loss": -26.0500545501709, "global_step": 347687, "epoch": 4189} {"train_loss": -25.447301864624023, "global_step": 347688, "epoch": 4189} {"train_loss": -25.6835880279541, "global_step": 347689, "epoch": 4189} {"train_loss": -25.74232292175293, "global_step": 347690, "epoch": 4189} {"train_loss": -25.779348373413086, "global_step": 347691, "epoch": 4189} {"train_loss": -25.90521240234375, "global_step": 347692, "epoch": 4189} {"train_loss": -25.671100616455078, "global_step": 347693, "epoch": 4189} {"train_loss": -25.9614315032959, "global_step": 347694, "epoch": 4189} {"train_loss": -25.85992431640625, "global_step": 347695, "epoch": 4189} {"train_loss": -25.71961784362793, "global_step": 347696, "epoch": 4189} {"train_loss": -26.288599014282227, "global_step": 347697, "epoch": 4189} {"train_loss": -26.008258819580078, "global_step": 347698, "epoch": 4189} {"train_loss": -26.058385848999023, "global_step": 347699, "epoch": 4189} {"train_loss": -25.72527503967285, "global_step": 347700, "epoch": 4189} {"train_loss": -26.007871627807617, "global_step": 347701, "epoch": 4189} {"train_loss": -26.222822189331055, "global_step": 347702, "epoch": 4189} {"train_loss": -26.465356826782227, "global_step": 347703, "epoch": 4189} {"train_loss": -26.07032585144043, "global_step": 347704, "epoch": 4189} {"train_loss": -25.629013061523438, "global_step": 347705, "epoch": 4189} {"train_loss": -25.850217819213867, "global_step": 347706, "epoch": 4189} {"train_loss": -26.233129501342773, "global_step": 347707, "epoch": 4189} {"train_loss": -25.873401641845703, "global_step": 347708, "epoch": 4189} {"train_loss": -25.864377975463867, "global_step": 347709, "epoch": 4189} {"train_loss": -26.515701293945312, "global_step": 347710, "epoch": 4189} {"train_loss": -26.176483154296875, "global_step": 347711, "epoch": 4189} {"train_loss": -26.463947296142578, "global_step": 347712, "epoch": 4189} {"train_loss": -26.077207565307617, "global_step": 347713, "epoch": 4189} {"train_loss": -26.282217025756836, "global_step": 347714, "epoch": 4189} {"train_loss": -26.12822914123535, "global_step": 347715, "epoch": 4189} {"train_loss": -26.319318771362305, "global_step": 347716, "epoch": 4189} {"train_loss": -25.94356346130371, "global_step": 347717, "epoch": 4189} {"train_loss": -25.6494083404541, "global_step": 347718, "epoch": 4189} {"train_loss": -26.1109619140625, "global_step": 347719, "epoch": 4189} {"train_loss": -26.137561798095703, "global_step": 347720, "epoch": 4189} {"train_loss": -25.8665714263916, "global_step": 347721, "epoch": 4189} {"train_loss": -26.038623809814453, "global_step": 347722, "epoch": 4189} {"train_loss": -26.3155517578125, "global_step": 347723, "epoch": 4189} {"train_loss": -25.600439071655273, "global_step": 347724, "epoch": 4189} {"train_loss": -25.75714683532715, "global_step": 347725, "epoch": 4189} {"train_loss": -26.012304306030273, "global_step": 347726, "epoch": 4189} {"train_loss": -26.226598739624023, "global_step": 347727, "epoch": 4189} {"train_loss": -25.6976261138916, "global_step": 347728, "epoch": 4189} {"train_loss": -26.010345458984375, "global_step": 347729, "epoch": 4189} {"train_loss": -26.299657821655273, "global_step": 347730, "epoch": 4189} {"train_loss": -26.203027725219727, "global_step": 347731, "epoch": 4189} {"train_loss": -26.1651611328125, "global_step": 347732, "epoch": 4189} {"train_loss": -26.228515625, "global_step": 347733, "epoch": 4189} {"train_loss": -26.1422061920166, "global_step": 347734, "epoch": 4189} {"train_loss": -26.121286392211914, "global_step": 347735, "epoch": 4189} {"train_loss": -26.4069766998291, "global_step": 347736, "epoch": 4189} {"train_loss": -26.117279052734375, "global_step": 347737, "epoch": 4189} {"train_loss": -26.40790367126465, "global_step": 347738, "epoch": 4189} {"train_loss": -26.057453155517578, "global_step": 347739, "epoch": 4189} {"train_loss": -26.405181884765625, "global_step": 347740, "epoch": 4189} {"train_loss": -26.461206436157227, "global_step": 347741, "epoch": 4189} {"train_loss": -26.4965877532959, "global_step": 347742, "epoch": 4189} {"train_loss": -26.17850112915039, "global_step": 347743, "epoch": 4189} {"train_loss": -26.337186813354492, "global_step": 347744, "epoch": 4189} {"train_loss": -26.072309494018555, "global_step": 347745, "epoch": 4189} {"train_loss": -26.46149253845215, "global_step": 347746, "epoch": 4189} {"train_loss": -26.306171417236328, "global_step": 347747, "epoch": 4189} {"train_loss": -26.17237663269043, "global_step": 347748, "epoch": 4189} {"train_loss": -26.640155792236328, "global_step": 347749, "epoch": 4189} {"train_loss": -26.325132369995117, "global_step": 347750, "epoch": 4189} {"train_loss": -26.28376579284668, "global_step": 347751, "epoch": 4189} {"train_loss": -26.132848739624023, "global_step": 347752, "epoch": 4189} {"train_loss": -26.40272331237793, "global_step": 347753, "epoch": 4189} {"train_loss": -26.419057846069336, "global_step": 347754, "epoch": 4189} {"train_loss": -26.564916610717773, "global_step": 347755, "epoch": 4189} {"train_loss": -26.059106826782227, "global_step": 347756, "epoch": 4189} {"train_loss": -26.12879753112793, "global_step": 347757, "epoch": 4189} {"train_loss": -26.085956573486328, "global_step": 347758, "epoch": 4189} {"train_loss": -26.748321533203125, "global_step": 347759, "epoch": 4189} {"train_loss": -26.241968154907227, "global_step": 347760, "epoch": 4189} {"train_loss": -26.43287467956543, "global_step": 347761, "epoch": 4189} {"train_loss": -26.026901245117188, "global_step": 347762, "epoch": 4189} {"train_loss": -25.875, "global_step": 347763, "epoch": 4189} {"train_loss": -25.299358367919922, "global_step": 347764, "epoch": 4189} {"train_loss": -24.972034454345703, "global_step": 347765, "epoch": 4189} {"train_loss": -25.660497665405273, "global_step": 347766, "epoch": 4189} {"train_loss": -26.0286865234375, "global_step": 347767, "epoch": 4189} {"train_loss": -26.106122970581055, "global_step": 347768, "epoch": 4189} {"train_loss": -26.094311610761896, "global_step": 347769, "epoch": 4189, "val_loss": 6673597.0} {"train_loss": -25.674118041992188, "global_step": 347770, "epoch": 4190} {"train_loss": -25.87875747680664, "global_step": 347771, "epoch": 4190} {"train_loss": -25.334150314331055, "global_step": 347772, "epoch": 4190} {"train_loss": -25.786060333251953, "global_step": 347773, "epoch": 4190} {"train_loss": -25.476072311401367, "global_step": 347774, "epoch": 4190} {"train_loss": -25.864212036132812, "global_step": 347775, "epoch": 4190} {"train_loss": -25.464557647705078, "global_step": 347776, "epoch": 4190} {"train_loss": -25.914569854736328, "global_step": 347777, "epoch": 4190} {"train_loss": -25.391162872314453, "global_step": 347778, "epoch": 4190} {"train_loss": -25.773481369018555, "global_step": 347779, "epoch": 4190} {"train_loss": -25.98972511291504, "global_step": 347780, "epoch": 4190} {"train_loss": -25.769712448120117, "global_step": 347781, "epoch": 4190} {"train_loss": -25.7307071685791, "global_step": 347782, "epoch": 4190} {"train_loss": -25.616872787475586, "global_step": 347783, "epoch": 4190} {"train_loss": -26.1800479888916, "global_step": 347784, "epoch": 4190} {"train_loss": -25.64423942565918, "global_step": 347785, "epoch": 4190} {"train_loss": -26.097400665283203, "global_step": 347786, "epoch": 4190} {"train_loss": -26.1773738861084, "global_step": 347787, "epoch": 4190} {"train_loss": -25.91425132751465, "global_step": 347788, "epoch": 4190} {"train_loss": -26.216711044311523, "global_step": 347789, "epoch": 4190} {"train_loss": -25.84348487854004, "global_step": 347790, "epoch": 4190} {"train_loss": -25.969512939453125, "global_step": 347791, "epoch": 4190} {"train_loss": -25.729215621948242, "global_step": 347792, "epoch": 4190} {"train_loss": -25.802946090698242, "global_step": 347793, "epoch": 4190} {"train_loss": -25.831878662109375, "global_step": 347794, "epoch": 4190} {"train_loss": -25.59748649597168, "global_step": 347795, "epoch": 4190} {"train_loss": -26.1325740814209, "global_step": 347796, "epoch": 4190} {"train_loss": -25.983612060546875, "global_step": 347797, "epoch": 4190} {"train_loss": -25.786890029907227, "global_step": 347798, "epoch": 4190} {"train_loss": -26.4674015045166, "global_step": 347799, "epoch": 4190} {"train_loss": -25.824338912963867, "global_step": 347800, "epoch": 4190} {"train_loss": -26.366697311401367, "global_step": 347801, "epoch": 4190} {"train_loss": -26.239831924438477, "global_step": 347802, "epoch": 4190} {"train_loss": -26.199628829956055, "global_step": 347803, "epoch": 4190} {"train_loss": -25.949243545532227, "global_step": 347804, "epoch": 4190} {"train_loss": -26.155975341796875, "global_step": 347805, "epoch": 4190} {"train_loss": -26.12799072265625, "global_step": 347806, "epoch": 4190} {"train_loss": -26.180448532104492, "global_step": 347807, "epoch": 4190} {"train_loss": -26.5849609375, "global_step": 347808, "epoch": 4190} {"train_loss": -26.13434410095215, "global_step": 347809, "epoch": 4190} {"train_loss": -26.378620147705078, "global_step": 347810, "epoch": 4190} {"train_loss": -26.0936279296875, "global_step": 347811, "epoch": 4190} {"train_loss": -26.124439239501953, "global_step": 347812, "epoch": 4190} {"train_loss": -26.048786163330078, "global_step": 347813, "epoch": 4190} {"train_loss": -26.203393936157227, "global_step": 347814, "epoch": 4190} {"train_loss": -26.256378173828125, "global_step": 347815, "epoch": 4190} {"train_loss": -26.631452560424805, "global_step": 347816, "epoch": 4190} {"train_loss": -26.265233993530273, "global_step": 347817, "epoch": 4190} {"train_loss": -26.30560874938965, "global_step": 347818, "epoch": 4190} {"train_loss": -26.454015731811523, "global_step": 347819, "epoch": 4190} {"train_loss": -26.55240249633789, "global_step": 347820, "epoch": 4190} {"train_loss": -26.299123764038086, "global_step": 347821, "epoch": 4190} {"train_loss": -26.582624435424805, "global_step": 347822, "epoch": 4190} {"train_loss": -26.265893936157227, "global_step": 347823, "epoch": 4190} {"train_loss": -26.346607208251953, "global_step": 347824, "epoch": 4190} {"train_loss": -26.515954971313477, "global_step": 347825, "epoch": 4190} {"train_loss": -26.472753524780273, "global_step": 347826, "epoch": 4190} {"train_loss": -26.48565101623535, "global_step": 347827, "epoch": 4190} {"train_loss": -26.163471221923828, "global_step": 347828, "epoch": 4190} {"train_loss": -26.518253326416016, "global_step": 347829, "epoch": 4190} {"train_loss": -26.04932975769043, "global_step": 347830, "epoch": 4190} {"train_loss": -26.09535026550293, "global_step": 347831, "epoch": 4190} {"train_loss": -26.18295669555664, "global_step": 347832, "epoch": 4190} {"train_loss": -26.40818214416504, "global_step": 347833, "epoch": 4190} {"train_loss": -26.04292106628418, "global_step": 347834, "epoch": 4190} {"train_loss": -25.92685890197754, "global_step": 347835, "epoch": 4190} {"train_loss": -26.336694717407227, "global_step": 347836, "epoch": 4190} {"train_loss": -26.228742599487305, "global_step": 347837, "epoch": 4190} {"train_loss": -26.088031768798828, "global_step": 347838, "epoch": 4190} {"train_loss": -26.284149169921875, "global_step": 347839, "epoch": 4190} {"train_loss": -26.017414093017578, "global_step": 347840, "epoch": 4190} {"train_loss": -25.79352378845215, "global_step": 347841, "epoch": 4190} {"train_loss": -25.743627548217773, "global_step": 347842, "epoch": 4190} {"train_loss": -25.660968780517578, "global_step": 347843, "epoch": 4190} {"train_loss": -25.880353927612305, "global_step": 347844, "epoch": 4190} {"train_loss": -26.018896102905273, "global_step": 347845, "epoch": 4190} {"train_loss": -25.859912872314453, "global_step": 347846, "epoch": 4190} {"train_loss": -25.763019561767578, "global_step": 347847, "epoch": 4190} {"train_loss": -25.80817222595215, "global_step": 347848, "epoch": 4190} {"train_loss": -25.95670509338379, "global_step": 347849, "epoch": 4190} {"train_loss": -25.61838722229004, "global_step": 347850, "epoch": 4190} {"train_loss": -25.776037216186523, "global_step": 347851, "epoch": 4190} {"train_loss": -26.027992363435676, "global_step": 347852, "epoch": 4190, "val_loss": 6644660.0} {"train_loss": -24.356388092041016, "global_step": 347853, "epoch": 4191} {"train_loss": -25.600845336914062, "global_step": 347854, "epoch": 4191} {"train_loss": -24.640806198120117, "global_step": 347855, "epoch": 4191} {"train_loss": -24.894330978393555, "global_step": 347856, "epoch": 4191} {"train_loss": -25.006454467773438, "global_step": 347857, "epoch": 4191} {"train_loss": -25.622806549072266, "global_step": 347858, "epoch": 4191} {"train_loss": -25.29786491394043, "global_step": 347859, "epoch": 4191} {"train_loss": -25.6392765045166, "global_step": 347860, "epoch": 4191} {"train_loss": -25.329692840576172, "global_step": 347861, "epoch": 4191} {"train_loss": -25.43112564086914, "global_step": 347862, "epoch": 4191} {"train_loss": -25.47047996520996, "global_step": 347863, "epoch": 4191} {"train_loss": -26.111799240112305, "global_step": 347864, "epoch": 4191} {"train_loss": -25.584659576416016, "global_step": 347865, "epoch": 4191} {"train_loss": -25.690420150756836, "global_step": 347866, "epoch": 4191} {"train_loss": -25.81776237487793, "global_step": 347867, "epoch": 4191} {"train_loss": -25.990280151367188, "global_step": 347868, "epoch": 4191} {"train_loss": -25.864118576049805, "global_step": 347869, "epoch": 4191} {"train_loss": -25.992597579956055, "global_step": 347870, "epoch": 4191} {"train_loss": -25.910490036010742, "global_step": 347871, "epoch": 4191} {"train_loss": -25.532556533813477, "global_step": 347872, "epoch": 4191} {"train_loss": -25.99640464782715, "global_step": 347873, "epoch": 4191} {"train_loss": -25.68501091003418, "global_step": 347874, "epoch": 4191} {"train_loss": -26.215198516845703, "global_step": 347875, "epoch": 4191} {"train_loss": -25.77851676940918, "global_step": 347876, "epoch": 4191} {"train_loss": -26.036664962768555, "global_step": 347877, "epoch": 4191} {"train_loss": -25.796630859375, "global_step": 347878, "epoch": 4191} {"train_loss": -26.070993423461914, "global_step": 347879, "epoch": 4191} {"train_loss": -26.292028427124023, "global_step": 347880, "epoch": 4191} {"train_loss": -25.65299415588379, "global_step": 347881, "epoch": 4191} {"train_loss": -25.86249351501465, "global_step": 347882, "epoch": 4191} {"train_loss": -25.733322143554688, "global_step": 347883, "epoch": 4191} {"train_loss": -25.808486938476562, "global_step": 347884, "epoch": 4191} {"train_loss": -25.848005294799805, "global_step": 347885, "epoch": 4191} {"train_loss": -25.745655059814453, "global_step": 347886, "epoch": 4191} {"train_loss": -26.089405059814453, "global_step": 347887, "epoch": 4191} {"train_loss": -26.14240074157715, "global_step": 347888, "epoch": 4191} {"train_loss": -26.004150390625, "global_step": 347889, "epoch": 4191} {"train_loss": -25.710981369018555, "global_step": 347890, "epoch": 4191} {"train_loss": -26.374195098876953, "global_step": 347891, "epoch": 4191} {"train_loss": -26.14432144165039, "global_step": 347892, "epoch": 4191} {"train_loss": -26.326770782470703, "global_step": 347893, "epoch": 4191} {"train_loss": -26.147689819335938, "global_step": 347894, "epoch": 4191} {"train_loss": -26.586963653564453, "global_step": 347895, "epoch": 4191} {"train_loss": -25.74286460876465, "global_step": 347896, "epoch": 4191} {"train_loss": -26.03272819519043, "global_step": 347897, "epoch": 4191} {"train_loss": -26.232044219970703, "global_step": 347898, "epoch": 4191} {"train_loss": -26.425622940063477, "global_step": 347899, "epoch": 4191} {"train_loss": -26.220050811767578, "global_step": 347900, "epoch": 4191} {"train_loss": -26.483402252197266, "global_step": 347901, "epoch": 4191} {"train_loss": -26.250259399414062, "global_step": 347902, "epoch": 4191} {"train_loss": -26.02033805847168, "global_step": 347903, "epoch": 4191} {"train_loss": -25.95685386657715, "global_step": 347904, "epoch": 4191} {"train_loss": -26.408069610595703, "global_step": 347905, "epoch": 4191} {"train_loss": -26.185094833374023, "global_step": 347906, "epoch": 4191} {"train_loss": -25.9249324798584, "global_step": 347907, "epoch": 4191} {"train_loss": -25.982776641845703, "global_step": 347908, "epoch": 4191} {"train_loss": -26.221134185791016, "global_step": 347909, "epoch": 4191} {"train_loss": -26.131031036376953, "global_step": 347910, "epoch": 4191} {"train_loss": -25.728219985961914, "global_step": 347911, "epoch": 4191} {"train_loss": -25.529251098632812, "global_step": 347912, "epoch": 4191} {"train_loss": -25.67774772644043, "global_step": 347913, "epoch": 4191} {"train_loss": -25.466283798217773, "global_step": 347914, "epoch": 4191} {"train_loss": -26.0113582611084, "global_step": 347915, "epoch": 4191} {"train_loss": -26.163116455078125, "global_step": 347916, "epoch": 4191} {"train_loss": -25.72513771057129, "global_step": 347917, "epoch": 4191} {"train_loss": -26.018781661987305, "global_step": 347918, "epoch": 4191} {"train_loss": -26.155303955078125, "global_step": 347919, "epoch": 4191} {"train_loss": -26.09767723083496, "global_step": 347920, "epoch": 4191} {"train_loss": -26.133939743041992, "global_step": 347921, "epoch": 4191} {"train_loss": -25.890979766845703, "global_step": 347922, "epoch": 4191} {"train_loss": -26.364404678344727, "global_step": 347923, "epoch": 4191} {"train_loss": -25.902917861938477, "global_step": 347924, "epoch": 4191} {"train_loss": -26.229543685913086, "global_step": 347925, "epoch": 4191} {"train_loss": -25.917821884155273, "global_step": 347926, "epoch": 4191} {"train_loss": -26.24018669128418, "global_step": 347927, "epoch": 4191} {"train_loss": -26.42474365234375, "global_step": 347928, "epoch": 4191} {"train_loss": -26.09769058227539, "global_step": 347929, "epoch": 4191} {"train_loss": -26.44683265686035, "global_step": 347930, "epoch": 4191} {"train_loss": -26.645288467407227, "global_step": 347931, "epoch": 4191} {"train_loss": -25.926528930664062, "global_step": 347932, "epoch": 4191} {"train_loss": -26.436243057250977, "global_step": 347933, "epoch": 4191} {"train_loss": -26.392431259155273, "global_step": 347934, "epoch": 4191} {"train_loss": -25.908727209252046, "global_step": 347935, "epoch": 4191, "val_loss": 6705727.0} {"train_loss": -25.861358642578125, "global_step": 347936, "epoch": 4192} {"train_loss": -25.643798828125, "global_step": 347937, "epoch": 4192} {"train_loss": -25.661340713500977, "global_step": 347938, "epoch": 4192} {"train_loss": -25.8576717376709, "global_step": 347939, "epoch": 4192} {"train_loss": -25.496875762939453, "global_step": 347940, "epoch": 4192} {"train_loss": -25.753210067749023, "global_step": 347941, "epoch": 4192} {"train_loss": -25.91935157775879, "global_step": 347942, "epoch": 4192} {"train_loss": -26.0467472076416, "global_step": 347943, "epoch": 4192} {"train_loss": -25.43239974975586, "global_step": 347944, "epoch": 4192} {"train_loss": -25.922698974609375, "global_step": 347945, "epoch": 4192} {"train_loss": -26.089017868041992, "global_step": 347946, "epoch": 4192} {"train_loss": -25.923919677734375, "global_step": 347947, "epoch": 4192} {"train_loss": -25.928129196166992, "global_step": 347948, "epoch": 4192} {"train_loss": -25.855207443237305, "global_step": 347949, "epoch": 4192} {"train_loss": -25.9204044342041, "global_step": 347950, "epoch": 4192} {"train_loss": -26.200641632080078, "global_step": 347951, "epoch": 4192} {"train_loss": -25.938302993774414, "global_step": 347952, "epoch": 4192} {"train_loss": -25.976266860961914, "global_step": 347953, "epoch": 4192} {"train_loss": -26.077783584594727, "global_step": 347954, "epoch": 4192} {"train_loss": -25.803918838500977, "global_step": 347955, "epoch": 4192} {"train_loss": -25.96351432800293, "global_step": 347956, "epoch": 4192} {"train_loss": -25.944944381713867, "global_step": 347957, "epoch": 4192} {"train_loss": -26.122547149658203, "global_step": 347958, "epoch": 4192} {"train_loss": -26.1621036529541, "global_step": 347959, "epoch": 4192} {"train_loss": -25.903085708618164, "global_step": 347960, "epoch": 4192} {"train_loss": -25.910400390625, "global_step": 347961, "epoch": 4192} {"train_loss": -26.2052001953125, "global_step": 347962, "epoch": 4192} {"train_loss": -26.103607177734375, "global_step": 347963, "epoch": 4192} {"train_loss": -26.280149459838867, "global_step": 347964, "epoch": 4192} {"train_loss": -26.296716690063477, "global_step": 347965, "epoch": 4192} {"train_loss": -26.144062042236328, "global_step": 347966, "epoch": 4192} {"train_loss": -26.4130802154541, "global_step": 347967, "epoch": 4192} {"train_loss": -26.298643112182617, "global_step": 347968, "epoch": 4192} {"train_loss": -25.836286544799805, "global_step": 347969, "epoch": 4192} {"train_loss": -25.964221954345703, "global_step": 347970, "epoch": 4192} {"train_loss": -26.252866744995117, "global_step": 347971, "epoch": 4192} {"train_loss": -26.025226593017578, "global_step": 347972, "epoch": 4192} {"train_loss": -26.12100601196289, "global_step": 347973, "epoch": 4192} {"train_loss": -26.476654052734375, "global_step": 347974, "epoch": 4192} {"train_loss": -26.241785049438477, "global_step": 347975, "epoch": 4192} {"train_loss": -26.224933624267578, "global_step": 347976, "epoch": 4192} {"train_loss": -26.1638126373291, "global_step": 347977, "epoch": 4192} {"train_loss": -26.32179832458496, "global_step": 347978, "epoch": 4192} {"train_loss": -26.415063858032227, "global_step": 347979, "epoch": 4192} {"train_loss": -26.163000106811523, "global_step": 347980, "epoch": 4192} {"train_loss": -26.1298828125, "global_step": 347981, "epoch": 4192} {"train_loss": -25.988065719604492, "global_step": 347982, "epoch": 4192} {"train_loss": -26.2742919921875, "global_step": 347983, "epoch": 4192} {"train_loss": -26.0571346282959, "global_step": 347984, "epoch": 4192} {"train_loss": -26.4111270904541, "global_step": 347985, "epoch": 4192} {"train_loss": -26.162628173828125, "global_step": 347986, "epoch": 4192} {"train_loss": -26.44850730895996, "global_step": 347987, "epoch": 4192} {"train_loss": -26.6114444732666, "global_step": 347988, "epoch": 4192} {"train_loss": -25.944717407226562, "global_step": 347989, "epoch": 4192} {"train_loss": -26.203481674194336, "global_step": 347990, "epoch": 4192} {"train_loss": -26.460901260375977, "global_step": 347991, "epoch": 4192} {"train_loss": -26.227127075195312, "global_step": 347992, "epoch": 4192} {"train_loss": -26.083906173706055, "global_step": 347993, "epoch": 4192} {"train_loss": -26.24799919128418, "global_step": 347994, "epoch": 4192} {"train_loss": -26.217151641845703, "global_step": 347995, "epoch": 4192} {"train_loss": -26.330881118774414, "global_step": 347996, "epoch": 4192} {"train_loss": -25.782575607299805, "global_step": 347997, "epoch": 4192} {"train_loss": -25.912891387939453, "global_step": 347998, "epoch": 4192} {"train_loss": -26.035985946655273, "global_step": 347999, "epoch": 4192} {"train_loss": -26.019834518432617, "global_step": 348000, "epoch": 4192} {"train_loss": -26.29762077331543, "global_step": 348001, "epoch": 4192} {"train_loss": -25.42580795288086, "global_step": 348002, "epoch": 4192} {"train_loss": -25.734989166259766, "global_step": 348003, "epoch": 4192} {"train_loss": -25.882720947265625, "global_step": 348004, "epoch": 4192} {"train_loss": -26.036588668823242, "global_step": 348005, "epoch": 4192} {"train_loss": -25.577360153198242, "global_step": 348006, "epoch": 4192} {"train_loss": -25.967496871948242, "global_step": 348007, "epoch": 4192} {"train_loss": -26.069360733032227, "global_step": 348008, "epoch": 4192} {"train_loss": -25.847646713256836, "global_step": 348009, "epoch": 4192} {"train_loss": -25.787769317626953, "global_step": 348010, "epoch": 4192} {"train_loss": -25.955093383789062, "global_step": 348011, "epoch": 4192} {"train_loss": -25.93705177307129, "global_step": 348012, "epoch": 4192} {"train_loss": -26.024938583374023, "global_step": 348013, "epoch": 4192} {"train_loss": -26.25713539123535, "global_step": 348014, "epoch": 4192} {"train_loss": -26.00857925415039, "global_step": 348015, "epoch": 4192} {"train_loss": -26.10527992248535, "global_step": 348016, "epoch": 4192} {"train_loss": -25.68880271911621, "global_step": 348017, "epoch": 4192} {"train_loss": -26.05702522002071, "global_step": 348018, "epoch": 4192, "val_loss": 6688830.0} {"train_loss": -24.84061050415039, "global_step": 348019, "epoch": 4193} {"train_loss": -25.837482452392578, "global_step": 348020, "epoch": 4193} {"train_loss": -25.03386878967285, "global_step": 348021, "epoch": 4193} {"train_loss": -25.366931915283203, "global_step": 348022, "epoch": 4193} {"train_loss": -25.538150787353516, "global_step": 348023, "epoch": 4193} {"train_loss": -25.898122787475586, "global_step": 348024, "epoch": 4193} {"train_loss": -25.62314796447754, "global_step": 348025, "epoch": 4193} {"train_loss": -25.90549087524414, "global_step": 348026, "epoch": 4193} {"train_loss": -25.390701293945312, "global_step": 348027, "epoch": 4193} {"train_loss": -25.84698486328125, "global_step": 348028, "epoch": 4193} {"train_loss": -25.332857131958008, "global_step": 348029, "epoch": 4193} {"train_loss": -25.680225372314453, "global_step": 348030, "epoch": 4193} {"train_loss": -25.935047149658203, "global_step": 348031, "epoch": 4193} {"train_loss": -25.800565719604492, "global_step": 348032, "epoch": 4193} {"train_loss": -25.68878746032715, "global_step": 348033, "epoch": 4193} {"train_loss": -26.20627784729004, "global_step": 348034, "epoch": 4193} {"train_loss": -26.1658935546875, "global_step": 348035, "epoch": 4193} {"train_loss": -26.0592098236084, "global_step": 348036, "epoch": 4193} {"train_loss": -26.023517608642578, "global_step": 348037, "epoch": 4193} {"train_loss": -25.883544921875, "global_step": 348038, "epoch": 4193} {"train_loss": -25.793249130249023, "global_step": 348039, "epoch": 4193} {"train_loss": -25.94710350036621, "global_step": 348040, "epoch": 4193} {"train_loss": -26.016942977905273, "global_step": 348041, "epoch": 4193} {"train_loss": -26.13677978515625, "global_step": 348042, "epoch": 4193} {"train_loss": -26.054880142211914, "global_step": 348043, "epoch": 4193} {"train_loss": -26.310596466064453, "global_step": 348044, "epoch": 4193} {"train_loss": -26.148630142211914, "global_step": 348045, "epoch": 4193} {"train_loss": -26.03891944885254, "global_step": 348046, "epoch": 4193} {"train_loss": -26.13811683654785, "global_step": 348047, "epoch": 4193} {"train_loss": -26.299116134643555, "global_step": 348048, "epoch": 4193} {"train_loss": -26.008813858032227, "global_step": 348049, "epoch": 4193} {"train_loss": -26.01193618774414, "global_step": 348050, "epoch": 4193} {"train_loss": -25.936460494995117, "global_step": 348051, "epoch": 4193} {"train_loss": -25.986282348632812, "global_step": 348052, "epoch": 4193} {"train_loss": -26.25309181213379, "global_step": 348053, "epoch": 4193} {"train_loss": -26.112720489501953, "global_step": 348054, "epoch": 4193} {"train_loss": -26.694570541381836, "global_step": 348055, "epoch": 4193} {"train_loss": -26.09968376159668, "global_step": 348056, "epoch": 4193} {"train_loss": -26.203954696655273, "global_step": 348057, "epoch": 4193} {"train_loss": -26.82244300842285, "global_step": 348058, "epoch": 4193} {"train_loss": -26.146778106689453, "global_step": 348059, "epoch": 4193} {"train_loss": -26.05802345275879, "global_step": 348060, "epoch": 4193} {"train_loss": -25.6837100982666, "global_step": 348061, "epoch": 4193} {"train_loss": -26.15447998046875, "global_step": 348062, "epoch": 4193} {"train_loss": -25.601404190063477, "global_step": 348063, "epoch": 4193} {"train_loss": -25.609960556030273, "global_step": 348064, "epoch": 4193} {"train_loss": -25.259033203125, "global_step": 348065, "epoch": 4193} {"train_loss": -25.344465255737305, "global_step": 348066, "epoch": 4193} {"train_loss": -26.05573081970215, "global_step": 348067, "epoch": 4193} {"train_loss": -26.328168869018555, "global_step": 348068, "epoch": 4193} {"train_loss": -25.51711082458496, "global_step": 348069, "epoch": 4193} {"train_loss": -25.802358627319336, "global_step": 348070, "epoch": 4193} {"train_loss": -25.85801124572754, "global_step": 348071, "epoch": 4193} {"train_loss": -25.857791900634766, "global_step": 348072, "epoch": 4193} {"train_loss": -25.91335105895996, "global_step": 348073, "epoch": 4193} {"train_loss": -26.226581573486328, "global_step": 348074, "epoch": 4193} {"train_loss": -25.657012939453125, "global_step": 348075, "epoch": 4193} {"train_loss": -25.898590087890625, "global_step": 348076, "epoch": 4193} {"train_loss": -25.752063751220703, "global_step": 348077, "epoch": 4193} {"train_loss": -25.635107040405273, "global_step": 348078, "epoch": 4193} {"train_loss": -26.116430282592773, "global_step": 348079, "epoch": 4193} {"train_loss": -25.892683029174805, "global_step": 348080, "epoch": 4193} {"train_loss": -26.032445907592773, "global_step": 348081, "epoch": 4193} {"train_loss": -25.877460479736328, "global_step": 348082, "epoch": 4193} {"train_loss": -25.834808349609375, "global_step": 348083, "epoch": 4193} {"train_loss": -26.06686782836914, "global_step": 348084, "epoch": 4193} {"train_loss": -26.08875846862793, "global_step": 348085, "epoch": 4193} {"train_loss": -25.908044815063477, "global_step": 348086, "epoch": 4193} {"train_loss": -26.32073402404785, "global_step": 348087, "epoch": 4193} {"train_loss": -25.943145751953125, "global_step": 348088, "epoch": 4193} {"train_loss": -25.921436309814453, "global_step": 348089, "epoch": 4193} {"train_loss": -25.79694938659668, "global_step": 348090, "epoch": 4193} {"train_loss": -26.331928253173828, "global_step": 348091, "epoch": 4193} {"train_loss": -26.231367111206055, "global_step": 348092, "epoch": 4193} {"train_loss": -26.185062408447266, "global_step": 348093, "epoch": 4193} {"train_loss": -26.354801177978516, "global_step": 348094, "epoch": 4193} {"train_loss": -26.126239776611328, "global_step": 348095, "epoch": 4193} {"train_loss": -26.01800537109375, "global_step": 348096, "epoch": 4193} {"train_loss": -26.08674430847168, "global_step": 348097, "epoch": 4193} {"train_loss": -25.922040939331055, "global_step": 348098, "epoch": 4193} {"train_loss": -26.6192626953125, "global_step": 348099, "epoch": 4193} {"train_loss": -26.228656768798828, "global_step": 348100, "epoch": 4193} {"train_loss": -25.939941727971455, "global_step": 348101, "epoch": 4193, "val_loss": 6684226.0} {"train_loss": -25.96346092224121, "global_step": 348102, "epoch": 4194} {"train_loss": -25.84905433654785, "global_step": 348103, "epoch": 4194} {"train_loss": -26.02076530456543, "global_step": 348104, "epoch": 4194} {"train_loss": -25.47822380065918, "global_step": 348105, "epoch": 4194} {"train_loss": -26.101743698120117, "global_step": 348106, "epoch": 4194} {"train_loss": -25.513269424438477, "global_step": 348107, "epoch": 4194} {"train_loss": -26.04840660095215, "global_step": 348108, "epoch": 4194} {"train_loss": -26.090173721313477, "global_step": 348109, "epoch": 4194} {"train_loss": -26.029687881469727, "global_step": 348110, "epoch": 4194} {"train_loss": -25.755359649658203, "global_step": 348111, "epoch": 4194} {"train_loss": -25.932546615600586, "global_step": 348112, "epoch": 4194} {"train_loss": -25.9715576171875, "global_step": 348113, "epoch": 4194} {"train_loss": -26.0339298248291, "global_step": 348114, "epoch": 4194} {"train_loss": -25.759979248046875, "global_step": 348115, "epoch": 4194} {"train_loss": -26.285085678100586, "global_step": 348116, "epoch": 4194} {"train_loss": -26.1004638671875, "global_step": 348117, "epoch": 4194} {"train_loss": -26.1611385345459, "global_step": 348118, "epoch": 4194} {"train_loss": -25.99190330505371, "global_step": 348119, "epoch": 4194} {"train_loss": -26.17105484008789, "global_step": 348120, "epoch": 4194} {"train_loss": -25.704450607299805, "global_step": 348121, "epoch": 4194} {"train_loss": -26.09339714050293, "global_step": 348122, "epoch": 4194} {"train_loss": -25.68179702758789, "global_step": 348123, "epoch": 4194} {"train_loss": -26.166278839111328, "global_step": 348124, "epoch": 4194} {"train_loss": -25.884180068969727, "global_step": 348125, "epoch": 4194} {"train_loss": -25.738943099975586, "global_step": 348126, "epoch": 4194} {"train_loss": -26.08194923400879, "global_step": 348127, "epoch": 4194} {"train_loss": -25.589426040649414, "global_step": 348128, "epoch": 4194} {"train_loss": -25.7907657623291, "global_step": 348129, "epoch": 4194} {"train_loss": -26.237539291381836, "global_step": 348130, "epoch": 4194} {"train_loss": -26.344547271728516, "global_step": 348131, "epoch": 4194} {"train_loss": -26.018903732299805, "global_step": 348132, "epoch": 4194} {"train_loss": -26.49173355102539, "global_step": 348133, "epoch": 4194} {"train_loss": -26.315231323242188, "global_step": 348134, "epoch": 4194} {"train_loss": -26.1621150970459, "global_step": 348135, "epoch": 4194} {"train_loss": -26.218774795532227, "global_step": 348136, "epoch": 4194} {"train_loss": -25.82105827331543, "global_step": 348137, "epoch": 4194} {"train_loss": -26.200763702392578, "global_step": 348138, "epoch": 4194} {"train_loss": -26.454599380493164, "global_step": 348139, "epoch": 4194} {"train_loss": -26.34278678894043, "global_step": 348140, "epoch": 4194} {"train_loss": -26.68868064880371, "global_step": 348141, "epoch": 4194} {"train_loss": -26.674184799194336, "global_step": 348142, "epoch": 4194} {"train_loss": -26.0948543548584, "global_step": 348143, "epoch": 4194} {"train_loss": -26.40266990661621, "global_step": 348144, "epoch": 4194} {"train_loss": -26.232324600219727, "global_step": 348145, "epoch": 4194} {"train_loss": -26.323368072509766, "global_step": 348146, "epoch": 4194} {"train_loss": -26.132787704467773, "global_step": 348147, "epoch": 4194} {"train_loss": -26.240705490112305, "global_step": 348148, "epoch": 4194} {"train_loss": -26.11261558532715, "global_step": 348149, "epoch": 4194} {"train_loss": -26.057947158813477, "global_step": 348150, "epoch": 4194} {"train_loss": -26.30327796936035, "global_step": 348151, "epoch": 4194} {"train_loss": -26.4184513092041, "global_step": 348152, "epoch": 4194} {"train_loss": -26.3067569732666, "global_step": 348153, "epoch": 4194} {"train_loss": -26.129638671875, "global_step": 348154, "epoch": 4194} {"train_loss": -26.29168128967285, "global_step": 348155, "epoch": 4194} {"train_loss": -26.584848403930664, "global_step": 348156, "epoch": 4194} {"train_loss": -26.185937881469727, "global_step": 348157, "epoch": 4194} {"train_loss": -26.26539421081543, "global_step": 348158, "epoch": 4194} {"train_loss": -26.5637264251709, "global_step": 348159, "epoch": 4194} {"train_loss": -26.474576950073242, "global_step": 348160, "epoch": 4194} {"train_loss": -26.210840225219727, "global_step": 348161, "epoch": 4194} {"train_loss": -26.475431442260742, "global_step": 348162, "epoch": 4194} {"train_loss": -25.976282119750977, "global_step": 348163, "epoch": 4194} {"train_loss": -26.17072868347168, "global_step": 348164, "epoch": 4194} {"train_loss": -26.16831398010254, "global_step": 348165, "epoch": 4194} {"train_loss": -26.31524085998535, "global_step": 348166, "epoch": 4194} {"train_loss": -26.371774673461914, "global_step": 348167, "epoch": 4194} {"train_loss": -25.992889404296875, "global_step": 348168, "epoch": 4194} {"train_loss": -26.18538475036621, "global_step": 348169, "epoch": 4194} {"train_loss": -26.125028610229492, "global_step": 348170, "epoch": 4194} {"train_loss": -25.8222713470459, "global_step": 348171, "epoch": 4194} {"train_loss": -25.665390014648438, "global_step": 348172, "epoch": 4194} {"train_loss": -25.76246452331543, "global_step": 348173, "epoch": 4194} {"train_loss": -26.119516372680664, "global_step": 348174, "epoch": 4194} {"train_loss": -26.29327392578125, "global_step": 348175, "epoch": 4194} {"train_loss": -26.182178497314453, "global_step": 348176, "epoch": 4194} {"train_loss": -26.03193473815918, "global_step": 348177, "epoch": 4194} {"train_loss": -25.997161865234375, "global_step": 348178, "epoch": 4194} {"train_loss": -26.17512321472168, "global_step": 348179, "epoch": 4194} {"train_loss": -26.306568145751953, "global_step": 348180, "epoch": 4194} {"train_loss": -26.405588150024414, "global_step": 348181, "epoch": 4194} {"train_loss": -26.3801326751709, "global_step": 348182, "epoch": 4194} {"train_loss": -26.1735782623291, "global_step": 348183, "epoch": 4194} {"train_loss": -26.142567255410803, "global_step": 348184, "epoch": 4194, "val_loss": 6718077.0} {"train_loss": -25.0413875579834, "global_step": 348185, "epoch": 4195} {"train_loss": -25.80677604675293, "global_step": 348186, "epoch": 4195} {"train_loss": -25.24786376953125, "global_step": 348187, "epoch": 4195} {"train_loss": -25.77850914001465, "global_step": 348188, "epoch": 4195} {"train_loss": -25.562829971313477, "global_step": 348189, "epoch": 4195} {"train_loss": -25.594396591186523, "global_step": 348190, "epoch": 4195} {"train_loss": -26.027196884155273, "global_step": 348191, "epoch": 4195} {"train_loss": -25.654211044311523, "global_step": 348192, "epoch": 4195} {"train_loss": -25.569135665893555, "global_step": 348193, "epoch": 4195} {"train_loss": -26.079877853393555, "global_step": 348194, "epoch": 4195} {"train_loss": -25.354745864868164, "global_step": 348195, "epoch": 4195} {"train_loss": -25.214353561401367, "global_step": 348196, "epoch": 4195} {"train_loss": -25.8549747467041, "global_step": 348197, "epoch": 4195} {"train_loss": -25.811187744140625, "global_step": 348198, "epoch": 4195} {"train_loss": -25.896209716796875, "global_step": 348199, "epoch": 4195} {"train_loss": -25.902917861938477, "global_step": 348200, "epoch": 4195} {"train_loss": -25.42496109008789, "global_step": 348201, "epoch": 4195} {"train_loss": -26.042455673217773, "global_step": 348202, "epoch": 4195} {"train_loss": -26.203760147094727, "global_step": 348203, "epoch": 4195} {"train_loss": -26.07074546813965, "global_step": 348204, "epoch": 4195} {"train_loss": -25.687070846557617, "global_step": 348205, "epoch": 4195} {"train_loss": -26.270843505859375, "global_step": 348206, "epoch": 4195} {"train_loss": -26.04131507873535, "global_step": 348207, "epoch": 4195} {"train_loss": -25.69985008239746, "global_step": 348208, "epoch": 4195} {"train_loss": -26.020498275756836, "global_step": 348209, "epoch": 4195} {"train_loss": -25.911787033081055, "global_step": 348210, "epoch": 4195} {"train_loss": -25.74080467224121, "global_step": 348211, "epoch": 4195} {"train_loss": -26.12385368347168, "global_step": 348212, "epoch": 4195} {"train_loss": -26.091962814331055, "global_step": 348213, "epoch": 4195} {"train_loss": -25.880908966064453, "global_step": 348214, "epoch": 4195} {"train_loss": -26.42169761657715, "global_step": 348215, "epoch": 4195} {"train_loss": -26.286584854125977, "global_step": 348216, "epoch": 4195} {"train_loss": -26.052183151245117, "global_step": 348217, "epoch": 4195} {"train_loss": -25.9279842376709, "global_step": 348218, "epoch": 4195} {"train_loss": -25.9997615814209, "global_step": 348219, "epoch": 4195} {"train_loss": -25.628747940063477, "global_step": 348220, "epoch": 4195} {"train_loss": -26.032062530517578, "global_step": 348221, "epoch": 4195} {"train_loss": -26.16983413696289, "global_step": 348222, "epoch": 4195} {"train_loss": -26.2069149017334, "global_step": 348223, "epoch": 4195} {"train_loss": -26.119577407836914, "global_step": 348224, "epoch": 4195} {"train_loss": -26.329389572143555, "global_step": 348225, "epoch": 4195} {"train_loss": -26.31732177734375, "global_step": 348226, "epoch": 4195} {"train_loss": -26.117904663085938, "global_step": 348227, "epoch": 4195} {"train_loss": -26.302459716796875, "global_step": 348228, "epoch": 4195} {"train_loss": -26.203144073486328, "global_step": 348229, "epoch": 4195} {"train_loss": -26.244985580444336, "global_step": 348230, "epoch": 4195} {"train_loss": -26.37489128112793, "global_step": 348231, "epoch": 4195} {"train_loss": -26.38263511657715, "global_step": 348232, "epoch": 4195} {"train_loss": -26.3438777923584, "global_step": 348233, "epoch": 4195} {"train_loss": -26.1617374420166, "global_step": 348234, "epoch": 4195} {"train_loss": -26.72474479675293, "global_step": 348235, "epoch": 4195} {"train_loss": -26.593048095703125, "global_step": 348236, "epoch": 4195} {"train_loss": -26.200824737548828, "global_step": 348237, "epoch": 4195} {"train_loss": -25.830005645751953, "global_step": 348238, "epoch": 4195} {"train_loss": -26.077198028564453, "global_step": 348239, "epoch": 4195} {"train_loss": -26.411884307861328, "global_step": 348240, "epoch": 4195} {"train_loss": -26.032794952392578, "global_step": 348241, "epoch": 4195} {"train_loss": -26.030187606811523, "global_step": 348242, "epoch": 4195} {"train_loss": -26.112579345703125, "global_step": 348243, "epoch": 4195} {"train_loss": -26.098745346069336, "global_step": 348244, "epoch": 4195} {"train_loss": -26.097797393798828, "global_step": 348245, "epoch": 4195} {"train_loss": -26.2590274810791, "global_step": 348246, "epoch": 4195} {"train_loss": -26.225229263305664, "global_step": 348247, "epoch": 4195} {"train_loss": -26.3178653717041, "global_step": 348248, "epoch": 4195} {"train_loss": -26.011154174804688, "global_step": 348249, "epoch": 4195} {"train_loss": -26.707401275634766, "global_step": 348250, "epoch": 4195} {"train_loss": -25.95344352722168, "global_step": 348251, "epoch": 4195} {"train_loss": -26.732410430908203, "global_step": 348252, "epoch": 4195} {"train_loss": -26.396146774291992, "global_step": 348253, "epoch": 4195} {"train_loss": -26.04541015625, "global_step": 348254, "epoch": 4195} {"train_loss": -26.2453556060791, "global_step": 348255, "epoch": 4195} {"train_loss": -26.153772354125977, "global_step": 348256, "epoch": 4195} {"train_loss": -26.2393741607666, "global_step": 348257, "epoch": 4195} {"train_loss": -26.10737419128418, "global_step": 348258, "epoch": 4195} {"train_loss": -25.93781852722168, "global_step": 348259, "epoch": 4195} {"train_loss": -26.09016990661621, "global_step": 348260, "epoch": 4195} {"train_loss": -26.07094383239746, "global_step": 348261, "epoch": 4195} {"train_loss": -26.232437133789062, "global_step": 348262, "epoch": 4195} {"train_loss": -26.369861602783203, "global_step": 348263, "epoch": 4195} {"train_loss": -26.353961944580078, "global_step": 348264, "epoch": 4195} {"train_loss": -26.413715362548828, "global_step": 348265, "epoch": 4195} {"train_loss": -26.31317710876465, "global_step": 348266, "epoch": 4195} {"train_loss": -26.056406940322326, "global_step": 348267, "epoch": 4195, "val_loss": 6666127.0} {"train_loss": -25.405569076538086, "global_step": 348268, "epoch": 4196} {"train_loss": -25.68665885925293, "global_step": 348269, "epoch": 4196} {"train_loss": -25.976993560791016, "global_step": 348270, "epoch": 4196} {"train_loss": -25.372461318969727, "global_step": 348271, "epoch": 4196} {"train_loss": -25.18769645690918, "global_step": 348272, "epoch": 4196} {"train_loss": -24.747282028198242, "global_step": 348273, "epoch": 4196} {"train_loss": -25.841232299804688, "global_step": 348274, "epoch": 4196} {"train_loss": -24.906156539916992, "global_step": 348275, "epoch": 4196} {"train_loss": -25.279809951782227, "global_step": 348276, "epoch": 4196} {"train_loss": -25.36765480041504, "global_step": 348277, "epoch": 4196} {"train_loss": -25.48837661743164, "global_step": 348278, "epoch": 4196} {"train_loss": -25.98451042175293, "global_step": 348279, "epoch": 4196} {"train_loss": -25.773853302001953, "global_step": 348280, "epoch": 4196} {"train_loss": -25.990686416625977, "global_step": 348281, "epoch": 4196} {"train_loss": -25.805768966674805, "global_step": 348282, "epoch": 4196} {"train_loss": -25.759729385375977, "global_step": 348283, "epoch": 4196} {"train_loss": -26.174795150756836, "global_step": 348284, "epoch": 4196} {"train_loss": -25.718353271484375, "global_step": 348285, "epoch": 4196} {"train_loss": -25.88880729675293, "global_step": 348286, "epoch": 4196} {"train_loss": -25.685382843017578, "global_step": 348287, "epoch": 4196} {"train_loss": -25.71832275390625, "global_step": 348288, "epoch": 4196} {"train_loss": -26.148975372314453, "global_step": 348289, "epoch": 4196} {"train_loss": -26.293018341064453, "global_step": 348290, "epoch": 4196} {"train_loss": -25.937681198120117, "global_step": 348291, "epoch": 4196} {"train_loss": -25.969297409057617, "global_step": 348292, "epoch": 4196} {"train_loss": -25.895999908447266, "global_step": 348293, "epoch": 4196} {"train_loss": -26.231836318969727, "global_step": 348294, "epoch": 4196} {"train_loss": -26.50726890563965, "global_step": 348295, "epoch": 4196} {"train_loss": -26.360340118408203, "global_step": 348296, "epoch": 4196} {"train_loss": -25.99907875061035, "global_step": 348297, "epoch": 4196} {"train_loss": -25.861160278320312, "global_step": 348298, "epoch": 4196} {"train_loss": -26.38848876953125, "global_step": 348299, "epoch": 4196} {"train_loss": -26.23920249938965, "global_step": 348300, "epoch": 4196} {"train_loss": -26.255659103393555, "global_step": 348301, "epoch": 4196} {"train_loss": -26.25275993347168, "global_step": 348302, "epoch": 4196} {"train_loss": -26.279285430908203, "global_step": 348303, "epoch": 4196} {"train_loss": -26.166152954101562, "global_step": 348304, "epoch": 4196} {"train_loss": -26.14629554748535, "global_step": 348305, "epoch": 4196} {"train_loss": -26.13140296936035, "global_step": 348306, "epoch": 4196} {"train_loss": -26.253803253173828, "global_step": 348307, "epoch": 4196} {"train_loss": -26.225011825561523, "global_step": 348308, "epoch": 4196} {"train_loss": -26.361637115478516, "global_step": 348309, "epoch": 4196} {"train_loss": -26.07794761657715, "global_step": 348310, "epoch": 4196} {"train_loss": -26.663991928100586, "global_step": 348311, "epoch": 4196} {"train_loss": -26.160537719726562, "global_step": 348312, "epoch": 4196} {"train_loss": -26.371618270874023, "global_step": 348313, "epoch": 4196} {"train_loss": -26.112524032592773, "global_step": 348314, "epoch": 4196} {"train_loss": -26.083227157592773, "global_step": 348315, "epoch": 4196} {"train_loss": -25.530759811401367, "global_step": 348316, "epoch": 4196} {"train_loss": -26.292394638061523, "global_step": 348317, "epoch": 4196} {"train_loss": -26.40620231628418, "global_step": 348318, "epoch": 4196} {"train_loss": -25.54372215270996, "global_step": 348319, "epoch": 4196} {"train_loss": -25.91737937927246, "global_step": 348320, "epoch": 4196} {"train_loss": -25.986997604370117, "global_step": 348321, "epoch": 4196} {"train_loss": -25.8842830657959, "global_step": 348322, "epoch": 4196} {"train_loss": -25.918262481689453, "global_step": 348323, "epoch": 4196} {"train_loss": -26.003971099853516, "global_step": 348324, "epoch": 4196} {"train_loss": -25.560476303100586, "global_step": 348325, "epoch": 4196} {"train_loss": -26.190885543823242, "global_step": 348326, "epoch": 4196} {"train_loss": -25.9622745513916, "global_step": 348327, "epoch": 4196} {"train_loss": -26.206024169921875, "global_step": 348328, "epoch": 4196} {"train_loss": -26.284515380859375, "global_step": 348329, "epoch": 4196} {"train_loss": -26.17057228088379, "global_step": 348330, "epoch": 4196} {"train_loss": -26.077686309814453, "global_step": 348331, "epoch": 4196} {"train_loss": -26.331708908081055, "global_step": 348332, "epoch": 4196} {"train_loss": -25.690908432006836, "global_step": 348333, "epoch": 4196} {"train_loss": -25.965274810791016, "global_step": 348334, "epoch": 4196} {"train_loss": -26.323455810546875, "global_step": 348335, "epoch": 4196} {"train_loss": -26.144886016845703, "global_step": 348336, "epoch": 4196} {"train_loss": -26.07193946838379, "global_step": 348337, "epoch": 4196} {"train_loss": -26.105451583862305, "global_step": 348338, "epoch": 4196} {"train_loss": -26.2544002532959, "global_step": 348339, "epoch": 4196} {"train_loss": -26.33186912536621, "global_step": 348340, "epoch": 4196} {"train_loss": -26.499242782592773, "global_step": 348341, "epoch": 4196} {"train_loss": -26.290790557861328, "global_step": 348342, "epoch": 4196} {"train_loss": -26.270105361938477, "global_step": 348343, "epoch": 4196} {"train_loss": -26.303607940673828, "global_step": 348344, "epoch": 4196} {"train_loss": -26.624982833862305, "global_step": 348345, "epoch": 4196} {"train_loss": -25.901845932006836, "global_step": 348346, "epoch": 4196} {"train_loss": -26.07374382019043, "global_step": 348347, "epoch": 4196} {"train_loss": -25.88791275024414, "global_step": 348348, "epoch": 4196} {"train_loss": -26.259801864624023, "global_step": 348349, "epoch": 4196} {"train_loss": -25.988122365560876, "global_step": 348350, "epoch": 4196, "val_loss": 6629579.5} {"train_loss": -25.291122436523438, "global_step": 348351, "epoch": 4197} {"train_loss": -25.517929077148438, "global_step": 348352, "epoch": 4197} {"train_loss": -25.540372848510742, "global_step": 348353, "epoch": 4197} {"train_loss": -25.601598739624023, "global_step": 348354, "epoch": 4197} {"train_loss": -25.495084762573242, "global_step": 348355, "epoch": 4197} {"train_loss": -25.570058822631836, "global_step": 348356, "epoch": 4197} {"train_loss": -25.631860733032227, "global_step": 348357, "epoch": 4197} {"train_loss": -25.53859519958496, "global_step": 348358, "epoch": 4197} {"train_loss": -25.79306411743164, "global_step": 348359, "epoch": 4197} {"train_loss": -25.707006454467773, "global_step": 348360, "epoch": 4197} {"train_loss": -25.817554473876953, "global_step": 348361, "epoch": 4197} {"train_loss": -25.6728572845459, "global_step": 348362, "epoch": 4197} {"train_loss": -25.6896915435791, "global_step": 348363, "epoch": 4197} {"train_loss": -25.94915771484375, "global_step": 348364, "epoch": 4197} {"train_loss": -26.085479736328125, "global_step": 348365, "epoch": 4197} {"train_loss": -26.110570907592773, "global_step": 348366, "epoch": 4197} {"train_loss": -25.788623809814453, "global_step": 348367, "epoch": 4197} {"train_loss": -25.63588523864746, "global_step": 348368, "epoch": 4197} {"train_loss": -25.937185287475586, "global_step": 348369, "epoch": 4197} {"train_loss": -25.67957878112793, "global_step": 348370, "epoch": 4197} {"train_loss": -25.626867294311523, "global_step": 348371, "epoch": 4197} {"train_loss": -25.669921875, "global_step": 348372, "epoch": 4197} {"train_loss": -26.109638214111328, "global_step": 348373, "epoch": 4197} {"train_loss": -25.88873863220215, "global_step": 348374, "epoch": 4197} {"train_loss": -25.920196533203125, "global_step": 348375, "epoch": 4197} {"train_loss": -26.016571044921875, "global_step": 348376, "epoch": 4197} {"train_loss": -26.145313262939453, "global_step": 348377, "epoch": 4197} {"train_loss": -25.640079498291016, "global_step": 348378, "epoch": 4197} {"train_loss": -25.878143310546875, "global_step": 348379, "epoch": 4197} {"train_loss": -25.949731826782227, "global_step": 348380, "epoch": 4197} {"train_loss": -26.345605850219727, "global_step": 348381, "epoch": 4197} {"train_loss": -25.936145782470703, "global_step": 348382, "epoch": 4197} {"train_loss": -26.33167839050293, "global_step": 348383, "epoch": 4197} {"train_loss": -26.325687408447266, "global_step": 348384, "epoch": 4197} {"train_loss": -25.87289810180664, "global_step": 348385, "epoch": 4197} {"train_loss": -26.38909912109375, "global_step": 348386, "epoch": 4197} {"train_loss": -25.758352279663086, "global_step": 348387, "epoch": 4197} {"train_loss": -26.066919326782227, "global_step": 348388, "epoch": 4197} {"train_loss": -26.11702537536621, "global_step": 348389, "epoch": 4197} {"train_loss": -26.29545021057129, "global_step": 348390, "epoch": 4197} {"train_loss": -26.3275146484375, "global_step": 348391, "epoch": 4197} {"train_loss": -26.072290420532227, "global_step": 348392, "epoch": 4197} {"train_loss": -26.278766632080078, "global_step": 348393, "epoch": 4197} {"train_loss": -26.37060546875, "global_step": 348394, "epoch": 4197} {"train_loss": -26.262678146362305, "global_step": 348395, "epoch": 4197} {"train_loss": -26.383747100830078, "global_step": 348396, "epoch": 4197} {"train_loss": -26.173709869384766, "global_step": 348397, "epoch": 4197} {"train_loss": -26.38362693786621, "global_step": 348398, "epoch": 4197} {"train_loss": -26.17188835144043, "global_step": 348399, "epoch": 4197} {"train_loss": -26.550580978393555, "global_step": 348400, "epoch": 4197} {"train_loss": -26.12689781188965, "global_step": 348401, "epoch": 4197} {"train_loss": -25.72761344909668, "global_step": 348402, "epoch": 4197} {"train_loss": -26.463788986206055, "global_step": 348403, "epoch": 4197} {"train_loss": -25.941648483276367, "global_step": 348404, "epoch": 4197} {"train_loss": -26.15363883972168, "global_step": 348405, "epoch": 4197} {"train_loss": -26.40064811706543, "global_step": 348406, "epoch": 4197} {"train_loss": -26.284290313720703, "global_step": 348407, "epoch": 4197} {"train_loss": -26.21906089782715, "global_step": 348408, "epoch": 4197} {"train_loss": -26.50736427307129, "global_step": 348409, "epoch": 4197} {"train_loss": -26.079421997070312, "global_step": 348410, "epoch": 4197} {"train_loss": -26.593048095703125, "global_step": 348411, "epoch": 4197} {"train_loss": -26.146284103393555, "global_step": 348412, "epoch": 4197} {"train_loss": -26.301929473876953, "global_step": 348413, "epoch": 4197} {"train_loss": -26.232873916625977, "global_step": 348414, "epoch": 4197} {"train_loss": -25.883941650390625, "global_step": 348415, "epoch": 4197} {"train_loss": -25.936853408813477, "global_step": 348416, "epoch": 4197} {"train_loss": -26.222631454467773, "global_step": 348417, "epoch": 4197} {"train_loss": -26.123554229736328, "global_step": 348418, "epoch": 4197} {"train_loss": -26.463531494140625, "global_step": 348419, "epoch": 4197} {"train_loss": -26.583099365234375, "global_step": 348420, "epoch": 4197} {"train_loss": -26.587860107421875, "global_step": 348421, "epoch": 4197} {"train_loss": -26.308237075805664, "global_step": 348422, "epoch": 4197} {"train_loss": -26.114099502563477, "global_step": 348423, "epoch": 4197} {"train_loss": -25.849958419799805, "global_step": 348424, "epoch": 4197} {"train_loss": -26.264719009399414, "global_step": 348425, "epoch": 4197} {"train_loss": -26.16578483581543, "global_step": 348426, "epoch": 4197} {"train_loss": -25.636693954467773, "global_step": 348427, "epoch": 4197} {"train_loss": -26.030872344970703, "global_step": 348428, "epoch": 4197} {"train_loss": -26.622106552124023, "global_step": 348429, "epoch": 4197} {"train_loss": -26.497211456298828, "global_step": 348430, "epoch": 4197} {"train_loss": -26.00337791442871, "global_step": 348431, "epoch": 4197} {"train_loss": -26.1804141998291, "global_step": 348432, "epoch": 4197} {"train_loss": -26.051855156220586, "global_step": 348433, "epoch": 4197, "val_loss": 6754207.5} {"train_loss": -25.556888580322266, "global_step": 348434, "epoch": 4198} {"train_loss": -25.305845260620117, "global_step": 348435, "epoch": 4198} {"train_loss": -25.465999603271484, "global_step": 348436, "epoch": 4198} {"train_loss": -25.606855392456055, "global_step": 348437, "epoch": 4198} {"train_loss": -25.63770866394043, "global_step": 348438, "epoch": 4198} {"train_loss": -25.671802520751953, "global_step": 348439, "epoch": 4198} {"train_loss": -25.77210807800293, "global_step": 348440, "epoch": 4198} {"train_loss": -25.95941162109375, "global_step": 348441, "epoch": 4198} {"train_loss": -25.773725509643555, "global_step": 348442, "epoch": 4198} {"train_loss": -25.70094108581543, "global_step": 348443, "epoch": 4198} {"train_loss": -25.718048095703125, "global_step": 348444, "epoch": 4198} {"train_loss": -25.878095626831055, "global_step": 348445, "epoch": 4198} {"train_loss": -26.2061824798584, "global_step": 348446, "epoch": 4198} {"train_loss": -25.574506759643555, "global_step": 348447, "epoch": 4198} {"train_loss": -25.836212158203125, "global_step": 348448, "epoch": 4198} {"train_loss": -25.941492080688477, "global_step": 348449, "epoch": 4198} {"train_loss": -25.34256362915039, "global_step": 348450, "epoch": 4198} {"train_loss": -25.60232925415039, "global_step": 348451, "epoch": 4198} {"train_loss": -25.983789443969727, "global_step": 348452, "epoch": 4198} {"train_loss": -25.466976165771484, "global_step": 348453, "epoch": 4198} {"train_loss": -26.146289825439453, "global_step": 348454, "epoch": 4198} {"train_loss": -25.932403564453125, "global_step": 348455, "epoch": 4198} {"train_loss": -26.091466903686523, "global_step": 348456, "epoch": 4198} {"train_loss": -26.152185440063477, "global_step": 348457, "epoch": 4198} {"train_loss": -26.200275421142578, "global_step": 348458, "epoch": 4198} {"train_loss": -25.72998046875, "global_step": 348459, "epoch": 4198} {"train_loss": -26.09382438659668, "global_step": 348460, "epoch": 4198} {"train_loss": -25.945966720581055, "global_step": 348461, "epoch": 4198} {"train_loss": -25.876585006713867, "global_step": 348462, "epoch": 4198} {"train_loss": -26.30518913269043, "global_step": 348463, "epoch": 4198} {"train_loss": -26.458423614501953, "global_step": 348464, "epoch": 4198} {"train_loss": -26.1453914642334, "global_step": 348465, "epoch": 4198} {"train_loss": -26.645700454711914, "global_step": 348466, "epoch": 4198} {"train_loss": -26.721908569335938, "global_step": 348467, "epoch": 4198} {"train_loss": -26.17959976196289, "global_step": 348468, "epoch": 4198} {"train_loss": -26.167234420776367, "global_step": 348469, "epoch": 4198} {"train_loss": -26.14702796936035, "global_step": 348470, "epoch": 4198} {"train_loss": -26.229394912719727, "global_step": 348471, "epoch": 4198} {"train_loss": -26.714569091796875, "global_step": 348472, "epoch": 4198} {"train_loss": -26.54969596862793, "global_step": 348473, "epoch": 4198} {"train_loss": -26.195775985717773, "global_step": 348474, "epoch": 4198} {"train_loss": -26.234678268432617, "global_step": 348475, "epoch": 4198} {"train_loss": -26.311634063720703, "global_step": 348476, "epoch": 4198} {"train_loss": -26.227415084838867, "global_step": 348477, "epoch": 4198} {"train_loss": -26.437061309814453, "global_step": 348478, "epoch": 4198} {"train_loss": -26.426984786987305, "global_step": 348479, "epoch": 4198} {"train_loss": -25.952590942382812, "global_step": 348480, "epoch": 4198} {"train_loss": -26.479644775390625, "global_step": 348481, "epoch": 4198} {"train_loss": -25.97226905822754, "global_step": 348482, "epoch": 4198} {"train_loss": -26.451642990112305, "global_step": 348483, "epoch": 4198} {"train_loss": -26.006744384765625, "global_step": 348484, "epoch": 4198} {"train_loss": -25.97481346130371, "global_step": 348485, "epoch": 4198} {"train_loss": -25.286718368530273, "global_step": 348486, "epoch": 4198} {"train_loss": -24.477569580078125, "global_step": 348487, "epoch": 4198} {"train_loss": -23.5131778717041, "global_step": 348488, "epoch": 4198} {"train_loss": -24.976003646850586, "global_step": 348489, "epoch": 4198} {"train_loss": -25.239164352416992, "global_step": 348490, "epoch": 4198} {"train_loss": -25.61930274963379, "global_step": 348491, "epoch": 4198} {"train_loss": -24.6862735748291, "global_step": 348492, "epoch": 4198} {"train_loss": -25.614120483398438, "global_step": 348493, "epoch": 4198} {"train_loss": -25.023435592651367, "global_step": 348494, "epoch": 4198} {"train_loss": -25.81134605407715, "global_step": 348495, "epoch": 4198} {"train_loss": -25.22662353515625, "global_step": 348496, "epoch": 4198} {"train_loss": -25.651025772094727, "global_step": 348497, "epoch": 4198} {"train_loss": -25.73053550720215, "global_step": 348498, "epoch": 4198} {"train_loss": -25.498533248901367, "global_step": 348499, "epoch": 4198} {"train_loss": -25.584125518798828, "global_step": 348500, "epoch": 4198} {"train_loss": -25.65156364440918, "global_step": 348501, "epoch": 4198} {"train_loss": -25.976293563842773, "global_step": 348502, "epoch": 4198} {"train_loss": -25.9348087310791, "global_step": 348503, "epoch": 4198} {"train_loss": -25.633054733276367, "global_step": 348504, "epoch": 4198} {"train_loss": -25.563594818115234, "global_step": 348505, "epoch": 4198} {"train_loss": -25.991296768188477, "global_step": 348506, "epoch": 4198} {"train_loss": -25.813074111938477, "global_step": 348507, "epoch": 4198} {"train_loss": -25.979053497314453, "global_step": 348508, "epoch": 4198} {"train_loss": -25.76642417907715, "global_step": 348509, "epoch": 4198} {"train_loss": -25.7982234954834, "global_step": 348510, "epoch": 4198} {"train_loss": -25.621814727783203, "global_step": 348511, "epoch": 4198} {"train_loss": -25.775033950805664, "global_step": 348512, "epoch": 4198} {"train_loss": -25.94618034362793, "global_step": 348513, "epoch": 4198} {"train_loss": -26.29681968688965, "global_step": 348514, "epoch": 4198} {"train_loss": -26.36037254333496, "global_step": 348515, "epoch": 4198} {"train_loss": -25.852245767432525, "global_step": 348516, "epoch": 4198, "val_loss": 6761462.0} {"train_loss": -26.17597007751465, "global_step": 348517, "epoch": 4199} {"train_loss": -25.905338287353516, "global_step": 348518, "epoch": 4199} {"train_loss": -26.268177032470703, "global_step": 348519, "epoch": 4199} {"train_loss": -26.088306427001953, "global_step": 348520, "epoch": 4199} {"train_loss": -25.751205444335938, "global_step": 348521, "epoch": 4199} {"train_loss": -25.810094833374023, "global_step": 348522, "epoch": 4199} {"train_loss": -26.0294132232666, "global_step": 348523, "epoch": 4199} {"train_loss": -25.789203643798828, "global_step": 348524, "epoch": 4199} {"train_loss": -26.138635635375977, "global_step": 348525, "epoch": 4199} {"train_loss": -26.12641716003418, "global_step": 348526, "epoch": 4199} {"train_loss": -25.63446044921875, "global_step": 348527, "epoch": 4199} {"train_loss": -25.813526153564453, "global_step": 348528, "epoch": 4199} {"train_loss": -25.59736442565918, "global_step": 348529, "epoch": 4199} {"train_loss": -25.8955078125, "global_step": 348530, "epoch": 4199} {"train_loss": -26.031753540039062, "global_step": 348531, "epoch": 4199} {"train_loss": -26.112756729125977, "global_step": 348532, "epoch": 4199} {"train_loss": -26.34149742126465, "global_step": 348533, "epoch": 4199} {"train_loss": -25.86016273498535, "global_step": 348534, "epoch": 4199} {"train_loss": -26.208703994750977, "global_step": 348535, "epoch": 4199} {"train_loss": -25.831939697265625, "global_step": 348536, "epoch": 4199} {"train_loss": -26.368127822875977, "global_step": 348537, "epoch": 4199} {"train_loss": -25.77473258972168, "global_step": 348538, "epoch": 4199} {"train_loss": -26.07691764831543, "global_step": 348539, "epoch": 4199} {"train_loss": -25.827472686767578, "global_step": 348540, "epoch": 4199} {"train_loss": -26.024824142456055, "global_step": 348541, "epoch": 4199} {"train_loss": -26.399580001831055, "global_step": 348542, "epoch": 4199} {"train_loss": -26.145719528198242, "global_step": 348543, "epoch": 4199} {"train_loss": -26.117895126342773, "global_step": 348544, "epoch": 4199} {"train_loss": -26.320459365844727, "global_step": 348545, "epoch": 4199} {"train_loss": -25.92340660095215, "global_step": 348546, "epoch": 4199} {"train_loss": -26.056415557861328, "global_step": 348547, "epoch": 4199} {"train_loss": -26.05695152282715, "global_step": 348548, "epoch": 4199} {"train_loss": -26.19281005859375, "global_step": 348549, "epoch": 4199} {"train_loss": -25.98615074157715, "global_step": 348550, "epoch": 4199} {"train_loss": -25.650054931640625, "global_step": 348551, "epoch": 4199} {"train_loss": -26.17579460144043, "global_step": 348552, "epoch": 4199} {"train_loss": -25.94927406311035, "global_step": 348553, "epoch": 4199} {"train_loss": -26.154529571533203, "global_step": 348554, "epoch": 4199} {"train_loss": -26.054767608642578, "global_step": 348555, "epoch": 4199} {"train_loss": -26.13117790222168, "global_step": 348556, "epoch": 4199} {"train_loss": -26.132984161376953, "global_step": 348557, "epoch": 4199} {"train_loss": -26.50958251953125, "global_step": 348558, "epoch": 4199} {"train_loss": -26.461694717407227, "global_step": 348559, "epoch": 4199} {"train_loss": -26.224767684936523, "global_step": 348560, "epoch": 4199} {"train_loss": -26.394775390625, "global_step": 348561, "epoch": 4199} {"train_loss": -26.264944076538086, "global_step": 348562, "epoch": 4199} {"train_loss": -26.259912490844727, "global_step": 348563, "epoch": 4199} {"train_loss": -26.2761173248291, "global_step": 348564, "epoch": 4199} {"train_loss": -26.269168853759766, "global_step": 348565, "epoch": 4199} {"train_loss": -26.06374168395996, "global_step": 348566, "epoch": 4199} {"train_loss": -26.58786964416504, "global_step": 348567, "epoch": 4199} {"train_loss": -26.295385360717773, "global_step": 348568, "epoch": 4199} {"train_loss": -26.06416130065918, "global_step": 348569, "epoch": 4199} {"train_loss": -26.233163833618164, "global_step": 348570, "epoch": 4199} {"train_loss": -26.28553581237793, "global_step": 348571, "epoch": 4199} {"train_loss": -26.256702423095703, "global_step": 348572, "epoch": 4199} {"train_loss": -26.69233512878418, "global_step": 348573, "epoch": 4199} {"train_loss": -26.314496994018555, "global_step": 348574, "epoch": 4199} {"train_loss": -26.64896583557129, "global_step": 348575, "epoch": 4199} {"train_loss": -25.818058013916016, "global_step": 348576, "epoch": 4199} {"train_loss": -25.926773071289062, "global_step": 348577, "epoch": 4199} {"train_loss": -25.94544792175293, "global_step": 348578, "epoch": 4199} {"train_loss": -25.656370162963867, "global_step": 348579, "epoch": 4199} {"train_loss": -25.88374900817871, "global_step": 348580, "epoch": 4199} {"train_loss": -26.22144889831543, "global_step": 348581, "epoch": 4199} {"train_loss": -25.966659545898438, "global_step": 348582, "epoch": 4199} {"train_loss": -25.601154327392578, "global_step": 348583, "epoch": 4199} {"train_loss": -25.237796783447266, "global_step": 348584, "epoch": 4199} {"train_loss": -26.15297508239746, "global_step": 348585, "epoch": 4199} {"train_loss": -26.28485107421875, "global_step": 348586, "epoch": 4199} {"train_loss": -25.248563766479492, "global_step": 348587, "epoch": 4199} {"train_loss": -25.907012939453125, "global_step": 348588, "epoch": 4199} {"train_loss": -25.8615665435791, "global_step": 348589, "epoch": 4199} {"train_loss": -25.730289459228516, "global_step": 348590, "epoch": 4199} {"train_loss": -26.037952423095703, "global_step": 348591, "epoch": 4199} {"train_loss": -25.87933921813965, "global_step": 348592, "epoch": 4199} {"train_loss": -26.142343521118164, "global_step": 348593, "epoch": 4199} {"train_loss": -26.0889949798584, "global_step": 348594, "epoch": 4199} {"train_loss": -25.864084243774414, "global_step": 348595, "epoch": 4199} {"train_loss": -26.142541885375977, "global_step": 348596, "epoch": 4199} {"train_loss": -26.529077529907227, "global_step": 348597, "epoch": 4199} {"train_loss": -25.927846908569336, "global_step": 348598, "epoch": 4199} {"train_loss": -26.070599245737835, "global_step": 348599, "epoch": 4199, "val_loss": 6680762.0} {"train_loss": -25.731781005859375, "global_step": 348600, "epoch": 4200} {"train_loss": -25.86665153503418, "global_step": 348601, "epoch": 4200} {"train_loss": -25.866107940673828, "global_step": 348602, "epoch": 4200} {"train_loss": -25.783384323120117, "global_step": 348603, "epoch": 4200} {"train_loss": -25.88525390625, "global_step": 348604, "epoch": 4200} {"train_loss": -25.838653564453125, "global_step": 348605, "epoch": 4200} {"train_loss": -25.842206954956055, "global_step": 348606, "epoch": 4200} {"train_loss": -25.987701416015625, "global_step": 348607, "epoch": 4200} {"train_loss": -25.77423095703125, "global_step": 348608, "epoch": 4200} {"train_loss": -25.919897079467773, "global_step": 348609, "epoch": 4200} {"train_loss": -25.93999671936035, "global_step": 348610, "epoch": 4200} {"train_loss": -25.638702392578125, "global_step": 348611, "epoch": 4200} {"train_loss": -25.921125411987305, "global_step": 348612, "epoch": 4200} {"train_loss": -25.926427841186523, "global_step": 348613, "epoch": 4200} {"train_loss": -26.108386993408203, "global_step": 348614, "epoch": 4200} {"train_loss": -25.992298126220703, "global_step": 348615, "epoch": 4200} {"train_loss": -26.210376739501953, "global_step": 348616, "epoch": 4200} {"train_loss": -26.301233291625977, "global_step": 348617, "epoch": 4200} {"train_loss": -26.392576217651367, "global_step": 348618, "epoch": 4200} {"train_loss": -26.02088737487793, "global_step": 348619, "epoch": 4200} {"train_loss": -25.912506103515625, "global_step": 348620, "epoch": 4200} {"train_loss": -25.797266006469727, "global_step": 348621, "epoch": 4200} {"train_loss": -26.045413970947266, "global_step": 348622, "epoch": 4200} {"train_loss": -26.15839958190918, "global_step": 348623, "epoch": 4200} {"train_loss": -26.25831413269043, "global_step": 348624, "epoch": 4200} {"train_loss": -26.049774169921875, "global_step": 348625, "epoch": 4200} {"train_loss": -26.090749740600586, "global_step": 348626, "epoch": 4200} {"train_loss": -25.880508422851562, "global_step": 348627, "epoch": 4200} {"train_loss": -26.319873809814453, "global_step": 348628, "epoch": 4200} {"train_loss": -26.012775421142578, "global_step": 348629, "epoch": 4200} {"train_loss": -26.244104385375977, "global_step": 348630, "epoch": 4200} {"train_loss": -26.589344024658203, "global_step": 348631, "epoch": 4200} {"train_loss": -26.436994552612305, "global_step": 348632, "epoch": 4200} {"train_loss": -26.490421295166016, "global_step": 348633, "epoch": 4200} {"train_loss": -26.31452751159668, "global_step": 348634, "epoch": 4200} {"train_loss": -26.36219596862793, "global_step": 348635, "epoch": 4200} {"train_loss": -26.152875900268555, "global_step": 348636, "epoch": 4200} {"train_loss": -26.183765411376953, "global_step": 348637, "epoch": 4200} {"train_loss": -26.53426170349121, "global_step": 348638, "epoch": 4200} {"train_loss": -26.457401275634766, "global_step": 348639, "epoch": 4200} {"train_loss": -25.97498893737793, "global_step": 348640, "epoch": 4200} {"train_loss": -26.6513729095459, "global_step": 348641, "epoch": 4200} {"train_loss": -26.74513053894043, "global_step": 348642, "epoch": 4200} {"train_loss": -25.874479293823242, "global_step": 348643, "epoch": 4200} {"train_loss": -26.604019165039062, "global_step": 348644, "epoch": 4200} {"train_loss": -26.256444931030273, "global_step": 348645, "epoch": 4200} {"train_loss": -26.284772872924805, "global_step": 348646, "epoch": 4200} {"train_loss": -26.38343620300293, "global_step": 348647, "epoch": 4200} {"train_loss": -26.30224609375, "global_step": 348648, "epoch": 4200} {"train_loss": -26.399734497070312, "global_step": 348649, "epoch": 4200} {"train_loss": -26.517868041992188, "global_step": 348650, "epoch": 4200} {"train_loss": -26.18987464904785, "global_step": 348651, "epoch": 4200} {"train_loss": -26.353857040405273, "global_step": 348652, "epoch": 4200} {"train_loss": -25.826644897460938, "global_step": 348653, "epoch": 4200} {"train_loss": -26.480640411376953, "global_step": 348654, "epoch": 4200} {"train_loss": -26.113611221313477, "global_step": 348655, "epoch": 4200} {"train_loss": -26.06373405456543, "global_step": 348656, "epoch": 4200} {"train_loss": -26.247817993164062, "global_step": 348657, "epoch": 4200} {"train_loss": -26.031103134155273, "global_step": 348658, "epoch": 4200} {"train_loss": -26.095178604125977, "global_step": 348659, "epoch": 4200} {"train_loss": -26.001407623291016, "global_step": 348660, "epoch": 4200} {"train_loss": -26.183584213256836, "global_step": 348661, "epoch": 4200} {"train_loss": -25.680734634399414, "global_step": 348662, "epoch": 4200} {"train_loss": -25.769071578979492, "global_step": 348663, "epoch": 4200} {"train_loss": -26.28792381286621, "global_step": 348664, "epoch": 4200} {"train_loss": -26.4288330078125, "global_step": 348665, "epoch": 4200} {"train_loss": -26.441747665405273, "global_step": 348666, "epoch": 4200} {"train_loss": -26.06178855895996, "global_step": 348667, "epoch": 4200} {"train_loss": -26.472929000854492, "global_step": 348668, "epoch": 4200} {"train_loss": -26.142887115478516, "global_step": 348669, "epoch": 4200} {"train_loss": -26.03876304626465, "global_step": 348670, "epoch": 4200} {"train_loss": -26.10908317565918, "global_step": 348671, "epoch": 4200} {"train_loss": -26.04599380493164, "global_step": 348672, "epoch": 4200} {"train_loss": -25.840024948120117, "global_step": 348673, "epoch": 4200} {"train_loss": -26.41704750061035, "global_step": 348674, "epoch": 4200} {"train_loss": -25.80096435546875, "global_step": 348675, "epoch": 4200} {"train_loss": -26.181203842163086, "global_step": 348676, "epoch": 4200} {"train_loss": -26.096338272094727, "global_step": 348677, "epoch": 4200} {"train_loss": -25.800519943237305, "global_step": 348678, "epoch": 4200} {"train_loss": -26.044803619384766, "global_step": 348679, "epoch": 4200} {"train_loss": -26.0180721282959, "global_step": 348680, "epoch": 4200} {"train_loss": -26.05605125427246, "global_step": 348681, "epoch": 4200} {"train_loss": -26.136013536568147, "global_step": 348682, "epoch": 4200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6716359.0} {"train_loss": -25.352231979370117, "global_step": 348683, "epoch": 4201} {"train_loss": -25.814855575561523, "global_step": 348684, "epoch": 4201} {"train_loss": -25.383155822753906, "global_step": 348685, "epoch": 4201} {"train_loss": -25.678510665893555, "global_step": 348686, "epoch": 4201} {"train_loss": -25.82858657836914, "global_step": 348687, "epoch": 4201} {"train_loss": -25.60947608947754, "global_step": 348688, "epoch": 4201} {"train_loss": -25.142303466796875, "global_step": 348689, "epoch": 4201} {"train_loss": -25.782577514648438, "global_step": 348690, "epoch": 4201} {"train_loss": -25.715845108032227, "global_step": 348691, "epoch": 4201} {"train_loss": -25.91912841796875, "global_step": 348692, "epoch": 4201} {"train_loss": -25.834508895874023, "global_step": 348693, "epoch": 4201} {"train_loss": -25.59885597229004, "global_step": 348694, "epoch": 4201} {"train_loss": -26.043981552124023, "global_step": 348695, "epoch": 4201} {"train_loss": -25.846555709838867, "global_step": 348696, "epoch": 4201} {"train_loss": -25.550504684448242, "global_step": 348697, "epoch": 4201} {"train_loss": -25.97955322265625, "global_step": 348698, "epoch": 4201} {"train_loss": -25.84468650817871, "global_step": 348699, "epoch": 4201} {"train_loss": -25.98335075378418, "global_step": 348700, "epoch": 4201} {"train_loss": -25.627044677734375, "global_step": 348701, "epoch": 4201} {"train_loss": -25.793888092041016, "global_step": 348702, "epoch": 4201} {"train_loss": -25.835830688476562, "global_step": 348703, "epoch": 4201} {"train_loss": -26.34978675842285, "global_step": 348704, "epoch": 4201} {"train_loss": -26.135950088500977, "global_step": 348705, "epoch": 4201} {"train_loss": -25.856021881103516, "global_step": 348706, "epoch": 4201} {"train_loss": -26.176252365112305, "global_step": 348707, "epoch": 4201} {"train_loss": -26.08808708190918, "global_step": 348708, "epoch": 4201} {"train_loss": -25.881900787353516, "global_step": 348709, "epoch": 4201} {"train_loss": -26.407297134399414, "global_step": 348710, "epoch": 4201} {"train_loss": -26.286258697509766, "global_step": 348711, "epoch": 4201} {"train_loss": -26.540393829345703, "global_step": 348712, "epoch": 4201} {"train_loss": -25.918079376220703, "global_step": 348713, "epoch": 4201} {"train_loss": -26.018579483032227, "global_step": 348714, "epoch": 4201} {"train_loss": -26.475061416625977, "global_step": 348715, "epoch": 4201} {"train_loss": -25.824426651000977, "global_step": 348716, "epoch": 4201} {"train_loss": -26.141265869140625, "global_step": 348717, "epoch": 4201} {"train_loss": -26.253192901611328, "global_step": 348718, "epoch": 4201} {"train_loss": -26.06610107421875, "global_step": 348719, "epoch": 4201} {"train_loss": -26.35443115234375, "global_step": 348720, "epoch": 4201} {"train_loss": -26.34035301208496, "global_step": 348721, "epoch": 4201} {"train_loss": -26.12754249572754, "global_step": 348722, "epoch": 4201} {"train_loss": -25.9927921295166, "global_step": 348723, "epoch": 4201} {"train_loss": -26.288440704345703, "global_step": 348724, "epoch": 4201} {"train_loss": -26.395984649658203, "global_step": 348725, "epoch": 4201} {"train_loss": -26.192983627319336, "global_step": 348726, "epoch": 4201} {"train_loss": -26.272506713867188, "global_step": 348727, "epoch": 4201} {"train_loss": -26.32355308532715, "global_step": 348728, "epoch": 4201} {"train_loss": -26.301116943359375, "global_step": 348729, "epoch": 4201} {"train_loss": -26.165403366088867, "global_step": 348730, "epoch": 4201} {"train_loss": -25.730457305908203, "global_step": 348731, "epoch": 4201} {"train_loss": -25.926313400268555, "global_step": 348732, "epoch": 4201} {"train_loss": -26.363956451416016, "global_step": 348733, "epoch": 4201} {"train_loss": -25.900192260742188, "global_step": 348734, "epoch": 4201} {"train_loss": -25.64914894104004, "global_step": 348735, "epoch": 4201} {"train_loss": -25.960540771484375, "global_step": 348736, "epoch": 4201} {"train_loss": -26.213647842407227, "global_step": 348737, "epoch": 4201} {"train_loss": -26.351364135742188, "global_step": 348738, "epoch": 4201} {"train_loss": -26.117124557495117, "global_step": 348739, "epoch": 4201} {"train_loss": -26.064794540405273, "global_step": 348740, "epoch": 4201} {"train_loss": -26.27384376525879, "global_step": 348741, "epoch": 4201} {"train_loss": -26.206363677978516, "global_step": 348742, "epoch": 4201} {"train_loss": -26.368127822875977, "global_step": 348743, "epoch": 4201} {"train_loss": -26.300994873046875, "global_step": 348744, "epoch": 4201} {"train_loss": -26.08536720275879, "global_step": 348745, "epoch": 4201} {"train_loss": -26.12886619567871, "global_step": 348746, "epoch": 4201} {"train_loss": -26.089038848876953, "global_step": 348747, "epoch": 4201} {"train_loss": -26.367084503173828, "global_step": 348748, "epoch": 4201} {"train_loss": -26.635644912719727, "global_step": 348749, "epoch": 4201} {"train_loss": -26.22463035583496, "global_step": 348750, "epoch": 4201} {"train_loss": -26.353290557861328, "global_step": 348751, "epoch": 4201} {"train_loss": -26.637317657470703, "global_step": 348752, "epoch": 4201} {"train_loss": -26.367345809936523, "global_step": 348753, "epoch": 4201} {"train_loss": -26.270395278930664, "global_step": 348754, "epoch": 4201} {"train_loss": -26.286548614501953, "global_step": 348755, "epoch": 4201} {"train_loss": -26.5173397064209, "global_step": 348756, "epoch": 4201} {"train_loss": -26.013498306274414, "global_step": 348757, "epoch": 4201} {"train_loss": -26.539398193359375, "global_step": 348758, "epoch": 4201} {"train_loss": -26.411224365234375, "global_step": 348759, "epoch": 4201} {"train_loss": -26.173383712768555, "global_step": 348760, "epoch": 4201} {"train_loss": -26.319324493408203, "global_step": 348761, "epoch": 4201} {"train_loss": -26.49492835998535, "global_step": 348762, "epoch": 4201} {"train_loss": -26.316970825195312, "global_step": 348763, "epoch": 4201} {"train_loss": -26.279422760009766, "global_step": 348764, "epoch": 4201} {"train_loss": -26.113043957445996, "global_step": 348765, "epoch": 4201, "val_loss": 6798440.0} {"train_loss": -25.748010635375977, "global_step": 348766, "epoch": 4202} {"train_loss": -26.1422176361084, "global_step": 348767, "epoch": 4202} {"train_loss": -25.84686851501465, "global_step": 348768, "epoch": 4202} {"train_loss": -25.676843643188477, "global_step": 348769, "epoch": 4202} {"train_loss": -25.394086837768555, "global_step": 348770, "epoch": 4202} {"train_loss": -25.592866897583008, "global_step": 348771, "epoch": 4202} {"train_loss": -25.13285255432129, "global_step": 348772, "epoch": 4202} {"train_loss": -25.895788192749023, "global_step": 348773, "epoch": 4202} {"train_loss": -25.862899780273438, "global_step": 348774, "epoch": 4202} {"train_loss": -25.7349796295166, "global_step": 348775, "epoch": 4202} {"train_loss": -25.842321395874023, "global_step": 348776, "epoch": 4202} {"train_loss": -25.674482345581055, "global_step": 348777, "epoch": 4202} {"train_loss": -25.77581214904785, "global_step": 348778, "epoch": 4202} {"train_loss": -25.796628952026367, "global_step": 348779, "epoch": 4202} {"train_loss": -25.935678482055664, "global_step": 348780, "epoch": 4202} {"train_loss": -26.120847702026367, "global_step": 348781, "epoch": 4202} {"train_loss": -25.514806747436523, "global_step": 348782, "epoch": 4202} {"train_loss": -25.59663963317871, "global_step": 348783, "epoch": 4202} {"train_loss": -25.91289710998535, "global_step": 348784, "epoch": 4202} {"train_loss": -26.403247833251953, "global_step": 348785, "epoch": 4202} {"train_loss": -26.219913482666016, "global_step": 348786, "epoch": 4202} {"train_loss": -25.701684951782227, "global_step": 348787, "epoch": 4202} {"train_loss": -26.27815818786621, "global_step": 348788, "epoch": 4202} {"train_loss": -25.82044792175293, "global_step": 348789, "epoch": 4202} {"train_loss": -26.289337158203125, "global_step": 348790, "epoch": 4202} {"train_loss": -26.14606285095215, "global_step": 348791, "epoch": 4202} {"train_loss": -25.956867218017578, "global_step": 348792, "epoch": 4202} {"train_loss": -25.60544204711914, "global_step": 348793, "epoch": 4202} {"train_loss": -26.253339767456055, "global_step": 348794, "epoch": 4202} {"train_loss": -25.77691078186035, "global_step": 348795, "epoch": 4202} {"train_loss": -26.409198760986328, "global_step": 348796, "epoch": 4202} {"train_loss": -26.43218421936035, "global_step": 348797, "epoch": 4202} {"train_loss": -25.9359073638916, "global_step": 348798, "epoch": 4202} {"train_loss": -25.969404220581055, "global_step": 348799, "epoch": 4202} {"train_loss": -26.200769424438477, "global_step": 348800, "epoch": 4202} {"train_loss": -25.893630981445312, "global_step": 348801, "epoch": 4202} {"train_loss": -26.330060958862305, "global_step": 348802, "epoch": 4202} {"train_loss": -26.31141471862793, "global_step": 348803, "epoch": 4202} {"train_loss": -26.0869140625, "global_step": 348804, "epoch": 4202} {"train_loss": -26.092559814453125, "global_step": 348805, "epoch": 4202} {"train_loss": -26.293476104736328, "global_step": 348806, "epoch": 4202} {"train_loss": -25.955121994018555, "global_step": 348807, "epoch": 4202} {"train_loss": -26.41731071472168, "global_step": 348808, "epoch": 4202} {"train_loss": -26.00626564025879, "global_step": 348809, "epoch": 4202} {"train_loss": -25.83642578125, "global_step": 348810, "epoch": 4202} {"train_loss": -26.32682228088379, "global_step": 348811, "epoch": 4202} {"train_loss": -26.107473373413086, "global_step": 348812, "epoch": 4202} {"train_loss": -26.102624893188477, "global_step": 348813, "epoch": 4202} {"train_loss": -26.27149772644043, "global_step": 348814, "epoch": 4202} {"train_loss": -26.655054092407227, "global_step": 348815, "epoch": 4202} {"train_loss": -26.282636642456055, "global_step": 348816, "epoch": 4202} {"train_loss": -26.113645553588867, "global_step": 348817, "epoch": 4202} {"train_loss": -26.249298095703125, "global_step": 348818, "epoch": 4202} {"train_loss": -26.12147331237793, "global_step": 348819, "epoch": 4202} {"train_loss": -26.365034103393555, "global_step": 348820, "epoch": 4202} {"train_loss": -26.642011642456055, "global_step": 348821, "epoch": 4202} {"train_loss": -26.32868003845215, "global_step": 348822, "epoch": 4202} {"train_loss": -25.953937530517578, "global_step": 348823, "epoch": 4202} {"train_loss": -26.446552276611328, "global_step": 348824, "epoch": 4202} {"train_loss": -26.1619930267334, "global_step": 348825, "epoch": 4202} {"train_loss": -26.38783073425293, "global_step": 348826, "epoch": 4202} {"train_loss": -26.208703994750977, "global_step": 348827, "epoch": 4202} {"train_loss": -26.149805068969727, "global_step": 348828, "epoch": 4202} {"train_loss": -26.4075870513916, "global_step": 348829, "epoch": 4202} {"train_loss": -26.332544326782227, "global_step": 348830, "epoch": 4202} {"train_loss": -25.958759307861328, "global_step": 348831, "epoch": 4202} {"train_loss": -25.685590744018555, "global_step": 348832, "epoch": 4202} {"train_loss": -25.926603317260742, "global_step": 348833, "epoch": 4202} {"train_loss": -25.861425399780273, "global_step": 348834, "epoch": 4202} {"train_loss": -25.882856369018555, "global_step": 348835, "epoch": 4202} {"train_loss": -26.54279136657715, "global_step": 348836, "epoch": 4202} {"train_loss": -26.282806396484375, "global_step": 348837, "epoch": 4202} {"train_loss": -26.298498153686523, "global_step": 348838, "epoch": 4202} {"train_loss": -26.2992000579834, "global_step": 348839, "epoch": 4202} {"train_loss": -25.77978515625, "global_step": 348840, "epoch": 4202} {"train_loss": -26.16619873046875, "global_step": 348841, "epoch": 4202} {"train_loss": -25.870849609375, "global_step": 348842, "epoch": 4202} {"train_loss": -25.873931884765625, "global_step": 348843, "epoch": 4202} {"train_loss": -26.311126708984375, "global_step": 348844, "epoch": 4202} {"train_loss": -25.886341094970703, "global_step": 348845, "epoch": 4202} {"train_loss": -26.170562744140625, "global_step": 348846, "epoch": 4202} {"train_loss": -26.262388229370117, "global_step": 348847, "epoch": 4202} {"train_loss": -26.032189955194312, "global_step": 348848, "epoch": 4202, "val_loss": 6765597.0} {"train_loss": -23.9428768157959, "global_step": 348849, "epoch": 4203} {"train_loss": -25.383764266967773, "global_step": 348850, "epoch": 4203} {"train_loss": -25.38852310180664, "global_step": 348851, "epoch": 4203} {"train_loss": -25.61343765258789, "global_step": 348852, "epoch": 4203} {"train_loss": -25.04520606994629, "global_step": 348853, "epoch": 4203} {"train_loss": -25.027141571044922, "global_step": 348854, "epoch": 4203} {"train_loss": -24.831159591674805, "global_step": 348855, "epoch": 4203} {"train_loss": -25.277708053588867, "global_step": 348856, "epoch": 4203} {"train_loss": -25.10701560974121, "global_step": 348857, "epoch": 4203} {"train_loss": -25.006479263305664, "global_step": 348858, "epoch": 4203} {"train_loss": -25.6044864654541, "global_step": 348859, "epoch": 4203} {"train_loss": -25.454336166381836, "global_step": 348860, "epoch": 4203} {"train_loss": -25.593507766723633, "global_step": 348861, "epoch": 4203} {"train_loss": -25.628650665283203, "global_step": 348862, "epoch": 4203} {"train_loss": -25.88726806640625, "global_step": 348863, "epoch": 4203} {"train_loss": -25.686609268188477, "global_step": 348864, "epoch": 4203} {"train_loss": -25.877349853515625, "global_step": 348865, "epoch": 4203} {"train_loss": -25.544498443603516, "global_step": 348866, "epoch": 4203} {"train_loss": -25.74725341796875, "global_step": 348867, "epoch": 4203} {"train_loss": -25.92266845703125, "global_step": 348868, "epoch": 4203} {"train_loss": -26.252344131469727, "global_step": 348869, "epoch": 4203} {"train_loss": -26.003543853759766, "global_step": 348870, "epoch": 4203} {"train_loss": -25.936756134033203, "global_step": 348871, "epoch": 4203} {"train_loss": -26.34779167175293, "global_step": 348872, "epoch": 4203} {"train_loss": -25.94597816467285, "global_step": 348873, "epoch": 4203} {"train_loss": -25.88987159729004, "global_step": 348874, "epoch": 4203} {"train_loss": -26.152088165283203, "global_step": 348875, "epoch": 4203} {"train_loss": -26.131134033203125, "global_step": 348876, "epoch": 4203} {"train_loss": -25.780969619750977, "global_step": 348877, "epoch": 4203} {"train_loss": -26.20966911315918, "global_step": 348878, "epoch": 4203} {"train_loss": -25.96429443359375, "global_step": 348879, "epoch": 4203} {"train_loss": -26.0362606048584, "global_step": 348880, "epoch": 4203} {"train_loss": -26.3465633392334, "global_step": 348881, "epoch": 4203} {"train_loss": -25.97721290588379, "global_step": 348882, "epoch": 4203} {"train_loss": -25.961912155151367, "global_step": 348883, "epoch": 4203} {"train_loss": -26.133634567260742, "global_step": 348884, "epoch": 4203} {"train_loss": -26.257038116455078, "global_step": 348885, "epoch": 4203} {"train_loss": -26.039676666259766, "global_step": 348886, "epoch": 4203} {"train_loss": -26.199026107788086, "global_step": 348887, "epoch": 4203} {"train_loss": -26.090436935424805, "global_step": 348888, "epoch": 4203} {"train_loss": -26.108016967773438, "global_step": 348889, "epoch": 4203} {"train_loss": -25.532285690307617, "global_step": 348890, "epoch": 4203} {"train_loss": -26.053842544555664, "global_step": 348891, "epoch": 4203} {"train_loss": -25.96811866760254, "global_step": 348892, "epoch": 4203} {"train_loss": -26.123411178588867, "global_step": 348893, "epoch": 4203} {"train_loss": -25.68403434753418, "global_step": 348894, "epoch": 4203} {"train_loss": -25.68268394470215, "global_step": 348895, "epoch": 4203} {"train_loss": -26.053730010986328, "global_step": 348896, "epoch": 4203} {"train_loss": -25.912799835205078, "global_step": 348897, "epoch": 4203} {"train_loss": -25.77559471130371, "global_step": 348898, "epoch": 4203} {"train_loss": -26.210407257080078, "global_step": 348899, "epoch": 4203} {"train_loss": -26.028547286987305, "global_step": 348900, "epoch": 4203} {"train_loss": -25.824499130249023, "global_step": 348901, "epoch": 4203} {"train_loss": -26.3920841217041, "global_step": 348902, "epoch": 4203} {"train_loss": -26.038053512573242, "global_step": 348903, "epoch": 4203} {"train_loss": -26.114643096923828, "global_step": 348904, "epoch": 4203} {"train_loss": -26.415380477905273, "global_step": 348905, "epoch": 4203} {"train_loss": -26.44464111328125, "global_step": 348906, "epoch": 4203} {"train_loss": -26.055622100830078, "global_step": 348907, "epoch": 4203} {"train_loss": -26.167861938476562, "global_step": 348908, "epoch": 4203} {"train_loss": -26.18896484375, "global_step": 348909, "epoch": 4203} {"train_loss": -26.249744415283203, "global_step": 348910, "epoch": 4203} {"train_loss": -26.00672721862793, "global_step": 348911, "epoch": 4203} {"train_loss": -25.987394332885742, "global_step": 348912, "epoch": 4203} {"train_loss": -26.461034774780273, "global_step": 348913, "epoch": 4203} {"train_loss": -26.17087173461914, "global_step": 348914, "epoch": 4203} {"train_loss": -26.186811447143555, "global_step": 348915, "epoch": 4203} {"train_loss": -26.055652618408203, "global_step": 348916, "epoch": 4203} {"train_loss": -26.097824096679688, "global_step": 348917, "epoch": 4203} {"train_loss": -26.16849708557129, "global_step": 348918, "epoch": 4203} {"train_loss": -26.403095245361328, "global_step": 348919, "epoch": 4203} {"train_loss": -26.265918731689453, "global_step": 348920, "epoch": 4203} {"train_loss": -26.3138370513916, "global_step": 348921, "epoch": 4203} {"train_loss": -26.07339859008789, "global_step": 348922, "epoch": 4203} {"train_loss": -26.337549209594727, "global_step": 348923, "epoch": 4203} {"train_loss": -26.613073348999023, "global_step": 348924, "epoch": 4203} {"train_loss": -26.425384521484375, "global_step": 348925, "epoch": 4203} {"train_loss": -26.274524688720703, "global_step": 348926, "epoch": 4203} {"train_loss": -26.203943252563477, "global_step": 348927, "epoch": 4203} {"train_loss": -26.114978790283203, "global_step": 348928, "epoch": 4203} {"train_loss": -26.21955680847168, "global_step": 348929, "epoch": 4203} {"train_loss": -26.47696304321289, "global_step": 348930, "epoch": 4203} {"train_loss": -25.933690932859857, "global_step": 348931, "epoch": 4203, "val_loss": 6682546.0} {"train_loss": -25.90826988220215, "global_step": 348932, "epoch": 4204} {"train_loss": -25.705799102783203, "global_step": 348933, "epoch": 4204} {"train_loss": -26.043899536132812, "global_step": 348934, "epoch": 4204} {"train_loss": -25.69732666015625, "global_step": 348935, "epoch": 4204} {"train_loss": -25.864294052124023, "global_step": 348936, "epoch": 4204} {"train_loss": -25.851892471313477, "global_step": 348937, "epoch": 4204} {"train_loss": -25.88330078125, "global_step": 348938, "epoch": 4204} {"train_loss": -26.058202743530273, "global_step": 348939, "epoch": 4204} {"train_loss": -26.087543487548828, "global_step": 348940, "epoch": 4204} {"train_loss": -25.893457412719727, "global_step": 348941, "epoch": 4204} {"train_loss": -26.23585319519043, "global_step": 348942, "epoch": 4204} {"train_loss": -25.877573013305664, "global_step": 348943, "epoch": 4204} {"train_loss": -26.165746688842773, "global_step": 348944, "epoch": 4204} {"train_loss": -26.1497802734375, "global_step": 348945, "epoch": 4204} {"train_loss": -25.747928619384766, "global_step": 348946, "epoch": 4204} {"train_loss": -26.24610710144043, "global_step": 348947, "epoch": 4204} {"train_loss": -25.927417755126953, "global_step": 348948, "epoch": 4204} {"train_loss": -26.39068031311035, "global_step": 348949, "epoch": 4204} {"train_loss": -25.997406005859375, "global_step": 348950, "epoch": 4204} {"train_loss": -25.795440673828125, "global_step": 348951, "epoch": 4204} {"train_loss": -26.11919593811035, "global_step": 348952, "epoch": 4204} {"train_loss": -26.249958038330078, "global_step": 348953, "epoch": 4204} {"train_loss": -25.881900787353516, "global_step": 348954, "epoch": 4204} {"train_loss": -26.168643951416016, "global_step": 348955, "epoch": 4204} {"train_loss": -26.4539794921875, "global_step": 348956, "epoch": 4204} {"train_loss": -26.011945724487305, "global_step": 348957, "epoch": 4204} {"train_loss": -26.293411254882812, "global_step": 348958, "epoch": 4204} {"train_loss": -26.417346954345703, "global_step": 348959, "epoch": 4204} {"train_loss": -25.620328903198242, "global_step": 348960, "epoch": 4204} {"train_loss": -26.03217887878418, "global_step": 348961, "epoch": 4204} {"train_loss": -26.572925567626953, "global_step": 348962, "epoch": 4204} {"train_loss": -26.01698112487793, "global_step": 348963, "epoch": 4204} {"train_loss": -26.351877212524414, "global_step": 348964, "epoch": 4204} {"train_loss": -26.172407150268555, "global_step": 348965, "epoch": 4204} {"train_loss": -26.325275421142578, "global_step": 348966, "epoch": 4204} {"train_loss": -25.873504638671875, "global_step": 348967, "epoch": 4204} {"train_loss": -25.985803604125977, "global_step": 348968, "epoch": 4204} {"train_loss": -26.2947998046875, "global_step": 348969, "epoch": 4204} {"train_loss": -26.690317153930664, "global_step": 348970, "epoch": 4204} {"train_loss": -26.216541290283203, "global_step": 348971, "epoch": 4204} {"train_loss": -26.50738525390625, "global_step": 348972, "epoch": 4204} {"train_loss": -26.258920669555664, "global_step": 348973, "epoch": 4204} {"train_loss": -26.394880294799805, "global_step": 348974, "epoch": 4204} {"train_loss": -26.34018325805664, "global_step": 348975, "epoch": 4204} {"train_loss": -26.03236198425293, "global_step": 348976, "epoch": 4204} {"train_loss": -26.178747177124023, "global_step": 348977, "epoch": 4204} {"train_loss": -25.624231338500977, "global_step": 348978, "epoch": 4204} {"train_loss": -26.579071044921875, "global_step": 348979, "epoch": 4204} {"train_loss": -26.446744918823242, "global_step": 348980, "epoch": 4204} {"train_loss": -26.608713150024414, "global_step": 348981, "epoch": 4204} {"train_loss": -25.71443748474121, "global_step": 348982, "epoch": 4204} {"train_loss": -26.3207950592041, "global_step": 348983, "epoch": 4204} {"train_loss": -25.790882110595703, "global_step": 348984, "epoch": 4204} {"train_loss": -26.18645668029785, "global_step": 348985, "epoch": 4204} {"train_loss": -25.97780418395996, "global_step": 348986, "epoch": 4204} {"train_loss": -26.356159210205078, "global_step": 348987, "epoch": 4204} {"train_loss": -26.090906143188477, "global_step": 348988, "epoch": 4204} {"train_loss": -25.43568992614746, "global_step": 348989, "epoch": 4204} {"train_loss": -25.351301193237305, "global_step": 348990, "epoch": 4204} {"train_loss": -26.15399742126465, "global_step": 348991, "epoch": 4204} {"train_loss": -25.891889572143555, "global_step": 348992, "epoch": 4204} {"train_loss": -25.708398818969727, "global_step": 348993, "epoch": 4204} {"train_loss": -26.2935791015625, "global_step": 348994, "epoch": 4204} {"train_loss": -25.742908477783203, "global_step": 348995, "epoch": 4204} {"train_loss": -26.182031631469727, "global_step": 348996, "epoch": 4204} {"train_loss": -26.11102294921875, "global_step": 348997, "epoch": 4204} {"train_loss": -25.502897262573242, "global_step": 348998, "epoch": 4204} {"train_loss": -26.393972396850586, "global_step": 348999, "epoch": 4204} {"train_loss": -26.252588272094727, "global_step": 349000, "epoch": 4204} {"train_loss": -26.251590728759766, "global_step": 349001, "epoch": 4204} {"train_loss": -26.13152503967285, "global_step": 349002, "epoch": 4204} {"train_loss": -26.294919967651367, "global_step": 349003, "epoch": 4204} {"train_loss": -26.16631507873535, "global_step": 349004, "epoch": 4204} {"train_loss": -26.14453125, "global_step": 349005, "epoch": 4204} {"train_loss": -26.086750030517578, "global_step": 349006, "epoch": 4204} {"train_loss": -25.946863174438477, "global_step": 349007, "epoch": 4204} {"train_loss": -26.02263832092285, "global_step": 349008, "epoch": 4204} {"train_loss": -26.334264755249023, "global_step": 349009, "epoch": 4204} {"train_loss": -26.491254806518555, "global_step": 349010, "epoch": 4204} {"train_loss": -26.021528244018555, "global_step": 349011, "epoch": 4204} {"train_loss": -26.29644775390625, "global_step": 349012, "epoch": 4204} {"train_loss": -26.234012603759766, "global_step": 349013, "epoch": 4204} {"train_loss": -26.11392765734569, "global_step": 349014, "epoch": 4204, "val_loss": 6682535.0} {"train_loss": -26.23075294494629, "global_step": 349015, "epoch": 4205} {"train_loss": -25.85261344909668, "global_step": 349016, "epoch": 4205} {"train_loss": -25.120166778564453, "global_step": 349017, "epoch": 4205} {"train_loss": -24.993392944335938, "global_step": 349018, "epoch": 4205} {"train_loss": -25.752607345581055, "global_step": 349019, "epoch": 4205} {"train_loss": -26.13232421875, "global_step": 349020, "epoch": 4205} {"train_loss": -25.201173782348633, "global_step": 349021, "epoch": 4205} {"train_loss": -25.207387924194336, "global_step": 349022, "epoch": 4205} {"train_loss": -25.99072265625, "global_step": 349023, "epoch": 4205} {"train_loss": -25.70991325378418, "global_step": 349024, "epoch": 4205} {"train_loss": -25.72157096862793, "global_step": 349025, "epoch": 4205} {"train_loss": -25.642288208007812, "global_step": 349026, "epoch": 4205} {"train_loss": -25.774417877197266, "global_step": 349027, "epoch": 4205} {"train_loss": -26.153711318969727, "global_step": 349028, "epoch": 4205} {"train_loss": -25.480337142944336, "global_step": 349029, "epoch": 4205} {"train_loss": -26.059589385986328, "global_step": 349030, "epoch": 4205} {"train_loss": -25.790882110595703, "global_step": 349031, "epoch": 4205} {"train_loss": -25.59872817993164, "global_step": 349032, "epoch": 4205} {"train_loss": -25.78411865234375, "global_step": 349033, "epoch": 4205} {"train_loss": -25.945392608642578, "global_step": 349034, "epoch": 4205} {"train_loss": -25.972187042236328, "global_step": 349035, "epoch": 4205} {"train_loss": -26.049001693725586, "global_step": 349036, "epoch": 4205} {"train_loss": -25.75457191467285, "global_step": 349037, "epoch": 4205} {"train_loss": -25.914541244506836, "global_step": 349038, "epoch": 4205} {"train_loss": -26.12464714050293, "global_step": 349039, "epoch": 4205} {"train_loss": -26.364370346069336, "global_step": 349040, "epoch": 4205} {"train_loss": -26.15763282775879, "global_step": 349041, "epoch": 4205} {"train_loss": -26.255849838256836, "global_step": 349042, "epoch": 4205} {"train_loss": -26.066394805908203, "global_step": 349043, "epoch": 4205} {"train_loss": -25.93275260925293, "global_step": 349044, "epoch": 4205} {"train_loss": -25.9009952545166, "global_step": 349045, "epoch": 4205} {"train_loss": -26.15179443359375, "global_step": 349046, "epoch": 4205} {"train_loss": -26.080602645874023, "global_step": 349047, "epoch": 4205} {"train_loss": -25.925220489501953, "global_step": 349048, "epoch": 4205} {"train_loss": -26.441364288330078, "global_step": 349049, "epoch": 4205} {"train_loss": -25.97063636779785, "global_step": 349050, "epoch": 4205} {"train_loss": -26.071725845336914, "global_step": 349051, "epoch": 4205} {"train_loss": -26.414838790893555, "global_step": 349052, "epoch": 4205} {"train_loss": -26.128171920776367, "global_step": 349053, "epoch": 4205} {"train_loss": -26.008996963500977, "global_step": 349054, "epoch": 4205} {"train_loss": -25.8572998046875, "global_step": 349055, "epoch": 4205} {"train_loss": -26.35163688659668, "global_step": 349056, "epoch": 4205} {"train_loss": -26.187376022338867, "global_step": 349057, "epoch": 4205} {"train_loss": -26.261417388916016, "global_step": 349058, "epoch": 4205} {"train_loss": -26.38154411315918, "global_step": 349059, "epoch": 4205} {"train_loss": -26.56062126159668, "global_step": 349060, "epoch": 4205} {"train_loss": -26.32160758972168, "global_step": 349061, "epoch": 4205} {"train_loss": -26.290098190307617, "global_step": 349062, "epoch": 4205} {"train_loss": -25.91875648498535, "global_step": 349063, "epoch": 4205} {"train_loss": -26.262983322143555, "global_step": 349064, "epoch": 4205} {"train_loss": -26.300195693969727, "global_step": 349065, "epoch": 4205} {"train_loss": -26.39455223083496, "global_step": 349066, "epoch": 4205} {"train_loss": -26.270893096923828, "global_step": 349067, "epoch": 4205} {"train_loss": -26.476835250854492, "global_step": 349068, "epoch": 4205} {"train_loss": -25.885847091674805, "global_step": 349069, "epoch": 4205} {"train_loss": -25.939218521118164, "global_step": 349070, "epoch": 4205} {"train_loss": -25.99064064025879, "global_step": 349071, "epoch": 4205} {"train_loss": -26.10273551940918, "global_step": 349072, "epoch": 4205} {"train_loss": -25.87208366394043, "global_step": 349073, "epoch": 4205} {"train_loss": -25.96405601501465, "global_step": 349074, "epoch": 4205} {"train_loss": -26.05543327331543, "global_step": 349075, "epoch": 4205} {"train_loss": -26.092498779296875, "global_step": 349076, "epoch": 4205} {"train_loss": -26.47548484802246, "global_step": 349077, "epoch": 4205} {"train_loss": -26.01348876953125, "global_step": 349078, "epoch": 4205} {"train_loss": -26.211637496948242, "global_step": 349079, "epoch": 4205} {"train_loss": -26.1136474609375, "global_step": 349080, "epoch": 4205} {"train_loss": -25.61512565612793, "global_step": 349081, "epoch": 4205} {"train_loss": -25.942846298217773, "global_step": 349082, "epoch": 4205} {"train_loss": -25.813404083251953, "global_step": 349083, "epoch": 4205} {"train_loss": -26.278730392456055, "global_step": 349084, "epoch": 4205} {"train_loss": -25.7996826171875, "global_step": 349085, "epoch": 4205} {"train_loss": -25.65728759765625, "global_step": 349086, "epoch": 4205} {"train_loss": -25.785308837890625, "global_step": 349087, "epoch": 4205} {"train_loss": -25.319746017456055, "global_step": 349088, "epoch": 4205} {"train_loss": -25.85651206970215, "global_step": 349089, "epoch": 4205} {"train_loss": -25.74371337890625, "global_step": 349090, "epoch": 4205} {"train_loss": -25.24062728881836, "global_step": 349091, "epoch": 4205} {"train_loss": -26.18887710571289, "global_step": 349092, "epoch": 4205} {"train_loss": -25.767114639282227, "global_step": 349093, "epoch": 4205} {"train_loss": -26.21710777282715, "global_step": 349094, "epoch": 4205} {"train_loss": -25.24102020263672, "global_step": 349095, "epoch": 4205} {"train_loss": -26.228307723999023, "global_step": 349096, "epoch": 4205} {"train_loss": -25.9354230811797, "global_step": 349097, "epoch": 4205, "val_loss": 6708435.5} {"train_loss": -24.813352584838867, "global_step": 349098, "epoch": 4206} {"train_loss": -25.185169219970703, "global_step": 349099, "epoch": 4206} {"train_loss": -25.65034294128418, "global_step": 349100, "epoch": 4206} {"train_loss": -25.23328971862793, "global_step": 349101, "epoch": 4206} {"train_loss": -25.21908950805664, "global_step": 349102, "epoch": 4206} {"train_loss": -25.709936141967773, "global_step": 349103, "epoch": 4206} {"train_loss": -25.37851905822754, "global_step": 349104, "epoch": 4206} {"train_loss": -25.816120147705078, "global_step": 349105, "epoch": 4206} {"train_loss": -24.983442306518555, "global_step": 349106, "epoch": 4206} {"train_loss": -25.893354415893555, "global_step": 349107, "epoch": 4206} {"train_loss": -26.055124282836914, "global_step": 349108, "epoch": 4206} {"train_loss": -25.834857940673828, "global_step": 349109, "epoch": 4206} {"train_loss": -25.75477409362793, "global_step": 349110, "epoch": 4206} {"train_loss": -25.477746963500977, "global_step": 349111, "epoch": 4206} {"train_loss": -25.938404083251953, "global_step": 349112, "epoch": 4206} {"train_loss": -25.62604331970215, "global_step": 349113, "epoch": 4206} {"train_loss": -25.825117111206055, "global_step": 349114, "epoch": 4206} {"train_loss": -25.936925888061523, "global_step": 349115, "epoch": 4206} {"train_loss": -26.0808162689209, "global_step": 349116, "epoch": 4206} {"train_loss": -25.694150924682617, "global_step": 349117, "epoch": 4206} {"train_loss": -26.079755783081055, "global_step": 349118, "epoch": 4206} {"train_loss": -25.944177627563477, "global_step": 349119, "epoch": 4206} {"train_loss": -26.046300888061523, "global_step": 349120, "epoch": 4206} {"train_loss": -25.850833892822266, "global_step": 349121, "epoch": 4206} {"train_loss": -26.150476455688477, "global_step": 349122, "epoch": 4206} {"train_loss": -26.05615234375, "global_step": 349123, "epoch": 4206} {"train_loss": -26.00160026550293, "global_step": 349124, "epoch": 4206} {"train_loss": -26.039566040039062, "global_step": 349125, "epoch": 4206} {"train_loss": -26.618030548095703, "global_step": 349126, "epoch": 4206} {"train_loss": -26.26641845703125, "global_step": 349127, "epoch": 4206} {"train_loss": -26.27329444885254, "global_step": 349128, "epoch": 4206} {"train_loss": -26.385440826416016, "global_step": 349129, "epoch": 4206} {"train_loss": -26.106962203979492, "global_step": 349130, "epoch": 4206} {"train_loss": -26.182031631469727, "global_step": 349131, "epoch": 4206} {"train_loss": -26.41914176940918, "global_step": 349132, "epoch": 4206} {"train_loss": -26.15912437438965, "global_step": 349133, "epoch": 4206} {"train_loss": -26.46803092956543, "global_step": 349134, "epoch": 4206} {"train_loss": -26.06851577758789, "global_step": 349135, "epoch": 4206} {"train_loss": -26.1088809967041, "global_step": 349136, "epoch": 4206} {"train_loss": -26.195907592773438, "global_step": 349137, "epoch": 4206} {"train_loss": -26.2264461517334, "global_step": 349138, "epoch": 4206} {"train_loss": -26.183141708374023, "global_step": 349139, "epoch": 4206} {"train_loss": -26.05592155456543, "global_step": 349140, "epoch": 4206} {"train_loss": -26.58518409729004, "global_step": 349141, "epoch": 4206} {"train_loss": -26.01462173461914, "global_step": 349142, "epoch": 4206} {"train_loss": -26.471418380737305, "global_step": 349143, "epoch": 4206} {"train_loss": -26.143774032592773, "global_step": 349144, "epoch": 4206} {"train_loss": -25.607812881469727, "global_step": 349145, "epoch": 4206} {"train_loss": -26.233829498291016, "global_step": 349146, "epoch": 4206} {"train_loss": -26.074453353881836, "global_step": 349147, "epoch": 4206} {"train_loss": -26.381826400756836, "global_step": 349148, "epoch": 4206} {"train_loss": -25.948699951171875, "global_step": 349149, "epoch": 4206} {"train_loss": -25.793975830078125, "global_step": 349150, "epoch": 4206} {"train_loss": -26.1105899810791, "global_step": 349151, "epoch": 4206} {"train_loss": -26.34970474243164, "global_step": 349152, "epoch": 4206} {"train_loss": -26.275821685791016, "global_step": 349153, "epoch": 4206} {"train_loss": -26.319355010986328, "global_step": 349154, "epoch": 4206} {"train_loss": -26.358549118041992, "global_step": 349155, "epoch": 4206} {"train_loss": -26.42948341369629, "global_step": 349156, "epoch": 4206} {"train_loss": -26.477766036987305, "global_step": 349157, "epoch": 4206} {"train_loss": -26.361282348632812, "global_step": 349158, "epoch": 4206} {"train_loss": -26.057544708251953, "global_step": 349159, "epoch": 4206} {"train_loss": -26.343494415283203, "global_step": 349160, "epoch": 4206} {"train_loss": -26.387014389038086, "global_step": 349161, "epoch": 4206} {"train_loss": -25.85357093811035, "global_step": 349162, "epoch": 4206} {"train_loss": -25.82581901550293, "global_step": 349163, "epoch": 4206} {"train_loss": -26.56089210510254, "global_step": 349164, "epoch": 4206} {"train_loss": -26.140928268432617, "global_step": 349165, "epoch": 4206} {"train_loss": -26.1532039642334, "global_step": 349166, "epoch": 4206} {"train_loss": -26.22357177734375, "global_step": 349167, "epoch": 4206} {"train_loss": -25.92188835144043, "global_step": 349168, "epoch": 4206} {"train_loss": -25.972949981689453, "global_step": 349169, "epoch": 4206} {"train_loss": -26.26361656188965, "global_step": 349170, "epoch": 4206} {"train_loss": -26.202966690063477, "global_step": 349171, "epoch": 4206} {"train_loss": -25.8929386138916, "global_step": 349172, "epoch": 4206} {"train_loss": -25.89984130859375, "global_step": 349173, "epoch": 4206} {"train_loss": -26.161298751831055, "global_step": 349174, "epoch": 4206} {"train_loss": -26.291461944580078, "global_step": 349175, "epoch": 4206} {"train_loss": -26.339130401611328, "global_step": 349176, "epoch": 4206} {"train_loss": -26.168048858642578, "global_step": 349177, "epoch": 4206} {"train_loss": -26.243127822875977, "global_step": 349178, "epoch": 4206} {"train_loss": -25.97809410095215, "global_step": 349179, "epoch": 4206} {"train_loss": -26.051667868372906, "global_step": 349180, "epoch": 4206, "val_loss": 6702469.0} {"train_loss": -26.319700241088867, "global_step": 349181, "epoch": 4207} {"train_loss": -26.064855575561523, "global_step": 349182, "epoch": 4207} {"train_loss": -25.857349395751953, "global_step": 349183, "epoch": 4207} {"train_loss": -25.758453369140625, "global_step": 349184, "epoch": 4207} {"train_loss": -25.67499351501465, "global_step": 349185, "epoch": 4207} {"train_loss": -25.83935546875, "global_step": 349186, "epoch": 4207} {"train_loss": -26.101272583007812, "global_step": 349187, "epoch": 4207} {"train_loss": -26.081689834594727, "global_step": 349188, "epoch": 4207} {"train_loss": -25.718124389648438, "global_step": 349189, "epoch": 4207} {"train_loss": -26.201940536499023, "global_step": 349190, "epoch": 4207} {"train_loss": -26.303564071655273, "global_step": 349191, "epoch": 4207} {"train_loss": -26.181928634643555, "global_step": 349192, "epoch": 4207} {"train_loss": -25.793399810791016, "global_step": 349193, "epoch": 4207} {"train_loss": -26.18047523498535, "global_step": 349194, "epoch": 4207} {"train_loss": -26.377227783203125, "global_step": 349195, "epoch": 4207} {"train_loss": -26.173450469970703, "global_step": 349196, "epoch": 4207} {"train_loss": -25.908777236938477, "global_step": 349197, "epoch": 4207} {"train_loss": -26.019062042236328, "global_step": 349198, "epoch": 4207} {"train_loss": -25.936420440673828, "global_step": 349199, "epoch": 4207} {"train_loss": -26.1468563079834, "global_step": 349200, "epoch": 4207} {"train_loss": -25.976383209228516, "global_step": 349201, "epoch": 4207} {"train_loss": -26.07960319519043, "global_step": 349202, "epoch": 4207} {"train_loss": -26.02151870727539, "global_step": 349203, "epoch": 4207} {"train_loss": -25.824268341064453, "global_step": 349204, "epoch": 4207} {"train_loss": -26.376562118530273, "global_step": 349205, "epoch": 4207} {"train_loss": -26.142065048217773, "global_step": 349206, "epoch": 4207} {"train_loss": -26.12993812561035, "global_step": 349207, "epoch": 4207} {"train_loss": -26.07906150817871, "global_step": 349208, "epoch": 4207} {"train_loss": -25.958099365234375, "global_step": 349209, "epoch": 4207} {"train_loss": -26.15284538269043, "global_step": 349210, "epoch": 4207} {"train_loss": -26.3963623046875, "global_step": 349211, "epoch": 4207} {"train_loss": -25.855749130249023, "global_step": 349212, "epoch": 4207} {"train_loss": -26.3890438079834, "global_step": 349213, "epoch": 4207} {"train_loss": -26.01710319519043, "global_step": 349214, "epoch": 4207} {"train_loss": -26.166479110717773, "global_step": 349215, "epoch": 4207} {"train_loss": -25.806427001953125, "global_step": 349216, "epoch": 4207} {"train_loss": -26.15289878845215, "global_step": 349217, "epoch": 4207} {"train_loss": -26.2103214263916, "global_step": 349218, "epoch": 4207} {"train_loss": -25.996856689453125, "global_step": 349219, "epoch": 4207} {"train_loss": -26.37152099609375, "global_step": 349220, "epoch": 4207} {"train_loss": -26.274036407470703, "global_step": 349221, "epoch": 4207} {"train_loss": -26.082304000854492, "global_step": 349222, "epoch": 4207} {"train_loss": -25.786916732788086, "global_step": 349223, "epoch": 4207} {"train_loss": -26.110315322875977, "global_step": 349224, "epoch": 4207} {"train_loss": -26.134634017944336, "global_step": 349225, "epoch": 4207} {"train_loss": -25.85053825378418, "global_step": 349226, "epoch": 4207} {"train_loss": -26.418439865112305, "global_step": 349227, "epoch": 4207} {"train_loss": -26.126850128173828, "global_step": 349228, "epoch": 4207} {"train_loss": -26.22669792175293, "global_step": 349229, "epoch": 4207} {"train_loss": -26.380407333374023, "global_step": 349230, "epoch": 4207} {"train_loss": -25.61097526550293, "global_step": 349231, "epoch": 4207} {"train_loss": -26.37128257751465, "global_step": 349232, "epoch": 4207} {"train_loss": -26.12566566467285, "global_step": 349233, "epoch": 4207} {"train_loss": -26.040952682495117, "global_step": 349234, "epoch": 4207} {"train_loss": -26.11024284362793, "global_step": 349235, "epoch": 4207} {"train_loss": -26.061981201171875, "global_step": 349236, "epoch": 4207} {"train_loss": -26.42708396911621, "global_step": 349237, "epoch": 4207} {"train_loss": -26.035444259643555, "global_step": 349238, "epoch": 4207} {"train_loss": -26.538818359375, "global_step": 349239, "epoch": 4207} {"train_loss": -26.113828659057617, "global_step": 349240, "epoch": 4207} {"train_loss": -26.18413734436035, "global_step": 349241, "epoch": 4207} {"train_loss": -26.322500228881836, "global_step": 349242, "epoch": 4207} {"train_loss": -26.194604873657227, "global_step": 349243, "epoch": 4207} {"train_loss": -26.255752563476562, "global_step": 349244, "epoch": 4207} {"train_loss": -26.450897216796875, "global_step": 349245, "epoch": 4207} {"train_loss": -26.52100944519043, "global_step": 349246, "epoch": 4207} {"train_loss": -26.057592391967773, "global_step": 349247, "epoch": 4207} {"train_loss": -26.522613525390625, "global_step": 349248, "epoch": 4207} {"train_loss": -26.21964454650879, "global_step": 349249, "epoch": 4207} {"train_loss": -26.248809814453125, "global_step": 349250, "epoch": 4207} {"train_loss": -25.9504337310791, "global_step": 349251, "epoch": 4207} {"train_loss": -26.037189483642578, "global_step": 349252, "epoch": 4207} {"train_loss": -26.34238624572754, "global_step": 349253, "epoch": 4207} {"train_loss": -25.960529327392578, "global_step": 349254, "epoch": 4207} {"train_loss": -25.801923751831055, "global_step": 349255, "epoch": 4207} {"train_loss": -26.10929298400879, "global_step": 349256, "epoch": 4207} {"train_loss": -26.361881256103516, "global_step": 349257, "epoch": 4207} {"train_loss": -26.371875762939453, "global_step": 349258, "epoch": 4207} {"train_loss": -26.175018310546875, "global_step": 349259, "epoch": 4207} {"train_loss": -26.075305938720703, "global_step": 349260, "epoch": 4207} {"train_loss": -26.345233917236328, "global_step": 349261, "epoch": 4207} {"train_loss": -25.967527389526367, "global_step": 349262, "epoch": 4207} {"train_loss": -26.12003965262907, "global_step": 349263, "epoch": 4207, "val_loss": 6685259.0} {"train_loss": -26.120925903320312, "global_step": 349264, "epoch": 4208} {"train_loss": -25.800474166870117, "global_step": 349265, "epoch": 4208} {"train_loss": -26.016260147094727, "global_step": 349266, "epoch": 4208} {"train_loss": -26.188983917236328, "global_step": 349267, "epoch": 4208} {"train_loss": -25.747953414916992, "global_step": 349268, "epoch": 4208} {"train_loss": -25.89932632446289, "global_step": 349269, "epoch": 4208} {"train_loss": -26.045495986938477, "global_step": 349270, "epoch": 4208} {"train_loss": -25.92368507385254, "global_step": 349271, "epoch": 4208} {"train_loss": -26.208606719970703, "global_step": 349272, "epoch": 4208} {"train_loss": -25.852985382080078, "global_step": 349273, "epoch": 4208} {"train_loss": -25.08218765258789, "global_step": 349274, "epoch": 4208} {"train_loss": -25.869495391845703, "global_step": 349275, "epoch": 4208} {"train_loss": -26.147916793823242, "global_step": 349276, "epoch": 4208} {"train_loss": -25.83237648010254, "global_step": 349277, "epoch": 4208} {"train_loss": -25.63128089904785, "global_step": 349278, "epoch": 4208} {"train_loss": -26.167789459228516, "global_step": 349279, "epoch": 4208} {"train_loss": -25.928180694580078, "global_step": 349280, "epoch": 4208} {"train_loss": -26.00284767150879, "global_step": 349281, "epoch": 4208} {"train_loss": -26.074121475219727, "global_step": 349282, "epoch": 4208} {"train_loss": -26.033432006835938, "global_step": 349283, "epoch": 4208} {"train_loss": -25.85906410217285, "global_step": 349284, "epoch": 4208} {"train_loss": -26.17709732055664, "global_step": 349285, "epoch": 4208} {"train_loss": -25.97430992126465, "global_step": 349286, "epoch": 4208} {"train_loss": -26.266937255859375, "global_step": 349287, "epoch": 4208} {"train_loss": -25.763458251953125, "global_step": 349288, "epoch": 4208} {"train_loss": -25.966785430908203, "global_step": 349289, "epoch": 4208} {"train_loss": -26.498371124267578, "global_step": 349290, "epoch": 4208} {"train_loss": -26.02036476135254, "global_step": 349291, "epoch": 4208} {"train_loss": -25.856412887573242, "global_step": 349292, "epoch": 4208} {"train_loss": -25.732563018798828, "global_step": 349293, "epoch": 4208} {"train_loss": -26.2034969329834, "global_step": 349294, "epoch": 4208} {"train_loss": -25.64994239807129, "global_step": 349295, "epoch": 4208} {"train_loss": -26.269779205322266, "global_step": 349296, "epoch": 4208} {"train_loss": -26.148853302001953, "global_step": 349297, "epoch": 4208} {"train_loss": -25.8458194732666, "global_step": 349298, "epoch": 4208} {"train_loss": -26.342803955078125, "global_step": 349299, "epoch": 4208} {"train_loss": -26.48896598815918, "global_step": 349300, "epoch": 4208} {"train_loss": -26.117918014526367, "global_step": 349301, "epoch": 4208} {"train_loss": -26.170455932617188, "global_step": 349302, "epoch": 4208} {"train_loss": -26.317026138305664, "global_step": 349303, "epoch": 4208} {"train_loss": -26.30356788635254, "global_step": 349304, "epoch": 4208} {"train_loss": -26.265918731689453, "global_step": 349305, "epoch": 4208} {"train_loss": -26.23982048034668, "global_step": 349306, "epoch": 4208} {"train_loss": -26.203479766845703, "global_step": 349307, "epoch": 4208} {"train_loss": -26.0509090423584, "global_step": 349308, "epoch": 4208} {"train_loss": -26.65960693359375, "global_step": 349309, "epoch": 4208} {"train_loss": -26.274356842041016, "global_step": 349310, "epoch": 4208} {"train_loss": -26.089893341064453, "global_step": 349311, "epoch": 4208} {"train_loss": -26.18828773498535, "global_step": 349312, "epoch": 4208} {"train_loss": -26.105066299438477, "global_step": 349313, "epoch": 4208} {"train_loss": -26.0488224029541, "global_step": 349314, "epoch": 4208} {"train_loss": -25.842145919799805, "global_step": 349315, "epoch": 4208} {"train_loss": -25.886640548706055, "global_step": 349316, "epoch": 4208} {"train_loss": -26.43476676940918, "global_step": 349317, "epoch": 4208} {"train_loss": -26.33530044555664, "global_step": 349318, "epoch": 4208} {"train_loss": -26.160480499267578, "global_step": 349319, "epoch": 4208} {"train_loss": -25.885156631469727, "global_step": 349320, "epoch": 4208} {"train_loss": -26.36932945251465, "global_step": 349321, "epoch": 4208} {"train_loss": -26.15456199645996, "global_step": 349322, "epoch": 4208} {"train_loss": -25.943115234375, "global_step": 349323, "epoch": 4208} {"train_loss": -26.40420913696289, "global_step": 349324, "epoch": 4208} {"train_loss": -26.332111358642578, "global_step": 349325, "epoch": 4208} {"train_loss": -25.7176456451416, "global_step": 349326, "epoch": 4208} {"train_loss": -26.0883846282959, "global_step": 349327, "epoch": 4208} {"train_loss": -26.564071655273438, "global_step": 349328, "epoch": 4208} {"train_loss": -26.258100509643555, "global_step": 349329, "epoch": 4208} {"train_loss": -26.313703536987305, "global_step": 349330, "epoch": 4208} {"train_loss": -26.2962703704834, "global_step": 349331, "epoch": 4208} {"train_loss": -26.229089736938477, "global_step": 349332, "epoch": 4208} {"train_loss": -26.12091064453125, "global_step": 349333, "epoch": 4208} {"train_loss": -26.05743980407715, "global_step": 349334, "epoch": 4208} {"train_loss": -26.2702693939209, "global_step": 349335, "epoch": 4208} {"train_loss": -26.097171783447266, "global_step": 349336, "epoch": 4208} {"train_loss": -26.159448623657227, "global_step": 349337, "epoch": 4208} {"train_loss": -26.2222957611084, "global_step": 349338, "epoch": 4208} {"train_loss": -26.240222930908203, "global_step": 349339, "epoch": 4208} {"train_loss": -25.97541618347168, "global_step": 349340, "epoch": 4208} {"train_loss": -26.320383071899414, "global_step": 349341, "epoch": 4208} {"train_loss": -26.135028839111328, "global_step": 349342, "epoch": 4208} {"train_loss": -26.045690536499023, "global_step": 349343, "epoch": 4208} {"train_loss": -25.988061904907227, "global_step": 349344, "epoch": 4208} {"train_loss": -25.806997299194336, "global_step": 349345, "epoch": 4208} {"train_loss": -26.082102097660663, "global_step": 349346, "epoch": 4208, "val_loss": 6679490.0} {"train_loss": -25.975366592407227, "global_step": 349347, "epoch": 4209} {"train_loss": -25.628950119018555, "global_step": 349348, "epoch": 4209} {"train_loss": -25.536487579345703, "global_step": 349349, "epoch": 4209} {"train_loss": -25.418371200561523, "global_step": 349350, "epoch": 4209} {"train_loss": -25.6040096282959, "global_step": 349351, "epoch": 4209} {"train_loss": -26.196340560913086, "global_step": 349352, "epoch": 4209} {"train_loss": -25.626667022705078, "global_step": 349353, "epoch": 4209} {"train_loss": -26.170215606689453, "global_step": 349354, "epoch": 4209} {"train_loss": -25.713342666625977, "global_step": 349355, "epoch": 4209} {"train_loss": -25.88637351989746, "global_step": 349356, "epoch": 4209} {"train_loss": -26.119537353515625, "global_step": 349357, "epoch": 4209} {"train_loss": -26.554426193237305, "global_step": 349358, "epoch": 4209} {"train_loss": -26.064056396484375, "global_step": 349359, "epoch": 4209} {"train_loss": -26.31422233581543, "global_step": 349360, "epoch": 4209} {"train_loss": -25.886693954467773, "global_step": 349361, "epoch": 4209} {"train_loss": -26.029218673706055, "global_step": 349362, "epoch": 4209} {"train_loss": -26.11115074157715, "global_step": 349363, "epoch": 4209} {"train_loss": -26.31203269958496, "global_step": 349364, "epoch": 4209} {"train_loss": -26.15561866760254, "global_step": 349365, "epoch": 4209} {"train_loss": -25.926034927368164, "global_step": 349366, "epoch": 4209} {"train_loss": -26.18204116821289, "global_step": 349367, "epoch": 4209} {"train_loss": -26.04559326171875, "global_step": 349368, "epoch": 4209} {"train_loss": -25.994464874267578, "global_step": 349369, "epoch": 4209} {"train_loss": -26.133563995361328, "global_step": 349370, "epoch": 4209} {"train_loss": -26.17641258239746, "global_step": 349371, "epoch": 4209} {"train_loss": -26.3929386138916, "global_step": 349372, "epoch": 4209} {"train_loss": -26.346723556518555, "global_step": 349373, "epoch": 4209} {"train_loss": -26.1479549407959, "global_step": 349374, "epoch": 4209} {"train_loss": -26.368955612182617, "global_step": 349375, "epoch": 4209} {"train_loss": -26.00331687927246, "global_step": 349376, "epoch": 4209} {"train_loss": -26.052398681640625, "global_step": 349377, "epoch": 4209} {"train_loss": -26.029022216796875, "global_step": 349378, "epoch": 4209} {"train_loss": -26.297351837158203, "global_step": 349379, "epoch": 4209} {"train_loss": -26.273900985717773, "global_step": 349380, "epoch": 4209} {"train_loss": -26.282461166381836, "global_step": 349381, "epoch": 4209} {"train_loss": -26.30214500427246, "global_step": 349382, "epoch": 4209} {"train_loss": -25.931869506835938, "global_step": 349383, "epoch": 4209} {"train_loss": -26.38154411315918, "global_step": 349384, "epoch": 4209} {"train_loss": -26.11162757873535, "global_step": 349385, "epoch": 4209} {"train_loss": -26.060516357421875, "global_step": 349386, "epoch": 4209} {"train_loss": -26.1164493560791, "global_step": 349387, "epoch": 4209} {"train_loss": -26.520496368408203, "global_step": 349388, "epoch": 4209} {"train_loss": -26.113208770751953, "global_step": 349389, "epoch": 4209} {"train_loss": -26.27046012878418, "global_step": 349390, "epoch": 4209} {"train_loss": -26.558734893798828, "global_step": 349391, "epoch": 4209} {"train_loss": -26.581085205078125, "global_step": 349392, "epoch": 4209} {"train_loss": -26.32023048400879, "global_step": 349393, "epoch": 4209} {"train_loss": -26.2366943359375, "global_step": 349394, "epoch": 4209} {"train_loss": -26.41482925415039, "global_step": 349395, "epoch": 4209} {"train_loss": -26.57964515686035, "global_step": 349396, "epoch": 4209} {"train_loss": -26.00300407409668, "global_step": 349397, "epoch": 4209} {"train_loss": -26.123205184936523, "global_step": 349398, "epoch": 4209} {"train_loss": -26.13226318359375, "global_step": 349399, "epoch": 4209} {"train_loss": -25.370849609375, "global_step": 349400, "epoch": 4209} {"train_loss": -24.804718017578125, "global_step": 349401, "epoch": 4209} {"train_loss": -25.233015060424805, "global_step": 349402, "epoch": 4209} {"train_loss": -25.276813507080078, "global_step": 349403, "epoch": 4209} {"train_loss": -25.79764747619629, "global_step": 349404, "epoch": 4209} {"train_loss": -25.476770401000977, "global_step": 349405, "epoch": 4209} {"train_loss": -25.327688217163086, "global_step": 349406, "epoch": 4209} {"train_loss": -26.056262969970703, "global_step": 349407, "epoch": 4209} {"train_loss": -25.57960319519043, "global_step": 349408, "epoch": 4209} {"train_loss": -26.024152755737305, "global_step": 349409, "epoch": 4209} {"train_loss": -26.06839370727539, "global_step": 349410, "epoch": 4209} {"train_loss": -25.710132598876953, "global_step": 349411, "epoch": 4209} {"train_loss": -26.01397705078125, "global_step": 349412, "epoch": 4209} {"train_loss": -26.042022705078125, "global_step": 349413, "epoch": 4209} {"train_loss": -26.151840209960938, "global_step": 349414, "epoch": 4209} {"train_loss": -26.086469650268555, "global_step": 349415, "epoch": 4209} {"train_loss": -25.60322380065918, "global_step": 349416, "epoch": 4209} {"train_loss": -25.997089385986328, "global_step": 349417, "epoch": 4209} {"train_loss": -26.082386016845703, "global_step": 349418, "epoch": 4209} {"train_loss": -26.015783309936523, "global_step": 349419, "epoch": 4209} {"train_loss": -26.056867599487305, "global_step": 349420, "epoch": 4209} {"train_loss": -26.381505966186523, "global_step": 349421, "epoch": 4209} {"train_loss": -26.308425903320312, "global_step": 349422, "epoch": 4209} {"train_loss": -26.178564071655273, "global_step": 349423, "epoch": 4209} {"train_loss": -26.191516876220703, "global_step": 349424, "epoch": 4209} {"train_loss": -25.664993286132812, "global_step": 349425, "epoch": 4209} {"train_loss": -26.044864654541016, "global_step": 349426, "epoch": 4209} {"train_loss": -25.754064559936523, "global_step": 349427, "epoch": 4209} {"train_loss": -26.20781898498535, "global_step": 349428, "epoch": 4209} {"train_loss": -26.043658681662684, "global_step": 349429, "epoch": 4209, "val_loss": 6721494.0} {"train_loss": -25.702478408813477, "global_step": 349430, "epoch": 4210} {"train_loss": -26.04444694519043, "global_step": 349431, "epoch": 4210} {"train_loss": -25.619003295898438, "global_step": 349432, "epoch": 4210} {"train_loss": -26.179288864135742, "global_step": 349433, "epoch": 4210} {"train_loss": -25.9492130279541, "global_step": 349434, "epoch": 4210} {"train_loss": -25.818359375, "global_step": 349435, "epoch": 4210} {"train_loss": -25.93756103515625, "global_step": 349436, "epoch": 4210} {"train_loss": -26.08363151550293, "global_step": 349437, "epoch": 4210} {"train_loss": -25.985754013061523, "global_step": 349438, "epoch": 4210} {"train_loss": -25.866077423095703, "global_step": 349439, "epoch": 4210} {"train_loss": -26.056203842163086, "global_step": 349440, "epoch": 4210} {"train_loss": -25.889158248901367, "global_step": 349441, "epoch": 4210} {"train_loss": -26.377593994140625, "global_step": 349442, "epoch": 4210} {"train_loss": -26.128747940063477, "global_step": 349443, "epoch": 4210} {"train_loss": -26.111364364624023, "global_step": 349444, "epoch": 4210} {"train_loss": -26.193634033203125, "global_step": 349445, "epoch": 4210} {"train_loss": -26.2785701751709, "global_step": 349446, "epoch": 4210} {"train_loss": -26.469074249267578, "global_step": 349447, "epoch": 4210} {"train_loss": -26.328458786010742, "global_step": 349448, "epoch": 4210} {"train_loss": -25.899717330932617, "global_step": 349449, "epoch": 4210} {"train_loss": -26.009876251220703, "global_step": 349450, "epoch": 4210} {"train_loss": -25.861984252929688, "global_step": 349451, "epoch": 4210} {"train_loss": -26.073755264282227, "global_step": 349452, "epoch": 4210} {"train_loss": -26.006250381469727, "global_step": 349453, "epoch": 4210} {"train_loss": -25.86048698425293, "global_step": 349454, "epoch": 4210} {"train_loss": -26.069726943969727, "global_step": 349455, "epoch": 4210} {"train_loss": -25.8559513092041, "global_step": 349456, "epoch": 4210} {"train_loss": -26.228469848632812, "global_step": 349457, "epoch": 4210} {"train_loss": -26.046667098999023, "global_step": 349458, "epoch": 4210} {"train_loss": -26.273706436157227, "global_step": 349459, "epoch": 4210} {"train_loss": -26.350576400756836, "global_step": 349460, "epoch": 4210} {"train_loss": -26.3460636138916, "global_step": 349461, "epoch": 4210} {"train_loss": -26.060678482055664, "global_step": 349462, "epoch": 4210} {"train_loss": -26.279172897338867, "global_step": 349463, "epoch": 4210} {"train_loss": -25.698535919189453, "global_step": 349464, "epoch": 4210} {"train_loss": -26.234878540039062, "global_step": 349465, "epoch": 4210} {"train_loss": -26.02509880065918, "global_step": 349466, "epoch": 4210} {"train_loss": -26.1929874420166, "global_step": 349467, "epoch": 4210} {"train_loss": -26.4053955078125, "global_step": 349468, "epoch": 4210} {"train_loss": -26.249954223632812, "global_step": 349469, "epoch": 4210} {"train_loss": -26.087148666381836, "global_step": 349470, "epoch": 4210} {"train_loss": -26.66475486755371, "global_step": 349471, "epoch": 4210} {"train_loss": -26.6223201751709, "global_step": 349472, "epoch": 4210} {"train_loss": -25.960920333862305, "global_step": 349473, "epoch": 4210} {"train_loss": -25.953479766845703, "global_step": 349474, "epoch": 4210} {"train_loss": -25.65061378479004, "global_step": 349475, "epoch": 4210} {"train_loss": -25.893274307250977, "global_step": 349476, "epoch": 4210} {"train_loss": -25.63209342956543, "global_step": 349477, "epoch": 4210} {"train_loss": -26.2098445892334, "global_step": 349478, "epoch": 4210} {"train_loss": -26.53787612915039, "global_step": 349479, "epoch": 4210} {"train_loss": -26.47821617126465, "global_step": 349480, "epoch": 4210} {"train_loss": -26.113937377929688, "global_step": 349481, "epoch": 4210} {"train_loss": -26.010114669799805, "global_step": 349482, "epoch": 4210} {"train_loss": -26.15357780456543, "global_step": 349483, "epoch": 4210} {"train_loss": -26.227582931518555, "global_step": 349484, "epoch": 4210} {"train_loss": -26.126001358032227, "global_step": 349485, "epoch": 4210} {"train_loss": -26.046239852905273, "global_step": 349486, "epoch": 4210} {"train_loss": -26.345815658569336, "global_step": 349487, "epoch": 4210} {"train_loss": -26.56050682067871, "global_step": 349488, "epoch": 4210} {"train_loss": -26.25933837890625, "global_step": 349489, "epoch": 4210} {"train_loss": -26.0087833404541, "global_step": 349490, "epoch": 4210} {"train_loss": -25.948347091674805, "global_step": 349491, "epoch": 4210} {"train_loss": -26.151174545288086, "global_step": 349492, "epoch": 4210} {"train_loss": -26.51091957092285, "global_step": 349493, "epoch": 4210} {"train_loss": -25.745115280151367, "global_step": 349494, "epoch": 4210} {"train_loss": -25.7324275970459, "global_step": 349495, "epoch": 4210} {"train_loss": -26.206912994384766, "global_step": 349496, "epoch": 4210} {"train_loss": -25.92213249206543, "global_step": 349497, "epoch": 4210} {"train_loss": -26.177526473999023, "global_step": 349498, "epoch": 4210} {"train_loss": -26.4818115234375, "global_step": 349499, "epoch": 4210} {"train_loss": -26.330097198486328, "global_step": 349500, "epoch": 4210} {"train_loss": -26.462438583374023, "global_step": 349501, "epoch": 4210} {"train_loss": -26.454023361206055, "global_step": 349502, "epoch": 4210} {"train_loss": -26.32050132751465, "global_step": 349503, "epoch": 4210} {"train_loss": -26.216760635375977, "global_step": 349504, "epoch": 4210} {"train_loss": -26.35685157775879, "global_step": 349505, "epoch": 4210} {"train_loss": -26.295398712158203, "global_step": 349506, "epoch": 4210} {"train_loss": -26.10140037536621, "global_step": 349507, "epoch": 4210} {"train_loss": -26.175825119018555, "global_step": 349508, "epoch": 4210} {"train_loss": -26.216726303100586, "global_step": 349509, "epoch": 4210} {"train_loss": -26.081439971923828, "global_step": 349510, "epoch": 4210} {"train_loss": -26.971120834350586, "global_step": 349511, "epoch": 4210} {"train_loss": -26.16066824671734, "global_step": 349512, "epoch": 4210, "val_loss": 6665550.5} {"train_loss": -24.706716537475586, "global_step": 349513, "epoch": 4211} {"train_loss": -25.399526596069336, "global_step": 349514, "epoch": 4211} {"train_loss": -25.111038208007812, "global_step": 349515, "epoch": 4211} {"train_loss": -25.396928787231445, "global_step": 349516, "epoch": 4211} {"train_loss": -25.212356567382812, "global_step": 349517, "epoch": 4211} {"train_loss": -24.94521141052246, "global_step": 349518, "epoch": 4211} {"train_loss": -25.293241500854492, "global_step": 349519, "epoch": 4211} {"train_loss": -25.647924423217773, "global_step": 349520, "epoch": 4211} {"train_loss": -25.330032348632812, "global_step": 349521, "epoch": 4211} {"train_loss": -25.575897216796875, "global_step": 349522, "epoch": 4211} {"train_loss": -25.459508895874023, "global_step": 349523, "epoch": 4211} {"train_loss": -25.17285919189453, "global_step": 349524, "epoch": 4211} {"train_loss": -25.492155075073242, "global_step": 349525, "epoch": 4211} {"train_loss": -25.430435180664062, "global_step": 349526, "epoch": 4211} {"train_loss": -25.6740779876709, "global_step": 349527, "epoch": 4211} {"train_loss": -25.631223678588867, "global_step": 349528, "epoch": 4211} {"train_loss": -25.476327896118164, "global_step": 349529, "epoch": 4211} {"train_loss": -25.674671173095703, "global_step": 349530, "epoch": 4211} {"train_loss": -25.53679847717285, "global_step": 349531, "epoch": 4211} {"train_loss": -25.5449275970459, "global_step": 349532, "epoch": 4211} {"train_loss": -25.806201934814453, "global_step": 349533, "epoch": 4211} {"train_loss": -26.07684898376465, "global_step": 349534, "epoch": 4211} {"train_loss": -25.92922019958496, "global_step": 349535, "epoch": 4211} {"train_loss": -25.764753341674805, "global_step": 349536, "epoch": 4211} {"train_loss": -25.9322566986084, "global_step": 349537, "epoch": 4211} {"train_loss": -25.747644424438477, "global_step": 349538, "epoch": 4211} {"train_loss": -26.146352767944336, "global_step": 349539, "epoch": 4211} {"train_loss": -25.874683380126953, "global_step": 349540, "epoch": 4211} {"train_loss": -26.082340240478516, "global_step": 349541, "epoch": 4211} {"train_loss": -25.95277976989746, "global_step": 349542, "epoch": 4211} {"train_loss": -26.030792236328125, "global_step": 349543, "epoch": 4211} {"train_loss": -25.919103622436523, "global_step": 349544, "epoch": 4211} {"train_loss": -26.41352653503418, "global_step": 349545, "epoch": 4211} {"train_loss": -26.09795570373535, "global_step": 349546, "epoch": 4211} {"train_loss": -26.12843132019043, "global_step": 349547, "epoch": 4211} {"train_loss": -26.055591583251953, "global_step": 349548, "epoch": 4211} {"train_loss": -26.04300308227539, "global_step": 349549, "epoch": 4211} {"train_loss": -26.478668212890625, "global_step": 349550, "epoch": 4211} {"train_loss": -26.089385986328125, "global_step": 349551, "epoch": 4211} {"train_loss": -26.053363800048828, "global_step": 349552, "epoch": 4211} {"train_loss": -25.86846923828125, "global_step": 349553, "epoch": 4211} {"train_loss": -26.14849853515625, "global_step": 349554, "epoch": 4211} {"train_loss": -26.18708610534668, "global_step": 349555, "epoch": 4211} {"train_loss": -26.2833194732666, "global_step": 349556, "epoch": 4211} {"train_loss": -26.2775821685791, "global_step": 349557, "epoch": 4211} {"train_loss": -26.03425407409668, "global_step": 349558, "epoch": 4211} {"train_loss": -26.33704948425293, "global_step": 349559, "epoch": 4211} {"train_loss": -26.228307723999023, "global_step": 349560, "epoch": 4211} {"train_loss": -26.172210693359375, "global_step": 349561, "epoch": 4211} {"train_loss": -26.260969161987305, "global_step": 349562, "epoch": 4211} {"train_loss": -26.169286727905273, "global_step": 349563, "epoch": 4211} {"train_loss": -26.306562423706055, "global_step": 349564, "epoch": 4211} {"train_loss": -26.051773071289062, "global_step": 349565, "epoch": 4211} {"train_loss": -25.970447540283203, "global_step": 349566, "epoch": 4211} {"train_loss": -26.01362419128418, "global_step": 349567, "epoch": 4211} {"train_loss": -26.167505264282227, "global_step": 349568, "epoch": 4211} {"train_loss": -25.951353073120117, "global_step": 349569, "epoch": 4211} {"train_loss": -26.5234432220459, "global_step": 349570, "epoch": 4211} {"train_loss": -26.01677894592285, "global_step": 349571, "epoch": 4211} {"train_loss": -26.34357261657715, "global_step": 349572, "epoch": 4211} {"train_loss": -26.211889266967773, "global_step": 349573, "epoch": 4211} {"train_loss": -25.9442195892334, "global_step": 349574, "epoch": 4211} {"train_loss": -25.704410552978516, "global_step": 349575, "epoch": 4211} {"train_loss": -26.02957534790039, "global_step": 349576, "epoch": 4211} {"train_loss": -26.254186630249023, "global_step": 349577, "epoch": 4211} {"train_loss": -25.876129150390625, "global_step": 349578, "epoch": 4211} {"train_loss": -25.74765968322754, "global_step": 349579, "epoch": 4211} {"train_loss": -24.940359115600586, "global_step": 349580, "epoch": 4211} {"train_loss": -25.318531036376953, "global_step": 349581, "epoch": 4211} {"train_loss": -25.554763793945312, "global_step": 349582, "epoch": 4211} {"train_loss": -25.8084774017334, "global_step": 349583, "epoch": 4211} {"train_loss": -25.989883422851562, "global_step": 349584, "epoch": 4211} {"train_loss": -25.898334503173828, "global_step": 349585, "epoch": 4211} {"train_loss": -26.454883575439453, "global_step": 349586, "epoch": 4211} {"train_loss": -25.912601470947266, "global_step": 349587, "epoch": 4211} {"train_loss": -26.03277015686035, "global_step": 349588, "epoch": 4211} {"train_loss": -26.103961944580078, "global_step": 349589, "epoch": 4211} {"train_loss": -25.927167892456055, "global_step": 349590, "epoch": 4211} {"train_loss": -26.09419059753418, "global_step": 349591, "epoch": 4211} {"train_loss": -25.95391273498535, "global_step": 349592, "epoch": 4211} {"train_loss": -25.99482536315918, "global_step": 349593, "epoch": 4211} {"train_loss": -26.112075805664062, "global_step": 349594, "epoch": 4211} {"train_loss": -25.87955998799887, "global_step": 349595, "epoch": 4211, "val_loss": 6729179.0} {"train_loss": -24.885860443115234, "global_step": 349596, "epoch": 4212} {"train_loss": -25.16629981994629, "global_step": 349597, "epoch": 4212} {"train_loss": -25.326377868652344, "global_step": 349598, "epoch": 4212} {"train_loss": -25.32892608642578, "global_step": 349599, "epoch": 4212} {"train_loss": -25.293256759643555, "global_step": 349600, "epoch": 4212} {"train_loss": -25.348230361938477, "global_step": 349601, "epoch": 4212} {"train_loss": -24.926950454711914, "global_step": 349602, "epoch": 4212} {"train_loss": -25.49432945251465, "global_step": 349603, "epoch": 4212} {"train_loss": -25.44487762451172, "global_step": 349604, "epoch": 4212} {"train_loss": -25.60796546936035, "global_step": 349605, "epoch": 4212} {"train_loss": -25.314756393432617, "global_step": 349606, "epoch": 4212} {"train_loss": -25.20092010498047, "global_step": 349607, "epoch": 4212} {"train_loss": -25.784692764282227, "global_step": 349608, "epoch": 4212} {"train_loss": -25.62700843811035, "global_step": 349609, "epoch": 4212} {"train_loss": -25.40677261352539, "global_step": 349610, "epoch": 4212} {"train_loss": -25.721349716186523, "global_step": 349611, "epoch": 4212} {"train_loss": -25.659738540649414, "global_step": 349612, "epoch": 4212} {"train_loss": -25.403127670288086, "global_step": 349613, "epoch": 4212} {"train_loss": -25.830480575561523, "global_step": 349614, "epoch": 4212} {"train_loss": -25.74140739440918, "global_step": 349615, "epoch": 4212} {"train_loss": -25.655548095703125, "global_step": 349616, "epoch": 4212} {"train_loss": -26.094003677368164, "global_step": 349617, "epoch": 4212} {"train_loss": -25.721654891967773, "global_step": 349618, "epoch": 4212} {"train_loss": -26.059158325195312, "global_step": 349619, "epoch": 4212} {"train_loss": -26.06849479675293, "global_step": 349620, "epoch": 4212} {"train_loss": -26.049884796142578, "global_step": 349621, "epoch": 4212} {"train_loss": -26.082929611206055, "global_step": 349622, "epoch": 4212} {"train_loss": -26.421533584594727, "global_step": 349623, "epoch": 4212} {"train_loss": -26.3378849029541, "global_step": 349624, "epoch": 4212} {"train_loss": -26.150903701782227, "global_step": 349625, "epoch": 4212} {"train_loss": -25.99152183532715, "global_step": 349626, "epoch": 4212} {"train_loss": -26.505868911743164, "global_step": 349627, "epoch": 4212} {"train_loss": -26.156513214111328, "global_step": 349628, "epoch": 4212} {"train_loss": -26.317975997924805, "global_step": 349629, "epoch": 4212} {"train_loss": -26.0343074798584, "global_step": 349630, "epoch": 4212} {"train_loss": -26.242843627929688, "global_step": 349631, "epoch": 4212} {"train_loss": -26.2312068939209, "global_step": 349632, "epoch": 4212} {"train_loss": -26.490238189697266, "global_step": 349633, "epoch": 4212} {"train_loss": -26.21083641052246, "global_step": 349634, "epoch": 4212} {"train_loss": -26.2396297454834, "global_step": 349635, "epoch": 4212} {"train_loss": -26.5024356842041, "global_step": 349636, "epoch": 4212} {"train_loss": -26.329313278198242, "global_step": 349637, "epoch": 4212} {"train_loss": -26.056842803955078, "global_step": 349638, "epoch": 4212} {"train_loss": -26.413137435913086, "global_step": 349639, "epoch": 4212} {"train_loss": -26.401172637939453, "global_step": 349640, "epoch": 4212} {"train_loss": -26.128454208374023, "global_step": 349641, "epoch": 4212} {"train_loss": -26.412321090698242, "global_step": 349642, "epoch": 4212} {"train_loss": -26.227081298828125, "global_step": 349643, "epoch": 4212} {"train_loss": -26.4773006439209, "global_step": 349644, "epoch": 4212} {"train_loss": -26.5483341217041, "global_step": 349645, "epoch": 4212} {"train_loss": -26.305150985717773, "global_step": 349646, "epoch": 4212} {"train_loss": -26.438262939453125, "global_step": 349647, "epoch": 4212} {"train_loss": -26.23175621032715, "global_step": 349648, "epoch": 4212} {"train_loss": -25.62668228149414, "global_step": 349649, "epoch": 4212} {"train_loss": -26.24106788635254, "global_step": 349650, "epoch": 4212} {"train_loss": -25.956518173217773, "global_step": 349651, "epoch": 4212} {"train_loss": -26.397241592407227, "global_step": 349652, "epoch": 4212} {"train_loss": -26.08164405822754, "global_step": 349653, "epoch": 4212} {"train_loss": -25.609479904174805, "global_step": 349654, "epoch": 4212} {"train_loss": -26.38331413269043, "global_step": 349655, "epoch": 4212} {"train_loss": -26.083616256713867, "global_step": 349656, "epoch": 4212} {"train_loss": -26.01189613342285, "global_step": 349657, "epoch": 4212} {"train_loss": -25.595348358154297, "global_step": 349658, "epoch": 4212} {"train_loss": -26.046186447143555, "global_step": 349659, "epoch": 4212} {"train_loss": -25.904144287109375, "global_step": 349660, "epoch": 4212} {"train_loss": -26.512231826782227, "global_step": 349661, "epoch": 4212} {"train_loss": -26.256086349487305, "global_step": 349662, "epoch": 4212} {"train_loss": -25.551593780517578, "global_step": 349663, "epoch": 4212} {"train_loss": -25.543371200561523, "global_step": 349664, "epoch": 4212} {"train_loss": -26.161298751831055, "global_step": 349665, "epoch": 4212} {"train_loss": -25.669153213500977, "global_step": 349666, "epoch": 4212} {"train_loss": -25.988208770751953, "global_step": 349667, "epoch": 4212} {"train_loss": -26.420934677124023, "global_step": 349668, "epoch": 4212} {"train_loss": -26.0759220123291, "global_step": 349669, "epoch": 4212} {"train_loss": -25.837738037109375, "global_step": 349670, "epoch": 4212} {"train_loss": -25.986291885375977, "global_step": 349671, "epoch": 4212} {"train_loss": -25.996442794799805, "global_step": 349672, "epoch": 4212} {"train_loss": -26.195068359375, "global_step": 349673, "epoch": 4212} {"train_loss": -26.1527156829834, "global_step": 349674, "epoch": 4212} {"train_loss": -26.098800659179688, "global_step": 349675, "epoch": 4212} {"train_loss": -26.179779052734375, "global_step": 349676, "epoch": 4212} {"train_loss": -26.302536010742188, "global_step": 349677, "epoch": 4212} {"train_loss": -25.960389976041863, "global_step": 349678, "epoch": 4212, "val_loss": 6598697.0} {"train_loss": -26.090803146362305, "global_step": 349679, "epoch": 4213} {"train_loss": -25.330482482910156, "global_step": 349680, "epoch": 4213} {"train_loss": -25.781482696533203, "global_step": 349681, "epoch": 4213} {"train_loss": -25.36110496520996, "global_step": 349682, "epoch": 4213} {"train_loss": -25.764907836914062, "global_step": 349683, "epoch": 4213} {"train_loss": -25.636091232299805, "global_step": 349684, "epoch": 4213} {"train_loss": -25.899112701416016, "global_step": 349685, "epoch": 4213} {"train_loss": -26.014989852905273, "global_step": 349686, "epoch": 4213} {"train_loss": -25.81817054748535, "global_step": 349687, "epoch": 4213} {"train_loss": -25.819013595581055, "global_step": 349688, "epoch": 4213} {"train_loss": -25.968399047851562, "global_step": 349689, "epoch": 4213} {"train_loss": -25.977203369140625, "global_step": 349690, "epoch": 4213} {"train_loss": -25.737897872924805, "global_step": 349691, "epoch": 4213} {"train_loss": -25.9016056060791, "global_step": 349692, "epoch": 4213} {"train_loss": -25.833524703979492, "global_step": 349693, "epoch": 4213} {"train_loss": -25.86310386657715, "global_step": 349694, "epoch": 4213} {"train_loss": -26.1099853515625, "global_step": 349695, "epoch": 4213} {"train_loss": -25.9208927154541, "global_step": 349696, "epoch": 4213} {"train_loss": -26.086179733276367, "global_step": 349697, "epoch": 4213} {"train_loss": -26.252283096313477, "global_step": 349698, "epoch": 4213} {"train_loss": -26.1286678314209, "global_step": 349699, "epoch": 4213} {"train_loss": -25.814870834350586, "global_step": 349700, "epoch": 4213} {"train_loss": -26.2628173828125, "global_step": 349701, "epoch": 4213} {"train_loss": -26.112945556640625, "global_step": 349702, "epoch": 4213} {"train_loss": -26.066259384155273, "global_step": 349703, "epoch": 4213} {"train_loss": -26.173690795898438, "global_step": 349704, "epoch": 4213} {"train_loss": -26.21518898010254, "global_step": 349705, "epoch": 4213} {"train_loss": -26.046371459960938, "global_step": 349706, "epoch": 4213} {"train_loss": -26.152801513671875, "global_step": 349707, "epoch": 4213} {"train_loss": -25.855436325073242, "global_step": 349708, "epoch": 4213} {"train_loss": -26.297632217407227, "global_step": 349709, "epoch": 4213} {"train_loss": -26.157575607299805, "global_step": 349710, "epoch": 4213} {"train_loss": -26.089340209960938, "global_step": 349711, "epoch": 4213} {"train_loss": -26.466415405273438, "global_step": 349712, "epoch": 4213} {"train_loss": -26.26193618774414, "global_step": 349713, "epoch": 4213} {"train_loss": -26.601608276367188, "global_step": 349714, "epoch": 4213} {"train_loss": -25.990158081054688, "global_step": 349715, "epoch": 4213} {"train_loss": -25.90699577331543, "global_step": 349716, "epoch": 4213} {"train_loss": -26.146076202392578, "global_step": 349717, "epoch": 4213} {"train_loss": -26.228925704956055, "global_step": 349718, "epoch": 4213} {"train_loss": -25.915283203125, "global_step": 349719, "epoch": 4213} {"train_loss": -26.789331436157227, "global_step": 349720, "epoch": 4213} {"train_loss": -26.4608154296875, "global_step": 349721, "epoch": 4213} {"train_loss": -26.49163246154785, "global_step": 349722, "epoch": 4213} {"train_loss": -26.112619400024414, "global_step": 349723, "epoch": 4213} {"train_loss": -26.56488037109375, "global_step": 349724, "epoch": 4213} {"train_loss": -26.266681671142578, "global_step": 349725, "epoch": 4213} {"train_loss": -26.336292266845703, "global_step": 349726, "epoch": 4213} {"train_loss": -26.062122344970703, "global_step": 349727, "epoch": 4213} {"train_loss": -26.109806060791016, "global_step": 349728, "epoch": 4213} {"train_loss": -26.252180099487305, "global_step": 349729, "epoch": 4213} {"train_loss": -26.743518829345703, "global_step": 349730, "epoch": 4213} {"train_loss": -26.2820987701416, "global_step": 349731, "epoch": 4213} {"train_loss": -26.405689239501953, "global_step": 349732, "epoch": 4213} {"train_loss": -26.321308135986328, "global_step": 349733, "epoch": 4213} {"train_loss": -26.35251235961914, "global_step": 349734, "epoch": 4213} {"train_loss": -26.10220718383789, "global_step": 349735, "epoch": 4213} {"train_loss": -25.99332618713379, "global_step": 349736, "epoch": 4213} {"train_loss": -26.440351486206055, "global_step": 349737, "epoch": 4213} {"train_loss": -26.138525009155273, "global_step": 349738, "epoch": 4213} {"train_loss": -26.28729820251465, "global_step": 349739, "epoch": 4213} {"train_loss": -26.588537216186523, "global_step": 349740, "epoch": 4213} {"train_loss": -26.50667381286621, "global_step": 349741, "epoch": 4213} {"train_loss": -26.240142822265625, "global_step": 349742, "epoch": 4213} {"train_loss": -26.095972061157227, "global_step": 349743, "epoch": 4213} {"train_loss": -26.347604751586914, "global_step": 349744, "epoch": 4213} {"train_loss": -26.3181209564209, "global_step": 349745, "epoch": 4213} {"train_loss": -26.230121612548828, "global_step": 349746, "epoch": 4213} {"train_loss": -26.55681800842285, "global_step": 349747, "epoch": 4213} {"train_loss": -26.26944923400879, "global_step": 349748, "epoch": 4213} {"train_loss": -26.220569610595703, "global_step": 349749, "epoch": 4213} {"train_loss": -26.356943130493164, "global_step": 349750, "epoch": 4213} {"train_loss": -26.15338134765625, "global_step": 349751, "epoch": 4213} {"train_loss": -26.033679962158203, "global_step": 349752, "epoch": 4213} {"train_loss": -26.44447135925293, "global_step": 349753, "epoch": 4213} {"train_loss": -26.32370376586914, "global_step": 349754, "epoch": 4213} {"train_loss": -26.175222396850586, "global_step": 349755, "epoch": 4213} {"train_loss": -26.60456657409668, "global_step": 349756, "epoch": 4213} {"train_loss": -26.182031631469727, "global_step": 349757, "epoch": 4213} {"train_loss": -26.67072868347168, "global_step": 349758, "epoch": 4213} {"train_loss": -26.51239013671875, "global_step": 349759, "epoch": 4213} {"train_loss": -26.0435791015625, "global_step": 349760, "epoch": 4213} {"train_loss": -26.158515493553804, "global_step": 349761, "epoch": 4213, "val_loss": 6617329.0} {"train_loss": -25.71014976501465, "global_step": 349762, "epoch": 4214} {"train_loss": -24.60317039489746, "global_step": 349763, "epoch": 4214} {"train_loss": -20.892797470092773, "global_step": 349764, "epoch": 4214} {"train_loss": -17.8734188079834, "global_step": 349765, "epoch": 4214} {"train_loss": -20.04726219177246, "global_step": 349766, "epoch": 4214} {"train_loss": -24.241174697875977, "global_step": 349767, "epoch": 4214} {"train_loss": -22.564720153808594, "global_step": 349768, "epoch": 4214} {"train_loss": -23.390783309936523, "global_step": 349769, "epoch": 4214} {"train_loss": -23.500886917114258, "global_step": 349770, "epoch": 4214} {"train_loss": -23.22214126586914, "global_step": 349771, "epoch": 4214} {"train_loss": -23.44014549255371, "global_step": 349772, "epoch": 4214} {"train_loss": -24.155065536499023, "global_step": 349773, "epoch": 4214} {"train_loss": -23.589298248291016, "global_step": 349774, "epoch": 4214} {"train_loss": -24.511747360229492, "global_step": 349775, "epoch": 4214} {"train_loss": -24.030027389526367, "global_step": 349776, "epoch": 4214} {"train_loss": -23.52103042602539, "global_step": 349777, "epoch": 4214} {"train_loss": -24.0792236328125, "global_step": 349778, "epoch": 4214} {"train_loss": -24.877243041992188, "global_step": 349779, "epoch": 4214} {"train_loss": -24.334091186523438, "global_step": 349780, "epoch": 4214} {"train_loss": -24.354228973388672, "global_step": 349781, "epoch": 4214} {"train_loss": -24.529293060302734, "global_step": 349782, "epoch": 4214} {"train_loss": -24.296527862548828, "global_step": 349783, "epoch": 4214} {"train_loss": -24.76832389831543, "global_step": 349784, "epoch": 4214} {"train_loss": -24.76548194885254, "global_step": 349785, "epoch": 4214} {"train_loss": -24.703872680664062, "global_step": 349786, "epoch": 4214} {"train_loss": -24.745092391967773, "global_step": 349787, "epoch": 4214} {"train_loss": -24.90740966796875, "global_step": 349788, "epoch": 4214} {"train_loss": -24.75428581237793, "global_step": 349789, "epoch": 4214} {"train_loss": -24.85639762878418, "global_step": 349790, "epoch": 4214} {"train_loss": -25.40669059753418, "global_step": 349791, "epoch": 4214} {"train_loss": -24.9901065826416, "global_step": 349792, "epoch": 4214} {"train_loss": -24.810321807861328, "global_step": 349793, "epoch": 4214} {"train_loss": -24.981555938720703, "global_step": 349794, "epoch": 4214} {"train_loss": -25.30719566345215, "global_step": 349795, "epoch": 4214} {"train_loss": -25.227502822875977, "global_step": 349796, "epoch": 4214} {"train_loss": -25.013532638549805, "global_step": 349797, "epoch": 4214} {"train_loss": -25.620819091796875, "global_step": 349798, "epoch": 4214} {"train_loss": -25.41433334350586, "global_step": 349799, "epoch": 4214} {"train_loss": -25.593881607055664, "global_step": 349800, "epoch": 4214} {"train_loss": -25.639556884765625, "global_step": 349801, "epoch": 4214} {"train_loss": -25.6019344329834, "global_step": 349802, "epoch": 4214} {"train_loss": -25.288877487182617, "global_step": 349803, "epoch": 4214} {"train_loss": -25.625476837158203, "global_step": 349804, "epoch": 4214} {"train_loss": -25.6160831451416, "global_step": 349805, "epoch": 4214} {"train_loss": -25.584230422973633, "global_step": 349806, "epoch": 4214} {"train_loss": -26.150781631469727, "global_step": 349807, "epoch": 4214} {"train_loss": -26.145029067993164, "global_step": 349808, "epoch": 4214} {"train_loss": -25.89777946472168, "global_step": 349809, "epoch": 4214} {"train_loss": -25.955795288085938, "global_step": 349810, "epoch": 4214} {"train_loss": -25.50880241394043, "global_step": 349811, "epoch": 4214} {"train_loss": -25.8758544921875, "global_step": 349812, "epoch": 4214} {"train_loss": -26.216297149658203, "global_step": 349813, "epoch": 4214} {"train_loss": -25.82491111755371, "global_step": 349814, "epoch": 4214} {"train_loss": -26.336084365844727, "global_step": 349815, "epoch": 4214} {"train_loss": -25.6221866607666, "global_step": 349816, "epoch": 4214} {"train_loss": -25.768157958984375, "global_step": 349817, "epoch": 4214} {"train_loss": -26.0580997467041, "global_step": 349818, "epoch": 4214} {"train_loss": -26.474136352539062, "global_step": 349819, "epoch": 4214} {"train_loss": -26.100067138671875, "global_step": 349820, "epoch": 4214} {"train_loss": -26.460214614868164, "global_step": 349821, "epoch": 4214} {"train_loss": -25.990304946899414, "global_step": 349822, "epoch": 4214} {"train_loss": -25.805334091186523, "global_step": 349823, "epoch": 4214} {"train_loss": -26.180418014526367, "global_step": 349824, "epoch": 4214} {"train_loss": -25.980548858642578, "global_step": 349825, "epoch": 4214} {"train_loss": -26.368000030517578, "global_step": 349826, "epoch": 4214} {"train_loss": -26.315143585205078, "global_step": 349827, "epoch": 4214} {"train_loss": -26.20082664489746, "global_step": 349828, "epoch": 4214} {"train_loss": -26.090845108032227, "global_step": 349829, "epoch": 4214} {"train_loss": -26.375503540039062, "global_step": 349830, "epoch": 4214} {"train_loss": -26.186574935913086, "global_step": 349831, "epoch": 4214} {"train_loss": -26.289270401000977, "global_step": 349832, "epoch": 4214} {"train_loss": -26.287256240844727, "global_step": 349833, "epoch": 4214} {"train_loss": -26.38427734375, "global_step": 349834, "epoch": 4214} {"train_loss": -26.5011043548584, "global_step": 349835, "epoch": 4214} {"train_loss": -26.628101348876953, "global_step": 349836, "epoch": 4214} {"train_loss": -26.005651473999023, "global_step": 349837, "epoch": 4214} {"train_loss": -26.4121036529541, "global_step": 349838, "epoch": 4214} {"train_loss": -26.18739891052246, "global_step": 349839, "epoch": 4214} {"train_loss": -26.544172286987305, "global_step": 349840, "epoch": 4214} {"train_loss": -26.488447189331055, "global_step": 349841, "epoch": 4214} {"train_loss": -26.41816520690918, "global_step": 349842, "epoch": 4214} {"train_loss": -26.336191177368164, "global_step": 349843, "epoch": 4214} {"train_loss": -25.169969765536756, "global_step": 349844, "epoch": 4214, "val_loss": 6554546.0} {"train_loss": -25.588998794555664, "global_step": 349845, "epoch": 4215} {"train_loss": -24.838045120239258, "global_step": 349846, "epoch": 4215} {"train_loss": -25.80011558532715, "global_step": 349847, "epoch": 4215} {"train_loss": -25.879444122314453, "global_step": 349848, "epoch": 4215} {"train_loss": -25.429841995239258, "global_step": 349849, "epoch": 4215} {"train_loss": -25.841562271118164, "global_step": 349850, "epoch": 4215} {"train_loss": -26.207990646362305, "global_step": 349851, "epoch": 4215} {"train_loss": -25.616491317749023, "global_step": 349852, "epoch": 4215} {"train_loss": -25.834308624267578, "global_step": 349853, "epoch": 4215} {"train_loss": -25.7899169921875, "global_step": 349854, "epoch": 4215} {"train_loss": -26.041629791259766, "global_step": 349855, "epoch": 4215} {"train_loss": -25.881635665893555, "global_step": 349856, "epoch": 4215} {"train_loss": -25.86345863342285, "global_step": 349857, "epoch": 4215} {"train_loss": -25.981414794921875, "global_step": 349858, "epoch": 4215} {"train_loss": -25.940814971923828, "global_step": 349859, "epoch": 4215} {"train_loss": -25.725189208984375, "global_step": 349860, "epoch": 4215} {"train_loss": -25.9947452545166, "global_step": 349861, "epoch": 4215} {"train_loss": -25.939655303955078, "global_step": 349862, "epoch": 4215} {"train_loss": -25.751760482788086, "global_step": 349863, "epoch": 4215} {"train_loss": -25.898611068725586, "global_step": 349864, "epoch": 4215} {"train_loss": -26.163663864135742, "global_step": 349865, "epoch": 4215} {"train_loss": -25.954633712768555, "global_step": 349866, "epoch": 4215} {"train_loss": -25.69367790222168, "global_step": 349867, "epoch": 4215} {"train_loss": -26.10634422302246, "global_step": 349868, "epoch": 4215} {"train_loss": -26.44663429260254, "global_step": 349869, "epoch": 4215} {"train_loss": -26.272634506225586, "global_step": 349870, "epoch": 4215} {"train_loss": -25.997699737548828, "global_step": 349871, "epoch": 4215} {"train_loss": -26.188154220581055, "global_step": 349872, "epoch": 4215} {"train_loss": -26.139089584350586, "global_step": 349873, "epoch": 4215} {"train_loss": -26.355192184448242, "global_step": 349874, "epoch": 4215} {"train_loss": -25.97980308532715, "global_step": 349875, "epoch": 4215} {"train_loss": -26.10104751586914, "global_step": 349876, "epoch": 4215} {"train_loss": -26.25282859802246, "global_step": 349877, "epoch": 4215} {"train_loss": -26.02732276916504, "global_step": 349878, "epoch": 4215} {"train_loss": -26.282018661499023, "global_step": 349879, "epoch": 4215} {"train_loss": -26.523523330688477, "global_step": 349880, "epoch": 4215} {"train_loss": -26.481611251831055, "global_step": 349881, "epoch": 4215} {"train_loss": -26.521533966064453, "global_step": 349882, "epoch": 4215} {"train_loss": -26.157257080078125, "global_step": 349883, "epoch": 4215} {"train_loss": -26.012832641601562, "global_step": 349884, "epoch": 4215} {"train_loss": -25.912351608276367, "global_step": 349885, "epoch": 4215} {"train_loss": -26.5129337310791, "global_step": 349886, "epoch": 4215} {"train_loss": -26.55716323852539, "global_step": 349887, "epoch": 4215} {"train_loss": -25.81072425842285, "global_step": 349888, "epoch": 4215} {"train_loss": -26.219635009765625, "global_step": 349889, "epoch": 4215} {"train_loss": -26.194807052612305, "global_step": 349890, "epoch": 4215} {"train_loss": -26.02229118347168, "global_step": 349891, "epoch": 4215} {"train_loss": -26.165863037109375, "global_step": 349892, "epoch": 4215} {"train_loss": -26.473127365112305, "global_step": 349893, "epoch": 4215} {"train_loss": -26.117948532104492, "global_step": 349894, "epoch": 4215} {"train_loss": -25.95050621032715, "global_step": 349895, "epoch": 4215} {"train_loss": -26.063831329345703, "global_step": 349896, "epoch": 4215} {"train_loss": -26.241357803344727, "global_step": 349897, "epoch": 4215} {"train_loss": -26.36490249633789, "global_step": 349898, "epoch": 4215} {"train_loss": -25.891332626342773, "global_step": 349899, "epoch": 4215} {"train_loss": -26.047006607055664, "global_step": 349900, "epoch": 4215} {"train_loss": -26.436079025268555, "global_step": 349901, "epoch": 4215} {"train_loss": -26.40662956237793, "global_step": 349902, "epoch": 4215} {"train_loss": -26.074859619140625, "global_step": 349903, "epoch": 4215} {"train_loss": -26.259674072265625, "global_step": 349904, "epoch": 4215} {"train_loss": -26.271381378173828, "global_step": 349905, "epoch": 4215} {"train_loss": -25.822092056274414, "global_step": 349906, "epoch": 4215} {"train_loss": -26.350921630859375, "global_step": 349907, "epoch": 4215} {"train_loss": -26.163166046142578, "global_step": 349908, "epoch": 4215} {"train_loss": -26.126943588256836, "global_step": 349909, "epoch": 4215} {"train_loss": -26.06561279296875, "global_step": 349910, "epoch": 4215} {"train_loss": -26.399337768554688, "global_step": 349911, "epoch": 4215} {"train_loss": -26.2017822265625, "global_step": 349912, "epoch": 4215} {"train_loss": -26.579431533813477, "global_step": 349913, "epoch": 4215} {"train_loss": -26.476877212524414, "global_step": 349914, "epoch": 4215} {"train_loss": -26.582839965820312, "global_step": 349915, "epoch": 4215} {"train_loss": -26.372638702392578, "global_step": 349916, "epoch": 4215} {"train_loss": -26.305694580078125, "global_step": 349917, "epoch": 4215} {"train_loss": -26.4074764251709, "global_step": 349918, "epoch": 4215} {"train_loss": -26.294361114501953, "global_step": 349919, "epoch": 4215} {"train_loss": -26.562299728393555, "global_step": 349920, "epoch": 4215} {"train_loss": -26.225515365600586, "global_step": 349921, "epoch": 4215} {"train_loss": -26.667966842651367, "global_step": 349922, "epoch": 4215} {"train_loss": -26.432147979736328, "global_step": 349923, "epoch": 4215} {"train_loss": -26.3190860748291, "global_step": 349924, "epoch": 4215} {"train_loss": -26.171613693237305, "global_step": 349925, "epoch": 4215} {"train_loss": -26.506750106811523, "global_step": 349926, "epoch": 4215} {"train_loss": -26.14462861670069, "global_step": 349927, "epoch": 4215, "val_loss": 6560803.5} {"train_loss": -25.013559341430664, "global_step": 349928, "epoch": 4216} {"train_loss": -25.610570907592773, "global_step": 349929, "epoch": 4216} {"train_loss": -25.671728134155273, "global_step": 349930, "epoch": 4216} {"train_loss": -25.666507720947266, "global_step": 349931, "epoch": 4216} {"train_loss": -25.595619201660156, "global_step": 349932, "epoch": 4216} {"train_loss": -25.56382942199707, "global_step": 349933, "epoch": 4216} {"train_loss": -25.646799087524414, "global_step": 349934, "epoch": 4216} {"train_loss": -25.81196403503418, "global_step": 349935, "epoch": 4216} {"train_loss": -25.518842697143555, "global_step": 349936, "epoch": 4216} {"train_loss": -25.824567794799805, "global_step": 349937, "epoch": 4216} {"train_loss": -25.424222946166992, "global_step": 349938, "epoch": 4216} {"train_loss": -25.85527992248535, "global_step": 349939, "epoch": 4216} {"train_loss": -25.493656158447266, "global_step": 349940, "epoch": 4216} {"train_loss": -25.639997482299805, "global_step": 349941, "epoch": 4216} {"train_loss": -25.723600387573242, "global_step": 349942, "epoch": 4216} {"train_loss": -26.104345321655273, "global_step": 349943, "epoch": 4216} {"train_loss": -26.016122817993164, "global_step": 349944, "epoch": 4216} {"train_loss": -25.93194007873535, "global_step": 349945, "epoch": 4216} {"train_loss": -25.45039939880371, "global_step": 349946, "epoch": 4216} {"train_loss": -25.535621643066406, "global_step": 349947, "epoch": 4216} {"train_loss": -26.115100860595703, "global_step": 349948, "epoch": 4216} {"train_loss": -26.050947189331055, "global_step": 349949, "epoch": 4216} {"train_loss": -26.183752059936523, "global_step": 349950, "epoch": 4216} {"train_loss": -25.971399307250977, "global_step": 349951, "epoch": 4216} {"train_loss": -25.877973556518555, "global_step": 349952, "epoch": 4216} {"train_loss": -26.252777099609375, "global_step": 349953, "epoch": 4216} {"train_loss": -26.20707130432129, "global_step": 349954, "epoch": 4216} {"train_loss": -26.050308227539062, "global_step": 349955, "epoch": 4216} {"train_loss": -26.09181022644043, "global_step": 349956, "epoch": 4216} {"train_loss": -25.72665786743164, "global_step": 349957, "epoch": 4216} {"train_loss": -25.87540626525879, "global_step": 349958, "epoch": 4216} {"train_loss": -26.167407989501953, "global_step": 349959, "epoch": 4216} {"train_loss": -26.0634708404541, "global_step": 349960, "epoch": 4216} {"train_loss": -25.932363510131836, "global_step": 349961, "epoch": 4216} {"train_loss": -26.412748336791992, "global_step": 349962, "epoch": 4216} {"train_loss": -26.40973472595215, "global_step": 349963, "epoch": 4216} {"train_loss": -26.21964454650879, "global_step": 349964, "epoch": 4216} {"train_loss": -26.662616729736328, "global_step": 349965, "epoch": 4216} {"train_loss": -26.423681259155273, "global_step": 349966, "epoch": 4216} {"train_loss": -26.402517318725586, "global_step": 349967, "epoch": 4216} {"train_loss": -25.912710189819336, "global_step": 349968, "epoch": 4216} {"train_loss": -26.284194946289062, "global_step": 349969, "epoch": 4216} {"train_loss": -26.009475708007812, "global_step": 349970, "epoch": 4216} {"train_loss": -26.194610595703125, "global_step": 349971, "epoch": 4216} {"train_loss": -26.293365478515625, "global_step": 349972, "epoch": 4216} {"train_loss": -26.327960968017578, "global_step": 349973, "epoch": 4216} {"train_loss": -26.124652862548828, "global_step": 349974, "epoch": 4216} {"train_loss": -26.234390258789062, "global_step": 349975, "epoch": 4216} {"train_loss": -26.136808395385742, "global_step": 349976, "epoch": 4216} {"train_loss": -26.47894859313965, "global_step": 349977, "epoch": 4216} {"train_loss": -26.256458282470703, "global_step": 349978, "epoch": 4216} {"train_loss": -26.322912216186523, "global_step": 349979, "epoch": 4216} {"train_loss": -25.96756362915039, "global_step": 349980, "epoch": 4216} {"train_loss": -26.233489990234375, "global_step": 349981, "epoch": 4216} {"train_loss": -26.28912353515625, "global_step": 349982, "epoch": 4216} {"train_loss": -26.0688533782959, "global_step": 349983, "epoch": 4216} {"train_loss": -26.180835723876953, "global_step": 349984, "epoch": 4216} {"train_loss": -26.232778549194336, "global_step": 349985, "epoch": 4216} {"train_loss": -26.38665199279785, "global_step": 349986, "epoch": 4216} {"train_loss": -26.4674129486084, "global_step": 349987, "epoch": 4216} {"train_loss": -26.767560958862305, "global_step": 349988, "epoch": 4216} {"train_loss": -26.2855167388916, "global_step": 349989, "epoch": 4216} {"train_loss": -26.25650978088379, "global_step": 349990, "epoch": 4216} {"train_loss": -26.3243465423584, "global_step": 349991, "epoch": 4216} {"train_loss": -26.38532066345215, "global_step": 349992, "epoch": 4216} {"train_loss": -26.52594566345215, "global_step": 349993, "epoch": 4216} {"train_loss": -26.561452865600586, "global_step": 349994, "epoch": 4216} {"train_loss": -26.20491600036621, "global_step": 349995, "epoch": 4216} {"train_loss": -26.251325607299805, "global_step": 349996, "epoch": 4216} {"train_loss": -26.43536376953125, "global_step": 349997, "epoch": 4216} {"train_loss": -26.258411407470703, "global_step": 349998, "epoch": 4216} {"train_loss": -26.49082374572754, "global_step": 349999, "epoch": 4216} {"train_loss": -26.672077178955078, "global_step": 350000, "epoch": 4216} {"train_loss": -26.2502384185791, "global_step": 350001, "epoch": 4216} {"train_loss": -26.4176025390625, "global_step": 350002, "epoch": 4216} {"train_loss": -26.480695724487305, "global_step": 350003, "epoch": 4216} {"train_loss": -26.16425895690918, "global_step": 350004, "epoch": 4216} {"train_loss": -26.435150146484375, "global_step": 350005, "epoch": 4216} {"train_loss": -26.522306442260742, "global_step": 350006, "epoch": 4216} {"train_loss": -26.4007511138916, "global_step": 350007, "epoch": 4216} {"train_loss": -26.517526626586914, "global_step": 350008, "epoch": 4216} {"train_loss": -26.470077514648438, "global_step": 350009, "epoch": 4216} {"train_loss": -26.12317708026932, "global_step": 350010, "epoch": 4216, "val_loss": 6596397.5} {"train_loss": -26.10818862915039, "global_step": 350011, "epoch": 4217} {"train_loss": -26.354461669921875, "global_step": 350012, "epoch": 4217} {"train_loss": -25.899383544921875, "global_step": 350013, "epoch": 4217} {"train_loss": -25.942035675048828, "global_step": 350014, "epoch": 4217} {"train_loss": -25.858861923217773, "global_step": 350015, "epoch": 4217} {"train_loss": -26.5345458984375, "global_step": 350016, "epoch": 4217} {"train_loss": -25.771265029907227, "global_step": 350017, "epoch": 4217} {"train_loss": -25.854345321655273, "global_step": 350018, "epoch": 4217} {"train_loss": -26.336225509643555, "global_step": 350019, "epoch": 4217} {"train_loss": -25.938526153564453, "global_step": 350020, "epoch": 4217} {"train_loss": -26.18818473815918, "global_step": 350021, "epoch": 4217} {"train_loss": -25.765399932861328, "global_step": 350022, "epoch": 4217} {"train_loss": -25.826313018798828, "global_step": 350023, "epoch": 4217} {"train_loss": -26.01557731628418, "global_step": 350024, "epoch": 4217} {"train_loss": -26.07560157775879, "global_step": 350025, "epoch": 4217} {"train_loss": -26.233184814453125, "global_step": 350026, "epoch": 4217} {"train_loss": -25.812911987304688, "global_step": 350027, "epoch": 4217} {"train_loss": -25.943511962890625, "global_step": 350028, "epoch": 4217} {"train_loss": -25.952402114868164, "global_step": 350029, "epoch": 4217} {"train_loss": -26.15516471862793, "global_step": 350030, "epoch": 4217} {"train_loss": -25.75337028503418, "global_step": 350031, "epoch": 4217} {"train_loss": -26.12262535095215, "global_step": 350032, "epoch": 4217} {"train_loss": -26.369287490844727, "global_step": 350033, "epoch": 4217} {"train_loss": -25.97511100769043, "global_step": 350034, "epoch": 4217} {"train_loss": -26.46255874633789, "global_step": 350035, "epoch": 4217} {"train_loss": -26.216217041015625, "global_step": 350036, "epoch": 4217} {"train_loss": -26.160430908203125, "global_step": 350037, "epoch": 4217} {"train_loss": -26.406152725219727, "global_step": 350038, "epoch": 4217} {"train_loss": -26.231637954711914, "global_step": 350039, "epoch": 4217} {"train_loss": -26.307666778564453, "global_step": 350040, "epoch": 4217} {"train_loss": -26.253698348999023, "global_step": 350041, "epoch": 4217} {"train_loss": -25.996809005737305, "global_step": 350042, "epoch": 4217} {"train_loss": -25.964258193969727, "global_step": 350043, "epoch": 4217} {"train_loss": -26.215147018432617, "global_step": 350044, "epoch": 4217} {"train_loss": -25.772083282470703, "global_step": 350045, "epoch": 4217} {"train_loss": -26.3398494720459, "global_step": 350046, "epoch": 4217} {"train_loss": -25.885486602783203, "global_step": 350047, "epoch": 4217} {"train_loss": -26.117074966430664, "global_step": 350048, "epoch": 4217} {"train_loss": -26.121564865112305, "global_step": 350049, "epoch": 4217} {"train_loss": -25.91757583618164, "global_step": 350050, "epoch": 4217} {"train_loss": -26.212915420532227, "global_step": 350051, "epoch": 4217} {"train_loss": -25.576908111572266, "global_step": 350052, "epoch": 4217} {"train_loss": -26.283262252807617, "global_step": 350053, "epoch": 4217} {"train_loss": -26.06129264831543, "global_step": 350054, "epoch": 4217} {"train_loss": -26.280841827392578, "global_step": 350055, "epoch": 4217} {"train_loss": -25.953699111938477, "global_step": 350056, "epoch": 4217} {"train_loss": -26.131824493408203, "global_step": 350057, "epoch": 4217} {"train_loss": -26.191553115844727, "global_step": 350058, "epoch": 4217} {"train_loss": -26.31201171875, "global_step": 350059, "epoch": 4217} {"train_loss": -26.453039169311523, "global_step": 350060, "epoch": 4217} {"train_loss": -26.25922203063965, "global_step": 350061, "epoch": 4217} {"train_loss": -26.33155632019043, "global_step": 350062, "epoch": 4217} {"train_loss": -26.12617301940918, "global_step": 350063, "epoch": 4217} {"train_loss": -26.0551700592041, "global_step": 350064, "epoch": 4217} {"train_loss": -25.838491439819336, "global_step": 350065, "epoch": 4217} {"train_loss": -26.290857315063477, "global_step": 350066, "epoch": 4217} {"train_loss": -26.12567710876465, "global_step": 350067, "epoch": 4217} {"train_loss": -26.546239852905273, "global_step": 350068, "epoch": 4217} {"train_loss": -26.244409561157227, "global_step": 350069, "epoch": 4217} {"train_loss": -26.153844833374023, "global_step": 350070, "epoch": 4217} {"train_loss": -26.227537155151367, "global_step": 350071, "epoch": 4217} {"train_loss": -26.111120223999023, "global_step": 350072, "epoch": 4217} {"train_loss": -26.25469398498535, "global_step": 350073, "epoch": 4217} {"train_loss": -26.264484405517578, "global_step": 350074, "epoch": 4217} {"train_loss": -26.074758529663086, "global_step": 350075, "epoch": 4217} {"train_loss": -26.515928268432617, "global_step": 350076, "epoch": 4217} {"train_loss": -26.329193115234375, "global_step": 350077, "epoch": 4217} {"train_loss": -26.361719131469727, "global_step": 350078, "epoch": 4217} {"train_loss": -26.075220108032227, "global_step": 350079, "epoch": 4217} {"train_loss": -26.22590446472168, "global_step": 350080, "epoch": 4217} {"train_loss": -25.982501983642578, "global_step": 350081, "epoch": 4217} {"train_loss": -26.0003604888916, "global_step": 350082, "epoch": 4217} {"train_loss": -26.2255859375, "global_step": 350083, "epoch": 4217} {"train_loss": -25.699981689453125, "global_step": 350084, "epoch": 4217} {"train_loss": -26.1256103515625, "global_step": 350085, "epoch": 4217} {"train_loss": -26.011789321899414, "global_step": 350086, "epoch": 4217} {"train_loss": -25.887548446655273, "global_step": 350087, "epoch": 4217} {"train_loss": -25.81830406188965, "global_step": 350088, "epoch": 4217} {"train_loss": -25.852231979370117, "global_step": 350089, "epoch": 4217} {"train_loss": -26.009384155273438, "global_step": 350090, "epoch": 4217} {"train_loss": -25.645233154296875, "global_step": 350091, "epoch": 4217} {"train_loss": -25.846729278564453, "global_step": 350092, "epoch": 4217} {"train_loss": -26.101658350013825, "global_step": 350093, "epoch": 4217, "val_loss": 6587143.0} {"train_loss": -25.876245498657227, "global_step": 350094, "epoch": 4218} {"train_loss": -25.183012008666992, "global_step": 350095, "epoch": 4218} {"train_loss": -25.20643424987793, "global_step": 350096, "epoch": 4218} {"train_loss": -25.885150909423828, "global_step": 350097, "epoch": 4218} {"train_loss": -25.35785484313965, "global_step": 350098, "epoch": 4218} {"train_loss": -24.697738647460938, "global_step": 350099, "epoch": 4218} {"train_loss": -25.792673110961914, "global_step": 350100, "epoch": 4218} {"train_loss": -25.149389266967773, "global_step": 350101, "epoch": 4218} {"train_loss": -25.325090408325195, "global_step": 350102, "epoch": 4218} {"train_loss": -25.564136505126953, "global_step": 350103, "epoch": 4218} {"train_loss": -25.648040771484375, "global_step": 350104, "epoch": 4218} {"train_loss": -26.001422882080078, "global_step": 350105, "epoch": 4218} {"train_loss": -25.544248580932617, "global_step": 350106, "epoch": 4218} {"train_loss": -25.6740779876709, "global_step": 350107, "epoch": 4218} {"train_loss": -25.71611976623535, "global_step": 350108, "epoch": 4218} {"train_loss": -25.490427017211914, "global_step": 350109, "epoch": 4218} {"train_loss": -25.83479118347168, "global_step": 350110, "epoch": 4218} {"train_loss": -26.340646743774414, "global_step": 350111, "epoch": 4218} {"train_loss": -25.741531372070312, "global_step": 350112, "epoch": 4218} {"train_loss": -26.014917373657227, "global_step": 350113, "epoch": 4218} {"train_loss": -25.888324737548828, "global_step": 350114, "epoch": 4218} {"train_loss": -26.02370262145996, "global_step": 350115, "epoch": 4218} {"train_loss": -26.156457901000977, "global_step": 350116, "epoch": 4218} {"train_loss": -26.125944137573242, "global_step": 350117, "epoch": 4218} {"train_loss": -26.126174926757812, "global_step": 350118, "epoch": 4218} {"train_loss": -26.003280639648438, "global_step": 350119, "epoch": 4218} {"train_loss": -26.132123947143555, "global_step": 350120, "epoch": 4218} {"train_loss": -25.882415771484375, "global_step": 350121, "epoch": 4218} {"train_loss": -25.860706329345703, "global_step": 350122, "epoch": 4218} {"train_loss": -25.95686912536621, "global_step": 350123, "epoch": 4218} {"train_loss": -25.684823989868164, "global_step": 350124, "epoch": 4218} {"train_loss": -26.294330596923828, "global_step": 350125, "epoch": 4218} {"train_loss": -25.78781509399414, "global_step": 350126, "epoch": 4218} {"train_loss": -25.929859161376953, "global_step": 350127, "epoch": 4218} {"train_loss": -26.33673667907715, "global_step": 350128, "epoch": 4218} {"train_loss": -25.9288330078125, "global_step": 350129, "epoch": 4218} {"train_loss": -26.118976593017578, "global_step": 350130, "epoch": 4218} {"train_loss": -26.182453155517578, "global_step": 350131, "epoch": 4218} {"train_loss": -26.155139923095703, "global_step": 350132, "epoch": 4218} {"train_loss": -25.98138427734375, "global_step": 350133, "epoch": 4218} {"train_loss": -26.396875381469727, "global_step": 350134, "epoch": 4218} {"train_loss": -26.53546714782715, "global_step": 350135, "epoch": 4218} {"train_loss": -26.1224422454834, "global_step": 350136, "epoch": 4218} {"train_loss": -26.061847686767578, "global_step": 350137, "epoch": 4218} {"train_loss": -26.3685359954834, "global_step": 350138, "epoch": 4218} {"train_loss": -26.310028076171875, "global_step": 350139, "epoch": 4218} {"train_loss": -26.340219497680664, "global_step": 350140, "epoch": 4218} {"train_loss": -26.043527603149414, "global_step": 350141, "epoch": 4218} {"train_loss": -26.301288604736328, "global_step": 350142, "epoch": 4218} {"train_loss": -26.42473793029785, "global_step": 350143, "epoch": 4218} {"train_loss": -25.984434127807617, "global_step": 350144, "epoch": 4218} {"train_loss": -26.3389949798584, "global_step": 350145, "epoch": 4218} {"train_loss": -26.036651611328125, "global_step": 350146, "epoch": 4218} {"train_loss": -26.298416137695312, "global_step": 350147, "epoch": 4218} {"train_loss": -26.11280632019043, "global_step": 350148, "epoch": 4218} {"train_loss": -26.63698387145996, "global_step": 350149, "epoch": 4218} {"train_loss": -26.55332374572754, "global_step": 350150, "epoch": 4218} {"train_loss": -26.323286056518555, "global_step": 350151, "epoch": 4218} {"train_loss": -25.873859405517578, "global_step": 350152, "epoch": 4218} {"train_loss": -26.1829891204834, "global_step": 350153, "epoch": 4218} {"train_loss": -26.4567813873291, "global_step": 350154, "epoch": 4218} {"train_loss": -25.929920196533203, "global_step": 350155, "epoch": 4218} {"train_loss": -26.362518310546875, "global_step": 350156, "epoch": 4218} {"train_loss": -26.3187255859375, "global_step": 350157, "epoch": 4218} {"train_loss": -26.58331298828125, "global_step": 350158, "epoch": 4218} {"train_loss": -26.622821807861328, "global_step": 350159, "epoch": 4218} {"train_loss": -26.239316940307617, "global_step": 350160, "epoch": 4218} {"train_loss": -26.055805206298828, "global_step": 350161, "epoch": 4218} {"train_loss": -26.226444244384766, "global_step": 350162, "epoch": 4218} {"train_loss": -26.306594848632812, "global_step": 350163, "epoch": 4218} {"train_loss": -26.460159301757812, "global_step": 350164, "epoch": 4218} {"train_loss": -26.41486930847168, "global_step": 350165, "epoch": 4218} {"train_loss": -26.29926872253418, "global_step": 350166, "epoch": 4218} {"train_loss": -26.290699005126953, "global_step": 350167, "epoch": 4218} {"train_loss": -26.55891227722168, "global_step": 350168, "epoch": 4218} {"train_loss": -26.1895751953125, "global_step": 350169, "epoch": 4218} {"train_loss": -26.455289840698242, "global_step": 350170, "epoch": 4218} {"train_loss": -26.076528549194336, "global_step": 350171, "epoch": 4218} {"train_loss": -26.256757736206055, "global_step": 350172, "epoch": 4218} {"train_loss": -26.0552978515625, "global_step": 350173, "epoch": 4218} {"train_loss": -26.0707950592041, "global_step": 350174, "epoch": 4218} {"train_loss": -26.3834285736084, "global_step": 350175, "epoch": 4218} {"train_loss": -26.06649601028626, "global_step": 350176, "epoch": 4218, "val_loss": 6580298.5} {"train_loss": -25.130878448486328, "global_step": 350177, "epoch": 4219} {"train_loss": -24.384777069091797, "global_step": 350178, "epoch": 4219} {"train_loss": -25.010141372680664, "global_step": 350179, "epoch": 4219} {"train_loss": -24.607534408569336, "global_step": 350180, "epoch": 4219} {"train_loss": -25.603498458862305, "global_step": 350181, "epoch": 4219} {"train_loss": -24.508893966674805, "global_step": 350182, "epoch": 4219} {"train_loss": -25.638385772705078, "global_step": 350183, "epoch": 4219} {"train_loss": -24.87487030029297, "global_step": 350184, "epoch": 4219} {"train_loss": -25.57553482055664, "global_step": 350185, "epoch": 4219} {"train_loss": -25.388559341430664, "global_step": 350186, "epoch": 4219} {"train_loss": -25.857446670532227, "global_step": 350187, "epoch": 4219} {"train_loss": -25.514223098754883, "global_step": 350188, "epoch": 4219} {"train_loss": -25.733884811401367, "global_step": 350189, "epoch": 4219} {"train_loss": -25.623327255249023, "global_step": 350190, "epoch": 4219} {"train_loss": -25.797754287719727, "global_step": 350191, "epoch": 4219} {"train_loss": -25.759536743164062, "global_step": 350192, "epoch": 4219} {"train_loss": -25.62637710571289, "global_step": 350193, "epoch": 4219} {"train_loss": -26.036121368408203, "global_step": 350194, "epoch": 4219} {"train_loss": -25.609756469726562, "global_step": 350195, "epoch": 4219} {"train_loss": -25.68886375427246, "global_step": 350196, "epoch": 4219} {"train_loss": -25.84490394592285, "global_step": 350197, "epoch": 4219} {"train_loss": -25.9478816986084, "global_step": 350198, "epoch": 4219} {"train_loss": -25.709548950195312, "global_step": 350199, "epoch": 4219} {"train_loss": -25.78057861328125, "global_step": 350200, "epoch": 4219} {"train_loss": -25.766294479370117, "global_step": 350201, "epoch": 4219} {"train_loss": -26.228540420532227, "global_step": 350202, "epoch": 4219} {"train_loss": -26.126148223876953, "global_step": 350203, "epoch": 4219} {"train_loss": -25.920888900756836, "global_step": 350204, "epoch": 4219} {"train_loss": -25.800745010375977, "global_step": 350205, "epoch": 4219} {"train_loss": -26.1700382232666, "global_step": 350206, "epoch": 4219} {"train_loss": -25.712512969970703, "global_step": 350207, "epoch": 4219} {"train_loss": -25.603565216064453, "global_step": 350208, "epoch": 4219} {"train_loss": -25.876617431640625, "global_step": 350209, "epoch": 4219} {"train_loss": -26.18768882751465, "global_step": 350210, "epoch": 4219} {"train_loss": -25.76788902282715, "global_step": 350211, "epoch": 4219} {"train_loss": -25.86972427368164, "global_step": 350212, "epoch": 4219} {"train_loss": -26.087560653686523, "global_step": 350213, "epoch": 4219} {"train_loss": -26.274255752563477, "global_step": 350214, "epoch": 4219} {"train_loss": -26.35396385192871, "global_step": 350215, "epoch": 4219} {"train_loss": -26.082395553588867, "global_step": 350216, "epoch": 4219} {"train_loss": -26.095874786376953, "global_step": 350217, "epoch": 4219} {"train_loss": -26.46553611755371, "global_step": 350218, "epoch": 4219} {"train_loss": -26.425939559936523, "global_step": 350219, "epoch": 4219} {"train_loss": -26.479389190673828, "global_step": 350220, "epoch": 4219} {"train_loss": -26.449176788330078, "global_step": 350221, "epoch": 4219} {"train_loss": -26.464984893798828, "global_step": 350222, "epoch": 4219} {"train_loss": -26.13677978515625, "global_step": 350223, "epoch": 4219} {"train_loss": -26.39632225036621, "global_step": 350224, "epoch": 4219} {"train_loss": -26.481840133666992, "global_step": 350225, "epoch": 4219} {"train_loss": -26.364948272705078, "global_step": 350226, "epoch": 4219} {"train_loss": -26.3333797454834, "global_step": 350227, "epoch": 4219} {"train_loss": -26.067651748657227, "global_step": 350228, "epoch": 4219} {"train_loss": -26.47686767578125, "global_step": 350229, "epoch": 4219} {"train_loss": -26.519607543945312, "global_step": 350230, "epoch": 4219} {"train_loss": -26.473712921142578, "global_step": 350231, "epoch": 4219} {"train_loss": -26.442930221557617, "global_step": 350232, "epoch": 4219} {"train_loss": -26.4058837890625, "global_step": 350233, "epoch": 4219} {"train_loss": -26.442230224609375, "global_step": 350234, "epoch": 4219} {"train_loss": -26.402820587158203, "global_step": 350235, "epoch": 4219} {"train_loss": -26.646596908569336, "global_step": 350236, "epoch": 4219} {"train_loss": -26.136371612548828, "global_step": 350237, "epoch": 4219} {"train_loss": -26.335046768188477, "global_step": 350238, "epoch": 4219} {"train_loss": -26.083438873291016, "global_step": 350239, "epoch": 4219} {"train_loss": -25.420486450195312, "global_step": 350240, "epoch": 4219} {"train_loss": -25.619176864624023, "global_step": 350241, "epoch": 4219} {"train_loss": -25.932209014892578, "global_step": 350242, "epoch": 4219} {"train_loss": -26.259536743164062, "global_step": 350243, "epoch": 4219} {"train_loss": -25.370410919189453, "global_step": 350244, "epoch": 4219} {"train_loss": -25.62774658203125, "global_step": 350245, "epoch": 4219} {"train_loss": -25.85453224182129, "global_step": 350246, "epoch": 4219} {"train_loss": -25.298524856567383, "global_step": 350247, "epoch": 4219} {"train_loss": -25.79206657409668, "global_step": 350248, "epoch": 4219} {"train_loss": -25.92344093322754, "global_step": 350249, "epoch": 4219} {"train_loss": -25.755773544311523, "global_step": 350250, "epoch": 4219} {"train_loss": -25.828857421875, "global_step": 350251, "epoch": 4219} {"train_loss": -26.010486602783203, "global_step": 350252, "epoch": 4219} {"train_loss": -25.609899520874023, "global_step": 350253, "epoch": 4219} {"train_loss": -26.102075576782227, "global_step": 350254, "epoch": 4219} {"train_loss": -25.933420181274414, "global_step": 350255, "epoch": 4219} {"train_loss": -26.220703125, "global_step": 350256, "epoch": 4219} {"train_loss": -25.84292984008789, "global_step": 350257, "epoch": 4219} {"train_loss": -26.20890235900879, "global_step": 350258, "epoch": 4219} {"train_loss": -25.917470702205797, "global_step": 350259, "epoch": 4219, "val_loss": 6544968.0} {"train_loss": -25.289382934570312, "global_step": 350260, "epoch": 4220} {"train_loss": -25.809762954711914, "global_step": 350261, "epoch": 4220} {"train_loss": -25.912031173706055, "global_step": 350262, "epoch": 4220} {"train_loss": -25.34304428100586, "global_step": 350263, "epoch": 4220} {"train_loss": -25.319976806640625, "global_step": 350264, "epoch": 4220} {"train_loss": -25.727436065673828, "global_step": 350265, "epoch": 4220} {"train_loss": -25.6863956451416, "global_step": 350266, "epoch": 4220} {"train_loss": -25.6451473236084, "global_step": 350267, "epoch": 4220} {"train_loss": -25.817977905273438, "global_step": 350268, "epoch": 4220} {"train_loss": -25.730056762695312, "global_step": 350269, "epoch": 4220} {"train_loss": -25.732440948486328, "global_step": 350270, "epoch": 4220} {"train_loss": -25.876813888549805, "global_step": 350271, "epoch": 4220} {"train_loss": -26.034635543823242, "global_step": 350272, "epoch": 4220} {"train_loss": -26.123065948486328, "global_step": 350273, "epoch": 4220} {"train_loss": -25.548032760620117, "global_step": 350274, "epoch": 4220} {"train_loss": -25.964704513549805, "global_step": 350275, "epoch": 4220} {"train_loss": -26.066991806030273, "global_step": 350276, "epoch": 4220} {"train_loss": -25.82440185546875, "global_step": 350277, "epoch": 4220} {"train_loss": -25.8048152923584, "global_step": 350278, "epoch": 4220} {"train_loss": -26.028066635131836, "global_step": 350279, "epoch": 4220} {"train_loss": -25.780012130737305, "global_step": 350280, "epoch": 4220} {"train_loss": -25.924224853515625, "global_step": 350281, "epoch": 4220} {"train_loss": -25.887943267822266, "global_step": 350282, "epoch": 4220} {"train_loss": -25.82402992248535, "global_step": 350283, "epoch": 4220} {"train_loss": -25.970184326171875, "global_step": 350284, "epoch": 4220} {"train_loss": -25.671466827392578, "global_step": 350285, "epoch": 4220} {"train_loss": -26.19976806640625, "global_step": 350286, "epoch": 4220} {"train_loss": -26.244592666625977, "global_step": 350287, "epoch": 4220} {"train_loss": -25.965932846069336, "global_step": 350288, "epoch": 4220} {"train_loss": -26.50973892211914, "global_step": 350289, "epoch": 4220} {"train_loss": -26.509428024291992, "global_step": 350290, "epoch": 4220} {"train_loss": -26.113508224487305, "global_step": 350291, "epoch": 4220} {"train_loss": -26.104467391967773, "global_step": 350292, "epoch": 4220} {"train_loss": -26.546863555908203, "global_step": 350293, "epoch": 4220} {"train_loss": -26.254247665405273, "global_step": 350294, "epoch": 4220} {"train_loss": -26.091108322143555, "global_step": 350295, "epoch": 4220} {"train_loss": -26.387434005737305, "global_step": 350296, "epoch": 4220} {"train_loss": -25.92392349243164, "global_step": 350297, "epoch": 4220} {"train_loss": -26.278167724609375, "global_step": 350298, "epoch": 4220} {"train_loss": -26.32813835144043, "global_step": 350299, "epoch": 4220} {"train_loss": -26.660785675048828, "global_step": 350300, "epoch": 4220} {"train_loss": -25.905927658081055, "global_step": 350301, "epoch": 4220} {"train_loss": -26.30976676940918, "global_step": 350302, "epoch": 4220} {"train_loss": -26.145700454711914, "global_step": 350303, "epoch": 4220} {"train_loss": -26.27314567565918, "global_step": 350304, "epoch": 4220} {"train_loss": -25.988473892211914, "global_step": 350305, "epoch": 4220} {"train_loss": -26.57162857055664, "global_step": 350306, "epoch": 4220} {"train_loss": -26.501855850219727, "global_step": 350307, "epoch": 4220} {"train_loss": -26.016357421875, "global_step": 350308, "epoch": 4220} {"train_loss": -26.54996681213379, "global_step": 350309, "epoch": 4220} {"train_loss": -26.52545166015625, "global_step": 350310, "epoch": 4220} {"train_loss": -26.420013427734375, "global_step": 350311, "epoch": 4220} {"train_loss": -26.26702880859375, "global_step": 350312, "epoch": 4220} {"train_loss": -26.275251388549805, "global_step": 350313, "epoch": 4220} {"train_loss": -26.18509292602539, "global_step": 350314, "epoch": 4220} {"train_loss": -26.481603622436523, "global_step": 350315, "epoch": 4220} {"train_loss": -26.14900779724121, "global_step": 350316, "epoch": 4220} {"train_loss": -25.994861602783203, "global_step": 350317, "epoch": 4220} {"train_loss": -25.652917861938477, "global_step": 350318, "epoch": 4220} {"train_loss": -26.261035919189453, "global_step": 350319, "epoch": 4220} {"train_loss": -26.35257911682129, "global_step": 350320, "epoch": 4220} {"train_loss": -26.264331817626953, "global_step": 350321, "epoch": 4220} {"train_loss": -26.1689453125, "global_step": 350322, "epoch": 4220} {"train_loss": -26.159997940063477, "global_step": 350323, "epoch": 4220} {"train_loss": -26.261632919311523, "global_step": 350324, "epoch": 4220} {"train_loss": -26.197912216186523, "global_step": 350325, "epoch": 4220} {"train_loss": -26.38751220703125, "global_step": 350326, "epoch": 4220} {"train_loss": -26.333959579467773, "global_step": 350327, "epoch": 4220} {"train_loss": -26.671894073486328, "global_step": 350328, "epoch": 4220} {"train_loss": -26.415868759155273, "global_step": 350329, "epoch": 4220} {"train_loss": -26.153675079345703, "global_step": 350330, "epoch": 4220} {"train_loss": -26.220029830932617, "global_step": 350331, "epoch": 4220} {"train_loss": -26.07826042175293, "global_step": 350332, "epoch": 4220} {"train_loss": -26.271642684936523, "global_step": 350333, "epoch": 4220} {"train_loss": -26.02741813659668, "global_step": 350334, "epoch": 4220} {"train_loss": -25.9790096282959, "global_step": 350335, "epoch": 4220} {"train_loss": -26.111581802368164, "global_step": 350336, "epoch": 4220} {"train_loss": -25.964160919189453, "global_step": 350337, "epoch": 4220} {"train_loss": -26.24334144592285, "global_step": 350338, "epoch": 4220} {"train_loss": -26.10377311706543, "global_step": 350339, "epoch": 4220} {"train_loss": -26.30666160583496, "global_step": 350340, "epoch": 4220} {"train_loss": -25.555625915527344, "global_step": 350341, "epoch": 4220} {"train_loss": -26.088395888546863, "global_step": 350342, "epoch": 4220, "val_loss": 6735634.5} {"train_loss": -25.21164894104004, "global_step": 350343, "epoch": 4221} {"train_loss": -25.214685440063477, "global_step": 350344, "epoch": 4221} {"train_loss": -25.5598087310791, "global_step": 350345, "epoch": 4221} {"train_loss": -25.738000869750977, "global_step": 350346, "epoch": 4221} {"train_loss": -26.077253341674805, "global_step": 350347, "epoch": 4221} {"train_loss": -26.00257682800293, "global_step": 350348, "epoch": 4221} {"train_loss": -25.47002601623535, "global_step": 350349, "epoch": 4221} {"train_loss": -26.003036499023438, "global_step": 350350, "epoch": 4221} {"train_loss": -26.1402530670166, "global_step": 350351, "epoch": 4221} {"train_loss": -25.906240463256836, "global_step": 350352, "epoch": 4221} {"train_loss": -25.953466415405273, "global_step": 350353, "epoch": 4221} {"train_loss": -25.91895866394043, "global_step": 350354, "epoch": 4221} {"train_loss": -26.35028076171875, "global_step": 350355, "epoch": 4221} {"train_loss": -26.155790328979492, "global_step": 350356, "epoch": 4221} {"train_loss": -25.848134994506836, "global_step": 350357, "epoch": 4221} {"train_loss": -26.130918502807617, "global_step": 350358, "epoch": 4221} {"train_loss": -25.96405029296875, "global_step": 350359, "epoch": 4221} {"train_loss": -25.93067741394043, "global_step": 350360, "epoch": 4221} {"train_loss": -25.710004806518555, "global_step": 350361, "epoch": 4221} {"train_loss": -25.668249130249023, "global_step": 350362, "epoch": 4221} {"train_loss": -26.0441837310791, "global_step": 350363, "epoch": 4221} {"train_loss": -26.052600860595703, "global_step": 350364, "epoch": 4221} {"train_loss": -26.15388298034668, "global_step": 350365, "epoch": 4221} {"train_loss": -25.791797637939453, "global_step": 350366, "epoch": 4221} {"train_loss": -26.22501564025879, "global_step": 350367, "epoch": 4221} {"train_loss": -26.03839683532715, "global_step": 350368, "epoch": 4221} {"train_loss": -25.696701049804688, "global_step": 350369, "epoch": 4221} {"train_loss": -26.329360961914062, "global_step": 350370, "epoch": 4221} {"train_loss": -25.997053146362305, "global_step": 350371, "epoch": 4221} {"train_loss": -25.63821792602539, "global_step": 350372, "epoch": 4221} {"train_loss": -26.343017578125, "global_step": 350373, "epoch": 4221} {"train_loss": -26.031238555908203, "global_step": 350374, "epoch": 4221} {"train_loss": -25.998533248901367, "global_step": 350375, "epoch": 4221} {"train_loss": -26.13937759399414, "global_step": 350376, "epoch": 4221} {"train_loss": -26.11578941345215, "global_step": 350377, "epoch": 4221} {"train_loss": -26.107934951782227, "global_step": 350378, "epoch": 4221} {"train_loss": -26.218286514282227, "global_step": 350379, "epoch": 4221} {"train_loss": -26.469961166381836, "global_step": 350380, "epoch": 4221} {"train_loss": -26.314701080322266, "global_step": 350381, "epoch": 4221} {"train_loss": -26.01889991760254, "global_step": 350382, "epoch": 4221} {"train_loss": -26.170019149780273, "global_step": 350383, "epoch": 4221} {"train_loss": -26.510395050048828, "global_step": 350384, "epoch": 4221} {"train_loss": -26.0405216217041, "global_step": 350385, "epoch": 4221} {"train_loss": -25.984241485595703, "global_step": 350386, "epoch": 4221} {"train_loss": -26.390832901000977, "global_step": 350387, "epoch": 4221} {"train_loss": -26.17889976501465, "global_step": 350388, "epoch": 4221} {"train_loss": -26.457843780517578, "global_step": 350389, "epoch": 4221} {"train_loss": -26.274322509765625, "global_step": 350390, "epoch": 4221} {"train_loss": -26.3889217376709, "global_step": 350391, "epoch": 4221} {"train_loss": -26.256189346313477, "global_step": 350392, "epoch": 4221} {"train_loss": -26.374868392944336, "global_step": 350393, "epoch": 4221} {"train_loss": -26.475767135620117, "global_step": 350394, "epoch": 4221} {"train_loss": -26.378589630126953, "global_step": 350395, "epoch": 4221} {"train_loss": -26.260498046875, "global_step": 350396, "epoch": 4221} {"train_loss": -26.285675048828125, "global_step": 350397, "epoch": 4221} {"train_loss": -26.468610763549805, "global_step": 350398, "epoch": 4221} {"train_loss": -26.491491317749023, "global_step": 350399, "epoch": 4221} {"train_loss": -26.444120407104492, "global_step": 350400, "epoch": 4221} {"train_loss": -26.457172393798828, "global_step": 350401, "epoch": 4221} {"train_loss": -26.569366455078125, "global_step": 350402, "epoch": 4221} {"train_loss": -26.531330108642578, "global_step": 350403, "epoch": 4221} {"train_loss": -26.574417114257812, "global_step": 350404, "epoch": 4221} {"train_loss": -26.17941665649414, "global_step": 350405, "epoch": 4221} {"train_loss": -26.0677547454834, "global_step": 350406, "epoch": 4221} {"train_loss": -26.220264434814453, "global_step": 350407, "epoch": 4221} {"train_loss": -25.6533145904541, "global_step": 350408, "epoch": 4221} {"train_loss": -25.923828125, "global_step": 350409, "epoch": 4221} {"train_loss": -26.068273544311523, "global_step": 350410, "epoch": 4221} {"train_loss": -26.667896270751953, "global_step": 350411, "epoch": 4221} {"train_loss": -26.3709774017334, "global_step": 350412, "epoch": 4221} {"train_loss": -26.143518447875977, "global_step": 350413, "epoch": 4221} {"train_loss": -26.41425895690918, "global_step": 350414, "epoch": 4221} {"train_loss": -26.40687370300293, "global_step": 350415, "epoch": 4221} {"train_loss": -26.346017837524414, "global_step": 350416, "epoch": 4221} {"train_loss": -26.173248291015625, "global_step": 350417, "epoch": 4221} {"train_loss": -26.156726837158203, "global_step": 350418, "epoch": 4221} {"train_loss": -26.29141616821289, "global_step": 350419, "epoch": 4221} {"train_loss": -26.3559627532959, "global_step": 350420, "epoch": 4221} {"train_loss": -26.253843307495117, "global_step": 350421, "epoch": 4221} {"train_loss": -26.144775390625, "global_step": 350422, "epoch": 4221} {"train_loss": -26.185104370117188, "global_step": 350423, "epoch": 4221} {"train_loss": -26.283905029296875, "global_step": 350424, "epoch": 4221} {"train_loss": -26.147076985922205, "global_step": 350425, "epoch": 4221, "val_loss": 6752959.0} {"train_loss": -25.24663734436035, "global_step": 350426, "epoch": 4222} {"train_loss": -24.94437599182129, "global_step": 350427, "epoch": 4222} {"train_loss": -24.43424415588379, "global_step": 350428, "epoch": 4222} {"train_loss": -24.5696964263916, "global_step": 350429, "epoch": 4222} {"train_loss": -25.08070945739746, "global_step": 350430, "epoch": 4222} {"train_loss": -24.38873291015625, "global_step": 350431, "epoch": 4222} {"train_loss": -25.252119064331055, "global_step": 350432, "epoch": 4222} {"train_loss": -24.9591007232666, "global_step": 350433, "epoch": 4222} {"train_loss": -24.693613052368164, "global_step": 350434, "epoch": 4222} {"train_loss": -24.86077308654785, "global_step": 350435, "epoch": 4222} {"train_loss": -24.72211265563965, "global_step": 350436, "epoch": 4222} {"train_loss": -25.471038818359375, "global_step": 350437, "epoch": 4222} {"train_loss": -25.250402450561523, "global_step": 350438, "epoch": 4222} {"train_loss": -25.537281036376953, "global_step": 350439, "epoch": 4222} {"train_loss": -25.17978858947754, "global_step": 350440, "epoch": 4222} {"train_loss": -25.826257705688477, "global_step": 350441, "epoch": 4222} {"train_loss": -25.03400230407715, "global_step": 350442, "epoch": 4222} {"train_loss": -25.65570068359375, "global_step": 350443, "epoch": 4222} {"train_loss": -25.703344345092773, "global_step": 350444, "epoch": 4222} {"train_loss": -25.526323318481445, "global_step": 350445, "epoch": 4222} {"train_loss": -25.754974365234375, "global_step": 350446, "epoch": 4222} {"train_loss": -25.70025062561035, "global_step": 350447, "epoch": 4222} {"train_loss": -25.597089767456055, "global_step": 350448, "epoch": 4222} {"train_loss": -26.0505428314209, "global_step": 350449, "epoch": 4222} {"train_loss": -25.631086349487305, "global_step": 350450, "epoch": 4222} {"train_loss": -25.69996452331543, "global_step": 350451, "epoch": 4222} {"train_loss": -25.80647087097168, "global_step": 350452, "epoch": 4222} {"train_loss": -25.78948402404785, "global_step": 350453, "epoch": 4222} {"train_loss": -26.095922470092773, "global_step": 350454, "epoch": 4222} {"train_loss": -26.006513595581055, "global_step": 350455, "epoch": 4222} {"train_loss": -25.648889541625977, "global_step": 350456, "epoch": 4222} {"train_loss": -25.882984161376953, "global_step": 350457, "epoch": 4222} {"train_loss": -25.917591094970703, "global_step": 350458, "epoch": 4222} {"train_loss": -26.078351974487305, "global_step": 350459, "epoch": 4222} {"train_loss": -25.7238712310791, "global_step": 350460, "epoch": 4222} {"train_loss": -25.918872833251953, "global_step": 350461, "epoch": 4222} {"train_loss": -26.266138076782227, "global_step": 350462, "epoch": 4222} {"train_loss": -26.16156005859375, "global_step": 350463, "epoch": 4222} {"train_loss": -26.09515380859375, "global_step": 350464, "epoch": 4222} {"train_loss": -26.320220947265625, "global_step": 350465, "epoch": 4222} {"train_loss": -26.17498207092285, "global_step": 350466, "epoch": 4222} {"train_loss": -26.089582443237305, "global_step": 350467, "epoch": 4222} {"train_loss": -26.221471786499023, "global_step": 350468, "epoch": 4222} {"train_loss": -26.442121505737305, "global_step": 350469, "epoch": 4222} {"train_loss": -26.329641342163086, "global_step": 350470, "epoch": 4222} {"train_loss": -26.189435958862305, "global_step": 350471, "epoch": 4222} {"train_loss": -26.54241943359375, "global_step": 350472, "epoch": 4222} {"train_loss": -26.3233585357666, "global_step": 350473, "epoch": 4222} {"train_loss": -26.455657958984375, "global_step": 350474, "epoch": 4222} {"train_loss": -26.013629913330078, "global_step": 350475, "epoch": 4222} {"train_loss": -26.269323348999023, "global_step": 350476, "epoch": 4222} {"train_loss": -26.302152633666992, "global_step": 350477, "epoch": 4222} {"train_loss": -26.277868270874023, "global_step": 350478, "epoch": 4222} {"train_loss": -26.205236434936523, "global_step": 350479, "epoch": 4222} {"train_loss": -26.379613876342773, "global_step": 350480, "epoch": 4222} {"train_loss": -26.3275089263916, "global_step": 350481, "epoch": 4222} {"train_loss": -26.23902702331543, "global_step": 350482, "epoch": 4222} {"train_loss": -26.462482452392578, "global_step": 350483, "epoch": 4222} {"train_loss": -26.53896141052246, "global_step": 350484, "epoch": 4222} {"train_loss": -26.097204208374023, "global_step": 350485, "epoch": 4222} {"train_loss": -26.36353874206543, "global_step": 350486, "epoch": 4222} {"train_loss": -26.089582443237305, "global_step": 350487, "epoch": 4222} {"train_loss": -26.165700912475586, "global_step": 350488, "epoch": 4222} {"train_loss": -26.595056533813477, "global_step": 350489, "epoch": 4222} {"train_loss": -26.785980224609375, "global_step": 350490, "epoch": 4222} {"train_loss": -26.126455307006836, "global_step": 350491, "epoch": 4222} {"train_loss": -26.352630615234375, "global_step": 350492, "epoch": 4222} {"train_loss": -26.22944450378418, "global_step": 350493, "epoch": 4222} {"train_loss": -26.063398361206055, "global_step": 350494, "epoch": 4222} {"train_loss": -26.542316436767578, "global_step": 350495, "epoch": 4222} {"train_loss": -26.677276611328125, "global_step": 350496, "epoch": 4222} {"train_loss": -26.398273468017578, "global_step": 350497, "epoch": 4222} {"train_loss": -26.340299606323242, "global_step": 350498, "epoch": 4222} {"train_loss": -26.136816024780273, "global_step": 350499, "epoch": 4222} {"train_loss": -26.565887451171875, "global_step": 350500, "epoch": 4222} {"train_loss": -26.49727439880371, "global_step": 350501, "epoch": 4222} {"train_loss": -26.153705596923828, "global_step": 350502, "epoch": 4222} {"train_loss": -26.21254539489746, "global_step": 350503, "epoch": 4222} {"train_loss": -26.162504196166992, "global_step": 350504, "epoch": 4222} {"train_loss": -26.03718376159668, "global_step": 350505, "epoch": 4222} {"train_loss": -26.158660888671875, "global_step": 350506, "epoch": 4222} {"train_loss": -26.156116485595703, "global_step": 350507, "epoch": 4222} {"train_loss": -25.894400033606104, "global_step": 350508, "epoch": 4222, "val_loss": 6645882.5} {"train_loss": -25.37129020690918, "global_step": 350509, "epoch": 4223} {"train_loss": -23.597702026367188, "global_step": 350510, "epoch": 4223} {"train_loss": -23.362592697143555, "global_step": 350511, "epoch": 4223} {"train_loss": -24.302824020385742, "global_step": 350512, "epoch": 4223} {"train_loss": -25.546005249023438, "global_step": 350513, "epoch": 4223} {"train_loss": -24.445947647094727, "global_step": 350514, "epoch": 4223} {"train_loss": -24.871002197265625, "global_step": 350515, "epoch": 4223} {"train_loss": -25.22379493713379, "global_step": 350516, "epoch": 4223} {"train_loss": -24.464874267578125, "global_step": 350517, "epoch": 4223} {"train_loss": -25.409080505371094, "global_step": 350518, "epoch": 4223} {"train_loss": -25.239267349243164, "global_step": 350519, "epoch": 4223} {"train_loss": -25.040618896484375, "global_step": 350520, "epoch": 4223} {"train_loss": -25.141462326049805, "global_step": 350521, "epoch": 4223} {"train_loss": -25.55667495727539, "global_step": 350522, "epoch": 4223} {"train_loss": -24.901762008666992, "global_step": 350523, "epoch": 4223} {"train_loss": -25.318588256835938, "global_step": 350524, "epoch": 4223} {"train_loss": -25.7554931640625, "global_step": 350525, "epoch": 4223} {"train_loss": -25.55198860168457, "global_step": 350526, "epoch": 4223} {"train_loss": -25.543079376220703, "global_step": 350527, "epoch": 4223} {"train_loss": -25.871850967407227, "global_step": 350528, "epoch": 4223} {"train_loss": -25.70221519470215, "global_step": 350529, "epoch": 4223} {"train_loss": -26.158578872680664, "global_step": 350530, "epoch": 4223} {"train_loss": -25.584508895874023, "global_step": 350531, "epoch": 4223} {"train_loss": -25.670392990112305, "global_step": 350532, "epoch": 4223} {"train_loss": -25.480300903320312, "global_step": 350533, "epoch": 4223} {"train_loss": -25.819334030151367, "global_step": 350534, "epoch": 4223} {"train_loss": -26.247900009155273, "global_step": 350535, "epoch": 4223} {"train_loss": -25.789697647094727, "global_step": 350536, "epoch": 4223} {"train_loss": -26.13632583618164, "global_step": 350537, "epoch": 4223} {"train_loss": -25.6549015045166, "global_step": 350538, "epoch": 4223} {"train_loss": -25.575138092041016, "global_step": 350539, "epoch": 4223} {"train_loss": -25.733081817626953, "global_step": 350540, "epoch": 4223} {"train_loss": -26.054859161376953, "global_step": 350541, "epoch": 4223} {"train_loss": -25.703689575195312, "global_step": 350542, "epoch": 4223} {"train_loss": -25.67108154296875, "global_step": 350543, "epoch": 4223} {"train_loss": -25.72659683227539, "global_step": 350544, "epoch": 4223} {"train_loss": -25.64780616760254, "global_step": 350545, "epoch": 4223} {"train_loss": -25.740650177001953, "global_step": 350546, "epoch": 4223} {"train_loss": -25.974945068359375, "global_step": 350547, "epoch": 4223} {"train_loss": -25.87025260925293, "global_step": 350548, "epoch": 4223} {"train_loss": -26.10269546508789, "global_step": 350549, "epoch": 4223} {"train_loss": -26.223968505859375, "global_step": 350550, "epoch": 4223} {"train_loss": -26.27833366394043, "global_step": 350551, "epoch": 4223} {"train_loss": -26.178022384643555, "global_step": 350552, "epoch": 4223} {"train_loss": -25.99734878540039, "global_step": 350553, "epoch": 4223} {"train_loss": -26.6519718170166, "global_step": 350554, "epoch": 4223} {"train_loss": -26.509714126586914, "global_step": 350555, "epoch": 4223} {"train_loss": -26.6122989654541, "global_step": 350556, "epoch": 4223} {"train_loss": -26.38262939453125, "global_step": 350557, "epoch": 4223} {"train_loss": -26.46878433227539, "global_step": 350558, "epoch": 4223} {"train_loss": -26.51307487487793, "global_step": 350559, "epoch": 4223} {"train_loss": -26.290451049804688, "global_step": 350560, "epoch": 4223} {"train_loss": -26.151844024658203, "global_step": 350561, "epoch": 4223} {"train_loss": -26.358362197875977, "global_step": 350562, "epoch": 4223} {"train_loss": -26.20615005493164, "global_step": 350563, "epoch": 4223} {"train_loss": -26.255481719970703, "global_step": 350564, "epoch": 4223} {"train_loss": -26.424097061157227, "global_step": 350565, "epoch": 4223} {"train_loss": -26.525543212890625, "global_step": 350566, "epoch": 4223} {"train_loss": -26.11927604675293, "global_step": 350567, "epoch": 4223} {"train_loss": -26.47760581970215, "global_step": 350568, "epoch": 4223} {"train_loss": -26.326440811157227, "global_step": 350569, "epoch": 4223} {"train_loss": -26.180078506469727, "global_step": 350570, "epoch": 4223} {"train_loss": -26.405475616455078, "global_step": 350571, "epoch": 4223} {"train_loss": -26.191497802734375, "global_step": 350572, "epoch": 4223} {"train_loss": -26.081695556640625, "global_step": 350573, "epoch": 4223} {"train_loss": -26.62101173400879, "global_step": 350574, "epoch": 4223} {"train_loss": -25.844562530517578, "global_step": 350575, "epoch": 4223} {"train_loss": -25.885040283203125, "global_step": 350576, "epoch": 4223} {"train_loss": -25.708240509033203, "global_step": 350577, "epoch": 4223} {"train_loss": -25.769433975219727, "global_step": 350578, "epoch": 4223} {"train_loss": -26.254255294799805, "global_step": 350579, "epoch": 4223} {"train_loss": -25.659061431884766, "global_step": 350580, "epoch": 4223} {"train_loss": -26.129865646362305, "global_step": 350581, "epoch": 4223} {"train_loss": -25.921436309814453, "global_step": 350582, "epoch": 4223} {"train_loss": -26.311288833618164, "global_step": 350583, "epoch": 4223} {"train_loss": -26.138019561767578, "global_step": 350584, "epoch": 4223} {"train_loss": -26.163557052612305, "global_step": 350585, "epoch": 4223} {"train_loss": -26.194732666015625, "global_step": 350586, "epoch": 4223} {"train_loss": -26.377161026000977, "global_step": 350587, "epoch": 4223} {"train_loss": -26.197986602783203, "global_step": 350588, "epoch": 4223} {"train_loss": -26.607929229736328, "global_step": 350589, "epoch": 4223} {"train_loss": -26.08750343322754, "global_step": 350590, "epoch": 4223} {"train_loss": -25.83445769620229, "global_step": 350591, "epoch": 4223, "val_loss": 6759279.0} {"train_loss": -26.011892318725586, "global_step": 350592, "epoch": 4224} {"train_loss": -26.182321548461914, "global_step": 350593, "epoch": 4224} {"train_loss": -25.878250122070312, "global_step": 350594, "epoch": 4224} {"train_loss": -25.98300552368164, "global_step": 350595, "epoch": 4224} {"train_loss": -25.902719497680664, "global_step": 350596, "epoch": 4224} {"train_loss": -25.53873062133789, "global_step": 350597, "epoch": 4224} {"train_loss": -25.54893684387207, "global_step": 350598, "epoch": 4224} {"train_loss": -25.81991958618164, "global_step": 350599, "epoch": 4224} {"train_loss": -26.235965728759766, "global_step": 350600, "epoch": 4224} {"train_loss": -25.705228805541992, "global_step": 350601, "epoch": 4224} {"train_loss": -25.81223487854004, "global_step": 350602, "epoch": 4224} {"train_loss": -25.899169921875, "global_step": 350603, "epoch": 4224} {"train_loss": -26.068883895874023, "global_step": 350604, "epoch": 4224} {"train_loss": -25.917524337768555, "global_step": 350605, "epoch": 4224} {"train_loss": -26.246490478515625, "global_step": 350606, "epoch": 4224} {"train_loss": -26.45548439025879, "global_step": 350607, "epoch": 4224} {"train_loss": -25.9913387298584, "global_step": 350608, "epoch": 4224} {"train_loss": -25.993885040283203, "global_step": 350609, "epoch": 4224} {"train_loss": -26.047346115112305, "global_step": 350610, "epoch": 4224} {"train_loss": -25.578550338745117, "global_step": 350611, "epoch": 4224} {"train_loss": -26.097949981689453, "global_step": 350612, "epoch": 4224} {"train_loss": -26.181257247924805, "global_step": 350613, "epoch": 4224} {"train_loss": -25.87164306640625, "global_step": 350614, "epoch": 4224} {"train_loss": -26.107223510742188, "global_step": 350615, "epoch": 4224} {"train_loss": -25.845563888549805, "global_step": 350616, "epoch": 4224} {"train_loss": -26.072494506835938, "global_step": 350617, "epoch": 4224} {"train_loss": -25.930484771728516, "global_step": 350618, "epoch": 4224} {"train_loss": -26.11191749572754, "global_step": 350619, "epoch": 4224} {"train_loss": -26.071317672729492, "global_step": 350620, "epoch": 4224} {"train_loss": -26.515369415283203, "global_step": 350621, "epoch": 4224} {"train_loss": -25.676237106323242, "global_step": 350622, "epoch": 4224} {"train_loss": -26.28218650817871, "global_step": 350623, "epoch": 4224} {"train_loss": -26.279958724975586, "global_step": 350624, "epoch": 4224} {"train_loss": -26.042409896850586, "global_step": 350625, "epoch": 4224} {"train_loss": -25.6876277923584, "global_step": 350626, "epoch": 4224} {"train_loss": -25.903532028198242, "global_step": 350627, "epoch": 4224} {"train_loss": -26.68658447265625, "global_step": 350628, "epoch": 4224} {"train_loss": -25.899097442626953, "global_step": 350629, "epoch": 4224} {"train_loss": -25.627490997314453, "global_step": 350630, "epoch": 4224} {"train_loss": -26.135547637939453, "global_step": 350631, "epoch": 4224} {"train_loss": -26.106168746948242, "global_step": 350632, "epoch": 4224} {"train_loss": -26.38173484802246, "global_step": 350633, "epoch": 4224} {"train_loss": -26.308507919311523, "global_step": 350634, "epoch": 4224} {"train_loss": -26.415191650390625, "global_step": 350635, "epoch": 4224} {"train_loss": -26.1812686920166, "global_step": 350636, "epoch": 4224} {"train_loss": -26.04755210876465, "global_step": 350637, "epoch": 4224} {"train_loss": -26.525196075439453, "global_step": 350638, "epoch": 4224} {"train_loss": -26.332677841186523, "global_step": 350639, "epoch": 4224} {"train_loss": -26.20331382751465, "global_step": 350640, "epoch": 4224} {"train_loss": -26.280298233032227, "global_step": 350641, "epoch": 4224} {"train_loss": -26.199804306030273, "global_step": 350642, "epoch": 4224} {"train_loss": -26.3118839263916, "global_step": 350643, "epoch": 4224} {"train_loss": -26.387317657470703, "global_step": 350644, "epoch": 4224} {"train_loss": -26.04829978942871, "global_step": 350645, "epoch": 4224} {"train_loss": -26.061115264892578, "global_step": 350646, "epoch": 4224} {"train_loss": -26.265417098999023, "global_step": 350647, "epoch": 4224} {"train_loss": -26.319915771484375, "global_step": 350648, "epoch": 4224} {"train_loss": -26.34720802307129, "global_step": 350649, "epoch": 4224} {"train_loss": -26.458044052124023, "global_step": 350650, "epoch": 4224} {"train_loss": -25.987329483032227, "global_step": 350651, "epoch": 4224} {"train_loss": -26.44736671447754, "global_step": 350652, "epoch": 4224} {"train_loss": -26.2813777923584, "global_step": 350653, "epoch": 4224} {"train_loss": -26.144821166992188, "global_step": 350654, "epoch": 4224} {"train_loss": -25.602659225463867, "global_step": 350655, "epoch": 4224} {"train_loss": -26.177413940429688, "global_step": 350656, "epoch": 4224} {"train_loss": -26.459918975830078, "global_step": 350657, "epoch": 4224} {"train_loss": -26.441944122314453, "global_step": 350658, "epoch": 4224} {"train_loss": -26.06402015686035, "global_step": 350659, "epoch": 4224} {"train_loss": -26.034042358398438, "global_step": 350660, "epoch": 4224} {"train_loss": -26.197851181030273, "global_step": 350661, "epoch": 4224} {"train_loss": -26.326492309570312, "global_step": 350662, "epoch": 4224} {"train_loss": -26.117258071899414, "global_step": 350663, "epoch": 4224} {"train_loss": -25.960485458374023, "global_step": 350664, "epoch": 4224} {"train_loss": -26.340978622436523, "global_step": 350665, "epoch": 4224} {"train_loss": -26.453344345092773, "global_step": 350666, "epoch": 4224} {"train_loss": -25.99833106994629, "global_step": 350667, "epoch": 4224} {"train_loss": -26.185407638549805, "global_step": 350668, "epoch": 4224} {"train_loss": -26.46649742126465, "global_step": 350669, "epoch": 4224} {"train_loss": -26.755908966064453, "global_step": 350670, "epoch": 4224} {"train_loss": -26.27618408203125, "global_step": 350671, "epoch": 4224} {"train_loss": -26.45149040222168, "global_step": 350672, "epoch": 4224} {"train_loss": -26.266767501831055, "global_step": 350673, "epoch": 4224} {"train_loss": -26.124303564967878, "global_step": 350674, "epoch": 4224, "val_loss": 6760017.0} {"train_loss": -25.02236557006836, "global_step": 350675, "epoch": 4225} {"train_loss": -25.319229125976562, "global_step": 350676, "epoch": 4225} {"train_loss": -25.36404037475586, "global_step": 350677, "epoch": 4225} {"train_loss": -25.041473388671875, "global_step": 350678, "epoch": 4225} {"train_loss": -25.958484649658203, "global_step": 350679, "epoch": 4225} {"train_loss": -25.449443817138672, "global_step": 350680, "epoch": 4225} {"train_loss": -25.46918296813965, "global_step": 350681, "epoch": 4225} {"train_loss": -25.078046798706055, "global_step": 350682, "epoch": 4225} {"train_loss": -25.200531005859375, "global_step": 350683, "epoch": 4225} {"train_loss": -25.6357479095459, "global_step": 350684, "epoch": 4225} {"train_loss": -25.575428009033203, "global_step": 350685, "epoch": 4225} {"train_loss": -25.473403930664062, "global_step": 350686, "epoch": 4225} {"train_loss": -24.86823081970215, "global_step": 350687, "epoch": 4225} {"train_loss": -25.37173843383789, "global_step": 350688, "epoch": 4225} {"train_loss": -25.617919921875, "global_step": 350689, "epoch": 4225} {"train_loss": -25.373855590820312, "global_step": 350690, "epoch": 4225} {"train_loss": -25.616790771484375, "global_step": 350691, "epoch": 4225} {"train_loss": -25.14279556274414, "global_step": 350692, "epoch": 4225} {"train_loss": -25.200946807861328, "global_step": 350693, "epoch": 4225} {"train_loss": -25.552724838256836, "global_step": 350694, "epoch": 4225} {"train_loss": -25.76949119567871, "global_step": 350695, "epoch": 4225} {"train_loss": -25.841495513916016, "global_step": 350696, "epoch": 4225} {"train_loss": -25.619964599609375, "global_step": 350697, "epoch": 4225} {"train_loss": -25.61285972595215, "global_step": 350698, "epoch": 4225} {"train_loss": -25.789493560791016, "global_step": 350699, "epoch": 4225} {"train_loss": -26.070947647094727, "global_step": 350700, "epoch": 4225} {"train_loss": -26.315113067626953, "global_step": 350701, "epoch": 4225} {"train_loss": -25.92254638671875, "global_step": 350702, "epoch": 4225} {"train_loss": -25.901519775390625, "global_step": 350703, "epoch": 4225} {"train_loss": -26.280561447143555, "global_step": 350704, "epoch": 4225} {"train_loss": -26.24421501159668, "global_step": 350705, "epoch": 4225} {"train_loss": -26.01413917541504, "global_step": 350706, "epoch": 4225} {"train_loss": -26.168121337890625, "global_step": 350707, "epoch": 4225} {"train_loss": -25.97671890258789, "global_step": 350708, "epoch": 4225} {"train_loss": -26.154560089111328, "global_step": 350709, "epoch": 4225} {"train_loss": -26.3131160736084, "global_step": 350710, "epoch": 4225} {"train_loss": -25.99688148498535, "global_step": 350711, "epoch": 4225} {"train_loss": -26.138843536376953, "global_step": 350712, "epoch": 4225} {"train_loss": -26.215356826782227, "global_step": 350713, "epoch": 4225} {"train_loss": -26.189453125, "global_step": 350714, "epoch": 4225} {"train_loss": -26.251285552978516, "global_step": 350715, "epoch": 4225} {"train_loss": -26.119171142578125, "global_step": 350716, "epoch": 4225} {"train_loss": -26.071882247924805, "global_step": 350717, "epoch": 4225} {"train_loss": -26.204910278320312, "global_step": 350718, "epoch": 4225} {"train_loss": -26.26969337463379, "global_step": 350719, "epoch": 4225} {"train_loss": -26.208209991455078, "global_step": 350720, "epoch": 4225} {"train_loss": -26.265050888061523, "global_step": 350721, "epoch": 4225} {"train_loss": -26.48921012878418, "global_step": 350722, "epoch": 4225} {"train_loss": -26.13498878479004, "global_step": 350723, "epoch": 4225} {"train_loss": -26.228668212890625, "global_step": 350724, "epoch": 4225} {"train_loss": -26.298297882080078, "global_step": 350725, "epoch": 4225} {"train_loss": -25.914392471313477, "global_step": 350726, "epoch": 4225} {"train_loss": -26.289627075195312, "global_step": 350727, "epoch": 4225} {"train_loss": -26.516225814819336, "global_step": 350728, "epoch": 4225} {"train_loss": -26.687341690063477, "global_step": 350729, "epoch": 4225} {"train_loss": -26.2440128326416, "global_step": 350730, "epoch": 4225} {"train_loss": -26.849225997924805, "global_step": 350731, "epoch": 4225} {"train_loss": -26.208154678344727, "global_step": 350732, "epoch": 4225} {"train_loss": -25.87384605407715, "global_step": 350733, "epoch": 4225} {"train_loss": -26.215164184570312, "global_step": 350734, "epoch": 4225} {"train_loss": -26.350173950195312, "global_step": 350735, "epoch": 4225} {"train_loss": -26.211750030517578, "global_step": 350736, "epoch": 4225} {"train_loss": -26.168720245361328, "global_step": 350737, "epoch": 4225} {"train_loss": -26.291568756103516, "global_step": 350738, "epoch": 4225} {"train_loss": -26.226215362548828, "global_step": 350739, "epoch": 4225} {"train_loss": -26.45806312561035, "global_step": 350740, "epoch": 4225} {"train_loss": -25.913043975830078, "global_step": 350741, "epoch": 4225} {"train_loss": -25.559419631958008, "global_step": 350742, "epoch": 4225} {"train_loss": -26.5837459564209, "global_step": 350743, "epoch": 4225} {"train_loss": -25.527257919311523, "global_step": 350744, "epoch": 4225} {"train_loss": -26.04804801940918, "global_step": 350745, "epoch": 4225} {"train_loss": -25.901336669921875, "global_step": 350746, "epoch": 4225} {"train_loss": -25.68471336364746, "global_step": 350747, "epoch": 4225} {"train_loss": -25.61476707458496, "global_step": 350748, "epoch": 4225} {"train_loss": -25.704824447631836, "global_step": 350749, "epoch": 4225} {"train_loss": -25.874786376953125, "global_step": 350750, "epoch": 4225} {"train_loss": -25.9770450592041, "global_step": 350751, "epoch": 4225} {"train_loss": -25.362520217895508, "global_step": 350752, "epoch": 4225} {"train_loss": -26.1271915435791, "global_step": 350753, "epoch": 4225} {"train_loss": -25.659107208251953, "global_step": 350754, "epoch": 4225} {"train_loss": -26.243844985961914, "global_step": 350755, "epoch": 4225} {"train_loss": -25.809894561767578, "global_step": 350756, "epoch": 4225} {"train_loss": -25.912383412740315, "global_step": 350757, "epoch": 4225, "val_loss": 6671810.0} {"train_loss": -25.89717674255371, "global_step": 350758, "epoch": 4226} {"train_loss": -25.633056640625, "global_step": 350759, "epoch": 4226} {"train_loss": -25.810016632080078, "global_step": 350760, "epoch": 4226} {"train_loss": -25.3710994720459, "global_step": 350761, "epoch": 4226} {"train_loss": -25.489028930664062, "global_step": 350762, "epoch": 4226} {"train_loss": -24.58747100830078, "global_step": 350763, "epoch": 4226} {"train_loss": -24.99024772644043, "global_step": 350764, "epoch": 4226} {"train_loss": -25.849964141845703, "global_step": 350765, "epoch": 4226} {"train_loss": -25.409955978393555, "global_step": 350766, "epoch": 4226} {"train_loss": -25.77378273010254, "global_step": 350767, "epoch": 4226} {"train_loss": -25.096939086914062, "global_step": 350768, "epoch": 4226} {"train_loss": -25.56966209411621, "global_step": 350769, "epoch": 4226} {"train_loss": -25.825698852539062, "global_step": 350770, "epoch": 4226} {"train_loss": -25.584278106689453, "global_step": 350771, "epoch": 4226} {"train_loss": -25.987375259399414, "global_step": 350772, "epoch": 4226} {"train_loss": -25.676986694335938, "global_step": 350773, "epoch": 4226} {"train_loss": -26.16303825378418, "global_step": 350774, "epoch": 4226} {"train_loss": -25.82681655883789, "global_step": 350775, "epoch": 4226} {"train_loss": -26.156782150268555, "global_step": 350776, "epoch": 4226} {"train_loss": -25.8712215423584, "global_step": 350777, "epoch": 4226} {"train_loss": -26.287006378173828, "global_step": 350778, "epoch": 4226} {"train_loss": -25.903034210205078, "global_step": 350779, "epoch": 4226} {"train_loss": -26.1347713470459, "global_step": 350780, "epoch": 4226} {"train_loss": -26.1426944732666, "global_step": 350781, "epoch": 4226} {"train_loss": -26.3872127532959, "global_step": 350782, "epoch": 4226} {"train_loss": -26.15570640563965, "global_step": 350783, "epoch": 4226} {"train_loss": -26.43914222717285, "global_step": 350784, "epoch": 4226} {"train_loss": -26.7711238861084, "global_step": 350785, "epoch": 4226} {"train_loss": -25.93471336364746, "global_step": 350786, "epoch": 4226} {"train_loss": -26.227426528930664, "global_step": 350787, "epoch": 4226} {"train_loss": -26.478168487548828, "global_step": 350788, "epoch": 4226} {"train_loss": -26.136062622070312, "global_step": 350789, "epoch": 4226} {"train_loss": -26.703672409057617, "global_step": 350790, "epoch": 4226} {"train_loss": -25.8572940826416, "global_step": 350791, "epoch": 4226} {"train_loss": -26.3432674407959, "global_step": 350792, "epoch": 4226} {"train_loss": -26.285846710205078, "global_step": 350793, "epoch": 4226} {"train_loss": -26.285873413085938, "global_step": 350794, "epoch": 4226} {"train_loss": -26.447467803955078, "global_step": 350795, "epoch": 4226} {"train_loss": -26.068639755249023, "global_step": 350796, "epoch": 4226} {"train_loss": -26.049875259399414, "global_step": 350797, "epoch": 4226} {"train_loss": -26.06702995300293, "global_step": 350798, "epoch": 4226} {"train_loss": -26.173233032226562, "global_step": 350799, "epoch": 4226} {"train_loss": -25.904874801635742, "global_step": 350800, "epoch": 4226} {"train_loss": -26.52632713317871, "global_step": 350801, "epoch": 4226} {"train_loss": -26.0095272064209, "global_step": 350802, "epoch": 4226} {"train_loss": -26.382186889648438, "global_step": 350803, "epoch": 4226} {"train_loss": -26.158649444580078, "global_step": 350804, "epoch": 4226} {"train_loss": -26.19407081604004, "global_step": 350805, "epoch": 4226} {"train_loss": -26.080427169799805, "global_step": 350806, "epoch": 4226} {"train_loss": -26.298309326171875, "global_step": 350807, "epoch": 4226} {"train_loss": -26.41042137145996, "global_step": 350808, "epoch": 4226} {"train_loss": -26.29090690612793, "global_step": 350809, "epoch": 4226} {"train_loss": -26.688379287719727, "global_step": 350810, "epoch": 4226} {"train_loss": -26.077741622924805, "global_step": 350811, "epoch": 4226} {"train_loss": -26.45221519470215, "global_step": 350812, "epoch": 4226} {"train_loss": -26.362268447875977, "global_step": 350813, "epoch": 4226} {"train_loss": -26.460081100463867, "global_step": 350814, "epoch": 4226} {"train_loss": -26.359460830688477, "global_step": 350815, "epoch": 4226} {"train_loss": -26.5166072845459, "global_step": 350816, "epoch": 4226} {"train_loss": -26.3796329498291, "global_step": 350817, "epoch": 4226} {"train_loss": -26.4190673828125, "global_step": 350818, "epoch": 4226} {"train_loss": -25.861547470092773, "global_step": 350819, "epoch": 4226} {"train_loss": -26.319814682006836, "global_step": 350820, "epoch": 4226} {"train_loss": -26.16267204284668, "global_step": 350821, "epoch": 4226} {"train_loss": -26.225072860717773, "global_step": 350822, "epoch": 4226} {"train_loss": -26.194189071655273, "global_step": 350823, "epoch": 4226} {"train_loss": -26.30606460571289, "global_step": 350824, "epoch": 4226} {"train_loss": -26.482641220092773, "global_step": 350825, "epoch": 4226} {"train_loss": -25.77021598815918, "global_step": 350826, "epoch": 4226} {"train_loss": -26.15127944946289, "global_step": 350827, "epoch": 4226} {"train_loss": -25.9776554107666, "global_step": 350828, "epoch": 4226} {"train_loss": -26.10784339904785, "global_step": 350829, "epoch": 4226} {"train_loss": -26.190229415893555, "global_step": 350830, "epoch": 4226} {"train_loss": -26.276111602783203, "global_step": 350831, "epoch": 4226} {"train_loss": -26.079694747924805, "global_step": 350832, "epoch": 4226} {"train_loss": -26.004026412963867, "global_step": 350833, "epoch": 4226} {"train_loss": -26.574005126953125, "global_step": 350834, "epoch": 4226} {"train_loss": -26.020044326782227, "global_step": 350835, "epoch": 4226} {"train_loss": -26.152307510375977, "global_step": 350836, "epoch": 4226} {"train_loss": -25.969409942626953, "global_step": 350837, "epoch": 4226} {"train_loss": -26.099720001220703, "global_step": 350838, "epoch": 4226} {"train_loss": -26.099151611328125, "global_step": 350839, "epoch": 4226} {"train_loss": -26.070456539291932, "global_step": 350840, "epoch": 4226, "val_loss": 6648230.0} {"train_loss": -25.142780303955078, "global_step": 350841, "epoch": 4227} {"train_loss": -25.753543853759766, "global_step": 350842, "epoch": 4227} {"train_loss": -25.159399032592773, "global_step": 350843, "epoch": 4227} {"train_loss": -25.98769187927246, "global_step": 350844, "epoch": 4227} {"train_loss": -25.148984909057617, "global_step": 350845, "epoch": 4227} {"train_loss": -25.705718994140625, "global_step": 350846, "epoch": 4227} {"train_loss": -25.547616958618164, "global_step": 350847, "epoch": 4227} {"train_loss": -25.755207061767578, "global_step": 350848, "epoch": 4227} {"train_loss": -25.760196685791016, "global_step": 350849, "epoch": 4227} {"train_loss": -26.02984046936035, "global_step": 350850, "epoch": 4227} {"train_loss": -26.08327293395996, "global_step": 350851, "epoch": 4227} {"train_loss": -26.06437110900879, "global_step": 350852, "epoch": 4227} {"train_loss": -25.773908615112305, "global_step": 350853, "epoch": 4227} {"train_loss": -25.824995040893555, "global_step": 350854, "epoch": 4227} {"train_loss": -26.2612247467041, "global_step": 350855, "epoch": 4227} {"train_loss": -25.975910186767578, "global_step": 350856, "epoch": 4227} {"train_loss": -26.025354385375977, "global_step": 350857, "epoch": 4227} {"train_loss": -26.301300048828125, "global_step": 350858, "epoch": 4227} {"train_loss": -26.112668991088867, "global_step": 350859, "epoch": 4227} {"train_loss": -26.007410049438477, "global_step": 350860, "epoch": 4227} {"train_loss": -26.091064453125, "global_step": 350861, "epoch": 4227} {"train_loss": -26.101831436157227, "global_step": 350862, "epoch": 4227} {"train_loss": -25.930810928344727, "global_step": 350863, "epoch": 4227} {"train_loss": -25.976318359375, "global_step": 350864, "epoch": 4227} {"train_loss": -25.7335205078125, "global_step": 350865, "epoch": 4227} {"train_loss": -26.17989158630371, "global_step": 350866, "epoch": 4227} {"train_loss": -26.08576774597168, "global_step": 350867, "epoch": 4227} {"train_loss": -26.38020133972168, "global_step": 350868, "epoch": 4227} {"train_loss": -26.549341201782227, "global_step": 350869, "epoch": 4227} {"train_loss": -26.023029327392578, "global_step": 350870, "epoch": 4227} {"train_loss": -26.457075119018555, "global_step": 350871, "epoch": 4227} {"train_loss": -26.25628662109375, "global_step": 350872, "epoch": 4227} {"train_loss": -26.27863121032715, "global_step": 350873, "epoch": 4227} {"train_loss": -26.02155876159668, "global_step": 350874, "epoch": 4227} {"train_loss": -26.225671768188477, "global_step": 350875, "epoch": 4227} {"train_loss": -26.383554458618164, "global_step": 350876, "epoch": 4227} {"train_loss": -26.238239288330078, "global_step": 350877, "epoch": 4227} {"train_loss": -26.419626235961914, "global_step": 350878, "epoch": 4227} {"train_loss": -26.318195343017578, "global_step": 350879, "epoch": 4227} {"train_loss": -26.14131736755371, "global_step": 350880, "epoch": 4227} {"train_loss": -26.376129150390625, "global_step": 350881, "epoch": 4227} {"train_loss": -26.509429931640625, "global_step": 350882, "epoch": 4227} {"train_loss": -26.133153915405273, "global_step": 350883, "epoch": 4227} {"train_loss": -25.898883819580078, "global_step": 350884, "epoch": 4227} {"train_loss": -26.078641891479492, "global_step": 350885, "epoch": 4227} {"train_loss": -25.769750595092773, "global_step": 350886, "epoch": 4227} {"train_loss": -26.028091430664062, "global_step": 350887, "epoch": 4227} {"train_loss": -26.595029830932617, "global_step": 350888, "epoch": 4227} {"train_loss": -26.12774085998535, "global_step": 350889, "epoch": 4227} {"train_loss": -25.625391006469727, "global_step": 350890, "epoch": 4227} {"train_loss": -26.471790313720703, "global_step": 350891, "epoch": 4227} {"train_loss": -25.958526611328125, "global_step": 350892, "epoch": 4227} {"train_loss": -25.739059448242188, "global_step": 350893, "epoch": 4227} {"train_loss": -25.95282554626465, "global_step": 350894, "epoch": 4227} {"train_loss": -26.1574764251709, "global_step": 350895, "epoch": 4227} {"train_loss": -25.98768424987793, "global_step": 350896, "epoch": 4227} {"train_loss": -26.16436767578125, "global_step": 350897, "epoch": 4227} {"train_loss": -26.0218448638916, "global_step": 350898, "epoch": 4227} {"train_loss": -25.769968032836914, "global_step": 350899, "epoch": 4227} {"train_loss": -26.15390396118164, "global_step": 350900, "epoch": 4227} {"train_loss": -25.750619888305664, "global_step": 350901, "epoch": 4227} {"train_loss": -26.263641357421875, "global_step": 350902, "epoch": 4227} {"train_loss": -25.891931533813477, "global_step": 350903, "epoch": 4227} {"train_loss": -26.053730010986328, "global_step": 350904, "epoch": 4227} {"train_loss": -25.94392204284668, "global_step": 350905, "epoch": 4227} {"train_loss": -26.134435653686523, "global_step": 350906, "epoch": 4227} {"train_loss": -25.696857452392578, "global_step": 350907, "epoch": 4227} {"train_loss": -25.870819091796875, "global_step": 350908, "epoch": 4227} {"train_loss": -25.630544662475586, "global_step": 350909, "epoch": 4227} {"train_loss": -26.075002670288086, "global_step": 350910, "epoch": 4227} {"train_loss": -26.262348175048828, "global_step": 350911, "epoch": 4227} {"train_loss": -26.078229904174805, "global_step": 350912, "epoch": 4227} {"train_loss": -25.787601470947266, "global_step": 350913, "epoch": 4227} {"train_loss": -25.866748809814453, "global_step": 350914, "epoch": 4227} {"train_loss": -25.9157772064209, "global_step": 350915, "epoch": 4227} {"train_loss": -26.40693473815918, "global_step": 350916, "epoch": 4227} {"train_loss": -26.103260040283203, "global_step": 350917, "epoch": 4227} {"train_loss": -26.1983699798584, "global_step": 350918, "epoch": 4227} {"train_loss": -25.935535430908203, "global_step": 350919, "epoch": 4227} {"train_loss": -26.507516860961914, "global_step": 350920, "epoch": 4227} {"train_loss": -25.933429718017578, "global_step": 350921, "epoch": 4227} {"train_loss": -26.22364616394043, "global_step": 350922, "epoch": 4227} {"train_loss": -26.032050259142036, "global_step": 350923, "epoch": 4227, "val_loss": 6686707.0} {"train_loss": -25.95371437072754, "global_step": 350924, "epoch": 4228} {"train_loss": -26.083311080932617, "global_step": 350925, "epoch": 4228} {"train_loss": -26.35894203186035, "global_step": 350926, "epoch": 4228} {"train_loss": -26.155725479125977, "global_step": 350927, "epoch": 4228} {"train_loss": -26.003698348999023, "global_step": 350928, "epoch": 4228} {"train_loss": -26.056171417236328, "global_step": 350929, "epoch": 4228} {"train_loss": -25.7255859375, "global_step": 350930, "epoch": 4228} {"train_loss": -26.133596420288086, "global_step": 350931, "epoch": 4228} {"train_loss": -26.0340576171875, "global_step": 350932, "epoch": 4228} {"train_loss": -25.72200584411621, "global_step": 350933, "epoch": 4228} {"train_loss": -26.2634220123291, "global_step": 350934, "epoch": 4228} {"train_loss": -26.014570236206055, "global_step": 350935, "epoch": 4228} {"train_loss": -26.164377212524414, "global_step": 350936, "epoch": 4228} {"train_loss": -25.587682723999023, "global_step": 350937, "epoch": 4228} {"train_loss": -26.564044952392578, "global_step": 350938, "epoch": 4228} {"train_loss": -26.117938995361328, "global_step": 350939, "epoch": 4228} {"train_loss": -25.9808406829834, "global_step": 350940, "epoch": 4228} {"train_loss": -25.829532623291016, "global_step": 350941, "epoch": 4228} {"train_loss": -26.336746215820312, "global_step": 350942, "epoch": 4228} {"train_loss": -25.946924209594727, "global_step": 350943, "epoch": 4228} {"train_loss": -25.936960220336914, "global_step": 350944, "epoch": 4228} {"train_loss": -25.892230987548828, "global_step": 350945, "epoch": 4228} {"train_loss": -26.10560417175293, "global_step": 350946, "epoch": 4228} {"train_loss": -25.808984756469727, "global_step": 350947, "epoch": 4228} {"train_loss": -26.11545753479004, "global_step": 350948, "epoch": 4228} {"train_loss": -26.518268585205078, "global_step": 350949, "epoch": 4228} {"train_loss": -26.138004302978516, "global_step": 350950, "epoch": 4228} {"train_loss": -26.188451766967773, "global_step": 350951, "epoch": 4228} {"train_loss": -26.047927856445312, "global_step": 350952, "epoch": 4228} {"train_loss": -26.35575294494629, "global_step": 350953, "epoch": 4228} {"train_loss": -25.89082145690918, "global_step": 350954, "epoch": 4228} {"train_loss": -26.2869815826416, "global_step": 350955, "epoch": 4228} {"train_loss": -26.522449493408203, "global_step": 350956, "epoch": 4228} {"train_loss": -26.606430053710938, "global_step": 350957, "epoch": 4228} {"train_loss": -26.442121505737305, "global_step": 350958, "epoch": 4228} {"train_loss": -26.23206901550293, "global_step": 350959, "epoch": 4228} {"train_loss": -26.270421981811523, "global_step": 350960, "epoch": 4228} {"train_loss": -26.036283493041992, "global_step": 350961, "epoch": 4228} {"train_loss": -25.966339111328125, "global_step": 350962, "epoch": 4228} {"train_loss": -26.0772647857666, "global_step": 350963, "epoch": 4228} {"train_loss": -26.122983932495117, "global_step": 350964, "epoch": 4228} {"train_loss": -26.25575065612793, "global_step": 350965, "epoch": 4228} {"train_loss": -26.13396644592285, "global_step": 350966, "epoch": 4228} {"train_loss": -26.423267364501953, "global_step": 350967, "epoch": 4228} {"train_loss": -26.174762725830078, "global_step": 350968, "epoch": 4228} {"train_loss": -26.162622451782227, "global_step": 350969, "epoch": 4228} {"train_loss": -26.397476196289062, "global_step": 350970, "epoch": 4228} {"train_loss": -26.475387573242188, "global_step": 350971, "epoch": 4228} {"train_loss": -26.401823043823242, "global_step": 350972, "epoch": 4228} {"train_loss": -26.33546257019043, "global_step": 350973, "epoch": 4228} {"train_loss": -26.218597412109375, "global_step": 350974, "epoch": 4228} {"train_loss": -26.344776153564453, "global_step": 350975, "epoch": 4228} {"train_loss": -26.381872177124023, "global_step": 350976, "epoch": 4228} {"train_loss": -26.485010147094727, "global_step": 350977, "epoch": 4228} {"train_loss": -26.382858276367188, "global_step": 350978, "epoch": 4228} {"train_loss": -26.4451904296875, "global_step": 350979, "epoch": 4228} {"train_loss": -25.932287216186523, "global_step": 350980, "epoch": 4228} {"train_loss": -26.346561431884766, "global_step": 350981, "epoch": 4228} {"train_loss": -26.097639083862305, "global_step": 350982, "epoch": 4228} {"train_loss": -26.099653244018555, "global_step": 350983, "epoch": 4228} {"train_loss": -26.083154678344727, "global_step": 350984, "epoch": 4228} {"train_loss": -26.381275177001953, "global_step": 350985, "epoch": 4228} {"train_loss": -26.796783447265625, "global_step": 350986, "epoch": 4228} {"train_loss": -26.443323135375977, "global_step": 350987, "epoch": 4228} {"train_loss": -25.79892921447754, "global_step": 350988, "epoch": 4228} {"train_loss": -26.323383331298828, "global_step": 350989, "epoch": 4228} {"train_loss": -26.250104904174805, "global_step": 350990, "epoch": 4228} {"train_loss": -26.34637451171875, "global_step": 350991, "epoch": 4228} {"train_loss": -26.026708602905273, "global_step": 350992, "epoch": 4228} {"train_loss": -26.133798599243164, "global_step": 350993, "epoch": 4228} {"train_loss": -26.1385555267334, "global_step": 350994, "epoch": 4228} {"train_loss": -26.233963012695312, "global_step": 350995, "epoch": 4228} {"train_loss": -26.194751739501953, "global_step": 350996, "epoch": 4228} {"train_loss": -25.975133895874023, "global_step": 350997, "epoch": 4228} {"train_loss": -26.184537887573242, "global_step": 350998, "epoch": 4228} {"train_loss": -26.10190200805664, "global_step": 350999, "epoch": 4228} {"train_loss": -26.129714965820312, "global_step": 351000, "epoch": 4228} {"train_loss": -25.985370635986328, "global_step": 351001, "epoch": 4228} {"train_loss": -26.40583610534668, "global_step": 351002, "epoch": 4228} {"train_loss": -25.962421417236328, "global_step": 351003, "epoch": 4228} {"train_loss": -26.077844619750977, "global_step": 351004, "epoch": 4228} {"train_loss": -26.446491241455078, "global_step": 351005, "epoch": 4228} {"train_loss": -26.17549590604851, "global_step": 351006, "epoch": 4228, "val_loss": 6688670.0} {"train_loss": -26.066055297851562, "global_step": 351007, "epoch": 4229} {"train_loss": -25.430130004882812, "global_step": 351008, "epoch": 4229} {"train_loss": -25.689849853515625, "global_step": 351009, "epoch": 4229} {"train_loss": -25.531652450561523, "global_step": 351010, "epoch": 4229} {"train_loss": -25.953388214111328, "global_step": 351011, "epoch": 4229} {"train_loss": -25.979703903198242, "global_step": 351012, "epoch": 4229} {"train_loss": -25.486679077148438, "global_step": 351013, "epoch": 4229} {"train_loss": -25.57343864440918, "global_step": 351014, "epoch": 4229} {"train_loss": -25.657514572143555, "global_step": 351015, "epoch": 4229} {"train_loss": -25.387935638427734, "global_step": 351016, "epoch": 4229} {"train_loss": -26.0998592376709, "global_step": 351017, "epoch": 4229} {"train_loss": -25.7755184173584, "global_step": 351018, "epoch": 4229} {"train_loss": -25.75058364868164, "global_step": 351019, "epoch": 4229} {"train_loss": -25.616241455078125, "global_step": 351020, "epoch": 4229} {"train_loss": -25.854089736938477, "global_step": 351021, "epoch": 4229} {"train_loss": -25.93271827697754, "global_step": 351022, "epoch": 4229} {"train_loss": -25.847457885742188, "global_step": 351023, "epoch": 4229} {"train_loss": -26.049978256225586, "global_step": 351024, "epoch": 4229} {"train_loss": -25.797195434570312, "global_step": 351025, "epoch": 4229} {"train_loss": -25.674850463867188, "global_step": 351026, "epoch": 4229} {"train_loss": -26.099164962768555, "global_step": 351027, "epoch": 4229} {"train_loss": -26.149023056030273, "global_step": 351028, "epoch": 4229} {"train_loss": -26.0429630279541, "global_step": 351029, "epoch": 4229} {"train_loss": -26.08759117126465, "global_step": 351030, "epoch": 4229} {"train_loss": -26.21161460876465, "global_step": 351031, "epoch": 4229} {"train_loss": -25.84372901916504, "global_step": 351032, "epoch": 4229} {"train_loss": -26.295103073120117, "global_step": 351033, "epoch": 4229} {"train_loss": -26.048782348632812, "global_step": 351034, "epoch": 4229} {"train_loss": -25.936487197875977, "global_step": 351035, "epoch": 4229} {"train_loss": -26.28687858581543, "global_step": 351036, "epoch": 4229} {"train_loss": -26.337207794189453, "global_step": 351037, "epoch": 4229} {"train_loss": -26.449010848999023, "global_step": 351038, "epoch": 4229} {"train_loss": -26.322980880737305, "global_step": 351039, "epoch": 4229} {"train_loss": -26.237659454345703, "global_step": 351040, "epoch": 4229} {"train_loss": -26.141759872436523, "global_step": 351041, "epoch": 4229} {"train_loss": -26.33649253845215, "global_step": 351042, "epoch": 4229} {"train_loss": -26.445363998413086, "global_step": 351043, "epoch": 4229} {"train_loss": -26.628692626953125, "global_step": 351044, "epoch": 4229} {"train_loss": -26.2157039642334, "global_step": 351045, "epoch": 4229} {"train_loss": -26.395837783813477, "global_step": 351046, "epoch": 4229} {"train_loss": -26.581817626953125, "global_step": 351047, "epoch": 4229} {"train_loss": -26.305419921875, "global_step": 351048, "epoch": 4229} {"train_loss": -26.2269229888916, "global_step": 351049, "epoch": 4229} {"train_loss": -26.18694496154785, "global_step": 351050, "epoch": 4229} {"train_loss": -26.01209831237793, "global_step": 351051, "epoch": 4229} {"train_loss": -26.6422176361084, "global_step": 351052, "epoch": 4229} {"train_loss": -26.13136100769043, "global_step": 351053, "epoch": 4229} {"train_loss": -26.306333541870117, "global_step": 351054, "epoch": 4229} {"train_loss": -26.354400634765625, "global_step": 351055, "epoch": 4229} {"train_loss": -26.34016227722168, "global_step": 351056, "epoch": 4229} {"train_loss": -26.502485275268555, "global_step": 351057, "epoch": 4229} {"train_loss": -26.121450424194336, "global_step": 351058, "epoch": 4229} {"train_loss": -25.798358917236328, "global_step": 351059, "epoch": 4229} {"train_loss": -25.7557430267334, "global_step": 351060, "epoch": 4229} {"train_loss": -25.968780517578125, "global_step": 351061, "epoch": 4229} {"train_loss": -26.16143798828125, "global_step": 351062, "epoch": 4229} {"train_loss": -26.0010986328125, "global_step": 351063, "epoch": 4229} {"train_loss": -25.99319839477539, "global_step": 351064, "epoch": 4229} {"train_loss": -26.268157958984375, "global_step": 351065, "epoch": 4229} {"train_loss": -25.636463165283203, "global_step": 351066, "epoch": 4229} {"train_loss": -25.41267967224121, "global_step": 351067, "epoch": 4229} {"train_loss": -25.630395889282227, "global_step": 351068, "epoch": 4229} {"train_loss": -25.5377140045166, "global_step": 351069, "epoch": 4229} {"train_loss": -26.436511993408203, "global_step": 351070, "epoch": 4229} {"train_loss": -25.827070236206055, "global_step": 351071, "epoch": 4229} {"train_loss": -25.73390007019043, "global_step": 351072, "epoch": 4229} {"train_loss": -25.713315963745117, "global_step": 351073, "epoch": 4229} {"train_loss": -25.764272689819336, "global_step": 351074, "epoch": 4229} {"train_loss": -25.895465850830078, "global_step": 351075, "epoch": 4229} {"train_loss": -26.022565841674805, "global_step": 351076, "epoch": 4229} {"train_loss": -26.053207397460938, "global_step": 351077, "epoch": 4229} {"train_loss": -25.866241455078125, "global_step": 351078, "epoch": 4229} {"train_loss": -25.697851181030273, "global_step": 351079, "epoch": 4229} {"train_loss": -25.981473922729492, "global_step": 351080, "epoch": 4229} {"train_loss": -25.91171646118164, "global_step": 351081, "epoch": 4229} {"train_loss": -26.075342178344727, "global_step": 351082, "epoch": 4229} {"train_loss": -26.30609703063965, "global_step": 351083, "epoch": 4229} {"train_loss": -26.303991317749023, "global_step": 351084, "epoch": 4229} {"train_loss": -25.919885635375977, "global_step": 351085, "epoch": 4229} {"train_loss": -26.192609786987305, "global_step": 351086, "epoch": 4229} {"train_loss": -26.0972957611084, "global_step": 351087, "epoch": 4229} {"train_loss": -26.046091079711914, "global_step": 351088, "epoch": 4229} {"train_loss": -26.02082668442324, "global_step": 351089, "epoch": 4229, "val_loss": 6739955.0} {"train_loss": -25.63356590270996, "global_step": 351090, "epoch": 4230} {"train_loss": -25.930545806884766, "global_step": 351091, "epoch": 4230} {"train_loss": -25.7474365234375, "global_step": 351092, "epoch": 4230} {"train_loss": -26.111331939697266, "global_step": 351093, "epoch": 4230} {"train_loss": -26.049291610717773, "global_step": 351094, "epoch": 4230} {"train_loss": -25.745264053344727, "global_step": 351095, "epoch": 4230} {"train_loss": -26.25048828125, "global_step": 351096, "epoch": 4230} {"train_loss": -25.977783203125, "global_step": 351097, "epoch": 4230} {"train_loss": -25.823226928710938, "global_step": 351098, "epoch": 4230} {"train_loss": -26.044540405273438, "global_step": 351099, "epoch": 4230} {"train_loss": -26.009098052978516, "global_step": 351100, "epoch": 4230} {"train_loss": -26.17203712463379, "global_step": 351101, "epoch": 4230} {"train_loss": -26.29115867614746, "global_step": 351102, "epoch": 4230} {"train_loss": -25.90388298034668, "global_step": 351103, "epoch": 4230} {"train_loss": -26.00564956665039, "global_step": 351104, "epoch": 4230} {"train_loss": -25.94598960876465, "global_step": 351105, "epoch": 4230} {"train_loss": -25.718063354492188, "global_step": 351106, "epoch": 4230} {"train_loss": -25.892194747924805, "global_step": 351107, "epoch": 4230} {"train_loss": -25.7716121673584, "global_step": 351108, "epoch": 4230} {"train_loss": -25.922204971313477, "global_step": 351109, "epoch": 4230} {"train_loss": -26.14023208618164, "global_step": 351110, "epoch": 4230} {"train_loss": -26.17181968688965, "global_step": 351111, "epoch": 4230} {"train_loss": -26.243600845336914, "global_step": 351112, "epoch": 4230} {"train_loss": -26.19150733947754, "global_step": 351113, "epoch": 4230} {"train_loss": -25.97145652770996, "global_step": 351114, "epoch": 4230} {"train_loss": -26.26666831970215, "global_step": 351115, "epoch": 4230} {"train_loss": -26.058347702026367, "global_step": 351116, "epoch": 4230} {"train_loss": -26.438190460205078, "global_step": 351117, "epoch": 4230} {"train_loss": -25.732746124267578, "global_step": 351118, "epoch": 4230} {"train_loss": -26.039762496948242, "global_step": 351119, "epoch": 4230} {"train_loss": -25.9281063079834, "global_step": 351120, "epoch": 4230} {"train_loss": -26.224689483642578, "global_step": 351121, "epoch": 4230} {"train_loss": -25.175613403320312, "global_step": 351122, "epoch": 4230} {"train_loss": -26.24846839904785, "global_step": 351123, "epoch": 4230} {"train_loss": -26.33192253112793, "global_step": 351124, "epoch": 4230} {"train_loss": -26.3784122467041, "global_step": 351125, "epoch": 4230} {"train_loss": -26.072385787963867, "global_step": 351126, "epoch": 4230} {"train_loss": -26.162124633789062, "global_step": 351127, "epoch": 4230} {"train_loss": -26.019575119018555, "global_step": 351128, "epoch": 4230} {"train_loss": -26.092498779296875, "global_step": 351129, "epoch": 4230} {"train_loss": -25.7852783203125, "global_step": 351130, "epoch": 4230} {"train_loss": -26.215757369995117, "global_step": 351131, "epoch": 4230} {"train_loss": -26.179035186767578, "global_step": 351132, "epoch": 4230} {"train_loss": -25.90742301940918, "global_step": 351133, "epoch": 4230} {"train_loss": -26.34065055847168, "global_step": 351134, "epoch": 4230} {"train_loss": -25.905134201049805, "global_step": 351135, "epoch": 4230} {"train_loss": -26.266942977905273, "global_step": 351136, "epoch": 4230} {"train_loss": -26.30231285095215, "global_step": 351137, "epoch": 4230} {"train_loss": -25.93109130859375, "global_step": 351138, "epoch": 4230} {"train_loss": -26.10711669921875, "global_step": 351139, "epoch": 4230} {"train_loss": -26.631799697875977, "global_step": 351140, "epoch": 4230} {"train_loss": -26.44656753540039, "global_step": 351141, "epoch": 4230} {"train_loss": -26.1192626953125, "global_step": 351142, "epoch": 4230} {"train_loss": -25.95926856994629, "global_step": 351143, "epoch": 4230} {"train_loss": -26.26837158203125, "global_step": 351144, "epoch": 4230} {"train_loss": -25.895017623901367, "global_step": 351145, "epoch": 4230} {"train_loss": -26.455907821655273, "global_step": 351146, "epoch": 4230} {"train_loss": -26.28411293029785, "global_step": 351147, "epoch": 4230} {"train_loss": -26.182849884033203, "global_step": 351148, "epoch": 4230} {"train_loss": -25.906620025634766, "global_step": 351149, "epoch": 4230} {"train_loss": -26.74126625061035, "global_step": 351150, "epoch": 4230} {"train_loss": -26.10955238342285, "global_step": 351151, "epoch": 4230} {"train_loss": -26.362003326416016, "global_step": 351152, "epoch": 4230} {"train_loss": -26.190662384033203, "global_step": 351153, "epoch": 4230} {"train_loss": -26.099775314331055, "global_step": 351154, "epoch": 4230} {"train_loss": -26.49598503112793, "global_step": 351155, "epoch": 4230} {"train_loss": -26.482101440429688, "global_step": 351156, "epoch": 4230} {"train_loss": -26.048526763916016, "global_step": 351157, "epoch": 4230} {"train_loss": -26.280057907104492, "global_step": 351158, "epoch": 4230} {"train_loss": -26.24740982055664, "global_step": 351159, "epoch": 4230} {"train_loss": -26.503692626953125, "global_step": 351160, "epoch": 4230} {"train_loss": -25.99420738220215, "global_step": 351161, "epoch": 4230} {"train_loss": -26.058643341064453, "global_step": 351162, "epoch": 4230} {"train_loss": -25.865625381469727, "global_step": 351163, "epoch": 4230} {"train_loss": -26.453022003173828, "global_step": 351164, "epoch": 4230} {"train_loss": -26.116323471069336, "global_step": 351165, "epoch": 4230} {"train_loss": -26.575109481811523, "global_step": 351166, "epoch": 4230} {"train_loss": -26.003751754760742, "global_step": 351167, "epoch": 4230} {"train_loss": -26.165796279907227, "global_step": 351168, "epoch": 4230} {"train_loss": -26.30490493774414, "global_step": 351169, "epoch": 4230} {"train_loss": -26.21463966369629, "global_step": 351170, "epoch": 4230} {"train_loss": -26.344785690307617, "global_step": 351171, "epoch": 4230} {"train_loss": -26.130171833268133, "global_step": 351172, "epoch": 4230, "val_loss": 6672440.0} {"train_loss": -25.9320068359375, "global_step": 351173, "epoch": 4231} {"train_loss": -25.8878231048584, "global_step": 351174, "epoch": 4231} {"train_loss": -25.64969825744629, "global_step": 351175, "epoch": 4231} {"train_loss": -26.05134391784668, "global_step": 351176, "epoch": 4231} {"train_loss": -25.66912841796875, "global_step": 351177, "epoch": 4231} {"train_loss": -25.743209838867188, "global_step": 351178, "epoch": 4231} {"train_loss": -25.969120025634766, "global_step": 351179, "epoch": 4231} {"train_loss": -25.57421112060547, "global_step": 351180, "epoch": 4231} {"train_loss": -25.64618492126465, "global_step": 351181, "epoch": 4231} {"train_loss": -25.936054229736328, "global_step": 351182, "epoch": 4231} {"train_loss": -25.596088409423828, "global_step": 351183, "epoch": 4231} {"train_loss": -26.022846221923828, "global_step": 351184, "epoch": 4231} {"train_loss": -26.049774169921875, "global_step": 351185, "epoch": 4231} {"train_loss": -25.955841064453125, "global_step": 351186, "epoch": 4231} {"train_loss": -26.030744552612305, "global_step": 351187, "epoch": 4231} {"train_loss": -26.01356315612793, "global_step": 351188, "epoch": 4231} {"train_loss": -26.154294967651367, "global_step": 351189, "epoch": 4231} {"train_loss": -25.695505142211914, "global_step": 351190, "epoch": 4231} {"train_loss": -25.810327529907227, "global_step": 351191, "epoch": 4231} {"train_loss": -25.64332389831543, "global_step": 351192, "epoch": 4231} {"train_loss": -26.290149688720703, "global_step": 351193, "epoch": 4231} {"train_loss": -26.365070343017578, "global_step": 351194, "epoch": 4231} {"train_loss": -26.071481704711914, "global_step": 351195, "epoch": 4231} {"train_loss": -26.268878936767578, "global_step": 351196, "epoch": 4231} {"train_loss": -26.413040161132812, "global_step": 351197, "epoch": 4231} {"train_loss": -25.9648494720459, "global_step": 351198, "epoch": 4231} {"train_loss": -26.190479278564453, "global_step": 351199, "epoch": 4231} {"train_loss": -25.766143798828125, "global_step": 351200, "epoch": 4231} {"train_loss": -26.53415870666504, "global_step": 351201, "epoch": 4231} {"train_loss": -26.56062889099121, "global_step": 351202, "epoch": 4231} {"train_loss": -26.065927505493164, "global_step": 351203, "epoch": 4231} {"train_loss": -26.42055320739746, "global_step": 351204, "epoch": 4231} {"train_loss": -26.2919864654541, "global_step": 351205, "epoch": 4231} {"train_loss": -26.187931060791016, "global_step": 351206, "epoch": 4231} {"train_loss": -26.117963790893555, "global_step": 351207, "epoch": 4231} {"train_loss": -26.391260147094727, "global_step": 351208, "epoch": 4231} {"train_loss": -26.533185958862305, "global_step": 351209, "epoch": 4231} {"train_loss": -26.595233917236328, "global_step": 351210, "epoch": 4231} {"train_loss": -26.298017501831055, "global_step": 351211, "epoch": 4231} {"train_loss": -25.904760360717773, "global_step": 351212, "epoch": 4231} {"train_loss": -26.39141273498535, "global_step": 351213, "epoch": 4231} {"train_loss": -26.34210777282715, "global_step": 351214, "epoch": 4231} {"train_loss": -26.438337326049805, "global_step": 351215, "epoch": 4231} {"train_loss": -26.157489776611328, "global_step": 351216, "epoch": 4231} {"train_loss": -26.159841537475586, "global_step": 351217, "epoch": 4231} {"train_loss": -26.22031593322754, "global_step": 351218, "epoch": 4231} {"train_loss": -26.21347999572754, "global_step": 351219, "epoch": 4231} {"train_loss": -26.33979606628418, "global_step": 351220, "epoch": 4231} {"train_loss": -26.33880615234375, "global_step": 351221, "epoch": 4231} {"train_loss": -26.22757339477539, "global_step": 351222, "epoch": 4231} {"train_loss": -25.696197509765625, "global_step": 351223, "epoch": 4231} {"train_loss": -25.99880027770996, "global_step": 351224, "epoch": 4231} {"train_loss": -26.064319610595703, "global_step": 351225, "epoch": 4231} {"train_loss": -26.048505783081055, "global_step": 351226, "epoch": 4231} {"train_loss": -26.501001358032227, "global_step": 351227, "epoch": 4231} {"train_loss": -26.540435791015625, "global_step": 351228, "epoch": 4231} {"train_loss": -26.385944366455078, "global_step": 351229, "epoch": 4231} {"train_loss": -26.47515869140625, "global_step": 351230, "epoch": 4231} {"train_loss": -26.12873649597168, "global_step": 351231, "epoch": 4231} {"train_loss": -25.773008346557617, "global_step": 351232, "epoch": 4231} {"train_loss": -26.198944091796875, "global_step": 351233, "epoch": 4231} {"train_loss": -26.602313995361328, "global_step": 351234, "epoch": 4231} {"train_loss": -26.111591339111328, "global_step": 351235, "epoch": 4231} {"train_loss": -25.9548397064209, "global_step": 351236, "epoch": 4231} {"train_loss": -26.067209243774414, "global_step": 351237, "epoch": 4231} {"train_loss": -26.2823486328125, "global_step": 351238, "epoch": 4231} {"train_loss": -26.042877197265625, "global_step": 351239, "epoch": 4231} {"train_loss": -26.3122501373291, "global_step": 351240, "epoch": 4231} {"train_loss": -26.550342559814453, "global_step": 351241, "epoch": 4231} {"train_loss": -26.194181442260742, "global_step": 351242, "epoch": 4231} {"train_loss": -25.94952964782715, "global_step": 351243, "epoch": 4231} {"train_loss": -26.292150497436523, "global_step": 351244, "epoch": 4231} {"train_loss": -25.397598266601562, "global_step": 351245, "epoch": 4231} {"train_loss": -25.286184310913086, "global_step": 351246, "epoch": 4231} {"train_loss": -25.511898040771484, "global_step": 351247, "epoch": 4231} {"train_loss": -25.714618682861328, "global_step": 351248, "epoch": 4231} {"train_loss": -26.03680419921875, "global_step": 351249, "epoch": 4231} {"train_loss": -25.48805046081543, "global_step": 351250, "epoch": 4231} {"train_loss": -26.0329647064209, "global_step": 351251, "epoch": 4231} {"train_loss": -25.87574577331543, "global_step": 351252, "epoch": 4231} {"train_loss": -25.891498565673828, "global_step": 351253, "epoch": 4231} {"train_loss": -26.220706939697266, "global_step": 351254, "epoch": 4231} {"train_loss": -26.09705706676805, "global_step": 351255, "epoch": 4231, "val_loss": 6654884.0} {"train_loss": -25.041427612304688, "global_step": 351256, "epoch": 4232} {"train_loss": -25.375045776367188, "global_step": 351257, "epoch": 4232} {"train_loss": -25.580732345581055, "global_step": 351258, "epoch": 4232} {"train_loss": -25.719541549682617, "global_step": 351259, "epoch": 4232} {"train_loss": -25.522207260131836, "global_step": 351260, "epoch": 4232} {"train_loss": -25.723535537719727, "global_step": 351261, "epoch": 4232} {"train_loss": -25.689193725585938, "global_step": 351262, "epoch": 4232} {"train_loss": -25.910451889038086, "global_step": 351263, "epoch": 4232} {"train_loss": -25.63604736328125, "global_step": 351264, "epoch": 4232} {"train_loss": -25.602338790893555, "global_step": 351265, "epoch": 4232} {"train_loss": -26.141738891601562, "global_step": 351266, "epoch": 4232} {"train_loss": -25.659717559814453, "global_step": 351267, "epoch": 4232} {"train_loss": -26.04514503479004, "global_step": 351268, "epoch": 4232} {"train_loss": -26.23048210144043, "global_step": 351269, "epoch": 4232} {"train_loss": -26.475234985351562, "global_step": 351270, "epoch": 4232} {"train_loss": -26.03944969177246, "global_step": 351271, "epoch": 4232} {"train_loss": -26.08831214904785, "global_step": 351272, "epoch": 4232} {"train_loss": -26.273406982421875, "global_step": 351273, "epoch": 4232} {"train_loss": -26.32802391052246, "global_step": 351274, "epoch": 4232} {"train_loss": -26.3292236328125, "global_step": 351275, "epoch": 4232} {"train_loss": -25.89845085144043, "global_step": 351276, "epoch": 4232} {"train_loss": -25.927234649658203, "global_step": 351277, "epoch": 4232} {"train_loss": -26.025365829467773, "global_step": 351278, "epoch": 4232} {"train_loss": -26.12293815612793, "global_step": 351279, "epoch": 4232} {"train_loss": -26.23046875, "global_step": 351280, "epoch": 4232} {"train_loss": -25.976703643798828, "global_step": 351281, "epoch": 4232} {"train_loss": -26.088836669921875, "global_step": 351282, "epoch": 4232} {"train_loss": -26.176116943359375, "global_step": 351283, "epoch": 4232} {"train_loss": -26.219324111938477, "global_step": 351284, "epoch": 4232} {"train_loss": -26.193790435791016, "global_step": 351285, "epoch": 4232} {"train_loss": -26.476490020751953, "global_step": 351286, "epoch": 4232} {"train_loss": -26.2716007232666, "global_step": 351287, "epoch": 4232} {"train_loss": -26.24749755859375, "global_step": 351288, "epoch": 4232} {"train_loss": -26.119970321655273, "global_step": 351289, "epoch": 4232} {"train_loss": -26.06770133972168, "global_step": 351290, "epoch": 4232} {"train_loss": -26.264005661010742, "global_step": 351291, "epoch": 4232} {"train_loss": -26.293994903564453, "global_step": 351292, "epoch": 4232} {"train_loss": -26.23188591003418, "global_step": 351293, "epoch": 4232} {"train_loss": -26.495197296142578, "global_step": 351294, "epoch": 4232} {"train_loss": -26.214941024780273, "global_step": 351295, "epoch": 4232} {"train_loss": -26.118244171142578, "global_step": 351296, "epoch": 4232} {"train_loss": -26.4057674407959, "global_step": 351297, "epoch": 4232} {"train_loss": -26.380537033081055, "global_step": 351298, "epoch": 4232} {"train_loss": -25.980443954467773, "global_step": 351299, "epoch": 4232} {"train_loss": -26.498321533203125, "global_step": 351300, "epoch": 4232} {"train_loss": -26.4007625579834, "global_step": 351301, "epoch": 4232} {"train_loss": -26.175344467163086, "global_step": 351302, "epoch": 4232} {"train_loss": -26.565969467163086, "global_step": 351303, "epoch": 4232} {"train_loss": -26.636938095092773, "global_step": 351304, "epoch": 4232} {"train_loss": -26.3048038482666, "global_step": 351305, "epoch": 4232} {"train_loss": -26.325117111206055, "global_step": 351306, "epoch": 4232} {"train_loss": -26.68178367614746, "global_step": 351307, "epoch": 4232} {"train_loss": -26.222875595092773, "global_step": 351308, "epoch": 4232} {"train_loss": -26.71075439453125, "global_step": 351309, "epoch": 4232} {"train_loss": -26.17363929748535, "global_step": 351310, "epoch": 4232} {"train_loss": -26.11359214782715, "global_step": 351311, "epoch": 4232} {"train_loss": -26.251562118530273, "global_step": 351312, "epoch": 4232} {"train_loss": -26.77095603942871, "global_step": 351313, "epoch": 4232} {"train_loss": -26.456985473632812, "global_step": 351314, "epoch": 4232} {"train_loss": -26.25225257873535, "global_step": 351315, "epoch": 4232} {"train_loss": -25.66864585876465, "global_step": 351316, "epoch": 4232} {"train_loss": -25.465070724487305, "global_step": 351317, "epoch": 4232} {"train_loss": -25.589101791381836, "global_step": 351318, "epoch": 4232} {"train_loss": -25.97150230407715, "global_step": 351319, "epoch": 4232} {"train_loss": -25.383512496948242, "global_step": 351320, "epoch": 4232} {"train_loss": -25.732925415039062, "global_step": 351321, "epoch": 4232} {"train_loss": -26.378385543823242, "global_step": 351322, "epoch": 4232} {"train_loss": -25.713577270507812, "global_step": 351323, "epoch": 4232} {"train_loss": -26.317184448242188, "global_step": 351324, "epoch": 4232} {"train_loss": -26.098981857299805, "global_step": 351325, "epoch": 4232} {"train_loss": -25.76963233947754, "global_step": 351326, "epoch": 4232} {"train_loss": -26.472599029541016, "global_step": 351327, "epoch": 4232} {"train_loss": -25.91004753112793, "global_step": 351328, "epoch": 4232} {"train_loss": -26.379980087280273, "global_step": 351329, "epoch": 4232} {"train_loss": -26.206029891967773, "global_step": 351330, "epoch": 4232} {"train_loss": -26.18946647644043, "global_step": 351331, "epoch": 4232} {"train_loss": -26.160083770751953, "global_step": 351332, "epoch": 4232} {"train_loss": -25.914478302001953, "global_step": 351333, "epoch": 4232} {"train_loss": -26.17594337463379, "global_step": 351334, "epoch": 4232} {"train_loss": -26.062910079956055, "global_step": 351335, "epoch": 4232} {"train_loss": -26.117177963256836, "global_step": 351336, "epoch": 4232} {"train_loss": -26.320402145385742, "global_step": 351337, "epoch": 4232} {"train_loss": -26.10946744895843, "global_step": 351338, "epoch": 4232, "val_loss": 6684835.0} {"train_loss": -24.30037498474121, "global_step": 351339, "epoch": 4233} {"train_loss": -24.979698181152344, "global_step": 351340, "epoch": 4233} {"train_loss": -25.738794326782227, "global_step": 351341, "epoch": 4233} {"train_loss": -25.710712432861328, "global_step": 351342, "epoch": 4233} {"train_loss": -25.71991539001465, "global_step": 351343, "epoch": 4233} {"train_loss": -25.329015731811523, "global_step": 351344, "epoch": 4233} {"train_loss": -25.290605545043945, "global_step": 351345, "epoch": 4233} {"train_loss": -25.481863021850586, "global_step": 351346, "epoch": 4233} {"train_loss": -25.505353927612305, "global_step": 351347, "epoch": 4233} {"train_loss": -25.9366512298584, "global_step": 351348, "epoch": 4233} {"train_loss": -25.665985107421875, "global_step": 351349, "epoch": 4233} {"train_loss": -25.796552658081055, "global_step": 351350, "epoch": 4233} {"train_loss": -25.696456909179688, "global_step": 351351, "epoch": 4233} {"train_loss": -25.878950119018555, "global_step": 351352, "epoch": 4233} {"train_loss": -25.5714111328125, "global_step": 351353, "epoch": 4233} {"train_loss": -26.194019317626953, "global_step": 351354, "epoch": 4233} {"train_loss": -25.375032424926758, "global_step": 351355, "epoch": 4233} {"train_loss": -25.954248428344727, "global_step": 351356, "epoch": 4233} {"train_loss": -26.128461837768555, "global_step": 351357, "epoch": 4233} {"train_loss": -26.10105323791504, "global_step": 351358, "epoch": 4233} {"train_loss": -25.835128784179688, "global_step": 351359, "epoch": 4233} {"train_loss": -26.25592041015625, "global_step": 351360, "epoch": 4233} {"train_loss": -26.378406524658203, "global_step": 351361, "epoch": 4233} {"train_loss": -26.229467391967773, "global_step": 351362, "epoch": 4233} {"train_loss": -26.149457931518555, "global_step": 351363, "epoch": 4233} {"train_loss": -26.103900909423828, "global_step": 351364, "epoch": 4233} {"train_loss": -26.092065811157227, "global_step": 351365, "epoch": 4233} {"train_loss": -26.140722274780273, "global_step": 351366, "epoch": 4233} {"train_loss": -26.087493896484375, "global_step": 351367, "epoch": 4233} {"train_loss": -25.83509635925293, "global_step": 351368, "epoch": 4233} {"train_loss": -25.920194625854492, "global_step": 351369, "epoch": 4233} {"train_loss": -26.265409469604492, "global_step": 351370, "epoch": 4233} {"train_loss": -26.177160263061523, "global_step": 351371, "epoch": 4233} {"train_loss": -25.98927879333496, "global_step": 351372, "epoch": 4233} {"train_loss": -25.822040557861328, "global_step": 351373, "epoch": 4233} {"train_loss": -25.9467830657959, "global_step": 351374, "epoch": 4233} {"train_loss": -26.51422119140625, "global_step": 351375, "epoch": 4233} {"train_loss": -26.052099227905273, "global_step": 351376, "epoch": 4233} {"train_loss": -26.490087509155273, "global_step": 351377, "epoch": 4233} {"train_loss": -26.038419723510742, "global_step": 351378, "epoch": 4233} {"train_loss": -26.350238800048828, "global_step": 351379, "epoch": 4233} {"train_loss": -26.14185905456543, "global_step": 351380, "epoch": 4233} {"train_loss": -25.95517349243164, "global_step": 351381, "epoch": 4233} {"train_loss": -26.126937866210938, "global_step": 351382, "epoch": 4233} {"train_loss": -26.090158462524414, "global_step": 351383, "epoch": 4233} {"train_loss": -26.6767635345459, "global_step": 351384, "epoch": 4233} {"train_loss": -26.30291748046875, "global_step": 351385, "epoch": 4233} {"train_loss": -25.858551025390625, "global_step": 351386, "epoch": 4233} {"train_loss": -26.1719913482666, "global_step": 351387, "epoch": 4233} {"train_loss": -26.137842178344727, "global_step": 351388, "epoch": 4233} {"train_loss": -26.218799591064453, "global_step": 351389, "epoch": 4233} {"train_loss": -26.003238677978516, "global_step": 351390, "epoch": 4233} {"train_loss": -26.2664737701416, "global_step": 351391, "epoch": 4233} {"train_loss": -26.02750587463379, "global_step": 351392, "epoch": 4233} {"train_loss": -26.215213775634766, "global_step": 351393, "epoch": 4233} {"train_loss": -26.330738067626953, "global_step": 351394, "epoch": 4233} {"train_loss": -26.100996017456055, "global_step": 351395, "epoch": 4233} {"train_loss": -26.229894638061523, "global_step": 351396, "epoch": 4233} {"train_loss": -26.11328125, "global_step": 351397, "epoch": 4233} {"train_loss": -26.375242233276367, "global_step": 351398, "epoch": 4233} {"train_loss": -25.892974853515625, "global_step": 351399, "epoch": 4233} {"train_loss": -26.16819190979004, "global_step": 351400, "epoch": 4233} {"train_loss": -26.319244384765625, "global_step": 351401, "epoch": 4233} {"train_loss": -26.279937744140625, "global_step": 351402, "epoch": 4233} {"train_loss": -26.005224227905273, "global_step": 351403, "epoch": 4233} {"train_loss": -26.45237159729004, "global_step": 351404, "epoch": 4233} {"train_loss": -26.49018669128418, "global_step": 351405, "epoch": 4233} {"train_loss": -26.330053329467773, "global_step": 351406, "epoch": 4233} {"train_loss": -26.0421085357666, "global_step": 351407, "epoch": 4233} {"train_loss": -26.391279220581055, "global_step": 351408, "epoch": 4233} {"train_loss": -26.268579483032227, "global_step": 351409, "epoch": 4233} {"train_loss": -26.183629989624023, "global_step": 351410, "epoch": 4233} {"train_loss": -26.020309448242188, "global_step": 351411, "epoch": 4233} {"train_loss": -26.264545440673828, "global_step": 351412, "epoch": 4233} {"train_loss": -26.818592071533203, "global_step": 351413, "epoch": 4233} {"train_loss": -25.978839874267578, "global_step": 351414, "epoch": 4233} {"train_loss": -26.11716079711914, "global_step": 351415, "epoch": 4233} {"train_loss": -25.54590606689453, "global_step": 351416, "epoch": 4233} {"train_loss": -26.627063751220703, "global_step": 351417, "epoch": 4233} {"train_loss": -26.2132511138916, "global_step": 351418, "epoch": 4233} {"train_loss": -26.0626163482666, "global_step": 351419, "epoch": 4233} {"train_loss": -25.7119140625, "global_step": 351420, "epoch": 4233} {"train_loss": -26.04276454879577, "global_step": 351421, "epoch": 4233, "val_loss": 6723411.0} {"train_loss": -23.754098892211914, "global_step": 351422, "epoch": 4234} {"train_loss": -24.615781784057617, "global_step": 351423, "epoch": 4234} {"train_loss": -25.345977783203125, "global_step": 351424, "epoch": 4234} {"train_loss": -24.8621768951416, "global_step": 351425, "epoch": 4234} {"train_loss": -25.08589744567871, "global_step": 351426, "epoch": 4234} {"train_loss": -24.484153747558594, "global_step": 351427, "epoch": 4234} {"train_loss": -25.10788345336914, "global_step": 351428, "epoch": 4234} {"train_loss": -24.93096351623535, "global_step": 351429, "epoch": 4234} {"train_loss": -25.14264488220215, "global_step": 351430, "epoch": 4234} {"train_loss": -25.414169311523438, "global_step": 351431, "epoch": 4234} {"train_loss": -25.21405601501465, "global_step": 351432, "epoch": 4234} {"train_loss": -25.356754302978516, "global_step": 351433, "epoch": 4234} {"train_loss": -25.323749542236328, "global_step": 351434, "epoch": 4234} {"train_loss": -25.225025177001953, "global_step": 351435, "epoch": 4234} {"train_loss": -25.54976463317871, "global_step": 351436, "epoch": 4234} {"train_loss": -25.4995174407959, "global_step": 351437, "epoch": 4234} {"train_loss": -25.57614517211914, "global_step": 351438, "epoch": 4234} {"train_loss": -25.698596954345703, "global_step": 351439, "epoch": 4234} {"train_loss": -25.687591552734375, "global_step": 351440, "epoch": 4234} {"train_loss": -25.53046989440918, "global_step": 351441, "epoch": 4234} {"train_loss": -26.06873893737793, "global_step": 351442, "epoch": 4234} {"train_loss": -26.032394409179688, "global_step": 351443, "epoch": 4234} {"train_loss": -25.576278686523438, "global_step": 351444, "epoch": 4234} {"train_loss": -25.7103271484375, "global_step": 351445, "epoch": 4234} {"train_loss": -26.07465171813965, "global_step": 351446, "epoch": 4234} {"train_loss": -26.018033981323242, "global_step": 351447, "epoch": 4234} {"train_loss": -25.8094482421875, "global_step": 351448, "epoch": 4234} {"train_loss": -25.84921646118164, "global_step": 351449, "epoch": 4234} {"train_loss": -26.148176193237305, "global_step": 351450, "epoch": 4234} {"train_loss": -25.863752365112305, "global_step": 351451, "epoch": 4234} {"train_loss": -26.066421508789062, "global_step": 351452, "epoch": 4234} {"train_loss": -26.01373863220215, "global_step": 351453, "epoch": 4234} {"train_loss": -26.270200729370117, "global_step": 351454, "epoch": 4234} {"train_loss": -25.857975006103516, "global_step": 351455, "epoch": 4234} {"train_loss": -26.15292739868164, "global_step": 351456, "epoch": 4234} {"train_loss": -26.066516876220703, "global_step": 351457, "epoch": 4234} {"train_loss": -25.9486026763916, "global_step": 351458, "epoch": 4234} {"train_loss": -26.01333999633789, "global_step": 351459, "epoch": 4234} {"train_loss": -25.856231689453125, "global_step": 351460, "epoch": 4234} {"train_loss": -26.184778213500977, "global_step": 351461, "epoch": 4234} {"train_loss": -26.042774200439453, "global_step": 351462, "epoch": 4234} {"train_loss": -25.90872573852539, "global_step": 351463, "epoch": 4234} {"train_loss": -26.276391983032227, "global_step": 351464, "epoch": 4234} {"train_loss": -26.0327091217041, "global_step": 351465, "epoch": 4234} {"train_loss": -26.1647891998291, "global_step": 351466, "epoch": 4234} {"train_loss": -26.69415283203125, "global_step": 351467, "epoch": 4234} {"train_loss": -26.233173370361328, "global_step": 351468, "epoch": 4234} {"train_loss": -25.9614315032959, "global_step": 351469, "epoch": 4234} {"train_loss": -26.086938858032227, "global_step": 351470, "epoch": 4234} {"train_loss": -26.35031509399414, "global_step": 351471, "epoch": 4234} {"train_loss": -26.116077423095703, "global_step": 351472, "epoch": 4234} {"train_loss": -25.994129180908203, "global_step": 351473, "epoch": 4234} {"train_loss": -26.1208553314209, "global_step": 351474, "epoch": 4234} {"train_loss": -26.185504913330078, "global_step": 351475, "epoch": 4234} {"train_loss": -26.213459014892578, "global_step": 351476, "epoch": 4234} {"train_loss": -26.044849395751953, "global_step": 351477, "epoch": 4234} {"train_loss": -26.26767349243164, "global_step": 351478, "epoch": 4234} {"train_loss": -25.934186935424805, "global_step": 351479, "epoch": 4234} {"train_loss": -26.094099044799805, "global_step": 351480, "epoch": 4234} {"train_loss": -26.15860939025879, "global_step": 351481, "epoch": 4234} {"train_loss": -26.03285789489746, "global_step": 351482, "epoch": 4234} {"train_loss": -25.59660530090332, "global_step": 351483, "epoch": 4234} {"train_loss": -26.380468368530273, "global_step": 351484, "epoch": 4234} {"train_loss": -26.30625343322754, "global_step": 351485, "epoch": 4234} {"train_loss": -25.832971572875977, "global_step": 351486, "epoch": 4234} {"train_loss": -26.1623592376709, "global_step": 351487, "epoch": 4234} {"train_loss": -25.777658462524414, "global_step": 351488, "epoch": 4234} {"train_loss": -25.744354248046875, "global_step": 351489, "epoch": 4234} {"train_loss": -25.829435348510742, "global_step": 351490, "epoch": 4234} {"train_loss": -26.2023868560791, "global_step": 351491, "epoch": 4234} {"train_loss": -26.236997604370117, "global_step": 351492, "epoch": 4234} {"train_loss": -25.914386749267578, "global_step": 351493, "epoch": 4234} {"train_loss": -26.11423110961914, "global_step": 351494, "epoch": 4234} {"train_loss": -25.9580078125, "global_step": 351495, "epoch": 4234} {"train_loss": -26.51287269592285, "global_step": 351496, "epoch": 4234} {"train_loss": -26.0993595123291, "global_step": 351497, "epoch": 4234} {"train_loss": -26.24958610534668, "global_step": 351498, "epoch": 4234} {"train_loss": -26.076446533203125, "global_step": 351499, "epoch": 4234} {"train_loss": -26.022537231445312, "global_step": 351500, "epoch": 4234} {"train_loss": -25.968976974487305, "global_step": 351501, "epoch": 4234} {"train_loss": -26.021087646484375, "global_step": 351502, "epoch": 4234} {"train_loss": -25.788482666015625, "global_step": 351503, "epoch": 4234} {"train_loss": -25.83838451339538, "global_step": 351504, "epoch": 4234, "val_loss": 6717919.0} {"train_loss": -25.55927085876465, "global_step": 351505, "epoch": 4235} {"train_loss": -25.401958465576172, "global_step": 351506, "epoch": 4235} {"train_loss": -25.285938262939453, "global_step": 351507, "epoch": 4235} {"train_loss": -25.66306495666504, "global_step": 351508, "epoch": 4235} {"train_loss": -25.257038116455078, "global_step": 351509, "epoch": 4235} {"train_loss": -26.00029945373535, "global_step": 351510, "epoch": 4235} {"train_loss": -25.895654678344727, "global_step": 351511, "epoch": 4235} {"train_loss": -25.831022262573242, "global_step": 351512, "epoch": 4235} {"train_loss": -25.62489891052246, "global_step": 351513, "epoch": 4235} {"train_loss": -25.751617431640625, "global_step": 351514, "epoch": 4235} {"train_loss": -25.736103057861328, "global_step": 351515, "epoch": 4235} {"train_loss": -25.672027587890625, "global_step": 351516, "epoch": 4235} {"train_loss": -26.188552856445312, "global_step": 351517, "epoch": 4235} {"train_loss": -25.751691818237305, "global_step": 351518, "epoch": 4235} {"train_loss": -25.902667999267578, "global_step": 351519, "epoch": 4235} {"train_loss": -25.76710319519043, "global_step": 351520, "epoch": 4235} {"train_loss": -25.949201583862305, "global_step": 351521, "epoch": 4235} {"train_loss": -26.06512451171875, "global_step": 351522, "epoch": 4235} {"train_loss": -25.74203872680664, "global_step": 351523, "epoch": 4235} {"train_loss": -25.88067626953125, "global_step": 351524, "epoch": 4235} {"train_loss": -26.345808029174805, "global_step": 351525, "epoch": 4235} {"train_loss": -25.90288734436035, "global_step": 351526, "epoch": 4235} {"train_loss": -26.249486923217773, "global_step": 351527, "epoch": 4235} {"train_loss": -25.807188034057617, "global_step": 351528, "epoch": 4235} {"train_loss": -25.782934188842773, "global_step": 351529, "epoch": 4235} {"train_loss": -26.348834991455078, "global_step": 351530, "epoch": 4235} {"train_loss": -26.614139556884766, "global_step": 351531, "epoch": 4235} {"train_loss": -26.00471305847168, "global_step": 351532, "epoch": 4235} {"train_loss": -26.14054298400879, "global_step": 351533, "epoch": 4235} {"train_loss": -26.356428146362305, "global_step": 351534, "epoch": 4235} {"train_loss": -26.401702880859375, "global_step": 351535, "epoch": 4235} {"train_loss": -26.235076904296875, "global_step": 351536, "epoch": 4235} {"train_loss": -26.16501808166504, "global_step": 351537, "epoch": 4235} {"train_loss": -26.36179542541504, "global_step": 351538, "epoch": 4235} {"train_loss": -26.21550941467285, "global_step": 351539, "epoch": 4235} {"train_loss": -26.08112907409668, "global_step": 351540, "epoch": 4235} {"train_loss": -26.5135498046875, "global_step": 351541, "epoch": 4235} {"train_loss": -26.29949951171875, "global_step": 351542, "epoch": 4235} {"train_loss": -26.152204513549805, "global_step": 351543, "epoch": 4235} {"train_loss": -26.367528915405273, "global_step": 351544, "epoch": 4235} {"train_loss": -26.297901153564453, "global_step": 351545, "epoch": 4235} {"train_loss": -26.082605361938477, "global_step": 351546, "epoch": 4235} {"train_loss": -26.369449615478516, "global_step": 351547, "epoch": 4235} {"train_loss": -26.692834854125977, "global_step": 351548, "epoch": 4235} {"train_loss": -26.15692138671875, "global_step": 351549, "epoch": 4235} {"train_loss": -26.42146873474121, "global_step": 351550, "epoch": 4235} {"train_loss": -25.834943771362305, "global_step": 351551, "epoch": 4235} {"train_loss": -26.34636878967285, "global_step": 351552, "epoch": 4235} {"train_loss": -26.46816062927246, "global_step": 351553, "epoch": 4235} {"train_loss": -26.49531364440918, "global_step": 351554, "epoch": 4235} {"train_loss": -26.041296005249023, "global_step": 351555, "epoch": 4235} {"train_loss": -26.518890380859375, "global_step": 351556, "epoch": 4235} {"train_loss": -25.854642868041992, "global_step": 351557, "epoch": 4235} {"train_loss": -26.26917839050293, "global_step": 351558, "epoch": 4235} {"train_loss": -26.42707633972168, "global_step": 351559, "epoch": 4235} {"train_loss": -26.399250030517578, "global_step": 351560, "epoch": 4235} {"train_loss": -26.2961483001709, "global_step": 351561, "epoch": 4235} {"train_loss": -26.400785446166992, "global_step": 351562, "epoch": 4235} {"train_loss": -26.16571617126465, "global_step": 351563, "epoch": 4235} {"train_loss": -26.260404586791992, "global_step": 351564, "epoch": 4235} {"train_loss": -26.157323837280273, "global_step": 351565, "epoch": 4235} {"train_loss": -26.20001220703125, "global_step": 351566, "epoch": 4235} {"train_loss": -25.917285919189453, "global_step": 351567, "epoch": 4235} {"train_loss": -25.532928466796875, "global_step": 351568, "epoch": 4235} {"train_loss": -24.723913192749023, "global_step": 351569, "epoch": 4235} {"train_loss": -25.489595413208008, "global_step": 351570, "epoch": 4235} {"train_loss": -25.96161460876465, "global_step": 351571, "epoch": 4235} {"train_loss": -25.951929092407227, "global_step": 351572, "epoch": 4235} {"train_loss": -25.390104293823242, "global_step": 351573, "epoch": 4235} {"train_loss": -25.93910789489746, "global_step": 351574, "epoch": 4235} {"train_loss": -25.95301628112793, "global_step": 351575, "epoch": 4235} {"train_loss": -25.587125778198242, "global_step": 351576, "epoch": 4235} {"train_loss": -26.087158203125, "global_step": 351577, "epoch": 4235} {"train_loss": -25.76987648010254, "global_step": 351578, "epoch": 4235} {"train_loss": -25.88763427734375, "global_step": 351579, "epoch": 4235} {"train_loss": -25.902734756469727, "global_step": 351580, "epoch": 4235} {"train_loss": -25.796527862548828, "global_step": 351581, "epoch": 4235} {"train_loss": -26.003950119018555, "global_step": 351582, "epoch": 4235} {"train_loss": -26.17331886291504, "global_step": 351583, "epoch": 4235} {"train_loss": -26.011301040649414, "global_step": 351584, "epoch": 4235} {"train_loss": -25.900617599487305, "global_step": 351585, "epoch": 4235} {"train_loss": -26.087121963500977, "global_step": 351586, "epoch": 4235} {"train_loss": -26.017447758869952, "global_step": 351587, "epoch": 4235, "val_loss": 6689586.0} {"train_loss": -25.713367462158203, "global_step": 351588, "epoch": 4236} {"train_loss": -26.05958366394043, "global_step": 351589, "epoch": 4236} {"train_loss": -25.8840274810791, "global_step": 351590, "epoch": 4236} {"train_loss": -25.98974609375, "global_step": 351591, "epoch": 4236} {"train_loss": -26.191177368164062, "global_step": 351592, "epoch": 4236} {"train_loss": -25.979623794555664, "global_step": 351593, "epoch": 4236} {"train_loss": -26.248559951782227, "global_step": 351594, "epoch": 4236} {"train_loss": -25.89923095703125, "global_step": 351595, "epoch": 4236} {"train_loss": -25.802967071533203, "global_step": 351596, "epoch": 4236} {"train_loss": -26.11688232421875, "global_step": 351597, "epoch": 4236} {"train_loss": -26.03264808654785, "global_step": 351598, "epoch": 4236} {"train_loss": -26.150409698486328, "global_step": 351599, "epoch": 4236} {"train_loss": -25.95130729675293, "global_step": 351600, "epoch": 4236} {"train_loss": -26.236841201782227, "global_step": 351601, "epoch": 4236} {"train_loss": -26.469629287719727, "global_step": 351602, "epoch": 4236} {"train_loss": -26.014785766601562, "global_step": 351603, "epoch": 4236} {"train_loss": -26.373809814453125, "global_step": 351604, "epoch": 4236} {"train_loss": -26.56954002380371, "global_step": 351605, "epoch": 4236} {"train_loss": -26.002002716064453, "global_step": 351606, "epoch": 4236} {"train_loss": -26.177204132080078, "global_step": 351607, "epoch": 4236} {"train_loss": -25.860809326171875, "global_step": 351608, "epoch": 4236} {"train_loss": -25.92732048034668, "global_step": 351609, "epoch": 4236} {"train_loss": -26.007535934448242, "global_step": 351610, "epoch": 4236} {"train_loss": -26.235492706298828, "global_step": 351611, "epoch": 4236} {"train_loss": -26.13702392578125, "global_step": 351612, "epoch": 4236} {"train_loss": -26.022750854492188, "global_step": 351613, "epoch": 4236} {"train_loss": -26.381454467773438, "global_step": 351614, "epoch": 4236} {"train_loss": -25.907079696655273, "global_step": 351615, "epoch": 4236} {"train_loss": -26.11005973815918, "global_step": 351616, "epoch": 4236} {"train_loss": -26.26651382446289, "global_step": 351617, "epoch": 4236} {"train_loss": -26.24403953552246, "global_step": 351618, "epoch": 4236} {"train_loss": -26.59126091003418, "global_step": 351619, "epoch": 4236} {"train_loss": -26.293149948120117, "global_step": 351620, "epoch": 4236} {"train_loss": -26.065832138061523, "global_step": 351621, "epoch": 4236} {"train_loss": -26.256702423095703, "global_step": 351622, "epoch": 4236} {"train_loss": -26.365955352783203, "global_step": 351623, "epoch": 4236} {"train_loss": -26.193740844726562, "global_step": 351624, "epoch": 4236} {"train_loss": -26.49500846862793, "global_step": 351625, "epoch": 4236} {"train_loss": -26.22395896911621, "global_step": 351626, "epoch": 4236} {"train_loss": -26.240936279296875, "global_step": 351627, "epoch": 4236} {"train_loss": -26.049833297729492, "global_step": 351628, "epoch": 4236} {"train_loss": -26.2777156829834, "global_step": 351629, "epoch": 4236} {"train_loss": -26.175840377807617, "global_step": 351630, "epoch": 4236} {"train_loss": -26.490161895751953, "global_step": 351631, "epoch": 4236} {"train_loss": -25.8751277923584, "global_step": 351632, "epoch": 4236} {"train_loss": -26.343097686767578, "global_step": 351633, "epoch": 4236} {"train_loss": -26.2099552154541, "global_step": 351634, "epoch": 4236} {"train_loss": -26.511770248413086, "global_step": 351635, "epoch": 4236} {"train_loss": -26.26263427734375, "global_step": 351636, "epoch": 4236} {"train_loss": -26.24616050720215, "global_step": 351637, "epoch": 4236} {"train_loss": -26.16583251953125, "global_step": 351638, "epoch": 4236} {"train_loss": -26.3007755279541, "global_step": 351639, "epoch": 4236} {"train_loss": -26.16575050354004, "global_step": 351640, "epoch": 4236} {"train_loss": -26.094945907592773, "global_step": 351641, "epoch": 4236} {"train_loss": -26.181720733642578, "global_step": 351642, "epoch": 4236} {"train_loss": -26.323577880859375, "global_step": 351643, "epoch": 4236} {"train_loss": -25.878095626831055, "global_step": 351644, "epoch": 4236} {"train_loss": -26.058828353881836, "global_step": 351645, "epoch": 4236} {"train_loss": -26.20279884338379, "global_step": 351646, "epoch": 4236} {"train_loss": -25.88484001159668, "global_step": 351647, "epoch": 4236} {"train_loss": -26.469512939453125, "global_step": 351648, "epoch": 4236} {"train_loss": -26.35205078125, "global_step": 351649, "epoch": 4236} {"train_loss": -25.659963607788086, "global_step": 351650, "epoch": 4236} {"train_loss": -26.1613826751709, "global_step": 351651, "epoch": 4236} {"train_loss": -26.1173095703125, "global_step": 351652, "epoch": 4236} {"train_loss": -26.181325912475586, "global_step": 351653, "epoch": 4236} {"train_loss": -26.39008140563965, "global_step": 351654, "epoch": 4236} {"train_loss": -26.4456844329834, "global_step": 351655, "epoch": 4236} {"train_loss": -26.422760009765625, "global_step": 351656, "epoch": 4236} {"train_loss": -26.07598304748535, "global_step": 351657, "epoch": 4236} {"train_loss": -26.111936569213867, "global_step": 351658, "epoch": 4236} {"train_loss": -26.39509391784668, "global_step": 351659, "epoch": 4236} {"train_loss": -26.208520889282227, "global_step": 351660, "epoch": 4236} {"train_loss": -26.057373046875, "global_step": 351661, "epoch": 4236} {"train_loss": -26.3304386138916, "global_step": 351662, "epoch": 4236} {"train_loss": -25.8474063873291, "global_step": 351663, "epoch": 4236} {"train_loss": -26.366596221923828, "global_step": 351664, "epoch": 4236} {"train_loss": -26.62190055847168, "global_step": 351665, "epoch": 4236} {"train_loss": -26.39546775817871, "global_step": 351666, "epoch": 4236} {"train_loss": -26.05142593383789, "global_step": 351667, "epoch": 4236} {"train_loss": -26.73179054260254, "global_step": 351668, "epoch": 4236} {"train_loss": -26.2658634185791, "global_step": 351669, "epoch": 4236} {"train_loss": -26.183563875864788, "global_step": 351670, "epoch": 4236, "val_loss": 6665316.0} {"train_loss": -26.127002716064453, "global_step": 351671, "epoch": 4237} {"train_loss": -25.686914443969727, "global_step": 351672, "epoch": 4237} {"train_loss": -25.87874412536621, "global_step": 351673, "epoch": 4237} {"train_loss": -25.9637451171875, "global_step": 351674, "epoch": 4237} {"train_loss": -25.930654525756836, "global_step": 351675, "epoch": 4237} {"train_loss": -25.81525230407715, "global_step": 351676, "epoch": 4237} {"train_loss": -26.033063888549805, "global_step": 351677, "epoch": 4237} {"train_loss": -25.740264892578125, "global_step": 351678, "epoch": 4237} {"train_loss": -26.067462921142578, "global_step": 351679, "epoch": 4237} {"train_loss": -25.999067306518555, "global_step": 351680, "epoch": 4237} {"train_loss": -26.07305335998535, "global_step": 351681, "epoch": 4237} {"train_loss": -26.218114852905273, "global_step": 351682, "epoch": 4237} {"train_loss": -25.815061569213867, "global_step": 351683, "epoch": 4237} {"train_loss": -25.99322509765625, "global_step": 351684, "epoch": 4237} {"train_loss": -26.17926025390625, "global_step": 351685, "epoch": 4237} {"train_loss": -26.38429069519043, "global_step": 351686, "epoch": 4237} {"train_loss": -26.32721519470215, "global_step": 351687, "epoch": 4237} {"train_loss": -26.293771743774414, "global_step": 351688, "epoch": 4237} {"train_loss": -25.9969425201416, "global_step": 351689, "epoch": 4237} {"train_loss": -25.86052894592285, "global_step": 351690, "epoch": 4237} {"train_loss": -26.157148361206055, "global_step": 351691, "epoch": 4237} {"train_loss": -25.944934844970703, "global_step": 351692, "epoch": 4237} {"train_loss": -25.97574806213379, "global_step": 351693, "epoch": 4237} {"train_loss": -26.20245361328125, "global_step": 351694, "epoch": 4237} {"train_loss": -26.338048934936523, "global_step": 351695, "epoch": 4237} {"train_loss": -26.028705596923828, "global_step": 351696, "epoch": 4237} {"train_loss": -25.945478439331055, "global_step": 351697, "epoch": 4237} {"train_loss": -26.169281005859375, "global_step": 351698, "epoch": 4237} {"train_loss": -26.0438232421875, "global_step": 351699, "epoch": 4237} {"train_loss": -26.382726669311523, "global_step": 351700, "epoch": 4237} {"train_loss": -26.294126510620117, "global_step": 351701, "epoch": 4237} {"train_loss": -26.488500595092773, "global_step": 351702, "epoch": 4237} {"train_loss": -26.2900333404541, "global_step": 351703, "epoch": 4237} {"train_loss": -26.20166015625, "global_step": 351704, "epoch": 4237} {"train_loss": -26.198978424072266, "global_step": 351705, "epoch": 4237} {"train_loss": -26.265304565429688, "global_step": 351706, "epoch": 4237} {"train_loss": -26.399932861328125, "global_step": 351707, "epoch": 4237} {"train_loss": -26.298248291015625, "global_step": 351708, "epoch": 4237} {"train_loss": -26.353168487548828, "global_step": 351709, "epoch": 4237} {"train_loss": -26.288373947143555, "global_step": 351710, "epoch": 4237} {"train_loss": -25.837182998657227, "global_step": 351711, "epoch": 4237} {"train_loss": -26.453195571899414, "global_step": 351712, "epoch": 4237} {"train_loss": -26.014795303344727, "global_step": 351713, "epoch": 4237} {"train_loss": -26.731409072875977, "global_step": 351714, "epoch": 4237} {"train_loss": -26.46917724609375, "global_step": 351715, "epoch": 4237} {"train_loss": -26.033660888671875, "global_step": 351716, "epoch": 4237} {"train_loss": -26.3398494720459, "global_step": 351717, "epoch": 4237} {"train_loss": -25.983118057250977, "global_step": 351718, "epoch": 4237} {"train_loss": -25.77157974243164, "global_step": 351719, "epoch": 4237} {"train_loss": -26.18402099609375, "global_step": 351720, "epoch": 4237} {"train_loss": -26.282135009765625, "global_step": 351721, "epoch": 4237} {"train_loss": -26.107351303100586, "global_step": 351722, "epoch": 4237} {"train_loss": -26.3673095703125, "global_step": 351723, "epoch": 4237} {"train_loss": -26.02789306640625, "global_step": 351724, "epoch": 4237} {"train_loss": -26.265777587890625, "global_step": 351725, "epoch": 4237} {"train_loss": -26.009891510009766, "global_step": 351726, "epoch": 4237} {"train_loss": -26.03498649597168, "global_step": 351727, "epoch": 4237} {"train_loss": -25.87434959411621, "global_step": 351728, "epoch": 4237} {"train_loss": -26.125593185424805, "global_step": 351729, "epoch": 4237} {"train_loss": -26.0399227142334, "global_step": 351730, "epoch": 4237} {"train_loss": -25.818668365478516, "global_step": 351731, "epoch": 4237} {"train_loss": -25.674692153930664, "global_step": 351732, "epoch": 4237} {"train_loss": -26.403553009033203, "global_step": 351733, "epoch": 4237} {"train_loss": -26.238693237304688, "global_step": 351734, "epoch": 4237} {"train_loss": -26.169126510620117, "global_step": 351735, "epoch": 4237} {"train_loss": -26.299116134643555, "global_step": 351736, "epoch": 4237} {"train_loss": -26.092309951782227, "global_step": 351737, "epoch": 4237} {"train_loss": -25.923324584960938, "global_step": 351738, "epoch": 4237} {"train_loss": -25.483320236206055, "global_step": 351739, "epoch": 4237} {"train_loss": -25.988574981689453, "global_step": 351740, "epoch": 4237} {"train_loss": -26.00123405456543, "global_step": 351741, "epoch": 4237} {"train_loss": -26.1457462310791, "global_step": 351742, "epoch": 4237} {"train_loss": -26.15673828125, "global_step": 351743, "epoch": 4237} {"train_loss": -25.83551025390625, "global_step": 351744, "epoch": 4237} {"train_loss": -25.957605361938477, "global_step": 351745, "epoch": 4237} {"train_loss": -26.111631393432617, "global_step": 351746, "epoch": 4237} {"train_loss": -26.260791778564453, "global_step": 351747, "epoch": 4237} {"train_loss": -26.457233428955078, "global_step": 351748, "epoch": 4237} {"train_loss": -25.96160888671875, "global_step": 351749, "epoch": 4237} {"train_loss": -26.684478759765625, "global_step": 351750, "epoch": 4237} {"train_loss": -26.07464027404785, "global_step": 351751, "epoch": 4237} {"train_loss": -26.428552627563477, "global_step": 351752, "epoch": 4237} {"train_loss": -26.12955304800746, "global_step": 351753, "epoch": 4237, "val_loss": 6712608.0} {"train_loss": -25.482961654663086, "global_step": 351754, "epoch": 4238} {"train_loss": -25.365110397338867, "global_step": 351755, "epoch": 4238} {"train_loss": -25.658802032470703, "global_step": 351756, "epoch": 4238} {"train_loss": -25.36876106262207, "global_step": 351757, "epoch": 4238} {"train_loss": -25.493398666381836, "global_step": 351758, "epoch": 4238} {"train_loss": -25.684783935546875, "global_step": 351759, "epoch": 4238} {"train_loss": -25.679731369018555, "global_step": 351760, "epoch": 4238} {"train_loss": -25.858631134033203, "global_step": 351761, "epoch": 4238} {"train_loss": -25.818973541259766, "global_step": 351762, "epoch": 4238} {"train_loss": -26.095884323120117, "global_step": 351763, "epoch": 4238} {"train_loss": -25.944028854370117, "global_step": 351764, "epoch": 4238} {"train_loss": -25.658727645874023, "global_step": 351765, "epoch": 4238} {"train_loss": -26.226789474487305, "global_step": 351766, "epoch": 4238} {"train_loss": -25.93310546875, "global_step": 351767, "epoch": 4238} {"train_loss": -25.718725204467773, "global_step": 351768, "epoch": 4238} {"train_loss": -26.128707885742188, "global_step": 351769, "epoch": 4238} {"train_loss": -26.167142868041992, "global_step": 351770, "epoch": 4238} {"train_loss": -26.243215560913086, "global_step": 351771, "epoch": 4238} {"train_loss": -25.892292022705078, "global_step": 351772, "epoch": 4238} {"train_loss": -25.828149795532227, "global_step": 351773, "epoch": 4238} {"train_loss": -26.022802352905273, "global_step": 351774, "epoch": 4238} {"train_loss": -26.148786544799805, "global_step": 351775, "epoch": 4238} {"train_loss": -25.66059684753418, "global_step": 351776, "epoch": 4238} {"train_loss": -26.160261154174805, "global_step": 351777, "epoch": 4238} {"train_loss": -25.710525512695312, "global_step": 351778, "epoch": 4238} {"train_loss": -26.047637939453125, "global_step": 351779, "epoch": 4238} {"train_loss": -26.294269561767578, "global_step": 351780, "epoch": 4238} {"train_loss": -26.647748947143555, "global_step": 351781, "epoch": 4238} {"train_loss": -26.361042022705078, "global_step": 351782, "epoch": 4238} {"train_loss": -26.10627555847168, "global_step": 351783, "epoch": 4238} {"train_loss": -25.88417625427246, "global_step": 351784, "epoch": 4238} {"train_loss": -26.247777938842773, "global_step": 351785, "epoch": 4238} {"train_loss": -26.386737823486328, "global_step": 351786, "epoch": 4238} {"train_loss": -25.58636474609375, "global_step": 351787, "epoch": 4238} {"train_loss": -26.187841415405273, "global_step": 351788, "epoch": 4238} {"train_loss": -26.172046661376953, "global_step": 351789, "epoch": 4238} {"train_loss": -26.536300659179688, "global_step": 351790, "epoch": 4238} {"train_loss": -26.298877716064453, "global_step": 351791, "epoch": 4238} {"train_loss": -26.500720977783203, "global_step": 351792, "epoch": 4238} {"train_loss": -26.25412940979004, "global_step": 351793, "epoch": 4238} {"train_loss": -26.4072265625, "global_step": 351794, "epoch": 4238} {"train_loss": -26.21112632751465, "global_step": 351795, "epoch": 4238} {"train_loss": -26.26885986328125, "global_step": 351796, "epoch": 4238} {"train_loss": -26.347082138061523, "global_step": 351797, "epoch": 4238} {"train_loss": -25.851362228393555, "global_step": 351798, "epoch": 4238} {"train_loss": -26.234771728515625, "global_step": 351799, "epoch": 4238} {"train_loss": -26.470172882080078, "global_step": 351800, "epoch": 4238} {"train_loss": -26.058801651000977, "global_step": 351801, "epoch": 4238} {"train_loss": -26.11940574645996, "global_step": 351802, "epoch": 4238} {"train_loss": -26.59000015258789, "global_step": 351803, "epoch": 4238} {"train_loss": -26.366058349609375, "global_step": 351804, "epoch": 4238} {"train_loss": -26.202228546142578, "global_step": 351805, "epoch": 4238} {"train_loss": -26.109027862548828, "global_step": 351806, "epoch": 4238} {"train_loss": -25.578195571899414, "global_step": 351807, "epoch": 4238} {"train_loss": -25.804807662963867, "global_step": 351808, "epoch": 4238} {"train_loss": -25.80419921875, "global_step": 351809, "epoch": 4238} {"train_loss": -26.29572868347168, "global_step": 351810, "epoch": 4238} {"train_loss": -26.29903221130371, "global_step": 351811, "epoch": 4238} {"train_loss": -26.23492431640625, "global_step": 351812, "epoch": 4238} {"train_loss": -25.661813735961914, "global_step": 351813, "epoch": 4238} {"train_loss": -26.169836044311523, "global_step": 351814, "epoch": 4238} {"train_loss": -26.087482452392578, "global_step": 351815, "epoch": 4238} {"train_loss": -26.074018478393555, "global_step": 351816, "epoch": 4238} {"train_loss": -25.861597061157227, "global_step": 351817, "epoch": 4238} {"train_loss": -26.240381240844727, "global_step": 351818, "epoch": 4238} {"train_loss": -26.446338653564453, "global_step": 351819, "epoch": 4238} {"train_loss": -25.853384017944336, "global_step": 351820, "epoch": 4238} {"train_loss": -25.823911666870117, "global_step": 351821, "epoch": 4238} {"train_loss": -26.091663360595703, "global_step": 351822, "epoch": 4238} {"train_loss": -26.26289176940918, "global_step": 351823, "epoch": 4238} {"train_loss": -26.223764419555664, "global_step": 351824, "epoch": 4238} {"train_loss": -26.344512939453125, "global_step": 351825, "epoch": 4238} {"train_loss": -26.50116539001465, "global_step": 351826, "epoch": 4238} {"train_loss": -25.770360946655273, "global_step": 351827, "epoch": 4238} {"train_loss": -25.728559494018555, "global_step": 351828, "epoch": 4238} {"train_loss": -26.211999893188477, "global_step": 351829, "epoch": 4238} {"train_loss": -26.3942928314209, "global_step": 351830, "epoch": 4238} {"train_loss": -26.21198081970215, "global_step": 351831, "epoch": 4238} {"train_loss": -26.291486740112305, "global_step": 351832, "epoch": 4238} {"train_loss": -26.334381103515625, "global_step": 351833, "epoch": 4238} {"train_loss": -26.14137077331543, "global_step": 351834, "epoch": 4238} {"train_loss": -25.903791427612305, "global_step": 351835, "epoch": 4238} {"train_loss": -26.046678175409156, "global_step": 351836, "epoch": 4238, "val_loss": 6716162.5} {"train_loss": -25.80706787109375, "global_step": 351837, "epoch": 4239} {"train_loss": -25.85371971130371, "global_step": 351838, "epoch": 4239} {"train_loss": -25.925491333007812, "global_step": 351839, "epoch": 4239} {"train_loss": -25.797748565673828, "global_step": 351840, "epoch": 4239} {"train_loss": -26.1700496673584, "global_step": 351841, "epoch": 4239} {"train_loss": -26.092544555664062, "global_step": 351842, "epoch": 4239} {"train_loss": -25.304821014404297, "global_step": 351843, "epoch": 4239} {"train_loss": -26.090539932250977, "global_step": 351844, "epoch": 4239} {"train_loss": -26.229944229125977, "global_step": 351845, "epoch": 4239} {"train_loss": -25.699995040893555, "global_step": 351846, "epoch": 4239} {"train_loss": -25.88986587524414, "global_step": 351847, "epoch": 4239} {"train_loss": -26.0180721282959, "global_step": 351848, "epoch": 4239} {"train_loss": -26.26972770690918, "global_step": 351849, "epoch": 4239} {"train_loss": -26.195423126220703, "global_step": 351850, "epoch": 4239} {"train_loss": -25.7613468170166, "global_step": 351851, "epoch": 4239} {"train_loss": -25.97657585144043, "global_step": 351852, "epoch": 4239} {"train_loss": -25.9300537109375, "global_step": 351853, "epoch": 4239} {"train_loss": -25.846242904663086, "global_step": 351854, "epoch": 4239} {"train_loss": -26.289581298828125, "global_step": 351855, "epoch": 4239} {"train_loss": -26.09112548828125, "global_step": 351856, "epoch": 4239} {"train_loss": -26.121915817260742, "global_step": 351857, "epoch": 4239} {"train_loss": -26.011938095092773, "global_step": 351858, "epoch": 4239} {"train_loss": -25.862863540649414, "global_step": 351859, "epoch": 4239} {"train_loss": -26.189258575439453, "global_step": 351860, "epoch": 4239} {"train_loss": -26.055530548095703, "global_step": 351861, "epoch": 4239} {"train_loss": -26.114013671875, "global_step": 351862, "epoch": 4239} {"train_loss": -26.299787521362305, "global_step": 351863, "epoch": 4239} {"train_loss": -26.10967445373535, "global_step": 351864, "epoch": 4239} {"train_loss": -26.3284912109375, "global_step": 351865, "epoch": 4239} {"train_loss": -26.308454513549805, "global_step": 351866, "epoch": 4239} {"train_loss": -26.134891510009766, "global_step": 351867, "epoch": 4239} {"train_loss": -26.3409423828125, "global_step": 351868, "epoch": 4239} {"train_loss": -26.460418701171875, "global_step": 351869, "epoch": 4239} {"train_loss": -26.33603286743164, "global_step": 351870, "epoch": 4239} {"train_loss": -26.002887725830078, "global_step": 351871, "epoch": 4239} {"train_loss": -26.092792510986328, "global_step": 351872, "epoch": 4239} {"train_loss": -26.50581932067871, "global_step": 351873, "epoch": 4239} {"train_loss": -26.421186447143555, "global_step": 351874, "epoch": 4239} {"train_loss": -26.344562530517578, "global_step": 351875, "epoch": 4239} {"train_loss": -26.632831573486328, "global_step": 351876, "epoch": 4239} {"train_loss": -26.414947509765625, "global_step": 351877, "epoch": 4239} {"train_loss": -26.561569213867188, "global_step": 351878, "epoch": 4239} {"train_loss": -26.50888442993164, "global_step": 351879, "epoch": 4239} {"train_loss": -26.2064151763916, "global_step": 351880, "epoch": 4239} {"train_loss": -26.390182495117188, "global_step": 351881, "epoch": 4239} {"train_loss": -26.148778915405273, "global_step": 351882, "epoch": 4239} {"train_loss": -26.32069206237793, "global_step": 351883, "epoch": 4239} {"train_loss": -26.017730712890625, "global_step": 351884, "epoch": 4239} {"train_loss": -26.438337326049805, "global_step": 351885, "epoch": 4239} {"train_loss": -26.53101921081543, "global_step": 351886, "epoch": 4239} {"train_loss": -26.420812606811523, "global_step": 351887, "epoch": 4239} {"train_loss": -26.10563087463379, "global_step": 351888, "epoch": 4239} {"train_loss": -26.639862060546875, "global_step": 351889, "epoch": 4239} {"train_loss": -26.351781845092773, "global_step": 351890, "epoch": 4239} {"train_loss": -26.082815170288086, "global_step": 351891, "epoch": 4239} {"train_loss": -26.369321823120117, "global_step": 351892, "epoch": 4239} {"train_loss": -26.340314865112305, "global_step": 351893, "epoch": 4239} {"train_loss": -25.977497100830078, "global_step": 351894, "epoch": 4239} {"train_loss": -26.355274200439453, "global_step": 351895, "epoch": 4239} {"train_loss": -26.278812408447266, "global_step": 351896, "epoch": 4239} {"train_loss": -26.290637969970703, "global_step": 351897, "epoch": 4239} {"train_loss": -26.333728790283203, "global_step": 351898, "epoch": 4239} {"train_loss": -26.536108016967773, "global_step": 351899, "epoch": 4239} {"train_loss": -26.243432998657227, "global_step": 351900, "epoch": 4239} {"train_loss": -26.08319091796875, "global_step": 351901, "epoch": 4239} {"train_loss": -26.03339958190918, "global_step": 351902, "epoch": 4239} {"train_loss": -26.110809326171875, "global_step": 351903, "epoch": 4239} {"train_loss": -26.174884796142578, "global_step": 351904, "epoch": 4239} {"train_loss": -26.29328727722168, "global_step": 351905, "epoch": 4239} {"train_loss": -26.352811813354492, "global_step": 351906, "epoch": 4239} {"train_loss": -26.46479606628418, "global_step": 351907, "epoch": 4239} {"train_loss": -26.6900634765625, "global_step": 351908, "epoch": 4239} {"train_loss": -26.02662467956543, "global_step": 351909, "epoch": 4239} {"train_loss": -26.682575225830078, "global_step": 351910, "epoch": 4239} {"train_loss": -25.964391708374023, "global_step": 351911, "epoch": 4239} {"train_loss": -26.1200008392334, "global_step": 351912, "epoch": 4239} {"train_loss": -26.26837158203125, "global_step": 351913, "epoch": 4239} {"train_loss": -26.5426025390625, "global_step": 351914, "epoch": 4239} {"train_loss": -26.143468856811523, "global_step": 351915, "epoch": 4239} {"train_loss": -26.499235153198242, "global_step": 351916, "epoch": 4239} {"train_loss": -26.076669692993164, "global_step": 351917, "epoch": 4239} {"train_loss": -26.263446807861328, "global_step": 351918, "epoch": 4239} {"train_loss": -26.182651611695807, "global_step": 351919, "epoch": 4239, "val_loss": 6686847.0} {"train_loss": -25.798786163330078, "global_step": 351920, "epoch": 4240} {"train_loss": -25.90785026550293, "global_step": 351921, "epoch": 4240} {"train_loss": -26.223575592041016, "global_step": 351922, "epoch": 4240} {"train_loss": -25.992450714111328, "global_step": 351923, "epoch": 4240} {"train_loss": -25.902328491210938, "global_step": 351924, "epoch": 4240} {"train_loss": -25.938739776611328, "global_step": 351925, "epoch": 4240} {"train_loss": -25.634687423706055, "global_step": 351926, "epoch": 4240} {"train_loss": -26.177366256713867, "global_step": 351927, "epoch": 4240} {"train_loss": -26.11745262145996, "global_step": 351928, "epoch": 4240} {"train_loss": -26.014638900756836, "global_step": 351929, "epoch": 4240} {"train_loss": -26.085607528686523, "global_step": 351930, "epoch": 4240} {"train_loss": -26.005329132080078, "global_step": 351931, "epoch": 4240} {"train_loss": -26.276931762695312, "global_step": 351932, "epoch": 4240} {"train_loss": -26.05207633972168, "global_step": 351933, "epoch": 4240} {"train_loss": -26.208194732666016, "global_step": 351934, "epoch": 4240} {"train_loss": -26.351831436157227, "global_step": 351935, "epoch": 4240} {"train_loss": -25.931659698486328, "global_step": 351936, "epoch": 4240} {"train_loss": -26.24517250061035, "global_step": 351937, "epoch": 4240} {"train_loss": -26.004785537719727, "global_step": 351938, "epoch": 4240} {"train_loss": -26.4454345703125, "global_step": 351939, "epoch": 4240} {"train_loss": -25.7036075592041, "global_step": 351940, "epoch": 4240} {"train_loss": -26.222558975219727, "global_step": 351941, "epoch": 4240} {"train_loss": -26.157581329345703, "global_step": 351942, "epoch": 4240} {"train_loss": -26.164350509643555, "global_step": 351943, "epoch": 4240} {"train_loss": -26.39200210571289, "global_step": 351944, "epoch": 4240} {"train_loss": -26.235254287719727, "global_step": 351945, "epoch": 4240} {"train_loss": -26.24886131286621, "global_step": 351946, "epoch": 4240} {"train_loss": -26.272581100463867, "global_step": 351947, "epoch": 4240} {"train_loss": -26.09454917907715, "global_step": 351948, "epoch": 4240} {"train_loss": -26.406925201416016, "global_step": 351949, "epoch": 4240} {"train_loss": -26.05985450744629, "global_step": 351950, "epoch": 4240} {"train_loss": -26.288211822509766, "global_step": 351951, "epoch": 4240} {"train_loss": -26.21135902404785, "global_step": 351952, "epoch": 4240} {"train_loss": -26.09455680847168, "global_step": 351953, "epoch": 4240} {"train_loss": -26.752948760986328, "global_step": 351954, "epoch": 4240} {"train_loss": -26.20391845703125, "global_step": 351955, "epoch": 4240} {"train_loss": -26.02996826171875, "global_step": 351956, "epoch": 4240} {"train_loss": -26.06460952758789, "global_step": 351957, "epoch": 4240} {"train_loss": -26.377058029174805, "global_step": 351958, "epoch": 4240} {"train_loss": -26.457168579101562, "global_step": 351959, "epoch": 4240} {"train_loss": -26.277257919311523, "global_step": 351960, "epoch": 4240} {"train_loss": -25.579214096069336, "global_step": 351961, "epoch": 4240} {"train_loss": -25.873083114624023, "global_step": 351962, "epoch": 4240} {"train_loss": -25.79859733581543, "global_step": 351963, "epoch": 4240} {"train_loss": -25.93434715270996, "global_step": 351964, "epoch": 4240} {"train_loss": -25.99055290222168, "global_step": 351965, "epoch": 4240} {"train_loss": -26.306140899658203, "global_step": 351966, "epoch": 4240} {"train_loss": -26.250532150268555, "global_step": 351967, "epoch": 4240} {"train_loss": -26.335412979125977, "global_step": 351968, "epoch": 4240} {"train_loss": -26.0019588470459, "global_step": 351969, "epoch": 4240} {"train_loss": -26.235849380493164, "global_step": 351970, "epoch": 4240} {"train_loss": -26.6878719329834, "global_step": 351971, "epoch": 4240} {"train_loss": -26.22884178161621, "global_step": 351972, "epoch": 4240} {"train_loss": -26.398035049438477, "global_step": 351973, "epoch": 4240} {"train_loss": -26.396076202392578, "global_step": 351974, "epoch": 4240} {"train_loss": -26.894775390625, "global_step": 351975, "epoch": 4240} {"train_loss": -26.358367919921875, "global_step": 351976, "epoch": 4240} {"train_loss": -26.017480850219727, "global_step": 351977, "epoch": 4240} {"train_loss": -26.08408546447754, "global_step": 351978, "epoch": 4240} {"train_loss": -26.082914352416992, "global_step": 351979, "epoch": 4240} {"train_loss": -26.367801666259766, "global_step": 351980, "epoch": 4240} {"train_loss": -26.224939346313477, "global_step": 351981, "epoch": 4240} {"train_loss": -26.24820899963379, "global_step": 351982, "epoch": 4240} {"train_loss": -26.437061309814453, "global_step": 351983, "epoch": 4240} {"train_loss": -26.354047775268555, "global_step": 351984, "epoch": 4240} {"train_loss": -26.291095733642578, "global_step": 351985, "epoch": 4240} {"train_loss": -26.209264755249023, "global_step": 351986, "epoch": 4240} {"train_loss": -26.21441650390625, "global_step": 351987, "epoch": 4240} {"train_loss": -26.210208892822266, "global_step": 351988, "epoch": 4240} {"train_loss": -26.164337158203125, "global_step": 351989, "epoch": 4240} {"train_loss": -26.196691513061523, "global_step": 351990, "epoch": 4240} {"train_loss": -26.426177978515625, "global_step": 351991, "epoch": 4240} {"train_loss": -26.243087768554688, "global_step": 351992, "epoch": 4240} {"train_loss": -26.142337799072266, "global_step": 351993, "epoch": 4240} {"train_loss": -25.98779296875, "global_step": 351994, "epoch": 4240} {"train_loss": -25.99006462097168, "global_step": 351995, "epoch": 4240} {"train_loss": -26.452417373657227, "global_step": 351996, "epoch": 4240} {"train_loss": -26.091815948486328, "global_step": 351997, "epoch": 4240} {"train_loss": -26.485675811767578, "global_step": 351998, "epoch": 4240} {"train_loss": -25.9946231842041, "global_step": 351999, "epoch": 4240} {"train_loss": -26.295236587524414, "global_step": 352000, "epoch": 4240} {"train_loss": -26.281885147094727, "global_step": 352001, "epoch": 4240} {"train_loss": -26.1853182229651, "global_step": 352002, "epoch": 4240, "val_loss": 6678110.0} {"train_loss": -25.42356300354004, "global_step": 352003, "epoch": 4241} {"train_loss": -25.365896224975586, "global_step": 352004, "epoch": 4241} {"train_loss": -24.91608238220215, "global_step": 352005, "epoch": 4241} {"train_loss": -25.79804039001465, "global_step": 352006, "epoch": 4241} {"train_loss": -25.288835525512695, "global_step": 352007, "epoch": 4241} {"train_loss": -24.814146041870117, "global_step": 352008, "epoch": 4241} {"train_loss": -26.032262802124023, "global_step": 352009, "epoch": 4241} {"train_loss": -25.612751007080078, "global_step": 352010, "epoch": 4241} {"train_loss": -25.694421768188477, "global_step": 352011, "epoch": 4241} {"train_loss": -25.618459701538086, "global_step": 352012, "epoch": 4241} {"train_loss": -25.57395362854004, "global_step": 352013, "epoch": 4241} {"train_loss": -25.427444458007812, "global_step": 352014, "epoch": 4241} {"train_loss": -25.84058952331543, "global_step": 352015, "epoch": 4241} {"train_loss": -25.63503074645996, "global_step": 352016, "epoch": 4241} {"train_loss": -25.408618927001953, "global_step": 352017, "epoch": 4241} {"train_loss": -25.43084144592285, "global_step": 352018, "epoch": 4241} {"train_loss": -25.851287841796875, "global_step": 352019, "epoch": 4241} {"train_loss": -25.705249786376953, "global_step": 352020, "epoch": 4241} {"train_loss": -25.960163116455078, "global_step": 352021, "epoch": 4241} {"train_loss": -26.181028366088867, "global_step": 352022, "epoch": 4241} {"train_loss": -26.04429054260254, "global_step": 352023, "epoch": 4241} {"train_loss": -26.189889907836914, "global_step": 352024, "epoch": 4241} {"train_loss": -25.951557159423828, "global_step": 352025, "epoch": 4241} {"train_loss": -25.959341049194336, "global_step": 352026, "epoch": 4241} {"train_loss": -25.926401138305664, "global_step": 352027, "epoch": 4241} {"train_loss": -26.1052303314209, "global_step": 352028, "epoch": 4241} {"train_loss": -25.815759658813477, "global_step": 352029, "epoch": 4241} {"train_loss": -25.92766761779785, "global_step": 352030, "epoch": 4241} {"train_loss": -25.723623275756836, "global_step": 352031, "epoch": 4241} {"train_loss": -26.401599884033203, "global_step": 352032, "epoch": 4241} {"train_loss": -25.914575576782227, "global_step": 352033, "epoch": 4241} {"train_loss": -25.8198299407959, "global_step": 352034, "epoch": 4241} {"train_loss": -26.02911949157715, "global_step": 352035, "epoch": 4241} {"train_loss": -25.856006622314453, "global_step": 352036, "epoch": 4241} {"train_loss": -26.163557052612305, "global_step": 352037, "epoch": 4241} {"train_loss": -26.260595321655273, "global_step": 352038, "epoch": 4241} {"train_loss": -25.85186195373535, "global_step": 352039, "epoch": 4241} {"train_loss": -26.21817398071289, "global_step": 352040, "epoch": 4241} {"train_loss": -26.03373146057129, "global_step": 352041, "epoch": 4241} {"train_loss": -26.33636474609375, "global_step": 352042, "epoch": 4241} {"train_loss": -26.259923934936523, "global_step": 352043, "epoch": 4241} {"train_loss": -26.224933624267578, "global_step": 352044, "epoch": 4241} {"train_loss": -26.10434341430664, "global_step": 352045, "epoch": 4241} {"train_loss": -26.591461181640625, "global_step": 352046, "epoch": 4241} {"train_loss": -26.407567977905273, "global_step": 352047, "epoch": 4241} {"train_loss": -26.136127471923828, "global_step": 352048, "epoch": 4241} {"train_loss": -26.107873916625977, "global_step": 352049, "epoch": 4241} {"train_loss": -26.050189971923828, "global_step": 352050, "epoch": 4241} {"train_loss": -26.147403717041016, "global_step": 352051, "epoch": 4241} {"train_loss": -26.161880493164062, "global_step": 352052, "epoch": 4241} {"train_loss": -26.15809440612793, "global_step": 352053, "epoch": 4241} {"train_loss": -25.909637451171875, "global_step": 352054, "epoch": 4241} {"train_loss": -26.145063400268555, "global_step": 352055, "epoch": 4241} {"train_loss": -26.0231876373291, "global_step": 352056, "epoch": 4241} {"train_loss": -26.214569091796875, "global_step": 352057, "epoch": 4241} {"train_loss": -26.368335723876953, "global_step": 352058, "epoch": 4241} {"train_loss": -26.364469528198242, "global_step": 352059, "epoch": 4241} {"train_loss": -26.58331298828125, "global_step": 352060, "epoch": 4241} {"train_loss": -26.148086547851562, "global_step": 352061, "epoch": 4241} {"train_loss": -26.489103317260742, "global_step": 352062, "epoch": 4241} {"train_loss": -26.58997917175293, "global_step": 352063, "epoch": 4241} {"train_loss": -25.90142822265625, "global_step": 352064, "epoch": 4241} {"train_loss": -26.282663345336914, "global_step": 352065, "epoch": 4241} {"train_loss": -26.642675399780273, "global_step": 352066, "epoch": 4241} {"train_loss": -26.1622314453125, "global_step": 352067, "epoch": 4241} {"train_loss": -26.4024600982666, "global_step": 352068, "epoch": 4241} {"train_loss": -26.1483211517334, "global_step": 352069, "epoch": 4241} {"train_loss": -26.13525390625, "global_step": 352070, "epoch": 4241} {"train_loss": -26.072019577026367, "global_step": 352071, "epoch": 4241} {"train_loss": -25.940887451171875, "global_step": 352072, "epoch": 4241} {"train_loss": -25.2358455657959, "global_step": 352073, "epoch": 4241} {"train_loss": -25.942529678344727, "global_step": 352074, "epoch": 4241} {"train_loss": -25.349042892456055, "global_step": 352075, "epoch": 4241} {"train_loss": -25.971302032470703, "global_step": 352076, "epoch": 4241} {"train_loss": -26.07305908203125, "global_step": 352077, "epoch": 4241} {"train_loss": -25.96868324279785, "global_step": 352078, "epoch": 4241} {"train_loss": -25.96707534790039, "global_step": 352079, "epoch": 4241} {"train_loss": -26.010547637939453, "global_step": 352080, "epoch": 4241} {"train_loss": -25.97110366821289, "global_step": 352081, "epoch": 4241} {"train_loss": -26.0521240234375, "global_step": 352082, "epoch": 4241} {"train_loss": -26.366540908813477, "global_step": 352083, "epoch": 4241} {"train_loss": -25.8245792388916, "global_step": 352084, "epoch": 4241} {"train_loss": -25.966898768781178, "global_step": 352085, "epoch": 4241, "val_loss": 6648954.0} {"train_loss": -25.381668090820312, "global_step": 352086, "epoch": 4242} {"train_loss": -25.764541625976562, "global_step": 352087, "epoch": 4242} {"train_loss": -25.659269332885742, "global_step": 352088, "epoch": 4242} {"train_loss": -25.58418083190918, "global_step": 352089, "epoch": 4242} {"train_loss": -25.398740768432617, "global_step": 352090, "epoch": 4242} {"train_loss": -25.7723388671875, "global_step": 352091, "epoch": 4242} {"train_loss": -25.14004898071289, "global_step": 352092, "epoch": 4242} {"train_loss": -25.94051170349121, "global_step": 352093, "epoch": 4242} {"train_loss": -25.52617073059082, "global_step": 352094, "epoch": 4242} {"train_loss": -25.656625747680664, "global_step": 352095, "epoch": 4242} {"train_loss": -25.64522361755371, "global_step": 352096, "epoch": 4242} {"train_loss": -25.685821533203125, "global_step": 352097, "epoch": 4242} {"train_loss": -25.948394775390625, "global_step": 352098, "epoch": 4242} {"train_loss": -25.639158248901367, "global_step": 352099, "epoch": 4242} {"train_loss": -26.19454002380371, "global_step": 352100, "epoch": 4242} {"train_loss": -25.97292137145996, "global_step": 352101, "epoch": 4242} {"train_loss": -26.1048526763916, "global_step": 352102, "epoch": 4242} {"train_loss": -25.57950210571289, "global_step": 352103, "epoch": 4242} {"train_loss": -26.075109481811523, "global_step": 352104, "epoch": 4242} {"train_loss": -26.059894561767578, "global_step": 352105, "epoch": 4242} {"train_loss": -26.486135482788086, "global_step": 352106, "epoch": 4242} {"train_loss": -25.975147247314453, "global_step": 352107, "epoch": 4242} {"train_loss": -26.0959529876709, "global_step": 352108, "epoch": 4242} {"train_loss": -26.54791831970215, "global_step": 352109, "epoch": 4242} {"train_loss": -25.908557891845703, "global_step": 352110, "epoch": 4242} {"train_loss": -25.858097076416016, "global_step": 352111, "epoch": 4242} {"train_loss": -25.799285888671875, "global_step": 352112, "epoch": 4242} {"train_loss": -26.27618408203125, "global_step": 352113, "epoch": 4242} {"train_loss": -26.48198890686035, "global_step": 352114, "epoch": 4242} {"train_loss": -25.878559112548828, "global_step": 352115, "epoch": 4242} {"train_loss": -25.851703643798828, "global_step": 352116, "epoch": 4242} {"train_loss": -26.3256893157959, "global_step": 352117, "epoch": 4242} {"train_loss": -26.145751953125, "global_step": 352118, "epoch": 4242} {"train_loss": -26.368457794189453, "global_step": 352119, "epoch": 4242} {"train_loss": -26.17896842956543, "global_step": 352120, "epoch": 4242} {"train_loss": -25.91688346862793, "global_step": 352121, "epoch": 4242} {"train_loss": -26.24517822265625, "global_step": 352122, "epoch": 4242} {"train_loss": -26.385944366455078, "global_step": 352123, "epoch": 4242} {"train_loss": -26.516254425048828, "global_step": 352124, "epoch": 4242} {"train_loss": -26.6762638092041, "global_step": 352125, "epoch": 4242} {"train_loss": -26.179798126220703, "global_step": 352126, "epoch": 4242} {"train_loss": -26.418249130249023, "global_step": 352127, "epoch": 4242} {"train_loss": -26.081928253173828, "global_step": 352128, "epoch": 4242} {"train_loss": -26.20241355895996, "global_step": 352129, "epoch": 4242} {"train_loss": -26.363264083862305, "global_step": 352130, "epoch": 4242} {"train_loss": -26.301471710205078, "global_step": 352131, "epoch": 4242} {"train_loss": -26.5303955078125, "global_step": 352132, "epoch": 4242} {"train_loss": -26.109460830688477, "global_step": 352133, "epoch": 4242} {"train_loss": -25.677515029907227, "global_step": 352134, "epoch": 4242} {"train_loss": -26.162267684936523, "global_step": 352135, "epoch": 4242} {"train_loss": -26.281248092651367, "global_step": 352136, "epoch": 4242} {"train_loss": -26.289936065673828, "global_step": 352137, "epoch": 4242} {"train_loss": -26.488428115844727, "global_step": 352138, "epoch": 4242} {"train_loss": -25.942615509033203, "global_step": 352139, "epoch": 4242} {"train_loss": -25.950719833374023, "global_step": 352140, "epoch": 4242} {"train_loss": -26.275787353515625, "global_step": 352141, "epoch": 4242} {"train_loss": -26.257801055908203, "global_step": 352142, "epoch": 4242} {"train_loss": -26.12371253967285, "global_step": 352143, "epoch": 4242} {"train_loss": -26.32599449157715, "global_step": 352144, "epoch": 4242} {"train_loss": -26.144872665405273, "global_step": 352145, "epoch": 4242} {"train_loss": -26.23809242248535, "global_step": 352146, "epoch": 4242} {"train_loss": -26.100088119506836, "global_step": 352147, "epoch": 4242} {"train_loss": -26.046234130859375, "global_step": 352148, "epoch": 4242} {"train_loss": -26.16643714904785, "global_step": 352149, "epoch": 4242} {"train_loss": -25.861474990844727, "global_step": 352150, "epoch": 4242} {"train_loss": -25.847448348999023, "global_step": 352151, "epoch": 4242} {"train_loss": -25.702850341796875, "global_step": 352152, "epoch": 4242} {"train_loss": -26.289350509643555, "global_step": 352153, "epoch": 4242} {"train_loss": -25.81145668029785, "global_step": 352154, "epoch": 4242} {"train_loss": -26.309736251831055, "global_step": 352155, "epoch": 4242} {"train_loss": -26.11366081237793, "global_step": 352156, "epoch": 4242} {"train_loss": -26.210468292236328, "global_step": 352157, "epoch": 4242} {"train_loss": -25.948993682861328, "global_step": 352158, "epoch": 4242} {"train_loss": -26.10882568359375, "global_step": 352159, "epoch": 4242} {"train_loss": -26.04524040222168, "global_step": 352160, "epoch": 4242} {"train_loss": -26.590961456298828, "global_step": 352161, "epoch": 4242} {"train_loss": -26.405963897705078, "global_step": 352162, "epoch": 4242} {"train_loss": -26.25701332092285, "global_step": 352163, "epoch": 4242} {"train_loss": -26.26654624938965, "global_step": 352164, "epoch": 4242} {"train_loss": -26.07488441467285, "global_step": 352165, "epoch": 4242} {"train_loss": -26.017614364624023, "global_step": 352166, "epoch": 4242} {"train_loss": -26.216724395751953, "global_step": 352167, "epoch": 4242} {"train_loss": -26.07661681577384, "global_step": 352168, "epoch": 4242, "val_loss": 6757907.0} {"train_loss": -25.51615333557129, "global_step": 352169, "epoch": 4243} {"train_loss": -25.644689559936523, "global_step": 352170, "epoch": 4243} {"train_loss": -25.6276912689209, "global_step": 352171, "epoch": 4243} {"train_loss": -25.91229248046875, "global_step": 352172, "epoch": 4243} {"train_loss": -25.593740463256836, "global_step": 352173, "epoch": 4243} {"train_loss": -25.758716583251953, "global_step": 352174, "epoch": 4243} {"train_loss": -25.820470809936523, "global_step": 352175, "epoch": 4243} {"train_loss": -25.9714412689209, "global_step": 352176, "epoch": 4243} {"train_loss": -25.894800186157227, "global_step": 352177, "epoch": 4243} {"train_loss": -25.789920806884766, "global_step": 352178, "epoch": 4243} {"train_loss": -26.24698257446289, "global_step": 352179, "epoch": 4243} {"train_loss": -25.413915634155273, "global_step": 352180, "epoch": 4243} {"train_loss": -25.827863693237305, "global_step": 352181, "epoch": 4243} {"train_loss": -26.223852157592773, "global_step": 352182, "epoch": 4243} {"train_loss": -25.880285263061523, "global_step": 352183, "epoch": 4243} {"train_loss": -26.22672462463379, "global_step": 352184, "epoch": 4243} {"train_loss": -25.993045806884766, "global_step": 352185, "epoch": 4243} {"train_loss": -26.256107330322266, "global_step": 352186, "epoch": 4243} {"train_loss": -26.477880477905273, "global_step": 352187, "epoch": 4243} {"train_loss": -25.972064971923828, "global_step": 352188, "epoch": 4243} {"train_loss": -25.626916885375977, "global_step": 352189, "epoch": 4243} {"train_loss": -26.18572998046875, "global_step": 352190, "epoch": 4243} {"train_loss": -26.307849884033203, "global_step": 352191, "epoch": 4243} {"train_loss": -26.503406524658203, "global_step": 352192, "epoch": 4243} {"train_loss": -26.325347900390625, "global_step": 352193, "epoch": 4243} {"train_loss": -26.427860260009766, "global_step": 352194, "epoch": 4243} {"train_loss": -26.033857345581055, "global_step": 352195, "epoch": 4243} {"train_loss": -26.278661727905273, "global_step": 352196, "epoch": 4243} {"train_loss": -26.43450927734375, "global_step": 352197, "epoch": 4243} {"train_loss": -25.968114852905273, "global_step": 352198, "epoch": 4243} {"train_loss": -26.03509521484375, "global_step": 352199, "epoch": 4243} {"train_loss": -26.305500030517578, "global_step": 352200, "epoch": 4243} {"train_loss": -26.14435386657715, "global_step": 352201, "epoch": 4243} {"train_loss": -26.476858139038086, "global_step": 352202, "epoch": 4243} {"train_loss": -26.342041015625, "global_step": 352203, "epoch": 4243} {"train_loss": -26.49968910217285, "global_step": 352204, "epoch": 4243} {"train_loss": -26.5600528717041, "global_step": 352205, "epoch": 4243} {"train_loss": -25.865243911743164, "global_step": 352206, "epoch": 4243} {"train_loss": -26.492597579956055, "global_step": 352207, "epoch": 4243} {"train_loss": -26.238250732421875, "global_step": 352208, "epoch": 4243} {"train_loss": -26.363666534423828, "global_step": 352209, "epoch": 4243} {"train_loss": -26.196929931640625, "global_step": 352210, "epoch": 4243} {"train_loss": -26.011205673217773, "global_step": 352211, "epoch": 4243} {"train_loss": -25.8575496673584, "global_step": 352212, "epoch": 4243} {"train_loss": -25.650556564331055, "global_step": 352213, "epoch": 4243} {"train_loss": -25.924482345581055, "global_step": 352214, "epoch": 4243} {"train_loss": -26.335241317749023, "global_step": 352215, "epoch": 4243} {"train_loss": -25.713720321655273, "global_step": 352216, "epoch": 4243} {"train_loss": -25.70367431640625, "global_step": 352217, "epoch": 4243} {"train_loss": -25.646875381469727, "global_step": 352218, "epoch": 4243} {"train_loss": -26.019489288330078, "global_step": 352219, "epoch": 4243} {"train_loss": -26.36421775817871, "global_step": 352220, "epoch": 4243} {"train_loss": -25.915430068969727, "global_step": 352221, "epoch": 4243} {"train_loss": -26.36676597595215, "global_step": 352222, "epoch": 4243} {"train_loss": -25.717313766479492, "global_step": 352223, "epoch": 4243} {"train_loss": -26.29669761657715, "global_step": 352224, "epoch": 4243} {"train_loss": -26.0800724029541, "global_step": 352225, "epoch": 4243} {"train_loss": -26.349252700805664, "global_step": 352226, "epoch": 4243} {"train_loss": -26.201894760131836, "global_step": 352227, "epoch": 4243} {"train_loss": -26.024572372436523, "global_step": 352228, "epoch": 4243} {"train_loss": -25.925140380859375, "global_step": 352229, "epoch": 4243} {"train_loss": -26.271869659423828, "global_step": 352230, "epoch": 4243} {"train_loss": -26.27317237854004, "global_step": 352231, "epoch": 4243} {"train_loss": -26.270801544189453, "global_step": 352232, "epoch": 4243} {"train_loss": -26.80047035217285, "global_step": 352233, "epoch": 4243} {"train_loss": -26.147680282592773, "global_step": 352234, "epoch": 4243} {"train_loss": -26.0638427734375, "global_step": 352235, "epoch": 4243} {"train_loss": -26.185327529907227, "global_step": 352236, "epoch": 4243} {"train_loss": -25.838239669799805, "global_step": 352237, "epoch": 4243} {"train_loss": -26.278608322143555, "global_step": 352238, "epoch": 4243} {"train_loss": -26.359167098999023, "global_step": 352239, "epoch": 4243} {"train_loss": -26.132659912109375, "global_step": 352240, "epoch": 4243} {"train_loss": -26.338245391845703, "global_step": 352241, "epoch": 4243} {"train_loss": -26.679182052612305, "global_step": 352242, "epoch": 4243} {"train_loss": -26.22281837463379, "global_step": 352243, "epoch": 4243} {"train_loss": -26.420822143554688, "global_step": 352244, "epoch": 4243} {"train_loss": -26.18769645690918, "global_step": 352245, "epoch": 4243} {"train_loss": -26.298276901245117, "global_step": 352246, "epoch": 4243} {"train_loss": -26.3082275390625, "global_step": 352247, "epoch": 4243} {"train_loss": -25.800344467163086, "global_step": 352248, "epoch": 4243} {"train_loss": -25.563873291015625, "global_step": 352249, "epoch": 4243} {"train_loss": -25.645233154296875, "global_step": 352250, "epoch": 4243} {"train_loss": -26.09458569446242, "global_step": 352251, "epoch": 4243, "val_loss": 6698119.5} {"train_loss": -18.07880973815918, "global_step": 352252, "epoch": 4244} {"train_loss": -21.311731338500977, "global_step": 352253, "epoch": 4244} {"train_loss": -21.07212257385254, "global_step": 352254, "epoch": 4244} {"train_loss": -22.945697784423828, "global_step": 352255, "epoch": 4244} {"train_loss": -21.950693130493164, "global_step": 352256, "epoch": 4244} {"train_loss": -23.54311752319336, "global_step": 352257, "epoch": 4244} {"train_loss": -23.83124351501465, "global_step": 352258, "epoch": 4244} {"train_loss": -23.3963680267334, "global_step": 352259, "epoch": 4244} {"train_loss": -23.73518943786621, "global_step": 352260, "epoch": 4244} {"train_loss": -24.379276275634766, "global_step": 352261, "epoch": 4244} {"train_loss": -24.3203067779541, "global_step": 352262, "epoch": 4244} {"train_loss": -23.98644256591797, "global_step": 352263, "epoch": 4244} {"train_loss": -23.81218910217285, "global_step": 352264, "epoch": 4244} {"train_loss": -24.043533325195312, "global_step": 352265, "epoch": 4244} {"train_loss": -24.212751388549805, "global_step": 352266, "epoch": 4244} {"train_loss": -24.190082550048828, "global_step": 352267, "epoch": 4244} {"train_loss": -24.386037826538086, "global_step": 352268, "epoch": 4244} {"train_loss": -24.509918212890625, "global_step": 352269, "epoch": 4244} {"train_loss": -24.280899047851562, "global_step": 352270, "epoch": 4244} {"train_loss": -24.337818145751953, "global_step": 352271, "epoch": 4244} {"train_loss": -24.547266006469727, "global_step": 352272, "epoch": 4244} {"train_loss": -24.36086082458496, "global_step": 352273, "epoch": 4244} {"train_loss": -24.53525733947754, "global_step": 352274, "epoch": 4244} {"train_loss": -24.614187240600586, "global_step": 352275, "epoch": 4244} {"train_loss": -25.007034301757812, "global_step": 352276, "epoch": 4244} {"train_loss": -24.633989334106445, "global_step": 352277, "epoch": 4244} {"train_loss": -24.69561195373535, "global_step": 352278, "epoch": 4244} {"train_loss": -24.742578506469727, "global_step": 352279, "epoch": 4244} {"train_loss": -25.125850677490234, "global_step": 352280, "epoch": 4244} {"train_loss": -24.847440719604492, "global_step": 352281, "epoch": 4244} {"train_loss": -24.88543128967285, "global_step": 352282, "epoch": 4244} {"train_loss": -25.09571647644043, "global_step": 352283, "epoch": 4244} {"train_loss": -25.198955535888672, "global_step": 352284, "epoch": 4244} {"train_loss": -25.289270401000977, "global_step": 352285, "epoch": 4244} {"train_loss": -25.25457763671875, "global_step": 352286, "epoch": 4244} {"train_loss": -25.400510787963867, "global_step": 352287, "epoch": 4244} {"train_loss": -25.308725357055664, "global_step": 352288, "epoch": 4244} {"train_loss": -25.284902572631836, "global_step": 352289, "epoch": 4244} {"train_loss": -25.3819580078125, "global_step": 352290, "epoch": 4244} {"train_loss": -25.4190731048584, "global_step": 352291, "epoch": 4244} {"train_loss": -25.389394760131836, "global_step": 352292, "epoch": 4244} {"train_loss": -25.38322639465332, "global_step": 352293, "epoch": 4244} {"train_loss": -25.484960556030273, "global_step": 352294, "epoch": 4244} {"train_loss": -25.636707305908203, "global_step": 352295, "epoch": 4244} {"train_loss": -25.754384994506836, "global_step": 352296, "epoch": 4244} {"train_loss": -25.780004501342773, "global_step": 352297, "epoch": 4244} {"train_loss": -25.416248321533203, "global_step": 352298, "epoch": 4244} {"train_loss": -25.881200790405273, "global_step": 352299, "epoch": 4244} {"train_loss": -25.840423583984375, "global_step": 352300, "epoch": 4244} {"train_loss": -25.4581356048584, "global_step": 352301, "epoch": 4244} {"train_loss": -25.901660919189453, "global_step": 352302, "epoch": 4244} {"train_loss": -25.897912979125977, "global_step": 352303, "epoch": 4244} {"train_loss": -26.048877716064453, "global_step": 352304, "epoch": 4244} {"train_loss": -25.819692611694336, "global_step": 352305, "epoch": 4244} {"train_loss": -25.84613037109375, "global_step": 352306, "epoch": 4244} {"train_loss": -25.721036911010742, "global_step": 352307, "epoch": 4244} {"train_loss": -26.204669952392578, "global_step": 352308, "epoch": 4244} {"train_loss": -26.0086612701416, "global_step": 352309, "epoch": 4244} {"train_loss": -26.1939697265625, "global_step": 352310, "epoch": 4244} {"train_loss": -26.168127059936523, "global_step": 352311, "epoch": 4244} {"train_loss": -26.05866813659668, "global_step": 352312, "epoch": 4244} {"train_loss": -26.237668991088867, "global_step": 352313, "epoch": 4244} {"train_loss": -26.232397079467773, "global_step": 352314, "epoch": 4244} {"train_loss": -26.043664932250977, "global_step": 352315, "epoch": 4244} {"train_loss": -26.178808212280273, "global_step": 352316, "epoch": 4244} {"train_loss": -26.107166290283203, "global_step": 352317, "epoch": 4244} {"train_loss": -26.397790908813477, "global_step": 352318, "epoch": 4244} {"train_loss": -26.19698143005371, "global_step": 352319, "epoch": 4244} {"train_loss": -26.599390029907227, "global_step": 352320, "epoch": 4244} {"train_loss": -26.2337703704834, "global_step": 352321, "epoch": 4244} {"train_loss": -26.068281173706055, "global_step": 352322, "epoch": 4244} {"train_loss": -26.244068145751953, "global_step": 352323, "epoch": 4244} {"train_loss": -26.34711265563965, "global_step": 352324, "epoch": 4244} {"train_loss": -26.377197265625, "global_step": 352325, "epoch": 4244} {"train_loss": -26.483495712280273, "global_step": 352326, "epoch": 4244} {"train_loss": -26.33941650390625, "global_step": 352327, "epoch": 4244} {"train_loss": -26.53533935546875, "global_step": 352328, "epoch": 4244} {"train_loss": -26.23200035095215, "global_step": 352329, "epoch": 4244} {"train_loss": -25.827911376953125, "global_step": 352330, "epoch": 4244} {"train_loss": -26.23837661743164, "global_step": 352331, "epoch": 4244} {"train_loss": -26.028120040893555, "global_step": 352332, "epoch": 4244} {"train_loss": -26.619476318359375, "global_step": 352333, "epoch": 4244} {"train_loss": -25.116361181420015, "global_step": 352334, "epoch": 4244, "val_loss": 7061991.0} {"train_loss": -24.433563232421875, "global_step": 352335, "epoch": 4245} {"train_loss": -22.731420516967773, "global_step": 352336, "epoch": 4245} {"train_loss": -25.031835556030273, "global_step": 352337, "epoch": 4245} {"train_loss": -25.24941062927246, "global_step": 352338, "epoch": 4245} {"train_loss": -24.530363082885742, "global_step": 352339, "epoch": 4245} {"train_loss": -24.993417739868164, "global_step": 352340, "epoch": 4245} {"train_loss": -24.590604782104492, "global_step": 352341, "epoch": 4245} {"train_loss": -25.332059860229492, "global_step": 352342, "epoch": 4245} {"train_loss": -25.206632614135742, "global_step": 352343, "epoch": 4245} {"train_loss": -25.137475967407227, "global_step": 352344, "epoch": 4245} {"train_loss": -25.341941833496094, "global_step": 352345, "epoch": 4245} {"train_loss": -25.26423454284668, "global_step": 352346, "epoch": 4245} {"train_loss": -25.4216251373291, "global_step": 352347, "epoch": 4245} {"train_loss": -25.407682418823242, "global_step": 352348, "epoch": 4245} {"train_loss": -25.64290428161621, "global_step": 352349, "epoch": 4245} {"train_loss": -25.559606552124023, "global_step": 352350, "epoch": 4245} {"train_loss": -25.299352645874023, "global_step": 352351, "epoch": 4245} {"train_loss": -25.57660484313965, "global_step": 352352, "epoch": 4245} {"train_loss": -25.485013961791992, "global_step": 352353, "epoch": 4245} {"train_loss": -25.528499603271484, "global_step": 352354, "epoch": 4245} {"train_loss": -25.602705001831055, "global_step": 352355, "epoch": 4245} {"train_loss": -25.670576095581055, "global_step": 352356, "epoch": 4245} {"train_loss": -25.265138626098633, "global_step": 352357, "epoch": 4245} {"train_loss": -25.835031509399414, "global_step": 352358, "epoch": 4245} {"train_loss": -25.850866317749023, "global_step": 352359, "epoch": 4245} {"train_loss": -25.75496482849121, "global_step": 352360, "epoch": 4245} {"train_loss": -25.66361427307129, "global_step": 352361, "epoch": 4245} {"train_loss": -25.625268936157227, "global_step": 352362, "epoch": 4245} {"train_loss": -26.004459381103516, "global_step": 352363, "epoch": 4245} {"train_loss": -25.96563148498535, "global_step": 352364, "epoch": 4245} {"train_loss": -26.054208755493164, "global_step": 352365, "epoch": 4245} {"train_loss": -26.142410278320312, "global_step": 352366, "epoch": 4245} {"train_loss": -25.814374923706055, "global_step": 352367, "epoch": 4245} {"train_loss": -25.939197540283203, "global_step": 352368, "epoch": 4245} {"train_loss": -25.752063751220703, "global_step": 352369, "epoch": 4245} {"train_loss": -26.206052780151367, "global_step": 352370, "epoch": 4245} {"train_loss": -25.69190788269043, "global_step": 352371, "epoch": 4245} {"train_loss": -25.971881866455078, "global_step": 352372, "epoch": 4245} {"train_loss": -26.116180419921875, "global_step": 352373, "epoch": 4245} {"train_loss": -25.770694732666016, "global_step": 352374, "epoch": 4245} {"train_loss": -25.9566707611084, "global_step": 352375, "epoch": 4245} {"train_loss": -26.224964141845703, "global_step": 352376, "epoch": 4245} {"train_loss": -25.970966339111328, "global_step": 352377, "epoch": 4245} {"train_loss": -26.007322311401367, "global_step": 352378, "epoch": 4245} {"train_loss": -26.527135848999023, "global_step": 352379, "epoch": 4245} {"train_loss": -26.0684871673584, "global_step": 352380, "epoch": 4245} {"train_loss": -25.918710708618164, "global_step": 352381, "epoch": 4245} {"train_loss": -26.086048126220703, "global_step": 352382, "epoch": 4245} {"train_loss": -26.114776611328125, "global_step": 352383, "epoch": 4245} {"train_loss": -26.128259658813477, "global_step": 352384, "epoch": 4245} {"train_loss": -26.172760009765625, "global_step": 352385, "epoch": 4245} {"train_loss": -26.295063018798828, "global_step": 352386, "epoch": 4245} {"train_loss": -26.076135635375977, "global_step": 352387, "epoch": 4245} {"train_loss": -26.851598739624023, "global_step": 352388, "epoch": 4245} {"train_loss": -26.470762252807617, "global_step": 352389, "epoch": 4245} {"train_loss": -26.239593505859375, "global_step": 352390, "epoch": 4245} {"train_loss": -26.130054473876953, "global_step": 352391, "epoch": 4245} {"train_loss": -26.533267974853516, "global_step": 352392, "epoch": 4245} {"train_loss": -26.323339462280273, "global_step": 352393, "epoch": 4245} {"train_loss": -25.9442138671875, "global_step": 352394, "epoch": 4245} {"train_loss": -25.75372886657715, "global_step": 352395, "epoch": 4245} {"train_loss": -25.85944938659668, "global_step": 352396, "epoch": 4245} {"train_loss": -26.354846954345703, "global_step": 352397, "epoch": 4245} {"train_loss": -26.196569442749023, "global_step": 352398, "epoch": 4245} {"train_loss": -26.482437133789062, "global_step": 352399, "epoch": 4245} {"train_loss": -25.964466094970703, "global_step": 352400, "epoch": 4245} {"train_loss": -26.346769332885742, "global_step": 352401, "epoch": 4245} {"train_loss": -26.211334228515625, "global_step": 352402, "epoch": 4245} {"train_loss": -26.477603912353516, "global_step": 352403, "epoch": 4245} {"train_loss": -25.979650497436523, "global_step": 352404, "epoch": 4245} {"train_loss": -26.415220260620117, "global_step": 352405, "epoch": 4245} {"train_loss": -26.19978141784668, "global_step": 352406, "epoch": 4245} {"train_loss": -26.31464195251465, "global_step": 352407, "epoch": 4245} {"train_loss": -26.292434692382812, "global_step": 352408, "epoch": 4245} {"train_loss": -26.547536849975586, "global_step": 352409, "epoch": 4245} {"train_loss": -26.46803092956543, "global_step": 352410, "epoch": 4245} {"train_loss": -27.04266929626465, "global_step": 352411, "epoch": 4245} {"train_loss": -26.645755767822266, "global_step": 352412, "epoch": 4245} {"train_loss": -26.359786987304688, "global_step": 352413, "epoch": 4245} {"train_loss": -26.4487361907959, "global_step": 352414, "epoch": 4245} {"train_loss": -26.6956844329834, "global_step": 352415, "epoch": 4245} {"train_loss": -26.38010025024414, "global_step": 352416, "epoch": 4245} {"train_loss": -25.89169734357351, "global_step": 352417, "epoch": 4245, "val_loss": 6884787.0} {"train_loss": -25.915502548217773, "global_step": 352418, "epoch": 4246} {"train_loss": -25.75775146484375, "global_step": 352419, "epoch": 4246} {"train_loss": -26.024255752563477, "global_step": 352420, "epoch": 4246} {"train_loss": -25.9647216796875, "global_step": 352421, "epoch": 4246} {"train_loss": -26.099903106689453, "global_step": 352422, "epoch": 4246} {"train_loss": -25.276762008666992, "global_step": 352423, "epoch": 4246} {"train_loss": -25.790851593017578, "global_step": 352424, "epoch": 4246} {"train_loss": -25.887296676635742, "global_step": 352425, "epoch": 4246} {"train_loss": -26.015451431274414, "global_step": 352426, "epoch": 4246} {"train_loss": -25.782596588134766, "global_step": 352427, "epoch": 4246} {"train_loss": -25.6842041015625, "global_step": 352428, "epoch": 4246} {"train_loss": -26.233083724975586, "global_step": 352429, "epoch": 4246} {"train_loss": -25.490102767944336, "global_step": 352430, "epoch": 4246} {"train_loss": -26.120361328125, "global_step": 352431, "epoch": 4246} {"train_loss": -25.75482749938965, "global_step": 352432, "epoch": 4246} {"train_loss": -25.555795669555664, "global_step": 352433, "epoch": 4246} {"train_loss": -25.68086814880371, "global_step": 352434, "epoch": 4246} {"train_loss": -26.257705688476562, "global_step": 352435, "epoch": 4246} {"train_loss": -25.758148193359375, "global_step": 352436, "epoch": 4246} {"train_loss": -26.060779571533203, "global_step": 352437, "epoch": 4246} {"train_loss": -25.939863204956055, "global_step": 352438, "epoch": 4246} {"train_loss": -26.021841049194336, "global_step": 352439, "epoch": 4246} {"train_loss": -25.948118209838867, "global_step": 352440, "epoch": 4246} {"train_loss": -26.05083656311035, "global_step": 352441, "epoch": 4246} {"train_loss": -25.924596786499023, "global_step": 352442, "epoch": 4246} {"train_loss": -26.040128707885742, "global_step": 352443, "epoch": 4246} {"train_loss": -25.78938865661621, "global_step": 352444, "epoch": 4246} {"train_loss": -26.06397819519043, "global_step": 352445, "epoch": 4246} {"train_loss": -25.956506729125977, "global_step": 352446, "epoch": 4246} {"train_loss": -25.859724044799805, "global_step": 352447, "epoch": 4246} {"train_loss": -25.84454917907715, "global_step": 352448, "epoch": 4246} {"train_loss": -26.137739181518555, "global_step": 352449, "epoch": 4246} {"train_loss": -26.335477828979492, "global_step": 352450, "epoch": 4246} {"train_loss": -26.152423858642578, "global_step": 352451, "epoch": 4246} {"train_loss": -26.100690841674805, "global_step": 352452, "epoch": 4246} {"train_loss": -26.457752227783203, "global_step": 352453, "epoch": 4246} {"train_loss": -26.082935333251953, "global_step": 352454, "epoch": 4246} {"train_loss": -26.668561935424805, "global_step": 352455, "epoch": 4246} {"train_loss": -25.751184463500977, "global_step": 352456, "epoch": 4246} {"train_loss": -26.238428115844727, "global_step": 352457, "epoch": 4246} {"train_loss": -26.14116859436035, "global_step": 352458, "epoch": 4246} {"train_loss": -26.147785186767578, "global_step": 352459, "epoch": 4246} {"train_loss": -26.33428955078125, "global_step": 352460, "epoch": 4246} {"train_loss": -26.46473503112793, "global_step": 352461, "epoch": 4246} {"train_loss": -26.363561630249023, "global_step": 352462, "epoch": 4246} {"train_loss": -26.430816650390625, "global_step": 352463, "epoch": 4246} {"train_loss": -26.396100997924805, "global_step": 352464, "epoch": 4246} {"train_loss": -26.3417911529541, "global_step": 352465, "epoch": 4246} {"train_loss": -26.222143173217773, "global_step": 352466, "epoch": 4246} {"train_loss": -26.06122398376465, "global_step": 352467, "epoch": 4246} {"train_loss": -26.1994686126709, "global_step": 352468, "epoch": 4246} {"train_loss": -26.594717025756836, "global_step": 352469, "epoch": 4246} {"train_loss": -26.563642501831055, "global_step": 352470, "epoch": 4246} {"train_loss": -26.41719627380371, "global_step": 352471, "epoch": 4246} {"train_loss": -26.308643341064453, "global_step": 352472, "epoch": 4246} {"train_loss": -26.110822677612305, "global_step": 352473, "epoch": 4246} {"train_loss": -25.901147842407227, "global_step": 352474, "epoch": 4246} {"train_loss": -25.582263946533203, "global_step": 352475, "epoch": 4246} {"train_loss": -25.778364181518555, "global_step": 352476, "epoch": 4246} {"train_loss": -26.404626846313477, "global_step": 352477, "epoch": 4246} {"train_loss": -26.027984619140625, "global_step": 352478, "epoch": 4246} {"train_loss": -25.821395874023438, "global_step": 352479, "epoch": 4246} {"train_loss": -26.18408203125, "global_step": 352480, "epoch": 4246} {"train_loss": -26.10236930847168, "global_step": 352481, "epoch": 4246} {"train_loss": -26.252216339111328, "global_step": 352482, "epoch": 4246} {"train_loss": -26.0317440032959, "global_step": 352483, "epoch": 4246} {"train_loss": -25.803613662719727, "global_step": 352484, "epoch": 4246} {"train_loss": -26.228607177734375, "global_step": 352485, "epoch": 4246} {"train_loss": -26.28546714782715, "global_step": 352486, "epoch": 4246} {"train_loss": -26.07691764831543, "global_step": 352487, "epoch": 4246} {"train_loss": -26.005849838256836, "global_step": 352488, "epoch": 4246} {"train_loss": -26.238616943359375, "global_step": 352489, "epoch": 4246} {"train_loss": -26.5798282623291, "global_step": 352490, "epoch": 4246} {"train_loss": -26.176361083984375, "global_step": 352491, "epoch": 4246} {"train_loss": -26.40760612487793, "global_step": 352492, "epoch": 4246} {"train_loss": -26.258209228515625, "global_step": 352493, "epoch": 4246} {"train_loss": -26.0987548828125, "global_step": 352494, "epoch": 4246} {"train_loss": -25.846195220947266, "global_step": 352495, "epoch": 4246} {"train_loss": -26.138952255249023, "global_step": 352496, "epoch": 4246} {"train_loss": -26.4133358001709, "global_step": 352497, "epoch": 4246} {"train_loss": -26.231653213500977, "global_step": 352498, "epoch": 4246} {"train_loss": -26.107513427734375, "global_step": 352499, "epoch": 4246} {"train_loss": -26.091340191393012, "global_step": 352500, "epoch": 4246, "val_loss": 6977603.5} {"train_loss": -26.191205978393555, "global_step": 352501, "epoch": 4247} {"train_loss": -26.377378463745117, "global_step": 352502, "epoch": 4247} {"train_loss": -26.19972038269043, "global_step": 352503, "epoch": 4247} {"train_loss": -26.231525421142578, "global_step": 352504, "epoch": 4247} {"train_loss": -26.006622314453125, "global_step": 352505, "epoch": 4247} {"train_loss": -26.027006149291992, "global_step": 352506, "epoch": 4247} {"train_loss": -26.071765899658203, "global_step": 352507, "epoch": 4247} {"train_loss": -26.015487670898438, "global_step": 352508, "epoch": 4247} {"train_loss": -26.285398483276367, "global_step": 352509, "epoch": 4247} {"train_loss": -26.2535457611084, "global_step": 352510, "epoch": 4247} {"train_loss": -25.53085708618164, "global_step": 352511, "epoch": 4247} {"train_loss": -26.026838302612305, "global_step": 352512, "epoch": 4247} {"train_loss": -25.93646812438965, "global_step": 352513, "epoch": 4247} {"train_loss": -25.995603561401367, "global_step": 352514, "epoch": 4247} {"train_loss": -25.837249755859375, "global_step": 352515, "epoch": 4247} {"train_loss": -25.774194717407227, "global_step": 352516, "epoch": 4247} {"train_loss": -25.914350509643555, "global_step": 352517, "epoch": 4247} {"train_loss": -26.089923858642578, "global_step": 352518, "epoch": 4247} {"train_loss": -25.753345489501953, "global_step": 352519, "epoch": 4247} {"train_loss": -26.25139808654785, "global_step": 352520, "epoch": 4247} {"train_loss": -25.759801864624023, "global_step": 352521, "epoch": 4247} {"train_loss": -25.834787368774414, "global_step": 352522, "epoch": 4247} {"train_loss": -25.90424919128418, "global_step": 352523, "epoch": 4247} {"train_loss": -26.242223739624023, "global_step": 352524, "epoch": 4247} {"train_loss": -25.739988327026367, "global_step": 352525, "epoch": 4247} {"train_loss": -26.10861587524414, "global_step": 352526, "epoch": 4247} {"train_loss": -26.03426170349121, "global_step": 352527, "epoch": 4247} {"train_loss": -26.498395919799805, "global_step": 352528, "epoch": 4247} {"train_loss": -26.329191207885742, "global_step": 352529, "epoch": 4247} {"train_loss": -25.9752197265625, "global_step": 352530, "epoch": 4247} {"train_loss": -26.443204879760742, "global_step": 352531, "epoch": 4247} {"train_loss": -26.105085372924805, "global_step": 352532, "epoch": 4247} {"train_loss": -26.074438095092773, "global_step": 352533, "epoch": 4247} {"train_loss": -26.5813045501709, "global_step": 352534, "epoch": 4247} {"train_loss": -26.241809844970703, "global_step": 352535, "epoch": 4247} {"train_loss": -26.31658363342285, "global_step": 352536, "epoch": 4247} {"train_loss": -26.293493270874023, "global_step": 352537, "epoch": 4247} {"train_loss": -26.131244659423828, "global_step": 352538, "epoch": 4247} {"train_loss": -26.320383071899414, "global_step": 352539, "epoch": 4247} {"train_loss": -26.251310348510742, "global_step": 352540, "epoch": 4247} {"train_loss": -26.113000869750977, "global_step": 352541, "epoch": 4247} {"train_loss": -26.376388549804688, "global_step": 352542, "epoch": 4247} {"train_loss": -26.093536376953125, "global_step": 352543, "epoch": 4247} {"train_loss": -26.086807250976562, "global_step": 352544, "epoch": 4247} {"train_loss": -26.267780303955078, "global_step": 352545, "epoch": 4247} {"train_loss": -26.4095401763916, "global_step": 352546, "epoch": 4247} {"train_loss": -27.14593505859375, "global_step": 352547, "epoch": 4247} {"train_loss": -26.38160514831543, "global_step": 352548, "epoch": 4247} {"train_loss": -26.229644775390625, "global_step": 352549, "epoch": 4247} {"train_loss": -26.469207763671875, "global_step": 352550, "epoch": 4247} {"train_loss": -26.233600616455078, "global_step": 352551, "epoch": 4247} {"train_loss": -26.476318359375, "global_step": 352552, "epoch": 4247} {"train_loss": -26.290191650390625, "global_step": 352553, "epoch": 4247} {"train_loss": -26.28252601623535, "global_step": 352554, "epoch": 4247} {"train_loss": -25.97395133972168, "global_step": 352555, "epoch": 4247} {"train_loss": -25.910343170166016, "global_step": 352556, "epoch": 4247} {"train_loss": -26.129377365112305, "global_step": 352557, "epoch": 4247} {"train_loss": -25.94598388671875, "global_step": 352558, "epoch": 4247} {"train_loss": -26.05231285095215, "global_step": 352559, "epoch": 4247} {"train_loss": -25.994892120361328, "global_step": 352560, "epoch": 4247} {"train_loss": -26.1885986328125, "global_step": 352561, "epoch": 4247} {"train_loss": -26.236120223999023, "global_step": 352562, "epoch": 4247} {"train_loss": -26.36672019958496, "global_step": 352563, "epoch": 4247} {"train_loss": -26.107404708862305, "global_step": 352564, "epoch": 4247} {"train_loss": -26.262414932250977, "global_step": 352565, "epoch": 4247} {"train_loss": -26.04384422302246, "global_step": 352566, "epoch": 4247} {"train_loss": -26.173553466796875, "global_step": 352567, "epoch": 4247} {"train_loss": -26.234155654907227, "global_step": 352568, "epoch": 4247} {"train_loss": -26.232030868530273, "global_step": 352569, "epoch": 4247} {"train_loss": -26.287189483642578, "global_step": 352570, "epoch": 4247} {"train_loss": -26.39129066467285, "global_step": 352571, "epoch": 4247} {"train_loss": -26.269861221313477, "global_step": 352572, "epoch": 4247} {"train_loss": -26.577672958374023, "global_step": 352573, "epoch": 4247} {"train_loss": -26.570539474487305, "global_step": 352574, "epoch": 4247} {"train_loss": -26.19527244567871, "global_step": 352575, "epoch": 4247} {"train_loss": -26.382659912109375, "global_step": 352576, "epoch": 4247} {"train_loss": -26.145421981811523, "global_step": 352577, "epoch": 4247} {"train_loss": -26.149810791015625, "global_step": 352578, "epoch": 4247} {"train_loss": -25.80194091796875, "global_step": 352579, "epoch": 4247} {"train_loss": -26.663177490234375, "global_step": 352580, "epoch": 4247} {"train_loss": -26.4410457611084, "global_step": 352581, "epoch": 4247} {"train_loss": -25.98175621032715, "global_step": 352582, "epoch": 4247} {"train_loss": -26.176810850580054, "global_step": 352583, "epoch": 4247, "val_loss": 6938029.0} {"train_loss": -25.222015380859375, "global_step": 352584, "epoch": 4248} {"train_loss": -24.66901206970215, "global_step": 352585, "epoch": 4248} {"train_loss": -25.705642700195312, "global_step": 352586, "epoch": 4248} {"train_loss": -25.49381446838379, "global_step": 352587, "epoch": 4248} {"train_loss": -24.916589736938477, "global_step": 352588, "epoch": 4248} {"train_loss": -25.667373657226562, "global_step": 352589, "epoch": 4248} {"train_loss": -25.45671844482422, "global_step": 352590, "epoch": 4248} {"train_loss": -25.712278366088867, "global_step": 352591, "epoch": 4248} {"train_loss": -25.271438598632812, "global_step": 352592, "epoch": 4248} {"train_loss": -25.46068000793457, "global_step": 352593, "epoch": 4248} {"train_loss": -25.813756942749023, "global_step": 352594, "epoch": 4248} {"train_loss": -25.739593505859375, "global_step": 352595, "epoch": 4248} {"train_loss": -25.727283477783203, "global_step": 352596, "epoch": 4248} {"train_loss": -26.061155319213867, "global_step": 352597, "epoch": 4248} {"train_loss": -26.3029727935791, "global_step": 352598, "epoch": 4248} {"train_loss": -25.83759880065918, "global_step": 352599, "epoch": 4248} {"train_loss": -25.841968536376953, "global_step": 352600, "epoch": 4248} {"train_loss": -26.051610946655273, "global_step": 352601, "epoch": 4248} {"train_loss": -26.083471298217773, "global_step": 352602, "epoch": 4248} {"train_loss": -26.239154815673828, "global_step": 352603, "epoch": 4248} {"train_loss": -25.884689331054688, "global_step": 352604, "epoch": 4248} {"train_loss": -26.271337509155273, "global_step": 352605, "epoch": 4248} {"train_loss": -26.225133895874023, "global_step": 352606, "epoch": 4248} {"train_loss": -25.747039794921875, "global_step": 352607, "epoch": 4248} {"train_loss": -26.350976943969727, "global_step": 352608, "epoch": 4248} {"train_loss": -26.446699142456055, "global_step": 352609, "epoch": 4248} {"train_loss": -26.025400161743164, "global_step": 352610, "epoch": 4248} {"train_loss": -26.033126831054688, "global_step": 352611, "epoch": 4248} {"train_loss": -25.976348876953125, "global_step": 352612, "epoch": 4248} {"train_loss": -26.389205932617188, "global_step": 352613, "epoch": 4248} {"train_loss": -26.401968002319336, "global_step": 352614, "epoch": 4248} {"train_loss": -25.883438110351562, "global_step": 352615, "epoch": 4248} {"train_loss": -26.086505889892578, "global_step": 352616, "epoch": 4248} {"train_loss": -26.182392120361328, "global_step": 352617, "epoch": 4248} {"train_loss": -26.138507843017578, "global_step": 352618, "epoch": 4248} {"train_loss": -26.456531524658203, "global_step": 352619, "epoch": 4248} {"train_loss": -26.22029685974121, "global_step": 352620, "epoch": 4248} {"train_loss": -26.466588973999023, "global_step": 352621, "epoch": 4248} {"train_loss": -26.19862174987793, "global_step": 352622, "epoch": 4248} {"train_loss": -26.114990234375, "global_step": 352623, "epoch": 4248} {"train_loss": -26.179641723632812, "global_step": 352624, "epoch": 4248} {"train_loss": -26.2667179107666, "global_step": 352625, "epoch": 4248} {"train_loss": -26.2421817779541, "global_step": 352626, "epoch": 4248} {"train_loss": -26.43157958984375, "global_step": 352627, "epoch": 4248} {"train_loss": -26.2360782623291, "global_step": 352628, "epoch": 4248} {"train_loss": -25.996686935424805, "global_step": 352629, "epoch": 4248} {"train_loss": -26.383085250854492, "global_step": 352630, "epoch": 4248} {"train_loss": -26.20206069946289, "global_step": 352631, "epoch": 4248} {"train_loss": -26.194665908813477, "global_step": 352632, "epoch": 4248} {"train_loss": -25.926794052124023, "global_step": 352633, "epoch": 4248} {"train_loss": -26.069128036499023, "global_step": 352634, "epoch": 4248} {"train_loss": -26.19854736328125, "global_step": 352635, "epoch": 4248} {"train_loss": -26.306467056274414, "global_step": 352636, "epoch": 4248} {"train_loss": -26.123306274414062, "global_step": 352637, "epoch": 4248} {"train_loss": -25.759557723999023, "global_step": 352638, "epoch": 4248} {"train_loss": -25.98530387878418, "global_step": 352639, "epoch": 4248} {"train_loss": -25.870710372924805, "global_step": 352640, "epoch": 4248} {"train_loss": -25.0009708404541, "global_step": 352641, "epoch": 4248} {"train_loss": -25.972623825073242, "global_step": 352642, "epoch": 4248} {"train_loss": -26.018842697143555, "global_step": 352643, "epoch": 4248} {"train_loss": -26.11787223815918, "global_step": 352644, "epoch": 4248} {"train_loss": -25.49482536315918, "global_step": 352645, "epoch": 4248} {"train_loss": -25.826459884643555, "global_step": 352646, "epoch": 4248} {"train_loss": -26.04033851623535, "global_step": 352647, "epoch": 4248} {"train_loss": -26.332910537719727, "global_step": 352648, "epoch": 4248} {"train_loss": -25.99171257019043, "global_step": 352649, "epoch": 4248} {"train_loss": -26.434072494506836, "global_step": 352650, "epoch": 4248} {"train_loss": -26.240217208862305, "global_step": 352651, "epoch": 4248} {"train_loss": -26.3801326751709, "global_step": 352652, "epoch": 4248} {"train_loss": -26.256067276000977, "global_step": 352653, "epoch": 4248} {"train_loss": -26.242069244384766, "global_step": 352654, "epoch": 4248} {"train_loss": -26.09906578063965, "global_step": 352655, "epoch": 4248} {"train_loss": -26.410144805908203, "global_step": 352656, "epoch": 4248} {"train_loss": -26.00703239440918, "global_step": 352657, "epoch": 4248} {"train_loss": -26.310474395751953, "global_step": 352658, "epoch": 4248} {"train_loss": -26.182209014892578, "global_step": 352659, "epoch": 4248} {"train_loss": -26.34307289123535, "global_step": 352660, "epoch": 4248} {"train_loss": -26.18079948425293, "global_step": 352661, "epoch": 4248} {"train_loss": -26.669198989868164, "global_step": 352662, "epoch": 4248} {"train_loss": -26.021778106689453, "global_step": 352663, "epoch": 4248} {"train_loss": -26.135833740234375, "global_step": 352664, "epoch": 4248} {"train_loss": -26.227506637573242, "global_step": 352665, "epoch": 4248} {"train_loss": -26.047682635755425, "global_step": 352666, "epoch": 4248, "val_loss": 6944150.0} {"train_loss": -25.458982467651367, "global_step": 352667, "epoch": 4249} {"train_loss": -25.22101402282715, "global_step": 352668, "epoch": 4249} {"train_loss": -25.684391021728516, "global_step": 352669, "epoch": 4249} {"train_loss": -25.529272079467773, "global_step": 352670, "epoch": 4249} {"train_loss": -26.10623550415039, "global_step": 352671, "epoch": 4249} {"train_loss": -25.42432403564453, "global_step": 352672, "epoch": 4249} {"train_loss": -25.738025665283203, "global_step": 352673, "epoch": 4249} {"train_loss": -25.734607696533203, "global_step": 352674, "epoch": 4249} {"train_loss": -25.836612701416016, "global_step": 352675, "epoch": 4249} {"train_loss": -25.522815704345703, "global_step": 352676, "epoch": 4249} {"train_loss": -25.7191219329834, "global_step": 352677, "epoch": 4249} {"train_loss": -25.603809356689453, "global_step": 352678, "epoch": 4249} {"train_loss": -25.303693771362305, "global_step": 352679, "epoch": 4249} {"train_loss": -25.77667808532715, "global_step": 352680, "epoch": 4249} {"train_loss": -25.264875411987305, "global_step": 352681, "epoch": 4249} {"train_loss": -25.68769645690918, "global_step": 352682, "epoch": 4249} {"train_loss": -25.974655151367188, "global_step": 352683, "epoch": 4249} {"train_loss": -25.68841552734375, "global_step": 352684, "epoch": 4249} {"train_loss": -25.69122886657715, "global_step": 352685, "epoch": 4249} {"train_loss": -26.247180938720703, "global_step": 352686, "epoch": 4249} {"train_loss": -25.939367294311523, "global_step": 352687, "epoch": 4249} {"train_loss": -25.891775131225586, "global_step": 352688, "epoch": 4249} {"train_loss": -26.13125991821289, "global_step": 352689, "epoch": 4249} {"train_loss": -25.78949546813965, "global_step": 352690, "epoch": 4249} {"train_loss": -26.149106979370117, "global_step": 352691, "epoch": 4249} {"train_loss": -26.37308120727539, "global_step": 352692, "epoch": 4249} {"train_loss": -26.28363037109375, "global_step": 352693, "epoch": 4249} {"train_loss": -26.411548614501953, "global_step": 352694, "epoch": 4249} {"train_loss": -26.253137588500977, "global_step": 352695, "epoch": 4249} {"train_loss": -25.795276641845703, "global_step": 352696, "epoch": 4249} {"train_loss": -26.15472412109375, "global_step": 352697, "epoch": 4249} {"train_loss": -26.09375, "global_step": 352698, "epoch": 4249} {"train_loss": -25.775619506835938, "global_step": 352699, "epoch": 4249} {"train_loss": -25.682600021362305, "global_step": 352700, "epoch": 4249} {"train_loss": -25.986236572265625, "global_step": 352701, "epoch": 4249} {"train_loss": -26.0670166015625, "global_step": 352702, "epoch": 4249} {"train_loss": -25.921859741210938, "global_step": 352703, "epoch": 4249} {"train_loss": -26.192243576049805, "global_step": 352704, "epoch": 4249} {"train_loss": -25.744922637939453, "global_step": 352705, "epoch": 4249} {"train_loss": -26.170948028564453, "global_step": 352706, "epoch": 4249} {"train_loss": -26.210880279541016, "global_step": 352707, "epoch": 4249} {"train_loss": -26.354177474975586, "global_step": 352708, "epoch": 4249} {"train_loss": -25.993234634399414, "global_step": 352709, "epoch": 4249} {"train_loss": -26.156970977783203, "global_step": 352710, "epoch": 4249} {"train_loss": -26.137348175048828, "global_step": 352711, "epoch": 4249} {"train_loss": -26.323474884033203, "global_step": 352712, "epoch": 4249} {"train_loss": -26.311176300048828, "global_step": 352713, "epoch": 4249} {"train_loss": -26.653711318969727, "global_step": 352714, "epoch": 4249} {"train_loss": -26.040557861328125, "global_step": 352715, "epoch": 4249} {"train_loss": -26.050281524658203, "global_step": 352716, "epoch": 4249} {"train_loss": -26.583032608032227, "global_step": 352717, "epoch": 4249} {"train_loss": -26.41615104675293, "global_step": 352718, "epoch": 4249} {"train_loss": -25.995752334594727, "global_step": 352719, "epoch": 4249} {"train_loss": -25.968175888061523, "global_step": 352720, "epoch": 4249} {"train_loss": -26.57269287109375, "global_step": 352721, "epoch": 4249} {"train_loss": -26.015432357788086, "global_step": 352722, "epoch": 4249} {"train_loss": -25.947046279907227, "global_step": 352723, "epoch": 4249} {"train_loss": -26.274860382080078, "global_step": 352724, "epoch": 4249} {"train_loss": -26.35744285583496, "global_step": 352725, "epoch": 4249} {"train_loss": -25.88239860534668, "global_step": 352726, "epoch": 4249} {"train_loss": -26.352848052978516, "global_step": 352727, "epoch": 4249} {"train_loss": -26.255659103393555, "global_step": 352728, "epoch": 4249} {"train_loss": -26.711166381835938, "global_step": 352729, "epoch": 4249} {"train_loss": -26.57124900817871, "global_step": 352730, "epoch": 4249} {"train_loss": -26.545032501220703, "global_step": 352731, "epoch": 4249} {"train_loss": -26.368854522705078, "global_step": 352732, "epoch": 4249} {"train_loss": -26.290159225463867, "global_step": 352733, "epoch": 4249} {"train_loss": -25.9874324798584, "global_step": 352734, "epoch": 4249} {"train_loss": -25.798694610595703, "global_step": 352735, "epoch": 4249} {"train_loss": -26.56812858581543, "global_step": 352736, "epoch": 4249} {"train_loss": -26.490381240844727, "global_step": 352737, "epoch": 4249} {"train_loss": -26.458560943603516, "global_step": 352738, "epoch": 4249} {"train_loss": -25.936767578125, "global_step": 352739, "epoch": 4249} {"train_loss": -26.577789306640625, "global_step": 352740, "epoch": 4249} {"train_loss": -26.287778854370117, "global_step": 352741, "epoch": 4249} {"train_loss": -26.5489501953125, "global_step": 352742, "epoch": 4249} {"train_loss": -26.5146484375, "global_step": 352743, "epoch": 4249} {"train_loss": -26.169677734375, "global_step": 352744, "epoch": 4249} {"train_loss": -25.896366119384766, "global_step": 352745, "epoch": 4249} {"train_loss": -26.201236724853516, "global_step": 352746, "epoch": 4249} {"train_loss": -25.998062133789062, "global_step": 352747, "epoch": 4249} {"train_loss": -25.822362899780273, "global_step": 352748, "epoch": 4249} {"train_loss": -26.0534719444183, "global_step": 352749, "epoch": 4249, "val_loss": 7025636.0} {"train_loss": -25.83591079711914, "global_step": 352750, "epoch": 4250} {"train_loss": -25.479883193969727, "global_step": 352751, "epoch": 4250} {"train_loss": -25.402124404907227, "global_step": 352752, "epoch": 4250} {"train_loss": -25.05279541015625, "global_step": 352753, "epoch": 4250} {"train_loss": -25.594867706298828, "global_step": 352754, "epoch": 4250} {"train_loss": -25.307628631591797, "global_step": 352755, "epoch": 4250} {"train_loss": -25.513774871826172, "global_step": 352756, "epoch": 4250} {"train_loss": -26.028553009033203, "global_step": 352757, "epoch": 4250} {"train_loss": -25.669403076171875, "global_step": 352758, "epoch": 4250} {"train_loss": -26.121540069580078, "global_step": 352759, "epoch": 4250} {"train_loss": -25.83790397644043, "global_step": 352760, "epoch": 4250} {"train_loss": -26.060712814331055, "global_step": 352761, "epoch": 4250} {"train_loss": -26.01913833618164, "global_step": 352762, "epoch": 4250} {"train_loss": -25.948144912719727, "global_step": 352763, "epoch": 4250} {"train_loss": -25.724567413330078, "global_step": 352764, "epoch": 4250} {"train_loss": -26.14825439453125, "global_step": 352765, "epoch": 4250} {"train_loss": -25.992965698242188, "global_step": 352766, "epoch": 4250} {"train_loss": -26.15545082092285, "global_step": 352767, "epoch": 4250} {"train_loss": -26.09516716003418, "global_step": 352768, "epoch": 4250} {"train_loss": -26.261022567749023, "global_step": 352769, "epoch": 4250} {"train_loss": -25.553247451782227, "global_step": 352770, "epoch": 4250} {"train_loss": -26.263397216796875, "global_step": 352771, "epoch": 4250} {"train_loss": -26.0583438873291, "global_step": 352772, "epoch": 4250} {"train_loss": -26.352697372436523, "global_step": 352773, "epoch": 4250} {"train_loss": -25.853271484375, "global_step": 352774, "epoch": 4250} {"train_loss": -26.091703414916992, "global_step": 352775, "epoch": 4250} {"train_loss": -26.035358428955078, "global_step": 352776, "epoch": 4250} {"train_loss": -26.04585075378418, "global_step": 352777, "epoch": 4250} {"train_loss": -25.99615478515625, "global_step": 352778, "epoch": 4250} {"train_loss": -26.04770278930664, "global_step": 352779, "epoch": 4250} {"train_loss": -25.820783615112305, "global_step": 352780, "epoch": 4250} {"train_loss": -26.403249740600586, "global_step": 352781, "epoch": 4250} {"train_loss": -25.9058895111084, "global_step": 352782, "epoch": 4250} {"train_loss": -25.816314697265625, "global_step": 352783, "epoch": 4250} {"train_loss": -26.245466232299805, "global_step": 352784, "epoch": 4250} {"train_loss": -26.201141357421875, "global_step": 352785, "epoch": 4250} {"train_loss": -26.043588638305664, "global_step": 352786, "epoch": 4250} {"train_loss": -26.040679931640625, "global_step": 352787, "epoch": 4250} {"train_loss": -26.42414665222168, "global_step": 352788, "epoch": 4250} {"train_loss": -26.180898666381836, "global_step": 352789, "epoch": 4250} {"train_loss": -26.163156509399414, "global_step": 352790, "epoch": 4250} {"train_loss": -26.39680290222168, "global_step": 352791, "epoch": 4250} {"train_loss": -26.381256103515625, "global_step": 352792, "epoch": 4250} {"train_loss": -26.213459014892578, "global_step": 352793, "epoch": 4250} {"train_loss": -26.160688400268555, "global_step": 352794, "epoch": 4250} {"train_loss": -26.196395874023438, "global_step": 352795, "epoch": 4250} {"train_loss": -26.482711791992188, "global_step": 352796, "epoch": 4250} {"train_loss": -26.48763084411621, "global_step": 352797, "epoch": 4250} {"train_loss": -26.27939224243164, "global_step": 352798, "epoch": 4250} {"train_loss": -26.27976417541504, "global_step": 352799, "epoch": 4250} {"train_loss": -26.50244140625, "global_step": 352800, "epoch": 4250} {"train_loss": -26.090497970581055, "global_step": 352801, "epoch": 4250} {"train_loss": -26.246051788330078, "global_step": 352802, "epoch": 4250} {"train_loss": -26.297409057617188, "global_step": 352803, "epoch": 4250} {"train_loss": -26.053882598876953, "global_step": 352804, "epoch": 4250} {"train_loss": -26.2004451751709, "global_step": 352805, "epoch": 4250} {"train_loss": -26.329450607299805, "global_step": 352806, "epoch": 4250} {"train_loss": -26.77754020690918, "global_step": 352807, "epoch": 4250} {"train_loss": -26.737817764282227, "global_step": 352808, "epoch": 4250} {"train_loss": -26.40557289123535, "global_step": 352809, "epoch": 4250} {"train_loss": -26.60220718383789, "global_step": 352810, "epoch": 4250} {"train_loss": -26.502246856689453, "global_step": 352811, "epoch": 4250} {"train_loss": -26.368377685546875, "global_step": 352812, "epoch": 4250} {"train_loss": -26.326648712158203, "global_step": 352813, "epoch": 4250} {"train_loss": -26.08009147644043, "global_step": 352814, "epoch": 4250} {"train_loss": -26.160451889038086, "global_step": 352815, "epoch": 4250} {"train_loss": -26.114709854125977, "global_step": 352816, "epoch": 4250} {"train_loss": -26.40285301208496, "global_step": 352817, "epoch": 4250} {"train_loss": -26.12959098815918, "global_step": 352818, "epoch": 4250} {"train_loss": -25.987546920776367, "global_step": 352819, "epoch": 4250} {"train_loss": -26.41107177734375, "global_step": 352820, "epoch": 4250} {"train_loss": -26.293298721313477, "global_step": 352821, "epoch": 4250} {"train_loss": -26.015487670898438, "global_step": 352822, "epoch": 4250} {"train_loss": -26.260913848876953, "global_step": 352823, "epoch": 4250} {"train_loss": -26.526395797729492, "global_step": 352824, "epoch": 4250} {"train_loss": -26.36271095275879, "global_step": 352825, "epoch": 4250} {"train_loss": -26.052526473999023, "global_step": 352826, "epoch": 4250} {"train_loss": -25.615570068359375, "global_step": 352827, "epoch": 4250} {"train_loss": -26.375593185424805, "global_step": 352828, "epoch": 4250} {"train_loss": -26.183958053588867, "global_step": 352829, "epoch": 4250} {"train_loss": -26.02374267578125, "global_step": 352830, "epoch": 4250} {"train_loss": -26.414875030517578, "global_step": 352831, "epoch": 4250} {"train_loss": -26.113758569740387, "global_step": 352832, "epoch": 4250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6956238.0} {"train_loss": -24.980466842651367, "global_step": 352833, "epoch": 4251} {"train_loss": -25.566930770874023, "global_step": 352834, "epoch": 4251} {"train_loss": -24.725500106811523, "global_step": 352835, "epoch": 4251} {"train_loss": -25.36408805847168, "global_step": 352836, "epoch": 4251} {"train_loss": -25.084232330322266, "global_step": 352837, "epoch": 4251} {"train_loss": -24.98133659362793, "global_step": 352838, "epoch": 4251} {"train_loss": -25.576101303100586, "global_step": 352839, "epoch": 4251} {"train_loss": -25.82488441467285, "global_step": 352840, "epoch": 4251} {"train_loss": -25.239572525024414, "global_step": 352841, "epoch": 4251} {"train_loss": -25.599002838134766, "global_step": 352842, "epoch": 4251} {"train_loss": -24.935489654541016, "global_step": 352843, "epoch": 4251} {"train_loss": -25.77683448791504, "global_step": 352844, "epoch": 4251} {"train_loss": -25.25819206237793, "global_step": 352845, "epoch": 4251} {"train_loss": -25.70464515686035, "global_step": 352846, "epoch": 4251} {"train_loss": -25.76502799987793, "global_step": 352847, "epoch": 4251} {"train_loss": -25.628173828125, "global_step": 352848, "epoch": 4251} {"train_loss": -25.983041763305664, "global_step": 352849, "epoch": 4251} {"train_loss": -25.3053035736084, "global_step": 352850, "epoch": 4251} {"train_loss": -25.70279884338379, "global_step": 352851, "epoch": 4251} {"train_loss": -25.5612850189209, "global_step": 352852, "epoch": 4251} {"train_loss": -25.956531524658203, "global_step": 352853, "epoch": 4251} {"train_loss": -26.131916046142578, "global_step": 352854, "epoch": 4251} {"train_loss": -25.703983306884766, "global_step": 352855, "epoch": 4251} {"train_loss": -25.50535774230957, "global_step": 352856, "epoch": 4251} {"train_loss": -26.3665828704834, "global_step": 352857, "epoch": 4251} {"train_loss": -25.866071701049805, "global_step": 352858, "epoch": 4251} {"train_loss": -26.244104385375977, "global_step": 352859, "epoch": 4251} {"train_loss": -25.953454971313477, "global_step": 352860, "epoch": 4251} {"train_loss": -25.832300186157227, "global_step": 352861, "epoch": 4251} {"train_loss": -25.784757614135742, "global_step": 352862, "epoch": 4251} {"train_loss": -26.503986358642578, "global_step": 352863, "epoch": 4251} {"train_loss": -26.10282325744629, "global_step": 352864, "epoch": 4251} {"train_loss": -26.197378158569336, "global_step": 352865, "epoch": 4251} {"train_loss": -26.2512264251709, "global_step": 352866, "epoch": 4251} {"train_loss": -26.129947662353516, "global_step": 352867, "epoch": 4251} {"train_loss": -26.21271324157715, "global_step": 352868, "epoch": 4251} {"train_loss": -25.986557006835938, "global_step": 352869, "epoch": 4251} {"train_loss": -25.977405548095703, "global_step": 352870, "epoch": 4251} {"train_loss": -25.834318161010742, "global_step": 352871, "epoch": 4251} {"train_loss": -26.089040756225586, "global_step": 352872, "epoch": 4251} {"train_loss": -26.5366153717041, "global_step": 352873, "epoch": 4251} {"train_loss": -26.122058868408203, "global_step": 352874, "epoch": 4251} {"train_loss": -26.4009952545166, "global_step": 352875, "epoch": 4251} {"train_loss": -26.330799102783203, "global_step": 352876, "epoch": 4251} {"train_loss": -26.36130142211914, "global_step": 352877, "epoch": 4251} {"train_loss": -26.503793716430664, "global_step": 352878, "epoch": 4251} {"train_loss": -26.62464714050293, "global_step": 352879, "epoch": 4251} {"train_loss": -26.396228790283203, "global_step": 352880, "epoch": 4251} {"train_loss": -26.728107452392578, "global_step": 352881, "epoch": 4251} {"train_loss": -26.340970993041992, "global_step": 352882, "epoch": 4251} {"train_loss": -26.618335723876953, "global_step": 352883, "epoch": 4251} {"train_loss": -26.325353622436523, "global_step": 352884, "epoch": 4251} {"train_loss": -26.27125358581543, "global_step": 352885, "epoch": 4251} {"train_loss": -26.32146644592285, "global_step": 352886, "epoch": 4251} {"train_loss": -26.348962783813477, "global_step": 352887, "epoch": 4251} {"train_loss": -25.953937530517578, "global_step": 352888, "epoch": 4251} {"train_loss": -26.207000732421875, "global_step": 352889, "epoch": 4251} {"train_loss": -26.290332794189453, "global_step": 352890, "epoch": 4251} {"train_loss": -26.186939239501953, "global_step": 352891, "epoch": 4251} {"train_loss": -26.435840606689453, "global_step": 352892, "epoch": 4251} {"train_loss": -26.23328971862793, "global_step": 352893, "epoch": 4251} {"train_loss": -26.70823097229004, "global_step": 352894, "epoch": 4251} {"train_loss": -26.36386489868164, "global_step": 352895, "epoch": 4251} {"train_loss": -26.42494010925293, "global_step": 352896, "epoch": 4251} {"train_loss": -26.18574333190918, "global_step": 352897, "epoch": 4251} {"train_loss": -26.203113555908203, "global_step": 352898, "epoch": 4251} {"train_loss": -26.50634765625, "global_step": 352899, "epoch": 4251} {"train_loss": -26.325037002563477, "global_step": 352900, "epoch": 4251} {"train_loss": -26.478132247924805, "global_step": 352901, "epoch": 4251} {"train_loss": -26.018762588500977, "global_step": 352902, "epoch": 4251} {"train_loss": -26.23744773864746, "global_step": 352903, "epoch": 4251} {"train_loss": -25.566205978393555, "global_step": 352904, "epoch": 4251} {"train_loss": -24.88437271118164, "global_step": 352905, "epoch": 4251} {"train_loss": -25.720285415649414, "global_step": 352906, "epoch": 4251} {"train_loss": -26.270185470581055, "global_step": 352907, "epoch": 4251} {"train_loss": -25.6502685546875, "global_step": 352908, "epoch": 4251} {"train_loss": -25.639820098876953, "global_step": 352909, "epoch": 4251} {"train_loss": -26.41827392578125, "global_step": 352910, "epoch": 4251} {"train_loss": -26.341089248657227, "global_step": 352911, "epoch": 4251} {"train_loss": -26.16021156311035, "global_step": 352912, "epoch": 4251} {"train_loss": -26.170202255249023, "global_step": 352913, "epoch": 4251} {"train_loss": -25.905521392822266, "global_step": 352914, "epoch": 4251} {"train_loss": -25.982652572264154, "global_step": 352915, "epoch": 4251, "val_loss": 6912528.5} {"train_loss": -25.268726348876953, "global_step": 352916, "epoch": 4252} {"train_loss": -26.0, "global_step": 352917, "epoch": 4252} {"train_loss": -25.69037437438965, "global_step": 352918, "epoch": 4252} {"train_loss": -25.857593536376953, "global_step": 352919, "epoch": 4252} {"train_loss": -25.705305099487305, "global_step": 352920, "epoch": 4252} {"train_loss": -25.817346572875977, "global_step": 352921, "epoch": 4252} {"train_loss": -25.86745262145996, "global_step": 352922, "epoch": 4252} {"train_loss": -25.703109741210938, "global_step": 352923, "epoch": 4252} {"train_loss": -25.8365421295166, "global_step": 352924, "epoch": 4252} {"train_loss": -25.7816219329834, "global_step": 352925, "epoch": 4252} {"train_loss": -26.07425880432129, "global_step": 352926, "epoch": 4252} {"train_loss": -25.576045989990234, "global_step": 352927, "epoch": 4252} {"train_loss": -25.87591552734375, "global_step": 352928, "epoch": 4252} {"train_loss": -26.126611709594727, "global_step": 352929, "epoch": 4252} {"train_loss": -26.00800895690918, "global_step": 352930, "epoch": 4252} {"train_loss": -26.326034545898438, "global_step": 352931, "epoch": 4252} {"train_loss": -25.57200050354004, "global_step": 352932, "epoch": 4252} {"train_loss": -26.257709503173828, "global_step": 352933, "epoch": 4252} {"train_loss": -25.90215492248535, "global_step": 352934, "epoch": 4252} {"train_loss": -26.360509872436523, "global_step": 352935, "epoch": 4252} {"train_loss": -26.310941696166992, "global_step": 352936, "epoch": 4252} {"train_loss": -25.703763961791992, "global_step": 352937, "epoch": 4252} {"train_loss": -25.953893661499023, "global_step": 352938, "epoch": 4252} {"train_loss": -26.0157470703125, "global_step": 352939, "epoch": 4252} {"train_loss": -25.979894638061523, "global_step": 352940, "epoch": 4252} {"train_loss": -26.0842342376709, "global_step": 352941, "epoch": 4252} {"train_loss": -26.14532470703125, "global_step": 352942, "epoch": 4252} {"train_loss": -26.047290802001953, "global_step": 352943, "epoch": 4252} {"train_loss": -26.066999435424805, "global_step": 352944, "epoch": 4252} {"train_loss": -26.386194229125977, "global_step": 352945, "epoch": 4252} {"train_loss": -25.9438419342041, "global_step": 352946, "epoch": 4252} {"train_loss": -26.743921279907227, "global_step": 352947, "epoch": 4252} {"train_loss": -26.068689346313477, "global_step": 352948, "epoch": 4252} {"train_loss": -25.882837295532227, "global_step": 352949, "epoch": 4252} {"train_loss": -25.9713191986084, "global_step": 352950, "epoch": 4252} {"train_loss": -26.256900787353516, "global_step": 352951, "epoch": 4252} {"train_loss": -26.307083129882812, "global_step": 352952, "epoch": 4252} {"train_loss": -26.454181671142578, "global_step": 352953, "epoch": 4252} {"train_loss": -26.391958236694336, "global_step": 352954, "epoch": 4252} {"train_loss": -26.18928337097168, "global_step": 352955, "epoch": 4252} {"train_loss": -26.135009765625, "global_step": 352956, "epoch": 4252} {"train_loss": -26.196584701538086, "global_step": 352957, "epoch": 4252} {"train_loss": -26.3947811126709, "global_step": 352958, "epoch": 4252} {"train_loss": -26.384937286376953, "global_step": 352959, "epoch": 4252} {"train_loss": -25.988744735717773, "global_step": 352960, "epoch": 4252} {"train_loss": -26.108301162719727, "global_step": 352961, "epoch": 4252} {"train_loss": -26.34222984313965, "global_step": 352962, "epoch": 4252} {"train_loss": -25.89334487915039, "global_step": 352963, "epoch": 4252} {"train_loss": -25.9399471282959, "global_step": 352964, "epoch": 4252} {"train_loss": -26.582548141479492, "global_step": 352965, "epoch": 4252} {"train_loss": -26.47966957092285, "global_step": 352966, "epoch": 4252} {"train_loss": -26.275583267211914, "global_step": 352967, "epoch": 4252} {"train_loss": -26.266157150268555, "global_step": 352968, "epoch": 4252} {"train_loss": -26.270751953125, "global_step": 352969, "epoch": 4252} {"train_loss": -25.911945343017578, "global_step": 352970, "epoch": 4252} {"train_loss": -25.989233016967773, "global_step": 352971, "epoch": 4252} {"train_loss": -25.78336524963379, "global_step": 352972, "epoch": 4252} {"train_loss": -25.87839698791504, "global_step": 352973, "epoch": 4252} {"train_loss": -26.189855575561523, "global_step": 352974, "epoch": 4252} {"train_loss": -26.098615646362305, "global_step": 352975, "epoch": 4252} {"train_loss": -26.212446212768555, "global_step": 352976, "epoch": 4252} {"train_loss": -26.144392013549805, "global_step": 352977, "epoch": 4252} {"train_loss": -26.0816650390625, "global_step": 352978, "epoch": 4252} {"train_loss": -26.091724395751953, "global_step": 352979, "epoch": 4252} {"train_loss": -25.923078536987305, "global_step": 352980, "epoch": 4252} {"train_loss": -26.310461044311523, "global_step": 352981, "epoch": 4252} {"train_loss": -25.809864044189453, "global_step": 352982, "epoch": 4252} {"train_loss": -25.863061904907227, "global_step": 352983, "epoch": 4252} {"train_loss": -26.159666061401367, "global_step": 352984, "epoch": 4252} {"train_loss": -25.912540435791016, "global_step": 352985, "epoch": 4252} {"train_loss": -26.180723190307617, "global_step": 352986, "epoch": 4252} {"train_loss": -26.113574981689453, "global_step": 352987, "epoch": 4252} {"train_loss": -25.928876876831055, "global_step": 352988, "epoch": 4252} {"train_loss": -26.2196044921875, "global_step": 352989, "epoch": 4252} {"train_loss": -25.926496505737305, "global_step": 352990, "epoch": 4252} {"train_loss": -25.99195671081543, "global_step": 352991, "epoch": 4252} {"train_loss": -26.230222702026367, "global_step": 352992, "epoch": 4252} {"train_loss": -25.954303741455078, "global_step": 352993, "epoch": 4252} {"train_loss": -26.50672721862793, "global_step": 352994, "epoch": 4252} {"train_loss": -26.066442489624023, "global_step": 352995, "epoch": 4252} {"train_loss": -25.888574600219727, "global_step": 352996, "epoch": 4252} {"train_loss": -26.117237091064453, "global_step": 352997, "epoch": 4252} {"train_loss": -26.04688306601651, "global_step": 352998, "epoch": 4252, "val_loss": 7028038.0} {"train_loss": -25.768842697143555, "global_step": 352999, "epoch": 4253} {"train_loss": -25.663671493530273, "global_step": 353000, "epoch": 4253} {"train_loss": -25.86109733581543, "global_step": 353001, "epoch": 4253} {"train_loss": -26.079833984375, "global_step": 353002, "epoch": 4253} {"train_loss": -25.984119415283203, "global_step": 353003, "epoch": 4253} {"train_loss": -25.868305206298828, "global_step": 353004, "epoch": 4253} {"train_loss": -25.717878341674805, "global_step": 353005, "epoch": 4253} {"train_loss": -26.148914337158203, "global_step": 353006, "epoch": 4253} {"train_loss": -25.42720603942871, "global_step": 353007, "epoch": 4253} {"train_loss": -26.07554054260254, "global_step": 353008, "epoch": 4253} {"train_loss": -26.327539443969727, "global_step": 353009, "epoch": 4253} {"train_loss": -26.241668701171875, "global_step": 353010, "epoch": 4253} {"train_loss": -25.91057777404785, "global_step": 353011, "epoch": 4253} {"train_loss": -26.146596908569336, "global_step": 353012, "epoch": 4253} {"train_loss": -25.92486000061035, "global_step": 353013, "epoch": 4253} {"train_loss": -26.428556442260742, "global_step": 353014, "epoch": 4253} {"train_loss": -26.453027725219727, "global_step": 353015, "epoch": 4253} {"train_loss": -25.93377113342285, "global_step": 353016, "epoch": 4253} {"train_loss": -26.28571128845215, "global_step": 353017, "epoch": 4253} {"train_loss": -25.98075294494629, "global_step": 353018, "epoch": 4253} {"train_loss": -26.2548885345459, "global_step": 353019, "epoch": 4253} {"train_loss": -26.0862979888916, "global_step": 353020, "epoch": 4253} {"train_loss": -26.278278350830078, "global_step": 353021, "epoch": 4253} {"train_loss": -26.52058219909668, "global_step": 353022, "epoch": 4253} {"train_loss": -26.458051681518555, "global_step": 353023, "epoch": 4253} {"train_loss": -26.46683692932129, "global_step": 353024, "epoch": 4253} {"train_loss": -26.31119155883789, "global_step": 353025, "epoch": 4253} {"train_loss": -25.912878036499023, "global_step": 353026, "epoch": 4253} {"train_loss": -26.116819381713867, "global_step": 353027, "epoch": 4253} {"train_loss": -25.726428985595703, "global_step": 353028, "epoch": 4253} {"train_loss": -26.260461807250977, "global_step": 353029, "epoch": 4253} {"train_loss": -26.251962661743164, "global_step": 353030, "epoch": 4253} {"train_loss": -26.13828468322754, "global_step": 353031, "epoch": 4253} {"train_loss": -26.178329467773438, "global_step": 353032, "epoch": 4253} {"train_loss": -25.89356803894043, "global_step": 353033, "epoch": 4253} {"train_loss": -26.559057235717773, "global_step": 353034, "epoch": 4253} {"train_loss": -26.245380401611328, "global_step": 353035, "epoch": 4253} {"train_loss": -25.987207412719727, "global_step": 353036, "epoch": 4253} {"train_loss": -26.02532958984375, "global_step": 353037, "epoch": 4253} {"train_loss": -25.973358154296875, "global_step": 353038, "epoch": 4253} {"train_loss": -25.851255416870117, "global_step": 353039, "epoch": 4253} {"train_loss": -25.9487247467041, "global_step": 353040, "epoch": 4253} {"train_loss": -26.353723526000977, "global_step": 353041, "epoch": 4253} {"train_loss": -25.7680606842041, "global_step": 353042, "epoch": 4253} {"train_loss": -25.7463321685791, "global_step": 353043, "epoch": 4253} {"train_loss": -25.786518096923828, "global_step": 353044, "epoch": 4253} {"train_loss": -26.227893829345703, "global_step": 353045, "epoch": 4253} {"train_loss": -26.46738052368164, "global_step": 353046, "epoch": 4253} {"train_loss": -26.013029098510742, "global_step": 353047, "epoch": 4253} {"train_loss": -26.2257022857666, "global_step": 353048, "epoch": 4253} {"train_loss": -26.397705078125, "global_step": 353049, "epoch": 4253} {"train_loss": -26.285802841186523, "global_step": 353050, "epoch": 4253} {"train_loss": -26.52813148498535, "global_step": 353051, "epoch": 4253} {"train_loss": -26.620437622070312, "global_step": 353052, "epoch": 4253} {"train_loss": -26.297027587890625, "global_step": 353053, "epoch": 4253} {"train_loss": -26.1811580657959, "global_step": 353054, "epoch": 4253} {"train_loss": -25.974567413330078, "global_step": 353055, "epoch": 4253} {"train_loss": -26.214635848999023, "global_step": 353056, "epoch": 4253} {"train_loss": -26.121906280517578, "global_step": 353057, "epoch": 4253} {"train_loss": -25.825225830078125, "global_step": 353058, "epoch": 4253} {"train_loss": -26.2336483001709, "global_step": 353059, "epoch": 4253} {"train_loss": -26.14927101135254, "global_step": 353060, "epoch": 4253} {"train_loss": -26.75713539123535, "global_step": 353061, "epoch": 4253} {"train_loss": -26.224531173706055, "global_step": 353062, "epoch": 4253} {"train_loss": -26.059589385986328, "global_step": 353063, "epoch": 4253} {"train_loss": -26.207782745361328, "global_step": 353064, "epoch": 4253} {"train_loss": -26.178741455078125, "global_step": 353065, "epoch": 4253} {"train_loss": -26.4517765045166, "global_step": 353066, "epoch": 4253} {"train_loss": -26.302875518798828, "global_step": 353067, "epoch": 4253} {"train_loss": -25.71932029724121, "global_step": 353068, "epoch": 4253} {"train_loss": -26.09917640686035, "global_step": 353069, "epoch": 4253} {"train_loss": -26.221235275268555, "global_step": 353070, "epoch": 4253} {"train_loss": -26.348424911499023, "global_step": 353071, "epoch": 4253} {"train_loss": -25.8499755859375, "global_step": 353072, "epoch": 4253} {"train_loss": -26.427167892456055, "global_step": 353073, "epoch": 4253} {"train_loss": -26.447729110717773, "global_step": 353074, "epoch": 4253} {"train_loss": -26.4350528717041, "global_step": 353075, "epoch": 4253} {"train_loss": -26.457111358642578, "global_step": 353076, "epoch": 4253} {"train_loss": -26.00362205505371, "global_step": 353077, "epoch": 4253} {"train_loss": -25.878387451171875, "global_step": 353078, "epoch": 4253} {"train_loss": -26.047012329101562, "global_step": 353079, "epoch": 4253} {"train_loss": -25.46906852722168, "global_step": 353080, "epoch": 4253} {"train_loss": -26.1294323565012, "global_step": 353081, "epoch": 4253, "val_loss": 6915081.0} {"train_loss": -25.051359176635742, "global_step": 353082, "epoch": 4254} {"train_loss": -25.113346099853516, "global_step": 353083, "epoch": 4254} {"train_loss": -24.73731803894043, "global_step": 353084, "epoch": 4254} {"train_loss": -24.32733917236328, "global_step": 353085, "epoch": 4254} {"train_loss": -24.930492401123047, "global_step": 353086, "epoch": 4254} {"train_loss": -25.67724609375, "global_step": 353087, "epoch": 4254} {"train_loss": -25.092132568359375, "global_step": 353088, "epoch": 4254} {"train_loss": -25.342111587524414, "global_step": 353089, "epoch": 4254} {"train_loss": -24.94303321838379, "global_step": 353090, "epoch": 4254} {"train_loss": -24.591405868530273, "global_step": 353091, "epoch": 4254} {"train_loss": -25.216184616088867, "global_step": 353092, "epoch": 4254} {"train_loss": -25.45582389831543, "global_step": 353093, "epoch": 4254} {"train_loss": -25.261505126953125, "global_step": 353094, "epoch": 4254} {"train_loss": -25.343557357788086, "global_step": 353095, "epoch": 4254} {"train_loss": -25.04118537902832, "global_step": 353096, "epoch": 4254} {"train_loss": -25.113805770874023, "global_step": 353097, "epoch": 4254} {"train_loss": -25.217145919799805, "global_step": 353098, "epoch": 4254} {"train_loss": -25.108854293823242, "global_step": 353099, "epoch": 4254} {"train_loss": -25.28071403503418, "global_step": 353100, "epoch": 4254} {"train_loss": -25.459205627441406, "global_step": 353101, "epoch": 4254} {"train_loss": -25.550830841064453, "global_step": 353102, "epoch": 4254} {"train_loss": -25.49861717224121, "global_step": 353103, "epoch": 4254} {"train_loss": -25.6917667388916, "global_step": 353104, "epoch": 4254} {"train_loss": -25.939289093017578, "global_step": 353105, "epoch": 4254} {"train_loss": -25.351848602294922, "global_step": 353106, "epoch": 4254} {"train_loss": -25.8913631439209, "global_step": 353107, "epoch": 4254} {"train_loss": -25.82440185546875, "global_step": 353108, "epoch": 4254} {"train_loss": -25.518224716186523, "global_step": 353109, "epoch": 4254} {"train_loss": -25.708209991455078, "global_step": 353110, "epoch": 4254} {"train_loss": -25.926166534423828, "global_step": 353111, "epoch": 4254} {"train_loss": -25.96284294128418, "global_step": 353112, "epoch": 4254} {"train_loss": -25.753442764282227, "global_step": 353113, "epoch": 4254} {"train_loss": -25.7349796295166, "global_step": 353114, "epoch": 4254} {"train_loss": -25.862524032592773, "global_step": 353115, "epoch": 4254} {"train_loss": -25.944202423095703, "global_step": 353116, "epoch": 4254} {"train_loss": -25.88861656188965, "global_step": 353117, "epoch": 4254} {"train_loss": -26.087848663330078, "global_step": 353118, "epoch": 4254} {"train_loss": -25.957916259765625, "global_step": 353119, "epoch": 4254} {"train_loss": -26.237369537353516, "global_step": 353120, "epoch": 4254} {"train_loss": -25.575992584228516, "global_step": 353121, "epoch": 4254} {"train_loss": -25.816659927368164, "global_step": 353122, "epoch": 4254} {"train_loss": -26.154027938842773, "global_step": 353123, "epoch": 4254} {"train_loss": -26.080808639526367, "global_step": 353124, "epoch": 4254} {"train_loss": -25.926040649414062, "global_step": 353125, "epoch": 4254} {"train_loss": -26.147069931030273, "global_step": 353126, "epoch": 4254} {"train_loss": -26.52254295349121, "global_step": 353127, "epoch": 4254} {"train_loss": -26.096052169799805, "global_step": 353128, "epoch": 4254} {"train_loss": -26.095808029174805, "global_step": 353129, "epoch": 4254} {"train_loss": -26.30012321472168, "global_step": 353130, "epoch": 4254} {"train_loss": -26.165369033813477, "global_step": 353131, "epoch": 4254} {"train_loss": -26.20530128479004, "global_step": 353132, "epoch": 4254} {"train_loss": -26.40325355529785, "global_step": 353133, "epoch": 4254} {"train_loss": -26.040180206298828, "global_step": 353134, "epoch": 4254} {"train_loss": -26.331701278686523, "global_step": 353135, "epoch": 4254} {"train_loss": -26.3548526763916, "global_step": 353136, "epoch": 4254} {"train_loss": -26.015295028686523, "global_step": 353137, "epoch": 4254} {"train_loss": -26.150409698486328, "global_step": 353138, "epoch": 4254} {"train_loss": -26.59181022644043, "global_step": 353139, "epoch": 4254} {"train_loss": -26.334375381469727, "global_step": 353140, "epoch": 4254} {"train_loss": -26.10272216796875, "global_step": 353141, "epoch": 4254} {"train_loss": -26.5748291015625, "global_step": 353142, "epoch": 4254} {"train_loss": -26.17819595336914, "global_step": 353143, "epoch": 4254} {"train_loss": -25.905364990234375, "global_step": 353144, "epoch": 4254} {"train_loss": -26.308378219604492, "global_step": 353145, "epoch": 4254} {"train_loss": -26.265661239624023, "global_step": 353146, "epoch": 4254} {"train_loss": -26.163745880126953, "global_step": 353147, "epoch": 4254} {"train_loss": -26.35910987854004, "global_step": 353148, "epoch": 4254} {"train_loss": -25.979459762573242, "global_step": 353149, "epoch": 4254} {"train_loss": -25.7219181060791, "global_step": 353150, "epoch": 4254} {"train_loss": -25.903478622436523, "global_step": 353151, "epoch": 4254} {"train_loss": -26.611068725585938, "global_step": 353152, "epoch": 4254} {"train_loss": -26.621845245361328, "global_step": 353153, "epoch": 4254} {"train_loss": -26.199182510375977, "global_step": 353154, "epoch": 4254} {"train_loss": -26.186767578125, "global_step": 353155, "epoch": 4254} {"train_loss": -26.243255615234375, "global_step": 353156, "epoch": 4254} {"train_loss": -26.19208335876465, "global_step": 353157, "epoch": 4254} {"train_loss": -26.15468406677246, "global_step": 353158, "epoch": 4254} {"train_loss": -26.68195152282715, "global_step": 353159, "epoch": 4254} {"train_loss": -26.503040313720703, "global_step": 353160, "epoch": 4254} {"train_loss": -26.292905807495117, "global_step": 353161, "epoch": 4254} {"train_loss": -26.234088897705078, "global_step": 353162, "epoch": 4254} {"train_loss": -26.633020401000977, "global_step": 353163, "epoch": 4254} {"train_loss": -25.87210905695536, "global_step": 353164, "epoch": 4254, "val_loss": 6808091.0} {"train_loss": -25.935251235961914, "global_step": 353165, "epoch": 4255} {"train_loss": -25.675628662109375, "global_step": 353166, "epoch": 4255} {"train_loss": -26.02302360534668, "global_step": 353167, "epoch": 4255} {"train_loss": -25.752843856811523, "global_step": 353168, "epoch": 4255} {"train_loss": -25.9239501953125, "global_step": 353169, "epoch": 4255} {"train_loss": -25.864765167236328, "global_step": 353170, "epoch": 4255} {"train_loss": -25.867300033569336, "global_step": 353171, "epoch": 4255} {"train_loss": -25.909912109375, "global_step": 353172, "epoch": 4255} {"train_loss": -25.796110153198242, "global_step": 353173, "epoch": 4255} {"train_loss": -25.761260986328125, "global_step": 353174, "epoch": 4255} {"train_loss": -26.119979858398438, "global_step": 353175, "epoch": 4255} {"train_loss": -25.933618545532227, "global_step": 353176, "epoch": 4255} {"train_loss": -26.04718017578125, "global_step": 353177, "epoch": 4255} {"train_loss": -25.5808162689209, "global_step": 353178, "epoch": 4255} {"train_loss": -25.67791175842285, "global_step": 353179, "epoch": 4255} {"train_loss": -25.825231552124023, "global_step": 353180, "epoch": 4255} {"train_loss": -25.5320987701416, "global_step": 353181, "epoch": 4255} {"train_loss": -25.82185173034668, "global_step": 353182, "epoch": 4255} {"train_loss": -25.838123321533203, "global_step": 353183, "epoch": 4255} {"train_loss": -25.93134117126465, "global_step": 353184, "epoch": 4255} {"train_loss": -26.34446144104004, "global_step": 353185, "epoch": 4255} {"train_loss": -26.037967681884766, "global_step": 353186, "epoch": 4255} {"train_loss": -25.91779899597168, "global_step": 353187, "epoch": 4255} {"train_loss": -25.956928253173828, "global_step": 353188, "epoch": 4255} {"train_loss": -25.9750919342041, "global_step": 353189, "epoch": 4255} {"train_loss": -26.450927734375, "global_step": 353190, "epoch": 4255} {"train_loss": -26.250274658203125, "global_step": 353191, "epoch": 4255} {"train_loss": -26.217206954956055, "global_step": 353192, "epoch": 4255} {"train_loss": -26.3477840423584, "global_step": 353193, "epoch": 4255} {"train_loss": -26.138288497924805, "global_step": 353194, "epoch": 4255} {"train_loss": -26.10888671875, "global_step": 353195, "epoch": 4255} {"train_loss": -26.02109146118164, "global_step": 353196, "epoch": 4255} {"train_loss": -26.541181564331055, "global_step": 353197, "epoch": 4255} {"train_loss": -26.22771644592285, "global_step": 353198, "epoch": 4255} {"train_loss": -26.660511016845703, "global_step": 353199, "epoch": 4255} {"train_loss": -26.267805099487305, "global_step": 353200, "epoch": 4255} {"train_loss": -26.15886878967285, "global_step": 353201, "epoch": 4255} {"train_loss": -26.11908531188965, "global_step": 353202, "epoch": 4255} {"train_loss": -26.480243682861328, "global_step": 353203, "epoch": 4255} {"train_loss": -26.3920955657959, "global_step": 353204, "epoch": 4255} {"train_loss": -26.253705978393555, "global_step": 353205, "epoch": 4255} {"train_loss": -26.062198638916016, "global_step": 353206, "epoch": 4255} {"train_loss": -26.165699005126953, "global_step": 353207, "epoch": 4255} {"train_loss": -26.23321533203125, "global_step": 353208, "epoch": 4255} {"train_loss": -26.326465606689453, "global_step": 353209, "epoch": 4255} {"train_loss": -26.181533813476562, "global_step": 353210, "epoch": 4255} {"train_loss": -26.714258193969727, "global_step": 353211, "epoch": 4255} {"train_loss": -26.30196189880371, "global_step": 353212, "epoch": 4255} {"train_loss": -26.04109001159668, "global_step": 353213, "epoch": 4255} {"train_loss": -26.293323516845703, "global_step": 353214, "epoch": 4255} {"train_loss": -26.483779907226562, "global_step": 353215, "epoch": 4255} {"train_loss": -26.41261100769043, "global_step": 353216, "epoch": 4255} {"train_loss": -26.815305709838867, "global_step": 353217, "epoch": 4255} {"train_loss": -25.828229904174805, "global_step": 353218, "epoch": 4255} {"train_loss": -26.55706214904785, "global_step": 353219, "epoch": 4255} {"train_loss": -26.06122398376465, "global_step": 353220, "epoch": 4255} {"train_loss": -26.188581466674805, "global_step": 353221, "epoch": 4255} {"train_loss": -25.823511123657227, "global_step": 353222, "epoch": 4255} {"train_loss": -25.849340438842773, "global_step": 353223, "epoch": 4255} {"train_loss": -26.1383113861084, "global_step": 353224, "epoch": 4255} {"train_loss": -25.73516845703125, "global_step": 353225, "epoch": 4255} {"train_loss": -24.984588623046875, "global_step": 353226, "epoch": 4255} {"train_loss": -25.116788864135742, "global_step": 353227, "epoch": 4255} {"train_loss": -25.83919334411621, "global_step": 353228, "epoch": 4255} {"train_loss": -26.262939453125, "global_step": 353229, "epoch": 4255} {"train_loss": -25.826068878173828, "global_step": 353230, "epoch": 4255} {"train_loss": -25.838134765625, "global_step": 353231, "epoch": 4255} {"train_loss": -25.956811904907227, "global_step": 353232, "epoch": 4255} {"train_loss": -25.873931884765625, "global_step": 353233, "epoch": 4255} {"train_loss": -25.972808837890625, "global_step": 353234, "epoch": 4255} {"train_loss": -25.857030868530273, "global_step": 353235, "epoch": 4255} {"train_loss": -26.231470108032227, "global_step": 353236, "epoch": 4255} {"train_loss": -25.860000610351562, "global_step": 353237, "epoch": 4255} {"train_loss": -25.881134033203125, "global_step": 353238, "epoch": 4255} {"train_loss": -25.923120498657227, "global_step": 353239, "epoch": 4255} {"train_loss": -25.790771484375, "global_step": 353240, "epoch": 4255} {"train_loss": -25.74239158630371, "global_step": 353241, "epoch": 4255} {"train_loss": -25.894498825073242, "global_step": 353242, "epoch": 4255} {"train_loss": -26.192373275756836, "global_step": 353243, "epoch": 4255} {"train_loss": -25.748083114624023, "global_step": 353244, "epoch": 4255} {"train_loss": -25.877105712890625, "global_step": 353245, "epoch": 4255} {"train_loss": -26.09981346130371, "global_step": 353246, "epoch": 4255} {"train_loss": -26.03057964738593, "global_step": 353247, "epoch": 4255, "val_loss": 6824486.0} {"train_loss": -26.158445358276367, "global_step": 353248, "epoch": 4256} {"train_loss": -25.71821403503418, "global_step": 353249, "epoch": 4256} {"train_loss": -25.833663940429688, "global_step": 353250, "epoch": 4256} {"train_loss": -26.03468132019043, "global_step": 353251, "epoch": 4256} {"train_loss": -25.790851593017578, "global_step": 353252, "epoch": 4256} {"train_loss": -25.953657150268555, "global_step": 353253, "epoch": 4256} {"train_loss": -25.728235244750977, "global_step": 353254, "epoch": 4256} {"train_loss": -25.972339630126953, "global_step": 353255, "epoch": 4256} {"train_loss": -26.387409210205078, "global_step": 353256, "epoch": 4256} {"train_loss": -26.3111572265625, "global_step": 353257, "epoch": 4256} {"train_loss": -26.0336971282959, "global_step": 353258, "epoch": 4256} {"train_loss": -26.350250244140625, "global_step": 353259, "epoch": 4256} {"train_loss": -26.31683349609375, "global_step": 353260, "epoch": 4256} {"train_loss": -26.44329833984375, "global_step": 353261, "epoch": 4256} {"train_loss": -26.062353134155273, "global_step": 353262, "epoch": 4256} {"train_loss": -26.373462677001953, "global_step": 353263, "epoch": 4256} {"train_loss": -25.956893920898438, "global_step": 353264, "epoch": 4256} {"train_loss": -26.15213394165039, "global_step": 353265, "epoch": 4256} {"train_loss": -26.295059204101562, "global_step": 353266, "epoch": 4256} {"train_loss": -25.908863067626953, "global_step": 353267, "epoch": 4256} {"train_loss": -26.279699325561523, "global_step": 353268, "epoch": 4256} {"train_loss": -26.40630531311035, "global_step": 353269, "epoch": 4256} {"train_loss": -25.64938735961914, "global_step": 353270, "epoch": 4256} {"train_loss": -26.237323760986328, "global_step": 353271, "epoch": 4256} {"train_loss": -26.450946807861328, "global_step": 353272, "epoch": 4256} {"train_loss": -25.928049087524414, "global_step": 353273, "epoch": 4256} {"train_loss": -26.284143447875977, "global_step": 353274, "epoch": 4256} {"train_loss": -25.95762062072754, "global_step": 353275, "epoch": 4256} {"train_loss": -25.8670597076416, "global_step": 353276, "epoch": 4256} {"train_loss": -26.45393943786621, "global_step": 353277, "epoch": 4256} {"train_loss": -26.352827072143555, "global_step": 353278, "epoch": 4256} {"train_loss": -25.835901260375977, "global_step": 353279, "epoch": 4256} {"train_loss": -26.379791259765625, "global_step": 353280, "epoch": 4256} {"train_loss": -25.9871826171875, "global_step": 353281, "epoch": 4256} {"train_loss": -26.48545265197754, "global_step": 353282, "epoch": 4256} {"train_loss": -26.383813858032227, "global_step": 353283, "epoch": 4256} {"train_loss": -26.0382080078125, "global_step": 353284, "epoch": 4256} {"train_loss": -26.574813842773438, "global_step": 353285, "epoch": 4256} {"train_loss": -26.393482208251953, "global_step": 353286, "epoch": 4256} {"train_loss": -26.46417236328125, "global_step": 353287, "epoch": 4256} {"train_loss": -26.529010772705078, "global_step": 353288, "epoch": 4256} {"train_loss": -26.120838165283203, "global_step": 353289, "epoch": 4256} {"train_loss": -26.372577667236328, "global_step": 353290, "epoch": 4256} {"train_loss": -26.313251495361328, "global_step": 353291, "epoch": 4256} {"train_loss": -26.296186447143555, "global_step": 353292, "epoch": 4256} {"train_loss": -26.275442123413086, "global_step": 353293, "epoch": 4256} {"train_loss": -26.4552059173584, "global_step": 353294, "epoch": 4256} {"train_loss": -26.197708129882812, "global_step": 353295, "epoch": 4256} {"train_loss": -26.16388511657715, "global_step": 353296, "epoch": 4256} {"train_loss": -26.678272247314453, "global_step": 353297, "epoch": 4256} {"train_loss": -26.130231857299805, "global_step": 353298, "epoch": 4256} {"train_loss": -26.02618408203125, "global_step": 353299, "epoch": 4256} {"train_loss": -25.958465576171875, "global_step": 353300, "epoch": 4256} {"train_loss": -26.199270248413086, "global_step": 353301, "epoch": 4256} {"train_loss": -25.91074562072754, "global_step": 353302, "epoch": 4256} {"train_loss": -26.165979385375977, "global_step": 353303, "epoch": 4256} {"train_loss": -26.368249893188477, "global_step": 353304, "epoch": 4256} {"train_loss": -26.088653564453125, "global_step": 353305, "epoch": 4256} {"train_loss": -25.840906143188477, "global_step": 353306, "epoch": 4256} {"train_loss": -25.860090255737305, "global_step": 353307, "epoch": 4256} {"train_loss": -26.0174617767334, "global_step": 353308, "epoch": 4256} {"train_loss": -26.532384872436523, "global_step": 353309, "epoch": 4256} {"train_loss": -26.132551193237305, "global_step": 353310, "epoch": 4256} {"train_loss": -26.081619262695312, "global_step": 353311, "epoch": 4256} {"train_loss": -25.794300079345703, "global_step": 353312, "epoch": 4256} {"train_loss": -26.564483642578125, "global_step": 353313, "epoch": 4256} {"train_loss": -26.2205867767334, "global_step": 353314, "epoch": 4256} {"train_loss": -25.859838485717773, "global_step": 353315, "epoch": 4256} {"train_loss": -26.189489364624023, "global_step": 353316, "epoch": 4256} {"train_loss": -26.041818618774414, "global_step": 353317, "epoch": 4256} {"train_loss": -26.194583892822266, "global_step": 353318, "epoch": 4256} {"train_loss": -26.143634796142578, "global_step": 353319, "epoch": 4256} {"train_loss": -25.854736328125, "global_step": 353320, "epoch": 4256} {"train_loss": -25.889636993408203, "global_step": 353321, "epoch": 4256} {"train_loss": -26.40936279296875, "global_step": 353322, "epoch": 4256} {"train_loss": -26.232030868530273, "global_step": 353323, "epoch": 4256} {"train_loss": -26.167150497436523, "global_step": 353324, "epoch": 4256} {"train_loss": -26.3784236907959, "global_step": 353325, "epoch": 4256} {"train_loss": -26.418827056884766, "global_step": 353326, "epoch": 4256} {"train_loss": -26.037145614624023, "global_step": 353327, "epoch": 4256} {"train_loss": -26.036054611206055, "global_step": 353328, "epoch": 4256} {"train_loss": -25.761474609375, "global_step": 353329, "epoch": 4256} {"train_loss": -26.166422832443054, "global_step": 353330, "epoch": 4256, "val_loss": 6747263.0} {"train_loss": -25.744678497314453, "global_step": 353331, "epoch": 4257} {"train_loss": -26.04366111755371, "global_step": 353332, "epoch": 4257} {"train_loss": -25.460899353027344, "global_step": 353333, "epoch": 4257} {"train_loss": -25.20036506652832, "global_step": 353334, "epoch": 4257} {"train_loss": -25.93413734436035, "global_step": 353335, "epoch": 4257} {"train_loss": -25.897403717041016, "global_step": 353336, "epoch": 4257} {"train_loss": -25.990814208984375, "global_step": 353337, "epoch": 4257} {"train_loss": -25.786996841430664, "global_step": 353338, "epoch": 4257} {"train_loss": -25.56619644165039, "global_step": 353339, "epoch": 4257} {"train_loss": -25.85724449157715, "global_step": 353340, "epoch": 4257} {"train_loss": -25.840829849243164, "global_step": 353341, "epoch": 4257} {"train_loss": -25.885175704956055, "global_step": 353342, "epoch": 4257} {"train_loss": -26.12152671813965, "global_step": 353343, "epoch": 4257} {"train_loss": -25.87105369567871, "global_step": 353344, "epoch": 4257} {"train_loss": -26.131635665893555, "global_step": 353345, "epoch": 4257} {"train_loss": -26.02189064025879, "global_step": 353346, "epoch": 4257} {"train_loss": -25.669340133666992, "global_step": 353347, "epoch": 4257} {"train_loss": -25.966144561767578, "global_step": 353348, "epoch": 4257} {"train_loss": -26.1394100189209, "global_step": 353349, "epoch": 4257} {"train_loss": -26.122350692749023, "global_step": 353350, "epoch": 4257} {"train_loss": -26.279138565063477, "global_step": 353351, "epoch": 4257} {"train_loss": -25.774322509765625, "global_step": 353352, "epoch": 4257} {"train_loss": -26.24237632751465, "global_step": 353353, "epoch": 4257} {"train_loss": -26.27789306640625, "global_step": 353354, "epoch": 4257} {"train_loss": -26.03387451171875, "global_step": 353355, "epoch": 4257} {"train_loss": -26.03240966796875, "global_step": 353356, "epoch": 4257} {"train_loss": -25.901342391967773, "global_step": 353357, "epoch": 4257} {"train_loss": -26.122028350830078, "global_step": 353358, "epoch": 4257} {"train_loss": -26.377378463745117, "global_step": 353359, "epoch": 4257} {"train_loss": -26.203699111938477, "global_step": 353360, "epoch": 4257} {"train_loss": -26.251306533813477, "global_step": 353361, "epoch": 4257} {"train_loss": -26.28742790222168, "global_step": 353362, "epoch": 4257} {"train_loss": -26.055349349975586, "global_step": 353363, "epoch": 4257} {"train_loss": -26.11517906188965, "global_step": 353364, "epoch": 4257} {"train_loss": -26.32159423828125, "global_step": 353365, "epoch": 4257} {"train_loss": -26.23725700378418, "global_step": 353366, "epoch": 4257} {"train_loss": -26.12147331237793, "global_step": 353367, "epoch": 4257} {"train_loss": -26.261005401611328, "global_step": 353368, "epoch": 4257} {"train_loss": -26.162830352783203, "global_step": 353369, "epoch": 4257} {"train_loss": -26.120258331298828, "global_step": 353370, "epoch": 4257} {"train_loss": -26.07413673400879, "global_step": 353371, "epoch": 4257} {"train_loss": -25.739133834838867, "global_step": 353372, "epoch": 4257} {"train_loss": -24.955795288085938, "global_step": 353373, "epoch": 4257} {"train_loss": -24.779987335205078, "global_step": 353374, "epoch": 4257} {"train_loss": -26.259557723999023, "global_step": 353375, "epoch": 4257} {"train_loss": -26.0950927734375, "global_step": 353376, "epoch": 4257} {"train_loss": -25.76124382019043, "global_step": 353377, "epoch": 4257} {"train_loss": -25.741315841674805, "global_step": 353378, "epoch": 4257} {"train_loss": -25.700916290283203, "global_step": 353379, "epoch": 4257} {"train_loss": -25.738574981689453, "global_step": 353380, "epoch": 4257} {"train_loss": -26.258203506469727, "global_step": 353381, "epoch": 4257} {"train_loss": -26.018524169921875, "global_step": 353382, "epoch": 4257} {"train_loss": -26.251367568969727, "global_step": 353383, "epoch": 4257} {"train_loss": -25.813024520874023, "global_step": 353384, "epoch": 4257} {"train_loss": -26.17317008972168, "global_step": 353385, "epoch": 4257} {"train_loss": -25.992712020874023, "global_step": 353386, "epoch": 4257} {"train_loss": -25.839889526367188, "global_step": 353387, "epoch": 4257} {"train_loss": -26.19223403930664, "global_step": 353388, "epoch": 4257} {"train_loss": -25.99142837524414, "global_step": 353389, "epoch": 4257} {"train_loss": -25.934284210205078, "global_step": 353390, "epoch": 4257} {"train_loss": -25.97616958618164, "global_step": 353391, "epoch": 4257} {"train_loss": -25.869831085205078, "global_step": 353392, "epoch": 4257} {"train_loss": -26.52613639831543, "global_step": 353393, "epoch": 4257} {"train_loss": -26.1179256439209, "global_step": 353394, "epoch": 4257} {"train_loss": -26.09659194946289, "global_step": 353395, "epoch": 4257} {"train_loss": -26.107177734375, "global_step": 353396, "epoch": 4257} {"train_loss": -25.958133697509766, "global_step": 353397, "epoch": 4257} {"train_loss": -26.061267852783203, "global_step": 353398, "epoch": 4257} {"train_loss": -26.084524154663086, "global_step": 353399, "epoch": 4257} {"train_loss": -26.275272369384766, "global_step": 353400, "epoch": 4257} {"train_loss": -26.29975700378418, "global_step": 353401, "epoch": 4257} {"train_loss": -26.47382926940918, "global_step": 353402, "epoch": 4257} {"train_loss": -25.938566207885742, "global_step": 353403, "epoch": 4257} {"train_loss": -26.464603424072266, "global_step": 353404, "epoch": 4257} {"train_loss": -26.452234268188477, "global_step": 353405, "epoch": 4257} {"train_loss": -26.249963760375977, "global_step": 353406, "epoch": 4257} {"train_loss": -25.920974731445312, "global_step": 353407, "epoch": 4257} {"train_loss": -26.68072509765625, "global_step": 353408, "epoch": 4257} {"train_loss": -26.223163604736328, "global_step": 353409, "epoch": 4257} {"train_loss": -26.1326961517334, "global_step": 353410, "epoch": 4257} {"train_loss": -26.14023208618164, "global_step": 353411, "epoch": 4257} {"train_loss": -26.200672149658203, "global_step": 353412, "epoch": 4257} {"train_loss": -26.03156475848462, "global_step": 353413, "epoch": 4257, "val_loss": 6714227.0} {"train_loss": -26.17095375061035, "global_step": 353414, "epoch": 4258} {"train_loss": -25.616174697875977, "global_step": 353415, "epoch": 4258} {"train_loss": -25.8409481048584, "global_step": 353416, "epoch": 4258} {"train_loss": -25.611572265625, "global_step": 353417, "epoch": 4258} {"train_loss": -25.81255531311035, "global_step": 353418, "epoch": 4258} {"train_loss": -25.969919204711914, "global_step": 353419, "epoch": 4258} {"train_loss": -26.35370445251465, "global_step": 353420, "epoch": 4258} {"train_loss": -25.834552764892578, "global_step": 353421, "epoch": 4258} {"train_loss": -25.766071319580078, "global_step": 353422, "epoch": 4258} {"train_loss": -26.141845703125, "global_step": 353423, "epoch": 4258} {"train_loss": -26.346288681030273, "global_step": 353424, "epoch": 4258} {"train_loss": -25.683917999267578, "global_step": 353425, "epoch": 4258} {"train_loss": -26.169767379760742, "global_step": 353426, "epoch": 4258} {"train_loss": -25.9128475189209, "global_step": 353427, "epoch": 4258} {"train_loss": -26.431608200073242, "global_step": 353428, "epoch": 4258} {"train_loss": -26.050161361694336, "global_step": 353429, "epoch": 4258} {"train_loss": -26.20331382751465, "global_step": 353430, "epoch": 4258} {"train_loss": -25.850019454956055, "global_step": 353431, "epoch": 4258} {"train_loss": -26.022266387939453, "global_step": 353432, "epoch": 4258} {"train_loss": -26.056781768798828, "global_step": 353433, "epoch": 4258} {"train_loss": -25.809446334838867, "global_step": 353434, "epoch": 4258} {"train_loss": -25.994064331054688, "global_step": 353435, "epoch": 4258} {"train_loss": -26.0162296295166, "global_step": 353436, "epoch": 4258} {"train_loss": -26.691314697265625, "global_step": 353437, "epoch": 4258} {"train_loss": -25.962305068969727, "global_step": 353438, "epoch": 4258} {"train_loss": -26.041913986206055, "global_step": 353439, "epoch": 4258} {"train_loss": -26.361785888671875, "global_step": 353440, "epoch": 4258} {"train_loss": -26.1779727935791, "global_step": 353441, "epoch": 4258} {"train_loss": -26.00298500061035, "global_step": 353442, "epoch": 4258} {"train_loss": -26.183364868164062, "global_step": 353443, "epoch": 4258} {"train_loss": -26.44187355041504, "global_step": 353444, "epoch": 4258} {"train_loss": -26.067020416259766, "global_step": 353445, "epoch": 4258} {"train_loss": -25.9896297454834, "global_step": 353446, "epoch": 4258} {"train_loss": -26.073230743408203, "global_step": 353447, "epoch": 4258} {"train_loss": -25.925724029541016, "global_step": 353448, "epoch": 4258} {"train_loss": -25.670654296875, "global_step": 353449, "epoch": 4258} {"train_loss": -26.105756759643555, "global_step": 353450, "epoch": 4258} {"train_loss": -26.164844512939453, "global_step": 353451, "epoch": 4258} {"train_loss": -25.907032012939453, "global_step": 353452, "epoch": 4258} {"train_loss": -26.479267120361328, "global_step": 353453, "epoch": 4258} {"train_loss": -26.258651733398438, "global_step": 353454, "epoch": 4258} {"train_loss": -26.118677139282227, "global_step": 353455, "epoch": 4258} {"train_loss": -26.064817428588867, "global_step": 353456, "epoch": 4258} {"train_loss": -26.072357177734375, "global_step": 353457, "epoch": 4258} {"train_loss": -26.04365348815918, "global_step": 353458, "epoch": 4258} {"train_loss": -26.5159969329834, "global_step": 353459, "epoch": 4258} {"train_loss": -26.4665584564209, "global_step": 353460, "epoch": 4258} {"train_loss": -25.92380714416504, "global_step": 353461, "epoch": 4258} {"train_loss": -26.343341827392578, "global_step": 353462, "epoch": 4258} {"train_loss": -26.122161865234375, "global_step": 353463, "epoch": 4258} {"train_loss": -26.258996963500977, "global_step": 353464, "epoch": 4258} {"train_loss": -26.472461700439453, "global_step": 353465, "epoch": 4258} {"train_loss": -26.431299209594727, "global_step": 353466, "epoch": 4258} {"train_loss": -26.2450008392334, "global_step": 353467, "epoch": 4258} {"train_loss": -26.5507869720459, "global_step": 353468, "epoch": 4258} {"train_loss": -26.59490394592285, "global_step": 353469, "epoch": 4258} {"train_loss": -26.391128540039062, "global_step": 353470, "epoch": 4258} {"train_loss": -26.262741088867188, "global_step": 353471, "epoch": 4258} {"train_loss": -26.40252113342285, "global_step": 353472, "epoch": 4258} {"train_loss": -26.253116607666016, "global_step": 353473, "epoch": 4258} {"train_loss": -26.087308883666992, "global_step": 353474, "epoch": 4258} {"train_loss": -26.591705322265625, "global_step": 353475, "epoch": 4258} {"train_loss": -26.347265243530273, "global_step": 353476, "epoch": 4258} {"train_loss": -26.329822540283203, "global_step": 353477, "epoch": 4258} {"train_loss": -26.432952880859375, "global_step": 353478, "epoch": 4258} {"train_loss": -26.379159927368164, "global_step": 353479, "epoch": 4258} {"train_loss": -26.137439727783203, "global_step": 353480, "epoch": 4258} {"train_loss": -26.440649032592773, "global_step": 353481, "epoch": 4258} {"train_loss": -26.182615280151367, "global_step": 353482, "epoch": 4258} {"train_loss": -26.7265682220459, "global_step": 353483, "epoch": 4258} {"train_loss": -26.11981201171875, "global_step": 353484, "epoch": 4258} {"train_loss": -26.207334518432617, "global_step": 353485, "epoch": 4258} {"train_loss": -25.72562026977539, "global_step": 353486, "epoch": 4258} {"train_loss": -26.000076293945312, "global_step": 353487, "epoch": 4258} {"train_loss": -25.5296573638916, "global_step": 353488, "epoch": 4258} {"train_loss": -26.090957641601562, "global_step": 353489, "epoch": 4258} {"train_loss": -26.031436920166016, "global_step": 353490, "epoch": 4258} {"train_loss": -25.901840209960938, "global_step": 353491, "epoch": 4258} {"train_loss": -26.109699249267578, "global_step": 353492, "epoch": 4258} {"train_loss": -25.809240341186523, "global_step": 353493, "epoch": 4258} {"train_loss": -26.369787216186523, "global_step": 353494, "epoch": 4258} {"train_loss": -25.71840476989746, "global_step": 353495, "epoch": 4258} {"train_loss": -26.1321253489299, "global_step": 353496, "epoch": 4258, "val_loss": 6714316.0} {"train_loss": -25.425539016723633, "global_step": 353497, "epoch": 4259} {"train_loss": -25.50039291381836, "global_step": 353498, "epoch": 4259} {"train_loss": -25.772008895874023, "global_step": 353499, "epoch": 4259} {"train_loss": -25.408926010131836, "global_step": 353500, "epoch": 4259} {"train_loss": -26.076013565063477, "global_step": 353501, "epoch": 4259} {"train_loss": -25.396657943725586, "global_step": 353502, "epoch": 4259} {"train_loss": -25.556058883666992, "global_step": 353503, "epoch": 4259} {"train_loss": -25.804418563842773, "global_step": 353504, "epoch": 4259} {"train_loss": -26.052061080932617, "global_step": 353505, "epoch": 4259} {"train_loss": -25.660785675048828, "global_step": 353506, "epoch": 4259} {"train_loss": -25.94282341003418, "global_step": 353507, "epoch": 4259} {"train_loss": -26.00397300720215, "global_step": 353508, "epoch": 4259} {"train_loss": -25.817657470703125, "global_step": 353509, "epoch": 4259} {"train_loss": -25.6466064453125, "global_step": 353510, "epoch": 4259} {"train_loss": -25.94333839416504, "global_step": 353511, "epoch": 4259} {"train_loss": -25.814014434814453, "global_step": 353512, "epoch": 4259} {"train_loss": -25.774768829345703, "global_step": 353513, "epoch": 4259} {"train_loss": -25.610563278198242, "global_step": 353514, "epoch": 4259} {"train_loss": -25.811172485351562, "global_step": 353515, "epoch": 4259} {"train_loss": -26.293441772460938, "global_step": 353516, "epoch": 4259} {"train_loss": -25.921295166015625, "global_step": 353517, "epoch": 4259} {"train_loss": -25.69122314453125, "global_step": 353518, "epoch": 4259} {"train_loss": -26.086877822875977, "global_step": 353519, "epoch": 4259} {"train_loss": -26.132953643798828, "global_step": 353520, "epoch": 4259} {"train_loss": -26.398584365844727, "global_step": 353521, "epoch": 4259} {"train_loss": -25.915027618408203, "global_step": 353522, "epoch": 4259} {"train_loss": -26.0638484954834, "global_step": 353523, "epoch": 4259} {"train_loss": -26.31635093688965, "global_step": 353524, "epoch": 4259} {"train_loss": -26.151227951049805, "global_step": 353525, "epoch": 4259} {"train_loss": -26.1146297454834, "global_step": 353526, "epoch": 4259} {"train_loss": -26.212438583374023, "global_step": 353527, "epoch": 4259} {"train_loss": -26.244327545166016, "global_step": 353528, "epoch": 4259} {"train_loss": -26.305707931518555, "global_step": 353529, "epoch": 4259} {"train_loss": -26.141759872436523, "global_step": 353530, "epoch": 4259} {"train_loss": -26.19434928894043, "global_step": 353531, "epoch": 4259} {"train_loss": -26.044326782226562, "global_step": 353532, "epoch": 4259} {"train_loss": -25.918615341186523, "global_step": 353533, "epoch": 4259} {"train_loss": -26.134443283081055, "global_step": 353534, "epoch": 4259} {"train_loss": -26.175352096557617, "global_step": 353535, "epoch": 4259} {"train_loss": -26.304712295532227, "global_step": 353536, "epoch": 4259} {"train_loss": -26.295557022094727, "global_step": 353537, "epoch": 4259} {"train_loss": -26.2443790435791, "global_step": 353538, "epoch": 4259} {"train_loss": -26.240039825439453, "global_step": 353539, "epoch": 4259} {"train_loss": -26.435636520385742, "global_step": 353540, "epoch": 4259} {"train_loss": -26.467695236206055, "global_step": 353541, "epoch": 4259} {"train_loss": -26.472156524658203, "global_step": 353542, "epoch": 4259} {"train_loss": -26.24708366394043, "global_step": 353543, "epoch": 4259} {"train_loss": -26.4843807220459, "global_step": 353544, "epoch": 4259} {"train_loss": -26.355880737304688, "global_step": 353545, "epoch": 4259} {"train_loss": -26.347766876220703, "global_step": 353546, "epoch": 4259} {"train_loss": -26.517255783081055, "global_step": 353547, "epoch": 4259} {"train_loss": -26.529052734375, "global_step": 353548, "epoch": 4259} {"train_loss": -26.20499610900879, "global_step": 353549, "epoch": 4259} {"train_loss": -25.91780662536621, "global_step": 353550, "epoch": 4259} {"train_loss": -25.88178062438965, "global_step": 353551, "epoch": 4259} {"train_loss": -26.207599639892578, "global_step": 353552, "epoch": 4259} {"train_loss": -25.5482120513916, "global_step": 353553, "epoch": 4259} {"train_loss": -25.761457443237305, "global_step": 353554, "epoch": 4259} {"train_loss": -25.85541343688965, "global_step": 353555, "epoch": 4259} {"train_loss": -26.21137046813965, "global_step": 353556, "epoch": 4259} {"train_loss": -26.05523681640625, "global_step": 353557, "epoch": 4259} {"train_loss": -26.037580490112305, "global_step": 353558, "epoch": 4259} {"train_loss": -25.71052360534668, "global_step": 353559, "epoch": 4259} {"train_loss": -25.86762046813965, "global_step": 353560, "epoch": 4259} {"train_loss": -26.193161010742188, "global_step": 353561, "epoch": 4259} {"train_loss": -25.716093063354492, "global_step": 353562, "epoch": 4259} {"train_loss": -25.9820556640625, "global_step": 353563, "epoch": 4259} {"train_loss": -26.275800704956055, "global_step": 353564, "epoch": 4259} {"train_loss": -25.925973892211914, "global_step": 353565, "epoch": 4259} {"train_loss": -25.925113677978516, "global_step": 353566, "epoch": 4259} {"train_loss": -26.049697875976562, "global_step": 353567, "epoch": 4259} {"train_loss": -26.06869888305664, "global_step": 353568, "epoch": 4259} {"train_loss": -26.247058868408203, "global_step": 353569, "epoch": 4259} {"train_loss": -26.29691505432129, "global_step": 353570, "epoch": 4259} {"train_loss": -26.19999122619629, "global_step": 353571, "epoch": 4259} {"train_loss": -25.46366310119629, "global_step": 353572, "epoch": 4259} {"train_loss": -26.041208267211914, "global_step": 353573, "epoch": 4259} {"train_loss": -26.242273330688477, "global_step": 353574, "epoch": 4259} {"train_loss": -25.908111572265625, "global_step": 353575, "epoch": 4259} {"train_loss": -25.782602310180664, "global_step": 353576, "epoch": 4259} {"train_loss": -26.304162979125977, "global_step": 353577, "epoch": 4259} {"train_loss": -26.456989288330078, "global_step": 353578, "epoch": 4259} {"train_loss": -26.042537137686487, "global_step": 353579, "epoch": 4259, "val_loss": 6644571.0} {"train_loss": -25.94287109375, "global_step": 353580, "epoch": 4260} {"train_loss": -25.001760482788086, "global_step": 353581, "epoch": 4260} {"train_loss": -25.91658592224121, "global_step": 353582, "epoch": 4260} {"train_loss": -25.776718139648438, "global_step": 353583, "epoch": 4260} {"train_loss": -25.813190460205078, "global_step": 353584, "epoch": 4260} {"train_loss": -25.7075138092041, "global_step": 353585, "epoch": 4260} {"train_loss": -25.846548080444336, "global_step": 353586, "epoch": 4260} {"train_loss": -26.247802734375, "global_step": 353587, "epoch": 4260} {"train_loss": -25.995542526245117, "global_step": 353588, "epoch": 4260} {"train_loss": -25.975482940673828, "global_step": 353589, "epoch": 4260} {"train_loss": -26.055570602416992, "global_step": 353590, "epoch": 4260} {"train_loss": -25.880176544189453, "global_step": 353591, "epoch": 4260} {"train_loss": -25.977304458618164, "global_step": 353592, "epoch": 4260} {"train_loss": -26.418180465698242, "global_step": 353593, "epoch": 4260} {"train_loss": -25.974699020385742, "global_step": 353594, "epoch": 4260} {"train_loss": -26.26633644104004, "global_step": 353595, "epoch": 4260} {"train_loss": -25.95905876159668, "global_step": 353596, "epoch": 4260} {"train_loss": -26.339338302612305, "global_step": 353597, "epoch": 4260} {"train_loss": -26.335662841796875, "global_step": 353598, "epoch": 4260} {"train_loss": -25.919233322143555, "global_step": 353599, "epoch": 4260} {"train_loss": -26.309598922729492, "global_step": 353600, "epoch": 4260} {"train_loss": -26.5366153717041, "global_step": 353601, "epoch": 4260} {"train_loss": -26.34626579284668, "global_step": 353602, "epoch": 4260} {"train_loss": -26.23097038269043, "global_step": 353603, "epoch": 4260} {"train_loss": -26.256275177001953, "global_step": 353604, "epoch": 4260} {"train_loss": -26.30198097229004, "global_step": 353605, "epoch": 4260} {"train_loss": -25.826696395874023, "global_step": 353606, "epoch": 4260} {"train_loss": -26.107797622680664, "global_step": 353607, "epoch": 4260} {"train_loss": -26.072179794311523, "global_step": 353608, "epoch": 4260} {"train_loss": -26.564306259155273, "global_step": 353609, "epoch": 4260} {"train_loss": -26.018177032470703, "global_step": 353610, "epoch": 4260} {"train_loss": -26.530439376831055, "global_step": 353611, "epoch": 4260} {"train_loss": -26.014801025390625, "global_step": 353612, "epoch": 4260} {"train_loss": -26.357440948486328, "global_step": 353613, "epoch": 4260} {"train_loss": -26.40284538269043, "global_step": 353614, "epoch": 4260} {"train_loss": -26.6075439453125, "global_step": 353615, "epoch": 4260} {"train_loss": -26.471729278564453, "global_step": 353616, "epoch": 4260} {"train_loss": -26.51813316345215, "global_step": 353617, "epoch": 4260} {"train_loss": -26.003644943237305, "global_step": 353618, "epoch": 4260} {"train_loss": -26.106103897094727, "global_step": 353619, "epoch": 4260} {"train_loss": -26.07032585144043, "global_step": 353620, "epoch": 4260} {"train_loss": -26.193378448486328, "global_step": 353621, "epoch": 4260} {"train_loss": -26.193567276000977, "global_step": 353622, "epoch": 4260} {"train_loss": -26.394760131835938, "global_step": 353623, "epoch": 4260} {"train_loss": -26.26324462890625, "global_step": 353624, "epoch": 4260} {"train_loss": -26.46504020690918, "global_step": 353625, "epoch": 4260} {"train_loss": -26.20263671875, "global_step": 353626, "epoch": 4260} {"train_loss": -26.423383712768555, "global_step": 353627, "epoch": 4260} {"train_loss": -26.3786563873291, "global_step": 353628, "epoch": 4260} {"train_loss": -26.223651885986328, "global_step": 353629, "epoch": 4260} {"train_loss": -26.084732055664062, "global_step": 353630, "epoch": 4260} {"train_loss": -26.343048095703125, "global_step": 353631, "epoch": 4260} {"train_loss": -25.891172409057617, "global_step": 353632, "epoch": 4260} {"train_loss": -25.31484031677246, "global_step": 353633, "epoch": 4260} {"train_loss": -25.71320915222168, "global_step": 353634, "epoch": 4260} {"train_loss": -25.844013214111328, "global_step": 353635, "epoch": 4260} {"train_loss": -25.693344116210938, "global_step": 353636, "epoch": 4260} {"train_loss": -25.771167755126953, "global_step": 353637, "epoch": 4260} {"train_loss": -26.22015380859375, "global_step": 353638, "epoch": 4260} {"train_loss": -26.06861686706543, "global_step": 353639, "epoch": 4260} {"train_loss": -25.625629425048828, "global_step": 353640, "epoch": 4260} {"train_loss": -25.6904239654541, "global_step": 353641, "epoch": 4260} {"train_loss": -26.038549423217773, "global_step": 353642, "epoch": 4260} {"train_loss": -26.02918815612793, "global_step": 353643, "epoch": 4260} {"train_loss": -26.193201065063477, "global_step": 353644, "epoch": 4260} {"train_loss": -26.0809326171875, "global_step": 353645, "epoch": 4260} {"train_loss": -26.14218521118164, "global_step": 353646, "epoch": 4260} {"train_loss": -26.126737594604492, "global_step": 353647, "epoch": 4260} {"train_loss": -26.069244384765625, "global_step": 353648, "epoch": 4260} {"train_loss": -26.3309268951416, "global_step": 353649, "epoch": 4260} {"train_loss": -26.124347686767578, "global_step": 353650, "epoch": 4260} {"train_loss": -26.195953369140625, "global_step": 353651, "epoch": 4260} {"train_loss": -25.7529354095459, "global_step": 353652, "epoch": 4260} {"train_loss": -26.566431045532227, "global_step": 353653, "epoch": 4260} {"train_loss": -26.369794845581055, "global_step": 353654, "epoch": 4260} {"train_loss": -26.13058853149414, "global_step": 353655, "epoch": 4260} {"train_loss": -26.23368263244629, "global_step": 353656, "epoch": 4260} {"train_loss": -26.263113021850586, "global_step": 353657, "epoch": 4260} {"train_loss": -26.366056442260742, "global_step": 353658, "epoch": 4260} {"train_loss": -26.18824577331543, "global_step": 353659, "epoch": 4260} {"train_loss": -26.295888900756836, "global_step": 353660, "epoch": 4260} {"train_loss": -25.952381134033203, "global_step": 353661, "epoch": 4260} {"train_loss": -26.099618521081396, "global_step": 353662, "epoch": 4260, "val_loss": 6742003.0} {"train_loss": -25.39089012145996, "global_step": 353663, "epoch": 4261} {"train_loss": -25.331985473632812, "global_step": 353664, "epoch": 4261} {"train_loss": -26.22196388244629, "global_step": 353665, "epoch": 4261} {"train_loss": -25.731149673461914, "global_step": 353666, "epoch": 4261} {"train_loss": -25.55486488342285, "global_step": 353667, "epoch": 4261} {"train_loss": -26.016433715820312, "global_step": 353668, "epoch": 4261} {"train_loss": -25.763427734375, "global_step": 353669, "epoch": 4261} {"train_loss": -25.684040069580078, "global_step": 353670, "epoch": 4261} {"train_loss": -26.27811622619629, "global_step": 353671, "epoch": 4261} {"train_loss": -26.142160415649414, "global_step": 353672, "epoch": 4261} {"train_loss": -26.4249324798584, "global_step": 353673, "epoch": 4261} {"train_loss": -25.86358070373535, "global_step": 353674, "epoch": 4261} {"train_loss": -26.752431869506836, "global_step": 353675, "epoch": 4261} {"train_loss": -26.014204025268555, "global_step": 353676, "epoch": 4261} {"train_loss": -25.9185733795166, "global_step": 353677, "epoch": 4261} {"train_loss": -25.944921493530273, "global_step": 353678, "epoch": 4261} {"train_loss": -25.971302032470703, "global_step": 353679, "epoch": 4261} {"train_loss": -26.3436222076416, "global_step": 353680, "epoch": 4261} {"train_loss": -26.191009521484375, "global_step": 353681, "epoch": 4261} {"train_loss": -26.068714141845703, "global_step": 353682, "epoch": 4261} {"train_loss": -26.391590118408203, "global_step": 353683, "epoch": 4261} {"train_loss": -26.021011352539062, "global_step": 353684, "epoch": 4261} {"train_loss": -26.04559326171875, "global_step": 353685, "epoch": 4261} {"train_loss": -26.315946578979492, "global_step": 353686, "epoch": 4261} {"train_loss": -26.122854232788086, "global_step": 353687, "epoch": 4261} {"train_loss": -26.2819881439209, "global_step": 353688, "epoch": 4261} {"train_loss": -26.139081954956055, "global_step": 353689, "epoch": 4261} {"train_loss": -26.538793563842773, "global_step": 353690, "epoch": 4261} {"train_loss": -26.45210075378418, "global_step": 353691, "epoch": 4261} {"train_loss": -26.339908599853516, "global_step": 353692, "epoch": 4261} {"train_loss": -26.294788360595703, "global_step": 353693, "epoch": 4261} {"train_loss": -26.47770118713379, "global_step": 353694, "epoch": 4261} {"train_loss": -26.03644371032715, "global_step": 353695, "epoch": 4261} {"train_loss": -26.48239517211914, "global_step": 353696, "epoch": 4261} {"train_loss": -26.156219482421875, "global_step": 353697, "epoch": 4261} {"train_loss": -26.430957794189453, "global_step": 353698, "epoch": 4261} {"train_loss": -26.206754684448242, "global_step": 353699, "epoch": 4261} {"train_loss": -25.885498046875, "global_step": 353700, "epoch": 4261} {"train_loss": -26.545333862304688, "global_step": 353701, "epoch": 4261} {"train_loss": -26.266950607299805, "global_step": 353702, "epoch": 4261} {"train_loss": -26.072980880737305, "global_step": 353703, "epoch": 4261} {"train_loss": -26.314008712768555, "global_step": 353704, "epoch": 4261} {"train_loss": -26.195764541625977, "global_step": 353705, "epoch": 4261} {"train_loss": -26.07854652404785, "global_step": 353706, "epoch": 4261} {"train_loss": -25.83176040649414, "global_step": 353707, "epoch": 4261} {"train_loss": -26.0051326751709, "global_step": 353708, "epoch": 4261} {"train_loss": -26.23674964904785, "global_step": 353709, "epoch": 4261} {"train_loss": -26.496463775634766, "global_step": 353710, "epoch": 4261} {"train_loss": -26.36102867126465, "global_step": 353711, "epoch": 4261} {"train_loss": -26.538970947265625, "global_step": 353712, "epoch": 4261} {"train_loss": -26.5501766204834, "global_step": 353713, "epoch": 4261} {"train_loss": -26.641315460205078, "global_step": 353714, "epoch": 4261} {"train_loss": -26.16196060180664, "global_step": 353715, "epoch": 4261} {"train_loss": -26.434925079345703, "global_step": 353716, "epoch": 4261} {"train_loss": -26.229705810546875, "global_step": 353717, "epoch": 4261} {"train_loss": -26.17658805847168, "global_step": 353718, "epoch": 4261} {"train_loss": -26.295988082885742, "global_step": 353719, "epoch": 4261} {"train_loss": -26.3580379486084, "global_step": 353720, "epoch": 4261} {"train_loss": -26.120529174804688, "global_step": 353721, "epoch": 4261} {"train_loss": -26.248743057250977, "global_step": 353722, "epoch": 4261} {"train_loss": -26.39690589904785, "global_step": 353723, "epoch": 4261} {"train_loss": -26.41845703125, "global_step": 353724, "epoch": 4261} {"train_loss": -26.092557907104492, "global_step": 353725, "epoch": 4261} {"train_loss": -26.333093643188477, "global_step": 353726, "epoch": 4261} {"train_loss": -26.271665573120117, "global_step": 353727, "epoch": 4261} {"train_loss": -26.268356323242188, "global_step": 353728, "epoch": 4261} {"train_loss": -26.084320068359375, "global_step": 353729, "epoch": 4261} {"train_loss": -26.268232345581055, "global_step": 353730, "epoch": 4261} {"train_loss": -26.02947425842285, "global_step": 353731, "epoch": 4261} {"train_loss": -26.5635986328125, "global_step": 353732, "epoch": 4261} {"train_loss": -26.17816734313965, "global_step": 353733, "epoch": 4261} {"train_loss": -26.104877471923828, "global_step": 353734, "epoch": 4261} {"train_loss": -26.40692710876465, "global_step": 353735, "epoch": 4261} {"train_loss": -26.2965030670166, "global_step": 353736, "epoch": 4261} {"train_loss": -26.029281616210938, "global_step": 353737, "epoch": 4261} {"train_loss": -26.27408218383789, "global_step": 353738, "epoch": 4261} {"train_loss": -26.22173500061035, "global_step": 353739, "epoch": 4261} {"train_loss": -26.064889907836914, "global_step": 353740, "epoch": 4261} {"train_loss": -26.23089599609375, "global_step": 353741, "epoch": 4261} {"train_loss": -26.13556480407715, "global_step": 353742, "epoch": 4261} {"train_loss": -25.648788452148438, "global_step": 353743, "epoch": 4261} {"train_loss": -26.034351348876953, "global_step": 353744, "epoch": 4261} {"train_loss": -26.18706036763019, "global_step": 353745, "epoch": 4261, "val_loss": 6699002.0} {"train_loss": -24.891016006469727, "global_step": 353746, "epoch": 4262} {"train_loss": -24.691972732543945, "global_step": 353747, "epoch": 4262} {"train_loss": -25.24302101135254, "global_step": 353748, "epoch": 4262} {"train_loss": -25.26212501525879, "global_step": 353749, "epoch": 4262} {"train_loss": -25.587512969970703, "global_step": 353750, "epoch": 4262} {"train_loss": -25.548547744750977, "global_step": 353751, "epoch": 4262} {"train_loss": -25.645526885986328, "global_step": 353752, "epoch": 4262} {"train_loss": -25.44569969177246, "global_step": 353753, "epoch": 4262} {"train_loss": -25.65642738342285, "global_step": 353754, "epoch": 4262} {"train_loss": -25.638391494750977, "global_step": 353755, "epoch": 4262} {"train_loss": -25.636463165283203, "global_step": 353756, "epoch": 4262} {"train_loss": -25.72271728515625, "global_step": 353757, "epoch": 4262} {"train_loss": -25.600202560424805, "global_step": 353758, "epoch": 4262} {"train_loss": -25.786792755126953, "global_step": 353759, "epoch": 4262} {"train_loss": -25.747617721557617, "global_step": 353760, "epoch": 4262} {"train_loss": -25.8577880859375, "global_step": 353761, "epoch": 4262} {"train_loss": -25.544004440307617, "global_step": 353762, "epoch": 4262} {"train_loss": -25.64130973815918, "global_step": 353763, "epoch": 4262} {"train_loss": -25.9588623046875, "global_step": 353764, "epoch": 4262} {"train_loss": -25.960474014282227, "global_step": 353765, "epoch": 4262} {"train_loss": -25.89691734313965, "global_step": 353766, "epoch": 4262} {"train_loss": -25.853342056274414, "global_step": 353767, "epoch": 4262} {"train_loss": -25.802648544311523, "global_step": 353768, "epoch": 4262} {"train_loss": -25.959863662719727, "global_step": 353769, "epoch": 4262} {"train_loss": -26.49716567993164, "global_step": 353770, "epoch": 4262} {"train_loss": -26.273595809936523, "global_step": 353771, "epoch": 4262} {"train_loss": -26.061548233032227, "global_step": 353772, "epoch": 4262} {"train_loss": -26.162256240844727, "global_step": 353773, "epoch": 4262} {"train_loss": -26.067401885986328, "global_step": 353774, "epoch": 4262} {"train_loss": -26.225662231445312, "global_step": 353775, "epoch": 4262} {"train_loss": -26.030118942260742, "global_step": 353776, "epoch": 4262} {"train_loss": -25.945905685424805, "global_step": 353777, "epoch": 4262} {"train_loss": -26.10674476623535, "global_step": 353778, "epoch": 4262} {"train_loss": -26.313058853149414, "global_step": 353779, "epoch": 4262} {"train_loss": -26.024206161499023, "global_step": 353780, "epoch": 4262} {"train_loss": -26.021127700805664, "global_step": 353781, "epoch": 4262} {"train_loss": -26.068578720092773, "global_step": 353782, "epoch": 4262} {"train_loss": -26.064599990844727, "global_step": 353783, "epoch": 4262} {"train_loss": -26.347370147705078, "global_step": 353784, "epoch": 4262} {"train_loss": -26.342695236206055, "global_step": 353785, "epoch": 4262} {"train_loss": -26.34966468811035, "global_step": 353786, "epoch": 4262} {"train_loss": -26.004514694213867, "global_step": 353787, "epoch": 4262} {"train_loss": -26.284137725830078, "global_step": 353788, "epoch": 4262} {"train_loss": -26.394134521484375, "global_step": 353789, "epoch": 4262} {"train_loss": -26.36663246154785, "global_step": 353790, "epoch": 4262} {"train_loss": -26.328845977783203, "global_step": 353791, "epoch": 4262} {"train_loss": -26.269277572631836, "global_step": 353792, "epoch": 4262} {"train_loss": -26.55889320373535, "global_step": 353793, "epoch": 4262} {"train_loss": -26.100982666015625, "global_step": 353794, "epoch": 4262} {"train_loss": -26.1239013671875, "global_step": 353795, "epoch": 4262} {"train_loss": -26.6220645904541, "global_step": 353796, "epoch": 4262} {"train_loss": -26.079486846923828, "global_step": 353797, "epoch": 4262} {"train_loss": -26.511737823486328, "global_step": 353798, "epoch": 4262} {"train_loss": -26.286060333251953, "global_step": 353799, "epoch": 4262} {"train_loss": -26.634428024291992, "global_step": 353800, "epoch": 4262} {"train_loss": -26.397430419921875, "global_step": 353801, "epoch": 4262} {"train_loss": -26.487104415893555, "global_step": 353802, "epoch": 4262} {"train_loss": -26.426593780517578, "global_step": 353803, "epoch": 4262} {"train_loss": -26.345081329345703, "global_step": 353804, "epoch": 4262} {"train_loss": -26.19196128845215, "global_step": 353805, "epoch": 4262} {"train_loss": -25.802560806274414, "global_step": 353806, "epoch": 4262} {"train_loss": -26.188098907470703, "global_step": 353807, "epoch": 4262} {"train_loss": -26.181903839111328, "global_step": 353808, "epoch": 4262} {"train_loss": -26.46674156188965, "global_step": 353809, "epoch": 4262} {"train_loss": -25.521808624267578, "global_step": 353810, "epoch": 4262} {"train_loss": -25.535839080810547, "global_step": 353811, "epoch": 4262} {"train_loss": -25.4434814453125, "global_step": 353812, "epoch": 4262} {"train_loss": -25.54155921936035, "global_step": 353813, "epoch": 4262} {"train_loss": -25.463865280151367, "global_step": 353814, "epoch": 4262} {"train_loss": -25.72516441345215, "global_step": 353815, "epoch": 4262} {"train_loss": -25.99140739440918, "global_step": 353816, "epoch": 4262} {"train_loss": -26.062732696533203, "global_step": 353817, "epoch": 4262} {"train_loss": -25.392091751098633, "global_step": 353818, "epoch": 4262} {"train_loss": -25.845144271850586, "global_step": 353819, "epoch": 4262} {"train_loss": -25.69941520690918, "global_step": 353820, "epoch": 4262} {"train_loss": -25.69085121154785, "global_step": 353821, "epoch": 4262} {"train_loss": -25.87579917907715, "global_step": 353822, "epoch": 4262} {"train_loss": -25.947858810424805, "global_step": 353823, "epoch": 4262} {"train_loss": -26.225610733032227, "global_step": 353824, "epoch": 4262} {"train_loss": -25.509782791137695, "global_step": 353825, "epoch": 4262} {"train_loss": -26.47820472717285, "global_step": 353826, "epoch": 4262} {"train_loss": -26.133588790893555, "global_step": 353827, "epoch": 4262} {"train_loss": -25.950433616178582, "global_step": 353828, "epoch": 4262, "val_loss": 6694008.0} {"train_loss": -25.543960571289062, "global_step": 353829, "epoch": 4263} {"train_loss": -25.862516403198242, "global_step": 353830, "epoch": 4263} {"train_loss": -25.813425064086914, "global_step": 353831, "epoch": 4263} {"train_loss": -25.846853256225586, "global_step": 353832, "epoch": 4263} {"train_loss": -26.05877685546875, "global_step": 353833, "epoch": 4263} {"train_loss": -25.958642959594727, "global_step": 353834, "epoch": 4263} {"train_loss": -25.69492530822754, "global_step": 353835, "epoch": 4263} {"train_loss": -26.04266929626465, "global_step": 353836, "epoch": 4263} {"train_loss": -25.984704971313477, "global_step": 353837, "epoch": 4263} {"train_loss": -26.222156524658203, "global_step": 353838, "epoch": 4263} {"train_loss": -26.6384220123291, "global_step": 353839, "epoch": 4263} {"train_loss": -26.21539878845215, "global_step": 353840, "epoch": 4263} {"train_loss": -26.175495147705078, "global_step": 353841, "epoch": 4263} {"train_loss": -26.28631019592285, "global_step": 353842, "epoch": 4263} {"train_loss": -26.511280059814453, "global_step": 353843, "epoch": 4263} {"train_loss": -26.12015151977539, "global_step": 353844, "epoch": 4263} {"train_loss": -26.416898727416992, "global_step": 353845, "epoch": 4263} {"train_loss": -26.572101593017578, "global_step": 353846, "epoch": 4263} {"train_loss": -25.90478515625, "global_step": 353847, "epoch": 4263} {"train_loss": -26.311767578125, "global_step": 353848, "epoch": 4263} {"train_loss": -26.681934356689453, "global_step": 353849, "epoch": 4263} {"train_loss": -26.252487182617188, "global_step": 353850, "epoch": 4263} {"train_loss": -26.213897705078125, "global_step": 353851, "epoch": 4263} {"train_loss": -26.115018844604492, "global_step": 353852, "epoch": 4263} {"train_loss": -26.49737548828125, "global_step": 353853, "epoch": 4263} {"train_loss": -26.273252487182617, "global_step": 353854, "epoch": 4263} {"train_loss": -26.32240104675293, "global_step": 353855, "epoch": 4263} {"train_loss": -26.309864044189453, "global_step": 353856, "epoch": 4263} {"train_loss": -26.786848068237305, "global_step": 353857, "epoch": 4263} {"train_loss": -26.609373092651367, "global_step": 353858, "epoch": 4263} {"train_loss": -26.313262939453125, "global_step": 353859, "epoch": 4263} {"train_loss": -26.62967300415039, "global_step": 353860, "epoch": 4263} {"train_loss": -26.2122802734375, "global_step": 353861, "epoch": 4263} {"train_loss": -26.490453720092773, "global_step": 353862, "epoch": 4263} {"train_loss": -26.44496726989746, "global_step": 353863, "epoch": 4263} {"train_loss": -26.04877281188965, "global_step": 353864, "epoch": 4263} {"train_loss": -26.518396377563477, "global_step": 353865, "epoch": 4263} {"train_loss": -26.236753463745117, "global_step": 353866, "epoch": 4263} {"train_loss": -26.223617553710938, "global_step": 353867, "epoch": 4263} {"train_loss": -26.26938247680664, "global_step": 353868, "epoch": 4263} {"train_loss": -26.2416934967041, "global_step": 353869, "epoch": 4263} {"train_loss": -26.175764083862305, "global_step": 353870, "epoch": 4263} {"train_loss": -26.218921661376953, "global_step": 353871, "epoch": 4263} {"train_loss": -26.052820205688477, "global_step": 353872, "epoch": 4263} {"train_loss": -26.304718017578125, "global_step": 353873, "epoch": 4263} {"train_loss": -25.9853572845459, "global_step": 353874, "epoch": 4263} {"train_loss": -26.041400909423828, "global_step": 353875, "epoch": 4263} {"train_loss": -26.20050048828125, "global_step": 353876, "epoch": 4263} {"train_loss": -25.8858642578125, "global_step": 353877, "epoch": 4263} {"train_loss": -25.87042236328125, "global_step": 353878, "epoch": 4263} {"train_loss": -26.481359481811523, "global_step": 353879, "epoch": 4263} {"train_loss": -25.32230567932129, "global_step": 353880, "epoch": 4263} {"train_loss": -26.274829864501953, "global_step": 353881, "epoch": 4263} {"train_loss": -26.06867790222168, "global_step": 353882, "epoch": 4263} {"train_loss": -26.09834098815918, "global_step": 353883, "epoch": 4263} {"train_loss": -26.256494522094727, "global_step": 353884, "epoch": 4263} {"train_loss": -25.579998016357422, "global_step": 353885, "epoch": 4263} {"train_loss": -26.01546287536621, "global_step": 353886, "epoch": 4263} {"train_loss": -26.141605377197266, "global_step": 353887, "epoch": 4263} {"train_loss": -26.541996002197266, "global_step": 353888, "epoch": 4263} {"train_loss": -25.922510147094727, "global_step": 353889, "epoch": 4263} {"train_loss": -25.695938110351562, "global_step": 353890, "epoch": 4263} {"train_loss": -26.30230140686035, "global_step": 353891, "epoch": 4263} {"train_loss": -25.8447265625, "global_step": 353892, "epoch": 4263} {"train_loss": -26.128705978393555, "global_step": 353893, "epoch": 4263} {"train_loss": -26.369958877563477, "global_step": 353894, "epoch": 4263} {"train_loss": -26.171710968017578, "global_step": 353895, "epoch": 4263} {"train_loss": -26.389896392822266, "global_step": 353896, "epoch": 4263} {"train_loss": -26.065998077392578, "global_step": 353897, "epoch": 4263} {"train_loss": -26.20220375061035, "global_step": 353898, "epoch": 4263} {"train_loss": -26.09071922302246, "global_step": 353899, "epoch": 4263} {"train_loss": -26.545379638671875, "global_step": 353900, "epoch": 4263} {"train_loss": -26.887510299682617, "global_step": 353901, "epoch": 4263} {"train_loss": -26.348834991455078, "global_step": 353902, "epoch": 4263} {"train_loss": -26.88152503967285, "global_step": 353903, "epoch": 4263} {"train_loss": -26.5078067779541, "global_step": 353904, "epoch": 4263} {"train_loss": -26.051025390625, "global_step": 353905, "epoch": 4263} {"train_loss": -26.6142578125, "global_step": 353906, "epoch": 4263} {"train_loss": -26.332305908203125, "global_step": 353907, "epoch": 4263} {"train_loss": -26.30994987487793, "global_step": 353908, "epoch": 4263} {"train_loss": -26.294696807861328, "global_step": 353909, "epoch": 4263} {"train_loss": -26.141895294189453, "global_step": 353910, "epoch": 4263} {"train_loss": -26.21628595834755, "global_step": 353911, "epoch": 4263, "val_loss": 6770323.0} {"train_loss": -25.320167541503906, "global_step": 353912, "epoch": 4264} {"train_loss": -24.685636520385742, "global_step": 353913, "epoch": 4264} {"train_loss": -25.144315719604492, "global_step": 353914, "epoch": 4264} {"train_loss": -25.01093864440918, "global_step": 353915, "epoch": 4264} {"train_loss": -24.81800651550293, "global_step": 353916, "epoch": 4264} {"train_loss": -25.142925262451172, "global_step": 353917, "epoch": 4264} {"train_loss": -25.789472579956055, "global_step": 353918, "epoch": 4264} {"train_loss": -25.068334579467773, "global_step": 353919, "epoch": 4264} {"train_loss": -25.571044921875, "global_step": 353920, "epoch": 4264} {"train_loss": -25.416685104370117, "global_step": 353921, "epoch": 4264} {"train_loss": -25.753589630126953, "global_step": 353922, "epoch": 4264} {"train_loss": -25.8862361907959, "global_step": 353923, "epoch": 4264} {"train_loss": -25.6649112701416, "global_step": 353924, "epoch": 4264} {"train_loss": -25.489042282104492, "global_step": 353925, "epoch": 4264} {"train_loss": -25.45546531677246, "global_step": 353926, "epoch": 4264} {"train_loss": -26.04868507385254, "global_step": 353927, "epoch": 4264} {"train_loss": -25.734466552734375, "global_step": 353928, "epoch": 4264} {"train_loss": -25.394474029541016, "global_step": 353929, "epoch": 4264} {"train_loss": -26.01943016052246, "global_step": 353930, "epoch": 4264} {"train_loss": -25.44740867614746, "global_step": 353931, "epoch": 4264} {"train_loss": -26.097705841064453, "global_step": 353932, "epoch": 4264} {"train_loss": -25.825849533081055, "global_step": 353933, "epoch": 4264} {"train_loss": -26.05353355407715, "global_step": 353934, "epoch": 4264} {"train_loss": -25.856796264648438, "global_step": 353935, "epoch": 4264} {"train_loss": -25.670907974243164, "global_step": 353936, "epoch": 4264} {"train_loss": -26.069189071655273, "global_step": 353937, "epoch": 4264} {"train_loss": -25.722578048706055, "global_step": 353938, "epoch": 4264} {"train_loss": -26.00412368774414, "global_step": 353939, "epoch": 4264} {"train_loss": -25.816715240478516, "global_step": 353940, "epoch": 4264} {"train_loss": -25.60109519958496, "global_step": 353941, "epoch": 4264} {"train_loss": -26.427637100219727, "global_step": 353942, "epoch": 4264} {"train_loss": -26.214853286743164, "global_step": 353943, "epoch": 4264} {"train_loss": -26.062610626220703, "global_step": 353944, "epoch": 4264} {"train_loss": -26.21234130859375, "global_step": 353945, "epoch": 4264} {"train_loss": -26.12397575378418, "global_step": 353946, "epoch": 4264} {"train_loss": -25.873184204101562, "global_step": 353947, "epoch": 4264} {"train_loss": -25.9381046295166, "global_step": 353948, "epoch": 4264} {"train_loss": -26.19662857055664, "global_step": 353949, "epoch": 4264} {"train_loss": -25.891565322875977, "global_step": 353950, "epoch": 4264} {"train_loss": -26.02594566345215, "global_step": 353951, "epoch": 4264} {"train_loss": -26.004959106445312, "global_step": 353952, "epoch": 4264} {"train_loss": -26.653839111328125, "global_step": 353953, "epoch": 4264} {"train_loss": -26.086851119995117, "global_step": 353954, "epoch": 4264} {"train_loss": -26.581741333007812, "global_step": 353955, "epoch": 4264} {"train_loss": -26.387548446655273, "global_step": 353956, "epoch": 4264} {"train_loss": -26.12748146057129, "global_step": 353957, "epoch": 4264} {"train_loss": -25.925561904907227, "global_step": 353958, "epoch": 4264} {"train_loss": -26.02461814880371, "global_step": 353959, "epoch": 4264} {"train_loss": -26.324438095092773, "global_step": 353960, "epoch": 4264} {"train_loss": -26.110034942626953, "global_step": 353961, "epoch": 4264} {"train_loss": -26.155487060546875, "global_step": 353962, "epoch": 4264} {"train_loss": -25.987812042236328, "global_step": 353963, "epoch": 4264} {"train_loss": -26.64021873474121, "global_step": 353964, "epoch": 4264} {"train_loss": -26.398487091064453, "global_step": 353965, "epoch": 4264} {"train_loss": -26.305692672729492, "global_step": 353966, "epoch": 4264} {"train_loss": -26.33868980407715, "global_step": 353967, "epoch": 4264} {"train_loss": -25.8016414642334, "global_step": 353968, "epoch": 4264} {"train_loss": -26.474843978881836, "global_step": 353969, "epoch": 4264} {"train_loss": -25.874404907226562, "global_step": 353970, "epoch": 4264} {"train_loss": -26.350299835205078, "global_step": 353971, "epoch": 4264} {"train_loss": -26.165863037109375, "global_step": 353972, "epoch": 4264} {"train_loss": -26.53521728515625, "global_step": 353973, "epoch": 4264} {"train_loss": -26.32478141784668, "global_step": 353974, "epoch": 4264} {"train_loss": -26.4427547454834, "global_step": 353975, "epoch": 4264} {"train_loss": -26.34003257751465, "global_step": 353976, "epoch": 4264} {"train_loss": -26.641098022460938, "global_step": 353977, "epoch": 4264} {"train_loss": -26.357519149780273, "global_step": 353978, "epoch": 4264} {"train_loss": -26.119714736938477, "global_step": 353979, "epoch": 4264} {"train_loss": -26.555585861206055, "global_step": 353980, "epoch": 4264} {"train_loss": -25.790769577026367, "global_step": 353981, "epoch": 4264} {"train_loss": -25.946935653686523, "global_step": 353982, "epoch": 4264} {"train_loss": -25.596378326416016, "global_step": 353983, "epoch": 4264} {"train_loss": -26.108068466186523, "global_step": 353984, "epoch": 4264} {"train_loss": -25.9306583404541, "global_step": 353985, "epoch": 4264} {"train_loss": -26.137836456298828, "global_step": 353986, "epoch": 4264} {"train_loss": -26.370458602905273, "global_step": 353987, "epoch": 4264} {"train_loss": -26.29291343688965, "global_step": 353988, "epoch": 4264} {"train_loss": -26.042606353759766, "global_step": 353989, "epoch": 4264} {"train_loss": -26.303964614868164, "global_step": 353990, "epoch": 4264} {"train_loss": -26.464017868041992, "global_step": 353991, "epoch": 4264} {"train_loss": -26.30225944519043, "global_step": 353992, "epoch": 4264} {"train_loss": -26.513824462890625, "global_step": 353993, "epoch": 4264} {"train_loss": -25.981412336050745, "global_step": 353994, "epoch": 4264, "val_loss": 6717893.0} {"train_loss": -26.235204696655273, "global_step": 353995, "epoch": 4265} {"train_loss": -26.146209716796875, "global_step": 353996, "epoch": 4265} {"train_loss": -25.7025089263916, "global_step": 353997, "epoch": 4265} {"train_loss": -25.9025821685791, "global_step": 353998, "epoch": 4265} {"train_loss": -26.0665340423584, "global_step": 353999, "epoch": 4265} {"train_loss": -26.0908260345459, "global_step": 354000, "epoch": 4265} {"train_loss": -26.40852165222168, "global_step": 354001, "epoch": 4265} {"train_loss": -25.989459991455078, "global_step": 354002, "epoch": 4265} {"train_loss": -25.8844051361084, "global_step": 354003, "epoch": 4265} {"train_loss": -26.293432235717773, "global_step": 354004, "epoch": 4265} {"train_loss": -25.8616886138916, "global_step": 354005, "epoch": 4265} {"train_loss": -26.118244171142578, "global_step": 354006, "epoch": 4265} {"train_loss": -26.202463150024414, "global_step": 354007, "epoch": 4265} {"train_loss": -25.98349380493164, "global_step": 354008, "epoch": 4265} {"train_loss": -25.665369033813477, "global_step": 354009, "epoch": 4265} {"train_loss": -25.975448608398438, "global_step": 354010, "epoch": 4265} {"train_loss": -25.543861389160156, "global_step": 354011, "epoch": 4265} {"train_loss": -26.10407829284668, "global_step": 354012, "epoch": 4265} {"train_loss": -25.74567985534668, "global_step": 354013, "epoch": 4265} {"train_loss": -26.157184600830078, "global_step": 354014, "epoch": 4265} {"train_loss": -26.208810806274414, "global_step": 354015, "epoch": 4265} {"train_loss": -26.411977767944336, "global_step": 354016, "epoch": 4265} {"train_loss": -26.19455909729004, "global_step": 354017, "epoch": 4265} {"train_loss": -26.1121768951416, "global_step": 354018, "epoch": 4265} {"train_loss": -26.303503036499023, "global_step": 354019, "epoch": 4265} {"train_loss": -26.225757598876953, "global_step": 354020, "epoch": 4265} {"train_loss": -25.738447189331055, "global_step": 354021, "epoch": 4265} {"train_loss": -25.610675811767578, "global_step": 354022, "epoch": 4265} {"train_loss": -26.25893211364746, "global_step": 354023, "epoch": 4265} {"train_loss": -26.263769149780273, "global_step": 354024, "epoch": 4265} {"train_loss": -25.850341796875, "global_step": 354025, "epoch": 4265} {"train_loss": -25.82069969177246, "global_step": 354026, "epoch": 4265} {"train_loss": -26.100879669189453, "global_step": 354027, "epoch": 4265} {"train_loss": -26.278528213500977, "global_step": 354028, "epoch": 4265} {"train_loss": -25.808340072631836, "global_step": 354029, "epoch": 4265} {"train_loss": -26.114837646484375, "global_step": 354030, "epoch": 4265} {"train_loss": -26.29802894592285, "global_step": 354031, "epoch": 4265} {"train_loss": -26.245655059814453, "global_step": 354032, "epoch": 4265} {"train_loss": -26.26934814453125, "global_step": 354033, "epoch": 4265} {"train_loss": -26.16901206970215, "global_step": 354034, "epoch": 4265} {"train_loss": -25.9757080078125, "global_step": 354035, "epoch": 4265} {"train_loss": -25.97041130065918, "global_step": 354036, "epoch": 4265} {"train_loss": -26.3696231842041, "global_step": 354037, "epoch": 4265} {"train_loss": -26.3467960357666, "global_step": 354038, "epoch": 4265} {"train_loss": -26.592365264892578, "global_step": 354039, "epoch": 4265} {"train_loss": -26.0418643951416, "global_step": 354040, "epoch": 4265} {"train_loss": -26.569843292236328, "global_step": 354041, "epoch": 4265} {"train_loss": -26.366281509399414, "global_step": 354042, "epoch": 4265} {"train_loss": -25.679004669189453, "global_step": 354043, "epoch": 4265} {"train_loss": -26.054580688476562, "global_step": 354044, "epoch": 4265} {"train_loss": -26.029626846313477, "global_step": 354045, "epoch": 4265} {"train_loss": -26.11018943786621, "global_step": 354046, "epoch": 4265} {"train_loss": -25.944293975830078, "global_step": 354047, "epoch": 4265} {"train_loss": -26.281843185424805, "global_step": 354048, "epoch": 4265} {"train_loss": -26.42620277404785, "global_step": 354049, "epoch": 4265} {"train_loss": -26.050430297851562, "global_step": 354050, "epoch": 4265} {"train_loss": -25.89307975769043, "global_step": 354051, "epoch": 4265} {"train_loss": -25.983686447143555, "global_step": 354052, "epoch": 4265} {"train_loss": -25.925748825073242, "global_step": 354053, "epoch": 4265} {"train_loss": -26.2838134765625, "global_step": 354054, "epoch": 4265} {"train_loss": -26.443933486938477, "global_step": 354055, "epoch": 4265} {"train_loss": -26.370010375976562, "global_step": 354056, "epoch": 4265} {"train_loss": -26.224124908447266, "global_step": 354057, "epoch": 4265} {"train_loss": -26.437219619750977, "global_step": 354058, "epoch": 4265} {"train_loss": -26.11960792541504, "global_step": 354059, "epoch": 4265} {"train_loss": -26.318273544311523, "global_step": 354060, "epoch": 4265} {"train_loss": -26.2007999420166, "global_step": 354061, "epoch": 4265} {"train_loss": -26.102405548095703, "global_step": 354062, "epoch": 4265} {"train_loss": -26.182294845581055, "global_step": 354063, "epoch": 4265} {"train_loss": -26.3431339263916, "global_step": 354064, "epoch": 4265} {"train_loss": -26.40034294128418, "global_step": 354065, "epoch": 4265} {"train_loss": -26.780134201049805, "global_step": 354066, "epoch": 4265} {"train_loss": -26.592498779296875, "global_step": 354067, "epoch": 4265} {"train_loss": -26.423730850219727, "global_step": 354068, "epoch": 4265} {"train_loss": -26.135095596313477, "global_step": 354069, "epoch": 4265} {"train_loss": -25.803125381469727, "global_step": 354070, "epoch": 4265} {"train_loss": -26.541772842407227, "global_step": 354071, "epoch": 4265} {"train_loss": -26.069501876831055, "global_step": 354072, "epoch": 4265} {"train_loss": -26.158863067626953, "global_step": 354073, "epoch": 4265} {"train_loss": -26.36311149597168, "global_step": 354074, "epoch": 4265} {"train_loss": -26.564111709594727, "global_step": 354075, "epoch": 4265} {"train_loss": -26.319568634033203, "global_step": 354076, "epoch": 4265} {"train_loss": -26.146040100649177, "global_step": 354077, "epoch": 4265, "val_loss": 6657448.5} {"train_loss": -26.093984603881836, "global_step": 354078, "epoch": 4266} {"train_loss": -26.059274673461914, "global_step": 354079, "epoch": 4266} {"train_loss": -25.694091796875, "global_step": 354080, "epoch": 4266} {"train_loss": -26.106714248657227, "global_step": 354081, "epoch": 4266} {"train_loss": -26.0399112701416, "global_step": 354082, "epoch": 4266} {"train_loss": -25.99161720275879, "global_step": 354083, "epoch": 4266} {"train_loss": -26.001026153564453, "global_step": 354084, "epoch": 4266} {"train_loss": -26.085363388061523, "global_step": 354085, "epoch": 4266} {"train_loss": -26.091083526611328, "global_step": 354086, "epoch": 4266} {"train_loss": -26.18719482421875, "global_step": 354087, "epoch": 4266} {"train_loss": -25.82918357849121, "global_step": 354088, "epoch": 4266} {"train_loss": -25.891775131225586, "global_step": 354089, "epoch": 4266} {"train_loss": -25.85120964050293, "global_step": 354090, "epoch": 4266} {"train_loss": -25.840417861938477, "global_step": 354091, "epoch": 4266} {"train_loss": -26.334735870361328, "global_step": 354092, "epoch": 4266} {"train_loss": -26.193201065063477, "global_step": 354093, "epoch": 4266} {"train_loss": -26.214202880859375, "global_step": 354094, "epoch": 4266} {"train_loss": -26.53101921081543, "global_step": 354095, "epoch": 4266} {"train_loss": -26.582563400268555, "global_step": 354096, "epoch": 4266} {"train_loss": -25.977331161499023, "global_step": 354097, "epoch": 4266} {"train_loss": -26.018966674804688, "global_step": 354098, "epoch": 4266} {"train_loss": -26.28919792175293, "global_step": 354099, "epoch": 4266} {"train_loss": -25.72719383239746, "global_step": 354100, "epoch": 4266} {"train_loss": -26.284128189086914, "global_step": 354101, "epoch": 4266} {"train_loss": -26.06890296936035, "global_step": 354102, "epoch": 4266} {"train_loss": -26.124210357666016, "global_step": 354103, "epoch": 4266} {"train_loss": -25.9000244140625, "global_step": 354104, "epoch": 4266} {"train_loss": -25.86908531188965, "global_step": 354105, "epoch": 4266} {"train_loss": -26.134862899780273, "global_step": 354106, "epoch": 4266} {"train_loss": -26.226669311523438, "global_step": 354107, "epoch": 4266} {"train_loss": -26.189416885375977, "global_step": 354108, "epoch": 4266} {"train_loss": -26.178314208984375, "global_step": 354109, "epoch": 4266} {"train_loss": -25.8961124420166, "global_step": 354110, "epoch": 4266} {"train_loss": -25.966510772705078, "global_step": 354111, "epoch": 4266} {"train_loss": -26.166067123413086, "global_step": 354112, "epoch": 4266} {"train_loss": -26.072473526000977, "global_step": 354113, "epoch": 4266} {"train_loss": -26.283893585205078, "global_step": 354114, "epoch": 4266} {"train_loss": -25.59912872314453, "global_step": 354115, "epoch": 4266} {"train_loss": -25.829980850219727, "global_step": 354116, "epoch": 4266} {"train_loss": -26.11629295349121, "global_step": 354117, "epoch": 4266} {"train_loss": -26.01460075378418, "global_step": 354118, "epoch": 4266} {"train_loss": -25.768024444580078, "global_step": 354119, "epoch": 4266} {"train_loss": -25.778074264526367, "global_step": 354120, "epoch": 4266} {"train_loss": -26.15070152282715, "global_step": 354121, "epoch": 4266} {"train_loss": -26.244342803955078, "global_step": 354122, "epoch": 4266} {"train_loss": -26.089818954467773, "global_step": 354123, "epoch": 4266} {"train_loss": -26.08734130859375, "global_step": 354124, "epoch": 4266} {"train_loss": -25.742048263549805, "global_step": 354125, "epoch": 4266} {"train_loss": -26.19232749938965, "global_step": 354126, "epoch": 4266} {"train_loss": -25.938695907592773, "global_step": 354127, "epoch": 4266} {"train_loss": -26.25420570373535, "global_step": 354128, "epoch": 4266} {"train_loss": -26.306991577148438, "global_step": 354129, "epoch": 4266} {"train_loss": -26.119165420532227, "global_step": 354130, "epoch": 4266} {"train_loss": -26.207319259643555, "global_step": 354131, "epoch": 4266} {"train_loss": -26.115041732788086, "global_step": 354132, "epoch": 4266} {"train_loss": -25.954792022705078, "global_step": 354133, "epoch": 4266} {"train_loss": -25.971988677978516, "global_step": 354134, "epoch": 4266} {"train_loss": -26.492477416992188, "global_step": 354135, "epoch": 4266} {"train_loss": -26.48567771911621, "global_step": 354136, "epoch": 4266} {"train_loss": -26.413944244384766, "global_step": 354137, "epoch": 4266} {"train_loss": -26.2665958404541, "global_step": 354138, "epoch": 4266} {"train_loss": -26.484619140625, "global_step": 354139, "epoch": 4266} {"train_loss": -26.31129264831543, "global_step": 354140, "epoch": 4266} {"train_loss": -26.090539932250977, "global_step": 354141, "epoch": 4266} {"train_loss": -26.488874435424805, "global_step": 354142, "epoch": 4266} {"train_loss": -26.1142578125, "global_step": 354143, "epoch": 4266} {"train_loss": -26.386707305908203, "global_step": 354144, "epoch": 4266} {"train_loss": -26.299179077148438, "global_step": 354145, "epoch": 4266} {"train_loss": -26.041168212890625, "global_step": 354146, "epoch": 4266} {"train_loss": -26.137619018554688, "global_step": 354147, "epoch": 4266} {"train_loss": -26.09954833984375, "global_step": 354148, "epoch": 4266} {"train_loss": -26.066059112548828, "global_step": 354149, "epoch": 4266} {"train_loss": -26.2490291595459, "global_step": 354150, "epoch": 4266} {"train_loss": -26.158538818359375, "global_step": 354151, "epoch": 4266} {"train_loss": -26.523792266845703, "global_step": 354152, "epoch": 4266} {"train_loss": -25.864614486694336, "global_step": 354153, "epoch": 4266} {"train_loss": -26.361536026000977, "global_step": 354154, "epoch": 4266} {"train_loss": -26.169082641601562, "global_step": 354155, "epoch": 4266} {"train_loss": -26.20819091796875, "global_step": 354156, "epoch": 4266} {"train_loss": -26.0405216217041, "global_step": 354157, "epoch": 4266} {"train_loss": -25.713760375976562, "global_step": 354158, "epoch": 4266} {"train_loss": -26.542932510375977, "global_step": 354159, "epoch": 4266} {"train_loss": -26.112048114638732, "global_step": 354160, "epoch": 4266, "val_loss": 6723374.5} {"train_loss": -26.333332061767578, "global_step": 354161, "epoch": 4267} {"train_loss": -26.128828048706055, "global_step": 354162, "epoch": 4267} {"train_loss": -25.90606117248535, "global_step": 354163, "epoch": 4267} {"train_loss": -25.50484275817871, "global_step": 354164, "epoch": 4267} {"train_loss": -25.166240692138672, "global_step": 354165, "epoch": 4267} {"train_loss": -25.465585708618164, "global_step": 354166, "epoch": 4267} {"train_loss": -25.387252807617188, "global_step": 354167, "epoch": 4267} {"train_loss": -25.228540420532227, "global_step": 354168, "epoch": 4267} {"train_loss": -24.46601676940918, "global_step": 354169, "epoch": 4267} {"train_loss": -25.264244079589844, "global_step": 354170, "epoch": 4267} {"train_loss": -25.64106559753418, "global_step": 354171, "epoch": 4267} {"train_loss": -25.4039363861084, "global_step": 354172, "epoch": 4267} {"train_loss": -25.701984405517578, "global_step": 354173, "epoch": 4267} {"train_loss": -25.65445899963379, "global_step": 354174, "epoch": 4267} {"train_loss": -25.321149826049805, "global_step": 354175, "epoch": 4267} {"train_loss": -25.687091827392578, "global_step": 354176, "epoch": 4267} {"train_loss": -25.623779296875, "global_step": 354177, "epoch": 4267} {"train_loss": -25.784610748291016, "global_step": 354178, "epoch": 4267} {"train_loss": -25.902124404907227, "global_step": 354179, "epoch": 4267} {"train_loss": -25.550710678100586, "global_step": 354180, "epoch": 4267} {"train_loss": -25.856204986572266, "global_step": 354181, "epoch": 4267} {"train_loss": -25.8453369140625, "global_step": 354182, "epoch": 4267} {"train_loss": -25.938796997070312, "global_step": 354183, "epoch": 4267} {"train_loss": -25.83099365234375, "global_step": 354184, "epoch": 4267} {"train_loss": -25.71795082092285, "global_step": 354185, "epoch": 4267} {"train_loss": -26.029998779296875, "global_step": 354186, "epoch": 4267} {"train_loss": -25.90790367126465, "global_step": 354187, "epoch": 4267} {"train_loss": -25.839426040649414, "global_step": 354188, "epoch": 4267} {"train_loss": -26.18291664123535, "global_step": 354189, "epoch": 4267} {"train_loss": -26.20326042175293, "global_step": 354190, "epoch": 4267} {"train_loss": -25.91663932800293, "global_step": 354191, "epoch": 4267} {"train_loss": -26.03989601135254, "global_step": 354192, "epoch": 4267} {"train_loss": -26.1679630279541, "global_step": 354193, "epoch": 4267} {"train_loss": -25.868932723999023, "global_step": 354194, "epoch": 4267} {"train_loss": -26.128660202026367, "global_step": 354195, "epoch": 4267} {"train_loss": -25.991235733032227, "global_step": 354196, "epoch": 4267} {"train_loss": -26.06231117248535, "global_step": 354197, "epoch": 4267} {"train_loss": -25.800384521484375, "global_step": 354198, "epoch": 4267} {"train_loss": -26.107513427734375, "global_step": 354199, "epoch": 4267} {"train_loss": -26.06191062927246, "global_step": 354200, "epoch": 4267} {"train_loss": -26.373640060424805, "global_step": 354201, "epoch": 4267} {"train_loss": -26.38014793395996, "global_step": 354202, "epoch": 4267} {"train_loss": -26.342376708984375, "global_step": 354203, "epoch": 4267} {"train_loss": -26.211095809936523, "global_step": 354204, "epoch": 4267} {"train_loss": -26.245447158813477, "global_step": 354205, "epoch": 4267} {"train_loss": -25.89926528930664, "global_step": 354206, "epoch": 4267} {"train_loss": -25.802820205688477, "global_step": 354207, "epoch": 4267} {"train_loss": -26.293838500976562, "global_step": 354208, "epoch": 4267} {"train_loss": -26.312238693237305, "global_step": 354209, "epoch": 4267} {"train_loss": -26.06998634338379, "global_step": 354210, "epoch": 4267} {"train_loss": -25.961002349853516, "global_step": 354211, "epoch": 4267} {"train_loss": -26.202056884765625, "global_step": 354212, "epoch": 4267} {"train_loss": -26.521408081054688, "global_step": 354213, "epoch": 4267} {"train_loss": -26.44184684753418, "global_step": 354214, "epoch": 4267} {"train_loss": -26.26105308532715, "global_step": 354215, "epoch": 4267} {"train_loss": -26.218969345092773, "global_step": 354216, "epoch": 4267} {"train_loss": -26.3366756439209, "global_step": 354217, "epoch": 4267} {"train_loss": -26.427764892578125, "global_step": 354218, "epoch": 4267} {"train_loss": -26.4746150970459, "global_step": 354219, "epoch": 4267} {"train_loss": -26.19354820251465, "global_step": 354220, "epoch": 4267} {"train_loss": -26.2292423248291, "global_step": 354221, "epoch": 4267} {"train_loss": -26.36376953125, "global_step": 354222, "epoch": 4267} {"train_loss": -26.659652709960938, "global_step": 354223, "epoch": 4267} {"train_loss": -26.07278823852539, "global_step": 354224, "epoch": 4267} {"train_loss": -26.278553009033203, "global_step": 354225, "epoch": 4267} {"train_loss": -25.78204917907715, "global_step": 354226, "epoch": 4267} {"train_loss": -25.517377853393555, "global_step": 354227, "epoch": 4267} {"train_loss": -26.050220489501953, "global_step": 354228, "epoch": 4267} {"train_loss": -26.283496856689453, "global_step": 354229, "epoch": 4267} {"train_loss": -26.14291763305664, "global_step": 354230, "epoch": 4267} {"train_loss": -26.168134689331055, "global_step": 354231, "epoch": 4267} {"train_loss": -25.945005416870117, "global_step": 354232, "epoch": 4267} {"train_loss": -25.82379722595215, "global_step": 354233, "epoch": 4267} {"train_loss": -25.15093994140625, "global_step": 354234, "epoch": 4267} {"train_loss": -25.992313385009766, "global_step": 354235, "epoch": 4267} {"train_loss": -25.802167892456055, "global_step": 354236, "epoch": 4267} {"train_loss": -26.28712272644043, "global_step": 354237, "epoch": 4267} {"train_loss": -25.61628532409668, "global_step": 354238, "epoch": 4267} {"train_loss": -25.969348907470703, "global_step": 354239, "epoch": 4267} {"train_loss": -25.955778121948242, "global_step": 354240, "epoch": 4267} {"train_loss": -25.9068660736084, "global_step": 354241, "epoch": 4267} {"train_loss": -26.263532638549805, "global_step": 354242, "epoch": 4267} {"train_loss": -25.955647893698817, "global_step": 354243, "epoch": 4267, "val_loss": 6687918.0} {"train_loss": -25.184404373168945, "global_step": 354244, "epoch": 4268} {"train_loss": -25.31635093688965, "global_step": 354245, "epoch": 4268} {"train_loss": -25.424833297729492, "global_step": 354246, "epoch": 4268} {"train_loss": -25.9189510345459, "global_step": 354247, "epoch": 4268} {"train_loss": -25.491613388061523, "global_step": 354248, "epoch": 4268} {"train_loss": -25.772815704345703, "global_step": 354249, "epoch": 4268} {"train_loss": -25.8718318939209, "global_step": 354250, "epoch": 4268} {"train_loss": -25.53261947631836, "global_step": 354251, "epoch": 4268} {"train_loss": -25.59722900390625, "global_step": 354252, "epoch": 4268} {"train_loss": -25.81034278869629, "global_step": 354253, "epoch": 4268} {"train_loss": -25.467674255371094, "global_step": 354254, "epoch": 4268} {"train_loss": -26.077489852905273, "global_step": 354255, "epoch": 4268} {"train_loss": -25.84714126586914, "global_step": 354256, "epoch": 4268} {"train_loss": -26.313690185546875, "global_step": 354257, "epoch": 4268} {"train_loss": -26.057714462280273, "global_step": 354258, "epoch": 4268} {"train_loss": -26.292577743530273, "global_step": 354259, "epoch": 4268} {"train_loss": -26.038488388061523, "global_step": 354260, "epoch": 4268} {"train_loss": -25.7939453125, "global_step": 354261, "epoch": 4268} {"train_loss": -25.88833999633789, "global_step": 354262, "epoch": 4268} {"train_loss": -25.903799057006836, "global_step": 354263, "epoch": 4268} {"train_loss": -26.085895538330078, "global_step": 354264, "epoch": 4268} {"train_loss": -25.677627563476562, "global_step": 354265, "epoch": 4268} {"train_loss": -26.118549346923828, "global_step": 354266, "epoch": 4268} {"train_loss": -26.221567153930664, "global_step": 354267, "epoch": 4268} {"train_loss": -26.14740562438965, "global_step": 354268, "epoch": 4268} {"train_loss": -25.83086585998535, "global_step": 354269, "epoch": 4268} {"train_loss": -26.277738571166992, "global_step": 354270, "epoch": 4268} {"train_loss": -26.0885066986084, "global_step": 354271, "epoch": 4268} {"train_loss": -25.9937686920166, "global_step": 354272, "epoch": 4268} {"train_loss": -26.32480239868164, "global_step": 354273, "epoch": 4268} {"train_loss": -26.531835556030273, "global_step": 354274, "epoch": 4268} {"train_loss": -26.2205753326416, "global_step": 354275, "epoch": 4268} {"train_loss": -26.167577743530273, "global_step": 354276, "epoch": 4268} {"train_loss": -26.364721298217773, "global_step": 354277, "epoch": 4268} {"train_loss": -26.234058380126953, "global_step": 354278, "epoch": 4268} {"train_loss": -25.9202823638916, "global_step": 354279, "epoch": 4268} {"train_loss": -26.170995712280273, "global_step": 354280, "epoch": 4268} {"train_loss": -26.10968017578125, "global_step": 354281, "epoch": 4268} {"train_loss": -26.2314510345459, "global_step": 354282, "epoch": 4268} {"train_loss": -26.136707305908203, "global_step": 354283, "epoch": 4268} {"train_loss": -26.064847946166992, "global_step": 354284, "epoch": 4268} {"train_loss": -26.770544052124023, "global_step": 354285, "epoch": 4268} {"train_loss": -26.34488868713379, "global_step": 354286, "epoch": 4268} {"train_loss": -26.438831329345703, "global_step": 354287, "epoch": 4268} {"train_loss": -26.316516876220703, "global_step": 354288, "epoch": 4268} {"train_loss": -26.38686180114746, "global_step": 354289, "epoch": 4268} {"train_loss": -26.49906349182129, "global_step": 354290, "epoch": 4268} {"train_loss": -26.226898193359375, "global_step": 354291, "epoch": 4268} {"train_loss": -26.76690101623535, "global_step": 354292, "epoch": 4268} {"train_loss": -26.031814575195312, "global_step": 354293, "epoch": 4268} {"train_loss": -25.78473472595215, "global_step": 354294, "epoch": 4268} {"train_loss": -26.43655776977539, "global_step": 354295, "epoch": 4268} {"train_loss": -26.452550888061523, "global_step": 354296, "epoch": 4268} {"train_loss": -25.903491973876953, "global_step": 354297, "epoch": 4268} {"train_loss": -26.28388023376465, "global_step": 354298, "epoch": 4268} {"train_loss": -26.271320343017578, "global_step": 354299, "epoch": 4268} {"train_loss": -26.0977783203125, "global_step": 354300, "epoch": 4268} {"train_loss": -26.207351684570312, "global_step": 354301, "epoch": 4268} {"train_loss": -26.274616241455078, "global_step": 354302, "epoch": 4268} {"train_loss": -26.277359008789062, "global_step": 354303, "epoch": 4268} {"train_loss": -26.055566787719727, "global_step": 354304, "epoch": 4268} {"train_loss": -26.376230239868164, "global_step": 354305, "epoch": 4268} {"train_loss": -26.282302856445312, "global_step": 354306, "epoch": 4268} {"train_loss": -26.313257217407227, "global_step": 354307, "epoch": 4268} {"train_loss": -26.145557403564453, "global_step": 354308, "epoch": 4268} {"train_loss": -26.24761390686035, "global_step": 354309, "epoch": 4268} {"train_loss": -26.16294288635254, "global_step": 354310, "epoch": 4268} {"train_loss": -26.28037452697754, "global_step": 354311, "epoch": 4268} {"train_loss": -26.456369400024414, "global_step": 354312, "epoch": 4268} {"train_loss": -26.009668350219727, "global_step": 354313, "epoch": 4268} {"train_loss": -26.344282150268555, "global_step": 354314, "epoch": 4268} {"train_loss": -26.209354400634766, "global_step": 354315, "epoch": 4268} {"train_loss": -25.97553825378418, "global_step": 354316, "epoch": 4268} {"train_loss": -25.925586700439453, "global_step": 354317, "epoch": 4268} {"train_loss": -26.41053581237793, "global_step": 354318, "epoch": 4268} {"train_loss": -26.375579833984375, "global_step": 354319, "epoch": 4268} {"train_loss": -26.392181396484375, "global_step": 354320, "epoch": 4268} {"train_loss": -25.86594581604004, "global_step": 354321, "epoch": 4268} {"train_loss": -26.507980346679688, "global_step": 354322, "epoch": 4268} {"train_loss": -26.41570472717285, "global_step": 354323, "epoch": 4268} {"train_loss": -26.124771118164062, "global_step": 354324, "epoch": 4268} {"train_loss": -26.284122467041016, "global_step": 354325, "epoch": 4268} {"train_loss": -26.11250263811594, "global_step": 354326, "epoch": 4268, "val_loss": 6689806.0} {"train_loss": -25.465944290161133, "global_step": 354327, "epoch": 4269} {"train_loss": -25.42190170288086, "global_step": 354328, "epoch": 4269} {"train_loss": -25.514768600463867, "global_step": 354329, "epoch": 4269} {"train_loss": -25.90032386779785, "global_step": 354330, "epoch": 4269} {"train_loss": -25.7109432220459, "global_step": 354331, "epoch": 4269} {"train_loss": -25.65639305114746, "global_step": 354332, "epoch": 4269} {"train_loss": -26.1715030670166, "global_step": 354333, "epoch": 4269} {"train_loss": -25.186861038208008, "global_step": 354334, "epoch": 4269} {"train_loss": -25.970800399780273, "global_step": 354335, "epoch": 4269} {"train_loss": -25.78351402282715, "global_step": 354336, "epoch": 4269} {"train_loss": -25.825580596923828, "global_step": 354337, "epoch": 4269} {"train_loss": -25.534093856811523, "global_step": 354338, "epoch": 4269} {"train_loss": -25.908954620361328, "global_step": 354339, "epoch": 4269} {"train_loss": -25.888050079345703, "global_step": 354340, "epoch": 4269} {"train_loss": -26.23956298828125, "global_step": 354341, "epoch": 4269} {"train_loss": -25.89095115661621, "global_step": 354342, "epoch": 4269} {"train_loss": -25.990543365478516, "global_step": 354343, "epoch": 4269} {"train_loss": -25.791223526000977, "global_step": 354344, "epoch": 4269} {"train_loss": -26.088590621948242, "global_step": 354345, "epoch": 4269} {"train_loss": -26.049427032470703, "global_step": 354346, "epoch": 4269} {"train_loss": -26.2270450592041, "global_step": 354347, "epoch": 4269} {"train_loss": -26.425525665283203, "global_step": 354348, "epoch": 4269} {"train_loss": -25.82965660095215, "global_step": 354349, "epoch": 4269} {"train_loss": -26.539655685424805, "global_step": 354350, "epoch": 4269} {"train_loss": -26.033788681030273, "global_step": 354351, "epoch": 4269} {"train_loss": -25.88140869140625, "global_step": 354352, "epoch": 4269} {"train_loss": -25.997018814086914, "global_step": 354353, "epoch": 4269} {"train_loss": -26.099103927612305, "global_step": 354354, "epoch": 4269} {"train_loss": -26.220239639282227, "global_step": 354355, "epoch": 4269} {"train_loss": -26.247968673706055, "global_step": 354356, "epoch": 4269} {"train_loss": -26.312408447265625, "global_step": 354357, "epoch": 4269} {"train_loss": -26.236631393432617, "global_step": 354358, "epoch": 4269} {"train_loss": -26.467954635620117, "global_step": 354359, "epoch": 4269} {"train_loss": -26.345203399658203, "global_step": 354360, "epoch": 4269} {"train_loss": -26.235692977905273, "global_step": 354361, "epoch": 4269} {"train_loss": -26.171680450439453, "global_step": 354362, "epoch": 4269} {"train_loss": -26.683446884155273, "global_step": 354363, "epoch": 4269} {"train_loss": -26.1802921295166, "global_step": 354364, "epoch": 4269} {"train_loss": -26.06966209411621, "global_step": 354365, "epoch": 4269} {"train_loss": -26.4243221282959, "global_step": 354366, "epoch": 4269} {"train_loss": -26.314105987548828, "global_step": 354367, "epoch": 4269} {"train_loss": -26.302377700805664, "global_step": 354368, "epoch": 4269} {"train_loss": -26.51759147644043, "global_step": 354369, "epoch": 4269} {"train_loss": -26.595117568969727, "global_step": 354370, "epoch": 4269} {"train_loss": -26.266935348510742, "global_step": 354371, "epoch": 4269} {"train_loss": -26.187427520751953, "global_step": 354372, "epoch": 4269} {"train_loss": -25.487592697143555, "global_step": 354373, "epoch": 4269} {"train_loss": -25.03653335571289, "global_step": 354374, "epoch": 4269} {"train_loss": -23.863170623779297, "global_step": 354375, "epoch": 4269} {"train_loss": -25.763105392456055, "global_step": 354376, "epoch": 4269} {"train_loss": -26.27858543395996, "global_step": 354377, "epoch": 4269} {"train_loss": -25.2274169921875, "global_step": 354378, "epoch": 4269} {"train_loss": -26.516693115234375, "global_step": 354379, "epoch": 4269} {"train_loss": -25.85992431640625, "global_step": 354380, "epoch": 4269} {"train_loss": -25.858198165893555, "global_step": 354381, "epoch": 4269} {"train_loss": -25.58442497253418, "global_step": 354382, "epoch": 4269} {"train_loss": -25.888959884643555, "global_step": 354383, "epoch": 4269} {"train_loss": -26.305524826049805, "global_step": 354384, "epoch": 4269} {"train_loss": -25.845117568969727, "global_step": 354385, "epoch": 4269} {"train_loss": -25.78938102722168, "global_step": 354386, "epoch": 4269} {"train_loss": -26.031232833862305, "global_step": 354387, "epoch": 4269} {"train_loss": -25.836002349853516, "global_step": 354388, "epoch": 4269} {"train_loss": -25.572357177734375, "global_step": 354389, "epoch": 4269} {"train_loss": -25.923904418945312, "global_step": 354390, "epoch": 4269} {"train_loss": -25.530500411987305, "global_step": 354391, "epoch": 4269} {"train_loss": -26.164859771728516, "global_step": 354392, "epoch": 4269} {"train_loss": -26.206384658813477, "global_step": 354393, "epoch": 4269} {"train_loss": -26.208648681640625, "global_step": 354394, "epoch": 4269} {"train_loss": -26.00813865661621, "global_step": 354395, "epoch": 4269} {"train_loss": -25.997358322143555, "global_step": 354396, "epoch": 4269} {"train_loss": -26.138874053955078, "global_step": 354397, "epoch": 4269} {"train_loss": -26.233686447143555, "global_step": 354398, "epoch": 4269} {"train_loss": -26.737714767456055, "global_step": 354399, "epoch": 4269} {"train_loss": -25.948637008666992, "global_step": 354400, "epoch": 4269} {"train_loss": -26.0059871673584, "global_step": 354401, "epoch": 4269} {"train_loss": -25.697294235229492, "global_step": 354402, "epoch": 4269} {"train_loss": -26.141239166259766, "global_step": 354403, "epoch": 4269} {"train_loss": -26.51710319519043, "global_step": 354404, "epoch": 4269} {"train_loss": -26.214391708374023, "global_step": 354405, "epoch": 4269} {"train_loss": -26.329931259155273, "global_step": 354406, "epoch": 4269} {"train_loss": -26.247201919555664, "global_step": 354407, "epoch": 4269} {"train_loss": -26.072874069213867, "global_step": 354408, "epoch": 4269} {"train_loss": -25.992019032857502, "global_step": 354409, "epoch": 4269, "val_loss": 6693191.0} {"train_loss": -25.64276123046875, "global_step": 354410, "epoch": 4270} {"train_loss": -25.90876579284668, "global_step": 354411, "epoch": 4270} {"train_loss": -25.545133590698242, "global_step": 354412, "epoch": 4270} {"train_loss": -25.8206729888916, "global_step": 354413, "epoch": 4270} {"train_loss": -25.896345138549805, "global_step": 354414, "epoch": 4270} {"train_loss": -25.9115047454834, "global_step": 354415, "epoch": 4270} {"train_loss": -26.027551651000977, "global_step": 354416, "epoch": 4270} {"train_loss": -25.979413986206055, "global_step": 354417, "epoch": 4270} {"train_loss": -25.302751541137695, "global_step": 354418, "epoch": 4270} {"train_loss": -25.938766479492188, "global_step": 354419, "epoch": 4270} {"train_loss": -26.09775733947754, "global_step": 354420, "epoch": 4270} {"train_loss": -25.72147560119629, "global_step": 354421, "epoch": 4270} {"train_loss": -25.921201705932617, "global_step": 354422, "epoch": 4270} {"train_loss": -25.950971603393555, "global_step": 354423, "epoch": 4270} {"train_loss": -26.18821144104004, "global_step": 354424, "epoch": 4270} {"train_loss": -26.02430534362793, "global_step": 354425, "epoch": 4270} {"train_loss": -25.673181533813477, "global_step": 354426, "epoch": 4270} {"train_loss": -25.8571720123291, "global_step": 354427, "epoch": 4270} {"train_loss": -26.13104248046875, "global_step": 354428, "epoch": 4270} {"train_loss": -26.388525009155273, "global_step": 354429, "epoch": 4270} {"train_loss": -26.059803009033203, "global_step": 354430, "epoch": 4270} {"train_loss": -26.280271530151367, "global_step": 354431, "epoch": 4270} {"train_loss": -26.309940338134766, "global_step": 354432, "epoch": 4270} {"train_loss": -26.014570236206055, "global_step": 354433, "epoch": 4270} {"train_loss": -26.290063858032227, "global_step": 354434, "epoch": 4270} {"train_loss": -25.97881507873535, "global_step": 354435, "epoch": 4270} {"train_loss": -26.245275497436523, "global_step": 354436, "epoch": 4270} {"train_loss": -26.134565353393555, "global_step": 354437, "epoch": 4270} {"train_loss": -26.06267738342285, "global_step": 354438, "epoch": 4270} {"train_loss": -25.999540328979492, "global_step": 354439, "epoch": 4270} {"train_loss": -26.067493438720703, "global_step": 354440, "epoch": 4270} {"train_loss": -26.062448501586914, "global_step": 354441, "epoch": 4270} {"train_loss": -26.14436149597168, "global_step": 354442, "epoch": 4270} {"train_loss": -26.072534561157227, "global_step": 354443, "epoch": 4270} {"train_loss": -26.435277938842773, "global_step": 354444, "epoch": 4270} {"train_loss": -26.353322982788086, "global_step": 354445, "epoch": 4270} {"train_loss": -26.3033504486084, "global_step": 354446, "epoch": 4270} {"train_loss": -26.131650924682617, "global_step": 354447, "epoch": 4270} {"train_loss": -25.835485458374023, "global_step": 354448, "epoch": 4270} {"train_loss": -25.697723388671875, "global_step": 354449, "epoch": 4270} {"train_loss": -25.964557647705078, "global_step": 354450, "epoch": 4270} {"train_loss": -25.9088134765625, "global_step": 354451, "epoch": 4270} {"train_loss": -26.378461837768555, "global_step": 354452, "epoch": 4270} {"train_loss": -26.312559127807617, "global_step": 354453, "epoch": 4270} {"train_loss": -26.3128662109375, "global_step": 354454, "epoch": 4270} {"train_loss": -26.18657875061035, "global_step": 354455, "epoch": 4270} {"train_loss": -25.90937614440918, "global_step": 354456, "epoch": 4270} {"train_loss": -25.79631996154785, "global_step": 354457, "epoch": 4270} {"train_loss": -26.378454208374023, "global_step": 354458, "epoch": 4270} {"train_loss": -26.1629581451416, "global_step": 354459, "epoch": 4270} {"train_loss": -26.436141967773438, "global_step": 354460, "epoch": 4270} {"train_loss": -26.130033493041992, "global_step": 354461, "epoch": 4270} {"train_loss": -26.654279708862305, "global_step": 354462, "epoch": 4270} {"train_loss": -26.472564697265625, "global_step": 354463, "epoch": 4270} {"train_loss": -26.30807876586914, "global_step": 354464, "epoch": 4270} {"train_loss": -26.87058448791504, "global_step": 354465, "epoch": 4270} {"train_loss": -26.57378578186035, "global_step": 354466, "epoch": 4270} {"train_loss": -26.30731773376465, "global_step": 354467, "epoch": 4270} {"train_loss": -25.958532333374023, "global_step": 354468, "epoch": 4270} {"train_loss": -26.122976303100586, "global_step": 354469, "epoch": 4270} {"train_loss": -26.19662857055664, "global_step": 354470, "epoch": 4270} {"train_loss": -25.9832820892334, "global_step": 354471, "epoch": 4270} {"train_loss": -26.10812759399414, "global_step": 354472, "epoch": 4270} {"train_loss": -26.32600212097168, "global_step": 354473, "epoch": 4270} {"train_loss": -25.906787872314453, "global_step": 354474, "epoch": 4270} {"train_loss": -25.628803253173828, "global_step": 354475, "epoch": 4270} {"train_loss": -26.19669532775879, "global_step": 354476, "epoch": 4270} {"train_loss": -26.093225479125977, "global_step": 354477, "epoch": 4270} {"train_loss": -26.413394927978516, "global_step": 354478, "epoch": 4270} {"train_loss": -26.56028175354004, "global_step": 354479, "epoch": 4270} {"train_loss": -26.021350860595703, "global_step": 354480, "epoch": 4270} {"train_loss": -26.4597110748291, "global_step": 354481, "epoch": 4270} {"train_loss": -26.174543380737305, "global_step": 354482, "epoch": 4270} {"train_loss": -26.104650497436523, "global_step": 354483, "epoch": 4270} {"train_loss": -26.494779586791992, "global_step": 354484, "epoch": 4270} {"train_loss": -26.2823486328125, "global_step": 354485, "epoch": 4270} {"train_loss": -26.164594650268555, "global_step": 354486, "epoch": 4270} {"train_loss": -26.127466201782227, "global_step": 354487, "epoch": 4270} {"train_loss": -25.8436336517334, "global_step": 354488, "epoch": 4270} {"train_loss": -25.925519943237305, "global_step": 354489, "epoch": 4270} {"train_loss": -26.587421417236328, "global_step": 354490, "epoch": 4270} {"train_loss": -26.383527755737305, "global_step": 354491, "epoch": 4270} {"train_loss": -26.105799686477845, "global_step": 354492, "epoch": 4270, "val_loss": 6685266.0} {"train_loss": -25.548290252685547, "global_step": 354493, "epoch": 4271} {"train_loss": -25.632516860961914, "global_step": 354494, "epoch": 4271} {"train_loss": -25.7055606842041, "global_step": 354495, "epoch": 4271} {"train_loss": -25.673583984375, "global_step": 354496, "epoch": 4271} {"train_loss": -25.950284957885742, "global_step": 354497, "epoch": 4271} {"train_loss": -25.994054794311523, "global_step": 354498, "epoch": 4271} {"train_loss": -25.83868980407715, "global_step": 354499, "epoch": 4271} {"train_loss": -25.949634552001953, "global_step": 354500, "epoch": 4271} {"train_loss": -25.99951171875, "global_step": 354501, "epoch": 4271} {"train_loss": -25.719507217407227, "global_step": 354502, "epoch": 4271} {"train_loss": -25.950361251831055, "global_step": 354503, "epoch": 4271} {"train_loss": -25.88619041442871, "global_step": 354504, "epoch": 4271} {"train_loss": -26.0235595703125, "global_step": 354505, "epoch": 4271} {"train_loss": -25.833576202392578, "global_step": 354506, "epoch": 4271} {"train_loss": -25.73125648498535, "global_step": 354507, "epoch": 4271} {"train_loss": -25.99016761779785, "global_step": 354508, "epoch": 4271} {"train_loss": -26.10309410095215, "global_step": 354509, "epoch": 4271} {"train_loss": -26.21809196472168, "global_step": 354510, "epoch": 4271} {"train_loss": -26.093408584594727, "global_step": 354511, "epoch": 4271} {"train_loss": -26.462610244750977, "global_step": 354512, "epoch": 4271} {"train_loss": -26.072223663330078, "global_step": 354513, "epoch": 4271} {"train_loss": -26.19927978515625, "global_step": 354514, "epoch": 4271} {"train_loss": -26.000051498413086, "global_step": 354515, "epoch": 4271} {"train_loss": -26.513660430908203, "global_step": 354516, "epoch": 4271} {"train_loss": -26.359882354736328, "global_step": 354517, "epoch": 4271} {"train_loss": -26.213865280151367, "global_step": 354518, "epoch": 4271} {"train_loss": -26.307767868041992, "global_step": 354519, "epoch": 4271} {"train_loss": -26.414533615112305, "global_step": 354520, "epoch": 4271} {"train_loss": -26.347503662109375, "global_step": 354521, "epoch": 4271} {"train_loss": -26.54363441467285, "global_step": 354522, "epoch": 4271} {"train_loss": -26.298425674438477, "global_step": 354523, "epoch": 4271} {"train_loss": -26.236328125, "global_step": 354524, "epoch": 4271} {"train_loss": -26.23103141784668, "global_step": 354525, "epoch": 4271} {"train_loss": -26.331090927124023, "global_step": 354526, "epoch": 4271} {"train_loss": -26.257287979125977, "global_step": 354527, "epoch": 4271} {"train_loss": -26.597431182861328, "global_step": 354528, "epoch": 4271} {"train_loss": -26.450214385986328, "global_step": 354529, "epoch": 4271} {"train_loss": -26.1433048248291, "global_step": 354530, "epoch": 4271} {"train_loss": -26.83491325378418, "global_step": 354531, "epoch": 4271} {"train_loss": -26.391590118408203, "global_step": 354532, "epoch": 4271} {"train_loss": -26.727985382080078, "global_step": 354533, "epoch": 4271} {"train_loss": -26.643224716186523, "global_step": 354534, "epoch": 4271} {"train_loss": -26.1697998046875, "global_step": 354535, "epoch": 4271} {"train_loss": -26.46787452697754, "global_step": 354536, "epoch": 4271} {"train_loss": -26.415302276611328, "global_step": 354537, "epoch": 4271} {"train_loss": -26.251840591430664, "global_step": 354538, "epoch": 4271} {"train_loss": -26.782575607299805, "global_step": 354539, "epoch": 4271} {"train_loss": -26.53192710876465, "global_step": 354540, "epoch": 4271} {"train_loss": -26.62763023376465, "global_step": 354541, "epoch": 4271} {"train_loss": -26.428098678588867, "global_step": 354542, "epoch": 4271} {"train_loss": -26.282209396362305, "global_step": 354543, "epoch": 4271} {"train_loss": -26.4172420501709, "global_step": 354544, "epoch": 4271} {"train_loss": -26.075759887695312, "global_step": 354545, "epoch": 4271} {"train_loss": -25.88240623474121, "global_step": 354546, "epoch": 4271} {"train_loss": -25.99857521057129, "global_step": 354547, "epoch": 4271} {"train_loss": -26.356775283813477, "global_step": 354548, "epoch": 4271} {"train_loss": -26.1298885345459, "global_step": 354549, "epoch": 4271} {"train_loss": -26.29410171508789, "global_step": 354550, "epoch": 4271} {"train_loss": -25.3710994720459, "global_step": 354551, "epoch": 4271} {"train_loss": -25.59844398498535, "global_step": 354552, "epoch": 4271} {"train_loss": -24.929889678955078, "global_step": 354553, "epoch": 4271} {"train_loss": -25.559141159057617, "global_step": 354554, "epoch": 4271} {"train_loss": -25.927108764648438, "global_step": 354555, "epoch": 4271} {"train_loss": -25.7821044921875, "global_step": 354556, "epoch": 4271} {"train_loss": -26.47480583190918, "global_step": 354557, "epoch": 4271} {"train_loss": -26.422590255737305, "global_step": 354558, "epoch": 4271} {"train_loss": -25.955121994018555, "global_step": 354559, "epoch": 4271} {"train_loss": -26.017852783203125, "global_step": 354560, "epoch": 4271} {"train_loss": -26.271093368530273, "global_step": 354561, "epoch": 4271} {"train_loss": -25.7901611328125, "global_step": 354562, "epoch": 4271} {"train_loss": -26.126220703125, "global_step": 354563, "epoch": 4271} {"train_loss": -26.391407012939453, "global_step": 354564, "epoch": 4271} {"train_loss": -26.264968872070312, "global_step": 354565, "epoch": 4271} {"train_loss": -25.81591796875, "global_step": 354566, "epoch": 4271} {"train_loss": -26.24387550354004, "global_step": 354567, "epoch": 4271} {"train_loss": -26.266128540039062, "global_step": 354568, "epoch": 4271} {"train_loss": -26.145849227905273, "global_step": 354569, "epoch": 4271} {"train_loss": -26.247791290283203, "global_step": 354570, "epoch": 4271} {"train_loss": -26.055097579956055, "global_step": 354571, "epoch": 4271} {"train_loss": -26.257436752319336, "global_step": 354572, "epoch": 4271} {"train_loss": -26.2056884765625, "global_step": 354573, "epoch": 4271} {"train_loss": -26.318801879882812, "global_step": 354574, "epoch": 4271} {"train_loss": -26.15655575028385, "global_step": 354575, "epoch": 4271, "val_loss": 6589114.0} {"train_loss": -25.898508071899414, "global_step": 354576, "epoch": 4272} {"train_loss": -26.032678604125977, "global_step": 354577, "epoch": 4272} {"train_loss": -26.008716583251953, "global_step": 354578, "epoch": 4272} {"train_loss": -25.939599990844727, "global_step": 354579, "epoch": 4272} {"train_loss": -25.74444580078125, "global_step": 354580, "epoch": 4272} {"train_loss": -26.007598876953125, "global_step": 354581, "epoch": 4272} {"train_loss": -26.08907127380371, "global_step": 354582, "epoch": 4272} {"train_loss": -25.896240234375, "global_step": 354583, "epoch": 4272} {"train_loss": -26.236785888671875, "global_step": 354584, "epoch": 4272} {"train_loss": -26.0024471282959, "global_step": 354585, "epoch": 4272} {"train_loss": -26.143903732299805, "global_step": 354586, "epoch": 4272} {"train_loss": -25.92340660095215, "global_step": 354587, "epoch": 4272} {"train_loss": -26.264923095703125, "global_step": 354588, "epoch": 4272} {"train_loss": -26.049335479736328, "global_step": 354589, "epoch": 4272} {"train_loss": -26.062408447265625, "global_step": 354590, "epoch": 4272} {"train_loss": -25.56705093383789, "global_step": 354591, "epoch": 4272} {"train_loss": -26.311920166015625, "global_step": 354592, "epoch": 4272} {"train_loss": -26.32254409790039, "global_step": 354593, "epoch": 4272} {"train_loss": -25.69070816040039, "global_step": 354594, "epoch": 4272} {"train_loss": -26.1522216796875, "global_step": 354595, "epoch": 4272} {"train_loss": -26.298688888549805, "global_step": 354596, "epoch": 4272} {"train_loss": -25.919967651367188, "global_step": 354597, "epoch": 4272} {"train_loss": -25.973859786987305, "global_step": 354598, "epoch": 4272} {"train_loss": -26.18867301940918, "global_step": 354599, "epoch": 4272} {"train_loss": -26.467426300048828, "global_step": 354600, "epoch": 4272} {"train_loss": -25.7381591796875, "global_step": 354601, "epoch": 4272} {"train_loss": -26.06107521057129, "global_step": 354602, "epoch": 4272} {"train_loss": -26.35699462890625, "global_step": 354603, "epoch": 4272} {"train_loss": -26.52729606628418, "global_step": 354604, "epoch": 4272} {"train_loss": -26.09303092956543, "global_step": 354605, "epoch": 4272} {"train_loss": -26.351276397705078, "global_step": 354606, "epoch": 4272} {"train_loss": -26.570783615112305, "global_step": 354607, "epoch": 4272} {"train_loss": -26.29836082458496, "global_step": 354608, "epoch": 4272} {"train_loss": -26.539670944213867, "global_step": 354609, "epoch": 4272} {"train_loss": -26.08622169494629, "global_step": 354610, "epoch": 4272} {"train_loss": -26.375747680664062, "global_step": 354611, "epoch": 4272} {"train_loss": -25.9002742767334, "global_step": 354612, "epoch": 4272} {"train_loss": -26.296316146850586, "global_step": 354613, "epoch": 4272} {"train_loss": -25.686450958251953, "global_step": 354614, "epoch": 4272} {"train_loss": -25.97991943359375, "global_step": 354615, "epoch": 4272} {"train_loss": -26.1950740814209, "global_step": 354616, "epoch": 4272} {"train_loss": -26.43501091003418, "global_step": 354617, "epoch": 4272} {"train_loss": -26.118688583374023, "global_step": 354618, "epoch": 4272} {"train_loss": -26.051435470581055, "global_step": 354619, "epoch": 4272} {"train_loss": -26.262693405151367, "global_step": 354620, "epoch": 4272} {"train_loss": -26.14312171936035, "global_step": 354621, "epoch": 4272} {"train_loss": -26.201993942260742, "global_step": 354622, "epoch": 4272} {"train_loss": -26.386266708374023, "global_step": 354623, "epoch": 4272} {"train_loss": -25.850889205932617, "global_step": 354624, "epoch": 4272} {"train_loss": -26.3229923248291, "global_step": 354625, "epoch": 4272} {"train_loss": -26.331958770751953, "global_step": 354626, "epoch": 4272} {"train_loss": -26.44935417175293, "global_step": 354627, "epoch": 4272} {"train_loss": -25.9178409576416, "global_step": 354628, "epoch": 4272} {"train_loss": -26.43303871154785, "global_step": 354629, "epoch": 4272} {"train_loss": -25.98093605041504, "global_step": 354630, "epoch": 4272} {"train_loss": -26.249561309814453, "global_step": 354631, "epoch": 4272} {"train_loss": -26.58774757385254, "global_step": 354632, "epoch": 4272} {"train_loss": -26.4360294342041, "global_step": 354633, "epoch": 4272} {"train_loss": -25.977924346923828, "global_step": 354634, "epoch": 4272} {"train_loss": -26.071985244750977, "global_step": 354635, "epoch": 4272} {"train_loss": -25.971643447875977, "global_step": 354636, "epoch": 4272} {"train_loss": -26.26692008972168, "global_step": 354637, "epoch": 4272} {"train_loss": -26.21284294128418, "global_step": 354638, "epoch": 4272} {"train_loss": -26.274930953979492, "global_step": 354639, "epoch": 4272} {"train_loss": -26.019025802612305, "global_step": 354640, "epoch": 4272} {"train_loss": -26.57599449157715, "global_step": 354641, "epoch": 4272} {"train_loss": -26.38738441467285, "global_step": 354642, "epoch": 4272} {"train_loss": -26.463918685913086, "global_step": 354643, "epoch": 4272} {"train_loss": -26.314538955688477, "global_step": 354644, "epoch": 4272} {"train_loss": -26.340606689453125, "global_step": 354645, "epoch": 4272} {"train_loss": -26.45204734802246, "global_step": 354646, "epoch": 4272} {"train_loss": -25.84346580505371, "global_step": 354647, "epoch": 4272} {"train_loss": -26.07020378112793, "global_step": 354648, "epoch": 4272} {"train_loss": -25.961841583251953, "global_step": 354649, "epoch": 4272} {"train_loss": -26.31483268737793, "global_step": 354650, "epoch": 4272} {"train_loss": -25.67852783203125, "global_step": 354651, "epoch": 4272} {"train_loss": -24.919448852539062, "global_step": 354652, "epoch": 4272} {"train_loss": -25.80552101135254, "global_step": 354653, "epoch": 4272} {"train_loss": -26.084985733032227, "global_step": 354654, "epoch": 4272} {"train_loss": -25.93826675415039, "global_step": 354655, "epoch": 4272} {"train_loss": -26.095678329467773, "global_step": 354656, "epoch": 4272} {"train_loss": -25.959455490112305, "global_step": 354657, "epoch": 4272} {"train_loss": -26.130378332482763, "global_step": 354658, "epoch": 4272, "val_loss": 6640614.0} {"train_loss": -25.604135513305664, "global_step": 354659, "epoch": 4273} {"train_loss": -26.090057373046875, "global_step": 354660, "epoch": 4273} {"train_loss": -26.154821395874023, "global_step": 354661, "epoch": 4273} {"train_loss": -25.508895874023438, "global_step": 354662, "epoch": 4273} {"train_loss": -25.382192611694336, "global_step": 354663, "epoch": 4273} {"train_loss": -25.410898208618164, "global_step": 354664, "epoch": 4273} {"train_loss": -25.349040985107422, "global_step": 354665, "epoch": 4273} {"train_loss": -25.436079025268555, "global_step": 354666, "epoch": 4273} {"train_loss": -25.195188522338867, "global_step": 354667, "epoch": 4273} {"train_loss": -25.110742568969727, "global_step": 354668, "epoch": 4273} {"train_loss": -25.50027847290039, "global_step": 354669, "epoch": 4273} {"train_loss": -25.474706649780273, "global_step": 354670, "epoch": 4273} {"train_loss": -26.043567657470703, "global_step": 354671, "epoch": 4273} {"train_loss": -25.72450828552246, "global_step": 354672, "epoch": 4273} {"train_loss": -26.06015968322754, "global_step": 354673, "epoch": 4273} {"train_loss": -25.580259323120117, "global_step": 354674, "epoch": 4273} {"train_loss": -25.30073356628418, "global_step": 354675, "epoch": 4273} {"train_loss": -25.77071189880371, "global_step": 354676, "epoch": 4273} {"train_loss": -25.714874267578125, "global_step": 354677, "epoch": 4273} {"train_loss": -26.01997947692871, "global_step": 354678, "epoch": 4273} {"train_loss": -25.6910343170166, "global_step": 354679, "epoch": 4273} {"train_loss": -25.775344848632812, "global_step": 354680, "epoch": 4273} {"train_loss": -25.870264053344727, "global_step": 354681, "epoch": 4273} {"train_loss": -25.9250545501709, "global_step": 354682, "epoch": 4273} {"train_loss": -26.21185874938965, "global_step": 354683, "epoch": 4273} {"train_loss": -25.6988582611084, "global_step": 354684, "epoch": 4273} {"train_loss": -26.167469024658203, "global_step": 354685, "epoch": 4273} {"train_loss": -25.99293327331543, "global_step": 354686, "epoch": 4273} {"train_loss": -25.6031436920166, "global_step": 354687, "epoch": 4273} {"train_loss": -26.110477447509766, "global_step": 354688, "epoch": 4273} {"train_loss": -25.916364669799805, "global_step": 354689, "epoch": 4273} {"train_loss": -25.788183212280273, "global_step": 354690, "epoch": 4273} {"train_loss": -26.1424503326416, "global_step": 354691, "epoch": 4273} {"train_loss": -26.17341423034668, "global_step": 354692, "epoch": 4273} {"train_loss": -26.498010635375977, "global_step": 354693, "epoch": 4273} {"train_loss": -26.415029525756836, "global_step": 354694, "epoch": 4273} {"train_loss": -26.044355392456055, "global_step": 354695, "epoch": 4273} {"train_loss": -26.4152889251709, "global_step": 354696, "epoch": 4273} {"train_loss": -26.35419273376465, "global_step": 354697, "epoch": 4273} {"train_loss": -26.00665283203125, "global_step": 354698, "epoch": 4273} {"train_loss": -26.288116455078125, "global_step": 354699, "epoch": 4273} {"train_loss": -26.622995376586914, "global_step": 354700, "epoch": 4273} {"train_loss": -26.273544311523438, "global_step": 354701, "epoch": 4273} {"train_loss": -26.486738204956055, "global_step": 354702, "epoch": 4273} {"train_loss": -26.450836181640625, "global_step": 354703, "epoch": 4273} {"train_loss": -26.608936309814453, "global_step": 354704, "epoch": 4273} {"train_loss": -26.32429313659668, "global_step": 354705, "epoch": 4273} {"train_loss": -26.179166793823242, "global_step": 354706, "epoch": 4273} {"train_loss": -26.212072372436523, "global_step": 354707, "epoch": 4273} {"train_loss": -25.696582794189453, "global_step": 354708, "epoch": 4273} {"train_loss": -26.02168846130371, "global_step": 354709, "epoch": 4273} {"train_loss": -26.67690086364746, "global_step": 354710, "epoch": 4273} {"train_loss": -26.173114776611328, "global_step": 354711, "epoch": 4273} {"train_loss": -26.17426872253418, "global_step": 354712, "epoch": 4273} {"train_loss": -26.195093154907227, "global_step": 354713, "epoch": 4273} {"train_loss": -26.678653717041016, "global_step": 354714, "epoch": 4273} {"train_loss": -26.242795944213867, "global_step": 354715, "epoch": 4273} {"train_loss": -26.652891159057617, "global_step": 354716, "epoch": 4273} {"train_loss": -26.488773345947266, "global_step": 354717, "epoch": 4273} {"train_loss": -26.580957412719727, "global_step": 354718, "epoch": 4273} {"train_loss": -26.2180118560791, "global_step": 354719, "epoch": 4273} {"train_loss": -26.279590606689453, "global_step": 354720, "epoch": 4273} {"train_loss": -26.1435489654541, "global_step": 354721, "epoch": 4273} {"train_loss": -26.11531639099121, "global_step": 354722, "epoch": 4273} {"train_loss": -26.278539657592773, "global_step": 354723, "epoch": 4273} {"train_loss": -26.2949161529541, "global_step": 354724, "epoch": 4273} {"train_loss": -26.134668350219727, "global_step": 354725, "epoch": 4273} {"train_loss": -25.79218864440918, "global_step": 354726, "epoch": 4273} {"train_loss": -26.1474666595459, "global_step": 354727, "epoch": 4273} {"train_loss": -26.286874771118164, "global_step": 354728, "epoch": 4273} {"train_loss": -26.253799438476562, "global_step": 354729, "epoch": 4273} {"train_loss": -26.06788444519043, "global_step": 354730, "epoch": 4273} {"train_loss": -25.99491310119629, "global_step": 354731, "epoch": 4273} {"train_loss": -26.369495391845703, "global_step": 354732, "epoch": 4273} {"train_loss": -26.130659103393555, "global_step": 354733, "epoch": 4273} {"train_loss": -26.200963973999023, "global_step": 354734, "epoch": 4273} {"train_loss": -26.173730850219727, "global_step": 354735, "epoch": 4273} {"train_loss": -26.313873291015625, "global_step": 354736, "epoch": 4273} {"train_loss": -25.833608627319336, "global_step": 354737, "epoch": 4273} {"train_loss": -26.644346237182617, "global_step": 354738, "epoch": 4273} {"train_loss": -26.310016632080078, "global_step": 354739, "epoch": 4273} {"train_loss": -26.12310791015625, "global_step": 354740, "epoch": 4273} {"train_loss": -26.044879384787684, "global_step": 354741, "epoch": 4273, "val_loss": 6697248.0} {"train_loss": -24.257251739501953, "global_step": 354742, "epoch": 4274} {"train_loss": -24.155780792236328, "global_step": 354743, "epoch": 4274} {"train_loss": -23.580198287963867, "global_step": 354744, "epoch": 4274} {"train_loss": -23.4466495513916, "global_step": 354745, "epoch": 4274} {"train_loss": -23.888776779174805, "global_step": 354746, "epoch": 4274} {"train_loss": -24.517778396606445, "global_step": 354747, "epoch": 4274} {"train_loss": -24.045480728149414, "global_step": 354748, "epoch": 4274} {"train_loss": -25.14372444152832, "global_step": 354749, "epoch": 4274} {"train_loss": -24.993223190307617, "global_step": 354750, "epoch": 4274} {"train_loss": -25.217756271362305, "global_step": 354751, "epoch": 4274} {"train_loss": -24.890783309936523, "global_step": 354752, "epoch": 4274} {"train_loss": -25.324609756469727, "global_step": 354753, "epoch": 4274} {"train_loss": -25.33112144470215, "global_step": 354754, "epoch": 4274} {"train_loss": -25.232297897338867, "global_step": 354755, "epoch": 4274} {"train_loss": -25.667530059814453, "global_step": 354756, "epoch": 4274} {"train_loss": -25.669721603393555, "global_step": 354757, "epoch": 4274} {"train_loss": -25.352176666259766, "global_step": 354758, "epoch": 4274} {"train_loss": -25.619916915893555, "global_step": 354759, "epoch": 4274} {"train_loss": -25.33936882019043, "global_step": 354760, "epoch": 4274} {"train_loss": -25.727148056030273, "global_step": 354761, "epoch": 4274} {"train_loss": -25.704797744750977, "global_step": 354762, "epoch": 4274} {"train_loss": -25.505693435668945, "global_step": 354763, "epoch": 4274} {"train_loss": -25.677947998046875, "global_step": 354764, "epoch": 4274} {"train_loss": -25.85477066040039, "global_step": 354765, "epoch": 4274} {"train_loss": -25.529245376586914, "global_step": 354766, "epoch": 4274} {"train_loss": -25.52861976623535, "global_step": 354767, "epoch": 4274} {"train_loss": -25.807050704956055, "global_step": 354768, "epoch": 4274} {"train_loss": -26.085468292236328, "global_step": 354769, "epoch": 4274} {"train_loss": -25.748554229736328, "global_step": 354770, "epoch": 4274} {"train_loss": -26.12910270690918, "global_step": 354771, "epoch": 4274} {"train_loss": -25.73273277282715, "global_step": 354772, "epoch": 4274} {"train_loss": -25.605810165405273, "global_step": 354773, "epoch": 4274} {"train_loss": -26.086822509765625, "global_step": 354774, "epoch": 4274} {"train_loss": -25.643146514892578, "global_step": 354775, "epoch": 4274} {"train_loss": -26.167926788330078, "global_step": 354776, "epoch": 4274} {"train_loss": -26.14716911315918, "global_step": 354777, "epoch": 4274} {"train_loss": -26.139596939086914, "global_step": 354778, "epoch": 4274} {"train_loss": -26.119932174682617, "global_step": 354779, "epoch": 4274} {"train_loss": -26.04071044921875, "global_step": 354780, "epoch": 4274} {"train_loss": -26.027484893798828, "global_step": 354781, "epoch": 4274} {"train_loss": -26.140338897705078, "global_step": 354782, "epoch": 4274} {"train_loss": -26.464059829711914, "global_step": 354783, "epoch": 4274} {"train_loss": -26.047697067260742, "global_step": 354784, "epoch": 4274} {"train_loss": -26.37723159790039, "global_step": 354785, "epoch": 4274} {"train_loss": -26.100284576416016, "global_step": 354786, "epoch": 4274} {"train_loss": -26.022062301635742, "global_step": 354787, "epoch": 4274} {"train_loss": -26.373395919799805, "global_step": 354788, "epoch": 4274} {"train_loss": -26.109540939331055, "global_step": 354789, "epoch": 4274} {"train_loss": -26.198400497436523, "global_step": 354790, "epoch": 4274} {"train_loss": -26.589330673217773, "global_step": 354791, "epoch": 4274} {"train_loss": -26.12190818786621, "global_step": 354792, "epoch": 4274} {"train_loss": -26.417449951171875, "global_step": 354793, "epoch": 4274} {"train_loss": -26.034753799438477, "global_step": 354794, "epoch": 4274} {"train_loss": -26.564451217651367, "global_step": 354795, "epoch": 4274} {"train_loss": -26.247222900390625, "global_step": 354796, "epoch": 4274} {"train_loss": -26.721715927124023, "global_step": 354797, "epoch": 4274} {"train_loss": -26.763532638549805, "global_step": 354798, "epoch": 4274} {"train_loss": -26.046720504760742, "global_step": 354799, "epoch": 4274} {"train_loss": -26.091032028198242, "global_step": 354800, "epoch": 4274} {"train_loss": -26.12143325805664, "global_step": 354801, "epoch": 4274} {"train_loss": -26.282846450805664, "global_step": 354802, "epoch": 4274} {"train_loss": -25.95698356628418, "global_step": 354803, "epoch": 4274} {"train_loss": -25.64004898071289, "global_step": 354804, "epoch": 4274} {"train_loss": -25.846433639526367, "global_step": 354805, "epoch": 4274} {"train_loss": -26.182403564453125, "global_step": 354806, "epoch": 4274} {"train_loss": -25.962064743041992, "global_step": 354807, "epoch": 4274} {"train_loss": -25.87786293029785, "global_step": 354808, "epoch": 4274} {"train_loss": -26.10150146484375, "global_step": 354809, "epoch": 4274} {"train_loss": -25.99837303161621, "global_step": 354810, "epoch": 4274} {"train_loss": -25.745132446289062, "global_step": 354811, "epoch": 4274} {"train_loss": -26.223041534423828, "global_step": 354812, "epoch": 4274} {"train_loss": -26.000110626220703, "global_step": 354813, "epoch": 4274} {"train_loss": -26.232624053955078, "global_step": 354814, "epoch": 4274} {"train_loss": -26.642227172851562, "global_step": 354815, "epoch": 4274} {"train_loss": -26.010114669799805, "global_step": 354816, "epoch": 4274} {"train_loss": -26.09486198425293, "global_step": 354817, "epoch": 4274} {"train_loss": -26.005218505859375, "global_step": 354818, "epoch": 4274} {"train_loss": -26.087194442749023, "global_step": 354819, "epoch": 4274} {"train_loss": -26.13214111328125, "global_step": 354820, "epoch": 4274} {"train_loss": -25.795190811157227, "global_step": 354821, "epoch": 4274} {"train_loss": -25.5477352142334, "global_step": 354822, "epoch": 4274} {"train_loss": -26.105422973632812, "global_step": 354823, "epoch": 4274} {"train_loss": -25.757632772606538, "global_step": 354824, "epoch": 4274, "val_loss": 6617700.0} {"train_loss": -25.91983413696289, "global_step": 354825, "epoch": 4275} {"train_loss": -25.46636390686035, "global_step": 354826, "epoch": 4275} {"train_loss": -26.315006256103516, "global_step": 354827, "epoch": 4275} {"train_loss": -25.578805923461914, "global_step": 354828, "epoch": 4275} {"train_loss": -25.1038761138916, "global_step": 354829, "epoch": 4275} {"train_loss": -25.292375564575195, "global_step": 354830, "epoch": 4275} {"train_loss": -25.904142379760742, "global_step": 354831, "epoch": 4275} {"train_loss": -25.27137565612793, "global_step": 354832, "epoch": 4275} {"train_loss": -25.41383934020996, "global_step": 354833, "epoch": 4275} {"train_loss": -25.941572189331055, "global_step": 354834, "epoch": 4275} {"train_loss": -25.793729782104492, "global_step": 354835, "epoch": 4275} {"train_loss": -25.750503540039062, "global_step": 354836, "epoch": 4275} {"train_loss": -25.938135147094727, "global_step": 354837, "epoch": 4275} {"train_loss": -25.5848388671875, "global_step": 354838, "epoch": 4275} {"train_loss": -25.691205978393555, "global_step": 354839, "epoch": 4275} {"train_loss": -26.13984489440918, "global_step": 354840, "epoch": 4275} {"train_loss": -26.101776123046875, "global_step": 354841, "epoch": 4275} {"train_loss": -26.16517448425293, "global_step": 354842, "epoch": 4275} {"train_loss": -26.387502670288086, "global_step": 354843, "epoch": 4275} {"train_loss": -26.312116622924805, "global_step": 354844, "epoch": 4275} {"train_loss": -25.910612106323242, "global_step": 354845, "epoch": 4275} {"train_loss": -26.109216690063477, "global_step": 354846, "epoch": 4275} {"train_loss": -26.0632381439209, "global_step": 354847, "epoch": 4275} {"train_loss": -25.83680534362793, "global_step": 354848, "epoch": 4275} {"train_loss": -26.173202514648438, "global_step": 354849, "epoch": 4275} {"train_loss": -25.855382919311523, "global_step": 354850, "epoch": 4275} {"train_loss": -25.883996963500977, "global_step": 354851, "epoch": 4275} {"train_loss": -26.062824249267578, "global_step": 354852, "epoch": 4275} {"train_loss": -26.238739013671875, "global_step": 354853, "epoch": 4275} {"train_loss": -25.915760040283203, "global_step": 354854, "epoch": 4275} {"train_loss": -26.29725456237793, "global_step": 354855, "epoch": 4275} {"train_loss": -26.573638916015625, "global_step": 354856, "epoch": 4275} {"train_loss": -26.24811363220215, "global_step": 354857, "epoch": 4275} {"train_loss": -26.02373695373535, "global_step": 354858, "epoch": 4275} {"train_loss": -26.121801376342773, "global_step": 354859, "epoch": 4275} {"train_loss": -26.343915939331055, "global_step": 354860, "epoch": 4275} {"train_loss": -26.41370964050293, "global_step": 354861, "epoch": 4275} {"train_loss": -26.285364151000977, "global_step": 354862, "epoch": 4275} {"train_loss": -26.401371002197266, "global_step": 354863, "epoch": 4275} {"train_loss": -26.285110473632812, "global_step": 354864, "epoch": 4275} {"train_loss": -26.158239364624023, "global_step": 354865, "epoch": 4275} {"train_loss": -26.025604248046875, "global_step": 354866, "epoch": 4275} {"train_loss": -26.235157012939453, "global_step": 354867, "epoch": 4275} {"train_loss": -26.176639556884766, "global_step": 354868, "epoch": 4275} {"train_loss": -26.020612716674805, "global_step": 354869, "epoch": 4275} {"train_loss": -26.140119552612305, "global_step": 354870, "epoch": 4275} {"train_loss": -26.35357666015625, "global_step": 354871, "epoch": 4275} {"train_loss": -26.1309814453125, "global_step": 354872, "epoch": 4275} {"train_loss": -26.10194206237793, "global_step": 354873, "epoch": 4275} {"train_loss": -26.304590225219727, "global_step": 354874, "epoch": 4275} {"train_loss": -26.3375301361084, "global_step": 354875, "epoch": 4275} {"train_loss": -26.0378360748291, "global_step": 354876, "epoch": 4275} {"train_loss": -26.126300811767578, "global_step": 354877, "epoch": 4275} {"train_loss": -26.59303855895996, "global_step": 354878, "epoch": 4275} {"train_loss": -26.447574615478516, "global_step": 354879, "epoch": 4275} {"train_loss": -25.96343994140625, "global_step": 354880, "epoch": 4275} {"train_loss": -26.187341690063477, "global_step": 354881, "epoch": 4275} {"train_loss": -26.328088760375977, "global_step": 354882, "epoch": 4275} {"train_loss": -26.35979652404785, "global_step": 354883, "epoch": 4275} {"train_loss": -26.244281768798828, "global_step": 354884, "epoch": 4275} {"train_loss": -26.164846420288086, "global_step": 354885, "epoch": 4275} {"train_loss": -26.230606079101562, "global_step": 354886, "epoch": 4275} {"train_loss": -26.311603546142578, "global_step": 354887, "epoch": 4275} {"train_loss": -26.38372230529785, "global_step": 354888, "epoch": 4275} {"train_loss": -26.101734161376953, "global_step": 354889, "epoch": 4275} {"train_loss": -26.322370529174805, "global_step": 354890, "epoch": 4275} {"train_loss": -26.162683486938477, "global_step": 354891, "epoch": 4275} {"train_loss": -26.530017852783203, "global_step": 354892, "epoch": 4275} {"train_loss": -26.549823760986328, "global_step": 354893, "epoch": 4275} {"train_loss": -26.0606689453125, "global_step": 354894, "epoch": 4275} {"train_loss": -26.22736167907715, "global_step": 354895, "epoch": 4275} {"train_loss": -26.375818252563477, "global_step": 354896, "epoch": 4275} {"train_loss": -26.477874755859375, "global_step": 354897, "epoch": 4275} {"train_loss": -26.552637100219727, "global_step": 354898, "epoch": 4275} {"train_loss": -26.362476348876953, "global_step": 354899, "epoch": 4275} {"train_loss": -26.193008422851562, "global_step": 354900, "epoch": 4275} {"train_loss": -26.516454696655273, "global_step": 354901, "epoch": 4275} {"train_loss": -26.30144691467285, "global_step": 354902, "epoch": 4275} {"train_loss": -26.522674560546875, "global_step": 354903, "epoch": 4275} {"train_loss": -26.19959831237793, "global_step": 354904, "epoch": 4275} {"train_loss": -26.237455368041992, "global_step": 354905, "epoch": 4275} {"train_loss": -26.142541885375977, "global_step": 354906, "epoch": 4275} {"train_loss": -26.11639445661062, "global_step": 354907, "epoch": 4275, "val_loss": 6627534.0} {"train_loss": -25.911197662353516, "global_step": 354908, "epoch": 4276} {"train_loss": -25.08979034423828, "global_step": 354909, "epoch": 4276} {"train_loss": -25.058942794799805, "global_step": 354910, "epoch": 4276} {"train_loss": -24.764028549194336, "global_step": 354911, "epoch": 4276} {"train_loss": -25.57203483581543, "global_step": 354912, "epoch": 4276} {"train_loss": -25.613534927368164, "global_step": 354913, "epoch": 4276} {"train_loss": -25.44037437438965, "global_step": 354914, "epoch": 4276} {"train_loss": -25.49915885925293, "global_step": 354915, "epoch": 4276} {"train_loss": -25.59259605407715, "global_step": 354916, "epoch": 4276} {"train_loss": -25.909692764282227, "global_step": 354917, "epoch": 4276} {"train_loss": -25.9538631439209, "global_step": 354918, "epoch": 4276} {"train_loss": -26.14982032775879, "global_step": 354919, "epoch": 4276} {"train_loss": -25.745441436767578, "global_step": 354920, "epoch": 4276} {"train_loss": -25.28936767578125, "global_step": 354921, "epoch": 4276} {"train_loss": -25.7913761138916, "global_step": 354922, "epoch": 4276} {"train_loss": -25.806360244750977, "global_step": 354923, "epoch": 4276} {"train_loss": -25.740222930908203, "global_step": 354924, "epoch": 4276} {"train_loss": -26.06266212463379, "global_step": 354925, "epoch": 4276} {"train_loss": -25.739322662353516, "global_step": 354926, "epoch": 4276} {"train_loss": -25.711368560791016, "global_step": 354927, "epoch": 4276} {"train_loss": -25.6209659576416, "global_step": 354928, "epoch": 4276} {"train_loss": -26.100278854370117, "global_step": 354929, "epoch": 4276} {"train_loss": -25.996511459350586, "global_step": 354930, "epoch": 4276} {"train_loss": -25.83376121520996, "global_step": 354931, "epoch": 4276} {"train_loss": -25.54410743713379, "global_step": 354932, "epoch": 4276} {"train_loss": -25.969385147094727, "global_step": 354933, "epoch": 4276} {"train_loss": -25.835840225219727, "global_step": 354934, "epoch": 4276} {"train_loss": -26.281911849975586, "global_step": 354935, "epoch": 4276} {"train_loss": -25.756513595581055, "global_step": 354936, "epoch": 4276} {"train_loss": -26.12684440612793, "global_step": 354937, "epoch": 4276} {"train_loss": -26.08930778503418, "global_step": 354938, "epoch": 4276} {"train_loss": -25.915191650390625, "global_step": 354939, "epoch": 4276} {"train_loss": -26.559036254882812, "global_step": 354940, "epoch": 4276} {"train_loss": -26.289859771728516, "global_step": 354941, "epoch": 4276} {"train_loss": -26.49024772644043, "global_step": 354942, "epoch": 4276} {"train_loss": -26.663862228393555, "global_step": 354943, "epoch": 4276} {"train_loss": -26.348264694213867, "global_step": 354944, "epoch": 4276} {"train_loss": -26.276525497436523, "global_step": 354945, "epoch": 4276} {"train_loss": -26.2049617767334, "global_step": 354946, "epoch": 4276} {"train_loss": -26.0604305267334, "global_step": 354947, "epoch": 4276} {"train_loss": -25.988611221313477, "global_step": 354948, "epoch": 4276} {"train_loss": -26.256427764892578, "global_step": 354949, "epoch": 4276} {"train_loss": -26.07413673400879, "global_step": 354950, "epoch": 4276} {"train_loss": -25.9422664642334, "global_step": 354951, "epoch": 4276} {"train_loss": -26.32568359375, "global_step": 354952, "epoch": 4276} {"train_loss": -26.46942710876465, "global_step": 354953, "epoch": 4276} {"train_loss": -26.095258712768555, "global_step": 354954, "epoch": 4276} {"train_loss": -26.553720474243164, "global_step": 354955, "epoch": 4276} {"train_loss": -26.388397216796875, "global_step": 354956, "epoch": 4276} {"train_loss": -26.423059463500977, "global_step": 354957, "epoch": 4276} {"train_loss": -26.03165626525879, "global_step": 354958, "epoch": 4276} {"train_loss": -26.349552154541016, "global_step": 354959, "epoch": 4276} {"train_loss": -26.58070182800293, "global_step": 354960, "epoch": 4276} {"train_loss": -26.247512817382812, "global_step": 354961, "epoch": 4276} {"train_loss": -26.50909423828125, "global_step": 354962, "epoch": 4276} {"train_loss": -26.374746322631836, "global_step": 354963, "epoch": 4276} {"train_loss": -26.226755142211914, "global_step": 354964, "epoch": 4276} {"train_loss": -26.336593627929688, "global_step": 354965, "epoch": 4276} {"train_loss": -26.30718421936035, "global_step": 354966, "epoch": 4276} {"train_loss": -26.331090927124023, "global_step": 354967, "epoch": 4276} {"train_loss": -26.255268096923828, "global_step": 354968, "epoch": 4276} {"train_loss": -26.464658737182617, "global_step": 354969, "epoch": 4276} {"train_loss": -26.33546257019043, "global_step": 354970, "epoch": 4276} {"train_loss": -26.466236114501953, "global_step": 354971, "epoch": 4276} {"train_loss": -26.17365837097168, "global_step": 354972, "epoch": 4276} {"train_loss": -26.358030319213867, "global_step": 354973, "epoch": 4276} {"train_loss": -26.525678634643555, "global_step": 354974, "epoch": 4276} {"train_loss": -26.157093048095703, "global_step": 354975, "epoch": 4276} {"train_loss": -25.867055892944336, "global_step": 354976, "epoch": 4276} {"train_loss": -25.909147262573242, "global_step": 354977, "epoch": 4276} {"train_loss": -25.254934310913086, "global_step": 354978, "epoch": 4276} {"train_loss": -23.795255661010742, "global_step": 354979, "epoch": 4276} {"train_loss": -23.842681884765625, "global_step": 354980, "epoch": 4276} {"train_loss": -24.39299201965332, "global_step": 354981, "epoch": 4276} {"train_loss": -25.910614013671875, "global_step": 354982, "epoch": 4276} {"train_loss": -25.50979995727539, "global_step": 354983, "epoch": 4276} {"train_loss": -25.275943756103516, "global_step": 354984, "epoch": 4276} {"train_loss": -25.600265502929688, "global_step": 354985, "epoch": 4276} {"train_loss": -25.854145050048828, "global_step": 354986, "epoch": 4276} {"train_loss": -25.59276008605957, "global_step": 354987, "epoch": 4276} {"train_loss": -25.62941551208496, "global_step": 354988, "epoch": 4276} {"train_loss": -25.754430770874023, "global_step": 354989, "epoch": 4276} {"train_loss": -25.919638783098705, "global_step": 354990, "epoch": 4276, "val_loss": 6614759.5} {"train_loss": -25.338062286376953, "global_step": 354991, "epoch": 4277} {"train_loss": -25.710987091064453, "global_step": 354992, "epoch": 4277} {"train_loss": -25.44968605041504, "global_step": 354993, "epoch": 4277} {"train_loss": -25.49600601196289, "global_step": 354994, "epoch": 4277} {"train_loss": -25.830963134765625, "global_step": 354995, "epoch": 4277} {"train_loss": -25.455202102661133, "global_step": 354996, "epoch": 4277} {"train_loss": -25.410856246948242, "global_step": 354997, "epoch": 4277} {"train_loss": -25.839242935180664, "global_step": 354998, "epoch": 4277} {"train_loss": -25.465078353881836, "global_step": 354999, "epoch": 4277} {"train_loss": -25.860380172729492, "global_step": 355000, "epoch": 4277} {"train_loss": -25.504499435424805, "global_step": 355001, "epoch": 4277} {"train_loss": -25.52324676513672, "global_step": 355002, "epoch": 4277} {"train_loss": -25.8608341217041, "global_step": 355003, "epoch": 4277} {"train_loss": -25.903156280517578, "global_step": 355004, "epoch": 4277} {"train_loss": -25.66517448425293, "global_step": 355005, "epoch": 4277} {"train_loss": -25.829288482666016, "global_step": 355006, "epoch": 4277} {"train_loss": -25.8802433013916, "global_step": 355007, "epoch": 4277} {"train_loss": -25.902795791625977, "global_step": 355008, "epoch": 4277} {"train_loss": -26.341495513916016, "global_step": 355009, "epoch": 4277} {"train_loss": -26.03009605407715, "global_step": 355010, "epoch": 4277} {"train_loss": -26.253814697265625, "global_step": 355011, "epoch": 4277} {"train_loss": -25.935373306274414, "global_step": 355012, "epoch": 4277} {"train_loss": -26.385297775268555, "global_step": 355013, "epoch": 4277} {"train_loss": -26.202392578125, "global_step": 355014, "epoch": 4277} {"train_loss": -25.85674476623535, "global_step": 355015, "epoch": 4277} {"train_loss": -25.860822677612305, "global_step": 355016, "epoch": 4277} {"train_loss": -26.16938591003418, "global_step": 355017, "epoch": 4277} {"train_loss": -26.334909439086914, "global_step": 355018, "epoch": 4277} {"train_loss": -26.108230590820312, "global_step": 355019, "epoch": 4277} {"train_loss": -26.170730590820312, "global_step": 355020, "epoch": 4277} {"train_loss": -26.142715454101562, "global_step": 355021, "epoch": 4277} {"train_loss": -26.102746963500977, "global_step": 355022, "epoch": 4277} {"train_loss": -26.3629150390625, "global_step": 355023, "epoch": 4277} {"train_loss": -26.248931884765625, "global_step": 355024, "epoch": 4277} {"train_loss": -26.3916072845459, "global_step": 355025, "epoch": 4277} {"train_loss": -26.425662994384766, "global_step": 355026, "epoch": 4277} {"train_loss": -26.356775283813477, "global_step": 355027, "epoch": 4277} {"train_loss": -26.252826690673828, "global_step": 355028, "epoch": 4277} {"train_loss": -26.735992431640625, "global_step": 355029, "epoch": 4277} {"train_loss": -26.510656356811523, "global_step": 355030, "epoch": 4277} {"train_loss": -26.572519302368164, "global_step": 355031, "epoch": 4277} {"train_loss": -26.23097038269043, "global_step": 355032, "epoch": 4277} {"train_loss": -26.77762794494629, "global_step": 355033, "epoch": 4277} {"train_loss": -26.741607666015625, "global_step": 355034, "epoch": 4277} {"train_loss": -26.228565216064453, "global_step": 355035, "epoch": 4277} {"train_loss": -26.113712310791016, "global_step": 355036, "epoch": 4277} {"train_loss": -26.214752197265625, "global_step": 355037, "epoch": 4277} {"train_loss": -26.54144859313965, "global_step": 355038, "epoch": 4277} {"train_loss": -25.95516014099121, "global_step": 355039, "epoch": 4277} {"train_loss": -26.45151138305664, "global_step": 355040, "epoch": 4277} {"train_loss": -26.69019889831543, "global_step": 355041, "epoch": 4277} {"train_loss": -26.175018310546875, "global_step": 355042, "epoch": 4277} {"train_loss": -26.2773494720459, "global_step": 355043, "epoch": 4277} {"train_loss": -26.02081871032715, "global_step": 355044, "epoch": 4277} {"train_loss": -26.167795181274414, "global_step": 355045, "epoch": 4277} {"train_loss": -25.793912887573242, "global_step": 355046, "epoch": 4277} {"train_loss": -25.27066993713379, "global_step": 355047, "epoch": 4277} {"train_loss": -26.18572998046875, "global_step": 355048, "epoch": 4277} {"train_loss": -26.192773818969727, "global_step": 355049, "epoch": 4277} {"train_loss": -25.96491050720215, "global_step": 355050, "epoch": 4277} {"train_loss": -25.78407859802246, "global_step": 355051, "epoch": 4277} {"train_loss": -26.292871475219727, "global_step": 355052, "epoch": 4277} {"train_loss": -25.977949142456055, "global_step": 355053, "epoch": 4277} {"train_loss": -26.4112491607666, "global_step": 355054, "epoch": 4277} {"train_loss": -26.2625675201416, "global_step": 355055, "epoch": 4277} {"train_loss": -26.03558349609375, "global_step": 355056, "epoch": 4277} {"train_loss": -25.938013076782227, "global_step": 355057, "epoch": 4277} {"train_loss": -26.143680572509766, "global_step": 355058, "epoch": 4277} {"train_loss": -26.085844039916992, "global_step": 355059, "epoch": 4277} {"train_loss": -26.238004684448242, "global_step": 355060, "epoch": 4277} {"train_loss": -26.14324378967285, "global_step": 355061, "epoch": 4277} {"train_loss": -26.16758155822754, "global_step": 355062, "epoch": 4277} {"train_loss": -25.836654663085938, "global_step": 355063, "epoch": 4277} {"train_loss": -26.496557235717773, "global_step": 355064, "epoch": 4277} {"train_loss": -26.271284103393555, "global_step": 355065, "epoch": 4277} {"train_loss": -26.093658447265625, "global_step": 355066, "epoch": 4277} {"train_loss": -26.172138214111328, "global_step": 355067, "epoch": 4277} {"train_loss": -26.15700340270996, "global_step": 355068, "epoch": 4277} {"train_loss": -26.267908096313477, "global_step": 355069, "epoch": 4277} {"train_loss": -26.27138328552246, "global_step": 355070, "epoch": 4277} {"train_loss": -26.35407066345215, "global_step": 355071, "epoch": 4277} {"train_loss": -25.980512619018555, "global_step": 355072, "epoch": 4277} {"train_loss": -26.089760607983692, "global_step": 355073, "epoch": 4277, "val_loss": 6563792.0} {"train_loss": -26.00208854675293, "global_step": 355074, "epoch": 4278} {"train_loss": -26.068470001220703, "global_step": 355075, "epoch": 4278} {"train_loss": -26.226993560791016, "global_step": 355076, "epoch": 4278} {"train_loss": -25.529211044311523, "global_step": 355077, "epoch": 4278} {"train_loss": -25.233877182006836, "global_step": 355078, "epoch": 4278} {"train_loss": -26.093793869018555, "global_step": 355079, "epoch": 4278} {"train_loss": -25.96895408630371, "global_step": 355080, "epoch": 4278} {"train_loss": -25.96931266784668, "global_step": 355081, "epoch": 4278} {"train_loss": -25.290796279907227, "global_step": 355082, "epoch": 4278} {"train_loss": -25.650548934936523, "global_step": 355083, "epoch": 4278} {"train_loss": -26.0926570892334, "global_step": 355084, "epoch": 4278} {"train_loss": -26.10638999938965, "global_step": 355085, "epoch": 4278} {"train_loss": -25.97572135925293, "global_step": 355086, "epoch": 4278} {"train_loss": -26.1191349029541, "global_step": 355087, "epoch": 4278} {"train_loss": -25.782445907592773, "global_step": 355088, "epoch": 4278} {"train_loss": -25.87149429321289, "global_step": 355089, "epoch": 4278} {"train_loss": -26.036575317382812, "global_step": 355090, "epoch": 4278} {"train_loss": -26.233495712280273, "global_step": 355091, "epoch": 4278} {"train_loss": -26.39347267150879, "global_step": 355092, "epoch": 4278} {"train_loss": -26.172876358032227, "global_step": 355093, "epoch": 4278} {"train_loss": -26.367095947265625, "global_step": 355094, "epoch": 4278} {"train_loss": -26.39857292175293, "global_step": 355095, "epoch": 4278} {"train_loss": -25.791608810424805, "global_step": 355096, "epoch": 4278} {"train_loss": -26.25826072692871, "global_step": 355097, "epoch": 4278} {"train_loss": -26.374866485595703, "global_step": 355098, "epoch": 4278} {"train_loss": -26.049869537353516, "global_step": 355099, "epoch": 4278} {"train_loss": -25.9617919921875, "global_step": 355100, "epoch": 4278} {"train_loss": -26.322589874267578, "global_step": 355101, "epoch": 4278} {"train_loss": -26.25225257873535, "global_step": 355102, "epoch": 4278} {"train_loss": -26.198150634765625, "global_step": 355103, "epoch": 4278} {"train_loss": -26.80805015563965, "global_step": 355104, "epoch": 4278} {"train_loss": -25.825830459594727, "global_step": 355105, "epoch": 4278} {"train_loss": -26.256546020507812, "global_step": 355106, "epoch": 4278} {"train_loss": -26.386005401611328, "global_step": 355107, "epoch": 4278} {"train_loss": -26.477025985717773, "global_step": 355108, "epoch": 4278} {"train_loss": -26.3148136138916, "global_step": 355109, "epoch": 4278} {"train_loss": -26.139875411987305, "global_step": 355110, "epoch": 4278} {"train_loss": -26.604658126831055, "global_step": 355111, "epoch": 4278} {"train_loss": -26.418380737304688, "global_step": 355112, "epoch": 4278} {"train_loss": -26.1634521484375, "global_step": 355113, "epoch": 4278} {"train_loss": -26.450286865234375, "global_step": 355114, "epoch": 4278} {"train_loss": -26.20663833618164, "global_step": 355115, "epoch": 4278} {"train_loss": -26.278778076171875, "global_step": 355116, "epoch": 4278} {"train_loss": -26.499786376953125, "global_step": 355117, "epoch": 4278} {"train_loss": -26.2712345123291, "global_step": 355118, "epoch": 4278} {"train_loss": -26.3530216217041, "global_step": 355119, "epoch": 4278} {"train_loss": -26.355243682861328, "global_step": 355120, "epoch": 4278} {"train_loss": -26.5003662109375, "global_step": 355121, "epoch": 4278} {"train_loss": -26.375030517578125, "global_step": 355122, "epoch": 4278} {"train_loss": -26.41302490234375, "global_step": 355123, "epoch": 4278} {"train_loss": -26.43304443359375, "global_step": 355124, "epoch": 4278} {"train_loss": -25.97369956970215, "global_step": 355125, "epoch": 4278} {"train_loss": -26.534170150756836, "global_step": 355126, "epoch": 4278} {"train_loss": -26.35175132751465, "global_step": 355127, "epoch": 4278} {"train_loss": -26.28464698791504, "global_step": 355128, "epoch": 4278} {"train_loss": -26.524030685424805, "global_step": 355129, "epoch": 4278} {"train_loss": -26.269367218017578, "global_step": 355130, "epoch": 4278} {"train_loss": -25.963865280151367, "global_step": 355131, "epoch": 4278} {"train_loss": -25.778823852539062, "global_step": 355132, "epoch": 4278} {"train_loss": -26.122894287109375, "global_step": 355133, "epoch": 4278} {"train_loss": -26.57203483581543, "global_step": 355134, "epoch": 4278} {"train_loss": -25.821447372436523, "global_step": 355135, "epoch": 4278} {"train_loss": -26.45627212524414, "global_step": 355136, "epoch": 4278} {"train_loss": -26.0675048828125, "global_step": 355137, "epoch": 4278} {"train_loss": -26.456857681274414, "global_step": 355138, "epoch": 4278} {"train_loss": -26.0650634765625, "global_step": 355139, "epoch": 4278} {"train_loss": -26.05048179626465, "global_step": 355140, "epoch": 4278} {"train_loss": -26.14206314086914, "global_step": 355141, "epoch": 4278} {"train_loss": -25.865503311157227, "global_step": 355142, "epoch": 4278} {"train_loss": -25.73493766784668, "global_step": 355143, "epoch": 4278} {"train_loss": -26.033002853393555, "global_step": 355144, "epoch": 4278} {"train_loss": -25.727041244506836, "global_step": 355145, "epoch": 4278} {"train_loss": -26.18168067932129, "global_step": 355146, "epoch": 4278} {"train_loss": -26.135549545288086, "global_step": 355147, "epoch": 4278} {"train_loss": -26.487699508666992, "global_step": 355148, "epoch": 4278} {"train_loss": -26.475244522094727, "global_step": 355149, "epoch": 4278} {"train_loss": -26.1358642578125, "global_step": 355150, "epoch": 4278} {"train_loss": -26.033430099487305, "global_step": 355151, "epoch": 4278} {"train_loss": -26.02255630493164, "global_step": 355152, "epoch": 4278} {"train_loss": -26.063688278198242, "global_step": 355153, "epoch": 4278} {"train_loss": -26.073339462280273, "global_step": 355154, "epoch": 4278} {"train_loss": -26.31867027282715, "global_step": 355155, "epoch": 4278} {"train_loss": -26.158907097506237, "global_step": 355156, "epoch": 4278, "val_loss": 6741144.0} {"train_loss": -25.465290069580078, "global_step": 355157, "epoch": 4279} {"train_loss": -25.99245262145996, "global_step": 355158, "epoch": 4279} {"train_loss": -26.106794357299805, "global_step": 355159, "epoch": 4279} {"train_loss": -25.98871421813965, "global_step": 355160, "epoch": 4279} {"train_loss": -25.621374130249023, "global_step": 355161, "epoch": 4279} {"train_loss": -25.814289093017578, "global_step": 355162, "epoch": 4279} {"train_loss": -25.672887802124023, "global_step": 355163, "epoch": 4279} {"train_loss": -26.07948112487793, "global_step": 355164, "epoch": 4279} {"train_loss": -26.209320068359375, "global_step": 355165, "epoch": 4279} {"train_loss": -25.802539825439453, "global_step": 355166, "epoch": 4279} {"train_loss": -25.74051856994629, "global_step": 355167, "epoch": 4279} {"train_loss": -25.807580947875977, "global_step": 355168, "epoch": 4279} {"train_loss": -26.1177921295166, "global_step": 355169, "epoch": 4279} {"train_loss": -25.956220626831055, "global_step": 355170, "epoch": 4279} {"train_loss": -26.17315101623535, "global_step": 355171, "epoch": 4279} {"train_loss": -25.7069149017334, "global_step": 355172, "epoch": 4279} {"train_loss": -25.43267250061035, "global_step": 355173, "epoch": 4279} {"train_loss": -25.91120719909668, "global_step": 355174, "epoch": 4279} {"train_loss": -26.25149917602539, "global_step": 355175, "epoch": 4279} {"train_loss": -26.294605255126953, "global_step": 355176, "epoch": 4279} {"train_loss": -26.509435653686523, "global_step": 355177, "epoch": 4279} {"train_loss": -26.0111083984375, "global_step": 355178, "epoch": 4279} {"train_loss": -26.140384674072266, "global_step": 355179, "epoch": 4279} {"train_loss": -26.303674697875977, "global_step": 355180, "epoch": 4279} {"train_loss": -25.955785751342773, "global_step": 355181, "epoch": 4279} {"train_loss": -25.94727897644043, "global_step": 355182, "epoch": 4279} {"train_loss": -25.85747718811035, "global_step": 355183, "epoch": 4279} {"train_loss": -25.704212188720703, "global_step": 355184, "epoch": 4279} {"train_loss": -25.907073974609375, "global_step": 355185, "epoch": 4279} {"train_loss": -26.35820960998535, "global_step": 355186, "epoch": 4279} {"train_loss": -26.342853546142578, "global_step": 355187, "epoch": 4279} {"train_loss": -26.405065536499023, "global_step": 355188, "epoch": 4279} {"train_loss": -26.4180965423584, "global_step": 355189, "epoch": 4279} {"train_loss": -26.193710327148438, "global_step": 355190, "epoch": 4279} {"train_loss": -25.824506759643555, "global_step": 355191, "epoch": 4279} {"train_loss": -26.173583984375, "global_step": 355192, "epoch": 4279} {"train_loss": -26.231159210205078, "global_step": 355193, "epoch": 4279} {"train_loss": -26.32880973815918, "global_step": 355194, "epoch": 4279} {"train_loss": -25.791248321533203, "global_step": 355195, "epoch": 4279} {"train_loss": -26.164310455322266, "global_step": 355196, "epoch": 4279} {"train_loss": -26.27483558654785, "global_step": 355197, "epoch": 4279} {"train_loss": -26.264921188354492, "global_step": 355198, "epoch": 4279} {"train_loss": -26.363239288330078, "global_step": 355199, "epoch": 4279} {"train_loss": -26.577112197875977, "global_step": 355200, "epoch": 4279} {"train_loss": -25.96882438659668, "global_step": 355201, "epoch": 4279} {"train_loss": -25.8507137298584, "global_step": 355202, "epoch": 4279} {"train_loss": -25.879262924194336, "global_step": 355203, "epoch": 4279} {"train_loss": -26.608814239501953, "global_step": 355204, "epoch": 4279} {"train_loss": -26.50615882873535, "global_step": 355205, "epoch": 4279} {"train_loss": -26.235998153686523, "global_step": 355206, "epoch": 4279} {"train_loss": -26.012165069580078, "global_step": 355207, "epoch": 4279} {"train_loss": -26.0358829498291, "global_step": 355208, "epoch": 4279} {"train_loss": -26.131031036376953, "global_step": 355209, "epoch": 4279} {"train_loss": -26.054758071899414, "global_step": 355210, "epoch": 4279} {"train_loss": -26.184789657592773, "global_step": 355211, "epoch": 4279} {"train_loss": -25.818090438842773, "global_step": 355212, "epoch": 4279} {"train_loss": -26.40932273864746, "global_step": 355213, "epoch": 4279} {"train_loss": -26.163196563720703, "global_step": 355214, "epoch": 4279} {"train_loss": -26.153308868408203, "global_step": 355215, "epoch": 4279} {"train_loss": -26.09748649597168, "global_step": 355216, "epoch": 4279} {"train_loss": -26.36663818359375, "global_step": 355217, "epoch": 4279} {"train_loss": -26.24482536315918, "global_step": 355218, "epoch": 4279} {"train_loss": -26.215885162353516, "global_step": 355219, "epoch": 4279} {"train_loss": -26.075611114501953, "global_step": 355220, "epoch": 4279} {"train_loss": -26.217803955078125, "global_step": 355221, "epoch": 4279} {"train_loss": -26.514789581298828, "global_step": 355222, "epoch": 4279} {"train_loss": -26.380298614501953, "global_step": 355223, "epoch": 4279} {"train_loss": -26.35370445251465, "global_step": 355224, "epoch": 4279} {"train_loss": -26.44459342956543, "global_step": 355225, "epoch": 4279} {"train_loss": -26.68497657775879, "global_step": 355226, "epoch": 4279} {"train_loss": -26.220792770385742, "global_step": 355227, "epoch": 4279} {"train_loss": -26.2467041015625, "global_step": 355228, "epoch": 4279} {"train_loss": -26.305761337280273, "global_step": 355229, "epoch": 4279} {"train_loss": -26.105695724487305, "global_step": 355230, "epoch": 4279} {"train_loss": -26.441144943237305, "global_step": 355231, "epoch": 4279} {"train_loss": -26.23249626159668, "global_step": 355232, "epoch": 4279} {"train_loss": -26.245885848999023, "global_step": 355233, "epoch": 4279} {"train_loss": -26.433551788330078, "global_step": 355234, "epoch": 4279} {"train_loss": -26.475330352783203, "global_step": 355235, "epoch": 4279} {"train_loss": -26.240991592407227, "global_step": 355236, "epoch": 4279} {"train_loss": -26.444440841674805, "global_step": 355237, "epoch": 4279} {"train_loss": -26.333988189697266, "global_step": 355238, "epoch": 4279} {"train_loss": -26.139119320605175, "global_step": 355239, "epoch": 4279, "val_loss": 6637154.5} {"train_loss": -24.956830978393555, "global_step": 355240, "epoch": 4280} {"train_loss": -24.905624389648438, "global_step": 355241, "epoch": 4280} {"train_loss": -24.099641799926758, "global_step": 355242, "epoch": 4280} {"train_loss": -24.70522689819336, "global_step": 355243, "epoch": 4280} {"train_loss": -24.910842895507812, "global_step": 355244, "epoch": 4280} {"train_loss": -24.913320541381836, "global_step": 355245, "epoch": 4280} {"train_loss": -25.096298217773438, "global_step": 355246, "epoch": 4280} {"train_loss": -25.531932830810547, "global_step": 355247, "epoch": 4280} {"train_loss": -25.45477867126465, "global_step": 355248, "epoch": 4280} {"train_loss": -25.561704635620117, "global_step": 355249, "epoch": 4280} {"train_loss": -25.498254776000977, "global_step": 355250, "epoch": 4280} {"train_loss": -25.890161514282227, "global_step": 355251, "epoch": 4280} {"train_loss": -25.585309982299805, "global_step": 355252, "epoch": 4280} {"train_loss": -25.7042236328125, "global_step": 355253, "epoch": 4280} {"train_loss": -25.824676513671875, "global_step": 355254, "epoch": 4280} {"train_loss": -25.6817684173584, "global_step": 355255, "epoch": 4280} {"train_loss": -26.025714874267578, "global_step": 355256, "epoch": 4280} {"train_loss": -25.859588623046875, "global_step": 355257, "epoch": 4280} {"train_loss": -25.83796501159668, "global_step": 355258, "epoch": 4280} {"train_loss": -25.603620529174805, "global_step": 355259, "epoch": 4280} {"train_loss": -25.47933006286621, "global_step": 355260, "epoch": 4280} {"train_loss": -25.85401725769043, "global_step": 355261, "epoch": 4280} {"train_loss": -25.752307891845703, "global_step": 355262, "epoch": 4280} {"train_loss": -25.96854019165039, "global_step": 355263, "epoch": 4280} {"train_loss": -26.21710205078125, "global_step": 355264, "epoch": 4280} {"train_loss": -26.019287109375, "global_step": 355265, "epoch": 4280} {"train_loss": -26.142255783081055, "global_step": 355266, "epoch": 4280} {"train_loss": -25.91552734375, "global_step": 355267, "epoch": 4280} {"train_loss": -26.295185089111328, "global_step": 355268, "epoch": 4280} {"train_loss": -26.139013290405273, "global_step": 355269, "epoch": 4280} {"train_loss": -25.913089752197266, "global_step": 355270, "epoch": 4280} {"train_loss": -26.124128341674805, "global_step": 355271, "epoch": 4280} {"train_loss": -26.097614288330078, "global_step": 355272, "epoch": 4280} {"train_loss": -25.977033615112305, "global_step": 355273, "epoch": 4280} {"train_loss": -26.550552368164062, "global_step": 355274, "epoch": 4280} {"train_loss": -26.223508834838867, "global_step": 355275, "epoch": 4280} {"train_loss": -26.518033981323242, "global_step": 355276, "epoch": 4280} {"train_loss": -26.234851837158203, "global_step": 355277, "epoch": 4280} {"train_loss": -26.5114803314209, "global_step": 355278, "epoch": 4280} {"train_loss": -26.395950317382812, "global_step": 355279, "epoch": 4280} {"train_loss": -26.31580924987793, "global_step": 355280, "epoch": 4280} {"train_loss": -26.39129066467285, "global_step": 355281, "epoch": 4280} {"train_loss": -26.408771514892578, "global_step": 355282, "epoch": 4280} {"train_loss": -26.002378463745117, "global_step": 355283, "epoch": 4280} {"train_loss": -26.244613647460938, "global_step": 355284, "epoch": 4280} {"train_loss": -26.048816680908203, "global_step": 355285, "epoch": 4280} {"train_loss": -26.443212509155273, "global_step": 355286, "epoch": 4280} {"train_loss": -26.219945907592773, "global_step": 355287, "epoch": 4280} {"train_loss": -26.015380859375, "global_step": 355288, "epoch": 4280} {"train_loss": -26.3780460357666, "global_step": 355289, "epoch": 4280} {"train_loss": -26.147724151611328, "global_step": 355290, "epoch": 4280} {"train_loss": -26.336515426635742, "global_step": 355291, "epoch": 4280} {"train_loss": -26.10914421081543, "global_step": 355292, "epoch": 4280} {"train_loss": -26.519500732421875, "global_step": 355293, "epoch": 4280} {"train_loss": -26.66377067565918, "global_step": 355294, "epoch": 4280} {"train_loss": -26.0789794921875, "global_step": 355295, "epoch": 4280} {"train_loss": -26.4847412109375, "global_step": 355296, "epoch": 4280} {"train_loss": -26.580718994140625, "global_step": 355297, "epoch": 4280} {"train_loss": -26.3751220703125, "global_step": 355298, "epoch": 4280} {"train_loss": -26.55426025390625, "global_step": 355299, "epoch": 4280} {"train_loss": -26.11275291442871, "global_step": 355300, "epoch": 4280} {"train_loss": -26.407032012939453, "global_step": 355301, "epoch": 4280} {"train_loss": -26.514188766479492, "global_step": 355302, "epoch": 4280} {"train_loss": -26.27535057067871, "global_step": 355303, "epoch": 4280} {"train_loss": -25.9674015045166, "global_step": 355304, "epoch": 4280} {"train_loss": -26.17949867248535, "global_step": 355305, "epoch": 4280} {"train_loss": -25.9207706451416, "global_step": 355306, "epoch": 4280} {"train_loss": -26.306852340698242, "global_step": 355307, "epoch": 4280} {"train_loss": -26.732446670532227, "global_step": 355308, "epoch": 4280} {"train_loss": -26.2777099609375, "global_step": 355309, "epoch": 4280} {"train_loss": -26.20513343811035, "global_step": 355310, "epoch": 4280} {"train_loss": -25.533849716186523, "global_step": 355311, "epoch": 4280} {"train_loss": -25.92328453063965, "global_step": 355312, "epoch": 4280} {"train_loss": -26.17477798461914, "global_step": 355313, "epoch": 4280} {"train_loss": -26.236602783203125, "global_step": 355314, "epoch": 4280} {"train_loss": -26.360742568969727, "global_step": 355315, "epoch": 4280} {"train_loss": -25.836578369140625, "global_step": 355316, "epoch": 4280} {"train_loss": -25.806243896484375, "global_step": 355317, "epoch": 4280} {"train_loss": -26.3304443359375, "global_step": 355318, "epoch": 4280} {"train_loss": -26.2860107421875, "global_step": 355319, "epoch": 4280} {"train_loss": -25.739904403686523, "global_step": 355320, "epoch": 4280} {"train_loss": -25.601354598999023, "global_step": 355321, "epoch": 4280} {"train_loss": -25.972392829067736, "global_step": 355322, "epoch": 4280, "val_loss": 6650927.0} {"train_loss": -25.23337173461914, "global_step": 355323, "epoch": 4281} {"train_loss": -25.62286376953125, "global_step": 355324, "epoch": 4281} {"train_loss": -25.644681930541992, "global_step": 355325, "epoch": 4281} {"train_loss": -25.232004165649414, "global_step": 355326, "epoch": 4281} {"train_loss": -25.938383102416992, "global_step": 355327, "epoch": 4281} {"train_loss": -25.603071212768555, "global_step": 355328, "epoch": 4281} {"train_loss": -25.497636795043945, "global_step": 355329, "epoch": 4281} {"train_loss": -25.94266128540039, "global_step": 355330, "epoch": 4281} {"train_loss": -25.685138702392578, "global_step": 355331, "epoch": 4281} {"train_loss": -25.679935455322266, "global_step": 355332, "epoch": 4281} {"train_loss": -25.530685424804688, "global_step": 355333, "epoch": 4281} {"train_loss": -25.429874420166016, "global_step": 355334, "epoch": 4281} {"train_loss": -25.504846572875977, "global_step": 355335, "epoch": 4281} {"train_loss": -26.560123443603516, "global_step": 355336, "epoch": 4281} {"train_loss": -25.66741371154785, "global_step": 355337, "epoch": 4281} {"train_loss": -25.512439727783203, "global_step": 355338, "epoch": 4281} {"train_loss": -25.971805572509766, "global_step": 355339, "epoch": 4281} {"train_loss": -25.819629669189453, "global_step": 355340, "epoch": 4281} {"train_loss": -25.677881240844727, "global_step": 355341, "epoch": 4281} {"train_loss": -25.84503746032715, "global_step": 355342, "epoch": 4281} {"train_loss": -26.235151290893555, "global_step": 355343, "epoch": 4281} {"train_loss": -26.057126998901367, "global_step": 355344, "epoch": 4281} {"train_loss": -26.11911392211914, "global_step": 355345, "epoch": 4281} {"train_loss": -25.92428970336914, "global_step": 355346, "epoch": 4281} {"train_loss": -26.270233154296875, "global_step": 355347, "epoch": 4281} {"train_loss": -26.15022850036621, "global_step": 355348, "epoch": 4281} {"train_loss": -25.90675163269043, "global_step": 355349, "epoch": 4281} {"train_loss": -26.222824096679688, "global_step": 355350, "epoch": 4281} {"train_loss": -26.383764266967773, "global_step": 355351, "epoch": 4281} {"train_loss": -26.024831771850586, "global_step": 355352, "epoch": 4281} {"train_loss": -25.788497924804688, "global_step": 355353, "epoch": 4281} {"train_loss": -26.146780014038086, "global_step": 355354, "epoch": 4281} {"train_loss": -26.283111572265625, "global_step": 355355, "epoch": 4281} {"train_loss": -25.831695556640625, "global_step": 355356, "epoch": 4281} {"train_loss": -26.6538028717041, "global_step": 355357, "epoch": 4281} {"train_loss": -26.25250244140625, "global_step": 355358, "epoch": 4281} {"train_loss": -26.136877059936523, "global_step": 355359, "epoch": 4281} {"train_loss": -26.176870346069336, "global_step": 355360, "epoch": 4281} {"train_loss": -26.158111572265625, "global_step": 355361, "epoch": 4281} {"train_loss": -26.317930221557617, "global_step": 355362, "epoch": 4281} {"train_loss": -26.228683471679688, "global_step": 355363, "epoch": 4281} {"train_loss": -26.139190673828125, "global_step": 355364, "epoch": 4281} {"train_loss": -26.125986099243164, "global_step": 355365, "epoch": 4281} {"train_loss": -26.163040161132812, "global_step": 355366, "epoch": 4281} {"train_loss": -25.966339111328125, "global_step": 355367, "epoch": 4281} {"train_loss": -26.5289249420166, "global_step": 355368, "epoch": 4281} {"train_loss": -25.953556060791016, "global_step": 355369, "epoch": 4281} {"train_loss": -26.3616943359375, "global_step": 355370, "epoch": 4281} {"train_loss": -26.205724716186523, "global_step": 355371, "epoch": 4281} {"train_loss": -26.055383682250977, "global_step": 355372, "epoch": 4281} {"train_loss": -26.136005401611328, "global_step": 355373, "epoch": 4281} {"train_loss": -26.082141876220703, "global_step": 355374, "epoch": 4281} {"train_loss": -26.3670711517334, "global_step": 355375, "epoch": 4281} {"train_loss": -26.22673988342285, "global_step": 355376, "epoch": 4281} {"train_loss": -26.64252281188965, "global_step": 355377, "epoch": 4281} {"train_loss": -26.27625846862793, "global_step": 355378, "epoch": 4281} {"train_loss": -26.45857810974121, "global_step": 355379, "epoch": 4281} {"train_loss": -26.477985382080078, "global_step": 355380, "epoch": 4281} {"train_loss": -26.515928268432617, "global_step": 355381, "epoch": 4281} {"train_loss": -26.10271644592285, "global_step": 355382, "epoch": 4281} {"train_loss": -26.235721588134766, "global_step": 355383, "epoch": 4281} {"train_loss": -26.248395919799805, "global_step": 355384, "epoch": 4281} {"train_loss": -26.258569717407227, "global_step": 355385, "epoch": 4281} {"train_loss": -26.048261642456055, "global_step": 355386, "epoch": 4281} {"train_loss": -26.0579891204834, "global_step": 355387, "epoch": 4281} {"train_loss": -26.231658935546875, "global_step": 355388, "epoch": 4281} {"train_loss": -26.19681167602539, "global_step": 355389, "epoch": 4281} {"train_loss": -26.523117065429688, "global_step": 355390, "epoch": 4281} {"train_loss": -26.01568603515625, "global_step": 355391, "epoch": 4281} {"train_loss": -25.931324005126953, "global_step": 355392, "epoch": 4281} {"train_loss": -25.879438400268555, "global_step": 355393, "epoch": 4281} {"train_loss": -26.159042358398438, "global_step": 355394, "epoch": 4281} {"train_loss": -26.465911865234375, "global_step": 355395, "epoch": 4281} {"train_loss": -26.028400421142578, "global_step": 355396, "epoch": 4281} {"train_loss": -26.13397216796875, "global_step": 355397, "epoch": 4281} {"train_loss": -26.112262725830078, "global_step": 355398, "epoch": 4281} {"train_loss": -26.229883193969727, "global_step": 355399, "epoch": 4281} {"train_loss": -25.56781578063965, "global_step": 355400, "epoch": 4281} {"train_loss": -26.197107315063477, "global_step": 355401, "epoch": 4281} {"train_loss": -26.142719268798828, "global_step": 355402, "epoch": 4281} {"train_loss": -25.893619537353516, "global_step": 355403, "epoch": 4281} {"train_loss": -25.943878173828125, "global_step": 355404, "epoch": 4281} {"train_loss": -26.050067993531744, "global_step": 355405, "epoch": 4281, "val_loss": 6748823.5} {"train_loss": -25.96111488342285, "global_step": 355406, "epoch": 4282} {"train_loss": -25.85658073425293, "global_step": 355407, "epoch": 4282} {"train_loss": -25.596708297729492, "global_step": 355408, "epoch": 4282} {"train_loss": -25.99859046936035, "global_step": 355409, "epoch": 4282} {"train_loss": -25.828821182250977, "global_step": 355410, "epoch": 4282} {"train_loss": -26.0925235748291, "global_step": 355411, "epoch": 4282} {"train_loss": -25.519393920898438, "global_step": 355412, "epoch": 4282} {"train_loss": -26.090234756469727, "global_step": 355413, "epoch": 4282} {"train_loss": -25.860919952392578, "global_step": 355414, "epoch": 4282} {"train_loss": -25.642593383789062, "global_step": 355415, "epoch": 4282} {"train_loss": -26.19886589050293, "global_step": 355416, "epoch": 4282} {"train_loss": -26.130786895751953, "global_step": 355417, "epoch": 4282} {"train_loss": -25.546066284179688, "global_step": 355418, "epoch": 4282} {"train_loss": -26.001230239868164, "global_step": 355419, "epoch": 4282} {"train_loss": -26.121301651000977, "global_step": 355420, "epoch": 4282} {"train_loss": -26.301422119140625, "global_step": 355421, "epoch": 4282} {"train_loss": -26.285573959350586, "global_step": 355422, "epoch": 4282} {"train_loss": -26.061477661132812, "global_step": 355423, "epoch": 4282} {"train_loss": -25.920001983642578, "global_step": 355424, "epoch": 4282} {"train_loss": -25.7608699798584, "global_step": 355425, "epoch": 4282} {"train_loss": -25.974853515625, "global_step": 355426, "epoch": 4282} {"train_loss": -26.035755157470703, "global_step": 355427, "epoch": 4282} {"train_loss": -25.751331329345703, "global_step": 355428, "epoch": 4282} {"train_loss": -26.27099609375, "global_step": 355429, "epoch": 4282} {"train_loss": -26.3331356048584, "global_step": 355430, "epoch": 4282} {"train_loss": -25.783939361572266, "global_step": 355431, "epoch": 4282} {"train_loss": -25.8850040435791, "global_step": 355432, "epoch": 4282} {"train_loss": -26.398725509643555, "global_step": 355433, "epoch": 4282} {"train_loss": -25.945058822631836, "global_step": 355434, "epoch": 4282} {"train_loss": -26.232141494750977, "global_step": 355435, "epoch": 4282} {"train_loss": -25.944665908813477, "global_step": 355436, "epoch": 4282} {"train_loss": -26.4553279876709, "global_step": 355437, "epoch": 4282} {"train_loss": -26.333120346069336, "global_step": 355438, "epoch": 4282} {"train_loss": -26.21990394592285, "global_step": 355439, "epoch": 4282} {"train_loss": -26.09613037109375, "global_step": 355440, "epoch": 4282} {"train_loss": -26.4635009765625, "global_step": 355441, "epoch": 4282} {"train_loss": -25.96347999572754, "global_step": 355442, "epoch": 4282} {"train_loss": -26.162153244018555, "global_step": 355443, "epoch": 4282} {"train_loss": -26.461591720581055, "global_step": 355444, "epoch": 4282} {"train_loss": -26.45206069946289, "global_step": 355445, "epoch": 4282} {"train_loss": -26.42158317565918, "global_step": 355446, "epoch": 4282} {"train_loss": -26.2127742767334, "global_step": 355447, "epoch": 4282} {"train_loss": -26.31846046447754, "global_step": 355448, "epoch": 4282} {"train_loss": -25.801416397094727, "global_step": 355449, "epoch": 4282} {"train_loss": -26.288415908813477, "global_step": 355450, "epoch": 4282} {"train_loss": -25.792688369750977, "global_step": 355451, "epoch": 4282} {"train_loss": -26.139219284057617, "global_step": 355452, "epoch": 4282} {"train_loss": -26.226016998291016, "global_step": 355453, "epoch": 4282} {"train_loss": -25.956029891967773, "global_step": 355454, "epoch": 4282} {"train_loss": -26.187097549438477, "global_step": 355455, "epoch": 4282} {"train_loss": -26.060394287109375, "global_step": 355456, "epoch": 4282} {"train_loss": -25.91474723815918, "global_step": 355457, "epoch": 4282} {"train_loss": -26.23783302307129, "global_step": 355458, "epoch": 4282} {"train_loss": -25.929443359375, "global_step": 355459, "epoch": 4282} {"train_loss": -26.241559982299805, "global_step": 355460, "epoch": 4282} {"train_loss": -26.3786678314209, "global_step": 355461, "epoch": 4282} {"train_loss": -26.482879638671875, "global_step": 355462, "epoch": 4282} {"train_loss": -26.212873458862305, "global_step": 355463, "epoch": 4282} {"train_loss": -26.46242332458496, "global_step": 355464, "epoch": 4282} {"train_loss": -26.189786911010742, "global_step": 355465, "epoch": 4282} {"train_loss": -26.39827537536621, "global_step": 355466, "epoch": 4282} {"train_loss": -26.114013671875, "global_step": 355467, "epoch": 4282} {"train_loss": -26.249374389648438, "global_step": 355468, "epoch": 4282} {"train_loss": -25.67036247253418, "global_step": 355469, "epoch": 4282} {"train_loss": -26.119037628173828, "global_step": 355470, "epoch": 4282} {"train_loss": -26.222131729125977, "global_step": 355471, "epoch": 4282} {"train_loss": -26.178369522094727, "global_step": 355472, "epoch": 4282} {"train_loss": -26.302173614501953, "global_step": 355473, "epoch": 4282} {"train_loss": -26.077808380126953, "global_step": 355474, "epoch": 4282} {"train_loss": -26.43837547302246, "global_step": 355475, "epoch": 4282} {"train_loss": -26.294660568237305, "global_step": 355476, "epoch": 4282} {"train_loss": -26.38258934020996, "global_step": 355477, "epoch": 4282} {"train_loss": -26.26519775390625, "global_step": 355478, "epoch": 4282} {"train_loss": -26.378555297851562, "global_step": 355479, "epoch": 4282} {"train_loss": -25.967639923095703, "global_step": 355480, "epoch": 4282} {"train_loss": -26.37127113342285, "global_step": 355481, "epoch": 4282} {"train_loss": -26.269088745117188, "global_step": 355482, "epoch": 4282} {"train_loss": -26.1817569732666, "global_step": 355483, "epoch": 4282} {"train_loss": -26.30909538269043, "global_step": 355484, "epoch": 4282} {"train_loss": -26.27937126159668, "global_step": 355485, "epoch": 4282} {"train_loss": -26.469684600830078, "global_step": 355486, "epoch": 4282} {"train_loss": -26.42938232421875, "global_step": 355487, "epoch": 4282} {"train_loss": -26.135814138205653, "global_step": 355488, "epoch": 4282, "val_loss": 6694538.5} {"train_loss": -24.195077896118164, "global_step": 355489, "epoch": 4283} {"train_loss": -23.81890869140625, "global_step": 355490, "epoch": 4283} {"train_loss": -25.27430534362793, "global_step": 355491, "epoch": 4283} {"train_loss": -24.652423858642578, "global_step": 355492, "epoch": 4283} {"train_loss": -25.675140380859375, "global_step": 355493, "epoch": 4283} {"train_loss": -25.766096115112305, "global_step": 355494, "epoch": 4283} {"train_loss": -25.293691635131836, "global_step": 355495, "epoch": 4283} {"train_loss": -25.708606719970703, "global_step": 355496, "epoch": 4283} {"train_loss": -25.315963745117188, "global_step": 355497, "epoch": 4283} {"train_loss": -25.485952377319336, "global_step": 355498, "epoch": 4283} {"train_loss": -25.156688690185547, "global_step": 355499, "epoch": 4283} {"train_loss": -25.43906593322754, "global_step": 355500, "epoch": 4283} {"train_loss": -25.321056365966797, "global_step": 355501, "epoch": 4283} {"train_loss": -25.325580596923828, "global_step": 355502, "epoch": 4283} {"train_loss": -25.688079833984375, "global_step": 355503, "epoch": 4283} {"train_loss": -25.794113159179688, "global_step": 355504, "epoch": 4283} {"train_loss": -25.56522560119629, "global_step": 355505, "epoch": 4283} {"train_loss": -25.635833740234375, "global_step": 355506, "epoch": 4283} {"train_loss": -25.589191436767578, "global_step": 355507, "epoch": 4283} {"train_loss": -25.336837768554688, "global_step": 355508, "epoch": 4283} {"train_loss": -25.69208335876465, "global_step": 355509, "epoch": 4283} {"train_loss": -25.78009605407715, "global_step": 355510, "epoch": 4283} {"train_loss": -25.76409912109375, "global_step": 355511, "epoch": 4283} {"train_loss": -25.883502960205078, "global_step": 355512, "epoch": 4283} {"train_loss": -25.809803009033203, "global_step": 355513, "epoch": 4283} {"train_loss": -25.395009994506836, "global_step": 355514, "epoch": 4283} {"train_loss": -25.926715850830078, "global_step": 355515, "epoch": 4283} {"train_loss": -26.030670166015625, "global_step": 355516, "epoch": 4283} {"train_loss": -25.80230712890625, "global_step": 355517, "epoch": 4283} {"train_loss": -25.93414878845215, "global_step": 355518, "epoch": 4283} {"train_loss": -25.839731216430664, "global_step": 355519, "epoch": 4283} {"train_loss": -26.229389190673828, "global_step": 355520, "epoch": 4283} {"train_loss": -25.544391632080078, "global_step": 355521, "epoch": 4283} {"train_loss": -26.096851348876953, "global_step": 355522, "epoch": 4283} {"train_loss": -25.793420791625977, "global_step": 355523, "epoch": 4283} {"train_loss": -25.8695011138916, "global_step": 355524, "epoch": 4283} {"train_loss": -26.07330894470215, "global_step": 355525, "epoch": 4283} {"train_loss": -26.194005966186523, "global_step": 355526, "epoch": 4283} {"train_loss": -25.987146377563477, "global_step": 355527, "epoch": 4283} {"train_loss": -26.355127334594727, "global_step": 355528, "epoch": 4283} {"train_loss": -26.171789169311523, "global_step": 355529, "epoch": 4283} {"train_loss": -25.909894943237305, "global_step": 355530, "epoch": 4283} {"train_loss": -26.739179611206055, "global_step": 355531, "epoch": 4283} {"train_loss": -26.239904403686523, "global_step": 355532, "epoch": 4283} {"train_loss": -26.147626876831055, "global_step": 355533, "epoch": 4283} {"train_loss": -26.305927276611328, "global_step": 355534, "epoch": 4283} {"train_loss": -26.55109214782715, "global_step": 355535, "epoch": 4283} {"train_loss": -26.154987335205078, "global_step": 355536, "epoch": 4283} {"train_loss": -26.416074752807617, "global_step": 355537, "epoch": 4283} {"train_loss": -26.633773803710938, "global_step": 355538, "epoch": 4283} {"train_loss": -26.42542839050293, "global_step": 355539, "epoch": 4283} {"train_loss": -26.30792236328125, "global_step": 355540, "epoch": 4283} {"train_loss": -26.39679527282715, "global_step": 355541, "epoch": 4283} {"train_loss": -26.506473541259766, "global_step": 355542, "epoch": 4283} {"train_loss": -26.576908111572266, "global_step": 355543, "epoch": 4283} {"train_loss": -25.91517448425293, "global_step": 355544, "epoch": 4283} {"train_loss": -25.78230094909668, "global_step": 355545, "epoch": 4283} {"train_loss": -26.24138832092285, "global_step": 355546, "epoch": 4283} {"train_loss": -26.316980361938477, "global_step": 355547, "epoch": 4283} {"train_loss": -26.431650161743164, "global_step": 355548, "epoch": 4283} {"train_loss": -26.269275665283203, "global_step": 355549, "epoch": 4283} {"train_loss": -26.505374908447266, "global_step": 355550, "epoch": 4283} {"train_loss": -25.92994499206543, "global_step": 355551, "epoch": 4283} {"train_loss": -26.19903564453125, "global_step": 355552, "epoch": 4283} {"train_loss": -26.026037216186523, "global_step": 355553, "epoch": 4283} {"train_loss": -26.095138549804688, "global_step": 355554, "epoch": 4283} {"train_loss": -25.97216796875, "global_step": 355555, "epoch": 4283} {"train_loss": -25.904367446899414, "global_step": 355556, "epoch": 4283} {"train_loss": -25.906179428100586, "global_step": 355557, "epoch": 4283} {"train_loss": -26.079816818237305, "global_step": 355558, "epoch": 4283} {"train_loss": -26.212757110595703, "global_step": 355559, "epoch": 4283} {"train_loss": -26.2911434173584, "global_step": 355560, "epoch": 4283} {"train_loss": -25.732778549194336, "global_step": 355561, "epoch": 4283} {"train_loss": -26.23005485534668, "global_step": 355562, "epoch": 4283} {"train_loss": -26.178152084350586, "global_step": 355563, "epoch": 4283} {"train_loss": -26.189411163330078, "global_step": 355564, "epoch": 4283} {"train_loss": -26.162933349609375, "global_step": 355565, "epoch": 4283} {"train_loss": -26.47114372253418, "global_step": 355566, "epoch": 4283} {"train_loss": -26.06300163269043, "global_step": 355567, "epoch": 4283} {"train_loss": -26.284503936767578, "global_step": 355568, "epoch": 4283} {"train_loss": -25.75642204284668, "global_step": 355569, "epoch": 4283} {"train_loss": -26.195438385009766, "global_step": 355570, "epoch": 4283} {"train_loss": -25.92298829411886, "global_step": 355571, "epoch": 4283, "val_loss": 6618171.5} {"train_loss": -25.622007369995117, "global_step": 355572, "epoch": 4284} {"train_loss": -25.570343017578125, "global_step": 355573, "epoch": 4284} {"train_loss": -25.656972885131836, "global_step": 355574, "epoch": 4284} {"train_loss": -25.7630558013916, "global_step": 355575, "epoch": 4284} {"train_loss": -25.62989616394043, "global_step": 355576, "epoch": 4284} {"train_loss": -24.938175201416016, "global_step": 355577, "epoch": 4284} {"train_loss": -25.307153701782227, "global_step": 355578, "epoch": 4284} {"train_loss": -25.765172958374023, "global_step": 355579, "epoch": 4284} {"train_loss": -26.033884048461914, "global_step": 355580, "epoch": 4284} {"train_loss": -25.665897369384766, "global_step": 355581, "epoch": 4284} {"train_loss": -25.73843765258789, "global_step": 355582, "epoch": 4284} {"train_loss": -25.673603057861328, "global_step": 355583, "epoch": 4284} {"train_loss": -25.779571533203125, "global_step": 355584, "epoch": 4284} {"train_loss": -25.712125778198242, "global_step": 355585, "epoch": 4284} {"train_loss": -25.747385025024414, "global_step": 355586, "epoch": 4284} {"train_loss": -25.771503448486328, "global_step": 355587, "epoch": 4284} {"train_loss": -25.448278427124023, "global_step": 355588, "epoch": 4284} {"train_loss": -26.167407989501953, "global_step": 355589, "epoch": 4284} {"train_loss": -25.8557186126709, "global_step": 355590, "epoch": 4284} {"train_loss": -25.731510162353516, "global_step": 355591, "epoch": 4284} {"train_loss": -25.765710830688477, "global_step": 355592, "epoch": 4284} {"train_loss": -26.364425659179688, "global_step": 355593, "epoch": 4284} {"train_loss": -26.122699737548828, "global_step": 355594, "epoch": 4284} {"train_loss": -25.914077758789062, "global_step": 355595, "epoch": 4284} {"train_loss": -26.127166748046875, "global_step": 355596, "epoch": 4284} {"train_loss": -25.840988159179688, "global_step": 355597, "epoch": 4284} {"train_loss": -26.053552627563477, "global_step": 355598, "epoch": 4284} {"train_loss": -26.056135177612305, "global_step": 355599, "epoch": 4284} {"train_loss": -26.105728149414062, "global_step": 355600, "epoch": 4284} {"train_loss": -26.100143432617188, "global_step": 355601, "epoch": 4284} {"train_loss": -26.230194091796875, "global_step": 355602, "epoch": 4284} {"train_loss": -26.385025024414062, "global_step": 355603, "epoch": 4284} {"train_loss": -26.418058395385742, "global_step": 355604, "epoch": 4284} {"train_loss": -26.12990379333496, "global_step": 355605, "epoch": 4284} {"train_loss": -26.482702255249023, "global_step": 355606, "epoch": 4284} {"train_loss": -26.13348960876465, "global_step": 355607, "epoch": 4284} {"train_loss": -26.368772506713867, "global_step": 355608, "epoch": 4284} {"train_loss": -26.47237205505371, "global_step": 355609, "epoch": 4284} {"train_loss": -26.204381942749023, "global_step": 355610, "epoch": 4284} {"train_loss": -26.227224349975586, "global_step": 355611, "epoch": 4284} {"train_loss": -26.588132858276367, "global_step": 355612, "epoch": 4284} {"train_loss": -26.49854850769043, "global_step": 355613, "epoch": 4284} {"train_loss": -26.599044799804688, "global_step": 355614, "epoch": 4284} {"train_loss": -26.306650161743164, "global_step": 355615, "epoch": 4284} {"train_loss": -26.216815948486328, "global_step": 355616, "epoch": 4284} {"train_loss": -26.14996337890625, "global_step": 355617, "epoch": 4284} {"train_loss": -26.353168487548828, "global_step": 355618, "epoch": 4284} {"train_loss": -26.34388542175293, "global_step": 355619, "epoch": 4284} {"train_loss": -26.156208038330078, "global_step": 355620, "epoch": 4284} {"train_loss": -26.426929473876953, "global_step": 355621, "epoch": 4284} {"train_loss": -25.99213218688965, "global_step": 355622, "epoch": 4284} {"train_loss": -26.12095069885254, "global_step": 355623, "epoch": 4284} {"train_loss": -26.38067054748535, "global_step": 355624, "epoch": 4284} {"train_loss": -25.904027938842773, "global_step": 355625, "epoch": 4284} {"train_loss": -25.742456436157227, "global_step": 355626, "epoch": 4284} {"train_loss": -25.522977828979492, "global_step": 355627, "epoch": 4284} {"train_loss": -25.990949630737305, "global_step": 355628, "epoch": 4284} {"train_loss": -26.393829345703125, "global_step": 355629, "epoch": 4284} {"train_loss": -26.13922119140625, "global_step": 355630, "epoch": 4284} {"train_loss": -26.309452056884766, "global_step": 355631, "epoch": 4284} {"train_loss": -26.1458797454834, "global_step": 355632, "epoch": 4284} {"train_loss": -25.760095596313477, "global_step": 355633, "epoch": 4284} {"train_loss": -26.177976608276367, "global_step": 355634, "epoch": 4284} {"train_loss": -26.02020263671875, "global_step": 355635, "epoch": 4284} {"train_loss": -26.052658081054688, "global_step": 355636, "epoch": 4284} {"train_loss": -26.399877548217773, "global_step": 355637, "epoch": 4284} {"train_loss": -26.34983253479004, "global_step": 355638, "epoch": 4284} {"train_loss": -26.436063766479492, "global_step": 355639, "epoch": 4284} {"train_loss": -26.301742553710938, "global_step": 355640, "epoch": 4284} {"train_loss": -26.375158309936523, "global_step": 355641, "epoch": 4284} {"train_loss": -26.156293869018555, "global_step": 355642, "epoch": 4284} {"train_loss": -26.3062744140625, "global_step": 355643, "epoch": 4284} {"train_loss": -26.395893096923828, "global_step": 355644, "epoch": 4284} {"train_loss": -26.198474884033203, "global_step": 355645, "epoch": 4284} {"train_loss": -26.343225479125977, "global_step": 355646, "epoch": 4284} {"train_loss": -26.2863826751709, "global_step": 355647, "epoch": 4284} {"train_loss": -26.715930938720703, "global_step": 355648, "epoch": 4284} {"train_loss": -26.283594131469727, "global_step": 355649, "epoch": 4284} {"train_loss": -26.3067569732666, "global_step": 355650, "epoch": 4284} {"train_loss": -26.284727096557617, "global_step": 355651, "epoch": 4284} {"train_loss": -26.511890411376953, "global_step": 355652, "epoch": 4284} {"train_loss": -26.210403442382812, "global_step": 355653, "epoch": 4284} {"train_loss": -26.112849201064513, "global_step": 355654, "epoch": 4284, "val_loss": 6638221.0} {"train_loss": -25.65262794494629, "global_step": 355655, "epoch": 4285} {"train_loss": -26.052221298217773, "global_step": 355656, "epoch": 4285} {"train_loss": -25.698434829711914, "global_step": 355657, "epoch": 4285} {"train_loss": -25.847009658813477, "global_step": 355658, "epoch": 4285} {"train_loss": -26.082122802734375, "global_step": 355659, "epoch": 4285} {"train_loss": -25.905780792236328, "global_step": 355660, "epoch": 4285} {"train_loss": -26.32118034362793, "global_step": 355661, "epoch": 4285} {"train_loss": -26.364089965820312, "global_step": 355662, "epoch": 4285} {"train_loss": -26.2030029296875, "global_step": 355663, "epoch": 4285} {"train_loss": -25.982696533203125, "global_step": 355664, "epoch": 4285} {"train_loss": -25.92030143737793, "global_step": 355665, "epoch": 4285} {"train_loss": -25.62347412109375, "global_step": 355666, "epoch": 4285} {"train_loss": -26.229345321655273, "global_step": 355667, "epoch": 4285} {"train_loss": -26.089685440063477, "global_step": 355668, "epoch": 4285} {"train_loss": -26.147912979125977, "global_step": 355669, "epoch": 4285} {"train_loss": -26.12114906311035, "global_step": 355670, "epoch": 4285} {"train_loss": -26.1704158782959, "global_step": 355671, "epoch": 4285} {"train_loss": -26.112470626831055, "global_step": 355672, "epoch": 4285} {"train_loss": -26.397314071655273, "global_step": 355673, "epoch": 4285} {"train_loss": -26.04926872253418, "global_step": 355674, "epoch": 4285} {"train_loss": -26.130781173706055, "global_step": 355675, "epoch": 4285} {"train_loss": -26.16546058654785, "global_step": 355676, "epoch": 4285} {"train_loss": -26.074289321899414, "global_step": 355677, "epoch": 4285} {"train_loss": -26.60153579711914, "global_step": 355678, "epoch": 4285} {"train_loss": -25.704730987548828, "global_step": 355679, "epoch": 4285} {"train_loss": -26.291440963745117, "global_step": 355680, "epoch": 4285} {"train_loss": -26.199499130249023, "global_step": 355681, "epoch": 4285} {"train_loss": -26.545368194580078, "global_step": 355682, "epoch": 4285} {"train_loss": -26.445173263549805, "global_step": 355683, "epoch": 4285} {"train_loss": -26.07305908203125, "global_step": 355684, "epoch": 4285} {"train_loss": -26.2139892578125, "global_step": 355685, "epoch": 4285} {"train_loss": -26.15299415588379, "global_step": 355686, "epoch": 4285} {"train_loss": -25.696674346923828, "global_step": 355687, "epoch": 4285} {"train_loss": -26.432327270507812, "global_step": 355688, "epoch": 4285} {"train_loss": -26.152206420898438, "global_step": 355689, "epoch": 4285} {"train_loss": -26.084075927734375, "global_step": 355690, "epoch": 4285} {"train_loss": -25.493520736694336, "global_step": 355691, "epoch": 4285} {"train_loss": -26.481229782104492, "global_step": 355692, "epoch": 4285} {"train_loss": -26.306013107299805, "global_step": 355693, "epoch": 4285} {"train_loss": -25.874555587768555, "global_step": 355694, "epoch": 4285} {"train_loss": -26.11368751525879, "global_step": 355695, "epoch": 4285} {"train_loss": -25.841663360595703, "global_step": 355696, "epoch": 4285} {"train_loss": -25.901609420776367, "global_step": 355697, "epoch": 4285} {"train_loss": -25.93878746032715, "global_step": 355698, "epoch": 4285} {"train_loss": -26.243194580078125, "global_step": 355699, "epoch": 4285} {"train_loss": -26.016687393188477, "global_step": 355700, "epoch": 4285} {"train_loss": -26.294116973876953, "global_step": 355701, "epoch": 4285} {"train_loss": -25.706207275390625, "global_step": 355702, "epoch": 4285} {"train_loss": -26.46588134765625, "global_step": 355703, "epoch": 4285} {"train_loss": -26.180124282836914, "global_step": 355704, "epoch": 4285} {"train_loss": -26.12163734436035, "global_step": 355705, "epoch": 4285} {"train_loss": -26.129287719726562, "global_step": 355706, "epoch": 4285} {"train_loss": -26.022541046142578, "global_step": 355707, "epoch": 4285} {"train_loss": -26.553579330444336, "global_step": 355708, "epoch": 4285} {"train_loss": -26.44581413269043, "global_step": 355709, "epoch": 4285} {"train_loss": -25.96817398071289, "global_step": 355710, "epoch": 4285} {"train_loss": -25.768789291381836, "global_step": 355711, "epoch": 4285} {"train_loss": -26.291940689086914, "global_step": 355712, "epoch": 4285} {"train_loss": -26.238813400268555, "global_step": 355713, "epoch": 4285} {"train_loss": -26.446704864501953, "global_step": 355714, "epoch": 4285} {"train_loss": -26.119049072265625, "global_step": 355715, "epoch": 4285} {"train_loss": -26.14124870300293, "global_step": 355716, "epoch": 4285} {"train_loss": -26.306976318359375, "global_step": 355717, "epoch": 4285} {"train_loss": -26.5563907623291, "global_step": 355718, "epoch": 4285} {"train_loss": -26.068622589111328, "global_step": 355719, "epoch": 4285} {"train_loss": -25.95364761352539, "global_step": 355720, "epoch": 4285} {"train_loss": -25.9517765045166, "global_step": 355721, "epoch": 4285} {"train_loss": -26.3324031829834, "global_step": 355722, "epoch": 4285} {"train_loss": -26.201440811157227, "global_step": 355723, "epoch": 4285} {"train_loss": -26.391590118408203, "global_step": 355724, "epoch": 4285} {"train_loss": -26.355833053588867, "global_step": 355725, "epoch": 4285} {"train_loss": -26.421924591064453, "global_step": 355726, "epoch": 4285} {"train_loss": -26.201711654663086, "global_step": 355727, "epoch": 4285} {"train_loss": -26.303110122680664, "global_step": 355728, "epoch": 4285} {"train_loss": -26.282073974609375, "global_step": 355729, "epoch": 4285} {"train_loss": -26.643285751342773, "global_step": 355730, "epoch": 4285} {"train_loss": -26.052570343017578, "global_step": 355731, "epoch": 4285} {"train_loss": -26.40511131286621, "global_step": 355732, "epoch": 4285} {"train_loss": -25.67974281311035, "global_step": 355733, "epoch": 4285} {"train_loss": -26.371601104736328, "global_step": 355734, "epoch": 4285} {"train_loss": -25.943069458007812, "global_step": 355735, "epoch": 4285} {"train_loss": -26.196853637695312, "global_step": 355736, "epoch": 4285} {"train_loss": -26.147721049297285, "global_step": 355737, "epoch": 4285, "val_loss": 6640108.0} {"train_loss": -24.55215072631836, "global_step": 355738, "epoch": 4286} {"train_loss": -24.43222999572754, "global_step": 355739, "epoch": 4286} {"train_loss": -24.937097549438477, "global_step": 355740, "epoch": 4286} {"train_loss": -24.307315826416016, "global_step": 355741, "epoch": 4286} {"train_loss": -24.97138023376465, "global_step": 355742, "epoch": 4286} {"train_loss": -24.912450790405273, "global_step": 355743, "epoch": 4286} {"train_loss": -24.79828453063965, "global_step": 355744, "epoch": 4286} {"train_loss": -24.981882095336914, "global_step": 355745, "epoch": 4286} {"train_loss": -25.228113174438477, "global_step": 355746, "epoch": 4286} {"train_loss": -25.12727928161621, "global_step": 355747, "epoch": 4286} {"train_loss": -25.444839477539062, "global_step": 355748, "epoch": 4286} {"train_loss": -25.34786033630371, "global_step": 355749, "epoch": 4286} {"train_loss": -25.320592880249023, "global_step": 355750, "epoch": 4286} {"train_loss": -25.590726852416992, "global_step": 355751, "epoch": 4286} {"train_loss": -25.26279067993164, "global_step": 355752, "epoch": 4286} {"train_loss": -25.327085494995117, "global_step": 355753, "epoch": 4286} {"train_loss": -25.4958553314209, "global_step": 355754, "epoch": 4286} {"train_loss": -25.308340072631836, "global_step": 355755, "epoch": 4286} {"train_loss": -25.693805694580078, "global_step": 355756, "epoch": 4286} {"train_loss": -25.35157012939453, "global_step": 355757, "epoch": 4286} {"train_loss": -25.474506378173828, "global_step": 355758, "epoch": 4286} {"train_loss": -25.83349609375, "global_step": 355759, "epoch": 4286} {"train_loss": -25.592815399169922, "global_step": 355760, "epoch": 4286} {"train_loss": -25.54646873474121, "global_step": 355761, "epoch": 4286} {"train_loss": -25.561765670776367, "global_step": 355762, "epoch": 4286} {"train_loss": -25.95147132873535, "global_step": 355763, "epoch": 4286} {"train_loss": -25.62848472595215, "global_step": 355764, "epoch": 4286} {"train_loss": -25.700403213500977, "global_step": 355765, "epoch": 4286} {"train_loss": -25.6048641204834, "global_step": 355766, "epoch": 4286} {"train_loss": -25.873615264892578, "global_step": 355767, "epoch": 4286} {"train_loss": -25.959089279174805, "global_step": 355768, "epoch": 4286} {"train_loss": -26.296335220336914, "global_step": 355769, "epoch": 4286} {"train_loss": -26.302276611328125, "global_step": 355770, "epoch": 4286} {"train_loss": -26.018335342407227, "global_step": 355771, "epoch": 4286} {"train_loss": -26.127588272094727, "global_step": 355772, "epoch": 4286} {"train_loss": -25.845075607299805, "global_step": 355773, "epoch": 4286} {"train_loss": -26.149555206298828, "global_step": 355774, "epoch": 4286} {"train_loss": -26.11787223815918, "global_step": 355775, "epoch": 4286} {"train_loss": -26.301986694335938, "global_step": 355776, "epoch": 4286} {"train_loss": -26.166135787963867, "global_step": 355777, "epoch": 4286} {"train_loss": -26.12269401550293, "global_step": 355778, "epoch": 4286} {"train_loss": -26.356115341186523, "global_step": 355779, "epoch": 4286} {"train_loss": -26.240217208862305, "global_step": 355780, "epoch": 4286} {"train_loss": -26.134857177734375, "global_step": 355781, "epoch": 4286} {"train_loss": -25.957311630249023, "global_step": 355782, "epoch": 4286} {"train_loss": -26.256162643432617, "global_step": 355783, "epoch": 4286} {"train_loss": -26.46937370300293, "global_step": 355784, "epoch": 4286} {"train_loss": -25.98737907409668, "global_step": 355785, "epoch": 4286} {"train_loss": -26.52247428894043, "global_step": 355786, "epoch": 4286} {"train_loss": -26.364337921142578, "global_step": 355787, "epoch": 4286} {"train_loss": -26.16144371032715, "global_step": 355788, "epoch": 4286} {"train_loss": -26.07200050354004, "global_step": 355789, "epoch": 4286} {"train_loss": -26.20621681213379, "global_step": 355790, "epoch": 4286} {"train_loss": -26.173492431640625, "global_step": 355791, "epoch": 4286} {"train_loss": -26.165021896362305, "global_step": 355792, "epoch": 4286} {"train_loss": -26.181493759155273, "global_step": 355793, "epoch": 4286} {"train_loss": -26.427295684814453, "global_step": 355794, "epoch": 4286} {"train_loss": -26.106830596923828, "global_step": 355795, "epoch": 4286} {"train_loss": -26.344650268554688, "global_step": 355796, "epoch": 4286} {"train_loss": -26.3317928314209, "global_step": 355797, "epoch": 4286} {"train_loss": -26.01047706604004, "global_step": 355798, "epoch": 4286} {"train_loss": -26.33696937561035, "global_step": 355799, "epoch": 4286} {"train_loss": -25.91156005859375, "global_step": 355800, "epoch": 4286} {"train_loss": -26.227705001831055, "global_step": 355801, "epoch": 4286} {"train_loss": -26.248565673828125, "global_step": 355802, "epoch": 4286} {"train_loss": -26.094350814819336, "global_step": 355803, "epoch": 4286} {"train_loss": -26.2601261138916, "global_step": 355804, "epoch": 4286} {"train_loss": -26.397253036499023, "global_step": 355805, "epoch": 4286} {"train_loss": -26.416234970092773, "global_step": 355806, "epoch": 4286} {"train_loss": -26.267324447631836, "global_step": 355807, "epoch": 4286} {"train_loss": -25.986068725585938, "global_step": 355808, "epoch": 4286} {"train_loss": -26.000730514526367, "global_step": 355809, "epoch": 4286} {"train_loss": -26.296173095703125, "global_step": 355810, "epoch": 4286} {"train_loss": -26.0048828125, "global_step": 355811, "epoch": 4286} {"train_loss": -25.73883056640625, "global_step": 355812, "epoch": 4286} {"train_loss": -25.838394165039062, "global_step": 355813, "epoch": 4286} {"train_loss": -26.521284103393555, "global_step": 355814, "epoch": 4286} {"train_loss": -26.105804443359375, "global_step": 355815, "epoch": 4286} {"train_loss": -26.103174209594727, "global_step": 355816, "epoch": 4286} {"train_loss": -26.320226669311523, "global_step": 355817, "epoch": 4286} {"train_loss": -26.371021270751953, "global_step": 355818, "epoch": 4286} {"train_loss": -25.957935333251953, "global_step": 355819, "epoch": 4286} {"train_loss": -25.873060732002717, "global_step": 355820, "epoch": 4286, "val_loss": 6700716.0} {"train_loss": -25.1910457611084, "global_step": 355821, "epoch": 4287} {"train_loss": -25.29962730407715, "global_step": 355822, "epoch": 4287} {"train_loss": -25.234312057495117, "global_step": 355823, "epoch": 4287} {"train_loss": -25.273725509643555, "global_step": 355824, "epoch": 4287} {"train_loss": -25.841360092163086, "global_step": 355825, "epoch": 4287} {"train_loss": -25.857040405273438, "global_step": 355826, "epoch": 4287} {"train_loss": -25.973432540893555, "global_step": 355827, "epoch": 4287} {"train_loss": -25.88685417175293, "global_step": 355828, "epoch": 4287} {"train_loss": -26.267765045166016, "global_step": 355829, "epoch": 4287} {"train_loss": -25.90907096862793, "global_step": 355830, "epoch": 4287} {"train_loss": -25.78399085998535, "global_step": 355831, "epoch": 4287} {"train_loss": -25.776166915893555, "global_step": 355832, "epoch": 4287} {"train_loss": -26.00678062438965, "global_step": 355833, "epoch": 4287} {"train_loss": -26.019668579101562, "global_step": 355834, "epoch": 4287} {"train_loss": -25.991851806640625, "global_step": 355835, "epoch": 4287} {"train_loss": -26.0241641998291, "global_step": 355836, "epoch": 4287} {"train_loss": -26.008588790893555, "global_step": 355837, "epoch": 4287} {"train_loss": -25.809616088867188, "global_step": 355838, "epoch": 4287} {"train_loss": -25.98736572265625, "global_step": 355839, "epoch": 4287} {"train_loss": -25.637451171875, "global_step": 355840, "epoch": 4287} {"train_loss": -26.3234806060791, "global_step": 355841, "epoch": 4287} {"train_loss": -26.251501083374023, "global_step": 355842, "epoch": 4287} {"train_loss": -26.089859008789062, "global_step": 355843, "epoch": 4287} {"train_loss": -26.05841064453125, "global_step": 355844, "epoch": 4287} {"train_loss": -25.948095321655273, "global_step": 355845, "epoch": 4287} {"train_loss": -26.346288681030273, "global_step": 355846, "epoch": 4287} {"train_loss": -26.1252498626709, "global_step": 355847, "epoch": 4287} {"train_loss": -26.0323543548584, "global_step": 355848, "epoch": 4287} {"train_loss": -26.42487907409668, "global_step": 355849, "epoch": 4287} {"train_loss": -26.013349533081055, "global_step": 355850, "epoch": 4287} {"train_loss": -25.961750030517578, "global_step": 355851, "epoch": 4287} {"train_loss": -26.47100257873535, "global_step": 355852, "epoch": 4287} {"train_loss": -26.367910385131836, "global_step": 355853, "epoch": 4287} {"train_loss": -25.939176559448242, "global_step": 355854, "epoch": 4287} {"train_loss": -25.6202449798584, "global_step": 355855, "epoch": 4287} {"train_loss": -26.376745223999023, "global_step": 355856, "epoch": 4287} {"train_loss": -26.35040855407715, "global_step": 355857, "epoch": 4287} {"train_loss": -26.19318962097168, "global_step": 355858, "epoch": 4287} {"train_loss": -26.179288864135742, "global_step": 355859, "epoch": 4287} {"train_loss": -26.584802627563477, "global_step": 355860, "epoch": 4287} {"train_loss": -26.24152183532715, "global_step": 355861, "epoch": 4287} {"train_loss": -26.26887321472168, "global_step": 355862, "epoch": 4287} {"train_loss": -26.106698989868164, "global_step": 355863, "epoch": 4287} {"train_loss": -26.256916046142578, "global_step": 355864, "epoch": 4287} {"train_loss": -26.260089874267578, "global_step": 355865, "epoch": 4287} {"train_loss": -26.21543312072754, "global_step": 355866, "epoch": 4287} {"train_loss": -26.423526763916016, "global_step": 355867, "epoch": 4287} {"train_loss": -26.374814987182617, "global_step": 355868, "epoch": 4287} {"train_loss": -26.0819149017334, "global_step": 355869, "epoch": 4287} {"train_loss": -26.582080841064453, "global_step": 355870, "epoch": 4287} {"train_loss": -26.226276397705078, "global_step": 355871, "epoch": 4287} {"train_loss": -26.511621475219727, "global_step": 355872, "epoch": 4287} {"train_loss": -26.650970458984375, "global_step": 355873, "epoch": 4287} {"train_loss": -26.455907821655273, "global_step": 355874, "epoch": 4287} {"train_loss": -26.014301300048828, "global_step": 355875, "epoch": 4287} {"train_loss": -26.287647247314453, "global_step": 355876, "epoch": 4287} {"train_loss": -26.200849533081055, "global_step": 355877, "epoch": 4287} {"train_loss": -26.006072998046875, "global_step": 355878, "epoch": 4287} {"train_loss": -26.4162654876709, "global_step": 355879, "epoch": 4287} {"train_loss": -26.237091064453125, "global_step": 355880, "epoch": 4287} {"train_loss": -26.3685245513916, "global_step": 355881, "epoch": 4287} {"train_loss": -26.45908546447754, "global_step": 355882, "epoch": 4287} {"train_loss": -26.724279403686523, "global_step": 355883, "epoch": 4287} {"train_loss": -26.3934326171875, "global_step": 355884, "epoch": 4287} {"train_loss": -26.159082412719727, "global_step": 355885, "epoch": 4287} {"train_loss": -26.2606258392334, "global_step": 355886, "epoch": 4287} {"train_loss": -26.448993682861328, "global_step": 355887, "epoch": 4287} {"train_loss": -26.193395614624023, "global_step": 355888, "epoch": 4287} {"train_loss": -26.520254135131836, "global_step": 355889, "epoch": 4287} {"train_loss": -26.20560073852539, "global_step": 355890, "epoch": 4287} {"train_loss": -26.508207321166992, "global_step": 355891, "epoch": 4287} {"train_loss": -26.294849395751953, "global_step": 355892, "epoch": 4287} {"train_loss": -26.434995651245117, "global_step": 355893, "epoch": 4287} {"train_loss": -25.92030143737793, "global_step": 355894, "epoch": 4287} {"train_loss": -26.52801513671875, "global_step": 355895, "epoch": 4287} {"train_loss": -26.28045654296875, "global_step": 355896, "epoch": 4287} {"train_loss": -26.476003646850586, "global_step": 355897, "epoch": 4287} {"train_loss": -26.200658798217773, "global_step": 355898, "epoch": 4287} {"train_loss": -25.974124908447266, "global_step": 355899, "epoch": 4287} {"train_loss": -26.255659103393555, "global_step": 355900, "epoch": 4287} {"train_loss": -26.1216983795166, "global_step": 355901, "epoch": 4287} {"train_loss": -25.902545928955078, "global_step": 355902, "epoch": 4287} {"train_loss": -26.139773679066852, "global_step": 355903, "epoch": 4287, "val_loss": 6628515.0} {"train_loss": -25.254459381103516, "global_step": 355904, "epoch": 4288} {"train_loss": -25.173954010009766, "global_step": 355905, "epoch": 4288} {"train_loss": -25.35634422302246, "global_step": 355906, "epoch": 4288} {"train_loss": -25.780542373657227, "global_step": 355907, "epoch": 4288} {"train_loss": -25.497121810913086, "global_step": 355908, "epoch": 4288} {"train_loss": -25.701374053955078, "global_step": 355909, "epoch": 4288} {"train_loss": -25.67165184020996, "global_step": 355910, "epoch": 4288} {"train_loss": -25.234045028686523, "global_step": 355911, "epoch": 4288} {"train_loss": -25.492321014404297, "global_step": 355912, "epoch": 4288} {"train_loss": -25.930469512939453, "global_step": 355913, "epoch": 4288} {"train_loss": -25.158323287963867, "global_step": 355914, "epoch": 4288} {"train_loss": -25.87649917602539, "global_step": 355915, "epoch": 4288} {"train_loss": -25.385875701904297, "global_step": 355916, "epoch": 4288} {"train_loss": -26.011762619018555, "global_step": 355917, "epoch": 4288} {"train_loss": -25.8107967376709, "global_step": 355918, "epoch": 4288} {"train_loss": -25.690082550048828, "global_step": 355919, "epoch": 4288} {"train_loss": -25.948572158813477, "global_step": 355920, "epoch": 4288} {"train_loss": -25.770660400390625, "global_step": 355921, "epoch": 4288} {"train_loss": -26.1002197265625, "global_step": 355922, "epoch": 4288} {"train_loss": -25.90192985534668, "global_step": 355923, "epoch": 4288} {"train_loss": -25.75687026977539, "global_step": 355924, "epoch": 4288} {"train_loss": -26.262659072875977, "global_step": 355925, "epoch": 4288} {"train_loss": -25.909711837768555, "global_step": 355926, "epoch": 4288} {"train_loss": -26.1566219329834, "global_step": 355927, "epoch": 4288} {"train_loss": -26.000226974487305, "global_step": 355928, "epoch": 4288} {"train_loss": -26.234176635742188, "global_step": 355929, "epoch": 4288} {"train_loss": -25.80533790588379, "global_step": 355930, "epoch": 4288} {"train_loss": -26.184463500976562, "global_step": 355931, "epoch": 4288} {"train_loss": -25.732547760009766, "global_step": 355932, "epoch": 4288} {"train_loss": -25.804880142211914, "global_step": 355933, "epoch": 4288} {"train_loss": -26.294599533081055, "global_step": 355934, "epoch": 4288} {"train_loss": -26.026098251342773, "global_step": 355935, "epoch": 4288} {"train_loss": -25.898889541625977, "global_step": 355936, "epoch": 4288} {"train_loss": -26.340314865112305, "global_step": 355937, "epoch": 4288} {"train_loss": -26.369810104370117, "global_step": 355938, "epoch": 4288} {"train_loss": -26.1776065826416, "global_step": 355939, "epoch": 4288} {"train_loss": -26.157339096069336, "global_step": 355940, "epoch": 4288} {"train_loss": -26.15583610534668, "global_step": 355941, "epoch": 4288} {"train_loss": -26.54937171936035, "global_step": 355942, "epoch": 4288} {"train_loss": -26.36263084411621, "global_step": 355943, "epoch": 4288} {"train_loss": -26.44610595703125, "global_step": 355944, "epoch": 4288} {"train_loss": -26.113988876342773, "global_step": 355945, "epoch": 4288} {"train_loss": -26.435815811157227, "global_step": 355946, "epoch": 4288} {"train_loss": -26.487070083618164, "global_step": 355947, "epoch": 4288} {"train_loss": -26.7099609375, "global_step": 355948, "epoch": 4288} {"train_loss": -26.250930786132812, "global_step": 355949, "epoch": 4288} {"train_loss": -26.10004997253418, "global_step": 355950, "epoch": 4288} {"train_loss": -26.37272071838379, "global_step": 355951, "epoch": 4288} {"train_loss": -26.34405517578125, "global_step": 355952, "epoch": 4288} {"train_loss": -26.344436645507812, "global_step": 355953, "epoch": 4288} {"train_loss": -26.096435546875, "global_step": 355954, "epoch": 4288} {"train_loss": -26.135974884033203, "global_step": 355955, "epoch": 4288} {"train_loss": -26.15671157836914, "global_step": 355956, "epoch": 4288} {"train_loss": -26.41716957092285, "global_step": 355957, "epoch": 4288} {"train_loss": -26.79804801940918, "global_step": 355958, "epoch": 4288} {"train_loss": -26.424793243408203, "global_step": 355959, "epoch": 4288} {"train_loss": -26.843957901000977, "global_step": 355960, "epoch": 4288} {"train_loss": -26.407373428344727, "global_step": 355961, "epoch": 4288} {"train_loss": -25.77406883239746, "global_step": 355962, "epoch": 4288} {"train_loss": -26.353422164916992, "global_step": 355963, "epoch": 4288} {"train_loss": -26.191099166870117, "global_step": 355964, "epoch": 4288} {"train_loss": -26.28089714050293, "global_step": 355965, "epoch": 4288} {"train_loss": -26.245386123657227, "global_step": 355966, "epoch": 4288} {"train_loss": -26.437164306640625, "global_step": 355967, "epoch": 4288} {"train_loss": -26.507720947265625, "global_step": 355968, "epoch": 4288} {"train_loss": -26.23297119140625, "global_step": 355969, "epoch": 4288} {"train_loss": -26.57623291015625, "global_step": 355970, "epoch": 4288} {"train_loss": -26.043622970581055, "global_step": 355971, "epoch": 4288} {"train_loss": -25.869359970092773, "global_step": 355972, "epoch": 4288} {"train_loss": -26.012577056884766, "global_step": 355973, "epoch": 4288} {"train_loss": -26.1634578704834, "global_step": 355974, "epoch": 4288} {"train_loss": -26.292444229125977, "global_step": 355975, "epoch": 4288} {"train_loss": -25.999841690063477, "global_step": 355976, "epoch": 4288} {"train_loss": -26.358793258666992, "global_step": 355977, "epoch": 4288} {"train_loss": -26.070388793945312, "global_step": 355978, "epoch": 4288} {"train_loss": -26.222219467163086, "global_step": 355979, "epoch": 4288} {"train_loss": -26.203414916992188, "global_step": 355980, "epoch": 4288} {"train_loss": -26.148462295532227, "global_step": 355981, "epoch": 4288} {"train_loss": -26.35820960998535, "global_step": 355982, "epoch": 4288} {"train_loss": -26.4957218170166, "global_step": 355983, "epoch": 4288} {"train_loss": -26.002262115478516, "global_step": 355984, "epoch": 4288} {"train_loss": -26.331298828125, "global_step": 355985, "epoch": 4288} {"train_loss": -26.086679182856916, "global_step": 355986, "epoch": 4288, "val_loss": 6567717.0} {"train_loss": -25.7674617767334, "global_step": 355987, "epoch": 4289} {"train_loss": -26.183195114135742, "global_step": 355988, "epoch": 4289} {"train_loss": -26.520923614501953, "global_step": 355989, "epoch": 4289} {"train_loss": -25.963489532470703, "global_step": 355990, "epoch": 4289} {"train_loss": -26.067291259765625, "global_step": 355991, "epoch": 4289} {"train_loss": -25.851459503173828, "global_step": 355992, "epoch": 4289} {"train_loss": -26.26972770690918, "global_step": 355993, "epoch": 4289} {"train_loss": -26.115808486938477, "global_step": 355994, "epoch": 4289} {"train_loss": -26.335662841796875, "global_step": 355995, "epoch": 4289} {"train_loss": -26.522705078125, "global_step": 355996, "epoch": 4289} {"train_loss": -26.149093627929688, "global_step": 355997, "epoch": 4289} {"train_loss": -26.35406494140625, "global_step": 355998, "epoch": 4289} {"train_loss": -26.339567184448242, "global_step": 355999, "epoch": 4289} {"train_loss": -26.431859970092773, "global_step": 356000, "epoch": 4289} {"train_loss": -26.630126953125, "global_step": 356001, "epoch": 4289} {"train_loss": -25.94487953186035, "global_step": 356002, "epoch": 4289} {"train_loss": -26.3680477142334, "global_step": 356003, "epoch": 4289} {"train_loss": -26.38642692565918, "global_step": 356004, "epoch": 4289} {"train_loss": -25.99749755859375, "global_step": 356005, "epoch": 4289} {"train_loss": -26.47650718688965, "global_step": 356006, "epoch": 4289} {"train_loss": -26.20878028869629, "global_step": 356007, "epoch": 4289} {"train_loss": -26.226001739501953, "global_step": 356008, "epoch": 4289} {"train_loss": -26.360158920288086, "global_step": 356009, "epoch": 4289} {"train_loss": -26.048999786376953, "global_step": 356010, "epoch": 4289} {"train_loss": -26.03913688659668, "global_step": 356011, "epoch": 4289} {"train_loss": -26.12835121154785, "global_step": 356012, "epoch": 4289} {"train_loss": -26.416568756103516, "global_step": 356013, "epoch": 4289} {"train_loss": -26.36639976501465, "global_step": 356014, "epoch": 4289} {"train_loss": -26.231428146362305, "global_step": 356015, "epoch": 4289} {"train_loss": -25.921375274658203, "global_step": 356016, "epoch": 4289} {"train_loss": -26.46475601196289, "global_step": 356017, "epoch": 4289} {"train_loss": -26.323932647705078, "global_step": 356018, "epoch": 4289} {"train_loss": -26.257741928100586, "global_step": 356019, "epoch": 4289} {"train_loss": -25.79705810546875, "global_step": 356020, "epoch": 4289} {"train_loss": -26.23078727722168, "global_step": 356021, "epoch": 4289} {"train_loss": -26.171899795532227, "global_step": 356022, "epoch": 4289} {"train_loss": -26.0948543548584, "global_step": 356023, "epoch": 4289} {"train_loss": -25.92658805847168, "global_step": 356024, "epoch": 4289} {"train_loss": -26.271820068359375, "global_step": 356025, "epoch": 4289} {"train_loss": -26.246967315673828, "global_step": 356026, "epoch": 4289} {"train_loss": -26.234222412109375, "global_step": 356027, "epoch": 4289} {"train_loss": -26.338897705078125, "global_step": 356028, "epoch": 4289} {"train_loss": -26.437841415405273, "global_step": 356029, "epoch": 4289} {"train_loss": -26.27790641784668, "global_step": 356030, "epoch": 4289} {"train_loss": -26.27118492126465, "global_step": 356031, "epoch": 4289} {"train_loss": -26.318775177001953, "global_step": 356032, "epoch": 4289} {"train_loss": -26.340702056884766, "global_step": 356033, "epoch": 4289} {"train_loss": -26.275617599487305, "global_step": 356034, "epoch": 4289} {"train_loss": -26.36905860900879, "global_step": 356035, "epoch": 4289} {"train_loss": -25.98516273498535, "global_step": 356036, "epoch": 4289} {"train_loss": -25.961008071899414, "global_step": 356037, "epoch": 4289} {"train_loss": -25.85284996032715, "global_step": 356038, "epoch": 4289} {"train_loss": -25.91707420349121, "global_step": 356039, "epoch": 4289} {"train_loss": -26.0797176361084, "global_step": 356040, "epoch": 4289} {"train_loss": -25.645116806030273, "global_step": 356041, "epoch": 4289} {"train_loss": -26.27802848815918, "global_step": 356042, "epoch": 4289} {"train_loss": -25.7857666015625, "global_step": 356043, "epoch": 4289} {"train_loss": -26.076557159423828, "global_step": 356044, "epoch": 4289} {"train_loss": -26.067541122436523, "global_step": 356045, "epoch": 4289} {"train_loss": -26.023107528686523, "global_step": 356046, "epoch": 4289} {"train_loss": -26.083765029907227, "global_step": 356047, "epoch": 4289} {"train_loss": -26.468961715698242, "global_step": 356048, "epoch": 4289} {"train_loss": -26.10977554321289, "global_step": 356049, "epoch": 4289} {"train_loss": -25.93743324279785, "global_step": 356050, "epoch": 4289} {"train_loss": -26.0189208984375, "global_step": 356051, "epoch": 4289} {"train_loss": -26.182205200195312, "global_step": 356052, "epoch": 4289} {"train_loss": -25.894073486328125, "global_step": 356053, "epoch": 4289} {"train_loss": -26.215972900390625, "global_step": 356054, "epoch": 4289} {"train_loss": -26.17340660095215, "global_step": 356055, "epoch": 4289} {"train_loss": -26.438074111938477, "global_step": 356056, "epoch": 4289} {"train_loss": -25.928457260131836, "global_step": 356057, "epoch": 4289} {"train_loss": -26.201141357421875, "global_step": 356058, "epoch": 4289} {"train_loss": -26.54273796081543, "global_step": 356059, "epoch": 4289} {"train_loss": -26.343036651611328, "global_step": 356060, "epoch": 4289} {"train_loss": -26.306039810180664, "global_step": 356061, "epoch": 4289} {"train_loss": -26.05829429626465, "global_step": 356062, "epoch": 4289} {"train_loss": -26.05586051940918, "global_step": 356063, "epoch": 4289} {"train_loss": -26.404870986938477, "global_step": 356064, "epoch": 4289} {"train_loss": -26.317697525024414, "global_step": 356065, "epoch": 4289} {"train_loss": -26.5739803314209, "global_step": 356066, "epoch": 4289} {"train_loss": -26.124267578125, "global_step": 356067, "epoch": 4289} {"train_loss": -25.9870548248291, "global_step": 356068, "epoch": 4289} {"train_loss": -26.189951172794203, "global_step": 356069, "epoch": 4289, "val_loss": 6665409.0} {"train_loss": -26.008703231811523, "global_step": 356070, "epoch": 4290} {"train_loss": -25.795923233032227, "global_step": 356071, "epoch": 4290} {"train_loss": -25.430419921875, "global_step": 356072, "epoch": 4290} {"train_loss": -25.5658016204834, "global_step": 356073, "epoch": 4290} {"train_loss": -25.402088165283203, "global_step": 356074, "epoch": 4290} {"train_loss": -25.76498794555664, "global_step": 356075, "epoch": 4290} {"train_loss": -25.83052635192871, "global_step": 356076, "epoch": 4290} {"train_loss": -25.6155948638916, "global_step": 356077, "epoch": 4290} {"train_loss": -25.912601470947266, "global_step": 356078, "epoch": 4290} {"train_loss": -25.865873336791992, "global_step": 356079, "epoch": 4290} {"train_loss": -26.30340576171875, "global_step": 356080, "epoch": 4290} {"train_loss": -25.90838050842285, "global_step": 356081, "epoch": 4290} {"train_loss": -26.265039443969727, "global_step": 356082, "epoch": 4290} {"train_loss": -25.821807861328125, "global_step": 356083, "epoch": 4290} {"train_loss": -26.113784790039062, "global_step": 356084, "epoch": 4290} {"train_loss": -26.046918869018555, "global_step": 356085, "epoch": 4290} {"train_loss": -25.813528060913086, "global_step": 356086, "epoch": 4290} {"train_loss": -26.09463882446289, "global_step": 356087, "epoch": 4290} {"train_loss": -25.898193359375, "global_step": 356088, "epoch": 4290} {"train_loss": -26.258869171142578, "global_step": 356089, "epoch": 4290} {"train_loss": -26.016300201416016, "global_step": 356090, "epoch": 4290} {"train_loss": -26.28597068786621, "global_step": 356091, "epoch": 4290} {"train_loss": -26.3253173828125, "global_step": 356092, "epoch": 4290} {"train_loss": -26.343408584594727, "global_step": 356093, "epoch": 4290} {"train_loss": -26.4271183013916, "global_step": 356094, "epoch": 4290} {"train_loss": -26.198942184448242, "global_step": 356095, "epoch": 4290} {"train_loss": -26.07208824157715, "global_step": 356096, "epoch": 4290} {"train_loss": -25.906702041625977, "global_step": 356097, "epoch": 4290} {"train_loss": -26.51321792602539, "global_step": 356098, "epoch": 4290} {"train_loss": -26.377456665039062, "global_step": 356099, "epoch": 4290} {"train_loss": -26.552249908447266, "global_step": 356100, "epoch": 4290} {"train_loss": -26.26019287109375, "global_step": 356101, "epoch": 4290} {"train_loss": -26.225305557250977, "global_step": 356102, "epoch": 4290} {"train_loss": -26.28858757019043, "global_step": 356103, "epoch": 4290} {"train_loss": -26.575759887695312, "global_step": 356104, "epoch": 4290} {"train_loss": -26.415517807006836, "global_step": 356105, "epoch": 4290} {"train_loss": -26.317304611206055, "global_step": 356106, "epoch": 4290} {"train_loss": -26.33437156677246, "global_step": 356107, "epoch": 4290} {"train_loss": -26.607385635375977, "global_step": 356108, "epoch": 4290} {"train_loss": -26.344186782836914, "global_step": 356109, "epoch": 4290} {"train_loss": -26.457183837890625, "global_step": 356110, "epoch": 4290} {"train_loss": -26.2519588470459, "global_step": 356111, "epoch": 4290} {"train_loss": -25.705785751342773, "global_step": 356112, "epoch": 4290} {"train_loss": -25.912582397460938, "global_step": 356113, "epoch": 4290} {"train_loss": -26.37860107421875, "global_step": 356114, "epoch": 4290} {"train_loss": -26.154592514038086, "global_step": 356115, "epoch": 4290} {"train_loss": -26.256244659423828, "global_step": 356116, "epoch": 4290} {"train_loss": -26.16067886352539, "global_step": 356117, "epoch": 4290} {"train_loss": -26.384695053100586, "global_step": 356118, "epoch": 4290} {"train_loss": -26.33589744567871, "global_step": 356119, "epoch": 4290} {"train_loss": -26.534717559814453, "global_step": 356120, "epoch": 4290} {"train_loss": -26.233190536499023, "global_step": 356121, "epoch": 4290} {"train_loss": -26.160003662109375, "global_step": 356122, "epoch": 4290} {"train_loss": -26.15824317932129, "global_step": 356123, "epoch": 4290} {"train_loss": -26.011371612548828, "global_step": 356124, "epoch": 4290} {"train_loss": -26.146656036376953, "global_step": 356125, "epoch": 4290} {"train_loss": -26.697189331054688, "global_step": 356126, "epoch": 4290} {"train_loss": -26.59552574157715, "global_step": 356127, "epoch": 4290} {"train_loss": -25.93684959411621, "global_step": 356128, "epoch": 4290} {"train_loss": -26.59437370300293, "global_step": 356129, "epoch": 4290} {"train_loss": -26.120380401611328, "global_step": 356130, "epoch": 4290} {"train_loss": -26.285125732421875, "global_step": 356131, "epoch": 4290} {"train_loss": -25.8914737701416, "global_step": 356132, "epoch": 4290} {"train_loss": -25.99430274963379, "global_step": 356133, "epoch": 4290} {"train_loss": -26.00141716003418, "global_step": 356134, "epoch": 4290} {"train_loss": -26.20240592956543, "global_step": 356135, "epoch": 4290} {"train_loss": -25.99481201171875, "global_step": 356136, "epoch": 4290} {"train_loss": -26.250226974487305, "global_step": 356137, "epoch": 4290} {"train_loss": -26.223743438720703, "global_step": 356138, "epoch": 4290} {"train_loss": -26.209726333618164, "global_step": 356139, "epoch": 4290} {"train_loss": -26.305103302001953, "global_step": 356140, "epoch": 4290} {"train_loss": -26.037240982055664, "global_step": 356141, "epoch": 4290} {"train_loss": -26.3463077545166, "global_step": 356142, "epoch": 4290} {"train_loss": -26.370819091796875, "global_step": 356143, "epoch": 4290} {"train_loss": -26.5664005279541, "global_step": 356144, "epoch": 4290} {"train_loss": -26.389455795288086, "global_step": 356145, "epoch": 4290} {"train_loss": -26.301172256469727, "global_step": 356146, "epoch": 4290} {"train_loss": -26.07911491394043, "global_step": 356147, "epoch": 4290} {"train_loss": -26.201749801635742, "global_step": 356148, "epoch": 4290} {"train_loss": -26.484525680541992, "global_step": 356149, "epoch": 4290} {"train_loss": -26.408056259155273, "global_step": 356150, "epoch": 4290} {"train_loss": -26.189014434814453, "global_step": 356151, "epoch": 4290} {"train_loss": -26.168122211134577, "global_step": 356152, "epoch": 4290, "val_loss": 6673383.0} {"train_loss": -25.69989585876465, "global_step": 356153, "epoch": 4291} {"train_loss": -25.712177276611328, "global_step": 356154, "epoch": 4291} {"train_loss": -25.110483169555664, "global_step": 356155, "epoch": 4291} {"train_loss": -25.3450984954834, "global_step": 356156, "epoch": 4291} {"train_loss": -25.23189353942871, "global_step": 356157, "epoch": 4291} {"train_loss": -25.58884620666504, "global_step": 356158, "epoch": 4291} {"train_loss": -25.4928035736084, "global_step": 356159, "epoch": 4291} {"train_loss": -25.809619903564453, "global_step": 356160, "epoch": 4291} {"train_loss": -25.596208572387695, "global_step": 356161, "epoch": 4291} {"train_loss": -25.444259643554688, "global_step": 356162, "epoch": 4291} {"train_loss": -26.22128677368164, "global_step": 356163, "epoch": 4291} {"train_loss": -25.44374656677246, "global_step": 356164, "epoch": 4291} {"train_loss": -25.75533103942871, "global_step": 356165, "epoch": 4291} {"train_loss": -25.463932037353516, "global_step": 356166, "epoch": 4291} {"train_loss": -25.45039939880371, "global_step": 356167, "epoch": 4291} {"train_loss": -25.61927604675293, "global_step": 356168, "epoch": 4291} {"train_loss": -25.834033966064453, "global_step": 356169, "epoch": 4291} {"train_loss": -26.2667179107666, "global_step": 356170, "epoch": 4291} {"train_loss": -26.22991943359375, "global_step": 356171, "epoch": 4291} {"train_loss": -25.955759048461914, "global_step": 356172, "epoch": 4291} {"train_loss": -25.93682861328125, "global_step": 356173, "epoch": 4291} {"train_loss": -26.074111938476562, "global_step": 356174, "epoch": 4291} {"train_loss": -25.743494033813477, "global_step": 356175, "epoch": 4291} {"train_loss": -26.002294540405273, "global_step": 356176, "epoch": 4291} {"train_loss": -25.90949058532715, "global_step": 356177, "epoch": 4291} {"train_loss": -26.049406051635742, "global_step": 356178, "epoch": 4291} {"train_loss": -26.251012802124023, "global_step": 356179, "epoch": 4291} {"train_loss": -26.29608154296875, "global_step": 356180, "epoch": 4291} {"train_loss": -25.818952560424805, "global_step": 356181, "epoch": 4291} {"train_loss": -26.050983428955078, "global_step": 356182, "epoch": 4291} {"train_loss": -26.476810455322266, "global_step": 356183, "epoch": 4291} {"train_loss": -26.0854549407959, "global_step": 356184, "epoch": 4291} {"train_loss": -26.03363037109375, "global_step": 356185, "epoch": 4291} {"train_loss": -26.16143798828125, "global_step": 356186, "epoch": 4291} {"train_loss": -26.125070571899414, "global_step": 356187, "epoch": 4291} {"train_loss": -26.161252975463867, "global_step": 356188, "epoch": 4291} {"train_loss": -26.084308624267578, "global_step": 356189, "epoch": 4291} {"train_loss": -26.205820083618164, "global_step": 356190, "epoch": 4291} {"train_loss": -26.36823844909668, "global_step": 356191, "epoch": 4291} {"train_loss": -25.93486976623535, "global_step": 356192, "epoch": 4291} {"train_loss": -26.398523330688477, "global_step": 356193, "epoch": 4291} {"train_loss": -26.05731773376465, "global_step": 356194, "epoch": 4291} {"train_loss": -26.296762466430664, "global_step": 356195, "epoch": 4291} {"train_loss": -26.592960357666016, "global_step": 356196, "epoch": 4291} {"train_loss": -26.769296646118164, "global_step": 356197, "epoch": 4291} {"train_loss": -25.785364151000977, "global_step": 356198, "epoch": 4291} {"train_loss": -26.71294593811035, "global_step": 356199, "epoch": 4291} {"train_loss": -26.080707550048828, "global_step": 356200, "epoch": 4291} {"train_loss": -26.358747482299805, "global_step": 356201, "epoch": 4291} {"train_loss": -26.06429100036621, "global_step": 356202, "epoch": 4291} {"train_loss": -26.582733154296875, "global_step": 356203, "epoch": 4291} {"train_loss": -26.145843505859375, "global_step": 356204, "epoch": 4291} {"train_loss": -26.15315055847168, "global_step": 356205, "epoch": 4291} {"train_loss": -26.098556518554688, "global_step": 356206, "epoch": 4291} {"train_loss": -26.05267906188965, "global_step": 356207, "epoch": 4291} {"train_loss": -25.842361450195312, "global_step": 356208, "epoch": 4291} {"train_loss": -26.209863662719727, "global_step": 356209, "epoch": 4291} {"train_loss": -26.3083553314209, "global_step": 356210, "epoch": 4291} {"train_loss": -26.27126121520996, "global_step": 356211, "epoch": 4291} {"train_loss": -26.145938873291016, "global_step": 356212, "epoch": 4291} {"train_loss": -25.987934112548828, "global_step": 356213, "epoch": 4291} {"train_loss": -26.406156539916992, "global_step": 356214, "epoch": 4291} {"train_loss": -26.0320987701416, "global_step": 356215, "epoch": 4291} {"train_loss": -26.499237060546875, "global_step": 356216, "epoch": 4291} {"train_loss": -26.31829261779785, "global_step": 356217, "epoch": 4291} {"train_loss": -26.423980712890625, "global_step": 356218, "epoch": 4291} {"train_loss": -26.254871368408203, "global_step": 356219, "epoch": 4291} {"train_loss": -26.414026260375977, "global_step": 356220, "epoch": 4291} {"train_loss": -26.27907371520996, "global_step": 356221, "epoch": 4291} {"train_loss": -26.71575927734375, "global_step": 356222, "epoch": 4291} {"train_loss": -26.372806549072266, "global_step": 356223, "epoch": 4291} {"train_loss": -26.50732421875, "global_step": 356224, "epoch": 4291} {"train_loss": -26.07893943786621, "global_step": 356225, "epoch": 4291} {"train_loss": -26.125141143798828, "global_step": 356226, "epoch": 4291} {"train_loss": -26.1700382232666, "global_step": 356227, "epoch": 4291} {"train_loss": -26.35732078552246, "global_step": 356228, "epoch": 4291} {"train_loss": -26.335357666015625, "global_step": 356229, "epoch": 4291} {"train_loss": -26.362457275390625, "global_step": 356230, "epoch": 4291} {"train_loss": -26.052587509155273, "global_step": 356231, "epoch": 4291} {"train_loss": -26.056201934814453, "global_step": 356232, "epoch": 4291} {"train_loss": -26.0662784576416, "global_step": 356233, "epoch": 4291} {"train_loss": -26.337690353393555, "global_step": 356234, "epoch": 4291} {"train_loss": -26.099991442209266, "global_step": 356235, "epoch": 4291, "val_loss": 6563484.0} {"train_loss": -25.8575439453125, "global_step": 356236, "epoch": 4292} {"train_loss": -25.912504196166992, "global_step": 356237, "epoch": 4292} {"train_loss": -26.256011962890625, "global_step": 356238, "epoch": 4292} {"train_loss": -25.997690200805664, "global_step": 356239, "epoch": 4292} {"train_loss": -25.597875595092773, "global_step": 356240, "epoch": 4292} {"train_loss": -25.780487060546875, "global_step": 356241, "epoch": 4292} {"train_loss": -25.702850341796875, "global_step": 356242, "epoch": 4292} {"train_loss": -25.787439346313477, "global_step": 356243, "epoch": 4292} {"train_loss": -25.981245040893555, "global_step": 356244, "epoch": 4292} {"train_loss": -26.084686279296875, "global_step": 356245, "epoch": 4292} {"train_loss": -25.831989288330078, "global_step": 356246, "epoch": 4292} {"train_loss": -25.95564842224121, "global_step": 356247, "epoch": 4292} {"train_loss": -25.822675704956055, "global_step": 356248, "epoch": 4292} {"train_loss": -26.378341674804688, "global_step": 356249, "epoch": 4292} {"train_loss": -26.543548583984375, "global_step": 356250, "epoch": 4292} {"train_loss": -26.08365821838379, "global_step": 356251, "epoch": 4292} {"train_loss": -25.680028915405273, "global_step": 356252, "epoch": 4292} {"train_loss": -26.173282623291016, "global_step": 356253, "epoch": 4292} {"train_loss": -26.105121612548828, "global_step": 356254, "epoch": 4292} {"train_loss": -26.309722900390625, "global_step": 356255, "epoch": 4292} {"train_loss": -26.107959747314453, "global_step": 356256, "epoch": 4292} {"train_loss": -26.1801700592041, "global_step": 356257, "epoch": 4292} {"train_loss": -25.960538864135742, "global_step": 356258, "epoch": 4292} {"train_loss": -26.20998191833496, "global_step": 356259, "epoch": 4292} {"train_loss": -25.909814834594727, "global_step": 356260, "epoch": 4292} {"train_loss": -25.836267471313477, "global_step": 356261, "epoch": 4292} {"train_loss": -26.51555824279785, "global_step": 356262, "epoch": 4292} {"train_loss": -25.985260009765625, "global_step": 356263, "epoch": 4292} {"train_loss": -26.026966094970703, "global_step": 356264, "epoch": 4292} {"train_loss": -25.83249855041504, "global_step": 356265, "epoch": 4292} {"train_loss": -26.189929962158203, "global_step": 356266, "epoch": 4292} {"train_loss": -26.273792266845703, "global_step": 356267, "epoch": 4292} {"train_loss": -26.05511474609375, "global_step": 356268, "epoch": 4292} {"train_loss": -26.1370792388916, "global_step": 356269, "epoch": 4292} {"train_loss": -26.386655807495117, "global_step": 356270, "epoch": 4292} {"train_loss": -26.210397720336914, "global_step": 356271, "epoch": 4292} {"train_loss": -26.245285034179688, "global_step": 356272, "epoch": 4292} {"train_loss": -26.31073570251465, "global_step": 356273, "epoch": 4292} {"train_loss": -26.618574142456055, "global_step": 356274, "epoch": 4292} {"train_loss": -26.511749267578125, "global_step": 356275, "epoch": 4292} {"train_loss": -26.094440460205078, "global_step": 356276, "epoch": 4292} {"train_loss": -26.797224044799805, "global_step": 356277, "epoch": 4292} {"train_loss": -26.492679595947266, "global_step": 356278, "epoch": 4292} {"train_loss": -26.50054359436035, "global_step": 356279, "epoch": 4292} {"train_loss": -26.39214515686035, "global_step": 356280, "epoch": 4292} {"train_loss": -26.841999053955078, "global_step": 356281, "epoch": 4292} {"train_loss": -26.31459617614746, "global_step": 356282, "epoch": 4292} {"train_loss": -26.362812042236328, "global_step": 356283, "epoch": 4292} {"train_loss": -26.388845443725586, "global_step": 356284, "epoch": 4292} {"train_loss": -26.277301788330078, "global_step": 356285, "epoch": 4292} {"train_loss": -26.256362915039062, "global_step": 356286, "epoch": 4292} {"train_loss": -26.2934627532959, "global_step": 356287, "epoch": 4292} {"train_loss": -26.38226890563965, "global_step": 356288, "epoch": 4292} {"train_loss": -26.142230987548828, "global_step": 356289, "epoch": 4292} {"train_loss": -26.200546264648438, "global_step": 356290, "epoch": 4292} {"train_loss": -26.408884048461914, "global_step": 356291, "epoch": 4292} {"train_loss": -26.141265869140625, "global_step": 356292, "epoch": 4292} {"train_loss": -26.718713760375977, "global_step": 356293, "epoch": 4292} {"train_loss": -26.337656021118164, "global_step": 356294, "epoch": 4292} {"train_loss": -26.667882919311523, "global_step": 356295, "epoch": 4292} {"train_loss": -26.371856689453125, "global_step": 356296, "epoch": 4292} {"train_loss": -26.412073135375977, "global_step": 356297, "epoch": 4292} {"train_loss": -26.482412338256836, "global_step": 356298, "epoch": 4292} {"train_loss": -26.183134078979492, "global_step": 356299, "epoch": 4292} {"train_loss": -25.96894645690918, "global_step": 356300, "epoch": 4292} {"train_loss": -25.693429946899414, "global_step": 356301, "epoch": 4292} {"train_loss": -25.777494430541992, "global_step": 356302, "epoch": 4292} {"train_loss": -26.11441421508789, "global_step": 356303, "epoch": 4292} {"train_loss": -26.199003219604492, "global_step": 356304, "epoch": 4292} {"train_loss": -26.089466094970703, "global_step": 356305, "epoch": 4292} {"train_loss": -26.282352447509766, "global_step": 356306, "epoch": 4292} {"train_loss": -25.565359115600586, "global_step": 356307, "epoch": 4292} {"train_loss": -26.314044952392578, "global_step": 356308, "epoch": 4292} {"train_loss": -26.083921432495117, "global_step": 356309, "epoch": 4292} {"train_loss": -25.7662296295166, "global_step": 356310, "epoch": 4292} {"train_loss": -26.307443618774414, "global_step": 356311, "epoch": 4292} {"train_loss": -26.221454620361328, "global_step": 356312, "epoch": 4292} {"train_loss": -26.22889518737793, "global_step": 356313, "epoch": 4292} {"train_loss": -25.773229598999023, "global_step": 356314, "epoch": 4292} {"train_loss": -26.363346099853516, "global_step": 356315, "epoch": 4292} {"train_loss": -26.316137313842773, "global_step": 356316, "epoch": 4292} {"train_loss": -26.299184799194336, "global_step": 356317, "epoch": 4292} {"train_loss": -26.181964667446643, "global_step": 356318, "epoch": 4292, "val_loss": 6688113.0} {"train_loss": -25.533292770385742, "global_step": 356319, "epoch": 4293} {"train_loss": -24.758398056030273, "global_step": 356320, "epoch": 4293} {"train_loss": -25.19277572631836, "global_step": 356321, "epoch": 4293} {"train_loss": -25.07908821105957, "global_step": 356322, "epoch": 4293} {"train_loss": -24.791454315185547, "global_step": 356323, "epoch": 4293} {"train_loss": -24.712011337280273, "global_step": 356324, "epoch": 4293} {"train_loss": -25.331327438354492, "global_step": 356325, "epoch": 4293} {"train_loss": -25.37090492248535, "global_step": 356326, "epoch": 4293} {"train_loss": -25.52182960510254, "global_step": 356327, "epoch": 4293} {"train_loss": -25.766284942626953, "global_step": 356328, "epoch": 4293} {"train_loss": -25.821674346923828, "global_step": 356329, "epoch": 4293} {"train_loss": -25.934995651245117, "global_step": 356330, "epoch": 4293} {"train_loss": -25.705829620361328, "global_step": 356331, "epoch": 4293} {"train_loss": -25.947927474975586, "global_step": 356332, "epoch": 4293} {"train_loss": -25.924734115600586, "global_step": 356333, "epoch": 4293} {"train_loss": -25.81083106994629, "global_step": 356334, "epoch": 4293} {"train_loss": -25.609882354736328, "global_step": 356335, "epoch": 4293} {"train_loss": -25.997411727905273, "global_step": 356336, "epoch": 4293} {"train_loss": -25.75935935974121, "global_step": 356337, "epoch": 4293} {"train_loss": -26.2396240234375, "global_step": 356338, "epoch": 4293} {"train_loss": -25.56598472595215, "global_step": 356339, "epoch": 4293} {"train_loss": -25.76222038269043, "global_step": 356340, "epoch": 4293} {"train_loss": -25.937524795532227, "global_step": 356341, "epoch": 4293} {"train_loss": -26.2310848236084, "global_step": 356342, "epoch": 4293} {"train_loss": -25.985050201416016, "global_step": 356343, "epoch": 4293} {"train_loss": -26.005285263061523, "global_step": 356344, "epoch": 4293} {"train_loss": -26.174427032470703, "global_step": 356345, "epoch": 4293} {"train_loss": -26.132312774658203, "global_step": 356346, "epoch": 4293} {"train_loss": -26.30817222595215, "global_step": 356347, "epoch": 4293} {"train_loss": -25.752119064331055, "global_step": 356348, "epoch": 4293} {"train_loss": -26.152454376220703, "global_step": 356349, "epoch": 4293} {"train_loss": -25.876850128173828, "global_step": 356350, "epoch": 4293} {"train_loss": -26.324295043945312, "global_step": 356351, "epoch": 4293} {"train_loss": -26.406951904296875, "global_step": 356352, "epoch": 4293} {"train_loss": -26.3071231842041, "global_step": 356353, "epoch": 4293} {"train_loss": -26.60981559753418, "global_step": 356354, "epoch": 4293} {"train_loss": -26.5185604095459, "global_step": 356355, "epoch": 4293} {"train_loss": -25.985504150390625, "global_step": 356356, "epoch": 4293} {"train_loss": -26.257247924804688, "global_step": 356357, "epoch": 4293} {"train_loss": -26.144378662109375, "global_step": 356358, "epoch": 4293} {"train_loss": -26.253646850585938, "global_step": 356359, "epoch": 4293} {"train_loss": -26.297760009765625, "global_step": 356360, "epoch": 4293} {"train_loss": -26.26161003112793, "global_step": 356361, "epoch": 4293} {"train_loss": -26.152206420898438, "global_step": 356362, "epoch": 4293} {"train_loss": -26.201797485351562, "global_step": 356363, "epoch": 4293} {"train_loss": -26.3621768951416, "global_step": 356364, "epoch": 4293} {"train_loss": -26.497480392456055, "global_step": 356365, "epoch": 4293} {"train_loss": -26.173053741455078, "global_step": 356366, "epoch": 4293} {"train_loss": -26.276504516601562, "global_step": 356367, "epoch": 4293} {"train_loss": -26.696157455444336, "global_step": 356368, "epoch": 4293} {"train_loss": -26.216659545898438, "global_step": 356369, "epoch": 4293} {"train_loss": -26.478063583374023, "global_step": 356370, "epoch": 4293} {"train_loss": -26.346723556518555, "global_step": 356371, "epoch": 4293} {"train_loss": -26.117019653320312, "global_step": 356372, "epoch": 4293} {"train_loss": -26.189634323120117, "global_step": 356373, "epoch": 4293} {"train_loss": -26.498273849487305, "global_step": 356374, "epoch": 4293} {"train_loss": -26.575702667236328, "global_step": 356375, "epoch": 4293} {"train_loss": -26.572071075439453, "global_step": 356376, "epoch": 4293} {"train_loss": -26.12825584411621, "global_step": 356377, "epoch": 4293} {"train_loss": -26.108957290649414, "global_step": 356378, "epoch": 4293} {"train_loss": -26.09858512878418, "global_step": 356379, "epoch": 4293} {"train_loss": -25.8581600189209, "global_step": 356380, "epoch": 4293} {"train_loss": -25.9311580657959, "global_step": 356381, "epoch": 4293} {"train_loss": -26.394582748413086, "global_step": 356382, "epoch": 4293} {"train_loss": -26.1824893951416, "global_step": 356383, "epoch": 4293} {"train_loss": -26.411130905151367, "global_step": 356384, "epoch": 4293} {"train_loss": -26.037921905517578, "global_step": 356385, "epoch": 4293} {"train_loss": -25.9812068939209, "global_step": 356386, "epoch": 4293} {"train_loss": -26.05047035217285, "global_step": 356387, "epoch": 4293} {"train_loss": -25.403690338134766, "global_step": 356388, "epoch": 4293} {"train_loss": -25.502206802368164, "global_step": 356389, "epoch": 4293} {"train_loss": -25.743091583251953, "global_step": 356390, "epoch": 4293} {"train_loss": -26.342029571533203, "global_step": 356391, "epoch": 4293} {"train_loss": -25.863306045532227, "global_step": 356392, "epoch": 4293} {"train_loss": -25.946603775024414, "global_step": 356393, "epoch": 4293} {"train_loss": -25.40104866027832, "global_step": 356394, "epoch": 4293} {"train_loss": -25.36264419555664, "global_step": 356395, "epoch": 4293} {"train_loss": -26.043704986572266, "global_step": 356396, "epoch": 4293} {"train_loss": -26.079626083374023, "global_step": 356397, "epoch": 4293} {"train_loss": -26.105316162109375, "global_step": 356398, "epoch": 4293} {"train_loss": -25.699573516845703, "global_step": 356399, "epoch": 4293} {"train_loss": -26.462310791015625, "global_step": 356400, "epoch": 4293} {"train_loss": -25.963339886033392, "global_step": 356401, "epoch": 4293, "val_loss": 6650780.0} {"train_loss": -25.634368896484375, "global_step": 356402, "epoch": 4294} {"train_loss": -25.518159866333008, "global_step": 356403, "epoch": 4294} {"train_loss": -25.375410079956055, "global_step": 356404, "epoch": 4294} {"train_loss": -25.32920265197754, "global_step": 356405, "epoch": 4294} {"train_loss": -25.2540340423584, "global_step": 356406, "epoch": 4294} {"train_loss": -25.623779296875, "global_step": 356407, "epoch": 4294} {"train_loss": -25.424335479736328, "global_step": 356408, "epoch": 4294} {"train_loss": -25.12651252746582, "global_step": 356409, "epoch": 4294} {"train_loss": -25.956998825073242, "global_step": 356410, "epoch": 4294} {"train_loss": -25.672515869140625, "global_step": 356411, "epoch": 4294} {"train_loss": -25.38266944885254, "global_step": 356412, "epoch": 4294} {"train_loss": -25.952234268188477, "global_step": 356413, "epoch": 4294} {"train_loss": -26.110986709594727, "global_step": 356414, "epoch": 4294} {"train_loss": -25.658283233642578, "global_step": 356415, "epoch": 4294} {"train_loss": -25.8651180267334, "global_step": 356416, "epoch": 4294} {"train_loss": -25.97857093811035, "global_step": 356417, "epoch": 4294} {"train_loss": -25.796655654907227, "global_step": 356418, "epoch": 4294} {"train_loss": -26.387475967407227, "global_step": 356419, "epoch": 4294} {"train_loss": -26.01942253112793, "global_step": 356420, "epoch": 4294} {"train_loss": -26.2445125579834, "global_step": 356421, "epoch": 4294} {"train_loss": -25.899688720703125, "global_step": 356422, "epoch": 4294} {"train_loss": -26.204870223999023, "global_step": 356423, "epoch": 4294} {"train_loss": -26.239431381225586, "global_step": 356424, "epoch": 4294} {"train_loss": -26.162954330444336, "global_step": 356425, "epoch": 4294} {"train_loss": -26.05967140197754, "global_step": 356426, "epoch": 4294} {"train_loss": -26.027725219726562, "global_step": 356427, "epoch": 4294} {"train_loss": -26.417694091796875, "global_step": 356428, "epoch": 4294} {"train_loss": -26.3244686126709, "global_step": 356429, "epoch": 4294} {"train_loss": -26.134557723999023, "global_step": 356430, "epoch": 4294} {"train_loss": -26.497547149658203, "global_step": 356431, "epoch": 4294} {"train_loss": -26.235193252563477, "global_step": 356432, "epoch": 4294} {"train_loss": -26.046051025390625, "global_step": 356433, "epoch": 4294} {"train_loss": -26.218225479125977, "global_step": 356434, "epoch": 4294} {"train_loss": -26.296186447143555, "global_step": 356435, "epoch": 4294} {"train_loss": -26.348459243774414, "global_step": 356436, "epoch": 4294} {"train_loss": -25.95826530456543, "global_step": 356437, "epoch": 4294} {"train_loss": -26.4555721282959, "global_step": 356438, "epoch": 4294} {"train_loss": -26.410242080688477, "global_step": 356439, "epoch": 4294} {"train_loss": -26.030126571655273, "global_step": 356440, "epoch": 4294} {"train_loss": -26.555761337280273, "global_step": 356441, "epoch": 4294} {"train_loss": -26.177270889282227, "global_step": 356442, "epoch": 4294} {"train_loss": -25.870407104492188, "global_step": 356443, "epoch": 4294} {"train_loss": -25.773603439331055, "global_step": 356444, "epoch": 4294} {"train_loss": -26.31049919128418, "global_step": 356445, "epoch": 4294} {"train_loss": -26.612905502319336, "global_step": 356446, "epoch": 4294} {"train_loss": -26.23102378845215, "global_step": 356447, "epoch": 4294} {"train_loss": -25.83723258972168, "global_step": 356448, "epoch": 4294} {"train_loss": -26.16437339782715, "global_step": 356449, "epoch": 4294} {"train_loss": -26.350610733032227, "global_step": 356450, "epoch": 4294} {"train_loss": -26.39585304260254, "global_step": 356451, "epoch": 4294} {"train_loss": -26.29534339904785, "global_step": 356452, "epoch": 4294} {"train_loss": -26.343053817749023, "global_step": 356453, "epoch": 4294} {"train_loss": -26.504779815673828, "global_step": 356454, "epoch": 4294} {"train_loss": -25.801069259643555, "global_step": 356455, "epoch": 4294} {"train_loss": -25.903823852539062, "global_step": 356456, "epoch": 4294} {"train_loss": -26.105701446533203, "global_step": 356457, "epoch": 4294} {"train_loss": -26.5761775970459, "global_step": 356458, "epoch": 4294} {"train_loss": -26.053258895874023, "global_step": 356459, "epoch": 4294} {"train_loss": -26.374719619750977, "global_step": 356460, "epoch": 4294} {"train_loss": -26.16925621032715, "global_step": 356461, "epoch": 4294} {"train_loss": -26.57588768005371, "global_step": 356462, "epoch": 4294} {"train_loss": -26.431781768798828, "global_step": 356463, "epoch": 4294} {"train_loss": -26.62795066833496, "global_step": 356464, "epoch": 4294} {"train_loss": -26.136804580688477, "global_step": 356465, "epoch": 4294} {"train_loss": -26.30780029296875, "global_step": 356466, "epoch": 4294} {"train_loss": -26.102670669555664, "global_step": 356467, "epoch": 4294} {"train_loss": -26.234317779541016, "global_step": 356468, "epoch": 4294} {"train_loss": -26.26894187927246, "global_step": 356469, "epoch": 4294} {"train_loss": -26.125568389892578, "global_step": 356470, "epoch": 4294} {"train_loss": -25.9666805267334, "global_step": 356471, "epoch": 4294} {"train_loss": -26.38348388671875, "global_step": 356472, "epoch": 4294} {"train_loss": -26.199750900268555, "global_step": 356473, "epoch": 4294} {"train_loss": -26.41097068786621, "global_step": 356474, "epoch": 4294} {"train_loss": -26.463476181030273, "global_step": 356475, "epoch": 4294} {"train_loss": -26.245309829711914, "global_step": 356476, "epoch": 4294} {"train_loss": -26.304773330688477, "global_step": 356477, "epoch": 4294} {"train_loss": -26.221017837524414, "global_step": 356478, "epoch": 4294} {"train_loss": -26.604475021362305, "global_step": 356479, "epoch": 4294} {"train_loss": -26.764677047729492, "global_step": 356480, "epoch": 4294} {"train_loss": -26.437576293945312, "global_step": 356481, "epoch": 4294} {"train_loss": -25.987598419189453, "global_step": 356482, "epoch": 4294} {"train_loss": -25.771764755249023, "global_step": 356483, "epoch": 4294} {"train_loss": -26.091304434351173, "global_step": 356484, "epoch": 4294, "val_loss": 6566291.0} {"train_loss": -24.969532012939453, "global_step": 356485, "epoch": 4295} {"train_loss": -25.214536666870117, "global_step": 356486, "epoch": 4295} {"train_loss": -25.072181701660156, "global_step": 356487, "epoch": 4295} {"train_loss": -25.303186416625977, "global_step": 356488, "epoch": 4295} {"train_loss": -25.284887313842773, "global_step": 356489, "epoch": 4295} {"train_loss": -25.346115112304688, "global_step": 356490, "epoch": 4295} {"train_loss": -25.767663955688477, "global_step": 356491, "epoch": 4295} {"train_loss": -25.40067481994629, "global_step": 356492, "epoch": 4295} {"train_loss": -25.817901611328125, "global_step": 356493, "epoch": 4295} {"train_loss": -25.083267211914062, "global_step": 356494, "epoch": 4295} {"train_loss": -25.746057510375977, "global_step": 356495, "epoch": 4295} {"train_loss": -25.522008895874023, "global_step": 356496, "epoch": 4295} {"train_loss": -25.715192794799805, "global_step": 356497, "epoch": 4295} {"train_loss": -25.444822311401367, "global_step": 356498, "epoch": 4295} {"train_loss": -25.711545944213867, "global_step": 356499, "epoch": 4295} {"train_loss": -25.479110717773438, "global_step": 356500, "epoch": 4295} {"train_loss": -26.270002365112305, "global_step": 356501, "epoch": 4295} {"train_loss": -25.802448272705078, "global_step": 356502, "epoch": 4295} {"train_loss": -26.017913818359375, "global_step": 356503, "epoch": 4295} {"train_loss": -26.068906784057617, "global_step": 356504, "epoch": 4295} {"train_loss": -25.952383041381836, "global_step": 356505, "epoch": 4295} {"train_loss": -26.161386489868164, "global_step": 356506, "epoch": 4295} {"train_loss": -25.87763023376465, "global_step": 356507, "epoch": 4295} {"train_loss": -25.902658462524414, "global_step": 356508, "epoch": 4295} {"train_loss": -25.845123291015625, "global_step": 356509, "epoch": 4295} {"train_loss": -26.026647567749023, "global_step": 356510, "epoch": 4295} {"train_loss": -26.17926597595215, "global_step": 356511, "epoch": 4295} {"train_loss": -25.889387130737305, "global_step": 356512, "epoch": 4295} {"train_loss": -26.17530632019043, "global_step": 356513, "epoch": 4295} {"train_loss": -25.783811569213867, "global_step": 356514, "epoch": 4295} {"train_loss": -25.80570411682129, "global_step": 356515, "epoch": 4295} {"train_loss": -25.573266983032227, "global_step": 356516, "epoch": 4295} {"train_loss": -26.039159774780273, "global_step": 356517, "epoch": 4295} {"train_loss": -26.437915802001953, "global_step": 356518, "epoch": 4295} {"train_loss": -25.90424919128418, "global_step": 356519, "epoch": 4295} {"train_loss": -25.766630172729492, "global_step": 356520, "epoch": 4295} {"train_loss": -25.875350952148438, "global_step": 356521, "epoch": 4295} {"train_loss": -26.08281898498535, "global_step": 356522, "epoch": 4295} {"train_loss": -26.408660888671875, "global_step": 356523, "epoch": 4295} {"train_loss": -26.3471736907959, "global_step": 356524, "epoch": 4295} {"train_loss": -25.99065589904785, "global_step": 356525, "epoch": 4295} {"train_loss": -26.04612159729004, "global_step": 356526, "epoch": 4295} {"train_loss": -26.647491455078125, "global_step": 356527, "epoch": 4295} {"train_loss": -26.124353408813477, "global_step": 356528, "epoch": 4295} {"train_loss": -26.03338050842285, "global_step": 356529, "epoch": 4295} {"train_loss": -26.56223487854004, "global_step": 356530, "epoch": 4295} {"train_loss": -26.34443473815918, "global_step": 356531, "epoch": 4295} {"train_loss": -26.108346939086914, "global_step": 356532, "epoch": 4295} {"train_loss": -26.388044357299805, "global_step": 356533, "epoch": 4295} {"train_loss": -26.152099609375, "global_step": 356534, "epoch": 4295} {"train_loss": -26.4434757232666, "global_step": 356535, "epoch": 4295} {"train_loss": -26.32964515686035, "global_step": 356536, "epoch": 4295} {"train_loss": -26.4322509765625, "global_step": 356537, "epoch": 4295} {"train_loss": -25.911848068237305, "global_step": 356538, "epoch": 4295} {"train_loss": -26.0943660736084, "global_step": 356539, "epoch": 4295} {"train_loss": -26.593610763549805, "global_step": 356540, "epoch": 4295} {"train_loss": -26.5052490234375, "global_step": 356541, "epoch": 4295} {"train_loss": -26.52414321899414, "global_step": 356542, "epoch": 4295} {"train_loss": -26.43998146057129, "global_step": 356543, "epoch": 4295} {"train_loss": -26.402206420898438, "global_step": 356544, "epoch": 4295} {"train_loss": -26.533029556274414, "global_step": 356545, "epoch": 4295} {"train_loss": -26.684988021850586, "global_step": 356546, "epoch": 4295} {"train_loss": -26.02457618713379, "global_step": 356547, "epoch": 4295} {"train_loss": -26.153669357299805, "global_step": 356548, "epoch": 4295} {"train_loss": -26.16189956665039, "global_step": 356549, "epoch": 4295} {"train_loss": -26.0205078125, "global_step": 356550, "epoch": 4295} {"train_loss": -26.282974243164062, "global_step": 356551, "epoch": 4295} {"train_loss": -26.15879249572754, "global_step": 356552, "epoch": 4295} {"train_loss": -26.27984046936035, "global_step": 356553, "epoch": 4295} {"train_loss": -26.15456199645996, "global_step": 356554, "epoch": 4295} {"train_loss": -25.6989688873291, "global_step": 356555, "epoch": 4295} {"train_loss": -25.06719398498535, "global_step": 356556, "epoch": 4295} {"train_loss": -25.012998580932617, "global_step": 356557, "epoch": 4295} {"train_loss": -25.129825592041016, "global_step": 356558, "epoch": 4295} {"train_loss": -26.016498565673828, "global_step": 356559, "epoch": 4295} {"train_loss": -25.95685386657715, "global_step": 356560, "epoch": 4295} {"train_loss": -25.878087997436523, "global_step": 356561, "epoch": 4295} {"train_loss": -25.613428115844727, "global_step": 356562, "epoch": 4295} {"train_loss": -26.178815841674805, "global_step": 356563, "epoch": 4295} {"train_loss": -25.321487426757812, "global_step": 356564, "epoch": 4295} {"train_loss": -25.9283390045166, "global_step": 356565, "epoch": 4295} {"train_loss": -25.66485595703125, "global_step": 356566, "epoch": 4295} {"train_loss": -25.931115299822338, "global_step": 356567, "epoch": 4295, "val_loss": 6617669.0} {"train_loss": -25.000579833984375, "global_step": 356568, "epoch": 4296} {"train_loss": -25.314794540405273, "global_step": 356569, "epoch": 4296} {"train_loss": -24.9836368560791, "global_step": 356570, "epoch": 4296} {"train_loss": -25.400365829467773, "global_step": 356571, "epoch": 4296} {"train_loss": -25.287961959838867, "global_step": 356572, "epoch": 4296} {"train_loss": -25.633502960205078, "global_step": 356573, "epoch": 4296} {"train_loss": -25.354860305786133, "global_step": 356574, "epoch": 4296} {"train_loss": -25.710296630859375, "global_step": 356575, "epoch": 4296} {"train_loss": -25.724340438842773, "global_step": 356576, "epoch": 4296} {"train_loss": -25.822158813476562, "global_step": 356577, "epoch": 4296} {"train_loss": -25.69202995300293, "global_step": 356578, "epoch": 4296} {"train_loss": -25.56940269470215, "global_step": 356579, "epoch": 4296} {"train_loss": -25.73602294921875, "global_step": 356580, "epoch": 4296} {"train_loss": -25.8701114654541, "global_step": 356581, "epoch": 4296} {"train_loss": -25.923986434936523, "global_step": 356582, "epoch": 4296} {"train_loss": -25.80292320251465, "global_step": 356583, "epoch": 4296} {"train_loss": -25.706497192382812, "global_step": 356584, "epoch": 4296} {"train_loss": -25.847028732299805, "global_step": 356585, "epoch": 4296} {"train_loss": -26.128690719604492, "global_step": 356586, "epoch": 4296} {"train_loss": -25.993860244750977, "global_step": 356587, "epoch": 4296} {"train_loss": -26.159027099609375, "global_step": 356588, "epoch": 4296} {"train_loss": -26.219009399414062, "global_step": 356589, "epoch": 4296} {"train_loss": -26.157825469970703, "global_step": 356590, "epoch": 4296} {"train_loss": -26.099456787109375, "global_step": 356591, "epoch": 4296} {"train_loss": -26.155237197875977, "global_step": 356592, "epoch": 4296} {"train_loss": -26.011219024658203, "global_step": 356593, "epoch": 4296} {"train_loss": -25.93372917175293, "global_step": 356594, "epoch": 4296} {"train_loss": -26.20654296875, "global_step": 356595, "epoch": 4296} {"train_loss": -26.33233070373535, "global_step": 356596, "epoch": 4296} {"train_loss": -26.273971557617188, "global_step": 356597, "epoch": 4296} {"train_loss": -26.41145133972168, "global_step": 356598, "epoch": 4296} {"train_loss": -26.363677978515625, "global_step": 356599, "epoch": 4296} {"train_loss": -26.248838424682617, "global_step": 356600, "epoch": 4296} {"train_loss": -26.197330474853516, "global_step": 356601, "epoch": 4296} {"train_loss": -26.452306747436523, "global_step": 356602, "epoch": 4296} {"train_loss": -26.644367218017578, "global_step": 356603, "epoch": 4296} {"train_loss": -26.170751571655273, "global_step": 356604, "epoch": 4296} {"train_loss": -26.155792236328125, "global_step": 356605, "epoch": 4296} {"train_loss": -26.686986923217773, "global_step": 356606, "epoch": 4296} {"train_loss": -26.506397247314453, "global_step": 356607, "epoch": 4296} {"train_loss": -26.633283615112305, "global_step": 356608, "epoch": 4296} {"train_loss": -26.1645450592041, "global_step": 356609, "epoch": 4296} {"train_loss": -26.34235954284668, "global_step": 356610, "epoch": 4296} {"train_loss": -26.457401275634766, "global_step": 356611, "epoch": 4296} {"train_loss": -26.39924430847168, "global_step": 356612, "epoch": 4296} {"train_loss": -25.739948272705078, "global_step": 356613, "epoch": 4296} {"train_loss": -25.976293563842773, "global_step": 356614, "epoch": 4296} {"train_loss": -26.397653579711914, "global_step": 356615, "epoch": 4296} {"train_loss": -26.390827178955078, "global_step": 356616, "epoch": 4296} {"train_loss": -25.98923110961914, "global_step": 356617, "epoch": 4296} {"train_loss": -25.811477661132812, "global_step": 356618, "epoch": 4296} {"train_loss": -25.999744415283203, "global_step": 356619, "epoch": 4296} {"train_loss": -26.434890747070312, "global_step": 356620, "epoch": 4296} {"train_loss": -25.68340492248535, "global_step": 356621, "epoch": 4296} {"train_loss": -25.96409034729004, "global_step": 356622, "epoch": 4296} {"train_loss": -25.9438533782959, "global_step": 356623, "epoch": 4296} {"train_loss": -26.2076473236084, "global_step": 356624, "epoch": 4296} {"train_loss": -26.43033790588379, "global_step": 356625, "epoch": 4296} {"train_loss": -26.29014015197754, "global_step": 356626, "epoch": 4296} {"train_loss": -26.1113338470459, "global_step": 356627, "epoch": 4296} {"train_loss": -26.44256591796875, "global_step": 356628, "epoch": 4296} {"train_loss": -26.05181312561035, "global_step": 356629, "epoch": 4296} {"train_loss": -26.366159439086914, "global_step": 356630, "epoch": 4296} {"train_loss": -26.26126480102539, "global_step": 356631, "epoch": 4296} {"train_loss": -26.323043823242188, "global_step": 356632, "epoch": 4296} {"train_loss": -26.20804214477539, "global_step": 356633, "epoch": 4296} {"train_loss": -26.334516525268555, "global_step": 356634, "epoch": 4296} {"train_loss": -26.30164909362793, "global_step": 356635, "epoch": 4296} {"train_loss": -26.22021484375, "global_step": 356636, "epoch": 4296} {"train_loss": -26.342559814453125, "global_step": 356637, "epoch": 4296} {"train_loss": -26.39528465270996, "global_step": 356638, "epoch": 4296} {"train_loss": -26.54096794128418, "global_step": 356639, "epoch": 4296} {"train_loss": -26.274877548217773, "global_step": 356640, "epoch": 4296} {"train_loss": -26.07977294921875, "global_step": 356641, "epoch": 4296} {"train_loss": -26.170629501342773, "global_step": 356642, "epoch": 4296} {"train_loss": -26.166259765625, "global_step": 356643, "epoch": 4296} {"train_loss": -26.151824951171875, "global_step": 356644, "epoch": 4296} {"train_loss": -26.130537033081055, "global_step": 356645, "epoch": 4296} {"train_loss": -26.4273681640625, "global_step": 356646, "epoch": 4296} {"train_loss": -26.010568618774414, "global_step": 356647, "epoch": 4296} {"train_loss": -26.673004150390625, "global_step": 356648, "epoch": 4296} {"train_loss": -26.135839462280273, "global_step": 356649, "epoch": 4296} {"train_loss": -26.075546586369892, "global_step": 356650, "epoch": 4296, "val_loss": 6617935.0} {"train_loss": -25.617603302001953, "global_step": 356651, "epoch": 4297} {"train_loss": -25.40132713317871, "global_step": 356652, "epoch": 4297} {"train_loss": -24.56174659729004, "global_step": 356653, "epoch": 4297} {"train_loss": -25.209609985351562, "global_step": 356654, "epoch": 4297} {"train_loss": -25.784015655517578, "global_step": 356655, "epoch": 4297} {"train_loss": -24.67906951904297, "global_step": 356656, "epoch": 4297} {"train_loss": -25.56048583984375, "global_step": 356657, "epoch": 4297} {"train_loss": -25.21709632873535, "global_step": 356658, "epoch": 4297} {"train_loss": -25.523900985717773, "global_step": 356659, "epoch": 4297} {"train_loss": -25.514137268066406, "global_step": 356660, "epoch": 4297} {"train_loss": -25.02569007873535, "global_step": 356661, "epoch": 4297} {"train_loss": -25.511524200439453, "global_step": 356662, "epoch": 4297} {"train_loss": -25.757862091064453, "global_step": 356663, "epoch": 4297} {"train_loss": -25.55889892578125, "global_step": 356664, "epoch": 4297} {"train_loss": -25.55683708190918, "global_step": 356665, "epoch": 4297} {"train_loss": -25.631025314331055, "global_step": 356666, "epoch": 4297} {"train_loss": -25.534109115600586, "global_step": 356667, "epoch": 4297} {"train_loss": -26.044422149658203, "global_step": 356668, "epoch": 4297} {"train_loss": -26.0594425201416, "global_step": 356669, "epoch": 4297} {"train_loss": -25.8260440826416, "global_step": 356670, "epoch": 4297} {"train_loss": -25.954587936401367, "global_step": 356671, "epoch": 4297} {"train_loss": -25.99153709411621, "global_step": 356672, "epoch": 4297} {"train_loss": -25.76148796081543, "global_step": 356673, "epoch": 4297} {"train_loss": -26.063358306884766, "global_step": 356674, "epoch": 4297} {"train_loss": -26.278491973876953, "global_step": 356675, "epoch": 4297} {"train_loss": -25.52984046936035, "global_step": 356676, "epoch": 4297} {"train_loss": -26.069122314453125, "global_step": 356677, "epoch": 4297} {"train_loss": -26.0124454498291, "global_step": 356678, "epoch": 4297} {"train_loss": -25.827625274658203, "global_step": 356679, "epoch": 4297} {"train_loss": -26.410175323486328, "global_step": 356680, "epoch": 4297} {"train_loss": -26.0465087890625, "global_step": 356681, "epoch": 4297} {"train_loss": -26.196578979492188, "global_step": 356682, "epoch": 4297} {"train_loss": -26.063831329345703, "global_step": 356683, "epoch": 4297} {"train_loss": -26.622098922729492, "global_step": 356684, "epoch": 4297} {"train_loss": -26.17005729675293, "global_step": 356685, "epoch": 4297} {"train_loss": -26.496307373046875, "global_step": 356686, "epoch": 4297} {"train_loss": -26.02191162109375, "global_step": 356687, "epoch": 4297} {"train_loss": -26.201934814453125, "global_step": 356688, "epoch": 4297} {"train_loss": -26.15082359313965, "global_step": 356689, "epoch": 4297} {"train_loss": -26.400068283081055, "global_step": 356690, "epoch": 4297} {"train_loss": -26.272754669189453, "global_step": 356691, "epoch": 4297} {"train_loss": -26.447851181030273, "global_step": 356692, "epoch": 4297} {"train_loss": -26.614221572875977, "global_step": 356693, "epoch": 4297} {"train_loss": -26.400854110717773, "global_step": 356694, "epoch": 4297} {"train_loss": -26.408430099487305, "global_step": 356695, "epoch": 4297} {"train_loss": -26.380115509033203, "global_step": 356696, "epoch": 4297} {"train_loss": -26.31431007385254, "global_step": 356697, "epoch": 4297} {"train_loss": -26.49622917175293, "global_step": 356698, "epoch": 4297} {"train_loss": -26.059253692626953, "global_step": 356699, "epoch": 4297} {"train_loss": -26.31902503967285, "global_step": 356700, "epoch": 4297} {"train_loss": -26.496068954467773, "global_step": 356701, "epoch": 4297} {"train_loss": -26.442846298217773, "global_step": 356702, "epoch": 4297} {"train_loss": -26.340723037719727, "global_step": 356703, "epoch": 4297} {"train_loss": -26.320470809936523, "global_step": 356704, "epoch": 4297} {"train_loss": -26.1119441986084, "global_step": 356705, "epoch": 4297} {"train_loss": -26.027318954467773, "global_step": 356706, "epoch": 4297} {"train_loss": -26.215717315673828, "global_step": 356707, "epoch": 4297} {"train_loss": -25.98664665222168, "global_step": 356708, "epoch": 4297} {"train_loss": -25.95733642578125, "global_step": 356709, "epoch": 4297} {"train_loss": -26.5075626373291, "global_step": 356710, "epoch": 4297} {"train_loss": -26.430255889892578, "global_step": 356711, "epoch": 4297} {"train_loss": -26.38348388671875, "global_step": 356712, "epoch": 4297} {"train_loss": -26.65884780883789, "global_step": 356713, "epoch": 4297} {"train_loss": -26.5026798248291, "global_step": 356714, "epoch": 4297} {"train_loss": -26.361133575439453, "global_step": 356715, "epoch": 4297} {"train_loss": -26.127161026000977, "global_step": 356716, "epoch": 4297} {"train_loss": -26.21523094177246, "global_step": 356717, "epoch": 4297} {"train_loss": -26.27459144592285, "global_step": 356718, "epoch": 4297} {"train_loss": -26.454248428344727, "global_step": 356719, "epoch": 4297} {"train_loss": -26.771392822265625, "global_step": 356720, "epoch": 4297} {"train_loss": -26.330839157104492, "global_step": 356721, "epoch": 4297} {"train_loss": -26.290815353393555, "global_step": 356722, "epoch": 4297} {"train_loss": -26.314697265625, "global_step": 356723, "epoch": 4297} {"train_loss": -26.617273330688477, "global_step": 356724, "epoch": 4297} {"train_loss": -26.50372886657715, "global_step": 356725, "epoch": 4297} {"train_loss": -26.22749137878418, "global_step": 356726, "epoch": 4297} {"train_loss": -26.444869995117188, "global_step": 356727, "epoch": 4297} {"train_loss": -26.670867919921875, "global_step": 356728, "epoch": 4297} {"train_loss": -26.36447525024414, "global_step": 356729, "epoch": 4297} {"train_loss": -26.685888290405273, "global_step": 356730, "epoch": 4297} {"train_loss": -26.1290340423584, "global_step": 356731, "epoch": 4297} {"train_loss": -25.981603622436523, "global_step": 356732, "epoch": 4297} {"train_loss": -26.07837663213891, "global_step": 356733, "epoch": 4297, "val_loss": 6654008.5} {"train_loss": -25.838809967041016, "global_step": 356734, "epoch": 4298} {"train_loss": -25.984647750854492, "global_step": 356735, "epoch": 4298} {"train_loss": -24.84452247619629, "global_step": 356736, "epoch": 4298} {"train_loss": -25.11179542541504, "global_step": 356737, "epoch": 4298} {"train_loss": -25.84097671508789, "global_step": 356738, "epoch": 4298} {"train_loss": -25.8570499420166, "global_step": 356739, "epoch": 4298} {"train_loss": -25.6709041595459, "global_step": 356740, "epoch": 4298} {"train_loss": -25.689252853393555, "global_step": 356741, "epoch": 4298} {"train_loss": -25.4862003326416, "global_step": 356742, "epoch": 4298} {"train_loss": -26.045942306518555, "global_step": 356743, "epoch": 4298} {"train_loss": -26.04184913635254, "global_step": 356744, "epoch": 4298} {"train_loss": -25.91278648376465, "global_step": 356745, "epoch": 4298} {"train_loss": -25.829858779907227, "global_step": 356746, "epoch": 4298} {"train_loss": -25.753942489624023, "global_step": 356747, "epoch": 4298} {"train_loss": -25.78912925720215, "global_step": 356748, "epoch": 4298} {"train_loss": -26.26142692565918, "global_step": 356749, "epoch": 4298} {"train_loss": -26.22303581237793, "global_step": 356750, "epoch": 4298} {"train_loss": -26.00766372680664, "global_step": 356751, "epoch": 4298} {"train_loss": -26.05364418029785, "global_step": 356752, "epoch": 4298} {"train_loss": -26.351337432861328, "global_step": 356753, "epoch": 4298} {"train_loss": -26.010528564453125, "global_step": 356754, "epoch": 4298} {"train_loss": -25.82166862487793, "global_step": 356755, "epoch": 4298} {"train_loss": -26.059528350830078, "global_step": 356756, "epoch": 4298} {"train_loss": -26.03850746154785, "global_step": 356757, "epoch": 4298} {"train_loss": -26.100255966186523, "global_step": 356758, "epoch": 4298} {"train_loss": -25.936298370361328, "global_step": 356759, "epoch": 4298} {"train_loss": -26.076465606689453, "global_step": 356760, "epoch": 4298} {"train_loss": -26.0661563873291, "global_step": 356761, "epoch": 4298} {"train_loss": -25.938400268554688, "global_step": 356762, "epoch": 4298} {"train_loss": -26.02480125427246, "global_step": 356763, "epoch": 4298} {"train_loss": -26.35755729675293, "global_step": 356764, "epoch": 4298} {"train_loss": -25.98981285095215, "global_step": 356765, "epoch": 4298} {"train_loss": -26.078399658203125, "global_step": 356766, "epoch": 4298} {"train_loss": -25.976842880249023, "global_step": 356767, "epoch": 4298} {"train_loss": -26.21224021911621, "global_step": 356768, "epoch": 4298} {"train_loss": -26.464313507080078, "global_step": 356769, "epoch": 4298} {"train_loss": -26.34173583984375, "global_step": 356770, "epoch": 4298} {"train_loss": -26.49538230895996, "global_step": 356771, "epoch": 4298} {"train_loss": -26.321863174438477, "global_step": 356772, "epoch": 4298} {"train_loss": -26.2268009185791, "global_step": 356773, "epoch": 4298} {"train_loss": -26.4115047454834, "global_step": 356774, "epoch": 4298} {"train_loss": -26.148405075073242, "global_step": 356775, "epoch": 4298} {"train_loss": -26.110849380493164, "global_step": 356776, "epoch": 4298} {"train_loss": -26.295486450195312, "global_step": 356777, "epoch": 4298} {"train_loss": -25.999128341674805, "global_step": 356778, "epoch": 4298} {"train_loss": -26.307748794555664, "global_step": 356779, "epoch": 4298} {"train_loss": -26.22429847717285, "global_step": 356780, "epoch": 4298} {"train_loss": -26.01690673828125, "global_step": 356781, "epoch": 4298} {"train_loss": -26.154693603515625, "global_step": 356782, "epoch": 4298} {"train_loss": -26.5878963470459, "global_step": 356783, "epoch": 4298} {"train_loss": -26.30732536315918, "global_step": 356784, "epoch": 4298} {"train_loss": -26.2514591217041, "global_step": 356785, "epoch": 4298} {"train_loss": -26.147287368774414, "global_step": 356786, "epoch": 4298} {"train_loss": -26.251394271850586, "global_step": 356787, "epoch": 4298} {"train_loss": -26.122669219970703, "global_step": 356788, "epoch": 4298} {"train_loss": -26.58253288269043, "global_step": 356789, "epoch": 4298} {"train_loss": -26.303762435913086, "global_step": 356790, "epoch": 4298} {"train_loss": -26.58582878112793, "global_step": 356791, "epoch": 4298} {"train_loss": -26.09175682067871, "global_step": 356792, "epoch": 4298} {"train_loss": -26.35308265686035, "global_step": 356793, "epoch": 4298} {"train_loss": -26.599592208862305, "global_step": 356794, "epoch": 4298} {"train_loss": -26.094308853149414, "global_step": 356795, "epoch": 4298} {"train_loss": -26.11701011657715, "global_step": 356796, "epoch": 4298} {"train_loss": -26.10651206970215, "global_step": 356797, "epoch": 4298} {"train_loss": -26.393310546875, "global_step": 356798, "epoch": 4298} {"train_loss": -25.868261337280273, "global_step": 356799, "epoch": 4298} {"train_loss": -25.827783584594727, "global_step": 356800, "epoch": 4298} {"train_loss": -25.659574508666992, "global_step": 356801, "epoch": 4298} {"train_loss": -26.179203033447266, "global_step": 356802, "epoch": 4298} {"train_loss": -26.0561580657959, "global_step": 356803, "epoch": 4298} {"train_loss": -25.864582061767578, "global_step": 356804, "epoch": 4298} {"train_loss": -26.038116455078125, "global_step": 356805, "epoch": 4298} {"train_loss": -26.04168128967285, "global_step": 356806, "epoch": 4298} {"train_loss": -25.738061904907227, "global_step": 356807, "epoch": 4298} {"train_loss": -26.300012588500977, "global_step": 356808, "epoch": 4298} {"train_loss": -26.113605499267578, "global_step": 356809, "epoch": 4298} {"train_loss": -26.075727462768555, "global_step": 356810, "epoch": 4298} {"train_loss": -26.288711547851562, "global_step": 356811, "epoch": 4298} {"train_loss": -26.584516525268555, "global_step": 356812, "epoch": 4298} {"train_loss": -26.43018913269043, "global_step": 356813, "epoch": 4298} {"train_loss": -26.4047794342041, "global_step": 356814, "epoch": 4298} {"train_loss": -26.245712280273438, "global_step": 356815, "epoch": 4298} {"train_loss": -26.082599180290497, "global_step": 356816, "epoch": 4298, "val_loss": 6666513.0} {"train_loss": -25.58704948425293, "global_step": 356817, "epoch": 4299} {"train_loss": -25.749521255493164, "global_step": 356818, "epoch": 4299} {"train_loss": -25.581222534179688, "global_step": 356819, "epoch": 4299} {"train_loss": -25.49967384338379, "global_step": 356820, "epoch": 4299} {"train_loss": -26.088871002197266, "global_step": 356821, "epoch": 4299} {"train_loss": -25.91926383972168, "global_step": 356822, "epoch": 4299} {"train_loss": -25.947858810424805, "global_step": 356823, "epoch": 4299} {"train_loss": -25.9489803314209, "global_step": 356824, "epoch": 4299} {"train_loss": -26.135046005249023, "global_step": 356825, "epoch": 4299} {"train_loss": -25.696584701538086, "global_step": 356826, "epoch": 4299} {"train_loss": -26.0659236907959, "global_step": 356827, "epoch": 4299} {"train_loss": -26.097442626953125, "global_step": 356828, "epoch": 4299} {"train_loss": -26.434951782226562, "global_step": 356829, "epoch": 4299} {"train_loss": -25.982833862304688, "global_step": 356830, "epoch": 4299} {"train_loss": -26.49127197265625, "global_step": 356831, "epoch": 4299} {"train_loss": -26.16940689086914, "global_step": 356832, "epoch": 4299} {"train_loss": -26.190265655517578, "global_step": 356833, "epoch": 4299} {"train_loss": -26.275970458984375, "global_step": 356834, "epoch": 4299} {"train_loss": -25.914264678955078, "global_step": 356835, "epoch": 4299} {"train_loss": -26.304340362548828, "global_step": 356836, "epoch": 4299} {"train_loss": -26.3313045501709, "global_step": 356837, "epoch": 4299} {"train_loss": -25.973285675048828, "global_step": 356838, "epoch": 4299} {"train_loss": -26.417179107666016, "global_step": 356839, "epoch": 4299} {"train_loss": -26.43867301940918, "global_step": 356840, "epoch": 4299} {"train_loss": -26.368671417236328, "global_step": 356841, "epoch": 4299} {"train_loss": -26.40572166442871, "global_step": 356842, "epoch": 4299} {"train_loss": -26.534082412719727, "global_step": 356843, "epoch": 4299} {"train_loss": -26.24979019165039, "global_step": 356844, "epoch": 4299} {"train_loss": -26.401315689086914, "global_step": 356845, "epoch": 4299} {"train_loss": -26.179550170898438, "global_step": 356846, "epoch": 4299} {"train_loss": -26.227127075195312, "global_step": 356847, "epoch": 4299} {"train_loss": -26.781238555908203, "global_step": 356848, "epoch": 4299} {"train_loss": -26.260406494140625, "global_step": 356849, "epoch": 4299} {"train_loss": -26.581836700439453, "global_step": 356850, "epoch": 4299} {"train_loss": -26.216415405273438, "global_step": 356851, "epoch": 4299} {"train_loss": -26.228979110717773, "global_step": 356852, "epoch": 4299} {"train_loss": -26.728429794311523, "global_step": 356853, "epoch": 4299} {"train_loss": -26.214975357055664, "global_step": 356854, "epoch": 4299} {"train_loss": -26.082324981689453, "global_step": 356855, "epoch": 4299} {"train_loss": -26.197036743164062, "global_step": 356856, "epoch": 4299} {"train_loss": -26.319021224975586, "global_step": 356857, "epoch": 4299} {"train_loss": -26.352834701538086, "global_step": 356858, "epoch": 4299} {"train_loss": -26.24240493774414, "global_step": 356859, "epoch": 4299} {"train_loss": -26.02109146118164, "global_step": 356860, "epoch": 4299} {"train_loss": -25.63433265686035, "global_step": 356861, "epoch": 4299} {"train_loss": -26.373701095581055, "global_step": 356862, "epoch": 4299} {"train_loss": -26.431781768798828, "global_step": 356863, "epoch": 4299} {"train_loss": -26.017065048217773, "global_step": 356864, "epoch": 4299} {"train_loss": -26.35231590270996, "global_step": 356865, "epoch": 4299} {"train_loss": -26.18147087097168, "global_step": 356866, "epoch": 4299} {"train_loss": -25.578205108642578, "global_step": 356867, "epoch": 4299} {"train_loss": -25.955524444580078, "global_step": 356868, "epoch": 4299} {"train_loss": -25.72334098815918, "global_step": 356869, "epoch": 4299} {"train_loss": -26.07526206970215, "global_step": 356870, "epoch": 4299} {"train_loss": -25.85273551940918, "global_step": 356871, "epoch": 4299} {"train_loss": -26.066614151000977, "global_step": 356872, "epoch": 4299} {"train_loss": -26.104307174682617, "global_step": 356873, "epoch": 4299} {"train_loss": -25.963245391845703, "global_step": 356874, "epoch": 4299} {"train_loss": -26.095029830932617, "global_step": 356875, "epoch": 4299} {"train_loss": -25.72757911682129, "global_step": 356876, "epoch": 4299} {"train_loss": -26.190750122070312, "global_step": 356877, "epoch": 4299} {"train_loss": -25.973663330078125, "global_step": 356878, "epoch": 4299} {"train_loss": -26.03721046447754, "global_step": 356879, "epoch": 4299} {"train_loss": -26.195783615112305, "global_step": 356880, "epoch": 4299} {"train_loss": -25.936542510986328, "global_step": 356881, "epoch": 4299} {"train_loss": -26.153318405151367, "global_step": 356882, "epoch": 4299} {"train_loss": -26.450780868530273, "global_step": 356883, "epoch": 4299} {"train_loss": -26.181421279907227, "global_step": 356884, "epoch": 4299} {"train_loss": -26.255615234375, "global_step": 356885, "epoch": 4299} {"train_loss": -26.160123825073242, "global_step": 356886, "epoch": 4299} {"train_loss": -26.280195236206055, "global_step": 356887, "epoch": 4299} {"train_loss": -25.994739532470703, "global_step": 356888, "epoch": 4299} {"train_loss": -26.237913131713867, "global_step": 356889, "epoch": 4299} {"train_loss": -26.275846481323242, "global_step": 356890, "epoch": 4299} {"train_loss": -26.140859603881836, "global_step": 356891, "epoch": 4299} {"train_loss": -26.076404571533203, "global_step": 356892, "epoch": 4299} {"train_loss": -26.2919864654541, "global_step": 356893, "epoch": 4299} {"train_loss": -26.33367347717285, "global_step": 356894, "epoch": 4299} {"train_loss": -26.230382919311523, "global_step": 356895, "epoch": 4299} {"train_loss": -26.059614181518555, "global_step": 356896, "epoch": 4299} {"train_loss": -26.401487350463867, "global_step": 356897, "epoch": 4299} {"train_loss": -26.64932632446289, "global_step": 356898, "epoch": 4299} {"train_loss": -26.16081194130771, "global_step": 356899, "epoch": 4299, "val_loss": 6628286.0} {"train_loss": -26.481464385986328, "global_step": 356900, "epoch": 4300} {"train_loss": -26.091663360595703, "global_step": 356901, "epoch": 4300} {"train_loss": -26.197351455688477, "global_step": 356902, "epoch": 4300} {"train_loss": -25.7735538482666, "global_step": 356903, "epoch": 4300} {"train_loss": -26.446186065673828, "global_step": 356904, "epoch": 4300} {"train_loss": -26.031293869018555, "global_step": 356905, "epoch": 4300} {"train_loss": -26.388959884643555, "global_step": 356906, "epoch": 4300} {"train_loss": -26.018774032592773, "global_step": 356907, "epoch": 4300} {"train_loss": -26.127927780151367, "global_step": 356908, "epoch": 4300} {"train_loss": -26.073755264282227, "global_step": 356909, "epoch": 4300} {"train_loss": -26.53192710876465, "global_step": 356910, "epoch": 4300} {"train_loss": -26.39681053161621, "global_step": 356911, "epoch": 4300} {"train_loss": -26.171972274780273, "global_step": 356912, "epoch": 4300} {"train_loss": -26.294921875, "global_step": 356913, "epoch": 4300} {"train_loss": -26.683521270751953, "global_step": 356914, "epoch": 4300} {"train_loss": -26.50751304626465, "global_step": 356915, "epoch": 4300} {"train_loss": -26.56476402282715, "global_step": 356916, "epoch": 4300} {"train_loss": -26.49786376953125, "global_step": 356917, "epoch": 4300} {"train_loss": -26.46100425720215, "global_step": 356918, "epoch": 4300} {"train_loss": -26.590429306030273, "global_step": 356919, "epoch": 4300} {"train_loss": -26.3874454498291, "global_step": 356920, "epoch": 4300} {"train_loss": -26.04657554626465, "global_step": 356921, "epoch": 4300} {"train_loss": -25.9387264251709, "global_step": 356922, "epoch": 4300} {"train_loss": -26.133874893188477, "global_step": 356923, "epoch": 4300} {"train_loss": -25.69952392578125, "global_step": 356924, "epoch": 4300} {"train_loss": -24.792327880859375, "global_step": 356925, "epoch": 4300} {"train_loss": -25.655975341796875, "global_step": 356926, "epoch": 4300} {"train_loss": -26.11345863342285, "global_step": 356927, "epoch": 4300} {"train_loss": -25.329557418823242, "global_step": 356928, "epoch": 4300} {"train_loss": -24.74903678894043, "global_step": 356929, "epoch": 4300} {"train_loss": -25.612796783447266, "global_step": 356930, "epoch": 4300} {"train_loss": -25.656522750854492, "global_step": 356931, "epoch": 4300} {"train_loss": -25.667688369750977, "global_step": 356932, "epoch": 4300} {"train_loss": -25.531475067138672, "global_step": 356933, "epoch": 4300} {"train_loss": -25.77522087097168, "global_step": 356934, "epoch": 4300} {"train_loss": -25.253833770751953, "global_step": 356935, "epoch": 4300} {"train_loss": -25.283872604370117, "global_step": 356936, "epoch": 4300} {"train_loss": -25.557037353515625, "global_step": 356937, "epoch": 4300} {"train_loss": -25.95819664001465, "global_step": 356938, "epoch": 4300} {"train_loss": -25.460857391357422, "global_step": 356939, "epoch": 4300} {"train_loss": -25.968469619750977, "global_step": 356940, "epoch": 4300} {"train_loss": -25.637556076049805, "global_step": 356941, "epoch": 4300} {"train_loss": -25.797178268432617, "global_step": 356942, "epoch": 4300} {"train_loss": -25.614791870117188, "global_step": 356943, "epoch": 4300} {"train_loss": -25.853763580322266, "global_step": 356944, "epoch": 4300} {"train_loss": -26.125091552734375, "global_step": 356945, "epoch": 4300} {"train_loss": -25.92121696472168, "global_step": 356946, "epoch": 4300} {"train_loss": -25.83353042602539, "global_step": 356947, "epoch": 4300} {"train_loss": -26.209381103515625, "global_step": 356948, "epoch": 4300} {"train_loss": -25.540685653686523, "global_step": 356949, "epoch": 4300} {"train_loss": -26.146194458007812, "global_step": 356950, "epoch": 4300} {"train_loss": -26.026525497436523, "global_step": 356951, "epoch": 4300} {"train_loss": -26.06083106994629, "global_step": 356952, "epoch": 4300} {"train_loss": -25.91554069519043, "global_step": 356953, "epoch": 4300} {"train_loss": -26.04483985900879, "global_step": 356954, "epoch": 4300} {"train_loss": -26.23048973083496, "global_step": 356955, "epoch": 4300} {"train_loss": -26.5690860748291, "global_step": 356956, "epoch": 4300} {"train_loss": -26.31096839904785, "global_step": 356957, "epoch": 4300} {"train_loss": -26.26316261291504, "global_step": 356958, "epoch": 4300} {"train_loss": -26.55750846862793, "global_step": 356959, "epoch": 4300} {"train_loss": -26.253137588500977, "global_step": 356960, "epoch": 4300} {"train_loss": -26.262298583984375, "global_step": 356961, "epoch": 4300} {"train_loss": -26.262653350830078, "global_step": 356962, "epoch": 4300} {"train_loss": -25.908863067626953, "global_step": 356963, "epoch": 4300} {"train_loss": -25.595401763916016, "global_step": 356964, "epoch": 4300} {"train_loss": -26.004785537719727, "global_step": 356965, "epoch": 4300} {"train_loss": -25.91143226623535, "global_step": 356966, "epoch": 4300} {"train_loss": -25.8132266998291, "global_step": 356967, "epoch": 4300} {"train_loss": -25.963882446289062, "global_step": 356968, "epoch": 4300} {"train_loss": -26.01869773864746, "global_step": 356969, "epoch": 4300} {"train_loss": -26.13105583190918, "global_step": 356970, "epoch": 4300} {"train_loss": -26.000858306884766, "global_step": 356971, "epoch": 4300} {"train_loss": -25.52497673034668, "global_step": 356972, "epoch": 4300} {"train_loss": -25.768192291259766, "global_step": 356973, "epoch": 4300} {"train_loss": -26.045080184936523, "global_step": 356974, "epoch": 4300} {"train_loss": -25.94661521911621, "global_step": 356975, "epoch": 4300} {"train_loss": -25.888086318969727, "global_step": 356976, "epoch": 4300} {"train_loss": -26.212656021118164, "global_step": 356977, "epoch": 4300} {"train_loss": -26.31888198852539, "global_step": 356978, "epoch": 4300} {"train_loss": -26.0495548248291, "global_step": 356979, "epoch": 4300} {"train_loss": -26.318267822265625, "global_step": 356980, "epoch": 4300} {"train_loss": -26.3322811126709, "global_step": 356981, "epoch": 4300} {"train_loss": -26.002605208431383, "global_step": 356982, "epoch": 4300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6605963.5} {"train_loss": -25.83213233947754, "global_step": 356983, "epoch": 4301} {"train_loss": -24.685400009155273, "global_step": 356984, "epoch": 4301} {"train_loss": -25.339017868041992, "global_step": 356985, "epoch": 4301} {"train_loss": -25.830799102783203, "global_step": 356986, "epoch": 4301} {"train_loss": -25.312286376953125, "global_step": 356987, "epoch": 4301} {"train_loss": -25.075748443603516, "global_step": 356988, "epoch": 4301} {"train_loss": -25.7210750579834, "global_step": 356989, "epoch": 4301} {"train_loss": -25.886886596679688, "global_step": 356990, "epoch": 4301} {"train_loss": -25.628950119018555, "global_step": 356991, "epoch": 4301} {"train_loss": -26.082294464111328, "global_step": 356992, "epoch": 4301} {"train_loss": -25.55921745300293, "global_step": 356993, "epoch": 4301} {"train_loss": -25.954511642456055, "global_step": 356994, "epoch": 4301} {"train_loss": -25.7353572845459, "global_step": 356995, "epoch": 4301} {"train_loss": -25.862232208251953, "global_step": 356996, "epoch": 4301} {"train_loss": -25.961515426635742, "global_step": 356997, "epoch": 4301} {"train_loss": -25.290456771850586, "global_step": 356998, "epoch": 4301} {"train_loss": -25.88993263244629, "global_step": 356999, "epoch": 4301} {"train_loss": -26.22173500061035, "global_step": 357000, "epoch": 4301} {"train_loss": -25.991928100585938, "global_step": 357001, "epoch": 4301} {"train_loss": -25.98193359375, "global_step": 357002, "epoch": 4301} {"train_loss": -25.959701538085938, "global_step": 357003, "epoch": 4301} {"train_loss": -26.290481567382812, "global_step": 357004, "epoch": 4301} {"train_loss": -26.32635498046875, "global_step": 357005, "epoch": 4301} {"train_loss": -26.248510360717773, "global_step": 357006, "epoch": 4301} {"train_loss": -26.297780990600586, "global_step": 357007, "epoch": 4301} {"train_loss": -26.001306533813477, "global_step": 357008, "epoch": 4301} {"train_loss": -25.867828369140625, "global_step": 357009, "epoch": 4301} {"train_loss": -26.31475830078125, "global_step": 357010, "epoch": 4301} {"train_loss": -25.941619873046875, "global_step": 357011, "epoch": 4301} {"train_loss": -26.130651473999023, "global_step": 357012, "epoch": 4301} {"train_loss": -26.125473022460938, "global_step": 357013, "epoch": 4301} {"train_loss": -26.592884063720703, "global_step": 357014, "epoch": 4301} {"train_loss": -26.260541915893555, "global_step": 357015, "epoch": 4301} {"train_loss": -26.37238883972168, "global_step": 357016, "epoch": 4301} {"train_loss": -26.30326271057129, "global_step": 357017, "epoch": 4301} {"train_loss": -26.565942764282227, "global_step": 357018, "epoch": 4301} {"train_loss": -26.424230575561523, "global_step": 357019, "epoch": 4301} {"train_loss": -26.51513671875, "global_step": 357020, "epoch": 4301} {"train_loss": -26.465076446533203, "global_step": 357021, "epoch": 4301} {"train_loss": -26.58795166015625, "global_step": 357022, "epoch": 4301} {"train_loss": -26.566272735595703, "global_step": 357023, "epoch": 4301} {"train_loss": -26.58991050720215, "global_step": 357024, "epoch": 4301} {"train_loss": -26.326135635375977, "global_step": 357025, "epoch": 4301} {"train_loss": -26.245655059814453, "global_step": 357026, "epoch": 4301} {"train_loss": -26.249120712280273, "global_step": 357027, "epoch": 4301} {"train_loss": -26.619062423706055, "global_step": 357028, "epoch": 4301} {"train_loss": -26.688491821289062, "global_step": 357029, "epoch": 4301} {"train_loss": -26.180917739868164, "global_step": 357030, "epoch": 4301} {"train_loss": -26.285892486572266, "global_step": 357031, "epoch": 4301} {"train_loss": -26.516508102416992, "global_step": 357032, "epoch": 4301} {"train_loss": -26.35410499572754, "global_step": 357033, "epoch": 4301} {"train_loss": -26.725177764892578, "global_step": 357034, "epoch": 4301} {"train_loss": -26.481521606445312, "global_step": 357035, "epoch": 4301} {"train_loss": -25.96112632751465, "global_step": 357036, "epoch": 4301} {"train_loss": -25.931127548217773, "global_step": 357037, "epoch": 4301} {"train_loss": -25.976581573486328, "global_step": 357038, "epoch": 4301} {"train_loss": -26.003753662109375, "global_step": 357039, "epoch": 4301} {"train_loss": -26.173505783081055, "global_step": 357040, "epoch": 4301} {"train_loss": -25.755634307861328, "global_step": 357041, "epoch": 4301} {"train_loss": -26.017663955688477, "global_step": 357042, "epoch": 4301} {"train_loss": -26.130701065063477, "global_step": 357043, "epoch": 4301} {"train_loss": -26.353544235229492, "global_step": 357044, "epoch": 4301} {"train_loss": -26.017486572265625, "global_step": 357045, "epoch": 4301} {"train_loss": -26.069379806518555, "global_step": 357046, "epoch": 4301} {"train_loss": -26.033308029174805, "global_step": 357047, "epoch": 4301} {"train_loss": -26.333066940307617, "global_step": 357048, "epoch": 4301} {"train_loss": -26.25894546508789, "global_step": 357049, "epoch": 4301} {"train_loss": -26.3603515625, "global_step": 357050, "epoch": 4301} {"train_loss": -26.050750732421875, "global_step": 357051, "epoch": 4301} {"train_loss": -25.992176055908203, "global_step": 357052, "epoch": 4301} {"train_loss": -26.022693634033203, "global_step": 357053, "epoch": 4301} {"train_loss": -26.091327667236328, "global_step": 357054, "epoch": 4301} {"train_loss": -25.847501754760742, "global_step": 357055, "epoch": 4301} {"train_loss": -26.6104793548584, "global_step": 357056, "epoch": 4301} {"train_loss": -26.33257484436035, "global_step": 357057, "epoch": 4301} {"train_loss": -26.31489372253418, "global_step": 357058, "epoch": 4301} {"train_loss": -26.296777725219727, "global_step": 357059, "epoch": 4301} {"train_loss": -26.31231117248535, "global_step": 357060, "epoch": 4301} {"train_loss": -26.316884994506836, "global_step": 357061, "epoch": 4301} {"train_loss": -26.38483238220215, "global_step": 357062, "epoch": 4301} {"train_loss": -26.295486450195312, "global_step": 357063, "epoch": 4301} {"train_loss": -26.177221298217773, "global_step": 357064, "epoch": 4301} {"train_loss": -26.1358504927302, "global_step": 357065, "epoch": 4301, "val_loss": 6564520.0} {"train_loss": -25.68770408630371, "global_step": 357066, "epoch": 4302} {"train_loss": -25.596935272216797, "global_step": 357067, "epoch": 4302} {"train_loss": -25.789670944213867, "global_step": 357068, "epoch": 4302} {"train_loss": -25.671545028686523, "global_step": 357069, "epoch": 4302} {"train_loss": -26.265539169311523, "global_step": 357070, "epoch": 4302} {"train_loss": -25.626678466796875, "global_step": 357071, "epoch": 4302} {"train_loss": -25.78891944885254, "global_step": 357072, "epoch": 4302} {"train_loss": -25.435930252075195, "global_step": 357073, "epoch": 4302} {"train_loss": -26.074995040893555, "global_step": 357074, "epoch": 4302} {"train_loss": -26.119186401367188, "global_step": 357075, "epoch": 4302} {"train_loss": -25.659866333007812, "global_step": 357076, "epoch": 4302} {"train_loss": -25.81355094909668, "global_step": 357077, "epoch": 4302} {"train_loss": -26.0295352935791, "global_step": 357078, "epoch": 4302} {"train_loss": -25.92209243774414, "global_step": 357079, "epoch": 4302} {"train_loss": -26.005767822265625, "global_step": 357080, "epoch": 4302} {"train_loss": -25.926116943359375, "global_step": 357081, "epoch": 4302} {"train_loss": -26.37946891784668, "global_step": 357082, "epoch": 4302} {"train_loss": -25.994482040405273, "global_step": 357083, "epoch": 4302} {"train_loss": -25.930200576782227, "global_step": 357084, "epoch": 4302} {"train_loss": -26.227508544921875, "global_step": 357085, "epoch": 4302} {"train_loss": -26.0266170501709, "global_step": 357086, "epoch": 4302} {"train_loss": -26.055191040039062, "global_step": 357087, "epoch": 4302} {"train_loss": -25.90956687927246, "global_step": 357088, "epoch": 4302} {"train_loss": -26.341541290283203, "global_step": 357089, "epoch": 4302} {"train_loss": -25.612640380859375, "global_step": 357090, "epoch": 4302} {"train_loss": -26.04583168029785, "global_step": 357091, "epoch": 4302} {"train_loss": -26.23052406311035, "global_step": 357092, "epoch": 4302} {"train_loss": -26.454187393188477, "global_step": 357093, "epoch": 4302} {"train_loss": -26.317020416259766, "global_step": 357094, "epoch": 4302} {"train_loss": -26.175519943237305, "global_step": 357095, "epoch": 4302} {"train_loss": -26.260284423828125, "global_step": 357096, "epoch": 4302} {"train_loss": -26.4068660736084, "global_step": 357097, "epoch": 4302} {"train_loss": -25.93486976623535, "global_step": 357098, "epoch": 4302} {"train_loss": -26.06683349609375, "global_step": 357099, "epoch": 4302} {"train_loss": -26.1023006439209, "global_step": 357100, "epoch": 4302} {"train_loss": -26.0651798248291, "global_step": 357101, "epoch": 4302} {"train_loss": -26.349720001220703, "global_step": 357102, "epoch": 4302} {"train_loss": -26.511123657226562, "global_step": 357103, "epoch": 4302} {"train_loss": -26.529767990112305, "global_step": 357104, "epoch": 4302} {"train_loss": -26.277835845947266, "global_step": 357105, "epoch": 4302} {"train_loss": -26.465015411376953, "global_step": 357106, "epoch": 4302} {"train_loss": -26.072412490844727, "global_step": 357107, "epoch": 4302} {"train_loss": -26.55402946472168, "global_step": 357108, "epoch": 4302} {"train_loss": -26.204442977905273, "global_step": 357109, "epoch": 4302} {"train_loss": -26.04237174987793, "global_step": 357110, "epoch": 4302} {"train_loss": -26.09351921081543, "global_step": 357111, "epoch": 4302} {"train_loss": -26.118619918823242, "global_step": 357112, "epoch": 4302} {"train_loss": -26.311811447143555, "global_step": 357113, "epoch": 4302} {"train_loss": -26.198612213134766, "global_step": 357114, "epoch": 4302} {"train_loss": -25.958730697631836, "global_step": 357115, "epoch": 4302} {"train_loss": -25.698225021362305, "global_step": 357116, "epoch": 4302} {"train_loss": -25.6260929107666, "global_step": 357117, "epoch": 4302} {"train_loss": -26.486652374267578, "global_step": 357118, "epoch": 4302} {"train_loss": -25.97369956970215, "global_step": 357119, "epoch": 4302} {"train_loss": -25.685888290405273, "global_step": 357120, "epoch": 4302} {"train_loss": -26.142385482788086, "global_step": 357121, "epoch": 4302} {"train_loss": -26.483448028564453, "global_step": 357122, "epoch": 4302} {"train_loss": -26.22015380859375, "global_step": 357123, "epoch": 4302} {"train_loss": -25.881345748901367, "global_step": 357124, "epoch": 4302} {"train_loss": -26.37000846862793, "global_step": 357125, "epoch": 4302} {"train_loss": -25.936649322509766, "global_step": 357126, "epoch": 4302} {"train_loss": -26.2901554107666, "global_step": 357127, "epoch": 4302} {"train_loss": -26.14847183227539, "global_step": 357128, "epoch": 4302} {"train_loss": -26.585336685180664, "global_step": 357129, "epoch": 4302} {"train_loss": -26.199554443359375, "global_step": 357130, "epoch": 4302} {"train_loss": -26.339141845703125, "global_step": 357131, "epoch": 4302} {"train_loss": -26.122526168823242, "global_step": 357132, "epoch": 4302} {"train_loss": -26.231781005859375, "global_step": 357133, "epoch": 4302} {"train_loss": -25.85011100769043, "global_step": 357134, "epoch": 4302} {"train_loss": -26.447919845581055, "global_step": 357135, "epoch": 4302} {"train_loss": -26.345489501953125, "global_step": 357136, "epoch": 4302} {"train_loss": -25.992700576782227, "global_step": 357137, "epoch": 4302} {"train_loss": -25.930316925048828, "global_step": 357138, "epoch": 4302} {"train_loss": -26.3687801361084, "global_step": 357139, "epoch": 4302} {"train_loss": -26.232648849487305, "global_step": 357140, "epoch": 4302} {"train_loss": -26.397306442260742, "global_step": 357141, "epoch": 4302} {"train_loss": -26.132715225219727, "global_step": 357142, "epoch": 4302} {"train_loss": -26.290536880493164, "global_step": 357143, "epoch": 4302} {"train_loss": -26.321950912475586, "global_step": 357144, "epoch": 4302} {"train_loss": -26.215238571166992, "global_step": 357145, "epoch": 4302} {"train_loss": -26.262298583984375, "global_step": 357146, "epoch": 4302} {"train_loss": -26.58782958984375, "global_step": 357147, "epoch": 4302} {"train_loss": -26.109843518360552, "global_step": 357148, "epoch": 4302, "val_loss": 6597390.5} {"train_loss": -26.049768447875977, "global_step": 357149, "epoch": 4303} {"train_loss": -25.787235260009766, "global_step": 357150, "epoch": 4303} {"train_loss": -25.6188907623291, "global_step": 357151, "epoch": 4303} {"train_loss": -25.81222915649414, "global_step": 357152, "epoch": 4303} {"train_loss": -26.21059226989746, "global_step": 357153, "epoch": 4303} {"train_loss": -26.033109664916992, "global_step": 357154, "epoch": 4303} {"train_loss": -25.82538414001465, "global_step": 357155, "epoch": 4303} {"train_loss": -25.752511978149414, "global_step": 357156, "epoch": 4303} {"train_loss": -25.815750122070312, "global_step": 357157, "epoch": 4303} {"train_loss": -26.28681755065918, "global_step": 357158, "epoch": 4303} {"train_loss": -25.853351593017578, "global_step": 357159, "epoch": 4303} {"train_loss": -26.007217407226562, "global_step": 357160, "epoch": 4303} {"train_loss": -25.80702781677246, "global_step": 357161, "epoch": 4303} {"train_loss": -26.24395179748535, "global_step": 357162, "epoch": 4303} {"train_loss": -25.737628936767578, "global_step": 357163, "epoch": 4303} {"train_loss": -26.105884552001953, "global_step": 357164, "epoch": 4303} {"train_loss": -25.806623458862305, "global_step": 357165, "epoch": 4303} {"train_loss": -26.130964279174805, "global_step": 357166, "epoch": 4303} {"train_loss": -26.58442497253418, "global_step": 357167, "epoch": 4303} {"train_loss": -26.1673641204834, "global_step": 357168, "epoch": 4303} {"train_loss": -26.44764518737793, "global_step": 357169, "epoch": 4303} {"train_loss": -26.114587783813477, "global_step": 357170, "epoch": 4303} {"train_loss": -26.046125411987305, "global_step": 357171, "epoch": 4303} {"train_loss": -26.464078903198242, "global_step": 357172, "epoch": 4303} {"train_loss": -26.179370880126953, "global_step": 357173, "epoch": 4303} {"train_loss": -25.93329429626465, "global_step": 357174, "epoch": 4303} {"train_loss": -26.123754501342773, "global_step": 357175, "epoch": 4303} {"train_loss": -26.237960815429688, "global_step": 357176, "epoch": 4303} {"train_loss": -26.371063232421875, "global_step": 357177, "epoch": 4303} {"train_loss": -25.845788955688477, "global_step": 357178, "epoch": 4303} {"train_loss": -26.2773380279541, "global_step": 357179, "epoch": 4303} {"train_loss": -26.333715438842773, "global_step": 357180, "epoch": 4303} {"train_loss": -26.292272567749023, "global_step": 357181, "epoch": 4303} {"train_loss": -26.811872482299805, "global_step": 357182, "epoch": 4303} {"train_loss": -26.32373046875, "global_step": 357183, "epoch": 4303} {"train_loss": -26.398427963256836, "global_step": 357184, "epoch": 4303} {"train_loss": -26.436262130737305, "global_step": 357185, "epoch": 4303} {"train_loss": -26.395933151245117, "global_step": 357186, "epoch": 4303} {"train_loss": -26.4151668548584, "global_step": 357187, "epoch": 4303} {"train_loss": -26.351530075073242, "global_step": 357188, "epoch": 4303} {"train_loss": -26.2460880279541, "global_step": 357189, "epoch": 4303} {"train_loss": -26.00811767578125, "global_step": 357190, "epoch": 4303} {"train_loss": -26.03216552734375, "global_step": 357191, "epoch": 4303} {"train_loss": -26.559995651245117, "global_step": 357192, "epoch": 4303} {"train_loss": -26.517526626586914, "global_step": 357193, "epoch": 4303} {"train_loss": -26.33381462097168, "global_step": 357194, "epoch": 4303} {"train_loss": -26.257612228393555, "global_step": 357195, "epoch": 4303} {"train_loss": -26.217426300048828, "global_step": 357196, "epoch": 4303} {"train_loss": -26.39280128479004, "global_step": 357197, "epoch": 4303} {"train_loss": -26.077350616455078, "global_step": 357198, "epoch": 4303} {"train_loss": -26.49884605407715, "global_step": 357199, "epoch": 4303} {"train_loss": -26.148574829101562, "global_step": 357200, "epoch": 4303} {"train_loss": -25.986570358276367, "global_step": 357201, "epoch": 4303} {"train_loss": -25.53890037536621, "global_step": 357202, "epoch": 4303} {"train_loss": -25.931913375854492, "global_step": 357203, "epoch": 4303} {"train_loss": -25.770795822143555, "global_step": 357204, "epoch": 4303} {"train_loss": -26.410663604736328, "global_step": 357205, "epoch": 4303} {"train_loss": -26.107587814331055, "global_step": 357206, "epoch": 4303} {"train_loss": -25.967565536499023, "global_step": 357207, "epoch": 4303} {"train_loss": -26.055988311767578, "global_step": 357208, "epoch": 4303} {"train_loss": -26.115041732788086, "global_step": 357209, "epoch": 4303} {"train_loss": -25.946353912353516, "global_step": 357210, "epoch": 4303} {"train_loss": -25.81451988220215, "global_step": 357211, "epoch": 4303} {"train_loss": -25.843488693237305, "global_step": 357212, "epoch": 4303} {"train_loss": -25.729965209960938, "global_step": 357213, "epoch": 4303} {"train_loss": -26.046497344970703, "global_step": 357214, "epoch": 4303} {"train_loss": -25.948644638061523, "global_step": 357215, "epoch": 4303} {"train_loss": -25.784696578979492, "global_step": 357216, "epoch": 4303} {"train_loss": -25.891651153564453, "global_step": 357217, "epoch": 4303} {"train_loss": -26.040369033813477, "global_step": 357218, "epoch": 4303} {"train_loss": -26.31935691833496, "global_step": 357219, "epoch": 4303} {"train_loss": -25.605792999267578, "global_step": 357220, "epoch": 4303} {"train_loss": -26.522016525268555, "global_step": 357221, "epoch": 4303} {"train_loss": -26.139759063720703, "global_step": 357222, "epoch": 4303} {"train_loss": -26.3355655670166, "global_step": 357223, "epoch": 4303} {"train_loss": -26.100622177124023, "global_step": 357224, "epoch": 4303} {"train_loss": -26.1669979095459, "global_step": 357225, "epoch": 4303} {"train_loss": -26.215087890625, "global_step": 357226, "epoch": 4303} {"train_loss": -26.2188720703125, "global_step": 357227, "epoch": 4303} {"train_loss": -26.018102645874023, "global_step": 357228, "epoch": 4303} {"train_loss": -26.405149459838867, "global_step": 357229, "epoch": 4303} {"train_loss": -25.869855880737305, "global_step": 357230, "epoch": 4303} {"train_loss": -26.113984533103114, "global_step": 357231, "epoch": 4303, "val_loss": 6631015.0} {"train_loss": -25.954914093017578, "global_step": 357232, "epoch": 4304} {"train_loss": -26.068897247314453, "global_step": 357233, "epoch": 4304} {"train_loss": -25.9478702545166, "global_step": 357234, "epoch": 4304} {"train_loss": -26.09937858581543, "global_step": 357235, "epoch": 4304} {"train_loss": -25.276891708374023, "global_step": 357236, "epoch": 4304} {"train_loss": -25.329843521118164, "global_step": 357237, "epoch": 4304} {"train_loss": -26.13177490234375, "global_step": 357238, "epoch": 4304} {"train_loss": -25.402841567993164, "global_step": 357239, "epoch": 4304} {"train_loss": -25.71710777282715, "global_step": 357240, "epoch": 4304} {"train_loss": -25.53451156616211, "global_step": 357241, "epoch": 4304} {"train_loss": -25.9742488861084, "global_step": 357242, "epoch": 4304} {"train_loss": -25.558019638061523, "global_step": 357243, "epoch": 4304} {"train_loss": -26.356359481811523, "global_step": 357244, "epoch": 4304} {"train_loss": -25.34895896911621, "global_step": 357245, "epoch": 4304} {"train_loss": -25.80763053894043, "global_step": 357246, "epoch": 4304} {"train_loss": -26.113956451416016, "global_step": 357247, "epoch": 4304} {"train_loss": -25.90478515625, "global_step": 357248, "epoch": 4304} {"train_loss": -25.637048721313477, "global_step": 357249, "epoch": 4304} {"train_loss": -26.26905632019043, "global_step": 357250, "epoch": 4304} {"train_loss": -25.808935165405273, "global_step": 357251, "epoch": 4304} {"train_loss": -25.934707641601562, "global_step": 357252, "epoch": 4304} {"train_loss": -26.050506591796875, "global_step": 357253, "epoch": 4304} {"train_loss": -26.50385093688965, "global_step": 357254, "epoch": 4304} {"train_loss": -26.00394058227539, "global_step": 357255, "epoch": 4304} {"train_loss": -26.103748321533203, "global_step": 357256, "epoch": 4304} {"train_loss": -25.919330596923828, "global_step": 357257, "epoch": 4304} {"train_loss": -26.255075454711914, "global_step": 357258, "epoch": 4304} {"train_loss": -26.350982666015625, "global_step": 357259, "epoch": 4304} {"train_loss": -26.16010093688965, "global_step": 357260, "epoch": 4304} {"train_loss": -26.16095542907715, "global_step": 357261, "epoch": 4304} {"train_loss": -26.07671546936035, "global_step": 357262, "epoch": 4304} {"train_loss": -26.57355308532715, "global_step": 357263, "epoch": 4304} {"train_loss": -26.3299617767334, "global_step": 357264, "epoch": 4304} {"train_loss": -26.4323673248291, "global_step": 357265, "epoch": 4304} {"train_loss": -26.14264488220215, "global_step": 357266, "epoch": 4304} {"train_loss": -26.36240005493164, "global_step": 357267, "epoch": 4304} {"train_loss": -26.554656982421875, "global_step": 357268, "epoch": 4304} {"train_loss": -26.05136489868164, "global_step": 357269, "epoch": 4304} {"train_loss": -26.414846420288086, "global_step": 357270, "epoch": 4304} {"train_loss": -26.382465362548828, "global_step": 357271, "epoch": 4304} {"train_loss": -26.160268783569336, "global_step": 357272, "epoch": 4304} {"train_loss": -26.297147750854492, "global_step": 357273, "epoch": 4304} {"train_loss": -26.173974990844727, "global_step": 357274, "epoch": 4304} {"train_loss": -26.53194236755371, "global_step": 357275, "epoch": 4304} {"train_loss": -26.473352432250977, "global_step": 357276, "epoch": 4304} {"train_loss": -26.11690330505371, "global_step": 357277, "epoch": 4304} {"train_loss": -26.254627227783203, "global_step": 357278, "epoch": 4304} {"train_loss": -26.005887985229492, "global_step": 357279, "epoch": 4304} {"train_loss": -26.297531127929688, "global_step": 357280, "epoch": 4304} {"train_loss": -26.40851402282715, "global_step": 357281, "epoch": 4304} {"train_loss": -26.213598251342773, "global_step": 357282, "epoch": 4304} {"train_loss": -26.56171226501465, "global_step": 357283, "epoch": 4304} {"train_loss": -26.257505416870117, "global_step": 357284, "epoch": 4304} {"train_loss": -26.295263290405273, "global_step": 357285, "epoch": 4304} {"train_loss": -26.632537841796875, "global_step": 357286, "epoch": 4304} {"train_loss": -26.462360382080078, "global_step": 357287, "epoch": 4304} {"train_loss": -26.24590492248535, "global_step": 357288, "epoch": 4304} {"train_loss": -25.85324478149414, "global_step": 357289, "epoch": 4304} {"train_loss": -26.0511474609375, "global_step": 357290, "epoch": 4304} {"train_loss": -26.10860252380371, "global_step": 357291, "epoch": 4304} {"train_loss": -25.728103637695312, "global_step": 357292, "epoch": 4304} {"train_loss": -26.384754180908203, "global_step": 357293, "epoch": 4304} {"train_loss": -26.28401756286621, "global_step": 357294, "epoch": 4304} {"train_loss": -26.087371826171875, "global_step": 357295, "epoch": 4304} {"train_loss": -26.121374130249023, "global_step": 357296, "epoch": 4304} {"train_loss": -26.14645767211914, "global_step": 357297, "epoch": 4304} {"train_loss": -26.2233943939209, "global_step": 357298, "epoch": 4304} {"train_loss": -26.2281551361084, "global_step": 357299, "epoch": 4304} {"train_loss": -25.931354522705078, "global_step": 357300, "epoch": 4304} {"train_loss": -25.688024520874023, "global_step": 357301, "epoch": 4304} {"train_loss": -25.714344024658203, "global_step": 357302, "epoch": 4304} {"train_loss": -25.164670944213867, "global_step": 357303, "epoch": 4304} {"train_loss": -25.956378936767578, "global_step": 357304, "epoch": 4304} {"train_loss": -25.99481201171875, "global_step": 357305, "epoch": 4304} {"train_loss": -26.187143325805664, "global_step": 357306, "epoch": 4304} {"train_loss": -25.871191024780273, "global_step": 357307, "epoch": 4304} {"train_loss": -26.221424102783203, "global_step": 357308, "epoch": 4304} {"train_loss": -26.31194496154785, "global_step": 357309, "epoch": 4304} {"train_loss": -26.642698287963867, "global_step": 357310, "epoch": 4304} {"train_loss": -26.138906478881836, "global_step": 357311, "epoch": 4304} {"train_loss": -26.4073543548584, "global_step": 357312, "epoch": 4304} {"train_loss": -26.324939727783203, "global_step": 357313, "epoch": 4304} {"train_loss": -26.082714747233563, "global_step": 357314, "epoch": 4304, "val_loss": 6631044.0} {"train_loss": -25.894311904907227, "global_step": 357315, "epoch": 4305} {"train_loss": -25.778894424438477, "global_step": 357316, "epoch": 4305} {"train_loss": -26.135822296142578, "global_step": 357317, "epoch": 4305} {"train_loss": -25.784875869750977, "global_step": 357318, "epoch": 4305} {"train_loss": -25.94075584411621, "global_step": 357319, "epoch": 4305} {"train_loss": -26.446212768554688, "global_step": 357320, "epoch": 4305} {"train_loss": -26.272497177124023, "global_step": 357321, "epoch": 4305} {"train_loss": -26.072233200073242, "global_step": 357322, "epoch": 4305} {"train_loss": -26.014699935913086, "global_step": 357323, "epoch": 4305} {"train_loss": -26.488065719604492, "global_step": 357324, "epoch": 4305} {"train_loss": -26.586023330688477, "global_step": 357325, "epoch": 4305} {"train_loss": -25.656082153320312, "global_step": 357326, "epoch": 4305} {"train_loss": -26.368194580078125, "global_step": 357327, "epoch": 4305} {"train_loss": -26.428640365600586, "global_step": 357328, "epoch": 4305} {"train_loss": -26.347949981689453, "global_step": 357329, "epoch": 4305} {"train_loss": -26.131006240844727, "global_step": 357330, "epoch": 4305} {"train_loss": -26.376916885375977, "global_step": 357331, "epoch": 4305} {"train_loss": -26.029499053955078, "global_step": 357332, "epoch": 4305} {"train_loss": -26.28072166442871, "global_step": 357333, "epoch": 4305} {"train_loss": -26.15262222290039, "global_step": 357334, "epoch": 4305} {"train_loss": -26.313678741455078, "global_step": 357335, "epoch": 4305} {"train_loss": -26.428131103515625, "global_step": 357336, "epoch": 4305} {"train_loss": -26.203596115112305, "global_step": 357337, "epoch": 4305} {"train_loss": -26.370731353759766, "global_step": 357338, "epoch": 4305} {"train_loss": -26.58747673034668, "global_step": 357339, "epoch": 4305} {"train_loss": -26.469114303588867, "global_step": 357340, "epoch": 4305} {"train_loss": -26.054895401000977, "global_step": 357341, "epoch": 4305} {"train_loss": -26.3785457611084, "global_step": 357342, "epoch": 4305} {"train_loss": -26.215091705322266, "global_step": 357343, "epoch": 4305} {"train_loss": -26.1529598236084, "global_step": 357344, "epoch": 4305} {"train_loss": -26.589969635009766, "global_step": 357345, "epoch": 4305} {"train_loss": -26.510395050048828, "global_step": 357346, "epoch": 4305} {"train_loss": -26.194595336914062, "global_step": 357347, "epoch": 4305} {"train_loss": -26.493284225463867, "global_step": 357348, "epoch": 4305} {"train_loss": -26.292139053344727, "global_step": 357349, "epoch": 4305} {"train_loss": -26.133636474609375, "global_step": 357350, "epoch": 4305} {"train_loss": -26.1680850982666, "global_step": 357351, "epoch": 4305} {"train_loss": -26.385517120361328, "global_step": 357352, "epoch": 4305} {"train_loss": -26.349506378173828, "global_step": 357353, "epoch": 4305} {"train_loss": -26.513837814331055, "global_step": 357354, "epoch": 4305} {"train_loss": -26.22551918029785, "global_step": 357355, "epoch": 4305} {"train_loss": -26.178955078125, "global_step": 357356, "epoch": 4305} {"train_loss": -26.892908096313477, "global_step": 357357, "epoch": 4305} {"train_loss": -26.24106788635254, "global_step": 357358, "epoch": 4305} {"train_loss": -26.49653434753418, "global_step": 357359, "epoch": 4305} {"train_loss": -26.63040542602539, "global_step": 357360, "epoch": 4305} {"train_loss": -26.65865135192871, "global_step": 357361, "epoch": 4305} {"train_loss": -26.609054565429688, "global_step": 357362, "epoch": 4305} {"train_loss": -26.386594772338867, "global_step": 357363, "epoch": 4305} {"train_loss": -26.011728286743164, "global_step": 357364, "epoch": 4305} {"train_loss": -26.283462524414062, "global_step": 357365, "epoch": 4305} {"train_loss": -26.532745361328125, "global_step": 357366, "epoch": 4305} {"train_loss": -26.41400718688965, "global_step": 357367, "epoch": 4305} {"train_loss": -26.10263442993164, "global_step": 357368, "epoch": 4305} {"train_loss": -25.892309188842773, "global_step": 357369, "epoch": 4305} {"train_loss": -25.90479850769043, "global_step": 357370, "epoch": 4305} {"train_loss": -25.524784088134766, "global_step": 357371, "epoch": 4305} {"train_loss": -25.161136627197266, "global_step": 357372, "epoch": 4305} {"train_loss": -25.6398983001709, "global_step": 357373, "epoch": 4305} {"train_loss": -25.30047035217285, "global_step": 357374, "epoch": 4305} {"train_loss": -25.82795524597168, "global_step": 357375, "epoch": 4305} {"train_loss": -26.197250366210938, "global_step": 357376, "epoch": 4305} {"train_loss": -25.910831451416016, "global_step": 357377, "epoch": 4305} {"train_loss": -26.37201499938965, "global_step": 357378, "epoch": 4305} {"train_loss": -26.249357223510742, "global_step": 357379, "epoch": 4305} {"train_loss": -26.22385597229004, "global_step": 357380, "epoch": 4305} {"train_loss": -26.344324111938477, "global_step": 357381, "epoch": 4305} {"train_loss": -26.2551326751709, "global_step": 357382, "epoch": 4305} {"train_loss": -26.476194381713867, "global_step": 357383, "epoch": 4305} {"train_loss": -26.124698638916016, "global_step": 357384, "epoch": 4305} {"train_loss": -25.90785026550293, "global_step": 357385, "epoch": 4305} {"train_loss": -26.231800079345703, "global_step": 357386, "epoch": 4305} {"train_loss": -25.880590438842773, "global_step": 357387, "epoch": 4305} {"train_loss": -26.54511070251465, "global_step": 357388, "epoch": 4305} {"train_loss": -26.071765899658203, "global_step": 357389, "epoch": 4305} {"train_loss": -25.853246688842773, "global_step": 357390, "epoch": 4305} {"train_loss": -26.299121856689453, "global_step": 357391, "epoch": 4305} {"train_loss": -26.36138343811035, "global_step": 357392, "epoch": 4305} {"train_loss": -26.097793579101562, "global_step": 357393, "epoch": 4305} {"train_loss": -26.428686141967773, "global_step": 357394, "epoch": 4305} {"train_loss": -26.3963565826416, "global_step": 357395, "epoch": 4305} {"train_loss": -26.164371490478516, "global_step": 357396, "epoch": 4305} {"train_loss": -26.224533012114374, "global_step": 357397, "epoch": 4305, "val_loss": 6652645.0} {"train_loss": -26.224782943725586, "global_step": 357398, "epoch": 4306} {"train_loss": -25.74309730529785, "global_step": 357399, "epoch": 4306} {"train_loss": -25.720457077026367, "global_step": 357400, "epoch": 4306} {"train_loss": -25.6173152923584, "global_step": 357401, "epoch": 4306} {"train_loss": -25.44624137878418, "global_step": 357402, "epoch": 4306} {"train_loss": -25.883398056030273, "global_step": 357403, "epoch": 4306} {"train_loss": -25.70953369140625, "global_step": 357404, "epoch": 4306} {"train_loss": -25.98959732055664, "global_step": 357405, "epoch": 4306} {"train_loss": -25.80864906311035, "global_step": 357406, "epoch": 4306} {"train_loss": -26.17352867126465, "global_step": 357407, "epoch": 4306} {"train_loss": -25.689777374267578, "global_step": 357408, "epoch": 4306} {"train_loss": -26.036584854125977, "global_step": 357409, "epoch": 4306} {"train_loss": -26.150272369384766, "global_step": 357410, "epoch": 4306} {"train_loss": -26.05230712890625, "global_step": 357411, "epoch": 4306} {"train_loss": -25.59840202331543, "global_step": 357412, "epoch": 4306} {"train_loss": -26.266748428344727, "global_step": 357413, "epoch": 4306} {"train_loss": -26.110158920288086, "global_step": 357414, "epoch": 4306} {"train_loss": -26.426239013671875, "global_step": 357415, "epoch": 4306} {"train_loss": -25.76887321472168, "global_step": 357416, "epoch": 4306} {"train_loss": -26.0310001373291, "global_step": 357417, "epoch": 4306} {"train_loss": -26.21571159362793, "global_step": 357418, "epoch": 4306} {"train_loss": -26.03592300415039, "global_step": 357419, "epoch": 4306} {"train_loss": -26.499286651611328, "global_step": 357420, "epoch": 4306} {"train_loss": -26.128864288330078, "global_step": 357421, "epoch": 4306} {"train_loss": -25.9858341217041, "global_step": 357422, "epoch": 4306} {"train_loss": -25.842304229736328, "global_step": 357423, "epoch": 4306} {"train_loss": -25.9001522064209, "global_step": 357424, "epoch": 4306} {"train_loss": -26.302656173706055, "global_step": 357425, "epoch": 4306} {"train_loss": -25.8384952545166, "global_step": 357426, "epoch": 4306} {"train_loss": -26.095645904541016, "global_step": 357427, "epoch": 4306} {"train_loss": -26.272857666015625, "global_step": 357428, "epoch": 4306} {"train_loss": -26.52081298828125, "global_step": 357429, "epoch": 4306} {"train_loss": -25.984210968017578, "global_step": 357430, "epoch": 4306} {"train_loss": -26.2585506439209, "global_step": 357431, "epoch": 4306} {"train_loss": -26.305871963500977, "global_step": 357432, "epoch": 4306} {"train_loss": -25.67681312561035, "global_step": 357433, "epoch": 4306} {"train_loss": -25.571123123168945, "global_step": 357434, "epoch": 4306} {"train_loss": -26.441457748413086, "global_step": 357435, "epoch": 4306} {"train_loss": -26.055830001831055, "global_step": 357436, "epoch": 4306} {"train_loss": -25.948856353759766, "global_step": 357437, "epoch": 4306} {"train_loss": -26.16214942932129, "global_step": 357438, "epoch": 4306} {"train_loss": -25.9592342376709, "global_step": 357439, "epoch": 4306} {"train_loss": -26.138446807861328, "global_step": 357440, "epoch": 4306} {"train_loss": -26.058237075805664, "global_step": 357441, "epoch": 4306} {"train_loss": -25.93108558654785, "global_step": 357442, "epoch": 4306} {"train_loss": -25.6522274017334, "global_step": 357443, "epoch": 4306} {"train_loss": -26.31013298034668, "global_step": 357444, "epoch": 4306} {"train_loss": -26.309844970703125, "global_step": 357445, "epoch": 4306} {"train_loss": -25.780841827392578, "global_step": 357446, "epoch": 4306} {"train_loss": -26.32246208190918, "global_step": 357447, "epoch": 4306} {"train_loss": -26.4694766998291, "global_step": 357448, "epoch": 4306} {"train_loss": -26.21648597717285, "global_step": 357449, "epoch": 4306} {"train_loss": -26.147382736206055, "global_step": 357450, "epoch": 4306} {"train_loss": -26.063573837280273, "global_step": 357451, "epoch": 4306} {"train_loss": -26.090625762939453, "global_step": 357452, "epoch": 4306} {"train_loss": -26.446075439453125, "global_step": 357453, "epoch": 4306} {"train_loss": -26.12360191345215, "global_step": 357454, "epoch": 4306} {"train_loss": -26.275592803955078, "global_step": 357455, "epoch": 4306} {"train_loss": -26.042245864868164, "global_step": 357456, "epoch": 4306} {"train_loss": -26.74932861328125, "global_step": 357457, "epoch": 4306} {"train_loss": -26.1420841217041, "global_step": 357458, "epoch": 4306} {"train_loss": -26.580041885375977, "global_step": 357459, "epoch": 4306} {"train_loss": -26.2851619720459, "global_step": 357460, "epoch": 4306} {"train_loss": -25.9345645904541, "global_step": 357461, "epoch": 4306} {"train_loss": -26.151365280151367, "global_step": 357462, "epoch": 4306} {"train_loss": -26.5601806640625, "global_step": 357463, "epoch": 4306} {"train_loss": -26.583219528198242, "global_step": 357464, "epoch": 4306} {"train_loss": -25.82147789001465, "global_step": 357465, "epoch": 4306} {"train_loss": -26.2064151763916, "global_step": 357466, "epoch": 4306} {"train_loss": -25.8825626373291, "global_step": 357467, "epoch": 4306} {"train_loss": -26.439285278320312, "global_step": 357468, "epoch": 4306} {"train_loss": -26.197647094726562, "global_step": 357469, "epoch": 4306} {"train_loss": -26.347198486328125, "global_step": 357470, "epoch": 4306} {"train_loss": -26.325849533081055, "global_step": 357471, "epoch": 4306} {"train_loss": -25.938846588134766, "global_step": 357472, "epoch": 4306} {"train_loss": -26.2712345123291, "global_step": 357473, "epoch": 4306} {"train_loss": -26.351211547851562, "global_step": 357474, "epoch": 4306} {"train_loss": -26.51337242126465, "global_step": 357475, "epoch": 4306} {"train_loss": -26.1314697265625, "global_step": 357476, "epoch": 4306} {"train_loss": -26.016376495361328, "global_step": 357477, "epoch": 4306} {"train_loss": -26.386533737182617, "global_step": 357478, "epoch": 4306} {"train_loss": -26.427337646484375, "global_step": 357479, "epoch": 4306} {"train_loss": -26.120749760823077, "global_step": 357480, "epoch": 4306, "val_loss": 6633498.0} {"train_loss": -26.30859375, "global_step": 357481, "epoch": 4307} {"train_loss": -25.923126220703125, "global_step": 357482, "epoch": 4307} {"train_loss": -26.447553634643555, "global_step": 357483, "epoch": 4307} {"train_loss": -25.787485122680664, "global_step": 357484, "epoch": 4307} {"train_loss": -26.258344650268555, "global_step": 357485, "epoch": 4307} {"train_loss": -26.027257919311523, "global_step": 357486, "epoch": 4307} {"train_loss": -25.58039665222168, "global_step": 357487, "epoch": 4307} {"train_loss": -26.062673568725586, "global_step": 357488, "epoch": 4307} {"train_loss": -26.254331588745117, "global_step": 357489, "epoch": 4307} {"train_loss": -26.57474708557129, "global_step": 357490, "epoch": 4307} {"train_loss": -25.868011474609375, "global_step": 357491, "epoch": 4307} {"train_loss": -26.252161026000977, "global_step": 357492, "epoch": 4307} {"train_loss": -26.239089965820312, "global_step": 357493, "epoch": 4307} {"train_loss": -26.27545166015625, "global_step": 357494, "epoch": 4307} {"train_loss": -26.47015380859375, "global_step": 357495, "epoch": 4307} {"train_loss": -26.120838165283203, "global_step": 357496, "epoch": 4307} {"train_loss": -26.50581169128418, "global_step": 357497, "epoch": 4307} {"train_loss": -26.082046508789062, "global_step": 357498, "epoch": 4307} {"train_loss": -26.034347534179688, "global_step": 357499, "epoch": 4307} {"train_loss": -26.210203170776367, "global_step": 357500, "epoch": 4307} {"train_loss": -26.135730743408203, "global_step": 357501, "epoch": 4307} {"train_loss": -25.64483642578125, "global_step": 357502, "epoch": 4307} {"train_loss": -26.309534072875977, "global_step": 357503, "epoch": 4307} {"train_loss": -26.270009994506836, "global_step": 357504, "epoch": 4307} {"train_loss": -25.688261032104492, "global_step": 357505, "epoch": 4307} {"train_loss": -26.303070068359375, "global_step": 357506, "epoch": 4307} {"train_loss": -26.222015380859375, "global_step": 357507, "epoch": 4307} {"train_loss": -26.490991592407227, "global_step": 357508, "epoch": 4307} {"train_loss": -26.162622451782227, "global_step": 357509, "epoch": 4307} {"train_loss": -26.12063980102539, "global_step": 357510, "epoch": 4307} {"train_loss": -26.383655548095703, "global_step": 357511, "epoch": 4307} {"train_loss": -26.494298934936523, "global_step": 357512, "epoch": 4307} {"train_loss": -26.083332061767578, "global_step": 357513, "epoch": 4307} {"train_loss": -25.953536987304688, "global_step": 357514, "epoch": 4307} {"train_loss": -26.586090087890625, "global_step": 357515, "epoch": 4307} {"train_loss": -26.118757247924805, "global_step": 357516, "epoch": 4307} {"train_loss": -26.257360458374023, "global_step": 357517, "epoch": 4307} {"train_loss": -26.0090274810791, "global_step": 357518, "epoch": 4307} {"train_loss": -26.158124923706055, "global_step": 357519, "epoch": 4307} {"train_loss": -26.352298736572266, "global_step": 357520, "epoch": 4307} {"train_loss": -26.041479110717773, "global_step": 357521, "epoch": 4307} {"train_loss": -26.133520126342773, "global_step": 357522, "epoch": 4307} {"train_loss": -26.036161422729492, "global_step": 357523, "epoch": 4307} {"train_loss": -26.559574127197266, "global_step": 357524, "epoch": 4307} {"train_loss": -26.045166015625, "global_step": 357525, "epoch": 4307} {"train_loss": -26.2819766998291, "global_step": 357526, "epoch": 4307} {"train_loss": -26.38970947265625, "global_step": 357527, "epoch": 4307} {"train_loss": -26.451923370361328, "global_step": 357528, "epoch": 4307} {"train_loss": -26.036224365234375, "global_step": 357529, "epoch": 4307} {"train_loss": -26.157636642456055, "global_step": 357530, "epoch": 4307} {"train_loss": -26.22735595703125, "global_step": 357531, "epoch": 4307} {"train_loss": -25.960681915283203, "global_step": 357532, "epoch": 4307} {"train_loss": -26.234872817993164, "global_step": 357533, "epoch": 4307} {"train_loss": -25.990888595581055, "global_step": 357534, "epoch": 4307} {"train_loss": -26.21906089782715, "global_step": 357535, "epoch": 4307} {"train_loss": -25.873010635375977, "global_step": 357536, "epoch": 4307} {"train_loss": -26.22883415222168, "global_step": 357537, "epoch": 4307} {"train_loss": -26.322778701782227, "global_step": 357538, "epoch": 4307} {"train_loss": -26.190473556518555, "global_step": 357539, "epoch": 4307} {"train_loss": -26.04828453063965, "global_step": 357540, "epoch": 4307} {"train_loss": -26.115264892578125, "global_step": 357541, "epoch": 4307} {"train_loss": -26.133554458618164, "global_step": 357542, "epoch": 4307} {"train_loss": -26.183923721313477, "global_step": 357543, "epoch": 4307} {"train_loss": -26.21889305114746, "global_step": 357544, "epoch": 4307} {"train_loss": -26.3270206451416, "global_step": 357545, "epoch": 4307} {"train_loss": -26.33158302307129, "global_step": 357546, "epoch": 4307} {"train_loss": -26.273496627807617, "global_step": 357547, "epoch": 4307} {"train_loss": -26.157567977905273, "global_step": 357548, "epoch": 4307} {"train_loss": -26.25567626953125, "global_step": 357549, "epoch": 4307} {"train_loss": -26.167341232299805, "global_step": 357550, "epoch": 4307} {"train_loss": -26.195301055908203, "global_step": 357551, "epoch": 4307} {"train_loss": -26.152326583862305, "global_step": 357552, "epoch": 4307} {"train_loss": -26.06879997253418, "global_step": 357553, "epoch": 4307} {"train_loss": -26.07008171081543, "global_step": 357554, "epoch": 4307} {"train_loss": -26.442602157592773, "global_step": 357555, "epoch": 4307} {"train_loss": -26.150482177734375, "global_step": 357556, "epoch": 4307} {"train_loss": -26.115924835205078, "global_step": 357557, "epoch": 4307} {"train_loss": -26.305740356445312, "global_step": 357558, "epoch": 4307} {"train_loss": -26.17131996154785, "global_step": 357559, "epoch": 4307} {"train_loss": -26.060718536376953, "global_step": 357560, "epoch": 4307} {"train_loss": -26.5100154876709, "global_step": 357561, "epoch": 4307} {"train_loss": -26.330799102783203, "global_step": 357562, "epoch": 4307} {"train_loss": -26.157902683120177, "global_step": 357563, "epoch": 4307, "val_loss": 6650106.0} {"train_loss": -25.683752059936523, "global_step": 357564, "epoch": 4308} {"train_loss": -24.652019500732422, "global_step": 357565, "epoch": 4308} {"train_loss": -25.762372970581055, "global_step": 357566, "epoch": 4308} {"train_loss": -25.9862060546875, "global_step": 357567, "epoch": 4308} {"train_loss": -25.314979553222656, "global_step": 357568, "epoch": 4308} {"train_loss": -26.307952880859375, "global_step": 357569, "epoch": 4308} {"train_loss": -25.41878890991211, "global_step": 357570, "epoch": 4308} {"train_loss": -26.060937881469727, "global_step": 357571, "epoch": 4308} {"train_loss": -25.9464168548584, "global_step": 357572, "epoch": 4308} {"train_loss": -25.928510665893555, "global_step": 357573, "epoch": 4308} {"train_loss": -25.964340209960938, "global_step": 357574, "epoch": 4308} {"train_loss": -25.964981079101562, "global_step": 357575, "epoch": 4308} {"train_loss": -25.59708595275879, "global_step": 357576, "epoch": 4308} {"train_loss": -26.118093490600586, "global_step": 357577, "epoch": 4308} {"train_loss": -25.800451278686523, "global_step": 357578, "epoch": 4308} {"train_loss": -25.813085556030273, "global_step": 357579, "epoch": 4308} {"train_loss": -26.25764274597168, "global_step": 357580, "epoch": 4308} {"train_loss": -26.251134872436523, "global_step": 357581, "epoch": 4308} {"train_loss": -26.1287899017334, "global_step": 357582, "epoch": 4308} {"train_loss": -26.6015625, "global_step": 357583, "epoch": 4308} {"train_loss": -26.1711483001709, "global_step": 357584, "epoch": 4308} {"train_loss": -26.149389266967773, "global_step": 357585, "epoch": 4308} {"train_loss": -26.37555503845215, "global_step": 357586, "epoch": 4308} {"train_loss": -26.182310104370117, "global_step": 357587, "epoch": 4308} {"train_loss": -25.93462562561035, "global_step": 357588, "epoch": 4308} {"train_loss": -26.13477897644043, "global_step": 357589, "epoch": 4308} {"train_loss": -26.08125877380371, "global_step": 357590, "epoch": 4308} {"train_loss": -26.088348388671875, "global_step": 357591, "epoch": 4308} {"train_loss": -26.36448097229004, "global_step": 357592, "epoch": 4308} {"train_loss": -26.390371322631836, "global_step": 357593, "epoch": 4308} {"train_loss": -26.465667724609375, "global_step": 357594, "epoch": 4308} {"train_loss": -26.21644401550293, "global_step": 357595, "epoch": 4308} {"train_loss": -26.4049015045166, "global_step": 357596, "epoch": 4308} {"train_loss": -26.3099308013916, "global_step": 357597, "epoch": 4308} {"train_loss": -26.471948623657227, "global_step": 357598, "epoch": 4308} {"train_loss": -26.44159507751465, "global_step": 357599, "epoch": 4308} {"train_loss": -25.728628158569336, "global_step": 357600, "epoch": 4308} {"train_loss": -26.065221786499023, "global_step": 357601, "epoch": 4308} {"train_loss": -26.5047664642334, "global_step": 357602, "epoch": 4308} {"train_loss": -25.778186798095703, "global_step": 357603, "epoch": 4308} {"train_loss": -26.324462890625, "global_step": 357604, "epoch": 4308} {"train_loss": -26.312814712524414, "global_step": 357605, "epoch": 4308} {"train_loss": -25.811954498291016, "global_step": 357606, "epoch": 4308} {"train_loss": -25.858972549438477, "global_step": 357607, "epoch": 4308} {"train_loss": -26.120471954345703, "global_step": 357608, "epoch": 4308} {"train_loss": -26.256399154663086, "global_step": 357609, "epoch": 4308} {"train_loss": -26.482288360595703, "global_step": 357610, "epoch": 4308} {"train_loss": -26.251508712768555, "global_step": 357611, "epoch": 4308} {"train_loss": -26.5521183013916, "global_step": 357612, "epoch": 4308} {"train_loss": -26.592737197875977, "global_step": 357613, "epoch": 4308} {"train_loss": -26.6802978515625, "global_step": 357614, "epoch": 4308} {"train_loss": -26.425094604492188, "global_step": 357615, "epoch": 4308} {"train_loss": -26.155593872070312, "global_step": 357616, "epoch": 4308} {"train_loss": -26.39796257019043, "global_step": 357617, "epoch": 4308} {"train_loss": -25.892736434936523, "global_step": 357618, "epoch": 4308} {"train_loss": -26.190778732299805, "global_step": 357619, "epoch": 4308} {"train_loss": -26.44902992248535, "global_step": 357620, "epoch": 4308} {"train_loss": -26.227222442626953, "global_step": 357621, "epoch": 4308} {"train_loss": -26.386621475219727, "global_step": 357622, "epoch": 4308} {"train_loss": -26.496112823486328, "global_step": 357623, "epoch": 4308} {"train_loss": -26.22080421447754, "global_step": 357624, "epoch": 4308} {"train_loss": -26.416828155517578, "global_step": 357625, "epoch": 4308} {"train_loss": -26.256677627563477, "global_step": 357626, "epoch": 4308} {"train_loss": -25.9848690032959, "global_step": 357627, "epoch": 4308} {"train_loss": -26.615201950073242, "global_step": 357628, "epoch": 4308} {"train_loss": -26.34964370727539, "global_step": 357629, "epoch": 4308} {"train_loss": -26.226282119750977, "global_step": 357630, "epoch": 4308} {"train_loss": -26.211694717407227, "global_step": 357631, "epoch": 4308} {"train_loss": -26.555896759033203, "global_step": 357632, "epoch": 4308} {"train_loss": -26.363447189331055, "global_step": 357633, "epoch": 4308} {"train_loss": -26.451047897338867, "global_step": 357634, "epoch": 4308} {"train_loss": -26.1523380279541, "global_step": 357635, "epoch": 4308} {"train_loss": -26.28145408630371, "global_step": 357636, "epoch": 4308} {"train_loss": -26.194311141967773, "global_step": 357637, "epoch": 4308} {"train_loss": -26.45551109313965, "global_step": 357638, "epoch": 4308} {"train_loss": -26.09077262878418, "global_step": 357639, "epoch": 4308} {"train_loss": -26.04144859313965, "global_step": 357640, "epoch": 4308} {"train_loss": -26.372228622436523, "global_step": 357641, "epoch": 4308} {"train_loss": -26.095788955688477, "global_step": 357642, "epoch": 4308} {"train_loss": -26.2189884185791, "global_step": 357643, "epoch": 4308} {"train_loss": -26.26349449157715, "global_step": 357644, "epoch": 4308} {"train_loss": -26.080978393554688, "global_step": 357645, "epoch": 4308} {"train_loss": -26.161407539643438, "global_step": 357646, "epoch": 4308, "val_loss": 6621136.0} {"train_loss": -25.73614501953125, "global_step": 357647, "epoch": 4309} {"train_loss": -25.668323516845703, "global_step": 357648, "epoch": 4309} {"train_loss": -25.51315689086914, "global_step": 357649, "epoch": 4309} {"train_loss": -25.21103286743164, "global_step": 357650, "epoch": 4309} {"train_loss": -25.519010543823242, "global_step": 357651, "epoch": 4309} {"train_loss": -24.764724731445312, "global_step": 357652, "epoch": 4309} {"train_loss": -25.57147789001465, "global_step": 357653, "epoch": 4309} {"train_loss": -25.97376823425293, "global_step": 357654, "epoch": 4309} {"train_loss": -26.046106338500977, "global_step": 357655, "epoch": 4309} {"train_loss": -25.801090240478516, "global_step": 357656, "epoch": 4309} {"train_loss": -25.564355850219727, "global_step": 357657, "epoch": 4309} {"train_loss": -25.67131996154785, "global_step": 357658, "epoch": 4309} {"train_loss": -25.792285919189453, "global_step": 357659, "epoch": 4309} {"train_loss": -25.768783569335938, "global_step": 357660, "epoch": 4309} {"train_loss": -25.90448570251465, "global_step": 357661, "epoch": 4309} {"train_loss": -25.945453643798828, "global_step": 357662, "epoch": 4309} {"train_loss": -25.878355026245117, "global_step": 357663, "epoch": 4309} {"train_loss": -26.443588256835938, "global_step": 357664, "epoch": 4309} {"train_loss": -26.001211166381836, "global_step": 357665, "epoch": 4309} {"train_loss": -26.132373809814453, "global_step": 357666, "epoch": 4309} {"train_loss": -25.96457862854004, "global_step": 357667, "epoch": 4309} {"train_loss": -25.76593017578125, "global_step": 357668, "epoch": 4309} {"train_loss": -26.283613204956055, "global_step": 357669, "epoch": 4309} {"train_loss": -26.066747665405273, "global_step": 357670, "epoch": 4309} {"train_loss": -25.670392990112305, "global_step": 357671, "epoch": 4309} {"train_loss": -26.069738388061523, "global_step": 357672, "epoch": 4309} {"train_loss": -26.435260772705078, "global_step": 357673, "epoch": 4309} {"train_loss": -26.138708114624023, "global_step": 357674, "epoch": 4309} {"train_loss": -25.8411865234375, "global_step": 357675, "epoch": 4309} {"train_loss": -26.133020401000977, "global_step": 357676, "epoch": 4309} {"train_loss": -26.34161949157715, "global_step": 357677, "epoch": 4309} {"train_loss": -26.045881271362305, "global_step": 357678, "epoch": 4309} {"train_loss": -26.309219360351562, "global_step": 357679, "epoch": 4309} {"train_loss": -26.380634307861328, "global_step": 357680, "epoch": 4309} {"train_loss": -26.343896865844727, "global_step": 357681, "epoch": 4309} {"train_loss": -26.18421745300293, "global_step": 357682, "epoch": 4309} {"train_loss": -26.481983184814453, "global_step": 357683, "epoch": 4309} {"train_loss": -26.306140899658203, "global_step": 357684, "epoch": 4309} {"train_loss": -26.45685386657715, "global_step": 357685, "epoch": 4309} {"train_loss": -26.2496395111084, "global_step": 357686, "epoch": 4309} {"train_loss": -26.249486923217773, "global_step": 357687, "epoch": 4309} {"train_loss": -26.582538604736328, "global_step": 357688, "epoch": 4309} {"train_loss": -26.59735107421875, "global_step": 357689, "epoch": 4309} {"train_loss": -26.29986000061035, "global_step": 357690, "epoch": 4309} {"train_loss": -26.437841415405273, "global_step": 357691, "epoch": 4309} {"train_loss": -26.19419288635254, "global_step": 357692, "epoch": 4309} {"train_loss": -26.280187606811523, "global_step": 357693, "epoch": 4309} {"train_loss": -26.144489288330078, "global_step": 357694, "epoch": 4309} {"train_loss": -26.11016273498535, "global_step": 357695, "epoch": 4309} {"train_loss": -26.248510360717773, "global_step": 357696, "epoch": 4309} {"train_loss": -26.149213790893555, "global_step": 357697, "epoch": 4309} {"train_loss": -25.99953269958496, "global_step": 357698, "epoch": 4309} {"train_loss": -26.1300048828125, "global_step": 357699, "epoch": 4309} {"train_loss": -26.166547775268555, "global_step": 357700, "epoch": 4309} {"train_loss": -26.4931697845459, "global_step": 357701, "epoch": 4309} {"train_loss": -26.195987701416016, "global_step": 357702, "epoch": 4309} {"train_loss": -26.314279556274414, "global_step": 357703, "epoch": 4309} {"train_loss": -26.159849166870117, "global_step": 357704, "epoch": 4309} {"train_loss": -26.510740280151367, "global_step": 357705, "epoch": 4309} {"train_loss": -26.539819717407227, "global_step": 357706, "epoch": 4309} {"train_loss": -25.91029930114746, "global_step": 357707, "epoch": 4309} {"train_loss": -26.36151123046875, "global_step": 357708, "epoch": 4309} {"train_loss": -26.299854278564453, "global_step": 357709, "epoch": 4309} {"train_loss": -25.72755241394043, "global_step": 357710, "epoch": 4309} {"train_loss": -25.839929580688477, "global_step": 357711, "epoch": 4309} {"train_loss": -25.59864616394043, "global_step": 357712, "epoch": 4309} {"train_loss": -26.126745223999023, "global_step": 357713, "epoch": 4309} {"train_loss": -25.920516967773438, "global_step": 357714, "epoch": 4309} {"train_loss": -26.053756713867188, "global_step": 357715, "epoch": 4309} {"train_loss": -25.739643096923828, "global_step": 357716, "epoch": 4309} {"train_loss": -26.0383243560791, "global_step": 357717, "epoch": 4309} {"train_loss": -26.12367057800293, "global_step": 357718, "epoch": 4309} {"train_loss": -25.87762451171875, "global_step": 357719, "epoch": 4309} {"train_loss": -26.134021759033203, "global_step": 357720, "epoch": 4309} {"train_loss": -26.062833786010742, "global_step": 357721, "epoch": 4309} {"train_loss": -25.9094295501709, "global_step": 357722, "epoch": 4309} {"train_loss": -26.413854598999023, "global_step": 357723, "epoch": 4309} {"train_loss": -26.048856735229492, "global_step": 357724, "epoch": 4309} {"train_loss": -25.874765396118164, "global_step": 357725, "epoch": 4309} {"train_loss": -25.926380157470703, "global_step": 357726, "epoch": 4309} {"train_loss": -26.463729858398438, "global_step": 357727, "epoch": 4309} {"train_loss": -25.88746452331543, "global_step": 357728, "epoch": 4309} {"train_loss": -26.06665657227298, "global_step": 357729, "epoch": 4309, "val_loss": 6625055.5} {"train_loss": -25.326250076293945, "global_step": 357730, "epoch": 4310} {"train_loss": -25.27898406982422, "global_step": 357731, "epoch": 4310} {"train_loss": -25.677820205688477, "global_step": 357732, "epoch": 4310} {"train_loss": -25.582843780517578, "global_step": 357733, "epoch": 4310} {"train_loss": -25.7015323638916, "global_step": 357734, "epoch": 4310} {"train_loss": -25.8394832611084, "global_step": 357735, "epoch": 4310} {"train_loss": -25.57625389099121, "global_step": 357736, "epoch": 4310} {"train_loss": -25.631961822509766, "global_step": 357737, "epoch": 4310} {"train_loss": -26.2467098236084, "global_step": 357738, "epoch": 4310} {"train_loss": -26.16617774963379, "global_step": 357739, "epoch": 4310} {"train_loss": -25.928442001342773, "global_step": 357740, "epoch": 4310} {"train_loss": -25.984655380249023, "global_step": 357741, "epoch": 4310} {"train_loss": -25.70745849609375, "global_step": 357742, "epoch": 4310} {"train_loss": -25.939443588256836, "global_step": 357743, "epoch": 4310} {"train_loss": -26.261640548706055, "global_step": 357744, "epoch": 4310} {"train_loss": -26.17828941345215, "global_step": 357745, "epoch": 4310} {"train_loss": -26.2123966217041, "global_step": 357746, "epoch": 4310} {"train_loss": -26.29150390625, "global_step": 357747, "epoch": 4310} {"train_loss": -26.195587158203125, "global_step": 357748, "epoch": 4310} {"train_loss": -25.918066024780273, "global_step": 357749, "epoch": 4310} {"train_loss": -25.827173233032227, "global_step": 357750, "epoch": 4310} {"train_loss": -26.35888671875, "global_step": 357751, "epoch": 4310} {"train_loss": -26.08258056640625, "global_step": 357752, "epoch": 4310} {"train_loss": -25.957616806030273, "global_step": 357753, "epoch": 4310} {"train_loss": -26.291034698486328, "global_step": 357754, "epoch": 4310} {"train_loss": -26.370275497436523, "global_step": 357755, "epoch": 4310} {"train_loss": -26.274240493774414, "global_step": 357756, "epoch": 4310} {"train_loss": -26.31270408630371, "global_step": 357757, "epoch": 4310} {"train_loss": -26.163944244384766, "global_step": 357758, "epoch": 4310} {"train_loss": -26.18928337097168, "global_step": 357759, "epoch": 4310} {"train_loss": -26.266510009765625, "global_step": 357760, "epoch": 4310} {"train_loss": -26.30796241760254, "global_step": 357761, "epoch": 4310} {"train_loss": -26.14853858947754, "global_step": 357762, "epoch": 4310} {"train_loss": -26.420026779174805, "global_step": 357763, "epoch": 4310} {"train_loss": -26.621219635009766, "global_step": 357764, "epoch": 4310} {"train_loss": -26.214719772338867, "global_step": 357765, "epoch": 4310} {"train_loss": -26.418109893798828, "global_step": 357766, "epoch": 4310} {"train_loss": -26.422870635986328, "global_step": 357767, "epoch": 4310} {"train_loss": -26.453481674194336, "global_step": 357768, "epoch": 4310} {"train_loss": -26.515884399414062, "global_step": 357769, "epoch": 4310} {"train_loss": -26.325220108032227, "global_step": 357770, "epoch": 4310} {"train_loss": -26.356006622314453, "global_step": 357771, "epoch": 4310} {"train_loss": -26.06402587890625, "global_step": 357772, "epoch": 4310} {"train_loss": -26.31119728088379, "global_step": 357773, "epoch": 4310} {"train_loss": -26.420642852783203, "global_step": 357774, "epoch": 4310} {"train_loss": -26.68802261352539, "global_step": 357775, "epoch": 4310} {"train_loss": -26.329681396484375, "global_step": 357776, "epoch": 4310} {"train_loss": -26.463117599487305, "global_step": 357777, "epoch": 4310} {"train_loss": -26.15875244140625, "global_step": 357778, "epoch": 4310} {"train_loss": -26.443603515625, "global_step": 357779, "epoch": 4310} {"train_loss": -26.312671661376953, "global_step": 357780, "epoch": 4310} {"train_loss": -26.088953018188477, "global_step": 357781, "epoch": 4310} {"train_loss": -25.973962783813477, "global_step": 357782, "epoch": 4310} {"train_loss": -25.83355140686035, "global_step": 357783, "epoch": 4310} {"train_loss": -25.83522605895996, "global_step": 357784, "epoch": 4310} {"train_loss": -25.648212432861328, "global_step": 357785, "epoch": 4310} {"train_loss": -25.795278549194336, "global_step": 357786, "epoch": 4310} {"train_loss": -25.98109245300293, "global_step": 357787, "epoch": 4310} {"train_loss": -26.543903350830078, "global_step": 357788, "epoch": 4310} {"train_loss": -26.2006778717041, "global_step": 357789, "epoch": 4310} {"train_loss": -26.343618392944336, "global_step": 357790, "epoch": 4310} {"train_loss": -26.170211791992188, "global_step": 357791, "epoch": 4310} {"train_loss": -26.2059268951416, "global_step": 357792, "epoch": 4310} {"train_loss": -26.37284278869629, "global_step": 357793, "epoch": 4310} {"train_loss": -26.27092933654785, "global_step": 357794, "epoch": 4310} {"train_loss": -26.19190788269043, "global_step": 357795, "epoch": 4310} {"train_loss": -26.287586212158203, "global_step": 357796, "epoch": 4310} {"train_loss": -26.3804988861084, "global_step": 357797, "epoch": 4310} {"train_loss": -26.179391860961914, "global_step": 357798, "epoch": 4310} {"train_loss": -26.271575927734375, "global_step": 357799, "epoch": 4310} {"train_loss": -26.305166244506836, "global_step": 357800, "epoch": 4310} {"train_loss": -26.310962677001953, "global_step": 357801, "epoch": 4310} {"train_loss": -26.060338973999023, "global_step": 357802, "epoch": 4310} {"train_loss": -26.161046981811523, "global_step": 357803, "epoch": 4310} {"train_loss": -26.323450088500977, "global_step": 357804, "epoch": 4310} {"train_loss": -26.514692306518555, "global_step": 357805, "epoch": 4310} {"train_loss": -26.077672958374023, "global_step": 357806, "epoch": 4310} {"train_loss": -26.442163467407227, "global_step": 357807, "epoch": 4310} {"train_loss": -26.409778594970703, "global_step": 357808, "epoch": 4310} {"train_loss": -26.62361717224121, "global_step": 357809, "epoch": 4310} {"train_loss": -26.532379150390625, "global_step": 357810, "epoch": 4310} {"train_loss": -26.234582901000977, "global_step": 357811, "epoch": 4310} {"train_loss": -26.166804187269097, "global_step": 357812, "epoch": 4310, "val_loss": 6581077.0} {"train_loss": -25.75042152404785, "global_step": 357813, "epoch": 4311} {"train_loss": -26.224084854125977, "global_step": 357814, "epoch": 4311} {"train_loss": -26.590673446655273, "global_step": 357815, "epoch": 4311} {"train_loss": -26.248762130737305, "global_step": 357816, "epoch": 4311} {"train_loss": -26.074106216430664, "global_step": 357817, "epoch": 4311} {"train_loss": -25.452260971069336, "global_step": 357818, "epoch": 4311} {"train_loss": -25.9565486907959, "global_step": 357819, "epoch": 4311} {"train_loss": -26.55513572692871, "global_step": 357820, "epoch": 4311} {"train_loss": -26.098209381103516, "global_step": 357821, "epoch": 4311} {"train_loss": -25.76356315612793, "global_step": 357822, "epoch": 4311} {"train_loss": -26.253253936767578, "global_step": 357823, "epoch": 4311} {"train_loss": -26.131818771362305, "global_step": 357824, "epoch": 4311} {"train_loss": -25.906280517578125, "global_step": 357825, "epoch": 4311} {"train_loss": -26.125818252563477, "global_step": 357826, "epoch": 4311} {"train_loss": -26.48163414001465, "global_step": 357827, "epoch": 4311} {"train_loss": -26.047119140625, "global_step": 357828, "epoch": 4311} {"train_loss": -25.92945671081543, "global_step": 357829, "epoch": 4311} {"train_loss": -26.131271362304688, "global_step": 357830, "epoch": 4311} {"train_loss": -26.062164306640625, "global_step": 357831, "epoch": 4311} {"train_loss": -26.01801109313965, "global_step": 357832, "epoch": 4311} {"train_loss": -25.971216201782227, "global_step": 357833, "epoch": 4311} {"train_loss": -26.33814811706543, "global_step": 357834, "epoch": 4311} {"train_loss": -26.12948989868164, "global_step": 357835, "epoch": 4311} {"train_loss": -26.267927169799805, "global_step": 357836, "epoch": 4311} {"train_loss": -26.4952449798584, "global_step": 357837, "epoch": 4311} {"train_loss": -26.486881256103516, "global_step": 357838, "epoch": 4311} {"train_loss": -26.312225341796875, "global_step": 357839, "epoch": 4311} {"train_loss": -25.90521240234375, "global_step": 357840, "epoch": 4311} {"train_loss": -26.434406280517578, "global_step": 357841, "epoch": 4311} {"train_loss": -26.2632999420166, "global_step": 357842, "epoch": 4311} {"train_loss": -26.3084774017334, "global_step": 357843, "epoch": 4311} {"train_loss": -26.0859432220459, "global_step": 357844, "epoch": 4311} {"train_loss": -26.390417098999023, "global_step": 357845, "epoch": 4311} {"train_loss": -26.269330978393555, "global_step": 357846, "epoch": 4311} {"train_loss": -26.08660316467285, "global_step": 357847, "epoch": 4311} {"train_loss": -26.02370262145996, "global_step": 357848, "epoch": 4311} {"train_loss": -26.307159423828125, "global_step": 357849, "epoch": 4311} {"train_loss": -26.199451446533203, "global_step": 357850, "epoch": 4311} {"train_loss": -26.431446075439453, "global_step": 357851, "epoch": 4311} {"train_loss": -26.20639991760254, "global_step": 357852, "epoch": 4311} {"train_loss": -26.342987060546875, "global_step": 357853, "epoch": 4311} {"train_loss": -26.31568717956543, "global_step": 357854, "epoch": 4311} {"train_loss": -26.558679580688477, "global_step": 357855, "epoch": 4311} {"train_loss": -26.537927627563477, "global_step": 357856, "epoch": 4311} {"train_loss": -26.58405876159668, "global_step": 357857, "epoch": 4311} {"train_loss": -26.417560577392578, "global_step": 357858, "epoch": 4311} {"train_loss": -26.503326416015625, "global_step": 357859, "epoch": 4311} {"train_loss": -26.298994064331055, "global_step": 357860, "epoch": 4311} {"train_loss": -26.596664428710938, "global_step": 357861, "epoch": 4311} {"train_loss": -26.562469482421875, "global_step": 357862, "epoch": 4311} {"train_loss": -26.35223960876465, "global_step": 357863, "epoch": 4311} {"train_loss": -26.309799194335938, "global_step": 357864, "epoch": 4311} {"train_loss": -26.048248291015625, "global_step": 357865, "epoch": 4311} {"train_loss": -26.365299224853516, "global_step": 357866, "epoch": 4311} {"train_loss": -26.811288833618164, "global_step": 357867, "epoch": 4311} {"train_loss": -26.172027587890625, "global_step": 357868, "epoch": 4311} {"train_loss": -26.43381690979004, "global_step": 357869, "epoch": 4311} {"train_loss": -26.4885196685791, "global_step": 357870, "epoch": 4311} {"train_loss": -26.250659942626953, "global_step": 357871, "epoch": 4311} {"train_loss": -26.503950119018555, "global_step": 357872, "epoch": 4311} {"train_loss": -26.192773818969727, "global_step": 357873, "epoch": 4311} {"train_loss": -26.425817489624023, "global_step": 357874, "epoch": 4311} {"train_loss": -26.317615509033203, "global_step": 357875, "epoch": 4311} {"train_loss": -26.668954849243164, "global_step": 357876, "epoch": 4311} {"train_loss": -25.96774673461914, "global_step": 357877, "epoch": 4311} {"train_loss": -26.2813663482666, "global_step": 357878, "epoch": 4311} {"train_loss": -26.38916015625, "global_step": 357879, "epoch": 4311} {"train_loss": -26.61250114440918, "global_step": 357880, "epoch": 4311} {"train_loss": -26.499479293823242, "global_step": 357881, "epoch": 4311} {"train_loss": -26.40009117126465, "global_step": 357882, "epoch": 4311} {"train_loss": -26.01511001586914, "global_step": 357883, "epoch": 4311} {"train_loss": -26.020126342773438, "global_step": 357884, "epoch": 4311} {"train_loss": -26.028295516967773, "global_step": 357885, "epoch": 4311} {"train_loss": -26.0821475982666, "global_step": 357886, "epoch": 4311} {"train_loss": -25.76325798034668, "global_step": 357887, "epoch": 4311} {"train_loss": -25.88907814025879, "global_step": 357888, "epoch": 4311} {"train_loss": -25.596359252929688, "global_step": 357889, "epoch": 4311} {"train_loss": -25.6081600189209, "global_step": 357890, "epoch": 4311} {"train_loss": -25.51898765563965, "global_step": 357891, "epoch": 4311} {"train_loss": -25.773115158081055, "global_step": 357892, "epoch": 4311} {"train_loss": -26.023279190063477, "global_step": 357893, "epoch": 4311} {"train_loss": -25.890146255493164, "global_step": 357894, "epoch": 4311} {"train_loss": -26.210737113493035, "global_step": 357895, "epoch": 4311, "val_loss": 6673634.0} {"train_loss": -25.88514518737793, "global_step": 357896, "epoch": 4312} {"train_loss": -25.593427658081055, "global_step": 357897, "epoch": 4312} {"train_loss": -26.00233268737793, "global_step": 357898, "epoch": 4312} {"train_loss": -25.906757354736328, "global_step": 357899, "epoch": 4312} {"train_loss": -25.92774772644043, "global_step": 357900, "epoch": 4312} {"train_loss": -25.598417282104492, "global_step": 357901, "epoch": 4312} {"train_loss": -26.008060455322266, "global_step": 357902, "epoch": 4312} {"train_loss": -25.89093017578125, "global_step": 357903, "epoch": 4312} {"train_loss": -25.693063735961914, "global_step": 357904, "epoch": 4312} {"train_loss": -25.55006980895996, "global_step": 357905, "epoch": 4312} {"train_loss": -26.345590591430664, "global_step": 357906, "epoch": 4312} {"train_loss": -26.053979873657227, "global_step": 357907, "epoch": 4312} {"train_loss": -26.024866104125977, "global_step": 357908, "epoch": 4312} {"train_loss": -26.12064552307129, "global_step": 357909, "epoch": 4312} {"train_loss": -26.106796264648438, "global_step": 357910, "epoch": 4312} {"train_loss": -26.055551528930664, "global_step": 357911, "epoch": 4312} {"train_loss": -26.083524703979492, "global_step": 357912, "epoch": 4312} {"train_loss": -26.404882431030273, "global_step": 357913, "epoch": 4312} {"train_loss": -26.38007926940918, "global_step": 357914, "epoch": 4312} {"train_loss": -26.199872970581055, "global_step": 357915, "epoch": 4312} {"train_loss": -26.099517822265625, "global_step": 357916, "epoch": 4312} {"train_loss": -26.148895263671875, "global_step": 357917, "epoch": 4312} {"train_loss": -26.220458984375, "global_step": 357918, "epoch": 4312} {"train_loss": -26.363672256469727, "global_step": 357919, "epoch": 4312} {"train_loss": -26.241718292236328, "global_step": 357920, "epoch": 4312} {"train_loss": -26.056852340698242, "global_step": 357921, "epoch": 4312} {"train_loss": -26.06648063659668, "global_step": 357922, "epoch": 4312} {"train_loss": -26.306472778320312, "global_step": 357923, "epoch": 4312} {"train_loss": -26.300811767578125, "global_step": 357924, "epoch": 4312} {"train_loss": -26.447351455688477, "global_step": 357925, "epoch": 4312} {"train_loss": -26.65679359436035, "global_step": 357926, "epoch": 4312} {"train_loss": -26.164321899414062, "global_step": 357927, "epoch": 4312} {"train_loss": -26.846603393554688, "global_step": 357928, "epoch": 4312} {"train_loss": -26.433881759643555, "global_step": 357929, "epoch": 4312} {"train_loss": -26.46162223815918, "global_step": 357930, "epoch": 4312} {"train_loss": -26.717477798461914, "global_step": 357931, "epoch": 4312} {"train_loss": -26.279937744140625, "global_step": 357932, "epoch": 4312} {"train_loss": -26.57339859008789, "global_step": 357933, "epoch": 4312} {"train_loss": -26.38203239440918, "global_step": 357934, "epoch": 4312} {"train_loss": -26.716083526611328, "global_step": 357935, "epoch": 4312} {"train_loss": -26.4515323638916, "global_step": 357936, "epoch": 4312} {"train_loss": -26.164905548095703, "global_step": 357937, "epoch": 4312} {"train_loss": -26.354379653930664, "global_step": 357938, "epoch": 4312} {"train_loss": -25.702619552612305, "global_step": 357939, "epoch": 4312} {"train_loss": -24.784330368041992, "global_step": 357940, "epoch": 4312} {"train_loss": -23.881591796875, "global_step": 357941, "epoch": 4312} {"train_loss": -23.437891006469727, "global_step": 357942, "epoch": 4312} {"train_loss": -24.942426681518555, "global_step": 357943, "epoch": 4312} {"train_loss": -25.070404052734375, "global_step": 357944, "epoch": 4312} {"train_loss": -25.677459716796875, "global_step": 357945, "epoch": 4312} {"train_loss": -24.910465240478516, "global_step": 357946, "epoch": 4312} {"train_loss": -25.938495635986328, "global_step": 357947, "epoch": 4312} {"train_loss": -25.8419189453125, "global_step": 357948, "epoch": 4312} {"train_loss": -25.639036178588867, "global_step": 357949, "epoch": 4312} {"train_loss": -25.433073043823242, "global_step": 357950, "epoch": 4312} {"train_loss": -26.06422233581543, "global_step": 357951, "epoch": 4312} {"train_loss": -25.63323402404785, "global_step": 357952, "epoch": 4312} {"train_loss": -26.036396026611328, "global_step": 357953, "epoch": 4312} {"train_loss": -25.81614112854004, "global_step": 357954, "epoch": 4312} {"train_loss": -26.200653076171875, "global_step": 357955, "epoch": 4312} {"train_loss": -25.98176383972168, "global_step": 357956, "epoch": 4312} {"train_loss": -25.8409481048584, "global_step": 357957, "epoch": 4312} {"train_loss": -25.798704147338867, "global_step": 357958, "epoch": 4312} {"train_loss": -25.823795318603516, "global_step": 357959, "epoch": 4312} {"train_loss": -25.621122360229492, "global_step": 357960, "epoch": 4312} {"train_loss": -25.790857315063477, "global_step": 357961, "epoch": 4312} {"train_loss": -26.084089279174805, "global_step": 357962, "epoch": 4312} {"train_loss": -25.959125518798828, "global_step": 357963, "epoch": 4312} {"train_loss": -26.361509323120117, "global_step": 357964, "epoch": 4312} {"train_loss": -25.668548583984375, "global_step": 357965, "epoch": 4312} {"train_loss": -26.249731063842773, "global_step": 357966, "epoch": 4312} {"train_loss": -26.17207145690918, "global_step": 357967, "epoch": 4312} {"train_loss": -26.018362045288086, "global_step": 357968, "epoch": 4312} {"train_loss": -26.226856231689453, "global_step": 357969, "epoch": 4312} {"train_loss": -26.3272762298584, "global_step": 357970, "epoch": 4312} {"train_loss": -25.8445987701416, "global_step": 357971, "epoch": 4312} {"train_loss": -26.45440101623535, "global_step": 357972, "epoch": 4312} {"train_loss": -26.02919578552246, "global_step": 357973, "epoch": 4312} {"train_loss": -25.802892684936523, "global_step": 357974, "epoch": 4312} {"train_loss": -26.360382080078125, "global_step": 357975, "epoch": 4312} {"train_loss": -26.145526885986328, "global_step": 357976, "epoch": 4312} {"train_loss": -26.343189239501953, "global_step": 357977, "epoch": 4312} {"train_loss": -25.979908127382576, "global_step": 357978, "epoch": 4312, "val_loss": 6642510.0} {"train_loss": -25.753494262695312, "global_step": 357979, "epoch": 4313} {"train_loss": -24.618898391723633, "global_step": 357980, "epoch": 4313} {"train_loss": -24.887784957885742, "global_step": 357981, "epoch": 4313} {"train_loss": -25.8488712310791, "global_step": 357982, "epoch": 4313} {"train_loss": -25.3159236907959, "global_step": 357983, "epoch": 4313} {"train_loss": -26.012075424194336, "global_step": 357984, "epoch": 4313} {"train_loss": -25.9259033203125, "global_step": 357985, "epoch": 4313} {"train_loss": -25.926313400268555, "global_step": 357986, "epoch": 4313} {"train_loss": -25.314105987548828, "global_step": 357987, "epoch": 4313} {"train_loss": -26.115436553955078, "global_step": 357988, "epoch": 4313} {"train_loss": -25.9934139251709, "global_step": 357989, "epoch": 4313} {"train_loss": -26.03291893005371, "global_step": 357990, "epoch": 4313} {"train_loss": -26.201934814453125, "global_step": 357991, "epoch": 4313} {"train_loss": -25.95814323425293, "global_step": 357992, "epoch": 4313} {"train_loss": -25.926610946655273, "global_step": 357993, "epoch": 4313} {"train_loss": -25.841779708862305, "global_step": 357994, "epoch": 4313} {"train_loss": -25.966745376586914, "global_step": 357995, "epoch": 4313} {"train_loss": -25.725677490234375, "global_step": 357996, "epoch": 4313} {"train_loss": -26.22541618347168, "global_step": 357997, "epoch": 4313} {"train_loss": -26.21339225769043, "global_step": 357998, "epoch": 4313} {"train_loss": -25.886682510375977, "global_step": 357999, "epoch": 4313} {"train_loss": -25.988012313842773, "global_step": 358000, "epoch": 4313} {"train_loss": -26.165042877197266, "global_step": 358001, "epoch": 4313} {"train_loss": -26.077619552612305, "global_step": 358002, "epoch": 4313} {"train_loss": -26.330062866210938, "global_step": 358003, "epoch": 4313} {"train_loss": -25.51936149597168, "global_step": 358004, "epoch": 4313} {"train_loss": -26.28754997253418, "global_step": 358005, "epoch": 4313} {"train_loss": -26.211694717407227, "global_step": 358006, "epoch": 4313} {"train_loss": -25.995849609375, "global_step": 358007, "epoch": 4313} {"train_loss": -26.329193115234375, "global_step": 358008, "epoch": 4313} {"train_loss": -26.03309440612793, "global_step": 358009, "epoch": 4313} {"train_loss": -26.299530029296875, "global_step": 358010, "epoch": 4313} {"train_loss": -25.895727157592773, "global_step": 358011, "epoch": 4313} {"train_loss": -26.24452018737793, "global_step": 358012, "epoch": 4313} {"train_loss": -26.063323974609375, "global_step": 358013, "epoch": 4313} {"train_loss": -25.97946548461914, "global_step": 358014, "epoch": 4313} {"train_loss": -26.473270416259766, "global_step": 358015, "epoch": 4313} {"train_loss": -26.44235610961914, "global_step": 358016, "epoch": 4313} {"train_loss": -26.45193862915039, "global_step": 358017, "epoch": 4313} {"train_loss": -26.348196029663086, "global_step": 358018, "epoch": 4313} {"train_loss": -26.2725887298584, "global_step": 358019, "epoch": 4313} {"train_loss": -26.178150177001953, "global_step": 358020, "epoch": 4313} {"train_loss": -26.044469833374023, "global_step": 358021, "epoch": 4313} {"train_loss": -26.46063804626465, "global_step": 358022, "epoch": 4313} {"train_loss": -26.418304443359375, "global_step": 358023, "epoch": 4313} {"train_loss": -26.395282745361328, "global_step": 358024, "epoch": 4313} {"train_loss": -26.396886825561523, "global_step": 358025, "epoch": 4313} {"train_loss": -26.675048828125, "global_step": 358026, "epoch": 4313} {"train_loss": -26.32990074157715, "global_step": 358027, "epoch": 4313} {"train_loss": -25.945358276367188, "global_step": 358028, "epoch": 4313} {"train_loss": -26.328205108642578, "global_step": 358029, "epoch": 4313} {"train_loss": -26.731937408447266, "global_step": 358030, "epoch": 4313} {"train_loss": -26.519683837890625, "global_step": 358031, "epoch": 4313} {"train_loss": -26.28106689453125, "global_step": 358032, "epoch": 4313} {"train_loss": -26.266586303710938, "global_step": 358033, "epoch": 4313} {"train_loss": -26.339630126953125, "global_step": 358034, "epoch": 4313} {"train_loss": -26.72413444519043, "global_step": 358035, "epoch": 4313} {"train_loss": -26.00339698791504, "global_step": 358036, "epoch": 4313} {"train_loss": -26.167236328125, "global_step": 358037, "epoch": 4313} {"train_loss": -26.445459365844727, "global_step": 358038, "epoch": 4313} {"train_loss": -26.569700241088867, "global_step": 358039, "epoch": 4313} {"train_loss": -26.5085391998291, "global_step": 358040, "epoch": 4313} {"train_loss": -26.617761611938477, "global_step": 358041, "epoch": 4313} {"train_loss": -26.50882339477539, "global_step": 358042, "epoch": 4313} {"train_loss": -26.3006534576416, "global_step": 358043, "epoch": 4313} {"train_loss": -26.11322593688965, "global_step": 358044, "epoch": 4313} {"train_loss": -26.174829483032227, "global_step": 358045, "epoch": 4313} {"train_loss": -26.70221519470215, "global_step": 358046, "epoch": 4313} {"train_loss": -26.379291534423828, "global_step": 358047, "epoch": 4313} {"train_loss": -26.390966415405273, "global_step": 358048, "epoch": 4313} {"train_loss": -26.611557006835938, "global_step": 358049, "epoch": 4313} {"train_loss": -26.185911178588867, "global_step": 358050, "epoch": 4313} {"train_loss": -26.41737937927246, "global_step": 358051, "epoch": 4313} {"train_loss": -26.090503692626953, "global_step": 358052, "epoch": 4313} {"train_loss": -26.02979850769043, "global_step": 358053, "epoch": 4313} {"train_loss": -26.300718307495117, "global_step": 358054, "epoch": 4313} {"train_loss": -26.489973068237305, "global_step": 358055, "epoch": 4313} {"train_loss": -26.227258682250977, "global_step": 358056, "epoch": 4313} {"train_loss": -26.240476608276367, "global_step": 358057, "epoch": 4313} {"train_loss": -25.654748916625977, "global_step": 358058, "epoch": 4313} {"train_loss": -25.57796859741211, "global_step": 358059, "epoch": 4313} {"train_loss": -26.299718856811523, "global_step": 358060, "epoch": 4313} {"train_loss": -26.15621785083449, "global_step": 358061, "epoch": 4313, "val_loss": 6579996.0} {"train_loss": -25.07914161682129, "global_step": 358062, "epoch": 4314} {"train_loss": -25.114479064941406, "global_step": 358063, "epoch": 4314} {"train_loss": -25.8291015625, "global_step": 358064, "epoch": 4314} {"train_loss": -25.119064331054688, "global_step": 358065, "epoch": 4314} {"train_loss": -25.880298614501953, "global_step": 358066, "epoch": 4314} {"train_loss": -25.42203712463379, "global_step": 358067, "epoch": 4314} {"train_loss": -25.708166122436523, "global_step": 358068, "epoch": 4314} {"train_loss": -25.529117584228516, "global_step": 358069, "epoch": 4314} {"train_loss": -25.856918334960938, "global_step": 358070, "epoch": 4314} {"train_loss": -25.624601364135742, "global_step": 358071, "epoch": 4314} {"train_loss": -25.917449951171875, "global_step": 358072, "epoch": 4314} {"train_loss": -25.431161880493164, "global_step": 358073, "epoch": 4314} {"train_loss": -25.796682357788086, "global_step": 358074, "epoch": 4314} {"train_loss": -25.88714599609375, "global_step": 358075, "epoch": 4314} {"train_loss": -26.17449951171875, "global_step": 358076, "epoch": 4314} {"train_loss": -25.50625228881836, "global_step": 358077, "epoch": 4314} {"train_loss": -25.929548263549805, "global_step": 358078, "epoch": 4314} {"train_loss": -25.9097843170166, "global_step": 358079, "epoch": 4314} {"train_loss": -25.9945068359375, "global_step": 358080, "epoch": 4314} {"train_loss": -25.851612091064453, "global_step": 358081, "epoch": 4314} {"train_loss": -25.5672664642334, "global_step": 358082, "epoch": 4314} {"train_loss": -26.005786895751953, "global_step": 358083, "epoch": 4314} {"train_loss": -26.33559226989746, "global_step": 358084, "epoch": 4314} {"train_loss": -25.96323585510254, "global_step": 358085, "epoch": 4314} {"train_loss": -26.187957763671875, "global_step": 358086, "epoch": 4314} {"train_loss": -26.040613174438477, "global_step": 358087, "epoch": 4314} {"train_loss": -26.250940322875977, "global_step": 358088, "epoch": 4314} {"train_loss": -26.18915367126465, "global_step": 358089, "epoch": 4314} {"train_loss": -26.192670822143555, "global_step": 358090, "epoch": 4314} {"train_loss": -26.612333297729492, "global_step": 358091, "epoch": 4314} {"train_loss": -26.15852165222168, "global_step": 358092, "epoch": 4314} {"train_loss": -26.3064022064209, "global_step": 358093, "epoch": 4314} {"train_loss": -26.53352928161621, "global_step": 358094, "epoch": 4314} {"train_loss": -26.07354164123535, "global_step": 358095, "epoch": 4314} {"train_loss": -26.144357681274414, "global_step": 358096, "epoch": 4314} {"train_loss": -26.33416175842285, "global_step": 358097, "epoch": 4314} {"train_loss": -26.17780113220215, "global_step": 358098, "epoch": 4314} {"train_loss": -26.560516357421875, "global_step": 358099, "epoch": 4314} {"train_loss": -26.00836181640625, "global_step": 358100, "epoch": 4314} {"train_loss": -26.4581241607666, "global_step": 358101, "epoch": 4314} {"train_loss": -26.226194381713867, "global_step": 358102, "epoch": 4314} {"train_loss": -26.31302833557129, "global_step": 358103, "epoch": 4314} {"train_loss": -26.412002563476562, "global_step": 358104, "epoch": 4314} {"train_loss": -26.283935546875, "global_step": 358105, "epoch": 4314} {"train_loss": -26.188379287719727, "global_step": 358106, "epoch": 4314} {"train_loss": -26.541563034057617, "global_step": 358107, "epoch": 4314} {"train_loss": -26.571857452392578, "global_step": 358108, "epoch": 4314} {"train_loss": -25.938922882080078, "global_step": 358109, "epoch": 4314} {"train_loss": -26.54854393005371, "global_step": 358110, "epoch": 4314} {"train_loss": -26.30511474609375, "global_step": 358111, "epoch": 4314} {"train_loss": -25.932897567749023, "global_step": 358112, "epoch": 4314} {"train_loss": -26.09784507751465, "global_step": 358113, "epoch": 4314} {"train_loss": -26.58453941345215, "global_step": 358114, "epoch": 4314} {"train_loss": -26.448795318603516, "global_step": 358115, "epoch": 4314} {"train_loss": -26.09929847717285, "global_step": 358116, "epoch": 4314} {"train_loss": -26.325429916381836, "global_step": 358117, "epoch": 4314} {"train_loss": -25.892913818359375, "global_step": 358118, "epoch": 4314} {"train_loss": -26.58835220336914, "global_step": 358119, "epoch": 4314} {"train_loss": -26.339996337890625, "global_step": 358120, "epoch": 4314} {"train_loss": -26.60160255432129, "global_step": 358121, "epoch": 4314} {"train_loss": -26.04646110534668, "global_step": 358122, "epoch": 4314} {"train_loss": -26.6597957611084, "global_step": 358123, "epoch": 4314} {"train_loss": -26.63673973083496, "global_step": 358124, "epoch": 4314} {"train_loss": -26.379179000854492, "global_step": 358125, "epoch": 4314} {"train_loss": -26.570547103881836, "global_step": 358126, "epoch": 4314} {"train_loss": -26.493051528930664, "global_step": 358127, "epoch": 4314} {"train_loss": -26.43363380432129, "global_step": 358128, "epoch": 4314} {"train_loss": -25.771575927734375, "global_step": 358129, "epoch": 4314} {"train_loss": -26.36870765686035, "global_step": 358130, "epoch": 4314} {"train_loss": -26.138111114501953, "global_step": 358131, "epoch": 4314} {"train_loss": -26.29855728149414, "global_step": 358132, "epoch": 4314} {"train_loss": -26.290781021118164, "global_step": 358133, "epoch": 4314} {"train_loss": -26.317285537719727, "global_step": 358134, "epoch": 4314} {"train_loss": -26.149646759033203, "global_step": 358135, "epoch": 4314} {"train_loss": -26.394678115844727, "global_step": 358136, "epoch": 4314} {"train_loss": -25.397695541381836, "global_step": 358137, "epoch": 4314} {"train_loss": -23.988754272460938, "global_step": 358138, "epoch": 4314} {"train_loss": -23.562501907348633, "global_step": 358139, "epoch": 4314} {"train_loss": -24.826934814453125, "global_step": 358140, "epoch": 4314} {"train_loss": -26.072132110595703, "global_step": 358141, "epoch": 4314} {"train_loss": -25.593494415283203, "global_step": 358142, "epoch": 4314} {"train_loss": -26.053319931030273, "global_step": 358143, "epoch": 4314} {"train_loss": -26.05216768563512, "global_step": 358144, "epoch": 4314, "val_loss": 6553074.0} {"train_loss": -24.644460678100586, "global_step": 358145, "epoch": 4315} {"train_loss": -25.66983985900879, "global_step": 358146, "epoch": 4315} {"train_loss": -24.847015380859375, "global_step": 358147, "epoch": 4315} {"train_loss": -25.829391479492188, "global_step": 358148, "epoch": 4315} {"train_loss": -25.598268508911133, "global_step": 358149, "epoch": 4315} {"train_loss": -25.565542221069336, "global_step": 358150, "epoch": 4315} {"train_loss": -25.47416877746582, "global_step": 358151, "epoch": 4315} {"train_loss": -25.693058013916016, "global_step": 358152, "epoch": 4315} {"train_loss": -25.309772491455078, "global_step": 358153, "epoch": 4315} {"train_loss": -25.825841903686523, "global_step": 358154, "epoch": 4315} {"train_loss": -25.847864151000977, "global_step": 358155, "epoch": 4315} {"train_loss": -26.012176513671875, "global_step": 358156, "epoch": 4315} {"train_loss": -25.524349212646484, "global_step": 358157, "epoch": 4315} {"train_loss": -25.97530174255371, "global_step": 358158, "epoch": 4315} {"train_loss": -25.680822372436523, "global_step": 358159, "epoch": 4315} {"train_loss": -25.618452072143555, "global_step": 358160, "epoch": 4315} {"train_loss": -25.754377365112305, "global_step": 358161, "epoch": 4315} {"train_loss": -25.14606285095215, "global_step": 358162, "epoch": 4315} {"train_loss": -25.672576904296875, "global_step": 358163, "epoch": 4315} {"train_loss": -26.060590744018555, "global_step": 358164, "epoch": 4315} {"train_loss": -25.923547744750977, "global_step": 358165, "epoch": 4315} {"train_loss": -25.9468936920166, "global_step": 358166, "epoch": 4315} {"train_loss": -26.18168067932129, "global_step": 358167, "epoch": 4315} {"train_loss": -26.537445068359375, "global_step": 358168, "epoch": 4315} {"train_loss": -26.042404174804688, "global_step": 358169, "epoch": 4315} {"train_loss": -25.846012115478516, "global_step": 358170, "epoch": 4315} {"train_loss": -26.45586585998535, "global_step": 358171, "epoch": 4315} {"train_loss": -25.837970733642578, "global_step": 358172, "epoch": 4315} {"train_loss": -26.096357345581055, "global_step": 358173, "epoch": 4315} {"train_loss": -26.130661010742188, "global_step": 358174, "epoch": 4315} {"train_loss": -26.282567977905273, "global_step": 358175, "epoch": 4315} {"train_loss": -25.731367111206055, "global_step": 358176, "epoch": 4315} {"train_loss": -26.24847412109375, "global_step": 358177, "epoch": 4315} {"train_loss": -25.879987716674805, "global_step": 358178, "epoch": 4315} {"train_loss": -26.085336685180664, "global_step": 358179, "epoch": 4315} {"train_loss": -26.3228816986084, "global_step": 358180, "epoch": 4315} {"train_loss": -26.2296085357666, "global_step": 358181, "epoch": 4315} {"train_loss": -26.047189712524414, "global_step": 358182, "epoch": 4315} {"train_loss": -26.094675064086914, "global_step": 358183, "epoch": 4315} {"train_loss": -26.17023277282715, "global_step": 358184, "epoch": 4315} {"train_loss": -26.208480834960938, "global_step": 358185, "epoch": 4315} {"train_loss": -26.211530685424805, "global_step": 358186, "epoch": 4315} {"train_loss": -26.35135841369629, "global_step": 358187, "epoch": 4315} {"train_loss": -26.2496337890625, "global_step": 358188, "epoch": 4315} {"train_loss": -26.468191146850586, "global_step": 358189, "epoch": 4315} {"train_loss": -26.25996971130371, "global_step": 358190, "epoch": 4315} {"train_loss": -26.268115997314453, "global_step": 358191, "epoch": 4315} {"train_loss": -26.026296615600586, "global_step": 358192, "epoch": 4315} {"train_loss": -26.08921241760254, "global_step": 358193, "epoch": 4315} {"train_loss": -26.21619987487793, "global_step": 358194, "epoch": 4315} {"train_loss": -25.960514068603516, "global_step": 358195, "epoch": 4315} {"train_loss": -26.418859481811523, "global_step": 358196, "epoch": 4315} {"train_loss": -26.28834342956543, "global_step": 358197, "epoch": 4315} {"train_loss": -26.31683349609375, "global_step": 358198, "epoch": 4315} {"train_loss": -26.2620906829834, "global_step": 358199, "epoch": 4315} {"train_loss": -26.29005241394043, "global_step": 358200, "epoch": 4315} {"train_loss": -26.489990234375, "global_step": 358201, "epoch": 4315} {"train_loss": -26.32697105407715, "global_step": 358202, "epoch": 4315} {"train_loss": -26.326879501342773, "global_step": 358203, "epoch": 4315} {"train_loss": -26.316816329956055, "global_step": 358204, "epoch": 4315} {"train_loss": -26.335147857666016, "global_step": 358205, "epoch": 4315} {"train_loss": -26.366474151611328, "global_step": 358206, "epoch": 4315} {"train_loss": -26.538227081298828, "global_step": 358207, "epoch": 4315} {"train_loss": -26.715139389038086, "global_step": 358208, "epoch": 4315} {"train_loss": -26.208654403686523, "global_step": 358209, "epoch": 4315} {"train_loss": -26.500823974609375, "global_step": 358210, "epoch": 4315} {"train_loss": -26.545942306518555, "global_step": 358211, "epoch": 4315} {"train_loss": -26.59075927734375, "global_step": 358212, "epoch": 4315} {"train_loss": -26.47854995727539, "global_step": 358213, "epoch": 4315} {"train_loss": -26.26409339904785, "global_step": 358214, "epoch": 4315} {"train_loss": -26.39063835144043, "global_step": 358215, "epoch": 4315} {"train_loss": -26.467748641967773, "global_step": 358216, "epoch": 4315} {"train_loss": -26.474218368530273, "global_step": 358217, "epoch": 4315} {"train_loss": -26.310346603393555, "global_step": 358218, "epoch": 4315} {"train_loss": -26.211023330688477, "global_step": 358219, "epoch": 4315} {"train_loss": -26.345197677612305, "global_step": 358220, "epoch": 4315} {"train_loss": -26.45464515686035, "global_step": 358221, "epoch": 4315} {"train_loss": -26.1968994140625, "global_step": 358222, "epoch": 4315} {"train_loss": -25.984128952026367, "global_step": 358223, "epoch": 4315} {"train_loss": -26.473974227905273, "global_step": 358224, "epoch": 4315} {"train_loss": -26.203641891479492, "global_step": 358225, "epoch": 4315} {"train_loss": -25.978408813476562, "global_step": 358226, "epoch": 4315} {"train_loss": -26.091942752700255, "global_step": 358227, "epoch": 4315, "val_loss": 6530146.0} {"train_loss": -24.8216552734375, "global_step": 358228, "epoch": 4316} {"train_loss": -23.671918869018555, "global_step": 358229, "epoch": 4316} {"train_loss": -23.682619094848633, "global_step": 358230, "epoch": 4316} {"train_loss": -25.159961700439453, "global_step": 358231, "epoch": 4316} {"train_loss": -24.38777732849121, "global_step": 358232, "epoch": 4316} {"train_loss": -24.290241241455078, "global_step": 358233, "epoch": 4316} {"train_loss": -25.17359161376953, "global_step": 358234, "epoch": 4316} {"train_loss": -24.283157348632812, "global_step": 358235, "epoch": 4316} {"train_loss": -24.673900604248047, "global_step": 358236, "epoch": 4316} {"train_loss": -25.11676025390625, "global_step": 358237, "epoch": 4316} {"train_loss": -24.917097091674805, "global_step": 358238, "epoch": 4316} {"train_loss": -24.881528854370117, "global_step": 358239, "epoch": 4316} {"train_loss": -25.188833236694336, "global_step": 358240, "epoch": 4316} {"train_loss": -25.110748291015625, "global_step": 358241, "epoch": 4316} {"train_loss": -25.42477035522461, "global_step": 358242, "epoch": 4316} {"train_loss": -25.532888412475586, "global_step": 358243, "epoch": 4316} {"train_loss": -25.74609375, "global_step": 358244, "epoch": 4316} {"train_loss": -25.485946655273438, "global_step": 358245, "epoch": 4316} {"train_loss": -25.534000396728516, "global_step": 358246, "epoch": 4316} {"train_loss": -25.434524536132812, "global_step": 358247, "epoch": 4316} {"train_loss": -25.59989356994629, "global_step": 358248, "epoch": 4316} {"train_loss": -25.77826499938965, "global_step": 358249, "epoch": 4316} {"train_loss": -25.343652725219727, "global_step": 358250, "epoch": 4316} {"train_loss": -25.697986602783203, "global_step": 358251, "epoch": 4316} {"train_loss": -25.797870635986328, "global_step": 358252, "epoch": 4316} {"train_loss": -25.76967430114746, "global_step": 358253, "epoch": 4316} {"train_loss": -26.131702423095703, "global_step": 358254, "epoch": 4316} {"train_loss": -26.08478355407715, "global_step": 358255, "epoch": 4316} {"train_loss": -25.958032608032227, "global_step": 358256, "epoch": 4316} {"train_loss": -25.744794845581055, "global_step": 358257, "epoch": 4316} {"train_loss": -26.059629440307617, "global_step": 358258, "epoch": 4316} {"train_loss": -25.971893310546875, "global_step": 358259, "epoch": 4316} {"train_loss": -25.91597557067871, "global_step": 358260, "epoch": 4316} {"train_loss": -25.974960327148438, "global_step": 358261, "epoch": 4316} {"train_loss": -26.248361587524414, "global_step": 358262, "epoch": 4316} {"train_loss": -26.130155563354492, "global_step": 358263, "epoch": 4316} {"train_loss": -26.08502197265625, "global_step": 358264, "epoch": 4316} {"train_loss": -26.132904052734375, "global_step": 358265, "epoch": 4316} {"train_loss": -26.000690460205078, "global_step": 358266, "epoch": 4316} {"train_loss": -26.128644943237305, "global_step": 358267, "epoch": 4316} {"train_loss": -25.98392677307129, "global_step": 358268, "epoch": 4316} {"train_loss": -26.563161849975586, "global_step": 358269, "epoch": 4316} {"train_loss": -26.451766967773438, "global_step": 358270, "epoch": 4316} {"train_loss": -26.21565818786621, "global_step": 358271, "epoch": 4316} {"train_loss": -26.066381454467773, "global_step": 358272, "epoch": 4316} {"train_loss": -26.332794189453125, "global_step": 358273, "epoch": 4316} {"train_loss": -26.39032554626465, "global_step": 358274, "epoch": 4316} {"train_loss": -25.975149154663086, "global_step": 358275, "epoch": 4316} {"train_loss": -26.2520751953125, "global_step": 358276, "epoch": 4316} {"train_loss": -26.948766708374023, "global_step": 358277, "epoch": 4316} {"train_loss": -26.294294357299805, "global_step": 358278, "epoch": 4316} {"train_loss": -26.538116455078125, "global_step": 358279, "epoch": 4316} {"train_loss": -26.3314208984375, "global_step": 358280, "epoch": 4316} {"train_loss": -26.325061798095703, "global_step": 358281, "epoch": 4316} {"train_loss": -26.461761474609375, "global_step": 358282, "epoch": 4316} {"train_loss": -26.391265869140625, "global_step": 358283, "epoch": 4316} {"train_loss": -26.248828887939453, "global_step": 358284, "epoch": 4316} {"train_loss": -26.225107192993164, "global_step": 358285, "epoch": 4316} {"train_loss": -26.349090576171875, "global_step": 358286, "epoch": 4316} {"train_loss": -26.617578506469727, "global_step": 358287, "epoch": 4316} {"train_loss": -26.154626846313477, "global_step": 358288, "epoch": 4316} {"train_loss": -26.347625732421875, "global_step": 358289, "epoch": 4316} {"train_loss": -26.200092315673828, "global_step": 358290, "epoch": 4316} {"train_loss": -25.96790885925293, "global_step": 358291, "epoch": 4316} {"train_loss": -25.58034324645996, "global_step": 358292, "epoch": 4316} {"train_loss": -26.148544311523438, "global_step": 358293, "epoch": 4316} {"train_loss": -26.228870391845703, "global_step": 358294, "epoch": 4316} {"train_loss": -26.159353256225586, "global_step": 358295, "epoch": 4316} {"train_loss": -26.283065795898438, "global_step": 358296, "epoch": 4316} {"train_loss": -25.8753719329834, "global_step": 358297, "epoch": 4316} {"train_loss": -25.762784957885742, "global_step": 358298, "epoch": 4316} {"train_loss": -26.62505531311035, "global_step": 358299, "epoch": 4316} {"train_loss": -26.221176147460938, "global_step": 358300, "epoch": 4316} {"train_loss": -25.834142684936523, "global_step": 358301, "epoch": 4316} {"train_loss": -25.825525283813477, "global_step": 358302, "epoch": 4316} {"train_loss": -26.22564697265625, "global_step": 358303, "epoch": 4316} {"train_loss": -26.176910400390625, "global_step": 358304, "epoch": 4316} {"train_loss": -26.514089584350586, "global_step": 358305, "epoch": 4316} {"train_loss": -25.627029418945312, "global_step": 358306, "epoch": 4316} {"train_loss": -26.524307250976562, "global_step": 358307, "epoch": 4316} {"train_loss": -25.938879013061523, "global_step": 358308, "epoch": 4316} {"train_loss": -26.486328125, "global_step": 358309, "epoch": 4316} {"train_loss": -25.841017941394483, "global_step": 358310, "epoch": 4316, "val_loss": 6472018.0} {"train_loss": -25.1279239654541, "global_step": 358311, "epoch": 4317} {"train_loss": -25.762781143188477, "global_step": 358312, "epoch": 4317} {"train_loss": -24.531644821166992, "global_step": 358313, "epoch": 4317} {"train_loss": -25.545686721801758, "global_step": 358314, "epoch": 4317} {"train_loss": -25.606115341186523, "global_step": 358315, "epoch": 4317} {"train_loss": -25.680164337158203, "global_step": 358316, "epoch": 4317} {"train_loss": -25.83904457092285, "global_step": 358317, "epoch": 4317} {"train_loss": -25.1796932220459, "global_step": 358318, "epoch": 4317} {"train_loss": -25.8604736328125, "global_step": 358319, "epoch": 4317} {"train_loss": -25.390666961669922, "global_step": 358320, "epoch": 4317} {"train_loss": -25.885833740234375, "global_step": 358321, "epoch": 4317} {"train_loss": -25.491657257080078, "global_step": 358322, "epoch": 4317} {"train_loss": -25.6893310546875, "global_step": 358323, "epoch": 4317} {"train_loss": -26.0291690826416, "global_step": 358324, "epoch": 4317} {"train_loss": -25.80537223815918, "global_step": 358325, "epoch": 4317} {"train_loss": -25.842498779296875, "global_step": 358326, "epoch": 4317} {"train_loss": -25.889209747314453, "global_step": 358327, "epoch": 4317} {"train_loss": -26.29438591003418, "global_step": 358328, "epoch": 4317} {"train_loss": -25.846866607666016, "global_step": 358329, "epoch": 4317} {"train_loss": -25.968809127807617, "global_step": 358330, "epoch": 4317} {"train_loss": -26.11810874938965, "global_step": 358331, "epoch": 4317} {"train_loss": -25.832611083984375, "global_step": 358332, "epoch": 4317} {"train_loss": -26.286487579345703, "global_step": 358333, "epoch": 4317} {"train_loss": -26.121408462524414, "global_step": 358334, "epoch": 4317} {"train_loss": -25.857379913330078, "global_step": 358335, "epoch": 4317} {"train_loss": -25.772733688354492, "global_step": 358336, "epoch": 4317} {"train_loss": -26.297269821166992, "global_step": 358337, "epoch": 4317} {"train_loss": -25.936201095581055, "global_step": 358338, "epoch": 4317} {"train_loss": -26.266454696655273, "global_step": 358339, "epoch": 4317} {"train_loss": -26.085418701171875, "global_step": 358340, "epoch": 4317} {"train_loss": -26.316314697265625, "global_step": 358341, "epoch": 4317} {"train_loss": -26.280553817749023, "global_step": 358342, "epoch": 4317} {"train_loss": -26.02888298034668, "global_step": 358343, "epoch": 4317} {"train_loss": -26.234533309936523, "global_step": 358344, "epoch": 4317} {"train_loss": -26.324758529663086, "global_step": 358345, "epoch": 4317} {"train_loss": -26.005634307861328, "global_step": 358346, "epoch": 4317} {"train_loss": -26.003772735595703, "global_step": 358347, "epoch": 4317} {"train_loss": -26.228504180908203, "global_step": 358348, "epoch": 4317} {"train_loss": -26.464160919189453, "global_step": 358349, "epoch": 4317} {"train_loss": -26.120563507080078, "global_step": 358350, "epoch": 4317} {"train_loss": -26.623260498046875, "global_step": 358351, "epoch": 4317} {"train_loss": -26.295459747314453, "global_step": 358352, "epoch": 4317} {"train_loss": -26.17098045349121, "global_step": 358353, "epoch": 4317} {"train_loss": -26.32977294921875, "global_step": 358354, "epoch": 4317} {"train_loss": -26.35296630859375, "global_step": 358355, "epoch": 4317} {"train_loss": -26.389768600463867, "global_step": 358356, "epoch": 4317} {"train_loss": -26.266576766967773, "global_step": 358357, "epoch": 4317} {"train_loss": -26.29115104675293, "global_step": 358358, "epoch": 4317} {"train_loss": -26.335905075073242, "global_step": 358359, "epoch": 4317} {"train_loss": -26.348514556884766, "global_step": 358360, "epoch": 4317} {"train_loss": -25.722888946533203, "global_step": 358361, "epoch": 4317} {"train_loss": -25.61893653869629, "global_step": 358362, "epoch": 4317} {"train_loss": -26.135236740112305, "global_step": 358363, "epoch": 4317} {"train_loss": -25.964893341064453, "global_step": 358364, "epoch": 4317} {"train_loss": -26.287036895751953, "global_step": 358365, "epoch": 4317} {"train_loss": -26.447641372680664, "global_step": 358366, "epoch": 4317} {"train_loss": -26.245046615600586, "global_step": 358367, "epoch": 4317} {"train_loss": -25.882001876831055, "global_step": 358368, "epoch": 4317} {"train_loss": -26.104150772094727, "global_step": 358369, "epoch": 4317} {"train_loss": -26.34571647644043, "global_step": 358370, "epoch": 4317} {"train_loss": -26.109663009643555, "global_step": 358371, "epoch": 4317} {"train_loss": -26.769439697265625, "global_step": 358372, "epoch": 4317} {"train_loss": -26.498197555541992, "global_step": 358373, "epoch": 4317} {"train_loss": -26.370223999023438, "global_step": 358374, "epoch": 4317} {"train_loss": -26.19573402404785, "global_step": 358375, "epoch": 4317} {"train_loss": -26.20391845703125, "global_step": 358376, "epoch": 4317} {"train_loss": -26.5924072265625, "global_step": 358377, "epoch": 4317} {"train_loss": -26.51801109313965, "global_step": 358378, "epoch": 4317} {"train_loss": -26.222885131835938, "global_step": 358379, "epoch": 4317} {"train_loss": -26.169660568237305, "global_step": 358380, "epoch": 4317} {"train_loss": -26.39274024963379, "global_step": 358381, "epoch": 4317} {"train_loss": -26.40445327758789, "global_step": 358382, "epoch": 4317} {"train_loss": -26.36783790588379, "global_step": 358383, "epoch": 4317} {"train_loss": -26.173023223876953, "global_step": 358384, "epoch": 4317} {"train_loss": -26.271154403686523, "global_step": 358385, "epoch": 4317} {"train_loss": -26.012195587158203, "global_step": 358386, "epoch": 4317} {"train_loss": -26.492755889892578, "global_step": 358387, "epoch": 4317} {"train_loss": -26.286270141601562, "global_step": 358388, "epoch": 4317} {"train_loss": -26.063556671142578, "global_step": 358389, "epoch": 4317} {"train_loss": -26.1578369140625, "global_step": 358390, "epoch": 4317} {"train_loss": -26.11740493774414, "global_step": 358391, "epoch": 4317} {"train_loss": -26.4404354095459, "global_step": 358392, "epoch": 4317} {"train_loss": -26.117744193019636, "global_step": 358393, "epoch": 4317, "val_loss": 6593464.0} {"train_loss": -22.470956802368164, "global_step": 358394, "epoch": 4318} {"train_loss": -24.853553771972656, "global_step": 358395, "epoch": 4318} {"train_loss": -25.9061222076416, "global_step": 358396, "epoch": 4318} {"train_loss": -25.0576229095459, "global_step": 358397, "epoch": 4318} {"train_loss": -25.599103927612305, "global_step": 358398, "epoch": 4318} {"train_loss": -25.563495635986328, "global_step": 358399, "epoch": 4318} {"train_loss": -25.821252822875977, "global_step": 358400, "epoch": 4318} {"train_loss": -25.34891128540039, "global_step": 358401, "epoch": 4318} {"train_loss": -25.369709014892578, "global_step": 358402, "epoch": 4318} {"train_loss": -25.368383407592773, "global_step": 358403, "epoch": 4318} {"train_loss": -24.99269676208496, "global_step": 358404, "epoch": 4318} {"train_loss": -25.30869483947754, "global_step": 358405, "epoch": 4318} {"train_loss": -25.52564239501953, "global_step": 358406, "epoch": 4318} {"train_loss": -25.516464233398438, "global_step": 358407, "epoch": 4318} {"train_loss": -25.898218154907227, "global_step": 358408, "epoch": 4318} {"train_loss": -25.8362979888916, "global_step": 358409, "epoch": 4318} {"train_loss": -25.84229850769043, "global_step": 358410, "epoch": 4318} {"train_loss": -25.866933822631836, "global_step": 358411, "epoch": 4318} {"train_loss": -26.1469783782959, "global_step": 358412, "epoch": 4318} {"train_loss": -26.050207138061523, "global_step": 358413, "epoch": 4318} {"train_loss": -25.857572555541992, "global_step": 358414, "epoch": 4318} {"train_loss": -26.17791748046875, "global_step": 358415, "epoch": 4318} {"train_loss": -25.7661190032959, "global_step": 358416, "epoch": 4318} {"train_loss": -25.994613647460938, "global_step": 358417, "epoch": 4318} {"train_loss": -26.049299240112305, "global_step": 358418, "epoch": 4318} {"train_loss": -25.687423706054688, "global_step": 358419, "epoch": 4318} {"train_loss": -25.84429359436035, "global_step": 358420, "epoch": 4318} {"train_loss": -26.498849868774414, "global_step": 358421, "epoch": 4318} {"train_loss": -25.881895065307617, "global_step": 358422, "epoch": 4318} {"train_loss": -26.372217178344727, "global_step": 358423, "epoch": 4318} {"train_loss": -25.578235626220703, "global_step": 358424, "epoch": 4318} {"train_loss": -26.0540828704834, "global_step": 358425, "epoch": 4318} {"train_loss": -26.5800838470459, "global_step": 358426, "epoch": 4318} {"train_loss": -26.092803955078125, "global_step": 358427, "epoch": 4318} {"train_loss": -25.959272384643555, "global_step": 358428, "epoch": 4318} {"train_loss": -26.419754028320312, "global_step": 358429, "epoch": 4318} {"train_loss": -26.233449935913086, "global_step": 358430, "epoch": 4318} {"train_loss": -26.214645385742188, "global_step": 358431, "epoch": 4318} {"train_loss": -26.2016658782959, "global_step": 358432, "epoch": 4318} {"train_loss": -26.519412994384766, "global_step": 358433, "epoch": 4318} {"train_loss": -26.235523223876953, "global_step": 358434, "epoch": 4318} {"train_loss": -25.931188583374023, "global_step": 358435, "epoch": 4318} {"train_loss": -25.841114044189453, "global_step": 358436, "epoch": 4318} {"train_loss": -26.31673240661621, "global_step": 358437, "epoch": 4318} {"train_loss": -26.13755226135254, "global_step": 358438, "epoch": 4318} {"train_loss": -26.639028549194336, "global_step": 358439, "epoch": 4318} {"train_loss": -26.198108673095703, "global_step": 358440, "epoch": 4318} {"train_loss": -26.282379150390625, "global_step": 358441, "epoch": 4318} {"train_loss": -26.30375099182129, "global_step": 358442, "epoch": 4318} {"train_loss": -25.985502243041992, "global_step": 358443, "epoch": 4318} {"train_loss": -25.895263671875, "global_step": 358444, "epoch": 4318} {"train_loss": -26.231128692626953, "global_step": 358445, "epoch": 4318} {"train_loss": -26.015430450439453, "global_step": 358446, "epoch": 4318} {"train_loss": -26.21044921875, "global_step": 358447, "epoch": 4318} {"train_loss": -26.42484474182129, "global_step": 358448, "epoch": 4318} {"train_loss": -26.42469596862793, "global_step": 358449, "epoch": 4318} {"train_loss": -25.90923500061035, "global_step": 358450, "epoch": 4318} {"train_loss": -26.170133590698242, "global_step": 358451, "epoch": 4318} {"train_loss": -26.519102096557617, "global_step": 358452, "epoch": 4318} {"train_loss": -26.134469985961914, "global_step": 358453, "epoch": 4318} {"train_loss": -26.06085205078125, "global_step": 358454, "epoch": 4318} {"train_loss": -25.84222984313965, "global_step": 358455, "epoch": 4318} {"train_loss": -26.03497886657715, "global_step": 358456, "epoch": 4318} {"train_loss": -25.9706974029541, "global_step": 358457, "epoch": 4318} {"train_loss": -26.165130615234375, "global_step": 358458, "epoch": 4318} {"train_loss": -26.157934188842773, "global_step": 358459, "epoch": 4318} {"train_loss": -26.215930938720703, "global_step": 358460, "epoch": 4318} {"train_loss": -26.160917282104492, "global_step": 358461, "epoch": 4318} {"train_loss": -26.08086585998535, "global_step": 358462, "epoch": 4318} {"train_loss": -26.128202438354492, "global_step": 358463, "epoch": 4318} {"train_loss": -26.306232452392578, "global_step": 358464, "epoch": 4318} {"train_loss": -26.313032150268555, "global_step": 358465, "epoch": 4318} {"train_loss": -26.29432487487793, "global_step": 358466, "epoch": 4318} {"train_loss": -26.09819984436035, "global_step": 358467, "epoch": 4318} {"train_loss": -26.15158462524414, "global_step": 358468, "epoch": 4318} {"train_loss": -26.25348472595215, "global_step": 358469, "epoch": 4318} {"train_loss": -26.342077255249023, "global_step": 358470, "epoch": 4318} {"train_loss": -26.16181755065918, "global_step": 358471, "epoch": 4318} {"train_loss": -25.6853084564209, "global_step": 358472, "epoch": 4318} {"train_loss": -25.922977447509766, "global_step": 358473, "epoch": 4318} {"train_loss": -25.95216178894043, "global_step": 358474, "epoch": 4318} {"train_loss": -26.078353881835938, "global_step": 358475, "epoch": 4318} {"train_loss": -25.95911579821483, "global_step": 358476, "epoch": 4318, "val_loss": 6605301.5} {"train_loss": -25.24378776550293, "global_step": 358477, "epoch": 4319} {"train_loss": -25.658048629760742, "global_step": 358478, "epoch": 4319} {"train_loss": -26.050161361694336, "global_step": 358479, "epoch": 4319} {"train_loss": -25.66529655456543, "global_step": 358480, "epoch": 4319} {"train_loss": -26.054431915283203, "global_step": 358481, "epoch": 4319} {"train_loss": -25.8857479095459, "global_step": 358482, "epoch": 4319} {"train_loss": -26.045957565307617, "global_step": 358483, "epoch": 4319} {"train_loss": -25.902196884155273, "global_step": 358484, "epoch": 4319} {"train_loss": -26.268014907836914, "global_step": 358485, "epoch": 4319} {"train_loss": -25.789215087890625, "global_step": 358486, "epoch": 4319} {"train_loss": -25.784894943237305, "global_step": 358487, "epoch": 4319} {"train_loss": -25.73429298400879, "global_step": 358488, "epoch": 4319} {"train_loss": -26.11176109313965, "global_step": 358489, "epoch": 4319} {"train_loss": -25.953516006469727, "global_step": 358490, "epoch": 4319} {"train_loss": -25.861303329467773, "global_step": 358491, "epoch": 4319} {"train_loss": -26.439538955688477, "global_step": 358492, "epoch": 4319} {"train_loss": -26.371200561523438, "global_step": 358493, "epoch": 4319} {"train_loss": -25.7041015625, "global_step": 358494, "epoch": 4319} {"train_loss": -26.59375, "global_step": 358495, "epoch": 4319} {"train_loss": -26.388639450073242, "global_step": 358496, "epoch": 4319} {"train_loss": -26.612218856811523, "global_step": 358497, "epoch": 4319} {"train_loss": -26.784765243530273, "global_step": 358498, "epoch": 4319} {"train_loss": -26.34925651550293, "global_step": 358499, "epoch": 4319} {"train_loss": -26.45599365234375, "global_step": 358500, "epoch": 4319} {"train_loss": -26.16163444519043, "global_step": 358501, "epoch": 4319} {"train_loss": -25.94795036315918, "global_step": 358502, "epoch": 4319} {"train_loss": -26.221155166625977, "global_step": 358503, "epoch": 4319} {"train_loss": -26.34096336364746, "global_step": 358504, "epoch": 4319} {"train_loss": -26.649856567382812, "global_step": 358505, "epoch": 4319} {"train_loss": -26.279687881469727, "global_step": 358506, "epoch": 4319} {"train_loss": -26.294912338256836, "global_step": 358507, "epoch": 4319} {"train_loss": -26.158878326416016, "global_step": 358508, "epoch": 4319} {"train_loss": -26.34979820251465, "global_step": 358509, "epoch": 4319} {"train_loss": -26.14959144592285, "global_step": 358510, "epoch": 4319} {"train_loss": -26.437408447265625, "global_step": 358511, "epoch": 4319} {"train_loss": -26.34198570251465, "global_step": 358512, "epoch": 4319} {"train_loss": -26.5060977935791, "global_step": 358513, "epoch": 4319} {"train_loss": -26.413101196289062, "global_step": 358514, "epoch": 4319} {"train_loss": -26.450307846069336, "global_step": 358515, "epoch": 4319} {"train_loss": -26.412506103515625, "global_step": 358516, "epoch": 4319} {"train_loss": -26.36865234375, "global_step": 358517, "epoch": 4319} {"train_loss": -26.459644317626953, "global_step": 358518, "epoch": 4319} {"train_loss": -26.528844833374023, "global_step": 358519, "epoch": 4319} {"train_loss": -26.496902465820312, "global_step": 358520, "epoch": 4319} {"train_loss": -26.184162139892578, "global_step": 358521, "epoch": 4319} {"train_loss": -26.326704025268555, "global_step": 358522, "epoch": 4319} {"train_loss": -26.27119255065918, "global_step": 358523, "epoch": 4319} {"train_loss": -26.296005249023438, "global_step": 358524, "epoch": 4319} {"train_loss": -26.08029556274414, "global_step": 358525, "epoch": 4319} {"train_loss": -26.63007164001465, "global_step": 358526, "epoch": 4319} {"train_loss": -26.683868408203125, "global_step": 358527, "epoch": 4319} {"train_loss": -26.031116485595703, "global_step": 358528, "epoch": 4319} {"train_loss": -26.329578399658203, "global_step": 358529, "epoch": 4319} {"train_loss": -25.63227653503418, "global_step": 358530, "epoch": 4319} {"train_loss": -26.017078399658203, "global_step": 358531, "epoch": 4319} {"train_loss": -25.81744956970215, "global_step": 358532, "epoch": 4319} {"train_loss": -26.04129409790039, "global_step": 358533, "epoch": 4319} {"train_loss": -25.8487606048584, "global_step": 358534, "epoch": 4319} {"train_loss": -26.002729415893555, "global_step": 358535, "epoch": 4319} {"train_loss": -26.46893310546875, "global_step": 358536, "epoch": 4319} {"train_loss": -26.1107120513916, "global_step": 358537, "epoch": 4319} {"train_loss": -26.12677001953125, "global_step": 358538, "epoch": 4319} {"train_loss": -26.296899795532227, "global_step": 358539, "epoch": 4319} {"train_loss": -26.489110946655273, "global_step": 358540, "epoch": 4319} {"train_loss": -25.826557159423828, "global_step": 358541, "epoch": 4319} {"train_loss": -26.4520206451416, "global_step": 358542, "epoch": 4319} {"train_loss": -25.80245018005371, "global_step": 358543, "epoch": 4319} {"train_loss": -26.172595977783203, "global_step": 358544, "epoch": 4319} {"train_loss": -25.9649658203125, "global_step": 358545, "epoch": 4319} {"train_loss": -26.080942153930664, "global_step": 358546, "epoch": 4319} {"train_loss": -25.70320701599121, "global_step": 358547, "epoch": 4319} {"train_loss": -26.151098251342773, "global_step": 358548, "epoch": 4319} {"train_loss": -26.188276290893555, "global_step": 358549, "epoch": 4319} {"train_loss": -25.603717803955078, "global_step": 358550, "epoch": 4319} {"train_loss": -26.563501358032227, "global_step": 358551, "epoch": 4319} {"train_loss": -25.794723510742188, "global_step": 358552, "epoch": 4319} {"train_loss": -25.86895751953125, "global_step": 358553, "epoch": 4319} {"train_loss": -26.029157638549805, "global_step": 358554, "epoch": 4319} {"train_loss": -25.97324562072754, "global_step": 358555, "epoch": 4319} {"train_loss": -26.11911392211914, "global_step": 358556, "epoch": 4319} {"train_loss": -25.68743324279785, "global_step": 358557, "epoch": 4319} {"train_loss": -26.215173721313477, "global_step": 358558, "epoch": 4319} {"train_loss": -26.16179771882942, "global_step": 358559, "epoch": 4319, "val_loss": 6585302.0} {"train_loss": -25.70209312438965, "global_step": 358560, "epoch": 4320} {"train_loss": -25.774765014648438, "global_step": 358561, "epoch": 4320} {"train_loss": -25.08721923828125, "global_step": 358562, "epoch": 4320} {"train_loss": -26.111921310424805, "global_step": 358563, "epoch": 4320} {"train_loss": -25.952228546142578, "global_step": 358564, "epoch": 4320} {"train_loss": -25.772058486938477, "global_step": 358565, "epoch": 4320} {"train_loss": -25.958555221557617, "global_step": 358566, "epoch": 4320} {"train_loss": -25.890933990478516, "global_step": 358567, "epoch": 4320} {"train_loss": -25.627607345581055, "global_step": 358568, "epoch": 4320} {"train_loss": -25.7958984375, "global_step": 358569, "epoch": 4320} {"train_loss": -26.28384780883789, "global_step": 358570, "epoch": 4320} {"train_loss": -25.674686431884766, "global_step": 358571, "epoch": 4320} {"train_loss": -26.310699462890625, "global_step": 358572, "epoch": 4320} {"train_loss": -26.00678825378418, "global_step": 358573, "epoch": 4320} {"train_loss": -26.05983543395996, "global_step": 358574, "epoch": 4320} {"train_loss": -25.93299674987793, "global_step": 358575, "epoch": 4320} {"train_loss": -26.2086181640625, "global_step": 358576, "epoch": 4320} {"train_loss": -26.19587516784668, "global_step": 358577, "epoch": 4320} {"train_loss": -25.827716827392578, "global_step": 358578, "epoch": 4320} {"train_loss": -26.206924438476562, "global_step": 358579, "epoch": 4320} {"train_loss": -26.286151885986328, "global_step": 358580, "epoch": 4320} {"train_loss": -26.338598251342773, "global_step": 358581, "epoch": 4320} {"train_loss": -26.460391998291016, "global_step": 358582, "epoch": 4320} {"train_loss": -26.161468505859375, "global_step": 358583, "epoch": 4320} {"train_loss": -26.08194923400879, "global_step": 358584, "epoch": 4320} {"train_loss": -25.931020736694336, "global_step": 358585, "epoch": 4320} {"train_loss": -26.65435791015625, "global_step": 358586, "epoch": 4320} {"train_loss": -26.1954345703125, "global_step": 358587, "epoch": 4320} {"train_loss": -26.45208168029785, "global_step": 358588, "epoch": 4320} {"train_loss": -26.166339874267578, "global_step": 358589, "epoch": 4320} {"train_loss": -26.537643432617188, "global_step": 358590, "epoch": 4320} {"train_loss": -26.235517501831055, "global_step": 358591, "epoch": 4320} {"train_loss": -26.409143447875977, "global_step": 358592, "epoch": 4320} {"train_loss": -26.42380142211914, "global_step": 358593, "epoch": 4320} {"train_loss": -26.502334594726562, "global_step": 358594, "epoch": 4320} {"train_loss": -26.6500301361084, "global_step": 358595, "epoch": 4320} {"train_loss": -26.37744140625, "global_step": 358596, "epoch": 4320} {"train_loss": -26.105194091796875, "global_step": 358597, "epoch": 4320} {"train_loss": -26.2960205078125, "global_step": 358598, "epoch": 4320} {"train_loss": -26.28957176208496, "global_step": 358599, "epoch": 4320} {"train_loss": -26.334625244140625, "global_step": 358600, "epoch": 4320} {"train_loss": -26.536895751953125, "global_step": 358601, "epoch": 4320} {"train_loss": -26.53301429748535, "global_step": 358602, "epoch": 4320} {"train_loss": -26.320295333862305, "global_step": 358603, "epoch": 4320} {"train_loss": -26.59834861755371, "global_step": 358604, "epoch": 4320} {"train_loss": -26.503036499023438, "global_step": 358605, "epoch": 4320} {"train_loss": -26.03571891784668, "global_step": 358606, "epoch": 4320} {"train_loss": -26.345508575439453, "global_step": 358607, "epoch": 4320} {"train_loss": -26.36750602722168, "global_step": 358608, "epoch": 4320} {"train_loss": -26.255102157592773, "global_step": 358609, "epoch": 4320} {"train_loss": -26.3432674407959, "global_step": 358610, "epoch": 4320} {"train_loss": -26.22669792175293, "global_step": 358611, "epoch": 4320} {"train_loss": -25.977060317993164, "global_step": 358612, "epoch": 4320} {"train_loss": -26.36737060546875, "global_step": 358613, "epoch": 4320} {"train_loss": -26.318313598632812, "global_step": 358614, "epoch": 4320} {"train_loss": -25.991485595703125, "global_step": 358615, "epoch": 4320} {"train_loss": -26.627912521362305, "global_step": 358616, "epoch": 4320} {"train_loss": -26.0615291595459, "global_step": 358617, "epoch": 4320} {"train_loss": -26.137741088867188, "global_step": 358618, "epoch": 4320} {"train_loss": -26.196935653686523, "global_step": 358619, "epoch": 4320} {"train_loss": -25.89251136779785, "global_step": 358620, "epoch": 4320} {"train_loss": -26.390607833862305, "global_step": 358621, "epoch": 4320} {"train_loss": -26.416828155517578, "global_step": 358622, "epoch": 4320} {"train_loss": -26.288251876831055, "global_step": 358623, "epoch": 4320} {"train_loss": -26.204883575439453, "global_step": 358624, "epoch": 4320} {"train_loss": -26.174091339111328, "global_step": 358625, "epoch": 4320} {"train_loss": -26.117101669311523, "global_step": 358626, "epoch": 4320} {"train_loss": -25.928564071655273, "global_step": 358627, "epoch": 4320} {"train_loss": -26.053430557250977, "global_step": 358628, "epoch": 4320} {"train_loss": -26.061309814453125, "global_step": 358629, "epoch": 4320} {"train_loss": -26.3920841217041, "global_step": 358630, "epoch": 4320} {"train_loss": -26.039037704467773, "global_step": 358631, "epoch": 4320} {"train_loss": -25.856618881225586, "global_step": 358632, "epoch": 4320} {"train_loss": -26.189483642578125, "global_step": 358633, "epoch": 4320} {"train_loss": -26.095285415649414, "global_step": 358634, "epoch": 4320} {"train_loss": -26.533735275268555, "global_step": 358635, "epoch": 4320} {"train_loss": -26.099164962768555, "global_step": 358636, "epoch": 4320} {"train_loss": -25.833221435546875, "global_step": 358637, "epoch": 4320} {"train_loss": -26.332677841186523, "global_step": 358638, "epoch": 4320} {"train_loss": -26.143310546875, "global_step": 358639, "epoch": 4320} {"train_loss": -25.989288330078125, "global_step": 358640, "epoch": 4320} {"train_loss": -25.8676700592041, "global_step": 358641, "epoch": 4320} {"train_loss": -26.166593275874494, "global_step": 358642, "epoch": 4320, "val_loss": 6518401.0} {"train_loss": -24.99951934814453, "global_step": 358643, "epoch": 4321} {"train_loss": -25.049497604370117, "global_step": 358644, "epoch": 4321} {"train_loss": -25.455902099609375, "global_step": 358645, "epoch": 4321} {"train_loss": -24.84688377380371, "global_step": 358646, "epoch": 4321} {"train_loss": -25.24567413330078, "global_step": 358647, "epoch": 4321} {"train_loss": -25.104360580444336, "global_step": 358648, "epoch": 4321} {"train_loss": -25.138341903686523, "global_step": 358649, "epoch": 4321} {"train_loss": -25.695297241210938, "global_step": 358650, "epoch": 4321} {"train_loss": -25.205657958984375, "global_step": 358651, "epoch": 4321} {"train_loss": -25.21908950805664, "global_step": 358652, "epoch": 4321} {"train_loss": -25.744083404541016, "global_step": 358653, "epoch": 4321} {"train_loss": -25.654682159423828, "global_step": 358654, "epoch": 4321} {"train_loss": -25.96112060546875, "global_step": 358655, "epoch": 4321} {"train_loss": -25.50114631652832, "global_step": 358656, "epoch": 4321} {"train_loss": -25.50339698791504, "global_step": 358657, "epoch": 4321} {"train_loss": -25.71925926208496, "global_step": 358658, "epoch": 4321} {"train_loss": -25.467010498046875, "global_step": 358659, "epoch": 4321} {"train_loss": -25.752038955688477, "global_step": 358660, "epoch": 4321} {"train_loss": -25.993152618408203, "global_step": 358661, "epoch": 4321} {"train_loss": -26.02044105529785, "global_step": 358662, "epoch": 4321} {"train_loss": -26.00054359436035, "global_step": 358663, "epoch": 4321} {"train_loss": -25.87371826171875, "global_step": 358664, "epoch": 4321} {"train_loss": -26.20176124572754, "global_step": 358665, "epoch": 4321} {"train_loss": -25.60520362854004, "global_step": 358666, "epoch": 4321} {"train_loss": -26.125457763671875, "global_step": 358667, "epoch": 4321} {"train_loss": -26.150583267211914, "global_step": 358668, "epoch": 4321} {"train_loss": -25.805469512939453, "global_step": 358669, "epoch": 4321} {"train_loss": -25.8642520904541, "global_step": 358670, "epoch": 4321} {"train_loss": -26.09878921508789, "global_step": 358671, "epoch": 4321} {"train_loss": -26.122455596923828, "global_step": 358672, "epoch": 4321} {"train_loss": -26.382841110229492, "global_step": 358673, "epoch": 4321} {"train_loss": -26.38099479675293, "global_step": 358674, "epoch": 4321} {"train_loss": -25.8236141204834, "global_step": 358675, "epoch": 4321} {"train_loss": -25.841917037963867, "global_step": 358676, "epoch": 4321} {"train_loss": -25.862213134765625, "global_step": 358677, "epoch": 4321} {"train_loss": -25.926549911499023, "global_step": 358678, "epoch": 4321} {"train_loss": -25.66668128967285, "global_step": 358679, "epoch": 4321} {"train_loss": -25.75189208984375, "global_step": 358680, "epoch": 4321} {"train_loss": -26.062183380126953, "global_step": 358681, "epoch": 4321} {"train_loss": -26.217945098876953, "global_step": 358682, "epoch": 4321} {"train_loss": -26.23828125, "global_step": 358683, "epoch": 4321} {"train_loss": -26.24016761779785, "global_step": 358684, "epoch": 4321} {"train_loss": -26.097036361694336, "global_step": 358685, "epoch": 4321} {"train_loss": -26.60161781311035, "global_step": 358686, "epoch": 4321} {"train_loss": -26.751184463500977, "global_step": 358687, "epoch": 4321} {"train_loss": -26.15485191345215, "global_step": 358688, "epoch": 4321} {"train_loss": -26.505054473876953, "global_step": 358689, "epoch": 4321} {"train_loss": -26.36783218383789, "global_step": 358690, "epoch": 4321} {"train_loss": -26.42083168029785, "global_step": 358691, "epoch": 4321} {"train_loss": -26.0943603515625, "global_step": 358692, "epoch": 4321} {"train_loss": -26.105670928955078, "global_step": 358693, "epoch": 4321} {"train_loss": -26.649280548095703, "global_step": 358694, "epoch": 4321} {"train_loss": -26.785085678100586, "global_step": 358695, "epoch": 4321} {"train_loss": -26.231597900390625, "global_step": 358696, "epoch": 4321} {"train_loss": -26.10516357421875, "global_step": 358697, "epoch": 4321} {"train_loss": -26.17548179626465, "global_step": 358698, "epoch": 4321} {"train_loss": -26.799945831298828, "global_step": 358699, "epoch": 4321} {"train_loss": -25.86097526550293, "global_step": 358700, "epoch": 4321} {"train_loss": -26.313217163085938, "global_step": 358701, "epoch": 4321} {"train_loss": -26.096445083618164, "global_step": 358702, "epoch": 4321} {"train_loss": -26.294702529907227, "global_step": 358703, "epoch": 4321} {"train_loss": -26.29888343811035, "global_step": 358704, "epoch": 4321} {"train_loss": -26.471776962280273, "global_step": 358705, "epoch": 4321} {"train_loss": -25.955825805664062, "global_step": 358706, "epoch": 4321} {"train_loss": -26.24030113220215, "global_step": 358707, "epoch": 4321} {"train_loss": -26.158660888671875, "global_step": 358708, "epoch": 4321} {"train_loss": -26.41815185546875, "global_step": 358709, "epoch": 4321} {"train_loss": -26.374164581298828, "global_step": 358710, "epoch": 4321} {"train_loss": -26.516677856445312, "global_step": 358711, "epoch": 4321} {"train_loss": -26.034711837768555, "global_step": 358712, "epoch": 4321} {"train_loss": -26.557754516601562, "global_step": 358713, "epoch": 4321} {"train_loss": -26.369138717651367, "global_step": 358714, "epoch": 4321} {"train_loss": -26.484399795532227, "global_step": 358715, "epoch": 4321} {"train_loss": -26.7033748626709, "global_step": 358716, "epoch": 4321} {"train_loss": -26.440759658813477, "global_step": 358717, "epoch": 4321} {"train_loss": -26.483551025390625, "global_step": 358718, "epoch": 4321} {"train_loss": -26.331445693969727, "global_step": 358719, "epoch": 4321} {"train_loss": -26.30850601196289, "global_step": 358720, "epoch": 4321} {"train_loss": -26.75140953063965, "global_step": 358721, "epoch": 4321} {"train_loss": -26.33447265625, "global_step": 358722, "epoch": 4321} {"train_loss": -26.2999324798584, "global_step": 358723, "epoch": 4321} {"train_loss": -26.18865394592285, "global_step": 358724, "epoch": 4321} {"train_loss": -26.044740676879883, "global_step": 358725, "epoch": 4321, "val_loss": 6663860.5} {"train_loss": -24.827131271362305, "global_step": 358726, "epoch": 4322} {"train_loss": -25.2451229095459, "global_step": 358727, "epoch": 4322} {"train_loss": -25.04067611694336, "global_step": 358728, "epoch": 4322} {"train_loss": -25.364850997924805, "global_step": 358729, "epoch": 4322} {"train_loss": -25.69374656677246, "global_step": 358730, "epoch": 4322} {"train_loss": -25.31304931640625, "global_step": 358731, "epoch": 4322} {"train_loss": -25.074209213256836, "global_step": 358732, "epoch": 4322} {"train_loss": -25.7045841217041, "global_step": 358733, "epoch": 4322} {"train_loss": -25.41414451599121, "global_step": 358734, "epoch": 4322} {"train_loss": -25.34035301208496, "global_step": 358735, "epoch": 4322} {"train_loss": -25.560100555419922, "global_step": 358736, "epoch": 4322} {"train_loss": -25.570890426635742, "global_step": 358737, "epoch": 4322} {"train_loss": -25.770095825195312, "global_step": 358738, "epoch": 4322} {"train_loss": -25.716873168945312, "global_step": 358739, "epoch": 4322} {"train_loss": -25.876447677612305, "global_step": 358740, "epoch": 4322} {"train_loss": -25.953046798706055, "global_step": 358741, "epoch": 4322} {"train_loss": -25.763402938842773, "global_step": 358742, "epoch": 4322} {"train_loss": -25.839553833007812, "global_step": 358743, "epoch": 4322} {"train_loss": -25.63641929626465, "global_step": 358744, "epoch": 4322} {"train_loss": -25.832380294799805, "global_step": 358745, "epoch": 4322} {"train_loss": -26.0035400390625, "global_step": 358746, "epoch": 4322} {"train_loss": -26.010801315307617, "global_step": 358747, "epoch": 4322} {"train_loss": -26.256391525268555, "global_step": 358748, "epoch": 4322} {"train_loss": -25.91845703125, "global_step": 358749, "epoch": 4322} {"train_loss": -26.064924240112305, "global_step": 358750, "epoch": 4322} {"train_loss": -25.97600746154785, "global_step": 358751, "epoch": 4322} {"train_loss": -25.947528839111328, "global_step": 358752, "epoch": 4322} {"train_loss": -26.33514404296875, "global_step": 358753, "epoch": 4322} {"train_loss": -26.066137313842773, "global_step": 358754, "epoch": 4322} {"train_loss": -26.192487716674805, "global_step": 358755, "epoch": 4322} {"train_loss": -26.20947265625, "global_step": 358756, "epoch": 4322} {"train_loss": -26.114736557006836, "global_step": 358757, "epoch": 4322} {"train_loss": -26.054519653320312, "global_step": 358758, "epoch": 4322} {"train_loss": -25.956064224243164, "global_step": 358759, "epoch": 4322} {"train_loss": -26.2110538482666, "global_step": 358760, "epoch": 4322} {"train_loss": -26.554401397705078, "global_step": 358761, "epoch": 4322} {"train_loss": -26.178369522094727, "global_step": 358762, "epoch": 4322} {"train_loss": -26.42084312438965, "global_step": 358763, "epoch": 4322} {"train_loss": -25.855487823486328, "global_step": 358764, "epoch": 4322} {"train_loss": -26.277069091796875, "global_step": 358765, "epoch": 4322} {"train_loss": -26.22076988220215, "global_step": 358766, "epoch": 4322} {"train_loss": -26.38449478149414, "global_step": 358767, "epoch": 4322} {"train_loss": -25.839374542236328, "global_step": 358768, "epoch": 4322} {"train_loss": -26.09930419921875, "global_step": 358769, "epoch": 4322} {"train_loss": -26.33962059020996, "global_step": 358770, "epoch": 4322} {"train_loss": -26.240997314453125, "global_step": 358771, "epoch": 4322} {"train_loss": -26.150060653686523, "global_step": 358772, "epoch": 4322} {"train_loss": -26.36427116394043, "global_step": 358773, "epoch": 4322} {"train_loss": -25.89982032775879, "global_step": 358774, "epoch": 4322} {"train_loss": -26.465091705322266, "global_step": 358775, "epoch": 4322} {"train_loss": -26.621658325195312, "global_step": 358776, "epoch": 4322} {"train_loss": -26.70703125, "global_step": 358777, "epoch": 4322} {"train_loss": -26.556543350219727, "global_step": 358778, "epoch": 4322} {"train_loss": -26.2270565032959, "global_step": 358779, "epoch": 4322} {"train_loss": -26.236515045166016, "global_step": 358780, "epoch": 4322} {"train_loss": -26.286468505859375, "global_step": 358781, "epoch": 4322} {"train_loss": -26.440481185913086, "global_step": 358782, "epoch": 4322} {"train_loss": -26.325775146484375, "global_step": 358783, "epoch": 4322} {"train_loss": -26.532779693603516, "global_step": 358784, "epoch": 4322} {"train_loss": -26.167875289916992, "global_step": 358785, "epoch": 4322} {"train_loss": -26.451675415039062, "global_step": 358786, "epoch": 4322} {"train_loss": -26.895389556884766, "global_step": 358787, "epoch": 4322} {"train_loss": -26.238000869750977, "global_step": 358788, "epoch": 4322} {"train_loss": -26.09596824645996, "global_step": 358789, "epoch": 4322} {"train_loss": -26.28230094909668, "global_step": 358790, "epoch": 4322} {"train_loss": -26.490814208984375, "global_step": 358791, "epoch": 4322} {"train_loss": -26.169584274291992, "global_step": 358792, "epoch": 4322} {"train_loss": -26.096853256225586, "global_step": 358793, "epoch": 4322} {"train_loss": -26.316558837890625, "global_step": 358794, "epoch": 4322} {"train_loss": -26.430450439453125, "global_step": 358795, "epoch": 4322} {"train_loss": -26.629873275756836, "global_step": 358796, "epoch": 4322} {"train_loss": -26.14713478088379, "global_step": 358797, "epoch": 4322} {"train_loss": -26.37135887145996, "global_step": 358798, "epoch": 4322} {"train_loss": -26.36181640625, "global_step": 358799, "epoch": 4322} {"train_loss": -26.041656494140625, "global_step": 358800, "epoch": 4322} {"train_loss": -26.33437156677246, "global_step": 358801, "epoch": 4322} {"train_loss": -26.193552017211914, "global_step": 358802, "epoch": 4322} {"train_loss": -26.61456871032715, "global_step": 358803, "epoch": 4322} {"train_loss": -26.323896408081055, "global_step": 358804, "epoch": 4322} {"train_loss": -26.145593643188477, "global_step": 358805, "epoch": 4322} {"train_loss": -26.34698486328125, "global_step": 358806, "epoch": 4322} {"train_loss": -26.340055465698242, "global_step": 358807, "epoch": 4322} {"train_loss": -26.098770509283227, "global_step": 358808, "epoch": 4322, "val_loss": 6516092.0} {"train_loss": -25.72257423400879, "global_step": 358809, "epoch": 4323} {"train_loss": -25.30643081665039, "global_step": 358810, "epoch": 4323} {"train_loss": -26.215635299682617, "global_step": 358811, "epoch": 4323} {"train_loss": -25.513090133666992, "global_step": 358812, "epoch": 4323} {"train_loss": -25.723560333251953, "global_step": 358813, "epoch": 4323} {"train_loss": -25.92927360534668, "global_step": 358814, "epoch": 4323} {"train_loss": -25.656784057617188, "global_step": 358815, "epoch": 4323} {"train_loss": -25.726179122924805, "global_step": 358816, "epoch": 4323} {"train_loss": -25.75929069519043, "global_step": 358817, "epoch": 4323} {"train_loss": -25.73651695251465, "global_step": 358818, "epoch": 4323} {"train_loss": -26.068023681640625, "global_step": 358819, "epoch": 4323} {"train_loss": -25.973440170288086, "global_step": 358820, "epoch": 4323} {"train_loss": -26.30950927734375, "global_step": 358821, "epoch": 4323} {"train_loss": -25.96817970275879, "global_step": 358822, "epoch": 4323} {"train_loss": -25.77634620666504, "global_step": 358823, "epoch": 4323} {"train_loss": -25.949981689453125, "global_step": 358824, "epoch": 4323} {"train_loss": -25.85015869140625, "global_step": 358825, "epoch": 4323} {"train_loss": -26.315885543823242, "global_step": 358826, "epoch": 4323} {"train_loss": -25.89876365661621, "global_step": 358827, "epoch": 4323} {"train_loss": -25.8751220703125, "global_step": 358828, "epoch": 4323} {"train_loss": -26.277185440063477, "global_step": 358829, "epoch": 4323} {"train_loss": -25.994491577148438, "global_step": 358830, "epoch": 4323} {"train_loss": -25.962656021118164, "global_step": 358831, "epoch": 4323} {"train_loss": -25.93476676940918, "global_step": 358832, "epoch": 4323} {"train_loss": -26.36781120300293, "global_step": 358833, "epoch": 4323} {"train_loss": -26.192663192749023, "global_step": 358834, "epoch": 4323} {"train_loss": -26.562124252319336, "global_step": 358835, "epoch": 4323} {"train_loss": -26.230331420898438, "global_step": 358836, "epoch": 4323} {"train_loss": -26.0233154296875, "global_step": 358837, "epoch": 4323} {"train_loss": -26.2735652923584, "global_step": 358838, "epoch": 4323} {"train_loss": -26.069448471069336, "global_step": 358839, "epoch": 4323} {"train_loss": -26.37653160095215, "global_step": 358840, "epoch": 4323} {"train_loss": -26.226232528686523, "global_step": 358841, "epoch": 4323} {"train_loss": -26.082904815673828, "global_step": 358842, "epoch": 4323} {"train_loss": -26.244787216186523, "global_step": 358843, "epoch": 4323} {"train_loss": -26.25225830078125, "global_step": 358844, "epoch": 4323} {"train_loss": -26.10233497619629, "global_step": 358845, "epoch": 4323} {"train_loss": -26.444171905517578, "global_step": 358846, "epoch": 4323} {"train_loss": -26.176944732666016, "global_step": 358847, "epoch": 4323} {"train_loss": -26.14911460876465, "global_step": 358848, "epoch": 4323} {"train_loss": -25.968372344970703, "global_step": 358849, "epoch": 4323} {"train_loss": -26.621841430664062, "global_step": 358850, "epoch": 4323} {"train_loss": -26.4951229095459, "global_step": 358851, "epoch": 4323} {"train_loss": -26.700733184814453, "global_step": 358852, "epoch": 4323} {"train_loss": -25.883380889892578, "global_step": 358853, "epoch": 4323} {"train_loss": -26.28666114807129, "global_step": 358854, "epoch": 4323} {"train_loss": -26.42962074279785, "global_step": 358855, "epoch": 4323} {"train_loss": -26.59330177307129, "global_step": 358856, "epoch": 4323} {"train_loss": -25.953964233398438, "global_step": 358857, "epoch": 4323} {"train_loss": -25.6850643157959, "global_step": 358858, "epoch": 4323} {"train_loss": -26.33343505859375, "global_step": 358859, "epoch": 4323} {"train_loss": -26.385583877563477, "global_step": 358860, "epoch": 4323} {"train_loss": -26.590307235717773, "global_step": 358861, "epoch": 4323} {"train_loss": -26.05511474609375, "global_step": 358862, "epoch": 4323} {"train_loss": -26.1862850189209, "global_step": 358863, "epoch": 4323} {"train_loss": -26.083927154541016, "global_step": 358864, "epoch": 4323} {"train_loss": -25.882246017456055, "global_step": 358865, "epoch": 4323} {"train_loss": -26.619434356689453, "global_step": 358866, "epoch": 4323} {"train_loss": -26.515623092651367, "global_step": 358867, "epoch": 4323} {"train_loss": -26.30487060546875, "global_step": 358868, "epoch": 4323} {"train_loss": -26.368528366088867, "global_step": 358869, "epoch": 4323} {"train_loss": -26.242712020874023, "global_step": 358870, "epoch": 4323} {"train_loss": -26.554880142211914, "global_step": 358871, "epoch": 4323} {"train_loss": -26.213775634765625, "global_step": 358872, "epoch": 4323} {"train_loss": -26.329938888549805, "global_step": 358873, "epoch": 4323} {"train_loss": -25.718647003173828, "global_step": 358874, "epoch": 4323} {"train_loss": -26.07867431640625, "global_step": 358875, "epoch": 4323} {"train_loss": -26.337127685546875, "global_step": 358876, "epoch": 4323} {"train_loss": -26.012786865234375, "global_step": 358877, "epoch": 4323} {"train_loss": -26.41965103149414, "global_step": 358878, "epoch": 4323} {"train_loss": -26.104711532592773, "global_step": 358879, "epoch": 4323} {"train_loss": -26.5498046875, "global_step": 358880, "epoch": 4323} {"train_loss": -25.92469596862793, "global_step": 358881, "epoch": 4323} {"train_loss": -26.394916534423828, "global_step": 358882, "epoch": 4323} {"train_loss": -26.489501953125, "global_step": 358883, "epoch": 4323} {"train_loss": -26.21343421936035, "global_step": 358884, "epoch": 4323} {"train_loss": -26.344623565673828, "global_step": 358885, "epoch": 4323} {"train_loss": -26.10566520690918, "global_step": 358886, "epoch": 4323} {"train_loss": -26.081134796142578, "global_step": 358887, "epoch": 4323} {"train_loss": -25.559640884399414, "global_step": 358888, "epoch": 4323} {"train_loss": -24.912084579467773, "global_step": 358889, "epoch": 4323} {"train_loss": -25.225788116455078, "global_step": 358890, "epoch": 4323} {"train_loss": -26.107358587793556, "global_step": 358891, "epoch": 4323, "val_loss": 6618130.0} {"train_loss": -24.871639251708984, "global_step": 358892, "epoch": 4324} {"train_loss": -25.71961784362793, "global_step": 358893, "epoch": 4324} {"train_loss": -24.86081314086914, "global_step": 358894, "epoch": 4324} {"train_loss": -25.356441497802734, "global_step": 358895, "epoch": 4324} {"train_loss": -25.271085739135742, "global_step": 358896, "epoch": 4324} {"train_loss": -25.6817569732666, "global_step": 358897, "epoch": 4324} {"train_loss": -25.312650680541992, "global_step": 358898, "epoch": 4324} {"train_loss": -25.175077438354492, "global_step": 358899, "epoch": 4324} {"train_loss": -25.376008987426758, "global_step": 358900, "epoch": 4324} {"train_loss": -25.196918487548828, "global_step": 358901, "epoch": 4324} {"train_loss": -25.666284561157227, "global_step": 358902, "epoch": 4324} {"train_loss": -25.245025634765625, "global_step": 358903, "epoch": 4324} {"train_loss": -25.385704040527344, "global_step": 358904, "epoch": 4324} {"train_loss": -25.479839324951172, "global_step": 358905, "epoch": 4324} {"train_loss": -25.860824584960938, "global_step": 358906, "epoch": 4324} {"train_loss": -25.812116622924805, "global_step": 358907, "epoch": 4324} {"train_loss": -25.84418296813965, "global_step": 358908, "epoch": 4324} {"train_loss": -25.73602294921875, "global_step": 358909, "epoch": 4324} {"train_loss": -26.002639770507812, "global_step": 358910, "epoch": 4324} {"train_loss": -25.465124130249023, "global_step": 358911, "epoch": 4324} {"train_loss": -25.846389770507812, "global_step": 358912, "epoch": 4324} {"train_loss": -25.591527938842773, "global_step": 358913, "epoch": 4324} {"train_loss": -25.849781036376953, "global_step": 358914, "epoch": 4324} {"train_loss": -25.89226722717285, "global_step": 358915, "epoch": 4324} {"train_loss": -26.09535026550293, "global_step": 358916, "epoch": 4324} {"train_loss": -26.080066680908203, "global_step": 358917, "epoch": 4324} {"train_loss": -26.109033584594727, "global_step": 358918, "epoch": 4324} {"train_loss": -25.923736572265625, "global_step": 358919, "epoch": 4324} {"train_loss": -26.173526763916016, "global_step": 358920, "epoch": 4324} {"train_loss": -26.046955108642578, "global_step": 358921, "epoch": 4324} {"train_loss": -25.79608154296875, "global_step": 358922, "epoch": 4324} {"train_loss": -26.128955841064453, "global_step": 358923, "epoch": 4324} {"train_loss": -26.432418823242188, "global_step": 358924, "epoch": 4324} {"train_loss": -26.110809326171875, "global_step": 358925, "epoch": 4324} {"train_loss": -26.03946876525879, "global_step": 358926, "epoch": 4324} {"train_loss": -26.014883041381836, "global_step": 358927, "epoch": 4324} {"train_loss": -26.407363891601562, "global_step": 358928, "epoch": 4324} {"train_loss": -26.369421005249023, "global_step": 358929, "epoch": 4324} {"train_loss": -26.09946632385254, "global_step": 358930, "epoch": 4324} {"train_loss": -26.181257247924805, "global_step": 358931, "epoch": 4324} {"train_loss": -26.368183135986328, "global_step": 358932, "epoch": 4324} {"train_loss": -26.367116928100586, "global_step": 358933, "epoch": 4324} {"train_loss": -26.51771354675293, "global_step": 358934, "epoch": 4324} {"train_loss": -26.6574649810791, "global_step": 358935, "epoch": 4324} {"train_loss": -26.26091957092285, "global_step": 358936, "epoch": 4324} {"train_loss": -26.378894805908203, "global_step": 358937, "epoch": 4324} {"train_loss": -26.305744171142578, "global_step": 358938, "epoch": 4324} {"train_loss": -26.6414852142334, "global_step": 358939, "epoch": 4324} {"train_loss": -26.550159454345703, "global_step": 358940, "epoch": 4324} {"train_loss": -26.448822021484375, "global_step": 358941, "epoch": 4324} {"train_loss": -26.30255126953125, "global_step": 358942, "epoch": 4324} {"train_loss": -25.834308624267578, "global_step": 358943, "epoch": 4324} {"train_loss": -25.7752742767334, "global_step": 358944, "epoch": 4324} {"train_loss": -25.592283248901367, "global_step": 358945, "epoch": 4324} {"train_loss": -25.86685562133789, "global_step": 358946, "epoch": 4324} {"train_loss": -26.300134658813477, "global_step": 358947, "epoch": 4324} {"train_loss": -25.955352783203125, "global_step": 358948, "epoch": 4324} {"train_loss": -26.532825469970703, "global_step": 358949, "epoch": 4324} {"train_loss": -26.139636993408203, "global_step": 358950, "epoch": 4324} {"train_loss": -26.380481719970703, "global_step": 358951, "epoch": 4324} {"train_loss": -26.24546241760254, "global_step": 358952, "epoch": 4324} {"train_loss": -26.306884765625, "global_step": 358953, "epoch": 4324} {"train_loss": -26.371417999267578, "global_step": 358954, "epoch": 4324} {"train_loss": -26.185632705688477, "global_step": 358955, "epoch": 4324} {"train_loss": -26.41327476501465, "global_step": 358956, "epoch": 4324} {"train_loss": -26.2662353515625, "global_step": 358957, "epoch": 4324} {"train_loss": -26.33176040649414, "global_step": 358958, "epoch": 4324} {"train_loss": -26.150999069213867, "global_step": 358959, "epoch": 4324} {"train_loss": -26.291461944580078, "global_step": 358960, "epoch": 4324} {"train_loss": -26.305753707885742, "global_step": 358961, "epoch": 4324} {"train_loss": -26.228302001953125, "global_step": 358962, "epoch": 4324} {"train_loss": -26.371353149414062, "global_step": 358963, "epoch": 4324} {"train_loss": -26.397531509399414, "global_step": 358964, "epoch": 4324} {"train_loss": -26.264856338500977, "global_step": 358965, "epoch": 4324} {"train_loss": -26.487762451171875, "global_step": 358966, "epoch": 4324} {"train_loss": -26.055200576782227, "global_step": 358967, "epoch": 4324} {"train_loss": -26.310998916625977, "global_step": 358968, "epoch": 4324} {"train_loss": -26.275781631469727, "global_step": 358969, "epoch": 4324} {"train_loss": -26.439239501953125, "global_step": 358970, "epoch": 4324} {"train_loss": -26.316421508789062, "global_step": 358971, "epoch": 4324} {"train_loss": -26.272241592407227, "global_step": 358972, "epoch": 4324} {"train_loss": -26.024967193603516, "global_step": 358973, "epoch": 4324} {"train_loss": -26.02532173064818, "global_step": 358974, "epoch": 4324, "val_loss": 6499850.0} {"train_loss": -26.080310821533203, "global_step": 358975, "epoch": 4325} {"train_loss": -26.217687606811523, "global_step": 358976, "epoch": 4325} {"train_loss": -26.35426139831543, "global_step": 358977, "epoch": 4325} {"train_loss": -26.55535316467285, "global_step": 358978, "epoch": 4325} {"train_loss": -26.209396362304688, "global_step": 358979, "epoch": 4325} {"train_loss": -26.08112144470215, "global_step": 358980, "epoch": 4325} {"train_loss": -25.867136001586914, "global_step": 358981, "epoch": 4325} {"train_loss": -26.516021728515625, "global_step": 358982, "epoch": 4325} {"train_loss": -26.279983520507812, "global_step": 358983, "epoch": 4325} {"train_loss": -26.122739791870117, "global_step": 358984, "epoch": 4325} {"train_loss": -26.539447784423828, "global_step": 358985, "epoch": 4325} {"train_loss": -26.750598907470703, "global_step": 358986, "epoch": 4325} {"train_loss": -26.242197036743164, "global_step": 358987, "epoch": 4325} {"train_loss": -26.5372371673584, "global_step": 358988, "epoch": 4325} {"train_loss": -26.200794219970703, "global_step": 358989, "epoch": 4325} {"train_loss": -26.486677169799805, "global_step": 358990, "epoch": 4325} {"train_loss": -26.374292373657227, "global_step": 358991, "epoch": 4325} {"train_loss": -26.274566650390625, "global_step": 358992, "epoch": 4325} {"train_loss": -26.325162887573242, "global_step": 358993, "epoch": 4325} {"train_loss": -26.14740562438965, "global_step": 358994, "epoch": 4325} {"train_loss": -26.275487899780273, "global_step": 358995, "epoch": 4325} {"train_loss": -26.51192283630371, "global_step": 358996, "epoch": 4325} {"train_loss": -26.58941650390625, "global_step": 358997, "epoch": 4325} {"train_loss": -26.2199764251709, "global_step": 358998, "epoch": 4325} {"train_loss": -26.852252960205078, "global_step": 358999, "epoch": 4325} {"train_loss": -26.191076278686523, "global_step": 359000, "epoch": 4325} {"train_loss": -26.016300201416016, "global_step": 359001, "epoch": 4325} {"train_loss": -26.012800216674805, "global_step": 359002, "epoch": 4325} {"train_loss": -26.13852310180664, "global_step": 359003, "epoch": 4325} {"train_loss": -26.38581657409668, "global_step": 359004, "epoch": 4325} {"train_loss": -26.177780151367188, "global_step": 359005, "epoch": 4325} {"train_loss": -26.374311447143555, "global_step": 359006, "epoch": 4325} {"train_loss": -26.42044448852539, "global_step": 359007, "epoch": 4325} {"train_loss": -26.301916122436523, "global_step": 359008, "epoch": 4325} {"train_loss": -26.188547134399414, "global_step": 359009, "epoch": 4325} {"train_loss": -26.706647872924805, "global_step": 359010, "epoch": 4325} {"train_loss": -26.408178329467773, "global_step": 359011, "epoch": 4325} {"train_loss": -26.627960205078125, "global_step": 359012, "epoch": 4325} {"train_loss": -26.299604415893555, "global_step": 359013, "epoch": 4325} {"train_loss": -26.37696647644043, "global_step": 359014, "epoch": 4325} {"train_loss": -26.50311279296875, "global_step": 359015, "epoch": 4325} {"train_loss": -26.57025146484375, "global_step": 359016, "epoch": 4325} {"train_loss": -26.77752685546875, "global_step": 359017, "epoch": 4325} {"train_loss": -26.443359375, "global_step": 359018, "epoch": 4325} {"train_loss": -26.3367977142334, "global_step": 359019, "epoch": 4325} {"train_loss": -26.181095123291016, "global_step": 359020, "epoch": 4325} {"train_loss": -26.2808895111084, "global_step": 359021, "epoch": 4325} {"train_loss": -26.297895431518555, "global_step": 359022, "epoch": 4325} {"train_loss": -26.312753677368164, "global_step": 359023, "epoch": 4325} {"train_loss": -26.491479873657227, "global_step": 359024, "epoch": 4325} {"train_loss": -26.0889835357666, "global_step": 359025, "epoch": 4325} {"train_loss": -26.34332275390625, "global_step": 359026, "epoch": 4325} {"train_loss": -26.137250900268555, "global_step": 359027, "epoch": 4325} {"train_loss": -26.34455680847168, "global_step": 359028, "epoch": 4325} {"train_loss": -26.34052848815918, "global_step": 359029, "epoch": 4325} {"train_loss": -26.34148597717285, "global_step": 359030, "epoch": 4325} {"train_loss": -26.632715225219727, "global_step": 359031, "epoch": 4325} {"train_loss": -26.13591957092285, "global_step": 359032, "epoch": 4325} {"train_loss": -26.3371524810791, "global_step": 359033, "epoch": 4325} {"train_loss": -26.290822982788086, "global_step": 359034, "epoch": 4325} {"train_loss": -26.06806755065918, "global_step": 359035, "epoch": 4325} {"train_loss": -26.095136642456055, "global_step": 359036, "epoch": 4325} {"train_loss": -26.1383113861084, "global_step": 359037, "epoch": 4325} {"train_loss": -26.5958251953125, "global_step": 359038, "epoch": 4325} {"train_loss": -26.41469383239746, "global_step": 359039, "epoch": 4325} {"train_loss": -26.119787216186523, "global_step": 359040, "epoch": 4325} {"train_loss": -25.978656768798828, "global_step": 359041, "epoch": 4325} {"train_loss": -26.300018310546875, "global_step": 359042, "epoch": 4325} {"train_loss": -26.330032348632812, "global_step": 359043, "epoch": 4325} {"train_loss": -26.256790161132812, "global_step": 359044, "epoch": 4325} {"train_loss": -26.409381866455078, "global_step": 359045, "epoch": 4325} {"train_loss": -26.13877296447754, "global_step": 359046, "epoch": 4325} {"train_loss": -26.224576950073242, "global_step": 359047, "epoch": 4325} {"train_loss": -26.243732452392578, "global_step": 359048, "epoch": 4325} {"train_loss": -26.409317016601562, "global_step": 359049, "epoch": 4325} {"train_loss": -26.29145622253418, "global_step": 359050, "epoch": 4325} {"train_loss": -26.3046875, "global_step": 359051, "epoch": 4325} {"train_loss": -26.313024520874023, "global_step": 359052, "epoch": 4325} {"train_loss": -26.387771606445312, "global_step": 359053, "epoch": 4325} {"train_loss": -26.191593170166016, "global_step": 359054, "epoch": 4325} {"train_loss": -26.22028160095215, "global_step": 359055, "epoch": 4325} {"train_loss": -26.346908569335938, "global_step": 359056, "epoch": 4325} {"train_loss": -26.32938249427152, "global_step": 359057, "epoch": 4325, "val_loss": 6598158.5} {"train_loss": -25.98699378967285, "global_step": 359058, "epoch": 4326} {"train_loss": -25.883941650390625, "global_step": 359059, "epoch": 4326} {"train_loss": -25.592517852783203, "global_step": 359060, "epoch": 4326} {"train_loss": -25.51450538635254, "global_step": 359061, "epoch": 4326} {"train_loss": -25.282678604125977, "global_step": 359062, "epoch": 4326} {"train_loss": -25.947980880737305, "global_step": 359063, "epoch": 4326} {"train_loss": -25.702985763549805, "global_step": 359064, "epoch": 4326} {"train_loss": -25.035602569580078, "global_step": 359065, "epoch": 4326} {"train_loss": -25.415027618408203, "global_step": 359066, "epoch": 4326} {"train_loss": -25.76214027404785, "global_step": 359067, "epoch": 4326} {"train_loss": -25.560720443725586, "global_step": 359068, "epoch": 4326} {"train_loss": -25.599945068359375, "global_step": 359069, "epoch": 4326} {"train_loss": -25.50973892211914, "global_step": 359070, "epoch": 4326} {"train_loss": -25.619327545166016, "global_step": 359071, "epoch": 4326} {"train_loss": -25.730947494506836, "global_step": 359072, "epoch": 4326} {"train_loss": -25.43181800842285, "global_step": 359073, "epoch": 4326} {"train_loss": -26.085290908813477, "global_step": 359074, "epoch": 4326} {"train_loss": -26.0537166595459, "global_step": 359075, "epoch": 4326} {"train_loss": -25.7827091217041, "global_step": 359076, "epoch": 4326} {"train_loss": -26.197195053100586, "global_step": 359077, "epoch": 4326} {"train_loss": -26.14629554748535, "global_step": 359078, "epoch": 4326} {"train_loss": -26.184600830078125, "global_step": 359079, "epoch": 4326} {"train_loss": -25.505603790283203, "global_step": 359080, "epoch": 4326} {"train_loss": -26.04697608947754, "global_step": 359081, "epoch": 4326} {"train_loss": -26.329065322875977, "global_step": 359082, "epoch": 4326} {"train_loss": -25.724945068359375, "global_step": 359083, "epoch": 4326} {"train_loss": -25.774938583374023, "global_step": 359084, "epoch": 4326} {"train_loss": -26.169233322143555, "global_step": 359085, "epoch": 4326} {"train_loss": -25.9368896484375, "global_step": 359086, "epoch": 4326} {"train_loss": -26.4609432220459, "global_step": 359087, "epoch": 4326} {"train_loss": -25.812519073486328, "global_step": 359088, "epoch": 4326} {"train_loss": -26.334243774414062, "global_step": 359089, "epoch": 4326} {"train_loss": -26.56439781188965, "global_step": 359090, "epoch": 4326} {"train_loss": -26.743200302124023, "global_step": 359091, "epoch": 4326} {"train_loss": -26.046051025390625, "global_step": 359092, "epoch": 4326} {"train_loss": -26.478607177734375, "global_step": 359093, "epoch": 4326} {"train_loss": -26.562253952026367, "global_step": 359094, "epoch": 4326} {"train_loss": -26.325342178344727, "global_step": 359095, "epoch": 4326} {"train_loss": -26.41400146484375, "global_step": 359096, "epoch": 4326} {"train_loss": -26.366315841674805, "global_step": 359097, "epoch": 4326} {"train_loss": -26.46860694885254, "global_step": 359098, "epoch": 4326} {"train_loss": -26.509241104125977, "global_step": 359099, "epoch": 4326} {"train_loss": -26.617645263671875, "global_step": 359100, "epoch": 4326} {"train_loss": -26.757604598999023, "global_step": 359101, "epoch": 4326} {"train_loss": -26.377918243408203, "global_step": 359102, "epoch": 4326} {"train_loss": -26.209646224975586, "global_step": 359103, "epoch": 4326} {"train_loss": -26.383243560791016, "global_step": 359104, "epoch": 4326} {"train_loss": -26.48611831665039, "global_step": 359105, "epoch": 4326} {"train_loss": -26.677209854125977, "global_step": 359106, "epoch": 4326} {"train_loss": -26.47321891784668, "global_step": 359107, "epoch": 4326} {"train_loss": -26.8282413482666, "global_step": 359108, "epoch": 4326} {"train_loss": -26.543537139892578, "global_step": 359109, "epoch": 4326} {"train_loss": -26.44547462463379, "global_step": 359110, "epoch": 4326} {"train_loss": -26.704809188842773, "global_step": 359111, "epoch": 4326} {"train_loss": -26.470083236694336, "global_step": 359112, "epoch": 4326} {"train_loss": -26.050275802612305, "global_step": 359113, "epoch": 4326} {"train_loss": -25.9538631439209, "global_step": 359114, "epoch": 4326} {"train_loss": -25.77479362487793, "global_step": 359115, "epoch": 4326} {"train_loss": -26.310516357421875, "global_step": 359116, "epoch": 4326} {"train_loss": -25.741220474243164, "global_step": 359117, "epoch": 4326} {"train_loss": -25.906721115112305, "global_step": 359118, "epoch": 4326} {"train_loss": -25.706314086914062, "global_step": 359119, "epoch": 4326} {"train_loss": -26.027753829956055, "global_step": 359120, "epoch": 4326} {"train_loss": -26.249448776245117, "global_step": 359121, "epoch": 4326} {"train_loss": -26.032562255859375, "global_step": 359122, "epoch": 4326} {"train_loss": -26.033981323242188, "global_step": 359123, "epoch": 4326} {"train_loss": -25.9621524810791, "global_step": 359124, "epoch": 4326} {"train_loss": -26.056232452392578, "global_step": 359125, "epoch": 4326} {"train_loss": -25.690427780151367, "global_step": 359126, "epoch": 4326} {"train_loss": -25.784521102905273, "global_step": 359127, "epoch": 4326} {"train_loss": -25.7036190032959, "global_step": 359128, "epoch": 4326} {"train_loss": -26.332929611206055, "global_step": 359129, "epoch": 4326} {"train_loss": -26.165372848510742, "global_step": 359130, "epoch": 4326} {"train_loss": -26.16143226623535, "global_step": 359131, "epoch": 4326} {"train_loss": -26.07784080505371, "global_step": 359132, "epoch": 4326} {"train_loss": -26.322484970092773, "global_step": 359133, "epoch": 4326} {"train_loss": -26.171308517456055, "global_step": 359134, "epoch": 4326} {"train_loss": -26.557037353515625, "global_step": 359135, "epoch": 4326} {"train_loss": -26.1252384185791, "global_step": 359136, "epoch": 4326} {"train_loss": -26.049631118774414, "global_step": 359137, "epoch": 4326} {"train_loss": -26.447921752929688, "global_step": 359138, "epoch": 4326} {"train_loss": -26.4774112701416, "global_step": 359139, "epoch": 4326} {"train_loss": -26.089137847165027, "global_step": 359140, "epoch": 4326, "val_loss": 6482813.5} {"train_loss": -25.70261001586914, "global_step": 359141, "epoch": 4327} {"train_loss": -24.979019165039062, "global_step": 359142, "epoch": 4327} {"train_loss": -25.70490074157715, "global_step": 359143, "epoch": 4327} {"train_loss": -25.710840225219727, "global_step": 359144, "epoch": 4327} {"train_loss": -25.87189292907715, "global_step": 359145, "epoch": 4327} {"train_loss": -25.340972900390625, "global_step": 359146, "epoch": 4327} {"train_loss": -25.391382217407227, "global_step": 359147, "epoch": 4327} {"train_loss": -25.8154239654541, "global_step": 359148, "epoch": 4327} {"train_loss": -25.64802360534668, "global_step": 359149, "epoch": 4327} {"train_loss": -25.795480728149414, "global_step": 359150, "epoch": 4327} {"train_loss": -26.00030517578125, "global_step": 359151, "epoch": 4327} {"train_loss": -25.695661544799805, "global_step": 359152, "epoch": 4327} {"train_loss": -26.131153106689453, "global_step": 359153, "epoch": 4327} {"train_loss": -25.991064071655273, "global_step": 359154, "epoch": 4327} {"train_loss": -25.458505630493164, "global_step": 359155, "epoch": 4327} {"train_loss": -26.0908203125, "global_step": 359156, "epoch": 4327} {"train_loss": -25.402074813842773, "global_step": 359157, "epoch": 4327} {"train_loss": -25.827619552612305, "global_step": 359158, "epoch": 4327} {"train_loss": -25.816608428955078, "global_step": 359159, "epoch": 4327} {"train_loss": -25.9722900390625, "global_step": 359160, "epoch": 4327} {"train_loss": -26.022567749023438, "global_step": 359161, "epoch": 4327} {"train_loss": -26.255313873291016, "global_step": 359162, "epoch": 4327} {"train_loss": -25.994592666625977, "global_step": 359163, "epoch": 4327} {"train_loss": -26.156057357788086, "global_step": 359164, "epoch": 4327} {"train_loss": -25.772443771362305, "global_step": 359165, "epoch": 4327} {"train_loss": -26.0615177154541, "global_step": 359166, "epoch": 4327} {"train_loss": -26.073415756225586, "global_step": 359167, "epoch": 4327} {"train_loss": -26.025253295898438, "global_step": 359168, "epoch": 4327} {"train_loss": -26.00063133239746, "global_step": 359169, "epoch": 4327} {"train_loss": -26.19501304626465, "global_step": 359170, "epoch": 4327} {"train_loss": -25.866674423217773, "global_step": 359171, "epoch": 4327} {"train_loss": -26.059146881103516, "global_step": 359172, "epoch": 4327} {"train_loss": -26.13336753845215, "global_step": 359173, "epoch": 4327} {"train_loss": -26.312744140625, "global_step": 359174, "epoch": 4327} {"train_loss": -26.040058135986328, "global_step": 359175, "epoch": 4327} {"train_loss": -26.215253829956055, "global_step": 359176, "epoch": 4327} {"train_loss": -26.1448974609375, "global_step": 359177, "epoch": 4327} {"train_loss": -25.68231201171875, "global_step": 359178, "epoch": 4327} {"train_loss": -26.260517120361328, "global_step": 359179, "epoch": 4327} {"train_loss": -26.1219539642334, "global_step": 359180, "epoch": 4327} {"train_loss": -26.497928619384766, "global_step": 359181, "epoch": 4327} {"train_loss": -26.408069610595703, "global_step": 359182, "epoch": 4327} {"train_loss": -26.626983642578125, "global_step": 359183, "epoch": 4327} {"train_loss": -26.528934478759766, "global_step": 359184, "epoch": 4327} {"train_loss": -26.123123168945312, "global_step": 359185, "epoch": 4327} {"train_loss": -26.216644287109375, "global_step": 359186, "epoch": 4327} {"train_loss": -26.470203399658203, "global_step": 359187, "epoch": 4327} {"train_loss": -26.571802139282227, "global_step": 359188, "epoch": 4327} {"train_loss": -26.3953800201416, "global_step": 359189, "epoch": 4327} {"train_loss": -26.350879669189453, "global_step": 359190, "epoch": 4327} {"train_loss": -26.233356475830078, "global_step": 359191, "epoch": 4327} {"train_loss": -26.703781127929688, "global_step": 359192, "epoch": 4327} {"train_loss": -26.461212158203125, "global_step": 359193, "epoch": 4327} {"train_loss": -26.41377067565918, "global_step": 359194, "epoch": 4327} {"train_loss": -26.319400787353516, "global_step": 359195, "epoch": 4327} {"train_loss": -26.64472007751465, "global_step": 359196, "epoch": 4327} {"train_loss": -26.423725128173828, "global_step": 359197, "epoch": 4327} {"train_loss": -26.567453384399414, "global_step": 359198, "epoch": 4327} {"train_loss": -26.05555534362793, "global_step": 359199, "epoch": 4327} {"train_loss": -26.15033531188965, "global_step": 359200, "epoch": 4327} {"train_loss": -25.821380615234375, "global_step": 359201, "epoch": 4327} {"train_loss": -26.107269287109375, "global_step": 359202, "epoch": 4327} {"train_loss": -26.397247314453125, "global_step": 359203, "epoch": 4327} {"train_loss": -25.634485244750977, "global_step": 359204, "epoch": 4327} {"train_loss": -25.85888671875, "global_step": 359205, "epoch": 4327} {"train_loss": -26.459089279174805, "global_step": 359206, "epoch": 4327} {"train_loss": -26.3785343170166, "global_step": 359207, "epoch": 4327} {"train_loss": -26.228139877319336, "global_step": 359208, "epoch": 4327} {"train_loss": -26.562097549438477, "global_step": 359209, "epoch": 4327} {"train_loss": -26.07578468322754, "global_step": 359210, "epoch": 4327} {"train_loss": -26.59480094909668, "global_step": 359211, "epoch": 4327} {"train_loss": -26.331090927124023, "global_step": 359212, "epoch": 4327} {"train_loss": -26.231475830078125, "global_step": 359213, "epoch": 4327} {"train_loss": -26.19428062438965, "global_step": 359214, "epoch": 4327} {"train_loss": -26.316818237304688, "global_step": 359215, "epoch": 4327} {"train_loss": -26.095077514648438, "global_step": 359216, "epoch": 4327} {"train_loss": -25.918989181518555, "global_step": 359217, "epoch": 4327} {"train_loss": -26.25372886657715, "global_step": 359218, "epoch": 4327} {"train_loss": -26.05449867248535, "global_step": 359219, "epoch": 4327} {"train_loss": -25.561689376831055, "global_step": 359220, "epoch": 4327} {"train_loss": -26.20553970336914, "global_step": 359221, "epoch": 4327} {"train_loss": -26.206430435180664, "global_step": 359222, "epoch": 4327} {"train_loss": -26.078425809561487, "global_step": 359223, "epoch": 4327, "val_loss": 6544510.5} {"train_loss": -24.557043075561523, "global_step": 359224, "epoch": 4328} {"train_loss": -25.07731056213379, "global_step": 359225, "epoch": 4328} {"train_loss": -25.278982162475586, "global_step": 359226, "epoch": 4328} {"train_loss": -25.90496253967285, "global_step": 359227, "epoch": 4328} {"train_loss": -25.378782272338867, "global_step": 359228, "epoch": 4328} {"train_loss": -25.37782859802246, "global_step": 359229, "epoch": 4328} {"train_loss": -25.712369918823242, "global_step": 359230, "epoch": 4328} {"train_loss": -25.564176559448242, "global_step": 359231, "epoch": 4328} {"train_loss": -25.775217056274414, "global_step": 359232, "epoch": 4328} {"train_loss": -26.111608505249023, "global_step": 359233, "epoch": 4328} {"train_loss": -25.759851455688477, "global_step": 359234, "epoch": 4328} {"train_loss": -25.85859489440918, "global_step": 359235, "epoch": 4328} {"train_loss": -25.671812057495117, "global_step": 359236, "epoch": 4328} {"train_loss": -25.96209144592285, "global_step": 359237, "epoch": 4328} {"train_loss": -26.108224868774414, "global_step": 359238, "epoch": 4328} {"train_loss": -25.424480438232422, "global_step": 359239, "epoch": 4328} {"train_loss": -25.960187911987305, "global_step": 359240, "epoch": 4328} {"train_loss": -26.081090927124023, "global_step": 359241, "epoch": 4328} {"train_loss": -25.888967514038086, "global_step": 359242, "epoch": 4328} {"train_loss": -25.590011596679688, "global_step": 359243, "epoch": 4328} {"train_loss": -25.739822387695312, "global_step": 359244, "epoch": 4328} {"train_loss": -26.145883560180664, "global_step": 359245, "epoch": 4328} {"train_loss": -26.021366119384766, "global_step": 359246, "epoch": 4328} {"train_loss": -26.21677017211914, "global_step": 359247, "epoch": 4328} {"train_loss": -26.120935440063477, "global_step": 359248, "epoch": 4328} {"train_loss": -26.102375030517578, "global_step": 359249, "epoch": 4328} {"train_loss": -26.375823974609375, "global_step": 359250, "epoch": 4328} {"train_loss": -26.264196395874023, "global_step": 359251, "epoch": 4328} {"train_loss": -25.972997665405273, "global_step": 359252, "epoch": 4328} {"train_loss": -26.296838760375977, "global_step": 359253, "epoch": 4328} {"train_loss": -26.141401290893555, "global_step": 359254, "epoch": 4328} {"train_loss": -26.40447425842285, "global_step": 359255, "epoch": 4328} {"train_loss": -26.37116813659668, "global_step": 359256, "epoch": 4328} {"train_loss": -26.286157608032227, "global_step": 359257, "epoch": 4328} {"train_loss": -26.411762237548828, "global_step": 359258, "epoch": 4328} {"train_loss": -26.20855712890625, "global_step": 359259, "epoch": 4328} {"train_loss": -26.35261344909668, "global_step": 359260, "epoch": 4328} {"train_loss": -26.3931884765625, "global_step": 359261, "epoch": 4328} {"train_loss": -26.46015739440918, "global_step": 359262, "epoch": 4328} {"train_loss": -26.48211669921875, "global_step": 359263, "epoch": 4328} {"train_loss": -26.589996337890625, "global_step": 359264, "epoch": 4328} {"train_loss": -26.142688751220703, "global_step": 359265, "epoch": 4328} {"train_loss": -26.183216094970703, "global_step": 359266, "epoch": 4328} {"train_loss": -26.325666427612305, "global_step": 359267, "epoch": 4328} {"train_loss": -26.38442039489746, "global_step": 359268, "epoch": 4328} {"train_loss": -26.15716552734375, "global_step": 359269, "epoch": 4328} {"train_loss": -26.290897369384766, "global_step": 359270, "epoch": 4328} {"train_loss": -26.733356475830078, "global_step": 359271, "epoch": 4328} {"train_loss": -26.298019409179688, "global_step": 359272, "epoch": 4328} {"train_loss": -26.26198387145996, "global_step": 359273, "epoch": 4328} {"train_loss": -26.185407638549805, "global_step": 359274, "epoch": 4328} {"train_loss": -26.228336334228516, "global_step": 359275, "epoch": 4328} {"train_loss": -26.607099533081055, "global_step": 359276, "epoch": 4328} {"train_loss": -26.18303871154785, "global_step": 359277, "epoch": 4328} {"train_loss": -26.326568603515625, "global_step": 359278, "epoch": 4328} {"train_loss": -26.381444931030273, "global_step": 359279, "epoch": 4328} {"train_loss": -26.70149803161621, "global_step": 359280, "epoch": 4328} {"train_loss": -26.29642105102539, "global_step": 359281, "epoch": 4328} {"train_loss": -26.413745880126953, "global_step": 359282, "epoch": 4328} {"train_loss": -26.215368270874023, "global_step": 359283, "epoch": 4328} {"train_loss": -26.314788818359375, "global_step": 359284, "epoch": 4328} {"train_loss": -25.538843154907227, "global_step": 359285, "epoch": 4328} {"train_loss": -25.909393310546875, "global_step": 359286, "epoch": 4328} {"train_loss": -26.390380859375, "global_step": 359287, "epoch": 4328} {"train_loss": -26.2227840423584, "global_step": 359288, "epoch": 4328} {"train_loss": -26.204198837280273, "global_step": 359289, "epoch": 4328} {"train_loss": -26.792774200439453, "global_step": 359290, "epoch": 4328} {"train_loss": -25.91316032409668, "global_step": 359291, "epoch": 4328} {"train_loss": -26.36127281188965, "global_step": 359292, "epoch": 4328} {"train_loss": -26.104434967041016, "global_step": 359293, "epoch": 4328} {"train_loss": -26.538593292236328, "global_step": 359294, "epoch": 4328} {"train_loss": -26.508092880249023, "global_step": 359295, "epoch": 4328} {"train_loss": -25.65350341796875, "global_step": 359296, "epoch": 4328} {"train_loss": -26.206439971923828, "global_step": 359297, "epoch": 4328} {"train_loss": -26.2866268157959, "global_step": 359298, "epoch": 4328} {"train_loss": -26.398086547851562, "global_step": 359299, "epoch": 4328} {"train_loss": -25.96630859375, "global_step": 359300, "epoch": 4328} {"train_loss": -26.356504440307617, "global_step": 359301, "epoch": 4328} {"train_loss": -26.508237838745117, "global_step": 359302, "epoch": 4328} {"train_loss": -26.185094833374023, "global_step": 359303, "epoch": 4328} {"train_loss": -26.501501083374023, "global_step": 359304, "epoch": 4328} {"train_loss": -26.395063400268555, "global_step": 359305, "epoch": 4328} {"train_loss": -26.109937943607928, "global_step": 359306, "epoch": 4328, "val_loss": 6557495.0} {"train_loss": -24.158720016479492, "global_step": 359307, "epoch": 4329} {"train_loss": -21.654388427734375, "global_step": 359308, "epoch": 4329} {"train_loss": -23.59101104736328, "global_step": 359309, "epoch": 4329} {"train_loss": -25.150705337524414, "global_step": 359310, "epoch": 4329} {"train_loss": -22.94281578063965, "global_step": 359311, "epoch": 4329} {"train_loss": -24.392383575439453, "global_step": 359312, "epoch": 4329} {"train_loss": -25.023181915283203, "global_step": 359313, "epoch": 4329} {"train_loss": -24.620738983154297, "global_step": 359314, "epoch": 4329} {"train_loss": -24.958635330200195, "global_step": 359315, "epoch": 4329} {"train_loss": -24.961334228515625, "global_step": 359316, "epoch": 4329} {"train_loss": -24.793378829956055, "global_step": 359317, "epoch": 4329} {"train_loss": -24.833337783813477, "global_step": 359318, "epoch": 4329} {"train_loss": -25.7132568359375, "global_step": 359319, "epoch": 4329} {"train_loss": -25.014617919921875, "global_step": 359320, "epoch": 4329} {"train_loss": -24.99903678894043, "global_step": 359321, "epoch": 4329} {"train_loss": -25.112730026245117, "global_step": 359322, "epoch": 4329} {"train_loss": -24.95918083190918, "global_step": 359323, "epoch": 4329} {"train_loss": -25.22467041015625, "global_step": 359324, "epoch": 4329} {"train_loss": -25.221118927001953, "global_step": 359325, "epoch": 4329} {"train_loss": -25.189573287963867, "global_step": 359326, "epoch": 4329} {"train_loss": -25.40938377380371, "global_step": 359327, "epoch": 4329} {"train_loss": -25.191753387451172, "global_step": 359328, "epoch": 4329} {"train_loss": -25.269094467163086, "global_step": 359329, "epoch": 4329} {"train_loss": -25.557926177978516, "global_step": 359330, "epoch": 4329} {"train_loss": -25.469165802001953, "global_step": 359331, "epoch": 4329} {"train_loss": -25.207998275756836, "global_step": 359332, "epoch": 4329} {"train_loss": -25.323240280151367, "global_step": 359333, "epoch": 4329} {"train_loss": -25.46832275390625, "global_step": 359334, "epoch": 4329} {"train_loss": -25.61025047302246, "global_step": 359335, "epoch": 4329} {"train_loss": -25.66851234436035, "global_step": 359336, "epoch": 4329} {"train_loss": -25.95344352722168, "global_step": 359337, "epoch": 4329} {"train_loss": -25.97076988220215, "global_step": 359338, "epoch": 4329} {"train_loss": -25.53871726989746, "global_step": 359339, "epoch": 4329} {"train_loss": -26.1966609954834, "global_step": 359340, "epoch": 4329} {"train_loss": -25.98306655883789, "global_step": 359341, "epoch": 4329} {"train_loss": -25.848379135131836, "global_step": 359342, "epoch": 4329} {"train_loss": -25.94759178161621, "global_step": 359343, "epoch": 4329} {"train_loss": -25.999670028686523, "global_step": 359344, "epoch": 4329} {"train_loss": -25.973560333251953, "global_step": 359345, "epoch": 4329} {"train_loss": -26.13850212097168, "global_step": 359346, "epoch": 4329} {"train_loss": -26.146820068359375, "global_step": 359347, "epoch": 4329} {"train_loss": -26.177499771118164, "global_step": 359348, "epoch": 4329} {"train_loss": -26.462732315063477, "global_step": 359349, "epoch": 4329} {"train_loss": -26.160388946533203, "global_step": 359350, "epoch": 4329} {"train_loss": -25.94623374938965, "global_step": 359351, "epoch": 4329} {"train_loss": -26.101606369018555, "global_step": 359352, "epoch": 4329} {"train_loss": -25.953113555908203, "global_step": 359353, "epoch": 4329} {"train_loss": -26.24971580505371, "global_step": 359354, "epoch": 4329} {"train_loss": -26.438373565673828, "global_step": 359355, "epoch": 4329} {"train_loss": -26.48681640625, "global_step": 359356, "epoch": 4329} {"train_loss": -26.366369247436523, "global_step": 359357, "epoch": 4329} {"train_loss": -26.56696891784668, "global_step": 359358, "epoch": 4329} {"train_loss": -26.537668228149414, "global_step": 359359, "epoch": 4329} {"train_loss": -26.271991729736328, "global_step": 359360, "epoch": 4329} {"train_loss": -26.47308349609375, "global_step": 359361, "epoch": 4329} {"train_loss": -26.502470016479492, "global_step": 359362, "epoch": 4329} {"train_loss": -26.56448745727539, "global_step": 359363, "epoch": 4329} {"train_loss": -26.46950340270996, "global_step": 359364, "epoch": 4329} {"train_loss": -26.522809982299805, "global_step": 359365, "epoch": 4329} {"train_loss": -26.162921905517578, "global_step": 359366, "epoch": 4329} {"train_loss": -26.033212661743164, "global_step": 359367, "epoch": 4329} {"train_loss": -26.402875900268555, "global_step": 359368, "epoch": 4329} {"train_loss": -26.74761390686035, "global_step": 359369, "epoch": 4329} {"train_loss": -26.4932804107666, "global_step": 359370, "epoch": 4329} {"train_loss": -26.384140014648438, "global_step": 359371, "epoch": 4329} {"train_loss": -26.077905654907227, "global_step": 359372, "epoch": 4329} {"train_loss": -26.47173500061035, "global_step": 359373, "epoch": 4329} {"train_loss": -26.471649169921875, "global_step": 359374, "epoch": 4329} {"train_loss": -26.397253036499023, "global_step": 359375, "epoch": 4329} {"train_loss": -26.2979679107666, "global_step": 359376, "epoch": 4329} {"train_loss": -26.313735961914062, "global_step": 359377, "epoch": 4329} {"train_loss": -26.52911949157715, "global_step": 359378, "epoch": 4329} {"train_loss": -26.605833053588867, "global_step": 359379, "epoch": 4329} {"train_loss": -26.4016170501709, "global_step": 359380, "epoch": 4329} {"train_loss": -26.39728355407715, "global_step": 359381, "epoch": 4329} {"train_loss": -26.343130111694336, "global_step": 359382, "epoch": 4329} {"train_loss": -26.56416893005371, "global_step": 359383, "epoch": 4329} {"train_loss": -26.463953018188477, "global_step": 359384, "epoch": 4329} {"train_loss": -26.469165802001953, "global_step": 359385, "epoch": 4329} {"train_loss": -26.445987701416016, "global_step": 359386, "epoch": 4329} {"train_loss": -26.333545684814453, "global_step": 359387, "epoch": 4329} {"train_loss": -26.59482765197754, "global_step": 359388, "epoch": 4329} {"train_loss": -25.7861098783562, "global_step": 359389, "epoch": 4329, "val_loss": 6587347.5} {"train_loss": -25.16412925720215, "global_step": 359390, "epoch": 4330} {"train_loss": -24.184537887573242, "global_step": 359391, "epoch": 4330} {"train_loss": -25.2617244720459, "global_step": 359392, "epoch": 4330} {"train_loss": -25.188751220703125, "global_step": 359393, "epoch": 4330} {"train_loss": -24.678619384765625, "global_step": 359394, "epoch": 4330} {"train_loss": -25.211692810058594, "global_step": 359395, "epoch": 4330} {"train_loss": -24.98388671875, "global_step": 359396, "epoch": 4330} {"train_loss": -25.63044548034668, "global_step": 359397, "epoch": 4330} {"train_loss": -25.888898849487305, "global_step": 359398, "epoch": 4330} {"train_loss": -25.216594696044922, "global_step": 359399, "epoch": 4330} {"train_loss": -25.329574584960938, "global_step": 359400, "epoch": 4330} {"train_loss": -25.16359519958496, "global_step": 359401, "epoch": 4330} {"train_loss": -26.039350509643555, "global_step": 359402, "epoch": 4330} {"train_loss": -25.55765151977539, "global_step": 359403, "epoch": 4330} {"train_loss": -25.7014102935791, "global_step": 359404, "epoch": 4330} {"train_loss": -25.52747344970703, "global_step": 359405, "epoch": 4330} {"train_loss": -25.37349510192871, "global_step": 359406, "epoch": 4330} {"train_loss": -25.873441696166992, "global_step": 359407, "epoch": 4330} {"train_loss": -25.795568466186523, "global_step": 359408, "epoch": 4330} {"train_loss": -25.853361129760742, "global_step": 359409, "epoch": 4330} {"train_loss": -25.569398880004883, "global_step": 359410, "epoch": 4330} {"train_loss": -25.785009384155273, "global_step": 359411, "epoch": 4330} {"train_loss": -25.978185653686523, "global_step": 359412, "epoch": 4330} {"train_loss": -25.777170181274414, "global_step": 359413, "epoch": 4330} {"train_loss": -25.90723991394043, "global_step": 359414, "epoch": 4330} {"train_loss": -25.89362144470215, "global_step": 359415, "epoch": 4330} {"train_loss": -26.28400993347168, "global_step": 359416, "epoch": 4330} {"train_loss": -26.34307289123535, "global_step": 359417, "epoch": 4330} {"train_loss": -26.171527862548828, "global_step": 359418, "epoch": 4330} {"train_loss": -26.29345703125, "global_step": 359419, "epoch": 4330} {"train_loss": -26.47174072265625, "global_step": 359420, "epoch": 4330} {"train_loss": -26.3049373626709, "global_step": 359421, "epoch": 4330} {"train_loss": -26.103498458862305, "global_step": 359422, "epoch": 4330} {"train_loss": -26.113813400268555, "global_step": 359423, "epoch": 4330} {"train_loss": -26.166370391845703, "global_step": 359424, "epoch": 4330} {"train_loss": -26.002660751342773, "global_step": 359425, "epoch": 4330} {"train_loss": -26.045392990112305, "global_step": 359426, "epoch": 4330} {"train_loss": -26.132909774780273, "global_step": 359427, "epoch": 4330} {"train_loss": -26.19134521484375, "global_step": 359428, "epoch": 4330} {"train_loss": -26.363422393798828, "global_step": 359429, "epoch": 4330} {"train_loss": -26.39027214050293, "global_step": 359430, "epoch": 4330} {"train_loss": -26.191726684570312, "global_step": 359431, "epoch": 4330} {"train_loss": -26.28378677368164, "global_step": 359432, "epoch": 4330} {"train_loss": -26.332599639892578, "global_step": 359433, "epoch": 4330} {"train_loss": -26.08835220336914, "global_step": 359434, "epoch": 4330} {"train_loss": -26.126449584960938, "global_step": 359435, "epoch": 4330} {"train_loss": -26.554914474487305, "global_step": 359436, "epoch": 4330} {"train_loss": -26.584863662719727, "global_step": 359437, "epoch": 4330} {"train_loss": -26.270116806030273, "global_step": 359438, "epoch": 4330} {"train_loss": -26.284757614135742, "global_step": 359439, "epoch": 4330} {"train_loss": -26.379079818725586, "global_step": 359440, "epoch": 4330} {"train_loss": -26.18241310119629, "global_step": 359441, "epoch": 4330} {"train_loss": -26.70846939086914, "global_step": 359442, "epoch": 4330} {"train_loss": -26.68427848815918, "global_step": 359443, "epoch": 4330} {"train_loss": -26.307886123657227, "global_step": 359444, "epoch": 4330} {"train_loss": -26.435367584228516, "global_step": 359445, "epoch": 4330} {"train_loss": -26.688364028930664, "global_step": 359446, "epoch": 4330} {"train_loss": -26.31902503967285, "global_step": 359447, "epoch": 4330} {"train_loss": -26.377201080322266, "global_step": 359448, "epoch": 4330} {"train_loss": -26.677587509155273, "global_step": 359449, "epoch": 4330} {"train_loss": -26.38140869140625, "global_step": 359450, "epoch": 4330} {"train_loss": -26.715316772460938, "global_step": 359451, "epoch": 4330} {"train_loss": -26.225927352905273, "global_step": 359452, "epoch": 4330} {"train_loss": -26.33976173400879, "global_step": 359453, "epoch": 4330} {"train_loss": -26.251489639282227, "global_step": 359454, "epoch": 4330} {"train_loss": -26.283796310424805, "global_step": 359455, "epoch": 4330} {"train_loss": -26.245580673217773, "global_step": 359456, "epoch": 4330} {"train_loss": -26.664264678955078, "global_step": 359457, "epoch": 4330} {"train_loss": -26.475727081298828, "global_step": 359458, "epoch": 4330} {"train_loss": -26.153263092041016, "global_step": 359459, "epoch": 4330} {"train_loss": -26.594396591186523, "global_step": 359460, "epoch": 4330} {"train_loss": -26.457624435424805, "global_step": 359461, "epoch": 4330} {"train_loss": -26.390295028686523, "global_step": 359462, "epoch": 4330} {"train_loss": -26.338043212890625, "global_step": 359463, "epoch": 4330} {"train_loss": -26.314733505249023, "global_step": 359464, "epoch": 4330} {"train_loss": -26.106292724609375, "global_step": 359465, "epoch": 4330} {"train_loss": -25.226608276367188, "global_step": 359466, "epoch": 4330} {"train_loss": -25.49651336669922, "global_step": 359467, "epoch": 4330} {"train_loss": -25.3000431060791, "global_step": 359468, "epoch": 4330} {"train_loss": -26.23443603515625, "global_step": 359469, "epoch": 4330} {"train_loss": -26.057458877563477, "global_step": 359470, "epoch": 4330} {"train_loss": -26.836441040039062, "global_step": 359471, "epoch": 4330} {"train_loss": -26.041190204850164, "global_step": 359472, "epoch": 4330, "val_loss": 6812516.0} {"train_loss": -25.21610450744629, "global_step": 359473, "epoch": 4331} {"train_loss": -25.12360382080078, "global_step": 359474, "epoch": 4331} {"train_loss": -25.1978759765625, "global_step": 359475, "epoch": 4331} {"train_loss": -24.887598037719727, "global_step": 359476, "epoch": 4331} {"train_loss": -25.588266372680664, "global_step": 359477, "epoch": 4331} {"train_loss": -25.26368522644043, "global_step": 359478, "epoch": 4331} {"train_loss": -24.900419235229492, "global_step": 359479, "epoch": 4331} {"train_loss": -25.823139190673828, "global_step": 359480, "epoch": 4331} {"train_loss": -25.52894401550293, "global_step": 359481, "epoch": 4331} {"train_loss": -25.395395278930664, "global_step": 359482, "epoch": 4331} {"train_loss": -25.114906311035156, "global_step": 359483, "epoch": 4331} {"train_loss": -25.086471557617188, "global_step": 359484, "epoch": 4331} {"train_loss": -25.481821060180664, "global_step": 359485, "epoch": 4331} {"train_loss": -25.752918243408203, "global_step": 359486, "epoch": 4331} {"train_loss": -25.745010375976562, "global_step": 359487, "epoch": 4331} {"train_loss": -25.8531436920166, "global_step": 359488, "epoch": 4331} {"train_loss": -25.52823829650879, "global_step": 359489, "epoch": 4331} {"train_loss": -25.7100830078125, "global_step": 359490, "epoch": 4331} {"train_loss": -25.60200309753418, "global_step": 359491, "epoch": 4331} {"train_loss": -25.54514503479004, "global_step": 359492, "epoch": 4331} {"train_loss": -26.358856201171875, "global_step": 359493, "epoch": 4331} {"train_loss": -25.75372886657715, "global_step": 359494, "epoch": 4331} {"train_loss": -26.22161293029785, "global_step": 359495, "epoch": 4331} {"train_loss": -26.195669174194336, "global_step": 359496, "epoch": 4331} {"train_loss": -26.167844772338867, "global_step": 359497, "epoch": 4331} {"train_loss": -26.089492797851562, "global_step": 359498, "epoch": 4331} {"train_loss": -25.903766632080078, "global_step": 359499, "epoch": 4331} {"train_loss": -26.342294692993164, "global_step": 359500, "epoch": 4331} {"train_loss": -26.15345573425293, "global_step": 359501, "epoch": 4331} {"train_loss": -26.148603439331055, "global_step": 359502, "epoch": 4331} {"train_loss": -26.21785545349121, "global_step": 359503, "epoch": 4331} {"train_loss": -26.4007625579834, "global_step": 359504, "epoch": 4331} {"train_loss": -26.46332359313965, "global_step": 359505, "epoch": 4331} {"train_loss": -26.2238826751709, "global_step": 359506, "epoch": 4331} {"train_loss": -25.95942497253418, "global_step": 359507, "epoch": 4331} {"train_loss": -26.353900909423828, "global_step": 359508, "epoch": 4331} {"train_loss": -26.22174644470215, "global_step": 359509, "epoch": 4331} {"train_loss": -26.27583122253418, "global_step": 359510, "epoch": 4331} {"train_loss": -26.018457412719727, "global_step": 359511, "epoch": 4331} {"train_loss": -26.599843978881836, "global_step": 359512, "epoch": 4331} {"train_loss": -26.438573837280273, "global_step": 359513, "epoch": 4331} {"train_loss": -26.121076583862305, "global_step": 359514, "epoch": 4331} {"train_loss": -26.732379913330078, "global_step": 359515, "epoch": 4331} {"train_loss": -26.406803131103516, "global_step": 359516, "epoch": 4331} {"train_loss": -26.2994327545166, "global_step": 359517, "epoch": 4331} {"train_loss": -26.3671932220459, "global_step": 359518, "epoch": 4331} {"train_loss": -26.488061904907227, "global_step": 359519, "epoch": 4331} {"train_loss": -26.364538192749023, "global_step": 359520, "epoch": 4331} {"train_loss": -26.32843589782715, "global_step": 359521, "epoch": 4331} {"train_loss": -26.585906982421875, "global_step": 359522, "epoch": 4331} {"train_loss": -26.406208038330078, "global_step": 359523, "epoch": 4331} {"train_loss": -26.319202423095703, "global_step": 359524, "epoch": 4331} {"train_loss": -26.29827880859375, "global_step": 359525, "epoch": 4331} {"train_loss": -26.592243194580078, "global_step": 359526, "epoch": 4331} {"train_loss": -26.199487686157227, "global_step": 359527, "epoch": 4331} {"train_loss": -26.535587310791016, "global_step": 359528, "epoch": 4331} {"train_loss": -26.66853904724121, "global_step": 359529, "epoch": 4331} {"train_loss": -26.448789596557617, "global_step": 359530, "epoch": 4331} {"train_loss": -26.28944206237793, "global_step": 359531, "epoch": 4331} {"train_loss": -26.29091453552246, "global_step": 359532, "epoch": 4331} {"train_loss": -26.384754180908203, "global_step": 359533, "epoch": 4331} {"train_loss": -26.464963912963867, "global_step": 359534, "epoch": 4331} {"train_loss": -26.42095947265625, "global_step": 359535, "epoch": 4331} {"train_loss": -26.398733139038086, "global_step": 359536, "epoch": 4331} {"train_loss": -25.972766876220703, "global_step": 359537, "epoch": 4331} {"train_loss": -25.947162628173828, "global_step": 359538, "epoch": 4331} {"train_loss": -26.02362060546875, "global_step": 359539, "epoch": 4331} {"train_loss": -25.86402702331543, "global_step": 359540, "epoch": 4331} {"train_loss": -26.283798217773438, "global_step": 359541, "epoch": 4331} {"train_loss": -25.702436447143555, "global_step": 359542, "epoch": 4331} {"train_loss": -26.275232315063477, "global_step": 359543, "epoch": 4331} {"train_loss": -25.588191986083984, "global_step": 359544, "epoch": 4331} {"train_loss": -25.11981201171875, "global_step": 359545, "epoch": 4331} {"train_loss": -25.85158348083496, "global_step": 359546, "epoch": 4331} {"train_loss": -25.948049545288086, "global_step": 359547, "epoch": 4331} {"train_loss": -25.938032150268555, "global_step": 359548, "epoch": 4331} {"train_loss": -25.725767135620117, "global_step": 359549, "epoch": 4331} {"train_loss": -26.13651466369629, "global_step": 359550, "epoch": 4331} {"train_loss": -26.14796257019043, "global_step": 359551, "epoch": 4331} {"train_loss": -26.021764755249023, "global_step": 359552, "epoch": 4331} {"train_loss": -25.851964950561523, "global_step": 359553, "epoch": 4331} {"train_loss": -26.40814781188965, "global_step": 359554, "epoch": 4331} {"train_loss": -26.01817478042051, "global_step": 359555, "epoch": 4331, "val_loss": 6595495.0} {"train_loss": -25.47734832763672, "global_step": 359556, "epoch": 4332} {"train_loss": -25.6856689453125, "global_step": 359557, "epoch": 4332} {"train_loss": -25.800769805908203, "global_step": 359558, "epoch": 4332} {"train_loss": -25.62029457092285, "global_step": 359559, "epoch": 4332} {"train_loss": -25.59633445739746, "global_step": 359560, "epoch": 4332} {"train_loss": -25.499597549438477, "global_step": 359561, "epoch": 4332} {"train_loss": -25.637256622314453, "global_step": 359562, "epoch": 4332} {"train_loss": -26.008642196655273, "global_step": 359563, "epoch": 4332} {"train_loss": -25.893400192260742, "global_step": 359564, "epoch": 4332} {"train_loss": -25.90167808532715, "global_step": 359565, "epoch": 4332} {"train_loss": -26.059606552124023, "global_step": 359566, "epoch": 4332} {"train_loss": -26.03891372680664, "global_step": 359567, "epoch": 4332} {"train_loss": -26.004575729370117, "global_step": 359568, "epoch": 4332} {"train_loss": -25.77125358581543, "global_step": 359569, "epoch": 4332} {"train_loss": -26.014972686767578, "global_step": 359570, "epoch": 4332} {"train_loss": -26.052387237548828, "global_step": 359571, "epoch": 4332} {"train_loss": -25.83627700805664, "global_step": 359572, "epoch": 4332} {"train_loss": -25.878782272338867, "global_step": 359573, "epoch": 4332} {"train_loss": -26.294286727905273, "global_step": 359574, "epoch": 4332} {"train_loss": -26.165191650390625, "global_step": 359575, "epoch": 4332} {"train_loss": -26.08833122253418, "global_step": 359576, "epoch": 4332} {"train_loss": -26.546955108642578, "global_step": 359577, "epoch": 4332} {"train_loss": -26.149616241455078, "global_step": 359578, "epoch": 4332} {"train_loss": -26.02935218811035, "global_step": 359579, "epoch": 4332} {"train_loss": -25.967206954956055, "global_step": 359580, "epoch": 4332} {"train_loss": -26.300886154174805, "global_step": 359581, "epoch": 4332} {"train_loss": -26.02634620666504, "global_step": 359582, "epoch": 4332} {"train_loss": -25.925779342651367, "global_step": 359583, "epoch": 4332} {"train_loss": -26.199426651000977, "global_step": 359584, "epoch": 4332} {"train_loss": -26.05828857421875, "global_step": 359585, "epoch": 4332} {"train_loss": -25.97275733947754, "global_step": 359586, "epoch": 4332} {"train_loss": -26.134626388549805, "global_step": 359587, "epoch": 4332} {"train_loss": -25.8459529876709, "global_step": 359588, "epoch": 4332} {"train_loss": -26.546039581298828, "global_step": 359589, "epoch": 4332} {"train_loss": -25.884296417236328, "global_step": 359590, "epoch": 4332} {"train_loss": -26.137409210205078, "global_step": 359591, "epoch": 4332} {"train_loss": -26.1794490814209, "global_step": 359592, "epoch": 4332} {"train_loss": -26.03516960144043, "global_step": 359593, "epoch": 4332} {"train_loss": -26.3707275390625, "global_step": 359594, "epoch": 4332} {"train_loss": -26.450586318969727, "global_step": 359595, "epoch": 4332} {"train_loss": -26.37430763244629, "global_step": 359596, "epoch": 4332} {"train_loss": -26.6700382232666, "global_step": 359597, "epoch": 4332} {"train_loss": -26.361616134643555, "global_step": 359598, "epoch": 4332} {"train_loss": -26.5042724609375, "global_step": 359599, "epoch": 4332} {"train_loss": -26.247282028198242, "global_step": 359600, "epoch": 4332} {"train_loss": -26.41106605529785, "global_step": 359601, "epoch": 4332} {"train_loss": -26.0194091796875, "global_step": 359602, "epoch": 4332} {"train_loss": -26.165796279907227, "global_step": 359603, "epoch": 4332} {"train_loss": -26.52719497680664, "global_step": 359604, "epoch": 4332} {"train_loss": -26.655914306640625, "global_step": 359605, "epoch": 4332} {"train_loss": -26.595373153686523, "global_step": 359606, "epoch": 4332} {"train_loss": -26.540597915649414, "global_step": 359607, "epoch": 4332} {"train_loss": -26.539356231689453, "global_step": 359608, "epoch": 4332} {"train_loss": -26.73078727722168, "global_step": 359609, "epoch": 4332} {"train_loss": -26.256864547729492, "global_step": 359610, "epoch": 4332} {"train_loss": -26.309539794921875, "global_step": 359611, "epoch": 4332} {"train_loss": -26.41582679748535, "global_step": 359612, "epoch": 4332} {"train_loss": -26.45486831665039, "global_step": 359613, "epoch": 4332} {"train_loss": -26.461261749267578, "global_step": 359614, "epoch": 4332} {"train_loss": -26.3160343170166, "global_step": 359615, "epoch": 4332} {"train_loss": -25.86292839050293, "global_step": 359616, "epoch": 4332} {"train_loss": -26.338748931884766, "global_step": 359617, "epoch": 4332} {"train_loss": -26.38810157775879, "global_step": 359618, "epoch": 4332} {"train_loss": -26.236103057861328, "global_step": 359619, "epoch": 4332} {"train_loss": -26.20296287536621, "global_step": 359620, "epoch": 4332} {"train_loss": -26.187341690063477, "global_step": 359621, "epoch": 4332} {"train_loss": -26.663837432861328, "global_step": 359622, "epoch": 4332} {"train_loss": -26.23280143737793, "global_step": 359623, "epoch": 4332} {"train_loss": -26.462085723876953, "global_step": 359624, "epoch": 4332} {"train_loss": -26.27553367614746, "global_step": 359625, "epoch": 4332} {"train_loss": -26.600263595581055, "global_step": 359626, "epoch": 4332} {"train_loss": -26.617963790893555, "global_step": 359627, "epoch": 4332} {"train_loss": -26.637165069580078, "global_step": 359628, "epoch": 4332} {"train_loss": -26.324237823486328, "global_step": 359629, "epoch": 4332} {"train_loss": -26.445056915283203, "global_step": 359630, "epoch": 4332} {"train_loss": -26.450544357299805, "global_step": 359631, "epoch": 4332} {"train_loss": -25.941999435424805, "global_step": 359632, "epoch": 4332} {"train_loss": -26.20586585998535, "global_step": 359633, "epoch": 4332} {"train_loss": -26.452558517456055, "global_step": 359634, "epoch": 4332} {"train_loss": -25.955381393432617, "global_step": 359635, "epoch": 4332} {"train_loss": -26.42234230041504, "global_step": 359636, "epoch": 4332} {"train_loss": -26.314044952392578, "global_step": 359637, "epoch": 4332} {"train_loss": -26.194951252764966, "global_step": 359638, "epoch": 4332, "val_loss": 6489027.0} {"train_loss": -23.667583465576172, "global_step": 359639, "epoch": 4333} {"train_loss": -23.008380889892578, "global_step": 359640, "epoch": 4333} {"train_loss": -23.801559448242188, "global_step": 359641, "epoch": 4333} {"train_loss": -23.930036544799805, "global_step": 359642, "epoch": 4333} {"train_loss": -25.55909538269043, "global_step": 359643, "epoch": 4333} {"train_loss": -24.43461036682129, "global_step": 359644, "epoch": 4333} {"train_loss": -24.464370727539062, "global_step": 359645, "epoch": 4333} {"train_loss": -25.07071876525879, "global_step": 359646, "epoch": 4333} {"train_loss": -25.26434326171875, "global_step": 359647, "epoch": 4333} {"train_loss": -24.901275634765625, "global_step": 359648, "epoch": 4333} {"train_loss": -25.367841720581055, "global_step": 359649, "epoch": 4333} {"train_loss": -25.17418098449707, "global_step": 359650, "epoch": 4333} {"train_loss": -25.32684326171875, "global_step": 359651, "epoch": 4333} {"train_loss": -25.278425216674805, "global_step": 359652, "epoch": 4333} {"train_loss": -25.645360946655273, "global_step": 359653, "epoch": 4333} {"train_loss": -25.572423934936523, "global_step": 359654, "epoch": 4333} {"train_loss": -25.82484245300293, "global_step": 359655, "epoch": 4333} {"train_loss": -25.69227409362793, "global_step": 359656, "epoch": 4333} {"train_loss": -25.57916831970215, "global_step": 359657, "epoch": 4333} {"train_loss": -25.86163330078125, "global_step": 359658, "epoch": 4333} {"train_loss": -25.449386596679688, "global_step": 359659, "epoch": 4333} {"train_loss": -25.653913497924805, "global_step": 359660, "epoch": 4333} {"train_loss": -25.85964012145996, "global_step": 359661, "epoch": 4333} {"train_loss": -26.01239013671875, "global_step": 359662, "epoch": 4333} {"train_loss": -25.638273239135742, "global_step": 359663, "epoch": 4333} {"train_loss": -25.856679916381836, "global_step": 359664, "epoch": 4333} {"train_loss": -25.778722763061523, "global_step": 359665, "epoch": 4333} {"train_loss": -26.16306495666504, "global_step": 359666, "epoch": 4333} {"train_loss": -26.080286026000977, "global_step": 359667, "epoch": 4333} {"train_loss": -25.68299674987793, "global_step": 359668, "epoch": 4333} {"train_loss": -26.35918617248535, "global_step": 359669, "epoch": 4333} {"train_loss": -26.352935791015625, "global_step": 359670, "epoch": 4333} {"train_loss": -25.8282413482666, "global_step": 359671, "epoch": 4333} {"train_loss": -25.70985221862793, "global_step": 359672, "epoch": 4333} {"train_loss": -26.248798370361328, "global_step": 359673, "epoch": 4333} {"train_loss": -26.078765869140625, "global_step": 359674, "epoch": 4333} {"train_loss": -26.09541130065918, "global_step": 359675, "epoch": 4333} {"train_loss": -25.899744033813477, "global_step": 359676, "epoch": 4333} {"train_loss": -26.140066146850586, "global_step": 359677, "epoch": 4333} {"train_loss": -25.992650985717773, "global_step": 359678, "epoch": 4333} {"train_loss": -25.81606101989746, "global_step": 359679, "epoch": 4333} {"train_loss": -25.854135513305664, "global_step": 359680, "epoch": 4333} {"train_loss": -26.1821346282959, "global_step": 359681, "epoch": 4333} {"train_loss": -26.40142822265625, "global_step": 359682, "epoch": 4333} {"train_loss": -26.07696533203125, "global_step": 359683, "epoch": 4333} {"train_loss": -25.89432716369629, "global_step": 359684, "epoch": 4333} {"train_loss": -26.23394203186035, "global_step": 359685, "epoch": 4333} {"train_loss": -26.464038848876953, "global_step": 359686, "epoch": 4333} {"train_loss": -26.1757755279541, "global_step": 359687, "epoch": 4333} {"train_loss": -25.82329750061035, "global_step": 359688, "epoch": 4333} {"train_loss": -26.1202449798584, "global_step": 359689, "epoch": 4333} {"train_loss": -26.29108238220215, "global_step": 359690, "epoch": 4333} {"train_loss": -26.189685821533203, "global_step": 359691, "epoch": 4333} {"train_loss": -26.33086585998535, "global_step": 359692, "epoch": 4333} {"train_loss": -25.87135887145996, "global_step": 359693, "epoch": 4333} {"train_loss": -26.257658004760742, "global_step": 359694, "epoch": 4333} {"train_loss": -26.327844619750977, "global_step": 359695, "epoch": 4333} {"train_loss": -26.316137313842773, "global_step": 359696, "epoch": 4333} {"train_loss": -25.806028366088867, "global_step": 359697, "epoch": 4333} {"train_loss": -26.02902603149414, "global_step": 359698, "epoch": 4333} {"train_loss": -26.11159324645996, "global_step": 359699, "epoch": 4333} {"train_loss": -26.117969512939453, "global_step": 359700, "epoch": 4333} {"train_loss": -26.151975631713867, "global_step": 359701, "epoch": 4333} {"train_loss": -26.57037925720215, "global_step": 359702, "epoch": 4333} {"train_loss": -26.39641761779785, "global_step": 359703, "epoch": 4333} {"train_loss": -26.484724044799805, "global_step": 359704, "epoch": 4333} {"train_loss": -26.52560806274414, "global_step": 359705, "epoch": 4333} {"train_loss": -26.371856689453125, "global_step": 359706, "epoch": 4333} {"train_loss": -25.96746826171875, "global_step": 359707, "epoch": 4333} {"train_loss": -25.952808380126953, "global_step": 359708, "epoch": 4333} {"train_loss": -26.31849479675293, "global_step": 359709, "epoch": 4333} {"train_loss": -26.353330612182617, "global_step": 359710, "epoch": 4333} {"train_loss": -26.078067779541016, "global_step": 359711, "epoch": 4333} {"train_loss": -25.69318199157715, "global_step": 359712, "epoch": 4333} {"train_loss": -25.762496948242188, "global_step": 359713, "epoch": 4333} {"train_loss": -25.9835147857666, "global_step": 359714, "epoch": 4333} {"train_loss": -25.8550968170166, "global_step": 359715, "epoch": 4333} {"train_loss": -26.170881271362305, "global_step": 359716, "epoch": 4333} {"train_loss": -26.21150016784668, "global_step": 359717, "epoch": 4333} {"train_loss": -26.100238800048828, "global_step": 359718, "epoch": 4333} {"train_loss": -26.596128463745117, "global_step": 359719, "epoch": 4333} {"train_loss": -25.89851188659668, "global_step": 359720, "epoch": 4333} {"train_loss": -25.815458941172405, "global_step": 359721, "epoch": 4333, "val_loss": 6572064.0} {"train_loss": -26.226648330688477, "global_step": 359722, "epoch": 4334} {"train_loss": -25.773401260375977, "global_step": 359723, "epoch": 4334} {"train_loss": -26.001821517944336, "global_step": 359724, "epoch": 4334} {"train_loss": -26.03628921508789, "global_step": 359725, "epoch": 4334} {"train_loss": -25.78769302368164, "global_step": 359726, "epoch": 4334} {"train_loss": -26.209186553955078, "global_step": 359727, "epoch": 4334} {"train_loss": -25.853424072265625, "global_step": 359728, "epoch": 4334} {"train_loss": -26.08778190612793, "global_step": 359729, "epoch": 4334} {"train_loss": -25.878314971923828, "global_step": 359730, "epoch": 4334} {"train_loss": -26.354047775268555, "global_step": 359731, "epoch": 4334} {"train_loss": -26.304224014282227, "global_step": 359732, "epoch": 4334} {"train_loss": -26.32659339904785, "global_step": 359733, "epoch": 4334} {"train_loss": -26.2707462310791, "global_step": 359734, "epoch": 4334} {"train_loss": -26.317846298217773, "global_step": 359735, "epoch": 4334} {"train_loss": -26.55953025817871, "global_step": 359736, "epoch": 4334} {"train_loss": -26.30872917175293, "global_step": 359737, "epoch": 4334} {"train_loss": -26.132434844970703, "global_step": 359738, "epoch": 4334} {"train_loss": -26.1765079498291, "global_step": 359739, "epoch": 4334} {"train_loss": -26.21002769470215, "global_step": 359740, "epoch": 4334} {"train_loss": -26.322967529296875, "global_step": 359741, "epoch": 4334} {"train_loss": -26.1046142578125, "global_step": 359742, "epoch": 4334} {"train_loss": -25.99655532836914, "global_step": 359743, "epoch": 4334} {"train_loss": -26.0357666015625, "global_step": 359744, "epoch": 4334} {"train_loss": -26.001508712768555, "global_step": 359745, "epoch": 4334} {"train_loss": -25.84992027282715, "global_step": 359746, "epoch": 4334} {"train_loss": -26.232446670532227, "global_step": 359747, "epoch": 4334} {"train_loss": -25.962711334228516, "global_step": 359748, "epoch": 4334} {"train_loss": -26.498193740844727, "global_step": 359749, "epoch": 4334} {"train_loss": -26.247528076171875, "global_step": 359750, "epoch": 4334} {"train_loss": -26.213642120361328, "global_step": 359751, "epoch": 4334} {"train_loss": -26.244550704956055, "global_step": 359752, "epoch": 4334} {"train_loss": -26.52225685119629, "global_step": 359753, "epoch": 4334} {"train_loss": -26.445343017578125, "global_step": 359754, "epoch": 4334} {"train_loss": -26.34396743774414, "global_step": 359755, "epoch": 4334} {"train_loss": -26.26356315612793, "global_step": 359756, "epoch": 4334} {"train_loss": -26.427249908447266, "global_step": 359757, "epoch": 4334} {"train_loss": -26.4074764251709, "global_step": 359758, "epoch": 4334} {"train_loss": -26.381641387939453, "global_step": 359759, "epoch": 4334} {"train_loss": -26.3821964263916, "global_step": 359760, "epoch": 4334} {"train_loss": -25.866241455078125, "global_step": 359761, "epoch": 4334} {"train_loss": -26.58462905883789, "global_step": 359762, "epoch": 4334} {"train_loss": -26.508453369140625, "global_step": 359763, "epoch": 4334} {"train_loss": -26.673507690429688, "global_step": 359764, "epoch": 4334} {"train_loss": -26.197132110595703, "global_step": 359765, "epoch": 4334} {"train_loss": -26.43194007873535, "global_step": 359766, "epoch": 4334} {"train_loss": -26.509973526000977, "global_step": 359767, "epoch": 4334} {"train_loss": -26.36652183532715, "global_step": 359768, "epoch": 4334} {"train_loss": -26.577228546142578, "global_step": 359769, "epoch": 4334} {"train_loss": -26.073612213134766, "global_step": 359770, "epoch": 4334} {"train_loss": -26.708005905151367, "global_step": 359771, "epoch": 4334} {"train_loss": -26.437793731689453, "global_step": 359772, "epoch": 4334} {"train_loss": -26.739444732666016, "global_step": 359773, "epoch": 4334} {"train_loss": -26.25898551940918, "global_step": 359774, "epoch": 4334} {"train_loss": -26.460474014282227, "global_step": 359775, "epoch": 4334} {"train_loss": -26.253263473510742, "global_step": 359776, "epoch": 4334} {"train_loss": -26.463464736938477, "global_step": 359777, "epoch": 4334} {"train_loss": -26.44479751586914, "global_step": 359778, "epoch": 4334} {"train_loss": -26.52253532409668, "global_step": 359779, "epoch": 4334} {"train_loss": -26.276142120361328, "global_step": 359780, "epoch": 4334} {"train_loss": -26.596343994140625, "global_step": 359781, "epoch": 4334} {"train_loss": -26.3667049407959, "global_step": 359782, "epoch": 4334} {"train_loss": -26.47220230102539, "global_step": 359783, "epoch": 4334} {"train_loss": -26.40943717956543, "global_step": 359784, "epoch": 4334} {"train_loss": -26.4558048248291, "global_step": 359785, "epoch": 4334} {"train_loss": -26.281946182250977, "global_step": 359786, "epoch": 4334} {"train_loss": -26.525375366210938, "global_step": 359787, "epoch": 4334} {"train_loss": -26.32545280456543, "global_step": 359788, "epoch": 4334} {"train_loss": -26.422943115234375, "global_step": 359789, "epoch": 4334} {"train_loss": -26.1273136138916, "global_step": 359790, "epoch": 4334} {"train_loss": -25.868112564086914, "global_step": 359791, "epoch": 4334} {"train_loss": -26.4106502532959, "global_step": 359792, "epoch": 4334} {"train_loss": -26.643125534057617, "global_step": 359793, "epoch": 4334} {"train_loss": -26.1265926361084, "global_step": 359794, "epoch": 4334} {"train_loss": -25.82146644592285, "global_step": 359795, "epoch": 4334} {"train_loss": -26.052778244018555, "global_step": 359796, "epoch": 4334} {"train_loss": -26.004791259765625, "global_step": 359797, "epoch": 4334} {"train_loss": -25.839130401611328, "global_step": 359798, "epoch": 4334} {"train_loss": -26.12835693359375, "global_step": 359799, "epoch": 4334} {"train_loss": -25.969221115112305, "global_step": 359800, "epoch": 4334} {"train_loss": -26.060291290283203, "global_step": 359801, "epoch": 4334} {"train_loss": -26.147016525268555, "global_step": 359802, "epoch": 4334} {"train_loss": -25.7901611328125, "global_step": 359803, "epoch": 4334} {"train_loss": -26.24782755288733, "global_step": 359804, "epoch": 4334, "val_loss": 6585607.0} {"train_loss": -25.520797729492188, "global_step": 359805, "epoch": 4335} {"train_loss": -25.864545822143555, "global_step": 359806, "epoch": 4335} {"train_loss": -25.701416015625, "global_step": 359807, "epoch": 4335} {"train_loss": -25.5452823638916, "global_step": 359808, "epoch": 4335} {"train_loss": -25.85445213317871, "global_step": 359809, "epoch": 4335} {"train_loss": -26.087894439697266, "global_step": 359810, "epoch": 4335} {"train_loss": -25.539871215820312, "global_step": 359811, "epoch": 4335} {"train_loss": -25.461536407470703, "global_step": 359812, "epoch": 4335} {"train_loss": -25.49090003967285, "global_step": 359813, "epoch": 4335} {"train_loss": -26.130889892578125, "global_step": 359814, "epoch": 4335} {"train_loss": -25.78013038635254, "global_step": 359815, "epoch": 4335} {"train_loss": -25.953022003173828, "global_step": 359816, "epoch": 4335} {"train_loss": -25.533607482910156, "global_step": 359817, "epoch": 4335} {"train_loss": -26.040903091430664, "global_step": 359818, "epoch": 4335} {"train_loss": -25.81780433654785, "global_step": 359819, "epoch": 4335} {"train_loss": -26.322193145751953, "global_step": 359820, "epoch": 4335} {"train_loss": -26.05324363708496, "global_step": 359821, "epoch": 4335} {"train_loss": -25.761560440063477, "global_step": 359822, "epoch": 4335} {"train_loss": -26.198190689086914, "global_step": 359823, "epoch": 4335} {"train_loss": -26.01582145690918, "global_step": 359824, "epoch": 4335} {"train_loss": -26.111547470092773, "global_step": 359825, "epoch": 4335} {"train_loss": -26.055877685546875, "global_step": 359826, "epoch": 4335} {"train_loss": -26.306753158569336, "global_step": 359827, "epoch": 4335} {"train_loss": -26.124603271484375, "global_step": 359828, "epoch": 4335} {"train_loss": -26.335615158081055, "global_step": 359829, "epoch": 4335} {"train_loss": -26.5263671875, "global_step": 359830, "epoch": 4335} {"train_loss": -26.444747924804688, "global_step": 359831, "epoch": 4335} {"train_loss": -26.358850479125977, "global_step": 359832, "epoch": 4335} {"train_loss": -26.29633903503418, "global_step": 359833, "epoch": 4335} {"train_loss": -26.70804786682129, "global_step": 359834, "epoch": 4335} {"train_loss": -26.298603057861328, "global_step": 359835, "epoch": 4335} {"train_loss": -25.947589874267578, "global_step": 359836, "epoch": 4335} {"train_loss": -26.171247482299805, "global_step": 359837, "epoch": 4335} {"train_loss": -26.05535316467285, "global_step": 359838, "epoch": 4335} {"train_loss": -26.2255802154541, "global_step": 359839, "epoch": 4335} {"train_loss": -26.081018447875977, "global_step": 359840, "epoch": 4335} {"train_loss": -26.04109001159668, "global_step": 359841, "epoch": 4335} {"train_loss": -26.334402084350586, "global_step": 359842, "epoch": 4335} {"train_loss": -26.219684600830078, "global_step": 359843, "epoch": 4335} {"train_loss": -26.13197135925293, "global_step": 359844, "epoch": 4335} {"train_loss": -26.270471572875977, "global_step": 359845, "epoch": 4335} {"train_loss": -26.2576904296875, "global_step": 359846, "epoch": 4335} {"train_loss": -26.10089683532715, "global_step": 359847, "epoch": 4335} {"train_loss": -26.08954429626465, "global_step": 359848, "epoch": 4335} {"train_loss": -26.43280601501465, "global_step": 359849, "epoch": 4335} {"train_loss": -26.50374412536621, "global_step": 359850, "epoch": 4335} {"train_loss": -26.224462509155273, "global_step": 359851, "epoch": 4335} {"train_loss": -26.053430557250977, "global_step": 359852, "epoch": 4335} {"train_loss": -26.46347427368164, "global_step": 359853, "epoch": 4335} {"train_loss": -26.20576286315918, "global_step": 359854, "epoch": 4335} {"train_loss": -26.29389762878418, "global_step": 359855, "epoch": 4335} {"train_loss": -25.8378963470459, "global_step": 359856, "epoch": 4335} {"train_loss": -25.80803871154785, "global_step": 359857, "epoch": 4335} {"train_loss": -26.0530948638916, "global_step": 359858, "epoch": 4335} {"train_loss": -26.466176986694336, "global_step": 359859, "epoch": 4335} {"train_loss": -25.881591796875, "global_step": 359860, "epoch": 4335} {"train_loss": -25.234716415405273, "global_step": 359861, "epoch": 4335} {"train_loss": -24.903663635253906, "global_step": 359862, "epoch": 4335} {"train_loss": -25.911121368408203, "global_step": 359863, "epoch": 4335} {"train_loss": -26.037153244018555, "global_step": 359864, "epoch": 4335} {"train_loss": -25.72376823425293, "global_step": 359865, "epoch": 4335} {"train_loss": -25.87251091003418, "global_step": 359866, "epoch": 4335} {"train_loss": -25.7343807220459, "global_step": 359867, "epoch": 4335} {"train_loss": -26.052692413330078, "global_step": 359868, "epoch": 4335} {"train_loss": -25.990320205688477, "global_step": 359869, "epoch": 4335} {"train_loss": -26.00642967224121, "global_step": 359870, "epoch": 4335} {"train_loss": -26.298248291015625, "global_step": 359871, "epoch": 4335} {"train_loss": -25.950490951538086, "global_step": 359872, "epoch": 4335} {"train_loss": -25.7418212890625, "global_step": 359873, "epoch": 4335} {"train_loss": -25.857919692993164, "global_step": 359874, "epoch": 4335} {"train_loss": -25.940174102783203, "global_step": 359875, "epoch": 4335} {"train_loss": -26.336164474487305, "global_step": 359876, "epoch": 4335} {"train_loss": -26.116262435913086, "global_step": 359877, "epoch": 4335} {"train_loss": -25.609472274780273, "global_step": 359878, "epoch": 4335} {"train_loss": -26.402667999267578, "global_step": 359879, "epoch": 4335} {"train_loss": -25.95509147644043, "global_step": 359880, "epoch": 4335} {"train_loss": -26.60190773010254, "global_step": 359881, "epoch": 4335} {"train_loss": -25.978317260742188, "global_step": 359882, "epoch": 4335} {"train_loss": -26.025449752807617, "global_step": 359883, "epoch": 4335} {"train_loss": -26.596338272094727, "global_step": 359884, "epoch": 4335} {"train_loss": -26.107946395874023, "global_step": 359885, "epoch": 4335} {"train_loss": -26.390018463134766, "global_step": 359886, "epoch": 4335} {"train_loss": -26.04900258994964, "global_step": 359887, "epoch": 4335, "val_loss": 6502403.0} {"train_loss": -25.930871963500977, "global_step": 359888, "epoch": 4336} {"train_loss": -25.89095115661621, "global_step": 359889, "epoch": 4336} {"train_loss": -25.843820571899414, "global_step": 359890, "epoch": 4336} {"train_loss": -26.05586051940918, "global_step": 359891, "epoch": 4336} {"train_loss": -26.099639892578125, "global_step": 359892, "epoch": 4336} {"train_loss": -26.075580596923828, "global_step": 359893, "epoch": 4336} {"train_loss": -26.07330322265625, "global_step": 359894, "epoch": 4336} {"train_loss": -25.998123168945312, "global_step": 359895, "epoch": 4336} {"train_loss": -25.858661651611328, "global_step": 359896, "epoch": 4336} {"train_loss": -25.92899513244629, "global_step": 359897, "epoch": 4336} {"train_loss": -25.943180084228516, "global_step": 359898, "epoch": 4336} {"train_loss": -26.257169723510742, "global_step": 359899, "epoch": 4336} {"train_loss": -26.128625869750977, "global_step": 359900, "epoch": 4336} {"train_loss": -26.307926177978516, "global_step": 359901, "epoch": 4336} {"train_loss": -25.6807918548584, "global_step": 359902, "epoch": 4336} {"train_loss": -26.160846710205078, "global_step": 359903, "epoch": 4336} {"train_loss": -26.37239646911621, "global_step": 359904, "epoch": 4336} {"train_loss": -26.10422706604004, "global_step": 359905, "epoch": 4336} {"train_loss": -26.212310791015625, "global_step": 359906, "epoch": 4336} {"train_loss": -26.200159072875977, "global_step": 359907, "epoch": 4336} {"train_loss": -26.27312660217285, "global_step": 359908, "epoch": 4336} {"train_loss": -26.526229858398438, "global_step": 359909, "epoch": 4336} {"train_loss": -26.577280044555664, "global_step": 359910, "epoch": 4336} {"train_loss": -26.5954647064209, "global_step": 359911, "epoch": 4336} {"train_loss": -25.991439819335938, "global_step": 359912, "epoch": 4336} {"train_loss": -26.4604549407959, "global_step": 359913, "epoch": 4336} {"train_loss": -26.167438507080078, "global_step": 359914, "epoch": 4336} {"train_loss": -26.616107940673828, "global_step": 359915, "epoch": 4336} {"train_loss": -26.0321044921875, "global_step": 359916, "epoch": 4336} {"train_loss": -26.40044593811035, "global_step": 359917, "epoch": 4336} {"train_loss": -26.627471923828125, "global_step": 359918, "epoch": 4336} {"train_loss": -26.6707820892334, "global_step": 359919, "epoch": 4336} {"train_loss": -26.6540470123291, "global_step": 359920, "epoch": 4336} {"train_loss": -26.529254913330078, "global_step": 359921, "epoch": 4336} {"train_loss": -26.418859481811523, "global_step": 359922, "epoch": 4336} {"train_loss": -26.4384708404541, "global_step": 359923, "epoch": 4336} {"train_loss": -26.529123306274414, "global_step": 359924, "epoch": 4336} {"train_loss": -26.71754264831543, "global_step": 359925, "epoch": 4336} {"train_loss": -26.240278244018555, "global_step": 359926, "epoch": 4336} {"train_loss": -26.061172485351562, "global_step": 359927, "epoch": 4336} {"train_loss": -26.279850006103516, "global_step": 359928, "epoch": 4336} {"train_loss": -26.19753074645996, "global_step": 359929, "epoch": 4336} {"train_loss": -26.465137481689453, "global_step": 359930, "epoch": 4336} {"train_loss": -25.893295288085938, "global_step": 359931, "epoch": 4336} {"train_loss": -26.012624740600586, "global_step": 359932, "epoch": 4336} {"train_loss": -25.897663116455078, "global_step": 359933, "epoch": 4336} {"train_loss": -26.19927406311035, "global_step": 359934, "epoch": 4336} {"train_loss": -26.073612213134766, "global_step": 359935, "epoch": 4336} {"train_loss": -25.551908493041992, "global_step": 359936, "epoch": 4336} {"train_loss": -25.901975631713867, "global_step": 359937, "epoch": 4336} {"train_loss": -26.0856876373291, "global_step": 359938, "epoch": 4336} {"train_loss": -25.943578720092773, "global_step": 359939, "epoch": 4336} {"train_loss": -25.853185653686523, "global_step": 359940, "epoch": 4336} {"train_loss": -26.121545791625977, "global_step": 359941, "epoch": 4336} {"train_loss": -26.143152236938477, "global_step": 359942, "epoch": 4336} {"train_loss": -26.33282470703125, "global_step": 359943, "epoch": 4336} {"train_loss": -25.795202255249023, "global_step": 359944, "epoch": 4336} {"train_loss": -25.655858993530273, "global_step": 359945, "epoch": 4336} {"train_loss": -26.161848068237305, "global_step": 359946, "epoch": 4336} {"train_loss": -26.003894805908203, "global_step": 359947, "epoch": 4336} {"train_loss": -26.246023178100586, "global_step": 359948, "epoch": 4336} {"train_loss": -26.137052536010742, "global_step": 359949, "epoch": 4336} {"train_loss": -26.31062889099121, "global_step": 359950, "epoch": 4336} {"train_loss": -26.122411727905273, "global_step": 359951, "epoch": 4336} {"train_loss": -25.75308609008789, "global_step": 359952, "epoch": 4336} {"train_loss": -26.427383422851562, "global_step": 359953, "epoch": 4336} {"train_loss": -26.316442489624023, "global_step": 359954, "epoch": 4336} {"train_loss": -26.367895126342773, "global_step": 359955, "epoch": 4336} {"train_loss": -25.8951358795166, "global_step": 359956, "epoch": 4336} {"train_loss": -26.317127227783203, "global_step": 359957, "epoch": 4336} {"train_loss": -26.563217163085938, "global_step": 359958, "epoch": 4336} {"train_loss": -26.016448974609375, "global_step": 359959, "epoch": 4336} {"train_loss": -25.913970947265625, "global_step": 359960, "epoch": 4336} {"train_loss": -26.347349166870117, "global_step": 359961, "epoch": 4336} {"train_loss": -26.449060440063477, "global_step": 359962, "epoch": 4336} {"train_loss": -25.938337326049805, "global_step": 359963, "epoch": 4336} {"train_loss": -25.977991104125977, "global_step": 359964, "epoch": 4336} {"train_loss": -25.9677734375, "global_step": 359965, "epoch": 4336} {"train_loss": -26.10504150390625, "global_step": 359966, "epoch": 4336} {"train_loss": -26.51717185974121, "global_step": 359967, "epoch": 4336} {"train_loss": -26.352523803710938, "global_step": 359968, "epoch": 4336} {"train_loss": -26.188129425048828, "global_step": 359969, "epoch": 4336} {"train_loss": -26.171694330422277, "global_step": 359970, "epoch": 4336, "val_loss": 6662677.5} {"train_loss": -26.079757690429688, "global_step": 359971, "epoch": 4337} {"train_loss": -26.110702514648438, "global_step": 359972, "epoch": 4337} {"train_loss": -26.26746940612793, "global_step": 359973, "epoch": 4337} {"train_loss": -26.076913833618164, "global_step": 359974, "epoch": 4337} {"train_loss": -25.8681697845459, "global_step": 359975, "epoch": 4337} {"train_loss": -26.084735870361328, "global_step": 359976, "epoch": 4337} {"train_loss": -26.140705108642578, "global_step": 359977, "epoch": 4337} {"train_loss": -25.725366592407227, "global_step": 359978, "epoch": 4337} {"train_loss": -26.41226577758789, "global_step": 359979, "epoch": 4337} {"train_loss": -25.769174575805664, "global_step": 359980, "epoch": 4337} {"train_loss": -25.932409286499023, "global_step": 359981, "epoch": 4337} {"train_loss": -26.055891036987305, "global_step": 359982, "epoch": 4337} {"train_loss": -26.011301040649414, "global_step": 359983, "epoch": 4337} {"train_loss": -25.854846954345703, "global_step": 359984, "epoch": 4337} {"train_loss": -26.227521896362305, "global_step": 359985, "epoch": 4337} {"train_loss": -26.33717918395996, "global_step": 359986, "epoch": 4337} {"train_loss": -26.033954620361328, "global_step": 359987, "epoch": 4337} {"train_loss": -26.03643798828125, "global_step": 359988, "epoch": 4337} {"train_loss": -26.3055477142334, "global_step": 359989, "epoch": 4337} {"train_loss": -26.400129318237305, "global_step": 359990, "epoch": 4337} {"train_loss": -26.391080856323242, "global_step": 359991, "epoch": 4337} {"train_loss": -26.178125381469727, "global_step": 359992, "epoch": 4337} {"train_loss": -26.106372833251953, "global_step": 359993, "epoch": 4337} {"train_loss": -26.428680419921875, "global_step": 359994, "epoch": 4337} {"train_loss": -26.381717681884766, "global_step": 359995, "epoch": 4337} {"train_loss": -26.188526153564453, "global_step": 359996, "epoch": 4337} {"train_loss": -26.216962814331055, "global_step": 359997, "epoch": 4337} {"train_loss": -26.499103546142578, "global_step": 359998, "epoch": 4337} {"train_loss": -26.55280876159668, "global_step": 359999, "epoch": 4337} {"train_loss": -26.305871963500977, "global_step": 360000, "epoch": 4337} {"train_loss": -26.665266036987305, "global_step": 360001, "epoch": 4337} {"train_loss": -26.73655128479004, "global_step": 360002, "epoch": 4337} {"train_loss": -26.0018367767334, "global_step": 360003, "epoch": 4337} {"train_loss": -26.5425968170166, "global_step": 360004, "epoch": 4337} {"train_loss": -26.595239639282227, "global_step": 360005, "epoch": 4337} {"train_loss": -26.622394561767578, "global_step": 360006, "epoch": 4337} {"train_loss": -26.422317504882812, "global_step": 360007, "epoch": 4337} {"train_loss": -26.726682662963867, "global_step": 360008, "epoch": 4337} {"train_loss": -26.497663497924805, "global_step": 360009, "epoch": 4337} {"train_loss": -26.632858276367188, "global_step": 360010, "epoch": 4337} {"train_loss": -26.526464462280273, "global_step": 360011, "epoch": 4337} {"train_loss": -26.28792381286621, "global_step": 360012, "epoch": 4337} {"train_loss": -26.13006019592285, "global_step": 360013, "epoch": 4337} {"train_loss": -26.287744522094727, "global_step": 360014, "epoch": 4337} {"train_loss": -26.010028839111328, "global_step": 360015, "epoch": 4337} {"train_loss": -26.437850952148438, "global_step": 360016, "epoch": 4337} {"train_loss": -26.656599044799805, "global_step": 360017, "epoch": 4337} {"train_loss": -26.63752555847168, "global_step": 360018, "epoch": 4337} {"train_loss": -26.269311904907227, "global_step": 360019, "epoch": 4337} {"train_loss": -26.299362182617188, "global_step": 360020, "epoch": 4337} {"train_loss": -25.422292709350586, "global_step": 360021, "epoch": 4337} {"train_loss": -25.7390079498291, "global_step": 360022, "epoch": 4337} {"train_loss": -25.455913543701172, "global_step": 360023, "epoch": 4337} {"train_loss": -26.72914695739746, "global_step": 360024, "epoch": 4337} {"train_loss": -25.79522705078125, "global_step": 360025, "epoch": 4337} {"train_loss": -25.671674728393555, "global_step": 360026, "epoch": 4337} {"train_loss": -26.50381851196289, "global_step": 360027, "epoch": 4337} {"train_loss": -25.790143966674805, "global_step": 360028, "epoch": 4337} {"train_loss": -26.461095809936523, "global_step": 360029, "epoch": 4337} {"train_loss": -25.7375431060791, "global_step": 360030, "epoch": 4337} {"train_loss": -25.86322021484375, "global_step": 360031, "epoch": 4337} {"train_loss": -25.933828353881836, "global_step": 360032, "epoch": 4337} {"train_loss": -26.115049362182617, "global_step": 360033, "epoch": 4337} {"train_loss": -25.956815719604492, "global_step": 360034, "epoch": 4337} {"train_loss": -26.02691078186035, "global_step": 360035, "epoch": 4337} {"train_loss": -26.114791870117188, "global_step": 360036, "epoch": 4337} {"train_loss": -26.19169044494629, "global_step": 360037, "epoch": 4337} {"train_loss": -25.915851593017578, "global_step": 360038, "epoch": 4337} {"train_loss": -25.873010635375977, "global_step": 360039, "epoch": 4337} {"train_loss": -25.80426025390625, "global_step": 360040, "epoch": 4337} {"train_loss": -25.918867111206055, "global_step": 360041, "epoch": 4337} {"train_loss": -25.999425888061523, "global_step": 360042, "epoch": 4337} {"train_loss": -25.771825790405273, "global_step": 360043, "epoch": 4337} {"train_loss": -26.16377067565918, "global_step": 360044, "epoch": 4337} {"train_loss": -26.242944717407227, "global_step": 360045, "epoch": 4337} {"train_loss": -26.19021987915039, "global_step": 360046, "epoch": 4337} {"train_loss": -25.695636749267578, "global_step": 360047, "epoch": 4337} {"train_loss": -26.152999877929688, "global_step": 360048, "epoch": 4337} {"train_loss": -25.95123863220215, "global_step": 360049, "epoch": 4337} {"train_loss": -26.269882202148438, "global_step": 360050, "epoch": 4337} {"train_loss": -25.99880027770996, "global_step": 360051, "epoch": 4337} {"train_loss": -25.798023223876953, "global_step": 360052, "epoch": 4337} {"train_loss": -26.174934272306512, "global_step": 360053, "epoch": 4337, "val_loss": 6620220.5} {"train_loss": -25.30392837524414, "global_step": 360054, "epoch": 4338} {"train_loss": -25.876483917236328, "global_step": 360055, "epoch": 4338} {"train_loss": -25.16330337524414, "global_step": 360056, "epoch": 4338} {"train_loss": -25.343839645385742, "global_step": 360057, "epoch": 4338} {"train_loss": -25.0670223236084, "global_step": 360058, "epoch": 4338} {"train_loss": -25.227123260498047, "global_step": 360059, "epoch": 4338} {"train_loss": -25.09071159362793, "global_step": 360060, "epoch": 4338} {"train_loss": -25.82131004333496, "global_step": 360061, "epoch": 4338} {"train_loss": -25.75251579284668, "global_step": 360062, "epoch": 4338} {"train_loss": -25.487504959106445, "global_step": 360063, "epoch": 4338} {"train_loss": -25.743698120117188, "global_step": 360064, "epoch": 4338} {"train_loss": -25.988971710205078, "global_step": 360065, "epoch": 4338} {"train_loss": -25.752063751220703, "global_step": 360066, "epoch": 4338} {"train_loss": -25.875415802001953, "global_step": 360067, "epoch": 4338} {"train_loss": -26.306310653686523, "global_step": 360068, "epoch": 4338} {"train_loss": -25.933889389038086, "global_step": 360069, "epoch": 4338} {"train_loss": -25.915250778198242, "global_step": 360070, "epoch": 4338} {"train_loss": -26.026233673095703, "global_step": 360071, "epoch": 4338} {"train_loss": -26.1640682220459, "global_step": 360072, "epoch": 4338} {"train_loss": -25.867996215820312, "global_step": 360073, "epoch": 4338} {"train_loss": -26.149017333984375, "global_step": 360074, "epoch": 4338} {"train_loss": -25.957611083984375, "global_step": 360075, "epoch": 4338} {"train_loss": -25.984375, "global_step": 360076, "epoch": 4338} {"train_loss": -26.176055908203125, "global_step": 360077, "epoch": 4338} {"train_loss": -26.102582931518555, "global_step": 360078, "epoch": 4338} {"train_loss": -25.961206436157227, "global_step": 360079, "epoch": 4338} {"train_loss": -26.497446060180664, "global_step": 360080, "epoch": 4338} {"train_loss": -25.96647071838379, "global_step": 360081, "epoch": 4338} {"train_loss": -26.294082641601562, "global_step": 360082, "epoch": 4338} {"train_loss": -25.99560546875, "global_step": 360083, "epoch": 4338} {"train_loss": -26.292129516601562, "global_step": 360084, "epoch": 4338} {"train_loss": -25.969289779663086, "global_step": 360085, "epoch": 4338} {"train_loss": -26.157611846923828, "global_step": 360086, "epoch": 4338} {"train_loss": -26.086740493774414, "global_step": 360087, "epoch": 4338} {"train_loss": -26.22116470336914, "global_step": 360088, "epoch": 4338} {"train_loss": -26.066442489624023, "global_step": 360089, "epoch": 4338} {"train_loss": -25.93023109436035, "global_step": 360090, "epoch": 4338} {"train_loss": -26.558332443237305, "global_step": 360091, "epoch": 4338} {"train_loss": -26.3240966796875, "global_step": 360092, "epoch": 4338} {"train_loss": -26.093952178955078, "global_step": 360093, "epoch": 4338} {"train_loss": -26.504602432250977, "global_step": 360094, "epoch": 4338} {"train_loss": -26.51026725769043, "global_step": 360095, "epoch": 4338} {"train_loss": -26.5553035736084, "global_step": 360096, "epoch": 4338} {"train_loss": -26.296478271484375, "global_step": 360097, "epoch": 4338} {"train_loss": -26.0289306640625, "global_step": 360098, "epoch": 4338} {"train_loss": -26.567615509033203, "global_step": 360099, "epoch": 4338} {"train_loss": -26.325971603393555, "global_step": 360100, "epoch": 4338} {"train_loss": -26.592493057250977, "global_step": 360101, "epoch": 4338} {"train_loss": -26.430023193359375, "global_step": 360102, "epoch": 4338} {"train_loss": -26.012069702148438, "global_step": 360103, "epoch": 4338} {"train_loss": -26.3074951171875, "global_step": 360104, "epoch": 4338} {"train_loss": -26.451520919799805, "global_step": 360105, "epoch": 4338} {"train_loss": -26.164770126342773, "global_step": 360106, "epoch": 4338} {"train_loss": -26.209131240844727, "global_step": 360107, "epoch": 4338} {"train_loss": -26.1407470703125, "global_step": 360108, "epoch": 4338} {"train_loss": -26.580829620361328, "global_step": 360109, "epoch": 4338} {"train_loss": -26.154937744140625, "global_step": 360110, "epoch": 4338} {"train_loss": -26.368871688842773, "global_step": 360111, "epoch": 4338} {"train_loss": -26.153905868530273, "global_step": 360112, "epoch": 4338} {"train_loss": -26.453388214111328, "global_step": 360113, "epoch": 4338} {"train_loss": -26.37635612487793, "global_step": 360114, "epoch": 4338} {"train_loss": -26.413272857666016, "global_step": 360115, "epoch": 4338} {"train_loss": -25.790958404541016, "global_step": 360116, "epoch": 4338} {"train_loss": -25.775653839111328, "global_step": 360117, "epoch": 4338} {"train_loss": -25.66095542907715, "global_step": 360118, "epoch": 4338} {"train_loss": -26.166915893554688, "global_step": 360119, "epoch": 4338} {"train_loss": -26.331640243530273, "global_step": 360120, "epoch": 4338} {"train_loss": -26.029356002807617, "global_step": 360121, "epoch": 4338} {"train_loss": -26.1395263671875, "global_step": 360122, "epoch": 4338} {"train_loss": -26.150588989257812, "global_step": 360123, "epoch": 4338} {"train_loss": -26.414854049682617, "global_step": 360124, "epoch": 4338} {"train_loss": -26.394775390625, "global_step": 360125, "epoch": 4338} {"train_loss": -25.99855613708496, "global_step": 360126, "epoch": 4338} {"train_loss": -26.204309463500977, "global_step": 360127, "epoch": 4338} {"train_loss": -25.860504150390625, "global_step": 360128, "epoch": 4338} {"train_loss": -26.53909683227539, "global_step": 360129, "epoch": 4338} {"train_loss": -25.98736572265625, "global_step": 360130, "epoch": 4338} {"train_loss": -25.887479782104492, "global_step": 360131, "epoch": 4338} {"train_loss": -26.008853912353516, "global_step": 360132, "epoch": 4338} {"train_loss": -26.396167755126953, "global_step": 360133, "epoch": 4338} {"train_loss": -26.21011734008789, "global_step": 360134, "epoch": 4338} {"train_loss": -26.290876388549805, "global_step": 360135, "epoch": 4338} {"train_loss": -26.098730156220586, "global_step": 360136, "epoch": 4338, "val_loss": 6553192.0} {"train_loss": -25.952051162719727, "global_step": 360137, "epoch": 4339} {"train_loss": -26.145187377929688, "global_step": 360138, "epoch": 4339} {"train_loss": -26.3118953704834, "global_step": 360139, "epoch": 4339} {"train_loss": -25.959238052368164, "global_step": 360140, "epoch": 4339} {"train_loss": -25.916696548461914, "global_step": 360141, "epoch": 4339} {"train_loss": -25.875314712524414, "global_step": 360142, "epoch": 4339} {"train_loss": -25.77411460876465, "global_step": 360143, "epoch": 4339} {"train_loss": -26.201642990112305, "global_step": 360144, "epoch": 4339} {"train_loss": -26.30463981628418, "global_step": 360145, "epoch": 4339} {"train_loss": -26.129535675048828, "global_step": 360146, "epoch": 4339} {"train_loss": -26.1483154296875, "global_step": 360147, "epoch": 4339} {"train_loss": -25.814350128173828, "global_step": 360148, "epoch": 4339} {"train_loss": -25.990406036376953, "global_step": 360149, "epoch": 4339} {"train_loss": -25.838048934936523, "global_step": 360150, "epoch": 4339} {"train_loss": -26.0339298248291, "global_step": 360151, "epoch": 4339} {"train_loss": -26.127206802368164, "global_step": 360152, "epoch": 4339} {"train_loss": -25.66340446472168, "global_step": 360153, "epoch": 4339} {"train_loss": -25.957181930541992, "global_step": 360154, "epoch": 4339} {"train_loss": -26.373016357421875, "global_step": 360155, "epoch": 4339} {"train_loss": -26.479211807250977, "global_step": 360156, "epoch": 4339} {"train_loss": -26.0051326751709, "global_step": 360157, "epoch": 4339} {"train_loss": -26.236164093017578, "global_step": 360158, "epoch": 4339} {"train_loss": -26.146087646484375, "global_step": 360159, "epoch": 4339} {"train_loss": -26.45364761352539, "global_step": 360160, "epoch": 4339} {"train_loss": -26.10552406311035, "global_step": 360161, "epoch": 4339} {"train_loss": -26.1041316986084, "global_step": 360162, "epoch": 4339} {"train_loss": -26.239765167236328, "global_step": 360163, "epoch": 4339} {"train_loss": -26.345508575439453, "global_step": 360164, "epoch": 4339} {"train_loss": -26.24957847595215, "global_step": 360165, "epoch": 4339} {"train_loss": -26.112768173217773, "global_step": 360166, "epoch": 4339} {"train_loss": -25.97633171081543, "global_step": 360167, "epoch": 4339} {"train_loss": -26.504196166992188, "global_step": 360168, "epoch": 4339} {"train_loss": -26.375574111938477, "global_step": 360169, "epoch": 4339} {"train_loss": -26.400922775268555, "global_step": 360170, "epoch": 4339} {"train_loss": -26.359100341796875, "global_step": 360171, "epoch": 4339} {"train_loss": -26.19232177734375, "global_step": 360172, "epoch": 4339} {"train_loss": -26.372634887695312, "global_step": 360173, "epoch": 4339} {"train_loss": -25.72251319885254, "global_step": 360174, "epoch": 4339} {"train_loss": -26.007770538330078, "global_step": 360175, "epoch": 4339} {"train_loss": -26.080244064331055, "global_step": 360176, "epoch": 4339} {"train_loss": -26.38088035583496, "global_step": 360177, "epoch": 4339} {"train_loss": -26.164525985717773, "global_step": 360178, "epoch": 4339} {"train_loss": -26.12662124633789, "global_step": 360179, "epoch": 4339} {"train_loss": -26.146093368530273, "global_step": 360180, "epoch": 4339} {"train_loss": -26.46864128112793, "global_step": 360181, "epoch": 4339} {"train_loss": -26.0925235748291, "global_step": 360182, "epoch": 4339} {"train_loss": -26.433027267456055, "global_step": 360183, "epoch": 4339} {"train_loss": -26.496509552001953, "global_step": 360184, "epoch": 4339} {"train_loss": -26.223957061767578, "global_step": 360185, "epoch": 4339} {"train_loss": -26.09808921813965, "global_step": 360186, "epoch": 4339} {"train_loss": -26.073760986328125, "global_step": 360187, "epoch": 4339} {"train_loss": -26.1439208984375, "global_step": 360188, "epoch": 4339} {"train_loss": -26.453046798706055, "global_step": 360189, "epoch": 4339} {"train_loss": -26.168170928955078, "global_step": 360190, "epoch": 4339} {"train_loss": -25.84270668029785, "global_step": 360191, "epoch": 4339} {"train_loss": -26.070363998413086, "global_step": 360192, "epoch": 4339} {"train_loss": -26.171112060546875, "global_step": 360193, "epoch": 4339} {"train_loss": -26.027698516845703, "global_step": 360194, "epoch": 4339} {"train_loss": -26.060331344604492, "global_step": 360195, "epoch": 4339} {"train_loss": -26.358850479125977, "global_step": 360196, "epoch": 4339} {"train_loss": -26.32832908630371, "global_step": 360197, "epoch": 4339} {"train_loss": -26.224390029907227, "global_step": 360198, "epoch": 4339} {"train_loss": -26.074560165405273, "global_step": 360199, "epoch": 4339} {"train_loss": -26.4848575592041, "global_step": 360200, "epoch": 4339} {"train_loss": -26.427732467651367, "global_step": 360201, "epoch": 4339} {"train_loss": -26.26899528503418, "global_step": 360202, "epoch": 4339} {"train_loss": -26.173410415649414, "global_step": 360203, "epoch": 4339} {"train_loss": -26.226593017578125, "global_step": 360204, "epoch": 4339} {"train_loss": -26.580358505249023, "global_step": 360205, "epoch": 4339} {"train_loss": -26.598669052124023, "global_step": 360206, "epoch": 4339} {"train_loss": -26.24274253845215, "global_step": 360207, "epoch": 4339} {"train_loss": -26.397815704345703, "global_step": 360208, "epoch": 4339} {"train_loss": -26.291967391967773, "global_step": 360209, "epoch": 4339} {"train_loss": -26.42563247680664, "global_step": 360210, "epoch": 4339} {"train_loss": -26.797504425048828, "global_step": 360211, "epoch": 4339} {"train_loss": -25.94683837890625, "global_step": 360212, "epoch": 4339} {"train_loss": -26.35506248474121, "global_step": 360213, "epoch": 4339} {"train_loss": -26.671051025390625, "global_step": 360214, "epoch": 4339} {"train_loss": -26.419736862182617, "global_step": 360215, "epoch": 4339} {"train_loss": -26.506072998046875, "global_step": 360216, "epoch": 4339} {"train_loss": -26.215986251831055, "global_step": 360217, "epoch": 4339} {"train_loss": -26.154895782470703, "global_step": 360218, "epoch": 4339} {"train_loss": -26.20765552750553, "global_step": 360219, "epoch": 4339, "val_loss": 6546170.0} {"train_loss": -22.42983055114746, "global_step": 360220, "epoch": 4340} {"train_loss": -23.73019790649414, "global_step": 360221, "epoch": 4340} {"train_loss": -23.465831756591797, "global_step": 360222, "epoch": 4340} {"train_loss": -23.94222068786621, "global_step": 360223, "epoch": 4340} {"train_loss": -24.935468673706055, "global_step": 360224, "epoch": 4340} {"train_loss": -24.307546615600586, "global_step": 360225, "epoch": 4340} {"train_loss": -23.953258514404297, "global_step": 360226, "epoch": 4340} {"train_loss": -24.586790084838867, "global_step": 360227, "epoch": 4340} {"train_loss": -24.477516174316406, "global_step": 360228, "epoch": 4340} {"train_loss": -24.980403900146484, "global_step": 360229, "epoch": 4340} {"train_loss": -24.864431381225586, "global_step": 360230, "epoch": 4340} {"train_loss": -24.668787002563477, "global_step": 360231, "epoch": 4340} {"train_loss": -25.302404403686523, "global_step": 360232, "epoch": 4340} {"train_loss": -24.905248641967773, "global_step": 360233, "epoch": 4340} {"train_loss": -25.14118194580078, "global_step": 360234, "epoch": 4340} {"train_loss": -25.553897857666016, "global_step": 360235, "epoch": 4340} {"train_loss": -25.280393600463867, "global_step": 360236, "epoch": 4340} {"train_loss": -25.09012222290039, "global_step": 360237, "epoch": 4340} {"train_loss": -25.513065338134766, "global_step": 360238, "epoch": 4340} {"train_loss": -25.36313819885254, "global_step": 360239, "epoch": 4340} {"train_loss": -25.18180274963379, "global_step": 360240, "epoch": 4340} {"train_loss": -25.248462677001953, "global_step": 360241, "epoch": 4340} {"train_loss": -25.53999137878418, "global_step": 360242, "epoch": 4340} {"train_loss": -25.527795791625977, "global_step": 360243, "epoch": 4340} {"train_loss": -25.431100845336914, "global_step": 360244, "epoch": 4340} {"train_loss": -25.03241539001465, "global_step": 360245, "epoch": 4340} {"train_loss": -25.500476837158203, "global_step": 360246, "epoch": 4340} {"train_loss": -25.806644439697266, "global_step": 360247, "epoch": 4340} {"train_loss": -25.767663955688477, "global_step": 360248, "epoch": 4340} {"train_loss": -25.67405128479004, "global_step": 360249, "epoch": 4340} {"train_loss": -26.024185180664062, "global_step": 360250, "epoch": 4340} {"train_loss": -25.672882080078125, "global_step": 360251, "epoch": 4340} {"train_loss": -25.959518432617188, "global_step": 360252, "epoch": 4340} {"train_loss": -25.985288619995117, "global_step": 360253, "epoch": 4340} {"train_loss": -26.01468276977539, "global_step": 360254, "epoch": 4340} {"train_loss": -26.243249893188477, "global_step": 360255, "epoch": 4340} {"train_loss": -26.230451583862305, "global_step": 360256, "epoch": 4340} {"train_loss": -25.9161376953125, "global_step": 360257, "epoch": 4340} {"train_loss": -26.136220932006836, "global_step": 360258, "epoch": 4340} {"train_loss": -25.995834350585938, "global_step": 360259, "epoch": 4340} {"train_loss": -26.248397827148438, "global_step": 360260, "epoch": 4340} {"train_loss": -25.94183349609375, "global_step": 360261, "epoch": 4340} {"train_loss": -25.810718536376953, "global_step": 360262, "epoch": 4340} {"train_loss": -26.333784103393555, "global_step": 360263, "epoch": 4340} {"train_loss": -26.260772705078125, "global_step": 360264, "epoch": 4340} {"train_loss": -26.1863956451416, "global_step": 360265, "epoch": 4340} {"train_loss": -26.016891479492188, "global_step": 360266, "epoch": 4340} {"train_loss": -26.177276611328125, "global_step": 360267, "epoch": 4340} {"train_loss": -26.035978317260742, "global_step": 360268, "epoch": 4340} {"train_loss": -26.322677612304688, "global_step": 360269, "epoch": 4340} {"train_loss": -26.288705825805664, "global_step": 360270, "epoch": 4340} {"train_loss": -26.081207275390625, "global_step": 360271, "epoch": 4340} {"train_loss": -26.050642013549805, "global_step": 360272, "epoch": 4340} {"train_loss": -26.158981323242188, "global_step": 360273, "epoch": 4340} {"train_loss": -26.284826278686523, "global_step": 360274, "epoch": 4340} {"train_loss": -26.314626693725586, "global_step": 360275, "epoch": 4340} {"train_loss": -26.31862449645996, "global_step": 360276, "epoch": 4340} {"train_loss": -25.897607803344727, "global_step": 360277, "epoch": 4340} {"train_loss": -26.356901168823242, "global_step": 360278, "epoch": 4340} {"train_loss": -26.271045684814453, "global_step": 360279, "epoch": 4340} {"train_loss": -25.81351089477539, "global_step": 360280, "epoch": 4340} {"train_loss": -25.945999145507812, "global_step": 360281, "epoch": 4340} {"train_loss": -25.468189239501953, "global_step": 360282, "epoch": 4340} {"train_loss": -26.247486114501953, "global_step": 360283, "epoch": 4340} {"train_loss": -26.446271896362305, "global_step": 360284, "epoch": 4340} {"train_loss": -26.116199493408203, "global_step": 360285, "epoch": 4340} {"train_loss": -26.052392959594727, "global_step": 360286, "epoch": 4340} {"train_loss": -26.235021591186523, "global_step": 360287, "epoch": 4340} {"train_loss": -26.2165584564209, "global_step": 360288, "epoch": 4340} {"train_loss": -26.468393325805664, "global_step": 360289, "epoch": 4340} {"train_loss": -26.355518341064453, "global_step": 360290, "epoch": 4340} {"train_loss": -26.396448135375977, "global_step": 360291, "epoch": 4340} {"train_loss": -26.678802490234375, "global_step": 360292, "epoch": 4340} {"train_loss": -26.75274658203125, "global_step": 360293, "epoch": 4340} {"train_loss": -26.33112144470215, "global_step": 360294, "epoch": 4340} {"train_loss": -26.372848510742188, "global_step": 360295, "epoch": 4340} {"train_loss": -26.57771873474121, "global_step": 360296, "epoch": 4340} {"train_loss": -26.25446128845215, "global_step": 360297, "epoch": 4340} {"train_loss": -26.21211051940918, "global_step": 360298, "epoch": 4340} {"train_loss": -26.725982666015625, "global_step": 360299, "epoch": 4340} {"train_loss": -25.88947105407715, "global_step": 360300, "epoch": 4340} {"train_loss": -26.013599395751953, "global_step": 360301, "epoch": 4340} {"train_loss": -25.717117907053016, "global_step": 360302, "epoch": 4340, "val_loss": 6603791.0} {"train_loss": -26.342252731323242, "global_step": 360303, "epoch": 4341} {"train_loss": -25.980798721313477, "global_step": 360304, "epoch": 4341} {"train_loss": -26.251108169555664, "global_step": 360305, "epoch": 4341} {"train_loss": -26.2637996673584, "global_step": 360306, "epoch": 4341} {"train_loss": -25.98628044128418, "global_step": 360307, "epoch": 4341} {"train_loss": -26.417158126831055, "global_step": 360308, "epoch": 4341} {"train_loss": -26.0414981842041, "global_step": 360309, "epoch": 4341} {"train_loss": -26.38887596130371, "global_step": 360310, "epoch": 4341} {"train_loss": -26.4185733795166, "global_step": 360311, "epoch": 4341} {"train_loss": -26.136951446533203, "global_step": 360312, "epoch": 4341} {"train_loss": -26.290109634399414, "global_step": 360313, "epoch": 4341} {"train_loss": -26.533496856689453, "global_step": 360314, "epoch": 4341} {"train_loss": -26.294458389282227, "global_step": 360315, "epoch": 4341} {"train_loss": -26.197675704956055, "global_step": 360316, "epoch": 4341} {"train_loss": -26.143857955932617, "global_step": 360317, "epoch": 4341} {"train_loss": -25.8837833404541, "global_step": 360318, "epoch": 4341} {"train_loss": -26.306543350219727, "global_step": 360319, "epoch": 4341} {"train_loss": -25.922870635986328, "global_step": 360320, "epoch": 4341} {"train_loss": -26.42219352722168, "global_step": 360321, "epoch": 4341} {"train_loss": -26.178577423095703, "global_step": 360322, "epoch": 4341} {"train_loss": -26.363977432250977, "global_step": 360323, "epoch": 4341} {"train_loss": -25.7864990234375, "global_step": 360324, "epoch": 4341} {"train_loss": -26.082447052001953, "global_step": 360325, "epoch": 4341} {"train_loss": -26.204343795776367, "global_step": 360326, "epoch": 4341} {"train_loss": -26.323816299438477, "global_step": 360327, "epoch": 4341} {"train_loss": -26.3859920501709, "global_step": 360328, "epoch": 4341} {"train_loss": -26.369552612304688, "global_step": 360329, "epoch": 4341} {"train_loss": -26.239423751831055, "global_step": 360330, "epoch": 4341} {"train_loss": -26.595890045166016, "global_step": 360331, "epoch": 4341} {"train_loss": -26.36567497253418, "global_step": 360332, "epoch": 4341} {"train_loss": -26.283390045166016, "global_step": 360333, "epoch": 4341} {"train_loss": -26.44242286682129, "global_step": 360334, "epoch": 4341} {"train_loss": -26.387027740478516, "global_step": 360335, "epoch": 4341} {"train_loss": -26.435129165649414, "global_step": 360336, "epoch": 4341} {"train_loss": -26.025571823120117, "global_step": 360337, "epoch": 4341} {"train_loss": -26.277008056640625, "global_step": 360338, "epoch": 4341} {"train_loss": -26.12176513671875, "global_step": 360339, "epoch": 4341} {"train_loss": -26.446868896484375, "global_step": 360340, "epoch": 4341} {"train_loss": -26.142822265625, "global_step": 360341, "epoch": 4341} {"train_loss": -26.25160026550293, "global_step": 360342, "epoch": 4341} {"train_loss": -26.89206314086914, "global_step": 360343, "epoch": 4341} {"train_loss": -25.99017906188965, "global_step": 360344, "epoch": 4341} {"train_loss": -26.20134925842285, "global_step": 360345, "epoch": 4341} {"train_loss": -26.312925338745117, "global_step": 360346, "epoch": 4341} {"train_loss": -26.612018585205078, "global_step": 360347, "epoch": 4341} {"train_loss": -26.198759078979492, "global_step": 360348, "epoch": 4341} {"train_loss": -25.65077018737793, "global_step": 360349, "epoch": 4341} {"train_loss": -26.024951934814453, "global_step": 360350, "epoch": 4341} {"train_loss": -26.056623458862305, "global_step": 360351, "epoch": 4341} {"train_loss": -26.190860748291016, "global_step": 360352, "epoch": 4341} {"train_loss": -25.994770050048828, "global_step": 360353, "epoch": 4341} {"train_loss": -25.76481056213379, "global_step": 360354, "epoch": 4341} {"train_loss": -26.00945472717285, "global_step": 360355, "epoch": 4341} {"train_loss": -26.296051025390625, "global_step": 360356, "epoch": 4341} {"train_loss": -26.19110679626465, "global_step": 360357, "epoch": 4341} {"train_loss": -25.497533798217773, "global_step": 360358, "epoch": 4341} {"train_loss": -25.59438133239746, "global_step": 360359, "epoch": 4341} {"train_loss": -25.667236328125, "global_step": 360360, "epoch": 4341} {"train_loss": -26.088659286499023, "global_step": 360361, "epoch": 4341} {"train_loss": -25.974491119384766, "global_step": 360362, "epoch": 4341} {"train_loss": -25.988800048828125, "global_step": 360363, "epoch": 4341} {"train_loss": -26.502735137939453, "global_step": 360364, "epoch": 4341} {"train_loss": -25.95435905456543, "global_step": 360365, "epoch": 4341} {"train_loss": -26.334157943725586, "global_step": 360366, "epoch": 4341} {"train_loss": -26.06172752380371, "global_step": 360367, "epoch": 4341} {"train_loss": -26.394742965698242, "global_step": 360368, "epoch": 4341} {"train_loss": -26.170007705688477, "global_step": 360369, "epoch": 4341} {"train_loss": -26.48227882385254, "global_step": 360370, "epoch": 4341} {"train_loss": -26.100574493408203, "global_step": 360371, "epoch": 4341} {"train_loss": -25.833087921142578, "global_step": 360372, "epoch": 4341} {"train_loss": -26.49652671813965, "global_step": 360373, "epoch": 4341} {"train_loss": -26.0330753326416, "global_step": 360374, "epoch": 4341} {"train_loss": -25.96100425720215, "global_step": 360375, "epoch": 4341} {"train_loss": -26.361530303955078, "global_step": 360376, "epoch": 4341} {"train_loss": -26.206253051757812, "global_step": 360377, "epoch": 4341} {"train_loss": -26.2503604888916, "global_step": 360378, "epoch": 4341} {"train_loss": -26.3846492767334, "global_step": 360379, "epoch": 4341} {"train_loss": -26.333404541015625, "global_step": 360380, "epoch": 4341} {"train_loss": -26.281681060791016, "global_step": 360381, "epoch": 4341} {"train_loss": -26.379318237304688, "global_step": 360382, "epoch": 4341} {"train_loss": -26.14971923828125, "global_step": 360383, "epoch": 4341} {"train_loss": -26.53179359436035, "global_step": 360384, "epoch": 4341} {"train_loss": -26.176489289984644, "global_step": 360385, "epoch": 4341, "val_loss": 6634696.0} {"train_loss": -25.543079376220703, "global_step": 360386, "epoch": 4342} {"train_loss": -26.007190704345703, "global_step": 360387, "epoch": 4342} {"train_loss": -25.996557235717773, "global_step": 360388, "epoch": 4342} {"train_loss": -26.002042770385742, "global_step": 360389, "epoch": 4342} {"train_loss": -25.748870849609375, "global_step": 360390, "epoch": 4342} {"train_loss": -25.89472007751465, "global_step": 360391, "epoch": 4342} {"train_loss": -26.087844848632812, "global_step": 360392, "epoch": 4342} {"train_loss": -25.53435707092285, "global_step": 360393, "epoch": 4342} {"train_loss": -25.144712448120117, "global_step": 360394, "epoch": 4342} {"train_loss": -25.869359970092773, "global_step": 360395, "epoch": 4342} {"train_loss": -26.32758140563965, "global_step": 360396, "epoch": 4342} {"train_loss": -25.578655242919922, "global_step": 360397, "epoch": 4342} {"train_loss": -26.303924560546875, "global_step": 360398, "epoch": 4342} {"train_loss": -26.1578311920166, "global_step": 360399, "epoch": 4342} {"train_loss": -26.388324737548828, "global_step": 360400, "epoch": 4342} {"train_loss": -26.233610153198242, "global_step": 360401, "epoch": 4342} {"train_loss": -25.865636825561523, "global_step": 360402, "epoch": 4342} {"train_loss": -25.989835739135742, "global_step": 360403, "epoch": 4342} {"train_loss": -26.25775146484375, "global_step": 360404, "epoch": 4342} {"train_loss": -26.5314998626709, "global_step": 360405, "epoch": 4342} {"train_loss": -26.233640670776367, "global_step": 360406, "epoch": 4342} {"train_loss": -26.13091468811035, "global_step": 360407, "epoch": 4342} {"train_loss": -26.36090087890625, "global_step": 360408, "epoch": 4342} {"train_loss": -26.3017578125, "global_step": 360409, "epoch": 4342} {"train_loss": -26.431989669799805, "global_step": 360410, "epoch": 4342} {"train_loss": -26.289098739624023, "global_step": 360411, "epoch": 4342} {"train_loss": -25.929738998413086, "global_step": 360412, "epoch": 4342} {"train_loss": -26.738019943237305, "global_step": 360413, "epoch": 4342} {"train_loss": -26.26239013671875, "global_step": 360414, "epoch": 4342} {"train_loss": -26.2160587310791, "global_step": 360415, "epoch": 4342} {"train_loss": -26.49690818786621, "global_step": 360416, "epoch": 4342} {"train_loss": -26.4514102935791, "global_step": 360417, "epoch": 4342} {"train_loss": -26.278705596923828, "global_step": 360418, "epoch": 4342} {"train_loss": -26.52628517150879, "global_step": 360419, "epoch": 4342} {"train_loss": -26.17255973815918, "global_step": 360420, "epoch": 4342} {"train_loss": -26.597000122070312, "global_step": 360421, "epoch": 4342} {"train_loss": -26.507150650024414, "global_step": 360422, "epoch": 4342} {"train_loss": -26.533979415893555, "global_step": 360423, "epoch": 4342} {"train_loss": -26.4383544921875, "global_step": 360424, "epoch": 4342} {"train_loss": -26.565845489501953, "global_step": 360425, "epoch": 4342} {"train_loss": -26.293354034423828, "global_step": 360426, "epoch": 4342} {"train_loss": -26.370019912719727, "global_step": 360427, "epoch": 4342} {"train_loss": -26.546289443969727, "global_step": 360428, "epoch": 4342} {"train_loss": -26.521530151367188, "global_step": 360429, "epoch": 4342} {"train_loss": -26.44233512878418, "global_step": 360430, "epoch": 4342} {"train_loss": -26.379714965820312, "global_step": 360431, "epoch": 4342} {"train_loss": -26.073577880859375, "global_step": 360432, "epoch": 4342} {"train_loss": -26.12464714050293, "global_step": 360433, "epoch": 4342} {"train_loss": -25.7069091796875, "global_step": 360434, "epoch": 4342} {"train_loss": -26.224292755126953, "global_step": 360435, "epoch": 4342} {"train_loss": -26.063627243041992, "global_step": 360436, "epoch": 4342} {"train_loss": -26.482166290283203, "global_step": 360437, "epoch": 4342} {"train_loss": -26.19476890563965, "global_step": 360438, "epoch": 4342} {"train_loss": -25.857770919799805, "global_step": 360439, "epoch": 4342} {"train_loss": -26.13651466369629, "global_step": 360440, "epoch": 4342} {"train_loss": -26.168659210205078, "global_step": 360441, "epoch": 4342} {"train_loss": -26.26588249206543, "global_step": 360442, "epoch": 4342} {"train_loss": -26.31890869140625, "global_step": 360443, "epoch": 4342} {"train_loss": -26.13777732849121, "global_step": 360444, "epoch": 4342} {"train_loss": -26.09722328186035, "global_step": 360445, "epoch": 4342} {"train_loss": -26.49567985534668, "global_step": 360446, "epoch": 4342} {"train_loss": -26.212085723876953, "global_step": 360447, "epoch": 4342} {"train_loss": -26.12466812133789, "global_step": 360448, "epoch": 4342} {"train_loss": -26.117563247680664, "global_step": 360449, "epoch": 4342} {"train_loss": -25.829980850219727, "global_step": 360450, "epoch": 4342} {"train_loss": -26.132083892822266, "global_step": 360451, "epoch": 4342} {"train_loss": -26.209003448486328, "global_step": 360452, "epoch": 4342} {"train_loss": -26.458276748657227, "global_step": 360453, "epoch": 4342} {"train_loss": -26.430036544799805, "global_step": 360454, "epoch": 4342} {"train_loss": -26.18439292907715, "global_step": 360455, "epoch": 4342} {"train_loss": -26.0313720703125, "global_step": 360456, "epoch": 4342} {"train_loss": -26.306350708007812, "global_step": 360457, "epoch": 4342} {"train_loss": -26.691125869750977, "global_step": 360458, "epoch": 4342} {"train_loss": -26.271753311157227, "global_step": 360459, "epoch": 4342} {"train_loss": -25.96000099182129, "global_step": 360460, "epoch": 4342} {"train_loss": -26.40131187438965, "global_step": 360461, "epoch": 4342} {"train_loss": -26.125091552734375, "global_step": 360462, "epoch": 4342} {"train_loss": -26.633014678955078, "global_step": 360463, "epoch": 4342} {"train_loss": -26.868289947509766, "global_step": 360464, "epoch": 4342} {"train_loss": -26.529403686523438, "global_step": 360465, "epoch": 4342} {"train_loss": -26.345077514648438, "global_step": 360466, "epoch": 4342} {"train_loss": -26.227340698242188, "global_step": 360467, "epoch": 4342} {"train_loss": -26.232444142720784, "global_step": 360468, "epoch": 4342, "val_loss": 6616919.0} {"train_loss": -25.468013763427734, "global_step": 360469, "epoch": 4343} {"train_loss": -25.294660568237305, "global_step": 360470, "epoch": 4343} {"train_loss": -25.6003475189209, "global_step": 360471, "epoch": 4343} {"train_loss": -25.3652400970459, "global_step": 360472, "epoch": 4343} {"train_loss": -26.067569732666016, "global_step": 360473, "epoch": 4343} {"train_loss": -26.0620059967041, "global_step": 360474, "epoch": 4343} {"train_loss": -25.661169052124023, "global_step": 360475, "epoch": 4343} {"train_loss": -25.22784423828125, "global_step": 360476, "epoch": 4343} {"train_loss": -25.520278930664062, "global_step": 360477, "epoch": 4343} {"train_loss": -26.206830978393555, "global_step": 360478, "epoch": 4343} {"train_loss": -25.754623413085938, "global_step": 360479, "epoch": 4343} {"train_loss": -26.1209716796875, "global_step": 360480, "epoch": 4343} {"train_loss": -26.08290672302246, "global_step": 360481, "epoch": 4343} {"train_loss": -25.605976104736328, "global_step": 360482, "epoch": 4343} {"train_loss": -25.954721450805664, "global_step": 360483, "epoch": 4343} {"train_loss": -26.331830978393555, "global_step": 360484, "epoch": 4343} {"train_loss": -26.379316329956055, "global_step": 360485, "epoch": 4343} {"train_loss": -25.99100685119629, "global_step": 360486, "epoch": 4343} {"train_loss": -26.35542869567871, "global_step": 360487, "epoch": 4343} {"train_loss": -26.048791885375977, "global_step": 360488, "epoch": 4343} {"train_loss": -25.86476707458496, "global_step": 360489, "epoch": 4343} {"train_loss": -26.117938995361328, "global_step": 360490, "epoch": 4343} {"train_loss": -26.13933753967285, "global_step": 360491, "epoch": 4343} {"train_loss": -25.747961044311523, "global_step": 360492, "epoch": 4343} {"train_loss": -26.234695434570312, "global_step": 360493, "epoch": 4343} {"train_loss": -25.839038848876953, "global_step": 360494, "epoch": 4343} {"train_loss": -26.35989761352539, "global_step": 360495, "epoch": 4343} {"train_loss": -25.987516403198242, "global_step": 360496, "epoch": 4343} {"train_loss": -25.89508628845215, "global_step": 360497, "epoch": 4343} {"train_loss": -26.2659854888916, "global_step": 360498, "epoch": 4343} {"train_loss": -26.53315544128418, "global_step": 360499, "epoch": 4343} {"train_loss": -26.19707679748535, "global_step": 360500, "epoch": 4343} {"train_loss": -26.3765811920166, "global_step": 360501, "epoch": 4343} {"train_loss": -26.132659912109375, "global_step": 360502, "epoch": 4343} {"train_loss": -26.100757598876953, "global_step": 360503, "epoch": 4343} {"train_loss": -26.4244327545166, "global_step": 360504, "epoch": 4343} {"train_loss": -26.385522842407227, "global_step": 360505, "epoch": 4343} {"train_loss": -26.460325241088867, "global_step": 360506, "epoch": 4343} {"train_loss": -26.210468292236328, "global_step": 360507, "epoch": 4343} {"train_loss": -26.11386489868164, "global_step": 360508, "epoch": 4343} {"train_loss": -26.170124053955078, "global_step": 360509, "epoch": 4343} {"train_loss": -25.92890739440918, "global_step": 360510, "epoch": 4343} {"train_loss": -26.257892608642578, "global_step": 360511, "epoch": 4343} {"train_loss": -26.134479522705078, "global_step": 360512, "epoch": 4343} {"train_loss": -26.517805099487305, "global_step": 360513, "epoch": 4343} {"train_loss": -26.42872428894043, "global_step": 360514, "epoch": 4343} {"train_loss": -26.478734970092773, "global_step": 360515, "epoch": 4343} {"train_loss": -26.12177848815918, "global_step": 360516, "epoch": 4343} {"train_loss": -26.226293563842773, "global_step": 360517, "epoch": 4343} {"train_loss": -25.98293113708496, "global_step": 360518, "epoch": 4343} {"train_loss": -26.15534782409668, "global_step": 360519, "epoch": 4343} {"train_loss": -26.205799102783203, "global_step": 360520, "epoch": 4343} {"train_loss": -26.186553955078125, "global_step": 360521, "epoch": 4343} {"train_loss": -25.996030807495117, "global_step": 360522, "epoch": 4343} {"train_loss": -26.399921417236328, "global_step": 360523, "epoch": 4343} {"train_loss": -26.327850341796875, "global_step": 360524, "epoch": 4343} {"train_loss": -26.04768180847168, "global_step": 360525, "epoch": 4343} {"train_loss": -25.90388298034668, "global_step": 360526, "epoch": 4343} {"train_loss": -26.571136474609375, "global_step": 360527, "epoch": 4343} {"train_loss": -26.231739044189453, "global_step": 360528, "epoch": 4343} {"train_loss": -26.301172256469727, "global_step": 360529, "epoch": 4343} {"train_loss": -26.003026962280273, "global_step": 360530, "epoch": 4343} {"train_loss": -26.230789184570312, "global_step": 360531, "epoch": 4343} {"train_loss": -26.114063262939453, "global_step": 360532, "epoch": 4343} {"train_loss": -26.237756729125977, "global_step": 360533, "epoch": 4343} {"train_loss": -26.641132354736328, "global_step": 360534, "epoch": 4343} {"train_loss": -26.305908203125, "global_step": 360535, "epoch": 4343} {"train_loss": -26.253583908081055, "global_step": 360536, "epoch": 4343} {"train_loss": -26.41643714904785, "global_step": 360537, "epoch": 4343} {"train_loss": -26.4754695892334, "global_step": 360538, "epoch": 4343} {"train_loss": -26.428909301757812, "global_step": 360539, "epoch": 4343} {"train_loss": -26.45475196838379, "global_step": 360540, "epoch": 4343} {"train_loss": -26.42120933532715, "global_step": 360541, "epoch": 4343} {"train_loss": -26.26304054260254, "global_step": 360542, "epoch": 4343} {"train_loss": -26.4739933013916, "global_step": 360543, "epoch": 4343} {"train_loss": -26.4196720123291, "global_step": 360544, "epoch": 4343} {"train_loss": -26.37513542175293, "global_step": 360545, "epoch": 4343} {"train_loss": -26.433008193969727, "global_step": 360546, "epoch": 4343} {"train_loss": -26.78462791442871, "global_step": 360547, "epoch": 4343} {"train_loss": -26.061100006103516, "global_step": 360548, "epoch": 4343} {"train_loss": -26.426483154296875, "global_step": 360549, "epoch": 4343} {"train_loss": -26.547513961791992, "global_step": 360550, "epoch": 4343} {"train_loss": -26.16272763171828, "global_step": 360551, "epoch": 4343, "val_loss": 6655292.5} {"train_loss": -26.10389518737793, "global_step": 360552, "epoch": 4344} {"train_loss": -25.96283531188965, "global_step": 360553, "epoch": 4344} {"train_loss": -26.138540267944336, "global_step": 360554, "epoch": 4344} {"train_loss": -26.327600479125977, "global_step": 360555, "epoch": 4344} {"train_loss": -25.570470809936523, "global_step": 360556, "epoch": 4344} {"train_loss": -26.165206909179688, "global_step": 360557, "epoch": 4344} {"train_loss": -25.952245712280273, "global_step": 360558, "epoch": 4344} {"train_loss": -25.9055118560791, "global_step": 360559, "epoch": 4344} {"train_loss": -25.915014266967773, "global_step": 360560, "epoch": 4344} {"train_loss": -26.16916275024414, "global_step": 360561, "epoch": 4344} {"train_loss": -25.720703125, "global_step": 360562, "epoch": 4344} {"train_loss": -25.851755142211914, "global_step": 360563, "epoch": 4344} {"train_loss": -26.31367301940918, "global_step": 360564, "epoch": 4344} {"train_loss": -25.599328994750977, "global_step": 360565, "epoch": 4344} {"train_loss": -25.808734893798828, "global_step": 360566, "epoch": 4344} {"train_loss": -26.37286376953125, "global_step": 360567, "epoch": 4344} {"train_loss": -26.2293758392334, "global_step": 360568, "epoch": 4344} {"train_loss": -26.01934814453125, "global_step": 360569, "epoch": 4344} {"train_loss": -26.281641006469727, "global_step": 360570, "epoch": 4344} {"train_loss": -26.282550811767578, "global_step": 360571, "epoch": 4344} {"train_loss": -26.128772735595703, "global_step": 360572, "epoch": 4344} {"train_loss": -26.291614532470703, "global_step": 360573, "epoch": 4344} {"train_loss": -26.167001724243164, "global_step": 360574, "epoch": 4344} {"train_loss": -26.40064811706543, "global_step": 360575, "epoch": 4344} {"train_loss": -25.78775978088379, "global_step": 360576, "epoch": 4344} {"train_loss": -26.332387924194336, "global_step": 360577, "epoch": 4344} {"train_loss": -26.15640640258789, "global_step": 360578, "epoch": 4344} {"train_loss": -26.053152084350586, "global_step": 360579, "epoch": 4344} {"train_loss": -26.291967391967773, "global_step": 360580, "epoch": 4344} {"train_loss": -26.341012954711914, "global_step": 360581, "epoch": 4344} {"train_loss": -26.4876766204834, "global_step": 360582, "epoch": 4344} {"train_loss": -26.276325225830078, "global_step": 360583, "epoch": 4344} {"train_loss": -26.631879806518555, "global_step": 360584, "epoch": 4344} {"train_loss": -26.34262466430664, "global_step": 360585, "epoch": 4344} {"train_loss": -26.423437118530273, "global_step": 360586, "epoch": 4344} {"train_loss": -26.310302734375, "global_step": 360587, "epoch": 4344} {"train_loss": -26.082294464111328, "global_step": 360588, "epoch": 4344} {"train_loss": -26.644428253173828, "global_step": 360589, "epoch": 4344} {"train_loss": -26.21551513671875, "global_step": 360590, "epoch": 4344} {"train_loss": -26.294498443603516, "global_step": 360591, "epoch": 4344} {"train_loss": -26.369516372680664, "global_step": 360592, "epoch": 4344} {"train_loss": -26.18501091003418, "global_step": 360593, "epoch": 4344} {"train_loss": -26.604761123657227, "global_step": 360594, "epoch": 4344} {"train_loss": -26.292346954345703, "global_step": 360595, "epoch": 4344} {"train_loss": -26.443634033203125, "global_step": 360596, "epoch": 4344} {"train_loss": -26.102705001831055, "global_step": 360597, "epoch": 4344} {"train_loss": -26.34712791442871, "global_step": 360598, "epoch": 4344} {"train_loss": -26.342859268188477, "global_step": 360599, "epoch": 4344} {"train_loss": -26.171483993530273, "global_step": 360600, "epoch": 4344} {"train_loss": -26.46099281311035, "global_step": 360601, "epoch": 4344} {"train_loss": -25.97220802307129, "global_step": 360602, "epoch": 4344} {"train_loss": -26.139163970947266, "global_step": 360603, "epoch": 4344} {"train_loss": -26.4619140625, "global_step": 360604, "epoch": 4344} {"train_loss": -26.357620239257812, "global_step": 360605, "epoch": 4344} {"train_loss": -26.586334228515625, "global_step": 360606, "epoch": 4344} {"train_loss": -26.243427276611328, "global_step": 360607, "epoch": 4344} {"train_loss": -25.69147300720215, "global_step": 360608, "epoch": 4344} {"train_loss": -26.433359146118164, "global_step": 360609, "epoch": 4344} {"train_loss": -26.045637130737305, "global_step": 360610, "epoch": 4344} {"train_loss": -26.205102920532227, "global_step": 360611, "epoch": 4344} {"train_loss": -25.95753288269043, "global_step": 360612, "epoch": 4344} {"train_loss": -26.469839096069336, "global_step": 360613, "epoch": 4344} {"train_loss": -26.1710205078125, "global_step": 360614, "epoch": 4344} {"train_loss": -26.143756866455078, "global_step": 360615, "epoch": 4344} {"train_loss": -25.905414581298828, "global_step": 360616, "epoch": 4344} {"train_loss": -26.23072624206543, "global_step": 360617, "epoch": 4344} {"train_loss": -25.830997467041016, "global_step": 360618, "epoch": 4344} {"train_loss": -26.068384170532227, "global_step": 360619, "epoch": 4344} {"train_loss": -26.318470001220703, "global_step": 360620, "epoch": 4344} {"train_loss": -26.34912109375, "global_step": 360621, "epoch": 4344} {"train_loss": -25.7448787689209, "global_step": 360622, "epoch": 4344} {"train_loss": -25.39204978942871, "global_step": 360623, "epoch": 4344} {"train_loss": -25.233623504638672, "global_step": 360624, "epoch": 4344} {"train_loss": -25.744482040405273, "global_step": 360625, "epoch": 4344} {"train_loss": -25.93427848815918, "global_step": 360626, "epoch": 4344} {"train_loss": -26.027639389038086, "global_step": 360627, "epoch": 4344} {"train_loss": -25.832284927368164, "global_step": 360628, "epoch": 4344} {"train_loss": -25.704681396484375, "global_step": 360629, "epoch": 4344} {"train_loss": -25.827289581298828, "global_step": 360630, "epoch": 4344} {"train_loss": -26.208240509033203, "global_step": 360631, "epoch": 4344} {"train_loss": -26.507781982421875, "global_step": 360632, "epoch": 4344} {"train_loss": -26.222244262695312, "global_step": 360633, "epoch": 4344} {"train_loss": -26.144224672432404, "global_step": 360634, "epoch": 4344, "val_loss": 6650585.0} {"train_loss": -25.641876220703125, "global_step": 360635, "epoch": 4345} {"train_loss": -25.53321075439453, "global_step": 360636, "epoch": 4345} {"train_loss": -26.051008224487305, "global_step": 360637, "epoch": 4345} {"train_loss": -25.89044189453125, "global_step": 360638, "epoch": 4345} {"train_loss": -26.158832550048828, "global_step": 360639, "epoch": 4345} {"train_loss": -25.95209312438965, "global_step": 360640, "epoch": 4345} {"train_loss": -25.81805992126465, "global_step": 360641, "epoch": 4345} {"train_loss": -26.535181045532227, "global_step": 360642, "epoch": 4345} {"train_loss": -26.00140953063965, "global_step": 360643, "epoch": 4345} {"train_loss": -25.5338191986084, "global_step": 360644, "epoch": 4345} {"train_loss": -25.8289794921875, "global_step": 360645, "epoch": 4345} {"train_loss": -26.270856857299805, "global_step": 360646, "epoch": 4345} {"train_loss": -25.932281494140625, "global_step": 360647, "epoch": 4345} {"train_loss": -25.8369197845459, "global_step": 360648, "epoch": 4345} {"train_loss": -25.79770851135254, "global_step": 360649, "epoch": 4345} {"train_loss": -25.93299674987793, "global_step": 360650, "epoch": 4345} {"train_loss": -26.439191818237305, "global_step": 360651, "epoch": 4345} {"train_loss": -26.1259765625, "global_step": 360652, "epoch": 4345} {"train_loss": -25.88150405883789, "global_step": 360653, "epoch": 4345} {"train_loss": -25.935728073120117, "global_step": 360654, "epoch": 4345} {"train_loss": -26.364837646484375, "global_step": 360655, "epoch": 4345} {"train_loss": -26.12171745300293, "global_step": 360656, "epoch": 4345} {"train_loss": -26.1605281829834, "global_step": 360657, "epoch": 4345} {"train_loss": -26.4656925201416, "global_step": 360658, "epoch": 4345} {"train_loss": -26.303863525390625, "global_step": 360659, "epoch": 4345} {"train_loss": -26.012075424194336, "global_step": 360660, "epoch": 4345} {"train_loss": -26.581012725830078, "global_step": 360661, "epoch": 4345} {"train_loss": -26.18121337890625, "global_step": 360662, "epoch": 4345} {"train_loss": -26.52613639831543, "global_step": 360663, "epoch": 4345} {"train_loss": -26.078474044799805, "global_step": 360664, "epoch": 4345} {"train_loss": -26.498676300048828, "global_step": 360665, "epoch": 4345} {"train_loss": -26.512802124023438, "global_step": 360666, "epoch": 4345} {"train_loss": -26.414548873901367, "global_step": 360667, "epoch": 4345} {"train_loss": -26.56928825378418, "global_step": 360668, "epoch": 4345} {"train_loss": -26.216419219970703, "global_step": 360669, "epoch": 4345} {"train_loss": -26.461278915405273, "global_step": 360670, "epoch": 4345} {"train_loss": -26.402286529541016, "global_step": 360671, "epoch": 4345} {"train_loss": -26.414886474609375, "global_step": 360672, "epoch": 4345} {"train_loss": -26.21152687072754, "global_step": 360673, "epoch": 4345} {"train_loss": -26.2155704498291, "global_step": 360674, "epoch": 4345} {"train_loss": -26.604736328125, "global_step": 360675, "epoch": 4345} {"train_loss": -26.458175659179688, "global_step": 360676, "epoch": 4345} {"train_loss": -26.3664608001709, "global_step": 360677, "epoch": 4345} {"train_loss": -26.1468505859375, "global_step": 360678, "epoch": 4345} {"train_loss": -26.3500919342041, "global_step": 360679, "epoch": 4345} {"train_loss": -26.67048454284668, "global_step": 360680, "epoch": 4345} {"train_loss": -26.387943267822266, "global_step": 360681, "epoch": 4345} {"train_loss": -26.5645694732666, "global_step": 360682, "epoch": 4345} {"train_loss": -26.676685333251953, "global_step": 360683, "epoch": 4345} {"train_loss": -26.348968505859375, "global_step": 360684, "epoch": 4345} {"train_loss": -26.542804718017578, "global_step": 360685, "epoch": 4345} {"train_loss": -26.3792667388916, "global_step": 360686, "epoch": 4345} {"train_loss": -26.32783317565918, "global_step": 360687, "epoch": 4345} {"train_loss": -26.00003433227539, "global_step": 360688, "epoch": 4345} {"train_loss": -25.90814208984375, "global_step": 360689, "epoch": 4345} {"train_loss": -25.500200271606445, "global_step": 360690, "epoch": 4345} {"train_loss": -24.884368896484375, "global_step": 360691, "epoch": 4345} {"train_loss": -24.141420364379883, "global_step": 360692, "epoch": 4345} {"train_loss": -25.002456665039062, "global_step": 360693, "epoch": 4345} {"train_loss": -25.923603057861328, "global_step": 360694, "epoch": 4345} {"train_loss": -24.670019149780273, "global_step": 360695, "epoch": 4345} {"train_loss": -25.519861221313477, "global_step": 360696, "epoch": 4345} {"train_loss": -25.639556884765625, "global_step": 360697, "epoch": 4345} {"train_loss": -26.10230827331543, "global_step": 360698, "epoch": 4345} {"train_loss": -25.7696590423584, "global_step": 360699, "epoch": 4345} {"train_loss": -25.894123077392578, "global_step": 360700, "epoch": 4345} {"train_loss": -25.960988998413086, "global_step": 360701, "epoch": 4345} {"train_loss": -25.98273277282715, "global_step": 360702, "epoch": 4345} {"train_loss": -26.006677627563477, "global_step": 360703, "epoch": 4345} {"train_loss": -25.734235763549805, "global_step": 360704, "epoch": 4345} {"train_loss": -25.98370361328125, "global_step": 360705, "epoch": 4345} {"train_loss": -25.862218856811523, "global_step": 360706, "epoch": 4345} {"train_loss": -26.662012100219727, "global_step": 360707, "epoch": 4345} {"train_loss": -26.6252498626709, "global_step": 360708, "epoch": 4345} {"train_loss": -25.903762817382812, "global_step": 360709, "epoch": 4345} {"train_loss": -26.133039474487305, "global_step": 360710, "epoch": 4345} {"train_loss": -25.79787254333496, "global_step": 360711, "epoch": 4345} {"train_loss": -25.75411033630371, "global_step": 360712, "epoch": 4345} {"train_loss": -26.052087783813477, "global_step": 360713, "epoch": 4345} {"train_loss": -26.447757720947266, "global_step": 360714, "epoch": 4345} {"train_loss": -25.958948135375977, "global_step": 360715, "epoch": 4345} {"train_loss": -26.301313400268555, "global_step": 360716, "epoch": 4345} {"train_loss": -26.076908571174346, "global_step": 360717, "epoch": 4345, "val_loss": 6618201.5} {"train_loss": -25.7216739654541, "global_step": 360718, "epoch": 4346} {"train_loss": -26.109479904174805, "global_step": 360719, "epoch": 4346} {"train_loss": -25.35453987121582, "global_step": 360720, "epoch": 4346} {"train_loss": -26.066757202148438, "global_step": 360721, "epoch": 4346} {"train_loss": -25.608869552612305, "global_step": 360722, "epoch": 4346} {"train_loss": -25.384244918823242, "global_step": 360723, "epoch": 4346} {"train_loss": -25.908599853515625, "global_step": 360724, "epoch": 4346} {"train_loss": -25.9185733795166, "global_step": 360725, "epoch": 4346} {"train_loss": -25.951007843017578, "global_step": 360726, "epoch": 4346} {"train_loss": -25.90250015258789, "global_step": 360727, "epoch": 4346} {"train_loss": -26.070144653320312, "global_step": 360728, "epoch": 4346} {"train_loss": -25.74078941345215, "global_step": 360729, "epoch": 4346} {"train_loss": -26.228673934936523, "global_step": 360730, "epoch": 4346} {"train_loss": -26.275171279907227, "global_step": 360731, "epoch": 4346} {"train_loss": -25.887821197509766, "global_step": 360732, "epoch": 4346} {"train_loss": -26.158618927001953, "global_step": 360733, "epoch": 4346} {"train_loss": -25.713056564331055, "global_step": 360734, "epoch": 4346} {"train_loss": -26.464282989501953, "global_step": 360735, "epoch": 4346} {"train_loss": -26.244409561157227, "global_step": 360736, "epoch": 4346} {"train_loss": -26.44239616394043, "global_step": 360737, "epoch": 4346} {"train_loss": -25.880598068237305, "global_step": 360738, "epoch": 4346} {"train_loss": -25.9207763671875, "global_step": 360739, "epoch": 4346} {"train_loss": -25.955480575561523, "global_step": 360740, "epoch": 4346} {"train_loss": -26.317075729370117, "global_step": 360741, "epoch": 4346} {"train_loss": -25.80438232421875, "global_step": 360742, "epoch": 4346} {"train_loss": -25.97535514831543, "global_step": 360743, "epoch": 4346} {"train_loss": -26.247882843017578, "global_step": 360744, "epoch": 4346} {"train_loss": -26.075864791870117, "global_step": 360745, "epoch": 4346} {"train_loss": -26.696552276611328, "global_step": 360746, "epoch": 4346} {"train_loss": -26.064916610717773, "global_step": 360747, "epoch": 4346} {"train_loss": -25.994659423828125, "global_step": 360748, "epoch": 4346} {"train_loss": -26.003698348999023, "global_step": 360749, "epoch": 4346} {"train_loss": -26.408557891845703, "global_step": 360750, "epoch": 4346} {"train_loss": -26.42239761352539, "global_step": 360751, "epoch": 4346} {"train_loss": -26.19346046447754, "global_step": 360752, "epoch": 4346} {"train_loss": -26.375598907470703, "global_step": 360753, "epoch": 4346} {"train_loss": -26.376943588256836, "global_step": 360754, "epoch": 4346} {"train_loss": -26.553089141845703, "global_step": 360755, "epoch": 4346} {"train_loss": -26.449604034423828, "global_step": 360756, "epoch": 4346} {"train_loss": -26.09119987487793, "global_step": 360757, "epoch": 4346} {"train_loss": -26.414941787719727, "global_step": 360758, "epoch": 4346} {"train_loss": -26.6842041015625, "global_step": 360759, "epoch": 4346} {"train_loss": -26.42724609375, "global_step": 360760, "epoch": 4346} {"train_loss": -26.644580841064453, "global_step": 360761, "epoch": 4346} {"train_loss": -26.41730308532715, "global_step": 360762, "epoch": 4346} {"train_loss": -26.766925811767578, "global_step": 360763, "epoch": 4346} {"train_loss": -26.286334991455078, "global_step": 360764, "epoch": 4346} {"train_loss": -26.638532638549805, "global_step": 360765, "epoch": 4346} {"train_loss": -26.385284423828125, "global_step": 360766, "epoch": 4346} {"train_loss": -26.322254180908203, "global_step": 360767, "epoch": 4346} {"train_loss": -26.09242057800293, "global_step": 360768, "epoch": 4346} {"train_loss": -26.405851364135742, "global_step": 360769, "epoch": 4346} {"train_loss": -26.23883056640625, "global_step": 360770, "epoch": 4346} {"train_loss": -25.819787979125977, "global_step": 360771, "epoch": 4346} {"train_loss": -26.274463653564453, "global_step": 360772, "epoch": 4346} {"train_loss": -26.02311134338379, "global_step": 360773, "epoch": 4346} {"train_loss": -26.48793601989746, "global_step": 360774, "epoch": 4346} {"train_loss": -26.304922103881836, "global_step": 360775, "epoch": 4346} {"train_loss": -26.448333740234375, "global_step": 360776, "epoch": 4346} {"train_loss": -26.23798942565918, "global_step": 360777, "epoch": 4346} {"train_loss": -26.48828125, "global_step": 360778, "epoch": 4346} {"train_loss": -26.309438705444336, "global_step": 360779, "epoch": 4346} {"train_loss": -26.243642807006836, "global_step": 360780, "epoch": 4346} {"train_loss": -26.3843936920166, "global_step": 360781, "epoch": 4346} {"train_loss": -26.324085235595703, "global_step": 360782, "epoch": 4346} {"train_loss": -26.587387084960938, "global_step": 360783, "epoch": 4346} {"train_loss": -26.230283737182617, "global_step": 360784, "epoch": 4346} {"train_loss": -26.31049156188965, "global_step": 360785, "epoch": 4346} {"train_loss": -26.409204483032227, "global_step": 360786, "epoch": 4346} {"train_loss": -26.514240264892578, "global_step": 360787, "epoch": 4346} {"train_loss": -26.35646629333496, "global_step": 360788, "epoch": 4346} {"train_loss": -26.358030319213867, "global_step": 360789, "epoch": 4346} {"train_loss": -26.42388916015625, "global_step": 360790, "epoch": 4346} {"train_loss": -26.36018180847168, "global_step": 360791, "epoch": 4346} {"train_loss": -26.36797523498535, "global_step": 360792, "epoch": 4346} {"train_loss": -26.660703659057617, "global_step": 360793, "epoch": 4346} {"train_loss": -26.375898361206055, "global_step": 360794, "epoch": 4346} {"train_loss": -26.43658447265625, "global_step": 360795, "epoch": 4346} {"train_loss": -26.519046783447266, "global_step": 360796, "epoch": 4346} {"train_loss": -26.195068359375, "global_step": 360797, "epoch": 4346} {"train_loss": -26.2954044342041, "global_step": 360798, "epoch": 4346} {"train_loss": -26.298322677612305, "global_step": 360799, "epoch": 4346} {"train_loss": -26.239339460809546, "global_step": 360800, "epoch": 4346, "val_loss": 6576088.0} {"train_loss": -26.15327262878418, "global_step": 360801, "epoch": 4347} {"train_loss": -25.69854736328125, "global_step": 360802, "epoch": 4347} {"train_loss": -26.011178970336914, "global_step": 360803, "epoch": 4347} {"train_loss": -25.86029624938965, "global_step": 360804, "epoch": 4347} {"train_loss": -25.92401695251465, "global_step": 360805, "epoch": 4347} {"train_loss": -25.567285537719727, "global_step": 360806, "epoch": 4347} {"train_loss": -25.659772872924805, "global_step": 360807, "epoch": 4347} {"train_loss": -26.025360107421875, "global_step": 360808, "epoch": 4347} {"train_loss": -25.85993003845215, "global_step": 360809, "epoch": 4347} {"train_loss": -25.82337760925293, "global_step": 360810, "epoch": 4347} {"train_loss": -25.9477596282959, "global_step": 360811, "epoch": 4347} {"train_loss": -26.038818359375, "global_step": 360812, "epoch": 4347} {"train_loss": -25.939849853515625, "global_step": 360813, "epoch": 4347} {"train_loss": -25.573625564575195, "global_step": 360814, "epoch": 4347} {"train_loss": -26.012928009033203, "global_step": 360815, "epoch": 4347} {"train_loss": -26.333703994750977, "global_step": 360816, "epoch": 4347} {"train_loss": -25.99448013305664, "global_step": 360817, "epoch": 4347} {"train_loss": -26.194990158081055, "global_step": 360818, "epoch": 4347} {"train_loss": -26.171899795532227, "global_step": 360819, "epoch": 4347} {"train_loss": -25.984601974487305, "global_step": 360820, "epoch": 4347} {"train_loss": -25.918039321899414, "global_step": 360821, "epoch": 4347} {"train_loss": -26.192068099975586, "global_step": 360822, "epoch": 4347} {"train_loss": -26.130842208862305, "global_step": 360823, "epoch": 4347} {"train_loss": -26.0495548248291, "global_step": 360824, "epoch": 4347} {"train_loss": -26.307470321655273, "global_step": 360825, "epoch": 4347} {"train_loss": -26.218061447143555, "global_step": 360826, "epoch": 4347} {"train_loss": -26.10930824279785, "global_step": 360827, "epoch": 4347} {"train_loss": -26.402606964111328, "global_step": 360828, "epoch": 4347} {"train_loss": -26.302595138549805, "global_step": 360829, "epoch": 4347} {"train_loss": -26.51642417907715, "global_step": 360830, "epoch": 4347} {"train_loss": -26.622406005859375, "global_step": 360831, "epoch": 4347} {"train_loss": -26.175016403198242, "global_step": 360832, "epoch": 4347} {"train_loss": -26.11223793029785, "global_step": 360833, "epoch": 4347} {"train_loss": -26.3327579498291, "global_step": 360834, "epoch": 4347} {"train_loss": -26.627859115600586, "global_step": 360835, "epoch": 4347} {"train_loss": -26.521717071533203, "global_step": 360836, "epoch": 4347} {"train_loss": -26.507720947265625, "global_step": 360837, "epoch": 4347} {"train_loss": -26.15949821472168, "global_step": 360838, "epoch": 4347} {"train_loss": -26.548120498657227, "global_step": 360839, "epoch": 4347} {"train_loss": -26.31229591369629, "global_step": 360840, "epoch": 4347} {"train_loss": -26.37550163269043, "global_step": 360841, "epoch": 4347} {"train_loss": -26.097171783447266, "global_step": 360842, "epoch": 4347} {"train_loss": -26.1220645904541, "global_step": 360843, "epoch": 4347} {"train_loss": -26.253223419189453, "global_step": 360844, "epoch": 4347} {"train_loss": -26.5050048828125, "global_step": 360845, "epoch": 4347} {"train_loss": -26.3924503326416, "global_step": 360846, "epoch": 4347} {"train_loss": -25.88722038269043, "global_step": 360847, "epoch": 4347} {"train_loss": -26.560331344604492, "global_step": 360848, "epoch": 4347} {"train_loss": -26.386367797851562, "global_step": 360849, "epoch": 4347} {"train_loss": -26.3446102142334, "global_step": 360850, "epoch": 4347} {"train_loss": -26.519941329956055, "global_step": 360851, "epoch": 4347} {"train_loss": -26.26651382446289, "global_step": 360852, "epoch": 4347} {"train_loss": -26.216480255126953, "global_step": 360853, "epoch": 4347} {"train_loss": -26.12504005432129, "global_step": 360854, "epoch": 4347} {"train_loss": -26.10430908203125, "global_step": 360855, "epoch": 4347} {"train_loss": -26.714004516601562, "global_step": 360856, "epoch": 4347} {"train_loss": -26.073022842407227, "global_step": 360857, "epoch": 4347} {"train_loss": -26.113962173461914, "global_step": 360858, "epoch": 4347} {"train_loss": -26.378950119018555, "global_step": 360859, "epoch": 4347} {"train_loss": -26.540632247924805, "global_step": 360860, "epoch": 4347} {"train_loss": -26.485136032104492, "global_step": 360861, "epoch": 4347} {"train_loss": -26.43926429748535, "global_step": 360862, "epoch": 4347} {"train_loss": -26.42083168029785, "global_step": 360863, "epoch": 4347} {"train_loss": -26.681610107421875, "global_step": 360864, "epoch": 4347} {"train_loss": -26.217405319213867, "global_step": 360865, "epoch": 4347} {"train_loss": -26.24637794494629, "global_step": 360866, "epoch": 4347} {"train_loss": -26.474365234375, "global_step": 360867, "epoch": 4347} {"train_loss": -26.327070236206055, "global_step": 360868, "epoch": 4347} {"train_loss": -26.266157150268555, "global_step": 360869, "epoch": 4347} {"train_loss": -26.173660278320312, "global_step": 360870, "epoch": 4347} {"train_loss": -26.4127197265625, "global_step": 360871, "epoch": 4347} {"train_loss": -25.946191787719727, "global_step": 360872, "epoch": 4347} {"train_loss": -25.7984619140625, "global_step": 360873, "epoch": 4347} {"train_loss": -25.920682907104492, "global_step": 360874, "epoch": 4347} {"train_loss": -25.85550308227539, "global_step": 360875, "epoch": 4347} {"train_loss": -26.0054988861084, "global_step": 360876, "epoch": 4347} {"train_loss": -26.456830978393555, "global_step": 360877, "epoch": 4347} {"train_loss": -26.393218994140625, "global_step": 360878, "epoch": 4347} {"train_loss": -25.9044132232666, "global_step": 360879, "epoch": 4347} {"train_loss": -26.33251953125, "global_step": 360880, "epoch": 4347} {"train_loss": -26.38788414001465, "global_step": 360881, "epoch": 4347} {"train_loss": -26.177770614624023, "global_step": 360882, "epoch": 4347} {"train_loss": -26.20461443246129, "global_step": 360883, "epoch": 4347, "val_loss": 6708836.0} {"train_loss": -26.1995849609375, "global_step": 360884, "epoch": 4348} {"train_loss": -25.77057456970215, "global_step": 360885, "epoch": 4348} {"train_loss": -25.84637451171875, "global_step": 360886, "epoch": 4348} {"train_loss": -25.51207733154297, "global_step": 360887, "epoch": 4348} {"train_loss": -25.8139705657959, "global_step": 360888, "epoch": 4348} {"train_loss": -25.87306022644043, "global_step": 360889, "epoch": 4348} {"train_loss": -25.944721221923828, "global_step": 360890, "epoch": 4348} {"train_loss": -25.799640655517578, "global_step": 360891, "epoch": 4348} {"train_loss": -25.780073165893555, "global_step": 360892, "epoch": 4348} {"train_loss": -26.1825008392334, "global_step": 360893, "epoch": 4348} {"train_loss": -25.973730087280273, "global_step": 360894, "epoch": 4348} {"train_loss": -25.5770206451416, "global_step": 360895, "epoch": 4348} {"train_loss": -26.03055763244629, "global_step": 360896, "epoch": 4348} {"train_loss": -25.83314323425293, "global_step": 360897, "epoch": 4348} {"train_loss": -26.118295669555664, "global_step": 360898, "epoch": 4348} {"train_loss": -26.110401153564453, "global_step": 360899, "epoch": 4348} {"train_loss": -26.331527709960938, "global_step": 360900, "epoch": 4348} {"train_loss": -25.9766788482666, "global_step": 360901, "epoch": 4348} {"train_loss": -26.16045570373535, "global_step": 360902, "epoch": 4348} {"train_loss": -25.885900497436523, "global_step": 360903, "epoch": 4348} {"train_loss": -26.277841567993164, "global_step": 360904, "epoch": 4348} {"train_loss": -26.193456649780273, "global_step": 360905, "epoch": 4348} {"train_loss": -26.287229537963867, "global_step": 360906, "epoch": 4348} {"train_loss": -26.45051383972168, "global_step": 360907, "epoch": 4348} {"train_loss": -26.230649948120117, "global_step": 360908, "epoch": 4348} {"train_loss": -25.96161460876465, "global_step": 360909, "epoch": 4348} {"train_loss": -26.5960693359375, "global_step": 360910, "epoch": 4348} {"train_loss": -26.452573776245117, "global_step": 360911, "epoch": 4348} {"train_loss": -26.481964111328125, "global_step": 360912, "epoch": 4348} {"train_loss": -26.492773056030273, "global_step": 360913, "epoch": 4348} {"train_loss": -26.408435821533203, "global_step": 360914, "epoch": 4348} {"train_loss": -26.15240478515625, "global_step": 360915, "epoch": 4348} {"train_loss": -26.10914421081543, "global_step": 360916, "epoch": 4348} {"train_loss": -26.32838249206543, "global_step": 360917, "epoch": 4348} {"train_loss": -25.95098876953125, "global_step": 360918, "epoch": 4348} {"train_loss": -26.315946578979492, "global_step": 360919, "epoch": 4348} {"train_loss": -26.466293334960938, "global_step": 360920, "epoch": 4348} {"train_loss": -26.26470947265625, "global_step": 360921, "epoch": 4348} {"train_loss": -25.621597290039062, "global_step": 360922, "epoch": 4348} {"train_loss": -25.556577682495117, "global_step": 360923, "epoch": 4348} {"train_loss": -25.99957847595215, "global_step": 360924, "epoch": 4348} {"train_loss": -25.91493034362793, "global_step": 360925, "epoch": 4348} {"train_loss": -26.50653648376465, "global_step": 360926, "epoch": 4348} {"train_loss": -25.80841636657715, "global_step": 360927, "epoch": 4348} {"train_loss": -25.57729721069336, "global_step": 360928, "epoch": 4348} {"train_loss": -25.963342666625977, "global_step": 360929, "epoch": 4348} {"train_loss": -26.40943717956543, "global_step": 360930, "epoch": 4348} {"train_loss": -26.077682495117188, "global_step": 360931, "epoch": 4348} {"train_loss": -25.943744659423828, "global_step": 360932, "epoch": 4348} {"train_loss": -25.898527145385742, "global_step": 360933, "epoch": 4348} {"train_loss": -26.00819206237793, "global_step": 360934, "epoch": 4348} {"train_loss": -26.181821823120117, "global_step": 360935, "epoch": 4348} {"train_loss": -26.309850692749023, "global_step": 360936, "epoch": 4348} {"train_loss": -25.726537704467773, "global_step": 360937, "epoch": 4348} {"train_loss": -25.91058349609375, "global_step": 360938, "epoch": 4348} {"train_loss": -26.2535457611084, "global_step": 360939, "epoch": 4348} {"train_loss": -25.83564567565918, "global_step": 360940, "epoch": 4348} {"train_loss": -25.83730125427246, "global_step": 360941, "epoch": 4348} {"train_loss": -25.622995376586914, "global_step": 360942, "epoch": 4348} {"train_loss": -26.200841903686523, "global_step": 360943, "epoch": 4348} {"train_loss": -25.834569931030273, "global_step": 360944, "epoch": 4348} {"train_loss": -26.29047203063965, "global_step": 360945, "epoch": 4348} {"train_loss": -26.214996337890625, "global_step": 360946, "epoch": 4348} {"train_loss": -25.944183349609375, "global_step": 360947, "epoch": 4348} {"train_loss": -26.217105865478516, "global_step": 360948, "epoch": 4348} {"train_loss": -26.444101333618164, "global_step": 360949, "epoch": 4348} {"train_loss": -26.42585563659668, "global_step": 360950, "epoch": 4348} {"train_loss": -25.595245361328125, "global_step": 360951, "epoch": 4348} {"train_loss": -26.241186141967773, "global_step": 360952, "epoch": 4348} {"train_loss": -26.042306900024414, "global_step": 360953, "epoch": 4348} {"train_loss": -26.373193740844727, "global_step": 360954, "epoch": 4348} {"train_loss": -26.316083908081055, "global_step": 360955, "epoch": 4348} {"train_loss": -26.261999130249023, "global_step": 360956, "epoch": 4348} {"train_loss": -26.436925888061523, "global_step": 360957, "epoch": 4348} {"train_loss": -26.209686279296875, "global_step": 360958, "epoch": 4348} {"train_loss": -26.459461212158203, "global_step": 360959, "epoch": 4348} {"train_loss": -26.73084831237793, "global_step": 360960, "epoch": 4348} {"train_loss": -26.179494857788086, "global_step": 360961, "epoch": 4348} {"train_loss": -26.421222686767578, "global_step": 360962, "epoch": 4348} {"train_loss": -26.1451416015625, "global_step": 360963, "epoch": 4348} {"train_loss": -26.32624626159668, "global_step": 360964, "epoch": 4348} {"train_loss": -26.231210708618164, "global_step": 360965, "epoch": 4348} {"train_loss": -26.121416965162897, "global_step": 360966, "epoch": 4348, "val_loss": 6606631.0} {"train_loss": -25.841388702392578, "global_step": 360967, "epoch": 4349} {"train_loss": -26.364782333374023, "global_step": 360968, "epoch": 4349} {"train_loss": -26.022008895874023, "global_step": 360969, "epoch": 4349} {"train_loss": -25.972776412963867, "global_step": 360970, "epoch": 4349} {"train_loss": -26.003009796142578, "global_step": 360971, "epoch": 4349} {"train_loss": -26.3471622467041, "global_step": 360972, "epoch": 4349} {"train_loss": -26.496337890625, "global_step": 360973, "epoch": 4349} {"train_loss": -26.265085220336914, "global_step": 360974, "epoch": 4349} {"train_loss": -26.014041900634766, "global_step": 360975, "epoch": 4349} {"train_loss": -26.09799575805664, "global_step": 360976, "epoch": 4349} {"train_loss": -25.8719425201416, "global_step": 360977, "epoch": 4349} {"train_loss": -26.065183639526367, "global_step": 360978, "epoch": 4349} {"train_loss": -26.294647216796875, "global_step": 360979, "epoch": 4349} {"train_loss": -26.125761032104492, "global_step": 360980, "epoch": 4349} {"train_loss": -25.8168888092041, "global_step": 360981, "epoch": 4349} {"train_loss": -25.902612686157227, "global_step": 360982, "epoch": 4349} {"train_loss": -25.861785888671875, "global_step": 360983, "epoch": 4349} {"train_loss": -25.590585708618164, "global_step": 360984, "epoch": 4349} {"train_loss": -26.366910934448242, "global_step": 360985, "epoch": 4349} {"train_loss": -26.036544799804688, "global_step": 360986, "epoch": 4349} {"train_loss": -26.283039093017578, "global_step": 360987, "epoch": 4349} {"train_loss": -26.02833366394043, "global_step": 360988, "epoch": 4349} {"train_loss": -26.095417022705078, "global_step": 360989, "epoch": 4349} {"train_loss": -25.632116317749023, "global_step": 360990, "epoch": 4349} {"train_loss": -25.826963424682617, "global_step": 360991, "epoch": 4349} {"train_loss": -25.783308029174805, "global_step": 360992, "epoch": 4349} {"train_loss": -26.281604766845703, "global_step": 360993, "epoch": 4349} {"train_loss": -26.2363338470459, "global_step": 360994, "epoch": 4349} {"train_loss": -25.694965362548828, "global_step": 360995, "epoch": 4349} {"train_loss": -26.200103759765625, "global_step": 360996, "epoch": 4349} {"train_loss": -25.940256118774414, "global_step": 360997, "epoch": 4349} {"train_loss": -26.163679122924805, "global_step": 360998, "epoch": 4349} {"train_loss": -26.209491729736328, "global_step": 360999, "epoch": 4349} {"train_loss": -26.299610137939453, "global_step": 361000, "epoch": 4349} {"train_loss": -25.981311798095703, "global_step": 361001, "epoch": 4349} {"train_loss": -26.785837173461914, "global_step": 361002, "epoch": 4349} {"train_loss": -25.95734977722168, "global_step": 361003, "epoch": 4349} {"train_loss": -26.15290641784668, "global_step": 361004, "epoch": 4349} {"train_loss": -26.273183822631836, "global_step": 361005, "epoch": 4349} {"train_loss": -25.9508056640625, "global_step": 361006, "epoch": 4349} {"train_loss": -26.379140853881836, "global_step": 361007, "epoch": 4349} {"train_loss": -26.258197784423828, "global_step": 361008, "epoch": 4349} {"train_loss": -26.375946044921875, "global_step": 361009, "epoch": 4349} {"train_loss": -26.29957389831543, "global_step": 361010, "epoch": 4349} {"train_loss": -26.096759796142578, "global_step": 361011, "epoch": 4349} {"train_loss": -26.060773849487305, "global_step": 361012, "epoch": 4349} {"train_loss": -25.923551559448242, "global_step": 361013, "epoch": 4349} {"train_loss": -26.345487594604492, "global_step": 361014, "epoch": 4349} {"train_loss": -26.171354293823242, "global_step": 361015, "epoch": 4349} {"train_loss": -26.247968673706055, "global_step": 361016, "epoch": 4349} {"train_loss": -26.112791061401367, "global_step": 361017, "epoch": 4349} {"train_loss": -26.2047061920166, "global_step": 361018, "epoch": 4349} {"train_loss": -26.138708114624023, "global_step": 361019, "epoch": 4349} {"train_loss": -26.02219009399414, "global_step": 361020, "epoch": 4349} {"train_loss": -26.427106857299805, "global_step": 361021, "epoch": 4349} {"train_loss": -26.691436767578125, "global_step": 361022, "epoch": 4349} {"train_loss": -26.168798446655273, "global_step": 361023, "epoch": 4349} {"train_loss": -26.56490135192871, "global_step": 361024, "epoch": 4349} {"train_loss": -26.456586837768555, "global_step": 361025, "epoch": 4349} {"train_loss": -26.459089279174805, "global_step": 361026, "epoch": 4349} {"train_loss": -26.515405654907227, "global_step": 361027, "epoch": 4349} {"train_loss": -26.358678817749023, "global_step": 361028, "epoch": 4349} {"train_loss": -26.28192710876465, "global_step": 361029, "epoch": 4349} {"train_loss": -26.1342830657959, "global_step": 361030, "epoch": 4349} {"train_loss": -26.732465744018555, "global_step": 361031, "epoch": 4349} {"train_loss": -25.859663009643555, "global_step": 361032, "epoch": 4349} {"train_loss": -26.24281120300293, "global_step": 361033, "epoch": 4349} {"train_loss": -26.014511108398438, "global_step": 361034, "epoch": 4349} {"train_loss": -26.447595596313477, "global_step": 361035, "epoch": 4349} {"train_loss": -26.424596786499023, "global_step": 361036, "epoch": 4349} {"train_loss": -26.1248722076416, "global_step": 361037, "epoch": 4349} {"train_loss": -26.353845596313477, "global_step": 361038, "epoch": 4349} {"train_loss": -26.55813980102539, "global_step": 361039, "epoch": 4349} {"train_loss": -26.369049072265625, "global_step": 361040, "epoch": 4349} {"train_loss": -25.98870849609375, "global_step": 361041, "epoch": 4349} {"train_loss": -26.518299102783203, "global_step": 361042, "epoch": 4349} {"train_loss": -26.3327579498291, "global_step": 361043, "epoch": 4349} {"train_loss": -26.313129425048828, "global_step": 361044, "epoch": 4349} {"train_loss": -26.34622573852539, "global_step": 361045, "epoch": 4349} {"train_loss": -26.24237060546875, "global_step": 361046, "epoch": 4349} {"train_loss": -26.458179473876953, "global_step": 361047, "epoch": 4349} {"train_loss": -25.99421501159668, "global_step": 361048, "epoch": 4349} {"train_loss": -26.182905909526777, "global_step": 361049, "epoch": 4349, "val_loss": 6593852.0} {"train_loss": -25.95248794555664, "global_step": 361050, "epoch": 4350} {"train_loss": -25.707563400268555, "global_step": 361051, "epoch": 4350} {"train_loss": -26.07809829711914, "global_step": 361052, "epoch": 4350} {"train_loss": -26.21124839782715, "global_step": 361053, "epoch": 4350} {"train_loss": -26.043020248413086, "global_step": 361054, "epoch": 4350} {"train_loss": -25.923816680908203, "global_step": 361055, "epoch": 4350} {"train_loss": -26.114038467407227, "global_step": 361056, "epoch": 4350} {"train_loss": -25.8721923828125, "global_step": 361057, "epoch": 4350} {"train_loss": -25.906036376953125, "global_step": 361058, "epoch": 4350} {"train_loss": -26.109710693359375, "global_step": 361059, "epoch": 4350} {"train_loss": -26.017202377319336, "global_step": 361060, "epoch": 4350} {"train_loss": -25.900775909423828, "global_step": 361061, "epoch": 4350} {"train_loss": -26.223651885986328, "global_step": 361062, "epoch": 4350} {"train_loss": -25.902612686157227, "global_step": 361063, "epoch": 4350} {"train_loss": -26.320758819580078, "global_step": 361064, "epoch": 4350} {"train_loss": -25.993091583251953, "global_step": 361065, "epoch": 4350} {"train_loss": -26.0028076171875, "global_step": 361066, "epoch": 4350} {"train_loss": -26.244476318359375, "global_step": 361067, "epoch": 4350} {"train_loss": -26.310516357421875, "global_step": 361068, "epoch": 4350} {"train_loss": -26.054040908813477, "global_step": 361069, "epoch": 4350} {"train_loss": -26.652088165283203, "global_step": 361070, "epoch": 4350} {"train_loss": -25.835180282592773, "global_step": 361071, "epoch": 4350} {"train_loss": -25.97523307800293, "global_step": 361072, "epoch": 4350} {"train_loss": -26.21527099609375, "global_step": 361073, "epoch": 4350} {"train_loss": -26.385456085205078, "global_step": 361074, "epoch": 4350} {"train_loss": -26.307941436767578, "global_step": 361075, "epoch": 4350} {"train_loss": -26.535192489624023, "global_step": 361076, "epoch": 4350} {"train_loss": -26.41743278503418, "global_step": 361077, "epoch": 4350} {"train_loss": -26.549396514892578, "global_step": 361078, "epoch": 4350} {"train_loss": -26.453338623046875, "global_step": 361079, "epoch": 4350} {"train_loss": -26.546300888061523, "global_step": 361080, "epoch": 4350} {"train_loss": -26.15771484375, "global_step": 361081, "epoch": 4350} {"train_loss": -26.503149032592773, "global_step": 361082, "epoch": 4350} {"train_loss": -26.549137115478516, "global_step": 361083, "epoch": 4350} {"train_loss": -26.052997589111328, "global_step": 361084, "epoch": 4350} {"train_loss": -25.911392211914062, "global_step": 361085, "epoch": 4350} {"train_loss": -26.667455673217773, "global_step": 361086, "epoch": 4350} {"train_loss": -25.815500259399414, "global_step": 361087, "epoch": 4350} {"train_loss": -26.127685546875, "global_step": 361088, "epoch": 4350} {"train_loss": -25.516395568847656, "global_step": 361089, "epoch": 4350} {"train_loss": -25.9267520904541, "global_step": 361090, "epoch": 4350} {"train_loss": -26.41985511779785, "global_step": 361091, "epoch": 4350} {"train_loss": -25.833398818969727, "global_step": 361092, "epoch": 4350} {"train_loss": -25.927753448486328, "global_step": 361093, "epoch": 4350} {"train_loss": -25.770822525024414, "global_step": 361094, "epoch": 4350} {"train_loss": -25.744464874267578, "global_step": 361095, "epoch": 4350} {"train_loss": -25.78462028503418, "global_step": 361096, "epoch": 4350} {"train_loss": -25.847131729125977, "global_step": 361097, "epoch": 4350} {"train_loss": -25.9882755279541, "global_step": 361098, "epoch": 4350} {"train_loss": -26.168378829956055, "global_step": 361099, "epoch": 4350} {"train_loss": -25.929126739501953, "global_step": 361100, "epoch": 4350} {"train_loss": -26.328662872314453, "global_step": 361101, "epoch": 4350} {"train_loss": -25.72422218322754, "global_step": 361102, "epoch": 4350} {"train_loss": -26.158960342407227, "global_step": 361103, "epoch": 4350} {"train_loss": -26.184646606445312, "global_step": 361104, "epoch": 4350} {"train_loss": -25.773096084594727, "global_step": 361105, "epoch": 4350} {"train_loss": -26.245981216430664, "global_step": 361106, "epoch": 4350} {"train_loss": -26.19668960571289, "global_step": 361107, "epoch": 4350} {"train_loss": -26.115121841430664, "global_step": 361108, "epoch": 4350} {"train_loss": -26.15070915222168, "global_step": 361109, "epoch": 4350} {"train_loss": -26.216089248657227, "global_step": 361110, "epoch": 4350} {"train_loss": -26.063922882080078, "global_step": 361111, "epoch": 4350} {"train_loss": -26.170209884643555, "global_step": 361112, "epoch": 4350} {"train_loss": -26.232086181640625, "global_step": 361113, "epoch": 4350} {"train_loss": -26.498092651367188, "global_step": 361114, "epoch": 4350} {"train_loss": -26.0120906829834, "global_step": 361115, "epoch": 4350} {"train_loss": -26.367908477783203, "global_step": 361116, "epoch": 4350} {"train_loss": -26.486103057861328, "global_step": 361117, "epoch": 4350} {"train_loss": -26.35446548461914, "global_step": 361118, "epoch": 4350} {"train_loss": -26.27274513244629, "global_step": 361119, "epoch": 4350} {"train_loss": -26.496448516845703, "global_step": 361120, "epoch": 4350} {"train_loss": -26.795166015625, "global_step": 361121, "epoch": 4350} {"train_loss": -26.362619400024414, "global_step": 361122, "epoch": 4350} {"train_loss": -26.719152450561523, "global_step": 361123, "epoch": 4350} {"train_loss": -26.822906494140625, "global_step": 361124, "epoch": 4350} {"train_loss": -26.087512969970703, "global_step": 361125, "epoch": 4350} {"train_loss": -26.54937744140625, "global_step": 361126, "epoch": 4350} {"train_loss": -26.4556884765625, "global_step": 361127, "epoch": 4350} {"train_loss": -26.39750099182129, "global_step": 361128, "epoch": 4350} {"train_loss": -26.204315185546875, "global_step": 361129, "epoch": 4350} {"train_loss": -26.507171630859375, "global_step": 361130, "epoch": 4350} {"train_loss": -26.197057723999023, "global_step": 361131, "epoch": 4350} {"train_loss": -26.18434811787433, "global_step": 361132, "epoch": 4350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6556158.0} {"train_loss": -26.23055076599121, "global_step": 361133, "epoch": 4351} {"train_loss": -25.648483276367188, "global_step": 361134, "epoch": 4351} {"train_loss": -26.226306915283203, "global_step": 361135, "epoch": 4351} {"train_loss": -25.862262725830078, "global_step": 361136, "epoch": 4351} {"train_loss": -25.51019859313965, "global_step": 361137, "epoch": 4351} {"train_loss": -25.994693756103516, "global_step": 361138, "epoch": 4351} {"train_loss": -26.02813148498535, "global_step": 361139, "epoch": 4351} {"train_loss": -26.0103759765625, "global_step": 361140, "epoch": 4351} {"train_loss": -25.881362915039062, "global_step": 361141, "epoch": 4351} {"train_loss": -25.819360733032227, "global_step": 361142, "epoch": 4351} {"train_loss": -25.85152244567871, "global_step": 361143, "epoch": 4351} {"train_loss": -26.042572021484375, "global_step": 361144, "epoch": 4351} {"train_loss": -26.025007247924805, "global_step": 361145, "epoch": 4351} {"train_loss": -26.00105094909668, "global_step": 361146, "epoch": 4351} {"train_loss": -26.113447189331055, "global_step": 361147, "epoch": 4351} {"train_loss": -26.2362117767334, "global_step": 361148, "epoch": 4351} {"train_loss": -26.4498348236084, "global_step": 361149, "epoch": 4351} {"train_loss": -26.206872940063477, "global_step": 361150, "epoch": 4351} {"train_loss": -26.17841911315918, "global_step": 361151, "epoch": 4351} {"train_loss": -26.12217140197754, "global_step": 361152, "epoch": 4351} {"train_loss": -26.164508819580078, "global_step": 361153, "epoch": 4351} {"train_loss": -26.168914794921875, "global_step": 361154, "epoch": 4351} {"train_loss": -26.197021484375, "global_step": 361155, "epoch": 4351} {"train_loss": -26.016950607299805, "global_step": 361156, "epoch": 4351} {"train_loss": -26.37919044494629, "global_step": 361157, "epoch": 4351} {"train_loss": -26.677961349487305, "global_step": 361158, "epoch": 4351} {"train_loss": -26.100996017456055, "global_step": 361159, "epoch": 4351} {"train_loss": -25.95880126953125, "global_step": 361160, "epoch": 4351} {"train_loss": -26.326635360717773, "global_step": 361161, "epoch": 4351} {"train_loss": -26.359649658203125, "global_step": 361162, "epoch": 4351} {"train_loss": -26.54743003845215, "global_step": 361163, "epoch": 4351} {"train_loss": -26.275732040405273, "global_step": 361164, "epoch": 4351} {"train_loss": -26.17645263671875, "global_step": 361165, "epoch": 4351} {"train_loss": -26.18537712097168, "global_step": 361166, "epoch": 4351} {"train_loss": -26.311925888061523, "global_step": 361167, "epoch": 4351} {"train_loss": -26.15057373046875, "global_step": 361168, "epoch": 4351} {"train_loss": -26.559606552124023, "global_step": 361169, "epoch": 4351} {"train_loss": -26.169830322265625, "global_step": 361170, "epoch": 4351} {"train_loss": -26.30872917175293, "global_step": 361171, "epoch": 4351} {"train_loss": -25.844684600830078, "global_step": 361172, "epoch": 4351} {"train_loss": -26.5709171295166, "global_step": 361173, "epoch": 4351} {"train_loss": -26.446313858032227, "global_step": 361174, "epoch": 4351} {"train_loss": -26.04056167602539, "global_step": 361175, "epoch": 4351} {"train_loss": -26.1506404876709, "global_step": 361176, "epoch": 4351} {"train_loss": -26.204669952392578, "global_step": 361177, "epoch": 4351} {"train_loss": -26.525604248046875, "global_step": 361178, "epoch": 4351} {"train_loss": -26.457605361938477, "global_step": 361179, "epoch": 4351} {"train_loss": -26.406896591186523, "global_step": 361180, "epoch": 4351} {"train_loss": -26.093576431274414, "global_step": 361181, "epoch": 4351} {"train_loss": -26.180761337280273, "global_step": 361182, "epoch": 4351} {"train_loss": -26.135425567626953, "global_step": 361183, "epoch": 4351} {"train_loss": -26.1025390625, "global_step": 361184, "epoch": 4351} {"train_loss": -26.37116813659668, "global_step": 361185, "epoch": 4351} {"train_loss": -25.684326171875, "global_step": 361186, "epoch": 4351} {"train_loss": -26.130537033081055, "global_step": 361187, "epoch": 4351} {"train_loss": -26.17441177368164, "global_step": 361188, "epoch": 4351} {"train_loss": -26.44538688659668, "global_step": 361189, "epoch": 4351} {"train_loss": -26.16383171081543, "global_step": 361190, "epoch": 4351} {"train_loss": -26.17829704284668, "global_step": 361191, "epoch": 4351} {"train_loss": -26.120914459228516, "global_step": 361192, "epoch": 4351} {"train_loss": -26.2750244140625, "global_step": 361193, "epoch": 4351} {"train_loss": -25.878742218017578, "global_step": 361194, "epoch": 4351} {"train_loss": -26.643884658813477, "global_step": 361195, "epoch": 4351} {"train_loss": -25.913537979125977, "global_step": 361196, "epoch": 4351} {"train_loss": -26.070301055908203, "global_step": 361197, "epoch": 4351} {"train_loss": -25.76787757873535, "global_step": 361198, "epoch": 4351} {"train_loss": -26.272985458374023, "global_step": 361199, "epoch": 4351} {"train_loss": -26.45330238342285, "global_step": 361200, "epoch": 4351} {"train_loss": -25.914697647094727, "global_step": 361201, "epoch": 4351} {"train_loss": -26.10041618347168, "global_step": 361202, "epoch": 4351} {"train_loss": -26.09702491760254, "global_step": 361203, "epoch": 4351} {"train_loss": -26.3355655670166, "global_step": 361204, "epoch": 4351} {"train_loss": -26.23178482055664, "global_step": 361205, "epoch": 4351} {"train_loss": -26.10695457458496, "global_step": 361206, "epoch": 4351} {"train_loss": -26.0092830657959, "global_step": 361207, "epoch": 4351} {"train_loss": -26.546552658081055, "global_step": 361208, "epoch": 4351} {"train_loss": -26.22995948791504, "global_step": 361209, "epoch": 4351} {"train_loss": -26.091598510742188, "global_step": 361210, "epoch": 4351} {"train_loss": -26.299072265625, "global_step": 361211, "epoch": 4351} {"train_loss": -26.62359046936035, "global_step": 361212, "epoch": 4351} {"train_loss": -26.703550338745117, "global_step": 361213, "epoch": 4351} {"train_loss": -26.366479873657227, "global_step": 361214, "epoch": 4351} {"train_loss": -26.199314600013825, "global_step": 361215, "epoch": 4351, "val_loss": 6636812.0} {"train_loss": -25.942798614501953, "global_step": 361216, "epoch": 4352} {"train_loss": -26.182727813720703, "global_step": 361217, "epoch": 4352} {"train_loss": -26.450550079345703, "global_step": 361218, "epoch": 4352} {"train_loss": -26.091751098632812, "global_step": 361219, "epoch": 4352} {"train_loss": -26.2320613861084, "global_step": 361220, "epoch": 4352} {"train_loss": -26.164209365844727, "global_step": 361221, "epoch": 4352} {"train_loss": -26.128576278686523, "global_step": 361222, "epoch": 4352} {"train_loss": -26.228445053100586, "global_step": 361223, "epoch": 4352} {"train_loss": -26.313262939453125, "global_step": 361224, "epoch": 4352} {"train_loss": -26.103113174438477, "global_step": 361225, "epoch": 4352} {"train_loss": -26.45499610900879, "global_step": 361226, "epoch": 4352} {"train_loss": -26.240568161010742, "global_step": 361227, "epoch": 4352} {"train_loss": -26.363561630249023, "global_step": 361228, "epoch": 4352} {"train_loss": -26.024749755859375, "global_step": 361229, "epoch": 4352} {"train_loss": -25.979522705078125, "global_step": 361230, "epoch": 4352} {"train_loss": -26.121570587158203, "global_step": 361231, "epoch": 4352} {"train_loss": -26.4404354095459, "global_step": 361232, "epoch": 4352} {"train_loss": -26.234760284423828, "global_step": 361233, "epoch": 4352} {"train_loss": -26.113325119018555, "global_step": 361234, "epoch": 4352} {"train_loss": -26.21613883972168, "global_step": 361235, "epoch": 4352} {"train_loss": -26.341171264648438, "global_step": 361236, "epoch": 4352} {"train_loss": -26.135822296142578, "global_step": 361237, "epoch": 4352} {"train_loss": -25.96787452697754, "global_step": 361238, "epoch": 4352} {"train_loss": -26.460412979125977, "global_step": 361239, "epoch": 4352} {"train_loss": -26.31996726989746, "global_step": 361240, "epoch": 4352} {"train_loss": -25.965391159057617, "global_step": 361241, "epoch": 4352} {"train_loss": -26.555349349975586, "global_step": 361242, "epoch": 4352} {"train_loss": -26.368438720703125, "global_step": 361243, "epoch": 4352} {"train_loss": -26.126880645751953, "global_step": 361244, "epoch": 4352} {"train_loss": -25.725317001342773, "global_step": 361245, "epoch": 4352} {"train_loss": -26.53205680847168, "global_step": 361246, "epoch": 4352} {"train_loss": -26.08027458190918, "global_step": 361247, "epoch": 4352} {"train_loss": -26.106048583984375, "global_step": 361248, "epoch": 4352} {"train_loss": -26.372608184814453, "global_step": 361249, "epoch": 4352} {"train_loss": -26.319232940673828, "global_step": 361250, "epoch": 4352} {"train_loss": -26.383533477783203, "global_step": 361251, "epoch": 4352} {"train_loss": -26.452625274658203, "global_step": 361252, "epoch": 4352} {"train_loss": -26.581159591674805, "global_step": 361253, "epoch": 4352} {"train_loss": -26.790912628173828, "global_step": 361254, "epoch": 4352} {"train_loss": -26.456012725830078, "global_step": 361255, "epoch": 4352} {"train_loss": -26.302631378173828, "global_step": 361256, "epoch": 4352} {"train_loss": -26.472076416015625, "global_step": 361257, "epoch": 4352} {"train_loss": -26.102270126342773, "global_step": 361258, "epoch": 4352} {"train_loss": -26.323469161987305, "global_step": 361259, "epoch": 4352} {"train_loss": -26.42702293395996, "global_step": 361260, "epoch": 4352} {"train_loss": -26.442459106445312, "global_step": 361261, "epoch": 4352} {"train_loss": -25.949569702148438, "global_step": 361262, "epoch": 4352} {"train_loss": -26.55489158630371, "global_step": 361263, "epoch": 4352} {"train_loss": -26.11188316345215, "global_step": 361264, "epoch": 4352} {"train_loss": -26.224084854125977, "global_step": 361265, "epoch": 4352} {"train_loss": -26.225385665893555, "global_step": 361266, "epoch": 4352} {"train_loss": -26.265399932861328, "global_step": 361267, "epoch": 4352} {"train_loss": -26.32513999938965, "global_step": 361268, "epoch": 4352} {"train_loss": -26.365909576416016, "global_step": 361269, "epoch": 4352} {"train_loss": -26.36136245727539, "global_step": 361270, "epoch": 4352} {"train_loss": -26.198993682861328, "global_step": 361271, "epoch": 4352} {"train_loss": -26.112354278564453, "global_step": 361272, "epoch": 4352} {"train_loss": -26.588876724243164, "global_step": 361273, "epoch": 4352} {"train_loss": -25.953393936157227, "global_step": 361274, "epoch": 4352} {"train_loss": -26.337446212768555, "global_step": 361275, "epoch": 4352} {"train_loss": -26.190820693969727, "global_step": 361276, "epoch": 4352} {"train_loss": -26.26966667175293, "global_step": 361277, "epoch": 4352} {"train_loss": -25.737497329711914, "global_step": 361278, "epoch": 4352} {"train_loss": -26.0966796875, "global_step": 361279, "epoch": 4352} {"train_loss": -26.37032127380371, "global_step": 361280, "epoch": 4352} {"train_loss": -26.092443466186523, "global_step": 361281, "epoch": 4352} {"train_loss": -26.138593673706055, "global_step": 361282, "epoch": 4352} {"train_loss": -25.80836296081543, "global_step": 361283, "epoch": 4352} {"train_loss": -26.377668380737305, "global_step": 361284, "epoch": 4352} {"train_loss": -25.785552978515625, "global_step": 361285, "epoch": 4352} {"train_loss": -25.592435836791992, "global_step": 361286, "epoch": 4352} {"train_loss": -26.202680587768555, "global_step": 361287, "epoch": 4352} {"train_loss": -26.097198486328125, "global_step": 361288, "epoch": 4352} {"train_loss": -26.428613662719727, "global_step": 361289, "epoch": 4352} {"train_loss": -26.1646785736084, "global_step": 361290, "epoch": 4352} {"train_loss": -26.12750816345215, "global_step": 361291, "epoch": 4352} {"train_loss": -26.668848037719727, "global_step": 361292, "epoch": 4352} {"train_loss": -26.1744327545166, "global_step": 361293, "epoch": 4352} {"train_loss": -26.197723388671875, "global_step": 361294, "epoch": 4352} {"train_loss": -26.615192413330078, "global_step": 361295, "epoch": 4352} {"train_loss": -25.976408004760742, "global_step": 361296, "epoch": 4352} {"train_loss": -26.44146728515625, "global_step": 361297, "epoch": 4352} {"train_loss": -26.230176397116786, "global_step": 361298, "epoch": 4352, "val_loss": 6486589.5} {"train_loss": -25.495397567749023, "global_step": 361299, "epoch": 4353} {"train_loss": -26.051727294921875, "global_step": 361300, "epoch": 4353} {"train_loss": -25.743820190429688, "global_step": 361301, "epoch": 4353} {"train_loss": -25.620344161987305, "global_step": 361302, "epoch": 4353} {"train_loss": -25.8781681060791, "global_step": 361303, "epoch": 4353} {"train_loss": -25.94158935546875, "global_step": 361304, "epoch": 4353} {"train_loss": -26.18787956237793, "global_step": 361305, "epoch": 4353} {"train_loss": -26.124225616455078, "global_step": 361306, "epoch": 4353} {"train_loss": -25.783239364624023, "global_step": 361307, "epoch": 4353} {"train_loss": -26.15887451171875, "global_step": 361308, "epoch": 4353} {"train_loss": -25.7642822265625, "global_step": 361309, "epoch": 4353} {"train_loss": -25.966135025024414, "global_step": 361310, "epoch": 4353} {"train_loss": -26.40205192565918, "global_step": 361311, "epoch": 4353} {"train_loss": -25.966995239257812, "global_step": 361312, "epoch": 4353} {"train_loss": -26.07758903503418, "global_step": 361313, "epoch": 4353} {"train_loss": -26.03042984008789, "global_step": 361314, "epoch": 4353} {"train_loss": -25.968505859375, "global_step": 361315, "epoch": 4353} {"train_loss": -25.974958419799805, "global_step": 361316, "epoch": 4353} {"train_loss": -26.401952743530273, "global_step": 361317, "epoch": 4353} {"train_loss": -25.700138092041016, "global_step": 361318, "epoch": 4353} {"train_loss": -26.18842887878418, "global_step": 361319, "epoch": 4353} {"train_loss": -26.052398681640625, "global_step": 361320, "epoch": 4353} {"train_loss": -25.87006187438965, "global_step": 361321, "epoch": 4353} {"train_loss": -26.064130783081055, "global_step": 361322, "epoch": 4353} {"train_loss": -26.475263595581055, "global_step": 361323, "epoch": 4353} {"train_loss": -26.107168197631836, "global_step": 361324, "epoch": 4353} {"train_loss": -26.475187301635742, "global_step": 361325, "epoch": 4353} {"train_loss": -26.104787826538086, "global_step": 361326, "epoch": 4353} {"train_loss": -26.067325592041016, "global_step": 361327, "epoch": 4353} {"train_loss": -26.17084312438965, "global_step": 361328, "epoch": 4353} {"train_loss": -26.4931583404541, "global_step": 361329, "epoch": 4353} {"train_loss": -26.119293212890625, "global_step": 361330, "epoch": 4353} {"train_loss": -26.32451820373535, "global_step": 361331, "epoch": 4353} {"train_loss": -26.289901733398438, "global_step": 361332, "epoch": 4353} {"train_loss": -26.106470108032227, "global_step": 361333, "epoch": 4353} {"train_loss": -26.247114181518555, "global_step": 361334, "epoch": 4353} {"train_loss": -26.192352294921875, "global_step": 361335, "epoch": 4353} {"train_loss": -26.54776954650879, "global_step": 361336, "epoch": 4353} {"train_loss": -26.277484893798828, "global_step": 361337, "epoch": 4353} {"train_loss": -26.324691772460938, "global_step": 361338, "epoch": 4353} {"train_loss": -26.77631187438965, "global_step": 361339, "epoch": 4353} {"train_loss": -26.413339614868164, "global_step": 361340, "epoch": 4353} {"train_loss": -26.803525924682617, "global_step": 361341, "epoch": 4353} {"train_loss": -26.206579208374023, "global_step": 361342, "epoch": 4353} {"train_loss": -26.6256160736084, "global_step": 361343, "epoch": 4353} {"train_loss": -26.301239013671875, "global_step": 361344, "epoch": 4353} {"train_loss": -26.523534774780273, "global_step": 361345, "epoch": 4353} {"train_loss": -26.245630264282227, "global_step": 361346, "epoch": 4353} {"train_loss": -26.4585018157959, "global_step": 361347, "epoch": 4353} {"train_loss": -26.265979766845703, "global_step": 361348, "epoch": 4353} {"train_loss": -26.44380760192871, "global_step": 361349, "epoch": 4353} {"train_loss": -25.69329833984375, "global_step": 361350, "epoch": 4353} {"train_loss": -26.174686431884766, "global_step": 361351, "epoch": 4353} {"train_loss": -26.348764419555664, "global_step": 361352, "epoch": 4353} {"train_loss": -26.554162979125977, "global_step": 361353, "epoch": 4353} {"train_loss": -26.331262588500977, "global_step": 361354, "epoch": 4353} {"train_loss": -26.25421714782715, "global_step": 361355, "epoch": 4353} {"train_loss": -26.3247013092041, "global_step": 361356, "epoch": 4353} {"train_loss": -26.438562393188477, "global_step": 361357, "epoch": 4353} {"train_loss": -26.5069637298584, "global_step": 361358, "epoch": 4353} {"train_loss": -26.11102294921875, "global_step": 361359, "epoch": 4353} {"train_loss": -26.093488693237305, "global_step": 361360, "epoch": 4353} {"train_loss": -26.3255615234375, "global_step": 361361, "epoch": 4353} {"train_loss": -26.20893669128418, "global_step": 361362, "epoch": 4353} {"train_loss": -26.13343620300293, "global_step": 361363, "epoch": 4353} {"train_loss": -26.200536727905273, "global_step": 361364, "epoch": 4353} {"train_loss": -26.067325592041016, "global_step": 361365, "epoch": 4353} {"train_loss": -26.5296688079834, "global_step": 361366, "epoch": 4353} {"train_loss": -26.306501388549805, "global_step": 361367, "epoch": 4353} {"train_loss": -26.32649040222168, "global_step": 361368, "epoch": 4353} {"train_loss": -25.8079833984375, "global_step": 361369, "epoch": 4353} {"train_loss": -26.371112823486328, "global_step": 361370, "epoch": 4353} {"train_loss": -26.2287540435791, "global_step": 361371, "epoch": 4353} {"train_loss": -26.589004516601562, "global_step": 361372, "epoch": 4353} {"train_loss": -26.13617515563965, "global_step": 361373, "epoch": 4353} {"train_loss": -26.108154296875, "global_step": 361374, "epoch": 4353} {"train_loss": -26.3858699798584, "global_step": 361375, "epoch": 4353} {"train_loss": -26.458398818969727, "global_step": 361376, "epoch": 4353} {"train_loss": -26.11512565612793, "global_step": 361377, "epoch": 4353} {"train_loss": -26.485015869140625, "global_step": 361378, "epoch": 4353} {"train_loss": -26.273609161376953, "global_step": 361379, "epoch": 4353} {"train_loss": -26.428136825561523, "global_step": 361380, "epoch": 4353} {"train_loss": -26.209509470376624, "global_step": 361381, "epoch": 4353, "val_loss": 6604872.0} {"train_loss": -26.3663272857666, "global_step": 361382, "epoch": 4354} {"train_loss": -25.817102432250977, "global_step": 361383, "epoch": 4354} {"train_loss": -26.530912399291992, "global_step": 361384, "epoch": 4354} {"train_loss": -26.070159912109375, "global_step": 361385, "epoch": 4354} {"train_loss": -25.865680694580078, "global_step": 361386, "epoch": 4354} {"train_loss": -25.791004180908203, "global_step": 361387, "epoch": 4354} {"train_loss": -26.312402725219727, "global_step": 361388, "epoch": 4354} {"train_loss": -26.434736251831055, "global_step": 361389, "epoch": 4354} {"train_loss": -25.83424949645996, "global_step": 361390, "epoch": 4354} {"train_loss": -26.436914443969727, "global_step": 361391, "epoch": 4354} {"train_loss": -26.090314865112305, "global_step": 361392, "epoch": 4354} {"train_loss": -26.125513076782227, "global_step": 361393, "epoch": 4354} {"train_loss": -25.991147994995117, "global_step": 361394, "epoch": 4354} {"train_loss": -26.027389526367188, "global_step": 361395, "epoch": 4354} {"train_loss": -26.115570068359375, "global_step": 361396, "epoch": 4354} {"train_loss": -25.680713653564453, "global_step": 361397, "epoch": 4354} {"train_loss": -25.65348243713379, "global_step": 361398, "epoch": 4354} {"train_loss": -25.89117431640625, "global_step": 361399, "epoch": 4354} {"train_loss": -25.62641716003418, "global_step": 361400, "epoch": 4354} {"train_loss": -26.066165924072266, "global_step": 361401, "epoch": 4354} {"train_loss": -26.12088394165039, "global_step": 361402, "epoch": 4354} {"train_loss": -26.16525650024414, "global_step": 361403, "epoch": 4354} {"train_loss": -26.38624382019043, "global_step": 361404, "epoch": 4354} {"train_loss": -26.109577178955078, "global_step": 361405, "epoch": 4354} {"train_loss": -25.825775146484375, "global_step": 361406, "epoch": 4354} {"train_loss": -26.469924926757812, "global_step": 361407, "epoch": 4354} {"train_loss": -26.2387752532959, "global_step": 361408, "epoch": 4354} {"train_loss": -25.882177352905273, "global_step": 361409, "epoch": 4354} {"train_loss": -26.2172908782959, "global_step": 361410, "epoch": 4354} {"train_loss": -26.358139038085938, "global_step": 361411, "epoch": 4354} {"train_loss": -26.155414581298828, "global_step": 361412, "epoch": 4354} {"train_loss": -26.221662521362305, "global_step": 361413, "epoch": 4354} {"train_loss": -26.188190460205078, "global_step": 361414, "epoch": 4354} {"train_loss": -26.036792755126953, "global_step": 361415, "epoch": 4354} {"train_loss": -26.533889770507812, "global_step": 361416, "epoch": 4354} {"train_loss": -26.281896591186523, "global_step": 361417, "epoch": 4354} {"train_loss": -26.35603141784668, "global_step": 361418, "epoch": 4354} {"train_loss": -26.377948760986328, "global_step": 361419, "epoch": 4354} {"train_loss": -26.538434982299805, "global_step": 361420, "epoch": 4354} {"train_loss": -26.46390151977539, "global_step": 361421, "epoch": 4354} {"train_loss": -26.078033447265625, "global_step": 361422, "epoch": 4354} {"train_loss": -26.55939292907715, "global_step": 361423, "epoch": 4354} {"train_loss": -26.85386085510254, "global_step": 361424, "epoch": 4354} {"train_loss": -26.492040634155273, "global_step": 361425, "epoch": 4354} {"train_loss": -26.42791748046875, "global_step": 361426, "epoch": 4354} {"train_loss": -26.498920440673828, "global_step": 361427, "epoch": 4354} {"train_loss": -26.655887603759766, "global_step": 361428, "epoch": 4354} {"train_loss": -26.7904052734375, "global_step": 361429, "epoch": 4354} {"train_loss": -26.322378158569336, "global_step": 361430, "epoch": 4354} {"train_loss": -26.14896583557129, "global_step": 361431, "epoch": 4354} {"train_loss": -26.836963653564453, "global_step": 361432, "epoch": 4354} {"train_loss": -25.96461296081543, "global_step": 361433, "epoch": 4354} {"train_loss": -25.485855102539062, "global_step": 361434, "epoch": 4354} {"train_loss": -24.788345336914062, "global_step": 361435, "epoch": 4354} {"train_loss": -25.40272331237793, "global_step": 361436, "epoch": 4354} {"train_loss": -25.633106231689453, "global_step": 361437, "epoch": 4354} {"train_loss": -25.713134765625, "global_step": 361438, "epoch": 4354} {"train_loss": -26.374540328979492, "global_step": 361439, "epoch": 4354} {"train_loss": -26.047094345092773, "global_step": 361440, "epoch": 4354} {"train_loss": -26.296354293823242, "global_step": 361441, "epoch": 4354} {"train_loss": -26.083133697509766, "global_step": 361442, "epoch": 4354} {"train_loss": -26.30073356628418, "global_step": 361443, "epoch": 4354} {"train_loss": -25.659955978393555, "global_step": 361444, "epoch": 4354} {"train_loss": -25.616382598876953, "global_step": 361445, "epoch": 4354} {"train_loss": -26.275861740112305, "global_step": 361446, "epoch": 4354} {"train_loss": -25.991607666015625, "global_step": 361447, "epoch": 4354} {"train_loss": -26.301923751831055, "global_step": 361448, "epoch": 4354} {"train_loss": -26.241500854492188, "global_step": 361449, "epoch": 4354} {"train_loss": -26.204578399658203, "global_step": 361450, "epoch": 4354} {"train_loss": -25.808887481689453, "global_step": 361451, "epoch": 4354} {"train_loss": -26.445114135742188, "global_step": 361452, "epoch": 4354} {"train_loss": -26.105087280273438, "global_step": 361453, "epoch": 4354} {"train_loss": -26.426965713500977, "global_step": 361454, "epoch": 4354} {"train_loss": -26.022159576416016, "global_step": 361455, "epoch": 4354} {"train_loss": -26.3028564453125, "global_step": 361456, "epoch": 4354} {"train_loss": -26.442930221557617, "global_step": 361457, "epoch": 4354} {"train_loss": -26.469884872436523, "global_step": 361458, "epoch": 4354} {"train_loss": -26.518112182617188, "global_step": 361459, "epoch": 4354} {"train_loss": -26.355619430541992, "global_step": 361460, "epoch": 4354} {"train_loss": -26.400894165039062, "global_step": 361461, "epoch": 4354} {"train_loss": -25.76311683654785, "global_step": 361462, "epoch": 4354} {"train_loss": -26.292236328125, "global_step": 361463, "epoch": 4354} {"train_loss": -26.15723807553211, "global_step": 361464, "epoch": 4354, "val_loss": 6678609.0} {"train_loss": -25.99713706970215, "global_step": 361465, "epoch": 4355} {"train_loss": -24.93474578857422, "global_step": 361466, "epoch": 4355} {"train_loss": -24.61824607849121, "global_step": 361467, "epoch": 4355} {"train_loss": -25.28748893737793, "global_step": 361468, "epoch": 4355} {"train_loss": -25.686725616455078, "global_step": 361469, "epoch": 4355} {"train_loss": -25.879871368408203, "global_step": 361470, "epoch": 4355} {"train_loss": -25.22049331665039, "global_step": 361471, "epoch": 4355} {"train_loss": -25.775232315063477, "global_step": 361472, "epoch": 4355} {"train_loss": -25.621152877807617, "global_step": 361473, "epoch": 4355} {"train_loss": -25.913049697875977, "global_step": 361474, "epoch": 4355} {"train_loss": -25.953643798828125, "global_step": 361475, "epoch": 4355} {"train_loss": -25.97625160217285, "global_step": 361476, "epoch": 4355} {"train_loss": -25.74590492248535, "global_step": 361477, "epoch": 4355} {"train_loss": -26.073896408081055, "global_step": 361478, "epoch": 4355} {"train_loss": -25.81764030456543, "global_step": 361479, "epoch": 4355} {"train_loss": -26.106435775756836, "global_step": 361480, "epoch": 4355} {"train_loss": -25.85255241394043, "global_step": 361481, "epoch": 4355} {"train_loss": -26.1077823638916, "global_step": 361482, "epoch": 4355} {"train_loss": -26.360509872436523, "global_step": 361483, "epoch": 4355} {"train_loss": -25.825183868408203, "global_step": 361484, "epoch": 4355} {"train_loss": -26.08937644958496, "global_step": 361485, "epoch": 4355} {"train_loss": -25.79136085510254, "global_step": 361486, "epoch": 4355} {"train_loss": -25.65923500061035, "global_step": 361487, "epoch": 4355} {"train_loss": -25.633764266967773, "global_step": 361488, "epoch": 4355} {"train_loss": -25.68701171875, "global_step": 361489, "epoch": 4355} {"train_loss": -25.865741729736328, "global_step": 361490, "epoch": 4355} {"train_loss": -26.368408203125, "global_step": 361491, "epoch": 4355} {"train_loss": -26.253061294555664, "global_step": 361492, "epoch": 4355} {"train_loss": -26.0648193359375, "global_step": 361493, "epoch": 4355} {"train_loss": -26.23000144958496, "global_step": 361494, "epoch": 4355} {"train_loss": -25.86248207092285, "global_step": 361495, "epoch": 4355} {"train_loss": -26.25959587097168, "global_step": 361496, "epoch": 4355} {"train_loss": -26.15057945251465, "global_step": 361497, "epoch": 4355} {"train_loss": -26.351211547851562, "global_step": 361498, "epoch": 4355} {"train_loss": -26.28493309020996, "global_step": 361499, "epoch": 4355} {"train_loss": -26.033292770385742, "global_step": 361500, "epoch": 4355} {"train_loss": -26.245147705078125, "global_step": 361501, "epoch": 4355} {"train_loss": -26.151044845581055, "global_step": 361502, "epoch": 4355} {"train_loss": -26.300512313842773, "global_step": 361503, "epoch": 4355} {"train_loss": -26.386274337768555, "global_step": 361504, "epoch": 4355} {"train_loss": -26.5072078704834, "global_step": 361505, "epoch": 4355} {"train_loss": -26.35694694519043, "global_step": 361506, "epoch": 4355} {"train_loss": -26.07093620300293, "global_step": 361507, "epoch": 4355} {"train_loss": -26.38209342956543, "global_step": 361508, "epoch": 4355} {"train_loss": -26.128158569335938, "global_step": 361509, "epoch": 4355} {"train_loss": -26.6451416015625, "global_step": 361510, "epoch": 4355} {"train_loss": -26.601917266845703, "global_step": 361511, "epoch": 4355} {"train_loss": -26.5831298828125, "global_step": 361512, "epoch": 4355} {"train_loss": -26.308277130126953, "global_step": 361513, "epoch": 4355} {"train_loss": -26.322370529174805, "global_step": 361514, "epoch": 4355} {"train_loss": -26.439191818237305, "global_step": 361515, "epoch": 4355} {"train_loss": -26.11041831970215, "global_step": 361516, "epoch": 4355} {"train_loss": -26.013233184814453, "global_step": 361517, "epoch": 4355} {"train_loss": -26.9089298248291, "global_step": 361518, "epoch": 4355} {"train_loss": -26.475021362304688, "global_step": 361519, "epoch": 4355} {"train_loss": -26.297077178955078, "global_step": 361520, "epoch": 4355} {"train_loss": -26.199054718017578, "global_step": 361521, "epoch": 4355} {"train_loss": -25.892988204956055, "global_step": 361522, "epoch": 4355} {"train_loss": -26.481185913085938, "global_step": 361523, "epoch": 4355} {"train_loss": -25.886062622070312, "global_step": 361524, "epoch": 4355} {"train_loss": -26.48095703125, "global_step": 361525, "epoch": 4355} {"train_loss": -26.31520652770996, "global_step": 361526, "epoch": 4355} {"train_loss": -26.488632202148438, "global_step": 361527, "epoch": 4355} {"train_loss": -26.19970703125, "global_step": 361528, "epoch": 4355} {"train_loss": -26.290098190307617, "global_step": 361529, "epoch": 4355} {"train_loss": -26.109373092651367, "global_step": 361530, "epoch": 4355} {"train_loss": -26.408905029296875, "global_step": 361531, "epoch": 4355} {"train_loss": -26.198822021484375, "global_step": 361532, "epoch": 4355} {"train_loss": -26.542051315307617, "global_step": 361533, "epoch": 4355} {"train_loss": -26.530515670776367, "global_step": 361534, "epoch": 4355} {"train_loss": -26.823108673095703, "global_step": 361535, "epoch": 4355} {"train_loss": -26.093713760375977, "global_step": 361536, "epoch": 4355} {"train_loss": -26.600461959838867, "global_step": 361537, "epoch": 4355} {"train_loss": -26.127721786499023, "global_step": 361538, "epoch": 4355} {"train_loss": -26.267658233642578, "global_step": 361539, "epoch": 4355} {"train_loss": -26.540328979492188, "global_step": 361540, "epoch": 4355} {"train_loss": -26.38934326171875, "global_step": 361541, "epoch": 4355} {"train_loss": -26.166370391845703, "global_step": 361542, "epoch": 4355} {"train_loss": -25.9846248626709, "global_step": 361543, "epoch": 4355} {"train_loss": -25.987226486206055, "global_step": 361544, "epoch": 4355} {"train_loss": -26.074438095092773, "global_step": 361545, "epoch": 4355} {"train_loss": -26.27070426940918, "global_step": 361546, "epoch": 4355} {"train_loss": -26.12836026570883, "global_step": 361547, "epoch": 4355, "val_loss": 6555411.0} {"train_loss": -25.485103607177734, "global_step": 361548, "epoch": 4356} {"train_loss": -25.612573623657227, "global_step": 361549, "epoch": 4356} {"train_loss": -26.191394805908203, "global_step": 361550, "epoch": 4356} {"train_loss": -25.899616241455078, "global_step": 361551, "epoch": 4356} {"train_loss": -25.545013427734375, "global_step": 361552, "epoch": 4356} {"train_loss": -25.507070541381836, "global_step": 361553, "epoch": 4356} {"train_loss": -25.813495635986328, "global_step": 361554, "epoch": 4356} {"train_loss": -25.198665618896484, "global_step": 361555, "epoch": 4356} {"train_loss": -25.491111755371094, "global_step": 361556, "epoch": 4356} {"train_loss": -25.751684188842773, "global_step": 361557, "epoch": 4356} {"train_loss": -25.831628799438477, "global_step": 361558, "epoch": 4356} {"train_loss": -25.51224136352539, "global_step": 361559, "epoch": 4356} {"train_loss": -25.694971084594727, "global_step": 361560, "epoch": 4356} {"train_loss": -25.70405387878418, "global_step": 361561, "epoch": 4356} {"train_loss": -26.10993003845215, "global_step": 361562, "epoch": 4356} {"train_loss": -25.870731353759766, "global_step": 361563, "epoch": 4356} {"train_loss": -25.85284996032715, "global_step": 361564, "epoch": 4356} {"train_loss": -25.614765167236328, "global_step": 361565, "epoch": 4356} {"train_loss": -25.971389770507812, "global_step": 361566, "epoch": 4356} {"train_loss": -25.956836700439453, "global_step": 361567, "epoch": 4356} {"train_loss": -26.07671546936035, "global_step": 361568, "epoch": 4356} {"train_loss": -25.9908504486084, "global_step": 361569, "epoch": 4356} {"train_loss": -25.98310661315918, "global_step": 361570, "epoch": 4356} {"train_loss": -25.77646255493164, "global_step": 361571, "epoch": 4356} {"train_loss": -26.120532989501953, "global_step": 361572, "epoch": 4356} {"train_loss": -26.176923751831055, "global_step": 361573, "epoch": 4356} {"train_loss": -25.744415283203125, "global_step": 361574, "epoch": 4356} {"train_loss": -26.25632667541504, "global_step": 361575, "epoch": 4356} {"train_loss": -26.0860595703125, "global_step": 361576, "epoch": 4356} {"train_loss": -26.198226928710938, "global_step": 361577, "epoch": 4356} {"train_loss": -26.28407096862793, "global_step": 361578, "epoch": 4356} {"train_loss": -26.000364303588867, "global_step": 361579, "epoch": 4356} {"train_loss": -26.482654571533203, "global_step": 361580, "epoch": 4356} {"train_loss": -25.998626708984375, "global_step": 361581, "epoch": 4356} {"train_loss": -25.969457626342773, "global_step": 361582, "epoch": 4356} {"train_loss": -26.155988693237305, "global_step": 361583, "epoch": 4356} {"train_loss": -26.572467803955078, "global_step": 361584, "epoch": 4356} {"train_loss": -26.634260177612305, "global_step": 361585, "epoch": 4356} {"train_loss": -26.584630966186523, "global_step": 361586, "epoch": 4356} {"train_loss": -26.270755767822266, "global_step": 361587, "epoch": 4356} {"train_loss": -26.302734375, "global_step": 361588, "epoch": 4356} {"train_loss": -26.216968536376953, "global_step": 361589, "epoch": 4356} {"train_loss": -26.282928466796875, "global_step": 361590, "epoch": 4356} {"train_loss": -26.639799118041992, "global_step": 361591, "epoch": 4356} {"train_loss": -26.301563262939453, "global_step": 361592, "epoch": 4356} {"train_loss": -26.204425811767578, "global_step": 361593, "epoch": 4356} {"train_loss": -26.563268661499023, "global_step": 361594, "epoch": 4356} {"train_loss": -26.5528564453125, "global_step": 361595, "epoch": 4356} {"train_loss": -26.23337745666504, "global_step": 361596, "epoch": 4356} {"train_loss": -26.40199089050293, "global_step": 361597, "epoch": 4356} {"train_loss": -26.52850341796875, "global_step": 361598, "epoch": 4356} {"train_loss": -26.506183624267578, "global_step": 361599, "epoch": 4356} {"train_loss": -26.7533016204834, "global_step": 361600, "epoch": 4356} {"train_loss": -26.447479248046875, "global_step": 361601, "epoch": 4356} {"train_loss": -26.32781410217285, "global_step": 361602, "epoch": 4356} {"train_loss": -26.42682456970215, "global_step": 361603, "epoch": 4356} {"train_loss": -26.529027938842773, "global_step": 361604, "epoch": 4356} {"train_loss": -25.57590675354004, "global_step": 361605, "epoch": 4356} {"train_loss": -25.521644592285156, "global_step": 361606, "epoch": 4356} {"train_loss": -26.8408145904541, "global_step": 361607, "epoch": 4356} {"train_loss": -25.80049705505371, "global_step": 361608, "epoch": 4356} {"train_loss": -25.234882354736328, "global_step": 361609, "epoch": 4356} {"train_loss": -25.998737335205078, "global_step": 361610, "epoch": 4356} {"train_loss": -25.705900192260742, "global_step": 361611, "epoch": 4356} {"train_loss": -25.837635040283203, "global_step": 361612, "epoch": 4356} {"train_loss": -25.94593620300293, "global_step": 361613, "epoch": 4356} {"train_loss": -25.974103927612305, "global_step": 361614, "epoch": 4356} {"train_loss": -26.14599609375, "global_step": 361615, "epoch": 4356} {"train_loss": -26.354511260986328, "global_step": 361616, "epoch": 4356} {"train_loss": -25.804044723510742, "global_step": 361617, "epoch": 4356} {"train_loss": -26.103601455688477, "global_step": 361618, "epoch": 4356} {"train_loss": -25.99953269958496, "global_step": 361619, "epoch": 4356} {"train_loss": -26.353803634643555, "global_step": 361620, "epoch": 4356} {"train_loss": -26.267578125, "global_step": 361621, "epoch": 4356} {"train_loss": -26.03460121154785, "global_step": 361622, "epoch": 4356} {"train_loss": -26.24810218811035, "global_step": 361623, "epoch": 4356} {"train_loss": -26.139989852905273, "global_step": 361624, "epoch": 4356} {"train_loss": -25.920499801635742, "global_step": 361625, "epoch": 4356} {"train_loss": -26.23394203186035, "global_step": 361626, "epoch": 4356} {"train_loss": -26.201730728149414, "global_step": 361627, "epoch": 4356} {"train_loss": -26.203733444213867, "global_step": 361628, "epoch": 4356} {"train_loss": -26.032251358032227, "global_step": 361629, "epoch": 4356} {"train_loss": -26.07236556547234, "global_step": 361630, "epoch": 4356, "val_loss": 6663561.0} {"train_loss": -25.7812442779541, "global_step": 361631, "epoch": 4357} {"train_loss": -25.40110206604004, "global_step": 361632, "epoch": 4357} {"train_loss": -25.971227645874023, "global_step": 361633, "epoch": 4357} {"train_loss": -25.75242042541504, "global_step": 361634, "epoch": 4357} {"train_loss": -25.75115966796875, "global_step": 361635, "epoch": 4357} {"train_loss": -25.93623924255371, "global_step": 361636, "epoch": 4357} {"train_loss": -25.50714111328125, "global_step": 361637, "epoch": 4357} {"train_loss": -26.302082061767578, "global_step": 361638, "epoch": 4357} {"train_loss": -25.97332191467285, "global_step": 361639, "epoch": 4357} {"train_loss": -25.981664657592773, "global_step": 361640, "epoch": 4357} {"train_loss": -26.237308502197266, "global_step": 361641, "epoch": 4357} {"train_loss": -25.8759765625, "global_step": 361642, "epoch": 4357} {"train_loss": -25.858442306518555, "global_step": 361643, "epoch": 4357} {"train_loss": -25.932300567626953, "global_step": 361644, "epoch": 4357} {"train_loss": -26.121347427368164, "global_step": 361645, "epoch": 4357} {"train_loss": -26.2684326171875, "global_step": 361646, "epoch": 4357} {"train_loss": -26.604299545288086, "global_step": 361647, "epoch": 4357} {"train_loss": -26.349945068359375, "global_step": 361648, "epoch": 4357} {"train_loss": -25.9526309967041, "global_step": 361649, "epoch": 4357} {"train_loss": -26.279937744140625, "global_step": 361650, "epoch": 4357} {"train_loss": -26.270477294921875, "global_step": 361651, "epoch": 4357} {"train_loss": -26.079254150390625, "global_step": 361652, "epoch": 4357} {"train_loss": -26.0616455078125, "global_step": 361653, "epoch": 4357} {"train_loss": -26.27277183532715, "global_step": 361654, "epoch": 4357} {"train_loss": -26.45185661315918, "global_step": 361655, "epoch": 4357} {"train_loss": -26.383365631103516, "global_step": 361656, "epoch": 4357} {"train_loss": -26.38106346130371, "global_step": 361657, "epoch": 4357} {"train_loss": -26.173120498657227, "global_step": 361658, "epoch": 4357} {"train_loss": -26.354673385620117, "global_step": 361659, "epoch": 4357} {"train_loss": -26.058990478515625, "global_step": 361660, "epoch": 4357} {"train_loss": -26.267017364501953, "global_step": 361661, "epoch": 4357} {"train_loss": -26.262012481689453, "global_step": 361662, "epoch": 4357} {"train_loss": -25.974592208862305, "global_step": 361663, "epoch": 4357} {"train_loss": -26.0815372467041, "global_step": 361664, "epoch": 4357} {"train_loss": -26.15179443359375, "global_step": 361665, "epoch": 4357} {"train_loss": -25.978857040405273, "global_step": 361666, "epoch": 4357} {"train_loss": -26.059293746948242, "global_step": 361667, "epoch": 4357} {"train_loss": -26.561803817749023, "global_step": 361668, "epoch": 4357} {"train_loss": -26.40400505065918, "global_step": 361669, "epoch": 4357} {"train_loss": -26.335546493530273, "global_step": 361670, "epoch": 4357} {"train_loss": -26.60125160217285, "global_step": 361671, "epoch": 4357} {"train_loss": -26.497058868408203, "global_step": 361672, "epoch": 4357} {"train_loss": -26.491952896118164, "global_step": 361673, "epoch": 4357} {"train_loss": -26.1248722076416, "global_step": 361674, "epoch": 4357} {"train_loss": -26.574125289916992, "global_step": 361675, "epoch": 4357} {"train_loss": -26.296701431274414, "global_step": 361676, "epoch": 4357} {"train_loss": -26.551237106323242, "global_step": 361677, "epoch": 4357} {"train_loss": -26.475940704345703, "global_step": 361678, "epoch": 4357} {"train_loss": -26.032682418823242, "global_step": 361679, "epoch": 4357} {"train_loss": -26.497854232788086, "global_step": 361680, "epoch": 4357} {"train_loss": -26.950855255126953, "global_step": 361681, "epoch": 4357} {"train_loss": -26.66334342956543, "global_step": 361682, "epoch": 4357} {"train_loss": -26.4479923248291, "global_step": 361683, "epoch": 4357} {"train_loss": -26.17571449279785, "global_step": 361684, "epoch": 4357} {"train_loss": -26.176198959350586, "global_step": 361685, "epoch": 4357} {"train_loss": -26.444929122924805, "global_step": 361686, "epoch": 4357} {"train_loss": -25.9710636138916, "global_step": 361687, "epoch": 4357} {"train_loss": -26.34921646118164, "global_step": 361688, "epoch": 4357} {"train_loss": -26.085342407226562, "global_step": 361689, "epoch": 4357} {"train_loss": -26.134906768798828, "global_step": 361690, "epoch": 4357} {"train_loss": -26.118207931518555, "global_step": 361691, "epoch": 4357} {"train_loss": -26.290639877319336, "global_step": 361692, "epoch": 4357} {"train_loss": -26.01300048828125, "global_step": 361693, "epoch": 4357} {"train_loss": -26.115787506103516, "global_step": 361694, "epoch": 4357} {"train_loss": -26.10774040222168, "global_step": 361695, "epoch": 4357} {"train_loss": -25.93967056274414, "global_step": 361696, "epoch": 4357} {"train_loss": -26.39483070373535, "global_step": 361697, "epoch": 4357} {"train_loss": -26.376861572265625, "global_step": 361698, "epoch": 4357} {"train_loss": -25.836973190307617, "global_step": 361699, "epoch": 4357} {"train_loss": -25.980619430541992, "global_step": 361700, "epoch": 4357} {"train_loss": -26.36566734313965, "global_step": 361701, "epoch": 4357} {"train_loss": -26.055084228515625, "global_step": 361702, "epoch": 4357} {"train_loss": -26.38176918029785, "global_step": 361703, "epoch": 4357} {"train_loss": -26.169164657592773, "global_step": 361704, "epoch": 4357} {"train_loss": -26.047941207885742, "global_step": 361705, "epoch": 4357} {"train_loss": -26.438541412353516, "global_step": 361706, "epoch": 4357} {"train_loss": -25.967132568359375, "global_step": 361707, "epoch": 4357} {"train_loss": -26.305639266967773, "global_step": 361708, "epoch": 4357} {"train_loss": -26.235898971557617, "global_step": 361709, "epoch": 4357} {"train_loss": -25.905029296875, "global_step": 361710, "epoch": 4357} {"train_loss": -26.249475479125977, "global_step": 361711, "epoch": 4357} {"train_loss": -26.111845016479492, "global_step": 361712, "epoch": 4357} {"train_loss": -26.186492069658026, "global_step": 361713, "epoch": 4357, "val_loss": 6631612.0} {"train_loss": -25.241872787475586, "global_step": 361714, "epoch": 4358} {"train_loss": -25.933462142944336, "global_step": 361715, "epoch": 4358} {"train_loss": -25.82718849182129, "global_step": 361716, "epoch": 4358} {"train_loss": -25.549890518188477, "global_step": 361717, "epoch": 4358} {"train_loss": -25.680078506469727, "global_step": 361718, "epoch": 4358} {"train_loss": -25.676361083984375, "global_step": 361719, "epoch": 4358} {"train_loss": -25.6824893951416, "global_step": 361720, "epoch": 4358} {"train_loss": -25.647464752197266, "global_step": 361721, "epoch": 4358} {"train_loss": -26.160974502563477, "global_step": 361722, "epoch": 4358} {"train_loss": -25.858692169189453, "global_step": 361723, "epoch": 4358} {"train_loss": -26.12930679321289, "global_step": 361724, "epoch": 4358} {"train_loss": -26.100305557250977, "global_step": 361725, "epoch": 4358} {"train_loss": -25.881345748901367, "global_step": 361726, "epoch": 4358} {"train_loss": -26.11045265197754, "global_step": 361727, "epoch": 4358} {"train_loss": -26.021915435791016, "global_step": 361728, "epoch": 4358} {"train_loss": -25.87647819519043, "global_step": 361729, "epoch": 4358} {"train_loss": -26.040796279907227, "global_step": 361730, "epoch": 4358} {"train_loss": -26.153827667236328, "global_step": 361731, "epoch": 4358} {"train_loss": -26.203107833862305, "global_step": 361732, "epoch": 4358} {"train_loss": -26.3599796295166, "global_step": 361733, "epoch": 4358} {"train_loss": -26.436201095581055, "global_step": 361734, "epoch": 4358} {"train_loss": -26.410932540893555, "global_step": 361735, "epoch": 4358} {"train_loss": -25.926502227783203, "global_step": 361736, "epoch": 4358} {"train_loss": -26.383569717407227, "global_step": 361737, "epoch": 4358} {"train_loss": -26.18778419494629, "global_step": 361738, "epoch": 4358} {"train_loss": -26.173431396484375, "global_step": 361739, "epoch": 4358} {"train_loss": -26.6253662109375, "global_step": 361740, "epoch": 4358} {"train_loss": -26.45780372619629, "global_step": 361741, "epoch": 4358} {"train_loss": -26.325836181640625, "global_step": 361742, "epoch": 4358} {"train_loss": -26.538999557495117, "global_step": 361743, "epoch": 4358} {"train_loss": -26.140625, "global_step": 361744, "epoch": 4358} {"train_loss": -26.075220108032227, "global_step": 361745, "epoch": 4358} {"train_loss": -26.401432037353516, "global_step": 361746, "epoch": 4358} {"train_loss": -26.142898559570312, "global_step": 361747, "epoch": 4358} {"train_loss": -26.387298583984375, "global_step": 361748, "epoch": 4358} {"train_loss": -26.33005714416504, "global_step": 361749, "epoch": 4358} {"train_loss": -26.4206485748291, "global_step": 361750, "epoch": 4358} {"train_loss": -26.597797393798828, "global_step": 361751, "epoch": 4358} {"train_loss": -26.927637100219727, "global_step": 361752, "epoch": 4358} {"train_loss": -26.39847183227539, "global_step": 361753, "epoch": 4358} {"train_loss": -26.40529441833496, "global_step": 361754, "epoch": 4358} {"train_loss": -26.31329917907715, "global_step": 361755, "epoch": 4358} {"train_loss": -26.280858993530273, "global_step": 361756, "epoch": 4358} {"train_loss": -26.4709529876709, "global_step": 361757, "epoch": 4358} {"train_loss": -26.567291259765625, "global_step": 361758, "epoch": 4358} {"train_loss": -26.41602897644043, "global_step": 361759, "epoch": 4358} {"train_loss": -26.411788940429688, "global_step": 361760, "epoch": 4358} {"train_loss": -26.52658462524414, "global_step": 361761, "epoch": 4358} {"train_loss": -26.274118423461914, "global_step": 361762, "epoch": 4358} {"train_loss": -26.448410034179688, "global_step": 361763, "epoch": 4358} {"train_loss": -26.316274642944336, "global_step": 361764, "epoch": 4358} {"train_loss": -26.234867095947266, "global_step": 361765, "epoch": 4358} {"train_loss": -26.06884765625, "global_step": 361766, "epoch": 4358} {"train_loss": -26.39208984375, "global_step": 361767, "epoch": 4358} {"train_loss": -26.08088493347168, "global_step": 361768, "epoch": 4358} {"train_loss": -26.37141990661621, "global_step": 361769, "epoch": 4358} {"train_loss": -26.8173885345459, "global_step": 361770, "epoch": 4358} {"train_loss": -26.5113468170166, "global_step": 361771, "epoch": 4358} {"train_loss": -26.7218074798584, "global_step": 361772, "epoch": 4358} {"train_loss": -26.720739364624023, "global_step": 361773, "epoch": 4358} {"train_loss": -26.45284080505371, "global_step": 361774, "epoch": 4358} {"train_loss": -26.541996002197266, "global_step": 361775, "epoch": 4358} {"train_loss": -26.281469345092773, "global_step": 361776, "epoch": 4358} {"train_loss": -26.420196533203125, "global_step": 361777, "epoch": 4358} {"train_loss": -26.24446678161621, "global_step": 361778, "epoch": 4358} {"train_loss": -25.99371910095215, "global_step": 361779, "epoch": 4358} {"train_loss": -25.920827865600586, "global_step": 361780, "epoch": 4358} {"train_loss": -26.20001792907715, "global_step": 361781, "epoch": 4358} {"train_loss": -25.966245651245117, "global_step": 361782, "epoch": 4358} {"train_loss": -26.199682235717773, "global_step": 361783, "epoch": 4358} {"train_loss": -25.966527938842773, "global_step": 361784, "epoch": 4358} {"train_loss": -26.3268985748291, "global_step": 361785, "epoch": 4358} {"train_loss": -26.230148315429688, "global_step": 361786, "epoch": 4358} {"train_loss": -25.8725643157959, "global_step": 361787, "epoch": 4358} {"train_loss": -26.3111572265625, "global_step": 361788, "epoch": 4358} {"train_loss": -26.51169776916504, "global_step": 361789, "epoch": 4358} {"train_loss": -26.220706939697266, "global_step": 361790, "epoch": 4358} {"train_loss": -26.244007110595703, "global_step": 361791, "epoch": 4358} {"train_loss": -26.5078182220459, "global_step": 361792, "epoch": 4358} {"train_loss": -26.276304244995117, "global_step": 361793, "epoch": 4358} {"train_loss": -26.45924186706543, "global_step": 361794, "epoch": 4358} {"train_loss": -25.977102279663086, "global_step": 361795, "epoch": 4358} {"train_loss": -26.24113632110228, "global_step": 361796, "epoch": 4358, "val_loss": 6565253.0} {"train_loss": -25.77654457092285, "global_step": 361797, "epoch": 4359} {"train_loss": -26.00957679748535, "global_step": 361798, "epoch": 4359} {"train_loss": -25.912633895874023, "global_step": 361799, "epoch": 4359} {"train_loss": -25.8288516998291, "global_step": 361800, "epoch": 4359} {"train_loss": -25.947866439819336, "global_step": 361801, "epoch": 4359} {"train_loss": -25.917089462280273, "global_step": 361802, "epoch": 4359} {"train_loss": -25.672800064086914, "global_step": 361803, "epoch": 4359} {"train_loss": -26.163333892822266, "global_step": 361804, "epoch": 4359} {"train_loss": -26.008289337158203, "global_step": 361805, "epoch": 4359} {"train_loss": -25.941129684448242, "global_step": 361806, "epoch": 4359} {"train_loss": -26.36379051208496, "global_step": 361807, "epoch": 4359} {"train_loss": -26.228200912475586, "global_step": 361808, "epoch": 4359} {"train_loss": -26.51645278930664, "global_step": 361809, "epoch": 4359} {"train_loss": -26.17860221862793, "global_step": 361810, "epoch": 4359} {"train_loss": -25.98005485534668, "global_step": 361811, "epoch": 4359} {"train_loss": -26.106847763061523, "global_step": 361812, "epoch": 4359} {"train_loss": -26.40619468688965, "global_step": 361813, "epoch": 4359} {"train_loss": -25.967016220092773, "global_step": 361814, "epoch": 4359} {"train_loss": -26.6044979095459, "global_step": 361815, "epoch": 4359} {"train_loss": -26.213642120361328, "global_step": 361816, "epoch": 4359} {"train_loss": -25.906509399414062, "global_step": 361817, "epoch": 4359} {"train_loss": -26.032514572143555, "global_step": 361818, "epoch": 4359} {"train_loss": -26.35674476623535, "global_step": 361819, "epoch": 4359} {"train_loss": -26.448522567749023, "global_step": 361820, "epoch": 4359} {"train_loss": -26.479978561401367, "global_step": 361821, "epoch": 4359} {"train_loss": -26.14301872253418, "global_step": 361822, "epoch": 4359} {"train_loss": -25.757598876953125, "global_step": 361823, "epoch": 4359} {"train_loss": -26.29227638244629, "global_step": 361824, "epoch": 4359} {"train_loss": -26.308242797851562, "global_step": 361825, "epoch": 4359} {"train_loss": -26.54290771484375, "global_step": 361826, "epoch": 4359} {"train_loss": -26.213659286499023, "global_step": 361827, "epoch": 4359} {"train_loss": -26.147785186767578, "global_step": 361828, "epoch": 4359} {"train_loss": -26.319250106811523, "global_step": 361829, "epoch": 4359} {"train_loss": -25.88703727722168, "global_step": 361830, "epoch": 4359} {"train_loss": -26.185148239135742, "global_step": 361831, "epoch": 4359} {"train_loss": -26.50381851196289, "global_step": 361832, "epoch": 4359} {"train_loss": -26.068761825561523, "global_step": 361833, "epoch": 4359} {"train_loss": -26.3695125579834, "global_step": 361834, "epoch": 4359} {"train_loss": -26.167774200439453, "global_step": 361835, "epoch": 4359} {"train_loss": -26.2276668548584, "global_step": 361836, "epoch": 4359} {"train_loss": -26.265277862548828, "global_step": 361837, "epoch": 4359} {"train_loss": -26.030553817749023, "global_step": 361838, "epoch": 4359} {"train_loss": -25.997024536132812, "global_step": 361839, "epoch": 4359} {"train_loss": -26.393890380859375, "global_step": 361840, "epoch": 4359} {"train_loss": -26.366474151611328, "global_step": 361841, "epoch": 4359} {"train_loss": -26.14185905456543, "global_step": 361842, "epoch": 4359} {"train_loss": -26.2359561920166, "global_step": 361843, "epoch": 4359} {"train_loss": -26.317886352539062, "global_step": 361844, "epoch": 4359} {"train_loss": -26.21299171447754, "global_step": 361845, "epoch": 4359} {"train_loss": -26.141845703125, "global_step": 361846, "epoch": 4359} {"train_loss": -26.281225204467773, "global_step": 361847, "epoch": 4359} {"train_loss": -26.451358795166016, "global_step": 361848, "epoch": 4359} {"train_loss": -26.048505783081055, "global_step": 361849, "epoch": 4359} {"train_loss": -26.187244415283203, "global_step": 361850, "epoch": 4359} {"train_loss": -26.2733097076416, "global_step": 361851, "epoch": 4359} {"train_loss": -26.12931251525879, "global_step": 361852, "epoch": 4359} {"train_loss": -26.39512062072754, "global_step": 361853, "epoch": 4359} {"train_loss": -26.48590660095215, "global_step": 361854, "epoch": 4359} {"train_loss": -26.500045776367188, "global_step": 361855, "epoch": 4359} {"train_loss": -26.25032615661621, "global_step": 361856, "epoch": 4359} {"train_loss": -25.96912956237793, "global_step": 361857, "epoch": 4359} {"train_loss": -26.285053253173828, "global_step": 361858, "epoch": 4359} {"train_loss": -26.10776138305664, "global_step": 361859, "epoch": 4359} {"train_loss": -26.292749404907227, "global_step": 361860, "epoch": 4359} {"train_loss": -26.1608943939209, "global_step": 361861, "epoch": 4359} {"train_loss": -26.370798110961914, "global_step": 361862, "epoch": 4359} {"train_loss": -26.249374389648438, "global_step": 361863, "epoch": 4359} {"train_loss": -26.32107925415039, "global_step": 361864, "epoch": 4359} {"train_loss": -26.282068252563477, "global_step": 361865, "epoch": 4359} {"train_loss": -26.524572372436523, "global_step": 361866, "epoch": 4359} {"train_loss": -26.116437911987305, "global_step": 361867, "epoch": 4359} {"train_loss": -26.2532958984375, "global_step": 361868, "epoch": 4359} {"train_loss": -26.042654037475586, "global_step": 361869, "epoch": 4359} {"train_loss": -26.591083526611328, "global_step": 361870, "epoch": 4359} {"train_loss": -26.286951065063477, "global_step": 361871, "epoch": 4359} {"train_loss": -26.064685821533203, "global_step": 361872, "epoch": 4359} {"train_loss": -26.1324520111084, "global_step": 361873, "epoch": 4359} {"train_loss": -25.977924346923828, "global_step": 361874, "epoch": 4359} {"train_loss": -26.29075050354004, "global_step": 361875, "epoch": 4359} {"train_loss": -26.133825302124023, "global_step": 361876, "epoch": 4359} {"train_loss": -26.182453155517578, "global_step": 361877, "epoch": 4359} {"train_loss": -26.442251205444336, "global_step": 361878, "epoch": 4359} {"train_loss": -26.187803957835737, "global_step": 361879, "epoch": 4359, "val_loss": 6645687.0} {"train_loss": -25.10816764831543, "global_step": 361880, "epoch": 4360} {"train_loss": -24.209680557250977, "global_step": 361881, "epoch": 4360} {"train_loss": -25.35031509399414, "global_step": 361882, "epoch": 4360} {"train_loss": -25.46048355102539, "global_step": 361883, "epoch": 4360} {"train_loss": -25.58519744873047, "global_step": 361884, "epoch": 4360} {"train_loss": -25.593326568603516, "global_step": 361885, "epoch": 4360} {"train_loss": -25.29011344909668, "global_step": 361886, "epoch": 4360} {"train_loss": -26.07061195373535, "global_step": 361887, "epoch": 4360} {"train_loss": -25.511844635009766, "global_step": 361888, "epoch": 4360} {"train_loss": -26.047094345092773, "global_step": 361889, "epoch": 4360} {"train_loss": -25.84247398376465, "global_step": 361890, "epoch": 4360} {"train_loss": -25.609838485717773, "global_step": 361891, "epoch": 4360} {"train_loss": -25.66481590270996, "global_step": 361892, "epoch": 4360} {"train_loss": -25.864398956298828, "global_step": 361893, "epoch": 4360} {"train_loss": -25.95557975769043, "global_step": 361894, "epoch": 4360} {"train_loss": -26.055540084838867, "global_step": 361895, "epoch": 4360} {"train_loss": -26.13816261291504, "global_step": 361896, "epoch": 4360} {"train_loss": -26.15998649597168, "global_step": 361897, "epoch": 4360} {"train_loss": -25.832183837890625, "global_step": 361898, "epoch": 4360} {"train_loss": -26.1372127532959, "global_step": 361899, "epoch": 4360} {"train_loss": -25.82551383972168, "global_step": 361900, "epoch": 4360} {"train_loss": -26.16171646118164, "global_step": 361901, "epoch": 4360} {"train_loss": -26.351261138916016, "global_step": 361902, "epoch": 4360} {"train_loss": -26.12440299987793, "global_step": 361903, "epoch": 4360} {"train_loss": -25.9985408782959, "global_step": 361904, "epoch": 4360} {"train_loss": -26.1418514251709, "global_step": 361905, "epoch": 4360} {"train_loss": -26.06061363220215, "global_step": 361906, "epoch": 4360} {"train_loss": -26.3413143157959, "global_step": 361907, "epoch": 4360} {"train_loss": -26.008838653564453, "global_step": 361908, "epoch": 4360} {"train_loss": -26.0333251953125, "global_step": 361909, "epoch": 4360} {"train_loss": -26.01936912536621, "global_step": 361910, "epoch": 4360} {"train_loss": -26.299238204956055, "global_step": 361911, "epoch": 4360} {"train_loss": -26.321949005126953, "global_step": 361912, "epoch": 4360} {"train_loss": -26.141386032104492, "global_step": 361913, "epoch": 4360} {"train_loss": -26.235483169555664, "global_step": 361914, "epoch": 4360} {"train_loss": -26.1910400390625, "global_step": 361915, "epoch": 4360} {"train_loss": -26.00946044921875, "global_step": 361916, "epoch": 4360} {"train_loss": -26.210851669311523, "global_step": 361917, "epoch": 4360} {"train_loss": -26.367956161499023, "global_step": 361918, "epoch": 4360} {"train_loss": -26.315725326538086, "global_step": 361919, "epoch": 4360} {"train_loss": -26.894989013671875, "global_step": 361920, "epoch": 4360} {"train_loss": -26.55438232421875, "global_step": 361921, "epoch": 4360} {"train_loss": -26.533594131469727, "global_step": 361922, "epoch": 4360} {"train_loss": -26.638090133666992, "global_step": 361923, "epoch": 4360} {"train_loss": -26.127655029296875, "global_step": 361924, "epoch": 4360} {"train_loss": -26.321155548095703, "global_step": 361925, "epoch": 4360} {"train_loss": -26.58552360534668, "global_step": 361926, "epoch": 4360} {"train_loss": -25.981908798217773, "global_step": 361927, "epoch": 4360} {"train_loss": -26.322479248046875, "global_step": 361928, "epoch": 4360} {"train_loss": -26.268768310546875, "global_step": 361929, "epoch": 4360} {"train_loss": -26.500532150268555, "global_step": 361930, "epoch": 4360} {"train_loss": -26.467426300048828, "global_step": 361931, "epoch": 4360} {"train_loss": -26.285375595092773, "global_step": 361932, "epoch": 4360} {"train_loss": -26.312274932861328, "global_step": 361933, "epoch": 4360} {"train_loss": -26.14771842956543, "global_step": 361934, "epoch": 4360} {"train_loss": -26.570404052734375, "global_step": 361935, "epoch": 4360} {"train_loss": -26.270984649658203, "global_step": 361936, "epoch": 4360} {"train_loss": -26.089948654174805, "global_step": 361937, "epoch": 4360} {"train_loss": -26.289371490478516, "global_step": 361938, "epoch": 4360} {"train_loss": -26.732473373413086, "global_step": 361939, "epoch": 4360} {"train_loss": -26.413537979125977, "global_step": 361940, "epoch": 4360} {"train_loss": -26.34269142150879, "global_step": 361941, "epoch": 4360} {"train_loss": -25.951770782470703, "global_step": 361942, "epoch": 4360} {"train_loss": -26.339923858642578, "global_step": 361943, "epoch": 4360} {"train_loss": -26.067203521728516, "global_step": 361944, "epoch": 4360} {"train_loss": -26.527618408203125, "global_step": 361945, "epoch": 4360} {"train_loss": -26.27300453186035, "global_step": 361946, "epoch": 4360} {"train_loss": -26.253904342651367, "global_step": 361947, "epoch": 4360} {"train_loss": -25.709293365478516, "global_step": 361948, "epoch": 4360} {"train_loss": -26.090696334838867, "global_step": 361949, "epoch": 4360} {"train_loss": -26.412485122680664, "global_step": 361950, "epoch": 4360} {"train_loss": -26.45890235900879, "global_step": 361951, "epoch": 4360} {"train_loss": -25.795028686523438, "global_step": 361952, "epoch": 4360} {"train_loss": -26.09244728088379, "global_step": 361953, "epoch": 4360} {"train_loss": -26.22846031188965, "global_step": 361954, "epoch": 4360} {"train_loss": -26.085006713867188, "global_step": 361955, "epoch": 4360} {"train_loss": -26.130277633666992, "global_step": 361956, "epoch": 4360} {"train_loss": -26.387481689453125, "global_step": 361957, "epoch": 4360} {"train_loss": -26.560657501220703, "global_step": 361958, "epoch": 4360} {"train_loss": -26.280874252319336, "global_step": 361959, "epoch": 4360} {"train_loss": -26.432668685913086, "global_step": 361960, "epoch": 4360} {"train_loss": -26.41920280456543, "global_step": 361961, "epoch": 4360} {"train_loss": -26.1189125474677, "global_step": 361962, "epoch": 4360, "val_loss": 6555531.0} {"train_loss": -25.977014541625977, "global_step": 361963, "epoch": 4361} {"train_loss": -26.06158447265625, "global_step": 361964, "epoch": 4361} {"train_loss": -26.166540145874023, "global_step": 361965, "epoch": 4361} {"train_loss": -25.79176139831543, "global_step": 361966, "epoch": 4361} {"train_loss": -25.77118492126465, "global_step": 361967, "epoch": 4361} {"train_loss": -25.73410987854004, "global_step": 361968, "epoch": 4361} {"train_loss": -26.27130699157715, "global_step": 361969, "epoch": 4361} {"train_loss": -26.159475326538086, "global_step": 361970, "epoch": 4361} {"train_loss": -26.018224716186523, "global_step": 361971, "epoch": 4361} {"train_loss": -26.351037979125977, "global_step": 361972, "epoch": 4361} {"train_loss": -26.28901481628418, "global_step": 361973, "epoch": 4361} {"train_loss": -26.61651039123535, "global_step": 361974, "epoch": 4361} {"train_loss": -26.067340850830078, "global_step": 361975, "epoch": 4361} {"train_loss": -26.53840446472168, "global_step": 361976, "epoch": 4361} {"train_loss": -26.1005859375, "global_step": 361977, "epoch": 4361} {"train_loss": -26.07577896118164, "global_step": 361978, "epoch": 4361} {"train_loss": -26.0964298248291, "global_step": 361979, "epoch": 4361} {"train_loss": -26.238372802734375, "global_step": 361980, "epoch": 4361} {"train_loss": -26.22109031677246, "global_step": 361981, "epoch": 4361} {"train_loss": -26.048452377319336, "global_step": 361982, "epoch": 4361} {"train_loss": -26.292333602905273, "global_step": 361983, "epoch": 4361} {"train_loss": -26.570165634155273, "global_step": 361984, "epoch": 4361} {"train_loss": -25.879776000976562, "global_step": 361985, "epoch": 4361} {"train_loss": -26.200973510742188, "global_step": 361986, "epoch": 4361} {"train_loss": -26.0738468170166, "global_step": 361987, "epoch": 4361} {"train_loss": -26.50433349609375, "global_step": 361988, "epoch": 4361} {"train_loss": -26.36761474609375, "global_step": 361989, "epoch": 4361} {"train_loss": -26.1715145111084, "global_step": 361990, "epoch": 4361} {"train_loss": -26.451007843017578, "global_step": 361991, "epoch": 4361} {"train_loss": -26.32002830505371, "global_step": 361992, "epoch": 4361} {"train_loss": -26.5223331451416, "global_step": 361993, "epoch": 4361} {"train_loss": -26.54566764831543, "global_step": 361994, "epoch": 4361} {"train_loss": -26.325986862182617, "global_step": 361995, "epoch": 4361} {"train_loss": -26.442548751831055, "global_step": 361996, "epoch": 4361} {"train_loss": -26.100690841674805, "global_step": 361997, "epoch": 4361} {"train_loss": -26.1887149810791, "global_step": 361998, "epoch": 4361} {"train_loss": -26.499011993408203, "global_step": 361999, "epoch": 4361} {"train_loss": -26.423303604125977, "global_step": 362000, "epoch": 4361} {"train_loss": -26.363162994384766, "global_step": 362001, "epoch": 4361} {"train_loss": -25.921056747436523, "global_step": 362002, "epoch": 4361} {"train_loss": -26.641559600830078, "global_step": 362003, "epoch": 4361} {"train_loss": -26.195068359375, "global_step": 362004, "epoch": 4361} {"train_loss": -26.185354232788086, "global_step": 362005, "epoch": 4361} {"train_loss": -26.40345573425293, "global_step": 362006, "epoch": 4361} {"train_loss": -26.092945098876953, "global_step": 362007, "epoch": 4361} {"train_loss": -26.26844596862793, "global_step": 362008, "epoch": 4361} {"train_loss": -26.724365234375, "global_step": 362009, "epoch": 4361} {"train_loss": -26.59881019592285, "global_step": 362010, "epoch": 4361} {"train_loss": -26.173871994018555, "global_step": 362011, "epoch": 4361} {"train_loss": -26.171905517578125, "global_step": 362012, "epoch": 4361} {"train_loss": -26.40620231628418, "global_step": 362013, "epoch": 4361} {"train_loss": -26.363080978393555, "global_step": 362014, "epoch": 4361} {"train_loss": -26.36382484436035, "global_step": 362015, "epoch": 4361} {"train_loss": -26.15863609313965, "global_step": 362016, "epoch": 4361} {"train_loss": -26.171247482299805, "global_step": 362017, "epoch": 4361} {"train_loss": -26.33009147644043, "global_step": 362018, "epoch": 4361} {"train_loss": -26.304662704467773, "global_step": 362019, "epoch": 4361} {"train_loss": -26.409406661987305, "global_step": 362020, "epoch": 4361} {"train_loss": -26.192859649658203, "global_step": 362021, "epoch": 4361} {"train_loss": -26.426782608032227, "global_step": 362022, "epoch": 4361} {"train_loss": -26.187536239624023, "global_step": 362023, "epoch": 4361} {"train_loss": -26.4097900390625, "global_step": 362024, "epoch": 4361} {"train_loss": -26.429670333862305, "global_step": 362025, "epoch": 4361} {"train_loss": -26.34756851196289, "global_step": 362026, "epoch": 4361} {"train_loss": -26.6147518157959, "global_step": 362027, "epoch": 4361} {"train_loss": -26.61402702331543, "global_step": 362028, "epoch": 4361} {"train_loss": -26.423974990844727, "global_step": 362029, "epoch": 4361} {"train_loss": -26.460895538330078, "global_step": 362030, "epoch": 4361} {"train_loss": -26.614856719970703, "global_step": 362031, "epoch": 4361} {"train_loss": -26.501483917236328, "global_step": 362032, "epoch": 4361} {"train_loss": -26.355649948120117, "global_step": 362033, "epoch": 4361} {"train_loss": -25.9097843170166, "global_step": 362034, "epoch": 4361} {"train_loss": -26.122943878173828, "global_step": 362035, "epoch": 4361} {"train_loss": -26.469770431518555, "global_step": 362036, "epoch": 4361} {"train_loss": -25.967599868774414, "global_step": 362037, "epoch": 4361} {"train_loss": -26.049945831298828, "global_step": 362038, "epoch": 4361} {"train_loss": -26.256311416625977, "global_step": 362039, "epoch": 4361} {"train_loss": -26.328577041625977, "global_step": 362040, "epoch": 4361} {"train_loss": -26.03420066833496, "global_step": 362041, "epoch": 4361} {"train_loss": -26.1236629486084, "global_step": 362042, "epoch": 4361} {"train_loss": -26.444562911987305, "global_step": 362043, "epoch": 4361} {"train_loss": -26.550434112548828, "global_step": 362044, "epoch": 4361} {"train_loss": -26.269146310277733, "global_step": 362045, "epoch": 4361, "val_loss": 6658611.5} {"train_loss": -25.889408111572266, "global_step": 362046, "epoch": 4362} {"train_loss": -25.40291976928711, "global_step": 362047, "epoch": 4362} {"train_loss": -25.60013198852539, "global_step": 362048, "epoch": 4362} {"train_loss": -25.261741638183594, "global_step": 362049, "epoch": 4362} {"train_loss": -25.46051597595215, "global_step": 362050, "epoch": 4362} {"train_loss": -25.838220596313477, "global_step": 362051, "epoch": 4362} {"train_loss": -25.58391571044922, "global_step": 362052, "epoch": 4362} {"train_loss": -25.99313735961914, "global_step": 362053, "epoch": 4362} {"train_loss": -25.544906616210938, "global_step": 362054, "epoch": 4362} {"train_loss": -25.681900024414062, "global_step": 362055, "epoch": 4362} {"train_loss": -25.9507999420166, "global_step": 362056, "epoch": 4362} {"train_loss": -25.851261138916016, "global_step": 362057, "epoch": 4362} {"train_loss": -25.741260528564453, "global_step": 362058, "epoch": 4362} {"train_loss": -25.825000762939453, "global_step": 362059, "epoch": 4362} {"train_loss": -26.15418815612793, "global_step": 362060, "epoch": 4362} {"train_loss": -25.586496353149414, "global_step": 362061, "epoch": 4362} {"train_loss": -26.15826416015625, "global_step": 362062, "epoch": 4362} {"train_loss": -26.08138084411621, "global_step": 362063, "epoch": 4362} {"train_loss": -25.915143966674805, "global_step": 362064, "epoch": 4362} {"train_loss": -25.980005264282227, "global_step": 362065, "epoch": 4362} {"train_loss": -25.91541862487793, "global_step": 362066, "epoch": 4362} {"train_loss": -26.32501220703125, "global_step": 362067, "epoch": 4362} {"train_loss": -25.9288272857666, "global_step": 362068, "epoch": 4362} {"train_loss": -25.754796981811523, "global_step": 362069, "epoch": 4362} {"train_loss": -26.442785263061523, "global_step": 362070, "epoch": 4362} {"train_loss": -26.381567001342773, "global_step": 362071, "epoch": 4362} {"train_loss": -25.948179244995117, "global_step": 362072, "epoch": 4362} {"train_loss": -26.096033096313477, "global_step": 362073, "epoch": 4362} {"train_loss": -26.133581161499023, "global_step": 362074, "epoch": 4362} {"train_loss": -26.08954429626465, "global_step": 362075, "epoch": 4362} {"train_loss": -25.868717193603516, "global_step": 362076, "epoch": 4362} {"train_loss": -26.38126564025879, "global_step": 362077, "epoch": 4362} {"train_loss": -26.397912979125977, "global_step": 362078, "epoch": 4362} {"train_loss": -25.873046875, "global_step": 362079, "epoch": 4362} {"train_loss": -26.382770538330078, "global_step": 362080, "epoch": 4362} {"train_loss": -26.701440811157227, "global_step": 362081, "epoch": 4362} {"train_loss": -26.185056686401367, "global_step": 362082, "epoch": 4362} {"train_loss": -26.140104293823242, "global_step": 362083, "epoch": 4362} {"train_loss": -26.400861740112305, "global_step": 362084, "epoch": 4362} {"train_loss": -26.221078872680664, "global_step": 362085, "epoch": 4362} {"train_loss": -26.073516845703125, "global_step": 362086, "epoch": 4362} {"train_loss": -26.174779891967773, "global_step": 362087, "epoch": 4362} {"train_loss": -26.241870880126953, "global_step": 362088, "epoch": 4362} {"train_loss": -26.679845809936523, "global_step": 362089, "epoch": 4362} {"train_loss": -26.486791610717773, "global_step": 362090, "epoch": 4362} {"train_loss": -26.245025634765625, "global_step": 362091, "epoch": 4362} {"train_loss": -26.398822784423828, "global_step": 362092, "epoch": 4362} {"train_loss": -26.4971981048584, "global_step": 362093, "epoch": 4362} {"train_loss": -26.774755477905273, "global_step": 362094, "epoch": 4362} {"train_loss": -26.582067489624023, "global_step": 362095, "epoch": 4362} {"train_loss": -26.444950103759766, "global_step": 362096, "epoch": 4362} {"train_loss": -26.324176788330078, "global_step": 362097, "epoch": 4362} {"train_loss": -26.317642211914062, "global_step": 362098, "epoch": 4362} {"train_loss": -26.154836654663086, "global_step": 362099, "epoch": 4362} {"train_loss": -26.1058292388916, "global_step": 362100, "epoch": 4362} {"train_loss": -26.282251358032227, "global_step": 362101, "epoch": 4362} {"train_loss": -26.181842803955078, "global_step": 362102, "epoch": 4362} {"train_loss": -25.9888858795166, "global_step": 362103, "epoch": 4362} {"train_loss": -26.128681182861328, "global_step": 362104, "epoch": 4362} {"train_loss": -26.328506469726562, "global_step": 362105, "epoch": 4362} {"train_loss": -26.300134658813477, "global_step": 362106, "epoch": 4362} {"train_loss": -26.330280303955078, "global_step": 362107, "epoch": 4362} {"train_loss": -26.473493576049805, "global_step": 362108, "epoch": 4362} {"train_loss": -26.8906307220459, "global_step": 362109, "epoch": 4362} {"train_loss": -26.271209716796875, "global_step": 362110, "epoch": 4362} {"train_loss": -26.451679229736328, "global_step": 362111, "epoch": 4362} {"train_loss": -26.167219161987305, "global_step": 362112, "epoch": 4362} {"train_loss": -26.594894409179688, "global_step": 362113, "epoch": 4362} {"train_loss": -26.498489379882812, "global_step": 362114, "epoch": 4362} {"train_loss": -26.309789657592773, "global_step": 362115, "epoch": 4362} {"train_loss": -25.763635635375977, "global_step": 362116, "epoch": 4362} {"train_loss": -25.3173885345459, "global_step": 362117, "epoch": 4362} {"train_loss": -25.630895614624023, "global_step": 362118, "epoch": 4362} {"train_loss": -26.014392852783203, "global_step": 362119, "epoch": 4362} {"train_loss": -25.955732345581055, "global_step": 362120, "epoch": 4362} {"train_loss": -26.407316207885742, "global_step": 362121, "epoch": 4362} {"train_loss": -25.74491310119629, "global_step": 362122, "epoch": 4362} {"train_loss": -26.425962448120117, "global_step": 362123, "epoch": 4362} {"train_loss": -26.398534774780273, "global_step": 362124, "epoch": 4362} {"train_loss": -26.000879287719727, "global_step": 362125, "epoch": 4362} {"train_loss": -25.9508056640625, "global_step": 362126, "epoch": 4362} {"train_loss": -26.10566520690918, "global_step": 362127, "epoch": 4362} {"train_loss": -26.108029629810748, "global_step": 362128, "epoch": 4362, "val_loss": 6522642.0} {"train_loss": -25.6226863861084, "global_step": 362129, "epoch": 4363} {"train_loss": -26.38625144958496, "global_step": 362130, "epoch": 4363} {"train_loss": -26.092206954956055, "global_step": 362131, "epoch": 4363} {"train_loss": -25.997241973876953, "global_step": 362132, "epoch": 4363} {"train_loss": -26.092756271362305, "global_step": 362133, "epoch": 4363} {"train_loss": -26.118635177612305, "global_step": 362134, "epoch": 4363} {"train_loss": -25.539844512939453, "global_step": 362135, "epoch": 4363} {"train_loss": -26.223962783813477, "global_step": 362136, "epoch": 4363} {"train_loss": -26.382648468017578, "global_step": 362137, "epoch": 4363} {"train_loss": -26.009374618530273, "global_step": 362138, "epoch": 4363} {"train_loss": -26.302953720092773, "global_step": 362139, "epoch": 4363} {"train_loss": -26.10222816467285, "global_step": 362140, "epoch": 4363} {"train_loss": -26.501657485961914, "global_step": 362141, "epoch": 4363} {"train_loss": -26.178192138671875, "global_step": 362142, "epoch": 4363} {"train_loss": -25.90314292907715, "global_step": 362143, "epoch": 4363} {"train_loss": -26.107263565063477, "global_step": 362144, "epoch": 4363} {"train_loss": -25.995059967041016, "global_step": 362145, "epoch": 4363} {"train_loss": -26.24002456665039, "global_step": 362146, "epoch": 4363} {"train_loss": -25.837512969970703, "global_step": 362147, "epoch": 4363} {"train_loss": -26.132837295532227, "global_step": 362148, "epoch": 4363} {"train_loss": -25.8399715423584, "global_step": 362149, "epoch": 4363} {"train_loss": -25.909408569335938, "global_step": 362150, "epoch": 4363} {"train_loss": -26.289539337158203, "global_step": 362151, "epoch": 4363} {"train_loss": -26.369709014892578, "global_step": 362152, "epoch": 4363} {"train_loss": -26.4931583404541, "global_step": 362153, "epoch": 4363} {"train_loss": -26.194355010986328, "global_step": 362154, "epoch": 4363} {"train_loss": -26.61567497253418, "global_step": 362155, "epoch": 4363} {"train_loss": -26.44907569885254, "global_step": 362156, "epoch": 4363} {"train_loss": -26.4775390625, "global_step": 362157, "epoch": 4363} {"train_loss": -26.704425811767578, "global_step": 362158, "epoch": 4363} {"train_loss": -26.39361572265625, "global_step": 362159, "epoch": 4363} {"train_loss": -26.610809326171875, "global_step": 362160, "epoch": 4363} {"train_loss": -26.13313102722168, "global_step": 362161, "epoch": 4363} {"train_loss": -26.506011962890625, "global_step": 362162, "epoch": 4363} {"train_loss": -26.516803741455078, "global_step": 362163, "epoch": 4363} {"train_loss": -26.604337692260742, "global_step": 362164, "epoch": 4363} {"train_loss": -26.625782012939453, "global_step": 362165, "epoch": 4363} {"train_loss": -26.107587814331055, "global_step": 362166, "epoch": 4363} {"train_loss": -26.55521583557129, "global_step": 362167, "epoch": 4363} {"train_loss": -26.531381607055664, "global_step": 362168, "epoch": 4363} {"train_loss": -26.38202476501465, "global_step": 362169, "epoch": 4363} {"train_loss": -26.170331954956055, "global_step": 362170, "epoch": 4363} {"train_loss": -26.709609985351562, "global_step": 362171, "epoch": 4363} {"train_loss": -26.34356117248535, "global_step": 362172, "epoch": 4363} {"train_loss": -26.014734268188477, "global_step": 362173, "epoch": 4363} {"train_loss": -26.493457794189453, "global_step": 362174, "epoch": 4363} {"train_loss": -26.482202529907227, "global_step": 362175, "epoch": 4363} {"train_loss": -26.469568252563477, "global_step": 362176, "epoch": 4363} {"train_loss": -26.597558975219727, "global_step": 362177, "epoch": 4363} {"train_loss": -26.55093765258789, "global_step": 362178, "epoch": 4363} {"train_loss": -26.337244033813477, "global_step": 362179, "epoch": 4363} {"train_loss": -26.425384521484375, "global_step": 362180, "epoch": 4363} {"train_loss": -26.484766006469727, "global_step": 362181, "epoch": 4363} {"train_loss": -26.423175811767578, "global_step": 362182, "epoch": 4363} {"train_loss": -26.639127731323242, "global_step": 362183, "epoch": 4363} {"train_loss": -26.160688400268555, "global_step": 362184, "epoch": 4363} {"train_loss": -26.185388565063477, "global_step": 362185, "epoch": 4363} {"train_loss": -26.063003540039062, "global_step": 362186, "epoch": 4363} {"train_loss": -26.000341415405273, "global_step": 362187, "epoch": 4363} {"train_loss": -26.679065704345703, "global_step": 362188, "epoch": 4363} {"train_loss": -26.263660430908203, "global_step": 362189, "epoch": 4363} {"train_loss": -26.19333267211914, "global_step": 362190, "epoch": 4363} {"train_loss": -26.3297176361084, "global_step": 362191, "epoch": 4363} {"train_loss": -26.359968185424805, "global_step": 362192, "epoch": 4363} {"train_loss": -26.701627731323242, "global_step": 362193, "epoch": 4363} {"train_loss": -26.475482940673828, "global_step": 362194, "epoch": 4363} {"train_loss": -26.055206298828125, "global_step": 362195, "epoch": 4363} {"train_loss": -25.446096420288086, "global_step": 362196, "epoch": 4363} {"train_loss": -25.734220504760742, "global_step": 362197, "epoch": 4363} {"train_loss": -26.167987823486328, "global_step": 362198, "epoch": 4363} {"train_loss": -25.985254287719727, "global_step": 362199, "epoch": 4363} {"train_loss": -26.552297592163086, "global_step": 362200, "epoch": 4363} {"train_loss": -26.06576919555664, "global_step": 362201, "epoch": 4363} {"train_loss": -26.100561141967773, "global_step": 362202, "epoch": 4363} {"train_loss": -26.09596824645996, "global_step": 362203, "epoch": 4363} {"train_loss": -26.148691177368164, "global_step": 362204, "epoch": 4363} {"train_loss": -26.2845458984375, "global_step": 362205, "epoch": 4363} {"train_loss": -26.387876510620117, "global_step": 362206, "epoch": 4363} {"train_loss": -26.226877212524414, "global_step": 362207, "epoch": 4363} {"train_loss": -26.095050811767578, "global_step": 362208, "epoch": 4363} {"train_loss": -25.838708877563477, "global_step": 362209, "epoch": 4363} {"train_loss": -26.29813003540039, "global_step": 362210, "epoch": 4363} {"train_loss": -26.274606934512953, "global_step": 362211, "epoch": 4363, "val_loss": 6548004.5} {"train_loss": -25.587467193603516, "global_step": 362212, "epoch": 4364} {"train_loss": -25.123580932617188, "global_step": 362213, "epoch": 4364} {"train_loss": -25.881977081298828, "global_step": 362214, "epoch": 4364} {"train_loss": -26.007904052734375, "global_step": 362215, "epoch": 4364} {"train_loss": -25.471689224243164, "global_step": 362216, "epoch": 4364} {"train_loss": -25.445772171020508, "global_step": 362217, "epoch": 4364} {"train_loss": -26.01993179321289, "global_step": 362218, "epoch": 4364} {"train_loss": -25.65753746032715, "global_step": 362219, "epoch": 4364} {"train_loss": -25.505176544189453, "global_step": 362220, "epoch": 4364} {"train_loss": -26.1781063079834, "global_step": 362221, "epoch": 4364} {"train_loss": -25.957040786743164, "global_step": 362222, "epoch": 4364} {"train_loss": -25.627185821533203, "global_step": 362223, "epoch": 4364} {"train_loss": -25.76093101501465, "global_step": 362224, "epoch": 4364} {"train_loss": -25.968250274658203, "global_step": 362225, "epoch": 4364} {"train_loss": -25.676715850830078, "global_step": 362226, "epoch": 4364} {"train_loss": -26.124738693237305, "global_step": 362227, "epoch": 4364} {"train_loss": -25.660694122314453, "global_step": 362228, "epoch": 4364} {"train_loss": -26.052753448486328, "global_step": 362229, "epoch": 4364} {"train_loss": -26.2523136138916, "global_step": 362230, "epoch": 4364} {"train_loss": -26.336362838745117, "global_step": 362231, "epoch": 4364} {"train_loss": -26.10862159729004, "global_step": 362232, "epoch": 4364} {"train_loss": -26.085378646850586, "global_step": 362233, "epoch": 4364} {"train_loss": -26.10590171813965, "global_step": 362234, "epoch": 4364} {"train_loss": -25.88148307800293, "global_step": 362235, "epoch": 4364} {"train_loss": -26.537885665893555, "global_step": 362236, "epoch": 4364} {"train_loss": -26.06666374206543, "global_step": 362237, "epoch": 4364} {"train_loss": -26.3173770904541, "global_step": 362238, "epoch": 4364} {"train_loss": -26.048358917236328, "global_step": 362239, "epoch": 4364} {"train_loss": -26.242292404174805, "global_step": 362240, "epoch": 4364} {"train_loss": -25.950536727905273, "global_step": 362241, "epoch": 4364} {"train_loss": -26.66265869140625, "global_step": 362242, "epoch": 4364} {"train_loss": -26.39253807067871, "global_step": 362243, "epoch": 4364} {"train_loss": -26.638172149658203, "global_step": 362244, "epoch": 4364} {"train_loss": -26.676090240478516, "global_step": 362245, "epoch": 4364} {"train_loss": -26.397388458251953, "global_step": 362246, "epoch": 4364} {"train_loss": -26.641942977905273, "global_step": 362247, "epoch": 4364} {"train_loss": -26.522876739501953, "global_step": 362248, "epoch": 4364} {"train_loss": -26.416288375854492, "global_step": 362249, "epoch": 4364} {"train_loss": -26.38494300842285, "global_step": 362250, "epoch": 4364} {"train_loss": -26.48179054260254, "global_step": 362251, "epoch": 4364} {"train_loss": -26.454345703125, "global_step": 362252, "epoch": 4364} {"train_loss": -26.3444766998291, "global_step": 362253, "epoch": 4364} {"train_loss": -26.695911407470703, "global_step": 362254, "epoch": 4364} {"train_loss": -26.320697784423828, "global_step": 362255, "epoch": 4364} {"train_loss": -26.002826690673828, "global_step": 362256, "epoch": 4364} {"train_loss": -26.30721092224121, "global_step": 362257, "epoch": 4364} {"train_loss": -26.422088623046875, "global_step": 362258, "epoch": 4364} {"train_loss": -26.407499313354492, "global_step": 362259, "epoch": 4364} {"train_loss": -26.78534507751465, "global_step": 362260, "epoch": 4364} {"train_loss": -26.793378829956055, "global_step": 362261, "epoch": 4364} {"train_loss": -26.405746459960938, "global_step": 362262, "epoch": 4364} {"train_loss": -26.597497940063477, "global_step": 362263, "epoch": 4364} {"train_loss": -26.291372299194336, "global_step": 362264, "epoch": 4364} {"train_loss": -26.523727416992188, "global_step": 362265, "epoch": 4364} {"train_loss": -25.997350692749023, "global_step": 362266, "epoch": 4364} {"train_loss": -25.168554306030273, "global_step": 362267, "epoch": 4364} {"train_loss": -24.00575828552246, "global_step": 362268, "epoch": 4364} {"train_loss": -25.5335636138916, "global_step": 362269, "epoch": 4364} {"train_loss": -25.670730590820312, "global_step": 362270, "epoch": 4364} {"train_loss": -25.507495880126953, "global_step": 362271, "epoch": 4364} {"train_loss": -25.44300651550293, "global_step": 362272, "epoch": 4364} {"train_loss": -25.70404624938965, "global_step": 362273, "epoch": 4364} {"train_loss": -26.01862144470215, "global_step": 362274, "epoch": 4364} {"train_loss": -25.903366088867188, "global_step": 362275, "epoch": 4364} {"train_loss": -25.903207778930664, "global_step": 362276, "epoch": 4364} {"train_loss": -25.9266300201416, "global_step": 362277, "epoch": 4364} {"train_loss": -25.560800552368164, "global_step": 362278, "epoch": 4364} {"train_loss": -26.405038833618164, "global_step": 362279, "epoch": 4364} {"train_loss": -26.22743034362793, "global_step": 362280, "epoch": 4364} {"train_loss": -26.034650802612305, "global_step": 362281, "epoch": 4364} {"train_loss": -25.94766616821289, "global_step": 362282, "epoch": 4364} {"train_loss": -26.386005401611328, "global_step": 362283, "epoch": 4364} {"train_loss": -26.213125228881836, "global_step": 362284, "epoch": 4364} {"train_loss": -26.35902976989746, "global_step": 362285, "epoch": 4364} {"train_loss": -26.276594161987305, "global_step": 362286, "epoch": 4364} {"train_loss": -26.065704345703125, "global_step": 362287, "epoch": 4364} {"train_loss": -26.3929443359375, "global_step": 362288, "epoch": 4364} {"train_loss": -25.89497947692871, "global_step": 362289, "epoch": 4364} {"train_loss": -26.24078369140625, "global_step": 362290, "epoch": 4364} {"train_loss": -25.9287166595459, "global_step": 362291, "epoch": 4364} {"train_loss": -25.795743942260742, "global_step": 362292, "epoch": 4364} {"train_loss": -26.192535400390625, "global_step": 362293, "epoch": 4364} {"train_loss": -26.099636123841066, "global_step": 362294, "epoch": 4364, "val_loss": 6538857.5} {"train_loss": -25.813495635986328, "global_step": 362295, "epoch": 4365} {"train_loss": -25.741382598876953, "global_step": 362296, "epoch": 4365} {"train_loss": -25.903242111206055, "global_step": 362297, "epoch": 4365} {"train_loss": -25.94708251953125, "global_step": 362298, "epoch": 4365} {"train_loss": -26.1860408782959, "global_step": 362299, "epoch": 4365} {"train_loss": -26.106185913085938, "global_step": 362300, "epoch": 4365} {"train_loss": -25.8883113861084, "global_step": 362301, "epoch": 4365} {"train_loss": -26.183530807495117, "global_step": 362302, "epoch": 4365} {"train_loss": -26.01605224609375, "global_step": 362303, "epoch": 4365} {"train_loss": -25.755308151245117, "global_step": 362304, "epoch": 4365} {"train_loss": -26.142316818237305, "global_step": 362305, "epoch": 4365} {"train_loss": -25.99183464050293, "global_step": 362306, "epoch": 4365} {"train_loss": -26.04615592956543, "global_step": 362307, "epoch": 4365} {"train_loss": -25.8557186126709, "global_step": 362308, "epoch": 4365} {"train_loss": -26.186511993408203, "global_step": 362309, "epoch": 4365} {"train_loss": -25.907318115234375, "global_step": 362310, "epoch": 4365} {"train_loss": -25.641016006469727, "global_step": 362311, "epoch": 4365} {"train_loss": -26.23650550842285, "global_step": 362312, "epoch": 4365} {"train_loss": -26.374210357666016, "global_step": 362313, "epoch": 4365} {"train_loss": -25.98908805847168, "global_step": 362314, "epoch": 4365} {"train_loss": -26.423627853393555, "global_step": 362315, "epoch": 4365} {"train_loss": -26.381000518798828, "global_step": 362316, "epoch": 4365} {"train_loss": -26.26434326171875, "global_step": 362317, "epoch": 4365} {"train_loss": -26.257190704345703, "global_step": 362318, "epoch": 4365} {"train_loss": -26.124658584594727, "global_step": 362319, "epoch": 4365} {"train_loss": -26.415014266967773, "global_step": 362320, "epoch": 4365} {"train_loss": -26.435449600219727, "global_step": 362321, "epoch": 4365} {"train_loss": -26.359771728515625, "global_step": 362322, "epoch": 4365} {"train_loss": -26.524900436401367, "global_step": 362323, "epoch": 4365} {"train_loss": -26.62391471862793, "global_step": 362324, "epoch": 4365} {"train_loss": -26.222064971923828, "global_step": 362325, "epoch": 4365} {"train_loss": -26.373580932617188, "global_step": 362326, "epoch": 4365} {"train_loss": -26.766164779663086, "global_step": 362327, "epoch": 4365} {"train_loss": -26.379196166992188, "global_step": 362328, "epoch": 4365} {"train_loss": -26.1962833404541, "global_step": 362329, "epoch": 4365} {"train_loss": -26.256799697875977, "global_step": 362330, "epoch": 4365} {"train_loss": -26.37213706970215, "global_step": 362331, "epoch": 4365} {"train_loss": -26.49675941467285, "global_step": 362332, "epoch": 4365} {"train_loss": -26.292251586914062, "global_step": 362333, "epoch": 4365} {"train_loss": -26.62105369567871, "global_step": 362334, "epoch": 4365} {"train_loss": -26.261219024658203, "global_step": 362335, "epoch": 4365} {"train_loss": -26.328876495361328, "global_step": 362336, "epoch": 4365} {"train_loss": -26.30316162109375, "global_step": 362337, "epoch": 4365} {"train_loss": -26.10116958618164, "global_step": 362338, "epoch": 4365} {"train_loss": -26.587787628173828, "global_step": 362339, "epoch": 4365} {"train_loss": -26.439687728881836, "global_step": 362340, "epoch": 4365} {"train_loss": -26.500579833984375, "global_step": 362341, "epoch": 4365} {"train_loss": -26.706953048706055, "global_step": 362342, "epoch": 4365} {"train_loss": -26.204538345336914, "global_step": 362343, "epoch": 4365} {"train_loss": -26.09467887878418, "global_step": 362344, "epoch": 4365} {"train_loss": -26.50821304321289, "global_step": 362345, "epoch": 4365} {"train_loss": -26.469608306884766, "global_step": 362346, "epoch": 4365} {"train_loss": -25.7769775390625, "global_step": 362347, "epoch": 4365} {"train_loss": -26.203908920288086, "global_step": 362348, "epoch": 4365} {"train_loss": -26.35076904296875, "global_step": 362349, "epoch": 4365} {"train_loss": -26.3868408203125, "global_step": 362350, "epoch": 4365} {"train_loss": -26.5534610748291, "global_step": 362351, "epoch": 4365} {"train_loss": -25.988880157470703, "global_step": 362352, "epoch": 4365} {"train_loss": -26.118616104125977, "global_step": 362353, "epoch": 4365} {"train_loss": -25.670658111572266, "global_step": 362354, "epoch": 4365} {"train_loss": -25.65471839904785, "global_step": 362355, "epoch": 4365} {"train_loss": -26.384124755859375, "global_step": 362356, "epoch": 4365} {"train_loss": -26.134450912475586, "global_step": 362357, "epoch": 4365} {"train_loss": -26.608871459960938, "global_step": 362358, "epoch": 4365} {"train_loss": -25.681049346923828, "global_step": 362359, "epoch": 4365} {"train_loss": -25.697668075561523, "global_step": 362360, "epoch": 4365} {"train_loss": -26.12322998046875, "global_step": 362361, "epoch": 4365} {"train_loss": -25.97816276550293, "global_step": 362362, "epoch": 4365} {"train_loss": -25.726980209350586, "global_step": 362363, "epoch": 4365} {"train_loss": -25.945158004760742, "global_step": 362364, "epoch": 4365} {"train_loss": -26.582599639892578, "global_step": 362365, "epoch": 4365} {"train_loss": -26.008228302001953, "global_step": 362366, "epoch": 4365} {"train_loss": -26.17659568786621, "global_step": 362367, "epoch": 4365} {"train_loss": -26.271711349487305, "global_step": 362368, "epoch": 4365} {"train_loss": -26.288843154907227, "global_step": 362369, "epoch": 4365} {"train_loss": -26.08045768737793, "global_step": 362370, "epoch": 4365} {"train_loss": -25.8060302734375, "global_step": 362371, "epoch": 4365} {"train_loss": -26.546056747436523, "global_step": 362372, "epoch": 4365} {"train_loss": -26.2309513092041, "global_step": 362373, "epoch": 4365} {"train_loss": -26.35245132446289, "global_step": 362374, "epoch": 4365} {"train_loss": -26.391489028930664, "global_step": 362375, "epoch": 4365} {"train_loss": -26.176679611206055, "global_step": 362376, "epoch": 4365} {"train_loss": -26.20450640299234, "global_step": 362377, "epoch": 4365, "val_loss": 6651454.0} {"train_loss": -25.649396896362305, "global_step": 362378, "epoch": 4366} {"train_loss": -25.784976959228516, "global_step": 362379, "epoch": 4366} {"train_loss": -25.852399826049805, "global_step": 362380, "epoch": 4366} {"train_loss": -25.797199249267578, "global_step": 362381, "epoch": 4366} {"train_loss": -25.396366119384766, "global_step": 362382, "epoch": 4366} {"train_loss": -25.905736923217773, "global_step": 362383, "epoch": 4366} {"train_loss": -26.064603805541992, "global_step": 362384, "epoch": 4366} {"train_loss": -26.06635856628418, "global_step": 362385, "epoch": 4366} {"train_loss": -25.94227409362793, "global_step": 362386, "epoch": 4366} {"train_loss": -25.700382232666016, "global_step": 362387, "epoch": 4366} {"train_loss": -26.1584529876709, "global_step": 362388, "epoch": 4366} {"train_loss": -26.0640926361084, "global_step": 362389, "epoch": 4366} {"train_loss": -25.821136474609375, "global_step": 362390, "epoch": 4366} {"train_loss": -26.232519149780273, "global_step": 362391, "epoch": 4366} {"train_loss": -25.885528564453125, "global_step": 362392, "epoch": 4366} {"train_loss": -25.97519874572754, "global_step": 362393, "epoch": 4366} {"train_loss": -26.068622589111328, "global_step": 362394, "epoch": 4366} {"train_loss": -26.133153915405273, "global_step": 362395, "epoch": 4366} {"train_loss": -26.292661666870117, "global_step": 362396, "epoch": 4366} {"train_loss": -26.113859176635742, "global_step": 362397, "epoch": 4366} {"train_loss": -26.204364776611328, "global_step": 362398, "epoch": 4366} {"train_loss": -26.137311935424805, "global_step": 362399, "epoch": 4366} {"train_loss": -26.33963966369629, "global_step": 362400, "epoch": 4366} {"train_loss": -26.0657958984375, "global_step": 362401, "epoch": 4366} {"train_loss": -26.38321304321289, "global_step": 362402, "epoch": 4366} {"train_loss": -26.3782958984375, "global_step": 362403, "epoch": 4366} {"train_loss": -26.15744972229004, "global_step": 362404, "epoch": 4366} {"train_loss": -26.280963897705078, "global_step": 362405, "epoch": 4366} {"train_loss": -26.265783309936523, "global_step": 362406, "epoch": 4366} {"train_loss": -26.182662963867188, "global_step": 362407, "epoch": 4366} {"train_loss": -25.863744735717773, "global_step": 362408, "epoch": 4366} {"train_loss": -26.419803619384766, "global_step": 362409, "epoch": 4366} {"train_loss": -25.81552505493164, "global_step": 362410, "epoch": 4366} {"train_loss": -26.4306697845459, "global_step": 362411, "epoch": 4366} {"train_loss": -26.45026969909668, "global_step": 362412, "epoch": 4366} {"train_loss": -26.109872817993164, "global_step": 362413, "epoch": 4366} {"train_loss": -26.3957576751709, "global_step": 362414, "epoch": 4366} {"train_loss": -26.180517196655273, "global_step": 362415, "epoch": 4366} {"train_loss": -26.075754165649414, "global_step": 362416, "epoch": 4366} {"train_loss": -26.14740562438965, "global_step": 362417, "epoch": 4366} {"train_loss": -25.803892135620117, "global_step": 362418, "epoch": 4366} {"train_loss": -26.043933868408203, "global_step": 362419, "epoch": 4366} {"train_loss": -26.06281852722168, "global_step": 362420, "epoch": 4366} {"train_loss": -26.623106002807617, "global_step": 362421, "epoch": 4366} {"train_loss": -25.976831436157227, "global_step": 362422, "epoch": 4366} {"train_loss": -26.173431396484375, "global_step": 362423, "epoch": 4366} {"train_loss": -26.1561279296875, "global_step": 362424, "epoch": 4366} {"train_loss": -26.116735458374023, "global_step": 362425, "epoch": 4366} {"train_loss": -26.06378746032715, "global_step": 362426, "epoch": 4366} {"train_loss": -26.45577049255371, "global_step": 362427, "epoch": 4366} {"train_loss": -26.34296989440918, "global_step": 362428, "epoch": 4366} {"train_loss": -26.306583404541016, "global_step": 362429, "epoch": 4366} {"train_loss": -26.232990264892578, "global_step": 362430, "epoch": 4366} {"train_loss": -26.4150333404541, "global_step": 362431, "epoch": 4366} {"train_loss": -26.540576934814453, "global_step": 362432, "epoch": 4366} {"train_loss": -26.172779083251953, "global_step": 362433, "epoch": 4366} {"train_loss": -26.30389976501465, "global_step": 362434, "epoch": 4366} {"train_loss": -26.46113395690918, "global_step": 362435, "epoch": 4366} {"train_loss": -25.950305938720703, "global_step": 362436, "epoch": 4366} {"train_loss": -26.136993408203125, "global_step": 362437, "epoch": 4366} {"train_loss": -25.904401779174805, "global_step": 362438, "epoch": 4366} {"train_loss": -26.31416130065918, "global_step": 362439, "epoch": 4366} {"train_loss": -26.660675048828125, "global_step": 362440, "epoch": 4366} {"train_loss": -25.967283248901367, "global_step": 362441, "epoch": 4366} {"train_loss": -26.198699951171875, "global_step": 362442, "epoch": 4366} {"train_loss": -26.445947647094727, "global_step": 362443, "epoch": 4366} {"train_loss": -26.5180721282959, "global_step": 362444, "epoch": 4366} {"train_loss": -26.073471069335938, "global_step": 362445, "epoch": 4366} {"train_loss": -26.212615966796875, "global_step": 362446, "epoch": 4366} {"train_loss": -26.326154708862305, "global_step": 362447, "epoch": 4366} {"train_loss": -26.46476173400879, "global_step": 362448, "epoch": 4366} {"train_loss": -26.14729118347168, "global_step": 362449, "epoch": 4366} {"train_loss": -26.179916381835938, "global_step": 362450, "epoch": 4366} {"train_loss": -26.323755264282227, "global_step": 362451, "epoch": 4366} {"train_loss": -26.301517486572266, "global_step": 362452, "epoch": 4366} {"train_loss": -26.05721092224121, "global_step": 362453, "epoch": 4366} {"train_loss": -25.897052764892578, "global_step": 362454, "epoch": 4366} {"train_loss": -26.02840232849121, "global_step": 362455, "epoch": 4366} {"train_loss": -26.284582138061523, "global_step": 362456, "epoch": 4366} {"train_loss": -25.98194694519043, "global_step": 362457, "epoch": 4366} {"train_loss": -25.805206298828125, "global_step": 362458, "epoch": 4366} {"train_loss": -25.951934814453125, "global_step": 362459, "epoch": 4366} {"train_loss": -26.142527499830866, "global_step": 362460, "epoch": 4366, "val_loss": 6565409.0} {"train_loss": -25.4277400970459, "global_step": 362461, "epoch": 4367} {"train_loss": -25.435476303100586, "global_step": 362462, "epoch": 4367} {"train_loss": -25.762121200561523, "global_step": 362463, "epoch": 4367} {"train_loss": -25.343496322631836, "global_step": 362464, "epoch": 4367} {"train_loss": -25.27874183654785, "global_step": 362465, "epoch": 4367} {"train_loss": -25.472822189331055, "global_step": 362466, "epoch": 4367} {"train_loss": -25.469486236572266, "global_step": 362467, "epoch": 4367} {"train_loss": -25.84981346130371, "global_step": 362468, "epoch": 4367} {"train_loss": -25.443527221679688, "global_step": 362469, "epoch": 4367} {"train_loss": -25.88458251953125, "global_step": 362470, "epoch": 4367} {"train_loss": -25.5958251953125, "global_step": 362471, "epoch": 4367} {"train_loss": -26.013975143432617, "global_step": 362472, "epoch": 4367} {"train_loss": -25.59366226196289, "global_step": 362473, "epoch": 4367} {"train_loss": -26.076770782470703, "global_step": 362474, "epoch": 4367} {"train_loss": -25.4329776763916, "global_step": 362475, "epoch": 4367} {"train_loss": -25.822484970092773, "global_step": 362476, "epoch": 4367} {"train_loss": -25.950117111206055, "global_step": 362477, "epoch": 4367} {"train_loss": -26.01019287109375, "global_step": 362478, "epoch": 4367} {"train_loss": -26.165878295898438, "global_step": 362479, "epoch": 4367} {"train_loss": -26.242101669311523, "global_step": 362480, "epoch": 4367} {"train_loss": -25.771764755249023, "global_step": 362481, "epoch": 4367} {"train_loss": -25.91944694519043, "global_step": 362482, "epoch": 4367} {"train_loss": -26.15079116821289, "global_step": 362483, "epoch": 4367} {"train_loss": -26.43684196472168, "global_step": 362484, "epoch": 4367} {"train_loss": -26.445667266845703, "global_step": 362485, "epoch": 4367} {"train_loss": -25.901105880737305, "global_step": 362486, "epoch": 4367} {"train_loss": -26.2755184173584, "global_step": 362487, "epoch": 4367} {"train_loss": -26.555166244506836, "global_step": 362488, "epoch": 4367} {"train_loss": -26.511432647705078, "global_step": 362489, "epoch": 4367} {"train_loss": -26.532485961914062, "global_step": 362490, "epoch": 4367} {"train_loss": -26.3226261138916, "global_step": 362491, "epoch": 4367} {"train_loss": -26.5250244140625, "global_step": 362492, "epoch": 4367} {"train_loss": -26.397846221923828, "global_step": 362493, "epoch": 4367} {"train_loss": -26.427759170532227, "global_step": 362494, "epoch": 4367} {"train_loss": -26.447345733642578, "global_step": 362495, "epoch": 4367} {"train_loss": -26.507171630859375, "global_step": 362496, "epoch": 4367} {"train_loss": -26.246540069580078, "global_step": 362497, "epoch": 4367} {"train_loss": -26.368412017822266, "global_step": 362498, "epoch": 4367} {"train_loss": -26.587860107421875, "global_step": 362499, "epoch": 4367} {"train_loss": -26.462488174438477, "global_step": 362500, "epoch": 4367} {"train_loss": -26.47355079650879, "global_step": 362501, "epoch": 4367} {"train_loss": -26.82672119140625, "global_step": 362502, "epoch": 4367} {"train_loss": -26.688098907470703, "global_step": 362503, "epoch": 4367} {"train_loss": -26.39451026916504, "global_step": 362504, "epoch": 4367} {"train_loss": -26.460647583007812, "global_step": 362505, "epoch": 4367} {"train_loss": -26.761646270751953, "global_step": 362506, "epoch": 4367} {"train_loss": -26.51795768737793, "global_step": 362507, "epoch": 4367} {"train_loss": -26.1995849609375, "global_step": 362508, "epoch": 4367} {"train_loss": -26.412168502807617, "global_step": 362509, "epoch": 4367} {"train_loss": -26.74822998046875, "global_step": 362510, "epoch": 4367} {"train_loss": -26.0968017578125, "global_step": 362511, "epoch": 4367} {"train_loss": -26.302350997924805, "global_step": 362512, "epoch": 4367} {"train_loss": -26.36249351501465, "global_step": 362513, "epoch": 4367} {"train_loss": -26.40399742126465, "global_step": 362514, "epoch": 4367} {"train_loss": -26.593042373657227, "global_step": 362515, "epoch": 4367} {"train_loss": -25.7939510345459, "global_step": 362516, "epoch": 4367} {"train_loss": -25.29885482788086, "global_step": 362517, "epoch": 4367} {"train_loss": -25.915266036987305, "global_step": 362518, "epoch": 4367} {"train_loss": -26.310583114624023, "global_step": 362519, "epoch": 4367} {"train_loss": -26.053083419799805, "global_step": 362520, "epoch": 4367} {"train_loss": -26.749832153320312, "global_step": 362521, "epoch": 4367} {"train_loss": -26.5834903717041, "global_step": 362522, "epoch": 4367} {"train_loss": -25.789594650268555, "global_step": 362523, "epoch": 4367} {"train_loss": -26.674713134765625, "global_step": 362524, "epoch": 4367} {"train_loss": -25.88397789001465, "global_step": 362525, "epoch": 4367} {"train_loss": -26.236265182495117, "global_step": 362526, "epoch": 4367} {"train_loss": -25.92169761657715, "global_step": 362527, "epoch": 4367} {"train_loss": -26.084142684936523, "global_step": 362528, "epoch": 4367} {"train_loss": -25.95151138305664, "global_step": 362529, "epoch": 4367} {"train_loss": -26.30348014831543, "global_step": 362530, "epoch": 4367} {"train_loss": -26.808151245117188, "global_step": 362531, "epoch": 4367} {"train_loss": -26.26045036315918, "global_step": 362532, "epoch": 4367} {"train_loss": -26.316797256469727, "global_step": 362533, "epoch": 4367} {"train_loss": -26.13907814025879, "global_step": 362534, "epoch": 4367} {"train_loss": -26.448816299438477, "global_step": 362535, "epoch": 4367} {"train_loss": -26.21846580505371, "global_step": 362536, "epoch": 4367} {"train_loss": -26.110586166381836, "global_step": 362537, "epoch": 4367} {"train_loss": -26.33315086364746, "global_step": 362538, "epoch": 4367} {"train_loss": -26.72580909729004, "global_step": 362539, "epoch": 4367} {"train_loss": -26.1298828125, "global_step": 362540, "epoch": 4367} {"train_loss": -26.056934356689453, "global_step": 362541, "epoch": 4367} {"train_loss": -26.429676055908203, "global_step": 362542, "epoch": 4367} {"train_loss": -26.175949832043017, "global_step": 362543, "epoch": 4367, "val_loss": 6558064.0} {"train_loss": -25.88534927368164, "global_step": 362544, "epoch": 4368} {"train_loss": -24.889911651611328, "global_step": 362545, "epoch": 4368} {"train_loss": -24.952957153320312, "global_step": 362546, "epoch": 4368} {"train_loss": -25.888595581054688, "global_step": 362547, "epoch": 4368} {"train_loss": -25.986845016479492, "global_step": 362548, "epoch": 4368} {"train_loss": -25.31317710876465, "global_step": 362549, "epoch": 4368} {"train_loss": -25.690778732299805, "global_step": 362550, "epoch": 4368} {"train_loss": -26.052793502807617, "global_step": 362551, "epoch": 4368} {"train_loss": -25.28582763671875, "global_step": 362552, "epoch": 4368} {"train_loss": -25.717975616455078, "global_step": 362553, "epoch": 4368} {"train_loss": -25.839338302612305, "global_step": 362554, "epoch": 4368} {"train_loss": -26.007184982299805, "global_step": 362555, "epoch": 4368} {"train_loss": -26.114652633666992, "global_step": 362556, "epoch": 4368} {"train_loss": -25.71611976623535, "global_step": 362557, "epoch": 4368} {"train_loss": -25.953821182250977, "global_step": 362558, "epoch": 4368} {"train_loss": -26.14755630493164, "global_step": 362559, "epoch": 4368} {"train_loss": -25.766620635986328, "global_step": 362560, "epoch": 4368} {"train_loss": -26.133472442626953, "global_step": 362561, "epoch": 4368} {"train_loss": -26.081823348999023, "global_step": 362562, "epoch": 4368} {"train_loss": -25.89556884765625, "global_step": 362563, "epoch": 4368} {"train_loss": -25.98841667175293, "global_step": 362564, "epoch": 4368} {"train_loss": -26.139636993408203, "global_step": 362565, "epoch": 4368} {"train_loss": -25.99527931213379, "global_step": 362566, "epoch": 4368} {"train_loss": -26.057886123657227, "global_step": 362567, "epoch": 4368} {"train_loss": -26.228107452392578, "global_step": 362568, "epoch": 4368} {"train_loss": -26.0353946685791, "global_step": 362569, "epoch": 4368} {"train_loss": -26.203073501586914, "global_step": 362570, "epoch": 4368} {"train_loss": -26.2571964263916, "global_step": 362571, "epoch": 4368} {"train_loss": -26.357641220092773, "global_step": 362572, "epoch": 4368} {"train_loss": -26.496152877807617, "global_step": 362573, "epoch": 4368} {"train_loss": -25.93094253540039, "global_step": 362574, "epoch": 4368} {"train_loss": -26.456729888916016, "global_step": 362575, "epoch": 4368} {"train_loss": -26.280996322631836, "global_step": 362576, "epoch": 4368} {"train_loss": -26.826990127563477, "global_step": 362577, "epoch": 4368} {"train_loss": -26.381183624267578, "global_step": 362578, "epoch": 4368} {"train_loss": -26.340229034423828, "global_step": 362579, "epoch": 4368} {"train_loss": -26.25629234313965, "global_step": 362580, "epoch": 4368} {"train_loss": -26.332626342773438, "global_step": 362581, "epoch": 4368} {"train_loss": -26.309295654296875, "global_step": 362582, "epoch": 4368} {"train_loss": -26.233524322509766, "global_step": 362583, "epoch": 4368} {"train_loss": -26.432214736938477, "global_step": 362584, "epoch": 4368} {"train_loss": -26.360151290893555, "global_step": 362585, "epoch": 4368} {"train_loss": -26.66908073425293, "global_step": 362586, "epoch": 4368} {"train_loss": -26.5808048248291, "global_step": 362587, "epoch": 4368} {"train_loss": -26.349903106689453, "global_step": 362588, "epoch": 4368} {"train_loss": -26.530353546142578, "global_step": 362589, "epoch": 4368} {"train_loss": -26.404638290405273, "global_step": 362590, "epoch": 4368} {"train_loss": -26.600341796875, "global_step": 362591, "epoch": 4368} {"train_loss": -26.16620445251465, "global_step": 362592, "epoch": 4368} {"train_loss": -26.507282257080078, "global_step": 362593, "epoch": 4368} {"train_loss": -26.222959518432617, "global_step": 362594, "epoch": 4368} {"train_loss": -26.66462516784668, "global_step": 362595, "epoch": 4368} {"train_loss": -26.173818588256836, "global_step": 362596, "epoch": 4368} {"train_loss": -26.266727447509766, "global_step": 362597, "epoch": 4368} {"train_loss": -26.241870880126953, "global_step": 362598, "epoch": 4368} {"train_loss": -26.553009033203125, "global_step": 362599, "epoch": 4368} {"train_loss": -26.146116256713867, "global_step": 362600, "epoch": 4368} {"train_loss": -26.1881046295166, "global_step": 362601, "epoch": 4368} {"train_loss": -25.752302169799805, "global_step": 362602, "epoch": 4368} {"train_loss": -25.337644577026367, "global_step": 362603, "epoch": 4368} {"train_loss": -24.55306053161621, "global_step": 362604, "epoch": 4368} {"train_loss": -24.412073135375977, "global_step": 362605, "epoch": 4368} {"train_loss": -25.180130004882812, "global_step": 362606, "epoch": 4368} {"train_loss": -26.296192169189453, "global_step": 362607, "epoch": 4368} {"train_loss": -25.484495162963867, "global_step": 362608, "epoch": 4368} {"train_loss": -25.736169815063477, "global_step": 362609, "epoch": 4368} {"train_loss": -25.84503173828125, "global_step": 362610, "epoch": 4368} {"train_loss": -25.6966609954834, "global_step": 362611, "epoch": 4368} {"train_loss": -26.143537521362305, "global_step": 362612, "epoch": 4368} {"train_loss": -26.162918090820312, "global_step": 362613, "epoch": 4368} {"train_loss": -25.923450469970703, "global_step": 362614, "epoch": 4368} {"train_loss": -25.766788482666016, "global_step": 362615, "epoch": 4368} {"train_loss": -25.926740646362305, "global_step": 362616, "epoch": 4368} {"train_loss": -26.024860382080078, "global_step": 362617, "epoch": 4368} {"train_loss": -25.88629150390625, "global_step": 362618, "epoch": 4368} {"train_loss": -26.33747673034668, "global_step": 362619, "epoch": 4368} {"train_loss": -26.0987606048584, "global_step": 362620, "epoch": 4368} {"train_loss": -26.33148765563965, "global_step": 362621, "epoch": 4368} {"train_loss": -26.123998641967773, "global_step": 362622, "epoch": 4368} {"train_loss": -26.22295570373535, "global_step": 362623, "epoch": 4368} {"train_loss": -26.38690757751465, "global_step": 362624, "epoch": 4368} {"train_loss": -26.102048873901367, "global_step": 362625, "epoch": 4368} {"train_loss": -26.039337594825103, "global_step": 362626, "epoch": 4368, "val_loss": 6592199.0} {"train_loss": -25.414403915405273, "global_step": 362627, "epoch": 4369} {"train_loss": -25.59482765197754, "global_step": 362628, "epoch": 4369} {"train_loss": -26.12298583984375, "global_step": 362629, "epoch": 4369} {"train_loss": -25.388334274291992, "global_step": 362630, "epoch": 4369} {"train_loss": -26.198034286499023, "global_step": 362631, "epoch": 4369} {"train_loss": -25.86124038696289, "global_step": 362632, "epoch": 4369} {"train_loss": -25.988452911376953, "global_step": 362633, "epoch": 4369} {"train_loss": -25.92401695251465, "global_step": 362634, "epoch": 4369} {"train_loss": -25.96759605407715, "global_step": 362635, "epoch": 4369} {"train_loss": -25.39564323425293, "global_step": 362636, "epoch": 4369} {"train_loss": -26.046483993530273, "global_step": 362637, "epoch": 4369} {"train_loss": -25.78200340270996, "global_step": 362638, "epoch": 4369} {"train_loss": -26.036054611206055, "global_step": 362639, "epoch": 4369} {"train_loss": -25.700437545776367, "global_step": 362640, "epoch": 4369} {"train_loss": -26.00188636779785, "global_step": 362641, "epoch": 4369} {"train_loss": -25.879724502563477, "global_step": 362642, "epoch": 4369} {"train_loss": -26.306798934936523, "global_step": 362643, "epoch": 4369} {"train_loss": -26.165342330932617, "global_step": 362644, "epoch": 4369} {"train_loss": -26.157873153686523, "global_step": 362645, "epoch": 4369} {"train_loss": -26.24909782409668, "global_step": 362646, "epoch": 4369} {"train_loss": -26.048858642578125, "global_step": 362647, "epoch": 4369} {"train_loss": -25.8923282623291, "global_step": 362648, "epoch": 4369} {"train_loss": -26.523263931274414, "global_step": 362649, "epoch": 4369} {"train_loss": -26.016454696655273, "global_step": 362650, "epoch": 4369} {"train_loss": -26.216903686523438, "global_step": 362651, "epoch": 4369} {"train_loss": -25.975345611572266, "global_step": 362652, "epoch": 4369} {"train_loss": -26.3547306060791, "global_step": 362653, "epoch": 4369} {"train_loss": -26.331409454345703, "global_step": 362654, "epoch": 4369} {"train_loss": -26.377613067626953, "global_step": 362655, "epoch": 4369} {"train_loss": -26.346805572509766, "global_step": 362656, "epoch": 4369} {"train_loss": -26.402240753173828, "global_step": 362657, "epoch": 4369} {"train_loss": -26.3409423828125, "global_step": 362658, "epoch": 4369} {"train_loss": -26.53763771057129, "global_step": 362659, "epoch": 4369} {"train_loss": -26.52359962463379, "global_step": 362660, "epoch": 4369} {"train_loss": -26.939884185791016, "global_step": 362661, "epoch": 4369} {"train_loss": -26.20560073852539, "global_step": 362662, "epoch": 4369} {"train_loss": -26.53822135925293, "global_step": 362663, "epoch": 4369} {"train_loss": -26.445295333862305, "global_step": 362664, "epoch": 4369} {"train_loss": -26.4903564453125, "global_step": 362665, "epoch": 4369} {"train_loss": -26.650800704956055, "global_step": 362666, "epoch": 4369} {"train_loss": -26.37798500061035, "global_step": 362667, "epoch": 4369} {"train_loss": -26.436782836914062, "global_step": 362668, "epoch": 4369} {"train_loss": -26.68332862854004, "global_step": 362669, "epoch": 4369} {"train_loss": -26.519758224487305, "global_step": 362670, "epoch": 4369} {"train_loss": -26.555316925048828, "global_step": 362671, "epoch": 4369} {"train_loss": -26.65968894958496, "global_step": 362672, "epoch": 4369} {"train_loss": -26.546728134155273, "global_step": 362673, "epoch": 4369} {"train_loss": -26.53534507751465, "global_step": 362674, "epoch": 4369} {"train_loss": -26.22238540649414, "global_step": 362675, "epoch": 4369} {"train_loss": -26.136564254760742, "global_step": 362676, "epoch": 4369} {"train_loss": -26.7283878326416, "global_step": 362677, "epoch": 4369} {"train_loss": -26.187902450561523, "global_step": 362678, "epoch": 4369} {"train_loss": -25.760290145874023, "global_step": 362679, "epoch": 4369} {"train_loss": -25.548566818237305, "global_step": 362680, "epoch": 4369} {"train_loss": -25.29007911682129, "global_step": 362681, "epoch": 4369} {"train_loss": -24.121028900146484, "global_step": 362682, "epoch": 4369} {"train_loss": -24.510726928710938, "global_step": 362683, "epoch": 4369} {"train_loss": -25.439992904663086, "global_step": 362684, "epoch": 4369} {"train_loss": -25.85906982421875, "global_step": 362685, "epoch": 4369} {"train_loss": -24.960424423217773, "global_step": 362686, "epoch": 4369} {"train_loss": -25.885772705078125, "global_step": 362687, "epoch": 4369} {"train_loss": -25.92438316345215, "global_step": 362688, "epoch": 4369} {"train_loss": -25.804922103881836, "global_step": 362689, "epoch": 4369} {"train_loss": -25.901248931884766, "global_step": 362690, "epoch": 4369} {"train_loss": -25.8531494140625, "global_step": 362691, "epoch": 4369} {"train_loss": -25.295242309570312, "global_step": 362692, "epoch": 4369} {"train_loss": -26.406097412109375, "global_step": 362693, "epoch": 4369} {"train_loss": -26.081533432006836, "global_step": 362694, "epoch": 4369} {"train_loss": -25.878864288330078, "global_step": 362695, "epoch": 4369} {"train_loss": -26.248437881469727, "global_step": 362696, "epoch": 4369} {"train_loss": -26.276575088500977, "global_step": 362697, "epoch": 4369} {"train_loss": -26.17374038696289, "global_step": 362698, "epoch": 4369} {"train_loss": -26.22039794921875, "global_step": 362699, "epoch": 4369} {"train_loss": -25.975255966186523, "global_step": 362700, "epoch": 4369} {"train_loss": -26.0933895111084, "global_step": 362701, "epoch": 4369} {"train_loss": -26.52085304260254, "global_step": 362702, "epoch": 4369} {"train_loss": -26.32123374938965, "global_step": 362703, "epoch": 4369} {"train_loss": -26.264036178588867, "global_step": 362704, "epoch": 4369} {"train_loss": -26.092878341674805, "global_step": 362705, "epoch": 4369} {"train_loss": -26.275497436523438, "global_step": 362706, "epoch": 4369} {"train_loss": -26.08003044128418, "global_step": 362707, "epoch": 4369} {"train_loss": -26.167652130126953, "global_step": 362708, "epoch": 4369} {"train_loss": -26.07799417426787, "global_step": 362709, "epoch": 4369, "val_loss": 6599390.0} {"train_loss": -25.870763778686523, "global_step": 362710, "epoch": 4370} {"train_loss": -26.22641372680664, "global_step": 362711, "epoch": 4370} {"train_loss": -26.1549072265625, "global_step": 362712, "epoch": 4370} {"train_loss": -26.288000106811523, "global_step": 362713, "epoch": 4370} {"train_loss": -26.200681686401367, "global_step": 362714, "epoch": 4370} {"train_loss": -26.0582218170166, "global_step": 362715, "epoch": 4370} {"train_loss": -25.739898681640625, "global_step": 362716, "epoch": 4370} {"train_loss": -26.019367218017578, "global_step": 362717, "epoch": 4370} {"train_loss": -26.053937911987305, "global_step": 362718, "epoch": 4370} {"train_loss": -26.320602416992188, "global_step": 362719, "epoch": 4370} {"train_loss": -26.211965560913086, "global_step": 362720, "epoch": 4370} {"train_loss": -26.5405216217041, "global_step": 362721, "epoch": 4370} {"train_loss": -26.04890251159668, "global_step": 362722, "epoch": 4370} {"train_loss": -26.272003173828125, "global_step": 362723, "epoch": 4370} {"train_loss": -26.066492080688477, "global_step": 362724, "epoch": 4370} {"train_loss": -26.2208194732666, "global_step": 362725, "epoch": 4370} {"train_loss": -26.619110107421875, "global_step": 362726, "epoch": 4370} {"train_loss": -26.10479736328125, "global_step": 362727, "epoch": 4370} {"train_loss": -26.329254150390625, "global_step": 362728, "epoch": 4370} {"train_loss": -26.395349502563477, "global_step": 362729, "epoch": 4370} {"train_loss": -26.379941940307617, "global_step": 362730, "epoch": 4370} {"train_loss": -26.239355087280273, "global_step": 362731, "epoch": 4370} {"train_loss": -26.251026153564453, "global_step": 362732, "epoch": 4370} {"train_loss": -26.40154457092285, "global_step": 362733, "epoch": 4370} {"train_loss": -26.2326717376709, "global_step": 362734, "epoch": 4370} {"train_loss": -26.408166885375977, "global_step": 362735, "epoch": 4370} {"train_loss": -26.3811092376709, "global_step": 362736, "epoch": 4370} {"train_loss": -26.0759220123291, "global_step": 362737, "epoch": 4370} {"train_loss": -26.291284561157227, "global_step": 362738, "epoch": 4370} {"train_loss": -26.242862701416016, "global_step": 362739, "epoch": 4370} {"train_loss": -26.06658935546875, "global_step": 362740, "epoch": 4370} {"train_loss": -26.483488082885742, "global_step": 362741, "epoch": 4370} {"train_loss": -26.32464599609375, "global_step": 362742, "epoch": 4370} {"train_loss": -26.18190574645996, "global_step": 362743, "epoch": 4370} {"train_loss": -26.29339027404785, "global_step": 362744, "epoch": 4370} {"train_loss": -26.187952041625977, "global_step": 362745, "epoch": 4370} {"train_loss": -26.515033721923828, "global_step": 362746, "epoch": 4370} {"train_loss": -26.560049057006836, "global_step": 362747, "epoch": 4370} {"train_loss": -26.38762855529785, "global_step": 362748, "epoch": 4370} {"train_loss": -26.467193603515625, "global_step": 362749, "epoch": 4370} {"train_loss": -26.319198608398438, "global_step": 362750, "epoch": 4370} {"train_loss": -26.147794723510742, "global_step": 362751, "epoch": 4370} {"train_loss": -26.63986587524414, "global_step": 362752, "epoch": 4370} {"train_loss": -26.62228775024414, "global_step": 362753, "epoch": 4370} {"train_loss": -26.316946029663086, "global_step": 362754, "epoch": 4370} {"train_loss": -26.45570945739746, "global_step": 362755, "epoch": 4370} {"train_loss": -26.80076026916504, "global_step": 362756, "epoch": 4370} {"train_loss": -26.59638023376465, "global_step": 362757, "epoch": 4370} {"train_loss": -26.61451530456543, "global_step": 362758, "epoch": 4370} {"train_loss": -26.119068145751953, "global_step": 362759, "epoch": 4370} {"train_loss": -26.426862716674805, "global_step": 362760, "epoch": 4370} {"train_loss": -26.241718292236328, "global_step": 362761, "epoch": 4370} {"train_loss": -26.444761276245117, "global_step": 362762, "epoch": 4370} {"train_loss": -26.501630783081055, "global_step": 362763, "epoch": 4370} {"train_loss": -26.30897331237793, "global_step": 362764, "epoch": 4370} {"train_loss": -26.185352325439453, "global_step": 362765, "epoch": 4370} {"train_loss": -25.64668846130371, "global_step": 362766, "epoch": 4370} {"train_loss": -26.332416534423828, "global_step": 362767, "epoch": 4370} {"train_loss": -26.220462799072266, "global_step": 362768, "epoch": 4370} {"train_loss": -26.309558868408203, "global_step": 362769, "epoch": 4370} {"train_loss": -26.35269546508789, "global_step": 362770, "epoch": 4370} {"train_loss": -26.457059860229492, "global_step": 362771, "epoch": 4370} {"train_loss": -26.139007568359375, "global_step": 362772, "epoch": 4370} {"train_loss": -26.205785751342773, "global_step": 362773, "epoch": 4370} {"train_loss": -26.639480590820312, "global_step": 362774, "epoch": 4370} {"train_loss": -26.706937789916992, "global_step": 362775, "epoch": 4370} {"train_loss": -26.556486129760742, "global_step": 362776, "epoch": 4370} {"train_loss": -26.39838981628418, "global_step": 362777, "epoch": 4370} {"train_loss": -26.571054458618164, "global_step": 362778, "epoch": 4370} {"train_loss": -26.580968856811523, "global_step": 362779, "epoch": 4370} {"train_loss": -26.1300048828125, "global_step": 362780, "epoch": 4370} {"train_loss": -26.42191505432129, "global_step": 362781, "epoch": 4370} {"train_loss": -26.636255264282227, "global_step": 362782, "epoch": 4370} {"train_loss": -26.55329704284668, "global_step": 362783, "epoch": 4370} {"train_loss": -26.339567184448242, "global_step": 362784, "epoch": 4370} {"train_loss": -26.23609733581543, "global_step": 362785, "epoch": 4370} {"train_loss": -26.5769100189209, "global_step": 362786, "epoch": 4370} {"train_loss": -26.13492202758789, "global_step": 362787, "epoch": 4370} {"train_loss": -26.310522079467773, "global_step": 362788, "epoch": 4370} {"train_loss": -26.5839786529541, "global_step": 362789, "epoch": 4370} {"train_loss": -26.13434410095215, "global_step": 362790, "epoch": 4370} {"train_loss": -26.396942138671875, "global_step": 362791, "epoch": 4370} {"train_loss": -26.31762311544763, "global_step": 362792, "epoch": 4370, "val_loss": 6634855.0} {"train_loss": -24.689002990722656, "global_step": 362793, "epoch": 4371} {"train_loss": -25.111587524414062, "global_step": 362794, "epoch": 4371} {"train_loss": -25.860000610351562, "global_step": 362795, "epoch": 4371} {"train_loss": -25.28426170349121, "global_step": 362796, "epoch": 4371} {"train_loss": -25.4085636138916, "global_step": 362797, "epoch": 4371} {"train_loss": -25.573347091674805, "global_step": 362798, "epoch": 4371} {"train_loss": -26.039886474609375, "global_step": 362799, "epoch": 4371} {"train_loss": -25.705432891845703, "global_step": 362800, "epoch": 4371} {"train_loss": -26.05634880065918, "global_step": 362801, "epoch": 4371} {"train_loss": -26.04721450805664, "global_step": 362802, "epoch": 4371} {"train_loss": -25.820470809936523, "global_step": 362803, "epoch": 4371} {"train_loss": -25.91119956970215, "global_step": 362804, "epoch": 4371} {"train_loss": -26.02300453186035, "global_step": 362805, "epoch": 4371} {"train_loss": -25.90412712097168, "global_step": 362806, "epoch": 4371} {"train_loss": -25.853818893432617, "global_step": 362807, "epoch": 4371} {"train_loss": -25.85560417175293, "global_step": 362808, "epoch": 4371} {"train_loss": -26.118331909179688, "global_step": 362809, "epoch": 4371} {"train_loss": -26.004169464111328, "global_step": 362810, "epoch": 4371} {"train_loss": -26.4397029876709, "global_step": 362811, "epoch": 4371} {"train_loss": -25.949430465698242, "global_step": 362812, "epoch": 4371} {"train_loss": -25.962682723999023, "global_step": 362813, "epoch": 4371} {"train_loss": -26.049570083618164, "global_step": 362814, "epoch": 4371} {"train_loss": -26.098031997680664, "global_step": 362815, "epoch": 4371} {"train_loss": -26.250385284423828, "global_step": 362816, "epoch": 4371} {"train_loss": -25.851734161376953, "global_step": 362817, "epoch": 4371} {"train_loss": -26.4196720123291, "global_step": 362818, "epoch": 4371} {"train_loss": -25.845413208007812, "global_step": 362819, "epoch": 4371} {"train_loss": -26.0336856842041, "global_step": 362820, "epoch": 4371} {"train_loss": -26.143518447875977, "global_step": 362821, "epoch": 4371} {"train_loss": -26.574216842651367, "global_step": 362822, "epoch": 4371} {"train_loss": -25.856103897094727, "global_step": 362823, "epoch": 4371} {"train_loss": -26.515512466430664, "global_step": 362824, "epoch": 4371} {"train_loss": -26.249479293823242, "global_step": 362825, "epoch": 4371} {"train_loss": -26.431562423706055, "global_step": 362826, "epoch": 4371} {"train_loss": -25.95578384399414, "global_step": 362827, "epoch": 4371} {"train_loss": -26.31319236755371, "global_step": 362828, "epoch": 4371} {"train_loss": -25.78565788269043, "global_step": 362829, "epoch": 4371} {"train_loss": -26.510578155517578, "global_step": 362830, "epoch": 4371} {"train_loss": -26.43560791015625, "global_step": 362831, "epoch": 4371} {"train_loss": -26.525394439697266, "global_step": 362832, "epoch": 4371} {"train_loss": -26.24200439453125, "global_step": 362833, "epoch": 4371} {"train_loss": -26.166187286376953, "global_step": 362834, "epoch": 4371} {"train_loss": -26.17982292175293, "global_step": 362835, "epoch": 4371} {"train_loss": -26.00213623046875, "global_step": 362836, "epoch": 4371} {"train_loss": -26.292938232421875, "global_step": 362837, "epoch": 4371} {"train_loss": -26.396581649780273, "global_step": 362838, "epoch": 4371} {"train_loss": -26.193878173828125, "global_step": 362839, "epoch": 4371} {"train_loss": -26.596271514892578, "global_step": 362840, "epoch": 4371} {"train_loss": -26.433279037475586, "global_step": 362841, "epoch": 4371} {"train_loss": -26.43049430847168, "global_step": 362842, "epoch": 4371} {"train_loss": -26.183897018432617, "global_step": 362843, "epoch": 4371} {"train_loss": -26.55535888671875, "global_step": 362844, "epoch": 4371} {"train_loss": -26.39801597595215, "global_step": 362845, "epoch": 4371} {"train_loss": -26.34173011779785, "global_step": 362846, "epoch": 4371} {"train_loss": -26.324859619140625, "global_step": 362847, "epoch": 4371} {"train_loss": -26.158370971679688, "global_step": 362848, "epoch": 4371} {"train_loss": -26.510969161987305, "global_step": 362849, "epoch": 4371} {"train_loss": -26.535303115844727, "global_step": 362850, "epoch": 4371} {"train_loss": -26.408727645874023, "global_step": 362851, "epoch": 4371} {"train_loss": -26.278430938720703, "global_step": 362852, "epoch": 4371} {"train_loss": -26.046253204345703, "global_step": 362853, "epoch": 4371} {"train_loss": -26.357227325439453, "global_step": 362854, "epoch": 4371} {"train_loss": -26.224533081054688, "global_step": 362855, "epoch": 4371} {"train_loss": -26.6839656829834, "global_step": 362856, "epoch": 4371} {"train_loss": -26.419464111328125, "global_step": 362857, "epoch": 4371} {"train_loss": -26.134519577026367, "global_step": 362858, "epoch": 4371} {"train_loss": -26.2896785736084, "global_step": 362859, "epoch": 4371} {"train_loss": -26.18340492248535, "global_step": 362860, "epoch": 4371} {"train_loss": -26.30179786682129, "global_step": 362861, "epoch": 4371} {"train_loss": -26.4061336517334, "global_step": 362862, "epoch": 4371} {"train_loss": -26.523590087890625, "global_step": 362863, "epoch": 4371} {"train_loss": -26.12091064453125, "global_step": 362864, "epoch": 4371} {"train_loss": -26.286453247070312, "global_step": 362865, "epoch": 4371} {"train_loss": -25.99867057800293, "global_step": 362866, "epoch": 4371} {"train_loss": -26.593503952026367, "global_step": 362867, "epoch": 4371} {"train_loss": -26.027006149291992, "global_step": 362868, "epoch": 4371} {"train_loss": -26.07025146484375, "global_step": 362869, "epoch": 4371} {"train_loss": -26.355539321899414, "global_step": 362870, "epoch": 4371} {"train_loss": -26.456212997436523, "global_step": 362871, "epoch": 4371} {"train_loss": -26.304590225219727, "global_step": 362872, "epoch": 4371} {"train_loss": -26.13065528869629, "global_step": 362873, "epoch": 4371} {"train_loss": -26.3636417388916, "global_step": 362874, "epoch": 4371} {"train_loss": -26.165372113147413, "global_step": 362875, "epoch": 4371, "val_loss": 6627325.5} {"train_loss": -25.95344352722168, "global_step": 362876, "epoch": 4372} {"train_loss": -25.942691802978516, "global_step": 362877, "epoch": 4372} {"train_loss": -26.044483184814453, "global_step": 362878, "epoch": 4372} {"train_loss": -25.983692169189453, "global_step": 362879, "epoch": 4372} {"train_loss": -25.521671295166016, "global_step": 362880, "epoch": 4372} {"train_loss": -26.18006706237793, "global_step": 362881, "epoch": 4372} {"train_loss": -25.963031768798828, "global_step": 362882, "epoch": 4372} {"train_loss": -25.932804107666016, "global_step": 362883, "epoch": 4372} {"train_loss": -25.91131591796875, "global_step": 362884, "epoch": 4372} {"train_loss": -25.884963989257812, "global_step": 362885, "epoch": 4372} {"train_loss": -25.895109176635742, "global_step": 362886, "epoch": 4372} {"train_loss": -25.926435470581055, "global_step": 362887, "epoch": 4372} {"train_loss": -26.088048934936523, "global_step": 362888, "epoch": 4372} {"train_loss": -26.115753173828125, "global_step": 362889, "epoch": 4372} {"train_loss": -25.601526260375977, "global_step": 362890, "epoch": 4372} {"train_loss": -25.99720573425293, "global_step": 362891, "epoch": 4372} {"train_loss": -25.479177474975586, "global_step": 362892, "epoch": 4372} {"train_loss": -26.209217071533203, "global_step": 362893, "epoch": 4372} {"train_loss": -25.608518600463867, "global_step": 362894, "epoch": 4372} {"train_loss": -25.714752197265625, "global_step": 362895, "epoch": 4372} {"train_loss": -26.157094955444336, "global_step": 362896, "epoch": 4372} {"train_loss": -26.3337459564209, "global_step": 362897, "epoch": 4372} {"train_loss": -26.426990509033203, "global_step": 362898, "epoch": 4372} {"train_loss": -25.944446563720703, "global_step": 362899, "epoch": 4372} {"train_loss": -26.40689468383789, "global_step": 362900, "epoch": 4372} {"train_loss": -25.797611236572266, "global_step": 362901, "epoch": 4372} {"train_loss": -26.355548858642578, "global_step": 362902, "epoch": 4372} {"train_loss": -26.400388717651367, "global_step": 362903, "epoch": 4372} {"train_loss": -26.148914337158203, "global_step": 362904, "epoch": 4372} {"train_loss": -26.241689682006836, "global_step": 362905, "epoch": 4372} {"train_loss": -26.486780166625977, "global_step": 362906, "epoch": 4372} {"train_loss": -26.262393951416016, "global_step": 362907, "epoch": 4372} {"train_loss": -26.382068634033203, "global_step": 362908, "epoch": 4372} {"train_loss": -26.320505142211914, "global_step": 362909, "epoch": 4372} {"train_loss": -26.29779624938965, "global_step": 362910, "epoch": 4372} {"train_loss": -26.537084579467773, "global_step": 362911, "epoch": 4372} {"train_loss": -26.04351234436035, "global_step": 362912, "epoch": 4372} {"train_loss": -26.17634391784668, "global_step": 362913, "epoch": 4372} {"train_loss": -26.44297218322754, "global_step": 362914, "epoch": 4372} {"train_loss": -26.518823623657227, "global_step": 362915, "epoch": 4372} {"train_loss": -26.622241973876953, "global_step": 362916, "epoch": 4372} {"train_loss": -26.459989547729492, "global_step": 362917, "epoch": 4372} {"train_loss": -26.67557144165039, "global_step": 362918, "epoch": 4372} {"train_loss": -26.419782638549805, "global_step": 362919, "epoch": 4372} {"train_loss": -26.355213165283203, "global_step": 362920, "epoch": 4372} {"train_loss": -26.210281372070312, "global_step": 362921, "epoch": 4372} {"train_loss": -26.376998901367188, "global_step": 362922, "epoch": 4372} {"train_loss": -26.2547664642334, "global_step": 362923, "epoch": 4372} {"train_loss": -26.471311569213867, "global_step": 362924, "epoch": 4372} {"train_loss": -26.3609619140625, "global_step": 362925, "epoch": 4372} {"train_loss": -26.495100021362305, "global_step": 362926, "epoch": 4372} {"train_loss": -26.472354888916016, "global_step": 362927, "epoch": 4372} {"train_loss": -26.18475914001465, "global_step": 362928, "epoch": 4372} {"train_loss": -26.40827751159668, "global_step": 362929, "epoch": 4372} {"train_loss": -26.762372970581055, "global_step": 362930, "epoch": 4372} {"train_loss": -26.493513107299805, "global_step": 362931, "epoch": 4372} {"train_loss": -26.442697525024414, "global_step": 362932, "epoch": 4372} {"train_loss": -26.687829971313477, "global_step": 362933, "epoch": 4372} {"train_loss": -26.163095474243164, "global_step": 362934, "epoch": 4372} {"train_loss": -26.1781063079834, "global_step": 362935, "epoch": 4372} {"train_loss": -26.28655433654785, "global_step": 362936, "epoch": 4372} {"train_loss": -26.216156005859375, "global_step": 362937, "epoch": 4372} {"train_loss": -26.07756996154785, "global_step": 362938, "epoch": 4372} {"train_loss": -26.285200119018555, "global_step": 362939, "epoch": 4372} {"train_loss": -26.086353302001953, "global_step": 362940, "epoch": 4372} {"train_loss": -26.12983512878418, "global_step": 362941, "epoch": 4372} {"train_loss": -25.935791015625, "global_step": 362942, "epoch": 4372} {"train_loss": -25.7048282623291, "global_step": 362943, "epoch": 4372} {"train_loss": -25.8752498626709, "global_step": 362944, "epoch": 4372} {"train_loss": -26.727737426757812, "global_step": 362945, "epoch": 4372} {"train_loss": -26.013824462890625, "global_step": 362946, "epoch": 4372} {"train_loss": -26.095855712890625, "global_step": 362947, "epoch": 4372} {"train_loss": -26.194229125976562, "global_step": 362948, "epoch": 4372} {"train_loss": -26.308837890625, "global_step": 362949, "epoch": 4372} {"train_loss": -26.12640380859375, "global_step": 362950, "epoch": 4372} {"train_loss": -26.20650291442871, "global_step": 362951, "epoch": 4372} {"train_loss": -26.022064208984375, "global_step": 362952, "epoch": 4372} {"train_loss": -26.349185943603516, "global_step": 362953, "epoch": 4372} {"train_loss": -26.384387969970703, "global_step": 362954, "epoch": 4372} {"train_loss": -26.235828399658203, "global_step": 362955, "epoch": 4372} {"train_loss": -26.365156173706055, "global_step": 362956, "epoch": 4372} {"train_loss": -25.9290828704834, "global_step": 362957, "epoch": 4372} {"train_loss": -26.21470387010689, "global_step": 362958, "epoch": 4372, "val_loss": 6624455.0} {"train_loss": -25.61602210998535, "global_step": 362959, "epoch": 4373} {"train_loss": -26.02880859375, "global_step": 362960, "epoch": 4373} {"train_loss": -25.998188018798828, "global_step": 362961, "epoch": 4373} {"train_loss": -25.61240577697754, "global_step": 362962, "epoch": 4373} {"train_loss": -25.8225154876709, "global_step": 362963, "epoch": 4373} {"train_loss": -25.693115234375, "global_step": 362964, "epoch": 4373} {"train_loss": -25.94012451171875, "global_step": 362965, "epoch": 4373} {"train_loss": -25.928451538085938, "global_step": 362966, "epoch": 4373} {"train_loss": -26.08307456970215, "global_step": 362967, "epoch": 4373} {"train_loss": -25.834854125976562, "global_step": 362968, "epoch": 4373} {"train_loss": -25.947744369506836, "global_step": 362969, "epoch": 4373} {"train_loss": -25.896087646484375, "global_step": 362970, "epoch": 4373} {"train_loss": -25.9666805267334, "global_step": 362971, "epoch": 4373} {"train_loss": -25.854907989501953, "global_step": 362972, "epoch": 4373} {"train_loss": -25.84218406677246, "global_step": 362973, "epoch": 4373} {"train_loss": -26.119482040405273, "global_step": 362974, "epoch": 4373} {"train_loss": -26.027774810791016, "global_step": 362975, "epoch": 4373} {"train_loss": -26.20253562927246, "global_step": 362976, "epoch": 4373} {"train_loss": -26.106403350830078, "global_step": 362977, "epoch": 4373} {"train_loss": -26.18255615234375, "global_step": 362978, "epoch": 4373} {"train_loss": -26.00013542175293, "global_step": 362979, "epoch": 4373} {"train_loss": -26.081384658813477, "global_step": 362980, "epoch": 4373} {"train_loss": -26.644012451171875, "global_step": 362981, "epoch": 4373} {"train_loss": -26.059921264648438, "global_step": 362982, "epoch": 4373} {"train_loss": -26.45358657836914, "global_step": 362983, "epoch": 4373} {"train_loss": -26.16181755065918, "global_step": 362984, "epoch": 4373} {"train_loss": -26.088708877563477, "global_step": 362985, "epoch": 4373} {"train_loss": -26.23404884338379, "global_step": 362986, "epoch": 4373} {"train_loss": -26.074499130249023, "global_step": 362987, "epoch": 4373} {"train_loss": -26.392919540405273, "global_step": 362988, "epoch": 4373} {"train_loss": -26.270023345947266, "global_step": 362989, "epoch": 4373} {"train_loss": -26.0429744720459, "global_step": 362990, "epoch": 4373} {"train_loss": -26.22589111328125, "global_step": 362991, "epoch": 4373} {"train_loss": -26.143310546875, "global_step": 362992, "epoch": 4373} {"train_loss": -26.36910057067871, "global_step": 362993, "epoch": 4373} {"train_loss": -26.310470581054688, "global_step": 362994, "epoch": 4373} {"train_loss": -26.235031127929688, "global_step": 362995, "epoch": 4373} {"train_loss": -26.421659469604492, "global_step": 362996, "epoch": 4373} {"train_loss": -26.461597442626953, "global_step": 362997, "epoch": 4373} {"train_loss": -26.51470375061035, "global_step": 362998, "epoch": 4373} {"train_loss": -26.266937255859375, "global_step": 362999, "epoch": 4373} {"train_loss": -26.403669357299805, "global_step": 363000, "epoch": 4373} {"train_loss": -26.589075088500977, "global_step": 363001, "epoch": 4373} {"train_loss": -26.23453712463379, "global_step": 363002, "epoch": 4373} {"train_loss": -26.48360252380371, "global_step": 363003, "epoch": 4373} {"train_loss": -26.415985107421875, "global_step": 363004, "epoch": 4373} {"train_loss": -26.526111602783203, "global_step": 363005, "epoch": 4373} {"train_loss": -26.355894088745117, "global_step": 363006, "epoch": 4373} {"train_loss": -25.856647491455078, "global_step": 363007, "epoch": 4373} {"train_loss": -26.102514266967773, "global_step": 363008, "epoch": 4373} {"train_loss": -26.38822364807129, "global_step": 363009, "epoch": 4373} {"train_loss": -26.199934005737305, "global_step": 363010, "epoch": 4373} {"train_loss": -26.49555015563965, "global_step": 363011, "epoch": 4373} {"train_loss": -26.096206665039062, "global_step": 363012, "epoch": 4373} {"train_loss": -26.21160888671875, "global_step": 363013, "epoch": 4373} {"train_loss": -26.315475463867188, "global_step": 363014, "epoch": 4373} {"train_loss": -26.465240478515625, "global_step": 363015, "epoch": 4373} {"train_loss": -26.832067489624023, "global_step": 363016, "epoch": 4373} {"train_loss": -26.091094970703125, "global_step": 363017, "epoch": 4373} {"train_loss": -26.153263092041016, "global_step": 363018, "epoch": 4373} {"train_loss": -26.17354393005371, "global_step": 363019, "epoch": 4373} {"train_loss": -26.129791259765625, "global_step": 363020, "epoch": 4373} {"train_loss": -26.135889053344727, "global_step": 363021, "epoch": 4373} {"train_loss": -26.4534912109375, "global_step": 363022, "epoch": 4373} {"train_loss": -26.46964454650879, "global_step": 363023, "epoch": 4373} {"train_loss": -26.390155792236328, "global_step": 363024, "epoch": 4373} {"train_loss": -26.277664184570312, "global_step": 363025, "epoch": 4373} {"train_loss": -26.0433406829834, "global_step": 363026, "epoch": 4373} {"train_loss": -26.311023712158203, "global_step": 363027, "epoch": 4373} {"train_loss": -26.444726943969727, "global_step": 363028, "epoch": 4373} {"train_loss": -26.5473575592041, "global_step": 363029, "epoch": 4373} {"train_loss": -26.29803466796875, "global_step": 363030, "epoch": 4373} {"train_loss": -25.849628448486328, "global_step": 363031, "epoch": 4373} {"train_loss": -26.37981605529785, "global_step": 363032, "epoch": 4373} {"train_loss": -25.878528594970703, "global_step": 363033, "epoch": 4373} {"train_loss": -26.473438262939453, "global_step": 363034, "epoch": 4373} {"train_loss": -26.017663955688477, "global_step": 363035, "epoch": 4373} {"train_loss": -26.425336837768555, "global_step": 363036, "epoch": 4373} {"train_loss": -26.54657554626465, "global_step": 363037, "epoch": 4373} {"train_loss": -26.156753540039062, "global_step": 363038, "epoch": 4373} {"train_loss": -26.63384437561035, "global_step": 363039, "epoch": 4373} {"train_loss": -26.664915084838867, "global_step": 363040, "epoch": 4373} {"train_loss": -26.22037841613034, "global_step": 363041, "epoch": 4373, "val_loss": 6546070.5} {"train_loss": -25.325881958007812, "global_step": 363042, "epoch": 4374} {"train_loss": -25.295846939086914, "global_step": 363043, "epoch": 4374} {"train_loss": -25.504484176635742, "global_step": 363044, "epoch": 4374} {"train_loss": -25.482452392578125, "global_step": 363045, "epoch": 4374} {"train_loss": -25.61370849609375, "global_step": 363046, "epoch": 4374} {"train_loss": -26.055124282836914, "global_step": 363047, "epoch": 4374} {"train_loss": -25.719236373901367, "global_step": 363048, "epoch": 4374} {"train_loss": -25.011049270629883, "global_step": 363049, "epoch": 4374} {"train_loss": -26.005390167236328, "global_step": 363050, "epoch": 4374} {"train_loss": -25.782392501831055, "global_step": 363051, "epoch": 4374} {"train_loss": -25.537839889526367, "global_step": 363052, "epoch": 4374} {"train_loss": -26.157621383666992, "global_step": 363053, "epoch": 4374} {"train_loss": -25.502553939819336, "global_step": 363054, "epoch": 4374} {"train_loss": -26.02192497253418, "global_step": 363055, "epoch": 4374} {"train_loss": -25.850332260131836, "global_step": 363056, "epoch": 4374} {"train_loss": -25.742883682250977, "global_step": 363057, "epoch": 4374} {"train_loss": -26.034162521362305, "global_step": 363058, "epoch": 4374} {"train_loss": -26.011743545532227, "global_step": 363059, "epoch": 4374} {"train_loss": -26.222497940063477, "global_step": 363060, "epoch": 4374} {"train_loss": -25.66029167175293, "global_step": 363061, "epoch": 4374} {"train_loss": -25.926227569580078, "global_step": 363062, "epoch": 4374} {"train_loss": -26.0567626953125, "global_step": 363063, "epoch": 4374} {"train_loss": -25.9945068359375, "global_step": 363064, "epoch": 4374} {"train_loss": -25.44081687927246, "global_step": 363065, "epoch": 4374} {"train_loss": -26.176794052124023, "global_step": 363066, "epoch": 4374} {"train_loss": -26.296167373657227, "global_step": 363067, "epoch": 4374} {"train_loss": -26.348876953125, "global_step": 363068, "epoch": 4374} {"train_loss": -26.089597702026367, "global_step": 363069, "epoch": 4374} {"train_loss": -26.075475692749023, "global_step": 363070, "epoch": 4374} {"train_loss": -25.82929039001465, "global_step": 363071, "epoch": 4374} {"train_loss": -25.743860244750977, "global_step": 363072, "epoch": 4374} {"train_loss": -25.9976806640625, "global_step": 363073, "epoch": 4374} {"train_loss": -26.173852920532227, "global_step": 363074, "epoch": 4374} {"train_loss": -26.251184463500977, "global_step": 363075, "epoch": 4374} {"train_loss": -26.125961303710938, "global_step": 363076, "epoch": 4374} {"train_loss": -25.952978134155273, "global_step": 363077, "epoch": 4374} {"train_loss": -26.423803329467773, "global_step": 363078, "epoch": 4374} {"train_loss": -26.15576171875, "global_step": 363079, "epoch": 4374} {"train_loss": -26.424081802368164, "global_step": 363080, "epoch": 4374} {"train_loss": -26.4210147857666, "global_step": 363081, "epoch": 4374} {"train_loss": -26.647451400756836, "global_step": 363082, "epoch": 4374} {"train_loss": -26.417999267578125, "global_step": 363083, "epoch": 4374} {"train_loss": -26.26509666442871, "global_step": 363084, "epoch": 4374} {"train_loss": -26.49263572692871, "global_step": 363085, "epoch": 4374} {"train_loss": -26.520471572875977, "global_step": 363086, "epoch": 4374} {"train_loss": -26.393985748291016, "global_step": 363087, "epoch": 4374} {"train_loss": -26.58595085144043, "global_step": 363088, "epoch": 4374} {"train_loss": -26.06979751586914, "global_step": 363089, "epoch": 4374} {"train_loss": -26.647674560546875, "global_step": 363090, "epoch": 4374} {"train_loss": -26.364789962768555, "global_step": 363091, "epoch": 4374} {"train_loss": -26.438024520874023, "global_step": 363092, "epoch": 4374} {"train_loss": -26.338134765625, "global_step": 363093, "epoch": 4374} {"train_loss": -26.66792106628418, "global_step": 363094, "epoch": 4374} {"train_loss": -26.675073623657227, "global_step": 363095, "epoch": 4374} {"train_loss": -26.579980850219727, "global_step": 363096, "epoch": 4374} {"train_loss": -26.40350341796875, "global_step": 363097, "epoch": 4374} {"train_loss": -26.521604537963867, "global_step": 363098, "epoch": 4374} {"train_loss": -26.5209903717041, "global_step": 363099, "epoch": 4374} {"train_loss": -26.6516056060791, "global_step": 363100, "epoch": 4374} {"train_loss": -26.631195068359375, "global_step": 363101, "epoch": 4374} {"train_loss": -26.050939559936523, "global_step": 363102, "epoch": 4374} {"train_loss": -26.23046875, "global_step": 363103, "epoch": 4374} {"train_loss": -26.165700912475586, "global_step": 363104, "epoch": 4374} {"train_loss": -26.797285079956055, "global_step": 363105, "epoch": 4374} {"train_loss": -26.536197662353516, "global_step": 363106, "epoch": 4374} {"train_loss": -26.5301456451416, "global_step": 363107, "epoch": 4374} {"train_loss": -26.26056480407715, "global_step": 363108, "epoch": 4374} {"train_loss": -26.021406173706055, "global_step": 363109, "epoch": 4374} {"train_loss": -26.384113311767578, "global_step": 363110, "epoch": 4374} {"train_loss": -26.79973793029785, "global_step": 363111, "epoch": 4374} {"train_loss": -26.249906539916992, "global_step": 363112, "epoch": 4374} {"train_loss": -26.384967803955078, "global_step": 363113, "epoch": 4374} {"train_loss": -26.35322380065918, "global_step": 363114, "epoch": 4374} {"train_loss": -26.479583740234375, "global_step": 363115, "epoch": 4374} {"train_loss": -26.05010986328125, "global_step": 363116, "epoch": 4374} {"train_loss": -26.508544921875, "global_step": 363117, "epoch": 4374} {"train_loss": -26.497587203979492, "global_step": 363118, "epoch": 4374} {"train_loss": -26.224761962890625, "global_step": 363119, "epoch": 4374} {"train_loss": -26.576801300048828, "global_step": 363120, "epoch": 4374} {"train_loss": -26.357446670532227, "global_step": 363121, "epoch": 4374} {"train_loss": -26.014301300048828, "global_step": 363122, "epoch": 4374} {"train_loss": -26.224714279174805, "global_step": 363123, "epoch": 4374} {"train_loss": -26.17087274574372, "global_step": 363124, "epoch": 4374, "val_loss": 6558461.0} {"train_loss": -25.954776763916016, "global_step": 363125, "epoch": 4375} {"train_loss": -26.13327407836914, "global_step": 363126, "epoch": 4375} {"train_loss": -25.722166061401367, "global_step": 363127, "epoch": 4375} {"train_loss": -25.968570709228516, "global_step": 363128, "epoch": 4375} {"train_loss": -26.255517959594727, "global_step": 363129, "epoch": 4375} {"train_loss": -25.950525283813477, "global_step": 363130, "epoch": 4375} {"train_loss": -26.217023849487305, "global_step": 363131, "epoch": 4375} {"train_loss": -26.390533447265625, "global_step": 363132, "epoch": 4375} {"train_loss": -26.311023712158203, "global_step": 363133, "epoch": 4375} {"train_loss": -26.33230972290039, "global_step": 363134, "epoch": 4375} {"train_loss": -26.27004051208496, "global_step": 363135, "epoch": 4375} {"train_loss": -26.039432525634766, "global_step": 363136, "epoch": 4375} {"train_loss": -25.864065170288086, "global_step": 363137, "epoch": 4375} {"train_loss": -26.134521484375, "global_step": 363138, "epoch": 4375} {"train_loss": -26.09653663635254, "global_step": 363139, "epoch": 4375} {"train_loss": -26.07703971862793, "global_step": 363140, "epoch": 4375} {"train_loss": -26.361408233642578, "global_step": 363141, "epoch": 4375} {"train_loss": -26.195911407470703, "global_step": 363142, "epoch": 4375} {"train_loss": -26.006210327148438, "global_step": 363143, "epoch": 4375} {"train_loss": -26.217588424682617, "global_step": 363144, "epoch": 4375} {"train_loss": -26.361743927001953, "global_step": 363145, "epoch": 4375} {"train_loss": -26.334365844726562, "global_step": 363146, "epoch": 4375} {"train_loss": -25.83411979675293, "global_step": 363147, "epoch": 4375} {"train_loss": -26.191757202148438, "global_step": 363148, "epoch": 4375} {"train_loss": -26.91876792907715, "global_step": 363149, "epoch": 4375} {"train_loss": -26.38815689086914, "global_step": 363150, "epoch": 4375} {"train_loss": -26.245849609375, "global_step": 363151, "epoch": 4375} {"train_loss": -26.2294864654541, "global_step": 363152, "epoch": 4375} {"train_loss": -26.06429100036621, "global_step": 363153, "epoch": 4375} {"train_loss": -26.44895362854004, "global_step": 363154, "epoch": 4375} {"train_loss": -26.690412521362305, "global_step": 363155, "epoch": 4375} {"train_loss": -26.381139755249023, "global_step": 363156, "epoch": 4375} {"train_loss": -26.536029815673828, "global_step": 363157, "epoch": 4375} {"train_loss": -26.33686637878418, "global_step": 363158, "epoch": 4375} {"train_loss": -26.601186752319336, "global_step": 363159, "epoch": 4375} {"train_loss": -26.068166732788086, "global_step": 363160, "epoch": 4375} {"train_loss": -26.51715087890625, "global_step": 363161, "epoch": 4375} {"train_loss": -26.193517684936523, "global_step": 363162, "epoch": 4375} {"train_loss": -26.60910987854004, "global_step": 363163, "epoch": 4375} {"train_loss": -26.41175651550293, "global_step": 363164, "epoch": 4375} {"train_loss": -26.241254806518555, "global_step": 363165, "epoch": 4375} {"train_loss": -26.119171142578125, "global_step": 363166, "epoch": 4375} {"train_loss": -26.18577003479004, "global_step": 363167, "epoch": 4375} {"train_loss": -26.08509635925293, "global_step": 363168, "epoch": 4375} {"train_loss": -26.47480583190918, "global_step": 363169, "epoch": 4375} {"train_loss": -26.820043563842773, "global_step": 363170, "epoch": 4375} {"train_loss": -26.1058349609375, "global_step": 363171, "epoch": 4375} {"train_loss": -26.5412540435791, "global_step": 363172, "epoch": 4375} {"train_loss": -26.481403350830078, "global_step": 363173, "epoch": 4375} {"train_loss": -26.45046043395996, "global_step": 363174, "epoch": 4375} {"train_loss": -26.542402267456055, "global_step": 363175, "epoch": 4375} {"train_loss": -26.376474380493164, "global_step": 363176, "epoch": 4375} {"train_loss": -26.35337257385254, "global_step": 363177, "epoch": 4375} {"train_loss": -26.10784912109375, "global_step": 363178, "epoch": 4375} {"train_loss": -25.53377342224121, "global_step": 363179, "epoch": 4375} {"train_loss": -25.485807418823242, "global_step": 363180, "epoch": 4375} {"train_loss": -25.691675186157227, "global_step": 363181, "epoch": 4375} {"train_loss": -26.1230411529541, "global_step": 363182, "epoch": 4375} {"train_loss": -26.038440704345703, "global_step": 363183, "epoch": 4375} {"train_loss": -26.10430335998535, "global_step": 363184, "epoch": 4375} {"train_loss": -25.979284286499023, "global_step": 363185, "epoch": 4375} {"train_loss": -26.116092681884766, "global_step": 363186, "epoch": 4375} {"train_loss": -26.24020767211914, "global_step": 363187, "epoch": 4375} {"train_loss": -26.461923599243164, "global_step": 363188, "epoch": 4375} {"train_loss": -26.215423583984375, "global_step": 363189, "epoch": 4375} {"train_loss": -25.94879150390625, "global_step": 363190, "epoch": 4375} {"train_loss": -26.032270431518555, "global_step": 363191, "epoch": 4375} {"train_loss": -26.162841796875, "global_step": 363192, "epoch": 4375} {"train_loss": -26.190778732299805, "global_step": 363193, "epoch": 4375} {"train_loss": -26.055801391601562, "global_step": 363194, "epoch": 4375} {"train_loss": -26.532276153564453, "global_step": 363195, "epoch": 4375} {"train_loss": -26.620391845703125, "global_step": 363196, "epoch": 4375} {"train_loss": -26.209909439086914, "global_step": 363197, "epoch": 4375} {"train_loss": -25.94379234313965, "global_step": 363198, "epoch": 4375} {"train_loss": -26.52276611328125, "global_step": 363199, "epoch": 4375} {"train_loss": -26.01703453063965, "global_step": 363200, "epoch": 4375} {"train_loss": -25.94110107421875, "global_step": 363201, "epoch": 4375} {"train_loss": -25.98175621032715, "global_step": 363202, "epoch": 4375} {"train_loss": -26.496662139892578, "global_step": 363203, "epoch": 4375} {"train_loss": -26.332990646362305, "global_step": 363204, "epoch": 4375} {"train_loss": -26.495960235595703, "global_step": 363205, "epoch": 4375} {"train_loss": -25.945804595947266, "global_step": 363206, "epoch": 4375} {"train_loss": -26.242215099104914, "global_step": 363207, "epoch": 4375, "val_loss": 6658732.5} {"train_loss": -25.545705795288086, "global_step": 363208, "epoch": 4376} {"train_loss": -25.181119918823242, "global_step": 363209, "epoch": 4376} {"train_loss": -25.19072914123535, "global_step": 363210, "epoch": 4376} {"train_loss": -25.46784782409668, "global_step": 363211, "epoch": 4376} {"train_loss": -25.747573852539062, "global_step": 363212, "epoch": 4376} {"train_loss": -25.28019905090332, "global_step": 363213, "epoch": 4376} {"train_loss": -25.551225662231445, "global_step": 363214, "epoch": 4376} {"train_loss": -25.978809356689453, "global_step": 363215, "epoch": 4376} {"train_loss": -25.83473014831543, "global_step": 363216, "epoch": 4376} {"train_loss": -26.02630615234375, "global_step": 363217, "epoch": 4376} {"train_loss": -25.963623046875, "global_step": 363218, "epoch": 4376} {"train_loss": -25.869373321533203, "global_step": 363219, "epoch": 4376} {"train_loss": -25.784534454345703, "global_step": 363220, "epoch": 4376} {"train_loss": -25.783649444580078, "global_step": 363221, "epoch": 4376} {"train_loss": -25.703845977783203, "global_step": 363222, "epoch": 4376} {"train_loss": -25.117252349853516, "global_step": 363223, "epoch": 4376} {"train_loss": -26.0753116607666, "global_step": 363224, "epoch": 4376} {"train_loss": -26.18128776550293, "global_step": 363225, "epoch": 4376} {"train_loss": -25.763202667236328, "global_step": 363226, "epoch": 4376} {"train_loss": -25.986316680908203, "global_step": 363227, "epoch": 4376} {"train_loss": -26.0389461517334, "global_step": 363228, "epoch": 4376} {"train_loss": -26.347951889038086, "global_step": 363229, "epoch": 4376} {"train_loss": -26.27555274963379, "global_step": 363230, "epoch": 4376} {"train_loss": -25.913837432861328, "global_step": 363231, "epoch": 4376} {"train_loss": -26.050512313842773, "global_step": 363232, "epoch": 4376} {"train_loss": -25.75323486328125, "global_step": 363233, "epoch": 4376} {"train_loss": -26.114362716674805, "global_step": 363234, "epoch": 4376} {"train_loss": -26.405683517456055, "global_step": 363235, "epoch": 4376} {"train_loss": -26.09331703186035, "global_step": 363236, "epoch": 4376} {"train_loss": -26.1480655670166, "global_step": 363237, "epoch": 4376} {"train_loss": -26.064289093017578, "global_step": 363238, "epoch": 4376} {"train_loss": -26.719213485717773, "global_step": 363239, "epoch": 4376} {"train_loss": -26.062345504760742, "global_step": 363240, "epoch": 4376} {"train_loss": -26.136194229125977, "global_step": 363241, "epoch": 4376} {"train_loss": -26.581897735595703, "global_step": 363242, "epoch": 4376} {"train_loss": -26.336294174194336, "global_step": 363243, "epoch": 4376} {"train_loss": -26.14348793029785, "global_step": 363244, "epoch": 4376} {"train_loss": -26.313690185546875, "global_step": 363245, "epoch": 4376} {"train_loss": -26.106388092041016, "global_step": 363246, "epoch": 4376} {"train_loss": -26.021848678588867, "global_step": 363247, "epoch": 4376} {"train_loss": -25.94122314453125, "global_step": 363248, "epoch": 4376} {"train_loss": -25.56015396118164, "global_step": 363249, "epoch": 4376} {"train_loss": -26.408567428588867, "global_step": 363250, "epoch": 4376} {"train_loss": -26.269851684570312, "global_step": 363251, "epoch": 4376} {"train_loss": -26.21650505065918, "global_step": 363252, "epoch": 4376} {"train_loss": -25.937177658081055, "global_step": 363253, "epoch": 4376} {"train_loss": -26.36295509338379, "global_step": 363254, "epoch": 4376} {"train_loss": -26.116474151611328, "global_step": 363255, "epoch": 4376} {"train_loss": -26.591293334960938, "global_step": 363256, "epoch": 4376} {"train_loss": -26.2642879486084, "global_step": 363257, "epoch": 4376} {"train_loss": -25.97197914123535, "global_step": 363258, "epoch": 4376} {"train_loss": -26.751068115234375, "global_step": 363259, "epoch": 4376} {"train_loss": -26.456867218017578, "global_step": 363260, "epoch": 4376} {"train_loss": -26.1995906829834, "global_step": 363261, "epoch": 4376} {"train_loss": -26.2779483795166, "global_step": 363262, "epoch": 4376} {"train_loss": -26.54656982421875, "global_step": 363263, "epoch": 4376} {"train_loss": -26.119550704956055, "global_step": 363264, "epoch": 4376} {"train_loss": -26.231597900390625, "global_step": 363265, "epoch": 4376} {"train_loss": -26.616012573242188, "global_step": 363266, "epoch": 4376} {"train_loss": -26.342676162719727, "global_step": 363267, "epoch": 4376} {"train_loss": -26.318960189819336, "global_step": 363268, "epoch": 4376} {"train_loss": -26.321216583251953, "global_step": 363269, "epoch": 4376} {"train_loss": -26.381128311157227, "global_step": 363270, "epoch": 4376} {"train_loss": -26.69361686706543, "global_step": 363271, "epoch": 4376} {"train_loss": -26.456201553344727, "global_step": 363272, "epoch": 4376} {"train_loss": -26.330251693725586, "global_step": 363273, "epoch": 4376} {"train_loss": -26.413654327392578, "global_step": 363274, "epoch": 4376} {"train_loss": -26.27504539489746, "global_step": 363275, "epoch": 4376} {"train_loss": -26.36031150817871, "global_step": 363276, "epoch": 4376} {"train_loss": -26.050312042236328, "global_step": 363277, "epoch": 4376} {"train_loss": -26.225006103515625, "global_step": 363278, "epoch": 4376} {"train_loss": -26.31037712097168, "global_step": 363279, "epoch": 4376} {"train_loss": -26.2967586517334, "global_step": 363280, "epoch": 4376} {"train_loss": -25.99896240234375, "global_step": 363281, "epoch": 4376} {"train_loss": -26.201129913330078, "global_step": 363282, "epoch": 4376} {"train_loss": -26.138147354125977, "global_step": 363283, "epoch": 4376} {"train_loss": -26.50567626953125, "global_step": 363284, "epoch": 4376} {"train_loss": -26.480255126953125, "global_step": 363285, "epoch": 4376} {"train_loss": -25.93300437927246, "global_step": 363286, "epoch": 4376} {"train_loss": -26.3770809173584, "global_step": 363287, "epoch": 4376} {"train_loss": -26.194665908813477, "global_step": 363288, "epoch": 4376} {"train_loss": -26.337339401245117, "global_step": 363289, "epoch": 4376} {"train_loss": -26.10641132492617, "global_step": 363290, "epoch": 4376, "val_loss": 6601093.0} {"train_loss": -26.16056251525879, "global_step": 363291, "epoch": 4377} {"train_loss": -26.034866333007812, "global_step": 363292, "epoch": 4377} {"train_loss": -26.332855224609375, "global_step": 363293, "epoch": 4377} {"train_loss": -26.186559677124023, "global_step": 363294, "epoch": 4377} {"train_loss": -26.19935417175293, "global_step": 363295, "epoch": 4377} {"train_loss": -26.81854248046875, "global_step": 363296, "epoch": 4377} {"train_loss": -26.25553321838379, "global_step": 363297, "epoch": 4377} {"train_loss": -26.10602378845215, "global_step": 363298, "epoch": 4377} {"train_loss": -26.048049926757812, "global_step": 363299, "epoch": 4377} {"train_loss": -26.201995849609375, "global_step": 363300, "epoch": 4377} {"train_loss": -26.09773063659668, "global_step": 363301, "epoch": 4377} {"train_loss": -25.973587036132812, "global_step": 363302, "epoch": 4377} {"train_loss": -26.231836318969727, "global_step": 363303, "epoch": 4377} {"train_loss": -26.33707046508789, "global_step": 363304, "epoch": 4377} {"train_loss": -26.561750411987305, "global_step": 363305, "epoch": 4377} {"train_loss": -26.511693954467773, "global_step": 363306, "epoch": 4377} {"train_loss": -26.297901153564453, "global_step": 363307, "epoch": 4377} {"train_loss": -26.22216796875, "global_step": 363308, "epoch": 4377} {"train_loss": -26.382705688476562, "global_step": 363309, "epoch": 4377} {"train_loss": -26.6241397857666, "global_step": 363310, "epoch": 4377} {"train_loss": -26.38763427734375, "global_step": 363311, "epoch": 4377} {"train_loss": -26.381458282470703, "global_step": 363312, "epoch": 4377} {"train_loss": -26.259693145751953, "global_step": 363313, "epoch": 4377} {"train_loss": -26.431386947631836, "global_step": 363314, "epoch": 4377} {"train_loss": -26.19126319885254, "global_step": 363315, "epoch": 4377} {"train_loss": -26.281736373901367, "global_step": 363316, "epoch": 4377} {"train_loss": -26.7028865814209, "global_step": 363317, "epoch": 4377} {"train_loss": -26.584110260009766, "global_step": 363318, "epoch": 4377} {"train_loss": -26.486230850219727, "global_step": 363319, "epoch": 4377} {"train_loss": -26.48048210144043, "global_step": 363320, "epoch": 4377} {"train_loss": -26.1081485748291, "global_step": 363321, "epoch": 4377} {"train_loss": -26.40448570251465, "global_step": 363322, "epoch": 4377} {"train_loss": -26.155902862548828, "global_step": 363323, "epoch": 4377} {"train_loss": -26.33868408203125, "global_step": 363324, "epoch": 4377} {"train_loss": -26.3264102935791, "global_step": 363325, "epoch": 4377} {"train_loss": -26.4672794342041, "global_step": 363326, "epoch": 4377} {"train_loss": -26.158212661743164, "global_step": 363327, "epoch": 4377} {"train_loss": -26.672225952148438, "global_step": 363328, "epoch": 4377} {"train_loss": -26.36594009399414, "global_step": 363329, "epoch": 4377} {"train_loss": -25.911956787109375, "global_step": 363330, "epoch": 4377} {"train_loss": -25.71534538269043, "global_step": 363331, "epoch": 4377} {"train_loss": -25.858022689819336, "global_step": 363332, "epoch": 4377} {"train_loss": -25.8076229095459, "global_step": 363333, "epoch": 4377} {"train_loss": -25.63630485534668, "global_step": 363334, "epoch": 4377} {"train_loss": -26.208419799804688, "global_step": 363335, "epoch": 4377} {"train_loss": -26.216705322265625, "global_step": 363336, "epoch": 4377} {"train_loss": -26.049177169799805, "global_step": 363337, "epoch": 4377} {"train_loss": -26.315820693969727, "global_step": 363338, "epoch": 4377} {"train_loss": -26.485868453979492, "global_step": 363339, "epoch": 4377} {"train_loss": -26.374008178710938, "global_step": 363340, "epoch": 4377} {"train_loss": -25.945388793945312, "global_step": 363341, "epoch": 4377} {"train_loss": -26.60176658630371, "global_step": 363342, "epoch": 4377} {"train_loss": -26.13922691345215, "global_step": 363343, "epoch": 4377} {"train_loss": -25.841522216796875, "global_step": 363344, "epoch": 4377} {"train_loss": -26.146352767944336, "global_step": 363345, "epoch": 4377} {"train_loss": -26.1717472076416, "global_step": 363346, "epoch": 4377} {"train_loss": -26.702478408813477, "global_step": 363347, "epoch": 4377} {"train_loss": -25.58403205871582, "global_step": 363348, "epoch": 4377} {"train_loss": -26.188962936401367, "global_step": 363349, "epoch": 4377} {"train_loss": -26.103519439697266, "global_step": 363350, "epoch": 4377} {"train_loss": -26.23565101623535, "global_step": 363351, "epoch": 4377} {"train_loss": -26.183095932006836, "global_step": 363352, "epoch": 4377} {"train_loss": -26.1927433013916, "global_step": 363353, "epoch": 4377} {"train_loss": -26.753950119018555, "global_step": 363354, "epoch": 4377} {"train_loss": -26.540668487548828, "global_step": 363355, "epoch": 4377} {"train_loss": -26.464111328125, "global_step": 363356, "epoch": 4377} {"train_loss": -26.4731388092041, "global_step": 363357, "epoch": 4377} {"train_loss": -26.42213249206543, "global_step": 363358, "epoch": 4377} {"train_loss": -26.206518173217773, "global_step": 363359, "epoch": 4377} {"train_loss": -26.4752140045166, "global_step": 363360, "epoch": 4377} {"train_loss": -26.5661563873291, "global_step": 363361, "epoch": 4377} {"train_loss": -26.316268920898438, "global_step": 363362, "epoch": 4377} {"train_loss": -26.420682907104492, "global_step": 363363, "epoch": 4377} {"train_loss": -26.16766357421875, "global_step": 363364, "epoch": 4377} {"train_loss": -26.482202529907227, "global_step": 363365, "epoch": 4377} {"train_loss": -26.38117027282715, "global_step": 363366, "epoch": 4377} {"train_loss": -26.244699478149414, "global_step": 363367, "epoch": 4377} {"train_loss": -26.31451416015625, "global_step": 363368, "epoch": 4377} {"train_loss": -26.44268798828125, "global_step": 363369, "epoch": 4377} {"train_loss": -26.3723201751709, "global_step": 363370, "epoch": 4377} {"train_loss": -26.876667022705078, "global_step": 363371, "epoch": 4377} {"train_loss": -26.216711044311523, "global_step": 363372, "epoch": 4377} {"train_loss": -26.290361978921545, "global_step": 363373, "epoch": 4377, "val_loss": 6576739.5} {"train_loss": -25.82964515686035, "global_step": 363374, "epoch": 4378} {"train_loss": -24.505033493041992, "global_step": 363375, "epoch": 4378} {"train_loss": -24.50406265258789, "global_step": 363376, "epoch": 4378} {"train_loss": -25.01509666442871, "global_step": 363377, "epoch": 4378} {"train_loss": -26.412763595581055, "global_step": 363378, "epoch": 4378} {"train_loss": -25.8355712890625, "global_step": 363379, "epoch": 4378} {"train_loss": -25.79804801940918, "global_step": 363380, "epoch": 4378} {"train_loss": -25.35502052307129, "global_step": 363381, "epoch": 4378} {"train_loss": -25.977853775024414, "global_step": 363382, "epoch": 4378} {"train_loss": -25.888193130493164, "global_step": 363383, "epoch": 4378} {"train_loss": -25.943506240844727, "global_step": 363384, "epoch": 4378} {"train_loss": -25.773096084594727, "global_step": 363385, "epoch": 4378} {"train_loss": -25.9117374420166, "global_step": 363386, "epoch": 4378} {"train_loss": -26.290740966796875, "global_step": 363387, "epoch": 4378} {"train_loss": -25.856225967407227, "global_step": 363388, "epoch": 4378} {"train_loss": -25.963043212890625, "global_step": 363389, "epoch": 4378} {"train_loss": -25.934228897094727, "global_step": 363390, "epoch": 4378} {"train_loss": -26.150598526000977, "global_step": 363391, "epoch": 4378} {"train_loss": -25.929019927978516, "global_step": 363392, "epoch": 4378} {"train_loss": -25.87991714477539, "global_step": 363393, "epoch": 4378} {"train_loss": -25.9527587890625, "global_step": 363394, "epoch": 4378} {"train_loss": -26.345056533813477, "global_step": 363395, "epoch": 4378} {"train_loss": -26.29146385192871, "global_step": 363396, "epoch": 4378} {"train_loss": -26.30794334411621, "global_step": 363397, "epoch": 4378} {"train_loss": -26.237445831298828, "global_step": 363398, "epoch": 4378} {"train_loss": -26.334766387939453, "global_step": 363399, "epoch": 4378} {"train_loss": -26.388721466064453, "global_step": 363400, "epoch": 4378} {"train_loss": -26.509252548217773, "global_step": 363401, "epoch": 4378} {"train_loss": -26.410797119140625, "global_step": 363402, "epoch": 4378} {"train_loss": -26.11939811706543, "global_step": 363403, "epoch": 4378} {"train_loss": -26.116743087768555, "global_step": 363404, "epoch": 4378} {"train_loss": -26.742279052734375, "global_step": 363405, "epoch": 4378} {"train_loss": -26.427946090698242, "global_step": 363406, "epoch": 4378} {"train_loss": -26.485151290893555, "global_step": 363407, "epoch": 4378} {"train_loss": -26.241743087768555, "global_step": 363408, "epoch": 4378} {"train_loss": -26.210851669311523, "global_step": 363409, "epoch": 4378} {"train_loss": -26.59541130065918, "global_step": 363410, "epoch": 4378} {"train_loss": -26.240997314453125, "global_step": 363411, "epoch": 4378} {"train_loss": -26.42681884765625, "global_step": 363412, "epoch": 4378} {"train_loss": -26.5896053314209, "global_step": 363413, "epoch": 4378} {"train_loss": -26.280750274658203, "global_step": 363414, "epoch": 4378} {"train_loss": -26.44394874572754, "global_step": 363415, "epoch": 4378} {"train_loss": -26.511947631835938, "global_step": 363416, "epoch": 4378} {"train_loss": -26.42776870727539, "global_step": 363417, "epoch": 4378} {"train_loss": -26.412961959838867, "global_step": 363418, "epoch": 4378} {"train_loss": -26.618635177612305, "global_step": 363419, "epoch": 4378} {"train_loss": -26.342086791992188, "global_step": 363420, "epoch": 4378} {"train_loss": -26.586225509643555, "global_step": 363421, "epoch": 4378} {"train_loss": -26.75986671447754, "global_step": 363422, "epoch": 4378} {"train_loss": -26.589380264282227, "global_step": 363423, "epoch": 4378} {"train_loss": -26.185779571533203, "global_step": 363424, "epoch": 4378} {"train_loss": -26.588714599609375, "global_step": 363425, "epoch": 4378} {"train_loss": -26.172550201416016, "global_step": 363426, "epoch": 4378} {"train_loss": -26.205963134765625, "global_step": 363427, "epoch": 4378} {"train_loss": -26.031085968017578, "global_step": 363428, "epoch": 4378} {"train_loss": -26.23927116394043, "global_step": 363429, "epoch": 4378} {"train_loss": -26.229711532592773, "global_step": 363430, "epoch": 4378} {"train_loss": -26.545560836791992, "global_step": 363431, "epoch": 4378} {"train_loss": -26.44025993347168, "global_step": 363432, "epoch": 4378} {"train_loss": -26.219778060913086, "global_step": 363433, "epoch": 4378} {"train_loss": -26.18275260925293, "global_step": 363434, "epoch": 4378} {"train_loss": -26.355655670166016, "global_step": 363435, "epoch": 4378} {"train_loss": -26.268823623657227, "global_step": 363436, "epoch": 4378} {"train_loss": -26.77170181274414, "global_step": 363437, "epoch": 4378} {"train_loss": -26.439767837524414, "global_step": 363438, "epoch": 4378} {"train_loss": -26.259016036987305, "global_step": 363439, "epoch": 4378} {"train_loss": -26.50284194946289, "global_step": 363440, "epoch": 4378} {"train_loss": -26.57233238220215, "global_step": 363441, "epoch": 4378} {"train_loss": -26.42527198791504, "global_step": 363442, "epoch": 4378} {"train_loss": -26.209918975830078, "global_step": 363443, "epoch": 4378} {"train_loss": -26.475122451782227, "global_step": 363444, "epoch": 4378} {"train_loss": -26.221302032470703, "global_step": 363445, "epoch": 4378} {"train_loss": -26.11231803894043, "global_step": 363446, "epoch": 4378} {"train_loss": -25.75123405456543, "global_step": 363447, "epoch": 4378} {"train_loss": -26.30043601989746, "global_step": 363448, "epoch": 4378} {"train_loss": -26.3737735748291, "global_step": 363449, "epoch": 4378} {"train_loss": -26.340375900268555, "global_step": 363450, "epoch": 4378} {"train_loss": -26.621862411499023, "global_step": 363451, "epoch": 4378} {"train_loss": -26.456403732299805, "global_step": 363452, "epoch": 4378} {"train_loss": -26.744842529296875, "global_step": 363453, "epoch": 4378} {"train_loss": -26.21339988708496, "global_step": 363454, "epoch": 4378} {"train_loss": -26.198169708251953, "global_step": 363455, "epoch": 4378} {"train_loss": -26.221611988113587, "global_step": 363456, "epoch": 4378, "val_loss": 6642453.5} {"train_loss": -25.95163917541504, "global_step": 363457, "epoch": 4379} {"train_loss": -25.560556411743164, "global_step": 363458, "epoch": 4379} {"train_loss": -25.7594051361084, "global_step": 363459, "epoch": 4379} {"train_loss": -25.88233757019043, "global_step": 363460, "epoch": 4379} {"train_loss": -26.011249542236328, "global_step": 363461, "epoch": 4379} {"train_loss": -25.95932960510254, "global_step": 363462, "epoch": 4379} {"train_loss": -25.799362182617188, "global_step": 363463, "epoch": 4379} {"train_loss": -25.7343692779541, "global_step": 363464, "epoch": 4379} {"train_loss": -26.472089767456055, "global_step": 363465, "epoch": 4379} {"train_loss": -26.057117462158203, "global_step": 363466, "epoch": 4379} {"train_loss": -26.280200958251953, "global_step": 363467, "epoch": 4379} {"train_loss": -26.445646286010742, "global_step": 363468, "epoch": 4379} {"train_loss": -26.147430419921875, "global_step": 363469, "epoch": 4379} {"train_loss": -26.169164657592773, "global_step": 363470, "epoch": 4379} {"train_loss": -26.098678588867188, "global_step": 363471, "epoch": 4379} {"train_loss": -26.412357330322266, "global_step": 363472, "epoch": 4379} {"train_loss": -26.311843872070312, "global_step": 363473, "epoch": 4379} {"train_loss": -25.862842559814453, "global_step": 363474, "epoch": 4379} {"train_loss": -26.239744186401367, "global_step": 363475, "epoch": 4379} {"train_loss": -26.704126358032227, "global_step": 363476, "epoch": 4379} {"train_loss": -26.06089210510254, "global_step": 363477, "epoch": 4379} {"train_loss": -26.37041664123535, "global_step": 363478, "epoch": 4379} {"train_loss": -26.018722534179688, "global_step": 363479, "epoch": 4379} {"train_loss": -26.3342342376709, "global_step": 363480, "epoch": 4379} {"train_loss": -26.026010513305664, "global_step": 363481, "epoch": 4379} {"train_loss": -26.21685791015625, "global_step": 363482, "epoch": 4379} {"train_loss": -26.217710494995117, "global_step": 363483, "epoch": 4379} {"train_loss": -25.91840934753418, "global_step": 363484, "epoch": 4379} {"train_loss": -26.244735717773438, "global_step": 363485, "epoch": 4379} {"train_loss": -26.088428497314453, "global_step": 363486, "epoch": 4379} {"train_loss": -26.268163681030273, "global_step": 363487, "epoch": 4379} {"train_loss": -26.369977951049805, "global_step": 363488, "epoch": 4379} {"train_loss": -26.22283935546875, "global_step": 363489, "epoch": 4379} {"train_loss": -26.3984432220459, "global_step": 363490, "epoch": 4379} {"train_loss": -26.60444450378418, "global_step": 363491, "epoch": 4379} {"train_loss": -25.88510513305664, "global_step": 363492, "epoch": 4379} {"train_loss": -26.28436851501465, "global_step": 363493, "epoch": 4379} {"train_loss": -26.63381004333496, "global_step": 363494, "epoch": 4379} {"train_loss": -26.441650390625, "global_step": 363495, "epoch": 4379} {"train_loss": -26.468698501586914, "global_step": 363496, "epoch": 4379} {"train_loss": -26.6817569732666, "global_step": 363497, "epoch": 4379} {"train_loss": -26.29558753967285, "global_step": 363498, "epoch": 4379} {"train_loss": -26.207611083984375, "global_step": 363499, "epoch": 4379} {"train_loss": -26.076322555541992, "global_step": 363500, "epoch": 4379} {"train_loss": -26.434072494506836, "global_step": 363501, "epoch": 4379} {"train_loss": -26.434091567993164, "global_step": 363502, "epoch": 4379} {"train_loss": -26.28291130065918, "global_step": 363503, "epoch": 4379} {"train_loss": -26.247314453125, "global_step": 363504, "epoch": 4379} {"train_loss": -26.72135353088379, "global_step": 363505, "epoch": 4379} {"train_loss": -26.374963760375977, "global_step": 363506, "epoch": 4379} {"train_loss": -26.333967208862305, "global_step": 363507, "epoch": 4379} {"train_loss": -26.145238876342773, "global_step": 363508, "epoch": 4379} {"train_loss": -26.418119430541992, "global_step": 363509, "epoch": 4379} {"train_loss": -26.501617431640625, "global_step": 363510, "epoch": 4379} {"train_loss": -26.244726181030273, "global_step": 363511, "epoch": 4379} {"train_loss": -26.466657638549805, "global_step": 363512, "epoch": 4379} {"train_loss": -26.52162742614746, "global_step": 363513, "epoch": 4379} {"train_loss": -26.605823516845703, "global_step": 363514, "epoch": 4379} {"train_loss": -26.518091201782227, "global_step": 363515, "epoch": 4379} {"train_loss": -26.623188018798828, "global_step": 363516, "epoch": 4379} {"train_loss": -26.28879165649414, "global_step": 363517, "epoch": 4379} {"train_loss": -26.19219398498535, "global_step": 363518, "epoch": 4379} {"train_loss": -26.25616455078125, "global_step": 363519, "epoch": 4379} {"train_loss": -26.361286163330078, "global_step": 363520, "epoch": 4379} {"train_loss": -26.46265983581543, "global_step": 363521, "epoch": 4379} {"train_loss": -26.842248916625977, "global_step": 363522, "epoch": 4379} {"train_loss": -26.375350952148438, "global_step": 363523, "epoch": 4379} {"train_loss": -25.949262619018555, "global_step": 363524, "epoch": 4379} {"train_loss": -25.997791290283203, "global_step": 363525, "epoch": 4379} {"train_loss": -26.21722412109375, "global_step": 363526, "epoch": 4379} {"train_loss": -26.679906845092773, "global_step": 363527, "epoch": 4379} {"train_loss": -26.032623291015625, "global_step": 363528, "epoch": 4379} {"train_loss": -25.8306941986084, "global_step": 363529, "epoch": 4379} {"train_loss": -26.848173141479492, "global_step": 363530, "epoch": 4379} {"train_loss": -26.524295806884766, "global_step": 363531, "epoch": 4379} {"train_loss": -25.9078426361084, "global_step": 363532, "epoch": 4379} {"train_loss": -26.19379997253418, "global_step": 363533, "epoch": 4379} {"train_loss": -26.09857749938965, "global_step": 363534, "epoch": 4379} {"train_loss": -26.120325088500977, "global_step": 363535, "epoch": 4379} {"train_loss": -26.416168212890625, "global_step": 363536, "epoch": 4379} {"train_loss": -26.013193130493164, "global_step": 363537, "epoch": 4379} {"train_loss": -25.91657066345215, "global_step": 363538, "epoch": 4379} {"train_loss": -26.25726387299687, "global_step": 363539, "epoch": 4379, "val_loss": 6625246.0} {"train_loss": -25.052017211914062, "global_step": 363540, "epoch": 4380} {"train_loss": -24.746337890625, "global_step": 363541, "epoch": 4380} {"train_loss": -23.770082473754883, "global_step": 363542, "epoch": 4380} {"train_loss": -25.117143630981445, "global_step": 363543, "epoch": 4380} {"train_loss": -25.06000328063965, "global_step": 363544, "epoch": 4380} {"train_loss": -25.903127670288086, "global_step": 363545, "epoch": 4380} {"train_loss": -25.307695388793945, "global_step": 363546, "epoch": 4380} {"train_loss": -25.720081329345703, "global_step": 363547, "epoch": 4380} {"train_loss": -25.4237060546875, "global_step": 363548, "epoch": 4380} {"train_loss": -25.803369522094727, "global_step": 363549, "epoch": 4380} {"train_loss": -25.662260055541992, "global_step": 363550, "epoch": 4380} {"train_loss": -25.962060928344727, "global_step": 363551, "epoch": 4380} {"train_loss": -25.626367568969727, "global_step": 363552, "epoch": 4380} {"train_loss": -26.28553581237793, "global_step": 363553, "epoch": 4380} {"train_loss": -25.927947998046875, "global_step": 363554, "epoch": 4380} {"train_loss": -26.163965225219727, "global_step": 363555, "epoch": 4380} {"train_loss": -25.84040641784668, "global_step": 363556, "epoch": 4380} {"train_loss": -25.606847763061523, "global_step": 363557, "epoch": 4380} {"train_loss": -26.090497970581055, "global_step": 363558, "epoch": 4380} {"train_loss": -25.877649307250977, "global_step": 363559, "epoch": 4380} {"train_loss": -25.9222412109375, "global_step": 363560, "epoch": 4380} {"train_loss": -25.798986434936523, "global_step": 363561, "epoch": 4380} {"train_loss": -25.789173126220703, "global_step": 363562, "epoch": 4380} {"train_loss": -25.865554809570312, "global_step": 363563, "epoch": 4380} {"train_loss": -26.290607452392578, "global_step": 363564, "epoch": 4380} {"train_loss": -26.0112361907959, "global_step": 363565, "epoch": 4380} {"train_loss": -26.6040096282959, "global_step": 363566, "epoch": 4380} {"train_loss": -26.138935089111328, "global_step": 363567, "epoch": 4380} {"train_loss": -26.022504806518555, "global_step": 363568, "epoch": 4380} {"train_loss": -26.186182022094727, "global_step": 363569, "epoch": 4380} {"train_loss": -26.296884536743164, "global_step": 363570, "epoch": 4380} {"train_loss": -26.188690185546875, "global_step": 363571, "epoch": 4380} {"train_loss": -26.206256866455078, "global_step": 363572, "epoch": 4380} {"train_loss": -26.114837646484375, "global_step": 363573, "epoch": 4380} {"train_loss": -26.14988136291504, "global_step": 363574, "epoch": 4380} {"train_loss": -26.148868560791016, "global_step": 363575, "epoch": 4380} {"train_loss": -26.768766403198242, "global_step": 363576, "epoch": 4380} {"train_loss": -26.581918716430664, "global_step": 363577, "epoch": 4380} {"train_loss": -26.231689453125, "global_step": 363578, "epoch": 4380} {"train_loss": -26.372854232788086, "global_step": 363579, "epoch": 4380} {"train_loss": -26.547901153564453, "global_step": 363580, "epoch": 4380} {"train_loss": -26.108123779296875, "global_step": 363581, "epoch": 4380} {"train_loss": -25.90386390686035, "global_step": 363582, "epoch": 4380} {"train_loss": -26.250762939453125, "global_step": 363583, "epoch": 4380} {"train_loss": -26.43656349182129, "global_step": 363584, "epoch": 4380} {"train_loss": -26.47491455078125, "global_step": 363585, "epoch": 4380} {"train_loss": -26.366851806640625, "global_step": 363586, "epoch": 4380} {"train_loss": -26.4221134185791, "global_step": 363587, "epoch": 4380} {"train_loss": -26.074106216430664, "global_step": 363588, "epoch": 4380} {"train_loss": -26.3090763092041, "global_step": 363589, "epoch": 4380} {"train_loss": -26.01604652404785, "global_step": 363590, "epoch": 4380} {"train_loss": -26.066946029663086, "global_step": 363591, "epoch": 4380} {"train_loss": -26.315185546875, "global_step": 363592, "epoch": 4380} {"train_loss": -26.496496200561523, "global_step": 363593, "epoch": 4380} {"train_loss": -26.605249404907227, "global_step": 363594, "epoch": 4380} {"train_loss": -26.575485229492188, "global_step": 363595, "epoch": 4380} {"train_loss": -26.40150260925293, "global_step": 363596, "epoch": 4380} {"train_loss": -26.647390365600586, "global_step": 363597, "epoch": 4380} {"train_loss": -26.33402442932129, "global_step": 363598, "epoch": 4380} {"train_loss": -26.370929718017578, "global_step": 363599, "epoch": 4380} {"train_loss": -26.582569122314453, "global_step": 363600, "epoch": 4380} {"train_loss": -26.42726707458496, "global_step": 363601, "epoch": 4380} {"train_loss": -26.206024169921875, "global_step": 363602, "epoch": 4380} {"train_loss": -26.60711097717285, "global_step": 363603, "epoch": 4380} {"train_loss": -26.479639053344727, "global_step": 363604, "epoch": 4380} {"train_loss": -26.6229248046875, "global_step": 363605, "epoch": 4380} {"train_loss": -25.867475509643555, "global_step": 363606, "epoch": 4380} {"train_loss": -26.33418083190918, "global_step": 363607, "epoch": 4380} {"train_loss": -26.374853134155273, "global_step": 363608, "epoch": 4380} {"train_loss": -26.29030418395996, "global_step": 363609, "epoch": 4380} {"train_loss": -26.355396270751953, "global_step": 363610, "epoch": 4380} {"train_loss": -26.201452255249023, "global_step": 363611, "epoch": 4380} {"train_loss": -26.449695587158203, "global_step": 363612, "epoch": 4380} {"train_loss": -26.317197799682617, "global_step": 363613, "epoch": 4380} {"train_loss": -26.453454971313477, "global_step": 363614, "epoch": 4380} {"train_loss": -26.023298263549805, "global_step": 363615, "epoch": 4380} {"train_loss": -26.408496856689453, "global_step": 363616, "epoch": 4380} {"train_loss": -26.34821891784668, "global_step": 363617, "epoch": 4380} {"train_loss": -26.181934356689453, "global_step": 363618, "epoch": 4380} {"train_loss": -26.296295166015625, "global_step": 363619, "epoch": 4380} {"train_loss": -26.26888084411621, "global_step": 363620, "epoch": 4380} {"train_loss": -26.212554931640625, "global_step": 363621, "epoch": 4380} {"train_loss": -26.111892470394274, "global_step": 363622, "epoch": 4380, "val_loss": 6595396.0} {"train_loss": -24.92914390563965, "global_step": 363623, "epoch": 4381} {"train_loss": -25.97638511657715, "global_step": 363624, "epoch": 4381} {"train_loss": -25.49409294128418, "global_step": 363625, "epoch": 4381} {"train_loss": -25.750680923461914, "global_step": 363626, "epoch": 4381} {"train_loss": -26.024648666381836, "global_step": 363627, "epoch": 4381} {"train_loss": -26.3842830657959, "global_step": 363628, "epoch": 4381} {"train_loss": -26.263818740844727, "global_step": 363629, "epoch": 4381} {"train_loss": -25.823867797851562, "global_step": 363630, "epoch": 4381} {"train_loss": -25.554656982421875, "global_step": 363631, "epoch": 4381} {"train_loss": -26.12274742126465, "global_step": 363632, "epoch": 4381} {"train_loss": -26.030750274658203, "global_step": 363633, "epoch": 4381} {"train_loss": -26.15460777282715, "global_step": 363634, "epoch": 4381} {"train_loss": -26.02003288269043, "global_step": 363635, "epoch": 4381} {"train_loss": -26.31833839416504, "global_step": 363636, "epoch": 4381} {"train_loss": -26.52815818786621, "global_step": 363637, "epoch": 4381} {"train_loss": -26.077112197875977, "global_step": 363638, "epoch": 4381} {"train_loss": -25.914575576782227, "global_step": 363639, "epoch": 4381} {"train_loss": -25.880704879760742, "global_step": 363640, "epoch": 4381} {"train_loss": -26.123340606689453, "global_step": 363641, "epoch": 4381} {"train_loss": -26.28633689880371, "global_step": 363642, "epoch": 4381} {"train_loss": -26.252042770385742, "global_step": 363643, "epoch": 4381} {"train_loss": -25.882421493530273, "global_step": 363644, "epoch": 4381} {"train_loss": -25.99611473083496, "global_step": 363645, "epoch": 4381} {"train_loss": -26.281147003173828, "global_step": 363646, "epoch": 4381} {"train_loss": -26.597579956054688, "global_step": 363647, "epoch": 4381} {"train_loss": -26.291440963745117, "global_step": 363648, "epoch": 4381} {"train_loss": -26.25970458984375, "global_step": 363649, "epoch": 4381} {"train_loss": -26.307870864868164, "global_step": 363650, "epoch": 4381} {"train_loss": -25.95181655883789, "global_step": 363651, "epoch": 4381} {"train_loss": -26.614561080932617, "global_step": 363652, "epoch": 4381} {"train_loss": -26.251907348632812, "global_step": 363653, "epoch": 4381} {"train_loss": -26.29593276977539, "global_step": 363654, "epoch": 4381} {"train_loss": -25.914936065673828, "global_step": 363655, "epoch": 4381} {"train_loss": -25.773468017578125, "global_step": 363656, "epoch": 4381} {"train_loss": -26.222171783447266, "global_step": 363657, "epoch": 4381} {"train_loss": -25.480581283569336, "global_step": 363658, "epoch": 4381} {"train_loss": -25.82734489440918, "global_step": 363659, "epoch": 4381} {"train_loss": -26.44122314453125, "global_step": 363660, "epoch": 4381} {"train_loss": -25.706567764282227, "global_step": 363661, "epoch": 4381} {"train_loss": -26.527969360351562, "global_step": 363662, "epoch": 4381} {"train_loss": -26.301807403564453, "global_step": 363663, "epoch": 4381} {"train_loss": -25.92917251586914, "global_step": 363664, "epoch": 4381} {"train_loss": -26.2084903717041, "global_step": 363665, "epoch": 4381} {"train_loss": -26.310361862182617, "global_step": 363666, "epoch": 4381} {"train_loss": -26.028295516967773, "global_step": 363667, "epoch": 4381} {"train_loss": -26.201120376586914, "global_step": 363668, "epoch": 4381} {"train_loss": -26.33310890197754, "global_step": 363669, "epoch": 4381} {"train_loss": -26.419754028320312, "global_step": 363670, "epoch": 4381} {"train_loss": -26.30340576171875, "global_step": 363671, "epoch": 4381} {"train_loss": -25.95464515686035, "global_step": 363672, "epoch": 4381} {"train_loss": -26.181610107421875, "global_step": 363673, "epoch": 4381} {"train_loss": -26.066869735717773, "global_step": 363674, "epoch": 4381} {"train_loss": -26.4289493560791, "global_step": 363675, "epoch": 4381} {"train_loss": -26.451663970947266, "global_step": 363676, "epoch": 4381} {"train_loss": -25.643747329711914, "global_step": 363677, "epoch": 4381} {"train_loss": -25.832548141479492, "global_step": 363678, "epoch": 4381} {"train_loss": -26.214231491088867, "global_step": 363679, "epoch": 4381} {"train_loss": -25.795560836791992, "global_step": 363680, "epoch": 4381} {"train_loss": -26.513029098510742, "global_step": 363681, "epoch": 4381} {"train_loss": -26.286865234375, "global_step": 363682, "epoch": 4381} {"train_loss": -26.14558219909668, "global_step": 363683, "epoch": 4381} {"train_loss": -26.183130264282227, "global_step": 363684, "epoch": 4381} {"train_loss": -26.887311935424805, "global_step": 363685, "epoch": 4381} {"train_loss": -26.19288444519043, "global_step": 363686, "epoch": 4381} {"train_loss": -26.493188858032227, "global_step": 363687, "epoch": 4381} {"train_loss": -26.328092575073242, "global_step": 363688, "epoch": 4381} {"train_loss": -26.521711349487305, "global_step": 363689, "epoch": 4381} {"train_loss": -26.6702823638916, "global_step": 363690, "epoch": 4381} {"train_loss": -26.461999893188477, "global_step": 363691, "epoch": 4381} {"train_loss": -26.05616569519043, "global_step": 363692, "epoch": 4381} {"train_loss": -26.369348526000977, "global_step": 363693, "epoch": 4381} {"train_loss": -26.583948135375977, "global_step": 363694, "epoch": 4381} {"train_loss": -26.5363712310791, "global_step": 363695, "epoch": 4381} {"train_loss": -26.341089248657227, "global_step": 363696, "epoch": 4381} {"train_loss": -26.0626220703125, "global_step": 363697, "epoch": 4381} {"train_loss": -26.207489013671875, "global_step": 363698, "epoch": 4381} {"train_loss": -26.40945816040039, "global_step": 363699, "epoch": 4381} {"train_loss": -25.921527862548828, "global_step": 363700, "epoch": 4381} {"train_loss": -26.32452392578125, "global_step": 363701, "epoch": 4381} {"train_loss": -26.253036499023438, "global_step": 363702, "epoch": 4381} {"train_loss": -26.2752628326416, "global_step": 363703, "epoch": 4381} {"train_loss": -26.2762508392334, "global_step": 363704, "epoch": 4381} {"train_loss": -26.170605510114186, "global_step": 363705, "epoch": 4381, "val_loss": 6621375.0} {"train_loss": -26.140050888061523, "global_step": 363706, "epoch": 4382} {"train_loss": -25.379117965698242, "global_step": 363707, "epoch": 4382} {"train_loss": -25.459781646728516, "global_step": 363708, "epoch": 4382} {"train_loss": -25.914081573486328, "global_step": 363709, "epoch": 4382} {"train_loss": -25.21147918701172, "global_step": 363710, "epoch": 4382} {"train_loss": -25.564632415771484, "global_step": 363711, "epoch": 4382} {"train_loss": -25.937952041625977, "global_step": 363712, "epoch": 4382} {"train_loss": -26.006610870361328, "global_step": 363713, "epoch": 4382} {"train_loss": -25.685144424438477, "global_step": 363714, "epoch": 4382} {"train_loss": -25.85487174987793, "global_step": 363715, "epoch": 4382} {"train_loss": -25.943647384643555, "global_step": 363716, "epoch": 4382} {"train_loss": -25.35633659362793, "global_step": 363717, "epoch": 4382} {"train_loss": -25.999591827392578, "global_step": 363718, "epoch": 4382} {"train_loss": -25.988666534423828, "global_step": 363719, "epoch": 4382} {"train_loss": -25.707502365112305, "global_step": 363720, "epoch": 4382} {"train_loss": -25.673721313476562, "global_step": 363721, "epoch": 4382} {"train_loss": -25.983966827392578, "global_step": 363722, "epoch": 4382} {"train_loss": -25.32195472717285, "global_step": 363723, "epoch": 4382} {"train_loss": -25.7844295501709, "global_step": 363724, "epoch": 4382} {"train_loss": -25.94329833984375, "global_step": 363725, "epoch": 4382} {"train_loss": -25.745092391967773, "global_step": 363726, "epoch": 4382} {"train_loss": -25.770776748657227, "global_step": 363727, "epoch": 4382} {"train_loss": -25.86882972717285, "global_step": 363728, "epoch": 4382} {"train_loss": -26.126943588256836, "global_step": 363729, "epoch": 4382} {"train_loss": -25.966711044311523, "global_step": 363730, "epoch": 4382} {"train_loss": -25.959381103515625, "global_step": 363731, "epoch": 4382} {"train_loss": -26.16609001159668, "global_step": 363732, "epoch": 4382} {"train_loss": -26.434858322143555, "global_step": 363733, "epoch": 4382} {"train_loss": -25.53350067138672, "global_step": 363734, "epoch": 4382} {"train_loss": -26.13027000427246, "global_step": 363735, "epoch": 4382} {"train_loss": -25.86446189880371, "global_step": 363736, "epoch": 4382} {"train_loss": -25.954511642456055, "global_step": 363737, "epoch": 4382} {"train_loss": -25.862518310546875, "global_step": 363738, "epoch": 4382} {"train_loss": -26.16767692565918, "global_step": 363739, "epoch": 4382} {"train_loss": -25.7960147857666, "global_step": 363740, "epoch": 4382} {"train_loss": -26.397558212280273, "global_step": 363741, "epoch": 4382} {"train_loss": -26.551504135131836, "global_step": 363742, "epoch": 4382} {"train_loss": -26.43793296813965, "global_step": 363743, "epoch": 4382} {"train_loss": -26.528242111206055, "global_step": 363744, "epoch": 4382} {"train_loss": -26.08393669128418, "global_step": 363745, "epoch": 4382} {"train_loss": -26.109724044799805, "global_step": 363746, "epoch": 4382} {"train_loss": -26.583951950073242, "global_step": 363747, "epoch": 4382} {"train_loss": -26.446496963500977, "global_step": 363748, "epoch": 4382} {"train_loss": -26.253686904907227, "global_step": 363749, "epoch": 4382} {"train_loss": -26.212324142456055, "global_step": 363750, "epoch": 4382} {"train_loss": -26.606769561767578, "global_step": 363751, "epoch": 4382} {"train_loss": -26.718780517578125, "global_step": 363752, "epoch": 4382} {"train_loss": -26.441137313842773, "global_step": 363753, "epoch": 4382} {"train_loss": -26.500492095947266, "global_step": 363754, "epoch": 4382} {"train_loss": -26.54437828063965, "global_step": 363755, "epoch": 4382} {"train_loss": -26.187957763671875, "global_step": 363756, "epoch": 4382} {"train_loss": -26.234375, "global_step": 363757, "epoch": 4382} {"train_loss": -25.972631454467773, "global_step": 363758, "epoch": 4382} {"train_loss": -26.1138916015625, "global_step": 363759, "epoch": 4382} {"train_loss": -26.720523834228516, "global_step": 363760, "epoch": 4382} {"train_loss": -26.360639572143555, "global_step": 363761, "epoch": 4382} {"train_loss": -25.4804630279541, "global_step": 363762, "epoch": 4382} {"train_loss": -26.019697189331055, "global_step": 363763, "epoch": 4382} {"train_loss": -26.112146377563477, "global_step": 363764, "epoch": 4382} {"train_loss": -26.266271591186523, "global_step": 363765, "epoch": 4382} {"train_loss": -26.439014434814453, "global_step": 363766, "epoch": 4382} {"train_loss": -26.00174331665039, "global_step": 363767, "epoch": 4382} {"train_loss": -26.1535701751709, "global_step": 363768, "epoch": 4382} {"train_loss": -26.517017364501953, "global_step": 363769, "epoch": 4382} {"train_loss": -26.150131225585938, "global_step": 363770, "epoch": 4382} {"train_loss": -26.156524658203125, "global_step": 363771, "epoch": 4382} {"train_loss": -25.92938804626465, "global_step": 363772, "epoch": 4382} {"train_loss": -26.570133209228516, "global_step": 363773, "epoch": 4382} {"train_loss": -26.005170822143555, "global_step": 363774, "epoch": 4382} {"train_loss": -26.397802352905273, "global_step": 363775, "epoch": 4382} {"train_loss": -26.114843368530273, "global_step": 363776, "epoch": 4382} {"train_loss": -26.22075843811035, "global_step": 363777, "epoch": 4382} {"train_loss": -26.2156982421875, "global_step": 363778, "epoch": 4382} {"train_loss": -25.97141456604004, "global_step": 363779, "epoch": 4382} {"train_loss": -26.421829223632812, "global_step": 363780, "epoch": 4382} {"train_loss": -26.022924423217773, "global_step": 363781, "epoch": 4382} {"train_loss": -26.155563354492188, "global_step": 363782, "epoch": 4382} {"train_loss": -26.05106544494629, "global_step": 363783, "epoch": 4382} {"train_loss": -25.7952938079834, "global_step": 363784, "epoch": 4382} {"train_loss": -26.511627197265625, "global_step": 363785, "epoch": 4382} {"train_loss": -26.23137855529785, "global_step": 363786, "epoch": 4382} {"train_loss": -26.194629669189453, "global_step": 363787, "epoch": 4382} {"train_loss": -26.083944803260895, "global_step": 363788, "epoch": 4382, "val_loss": 6618966.0} {"train_loss": -25.820478439331055, "global_step": 363789, "epoch": 4383} {"train_loss": -25.58466339111328, "global_step": 363790, "epoch": 4383} {"train_loss": -25.43012809753418, "global_step": 363791, "epoch": 4383} {"train_loss": -25.292095184326172, "global_step": 363792, "epoch": 4383} {"train_loss": -25.236831665039062, "global_step": 363793, "epoch": 4383} {"train_loss": -25.654077529907227, "global_step": 363794, "epoch": 4383} {"train_loss": -25.830835342407227, "global_step": 363795, "epoch": 4383} {"train_loss": -25.760278701782227, "global_step": 363796, "epoch": 4383} {"train_loss": -25.78204917907715, "global_step": 363797, "epoch": 4383} {"train_loss": -26.163000106811523, "global_step": 363798, "epoch": 4383} {"train_loss": -26.196521759033203, "global_step": 363799, "epoch": 4383} {"train_loss": -25.85556983947754, "global_step": 363800, "epoch": 4383} {"train_loss": -26.148527145385742, "global_step": 363801, "epoch": 4383} {"train_loss": -25.962610244750977, "global_step": 363802, "epoch": 4383} {"train_loss": -25.815237045288086, "global_step": 363803, "epoch": 4383} {"train_loss": -26.397619247436523, "global_step": 363804, "epoch": 4383} {"train_loss": -26.434667587280273, "global_step": 363805, "epoch": 4383} {"train_loss": -25.698877334594727, "global_step": 363806, "epoch": 4383} {"train_loss": -25.890012741088867, "global_step": 363807, "epoch": 4383} {"train_loss": -26.076948165893555, "global_step": 363808, "epoch": 4383} {"train_loss": -26.120153427124023, "global_step": 363809, "epoch": 4383} {"train_loss": -26.0656795501709, "global_step": 363810, "epoch": 4383} {"train_loss": -26.347522735595703, "global_step": 363811, "epoch": 4383} {"train_loss": -26.391448974609375, "global_step": 363812, "epoch": 4383} {"train_loss": -25.728052139282227, "global_step": 363813, "epoch": 4383} {"train_loss": -26.472333908081055, "global_step": 363814, "epoch": 4383} {"train_loss": -26.14235496520996, "global_step": 363815, "epoch": 4383} {"train_loss": -26.263568878173828, "global_step": 363816, "epoch": 4383} {"train_loss": -26.1834774017334, "global_step": 363817, "epoch": 4383} {"train_loss": -26.293676376342773, "global_step": 363818, "epoch": 4383} {"train_loss": -26.061681747436523, "global_step": 363819, "epoch": 4383} {"train_loss": -26.702056884765625, "global_step": 363820, "epoch": 4383} {"train_loss": -26.27335548400879, "global_step": 363821, "epoch": 4383} {"train_loss": -26.182159423828125, "global_step": 363822, "epoch": 4383} {"train_loss": -26.012109756469727, "global_step": 363823, "epoch": 4383} {"train_loss": -26.393491744995117, "global_step": 363824, "epoch": 4383} {"train_loss": -26.676000595092773, "global_step": 363825, "epoch": 4383} {"train_loss": -26.357196807861328, "global_step": 363826, "epoch": 4383} {"train_loss": -26.432416915893555, "global_step": 363827, "epoch": 4383} {"train_loss": -26.87506675720215, "global_step": 363828, "epoch": 4383} {"train_loss": -26.410730361938477, "global_step": 363829, "epoch": 4383} {"train_loss": -26.634246826171875, "global_step": 363830, "epoch": 4383} {"train_loss": -26.39121437072754, "global_step": 363831, "epoch": 4383} {"train_loss": -26.457061767578125, "global_step": 363832, "epoch": 4383} {"train_loss": -26.613086700439453, "global_step": 363833, "epoch": 4383} {"train_loss": -26.47469139099121, "global_step": 363834, "epoch": 4383} {"train_loss": -26.44734764099121, "global_step": 363835, "epoch": 4383} {"train_loss": -26.571979522705078, "global_step": 363836, "epoch": 4383} {"train_loss": -26.522855758666992, "global_step": 363837, "epoch": 4383} {"train_loss": -26.23427391052246, "global_step": 363838, "epoch": 4383} {"train_loss": -26.634037017822266, "global_step": 363839, "epoch": 4383} {"train_loss": -26.242218017578125, "global_step": 363840, "epoch": 4383} {"train_loss": -25.996870040893555, "global_step": 363841, "epoch": 4383} {"train_loss": -25.281579971313477, "global_step": 363842, "epoch": 4383} {"train_loss": -24.71562957763672, "global_step": 363843, "epoch": 4383} {"train_loss": -24.04316520690918, "global_step": 363844, "epoch": 4383} {"train_loss": -25.171733856201172, "global_step": 363845, "epoch": 4383} {"train_loss": -25.678625106811523, "global_step": 363846, "epoch": 4383} {"train_loss": -25.53775978088379, "global_step": 363847, "epoch": 4383} {"train_loss": -25.46741485595703, "global_step": 363848, "epoch": 4383} {"train_loss": -25.793033599853516, "global_step": 363849, "epoch": 4383} {"train_loss": -25.150781631469727, "global_step": 363850, "epoch": 4383} {"train_loss": -26.390979766845703, "global_step": 363851, "epoch": 4383} {"train_loss": -25.29241371154785, "global_step": 363852, "epoch": 4383} {"train_loss": -26.129596710205078, "global_step": 363853, "epoch": 4383} {"train_loss": -25.456153869628906, "global_step": 363854, "epoch": 4383} {"train_loss": -25.86041831970215, "global_step": 363855, "epoch": 4383} {"train_loss": -25.619680404663086, "global_step": 363856, "epoch": 4383} {"train_loss": -25.5748348236084, "global_step": 363857, "epoch": 4383} {"train_loss": -25.592031478881836, "global_step": 363858, "epoch": 4383} {"train_loss": -25.57593536376953, "global_step": 363859, "epoch": 4383} {"train_loss": -26.110151290893555, "global_step": 363860, "epoch": 4383} {"train_loss": -25.963153839111328, "global_step": 363861, "epoch": 4383} {"train_loss": -26.209156036376953, "global_step": 363862, "epoch": 4383} {"train_loss": -25.836471557617188, "global_step": 363863, "epoch": 4383} {"train_loss": -25.82244873046875, "global_step": 363864, "epoch": 4383} {"train_loss": -26.055089950561523, "global_step": 363865, "epoch": 4383} {"train_loss": -26.361602783203125, "global_step": 363866, "epoch": 4383} {"train_loss": -25.8590030670166, "global_step": 363867, "epoch": 4383} {"train_loss": -26.160247802734375, "global_step": 363868, "epoch": 4383} {"train_loss": -25.876026153564453, "global_step": 363869, "epoch": 4383} {"train_loss": -26.249042510986328, "global_step": 363870, "epoch": 4383} {"train_loss": -25.991638666175934, "global_step": 363871, "epoch": 4383, "val_loss": 6640239.0} {"train_loss": -25.734882354736328, "global_step": 363872, "epoch": 4384} {"train_loss": -25.944482803344727, "global_step": 363873, "epoch": 4384} {"train_loss": -25.626358032226562, "global_step": 363874, "epoch": 4384} {"train_loss": -25.9324951171875, "global_step": 363875, "epoch": 4384} {"train_loss": -25.932363510131836, "global_step": 363876, "epoch": 4384} {"train_loss": -25.793079376220703, "global_step": 363877, "epoch": 4384} {"train_loss": -25.876996994018555, "global_step": 363878, "epoch": 4384} {"train_loss": -26.090076446533203, "global_step": 363879, "epoch": 4384} {"train_loss": -25.795358657836914, "global_step": 363880, "epoch": 4384} {"train_loss": -25.95088005065918, "global_step": 363881, "epoch": 4384} {"train_loss": -25.885379791259766, "global_step": 363882, "epoch": 4384} {"train_loss": -25.99226951599121, "global_step": 363883, "epoch": 4384} {"train_loss": -26.298187255859375, "global_step": 363884, "epoch": 4384} {"train_loss": -25.895544052124023, "global_step": 363885, "epoch": 4384} {"train_loss": -26.162038803100586, "global_step": 363886, "epoch": 4384} {"train_loss": -26.27235221862793, "global_step": 363887, "epoch": 4384} {"train_loss": -26.622791290283203, "global_step": 363888, "epoch": 4384} {"train_loss": -26.378538131713867, "global_step": 363889, "epoch": 4384} {"train_loss": -26.28769874572754, "global_step": 363890, "epoch": 4384} {"train_loss": -26.47382926940918, "global_step": 363891, "epoch": 4384} {"train_loss": -26.007450103759766, "global_step": 363892, "epoch": 4384} {"train_loss": -26.306859970092773, "global_step": 363893, "epoch": 4384} {"train_loss": -26.050281524658203, "global_step": 363894, "epoch": 4384} {"train_loss": -26.187591552734375, "global_step": 363895, "epoch": 4384} {"train_loss": -26.667865753173828, "global_step": 363896, "epoch": 4384} {"train_loss": -26.288557052612305, "global_step": 363897, "epoch": 4384} {"train_loss": -26.597503662109375, "global_step": 363898, "epoch": 4384} {"train_loss": -26.59791374206543, "global_step": 363899, "epoch": 4384} {"train_loss": -26.078454971313477, "global_step": 363900, "epoch": 4384} {"train_loss": -26.138071060180664, "global_step": 363901, "epoch": 4384} {"train_loss": -26.651086807250977, "global_step": 363902, "epoch": 4384} {"train_loss": -26.49067497253418, "global_step": 363903, "epoch": 4384} {"train_loss": -26.73969078063965, "global_step": 363904, "epoch": 4384} {"train_loss": -26.035144805908203, "global_step": 363905, "epoch": 4384} {"train_loss": -26.727094650268555, "global_step": 363906, "epoch": 4384} {"train_loss": -26.228002548217773, "global_step": 363907, "epoch": 4384} {"train_loss": -26.181055068969727, "global_step": 363908, "epoch": 4384} {"train_loss": -26.487882614135742, "global_step": 363909, "epoch": 4384} {"train_loss": -26.571699142456055, "global_step": 363910, "epoch": 4384} {"train_loss": -26.509973526000977, "global_step": 363911, "epoch": 4384} {"train_loss": -26.3955078125, "global_step": 363912, "epoch": 4384} {"train_loss": -26.7407169342041, "global_step": 363913, "epoch": 4384} {"train_loss": -26.502643585205078, "global_step": 363914, "epoch": 4384} {"train_loss": -26.71938133239746, "global_step": 363915, "epoch": 4384} {"train_loss": -26.67633628845215, "global_step": 363916, "epoch": 4384} {"train_loss": -26.768537521362305, "global_step": 363917, "epoch": 4384} {"train_loss": -25.959314346313477, "global_step": 363918, "epoch": 4384} {"train_loss": -26.291223526000977, "global_step": 363919, "epoch": 4384} {"train_loss": -26.4018497467041, "global_step": 363920, "epoch": 4384} {"train_loss": -26.66254997253418, "global_step": 363921, "epoch": 4384} {"train_loss": -26.38690185546875, "global_step": 363922, "epoch": 4384} {"train_loss": -26.50956153869629, "global_step": 363923, "epoch": 4384} {"train_loss": -26.570804595947266, "global_step": 363924, "epoch": 4384} {"train_loss": -26.593595504760742, "global_step": 363925, "epoch": 4384} {"train_loss": -26.444555282592773, "global_step": 363926, "epoch": 4384} {"train_loss": -26.390180587768555, "global_step": 363927, "epoch": 4384} {"train_loss": -26.32356071472168, "global_step": 363928, "epoch": 4384} {"train_loss": -25.962018966674805, "global_step": 363929, "epoch": 4384} {"train_loss": -26.014631271362305, "global_step": 363930, "epoch": 4384} {"train_loss": -26.324573516845703, "global_step": 363931, "epoch": 4384} {"train_loss": -26.15289306640625, "global_step": 363932, "epoch": 4384} {"train_loss": -26.25394058227539, "global_step": 363933, "epoch": 4384} {"train_loss": -26.211593627929688, "global_step": 363934, "epoch": 4384} {"train_loss": -25.773487091064453, "global_step": 363935, "epoch": 4384} {"train_loss": -26.503393173217773, "global_step": 363936, "epoch": 4384} {"train_loss": -26.107166290283203, "global_step": 363937, "epoch": 4384} {"train_loss": -26.521549224853516, "global_step": 363938, "epoch": 4384} {"train_loss": -26.19978141784668, "global_step": 363939, "epoch": 4384} {"train_loss": -26.24065589904785, "global_step": 363940, "epoch": 4384} {"train_loss": -26.412328720092773, "global_step": 363941, "epoch": 4384} {"train_loss": -26.579816818237305, "global_step": 363942, "epoch": 4384} {"train_loss": -26.427900314331055, "global_step": 363943, "epoch": 4384} {"train_loss": -26.45538330078125, "global_step": 363944, "epoch": 4384} {"train_loss": -26.698923110961914, "global_step": 363945, "epoch": 4384} {"train_loss": -26.540037155151367, "global_step": 363946, "epoch": 4384} {"train_loss": -26.094762802124023, "global_step": 363947, "epoch": 4384} {"train_loss": -26.068506240844727, "global_step": 363948, "epoch": 4384} {"train_loss": -26.256723403930664, "global_step": 363949, "epoch": 4384} {"train_loss": -26.009613037109375, "global_step": 363950, "epoch": 4384} {"train_loss": -25.815204620361328, "global_step": 363951, "epoch": 4384} {"train_loss": -25.92389488220215, "global_step": 363952, "epoch": 4384} {"train_loss": -25.89661979675293, "global_step": 363953, "epoch": 4384} {"train_loss": -26.29075211214732, "global_step": 363954, "epoch": 4384, "val_loss": 6630092.0} {"train_loss": -23.77496910095215, "global_step": 363955, "epoch": 4385} {"train_loss": -24.746631622314453, "global_step": 363956, "epoch": 4385} {"train_loss": -24.745908737182617, "global_step": 363957, "epoch": 4385} {"train_loss": -25.137365341186523, "global_step": 363958, "epoch": 4385} {"train_loss": -24.604206085205078, "global_step": 363959, "epoch": 4385} {"train_loss": -25.171310424804688, "global_step": 363960, "epoch": 4385} {"train_loss": -24.370439529418945, "global_step": 363961, "epoch": 4385} {"train_loss": -25.00873374938965, "global_step": 363962, "epoch": 4385} {"train_loss": -25.420272827148438, "global_step": 363963, "epoch": 4385} {"train_loss": -24.6200008392334, "global_step": 363964, "epoch": 4385} {"train_loss": -25.38541603088379, "global_step": 363965, "epoch": 4385} {"train_loss": -25.611860275268555, "global_step": 363966, "epoch": 4385} {"train_loss": -25.181381225585938, "global_step": 363967, "epoch": 4385} {"train_loss": -25.832473754882812, "global_step": 363968, "epoch": 4385} {"train_loss": -25.898717880249023, "global_step": 363969, "epoch": 4385} {"train_loss": -25.521141052246094, "global_step": 363970, "epoch": 4385} {"train_loss": -25.649200439453125, "global_step": 363971, "epoch": 4385} {"train_loss": -25.84564208984375, "global_step": 363972, "epoch": 4385} {"train_loss": -25.67939567565918, "global_step": 363973, "epoch": 4385} {"train_loss": -25.934045791625977, "global_step": 363974, "epoch": 4385} {"train_loss": -25.80942153930664, "global_step": 363975, "epoch": 4385} {"train_loss": -25.6798038482666, "global_step": 363976, "epoch": 4385} {"train_loss": -25.626020431518555, "global_step": 363977, "epoch": 4385} {"train_loss": -26.089765548706055, "global_step": 363978, "epoch": 4385} {"train_loss": -25.8851375579834, "global_step": 363979, "epoch": 4385} {"train_loss": -25.91471290588379, "global_step": 363980, "epoch": 4385} {"train_loss": -26.059873580932617, "global_step": 363981, "epoch": 4385} {"train_loss": -25.881067276000977, "global_step": 363982, "epoch": 4385} {"train_loss": -26.28838539123535, "global_step": 363983, "epoch": 4385} {"train_loss": -26.296283721923828, "global_step": 363984, "epoch": 4385} {"train_loss": -26.375473022460938, "global_step": 363985, "epoch": 4385} {"train_loss": -26.164648056030273, "global_step": 363986, "epoch": 4385} {"train_loss": -26.2277889251709, "global_step": 363987, "epoch": 4385} {"train_loss": -26.1076717376709, "global_step": 363988, "epoch": 4385} {"train_loss": -26.28622817993164, "global_step": 363989, "epoch": 4385} {"train_loss": -26.195871353149414, "global_step": 363990, "epoch": 4385} {"train_loss": -25.90724754333496, "global_step": 363991, "epoch": 4385} {"train_loss": -26.353668212890625, "global_step": 363992, "epoch": 4385} {"train_loss": -26.048110961914062, "global_step": 363993, "epoch": 4385} {"train_loss": -26.426284790039062, "global_step": 363994, "epoch": 4385} {"train_loss": -26.216785430908203, "global_step": 363995, "epoch": 4385} {"train_loss": -26.316314697265625, "global_step": 363996, "epoch": 4385} {"train_loss": -26.298215866088867, "global_step": 363997, "epoch": 4385} {"train_loss": -26.2148494720459, "global_step": 363998, "epoch": 4385} {"train_loss": -26.93617820739746, "global_step": 363999, "epoch": 4385} {"train_loss": -26.534931182861328, "global_step": 364000, "epoch": 4385} {"train_loss": -26.369461059570312, "global_step": 364001, "epoch": 4385} {"train_loss": -26.04904556274414, "global_step": 364002, "epoch": 4385} {"train_loss": -26.14883804321289, "global_step": 364003, "epoch": 4385} {"train_loss": -26.184335708618164, "global_step": 364004, "epoch": 4385} {"train_loss": -26.340805053710938, "global_step": 364005, "epoch": 4385} {"train_loss": -26.212671279907227, "global_step": 364006, "epoch": 4385} {"train_loss": -26.173358917236328, "global_step": 364007, "epoch": 4385} {"train_loss": -25.92791748046875, "global_step": 364008, "epoch": 4385} {"train_loss": -26.09327507019043, "global_step": 364009, "epoch": 4385} {"train_loss": -26.00636100769043, "global_step": 364010, "epoch": 4385} {"train_loss": -26.158130645751953, "global_step": 364011, "epoch": 4385} {"train_loss": -26.337491989135742, "global_step": 364012, "epoch": 4385} {"train_loss": -26.245569229125977, "global_step": 364013, "epoch": 4385} {"train_loss": -26.090503692626953, "global_step": 364014, "epoch": 4385} {"train_loss": -26.48829460144043, "global_step": 364015, "epoch": 4385} {"train_loss": -26.524799346923828, "global_step": 364016, "epoch": 4385} {"train_loss": -26.233213424682617, "global_step": 364017, "epoch": 4385} {"train_loss": -26.7928524017334, "global_step": 364018, "epoch": 4385} {"train_loss": -26.5826416015625, "global_step": 364019, "epoch": 4385} {"train_loss": -26.552032470703125, "global_step": 364020, "epoch": 4385} {"train_loss": -26.427322387695312, "global_step": 364021, "epoch": 4385} {"train_loss": -26.39423942565918, "global_step": 364022, "epoch": 4385} {"train_loss": -26.35589599609375, "global_step": 364023, "epoch": 4385} {"train_loss": -26.8521728515625, "global_step": 364024, "epoch": 4385} {"train_loss": -26.42640495300293, "global_step": 364025, "epoch": 4385} {"train_loss": -26.65175437927246, "global_step": 364026, "epoch": 4385} {"train_loss": -26.485509872436523, "global_step": 364027, "epoch": 4385} {"train_loss": -26.306344985961914, "global_step": 364028, "epoch": 4385} {"train_loss": -26.596099853515625, "global_step": 364029, "epoch": 4385} {"train_loss": -26.519271850585938, "global_step": 364030, "epoch": 4385} {"train_loss": -26.806875228881836, "global_step": 364031, "epoch": 4385} {"train_loss": -26.40741539001465, "global_step": 364032, "epoch": 4385} {"train_loss": -26.254104614257812, "global_step": 364033, "epoch": 4385} {"train_loss": -26.504180908203125, "global_step": 364034, "epoch": 4385} {"train_loss": -26.468948364257812, "global_step": 364035, "epoch": 4385} {"train_loss": -26.741199493408203, "global_step": 364036, "epoch": 4385} {"train_loss": -26.02148706367217, "global_step": 364037, "epoch": 4385, "val_loss": 6577779.0} {"train_loss": -26.0987548828125, "global_step": 364038, "epoch": 4386} {"train_loss": -25.905858993530273, "global_step": 364039, "epoch": 4386} {"train_loss": -25.402864456176758, "global_step": 364040, "epoch": 4386} {"train_loss": -26.156982421875, "global_step": 364041, "epoch": 4386} {"train_loss": -26.275754928588867, "global_step": 364042, "epoch": 4386} {"train_loss": -26.23567771911621, "global_step": 364043, "epoch": 4386} {"train_loss": -25.8017520904541, "global_step": 364044, "epoch": 4386} {"train_loss": -25.877471923828125, "global_step": 364045, "epoch": 4386} {"train_loss": -25.966150283813477, "global_step": 364046, "epoch": 4386} {"train_loss": -26.24367332458496, "global_step": 364047, "epoch": 4386} {"train_loss": -25.87507438659668, "global_step": 364048, "epoch": 4386} {"train_loss": -25.713825225830078, "global_step": 364049, "epoch": 4386} {"train_loss": -26.049701690673828, "global_step": 364050, "epoch": 4386} {"train_loss": -26.436614990234375, "global_step": 364051, "epoch": 4386} {"train_loss": -25.856943130493164, "global_step": 364052, "epoch": 4386} {"train_loss": -26.22675895690918, "global_step": 364053, "epoch": 4386} {"train_loss": -26.212223052978516, "global_step": 364054, "epoch": 4386} {"train_loss": -26.14737319946289, "global_step": 364055, "epoch": 4386} {"train_loss": -25.881025314331055, "global_step": 364056, "epoch": 4386} {"train_loss": -25.572973251342773, "global_step": 364057, "epoch": 4386} {"train_loss": -26.235746383666992, "global_step": 364058, "epoch": 4386} {"train_loss": -26.135177612304688, "global_step": 364059, "epoch": 4386} {"train_loss": -26.23581314086914, "global_step": 364060, "epoch": 4386} {"train_loss": -26.24823570251465, "global_step": 364061, "epoch": 4386} {"train_loss": -26.258106231689453, "global_step": 364062, "epoch": 4386} {"train_loss": -25.990976333618164, "global_step": 364063, "epoch": 4386} {"train_loss": -26.30596923828125, "global_step": 364064, "epoch": 4386} {"train_loss": -26.4990291595459, "global_step": 364065, "epoch": 4386} {"train_loss": -26.507678985595703, "global_step": 364066, "epoch": 4386} {"train_loss": -26.65626335144043, "global_step": 364067, "epoch": 4386} {"train_loss": -26.699726104736328, "global_step": 364068, "epoch": 4386} {"train_loss": -26.122879028320312, "global_step": 364069, "epoch": 4386} {"train_loss": -25.981998443603516, "global_step": 364070, "epoch": 4386} {"train_loss": -26.65473747253418, "global_step": 364071, "epoch": 4386} {"train_loss": -26.064682006835938, "global_step": 364072, "epoch": 4386} {"train_loss": -26.555402755737305, "global_step": 364073, "epoch": 4386} {"train_loss": -25.875951766967773, "global_step": 364074, "epoch": 4386} {"train_loss": -26.474287033081055, "global_step": 364075, "epoch": 4386} {"train_loss": -26.536243438720703, "global_step": 364076, "epoch": 4386} {"train_loss": -26.16607093811035, "global_step": 364077, "epoch": 4386} {"train_loss": -26.27577018737793, "global_step": 364078, "epoch": 4386} {"train_loss": -26.301300048828125, "global_step": 364079, "epoch": 4386} {"train_loss": -26.052717208862305, "global_step": 364080, "epoch": 4386} {"train_loss": -26.52521324157715, "global_step": 364081, "epoch": 4386} {"train_loss": -26.359161376953125, "global_step": 364082, "epoch": 4386} {"train_loss": -26.193958282470703, "global_step": 364083, "epoch": 4386} {"train_loss": -26.111494064331055, "global_step": 364084, "epoch": 4386} {"train_loss": -26.22763442993164, "global_step": 364085, "epoch": 4386} {"train_loss": -26.182886123657227, "global_step": 364086, "epoch": 4386} {"train_loss": -26.758747100830078, "global_step": 364087, "epoch": 4386} {"train_loss": -26.63302993774414, "global_step": 364088, "epoch": 4386} {"train_loss": -26.651611328125, "global_step": 364089, "epoch": 4386} {"train_loss": -26.214385986328125, "global_step": 364090, "epoch": 4386} {"train_loss": -26.601612091064453, "global_step": 364091, "epoch": 4386} {"train_loss": -26.209741592407227, "global_step": 364092, "epoch": 4386} {"train_loss": -26.501102447509766, "global_step": 364093, "epoch": 4386} {"train_loss": -26.601669311523438, "global_step": 364094, "epoch": 4386} {"train_loss": -26.18353271484375, "global_step": 364095, "epoch": 4386} {"train_loss": -26.257694244384766, "global_step": 364096, "epoch": 4386} {"train_loss": -26.56545066833496, "global_step": 364097, "epoch": 4386} {"train_loss": -26.740819931030273, "global_step": 364098, "epoch": 4386} {"train_loss": -26.26987648010254, "global_step": 364099, "epoch": 4386} {"train_loss": -26.065893173217773, "global_step": 364100, "epoch": 4386} {"train_loss": -26.331119537353516, "global_step": 364101, "epoch": 4386} {"train_loss": -26.077539443969727, "global_step": 364102, "epoch": 4386} {"train_loss": -25.857999801635742, "global_step": 364103, "epoch": 4386} {"train_loss": -26.023340225219727, "global_step": 364104, "epoch": 4386} {"train_loss": -25.920516967773438, "global_step": 364105, "epoch": 4386} {"train_loss": -25.970874786376953, "global_step": 364106, "epoch": 4386} {"train_loss": -26.439733505249023, "global_step": 364107, "epoch": 4386} {"train_loss": -26.199512481689453, "global_step": 364108, "epoch": 4386} {"train_loss": -26.21097183227539, "global_step": 364109, "epoch": 4386} {"train_loss": -26.469350814819336, "global_step": 364110, "epoch": 4386} {"train_loss": -25.992048263549805, "global_step": 364111, "epoch": 4386} {"train_loss": -26.399911880493164, "global_step": 364112, "epoch": 4386} {"train_loss": -26.45241355895996, "global_step": 364113, "epoch": 4386} {"train_loss": -26.47077751159668, "global_step": 364114, "epoch": 4386} {"train_loss": -26.40530776977539, "global_step": 364115, "epoch": 4386} {"train_loss": -26.17109489440918, "global_step": 364116, "epoch": 4386} {"train_loss": -26.1716251373291, "global_step": 364117, "epoch": 4386} {"train_loss": -26.177526473999023, "global_step": 364118, "epoch": 4386} {"train_loss": -26.313329696655273, "global_step": 364119, "epoch": 4386} {"train_loss": -26.23783435591732, "global_step": 364120, "epoch": 4386, "val_loss": 6587039.0} {"train_loss": -24.98738670349121, "global_step": 364121, "epoch": 4387} {"train_loss": -25.64458656311035, "global_step": 364122, "epoch": 4387} {"train_loss": -25.161048889160156, "global_step": 364123, "epoch": 4387} {"train_loss": -25.128129959106445, "global_step": 364124, "epoch": 4387} {"train_loss": -25.224096298217773, "global_step": 364125, "epoch": 4387} {"train_loss": -25.40239906311035, "global_step": 364126, "epoch": 4387} {"train_loss": -25.483142852783203, "global_step": 364127, "epoch": 4387} {"train_loss": -25.8244686126709, "global_step": 364128, "epoch": 4387} {"train_loss": -25.569759368896484, "global_step": 364129, "epoch": 4387} {"train_loss": -25.38209342956543, "global_step": 364130, "epoch": 4387} {"train_loss": -25.80328941345215, "global_step": 364131, "epoch": 4387} {"train_loss": -25.679981231689453, "global_step": 364132, "epoch": 4387} {"train_loss": -25.8918514251709, "global_step": 364133, "epoch": 4387} {"train_loss": -25.759931564331055, "global_step": 364134, "epoch": 4387} {"train_loss": -25.763212203979492, "global_step": 364135, "epoch": 4387} {"train_loss": -25.9385986328125, "global_step": 364136, "epoch": 4387} {"train_loss": -25.933151245117188, "global_step": 364137, "epoch": 4387} {"train_loss": -25.731306076049805, "global_step": 364138, "epoch": 4387} {"train_loss": -26.020889282226562, "global_step": 364139, "epoch": 4387} {"train_loss": -26.31418800354004, "global_step": 364140, "epoch": 4387} {"train_loss": -25.85761070251465, "global_step": 364141, "epoch": 4387} {"train_loss": -25.96921730041504, "global_step": 364142, "epoch": 4387} {"train_loss": -26.137451171875, "global_step": 364143, "epoch": 4387} {"train_loss": -26.5716495513916, "global_step": 364144, "epoch": 4387} {"train_loss": -26.29204750061035, "global_step": 364145, "epoch": 4387} {"train_loss": -26.189117431640625, "global_step": 364146, "epoch": 4387} {"train_loss": -26.47071647644043, "global_step": 364147, "epoch": 4387} {"train_loss": -26.007389068603516, "global_step": 364148, "epoch": 4387} {"train_loss": -26.3575496673584, "global_step": 364149, "epoch": 4387} {"train_loss": -26.065902709960938, "global_step": 364150, "epoch": 4387} {"train_loss": -25.985837936401367, "global_step": 364151, "epoch": 4387} {"train_loss": -26.211912155151367, "global_step": 364152, "epoch": 4387} {"train_loss": -26.16583251953125, "global_step": 364153, "epoch": 4387} {"train_loss": -26.250473022460938, "global_step": 364154, "epoch": 4387} {"train_loss": -25.888166427612305, "global_step": 364155, "epoch": 4387} {"train_loss": -26.577661514282227, "global_step": 364156, "epoch": 4387} {"train_loss": -26.431360244750977, "global_step": 364157, "epoch": 4387} {"train_loss": -26.270008087158203, "global_step": 364158, "epoch": 4387} {"train_loss": -26.68720817565918, "global_step": 364159, "epoch": 4387} {"train_loss": -26.749948501586914, "global_step": 364160, "epoch": 4387} {"train_loss": -25.9565372467041, "global_step": 364161, "epoch": 4387} {"train_loss": -26.239501953125, "global_step": 364162, "epoch": 4387} {"train_loss": -26.194198608398438, "global_step": 364163, "epoch": 4387} {"train_loss": -26.5700740814209, "global_step": 364164, "epoch": 4387} {"train_loss": -26.124975204467773, "global_step": 364165, "epoch": 4387} {"train_loss": -26.40151023864746, "global_step": 364166, "epoch": 4387} {"train_loss": -26.2657413482666, "global_step": 364167, "epoch": 4387} {"train_loss": -25.761938095092773, "global_step": 364168, "epoch": 4387} {"train_loss": -26.390533447265625, "global_step": 364169, "epoch": 4387} {"train_loss": -26.19647789001465, "global_step": 364170, "epoch": 4387} {"train_loss": -25.72028923034668, "global_step": 364171, "epoch": 4387} {"train_loss": -26.080524444580078, "global_step": 364172, "epoch": 4387} {"train_loss": -25.936315536499023, "global_step": 364173, "epoch": 4387} {"train_loss": -26.34818458557129, "global_step": 364174, "epoch": 4387} {"train_loss": -26.357542037963867, "global_step": 364175, "epoch": 4387} {"train_loss": -25.59067726135254, "global_step": 364176, "epoch": 4387} {"train_loss": -26.349340438842773, "global_step": 364177, "epoch": 4387} {"train_loss": -26.298215866088867, "global_step": 364178, "epoch": 4387} {"train_loss": -25.874948501586914, "global_step": 364179, "epoch": 4387} {"train_loss": -26.060598373413086, "global_step": 364180, "epoch": 4387} {"train_loss": -26.193042755126953, "global_step": 364181, "epoch": 4387} {"train_loss": -26.3291015625, "global_step": 364182, "epoch": 4387} {"train_loss": -26.167036056518555, "global_step": 364183, "epoch": 4387} {"train_loss": -26.12042808532715, "global_step": 364184, "epoch": 4387} {"train_loss": -26.34820556640625, "global_step": 364185, "epoch": 4387} {"train_loss": -25.785480499267578, "global_step": 364186, "epoch": 4387} {"train_loss": -26.28415298461914, "global_step": 364187, "epoch": 4387} {"train_loss": -26.568464279174805, "global_step": 364188, "epoch": 4387} {"train_loss": -26.22084617614746, "global_step": 364189, "epoch": 4387} {"train_loss": -26.593008041381836, "global_step": 364190, "epoch": 4387} {"train_loss": -26.384851455688477, "global_step": 364191, "epoch": 4387} {"train_loss": -26.250137329101562, "global_step": 364192, "epoch": 4387} {"train_loss": -26.22865104675293, "global_step": 364193, "epoch": 4387} {"train_loss": -26.47852897644043, "global_step": 364194, "epoch": 4387} {"train_loss": -26.2686767578125, "global_step": 364195, "epoch": 4387} {"train_loss": -26.380264282226562, "global_step": 364196, "epoch": 4387} {"train_loss": -26.3699893951416, "global_step": 364197, "epoch": 4387} {"train_loss": -26.213531494140625, "global_step": 364198, "epoch": 4387} {"train_loss": -26.7066650390625, "global_step": 364199, "epoch": 4387} {"train_loss": -26.2668399810791, "global_step": 364200, "epoch": 4387} {"train_loss": -26.42816734313965, "global_step": 364201, "epoch": 4387} {"train_loss": -26.36419105529785, "global_step": 364202, "epoch": 4387} {"train_loss": -26.093613750963325, "global_step": 364203, "epoch": 4387, "val_loss": 6639104.5} {"train_loss": -25.554344177246094, "global_step": 364204, "epoch": 4388} {"train_loss": -25.537109375, "global_step": 364205, "epoch": 4388} {"train_loss": -26.058624267578125, "global_step": 364206, "epoch": 4388} {"train_loss": -25.933975219726562, "global_step": 364207, "epoch": 4388} {"train_loss": -26.319812774658203, "global_step": 364208, "epoch": 4388} {"train_loss": -26.398151397705078, "global_step": 364209, "epoch": 4388} {"train_loss": -25.882749557495117, "global_step": 364210, "epoch": 4388} {"train_loss": -26.13648796081543, "global_step": 364211, "epoch": 4388} {"train_loss": -26.327604293823242, "global_step": 364212, "epoch": 4388} {"train_loss": -26.1042423248291, "global_step": 364213, "epoch": 4388} {"train_loss": -26.099218368530273, "global_step": 364214, "epoch": 4388} {"train_loss": -26.214303970336914, "global_step": 364215, "epoch": 4388} {"train_loss": -26.346853256225586, "global_step": 364216, "epoch": 4388} {"train_loss": -26.25210952758789, "global_step": 364217, "epoch": 4388} {"train_loss": -26.12506675720215, "global_step": 364218, "epoch": 4388} {"train_loss": -26.48469352722168, "global_step": 364219, "epoch": 4388} {"train_loss": -26.299591064453125, "global_step": 364220, "epoch": 4388} {"train_loss": -26.158782958984375, "global_step": 364221, "epoch": 4388} {"train_loss": -26.210880279541016, "global_step": 364222, "epoch": 4388} {"train_loss": -25.885725021362305, "global_step": 364223, "epoch": 4388} {"train_loss": -25.853811264038086, "global_step": 364224, "epoch": 4388} {"train_loss": -26.623022079467773, "global_step": 364225, "epoch": 4388} {"train_loss": -26.353525161743164, "global_step": 364226, "epoch": 4388} {"train_loss": -25.897470474243164, "global_step": 364227, "epoch": 4388} {"train_loss": -26.19536781311035, "global_step": 364228, "epoch": 4388} {"train_loss": -26.243316650390625, "global_step": 364229, "epoch": 4388} {"train_loss": -25.951147079467773, "global_step": 364230, "epoch": 4388} {"train_loss": -26.176660537719727, "global_step": 364231, "epoch": 4388} {"train_loss": -26.08375358581543, "global_step": 364232, "epoch": 4388} {"train_loss": -26.102468490600586, "global_step": 364233, "epoch": 4388} {"train_loss": -26.077619552612305, "global_step": 364234, "epoch": 4388} {"train_loss": -26.371490478515625, "global_step": 364235, "epoch": 4388} {"train_loss": -26.258621215820312, "global_step": 364236, "epoch": 4388} {"train_loss": -26.237287521362305, "global_step": 364237, "epoch": 4388} {"train_loss": -26.13594627380371, "global_step": 364238, "epoch": 4388} {"train_loss": -26.384824752807617, "global_step": 364239, "epoch": 4388} {"train_loss": -26.738330841064453, "global_step": 364240, "epoch": 4388} {"train_loss": -26.523853302001953, "global_step": 364241, "epoch": 4388} {"train_loss": -26.618228912353516, "global_step": 364242, "epoch": 4388} {"train_loss": -26.798303604125977, "global_step": 364243, "epoch": 4388} {"train_loss": -26.723785400390625, "global_step": 364244, "epoch": 4388} {"train_loss": -26.377124786376953, "global_step": 364245, "epoch": 4388} {"train_loss": -25.907440185546875, "global_step": 364246, "epoch": 4388} {"train_loss": -27.117938995361328, "global_step": 364247, "epoch": 4388} {"train_loss": -26.456897735595703, "global_step": 364248, "epoch": 4388} {"train_loss": -26.591205596923828, "global_step": 364249, "epoch": 4388} {"train_loss": -26.58823013305664, "global_step": 364250, "epoch": 4388} {"train_loss": -26.036252975463867, "global_step": 364251, "epoch": 4388} {"train_loss": -26.090351104736328, "global_step": 364252, "epoch": 4388} {"train_loss": -25.918716430664062, "global_step": 364253, "epoch": 4388} {"train_loss": -26.184167861938477, "global_step": 364254, "epoch": 4388} {"train_loss": -25.817169189453125, "global_step": 364255, "epoch": 4388} {"train_loss": -25.91790199279785, "global_step": 364256, "epoch": 4388} {"train_loss": -26.346603393554688, "global_step": 364257, "epoch": 4388} {"train_loss": -26.07305335998535, "global_step": 364258, "epoch": 4388} {"train_loss": -26.33469009399414, "global_step": 364259, "epoch": 4388} {"train_loss": -26.370508193969727, "global_step": 364260, "epoch": 4388} {"train_loss": -26.372095108032227, "global_step": 364261, "epoch": 4388} {"train_loss": -26.33209800720215, "global_step": 364262, "epoch": 4388} {"train_loss": -26.057453155517578, "global_step": 364263, "epoch": 4388} {"train_loss": -26.389209747314453, "global_step": 364264, "epoch": 4388} {"train_loss": -26.350494384765625, "global_step": 364265, "epoch": 4388} {"train_loss": -26.159204483032227, "global_step": 364266, "epoch": 4388} {"train_loss": -26.220996856689453, "global_step": 364267, "epoch": 4388} {"train_loss": -26.2141056060791, "global_step": 364268, "epoch": 4388} {"train_loss": -26.436887741088867, "global_step": 364269, "epoch": 4388} {"train_loss": -26.613101959228516, "global_step": 364270, "epoch": 4388} {"train_loss": -26.360260009765625, "global_step": 364271, "epoch": 4388} {"train_loss": -26.343250274658203, "global_step": 364272, "epoch": 4388} {"train_loss": -26.332962036132812, "global_step": 364273, "epoch": 4388} {"train_loss": -25.955204010009766, "global_step": 364274, "epoch": 4388} {"train_loss": -26.063756942749023, "global_step": 364275, "epoch": 4388} {"train_loss": -26.20198631286621, "global_step": 364276, "epoch": 4388} {"train_loss": -26.352949142456055, "global_step": 364277, "epoch": 4388} {"train_loss": -26.603124618530273, "global_step": 364278, "epoch": 4388} {"train_loss": -26.321502685546875, "global_step": 364279, "epoch": 4388} {"train_loss": -26.41529655456543, "global_step": 364280, "epoch": 4388} {"train_loss": -26.6743221282959, "global_step": 364281, "epoch": 4388} {"train_loss": -26.222692489624023, "global_step": 364282, "epoch": 4388} {"train_loss": -25.809507369995117, "global_step": 364283, "epoch": 4388} {"train_loss": -25.876691818237305, "global_step": 364284, "epoch": 4388} {"train_loss": -26.199777603149414, "global_step": 364285, "epoch": 4388} {"train_loss": -26.247183581432665, "global_step": 364286, "epoch": 4388, "val_loss": 6601940.5} {"train_loss": -25.566144943237305, "global_step": 364287, "epoch": 4389} {"train_loss": -25.224512100219727, "global_step": 364288, "epoch": 4389} {"train_loss": -25.387136459350586, "global_step": 364289, "epoch": 4389} {"train_loss": -25.943119049072266, "global_step": 364290, "epoch": 4389} {"train_loss": -25.653289794921875, "global_step": 364291, "epoch": 4389} {"train_loss": -25.38962745666504, "global_step": 364292, "epoch": 4389} {"train_loss": -25.77139663696289, "global_step": 364293, "epoch": 4389} {"train_loss": -26.060504913330078, "global_step": 364294, "epoch": 4389} {"train_loss": -25.99814224243164, "global_step": 364295, "epoch": 4389} {"train_loss": -26.20844078063965, "global_step": 364296, "epoch": 4389} {"train_loss": -26.001684188842773, "global_step": 364297, "epoch": 4389} {"train_loss": -25.941574096679688, "global_step": 364298, "epoch": 4389} {"train_loss": -26.190113067626953, "global_step": 364299, "epoch": 4389} {"train_loss": -26.046533584594727, "global_step": 364300, "epoch": 4389} {"train_loss": -26.176206588745117, "global_step": 364301, "epoch": 4389} {"train_loss": -26.408981323242188, "global_step": 364302, "epoch": 4389} {"train_loss": -25.958097457885742, "global_step": 364303, "epoch": 4389} {"train_loss": -26.09553337097168, "global_step": 364304, "epoch": 4389} {"train_loss": -26.143457412719727, "global_step": 364305, "epoch": 4389} {"train_loss": -26.25661277770996, "global_step": 364306, "epoch": 4389} {"train_loss": -26.23064613342285, "global_step": 364307, "epoch": 4389} {"train_loss": -26.23598289489746, "global_step": 364308, "epoch": 4389} {"train_loss": -26.030126571655273, "global_step": 364309, "epoch": 4389} {"train_loss": -26.3759765625, "global_step": 364310, "epoch": 4389} {"train_loss": -26.09814453125, "global_step": 364311, "epoch": 4389} {"train_loss": -26.14967155456543, "global_step": 364312, "epoch": 4389} {"train_loss": -26.7265682220459, "global_step": 364313, "epoch": 4389} {"train_loss": -26.486494064331055, "global_step": 364314, "epoch": 4389} {"train_loss": -26.385242462158203, "global_step": 364315, "epoch": 4389} {"train_loss": -25.95479393005371, "global_step": 364316, "epoch": 4389} {"train_loss": -26.3077392578125, "global_step": 364317, "epoch": 4389} {"train_loss": -26.54375648498535, "global_step": 364318, "epoch": 4389} {"train_loss": -26.328367233276367, "global_step": 364319, "epoch": 4389} {"train_loss": -26.484821319580078, "global_step": 364320, "epoch": 4389} {"train_loss": -26.102115631103516, "global_step": 364321, "epoch": 4389} {"train_loss": -26.357969284057617, "global_step": 364322, "epoch": 4389} {"train_loss": -26.27197265625, "global_step": 364323, "epoch": 4389} {"train_loss": -26.5750789642334, "global_step": 364324, "epoch": 4389} {"train_loss": -26.401382446289062, "global_step": 364325, "epoch": 4389} {"train_loss": -26.484899520874023, "global_step": 364326, "epoch": 4389} {"train_loss": -26.608335494995117, "global_step": 364327, "epoch": 4389} {"train_loss": -26.67449951171875, "global_step": 364328, "epoch": 4389} {"train_loss": -26.38356590270996, "global_step": 364329, "epoch": 4389} {"train_loss": -25.91547966003418, "global_step": 364330, "epoch": 4389} {"train_loss": -25.99234390258789, "global_step": 364331, "epoch": 4389} {"train_loss": -26.802473068237305, "global_step": 364332, "epoch": 4389} {"train_loss": -26.31509780883789, "global_step": 364333, "epoch": 4389} {"train_loss": -26.526853561401367, "global_step": 364334, "epoch": 4389} {"train_loss": -26.049442291259766, "global_step": 364335, "epoch": 4389} {"train_loss": -26.35951805114746, "global_step": 364336, "epoch": 4389} {"train_loss": -26.410083770751953, "global_step": 364337, "epoch": 4389} {"train_loss": -25.7076358795166, "global_step": 364338, "epoch": 4389} {"train_loss": -26.23628807067871, "global_step": 364339, "epoch": 4389} {"train_loss": -26.49116325378418, "global_step": 364340, "epoch": 4389} {"train_loss": -26.1450138092041, "global_step": 364341, "epoch": 4389} {"train_loss": -26.40553855895996, "global_step": 364342, "epoch": 4389} {"train_loss": -26.19089698791504, "global_step": 364343, "epoch": 4389} {"train_loss": -26.286935806274414, "global_step": 364344, "epoch": 4389} {"train_loss": -26.402746200561523, "global_step": 364345, "epoch": 4389} {"train_loss": -26.48274040222168, "global_step": 364346, "epoch": 4389} {"train_loss": -26.190643310546875, "global_step": 364347, "epoch": 4389} {"train_loss": -26.208404541015625, "global_step": 364348, "epoch": 4389} {"train_loss": -26.307111740112305, "global_step": 364349, "epoch": 4389} {"train_loss": -25.856481552124023, "global_step": 364350, "epoch": 4389} {"train_loss": -26.338275909423828, "global_step": 364351, "epoch": 4389} {"train_loss": -25.910491943359375, "global_step": 364352, "epoch": 4389} {"train_loss": -26.568647384643555, "global_step": 364353, "epoch": 4389} {"train_loss": -26.2779483795166, "global_step": 364354, "epoch": 4389} {"train_loss": -26.108327865600586, "global_step": 364355, "epoch": 4389} {"train_loss": -26.2692928314209, "global_step": 364356, "epoch": 4389} {"train_loss": -26.263696670532227, "global_step": 364357, "epoch": 4389} {"train_loss": -26.200162887573242, "global_step": 364358, "epoch": 4389} {"train_loss": -26.1708984375, "global_step": 364359, "epoch": 4389} {"train_loss": -26.118146896362305, "global_step": 364360, "epoch": 4389} {"train_loss": -26.411157608032227, "global_step": 364361, "epoch": 4389} {"train_loss": -25.76029396057129, "global_step": 364362, "epoch": 4389} {"train_loss": -25.879194259643555, "global_step": 364363, "epoch": 4389} {"train_loss": -26.28626823425293, "global_step": 364364, "epoch": 4389} {"train_loss": -26.022485733032227, "global_step": 364365, "epoch": 4389} {"train_loss": -26.487716674804688, "global_step": 364366, "epoch": 4389} {"train_loss": -26.192657470703125, "global_step": 364367, "epoch": 4389} {"train_loss": -25.891143798828125, "global_step": 364368, "epoch": 4389} {"train_loss": -26.157291596194348, "global_step": 364369, "epoch": 4389, "val_loss": 6556373.0} {"train_loss": -25.9429874420166, "global_step": 364370, "epoch": 4390} {"train_loss": -25.699167251586914, "global_step": 364371, "epoch": 4390} {"train_loss": -25.553861618041992, "global_step": 364372, "epoch": 4390} {"train_loss": -25.253637313842773, "global_step": 364373, "epoch": 4390} {"train_loss": -25.755823135375977, "global_step": 364374, "epoch": 4390} {"train_loss": -25.81693458557129, "global_step": 364375, "epoch": 4390} {"train_loss": -25.90028953552246, "global_step": 364376, "epoch": 4390} {"train_loss": -26.275257110595703, "global_step": 364377, "epoch": 4390} {"train_loss": -26.637964248657227, "global_step": 364378, "epoch": 4390} {"train_loss": -26.280527114868164, "global_step": 364379, "epoch": 4390} {"train_loss": -25.844945907592773, "global_step": 364380, "epoch": 4390} {"train_loss": -26.077951431274414, "global_step": 364381, "epoch": 4390} {"train_loss": -25.922407150268555, "global_step": 364382, "epoch": 4390} {"train_loss": -26.1075382232666, "global_step": 364383, "epoch": 4390} {"train_loss": -25.75538444519043, "global_step": 364384, "epoch": 4390} {"train_loss": -25.953439712524414, "global_step": 364385, "epoch": 4390} {"train_loss": -26.2053165435791, "global_step": 364386, "epoch": 4390} {"train_loss": -26.270978927612305, "global_step": 364387, "epoch": 4390} {"train_loss": -26.348012924194336, "global_step": 364388, "epoch": 4390} {"train_loss": -26.35281753540039, "global_step": 364389, "epoch": 4390} {"train_loss": -26.042587280273438, "global_step": 364390, "epoch": 4390} {"train_loss": -26.070722579956055, "global_step": 364391, "epoch": 4390} {"train_loss": -26.372159957885742, "global_step": 364392, "epoch": 4390} {"train_loss": -26.147876739501953, "global_step": 364393, "epoch": 4390} {"train_loss": -26.46388053894043, "global_step": 364394, "epoch": 4390} {"train_loss": -26.06583023071289, "global_step": 364395, "epoch": 4390} {"train_loss": -25.889114379882812, "global_step": 364396, "epoch": 4390} {"train_loss": -26.155384063720703, "global_step": 364397, "epoch": 4390} {"train_loss": -26.38980484008789, "global_step": 364398, "epoch": 4390} {"train_loss": -26.3594913482666, "global_step": 364399, "epoch": 4390} {"train_loss": -26.09844970703125, "global_step": 364400, "epoch": 4390} {"train_loss": -26.253808975219727, "global_step": 364401, "epoch": 4390} {"train_loss": -26.200937271118164, "global_step": 364402, "epoch": 4390} {"train_loss": -26.26289176940918, "global_step": 364403, "epoch": 4390} {"train_loss": -26.4811954498291, "global_step": 364404, "epoch": 4390} {"train_loss": -26.379669189453125, "global_step": 364405, "epoch": 4390} {"train_loss": -26.111007690429688, "global_step": 364406, "epoch": 4390} {"train_loss": -26.13102149963379, "global_step": 364407, "epoch": 4390} {"train_loss": -26.08448600769043, "global_step": 364408, "epoch": 4390} {"train_loss": -26.237821578979492, "global_step": 364409, "epoch": 4390} {"train_loss": -26.262664794921875, "global_step": 364410, "epoch": 4390} {"train_loss": -26.3518123626709, "global_step": 364411, "epoch": 4390} {"train_loss": -26.079452514648438, "global_step": 364412, "epoch": 4390} {"train_loss": -25.487985610961914, "global_step": 364413, "epoch": 4390} {"train_loss": -25.992048263549805, "global_step": 364414, "epoch": 4390} {"train_loss": -25.745328903198242, "global_step": 364415, "epoch": 4390} {"train_loss": -25.17288589477539, "global_step": 364416, "epoch": 4390} {"train_loss": -25.17962646484375, "global_step": 364417, "epoch": 4390} {"train_loss": -25.09674644470215, "global_step": 364418, "epoch": 4390} {"train_loss": -26.365238189697266, "global_step": 364419, "epoch": 4390} {"train_loss": -25.994571685791016, "global_step": 364420, "epoch": 4390} {"train_loss": -25.650365829467773, "global_step": 364421, "epoch": 4390} {"train_loss": -25.94111442565918, "global_step": 364422, "epoch": 4390} {"train_loss": -26.235107421875, "global_step": 364423, "epoch": 4390} {"train_loss": -26.23552894592285, "global_step": 364424, "epoch": 4390} {"train_loss": -26.018386840820312, "global_step": 364425, "epoch": 4390} {"train_loss": -26.17612648010254, "global_step": 364426, "epoch": 4390} {"train_loss": -26.359792709350586, "global_step": 364427, "epoch": 4390} {"train_loss": -26.02084732055664, "global_step": 364428, "epoch": 4390} {"train_loss": -26.502918243408203, "global_step": 364429, "epoch": 4390} {"train_loss": -25.877790451049805, "global_step": 364430, "epoch": 4390} {"train_loss": -26.50555419921875, "global_step": 364431, "epoch": 4390} {"train_loss": -26.680952072143555, "global_step": 364432, "epoch": 4390} {"train_loss": -26.358951568603516, "global_step": 364433, "epoch": 4390} {"train_loss": -26.466962814331055, "global_step": 364434, "epoch": 4390} {"train_loss": -26.252643585205078, "global_step": 364435, "epoch": 4390} {"train_loss": -26.2130184173584, "global_step": 364436, "epoch": 4390} {"train_loss": -25.923480987548828, "global_step": 364437, "epoch": 4390} {"train_loss": -26.291929244995117, "global_step": 364438, "epoch": 4390} {"train_loss": -26.387039184570312, "global_step": 364439, "epoch": 4390} {"train_loss": -26.422149658203125, "global_step": 364440, "epoch": 4390} {"train_loss": -26.31141471862793, "global_step": 364441, "epoch": 4390} {"train_loss": -26.475143432617188, "global_step": 364442, "epoch": 4390} {"train_loss": -26.467731475830078, "global_step": 364443, "epoch": 4390} {"train_loss": -26.312931060791016, "global_step": 364444, "epoch": 4390} {"train_loss": -26.357227325439453, "global_step": 364445, "epoch": 4390} {"train_loss": -25.840307235717773, "global_step": 364446, "epoch": 4390} {"train_loss": -25.164281845092773, "global_step": 364447, "epoch": 4390} {"train_loss": -25.00196647644043, "global_step": 364448, "epoch": 4390} {"train_loss": -25.240522384643555, "global_step": 364449, "epoch": 4390} {"train_loss": -26.593570709228516, "global_step": 364450, "epoch": 4390} {"train_loss": -26.053192138671875, "global_step": 364451, "epoch": 4390} {"train_loss": -26.08015696973686, "global_step": 364452, "epoch": 4390, "val_loss": 6578222.0} {"train_loss": -25.354379653930664, "global_step": 364453, "epoch": 4391} {"train_loss": -25.66255760192871, "global_step": 364454, "epoch": 4391} {"train_loss": -24.754039764404297, "global_step": 364455, "epoch": 4391} {"train_loss": -25.3829345703125, "global_step": 364456, "epoch": 4391} {"train_loss": -25.67234230041504, "global_step": 364457, "epoch": 4391} {"train_loss": -25.29330062866211, "global_step": 364458, "epoch": 4391} {"train_loss": -25.40361785888672, "global_step": 364459, "epoch": 4391} {"train_loss": -25.471290588378906, "global_step": 364460, "epoch": 4391} {"train_loss": -25.887739181518555, "global_step": 364461, "epoch": 4391} {"train_loss": -25.504947662353516, "global_step": 364462, "epoch": 4391} {"train_loss": -25.484357833862305, "global_step": 364463, "epoch": 4391} {"train_loss": -25.66236686706543, "global_step": 364464, "epoch": 4391} {"train_loss": -25.553977966308594, "global_step": 364465, "epoch": 4391} {"train_loss": -25.85548973083496, "global_step": 364466, "epoch": 4391} {"train_loss": -25.546314239501953, "global_step": 364467, "epoch": 4391} {"train_loss": -25.81711769104004, "global_step": 364468, "epoch": 4391} {"train_loss": -25.843719482421875, "global_step": 364469, "epoch": 4391} {"train_loss": -26.002582550048828, "global_step": 364470, "epoch": 4391} {"train_loss": -25.93263053894043, "global_step": 364471, "epoch": 4391} {"train_loss": -25.395797729492188, "global_step": 364472, "epoch": 4391} {"train_loss": -26.219465255737305, "global_step": 364473, "epoch": 4391} {"train_loss": -25.767438888549805, "global_step": 364474, "epoch": 4391} {"train_loss": -25.9050235748291, "global_step": 364475, "epoch": 4391} {"train_loss": -25.62038230895996, "global_step": 364476, "epoch": 4391} {"train_loss": -25.853864669799805, "global_step": 364477, "epoch": 4391} {"train_loss": -26.41512107849121, "global_step": 364478, "epoch": 4391} {"train_loss": -25.774545669555664, "global_step": 364479, "epoch": 4391} {"train_loss": -25.865203857421875, "global_step": 364480, "epoch": 4391} {"train_loss": -26.327306747436523, "global_step": 364481, "epoch": 4391} {"train_loss": -25.972951889038086, "global_step": 364482, "epoch": 4391} {"train_loss": -26.079458236694336, "global_step": 364483, "epoch": 4391} {"train_loss": -26.124155044555664, "global_step": 364484, "epoch": 4391} {"train_loss": -26.290430068969727, "global_step": 364485, "epoch": 4391} {"train_loss": -26.265289306640625, "global_step": 364486, "epoch": 4391} {"train_loss": -26.154165267944336, "global_step": 364487, "epoch": 4391} {"train_loss": -26.0292911529541, "global_step": 364488, "epoch": 4391} {"train_loss": -26.623096466064453, "global_step": 364489, "epoch": 4391} {"train_loss": -26.226232528686523, "global_step": 364490, "epoch": 4391} {"train_loss": -26.0161190032959, "global_step": 364491, "epoch": 4391} {"train_loss": -26.186904907226562, "global_step": 364492, "epoch": 4391} {"train_loss": -26.228595733642578, "global_step": 364493, "epoch": 4391} {"train_loss": -26.417724609375, "global_step": 364494, "epoch": 4391} {"train_loss": -26.39740562438965, "global_step": 364495, "epoch": 4391} {"train_loss": -26.56097984313965, "global_step": 364496, "epoch": 4391} {"train_loss": -26.7307071685791, "global_step": 364497, "epoch": 4391} {"train_loss": -26.682260513305664, "global_step": 364498, "epoch": 4391} {"train_loss": -26.3674373626709, "global_step": 364499, "epoch": 4391} {"train_loss": -26.58216667175293, "global_step": 364500, "epoch": 4391} {"train_loss": -26.4548397064209, "global_step": 364501, "epoch": 4391} {"train_loss": -26.453378677368164, "global_step": 364502, "epoch": 4391} {"train_loss": -26.580224990844727, "global_step": 364503, "epoch": 4391} {"train_loss": -26.201404571533203, "global_step": 364504, "epoch": 4391} {"train_loss": -26.490095138549805, "global_step": 364505, "epoch": 4391} {"train_loss": -26.60101890563965, "global_step": 364506, "epoch": 4391} {"train_loss": -26.537174224853516, "global_step": 364507, "epoch": 4391} {"train_loss": -26.124311447143555, "global_step": 364508, "epoch": 4391} {"train_loss": -26.338830947875977, "global_step": 364509, "epoch": 4391} {"train_loss": -26.254840850830078, "global_step": 364510, "epoch": 4391} {"train_loss": -26.997955322265625, "global_step": 364511, "epoch": 4391} {"train_loss": -26.351001739501953, "global_step": 364512, "epoch": 4391} {"train_loss": -26.10206413269043, "global_step": 364513, "epoch": 4391} {"train_loss": -26.296072006225586, "global_step": 364514, "epoch": 4391} {"train_loss": -26.337743759155273, "global_step": 364515, "epoch": 4391} {"train_loss": -26.167999267578125, "global_step": 364516, "epoch": 4391} {"train_loss": -26.21685791015625, "global_step": 364517, "epoch": 4391} {"train_loss": -26.16693687438965, "global_step": 364518, "epoch": 4391} {"train_loss": -26.49659538269043, "global_step": 364519, "epoch": 4391} {"train_loss": -26.633176803588867, "global_step": 364520, "epoch": 4391} {"train_loss": -25.930871963500977, "global_step": 364521, "epoch": 4391} {"train_loss": -26.307397842407227, "global_step": 364522, "epoch": 4391} {"train_loss": -26.0996150970459, "global_step": 364523, "epoch": 4391} {"train_loss": -26.263410568237305, "global_step": 364524, "epoch": 4391} {"train_loss": -26.432409286499023, "global_step": 364525, "epoch": 4391} {"train_loss": -26.184402465820312, "global_step": 364526, "epoch": 4391} {"train_loss": -26.15789794921875, "global_step": 364527, "epoch": 4391} {"train_loss": -26.337793350219727, "global_step": 364528, "epoch": 4391} {"train_loss": -26.394800186157227, "global_step": 364529, "epoch": 4391} {"train_loss": -26.08310317993164, "global_step": 364530, "epoch": 4391} {"train_loss": -26.012903213500977, "global_step": 364531, "epoch": 4391} {"train_loss": -26.0511531829834, "global_step": 364532, "epoch": 4391} {"train_loss": -26.35188102722168, "global_step": 364533, "epoch": 4391} {"train_loss": -26.467041015625, "global_step": 364534, "epoch": 4391} {"train_loss": -26.10532585971327, "global_step": 364535, "epoch": 4391, "val_loss": 6639571.0} {"train_loss": -24.650798797607422, "global_step": 364536, "epoch": 4392} {"train_loss": -25.67042350769043, "global_step": 364537, "epoch": 4392} {"train_loss": -25.728612899780273, "global_step": 364538, "epoch": 4392} {"train_loss": -25.9094295501709, "global_step": 364539, "epoch": 4392} {"train_loss": -25.36724853515625, "global_step": 364540, "epoch": 4392} {"train_loss": -25.37879753112793, "global_step": 364541, "epoch": 4392} {"train_loss": -25.5985050201416, "global_step": 364542, "epoch": 4392} {"train_loss": -25.5684757232666, "global_step": 364543, "epoch": 4392} {"train_loss": -24.97907829284668, "global_step": 364544, "epoch": 4392} {"train_loss": -26.178220748901367, "global_step": 364545, "epoch": 4392} {"train_loss": -25.262653350830078, "global_step": 364546, "epoch": 4392} {"train_loss": -25.604644775390625, "global_step": 364547, "epoch": 4392} {"train_loss": -26.316497802734375, "global_step": 364548, "epoch": 4392} {"train_loss": -25.618436813354492, "global_step": 364549, "epoch": 4392} {"train_loss": -25.4379825592041, "global_step": 364550, "epoch": 4392} {"train_loss": -25.91153335571289, "global_step": 364551, "epoch": 4392} {"train_loss": -25.76409912109375, "global_step": 364552, "epoch": 4392} {"train_loss": -25.942096710205078, "global_step": 364553, "epoch": 4392} {"train_loss": -25.496564865112305, "global_step": 364554, "epoch": 4392} {"train_loss": -25.986867904663086, "global_step": 364555, "epoch": 4392} {"train_loss": -25.870004653930664, "global_step": 364556, "epoch": 4392} {"train_loss": -25.960376739501953, "global_step": 364557, "epoch": 4392} {"train_loss": -26.24757957458496, "global_step": 364558, "epoch": 4392} {"train_loss": -25.998443603515625, "global_step": 364559, "epoch": 4392} {"train_loss": -26.3786678314209, "global_step": 364560, "epoch": 4392} {"train_loss": -25.948455810546875, "global_step": 364561, "epoch": 4392} {"train_loss": -26.137969970703125, "global_step": 364562, "epoch": 4392} {"train_loss": -26.07102394104004, "global_step": 364563, "epoch": 4392} {"train_loss": -26.098712921142578, "global_step": 364564, "epoch": 4392} {"train_loss": -26.282888412475586, "global_step": 364565, "epoch": 4392} {"train_loss": -26.260385513305664, "global_step": 364566, "epoch": 4392} {"train_loss": -26.403289794921875, "global_step": 364567, "epoch": 4392} {"train_loss": -26.069477081298828, "global_step": 364568, "epoch": 4392} {"train_loss": -26.449787139892578, "global_step": 364569, "epoch": 4392} {"train_loss": -26.341094970703125, "global_step": 364570, "epoch": 4392} {"train_loss": -26.224517822265625, "global_step": 364571, "epoch": 4392} {"train_loss": -26.447677612304688, "global_step": 364572, "epoch": 4392} {"train_loss": -25.979022979736328, "global_step": 364573, "epoch": 4392} {"train_loss": -26.274677276611328, "global_step": 364574, "epoch": 4392} {"train_loss": -26.519378662109375, "global_step": 364575, "epoch": 4392} {"train_loss": -26.390783309936523, "global_step": 364576, "epoch": 4392} {"train_loss": -26.226032257080078, "global_step": 364577, "epoch": 4392} {"train_loss": -26.36517333984375, "global_step": 364578, "epoch": 4392} {"train_loss": -26.087575912475586, "global_step": 364579, "epoch": 4392} {"train_loss": -25.96097183227539, "global_step": 364580, "epoch": 4392} {"train_loss": -26.18622398376465, "global_step": 364581, "epoch": 4392} {"train_loss": -26.09181785583496, "global_step": 364582, "epoch": 4392} {"train_loss": -26.521484375, "global_step": 364583, "epoch": 4392} {"train_loss": -26.5352783203125, "global_step": 364584, "epoch": 4392} {"train_loss": -26.30414390563965, "global_step": 364585, "epoch": 4392} {"train_loss": -26.318159103393555, "global_step": 364586, "epoch": 4392} {"train_loss": -26.17685890197754, "global_step": 364587, "epoch": 4392} {"train_loss": -26.141096115112305, "global_step": 364588, "epoch": 4392} {"train_loss": -26.143537521362305, "global_step": 364589, "epoch": 4392} {"train_loss": -26.42677116394043, "global_step": 364590, "epoch": 4392} {"train_loss": -26.567703247070312, "global_step": 364591, "epoch": 4392} {"train_loss": -26.536375045776367, "global_step": 364592, "epoch": 4392} {"train_loss": -26.10003662109375, "global_step": 364593, "epoch": 4392} {"train_loss": -26.392541885375977, "global_step": 364594, "epoch": 4392} {"train_loss": -26.105667114257812, "global_step": 364595, "epoch": 4392} {"train_loss": -26.230722427368164, "global_step": 364596, "epoch": 4392} {"train_loss": -26.39896583557129, "global_step": 364597, "epoch": 4392} {"train_loss": -25.9913387298584, "global_step": 364598, "epoch": 4392} {"train_loss": -26.566791534423828, "global_step": 364599, "epoch": 4392} {"train_loss": -26.246633529663086, "global_step": 364600, "epoch": 4392} {"train_loss": -26.7183837890625, "global_step": 364601, "epoch": 4392} {"train_loss": -26.23768424987793, "global_step": 364602, "epoch": 4392} {"train_loss": -26.223608016967773, "global_step": 364603, "epoch": 4392} {"train_loss": -26.43463706970215, "global_step": 364604, "epoch": 4392} {"train_loss": -26.212726593017578, "global_step": 364605, "epoch": 4392} {"train_loss": -26.070295333862305, "global_step": 364606, "epoch": 4392} {"train_loss": -26.22647476196289, "global_step": 364607, "epoch": 4392} {"train_loss": -26.392709732055664, "global_step": 364608, "epoch": 4392} {"train_loss": -26.302175521850586, "global_step": 364609, "epoch": 4392} {"train_loss": -26.204593658447266, "global_step": 364610, "epoch": 4392} {"train_loss": -26.403385162353516, "global_step": 364611, "epoch": 4392} {"train_loss": -26.563196182250977, "global_step": 364612, "epoch": 4392} {"train_loss": -25.99610710144043, "global_step": 364613, "epoch": 4392} {"train_loss": -26.42972183227539, "global_step": 364614, "epoch": 4392} {"train_loss": -26.1028995513916, "global_step": 364615, "epoch": 4392} {"train_loss": -26.27411460876465, "global_step": 364616, "epoch": 4392} {"train_loss": -26.43841552734375, "global_step": 364617, "epoch": 4392} {"train_loss": -26.100235766675098, "global_step": 364618, "epoch": 4392, "val_loss": 6563771.5} {"train_loss": -26.280567169189453, "global_step": 364619, "epoch": 4393} {"train_loss": -26.14021873474121, "global_step": 364620, "epoch": 4393} {"train_loss": -26.132415771484375, "global_step": 364621, "epoch": 4393} {"train_loss": -25.950397491455078, "global_step": 364622, "epoch": 4393} {"train_loss": -26.176725387573242, "global_step": 364623, "epoch": 4393} {"train_loss": -26.295551300048828, "global_step": 364624, "epoch": 4393} {"train_loss": -25.88412857055664, "global_step": 364625, "epoch": 4393} {"train_loss": -26.093902587890625, "global_step": 364626, "epoch": 4393} {"train_loss": -26.205368041992188, "global_step": 364627, "epoch": 4393} {"train_loss": -26.085538864135742, "global_step": 364628, "epoch": 4393} {"train_loss": -26.352529525756836, "global_step": 364629, "epoch": 4393} {"train_loss": -26.178730010986328, "global_step": 364630, "epoch": 4393} {"train_loss": -25.879623413085938, "global_step": 364631, "epoch": 4393} {"train_loss": -26.438276290893555, "global_step": 364632, "epoch": 4393} {"train_loss": -25.8878231048584, "global_step": 364633, "epoch": 4393} {"train_loss": -26.428747177124023, "global_step": 364634, "epoch": 4393} {"train_loss": -26.1882381439209, "global_step": 364635, "epoch": 4393} {"train_loss": -25.95106315612793, "global_step": 364636, "epoch": 4393} {"train_loss": -26.16596031188965, "global_step": 364637, "epoch": 4393} {"train_loss": -26.350406646728516, "global_step": 364638, "epoch": 4393} {"train_loss": -26.152509689331055, "global_step": 364639, "epoch": 4393} {"train_loss": -26.6098575592041, "global_step": 364640, "epoch": 4393} {"train_loss": -26.646787643432617, "global_step": 364641, "epoch": 4393} {"train_loss": -26.537689208984375, "global_step": 364642, "epoch": 4393} {"train_loss": -26.134366989135742, "global_step": 364643, "epoch": 4393} {"train_loss": -26.142934799194336, "global_step": 364644, "epoch": 4393} {"train_loss": -26.327377319335938, "global_step": 364645, "epoch": 4393} {"train_loss": -26.3527889251709, "global_step": 364646, "epoch": 4393} {"train_loss": -26.24379539489746, "global_step": 364647, "epoch": 4393} {"train_loss": -26.660308837890625, "global_step": 364648, "epoch": 4393} {"train_loss": -26.558298110961914, "global_step": 364649, "epoch": 4393} {"train_loss": -26.080249786376953, "global_step": 364650, "epoch": 4393} {"train_loss": -26.31085777282715, "global_step": 364651, "epoch": 4393} {"train_loss": -26.232336044311523, "global_step": 364652, "epoch": 4393} {"train_loss": -26.399438858032227, "global_step": 364653, "epoch": 4393} {"train_loss": -26.429330825805664, "global_step": 364654, "epoch": 4393} {"train_loss": -26.01532554626465, "global_step": 364655, "epoch": 4393} {"train_loss": -26.25728416442871, "global_step": 364656, "epoch": 4393} {"train_loss": -26.182111740112305, "global_step": 364657, "epoch": 4393} {"train_loss": -26.021162033081055, "global_step": 364658, "epoch": 4393} {"train_loss": -26.52735710144043, "global_step": 364659, "epoch": 4393} {"train_loss": -26.3978214263916, "global_step": 364660, "epoch": 4393} {"train_loss": -26.21101951599121, "global_step": 364661, "epoch": 4393} {"train_loss": -25.90106201171875, "global_step": 364662, "epoch": 4393} {"train_loss": -26.13128662109375, "global_step": 364663, "epoch": 4393} {"train_loss": -25.979001998901367, "global_step": 364664, "epoch": 4393} {"train_loss": -26.303176879882812, "global_step": 364665, "epoch": 4393} {"train_loss": -26.169931411743164, "global_step": 364666, "epoch": 4393} {"train_loss": -26.463775634765625, "global_step": 364667, "epoch": 4393} {"train_loss": -26.455427169799805, "global_step": 364668, "epoch": 4393} {"train_loss": -26.34119987487793, "global_step": 364669, "epoch": 4393} {"train_loss": -26.702924728393555, "global_step": 364670, "epoch": 4393} {"train_loss": -26.54974937438965, "global_step": 364671, "epoch": 4393} {"train_loss": -26.441299438476562, "global_step": 364672, "epoch": 4393} {"train_loss": -25.96748161315918, "global_step": 364673, "epoch": 4393} {"train_loss": -26.5378475189209, "global_step": 364674, "epoch": 4393} {"train_loss": -26.134824752807617, "global_step": 364675, "epoch": 4393} {"train_loss": -26.447050094604492, "global_step": 364676, "epoch": 4393} {"train_loss": -26.252227783203125, "global_step": 364677, "epoch": 4393} {"train_loss": -26.494104385375977, "global_step": 364678, "epoch": 4393} {"train_loss": -26.11687660217285, "global_step": 364679, "epoch": 4393} {"train_loss": -26.376428604125977, "global_step": 364680, "epoch": 4393} {"train_loss": -26.548669815063477, "global_step": 364681, "epoch": 4393} {"train_loss": -26.391199111938477, "global_step": 364682, "epoch": 4393} {"train_loss": -26.373632431030273, "global_step": 364683, "epoch": 4393} {"train_loss": -26.338836669921875, "global_step": 364684, "epoch": 4393} {"train_loss": -26.442869186401367, "global_step": 364685, "epoch": 4393} {"train_loss": -26.591032028198242, "global_step": 364686, "epoch": 4393} {"train_loss": -26.563562393188477, "global_step": 364687, "epoch": 4393} {"train_loss": -26.445158004760742, "global_step": 364688, "epoch": 4393} {"train_loss": -26.430158615112305, "global_step": 364689, "epoch": 4393} {"train_loss": -26.702173233032227, "global_step": 364690, "epoch": 4393} {"train_loss": -26.494016647338867, "global_step": 364691, "epoch": 4393} {"train_loss": -26.177093505859375, "global_step": 364692, "epoch": 4393} {"train_loss": -26.53733253479004, "global_step": 364693, "epoch": 4393} {"train_loss": -26.686614990234375, "global_step": 364694, "epoch": 4393} {"train_loss": -26.4637393951416, "global_step": 364695, "epoch": 4393} {"train_loss": -26.62395668029785, "global_step": 364696, "epoch": 4393} {"train_loss": -26.236652374267578, "global_step": 364697, "epoch": 4393} {"train_loss": -26.443281173706055, "global_step": 364698, "epoch": 4393} {"train_loss": -26.048376083374023, "global_step": 364699, "epoch": 4393} {"train_loss": -26.219024658203125, "global_step": 364700, "epoch": 4393} {"train_loss": -26.305819408003106, "global_step": 364701, "epoch": 4393, "val_loss": 6707749.5} {"train_loss": -24.38033676147461, "global_step": 364702, "epoch": 4394} {"train_loss": -23.699247360229492, "global_step": 364703, "epoch": 4394} {"train_loss": -24.99416732788086, "global_step": 364704, "epoch": 4394} {"train_loss": -24.708438873291016, "global_step": 364705, "epoch": 4394} {"train_loss": -25.026723861694336, "global_step": 364706, "epoch": 4394} {"train_loss": -25.655609130859375, "global_step": 364707, "epoch": 4394} {"train_loss": -25.54007339477539, "global_step": 364708, "epoch": 4394} {"train_loss": -25.301610946655273, "global_step": 364709, "epoch": 4394} {"train_loss": -25.6641902923584, "global_step": 364710, "epoch": 4394} {"train_loss": -25.199499130249023, "global_step": 364711, "epoch": 4394} {"train_loss": -25.519241333007812, "global_step": 364712, "epoch": 4394} {"train_loss": -25.229209899902344, "global_step": 364713, "epoch": 4394} {"train_loss": -25.464536666870117, "global_step": 364714, "epoch": 4394} {"train_loss": -25.599822998046875, "global_step": 364715, "epoch": 4394} {"train_loss": -25.60184669494629, "global_step": 364716, "epoch": 4394} {"train_loss": -25.563852310180664, "global_step": 364717, "epoch": 4394} {"train_loss": -25.92756462097168, "global_step": 364718, "epoch": 4394} {"train_loss": -25.866790771484375, "global_step": 364719, "epoch": 4394} {"train_loss": -25.986175537109375, "global_step": 364720, "epoch": 4394} {"train_loss": -26.0565185546875, "global_step": 364721, "epoch": 4394} {"train_loss": -25.937915802001953, "global_step": 364722, "epoch": 4394} {"train_loss": -26.13153076171875, "global_step": 364723, "epoch": 4394} {"train_loss": -25.45113182067871, "global_step": 364724, "epoch": 4394} {"train_loss": -25.9925537109375, "global_step": 364725, "epoch": 4394} {"train_loss": -26.169904708862305, "global_step": 364726, "epoch": 4394} {"train_loss": -26.32345962524414, "global_step": 364727, "epoch": 4394} {"train_loss": -26.19964599609375, "global_step": 364728, "epoch": 4394} {"train_loss": -25.889062881469727, "global_step": 364729, "epoch": 4394} {"train_loss": -26.08990478515625, "global_step": 364730, "epoch": 4394} {"train_loss": -25.930078506469727, "global_step": 364731, "epoch": 4394} {"train_loss": -26.036163330078125, "global_step": 364732, "epoch": 4394} {"train_loss": -26.12798500061035, "global_step": 364733, "epoch": 4394} {"train_loss": -26.346059799194336, "global_step": 364734, "epoch": 4394} {"train_loss": -26.120044708251953, "global_step": 364735, "epoch": 4394} {"train_loss": -25.965490341186523, "global_step": 364736, "epoch": 4394} {"train_loss": -26.2724666595459, "global_step": 364737, "epoch": 4394} {"train_loss": -26.233051300048828, "global_step": 364738, "epoch": 4394} {"train_loss": -26.053922653198242, "global_step": 364739, "epoch": 4394} {"train_loss": -26.359342575073242, "global_step": 364740, "epoch": 4394} {"train_loss": -26.211841583251953, "global_step": 364741, "epoch": 4394} {"train_loss": -26.12237548828125, "global_step": 364742, "epoch": 4394} {"train_loss": -26.201190948486328, "global_step": 364743, "epoch": 4394} {"train_loss": -26.171899795532227, "global_step": 364744, "epoch": 4394} {"train_loss": -26.387256622314453, "global_step": 364745, "epoch": 4394} {"train_loss": -26.140243530273438, "global_step": 364746, "epoch": 4394} {"train_loss": -25.955158233642578, "global_step": 364747, "epoch": 4394} {"train_loss": -26.408512115478516, "global_step": 364748, "epoch": 4394} {"train_loss": -26.6345272064209, "global_step": 364749, "epoch": 4394} {"train_loss": -26.72749137878418, "global_step": 364750, "epoch": 4394} {"train_loss": -26.607879638671875, "global_step": 364751, "epoch": 4394} {"train_loss": -26.53127098083496, "global_step": 364752, "epoch": 4394} {"train_loss": -26.78240966796875, "global_step": 364753, "epoch": 4394} {"train_loss": -26.492435455322266, "global_step": 364754, "epoch": 4394} {"train_loss": -26.7591609954834, "global_step": 364755, "epoch": 4394} {"train_loss": -26.28740882873535, "global_step": 364756, "epoch": 4394} {"train_loss": -26.42731285095215, "global_step": 364757, "epoch": 4394} {"train_loss": -26.071928024291992, "global_step": 364758, "epoch": 4394} {"train_loss": -26.3538875579834, "global_step": 364759, "epoch": 4394} {"train_loss": -26.437524795532227, "global_step": 364760, "epoch": 4394} {"train_loss": -26.1484317779541, "global_step": 364761, "epoch": 4394} {"train_loss": -26.65559196472168, "global_step": 364762, "epoch": 4394} {"train_loss": -26.274473190307617, "global_step": 364763, "epoch": 4394} {"train_loss": -25.947996139526367, "global_step": 364764, "epoch": 4394} {"train_loss": -26.209848403930664, "global_step": 364765, "epoch": 4394} {"train_loss": -26.304187774658203, "global_step": 364766, "epoch": 4394} {"train_loss": -26.2700252532959, "global_step": 364767, "epoch": 4394} {"train_loss": -26.255029678344727, "global_step": 364768, "epoch": 4394} {"train_loss": -26.337080001831055, "global_step": 364769, "epoch": 4394} {"train_loss": -26.579858779907227, "global_step": 364770, "epoch": 4394} {"train_loss": -26.298629760742188, "global_step": 364771, "epoch": 4394} {"train_loss": -25.963525772094727, "global_step": 364772, "epoch": 4394} {"train_loss": -25.912311553955078, "global_step": 364773, "epoch": 4394} {"train_loss": -26.27729606628418, "global_step": 364774, "epoch": 4394} {"train_loss": -26.19060707092285, "global_step": 364775, "epoch": 4394} {"train_loss": -25.91643714904785, "global_step": 364776, "epoch": 4394} {"train_loss": -26.329980850219727, "global_step": 364777, "epoch": 4394} {"train_loss": -26.36090087890625, "global_step": 364778, "epoch": 4394} {"train_loss": -26.048986434936523, "global_step": 364779, "epoch": 4394} {"train_loss": -26.404977798461914, "global_step": 364780, "epoch": 4394} {"train_loss": -26.651594161987305, "global_step": 364781, "epoch": 4394} {"train_loss": -25.974658966064453, "global_step": 364782, "epoch": 4394} {"train_loss": -26.32032585144043, "global_step": 364783, "epoch": 4394} {"train_loss": -25.9993352085711, "global_step": 364784, "epoch": 4394, "val_loss": 6555440.0} {"train_loss": -26.31583595275879, "global_step": 364785, "epoch": 4395} {"train_loss": -25.6589412689209, "global_step": 364786, "epoch": 4395} {"train_loss": -25.34684181213379, "global_step": 364787, "epoch": 4395} {"train_loss": -25.82513427734375, "global_step": 364788, "epoch": 4395} {"train_loss": -25.61094093322754, "global_step": 364789, "epoch": 4395} {"train_loss": -25.581493377685547, "global_step": 364790, "epoch": 4395} {"train_loss": -25.852142333984375, "global_step": 364791, "epoch": 4395} {"train_loss": -26.15036392211914, "global_step": 364792, "epoch": 4395} {"train_loss": -26.1444034576416, "global_step": 364793, "epoch": 4395} {"train_loss": -26.020471572875977, "global_step": 364794, "epoch": 4395} {"train_loss": -26.050992965698242, "global_step": 364795, "epoch": 4395} {"train_loss": -26.092824935913086, "global_step": 364796, "epoch": 4395} {"train_loss": -26.063602447509766, "global_step": 364797, "epoch": 4395} {"train_loss": -26.155384063720703, "global_step": 364798, "epoch": 4395} {"train_loss": -25.843297958374023, "global_step": 364799, "epoch": 4395} {"train_loss": -25.983509063720703, "global_step": 364800, "epoch": 4395} {"train_loss": -25.979480743408203, "global_step": 364801, "epoch": 4395} {"train_loss": -26.23223304748535, "global_step": 364802, "epoch": 4395} {"train_loss": -26.155109405517578, "global_step": 364803, "epoch": 4395} {"train_loss": -26.579809188842773, "global_step": 364804, "epoch": 4395} {"train_loss": -26.171833038330078, "global_step": 364805, "epoch": 4395} {"train_loss": -26.11475944519043, "global_step": 364806, "epoch": 4395} {"train_loss": -26.376928329467773, "global_step": 364807, "epoch": 4395} {"train_loss": -26.349905014038086, "global_step": 364808, "epoch": 4395} {"train_loss": -26.04988670349121, "global_step": 364809, "epoch": 4395} {"train_loss": -26.210779190063477, "global_step": 364810, "epoch": 4395} {"train_loss": -26.460241317749023, "global_step": 364811, "epoch": 4395} {"train_loss": -26.331562042236328, "global_step": 364812, "epoch": 4395} {"train_loss": -26.54303550720215, "global_step": 364813, "epoch": 4395} {"train_loss": -26.484619140625, "global_step": 364814, "epoch": 4395} {"train_loss": -26.397321701049805, "global_step": 364815, "epoch": 4395} {"train_loss": -26.43763542175293, "global_step": 364816, "epoch": 4395} {"train_loss": -26.282934188842773, "global_step": 364817, "epoch": 4395} {"train_loss": -26.19199562072754, "global_step": 364818, "epoch": 4395} {"train_loss": -26.30224609375, "global_step": 364819, "epoch": 4395} {"train_loss": -26.246795654296875, "global_step": 364820, "epoch": 4395} {"train_loss": -26.515249252319336, "global_step": 364821, "epoch": 4395} {"train_loss": -26.135522842407227, "global_step": 364822, "epoch": 4395} {"train_loss": -26.694726943969727, "global_step": 364823, "epoch": 4395} {"train_loss": -26.428028106689453, "global_step": 364824, "epoch": 4395} {"train_loss": -26.138782501220703, "global_step": 364825, "epoch": 4395} {"train_loss": -26.49332046508789, "global_step": 364826, "epoch": 4395} {"train_loss": -26.679128646850586, "global_step": 364827, "epoch": 4395} {"train_loss": -26.390165328979492, "global_step": 364828, "epoch": 4395} {"train_loss": -26.63652992248535, "global_step": 364829, "epoch": 4395} {"train_loss": -26.656667709350586, "global_step": 364830, "epoch": 4395} {"train_loss": -26.469568252563477, "global_step": 364831, "epoch": 4395} {"train_loss": -26.357568740844727, "global_step": 364832, "epoch": 4395} {"train_loss": -26.18865394592285, "global_step": 364833, "epoch": 4395} {"train_loss": -26.222028732299805, "global_step": 364834, "epoch": 4395} {"train_loss": -26.1077880859375, "global_step": 364835, "epoch": 4395} {"train_loss": -26.73138427734375, "global_step": 364836, "epoch": 4395} {"train_loss": -26.095783233642578, "global_step": 364837, "epoch": 4395} {"train_loss": -26.161834716796875, "global_step": 364838, "epoch": 4395} {"train_loss": -26.349624633789062, "global_step": 364839, "epoch": 4395} {"train_loss": -26.387853622436523, "global_step": 364840, "epoch": 4395} {"train_loss": -26.788742065429688, "global_step": 364841, "epoch": 4395} {"train_loss": -26.405176162719727, "global_step": 364842, "epoch": 4395} {"train_loss": -26.145801544189453, "global_step": 364843, "epoch": 4395} {"train_loss": -26.594762802124023, "global_step": 364844, "epoch": 4395} {"train_loss": -26.160888671875, "global_step": 364845, "epoch": 4395} {"train_loss": -26.56696891784668, "global_step": 364846, "epoch": 4395} {"train_loss": -26.123971939086914, "global_step": 364847, "epoch": 4395} {"train_loss": -26.233417510986328, "global_step": 364848, "epoch": 4395} {"train_loss": -26.45770263671875, "global_step": 364849, "epoch": 4395} {"train_loss": -26.2436580657959, "global_step": 364850, "epoch": 4395} {"train_loss": -26.384286880493164, "global_step": 364851, "epoch": 4395} {"train_loss": -26.07489013671875, "global_step": 364852, "epoch": 4395} {"train_loss": -26.29990005493164, "global_step": 364853, "epoch": 4395} {"train_loss": -26.7186336517334, "global_step": 364854, "epoch": 4395} {"train_loss": -26.0495662689209, "global_step": 364855, "epoch": 4395} {"train_loss": -26.173303604125977, "global_step": 364856, "epoch": 4395} {"train_loss": -26.40081787109375, "global_step": 364857, "epoch": 4395} {"train_loss": -26.24700355529785, "global_step": 364858, "epoch": 4395} {"train_loss": -25.928319931030273, "global_step": 364859, "epoch": 4395} {"train_loss": -26.362274169921875, "global_step": 364860, "epoch": 4395} {"train_loss": -26.513410568237305, "global_step": 364861, "epoch": 4395} {"train_loss": -25.941076278686523, "global_step": 364862, "epoch": 4395} {"train_loss": -26.5445613861084, "global_step": 364863, "epoch": 4395} {"train_loss": -26.20517921447754, "global_step": 364864, "epoch": 4395} {"train_loss": -26.19807243347168, "global_step": 364865, "epoch": 4395} {"train_loss": -26.122272491455078, "global_step": 364866, "epoch": 4395} {"train_loss": -26.24579790414098, "global_step": 364867, "epoch": 4395, "val_loss": 6768265.0} {"train_loss": -25.02391242980957, "global_step": 364868, "epoch": 4396} {"train_loss": -25.08061981201172, "global_step": 364869, "epoch": 4396} {"train_loss": -25.267465591430664, "global_step": 364870, "epoch": 4396} {"train_loss": -25.00117301940918, "global_step": 364871, "epoch": 4396} {"train_loss": -25.35065269470215, "global_step": 364872, "epoch": 4396} {"train_loss": -25.236312866210938, "global_step": 364873, "epoch": 4396} {"train_loss": -24.573944091796875, "global_step": 364874, "epoch": 4396} {"train_loss": -25.813735961914062, "global_step": 364875, "epoch": 4396} {"train_loss": -25.069656372070312, "global_step": 364876, "epoch": 4396} {"train_loss": -25.245046615600586, "global_step": 364877, "epoch": 4396} {"train_loss": -25.242834091186523, "global_step": 364878, "epoch": 4396} {"train_loss": -25.569473266601562, "global_step": 364879, "epoch": 4396} {"train_loss": -25.00935935974121, "global_step": 364880, "epoch": 4396} {"train_loss": -25.524808883666992, "global_step": 364881, "epoch": 4396} {"train_loss": -25.131399154663086, "global_step": 364882, "epoch": 4396} {"train_loss": -25.107213973999023, "global_step": 364883, "epoch": 4396} {"train_loss": -25.882802963256836, "global_step": 364884, "epoch": 4396} {"train_loss": -25.31390953063965, "global_step": 364885, "epoch": 4396} {"train_loss": -25.71027946472168, "global_step": 364886, "epoch": 4396} {"train_loss": -25.743444442749023, "global_step": 364887, "epoch": 4396} {"train_loss": -25.60011100769043, "global_step": 364888, "epoch": 4396} {"train_loss": -25.590253829956055, "global_step": 364889, "epoch": 4396} {"train_loss": -25.620344161987305, "global_step": 364890, "epoch": 4396} {"train_loss": -25.8853759765625, "global_step": 364891, "epoch": 4396} {"train_loss": -26.110708236694336, "global_step": 364892, "epoch": 4396} {"train_loss": -25.453962326049805, "global_step": 364893, "epoch": 4396} {"train_loss": -25.774921417236328, "global_step": 364894, "epoch": 4396} {"train_loss": -25.922948837280273, "global_step": 364895, "epoch": 4396} {"train_loss": -25.820404052734375, "global_step": 364896, "epoch": 4396} {"train_loss": -26.050989151000977, "global_step": 364897, "epoch": 4396} {"train_loss": -25.991674423217773, "global_step": 364898, "epoch": 4396} {"train_loss": -26.169483184814453, "global_step": 364899, "epoch": 4396} {"train_loss": -26.349546432495117, "global_step": 364900, "epoch": 4396} {"train_loss": -26.163007736206055, "global_step": 364901, "epoch": 4396} {"train_loss": -26.412322998046875, "global_step": 364902, "epoch": 4396} {"train_loss": -26.43916893005371, "global_step": 364903, "epoch": 4396} {"train_loss": -26.035205841064453, "global_step": 364904, "epoch": 4396} {"train_loss": -26.078699111938477, "global_step": 364905, "epoch": 4396} {"train_loss": -26.73780632019043, "global_step": 364906, "epoch": 4396} {"train_loss": -26.067182540893555, "global_step": 364907, "epoch": 4396} {"train_loss": -26.318769454956055, "global_step": 364908, "epoch": 4396} {"train_loss": -26.11012077331543, "global_step": 364909, "epoch": 4396} {"train_loss": -26.38319206237793, "global_step": 364910, "epoch": 4396} {"train_loss": -26.1330509185791, "global_step": 364911, "epoch": 4396} {"train_loss": -26.306562423706055, "global_step": 364912, "epoch": 4396} {"train_loss": -26.084890365600586, "global_step": 364913, "epoch": 4396} {"train_loss": -25.98444175720215, "global_step": 364914, "epoch": 4396} {"train_loss": -26.34307289123535, "global_step": 364915, "epoch": 4396} {"train_loss": -26.57425880432129, "global_step": 364916, "epoch": 4396} {"train_loss": -26.32095718383789, "global_step": 364917, "epoch": 4396} {"train_loss": -26.27923011779785, "global_step": 364918, "epoch": 4396} {"train_loss": -26.434268951416016, "global_step": 364919, "epoch": 4396} {"train_loss": -26.300048828125, "global_step": 364920, "epoch": 4396} {"train_loss": -26.652307510375977, "global_step": 364921, "epoch": 4396} {"train_loss": -26.502084732055664, "global_step": 364922, "epoch": 4396} {"train_loss": -26.36480712890625, "global_step": 364923, "epoch": 4396} {"train_loss": -26.478673934936523, "global_step": 364924, "epoch": 4396} {"train_loss": -26.412261962890625, "global_step": 364925, "epoch": 4396} {"train_loss": -26.544958114624023, "global_step": 364926, "epoch": 4396} {"train_loss": -26.427276611328125, "global_step": 364927, "epoch": 4396} {"train_loss": -26.31892967224121, "global_step": 364928, "epoch": 4396} {"train_loss": -26.788793563842773, "global_step": 364929, "epoch": 4396} {"train_loss": -26.50978660583496, "global_step": 364930, "epoch": 4396} {"train_loss": -26.55158805847168, "global_step": 364931, "epoch": 4396} {"train_loss": -26.567081451416016, "global_step": 364932, "epoch": 4396} {"train_loss": -26.431427001953125, "global_step": 364933, "epoch": 4396} {"train_loss": -26.529211044311523, "global_step": 364934, "epoch": 4396} {"train_loss": -26.648645401000977, "global_step": 364935, "epoch": 4396} {"train_loss": -26.779748916625977, "global_step": 364936, "epoch": 4396} {"train_loss": -26.446691513061523, "global_step": 364937, "epoch": 4396} {"train_loss": -26.024290084838867, "global_step": 364938, "epoch": 4396} {"train_loss": -26.790983200073242, "global_step": 364939, "epoch": 4396} {"train_loss": -26.458850860595703, "global_step": 364940, "epoch": 4396} {"train_loss": -26.367755889892578, "global_step": 364941, "epoch": 4396} {"train_loss": -26.675312042236328, "global_step": 364942, "epoch": 4396} {"train_loss": -26.430139541625977, "global_step": 364943, "epoch": 4396} {"train_loss": -26.0175838470459, "global_step": 364944, "epoch": 4396} {"train_loss": -25.8717098236084, "global_step": 364945, "epoch": 4396} {"train_loss": -26.001510620117188, "global_step": 364946, "epoch": 4396} {"train_loss": -25.73187255859375, "global_step": 364947, "epoch": 4396} {"train_loss": -25.975309371948242, "global_step": 364948, "epoch": 4396} {"train_loss": -26.276447296142578, "global_step": 364949, "epoch": 4396} {"train_loss": -26.00679576827819, "global_step": 364950, "epoch": 4396, "val_loss": 6549991.0} {"train_loss": -25.64491081237793, "global_step": 364951, "epoch": 4397} {"train_loss": -24.933298110961914, "global_step": 364952, "epoch": 4397} {"train_loss": -25.440343856811523, "global_step": 364953, "epoch": 4397} {"train_loss": -26.311277389526367, "global_step": 364954, "epoch": 4397} {"train_loss": -26.028045654296875, "global_step": 364955, "epoch": 4397} {"train_loss": -25.74907875061035, "global_step": 364956, "epoch": 4397} {"train_loss": -26.119108200073242, "global_step": 364957, "epoch": 4397} {"train_loss": -26.0635929107666, "global_step": 364958, "epoch": 4397} {"train_loss": -25.668989181518555, "global_step": 364959, "epoch": 4397} {"train_loss": -25.5693302154541, "global_step": 364960, "epoch": 4397} {"train_loss": -25.763715744018555, "global_step": 364961, "epoch": 4397} {"train_loss": -25.95234489440918, "global_step": 364962, "epoch": 4397} {"train_loss": -25.9843807220459, "global_step": 364963, "epoch": 4397} {"train_loss": -26.299488067626953, "global_step": 364964, "epoch": 4397} {"train_loss": -26.192602157592773, "global_step": 364965, "epoch": 4397} {"train_loss": -25.73438835144043, "global_step": 364966, "epoch": 4397} {"train_loss": -26.179611206054688, "global_step": 364967, "epoch": 4397} {"train_loss": -26.099445343017578, "global_step": 364968, "epoch": 4397} {"train_loss": -26.276914596557617, "global_step": 364969, "epoch": 4397} {"train_loss": -25.9782657623291, "global_step": 364970, "epoch": 4397} {"train_loss": -26.27178955078125, "global_step": 364971, "epoch": 4397} {"train_loss": -26.226470947265625, "global_step": 364972, "epoch": 4397} {"train_loss": -26.12662124633789, "global_step": 364973, "epoch": 4397} {"train_loss": -26.195697784423828, "global_step": 364974, "epoch": 4397} {"train_loss": -26.088031768798828, "global_step": 364975, "epoch": 4397} {"train_loss": -26.458099365234375, "global_step": 364976, "epoch": 4397} {"train_loss": -26.287343978881836, "global_step": 364977, "epoch": 4397} {"train_loss": -26.4260196685791, "global_step": 364978, "epoch": 4397} {"train_loss": -26.468793869018555, "global_step": 364979, "epoch": 4397} {"train_loss": -26.48309326171875, "global_step": 364980, "epoch": 4397} {"train_loss": -26.364978790283203, "global_step": 364981, "epoch": 4397} {"train_loss": -26.114185333251953, "global_step": 364982, "epoch": 4397} {"train_loss": -26.464635848999023, "global_step": 364983, "epoch": 4397} {"train_loss": -26.390119552612305, "global_step": 364984, "epoch": 4397} {"train_loss": -26.5116024017334, "global_step": 364985, "epoch": 4397} {"train_loss": -26.446063995361328, "global_step": 364986, "epoch": 4397} {"train_loss": -26.258209228515625, "global_step": 364987, "epoch": 4397} {"train_loss": -26.291889190673828, "global_step": 364988, "epoch": 4397} {"train_loss": -26.457839965820312, "global_step": 364989, "epoch": 4397} {"train_loss": -26.14141845703125, "global_step": 364990, "epoch": 4397} {"train_loss": -26.264347076416016, "global_step": 364991, "epoch": 4397} {"train_loss": -26.3944034576416, "global_step": 364992, "epoch": 4397} {"train_loss": -26.647199630737305, "global_step": 364993, "epoch": 4397} {"train_loss": -26.703948974609375, "global_step": 364994, "epoch": 4397} {"train_loss": -26.158288955688477, "global_step": 364995, "epoch": 4397} {"train_loss": -26.095264434814453, "global_step": 364996, "epoch": 4397} {"train_loss": -26.167072296142578, "global_step": 364997, "epoch": 4397} {"train_loss": -26.01800537109375, "global_step": 364998, "epoch": 4397} {"train_loss": -26.570241928100586, "global_step": 364999, "epoch": 4397} {"train_loss": -26.095422744750977, "global_step": 365000, "epoch": 4397} {"train_loss": -26.37446403503418, "global_step": 365001, "epoch": 4397} {"train_loss": -26.46967124938965, "global_step": 365002, "epoch": 4397} {"train_loss": -26.168472290039062, "global_step": 365003, "epoch": 4397} {"train_loss": -26.479007720947266, "global_step": 365004, "epoch": 4397} {"train_loss": -26.20053482055664, "global_step": 365005, "epoch": 4397} {"train_loss": -26.70832633972168, "global_step": 365006, "epoch": 4397} {"train_loss": -26.201520919799805, "global_step": 365007, "epoch": 4397} {"train_loss": -26.290283203125, "global_step": 365008, "epoch": 4397} {"train_loss": -26.4290771484375, "global_step": 365009, "epoch": 4397} {"train_loss": -26.22211265563965, "global_step": 365010, "epoch": 4397} {"train_loss": -26.330957412719727, "global_step": 365011, "epoch": 4397} {"train_loss": -26.585132598876953, "global_step": 365012, "epoch": 4397} {"train_loss": -26.361373901367188, "global_step": 365013, "epoch": 4397} {"train_loss": -26.174875259399414, "global_step": 365014, "epoch": 4397} {"train_loss": -26.666412353515625, "global_step": 365015, "epoch": 4397} {"train_loss": -26.34186363220215, "global_step": 365016, "epoch": 4397} {"train_loss": -26.4409122467041, "global_step": 365017, "epoch": 4397} {"train_loss": -25.938602447509766, "global_step": 365018, "epoch": 4397} {"train_loss": -26.73282814025879, "global_step": 365019, "epoch": 4397} {"train_loss": -26.30213737487793, "global_step": 365020, "epoch": 4397} {"train_loss": -25.720914840698242, "global_step": 365021, "epoch": 4397} {"train_loss": -25.812091827392578, "global_step": 365022, "epoch": 4397} {"train_loss": -26.26055335998535, "global_step": 365023, "epoch": 4397} {"train_loss": -26.550439834594727, "global_step": 365024, "epoch": 4397} {"train_loss": -25.871244430541992, "global_step": 365025, "epoch": 4397} {"train_loss": -26.166486740112305, "global_step": 365026, "epoch": 4397} {"train_loss": -26.475738525390625, "global_step": 365027, "epoch": 4397} {"train_loss": -26.35255241394043, "global_step": 365028, "epoch": 4397} {"train_loss": -26.480382919311523, "global_step": 365029, "epoch": 4397} {"train_loss": -26.443134307861328, "global_step": 365030, "epoch": 4397} {"train_loss": -26.280853271484375, "global_step": 365031, "epoch": 4397} {"train_loss": -26.6062068939209, "global_step": 365032, "epoch": 4397} {"train_loss": -26.22419141286827, "global_step": 365033, "epoch": 4397, "val_loss": 6634147.0} {"train_loss": -26.12812614440918, "global_step": 365034, "epoch": 4398} {"train_loss": -25.437808990478516, "global_step": 365035, "epoch": 4398} {"train_loss": -24.79253578186035, "global_step": 365036, "epoch": 4398} {"train_loss": -25.831323623657227, "global_step": 365037, "epoch": 4398} {"train_loss": -25.107641220092773, "global_step": 365038, "epoch": 4398} {"train_loss": -25.662158966064453, "global_step": 365039, "epoch": 4398} {"train_loss": -25.954029083251953, "global_step": 365040, "epoch": 4398} {"train_loss": -25.4591007232666, "global_step": 365041, "epoch": 4398} {"train_loss": -25.9080753326416, "global_step": 365042, "epoch": 4398} {"train_loss": -25.791975021362305, "global_step": 365043, "epoch": 4398} {"train_loss": -25.66206932067871, "global_step": 365044, "epoch": 4398} {"train_loss": -26.220727920532227, "global_step": 365045, "epoch": 4398} {"train_loss": -26.124439239501953, "global_step": 365046, "epoch": 4398} {"train_loss": -25.800100326538086, "global_step": 365047, "epoch": 4398} {"train_loss": -26.157621383666992, "global_step": 365048, "epoch": 4398} {"train_loss": -25.853656768798828, "global_step": 365049, "epoch": 4398} {"train_loss": -25.889745712280273, "global_step": 365050, "epoch": 4398} {"train_loss": -26.00482177734375, "global_step": 365051, "epoch": 4398} {"train_loss": -26.294519424438477, "global_step": 365052, "epoch": 4398} {"train_loss": -25.82695960998535, "global_step": 365053, "epoch": 4398} {"train_loss": -26.005887985229492, "global_step": 365054, "epoch": 4398} {"train_loss": -26.158170700073242, "global_step": 365055, "epoch": 4398} {"train_loss": -26.30667495727539, "global_step": 365056, "epoch": 4398} {"train_loss": -26.11056900024414, "global_step": 365057, "epoch": 4398} {"train_loss": -26.0400447845459, "global_step": 365058, "epoch": 4398} {"train_loss": -26.131662368774414, "global_step": 365059, "epoch": 4398} {"train_loss": -26.235504150390625, "global_step": 365060, "epoch": 4398} {"train_loss": -26.186908721923828, "global_step": 365061, "epoch": 4398} {"train_loss": -26.535511016845703, "global_step": 365062, "epoch": 4398} {"train_loss": -26.362812042236328, "global_step": 365063, "epoch": 4398} {"train_loss": -26.60507583618164, "global_step": 365064, "epoch": 4398} {"train_loss": -26.567493438720703, "global_step": 365065, "epoch": 4398} {"train_loss": -26.385623931884766, "global_step": 365066, "epoch": 4398} {"train_loss": -26.488128662109375, "global_step": 365067, "epoch": 4398} {"train_loss": -26.328964233398438, "global_step": 365068, "epoch": 4398} {"train_loss": -26.442670822143555, "global_step": 365069, "epoch": 4398} {"train_loss": -26.53631019592285, "global_step": 365070, "epoch": 4398} {"train_loss": -26.89753532409668, "global_step": 365071, "epoch": 4398} {"train_loss": -26.077289581298828, "global_step": 365072, "epoch": 4398} {"train_loss": -25.841989517211914, "global_step": 365073, "epoch": 4398} {"train_loss": -26.031370162963867, "global_step": 365074, "epoch": 4398} {"train_loss": -25.95355796813965, "global_step": 365075, "epoch": 4398} {"train_loss": -25.927555084228516, "global_step": 365076, "epoch": 4398} {"train_loss": -26.42715835571289, "global_step": 365077, "epoch": 4398} {"train_loss": -26.097427368164062, "global_step": 365078, "epoch": 4398} {"train_loss": -26.31056022644043, "global_step": 365079, "epoch": 4398} {"train_loss": -26.154052734375, "global_step": 365080, "epoch": 4398} {"train_loss": -26.404577255249023, "global_step": 365081, "epoch": 4398} {"train_loss": -25.924793243408203, "global_step": 365082, "epoch": 4398} {"train_loss": -25.988615036010742, "global_step": 365083, "epoch": 4398} {"train_loss": -26.03708267211914, "global_step": 365084, "epoch": 4398} {"train_loss": -26.08428955078125, "global_step": 365085, "epoch": 4398} {"train_loss": -26.347549438476562, "global_step": 365086, "epoch": 4398} {"train_loss": -26.3719425201416, "global_step": 365087, "epoch": 4398} {"train_loss": -26.33914566040039, "global_step": 365088, "epoch": 4398} {"train_loss": -26.62531852722168, "global_step": 365089, "epoch": 4398} {"train_loss": -26.20794677734375, "global_step": 365090, "epoch": 4398} {"train_loss": -26.51222038269043, "global_step": 365091, "epoch": 4398} {"train_loss": -26.086511611938477, "global_step": 365092, "epoch": 4398} {"train_loss": -26.209814071655273, "global_step": 365093, "epoch": 4398} {"train_loss": -26.152990341186523, "global_step": 365094, "epoch": 4398} {"train_loss": -26.3079891204834, "global_step": 365095, "epoch": 4398} {"train_loss": -26.308612823486328, "global_step": 365096, "epoch": 4398} {"train_loss": -26.264066696166992, "global_step": 365097, "epoch": 4398} {"train_loss": -26.210845947265625, "global_step": 365098, "epoch": 4398} {"train_loss": -26.416162490844727, "global_step": 365099, "epoch": 4398} {"train_loss": -26.544452667236328, "global_step": 365100, "epoch": 4398} {"train_loss": -25.7734375, "global_step": 365101, "epoch": 4398} {"train_loss": -26.2822322845459, "global_step": 365102, "epoch": 4398} {"train_loss": -26.349838256835938, "global_step": 365103, "epoch": 4398} {"train_loss": -26.4165096282959, "global_step": 365104, "epoch": 4398} {"train_loss": -26.387176513671875, "global_step": 365105, "epoch": 4398} {"train_loss": -26.230438232421875, "global_step": 365106, "epoch": 4398} {"train_loss": -26.573163986206055, "global_step": 365107, "epoch": 4398} {"train_loss": -26.38153648376465, "global_step": 365108, "epoch": 4398} {"train_loss": -26.58454704284668, "global_step": 365109, "epoch": 4398} {"train_loss": -26.14715576171875, "global_step": 365110, "epoch": 4398} {"train_loss": -26.159177780151367, "global_step": 365111, "epoch": 4398} {"train_loss": -26.166223526000977, "global_step": 365112, "epoch": 4398} {"train_loss": -26.15943717956543, "global_step": 365113, "epoch": 4398} {"train_loss": -26.61273765563965, "global_step": 365114, "epoch": 4398} {"train_loss": -26.84844970703125, "global_step": 365115, "epoch": 4398} {"train_loss": -26.183449182165674, "global_step": 365116, "epoch": 4398, "val_loss": 6582214.0} {"train_loss": -25.812101364135742, "global_step": 365117, "epoch": 4399} {"train_loss": -25.733240127563477, "global_step": 365118, "epoch": 4399} {"train_loss": -25.710424423217773, "global_step": 365119, "epoch": 4399} {"train_loss": -25.985097885131836, "global_step": 365120, "epoch": 4399} {"train_loss": -25.86100196838379, "global_step": 365121, "epoch": 4399} {"train_loss": -26.051761627197266, "global_step": 365122, "epoch": 4399} {"train_loss": -25.744598388671875, "global_step": 365123, "epoch": 4399} {"train_loss": -26.1046142578125, "global_step": 365124, "epoch": 4399} {"train_loss": -26.11683464050293, "global_step": 365125, "epoch": 4399} {"train_loss": -25.7582950592041, "global_step": 365126, "epoch": 4399} {"train_loss": -26.203577041625977, "global_step": 365127, "epoch": 4399} {"train_loss": -25.776538848876953, "global_step": 365128, "epoch": 4399} {"train_loss": -26.040252685546875, "global_step": 365129, "epoch": 4399} {"train_loss": -26.139480590820312, "global_step": 365130, "epoch": 4399} {"train_loss": -26.229116439819336, "global_step": 365131, "epoch": 4399} {"train_loss": -25.94691276550293, "global_step": 365132, "epoch": 4399} {"train_loss": -26.563730239868164, "global_step": 365133, "epoch": 4399} {"train_loss": -25.925872802734375, "global_step": 365134, "epoch": 4399} {"train_loss": -26.417516708374023, "global_step": 365135, "epoch": 4399} {"train_loss": -26.02069664001465, "global_step": 365136, "epoch": 4399} {"train_loss": -26.447952270507812, "global_step": 365137, "epoch": 4399} {"train_loss": -26.24785804748535, "global_step": 365138, "epoch": 4399} {"train_loss": -26.175962448120117, "global_step": 365139, "epoch": 4399} {"train_loss": -26.492868423461914, "global_step": 365140, "epoch": 4399} {"train_loss": -26.217609405517578, "global_step": 365141, "epoch": 4399} {"train_loss": -26.230600357055664, "global_step": 365142, "epoch": 4399} {"train_loss": -26.89638328552246, "global_step": 365143, "epoch": 4399} {"train_loss": -26.314023971557617, "global_step": 365144, "epoch": 4399} {"train_loss": -26.452219009399414, "global_step": 365145, "epoch": 4399} {"train_loss": -26.38653564453125, "global_step": 365146, "epoch": 4399} {"train_loss": -26.01654052734375, "global_step": 365147, "epoch": 4399} {"train_loss": -26.414106369018555, "global_step": 365148, "epoch": 4399} {"train_loss": -26.605213165283203, "global_step": 365149, "epoch": 4399} {"train_loss": -26.41015625, "global_step": 365150, "epoch": 4399} {"train_loss": -26.382984161376953, "global_step": 365151, "epoch": 4399} {"train_loss": -26.71906089782715, "global_step": 365152, "epoch": 4399} {"train_loss": -26.49395751953125, "global_step": 365153, "epoch": 4399} {"train_loss": -26.35820960998535, "global_step": 365154, "epoch": 4399} {"train_loss": -26.566186904907227, "global_step": 365155, "epoch": 4399} {"train_loss": -26.761266708374023, "global_step": 365156, "epoch": 4399} {"train_loss": -26.71966552734375, "global_step": 365157, "epoch": 4399} {"train_loss": -26.669677734375, "global_step": 365158, "epoch": 4399} {"train_loss": -26.615375518798828, "global_step": 365159, "epoch": 4399} {"train_loss": -26.43409538269043, "global_step": 365160, "epoch": 4399} {"train_loss": -26.3386173248291, "global_step": 365161, "epoch": 4399} {"train_loss": -26.714567184448242, "global_step": 365162, "epoch": 4399} {"train_loss": -26.488611221313477, "global_step": 365163, "epoch": 4399} {"train_loss": -26.35283851623535, "global_step": 365164, "epoch": 4399} {"train_loss": -26.827543258666992, "global_step": 365165, "epoch": 4399} {"train_loss": -26.538375854492188, "global_step": 365166, "epoch": 4399} {"train_loss": -26.329748153686523, "global_step": 365167, "epoch": 4399} {"train_loss": -26.52899742126465, "global_step": 365168, "epoch": 4399} {"train_loss": -25.79021644592285, "global_step": 365169, "epoch": 4399} {"train_loss": -25.656116485595703, "global_step": 365170, "epoch": 4399} {"train_loss": -25.406408309936523, "global_step": 365171, "epoch": 4399} {"train_loss": -26.13431167602539, "global_step": 365172, "epoch": 4399} {"train_loss": -26.3560733795166, "global_step": 365173, "epoch": 4399} {"train_loss": -26.66766929626465, "global_step": 365174, "epoch": 4399} {"train_loss": -25.708362579345703, "global_step": 365175, "epoch": 4399} {"train_loss": -25.896961212158203, "global_step": 365176, "epoch": 4399} {"train_loss": -26.495176315307617, "global_step": 365177, "epoch": 4399} {"train_loss": -25.905691146850586, "global_step": 365178, "epoch": 4399} {"train_loss": -26.233478546142578, "global_step": 365179, "epoch": 4399} {"train_loss": -25.92488670349121, "global_step": 365180, "epoch": 4399} {"train_loss": -26.35732078552246, "global_step": 365181, "epoch": 4399} {"train_loss": -26.117521286010742, "global_step": 365182, "epoch": 4399} {"train_loss": -26.408512115478516, "global_step": 365183, "epoch": 4399} {"train_loss": -26.301084518432617, "global_step": 365184, "epoch": 4399} {"train_loss": -26.04254150390625, "global_step": 365185, "epoch": 4399} {"train_loss": -26.3282413482666, "global_step": 365186, "epoch": 4399} {"train_loss": -26.30499839782715, "global_step": 365187, "epoch": 4399} {"train_loss": -26.023096084594727, "global_step": 365188, "epoch": 4399} {"train_loss": -26.00752067565918, "global_step": 365189, "epoch": 4399} {"train_loss": -26.371326446533203, "global_step": 365190, "epoch": 4399} {"train_loss": -26.45273208618164, "global_step": 365191, "epoch": 4399} {"train_loss": -26.590234756469727, "global_step": 365192, "epoch": 4399} {"train_loss": -26.060102462768555, "global_step": 365193, "epoch": 4399} {"train_loss": -26.299543380737305, "global_step": 365194, "epoch": 4399} {"train_loss": -26.17030143737793, "global_step": 365195, "epoch": 4399} {"train_loss": -26.673425674438477, "global_step": 365196, "epoch": 4399} {"train_loss": -26.535171508789062, "global_step": 365197, "epoch": 4399} {"train_loss": -26.497678756713867, "global_step": 365198, "epoch": 4399} {"train_loss": -26.272685223315136, "global_step": 365199, "epoch": 4399, "val_loss": 6615543.5} {"train_loss": -25.80023193359375, "global_step": 365200, "epoch": 4400} {"train_loss": -25.67095947265625, "global_step": 365201, "epoch": 4400} {"train_loss": -26.361743927001953, "global_step": 365202, "epoch": 4400} {"train_loss": -25.775415420532227, "global_step": 365203, "epoch": 4400} {"train_loss": -25.848770141601562, "global_step": 365204, "epoch": 4400} {"train_loss": -26.146167755126953, "global_step": 365205, "epoch": 4400} {"train_loss": -25.614404678344727, "global_step": 365206, "epoch": 4400} {"train_loss": -26.21087646484375, "global_step": 365207, "epoch": 4400} {"train_loss": -25.592477798461914, "global_step": 365208, "epoch": 4400} {"train_loss": -25.646148681640625, "global_step": 365209, "epoch": 4400} {"train_loss": -25.839569091796875, "global_step": 365210, "epoch": 4400} {"train_loss": -25.85610008239746, "global_step": 365211, "epoch": 4400} {"train_loss": -25.908491134643555, "global_step": 365212, "epoch": 4400} {"train_loss": -25.933734893798828, "global_step": 365213, "epoch": 4400} {"train_loss": -26.003034591674805, "global_step": 365214, "epoch": 4400} {"train_loss": -25.867109298706055, "global_step": 365215, "epoch": 4400} {"train_loss": -25.908117294311523, "global_step": 365216, "epoch": 4400} {"train_loss": -26.164106369018555, "global_step": 365217, "epoch": 4400} {"train_loss": -25.9551944732666, "global_step": 365218, "epoch": 4400} {"train_loss": -26.1700439453125, "global_step": 365219, "epoch": 4400} {"train_loss": -26.0555362701416, "global_step": 365220, "epoch": 4400} {"train_loss": -26.11115074157715, "global_step": 365221, "epoch": 4400} {"train_loss": -26.38486099243164, "global_step": 365222, "epoch": 4400} {"train_loss": -26.243534088134766, "global_step": 365223, "epoch": 4400} {"train_loss": -26.03700065612793, "global_step": 365224, "epoch": 4400} {"train_loss": -26.14666175842285, "global_step": 365225, "epoch": 4400} {"train_loss": -26.46537208557129, "global_step": 365226, "epoch": 4400} {"train_loss": -26.17290687561035, "global_step": 365227, "epoch": 4400} {"train_loss": -26.396650314331055, "global_step": 365228, "epoch": 4400} {"train_loss": -26.3098087310791, "global_step": 365229, "epoch": 4400} {"train_loss": -26.221830368041992, "global_step": 365230, "epoch": 4400} {"train_loss": -26.39637565612793, "global_step": 365231, "epoch": 4400} {"train_loss": -26.3581600189209, "global_step": 365232, "epoch": 4400} {"train_loss": -26.269189834594727, "global_step": 365233, "epoch": 4400} {"train_loss": -26.251562118530273, "global_step": 365234, "epoch": 4400} {"train_loss": -26.4591121673584, "global_step": 365235, "epoch": 4400} {"train_loss": -26.210824966430664, "global_step": 365236, "epoch": 4400} {"train_loss": -26.495695114135742, "global_step": 365237, "epoch": 4400} {"train_loss": -26.326208114624023, "global_step": 365238, "epoch": 4400} {"train_loss": -26.17998695373535, "global_step": 365239, "epoch": 4400} {"train_loss": -26.306720733642578, "global_step": 365240, "epoch": 4400} {"train_loss": -26.288549423217773, "global_step": 365241, "epoch": 4400} {"train_loss": -26.9066104888916, "global_step": 365242, "epoch": 4400} {"train_loss": -26.67542839050293, "global_step": 365243, "epoch": 4400} {"train_loss": -26.744720458984375, "global_step": 365244, "epoch": 4400} {"train_loss": -26.245954513549805, "global_step": 365245, "epoch": 4400} {"train_loss": -26.23664665222168, "global_step": 365246, "epoch": 4400} {"train_loss": -26.01295280456543, "global_step": 365247, "epoch": 4400} {"train_loss": -26.641904830932617, "global_step": 365248, "epoch": 4400} {"train_loss": -26.23965835571289, "global_step": 365249, "epoch": 4400} {"train_loss": -26.01959228515625, "global_step": 365250, "epoch": 4400} {"train_loss": -25.860340118408203, "global_step": 365251, "epoch": 4400} {"train_loss": -26.011816024780273, "global_step": 365252, "epoch": 4400} {"train_loss": -26.7458553314209, "global_step": 365253, "epoch": 4400} {"train_loss": -26.661060333251953, "global_step": 365254, "epoch": 4400} {"train_loss": -26.432510375976562, "global_step": 365255, "epoch": 4400} {"train_loss": -25.778167724609375, "global_step": 365256, "epoch": 4400} {"train_loss": -26.351734161376953, "global_step": 365257, "epoch": 4400} {"train_loss": -26.28376579284668, "global_step": 365258, "epoch": 4400} {"train_loss": -26.01218605041504, "global_step": 365259, "epoch": 4400} {"train_loss": -25.948444366455078, "global_step": 365260, "epoch": 4400} {"train_loss": -26.42195701599121, "global_step": 365261, "epoch": 4400} {"train_loss": -26.415342330932617, "global_step": 365262, "epoch": 4400} {"train_loss": -26.64569664001465, "global_step": 365263, "epoch": 4400} {"train_loss": -26.228973388671875, "global_step": 365264, "epoch": 4400} {"train_loss": -26.082223892211914, "global_step": 365265, "epoch": 4400} {"train_loss": -26.317157745361328, "global_step": 365266, "epoch": 4400} {"train_loss": -26.138885498046875, "global_step": 365267, "epoch": 4400} {"train_loss": -26.207839965820312, "global_step": 365268, "epoch": 4400} {"train_loss": -26.255163192749023, "global_step": 365269, "epoch": 4400} {"train_loss": -26.753095626831055, "global_step": 365270, "epoch": 4400} {"train_loss": -26.47998046875, "global_step": 365271, "epoch": 4400} {"train_loss": -26.069915771484375, "global_step": 365272, "epoch": 4400} {"train_loss": -26.485090255737305, "global_step": 365273, "epoch": 4400} {"train_loss": -26.49342155456543, "global_step": 365274, "epoch": 4400} {"train_loss": -26.521717071533203, "global_step": 365275, "epoch": 4400} {"train_loss": -26.530597686767578, "global_step": 365276, "epoch": 4400} {"train_loss": -26.62347412109375, "global_step": 365277, "epoch": 4400} {"train_loss": -26.614423751831055, "global_step": 365278, "epoch": 4400} {"train_loss": -26.424055099487305, "global_step": 365279, "epoch": 4400} {"train_loss": -26.803064346313477, "global_step": 365280, "epoch": 4400} {"train_loss": -26.462194442749023, "global_step": 365281, "epoch": 4400} {"train_loss": -26.23210185407156, "global_step": 365282, "epoch": 4400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6505151.0} {"train_loss": -26.126972198486328, "global_step": 365283, "epoch": 4401} {"train_loss": -25.76956558227539, "global_step": 365284, "epoch": 4401} {"train_loss": -25.322669982910156, "global_step": 365285, "epoch": 4401} {"train_loss": -24.927391052246094, "global_step": 365286, "epoch": 4401} {"train_loss": -25.541418075561523, "global_step": 365287, "epoch": 4401} {"train_loss": -25.736957550048828, "global_step": 365288, "epoch": 4401} {"train_loss": -24.667444229125977, "global_step": 365289, "epoch": 4401} {"train_loss": -24.78309440612793, "global_step": 365290, "epoch": 4401} {"train_loss": -25.81180191040039, "global_step": 365291, "epoch": 4401} {"train_loss": -25.274961471557617, "global_step": 365292, "epoch": 4401} {"train_loss": -25.55788803100586, "global_step": 365293, "epoch": 4401} {"train_loss": -25.2275390625, "global_step": 365294, "epoch": 4401} {"train_loss": -26.01362419128418, "global_step": 365295, "epoch": 4401} {"train_loss": -24.8675537109375, "global_step": 365296, "epoch": 4401} {"train_loss": -25.868804931640625, "global_step": 365297, "epoch": 4401} {"train_loss": -25.30764389038086, "global_step": 365298, "epoch": 4401} {"train_loss": -25.626956939697266, "global_step": 365299, "epoch": 4401} {"train_loss": -25.882232666015625, "global_step": 365300, "epoch": 4401} {"train_loss": -25.851642608642578, "global_step": 365301, "epoch": 4401} {"train_loss": -25.8178653717041, "global_step": 365302, "epoch": 4401} {"train_loss": -25.817890167236328, "global_step": 365303, "epoch": 4401} {"train_loss": -25.975317001342773, "global_step": 365304, "epoch": 4401} {"train_loss": -26.08574867248535, "global_step": 365305, "epoch": 4401} {"train_loss": -26.52227783203125, "global_step": 365306, "epoch": 4401} {"train_loss": -25.89875602722168, "global_step": 365307, "epoch": 4401} {"train_loss": -25.918140411376953, "global_step": 365308, "epoch": 4401} {"train_loss": -25.8026180267334, "global_step": 365309, "epoch": 4401} {"train_loss": -25.893341064453125, "global_step": 365310, "epoch": 4401} {"train_loss": -26.08454704284668, "global_step": 365311, "epoch": 4401} {"train_loss": -25.864978790283203, "global_step": 365312, "epoch": 4401} {"train_loss": -25.805755615234375, "global_step": 365313, "epoch": 4401} {"train_loss": -26.456012725830078, "global_step": 365314, "epoch": 4401} {"train_loss": -26.281787872314453, "global_step": 365315, "epoch": 4401} {"train_loss": -26.18293571472168, "global_step": 365316, "epoch": 4401} {"train_loss": -26.218265533447266, "global_step": 365317, "epoch": 4401} {"train_loss": -26.477338790893555, "global_step": 365318, "epoch": 4401} {"train_loss": -26.102630615234375, "global_step": 365319, "epoch": 4401} {"train_loss": -26.570886611938477, "global_step": 365320, "epoch": 4401} {"train_loss": -26.14523696899414, "global_step": 365321, "epoch": 4401} {"train_loss": -26.404266357421875, "global_step": 365322, "epoch": 4401} {"train_loss": -26.209028244018555, "global_step": 365323, "epoch": 4401} {"train_loss": -26.06955337524414, "global_step": 365324, "epoch": 4401} {"train_loss": -26.218067169189453, "global_step": 365325, "epoch": 4401} {"train_loss": -26.193878173828125, "global_step": 365326, "epoch": 4401} {"train_loss": -26.290159225463867, "global_step": 365327, "epoch": 4401} {"train_loss": -26.336572647094727, "global_step": 365328, "epoch": 4401} {"train_loss": -26.358015060424805, "global_step": 365329, "epoch": 4401} {"train_loss": -25.988767623901367, "global_step": 365330, "epoch": 4401} {"train_loss": -26.268217086791992, "global_step": 365331, "epoch": 4401} {"train_loss": -26.415319442749023, "global_step": 365332, "epoch": 4401} {"train_loss": -26.05466651916504, "global_step": 365333, "epoch": 4401} {"train_loss": -26.701745986938477, "global_step": 365334, "epoch": 4401} {"train_loss": -26.290985107421875, "global_step": 365335, "epoch": 4401} {"train_loss": -26.282751083374023, "global_step": 365336, "epoch": 4401} {"train_loss": -26.71209144592285, "global_step": 365337, "epoch": 4401} {"train_loss": -26.208908081054688, "global_step": 365338, "epoch": 4401} {"train_loss": -26.15449333190918, "global_step": 365339, "epoch": 4401} {"train_loss": -26.359363555908203, "global_step": 365340, "epoch": 4401} {"train_loss": -26.308765411376953, "global_step": 365341, "epoch": 4401} {"train_loss": -26.32053565979004, "global_step": 365342, "epoch": 4401} {"train_loss": -26.426305770874023, "global_step": 365343, "epoch": 4401} {"train_loss": -26.160797119140625, "global_step": 365344, "epoch": 4401} {"train_loss": -26.353830337524414, "global_step": 365345, "epoch": 4401} {"train_loss": -26.396839141845703, "global_step": 365346, "epoch": 4401} {"train_loss": -26.707996368408203, "global_step": 365347, "epoch": 4401} {"train_loss": -26.12623405456543, "global_step": 365348, "epoch": 4401} {"train_loss": -26.513614654541016, "global_step": 365349, "epoch": 4401} {"train_loss": -26.326156616210938, "global_step": 365350, "epoch": 4401} {"train_loss": -25.956466674804688, "global_step": 365351, "epoch": 4401} {"train_loss": -26.433979034423828, "global_step": 365352, "epoch": 4401} {"train_loss": -26.364593505859375, "global_step": 365353, "epoch": 4401} {"train_loss": -26.2833194732666, "global_step": 365354, "epoch": 4401} {"train_loss": -26.31843376159668, "global_step": 365355, "epoch": 4401} {"train_loss": -26.285871505737305, "global_step": 365356, "epoch": 4401} {"train_loss": -26.615966796875, "global_step": 365357, "epoch": 4401} {"train_loss": -26.17853355407715, "global_step": 365358, "epoch": 4401} {"train_loss": -26.30889320373535, "global_step": 365359, "epoch": 4401} {"train_loss": -26.228336334228516, "global_step": 365360, "epoch": 4401} {"train_loss": -26.012495040893555, "global_step": 365361, "epoch": 4401} {"train_loss": -26.47532081604004, "global_step": 365362, "epoch": 4401} {"train_loss": -26.30108642578125, "global_step": 365363, "epoch": 4401} {"train_loss": -26.296558380126953, "global_step": 365364, "epoch": 4401} {"train_loss": -26.058718784745917, "global_step": 365365, "epoch": 4401, "val_loss": 6537103.0} {"train_loss": -23.961931228637695, "global_step": 365366, "epoch": 4402} {"train_loss": -23.713817596435547, "global_step": 365367, "epoch": 4402} {"train_loss": -25.270397186279297, "global_step": 365368, "epoch": 4402} {"train_loss": -24.750730514526367, "global_step": 365369, "epoch": 4402} {"train_loss": -25.210647583007812, "global_step": 365370, "epoch": 4402} {"train_loss": -24.90451431274414, "global_step": 365371, "epoch": 4402} {"train_loss": -26.215803146362305, "global_step": 365372, "epoch": 4402} {"train_loss": -25.00868034362793, "global_step": 365373, "epoch": 4402} {"train_loss": -25.681943893432617, "global_step": 365374, "epoch": 4402} {"train_loss": -25.428720474243164, "global_step": 365375, "epoch": 4402} {"train_loss": -25.747486114501953, "global_step": 365376, "epoch": 4402} {"train_loss": -25.63202476501465, "global_step": 365377, "epoch": 4402} {"train_loss": -25.86783218383789, "global_step": 365378, "epoch": 4402} {"train_loss": -25.640430450439453, "global_step": 365379, "epoch": 4402} {"train_loss": -25.771936416625977, "global_step": 365380, "epoch": 4402} {"train_loss": -25.498987197875977, "global_step": 365381, "epoch": 4402} {"train_loss": -25.362308502197266, "global_step": 365382, "epoch": 4402} {"train_loss": -25.86322593688965, "global_step": 365383, "epoch": 4402} {"train_loss": -25.84681510925293, "global_step": 365384, "epoch": 4402} {"train_loss": -25.688947677612305, "global_step": 365385, "epoch": 4402} {"train_loss": -25.93927001953125, "global_step": 365386, "epoch": 4402} {"train_loss": -25.9375, "global_step": 365387, "epoch": 4402} {"train_loss": -25.940656661987305, "global_step": 365388, "epoch": 4402} {"train_loss": -26.095020294189453, "global_step": 365389, "epoch": 4402} {"train_loss": -25.9773006439209, "global_step": 365390, "epoch": 4402} {"train_loss": -26.135787963867188, "global_step": 365391, "epoch": 4402} {"train_loss": -25.53912353515625, "global_step": 365392, "epoch": 4402} {"train_loss": -25.878036499023438, "global_step": 365393, "epoch": 4402} {"train_loss": -26.279296875, "global_step": 365394, "epoch": 4402} {"train_loss": -26.03863525390625, "global_step": 365395, "epoch": 4402} {"train_loss": -26.093774795532227, "global_step": 365396, "epoch": 4402} {"train_loss": -26.302127838134766, "global_step": 365397, "epoch": 4402} {"train_loss": -26.1310977935791, "global_step": 365398, "epoch": 4402} {"train_loss": -26.352231979370117, "global_step": 365399, "epoch": 4402} {"train_loss": -26.10016441345215, "global_step": 365400, "epoch": 4402} {"train_loss": -26.156469345092773, "global_step": 365401, "epoch": 4402} {"train_loss": -26.08758544921875, "global_step": 365402, "epoch": 4402} {"train_loss": -26.050329208374023, "global_step": 365403, "epoch": 4402} {"train_loss": -26.36564064025879, "global_step": 365404, "epoch": 4402} {"train_loss": -26.3792781829834, "global_step": 365405, "epoch": 4402} {"train_loss": -26.15476417541504, "global_step": 365406, "epoch": 4402} {"train_loss": -26.240781784057617, "global_step": 365407, "epoch": 4402} {"train_loss": -26.445270538330078, "global_step": 365408, "epoch": 4402} {"train_loss": -26.634016036987305, "global_step": 365409, "epoch": 4402} {"train_loss": -26.29401206970215, "global_step": 365410, "epoch": 4402} {"train_loss": -26.565763473510742, "global_step": 365411, "epoch": 4402} {"train_loss": -26.588336944580078, "global_step": 365412, "epoch": 4402} {"train_loss": -26.434036254882812, "global_step": 365413, "epoch": 4402} {"train_loss": -26.6577091217041, "global_step": 365414, "epoch": 4402} {"train_loss": -26.461584091186523, "global_step": 365415, "epoch": 4402} {"train_loss": -26.526880264282227, "global_step": 365416, "epoch": 4402} {"train_loss": -26.226293563842773, "global_step": 365417, "epoch": 4402} {"train_loss": -26.501113891601562, "global_step": 365418, "epoch": 4402} {"train_loss": -26.328054428100586, "global_step": 365419, "epoch": 4402} {"train_loss": -26.46514320373535, "global_step": 365420, "epoch": 4402} {"train_loss": -26.226877212524414, "global_step": 365421, "epoch": 4402} {"train_loss": -26.645811080932617, "global_step": 365422, "epoch": 4402} {"train_loss": -26.458303451538086, "global_step": 365423, "epoch": 4402} {"train_loss": -26.431060791015625, "global_step": 365424, "epoch": 4402} {"train_loss": -26.622304916381836, "global_step": 365425, "epoch": 4402} {"train_loss": -26.550140380859375, "global_step": 365426, "epoch": 4402} {"train_loss": -26.185394287109375, "global_step": 365427, "epoch": 4402} {"train_loss": -26.464826583862305, "global_step": 365428, "epoch": 4402} {"train_loss": -26.232135772705078, "global_step": 365429, "epoch": 4402} {"train_loss": -26.136356353759766, "global_step": 365430, "epoch": 4402} {"train_loss": -26.325733184814453, "global_step": 365431, "epoch": 4402} {"train_loss": -26.407556533813477, "global_step": 365432, "epoch": 4402} {"train_loss": -26.599302291870117, "global_step": 365433, "epoch": 4402} {"train_loss": -26.6571044921875, "global_step": 365434, "epoch": 4402} {"train_loss": -26.715452194213867, "global_step": 365435, "epoch": 4402} {"train_loss": -26.12432861328125, "global_step": 365436, "epoch": 4402} {"train_loss": -26.416513442993164, "global_step": 365437, "epoch": 4402} {"train_loss": -26.436193466186523, "global_step": 365438, "epoch": 4402} {"train_loss": -26.81867790222168, "global_step": 365439, "epoch": 4402} {"train_loss": -26.540143966674805, "global_step": 365440, "epoch": 4402} {"train_loss": -26.140369415283203, "global_step": 365441, "epoch": 4402} {"train_loss": -26.38870620727539, "global_step": 365442, "epoch": 4402} {"train_loss": -26.175933837890625, "global_step": 365443, "epoch": 4402} {"train_loss": -26.285785675048828, "global_step": 365444, "epoch": 4402} {"train_loss": -26.585174560546875, "global_step": 365445, "epoch": 4402} {"train_loss": -26.17841148376465, "global_step": 365446, "epoch": 4402} {"train_loss": -26.423974990844727, "global_step": 365447, "epoch": 4402} {"train_loss": -26.07784744630377, "global_step": 365448, "epoch": 4402, "val_loss": 6574433.0} {"train_loss": -25.643823623657227, "global_step": 365449, "epoch": 4403} {"train_loss": -25.81123924255371, "global_step": 365450, "epoch": 4403} {"train_loss": -25.57846450805664, "global_step": 365451, "epoch": 4403} {"train_loss": -25.518632888793945, "global_step": 365452, "epoch": 4403} {"train_loss": -25.779937744140625, "global_step": 365453, "epoch": 4403} {"train_loss": -25.253393173217773, "global_step": 365454, "epoch": 4403} {"train_loss": -25.417057037353516, "global_step": 365455, "epoch": 4403} {"train_loss": -25.636627197265625, "global_step": 365456, "epoch": 4403} {"train_loss": -25.7302188873291, "global_step": 365457, "epoch": 4403} {"train_loss": -25.723722457885742, "global_step": 365458, "epoch": 4403} {"train_loss": -25.416898727416992, "global_step": 365459, "epoch": 4403} {"train_loss": -25.942901611328125, "global_step": 365460, "epoch": 4403} {"train_loss": -26.18316078186035, "global_step": 365461, "epoch": 4403} {"train_loss": -25.822717666625977, "global_step": 365462, "epoch": 4403} {"train_loss": -25.588754653930664, "global_step": 365463, "epoch": 4403} {"train_loss": -25.742109298706055, "global_step": 365464, "epoch": 4403} {"train_loss": -25.58443260192871, "global_step": 365465, "epoch": 4403} {"train_loss": -26.124082565307617, "global_step": 365466, "epoch": 4403} {"train_loss": -25.886869430541992, "global_step": 365467, "epoch": 4403} {"train_loss": -26.066598892211914, "global_step": 365468, "epoch": 4403} {"train_loss": -26.27923011779785, "global_step": 365469, "epoch": 4403} {"train_loss": -26.187061309814453, "global_step": 365470, "epoch": 4403} {"train_loss": -26.29945182800293, "global_step": 365471, "epoch": 4403} {"train_loss": -26.1014404296875, "global_step": 365472, "epoch": 4403} {"train_loss": -26.1324405670166, "global_step": 365473, "epoch": 4403} {"train_loss": -26.16956901550293, "global_step": 365474, "epoch": 4403} {"train_loss": -26.101882934570312, "global_step": 365475, "epoch": 4403} {"train_loss": -25.798852920532227, "global_step": 365476, "epoch": 4403} {"train_loss": -25.690032958984375, "global_step": 365477, "epoch": 4403} {"train_loss": -26.242826461791992, "global_step": 365478, "epoch": 4403} {"train_loss": -26.03742790222168, "global_step": 365479, "epoch": 4403} {"train_loss": -26.309293746948242, "global_step": 365480, "epoch": 4403} {"train_loss": -25.9852237701416, "global_step": 365481, "epoch": 4403} {"train_loss": -26.51592445373535, "global_step": 365482, "epoch": 4403} {"train_loss": -26.032270431518555, "global_step": 365483, "epoch": 4403} {"train_loss": -26.457477569580078, "global_step": 365484, "epoch": 4403} {"train_loss": -26.532983779907227, "global_step": 365485, "epoch": 4403} {"train_loss": -26.6253719329834, "global_step": 365486, "epoch": 4403} {"train_loss": -26.511062622070312, "global_step": 365487, "epoch": 4403} {"train_loss": -26.626312255859375, "global_step": 365488, "epoch": 4403} {"train_loss": -26.682825088500977, "global_step": 365489, "epoch": 4403} {"train_loss": -26.34177589416504, "global_step": 365490, "epoch": 4403} {"train_loss": -26.437061309814453, "global_step": 365491, "epoch": 4403} {"train_loss": -26.46368980407715, "global_step": 365492, "epoch": 4403} {"train_loss": -26.669143676757812, "global_step": 365493, "epoch": 4403} {"train_loss": -26.238855361938477, "global_step": 365494, "epoch": 4403} {"train_loss": -26.44805908203125, "global_step": 365495, "epoch": 4403} {"train_loss": -26.527267456054688, "global_step": 365496, "epoch": 4403} {"train_loss": -26.17280387878418, "global_step": 365497, "epoch": 4403} {"train_loss": -26.08583641052246, "global_step": 365498, "epoch": 4403} {"train_loss": -26.564315795898438, "global_step": 365499, "epoch": 4403} {"train_loss": -26.609027862548828, "global_step": 365500, "epoch": 4403} {"train_loss": -26.18269157409668, "global_step": 365501, "epoch": 4403} {"train_loss": -26.339771270751953, "global_step": 365502, "epoch": 4403} {"train_loss": -26.04422378540039, "global_step": 365503, "epoch": 4403} {"train_loss": -26.67279624938965, "global_step": 365504, "epoch": 4403} {"train_loss": -26.323596954345703, "global_step": 365505, "epoch": 4403} {"train_loss": -26.597137451171875, "global_step": 365506, "epoch": 4403} {"train_loss": -26.463775634765625, "global_step": 365507, "epoch": 4403} {"train_loss": -26.12603759765625, "global_step": 365508, "epoch": 4403} {"train_loss": -26.12940788269043, "global_step": 365509, "epoch": 4403} {"train_loss": -26.55457878112793, "global_step": 365510, "epoch": 4403} {"train_loss": -26.594390869140625, "global_step": 365511, "epoch": 4403} {"train_loss": -26.1424617767334, "global_step": 365512, "epoch": 4403} {"train_loss": -26.52802085876465, "global_step": 365513, "epoch": 4403} {"train_loss": -26.284582138061523, "global_step": 365514, "epoch": 4403} {"train_loss": -26.298065185546875, "global_step": 365515, "epoch": 4403} {"train_loss": -26.178022384643555, "global_step": 365516, "epoch": 4403} {"train_loss": -26.35970115661621, "global_step": 365517, "epoch": 4403} {"train_loss": -26.21767234802246, "global_step": 365518, "epoch": 4403} {"train_loss": -26.05893325805664, "global_step": 365519, "epoch": 4403} {"train_loss": -26.634857177734375, "global_step": 365520, "epoch": 4403} {"train_loss": -26.250059127807617, "global_step": 365521, "epoch": 4403} {"train_loss": -26.25274658203125, "global_step": 365522, "epoch": 4403} {"train_loss": -26.54836082458496, "global_step": 365523, "epoch": 4403} {"train_loss": -26.251972198486328, "global_step": 365524, "epoch": 4403} {"train_loss": -26.498998641967773, "global_step": 365525, "epoch": 4403} {"train_loss": -26.272293090820312, "global_step": 365526, "epoch": 4403} {"train_loss": -26.384618759155273, "global_step": 365527, "epoch": 4403} {"train_loss": -26.501489639282227, "global_step": 365528, "epoch": 4403} {"train_loss": -26.590200424194336, "global_step": 365529, "epoch": 4403} {"train_loss": -26.54364013671875, "global_step": 365530, "epoch": 4403} {"train_loss": -26.185838676360717, "global_step": 365531, "epoch": 4403, "val_loss": 6527356.0} {"train_loss": -25.164142608642578, "global_step": 365532, "epoch": 4404} {"train_loss": -25.59908676147461, "global_step": 365533, "epoch": 4404} {"train_loss": -25.761219024658203, "global_step": 365534, "epoch": 4404} {"train_loss": -25.52011489868164, "global_step": 365535, "epoch": 4404} {"train_loss": -26.18828773498535, "global_step": 365536, "epoch": 4404} {"train_loss": -26.13569450378418, "global_step": 365537, "epoch": 4404} {"train_loss": -25.752578735351562, "global_step": 365538, "epoch": 4404} {"train_loss": -25.811330795288086, "global_step": 365539, "epoch": 4404} {"train_loss": -25.881128311157227, "global_step": 365540, "epoch": 4404} {"train_loss": -25.992660522460938, "global_step": 365541, "epoch": 4404} {"train_loss": -25.913129806518555, "global_step": 365542, "epoch": 4404} {"train_loss": -25.923368453979492, "global_step": 365543, "epoch": 4404} {"train_loss": -26.133508682250977, "global_step": 365544, "epoch": 4404} {"train_loss": -26.198352813720703, "global_step": 365545, "epoch": 4404} {"train_loss": -25.95961570739746, "global_step": 365546, "epoch": 4404} {"train_loss": -26.408567428588867, "global_step": 365547, "epoch": 4404} {"train_loss": -26.099945068359375, "global_step": 365548, "epoch": 4404} {"train_loss": -26.161865234375, "global_step": 365549, "epoch": 4404} {"train_loss": -26.311389923095703, "global_step": 365550, "epoch": 4404} {"train_loss": -26.11927604675293, "global_step": 365551, "epoch": 4404} {"train_loss": -26.253820419311523, "global_step": 365552, "epoch": 4404} {"train_loss": -25.93604850769043, "global_step": 365553, "epoch": 4404} {"train_loss": -26.03143882751465, "global_step": 365554, "epoch": 4404} {"train_loss": -26.27189064025879, "global_step": 365555, "epoch": 4404} {"train_loss": -25.841693878173828, "global_step": 365556, "epoch": 4404} {"train_loss": -26.0362491607666, "global_step": 365557, "epoch": 4404} {"train_loss": -26.38630485534668, "global_step": 365558, "epoch": 4404} {"train_loss": -26.31244468688965, "global_step": 365559, "epoch": 4404} {"train_loss": -26.377857208251953, "global_step": 365560, "epoch": 4404} {"train_loss": -25.985309600830078, "global_step": 365561, "epoch": 4404} {"train_loss": -26.231597900390625, "global_step": 365562, "epoch": 4404} {"train_loss": -26.240568161010742, "global_step": 365563, "epoch": 4404} {"train_loss": -26.305566787719727, "global_step": 365564, "epoch": 4404} {"train_loss": -26.619464874267578, "global_step": 365565, "epoch": 4404} {"train_loss": -26.82692527770996, "global_step": 365566, "epoch": 4404} {"train_loss": -26.452138900756836, "global_step": 365567, "epoch": 4404} {"train_loss": -26.68379783630371, "global_step": 365568, "epoch": 4404} {"train_loss": -26.313623428344727, "global_step": 365569, "epoch": 4404} {"train_loss": -26.532318115234375, "global_step": 365570, "epoch": 4404} {"train_loss": -26.332717895507812, "global_step": 365571, "epoch": 4404} {"train_loss": -26.57159423828125, "global_step": 365572, "epoch": 4404} {"train_loss": -26.527753829956055, "global_step": 365573, "epoch": 4404} {"train_loss": -26.32988929748535, "global_step": 365574, "epoch": 4404} {"train_loss": -26.016714096069336, "global_step": 365575, "epoch": 4404} {"train_loss": -26.30683708190918, "global_step": 365576, "epoch": 4404} {"train_loss": -26.18256950378418, "global_step": 365577, "epoch": 4404} {"train_loss": -26.640241622924805, "global_step": 365578, "epoch": 4404} {"train_loss": -26.289020538330078, "global_step": 365579, "epoch": 4404} {"train_loss": -26.830368041992188, "global_step": 365580, "epoch": 4404} {"train_loss": -26.076269149780273, "global_step": 365581, "epoch": 4404} {"train_loss": -26.07203483581543, "global_step": 365582, "epoch": 4404} {"train_loss": -26.689870834350586, "global_step": 365583, "epoch": 4404} {"train_loss": -26.437381744384766, "global_step": 365584, "epoch": 4404} {"train_loss": -26.06812858581543, "global_step": 365585, "epoch": 4404} {"train_loss": -26.140920639038086, "global_step": 365586, "epoch": 4404} {"train_loss": -26.20149040222168, "global_step": 365587, "epoch": 4404} {"train_loss": -26.287710189819336, "global_step": 365588, "epoch": 4404} {"train_loss": -26.040149688720703, "global_step": 365589, "epoch": 4404} {"train_loss": -26.18588638305664, "global_step": 365590, "epoch": 4404} {"train_loss": -26.035308837890625, "global_step": 365591, "epoch": 4404} {"train_loss": -26.498004913330078, "global_step": 365592, "epoch": 4404} {"train_loss": -25.99163818359375, "global_step": 365593, "epoch": 4404} {"train_loss": -26.06609535217285, "global_step": 365594, "epoch": 4404} {"train_loss": -25.7094783782959, "global_step": 365595, "epoch": 4404} {"train_loss": -26.32990837097168, "global_step": 365596, "epoch": 4404} {"train_loss": -25.977964401245117, "global_step": 365597, "epoch": 4404} {"train_loss": -26.271093368530273, "global_step": 365598, "epoch": 4404} {"train_loss": -25.958759307861328, "global_step": 365599, "epoch": 4404} {"train_loss": -26.138147354125977, "global_step": 365600, "epoch": 4404} {"train_loss": -26.41082191467285, "global_step": 365601, "epoch": 4404} {"train_loss": -26.535369873046875, "global_step": 365602, "epoch": 4404} {"train_loss": -26.432165145874023, "global_step": 365603, "epoch": 4404} {"train_loss": -26.419204711914062, "global_step": 365604, "epoch": 4404} {"train_loss": -26.577787399291992, "global_step": 365605, "epoch": 4404} {"train_loss": -26.20930290222168, "global_step": 365606, "epoch": 4404} {"train_loss": -26.08296012878418, "global_step": 365607, "epoch": 4404} {"train_loss": -26.535480499267578, "global_step": 365608, "epoch": 4404} {"train_loss": -26.191373825073242, "global_step": 365609, "epoch": 4404} {"train_loss": -26.193662643432617, "global_step": 365610, "epoch": 4404} {"train_loss": -26.036401748657227, "global_step": 365611, "epoch": 4404} {"train_loss": -26.20159912109375, "global_step": 365612, "epoch": 4404} {"train_loss": -26.5528621673584, "global_step": 365613, "epoch": 4404} {"train_loss": -26.202324189335467, "global_step": 365614, "epoch": 4404, "val_loss": 6606725.0} {"train_loss": -26.23772621154785, "global_step": 365615, "epoch": 4405} {"train_loss": -26.00252342224121, "global_step": 365616, "epoch": 4405} {"train_loss": -26.017770767211914, "global_step": 365617, "epoch": 4405} {"train_loss": -25.990331649780273, "global_step": 365618, "epoch": 4405} {"train_loss": -26.224536895751953, "global_step": 365619, "epoch": 4405} {"train_loss": -26.18010902404785, "global_step": 365620, "epoch": 4405} {"train_loss": -26.653717041015625, "global_step": 365621, "epoch": 4405} {"train_loss": -26.107227325439453, "global_step": 365622, "epoch": 4405} {"train_loss": -26.30694007873535, "global_step": 365623, "epoch": 4405} {"train_loss": -26.261022567749023, "global_step": 365624, "epoch": 4405} {"train_loss": -26.358245849609375, "global_step": 365625, "epoch": 4405} {"train_loss": -26.526960372924805, "global_step": 365626, "epoch": 4405} {"train_loss": -26.30307388305664, "global_step": 365627, "epoch": 4405} {"train_loss": -26.16652488708496, "global_step": 365628, "epoch": 4405} {"train_loss": -26.45440101623535, "global_step": 365629, "epoch": 4405} {"train_loss": -26.26190185546875, "global_step": 365630, "epoch": 4405} {"train_loss": -26.399118423461914, "global_step": 365631, "epoch": 4405} {"train_loss": -25.983631134033203, "global_step": 365632, "epoch": 4405} {"train_loss": -26.321203231811523, "global_step": 365633, "epoch": 4405} {"train_loss": -26.447925567626953, "global_step": 365634, "epoch": 4405} {"train_loss": -26.12039566040039, "global_step": 365635, "epoch": 4405} {"train_loss": -26.59419822692871, "global_step": 365636, "epoch": 4405} {"train_loss": -26.163015365600586, "global_step": 365637, "epoch": 4405} {"train_loss": -26.277210235595703, "global_step": 365638, "epoch": 4405} {"train_loss": -26.180219650268555, "global_step": 365639, "epoch": 4405} {"train_loss": -26.566991806030273, "global_step": 365640, "epoch": 4405} {"train_loss": -26.529916763305664, "global_step": 365641, "epoch": 4405} {"train_loss": -26.16678237915039, "global_step": 365642, "epoch": 4405} {"train_loss": -26.408679962158203, "global_step": 365643, "epoch": 4405} {"train_loss": -26.015241622924805, "global_step": 365644, "epoch": 4405} {"train_loss": -26.212482452392578, "global_step": 365645, "epoch": 4405} {"train_loss": -26.237409591674805, "global_step": 365646, "epoch": 4405} {"train_loss": -26.202472686767578, "global_step": 365647, "epoch": 4405} {"train_loss": -26.188383102416992, "global_step": 365648, "epoch": 4405} {"train_loss": -26.638986587524414, "global_step": 365649, "epoch": 4405} {"train_loss": -25.985570907592773, "global_step": 365650, "epoch": 4405} {"train_loss": -26.34840202331543, "global_step": 365651, "epoch": 4405} {"train_loss": -26.12161636352539, "global_step": 365652, "epoch": 4405} {"train_loss": -26.40557861328125, "global_step": 365653, "epoch": 4405} {"train_loss": -26.3185977935791, "global_step": 365654, "epoch": 4405} {"train_loss": -26.360254287719727, "global_step": 365655, "epoch": 4405} {"train_loss": -26.433385848999023, "global_step": 365656, "epoch": 4405} {"train_loss": -26.86907958984375, "global_step": 365657, "epoch": 4405} {"train_loss": -26.256591796875, "global_step": 365658, "epoch": 4405} {"train_loss": -25.993558883666992, "global_step": 365659, "epoch": 4405} {"train_loss": -26.43049430847168, "global_step": 365660, "epoch": 4405} {"train_loss": -26.26922035217285, "global_step": 365661, "epoch": 4405} {"train_loss": -26.21067237854004, "global_step": 365662, "epoch": 4405} {"train_loss": -26.21283531188965, "global_step": 365663, "epoch": 4405} {"train_loss": -26.485157012939453, "global_step": 365664, "epoch": 4405} {"train_loss": -26.2631778717041, "global_step": 365665, "epoch": 4405} {"train_loss": -26.752471923828125, "global_step": 365666, "epoch": 4405} {"train_loss": -26.504785537719727, "global_step": 365667, "epoch": 4405} {"train_loss": -26.422962188720703, "global_step": 365668, "epoch": 4405} {"train_loss": -26.077157974243164, "global_step": 365669, "epoch": 4405} {"train_loss": -26.2752685546875, "global_step": 365670, "epoch": 4405} {"train_loss": -26.170093536376953, "global_step": 365671, "epoch": 4405} {"train_loss": -26.6324462890625, "global_step": 365672, "epoch": 4405} {"train_loss": -26.013916015625, "global_step": 365673, "epoch": 4405} {"train_loss": -26.263151168823242, "global_step": 365674, "epoch": 4405} {"train_loss": -26.200153350830078, "global_step": 365675, "epoch": 4405} {"train_loss": -26.44427490234375, "global_step": 365676, "epoch": 4405} {"train_loss": -26.385360717773438, "global_step": 365677, "epoch": 4405} {"train_loss": -26.387887954711914, "global_step": 365678, "epoch": 4405} {"train_loss": -26.1654052734375, "global_step": 365679, "epoch": 4405} {"train_loss": -26.6314697265625, "global_step": 365680, "epoch": 4405} {"train_loss": -26.506006240844727, "global_step": 365681, "epoch": 4405} {"train_loss": -26.415632247924805, "global_step": 365682, "epoch": 4405} {"train_loss": -26.40569496154785, "global_step": 365683, "epoch": 4405} {"train_loss": -26.118688583374023, "global_step": 365684, "epoch": 4405} {"train_loss": -26.32051658630371, "global_step": 365685, "epoch": 4405} {"train_loss": -26.741727828979492, "global_step": 365686, "epoch": 4405} {"train_loss": -26.321979522705078, "global_step": 365687, "epoch": 4405} {"train_loss": -26.7889347076416, "global_step": 365688, "epoch": 4405} {"train_loss": -26.384464263916016, "global_step": 365689, "epoch": 4405} {"train_loss": -26.277618408203125, "global_step": 365690, "epoch": 4405} {"train_loss": -26.368911743164062, "global_step": 365691, "epoch": 4405} {"train_loss": -26.735021591186523, "global_step": 365692, "epoch": 4405} {"train_loss": -26.334680557250977, "global_step": 365693, "epoch": 4405} {"train_loss": -26.154027938842773, "global_step": 365694, "epoch": 4405} {"train_loss": -26.57773208618164, "global_step": 365695, "epoch": 4405} {"train_loss": -26.45352554321289, "global_step": 365696, "epoch": 4405} {"train_loss": -26.325237940592938, "global_step": 365697, "epoch": 4405, "val_loss": 6501519.5} {"train_loss": -25.53700065612793, "global_step": 365698, "epoch": 4406} {"train_loss": -24.86480712890625, "global_step": 365699, "epoch": 4406} {"train_loss": -25.007247924804688, "global_step": 365700, "epoch": 4406} {"train_loss": -25.394514083862305, "global_step": 365701, "epoch": 4406} {"train_loss": -25.955617904663086, "global_step": 365702, "epoch": 4406} {"train_loss": -26.20098876953125, "global_step": 365703, "epoch": 4406} {"train_loss": -25.537683486938477, "global_step": 365704, "epoch": 4406} {"train_loss": -26.34929847717285, "global_step": 365705, "epoch": 4406} {"train_loss": -25.70087242126465, "global_step": 365706, "epoch": 4406} {"train_loss": -25.55364227294922, "global_step": 365707, "epoch": 4406} {"train_loss": -26.050128936767578, "global_step": 365708, "epoch": 4406} {"train_loss": -25.579893112182617, "global_step": 365709, "epoch": 4406} {"train_loss": -25.76118278503418, "global_step": 365710, "epoch": 4406} {"train_loss": -25.805089950561523, "global_step": 365711, "epoch": 4406} {"train_loss": -25.822834014892578, "global_step": 365712, "epoch": 4406} {"train_loss": -26.217639923095703, "global_step": 365713, "epoch": 4406} {"train_loss": -26.096466064453125, "global_step": 365714, "epoch": 4406} {"train_loss": -26.233922958374023, "global_step": 365715, "epoch": 4406} {"train_loss": -26.1584415435791, "global_step": 365716, "epoch": 4406} {"train_loss": -26.07636833190918, "global_step": 365717, "epoch": 4406} {"train_loss": -26.223127365112305, "global_step": 365718, "epoch": 4406} {"train_loss": -26.0690975189209, "global_step": 365719, "epoch": 4406} {"train_loss": -26.26792335510254, "global_step": 365720, "epoch": 4406} {"train_loss": -25.9957218170166, "global_step": 365721, "epoch": 4406} {"train_loss": -25.894285202026367, "global_step": 365722, "epoch": 4406} {"train_loss": -26.069507598876953, "global_step": 365723, "epoch": 4406} {"train_loss": -26.274564743041992, "global_step": 365724, "epoch": 4406} {"train_loss": -26.59561538696289, "global_step": 365725, "epoch": 4406} {"train_loss": -26.26801872253418, "global_step": 365726, "epoch": 4406} {"train_loss": -26.296817779541016, "global_step": 365727, "epoch": 4406} {"train_loss": -26.20393943786621, "global_step": 365728, "epoch": 4406} {"train_loss": -26.061059951782227, "global_step": 365729, "epoch": 4406} {"train_loss": -26.259180068969727, "global_step": 365730, "epoch": 4406} {"train_loss": -26.1307430267334, "global_step": 365731, "epoch": 4406} {"train_loss": -26.465961456298828, "global_step": 365732, "epoch": 4406} {"train_loss": -26.541645050048828, "global_step": 365733, "epoch": 4406} {"train_loss": -25.950204849243164, "global_step": 365734, "epoch": 4406} {"train_loss": -26.386798858642578, "global_step": 365735, "epoch": 4406} {"train_loss": -26.181249618530273, "global_step": 365736, "epoch": 4406} {"train_loss": -26.613622665405273, "global_step": 365737, "epoch": 4406} {"train_loss": -25.91057777404785, "global_step": 365738, "epoch": 4406} {"train_loss": -26.367633819580078, "global_step": 365739, "epoch": 4406} {"train_loss": -26.7298583984375, "global_step": 365740, "epoch": 4406} {"train_loss": -26.1790771484375, "global_step": 365741, "epoch": 4406} {"train_loss": -26.485809326171875, "global_step": 365742, "epoch": 4406} {"train_loss": -26.7276554107666, "global_step": 365743, "epoch": 4406} {"train_loss": -26.154870986938477, "global_step": 365744, "epoch": 4406} {"train_loss": -25.7574520111084, "global_step": 365745, "epoch": 4406} {"train_loss": -25.803115844726562, "global_step": 365746, "epoch": 4406} {"train_loss": -26.437803268432617, "global_step": 365747, "epoch": 4406} {"train_loss": -26.162145614624023, "global_step": 365748, "epoch": 4406} {"train_loss": -26.435766220092773, "global_step": 365749, "epoch": 4406} {"train_loss": -26.166507720947266, "global_step": 365750, "epoch": 4406} {"train_loss": -26.333587646484375, "global_step": 365751, "epoch": 4406} {"train_loss": -26.144287109375, "global_step": 365752, "epoch": 4406} {"train_loss": -26.32513999938965, "global_step": 365753, "epoch": 4406} {"train_loss": -26.50946044921875, "global_step": 365754, "epoch": 4406} {"train_loss": -26.4128360748291, "global_step": 365755, "epoch": 4406} {"train_loss": -26.049732208251953, "global_step": 365756, "epoch": 4406} {"train_loss": -26.36159324645996, "global_step": 365757, "epoch": 4406} {"train_loss": -26.06206703186035, "global_step": 365758, "epoch": 4406} {"train_loss": -26.32606315612793, "global_step": 365759, "epoch": 4406} {"train_loss": -26.287311553955078, "global_step": 365760, "epoch": 4406} {"train_loss": -26.46343994140625, "global_step": 365761, "epoch": 4406} {"train_loss": -26.306198120117188, "global_step": 365762, "epoch": 4406} {"train_loss": -26.458820343017578, "global_step": 365763, "epoch": 4406} {"train_loss": -26.523212432861328, "global_step": 365764, "epoch": 4406} {"train_loss": -26.407190322875977, "global_step": 365765, "epoch": 4406} {"train_loss": -26.33503532409668, "global_step": 365766, "epoch": 4406} {"train_loss": -26.49525260925293, "global_step": 365767, "epoch": 4406} {"train_loss": -26.46466064453125, "global_step": 365768, "epoch": 4406} {"train_loss": -26.441858291625977, "global_step": 365769, "epoch": 4406} {"train_loss": -26.541675567626953, "global_step": 365770, "epoch": 4406} {"train_loss": -26.4638614654541, "global_step": 365771, "epoch": 4406} {"train_loss": -26.66023063659668, "global_step": 365772, "epoch": 4406} {"train_loss": -26.516977310180664, "global_step": 365773, "epoch": 4406} {"train_loss": -26.432600021362305, "global_step": 365774, "epoch": 4406} {"train_loss": -26.20367431640625, "global_step": 365775, "epoch": 4406} {"train_loss": -25.887903213500977, "global_step": 365776, "epoch": 4406} {"train_loss": -26.096668243408203, "global_step": 365777, "epoch": 4406} {"train_loss": -26.180377960205078, "global_step": 365778, "epoch": 4406} {"train_loss": -26.317264556884766, "global_step": 365779, "epoch": 4406} {"train_loss": -26.165871677628484, "global_step": 365780, "epoch": 4406, "val_loss": 6538933.0} {"train_loss": -25.458044052124023, "global_step": 365781, "epoch": 4407} {"train_loss": -25.22407341003418, "global_step": 365782, "epoch": 4407} {"train_loss": -25.816226959228516, "global_step": 365783, "epoch": 4407} {"train_loss": -25.839679718017578, "global_step": 365784, "epoch": 4407} {"train_loss": -26.2098331451416, "global_step": 365785, "epoch": 4407} {"train_loss": -25.586774826049805, "global_step": 365786, "epoch": 4407} {"train_loss": -25.777963638305664, "global_step": 365787, "epoch": 4407} {"train_loss": -25.574810028076172, "global_step": 365788, "epoch": 4407} {"train_loss": -25.53231430053711, "global_step": 365789, "epoch": 4407} {"train_loss": -26.080305099487305, "global_step": 365790, "epoch": 4407} {"train_loss": -25.682947158813477, "global_step": 365791, "epoch": 4407} {"train_loss": -26.009143829345703, "global_step": 365792, "epoch": 4407} {"train_loss": -26.151086807250977, "global_step": 365793, "epoch": 4407} {"train_loss": -26.11488151550293, "global_step": 365794, "epoch": 4407} {"train_loss": -26.283985137939453, "global_step": 365795, "epoch": 4407} {"train_loss": -26.225812911987305, "global_step": 365796, "epoch": 4407} {"train_loss": -26.196149826049805, "global_step": 365797, "epoch": 4407} {"train_loss": -26.38819694519043, "global_step": 365798, "epoch": 4407} {"train_loss": -26.085607528686523, "global_step": 365799, "epoch": 4407} {"train_loss": -26.41278076171875, "global_step": 365800, "epoch": 4407} {"train_loss": -26.175012588500977, "global_step": 365801, "epoch": 4407} {"train_loss": -26.34329605102539, "global_step": 365802, "epoch": 4407} {"train_loss": -25.99033546447754, "global_step": 365803, "epoch": 4407} {"train_loss": -26.34278678894043, "global_step": 365804, "epoch": 4407} {"train_loss": -26.286466598510742, "global_step": 365805, "epoch": 4407} {"train_loss": -25.99627113342285, "global_step": 365806, "epoch": 4407} {"train_loss": -25.953474044799805, "global_step": 365807, "epoch": 4407} {"train_loss": -26.158329010009766, "global_step": 365808, "epoch": 4407} {"train_loss": -26.442235946655273, "global_step": 365809, "epoch": 4407} {"train_loss": -26.6438045501709, "global_step": 365810, "epoch": 4407} {"train_loss": -26.223983764648438, "global_step": 365811, "epoch": 4407} {"train_loss": -26.19162940979004, "global_step": 365812, "epoch": 4407} {"train_loss": -26.262409210205078, "global_step": 365813, "epoch": 4407} {"train_loss": -26.4305477142334, "global_step": 365814, "epoch": 4407} {"train_loss": -26.33210563659668, "global_step": 365815, "epoch": 4407} {"train_loss": -26.28447914123535, "global_step": 365816, "epoch": 4407} {"train_loss": -26.7312068939209, "global_step": 365817, "epoch": 4407} {"train_loss": -26.326257705688477, "global_step": 365818, "epoch": 4407} {"train_loss": -26.29778480529785, "global_step": 365819, "epoch": 4407} {"train_loss": -26.12298011779785, "global_step": 365820, "epoch": 4407} {"train_loss": -26.702173233032227, "global_step": 365821, "epoch": 4407} {"train_loss": -26.110626220703125, "global_step": 365822, "epoch": 4407} {"train_loss": -26.257543563842773, "global_step": 365823, "epoch": 4407} {"train_loss": -26.38050651550293, "global_step": 365824, "epoch": 4407} {"train_loss": -26.514490127563477, "global_step": 365825, "epoch": 4407} {"train_loss": -26.440967559814453, "global_step": 365826, "epoch": 4407} {"train_loss": -26.663732528686523, "global_step": 365827, "epoch": 4407} {"train_loss": -26.322738647460938, "global_step": 365828, "epoch": 4407} {"train_loss": -26.363788604736328, "global_step": 365829, "epoch": 4407} {"train_loss": -26.39283561706543, "global_step": 365830, "epoch": 4407} {"train_loss": -26.35249900817871, "global_step": 365831, "epoch": 4407} {"train_loss": -26.070703506469727, "global_step": 365832, "epoch": 4407} {"train_loss": -26.395069122314453, "global_step": 365833, "epoch": 4407} {"train_loss": -26.514667510986328, "global_step": 365834, "epoch": 4407} {"train_loss": -26.11515235900879, "global_step": 365835, "epoch": 4407} {"train_loss": -26.0460205078125, "global_step": 365836, "epoch": 4407} {"train_loss": -26.604841232299805, "global_step": 365837, "epoch": 4407} {"train_loss": -26.572397232055664, "global_step": 365838, "epoch": 4407} {"train_loss": -26.243188858032227, "global_step": 365839, "epoch": 4407} {"train_loss": -26.15791130065918, "global_step": 365840, "epoch": 4407} {"train_loss": -26.115234375, "global_step": 365841, "epoch": 4407} {"train_loss": -26.455575942993164, "global_step": 365842, "epoch": 4407} {"train_loss": -25.94537353515625, "global_step": 365843, "epoch": 4407} {"train_loss": -26.379507064819336, "global_step": 365844, "epoch": 4407} {"train_loss": -26.350696563720703, "global_step": 365845, "epoch": 4407} {"train_loss": -25.836334228515625, "global_step": 365846, "epoch": 4407} {"train_loss": -25.90220069885254, "global_step": 365847, "epoch": 4407} {"train_loss": -25.885095596313477, "global_step": 365848, "epoch": 4407} {"train_loss": -26.144454956054688, "global_step": 365849, "epoch": 4407} {"train_loss": -25.984207153320312, "global_step": 365850, "epoch": 4407} {"train_loss": -25.95525550842285, "global_step": 365851, "epoch": 4407} {"train_loss": -26.20404052734375, "global_step": 365852, "epoch": 4407} {"train_loss": -26.058027267456055, "global_step": 365853, "epoch": 4407} {"train_loss": -25.90533447265625, "global_step": 365854, "epoch": 4407} {"train_loss": -25.81072998046875, "global_step": 365855, "epoch": 4407} {"train_loss": -25.31412696838379, "global_step": 365856, "epoch": 4407} {"train_loss": -25.8597469329834, "global_step": 365857, "epoch": 4407} {"train_loss": -26.2718563079834, "global_step": 365858, "epoch": 4407} {"train_loss": -25.73601722717285, "global_step": 365859, "epoch": 4407} {"train_loss": -26.083593368530273, "global_step": 365860, "epoch": 4407} {"train_loss": -26.21047019958496, "global_step": 365861, "epoch": 4407} {"train_loss": -26.074527740478516, "global_step": 365862, "epoch": 4407} {"train_loss": -26.153208307473058, "global_step": 365863, "epoch": 4407, "val_loss": 6587201.0} {"train_loss": -26.259658813476562, "global_step": 365864, "epoch": 4408} {"train_loss": -26.095489501953125, "global_step": 365865, "epoch": 4408} {"train_loss": -25.451353073120117, "global_step": 365866, "epoch": 4408} {"train_loss": -26.008459091186523, "global_step": 365867, "epoch": 4408} {"train_loss": -25.9208984375, "global_step": 365868, "epoch": 4408} {"train_loss": -25.764801025390625, "global_step": 365869, "epoch": 4408} {"train_loss": -26.2774658203125, "global_step": 365870, "epoch": 4408} {"train_loss": -26.0578556060791, "global_step": 365871, "epoch": 4408} {"train_loss": -25.77480125427246, "global_step": 365872, "epoch": 4408} {"train_loss": -26.130447387695312, "global_step": 365873, "epoch": 4408} {"train_loss": -26.02544593811035, "global_step": 365874, "epoch": 4408} {"train_loss": -25.917272567749023, "global_step": 365875, "epoch": 4408} {"train_loss": -26.05317497253418, "global_step": 365876, "epoch": 4408} {"train_loss": -26.07535171508789, "global_step": 365877, "epoch": 4408} {"train_loss": -25.986677169799805, "global_step": 365878, "epoch": 4408} {"train_loss": -25.965087890625, "global_step": 365879, "epoch": 4408} {"train_loss": -26.451953887939453, "global_step": 365880, "epoch": 4408} {"train_loss": -26.323144912719727, "global_step": 365881, "epoch": 4408} {"train_loss": -26.340085983276367, "global_step": 365882, "epoch": 4408} {"train_loss": -26.285369873046875, "global_step": 365883, "epoch": 4408} {"train_loss": -26.126880645751953, "global_step": 365884, "epoch": 4408} {"train_loss": -26.32010841369629, "global_step": 365885, "epoch": 4408} {"train_loss": -26.29828453063965, "global_step": 365886, "epoch": 4408} {"train_loss": -26.39222526550293, "global_step": 365887, "epoch": 4408} {"train_loss": -26.191640853881836, "global_step": 365888, "epoch": 4408} {"train_loss": -26.186389923095703, "global_step": 365889, "epoch": 4408} {"train_loss": -26.56972312927246, "global_step": 365890, "epoch": 4408} {"train_loss": -26.66702651977539, "global_step": 365891, "epoch": 4408} {"train_loss": -26.355396270751953, "global_step": 365892, "epoch": 4408} {"train_loss": -25.99100685119629, "global_step": 365893, "epoch": 4408} {"train_loss": -26.123743057250977, "global_step": 365894, "epoch": 4408} {"train_loss": -26.5776424407959, "global_step": 365895, "epoch": 4408} {"train_loss": -26.442651748657227, "global_step": 365896, "epoch": 4408} {"train_loss": -26.128925323486328, "global_step": 365897, "epoch": 4408} {"train_loss": -26.101179122924805, "global_step": 365898, "epoch": 4408} {"train_loss": -26.244306564331055, "global_step": 365899, "epoch": 4408} {"train_loss": -26.4467716217041, "global_step": 365900, "epoch": 4408} {"train_loss": -26.408491134643555, "global_step": 365901, "epoch": 4408} {"train_loss": -26.122323989868164, "global_step": 365902, "epoch": 4408} {"train_loss": -26.477344512939453, "global_step": 365903, "epoch": 4408} {"train_loss": -26.50537109375, "global_step": 365904, "epoch": 4408} {"train_loss": -26.568639755249023, "global_step": 365905, "epoch": 4408} {"train_loss": -26.293354034423828, "global_step": 365906, "epoch": 4408} {"train_loss": -26.428913116455078, "global_step": 365907, "epoch": 4408} {"train_loss": -26.67279624938965, "global_step": 365908, "epoch": 4408} {"train_loss": -26.19417381286621, "global_step": 365909, "epoch": 4408} {"train_loss": -26.505056381225586, "global_step": 365910, "epoch": 4408} {"train_loss": -26.784223556518555, "global_step": 365911, "epoch": 4408} {"train_loss": -25.753559112548828, "global_step": 365912, "epoch": 4408} {"train_loss": -25.604516983032227, "global_step": 365913, "epoch": 4408} {"train_loss": -25.57215118408203, "global_step": 365914, "epoch": 4408} {"train_loss": -24.81202507019043, "global_step": 365915, "epoch": 4408} {"train_loss": -25.60639762878418, "global_step": 365916, "epoch": 4408} {"train_loss": -25.662137985229492, "global_step": 365917, "epoch": 4408} {"train_loss": -26.00172233581543, "global_step": 365918, "epoch": 4408} {"train_loss": -26.135334014892578, "global_step": 365919, "epoch": 4408} {"train_loss": -25.900909423828125, "global_step": 365920, "epoch": 4408} {"train_loss": -26.46369743347168, "global_step": 365921, "epoch": 4408} {"train_loss": -26.001708984375, "global_step": 365922, "epoch": 4408} {"train_loss": -26.28411865234375, "global_step": 365923, "epoch": 4408} {"train_loss": -25.823139190673828, "global_step": 365924, "epoch": 4408} {"train_loss": -26.464813232421875, "global_step": 365925, "epoch": 4408} {"train_loss": -26.057336807250977, "global_step": 365926, "epoch": 4408} {"train_loss": -26.34663200378418, "global_step": 365927, "epoch": 4408} {"train_loss": -26.168954849243164, "global_step": 365928, "epoch": 4408} {"train_loss": -26.152658462524414, "global_step": 365929, "epoch": 4408} {"train_loss": -26.092496871948242, "global_step": 365930, "epoch": 4408} {"train_loss": -26.471872329711914, "global_step": 365931, "epoch": 4408} {"train_loss": -26.22336769104004, "global_step": 365932, "epoch": 4408} {"train_loss": -26.031356811523438, "global_step": 365933, "epoch": 4408} {"train_loss": -26.32818031311035, "global_step": 365934, "epoch": 4408} {"train_loss": -26.708906173706055, "global_step": 365935, "epoch": 4408} {"train_loss": -26.502172470092773, "global_step": 365936, "epoch": 4408} {"train_loss": -26.702762603759766, "global_step": 365937, "epoch": 4408} {"train_loss": -26.28631019592285, "global_step": 365938, "epoch": 4408} {"train_loss": -26.660934448242188, "global_step": 365939, "epoch": 4408} {"train_loss": -26.304080963134766, "global_step": 365940, "epoch": 4408} {"train_loss": -26.269184112548828, "global_step": 365941, "epoch": 4408} {"train_loss": -26.361974716186523, "global_step": 365942, "epoch": 4408} {"train_loss": -26.257505416870117, "global_step": 365943, "epoch": 4408} {"train_loss": -26.517486572265625, "global_step": 365944, "epoch": 4408} {"train_loss": -26.450891494750977, "global_step": 365945, "epoch": 4408} {"train_loss": -26.20565832666604, "global_step": 365946, "epoch": 4408, "val_loss": 6512872.0} {"train_loss": -25.999170303344727, "global_step": 365947, "epoch": 4409} {"train_loss": -26.077905654907227, "global_step": 365948, "epoch": 4409} {"train_loss": -25.91001319885254, "global_step": 365949, "epoch": 4409} {"train_loss": -25.78223991394043, "global_step": 365950, "epoch": 4409} {"train_loss": -25.934293746948242, "global_step": 365951, "epoch": 4409} {"train_loss": -25.8719539642334, "global_step": 365952, "epoch": 4409} {"train_loss": -25.935443878173828, "global_step": 365953, "epoch": 4409} {"train_loss": -26.008697509765625, "global_step": 365954, "epoch": 4409} {"train_loss": -25.683988571166992, "global_step": 365955, "epoch": 4409} {"train_loss": -25.6181697845459, "global_step": 365956, "epoch": 4409} {"train_loss": -25.867475509643555, "global_step": 365957, "epoch": 4409} {"train_loss": -26.324939727783203, "global_step": 365958, "epoch": 4409} {"train_loss": -26.186132431030273, "global_step": 365959, "epoch": 4409} {"train_loss": -26.226041793823242, "global_step": 365960, "epoch": 4409} {"train_loss": -26.100866317749023, "global_step": 365961, "epoch": 4409} {"train_loss": -25.905689239501953, "global_step": 365962, "epoch": 4409} {"train_loss": -26.35701560974121, "global_step": 365963, "epoch": 4409} {"train_loss": -26.164709091186523, "global_step": 365964, "epoch": 4409} {"train_loss": -26.487043380737305, "global_step": 365965, "epoch": 4409} {"train_loss": -26.29095458984375, "global_step": 365966, "epoch": 4409} {"train_loss": -26.48236656188965, "global_step": 365967, "epoch": 4409} {"train_loss": -25.941162109375, "global_step": 365968, "epoch": 4409} {"train_loss": -26.43368911743164, "global_step": 365969, "epoch": 4409} {"train_loss": -26.4113712310791, "global_step": 365970, "epoch": 4409} {"train_loss": -26.307287216186523, "global_step": 365971, "epoch": 4409} {"train_loss": -26.2517032623291, "global_step": 365972, "epoch": 4409} {"train_loss": -26.410049438476562, "global_step": 365973, "epoch": 4409} {"train_loss": -26.274728775024414, "global_step": 365974, "epoch": 4409} {"train_loss": -26.148847579956055, "global_step": 365975, "epoch": 4409} {"train_loss": -26.353757858276367, "global_step": 365976, "epoch": 4409} {"train_loss": -26.31694984436035, "global_step": 365977, "epoch": 4409} {"train_loss": -26.324417114257812, "global_step": 365978, "epoch": 4409} {"train_loss": -26.062864303588867, "global_step": 365979, "epoch": 4409} {"train_loss": -26.143524169921875, "global_step": 365980, "epoch": 4409} {"train_loss": -26.465356826782227, "global_step": 365981, "epoch": 4409} {"train_loss": -26.17547607421875, "global_step": 365982, "epoch": 4409} {"train_loss": -26.509389877319336, "global_step": 365983, "epoch": 4409} {"train_loss": -26.11201286315918, "global_step": 365984, "epoch": 4409} {"train_loss": -26.48444938659668, "global_step": 365985, "epoch": 4409} {"train_loss": -26.58719825744629, "global_step": 365986, "epoch": 4409} {"train_loss": -26.652099609375, "global_step": 365987, "epoch": 4409} {"train_loss": -26.6412296295166, "global_step": 365988, "epoch": 4409} {"train_loss": -25.843524932861328, "global_step": 365989, "epoch": 4409} {"train_loss": -26.53318214416504, "global_step": 365990, "epoch": 4409} {"train_loss": -26.30912208557129, "global_step": 365991, "epoch": 4409} {"train_loss": -26.186767578125, "global_step": 365992, "epoch": 4409} {"train_loss": -26.217817306518555, "global_step": 365993, "epoch": 4409} {"train_loss": -25.66127586364746, "global_step": 365994, "epoch": 4409} {"train_loss": -26.644092559814453, "global_step": 365995, "epoch": 4409} {"train_loss": -26.199298858642578, "global_step": 365996, "epoch": 4409} {"train_loss": -26.436368942260742, "global_step": 365997, "epoch": 4409} {"train_loss": -26.438953399658203, "global_step": 365998, "epoch": 4409} {"train_loss": -26.35392189025879, "global_step": 365999, "epoch": 4409} {"train_loss": -26.324844360351562, "global_step": 366000, "epoch": 4409} {"train_loss": -26.607641220092773, "global_step": 366001, "epoch": 4409} {"train_loss": -25.87196159362793, "global_step": 366002, "epoch": 4409} {"train_loss": -25.7181396484375, "global_step": 366003, "epoch": 4409} {"train_loss": -26.37006187438965, "global_step": 366004, "epoch": 4409} {"train_loss": -26.127887725830078, "global_step": 366005, "epoch": 4409} {"train_loss": -26.548120498657227, "global_step": 366006, "epoch": 4409} {"train_loss": -26.47651481628418, "global_step": 366007, "epoch": 4409} {"train_loss": -26.502302169799805, "global_step": 366008, "epoch": 4409} {"train_loss": -26.941373825073242, "global_step": 366009, "epoch": 4409} {"train_loss": -26.130895614624023, "global_step": 366010, "epoch": 4409} {"train_loss": -26.235090255737305, "global_step": 366011, "epoch": 4409} {"train_loss": -26.187408447265625, "global_step": 366012, "epoch": 4409} {"train_loss": -26.34120750427246, "global_step": 366013, "epoch": 4409} {"train_loss": -26.5179386138916, "global_step": 366014, "epoch": 4409} {"train_loss": -26.46407127380371, "global_step": 366015, "epoch": 4409} {"train_loss": -26.360107421875, "global_step": 366016, "epoch": 4409} {"train_loss": -26.21337890625, "global_step": 366017, "epoch": 4409} {"train_loss": -25.858917236328125, "global_step": 366018, "epoch": 4409} {"train_loss": -26.5867977142334, "global_step": 366019, "epoch": 4409} {"train_loss": -26.449951171875, "global_step": 366020, "epoch": 4409} {"train_loss": -26.383594512939453, "global_step": 366021, "epoch": 4409} {"train_loss": -26.03366470336914, "global_step": 366022, "epoch": 4409} {"train_loss": -26.39312744140625, "global_step": 366023, "epoch": 4409} {"train_loss": -26.237775802612305, "global_step": 366024, "epoch": 4409} {"train_loss": -26.481414794921875, "global_step": 366025, "epoch": 4409} {"train_loss": -26.770238876342773, "global_step": 366026, "epoch": 4409} {"train_loss": -26.518386840820312, "global_step": 366027, "epoch": 4409} {"train_loss": -26.11457633972168, "global_step": 366028, "epoch": 4409} {"train_loss": -26.260059310729247, "global_step": 366029, "epoch": 4409, "val_loss": 6518490.0} {"train_loss": -26.0745792388916, "global_step": 366030, "epoch": 4410} {"train_loss": -25.8504581451416, "global_step": 366031, "epoch": 4410} {"train_loss": -26.064130783081055, "global_step": 366032, "epoch": 4410} {"train_loss": -25.960397720336914, "global_step": 366033, "epoch": 4410} {"train_loss": -26.033843994140625, "global_step": 366034, "epoch": 4410} {"train_loss": -26.105854034423828, "global_step": 366035, "epoch": 4410} {"train_loss": -26.01112174987793, "global_step": 366036, "epoch": 4410} {"train_loss": -26.294570922851562, "global_step": 366037, "epoch": 4410} {"train_loss": -26.38671875, "global_step": 366038, "epoch": 4410} {"train_loss": -26.62885093688965, "global_step": 366039, "epoch": 4410} {"train_loss": -26.237415313720703, "global_step": 366040, "epoch": 4410} {"train_loss": -26.08014488220215, "global_step": 366041, "epoch": 4410} {"train_loss": -26.224227905273438, "global_step": 366042, "epoch": 4410} {"train_loss": -25.87782096862793, "global_step": 366043, "epoch": 4410} {"train_loss": -26.462732315063477, "global_step": 366044, "epoch": 4410} {"train_loss": -26.531452178955078, "global_step": 366045, "epoch": 4410} {"train_loss": -25.625085830688477, "global_step": 366046, "epoch": 4410} {"train_loss": -26.5994873046875, "global_step": 366047, "epoch": 4410} {"train_loss": -26.314289093017578, "global_step": 366048, "epoch": 4410} {"train_loss": -25.797582626342773, "global_step": 366049, "epoch": 4410} {"train_loss": -26.020658493041992, "global_step": 366050, "epoch": 4410} {"train_loss": -26.356735229492188, "global_step": 366051, "epoch": 4410} {"train_loss": -26.172800064086914, "global_step": 366052, "epoch": 4410} {"train_loss": -25.991168975830078, "global_step": 366053, "epoch": 4410} {"train_loss": -26.08241844177246, "global_step": 366054, "epoch": 4410} {"train_loss": -26.275928497314453, "global_step": 366055, "epoch": 4410} {"train_loss": -25.988210678100586, "global_step": 366056, "epoch": 4410} {"train_loss": -26.49863624572754, "global_step": 366057, "epoch": 4410} {"train_loss": -26.133237838745117, "global_step": 366058, "epoch": 4410} {"train_loss": -26.5794620513916, "global_step": 366059, "epoch": 4410} {"train_loss": -26.22056007385254, "global_step": 366060, "epoch": 4410} {"train_loss": -26.068540573120117, "global_step": 366061, "epoch": 4410} {"train_loss": -25.6206111907959, "global_step": 366062, "epoch": 4410} {"train_loss": -26.595083236694336, "global_step": 366063, "epoch": 4410} {"train_loss": -26.383010864257812, "global_step": 366064, "epoch": 4410} {"train_loss": -26.27290153503418, "global_step": 366065, "epoch": 4410} {"train_loss": -26.16083335876465, "global_step": 366066, "epoch": 4410} {"train_loss": -26.160749435424805, "global_step": 366067, "epoch": 4410} {"train_loss": -26.043792724609375, "global_step": 366068, "epoch": 4410} {"train_loss": -26.38653564453125, "global_step": 366069, "epoch": 4410} {"train_loss": -26.009918212890625, "global_step": 366070, "epoch": 4410} {"train_loss": -26.37690544128418, "global_step": 366071, "epoch": 4410} {"train_loss": -26.38946533203125, "global_step": 366072, "epoch": 4410} {"train_loss": -26.521352767944336, "global_step": 366073, "epoch": 4410} {"train_loss": -26.450464248657227, "global_step": 366074, "epoch": 4410} {"train_loss": -26.47222328186035, "global_step": 366075, "epoch": 4410} {"train_loss": -26.2235107421875, "global_step": 366076, "epoch": 4410} {"train_loss": -26.10001564025879, "global_step": 366077, "epoch": 4410} {"train_loss": -26.428390502929688, "global_step": 366078, "epoch": 4410} {"train_loss": -26.490509033203125, "global_step": 366079, "epoch": 4410} {"train_loss": -26.378156661987305, "global_step": 366080, "epoch": 4410} {"train_loss": -26.477697372436523, "global_step": 366081, "epoch": 4410} {"train_loss": -26.2733154296875, "global_step": 366082, "epoch": 4410} {"train_loss": -26.621002197265625, "global_step": 366083, "epoch": 4410} {"train_loss": -26.66607093811035, "global_step": 366084, "epoch": 4410} {"train_loss": -26.347875595092773, "global_step": 366085, "epoch": 4410} {"train_loss": -26.19439125061035, "global_step": 366086, "epoch": 4410} {"train_loss": -26.4910831451416, "global_step": 366087, "epoch": 4410} {"train_loss": -26.8123722076416, "global_step": 366088, "epoch": 4410} {"train_loss": -26.448017120361328, "global_step": 366089, "epoch": 4410} {"train_loss": -26.375585556030273, "global_step": 366090, "epoch": 4410} {"train_loss": -26.5133113861084, "global_step": 366091, "epoch": 4410} {"train_loss": -26.580596923828125, "global_step": 366092, "epoch": 4410} {"train_loss": -26.694482803344727, "global_step": 366093, "epoch": 4410} {"train_loss": -26.635034561157227, "global_step": 366094, "epoch": 4410} {"train_loss": -26.209325790405273, "global_step": 366095, "epoch": 4410} {"train_loss": -26.225940704345703, "global_step": 366096, "epoch": 4410} {"train_loss": -26.067657470703125, "global_step": 366097, "epoch": 4410} {"train_loss": -26.49454116821289, "global_step": 366098, "epoch": 4410} {"train_loss": -26.018115997314453, "global_step": 366099, "epoch": 4410} {"train_loss": -25.9615478515625, "global_step": 366100, "epoch": 4410} {"train_loss": -26.246265411376953, "global_step": 366101, "epoch": 4410} {"train_loss": -26.301990509033203, "global_step": 366102, "epoch": 4410} {"train_loss": -25.926776885986328, "global_step": 366103, "epoch": 4410} {"train_loss": -26.66242790222168, "global_step": 366104, "epoch": 4410} {"train_loss": -26.3834171295166, "global_step": 366105, "epoch": 4410} {"train_loss": -26.477529525756836, "global_step": 366106, "epoch": 4410} {"train_loss": -26.301877975463867, "global_step": 366107, "epoch": 4410} {"train_loss": -26.106800079345703, "global_step": 366108, "epoch": 4410} {"train_loss": -26.7054500579834, "global_step": 366109, "epoch": 4410} {"train_loss": -25.947101593017578, "global_step": 366110, "epoch": 4410} {"train_loss": -25.953683853149414, "global_step": 366111, "epoch": 4410} {"train_loss": -26.26414094488305, "global_step": 366112, "epoch": 4410, "val_loss": 6602784.0} {"train_loss": -25.139169692993164, "global_step": 366113, "epoch": 4411} {"train_loss": -25.940582275390625, "global_step": 366114, "epoch": 4411} {"train_loss": -25.398460388183594, "global_step": 366115, "epoch": 4411} {"train_loss": -25.858625411987305, "global_step": 366116, "epoch": 4411} {"train_loss": -25.93890953063965, "global_step": 366117, "epoch": 4411} {"train_loss": -25.760343551635742, "global_step": 366118, "epoch": 4411} {"train_loss": -26.203702926635742, "global_step": 366119, "epoch": 4411} {"train_loss": -25.652379989624023, "global_step": 366120, "epoch": 4411} {"train_loss": -26.19114112854004, "global_step": 366121, "epoch": 4411} {"train_loss": -25.799779891967773, "global_step": 366122, "epoch": 4411} {"train_loss": -25.273569107055664, "global_step": 366123, "epoch": 4411} {"train_loss": -26.496801376342773, "global_step": 366124, "epoch": 4411} {"train_loss": -25.603626251220703, "global_step": 366125, "epoch": 4411} {"train_loss": -25.918933868408203, "global_step": 366126, "epoch": 4411} {"train_loss": -26.08843994140625, "global_step": 366127, "epoch": 4411} {"train_loss": -25.910497665405273, "global_step": 366128, "epoch": 4411} {"train_loss": -26.038898468017578, "global_step": 366129, "epoch": 4411} {"train_loss": -25.843088150024414, "global_step": 366130, "epoch": 4411} {"train_loss": -25.873199462890625, "global_step": 366131, "epoch": 4411} {"train_loss": -26.028213500976562, "global_step": 366132, "epoch": 4411} {"train_loss": -25.87565040588379, "global_step": 366133, "epoch": 4411} {"train_loss": -25.8099365234375, "global_step": 366134, "epoch": 4411} {"train_loss": -26.129932403564453, "global_step": 366135, "epoch": 4411} {"train_loss": -26.3273983001709, "global_step": 366136, "epoch": 4411} {"train_loss": -26.114999771118164, "global_step": 366137, "epoch": 4411} {"train_loss": -25.91670036315918, "global_step": 366138, "epoch": 4411} {"train_loss": -25.82488441467285, "global_step": 366139, "epoch": 4411} {"train_loss": -26.140356063842773, "global_step": 366140, "epoch": 4411} {"train_loss": -26.22488784790039, "global_step": 366141, "epoch": 4411} {"train_loss": -26.295520782470703, "global_step": 366142, "epoch": 4411} {"train_loss": -26.35542106628418, "global_step": 366143, "epoch": 4411} {"train_loss": -26.005420684814453, "global_step": 366144, "epoch": 4411} {"train_loss": -26.402090072631836, "global_step": 366145, "epoch": 4411} {"train_loss": -26.162511825561523, "global_step": 366146, "epoch": 4411} {"train_loss": -26.151575088500977, "global_step": 366147, "epoch": 4411} {"train_loss": -26.1968936920166, "global_step": 366148, "epoch": 4411} {"train_loss": -26.306989669799805, "global_step": 366149, "epoch": 4411} {"train_loss": -26.166400909423828, "global_step": 366150, "epoch": 4411} {"train_loss": -26.596288681030273, "global_step": 366151, "epoch": 4411} {"train_loss": -26.24152946472168, "global_step": 366152, "epoch": 4411} {"train_loss": -26.18475341796875, "global_step": 366153, "epoch": 4411} {"train_loss": -26.56307029724121, "global_step": 366154, "epoch": 4411} {"train_loss": -26.58742332458496, "global_step": 366155, "epoch": 4411} {"train_loss": -26.468769073486328, "global_step": 366156, "epoch": 4411} {"train_loss": -26.54111671447754, "global_step": 366157, "epoch": 4411} {"train_loss": -26.61873435974121, "global_step": 366158, "epoch": 4411} {"train_loss": -26.261884689331055, "global_step": 366159, "epoch": 4411} {"train_loss": -26.46058464050293, "global_step": 366160, "epoch": 4411} {"train_loss": -26.668807983398438, "global_step": 366161, "epoch": 4411} {"train_loss": -26.700397491455078, "global_step": 366162, "epoch": 4411} {"train_loss": -26.62247085571289, "global_step": 366163, "epoch": 4411} {"train_loss": -26.298765182495117, "global_step": 366164, "epoch": 4411} {"train_loss": -26.187345504760742, "global_step": 366165, "epoch": 4411} {"train_loss": -26.27515983581543, "global_step": 366166, "epoch": 4411} {"train_loss": -26.012104034423828, "global_step": 366167, "epoch": 4411} {"train_loss": -25.384859085083008, "global_step": 366168, "epoch": 4411} {"train_loss": -25.51045036315918, "global_step": 366169, "epoch": 4411} {"train_loss": -25.952722549438477, "global_step": 366170, "epoch": 4411} {"train_loss": -25.992765426635742, "global_step": 366171, "epoch": 4411} {"train_loss": -25.914356231689453, "global_step": 366172, "epoch": 4411} {"train_loss": -25.812885284423828, "global_step": 366173, "epoch": 4411} {"train_loss": -26.28181266784668, "global_step": 366174, "epoch": 4411} {"train_loss": -25.673053741455078, "global_step": 366175, "epoch": 4411} {"train_loss": -26.593067169189453, "global_step": 366176, "epoch": 4411} {"train_loss": -26.197248458862305, "global_step": 366177, "epoch": 4411} {"train_loss": -25.92816734313965, "global_step": 366178, "epoch": 4411} {"train_loss": -25.922088623046875, "global_step": 366179, "epoch": 4411} {"train_loss": -26.093591690063477, "global_step": 366180, "epoch": 4411} {"train_loss": -26.278827667236328, "global_step": 366181, "epoch": 4411} {"train_loss": -26.25225830078125, "global_step": 366182, "epoch": 4411} {"train_loss": -25.97220802307129, "global_step": 366183, "epoch": 4411} {"train_loss": -26.265050888061523, "global_step": 366184, "epoch": 4411} {"train_loss": -26.551380157470703, "global_step": 366185, "epoch": 4411} {"train_loss": -26.318317413330078, "global_step": 366186, "epoch": 4411} {"train_loss": -26.4949893951416, "global_step": 366187, "epoch": 4411} {"train_loss": -26.168838500976562, "global_step": 366188, "epoch": 4411} {"train_loss": -26.08318519592285, "global_step": 366189, "epoch": 4411} {"train_loss": -26.2147274017334, "global_step": 366190, "epoch": 4411} {"train_loss": -26.056364059448242, "global_step": 366191, "epoch": 4411} {"train_loss": -26.071027755737305, "global_step": 366192, "epoch": 4411} {"train_loss": -26.663623809814453, "global_step": 366193, "epoch": 4411} {"train_loss": -25.940231323242188, "global_step": 366194, "epoch": 4411} {"train_loss": -26.089971910040063, "global_step": 366195, "epoch": 4411, "val_loss": 6503531.0} {"train_loss": -26.509565353393555, "global_step": 366196, "epoch": 4412} {"train_loss": -25.711362838745117, "global_step": 366197, "epoch": 4412} {"train_loss": -26.099878311157227, "global_step": 366198, "epoch": 4412} {"train_loss": -26.139371871948242, "global_step": 366199, "epoch": 4412} {"train_loss": -26.13724708557129, "global_step": 366200, "epoch": 4412} {"train_loss": -26.22003746032715, "global_step": 366201, "epoch": 4412} {"train_loss": -26.237857818603516, "global_step": 366202, "epoch": 4412} {"train_loss": -26.0071964263916, "global_step": 366203, "epoch": 4412} {"train_loss": -26.248779296875, "global_step": 366204, "epoch": 4412} {"train_loss": -26.5047607421875, "global_step": 366205, "epoch": 4412} {"train_loss": -26.165515899658203, "global_step": 366206, "epoch": 4412} {"train_loss": -26.135395050048828, "global_step": 366207, "epoch": 4412} {"train_loss": -26.057464599609375, "global_step": 366208, "epoch": 4412} {"train_loss": -26.21548843383789, "global_step": 366209, "epoch": 4412} {"train_loss": -26.2448787689209, "global_step": 366210, "epoch": 4412} {"train_loss": -26.154260635375977, "global_step": 366211, "epoch": 4412} {"train_loss": -26.451688766479492, "global_step": 366212, "epoch": 4412} {"train_loss": -26.37192153930664, "global_step": 366213, "epoch": 4412} {"train_loss": -26.2645206451416, "global_step": 366214, "epoch": 4412} {"train_loss": -26.14076042175293, "global_step": 366215, "epoch": 4412} {"train_loss": -26.558256149291992, "global_step": 366216, "epoch": 4412} {"train_loss": -26.16937828063965, "global_step": 366217, "epoch": 4412} {"train_loss": -26.480884552001953, "global_step": 366218, "epoch": 4412} {"train_loss": -26.28546142578125, "global_step": 366219, "epoch": 4412} {"train_loss": -26.434423446655273, "global_step": 366220, "epoch": 4412} {"train_loss": -26.29469108581543, "global_step": 366221, "epoch": 4412} {"train_loss": -26.297590255737305, "global_step": 366222, "epoch": 4412} {"train_loss": -25.837299346923828, "global_step": 366223, "epoch": 4412} {"train_loss": -26.3892822265625, "global_step": 366224, "epoch": 4412} {"train_loss": -26.46622085571289, "global_step": 366225, "epoch": 4412} {"train_loss": -26.231693267822266, "global_step": 366226, "epoch": 4412} {"train_loss": -26.200986862182617, "global_step": 366227, "epoch": 4412} {"train_loss": -26.084217071533203, "global_step": 366228, "epoch": 4412} {"train_loss": -26.416528701782227, "global_step": 366229, "epoch": 4412} {"train_loss": -26.219451904296875, "global_step": 366230, "epoch": 4412} {"train_loss": -26.243213653564453, "global_step": 366231, "epoch": 4412} {"train_loss": -26.413501739501953, "global_step": 366232, "epoch": 4412} {"train_loss": -26.37334632873535, "global_step": 366233, "epoch": 4412} {"train_loss": -26.167760848999023, "global_step": 366234, "epoch": 4412} {"train_loss": -25.717975616455078, "global_step": 366235, "epoch": 4412} {"train_loss": -26.137805938720703, "global_step": 366236, "epoch": 4412} {"train_loss": -26.31096839904785, "global_step": 366237, "epoch": 4412} {"train_loss": -26.061767578125, "global_step": 366238, "epoch": 4412} {"train_loss": -26.084699630737305, "global_step": 366239, "epoch": 4412} {"train_loss": -26.190296173095703, "global_step": 366240, "epoch": 4412} {"train_loss": -26.21245765686035, "global_step": 366241, "epoch": 4412} {"train_loss": -25.839019775390625, "global_step": 366242, "epoch": 4412} {"train_loss": -26.057714462280273, "global_step": 366243, "epoch": 4412} {"train_loss": -26.453786849975586, "global_step": 366244, "epoch": 4412} {"train_loss": -26.11115837097168, "global_step": 366245, "epoch": 4412} {"train_loss": -26.650121688842773, "global_step": 366246, "epoch": 4412} {"train_loss": -26.266714096069336, "global_step": 366247, "epoch": 4412} {"train_loss": -26.189905166625977, "global_step": 366248, "epoch": 4412} {"train_loss": -26.451223373413086, "global_step": 366249, "epoch": 4412} {"train_loss": -26.23295021057129, "global_step": 366250, "epoch": 4412} {"train_loss": -26.325082778930664, "global_step": 366251, "epoch": 4412} {"train_loss": -26.407917022705078, "global_step": 366252, "epoch": 4412} {"train_loss": -26.65265464782715, "global_step": 366253, "epoch": 4412} {"train_loss": -26.341552734375, "global_step": 366254, "epoch": 4412} {"train_loss": -26.35967445373535, "global_step": 366255, "epoch": 4412} {"train_loss": -26.434736251831055, "global_step": 366256, "epoch": 4412} {"train_loss": -26.41168212890625, "global_step": 366257, "epoch": 4412} {"train_loss": -26.14576530456543, "global_step": 366258, "epoch": 4412} {"train_loss": -26.60239028930664, "global_step": 366259, "epoch": 4412} {"train_loss": -26.60719108581543, "global_step": 366260, "epoch": 4412} {"train_loss": -26.186756134033203, "global_step": 366261, "epoch": 4412} {"train_loss": -26.63870620727539, "global_step": 366262, "epoch": 4412} {"train_loss": -26.346637725830078, "global_step": 366263, "epoch": 4412} {"train_loss": -26.686017990112305, "global_step": 366264, "epoch": 4412} {"train_loss": -26.725082397460938, "global_step": 366265, "epoch": 4412} {"train_loss": -26.48724937438965, "global_step": 366266, "epoch": 4412} {"train_loss": -26.199146270751953, "global_step": 366267, "epoch": 4412} {"train_loss": -25.99519157409668, "global_step": 366268, "epoch": 4412} {"train_loss": -26.01570701599121, "global_step": 366269, "epoch": 4412} {"train_loss": -26.468170166015625, "global_step": 366270, "epoch": 4412} {"train_loss": -26.29610252380371, "global_step": 366271, "epoch": 4412} {"train_loss": -26.304458618164062, "global_step": 366272, "epoch": 4412} {"train_loss": -26.58709144592285, "global_step": 366273, "epoch": 4412} {"train_loss": -26.601343154907227, "global_step": 366274, "epoch": 4412} {"train_loss": -26.142492294311523, "global_step": 366275, "epoch": 4412} {"train_loss": -26.65814781188965, "global_step": 366276, "epoch": 4412} {"train_loss": -26.304479598999023, "global_step": 366277, "epoch": 4412} {"train_loss": -26.292660632765436, "global_step": 366278, "epoch": 4412, "val_loss": 6555923.0} {"train_loss": -25.526121139526367, "global_step": 366279, "epoch": 4413} {"train_loss": -24.916860580444336, "global_step": 366280, "epoch": 4413} {"train_loss": -25.184329986572266, "global_step": 366281, "epoch": 4413} {"train_loss": -25.599695205688477, "global_step": 366282, "epoch": 4413} {"train_loss": -25.642536163330078, "global_step": 366283, "epoch": 4413} {"train_loss": -25.46050453186035, "global_step": 366284, "epoch": 4413} {"train_loss": -25.084745407104492, "global_step": 366285, "epoch": 4413} {"train_loss": -26.080188751220703, "global_step": 366286, "epoch": 4413} {"train_loss": -25.3781795501709, "global_step": 366287, "epoch": 4413} {"train_loss": -25.66839599609375, "global_step": 366288, "epoch": 4413} {"train_loss": -26.064001083374023, "global_step": 366289, "epoch": 4413} {"train_loss": -25.471128463745117, "global_step": 366290, "epoch": 4413} {"train_loss": -26.1165714263916, "global_step": 366291, "epoch": 4413} {"train_loss": -26.04839515686035, "global_step": 366292, "epoch": 4413} {"train_loss": -25.837080001831055, "global_step": 366293, "epoch": 4413} {"train_loss": -25.88067054748535, "global_step": 366294, "epoch": 4413} {"train_loss": -25.891666412353516, "global_step": 366295, "epoch": 4413} {"train_loss": -26.028564453125, "global_step": 366296, "epoch": 4413} {"train_loss": -26.10194206237793, "global_step": 366297, "epoch": 4413} {"train_loss": -26.125659942626953, "global_step": 366298, "epoch": 4413} {"train_loss": -25.981521606445312, "global_step": 366299, "epoch": 4413} {"train_loss": -25.86382484436035, "global_step": 366300, "epoch": 4413} {"train_loss": -26.106733322143555, "global_step": 366301, "epoch": 4413} {"train_loss": -26.126474380493164, "global_step": 366302, "epoch": 4413} {"train_loss": -26.161697387695312, "global_step": 366303, "epoch": 4413} {"train_loss": -25.998926162719727, "global_step": 366304, "epoch": 4413} {"train_loss": -25.991607666015625, "global_step": 366305, "epoch": 4413} {"train_loss": -26.6208553314209, "global_step": 366306, "epoch": 4413} {"train_loss": -25.817747116088867, "global_step": 366307, "epoch": 4413} {"train_loss": -26.136838912963867, "global_step": 366308, "epoch": 4413} {"train_loss": -26.634790420532227, "global_step": 366309, "epoch": 4413} {"train_loss": -26.478300094604492, "global_step": 366310, "epoch": 4413} {"train_loss": -26.495248794555664, "global_step": 366311, "epoch": 4413} {"train_loss": -26.589385986328125, "global_step": 366312, "epoch": 4413} {"train_loss": -26.36640739440918, "global_step": 366313, "epoch": 4413} {"train_loss": -26.242664337158203, "global_step": 366314, "epoch": 4413} {"train_loss": -26.964588165283203, "global_step": 366315, "epoch": 4413} {"train_loss": -26.29731559753418, "global_step": 366316, "epoch": 4413} {"train_loss": -26.61515235900879, "global_step": 366317, "epoch": 4413} {"train_loss": -26.207677841186523, "global_step": 366318, "epoch": 4413} {"train_loss": -26.9652042388916, "global_step": 366319, "epoch": 4413} {"train_loss": -26.450132369995117, "global_step": 366320, "epoch": 4413} {"train_loss": -26.631132125854492, "global_step": 366321, "epoch": 4413} {"train_loss": -26.387149810791016, "global_step": 366322, "epoch": 4413} {"train_loss": -26.436487197875977, "global_step": 366323, "epoch": 4413} {"train_loss": -26.562097549438477, "global_step": 366324, "epoch": 4413} {"train_loss": -26.90046501159668, "global_step": 366325, "epoch": 4413} {"train_loss": -26.636768341064453, "global_step": 366326, "epoch": 4413} {"train_loss": -26.489532470703125, "global_step": 366327, "epoch": 4413} {"train_loss": -26.284637451171875, "global_step": 366328, "epoch": 4413} {"train_loss": -26.603626251220703, "global_step": 366329, "epoch": 4413} {"train_loss": -26.46771240234375, "global_step": 366330, "epoch": 4413} {"train_loss": -26.38522720336914, "global_step": 366331, "epoch": 4413} {"train_loss": -26.457441329956055, "global_step": 366332, "epoch": 4413} {"train_loss": -26.275543212890625, "global_step": 366333, "epoch": 4413} {"train_loss": -26.086652755737305, "global_step": 366334, "epoch": 4413} {"train_loss": -26.458789825439453, "global_step": 366335, "epoch": 4413} {"train_loss": -26.38238525390625, "global_step": 366336, "epoch": 4413} {"train_loss": -26.316486358642578, "global_step": 366337, "epoch": 4413} {"train_loss": -26.2932186126709, "global_step": 366338, "epoch": 4413} {"train_loss": -26.046878814697266, "global_step": 366339, "epoch": 4413} {"train_loss": -26.584228515625, "global_step": 366340, "epoch": 4413} {"train_loss": -26.431243896484375, "global_step": 366341, "epoch": 4413} {"train_loss": -25.980741500854492, "global_step": 366342, "epoch": 4413} {"train_loss": -26.03891372680664, "global_step": 366343, "epoch": 4413} {"train_loss": -26.500640869140625, "global_step": 366344, "epoch": 4413} {"train_loss": -26.33979606628418, "global_step": 366345, "epoch": 4413} {"train_loss": -26.506027221679688, "global_step": 366346, "epoch": 4413} {"train_loss": -26.08295249938965, "global_step": 366347, "epoch": 4413} {"train_loss": -25.995895385742188, "global_step": 366348, "epoch": 4413} {"train_loss": -26.520496368408203, "global_step": 366349, "epoch": 4413} {"train_loss": -26.458112716674805, "global_step": 366350, "epoch": 4413} {"train_loss": -26.073822021484375, "global_step": 366351, "epoch": 4413} {"train_loss": -25.735248565673828, "global_step": 366352, "epoch": 4413} {"train_loss": -25.878955841064453, "global_step": 366353, "epoch": 4413} {"train_loss": -26.0357666015625, "global_step": 366354, "epoch": 4413} {"train_loss": -26.084197998046875, "global_step": 366355, "epoch": 4413} {"train_loss": -26.010101318359375, "global_step": 366356, "epoch": 4413} {"train_loss": -25.792102813720703, "global_step": 366357, "epoch": 4413} {"train_loss": -26.11195182800293, "global_step": 366358, "epoch": 4413} {"train_loss": -26.30512046813965, "global_step": 366359, "epoch": 4413} {"train_loss": -26.436721801757812, "global_step": 366360, "epoch": 4413} {"train_loss": -26.156495220689887, "global_step": 366361, "epoch": 4413, "val_loss": 6546481.0} {"train_loss": -25.410375595092773, "global_step": 366362, "epoch": 4414} {"train_loss": -25.827505111694336, "global_step": 366363, "epoch": 4414} {"train_loss": -26.020715713500977, "global_step": 366364, "epoch": 4414} {"train_loss": -26.264623641967773, "global_step": 366365, "epoch": 4414} {"train_loss": -25.859140396118164, "global_step": 366366, "epoch": 4414} {"train_loss": -26.094629287719727, "global_step": 366367, "epoch": 4414} {"train_loss": -25.983108520507812, "global_step": 366368, "epoch": 4414} {"train_loss": -25.795013427734375, "global_step": 366369, "epoch": 4414} {"train_loss": -26.14544105529785, "global_step": 366370, "epoch": 4414} {"train_loss": -25.928455352783203, "global_step": 366371, "epoch": 4414} {"train_loss": -25.814207077026367, "global_step": 366372, "epoch": 4414} {"train_loss": -25.76580810546875, "global_step": 366373, "epoch": 4414} {"train_loss": -25.87857437133789, "global_step": 366374, "epoch": 4414} {"train_loss": -26.087982177734375, "global_step": 366375, "epoch": 4414} {"train_loss": -26.0228271484375, "global_step": 366376, "epoch": 4414} {"train_loss": -26.076101303100586, "global_step": 366377, "epoch": 4414} {"train_loss": -26.5333194732666, "global_step": 366378, "epoch": 4414} {"train_loss": -26.374364852905273, "global_step": 366379, "epoch": 4414} {"train_loss": -26.168781280517578, "global_step": 366380, "epoch": 4414} {"train_loss": -26.542285919189453, "global_step": 366381, "epoch": 4414} {"train_loss": -26.073774337768555, "global_step": 366382, "epoch": 4414} {"train_loss": -25.93511390686035, "global_step": 366383, "epoch": 4414} {"train_loss": -26.34296989440918, "global_step": 366384, "epoch": 4414} {"train_loss": -26.336149215698242, "global_step": 366385, "epoch": 4414} {"train_loss": -26.136640548706055, "global_step": 366386, "epoch": 4414} {"train_loss": -26.32541847229004, "global_step": 366387, "epoch": 4414} {"train_loss": -25.921789169311523, "global_step": 366388, "epoch": 4414} {"train_loss": -26.358060836791992, "global_step": 366389, "epoch": 4414} {"train_loss": -26.352170944213867, "global_step": 366390, "epoch": 4414} {"train_loss": -26.3505802154541, "global_step": 366391, "epoch": 4414} {"train_loss": -25.971296310424805, "global_step": 366392, "epoch": 4414} {"train_loss": -26.673084259033203, "global_step": 366393, "epoch": 4414} {"train_loss": -26.632110595703125, "global_step": 366394, "epoch": 4414} {"train_loss": -25.8934326171875, "global_step": 366395, "epoch": 4414} {"train_loss": -26.46913719177246, "global_step": 366396, "epoch": 4414} {"train_loss": -26.13262939453125, "global_step": 366397, "epoch": 4414} {"train_loss": -26.560546875, "global_step": 366398, "epoch": 4414} {"train_loss": -26.325597763061523, "global_step": 366399, "epoch": 4414} {"train_loss": -26.58027458190918, "global_step": 366400, "epoch": 4414} {"train_loss": -26.431854248046875, "global_step": 366401, "epoch": 4414} {"train_loss": -26.52984046936035, "global_step": 366402, "epoch": 4414} {"train_loss": -26.390058517456055, "global_step": 366403, "epoch": 4414} {"train_loss": -26.8301944732666, "global_step": 366404, "epoch": 4414} {"train_loss": -26.743988037109375, "global_step": 366405, "epoch": 4414} {"train_loss": -26.572158813476562, "global_step": 366406, "epoch": 4414} {"train_loss": -26.23768424987793, "global_step": 366407, "epoch": 4414} {"train_loss": -26.507770538330078, "global_step": 366408, "epoch": 4414} {"train_loss": -26.76023292541504, "global_step": 366409, "epoch": 4414} {"train_loss": -26.80877113342285, "global_step": 366410, "epoch": 4414} {"train_loss": -26.07441520690918, "global_step": 366411, "epoch": 4414} {"train_loss": -26.341339111328125, "global_step": 366412, "epoch": 4414} {"train_loss": -26.08917236328125, "global_step": 366413, "epoch": 4414} {"train_loss": -26.593036651611328, "global_step": 366414, "epoch": 4414} {"train_loss": -26.215240478515625, "global_step": 366415, "epoch": 4414} {"train_loss": -26.397192001342773, "global_step": 366416, "epoch": 4414} {"train_loss": -26.513336181640625, "global_step": 366417, "epoch": 4414} {"train_loss": -26.500986099243164, "global_step": 366418, "epoch": 4414} {"train_loss": -25.973840713500977, "global_step": 366419, "epoch": 4414} {"train_loss": -26.388547897338867, "global_step": 366420, "epoch": 4414} {"train_loss": -26.195783615112305, "global_step": 366421, "epoch": 4414} {"train_loss": -26.634313583374023, "global_step": 366422, "epoch": 4414} {"train_loss": -26.564453125, "global_step": 366423, "epoch": 4414} {"train_loss": -26.14356803894043, "global_step": 366424, "epoch": 4414} {"train_loss": -26.61028480529785, "global_step": 366425, "epoch": 4414} {"train_loss": -26.501569747924805, "global_step": 366426, "epoch": 4414} {"train_loss": -26.398283004760742, "global_step": 366427, "epoch": 4414} {"train_loss": -26.06792640686035, "global_step": 366428, "epoch": 4414} {"train_loss": -26.1297664642334, "global_step": 366429, "epoch": 4414} {"train_loss": -26.153701782226562, "global_step": 366430, "epoch": 4414} {"train_loss": -26.221166610717773, "global_step": 366431, "epoch": 4414} {"train_loss": -26.29429054260254, "global_step": 366432, "epoch": 4414} {"train_loss": -26.49226951599121, "global_step": 366433, "epoch": 4414} {"train_loss": -26.318586349487305, "global_step": 366434, "epoch": 4414} {"train_loss": -26.799863815307617, "global_step": 366435, "epoch": 4414} {"train_loss": -26.844762802124023, "global_step": 366436, "epoch": 4414} {"train_loss": -26.44697380065918, "global_step": 366437, "epoch": 4414} {"train_loss": -26.45619010925293, "global_step": 366438, "epoch": 4414} {"train_loss": -26.46063804626465, "global_step": 366439, "epoch": 4414} {"train_loss": -26.34796142578125, "global_step": 366440, "epoch": 4414} {"train_loss": -26.415327072143555, "global_step": 366441, "epoch": 4414} {"train_loss": -26.18012046813965, "global_step": 366442, "epoch": 4414} {"train_loss": -26.275114059448242, "global_step": 366443, "epoch": 4414} {"train_loss": -26.290091755878496, "global_step": 366444, "epoch": 4414, "val_loss": 6492794.0} {"train_loss": -25.0340576171875, "global_step": 366445, "epoch": 4415} {"train_loss": -24.726255416870117, "global_step": 366446, "epoch": 4415} {"train_loss": -25.403457641601562, "global_step": 366447, "epoch": 4415} {"train_loss": -25.632816314697266, "global_step": 366448, "epoch": 4415} {"train_loss": -25.5670223236084, "global_step": 366449, "epoch": 4415} {"train_loss": -25.17549705505371, "global_step": 366450, "epoch": 4415} {"train_loss": -25.437055587768555, "global_step": 366451, "epoch": 4415} {"train_loss": -25.3256778717041, "global_step": 366452, "epoch": 4415} {"train_loss": -25.56443214416504, "global_step": 366453, "epoch": 4415} {"train_loss": -26.355606079101562, "global_step": 366454, "epoch": 4415} {"train_loss": -25.709802627563477, "global_step": 366455, "epoch": 4415} {"train_loss": -25.930042266845703, "global_step": 366456, "epoch": 4415} {"train_loss": -25.884693145751953, "global_step": 366457, "epoch": 4415} {"train_loss": -25.697967529296875, "global_step": 366458, "epoch": 4415} {"train_loss": -25.906660079956055, "global_step": 366459, "epoch": 4415} {"train_loss": -25.508432388305664, "global_step": 366460, "epoch": 4415} {"train_loss": -26.146514892578125, "global_step": 366461, "epoch": 4415} {"train_loss": -26.011022567749023, "global_step": 366462, "epoch": 4415} {"train_loss": -26.05840492248535, "global_step": 366463, "epoch": 4415} {"train_loss": -25.75374412536621, "global_step": 366464, "epoch": 4415} {"train_loss": -26.35614585876465, "global_step": 366465, "epoch": 4415} {"train_loss": -25.992935180664062, "global_step": 366466, "epoch": 4415} {"train_loss": -26.139617919921875, "global_step": 366467, "epoch": 4415} {"train_loss": -25.938568115234375, "global_step": 366468, "epoch": 4415} {"train_loss": -25.99542808532715, "global_step": 366469, "epoch": 4415} {"train_loss": -26.200321197509766, "global_step": 366470, "epoch": 4415} {"train_loss": -26.465667724609375, "global_step": 366471, "epoch": 4415} {"train_loss": -26.1812744140625, "global_step": 366472, "epoch": 4415} {"train_loss": -26.476032257080078, "global_step": 366473, "epoch": 4415} {"train_loss": -26.228612899780273, "global_step": 366474, "epoch": 4415} {"train_loss": -26.75321388244629, "global_step": 366475, "epoch": 4415} {"train_loss": -26.48008155822754, "global_step": 366476, "epoch": 4415} {"train_loss": -26.304595947265625, "global_step": 366477, "epoch": 4415} {"train_loss": -26.384557723999023, "global_step": 366478, "epoch": 4415} {"train_loss": -26.13991355895996, "global_step": 366479, "epoch": 4415} {"train_loss": -26.13654899597168, "global_step": 366480, "epoch": 4415} {"train_loss": -26.26832389831543, "global_step": 366481, "epoch": 4415} {"train_loss": -26.5674991607666, "global_step": 366482, "epoch": 4415} {"train_loss": -26.381855010986328, "global_step": 366483, "epoch": 4415} {"train_loss": -26.47955322265625, "global_step": 366484, "epoch": 4415} {"train_loss": -26.310766220092773, "global_step": 366485, "epoch": 4415} {"train_loss": -27.088422775268555, "global_step": 366486, "epoch": 4415} {"train_loss": -26.368932723999023, "global_step": 366487, "epoch": 4415} {"train_loss": -27.074243545532227, "global_step": 366488, "epoch": 4415} {"train_loss": -26.632129669189453, "global_step": 366489, "epoch": 4415} {"train_loss": -26.397924423217773, "global_step": 366490, "epoch": 4415} {"train_loss": -26.19891357421875, "global_step": 366491, "epoch": 4415} {"train_loss": -26.049718856811523, "global_step": 366492, "epoch": 4415} {"train_loss": -25.507410049438477, "global_step": 366493, "epoch": 4415} {"train_loss": -25.997716903686523, "global_step": 366494, "epoch": 4415} {"train_loss": -26.44607925415039, "global_step": 366495, "epoch": 4415} {"train_loss": -26.17072868347168, "global_step": 366496, "epoch": 4415} {"train_loss": -25.974180221557617, "global_step": 366497, "epoch": 4415} {"train_loss": -26.453779220581055, "global_step": 366498, "epoch": 4415} {"train_loss": -26.151723861694336, "global_step": 366499, "epoch": 4415} {"train_loss": -26.369176864624023, "global_step": 366500, "epoch": 4415} {"train_loss": -26.159576416015625, "global_step": 366501, "epoch": 4415} {"train_loss": -26.43787956237793, "global_step": 366502, "epoch": 4415} {"train_loss": -26.294485092163086, "global_step": 366503, "epoch": 4415} {"train_loss": -25.90700340270996, "global_step": 366504, "epoch": 4415} {"train_loss": -26.15645408630371, "global_step": 366505, "epoch": 4415} {"train_loss": -26.288543701171875, "global_step": 366506, "epoch": 4415} {"train_loss": -25.9775333404541, "global_step": 366507, "epoch": 4415} {"train_loss": -26.3749942779541, "global_step": 366508, "epoch": 4415} {"train_loss": -26.37757682800293, "global_step": 366509, "epoch": 4415} {"train_loss": -26.038604736328125, "global_step": 366510, "epoch": 4415} {"train_loss": -26.163671493530273, "global_step": 366511, "epoch": 4415} {"train_loss": -26.1016902923584, "global_step": 366512, "epoch": 4415} {"train_loss": -26.20778465270996, "global_step": 366513, "epoch": 4415} {"train_loss": -26.00922203063965, "global_step": 366514, "epoch": 4415} {"train_loss": -26.52583122253418, "global_step": 366515, "epoch": 4415} {"train_loss": -25.83747673034668, "global_step": 366516, "epoch": 4415} {"train_loss": -26.432676315307617, "global_step": 366517, "epoch": 4415} {"train_loss": -26.751636505126953, "global_step": 366518, "epoch": 4415} {"train_loss": -26.842416763305664, "global_step": 366519, "epoch": 4415} {"train_loss": -26.563013076782227, "global_step": 366520, "epoch": 4415} {"train_loss": -26.7474308013916, "global_step": 366521, "epoch": 4415} {"train_loss": -26.2958984375, "global_step": 366522, "epoch": 4415} {"train_loss": -26.52888298034668, "global_step": 366523, "epoch": 4415} {"train_loss": -26.224225997924805, "global_step": 366524, "epoch": 4415} {"train_loss": -26.521162033081055, "global_step": 366525, "epoch": 4415} {"train_loss": -26.694738388061523, "global_step": 366526, "epoch": 4415} {"train_loss": -26.146897212568536, "global_step": 366527, "epoch": 4415, "val_loss": 6494282.5} {"train_loss": -25.152193069458008, "global_step": 366528, "epoch": 4416} {"train_loss": -25.28846549987793, "global_step": 366529, "epoch": 4416} {"train_loss": -25.54800033569336, "global_step": 366530, "epoch": 4416} {"train_loss": -25.989627838134766, "global_step": 366531, "epoch": 4416} {"train_loss": -25.27510643005371, "global_step": 366532, "epoch": 4416} {"train_loss": -25.061002731323242, "global_step": 366533, "epoch": 4416} {"train_loss": -25.233673095703125, "global_step": 366534, "epoch": 4416} {"train_loss": -25.950729370117188, "global_step": 366535, "epoch": 4416} {"train_loss": -25.66421890258789, "global_step": 366536, "epoch": 4416} {"train_loss": -25.73530387878418, "global_step": 366537, "epoch": 4416} {"train_loss": -25.961334228515625, "global_step": 366538, "epoch": 4416} {"train_loss": -25.72024917602539, "global_step": 366539, "epoch": 4416} {"train_loss": -25.620115280151367, "global_step": 366540, "epoch": 4416} {"train_loss": -25.9012508392334, "global_step": 366541, "epoch": 4416} {"train_loss": -26.04408073425293, "global_step": 366542, "epoch": 4416} {"train_loss": -26.047000885009766, "global_step": 366543, "epoch": 4416} {"train_loss": -26.325092315673828, "global_step": 366544, "epoch": 4416} {"train_loss": -26.050527572631836, "global_step": 366545, "epoch": 4416} {"train_loss": -25.915756225585938, "global_step": 366546, "epoch": 4416} {"train_loss": -25.85255241394043, "global_step": 366547, "epoch": 4416} {"train_loss": -26.3781795501709, "global_step": 366548, "epoch": 4416} {"train_loss": -26.12208366394043, "global_step": 366549, "epoch": 4416} {"train_loss": -25.9043025970459, "global_step": 366550, "epoch": 4416} {"train_loss": -25.950729370117188, "global_step": 366551, "epoch": 4416} {"train_loss": -26.04608726501465, "global_step": 366552, "epoch": 4416} {"train_loss": -25.552961349487305, "global_step": 366553, "epoch": 4416} {"train_loss": -26.040130615234375, "global_step": 366554, "epoch": 4416} {"train_loss": -26.281848907470703, "global_step": 366555, "epoch": 4416} {"train_loss": -25.94439697265625, "global_step": 366556, "epoch": 4416} {"train_loss": -26.37489128112793, "global_step": 366557, "epoch": 4416} {"train_loss": -26.079065322875977, "global_step": 366558, "epoch": 4416} {"train_loss": -26.247114181518555, "global_step": 366559, "epoch": 4416} {"train_loss": -26.457361221313477, "global_step": 366560, "epoch": 4416} {"train_loss": -26.157384872436523, "global_step": 366561, "epoch": 4416} {"train_loss": -26.56386375427246, "global_step": 366562, "epoch": 4416} {"train_loss": -25.993091583251953, "global_step": 366563, "epoch": 4416} {"train_loss": -26.527231216430664, "global_step": 366564, "epoch": 4416} {"train_loss": -26.031482696533203, "global_step": 366565, "epoch": 4416} {"train_loss": -26.37566566467285, "global_step": 366566, "epoch": 4416} {"train_loss": -26.35759925842285, "global_step": 366567, "epoch": 4416} {"train_loss": -26.4986572265625, "global_step": 366568, "epoch": 4416} {"train_loss": -26.354528427124023, "global_step": 366569, "epoch": 4416} {"train_loss": -26.5080509185791, "global_step": 366570, "epoch": 4416} {"train_loss": -26.605789184570312, "global_step": 366571, "epoch": 4416} {"train_loss": -26.447711944580078, "global_step": 366572, "epoch": 4416} {"train_loss": -26.2703857421875, "global_step": 366573, "epoch": 4416} {"train_loss": -26.525863647460938, "global_step": 366574, "epoch": 4416} {"train_loss": -26.61292839050293, "global_step": 366575, "epoch": 4416} {"train_loss": -26.534381866455078, "global_step": 366576, "epoch": 4416} {"train_loss": -26.188581466674805, "global_step": 366577, "epoch": 4416} {"train_loss": -26.281208038330078, "global_step": 366578, "epoch": 4416} {"train_loss": -25.96393394470215, "global_step": 366579, "epoch": 4416} {"train_loss": -25.867767333984375, "global_step": 366580, "epoch": 4416} {"train_loss": -26.6633243560791, "global_step": 366581, "epoch": 4416} {"train_loss": -26.199661254882812, "global_step": 366582, "epoch": 4416} {"train_loss": -25.994775772094727, "global_step": 366583, "epoch": 4416} {"train_loss": -26.321142196655273, "global_step": 366584, "epoch": 4416} {"train_loss": -26.394763946533203, "global_step": 366585, "epoch": 4416} {"train_loss": -26.158262252807617, "global_step": 366586, "epoch": 4416} {"train_loss": -26.490997314453125, "global_step": 366587, "epoch": 4416} {"train_loss": -26.3745059967041, "global_step": 366588, "epoch": 4416} {"train_loss": -26.23542594909668, "global_step": 366589, "epoch": 4416} {"train_loss": -26.68683433532715, "global_step": 366590, "epoch": 4416} {"train_loss": -26.03263282775879, "global_step": 366591, "epoch": 4416} {"train_loss": -26.152496337890625, "global_step": 366592, "epoch": 4416} {"train_loss": -26.130582809448242, "global_step": 366593, "epoch": 4416} {"train_loss": -26.576984405517578, "global_step": 366594, "epoch": 4416} {"train_loss": -26.194555282592773, "global_step": 366595, "epoch": 4416} {"train_loss": -26.62055015563965, "global_step": 366596, "epoch": 4416} {"train_loss": -26.169065475463867, "global_step": 366597, "epoch": 4416} {"train_loss": -26.4091739654541, "global_step": 366598, "epoch": 4416} {"train_loss": -26.446426391601562, "global_step": 366599, "epoch": 4416} {"train_loss": -26.305160522460938, "global_step": 366600, "epoch": 4416} {"train_loss": -25.675861358642578, "global_step": 366601, "epoch": 4416} {"train_loss": -25.873275756835938, "global_step": 366602, "epoch": 4416} {"train_loss": -26.210296630859375, "global_step": 366603, "epoch": 4416} {"train_loss": -26.366107940673828, "global_step": 366604, "epoch": 4416} {"train_loss": -26.29656410217285, "global_step": 366605, "epoch": 4416} {"train_loss": -26.268051147460938, "global_step": 366606, "epoch": 4416} {"train_loss": -26.4608097076416, "global_step": 366607, "epoch": 4416} {"train_loss": -26.17067527770996, "global_step": 366608, "epoch": 4416} {"train_loss": -26.524805068969727, "global_step": 366609, "epoch": 4416} {"train_loss": -26.11069996385689, "global_step": 366610, "epoch": 4416, "val_loss": 6646724.0} {"train_loss": -25.842416763305664, "global_step": 366611, "epoch": 4417} {"train_loss": -25.206567764282227, "global_step": 366612, "epoch": 4417} {"train_loss": -26.053741455078125, "global_step": 366613, "epoch": 4417} {"train_loss": -25.347227096557617, "global_step": 366614, "epoch": 4417} {"train_loss": -25.329374313354492, "global_step": 366615, "epoch": 4417} {"train_loss": -24.8920955657959, "global_step": 366616, "epoch": 4417} {"train_loss": -25.397659301757812, "global_step": 366617, "epoch": 4417} {"train_loss": -25.614805221557617, "global_step": 366618, "epoch": 4417} {"train_loss": -25.949155807495117, "global_step": 366619, "epoch": 4417} {"train_loss": -25.336679458618164, "global_step": 366620, "epoch": 4417} {"train_loss": -25.47650718688965, "global_step": 366621, "epoch": 4417} {"train_loss": -25.13908576965332, "global_step": 366622, "epoch": 4417} {"train_loss": -25.6032772064209, "global_step": 366623, "epoch": 4417} {"train_loss": -25.650476455688477, "global_step": 366624, "epoch": 4417} {"train_loss": -25.94410514831543, "global_step": 366625, "epoch": 4417} {"train_loss": -25.413400650024414, "global_step": 366626, "epoch": 4417} {"train_loss": -25.595434188842773, "global_step": 366627, "epoch": 4417} {"train_loss": -25.901914596557617, "global_step": 366628, "epoch": 4417} {"train_loss": -25.766843795776367, "global_step": 366629, "epoch": 4417} {"train_loss": -26.0858211517334, "global_step": 366630, "epoch": 4417} {"train_loss": -25.789499282836914, "global_step": 366631, "epoch": 4417} {"train_loss": -25.743680953979492, "global_step": 366632, "epoch": 4417} {"train_loss": -25.806049346923828, "global_step": 366633, "epoch": 4417} {"train_loss": -25.931629180908203, "global_step": 366634, "epoch": 4417} {"train_loss": -26.066349029541016, "global_step": 366635, "epoch": 4417} {"train_loss": -25.972497940063477, "global_step": 366636, "epoch": 4417} {"train_loss": -25.997106552124023, "global_step": 366637, "epoch": 4417} {"train_loss": -26.402612686157227, "global_step": 366638, "epoch": 4417} {"train_loss": -25.97086524963379, "global_step": 366639, "epoch": 4417} {"train_loss": -25.925445556640625, "global_step": 366640, "epoch": 4417} {"train_loss": -26.35371971130371, "global_step": 366641, "epoch": 4417} {"train_loss": -26.3437442779541, "global_step": 366642, "epoch": 4417} {"train_loss": -25.860830307006836, "global_step": 366643, "epoch": 4417} {"train_loss": -26.3050594329834, "global_step": 366644, "epoch": 4417} {"train_loss": -26.565195083618164, "global_step": 366645, "epoch": 4417} {"train_loss": -26.33896827697754, "global_step": 366646, "epoch": 4417} {"train_loss": -26.400449752807617, "global_step": 366647, "epoch": 4417} {"train_loss": -26.864587783813477, "global_step": 366648, "epoch": 4417} {"train_loss": -26.248865127563477, "global_step": 366649, "epoch": 4417} {"train_loss": -26.680509567260742, "global_step": 366650, "epoch": 4417} {"train_loss": -26.25754737854004, "global_step": 366651, "epoch": 4417} {"train_loss": -26.375600814819336, "global_step": 366652, "epoch": 4417} {"train_loss": -26.164920806884766, "global_step": 366653, "epoch": 4417} {"train_loss": -26.450178146362305, "global_step": 366654, "epoch": 4417} {"train_loss": -26.408674240112305, "global_step": 366655, "epoch": 4417} {"train_loss": -26.615888595581055, "global_step": 366656, "epoch": 4417} {"train_loss": -26.670495986938477, "global_step": 366657, "epoch": 4417} {"train_loss": -26.3055362701416, "global_step": 366658, "epoch": 4417} {"train_loss": -26.26445960998535, "global_step": 366659, "epoch": 4417} {"train_loss": -26.2264404296875, "global_step": 366660, "epoch": 4417} {"train_loss": -26.569324493408203, "global_step": 366661, "epoch": 4417} {"train_loss": -26.58745765686035, "global_step": 366662, "epoch": 4417} {"train_loss": -25.697803497314453, "global_step": 366663, "epoch": 4417} {"train_loss": -25.93312644958496, "global_step": 366664, "epoch": 4417} {"train_loss": -26.532608032226562, "global_step": 366665, "epoch": 4417} {"train_loss": -26.278696060180664, "global_step": 366666, "epoch": 4417} {"train_loss": -26.57712745666504, "global_step": 366667, "epoch": 4417} {"train_loss": -26.65754508972168, "global_step": 366668, "epoch": 4417} {"train_loss": -26.361234664916992, "global_step": 366669, "epoch": 4417} {"train_loss": -26.600271224975586, "global_step": 366670, "epoch": 4417} {"train_loss": -25.76053810119629, "global_step": 366671, "epoch": 4417} {"train_loss": -26.357791900634766, "global_step": 366672, "epoch": 4417} {"train_loss": -25.239042282104492, "global_step": 366673, "epoch": 4417} {"train_loss": -25.52850914001465, "global_step": 366674, "epoch": 4417} {"train_loss": -25.47418212890625, "global_step": 366675, "epoch": 4417} {"train_loss": -26.118865966796875, "global_step": 366676, "epoch": 4417} {"train_loss": -25.714649200439453, "global_step": 366677, "epoch": 4417} {"train_loss": -26.262937545776367, "global_step": 366678, "epoch": 4417} {"train_loss": -26.054214477539062, "global_step": 366679, "epoch": 4417} {"train_loss": -26.23604393005371, "global_step": 366680, "epoch": 4417} {"train_loss": -26.285364151000977, "global_step": 366681, "epoch": 4417} {"train_loss": -25.832666397094727, "global_step": 366682, "epoch": 4417} {"train_loss": -26.253116607666016, "global_step": 366683, "epoch": 4417} {"train_loss": -25.977283477783203, "global_step": 366684, "epoch": 4417} {"train_loss": -26.145837783813477, "global_step": 366685, "epoch": 4417} {"train_loss": -26.028308868408203, "global_step": 366686, "epoch": 4417} {"train_loss": -25.786935806274414, "global_step": 366687, "epoch": 4417} {"train_loss": -26.382537841796875, "global_step": 366688, "epoch": 4417} {"train_loss": -26.251708984375, "global_step": 366689, "epoch": 4417} {"train_loss": -26.301488876342773, "global_step": 366690, "epoch": 4417} {"train_loss": -26.280399322509766, "global_step": 366691, "epoch": 4417} {"train_loss": -26.434309005737305, "global_step": 366692, "epoch": 4417} {"train_loss": -26.04007339477539, "global_step": 366693, "epoch": 4417, "val_loss": 6550107.0} {"train_loss": -25.734113693237305, "global_step": 366694, "epoch": 4418} {"train_loss": -25.551511764526367, "global_step": 366695, "epoch": 4418} {"train_loss": -26.357831954956055, "global_step": 366696, "epoch": 4418} {"train_loss": -25.65021324157715, "global_step": 366697, "epoch": 4418} {"train_loss": -25.804128646850586, "global_step": 366698, "epoch": 4418} {"train_loss": -26.107086181640625, "global_step": 366699, "epoch": 4418} {"train_loss": -25.98636817932129, "global_step": 366700, "epoch": 4418} {"train_loss": -26.271249771118164, "global_step": 366701, "epoch": 4418} {"train_loss": -26.12261390686035, "global_step": 366702, "epoch": 4418} {"train_loss": -26.400257110595703, "global_step": 366703, "epoch": 4418} {"train_loss": -26.318546295166016, "global_step": 366704, "epoch": 4418} {"train_loss": -26.210046768188477, "global_step": 366705, "epoch": 4418} {"train_loss": -26.09766960144043, "global_step": 366706, "epoch": 4418} {"train_loss": -26.301008224487305, "global_step": 366707, "epoch": 4418} {"train_loss": -25.905685424804688, "global_step": 366708, "epoch": 4418} {"train_loss": -26.05438804626465, "global_step": 366709, "epoch": 4418} {"train_loss": -26.30950355529785, "global_step": 366710, "epoch": 4418} {"train_loss": -26.014434814453125, "global_step": 366711, "epoch": 4418} {"train_loss": -26.396289825439453, "global_step": 366712, "epoch": 4418} {"train_loss": -26.70273208618164, "global_step": 366713, "epoch": 4418} {"train_loss": -26.11713218688965, "global_step": 366714, "epoch": 4418} {"train_loss": -26.28169059753418, "global_step": 366715, "epoch": 4418} {"train_loss": -25.85553550720215, "global_step": 366716, "epoch": 4418} {"train_loss": -26.178668975830078, "global_step": 366717, "epoch": 4418} {"train_loss": -26.507354736328125, "global_step": 366718, "epoch": 4418} {"train_loss": -26.251331329345703, "global_step": 366719, "epoch": 4418} {"train_loss": -26.50892448425293, "global_step": 366720, "epoch": 4418} {"train_loss": -26.341693878173828, "global_step": 366721, "epoch": 4418} {"train_loss": -26.516019821166992, "global_step": 366722, "epoch": 4418} {"train_loss": -26.586050033569336, "global_step": 366723, "epoch": 4418} {"train_loss": -26.090564727783203, "global_step": 366724, "epoch": 4418} {"train_loss": -26.48463249206543, "global_step": 366725, "epoch": 4418} {"train_loss": -26.251758575439453, "global_step": 366726, "epoch": 4418} {"train_loss": -26.649795532226562, "global_step": 366727, "epoch": 4418} {"train_loss": -26.662311553955078, "global_step": 366728, "epoch": 4418} {"train_loss": -26.144729614257812, "global_step": 366729, "epoch": 4418} {"train_loss": -26.37803077697754, "global_step": 366730, "epoch": 4418} {"train_loss": -26.422515869140625, "global_step": 366731, "epoch": 4418} {"train_loss": -26.569486618041992, "global_step": 366732, "epoch": 4418} {"train_loss": -26.613943099975586, "global_step": 366733, "epoch": 4418} {"train_loss": -26.300504684448242, "global_step": 366734, "epoch": 4418} {"train_loss": -26.2165470123291, "global_step": 366735, "epoch": 4418} {"train_loss": -26.303686141967773, "global_step": 366736, "epoch": 4418} {"train_loss": -26.562177658081055, "global_step": 366737, "epoch": 4418} {"train_loss": -26.682767868041992, "global_step": 366738, "epoch": 4418} {"train_loss": -26.529199600219727, "global_step": 366739, "epoch": 4418} {"train_loss": -26.40778923034668, "global_step": 366740, "epoch": 4418} {"train_loss": -26.637781143188477, "global_step": 366741, "epoch": 4418} {"train_loss": -26.588346481323242, "global_step": 366742, "epoch": 4418} {"train_loss": -26.790502548217773, "global_step": 366743, "epoch": 4418} {"train_loss": -26.617055892944336, "global_step": 366744, "epoch": 4418} {"train_loss": -26.125701904296875, "global_step": 366745, "epoch": 4418} {"train_loss": -26.490478515625, "global_step": 366746, "epoch": 4418} {"train_loss": -26.526386260986328, "global_step": 366747, "epoch": 4418} {"train_loss": -26.63808250427246, "global_step": 366748, "epoch": 4418} {"train_loss": -26.037134170532227, "global_step": 366749, "epoch": 4418} {"train_loss": -26.232751846313477, "global_step": 366750, "epoch": 4418} {"train_loss": -26.50447654724121, "global_step": 366751, "epoch": 4418} {"train_loss": -26.682266235351562, "global_step": 366752, "epoch": 4418} {"train_loss": -26.603900909423828, "global_step": 366753, "epoch": 4418} {"train_loss": -26.29006004333496, "global_step": 366754, "epoch": 4418} {"train_loss": -26.25589942932129, "global_step": 366755, "epoch": 4418} {"train_loss": -26.006086349487305, "global_step": 366756, "epoch": 4418} {"train_loss": -26.074951171875, "global_step": 366757, "epoch": 4418} {"train_loss": -26.644262313842773, "global_step": 366758, "epoch": 4418} {"train_loss": -25.825952529907227, "global_step": 366759, "epoch": 4418} {"train_loss": -26.030506134033203, "global_step": 366760, "epoch": 4418} {"train_loss": -26.44935417175293, "global_step": 366761, "epoch": 4418} {"train_loss": -26.100095748901367, "global_step": 366762, "epoch": 4418} {"train_loss": -25.8010311126709, "global_step": 366763, "epoch": 4418} {"train_loss": -26.018054962158203, "global_step": 366764, "epoch": 4418} {"train_loss": -26.329797744750977, "global_step": 366765, "epoch": 4418} {"train_loss": -25.70119285583496, "global_step": 366766, "epoch": 4418} {"train_loss": -25.99104118347168, "global_step": 366767, "epoch": 4418} {"train_loss": -25.877485275268555, "global_step": 366768, "epoch": 4418} {"train_loss": -25.987531661987305, "global_step": 366769, "epoch": 4418} {"train_loss": -26.15189552307129, "global_step": 366770, "epoch": 4418} {"train_loss": -26.21124839782715, "global_step": 366771, "epoch": 4418} {"train_loss": -26.227582931518555, "global_step": 366772, "epoch": 4418} {"train_loss": -26.14335060119629, "global_step": 366773, "epoch": 4418} {"train_loss": -26.493200302124023, "global_step": 366774, "epoch": 4418} {"train_loss": -25.821369171142578, "global_step": 366775, "epoch": 4418} {"train_loss": -26.2702814354954, "global_step": 366776, "epoch": 4418, "val_loss": 6634868.0} {"train_loss": -26.2183895111084, "global_step": 366777, "epoch": 4419} {"train_loss": -25.62223243713379, "global_step": 366778, "epoch": 4419} {"train_loss": -25.74600601196289, "global_step": 366779, "epoch": 4419} {"train_loss": -26.151824951171875, "global_step": 366780, "epoch": 4419} {"train_loss": -25.47892189025879, "global_step": 366781, "epoch": 4419} {"train_loss": -25.776046752929688, "global_step": 366782, "epoch": 4419} {"train_loss": -25.7719783782959, "global_step": 366783, "epoch": 4419} {"train_loss": -25.564517974853516, "global_step": 366784, "epoch": 4419} {"train_loss": -26.113996505737305, "global_step": 366785, "epoch": 4419} {"train_loss": -25.587072372436523, "global_step": 366786, "epoch": 4419} {"train_loss": -25.4826717376709, "global_step": 366787, "epoch": 4419} {"train_loss": -26.213834762573242, "global_step": 366788, "epoch": 4419} {"train_loss": -26.150400161743164, "global_step": 366789, "epoch": 4419} {"train_loss": -26.21078872680664, "global_step": 366790, "epoch": 4419} {"train_loss": -25.93385124206543, "global_step": 366791, "epoch": 4419} {"train_loss": -25.905370712280273, "global_step": 366792, "epoch": 4419} {"train_loss": -25.873031616210938, "global_step": 366793, "epoch": 4419} {"train_loss": -26.208295822143555, "global_step": 366794, "epoch": 4419} {"train_loss": -26.148969650268555, "global_step": 366795, "epoch": 4419} {"train_loss": -26.212940216064453, "global_step": 366796, "epoch": 4419} {"train_loss": -25.899805068969727, "global_step": 366797, "epoch": 4419} {"train_loss": -26.0710391998291, "global_step": 366798, "epoch": 4419} {"train_loss": -26.637670516967773, "global_step": 366799, "epoch": 4419} {"train_loss": -26.148971557617188, "global_step": 366800, "epoch": 4419} {"train_loss": -26.524097442626953, "global_step": 366801, "epoch": 4419} {"train_loss": -26.350515365600586, "global_step": 366802, "epoch": 4419} {"train_loss": -26.572126388549805, "global_step": 366803, "epoch": 4419} {"train_loss": -26.5325984954834, "global_step": 366804, "epoch": 4419} {"train_loss": -26.235931396484375, "global_step": 366805, "epoch": 4419} {"train_loss": -26.43512535095215, "global_step": 366806, "epoch": 4419} {"train_loss": -26.145172119140625, "global_step": 366807, "epoch": 4419} {"train_loss": -26.090879440307617, "global_step": 366808, "epoch": 4419} {"train_loss": -26.595579147338867, "global_step": 366809, "epoch": 4419} {"train_loss": -26.240966796875, "global_step": 366810, "epoch": 4419} {"train_loss": -26.764013290405273, "global_step": 366811, "epoch": 4419} {"train_loss": -26.57050132751465, "global_step": 366812, "epoch": 4419} {"train_loss": -26.2297420501709, "global_step": 366813, "epoch": 4419} {"train_loss": -26.452619552612305, "global_step": 366814, "epoch": 4419} {"train_loss": -26.389190673828125, "global_step": 366815, "epoch": 4419} {"train_loss": -26.546899795532227, "global_step": 366816, "epoch": 4419} {"train_loss": -26.265974044799805, "global_step": 366817, "epoch": 4419} {"train_loss": -26.03277587890625, "global_step": 366818, "epoch": 4419} {"train_loss": -25.6547908782959, "global_step": 366819, "epoch": 4419} {"train_loss": -25.962244033813477, "global_step": 366820, "epoch": 4419} {"train_loss": -25.637861251831055, "global_step": 366821, "epoch": 4419} {"train_loss": -25.941991806030273, "global_step": 366822, "epoch": 4419} {"train_loss": -25.68366050720215, "global_step": 366823, "epoch": 4419} {"train_loss": -26.38747215270996, "global_step": 366824, "epoch": 4419} {"train_loss": -25.605804443359375, "global_step": 366825, "epoch": 4419} {"train_loss": -26.065460205078125, "global_step": 366826, "epoch": 4419} {"train_loss": -26.02784538269043, "global_step": 366827, "epoch": 4419} {"train_loss": -26.180429458618164, "global_step": 366828, "epoch": 4419} {"train_loss": -26.08857536315918, "global_step": 366829, "epoch": 4419} {"train_loss": -25.864013671875, "global_step": 366830, "epoch": 4419} {"train_loss": -26.462743759155273, "global_step": 366831, "epoch": 4419} {"train_loss": -26.061582565307617, "global_step": 366832, "epoch": 4419} {"train_loss": -26.56756019592285, "global_step": 366833, "epoch": 4419} {"train_loss": -26.271381378173828, "global_step": 366834, "epoch": 4419} {"train_loss": -26.137746810913086, "global_step": 366835, "epoch": 4419} {"train_loss": -26.119077682495117, "global_step": 366836, "epoch": 4419} {"train_loss": -25.753538131713867, "global_step": 366837, "epoch": 4419} {"train_loss": -26.009923934936523, "global_step": 366838, "epoch": 4419} {"train_loss": -26.1418514251709, "global_step": 366839, "epoch": 4419} {"train_loss": -26.227445602416992, "global_step": 366840, "epoch": 4419} {"train_loss": -26.211084365844727, "global_step": 366841, "epoch": 4419} {"train_loss": -25.967573165893555, "global_step": 366842, "epoch": 4419} {"train_loss": -26.459009170532227, "global_step": 366843, "epoch": 4419} {"train_loss": -25.969818115234375, "global_step": 366844, "epoch": 4419} {"train_loss": -26.41873550415039, "global_step": 366845, "epoch": 4419} {"train_loss": -26.181640625, "global_step": 366846, "epoch": 4419} {"train_loss": -26.531538009643555, "global_step": 366847, "epoch": 4419} {"train_loss": -26.364179611206055, "global_step": 366848, "epoch": 4419} {"train_loss": -26.11493492126465, "global_step": 366849, "epoch": 4419} {"train_loss": -26.56037712097168, "global_step": 366850, "epoch": 4419} {"train_loss": -26.527957916259766, "global_step": 366851, "epoch": 4419} {"train_loss": -26.381994247436523, "global_step": 366852, "epoch": 4419} {"train_loss": -26.338499069213867, "global_step": 366853, "epoch": 4419} {"train_loss": -26.426959991455078, "global_step": 366854, "epoch": 4419} {"train_loss": -26.657958984375, "global_step": 366855, "epoch": 4419} {"train_loss": -26.413543701171875, "global_step": 366856, "epoch": 4419} {"train_loss": -27.07561683654785, "global_step": 366857, "epoch": 4419} {"train_loss": -26.64515495300293, "global_step": 366858, "epoch": 4419} {"train_loss": -26.16331886383424, "global_step": 366859, "epoch": 4419, "val_loss": 6624345.0} {"train_loss": -25.477067947387695, "global_step": 366860, "epoch": 4420} {"train_loss": -25.96282958984375, "global_step": 366861, "epoch": 4420} {"train_loss": -26.142444610595703, "global_step": 366862, "epoch": 4420} {"train_loss": -25.647214889526367, "global_step": 366863, "epoch": 4420} {"train_loss": -25.958301544189453, "global_step": 366864, "epoch": 4420} {"train_loss": -26.7270565032959, "global_step": 366865, "epoch": 4420} {"train_loss": -26.146162033081055, "global_step": 366866, "epoch": 4420} {"train_loss": -26.19461441040039, "global_step": 366867, "epoch": 4420} {"train_loss": -26.011157989501953, "global_step": 366868, "epoch": 4420} {"train_loss": -26.049985885620117, "global_step": 366869, "epoch": 4420} {"train_loss": -25.93659019470215, "global_step": 366870, "epoch": 4420} {"train_loss": -25.9740047454834, "global_step": 366871, "epoch": 4420} {"train_loss": -26.358173370361328, "global_step": 366872, "epoch": 4420} {"train_loss": -26.14404296875, "global_step": 366873, "epoch": 4420} {"train_loss": -26.01630973815918, "global_step": 366874, "epoch": 4420} {"train_loss": -26.00535011291504, "global_step": 366875, "epoch": 4420} {"train_loss": -26.441268920898438, "global_step": 366876, "epoch": 4420} {"train_loss": -26.542978286743164, "global_step": 366877, "epoch": 4420} {"train_loss": -26.198516845703125, "global_step": 366878, "epoch": 4420} {"train_loss": -26.439105987548828, "global_step": 366879, "epoch": 4420} {"train_loss": -26.32497215270996, "global_step": 366880, "epoch": 4420} {"train_loss": -26.19968032836914, "global_step": 366881, "epoch": 4420} {"train_loss": -26.421112060546875, "global_step": 366882, "epoch": 4420} {"train_loss": -25.917057037353516, "global_step": 366883, "epoch": 4420} {"train_loss": -26.337228775024414, "global_step": 366884, "epoch": 4420} {"train_loss": -26.408309936523438, "global_step": 366885, "epoch": 4420} {"train_loss": -26.498403549194336, "global_step": 366886, "epoch": 4420} {"train_loss": -26.37200927734375, "global_step": 366887, "epoch": 4420} {"train_loss": -26.349288940429688, "global_step": 366888, "epoch": 4420} {"train_loss": -26.172271728515625, "global_step": 366889, "epoch": 4420} {"train_loss": -26.214801788330078, "global_step": 366890, "epoch": 4420} {"train_loss": -26.67685317993164, "global_step": 366891, "epoch": 4420} {"train_loss": -26.715728759765625, "global_step": 366892, "epoch": 4420} {"train_loss": -26.500839233398438, "global_step": 366893, "epoch": 4420} {"train_loss": -26.590042114257812, "global_step": 366894, "epoch": 4420} {"train_loss": -26.329456329345703, "global_step": 366895, "epoch": 4420} {"train_loss": -26.259601593017578, "global_step": 366896, "epoch": 4420} {"train_loss": -26.160261154174805, "global_step": 366897, "epoch": 4420} {"train_loss": -26.523944854736328, "global_step": 366898, "epoch": 4420} {"train_loss": -26.3653621673584, "global_step": 366899, "epoch": 4420} {"train_loss": -26.385313034057617, "global_step": 366900, "epoch": 4420} {"train_loss": -26.703027725219727, "global_step": 366901, "epoch": 4420} {"train_loss": -26.543415069580078, "global_step": 366902, "epoch": 4420} {"train_loss": -26.375797271728516, "global_step": 366903, "epoch": 4420} {"train_loss": -26.330224990844727, "global_step": 366904, "epoch": 4420} {"train_loss": -26.210376739501953, "global_step": 366905, "epoch": 4420} {"train_loss": -25.915969848632812, "global_step": 366906, "epoch": 4420} {"train_loss": -25.877521514892578, "global_step": 366907, "epoch": 4420} {"train_loss": -25.438371658325195, "global_step": 366908, "epoch": 4420} {"train_loss": -25.42407989501953, "global_step": 366909, "epoch": 4420} {"train_loss": -25.756622314453125, "global_step": 366910, "epoch": 4420} {"train_loss": -25.956274032592773, "global_step": 366911, "epoch": 4420} {"train_loss": -26.287988662719727, "global_step": 366912, "epoch": 4420} {"train_loss": -25.92044448852539, "global_step": 366913, "epoch": 4420} {"train_loss": -26.115692138671875, "global_step": 366914, "epoch": 4420} {"train_loss": -26.117828369140625, "global_step": 366915, "epoch": 4420} {"train_loss": -25.971364974975586, "global_step": 366916, "epoch": 4420} {"train_loss": -26.096948623657227, "global_step": 366917, "epoch": 4420} {"train_loss": -26.083831787109375, "global_step": 366918, "epoch": 4420} {"train_loss": -26.51474380493164, "global_step": 366919, "epoch": 4420} {"train_loss": -25.972265243530273, "global_step": 366920, "epoch": 4420} {"train_loss": -25.941694259643555, "global_step": 366921, "epoch": 4420} {"train_loss": -26.2872314453125, "global_step": 366922, "epoch": 4420} {"train_loss": -25.984495162963867, "global_step": 366923, "epoch": 4420} {"train_loss": -26.3005313873291, "global_step": 366924, "epoch": 4420} {"train_loss": -26.315826416015625, "global_step": 366925, "epoch": 4420} {"train_loss": -26.608245849609375, "global_step": 366926, "epoch": 4420} {"train_loss": -26.162145614624023, "global_step": 366927, "epoch": 4420} {"train_loss": -26.092878341674805, "global_step": 366928, "epoch": 4420} {"train_loss": -26.129392623901367, "global_step": 366929, "epoch": 4420} {"train_loss": -26.362272262573242, "global_step": 366930, "epoch": 4420} {"train_loss": -26.459882736206055, "global_step": 366931, "epoch": 4420} {"train_loss": -26.162267684936523, "global_step": 366932, "epoch": 4420} {"train_loss": -26.093402862548828, "global_step": 366933, "epoch": 4420} {"train_loss": -26.473791122436523, "global_step": 366934, "epoch": 4420} {"train_loss": -26.934350967407227, "global_step": 366935, "epoch": 4420} {"train_loss": -26.280420303344727, "global_step": 366936, "epoch": 4420} {"train_loss": -26.284061431884766, "global_step": 366937, "epoch": 4420} {"train_loss": -26.35407829284668, "global_step": 366938, "epoch": 4420} {"train_loss": -26.51667594909668, "global_step": 366939, "epoch": 4420} {"train_loss": -26.546777725219727, "global_step": 366940, "epoch": 4420} {"train_loss": -26.55274772644043, "global_step": 366941, "epoch": 4420} {"train_loss": -26.241087281560322, "global_step": 366942, "epoch": 4420, "val_loss": 6511025.5} {"train_loss": -25.210189819335938, "global_step": 366943, "epoch": 4421} {"train_loss": -25.864349365234375, "global_step": 366944, "epoch": 4421} {"train_loss": -25.6108341217041, "global_step": 366945, "epoch": 4421} {"train_loss": -25.632665634155273, "global_step": 366946, "epoch": 4421} {"train_loss": -26.087295532226562, "global_step": 366947, "epoch": 4421} {"train_loss": -25.990476608276367, "global_step": 366948, "epoch": 4421} {"train_loss": -25.7717227935791, "global_step": 366949, "epoch": 4421} {"train_loss": -25.592941284179688, "global_step": 366950, "epoch": 4421} {"train_loss": -25.89306640625, "global_step": 366951, "epoch": 4421} {"train_loss": -25.864734649658203, "global_step": 366952, "epoch": 4421} {"train_loss": -26.07687759399414, "global_step": 366953, "epoch": 4421} {"train_loss": -25.9427433013916, "global_step": 366954, "epoch": 4421} {"train_loss": -26.0125789642334, "global_step": 366955, "epoch": 4421} {"train_loss": -26.29829216003418, "global_step": 366956, "epoch": 4421} {"train_loss": -25.890024185180664, "global_step": 366957, "epoch": 4421} {"train_loss": -26.253660202026367, "global_step": 366958, "epoch": 4421} {"train_loss": -26.225513458251953, "global_step": 366959, "epoch": 4421} {"train_loss": -26.2453556060791, "global_step": 366960, "epoch": 4421} {"train_loss": -26.182294845581055, "global_step": 366961, "epoch": 4421} {"train_loss": -25.788549423217773, "global_step": 366962, "epoch": 4421} {"train_loss": -26.150976181030273, "global_step": 366963, "epoch": 4421} {"train_loss": -26.052753448486328, "global_step": 366964, "epoch": 4421} {"train_loss": -25.968006134033203, "global_step": 366965, "epoch": 4421} {"train_loss": -26.485248565673828, "global_step": 366966, "epoch": 4421} {"train_loss": -25.834501266479492, "global_step": 366967, "epoch": 4421} {"train_loss": -26.526655197143555, "global_step": 366968, "epoch": 4421} {"train_loss": -26.04731559753418, "global_step": 366969, "epoch": 4421} {"train_loss": -26.239477157592773, "global_step": 366970, "epoch": 4421} {"train_loss": -26.41583251953125, "global_step": 366971, "epoch": 4421} {"train_loss": -26.299116134643555, "global_step": 366972, "epoch": 4421} {"train_loss": -26.02728271484375, "global_step": 366973, "epoch": 4421} {"train_loss": -26.491479873657227, "global_step": 366974, "epoch": 4421} {"train_loss": -26.473865509033203, "global_step": 366975, "epoch": 4421} {"train_loss": -26.043867111206055, "global_step": 366976, "epoch": 4421} {"train_loss": -26.040075302124023, "global_step": 366977, "epoch": 4421} {"train_loss": -26.5949649810791, "global_step": 366978, "epoch": 4421} {"train_loss": -26.11795425415039, "global_step": 366979, "epoch": 4421} {"train_loss": -26.458471298217773, "global_step": 366980, "epoch": 4421} {"train_loss": -26.165151596069336, "global_step": 366981, "epoch": 4421} {"train_loss": -26.5563907623291, "global_step": 366982, "epoch": 4421} {"train_loss": -26.547779083251953, "global_step": 366983, "epoch": 4421} {"train_loss": -26.354658126831055, "global_step": 366984, "epoch": 4421} {"train_loss": -26.087421417236328, "global_step": 366985, "epoch": 4421} {"train_loss": -26.278461456298828, "global_step": 366986, "epoch": 4421} {"train_loss": -26.6470890045166, "global_step": 366987, "epoch": 4421} {"train_loss": -26.43899917602539, "global_step": 366988, "epoch": 4421} {"train_loss": -26.43733787536621, "global_step": 366989, "epoch": 4421} {"train_loss": -26.54448890686035, "global_step": 366990, "epoch": 4421} {"train_loss": -26.356225967407227, "global_step": 366991, "epoch": 4421} {"train_loss": -26.796661376953125, "global_step": 366992, "epoch": 4421} {"train_loss": -26.5750675201416, "global_step": 366993, "epoch": 4421} {"train_loss": -26.497175216674805, "global_step": 366994, "epoch": 4421} {"train_loss": -26.786108016967773, "global_step": 366995, "epoch": 4421} {"train_loss": -26.105642318725586, "global_step": 366996, "epoch": 4421} {"train_loss": -26.588964462280273, "global_step": 366997, "epoch": 4421} {"train_loss": -26.567121505737305, "global_step": 366998, "epoch": 4421} {"train_loss": -26.697772979736328, "global_step": 366999, "epoch": 4421} {"train_loss": -26.242511749267578, "global_step": 367000, "epoch": 4421} {"train_loss": -26.476587295532227, "global_step": 367001, "epoch": 4421} {"train_loss": -26.6707820892334, "global_step": 367002, "epoch": 4421} {"train_loss": -26.306848526000977, "global_step": 367003, "epoch": 4421} {"train_loss": -26.43934440612793, "global_step": 367004, "epoch": 4421} {"train_loss": -26.464130401611328, "global_step": 367005, "epoch": 4421} {"train_loss": -26.360050201416016, "global_step": 367006, "epoch": 4421} {"train_loss": -26.323272705078125, "global_step": 367007, "epoch": 4421} {"train_loss": -26.521947860717773, "global_step": 367008, "epoch": 4421} {"train_loss": -26.936676025390625, "global_step": 367009, "epoch": 4421} {"train_loss": -26.46388053894043, "global_step": 367010, "epoch": 4421} {"train_loss": -26.55625343322754, "global_step": 367011, "epoch": 4421} {"train_loss": -26.721698760986328, "global_step": 367012, "epoch": 4421} {"train_loss": -26.36625099182129, "global_step": 367013, "epoch": 4421} {"train_loss": -26.79729652404785, "global_step": 367014, "epoch": 4421} {"train_loss": -26.3238468170166, "global_step": 367015, "epoch": 4421} {"train_loss": -26.524871826171875, "global_step": 367016, "epoch": 4421} {"train_loss": -26.521778106689453, "global_step": 367017, "epoch": 4421} {"train_loss": -26.1798152923584, "global_step": 367018, "epoch": 4421} {"train_loss": -25.970922470092773, "global_step": 367019, "epoch": 4421} {"train_loss": -25.61284828186035, "global_step": 367020, "epoch": 4421} {"train_loss": -25.5897274017334, "global_step": 367021, "epoch": 4421} {"train_loss": -25.81568717956543, "global_step": 367022, "epoch": 4421} {"train_loss": -26.359243392944336, "global_step": 367023, "epoch": 4421} {"train_loss": -26.29817771911621, "global_step": 367024, "epoch": 4421} {"train_loss": -26.241421389292523, "global_step": 367025, "epoch": 4421, "val_loss": 6512642.0} {"train_loss": -23.346647262573242, "global_step": 367026, "epoch": 4422} {"train_loss": -24.11848258972168, "global_step": 367027, "epoch": 4422} {"train_loss": -24.706768035888672, "global_step": 367028, "epoch": 4422} {"train_loss": -23.519973754882812, "global_step": 367029, "epoch": 4422} {"train_loss": -24.97606658935547, "global_step": 367030, "epoch": 4422} {"train_loss": -25.299097061157227, "global_step": 367031, "epoch": 4422} {"train_loss": -23.920860290527344, "global_step": 367032, "epoch": 4422} {"train_loss": -24.698883056640625, "global_step": 367033, "epoch": 4422} {"train_loss": -25.40254020690918, "global_step": 367034, "epoch": 4422} {"train_loss": -24.927112579345703, "global_step": 367035, "epoch": 4422} {"train_loss": -25.220439910888672, "global_step": 367036, "epoch": 4422} {"train_loss": -25.311222076416016, "global_step": 367037, "epoch": 4422} {"train_loss": -25.577348709106445, "global_step": 367038, "epoch": 4422} {"train_loss": -25.40532684326172, "global_step": 367039, "epoch": 4422} {"train_loss": -25.324478149414062, "global_step": 367040, "epoch": 4422} {"train_loss": -25.535388946533203, "global_step": 367041, "epoch": 4422} {"train_loss": -25.500411987304688, "global_step": 367042, "epoch": 4422} {"train_loss": -25.76946449279785, "global_step": 367043, "epoch": 4422} {"train_loss": -25.43279266357422, "global_step": 367044, "epoch": 4422} {"train_loss": -25.633153915405273, "global_step": 367045, "epoch": 4422} {"train_loss": -25.9276123046875, "global_step": 367046, "epoch": 4422} {"train_loss": -25.850467681884766, "global_step": 367047, "epoch": 4422} {"train_loss": -26.01185417175293, "global_step": 367048, "epoch": 4422} {"train_loss": -25.920637130737305, "global_step": 367049, "epoch": 4422} {"train_loss": -25.754064559936523, "global_step": 367050, "epoch": 4422} {"train_loss": -25.99933433532715, "global_step": 367051, "epoch": 4422} {"train_loss": -26.102767944335938, "global_step": 367052, "epoch": 4422} {"train_loss": -25.956165313720703, "global_step": 367053, "epoch": 4422} {"train_loss": -26.236251831054688, "global_step": 367054, "epoch": 4422} {"train_loss": -25.919050216674805, "global_step": 367055, "epoch": 4422} {"train_loss": -25.960607528686523, "global_step": 367056, "epoch": 4422} {"train_loss": -26.095752716064453, "global_step": 367057, "epoch": 4422} {"train_loss": -26.19563102722168, "global_step": 367058, "epoch": 4422} {"train_loss": -26.10581398010254, "global_step": 367059, "epoch": 4422} {"train_loss": -25.82622718811035, "global_step": 367060, "epoch": 4422} {"train_loss": -25.865304946899414, "global_step": 367061, "epoch": 4422} {"train_loss": -25.973791122436523, "global_step": 367062, "epoch": 4422} {"train_loss": -26.428770065307617, "global_step": 367063, "epoch": 4422} {"train_loss": -25.95236587524414, "global_step": 367064, "epoch": 4422} {"train_loss": -26.15619468688965, "global_step": 367065, "epoch": 4422} {"train_loss": -25.922086715698242, "global_step": 367066, "epoch": 4422} {"train_loss": -26.31929588317871, "global_step": 367067, "epoch": 4422} {"train_loss": -26.060474395751953, "global_step": 367068, "epoch": 4422} {"train_loss": -26.16521644592285, "global_step": 367069, "epoch": 4422} {"train_loss": -26.156253814697266, "global_step": 367070, "epoch": 4422} {"train_loss": -26.431381225585938, "global_step": 367071, "epoch": 4422} {"train_loss": -26.182159423828125, "global_step": 367072, "epoch": 4422} {"train_loss": -26.073652267456055, "global_step": 367073, "epoch": 4422} {"train_loss": -26.04090690612793, "global_step": 367074, "epoch": 4422} {"train_loss": -26.058908462524414, "global_step": 367075, "epoch": 4422} {"train_loss": -26.381031036376953, "global_step": 367076, "epoch": 4422} {"train_loss": -26.016218185424805, "global_step": 367077, "epoch": 4422} {"train_loss": -25.980310440063477, "global_step": 367078, "epoch": 4422} {"train_loss": -26.468555450439453, "global_step": 367079, "epoch": 4422} {"train_loss": -26.262226104736328, "global_step": 367080, "epoch": 4422} {"train_loss": -26.602807998657227, "global_step": 367081, "epoch": 4422} {"train_loss": -25.94317626953125, "global_step": 367082, "epoch": 4422} {"train_loss": -26.207868576049805, "global_step": 367083, "epoch": 4422} {"train_loss": -26.083606719970703, "global_step": 367084, "epoch": 4422} {"train_loss": -26.197925567626953, "global_step": 367085, "epoch": 4422} {"train_loss": -26.223041534423828, "global_step": 367086, "epoch": 4422} {"train_loss": -26.194372177124023, "global_step": 367087, "epoch": 4422} {"train_loss": -25.98748779296875, "global_step": 367088, "epoch": 4422} {"train_loss": -25.96742057800293, "global_step": 367089, "epoch": 4422} {"train_loss": -26.02072525024414, "global_step": 367090, "epoch": 4422} {"train_loss": -25.614084243774414, "global_step": 367091, "epoch": 4422} {"train_loss": -26.142963409423828, "global_step": 367092, "epoch": 4422} {"train_loss": -26.29608154296875, "global_step": 367093, "epoch": 4422} {"train_loss": -25.94258689880371, "global_step": 367094, "epoch": 4422} {"train_loss": -25.94904899597168, "global_step": 367095, "epoch": 4422} {"train_loss": -26.592670440673828, "global_step": 367096, "epoch": 4422} {"train_loss": -26.303537368774414, "global_step": 367097, "epoch": 4422} {"train_loss": -26.494190216064453, "global_step": 367098, "epoch": 4422} {"train_loss": -26.406558990478516, "global_step": 367099, "epoch": 4422} {"train_loss": -26.113367080688477, "global_step": 367100, "epoch": 4422} {"train_loss": -26.212039947509766, "global_step": 367101, "epoch": 4422} {"train_loss": -26.167804718017578, "global_step": 367102, "epoch": 4422} {"train_loss": -26.26372718811035, "global_step": 367103, "epoch": 4422} {"train_loss": -26.520069122314453, "global_step": 367104, "epoch": 4422} {"train_loss": -26.510852813720703, "global_step": 367105, "epoch": 4422} {"train_loss": -26.195667266845703, "global_step": 367106, "epoch": 4422} {"train_loss": -26.469446182250977, "global_step": 367107, "epoch": 4422} {"train_loss": -25.85186326360128, "global_step": 367108, "epoch": 4422, "val_loss": 6699497.0} {"train_loss": -26.104053497314453, "global_step": 367109, "epoch": 4423} {"train_loss": -25.9132022857666, "global_step": 367110, "epoch": 4423} {"train_loss": -26.092321395874023, "global_step": 367111, "epoch": 4423} {"train_loss": -26.57566261291504, "global_step": 367112, "epoch": 4423} {"train_loss": -25.896747589111328, "global_step": 367113, "epoch": 4423} {"train_loss": -25.907705307006836, "global_step": 367114, "epoch": 4423} {"train_loss": -26.26858901977539, "global_step": 367115, "epoch": 4423} {"train_loss": -25.979232788085938, "global_step": 367116, "epoch": 4423} {"train_loss": -26.124759674072266, "global_step": 367117, "epoch": 4423} {"train_loss": -26.288190841674805, "global_step": 367118, "epoch": 4423} {"train_loss": -26.286706924438477, "global_step": 367119, "epoch": 4423} {"train_loss": -26.20245361328125, "global_step": 367120, "epoch": 4423} {"train_loss": -26.241891860961914, "global_step": 367121, "epoch": 4423} {"train_loss": -26.120553970336914, "global_step": 367122, "epoch": 4423} {"train_loss": -26.21013832092285, "global_step": 367123, "epoch": 4423} {"train_loss": -25.99366569519043, "global_step": 367124, "epoch": 4423} {"train_loss": -26.4294376373291, "global_step": 367125, "epoch": 4423} {"train_loss": -26.193220138549805, "global_step": 367126, "epoch": 4423} {"train_loss": -26.182662963867188, "global_step": 367127, "epoch": 4423} {"train_loss": -26.25544548034668, "global_step": 367128, "epoch": 4423} {"train_loss": -26.743391036987305, "global_step": 367129, "epoch": 4423} {"train_loss": -26.236801147460938, "global_step": 367130, "epoch": 4423} {"train_loss": -26.3671932220459, "global_step": 367131, "epoch": 4423} {"train_loss": -26.30854606628418, "global_step": 367132, "epoch": 4423} {"train_loss": -26.209863662719727, "global_step": 367133, "epoch": 4423} {"train_loss": -26.543554306030273, "global_step": 367134, "epoch": 4423} {"train_loss": -26.286163330078125, "global_step": 367135, "epoch": 4423} {"train_loss": -26.303516387939453, "global_step": 367136, "epoch": 4423} {"train_loss": -26.016082763671875, "global_step": 367137, "epoch": 4423} {"train_loss": -26.275588989257812, "global_step": 367138, "epoch": 4423} {"train_loss": -26.311248779296875, "global_step": 367139, "epoch": 4423} {"train_loss": -26.282215118408203, "global_step": 367140, "epoch": 4423} {"train_loss": -26.2320556640625, "global_step": 367141, "epoch": 4423} {"train_loss": -26.235998153686523, "global_step": 367142, "epoch": 4423} {"train_loss": -26.405797958374023, "global_step": 367143, "epoch": 4423} {"train_loss": -26.519607543945312, "global_step": 367144, "epoch": 4423} {"train_loss": -26.597949981689453, "global_step": 367145, "epoch": 4423} {"train_loss": -26.337207794189453, "global_step": 367146, "epoch": 4423} {"train_loss": -26.197986602783203, "global_step": 367147, "epoch": 4423} {"train_loss": -26.07027244567871, "global_step": 367148, "epoch": 4423} {"train_loss": -26.383121490478516, "global_step": 367149, "epoch": 4423} {"train_loss": -26.501882553100586, "global_step": 367150, "epoch": 4423} {"train_loss": -26.375486373901367, "global_step": 367151, "epoch": 4423} {"train_loss": -26.496801376342773, "global_step": 367152, "epoch": 4423} {"train_loss": -26.396581649780273, "global_step": 367153, "epoch": 4423} {"train_loss": -26.581830978393555, "global_step": 367154, "epoch": 4423} {"train_loss": -26.39719581604004, "global_step": 367155, "epoch": 4423} {"train_loss": -26.618396759033203, "global_step": 367156, "epoch": 4423} {"train_loss": -26.254507064819336, "global_step": 367157, "epoch": 4423} {"train_loss": -26.8121395111084, "global_step": 367158, "epoch": 4423} {"train_loss": -26.374914169311523, "global_step": 367159, "epoch": 4423} {"train_loss": -25.960468292236328, "global_step": 367160, "epoch": 4423} {"train_loss": -26.400007247924805, "global_step": 367161, "epoch": 4423} {"train_loss": -25.922632217407227, "global_step": 367162, "epoch": 4423} {"train_loss": -26.162084579467773, "global_step": 367163, "epoch": 4423} {"train_loss": -26.457061767578125, "global_step": 367164, "epoch": 4423} {"train_loss": -26.569843292236328, "global_step": 367165, "epoch": 4423} {"train_loss": -26.343732833862305, "global_step": 367166, "epoch": 4423} {"train_loss": -26.1711483001709, "global_step": 367167, "epoch": 4423} {"train_loss": -25.97212028503418, "global_step": 367168, "epoch": 4423} {"train_loss": -25.6539363861084, "global_step": 367169, "epoch": 4423} {"train_loss": -25.982885360717773, "global_step": 367170, "epoch": 4423} {"train_loss": -26.17158317565918, "global_step": 367171, "epoch": 4423} {"train_loss": -25.68497085571289, "global_step": 367172, "epoch": 4423} {"train_loss": -25.786407470703125, "global_step": 367173, "epoch": 4423} {"train_loss": -26.111663818359375, "global_step": 367174, "epoch": 4423} {"train_loss": -26.0239315032959, "global_step": 367175, "epoch": 4423} {"train_loss": -25.41904067993164, "global_step": 367176, "epoch": 4423} {"train_loss": -26.265409469604492, "global_step": 367177, "epoch": 4423} {"train_loss": -26.347366333007812, "global_step": 367178, "epoch": 4423} {"train_loss": -26.20547866821289, "global_step": 367179, "epoch": 4423} {"train_loss": -25.749731063842773, "global_step": 367180, "epoch": 4423} {"train_loss": -26.281543731689453, "global_step": 367181, "epoch": 4423} {"train_loss": -25.96417808532715, "global_step": 367182, "epoch": 4423} {"train_loss": -26.367918014526367, "global_step": 367183, "epoch": 4423} {"train_loss": -26.3623104095459, "global_step": 367184, "epoch": 4423} {"train_loss": -26.43110466003418, "global_step": 367185, "epoch": 4423} {"train_loss": -26.613065719604492, "global_step": 367186, "epoch": 4423} {"train_loss": -26.32435417175293, "global_step": 367187, "epoch": 4423} {"train_loss": -26.35431480407715, "global_step": 367188, "epoch": 4423} {"train_loss": -26.612112045288086, "global_step": 367189, "epoch": 4423} {"train_loss": -26.581100463867188, "global_step": 367190, "epoch": 4423} {"train_loss": -26.257831964148096, "global_step": 367191, "epoch": 4423, "val_loss": 6621733.0} {"train_loss": -25.39652442932129, "global_step": 367192, "epoch": 4424} {"train_loss": -25.379322052001953, "global_step": 367193, "epoch": 4424} {"train_loss": -25.465187072753906, "global_step": 367194, "epoch": 4424} {"train_loss": -25.387615203857422, "global_step": 367195, "epoch": 4424} {"train_loss": -25.8735408782959, "global_step": 367196, "epoch": 4424} {"train_loss": -25.75419044494629, "global_step": 367197, "epoch": 4424} {"train_loss": -25.856016159057617, "global_step": 367198, "epoch": 4424} {"train_loss": -25.860727310180664, "global_step": 367199, "epoch": 4424} {"train_loss": -25.43802833557129, "global_step": 367200, "epoch": 4424} {"train_loss": -26.282224655151367, "global_step": 367201, "epoch": 4424} {"train_loss": -25.881412506103516, "global_step": 367202, "epoch": 4424} {"train_loss": -25.785968780517578, "global_step": 367203, "epoch": 4424} {"train_loss": -26.144275665283203, "global_step": 367204, "epoch": 4424} {"train_loss": -25.84417152404785, "global_step": 367205, "epoch": 4424} {"train_loss": -26.430774688720703, "global_step": 367206, "epoch": 4424} {"train_loss": -25.92819595336914, "global_step": 367207, "epoch": 4424} {"train_loss": -25.727521896362305, "global_step": 367208, "epoch": 4424} {"train_loss": -26.344482421875, "global_step": 367209, "epoch": 4424} {"train_loss": -26.353031158447266, "global_step": 367210, "epoch": 4424} {"train_loss": -26.18839454650879, "global_step": 367211, "epoch": 4424} {"train_loss": -26.02223777770996, "global_step": 367212, "epoch": 4424} {"train_loss": -26.295886993408203, "global_step": 367213, "epoch": 4424} {"train_loss": -26.36939811706543, "global_step": 367214, "epoch": 4424} {"train_loss": -26.449682235717773, "global_step": 367215, "epoch": 4424} {"train_loss": -26.4952392578125, "global_step": 367216, "epoch": 4424} {"train_loss": -26.506818771362305, "global_step": 367217, "epoch": 4424} {"train_loss": -26.472156524658203, "global_step": 367218, "epoch": 4424} {"train_loss": -26.457239151000977, "global_step": 367219, "epoch": 4424} {"train_loss": -26.408674240112305, "global_step": 367220, "epoch": 4424} {"train_loss": -26.273035049438477, "global_step": 367221, "epoch": 4424} {"train_loss": -26.108728408813477, "global_step": 367222, "epoch": 4424} {"train_loss": -26.368066787719727, "global_step": 367223, "epoch": 4424} {"train_loss": -26.628936767578125, "global_step": 367224, "epoch": 4424} {"train_loss": -26.19305419921875, "global_step": 367225, "epoch": 4424} {"train_loss": -26.504796981811523, "global_step": 367226, "epoch": 4424} {"train_loss": -26.354084014892578, "global_step": 367227, "epoch": 4424} {"train_loss": -26.449182510375977, "global_step": 367228, "epoch": 4424} {"train_loss": -26.70094108581543, "global_step": 367229, "epoch": 4424} {"train_loss": -26.406375885009766, "global_step": 367230, "epoch": 4424} {"train_loss": -26.068113327026367, "global_step": 367231, "epoch": 4424} {"train_loss": -26.333295822143555, "global_step": 367232, "epoch": 4424} {"train_loss": -26.61688232421875, "global_step": 367233, "epoch": 4424} {"train_loss": -26.732624053955078, "global_step": 367234, "epoch": 4424} {"train_loss": -26.50123405456543, "global_step": 367235, "epoch": 4424} {"train_loss": -26.496444702148438, "global_step": 367236, "epoch": 4424} {"train_loss": -26.07452392578125, "global_step": 367237, "epoch": 4424} {"train_loss": -26.41411781311035, "global_step": 367238, "epoch": 4424} {"train_loss": -26.133275985717773, "global_step": 367239, "epoch": 4424} {"train_loss": -26.38636589050293, "global_step": 367240, "epoch": 4424} {"train_loss": -26.037649154663086, "global_step": 367241, "epoch": 4424} {"train_loss": -26.210926055908203, "global_step": 367242, "epoch": 4424} {"train_loss": -26.55661392211914, "global_step": 367243, "epoch": 4424} {"train_loss": -26.72402000427246, "global_step": 367244, "epoch": 4424} {"train_loss": -26.469959259033203, "global_step": 367245, "epoch": 4424} {"train_loss": -26.643207550048828, "global_step": 367246, "epoch": 4424} {"train_loss": -26.222074508666992, "global_step": 367247, "epoch": 4424} {"train_loss": -26.10243034362793, "global_step": 367248, "epoch": 4424} {"train_loss": -26.472742080688477, "global_step": 367249, "epoch": 4424} {"train_loss": -26.14922523498535, "global_step": 367250, "epoch": 4424} {"train_loss": -26.26344108581543, "global_step": 367251, "epoch": 4424} {"train_loss": -26.161823272705078, "global_step": 367252, "epoch": 4424} {"train_loss": -25.958524703979492, "global_step": 367253, "epoch": 4424} {"train_loss": -25.917200088500977, "global_step": 367254, "epoch": 4424} {"train_loss": -26.164581298828125, "global_step": 367255, "epoch": 4424} {"train_loss": -26.55205726623535, "global_step": 367256, "epoch": 4424} {"train_loss": -26.140888214111328, "global_step": 367257, "epoch": 4424} {"train_loss": -26.377710342407227, "global_step": 367258, "epoch": 4424} {"train_loss": -25.951324462890625, "global_step": 367259, "epoch": 4424} {"train_loss": -26.434478759765625, "global_step": 367260, "epoch": 4424} {"train_loss": -26.774625778198242, "global_step": 367261, "epoch": 4424} {"train_loss": -26.417219161987305, "global_step": 367262, "epoch": 4424} {"train_loss": -26.401382446289062, "global_step": 367263, "epoch": 4424} {"train_loss": -26.048582077026367, "global_step": 367264, "epoch": 4424} {"train_loss": -26.28657341003418, "global_step": 367265, "epoch": 4424} {"train_loss": -26.2817440032959, "global_step": 367266, "epoch": 4424} {"train_loss": -26.287845611572266, "global_step": 367267, "epoch": 4424} {"train_loss": -26.073348999023438, "global_step": 367268, "epoch": 4424} {"train_loss": -26.320266723632812, "global_step": 367269, "epoch": 4424} {"train_loss": -26.33865737915039, "global_step": 367270, "epoch": 4424} {"train_loss": -25.98211097717285, "global_step": 367271, "epoch": 4424} {"train_loss": -25.93634605407715, "global_step": 367272, "epoch": 4424} {"train_loss": -26.31792640686035, "global_step": 367273, "epoch": 4424} {"train_loss": -26.206680481692395, "global_step": 367274, "epoch": 4424, "val_loss": 6711369.0} {"train_loss": -23.81968116760254, "global_step": 367275, "epoch": 4425} {"train_loss": -24.857099533081055, "global_step": 367276, "epoch": 4425} {"train_loss": -24.64897346496582, "global_step": 367277, "epoch": 4425} {"train_loss": -24.321884155273438, "global_step": 367278, "epoch": 4425} {"train_loss": -24.81330680847168, "global_step": 367279, "epoch": 4425} {"train_loss": -25.027997970581055, "global_step": 367280, "epoch": 4425} {"train_loss": -25.422407150268555, "global_step": 367281, "epoch": 4425} {"train_loss": -25.017990112304688, "global_step": 367282, "epoch": 4425} {"train_loss": -25.57277488708496, "global_step": 367283, "epoch": 4425} {"train_loss": -25.0954532623291, "global_step": 367284, "epoch": 4425} {"train_loss": -25.02017593383789, "global_step": 367285, "epoch": 4425} {"train_loss": -25.783803939819336, "global_step": 367286, "epoch": 4425} {"train_loss": -25.552204132080078, "global_step": 367287, "epoch": 4425} {"train_loss": -25.677276611328125, "global_step": 367288, "epoch": 4425} {"train_loss": -25.80830192565918, "global_step": 367289, "epoch": 4425} {"train_loss": -25.531457901000977, "global_step": 367290, "epoch": 4425} {"train_loss": -25.450239181518555, "global_step": 367291, "epoch": 4425} {"train_loss": -25.71722984313965, "global_step": 367292, "epoch": 4425} {"train_loss": -25.668426513671875, "global_step": 367293, "epoch": 4425} {"train_loss": -25.5711727142334, "global_step": 367294, "epoch": 4425} {"train_loss": -25.71890640258789, "global_step": 367295, "epoch": 4425} {"train_loss": -25.437101364135742, "global_step": 367296, "epoch": 4425} {"train_loss": -25.939453125, "global_step": 367297, "epoch": 4425} {"train_loss": -25.84042739868164, "global_step": 367298, "epoch": 4425} {"train_loss": -25.8006649017334, "global_step": 367299, "epoch": 4425} {"train_loss": -25.65846824645996, "global_step": 367300, "epoch": 4425} {"train_loss": -25.810251235961914, "global_step": 367301, "epoch": 4425} {"train_loss": -25.771087646484375, "global_step": 367302, "epoch": 4425} {"train_loss": -26.318384170532227, "global_step": 367303, "epoch": 4425} {"train_loss": -26.20533561706543, "global_step": 367304, "epoch": 4425} {"train_loss": -26.02740478515625, "global_step": 367305, "epoch": 4425} {"train_loss": -25.870960235595703, "global_step": 367306, "epoch": 4425} {"train_loss": -26.20283317565918, "global_step": 367307, "epoch": 4425} {"train_loss": -26.236652374267578, "global_step": 367308, "epoch": 4425} {"train_loss": -26.068811416625977, "global_step": 367309, "epoch": 4425} {"train_loss": -25.797590255737305, "global_step": 367310, "epoch": 4425} {"train_loss": -26.1704044342041, "global_step": 367311, "epoch": 4425} {"train_loss": -26.09565544128418, "global_step": 367312, "epoch": 4425} {"train_loss": -26.38679313659668, "global_step": 367313, "epoch": 4425} {"train_loss": -26.11872673034668, "global_step": 367314, "epoch": 4425} {"train_loss": -26.16816520690918, "global_step": 367315, "epoch": 4425} {"train_loss": -26.294601440429688, "global_step": 367316, "epoch": 4425} {"train_loss": -26.193586349487305, "global_step": 367317, "epoch": 4425} {"train_loss": -26.56572914123535, "global_step": 367318, "epoch": 4425} {"train_loss": -26.557998657226562, "global_step": 367319, "epoch": 4425} {"train_loss": -26.210302352905273, "global_step": 367320, "epoch": 4425} {"train_loss": -26.420124053955078, "global_step": 367321, "epoch": 4425} {"train_loss": -26.121631622314453, "global_step": 367322, "epoch": 4425} {"train_loss": -26.246784210205078, "global_step": 367323, "epoch": 4425} {"train_loss": -26.110797882080078, "global_step": 367324, "epoch": 4425} {"train_loss": -26.154584884643555, "global_step": 367325, "epoch": 4425} {"train_loss": -26.366409301757812, "global_step": 367326, "epoch": 4425} {"train_loss": -26.534406661987305, "global_step": 367327, "epoch": 4425} {"train_loss": -26.183578491210938, "global_step": 367328, "epoch": 4425} {"train_loss": -26.220773696899414, "global_step": 367329, "epoch": 4425} {"train_loss": -26.514883041381836, "global_step": 367330, "epoch": 4425} {"train_loss": -26.28138542175293, "global_step": 367331, "epoch": 4425} {"train_loss": -26.64211082458496, "global_step": 367332, "epoch": 4425} {"train_loss": -26.888166427612305, "global_step": 367333, "epoch": 4425} {"train_loss": -26.4677677154541, "global_step": 367334, "epoch": 4425} {"train_loss": -26.470861434936523, "global_step": 367335, "epoch": 4425} {"train_loss": -26.47782325744629, "global_step": 367336, "epoch": 4425} {"train_loss": -26.17463493347168, "global_step": 367337, "epoch": 4425} {"train_loss": -26.371597290039062, "global_step": 367338, "epoch": 4425} {"train_loss": -25.980838775634766, "global_step": 367339, "epoch": 4425} {"train_loss": -26.71565055847168, "global_step": 367340, "epoch": 4425} {"train_loss": -26.66306495666504, "global_step": 367341, "epoch": 4425} {"train_loss": -26.407957077026367, "global_step": 367342, "epoch": 4425} {"train_loss": -26.407934188842773, "global_step": 367343, "epoch": 4425} {"train_loss": -26.301252365112305, "global_step": 367344, "epoch": 4425} {"train_loss": -26.34380531311035, "global_step": 367345, "epoch": 4425} {"train_loss": -26.121694564819336, "global_step": 367346, "epoch": 4425} {"train_loss": -26.384122848510742, "global_step": 367347, "epoch": 4425} {"train_loss": -26.588428497314453, "global_step": 367348, "epoch": 4425} {"train_loss": -26.556608200073242, "global_step": 367349, "epoch": 4425} {"train_loss": -26.708654403686523, "global_step": 367350, "epoch": 4425} {"train_loss": -26.408676147460938, "global_step": 367351, "epoch": 4425} {"train_loss": -26.313617706298828, "global_step": 367352, "epoch": 4425} {"train_loss": -26.306964874267578, "global_step": 367353, "epoch": 4425} {"train_loss": -26.478139877319336, "global_step": 367354, "epoch": 4425} {"train_loss": -26.209936141967773, "global_step": 367355, "epoch": 4425} {"train_loss": -25.983306884765625, "global_step": 367356, "epoch": 4425} {"train_loss": -26.0101490480354, "global_step": 367357, "epoch": 4425, "val_loss": 6624803.0} {"train_loss": -25.17291831970215, "global_step": 367358, "epoch": 4426} {"train_loss": -24.670204162597656, "global_step": 367359, "epoch": 4426} {"train_loss": -24.464590072631836, "global_step": 367360, "epoch": 4426} {"train_loss": -25.074304580688477, "global_step": 367361, "epoch": 4426} {"train_loss": -25.081640243530273, "global_step": 367362, "epoch": 4426} {"train_loss": -25.22945213317871, "global_step": 367363, "epoch": 4426} {"train_loss": -25.45438575744629, "global_step": 367364, "epoch": 4426} {"train_loss": -24.923185348510742, "global_step": 367365, "epoch": 4426} {"train_loss": -24.972919464111328, "global_step": 367366, "epoch": 4426} {"train_loss": -25.501264572143555, "global_step": 367367, "epoch": 4426} {"train_loss": -25.24286651611328, "global_step": 367368, "epoch": 4426} {"train_loss": -25.60369300842285, "global_step": 367369, "epoch": 4426} {"train_loss": -25.477216720581055, "global_step": 367370, "epoch": 4426} {"train_loss": -25.88763427734375, "global_step": 367371, "epoch": 4426} {"train_loss": -25.651580810546875, "global_step": 367372, "epoch": 4426} {"train_loss": -25.73590087890625, "global_step": 367373, "epoch": 4426} {"train_loss": -25.747472763061523, "global_step": 367374, "epoch": 4426} {"train_loss": -25.73113441467285, "global_step": 367375, "epoch": 4426} {"train_loss": -25.94550895690918, "global_step": 367376, "epoch": 4426} {"train_loss": -25.634841918945312, "global_step": 367377, "epoch": 4426} {"train_loss": -26.19121742248535, "global_step": 367378, "epoch": 4426} {"train_loss": -25.719074249267578, "global_step": 367379, "epoch": 4426} {"train_loss": -25.935317993164062, "global_step": 367380, "epoch": 4426} {"train_loss": -26.051849365234375, "global_step": 367381, "epoch": 4426} {"train_loss": -25.971832275390625, "global_step": 367382, "epoch": 4426} {"train_loss": -26.243961334228516, "global_step": 367383, "epoch": 4426} {"train_loss": -25.691129684448242, "global_step": 367384, "epoch": 4426} {"train_loss": -26.272504806518555, "global_step": 367385, "epoch": 4426} {"train_loss": -26.3005313873291, "global_step": 367386, "epoch": 4426} {"train_loss": -26.496814727783203, "global_step": 367387, "epoch": 4426} {"train_loss": -25.956541061401367, "global_step": 367388, "epoch": 4426} {"train_loss": -26.28670310974121, "global_step": 367389, "epoch": 4426} {"train_loss": -26.094192504882812, "global_step": 367390, "epoch": 4426} {"train_loss": -26.51742935180664, "global_step": 367391, "epoch": 4426} {"train_loss": -26.051172256469727, "global_step": 367392, "epoch": 4426} {"train_loss": -26.80121421813965, "global_step": 367393, "epoch": 4426} {"train_loss": -26.488540649414062, "global_step": 367394, "epoch": 4426} {"train_loss": -26.444631576538086, "global_step": 367395, "epoch": 4426} {"train_loss": -26.2357234954834, "global_step": 367396, "epoch": 4426} {"train_loss": -26.687833786010742, "global_step": 367397, "epoch": 4426} {"train_loss": -26.411725997924805, "global_step": 367398, "epoch": 4426} {"train_loss": -26.608509063720703, "global_step": 367399, "epoch": 4426} {"train_loss": -26.204023361206055, "global_step": 367400, "epoch": 4426} {"train_loss": -26.408618927001953, "global_step": 367401, "epoch": 4426} {"train_loss": -26.645002365112305, "global_step": 367402, "epoch": 4426} {"train_loss": -26.34902000427246, "global_step": 367403, "epoch": 4426} {"train_loss": -26.387500762939453, "global_step": 367404, "epoch": 4426} {"train_loss": -26.406164169311523, "global_step": 367405, "epoch": 4426} {"train_loss": -26.639432907104492, "global_step": 367406, "epoch": 4426} {"train_loss": -26.25132179260254, "global_step": 367407, "epoch": 4426} {"train_loss": -26.822290420532227, "global_step": 367408, "epoch": 4426} {"train_loss": -26.23148536682129, "global_step": 367409, "epoch": 4426} {"train_loss": -26.776004791259766, "global_step": 367410, "epoch": 4426} {"train_loss": -26.423904418945312, "global_step": 367411, "epoch": 4426} {"train_loss": -26.577655792236328, "global_step": 367412, "epoch": 4426} {"train_loss": -26.20026206970215, "global_step": 367413, "epoch": 4426} {"train_loss": -26.63004493713379, "global_step": 367414, "epoch": 4426} {"train_loss": -26.612491607666016, "global_step": 367415, "epoch": 4426} {"train_loss": -26.037418365478516, "global_step": 367416, "epoch": 4426} {"train_loss": -26.214014053344727, "global_step": 367417, "epoch": 4426} {"train_loss": -25.915739059448242, "global_step": 367418, "epoch": 4426} {"train_loss": -25.852649688720703, "global_step": 367419, "epoch": 4426} {"train_loss": -26.288015365600586, "global_step": 367420, "epoch": 4426} {"train_loss": -26.49395179748535, "global_step": 367421, "epoch": 4426} {"train_loss": -25.828948974609375, "global_step": 367422, "epoch": 4426} {"train_loss": -25.365325927734375, "global_step": 367423, "epoch": 4426} {"train_loss": -25.62200355529785, "global_step": 367424, "epoch": 4426} {"train_loss": -25.76258659362793, "global_step": 367425, "epoch": 4426} {"train_loss": -25.935285568237305, "global_step": 367426, "epoch": 4426} {"train_loss": -25.993183135986328, "global_step": 367427, "epoch": 4426} {"train_loss": -25.937774658203125, "global_step": 367428, "epoch": 4426} {"train_loss": -26.2591609954834, "global_step": 367429, "epoch": 4426} {"train_loss": -26.006681442260742, "global_step": 367430, "epoch": 4426} {"train_loss": -26.527313232421875, "global_step": 367431, "epoch": 4426} {"train_loss": -26.03529167175293, "global_step": 367432, "epoch": 4426} {"train_loss": -26.049213409423828, "global_step": 367433, "epoch": 4426} {"train_loss": -25.874963760375977, "global_step": 367434, "epoch": 4426} {"train_loss": -26.23317527770996, "global_step": 367435, "epoch": 4426} {"train_loss": -25.97965431213379, "global_step": 367436, "epoch": 4426} {"train_loss": -25.95587730407715, "global_step": 367437, "epoch": 4426} {"train_loss": -26.228788375854492, "global_step": 367438, "epoch": 4426} {"train_loss": -26.32358169555664, "global_step": 367439, "epoch": 4426} {"train_loss": -26.021673708076936, "global_step": 367440, "epoch": 4426, "val_loss": 6737119.5} {"train_loss": -25.28985023498535, "global_step": 367441, "epoch": 4427} {"train_loss": -25.53891944885254, "global_step": 367442, "epoch": 4427} {"train_loss": -25.629730224609375, "global_step": 367443, "epoch": 4427} {"train_loss": -25.720239639282227, "global_step": 367444, "epoch": 4427} {"train_loss": -25.764692306518555, "global_step": 367445, "epoch": 4427} {"train_loss": -25.8220157623291, "global_step": 367446, "epoch": 4427} {"train_loss": -25.808828353881836, "global_step": 367447, "epoch": 4427} {"train_loss": -26.02564811706543, "global_step": 367448, "epoch": 4427} {"train_loss": -25.989850997924805, "global_step": 367449, "epoch": 4427} {"train_loss": -25.820865631103516, "global_step": 367450, "epoch": 4427} {"train_loss": -25.775344848632812, "global_step": 367451, "epoch": 4427} {"train_loss": -25.782583236694336, "global_step": 367452, "epoch": 4427} {"train_loss": -25.650938034057617, "global_step": 367453, "epoch": 4427} {"train_loss": -26.36226463317871, "global_step": 367454, "epoch": 4427} {"train_loss": -25.981536865234375, "global_step": 367455, "epoch": 4427} {"train_loss": -26.047056198120117, "global_step": 367456, "epoch": 4427} {"train_loss": -26.1225528717041, "global_step": 367457, "epoch": 4427} {"train_loss": -26.046142578125, "global_step": 367458, "epoch": 4427} {"train_loss": -26.02886390686035, "global_step": 367459, "epoch": 4427} {"train_loss": -26.04816246032715, "global_step": 367460, "epoch": 4427} {"train_loss": -26.196741104125977, "global_step": 367461, "epoch": 4427} {"train_loss": -25.992612838745117, "global_step": 367462, "epoch": 4427} {"train_loss": -26.16650390625, "global_step": 367463, "epoch": 4427} {"train_loss": -26.425256729125977, "global_step": 367464, "epoch": 4427} {"train_loss": -26.428115844726562, "global_step": 367465, "epoch": 4427} {"train_loss": -26.268421173095703, "global_step": 367466, "epoch": 4427} {"train_loss": -25.9544620513916, "global_step": 367467, "epoch": 4427} {"train_loss": -26.309864044189453, "global_step": 367468, "epoch": 4427} {"train_loss": -26.580617904663086, "global_step": 367469, "epoch": 4427} {"train_loss": -26.311370849609375, "global_step": 367470, "epoch": 4427} {"train_loss": -26.341705322265625, "global_step": 367471, "epoch": 4427} {"train_loss": -26.32972526550293, "global_step": 367472, "epoch": 4427} {"train_loss": -26.54620933532715, "global_step": 367473, "epoch": 4427} {"train_loss": -26.322057723999023, "global_step": 367474, "epoch": 4427} {"train_loss": -26.574201583862305, "global_step": 367475, "epoch": 4427} {"train_loss": -25.89409828186035, "global_step": 367476, "epoch": 4427} {"train_loss": -26.38905143737793, "global_step": 367477, "epoch": 4427} {"train_loss": -26.205270767211914, "global_step": 367478, "epoch": 4427} {"train_loss": -26.727869033813477, "global_step": 367479, "epoch": 4427} {"train_loss": -26.14503288269043, "global_step": 367480, "epoch": 4427} {"train_loss": -26.2498779296875, "global_step": 367481, "epoch": 4427} {"train_loss": -26.43316650390625, "global_step": 367482, "epoch": 4427} {"train_loss": -26.467044830322266, "global_step": 367483, "epoch": 4427} {"train_loss": -26.628116607666016, "global_step": 367484, "epoch": 4427} {"train_loss": -26.37013053894043, "global_step": 367485, "epoch": 4427} {"train_loss": -26.26824951171875, "global_step": 367486, "epoch": 4427} {"train_loss": -26.285287857055664, "global_step": 367487, "epoch": 4427} {"train_loss": -26.563512802124023, "global_step": 367488, "epoch": 4427} {"train_loss": -26.125263214111328, "global_step": 367489, "epoch": 4427} {"train_loss": -26.423383712768555, "global_step": 367490, "epoch": 4427} {"train_loss": -26.237585067749023, "global_step": 367491, "epoch": 4427} {"train_loss": -26.040283203125, "global_step": 367492, "epoch": 4427} {"train_loss": -25.94964599609375, "global_step": 367493, "epoch": 4427} {"train_loss": -26.320234298706055, "global_step": 367494, "epoch": 4427} {"train_loss": -26.421268463134766, "global_step": 367495, "epoch": 4427} {"train_loss": -26.279117584228516, "global_step": 367496, "epoch": 4427} {"train_loss": -26.321460723876953, "global_step": 367497, "epoch": 4427} {"train_loss": -26.580738067626953, "global_step": 367498, "epoch": 4427} {"train_loss": -26.242141723632812, "global_step": 367499, "epoch": 4427} {"train_loss": -26.561880111694336, "global_step": 367500, "epoch": 4427} {"train_loss": -26.505598068237305, "global_step": 367501, "epoch": 4427} {"train_loss": -26.72617530822754, "global_step": 367502, "epoch": 4427} {"train_loss": -25.944290161132812, "global_step": 367503, "epoch": 4427} {"train_loss": -26.274744033813477, "global_step": 367504, "epoch": 4427} {"train_loss": -26.91395378112793, "global_step": 367505, "epoch": 4427} {"train_loss": -26.092212677001953, "global_step": 367506, "epoch": 4427} {"train_loss": -26.760766983032227, "global_step": 367507, "epoch": 4427} {"train_loss": -26.40932273864746, "global_step": 367508, "epoch": 4427} {"train_loss": -26.31693458557129, "global_step": 367509, "epoch": 4427} {"train_loss": -26.264806747436523, "global_step": 367510, "epoch": 4427} {"train_loss": -26.756444931030273, "global_step": 367511, "epoch": 4427} {"train_loss": -26.095813751220703, "global_step": 367512, "epoch": 4427} {"train_loss": -26.381811141967773, "global_step": 367513, "epoch": 4427} {"train_loss": -26.778553009033203, "global_step": 367514, "epoch": 4427} {"train_loss": -26.287382125854492, "global_step": 367515, "epoch": 4427} {"train_loss": -26.649381637573242, "global_step": 367516, "epoch": 4427} {"train_loss": -26.209259033203125, "global_step": 367517, "epoch": 4427} {"train_loss": -26.67774772644043, "global_step": 367518, "epoch": 4427} {"train_loss": -26.269861221313477, "global_step": 367519, "epoch": 4427} {"train_loss": -26.513547897338867, "global_step": 367520, "epoch": 4427} {"train_loss": -26.196048736572266, "global_step": 367521, "epoch": 4427} {"train_loss": -25.980077743530273, "global_step": 367522, "epoch": 4427} {"train_loss": -26.232330942728435, "global_step": 367523, "epoch": 4427, "val_loss": 6701761.0} {"train_loss": -26.188344955444336, "global_step": 367524, "epoch": 4428} {"train_loss": -25.902204513549805, "global_step": 367525, "epoch": 4428} {"train_loss": -26.1881160736084, "global_step": 367526, "epoch": 4428} {"train_loss": -26.016698837280273, "global_step": 367527, "epoch": 4428} {"train_loss": -26.01496696472168, "global_step": 367528, "epoch": 4428} {"train_loss": -25.965320587158203, "global_step": 367529, "epoch": 4428} {"train_loss": -26.556720733642578, "global_step": 367530, "epoch": 4428} {"train_loss": -26.11895751953125, "global_step": 367531, "epoch": 4428} {"train_loss": -26.244958877563477, "global_step": 367532, "epoch": 4428} {"train_loss": -26.118656158447266, "global_step": 367533, "epoch": 4428} {"train_loss": -25.9271183013916, "global_step": 367534, "epoch": 4428} {"train_loss": -26.447397232055664, "global_step": 367535, "epoch": 4428} {"train_loss": -25.771337509155273, "global_step": 367536, "epoch": 4428} {"train_loss": -25.75336265563965, "global_step": 367537, "epoch": 4428} {"train_loss": -26.061172485351562, "global_step": 367538, "epoch": 4428} {"train_loss": -26.132217407226562, "global_step": 367539, "epoch": 4428} {"train_loss": -25.887420654296875, "global_step": 367540, "epoch": 4428} {"train_loss": -26.46466636657715, "global_step": 367541, "epoch": 4428} {"train_loss": -26.519947052001953, "global_step": 367542, "epoch": 4428} {"train_loss": -26.30543327331543, "global_step": 367543, "epoch": 4428} {"train_loss": -26.294891357421875, "global_step": 367544, "epoch": 4428} {"train_loss": -26.630979537963867, "global_step": 367545, "epoch": 4428} {"train_loss": -26.14926528930664, "global_step": 367546, "epoch": 4428} {"train_loss": -26.205463409423828, "global_step": 367547, "epoch": 4428} {"train_loss": -26.300397872924805, "global_step": 367548, "epoch": 4428} {"train_loss": -25.993295669555664, "global_step": 367549, "epoch": 4428} {"train_loss": -26.3292236328125, "global_step": 367550, "epoch": 4428} {"train_loss": -26.170507431030273, "global_step": 367551, "epoch": 4428} {"train_loss": -26.022235870361328, "global_step": 367552, "epoch": 4428} {"train_loss": -26.168317794799805, "global_step": 367553, "epoch": 4428} {"train_loss": -26.129867553710938, "global_step": 367554, "epoch": 4428} {"train_loss": -26.36467933654785, "global_step": 367555, "epoch": 4428} {"train_loss": -26.098142623901367, "global_step": 367556, "epoch": 4428} {"train_loss": -26.530628204345703, "global_step": 367557, "epoch": 4428} {"train_loss": -26.431415557861328, "global_step": 367558, "epoch": 4428} {"train_loss": -26.404083251953125, "global_step": 367559, "epoch": 4428} {"train_loss": -26.3647518157959, "global_step": 367560, "epoch": 4428} {"train_loss": -26.4377498626709, "global_step": 367561, "epoch": 4428} {"train_loss": -26.644567489624023, "global_step": 367562, "epoch": 4428} {"train_loss": -26.1971492767334, "global_step": 367563, "epoch": 4428} {"train_loss": -26.674402236938477, "global_step": 367564, "epoch": 4428} {"train_loss": -26.2928409576416, "global_step": 367565, "epoch": 4428} {"train_loss": -26.499433517456055, "global_step": 367566, "epoch": 4428} {"train_loss": -26.38043212890625, "global_step": 367567, "epoch": 4428} {"train_loss": -26.421829223632812, "global_step": 367568, "epoch": 4428} {"train_loss": -26.38724708557129, "global_step": 367569, "epoch": 4428} {"train_loss": -26.076126098632812, "global_step": 367570, "epoch": 4428} {"train_loss": -26.44879722595215, "global_step": 367571, "epoch": 4428} {"train_loss": -26.293912887573242, "global_step": 367572, "epoch": 4428} {"train_loss": -26.550649642944336, "global_step": 367573, "epoch": 4428} {"train_loss": -26.32991600036621, "global_step": 367574, "epoch": 4428} {"train_loss": -26.114294052124023, "global_step": 367575, "epoch": 4428} {"train_loss": -26.27825927734375, "global_step": 367576, "epoch": 4428} {"train_loss": -26.549381256103516, "global_step": 367577, "epoch": 4428} {"train_loss": -26.141565322875977, "global_step": 367578, "epoch": 4428} {"train_loss": -26.3489933013916, "global_step": 367579, "epoch": 4428} {"train_loss": -26.6721248626709, "global_step": 367580, "epoch": 4428} {"train_loss": -26.373380661010742, "global_step": 367581, "epoch": 4428} {"train_loss": -26.531553268432617, "global_step": 367582, "epoch": 4428} {"train_loss": -26.1414737701416, "global_step": 367583, "epoch": 4428} {"train_loss": -26.365375518798828, "global_step": 367584, "epoch": 4428} {"train_loss": -26.544281005859375, "global_step": 367585, "epoch": 4428} {"train_loss": -26.5185546875, "global_step": 367586, "epoch": 4428} {"train_loss": -26.778287887573242, "global_step": 367587, "epoch": 4428} {"train_loss": -26.477191925048828, "global_step": 367588, "epoch": 4428} {"train_loss": -26.682083129882812, "global_step": 367589, "epoch": 4428} {"train_loss": -26.270843505859375, "global_step": 367590, "epoch": 4428} {"train_loss": -26.130361557006836, "global_step": 367591, "epoch": 4428} {"train_loss": -26.587934494018555, "global_step": 367592, "epoch": 4428} {"train_loss": -26.618879318237305, "global_step": 367593, "epoch": 4428} {"train_loss": -26.511938095092773, "global_step": 367594, "epoch": 4428} {"train_loss": -26.131855010986328, "global_step": 367595, "epoch": 4428} {"train_loss": -26.151935577392578, "global_step": 367596, "epoch": 4428} {"train_loss": -25.8721923828125, "global_step": 367597, "epoch": 4428} {"train_loss": -26.039825439453125, "global_step": 367598, "epoch": 4428} {"train_loss": -25.921987533569336, "global_step": 367599, "epoch": 4428} {"train_loss": -25.745716094970703, "global_step": 367600, "epoch": 4428} {"train_loss": -26.275022506713867, "global_step": 367601, "epoch": 4428} {"train_loss": -26.217309951782227, "global_step": 367602, "epoch": 4428} {"train_loss": -25.59130096435547, "global_step": 367603, "epoch": 4428} {"train_loss": -25.85773277282715, "global_step": 367604, "epoch": 4428} {"train_loss": -26.59168815612793, "global_step": 367605, "epoch": 4428} {"train_loss": -26.27393483541098, "global_step": 367606, "epoch": 4428, "val_loss": 6691971.0} {"train_loss": -25.543302536010742, "global_step": 367607, "epoch": 4429} {"train_loss": -25.179040908813477, "global_step": 367608, "epoch": 4429} {"train_loss": -25.39418601989746, "global_step": 367609, "epoch": 4429} {"train_loss": -25.25884246826172, "global_step": 367610, "epoch": 4429} {"train_loss": -25.833242416381836, "global_step": 367611, "epoch": 4429} {"train_loss": -25.317270278930664, "global_step": 367612, "epoch": 4429} {"train_loss": -25.633045196533203, "global_step": 367613, "epoch": 4429} {"train_loss": -25.716541290283203, "global_step": 367614, "epoch": 4429} {"train_loss": -25.949356079101562, "global_step": 367615, "epoch": 4429} {"train_loss": -25.64203453063965, "global_step": 367616, "epoch": 4429} {"train_loss": -25.870849609375, "global_step": 367617, "epoch": 4429} {"train_loss": -25.673294067382812, "global_step": 367618, "epoch": 4429} {"train_loss": -25.79866600036621, "global_step": 367619, "epoch": 4429} {"train_loss": -25.74171257019043, "global_step": 367620, "epoch": 4429} {"train_loss": -25.8535213470459, "global_step": 367621, "epoch": 4429} {"train_loss": -25.944412231445312, "global_step": 367622, "epoch": 4429} {"train_loss": -26.081750869750977, "global_step": 367623, "epoch": 4429} {"train_loss": -26.194931030273438, "global_step": 367624, "epoch": 4429} {"train_loss": -26.08424949645996, "global_step": 367625, "epoch": 4429} {"train_loss": -26.141687393188477, "global_step": 367626, "epoch": 4429} {"train_loss": -26.264211654663086, "global_step": 367627, "epoch": 4429} {"train_loss": -25.910415649414062, "global_step": 367628, "epoch": 4429} {"train_loss": -26.129098892211914, "global_step": 367629, "epoch": 4429} {"train_loss": -26.33526039123535, "global_step": 367630, "epoch": 4429} {"train_loss": -26.295785903930664, "global_step": 367631, "epoch": 4429} {"train_loss": -26.07352066040039, "global_step": 367632, "epoch": 4429} {"train_loss": -26.2835750579834, "global_step": 367633, "epoch": 4429} {"train_loss": -26.284269332885742, "global_step": 367634, "epoch": 4429} {"train_loss": -26.222700119018555, "global_step": 367635, "epoch": 4429} {"train_loss": -26.262231826782227, "global_step": 367636, "epoch": 4429} {"train_loss": -26.03765869140625, "global_step": 367637, "epoch": 4429} {"train_loss": -26.38075065612793, "global_step": 367638, "epoch": 4429} {"train_loss": -26.1539306640625, "global_step": 367639, "epoch": 4429} {"train_loss": -26.21731948852539, "global_step": 367640, "epoch": 4429} {"train_loss": -26.512182235717773, "global_step": 367641, "epoch": 4429} {"train_loss": -26.342199325561523, "global_step": 367642, "epoch": 4429} {"train_loss": -26.31781005859375, "global_step": 367643, "epoch": 4429} {"train_loss": -26.247425079345703, "global_step": 367644, "epoch": 4429} {"train_loss": -26.47757339477539, "global_step": 367645, "epoch": 4429} {"train_loss": -26.478124618530273, "global_step": 367646, "epoch": 4429} {"train_loss": -26.617456436157227, "global_step": 367647, "epoch": 4429} {"train_loss": -26.27997398376465, "global_step": 367648, "epoch": 4429} {"train_loss": -26.308774948120117, "global_step": 367649, "epoch": 4429} {"train_loss": -25.867582321166992, "global_step": 367650, "epoch": 4429} {"train_loss": -26.04871940612793, "global_step": 367651, "epoch": 4429} {"train_loss": -26.28995132446289, "global_step": 367652, "epoch": 4429} {"train_loss": -26.408935546875, "global_step": 367653, "epoch": 4429} {"train_loss": -26.05474853515625, "global_step": 367654, "epoch": 4429} {"train_loss": -26.297468185424805, "global_step": 367655, "epoch": 4429} {"train_loss": -26.29123878479004, "global_step": 367656, "epoch": 4429} {"train_loss": -26.67982292175293, "global_step": 367657, "epoch": 4429} {"train_loss": -26.40399169921875, "global_step": 367658, "epoch": 4429} {"train_loss": -26.549291610717773, "global_step": 367659, "epoch": 4429} {"train_loss": -26.343658447265625, "global_step": 367660, "epoch": 4429} {"train_loss": -26.681482315063477, "global_step": 367661, "epoch": 4429} {"train_loss": -26.303647994995117, "global_step": 367662, "epoch": 4429} {"train_loss": -26.448450088500977, "global_step": 367663, "epoch": 4429} {"train_loss": -26.58759117126465, "global_step": 367664, "epoch": 4429} {"train_loss": -26.642486572265625, "global_step": 367665, "epoch": 4429} {"train_loss": -26.85780143737793, "global_step": 367666, "epoch": 4429} {"train_loss": -26.492345809936523, "global_step": 367667, "epoch": 4429} {"train_loss": -26.396787643432617, "global_step": 367668, "epoch": 4429} {"train_loss": -26.631010055541992, "global_step": 367669, "epoch": 4429} {"train_loss": -26.622638702392578, "global_step": 367670, "epoch": 4429} {"train_loss": -26.530261993408203, "global_step": 367671, "epoch": 4429} {"train_loss": -26.296850204467773, "global_step": 367672, "epoch": 4429} {"train_loss": -26.316619873046875, "global_step": 367673, "epoch": 4429} {"train_loss": -26.831960678100586, "global_step": 367674, "epoch": 4429} {"train_loss": -26.5703067779541, "global_step": 367675, "epoch": 4429} {"train_loss": -26.549245834350586, "global_step": 367676, "epoch": 4429} {"train_loss": -26.441314697265625, "global_step": 367677, "epoch": 4429} {"train_loss": -26.543659210205078, "global_step": 367678, "epoch": 4429} {"train_loss": -26.409643173217773, "global_step": 367679, "epoch": 4429} {"train_loss": -26.22074317932129, "global_step": 367680, "epoch": 4429} {"train_loss": -26.278213500976562, "global_step": 367681, "epoch": 4429} {"train_loss": -26.79727554321289, "global_step": 367682, "epoch": 4429} {"train_loss": -26.430429458618164, "global_step": 367683, "epoch": 4429} {"train_loss": -26.442626953125, "global_step": 367684, "epoch": 4429} {"train_loss": -26.348011016845703, "global_step": 367685, "epoch": 4429} {"train_loss": -26.30633544921875, "global_step": 367686, "epoch": 4429} {"train_loss": -26.679950714111328, "global_step": 367687, "epoch": 4429} {"train_loss": -26.519866943359375, "global_step": 367688, "epoch": 4429} {"train_loss": -26.23433425627559, "global_step": 367689, "epoch": 4429, "val_loss": 6592661.5} {"train_loss": -25.622791290283203, "global_step": 367690, "epoch": 4430} {"train_loss": -24.81161880493164, "global_step": 367691, "epoch": 4430} {"train_loss": -24.568073272705078, "global_step": 367692, "epoch": 4430} {"train_loss": -25.176013946533203, "global_step": 367693, "epoch": 4430} {"train_loss": -25.054838180541992, "global_step": 367694, "epoch": 4430} {"train_loss": -24.581918716430664, "global_step": 367695, "epoch": 4430} {"train_loss": -25.531557083129883, "global_step": 367696, "epoch": 4430} {"train_loss": -25.317289352416992, "global_step": 367697, "epoch": 4430} {"train_loss": -25.898534774780273, "global_step": 367698, "epoch": 4430} {"train_loss": -25.118330001831055, "global_step": 367699, "epoch": 4430} {"train_loss": -25.92245864868164, "global_step": 367700, "epoch": 4430} {"train_loss": -25.646718978881836, "global_step": 367701, "epoch": 4430} {"train_loss": -25.157724380493164, "global_step": 367702, "epoch": 4430} {"train_loss": -25.85174560546875, "global_step": 367703, "epoch": 4430} {"train_loss": -25.368684768676758, "global_step": 367704, "epoch": 4430} {"train_loss": -25.627267837524414, "global_step": 367705, "epoch": 4430} {"train_loss": -25.860986709594727, "global_step": 367706, "epoch": 4430} {"train_loss": -25.533178329467773, "global_step": 367707, "epoch": 4430} {"train_loss": -25.86800193786621, "global_step": 367708, "epoch": 4430} {"train_loss": -25.723968505859375, "global_step": 367709, "epoch": 4430} {"train_loss": -25.985143661499023, "global_step": 367710, "epoch": 4430} {"train_loss": -25.724084854125977, "global_step": 367711, "epoch": 4430} {"train_loss": -25.723499298095703, "global_step": 367712, "epoch": 4430} {"train_loss": -25.937597274780273, "global_step": 367713, "epoch": 4430} {"train_loss": -25.71207618713379, "global_step": 367714, "epoch": 4430} {"train_loss": -25.959762573242188, "global_step": 367715, "epoch": 4430} {"train_loss": -25.952594757080078, "global_step": 367716, "epoch": 4430} {"train_loss": -26.41664695739746, "global_step": 367717, "epoch": 4430} {"train_loss": -25.939855575561523, "global_step": 367718, "epoch": 4430} {"train_loss": -26.053686141967773, "global_step": 367719, "epoch": 4430} {"train_loss": -26.081323623657227, "global_step": 367720, "epoch": 4430} {"train_loss": -26.10200309753418, "global_step": 367721, "epoch": 4430} {"train_loss": -25.86130714416504, "global_step": 367722, "epoch": 4430} {"train_loss": -26.476255416870117, "global_step": 367723, "epoch": 4430} {"train_loss": -26.52088737487793, "global_step": 367724, "epoch": 4430} {"train_loss": -26.354999542236328, "global_step": 367725, "epoch": 4430} {"train_loss": -26.1315860748291, "global_step": 367726, "epoch": 4430} {"train_loss": -26.30006980895996, "global_step": 367727, "epoch": 4430} {"train_loss": -26.56864356994629, "global_step": 367728, "epoch": 4430} {"train_loss": -26.267423629760742, "global_step": 367729, "epoch": 4430} {"train_loss": -26.391284942626953, "global_step": 367730, "epoch": 4430} {"train_loss": -26.04813003540039, "global_step": 367731, "epoch": 4430} {"train_loss": -26.485794067382812, "global_step": 367732, "epoch": 4430} {"train_loss": -26.312469482421875, "global_step": 367733, "epoch": 4430} {"train_loss": -26.640613555908203, "global_step": 367734, "epoch": 4430} {"train_loss": -26.168188095092773, "global_step": 367735, "epoch": 4430} {"train_loss": -26.693464279174805, "global_step": 367736, "epoch": 4430} {"train_loss": -27.014123916625977, "global_step": 367737, "epoch": 4430} {"train_loss": -26.500513076782227, "global_step": 367738, "epoch": 4430} {"train_loss": -26.507801055908203, "global_step": 367739, "epoch": 4430} {"train_loss": -26.096576690673828, "global_step": 367740, "epoch": 4430} {"train_loss": -26.4075927734375, "global_step": 367741, "epoch": 4430} {"train_loss": -26.24689292907715, "global_step": 367742, "epoch": 4430} {"train_loss": -26.449567794799805, "global_step": 367743, "epoch": 4430} {"train_loss": -26.419769287109375, "global_step": 367744, "epoch": 4430} {"train_loss": -26.49399185180664, "global_step": 367745, "epoch": 4430} {"train_loss": -26.32379150390625, "global_step": 367746, "epoch": 4430} {"train_loss": -26.220138549804688, "global_step": 367747, "epoch": 4430} {"train_loss": -26.409650802612305, "global_step": 367748, "epoch": 4430} {"train_loss": -26.5430850982666, "global_step": 367749, "epoch": 4430} {"train_loss": -26.552148818969727, "global_step": 367750, "epoch": 4430} {"train_loss": -26.43568992614746, "global_step": 367751, "epoch": 4430} {"train_loss": -26.112958908081055, "global_step": 367752, "epoch": 4430} {"train_loss": -26.41072654724121, "global_step": 367753, "epoch": 4430} {"train_loss": -26.204742431640625, "global_step": 367754, "epoch": 4430} {"train_loss": -26.06157875061035, "global_step": 367755, "epoch": 4430} {"train_loss": -25.325103759765625, "global_step": 367756, "epoch": 4430} {"train_loss": -25.594175338745117, "global_step": 367757, "epoch": 4430} {"train_loss": -26.338674545288086, "global_step": 367758, "epoch": 4430} {"train_loss": -25.540740966796875, "global_step": 367759, "epoch": 4430} {"train_loss": -25.75629234313965, "global_step": 367760, "epoch": 4430} {"train_loss": -25.360265731811523, "global_step": 367761, "epoch": 4430} {"train_loss": -25.531513214111328, "global_step": 367762, "epoch": 4430} {"train_loss": -25.57386589050293, "global_step": 367763, "epoch": 4430} {"train_loss": -26.149900436401367, "global_step": 367764, "epoch": 4430} {"train_loss": -25.226789474487305, "global_step": 367765, "epoch": 4430} {"train_loss": -25.958166122436523, "global_step": 367766, "epoch": 4430} {"train_loss": -26.012592315673828, "global_step": 367767, "epoch": 4430} {"train_loss": -25.774145126342773, "global_step": 367768, "epoch": 4430} {"train_loss": -25.811737060546875, "global_step": 367769, "epoch": 4430} {"train_loss": -26.07105827331543, "global_step": 367770, "epoch": 4430} {"train_loss": -26.16036033630371, "global_step": 367771, "epoch": 4430} {"train_loss": -25.966591869492127, "global_step": 367772, "epoch": 4430, "val_loss": 6715974.0} {"train_loss": -25.305612564086914, "global_step": 367773, "epoch": 4431} {"train_loss": -25.883804321289062, "global_step": 367774, "epoch": 4431} {"train_loss": -25.738178253173828, "global_step": 367775, "epoch": 4431} {"train_loss": -25.407922744750977, "global_step": 367776, "epoch": 4431} {"train_loss": -26.21180534362793, "global_step": 367777, "epoch": 4431} {"train_loss": -25.453401565551758, "global_step": 367778, "epoch": 4431} {"train_loss": -25.837644577026367, "global_step": 367779, "epoch": 4431} {"train_loss": -25.771520614624023, "global_step": 367780, "epoch": 4431} {"train_loss": -26.261795043945312, "global_step": 367781, "epoch": 4431} {"train_loss": -26.037311553955078, "global_step": 367782, "epoch": 4431} {"train_loss": -25.786962509155273, "global_step": 367783, "epoch": 4431} {"train_loss": -25.857074737548828, "global_step": 367784, "epoch": 4431} {"train_loss": -26.243783950805664, "global_step": 367785, "epoch": 4431} {"train_loss": -26.015522003173828, "global_step": 367786, "epoch": 4431} {"train_loss": -26.010236740112305, "global_step": 367787, "epoch": 4431} {"train_loss": -26.062347412109375, "global_step": 367788, "epoch": 4431} {"train_loss": -26.105520248413086, "global_step": 367789, "epoch": 4431} {"train_loss": -26.274755477905273, "global_step": 367790, "epoch": 4431} {"train_loss": -26.102619171142578, "global_step": 367791, "epoch": 4431} {"train_loss": -26.446619033813477, "global_step": 367792, "epoch": 4431} {"train_loss": -26.128515243530273, "global_step": 367793, "epoch": 4431} {"train_loss": -26.023273468017578, "global_step": 367794, "epoch": 4431} {"train_loss": -26.375946044921875, "global_step": 367795, "epoch": 4431} {"train_loss": -26.017215728759766, "global_step": 367796, "epoch": 4431} {"train_loss": -26.189558029174805, "global_step": 367797, "epoch": 4431} {"train_loss": -26.3029727935791, "global_step": 367798, "epoch": 4431} {"train_loss": -26.052448272705078, "global_step": 367799, "epoch": 4431} {"train_loss": -26.382080078125, "global_step": 367800, "epoch": 4431} {"train_loss": -26.473068237304688, "global_step": 367801, "epoch": 4431} {"train_loss": -26.2746639251709, "global_step": 367802, "epoch": 4431} {"train_loss": -25.99124526977539, "global_step": 367803, "epoch": 4431} {"train_loss": -26.695432662963867, "global_step": 367804, "epoch": 4431} {"train_loss": -26.55560302734375, "global_step": 367805, "epoch": 4431} {"train_loss": -26.317169189453125, "global_step": 367806, "epoch": 4431} {"train_loss": -26.471460342407227, "global_step": 367807, "epoch": 4431} {"train_loss": -26.39029312133789, "global_step": 367808, "epoch": 4431} {"train_loss": -26.535053253173828, "global_step": 367809, "epoch": 4431} {"train_loss": -26.829181671142578, "global_step": 367810, "epoch": 4431} {"train_loss": -26.90864372253418, "global_step": 367811, "epoch": 4431} {"train_loss": -26.587055206298828, "global_step": 367812, "epoch": 4431} {"train_loss": -26.6795654296875, "global_step": 367813, "epoch": 4431} {"train_loss": -26.57098960876465, "global_step": 367814, "epoch": 4431} {"train_loss": -26.632062911987305, "global_step": 367815, "epoch": 4431} {"train_loss": -26.518407821655273, "global_step": 367816, "epoch": 4431} {"train_loss": -26.71461296081543, "global_step": 367817, "epoch": 4431} {"train_loss": -26.256494522094727, "global_step": 367818, "epoch": 4431} {"train_loss": -26.620025634765625, "global_step": 367819, "epoch": 4431} {"train_loss": -26.585798263549805, "global_step": 367820, "epoch": 4431} {"train_loss": -26.240209579467773, "global_step": 367821, "epoch": 4431} {"train_loss": -26.462249755859375, "global_step": 367822, "epoch": 4431} {"train_loss": -26.733556747436523, "global_step": 367823, "epoch": 4431} {"train_loss": -26.853290557861328, "global_step": 367824, "epoch": 4431} {"train_loss": -25.952550888061523, "global_step": 367825, "epoch": 4431} {"train_loss": -25.793874740600586, "global_step": 367826, "epoch": 4431} {"train_loss": -25.506818771362305, "global_step": 367827, "epoch": 4431} {"train_loss": -26.293899536132812, "global_step": 367828, "epoch": 4431} {"train_loss": -26.057104110717773, "global_step": 367829, "epoch": 4431} {"train_loss": -26.353809356689453, "global_step": 367830, "epoch": 4431} {"train_loss": -26.381113052368164, "global_step": 367831, "epoch": 4431} {"train_loss": -26.431217193603516, "global_step": 367832, "epoch": 4431} {"train_loss": -26.426593780517578, "global_step": 367833, "epoch": 4431} {"train_loss": -26.094587326049805, "global_step": 367834, "epoch": 4431} {"train_loss": -25.6413516998291, "global_step": 367835, "epoch": 4431} {"train_loss": -25.948556900024414, "global_step": 367836, "epoch": 4431} {"train_loss": -26.18998146057129, "global_step": 367837, "epoch": 4431} {"train_loss": -25.912256240844727, "global_step": 367838, "epoch": 4431} {"train_loss": -25.735349655151367, "global_step": 367839, "epoch": 4431} {"train_loss": -25.942106246948242, "global_step": 367840, "epoch": 4431} {"train_loss": -26.107572555541992, "global_step": 367841, "epoch": 4431} {"train_loss": -26.118030548095703, "global_step": 367842, "epoch": 4431} {"train_loss": -25.78621482849121, "global_step": 367843, "epoch": 4431} {"train_loss": -25.60170555114746, "global_step": 367844, "epoch": 4431} {"train_loss": -26.218276977539062, "global_step": 367845, "epoch": 4431} {"train_loss": -26.044797897338867, "global_step": 367846, "epoch": 4431} {"train_loss": -26.24733543395996, "global_step": 367847, "epoch": 4431} {"train_loss": -25.975738525390625, "global_step": 367848, "epoch": 4431} {"train_loss": -26.14106559753418, "global_step": 367849, "epoch": 4431} {"train_loss": -26.06805992126465, "global_step": 367850, "epoch": 4431} {"train_loss": -26.440876007080078, "global_step": 367851, "epoch": 4431} {"train_loss": -26.213382720947266, "global_step": 367852, "epoch": 4431} {"train_loss": -26.17475700378418, "global_step": 367853, "epoch": 4431} {"train_loss": -26.260522842407227, "global_step": 367854, "epoch": 4431} {"train_loss": -26.211752075746833, "global_step": 367855, "epoch": 4431, "val_loss": 6771989.0} {"train_loss": -25.520416259765625, "global_step": 367856, "epoch": 4432} {"train_loss": -25.959081649780273, "global_step": 367857, "epoch": 4432} {"train_loss": -25.29995346069336, "global_step": 367858, "epoch": 4432} {"train_loss": -25.493444442749023, "global_step": 367859, "epoch": 4432} {"train_loss": -25.627307891845703, "global_step": 367860, "epoch": 4432} {"train_loss": -25.7260684967041, "global_step": 367861, "epoch": 4432} {"train_loss": -25.60092544555664, "global_step": 367862, "epoch": 4432} {"train_loss": -25.988784790039062, "global_step": 367863, "epoch": 4432} {"train_loss": -25.927274703979492, "global_step": 367864, "epoch": 4432} {"train_loss": -26.07958984375, "global_step": 367865, "epoch": 4432} {"train_loss": -26.26211929321289, "global_step": 367866, "epoch": 4432} {"train_loss": -26.440908432006836, "global_step": 367867, "epoch": 4432} {"train_loss": -25.963537216186523, "global_step": 367868, "epoch": 4432} {"train_loss": -26.55256462097168, "global_step": 367869, "epoch": 4432} {"train_loss": -26.033002853393555, "global_step": 367870, "epoch": 4432} {"train_loss": -26.334558486938477, "global_step": 367871, "epoch": 4432} {"train_loss": -26.307050704956055, "global_step": 367872, "epoch": 4432} {"train_loss": -26.570560455322266, "global_step": 367873, "epoch": 4432} {"train_loss": -25.967041015625, "global_step": 367874, "epoch": 4432} {"train_loss": -26.280370712280273, "global_step": 367875, "epoch": 4432} {"train_loss": -26.536029815673828, "global_step": 367876, "epoch": 4432} {"train_loss": -26.38715934753418, "global_step": 367877, "epoch": 4432} {"train_loss": -25.956939697265625, "global_step": 367878, "epoch": 4432} {"train_loss": -26.245756149291992, "global_step": 367879, "epoch": 4432} {"train_loss": -26.093399047851562, "global_step": 367880, "epoch": 4432} {"train_loss": -26.705556869506836, "global_step": 367881, "epoch": 4432} {"train_loss": -26.564489364624023, "global_step": 367882, "epoch": 4432} {"train_loss": -26.012516021728516, "global_step": 367883, "epoch": 4432} {"train_loss": -26.085372924804688, "global_step": 367884, "epoch": 4432} {"train_loss": -26.562015533447266, "global_step": 367885, "epoch": 4432} {"train_loss": -26.089712142944336, "global_step": 367886, "epoch": 4432} {"train_loss": -26.0809268951416, "global_step": 367887, "epoch": 4432} {"train_loss": -26.489999771118164, "global_step": 367888, "epoch": 4432} {"train_loss": -26.534093856811523, "global_step": 367889, "epoch": 4432} {"train_loss": -26.726892471313477, "global_step": 367890, "epoch": 4432} {"train_loss": -26.02923011779785, "global_step": 367891, "epoch": 4432} {"train_loss": -26.310888290405273, "global_step": 367892, "epoch": 4432} {"train_loss": -26.246448516845703, "global_step": 367893, "epoch": 4432} {"train_loss": -26.675500869750977, "global_step": 367894, "epoch": 4432} {"train_loss": -26.597448348999023, "global_step": 367895, "epoch": 4432} {"train_loss": -26.39869499206543, "global_step": 367896, "epoch": 4432} {"train_loss": -26.4947452545166, "global_step": 367897, "epoch": 4432} {"train_loss": -26.55926513671875, "global_step": 367898, "epoch": 4432} {"train_loss": -26.200448989868164, "global_step": 367899, "epoch": 4432} {"train_loss": -26.327014923095703, "global_step": 367900, "epoch": 4432} {"train_loss": -26.209508895874023, "global_step": 367901, "epoch": 4432} {"train_loss": -25.935840606689453, "global_step": 367902, "epoch": 4432} {"train_loss": -25.913806915283203, "global_step": 367903, "epoch": 4432} {"train_loss": -26.27743911743164, "global_step": 367904, "epoch": 4432} {"train_loss": -25.958444595336914, "global_step": 367905, "epoch": 4432} {"train_loss": -25.769611358642578, "global_step": 367906, "epoch": 4432} {"train_loss": -26.39731216430664, "global_step": 367907, "epoch": 4432} {"train_loss": -26.22930335998535, "global_step": 367908, "epoch": 4432} {"train_loss": -26.61516761779785, "global_step": 367909, "epoch": 4432} {"train_loss": -26.280134201049805, "global_step": 367910, "epoch": 4432} {"train_loss": -26.361204147338867, "global_step": 367911, "epoch": 4432} {"train_loss": -26.65540885925293, "global_step": 367912, "epoch": 4432} {"train_loss": -26.775793075561523, "global_step": 367913, "epoch": 4432} {"train_loss": -26.45450782775879, "global_step": 367914, "epoch": 4432} {"train_loss": -26.700647354125977, "global_step": 367915, "epoch": 4432} {"train_loss": -26.432287216186523, "global_step": 367916, "epoch": 4432} {"train_loss": -26.490497589111328, "global_step": 367917, "epoch": 4432} {"train_loss": -26.33640480041504, "global_step": 367918, "epoch": 4432} {"train_loss": -26.346603393554688, "global_step": 367919, "epoch": 4432} {"train_loss": -26.966419219970703, "global_step": 367920, "epoch": 4432} {"train_loss": -26.592618942260742, "global_step": 367921, "epoch": 4432} {"train_loss": -26.288532257080078, "global_step": 367922, "epoch": 4432} {"train_loss": -26.436716079711914, "global_step": 367923, "epoch": 4432} {"train_loss": -26.848907470703125, "global_step": 367924, "epoch": 4432} {"train_loss": -26.35279655456543, "global_step": 367925, "epoch": 4432} {"train_loss": -26.53668785095215, "global_step": 367926, "epoch": 4432} {"train_loss": -26.52105712890625, "global_step": 367927, "epoch": 4432} {"train_loss": -26.38849449157715, "global_step": 367928, "epoch": 4432} {"train_loss": -26.5576114654541, "global_step": 367929, "epoch": 4432} {"train_loss": -26.350561141967773, "global_step": 367930, "epoch": 4432} {"train_loss": -26.308317184448242, "global_step": 367931, "epoch": 4432} {"train_loss": -26.19305992126465, "global_step": 367932, "epoch": 4432} {"train_loss": -26.543121337890625, "global_step": 367933, "epoch": 4432} {"train_loss": -26.302783966064453, "global_step": 367934, "epoch": 4432} {"train_loss": -26.42770767211914, "global_step": 367935, "epoch": 4432} {"train_loss": -26.284818649291992, "global_step": 367936, "epoch": 4432} {"train_loss": -26.458703994750977, "global_step": 367937, "epoch": 4432} {"train_loss": -26.28416502619364, "global_step": 367938, "epoch": 4432, "val_loss": 6596941.5} {"train_loss": -26.27581214904785, "global_step": 367939, "epoch": 4433} {"train_loss": -25.96430778503418, "global_step": 367940, "epoch": 4433} {"train_loss": -25.925628662109375, "global_step": 367941, "epoch": 4433} {"train_loss": -25.99664306640625, "global_step": 367942, "epoch": 4433} {"train_loss": -25.52467155456543, "global_step": 367943, "epoch": 4433} {"train_loss": -26.147003173828125, "global_step": 367944, "epoch": 4433} {"train_loss": -26.337453842163086, "global_step": 367945, "epoch": 4433} {"train_loss": -25.758747100830078, "global_step": 367946, "epoch": 4433} {"train_loss": -26.03791618347168, "global_step": 367947, "epoch": 4433} {"train_loss": -25.690174102783203, "global_step": 367948, "epoch": 4433} {"train_loss": -25.849111557006836, "global_step": 367949, "epoch": 4433} {"train_loss": -25.83595085144043, "global_step": 367950, "epoch": 4433} {"train_loss": -25.953353881835938, "global_step": 367951, "epoch": 4433} {"train_loss": -26.052719116210938, "global_step": 367952, "epoch": 4433} {"train_loss": -26.38374137878418, "global_step": 367953, "epoch": 4433} {"train_loss": -26.21146583557129, "global_step": 367954, "epoch": 4433} {"train_loss": -26.30116081237793, "global_step": 367955, "epoch": 4433} {"train_loss": -26.2967529296875, "global_step": 367956, "epoch": 4433} {"train_loss": -26.296222686767578, "global_step": 367957, "epoch": 4433} {"train_loss": -26.443084716796875, "global_step": 367958, "epoch": 4433} {"train_loss": -26.410144805908203, "global_step": 367959, "epoch": 4433} {"train_loss": -26.40635108947754, "global_step": 367960, "epoch": 4433} {"train_loss": -26.3708438873291, "global_step": 367961, "epoch": 4433} {"train_loss": -26.603723526000977, "global_step": 367962, "epoch": 4433} {"train_loss": -26.90435218811035, "global_step": 367963, "epoch": 4433} {"train_loss": -26.510290145874023, "global_step": 367964, "epoch": 4433} {"train_loss": -26.477252960205078, "global_step": 367965, "epoch": 4433} {"train_loss": -25.999744415283203, "global_step": 367966, "epoch": 4433} {"train_loss": -26.279541015625, "global_step": 367967, "epoch": 4433} {"train_loss": -26.182971954345703, "global_step": 367968, "epoch": 4433} {"train_loss": -26.347442626953125, "global_step": 367969, "epoch": 4433} {"train_loss": -26.220495223999023, "global_step": 367970, "epoch": 4433} {"train_loss": -26.520954132080078, "global_step": 367971, "epoch": 4433} {"train_loss": -26.167221069335938, "global_step": 367972, "epoch": 4433} {"train_loss": -26.271595001220703, "global_step": 367973, "epoch": 4433} {"train_loss": -26.177160263061523, "global_step": 367974, "epoch": 4433} {"train_loss": -26.47269630432129, "global_step": 367975, "epoch": 4433} {"train_loss": -26.7759952545166, "global_step": 367976, "epoch": 4433} {"train_loss": -26.624286651611328, "global_step": 367977, "epoch": 4433} {"train_loss": -26.695804595947266, "global_step": 367978, "epoch": 4433} {"train_loss": -26.347082138061523, "global_step": 367979, "epoch": 4433} {"train_loss": -26.5993709564209, "global_step": 367980, "epoch": 4433} {"train_loss": -26.483795166015625, "global_step": 367981, "epoch": 4433} {"train_loss": -26.5325927734375, "global_step": 367982, "epoch": 4433} {"train_loss": -26.634735107421875, "global_step": 367983, "epoch": 4433} {"train_loss": -26.489776611328125, "global_step": 367984, "epoch": 4433} {"train_loss": -26.481298446655273, "global_step": 367985, "epoch": 4433} {"train_loss": -26.39678955078125, "global_step": 367986, "epoch": 4433} {"train_loss": -26.580060958862305, "global_step": 367987, "epoch": 4433} {"train_loss": -26.65607261657715, "global_step": 367988, "epoch": 4433} {"train_loss": -26.44646644592285, "global_step": 367989, "epoch": 4433} {"train_loss": -26.384296417236328, "global_step": 367990, "epoch": 4433} {"train_loss": -26.1098690032959, "global_step": 367991, "epoch": 4433} {"train_loss": -26.28993034362793, "global_step": 367992, "epoch": 4433} {"train_loss": -25.684614181518555, "global_step": 367993, "epoch": 4433} {"train_loss": -26.616626739501953, "global_step": 367994, "epoch": 4433} {"train_loss": -26.370153427124023, "global_step": 367995, "epoch": 4433} {"train_loss": -26.3586483001709, "global_step": 367996, "epoch": 4433} {"train_loss": -25.982563018798828, "global_step": 367997, "epoch": 4433} {"train_loss": -26.05921745300293, "global_step": 367998, "epoch": 4433} {"train_loss": -26.175973892211914, "global_step": 367999, "epoch": 4433} {"train_loss": -26.651416778564453, "global_step": 368000, "epoch": 4433} {"train_loss": -26.10371971130371, "global_step": 368001, "epoch": 4433} {"train_loss": -26.361988067626953, "global_step": 368002, "epoch": 4433} {"train_loss": -26.0965518951416, "global_step": 368003, "epoch": 4433} {"train_loss": -26.33245277404785, "global_step": 368004, "epoch": 4433} {"train_loss": -26.167667388916016, "global_step": 368005, "epoch": 4433} {"train_loss": -26.17555809020996, "global_step": 368006, "epoch": 4433} {"train_loss": -26.24028968811035, "global_step": 368007, "epoch": 4433} {"train_loss": -26.209354400634766, "global_step": 368008, "epoch": 4433} {"train_loss": -26.105926513671875, "global_step": 368009, "epoch": 4433} {"train_loss": -26.442411422729492, "global_step": 368010, "epoch": 4433} {"train_loss": -26.544757843017578, "global_step": 368011, "epoch": 4433} {"train_loss": -26.197309494018555, "global_step": 368012, "epoch": 4433} {"train_loss": -26.7199764251709, "global_step": 368013, "epoch": 4433} {"train_loss": -26.14485740661621, "global_step": 368014, "epoch": 4433} {"train_loss": -26.280292510986328, "global_step": 368015, "epoch": 4433} {"train_loss": -26.531452178955078, "global_step": 368016, "epoch": 4433} {"train_loss": -26.595947265625, "global_step": 368017, "epoch": 4433} {"train_loss": -26.537450790405273, "global_step": 368018, "epoch": 4433} {"train_loss": -26.582006454467773, "global_step": 368019, "epoch": 4433} {"train_loss": -26.548818588256836, "global_step": 368020, "epoch": 4433} {"train_loss": -26.308814519859222, "global_step": 368021, "epoch": 4433, "val_loss": 6671339.5} {"train_loss": -25.70467185974121, "global_step": 368022, "epoch": 4434} {"train_loss": -24.67656707763672, "global_step": 368023, "epoch": 4434} {"train_loss": -24.95123291015625, "global_step": 368024, "epoch": 4434} {"train_loss": -26.124835968017578, "global_step": 368025, "epoch": 4434} {"train_loss": -25.362241744995117, "global_step": 368026, "epoch": 4434} {"train_loss": -25.62684440612793, "global_step": 368027, "epoch": 4434} {"train_loss": -25.79372215270996, "global_step": 368028, "epoch": 4434} {"train_loss": -25.170320510864258, "global_step": 368029, "epoch": 4434} {"train_loss": -26.086050033569336, "global_step": 368030, "epoch": 4434} {"train_loss": -25.512388229370117, "global_step": 368031, "epoch": 4434} {"train_loss": -25.273395538330078, "global_step": 368032, "epoch": 4434} {"train_loss": -25.730518341064453, "global_step": 368033, "epoch": 4434} {"train_loss": -25.793628692626953, "global_step": 368034, "epoch": 4434} {"train_loss": -25.658777236938477, "global_step": 368035, "epoch": 4434} {"train_loss": -25.983198165893555, "global_step": 368036, "epoch": 4434} {"train_loss": -25.852502822875977, "global_step": 368037, "epoch": 4434} {"train_loss": -25.90424156188965, "global_step": 368038, "epoch": 4434} {"train_loss": -25.7224178314209, "global_step": 368039, "epoch": 4434} {"train_loss": -25.94146156311035, "global_step": 368040, "epoch": 4434} {"train_loss": -26.191614151000977, "global_step": 368041, "epoch": 4434} {"train_loss": -26.22144889831543, "global_step": 368042, "epoch": 4434} {"train_loss": -26.185483932495117, "global_step": 368043, "epoch": 4434} {"train_loss": -25.974088668823242, "global_step": 368044, "epoch": 4434} {"train_loss": -26.02838706970215, "global_step": 368045, "epoch": 4434} {"train_loss": -26.210636138916016, "global_step": 368046, "epoch": 4434} {"train_loss": -26.386865615844727, "global_step": 368047, "epoch": 4434} {"train_loss": -26.267292022705078, "global_step": 368048, "epoch": 4434} {"train_loss": -26.117746353149414, "global_step": 368049, "epoch": 4434} {"train_loss": -25.710012435913086, "global_step": 368050, "epoch": 4434} {"train_loss": -26.244787216186523, "global_step": 368051, "epoch": 4434} {"train_loss": -26.296594619750977, "global_step": 368052, "epoch": 4434} {"train_loss": -25.91364097595215, "global_step": 368053, "epoch": 4434} {"train_loss": -26.455230712890625, "global_step": 368054, "epoch": 4434} {"train_loss": -26.2713623046875, "global_step": 368055, "epoch": 4434} {"train_loss": -26.318716049194336, "global_step": 368056, "epoch": 4434} {"train_loss": -26.010334014892578, "global_step": 368057, "epoch": 4434} {"train_loss": -26.672760009765625, "global_step": 368058, "epoch": 4434} {"train_loss": -26.486555099487305, "global_step": 368059, "epoch": 4434} {"train_loss": -25.808425903320312, "global_step": 368060, "epoch": 4434} {"train_loss": -26.179906845092773, "global_step": 368061, "epoch": 4434} {"train_loss": -26.3572998046875, "global_step": 368062, "epoch": 4434} {"train_loss": -26.42072105407715, "global_step": 368063, "epoch": 4434} {"train_loss": -26.653217315673828, "global_step": 368064, "epoch": 4434} {"train_loss": -26.2003116607666, "global_step": 368065, "epoch": 4434} {"train_loss": -26.64950942993164, "global_step": 368066, "epoch": 4434} {"train_loss": -26.170740127563477, "global_step": 368067, "epoch": 4434} {"train_loss": -26.628173828125, "global_step": 368068, "epoch": 4434} {"train_loss": -26.5637264251709, "global_step": 368069, "epoch": 4434} {"train_loss": -26.444543838500977, "global_step": 368070, "epoch": 4434} {"train_loss": -26.461130142211914, "global_step": 368071, "epoch": 4434} {"train_loss": -26.266244888305664, "global_step": 368072, "epoch": 4434} {"train_loss": -26.611988067626953, "global_step": 368073, "epoch": 4434} {"train_loss": -26.26966667175293, "global_step": 368074, "epoch": 4434} {"train_loss": -26.593856811523438, "global_step": 368075, "epoch": 4434} {"train_loss": -26.325347900390625, "global_step": 368076, "epoch": 4434} {"train_loss": -26.318445205688477, "global_step": 368077, "epoch": 4434} {"train_loss": -26.142942428588867, "global_step": 368078, "epoch": 4434} {"train_loss": -25.915454864501953, "global_step": 368079, "epoch": 4434} {"train_loss": -26.091842651367188, "global_step": 368080, "epoch": 4434} {"train_loss": -26.331995010375977, "global_step": 368081, "epoch": 4434} {"train_loss": -26.305234909057617, "global_step": 368082, "epoch": 4434} {"train_loss": -26.58664321899414, "global_step": 368083, "epoch": 4434} {"train_loss": -26.57987403869629, "global_step": 368084, "epoch": 4434} {"train_loss": -26.485519409179688, "global_step": 368085, "epoch": 4434} {"train_loss": -26.25957679748535, "global_step": 368086, "epoch": 4434} {"train_loss": -26.78364372253418, "global_step": 368087, "epoch": 4434} {"train_loss": -26.586469650268555, "global_step": 368088, "epoch": 4434} {"train_loss": -26.527454376220703, "global_step": 368089, "epoch": 4434} {"train_loss": -26.56293296813965, "global_step": 368090, "epoch": 4434} {"train_loss": -26.660791397094727, "global_step": 368091, "epoch": 4434} {"train_loss": -26.47832679748535, "global_step": 368092, "epoch": 4434} {"train_loss": -26.542163848876953, "global_step": 368093, "epoch": 4434} {"train_loss": -26.532629013061523, "global_step": 368094, "epoch": 4434} {"train_loss": -26.607757568359375, "global_step": 368095, "epoch": 4434} {"train_loss": -27.054275512695312, "global_step": 368096, "epoch": 4434} {"train_loss": -26.51789665222168, "global_step": 368097, "epoch": 4434} {"train_loss": -26.2474308013916, "global_step": 368098, "epoch": 4434} {"train_loss": -26.495031356811523, "global_step": 368099, "epoch": 4434} {"train_loss": -26.31292152404785, "global_step": 368100, "epoch": 4434} {"train_loss": -25.943830490112305, "global_step": 368101, "epoch": 4434} {"train_loss": -26.35223388671875, "global_step": 368102, "epoch": 4434} {"train_loss": -26.24692153930664, "global_step": 368103, "epoch": 4434} {"train_loss": -26.1867882142584, "global_step": 368104, "epoch": 4434, "val_loss": 6715017.0} {"train_loss": -25.865936279296875, "global_step": 368105, "epoch": 4435} {"train_loss": -25.263134002685547, "global_step": 368106, "epoch": 4435} {"train_loss": -25.37929344177246, "global_step": 368107, "epoch": 4435} {"train_loss": -25.326406478881836, "global_step": 368108, "epoch": 4435} {"train_loss": -26.159818649291992, "global_step": 368109, "epoch": 4435} {"train_loss": -25.457483291625977, "global_step": 368110, "epoch": 4435} {"train_loss": -25.068939208984375, "global_step": 368111, "epoch": 4435} {"train_loss": -24.660825729370117, "global_step": 368112, "epoch": 4435} {"train_loss": -25.852752685546875, "global_step": 368113, "epoch": 4435} {"train_loss": -25.348569869995117, "global_step": 368114, "epoch": 4435} {"train_loss": -25.307825088500977, "global_step": 368115, "epoch": 4435} {"train_loss": -25.964292526245117, "global_step": 368116, "epoch": 4435} {"train_loss": -25.45863151550293, "global_step": 368117, "epoch": 4435} {"train_loss": -25.928205490112305, "global_step": 368118, "epoch": 4435} {"train_loss": -25.648422241210938, "global_step": 368119, "epoch": 4435} {"train_loss": -25.684467315673828, "global_step": 368120, "epoch": 4435} {"train_loss": -25.84002113342285, "global_step": 368121, "epoch": 4435} {"train_loss": -25.811542510986328, "global_step": 368122, "epoch": 4435} {"train_loss": -26.07488441467285, "global_step": 368123, "epoch": 4435} {"train_loss": -25.888385772705078, "global_step": 368124, "epoch": 4435} {"train_loss": -25.79522705078125, "global_step": 368125, "epoch": 4435} {"train_loss": -25.920028686523438, "global_step": 368126, "epoch": 4435} {"train_loss": -25.874252319335938, "global_step": 368127, "epoch": 4435} {"train_loss": -25.753433227539062, "global_step": 368128, "epoch": 4435} {"train_loss": -25.8400936126709, "global_step": 368129, "epoch": 4435} {"train_loss": -26.624433517456055, "global_step": 368130, "epoch": 4435} {"train_loss": -26.004226684570312, "global_step": 368131, "epoch": 4435} {"train_loss": -26.034717559814453, "global_step": 368132, "epoch": 4435} {"train_loss": -26.058032989501953, "global_step": 368133, "epoch": 4435} {"train_loss": -26.372802734375, "global_step": 368134, "epoch": 4435} {"train_loss": -26.23726463317871, "global_step": 368135, "epoch": 4435} {"train_loss": -26.14234733581543, "global_step": 368136, "epoch": 4435} {"train_loss": -25.994876861572266, "global_step": 368137, "epoch": 4435} {"train_loss": -26.246047973632812, "global_step": 368138, "epoch": 4435} {"train_loss": -26.38714027404785, "global_step": 368139, "epoch": 4435} {"train_loss": -26.366735458374023, "global_step": 368140, "epoch": 4435} {"train_loss": -26.42132568359375, "global_step": 368141, "epoch": 4435} {"train_loss": -25.969533920288086, "global_step": 368142, "epoch": 4435} {"train_loss": -26.206390380859375, "global_step": 368143, "epoch": 4435} {"train_loss": -26.781707763671875, "global_step": 368144, "epoch": 4435} {"train_loss": -26.123645782470703, "global_step": 368145, "epoch": 4435} {"train_loss": -26.57273292541504, "global_step": 368146, "epoch": 4435} {"train_loss": -26.61614990234375, "global_step": 368147, "epoch": 4435} {"train_loss": -26.495849609375, "global_step": 368148, "epoch": 4435} {"train_loss": -26.445966720581055, "global_step": 368149, "epoch": 4435} {"train_loss": -26.579620361328125, "global_step": 368150, "epoch": 4435} {"train_loss": -26.577178955078125, "global_step": 368151, "epoch": 4435} {"train_loss": -26.44272232055664, "global_step": 368152, "epoch": 4435} {"train_loss": -26.66663932800293, "global_step": 368153, "epoch": 4435} {"train_loss": -26.460773468017578, "global_step": 368154, "epoch": 4435} {"train_loss": -26.51031494140625, "global_step": 368155, "epoch": 4435} {"train_loss": -26.562580108642578, "global_step": 368156, "epoch": 4435} {"train_loss": -26.443679809570312, "global_step": 368157, "epoch": 4435} {"train_loss": -26.7646427154541, "global_step": 368158, "epoch": 4435} {"train_loss": -26.137115478515625, "global_step": 368159, "epoch": 4435} {"train_loss": -26.06742286682129, "global_step": 368160, "epoch": 4435} {"train_loss": -25.92011833190918, "global_step": 368161, "epoch": 4435} {"train_loss": -26.34568214416504, "global_step": 368162, "epoch": 4435} {"train_loss": -26.56879997253418, "global_step": 368163, "epoch": 4435} {"train_loss": -26.270099639892578, "global_step": 368164, "epoch": 4435} {"train_loss": -26.143024444580078, "global_step": 368165, "epoch": 4435} {"train_loss": -26.38629722595215, "global_step": 368166, "epoch": 4435} {"train_loss": -26.024246215820312, "global_step": 368167, "epoch": 4435} {"train_loss": -26.23288345336914, "global_step": 368168, "epoch": 4435} {"train_loss": -26.050031661987305, "global_step": 368169, "epoch": 4435} {"train_loss": -26.411203384399414, "global_step": 368170, "epoch": 4435} {"train_loss": -26.332239151000977, "global_step": 368171, "epoch": 4435} {"train_loss": -26.046308517456055, "global_step": 368172, "epoch": 4435} {"train_loss": -26.09124755859375, "global_step": 368173, "epoch": 4435} {"train_loss": -26.512128829956055, "global_step": 368174, "epoch": 4435} {"train_loss": -26.3530330657959, "global_step": 368175, "epoch": 4435} {"train_loss": -26.416400909423828, "global_step": 368176, "epoch": 4435} {"train_loss": -26.245649337768555, "global_step": 368177, "epoch": 4435} {"train_loss": -26.191633224487305, "global_step": 368178, "epoch": 4435} {"train_loss": -26.23935317993164, "global_step": 368179, "epoch": 4435} {"train_loss": -26.63777732849121, "global_step": 368180, "epoch": 4435} {"train_loss": -26.601490020751953, "global_step": 368181, "epoch": 4435} {"train_loss": -26.30413246154785, "global_step": 368182, "epoch": 4435} {"train_loss": -26.52349853515625, "global_step": 368183, "epoch": 4435} {"train_loss": -26.58902359008789, "global_step": 368184, "epoch": 4435} {"train_loss": -26.273090362548828, "global_step": 368185, "epoch": 4435} {"train_loss": -26.41636085510254, "global_step": 368186, "epoch": 4435} {"train_loss": -26.1387343349227, "global_step": 368187, "epoch": 4435, "val_loss": 6636057.0} {"train_loss": -25.446718215942383, "global_step": 368188, "epoch": 4436} {"train_loss": -25.569311141967773, "global_step": 368189, "epoch": 4436} {"train_loss": -25.965408325195312, "global_step": 368190, "epoch": 4436} {"train_loss": -25.7911319732666, "global_step": 368191, "epoch": 4436} {"train_loss": -25.673049926757812, "global_step": 368192, "epoch": 4436} {"train_loss": -25.712289810180664, "global_step": 368193, "epoch": 4436} {"train_loss": -26.302494049072266, "global_step": 368194, "epoch": 4436} {"train_loss": -25.827682495117188, "global_step": 368195, "epoch": 4436} {"train_loss": -26.229352951049805, "global_step": 368196, "epoch": 4436} {"train_loss": -26.000141143798828, "global_step": 368197, "epoch": 4436} {"train_loss": -25.78301429748535, "global_step": 368198, "epoch": 4436} {"train_loss": -26.336767196655273, "global_step": 368199, "epoch": 4436} {"train_loss": -26.3698673248291, "global_step": 368200, "epoch": 4436} {"train_loss": -26.063690185546875, "global_step": 368201, "epoch": 4436} {"train_loss": -26.295886993408203, "global_step": 368202, "epoch": 4436} {"train_loss": -26.031030654907227, "global_step": 368203, "epoch": 4436} {"train_loss": -26.121936798095703, "global_step": 368204, "epoch": 4436} {"train_loss": -25.937768936157227, "global_step": 368205, "epoch": 4436} {"train_loss": -26.2038516998291, "global_step": 368206, "epoch": 4436} {"train_loss": -26.51068115234375, "global_step": 368207, "epoch": 4436} {"train_loss": -26.25583267211914, "global_step": 368208, "epoch": 4436} {"train_loss": -26.4377498626709, "global_step": 368209, "epoch": 4436} {"train_loss": -26.084897994995117, "global_step": 368210, "epoch": 4436} {"train_loss": -26.4386043548584, "global_step": 368211, "epoch": 4436} {"train_loss": -26.087263107299805, "global_step": 368212, "epoch": 4436} {"train_loss": -26.25885009765625, "global_step": 368213, "epoch": 4436} {"train_loss": -26.454008102416992, "global_step": 368214, "epoch": 4436} {"train_loss": -26.237552642822266, "global_step": 368215, "epoch": 4436} {"train_loss": -26.08924674987793, "global_step": 368216, "epoch": 4436} {"train_loss": -26.04666519165039, "global_step": 368217, "epoch": 4436} {"train_loss": -26.09761619567871, "global_step": 368218, "epoch": 4436} {"train_loss": -26.244476318359375, "global_step": 368219, "epoch": 4436} {"train_loss": -26.340320587158203, "global_step": 368220, "epoch": 4436} {"train_loss": -26.242414474487305, "global_step": 368221, "epoch": 4436} {"train_loss": -26.3315372467041, "global_step": 368222, "epoch": 4436} {"train_loss": -26.438739776611328, "global_step": 368223, "epoch": 4436} {"train_loss": -26.227575302124023, "global_step": 368224, "epoch": 4436} {"train_loss": -26.703571319580078, "global_step": 368225, "epoch": 4436} {"train_loss": -26.48347282409668, "global_step": 368226, "epoch": 4436} {"train_loss": -26.49777603149414, "global_step": 368227, "epoch": 4436} {"train_loss": -26.234777450561523, "global_step": 368228, "epoch": 4436} {"train_loss": -26.732168197631836, "global_step": 368229, "epoch": 4436} {"train_loss": -26.710065841674805, "global_step": 368230, "epoch": 4436} {"train_loss": -26.420642852783203, "global_step": 368231, "epoch": 4436} {"train_loss": -26.617353439331055, "global_step": 368232, "epoch": 4436} {"train_loss": -26.789554595947266, "global_step": 368233, "epoch": 4436} {"train_loss": -26.391706466674805, "global_step": 368234, "epoch": 4436} {"train_loss": -26.41632080078125, "global_step": 368235, "epoch": 4436} {"train_loss": -26.31928062438965, "global_step": 368236, "epoch": 4436} {"train_loss": -26.250812530517578, "global_step": 368237, "epoch": 4436} {"train_loss": -26.748159408569336, "global_step": 368238, "epoch": 4436} {"train_loss": -26.782140731811523, "global_step": 368239, "epoch": 4436} {"train_loss": -26.603546142578125, "global_step": 368240, "epoch": 4436} {"train_loss": -26.50519371032715, "global_step": 368241, "epoch": 4436} {"train_loss": -26.583768844604492, "global_step": 368242, "epoch": 4436} {"train_loss": -26.619037628173828, "global_step": 368243, "epoch": 4436} {"train_loss": -26.39097023010254, "global_step": 368244, "epoch": 4436} {"train_loss": -26.718799591064453, "global_step": 368245, "epoch": 4436} {"train_loss": -26.627227783203125, "global_step": 368246, "epoch": 4436} {"train_loss": -26.846471786499023, "global_step": 368247, "epoch": 4436} {"train_loss": -26.57818603515625, "global_step": 368248, "epoch": 4436} {"train_loss": -25.93726921081543, "global_step": 368249, "epoch": 4436} {"train_loss": -25.39657974243164, "global_step": 368250, "epoch": 4436} {"train_loss": -24.655746459960938, "global_step": 368251, "epoch": 4436} {"train_loss": -25.37567138671875, "global_step": 368252, "epoch": 4436} {"train_loss": -26.171966552734375, "global_step": 368253, "epoch": 4436} {"train_loss": -25.887042999267578, "global_step": 368254, "epoch": 4436} {"train_loss": -26.160663604736328, "global_step": 368255, "epoch": 4436} {"train_loss": -26.165998458862305, "global_step": 368256, "epoch": 4436} {"train_loss": -26.347736358642578, "global_step": 368257, "epoch": 4436} {"train_loss": -26.31989097595215, "global_step": 368258, "epoch": 4436} {"train_loss": -25.95746421813965, "global_step": 368259, "epoch": 4436} {"train_loss": -25.851057052612305, "global_step": 368260, "epoch": 4436} {"train_loss": -26.10743522644043, "global_step": 368261, "epoch": 4436} {"train_loss": -26.285816192626953, "global_step": 368262, "epoch": 4436} {"train_loss": -26.22414207458496, "global_step": 368263, "epoch": 4436} {"train_loss": -26.03199577331543, "global_step": 368264, "epoch": 4436} {"train_loss": -26.15939712524414, "global_step": 368265, "epoch": 4436} {"train_loss": -26.597097396850586, "global_step": 368266, "epoch": 4436} {"train_loss": -26.05661392211914, "global_step": 368267, "epoch": 4436} {"train_loss": -26.061737060546875, "global_step": 368268, "epoch": 4436} {"train_loss": -26.218198776245117, "global_step": 368269, "epoch": 4436} {"train_loss": -26.233765705522284, "global_step": 368270, "epoch": 4436, "val_loss": 6719623.5} {"train_loss": -26.020862579345703, "global_step": 368271, "epoch": 4437} {"train_loss": -25.823644638061523, "global_step": 368272, "epoch": 4437} {"train_loss": -26.117399215698242, "global_step": 368273, "epoch": 4437} {"train_loss": -25.921783447265625, "global_step": 368274, "epoch": 4437} {"train_loss": -25.39713478088379, "global_step": 368275, "epoch": 4437} {"train_loss": -26.02887535095215, "global_step": 368276, "epoch": 4437} {"train_loss": -26.308523178100586, "global_step": 368277, "epoch": 4437} {"train_loss": -26.021820068359375, "global_step": 368278, "epoch": 4437} {"train_loss": -25.78597068786621, "global_step": 368279, "epoch": 4437} {"train_loss": -25.8203182220459, "global_step": 368280, "epoch": 4437} {"train_loss": -26.18914794921875, "global_step": 368281, "epoch": 4437} {"train_loss": -25.869617462158203, "global_step": 368282, "epoch": 4437} {"train_loss": -26.37700843811035, "global_step": 368283, "epoch": 4437} {"train_loss": -26.227109909057617, "global_step": 368284, "epoch": 4437} {"train_loss": -25.96234130859375, "global_step": 368285, "epoch": 4437} {"train_loss": -26.198740005493164, "global_step": 368286, "epoch": 4437} {"train_loss": -26.371536254882812, "global_step": 368287, "epoch": 4437} {"train_loss": -26.078317642211914, "global_step": 368288, "epoch": 4437} {"train_loss": -26.2142333984375, "global_step": 368289, "epoch": 4437} {"train_loss": -26.540130615234375, "global_step": 368290, "epoch": 4437} {"train_loss": -26.758255004882812, "global_step": 368291, "epoch": 4437} {"train_loss": -26.42291259765625, "global_step": 368292, "epoch": 4437} {"train_loss": -26.1376953125, "global_step": 368293, "epoch": 4437} {"train_loss": -25.98679542541504, "global_step": 368294, "epoch": 4437} {"train_loss": -26.184667587280273, "global_step": 368295, "epoch": 4437} {"train_loss": -26.3336181640625, "global_step": 368296, "epoch": 4437} {"train_loss": -26.4288387298584, "global_step": 368297, "epoch": 4437} {"train_loss": -26.494495391845703, "global_step": 368298, "epoch": 4437} {"train_loss": -25.978403091430664, "global_step": 368299, "epoch": 4437} {"train_loss": -26.554941177368164, "global_step": 368300, "epoch": 4437} {"train_loss": -26.579931259155273, "global_step": 368301, "epoch": 4437} {"train_loss": -26.83941078186035, "global_step": 368302, "epoch": 4437} {"train_loss": -25.89552116394043, "global_step": 368303, "epoch": 4437} {"train_loss": -26.59028434753418, "global_step": 368304, "epoch": 4437} {"train_loss": -25.949142456054688, "global_step": 368305, "epoch": 4437} {"train_loss": -26.33034324645996, "global_step": 368306, "epoch": 4437} {"train_loss": -26.254892349243164, "global_step": 368307, "epoch": 4437} {"train_loss": -26.299835205078125, "global_step": 368308, "epoch": 4437} {"train_loss": -26.169687271118164, "global_step": 368309, "epoch": 4437} {"train_loss": -26.233016967773438, "global_step": 368310, "epoch": 4437} {"train_loss": -26.61651611328125, "global_step": 368311, "epoch": 4437} {"train_loss": -26.405242919921875, "global_step": 368312, "epoch": 4437} {"train_loss": -26.137460708618164, "global_step": 368313, "epoch": 4437} {"train_loss": -26.05718994140625, "global_step": 368314, "epoch": 4437} {"train_loss": -25.897785186767578, "global_step": 368315, "epoch": 4437} {"train_loss": -26.472457885742188, "global_step": 368316, "epoch": 4437} {"train_loss": -26.131855010986328, "global_step": 368317, "epoch": 4437} {"train_loss": -26.782073974609375, "global_step": 368318, "epoch": 4437} {"train_loss": -26.575536727905273, "global_step": 368319, "epoch": 4437} {"train_loss": -26.08536720275879, "global_step": 368320, "epoch": 4437} {"train_loss": -26.234222412109375, "global_step": 368321, "epoch": 4437} {"train_loss": -26.549884796142578, "global_step": 368322, "epoch": 4437} {"train_loss": -26.490604400634766, "global_step": 368323, "epoch": 4437} {"train_loss": -26.269376754760742, "global_step": 368324, "epoch": 4437} {"train_loss": -25.7643985748291, "global_step": 368325, "epoch": 4437} {"train_loss": -26.302061080932617, "global_step": 368326, "epoch": 4437} {"train_loss": -26.125547409057617, "global_step": 368327, "epoch": 4437} {"train_loss": -26.009628295898438, "global_step": 368328, "epoch": 4437} {"train_loss": -26.189151763916016, "global_step": 368329, "epoch": 4437} {"train_loss": -26.26593589782715, "global_step": 368330, "epoch": 4437} {"train_loss": -26.581924438476562, "global_step": 368331, "epoch": 4437} {"train_loss": -26.30292320251465, "global_step": 368332, "epoch": 4437} {"train_loss": -26.298694610595703, "global_step": 368333, "epoch": 4437} {"train_loss": -26.556671142578125, "global_step": 368334, "epoch": 4437} {"train_loss": -26.43973731994629, "global_step": 368335, "epoch": 4437} {"train_loss": -26.729419708251953, "global_step": 368336, "epoch": 4437} {"train_loss": -26.564306259155273, "global_step": 368337, "epoch": 4437} {"train_loss": -26.372955322265625, "global_step": 368338, "epoch": 4437} {"train_loss": -26.4396915435791, "global_step": 368339, "epoch": 4437} {"train_loss": -26.02068519592285, "global_step": 368340, "epoch": 4437} {"train_loss": -26.498083114624023, "global_step": 368341, "epoch": 4437} {"train_loss": -26.347461700439453, "global_step": 368342, "epoch": 4437} {"train_loss": -26.3345890045166, "global_step": 368343, "epoch": 4437} {"train_loss": -26.358118057250977, "global_step": 368344, "epoch": 4437} {"train_loss": -26.53302001953125, "global_step": 368345, "epoch": 4437} {"train_loss": -26.458251953125, "global_step": 368346, "epoch": 4437} {"train_loss": -26.278858184814453, "global_step": 368347, "epoch": 4437} {"train_loss": -26.51169204711914, "global_step": 368348, "epoch": 4437} {"train_loss": -26.621490478515625, "global_step": 368349, "epoch": 4437} {"train_loss": -26.473236083984375, "global_step": 368350, "epoch": 4437} {"train_loss": -26.531940460205078, "global_step": 368351, "epoch": 4437} {"train_loss": -26.575342178344727, "global_step": 368352, "epoch": 4437} {"train_loss": -26.280159134462654, "global_step": 368353, "epoch": 4437, "val_loss": 6663289.5} {"train_loss": -26.34380531311035, "global_step": 368354, "epoch": 4438} {"train_loss": -25.292110443115234, "global_step": 368355, "epoch": 4438} {"train_loss": -25.08819580078125, "global_step": 368356, "epoch": 4438} {"train_loss": -25.491445541381836, "global_step": 368357, "epoch": 4438} {"train_loss": -26.175092697143555, "global_step": 368358, "epoch": 4438} {"train_loss": -25.46221351623535, "global_step": 368359, "epoch": 4438} {"train_loss": -25.86213493347168, "global_step": 368360, "epoch": 4438} {"train_loss": -26.43537712097168, "global_step": 368361, "epoch": 4438} {"train_loss": -26.102951049804688, "global_step": 368362, "epoch": 4438} {"train_loss": -26.234588623046875, "global_step": 368363, "epoch": 4438} {"train_loss": -26.196699142456055, "global_step": 368364, "epoch": 4438} {"train_loss": -26.254653930664062, "global_step": 368365, "epoch": 4438} {"train_loss": -26.334836959838867, "global_step": 368366, "epoch": 4438} {"train_loss": -26.034168243408203, "global_step": 368367, "epoch": 4438} {"train_loss": -25.809431076049805, "global_step": 368368, "epoch": 4438} {"train_loss": -25.970239639282227, "global_step": 368369, "epoch": 4438} {"train_loss": -26.02880859375, "global_step": 368370, "epoch": 4438} {"train_loss": -26.202392578125, "global_step": 368371, "epoch": 4438} {"train_loss": -26.409475326538086, "global_step": 368372, "epoch": 4438} {"train_loss": -26.072437286376953, "global_step": 368373, "epoch": 4438} {"train_loss": -26.428762435913086, "global_step": 368374, "epoch": 4438} {"train_loss": -26.173023223876953, "global_step": 368375, "epoch": 4438} {"train_loss": -26.318683624267578, "global_step": 368376, "epoch": 4438} {"train_loss": -26.10096549987793, "global_step": 368377, "epoch": 4438} {"train_loss": -26.01474952697754, "global_step": 368378, "epoch": 4438} {"train_loss": -26.554035186767578, "global_step": 368379, "epoch": 4438} {"train_loss": -26.222471237182617, "global_step": 368380, "epoch": 4438} {"train_loss": -26.14592933654785, "global_step": 368381, "epoch": 4438} {"train_loss": -26.299924850463867, "global_step": 368382, "epoch": 4438} {"train_loss": -26.5283260345459, "global_step": 368383, "epoch": 4438} {"train_loss": -26.431598663330078, "global_step": 368384, "epoch": 4438} {"train_loss": -25.9765682220459, "global_step": 368385, "epoch": 4438} {"train_loss": -26.545255661010742, "global_step": 368386, "epoch": 4438} {"train_loss": -26.39350700378418, "global_step": 368387, "epoch": 4438} {"train_loss": -26.27056884765625, "global_step": 368388, "epoch": 4438} {"train_loss": -26.41220474243164, "global_step": 368389, "epoch": 4438} {"train_loss": -26.479101181030273, "global_step": 368390, "epoch": 4438} {"train_loss": -26.408782958984375, "global_step": 368391, "epoch": 4438} {"train_loss": -26.835906982421875, "global_step": 368392, "epoch": 4438} {"train_loss": -26.275924682617188, "global_step": 368393, "epoch": 4438} {"train_loss": -26.357873916625977, "global_step": 368394, "epoch": 4438} {"train_loss": -26.454742431640625, "global_step": 368395, "epoch": 4438} {"train_loss": -26.434534072875977, "global_step": 368396, "epoch": 4438} {"train_loss": -26.486845016479492, "global_step": 368397, "epoch": 4438} {"train_loss": -26.216718673706055, "global_step": 368398, "epoch": 4438} {"train_loss": -26.534597396850586, "global_step": 368399, "epoch": 4438} {"train_loss": -26.393142700195312, "global_step": 368400, "epoch": 4438} {"train_loss": -26.258020401000977, "global_step": 368401, "epoch": 4438} {"train_loss": -26.382064819335938, "global_step": 368402, "epoch": 4438} {"train_loss": -26.956100463867188, "global_step": 368403, "epoch": 4438} {"train_loss": -26.58868980407715, "global_step": 368404, "epoch": 4438} {"train_loss": -26.621816635131836, "global_step": 368405, "epoch": 4438} {"train_loss": -26.690698623657227, "global_step": 368406, "epoch": 4438} {"train_loss": -26.644983291625977, "global_step": 368407, "epoch": 4438} {"train_loss": -26.534326553344727, "global_step": 368408, "epoch": 4438} {"train_loss": -26.255090713500977, "global_step": 368409, "epoch": 4438} {"train_loss": -26.18825340270996, "global_step": 368410, "epoch": 4438} {"train_loss": -25.798669815063477, "global_step": 368411, "epoch": 4438} {"train_loss": -25.511795043945312, "global_step": 368412, "epoch": 4438} {"train_loss": -24.938413619995117, "global_step": 368413, "epoch": 4438} {"train_loss": -25.617956161499023, "global_step": 368414, "epoch": 4438} {"train_loss": -25.584178924560547, "global_step": 368415, "epoch": 4438} {"train_loss": -26.061010360717773, "global_step": 368416, "epoch": 4438} {"train_loss": -25.792160034179688, "global_step": 368417, "epoch": 4438} {"train_loss": -25.990026473999023, "global_step": 368418, "epoch": 4438} {"train_loss": -25.783018112182617, "global_step": 368419, "epoch": 4438} {"train_loss": -26.074066162109375, "global_step": 368420, "epoch": 4438} {"train_loss": -26.14185905456543, "global_step": 368421, "epoch": 4438} {"train_loss": -26.204931259155273, "global_step": 368422, "epoch": 4438} {"train_loss": -25.91651725769043, "global_step": 368423, "epoch": 4438} {"train_loss": -25.951013565063477, "global_step": 368424, "epoch": 4438} {"train_loss": -25.87998390197754, "global_step": 368425, "epoch": 4438} {"train_loss": -26.2734432220459, "global_step": 368426, "epoch": 4438} {"train_loss": -26.273595809936523, "global_step": 368427, "epoch": 4438} {"train_loss": -26.08365249633789, "global_step": 368428, "epoch": 4438} {"train_loss": -26.170276641845703, "global_step": 368429, "epoch": 4438} {"train_loss": -26.189477920532227, "global_step": 368430, "epoch": 4438} {"train_loss": -26.48282814025879, "global_step": 368431, "epoch": 4438} {"train_loss": -26.583240509033203, "global_step": 368432, "epoch": 4438} {"train_loss": -26.186513900756836, "global_step": 368433, "epoch": 4438} {"train_loss": -26.002155303955078, "global_step": 368434, "epoch": 4438} {"train_loss": -26.03924560546875, "global_step": 368435, "epoch": 4438} {"train_loss": -26.17398636599621, "global_step": 368436, "epoch": 4438, "val_loss": 6588847.0} {"train_loss": -25.848163604736328, "global_step": 368437, "epoch": 4439} {"train_loss": -25.493314743041992, "global_step": 368438, "epoch": 4439} {"train_loss": -26.003631591796875, "global_step": 368439, "epoch": 4439} {"train_loss": -25.857084274291992, "global_step": 368440, "epoch": 4439} {"train_loss": -26.115015029907227, "global_step": 368441, "epoch": 4439} {"train_loss": -25.854969024658203, "global_step": 368442, "epoch": 4439} {"train_loss": -26.171201705932617, "global_step": 368443, "epoch": 4439} {"train_loss": -25.958337783813477, "global_step": 368444, "epoch": 4439} {"train_loss": -26.239608764648438, "global_step": 368445, "epoch": 4439} {"train_loss": -26.451608657836914, "global_step": 368446, "epoch": 4439} {"train_loss": -25.95041275024414, "global_step": 368447, "epoch": 4439} {"train_loss": -26.274396896362305, "global_step": 368448, "epoch": 4439} {"train_loss": -26.336505889892578, "global_step": 368449, "epoch": 4439} {"train_loss": -26.706439971923828, "global_step": 368450, "epoch": 4439} {"train_loss": -26.1715030670166, "global_step": 368451, "epoch": 4439} {"train_loss": -26.655338287353516, "global_step": 368452, "epoch": 4439} {"train_loss": -26.460824966430664, "global_step": 368453, "epoch": 4439} {"train_loss": -26.435333251953125, "global_step": 368454, "epoch": 4439} {"train_loss": -26.143518447875977, "global_step": 368455, "epoch": 4439} {"train_loss": -26.441577911376953, "global_step": 368456, "epoch": 4439} {"train_loss": -26.254837036132812, "global_step": 368457, "epoch": 4439} {"train_loss": -26.50239372253418, "global_step": 368458, "epoch": 4439} {"train_loss": -26.424259185791016, "global_step": 368459, "epoch": 4439} {"train_loss": -26.300830841064453, "global_step": 368460, "epoch": 4439} {"train_loss": -26.117467880249023, "global_step": 368461, "epoch": 4439} {"train_loss": -26.514806747436523, "global_step": 368462, "epoch": 4439} {"train_loss": -26.50732421875, "global_step": 368463, "epoch": 4439} {"train_loss": -26.41672706604004, "global_step": 368464, "epoch": 4439} {"train_loss": -26.5766658782959, "global_step": 368465, "epoch": 4439} {"train_loss": -26.10261344909668, "global_step": 368466, "epoch": 4439} {"train_loss": -26.642221450805664, "global_step": 368467, "epoch": 4439} {"train_loss": -26.325443267822266, "global_step": 368468, "epoch": 4439} {"train_loss": -26.478046417236328, "global_step": 368469, "epoch": 4439} {"train_loss": -26.45258140563965, "global_step": 368470, "epoch": 4439} {"train_loss": -26.47216796875, "global_step": 368471, "epoch": 4439} {"train_loss": -26.698766708374023, "global_step": 368472, "epoch": 4439} {"train_loss": -26.358917236328125, "global_step": 368473, "epoch": 4439} {"train_loss": -26.391498565673828, "global_step": 368474, "epoch": 4439} {"train_loss": -26.30879020690918, "global_step": 368475, "epoch": 4439} {"train_loss": -26.342031478881836, "global_step": 368476, "epoch": 4439} {"train_loss": -26.33513832092285, "global_step": 368477, "epoch": 4439} {"train_loss": -26.6195011138916, "global_step": 368478, "epoch": 4439} {"train_loss": -26.7952880859375, "global_step": 368479, "epoch": 4439} {"train_loss": -26.437726974487305, "global_step": 368480, "epoch": 4439} {"train_loss": -26.411787033081055, "global_step": 368481, "epoch": 4439} {"train_loss": -26.717254638671875, "global_step": 368482, "epoch": 4439} {"train_loss": -26.27703857421875, "global_step": 368483, "epoch": 4439} {"train_loss": -26.343536376953125, "global_step": 368484, "epoch": 4439} {"train_loss": -26.38239097595215, "global_step": 368485, "epoch": 4439} {"train_loss": -26.039306640625, "global_step": 368486, "epoch": 4439} {"train_loss": -25.94869041442871, "global_step": 368487, "epoch": 4439} {"train_loss": -25.82073402404785, "global_step": 368488, "epoch": 4439} {"train_loss": -26.1529598236084, "global_step": 368489, "epoch": 4439} {"train_loss": -26.188217163085938, "global_step": 368490, "epoch": 4439} {"train_loss": -25.966535568237305, "global_step": 368491, "epoch": 4439} {"train_loss": -26.126569747924805, "global_step": 368492, "epoch": 4439} {"train_loss": -26.4732666015625, "global_step": 368493, "epoch": 4439} {"train_loss": -25.993408203125, "global_step": 368494, "epoch": 4439} {"train_loss": -25.9398193359375, "global_step": 368495, "epoch": 4439} {"train_loss": -26.442651748657227, "global_step": 368496, "epoch": 4439} {"train_loss": -26.114953994750977, "global_step": 368497, "epoch": 4439} {"train_loss": -26.31251335144043, "global_step": 368498, "epoch": 4439} {"train_loss": -26.067554473876953, "global_step": 368499, "epoch": 4439} {"train_loss": -26.159687042236328, "global_step": 368500, "epoch": 4439} {"train_loss": -26.50982093811035, "global_step": 368501, "epoch": 4439} {"train_loss": -26.041101455688477, "global_step": 368502, "epoch": 4439} {"train_loss": -26.155506134033203, "global_step": 368503, "epoch": 4439} {"train_loss": -26.601770401000977, "global_step": 368504, "epoch": 4439} {"train_loss": -26.32211685180664, "global_step": 368505, "epoch": 4439} {"train_loss": -26.24308204650879, "global_step": 368506, "epoch": 4439} {"train_loss": -26.07761573791504, "global_step": 368507, "epoch": 4439} {"train_loss": -26.37057876586914, "global_step": 368508, "epoch": 4439} {"train_loss": -26.470809936523438, "global_step": 368509, "epoch": 4439} {"train_loss": -26.1895694732666, "global_step": 368510, "epoch": 4439} {"train_loss": -26.0611629486084, "global_step": 368511, "epoch": 4439} {"train_loss": -26.152423858642578, "global_step": 368512, "epoch": 4439} {"train_loss": -26.5286808013916, "global_step": 368513, "epoch": 4439} {"train_loss": -26.21295738220215, "global_step": 368514, "epoch": 4439} {"train_loss": -26.731521606445312, "global_step": 368515, "epoch": 4439} {"train_loss": -26.4093074798584, "global_step": 368516, "epoch": 4439} {"train_loss": -25.98404312133789, "global_step": 368517, "epoch": 4439} {"train_loss": -26.35529899597168, "global_step": 368518, "epoch": 4439} {"train_loss": -26.281689080847315, "global_step": 368519, "epoch": 4439, "val_loss": 6598725.0} {"train_loss": -25.971750259399414, "global_step": 368520, "epoch": 4440} {"train_loss": -25.715734481811523, "global_step": 368521, "epoch": 4440} {"train_loss": -26.10154151916504, "global_step": 368522, "epoch": 4440} {"train_loss": -25.886457443237305, "global_step": 368523, "epoch": 4440} {"train_loss": -26.056589126586914, "global_step": 368524, "epoch": 4440} {"train_loss": -26.240320205688477, "global_step": 368525, "epoch": 4440} {"train_loss": -25.998300552368164, "global_step": 368526, "epoch": 4440} {"train_loss": -25.90947914123535, "global_step": 368527, "epoch": 4440} {"train_loss": -26.251977920532227, "global_step": 368528, "epoch": 4440} {"train_loss": -25.895105361938477, "global_step": 368529, "epoch": 4440} {"train_loss": -26.160125732421875, "global_step": 368530, "epoch": 4440} {"train_loss": -26.407583236694336, "global_step": 368531, "epoch": 4440} {"train_loss": -26.081403732299805, "global_step": 368532, "epoch": 4440} {"train_loss": -25.80560874938965, "global_step": 368533, "epoch": 4440} {"train_loss": -25.927274703979492, "global_step": 368534, "epoch": 4440} {"train_loss": -26.107349395751953, "global_step": 368535, "epoch": 4440} {"train_loss": -25.95594596862793, "global_step": 368536, "epoch": 4440} {"train_loss": -25.818593978881836, "global_step": 368537, "epoch": 4440} {"train_loss": -26.19744873046875, "global_step": 368538, "epoch": 4440} {"train_loss": -26.4583740234375, "global_step": 368539, "epoch": 4440} {"train_loss": -26.22901725769043, "global_step": 368540, "epoch": 4440} {"train_loss": -26.151351928710938, "global_step": 368541, "epoch": 4440} {"train_loss": -26.091724395751953, "global_step": 368542, "epoch": 4440} {"train_loss": -25.97599220275879, "global_step": 368543, "epoch": 4440} {"train_loss": -26.32745933532715, "global_step": 368544, "epoch": 4440} {"train_loss": -26.375158309936523, "global_step": 368545, "epoch": 4440} {"train_loss": -26.06471061706543, "global_step": 368546, "epoch": 4440} {"train_loss": -26.2838077545166, "global_step": 368547, "epoch": 4440} {"train_loss": -26.244037628173828, "global_step": 368548, "epoch": 4440} {"train_loss": -26.164016723632812, "global_step": 368549, "epoch": 4440} {"train_loss": -26.284433364868164, "global_step": 368550, "epoch": 4440} {"train_loss": -25.781665802001953, "global_step": 368551, "epoch": 4440} {"train_loss": -26.364404678344727, "global_step": 368552, "epoch": 4440} {"train_loss": -26.287555694580078, "global_step": 368553, "epoch": 4440} {"train_loss": -26.40500831604004, "global_step": 368554, "epoch": 4440} {"train_loss": -26.381488800048828, "global_step": 368555, "epoch": 4440} {"train_loss": -26.055591583251953, "global_step": 368556, "epoch": 4440} {"train_loss": -26.50774574279785, "global_step": 368557, "epoch": 4440} {"train_loss": -26.529027938842773, "global_step": 368558, "epoch": 4440} {"train_loss": -26.23324966430664, "global_step": 368559, "epoch": 4440} {"train_loss": -26.68488121032715, "global_step": 368560, "epoch": 4440} {"train_loss": -26.04859733581543, "global_step": 368561, "epoch": 4440} {"train_loss": -26.647052764892578, "global_step": 368562, "epoch": 4440} {"train_loss": -26.502878189086914, "global_step": 368563, "epoch": 4440} {"train_loss": -26.51388931274414, "global_step": 368564, "epoch": 4440} {"train_loss": -26.5756893157959, "global_step": 368565, "epoch": 4440} {"train_loss": -26.61170768737793, "global_step": 368566, "epoch": 4440} {"train_loss": -26.53377342224121, "global_step": 368567, "epoch": 4440} {"train_loss": -26.45210838317871, "global_step": 368568, "epoch": 4440} {"train_loss": -26.2323055267334, "global_step": 368569, "epoch": 4440} {"train_loss": -26.471418380737305, "global_step": 368570, "epoch": 4440} {"train_loss": -26.4512996673584, "global_step": 368571, "epoch": 4440} {"train_loss": -26.54364013671875, "global_step": 368572, "epoch": 4440} {"train_loss": -26.41680908203125, "global_step": 368573, "epoch": 4440} {"train_loss": -26.139373779296875, "global_step": 368574, "epoch": 4440} {"train_loss": -26.693988800048828, "global_step": 368575, "epoch": 4440} {"train_loss": -26.182743072509766, "global_step": 368576, "epoch": 4440} {"train_loss": -26.30194664001465, "global_step": 368577, "epoch": 4440} {"train_loss": -26.7852783203125, "global_step": 368578, "epoch": 4440} {"train_loss": -26.22981834411621, "global_step": 368579, "epoch": 4440} {"train_loss": -26.082630157470703, "global_step": 368580, "epoch": 4440} {"train_loss": -25.955591201782227, "global_step": 368581, "epoch": 4440} {"train_loss": -26.538177490234375, "global_step": 368582, "epoch": 4440} {"train_loss": -26.1956844329834, "global_step": 368583, "epoch": 4440} {"train_loss": -26.364988327026367, "global_step": 368584, "epoch": 4440} {"train_loss": -25.92848014831543, "global_step": 368585, "epoch": 4440} {"train_loss": -26.11771011352539, "global_step": 368586, "epoch": 4440} {"train_loss": -26.421722412109375, "global_step": 368587, "epoch": 4440} {"train_loss": -26.458026885986328, "global_step": 368588, "epoch": 4440} {"train_loss": -26.463476181030273, "global_step": 368589, "epoch": 4440} {"train_loss": -26.2385311126709, "global_step": 368590, "epoch": 4440} {"train_loss": -26.3649959564209, "global_step": 368591, "epoch": 4440} {"train_loss": -26.7929630279541, "global_step": 368592, "epoch": 4440} {"train_loss": -26.36578369140625, "global_step": 368593, "epoch": 4440} {"train_loss": -26.13018798828125, "global_step": 368594, "epoch": 4440} {"train_loss": -26.400684356689453, "global_step": 368595, "epoch": 4440} {"train_loss": -26.506591796875, "global_step": 368596, "epoch": 4440} {"train_loss": -25.858123779296875, "global_step": 368597, "epoch": 4440} {"train_loss": -26.2713623046875, "global_step": 368598, "epoch": 4440} {"train_loss": -26.34502601623535, "global_step": 368599, "epoch": 4440} {"train_loss": -26.4705867767334, "global_step": 368600, "epoch": 4440} {"train_loss": -26.214502334594727, "global_step": 368601, "epoch": 4440} {"train_loss": -26.259814963283308, "global_step": 368602, "epoch": 4440, "val_loss": 6686147.0} {"train_loss": -25.977828979492188, "global_step": 368603, "epoch": 4441} {"train_loss": -25.98721694946289, "global_step": 368604, "epoch": 4441} {"train_loss": -25.9102725982666, "global_step": 368605, "epoch": 4441} {"train_loss": -25.6658935546875, "global_step": 368606, "epoch": 4441} {"train_loss": -26.022403717041016, "global_step": 368607, "epoch": 4441} {"train_loss": -26.117374420166016, "global_step": 368608, "epoch": 4441} {"train_loss": -26.01318359375, "global_step": 368609, "epoch": 4441} {"train_loss": -25.822906494140625, "global_step": 368610, "epoch": 4441} {"train_loss": -25.998157501220703, "global_step": 368611, "epoch": 4441} {"train_loss": -25.654638290405273, "global_step": 368612, "epoch": 4441} {"train_loss": -26.43405532836914, "global_step": 368613, "epoch": 4441} {"train_loss": -26.084247589111328, "global_step": 368614, "epoch": 4441} {"train_loss": -25.997516632080078, "global_step": 368615, "epoch": 4441} {"train_loss": -26.02414321899414, "global_step": 368616, "epoch": 4441} {"train_loss": -26.185516357421875, "global_step": 368617, "epoch": 4441} {"train_loss": -26.357654571533203, "global_step": 368618, "epoch": 4441} {"train_loss": -26.0775089263916, "global_step": 368619, "epoch": 4441} {"train_loss": -26.54334831237793, "global_step": 368620, "epoch": 4441} {"train_loss": -26.05299949645996, "global_step": 368621, "epoch": 4441} {"train_loss": -26.259458541870117, "global_step": 368622, "epoch": 4441} {"train_loss": -26.27967643737793, "global_step": 368623, "epoch": 4441} {"train_loss": -26.492401123046875, "global_step": 368624, "epoch": 4441} {"train_loss": -26.45123863220215, "global_step": 368625, "epoch": 4441} {"train_loss": -26.359235763549805, "global_step": 368626, "epoch": 4441} {"train_loss": -26.070388793945312, "global_step": 368627, "epoch": 4441} {"train_loss": -26.029632568359375, "global_step": 368628, "epoch": 4441} {"train_loss": -26.225378036499023, "global_step": 368629, "epoch": 4441} {"train_loss": -26.374164581298828, "global_step": 368630, "epoch": 4441} {"train_loss": -26.347919464111328, "global_step": 368631, "epoch": 4441} {"train_loss": -26.483509063720703, "global_step": 368632, "epoch": 4441} {"train_loss": -26.494770050048828, "global_step": 368633, "epoch": 4441} {"train_loss": -26.39313316345215, "global_step": 368634, "epoch": 4441} {"train_loss": -26.18977165222168, "global_step": 368635, "epoch": 4441} {"train_loss": -26.456586837768555, "global_step": 368636, "epoch": 4441} {"train_loss": -26.321081161499023, "global_step": 368637, "epoch": 4441} {"train_loss": -26.276660919189453, "global_step": 368638, "epoch": 4441} {"train_loss": -26.146833419799805, "global_step": 368639, "epoch": 4441} {"train_loss": -26.142301559448242, "global_step": 368640, "epoch": 4441} {"train_loss": -26.4561710357666, "global_step": 368641, "epoch": 4441} {"train_loss": -26.12653160095215, "global_step": 368642, "epoch": 4441} {"train_loss": -26.322956085205078, "global_step": 368643, "epoch": 4441} {"train_loss": -26.226926803588867, "global_step": 368644, "epoch": 4441} {"train_loss": -26.546674728393555, "global_step": 368645, "epoch": 4441} {"train_loss": -26.181476593017578, "global_step": 368646, "epoch": 4441} {"train_loss": -26.482202529907227, "global_step": 368647, "epoch": 4441} {"train_loss": -26.4132080078125, "global_step": 368648, "epoch": 4441} {"train_loss": -26.75553321838379, "global_step": 368649, "epoch": 4441} {"train_loss": -26.497329711914062, "global_step": 368650, "epoch": 4441} {"train_loss": -26.52703285217285, "global_step": 368651, "epoch": 4441} {"train_loss": -26.361526489257812, "global_step": 368652, "epoch": 4441} {"train_loss": -26.639734268188477, "global_step": 368653, "epoch": 4441} {"train_loss": -26.426237106323242, "global_step": 368654, "epoch": 4441} {"train_loss": -26.203588485717773, "global_step": 368655, "epoch": 4441} {"train_loss": -26.55244255065918, "global_step": 368656, "epoch": 4441} {"train_loss": -26.643354415893555, "global_step": 368657, "epoch": 4441} {"train_loss": -25.75709342956543, "global_step": 368658, "epoch": 4441} {"train_loss": -25.90858268737793, "global_step": 368659, "epoch": 4441} {"train_loss": -25.628400802612305, "global_step": 368660, "epoch": 4441} {"train_loss": -26.147693634033203, "global_step": 368661, "epoch": 4441} {"train_loss": -26.01420021057129, "global_step": 368662, "epoch": 4441} {"train_loss": -26.250776290893555, "global_step": 368663, "epoch": 4441} {"train_loss": -26.183069229125977, "global_step": 368664, "epoch": 4441} {"train_loss": -26.12479591369629, "global_step": 368665, "epoch": 4441} {"train_loss": -25.92816734313965, "global_step": 368666, "epoch": 4441} {"train_loss": -26.50445556640625, "global_step": 368667, "epoch": 4441} {"train_loss": -26.128381729125977, "global_step": 368668, "epoch": 4441} {"train_loss": -25.818944931030273, "global_step": 368669, "epoch": 4441} {"train_loss": -25.73691177368164, "global_step": 368670, "epoch": 4441} {"train_loss": -25.834142684936523, "global_step": 368671, "epoch": 4441} {"train_loss": -26.032331466674805, "global_step": 368672, "epoch": 4441} {"train_loss": -26.1766300201416, "global_step": 368673, "epoch": 4441} {"train_loss": -25.781829833984375, "global_step": 368674, "epoch": 4441} {"train_loss": -25.945697784423828, "global_step": 368675, "epoch": 4441} {"train_loss": -26.46683692932129, "global_step": 368676, "epoch": 4441} {"train_loss": -25.771259307861328, "global_step": 368677, "epoch": 4441} {"train_loss": -26.450326919555664, "global_step": 368678, "epoch": 4441} {"train_loss": -25.970483779907227, "global_step": 368679, "epoch": 4441} {"train_loss": -26.189504623413086, "global_step": 368680, "epoch": 4441} {"train_loss": -25.956256866455078, "global_step": 368681, "epoch": 4441} {"train_loss": -26.220905303955078, "global_step": 368682, "epoch": 4441} {"train_loss": -26.270681381225586, "global_step": 368683, "epoch": 4441} {"train_loss": -26.651159286499023, "global_step": 368684, "epoch": 4441} {"train_loss": -26.202810517276625, "global_step": 368685, "epoch": 4441, "val_loss": 6663889.0} {"train_loss": -25.8913516998291, "global_step": 368686, "epoch": 4442} {"train_loss": -26.230224609375, "global_step": 368687, "epoch": 4442} {"train_loss": -25.834440231323242, "global_step": 368688, "epoch": 4442} {"train_loss": -25.976551055908203, "global_step": 368689, "epoch": 4442} {"train_loss": -25.774768829345703, "global_step": 368690, "epoch": 4442} {"train_loss": -26.004552841186523, "global_step": 368691, "epoch": 4442} {"train_loss": -26.136951446533203, "global_step": 368692, "epoch": 4442} {"train_loss": -26.384668350219727, "global_step": 368693, "epoch": 4442} {"train_loss": -26.2451229095459, "global_step": 368694, "epoch": 4442} {"train_loss": -26.066274642944336, "global_step": 368695, "epoch": 4442} {"train_loss": -25.825265884399414, "global_step": 368696, "epoch": 4442} {"train_loss": -26.294408798217773, "global_step": 368697, "epoch": 4442} {"train_loss": -26.121753692626953, "global_step": 368698, "epoch": 4442} {"train_loss": -26.387720108032227, "global_step": 368699, "epoch": 4442} {"train_loss": -25.894561767578125, "global_step": 368700, "epoch": 4442} {"train_loss": -26.007160186767578, "global_step": 368701, "epoch": 4442} {"train_loss": -25.94709587097168, "global_step": 368702, "epoch": 4442} {"train_loss": -26.473371505737305, "global_step": 368703, "epoch": 4442} {"train_loss": -26.6053466796875, "global_step": 368704, "epoch": 4442} {"train_loss": -26.54078483581543, "global_step": 368705, "epoch": 4442} {"train_loss": -26.220993041992188, "global_step": 368706, "epoch": 4442} {"train_loss": -26.27216148376465, "global_step": 368707, "epoch": 4442} {"train_loss": -26.2567195892334, "global_step": 368708, "epoch": 4442} {"train_loss": -26.351104736328125, "global_step": 368709, "epoch": 4442} {"train_loss": -26.462299346923828, "global_step": 368710, "epoch": 4442} {"train_loss": -26.27387809753418, "global_step": 368711, "epoch": 4442} {"train_loss": -26.144424438476562, "global_step": 368712, "epoch": 4442} {"train_loss": -26.37847900390625, "global_step": 368713, "epoch": 4442} {"train_loss": -26.339948654174805, "global_step": 368714, "epoch": 4442} {"train_loss": -26.577655792236328, "global_step": 368715, "epoch": 4442} {"train_loss": -26.62501335144043, "global_step": 368716, "epoch": 4442} {"train_loss": -26.363819122314453, "global_step": 368717, "epoch": 4442} {"train_loss": -26.510944366455078, "global_step": 368718, "epoch": 4442} {"train_loss": -26.27979850769043, "global_step": 368719, "epoch": 4442} {"train_loss": -26.291385650634766, "global_step": 368720, "epoch": 4442} {"train_loss": -26.43105125427246, "global_step": 368721, "epoch": 4442} {"train_loss": -26.094533920288086, "global_step": 368722, "epoch": 4442} {"train_loss": -26.107099533081055, "global_step": 368723, "epoch": 4442} {"train_loss": -26.543630599975586, "global_step": 368724, "epoch": 4442} {"train_loss": -26.327987670898438, "global_step": 368725, "epoch": 4442} {"train_loss": -26.291776657104492, "global_step": 368726, "epoch": 4442} {"train_loss": -26.219806671142578, "global_step": 368727, "epoch": 4442} {"train_loss": -26.571792602539062, "global_step": 368728, "epoch": 4442} {"train_loss": -26.6780948638916, "global_step": 368729, "epoch": 4442} {"train_loss": -26.498016357421875, "global_step": 368730, "epoch": 4442} {"train_loss": -26.515594482421875, "global_step": 368731, "epoch": 4442} {"train_loss": -26.470260620117188, "global_step": 368732, "epoch": 4442} {"train_loss": -26.394561767578125, "global_step": 368733, "epoch": 4442} {"train_loss": -26.504545211791992, "global_step": 368734, "epoch": 4442} {"train_loss": -26.453516006469727, "global_step": 368735, "epoch": 4442} {"train_loss": -26.309463500976562, "global_step": 368736, "epoch": 4442} {"train_loss": -26.5246524810791, "global_step": 368737, "epoch": 4442} {"train_loss": -26.162031173706055, "global_step": 368738, "epoch": 4442} {"train_loss": -26.265954971313477, "global_step": 368739, "epoch": 4442} {"train_loss": -26.87298011779785, "global_step": 368740, "epoch": 4442} {"train_loss": -26.40625, "global_step": 368741, "epoch": 4442} {"train_loss": -26.82081413269043, "global_step": 368742, "epoch": 4442} {"train_loss": -26.90007972717285, "global_step": 368743, "epoch": 4442} {"train_loss": -26.94013023376465, "global_step": 368744, "epoch": 4442} {"train_loss": -26.5334415435791, "global_step": 368745, "epoch": 4442} {"train_loss": -26.721221923828125, "global_step": 368746, "epoch": 4442} {"train_loss": -26.650543212890625, "global_step": 368747, "epoch": 4442} {"train_loss": -26.345600128173828, "global_step": 368748, "epoch": 4442} {"train_loss": -26.79925537109375, "global_step": 368749, "epoch": 4442} {"train_loss": -26.22389030456543, "global_step": 368750, "epoch": 4442} {"train_loss": -26.49537467956543, "global_step": 368751, "epoch": 4442} {"train_loss": -26.72572135925293, "global_step": 368752, "epoch": 4442} {"train_loss": -26.3294734954834, "global_step": 368753, "epoch": 4442} {"train_loss": -26.4603271484375, "global_step": 368754, "epoch": 4442} {"train_loss": -26.69415283203125, "global_step": 368755, "epoch": 4442} {"train_loss": -26.4561710357666, "global_step": 368756, "epoch": 4442} {"train_loss": -25.95525550842285, "global_step": 368757, "epoch": 4442} {"train_loss": -25.899600982666016, "global_step": 368758, "epoch": 4442} {"train_loss": -25.33856773376465, "global_step": 368759, "epoch": 4442} {"train_loss": -25.785749435424805, "global_step": 368760, "epoch": 4442} {"train_loss": -25.6375732421875, "global_step": 368761, "epoch": 4442} {"train_loss": -25.51288414001465, "global_step": 368762, "epoch": 4442} {"train_loss": -26.62985610961914, "global_step": 368763, "epoch": 4442} {"train_loss": -26.151220321655273, "global_step": 368764, "epoch": 4442} {"train_loss": -26.222925186157227, "global_step": 368765, "epoch": 4442} {"train_loss": -26.370580673217773, "global_step": 368766, "epoch": 4442} {"train_loss": -26.185138702392578, "global_step": 368767, "epoch": 4442} {"train_loss": -26.298426455762012, "global_step": 368768, "epoch": 4442, "val_loss": 6622576.0} {"train_loss": -26.1610164642334, "global_step": 368769, "epoch": 4443} {"train_loss": -25.743661880493164, "global_step": 368770, "epoch": 4443} {"train_loss": -25.49083709716797, "global_step": 368771, "epoch": 4443} {"train_loss": -26.097299575805664, "global_step": 368772, "epoch": 4443} {"train_loss": -26.037357330322266, "global_step": 368773, "epoch": 4443} {"train_loss": -25.793493270874023, "global_step": 368774, "epoch": 4443} {"train_loss": -26.02007484436035, "global_step": 368775, "epoch": 4443} {"train_loss": -25.644617080688477, "global_step": 368776, "epoch": 4443} {"train_loss": -25.9285831451416, "global_step": 368777, "epoch": 4443} {"train_loss": -26.345233917236328, "global_step": 368778, "epoch": 4443} {"train_loss": -25.377120971679688, "global_step": 368779, "epoch": 4443} {"train_loss": -26.24979019165039, "global_step": 368780, "epoch": 4443} {"train_loss": -25.788679122924805, "global_step": 368781, "epoch": 4443} {"train_loss": -26.35059928894043, "global_step": 368782, "epoch": 4443} {"train_loss": -26.286880493164062, "global_step": 368783, "epoch": 4443} {"train_loss": -26.05304527282715, "global_step": 368784, "epoch": 4443} {"train_loss": -26.143619537353516, "global_step": 368785, "epoch": 4443} {"train_loss": -26.608734130859375, "global_step": 368786, "epoch": 4443} {"train_loss": -26.70682716369629, "global_step": 368787, "epoch": 4443} {"train_loss": -26.20619010925293, "global_step": 368788, "epoch": 4443} {"train_loss": -26.548095703125, "global_step": 368789, "epoch": 4443} {"train_loss": -26.278562545776367, "global_step": 368790, "epoch": 4443} {"train_loss": -26.617712020874023, "global_step": 368791, "epoch": 4443} {"train_loss": -26.761581420898438, "global_step": 368792, "epoch": 4443} {"train_loss": -26.14019203186035, "global_step": 368793, "epoch": 4443} {"train_loss": -26.664962768554688, "global_step": 368794, "epoch": 4443} {"train_loss": -26.68039321899414, "global_step": 368795, "epoch": 4443} {"train_loss": -26.540740966796875, "global_step": 368796, "epoch": 4443} {"train_loss": -26.404041290283203, "global_step": 368797, "epoch": 4443} {"train_loss": -26.610876083374023, "global_step": 368798, "epoch": 4443} {"train_loss": -26.49298667907715, "global_step": 368799, "epoch": 4443} {"train_loss": -26.452722549438477, "global_step": 368800, "epoch": 4443} {"train_loss": -26.116291046142578, "global_step": 368801, "epoch": 4443} {"train_loss": -26.50909423828125, "global_step": 368802, "epoch": 4443} {"train_loss": -26.126300811767578, "global_step": 368803, "epoch": 4443} {"train_loss": -26.771392822265625, "global_step": 368804, "epoch": 4443} {"train_loss": -26.270126342773438, "global_step": 368805, "epoch": 4443} {"train_loss": -26.696247100830078, "global_step": 368806, "epoch": 4443} {"train_loss": -26.49017906188965, "global_step": 368807, "epoch": 4443} {"train_loss": -26.2264461517334, "global_step": 368808, "epoch": 4443} {"train_loss": -26.46876335144043, "global_step": 368809, "epoch": 4443} {"train_loss": -26.759540557861328, "global_step": 368810, "epoch": 4443} {"train_loss": -26.047077178955078, "global_step": 368811, "epoch": 4443} {"train_loss": -26.049808502197266, "global_step": 368812, "epoch": 4443} {"train_loss": -26.8209228515625, "global_step": 368813, "epoch": 4443} {"train_loss": -26.083871841430664, "global_step": 368814, "epoch": 4443} {"train_loss": -26.42962074279785, "global_step": 368815, "epoch": 4443} {"train_loss": -26.571491241455078, "global_step": 368816, "epoch": 4443} {"train_loss": -26.420276641845703, "global_step": 368817, "epoch": 4443} {"train_loss": -26.589996337890625, "global_step": 368818, "epoch": 4443} {"train_loss": -26.354665756225586, "global_step": 368819, "epoch": 4443} {"train_loss": -26.203445434570312, "global_step": 368820, "epoch": 4443} {"train_loss": -26.35274314880371, "global_step": 368821, "epoch": 4443} {"train_loss": -26.4160099029541, "global_step": 368822, "epoch": 4443} {"train_loss": -26.77320671081543, "global_step": 368823, "epoch": 4443} {"train_loss": -26.019590377807617, "global_step": 368824, "epoch": 4443} {"train_loss": -25.909591674804688, "global_step": 368825, "epoch": 4443} {"train_loss": -26.06427001953125, "global_step": 368826, "epoch": 4443} {"train_loss": -26.086578369140625, "global_step": 368827, "epoch": 4443} {"train_loss": -26.364627838134766, "global_step": 368828, "epoch": 4443} {"train_loss": -26.373687744140625, "global_step": 368829, "epoch": 4443} {"train_loss": -26.703845977783203, "global_step": 368830, "epoch": 4443} {"train_loss": -26.185346603393555, "global_step": 368831, "epoch": 4443} {"train_loss": -26.271961212158203, "global_step": 368832, "epoch": 4443} {"train_loss": -26.654550552368164, "global_step": 368833, "epoch": 4443} {"train_loss": -26.46135902404785, "global_step": 368834, "epoch": 4443} {"train_loss": -26.58330726623535, "global_step": 368835, "epoch": 4443} {"train_loss": -26.541980743408203, "global_step": 368836, "epoch": 4443} {"train_loss": -26.411457061767578, "global_step": 368837, "epoch": 4443} {"train_loss": -26.460012435913086, "global_step": 368838, "epoch": 4443} {"train_loss": -26.039941787719727, "global_step": 368839, "epoch": 4443} {"train_loss": -26.341779708862305, "global_step": 368840, "epoch": 4443} {"train_loss": -26.54136085510254, "global_step": 368841, "epoch": 4443} {"train_loss": -25.99952507019043, "global_step": 368842, "epoch": 4443} {"train_loss": -26.352453231811523, "global_step": 368843, "epoch": 4443} {"train_loss": -26.009626388549805, "global_step": 368844, "epoch": 4443} {"train_loss": -26.495838165283203, "global_step": 368845, "epoch": 4443} {"train_loss": -25.87774658203125, "global_step": 368846, "epoch": 4443} {"train_loss": -26.260557174682617, "global_step": 368847, "epoch": 4443} {"train_loss": -26.34808921813965, "global_step": 368848, "epoch": 4443} {"train_loss": -26.514841079711914, "global_step": 368849, "epoch": 4443} {"train_loss": -26.296432495117188, "global_step": 368850, "epoch": 4443} {"train_loss": -26.310415934367352, "global_step": 368851, "epoch": 4443, "val_loss": 6685090.0} {"train_loss": -25.336349487304688, "global_step": 368852, "epoch": 4444} {"train_loss": -25.64829444885254, "global_step": 368853, "epoch": 4444} {"train_loss": -25.74700355529785, "global_step": 368854, "epoch": 4444} {"train_loss": -25.8408203125, "global_step": 368855, "epoch": 4444} {"train_loss": -25.55299949645996, "global_step": 368856, "epoch": 4444} {"train_loss": -25.30132293701172, "global_step": 368857, "epoch": 4444} {"train_loss": -25.57728385925293, "global_step": 368858, "epoch": 4444} {"train_loss": -25.91365623474121, "global_step": 368859, "epoch": 4444} {"train_loss": -26.005842208862305, "global_step": 368860, "epoch": 4444} {"train_loss": -25.659719467163086, "global_step": 368861, "epoch": 4444} {"train_loss": -25.98211097717285, "global_step": 368862, "epoch": 4444} {"train_loss": -25.613061904907227, "global_step": 368863, "epoch": 4444} {"train_loss": -26.0277156829834, "global_step": 368864, "epoch": 4444} {"train_loss": -26.046051025390625, "global_step": 368865, "epoch": 4444} {"train_loss": -26.4599552154541, "global_step": 368866, "epoch": 4444} {"train_loss": -26.062170028686523, "global_step": 368867, "epoch": 4444} {"train_loss": -26.591445922851562, "global_step": 368868, "epoch": 4444} {"train_loss": -26.076513290405273, "global_step": 368869, "epoch": 4444} {"train_loss": -25.618438720703125, "global_step": 368870, "epoch": 4444} {"train_loss": -25.955698013305664, "global_step": 368871, "epoch": 4444} {"train_loss": -25.82942008972168, "global_step": 368872, "epoch": 4444} {"train_loss": -26.25909423828125, "global_step": 368873, "epoch": 4444} {"train_loss": -25.879074096679688, "global_step": 368874, "epoch": 4444} {"train_loss": -26.168537139892578, "global_step": 368875, "epoch": 4444} {"train_loss": -26.482938766479492, "global_step": 368876, "epoch": 4444} {"train_loss": -26.2774600982666, "global_step": 368877, "epoch": 4444} {"train_loss": -26.196033477783203, "global_step": 368878, "epoch": 4444} {"train_loss": -26.026336669921875, "global_step": 368879, "epoch": 4444} {"train_loss": -26.714426040649414, "global_step": 368880, "epoch": 4444} {"train_loss": -26.361621856689453, "global_step": 368881, "epoch": 4444} {"train_loss": -26.43060302734375, "global_step": 368882, "epoch": 4444} {"train_loss": -26.06058120727539, "global_step": 368883, "epoch": 4444} {"train_loss": -26.165180206298828, "global_step": 368884, "epoch": 4444} {"train_loss": -26.551990509033203, "global_step": 368885, "epoch": 4444} {"train_loss": -26.381122589111328, "global_step": 368886, "epoch": 4444} {"train_loss": -26.0028133392334, "global_step": 368887, "epoch": 4444} {"train_loss": -26.427778244018555, "global_step": 368888, "epoch": 4444} {"train_loss": -26.726272583007812, "global_step": 368889, "epoch": 4444} {"train_loss": -26.692243576049805, "global_step": 368890, "epoch": 4444} {"train_loss": -26.44486427307129, "global_step": 368891, "epoch": 4444} {"train_loss": -26.04656410217285, "global_step": 368892, "epoch": 4444} {"train_loss": -26.50881004333496, "global_step": 368893, "epoch": 4444} {"train_loss": -26.419485092163086, "global_step": 368894, "epoch": 4444} {"train_loss": -26.540225982666016, "global_step": 368895, "epoch": 4444} {"train_loss": -26.604047775268555, "global_step": 368896, "epoch": 4444} {"train_loss": -26.209177017211914, "global_step": 368897, "epoch": 4444} {"train_loss": -26.404956817626953, "global_step": 368898, "epoch": 4444} {"train_loss": -26.247892379760742, "global_step": 368899, "epoch": 4444} {"train_loss": -26.3134765625, "global_step": 368900, "epoch": 4444} {"train_loss": -26.275772094726562, "global_step": 368901, "epoch": 4444} {"train_loss": -25.87920570373535, "global_step": 368902, "epoch": 4444} {"train_loss": -25.936735153198242, "global_step": 368903, "epoch": 4444} {"train_loss": -26.23232078552246, "global_step": 368904, "epoch": 4444} {"train_loss": -26.1086368560791, "global_step": 368905, "epoch": 4444} {"train_loss": -26.3966007232666, "global_step": 368906, "epoch": 4444} {"train_loss": -26.236743927001953, "global_step": 368907, "epoch": 4444} {"train_loss": -26.233869552612305, "global_step": 368908, "epoch": 4444} {"train_loss": -26.546842575073242, "global_step": 368909, "epoch": 4444} {"train_loss": -26.21131706237793, "global_step": 368910, "epoch": 4444} {"train_loss": -25.940536499023438, "global_step": 368911, "epoch": 4444} {"train_loss": -26.57794761657715, "global_step": 368912, "epoch": 4444} {"train_loss": -26.471790313720703, "global_step": 368913, "epoch": 4444} {"train_loss": -26.098636627197266, "global_step": 368914, "epoch": 4444} {"train_loss": -26.542896270751953, "global_step": 368915, "epoch": 4444} {"train_loss": -26.21856117248535, "global_step": 368916, "epoch": 4444} {"train_loss": -26.2222843170166, "global_step": 368917, "epoch": 4444} {"train_loss": -26.53173828125, "global_step": 368918, "epoch": 4444} {"train_loss": -26.41958999633789, "global_step": 368919, "epoch": 4444} {"train_loss": -26.2023868560791, "global_step": 368920, "epoch": 4444} {"train_loss": -25.862873077392578, "global_step": 368921, "epoch": 4444} {"train_loss": -25.501182556152344, "global_step": 368922, "epoch": 4444} {"train_loss": -25.22035026550293, "global_step": 368923, "epoch": 4444} {"train_loss": -25.912189483642578, "global_step": 368924, "epoch": 4444} {"train_loss": -26.369115829467773, "global_step": 368925, "epoch": 4444} {"train_loss": -25.601964950561523, "global_step": 368926, "epoch": 4444} {"train_loss": -26.500381469726562, "global_step": 368927, "epoch": 4444} {"train_loss": -25.663633346557617, "global_step": 368928, "epoch": 4444} {"train_loss": -26.343679428100586, "global_step": 368929, "epoch": 4444} {"train_loss": -26.4160213470459, "global_step": 368930, "epoch": 4444} {"train_loss": -25.981760025024414, "global_step": 368931, "epoch": 4444} {"train_loss": -26.553747177124023, "global_step": 368932, "epoch": 4444} {"train_loss": -25.701675415039062, "global_step": 368933, "epoch": 4444} {"train_loss": -26.130960947059723, "global_step": 368934, "epoch": 4444, "val_loss": 6557112.5} {"train_loss": -25.288589477539062, "global_step": 368935, "epoch": 4445} {"train_loss": -25.405736923217773, "global_step": 368936, "epoch": 4445} {"train_loss": -25.616384506225586, "global_step": 368937, "epoch": 4445} {"train_loss": -25.645105361938477, "global_step": 368938, "epoch": 4445} {"train_loss": -25.320741653442383, "global_step": 368939, "epoch": 4445} {"train_loss": -25.556753158569336, "global_step": 368940, "epoch": 4445} {"train_loss": -25.7097225189209, "global_step": 368941, "epoch": 4445} {"train_loss": -26.106481552124023, "global_step": 368942, "epoch": 4445} {"train_loss": -25.81707763671875, "global_step": 368943, "epoch": 4445} {"train_loss": -25.920080184936523, "global_step": 368944, "epoch": 4445} {"train_loss": -26.033994674682617, "global_step": 368945, "epoch": 4445} {"train_loss": -25.753467559814453, "global_step": 368946, "epoch": 4445} {"train_loss": -26.15984535217285, "global_step": 368947, "epoch": 4445} {"train_loss": -26.020803451538086, "global_step": 368948, "epoch": 4445} {"train_loss": -25.99521255493164, "global_step": 368949, "epoch": 4445} {"train_loss": -26.21100425720215, "global_step": 368950, "epoch": 4445} {"train_loss": -26.33909034729004, "global_step": 368951, "epoch": 4445} {"train_loss": -25.73377799987793, "global_step": 368952, "epoch": 4445} {"train_loss": -26.545312881469727, "global_step": 368953, "epoch": 4445} {"train_loss": -26.443429946899414, "global_step": 368954, "epoch": 4445} {"train_loss": -26.097726821899414, "global_step": 368955, "epoch": 4445} {"train_loss": -26.020736694335938, "global_step": 368956, "epoch": 4445} {"train_loss": -26.474287033081055, "global_step": 368957, "epoch": 4445} {"train_loss": -26.3381404876709, "global_step": 368958, "epoch": 4445} {"train_loss": -26.369226455688477, "global_step": 368959, "epoch": 4445} {"train_loss": -26.64002799987793, "global_step": 368960, "epoch": 4445} {"train_loss": -26.14588737487793, "global_step": 368961, "epoch": 4445} {"train_loss": -26.379011154174805, "global_step": 368962, "epoch": 4445} {"train_loss": -26.600873947143555, "global_step": 368963, "epoch": 4445} {"train_loss": -26.60922622680664, "global_step": 368964, "epoch": 4445} {"train_loss": -26.635162353515625, "global_step": 368965, "epoch": 4445} {"train_loss": -26.329498291015625, "global_step": 368966, "epoch": 4445} {"train_loss": -26.507648468017578, "global_step": 368967, "epoch": 4445} {"train_loss": -26.075775146484375, "global_step": 368968, "epoch": 4445} {"train_loss": -26.309171676635742, "global_step": 368969, "epoch": 4445} {"train_loss": -26.60114860534668, "global_step": 368970, "epoch": 4445} {"train_loss": -26.483972549438477, "global_step": 368971, "epoch": 4445} {"train_loss": -26.76679039001465, "global_step": 368972, "epoch": 4445} {"train_loss": -26.54256248474121, "global_step": 368973, "epoch": 4445} {"train_loss": -26.419336318969727, "global_step": 368974, "epoch": 4445} {"train_loss": -26.4973087310791, "global_step": 368975, "epoch": 4445} {"train_loss": -26.81329345703125, "global_step": 368976, "epoch": 4445} {"train_loss": -26.672077178955078, "global_step": 368977, "epoch": 4445} {"train_loss": -26.3741397857666, "global_step": 368978, "epoch": 4445} {"train_loss": -26.650211334228516, "global_step": 368979, "epoch": 4445} {"train_loss": -26.6536808013916, "global_step": 368980, "epoch": 4445} {"train_loss": -26.465246200561523, "global_step": 368981, "epoch": 4445} {"train_loss": -26.164936065673828, "global_step": 368982, "epoch": 4445} {"train_loss": -26.487903594970703, "global_step": 368983, "epoch": 4445} {"train_loss": -26.674365997314453, "global_step": 368984, "epoch": 4445} {"train_loss": -26.364294052124023, "global_step": 368985, "epoch": 4445} {"train_loss": -26.530607223510742, "global_step": 368986, "epoch": 4445} {"train_loss": -26.511768341064453, "global_step": 368987, "epoch": 4445} {"train_loss": -26.715335845947266, "global_step": 368988, "epoch": 4445} {"train_loss": -26.443897247314453, "global_step": 368989, "epoch": 4445} {"train_loss": -26.493078231811523, "global_step": 368990, "epoch": 4445} {"train_loss": -26.271697998046875, "global_step": 368991, "epoch": 4445} {"train_loss": -26.733869552612305, "global_step": 368992, "epoch": 4445} {"train_loss": -26.58643913269043, "global_step": 368993, "epoch": 4445} {"train_loss": -26.430301666259766, "global_step": 368994, "epoch": 4445} {"train_loss": -26.393285751342773, "global_step": 368995, "epoch": 4445} {"train_loss": -26.7482967376709, "global_step": 368996, "epoch": 4445} {"train_loss": -26.64107322692871, "global_step": 368997, "epoch": 4445} {"train_loss": -26.51091957092285, "global_step": 368998, "epoch": 4445} {"train_loss": -26.647510528564453, "global_step": 368999, "epoch": 4445} {"train_loss": -26.576135635375977, "global_step": 369000, "epoch": 4445} {"train_loss": -26.61081886291504, "global_step": 369001, "epoch": 4445} {"train_loss": -26.387557983398438, "global_step": 369002, "epoch": 4445} {"train_loss": -26.722747802734375, "global_step": 369003, "epoch": 4445} {"train_loss": -26.4918270111084, "global_step": 369004, "epoch": 4445} {"train_loss": -26.138874053955078, "global_step": 369005, "epoch": 4445} {"train_loss": -26.82012939453125, "global_step": 369006, "epoch": 4445} {"train_loss": -26.166467666625977, "global_step": 369007, "epoch": 4445} {"train_loss": -26.25640296936035, "global_step": 369008, "epoch": 4445} {"train_loss": -26.23246192932129, "global_step": 369009, "epoch": 4445} {"train_loss": -25.659086227416992, "global_step": 369010, "epoch": 4445} {"train_loss": -23.854887008666992, "global_step": 369011, "epoch": 4445} {"train_loss": -20.74467658996582, "global_step": 369012, "epoch": 4445} {"train_loss": -23.335176467895508, "global_step": 369013, "epoch": 4445} {"train_loss": -25.487789154052734, "global_step": 369014, "epoch": 4445} {"train_loss": -24.624311447143555, "global_step": 369015, "epoch": 4445} {"train_loss": -24.913589477539062, "global_step": 369016, "epoch": 4445} {"train_loss": -26.119528919817455, "global_step": 369017, "epoch": 4445, "val_loss": 6672795.5} {"train_loss": -24.200439453125, "global_step": 369018, "epoch": 4446} {"train_loss": -24.77006721496582, "global_step": 369019, "epoch": 4446} {"train_loss": -24.847562789916992, "global_step": 369020, "epoch": 4446} {"train_loss": -24.58328628540039, "global_step": 369021, "epoch": 4446} {"train_loss": -24.83106803894043, "global_step": 369022, "epoch": 4446} {"train_loss": -24.848163604736328, "global_step": 369023, "epoch": 4446} {"train_loss": -25.199262619018555, "global_step": 369024, "epoch": 4446} {"train_loss": -24.85662841796875, "global_step": 369025, "epoch": 4446} {"train_loss": -24.6954402923584, "global_step": 369026, "epoch": 4446} {"train_loss": -25.15622329711914, "global_step": 369027, "epoch": 4446} {"train_loss": -25.067934036254883, "global_step": 369028, "epoch": 4446} {"train_loss": -25.131805419921875, "global_step": 369029, "epoch": 4446} {"train_loss": -25.261966705322266, "global_step": 369030, "epoch": 4446} {"train_loss": -24.94867515563965, "global_step": 369031, "epoch": 4446} {"train_loss": -25.49788475036621, "global_step": 369032, "epoch": 4446} {"train_loss": -25.14289665222168, "global_step": 369033, "epoch": 4446} {"train_loss": -25.21820640563965, "global_step": 369034, "epoch": 4446} {"train_loss": -25.589879989624023, "global_step": 369035, "epoch": 4446} {"train_loss": -25.779748916625977, "global_step": 369036, "epoch": 4446} {"train_loss": -25.22688102722168, "global_step": 369037, "epoch": 4446} {"train_loss": -25.89413833618164, "global_step": 369038, "epoch": 4446} {"train_loss": -25.924585342407227, "global_step": 369039, "epoch": 4446} {"train_loss": -25.496780395507812, "global_step": 369040, "epoch": 4446} {"train_loss": -25.604022979736328, "global_step": 369041, "epoch": 4446} {"train_loss": -25.700727462768555, "global_step": 369042, "epoch": 4446} {"train_loss": -25.579702377319336, "global_step": 369043, "epoch": 4446} {"train_loss": -25.78888511657715, "global_step": 369044, "epoch": 4446} {"train_loss": -26.17203712463379, "global_step": 369045, "epoch": 4446} {"train_loss": -25.4593505859375, "global_step": 369046, "epoch": 4446} {"train_loss": -25.771474838256836, "global_step": 369047, "epoch": 4446} {"train_loss": -25.99576187133789, "global_step": 369048, "epoch": 4446} {"train_loss": -26.06428337097168, "global_step": 369049, "epoch": 4446} {"train_loss": -26.211185455322266, "global_step": 369050, "epoch": 4446} {"train_loss": -25.6475772857666, "global_step": 369051, "epoch": 4446} {"train_loss": -25.642114639282227, "global_step": 369052, "epoch": 4446} {"train_loss": -26.066129684448242, "global_step": 369053, "epoch": 4446} {"train_loss": -25.848499298095703, "global_step": 369054, "epoch": 4446} {"train_loss": -25.9211368560791, "global_step": 369055, "epoch": 4446} {"train_loss": -26.16997718811035, "global_step": 369056, "epoch": 4446} {"train_loss": -26.06434440612793, "global_step": 369057, "epoch": 4446} {"train_loss": -26.283594131469727, "global_step": 369058, "epoch": 4446} {"train_loss": -26.555646896362305, "global_step": 369059, "epoch": 4446} {"train_loss": -26.15681266784668, "global_step": 369060, "epoch": 4446} {"train_loss": -26.282331466674805, "global_step": 369061, "epoch": 4446} {"train_loss": -26.750782012939453, "global_step": 369062, "epoch": 4446} {"train_loss": -26.15142250061035, "global_step": 369063, "epoch": 4446} {"train_loss": -26.009729385375977, "global_step": 369064, "epoch": 4446} {"train_loss": -26.419275283813477, "global_step": 369065, "epoch": 4446} {"train_loss": -26.331220626831055, "global_step": 369066, "epoch": 4446} {"train_loss": -26.3917236328125, "global_step": 369067, "epoch": 4446} {"train_loss": -26.43242835998535, "global_step": 369068, "epoch": 4446} {"train_loss": -26.043701171875, "global_step": 369069, "epoch": 4446} {"train_loss": -26.55559730529785, "global_step": 369070, "epoch": 4446} {"train_loss": -26.339801788330078, "global_step": 369071, "epoch": 4446} {"train_loss": -26.2598934173584, "global_step": 369072, "epoch": 4446} {"train_loss": -26.300704956054688, "global_step": 369073, "epoch": 4446} {"train_loss": -26.5028076171875, "global_step": 369074, "epoch": 4446} {"train_loss": -26.424829483032227, "global_step": 369075, "epoch": 4446} {"train_loss": -26.35573387145996, "global_step": 369076, "epoch": 4446} {"train_loss": -26.269977569580078, "global_step": 369077, "epoch": 4446} {"train_loss": -26.649505615234375, "global_step": 369078, "epoch": 4446} {"train_loss": -26.31648826599121, "global_step": 369079, "epoch": 4446} {"train_loss": -26.5322265625, "global_step": 369080, "epoch": 4446} {"train_loss": -26.584577560424805, "global_step": 369081, "epoch": 4446} {"train_loss": -26.8753719329834, "global_step": 369082, "epoch": 4446} {"train_loss": -26.61078453063965, "global_step": 369083, "epoch": 4446} {"train_loss": -26.75069236755371, "global_step": 369084, "epoch": 4446} {"train_loss": -26.736286163330078, "global_step": 369085, "epoch": 4446} {"train_loss": -26.325885772705078, "global_step": 369086, "epoch": 4446} {"train_loss": -25.986846923828125, "global_step": 369087, "epoch": 4446} {"train_loss": -26.73817253112793, "global_step": 369088, "epoch": 4446} {"train_loss": -26.473703384399414, "global_step": 369089, "epoch": 4446} {"train_loss": -26.347692489624023, "global_step": 369090, "epoch": 4446} {"train_loss": -26.729736328125, "global_step": 369091, "epoch": 4446} {"train_loss": -25.98689079284668, "global_step": 369092, "epoch": 4446} {"train_loss": -26.53664207458496, "global_step": 369093, "epoch": 4446} {"train_loss": -26.433027267456055, "global_step": 369094, "epoch": 4446} {"train_loss": -26.551767349243164, "global_step": 369095, "epoch": 4446} {"train_loss": -26.693851470947266, "global_step": 369096, "epoch": 4446} {"train_loss": -26.761343002319336, "global_step": 369097, "epoch": 4446} {"train_loss": -26.38897132873535, "global_step": 369098, "epoch": 4446} {"train_loss": -26.77170753479004, "global_step": 369099, "epoch": 4446} {"train_loss": -25.951418244695088, "global_step": 369100, "epoch": 4446, "val_loss": 6700967.0} {"train_loss": -26.049863815307617, "global_step": 369101, "epoch": 4447} {"train_loss": -25.721363067626953, "global_step": 369102, "epoch": 4447} {"train_loss": -26.308719635009766, "global_step": 369103, "epoch": 4447} {"train_loss": -25.79182243347168, "global_step": 369104, "epoch": 4447} {"train_loss": -25.167724609375, "global_step": 369105, "epoch": 4447} {"train_loss": -25.778661727905273, "global_step": 369106, "epoch": 4447} {"train_loss": -25.9808406829834, "global_step": 369107, "epoch": 4447} {"train_loss": -25.726287841796875, "global_step": 369108, "epoch": 4447} {"train_loss": -26.247241973876953, "global_step": 369109, "epoch": 4447} {"train_loss": -25.929107666015625, "global_step": 369110, "epoch": 4447} {"train_loss": -26.318761825561523, "global_step": 369111, "epoch": 4447} {"train_loss": -26.046995162963867, "global_step": 369112, "epoch": 4447} {"train_loss": -25.9262752532959, "global_step": 369113, "epoch": 4447} {"train_loss": -26.282608032226562, "global_step": 369114, "epoch": 4447} {"train_loss": -25.9644718170166, "global_step": 369115, "epoch": 4447} {"train_loss": -26.371633529663086, "global_step": 369116, "epoch": 4447} {"train_loss": -26.120874404907227, "global_step": 369117, "epoch": 4447} {"train_loss": -26.2435359954834, "global_step": 369118, "epoch": 4447} {"train_loss": -25.82854652404785, "global_step": 369119, "epoch": 4447} {"train_loss": -26.883041381835938, "global_step": 369120, "epoch": 4447} {"train_loss": -26.460912704467773, "global_step": 369121, "epoch": 4447} {"train_loss": -26.2763614654541, "global_step": 369122, "epoch": 4447} {"train_loss": -26.593042373657227, "global_step": 369123, "epoch": 4447} {"train_loss": -26.027353286743164, "global_step": 369124, "epoch": 4447} {"train_loss": -26.410175323486328, "global_step": 369125, "epoch": 4447} {"train_loss": -26.610782623291016, "global_step": 369126, "epoch": 4447} {"train_loss": -26.645034790039062, "global_step": 369127, "epoch": 4447} {"train_loss": -26.516407012939453, "global_step": 369128, "epoch": 4447} {"train_loss": -26.42609214782715, "global_step": 369129, "epoch": 4447} {"train_loss": -26.522409439086914, "global_step": 369130, "epoch": 4447} {"train_loss": -26.2278995513916, "global_step": 369131, "epoch": 4447} {"train_loss": -26.44867515563965, "global_step": 369132, "epoch": 4447} {"train_loss": -26.689523696899414, "global_step": 369133, "epoch": 4447} {"train_loss": -26.389074325561523, "global_step": 369134, "epoch": 4447} {"train_loss": -26.639373779296875, "global_step": 369135, "epoch": 4447} {"train_loss": -26.73676109313965, "global_step": 369136, "epoch": 4447} {"train_loss": -26.689834594726562, "global_step": 369137, "epoch": 4447} {"train_loss": -26.65253257751465, "global_step": 369138, "epoch": 4447} {"train_loss": -26.323205947875977, "global_step": 369139, "epoch": 4447} {"train_loss": -26.11726188659668, "global_step": 369140, "epoch": 4447} {"train_loss": -26.602136611938477, "global_step": 369141, "epoch": 4447} {"train_loss": -26.237207412719727, "global_step": 369142, "epoch": 4447} {"train_loss": -26.821853637695312, "global_step": 369143, "epoch": 4447} {"train_loss": -26.245391845703125, "global_step": 369144, "epoch": 4447} {"train_loss": -26.23225975036621, "global_step": 369145, "epoch": 4447} {"train_loss": -26.318084716796875, "global_step": 369146, "epoch": 4447} {"train_loss": -26.342676162719727, "global_step": 369147, "epoch": 4447} {"train_loss": -25.916574478149414, "global_step": 369148, "epoch": 4447} {"train_loss": -26.48480796813965, "global_step": 369149, "epoch": 4447} {"train_loss": -26.5451717376709, "global_step": 369150, "epoch": 4447} {"train_loss": -26.013242721557617, "global_step": 369151, "epoch": 4447} {"train_loss": -25.725629806518555, "global_step": 369152, "epoch": 4447} {"train_loss": -26.52863883972168, "global_step": 369153, "epoch": 4447} {"train_loss": -25.908782958984375, "global_step": 369154, "epoch": 4447} {"train_loss": -26.435422897338867, "global_step": 369155, "epoch": 4447} {"train_loss": -26.21510887145996, "global_step": 369156, "epoch": 4447} {"train_loss": -26.167367935180664, "global_step": 369157, "epoch": 4447} {"train_loss": -26.381229400634766, "global_step": 369158, "epoch": 4447} {"train_loss": -26.237165451049805, "global_step": 369159, "epoch": 4447} {"train_loss": -26.14752197265625, "global_step": 369160, "epoch": 4447} {"train_loss": -26.379383087158203, "global_step": 369161, "epoch": 4447} {"train_loss": -26.593809127807617, "global_step": 369162, "epoch": 4447} {"train_loss": -26.383808135986328, "global_step": 369163, "epoch": 4447} {"train_loss": -26.546247482299805, "global_step": 369164, "epoch": 4447} {"train_loss": -26.747974395751953, "global_step": 369165, "epoch": 4447} {"train_loss": -26.178213119506836, "global_step": 369166, "epoch": 4447} {"train_loss": -26.1597843170166, "global_step": 369167, "epoch": 4447} {"train_loss": -26.2322998046875, "global_step": 369168, "epoch": 4447} {"train_loss": -26.49445915222168, "global_step": 369169, "epoch": 4447} {"train_loss": -26.282339096069336, "global_step": 369170, "epoch": 4447} {"train_loss": -26.50667381286621, "global_step": 369171, "epoch": 4447} {"train_loss": -26.121475219726562, "global_step": 369172, "epoch": 4447} {"train_loss": -26.291244506835938, "global_step": 369173, "epoch": 4447} {"train_loss": -25.953022003173828, "global_step": 369174, "epoch": 4447} {"train_loss": -26.450315475463867, "global_step": 369175, "epoch": 4447} {"train_loss": -26.247350692749023, "global_step": 369176, "epoch": 4447} {"train_loss": -26.547760009765625, "global_step": 369177, "epoch": 4447} {"train_loss": -26.09543800354004, "global_step": 369178, "epoch": 4447} {"train_loss": -25.84004783630371, "global_step": 369179, "epoch": 4447} {"train_loss": -26.420820236206055, "global_step": 369180, "epoch": 4447} {"train_loss": -26.394514083862305, "global_step": 369181, "epoch": 4447} {"train_loss": -26.522735595703125, "global_step": 369182, "epoch": 4447} {"train_loss": -26.294905719986883, "global_step": 369183, "epoch": 4447, "val_loss": 6676804.0} {"train_loss": -25.289670944213867, "global_step": 369184, "epoch": 4448} {"train_loss": -25.267669677734375, "global_step": 369185, "epoch": 4448} {"train_loss": -26.197973251342773, "global_step": 369186, "epoch": 4448} {"train_loss": -25.221830368041992, "global_step": 369187, "epoch": 4448} {"train_loss": -25.60407829284668, "global_step": 369188, "epoch": 4448} {"train_loss": -25.27461814880371, "global_step": 369189, "epoch": 4448} {"train_loss": -25.96844482421875, "global_step": 369190, "epoch": 4448} {"train_loss": -25.62775230407715, "global_step": 369191, "epoch": 4448} {"train_loss": -25.659122467041016, "global_step": 369192, "epoch": 4448} {"train_loss": -25.89845085144043, "global_step": 369193, "epoch": 4448} {"train_loss": -25.999927520751953, "global_step": 369194, "epoch": 4448} {"train_loss": -25.585102081298828, "global_step": 369195, "epoch": 4448} {"train_loss": -26.221511840820312, "global_step": 369196, "epoch": 4448} {"train_loss": -25.996374130249023, "global_step": 369197, "epoch": 4448} {"train_loss": -26.0398006439209, "global_step": 369198, "epoch": 4448} {"train_loss": -26.12823486328125, "global_step": 369199, "epoch": 4448} {"train_loss": -25.823896408081055, "global_step": 369200, "epoch": 4448} {"train_loss": -26.0479736328125, "global_step": 369201, "epoch": 4448} {"train_loss": -26.313947677612305, "global_step": 369202, "epoch": 4448} {"train_loss": -26.235095977783203, "global_step": 369203, "epoch": 4448} {"train_loss": -26.107532501220703, "global_step": 369204, "epoch": 4448} {"train_loss": -26.1621036529541, "global_step": 369205, "epoch": 4448} {"train_loss": -25.840152740478516, "global_step": 369206, "epoch": 4448} {"train_loss": -26.182825088500977, "global_step": 369207, "epoch": 4448} {"train_loss": -26.160058975219727, "global_step": 369208, "epoch": 4448} {"train_loss": -26.20703125, "global_step": 369209, "epoch": 4448} {"train_loss": -26.04469108581543, "global_step": 369210, "epoch": 4448} {"train_loss": -26.331571578979492, "global_step": 369211, "epoch": 4448} {"train_loss": -26.45503044128418, "global_step": 369212, "epoch": 4448} {"train_loss": -26.195234298706055, "global_step": 369213, "epoch": 4448} {"train_loss": -26.136398315429688, "global_step": 369214, "epoch": 4448} {"train_loss": -26.33660888671875, "global_step": 369215, "epoch": 4448} {"train_loss": -26.323217391967773, "global_step": 369216, "epoch": 4448} {"train_loss": -26.391082763671875, "global_step": 369217, "epoch": 4448} {"train_loss": -26.232038497924805, "global_step": 369218, "epoch": 4448} {"train_loss": -26.339170455932617, "global_step": 369219, "epoch": 4448} {"train_loss": -26.35648536682129, "global_step": 369220, "epoch": 4448} {"train_loss": -26.36823081970215, "global_step": 369221, "epoch": 4448} {"train_loss": -26.481557846069336, "global_step": 369222, "epoch": 4448} {"train_loss": -26.564252853393555, "global_step": 369223, "epoch": 4448} {"train_loss": -26.652301788330078, "global_step": 369224, "epoch": 4448} {"train_loss": -26.815780639648438, "global_step": 369225, "epoch": 4448} {"train_loss": -26.3684024810791, "global_step": 369226, "epoch": 4448} {"train_loss": -26.41813087463379, "global_step": 369227, "epoch": 4448} {"train_loss": -26.399322509765625, "global_step": 369228, "epoch": 4448} {"train_loss": -26.612503051757812, "global_step": 369229, "epoch": 4448} {"train_loss": -26.259687423706055, "global_step": 369230, "epoch": 4448} {"train_loss": -26.32840919494629, "global_step": 369231, "epoch": 4448} {"train_loss": -26.378448486328125, "global_step": 369232, "epoch": 4448} {"train_loss": -26.657318115234375, "global_step": 369233, "epoch": 4448} {"train_loss": -26.636335372924805, "global_step": 369234, "epoch": 4448} {"train_loss": -26.518362045288086, "global_step": 369235, "epoch": 4448} {"train_loss": -26.2559871673584, "global_step": 369236, "epoch": 4448} {"train_loss": -26.501789093017578, "global_step": 369237, "epoch": 4448} {"train_loss": -26.36358070373535, "global_step": 369238, "epoch": 4448} {"train_loss": -26.14810562133789, "global_step": 369239, "epoch": 4448} {"train_loss": -26.132238388061523, "global_step": 369240, "epoch": 4448} {"train_loss": -26.33931541442871, "global_step": 369241, "epoch": 4448} {"train_loss": -26.58827018737793, "global_step": 369242, "epoch": 4448} {"train_loss": -26.466215133666992, "global_step": 369243, "epoch": 4448} {"train_loss": -26.421911239624023, "global_step": 369244, "epoch": 4448} {"train_loss": -26.4134464263916, "global_step": 369245, "epoch": 4448} {"train_loss": -26.49995231628418, "global_step": 369246, "epoch": 4448} {"train_loss": -26.28232765197754, "global_step": 369247, "epoch": 4448} {"train_loss": -26.603967666625977, "global_step": 369248, "epoch": 4448} {"train_loss": -26.1660099029541, "global_step": 369249, "epoch": 4448} {"train_loss": -26.734573364257812, "global_step": 369250, "epoch": 4448} {"train_loss": -26.36136245727539, "global_step": 369251, "epoch": 4448} {"train_loss": -26.34271812438965, "global_step": 369252, "epoch": 4448} {"train_loss": -26.315521240234375, "global_step": 369253, "epoch": 4448} {"train_loss": -26.349279403686523, "global_step": 369254, "epoch": 4448} {"train_loss": -26.265766143798828, "global_step": 369255, "epoch": 4448} {"train_loss": -26.382614135742188, "global_step": 369256, "epoch": 4448} {"train_loss": -26.46148681640625, "global_step": 369257, "epoch": 4448} {"train_loss": -26.396656036376953, "global_step": 369258, "epoch": 4448} {"train_loss": -26.720853805541992, "global_step": 369259, "epoch": 4448} {"train_loss": -26.559833526611328, "global_step": 369260, "epoch": 4448} {"train_loss": -25.974639892578125, "global_step": 369261, "epoch": 4448} {"train_loss": -26.17429542541504, "global_step": 369262, "epoch": 4448} {"train_loss": -25.852582931518555, "global_step": 369263, "epoch": 4448} {"train_loss": -26.2596435546875, "global_step": 369264, "epoch": 4448} {"train_loss": -26.800067901611328, "global_step": 369265, "epoch": 4448} {"train_loss": -26.238191190972387, "global_step": 369266, "epoch": 4448, "val_loss": 6768681.0} {"train_loss": -25.612485885620117, "global_step": 369267, "epoch": 4449} {"train_loss": -25.766281127929688, "global_step": 369268, "epoch": 4449} {"train_loss": -26.103017807006836, "global_step": 369269, "epoch": 4449} {"train_loss": -26.19205665588379, "global_step": 369270, "epoch": 4449} {"train_loss": -25.830432891845703, "global_step": 369271, "epoch": 4449} {"train_loss": -26.166275024414062, "global_step": 369272, "epoch": 4449} {"train_loss": -25.621931076049805, "global_step": 369273, "epoch": 4449} {"train_loss": -25.788618087768555, "global_step": 369274, "epoch": 4449} {"train_loss": -26.3051700592041, "global_step": 369275, "epoch": 4449} {"train_loss": -26.109888076782227, "global_step": 369276, "epoch": 4449} {"train_loss": -26.441465377807617, "global_step": 369277, "epoch": 4449} {"train_loss": -25.979084014892578, "global_step": 369278, "epoch": 4449} {"train_loss": -26.62896728515625, "global_step": 369279, "epoch": 4449} {"train_loss": -25.859521865844727, "global_step": 369280, "epoch": 4449} {"train_loss": -25.937036514282227, "global_step": 369281, "epoch": 4449} {"train_loss": -26.146005630493164, "global_step": 369282, "epoch": 4449} {"train_loss": -26.15045166015625, "global_step": 369283, "epoch": 4449} {"train_loss": -26.116296768188477, "global_step": 369284, "epoch": 4449} {"train_loss": -26.197988510131836, "global_step": 369285, "epoch": 4449} {"train_loss": -26.0024356842041, "global_step": 369286, "epoch": 4449} {"train_loss": -26.39100456237793, "global_step": 369287, "epoch": 4449} {"train_loss": -26.15522575378418, "global_step": 369288, "epoch": 4449} {"train_loss": -26.2063045501709, "global_step": 369289, "epoch": 4449} {"train_loss": -25.854644775390625, "global_step": 369290, "epoch": 4449} {"train_loss": -26.255298614501953, "global_step": 369291, "epoch": 4449} {"train_loss": -25.7650203704834, "global_step": 369292, "epoch": 4449} {"train_loss": -26.398969650268555, "global_step": 369293, "epoch": 4449} {"train_loss": -26.202844619750977, "global_step": 369294, "epoch": 4449} {"train_loss": -26.5484676361084, "global_step": 369295, "epoch": 4449} {"train_loss": -26.217824935913086, "global_step": 369296, "epoch": 4449} {"train_loss": -26.4852237701416, "global_step": 369297, "epoch": 4449} {"train_loss": -26.18695640563965, "global_step": 369298, "epoch": 4449} {"train_loss": -26.234466552734375, "global_step": 369299, "epoch": 4449} {"train_loss": -26.55097770690918, "global_step": 369300, "epoch": 4449} {"train_loss": -25.9971866607666, "global_step": 369301, "epoch": 4449} {"train_loss": -26.7384090423584, "global_step": 369302, "epoch": 4449} {"train_loss": -26.641504287719727, "global_step": 369303, "epoch": 4449} {"train_loss": -26.169147491455078, "global_step": 369304, "epoch": 4449} {"train_loss": -26.204578399658203, "global_step": 369305, "epoch": 4449} {"train_loss": -26.441898345947266, "global_step": 369306, "epoch": 4449} {"train_loss": -26.37025260925293, "global_step": 369307, "epoch": 4449} {"train_loss": -26.178319931030273, "global_step": 369308, "epoch": 4449} {"train_loss": -26.133453369140625, "global_step": 369309, "epoch": 4449} {"train_loss": -26.330930709838867, "global_step": 369310, "epoch": 4449} {"train_loss": -26.499588012695312, "global_step": 369311, "epoch": 4449} {"train_loss": -26.07868003845215, "global_step": 369312, "epoch": 4449} {"train_loss": -26.133747100830078, "global_step": 369313, "epoch": 4449} {"train_loss": -26.266571044921875, "global_step": 369314, "epoch": 4449} {"train_loss": -26.35076904296875, "global_step": 369315, "epoch": 4449} {"train_loss": -26.3160343170166, "global_step": 369316, "epoch": 4449} {"train_loss": -26.43033218383789, "global_step": 369317, "epoch": 4449} {"train_loss": -26.575469970703125, "global_step": 369318, "epoch": 4449} {"train_loss": -25.99517822265625, "global_step": 369319, "epoch": 4449} {"train_loss": -26.60418128967285, "global_step": 369320, "epoch": 4449} {"train_loss": -26.61020851135254, "global_step": 369321, "epoch": 4449} {"train_loss": -26.608001708984375, "global_step": 369322, "epoch": 4449} {"train_loss": -26.24384880065918, "global_step": 369323, "epoch": 4449} {"train_loss": -26.727075576782227, "global_step": 369324, "epoch": 4449} {"train_loss": -26.69770622253418, "global_step": 369325, "epoch": 4449} {"train_loss": -26.5452938079834, "global_step": 369326, "epoch": 4449} {"train_loss": -26.34038734436035, "global_step": 369327, "epoch": 4449} {"train_loss": -26.551122665405273, "global_step": 369328, "epoch": 4449} {"train_loss": -26.538761138916016, "global_step": 369329, "epoch": 4449} {"train_loss": -26.211774826049805, "global_step": 369330, "epoch": 4449} {"train_loss": -26.39227867126465, "global_step": 369331, "epoch": 4449} {"train_loss": -26.3644962310791, "global_step": 369332, "epoch": 4449} {"train_loss": -26.72437858581543, "global_step": 369333, "epoch": 4449} {"train_loss": -26.811410903930664, "global_step": 369334, "epoch": 4449} {"train_loss": -26.80133628845215, "global_step": 369335, "epoch": 4449} {"train_loss": -26.40802574157715, "global_step": 369336, "epoch": 4449} {"train_loss": -26.695362091064453, "global_step": 369337, "epoch": 4449} {"train_loss": -26.298749923706055, "global_step": 369338, "epoch": 4449} {"train_loss": -26.499853134155273, "global_step": 369339, "epoch": 4449} {"train_loss": -26.614105224609375, "global_step": 369340, "epoch": 4449} {"train_loss": -26.17339515686035, "global_step": 369341, "epoch": 4449} {"train_loss": -26.394468307495117, "global_step": 369342, "epoch": 4449} {"train_loss": -26.3341007232666, "global_step": 369343, "epoch": 4449} {"train_loss": -26.716236114501953, "global_step": 369344, "epoch": 4449} {"train_loss": -26.298547744750977, "global_step": 369345, "epoch": 4449} {"train_loss": -26.6643123626709, "global_step": 369346, "epoch": 4449} {"train_loss": -26.580570220947266, "global_step": 369347, "epoch": 4449} {"train_loss": -26.85434341430664, "global_step": 369348, "epoch": 4449} {"train_loss": -26.329086050929792, "global_step": 369349, "epoch": 4449, "val_loss": 6662193.0} {"train_loss": -26.300382614135742, "global_step": 369350, "epoch": 4450} {"train_loss": -26.0709171295166, "global_step": 369351, "epoch": 4450} {"train_loss": -25.971891403198242, "global_step": 369352, "epoch": 4450} {"train_loss": -25.852807998657227, "global_step": 369353, "epoch": 4450} {"train_loss": -26.017032623291016, "global_step": 369354, "epoch": 4450} {"train_loss": -25.957372665405273, "global_step": 369355, "epoch": 4450} {"train_loss": -25.96758460998535, "global_step": 369356, "epoch": 4450} {"train_loss": -25.8734130859375, "global_step": 369357, "epoch": 4450} {"train_loss": -26.177053451538086, "global_step": 369358, "epoch": 4450} {"train_loss": -26.300756454467773, "global_step": 369359, "epoch": 4450} {"train_loss": -26.157079696655273, "global_step": 369360, "epoch": 4450} {"train_loss": -26.057952880859375, "global_step": 369361, "epoch": 4450} {"train_loss": -26.39227294921875, "global_step": 369362, "epoch": 4450} {"train_loss": -26.10222816467285, "global_step": 369363, "epoch": 4450} {"train_loss": -26.298065185546875, "global_step": 369364, "epoch": 4450} {"train_loss": -26.30073356628418, "global_step": 369365, "epoch": 4450} {"train_loss": -26.483510971069336, "global_step": 369366, "epoch": 4450} {"train_loss": -26.188573837280273, "global_step": 369367, "epoch": 4450} {"train_loss": -25.969480514526367, "global_step": 369368, "epoch": 4450} {"train_loss": -26.590124130249023, "global_step": 369369, "epoch": 4450} {"train_loss": -26.659381866455078, "global_step": 369370, "epoch": 4450} {"train_loss": -26.498626708984375, "global_step": 369371, "epoch": 4450} {"train_loss": -26.659116744995117, "global_step": 369372, "epoch": 4450} {"train_loss": -26.673267364501953, "global_step": 369373, "epoch": 4450} {"train_loss": -26.327350616455078, "global_step": 369374, "epoch": 4450} {"train_loss": -26.43771743774414, "global_step": 369375, "epoch": 4450} {"train_loss": -25.973011016845703, "global_step": 369376, "epoch": 4450} {"train_loss": -26.16196632385254, "global_step": 369377, "epoch": 4450} {"train_loss": -26.79066276550293, "global_step": 369378, "epoch": 4450} {"train_loss": -26.139179229736328, "global_step": 369379, "epoch": 4450} {"train_loss": -26.510473251342773, "global_step": 369380, "epoch": 4450} {"train_loss": -26.5487060546875, "global_step": 369381, "epoch": 4450} {"train_loss": -26.610158920288086, "global_step": 369382, "epoch": 4450} {"train_loss": -26.407196044921875, "global_step": 369383, "epoch": 4450} {"train_loss": -26.161832809448242, "global_step": 369384, "epoch": 4450} {"train_loss": -26.271209716796875, "global_step": 369385, "epoch": 4450} {"train_loss": -26.291614532470703, "global_step": 369386, "epoch": 4450} {"train_loss": -26.2469482421875, "global_step": 369387, "epoch": 4450} {"train_loss": -26.20708656311035, "global_step": 369388, "epoch": 4450} {"train_loss": -26.46088218688965, "global_step": 369389, "epoch": 4450} {"train_loss": -26.41046714782715, "global_step": 369390, "epoch": 4450} {"train_loss": -26.643402099609375, "global_step": 369391, "epoch": 4450} {"train_loss": -26.52179527282715, "global_step": 369392, "epoch": 4450} {"train_loss": -26.912168502807617, "global_step": 369393, "epoch": 4450} {"train_loss": -26.30948829650879, "global_step": 369394, "epoch": 4450} {"train_loss": -26.34553337097168, "global_step": 369395, "epoch": 4450} {"train_loss": -26.410131454467773, "global_step": 369396, "epoch": 4450} {"train_loss": -26.238203048706055, "global_step": 369397, "epoch": 4450} {"train_loss": -26.439294815063477, "global_step": 369398, "epoch": 4450} {"train_loss": -26.663373947143555, "global_step": 369399, "epoch": 4450} {"train_loss": -26.501846313476562, "global_step": 369400, "epoch": 4450} {"train_loss": -26.740198135375977, "global_step": 369401, "epoch": 4450} {"train_loss": -26.187280654907227, "global_step": 369402, "epoch": 4450} {"train_loss": -26.5329647064209, "global_step": 369403, "epoch": 4450} {"train_loss": -26.463165283203125, "global_step": 369404, "epoch": 4450} {"train_loss": -26.47947120666504, "global_step": 369405, "epoch": 4450} {"train_loss": -26.171875, "global_step": 369406, "epoch": 4450} {"train_loss": -26.791669845581055, "global_step": 369407, "epoch": 4450} {"train_loss": -26.429044723510742, "global_step": 369408, "epoch": 4450} {"train_loss": -26.358076095581055, "global_step": 369409, "epoch": 4450} {"train_loss": -26.567487716674805, "global_step": 369410, "epoch": 4450} {"train_loss": -26.616168975830078, "global_step": 369411, "epoch": 4450} {"train_loss": -26.37550163269043, "global_step": 369412, "epoch": 4450} {"train_loss": -26.12216567993164, "global_step": 369413, "epoch": 4450} {"train_loss": -26.00714683532715, "global_step": 369414, "epoch": 4450} {"train_loss": -26.299840927124023, "global_step": 369415, "epoch": 4450} {"train_loss": -26.32977867126465, "global_step": 369416, "epoch": 4450} {"train_loss": -25.479734420776367, "global_step": 369417, "epoch": 4450} {"train_loss": -26.064197540283203, "global_step": 369418, "epoch": 4450} {"train_loss": -26.306325912475586, "global_step": 369419, "epoch": 4450} {"train_loss": -25.8551025390625, "global_step": 369420, "epoch": 4450} {"train_loss": -26.425323486328125, "global_step": 369421, "epoch": 4450} {"train_loss": -26.621078491210938, "global_step": 369422, "epoch": 4450} {"train_loss": -26.20977783203125, "global_step": 369423, "epoch": 4450} {"train_loss": -26.11201286315918, "global_step": 369424, "epoch": 4450} {"train_loss": -26.198169708251953, "global_step": 369425, "epoch": 4450} {"train_loss": -26.222869873046875, "global_step": 369426, "epoch": 4450} {"train_loss": -26.696613311767578, "global_step": 369427, "epoch": 4450} {"train_loss": -26.45294761657715, "global_step": 369428, "epoch": 4450} {"train_loss": -26.096057891845703, "global_step": 369429, "epoch": 4450} {"train_loss": -26.107385635375977, "global_step": 369430, "epoch": 4450} {"train_loss": -26.52961540222168, "global_step": 369431, "epoch": 4450} {"train_loss": -26.33153338604663, "global_step": 369432, "epoch": 4450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6670677.0} {"train_loss": -25.74222183227539, "global_step": 369433, "epoch": 4451} {"train_loss": -26.308969497680664, "global_step": 369434, "epoch": 4451} {"train_loss": -26.211124420166016, "global_step": 369435, "epoch": 4451} {"train_loss": -26.1507568359375, "global_step": 369436, "epoch": 4451} {"train_loss": -25.555395126342773, "global_step": 369437, "epoch": 4451} {"train_loss": -25.987173080444336, "global_step": 369438, "epoch": 4451} {"train_loss": -25.88506507873535, "global_step": 369439, "epoch": 4451} {"train_loss": -26.3857364654541, "global_step": 369440, "epoch": 4451} {"train_loss": -25.61663246154785, "global_step": 369441, "epoch": 4451} {"train_loss": -26.1676082611084, "global_step": 369442, "epoch": 4451} {"train_loss": -26.10672950744629, "global_step": 369443, "epoch": 4451} {"train_loss": -26.05393409729004, "global_step": 369444, "epoch": 4451} {"train_loss": -26.15114402770996, "global_step": 369445, "epoch": 4451} {"train_loss": -26.345550537109375, "global_step": 369446, "epoch": 4451} {"train_loss": -26.429906845092773, "global_step": 369447, "epoch": 4451} {"train_loss": -26.11667251586914, "global_step": 369448, "epoch": 4451} {"train_loss": -26.11543083190918, "global_step": 369449, "epoch": 4451} {"train_loss": -26.51324462890625, "global_step": 369450, "epoch": 4451} {"train_loss": -25.908777236938477, "global_step": 369451, "epoch": 4451} {"train_loss": -26.422143936157227, "global_step": 369452, "epoch": 4451} {"train_loss": -26.534032821655273, "global_step": 369453, "epoch": 4451} {"train_loss": -25.98479652404785, "global_step": 369454, "epoch": 4451} {"train_loss": -26.325641632080078, "global_step": 369455, "epoch": 4451} {"train_loss": -26.41102409362793, "global_step": 369456, "epoch": 4451} {"train_loss": -26.549346923828125, "global_step": 369457, "epoch": 4451} {"train_loss": -26.03995704650879, "global_step": 369458, "epoch": 4451} {"train_loss": -26.684194564819336, "global_step": 369459, "epoch": 4451} {"train_loss": -26.423004150390625, "global_step": 369460, "epoch": 4451} {"train_loss": -26.39994239807129, "global_step": 369461, "epoch": 4451} {"train_loss": -26.001239776611328, "global_step": 369462, "epoch": 4451} {"train_loss": -26.729034423828125, "global_step": 369463, "epoch": 4451} {"train_loss": -26.371816635131836, "global_step": 369464, "epoch": 4451} {"train_loss": -26.45026969909668, "global_step": 369465, "epoch": 4451} {"train_loss": -26.447559356689453, "global_step": 369466, "epoch": 4451} {"train_loss": -26.33119773864746, "global_step": 369467, "epoch": 4451} {"train_loss": -26.64776611328125, "global_step": 369468, "epoch": 4451} {"train_loss": -26.77325439453125, "global_step": 369469, "epoch": 4451} {"train_loss": -26.579633712768555, "global_step": 369470, "epoch": 4451} {"train_loss": -26.4907169342041, "global_step": 369471, "epoch": 4451} {"train_loss": -26.475290298461914, "global_step": 369472, "epoch": 4451} {"train_loss": -26.492572784423828, "global_step": 369473, "epoch": 4451} {"train_loss": -26.178380966186523, "global_step": 369474, "epoch": 4451} {"train_loss": -25.96014404296875, "global_step": 369475, "epoch": 4451} {"train_loss": -26.464380264282227, "global_step": 369476, "epoch": 4451} {"train_loss": -26.448266983032227, "global_step": 369477, "epoch": 4451} {"train_loss": -26.17041015625, "global_step": 369478, "epoch": 4451} {"train_loss": -26.340330123901367, "global_step": 369479, "epoch": 4451} {"train_loss": -26.300085067749023, "global_step": 369480, "epoch": 4451} {"train_loss": -26.502317428588867, "global_step": 369481, "epoch": 4451} {"train_loss": -26.262420654296875, "global_step": 369482, "epoch": 4451} {"train_loss": -26.560606002807617, "global_step": 369483, "epoch": 4451} {"train_loss": -26.54422950744629, "global_step": 369484, "epoch": 4451} {"train_loss": -26.073776245117188, "global_step": 369485, "epoch": 4451} {"train_loss": -26.659122467041016, "global_step": 369486, "epoch": 4451} {"train_loss": -26.37139320373535, "global_step": 369487, "epoch": 4451} {"train_loss": -26.199365615844727, "global_step": 369488, "epoch": 4451} {"train_loss": -26.568349838256836, "global_step": 369489, "epoch": 4451} {"train_loss": -26.23870849609375, "global_step": 369490, "epoch": 4451} {"train_loss": -26.577533721923828, "global_step": 369491, "epoch": 4451} {"train_loss": -26.419708251953125, "global_step": 369492, "epoch": 4451} {"train_loss": -26.168973922729492, "global_step": 369493, "epoch": 4451} {"train_loss": -26.489139556884766, "global_step": 369494, "epoch": 4451} {"train_loss": -25.978315353393555, "global_step": 369495, "epoch": 4451} {"train_loss": -26.048675537109375, "global_step": 369496, "epoch": 4451} {"train_loss": -26.50946044921875, "global_step": 369497, "epoch": 4451} {"train_loss": -26.142236709594727, "global_step": 369498, "epoch": 4451} {"train_loss": -26.20867347717285, "global_step": 369499, "epoch": 4451} {"train_loss": -25.99983787536621, "global_step": 369500, "epoch": 4451} {"train_loss": -26.478443145751953, "global_step": 369501, "epoch": 4451} {"train_loss": -26.3817195892334, "global_step": 369502, "epoch": 4451} {"train_loss": -26.455663681030273, "global_step": 369503, "epoch": 4451} {"train_loss": -26.802865982055664, "global_step": 369504, "epoch": 4451} {"train_loss": -26.070890426635742, "global_step": 369505, "epoch": 4451} {"train_loss": -26.439788818359375, "global_step": 369506, "epoch": 4451} {"train_loss": -26.45590591430664, "global_step": 369507, "epoch": 4451} {"train_loss": -26.302352905273438, "global_step": 369508, "epoch": 4451} {"train_loss": -26.393213272094727, "global_step": 369509, "epoch": 4451} {"train_loss": -26.348148345947266, "global_step": 369510, "epoch": 4451} {"train_loss": -26.2618465423584, "global_step": 369511, "epoch": 4451} {"train_loss": -26.17388916015625, "global_step": 369512, "epoch": 4451} {"train_loss": -26.385046005249023, "global_step": 369513, "epoch": 4451} {"train_loss": -26.24356460571289, "global_step": 369514, "epoch": 4451} {"train_loss": -26.31696719433888, "global_step": 369515, "epoch": 4451, "val_loss": 6702335.5} {"train_loss": -25.18086051940918, "global_step": 369516, "epoch": 4452} {"train_loss": -25.970428466796875, "global_step": 369517, "epoch": 4452} {"train_loss": -24.71456527709961, "global_step": 369518, "epoch": 4452} {"train_loss": -25.307188034057617, "global_step": 369519, "epoch": 4452} {"train_loss": -25.007055282592773, "global_step": 369520, "epoch": 4452} {"train_loss": -25.771499633789062, "global_step": 369521, "epoch": 4452} {"train_loss": -24.869346618652344, "global_step": 369522, "epoch": 4452} {"train_loss": -25.334775924682617, "global_step": 369523, "epoch": 4452} {"train_loss": -25.59990119934082, "global_step": 369524, "epoch": 4452} {"train_loss": -25.22185707092285, "global_step": 369525, "epoch": 4452} {"train_loss": -25.507902145385742, "global_step": 369526, "epoch": 4452} {"train_loss": -26.234283447265625, "global_step": 369527, "epoch": 4452} {"train_loss": -25.664609909057617, "global_step": 369528, "epoch": 4452} {"train_loss": -25.626087188720703, "global_step": 369529, "epoch": 4452} {"train_loss": -25.739994049072266, "global_step": 369530, "epoch": 4452} {"train_loss": -25.910205841064453, "global_step": 369531, "epoch": 4452} {"train_loss": -25.50115966796875, "global_step": 369532, "epoch": 4452} {"train_loss": -25.720361709594727, "global_step": 369533, "epoch": 4452} {"train_loss": -25.930622100830078, "global_step": 369534, "epoch": 4452} {"train_loss": -25.997533798217773, "global_step": 369535, "epoch": 4452} {"train_loss": -25.44955825805664, "global_step": 369536, "epoch": 4452} {"train_loss": -25.958606719970703, "global_step": 369537, "epoch": 4452} {"train_loss": -25.704364776611328, "global_step": 369538, "epoch": 4452} {"train_loss": -25.733381271362305, "global_step": 369539, "epoch": 4452} {"train_loss": -26.026092529296875, "global_step": 369540, "epoch": 4452} {"train_loss": -26.127668380737305, "global_step": 369541, "epoch": 4452} {"train_loss": -25.9364013671875, "global_step": 369542, "epoch": 4452} {"train_loss": -25.836048126220703, "global_step": 369543, "epoch": 4452} {"train_loss": -26.055601119995117, "global_step": 369544, "epoch": 4452} {"train_loss": -26.4200439453125, "global_step": 369545, "epoch": 4452} {"train_loss": -26.168094635009766, "global_step": 369546, "epoch": 4452} {"train_loss": -26.27007484436035, "global_step": 369547, "epoch": 4452} {"train_loss": -26.230321884155273, "global_step": 369548, "epoch": 4452} {"train_loss": -25.887439727783203, "global_step": 369549, "epoch": 4452} {"train_loss": -26.005369186401367, "global_step": 369550, "epoch": 4452} {"train_loss": -26.197433471679688, "global_step": 369551, "epoch": 4452} {"train_loss": -25.981491088867188, "global_step": 369552, "epoch": 4452} {"train_loss": -26.102436065673828, "global_step": 369553, "epoch": 4452} {"train_loss": -26.12799644470215, "global_step": 369554, "epoch": 4452} {"train_loss": -26.247974395751953, "global_step": 369555, "epoch": 4452} {"train_loss": -26.334064483642578, "global_step": 369556, "epoch": 4452} {"train_loss": -25.990381240844727, "global_step": 369557, "epoch": 4452} {"train_loss": -26.524887084960938, "global_step": 369558, "epoch": 4452} {"train_loss": -26.1655216217041, "global_step": 369559, "epoch": 4452} {"train_loss": -26.08625602722168, "global_step": 369560, "epoch": 4452} {"train_loss": -26.448694229125977, "global_step": 369561, "epoch": 4452} {"train_loss": -26.502954483032227, "global_step": 369562, "epoch": 4452} {"train_loss": -26.65679359436035, "global_step": 369563, "epoch": 4452} {"train_loss": -26.806982040405273, "global_step": 369564, "epoch": 4452} {"train_loss": -26.4063720703125, "global_step": 369565, "epoch": 4452} {"train_loss": -26.361114501953125, "global_step": 369566, "epoch": 4452} {"train_loss": -26.17462158203125, "global_step": 369567, "epoch": 4452} {"train_loss": -26.01592445373535, "global_step": 369568, "epoch": 4452} {"train_loss": -26.23651123046875, "global_step": 369569, "epoch": 4452} {"train_loss": -26.607168197631836, "global_step": 369570, "epoch": 4452} {"train_loss": -25.793066024780273, "global_step": 369571, "epoch": 4452} {"train_loss": -26.142719268798828, "global_step": 369572, "epoch": 4452} {"train_loss": -26.42555809020996, "global_step": 369573, "epoch": 4452} {"train_loss": -26.1160888671875, "global_step": 369574, "epoch": 4452} {"train_loss": -26.019092559814453, "global_step": 369575, "epoch": 4452} {"train_loss": -25.9023380279541, "global_step": 369576, "epoch": 4452} {"train_loss": -26.021020889282227, "global_step": 369577, "epoch": 4452} {"train_loss": -26.737436294555664, "global_step": 369578, "epoch": 4452} {"train_loss": -26.09531021118164, "global_step": 369579, "epoch": 4452} {"train_loss": -25.59473991394043, "global_step": 369580, "epoch": 4452} {"train_loss": -26.30915641784668, "global_step": 369581, "epoch": 4452} {"train_loss": -26.30946922302246, "global_step": 369582, "epoch": 4452} {"train_loss": -26.17702293395996, "global_step": 369583, "epoch": 4452} {"train_loss": -26.176050186157227, "global_step": 369584, "epoch": 4452} {"train_loss": -26.65509033203125, "global_step": 369585, "epoch": 4452} {"train_loss": -26.236831665039062, "global_step": 369586, "epoch": 4452} {"train_loss": -26.87898063659668, "global_step": 369587, "epoch": 4452} {"train_loss": -26.170475006103516, "global_step": 369588, "epoch": 4452} {"train_loss": -26.3966121673584, "global_step": 369589, "epoch": 4452} {"train_loss": -26.463241577148438, "global_step": 369590, "epoch": 4452} {"train_loss": -26.442276000976562, "global_step": 369591, "epoch": 4452} {"train_loss": -26.741382598876953, "global_step": 369592, "epoch": 4452} {"train_loss": -26.559675216674805, "global_step": 369593, "epoch": 4452} {"train_loss": -26.708724975585938, "global_step": 369594, "epoch": 4452} {"train_loss": -26.595355987548828, "global_step": 369595, "epoch": 4452} {"train_loss": -26.562530517578125, "global_step": 369596, "epoch": 4452} {"train_loss": -26.753284454345703, "global_step": 369597, "epoch": 4452} {"train_loss": -26.08067696353039, "global_step": 369598, "epoch": 4452, "val_loss": 6683142.0} {"train_loss": -26.1086483001709, "global_step": 369599, "epoch": 4453} {"train_loss": -26.119779586791992, "global_step": 369600, "epoch": 4453} {"train_loss": -26.715612411499023, "global_step": 369601, "epoch": 4453} {"train_loss": -26.11249351501465, "global_step": 369602, "epoch": 4453} {"train_loss": -26.293872833251953, "global_step": 369603, "epoch": 4453} {"train_loss": -26.34442138671875, "global_step": 369604, "epoch": 4453} {"train_loss": -25.895627975463867, "global_step": 369605, "epoch": 4453} {"train_loss": -26.348770141601562, "global_step": 369606, "epoch": 4453} {"train_loss": -26.445581436157227, "global_step": 369607, "epoch": 4453} {"train_loss": -26.316055297851562, "global_step": 369608, "epoch": 4453} {"train_loss": -26.26995277404785, "global_step": 369609, "epoch": 4453} {"train_loss": -26.18159294128418, "global_step": 369610, "epoch": 4453} {"train_loss": -26.47612953186035, "global_step": 369611, "epoch": 4453} {"train_loss": -26.594648361206055, "global_step": 369612, "epoch": 4453} {"train_loss": -26.0687313079834, "global_step": 369613, "epoch": 4453} {"train_loss": -26.3918514251709, "global_step": 369614, "epoch": 4453} {"train_loss": -26.21061134338379, "global_step": 369615, "epoch": 4453} {"train_loss": -26.928836822509766, "global_step": 369616, "epoch": 4453} {"train_loss": -26.1447811126709, "global_step": 369617, "epoch": 4453} {"train_loss": -26.350250244140625, "global_step": 369618, "epoch": 4453} {"train_loss": -26.1241397857666, "global_step": 369619, "epoch": 4453} {"train_loss": -26.021421432495117, "global_step": 369620, "epoch": 4453} {"train_loss": -25.990116119384766, "global_step": 369621, "epoch": 4453} {"train_loss": -26.50037956237793, "global_step": 369622, "epoch": 4453} {"train_loss": -26.399560928344727, "global_step": 369623, "epoch": 4453} {"train_loss": -26.182641983032227, "global_step": 369624, "epoch": 4453} {"train_loss": -26.465665817260742, "global_step": 369625, "epoch": 4453} {"train_loss": -26.32159996032715, "global_step": 369626, "epoch": 4453} {"train_loss": -26.180999755859375, "global_step": 369627, "epoch": 4453} {"train_loss": -26.20123863220215, "global_step": 369628, "epoch": 4453} {"train_loss": -26.432209014892578, "global_step": 369629, "epoch": 4453} {"train_loss": -26.68722915649414, "global_step": 369630, "epoch": 4453} {"train_loss": -26.34527587890625, "global_step": 369631, "epoch": 4453} {"train_loss": -26.50469398498535, "global_step": 369632, "epoch": 4453} {"train_loss": -26.433094024658203, "global_step": 369633, "epoch": 4453} {"train_loss": -26.347396850585938, "global_step": 369634, "epoch": 4453} {"train_loss": -26.518095016479492, "global_step": 369635, "epoch": 4453} {"train_loss": -26.36097526550293, "global_step": 369636, "epoch": 4453} {"train_loss": -26.446426391601562, "global_step": 369637, "epoch": 4453} {"train_loss": -26.576379776000977, "global_step": 369638, "epoch": 4453} {"train_loss": -26.590967178344727, "global_step": 369639, "epoch": 4453} {"train_loss": -26.418378829956055, "global_step": 369640, "epoch": 4453} {"train_loss": -26.21185302734375, "global_step": 369641, "epoch": 4453} {"train_loss": -26.422834396362305, "global_step": 369642, "epoch": 4453} {"train_loss": -26.458398818969727, "global_step": 369643, "epoch": 4453} {"train_loss": -26.30902671813965, "global_step": 369644, "epoch": 4453} {"train_loss": -26.620264053344727, "global_step": 369645, "epoch": 4453} {"train_loss": -26.608484268188477, "global_step": 369646, "epoch": 4453} {"train_loss": -26.429244995117188, "global_step": 369647, "epoch": 4453} {"train_loss": -26.355192184448242, "global_step": 369648, "epoch": 4453} {"train_loss": -26.760379791259766, "global_step": 369649, "epoch": 4453} {"train_loss": -26.54837989807129, "global_step": 369650, "epoch": 4453} {"train_loss": -26.096771240234375, "global_step": 369651, "epoch": 4453} {"train_loss": -26.43960952758789, "global_step": 369652, "epoch": 4453} {"train_loss": -26.596418380737305, "global_step": 369653, "epoch": 4453} {"train_loss": -26.268278121948242, "global_step": 369654, "epoch": 4453} {"train_loss": -26.097623825073242, "global_step": 369655, "epoch": 4453} {"train_loss": -25.528339385986328, "global_step": 369656, "epoch": 4453} {"train_loss": -25.05848503112793, "global_step": 369657, "epoch": 4453} {"train_loss": -24.565580368041992, "global_step": 369658, "epoch": 4453} {"train_loss": -26.01478385925293, "global_step": 369659, "epoch": 4453} {"train_loss": -26.033552169799805, "global_step": 369660, "epoch": 4453} {"train_loss": -25.43109703063965, "global_step": 369661, "epoch": 4453} {"train_loss": -25.531583786010742, "global_step": 369662, "epoch": 4453} {"train_loss": -25.93157386779785, "global_step": 369663, "epoch": 4453} {"train_loss": -25.899168014526367, "global_step": 369664, "epoch": 4453} {"train_loss": -25.24672508239746, "global_step": 369665, "epoch": 4453} {"train_loss": -25.918378829956055, "global_step": 369666, "epoch": 4453} {"train_loss": -26.019805908203125, "global_step": 369667, "epoch": 4453} {"train_loss": -25.56050682067871, "global_step": 369668, "epoch": 4453} {"train_loss": -25.732019424438477, "global_step": 369669, "epoch": 4453} {"train_loss": -25.803150177001953, "global_step": 369670, "epoch": 4453} {"train_loss": -25.771390914916992, "global_step": 369671, "epoch": 4453} {"train_loss": -25.974613189697266, "global_step": 369672, "epoch": 4453} {"train_loss": -25.979528427124023, "global_step": 369673, "epoch": 4453} {"train_loss": -25.979557037353516, "global_step": 369674, "epoch": 4453} {"train_loss": -26.219043731689453, "global_step": 369675, "epoch": 4453} {"train_loss": -25.821735382080078, "global_step": 369676, "epoch": 4453} {"train_loss": -26.446247100830078, "global_step": 369677, "epoch": 4453} {"train_loss": -25.938276290893555, "global_step": 369678, "epoch": 4453} {"train_loss": -26.335668563842773, "global_step": 369679, "epoch": 4453} {"train_loss": -26.042221069335938, "global_step": 369680, "epoch": 4453} {"train_loss": -26.188184990940325, "global_step": 369681, "epoch": 4453, "val_loss": 6724407.5} {"train_loss": -25.776941299438477, "global_step": 369682, "epoch": 4454} {"train_loss": -25.910863876342773, "global_step": 369683, "epoch": 4454} {"train_loss": -25.75257682800293, "global_step": 369684, "epoch": 4454} {"train_loss": -26.039108276367188, "global_step": 369685, "epoch": 4454} {"train_loss": -25.870264053344727, "global_step": 369686, "epoch": 4454} {"train_loss": -25.978796005249023, "global_step": 369687, "epoch": 4454} {"train_loss": -25.894567489624023, "global_step": 369688, "epoch": 4454} {"train_loss": -26.199462890625, "global_step": 369689, "epoch": 4454} {"train_loss": -25.860675811767578, "global_step": 369690, "epoch": 4454} {"train_loss": -26.346027374267578, "global_step": 369691, "epoch": 4454} {"train_loss": -25.90955924987793, "global_step": 369692, "epoch": 4454} {"train_loss": -25.998889923095703, "global_step": 369693, "epoch": 4454} {"train_loss": -25.832971572875977, "global_step": 369694, "epoch": 4454} {"train_loss": -26.33009147644043, "global_step": 369695, "epoch": 4454} {"train_loss": -26.336633682250977, "global_step": 369696, "epoch": 4454} {"train_loss": -26.175580978393555, "global_step": 369697, "epoch": 4454} {"train_loss": -26.214963912963867, "global_step": 369698, "epoch": 4454} {"train_loss": -26.213043212890625, "global_step": 369699, "epoch": 4454} {"train_loss": -25.984851837158203, "global_step": 369700, "epoch": 4454} {"train_loss": -26.457660675048828, "global_step": 369701, "epoch": 4454} {"train_loss": -26.400259017944336, "global_step": 369702, "epoch": 4454} {"train_loss": -26.359821319580078, "global_step": 369703, "epoch": 4454} {"train_loss": -26.213443756103516, "global_step": 369704, "epoch": 4454} {"train_loss": -26.203083038330078, "global_step": 369705, "epoch": 4454} {"train_loss": -26.000722885131836, "global_step": 369706, "epoch": 4454} {"train_loss": -26.370925903320312, "global_step": 369707, "epoch": 4454} {"train_loss": -26.5229434967041, "global_step": 369708, "epoch": 4454} {"train_loss": -26.466506958007812, "global_step": 369709, "epoch": 4454} {"train_loss": -26.40654945373535, "global_step": 369710, "epoch": 4454} {"train_loss": -26.51349449157715, "global_step": 369711, "epoch": 4454} {"train_loss": -26.146020889282227, "global_step": 369712, "epoch": 4454} {"train_loss": -26.70053482055664, "global_step": 369713, "epoch": 4454} {"train_loss": -26.6276912689209, "global_step": 369714, "epoch": 4454} {"train_loss": -26.205102920532227, "global_step": 369715, "epoch": 4454} {"train_loss": -26.187885284423828, "global_step": 369716, "epoch": 4454} {"train_loss": -26.80234146118164, "global_step": 369717, "epoch": 4454} {"train_loss": -26.507648468017578, "global_step": 369718, "epoch": 4454} {"train_loss": -26.195249557495117, "global_step": 369719, "epoch": 4454} {"train_loss": -26.690418243408203, "global_step": 369720, "epoch": 4454} {"train_loss": -26.170867919921875, "global_step": 369721, "epoch": 4454} {"train_loss": -26.70134925842285, "global_step": 369722, "epoch": 4454} {"train_loss": -26.536054611206055, "global_step": 369723, "epoch": 4454} {"train_loss": -26.951562881469727, "global_step": 369724, "epoch": 4454} {"train_loss": -26.49009132385254, "global_step": 369725, "epoch": 4454} {"train_loss": -26.294721603393555, "global_step": 369726, "epoch": 4454} {"train_loss": -27.035568237304688, "global_step": 369727, "epoch": 4454} {"train_loss": -26.4331111907959, "global_step": 369728, "epoch": 4454} {"train_loss": -26.689863204956055, "global_step": 369729, "epoch": 4454} {"train_loss": -26.236204147338867, "global_step": 369730, "epoch": 4454} {"train_loss": -26.64912986755371, "global_step": 369731, "epoch": 4454} {"train_loss": -26.6005916595459, "global_step": 369732, "epoch": 4454} {"train_loss": -26.85565757751465, "global_step": 369733, "epoch": 4454} {"train_loss": -26.142108917236328, "global_step": 369734, "epoch": 4454} {"train_loss": -26.012258529663086, "global_step": 369735, "epoch": 4454} {"train_loss": -25.727344512939453, "global_step": 369736, "epoch": 4454} {"train_loss": -26.019256591796875, "global_step": 369737, "epoch": 4454} {"train_loss": -26.308841705322266, "global_step": 369738, "epoch": 4454} {"train_loss": -26.341251373291016, "global_step": 369739, "epoch": 4454} {"train_loss": -25.74794578552246, "global_step": 369740, "epoch": 4454} {"train_loss": -26.335824966430664, "global_step": 369741, "epoch": 4454} {"train_loss": -25.770898818969727, "global_step": 369742, "epoch": 4454} {"train_loss": -26.081159591674805, "global_step": 369743, "epoch": 4454} {"train_loss": -26.348419189453125, "global_step": 369744, "epoch": 4454} {"train_loss": -25.788434982299805, "global_step": 369745, "epoch": 4454} {"train_loss": -26.30006217956543, "global_step": 369746, "epoch": 4454} {"train_loss": -26.417682647705078, "global_step": 369747, "epoch": 4454} {"train_loss": -25.92706298828125, "global_step": 369748, "epoch": 4454} {"train_loss": -25.783918380737305, "global_step": 369749, "epoch": 4454} {"train_loss": -26.235061645507812, "global_step": 369750, "epoch": 4454} {"train_loss": -26.467031478881836, "global_step": 369751, "epoch": 4454} {"train_loss": -25.87764549255371, "global_step": 369752, "epoch": 4454} {"train_loss": -26.534469604492188, "global_step": 369753, "epoch": 4454} {"train_loss": -26.19935417175293, "global_step": 369754, "epoch": 4454} {"train_loss": -26.592273712158203, "global_step": 369755, "epoch": 4454} {"train_loss": -26.153730392456055, "global_step": 369756, "epoch": 4454} {"train_loss": -26.229475021362305, "global_step": 369757, "epoch": 4454} {"train_loss": -26.10036277770996, "global_step": 369758, "epoch": 4454} {"train_loss": -26.64558219909668, "global_step": 369759, "epoch": 4454} {"train_loss": -26.189172744750977, "global_step": 369760, "epoch": 4454} {"train_loss": -26.5020694732666, "global_step": 369761, "epoch": 4454} {"train_loss": -26.366296768188477, "global_step": 369762, "epoch": 4454} {"train_loss": -26.019590377807617, "global_step": 369763, "epoch": 4454} {"train_loss": -26.257945325001177, "global_step": 369764, "epoch": 4454, "val_loss": 6619028.0} {"train_loss": -25.1469669342041, "global_step": 369765, "epoch": 4455} {"train_loss": -25.01898193359375, "global_step": 369766, "epoch": 4455} {"train_loss": -25.48150062561035, "global_step": 369767, "epoch": 4455} {"train_loss": -25.445898056030273, "global_step": 369768, "epoch": 4455} {"train_loss": -25.734006881713867, "global_step": 369769, "epoch": 4455} {"train_loss": -25.261219024658203, "global_step": 369770, "epoch": 4455} {"train_loss": -25.798664093017578, "global_step": 369771, "epoch": 4455} {"train_loss": -25.839094161987305, "global_step": 369772, "epoch": 4455} {"train_loss": -25.570737838745117, "global_step": 369773, "epoch": 4455} {"train_loss": -26.0661678314209, "global_step": 369774, "epoch": 4455} {"train_loss": -25.724889755249023, "global_step": 369775, "epoch": 4455} {"train_loss": -26.33576774597168, "global_step": 369776, "epoch": 4455} {"train_loss": -25.870901107788086, "global_step": 369777, "epoch": 4455} {"train_loss": -25.928131103515625, "global_step": 369778, "epoch": 4455} {"train_loss": -26.308990478515625, "global_step": 369779, "epoch": 4455} {"train_loss": -25.928197860717773, "global_step": 369780, "epoch": 4455} {"train_loss": -26.137897491455078, "global_step": 369781, "epoch": 4455} {"train_loss": -26.351224899291992, "global_step": 369782, "epoch": 4455} {"train_loss": -26.271442413330078, "global_step": 369783, "epoch": 4455} {"train_loss": -26.09539794921875, "global_step": 369784, "epoch": 4455} {"train_loss": -26.379297256469727, "global_step": 369785, "epoch": 4455} {"train_loss": -25.996274948120117, "global_step": 369786, "epoch": 4455} {"train_loss": -26.19236183166504, "global_step": 369787, "epoch": 4455} {"train_loss": -26.348417282104492, "global_step": 369788, "epoch": 4455} {"train_loss": -26.40976905822754, "global_step": 369789, "epoch": 4455} {"train_loss": -26.415334701538086, "global_step": 369790, "epoch": 4455} {"train_loss": -26.242725372314453, "global_step": 369791, "epoch": 4455} {"train_loss": -26.698400497436523, "global_step": 369792, "epoch": 4455} {"train_loss": -26.3693790435791, "global_step": 369793, "epoch": 4455} {"train_loss": -26.627744674682617, "global_step": 369794, "epoch": 4455} {"train_loss": -26.43857765197754, "global_step": 369795, "epoch": 4455} {"train_loss": -26.383197784423828, "global_step": 369796, "epoch": 4455} {"train_loss": -26.58967399597168, "global_step": 369797, "epoch": 4455} {"train_loss": -26.784597396850586, "global_step": 369798, "epoch": 4455} {"train_loss": -26.50520133972168, "global_step": 369799, "epoch": 4455} {"train_loss": -26.484527587890625, "global_step": 369800, "epoch": 4455} {"train_loss": -26.617755889892578, "global_step": 369801, "epoch": 4455} {"train_loss": -26.458892822265625, "global_step": 369802, "epoch": 4455} {"train_loss": -26.748437881469727, "global_step": 369803, "epoch": 4455} {"train_loss": -26.79291343688965, "global_step": 369804, "epoch": 4455} {"train_loss": -26.668149948120117, "global_step": 369805, "epoch": 4455} {"train_loss": -26.466949462890625, "global_step": 369806, "epoch": 4455} {"train_loss": -26.611684799194336, "global_step": 369807, "epoch": 4455} {"train_loss": -26.64449119567871, "global_step": 369808, "epoch": 4455} {"train_loss": -26.25640869140625, "global_step": 369809, "epoch": 4455} {"train_loss": -26.332183837890625, "global_step": 369810, "epoch": 4455} {"train_loss": -26.317052841186523, "global_step": 369811, "epoch": 4455} {"train_loss": -26.203134536743164, "global_step": 369812, "epoch": 4455} {"train_loss": -26.527700424194336, "global_step": 369813, "epoch": 4455} {"train_loss": -26.66470718383789, "global_step": 369814, "epoch": 4455} {"train_loss": -26.505224227905273, "global_step": 369815, "epoch": 4455} {"train_loss": -26.533166885375977, "global_step": 369816, "epoch": 4455} {"train_loss": -26.10166358947754, "global_step": 369817, "epoch": 4455} {"train_loss": -26.205677032470703, "global_step": 369818, "epoch": 4455} {"train_loss": -26.600982666015625, "global_step": 369819, "epoch": 4455} {"train_loss": -26.18478775024414, "global_step": 369820, "epoch": 4455} {"train_loss": -26.43888282775879, "global_step": 369821, "epoch": 4455} {"train_loss": -26.296894073486328, "global_step": 369822, "epoch": 4455} {"train_loss": -26.28667640686035, "global_step": 369823, "epoch": 4455} {"train_loss": -26.647001266479492, "global_step": 369824, "epoch": 4455} {"train_loss": -26.32480239868164, "global_step": 369825, "epoch": 4455} {"train_loss": -26.06264305114746, "global_step": 369826, "epoch": 4455} {"train_loss": -26.418289184570312, "global_step": 369827, "epoch": 4455} {"train_loss": -26.553821563720703, "global_step": 369828, "epoch": 4455} {"train_loss": -26.13751792907715, "global_step": 369829, "epoch": 4455} {"train_loss": -26.536376953125, "global_step": 369830, "epoch": 4455} {"train_loss": -26.37835121154785, "global_step": 369831, "epoch": 4455} {"train_loss": -26.291967391967773, "global_step": 369832, "epoch": 4455} {"train_loss": -26.578277587890625, "global_step": 369833, "epoch": 4455} {"train_loss": -26.463027954101562, "global_step": 369834, "epoch": 4455} {"train_loss": -26.710412979125977, "global_step": 369835, "epoch": 4455} {"train_loss": -26.324132919311523, "global_step": 369836, "epoch": 4455} {"train_loss": -26.57161521911621, "global_step": 369837, "epoch": 4455} {"train_loss": -26.350849151611328, "global_step": 369838, "epoch": 4455} {"train_loss": -26.639606475830078, "global_step": 369839, "epoch": 4455} {"train_loss": -26.548141479492188, "global_step": 369840, "epoch": 4455} {"train_loss": -26.55665397644043, "global_step": 369841, "epoch": 4455} {"train_loss": -26.345230102539062, "global_step": 369842, "epoch": 4455} {"train_loss": -26.295507431030273, "global_step": 369843, "epoch": 4455} {"train_loss": -26.473230361938477, "global_step": 369844, "epoch": 4455} {"train_loss": -26.280790328979492, "global_step": 369845, "epoch": 4455} {"train_loss": -26.277997970581055, "global_step": 369846, "epoch": 4455} {"train_loss": -26.28275294476245, "global_step": 369847, "epoch": 4455, "val_loss": 6613964.0} {"train_loss": -24.454124450683594, "global_step": 369848, "epoch": 4456} {"train_loss": -23.181116104125977, "global_step": 369849, "epoch": 4456} {"train_loss": -23.401897430419922, "global_step": 369850, "epoch": 4456} {"train_loss": -25.75439453125, "global_step": 369851, "epoch": 4456} {"train_loss": -25.286396026611328, "global_step": 369852, "epoch": 4456} {"train_loss": -24.980512619018555, "global_step": 369853, "epoch": 4456} {"train_loss": -25.182205200195312, "global_step": 369854, "epoch": 4456} {"train_loss": -25.360706329345703, "global_step": 369855, "epoch": 4456} {"train_loss": -25.269634246826172, "global_step": 369856, "epoch": 4456} {"train_loss": -25.681089401245117, "global_step": 369857, "epoch": 4456} {"train_loss": -24.74017906188965, "global_step": 369858, "epoch": 4456} {"train_loss": -25.802875518798828, "global_step": 369859, "epoch": 4456} {"train_loss": -25.594783782958984, "global_step": 369860, "epoch": 4456} {"train_loss": -25.18975067138672, "global_step": 369861, "epoch": 4456} {"train_loss": -25.403474807739258, "global_step": 369862, "epoch": 4456} {"train_loss": -25.744461059570312, "global_step": 369863, "epoch": 4456} {"train_loss": -25.7264404296875, "global_step": 369864, "epoch": 4456} {"train_loss": -25.2613525390625, "global_step": 369865, "epoch": 4456} {"train_loss": -25.594242095947266, "global_step": 369866, "epoch": 4456} {"train_loss": -26.063207626342773, "global_step": 369867, "epoch": 4456} {"train_loss": -25.824462890625, "global_step": 369868, "epoch": 4456} {"train_loss": -26.091745376586914, "global_step": 369869, "epoch": 4456} {"train_loss": -25.990087509155273, "global_step": 369870, "epoch": 4456} {"train_loss": -26.043521881103516, "global_step": 369871, "epoch": 4456} {"train_loss": -25.799833297729492, "global_step": 369872, "epoch": 4456} {"train_loss": -26.19329833984375, "global_step": 369873, "epoch": 4456} {"train_loss": -25.65436363220215, "global_step": 369874, "epoch": 4456} {"train_loss": -26.288862228393555, "global_step": 369875, "epoch": 4456} {"train_loss": -25.72723388671875, "global_step": 369876, "epoch": 4456} {"train_loss": -26.307357788085938, "global_step": 369877, "epoch": 4456} {"train_loss": -26.291309356689453, "global_step": 369878, "epoch": 4456} {"train_loss": -25.91629409790039, "global_step": 369879, "epoch": 4456} {"train_loss": -25.966861724853516, "global_step": 369880, "epoch": 4456} {"train_loss": -26.446929931640625, "global_step": 369881, "epoch": 4456} {"train_loss": -26.02412223815918, "global_step": 369882, "epoch": 4456} {"train_loss": -26.068761825561523, "global_step": 369883, "epoch": 4456} {"train_loss": -26.093647003173828, "global_step": 369884, "epoch": 4456} {"train_loss": -26.351333618164062, "global_step": 369885, "epoch": 4456} {"train_loss": -26.413654327392578, "global_step": 369886, "epoch": 4456} {"train_loss": -26.349878311157227, "global_step": 369887, "epoch": 4456} {"train_loss": -26.434232711791992, "global_step": 369888, "epoch": 4456} {"train_loss": -26.41470718383789, "global_step": 369889, "epoch": 4456} {"train_loss": -26.329730987548828, "global_step": 369890, "epoch": 4456} {"train_loss": -26.441904067993164, "global_step": 369891, "epoch": 4456} {"train_loss": -26.6251277923584, "global_step": 369892, "epoch": 4456} {"train_loss": -26.3537654876709, "global_step": 369893, "epoch": 4456} {"train_loss": -26.47714614868164, "global_step": 369894, "epoch": 4456} {"train_loss": -26.33624267578125, "global_step": 369895, "epoch": 4456} {"train_loss": -26.2580509185791, "global_step": 369896, "epoch": 4456} {"train_loss": -26.71451759338379, "global_step": 369897, "epoch": 4456} {"train_loss": -26.612625122070312, "global_step": 369898, "epoch": 4456} {"train_loss": -26.342580795288086, "global_step": 369899, "epoch": 4456} {"train_loss": -26.31573486328125, "global_step": 369900, "epoch": 4456} {"train_loss": -26.648395538330078, "global_step": 369901, "epoch": 4456} {"train_loss": -26.475055694580078, "global_step": 369902, "epoch": 4456} {"train_loss": -26.343259811401367, "global_step": 369903, "epoch": 4456} {"train_loss": -26.220294952392578, "global_step": 369904, "epoch": 4456} {"train_loss": -26.7813663482666, "global_step": 369905, "epoch": 4456} {"train_loss": -26.351057052612305, "global_step": 369906, "epoch": 4456} {"train_loss": -26.505231857299805, "global_step": 369907, "epoch": 4456} {"train_loss": -26.47857093811035, "global_step": 369908, "epoch": 4456} {"train_loss": -26.276752471923828, "global_step": 369909, "epoch": 4456} {"train_loss": -26.39013671875, "global_step": 369910, "epoch": 4456} {"train_loss": -26.684314727783203, "global_step": 369911, "epoch": 4456} {"train_loss": -26.4325008392334, "global_step": 369912, "epoch": 4456} {"train_loss": -26.66813087463379, "global_step": 369913, "epoch": 4456} {"train_loss": -26.07731056213379, "global_step": 369914, "epoch": 4456} {"train_loss": -26.991724014282227, "global_step": 369915, "epoch": 4456} {"train_loss": -27.052392959594727, "global_step": 369916, "epoch": 4456} {"train_loss": -26.029272079467773, "global_step": 369917, "epoch": 4456} {"train_loss": -26.92121696472168, "global_step": 369918, "epoch": 4456} {"train_loss": -26.45549964904785, "global_step": 369919, "epoch": 4456} {"train_loss": -25.91092300415039, "global_step": 369920, "epoch": 4456} {"train_loss": -26.37257194519043, "global_step": 369921, "epoch": 4456} {"train_loss": -26.632617950439453, "global_step": 369922, "epoch": 4456} {"train_loss": -26.233877182006836, "global_step": 369923, "epoch": 4456} {"train_loss": -26.386676788330078, "global_step": 369924, "epoch": 4456} {"train_loss": -26.10639762878418, "global_step": 369925, "epoch": 4456} {"train_loss": -26.15542984008789, "global_step": 369926, "epoch": 4456} {"train_loss": -26.322080612182617, "global_step": 369927, "epoch": 4456} {"train_loss": -26.52544593811035, "global_step": 369928, "epoch": 4456} {"train_loss": -26.304141998291016, "global_step": 369929, "epoch": 4456} {"train_loss": -26.045563157782496, "global_step": 369930, "epoch": 4456, "val_loss": 6685071.5} {"train_loss": -25.78523063659668, "global_step": 369931, "epoch": 4457} {"train_loss": -25.570810317993164, "global_step": 369932, "epoch": 4457} {"train_loss": -24.68284034729004, "global_step": 369933, "epoch": 4457} {"train_loss": -25.0747013092041, "global_step": 369934, "epoch": 4457} {"train_loss": -25.439701080322266, "global_step": 369935, "epoch": 4457} {"train_loss": -25.84808921813965, "global_step": 369936, "epoch": 4457} {"train_loss": -26.008371353149414, "global_step": 369937, "epoch": 4457} {"train_loss": -25.694021224975586, "global_step": 369938, "epoch": 4457} {"train_loss": -25.661762237548828, "global_step": 369939, "epoch": 4457} {"train_loss": -25.959430694580078, "global_step": 369940, "epoch": 4457} {"train_loss": -25.961536407470703, "global_step": 369941, "epoch": 4457} {"train_loss": -26.428571701049805, "global_step": 369942, "epoch": 4457} {"train_loss": -26.076902389526367, "global_step": 369943, "epoch": 4457} {"train_loss": -25.889846801757812, "global_step": 369944, "epoch": 4457} {"train_loss": -26.25074577331543, "global_step": 369945, "epoch": 4457} {"train_loss": -25.868661880493164, "global_step": 369946, "epoch": 4457} {"train_loss": -26.214218139648438, "global_step": 369947, "epoch": 4457} {"train_loss": -25.765491485595703, "global_step": 369948, "epoch": 4457} {"train_loss": -26.549957275390625, "global_step": 369949, "epoch": 4457} {"train_loss": -26.023040771484375, "global_step": 369950, "epoch": 4457} {"train_loss": -26.02326774597168, "global_step": 369951, "epoch": 4457} {"train_loss": -26.053186416625977, "global_step": 369952, "epoch": 4457} {"train_loss": -26.1261043548584, "global_step": 369953, "epoch": 4457} {"train_loss": -26.154809951782227, "global_step": 369954, "epoch": 4457} {"train_loss": -26.094268798828125, "global_step": 369955, "epoch": 4457} {"train_loss": -26.110498428344727, "global_step": 369956, "epoch": 4457} {"train_loss": -26.20869255065918, "global_step": 369957, "epoch": 4457} {"train_loss": -26.547718048095703, "global_step": 369958, "epoch": 4457} {"train_loss": -26.301904678344727, "global_step": 369959, "epoch": 4457} {"train_loss": -26.511014938354492, "global_step": 369960, "epoch": 4457} {"train_loss": -26.57124137878418, "global_step": 369961, "epoch": 4457} {"train_loss": -26.300582885742188, "global_step": 369962, "epoch": 4457} {"train_loss": -26.306684494018555, "global_step": 369963, "epoch": 4457} {"train_loss": -26.664655685424805, "global_step": 369964, "epoch": 4457} {"train_loss": -26.251361846923828, "global_step": 369965, "epoch": 4457} {"train_loss": -26.354352951049805, "global_step": 369966, "epoch": 4457} {"train_loss": -26.49591636657715, "global_step": 369967, "epoch": 4457} {"train_loss": -26.532567977905273, "global_step": 369968, "epoch": 4457} {"train_loss": -26.269580841064453, "global_step": 369969, "epoch": 4457} {"train_loss": -26.694013595581055, "global_step": 369970, "epoch": 4457} {"train_loss": -26.578521728515625, "global_step": 369971, "epoch": 4457} {"train_loss": -26.3277530670166, "global_step": 369972, "epoch": 4457} {"train_loss": -26.768756866455078, "global_step": 369973, "epoch": 4457} {"train_loss": -26.40125846862793, "global_step": 369974, "epoch": 4457} {"train_loss": -26.460769653320312, "global_step": 369975, "epoch": 4457} {"train_loss": -26.235570907592773, "global_step": 369976, "epoch": 4457} {"train_loss": -26.3789005279541, "global_step": 369977, "epoch": 4457} {"train_loss": -26.586444854736328, "global_step": 369978, "epoch": 4457} {"train_loss": -26.536273956298828, "global_step": 369979, "epoch": 4457} {"train_loss": -26.5024471282959, "global_step": 369980, "epoch": 4457} {"train_loss": -26.4375057220459, "global_step": 369981, "epoch": 4457} {"train_loss": -26.638324737548828, "global_step": 369982, "epoch": 4457} {"train_loss": -26.633203506469727, "global_step": 369983, "epoch": 4457} {"train_loss": -26.216245651245117, "global_step": 369984, "epoch": 4457} {"train_loss": -26.3806095123291, "global_step": 369985, "epoch": 4457} {"train_loss": -26.046619415283203, "global_step": 369986, "epoch": 4457} {"train_loss": -26.274642944335938, "global_step": 369987, "epoch": 4457} {"train_loss": -26.693090438842773, "global_step": 369988, "epoch": 4457} {"train_loss": -26.66461753845215, "global_step": 369989, "epoch": 4457} {"train_loss": -26.564268112182617, "global_step": 369990, "epoch": 4457} {"train_loss": -26.352283477783203, "global_step": 369991, "epoch": 4457} {"train_loss": -26.848569869995117, "global_step": 369992, "epoch": 4457} {"train_loss": -26.57869529724121, "global_step": 369993, "epoch": 4457} {"train_loss": -26.38397789001465, "global_step": 369994, "epoch": 4457} {"train_loss": -26.89374351501465, "global_step": 369995, "epoch": 4457} {"train_loss": -26.89777946472168, "global_step": 369996, "epoch": 4457} {"train_loss": -26.657947540283203, "global_step": 369997, "epoch": 4457} {"train_loss": -26.635089874267578, "global_step": 369998, "epoch": 4457} {"train_loss": -26.38492202758789, "global_step": 369999, "epoch": 4457} {"train_loss": -26.62615966796875, "global_step": 370000, "epoch": 4457} {"train_loss": -26.443714141845703, "global_step": 370001, "epoch": 4457} {"train_loss": -26.60004234313965, "global_step": 370002, "epoch": 4457} {"train_loss": -26.331769943237305, "global_step": 370003, "epoch": 4457} {"train_loss": -26.429462432861328, "global_step": 370004, "epoch": 4457} {"train_loss": -26.491718292236328, "global_step": 370005, "epoch": 4457} {"train_loss": -26.4002628326416, "global_step": 370006, "epoch": 4457} {"train_loss": -26.815570831298828, "global_step": 370007, "epoch": 4457} {"train_loss": -26.343591690063477, "global_step": 370008, "epoch": 4457} {"train_loss": -26.47275733947754, "global_step": 370009, "epoch": 4457} {"train_loss": -26.29339027404785, "global_step": 370010, "epoch": 4457} {"train_loss": -26.7641544342041, "global_step": 370011, "epoch": 4457} {"train_loss": -26.218042373657227, "global_step": 370012, "epoch": 4457} {"train_loss": -26.294385404471893, "global_step": 370013, "epoch": 4457, "val_loss": 6609936.0} {"train_loss": -25.65787696838379, "global_step": 370014, "epoch": 4458} {"train_loss": -25.7781925201416, "global_step": 370015, "epoch": 4458} {"train_loss": -25.406436920166016, "global_step": 370016, "epoch": 4458} {"train_loss": -23.94099235534668, "global_step": 370017, "epoch": 4458} {"train_loss": -24.88098907470703, "global_step": 370018, "epoch": 4458} {"train_loss": -26.11451530456543, "global_step": 370019, "epoch": 4458} {"train_loss": -25.66871452331543, "global_step": 370020, "epoch": 4458} {"train_loss": -25.33690643310547, "global_step": 370021, "epoch": 4458} {"train_loss": -26.02705192565918, "global_step": 370022, "epoch": 4458} {"train_loss": -25.669809341430664, "global_step": 370023, "epoch": 4458} {"train_loss": -26.056921005249023, "global_step": 370024, "epoch": 4458} {"train_loss": -26.174652099609375, "global_step": 370025, "epoch": 4458} {"train_loss": -26.3083553314209, "global_step": 370026, "epoch": 4458} {"train_loss": -26.10259437561035, "global_step": 370027, "epoch": 4458} {"train_loss": -26.10687828063965, "global_step": 370028, "epoch": 4458} {"train_loss": -26.232192993164062, "global_step": 370029, "epoch": 4458} {"train_loss": -26.063379287719727, "global_step": 370030, "epoch": 4458} {"train_loss": -25.6640682220459, "global_step": 370031, "epoch": 4458} {"train_loss": -26.192306518554688, "global_step": 370032, "epoch": 4458} {"train_loss": -26.010663986206055, "global_step": 370033, "epoch": 4458} {"train_loss": -26.348621368408203, "global_step": 370034, "epoch": 4458} {"train_loss": -26.099084854125977, "global_step": 370035, "epoch": 4458} {"train_loss": -26.438720703125, "global_step": 370036, "epoch": 4458} {"train_loss": -26.2811336517334, "global_step": 370037, "epoch": 4458} {"train_loss": -26.407835006713867, "global_step": 370038, "epoch": 4458} {"train_loss": -26.438684463500977, "global_step": 370039, "epoch": 4458} {"train_loss": -26.144092559814453, "global_step": 370040, "epoch": 4458} {"train_loss": -26.542499542236328, "global_step": 370041, "epoch": 4458} {"train_loss": -26.51283073425293, "global_step": 370042, "epoch": 4458} {"train_loss": -26.339689254760742, "global_step": 370043, "epoch": 4458} {"train_loss": -26.238571166992188, "global_step": 370044, "epoch": 4458} {"train_loss": -26.508758544921875, "global_step": 370045, "epoch": 4458} {"train_loss": -26.23529052734375, "global_step": 370046, "epoch": 4458} {"train_loss": -26.582239151000977, "global_step": 370047, "epoch": 4458} {"train_loss": -26.654285430908203, "global_step": 370048, "epoch": 4458} {"train_loss": -26.434560775756836, "global_step": 370049, "epoch": 4458} {"train_loss": -26.376489639282227, "global_step": 370050, "epoch": 4458} {"train_loss": -26.531564712524414, "global_step": 370051, "epoch": 4458} {"train_loss": -26.820356369018555, "global_step": 370052, "epoch": 4458} {"train_loss": -26.432538986206055, "global_step": 370053, "epoch": 4458} {"train_loss": -26.432580947875977, "global_step": 370054, "epoch": 4458} {"train_loss": -26.852874755859375, "global_step": 370055, "epoch": 4458} {"train_loss": -26.130125045776367, "global_step": 370056, "epoch": 4458} {"train_loss": -26.386377334594727, "global_step": 370057, "epoch": 4458} {"train_loss": -26.242267608642578, "global_step": 370058, "epoch": 4458} {"train_loss": -26.205835342407227, "global_step": 370059, "epoch": 4458} {"train_loss": -26.37043571472168, "global_step": 370060, "epoch": 4458} {"train_loss": -26.561115264892578, "global_step": 370061, "epoch": 4458} {"train_loss": -26.455549240112305, "global_step": 370062, "epoch": 4458} {"train_loss": -26.653417587280273, "global_step": 370063, "epoch": 4458} {"train_loss": -26.390735626220703, "global_step": 370064, "epoch": 4458} {"train_loss": -26.6295166015625, "global_step": 370065, "epoch": 4458} {"train_loss": -26.6224422454834, "global_step": 370066, "epoch": 4458} {"train_loss": -26.196008682250977, "global_step": 370067, "epoch": 4458} {"train_loss": -25.952756881713867, "global_step": 370068, "epoch": 4458} {"train_loss": -26.493555068969727, "global_step": 370069, "epoch": 4458} {"train_loss": -26.44287109375, "global_step": 370070, "epoch": 4458} {"train_loss": -26.501754760742188, "global_step": 370071, "epoch": 4458} {"train_loss": -26.44276237487793, "global_step": 370072, "epoch": 4458} {"train_loss": -26.24825096130371, "global_step": 370073, "epoch": 4458} {"train_loss": -26.354162216186523, "global_step": 370074, "epoch": 4458} {"train_loss": -26.385339736938477, "global_step": 370075, "epoch": 4458} {"train_loss": -26.534347534179688, "global_step": 370076, "epoch": 4458} {"train_loss": -26.59234046936035, "global_step": 370077, "epoch": 4458} {"train_loss": -26.34769630432129, "global_step": 370078, "epoch": 4458} {"train_loss": -26.23902702331543, "global_step": 370079, "epoch": 4458} {"train_loss": -26.636005401611328, "global_step": 370080, "epoch": 4458} {"train_loss": -26.548511505126953, "global_step": 370081, "epoch": 4458} {"train_loss": -26.397720336914062, "global_step": 370082, "epoch": 4458} {"train_loss": -26.471729278564453, "global_step": 370083, "epoch": 4458} {"train_loss": -26.370685577392578, "global_step": 370084, "epoch": 4458} {"train_loss": -26.573169708251953, "global_step": 370085, "epoch": 4458} {"train_loss": -26.421594619750977, "global_step": 370086, "epoch": 4458} {"train_loss": -26.84161376953125, "global_step": 370087, "epoch": 4458} {"train_loss": -26.682147979736328, "global_step": 370088, "epoch": 4458} {"train_loss": -26.695348739624023, "global_step": 370089, "epoch": 4458} {"train_loss": -27.040180206298828, "global_step": 370090, "epoch": 4458} {"train_loss": -26.508869171142578, "global_step": 370091, "epoch": 4458} {"train_loss": -26.55875015258789, "global_step": 370092, "epoch": 4458} {"train_loss": -26.443714141845703, "global_step": 370093, "epoch": 4458} {"train_loss": -26.651803970336914, "global_step": 370094, "epoch": 4458} {"train_loss": -26.63022804260254, "global_step": 370095, "epoch": 4458} {"train_loss": -26.296051002410522, "global_step": 370096, "epoch": 4458, "val_loss": 6595707.0} {"train_loss": -26.406469345092773, "global_step": 370097, "epoch": 4459} {"train_loss": -25.621612548828125, "global_step": 370098, "epoch": 4459} {"train_loss": -25.582979202270508, "global_step": 370099, "epoch": 4459} {"train_loss": -25.340965270996094, "global_step": 370100, "epoch": 4459} {"train_loss": -23.685836791992188, "global_step": 370101, "epoch": 4459} {"train_loss": -23.640195846557617, "global_step": 370102, "epoch": 4459} {"train_loss": -24.897846221923828, "global_step": 370103, "epoch": 4459} {"train_loss": -25.278165817260742, "global_step": 370104, "epoch": 4459} {"train_loss": -23.671649932861328, "global_step": 370105, "epoch": 4459} {"train_loss": -25.409231185913086, "global_step": 370106, "epoch": 4459} {"train_loss": -25.0682430267334, "global_step": 370107, "epoch": 4459} {"train_loss": -25.961471557617188, "global_step": 370108, "epoch": 4459} {"train_loss": -24.608457565307617, "global_step": 370109, "epoch": 4459} {"train_loss": -25.36528968811035, "global_step": 370110, "epoch": 4459} {"train_loss": -25.383014678955078, "global_step": 370111, "epoch": 4459} {"train_loss": -25.8236026763916, "global_step": 370112, "epoch": 4459} {"train_loss": -25.20881462097168, "global_step": 370113, "epoch": 4459} {"train_loss": -25.682662963867188, "global_step": 370114, "epoch": 4459} {"train_loss": -25.85433006286621, "global_step": 370115, "epoch": 4459} {"train_loss": -25.365047454833984, "global_step": 370116, "epoch": 4459} {"train_loss": -25.682754516601562, "global_step": 370117, "epoch": 4459} {"train_loss": -25.61468505859375, "global_step": 370118, "epoch": 4459} {"train_loss": -25.904937744140625, "global_step": 370119, "epoch": 4459} {"train_loss": -26.239730834960938, "global_step": 370120, "epoch": 4459} {"train_loss": -26.020353317260742, "global_step": 370121, "epoch": 4459} {"train_loss": -25.58406639099121, "global_step": 370122, "epoch": 4459} {"train_loss": -25.99799919128418, "global_step": 370123, "epoch": 4459} {"train_loss": -25.50211524963379, "global_step": 370124, "epoch": 4459} {"train_loss": -25.710250854492188, "global_step": 370125, "epoch": 4459} {"train_loss": -26.221948623657227, "global_step": 370126, "epoch": 4459} {"train_loss": -25.97614097595215, "global_step": 370127, "epoch": 4459} {"train_loss": -26.05604362487793, "global_step": 370128, "epoch": 4459} {"train_loss": -26.052459716796875, "global_step": 370129, "epoch": 4459} {"train_loss": -26.135839462280273, "global_step": 370130, "epoch": 4459} {"train_loss": -25.638280868530273, "global_step": 370131, "epoch": 4459} {"train_loss": -26.051599502563477, "global_step": 370132, "epoch": 4459} {"train_loss": -26.34626579284668, "global_step": 370133, "epoch": 4459} {"train_loss": -26.03407096862793, "global_step": 370134, "epoch": 4459} {"train_loss": -26.11494255065918, "global_step": 370135, "epoch": 4459} {"train_loss": -26.2244815826416, "global_step": 370136, "epoch": 4459} {"train_loss": -26.306379318237305, "global_step": 370137, "epoch": 4459} {"train_loss": -26.5820369720459, "global_step": 370138, "epoch": 4459} {"train_loss": -26.38319206237793, "global_step": 370139, "epoch": 4459} {"train_loss": -26.349939346313477, "global_step": 370140, "epoch": 4459} {"train_loss": -26.4789981842041, "global_step": 370141, "epoch": 4459} {"train_loss": -26.026123046875, "global_step": 370142, "epoch": 4459} {"train_loss": -26.42018699645996, "global_step": 370143, "epoch": 4459} {"train_loss": -26.200489044189453, "global_step": 370144, "epoch": 4459} {"train_loss": -26.597543716430664, "global_step": 370145, "epoch": 4459} {"train_loss": -26.247262954711914, "global_step": 370146, "epoch": 4459} {"train_loss": -26.41908073425293, "global_step": 370147, "epoch": 4459} {"train_loss": -26.386808395385742, "global_step": 370148, "epoch": 4459} {"train_loss": -26.052228927612305, "global_step": 370149, "epoch": 4459} {"train_loss": -26.447967529296875, "global_step": 370150, "epoch": 4459} {"train_loss": -26.472644805908203, "global_step": 370151, "epoch": 4459} {"train_loss": -26.44303321838379, "global_step": 370152, "epoch": 4459} {"train_loss": -26.1653995513916, "global_step": 370153, "epoch": 4459} {"train_loss": -26.66969871520996, "global_step": 370154, "epoch": 4459} {"train_loss": -26.422046661376953, "global_step": 370155, "epoch": 4459} {"train_loss": -26.100814819335938, "global_step": 370156, "epoch": 4459} {"train_loss": -26.746076583862305, "global_step": 370157, "epoch": 4459} {"train_loss": -26.309385299682617, "global_step": 370158, "epoch": 4459} {"train_loss": -26.91458511352539, "global_step": 370159, "epoch": 4459} {"train_loss": -26.741830825805664, "global_step": 370160, "epoch": 4459} {"train_loss": -26.355499267578125, "global_step": 370161, "epoch": 4459} {"train_loss": -26.457874298095703, "global_step": 370162, "epoch": 4459} {"train_loss": -26.14288902282715, "global_step": 370163, "epoch": 4459} {"train_loss": -26.7371826171875, "global_step": 370164, "epoch": 4459} {"train_loss": -26.175500869750977, "global_step": 370165, "epoch": 4459} {"train_loss": -26.94942283630371, "global_step": 370166, "epoch": 4459} {"train_loss": -26.236738204956055, "global_step": 370167, "epoch": 4459} {"train_loss": -26.578968048095703, "global_step": 370168, "epoch": 4459} {"train_loss": -26.1480655670166, "global_step": 370169, "epoch": 4459} {"train_loss": -26.26191520690918, "global_step": 370170, "epoch": 4459} {"train_loss": -26.37118911743164, "global_step": 370171, "epoch": 4459} {"train_loss": -26.440759658813477, "global_step": 370172, "epoch": 4459} {"train_loss": -26.178821563720703, "global_step": 370173, "epoch": 4459} {"train_loss": -26.334857940673828, "global_step": 370174, "epoch": 4459} {"train_loss": -26.306509017944336, "global_step": 370175, "epoch": 4459} {"train_loss": -26.50824546813965, "global_step": 370176, "epoch": 4459} {"train_loss": -26.7119197845459, "global_step": 370177, "epoch": 4459} {"train_loss": -25.742523193359375, "global_step": 370178, "epoch": 4459} {"train_loss": -25.98812055013266, "global_step": 370179, "epoch": 4459, "val_loss": 6544282.5} {"train_loss": -25.835437774658203, "global_step": 370180, "epoch": 4460} {"train_loss": -25.987924575805664, "global_step": 370181, "epoch": 4460} {"train_loss": -26.095077514648438, "global_step": 370182, "epoch": 4460} {"train_loss": -26.03801918029785, "global_step": 370183, "epoch": 4460} {"train_loss": -25.90357780456543, "global_step": 370184, "epoch": 4460} {"train_loss": -26.074600219726562, "global_step": 370185, "epoch": 4460} {"train_loss": -26.266921997070312, "global_step": 370186, "epoch": 4460} {"train_loss": -26.252262115478516, "global_step": 370187, "epoch": 4460} {"train_loss": -25.871784210205078, "global_step": 370188, "epoch": 4460} {"train_loss": -25.655988693237305, "global_step": 370189, "epoch": 4460} {"train_loss": -26.137638092041016, "global_step": 370190, "epoch": 4460} {"train_loss": -25.870349884033203, "global_step": 370191, "epoch": 4460} {"train_loss": -25.787521362304688, "global_step": 370192, "epoch": 4460} {"train_loss": -26.19708251953125, "global_step": 370193, "epoch": 4460} {"train_loss": -26.20745849609375, "global_step": 370194, "epoch": 4460} {"train_loss": -26.2855281829834, "global_step": 370195, "epoch": 4460} {"train_loss": -26.077228546142578, "global_step": 370196, "epoch": 4460} {"train_loss": -26.16908836364746, "global_step": 370197, "epoch": 4460} {"train_loss": -25.844030380249023, "global_step": 370198, "epoch": 4460} {"train_loss": -26.37464714050293, "global_step": 370199, "epoch": 4460} {"train_loss": -26.410932540893555, "global_step": 370200, "epoch": 4460} {"train_loss": -26.579742431640625, "global_step": 370201, "epoch": 4460} {"train_loss": -26.1106014251709, "global_step": 370202, "epoch": 4460} {"train_loss": -26.68708610534668, "global_step": 370203, "epoch": 4460} {"train_loss": -25.9547061920166, "global_step": 370204, "epoch": 4460} {"train_loss": -26.1652774810791, "global_step": 370205, "epoch": 4460} {"train_loss": -26.31524658203125, "global_step": 370206, "epoch": 4460} {"train_loss": -26.33544921875, "global_step": 370207, "epoch": 4460} {"train_loss": -26.55575942993164, "global_step": 370208, "epoch": 4460} {"train_loss": -26.424560546875, "global_step": 370209, "epoch": 4460} {"train_loss": -26.469003677368164, "global_step": 370210, "epoch": 4460} {"train_loss": -26.267841339111328, "global_step": 370211, "epoch": 4460} {"train_loss": -26.5793399810791, "global_step": 370212, "epoch": 4460} {"train_loss": -26.41693115234375, "global_step": 370213, "epoch": 4460} {"train_loss": -26.603748321533203, "global_step": 370214, "epoch": 4460} {"train_loss": -26.720123291015625, "global_step": 370215, "epoch": 4460} {"train_loss": -26.586318969726562, "global_step": 370216, "epoch": 4460} {"train_loss": -26.468128204345703, "global_step": 370217, "epoch": 4460} {"train_loss": -26.596485137939453, "global_step": 370218, "epoch": 4460} {"train_loss": -26.634164810180664, "global_step": 370219, "epoch": 4460} {"train_loss": -26.995054244995117, "global_step": 370220, "epoch": 4460} {"train_loss": -26.253339767456055, "global_step": 370221, "epoch": 4460} {"train_loss": -26.445220947265625, "global_step": 370222, "epoch": 4460} {"train_loss": -26.850341796875, "global_step": 370223, "epoch": 4460} {"train_loss": -26.4454288482666, "global_step": 370224, "epoch": 4460} {"train_loss": -26.286640167236328, "global_step": 370225, "epoch": 4460} {"train_loss": -26.251239776611328, "global_step": 370226, "epoch": 4460} {"train_loss": -26.205432891845703, "global_step": 370227, "epoch": 4460} {"train_loss": -26.0322265625, "global_step": 370228, "epoch": 4460} {"train_loss": -25.965723037719727, "global_step": 370229, "epoch": 4460} {"train_loss": -25.91633415222168, "global_step": 370230, "epoch": 4460} {"train_loss": -26.20069694519043, "global_step": 370231, "epoch": 4460} {"train_loss": -25.723907470703125, "global_step": 370232, "epoch": 4460} {"train_loss": -26.17466163635254, "global_step": 370233, "epoch": 4460} {"train_loss": -26.55243492126465, "global_step": 370234, "epoch": 4460} {"train_loss": -26.039541244506836, "global_step": 370235, "epoch": 4460} {"train_loss": -25.933185577392578, "global_step": 370236, "epoch": 4460} {"train_loss": -26.257009506225586, "global_step": 370237, "epoch": 4460} {"train_loss": -26.670515060424805, "global_step": 370238, "epoch": 4460} {"train_loss": -26.27667808532715, "global_step": 370239, "epoch": 4460} {"train_loss": -25.754596710205078, "global_step": 370240, "epoch": 4460} {"train_loss": -26.456954956054688, "global_step": 370241, "epoch": 4460} {"train_loss": -26.28750991821289, "global_step": 370242, "epoch": 4460} {"train_loss": -25.703876495361328, "global_step": 370243, "epoch": 4460} {"train_loss": -26.226911544799805, "global_step": 370244, "epoch": 4460} {"train_loss": -26.46357536315918, "global_step": 370245, "epoch": 4460} {"train_loss": -26.206151962280273, "global_step": 370246, "epoch": 4460} {"train_loss": -26.362043380737305, "global_step": 370247, "epoch": 4460} {"train_loss": -26.291723251342773, "global_step": 370248, "epoch": 4460} {"train_loss": -26.194971084594727, "global_step": 370249, "epoch": 4460} {"train_loss": -26.37476921081543, "global_step": 370250, "epoch": 4460} {"train_loss": -25.965368270874023, "global_step": 370251, "epoch": 4460} {"train_loss": -26.431140899658203, "global_step": 370252, "epoch": 4460} {"train_loss": -26.37704849243164, "global_step": 370253, "epoch": 4460} {"train_loss": -26.294336318969727, "global_step": 370254, "epoch": 4460} {"train_loss": -26.853424072265625, "global_step": 370255, "epoch": 4460} {"train_loss": -26.566022872924805, "global_step": 370256, "epoch": 4460} {"train_loss": -26.2766056060791, "global_step": 370257, "epoch": 4460} {"train_loss": -26.11952781677246, "global_step": 370258, "epoch": 4460} {"train_loss": -26.4731502532959, "global_step": 370259, "epoch": 4460} {"train_loss": -26.1874942779541, "global_step": 370260, "epoch": 4460} {"train_loss": -26.430255889892578, "global_step": 370261, "epoch": 4460} {"train_loss": -26.257389987807677, "global_step": 370262, "epoch": 4460, "val_loss": 6671106.0} {"train_loss": -26.355504989624023, "global_step": 370263, "epoch": 4461} {"train_loss": -25.90471839904785, "global_step": 370264, "epoch": 4461} {"train_loss": -26.5880069732666, "global_step": 370265, "epoch": 4461} {"train_loss": -26.540515899658203, "global_step": 370266, "epoch": 4461} {"train_loss": -25.896259307861328, "global_step": 370267, "epoch": 4461} {"train_loss": -26.081073760986328, "global_step": 370268, "epoch": 4461} {"train_loss": -26.283105850219727, "global_step": 370269, "epoch": 4461} {"train_loss": -26.190814971923828, "global_step": 370270, "epoch": 4461} {"train_loss": -26.201004028320312, "global_step": 370271, "epoch": 4461} {"train_loss": -25.57455825805664, "global_step": 370272, "epoch": 4461} {"train_loss": -25.4823055267334, "global_step": 370273, "epoch": 4461} {"train_loss": -26.11635398864746, "global_step": 370274, "epoch": 4461} {"train_loss": -25.740148544311523, "global_step": 370275, "epoch": 4461} {"train_loss": -25.7031307220459, "global_step": 370276, "epoch": 4461} {"train_loss": -25.90349769592285, "global_step": 370277, "epoch": 4461} {"train_loss": -25.62729835510254, "global_step": 370278, "epoch": 4461} {"train_loss": -26.440963745117188, "global_step": 370279, "epoch": 4461} {"train_loss": -25.615814208984375, "global_step": 370280, "epoch": 4461} {"train_loss": -25.592082977294922, "global_step": 370281, "epoch": 4461} {"train_loss": -25.810415267944336, "global_step": 370282, "epoch": 4461} {"train_loss": -25.940073013305664, "global_step": 370283, "epoch": 4461} {"train_loss": -25.969024658203125, "global_step": 370284, "epoch": 4461} {"train_loss": -25.817285537719727, "global_step": 370285, "epoch": 4461} {"train_loss": -26.217071533203125, "global_step": 370286, "epoch": 4461} {"train_loss": -26.050512313842773, "global_step": 370287, "epoch": 4461} {"train_loss": -25.996084213256836, "global_step": 370288, "epoch": 4461} {"train_loss": -26.47308921813965, "global_step": 370289, "epoch": 4461} {"train_loss": -26.196741104125977, "global_step": 370290, "epoch": 4461} {"train_loss": -26.594274520874023, "global_step": 370291, "epoch": 4461} {"train_loss": -25.934463500976562, "global_step": 370292, "epoch": 4461} {"train_loss": -26.51141929626465, "global_step": 370293, "epoch": 4461} {"train_loss": -26.391576766967773, "global_step": 370294, "epoch": 4461} {"train_loss": -26.11333656311035, "global_step": 370295, "epoch": 4461} {"train_loss": -26.419591903686523, "global_step": 370296, "epoch": 4461} {"train_loss": -26.382654190063477, "global_step": 370297, "epoch": 4461} {"train_loss": -26.023452758789062, "global_step": 370298, "epoch": 4461} {"train_loss": -26.23137855529785, "global_step": 370299, "epoch": 4461} {"train_loss": -26.22736167907715, "global_step": 370300, "epoch": 4461} {"train_loss": -26.20846939086914, "global_step": 370301, "epoch": 4461} {"train_loss": -26.30396842956543, "global_step": 370302, "epoch": 4461} {"train_loss": -26.623315811157227, "global_step": 370303, "epoch": 4461} {"train_loss": -26.26392936706543, "global_step": 370304, "epoch": 4461} {"train_loss": -26.443044662475586, "global_step": 370305, "epoch": 4461} {"train_loss": -26.130401611328125, "global_step": 370306, "epoch": 4461} {"train_loss": -26.486215591430664, "global_step": 370307, "epoch": 4461} {"train_loss": -26.19424819946289, "global_step": 370308, "epoch": 4461} {"train_loss": -26.669544219970703, "global_step": 370309, "epoch": 4461} {"train_loss": -26.186609268188477, "global_step": 370310, "epoch": 4461} {"train_loss": -26.526458740234375, "global_step": 370311, "epoch": 4461} {"train_loss": -26.5408935546875, "global_step": 370312, "epoch": 4461} {"train_loss": -26.50116539001465, "global_step": 370313, "epoch": 4461} {"train_loss": -26.48288917541504, "global_step": 370314, "epoch": 4461} {"train_loss": -26.41033363342285, "global_step": 370315, "epoch": 4461} {"train_loss": -26.466825485229492, "global_step": 370316, "epoch": 4461} {"train_loss": -26.414060592651367, "global_step": 370317, "epoch": 4461} {"train_loss": -26.304691314697266, "global_step": 370318, "epoch": 4461} {"train_loss": -25.805456161499023, "global_step": 370319, "epoch": 4461} {"train_loss": -26.237768173217773, "global_step": 370320, "epoch": 4461} {"train_loss": -26.2491455078125, "global_step": 370321, "epoch": 4461} {"train_loss": -25.90285301208496, "global_step": 370322, "epoch": 4461} {"train_loss": -25.95037269592285, "global_step": 370323, "epoch": 4461} {"train_loss": -26.493366241455078, "global_step": 370324, "epoch": 4461} {"train_loss": -26.5592041015625, "global_step": 370325, "epoch": 4461} {"train_loss": -26.09697914123535, "global_step": 370326, "epoch": 4461} {"train_loss": -25.6865177154541, "global_step": 370327, "epoch": 4461} {"train_loss": -26.35065269470215, "global_step": 370328, "epoch": 4461} {"train_loss": -26.38507080078125, "global_step": 370329, "epoch": 4461} {"train_loss": -26.58802604675293, "global_step": 370330, "epoch": 4461} {"train_loss": -26.30707359313965, "global_step": 370331, "epoch": 4461} {"train_loss": -26.0655574798584, "global_step": 370332, "epoch": 4461} {"train_loss": -26.607053756713867, "global_step": 370333, "epoch": 4461} {"train_loss": -26.743133544921875, "global_step": 370334, "epoch": 4461} {"train_loss": -26.037267684936523, "global_step": 370335, "epoch": 4461} {"train_loss": -26.058761596679688, "global_step": 370336, "epoch": 4461} {"train_loss": -26.45940589904785, "global_step": 370337, "epoch": 4461} {"train_loss": -26.561063766479492, "global_step": 370338, "epoch": 4461} {"train_loss": -26.485944747924805, "global_step": 370339, "epoch": 4461} {"train_loss": -26.53934097290039, "global_step": 370340, "epoch": 4461} {"train_loss": -26.498632431030273, "global_step": 370341, "epoch": 4461} {"train_loss": -26.87918472290039, "global_step": 370342, "epoch": 4461} {"train_loss": -26.414356231689453, "global_step": 370343, "epoch": 4461} {"train_loss": -26.6253604888916, "global_step": 370344, "epoch": 4461} {"train_loss": -26.24416689125888, "global_step": 370345, "epoch": 4461, "val_loss": 6617905.0} {"train_loss": -26.02347183227539, "global_step": 370346, "epoch": 4462} {"train_loss": -25.652196884155273, "global_step": 370347, "epoch": 4462} {"train_loss": -25.915929794311523, "global_step": 370348, "epoch": 4462} {"train_loss": -26.229284286499023, "global_step": 370349, "epoch": 4462} {"train_loss": -26.04618263244629, "global_step": 370350, "epoch": 4462} {"train_loss": -26.510498046875, "global_step": 370351, "epoch": 4462} {"train_loss": -26.021072387695312, "global_step": 370352, "epoch": 4462} {"train_loss": -26.217924118041992, "global_step": 370353, "epoch": 4462} {"train_loss": -26.80231285095215, "global_step": 370354, "epoch": 4462} {"train_loss": -26.026697158813477, "global_step": 370355, "epoch": 4462} {"train_loss": -26.318878173828125, "global_step": 370356, "epoch": 4462} {"train_loss": -26.244617462158203, "global_step": 370357, "epoch": 4462} {"train_loss": -26.221271514892578, "global_step": 370358, "epoch": 4462} {"train_loss": -25.932952880859375, "global_step": 370359, "epoch": 4462} {"train_loss": -26.293304443359375, "global_step": 370360, "epoch": 4462} {"train_loss": -26.333097457885742, "global_step": 370361, "epoch": 4462} {"train_loss": -26.304624557495117, "global_step": 370362, "epoch": 4462} {"train_loss": -26.082799911499023, "global_step": 370363, "epoch": 4462} {"train_loss": -25.939151763916016, "global_step": 370364, "epoch": 4462} {"train_loss": -26.141433715820312, "global_step": 370365, "epoch": 4462} {"train_loss": -26.078702926635742, "global_step": 370366, "epoch": 4462} {"train_loss": -26.4835147857666, "global_step": 370367, "epoch": 4462} {"train_loss": -26.443485260009766, "global_step": 370368, "epoch": 4462} {"train_loss": -26.401596069335938, "global_step": 370369, "epoch": 4462} {"train_loss": -26.367841720581055, "global_step": 370370, "epoch": 4462} {"train_loss": -26.276391983032227, "global_step": 370371, "epoch": 4462} {"train_loss": -26.1940860748291, "global_step": 370372, "epoch": 4462} {"train_loss": -26.71904945373535, "global_step": 370373, "epoch": 4462} {"train_loss": -26.06537437438965, "global_step": 370374, "epoch": 4462} {"train_loss": -26.324752807617188, "global_step": 370375, "epoch": 4462} {"train_loss": -26.086048126220703, "global_step": 370376, "epoch": 4462} {"train_loss": -26.3697566986084, "global_step": 370377, "epoch": 4462} {"train_loss": -26.255399703979492, "global_step": 370378, "epoch": 4462} {"train_loss": -26.3199405670166, "global_step": 370379, "epoch": 4462} {"train_loss": -26.426557540893555, "global_step": 370380, "epoch": 4462} {"train_loss": -26.351003646850586, "global_step": 370381, "epoch": 4462} {"train_loss": -26.167133331298828, "global_step": 370382, "epoch": 4462} {"train_loss": -26.121856689453125, "global_step": 370383, "epoch": 4462} {"train_loss": -26.247568130493164, "global_step": 370384, "epoch": 4462} {"train_loss": -26.23512077331543, "global_step": 370385, "epoch": 4462} {"train_loss": -26.514450073242188, "global_step": 370386, "epoch": 4462} {"train_loss": -26.672948837280273, "global_step": 370387, "epoch": 4462} {"train_loss": -26.59296226501465, "global_step": 370388, "epoch": 4462} {"train_loss": -26.514074325561523, "global_step": 370389, "epoch": 4462} {"train_loss": -26.230493545532227, "global_step": 370390, "epoch": 4462} {"train_loss": -26.448400497436523, "global_step": 370391, "epoch": 4462} {"train_loss": -26.58810806274414, "global_step": 370392, "epoch": 4462} {"train_loss": -26.1827449798584, "global_step": 370393, "epoch": 4462} {"train_loss": -26.384321212768555, "global_step": 370394, "epoch": 4462} {"train_loss": -26.310108184814453, "global_step": 370395, "epoch": 4462} {"train_loss": -26.344327926635742, "global_step": 370396, "epoch": 4462} {"train_loss": -26.479339599609375, "global_step": 370397, "epoch": 4462} {"train_loss": -26.552515029907227, "global_step": 370398, "epoch": 4462} {"train_loss": -26.346099853515625, "global_step": 370399, "epoch": 4462} {"train_loss": -26.601947784423828, "global_step": 370400, "epoch": 4462} {"train_loss": -26.2651309967041, "global_step": 370401, "epoch": 4462} {"train_loss": -26.4199161529541, "global_step": 370402, "epoch": 4462} {"train_loss": -26.45785903930664, "global_step": 370403, "epoch": 4462} {"train_loss": -26.17230796813965, "global_step": 370404, "epoch": 4462} {"train_loss": -26.265417098999023, "global_step": 370405, "epoch": 4462} {"train_loss": -26.475202560424805, "global_step": 370406, "epoch": 4462} {"train_loss": -26.407102584838867, "global_step": 370407, "epoch": 4462} {"train_loss": -26.599699020385742, "global_step": 370408, "epoch": 4462} {"train_loss": -26.70111656188965, "global_step": 370409, "epoch": 4462} {"train_loss": -26.705286026000977, "global_step": 370410, "epoch": 4462} {"train_loss": -26.031269073486328, "global_step": 370411, "epoch": 4462} {"train_loss": -26.70020866394043, "global_step": 370412, "epoch": 4462} {"train_loss": -26.627592086791992, "global_step": 370413, "epoch": 4462} {"train_loss": -26.76852798461914, "global_step": 370414, "epoch": 4462} {"train_loss": -26.66779136657715, "global_step": 370415, "epoch": 4462} {"train_loss": -26.8503360748291, "global_step": 370416, "epoch": 4462} {"train_loss": -26.774118423461914, "global_step": 370417, "epoch": 4462} {"train_loss": -26.330963134765625, "global_step": 370418, "epoch": 4462} {"train_loss": -26.761999130249023, "global_step": 370419, "epoch": 4462} {"train_loss": -26.047607421875, "global_step": 370420, "epoch": 4462} {"train_loss": -26.122318267822266, "global_step": 370421, "epoch": 4462} {"train_loss": -26.58843421936035, "global_step": 370422, "epoch": 4462} {"train_loss": -26.366718292236328, "global_step": 370423, "epoch": 4462} {"train_loss": -26.314783096313477, "global_step": 370424, "epoch": 4462} {"train_loss": -26.599868774414062, "global_step": 370425, "epoch": 4462} {"train_loss": -26.576765060424805, "global_step": 370426, "epoch": 4462} {"train_loss": -26.263097763061523, "global_step": 370427, "epoch": 4462} {"train_loss": -26.348419901836348, "global_step": 370428, "epoch": 4462, "val_loss": 6625971.5} {"train_loss": -25.050575256347656, "global_step": 370429, "epoch": 4463} {"train_loss": -23.152189254760742, "global_step": 370430, "epoch": 4463} {"train_loss": -22.3039493560791, "global_step": 370431, "epoch": 4463} {"train_loss": -24.059864044189453, "global_step": 370432, "epoch": 4463} {"train_loss": -24.643735885620117, "global_step": 370433, "epoch": 4463} {"train_loss": -24.22669219970703, "global_step": 370434, "epoch": 4463} {"train_loss": -24.63242530822754, "global_step": 370435, "epoch": 4463} {"train_loss": -25.151630401611328, "global_step": 370436, "epoch": 4463} {"train_loss": -24.71023941040039, "global_step": 370437, "epoch": 4463} {"train_loss": -25.53668212890625, "global_step": 370438, "epoch": 4463} {"train_loss": -24.512649536132812, "global_step": 370439, "epoch": 4463} {"train_loss": -25.2879581451416, "global_step": 370440, "epoch": 4463} {"train_loss": -25.554595947265625, "global_step": 370441, "epoch": 4463} {"train_loss": -25.079633712768555, "global_step": 370442, "epoch": 4463} {"train_loss": -25.683969497680664, "global_step": 370443, "epoch": 4463} {"train_loss": -25.054508209228516, "global_step": 370444, "epoch": 4463} {"train_loss": -25.247983932495117, "global_step": 370445, "epoch": 4463} {"train_loss": -25.245899200439453, "global_step": 370446, "epoch": 4463} {"train_loss": -25.61785888671875, "global_step": 370447, "epoch": 4463} {"train_loss": -26.006254196166992, "global_step": 370448, "epoch": 4463} {"train_loss": -25.45364761352539, "global_step": 370449, "epoch": 4463} {"train_loss": -25.83796501159668, "global_step": 370450, "epoch": 4463} {"train_loss": -25.911436080932617, "global_step": 370451, "epoch": 4463} {"train_loss": -25.895339965820312, "global_step": 370452, "epoch": 4463} {"train_loss": -25.78896141052246, "global_step": 370453, "epoch": 4463} {"train_loss": -25.66033935546875, "global_step": 370454, "epoch": 4463} {"train_loss": -25.79104995727539, "global_step": 370455, "epoch": 4463} {"train_loss": -25.770124435424805, "global_step": 370456, "epoch": 4463} {"train_loss": -25.794157028198242, "global_step": 370457, "epoch": 4463} {"train_loss": -26.05560874938965, "global_step": 370458, "epoch": 4463} {"train_loss": -25.929914474487305, "global_step": 370459, "epoch": 4463} {"train_loss": -26.465612411499023, "global_step": 370460, "epoch": 4463} {"train_loss": -26.114126205444336, "global_step": 370461, "epoch": 4463} {"train_loss": -26.061359405517578, "global_step": 370462, "epoch": 4463} {"train_loss": -26.225927352905273, "global_step": 370463, "epoch": 4463} {"train_loss": -26.165021896362305, "global_step": 370464, "epoch": 4463} {"train_loss": -26.12066078186035, "global_step": 370465, "epoch": 4463} {"train_loss": -26.204843521118164, "global_step": 370466, "epoch": 4463} {"train_loss": -26.248098373413086, "global_step": 370467, "epoch": 4463} {"train_loss": -26.14994239807129, "global_step": 370468, "epoch": 4463} {"train_loss": -26.531009674072266, "global_step": 370469, "epoch": 4463} {"train_loss": -26.1806640625, "global_step": 370470, "epoch": 4463} {"train_loss": -26.072111129760742, "global_step": 370471, "epoch": 4463} {"train_loss": -26.1632022857666, "global_step": 370472, "epoch": 4463} {"train_loss": -26.094507217407227, "global_step": 370473, "epoch": 4463} {"train_loss": -26.187353134155273, "global_step": 370474, "epoch": 4463} {"train_loss": -26.55373191833496, "global_step": 370475, "epoch": 4463} {"train_loss": -26.336231231689453, "global_step": 370476, "epoch": 4463} {"train_loss": -26.453657150268555, "global_step": 370477, "epoch": 4463} {"train_loss": -26.151243209838867, "global_step": 370478, "epoch": 4463} {"train_loss": -26.224475860595703, "global_step": 370479, "epoch": 4463} {"train_loss": -26.42231559753418, "global_step": 370480, "epoch": 4463} {"train_loss": -26.110883712768555, "global_step": 370481, "epoch": 4463} {"train_loss": -26.25595474243164, "global_step": 370482, "epoch": 4463} {"train_loss": -26.209253311157227, "global_step": 370483, "epoch": 4463} {"train_loss": -26.018796920776367, "global_step": 370484, "epoch": 4463} {"train_loss": -26.326171875, "global_step": 370485, "epoch": 4463} {"train_loss": -26.40675163269043, "global_step": 370486, "epoch": 4463} {"train_loss": -26.330337524414062, "global_step": 370487, "epoch": 4463} {"train_loss": -26.53378677368164, "global_step": 370488, "epoch": 4463} {"train_loss": -26.22417640686035, "global_step": 370489, "epoch": 4463} {"train_loss": -26.366132736206055, "global_step": 370490, "epoch": 4463} {"train_loss": -26.44173240661621, "global_step": 370491, "epoch": 4463} {"train_loss": -26.4354248046875, "global_step": 370492, "epoch": 4463} {"train_loss": -26.12117576599121, "global_step": 370493, "epoch": 4463} {"train_loss": -26.450159072875977, "global_step": 370494, "epoch": 4463} {"train_loss": -26.663496017456055, "global_step": 370495, "epoch": 4463} {"train_loss": -26.294103622436523, "global_step": 370496, "epoch": 4463} {"train_loss": -27.01726722717285, "global_step": 370497, "epoch": 4463} {"train_loss": -26.3773193359375, "global_step": 370498, "epoch": 4463} {"train_loss": -26.7288761138916, "global_step": 370499, "epoch": 4463} {"train_loss": -26.30609130859375, "global_step": 370500, "epoch": 4463} {"train_loss": -26.478759765625, "global_step": 370501, "epoch": 4463} {"train_loss": -26.594778060913086, "global_step": 370502, "epoch": 4463} {"train_loss": -26.812116622924805, "global_step": 370503, "epoch": 4463} {"train_loss": -26.376371383666992, "global_step": 370504, "epoch": 4463} {"train_loss": -26.71588706970215, "global_step": 370505, "epoch": 4463} {"train_loss": -26.690032958984375, "global_step": 370506, "epoch": 4463} {"train_loss": -26.371686935424805, "global_step": 370507, "epoch": 4463} {"train_loss": -26.684722900390625, "global_step": 370508, "epoch": 4463} {"train_loss": -26.46803092956543, "global_step": 370509, "epoch": 4463} {"train_loss": -26.625131607055664, "global_step": 370510, "epoch": 4463} {"train_loss": -25.919279466192407, "global_step": 370511, "epoch": 4463, "val_loss": 6607348.0} {"train_loss": -26.30109977722168, "global_step": 370512, "epoch": 4464} {"train_loss": -25.669910430908203, "global_step": 370513, "epoch": 4464} {"train_loss": -25.929122924804688, "global_step": 370514, "epoch": 4464} {"train_loss": -26.066434860229492, "global_step": 370515, "epoch": 4464} {"train_loss": -25.967145919799805, "global_step": 370516, "epoch": 4464} {"train_loss": -26.113941192626953, "global_step": 370517, "epoch": 4464} {"train_loss": -26.135095596313477, "global_step": 370518, "epoch": 4464} {"train_loss": -26.131427764892578, "global_step": 370519, "epoch": 4464} {"train_loss": -26.016952514648438, "global_step": 370520, "epoch": 4464} {"train_loss": -26.083349227905273, "global_step": 370521, "epoch": 4464} {"train_loss": -26.26956558227539, "global_step": 370522, "epoch": 4464} {"train_loss": -26.210742950439453, "global_step": 370523, "epoch": 4464} {"train_loss": -25.843826293945312, "global_step": 370524, "epoch": 4464} {"train_loss": -25.96278190612793, "global_step": 370525, "epoch": 4464} {"train_loss": -26.162973403930664, "global_step": 370526, "epoch": 4464} {"train_loss": -26.443952560424805, "global_step": 370527, "epoch": 4464} {"train_loss": -26.279281616210938, "global_step": 370528, "epoch": 4464} {"train_loss": -26.105487823486328, "global_step": 370529, "epoch": 4464} {"train_loss": -26.394742965698242, "global_step": 370530, "epoch": 4464} {"train_loss": -26.11631202697754, "global_step": 370531, "epoch": 4464} {"train_loss": -26.17398452758789, "global_step": 370532, "epoch": 4464} {"train_loss": -26.191146850585938, "global_step": 370533, "epoch": 4464} {"train_loss": -26.084558486938477, "global_step": 370534, "epoch": 4464} {"train_loss": -26.492603302001953, "global_step": 370535, "epoch": 4464} {"train_loss": -26.503955841064453, "global_step": 370536, "epoch": 4464} {"train_loss": -26.328351974487305, "global_step": 370537, "epoch": 4464} {"train_loss": -26.396642684936523, "global_step": 370538, "epoch": 4464} {"train_loss": -26.51799964904785, "global_step": 370539, "epoch": 4464} {"train_loss": -26.57979393005371, "global_step": 370540, "epoch": 4464} {"train_loss": -26.343734741210938, "global_step": 370541, "epoch": 4464} {"train_loss": -26.506549835205078, "global_step": 370542, "epoch": 4464} {"train_loss": -26.2504940032959, "global_step": 370543, "epoch": 4464} {"train_loss": -26.26325798034668, "global_step": 370544, "epoch": 4464} {"train_loss": -26.115217208862305, "global_step": 370545, "epoch": 4464} {"train_loss": -25.918359756469727, "global_step": 370546, "epoch": 4464} {"train_loss": -26.837177276611328, "global_step": 370547, "epoch": 4464} {"train_loss": -26.593759536743164, "global_step": 370548, "epoch": 4464} {"train_loss": -26.05838394165039, "global_step": 370549, "epoch": 4464} {"train_loss": -26.408700942993164, "global_step": 370550, "epoch": 4464} {"train_loss": -26.19940757751465, "global_step": 370551, "epoch": 4464} {"train_loss": -26.496763229370117, "global_step": 370552, "epoch": 4464} {"train_loss": -26.45489501953125, "global_step": 370553, "epoch": 4464} {"train_loss": -26.324695587158203, "global_step": 370554, "epoch": 4464} {"train_loss": -26.403339385986328, "global_step": 370555, "epoch": 4464} {"train_loss": -26.5845947265625, "global_step": 370556, "epoch": 4464} {"train_loss": -26.24212646484375, "global_step": 370557, "epoch": 4464} {"train_loss": -26.550439834594727, "global_step": 370558, "epoch": 4464} {"train_loss": -26.58540916442871, "global_step": 370559, "epoch": 4464} {"train_loss": -26.33064079284668, "global_step": 370560, "epoch": 4464} {"train_loss": -26.41655921936035, "global_step": 370561, "epoch": 4464} {"train_loss": -26.574207305908203, "global_step": 370562, "epoch": 4464} {"train_loss": -26.32337760925293, "global_step": 370563, "epoch": 4464} {"train_loss": -26.530914306640625, "global_step": 370564, "epoch": 4464} {"train_loss": -26.468402862548828, "global_step": 370565, "epoch": 4464} {"train_loss": -26.189319610595703, "global_step": 370566, "epoch": 4464} {"train_loss": -26.67463493347168, "global_step": 370567, "epoch": 4464} {"train_loss": -26.453413009643555, "global_step": 370568, "epoch": 4464} {"train_loss": -26.4389705657959, "global_step": 370569, "epoch": 4464} {"train_loss": -26.235681533813477, "global_step": 370570, "epoch": 4464} {"train_loss": -26.163190841674805, "global_step": 370571, "epoch": 4464} {"train_loss": -26.504846572875977, "global_step": 370572, "epoch": 4464} {"train_loss": -26.404150009155273, "global_step": 370573, "epoch": 4464} {"train_loss": -26.17127799987793, "global_step": 370574, "epoch": 4464} {"train_loss": -26.275537490844727, "global_step": 370575, "epoch": 4464} {"train_loss": -26.2569522857666, "global_step": 370576, "epoch": 4464} {"train_loss": -25.925073623657227, "global_step": 370577, "epoch": 4464} {"train_loss": -26.64237403869629, "global_step": 370578, "epoch": 4464} {"train_loss": -26.41788673400879, "global_step": 370579, "epoch": 4464} {"train_loss": -26.395715713500977, "global_step": 370580, "epoch": 4464} {"train_loss": -26.29441261291504, "global_step": 370581, "epoch": 4464} {"train_loss": -26.412384033203125, "global_step": 370582, "epoch": 4464} {"train_loss": -26.609479904174805, "global_step": 370583, "epoch": 4464} {"train_loss": -26.393598556518555, "global_step": 370584, "epoch": 4464} {"train_loss": -26.507038116455078, "global_step": 370585, "epoch": 4464} {"train_loss": -26.604450225830078, "global_step": 370586, "epoch": 4464} {"train_loss": -26.5915584564209, "global_step": 370587, "epoch": 4464} {"train_loss": -26.467023849487305, "global_step": 370588, "epoch": 4464} {"train_loss": -26.46649169921875, "global_step": 370589, "epoch": 4464} {"train_loss": -26.35160255432129, "global_step": 370590, "epoch": 4464} {"train_loss": -26.224714279174805, "global_step": 370591, "epoch": 4464} {"train_loss": -26.51022720336914, "global_step": 370592, "epoch": 4464} {"train_loss": -26.891834259033203, "global_step": 370593, "epoch": 4464} {"train_loss": -26.33839988708496, "global_step": 370594, "epoch": 4464, "val_loss": 6704369.0} {"train_loss": -26.27178955078125, "global_step": 370595, "epoch": 4465} {"train_loss": -26.01190757751465, "global_step": 370596, "epoch": 4465} {"train_loss": -25.801584243774414, "global_step": 370597, "epoch": 4465} {"train_loss": -25.6417236328125, "global_step": 370598, "epoch": 4465} {"train_loss": -25.826404571533203, "global_step": 370599, "epoch": 4465} {"train_loss": -25.667438507080078, "global_step": 370600, "epoch": 4465} {"train_loss": -26.170883178710938, "global_step": 370601, "epoch": 4465} {"train_loss": -26.049039840698242, "global_step": 370602, "epoch": 4465} {"train_loss": -26.018896102905273, "global_step": 370603, "epoch": 4465} {"train_loss": -25.91766357421875, "global_step": 370604, "epoch": 4465} {"train_loss": -25.948827743530273, "global_step": 370605, "epoch": 4465} {"train_loss": -26.199554443359375, "global_step": 370606, "epoch": 4465} {"train_loss": -25.99505043029785, "global_step": 370607, "epoch": 4465} {"train_loss": -26.135358810424805, "global_step": 370608, "epoch": 4465} {"train_loss": -26.1025390625, "global_step": 370609, "epoch": 4465} {"train_loss": -26.131641387939453, "global_step": 370610, "epoch": 4465} {"train_loss": -26.483631134033203, "global_step": 370611, "epoch": 4465} {"train_loss": -26.3789119720459, "global_step": 370612, "epoch": 4465} {"train_loss": -26.401330947875977, "global_step": 370613, "epoch": 4465} {"train_loss": -26.119165420532227, "global_step": 370614, "epoch": 4465} {"train_loss": -26.464284896850586, "global_step": 370615, "epoch": 4465} {"train_loss": -26.61408042907715, "global_step": 370616, "epoch": 4465} {"train_loss": -26.52638053894043, "global_step": 370617, "epoch": 4465} {"train_loss": -26.242231369018555, "global_step": 370618, "epoch": 4465} {"train_loss": -26.34592056274414, "global_step": 370619, "epoch": 4465} {"train_loss": -26.684030532836914, "global_step": 370620, "epoch": 4465} {"train_loss": -26.225635528564453, "global_step": 370621, "epoch": 4465} {"train_loss": -26.226911544799805, "global_step": 370622, "epoch": 4465} {"train_loss": -26.252126693725586, "global_step": 370623, "epoch": 4465} {"train_loss": -25.76980972290039, "global_step": 370624, "epoch": 4465} {"train_loss": -26.0617733001709, "global_step": 370625, "epoch": 4465} {"train_loss": -26.661893844604492, "global_step": 370626, "epoch": 4465} {"train_loss": -26.698389053344727, "global_step": 370627, "epoch": 4465} {"train_loss": -26.024932861328125, "global_step": 370628, "epoch": 4465} {"train_loss": -26.023344039916992, "global_step": 370629, "epoch": 4465} {"train_loss": -26.463821411132812, "global_step": 370630, "epoch": 4465} {"train_loss": -26.5086612701416, "global_step": 370631, "epoch": 4465} {"train_loss": -26.54718017578125, "global_step": 370632, "epoch": 4465} {"train_loss": -26.2510986328125, "global_step": 370633, "epoch": 4465} {"train_loss": -26.496435165405273, "global_step": 370634, "epoch": 4465} {"train_loss": -26.65730094909668, "global_step": 370635, "epoch": 4465} {"train_loss": -26.194976806640625, "global_step": 370636, "epoch": 4465} {"train_loss": -26.434814453125, "global_step": 370637, "epoch": 4465} {"train_loss": -26.65625, "global_step": 370638, "epoch": 4465} {"train_loss": -26.44569206237793, "global_step": 370639, "epoch": 4465} {"train_loss": -26.553607940673828, "global_step": 370640, "epoch": 4465} {"train_loss": -26.367605209350586, "global_step": 370641, "epoch": 4465} {"train_loss": -26.44329261779785, "global_step": 370642, "epoch": 4465} {"train_loss": -26.425128936767578, "global_step": 370643, "epoch": 4465} {"train_loss": -26.2405948638916, "global_step": 370644, "epoch": 4465} {"train_loss": -26.731403350830078, "global_step": 370645, "epoch": 4465} {"train_loss": -26.501667022705078, "global_step": 370646, "epoch": 4465} {"train_loss": -26.418201446533203, "global_step": 370647, "epoch": 4465} {"train_loss": -26.561450958251953, "global_step": 370648, "epoch": 4465} {"train_loss": -26.487375259399414, "global_step": 370649, "epoch": 4465} {"train_loss": -26.385427474975586, "global_step": 370650, "epoch": 4465} {"train_loss": -26.40201187133789, "global_step": 370651, "epoch": 4465} {"train_loss": -26.5341854095459, "global_step": 370652, "epoch": 4465} {"train_loss": -26.788862228393555, "global_step": 370653, "epoch": 4465} {"train_loss": -26.294437408447266, "global_step": 370654, "epoch": 4465} {"train_loss": -26.688444137573242, "global_step": 370655, "epoch": 4465} {"train_loss": -26.662687301635742, "global_step": 370656, "epoch": 4465} {"train_loss": -26.64326286315918, "global_step": 370657, "epoch": 4465} {"train_loss": -26.943288803100586, "global_step": 370658, "epoch": 4465} {"train_loss": -26.58734130859375, "global_step": 370659, "epoch": 4465} {"train_loss": -26.426273345947266, "global_step": 370660, "epoch": 4465} {"train_loss": -26.714628219604492, "global_step": 370661, "epoch": 4465} {"train_loss": -26.862646102905273, "global_step": 370662, "epoch": 4465} {"train_loss": -26.58589744567871, "global_step": 370663, "epoch": 4465} {"train_loss": -26.32730484008789, "global_step": 370664, "epoch": 4465} {"train_loss": -26.306427001953125, "global_step": 370665, "epoch": 4465} {"train_loss": -26.11944580078125, "global_step": 370666, "epoch": 4465} {"train_loss": -26.001911163330078, "global_step": 370667, "epoch": 4465} {"train_loss": -26.059675216674805, "global_step": 370668, "epoch": 4465} {"train_loss": -26.66043472290039, "global_step": 370669, "epoch": 4465} {"train_loss": -26.33123779296875, "global_step": 370670, "epoch": 4465} {"train_loss": -25.833404541015625, "global_step": 370671, "epoch": 4465} {"train_loss": -26.4783992767334, "global_step": 370672, "epoch": 4465} {"train_loss": -26.22024917602539, "global_step": 370673, "epoch": 4465} {"train_loss": -26.239892959594727, "global_step": 370674, "epoch": 4465} {"train_loss": -26.529592514038086, "global_step": 370675, "epoch": 4465} {"train_loss": -26.50837516784668, "global_step": 370676, "epoch": 4465} {"train_loss": -26.327494311045452, "global_step": 370677, "epoch": 4465, "val_loss": 6631543.5} {"train_loss": -26.120193481445312, "global_step": 370678, "epoch": 4466} {"train_loss": -25.822240829467773, "global_step": 370679, "epoch": 4466} {"train_loss": -25.349462509155273, "global_step": 370680, "epoch": 4466} {"train_loss": -25.77544593811035, "global_step": 370681, "epoch": 4466} {"train_loss": -26.075031280517578, "global_step": 370682, "epoch": 4466} {"train_loss": -26.102758407592773, "global_step": 370683, "epoch": 4466} {"train_loss": -26.05549430847168, "global_step": 370684, "epoch": 4466} {"train_loss": -26.1937313079834, "global_step": 370685, "epoch": 4466} {"train_loss": -26.16048240661621, "global_step": 370686, "epoch": 4466} {"train_loss": -25.886566162109375, "global_step": 370687, "epoch": 4466} {"train_loss": -25.8204345703125, "global_step": 370688, "epoch": 4466} {"train_loss": -26.3121280670166, "global_step": 370689, "epoch": 4466} {"train_loss": -25.83416748046875, "global_step": 370690, "epoch": 4466} {"train_loss": -26.280988693237305, "global_step": 370691, "epoch": 4466} {"train_loss": -26.381845474243164, "global_step": 370692, "epoch": 4466} {"train_loss": -26.5443172454834, "global_step": 370693, "epoch": 4466} {"train_loss": -26.246387481689453, "global_step": 370694, "epoch": 4466} {"train_loss": -26.33271598815918, "global_step": 370695, "epoch": 4466} {"train_loss": -26.250110626220703, "global_step": 370696, "epoch": 4466} {"train_loss": -26.459875106811523, "global_step": 370697, "epoch": 4466} {"train_loss": -26.256378173828125, "global_step": 370698, "epoch": 4466} {"train_loss": -26.356611251831055, "global_step": 370699, "epoch": 4466} {"train_loss": -26.376623153686523, "global_step": 370700, "epoch": 4466} {"train_loss": -26.35468101501465, "global_step": 370701, "epoch": 4466} {"train_loss": -26.50733757019043, "global_step": 370702, "epoch": 4466} {"train_loss": -26.16103172302246, "global_step": 370703, "epoch": 4466} {"train_loss": -26.28973388671875, "global_step": 370704, "epoch": 4466} {"train_loss": -26.329984664916992, "global_step": 370705, "epoch": 4466} {"train_loss": -26.38514518737793, "global_step": 370706, "epoch": 4466} {"train_loss": -26.18438720703125, "global_step": 370707, "epoch": 4466} {"train_loss": -26.33401870727539, "global_step": 370708, "epoch": 4466} {"train_loss": -26.598052978515625, "global_step": 370709, "epoch": 4466} {"train_loss": -26.75445556640625, "global_step": 370710, "epoch": 4466} {"train_loss": -26.614904403686523, "global_step": 370711, "epoch": 4466} {"train_loss": -26.815021514892578, "global_step": 370712, "epoch": 4466} {"train_loss": -26.224655151367188, "global_step": 370713, "epoch": 4466} {"train_loss": -26.728586196899414, "global_step": 370714, "epoch": 4466} {"train_loss": -26.853620529174805, "global_step": 370715, "epoch": 4466} {"train_loss": -26.363574981689453, "global_step": 370716, "epoch": 4466} {"train_loss": -26.47641372680664, "global_step": 370717, "epoch": 4466} {"train_loss": -26.719884872436523, "global_step": 370718, "epoch": 4466} {"train_loss": -27.003528594970703, "global_step": 370719, "epoch": 4466} {"train_loss": -26.677576065063477, "global_step": 370720, "epoch": 4466} {"train_loss": -26.811939239501953, "global_step": 370721, "epoch": 4466} {"train_loss": -26.430255889892578, "global_step": 370722, "epoch": 4466} {"train_loss": -26.73612403869629, "global_step": 370723, "epoch": 4466} {"train_loss": -26.525537490844727, "global_step": 370724, "epoch": 4466} {"train_loss": -26.4124755859375, "global_step": 370725, "epoch": 4466} {"train_loss": -26.50226402282715, "global_step": 370726, "epoch": 4466} {"train_loss": -26.472156524658203, "global_step": 370727, "epoch": 4466} {"train_loss": -26.41497230529785, "global_step": 370728, "epoch": 4466} {"train_loss": -26.42103385925293, "global_step": 370729, "epoch": 4466} {"train_loss": -26.83772850036621, "global_step": 370730, "epoch": 4466} {"train_loss": -26.479764938354492, "global_step": 370731, "epoch": 4466} {"train_loss": -26.664724349975586, "global_step": 370732, "epoch": 4466} {"train_loss": -26.33282470703125, "global_step": 370733, "epoch": 4466} {"train_loss": -26.449848175048828, "global_step": 370734, "epoch": 4466} {"train_loss": -26.234100341796875, "global_step": 370735, "epoch": 4466} {"train_loss": -26.2189884185791, "global_step": 370736, "epoch": 4466} {"train_loss": -26.399328231811523, "global_step": 370737, "epoch": 4466} {"train_loss": -26.535541534423828, "global_step": 370738, "epoch": 4466} {"train_loss": -26.36867332458496, "global_step": 370739, "epoch": 4466} {"train_loss": -25.9798641204834, "global_step": 370740, "epoch": 4466} {"train_loss": -26.186065673828125, "global_step": 370741, "epoch": 4466} {"train_loss": -26.119054794311523, "global_step": 370742, "epoch": 4466} {"train_loss": -26.124799728393555, "global_step": 370743, "epoch": 4466} {"train_loss": -26.73158073425293, "global_step": 370744, "epoch": 4466} {"train_loss": -26.36030387878418, "global_step": 370745, "epoch": 4466} {"train_loss": -26.93195152282715, "global_step": 370746, "epoch": 4466} {"train_loss": -26.520904541015625, "global_step": 370747, "epoch": 4466} {"train_loss": -26.05220603942871, "global_step": 370748, "epoch": 4466} {"train_loss": -26.476720809936523, "global_step": 370749, "epoch": 4466} {"train_loss": -26.21954917907715, "global_step": 370750, "epoch": 4466} {"train_loss": -26.3162841796875, "global_step": 370751, "epoch": 4466} {"train_loss": -26.49928092956543, "global_step": 370752, "epoch": 4466} {"train_loss": -25.896787643432617, "global_step": 370753, "epoch": 4466} {"train_loss": -26.409093856811523, "global_step": 370754, "epoch": 4466} {"train_loss": -26.199872970581055, "global_step": 370755, "epoch": 4466} {"train_loss": -26.563817977905273, "global_step": 370756, "epoch": 4466} {"train_loss": -26.42181396484375, "global_step": 370757, "epoch": 4466} {"train_loss": -26.336719512939453, "global_step": 370758, "epoch": 4466} {"train_loss": -26.4420223236084, "global_step": 370759, "epoch": 4466} {"train_loss": -26.378091398491918, "global_step": 370760, "epoch": 4466, "val_loss": 6672936.0} {"train_loss": -25.374155044555664, "global_step": 370761, "epoch": 4467} {"train_loss": -25.52481460571289, "global_step": 370762, "epoch": 4467} {"train_loss": -25.121427536010742, "global_step": 370763, "epoch": 4467} {"train_loss": -25.8541259765625, "global_step": 370764, "epoch": 4467} {"train_loss": -25.76551628112793, "global_step": 370765, "epoch": 4467} {"train_loss": -26.4258975982666, "global_step": 370766, "epoch": 4467} {"train_loss": -25.53614616394043, "global_step": 370767, "epoch": 4467} {"train_loss": -25.847864151000977, "global_step": 370768, "epoch": 4467} {"train_loss": -26.075666427612305, "global_step": 370769, "epoch": 4467} {"train_loss": -26.10662269592285, "global_step": 370770, "epoch": 4467} {"train_loss": -25.65889549255371, "global_step": 370771, "epoch": 4467} {"train_loss": -25.77191734313965, "global_step": 370772, "epoch": 4467} {"train_loss": -26.37952995300293, "global_step": 370773, "epoch": 4467} {"train_loss": -25.841968536376953, "global_step": 370774, "epoch": 4467} {"train_loss": -26.418760299682617, "global_step": 370775, "epoch": 4467} {"train_loss": -26.122100830078125, "global_step": 370776, "epoch": 4467} {"train_loss": -26.114049911499023, "global_step": 370777, "epoch": 4467} {"train_loss": -26.08582878112793, "global_step": 370778, "epoch": 4467} {"train_loss": -26.048627853393555, "global_step": 370779, "epoch": 4467} {"train_loss": -25.95599365234375, "global_step": 370780, "epoch": 4467} {"train_loss": -26.175567626953125, "global_step": 370781, "epoch": 4467} {"train_loss": -26.310134887695312, "global_step": 370782, "epoch": 4467} {"train_loss": -26.040409088134766, "global_step": 370783, "epoch": 4467} {"train_loss": -26.62818717956543, "global_step": 370784, "epoch": 4467} {"train_loss": -26.199329376220703, "global_step": 370785, "epoch": 4467} {"train_loss": -26.04974937438965, "global_step": 370786, "epoch": 4467} {"train_loss": -26.546283721923828, "global_step": 370787, "epoch": 4467} {"train_loss": -26.22730827331543, "global_step": 370788, "epoch": 4467} {"train_loss": -26.544485092163086, "global_step": 370789, "epoch": 4467} {"train_loss": -26.2631778717041, "global_step": 370790, "epoch": 4467} {"train_loss": -26.38319206237793, "global_step": 370791, "epoch": 4467} {"train_loss": -26.339920043945312, "global_step": 370792, "epoch": 4467} {"train_loss": -26.865522384643555, "global_step": 370793, "epoch": 4467} {"train_loss": -26.328033447265625, "global_step": 370794, "epoch": 4467} {"train_loss": -26.412952423095703, "global_step": 370795, "epoch": 4467} {"train_loss": -26.283777236938477, "global_step": 370796, "epoch": 4467} {"train_loss": -26.65810203552246, "global_step": 370797, "epoch": 4467} {"train_loss": -26.669586181640625, "global_step": 370798, "epoch": 4467} {"train_loss": -26.21076774597168, "global_step": 370799, "epoch": 4467} {"train_loss": -26.311756134033203, "global_step": 370800, "epoch": 4467} {"train_loss": -26.58550453186035, "global_step": 370801, "epoch": 4467} {"train_loss": -26.598682403564453, "global_step": 370802, "epoch": 4467} {"train_loss": -26.1982421875, "global_step": 370803, "epoch": 4467} {"train_loss": -26.35174560546875, "global_step": 370804, "epoch": 4467} {"train_loss": -26.40315055847168, "global_step": 370805, "epoch": 4467} {"train_loss": -26.278348922729492, "global_step": 370806, "epoch": 4467} {"train_loss": -26.307697296142578, "global_step": 370807, "epoch": 4467} {"train_loss": -26.45186424255371, "global_step": 370808, "epoch": 4467} {"train_loss": -26.25885581970215, "global_step": 370809, "epoch": 4467} {"train_loss": -26.3030948638916, "global_step": 370810, "epoch": 4467} {"train_loss": -26.427444458007812, "global_step": 370811, "epoch": 4467} {"train_loss": -26.3389949798584, "global_step": 370812, "epoch": 4467} {"train_loss": -26.73647117614746, "global_step": 370813, "epoch": 4467} {"train_loss": -26.436721801757812, "global_step": 370814, "epoch": 4467} {"train_loss": -26.103199005126953, "global_step": 370815, "epoch": 4467} {"train_loss": -26.20650291442871, "global_step": 370816, "epoch": 4467} {"train_loss": -26.400928497314453, "global_step": 370817, "epoch": 4467} {"train_loss": -26.1502685546875, "global_step": 370818, "epoch": 4467} {"train_loss": -26.299530029296875, "global_step": 370819, "epoch": 4467} {"train_loss": -26.48377799987793, "global_step": 370820, "epoch": 4467} {"train_loss": -26.30352783203125, "global_step": 370821, "epoch": 4467} {"train_loss": -26.064804077148438, "global_step": 370822, "epoch": 4467} {"train_loss": -26.47196388244629, "global_step": 370823, "epoch": 4467} {"train_loss": -26.540267944335938, "global_step": 370824, "epoch": 4467} {"train_loss": -26.4227352142334, "global_step": 370825, "epoch": 4467} {"train_loss": -26.6135311126709, "global_step": 370826, "epoch": 4467} {"train_loss": -26.25666618347168, "global_step": 370827, "epoch": 4467} {"train_loss": -26.779743194580078, "global_step": 370828, "epoch": 4467} {"train_loss": -26.43739128112793, "global_step": 370829, "epoch": 4467} {"train_loss": -26.835575103759766, "global_step": 370830, "epoch": 4467} {"train_loss": -26.30354118347168, "global_step": 370831, "epoch": 4467} {"train_loss": -26.370635986328125, "global_step": 370832, "epoch": 4467} {"train_loss": -26.249027252197266, "global_step": 370833, "epoch": 4467} {"train_loss": -26.542285919189453, "global_step": 370834, "epoch": 4467} {"train_loss": -26.20246696472168, "global_step": 370835, "epoch": 4467} {"train_loss": -25.86402702331543, "global_step": 370836, "epoch": 4467} {"train_loss": -26.346616744995117, "global_step": 370837, "epoch": 4467} {"train_loss": -26.146820068359375, "global_step": 370838, "epoch": 4467} {"train_loss": -26.556476593017578, "global_step": 370839, "epoch": 4467} {"train_loss": -26.1303653717041, "global_step": 370840, "epoch": 4467} {"train_loss": -26.313587188720703, "global_step": 370841, "epoch": 4467} {"train_loss": -26.185827255249023, "global_step": 370842, "epoch": 4467} {"train_loss": -26.253352843135236, "global_step": 370843, "epoch": 4467, "val_loss": 6741811.0} {"train_loss": -25.841306686401367, "global_step": 370844, "epoch": 4468} {"train_loss": -25.850452423095703, "global_step": 370845, "epoch": 4468} {"train_loss": -26.26515007019043, "global_step": 370846, "epoch": 4468} {"train_loss": -26.320215225219727, "global_step": 370847, "epoch": 4468} {"train_loss": -26.177335739135742, "global_step": 370848, "epoch": 4468} {"train_loss": -26.067590713500977, "global_step": 370849, "epoch": 4468} {"train_loss": -26.253250122070312, "global_step": 370850, "epoch": 4468} {"train_loss": -26.364240646362305, "global_step": 370851, "epoch": 4468} {"train_loss": -25.93348503112793, "global_step": 370852, "epoch": 4468} {"train_loss": -26.42304039001465, "global_step": 370853, "epoch": 4468} {"train_loss": -25.96564292907715, "global_step": 370854, "epoch": 4468} {"train_loss": -26.41251564025879, "global_step": 370855, "epoch": 4468} {"train_loss": -26.259002685546875, "global_step": 370856, "epoch": 4468} {"train_loss": -26.516677856445312, "global_step": 370857, "epoch": 4468} {"train_loss": -26.4145450592041, "global_step": 370858, "epoch": 4468} {"train_loss": -26.196796417236328, "global_step": 370859, "epoch": 4468} {"train_loss": -26.395837783813477, "global_step": 370860, "epoch": 4468} {"train_loss": -25.984663009643555, "global_step": 370861, "epoch": 4468} {"train_loss": -26.212324142456055, "global_step": 370862, "epoch": 4468} {"train_loss": -26.419469833374023, "global_step": 370863, "epoch": 4468} {"train_loss": -26.54581069946289, "global_step": 370864, "epoch": 4468} {"train_loss": -26.340208053588867, "global_step": 370865, "epoch": 4468} {"train_loss": -26.213260650634766, "global_step": 370866, "epoch": 4468} {"train_loss": -26.411924362182617, "global_step": 370867, "epoch": 4468} {"train_loss": -26.097522735595703, "global_step": 370868, "epoch": 4468} {"train_loss": -26.081008911132812, "global_step": 370869, "epoch": 4468} {"train_loss": -26.419824600219727, "global_step": 370870, "epoch": 4468} {"train_loss": -26.376819610595703, "global_step": 370871, "epoch": 4468} {"train_loss": -26.06965446472168, "global_step": 370872, "epoch": 4468} {"train_loss": -26.857351303100586, "global_step": 370873, "epoch": 4468} {"train_loss": -26.04444694519043, "global_step": 370874, "epoch": 4468} {"train_loss": -26.23996925354004, "global_step": 370875, "epoch": 4468} {"train_loss": -26.014911651611328, "global_step": 370876, "epoch": 4468} {"train_loss": -26.019330978393555, "global_step": 370877, "epoch": 4468} {"train_loss": -26.360136032104492, "global_step": 370878, "epoch": 4468} {"train_loss": -26.220962524414062, "global_step": 370879, "epoch": 4468} {"train_loss": -26.40302848815918, "global_step": 370880, "epoch": 4468} {"train_loss": -26.44696044921875, "global_step": 370881, "epoch": 4468} {"train_loss": -26.691787719726562, "global_step": 370882, "epoch": 4468} {"train_loss": -26.070051193237305, "global_step": 370883, "epoch": 4468} {"train_loss": -26.524118423461914, "global_step": 370884, "epoch": 4468} {"train_loss": -25.968175888061523, "global_step": 370885, "epoch": 4468} {"train_loss": -26.31440544128418, "global_step": 370886, "epoch": 4468} {"train_loss": -26.318958282470703, "global_step": 370887, "epoch": 4468} {"train_loss": -26.112319946289062, "global_step": 370888, "epoch": 4468} {"train_loss": -26.375598907470703, "global_step": 370889, "epoch": 4468} {"train_loss": -26.278512954711914, "global_step": 370890, "epoch": 4468} {"train_loss": -26.426044464111328, "global_step": 370891, "epoch": 4468} {"train_loss": -26.499069213867188, "global_step": 370892, "epoch": 4468} {"train_loss": -25.81928825378418, "global_step": 370893, "epoch": 4468} {"train_loss": -26.384862899780273, "global_step": 370894, "epoch": 4468} {"train_loss": -26.151174545288086, "global_step": 370895, "epoch": 4468} {"train_loss": -26.41535758972168, "global_step": 370896, "epoch": 4468} {"train_loss": -26.416980743408203, "global_step": 370897, "epoch": 4468} {"train_loss": -26.035247802734375, "global_step": 370898, "epoch": 4468} {"train_loss": -26.33466911315918, "global_step": 370899, "epoch": 4468} {"train_loss": -26.430830001831055, "global_step": 370900, "epoch": 4468} {"train_loss": -26.616479873657227, "global_step": 370901, "epoch": 4468} {"train_loss": -26.205835342407227, "global_step": 370902, "epoch": 4468} {"train_loss": -26.121118545532227, "global_step": 370903, "epoch": 4468} {"train_loss": -26.426544189453125, "global_step": 370904, "epoch": 4468} {"train_loss": -26.398773193359375, "global_step": 370905, "epoch": 4468} {"train_loss": -26.238080978393555, "global_step": 370906, "epoch": 4468} {"train_loss": -26.199201583862305, "global_step": 370907, "epoch": 4468} {"train_loss": -26.584630966186523, "global_step": 370908, "epoch": 4468} {"train_loss": -26.715900421142578, "global_step": 370909, "epoch": 4468} {"train_loss": -26.311792373657227, "global_step": 370910, "epoch": 4468} {"train_loss": -26.806324005126953, "global_step": 370911, "epoch": 4468} {"train_loss": -26.40607261657715, "global_step": 370912, "epoch": 4468} {"train_loss": -26.45222282409668, "global_step": 370913, "epoch": 4468} {"train_loss": -26.308002471923828, "global_step": 370914, "epoch": 4468} {"train_loss": -26.602460861206055, "global_step": 370915, "epoch": 4468} {"train_loss": -26.177526473999023, "global_step": 370916, "epoch": 4468} {"train_loss": -26.925291061401367, "global_step": 370917, "epoch": 4468} {"train_loss": -26.553403854370117, "global_step": 370918, "epoch": 4468} {"train_loss": -26.265954971313477, "global_step": 370919, "epoch": 4468} {"train_loss": -26.480194091796875, "global_step": 370920, "epoch": 4468} {"train_loss": -26.59942054748535, "global_step": 370921, "epoch": 4468} {"train_loss": -26.41282081604004, "global_step": 370922, "epoch": 4468} {"train_loss": -26.848424911499023, "global_step": 370923, "epoch": 4468} {"train_loss": -26.60430908203125, "global_step": 370924, "epoch": 4468} {"train_loss": -26.43252944946289, "global_step": 370925, "epoch": 4468} {"train_loss": -26.33292294697589, "global_step": 370926, "epoch": 4468, "val_loss": 6641549.0} {"train_loss": -25.459970474243164, "global_step": 370927, "epoch": 4469} {"train_loss": -25.807920455932617, "global_step": 370928, "epoch": 4469} {"train_loss": -25.837209701538086, "global_step": 370929, "epoch": 4469} {"train_loss": -26.163894653320312, "global_step": 370930, "epoch": 4469} {"train_loss": -26.19502067565918, "global_step": 370931, "epoch": 4469} {"train_loss": -25.940664291381836, "global_step": 370932, "epoch": 4469} {"train_loss": -25.596759796142578, "global_step": 370933, "epoch": 4469} {"train_loss": -25.984851837158203, "global_step": 370934, "epoch": 4469} {"train_loss": -25.70393943786621, "global_step": 370935, "epoch": 4469} {"train_loss": -25.797094345092773, "global_step": 370936, "epoch": 4469} {"train_loss": -25.6903133392334, "global_step": 370937, "epoch": 4469} {"train_loss": -25.869108200073242, "global_step": 370938, "epoch": 4469} {"train_loss": -25.594532012939453, "global_step": 370939, "epoch": 4469} {"train_loss": -25.541296005249023, "global_step": 370940, "epoch": 4469} {"train_loss": -25.776508331298828, "global_step": 370941, "epoch": 4469} {"train_loss": -26.056360244750977, "global_step": 370942, "epoch": 4469} {"train_loss": -26.01140785217285, "global_step": 370943, "epoch": 4469} {"train_loss": -25.719924926757812, "global_step": 370944, "epoch": 4469} {"train_loss": -26.236801147460938, "global_step": 370945, "epoch": 4469} {"train_loss": -26.01058006286621, "global_step": 370946, "epoch": 4469} {"train_loss": -26.399280548095703, "global_step": 370947, "epoch": 4469} {"train_loss": -25.73529624938965, "global_step": 370948, "epoch": 4469} {"train_loss": -25.6358642578125, "global_step": 370949, "epoch": 4469} {"train_loss": -26.263961791992188, "global_step": 370950, "epoch": 4469} {"train_loss": -26.038970947265625, "global_step": 370951, "epoch": 4469} {"train_loss": -26.123004913330078, "global_step": 370952, "epoch": 4469} {"train_loss": -26.099721908569336, "global_step": 370953, "epoch": 4469} {"train_loss": -26.19959831237793, "global_step": 370954, "epoch": 4469} {"train_loss": -26.06377601623535, "global_step": 370955, "epoch": 4469} {"train_loss": -26.54255485534668, "global_step": 370956, "epoch": 4469} {"train_loss": -26.323272705078125, "global_step": 370957, "epoch": 4469} {"train_loss": -26.25739097595215, "global_step": 370958, "epoch": 4469} {"train_loss": -26.32265281677246, "global_step": 370959, "epoch": 4469} {"train_loss": -26.3817195892334, "global_step": 370960, "epoch": 4469} {"train_loss": -26.34063720703125, "global_step": 370961, "epoch": 4469} {"train_loss": -26.35065269470215, "global_step": 370962, "epoch": 4469} {"train_loss": -26.424789428710938, "global_step": 370963, "epoch": 4469} {"train_loss": -26.13669776916504, "global_step": 370964, "epoch": 4469} {"train_loss": -26.35935401916504, "global_step": 370965, "epoch": 4469} {"train_loss": -26.534605026245117, "global_step": 370966, "epoch": 4469} {"train_loss": -26.273351669311523, "global_step": 370967, "epoch": 4469} {"train_loss": -26.080921173095703, "global_step": 370968, "epoch": 4469} {"train_loss": -26.537607192993164, "global_step": 370969, "epoch": 4469} {"train_loss": -26.07614517211914, "global_step": 370970, "epoch": 4469} {"train_loss": -26.344989776611328, "global_step": 370971, "epoch": 4469} {"train_loss": -26.643543243408203, "global_step": 370972, "epoch": 4469} {"train_loss": -26.6772518157959, "global_step": 370973, "epoch": 4469} {"train_loss": -26.718164443969727, "global_step": 370974, "epoch": 4469} {"train_loss": -26.91963768005371, "global_step": 370975, "epoch": 4469} {"train_loss": -26.959089279174805, "global_step": 370976, "epoch": 4469} {"train_loss": -26.726520538330078, "global_step": 370977, "epoch": 4469} {"train_loss": -26.05311393737793, "global_step": 370978, "epoch": 4469} {"train_loss": -26.1473331451416, "global_step": 370979, "epoch": 4469} {"train_loss": -26.485021591186523, "global_step": 370980, "epoch": 4469} {"train_loss": -26.401885986328125, "global_step": 370981, "epoch": 4469} {"train_loss": -26.26582145690918, "global_step": 370982, "epoch": 4469} {"train_loss": -26.35847282409668, "global_step": 370983, "epoch": 4469} {"train_loss": -26.559417724609375, "global_step": 370984, "epoch": 4469} {"train_loss": -26.318923950195312, "global_step": 370985, "epoch": 4469} {"train_loss": -26.33188819885254, "global_step": 370986, "epoch": 4469} {"train_loss": -26.422595977783203, "global_step": 370987, "epoch": 4469} {"train_loss": -26.481109619140625, "global_step": 370988, "epoch": 4469} {"train_loss": -26.415283203125, "global_step": 370989, "epoch": 4469} {"train_loss": -26.396930694580078, "global_step": 370990, "epoch": 4469} {"train_loss": -26.69276237487793, "global_step": 370991, "epoch": 4469} {"train_loss": -26.288299560546875, "global_step": 370992, "epoch": 4469} {"train_loss": -25.987476348876953, "global_step": 370993, "epoch": 4469} {"train_loss": -26.334558486938477, "global_step": 370994, "epoch": 4469} {"train_loss": -25.811969757080078, "global_step": 370995, "epoch": 4469} {"train_loss": -26.46674919128418, "global_step": 370996, "epoch": 4469} {"train_loss": -26.446231842041016, "global_step": 370997, "epoch": 4469} {"train_loss": -26.142597198486328, "global_step": 370998, "epoch": 4469} {"train_loss": -26.32037353515625, "global_step": 370999, "epoch": 4469} {"train_loss": -26.57673454284668, "global_step": 371000, "epoch": 4469} {"train_loss": -26.793615341186523, "global_step": 371001, "epoch": 4469} {"train_loss": -26.58099365234375, "global_step": 371002, "epoch": 4469} {"train_loss": -26.683258056640625, "global_step": 371003, "epoch": 4469} {"train_loss": -26.02362632751465, "global_step": 371004, "epoch": 4469} {"train_loss": -26.336450576782227, "global_step": 371005, "epoch": 4469} {"train_loss": -26.1568660736084, "global_step": 371006, "epoch": 4469} {"train_loss": -26.1859130859375, "global_step": 371007, "epoch": 4469} {"train_loss": -26.1948299407959, "global_step": 371008, "epoch": 4469} {"train_loss": -26.211293645651942, "global_step": 371009, "epoch": 4469, "val_loss": 6604091.0} {"train_loss": -24.227386474609375, "global_step": 371010, "epoch": 4470} {"train_loss": -23.044099807739258, "global_step": 371011, "epoch": 4470} {"train_loss": -25.53877067565918, "global_step": 371012, "epoch": 4470} {"train_loss": -25.36574363708496, "global_step": 371013, "epoch": 4470} {"train_loss": -25.439552307128906, "global_step": 371014, "epoch": 4470} {"train_loss": -24.969390869140625, "global_step": 371015, "epoch": 4470} {"train_loss": -25.779897689819336, "global_step": 371016, "epoch": 4470} {"train_loss": -24.850759506225586, "global_step": 371017, "epoch": 4470} {"train_loss": -25.93544578552246, "global_step": 371018, "epoch": 4470} {"train_loss": -25.267303466796875, "global_step": 371019, "epoch": 4470} {"train_loss": -25.40048599243164, "global_step": 371020, "epoch": 4470} {"train_loss": -25.446130752563477, "global_step": 371021, "epoch": 4470} {"train_loss": -25.532424926757812, "global_step": 371022, "epoch": 4470} {"train_loss": -25.43975257873535, "global_step": 371023, "epoch": 4470} {"train_loss": -25.860116958618164, "global_step": 371024, "epoch": 4470} {"train_loss": -26.105060577392578, "global_step": 371025, "epoch": 4470} {"train_loss": -25.560211181640625, "global_step": 371026, "epoch": 4470} {"train_loss": -25.55777931213379, "global_step": 371027, "epoch": 4470} {"train_loss": -25.7875919342041, "global_step": 371028, "epoch": 4470} {"train_loss": -26.091907501220703, "global_step": 371029, "epoch": 4470} {"train_loss": -25.891260147094727, "global_step": 371030, "epoch": 4470} {"train_loss": -26.006134033203125, "global_step": 371031, "epoch": 4470} {"train_loss": -25.997507095336914, "global_step": 371032, "epoch": 4470} {"train_loss": -26.129547119140625, "global_step": 371033, "epoch": 4470} {"train_loss": -26.13508415222168, "global_step": 371034, "epoch": 4470} {"train_loss": -25.900609970092773, "global_step": 371035, "epoch": 4470} {"train_loss": -26.31077003479004, "global_step": 371036, "epoch": 4470} {"train_loss": -26.07071304321289, "global_step": 371037, "epoch": 4470} {"train_loss": -26.381195068359375, "global_step": 371038, "epoch": 4470} {"train_loss": -26.12678337097168, "global_step": 371039, "epoch": 4470} {"train_loss": -26.16414451599121, "global_step": 371040, "epoch": 4470} {"train_loss": -26.428003311157227, "global_step": 371041, "epoch": 4470} {"train_loss": -26.273529052734375, "global_step": 371042, "epoch": 4470} {"train_loss": -25.954336166381836, "global_step": 371043, "epoch": 4470} {"train_loss": -26.21626091003418, "global_step": 371044, "epoch": 4470} {"train_loss": -26.055936813354492, "global_step": 371045, "epoch": 4470} {"train_loss": -26.6717529296875, "global_step": 371046, "epoch": 4470} {"train_loss": -26.090042114257812, "global_step": 371047, "epoch": 4470} {"train_loss": -26.43043327331543, "global_step": 371048, "epoch": 4470} {"train_loss": -26.72381019592285, "global_step": 371049, "epoch": 4470} {"train_loss": -26.011457443237305, "global_step": 371050, "epoch": 4470} {"train_loss": -26.506269454956055, "global_step": 371051, "epoch": 4470} {"train_loss": -26.090063095092773, "global_step": 371052, "epoch": 4470} {"train_loss": -26.35321617126465, "global_step": 371053, "epoch": 4470} {"train_loss": -26.256549835205078, "global_step": 371054, "epoch": 4470} {"train_loss": -26.25977897644043, "global_step": 371055, "epoch": 4470} {"train_loss": -26.410444259643555, "global_step": 371056, "epoch": 4470} {"train_loss": -26.3548583984375, "global_step": 371057, "epoch": 4470} {"train_loss": -26.643396377563477, "global_step": 371058, "epoch": 4470} {"train_loss": -26.27911376953125, "global_step": 371059, "epoch": 4470} {"train_loss": -26.003339767456055, "global_step": 371060, "epoch": 4470} {"train_loss": -26.524417877197266, "global_step": 371061, "epoch": 4470} {"train_loss": -26.18674659729004, "global_step": 371062, "epoch": 4470} {"train_loss": -26.08798599243164, "global_step": 371063, "epoch": 4470} {"train_loss": -26.040990829467773, "global_step": 371064, "epoch": 4470} {"train_loss": -25.89898109436035, "global_step": 371065, "epoch": 4470} {"train_loss": -26.149778366088867, "global_step": 371066, "epoch": 4470} {"train_loss": -26.4423828125, "global_step": 371067, "epoch": 4470} {"train_loss": -26.115619659423828, "global_step": 371068, "epoch": 4470} {"train_loss": -26.214231491088867, "global_step": 371069, "epoch": 4470} {"train_loss": -26.3732967376709, "global_step": 371070, "epoch": 4470} {"train_loss": -26.31768798828125, "global_step": 371071, "epoch": 4470} {"train_loss": -26.294660568237305, "global_step": 371072, "epoch": 4470} {"train_loss": -26.180988311767578, "global_step": 371073, "epoch": 4470} {"train_loss": -26.456085205078125, "global_step": 371074, "epoch": 4470} {"train_loss": -25.96795654296875, "global_step": 371075, "epoch": 4470} {"train_loss": -26.42494010925293, "global_step": 371076, "epoch": 4470} {"train_loss": -26.392105102539062, "global_step": 371077, "epoch": 4470} {"train_loss": -26.460540771484375, "global_step": 371078, "epoch": 4470} {"train_loss": -26.000146865844727, "global_step": 371079, "epoch": 4470} {"train_loss": -26.61528968811035, "global_step": 371080, "epoch": 4470} {"train_loss": -26.293359756469727, "global_step": 371081, "epoch": 4470} {"train_loss": -26.186145782470703, "global_step": 371082, "epoch": 4470} {"train_loss": -26.21381950378418, "global_step": 371083, "epoch": 4470} {"train_loss": -26.429929733276367, "global_step": 371084, "epoch": 4470} {"train_loss": -26.331008911132812, "global_step": 371085, "epoch": 4470} {"train_loss": -26.355756759643555, "global_step": 371086, "epoch": 4470} {"train_loss": -26.401641845703125, "global_step": 371087, "epoch": 4470} {"train_loss": -26.356800079345703, "global_step": 371088, "epoch": 4470} {"train_loss": -26.679182052612305, "global_step": 371089, "epoch": 4470} {"train_loss": -26.482629776000977, "global_step": 371090, "epoch": 4470} {"train_loss": -26.25165367126465, "global_step": 371091, "epoch": 4470} {"train_loss": -26.06029133624341, "global_step": 371092, "epoch": 4470, "val_loss": 6532035.5} {"train_loss": -26.168638229370117, "global_step": 371093, "epoch": 4471} {"train_loss": -25.97134780883789, "global_step": 371094, "epoch": 4471} {"train_loss": -25.94532585144043, "global_step": 371095, "epoch": 4471} {"train_loss": -26.402673721313477, "global_step": 371096, "epoch": 4471} {"train_loss": -25.867237091064453, "global_step": 371097, "epoch": 4471} {"train_loss": -25.962772369384766, "global_step": 371098, "epoch": 4471} {"train_loss": -26.33552360534668, "global_step": 371099, "epoch": 4471} {"train_loss": -25.525970458984375, "global_step": 371100, "epoch": 4471} {"train_loss": -26.239917755126953, "global_step": 371101, "epoch": 4471} {"train_loss": -26.306232452392578, "global_step": 371102, "epoch": 4471} {"train_loss": -25.994491577148438, "global_step": 371103, "epoch": 4471} {"train_loss": -26.289794921875, "global_step": 371104, "epoch": 4471} {"train_loss": -26.372364044189453, "global_step": 371105, "epoch": 4471} {"train_loss": -25.81477165222168, "global_step": 371106, "epoch": 4471} {"train_loss": -25.575719833374023, "global_step": 371107, "epoch": 4471} {"train_loss": -26.291208267211914, "global_step": 371108, "epoch": 4471} {"train_loss": -26.075891494750977, "global_step": 371109, "epoch": 4471} {"train_loss": -26.22645378112793, "global_step": 371110, "epoch": 4471} {"train_loss": -26.358617782592773, "global_step": 371111, "epoch": 4471} {"train_loss": -26.58090591430664, "global_step": 371112, "epoch": 4471} {"train_loss": -26.081018447875977, "global_step": 371113, "epoch": 4471} {"train_loss": -26.3378849029541, "global_step": 371114, "epoch": 4471} {"train_loss": -26.35137367248535, "global_step": 371115, "epoch": 4471} {"train_loss": -26.312549591064453, "global_step": 371116, "epoch": 4471} {"train_loss": -26.240015029907227, "global_step": 371117, "epoch": 4471} {"train_loss": -26.430927276611328, "global_step": 371118, "epoch": 4471} {"train_loss": -26.5242977142334, "global_step": 371119, "epoch": 4471} {"train_loss": -26.303991317749023, "global_step": 371120, "epoch": 4471} {"train_loss": -26.21494483947754, "global_step": 371121, "epoch": 4471} {"train_loss": -26.233503341674805, "global_step": 371122, "epoch": 4471} {"train_loss": -26.279712677001953, "global_step": 371123, "epoch": 4471} {"train_loss": -26.125446319580078, "global_step": 371124, "epoch": 4471} {"train_loss": -26.405874252319336, "global_step": 371125, "epoch": 4471} {"train_loss": -26.380950927734375, "global_step": 371126, "epoch": 4471} {"train_loss": -26.497161865234375, "global_step": 371127, "epoch": 4471} {"train_loss": -26.1802978515625, "global_step": 371128, "epoch": 4471} {"train_loss": -26.72979164123535, "global_step": 371129, "epoch": 4471} {"train_loss": -26.17388916015625, "global_step": 371130, "epoch": 4471} {"train_loss": -26.397144317626953, "global_step": 371131, "epoch": 4471} {"train_loss": -26.31220817565918, "global_step": 371132, "epoch": 4471} {"train_loss": -26.440610885620117, "global_step": 371133, "epoch": 4471} {"train_loss": -26.591999053955078, "global_step": 371134, "epoch": 4471} {"train_loss": -26.381610870361328, "global_step": 371135, "epoch": 4471} {"train_loss": -26.48456382751465, "global_step": 371136, "epoch": 4471} {"train_loss": -26.351871490478516, "global_step": 371137, "epoch": 4471} {"train_loss": -26.673120498657227, "global_step": 371138, "epoch": 4471} {"train_loss": -26.642629623413086, "global_step": 371139, "epoch": 4471} {"train_loss": -26.739185333251953, "global_step": 371140, "epoch": 4471} {"train_loss": -26.61203384399414, "global_step": 371141, "epoch": 4471} {"train_loss": -26.245136260986328, "global_step": 371142, "epoch": 4471} {"train_loss": -26.726703643798828, "global_step": 371143, "epoch": 4471} {"train_loss": -26.576696395874023, "global_step": 371144, "epoch": 4471} {"train_loss": -26.426071166992188, "global_step": 371145, "epoch": 4471} {"train_loss": -26.645252227783203, "global_step": 371146, "epoch": 4471} {"train_loss": -26.4585018157959, "global_step": 371147, "epoch": 4471} {"train_loss": -26.49016761779785, "global_step": 371148, "epoch": 4471} {"train_loss": -26.21272087097168, "global_step": 371149, "epoch": 4471} {"train_loss": -26.714435577392578, "global_step": 371150, "epoch": 4471} {"train_loss": -26.3626766204834, "global_step": 371151, "epoch": 4471} {"train_loss": -26.341968536376953, "global_step": 371152, "epoch": 4471} {"train_loss": -26.474029541015625, "global_step": 371153, "epoch": 4471} {"train_loss": -26.574132919311523, "global_step": 371154, "epoch": 4471} {"train_loss": -26.39983558654785, "global_step": 371155, "epoch": 4471} {"train_loss": -25.625364303588867, "global_step": 371156, "epoch": 4471} {"train_loss": -25.884403228759766, "global_step": 371157, "epoch": 4471} {"train_loss": -26.52129554748535, "global_step": 371158, "epoch": 4471} {"train_loss": -26.13287353515625, "global_step": 371159, "epoch": 4471} {"train_loss": -26.070775985717773, "global_step": 371160, "epoch": 4471} {"train_loss": -25.717166900634766, "global_step": 371161, "epoch": 4471} {"train_loss": -25.87225341796875, "global_step": 371162, "epoch": 4471} {"train_loss": -26.174835205078125, "global_step": 371163, "epoch": 4471} {"train_loss": -26.19553565979004, "global_step": 371164, "epoch": 4471} {"train_loss": -26.130630493164062, "global_step": 371165, "epoch": 4471} {"train_loss": -25.720808029174805, "global_step": 371166, "epoch": 4471} {"train_loss": -26.3739070892334, "global_step": 371167, "epoch": 4471} {"train_loss": -26.28609275817871, "global_step": 371168, "epoch": 4471} {"train_loss": -26.599512100219727, "global_step": 371169, "epoch": 4471} {"train_loss": -26.65389060974121, "global_step": 371170, "epoch": 4471} {"train_loss": -26.38437843322754, "global_step": 371171, "epoch": 4471} {"train_loss": -26.20295524597168, "global_step": 371172, "epoch": 4471} {"train_loss": -26.149112701416016, "global_step": 371173, "epoch": 4471} {"train_loss": -26.2230224609375, "global_step": 371174, "epoch": 4471} {"train_loss": -26.275463311068982, "global_step": 371175, "epoch": 4471, "val_loss": 6630129.0} {"train_loss": -26.002471923828125, "global_step": 371176, "epoch": 4472} {"train_loss": -26.413761138916016, "global_step": 371177, "epoch": 4472} {"train_loss": -26.119140625, "global_step": 371178, "epoch": 4472} {"train_loss": -26.242145538330078, "global_step": 371179, "epoch": 4472} {"train_loss": -26.16228675842285, "global_step": 371180, "epoch": 4472} {"train_loss": -25.877838134765625, "global_step": 371181, "epoch": 4472} {"train_loss": -25.640201568603516, "global_step": 371182, "epoch": 4472} {"train_loss": -26.352710723876953, "global_step": 371183, "epoch": 4472} {"train_loss": -25.929412841796875, "global_step": 371184, "epoch": 4472} {"train_loss": -25.850500106811523, "global_step": 371185, "epoch": 4472} {"train_loss": -26.293319702148438, "global_step": 371186, "epoch": 4472} {"train_loss": -26.20487403869629, "global_step": 371187, "epoch": 4472} {"train_loss": -26.454837799072266, "global_step": 371188, "epoch": 4472} {"train_loss": -26.24482536315918, "global_step": 371189, "epoch": 4472} {"train_loss": -25.966161727905273, "global_step": 371190, "epoch": 4472} {"train_loss": -26.041894912719727, "global_step": 371191, "epoch": 4472} {"train_loss": -26.530841827392578, "global_step": 371192, "epoch": 4472} {"train_loss": -25.9626407623291, "global_step": 371193, "epoch": 4472} {"train_loss": -26.504743576049805, "global_step": 371194, "epoch": 4472} {"train_loss": -26.46954345703125, "global_step": 371195, "epoch": 4472} {"train_loss": -26.302371978759766, "global_step": 371196, "epoch": 4472} {"train_loss": -26.43182373046875, "global_step": 371197, "epoch": 4472} {"train_loss": -26.74997329711914, "global_step": 371198, "epoch": 4472} {"train_loss": -26.091358184814453, "global_step": 371199, "epoch": 4472} {"train_loss": -26.663328170776367, "global_step": 371200, "epoch": 4472} {"train_loss": -26.36995506286621, "global_step": 371201, "epoch": 4472} {"train_loss": -26.448408126831055, "global_step": 371202, "epoch": 4472} {"train_loss": -26.5323429107666, "global_step": 371203, "epoch": 4472} {"train_loss": -26.48758888244629, "global_step": 371204, "epoch": 4472} {"train_loss": -26.38837242126465, "global_step": 371205, "epoch": 4472} {"train_loss": -26.5492000579834, "global_step": 371206, "epoch": 4472} {"train_loss": -26.46418571472168, "global_step": 371207, "epoch": 4472} {"train_loss": -26.16151237487793, "global_step": 371208, "epoch": 4472} {"train_loss": -26.435083389282227, "global_step": 371209, "epoch": 4472} {"train_loss": -26.497716903686523, "global_step": 371210, "epoch": 4472} {"train_loss": -26.133581161499023, "global_step": 371211, "epoch": 4472} {"train_loss": -26.51580238342285, "global_step": 371212, "epoch": 4472} {"train_loss": -26.21808433532715, "global_step": 371213, "epoch": 4472} {"train_loss": -26.32048988342285, "global_step": 371214, "epoch": 4472} {"train_loss": -26.117456436157227, "global_step": 371215, "epoch": 4472} {"train_loss": -26.71125602722168, "global_step": 371216, "epoch": 4472} {"train_loss": -26.3797550201416, "global_step": 371217, "epoch": 4472} {"train_loss": -26.3764591217041, "global_step": 371218, "epoch": 4472} {"train_loss": -26.3934326171875, "global_step": 371219, "epoch": 4472} {"train_loss": -26.417251586914062, "global_step": 371220, "epoch": 4472} {"train_loss": -26.420164108276367, "global_step": 371221, "epoch": 4472} {"train_loss": -26.419340133666992, "global_step": 371222, "epoch": 4472} {"train_loss": -26.23154067993164, "global_step": 371223, "epoch": 4472} {"train_loss": -26.473241806030273, "global_step": 371224, "epoch": 4472} {"train_loss": -26.406024932861328, "global_step": 371225, "epoch": 4472} {"train_loss": -26.93072509765625, "global_step": 371226, "epoch": 4472} {"train_loss": -26.4415340423584, "global_step": 371227, "epoch": 4472} {"train_loss": -26.363910675048828, "global_step": 371228, "epoch": 4472} {"train_loss": -26.7154541015625, "global_step": 371229, "epoch": 4472} {"train_loss": -26.599084854125977, "global_step": 371230, "epoch": 4472} {"train_loss": -26.414987564086914, "global_step": 371231, "epoch": 4472} {"train_loss": -26.063852310180664, "global_step": 371232, "epoch": 4472} {"train_loss": -26.206113815307617, "global_step": 371233, "epoch": 4472} {"train_loss": -26.234033584594727, "global_step": 371234, "epoch": 4472} {"train_loss": -26.769750595092773, "global_step": 371235, "epoch": 4472} {"train_loss": -26.417219161987305, "global_step": 371236, "epoch": 4472} {"train_loss": -26.583654403686523, "global_step": 371237, "epoch": 4472} {"train_loss": -26.66290283203125, "global_step": 371238, "epoch": 4472} {"train_loss": -26.356725692749023, "global_step": 371239, "epoch": 4472} {"train_loss": -26.723785400390625, "global_step": 371240, "epoch": 4472} {"train_loss": -26.854724884033203, "global_step": 371241, "epoch": 4472} {"train_loss": -26.272790908813477, "global_step": 371242, "epoch": 4472} {"train_loss": -26.534971237182617, "global_step": 371243, "epoch": 4472} {"train_loss": -26.3978271484375, "global_step": 371244, "epoch": 4472} {"train_loss": -26.58392906188965, "global_step": 371245, "epoch": 4472} {"train_loss": -26.61859703063965, "global_step": 371246, "epoch": 4472} {"train_loss": -26.27888298034668, "global_step": 371247, "epoch": 4472} {"train_loss": -26.1667423248291, "global_step": 371248, "epoch": 4472} {"train_loss": -26.172399520874023, "global_step": 371249, "epoch": 4472} {"train_loss": -26.450153350830078, "global_step": 371250, "epoch": 4472} {"train_loss": -25.957672119140625, "global_step": 371251, "epoch": 4472} {"train_loss": -26.416013717651367, "global_step": 371252, "epoch": 4472} {"train_loss": -26.426755905151367, "global_step": 371253, "epoch": 4472} {"train_loss": -26.18313980102539, "global_step": 371254, "epoch": 4472} {"train_loss": -26.249420166015625, "global_step": 371255, "epoch": 4472} {"train_loss": -26.112567901611328, "global_step": 371256, "epoch": 4472} {"train_loss": -26.16302490234375, "global_step": 371257, "epoch": 4472} {"train_loss": -26.37364771279944, "global_step": 371258, "epoch": 4472, "val_loss": 6656299.0} {"train_loss": -24.284894943237305, "global_step": 371259, "epoch": 4473} {"train_loss": -25.34895133972168, "global_step": 371260, "epoch": 4473} {"train_loss": -25.537311553955078, "global_step": 371261, "epoch": 4473} {"train_loss": -25.537368774414062, "global_step": 371262, "epoch": 4473} {"train_loss": -24.981666564941406, "global_step": 371263, "epoch": 4473} {"train_loss": -25.483678817749023, "global_step": 371264, "epoch": 4473} {"train_loss": -25.483983993530273, "global_step": 371265, "epoch": 4473} {"train_loss": -25.245946884155273, "global_step": 371266, "epoch": 4473} {"train_loss": -25.4434871673584, "global_step": 371267, "epoch": 4473} {"train_loss": -25.776269912719727, "global_step": 371268, "epoch": 4473} {"train_loss": -25.241703033447266, "global_step": 371269, "epoch": 4473} {"train_loss": -25.574542999267578, "global_step": 371270, "epoch": 4473} {"train_loss": -25.63334083557129, "global_step": 371271, "epoch": 4473} {"train_loss": -25.709503173828125, "global_step": 371272, "epoch": 4473} {"train_loss": -25.79212760925293, "global_step": 371273, "epoch": 4473} {"train_loss": -25.443201065063477, "global_step": 371274, "epoch": 4473} {"train_loss": -25.523427963256836, "global_step": 371275, "epoch": 4473} {"train_loss": -25.47267723083496, "global_step": 371276, "epoch": 4473} {"train_loss": -26.004011154174805, "global_step": 371277, "epoch": 4473} {"train_loss": -25.553125381469727, "global_step": 371278, "epoch": 4473} {"train_loss": -26.000385284423828, "global_step": 371279, "epoch": 4473} {"train_loss": -25.80023765563965, "global_step": 371280, "epoch": 4473} {"train_loss": -25.93731117248535, "global_step": 371281, "epoch": 4473} {"train_loss": -26.07350730895996, "global_step": 371282, "epoch": 4473} {"train_loss": -26.221372604370117, "global_step": 371283, "epoch": 4473} {"train_loss": -26.043943405151367, "global_step": 371284, "epoch": 4473} {"train_loss": -26.09096336364746, "global_step": 371285, "epoch": 4473} {"train_loss": -26.19424819946289, "global_step": 371286, "epoch": 4473} {"train_loss": -26.052173614501953, "global_step": 371287, "epoch": 4473} {"train_loss": -26.241714477539062, "global_step": 371288, "epoch": 4473} {"train_loss": -26.064605712890625, "global_step": 371289, "epoch": 4473} {"train_loss": -26.332971572875977, "global_step": 371290, "epoch": 4473} {"train_loss": -26.175214767456055, "global_step": 371291, "epoch": 4473} {"train_loss": -25.961217880249023, "global_step": 371292, "epoch": 4473} {"train_loss": -26.281286239624023, "global_step": 371293, "epoch": 4473} {"train_loss": -26.60929298400879, "global_step": 371294, "epoch": 4473} {"train_loss": -26.54605484008789, "global_step": 371295, "epoch": 4473} {"train_loss": -26.35164451599121, "global_step": 371296, "epoch": 4473} {"train_loss": -26.37485122680664, "global_step": 371297, "epoch": 4473} {"train_loss": -26.0655460357666, "global_step": 371298, "epoch": 4473} {"train_loss": -26.390552520751953, "global_step": 371299, "epoch": 4473} {"train_loss": -26.364912033081055, "global_step": 371300, "epoch": 4473} {"train_loss": -26.689233779907227, "global_step": 371301, "epoch": 4473} {"train_loss": -26.381103515625, "global_step": 371302, "epoch": 4473} {"train_loss": -25.942068099975586, "global_step": 371303, "epoch": 4473} {"train_loss": -26.753650665283203, "global_step": 371304, "epoch": 4473} {"train_loss": -26.494659423828125, "global_step": 371305, "epoch": 4473} {"train_loss": -26.066192626953125, "global_step": 371306, "epoch": 4473} {"train_loss": -26.5459041595459, "global_step": 371307, "epoch": 4473} {"train_loss": -26.320037841796875, "global_step": 371308, "epoch": 4473} {"train_loss": -26.328723907470703, "global_step": 371309, "epoch": 4473} {"train_loss": -26.290348052978516, "global_step": 371310, "epoch": 4473} {"train_loss": -26.21126365661621, "global_step": 371311, "epoch": 4473} {"train_loss": -26.318405151367188, "global_step": 371312, "epoch": 4473} {"train_loss": -26.704893112182617, "global_step": 371313, "epoch": 4473} {"train_loss": -26.2910099029541, "global_step": 371314, "epoch": 4473} {"train_loss": -26.193359375, "global_step": 371315, "epoch": 4473} {"train_loss": -26.487579345703125, "global_step": 371316, "epoch": 4473} {"train_loss": -26.327594757080078, "global_step": 371317, "epoch": 4473} {"train_loss": -26.5725154876709, "global_step": 371318, "epoch": 4473} {"train_loss": -26.48382568359375, "global_step": 371319, "epoch": 4473} {"train_loss": -26.67658042907715, "global_step": 371320, "epoch": 4473} {"train_loss": -26.633527755737305, "global_step": 371321, "epoch": 4473} {"train_loss": -26.508676528930664, "global_step": 371322, "epoch": 4473} {"train_loss": -26.256372451782227, "global_step": 371323, "epoch": 4473} {"train_loss": -26.52435302734375, "global_step": 371324, "epoch": 4473} {"train_loss": -26.18459129333496, "global_step": 371325, "epoch": 4473} {"train_loss": -26.853052139282227, "global_step": 371326, "epoch": 4473} {"train_loss": -26.098392486572266, "global_step": 371327, "epoch": 4473} {"train_loss": -25.668567657470703, "global_step": 371328, "epoch": 4473} {"train_loss": -25.601154327392578, "global_step": 371329, "epoch": 4473} {"train_loss": -26.09584617614746, "global_step": 371330, "epoch": 4473} {"train_loss": -25.946264266967773, "global_step": 371331, "epoch": 4473} {"train_loss": -26.548765182495117, "global_step": 371332, "epoch": 4473} {"train_loss": -26.2744197845459, "global_step": 371333, "epoch": 4473} {"train_loss": -26.261194229125977, "global_step": 371334, "epoch": 4473} {"train_loss": -26.113615036010742, "global_step": 371335, "epoch": 4473} {"train_loss": -25.82637596130371, "global_step": 371336, "epoch": 4473} {"train_loss": -26.25575065612793, "global_step": 371337, "epoch": 4473} {"train_loss": -26.4603214263916, "global_step": 371338, "epoch": 4473} {"train_loss": -26.540557861328125, "global_step": 371339, "epoch": 4473} {"train_loss": -26.095306396484375, "global_step": 371340, "epoch": 4473} {"train_loss": -26.080401799764978, "global_step": 371341, "epoch": 4473, "val_loss": 6752902.5} {"train_loss": -26.266681671142578, "global_step": 371342, "epoch": 4474} {"train_loss": -25.959936141967773, "global_step": 371343, "epoch": 4474} {"train_loss": -26.1141300201416, "global_step": 371344, "epoch": 4474} {"train_loss": -26.073474884033203, "global_step": 371345, "epoch": 4474} {"train_loss": -26.16322898864746, "global_step": 371346, "epoch": 4474} {"train_loss": -25.94172477722168, "global_step": 371347, "epoch": 4474} {"train_loss": -26.188873291015625, "global_step": 371348, "epoch": 4474} {"train_loss": -26.05269432067871, "global_step": 371349, "epoch": 4474} {"train_loss": -26.20917320251465, "global_step": 371350, "epoch": 4474} {"train_loss": -26.50164794921875, "global_step": 371351, "epoch": 4474} {"train_loss": -26.14466667175293, "global_step": 371352, "epoch": 4474} {"train_loss": -26.06873893737793, "global_step": 371353, "epoch": 4474} {"train_loss": -25.939422607421875, "global_step": 371354, "epoch": 4474} {"train_loss": -26.111352920532227, "global_step": 371355, "epoch": 4474} {"train_loss": -26.35822868347168, "global_step": 371356, "epoch": 4474} {"train_loss": -26.091718673706055, "global_step": 371357, "epoch": 4474} {"train_loss": -26.333829879760742, "global_step": 371358, "epoch": 4474} {"train_loss": -26.17396354675293, "global_step": 371359, "epoch": 4474} {"train_loss": -25.880680084228516, "global_step": 371360, "epoch": 4474} {"train_loss": -26.11103630065918, "global_step": 371361, "epoch": 4474} {"train_loss": -26.557270050048828, "global_step": 371362, "epoch": 4474} {"train_loss": -26.28010368347168, "global_step": 371363, "epoch": 4474} {"train_loss": -26.29998207092285, "global_step": 371364, "epoch": 4474} {"train_loss": -26.395694732666016, "global_step": 371365, "epoch": 4474} {"train_loss": -26.387781143188477, "global_step": 371366, "epoch": 4474} {"train_loss": -25.951526641845703, "global_step": 371367, "epoch": 4474} {"train_loss": -26.284513473510742, "global_step": 371368, "epoch": 4474} {"train_loss": -26.335681915283203, "global_step": 371369, "epoch": 4474} {"train_loss": -26.592626571655273, "global_step": 371370, "epoch": 4474} {"train_loss": -26.336505889892578, "global_step": 371371, "epoch": 4474} {"train_loss": -26.119558334350586, "global_step": 371372, "epoch": 4474} {"train_loss": -26.571340560913086, "global_step": 371373, "epoch": 4474} {"train_loss": -26.952774047851562, "global_step": 371374, "epoch": 4474} {"train_loss": -26.469318389892578, "global_step": 371375, "epoch": 4474} {"train_loss": -26.432790756225586, "global_step": 371376, "epoch": 4474} {"train_loss": -26.57636833190918, "global_step": 371377, "epoch": 4474} {"train_loss": -26.468982696533203, "global_step": 371378, "epoch": 4474} {"train_loss": -26.053497314453125, "global_step": 371379, "epoch": 4474} {"train_loss": -26.352537155151367, "global_step": 371380, "epoch": 4474} {"train_loss": -25.692874908447266, "global_step": 371381, "epoch": 4474} {"train_loss": -25.732440948486328, "global_step": 371382, "epoch": 4474} {"train_loss": -25.81012535095215, "global_step": 371383, "epoch": 4474} {"train_loss": -26.183008193969727, "global_step": 371384, "epoch": 4474} {"train_loss": -26.492151260375977, "global_step": 371385, "epoch": 4474} {"train_loss": -26.027868270874023, "global_step": 371386, "epoch": 4474} {"train_loss": -26.52044677734375, "global_step": 371387, "epoch": 4474} {"train_loss": -26.420705795288086, "global_step": 371388, "epoch": 4474} {"train_loss": -26.73417091369629, "global_step": 371389, "epoch": 4474} {"train_loss": -26.19707679748535, "global_step": 371390, "epoch": 4474} {"train_loss": -26.666431427001953, "global_step": 371391, "epoch": 4474} {"train_loss": -26.283496856689453, "global_step": 371392, "epoch": 4474} {"train_loss": -26.686878204345703, "global_step": 371393, "epoch": 4474} {"train_loss": -26.537466049194336, "global_step": 371394, "epoch": 4474} {"train_loss": -26.298023223876953, "global_step": 371395, "epoch": 4474} {"train_loss": -26.67217445373535, "global_step": 371396, "epoch": 4474} {"train_loss": -26.29457664489746, "global_step": 371397, "epoch": 4474} {"train_loss": -26.096647262573242, "global_step": 371398, "epoch": 4474} {"train_loss": -26.59195899963379, "global_step": 371399, "epoch": 4474} {"train_loss": -26.191190719604492, "global_step": 371400, "epoch": 4474} {"train_loss": -26.374460220336914, "global_step": 371401, "epoch": 4474} {"train_loss": -26.292383193969727, "global_step": 371402, "epoch": 4474} {"train_loss": -26.133209228515625, "global_step": 371403, "epoch": 4474} {"train_loss": -26.608936309814453, "global_step": 371404, "epoch": 4474} {"train_loss": -26.697040557861328, "global_step": 371405, "epoch": 4474} {"train_loss": -26.478809356689453, "global_step": 371406, "epoch": 4474} {"train_loss": -26.983118057250977, "global_step": 371407, "epoch": 4474} {"train_loss": -26.668899536132812, "global_step": 371408, "epoch": 4474} {"train_loss": -26.748966217041016, "global_step": 371409, "epoch": 4474} {"train_loss": -26.601531982421875, "global_step": 371410, "epoch": 4474} {"train_loss": -26.762365341186523, "global_step": 371411, "epoch": 4474} {"train_loss": -26.384546279907227, "global_step": 371412, "epoch": 4474} {"train_loss": -26.60224723815918, "global_step": 371413, "epoch": 4474} {"train_loss": -26.6347599029541, "global_step": 371414, "epoch": 4474} {"train_loss": -26.720855712890625, "global_step": 371415, "epoch": 4474} {"train_loss": -26.73402214050293, "global_step": 371416, "epoch": 4474} {"train_loss": -26.08978843688965, "global_step": 371417, "epoch": 4474} {"train_loss": -25.244640350341797, "global_step": 371418, "epoch": 4474} {"train_loss": -23.5605525970459, "global_step": 371419, "epoch": 4474} {"train_loss": -23.559707641601562, "global_step": 371420, "epoch": 4474} {"train_loss": -25.13740348815918, "global_step": 371421, "epoch": 4474} {"train_loss": -24.927291870117188, "global_step": 371422, "epoch": 4474} {"train_loss": -25.224319458007812, "global_step": 371423, "epoch": 4474} {"train_loss": -26.20133475797722, "global_step": 371424, "epoch": 4474, "val_loss": 6612339.0} {"train_loss": -24.648283004760742, "global_step": 371425, "epoch": 4475} {"train_loss": -25.43110466003418, "global_step": 371426, "epoch": 4475} {"train_loss": -25.05445671081543, "global_step": 371427, "epoch": 4475} {"train_loss": -25.244821548461914, "global_step": 371428, "epoch": 4475} {"train_loss": -24.836942672729492, "global_step": 371429, "epoch": 4475} {"train_loss": -25.253936767578125, "global_step": 371430, "epoch": 4475} {"train_loss": -25.31365966796875, "global_step": 371431, "epoch": 4475} {"train_loss": -24.983198165893555, "global_step": 371432, "epoch": 4475} {"train_loss": -25.334285736083984, "global_step": 371433, "epoch": 4475} {"train_loss": -25.206418991088867, "global_step": 371434, "epoch": 4475} {"train_loss": -25.634185791015625, "global_step": 371435, "epoch": 4475} {"train_loss": -25.352859497070312, "global_step": 371436, "epoch": 4475} {"train_loss": -25.3298282623291, "global_step": 371437, "epoch": 4475} {"train_loss": -25.360837936401367, "global_step": 371438, "epoch": 4475} {"train_loss": -25.679168701171875, "global_step": 371439, "epoch": 4475} {"train_loss": -25.221755981445312, "global_step": 371440, "epoch": 4475} {"train_loss": -25.8902645111084, "global_step": 371441, "epoch": 4475} {"train_loss": -26.02445411682129, "global_step": 371442, "epoch": 4475} {"train_loss": -26.090925216674805, "global_step": 371443, "epoch": 4475} {"train_loss": -25.46205711364746, "global_step": 371444, "epoch": 4475} {"train_loss": -25.586759567260742, "global_step": 371445, "epoch": 4475} {"train_loss": -25.43544578552246, "global_step": 371446, "epoch": 4475} {"train_loss": -25.594125747680664, "global_step": 371447, "epoch": 4475} {"train_loss": -25.86093521118164, "global_step": 371448, "epoch": 4475} {"train_loss": -26.211896896362305, "global_step": 371449, "epoch": 4475} {"train_loss": -26.118743896484375, "global_step": 371450, "epoch": 4475} {"train_loss": -25.799945831298828, "global_step": 371451, "epoch": 4475} {"train_loss": -26.04994010925293, "global_step": 371452, "epoch": 4475} {"train_loss": -25.493057250976562, "global_step": 371453, "epoch": 4475} {"train_loss": -26.173078536987305, "global_step": 371454, "epoch": 4475} {"train_loss": -26.239728927612305, "global_step": 371455, "epoch": 4475} {"train_loss": -26.153366088867188, "global_step": 371456, "epoch": 4475} {"train_loss": -26.40057945251465, "global_step": 371457, "epoch": 4475} {"train_loss": -25.903400421142578, "global_step": 371458, "epoch": 4475} {"train_loss": -26.5122013092041, "global_step": 371459, "epoch": 4475} {"train_loss": -26.22466468811035, "global_step": 371460, "epoch": 4475} {"train_loss": -26.040449142456055, "global_step": 371461, "epoch": 4475} {"train_loss": -26.271747589111328, "global_step": 371462, "epoch": 4475} {"train_loss": -26.421483993530273, "global_step": 371463, "epoch": 4475} {"train_loss": -26.188085556030273, "global_step": 371464, "epoch": 4475} {"train_loss": -26.211225509643555, "global_step": 371465, "epoch": 4475} {"train_loss": -26.06361198425293, "global_step": 371466, "epoch": 4475} {"train_loss": -26.293548583984375, "global_step": 371467, "epoch": 4475} {"train_loss": -26.121084213256836, "global_step": 371468, "epoch": 4475} {"train_loss": -26.35662841796875, "global_step": 371469, "epoch": 4475} {"train_loss": -26.391992568969727, "global_step": 371470, "epoch": 4475} {"train_loss": -26.471830368041992, "global_step": 371471, "epoch": 4475} {"train_loss": -26.52437400817871, "global_step": 371472, "epoch": 4475} {"train_loss": -26.32095718383789, "global_step": 371473, "epoch": 4475} {"train_loss": -26.22041130065918, "global_step": 371474, "epoch": 4475} {"train_loss": -26.454084396362305, "global_step": 371475, "epoch": 4475} {"train_loss": -26.169050216674805, "global_step": 371476, "epoch": 4475} {"train_loss": -26.286840438842773, "global_step": 371477, "epoch": 4475} {"train_loss": -26.67962074279785, "global_step": 371478, "epoch": 4475} {"train_loss": -26.2139892578125, "global_step": 371479, "epoch": 4475} {"train_loss": -26.2109317779541, "global_step": 371480, "epoch": 4475} {"train_loss": -26.75678062438965, "global_step": 371481, "epoch": 4475} {"train_loss": -26.366165161132812, "global_step": 371482, "epoch": 4475} {"train_loss": -26.556324005126953, "global_step": 371483, "epoch": 4475} {"train_loss": -26.220901489257812, "global_step": 371484, "epoch": 4475} {"train_loss": -26.435745239257812, "global_step": 371485, "epoch": 4475} {"train_loss": -26.64276123046875, "global_step": 371486, "epoch": 4475} {"train_loss": -26.3515625, "global_step": 371487, "epoch": 4475} {"train_loss": -26.333484649658203, "global_step": 371488, "epoch": 4475} {"train_loss": -26.149656295776367, "global_step": 371489, "epoch": 4475} {"train_loss": -26.4763240814209, "global_step": 371490, "epoch": 4475} {"train_loss": -26.346593856811523, "global_step": 371491, "epoch": 4475} {"train_loss": -26.549274444580078, "global_step": 371492, "epoch": 4475} {"train_loss": -26.41326332092285, "global_step": 371493, "epoch": 4475} {"train_loss": -26.408735275268555, "global_step": 371494, "epoch": 4475} {"train_loss": -26.550872802734375, "global_step": 371495, "epoch": 4475} {"train_loss": -26.437397003173828, "global_step": 371496, "epoch": 4475} {"train_loss": -26.59088706970215, "global_step": 371497, "epoch": 4475} {"train_loss": -26.515058517456055, "global_step": 371498, "epoch": 4475} {"train_loss": -26.57354736328125, "global_step": 371499, "epoch": 4475} {"train_loss": -26.53618812561035, "global_step": 371500, "epoch": 4475} {"train_loss": -26.934661865234375, "global_step": 371501, "epoch": 4475} {"train_loss": -26.8099365234375, "global_step": 371502, "epoch": 4475} {"train_loss": -26.300580978393555, "global_step": 371503, "epoch": 4475} {"train_loss": -26.187864303588867, "global_step": 371504, "epoch": 4475} {"train_loss": -26.41796875, "global_step": 371505, "epoch": 4475} {"train_loss": -26.599023818969727, "global_step": 371506, "epoch": 4475} {"train_loss": -26.064837237438525, "global_step": 371507, "epoch": 4475, "val_loss": 6637918.0} {"train_loss": -24.994070053100586, "global_step": 371508, "epoch": 4476} {"train_loss": -23.085731506347656, "global_step": 371509, "epoch": 4476} {"train_loss": -24.862476348876953, "global_step": 371510, "epoch": 4476} {"train_loss": -25.74579429626465, "global_step": 371511, "epoch": 4476} {"train_loss": -25.80341148376465, "global_step": 371512, "epoch": 4476} {"train_loss": -25.7253360748291, "global_step": 371513, "epoch": 4476} {"train_loss": -25.822813034057617, "global_step": 371514, "epoch": 4476} {"train_loss": -25.8370418548584, "global_step": 371515, "epoch": 4476} {"train_loss": -26.126972198486328, "global_step": 371516, "epoch": 4476} {"train_loss": -26.081594467163086, "global_step": 371517, "epoch": 4476} {"train_loss": -26.210500717163086, "global_step": 371518, "epoch": 4476} {"train_loss": -25.896215438842773, "global_step": 371519, "epoch": 4476} {"train_loss": -26.251373291015625, "global_step": 371520, "epoch": 4476} {"train_loss": -26.422842025756836, "global_step": 371521, "epoch": 4476} {"train_loss": -26.28242301940918, "global_step": 371522, "epoch": 4476} {"train_loss": -26.15433120727539, "global_step": 371523, "epoch": 4476} {"train_loss": -26.4487247467041, "global_step": 371524, "epoch": 4476} {"train_loss": -26.35089111328125, "global_step": 371525, "epoch": 4476} {"train_loss": -26.148883819580078, "global_step": 371526, "epoch": 4476} {"train_loss": -26.374937057495117, "global_step": 371527, "epoch": 4476} {"train_loss": -26.442920684814453, "global_step": 371528, "epoch": 4476} {"train_loss": -26.121912002563477, "global_step": 371529, "epoch": 4476} {"train_loss": -26.414356231689453, "global_step": 371530, "epoch": 4476} {"train_loss": -26.331680297851562, "global_step": 371531, "epoch": 4476} {"train_loss": -26.143375396728516, "global_step": 371532, "epoch": 4476} {"train_loss": -26.471542358398438, "global_step": 371533, "epoch": 4476} {"train_loss": -25.94631004333496, "global_step": 371534, "epoch": 4476} {"train_loss": -26.335723876953125, "global_step": 371535, "epoch": 4476} {"train_loss": -26.8575382232666, "global_step": 371536, "epoch": 4476} {"train_loss": -26.388458251953125, "global_step": 371537, "epoch": 4476} {"train_loss": -26.517175674438477, "global_step": 371538, "epoch": 4476} {"train_loss": -26.80611228942871, "global_step": 371539, "epoch": 4476} {"train_loss": -26.73935890197754, "global_step": 371540, "epoch": 4476} {"train_loss": -26.421741485595703, "global_step": 371541, "epoch": 4476} {"train_loss": -26.582494735717773, "global_step": 371542, "epoch": 4476} {"train_loss": -26.112003326416016, "global_step": 371543, "epoch": 4476} {"train_loss": -26.41265869140625, "global_step": 371544, "epoch": 4476} {"train_loss": -26.6483211517334, "global_step": 371545, "epoch": 4476} {"train_loss": -26.788251876831055, "global_step": 371546, "epoch": 4476} {"train_loss": -26.31599235534668, "global_step": 371547, "epoch": 4476} {"train_loss": -26.456350326538086, "global_step": 371548, "epoch": 4476} {"train_loss": -26.78342056274414, "global_step": 371549, "epoch": 4476} {"train_loss": -26.32474708557129, "global_step": 371550, "epoch": 4476} {"train_loss": -26.472064971923828, "global_step": 371551, "epoch": 4476} {"train_loss": -26.425220489501953, "global_step": 371552, "epoch": 4476} {"train_loss": -26.357288360595703, "global_step": 371553, "epoch": 4476} {"train_loss": -25.990320205688477, "global_step": 371554, "epoch": 4476} {"train_loss": -26.4542236328125, "global_step": 371555, "epoch": 4476} {"train_loss": -26.514739990234375, "global_step": 371556, "epoch": 4476} {"train_loss": -26.197195053100586, "global_step": 371557, "epoch": 4476} {"train_loss": -26.84992790222168, "global_step": 371558, "epoch": 4476} {"train_loss": -26.05206298828125, "global_step": 371559, "epoch": 4476} {"train_loss": -26.436552047729492, "global_step": 371560, "epoch": 4476} {"train_loss": -26.621185302734375, "global_step": 371561, "epoch": 4476} {"train_loss": -26.45802116394043, "global_step": 371562, "epoch": 4476} {"train_loss": -26.39664077758789, "global_step": 371563, "epoch": 4476} {"train_loss": -26.207111358642578, "global_step": 371564, "epoch": 4476} {"train_loss": -26.207605361938477, "global_step": 371565, "epoch": 4476} {"train_loss": -26.578083038330078, "global_step": 371566, "epoch": 4476} {"train_loss": -26.701562881469727, "global_step": 371567, "epoch": 4476} {"train_loss": -26.497852325439453, "global_step": 371568, "epoch": 4476} {"train_loss": -26.441877365112305, "global_step": 371569, "epoch": 4476} {"train_loss": -26.495641708374023, "global_step": 371570, "epoch": 4476} {"train_loss": -26.218748092651367, "global_step": 371571, "epoch": 4476} {"train_loss": -26.526823043823242, "global_step": 371572, "epoch": 4476} {"train_loss": -26.547134399414062, "global_step": 371573, "epoch": 4476} {"train_loss": -26.649555206298828, "global_step": 371574, "epoch": 4476} {"train_loss": -26.266759872436523, "global_step": 371575, "epoch": 4476} {"train_loss": -26.29865837097168, "global_step": 371576, "epoch": 4476} {"train_loss": -26.398584365844727, "global_step": 371577, "epoch": 4476} {"train_loss": -26.406097412109375, "global_step": 371578, "epoch": 4476} {"train_loss": -25.961700439453125, "global_step": 371579, "epoch": 4476} {"train_loss": -26.080854415893555, "global_step": 371580, "epoch": 4476} {"train_loss": -25.90682029724121, "global_step": 371581, "epoch": 4476} {"train_loss": -26.7310733795166, "global_step": 371582, "epoch": 4476} {"train_loss": -26.490509033203125, "global_step": 371583, "epoch": 4476} {"train_loss": -26.48679542541504, "global_step": 371584, "epoch": 4476} {"train_loss": -25.954355239868164, "global_step": 371585, "epoch": 4476} {"train_loss": -26.7298583984375, "global_step": 371586, "epoch": 4476} {"train_loss": -26.284799575805664, "global_step": 371587, "epoch": 4476} {"train_loss": -26.38606834411621, "global_step": 371588, "epoch": 4476} {"train_loss": -26.252710342407227, "global_step": 371589, "epoch": 4476} {"train_loss": -26.27680148848568, "global_step": 371590, "epoch": 4476, "val_loss": 6615388.5} {"train_loss": -25.499053955078125, "global_step": 371591, "epoch": 4477} {"train_loss": -25.7500057220459, "global_step": 371592, "epoch": 4477} {"train_loss": -26.138452529907227, "global_step": 371593, "epoch": 4477} {"train_loss": -25.3513240814209, "global_step": 371594, "epoch": 4477} {"train_loss": -25.994672775268555, "global_step": 371595, "epoch": 4477} {"train_loss": -25.934375762939453, "global_step": 371596, "epoch": 4477} {"train_loss": -25.62967872619629, "global_step": 371597, "epoch": 4477} {"train_loss": -25.546932220458984, "global_step": 371598, "epoch": 4477} {"train_loss": -26.004858016967773, "global_step": 371599, "epoch": 4477} {"train_loss": -25.57216453552246, "global_step": 371600, "epoch": 4477} {"train_loss": -25.842575073242188, "global_step": 371601, "epoch": 4477} {"train_loss": -26.206281661987305, "global_step": 371602, "epoch": 4477} {"train_loss": -25.962814331054688, "global_step": 371603, "epoch": 4477} {"train_loss": -26.0955810546875, "global_step": 371604, "epoch": 4477} {"train_loss": -26.22486686706543, "global_step": 371605, "epoch": 4477} {"train_loss": -25.98592185974121, "global_step": 371606, "epoch": 4477} {"train_loss": -25.775238037109375, "global_step": 371607, "epoch": 4477} {"train_loss": -26.22112464904785, "global_step": 371608, "epoch": 4477} {"train_loss": -26.344985961914062, "global_step": 371609, "epoch": 4477} {"train_loss": -25.937124252319336, "global_step": 371610, "epoch": 4477} {"train_loss": -26.374780654907227, "global_step": 371611, "epoch": 4477} {"train_loss": -25.941913604736328, "global_step": 371612, "epoch": 4477} {"train_loss": -26.1071720123291, "global_step": 371613, "epoch": 4477} {"train_loss": -26.146188735961914, "global_step": 371614, "epoch": 4477} {"train_loss": -26.2961368560791, "global_step": 371615, "epoch": 4477} {"train_loss": -26.267627716064453, "global_step": 371616, "epoch": 4477} {"train_loss": -26.524518966674805, "global_step": 371617, "epoch": 4477} {"train_loss": -26.364200592041016, "global_step": 371618, "epoch": 4477} {"train_loss": -26.02923011779785, "global_step": 371619, "epoch": 4477} {"train_loss": -26.4571533203125, "global_step": 371620, "epoch": 4477} {"train_loss": -26.695667266845703, "global_step": 371621, "epoch": 4477} {"train_loss": -26.449506759643555, "global_step": 371622, "epoch": 4477} {"train_loss": -25.9558162689209, "global_step": 371623, "epoch": 4477} {"train_loss": -26.487293243408203, "global_step": 371624, "epoch": 4477} {"train_loss": -26.405805587768555, "global_step": 371625, "epoch": 4477} {"train_loss": -26.100189208984375, "global_step": 371626, "epoch": 4477} {"train_loss": -26.45255470275879, "global_step": 371627, "epoch": 4477} {"train_loss": -26.810916900634766, "global_step": 371628, "epoch": 4477} {"train_loss": -26.69647789001465, "global_step": 371629, "epoch": 4477} {"train_loss": -26.320877075195312, "global_step": 371630, "epoch": 4477} {"train_loss": -26.492963790893555, "global_step": 371631, "epoch": 4477} {"train_loss": -26.694753646850586, "global_step": 371632, "epoch": 4477} {"train_loss": -26.26018714904785, "global_step": 371633, "epoch": 4477} {"train_loss": -26.22991943359375, "global_step": 371634, "epoch": 4477} {"train_loss": -26.4798641204834, "global_step": 371635, "epoch": 4477} {"train_loss": -26.4116153717041, "global_step": 371636, "epoch": 4477} {"train_loss": -26.5748348236084, "global_step": 371637, "epoch": 4477} {"train_loss": -26.44856834411621, "global_step": 371638, "epoch": 4477} {"train_loss": -26.7863826751709, "global_step": 371639, "epoch": 4477} {"train_loss": -26.41619873046875, "global_step": 371640, "epoch": 4477} {"train_loss": -26.421436309814453, "global_step": 371641, "epoch": 4477} {"train_loss": -26.479333877563477, "global_step": 371642, "epoch": 4477} {"train_loss": -26.7700138092041, "global_step": 371643, "epoch": 4477} {"train_loss": -26.5152645111084, "global_step": 371644, "epoch": 4477} {"train_loss": -26.613662719726562, "global_step": 371645, "epoch": 4477} {"train_loss": -26.144636154174805, "global_step": 371646, "epoch": 4477} {"train_loss": -26.695068359375, "global_step": 371647, "epoch": 4477} {"train_loss": -26.188440322875977, "global_step": 371648, "epoch": 4477} {"train_loss": -26.375232696533203, "global_step": 371649, "epoch": 4477} {"train_loss": -26.69483757019043, "global_step": 371650, "epoch": 4477} {"train_loss": -26.687747955322266, "global_step": 371651, "epoch": 4477} {"train_loss": -26.90342140197754, "global_step": 371652, "epoch": 4477} {"train_loss": -26.57612419128418, "global_step": 371653, "epoch": 4477} {"train_loss": -26.396711349487305, "global_step": 371654, "epoch": 4477} {"train_loss": -26.133869171142578, "global_step": 371655, "epoch": 4477} {"train_loss": -26.465606689453125, "global_step": 371656, "epoch": 4477} {"train_loss": -26.753366470336914, "global_step": 371657, "epoch": 4477} {"train_loss": -26.4816837310791, "global_step": 371658, "epoch": 4477} {"train_loss": -26.165151596069336, "global_step": 371659, "epoch": 4477} {"train_loss": -26.575637817382812, "global_step": 371660, "epoch": 4477} {"train_loss": -26.140344619750977, "global_step": 371661, "epoch": 4477} {"train_loss": -26.706390380859375, "global_step": 371662, "epoch": 4477} {"train_loss": -26.34650230407715, "global_step": 371663, "epoch": 4477} {"train_loss": -26.284332275390625, "global_step": 371664, "epoch": 4477} {"train_loss": -26.72283363342285, "global_step": 371665, "epoch": 4477} {"train_loss": -26.52950096130371, "global_step": 371666, "epoch": 4477} {"train_loss": -26.500595092773438, "global_step": 371667, "epoch": 4477} {"train_loss": -26.631006240844727, "global_step": 371668, "epoch": 4477} {"train_loss": -26.599660873413086, "global_step": 371669, "epoch": 4477} {"train_loss": -26.050537109375, "global_step": 371670, "epoch": 4477} {"train_loss": -26.43585777282715, "global_step": 371671, "epoch": 4477} {"train_loss": -26.5056095123291, "global_step": 371672, "epoch": 4477} {"train_loss": -26.300346328551512, "global_step": 371673, "epoch": 4477, "val_loss": 6738122.0} {"train_loss": -26.3299617767334, "global_step": 371674, "epoch": 4478} {"train_loss": -25.720840454101562, "global_step": 371675, "epoch": 4478} {"train_loss": -26.024351119995117, "global_step": 371676, "epoch": 4478} {"train_loss": -25.27275276184082, "global_step": 371677, "epoch": 4478} {"train_loss": -25.730756759643555, "global_step": 371678, "epoch": 4478} {"train_loss": -25.803348541259766, "global_step": 371679, "epoch": 4478} {"train_loss": -26.21578025817871, "global_step": 371680, "epoch": 4478} {"train_loss": -25.921628952026367, "global_step": 371681, "epoch": 4478} {"train_loss": -25.954442977905273, "global_step": 371682, "epoch": 4478} {"train_loss": -25.184307098388672, "global_step": 371683, "epoch": 4478} {"train_loss": -26.2869873046875, "global_step": 371684, "epoch": 4478} {"train_loss": -25.905786514282227, "global_step": 371685, "epoch": 4478} {"train_loss": -25.703521728515625, "global_step": 371686, "epoch": 4478} {"train_loss": -25.957014083862305, "global_step": 371687, "epoch": 4478} {"train_loss": -25.97393226623535, "global_step": 371688, "epoch": 4478} {"train_loss": -26.015949249267578, "global_step": 371689, "epoch": 4478} {"train_loss": -26.044992446899414, "global_step": 371690, "epoch": 4478} {"train_loss": -26.14898681640625, "global_step": 371691, "epoch": 4478} {"train_loss": -26.004175186157227, "global_step": 371692, "epoch": 4478} {"train_loss": -26.319345474243164, "global_step": 371693, "epoch": 4478} {"train_loss": -26.229171752929688, "global_step": 371694, "epoch": 4478} {"train_loss": -25.8840389251709, "global_step": 371695, "epoch": 4478} {"train_loss": -26.37604331970215, "global_step": 371696, "epoch": 4478} {"train_loss": -26.189697265625, "global_step": 371697, "epoch": 4478} {"train_loss": -26.267080307006836, "global_step": 371698, "epoch": 4478} {"train_loss": -26.1937198638916, "global_step": 371699, "epoch": 4478} {"train_loss": -26.131458282470703, "global_step": 371700, "epoch": 4478} {"train_loss": -26.094074249267578, "global_step": 371701, "epoch": 4478} {"train_loss": -26.10309410095215, "global_step": 371702, "epoch": 4478} {"train_loss": -26.47389030456543, "global_step": 371703, "epoch": 4478} {"train_loss": -26.376829147338867, "global_step": 371704, "epoch": 4478} {"train_loss": -26.206348419189453, "global_step": 371705, "epoch": 4478} {"train_loss": -26.026718139648438, "global_step": 371706, "epoch": 4478} {"train_loss": -26.459949493408203, "global_step": 371707, "epoch": 4478} {"train_loss": -26.356149673461914, "global_step": 371708, "epoch": 4478} {"train_loss": -26.568326950073242, "global_step": 371709, "epoch": 4478} {"train_loss": -26.094858169555664, "global_step": 371710, "epoch": 4478} {"train_loss": -26.451948165893555, "global_step": 371711, "epoch": 4478} {"train_loss": -26.267953872680664, "global_step": 371712, "epoch": 4478} {"train_loss": -26.899229049682617, "global_step": 371713, "epoch": 4478} {"train_loss": -26.261011123657227, "global_step": 371714, "epoch": 4478} {"train_loss": -26.672449111938477, "global_step": 371715, "epoch": 4478} {"train_loss": -26.617834091186523, "global_step": 371716, "epoch": 4478} {"train_loss": -26.359888076782227, "global_step": 371717, "epoch": 4478} {"train_loss": -26.14582633972168, "global_step": 371718, "epoch": 4478} {"train_loss": -26.17518424987793, "global_step": 371719, "epoch": 4478} {"train_loss": -25.58639907836914, "global_step": 371720, "epoch": 4478} {"train_loss": -26.194507598876953, "global_step": 371721, "epoch": 4478} {"train_loss": -26.527441024780273, "global_step": 371722, "epoch": 4478} {"train_loss": -25.817487716674805, "global_step": 371723, "epoch": 4478} {"train_loss": -26.601455688476562, "global_step": 371724, "epoch": 4478} {"train_loss": -26.573638916015625, "global_step": 371725, "epoch": 4478} {"train_loss": -26.134002685546875, "global_step": 371726, "epoch": 4478} {"train_loss": -26.69483757019043, "global_step": 371727, "epoch": 4478} {"train_loss": -26.206266403198242, "global_step": 371728, "epoch": 4478} {"train_loss": -26.31475830078125, "global_step": 371729, "epoch": 4478} {"train_loss": -26.377439498901367, "global_step": 371730, "epoch": 4478} {"train_loss": -26.522687911987305, "global_step": 371731, "epoch": 4478} {"train_loss": -26.40394401550293, "global_step": 371732, "epoch": 4478} {"train_loss": -26.325763702392578, "global_step": 371733, "epoch": 4478} {"train_loss": -26.617643356323242, "global_step": 371734, "epoch": 4478} {"train_loss": -26.446964263916016, "global_step": 371735, "epoch": 4478} {"train_loss": -26.4996280670166, "global_step": 371736, "epoch": 4478} {"train_loss": -26.413129806518555, "global_step": 371737, "epoch": 4478} {"train_loss": -26.46626091003418, "global_step": 371738, "epoch": 4478} {"train_loss": -26.824087142944336, "global_step": 371739, "epoch": 4478} {"train_loss": -26.441022872924805, "global_step": 371740, "epoch": 4478} {"train_loss": -26.279300689697266, "global_step": 371741, "epoch": 4478} {"train_loss": -26.426074981689453, "global_step": 371742, "epoch": 4478} {"train_loss": -26.493452072143555, "global_step": 371743, "epoch": 4478} {"train_loss": -26.471296310424805, "global_step": 371744, "epoch": 4478} {"train_loss": -26.183324813842773, "global_step": 371745, "epoch": 4478} {"train_loss": -26.613332748413086, "global_step": 371746, "epoch": 4478} {"train_loss": -26.5156307220459, "global_step": 371747, "epoch": 4478} {"train_loss": -26.721670150756836, "global_step": 371748, "epoch": 4478} {"train_loss": -26.630115509033203, "global_step": 371749, "epoch": 4478} {"train_loss": -26.1944637298584, "global_step": 371750, "epoch": 4478} {"train_loss": -26.678869247436523, "global_step": 371751, "epoch": 4478} {"train_loss": -26.970373153686523, "global_step": 371752, "epoch": 4478} {"train_loss": -26.693140029907227, "global_step": 371753, "epoch": 4478} {"train_loss": -26.239002227783203, "global_step": 371754, "epoch": 4478} {"train_loss": -26.28713035583496, "global_step": 371755, "epoch": 4478} {"train_loss": -26.272394019437122, "global_step": 371756, "epoch": 4478, "val_loss": 6681316.0} {"train_loss": -25.744348526000977, "global_step": 371757, "epoch": 4479} {"train_loss": -25.646411895751953, "global_step": 371758, "epoch": 4479} {"train_loss": -25.423864364624023, "global_step": 371759, "epoch": 4479} {"train_loss": -24.69089698791504, "global_step": 371760, "epoch": 4479} {"train_loss": -25.27692413330078, "global_step": 371761, "epoch": 4479} {"train_loss": -25.893329620361328, "global_step": 371762, "epoch": 4479} {"train_loss": -25.583097457885742, "global_step": 371763, "epoch": 4479} {"train_loss": -25.813207626342773, "global_step": 371764, "epoch": 4479} {"train_loss": -25.84861183166504, "global_step": 371765, "epoch": 4479} {"train_loss": -25.678693771362305, "global_step": 371766, "epoch": 4479} {"train_loss": -26.062936782836914, "global_step": 371767, "epoch": 4479} {"train_loss": -25.3730525970459, "global_step": 371768, "epoch": 4479} {"train_loss": -25.613971710205078, "global_step": 371769, "epoch": 4479} {"train_loss": -25.854215621948242, "global_step": 371770, "epoch": 4479} {"train_loss": -25.66486167907715, "global_step": 371771, "epoch": 4479} {"train_loss": -25.707284927368164, "global_step": 371772, "epoch": 4479} {"train_loss": -25.989492416381836, "global_step": 371773, "epoch": 4479} {"train_loss": -25.854373931884766, "global_step": 371774, "epoch": 4479} {"train_loss": -26.064239501953125, "global_step": 371775, "epoch": 4479} {"train_loss": -26.090124130249023, "global_step": 371776, "epoch": 4479} {"train_loss": -25.972003936767578, "global_step": 371777, "epoch": 4479} {"train_loss": -26.125646591186523, "global_step": 371778, "epoch": 4479} {"train_loss": -26.013931274414062, "global_step": 371779, "epoch": 4479} {"train_loss": -26.033756256103516, "global_step": 371780, "epoch": 4479} {"train_loss": -26.1799373626709, "global_step": 371781, "epoch": 4479} {"train_loss": -26.063568115234375, "global_step": 371782, "epoch": 4479} {"train_loss": -26.21816062927246, "global_step": 371783, "epoch": 4479} {"train_loss": -25.74175453186035, "global_step": 371784, "epoch": 4479} {"train_loss": -26.301725387573242, "global_step": 371785, "epoch": 4479} {"train_loss": -26.050765991210938, "global_step": 371786, "epoch": 4479} {"train_loss": -26.640522003173828, "global_step": 371787, "epoch": 4479} {"train_loss": -26.284711837768555, "global_step": 371788, "epoch": 4479} {"train_loss": -26.787799835205078, "global_step": 371789, "epoch": 4479} {"train_loss": -26.465850830078125, "global_step": 371790, "epoch": 4479} {"train_loss": -26.22951316833496, "global_step": 371791, "epoch": 4479} {"train_loss": -26.078710556030273, "global_step": 371792, "epoch": 4479} {"train_loss": -26.472806930541992, "global_step": 371793, "epoch": 4479} {"train_loss": -26.775379180908203, "global_step": 371794, "epoch": 4479} {"train_loss": -26.347272872924805, "global_step": 371795, "epoch": 4479} {"train_loss": -26.53706932067871, "global_step": 371796, "epoch": 4479} {"train_loss": -26.082624435424805, "global_step": 371797, "epoch": 4479} {"train_loss": -26.211889266967773, "global_step": 371798, "epoch": 4479} {"train_loss": -26.274246215820312, "global_step": 371799, "epoch": 4479} {"train_loss": -26.475915908813477, "global_step": 371800, "epoch": 4479} {"train_loss": -26.59650230407715, "global_step": 371801, "epoch": 4479} {"train_loss": -26.563207626342773, "global_step": 371802, "epoch": 4479} {"train_loss": -26.480655670166016, "global_step": 371803, "epoch": 4479} {"train_loss": -26.52878189086914, "global_step": 371804, "epoch": 4479} {"train_loss": -26.374984741210938, "global_step": 371805, "epoch": 4479} {"train_loss": -26.47000503540039, "global_step": 371806, "epoch": 4479} {"train_loss": -26.3214111328125, "global_step": 371807, "epoch": 4479} {"train_loss": -26.914459228515625, "global_step": 371808, "epoch": 4479} {"train_loss": -26.229572296142578, "global_step": 371809, "epoch": 4479} {"train_loss": -26.328977584838867, "global_step": 371810, "epoch": 4479} {"train_loss": -26.513410568237305, "global_step": 371811, "epoch": 4479} {"train_loss": -26.697620391845703, "global_step": 371812, "epoch": 4479} {"train_loss": -26.479345321655273, "global_step": 371813, "epoch": 4479} {"train_loss": -26.380828857421875, "global_step": 371814, "epoch": 4479} {"train_loss": -26.341327667236328, "global_step": 371815, "epoch": 4479} {"train_loss": -26.43697166442871, "global_step": 371816, "epoch": 4479} {"train_loss": -26.38848304748535, "global_step": 371817, "epoch": 4479} {"train_loss": -26.531579971313477, "global_step": 371818, "epoch": 4479} {"train_loss": -26.473981857299805, "global_step": 371819, "epoch": 4479} {"train_loss": -26.000598907470703, "global_step": 371820, "epoch": 4479} {"train_loss": -26.395421981811523, "global_step": 371821, "epoch": 4479} {"train_loss": -26.091115951538086, "global_step": 371822, "epoch": 4479} {"train_loss": -26.229145050048828, "global_step": 371823, "epoch": 4479} {"train_loss": -26.084314346313477, "global_step": 371824, "epoch": 4479} {"train_loss": -26.152257919311523, "global_step": 371825, "epoch": 4479} {"train_loss": -25.234872817993164, "global_step": 371826, "epoch": 4479} {"train_loss": -25.074440002441406, "global_step": 371827, "epoch": 4479} {"train_loss": -25.667621612548828, "global_step": 371828, "epoch": 4479} {"train_loss": -25.51910972595215, "global_step": 371829, "epoch": 4479} {"train_loss": -26.49123191833496, "global_step": 371830, "epoch": 4479} {"train_loss": -26.037649154663086, "global_step": 371831, "epoch": 4479} {"train_loss": -25.987274169921875, "global_step": 371832, "epoch": 4479} {"train_loss": -26.474695205688477, "global_step": 371833, "epoch": 4479} {"train_loss": -26.118173599243164, "global_step": 371834, "epoch": 4479} {"train_loss": -26.339887619018555, "global_step": 371835, "epoch": 4479} {"train_loss": -26.155689239501953, "global_step": 371836, "epoch": 4479} {"train_loss": -26.052005767822266, "global_step": 371837, "epoch": 4479} {"train_loss": -26.134809494018555, "global_step": 371838, "epoch": 4479} {"train_loss": -26.105883035315088, "global_step": 371839, "epoch": 4479, "val_loss": 6648902.0} {"train_loss": -25.899871826171875, "global_step": 371840, "epoch": 4480} {"train_loss": -25.588848114013672, "global_step": 371841, "epoch": 4480} {"train_loss": -25.986303329467773, "global_step": 371842, "epoch": 4480} {"train_loss": -25.603225708007812, "global_step": 371843, "epoch": 4480} {"train_loss": -25.90288734436035, "global_step": 371844, "epoch": 4480} {"train_loss": -25.81333351135254, "global_step": 371845, "epoch": 4480} {"train_loss": -26.0908203125, "global_step": 371846, "epoch": 4480} {"train_loss": -25.895721435546875, "global_step": 371847, "epoch": 4480} {"train_loss": -26.11393165588379, "global_step": 371848, "epoch": 4480} {"train_loss": -25.864511489868164, "global_step": 371849, "epoch": 4480} {"train_loss": -25.946582794189453, "global_step": 371850, "epoch": 4480} {"train_loss": -25.697824478149414, "global_step": 371851, "epoch": 4480} {"train_loss": -25.965051651000977, "global_step": 371852, "epoch": 4480} {"train_loss": -25.982526779174805, "global_step": 371853, "epoch": 4480} {"train_loss": -26.150177001953125, "global_step": 371854, "epoch": 4480} {"train_loss": -26.010894775390625, "global_step": 371855, "epoch": 4480} {"train_loss": -26.218158721923828, "global_step": 371856, "epoch": 4480} {"train_loss": -25.72298240661621, "global_step": 371857, "epoch": 4480} {"train_loss": -26.354816436767578, "global_step": 371858, "epoch": 4480} {"train_loss": -26.186742782592773, "global_step": 371859, "epoch": 4480} {"train_loss": -26.050329208374023, "global_step": 371860, "epoch": 4480} {"train_loss": -26.117053985595703, "global_step": 371861, "epoch": 4480} {"train_loss": -26.3347225189209, "global_step": 371862, "epoch": 4480} {"train_loss": -26.21510887145996, "global_step": 371863, "epoch": 4480} {"train_loss": -25.91510581970215, "global_step": 371864, "epoch": 4480} {"train_loss": -26.480756759643555, "global_step": 371865, "epoch": 4480} {"train_loss": -26.361913681030273, "global_step": 371866, "epoch": 4480} {"train_loss": -26.4906063079834, "global_step": 371867, "epoch": 4480} {"train_loss": -25.86610221862793, "global_step": 371868, "epoch": 4480} {"train_loss": -26.20868492126465, "global_step": 371869, "epoch": 4480} {"train_loss": -26.18171501159668, "global_step": 371870, "epoch": 4480} {"train_loss": -26.42461585998535, "global_step": 371871, "epoch": 4480} {"train_loss": -26.137069702148438, "global_step": 371872, "epoch": 4480} {"train_loss": -26.33108901977539, "global_step": 371873, "epoch": 4480} {"train_loss": -26.42339515686035, "global_step": 371874, "epoch": 4480} {"train_loss": -26.278772354125977, "global_step": 371875, "epoch": 4480} {"train_loss": -26.240528106689453, "global_step": 371876, "epoch": 4480} {"train_loss": -26.453222274780273, "global_step": 371877, "epoch": 4480} {"train_loss": -26.177961349487305, "global_step": 371878, "epoch": 4480} {"train_loss": -26.63563346862793, "global_step": 371879, "epoch": 4480} {"train_loss": -26.628345489501953, "global_step": 371880, "epoch": 4480} {"train_loss": -26.29701042175293, "global_step": 371881, "epoch": 4480} {"train_loss": -26.47857666015625, "global_step": 371882, "epoch": 4480} {"train_loss": -26.680341720581055, "global_step": 371883, "epoch": 4480} {"train_loss": -26.386945724487305, "global_step": 371884, "epoch": 4480} {"train_loss": -26.69312858581543, "global_step": 371885, "epoch": 4480} {"train_loss": -26.323108673095703, "global_step": 371886, "epoch": 4480} {"train_loss": -26.573368072509766, "global_step": 371887, "epoch": 4480} {"train_loss": -26.366867065429688, "global_step": 371888, "epoch": 4480} {"train_loss": -26.596967697143555, "global_step": 371889, "epoch": 4480} {"train_loss": -26.610172271728516, "global_step": 371890, "epoch": 4480} {"train_loss": -26.684101104736328, "global_step": 371891, "epoch": 4480} {"train_loss": -26.305883407592773, "global_step": 371892, "epoch": 4480} {"train_loss": -26.695966720581055, "global_step": 371893, "epoch": 4480} {"train_loss": -26.77251625061035, "global_step": 371894, "epoch": 4480} {"train_loss": -26.4345703125, "global_step": 371895, "epoch": 4480} {"train_loss": -26.77473258972168, "global_step": 371896, "epoch": 4480} {"train_loss": -26.568689346313477, "global_step": 371897, "epoch": 4480} {"train_loss": -26.783674240112305, "global_step": 371898, "epoch": 4480} {"train_loss": -26.428680419921875, "global_step": 371899, "epoch": 4480} {"train_loss": -26.252309799194336, "global_step": 371900, "epoch": 4480} {"train_loss": -26.34986686706543, "global_step": 371901, "epoch": 4480} {"train_loss": -26.696943283081055, "global_step": 371902, "epoch": 4480} {"train_loss": -26.489673614501953, "global_step": 371903, "epoch": 4480} {"train_loss": -26.418298721313477, "global_step": 371904, "epoch": 4480} {"train_loss": -26.64263343811035, "global_step": 371905, "epoch": 4480} {"train_loss": -26.34126853942871, "global_step": 371906, "epoch": 4480} {"train_loss": -26.421594619750977, "global_step": 371907, "epoch": 4480} {"train_loss": -26.415430068969727, "global_step": 371908, "epoch": 4480} {"train_loss": -26.530805587768555, "global_step": 371909, "epoch": 4480} {"train_loss": -25.76211929321289, "global_step": 371910, "epoch": 4480} {"train_loss": -25.789396286010742, "global_step": 371911, "epoch": 4480} {"train_loss": -25.88694190979004, "global_step": 371912, "epoch": 4480} {"train_loss": -25.343280792236328, "global_step": 371913, "epoch": 4480} {"train_loss": -25.562589645385742, "global_step": 371914, "epoch": 4480} {"train_loss": -25.618741989135742, "global_step": 371915, "epoch": 4480} {"train_loss": -26.470386505126953, "global_step": 371916, "epoch": 4480} {"train_loss": -25.793283462524414, "global_step": 371917, "epoch": 4480} {"train_loss": -26.139270782470703, "global_step": 371918, "epoch": 4480} {"train_loss": -26.4169864654541, "global_step": 371919, "epoch": 4480} {"train_loss": -26.024383544921875, "global_step": 371920, "epoch": 4480} {"train_loss": -26.169538497924805, "global_step": 371921, "epoch": 4480} {"train_loss": -26.23136341140931, "global_step": 371922, "epoch": 4480, "val_loss": 6693090.0} {"train_loss": -25.88938331604004, "global_step": 371923, "epoch": 4481} {"train_loss": -25.64841079711914, "global_step": 371924, "epoch": 4481} {"train_loss": -26.003644943237305, "global_step": 371925, "epoch": 4481} {"train_loss": -26.207416534423828, "global_step": 371926, "epoch": 4481} {"train_loss": -26.208600997924805, "global_step": 371927, "epoch": 4481} {"train_loss": -25.423513412475586, "global_step": 371928, "epoch": 4481} {"train_loss": -26.200729370117188, "global_step": 371929, "epoch": 4481} {"train_loss": -25.672256469726562, "global_step": 371930, "epoch": 4481} {"train_loss": -26.165571212768555, "global_step": 371931, "epoch": 4481} {"train_loss": -25.800735473632812, "global_step": 371932, "epoch": 4481} {"train_loss": -25.858396530151367, "global_step": 371933, "epoch": 4481} {"train_loss": -25.850269317626953, "global_step": 371934, "epoch": 4481} {"train_loss": -25.974639892578125, "global_step": 371935, "epoch": 4481} {"train_loss": -26.0545597076416, "global_step": 371936, "epoch": 4481} {"train_loss": -25.975234985351562, "global_step": 371937, "epoch": 4481} {"train_loss": -26.362268447875977, "global_step": 371938, "epoch": 4481} {"train_loss": -26.523975372314453, "global_step": 371939, "epoch": 4481} {"train_loss": -26.048933029174805, "global_step": 371940, "epoch": 4481} {"train_loss": -26.545347213745117, "global_step": 371941, "epoch": 4481} {"train_loss": -26.207178115844727, "global_step": 371942, "epoch": 4481} {"train_loss": -26.281036376953125, "global_step": 371943, "epoch": 4481} {"train_loss": -26.294143676757812, "global_step": 371944, "epoch": 4481} {"train_loss": -26.055450439453125, "global_step": 371945, "epoch": 4481} {"train_loss": -26.38837242126465, "global_step": 371946, "epoch": 4481} {"train_loss": -26.631580352783203, "global_step": 371947, "epoch": 4481} {"train_loss": -26.41594886779785, "global_step": 371948, "epoch": 4481} {"train_loss": -26.498685836791992, "global_step": 371949, "epoch": 4481} {"train_loss": -26.619216918945312, "global_step": 371950, "epoch": 4481} {"train_loss": -26.24309730529785, "global_step": 371951, "epoch": 4481} {"train_loss": -26.730566024780273, "global_step": 371952, "epoch": 4481} {"train_loss": -26.493579864501953, "global_step": 371953, "epoch": 4481} {"train_loss": -26.41263198852539, "global_step": 371954, "epoch": 4481} {"train_loss": -26.42960548400879, "global_step": 371955, "epoch": 4481} {"train_loss": -26.74518394470215, "global_step": 371956, "epoch": 4481} {"train_loss": -26.456953048706055, "global_step": 371957, "epoch": 4481} {"train_loss": -26.70026206970215, "global_step": 371958, "epoch": 4481} {"train_loss": -26.38459587097168, "global_step": 371959, "epoch": 4481} {"train_loss": -26.423078536987305, "global_step": 371960, "epoch": 4481} {"train_loss": -26.255643844604492, "global_step": 371961, "epoch": 4481} {"train_loss": -26.260892868041992, "global_step": 371962, "epoch": 4481} {"train_loss": -26.473630905151367, "global_step": 371963, "epoch": 4481} {"train_loss": -26.58211326599121, "global_step": 371964, "epoch": 4481} {"train_loss": -26.667484283447266, "global_step": 371965, "epoch": 4481} {"train_loss": -26.498611450195312, "global_step": 371966, "epoch": 4481} {"train_loss": -26.69540786743164, "global_step": 371967, "epoch": 4481} {"train_loss": -26.169157028198242, "global_step": 371968, "epoch": 4481} {"train_loss": -26.01349449157715, "global_step": 371969, "epoch": 4481} {"train_loss": -26.537647247314453, "global_step": 371970, "epoch": 4481} {"train_loss": -26.275014877319336, "global_step": 371971, "epoch": 4481} {"train_loss": -26.43910026550293, "global_step": 371972, "epoch": 4481} {"train_loss": -26.399658203125, "global_step": 371973, "epoch": 4481} {"train_loss": -26.298934936523438, "global_step": 371974, "epoch": 4481} {"train_loss": -26.784521102905273, "global_step": 371975, "epoch": 4481} {"train_loss": -26.61820411682129, "global_step": 371976, "epoch": 4481} {"train_loss": -26.17665672302246, "global_step": 371977, "epoch": 4481} {"train_loss": -26.511083602905273, "global_step": 371978, "epoch": 4481} {"train_loss": -26.677595138549805, "global_step": 371979, "epoch": 4481} {"train_loss": -26.334003448486328, "global_step": 371980, "epoch": 4481} {"train_loss": -25.943527221679688, "global_step": 371981, "epoch": 4481} {"train_loss": -26.342315673828125, "global_step": 371982, "epoch": 4481} {"train_loss": -26.07703971862793, "global_step": 371983, "epoch": 4481} {"train_loss": -26.685230255126953, "global_step": 371984, "epoch": 4481} {"train_loss": -26.440326690673828, "global_step": 371985, "epoch": 4481} {"train_loss": -26.687854766845703, "global_step": 371986, "epoch": 4481} {"train_loss": -26.336149215698242, "global_step": 371987, "epoch": 4481} {"train_loss": -26.5185546875, "global_step": 371988, "epoch": 4481} {"train_loss": -26.176496505737305, "global_step": 371989, "epoch": 4481} {"train_loss": -26.32355308532715, "global_step": 371990, "epoch": 4481} {"train_loss": -26.513479232788086, "global_step": 371991, "epoch": 4481} {"train_loss": -26.25324058532715, "global_step": 371992, "epoch": 4481} {"train_loss": -25.962615966796875, "global_step": 371993, "epoch": 4481} {"train_loss": -26.313861846923828, "global_step": 371994, "epoch": 4481} {"train_loss": -25.7896728515625, "global_step": 371995, "epoch": 4481} {"train_loss": -26.359975814819336, "global_step": 371996, "epoch": 4481} {"train_loss": -26.318408966064453, "global_step": 371997, "epoch": 4481} {"train_loss": -26.508197784423828, "global_step": 371998, "epoch": 4481} {"train_loss": -26.273193359375, "global_step": 371999, "epoch": 4481} {"train_loss": -26.355146408081055, "global_step": 372000, "epoch": 4481} {"train_loss": -26.254804611206055, "global_step": 372001, "epoch": 4481} {"train_loss": -25.725244522094727, "global_step": 372002, "epoch": 4481} {"train_loss": -26.027074813842773, "global_step": 372003, "epoch": 4481} {"train_loss": -26.280797958374023, "global_step": 372004, "epoch": 4481} {"train_loss": -26.301905689469304, "global_step": 372005, "epoch": 4481, "val_loss": 6658895.0} {"train_loss": -25.800674438476562, "global_step": 372006, "epoch": 4482} {"train_loss": -25.857391357421875, "global_step": 372007, "epoch": 4482} {"train_loss": -25.86330223083496, "global_step": 372008, "epoch": 4482} {"train_loss": -25.92520523071289, "global_step": 372009, "epoch": 4482} {"train_loss": -26.332853317260742, "global_step": 372010, "epoch": 4482} {"train_loss": -26.16395378112793, "global_step": 372011, "epoch": 4482} {"train_loss": -25.935007095336914, "global_step": 372012, "epoch": 4482} {"train_loss": -25.812742233276367, "global_step": 372013, "epoch": 4482} {"train_loss": -26.219995498657227, "global_step": 372014, "epoch": 4482} {"train_loss": -26.034570693969727, "global_step": 372015, "epoch": 4482} {"train_loss": -26.304519653320312, "global_step": 372016, "epoch": 4482} {"train_loss": -26.33259391784668, "global_step": 372017, "epoch": 4482} {"train_loss": -26.250507354736328, "global_step": 372018, "epoch": 4482} {"train_loss": -26.544225692749023, "global_step": 372019, "epoch": 4482} {"train_loss": -26.324914932250977, "global_step": 372020, "epoch": 4482} {"train_loss": -26.472015380859375, "global_step": 372021, "epoch": 4482} {"train_loss": -25.981420516967773, "global_step": 372022, "epoch": 4482} {"train_loss": -25.998859405517578, "global_step": 372023, "epoch": 4482} {"train_loss": -26.008697509765625, "global_step": 372024, "epoch": 4482} {"train_loss": -26.474048614501953, "global_step": 372025, "epoch": 4482} {"train_loss": -26.339075088500977, "global_step": 372026, "epoch": 4482} {"train_loss": -26.67120361328125, "global_step": 372027, "epoch": 4482} {"train_loss": -26.442413330078125, "global_step": 372028, "epoch": 4482} {"train_loss": -26.117517471313477, "global_step": 372029, "epoch": 4482} {"train_loss": -26.438282012939453, "global_step": 372030, "epoch": 4482} {"train_loss": -26.432586669921875, "global_step": 372031, "epoch": 4482} {"train_loss": -26.598413467407227, "global_step": 372032, "epoch": 4482} {"train_loss": -26.382104873657227, "global_step": 372033, "epoch": 4482} {"train_loss": -26.75681495666504, "global_step": 372034, "epoch": 4482} {"train_loss": -26.254531860351562, "global_step": 372035, "epoch": 4482} {"train_loss": -26.209394454956055, "global_step": 372036, "epoch": 4482} {"train_loss": -26.183740615844727, "global_step": 372037, "epoch": 4482} {"train_loss": -26.43192481994629, "global_step": 372038, "epoch": 4482} {"train_loss": -26.571577072143555, "global_step": 372039, "epoch": 4482} {"train_loss": -26.842849731445312, "global_step": 372040, "epoch": 4482} {"train_loss": -26.663105010986328, "global_step": 372041, "epoch": 4482} {"train_loss": -26.51325798034668, "global_step": 372042, "epoch": 4482} {"train_loss": -26.825544357299805, "global_step": 372043, "epoch": 4482} {"train_loss": -26.708654403686523, "global_step": 372044, "epoch": 4482} {"train_loss": -26.360370635986328, "global_step": 372045, "epoch": 4482} {"train_loss": -26.5074462890625, "global_step": 372046, "epoch": 4482} {"train_loss": -26.650466918945312, "global_step": 372047, "epoch": 4482} {"train_loss": -26.5853328704834, "global_step": 372048, "epoch": 4482} {"train_loss": -26.541067123413086, "global_step": 372049, "epoch": 4482} {"train_loss": -26.4051513671875, "global_step": 372050, "epoch": 4482} {"train_loss": -26.863372802734375, "global_step": 372051, "epoch": 4482} {"train_loss": -26.408994674682617, "global_step": 372052, "epoch": 4482} {"train_loss": -26.044757843017578, "global_step": 372053, "epoch": 4482} {"train_loss": -26.668521881103516, "global_step": 372054, "epoch": 4482} {"train_loss": -25.866455078125, "global_step": 372055, "epoch": 4482} {"train_loss": -26.503873825073242, "global_step": 372056, "epoch": 4482} {"train_loss": -26.465625762939453, "global_step": 372057, "epoch": 4482} {"train_loss": -26.1679630279541, "global_step": 372058, "epoch": 4482} {"train_loss": -26.506086349487305, "global_step": 372059, "epoch": 4482} {"train_loss": -26.767139434814453, "global_step": 372060, "epoch": 4482} {"train_loss": -26.670440673828125, "global_step": 372061, "epoch": 4482} {"train_loss": -26.187152862548828, "global_step": 372062, "epoch": 4482} {"train_loss": -26.6739559173584, "global_step": 372063, "epoch": 4482} {"train_loss": -26.52985954284668, "global_step": 372064, "epoch": 4482} {"train_loss": -26.423261642456055, "global_step": 372065, "epoch": 4482} {"train_loss": -26.988723754882812, "global_step": 372066, "epoch": 4482} {"train_loss": -26.661758422851562, "global_step": 372067, "epoch": 4482} {"train_loss": -26.81101417541504, "global_step": 372068, "epoch": 4482} {"train_loss": -26.367773056030273, "global_step": 372069, "epoch": 4482} {"train_loss": -26.522939682006836, "global_step": 372070, "epoch": 4482} {"train_loss": -26.685651779174805, "global_step": 372071, "epoch": 4482} {"train_loss": -26.500843048095703, "global_step": 372072, "epoch": 4482} {"train_loss": -26.76832389831543, "global_step": 372073, "epoch": 4482} {"train_loss": -26.237546920776367, "global_step": 372074, "epoch": 4482} {"train_loss": -26.622467041015625, "global_step": 372075, "epoch": 4482} {"train_loss": -26.4669132232666, "global_step": 372076, "epoch": 4482} {"train_loss": -26.630456924438477, "global_step": 372077, "epoch": 4482} {"train_loss": -26.597410202026367, "global_step": 372078, "epoch": 4482} {"train_loss": -26.271162033081055, "global_step": 372079, "epoch": 4482} {"train_loss": -26.65768814086914, "global_step": 372080, "epoch": 4482} {"train_loss": -26.432851791381836, "global_step": 372081, "epoch": 4482} {"train_loss": -26.451923370361328, "global_step": 372082, "epoch": 4482} {"train_loss": -26.57453727722168, "global_step": 372083, "epoch": 4482} {"train_loss": -26.226409912109375, "global_step": 372084, "epoch": 4482} {"train_loss": -26.294525146484375, "global_step": 372085, "epoch": 4482} {"train_loss": -26.582590103149414, "global_step": 372086, "epoch": 4482} {"train_loss": -26.305633544921875, "global_step": 372087, "epoch": 4482} {"train_loss": -26.380073524383178, "global_step": 372088, "epoch": 4482, "val_loss": 6611428.0} {"train_loss": -25.550046920776367, "global_step": 372089, "epoch": 4483} {"train_loss": -25.210529327392578, "global_step": 372090, "epoch": 4483} {"train_loss": -25.31089973449707, "global_step": 372091, "epoch": 4483} {"train_loss": -25.862646102905273, "global_step": 372092, "epoch": 4483} {"train_loss": -25.860809326171875, "global_step": 372093, "epoch": 4483} {"train_loss": -26.255828857421875, "global_step": 372094, "epoch": 4483} {"train_loss": -25.862903594970703, "global_step": 372095, "epoch": 4483} {"train_loss": -26.112537384033203, "global_step": 372096, "epoch": 4483} {"train_loss": -26.27753257751465, "global_step": 372097, "epoch": 4483} {"train_loss": -26.426477432250977, "global_step": 372098, "epoch": 4483} {"train_loss": -25.98910903930664, "global_step": 372099, "epoch": 4483} {"train_loss": -26.232084274291992, "global_step": 372100, "epoch": 4483} {"train_loss": -26.417423248291016, "global_step": 372101, "epoch": 4483} {"train_loss": -25.989171981811523, "global_step": 372102, "epoch": 4483} {"train_loss": -26.13184928894043, "global_step": 372103, "epoch": 4483} {"train_loss": -26.3270206451416, "global_step": 372104, "epoch": 4483} {"train_loss": -25.981998443603516, "global_step": 372105, "epoch": 4483} {"train_loss": -26.0366268157959, "global_step": 372106, "epoch": 4483} {"train_loss": -26.384750366210938, "global_step": 372107, "epoch": 4483} {"train_loss": -26.136545181274414, "global_step": 372108, "epoch": 4483} {"train_loss": -26.30840492248535, "global_step": 372109, "epoch": 4483} {"train_loss": -26.138525009155273, "global_step": 372110, "epoch": 4483} {"train_loss": -26.807336807250977, "global_step": 372111, "epoch": 4483} {"train_loss": -26.30386734008789, "global_step": 372112, "epoch": 4483} {"train_loss": -26.436429977416992, "global_step": 372113, "epoch": 4483} {"train_loss": -26.35059928894043, "global_step": 372114, "epoch": 4483} {"train_loss": -26.322168350219727, "global_step": 372115, "epoch": 4483} {"train_loss": -26.15150260925293, "global_step": 372116, "epoch": 4483} {"train_loss": -26.1184139251709, "global_step": 372117, "epoch": 4483} {"train_loss": -26.69654655456543, "global_step": 372118, "epoch": 4483} {"train_loss": -26.677234649658203, "global_step": 372119, "epoch": 4483} {"train_loss": -26.874937057495117, "global_step": 372120, "epoch": 4483} {"train_loss": -26.385089874267578, "global_step": 372121, "epoch": 4483} {"train_loss": -26.639942169189453, "global_step": 372122, "epoch": 4483} {"train_loss": -26.51531982421875, "global_step": 372123, "epoch": 4483} {"train_loss": -26.376785278320312, "global_step": 372124, "epoch": 4483} {"train_loss": -27.172245025634766, "global_step": 372125, "epoch": 4483} {"train_loss": -26.271087646484375, "global_step": 372126, "epoch": 4483} {"train_loss": -26.195768356323242, "global_step": 372127, "epoch": 4483} {"train_loss": -26.199737548828125, "global_step": 372128, "epoch": 4483} {"train_loss": -26.6217041015625, "global_step": 372129, "epoch": 4483} {"train_loss": -26.4655704498291, "global_step": 372130, "epoch": 4483} {"train_loss": -26.655954360961914, "global_step": 372131, "epoch": 4483} {"train_loss": -26.575641632080078, "global_step": 372132, "epoch": 4483} {"train_loss": -26.36398696899414, "global_step": 372133, "epoch": 4483} {"train_loss": -26.413049697875977, "global_step": 372134, "epoch": 4483} {"train_loss": -26.52469253540039, "global_step": 372135, "epoch": 4483} {"train_loss": -26.404129028320312, "global_step": 372136, "epoch": 4483} {"train_loss": -26.517807006835938, "global_step": 372137, "epoch": 4483} {"train_loss": -25.883451461791992, "global_step": 372138, "epoch": 4483} {"train_loss": -26.786148071289062, "global_step": 372139, "epoch": 4483} {"train_loss": -26.57839012145996, "global_step": 372140, "epoch": 4483} {"train_loss": -26.262609481811523, "global_step": 372141, "epoch": 4483} {"train_loss": -26.19423484802246, "global_step": 372142, "epoch": 4483} {"train_loss": -26.462400436401367, "global_step": 372143, "epoch": 4483} {"train_loss": -26.230396270751953, "global_step": 372144, "epoch": 4483} {"train_loss": -26.56354331970215, "global_step": 372145, "epoch": 4483} {"train_loss": -26.230749130249023, "global_step": 372146, "epoch": 4483} {"train_loss": -25.664880752563477, "global_step": 372147, "epoch": 4483} {"train_loss": -25.977859497070312, "global_step": 372148, "epoch": 4483} {"train_loss": -25.033559799194336, "global_step": 372149, "epoch": 4483} {"train_loss": -25.276277542114258, "global_step": 372150, "epoch": 4483} {"train_loss": -26.307905197143555, "global_step": 372151, "epoch": 4483} {"train_loss": -26.126144409179688, "global_step": 372152, "epoch": 4483} {"train_loss": -25.80967140197754, "global_step": 372153, "epoch": 4483} {"train_loss": -25.90919303894043, "global_step": 372154, "epoch": 4483} {"train_loss": -26.152496337890625, "global_step": 372155, "epoch": 4483} {"train_loss": -26.0338191986084, "global_step": 372156, "epoch": 4483} {"train_loss": -26.30491065979004, "global_step": 372157, "epoch": 4483} {"train_loss": -26.13530921936035, "global_step": 372158, "epoch": 4483} {"train_loss": -26.244171142578125, "global_step": 372159, "epoch": 4483} {"train_loss": -26.164077758789062, "global_step": 372160, "epoch": 4483} {"train_loss": -25.763004302978516, "global_step": 372161, "epoch": 4483} {"train_loss": -26.27066993713379, "global_step": 372162, "epoch": 4483} {"train_loss": -26.237659454345703, "global_step": 372163, "epoch": 4483} {"train_loss": -26.196136474609375, "global_step": 372164, "epoch": 4483} {"train_loss": -26.17435646057129, "global_step": 372165, "epoch": 4483} {"train_loss": -25.85162353515625, "global_step": 372166, "epoch": 4483} {"train_loss": -25.83501625061035, "global_step": 372167, "epoch": 4483} {"train_loss": -26.456375122070312, "global_step": 372168, "epoch": 4483} {"train_loss": -26.031118392944336, "global_step": 372169, "epoch": 4483} {"train_loss": -26.367650985717773, "global_step": 372170, "epoch": 4483} {"train_loss": -26.220422468989728, "global_step": 372171, "epoch": 4483, "val_loss": 6588302.0} {"train_loss": -25.796323776245117, "global_step": 372172, "epoch": 4484} {"train_loss": -25.6129150390625, "global_step": 372173, "epoch": 4484} {"train_loss": -25.920673370361328, "global_step": 372174, "epoch": 4484} {"train_loss": -25.286781311035156, "global_step": 372175, "epoch": 4484} {"train_loss": -25.866992950439453, "global_step": 372176, "epoch": 4484} {"train_loss": -25.7539005279541, "global_step": 372177, "epoch": 4484} {"train_loss": -25.97309684753418, "global_step": 372178, "epoch": 4484} {"train_loss": -26.42730140686035, "global_step": 372179, "epoch": 4484} {"train_loss": -25.93108558654785, "global_step": 372180, "epoch": 4484} {"train_loss": -26.095184326171875, "global_step": 372181, "epoch": 4484} {"train_loss": -25.991552352905273, "global_step": 372182, "epoch": 4484} {"train_loss": -25.396610260009766, "global_step": 372183, "epoch": 4484} {"train_loss": -26.083744049072266, "global_step": 372184, "epoch": 4484} {"train_loss": -26.255386352539062, "global_step": 372185, "epoch": 4484} {"train_loss": -26.057432174682617, "global_step": 372186, "epoch": 4484} {"train_loss": -26.218616485595703, "global_step": 372187, "epoch": 4484} {"train_loss": -26.429595947265625, "global_step": 372188, "epoch": 4484} {"train_loss": -26.442441940307617, "global_step": 372189, "epoch": 4484} {"train_loss": -26.26544761657715, "global_step": 372190, "epoch": 4484} {"train_loss": -25.581247329711914, "global_step": 372191, "epoch": 4484} {"train_loss": -26.318740844726562, "global_step": 372192, "epoch": 4484} {"train_loss": -26.08954429626465, "global_step": 372193, "epoch": 4484} {"train_loss": -26.6825008392334, "global_step": 372194, "epoch": 4484} {"train_loss": -26.17508888244629, "global_step": 372195, "epoch": 4484} {"train_loss": -26.692352294921875, "global_step": 372196, "epoch": 4484} {"train_loss": -26.348657608032227, "global_step": 372197, "epoch": 4484} {"train_loss": -26.493122100830078, "global_step": 372198, "epoch": 4484} {"train_loss": -26.05085563659668, "global_step": 372199, "epoch": 4484} {"train_loss": -26.681264877319336, "global_step": 372200, "epoch": 4484} {"train_loss": -26.20326805114746, "global_step": 372201, "epoch": 4484} {"train_loss": -26.365325927734375, "global_step": 372202, "epoch": 4484} {"train_loss": -26.41460609436035, "global_step": 372203, "epoch": 4484} {"train_loss": -26.292465209960938, "global_step": 372204, "epoch": 4484} {"train_loss": -26.550037384033203, "global_step": 372205, "epoch": 4484} {"train_loss": -26.363012313842773, "global_step": 372206, "epoch": 4484} {"train_loss": -26.794525146484375, "global_step": 372207, "epoch": 4484} {"train_loss": -26.59309196472168, "global_step": 372208, "epoch": 4484} {"train_loss": -26.711627960205078, "global_step": 372209, "epoch": 4484} {"train_loss": -26.455541610717773, "global_step": 372210, "epoch": 4484} {"train_loss": -26.47481346130371, "global_step": 372211, "epoch": 4484} {"train_loss": -26.3928279876709, "global_step": 372212, "epoch": 4484} {"train_loss": -26.743825912475586, "global_step": 372213, "epoch": 4484} {"train_loss": -26.645099639892578, "global_step": 372214, "epoch": 4484} {"train_loss": -26.750782012939453, "global_step": 372215, "epoch": 4484} {"train_loss": -26.581134796142578, "global_step": 372216, "epoch": 4484} {"train_loss": -26.47767448425293, "global_step": 372217, "epoch": 4484} {"train_loss": -26.832901000976562, "global_step": 372218, "epoch": 4484} {"train_loss": -26.439294815063477, "global_step": 372219, "epoch": 4484} {"train_loss": -26.920639038085938, "global_step": 372220, "epoch": 4484} {"train_loss": -26.756818771362305, "global_step": 372221, "epoch": 4484} {"train_loss": -26.382160186767578, "global_step": 372222, "epoch": 4484} {"train_loss": -26.565031051635742, "global_step": 372223, "epoch": 4484} {"train_loss": -26.471405029296875, "global_step": 372224, "epoch": 4484} {"train_loss": -26.44764518737793, "global_step": 372225, "epoch": 4484} {"train_loss": -26.239826202392578, "global_step": 372226, "epoch": 4484} {"train_loss": -26.056201934814453, "global_step": 372227, "epoch": 4484} {"train_loss": -26.28670310974121, "global_step": 372228, "epoch": 4484} {"train_loss": -26.484731674194336, "global_step": 372229, "epoch": 4484} {"train_loss": -26.047128677368164, "global_step": 372230, "epoch": 4484} {"train_loss": -26.467056274414062, "global_step": 372231, "epoch": 4484} {"train_loss": -25.99029541015625, "global_step": 372232, "epoch": 4484} {"train_loss": -26.322860717773438, "global_step": 372233, "epoch": 4484} {"train_loss": -26.75774574279785, "global_step": 372234, "epoch": 4484} {"train_loss": -26.433395385742188, "global_step": 372235, "epoch": 4484} {"train_loss": -26.614139556884766, "global_step": 372236, "epoch": 4484} {"train_loss": -26.499948501586914, "global_step": 372237, "epoch": 4484} {"train_loss": -26.345874786376953, "global_step": 372238, "epoch": 4484} {"train_loss": -26.595142364501953, "global_step": 372239, "epoch": 4484} {"train_loss": -26.544641494750977, "global_step": 372240, "epoch": 4484} {"train_loss": -26.43755531311035, "global_step": 372241, "epoch": 4484} {"train_loss": -26.339303970336914, "global_step": 372242, "epoch": 4484} {"train_loss": -26.736364364624023, "global_step": 372243, "epoch": 4484} {"train_loss": -26.158069610595703, "global_step": 372244, "epoch": 4484} {"train_loss": -26.239410400390625, "global_step": 372245, "epoch": 4484} {"train_loss": -26.587247848510742, "global_step": 372246, "epoch": 4484} {"train_loss": -25.873722076416016, "global_step": 372247, "epoch": 4484} {"train_loss": -26.305042266845703, "global_step": 372248, "epoch": 4484} {"train_loss": -26.511219024658203, "global_step": 372249, "epoch": 4484} {"train_loss": -26.538848876953125, "global_step": 372250, "epoch": 4484} {"train_loss": -26.70684814453125, "global_step": 372251, "epoch": 4484} {"train_loss": -26.47903823852539, "global_step": 372252, "epoch": 4484} {"train_loss": -26.651355743408203, "global_step": 372253, "epoch": 4484} {"train_loss": -26.338069823851068, "global_step": 372254, "epoch": 4484, "val_loss": 6693407.5} {"train_loss": -25.865680694580078, "global_step": 372255, "epoch": 4485} {"train_loss": -25.864459991455078, "global_step": 372256, "epoch": 4485} {"train_loss": -25.77103042602539, "global_step": 372257, "epoch": 4485} {"train_loss": -25.899765014648438, "global_step": 372258, "epoch": 4485} {"train_loss": -25.75439453125, "global_step": 372259, "epoch": 4485} {"train_loss": -26.1230525970459, "global_step": 372260, "epoch": 4485} {"train_loss": -26.086156845092773, "global_step": 372261, "epoch": 4485} {"train_loss": -25.69140625, "global_step": 372262, "epoch": 4485} {"train_loss": -26.08871841430664, "global_step": 372263, "epoch": 4485} {"train_loss": -26.274658203125, "global_step": 372264, "epoch": 4485} {"train_loss": -25.678796768188477, "global_step": 372265, "epoch": 4485} {"train_loss": -26.4292049407959, "global_step": 372266, "epoch": 4485} {"train_loss": -26.02654457092285, "global_step": 372267, "epoch": 4485} {"train_loss": -25.932111740112305, "global_step": 372268, "epoch": 4485} {"train_loss": -26.285587310791016, "global_step": 372269, "epoch": 4485} {"train_loss": -26.215076446533203, "global_step": 372270, "epoch": 4485} {"train_loss": -25.846786499023438, "global_step": 372271, "epoch": 4485} {"train_loss": -26.206769943237305, "global_step": 372272, "epoch": 4485} {"train_loss": -26.236286163330078, "global_step": 372273, "epoch": 4485} {"train_loss": -26.26827049255371, "global_step": 372274, "epoch": 4485} {"train_loss": -25.99712562561035, "global_step": 372275, "epoch": 4485} {"train_loss": -26.313501358032227, "global_step": 372276, "epoch": 4485} {"train_loss": -26.234663009643555, "global_step": 372277, "epoch": 4485} {"train_loss": -25.977380752563477, "global_step": 372278, "epoch": 4485} {"train_loss": -26.2557373046875, "global_step": 372279, "epoch": 4485} {"train_loss": -26.378082275390625, "global_step": 372280, "epoch": 4485} {"train_loss": -26.383329391479492, "global_step": 372281, "epoch": 4485} {"train_loss": -26.52434730529785, "global_step": 372282, "epoch": 4485} {"train_loss": -26.15389060974121, "global_step": 372283, "epoch": 4485} {"train_loss": -26.621021270751953, "global_step": 372284, "epoch": 4485} {"train_loss": -26.413177490234375, "global_step": 372285, "epoch": 4485} {"train_loss": -26.179550170898438, "global_step": 372286, "epoch": 4485} {"train_loss": -25.949193954467773, "global_step": 372287, "epoch": 4485} {"train_loss": -26.078571319580078, "global_step": 372288, "epoch": 4485} {"train_loss": -26.194107055664062, "global_step": 372289, "epoch": 4485} {"train_loss": -26.48788833618164, "global_step": 372290, "epoch": 4485} {"train_loss": -26.296539306640625, "global_step": 372291, "epoch": 4485} {"train_loss": -26.736234664916992, "global_step": 372292, "epoch": 4485} {"train_loss": -26.511865615844727, "global_step": 372293, "epoch": 4485} {"train_loss": -26.090330123901367, "global_step": 372294, "epoch": 4485} {"train_loss": -26.357275009155273, "global_step": 372295, "epoch": 4485} {"train_loss": -26.154829025268555, "global_step": 372296, "epoch": 4485} {"train_loss": -26.589649200439453, "global_step": 372297, "epoch": 4485} {"train_loss": -26.28460693359375, "global_step": 372298, "epoch": 4485} {"train_loss": -26.458723068237305, "global_step": 372299, "epoch": 4485} {"train_loss": -26.7632999420166, "global_step": 372300, "epoch": 4485} {"train_loss": -26.600360870361328, "global_step": 372301, "epoch": 4485} {"train_loss": -26.80545997619629, "global_step": 372302, "epoch": 4485} {"train_loss": -26.64117431640625, "global_step": 372303, "epoch": 4485} {"train_loss": -26.407556533813477, "global_step": 372304, "epoch": 4485} {"train_loss": -26.7108154296875, "global_step": 372305, "epoch": 4485} {"train_loss": -26.4533748626709, "global_step": 372306, "epoch": 4485} {"train_loss": -26.035572052001953, "global_step": 372307, "epoch": 4485} {"train_loss": -26.666370391845703, "global_step": 372308, "epoch": 4485} {"train_loss": -26.532123565673828, "global_step": 372309, "epoch": 4485} {"train_loss": -26.5870418548584, "global_step": 372310, "epoch": 4485} {"train_loss": -26.611257553100586, "global_step": 372311, "epoch": 4485} {"train_loss": -26.3009033203125, "global_step": 372312, "epoch": 4485} {"train_loss": -26.33819007873535, "global_step": 372313, "epoch": 4485} {"train_loss": -26.308887481689453, "global_step": 372314, "epoch": 4485} {"train_loss": -26.549152374267578, "global_step": 372315, "epoch": 4485} {"train_loss": -26.01387596130371, "global_step": 372316, "epoch": 4485} {"train_loss": -25.674026489257812, "global_step": 372317, "epoch": 4485} {"train_loss": -25.70064353942871, "global_step": 372318, "epoch": 4485} {"train_loss": -26.59455680847168, "global_step": 372319, "epoch": 4485} {"train_loss": -26.54546546936035, "global_step": 372320, "epoch": 4485} {"train_loss": -26.593551635742188, "global_step": 372321, "epoch": 4485} {"train_loss": -26.649383544921875, "global_step": 372322, "epoch": 4485} {"train_loss": -26.411046981811523, "global_step": 372323, "epoch": 4485} {"train_loss": -26.173187255859375, "global_step": 372324, "epoch": 4485} {"train_loss": -26.422321319580078, "global_step": 372325, "epoch": 4485} {"train_loss": -26.454069137573242, "global_step": 372326, "epoch": 4485} {"train_loss": -26.635969161987305, "global_step": 372327, "epoch": 4485} {"train_loss": -26.627939224243164, "global_step": 372328, "epoch": 4485} {"train_loss": -26.51641845703125, "global_step": 372329, "epoch": 4485} {"train_loss": -26.449010848999023, "global_step": 372330, "epoch": 4485} {"train_loss": -26.18242835998535, "global_step": 372331, "epoch": 4485} {"train_loss": -25.731897354125977, "global_step": 372332, "epoch": 4485} {"train_loss": -25.039480209350586, "global_step": 372333, "epoch": 4485} {"train_loss": -24.83542823791504, "global_step": 372334, "epoch": 4485} {"train_loss": -26.095550537109375, "global_step": 372335, "epoch": 4485} {"train_loss": -26.272043228149414, "global_step": 372336, "epoch": 4485} {"train_loss": -26.239043155348444, "global_step": 372337, "epoch": 4485, "val_loss": 6759770.0} {"train_loss": -25.131694793701172, "global_step": 372338, "epoch": 4486} {"train_loss": -25.309865951538086, "global_step": 372339, "epoch": 4486} {"train_loss": -25.1478271484375, "global_step": 372340, "epoch": 4486} {"train_loss": -24.382444381713867, "global_step": 372341, "epoch": 4486} {"train_loss": -25.065784454345703, "global_step": 372342, "epoch": 4486} {"train_loss": -25.520435333251953, "global_step": 372343, "epoch": 4486} {"train_loss": -25.387619018554688, "global_step": 372344, "epoch": 4486} {"train_loss": -25.63943862915039, "global_step": 372345, "epoch": 4486} {"train_loss": -25.336658477783203, "global_step": 372346, "epoch": 4486} {"train_loss": -25.228551864624023, "global_step": 372347, "epoch": 4486} {"train_loss": -25.49444007873535, "global_step": 372348, "epoch": 4486} {"train_loss": -25.687707901000977, "global_step": 372349, "epoch": 4486} {"train_loss": -25.843677520751953, "global_step": 372350, "epoch": 4486} {"train_loss": -25.470428466796875, "global_step": 372351, "epoch": 4486} {"train_loss": -25.737455368041992, "global_step": 372352, "epoch": 4486} {"train_loss": -25.57480812072754, "global_step": 372353, "epoch": 4486} {"train_loss": -25.86957359313965, "global_step": 372354, "epoch": 4486} {"train_loss": -25.63608169555664, "global_step": 372355, "epoch": 4486} {"train_loss": -25.381797790527344, "global_step": 372356, "epoch": 4486} {"train_loss": -25.367223739624023, "global_step": 372357, "epoch": 4486} {"train_loss": -25.917394638061523, "global_step": 372358, "epoch": 4486} {"train_loss": -26.064741134643555, "global_step": 372359, "epoch": 4486} {"train_loss": -26.013525009155273, "global_step": 372360, "epoch": 4486} {"train_loss": -26.07636833190918, "global_step": 372361, "epoch": 4486} {"train_loss": -25.800214767456055, "global_step": 372362, "epoch": 4486} {"train_loss": -26.303770065307617, "global_step": 372363, "epoch": 4486} {"train_loss": -25.728605270385742, "global_step": 372364, "epoch": 4486} {"train_loss": -25.796499252319336, "global_step": 372365, "epoch": 4486} {"train_loss": -26.168167114257812, "global_step": 372366, "epoch": 4486} {"train_loss": -26.1718807220459, "global_step": 372367, "epoch": 4486} {"train_loss": -25.949970245361328, "global_step": 372368, "epoch": 4486} {"train_loss": -26.371219635009766, "global_step": 372369, "epoch": 4486} {"train_loss": -26.023618698120117, "global_step": 372370, "epoch": 4486} {"train_loss": -26.297338485717773, "global_step": 372371, "epoch": 4486} {"train_loss": -26.424381256103516, "global_step": 372372, "epoch": 4486} {"train_loss": -26.217742919921875, "global_step": 372373, "epoch": 4486} {"train_loss": -26.1047420501709, "global_step": 372374, "epoch": 4486} {"train_loss": -26.133197784423828, "global_step": 372375, "epoch": 4486} {"train_loss": -26.421417236328125, "global_step": 372376, "epoch": 4486} {"train_loss": -26.5902042388916, "global_step": 372377, "epoch": 4486} {"train_loss": -26.197071075439453, "global_step": 372378, "epoch": 4486} {"train_loss": -26.49409294128418, "global_step": 372379, "epoch": 4486} {"train_loss": -26.48455238342285, "global_step": 372380, "epoch": 4486} {"train_loss": -26.728979110717773, "global_step": 372381, "epoch": 4486} {"train_loss": -26.25165367126465, "global_step": 372382, "epoch": 4486} {"train_loss": -26.538976669311523, "global_step": 372383, "epoch": 4486} {"train_loss": -26.559906005859375, "global_step": 372384, "epoch": 4486} {"train_loss": -26.356977462768555, "global_step": 372385, "epoch": 4486} {"train_loss": -26.437088012695312, "global_step": 372386, "epoch": 4486} {"train_loss": -26.22483253479004, "global_step": 372387, "epoch": 4486} {"train_loss": -26.49519920349121, "global_step": 372388, "epoch": 4486} {"train_loss": -26.363082885742188, "global_step": 372389, "epoch": 4486} {"train_loss": -26.1414794921875, "global_step": 372390, "epoch": 4486} {"train_loss": -26.1143741607666, "global_step": 372391, "epoch": 4486} {"train_loss": -25.9366512298584, "global_step": 372392, "epoch": 4486} {"train_loss": -25.487045288085938, "global_step": 372393, "epoch": 4486} {"train_loss": -26.246295928955078, "global_step": 372394, "epoch": 4486} {"train_loss": -26.133100509643555, "global_step": 372395, "epoch": 4486} {"train_loss": -26.214065551757812, "global_step": 372396, "epoch": 4486} {"train_loss": -26.03370475769043, "global_step": 372397, "epoch": 4486} {"train_loss": -26.630048751831055, "global_step": 372398, "epoch": 4486} {"train_loss": -26.19935417175293, "global_step": 372399, "epoch": 4486} {"train_loss": -26.39395523071289, "global_step": 372400, "epoch": 4486} {"train_loss": -26.472021102905273, "global_step": 372401, "epoch": 4486} {"train_loss": -26.207956314086914, "global_step": 372402, "epoch": 4486} {"train_loss": -25.806516647338867, "global_step": 372403, "epoch": 4486} {"train_loss": -26.53314781188965, "global_step": 372404, "epoch": 4486} {"train_loss": -26.233728408813477, "global_step": 372405, "epoch": 4486} {"train_loss": -25.93964958190918, "global_step": 372406, "epoch": 4486} {"train_loss": -26.332502365112305, "global_step": 372407, "epoch": 4486} {"train_loss": -26.253515243530273, "global_step": 372408, "epoch": 4486} {"train_loss": -26.81338882446289, "global_step": 372409, "epoch": 4486} {"train_loss": -26.256000518798828, "global_step": 372410, "epoch": 4486} {"train_loss": -26.35481071472168, "global_step": 372411, "epoch": 4486} {"train_loss": -26.388107299804688, "global_step": 372412, "epoch": 4486} {"train_loss": -26.461212158203125, "global_step": 372413, "epoch": 4486} {"train_loss": -26.458730697631836, "global_step": 372414, "epoch": 4486} {"train_loss": -25.909015655517578, "global_step": 372415, "epoch": 4486} {"train_loss": -26.12939453125, "global_step": 372416, "epoch": 4486} {"train_loss": -26.25067138671875, "global_step": 372417, "epoch": 4486} {"train_loss": -26.377017974853516, "global_step": 372418, "epoch": 4486} {"train_loss": -26.4335994720459, "global_step": 372419, "epoch": 4486} {"train_loss": -26.03932233603604, "global_step": 372420, "epoch": 4486, "val_loss": 6641240.0} {"train_loss": -25.840055465698242, "global_step": 372421, "epoch": 4487} {"train_loss": -25.832538604736328, "global_step": 372422, "epoch": 4487} {"train_loss": -25.4212703704834, "global_step": 372423, "epoch": 4487} {"train_loss": -25.579137802124023, "global_step": 372424, "epoch": 4487} {"train_loss": -26.206201553344727, "global_step": 372425, "epoch": 4487} {"train_loss": -25.74053382873535, "global_step": 372426, "epoch": 4487} {"train_loss": -25.910675048828125, "global_step": 372427, "epoch": 4487} {"train_loss": -26.058414459228516, "global_step": 372428, "epoch": 4487} {"train_loss": -26.36139488220215, "global_step": 372429, "epoch": 4487} {"train_loss": -25.725448608398438, "global_step": 372430, "epoch": 4487} {"train_loss": -25.656707763671875, "global_step": 372431, "epoch": 4487} {"train_loss": -26.037622451782227, "global_step": 372432, "epoch": 4487} {"train_loss": -26.180395126342773, "global_step": 372433, "epoch": 4487} {"train_loss": -25.632726669311523, "global_step": 372434, "epoch": 4487} {"train_loss": -26.33587074279785, "global_step": 372435, "epoch": 4487} {"train_loss": -26.16558265686035, "global_step": 372436, "epoch": 4487} {"train_loss": -26.160873413085938, "global_step": 372437, "epoch": 4487} {"train_loss": -25.914810180664062, "global_step": 372438, "epoch": 4487} {"train_loss": -26.050024032592773, "global_step": 372439, "epoch": 4487} {"train_loss": -26.263608932495117, "global_step": 372440, "epoch": 4487} {"train_loss": -26.175037384033203, "global_step": 372441, "epoch": 4487} {"train_loss": -26.54214859008789, "global_step": 372442, "epoch": 4487} {"train_loss": -25.848712921142578, "global_step": 372443, "epoch": 4487} {"train_loss": -26.28226661682129, "global_step": 372444, "epoch": 4487} {"train_loss": -26.217090606689453, "global_step": 372445, "epoch": 4487} {"train_loss": -26.384052276611328, "global_step": 372446, "epoch": 4487} {"train_loss": -26.531036376953125, "global_step": 372447, "epoch": 4487} {"train_loss": -26.441370010375977, "global_step": 372448, "epoch": 4487} {"train_loss": -26.448749542236328, "global_step": 372449, "epoch": 4487} {"train_loss": -26.318510055541992, "global_step": 372450, "epoch": 4487} {"train_loss": -26.128299713134766, "global_step": 372451, "epoch": 4487} {"train_loss": -26.78074073791504, "global_step": 372452, "epoch": 4487} {"train_loss": -26.54443359375, "global_step": 372453, "epoch": 4487} {"train_loss": -26.46234703063965, "global_step": 372454, "epoch": 4487} {"train_loss": -26.391876220703125, "global_step": 372455, "epoch": 4487} {"train_loss": -26.611963272094727, "global_step": 372456, "epoch": 4487} {"train_loss": -26.733373641967773, "global_step": 372457, "epoch": 4487} {"train_loss": -26.066686630249023, "global_step": 372458, "epoch": 4487} {"train_loss": -26.63802146911621, "global_step": 372459, "epoch": 4487} {"train_loss": -26.365121841430664, "global_step": 372460, "epoch": 4487} {"train_loss": -26.087635040283203, "global_step": 372461, "epoch": 4487} {"train_loss": -26.377994537353516, "global_step": 372462, "epoch": 4487} {"train_loss": -26.777912139892578, "global_step": 372463, "epoch": 4487} {"train_loss": -26.498823165893555, "global_step": 372464, "epoch": 4487} {"train_loss": -26.29427146911621, "global_step": 372465, "epoch": 4487} {"train_loss": -26.0532169342041, "global_step": 372466, "epoch": 4487} {"train_loss": -25.909320831298828, "global_step": 372467, "epoch": 4487} {"train_loss": -26.365461349487305, "global_step": 372468, "epoch": 4487} {"train_loss": -26.01346206665039, "global_step": 372469, "epoch": 4487} {"train_loss": -26.167530059814453, "global_step": 372470, "epoch": 4487} {"train_loss": -26.614892959594727, "global_step": 372471, "epoch": 4487} {"train_loss": -26.3761043548584, "global_step": 372472, "epoch": 4487} {"train_loss": -26.17412757873535, "global_step": 372473, "epoch": 4487} {"train_loss": -26.14168357849121, "global_step": 372474, "epoch": 4487} {"train_loss": -26.423547744750977, "global_step": 372475, "epoch": 4487} {"train_loss": -26.49118423461914, "global_step": 372476, "epoch": 4487} {"train_loss": -26.20733070373535, "global_step": 372477, "epoch": 4487} {"train_loss": -26.439319610595703, "global_step": 372478, "epoch": 4487} {"train_loss": -26.283008575439453, "global_step": 372479, "epoch": 4487} {"train_loss": -26.860595703125, "global_step": 372480, "epoch": 4487} {"train_loss": -26.439496994018555, "global_step": 372481, "epoch": 4487} {"train_loss": -26.400365829467773, "global_step": 372482, "epoch": 4487} {"train_loss": -26.702016830444336, "global_step": 372483, "epoch": 4487} {"train_loss": -26.176837921142578, "global_step": 372484, "epoch": 4487} {"train_loss": -26.50750732421875, "global_step": 372485, "epoch": 4487} {"train_loss": -26.416797637939453, "global_step": 372486, "epoch": 4487} {"train_loss": -26.51848793029785, "global_step": 372487, "epoch": 4487} {"train_loss": -26.161413192749023, "global_step": 372488, "epoch": 4487} {"train_loss": -26.001062393188477, "global_step": 372489, "epoch": 4487} {"train_loss": -26.038867950439453, "global_step": 372490, "epoch": 4487} {"train_loss": -26.276662826538086, "global_step": 372491, "epoch": 4487} {"train_loss": -26.49237632751465, "global_step": 372492, "epoch": 4487} {"train_loss": -26.679243087768555, "global_step": 372493, "epoch": 4487} {"train_loss": -26.452335357666016, "global_step": 372494, "epoch": 4487} {"train_loss": -26.408254623413086, "global_step": 372495, "epoch": 4487} {"train_loss": -26.509723663330078, "global_step": 372496, "epoch": 4487} {"train_loss": -26.697736740112305, "global_step": 372497, "epoch": 4487} {"train_loss": -26.375165939331055, "global_step": 372498, "epoch": 4487} {"train_loss": -26.69280433654785, "global_step": 372499, "epoch": 4487} {"train_loss": -26.353620529174805, "global_step": 372500, "epoch": 4487} {"train_loss": -26.37238121032715, "global_step": 372501, "epoch": 4487} {"train_loss": -26.705244064331055, "global_step": 372502, "epoch": 4487} {"train_loss": -26.301238898771356, "global_step": 372503, "epoch": 4487, "val_loss": 6654132.5} {"train_loss": -26.27972412109375, "global_step": 372504, "epoch": 4488} {"train_loss": -25.7302303314209, "global_step": 372505, "epoch": 4488} {"train_loss": -25.392911911010742, "global_step": 372506, "epoch": 4488} {"train_loss": -25.086084365844727, "global_step": 372507, "epoch": 4488} {"train_loss": -26.16619873046875, "global_step": 372508, "epoch": 4488} {"train_loss": -26.1363582611084, "global_step": 372509, "epoch": 4488} {"train_loss": -25.669647216796875, "global_step": 372510, "epoch": 4488} {"train_loss": -25.768606185913086, "global_step": 372511, "epoch": 4488} {"train_loss": -26.040868759155273, "global_step": 372512, "epoch": 4488} {"train_loss": -26.320600509643555, "global_step": 372513, "epoch": 4488} {"train_loss": -26.245182037353516, "global_step": 372514, "epoch": 4488} {"train_loss": -26.2702693939209, "global_step": 372515, "epoch": 4488} {"train_loss": -26.183151245117188, "global_step": 372516, "epoch": 4488} {"train_loss": -26.30828285217285, "global_step": 372517, "epoch": 4488} {"train_loss": -26.622297286987305, "global_step": 372518, "epoch": 4488} {"train_loss": -26.1112060546875, "global_step": 372519, "epoch": 4488} {"train_loss": -26.199304580688477, "global_step": 372520, "epoch": 4488} {"train_loss": -25.96674919128418, "global_step": 372521, "epoch": 4488} {"train_loss": -26.14837074279785, "global_step": 372522, "epoch": 4488} {"train_loss": -25.934494018554688, "global_step": 372523, "epoch": 4488} {"train_loss": -26.141645431518555, "global_step": 372524, "epoch": 4488} {"train_loss": -26.23779296875, "global_step": 372525, "epoch": 4488} {"train_loss": -26.453123092651367, "global_step": 372526, "epoch": 4488} {"train_loss": -26.284570693969727, "global_step": 372527, "epoch": 4488} {"train_loss": -26.266387939453125, "global_step": 372528, "epoch": 4488} {"train_loss": -26.403955459594727, "global_step": 372529, "epoch": 4488} {"train_loss": -26.356122970581055, "global_step": 372530, "epoch": 4488} {"train_loss": -26.234277725219727, "global_step": 372531, "epoch": 4488} {"train_loss": -26.682458877563477, "global_step": 372532, "epoch": 4488} {"train_loss": -26.313323974609375, "global_step": 372533, "epoch": 4488} {"train_loss": -26.706506729125977, "global_step": 372534, "epoch": 4488} {"train_loss": -26.073606491088867, "global_step": 372535, "epoch": 4488} {"train_loss": -26.72393226623535, "global_step": 372536, "epoch": 4488} {"train_loss": -26.384138107299805, "global_step": 372537, "epoch": 4488} {"train_loss": -26.212621688842773, "global_step": 372538, "epoch": 4488} {"train_loss": -26.5841007232666, "global_step": 372539, "epoch": 4488} {"train_loss": -26.68146324157715, "global_step": 372540, "epoch": 4488} {"train_loss": -26.45241355895996, "global_step": 372541, "epoch": 4488} {"train_loss": -26.463001251220703, "global_step": 372542, "epoch": 4488} {"train_loss": -26.350555419921875, "global_step": 372543, "epoch": 4488} {"train_loss": -26.594022750854492, "global_step": 372544, "epoch": 4488} {"train_loss": -26.388776779174805, "global_step": 372545, "epoch": 4488} {"train_loss": -26.805112838745117, "global_step": 372546, "epoch": 4488} {"train_loss": -26.432708740234375, "global_step": 372547, "epoch": 4488} {"train_loss": -26.42001724243164, "global_step": 372548, "epoch": 4488} {"train_loss": -26.133718490600586, "global_step": 372549, "epoch": 4488} {"train_loss": -26.22283935546875, "global_step": 372550, "epoch": 4488} {"train_loss": -26.42610740661621, "global_step": 372551, "epoch": 4488} {"train_loss": -26.69537353515625, "global_step": 372552, "epoch": 4488} {"train_loss": -26.26093101501465, "global_step": 372553, "epoch": 4488} {"train_loss": -26.9565372467041, "global_step": 372554, "epoch": 4488} {"train_loss": -26.513507843017578, "global_step": 372555, "epoch": 4488} {"train_loss": -26.56678581237793, "global_step": 372556, "epoch": 4488} {"train_loss": -26.621152877807617, "global_step": 372557, "epoch": 4488} {"train_loss": -26.45672035217285, "global_step": 372558, "epoch": 4488} {"train_loss": -26.544662475585938, "global_step": 372559, "epoch": 4488} {"train_loss": -26.222620010375977, "global_step": 372560, "epoch": 4488} {"train_loss": -26.323583602905273, "global_step": 372561, "epoch": 4488} {"train_loss": -26.30413246154785, "global_step": 372562, "epoch": 4488} {"train_loss": -26.588769912719727, "global_step": 372563, "epoch": 4488} {"train_loss": -26.6146297454834, "global_step": 372564, "epoch": 4488} {"train_loss": -26.83650016784668, "global_step": 372565, "epoch": 4488} {"train_loss": -26.163251876831055, "global_step": 372566, "epoch": 4488} {"train_loss": -26.56787109375, "global_step": 372567, "epoch": 4488} {"train_loss": -26.4676456451416, "global_step": 372568, "epoch": 4488} {"train_loss": -26.685653686523438, "global_step": 372569, "epoch": 4488} {"train_loss": -26.476776123046875, "global_step": 372570, "epoch": 4488} {"train_loss": -26.129352569580078, "global_step": 372571, "epoch": 4488} {"train_loss": -26.137800216674805, "global_step": 372572, "epoch": 4488} {"train_loss": -26.259069442749023, "global_step": 372573, "epoch": 4488} {"train_loss": -26.41362953186035, "global_step": 372574, "epoch": 4488} {"train_loss": -26.663862228393555, "global_step": 372575, "epoch": 4488} {"train_loss": -26.467920303344727, "global_step": 372576, "epoch": 4488} {"train_loss": -26.495832443237305, "global_step": 372577, "epoch": 4488} {"train_loss": -26.569995880126953, "global_step": 372578, "epoch": 4488} {"train_loss": -26.255157470703125, "global_step": 372579, "epoch": 4488} {"train_loss": -26.802885055541992, "global_step": 372580, "epoch": 4488} {"train_loss": -26.59393310546875, "global_step": 372581, "epoch": 4488} {"train_loss": -26.568775177001953, "global_step": 372582, "epoch": 4488} {"train_loss": -26.466461181640625, "global_step": 372583, "epoch": 4488} {"train_loss": -26.904327392578125, "global_step": 372584, "epoch": 4488} {"train_loss": -26.168806076049805, "global_step": 372585, "epoch": 4488} {"train_loss": -26.3494024851236, "global_step": 372586, "epoch": 4488, "val_loss": 6628175.0} {"train_loss": -25.46021842956543, "global_step": 372587, "epoch": 4489} {"train_loss": -25.476024627685547, "global_step": 372588, "epoch": 4489} {"train_loss": -26.207197189331055, "global_step": 372589, "epoch": 4489} {"train_loss": -25.512990951538086, "global_step": 372590, "epoch": 4489} {"train_loss": -26.121850967407227, "global_step": 372591, "epoch": 4489} {"train_loss": -26.1016845703125, "global_step": 372592, "epoch": 4489} {"train_loss": -25.55088233947754, "global_step": 372593, "epoch": 4489} {"train_loss": -25.61958122253418, "global_step": 372594, "epoch": 4489} {"train_loss": -25.519559860229492, "global_step": 372595, "epoch": 4489} {"train_loss": -26.2507266998291, "global_step": 372596, "epoch": 4489} {"train_loss": -25.604848861694336, "global_step": 372597, "epoch": 4489} {"train_loss": -25.95319175720215, "global_step": 372598, "epoch": 4489} {"train_loss": -25.918426513671875, "global_step": 372599, "epoch": 4489} {"train_loss": -26.162633895874023, "global_step": 372600, "epoch": 4489} {"train_loss": -25.819433212280273, "global_step": 372601, "epoch": 4489} {"train_loss": -25.9466495513916, "global_step": 372602, "epoch": 4489} {"train_loss": -25.923917770385742, "global_step": 372603, "epoch": 4489} {"train_loss": -26.153533935546875, "global_step": 372604, "epoch": 4489} {"train_loss": -25.81634521484375, "global_step": 372605, "epoch": 4489} {"train_loss": -26.24216079711914, "global_step": 372606, "epoch": 4489} {"train_loss": -25.804105758666992, "global_step": 372607, "epoch": 4489} {"train_loss": -26.43045997619629, "global_step": 372608, "epoch": 4489} {"train_loss": -25.898456573486328, "global_step": 372609, "epoch": 4489} {"train_loss": -26.186187744140625, "global_step": 372610, "epoch": 4489} {"train_loss": -26.283924102783203, "global_step": 372611, "epoch": 4489} {"train_loss": -26.27699089050293, "global_step": 372612, "epoch": 4489} {"train_loss": -26.3050537109375, "global_step": 372613, "epoch": 4489} {"train_loss": -26.495771408081055, "global_step": 372614, "epoch": 4489} {"train_loss": -26.063623428344727, "global_step": 372615, "epoch": 4489} {"train_loss": -26.01131248474121, "global_step": 372616, "epoch": 4489} {"train_loss": -26.45667839050293, "global_step": 372617, "epoch": 4489} {"train_loss": -26.261945724487305, "global_step": 372618, "epoch": 4489} {"train_loss": -26.49610710144043, "global_step": 372619, "epoch": 4489} {"train_loss": -26.34820556640625, "global_step": 372620, "epoch": 4489} {"train_loss": -26.279926300048828, "global_step": 372621, "epoch": 4489} {"train_loss": -26.44415855407715, "global_step": 372622, "epoch": 4489} {"train_loss": -26.120885848999023, "global_step": 372623, "epoch": 4489} {"train_loss": -26.650806427001953, "global_step": 372624, "epoch": 4489} {"train_loss": -26.156814575195312, "global_step": 372625, "epoch": 4489} {"train_loss": -26.214950561523438, "global_step": 372626, "epoch": 4489} {"train_loss": -26.545141220092773, "global_step": 372627, "epoch": 4489} {"train_loss": -26.709218978881836, "global_step": 372628, "epoch": 4489} {"train_loss": -26.383853912353516, "global_step": 372629, "epoch": 4489} {"train_loss": -26.599552154541016, "global_step": 372630, "epoch": 4489} {"train_loss": -26.538232803344727, "global_step": 372631, "epoch": 4489} {"train_loss": -26.43170738220215, "global_step": 372632, "epoch": 4489} {"train_loss": -26.52948570251465, "global_step": 372633, "epoch": 4489} {"train_loss": -26.7370662689209, "global_step": 372634, "epoch": 4489} {"train_loss": -26.60260581970215, "global_step": 372635, "epoch": 4489} {"train_loss": -26.8179931640625, "global_step": 372636, "epoch": 4489} {"train_loss": -26.484100341796875, "global_step": 372637, "epoch": 4489} {"train_loss": -26.577234268188477, "global_step": 372638, "epoch": 4489} {"train_loss": -26.547529220581055, "global_step": 372639, "epoch": 4489} {"train_loss": -26.677387237548828, "global_step": 372640, "epoch": 4489} {"train_loss": -26.476404190063477, "global_step": 372641, "epoch": 4489} {"train_loss": -26.543933868408203, "global_step": 372642, "epoch": 4489} {"train_loss": -26.728803634643555, "global_step": 372643, "epoch": 4489} {"train_loss": -26.71487808227539, "global_step": 372644, "epoch": 4489} {"train_loss": -26.303836822509766, "global_step": 372645, "epoch": 4489} {"train_loss": -26.068265914916992, "global_step": 372646, "epoch": 4489} {"train_loss": -26.27678871154785, "global_step": 372647, "epoch": 4489} {"train_loss": -26.358484268188477, "global_step": 372648, "epoch": 4489} {"train_loss": -26.630353927612305, "global_step": 372649, "epoch": 4489} {"train_loss": -26.9091854095459, "global_step": 372650, "epoch": 4489} {"train_loss": -26.553333282470703, "global_step": 372651, "epoch": 4489} {"train_loss": -26.07464599609375, "global_step": 372652, "epoch": 4489} {"train_loss": -25.827224731445312, "global_step": 372653, "epoch": 4489} {"train_loss": -25.694290161132812, "global_step": 372654, "epoch": 4489} {"train_loss": -26.030059814453125, "global_step": 372655, "epoch": 4489} {"train_loss": -25.876333236694336, "global_step": 372656, "epoch": 4489} {"train_loss": -26.5504150390625, "global_step": 372657, "epoch": 4489} {"train_loss": -26.414793014526367, "global_step": 372658, "epoch": 4489} {"train_loss": -26.353422164916992, "global_step": 372659, "epoch": 4489} {"train_loss": -26.31866455078125, "global_step": 372660, "epoch": 4489} {"train_loss": -26.482757568359375, "global_step": 372661, "epoch": 4489} {"train_loss": -26.533063888549805, "global_step": 372662, "epoch": 4489} {"train_loss": -26.43096923828125, "global_step": 372663, "epoch": 4489} {"train_loss": -26.355762481689453, "global_step": 372664, "epoch": 4489} {"train_loss": -26.62080955505371, "global_step": 372665, "epoch": 4489} {"train_loss": -26.452253341674805, "global_step": 372666, "epoch": 4489} {"train_loss": -26.5983829498291, "global_step": 372667, "epoch": 4489} {"train_loss": -26.3978328704834, "global_step": 372668, "epoch": 4489} {"train_loss": -26.25699114512248, "global_step": 372669, "epoch": 4489, "val_loss": 6541295.0} {"train_loss": -25.332931518554688, "global_step": 372670, "epoch": 4490} {"train_loss": -25.7254695892334, "global_step": 372671, "epoch": 4490} {"train_loss": -25.766000747680664, "global_step": 372672, "epoch": 4490} {"train_loss": -25.501171112060547, "global_step": 372673, "epoch": 4490} {"train_loss": -24.890108108520508, "global_step": 372674, "epoch": 4490} {"train_loss": -25.39068603515625, "global_step": 372675, "epoch": 4490} {"train_loss": -25.478740692138672, "global_step": 372676, "epoch": 4490} {"train_loss": -25.42127227783203, "global_step": 372677, "epoch": 4490} {"train_loss": -25.43646240234375, "global_step": 372678, "epoch": 4490} {"train_loss": -25.90525245666504, "global_step": 372679, "epoch": 4490} {"train_loss": -25.73752784729004, "global_step": 372680, "epoch": 4490} {"train_loss": -25.563344955444336, "global_step": 372681, "epoch": 4490} {"train_loss": -26.10340690612793, "global_step": 372682, "epoch": 4490} {"train_loss": -26.074926376342773, "global_step": 372683, "epoch": 4490} {"train_loss": -26.11395835876465, "global_step": 372684, "epoch": 4490} {"train_loss": -25.914255142211914, "global_step": 372685, "epoch": 4490} {"train_loss": -26.092193603515625, "global_step": 372686, "epoch": 4490} {"train_loss": -25.66938591003418, "global_step": 372687, "epoch": 4490} {"train_loss": -25.888355255126953, "global_step": 372688, "epoch": 4490} {"train_loss": -26.170385360717773, "global_step": 372689, "epoch": 4490} {"train_loss": -26.152210235595703, "global_step": 372690, "epoch": 4490} {"train_loss": -26.383214950561523, "global_step": 372691, "epoch": 4490} {"train_loss": -26.33721923828125, "global_step": 372692, "epoch": 4490} {"train_loss": -26.20328140258789, "global_step": 372693, "epoch": 4490} {"train_loss": -26.146066665649414, "global_step": 372694, "epoch": 4490} {"train_loss": -26.550962448120117, "global_step": 372695, "epoch": 4490} {"train_loss": -26.086820602416992, "global_step": 372696, "epoch": 4490} {"train_loss": -25.935583114624023, "global_step": 372697, "epoch": 4490} {"train_loss": -26.20684242248535, "global_step": 372698, "epoch": 4490} {"train_loss": -26.593353271484375, "global_step": 372699, "epoch": 4490} {"train_loss": -26.130573272705078, "global_step": 372700, "epoch": 4490} {"train_loss": -26.19059181213379, "global_step": 372701, "epoch": 4490} {"train_loss": -26.07219886779785, "global_step": 372702, "epoch": 4490} {"train_loss": -26.05885887145996, "global_step": 372703, "epoch": 4490} {"train_loss": -26.30323600769043, "global_step": 372704, "epoch": 4490} {"train_loss": -26.300077438354492, "global_step": 372705, "epoch": 4490} {"train_loss": -26.496662139892578, "global_step": 372706, "epoch": 4490} {"train_loss": -26.558435440063477, "global_step": 372707, "epoch": 4490} {"train_loss": -26.261463165283203, "global_step": 372708, "epoch": 4490} {"train_loss": -26.45684242248535, "global_step": 372709, "epoch": 4490} {"train_loss": -26.5928955078125, "global_step": 372710, "epoch": 4490} {"train_loss": -26.551300048828125, "global_step": 372711, "epoch": 4490} {"train_loss": -26.62152099609375, "global_step": 372712, "epoch": 4490} {"train_loss": -26.465585708618164, "global_step": 372713, "epoch": 4490} {"train_loss": -26.55682945251465, "global_step": 372714, "epoch": 4490} {"train_loss": -26.341962814331055, "global_step": 372715, "epoch": 4490} {"train_loss": -26.180438995361328, "global_step": 372716, "epoch": 4490} {"train_loss": -25.985509872436523, "global_step": 372717, "epoch": 4490} {"train_loss": -26.65071678161621, "global_step": 372718, "epoch": 4490} {"train_loss": -26.598440170288086, "global_step": 372719, "epoch": 4490} {"train_loss": -26.416540145874023, "global_step": 372720, "epoch": 4490} {"train_loss": -26.204910278320312, "global_step": 372721, "epoch": 4490} {"train_loss": -26.59626579284668, "global_step": 372722, "epoch": 4490} {"train_loss": -26.331253051757812, "global_step": 372723, "epoch": 4490} {"train_loss": -26.494007110595703, "global_step": 372724, "epoch": 4490} {"train_loss": -26.89480972290039, "global_step": 372725, "epoch": 4490} {"train_loss": -26.108413696289062, "global_step": 372726, "epoch": 4490} {"train_loss": -26.616748809814453, "global_step": 372727, "epoch": 4490} {"train_loss": -26.533262252807617, "global_step": 372728, "epoch": 4490} {"train_loss": -26.456470489501953, "global_step": 372729, "epoch": 4490} {"train_loss": -26.385028839111328, "global_step": 372730, "epoch": 4490} {"train_loss": -26.42972755432129, "global_step": 372731, "epoch": 4490} {"train_loss": -26.7392635345459, "global_step": 372732, "epoch": 4490} {"train_loss": -26.512250900268555, "global_step": 372733, "epoch": 4490} {"train_loss": -26.82822608947754, "global_step": 372734, "epoch": 4490} {"train_loss": -26.780786514282227, "global_step": 372735, "epoch": 4490} {"train_loss": -26.047698974609375, "global_step": 372736, "epoch": 4490} {"train_loss": -26.192529678344727, "global_step": 372737, "epoch": 4490} {"train_loss": -25.914825439453125, "global_step": 372738, "epoch": 4490} {"train_loss": -26.084741592407227, "global_step": 372739, "epoch": 4490} {"train_loss": -26.401611328125, "global_step": 372740, "epoch": 4490} {"train_loss": -26.429296493530273, "global_step": 372741, "epoch": 4490} {"train_loss": -26.36232566833496, "global_step": 372742, "epoch": 4490} {"train_loss": -26.479970932006836, "global_step": 372743, "epoch": 4490} {"train_loss": -26.614002227783203, "global_step": 372744, "epoch": 4490} {"train_loss": -26.15411376953125, "global_step": 372745, "epoch": 4490} {"train_loss": -26.7403621673584, "global_step": 372746, "epoch": 4490} {"train_loss": -26.372055053710938, "global_step": 372747, "epoch": 4490} {"train_loss": -26.475046157836914, "global_step": 372748, "epoch": 4490} {"train_loss": -26.593158721923828, "global_step": 372749, "epoch": 4490} {"train_loss": -26.39320945739746, "global_step": 372750, "epoch": 4490} {"train_loss": -26.984619140625, "global_step": 372751, "epoch": 4490} {"train_loss": -26.245135066020918, "global_step": 372752, "epoch": 4490, "val_loss": 6652531.0} {"train_loss": -25.342496871948242, "global_step": 372753, "epoch": 4491} {"train_loss": -25.981725692749023, "global_step": 372754, "epoch": 4491} {"train_loss": -25.785303115844727, "global_step": 372755, "epoch": 4491} {"train_loss": -25.43069839477539, "global_step": 372756, "epoch": 4491} {"train_loss": -25.18475341796875, "global_step": 372757, "epoch": 4491} {"train_loss": -25.85627555847168, "global_step": 372758, "epoch": 4491} {"train_loss": -26.428579330444336, "global_step": 372759, "epoch": 4491} {"train_loss": -25.697498321533203, "global_step": 372760, "epoch": 4491} {"train_loss": -26.118627548217773, "global_step": 372761, "epoch": 4491} {"train_loss": -26.25619888305664, "global_step": 372762, "epoch": 4491} {"train_loss": -26.095111846923828, "global_step": 372763, "epoch": 4491} {"train_loss": -26.29446792602539, "global_step": 372764, "epoch": 4491} {"train_loss": -26.244094848632812, "global_step": 372765, "epoch": 4491} {"train_loss": -26.180212020874023, "global_step": 372766, "epoch": 4491} {"train_loss": -25.95322036743164, "global_step": 372767, "epoch": 4491} {"train_loss": -26.05668067932129, "global_step": 372768, "epoch": 4491} {"train_loss": -26.14710807800293, "global_step": 372769, "epoch": 4491} {"train_loss": -25.8614559173584, "global_step": 372770, "epoch": 4491} {"train_loss": -26.21282386779785, "global_step": 372771, "epoch": 4491} {"train_loss": -26.2305908203125, "global_step": 372772, "epoch": 4491} {"train_loss": -26.159753799438477, "global_step": 372773, "epoch": 4491} {"train_loss": -26.021392822265625, "global_step": 372774, "epoch": 4491} {"train_loss": -26.041065216064453, "global_step": 372775, "epoch": 4491} {"train_loss": -26.345014572143555, "global_step": 372776, "epoch": 4491} {"train_loss": -26.094701766967773, "global_step": 372777, "epoch": 4491} {"train_loss": -26.494909286499023, "global_step": 372778, "epoch": 4491} {"train_loss": -26.361921310424805, "global_step": 372779, "epoch": 4491} {"train_loss": -26.16973876953125, "global_step": 372780, "epoch": 4491} {"train_loss": -26.74484634399414, "global_step": 372781, "epoch": 4491} {"train_loss": -26.48090934753418, "global_step": 372782, "epoch": 4491} {"train_loss": -26.2076416015625, "global_step": 372783, "epoch": 4491} {"train_loss": -26.189807891845703, "global_step": 372784, "epoch": 4491} {"train_loss": -26.670806884765625, "global_step": 372785, "epoch": 4491} {"train_loss": -26.2435359954834, "global_step": 372786, "epoch": 4491} {"train_loss": -26.402240753173828, "global_step": 372787, "epoch": 4491} {"train_loss": -26.23636817932129, "global_step": 372788, "epoch": 4491} {"train_loss": -26.450031280517578, "global_step": 372789, "epoch": 4491} {"train_loss": -26.511127471923828, "global_step": 372790, "epoch": 4491} {"train_loss": -26.162870407104492, "global_step": 372791, "epoch": 4491} {"train_loss": -26.524524688720703, "global_step": 372792, "epoch": 4491} {"train_loss": -26.7762451171875, "global_step": 372793, "epoch": 4491} {"train_loss": -26.751501083374023, "global_step": 372794, "epoch": 4491} {"train_loss": -26.304340362548828, "global_step": 372795, "epoch": 4491} {"train_loss": -26.46302604675293, "global_step": 372796, "epoch": 4491} {"train_loss": -26.90897560119629, "global_step": 372797, "epoch": 4491} {"train_loss": -26.342248916625977, "global_step": 372798, "epoch": 4491} {"train_loss": -26.284887313842773, "global_step": 372799, "epoch": 4491} {"train_loss": -26.717727661132812, "global_step": 372800, "epoch": 4491} {"train_loss": -26.5775203704834, "global_step": 372801, "epoch": 4491} {"train_loss": -26.44475746154785, "global_step": 372802, "epoch": 4491} {"train_loss": -26.285261154174805, "global_step": 372803, "epoch": 4491} {"train_loss": -26.728849411010742, "global_step": 372804, "epoch": 4491} {"train_loss": -26.446659088134766, "global_step": 372805, "epoch": 4491} {"train_loss": -26.45413589477539, "global_step": 372806, "epoch": 4491} {"train_loss": -26.35943031311035, "global_step": 372807, "epoch": 4491} {"train_loss": -26.5695858001709, "global_step": 372808, "epoch": 4491} {"train_loss": -26.152774810791016, "global_step": 372809, "epoch": 4491} {"train_loss": -26.439990997314453, "global_step": 372810, "epoch": 4491} {"train_loss": -26.753738403320312, "global_step": 372811, "epoch": 4491} {"train_loss": -26.571949005126953, "global_step": 372812, "epoch": 4491} {"train_loss": -26.29571533203125, "global_step": 372813, "epoch": 4491} {"train_loss": -26.43123435974121, "global_step": 372814, "epoch": 4491} {"train_loss": -26.391345977783203, "global_step": 372815, "epoch": 4491} {"train_loss": -26.38150405883789, "global_step": 372816, "epoch": 4491} {"train_loss": -26.421194076538086, "global_step": 372817, "epoch": 4491} {"train_loss": -26.374439239501953, "global_step": 372818, "epoch": 4491} {"train_loss": -26.504505157470703, "global_step": 372819, "epoch": 4491} {"train_loss": -26.549285888671875, "global_step": 372820, "epoch": 4491} {"train_loss": -26.695974349975586, "global_step": 372821, "epoch": 4491} {"train_loss": -26.306915283203125, "global_step": 372822, "epoch": 4491} {"train_loss": -26.51422691345215, "global_step": 372823, "epoch": 4491} {"train_loss": -26.168628692626953, "global_step": 372824, "epoch": 4491} {"train_loss": -26.0815372467041, "global_step": 372825, "epoch": 4491} {"train_loss": -26.353490829467773, "global_step": 372826, "epoch": 4491} {"train_loss": -26.214502334594727, "global_step": 372827, "epoch": 4491} {"train_loss": -26.076345443725586, "global_step": 372828, "epoch": 4491} {"train_loss": -26.304706573486328, "global_step": 372829, "epoch": 4491} {"train_loss": -25.976470947265625, "global_step": 372830, "epoch": 4491} {"train_loss": -26.387176513671875, "global_step": 372831, "epoch": 4491} {"train_loss": -26.33534049987793, "global_step": 372832, "epoch": 4491} {"train_loss": -26.429107666015625, "global_step": 372833, "epoch": 4491} {"train_loss": -26.076025009155273, "global_step": 372834, "epoch": 4491} {"train_loss": -26.279075530638178, "global_step": 372835, "epoch": 4491, "val_loss": 6711952.0} {"train_loss": -25.889892578125, "global_step": 372836, "epoch": 4492} {"train_loss": -25.896814346313477, "global_step": 372837, "epoch": 4492} {"train_loss": -26.368133544921875, "global_step": 372838, "epoch": 4492} {"train_loss": -25.809240341186523, "global_step": 372839, "epoch": 4492} {"train_loss": -25.571325302124023, "global_step": 372840, "epoch": 4492} {"train_loss": -26.251495361328125, "global_step": 372841, "epoch": 4492} {"train_loss": -26.04218101501465, "global_step": 372842, "epoch": 4492} {"train_loss": -25.4617862701416, "global_step": 372843, "epoch": 4492} {"train_loss": -25.953784942626953, "global_step": 372844, "epoch": 4492} {"train_loss": -26.35623550415039, "global_step": 372845, "epoch": 4492} {"train_loss": -26.007455825805664, "global_step": 372846, "epoch": 4492} {"train_loss": -26.337207794189453, "global_step": 372847, "epoch": 4492} {"train_loss": -25.877893447875977, "global_step": 372848, "epoch": 4492} {"train_loss": -26.1058349609375, "global_step": 372849, "epoch": 4492} {"train_loss": -25.9403018951416, "global_step": 372850, "epoch": 4492} {"train_loss": -26.222858428955078, "global_step": 372851, "epoch": 4492} {"train_loss": -26.625951766967773, "global_step": 372852, "epoch": 4492} {"train_loss": -26.053054809570312, "global_step": 372853, "epoch": 4492} {"train_loss": -26.250965118408203, "global_step": 372854, "epoch": 4492} {"train_loss": -26.235870361328125, "global_step": 372855, "epoch": 4492} {"train_loss": -26.013381958007812, "global_step": 372856, "epoch": 4492} {"train_loss": -26.159351348876953, "global_step": 372857, "epoch": 4492} {"train_loss": -26.57013511657715, "global_step": 372858, "epoch": 4492} {"train_loss": -26.4088134765625, "global_step": 372859, "epoch": 4492} {"train_loss": -26.314355850219727, "global_step": 372860, "epoch": 4492} {"train_loss": -26.48394203186035, "global_step": 372861, "epoch": 4492} {"train_loss": -26.312042236328125, "global_step": 372862, "epoch": 4492} {"train_loss": -26.47381019592285, "global_step": 372863, "epoch": 4492} {"train_loss": -26.70155143737793, "global_step": 372864, "epoch": 4492} {"train_loss": -26.612812042236328, "global_step": 372865, "epoch": 4492} {"train_loss": -26.44366455078125, "global_step": 372866, "epoch": 4492} {"train_loss": -26.423551559448242, "global_step": 372867, "epoch": 4492} {"train_loss": -26.450971603393555, "global_step": 372868, "epoch": 4492} {"train_loss": -26.54862403869629, "global_step": 372869, "epoch": 4492} {"train_loss": -26.3689022064209, "global_step": 372870, "epoch": 4492} {"train_loss": -26.5599422454834, "global_step": 372871, "epoch": 4492} {"train_loss": -26.134519577026367, "global_step": 372872, "epoch": 4492} {"train_loss": -26.447265625, "global_step": 372873, "epoch": 4492} {"train_loss": -26.807758331298828, "global_step": 372874, "epoch": 4492} {"train_loss": -26.548694610595703, "global_step": 372875, "epoch": 4492} {"train_loss": -26.30927085876465, "global_step": 372876, "epoch": 4492} {"train_loss": -26.43817138671875, "global_step": 372877, "epoch": 4492} {"train_loss": -26.314289093017578, "global_step": 372878, "epoch": 4492} {"train_loss": -26.219924926757812, "global_step": 372879, "epoch": 4492} {"train_loss": -26.440872192382812, "global_step": 372880, "epoch": 4492} {"train_loss": -25.9259090423584, "global_step": 372881, "epoch": 4492} {"train_loss": -26.555627822875977, "global_step": 372882, "epoch": 4492} {"train_loss": -26.431598663330078, "global_step": 372883, "epoch": 4492} {"train_loss": -26.1151180267334, "global_step": 372884, "epoch": 4492} {"train_loss": -26.020919799804688, "global_step": 372885, "epoch": 4492} {"train_loss": -26.613147735595703, "global_step": 372886, "epoch": 4492} {"train_loss": -26.338226318359375, "global_step": 372887, "epoch": 4492} {"train_loss": -25.991256713867188, "global_step": 372888, "epoch": 4492} {"train_loss": -26.42500114440918, "global_step": 372889, "epoch": 4492} {"train_loss": -26.259565353393555, "global_step": 372890, "epoch": 4492} {"train_loss": -26.5693416595459, "global_step": 372891, "epoch": 4492} {"train_loss": -25.958826065063477, "global_step": 372892, "epoch": 4492} {"train_loss": -25.97307777404785, "global_step": 372893, "epoch": 4492} {"train_loss": -26.280908584594727, "global_step": 372894, "epoch": 4492} {"train_loss": -26.18120765686035, "global_step": 372895, "epoch": 4492} {"train_loss": -26.652929306030273, "global_step": 372896, "epoch": 4492} {"train_loss": -26.150232315063477, "global_step": 372897, "epoch": 4492} {"train_loss": -26.322763442993164, "global_step": 372898, "epoch": 4492} {"train_loss": -26.181116104125977, "global_step": 372899, "epoch": 4492} {"train_loss": -26.036197662353516, "global_step": 372900, "epoch": 4492} {"train_loss": -26.566848754882812, "global_step": 372901, "epoch": 4492} {"train_loss": -26.615198135375977, "global_step": 372902, "epoch": 4492} {"train_loss": -26.053638458251953, "global_step": 372903, "epoch": 4492} {"train_loss": -26.393787384033203, "global_step": 372904, "epoch": 4492} {"train_loss": -26.388782501220703, "global_step": 372905, "epoch": 4492} {"train_loss": -26.110876083374023, "global_step": 372906, "epoch": 4492} {"train_loss": -26.201120376586914, "global_step": 372907, "epoch": 4492} {"train_loss": -26.434560775756836, "global_step": 372908, "epoch": 4492} {"train_loss": -26.225011825561523, "global_step": 372909, "epoch": 4492} {"train_loss": -26.37308692932129, "global_step": 372910, "epoch": 4492} {"train_loss": -26.595569610595703, "global_step": 372911, "epoch": 4492} {"train_loss": -26.232025146484375, "global_step": 372912, "epoch": 4492} {"train_loss": -26.364181518554688, "global_step": 372913, "epoch": 4492} {"train_loss": -26.204519271850586, "global_step": 372914, "epoch": 4492} {"train_loss": -26.338369369506836, "global_step": 372915, "epoch": 4492} {"train_loss": -26.309036254882812, "global_step": 372916, "epoch": 4492} {"train_loss": -26.455358505249023, "global_step": 372917, "epoch": 4492} {"train_loss": -26.266151152461408, "global_step": 372918, "epoch": 4492, "val_loss": 6622904.0} {"train_loss": -26.09745216369629, "global_step": 372919, "epoch": 4493} {"train_loss": -25.68475914001465, "global_step": 372920, "epoch": 4493} {"train_loss": -26.038583755493164, "global_step": 372921, "epoch": 4493} {"train_loss": -25.942773818969727, "global_step": 372922, "epoch": 4493} {"train_loss": -26.155908584594727, "global_step": 372923, "epoch": 4493} {"train_loss": -26.096012115478516, "global_step": 372924, "epoch": 4493} {"train_loss": -26.2406005859375, "global_step": 372925, "epoch": 4493} {"train_loss": -26.292072296142578, "global_step": 372926, "epoch": 4493} {"train_loss": -25.753280639648438, "global_step": 372927, "epoch": 4493} {"train_loss": -25.976919174194336, "global_step": 372928, "epoch": 4493} {"train_loss": -25.93072509765625, "global_step": 372929, "epoch": 4493} {"train_loss": -25.98615074157715, "global_step": 372930, "epoch": 4493} {"train_loss": -26.128143310546875, "global_step": 372931, "epoch": 4493} {"train_loss": -26.356115341186523, "global_step": 372932, "epoch": 4493} {"train_loss": -26.393157958984375, "global_step": 372933, "epoch": 4493} {"train_loss": -26.13368034362793, "global_step": 372934, "epoch": 4493} {"train_loss": -26.382104873657227, "global_step": 372935, "epoch": 4493} {"train_loss": -26.513608932495117, "global_step": 372936, "epoch": 4493} {"train_loss": -26.548675537109375, "global_step": 372937, "epoch": 4493} {"train_loss": -26.544788360595703, "global_step": 372938, "epoch": 4493} {"train_loss": -26.410125732421875, "global_step": 372939, "epoch": 4493} {"train_loss": -26.22285270690918, "global_step": 372940, "epoch": 4493} {"train_loss": -26.141996383666992, "global_step": 372941, "epoch": 4493} {"train_loss": -26.649036407470703, "global_step": 372942, "epoch": 4493} {"train_loss": -26.516332626342773, "global_step": 372943, "epoch": 4493} {"train_loss": -26.24169921875, "global_step": 372944, "epoch": 4493} {"train_loss": -26.89861488342285, "global_step": 372945, "epoch": 4493} {"train_loss": -26.324132919311523, "global_step": 372946, "epoch": 4493} {"train_loss": -26.315942764282227, "global_step": 372947, "epoch": 4493} {"train_loss": -26.12763786315918, "global_step": 372948, "epoch": 4493} {"train_loss": -26.444921493530273, "global_step": 372949, "epoch": 4493} {"train_loss": -26.46596336364746, "global_step": 372950, "epoch": 4493} {"train_loss": -26.5505428314209, "global_step": 372951, "epoch": 4493} {"train_loss": -26.477705001831055, "global_step": 372952, "epoch": 4493} {"train_loss": -26.44229507446289, "global_step": 372953, "epoch": 4493} {"train_loss": -26.3878231048584, "global_step": 372954, "epoch": 4493} {"train_loss": -26.497838973999023, "global_step": 372955, "epoch": 4493} {"train_loss": -26.715015411376953, "global_step": 372956, "epoch": 4493} {"train_loss": -26.42779541015625, "global_step": 372957, "epoch": 4493} {"train_loss": -26.625659942626953, "global_step": 372958, "epoch": 4493} {"train_loss": -26.569137573242188, "global_step": 372959, "epoch": 4493} {"train_loss": -26.719074249267578, "global_step": 372960, "epoch": 4493} {"train_loss": -26.839441299438477, "global_step": 372961, "epoch": 4493} {"train_loss": -26.927188873291016, "global_step": 372962, "epoch": 4493} {"train_loss": -26.32832145690918, "global_step": 372963, "epoch": 4493} {"train_loss": -26.389272689819336, "global_step": 372964, "epoch": 4493} {"train_loss": -26.534576416015625, "global_step": 372965, "epoch": 4493} {"train_loss": -26.093536376953125, "global_step": 372966, "epoch": 4493} {"train_loss": -26.155506134033203, "global_step": 372967, "epoch": 4493} {"train_loss": -26.106266021728516, "global_step": 372968, "epoch": 4493} {"train_loss": -26.755945205688477, "global_step": 372969, "epoch": 4493} {"train_loss": -26.54638671875, "global_step": 372970, "epoch": 4493} {"train_loss": -26.906848907470703, "global_step": 372971, "epoch": 4493} {"train_loss": -26.735675811767578, "global_step": 372972, "epoch": 4493} {"train_loss": -26.39381217956543, "global_step": 372973, "epoch": 4493} {"train_loss": -26.71563720703125, "global_step": 372974, "epoch": 4493} {"train_loss": -26.951208114624023, "global_step": 372975, "epoch": 4493} {"train_loss": -26.4934024810791, "global_step": 372976, "epoch": 4493} {"train_loss": -26.690235137939453, "global_step": 372977, "epoch": 4493} {"train_loss": -26.740558624267578, "global_step": 372978, "epoch": 4493} {"train_loss": -26.210342407226562, "global_step": 372979, "epoch": 4493} {"train_loss": -26.05911636352539, "global_step": 372980, "epoch": 4493} {"train_loss": -24.923236846923828, "global_step": 372981, "epoch": 4493} {"train_loss": -24.754962921142578, "global_step": 372982, "epoch": 4493} {"train_loss": -25.23480224609375, "global_step": 372983, "epoch": 4493} {"train_loss": -25.834430694580078, "global_step": 372984, "epoch": 4493} {"train_loss": -25.961872100830078, "global_step": 372985, "epoch": 4493} {"train_loss": -25.741046905517578, "global_step": 372986, "epoch": 4493} {"train_loss": -26.271503448486328, "global_step": 372987, "epoch": 4493} {"train_loss": -25.630054473876953, "global_step": 372988, "epoch": 4493} {"train_loss": -25.877460479736328, "global_step": 372989, "epoch": 4493} {"train_loss": -26.564620971679688, "global_step": 372990, "epoch": 4493} {"train_loss": -25.461801528930664, "global_step": 372991, "epoch": 4493} {"train_loss": -26.192068099975586, "global_step": 372992, "epoch": 4493} {"train_loss": -25.884016036987305, "global_step": 372993, "epoch": 4493} {"train_loss": -25.93354606628418, "global_step": 372994, "epoch": 4493} {"train_loss": -26.13176918029785, "global_step": 372995, "epoch": 4493} {"train_loss": -26.026342391967773, "global_step": 372996, "epoch": 4493} {"train_loss": -25.9375057220459, "global_step": 372997, "epoch": 4493} {"train_loss": -25.82820701599121, "global_step": 372998, "epoch": 4493} {"train_loss": -25.814685821533203, "global_step": 372999, "epoch": 4493} {"train_loss": -26.175947189331055, "global_step": 373000, "epoch": 4493} {"train_loss": -26.25346330849521, "global_step": 373001, "epoch": 4493, "val_loss": 6554986.5} {"train_loss": -25.40020751953125, "global_step": 373002, "epoch": 4494} {"train_loss": -25.718164443969727, "global_step": 373003, "epoch": 4494} {"train_loss": -25.545028686523438, "global_step": 373004, "epoch": 4494} {"train_loss": -25.659809112548828, "global_step": 373005, "epoch": 4494} {"train_loss": -25.92365837097168, "global_step": 373006, "epoch": 4494} {"train_loss": -25.99024772644043, "global_step": 373007, "epoch": 4494} {"train_loss": -26.0226993560791, "global_step": 373008, "epoch": 4494} {"train_loss": -26.223770141601562, "global_step": 373009, "epoch": 4494} {"train_loss": -26.314916610717773, "global_step": 373010, "epoch": 4494} {"train_loss": -25.9429931640625, "global_step": 373011, "epoch": 4494} {"train_loss": -26.645904541015625, "global_step": 373012, "epoch": 4494} {"train_loss": -26.124982833862305, "global_step": 373013, "epoch": 4494} {"train_loss": -26.1702823638916, "global_step": 373014, "epoch": 4494} {"train_loss": -26.094785690307617, "global_step": 373015, "epoch": 4494} {"train_loss": -26.482574462890625, "global_step": 373016, "epoch": 4494} {"train_loss": -26.163114547729492, "global_step": 373017, "epoch": 4494} {"train_loss": -26.162128448486328, "global_step": 373018, "epoch": 4494} {"train_loss": -26.356739044189453, "global_step": 373019, "epoch": 4494} {"train_loss": -26.40143394470215, "global_step": 373020, "epoch": 4494} {"train_loss": -26.132177352905273, "global_step": 373021, "epoch": 4494} {"train_loss": -26.3424129486084, "global_step": 373022, "epoch": 4494} {"train_loss": -26.45454216003418, "global_step": 373023, "epoch": 4494} {"train_loss": -26.47138786315918, "global_step": 373024, "epoch": 4494} {"train_loss": -26.20867919921875, "global_step": 373025, "epoch": 4494} {"train_loss": -26.147165298461914, "global_step": 373026, "epoch": 4494} {"train_loss": -25.997114181518555, "global_step": 373027, "epoch": 4494} {"train_loss": -26.45917320251465, "global_step": 373028, "epoch": 4494} {"train_loss": -26.084522247314453, "global_step": 373029, "epoch": 4494} {"train_loss": -26.438709259033203, "global_step": 373030, "epoch": 4494} {"train_loss": -26.380598068237305, "global_step": 373031, "epoch": 4494} {"train_loss": -26.51436424255371, "global_step": 373032, "epoch": 4494} {"train_loss": -26.279022216796875, "global_step": 373033, "epoch": 4494} {"train_loss": -26.27678871154785, "global_step": 373034, "epoch": 4494} {"train_loss": -26.49091911315918, "global_step": 373035, "epoch": 4494} {"train_loss": -26.5601749420166, "global_step": 373036, "epoch": 4494} {"train_loss": -26.498615264892578, "global_step": 373037, "epoch": 4494} {"train_loss": -26.477828979492188, "global_step": 373038, "epoch": 4494} {"train_loss": -26.56622886657715, "global_step": 373039, "epoch": 4494} {"train_loss": -26.722381591796875, "global_step": 373040, "epoch": 4494} {"train_loss": -26.655582427978516, "global_step": 373041, "epoch": 4494} {"train_loss": -26.474288940429688, "global_step": 373042, "epoch": 4494} {"train_loss": -26.25018882751465, "global_step": 373043, "epoch": 4494} {"train_loss": -26.582977294921875, "global_step": 373044, "epoch": 4494} {"train_loss": -26.70782470703125, "global_step": 373045, "epoch": 4494} {"train_loss": -26.443822860717773, "global_step": 373046, "epoch": 4494} {"train_loss": -26.753864288330078, "global_step": 373047, "epoch": 4494} {"train_loss": -26.56373405456543, "global_step": 373048, "epoch": 4494} {"train_loss": -26.349767684936523, "global_step": 373049, "epoch": 4494} {"train_loss": -26.330280303955078, "global_step": 373050, "epoch": 4494} {"train_loss": -25.984745025634766, "global_step": 373051, "epoch": 4494} {"train_loss": -26.473556518554688, "global_step": 373052, "epoch": 4494} {"train_loss": -26.369592666625977, "global_step": 373053, "epoch": 4494} {"train_loss": -26.157012939453125, "global_step": 373054, "epoch": 4494} {"train_loss": -26.38580322265625, "global_step": 373055, "epoch": 4494} {"train_loss": -26.425710678100586, "global_step": 373056, "epoch": 4494} {"train_loss": -25.98060417175293, "global_step": 373057, "epoch": 4494} {"train_loss": -26.5198974609375, "global_step": 373058, "epoch": 4494} {"train_loss": -26.35297966003418, "global_step": 373059, "epoch": 4494} {"train_loss": -26.572906494140625, "global_step": 373060, "epoch": 4494} {"train_loss": -26.00278091430664, "global_step": 373061, "epoch": 4494} {"train_loss": -25.862409591674805, "global_step": 373062, "epoch": 4494} {"train_loss": -26.296222686767578, "global_step": 373063, "epoch": 4494} {"train_loss": -26.53139305114746, "global_step": 373064, "epoch": 4494} {"train_loss": -26.12648582458496, "global_step": 373065, "epoch": 4494} {"train_loss": -26.424158096313477, "global_step": 373066, "epoch": 4494} {"train_loss": -26.579320907592773, "global_step": 373067, "epoch": 4494} {"train_loss": -26.250165939331055, "global_step": 373068, "epoch": 4494} {"train_loss": -26.284027099609375, "global_step": 373069, "epoch": 4494} {"train_loss": -26.257944107055664, "global_step": 373070, "epoch": 4494} {"train_loss": -26.24810218811035, "global_step": 373071, "epoch": 4494} {"train_loss": -26.208267211914062, "global_step": 373072, "epoch": 4494} {"train_loss": -26.45612907409668, "global_step": 373073, "epoch": 4494} {"train_loss": -25.84708023071289, "global_step": 373074, "epoch": 4494} {"train_loss": -26.387399673461914, "global_step": 373075, "epoch": 4494} {"train_loss": -26.22748374938965, "global_step": 373076, "epoch": 4494} {"train_loss": -26.195520401000977, "global_step": 373077, "epoch": 4494} {"train_loss": -26.5607852935791, "global_step": 373078, "epoch": 4494} {"train_loss": -26.45314598083496, "global_step": 373079, "epoch": 4494} {"train_loss": -26.042652130126953, "global_step": 373080, "epoch": 4494} {"train_loss": -26.384815216064453, "global_step": 373081, "epoch": 4494} {"train_loss": -26.492385864257812, "global_step": 373082, "epoch": 4494} {"train_loss": -26.296340942382812, "global_step": 373083, "epoch": 4494} {"train_loss": -26.277417745934912, "global_step": 373084, "epoch": 4494, "val_loss": 6566951.0} {"train_loss": -25.698612213134766, "global_step": 373085, "epoch": 4495} {"train_loss": -25.35774803161621, "global_step": 373086, "epoch": 4495} {"train_loss": -26.01173210144043, "global_step": 373087, "epoch": 4495} {"train_loss": -25.627729415893555, "global_step": 373088, "epoch": 4495} {"train_loss": -25.762989044189453, "global_step": 373089, "epoch": 4495} {"train_loss": -26.130590438842773, "global_step": 373090, "epoch": 4495} {"train_loss": -25.9242000579834, "global_step": 373091, "epoch": 4495} {"train_loss": -26.020109176635742, "global_step": 373092, "epoch": 4495} {"train_loss": -25.617380142211914, "global_step": 373093, "epoch": 4495} {"train_loss": -25.85431480407715, "global_step": 373094, "epoch": 4495} {"train_loss": -26.324996948242188, "global_step": 373095, "epoch": 4495} {"train_loss": -25.613561630249023, "global_step": 373096, "epoch": 4495} {"train_loss": -26.302825927734375, "global_step": 373097, "epoch": 4495} {"train_loss": -26.138172149658203, "global_step": 373098, "epoch": 4495} {"train_loss": -26.18256950378418, "global_step": 373099, "epoch": 4495} {"train_loss": -26.226322174072266, "global_step": 373100, "epoch": 4495} {"train_loss": -26.4539737701416, "global_step": 373101, "epoch": 4495} {"train_loss": -26.386627197265625, "global_step": 373102, "epoch": 4495} {"train_loss": -26.39084243774414, "global_step": 373103, "epoch": 4495} {"train_loss": -26.053943634033203, "global_step": 373104, "epoch": 4495} {"train_loss": -26.464887619018555, "global_step": 373105, "epoch": 4495} {"train_loss": -26.16053581237793, "global_step": 373106, "epoch": 4495} {"train_loss": -26.483434677124023, "global_step": 373107, "epoch": 4495} {"train_loss": -26.22528076171875, "global_step": 373108, "epoch": 4495} {"train_loss": -26.24470329284668, "global_step": 373109, "epoch": 4495} {"train_loss": -26.297021865844727, "global_step": 373110, "epoch": 4495} {"train_loss": -26.6868953704834, "global_step": 373111, "epoch": 4495} {"train_loss": -26.241546630859375, "global_step": 373112, "epoch": 4495} {"train_loss": -26.116668701171875, "global_step": 373113, "epoch": 4495} {"train_loss": -26.027973175048828, "global_step": 373114, "epoch": 4495} {"train_loss": -26.834918975830078, "global_step": 373115, "epoch": 4495} {"train_loss": -26.72542381286621, "global_step": 373116, "epoch": 4495} {"train_loss": -26.491165161132812, "global_step": 373117, "epoch": 4495} {"train_loss": -26.259241104125977, "global_step": 373118, "epoch": 4495} {"train_loss": -26.210968017578125, "global_step": 373119, "epoch": 4495} {"train_loss": -26.241918563842773, "global_step": 373120, "epoch": 4495} {"train_loss": -26.55707359313965, "global_step": 373121, "epoch": 4495} {"train_loss": -26.663705825805664, "global_step": 373122, "epoch": 4495} {"train_loss": -26.4434814453125, "global_step": 373123, "epoch": 4495} {"train_loss": -26.2071475982666, "global_step": 373124, "epoch": 4495} {"train_loss": -26.684598922729492, "global_step": 373125, "epoch": 4495} {"train_loss": -26.2362117767334, "global_step": 373126, "epoch": 4495} {"train_loss": -26.55255126953125, "global_step": 373127, "epoch": 4495} {"train_loss": -26.22966957092285, "global_step": 373128, "epoch": 4495} {"train_loss": -26.4206600189209, "global_step": 373129, "epoch": 4495} {"train_loss": -26.377933502197266, "global_step": 373130, "epoch": 4495} {"train_loss": -26.13405418395996, "global_step": 373131, "epoch": 4495} {"train_loss": -26.3421630859375, "global_step": 373132, "epoch": 4495} {"train_loss": -26.382272720336914, "global_step": 373133, "epoch": 4495} {"train_loss": -26.820165634155273, "global_step": 373134, "epoch": 4495} {"train_loss": -26.405532836914062, "global_step": 373135, "epoch": 4495} {"train_loss": -26.214752197265625, "global_step": 373136, "epoch": 4495} {"train_loss": -26.36345863342285, "global_step": 373137, "epoch": 4495} {"train_loss": -26.346908569335938, "global_step": 373138, "epoch": 4495} {"train_loss": -26.73455810546875, "global_step": 373139, "epoch": 4495} {"train_loss": -26.74616813659668, "global_step": 373140, "epoch": 4495} {"train_loss": -26.632471084594727, "global_step": 373141, "epoch": 4495} {"train_loss": -26.120136260986328, "global_step": 373142, "epoch": 4495} {"train_loss": -26.681568145751953, "global_step": 373143, "epoch": 4495} {"train_loss": -26.748132705688477, "global_step": 373144, "epoch": 4495} {"train_loss": -26.361968994140625, "global_step": 373145, "epoch": 4495} {"train_loss": -26.638845443725586, "global_step": 373146, "epoch": 4495} {"train_loss": -26.4852352142334, "global_step": 373147, "epoch": 4495} {"train_loss": -26.779333114624023, "global_step": 373148, "epoch": 4495} {"train_loss": -26.434585571289062, "global_step": 373149, "epoch": 4495} {"train_loss": -26.555042266845703, "global_step": 373150, "epoch": 4495} {"train_loss": -26.521528244018555, "global_step": 373151, "epoch": 4495} {"train_loss": -26.36594009399414, "global_step": 373152, "epoch": 4495} {"train_loss": -26.50404930114746, "global_step": 373153, "epoch": 4495} {"train_loss": -26.471094131469727, "global_step": 373154, "epoch": 4495} {"train_loss": -26.1889705657959, "global_step": 373155, "epoch": 4495} {"train_loss": -26.324554443359375, "global_step": 373156, "epoch": 4495} {"train_loss": -26.468860626220703, "global_step": 373157, "epoch": 4495} {"train_loss": -26.10165786743164, "global_step": 373158, "epoch": 4495} {"train_loss": -26.403961181640625, "global_step": 373159, "epoch": 4495} {"train_loss": -26.77890396118164, "global_step": 373160, "epoch": 4495} {"train_loss": -26.59046745300293, "global_step": 373161, "epoch": 4495} {"train_loss": -26.326797485351562, "global_step": 373162, "epoch": 4495} {"train_loss": -26.456806182861328, "global_step": 373163, "epoch": 4495} {"train_loss": -26.33984375, "global_step": 373164, "epoch": 4495} {"train_loss": -26.475101470947266, "global_step": 373165, "epoch": 4495} {"train_loss": -26.162738800048828, "global_step": 373166, "epoch": 4495} {"train_loss": -26.335195656282355, "global_step": 373167, "epoch": 4495, "val_loss": 6791605.0} {"train_loss": -24.423276901245117, "global_step": 373168, "epoch": 4496} {"train_loss": -25.691205978393555, "global_step": 373169, "epoch": 4496} {"train_loss": -25.336469650268555, "global_step": 373170, "epoch": 4496} {"train_loss": -24.94028663635254, "global_step": 373171, "epoch": 4496} {"train_loss": -26.015729904174805, "global_step": 373172, "epoch": 4496} {"train_loss": -24.544940948486328, "global_step": 373173, "epoch": 4496} {"train_loss": -25.6975040435791, "global_step": 373174, "epoch": 4496} {"train_loss": -25.576990127563477, "global_step": 373175, "epoch": 4496} {"train_loss": -25.545211791992188, "global_step": 373176, "epoch": 4496} {"train_loss": -25.70562171936035, "global_step": 373177, "epoch": 4496} {"train_loss": -25.9064998626709, "global_step": 373178, "epoch": 4496} {"train_loss": -25.89322280883789, "global_step": 373179, "epoch": 4496} {"train_loss": -25.756439208984375, "global_step": 373180, "epoch": 4496} {"train_loss": -25.828641891479492, "global_step": 373181, "epoch": 4496} {"train_loss": -26.094480514526367, "global_step": 373182, "epoch": 4496} {"train_loss": -25.760944366455078, "global_step": 373183, "epoch": 4496} {"train_loss": -25.804075241088867, "global_step": 373184, "epoch": 4496} {"train_loss": -26.13703727722168, "global_step": 373185, "epoch": 4496} {"train_loss": -25.643396377563477, "global_step": 373186, "epoch": 4496} {"train_loss": -26.037551879882812, "global_step": 373187, "epoch": 4496} {"train_loss": -25.783573150634766, "global_step": 373188, "epoch": 4496} {"train_loss": -26.128225326538086, "global_step": 373189, "epoch": 4496} {"train_loss": -26.070526123046875, "global_step": 373190, "epoch": 4496} {"train_loss": -26.27520179748535, "global_step": 373191, "epoch": 4496} {"train_loss": -26.1092529296875, "global_step": 373192, "epoch": 4496} {"train_loss": -25.757780075073242, "global_step": 373193, "epoch": 4496} {"train_loss": -25.8951358795166, "global_step": 373194, "epoch": 4496} {"train_loss": -26.39851951599121, "global_step": 373195, "epoch": 4496} {"train_loss": -25.861862182617188, "global_step": 373196, "epoch": 4496} {"train_loss": -26.157602310180664, "global_step": 373197, "epoch": 4496} {"train_loss": -26.347076416015625, "global_step": 373198, "epoch": 4496} {"train_loss": -26.268808364868164, "global_step": 373199, "epoch": 4496} {"train_loss": -26.288480758666992, "global_step": 373200, "epoch": 4496} {"train_loss": -26.435962677001953, "global_step": 373201, "epoch": 4496} {"train_loss": -26.55063819885254, "global_step": 373202, "epoch": 4496} {"train_loss": -26.767627716064453, "global_step": 373203, "epoch": 4496} {"train_loss": -26.231658935546875, "global_step": 373204, "epoch": 4496} {"train_loss": -26.61553382873535, "global_step": 373205, "epoch": 4496} {"train_loss": -26.629718780517578, "global_step": 373206, "epoch": 4496} {"train_loss": -26.661828994750977, "global_step": 373207, "epoch": 4496} {"train_loss": -26.340896606445312, "global_step": 373208, "epoch": 4496} {"train_loss": -26.466140747070312, "global_step": 373209, "epoch": 4496} {"train_loss": -26.48211097717285, "global_step": 373210, "epoch": 4496} {"train_loss": -26.723468780517578, "global_step": 373211, "epoch": 4496} {"train_loss": -26.66745376586914, "global_step": 373212, "epoch": 4496} {"train_loss": -27.03828239440918, "global_step": 373213, "epoch": 4496} {"train_loss": -26.59357261657715, "global_step": 373214, "epoch": 4496} {"train_loss": -26.212690353393555, "global_step": 373215, "epoch": 4496} {"train_loss": -26.420917510986328, "global_step": 373216, "epoch": 4496} {"train_loss": -26.6416015625, "global_step": 373217, "epoch": 4496} {"train_loss": -26.183917999267578, "global_step": 373218, "epoch": 4496} {"train_loss": -26.206466674804688, "global_step": 373219, "epoch": 4496} {"train_loss": -26.110748291015625, "global_step": 373220, "epoch": 4496} {"train_loss": -26.52386474609375, "global_step": 373221, "epoch": 4496} {"train_loss": -26.12798500061035, "global_step": 373222, "epoch": 4496} {"train_loss": -26.207141876220703, "global_step": 373223, "epoch": 4496} {"train_loss": -26.38185691833496, "global_step": 373224, "epoch": 4496} {"train_loss": -26.25397300720215, "global_step": 373225, "epoch": 4496} {"train_loss": -26.149341583251953, "global_step": 373226, "epoch": 4496} {"train_loss": -26.709753036499023, "global_step": 373227, "epoch": 4496} {"train_loss": -26.42384147644043, "global_step": 373228, "epoch": 4496} {"train_loss": -26.648529052734375, "global_step": 373229, "epoch": 4496} {"train_loss": -26.57050895690918, "global_step": 373230, "epoch": 4496} {"train_loss": -26.424978256225586, "global_step": 373231, "epoch": 4496} {"train_loss": -26.25189208984375, "global_step": 373232, "epoch": 4496} {"train_loss": -26.038476943969727, "global_step": 373233, "epoch": 4496} {"train_loss": -26.344507217407227, "global_step": 373234, "epoch": 4496} {"train_loss": -26.217992782592773, "global_step": 373235, "epoch": 4496} {"train_loss": -26.619367599487305, "global_step": 373236, "epoch": 4496} {"train_loss": -26.142852783203125, "global_step": 373237, "epoch": 4496} {"train_loss": -26.409814834594727, "global_step": 373238, "epoch": 4496} {"train_loss": -25.970184326171875, "global_step": 373239, "epoch": 4496} {"train_loss": -26.2607479095459, "global_step": 373240, "epoch": 4496} {"train_loss": -26.458200454711914, "global_step": 373241, "epoch": 4496} {"train_loss": -26.23087501525879, "global_step": 373242, "epoch": 4496} {"train_loss": -26.3850040435791, "global_step": 373243, "epoch": 4496} {"train_loss": -25.999774932861328, "global_step": 373244, "epoch": 4496} {"train_loss": -26.160953521728516, "global_step": 373245, "epoch": 4496} {"train_loss": -26.683719635009766, "global_step": 373246, "epoch": 4496} {"train_loss": -25.994781494140625, "global_step": 373247, "epoch": 4496} {"train_loss": -26.259626388549805, "global_step": 373248, "epoch": 4496} {"train_loss": -26.310199737548828, "global_step": 373249, "epoch": 4496} {"train_loss": -26.155052874461713, "global_step": 373250, "epoch": 4496, "val_loss": 6567579.0} {"train_loss": -25.129558563232422, "global_step": 373251, "epoch": 4497} {"train_loss": -25.867919921875, "global_step": 373252, "epoch": 4497} {"train_loss": -25.833465576171875, "global_step": 373253, "epoch": 4497} {"train_loss": -25.25214195251465, "global_step": 373254, "epoch": 4497} {"train_loss": -25.60093116760254, "global_step": 373255, "epoch": 4497} {"train_loss": -26.030492782592773, "global_step": 373256, "epoch": 4497} {"train_loss": -25.2480525970459, "global_step": 373257, "epoch": 4497} {"train_loss": -25.800718307495117, "global_step": 373258, "epoch": 4497} {"train_loss": -25.714353561401367, "global_step": 373259, "epoch": 4497} {"train_loss": -25.909635543823242, "global_step": 373260, "epoch": 4497} {"train_loss": -26.113386154174805, "global_step": 373261, "epoch": 4497} {"train_loss": -25.72638511657715, "global_step": 373262, "epoch": 4497} {"train_loss": -25.825504302978516, "global_step": 373263, "epoch": 4497} {"train_loss": -25.942188262939453, "global_step": 373264, "epoch": 4497} {"train_loss": -26.0844669342041, "global_step": 373265, "epoch": 4497} {"train_loss": -25.919111251831055, "global_step": 373266, "epoch": 4497} {"train_loss": -26.286426544189453, "global_step": 373267, "epoch": 4497} {"train_loss": -26.14533805847168, "global_step": 373268, "epoch": 4497} {"train_loss": -26.399011611938477, "global_step": 373269, "epoch": 4497} {"train_loss": -26.305212020874023, "global_step": 373270, "epoch": 4497} {"train_loss": -26.10906982421875, "global_step": 373271, "epoch": 4497} {"train_loss": -25.958560943603516, "global_step": 373272, "epoch": 4497} {"train_loss": -26.357892990112305, "global_step": 373273, "epoch": 4497} {"train_loss": -26.172826766967773, "global_step": 373274, "epoch": 4497} {"train_loss": -26.189258575439453, "global_step": 373275, "epoch": 4497} {"train_loss": -25.941761016845703, "global_step": 373276, "epoch": 4497} {"train_loss": -26.252527236938477, "global_step": 373277, "epoch": 4497} {"train_loss": -26.285125732421875, "global_step": 373278, "epoch": 4497} {"train_loss": -26.54815673828125, "global_step": 373279, "epoch": 4497} {"train_loss": -26.46489906311035, "global_step": 373280, "epoch": 4497} {"train_loss": -25.96331214904785, "global_step": 373281, "epoch": 4497} {"train_loss": -26.748031616210938, "global_step": 373282, "epoch": 4497} {"train_loss": -26.279315948486328, "global_step": 373283, "epoch": 4497} {"train_loss": -26.388187408447266, "global_step": 373284, "epoch": 4497} {"train_loss": -26.727996826171875, "global_step": 373285, "epoch": 4497} {"train_loss": -26.3980712890625, "global_step": 373286, "epoch": 4497} {"train_loss": -26.415693283081055, "global_step": 373287, "epoch": 4497} {"train_loss": -26.11921501159668, "global_step": 373288, "epoch": 4497} {"train_loss": -25.983078002929688, "global_step": 373289, "epoch": 4497} {"train_loss": -26.26227378845215, "global_step": 373290, "epoch": 4497} {"train_loss": -26.250940322875977, "global_step": 373291, "epoch": 4497} {"train_loss": -26.330947875976562, "global_step": 373292, "epoch": 4497} {"train_loss": -26.636701583862305, "global_step": 373293, "epoch": 4497} {"train_loss": -26.74349021911621, "global_step": 373294, "epoch": 4497} {"train_loss": -26.582441329956055, "global_step": 373295, "epoch": 4497} {"train_loss": -26.662494659423828, "global_step": 373296, "epoch": 4497} {"train_loss": -26.293354034423828, "global_step": 373297, "epoch": 4497} {"train_loss": -26.184986114501953, "global_step": 373298, "epoch": 4497} {"train_loss": -26.41916275024414, "global_step": 373299, "epoch": 4497} {"train_loss": -26.635650634765625, "global_step": 373300, "epoch": 4497} {"train_loss": -26.762088775634766, "global_step": 373301, "epoch": 4497} {"train_loss": -26.8790340423584, "global_step": 373302, "epoch": 4497} {"train_loss": -26.509902954101562, "global_step": 373303, "epoch": 4497} {"train_loss": -26.55401039123535, "global_step": 373304, "epoch": 4497} {"train_loss": -26.40838623046875, "global_step": 373305, "epoch": 4497} {"train_loss": -25.863910675048828, "global_step": 373306, "epoch": 4497} {"train_loss": -25.195798873901367, "global_step": 373307, "epoch": 4497} {"train_loss": -24.718168258666992, "global_step": 373308, "epoch": 4497} {"train_loss": -25.271015167236328, "global_step": 373309, "epoch": 4497} {"train_loss": -26.273605346679688, "global_step": 373310, "epoch": 4497} {"train_loss": -26.03643798828125, "global_step": 373311, "epoch": 4497} {"train_loss": -26.000410079956055, "global_step": 373312, "epoch": 4497} {"train_loss": -26.088348388671875, "global_step": 373313, "epoch": 4497} {"train_loss": -26.02535057067871, "global_step": 373314, "epoch": 4497} {"train_loss": -25.932025909423828, "global_step": 373315, "epoch": 4497} {"train_loss": -26.196557998657227, "global_step": 373316, "epoch": 4497} {"train_loss": -25.850677490234375, "global_step": 373317, "epoch": 4497} {"train_loss": -26.042871475219727, "global_step": 373318, "epoch": 4497} {"train_loss": -25.87908935546875, "global_step": 373319, "epoch": 4497} {"train_loss": -26.353485107421875, "global_step": 373320, "epoch": 4497} {"train_loss": -25.865859985351562, "global_step": 373321, "epoch": 4497} {"train_loss": -26.080062866210938, "global_step": 373322, "epoch": 4497} {"train_loss": -26.132596969604492, "global_step": 373323, "epoch": 4497} {"train_loss": -26.34486961364746, "global_step": 373324, "epoch": 4497} {"train_loss": -26.257831573486328, "global_step": 373325, "epoch": 4497} {"train_loss": -25.922138214111328, "global_step": 373326, "epoch": 4497} {"train_loss": -25.907459259033203, "global_step": 373327, "epoch": 4497} {"train_loss": -26.666357040405273, "global_step": 373328, "epoch": 4497} {"train_loss": -26.557214736938477, "global_step": 373329, "epoch": 4497} {"train_loss": -26.727584838867188, "global_step": 373330, "epoch": 4497} {"train_loss": -26.2689208984375, "global_step": 373331, "epoch": 4497} {"train_loss": -26.13364601135254, "global_step": 373332, "epoch": 4497} {"train_loss": -26.130910298910486, "global_step": 373333, "epoch": 4497, "val_loss": 6597829.5} {"train_loss": -26.27540397644043, "global_step": 373334, "epoch": 4498} {"train_loss": -26.437225341796875, "global_step": 373335, "epoch": 4498} {"train_loss": -26.152616500854492, "global_step": 373336, "epoch": 4498} {"train_loss": -26.056095123291016, "global_step": 373337, "epoch": 4498} {"train_loss": -26.243555068969727, "global_step": 373338, "epoch": 4498} {"train_loss": -26.26918601989746, "global_step": 373339, "epoch": 4498} {"train_loss": -25.996524810791016, "global_step": 373340, "epoch": 4498} {"train_loss": -26.148305892944336, "global_step": 373341, "epoch": 4498} {"train_loss": -26.464141845703125, "global_step": 373342, "epoch": 4498} {"train_loss": -26.08890724182129, "global_step": 373343, "epoch": 4498} {"train_loss": -26.518503189086914, "global_step": 373344, "epoch": 4498} {"train_loss": -26.53228187561035, "global_step": 373345, "epoch": 4498} {"train_loss": -26.37558937072754, "global_step": 373346, "epoch": 4498} {"train_loss": -26.659259796142578, "global_step": 373347, "epoch": 4498} {"train_loss": -26.40927505493164, "global_step": 373348, "epoch": 4498} {"train_loss": -26.32191276550293, "global_step": 373349, "epoch": 4498} {"train_loss": -26.30071449279785, "global_step": 373350, "epoch": 4498} {"train_loss": -26.560815811157227, "global_step": 373351, "epoch": 4498} {"train_loss": -26.230131149291992, "global_step": 373352, "epoch": 4498} {"train_loss": -26.739370346069336, "global_step": 373353, "epoch": 4498} {"train_loss": -26.486387252807617, "global_step": 373354, "epoch": 4498} {"train_loss": -26.2843074798584, "global_step": 373355, "epoch": 4498} {"train_loss": -26.56036949157715, "global_step": 373356, "epoch": 4498} {"train_loss": -26.368505477905273, "global_step": 373357, "epoch": 4498} {"train_loss": -26.515249252319336, "global_step": 373358, "epoch": 4498} {"train_loss": -26.696002960205078, "global_step": 373359, "epoch": 4498} {"train_loss": -26.316696166992188, "global_step": 373360, "epoch": 4498} {"train_loss": -26.649490356445312, "global_step": 373361, "epoch": 4498} {"train_loss": -26.36408805847168, "global_step": 373362, "epoch": 4498} {"train_loss": -26.402109146118164, "global_step": 373363, "epoch": 4498} {"train_loss": -26.130619049072266, "global_step": 373364, "epoch": 4498} {"train_loss": -26.464948654174805, "global_step": 373365, "epoch": 4498} {"train_loss": -26.599348068237305, "global_step": 373366, "epoch": 4498} {"train_loss": -26.55155372619629, "global_step": 373367, "epoch": 4498} {"train_loss": -26.668806076049805, "global_step": 373368, "epoch": 4498} {"train_loss": -26.18910026550293, "global_step": 373369, "epoch": 4498} {"train_loss": -26.602087020874023, "global_step": 373370, "epoch": 4498} {"train_loss": -26.502405166625977, "global_step": 373371, "epoch": 4498} {"train_loss": -26.58649253845215, "global_step": 373372, "epoch": 4498} {"train_loss": -26.543624877929688, "global_step": 373373, "epoch": 4498} {"train_loss": -26.269392013549805, "global_step": 373374, "epoch": 4498} {"train_loss": -26.17146873474121, "global_step": 373375, "epoch": 4498} {"train_loss": -26.149221420288086, "global_step": 373376, "epoch": 4498} {"train_loss": -25.703598022460938, "global_step": 373377, "epoch": 4498} {"train_loss": -25.600645065307617, "global_step": 373378, "epoch": 4498} {"train_loss": -26.772735595703125, "global_step": 373379, "epoch": 4498} {"train_loss": -26.236907958984375, "global_step": 373380, "epoch": 4498} {"train_loss": -25.724334716796875, "global_step": 373381, "epoch": 4498} {"train_loss": -26.265979766845703, "global_step": 373382, "epoch": 4498} {"train_loss": -25.785261154174805, "global_step": 373383, "epoch": 4498} {"train_loss": -25.875442504882812, "global_step": 373384, "epoch": 4498} {"train_loss": -26.07258415222168, "global_step": 373385, "epoch": 4498} {"train_loss": -26.04916763305664, "global_step": 373386, "epoch": 4498} {"train_loss": -26.171125411987305, "global_step": 373387, "epoch": 4498} {"train_loss": -25.851064682006836, "global_step": 373388, "epoch": 4498} {"train_loss": -26.222370147705078, "global_step": 373389, "epoch": 4498} {"train_loss": -26.076831817626953, "global_step": 373390, "epoch": 4498} {"train_loss": -26.147871017456055, "global_step": 373391, "epoch": 4498} {"train_loss": -26.13037109375, "global_step": 373392, "epoch": 4498} {"train_loss": -26.522418975830078, "global_step": 373393, "epoch": 4498} {"train_loss": -26.06131935119629, "global_step": 373394, "epoch": 4498} {"train_loss": -26.303125381469727, "global_step": 373395, "epoch": 4498} {"train_loss": -26.409467697143555, "global_step": 373396, "epoch": 4498} {"train_loss": -26.550235748291016, "global_step": 373397, "epoch": 4498} {"train_loss": -26.419300079345703, "global_step": 373398, "epoch": 4498} {"train_loss": -26.360387802124023, "global_step": 373399, "epoch": 4498} {"train_loss": -26.363224029541016, "global_step": 373400, "epoch": 4498} {"train_loss": -26.011999130249023, "global_step": 373401, "epoch": 4498} {"train_loss": -26.599475860595703, "global_step": 373402, "epoch": 4498} {"train_loss": -26.041034698486328, "global_step": 373403, "epoch": 4498} {"train_loss": -26.158706665039062, "global_step": 373404, "epoch": 4498} {"train_loss": -26.43427085876465, "global_step": 373405, "epoch": 4498} {"train_loss": -26.061798095703125, "global_step": 373406, "epoch": 4498} {"train_loss": -26.631072998046875, "global_step": 373407, "epoch": 4498} {"train_loss": -26.148584365844727, "global_step": 373408, "epoch": 4498} {"train_loss": -26.177566528320312, "global_step": 373409, "epoch": 4498} {"train_loss": -26.3914852142334, "global_step": 373410, "epoch": 4498} {"train_loss": -26.378210067749023, "global_step": 373411, "epoch": 4498} {"train_loss": -26.334253311157227, "global_step": 373412, "epoch": 4498} {"train_loss": -26.4831485748291, "global_step": 373413, "epoch": 4498} {"train_loss": -26.279722213745117, "global_step": 373414, "epoch": 4498} {"train_loss": -26.67157554626465, "global_step": 373415, "epoch": 4498} {"train_loss": -26.312144612691487, "global_step": 373416, "epoch": 4498, "val_loss": 6520432.0} {"train_loss": -25.527719497680664, "global_step": 373417, "epoch": 4499} {"train_loss": -25.51376724243164, "global_step": 373418, "epoch": 4499} {"train_loss": -25.7818603515625, "global_step": 373419, "epoch": 4499} {"train_loss": -26.2830753326416, "global_step": 373420, "epoch": 4499} {"train_loss": -26.18235206604004, "global_step": 373421, "epoch": 4499} {"train_loss": -25.74363136291504, "global_step": 373422, "epoch": 4499} {"train_loss": -26.174259185791016, "global_step": 373423, "epoch": 4499} {"train_loss": -25.801610946655273, "global_step": 373424, "epoch": 4499} {"train_loss": -26.278823852539062, "global_step": 373425, "epoch": 4499} {"train_loss": -25.819183349609375, "global_step": 373426, "epoch": 4499} {"train_loss": -26.216415405273438, "global_step": 373427, "epoch": 4499} {"train_loss": -26.527631759643555, "global_step": 373428, "epoch": 4499} {"train_loss": -25.98154640197754, "global_step": 373429, "epoch": 4499} {"train_loss": -26.100488662719727, "global_step": 373430, "epoch": 4499} {"train_loss": -26.50213050842285, "global_step": 373431, "epoch": 4499} {"train_loss": -26.052412033081055, "global_step": 373432, "epoch": 4499} {"train_loss": -26.108549118041992, "global_step": 373433, "epoch": 4499} {"train_loss": -26.251220703125, "global_step": 373434, "epoch": 4499} {"train_loss": -26.48370361328125, "global_step": 373435, "epoch": 4499} {"train_loss": -26.27337074279785, "global_step": 373436, "epoch": 4499} {"train_loss": -26.175439834594727, "global_step": 373437, "epoch": 4499} {"train_loss": -26.0876407623291, "global_step": 373438, "epoch": 4499} {"train_loss": -26.360273361206055, "global_step": 373439, "epoch": 4499} {"train_loss": -26.15494155883789, "global_step": 373440, "epoch": 4499} {"train_loss": -26.161767959594727, "global_step": 373441, "epoch": 4499} {"train_loss": -26.451282501220703, "global_step": 373442, "epoch": 4499} {"train_loss": -26.30681800842285, "global_step": 373443, "epoch": 4499} {"train_loss": -26.045209884643555, "global_step": 373444, "epoch": 4499} {"train_loss": -26.54840660095215, "global_step": 373445, "epoch": 4499} {"train_loss": -26.254241943359375, "global_step": 373446, "epoch": 4499} {"train_loss": -26.671533584594727, "global_step": 373447, "epoch": 4499} {"train_loss": -26.140832901000977, "global_step": 373448, "epoch": 4499} {"train_loss": -26.533512115478516, "global_step": 373449, "epoch": 4499} {"train_loss": -26.55853843688965, "global_step": 373450, "epoch": 4499} {"train_loss": -26.51838493347168, "global_step": 373451, "epoch": 4499} {"train_loss": -26.52630043029785, "global_step": 373452, "epoch": 4499} {"train_loss": -26.33441162109375, "global_step": 373453, "epoch": 4499} {"train_loss": -26.516462326049805, "global_step": 373454, "epoch": 4499} {"train_loss": -26.324268341064453, "global_step": 373455, "epoch": 4499} {"train_loss": -26.331588745117188, "global_step": 373456, "epoch": 4499} {"train_loss": -26.20319938659668, "global_step": 373457, "epoch": 4499} {"train_loss": -26.75933265686035, "global_step": 373458, "epoch": 4499} {"train_loss": -26.18012809753418, "global_step": 373459, "epoch": 4499} {"train_loss": -26.61464500427246, "global_step": 373460, "epoch": 4499} {"train_loss": -26.753034591674805, "global_step": 373461, "epoch": 4499} {"train_loss": -26.528594970703125, "global_step": 373462, "epoch": 4499} {"train_loss": -26.36041259765625, "global_step": 373463, "epoch": 4499} {"train_loss": -26.654088973999023, "global_step": 373464, "epoch": 4499} {"train_loss": -26.550201416015625, "global_step": 373465, "epoch": 4499} {"train_loss": -26.35745620727539, "global_step": 373466, "epoch": 4499} {"train_loss": -26.172992706298828, "global_step": 373467, "epoch": 4499} {"train_loss": -26.266443252563477, "global_step": 373468, "epoch": 4499} {"train_loss": -25.8546085357666, "global_step": 373469, "epoch": 4499} {"train_loss": -25.84393882751465, "global_step": 373470, "epoch": 4499} {"train_loss": -26.254743576049805, "global_step": 373471, "epoch": 4499} {"train_loss": -26.252241134643555, "global_step": 373472, "epoch": 4499} {"train_loss": -26.603702545166016, "global_step": 373473, "epoch": 4499} {"train_loss": -26.10837173461914, "global_step": 373474, "epoch": 4499} {"train_loss": -26.012704849243164, "global_step": 373475, "epoch": 4499} {"train_loss": -26.24991226196289, "global_step": 373476, "epoch": 4499} {"train_loss": -26.338958740234375, "global_step": 373477, "epoch": 4499} {"train_loss": -26.138818740844727, "global_step": 373478, "epoch": 4499} {"train_loss": -26.68155860900879, "global_step": 373479, "epoch": 4499} {"train_loss": -26.36181640625, "global_step": 373480, "epoch": 4499} {"train_loss": -26.342548370361328, "global_step": 373481, "epoch": 4499} {"train_loss": -26.617273330688477, "global_step": 373482, "epoch": 4499} {"train_loss": -26.663660049438477, "global_step": 373483, "epoch": 4499} {"train_loss": -26.43072509765625, "global_step": 373484, "epoch": 4499} {"train_loss": -26.68168067932129, "global_step": 373485, "epoch": 4499} {"train_loss": -26.291492462158203, "global_step": 373486, "epoch": 4499} {"train_loss": -26.37665367126465, "global_step": 373487, "epoch": 4499} {"train_loss": -26.736499786376953, "global_step": 373488, "epoch": 4499} {"train_loss": -26.73042106628418, "global_step": 373489, "epoch": 4499} {"train_loss": -26.17685890197754, "global_step": 373490, "epoch": 4499} {"train_loss": -26.551944732666016, "global_step": 373491, "epoch": 4499} {"train_loss": -26.292377471923828, "global_step": 373492, "epoch": 4499} {"train_loss": -26.527128219604492, "global_step": 373493, "epoch": 4499} {"train_loss": -26.31525993347168, "global_step": 373494, "epoch": 4499} {"train_loss": -26.45389747619629, "global_step": 373495, "epoch": 4499} {"train_loss": -26.3109130859375, "global_step": 373496, "epoch": 4499} {"train_loss": -26.366315841674805, "global_step": 373497, "epoch": 4499} {"train_loss": -26.751209259033203, "global_step": 373498, "epoch": 4499} {"train_loss": -26.31199257632336, "global_step": 373499, "epoch": 4499, "val_loss": 6629114.0} {"train_loss": -26.242237091064453, "global_step": 373500, "epoch": 4500} {"train_loss": -25.91371726989746, "global_step": 373501, "epoch": 4500} {"train_loss": -26.093271255493164, "global_step": 373502, "epoch": 4500} {"train_loss": -26.080472946166992, "global_step": 373503, "epoch": 4500} {"train_loss": -26.056934356689453, "global_step": 373504, "epoch": 4500} {"train_loss": -25.740278244018555, "global_step": 373505, "epoch": 4500} {"train_loss": -25.712512969970703, "global_step": 373506, "epoch": 4500} {"train_loss": -25.814966201782227, "global_step": 373507, "epoch": 4500} {"train_loss": -26.001495361328125, "global_step": 373508, "epoch": 4500} {"train_loss": -26.174116134643555, "global_step": 373509, "epoch": 4500} {"train_loss": -26.332660675048828, "global_step": 373510, "epoch": 4500} {"train_loss": -25.739728927612305, "global_step": 373511, "epoch": 4500} {"train_loss": -26.560749053955078, "global_step": 373512, "epoch": 4500} {"train_loss": -25.97637367248535, "global_step": 373513, "epoch": 4500} {"train_loss": -26.224170684814453, "global_step": 373514, "epoch": 4500} {"train_loss": -26.205753326416016, "global_step": 373515, "epoch": 4500} {"train_loss": -26.500873565673828, "global_step": 373516, "epoch": 4500} {"train_loss": -26.154972076416016, "global_step": 373517, "epoch": 4500} {"train_loss": -26.337543487548828, "global_step": 373518, "epoch": 4500} {"train_loss": -26.475799560546875, "global_step": 373519, "epoch": 4500} {"train_loss": -26.327880859375, "global_step": 373520, "epoch": 4500} {"train_loss": -26.468286514282227, "global_step": 373521, "epoch": 4500} {"train_loss": -26.24336051940918, "global_step": 373522, "epoch": 4500} {"train_loss": -26.36077308654785, "global_step": 373523, "epoch": 4500} {"train_loss": -26.49799919128418, "global_step": 373524, "epoch": 4500} {"train_loss": -26.4007568359375, "global_step": 373525, "epoch": 4500} {"train_loss": -26.35956382751465, "global_step": 373526, "epoch": 4500} {"train_loss": -26.206287384033203, "global_step": 373527, "epoch": 4500} {"train_loss": -26.19925308227539, "global_step": 373528, "epoch": 4500} {"train_loss": -26.522924423217773, "global_step": 373529, "epoch": 4500} {"train_loss": -26.416156768798828, "global_step": 373530, "epoch": 4500} {"train_loss": -26.418075561523438, "global_step": 373531, "epoch": 4500} {"train_loss": -26.45306396484375, "global_step": 373532, "epoch": 4500} {"train_loss": -26.58258056640625, "global_step": 373533, "epoch": 4500} {"train_loss": -26.54007911682129, "global_step": 373534, "epoch": 4500} {"train_loss": -26.33160972595215, "global_step": 373535, "epoch": 4500} {"train_loss": -26.625293731689453, "global_step": 373536, "epoch": 4500} {"train_loss": -26.384479522705078, "global_step": 373537, "epoch": 4500} {"train_loss": -26.31363296508789, "global_step": 373538, "epoch": 4500} {"train_loss": -26.764984130859375, "global_step": 373539, "epoch": 4500} {"train_loss": -26.440534591674805, "global_step": 373540, "epoch": 4500} {"train_loss": -26.482091903686523, "global_step": 373541, "epoch": 4500} {"train_loss": -26.1486759185791, "global_step": 373542, "epoch": 4500} {"train_loss": -26.832075119018555, "global_step": 373543, "epoch": 4500} {"train_loss": -26.51889419555664, "global_step": 373544, "epoch": 4500} {"train_loss": -26.401243209838867, "global_step": 373545, "epoch": 4500} {"train_loss": -26.127180099487305, "global_step": 373546, "epoch": 4500} {"train_loss": -26.304975509643555, "global_step": 373547, "epoch": 4500} {"train_loss": -26.895238876342773, "global_step": 373548, "epoch": 4500} {"train_loss": -26.485666275024414, "global_step": 373549, "epoch": 4500} {"train_loss": -26.602201461791992, "global_step": 373550, "epoch": 4500} {"train_loss": -26.547388076782227, "global_step": 373551, "epoch": 4500} {"train_loss": -26.186996459960938, "global_step": 373552, "epoch": 4500} {"train_loss": -26.07916259765625, "global_step": 373553, "epoch": 4500} {"train_loss": -25.92732048034668, "global_step": 373554, "epoch": 4500} {"train_loss": -25.934354782104492, "global_step": 373555, "epoch": 4500} {"train_loss": -26.384368896484375, "global_step": 373556, "epoch": 4500} {"train_loss": -26.476404190063477, "global_step": 373557, "epoch": 4500} {"train_loss": -26.560012817382812, "global_step": 373558, "epoch": 4500} {"train_loss": -26.8596134185791, "global_step": 373559, "epoch": 4500} {"train_loss": -26.18800163269043, "global_step": 373560, "epoch": 4500} {"train_loss": -26.4923095703125, "global_step": 373561, "epoch": 4500} {"train_loss": -26.383865356445312, "global_step": 373562, "epoch": 4500} {"train_loss": -26.605701446533203, "global_step": 373563, "epoch": 4500} {"train_loss": -26.582077026367188, "global_step": 373564, "epoch": 4500} {"train_loss": -26.177526473999023, "global_step": 373565, "epoch": 4500} {"train_loss": -26.627073287963867, "global_step": 373566, "epoch": 4500} {"train_loss": -26.52840232849121, "global_step": 373567, "epoch": 4500} {"train_loss": -26.517288208007812, "global_step": 373568, "epoch": 4500} {"train_loss": -26.605215072631836, "global_step": 373569, "epoch": 4500} {"train_loss": -26.30429458618164, "global_step": 373570, "epoch": 4500} {"train_loss": -26.097925186157227, "global_step": 373571, "epoch": 4500} {"train_loss": -26.108524322509766, "global_step": 373572, "epoch": 4500} {"train_loss": -26.162389755249023, "global_step": 373573, "epoch": 4500} {"train_loss": -26.854700088500977, "global_step": 373574, "epoch": 4500} {"train_loss": -26.546131134033203, "global_step": 373575, "epoch": 4500} {"train_loss": -26.4967041015625, "global_step": 373576, "epoch": 4500} {"train_loss": -26.66339683532715, "global_step": 373577, "epoch": 4500} {"train_loss": -26.75690269470215, "global_step": 373578, "epoch": 4500} {"train_loss": -26.592077255249023, "global_step": 373579, "epoch": 4500} {"train_loss": -26.549823760986328, "global_step": 373580, "epoch": 4500} {"train_loss": -26.432941436767578, "global_step": 373581, "epoch": 4500} {"train_loss": -26.358016760952502, "global_step": 373582, "epoch": 4500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6602695.5} {"train_loss": -26.189496994018555, "global_step": 373583, "epoch": 4501} {"train_loss": -26.43659782409668, "global_step": 373584, "epoch": 4501} {"train_loss": -26.170995712280273, "global_step": 373585, "epoch": 4501} {"train_loss": -25.69927406311035, "global_step": 373586, "epoch": 4501} {"train_loss": -26.1849365234375, "global_step": 373587, "epoch": 4501} {"train_loss": -25.214359283447266, "global_step": 373588, "epoch": 4501} {"train_loss": -25.880420684814453, "global_step": 373589, "epoch": 4501} {"train_loss": -26.220352172851562, "global_step": 373590, "epoch": 4501} {"train_loss": -26.2244873046875, "global_step": 373591, "epoch": 4501} {"train_loss": -25.938215255737305, "global_step": 373592, "epoch": 4501} {"train_loss": -26.1740779876709, "global_step": 373593, "epoch": 4501} {"train_loss": -25.6165771484375, "global_step": 373594, "epoch": 4501} {"train_loss": -26.353002548217773, "global_step": 373595, "epoch": 4501} {"train_loss": -26.190587997436523, "global_step": 373596, "epoch": 4501} {"train_loss": -26.1840877532959, "global_step": 373597, "epoch": 4501} {"train_loss": -26.105499267578125, "global_step": 373598, "epoch": 4501} {"train_loss": -26.4183406829834, "global_step": 373599, "epoch": 4501} {"train_loss": -26.45779800415039, "global_step": 373600, "epoch": 4501} {"train_loss": -26.197004318237305, "global_step": 373601, "epoch": 4501} {"train_loss": -25.984460830688477, "global_step": 373602, "epoch": 4501} {"train_loss": -26.543243408203125, "global_step": 373603, "epoch": 4501} {"train_loss": -25.981109619140625, "global_step": 373604, "epoch": 4501} {"train_loss": -26.3133487701416, "global_step": 373605, "epoch": 4501} {"train_loss": -26.163434982299805, "global_step": 373606, "epoch": 4501} {"train_loss": -26.6303653717041, "global_step": 373607, "epoch": 4501} {"train_loss": -25.96306800842285, "global_step": 373608, "epoch": 4501} {"train_loss": -26.098302841186523, "global_step": 373609, "epoch": 4501} {"train_loss": -26.116952896118164, "global_step": 373610, "epoch": 4501} {"train_loss": -26.263456344604492, "global_step": 373611, "epoch": 4501} {"train_loss": -26.39106559753418, "global_step": 373612, "epoch": 4501} {"train_loss": -26.37847900390625, "global_step": 373613, "epoch": 4501} {"train_loss": -26.618085861206055, "global_step": 373614, "epoch": 4501} {"train_loss": -25.88702392578125, "global_step": 373615, "epoch": 4501} {"train_loss": -26.08540916442871, "global_step": 373616, "epoch": 4501} {"train_loss": -26.5950927734375, "global_step": 373617, "epoch": 4501} {"train_loss": -26.586088180541992, "global_step": 373618, "epoch": 4501} {"train_loss": -26.289276123046875, "global_step": 373619, "epoch": 4501} {"train_loss": -26.590076446533203, "global_step": 373620, "epoch": 4501} {"train_loss": -26.40281105041504, "global_step": 373621, "epoch": 4501} {"train_loss": -26.437604904174805, "global_step": 373622, "epoch": 4501} {"train_loss": -26.585830688476562, "global_step": 373623, "epoch": 4501} {"train_loss": -26.64898681640625, "global_step": 373624, "epoch": 4501} {"train_loss": -26.44416618347168, "global_step": 373625, "epoch": 4501} {"train_loss": -26.407928466796875, "global_step": 373626, "epoch": 4501} {"train_loss": -26.67229652404785, "global_step": 373627, "epoch": 4501} {"train_loss": -26.45330810546875, "global_step": 373628, "epoch": 4501} {"train_loss": -26.48516273498535, "global_step": 373629, "epoch": 4501} {"train_loss": -26.5953426361084, "global_step": 373630, "epoch": 4501} {"train_loss": -26.589649200439453, "global_step": 373631, "epoch": 4501} {"train_loss": -26.282323837280273, "global_step": 373632, "epoch": 4501} {"train_loss": -26.32527732849121, "global_step": 373633, "epoch": 4501} {"train_loss": -26.476318359375, "global_step": 373634, "epoch": 4501} {"train_loss": -25.5379638671875, "global_step": 373635, "epoch": 4501} {"train_loss": -23.9355525970459, "global_step": 373636, "epoch": 4501} {"train_loss": -24.852888107299805, "global_step": 373637, "epoch": 4501} {"train_loss": -26.155370712280273, "global_step": 373638, "epoch": 4501} {"train_loss": -25.016759872436523, "global_step": 373639, "epoch": 4501} {"train_loss": -25.746021270751953, "global_step": 373640, "epoch": 4501} {"train_loss": -25.896345138549805, "global_step": 373641, "epoch": 4501} {"train_loss": -26.498687744140625, "global_step": 373642, "epoch": 4501} {"train_loss": -25.67046546936035, "global_step": 373643, "epoch": 4501} {"train_loss": -26.028335571289062, "global_step": 373644, "epoch": 4501} {"train_loss": -26.20064353942871, "global_step": 373645, "epoch": 4501} {"train_loss": -26.221149444580078, "global_step": 373646, "epoch": 4501} {"train_loss": -25.831832885742188, "global_step": 373647, "epoch": 4501} {"train_loss": -26.12727928161621, "global_step": 373648, "epoch": 4501} {"train_loss": -26.025390625, "global_step": 373649, "epoch": 4501} {"train_loss": -25.856494903564453, "global_step": 373650, "epoch": 4501} {"train_loss": -26.059926986694336, "global_step": 373651, "epoch": 4501} {"train_loss": -26.192106246948242, "global_step": 373652, "epoch": 4501} {"train_loss": -26.28350257873535, "global_step": 373653, "epoch": 4501} {"train_loss": -26.293415069580078, "global_step": 373654, "epoch": 4501} {"train_loss": -26.388151168823242, "global_step": 373655, "epoch": 4501} {"train_loss": -26.123929977416992, "global_step": 373656, "epoch": 4501} {"train_loss": -26.46199607849121, "global_step": 373657, "epoch": 4501} {"train_loss": -26.28692054748535, "global_step": 373658, "epoch": 4501} {"train_loss": -26.519521713256836, "global_step": 373659, "epoch": 4501} {"train_loss": -26.56593894958496, "global_step": 373660, "epoch": 4501} {"train_loss": -26.306760787963867, "global_step": 373661, "epoch": 4501} {"train_loss": -26.345050811767578, "global_step": 373662, "epoch": 4501} {"train_loss": -26.370838165283203, "global_step": 373663, "epoch": 4501} {"train_loss": -26.490100860595703, "global_step": 373664, "epoch": 4501} {"train_loss": -26.16870719266225, "global_step": 373665, "epoch": 4501, "val_loss": 6669297.5} {"train_loss": -26.027420043945312, "global_step": 373666, "epoch": 4502} {"train_loss": -25.600299835205078, "global_step": 373667, "epoch": 4502} {"train_loss": -26.231176376342773, "global_step": 373668, "epoch": 4502} {"train_loss": -26.023395538330078, "global_step": 373669, "epoch": 4502} {"train_loss": -26.33075523376465, "global_step": 373670, "epoch": 4502} {"train_loss": -25.712427139282227, "global_step": 373671, "epoch": 4502} {"train_loss": -26.03363609313965, "global_step": 373672, "epoch": 4502} {"train_loss": -26.018735885620117, "global_step": 373673, "epoch": 4502} {"train_loss": -25.63897132873535, "global_step": 373674, "epoch": 4502} {"train_loss": -26.140527725219727, "global_step": 373675, "epoch": 4502} {"train_loss": -25.991392135620117, "global_step": 373676, "epoch": 4502} {"train_loss": -26.0761775970459, "global_step": 373677, "epoch": 4502} {"train_loss": -26.280750274658203, "global_step": 373678, "epoch": 4502} {"train_loss": -26.26348876953125, "global_step": 373679, "epoch": 4502} {"train_loss": -26.06060791015625, "global_step": 373680, "epoch": 4502} {"train_loss": -26.109973907470703, "global_step": 373681, "epoch": 4502} {"train_loss": -25.924991607666016, "global_step": 373682, "epoch": 4502} {"train_loss": -26.206531524658203, "global_step": 373683, "epoch": 4502} {"train_loss": -26.388864517211914, "global_step": 373684, "epoch": 4502} {"train_loss": -26.119342803955078, "global_step": 373685, "epoch": 4502} {"train_loss": -26.002532958984375, "global_step": 373686, "epoch": 4502} {"train_loss": -26.6966609954834, "global_step": 373687, "epoch": 4502} {"train_loss": -26.460357666015625, "global_step": 373688, "epoch": 4502} {"train_loss": -26.524621963500977, "global_step": 373689, "epoch": 4502} {"train_loss": -26.145132064819336, "global_step": 373690, "epoch": 4502} {"train_loss": -26.73533058166504, "global_step": 373691, "epoch": 4502} {"train_loss": -26.19060707092285, "global_step": 373692, "epoch": 4502} {"train_loss": -26.156604766845703, "global_step": 373693, "epoch": 4502} {"train_loss": -26.486188888549805, "global_step": 373694, "epoch": 4502} {"train_loss": -26.236434936523438, "global_step": 373695, "epoch": 4502} {"train_loss": -26.3631534576416, "global_step": 373696, "epoch": 4502} {"train_loss": -26.519744873046875, "global_step": 373697, "epoch": 4502} {"train_loss": -26.291690826416016, "global_step": 373698, "epoch": 4502} {"train_loss": -26.42276382446289, "global_step": 373699, "epoch": 4502} {"train_loss": -26.236234664916992, "global_step": 373700, "epoch": 4502} {"train_loss": -26.476404190063477, "global_step": 373701, "epoch": 4502} {"train_loss": -26.427988052368164, "global_step": 373702, "epoch": 4502} {"train_loss": -26.704675674438477, "global_step": 373703, "epoch": 4502} {"train_loss": -26.957128524780273, "global_step": 373704, "epoch": 4502} {"train_loss": -26.829618453979492, "global_step": 373705, "epoch": 4502} {"train_loss": -26.8242244720459, "global_step": 373706, "epoch": 4502} {"train_loss": -26.66143798828125, "global_step": 373707, "epoch": 4502} {"train_loss": -26.574161529541016, "global_step": 373708, "epoch": 4502} {"train_loss": -26.83687400817871, "global_step": 373709, "epoch": 4502} {"train_loss": -26.287628173828125, "global_step": 373710, "epoch": 4502} {"train_loss": -26.407245635986328, "global_step": 373711, "epoch": 4502} {"train_loss": -26.082616806030273, "global_step": 373712, "epoch": 4502} {"train_loss": -26.276464462280273, "global_step": 373713, "epoch": 4502} {"train_loss": -25.954242706298828, "global_step": 373714, "epoch": 4502} {"train_loss": -26.119842529296875, "global_step": 373715, "epoch": 4502} {"train_loss": -26.176294326782227, "global_step": 373716, "epoch": 4502} {"train_loss": -26.479053497314453, "global_step": 373717, "epoch": 4502} {"train_loss": -26.575551986694336, "global_step": 373718, "epoch": 4502} {"train_loss": -25.8859920501709, "global_step": 373719, "epoch": 4502} {"train_loss": -26.4757137298584, "global_step": 373720, "epoch": 4502} {"train_loss": -25.9936466217041, "global_step": 373721, "epoch": 4502} {"train_loss": -25.95979118347168, "global_step": 373722, "epoch": 4502} {"train_loss": -25.88248062133789, "global_step": 373723, "epoch": 4502} {"train_loss": -26.15223503112793, "global_step": 373724, "epoch": 4502} {"train_loss": -26.125904083251953, "global_step": 373725, "epoch": 4502} {"train_loss": -26.6015567779541, "global_step": 373726, "epoch": 4502} {"train_loss": -26.404687881469727, "global_step": 373727, "epoch": 4502} {"train_loss": -26.16865348815918, "global_step": 373728, "epoch": 4502} {"train_loss": -26.444543838500977, "global_step": 373729, "epoch": 4502} {"train_loss": -26.12147331237793, "global_step": 373730, "epoch": 4502} {"train_loss": -26.43475341796875, "global_step": 373731, "epoch": 4502} {"train_loss": -26.362409591674805, "global_step": 373732, "epoch": 4502} {"train_loss": -26.251562118530273, "global_step": 373733, "epoch": 4502} {"train_loss": -26.543867111206055, "global_step": 373734, "epoch": 4502} {"train_loss": -26.112796783447266, "global_step": 373735, "epoch": 4502} {"train_loss": -26.485076904296875, "global_step": 373736, "epoch": 4502} {"train_loss": -26.413373947143555, "global_step": 373737, "epoch": 4502} {"train_loss": -26.599084854125977, "global_step": 373738, "epoch": 4502} {"train_loss": -26.360187530517578, "global_step": 373739, "epoch": 4502} {"train_loss": -26.35883903503418, "global_step": 373740, "epoch": 4502} {"train_loss": -26.562864303588867, "global_step": 373741, "epoch": 4502} {"train_loss": -26.285419464111328, "global_step": 373742, "epoch": 4502} {"train_loss": -26.6231689453125, "global_step": 373743, "epoch": 4502} {"train_loss": -26.547210693359375, "global_step": 373744, "epoch": 4502} {"train_loss": -26.72233009338379, "global_step": 373745, "epoch": 4502} {"train_loss": -26.160266876220703, "global_step": 373746, "epoch": 4502} {"train_loss": -26.863508224487305, "global_step": 373747, "epoch": 4502} {"train_loss": -26.315776273428675, "global_step": 373748, "epoch": 4502, "val_loss": 6615086.5} {"train_loss": -26.114057540893555, "global_step": 373749, "epoch": 4503} {"train_loss": -25.962646484375, "global_step": 373750, "epoch": 4503} {"train_loss": -25.075439453125, "global_step": 373751, "epoch": 4503} {"train_loss": -25.715429306030273, "global_step": 373752, "epoch": 4503} {"train_loss": -26.30933952331543, "global_step": 373753, "epoch": 4503} {"train_loss": -25.863677978515625, "global_step": 373754, "epoch": 4503} {"train_loss": -26.23990821838379, "global_step": 373755, "epoch": 4503} {"train_loss": -26.269697189331055, "global_step": 373756, "epoch": 4503} {"train_loss": -26.439407348632812, "global_step": 373757, "epoch": 4503} {"train_loss": -25.60304832458496, "global_step": 373758, "epoch": 4503} {"train_loss": -26.26238441467285, "global_step": 373759, "epoch": 4503} {"train_loss": -26.20195960998535, "global_step": 373760, "epoch": 4503} {"train_loss": -26.227506637573242, "global_step": 373761, "epoch": 4503} {"train_loss": -26.276845932006836, "global_step": 373762, "epoch": 4503} {"train_loss": -26.0736141204834, "global_step": 373763, "epoch": 4503} {"train_loss": -26.3791561126709, "global_step": 373764, "epoch": 4503} {"train_loss": -26.14316177368164, "global_step": 373765, "epoch": 4503} {"train_loss": -26.27705192565918, "global_step": 373766, "epoch": 4503} {"train_loss": -26.263259887695312, "global_step": 373767, "epoch": 4503} {"train_loss": -26.420576095581055, "global_step": 373768, "epoch": 4503} {"train_loss": -26.385456085205078, "global_step": 373769, "epoch": 4503} {"train_loss": -26.030710220336914, "global_step": 373770, "epoch": 4503} {"train_loss": -26.310644149780273, "global_step": 373771, "epoch": 4503} {"train_loss": -26.362991333007812, "global_step": 373772, "epoch": 4503} {"train_loss": -26.196500778198242, "global_step": 373773, "epoch": 4503} {"train_loss": -25.868268966674805, "global_step": 373774, "epoch": 4503} {"train_loss": -26.16448974609375, "global_step": 373775, "epoch": 4503} {"train_loss": -26.44140625, "global_step": 373776, "epoch": 4503} {"train_loss": -26.12275505065918, "global_step": 373777, "epoch": 4503} {"train_loss": -26.39045524597168, "global_step": 373778, "epoch": 4503} {"train_loss": -26.746713638305664, "global_step": 373779, "epoch": 4503} {"train_loss": -26.417911529541016, "global_step": 373780, "epoch": 4503} {"train_loss": -26.1381893157959, "global_step": 373781, "epoch": 4503} {"train_loss": -26.69342613220215, "global_step": 373782, "epoch": 4503} {"train_loss": -26.338943481445312, "global_step": 373783, "epoch": 4503} {"train_loss": -25.82269287109375, "global_step": 373784, "epoch": 4503} {"train_loss": -26.50287437438965, "global_step": 373785, "epoch": 4503} {"train_loss": -26.471139907836914, "global_step": 373786, "epoch": 4503} {"train_loss": -26.165258407592773, "global_step": 373787, "epoch": 4503} {"train_loss": -26.79256248474121, "global_step": 373788, "epoch": 4503} {"train_loss": -26.404462814331055, "global_step": 373789, "epoch": 4503} {"train_loss": -26.62452507019043, "global_step": 373790, "epoch": 4503} {"train_loss": -26.714868545532227, "global_step": 373791, "epoch": 4503} {"train_loss": -25.98760414123535, "global_step": 373792, "epoch": 4503} {"train_loss": -26.341833114624023, "global_step": 373793, "epoch": 4503} {"train_loss": -26.080463409423828, "global_step": 373794, "epoch": 4503} {"train_loss": -26.374820709228516, "global_step": 373795, "epoch": 4503} {"train_loss": -26.308216094970703, "global_step": 373796, "epoch": 4503} {"train_loss": -26.18012046813965, "global_step": 373797, "epoch": 4503} {"train_loss": -26.219995498657227, "global_step": 373798, "epoch": 4503} {"train_loss": -26.09882164001465, "global_step": 373799, "epoch": 4503} {"train_loss": -26.077001571655273, "global_step": 373800, "epoch": 4503} {"train_loss": -26.05606460571289, "global_step": 373801, "epoch": 4503} {"train_loss": -26.58160400390625, "global_step": 373802, "epoch": 4503} {"train_loss": -26.208749771118164, "global_step": 373803, "epoch": 4503} {"train_loss": -26.459985733032227, "global_step": 373804, "epoch": 4503} {"train_loss": -26.594457626342773, "global_step": 373805, "epoch": 4503} {"train_loss": -26.081302642822266, "global_step": 373806, "epoch": 4503} {"train_loss": -26.719776153564453, "global_step": 373807, "epoch": 4503} {"train_loss": -26.3350772857666, "global_step": 373808, "epoch": 4503} {"train_loss": -26.676488876342773, "global_step": 373809, "epoch": 4503} {"train_loss": -26.142988204956055, "global_step": 373810, "epoch": 4503} {"train_loss": -26.318511962890625, "global_step": 373811, "epoch": 4503} {"train_loss": -26.43596839904785, "global_step": 373812, "epoch": 4503} {"train_loss": -26.48380470275879, "global_step": 373813, "epoch": 4503} {"train_loss": -26.10727310180664, "global_step": 373814, "epoch": 4503} {"train_loss": -26.33375358581543, "global_step": 373815, "epoch": 4503} {"train_loss": -26.61402702331543, "global_step": 373816, "epoch": 4503} {"train_loss": -26.642471313476562, "global_step": 373817, "epoch": 4503} {"train_loss": -26.589406967163086, "global_step": 373818, "epoch": 4503} {"train_loss": -26.774555206298828, "global_step": 373819, "epoch": 4503} {"train_loss": -26.57513427734375, "global_step": 373820, "epoch": 4503} {"train_loss": -26.501483917236328, "global_step": 373821, "epoch": 4503} {"train_loss": -26.40041160583496, "global_step": 373822, "epoch": 4503} {"train_loss": -26.150922775268555, "global_step": 373823, "epoch": 4503} {"train_loss": -26.446252822875977, "global_step": 373824, "epoch": 4503} {"train_loss": -26.3695068359375, "global_step": 373825, "epoch": 4503} {"train_loss": -26.5975284576416, "global_step": 373826, "epoch": 4503} {"train_loss": -26.758405685424805, "global_step": 373827, "epoch": 4503} {"train_loss": -26.59185218811035, "global_step": 373828, "epoch": 4503} {"train_loss": -26.500173568725586, "global_step": 373829, "epoch": 4503} {"train_loss": -26.4638614654541, "global_step": 373830, "epoch": 4503} {"train_loss": -26.32301328268396, "global_step": 373831, "epoch": 4503, "val_loss": 6621706.0} {"train_loss": -25.582294464111328, "global_step": 373832, "epoch": 4504} {"train_loss": -25.95355796813965, "global_step": 373833, "epoch": 4504} {"train_loss": -26.009246826171875, "global_step": 373834, "epoch": 4504} {"train_loss": -25.7476806640625, "global_step": 373835, "epoch": 4504} {"train_loss": -26.231348037719727, "global_step": 373836, "epoch": 4504} {"train_loss": -26.1368465423584, "global_step": 373837, "epoch": 4504} {"train_loss": -25.077072143554688, "global_step": 373838, "epoch": 4504} {"train_loss": -26.13274574279785, "global_step": 373839, "epoch": 4504} {"train_loss": -26.3385066986084, "global_step": 373840, "epoch": 4504} {"train_loss": -26.30866050720215, "global_step": 373841, "epoch": 4504} {"train_loss": -26.108062744140625, "global_step": 373842, "epoch": 4504} {"train_loss": -26.1536865234375, "global_step": 373843, "epoch": 4504} {"train_loss": -26.157026290893555, "global_step": 373844, "epoch": 4504} {"train_loss": -26.065732955932617, "global_step": 373845, "epoch": 4504} {"train_loss": -25.922460556030273, "global_step": 373846, "epoch": 4504} {"train_loss": -25.61199378967285, "global_step": 373847, "epoch": 4504} {"train_loss": -25.992919921875, "global_step": 373848, "epoch": 4504} {"train_loss": -26.14802360534668, "global_step": 373849, "epoch": 4504} {"train_loss": -26.024917602539062, "global_step": 373850, "epoch": 4504} {"train_loss": -26.02790641784668, "global_step": 373851, "epoch": 4504} {"train_loss": -26.054162979125977, "global_step": 373852, "epoch": 4504} {"train_loss": -26.426916122436523, "global_step": 373853, "epoch": 4504} {"train_loss": -26.073949813842773, "global_step": 373854, "epoch": 4504} {"train_loss": -25.96134376525879, "global_step": 373855, "epoch": 4504} {"train_loss": -26.354694366455078, "global_step": 373856, "epoch": 4504} {"train_loss": -26.326324462890625, "global_step": 373857, "epoch": 4504} {"train_loss": -26.309667587280273, "global_step": 373858, "epoch": 4504} {"train_loss": -26.514928817749023, "global_step": 373859, "epoch": 4504} {"train_loss": -26.737646102905273, "global_step": 373860, "epoch": 4504} {"train_loss": -26.377546310424805, "global_step": 373861, "epoch": 4504} {"train_loss": -26.7490291595459, "global_step": 373862, "epoch": 4504} {"train_loss": -26.626632690429688, "global_step": 373863, "epoch": 4504} {"train_loss": -26.044403076171875, "global_step": 373864, "epoch": 4504} {"train_loss": -26.313934326171875, "global_step": 373865, "epoch": 4504} {"train_loss": -26.137052536010742, "global_step": 373866, "epoch": 4504} {"train_loss": -26.561681747436523, "global_step": 373867, "epoch": 4504} {"train_loss": -26.54652976989746, "global_step": 373868, "epoch": 4504} {"train_loss": -26.4241886138916, "global_step": 373869, "epoch": 4504} {"train_loss": -26.392810821533203, "global_step": 373870, "epoch": 4504} {"train_loss": -26.615171432495117, "global_step": 373871, "epoch": 4504} {"train_loss": -26.228742599487305, "global_step": 373872, "epoch": 4504} {"train_loss": -26.325109481811523, "global_step": 373873, "epoch": 4504} {"train_loss": -26.37006187438965, "global_step": 373874, "epoch": 4504} {"train_loss": -25.923248291015625, "global_step": 373875, "epoch": 4504} {"train_loss": -26.290170669555664, "global_step": 373876, "epoch": 4504} {"train_loss": -25.929107666015625, "global_step": 373877, "epoch": 4504} {"train_loss": -26.342267990112305, "global_step": 373878, "epoch": 4504} {"train_loss": -26.13197135925293, "global_step": 373879, "epoch": 4504} {"train_loss": -25.871570587158203, "global_step": 373880, "epoch": 4504} {"train_loss": -26.507476806640625, "global_step": 373881, "epoch": 4504} {"train_loss": -25.9770450592041, "global_step": 373882, "epoch": 4504} {"train_loss": -26.402318954467773, "global_step": 373883, "epoch": 4504} {"train_loss": -26.099035263061523, "global_step": 373884, "epoch": 4504} {"train_loss": -26.07806396484375, "global_step": 373885, "epoch": 4504} {"train_loss": -26.053211212158203, "global_step": 373886, "epoch": 4504} {"train_loss": -26.324405670166016, "global_step": 373887, "epoch": 4504} {"train_loss": -26.609973907470703, "global_step": 373888, "epoch": 4504} {"train_loss": -26.391510009765625, "global_step": 373889, "epoch": 4504} {"train_loss": -26.257659912109375, "global_step": 373890, "epoch": 4504} {"train_loss": -26.541059494018555, "global_step": 373891, "epoch": 4504} {"train_loss": -26.611181259155273, "global_step": 373892, "epoch": 4504} {"train_loss": -26.561084747314453, "global_step": 373893, "epoch": 4504} {"train_loss": -26.4327335357666, "global_step": 373894, "epoch": 4504} {"train_loss": -26.621688842773438, "global_step": 373895, "epoch": 4504} {"train_loss": -26.218841552734375, "global_step": 373896, "epoch": 4504} {"train_loss": -26.638381958007812, "global_step": 373897, "epoch": 4504} {"train_loss": -26.47848892211914, "global_step": 373898, "epoch": 4504} {"train_loss": -26.53742027282715, "global_step": 373899, "epoch": 4504} {"train_loss": -26.341480255126953, "global_step": 373900, "epoch": 4504} {"train_loss": -26.326528549194336, "global_step": 373901, "epoch": 4504} {"train_loss": -26.416107177734375, "global_step": 373902, "epoch": 4504} {"train_loss": -26.613981246948242, "global_step": 373903, "epoch": 4504} {"train_loss": -25.988666534423828, "global_step": 373904, "epoch": 4504} {"train_loss": -26.4748592376709, "global_step": 373905, "epoch": 4504} {"train_loss": -25.743427276611328, "global_step": 373906, "epoch": 4504} {"train_loss": -24.91396713256836, "global_step": 373907, "epoch": 4504} {"train_loss": -24.08528709411621, "global_step": 373908, "epoch": 4504} {"train_loss": -26.344528198242188, "global_step": 373909, "epoch": 4504} {"train_loss": -25.508371353149414, "global_step": 373910, "epoch": 4504} {"train_loss": -25.8048095703125, "global_step": 373911, "epoch": 4504} {"train_loss": -25.815393447875977, "global_step": 373912, "epoch": 4504} {"train_loss": -26.172597885131836, "global_step": 373913, "epoch": 4504} {"train_loss": -26.187306208782886, "global_step": 373914, "epoch": 4504, "val_loss": 6593385.5} {"train_loss": -25.602691650390625, "global_step": 373915, "epoch": 4505} {"train_loss": -25.64107322692871, "global_step": 373916, "epoch": 4505} {"train_loss": -25.816558837890625, "global_step": 373917, "epoch": 4505} {"train_loss": -25.745840072631836, "global_step": 373918, "epoch": 4505} {"train_loss": -25.504579544067383, "global_step": 373919, "epoch": 4505} {"train_loss": -25.704679489135742, "global_step": 373920, "epoch": 4505} {"train_loss": -26.039060592651367, "global_step": 373921, "epoch": 4505} {"train_loss": -25.927541732788086, "global_step": 373922, "epoch": 4505} {"train_loss": -25.97964859008789, "global_step": 373923, "epoch": 4505} {"train_loss": -25.995763778686523, "global_step": 373924, "epoch": 4505} {"train_loss": -25.87489128112793, "global_step": 373925, "epoch": 4505} {"train_loss": -25.8905086517334, "global_step": 373926, "epoch": 4505} {"train_loss": -25.86309814453125, "global_step": 373927, "epoch": 4505} {"train_loss": -25.813827514648438, "global_step": 373928, "epoch": 4505} {"train_loss": -26.026168823242188, "global_step": 373929, "epoch": 4505} {"train_loss": -26.41693115234375, "global_step": 373930, "epoch": 4505} {"train_loss": -25.969451904296875, "global_step": 373931, "epoch": 4505} {"train_loss": -26.00128173828125, "global_step": 373932, "epoch": 4505} {"train_loss": -26.446884155273438, "global_step": 373933, "epoch": 4505} {"train_loss": -26.394269943237305, "global_step": 373934, "epoch": 4505} {"train_loss": -25.798059463500977, "global_step": 373935, "epoch": 4505} {"train_loss": -26.295032501220703, "global_step": 373936, "epoch": 4505} {"train_loss": -25.998682022094727, "global_step": 373937, "epoch": 4505} {"train_loss": -25.877527236938477, "global_step": 373938, "epoch": 4505} {"train_loss": -26.03168296813965, "global_step": 373939, "epoch": 4505} {"train_loss": -26.421838760375977, "global_step": 373940, "epoch": 4505} {"train_loss": -26.37517738342285, "global_step": 373941, "epoch": 4505} {"train_loss": -26.425678253173828, "global_step": 373942, "epoch": 4505} {"train_loss": -26.56952476501465, "global_step": 373943, "epoch": 4505} {"train_loss": -26.484466552734375, "global_step": 373944, "epoch": 4505} {"train_loss": -26.268957138061523, "global_step": 373945, "epoch": 4505} {"train_loss": -25.93537712097168, "global_step": 373946, "epoch": 4505} {"train_loss": -26.780237197875977, "global_step": 373947, "epoch": 4505} {"train_loss": -26.4892635345459, "global_step": 373948, "epoch": 4505} {"train_loss": -26.34100914001465, "global_step": 373949, "epoch": 4505} {"train_loss": -25.910327911376953, "global_step": 373950, "epoch": 4505} {"train_loss": -26.634057998657227, "global_step": 373951, "epoch": 4505} {"train_loss": -26.462858200073242, "global_step": 373952, "epoch": 4505} {"train_loss": -26.440677642822266, "global_step": 373953, "epoch": 4505} {"train_loss": -26.444965362548828, "global_step": 373954, "epoch": 4505} {"train_loss": -26.516199111938477, "global_step": 373955, "epoch": 4505} {"train_loss": -26.51043128967285, "global_step": 373956, "epoch": 4505} {"train_loss": -26.54029655456543, "global_step": 373957, "epoch": 4505} {"train_loss": -26.572839736938477, "global_step": 373958, "epoch": 4505} {"train_loss": -26.333234786987305, "global_step": 373959, "epoch": 4505} {"train_loss": -26.4484920501709, "global_step": 373960, "epoch": 4505} {"train_loss": -26.17645835876465, "global_step": 373961, "epoch": 4505} {"train_loss": -26.435230255126953, "global_step": 373962, "epoch": 4505} {"train_loss": -26.599313735961914, "global_step": 373963, "epoch": 4505} {"train_loss": -26.464588165283203, "global_step": 373964, "epoch": 4505} {"train_loss": -26.73768424987793, "global_step": 373965, "epoch": 4505} {"train_loss": -26.416418075561523, "global_step": 373966, "epoch": 4505} {"train_loss": -26.438562393188477, "global_step": 373967, "epoch": 4505} {"train_loss": -26.808013916015625, "global_step": 373968, "epoch": 4505} {"train_loss": -26.587507247924805, "global_step": 373969, "epoch": 4505} {"train_loss": -26.65045738220215, "global_step": 373970, "epoch": 4505} {"train_loss": -26.747238159179688, "global_step": 373971, "epoch": 4505} {"train_loss": -26.660886764526367, "global_step": 373972, "epoch": 4505} {"train_loss": -26.644763946533203, "global_step": 373973, "epoch": 4505} {"train_loss": -26.70073890686035, "global_step": 373974, "epoch": 4505} {"train_loss": -26.645078659057617, "global_step": 373975, "epoch": 4505} {"train_loss": -26.457172393798828, "global_step": 373976, "epoch": 4505} {"train_loss": -26.391464233398438, "global_step": 373977, "epoch": 4505} {"train_loss": -26.39056968688965, "global_step": 373978, "epoch": 4505} {"train_loss": -26.0425968170166, "global_step": 373979, "epoch": 4505} {"train_loss": -26.0394344329834, "global_step": 373980, "epoch": 4505} {"train_loss": -26.226240158081055, "global_step": 373981, "epoch": 4505} {"train_loss": -26.5329532623291, "global_step": 373982, "epoch": 4505} {"train_loss": -26.292987823486328, "global_step": 373983, "epoch": 4505} {"train_loss": -26.40437126159668, "global_step": 373984, "epoch": 4505} {"train_loss": -26.70322036743164, "global_step": 373985, "epoch": 4505} {"train_loss": -25.994855880737305, "global_step": 373986, "epoch": 4505} {"train_loss": -26.072107315063477, "global_step": 373987, "epoch": 4505} {"train_loss": -26.3419189453125, "global_step": 373988, "epoch": 4505} {"train_loss": -25.909637451171875, "global_step": 373989, "epoch": 4505} {"train_loss": -26.344533920288086, "global_step": 373990, "epoch": 4505} {"train_loss": -26.17848777770996, "global_step": 373991, "epoch": 4505} {"train_loss": -26.1721134185791, "global_step": 373992, "epoch": 4505} {"train_loss": -26.11716079711914, "global_step": 373993, "epoch": 4505} {"train_loss": -26.170166015625, "global_step": 373994, "epoch": 4505} {"train_loss": -26.18756675720215, "global_step": 373995, "epoch": 4505} {"train_loss": -26.431686401367188, "global_step": 373996, "epoch": 4505} {"train_loss": -26.25820306984775, "global_step": 373997, "epoch": 4505, "val_loss": 6680486.5} {"train_loss": -25.384231567382812, "global_step": 373998, "epoch": 4506} {"train_loss": -25.388784408569336, "global_step": 373999, "epoch": 4506} {"train_loss": -25.788898468017578, "global_step": 374000, "epoch": 4506} {"train_loss": -26.096059799194336, "global_step": 374001, "epoch": 4506} {"train_loss": -25.383729934692383, "global_step": 374002, "epoch": 4506} {"train_loss": -25.681644439697266, "global_step": 374003, "epoch": 4506} {"train_loss": -25.699844360351562, "global_step": 374004, "epoch": 4506} {"train_loss": -25.905786514282227, "global_step": 374005, "epoch": 4506} {"train_loss": -26.04108238220215, "global_step": 374006, "epoch": 4506} {"train_loss": -26.178241729736328, "global_step": 374007, "epoch": 4506} {"train_loss": -26.36669921875, "global_step": 374008, "epoch": 4506} {"train_loss": -25.902301788330078, "global_step": 374009, "epoch": 4506} {"train_loss": -26.192535400390625, "global_step": 374010, "epoch": 4506} {"train_loss": -25.825531005859375, "global_step": 374011, "epoch": 4506} {"train_loss": -26.366254806518555, "global_step": 374012, "epoch": 4506} {"train_loss": -26.169178009033203, "global_step": 374013, "epoch": 4506} {"train_loss": -25.893598556518555, "global_step": 374014, "epoch": 4506} {"train_loss": -26.253393173217773, "global_step": 374015, "epoch": 4506} {"train_loss": -25.862445831298828, "global_step": 374016, "epoch": 4506} {"train_loss": -26.357404708862305, "global_step": 374017, "epoch": 4506} {"train_loss": -25.672260284423828, "global_step": 374018, "epoch": 4506} {"train_loss": -25.860980987548828, "global_step": 374019, "epoch": 4506} {"train_loss": -26.07858657836914, "global_step": 374020, "epoch": 4506} {"train_loss": -26.157201766967773, "global_step": 374021, "epoch": 4506} {"train_loss": -26.1495361328125, "global_step": 374022, "epoch": 4506} {"train_loss": -25.887537002563477, "global_step": 374023, "epoch": 4506} {"train_loss": -26.303760528564453, "global_step": 374024, "epoch": 4506} {"train_loss": -26.12091064453125, "global_step": 374025, "epoch": 4506} {"train_loss": -26.471708297729492, "global_step": 374026, "epoch": 4506} {"train_loss": -26.0954647064209, "global_step": 374027, "epoch": 4506} {"train_loss": -26.689599990844727, "global_step": 374028, "epoch": 4506} {"train_loss": -26.054224014282227, "global_step": 374029, "epoch": 4506} {"train_loss": -27.059240341186523, "global_step": 374030, "epoch": 4506} {"train_loss": -26.36582374572754, "global_step": 374031, "epoch": 4506} {"train_loss": -26.32501792907715, "global_step": 374032, "epoch": 4506} {"train_loss": -26.3319034576416, "global_step": 374033, "epoch": 4506} {"train_loss": -26.60256004333496, "global_step": 374034, "epoch": 4506} {"train_loss": -26.496091842651367, "global_step": 374035, "epoch": 4506} {"train_loss": -26.712467193603516, "global_step": 374036, "epoch": 4506} {"train_loss": -26.522321701049805, "global_step": 374037, "epoch": 4506} {"train_loss": -26.19087028503418, "global_step": 374038, "epoch": 4506} {"train_loss": -26.47784423828125, "global_step": 374039, "epoch": 4506} {"train_loss": -26.293014526367188, "global_step": 374040, "epoch": 4506} {"train_loss": -26.56317710876465, "global_step": 374041, "epoch": 4506} {"train_loss": -26.686613082885742, "global_step": 374042, "epoch": 4506} {"train_loss": -26.68021583557129, "global_step": 374043, "epoch": 4506} {"train_loss": -26.6207275390625, "global_step": 374044, "epoch": 4506} {"train_loss": -27.05201530456543, "global_step": 374045, "epoch": 4506} {"train_loss": -26.41407585144043, "global_step": 374046, "epoch": 4506} {"train_loss": -25.936391830444336, "global_step": 374047, "epoch": 4506} {"train_loss": -25.601715087890625, "global_step": 374048, "epoch": 4506} {"train_loss": -26.110700607299805, "global_step": 374049, "epoch": 4506} {"train_loss": -26.228302001953125, "global_step": 374050, "epoch": 4506} {"train_loss": -26.355072021484375, "global_step": 374051, "epoch": 4506} {"train_loss": -26.111310958862305, "global_step": 374052, "epoch": 4506} {"train_loss": -26.934309005737305, "global_step": 374053, "epoch": 4506} {"train_loss": -26.2814998626709, "global_step": 374054, "epoch": 4506} {"train_loss": -26.710662841796875, "global_step": 374055, "epoch": 4506} {"train_loss": -26.27266502380371, "global_step": 374056, "epoch": 4506} {"train_loss": -26.430896759033203, "global_step": 374057, "epoch": 4506} {"train_loss": -26.179529190063477, "global_step": 374058, "epoch": 4506} {"train_loss": -26.312299728393555, "global_step": 374059, "epoch": 4506} {"train_loss": -26.09584617614746, "global_step": 374060, "epoch": 4506} {"train_loss": -26.163976669311523, "global_step": 374061, "epoch": 4506} {"train_loss": -26.38938331604004, "global_step": 374062, "epoch": 4506} {"train_loss": -26.65534782409668, "global_step": 374063, "epoch": 4506} {"train_loss": -26.559040069580078, "global_step": 374064, "epoch": 4506} {"train_loss": -26.5860595703125, "global_step": 374065, "epoch": 4506} {"train_loss": -26.427053451538086, "global_step": 374066, "epoch": 4506} {"train_loss": -26.455183029174805, "global_step": 374067, "epoch": 4506} {"train_loss": -26.562597274780273, "global_step": 374068, "epoch": 4506} {"train_loss": -26.348831176757812, "global_step": 374069, "epoch": 4506} {"train_loss": -25.9610538482666, "global_step": 374070, "epoch": 4506} {"train_loss": -26.761640548706055, "global_step": 374071, "epoch": 4506} {"train_loss": -26.25141716003418, "global_step": 374072, "epoch": 4506} {"train_loss": -26.318603515625, "global_step": 374073, "epoch": 4506} {"train_loss": -26.448530197143555, "global_step": 374074, "epoch": 4506} {"train_loss": -26.346881866455078, "global_step": 374075, "epoch": 4506} {"train_loss": -26.232009887695312, "global_step": 374076, "epoch": 4506} {"train_loss": -26.568387985229492, "global_step": 374077, "epoch": 4506} {"train_loss": -26.47793960571289, "global_step": 374078, "epoch": 4506} {"train_loss": -26.08587074279785, "global_step": 374079, "epoch": 4506} {"train_loss": -26.237358001341303, "global_step": 374080, "epoch": 4506, "val_loss": 6655413.0} {"train_loss": -25.411035537719727, "global_step": 374081, "epoch": 4507} {"train_loss": -25.248708724975586, "global_step": 374082, "epoch": 4507} {"train_loss": -25.629322052001953, "global_step": 374083, "epoch": 4507} {"train_loss": -25.46817398071289, "global_step": 374084, "epoch": 4507} {"train_loss": -24.219236373901367, "global_step": 374085, "epoch": 4507} {"train_loss": -25.045166015625, "global_step": 374086, "epoch": 4507} {"train_loss": -25.30228614807129, "global_step": 374087, "epoch": 4507} {"train_loss": -25.15591812133789, "global_step": 374088, "epoch": 4507} {"train_loss": -25.137968063354492, "global_step": 374089, "epoch": 4507} {"train_loss": -25.329370498657227, "global_step": 374090, "epoch": 4507} {"train_loss": -24.93745994567871, "global_step": 374091, "epoch": 4507} {"train_loss": -25.383115768432617, "global_step": 374092, "epoch": 4507} {"train_loss": -25.803991317749023, "global_step": 374093, "epoch": 4507} {"train_loss": -25.303861618041992, "global_step": 374094, "epoch": 4507} {"train_loss": -25.96023941040039, "global_step": 374095, "epoch": 4507} {"train_loss": -25.5765323638916, "global_step": 374096, "epoch": 4507} {"train_loss": -25.522314071655273, "global_step": 374097, "epoch": 4507} {"train_loss": -25.921295166015625, "global_step": 374098, "epoch": 4507} {"train_loss": -25.680139541625977, "global_step": 374099, "epoch": 4507} {"train_loss": -25.677631378173828, "global_step": 374100, "epoch": 4507} {"train_loss": -25.882272720336914, "global_step": 374101, "epoch": 4507} {"train_loss": -25.920963287353516, "global_step": 374102, "epoch": 4507} {"train_loss": -25.776721954345703, "global_step": 374103, "epoch": 4507} {"train_loss": -25.834753036499023, "global_step": 374104, "epoch": 4507} {"train_loss": -25.477842330932617, "global_step": 374105, "epoch": 4507} {"train_loss": -26.251012802124023, "global_step": 374106, "epoch": 4507} {"train_loss": -26.06662368774414, "global_step": 374107, "epoch": 4507} {"train_loss": -25.793710708618164, "global_step": 374108, "epoch": 4507} {"train_loss": -26.636911392211914, "global_step": 374109, "epoch": 4507} {"train_loss": -26.124053955078125, "global_step": 374110, "epoch": 4507} {"train_loss": -26.110254287719727, "global_step": 374111, "epoch": 4507} {"train_loss": -26.77219009399414, "global_step": 374112, "epoch": 4507} {"train_loss": -26.4713134765625, "global_step": 374113, "epoch": 4507} {"train_loss": -26.02373695373535, "global_step": 374114, "epoch": 4507} {"train_loss": -26.28045082092285, "global_step": 374115, "epoch": 4507} {"train_loss": -26.2581844329834, "global_step": 374116, "epoch": 4507} {"train_loss": -26.258142471313477, "global_step": 374117, "epoch": 4507} {"train_loss": -25.939428329467773, "global_step": 374118, "epoch": 4507} {"train_loss": -26.472562789916992, "global_step": 374119, "epoch": 4507} {"train_loss": -26.613996505737305, "global_step": 374120, "epoch": 4507} {"train_loss": -26.146621704101562, "global_step": 374121, "epoch": 4507} {"train_loss": -26.491098403930664, "global_step": 374122, "epoch": 4507} {"train_loss": -26.322925567626953, "global_step": 374123, "epoch": 4507} {"train_loss": -26.82024574279785, "global_step": 374124, "epoch": 4507} {"train_loss": -26.642431259155273, "global_step": 374125, "epoch": 4507} {"train_loss": -26.292129516601562, "global_step": 374126, "epoch": 4507} {"train_loss": -26.879138946533203, "global_step": 374127, "epoch": 4507} {"train_loss": -26.624500274658203, "global_step": 374128, "epoch": 4507} {"train_loss": -26.76331901550293, "global_step": 374129, "epoch": 4507} {"train_loss": -26.68196678161621, "global_step": 374130, "epoch": 4507} {"train_loss": -26.42188835144043, "global_step": 374131, "epoch": 4507} {"train_loss": -26.79250144958496, "global_step": 374132, "epoch": 4507} {"train_loss": -26.699207305908203, "global_step": 374133, "epoch": 4507} {"train_loss": -26.637292861938477, "global_step": 374134, "epoch": 4507} {"train_loss": -26.60272216796875, "global_step": 374135, "epoch": 4507} {"train_loss": -26.684314727783203, "global_step": 374136, "epoch": 4507} {"train_loss": -26.295724868774414, "global_step": 374137, "epoch": 4507} {"train_loss": -26.206151962280273, "global_step": 374138, "epoch": 4507} {"train_loss": -26.65264320373535, "global_step": 374139, "epoch": 4507} {"train_loss": -26.53656578063965, "global_step": 374140, "epoch": 4507} {"train_loss": -26.867679595947266, "global_step": 374141, "epoch": 4507} {"train_loss": -26.655622482299805, "global_step": 374142, "epoch": 4507} {"train_loss": -26.695648193359375, "global_step": 374143, "epoch": 4507} {"train_loss": -26.394277572631836, "global_step": 374144, "epoch": 4507} {"train_loss": -26.522079467773438, "global_step": 374145, "epoch": 4507} {"train_loss": -26.155914306640625, "global_step": 374146, "epoch": 4507} {"train_loss": -26.486730575561523, "global_step": 374147, "epoch": 4507} {"train_loss": -26.207447052001953, "global_step": 374148, "epoch": 4507} {"train_loss": -26.262557983398438, "global_step": 374149, "epoch": 4507} {"train_loss": -26.151838302612305, "global_step": 374150, "epoch": 4507} {"train_loss": -26.458942413330078, "global_step": 374151, "epoch": 4507} {"train_loss": -26.58051109313965, "global_step": 374152, "epoch": 4507} {"train_loss": -26.25165367126465, "global_step": 374153, "epoch": 4507} {"train_loss": -26.361169815063477, "global_step": 374154, "epoch": 4507} {"train_loss": -26.043106079101562, "global_step": 374155, "epoch": 4507} {"train_loss": -26.378137588500977, "global_step": 374156, "epoch": 4507} {"train_loss": -26.19718360900879, "global_step": 374157, "epoch": 4507} {"train_loss": -26.837005615234375, "global_step": 374158, "epoch": 4507} {"train_loss": -26.143585205078125, "global_step": 374159, "epoch": 4507} {"train_loss": -26.164752960205078, "global_step": 374160, "epoch": 4507} {"train_loss": -26.289752960205078, "global_step": 374161, "epoch": 4507} {"train_loss": -26.254077911376953, "global_step": 374162, "epoch": 4507} {"train_loss": -26.128157397350634, "global_step": 374163, "epoch": 4507, "val_loss": 6635530.0} {"train_loss": -26.296003341674805, "global_step": 374164, "epoch": 4508} {"train_loss": -25.608762741088867, "global_step": 374165, "epoch": 4508} {"train_loss": -23.624717712402344, "global_step": 374166, "epoch": 4508} {"train_loss": -22.503576278686523, "global_step": 374167, "epoch": 4508} {"train_loss": -25.801294326782227, "global_step": 374168, "epoch": 4508} {"train_loss": -24.625747680664062, "global_step": 374169, "epoch": 4508} {"train_loss": -25.07767105102539, "global_step": 374170, "epoch": 4508} {"train_loss": -25.534446716308594, "global_step": 374171, "epoch": 4508} {"train_loss": -25.41804313659668, "global_step": 374172, "epoch": 4508} {"train_loss": -25.957473754882812, "global_step": 374173, "epoch": 4508} {"train_loss": -25.77947998046875, "global_step": 374174, "epoch": 4508} {"train_loss": -25.786672592163086, "global_step": 374175, "epoch": 4508} {"train_loss": -25.78156852722168, "global_step": 374176, "epoch": 4508} {"train_loss": -25.593894958496094, "global_step": 374177, "epoch": 4508} {"train_loss": -25.89667320251465, "global_step": 374178, "epoch": 4508} {"train_loss": -25.58339500427246, "global_step": 374179, "epoch": 4508} {"train_loss": -25.39525032043457, "global_step": 374180, "epoch": 4508} {"train_loss": -25.854755401611328, "global_step": 374181, "epoch": 4508} {"train_loss": -25.76136589050293, "global_step": 374182, "epoch": 4508} {"train_loss": -25.751264572143555, "global_step": 374183, "epoch": 4508} {"train_loss": -25.745166778564453, "global_step": 374184, "epoch": 4508} {"train_loss": -26.044218063354492, "global_step": 374185, "epoch": 4508} {"train_loss": -25.731555938720703, "global_step": 374186, "epoch": 4508} {"train_loss": -26.229541778564453, "global_step": 374187, "epoch": 4508} {"train_loss": -25.603967666625977, "global_step": 374188, "epoch": 4508} {"train_loss": -25.57691764831543, "global_step": 374189, "epoch": 4508} {"train_loss": -26.082799911499023, "global_step": 374190, "epoch": 4508} {"train_loss": -26.1135311126709, "global_step": 374191, "epoch": 4508} {"train_loss": -26.042612075805664, "global_step": 374192, "epoch": 4508} {"train_loss": -25.979217529296875, "global_step": 374193, "epoch": 4508} {"train_loss": -26.045679092407227, "global_step": 374194, "epoch": 4508} {"train_loss": -25.81902503967285, "global_step": 374195, "epoch": 4508} {"train_loss": -26.116352081298828, "global_step": 374196, "epoch": 4508} {"train_loss": -26.222360610961914, "global_step": 374197, "epoch": 4508} {"train_loss": -26.653356552124023, "global_step": 374198, "epoch": 4508} {"train_loss": -26.109323501586914, "global_step": 374199, "epoch": 4508} {"train_loss": -26.286462783813477, "global_step": 374200, "epoch": 4508} {"train_loss": -26.667341232299805, "global_step": 374201, "epoch": 4508} {"train_loss": -26.381610870361328, "global_step": 374202, "epoch": 4508} {"train_loss": -26.33319664001465, "global_step": 374203, "epoch": 4508} {"train_loss": -26.112104415893555, "global_step": 374204, "epoch": 4508} {"train_loss": -26.53529930114746, "global_step": 374205, "epoch": 4508} {"train_loss": -26.429244995117188, "global_step": 374206, "epoch": 4508} {"train_loss": -26.83076286315918, "global_step": 374207, "epoch": 4508} {"train_loss": -26.348188400268555, "global_step": 374208, "epoch": 4508} {"train_loss": -26.596546173095703, "global_step": 374209, "epoch": 4508} {"train_loss": -26.57806396484375, "global_step": 374210, "epoch": 4508} {"train_loss": -26.364118576049805, "global_step": 374211, "epoch": 4508} {"train_loss": -25.88581657409668, "global_step": 374212, "epoch": 4508} {"train_loss": -26.651453018188477, "global_step": 374213, "epoch": 4508} {"train_loss": -26.48868179321289, "global_step": 374214, "epoch": 4508} {"train_loss": -26.32282829284668, "global_step": 374215, "epoch": 4508} {"train_loss": -26.35603141784668, "global_step": 374216, "epoch": 4508} {"train_loss": -26.15130615234375, "global_step": 374217, "epoch": 4508} {"train_loss": -26.7042179107666, "global_step": 374218, "epoch": 4508} {"train_loss": -26.68758201599121, "global_step": 374219, "epoch": 4508} {"train_loss": -26.44073486328125, "global_step": 374220, "epoch": 4508} {"train_loss": -25.962873458862305, "global_step": 374221, "epoch": 4508} {"train_loss": -26.55335807800293, "global_step": 374222, "epoch": 4508} {"train_loss": -26.52068519592285, "global_step": 374223, "epoch": 4508} {"train_loss": -26.420196533203125, "global_step": 374224, "epoch": 4508} {"train_loss": -26.67677879333496, "global_step": 374225, "epoch": 4508} {"train_loss": -26.559019088745117, "global_step": 374226, "epoch": 4508} {"train_loss": -26.646203994750977, "global_step": 374227, "epoch": 4508} {"train_loss": -26.284448623657227, "global_step": 374228, "epoch": 4508} {"train_loss": -26.54987907409668, "global_step": 374229, "epoch": 4508} {"train_loss": -26.60468101501465, "global_step": 374230, "epoch": 4508} {"train_loss": -26.290084838867188, "global_step": 374231, "epoch": 4508} {"train_loss": -26.431320190429688, "global_step": 374232, "epoch": 4508} {"train_loss": -26.746408462524414, "global_step": 374233, "epoch": 4508} {"train_loss": -26.618213653564453, "global_step": 374234, "epoch": 4508} {"train_loss": -26.660497665405273, "global_step": 374235, "epoch": 4508} {"train_loss": -26.544538497924805, "global_step": 374236, "epoch": 4508} {"train_loss": -26.566572189331055, "global_step": 374237, "epoch": 4508} {"train_loss": -26.158203125, "global_step": 374238, "epoch": 4508} {"train_loss": -26.39491081237793, "global_step": 374239, "epoch": 4508} {"train_loss": -26.8438663482666, "global_step": 374240, "epoch": 4508} {"train_loss": -26.431262969970703, "global_step": 374241, "epoch": 4508} {"train_loss": -26.305011749267578, "global_step": 374242, "epoch": 4508} {"train_loss": -26.63629722595215, "global_step": 374243, "epoch": 4508} {"train_loss": -25.814884185791016, "global_step": 374244, "epoch": 4508} {"train_loss": -26.512693405151367, "global_step": 374245, "epoch": 4508} {"train_loss": -26.093734258628754, "global_step": 374246, "epoch": 4508, "val_loss": 6687983.5} {"train_loss": -25.8104248046875, "global_step": 374247, "epoch": 4509} {"train_loss": -25.1805362701416, "global_step": 374248, "epoch": 4509} {"train_loss": -25.635435104370117, "global_step": 374249, "epoch": 4509} {"train_loss": -25.070531845092773, "global_step": 374250, "epoch": 4509} {"train_loss": -25.685977935791016, "global_step": 374251, "epoch": 4509} {"train_loss": -25.185136795043945, "global_step": 374252, "epoch": 4509} {"train_loss": -25.589509963989258, "global_step": 374253, "epoch": 4509} {"train_loss": -26.136856079101562, "global_step": 374254, "epoch": 4509} {"train_loss": -25.8625545501709, "global_step": 374255, "epoch": 4509} {"train_loss": -25.483373641967773, "global_step": 374256, "epoch": 4509} {"train_loss": -26.026214599609375, "global_step": 374257, "epoch": 4509} {"train_loss": -26.202844619750977, "global_step": 374258, "epoch": 4509} {"train_loss": -25.839941024780273, "global_step": 374259, "epoch": 4509} {"train_loss": -26.181310653686523, "global_step": 374260, "epoch": 4509} {"train_loss": -25.962644577026367, "global_step": 374261, "epoch": 4509} {"train_loss": -25.827259063720703, "global_step": 374262, "epoch": 4509} {"train_loss": -26.009687423706055, "global_step": 374263, "epoch": 4509} {"train_loss": -26.170957565307617, "global_step": 374264, "epoch": 4509} {"train_loss": -26.114591598510742, "global_step": 374265, "epoch": 4509} {"train_loss": -26.0623836517334, "global_step": 374266, "epoch": 4509} {"train_loss": -26.193952560424805, "global_step": 374267, "epoch": 4509} {"train_loss": -26.267065048217773, "global_step": 374268, "epoch": 4509} {"train_loss": -26.009557723999023, "global_step": 374269, "epoch": 4509} {"train_loss": -26.234771728515625, "global_step": 374270, "epoch": 4509} {"train_loss": -26.211816787719727, "global_step": 374271, "epoch": 4509} {"train_loss": -25.926355361938477, "global_step": 374272, "epoch": 4509} {"train_loss": -26.05484962463379, "global_step": 374273, "epoch": 4509} {"train_loss": -26.252771377563477, "global_step": 374274, "epoch": 4509} {"train_loss": -26.468358993530273, "global_step": 374275, "epoch": 4509} {"train_loss": -26.279438018798828, "global_step": 374276, "epoch": 4509} {"train_loss": -26.24713706970215, "global_step": 374277, "epoch": 4509} {"train_loss": -26.046772003173828, "global_step": 374278, "epoch": 4509} {"train_loss": -26.35456657409668, "global_step": 374279, "epoch": 4509} {"train_loss": -26.47650718688965, "global_step": 374280, "epoch": 4509} {"train_loss": -26.374982833862305, "global_step": 374281, "epoch": 4509} {"train_loss": -26.17815589904785, "global_step": 374282, "epoch": 4509} {"train_loss": -26.315439224243164, "global_step": 374283, "epoch": 4509} {"train_loss": -26.49188232421875, "global_step": 374284, "epoch": 4509} {"train_loss": -26.182538986206055, "global_step": 374285, "epoch": 4509} {"train_loss": -26.416854858398438, "global_step": 374286, "epoch": 4509} {"train_loss": -26.80488395690918, "global_step": 374287, "epoch": 4509} {"train_loss": -26.3875789642334, "global_step": 374288, "epoch": 4509} {"train_loss": -26.691436767578125, "global_step": 374289, "epoch": 4509} {"train_loss": -26.459552764892578, "global_step": 374290, "epoch": 4509} {"train_loss": -26.405948638916016, "global_step": 374291, "epoch": 4509} {"train_loss": -26.291946411132812, "global_step": 374292, "epoch": 4509} {"train_loss": -26.577722549438477, "global_step": 374293, "epoch": 4509} {"train_loss": -26.11673927307129, "global_step": 374294, "epoch": 4509} {"train_loss": -26.55022621154785, "global_step": 374295, "epoch": 4509} {"train_loss": -26.48372459411621, "global_step": 374296, "epoch": 4509} {"train_loss": -26.179189682006836, "global_step": 374297, "epoch": 4509} {"train_loss": -26.313135147094727, "global_step": 374298, "epoch": 4509} {"train_loss": -26.5320987701416, "global_step": 374299, "epoch": 4509} {"train_loss": -26.1754093170166, "global_step": 374300, "epoch": 4509} {"train_loss": -26.31817626953125, "global_step": 374301, "epoch": 4509} {"train_loss": -26.22920036315918, "global_step": 374302, "epoch": 4509} {"train_loss": -26.282819747924805, "global_step": 374303, "epoch": 4509} {"train_loss": -26.37738037109375, "global_step": 374304, "epoch": 4509} {"train_loss": -26.657886505126953, "global_step": 374305, "epoch": 4509} {"train_loss": -26.51283073425293, "global_step": 374306, "epoch": 4509} {"train_loss": -26.52508544921875, "global_step": 374307, "epoch": 4509} {"train_loss": -26.29740333557129, "global_step": 374308, "epoch": 4509} {"train_loss": -26.568464279174805, "global_step": 374309, "epoch": 4509} {"train_loss": -26.504053115844727, "global_step": 374310, "epoch": 4509} {"train_loss": -26.4650821685791, "global_step": 374311, "epoch": 4509} {"train_loss": -26.468732833862305, "global_step": 374312, "epoch": 4509} {"train_loss": -26.64314079284668, "global_step": 374313, "epoch": 4509} {"train_loss": -26.201440811157227, "global_step": 374314, "epoch": 4509} {"train_loss": -26.49151611328125, "global_step": 374315, "epoch": 4509} {"train_loss": -26.5739688873291, "global_step": 374316, "epoch": 4509} {"train_loss": -26.369115829467773, "global_step": 374317, "epoch": 4509} {"train_loss": -26.609573364257812, "global_step": 374318, "epoch": 4509} {"train_loss": -26.561634063720703, "global_step": 374319, "epoch": 4509} {"train_loss": -26.814483642578125, "global_step": 374320, "epoch": 4509} {"train_loss": -26.705005645751953, "global_step": 374321, "epoch": 4509} {"train_loss": -26.47039794921875, "global_step": 374322, "epoch": 4509} {"train_loss": -26.475238800048828, "global_step": 374323, "epoch": 4509} {"train_loss": -26.398488998413086, "global_step": 374324, "epoch": 4509} {"train_loss": -26.474546432495117, "global_step": 374325, "epoch": 4509} {"train_loss": -26.208499908447266, "global_step": 374326, "epoch": 4509} {"train_loss": -26.32977294921875, "global_step": 374327, "epoch": 4509} {"train_loss": -26.44870948791504, "global_step": 374328, "epoch": 4509} {"train_loss": -26.260238440640002, "global_step": 374329, "epoch": 4509, "val_loss": 6682690.5} {"train_loss": -26.034900665283203, "global_step": 374330, "epoch": 4510} {"train_loss": -25.15563201904297, "global_step": 374331, "epoch": 4510} {"train_loss": -25.26125717163086, "global_step": 374332, "epoch": 4510} {"train_loss": -24.725751876831055, "global_step": 374333, "epoch": 4510} {"train_loss": -24.57903289794922, "global_step": 374334, "epoch": 4510} {"train_loss": -25.452077865600586, "global_step": 374335, "epoch": 4510} {"train_loss": -25.363937377929688, "global_step": 374336, "epoch": 4510} {"train_loss": -25.371614456176758, "global_step": 374337, "epoch": 4510} {"train_loss": -25.609134674072266, "global_step": 374338, "epoch": 4510} {"train_loss": -25.436643600463867, "global_step": 374339, "epoch": 4510} {"train_loss": -25.663562774658203, "global_step": 374340, "epoch": 4510} {"train_loss": -25.9138126373291, "global_step": 374341, "epoch": 4510} {"train_loss": -25.768049240112305, "global_step": 374342, "epoch": 4510} {"train_loss": -25.92193603515625, "global_step": 374343, "epoch": 4510} {"train_loss": -25.839740753173828, "global_step": 374344, "epoch": 4510} {"train_loss": -25.905054092407227, "global_step": 374345, "epoch": 4510} {"train_loss": -25.480506896972656, "global_step": 374346, "epoch": 4510} {"train_loss": -26.085241317749023, "global_step": 374347, "epoch": 4510} {"train_loss": -25.88822364807129, "global_step": 374348, "epoch": 4510} {"train_loss": -25.8916015625, "global_step": 374349, "epoch": 4510} {"train_loss": -26.3199462890625, "global_step": 374350, "epoch": 4510} {"train_loss": -26.06622886657715, "global_step": 374351, "epoch": 4510} {"train_loss": -26.151458740234375, "global_step": 374352, "epoch": 4510} {"train_loss": -25.997333526611328, "global_step": 374353, "epoch": 4510} {"train_loss": -25.986005783081055, "global_step": 374354, "epoch": 4510} {"train_loss": -26.310672760009766, "global_step": 374355, "epoch": 4510} {"train_loss": -26.46282386779785, "global_step": 374356, "epoch": 4510} {"train_loss": -26.485614776611328, "global_step": 374357, "epoch": 4510} {"train_loss": -26.21742820739746, "global_step": 374358, "epoch": 4510} {"train_loss": -26.482126235961914, "global_step": 374359, "epoch": 4510} {"train_loss": -26.24176597595215, "global_step": 374360, "epoch": 4510} {"train_loss": -26.43475341796875, "global_step": 374361, "epoch": 4510} {"train_loss": -26.464130401611328, "global_step": 374362, "epoch": 4510} {"train_loss": -26.380857467651367, "global_step": 374363, "epoch": 4510} {"train_loss": -26.614883422851562, "global_step": 374364, "epoch": 4510} {"train_loss": -26.33565330505371, "global_step": 374365, "epoch": 4510} {"train_loss": -26.454858779907227, "global_step": 374366, "epoch": 4510} {"train_loss": -26.594833374023438, "global_step": 374367, "epoch": 4510} {"train_loss": -26.386581420898438, "global_step": 374368, "epoch": 4510} {"train_loss": -26.5742130279541, "global_step": 374369, "epoch": 4510} {"train_loss": -26.5181884765625, "global_step": 374370, "epoch": 4510} {"train_loss": -26.687015533447266, "global_step": 374371, "epoch": 4510} {"train_loss": -26.4848575592041, "global_step": 374372, "epoch": 4510} {"train_loss": -26.4827823638916, "global_step": 374373, "epoch": 4510} {"train_loss": -26.91864585876465, "global_step": 374374, "epoch": 4510} {"train_loss": -27.024328231811523, "global_step": 374375, "epoch": 4510} {"train_loss": -26.91876792907715, "global_step": 374376, "epoch": 4510} {"train_loss": -26.337066650390625, "global_step": 374377, "epoch": 4510} {"train_loss": -26.643598556518555, "global_step": 374378, "epoch": 4510} {"train_loss": -26.641464233398438, "global_step": 374379, "epoch": 4510} {"train_loss": -26.680692672729492, "global_step": 374380, "epoch": 4510} {"train_loss": -26.58738136291504, "global_step": 374381, "epoch": 4510} {"train_loss": -26.582263946533203, "global_step": 374382, "epoch": 4510} {"train_loss": -26.730716705322266, "global_step": 374383, "epoch": 4510} {"train_loss": -26.2811336517334, "global_step": 374384, "epoch": 4510} {"train_loss": -26.341033935546875, "global_step": 374385, "epoch": 4510} {"train_loss": -26.242828369140625, "global_step": 374386, "epoch": 4510} {"train_loss": -26.54062843322754, "global_step": 374387, "epoch": 4510} {"train_loss": -26.103174209594727, "global_step": 374388, "epoch": 4510} {"train_loss": -26.022382736206055, "global_step": 374389, "epoch": 4510} {"train_loss": -26.298429489135742, "global_step": 374390, "epoch": 4510} {"train_loss": -26.14238929748535, "global_step": 374391, "epoch": 4510} {"train_loss": -26.154260635375977, "global_step": 374392, "epoch": 4510} {"train_loss": -25.7760009765625, "global_step": 374393, "epoch": 4510} {"train_loss": -26.270843505859375, "global_step": 374394, "epoch": 4510} {"train_loss": -26.469533920288086, "global_step": 374395, "epoch": 4510} {"train_loss": -26.036304473876953, "global_step": 374396, "epoch": 4510} {"train_loss": -26.060449600219727, "global_step": 374397, "epoch": 4510} {"train_loss": -26.22382164001465, "global_step": 374398, "epoch": 4510} {"train_loss": -25.902673721313477, "global_step": 374399, "epoch": 4510} {"train_loss": -25.753305435180664, "global_step": 374400, "epoch": 4510} {"train_loss": -25.96906852722168, "global_step": 374401, "epoch": 4510} {"train_loss": -26.481470108032227, "global_step": 374402, "epoch": 4510} {"train_loss": -26.61199951171875, "global_step": 374403, "epoch": 4510} {"train_loss": -26.359466552734375, "global_step": 374404, "epoch": 4510} {"train_loss": -26.581134796142578, "global_step": 374405, "epoch": 4510} {"train_loss": -26.446088790893555, "global_step": 374406, "epoch": 4510} {"train_loss": -26.459243774414062, "global_step": 374407, "epoch": 4510} {"train_loss": -26.138471603393555, "global_step": 374408, "epoch": 4510} {"train_loss": -26.231903076171875, "global_step": 374409, "epoch": 4510} {"train_loss": -26.453861236572266, "global_step": 374410, "epoch": 4510} {"train_loss": -26.292856216430664, "global_step": 374411, "epoch": 4510} {"train_loss": -26.16706135761307, "global_step": 374412, "epoch": 4510, "val_loss": 6638349.5} {"train_loss": -26.416748046875, "global_step": 374413, "epoch": 4511} {"train_loss": -26.036212921142578, "global_step": 374414, "epoch": 4511} {"train_loss": -26.103540420532227, "global_step": 374415, "epoch": 4511} {"train_loss": -26.16200065612793, "global_step": 374416, "epoch": 4511} {"train_loss": -26.549793243408203, "global_step": 374417, "epoch": 4511} {"train_loss": -26.315847396850586, "global_step": 374418, "epoch": 4511} {"train_loss": -26.083240509033203, "global_step": 374419, "epoch": 4511} {"train_loss": -26.011098861694336, "global_step": 374420, "epoch": 4511} {"train_loss": -26.378131866455078, "global_step": 374421, "epoch": 4511} {"train_loss": -26.020734786987305, "global_step": 374422, "epoch": 4511} {"train_loss": -26.631916046142578, "global_step": 374423, "epoch": 4511} {"train_loss": -26.201557159423828, "global_step": 374424, "epoch": 4511} {"train_loss": -26.282470703125, "global_step": 374425, "epoch": 4511} {"train_loss": -26.549901962280273, "global_step": 374426, "epoch": 4511} {"train_loss": -26.61860466003418, "global_step": 374427, "epoch": 4511} {"train_loss": -26.335113525390625, "global_step": 374428, "epoch": 4511} {"train_loss": -26.64336585998535, "global_step": 374429, "epoch": 4511} {"train_loss": -26.558353424072266, "global_step": 374430, "epoch": 4511} {"train_loss": -26.390180587768555, "global_step": 374431, "epoch": 4511} {"train_loss": -26.216779708862305, "global_step": 374432, "epoch": 4511} {"train_loss": -26.60336685180664, "global_step": 374433, "epoch": 4511} {"train_loss": -26.521127700805664, "global_step": 374434, "epoch": 4511} {"train_loss": -26.481531143188477, "global_step": 374435, "epoch": 4511} {"train_loss": -26.25788688659668, "global_step": 374436, "epoch": 4511} {"train_loss": -26.436750411987305, "global_step": 374437, "epoch": 4511} {"train_loss": -26.04258155822754, "global_step": 374438, "epoch": 4511} {"train_loss": -26.657672882080078, "global_step": 374439, "epoch": 4511} {"train_loss": -26.60613441467285, "global_step": 374440, "epoch": 4511} {"train_loss": -26.6539363861084, "global_step": 374441, "epoch": 4511} {"train_loss": -26.76372718811035, "global_step": 374442, "epoch": 4511} {"train_loss": -26.679401397705078, "global_step": 374443, "epoch": 4511} {"train_loss": -26.397714614868164, "global_step": 374444, "epoch": 4511} {"train_loss": -26.7066707611084, "global_step": 374445, "epoch": 4511} {"train_loss": -26.571502685546875, "global_step": 374446, "epoch": 4511} {"train_loss": -26.576154708862305, "global_step": 374447, "epoch": 4511} {"train_loss": -26.6830997467041, "global_step": 374448, "epoch": 4511} {"train_loss": -26.4964656829834, "global_step": 374449, "epoch": 4511} {"train_loss": -26.75741958618164, "global_step": 374450, "epoch": 4511} {"train_loss": -26.27473258972168, "global_step": 374451, "epoch": 4511} {"train_loss": -26.614744186401367, "global_step": 374452, "epoch": 4511} {"train_loss": -26.359643936157227, "global_step": 374453, "epoch": 4511} {"train_loss": -26.301788330078125, "global_step": 374454, "epoch": 4511} {"train_loss": -26.38018798828125, "global_step": 374455, "epoch": 4511} {"train_loss": -26.45404052734375, "global_step": 374456, "epoch": 4511} {"train_loss": -26.28572654724121, "global_step": 374457, "epoch": 4511} {"train_loss": -25.8162899017334, "global_step": 374458, "epoch": 4511} {"train_loss": -26.200162887573242, "global_step": 374459, "epoch": 4511} {"train_loss": -26.484973907470703, "global_step": 374460, "epoch": 4511} {"train_loss": -26.529926300048828, "global_step": 374461, "epoch": 4511} {"train_loss": -26.453550338745117, "global_step": 374462, "epoch": 4511} {"train_loss": -26.11529541015625, "global_step": 374463, "epoch": 4511} {"train_loss": -25.896102905273438, "global_step": 374464, "epoch": 4511} {"train_loss": -25.760208129882812, "global_step": 374465, "epoch": 4511} {"train_loss": -25.9328670501709, "global_step": 374466, "epoch": 4511} {"train_loss": -26.304996490478516, "global_step": 374467, "epoch": 4511} {"train_loss": -26.02039909362793, "global_step": 374468, "epoch": 4511} {"train_loss": -25.884918212890625, "global_step": 374469, "epoch": 4511} {"train_loss": -26.66046714782715, "global_step": 374470, "epoch": 4511} {"train_loss": -26.38026237487793, "global_step": 374471, "epoch": 4511} {"train_loss": -26.121662139892578, "global_step": 374472, "epoch": 4511} {"train_loss": -26.48651123046875, "global_step": 374473, "epoch": 4511} {"train_loss": -26.323211669921875, "global_step": 374474, "epoch": 4511} {"train_loss": -26.267210006713867, "global_step": 374475, "epoch": 4511} {"train_loss": -25.895898818969727, "global_step": 374476, "epoch": 4511} {"train_loss": -26.58339500427246, "global_step": 374477, "epoch": 4511} {"train_loss": -26.3858585357666, "global_step": 374478, "epoch": 4511} {"train_loss": -26.12890625, "global_step": 374479, "epoch": 4511} {"train_loss": -26.21184730529785, "global_step": 374480, "epoch": 4511} {"train_loss": -26.228647232055664, "global_step": 374481, "epoch": 4511} {"train_loss": -26.34364891052246, "global_step": 374482, "epoch": 4511} {"train_loss": -26.1134090423584, "global_step": 374483, "epoch": 4511} {"train_loss": -26.594511032104492, "global_step": 374484, "epoch": 4511} {"train_loss": -26.402118682861328, "global_step": 374485, "epoch": 4511} {"train_loss": -26.013809204101562, "global_step": 374486, "epoch": 4511} {"train_loss": -26.26898765563965, "global_step": 374487, "epoch": 4511} {"train_loss": -25.877338409423828, "global_step": 374488, "epoch": 4511} {"train_loss": -26.353925704956055, "global_step": 374489, "epoch": 4511} {"train_loss": -26.525592803955078, "global_step": 374490, "epoch": 4511} {"train_loss": -25.91230583190918, "global_step": 374491, "epoch": 4511} {"train_loss": -26.77167320251465, "global_step": 374492, "epoch": 4511} {"train_loss": -26.292383193969727, "global_step": 374493, "epoch": 4511} {"train_loss": -26.307703018188477, "global_step": 374494, "epoch": 4511} {"train_loss": -26.329777683120177, "global_step": 374495, "epoch": 4511, "val_loss": 6508821.5} {"train_loss": -26.191274642944336, "global_step": 374496, "epoch": 4512} {"train_loss": -26.129913330078125, "global_step": 374497, "epoch": 4512} {"train_loss": -26.072046279907227, "global_step": 374498, "epoch": 4512} {"train_loss": -26.1800479888916, "global_step": 374499, "epoch": 4512} {"train_loss": -25.80965232849121, "global_step": 374500, "epoch": 4512} {"train_loss": -26.06764030456543, "global_step": 374501, "epoch": 4512} {"train_loss": -25.991479873657227, "global_step": 374502, "epoch": 4512} {"train_loss": -26.58038902282715, "global_step": 374503, "epoch": 4512} {"train_loss": -25.833011627197266, "global_step": 374504, "epoch": 4512} {"train_loss": -26.428546905517578, "global_step": 374505, "epoch": 4512} {"train_loss": -26.15595817565918, "global_step": 374506, "epoch": 4512} {"train_loss": -26.03266716003418, "global_step": 374507, "epoch": 4512} {"train_loss": -26.325122833251953, "global_step": 374508, "epoch": 4512} {"train_loss": -26.592437744140625, "global_step": 374509, "epoch": 4512} {"train_loss": -26.23785972595215, "global_step": 374510, "epoch": 4512} {"train_loss": -26.168243408203125, "global_step": 374511, "epoch": 4512} {"train_loss": -26.403583526611328, "global_step": 374512, "epoch": 4512} {"train_loss": -26.60224723815918, "global_step": 374513, "epoch": 4512} {"train_loss": -26.515295028686523, "global_step": 374514, "epoch": 4512} {"train_loss": -26.460927963256836, "global_step": 374515, "epoch": 4512} {"train_loss": -26.07369041442871, "global_step": 374516, "epoch": 4512} {"train_loss": -26.256488800048828, "global_step": 374517, "epoch": 4512} {"train_loss": -26.376623153686523, "global_step": 374518, "epoch": 4512} {"train_loss": -26.36761474609375, "global_step": 374519, "epoch": 4512} {"train_loss": -26.383588790893555, "global_step": 374520, "epoch": 4512} {"train_loss": -26.15094566345215, "global_step": 374521, "epoch": 4512} {"train_loss": -26.72987937927246, "global_step": 374522, "epoch": 4512} {"train_loss": -26.483367919921875, "global_step": 374523, "epoch": 4512} {"train_loss": -26.418500900268555, "global_step": 374524, "epoch": 4512} {"train_loss": -26.335290908813477, "global_step": 374525, "epoch": 4512} {"train_loss": -26.2756404876709, "global_step": 374526, "epoch": 4512} {"train_loss": -26.71375846862793, "global_step": 374527, "epoch": 4512} {"train_loss": -26.54774284362793, "global_step": 374528, "epoch": 4512} {"train_loss": -26.29133415222168, "global_step": 374529, "epoch": 4512} {"train_loss": -26.54006004333496, "global_step": 374530, "epoch": 4512} {"train_loss": -26.760833740234375, "global_step": 374531, "epoch": 4512} {"train_loss": -26.356603622436523, "global_step": 374532, "epoch": 4512} {"train_loss": -26.216108322143555, "global_step": 374533, "epoch": 4512} {"train_loss": -26.374982833862305, "global_step": 374534, "epoch": 4512} {"train_loss": -26.465665817260742, "global_step": 374535, "epoch": 4512} {"train_loss": -26.213964462280273, "global_step": 374536, "epoch": 4512} {"train_loss": -26.378665924072266, "global_step": 374537, "epoch": 4512} {"train_loss": -26.56000328063965, "global_step": 374538, "epoch": 4512} {"train_loss": -26.513120651245117, "global_step": 374539, "epoch": 4512} {"train_loss": -26.418622970581055, "global_step": 374540, "epoch": 4512} {"train_loss": -26.255319595336914, "global_step": 374541, "epoch": 4512} {"train_loss": -26.535064697265625, "global_step": 374542, "epoch": 4512} {"train_loss": -26.4310245513916, "global_step": 374543, "epoch": 4512} {"train_loss": -26.54486656188965, "global_step": 374544, "epoch": 4512} {"train_loss": -26.762176513671875, "global_step": 374545, "epoch": 4512} {"train_loss": -26.5252628326416, "global_step": 374546, "epoch": 4512} {"train_loss": -25.975000381469727, "global_step": 374547, "epoch": 4512} {"train_loss": -26.3483829498291, "global_step": 374548, "epoch": 4512} {"train_loss": -26.544570922851562, "global_step": 374549, "epoch": 4512} {"train_loss": -26.577411651611328, "global_step": 374550, "epoch": 4512} {"train_loss": -26.536802291870117, "global_step": 374551, "epoch": 4512} {"train_loss": -26.445886611938477, "global_step": 374552, "epoch": 4512} {"train_loss": -26.309152603149414, "global_step": 374553, "epoch": 4512} {"train_loss": -26.1925106048584, "global_step": 374554, "epoch": 4512} {"train_loss": -26.5283203125, "global_step": 374555, "epoch": 4512} {"train_loss": -26.236225128173828, "global_step": 374556, "epoch": 4512} {"train_loss": -26.523681640625, "global_step": 374557, "epoch": 4512} {"train_loss": -25.987812042236328, "global_step": 374558, "epoch": 4512} {"train_loss": -25.61343765258789, "global_step": 374559, "epoch": 4512} {"train_loss": -25.1845760345459, "global_step": 374560, "epoch": 4512} {"train_loss": -26.165990829467773, "global_step": 374561, "epoch": 4512} {"train_loss": -26.816226959228516, "global_step": 374562, "epoch": 4512} {"train_loss": -25.810964584350586, "global_step": 374563, "epoch": 4512} {"train_loss": -26.22598648071289, "global_step": 374564, "epoch": 4512} {"train_loss": -26.466367721557617, "global_step": 374565, "epoch": 4512} {"train_loss": -26.21063232421875, "global_step": 374566, "epoch": 4512} {"train_loss": -26.394866943359375, "global_step": 374567, "epoch": 4512} {"train_loss": -25.976789474487305, "global_step": 374568, "epoch": 4512} {"train_loss": -26.138824462890625, "global_step": 374569, "epoch": 4512} {"train_loss": -26.34309959411621, "global_step": 374570, "epoch": 4512} {"train_loss": -26.45857048034668, "global_step": 374571, "epoch": 4512} {"train_loss": -26.048566818237305, "global_step": 374572, "epoch": 4512} {"train_loss": -26.410017013549805, "global_step": 374573, "epoch": 4512} {"train_loss": -26.10731315612793, "global_step": 374574, "epoch": 4512} {"train_loss": -26.625574111938477, "global_step": 374575, "epoch": 4512} {"train_loss": -26.509872436523438, "global_step": 374576, "epoch": 4512} {"train_loss": -26.052106857299805, "global_step": 374577, "epoch": 4512} {"train_loss": -26.310710401420135, "global_step": 374578, "epoch": 4512, "val_loss": 6655694.0} {"train_loss": -25.85552978515625, "global_step": 374579, "epoch": 4513} {"train_loss": -25.43395233154297, "global_step": 374580, "epoch": 4513} {"train_loss": -25.170942306518555, "global_step": 374581, "epoch": 4513} {"train_loss": -25.811086654663086, "global_step": 374582, "epoch": 4513} {"train_loss": -26.099851608276367, "global_step": 374583, "epoch": 4513} {"train_loss": -26.256635665893555, "global_step": 374584, "epoch": 4513} {"train_loss": -26.35341453552246, "global_step": 374585, "epoch": 4513} {"train_loss": -26.185400009155273, "global_step": 374586, "epoch": 4513} {"train_loss": -26.129745483398438, "global_step": 374587, "epoch": 4513} {"train_loss": -26.481220245361328, "global_step": 374588, "epoch": 4513} {"train_loss": -26.264999389648438, "global_step": 374589, "epoch": 4513} {"train_loss": -25.95562171936035, "global_step": 374590, "epoch": 4513} {"train_loss": -25.830097198486328, "global_step": 374591, "epoch": 4513} {"train_loss": -26.4306583404541, "global_step": 374592, "epoch": 4513} {"train_loss": -26.00760269165039, "global_step": 374593, "epoch": 4513} {"train_loss": -26.223379135131836, "global_step": 374594, "epoch": 4513} {"train_loss": -26.028573989868164, "global_step": 374595, "epoch": 4513} {"train_loss": -26.059661865234375, "global_step": 374596, "epoch": 4513} {"train_loss": -26.071500778198242, "global_step": 374597, "epoch": 4513} {"train_loss": -26.321447372436523, "global_step": 374598, "epoch": 4513} {"train_loss": -26.404516220092773, "global_step": 374599, "epoch": 4513} {"train_loss": -26.728260040283203, "global_step": 374600, "epoch": 4513} {"train_loss": -26.44245719909668, "global_step": 374601, "epoch": 4513} {"train_loss": -25.996442794799805, "global_step": 374602, "epoch": 4513} {"train_loss": -26.646198272705078, "global_step": 374603, "epoch": 4513} {"train_loss": -26.41071891784668, "global_step": 374604, "epoch": 4513} {"train_loss": -26.450016021728516, "global_step": 374605, "epoch": 4513} {"train_loss": -26.383527755737305, "global_step": 374606, "epoch": 4513} {"train_loss": -26.523883819580078, "global_step": 374607, "epoch": 4513} {"train_loss": -26.764963150024414, "global_step": 374608, "epoch": 4513} {"train_loss": -26.234725952148438, "global_step": 374609, "epoch": 4513} {"train_loss": -26.38289451599121, "global_step": 374610, "epoch": 4513} {"train_loss": -26.181623458862305, "global_step": 374611, "epoch": 4513} {"train_loss": -26.5484561920166, "global_step": 374612, "epoch": 4513} {"train_loss": -26.430517196655273, "global_step": 374613, "epoch": 4513} {"train_loss": -26.60446548461914, "global_step": 374614, "epoch": 4513} {"train_loss": -26.496118545532227, "global_step": 374615, "epoch": 4513} {"train_loss": -26.7985897064209, "global_step": 374616, "epoch": 4513} {"train_loss": -26.52619743347168, "global_step": 374617, "epoch": 4513} {"train_loss": -26.625242233276367, "global_step": 374618, "epoch": 4513} {"train_loss": -26.3494873046875, "global_step": 374619, "epoch": 4513} {"train_loss": -26.733295440673828, "global_step": 374620, "epoch": 4513} {"train_loss": -26.678380966186523, "global_step": 374621, "epoch": 4513} {"train_loss": -26.650558471679688, "global_step": 374622, "epoch": 4513} {"train_loss": -26.52320671081543, "global_step": 374623, "epoch": 4513} {"train_loss": -26.725360870361328, "global_step": 374624, "epoch": 4513} {"train_loss": -26.67024803161621, "global_step": 374625, "epoch": 4513} {"train_loss": -26.741485595703125, "global_step": 374626, "epoch": 4513} {"train_loss": -26.666278839111328, "global_step": 374627, "epoch": 4513} {"train_loss": -26.320556640625, "global_step": 374628, "epoch": 4513} {"train_loss": -26.392333984375, "global_step": 374629, "epoch": 4513} {"train_loss": -26.422719955444336, "global_step": 374630, "epoch": 4513} {"train_loss": -26.465351104736328, "global_step": 374631, "epoch": 4513} {"train_loss": -26.64967155456543, "global_step": 374632, "epoch": 4513} {"train_loss": -26.894336700439453, "global_step": 374633, "epoch": 4513} {"train_loss": -26.590356826782227, "global_step": 374634, "epoch": 4513} {"train_loss": -26.68915367126465, "global_step": 374635, "epoch": 4513} {"train_loss": -26.589086532592773, "global_step": 374636, "epoch": 4513} {"train_loss": -26.93172264099121, "global_step": 374637, "epoch": 4513} {"train_loss": -26.482030868530273, "global_step": 374638, "epoch": 4513} {"train_loss": -26.49849510192871, "global_step": 374639, "epoch": 4513} {"train_loss": -26.526891708374023, "global_step": 374640, "epoch": 4513} {"train_loss": -26.470870971679688, "global_step": 374641, "epoch": 4513} {"train_loss": -26.956787109375, "global_step": 374642, "epoch": 4513} {"train_loss": -26.910993576049805, "global_step": 374643, "epoch": 4513} {"train_loss": -26.703027725219727, "global_step": 374644, "epoch": 4513} {"train_loss": -26.624847412109375, "global_step": 374645, "epoch": 4513} {"train_loss": -26.481647491455078, "global_step": 374646, "epoch": 4513} {"train_loss": -25.54443359375, "global_step": 374647, "epoch": 4513} {"train_loss": -25.690961837768555, "global_step": 374648, "epoch": 4513} {"train_loss": -24.963523864746094, "global_step": 374649, "epoch": 4513} {"train_loss": -23.845312118530273, "global_step": 374650, "epoch": 4513} {"train_loss": -24.82521629333496, "global_step": 374651, "epoch": 4513} {"train_loss": -26.06587028503418, "global_step": 374652, "epoch": 4513} {"train_loss": -26.106796264648438, "global_step": 374653, "epoch": 4513} {"train_loss": -25.73884391784668, "global_step": 374654, "epoch": 4513} {"train_loss": -26.49591636657715, "global_step": 374655, "epoch": 4513} {"train_loss": -26.110021591186523, "global_step": 374656, "epoch": 4513} {"train_loss": -26.2607421875, "global_step": 374657, "epoch": 4513} {"train_loss": -26.228717803955078, "global_step": 374658, "epoch": 4513} {"train_loss": -26.32209587097168, "global_step": 374659, "epoch": 4513} {"train_loss": -25.881149291992188, "global_step": 374660, "epoch": 4513} {"train_loss": -26.2938232421875, "global_step": 374661, "epoch": 4513, "val_loss": 6553764.0} {"train_loss": -26.22879409790039, "global_step": 374662, "epoch": 4514} {"train_loss": -25.463241577148438, "global_step": 374663, "epoch": 4514} {"train_loss": -25.65632438659668, "global_step": 374664, "epoch": 4514} {"train_loss": -25.462583541870117, "global_step": 374665, "epoch": 4514} {"train_loss": -25.900793075561523, "global_step": 374666, "epoch": 4514} {"train_loss": -25.84584617614746, "global_step": 374667, "epoch": 4514} {"train_loss": -26.094221115112305, "global_step": 374668, "epoch": 4514} {"train_loss": -25.957128524780273, "global_step": 374669, "epoch": 4514} {"train_loss": -25.661779403686523, "global_step": 374670, "epoch": 4514} {"train_loss": -25.552011489868164, "global_step": 374671, "epoch": 4514} {"train_loss": -25.84647560119629, "global_step": 374672, "epoch": 4514} {"train_loss": -26.10697364807129, "global_step": 374673, "epoch": 4514} {"train_loss": -26.019031524658203, "global_step": 374674, "epoch": 4514} {"train_loss": -26.27634048461914, "global_step": 374675, "epoch": 4514} {"train_loss": -25.899799346923828, "global_step": 374676, "epoch": 4514} {"train_loss": -26.17919921875, "global_step": 374677, "epoch": 4514} {"train_loss": -26.055316925048828, "global_step": 374678, "epoch": 4514} {"train_loss": -25.946752548217773, "global_step": 374679, "epoch": 4514} {"train_loss": -26.26161766052246, "global_step": 374680, "epoch": 4514} {"train_loss": -26.178516387939453, "global_step": 374681, "epoch": 4514} {"train_loss": -26.307241439819336, "global_step": 374682, "epoch": 4514} {"train_loss": -26.259723663330078, "global_step": 374683, "epoch": 4514} {"train_loss": -26.45425796508789, "global_step": 374684, "epoch": 4514} {"train_loss": -26.01434326171875, "global_step": 374685, "epoch": 4514} {"train_loss": -26.4139404296875, "global_step": 374686, "epoch": 4514} {"train_loss": -26.152587890625, "global_step": 374687, "epoch": 4514} {"train_loss": -25.92572593688965, "global_step": 374688, "epoch": 4514} {"train_loss": -26.315265655517578, "global_step": 374689, "epoch": 4514} {"train_loss": -26.744733810424805, "global_step": 374690, "epoch": 4514} {"train_loss": -26.653104782104492, "global_step": 374691, "epoch": 4514} {"train_loss": -25.96904945373535, "global_step": 374692, "epoch": 4514} {"train_loss": -26.256179809570312, "global_step": 374693, "epoch": 4514} {"train_loss": -26.368274688720703, "global_step": 374694, "epoch": 4514} {"train_loss": -26.609472274780273, "global_step": 374695, "epoch": 4514} {"train_loss": -26.453886032104492, "global_step": 374696, "epoch": 4514} {"train_loss": -26.29861831665039, "global_step": 374697, "epoch": 4514} {"train_loss": -26.5831241607666, "global_step": 374698, "epoch": 4514} {"train_loss": -26.60462760925293, "global_step": 374699, "epoch": 4514} {"train_loss": -26.41791343688965, "global_step": 374700, "epoch": 4514} {"train_loss": -26.154788970947266, "global_step": 374701, "epoch": 4514} {"train_loss": -26.58026695251465, "global_step": 374702, "epoch": 4514} {"train_loss": -26.47356605529785, "global_step": 374703, "epoch": 4514} {"train_loss": -26.537673950195312, "global_step": 374704, "epoch": 4514} {"train_loss": -26.386341094970703, "global_step": 374705, "epoch": 4514} {"train_loss": -26.723953247070312, "global_step": 374706, "epoch": 4514} {"train_loss": -26.748361587524414, "global_step": 374707, "epoch": 4514} {"train_loss": -26.847593307495117, "global_step": 374708, "epoch": 4514} {"train_loss": -26.625837326049805, "global_step": 374709, "epoch": 4514} {"train_loss": -26.49715232849121, "global_step": 374710, "epoch": 4514} {"train_loss": -26.627197265625, "global_step": 374711, "epoch": 4514} {"train_loss": -26.563507080078125, "global_step": 374712, "epoch": 4514} {"train_loss": -26.785852432250977, "global_step": 374713, "epoch": 4514} {"train_loss": -26.181745529174805, "global_step": 374714, "epoch": 4514} {"train_loss": -26.658655166625977, "global_step": 374715, "epoch": 4514} {"train_loss": -26.618982315063477, "global_step": 374716, "epoch": 4514} {"train_loss": -26.43096923828125, "global_step": 374717, "epoch": 4514} {"train_loss": -26.299976348876953, "global_step": 374718, "epoch": 4514} {"train_loss": -26.9025821685791, "global_step": 374719, "epoch": 4514} {"train_loss": -26.512939453125, "global_step": 374720, "epoch": 4514} {"train_loss": -26.382802963256836, "global_step": 374721, "epoch": 4514} {"train_loss": -26.617170333862305, "global_step": 374722, "epoch": 4514} {"train_loss": -26.362524032592773, "global_step": 374723, "epoch": 4514} {"train_loss": -26.194427490234375, "global_step": 374724, "epoch": 4514} {"train_loss": -26.250946044921875, "global_step": 374725, "epoch": 4514} {"train_loss": -26.050901412963867, "global_step": 374726, "epoch": 4514} {"train_loss": -26.566299438476562, "global_step": 374727, "epoch": 4514} {"train_loss": -26.22468376159668, "global_step": 374728, "epoch": 4514} {"train_loss": -26.720233917236328, "global_step": 374729, "epoch": 4514} {"train_loss": -26.697284698486328, "global_step": 374730, "epoch": 4514} {"train_loss": -26.609891891479492, "global_step": 374731, "epoch": 4514} {"train_loss": -26.630401611328125, "global_step": 374732, "epoch": 4514} {"train_loss": -26.409570693969727, "global_step": 374733, "epoch": 4514} {"train_loss": -26.776090621948242, "global_step": 374734, "epoch": 4514} {"train_loss": -26.520444869995117, "global_step": 374735, "epoch": 4514} {"train_loss": -26.283344268798828, "global_step": 374736, "epoch": 4514} {"train_loss": -26.56214714050293, "global_step": 374737, "epoch": 4514} {"train_loss": -26.28229331970215, "global_step": 374738, "epoch": 4514} {"train_loss": -26.375574111938477, "global_step": 374739, "epoch": 4514} {"train_loss": -26.724069595336914, "global_step": 374740, "epoch": 4514} {"train_loss": -26.4094295501709, "global_step": 374741, "epoch": 4514} {"train_loss": -26.3759708404541, "global_step": 374742, "epoch": 4514} {"train_loss": -26.02853775024414, "global_step": 374743, "epoch": 4514} {"train_loss": -26.324353574270226, "global_step": 374744, "epoch": 4514, "val_loss": 6548172.0} {"train_loss": -25.114131927490234, "global_step": 374745, "epoch": 4515} {"train_loss": -25.534496307373047, "global_step": 374746, "epoch": 4515} {"train_loss": -25.74537467956543, "global_step": 374747, "epoch": 4515} {"train_loss": -25.4370174407959, "global_step": 374748, "epoch": 4515} {"train_loss": -25.866064071655273, "global_step": 374749, "epoch": 4515} {"train_loss": -25.870559692382812, "global_step": 374750, "epoch": 4515} {"train_loss": -26.11585807800293, "global_step": 374751, "epoch": 4515} {"train_loss": -25.698230743408203, "global_step": 374752, "epoch": 4515} {"train_loss": -26.08762550354004, "global_step": 374753, "epoch": 4515} {"train_loss": -25.748584747314453, "global_step": 374754, "epoch": 4515} {"train_loss": -25.727392196655273, "global_step": 374755, "epoch": 4515} {"train_loss": -26.198389053344727, "global_step": 374756, "epoch": 4515} {"train_loss": -26.16731071472168, "global_step": 374757, "epoch": 4515} {"train_loss": -26.288909912109375, "global_step": 374758, "epoch": 4515} {"train_loss": -26.12554931640625, "global_step": 374759, "epoch": 4515} {"train_loss": -26.217315673828125, "global_step": 374760, "epoch": 4515} {"train_loss": -25.90250015258789, "global_step": 374761, "epoch": 4515} {"train_loss": -26.42013931274414, "global_step": 374762, "epoch": 4515} {"train_loss": -25.85602378845215, "global_step": 374763, "epoch": 4515} {"train_loss": -26.18116569519043, "global_step": 374764, "epoch": 4515} {"train_loss": -25.607755661010742, "global_step": 374765, "epoch": 4515} {"train_loss": -25.931745529174805, "global_step": 374766, "epoch": 4515} {"train_loss": -26.321630477905273, "global_step": 374767, "epoch": 4515} {"train_loss": -25.750778198242188, "global_step": 374768, "epoch": 4515} {"train_loss": -26.223196029663086, "global_step": 374769, "epoch": 4515} {"train_loss": -26.121145248413086, "global_step": 374770, "epoch": 4515} {"train_loss": -26.091983795166016, "global_step": 374771, "epoch": 4515} {"train_loss": -26.424942016601562, "global_step": 374772, "epoch": 4515} {"train_loss": -26.334869384765625, "global_step": 374773, "epoch": 4515} {"train_loss": -26.05134391784668, "global_step": 374774, "epoch": 4515} {"train_loss": -26.197269439697266, "global_step": 374775, "epoch": 4515} {"train_loss": -26.34761619567871, "global_step": 374776, "epoch": 4515} {"train_loss": -26.40574073791504, "global_step": 374777, "epoch": 4515} {"train_loss": -26.45084571838379, "global_step": 374778, "epoch": 4515} {"train_loss": -25.81926918029785, "global_step": 374779, "epoch": 4515} {"train_loss": -26.533466339111328, "global_step": 374780, "epoch": 4515} {"train_loss": -26.739484786987305, "global_step": 374781, "epoch": 4515} {"train_loss": -26.570714950561523, "global_step": 374782, "epoch": 4515} {"train_loss": -26.266510009765625, "global_step": 374783, "epoch": 4515} {"train_loss": -26.695348739624023, "global_step": 374784, "epoch": 4515} {"train_loss": -26.28750991821289, "global_step": 374785, "epoch": 4515} {"train_loss": -26.330148696899414, "global_step": 374786, "epoch": 4515} {"train_loss": -26.60255241394043, "global_step": 374787, "epoch": 4515} {"train_loss": -26.257360458374023, "global_step": 374788, "epoch": 4515} {"train_loss": -26.209854125976562, "global_step": 374789, "epoch": 4515} {"train_loss": -26.44071388244629, "global_step": 374790, "epoch": 4515} {"train_loss": -26.382892608642578, "global_step": 374791, "epoch": 4515} {"train_loss": -26.354938507080078, "global_step": 374792, "epoch": 4515} {"train_loss": -26.307947158813477, "global_step": 374793, "epoch": 4515} {"train_loss": -26.334796905517578, "global_step": 374794, "epoch": 4515} {"train_loss": -26.534772872924805, "global_step": 374795, "epoch": 4515} {"train_loss": -26.46516227722168, "global_step": 374796, "epoch": 4515} {"train_loss": -26.31678581237793, "global_step": 374797, "epoch": 4515} {"train_loss": -26.378742218017578, "global_step": 374798, "epoch": 4515} {"train_loss": -26.32891273498535, "global_step": 374799, "epoch": 4515} {"train_loss": -26.47323989868164, "global_step": 374800, "epoch": 4515} {"train_loss": -26.224609375, "global_step": 374801, "epoch": 4515} {"train_loss": -26.50605583190918, "global_step": 374802, "epoch": 4515} {"train_loss": -26.711469650268555, "global_step": 374803, "epoch": 4515} {"train_loss": -26.18692970275879, "global_step": 374804, "epoch": 4515} {"train_loss": -26.934240341186523, "global_step": 374805, "epoch": 4515} {"train_loss": -26.411909103393555, "global_step": 374806, "epoch": 4515} {"train_loss": -26.424463272094727, "global_step": 374807, "epoch": 4515} {"train_loss": -26.36962890625, "global_step": 374808, "epoch": 4515} {"train_loss": -26.344202041625977, "global_step": 374809, "epoch": 4515} {"train_loss": -26.66217041015625, "global_step": 374810, "epoch": 4515} {"train_loss": -26.835620880126953, "global_step": 374811, "epoch": 4515} {"train_loss": -26.355545043945312, "global_step": 374812, "epoch": 4515} {"train_loss": -26.753049850463867, "global_step": 374813, "epoch": 4515} {"train_loss": -26.629201889038086, "global_step": 374814, "epoch": 4515} {"train_loss": -26.643728256225586, "global_step": 374815, "epoch": 4515} {"train_loss": -26.569721221923828, "global_step": 374816, "epoch": 4515} {"train_loss": -26.38557243347168, "global_step": 374817, "epoch": 4515} {"train_loss": -26.80634117126465, "global_step": 374818, "epoch": 4515} {"train_loss": -26.636173248291016, "global_step": 374819, "epoch": 4515} {"train_loss": -26.214344024658203, "global_step": 374820, "epoch": 4515} {"train_loss": -26.78814697265625, "global_step": 374821, "epoch": 4515} {"train_loss": -26.616724014282227, "global_step": 374822, "epoch": 4515} {"train_loss": -26.444965362548828, "global_step": 374823, "epoch": 4515} {"train_loss": -26.271060943603516, "global_step": 374824, "epoch": 4515} {"train_loss": -26.75893211364746, "global_step": 374825, "epoch": 4515} {"train_loss": -26.53980827331543, "global_step": 374826, "epoch": 4515} {"train_loss": -26.286575776984893, "global_step": 374827, "epoch": 4515, "val_loss": 6647385.0} {"train_loss": -24.687135696411133, "global_step": 374828, "epoch": 4516} {"train_loss": -24.08443260192871, "global_step": 374829, "epoch": 4516} {"train_loss": -25.595874786376953, "global_step": 374830, "epoch": 4516} {"train_loss": -25.190006256103516, "global_step": 374831, "epoch": 4516} {"train_loss": -24.806753158569336, "global_step": 374832, "epoch": 4516} {"train_loss": -25.248741149902344, "global_step": 374833, "epoch": 4516} {"train_loss": -25.355573654174805, "global_step": 374834, "epoch": 4516} {"train_loss": -25.83561134338379, "global_step": 374835, "epoch": 4516} {"train_loss": -25.289609909057617, "global_step": 374836, "epoch": 4516} {"train_loss": -25.89664077758789, "global_step": 374837, "epoch": 4516} {"train_loss": -25.478750228881836, "global_step": 374838, "epoch": 4516} {"train_loss": -25.624181747436523, "global_step": 374839, "epoch": 4516} {"train_loss": -25.93165397644043, "global_step": 374840, "epoch": 4516} {"train_loss": -25.72840690612793, "global_step": 374841, "epoch": 4516} {"train_loss": -25.807205200195312, "global_step": 374842, "epoch": 4516} {"train_loss": -25.584440231323242, "global_step": 374843, "epoch": 4516} {"train_loss": -26.109228134155273, "global_step": 374844, "epoch": 4516} {"train_loss": -26.016050338745117, "global_step": 374845, "epoch": 4516} {"train_loss": -26.07215690612793, "global_step": 374846, "epoch": 4516} {"train_loss": -26.350021362304688, "global_step": 374847, "epoch": 4516} {"train_loss": -26.381254196166992, "global_step": 374848, "epoch": 4516} {"train_loss": -26.018356323242188, "global_step": 374849, "epoch": 4516} {"train_loss": -25.821979522705078, "global_step": 374850, "epoch": 4516} {"train_loss": -26.143163681030273, "global_step": 374851, "epoch": 4516} {"train_loss": -26.19121742248535, "global_step": 374852, "epoch": 4516} {"train_loss": -26.310876846313477, "global_step": 374853, "epoch": 4516} {"train_loss": -26.414636611938477, "global_step": 374854, "epoch": 4516} {"train_loss": -26.281293869018555, "global_step": 374855, "epoch": 4516} {"train_loss": -26.485584259033203, "global_step": 374856, "epoch": 4516} {"train_loss": -26.446577072143555, "global_step": 374857, "epoch": 4516} {"train_loss": -26.392698287963867, "global_step": 374858, "epoch": 4516} {"train_loss": -26.17384147644043, "global_step": 374859, "epoch": 4516} {"train_loss": -26.234045028686523, "global_step": 374860, "epoch": 4516} {"train_loss": -26.051502227783203, "global_step": 374861, "epoch": 4516} {"train_loss": -26.20806884765625, "global_step": 374862, "epoch": 4516} {"train_loss": -26.506738662719727, "global_step": 374863, "epoch": 4516} {"train_loss": -26.475427627563477, "global_step": 374864, "epoch": 4516} {"train_loss": -26.104984283447266, "global_step": 374865, "epoch": 4516} {"train_loss": -26.614974975585938, "global_step": 374866, "epoch": 4516} {"train_loss": -26.487686157226562, "global_step": 374867, "epoch": 4516} {"train_loss": -26.042417526245117, "global_step": 374868, "epoch": 4516} {"train_loss": -26.31304359436035, "global_step": 374869, "epoch": 4516} {"train_loss": -26.234577178955078, "global_step": 374870, "epoch": 4516} {"train_loss": -26.0817928314209, "global_step": 374871, "epoch": 4516} {"train_loss": -26.350805282592773, "global_step": 374872, "epoch": 4516} {"train_loss": -26.884510040283203, "global_step": 374873, "epoch": 4516} {"train_loss": -25.866601943969727, "global_step": 374874, "epoch": 4516} {"train_loss": -25.94231605529785, "global_step": 374875, "epoch": 4516} {"train_loss": -26.379735946655273, "global_step": 374876, "epoch": 4516} {"train_loss": -26.235227584838867, "global_step": 374877, "epoch": 4516} {"train_loss": -26.16330337524414, "global_step": 374878, "epoch": 4516} {"train_loss": -26.55049705505371, "global_step": 374879, "epoch": 4516} {"train_loss": -26.447778701782227, "global_step": 374880, "epoch": 4516} {"train_loss": -26.129919052124023, "global_step": 374881, "epoch": 4516} {"train_loss": -26.376434326171875, "global_step": 374882, "epoch": 4516} {"train_loss": -26.036773681640625, "global_step": 374883, "epoch": 4516} {"train_loss": -26.544464111328125, "global_step": 374884, "epoch": 4516} {"train_loss": -26.465707778930664, "global_step": 374885, "epoch": 4516} {"train_loss": -26.465505599975586, "global_step": 374886, "epoch": 4516} {"train_loss": -26.572736740112305, "global_step": 374887, "epoch": 4516} {"train_loss": -26.504026412963867, "global_step": 374888, "epoch": 4516} {"train_loss": -26.466394424438477, "global_step": 374889, "epoch": 4516} {"train_loss": -26.103302001953125, "global_step": 374890, "epoch": 4516} {"train_loss": -26.376638412475586, "global_step": 374891, "epoch": 4516} {"train_loss": -26.484586715698242, "global_step": 374892, "epoch": 4516} {"train_loss": -26.535947799682617, "global_step": 374893, "epoch": 4516} {"train_loss": -26.46588706970215, "global_step": 374894, "epoch": 4516} {"train_loss": -26.556629180908203, "global_step": 374895, "epoch": 4516} {"train_loss": -26.184946060180664, "global_step": 374896, "epoch": 4516} {"train_loss": -26.593280792236328, "global_step": 374897, "epoch": 4516} {"train_loss": -26.259815216064453, "global_step": 374898, "epoch": 4516} {"train_loss": -26.5340576171875, "global_step": 374899, "epoch": 4516} {"train_loss": -26.567462921142578, "global_step": 374900, "epoch": 4516} {"train_loss": -26.69403076171875, "global_step": 374901, "epoch": 4516} {"train_loss": -26.662723541259766, "global_step": 374902, "epoch": 4516} {"train_loss": -26.616958618164062, "global_step": 374903, "epoch": 4516} {"train_loss": -26.703815460205078, "global_step": 374904, "epoch": 4516} {"train_loss": -26.43621826171875, "global_step": 374905, "epoch": 4516} {"train_loss": -26.65667152404785, "global_step": 374906, "epoch": 4516} {"train_loss": -26.12750816345215, "global_step": 374907, "epoch": 4516} {"train_loss": -26.352582931518555, "global_step": 374908, "epoch": 4516} {"train_loss": -26.441099166870117, "global_step": 374909, "epoch": 4516} {"train_loss": -26.149738426668097, "global_step": 374910, "epoch": 4516, "val_loss": 6669629.0} {"train_loss": -26.275440216064453, "global_step": 374911, "epoch": 4517} {"train_loss": -26.16864585876465, "global_step": 374912, "epoch": 4517} {"train_loss": -25.882516860961914, "global_step": 374913, "epoch": 4517} {"train_loss": -25.3157901763916, "global_step": 374914, "epoch": 4517} {"train_loss": -26.117223739624023, "global_step": 374915, "epoch": 4517} {"train_loss": -25.453645706176758, "global_step": 374916, "epoch": 4517} {"train_loss": -26.363224029541016, "global_step": 374917, "epoch": 4517} {"train_loss": -25.283367156982422, "global_step": 374918, "epoch": 4517} {"train_loss": -25.999067306518555, "global_step": 374919, "epoch": 4517} {"train_loss": -26.2687931060791, "global_step": 374920, "epoch": 4517} {"train_loss": -25.554780960083008, "global_step": 374921, "epoch": 4517} {"train_loss": -26.035552978515625, "global_step": 374922, "epoch": 4517} {"train_loss": -25.8344669342041, "global_step": 374923, "epoch": 4517} {"train_loss": -26.110885620117188, "global_step": 374924, "epoch": 4517} {"train_loss": -25.987363815307617, "global_step": 374925, "epoch": 4517} {"train_loss": -25.93429946899414, "global_step": 374926, "epoch": 4517} {"train_loss": -25.98029899597168, "global_step": 374927, "epoch": 4517} {"train_loss": -26.485031127929688, "global_step": 374928, "epoch": 4517} {"train_loss": -26.09577751159668, "global_step": 374929, "epoch": 4517} {"train_loss": -26.2207088470459, "global_step": 374930, "epoch": 4517} {"train_loss": -26.317138671875, "global_step": 374931, "epoch": 4517} {"train_loss": -25.886825561523438, "global_step": 374932, "epoch": 4517} {"train_loss": -25.593347549438477, "global_step": 374933, "epoch": 4517} {"train_loss": -25.86995506286621, "global_step": 374934, "epoch": 4517} {"train_loss": -26.34379005432129, "global_step": 374935, "epoch": 4517} {"train_loss": -25.7758846282959, "global_step": 374936, "epoch": 4517} {"train_loss": -26.658294677734375, "global_step": 374937, "epoch": 4517} {"train_loss": -26.2264347076416, "global_step": 374938, "epoch": 4517} {"train_loss": -26.111953735351562, "global_step": 374939, "epoch": 4517} {"train_loss": -26.243152618408203, "global_step": 374940, "epoch": 4517} {"train_loss": -26.071073532104492, "global_step": 374941, "epoch": 4517} {"train_loss": -26.140644073486328, "global_step": 374942, "epoch": 4517} {"train_loss": -26.37283706665039, "global_step": 374943, "epoch": 4517} {"train_loss": -26.37955665588379, "global_step": 374944, "epoch": 4517} {"train_loss": -26.28668212890625, "global_step": 374945, "epoch": 4517} {"train_loss": -26.715417861938477, "global_step": 374946, "epoch": 4517} {"train_loss": -26.468647003173828, "global_step": 374947, "epoch": 4517} {"train_loss": -26.3387393951416, "global_step": 374948, "epoch": 4517} {"train_loss": -26.195714950561523, "global_step": 374949, "epoch": 4517} {"train_loss": -26.319355010986328, "global_step": 374950, "epoch": 4517} {"train_loss": -26.0812931060791, "global_step": 374951, "epoch": 4517} {"train_loss": -26.58930778503418, "global_step": 374952, "epoch": 4517} {"train_loss": -26.74555015563965, "global_step": 374953, "epoch": 4517} {"train_loss": -26.445850372314453, "global_step": 374954, "epoch": 4517} {"train_loss": -26.710058212280273, "global_step": 374955, "epoch": 4517} {"train_loss": -26.27090835571289, "global_step": 374956, "epoch": 4517} {"train_loss": -26.350500106811523, "global_step": 374957, "epoch": 4517} {"train_loss": -26.631933212280273, "global_step": 374958, "epoch": 4517} {"train_loss": -26.51614761352539, "global_step": 374959, "epoch": 4517} {"train_loss": -26.4434814453125, "global_step": 374960, "epoch": 4517} {"train_loss": -26.82758140563965, "global_step": 374961, "epoch": 4517} {"train_loss": -26.352582931518555, "global_step": 374962, "epoch": 4517} {"train_loss": -26.599231719970703, "global_step": 374963, "epoch": 4517} {"train_loss": -26.9473876953125, "global_step": 374964, "epoch": 4517} {"train_loss": -26.665124893188477, "global_step": 374965, "epoch": 4517} {"train_loss": -26.248884201049805, "global_step": 374966, "epoch": 4517} {"train_loss": -26.715381622314453, "global_step": 374967, "epoch": 4517} {"train_loss": -26.628742218017578, "global_step": 374968, "epoch": 4517} {"train_loss": -26.45404052734375, "global_step": 374969, "epoch": 4517} {"train_loss": -26.649581909179688, "global_step": 374970, "epoch": 4517} {"train_loss": -26.33588981628418, "global_step": 374971, "epoch": 4517} {"train_loss": -26.47235679626465, "global_step": 374972, "epoch": 4517} {"train_loss": -26.81707763671875, "global_step": 374973, "epoch": 4517} {"train_loss": -26.545032501220703, "global_step": 374974, "epoch": 4517} {"train_loss": -26.47796630859375, "global_step": 374975, "epoch": 4517} {"train_loss": -26.668684005737305, "global_step": 374976, "epoch": 4517} {"train_loss": -26.500934600830078, "global_step": 374977, "epoch": 4517} {"train_loss": -26.609485626220703, "global_step": 374978, "epoch": 4517} {"train_loss": -26.43137550354004, "global_step": 374979, "epoch": 4517} {"train_loss": -26.36823844909668, "global_step": 374980, "epoch": 4517} {"train_loss": -26.62286949157715, "global_step": 374981, "epoch": 4517} {"train_loss": -26.45014762878418, "global_step": 374982, "epoch": 4517} {"train_loss": -26.382192611694336, "global_step": 374983, "epoch": 4517} {"train_loss": -26.50029945373535, "global_step": 374984, "epoch": 4517} {"train_loss": -26.019214630126953, "global_step": 374985, "epoch": 4517} {"train_loss": -26.265033721923828, "global_step": 374986, "epoch": 4517} {"train_loss": -26.308334350585938, "global_step": 374987, "epoch": 4517} {"train_loss": -26.3560791015625, "global_step": 374988, "epoch": 4517} {"train_loss": -26.11216163635254, "global_step": 374989, "epoch": 4517} {"train_loss": -26.056720733642578, "global_step": 374990, "epoch": 4517} {"train_loss": -26.775238037109375, "global_step": 374991, "epoch": 4517} {"train_loss": -26.588911056518555, "global_step": 374992, "epoch": 4517} {"train_loss": -26.29372272721256, "global_step": 374993, "epoch": 4517, "val_loss": 6643771.0} {"train_loss": -26.365705490112305, "global_step": 374994, "epoch": 4518} {"train_loss": -25.069482803344727, "global_step": 374995, "epoch": 4518} {"train_loss": -25.61355972290039, "global_step": 374996, "epoch": 4518} {"train_loss": -26.285253524780273, "global_step": 374997, "epoch": 4518} {"train_loss": -25.812637329101562, "global_step": 374998, "epoch": 4518} {"train_loss": -26.195154190063477, "global_step": 374999, "epoch": 4518} {"train_loss": -25.9332275390625, "global_step": 375000, "epoch": 4518} {"train_loss": -25.981494903564453, "global_step": 375001, "epoch": 4518} {"train_loss": -26.05451774597168, "global_step": 375002, "epoch": 4518} {"train_loss": -25.795087814331055, "global_step": 375003, "epoch": 4518} {"train_loss": -25.82081413269043, "global_step": 375004, "epoch": 4518} {"train_loss": -26.23341178894043, "global_step": 375005, "epoch": 4518} {"train_loss": -26.197193145751953, "global_step": 375006, "epoch": 4518} {"train_loss": -26.002023696899414, "global_step": 375007, "epoch": 4518} {"train_loss": -25.967309951782227, "global_step": 375008, "epoch": 4518} {"train_loss": -25.88471794128418, "global_step": 375009, "epoch": 4518} {"train_loss": -26.1483211517334, "global_step": 375010, "epoch": 4518} {"train_loss": -26.188583374023438, "global_step": 375011, "epoch": 4518} {"train_loss": -26.336963653564453, "global_step": 375012, "epoch": 4518} {"train_loss": -26.170856475830078, "global_step": 375013, "epoch": 4518} {"train_loss": -26.30330467224121, "global_step": 375014, "epoch": 4518} {"train_loss": -26.427295684814453, "global_step": 375015, "epoch": 4518} {"train_loss": -26.390851974487305, "global_step": 375016, "epoch": 4518} {"train_loss": -26.13104248046875, "global_step": 375017, "epoch": 4518} {"train_loss": -26.2337646484375, "global_step": 375018, "epoch": 4518} {"train_loss": -26.033369064331055, "global_step": 375019, "epoch": 4518} {"train_loss": -26.359601974487305, "global_step": 375020, "epoch": 4518} {"train_loss": -25.724218368530273, "global_step": 375021, "epoch": 4518} {"train_loss": -26.17608642578125, "global_step": 375022, "epoch": 4518} {"train_loss": -26.43086051940918, "global_step": 375023, "epoch": 4518} {"train_loss": -26.537281036376953, "global_step": 375024, "epoch": 4518} {"train_loss": -26.85786247253418, "global_step": 375025, "epoch": 4518} {"train_loss": -26.743621826171875, "global_step": 375026, "epoch": 4518} {"train_loss": -26.5477294921875, "global_step": 375027, "epoch": 4518} {"train_loss": -26.114877700805664, "global_step": 375028, "epoch": 4518} {"train_loss": -26.16792106628418, "global_step": 375029, "epoch": 4518} {"train_loss": -26.72991943359375, "global_step": 375030, "epoch": 4518} {"train_loss": -26.343793869018555, "global_step": 375031, "epoch": 4518} {"train_loss": -26.370254516601562, "global_step": 375032, "epoch": 4518} {"train_loss": -26.113834381103516, "global_step": 375033, "epoch": 4518} {"train_loss": -25.915796279907227, "global_step": 375034, "epoch": 4518} {"train_loss": -26.337942123413086, "global_step": 375035, "epoch": 4518} {"train_loss": -26.50889015197754, "global_step": 375036, "epoch": 4518} {"train_loss": -26.53207778930664, "global_step": 375037, "epoch": 4518} {"train_loss": -25.6356201171875, "global_step": 375038, "epoch": 4518} {"train_loss": -25.219778060913086, "global_step": 375039, "epoch": 4518} {"train_loss": -25.546310424804688, "global_step": 375040, "epoch": 4518} {"train_loss": -26.8723087310791, "global_step": 375041, "epoch": 4518} {"train_loss": -25.7488956451416, "global_step": 375042, "epoch": 4518} {"train_loss": -25.847272872924805, "global_step": 375043, "epoch": 4518} {"train_loss": -26.215478897094727, "global_step": 375044, "epoch": 4518} {"train_loss": -25.15152359008789, "global_step": 375045, "epoch": 4518} {"train_loss": -25.938343048095703, "global_step": 375046, "epoch": 4518} {"train_loss": -26.131744384765625, "global_step": 375047, "epoch": 4518} {"train_loss": -26.217687606811523, "global_step": 375048, "epoch": 4518} {"train_loss": -26.472110748291016, "global_step": 375049, "epoch": 4518} {"train_loss": -25.9716796875, "global_step": 375050, "epoch": 4518} {"train_loss": -26.38226318359375, "global_step": 375051, "epoch": 4518} {"train_loss": -26.19538688659668, "global_step": 375052, "epoch": 4518} {"train_loss": -26.423736572265625, "global_step": 375053, "epoch": 4518} {"train_loss": -26.278173446655273, "global_step": 375054, "epoch": 4518} {"train_loss": -25.956787109375, "global_step": 375055, "epoch": 4518} {"train_loss": -26.149274826049805, "global_step": 375056, "epoch": 4518} {"train_loss": -26.105924606323242, "global_step": 375057, "epoch": 4518} {"train_loss": -26.271026611328125, "global_step": 375058, "epoch": 4518} {"train_loss": -26.219024658203125, "global_step": 375059, "epoch": 4518} {"train_loss": -26.657865524291992, "global_step": 375060, "epoch": 4518} {"train_loss": -26.400808334350586, "global_step": 375061, "epoch": 4518} {"train_loss": -26.705951690673828, "global_step": 375062, "epoch": 4518} {"train_loss": -26.351484298706055, "global_step": 375063, "epoch": 4518} {"train_loss": -26.369558334350586, "global_step": 375064, "epoch": 4518} {"train_loss": -26.705799102783203, "global_step": 375065, "epoch": 4518} {"train_loss": -26.3870849609375, "global_step": 375066, "epoch": 4518} {"train_loss": -26.646387100219727, "global_step": 375067, "epoch": 4518} {"train_loss": -26.71783447265625, "global_step": 375068, "epoch": 4518} {"train_loss": -26.16444206237793, "global_step": 375069, "epoch": 4518} {"train_loss": -26.36298942565918, "global_step": 375070, "epoch": 4518} {"train_loss": -26.171295166015625, "global_step": 375071, "epoch": 4518} {"train_loss": -26.38709831237793, "global_step": 375072, "epoch": 4518} {"train_loss": -26.574594497680664, "global_step": 375073, "epoch": 4518} {"train_loss": -26.548786163330078, "global_step": 375074, "epoch": 4518} {"train_loss": -26.3232421875, "global_step": 375075, "epoch": 4518} {"train_loss": -26.195573393120824, "global_step": 375076, "epoch": 4518, "val_loss": 6569041.5} {"train_loss": -26.267175674438477, "global_step": 375077, "epoch": 4519} {"train_loss": -26.017749786376953, "global_step": 375078, "epoch": 4519} {"train_loss": -26.61117935180664, "global_step": 375079, "epoch": 4519} {"train_loss": -26.05610466003418, "global_step": 375080, "epoch": 4519} {"train_loss": -26.25459098815918, "global_step": 375081, "epoch": 4519} {"train_loss": -26.16510009765625, "global_step": 375082, "epoch": 4519} {"train_loss": -26.002655029296875, "global_step": 375083, "epoch": 4519} {"train_loss": -26.037418365478516, "global_step": 375084, "epoch": 4519} {"train_loss": -26.43523597717285, "global_step": 375085, "epoch": 4519} {"train_loss": -26.534223556518555, "global_step": 375086, "epoch": 4519} {"train_loss": -26.335569381713867, "global_step": 375087, "epoch": 4519} {"train_loss": -26.648176193237305, "global_step": 375088, "epoch": 4519} {"train_loss": -26.357593536376953, "global_step": 375089, "epoch": 4519} {"train_loss": -26.660968780517578, "global_step": 375090, "epoch": 4519} {"train_loss": -26.408044815063477, "global_step": 375091, "epoch": 4519} {"train_loss": -26.22723388671875, "global_step": 375092, "epoch": 4519} {"train_loss": -26.75699806213379, "global_step": 375093, "epoch": 4519} {"train_loss": -26.3736629486084, "global_step": 375094, "epoch": 4519} {"train_loss": -26.410242080688477, "global_step": 375095, "epoch": 4519} {"train_loss": -26.458236694335938, "global_step": 375096, "epoch": 4519} {"train_loss": -26.728246688842773, "global_step": 375097, "epoch": 4519} {"train_loss": -26.14240074157715, "global_step": 375098, "epoch": 4519} {"train_loss": -26.562952041625977, "global_step": 375099, "epoch": 4519} {"train_loss": -26.618213653564453, "global_step": 375100, "epoch": 4519} {"train_loss": -26.545495986938477, "global_step": 375101, "epoch": 4519} {"train_loss": -26.320486068725586, "global_step": 375102, "epoch": 4519} {"train_loss": -26.558706283569336, "global_step": 375103, "epoch": 4519} {"train_loss": -26.706735610961914, "global_step": 375104, "epoch": 4519} {"train_loss": -26.423376083374023, "global_step": 375105, "epoch": 4519} {"train_loss": -26.34748649597168, "global_step": 375106, "epoch": 4519} {"train_loss": -25.905851364135742, "global_step": 375107, "epoch": 4519} {"train_loss": -26.035282135009766, "global_step": 375108, "epoch": 4519} {"train_loss": -25.72564125061035, "global_step": 375109, "epoch": 4519} {"train_loss": -26.13486671447754, "global_step": 375110, "epoch": 4519} {"train_loss": -26.68442153930664, "global_step": 375111, "epoch": 4519} {"train_loss": -26.2801513671875, "global_step": 375112, "epoch": 4519} {"train_loss": -26.3066463470459, "global_step": 375113, "epoch": 4519} {"train_loss": -26.774097442626953, "global_step": 375114, "epoch": 4519} {"train_loss": -26.065839767456055, "global_step": 375115, "epoch": 4519} {"train_loss": -26.5734806060791, "global_step": 375116, "epoch": 4519} {"train_loss": -26.130176544189453, "global_step": 375117, "epoch": 4519} {"train_loss": -26.659244537353516, "global_step": 375118, "epoch": 4519} {"train_loss": -26.432538986206055, "global_step": 375119, "epoch": 4519} {"train_loss": -25.865081787109375, "global_step": 375120, "epoch": 4519} {"train_loss": -26.774433135986328, "global_step": 375121, "epoch": 4519} {"train_loss": -26.325048446655273, "global_step": 375122, "epoch": 4519} {"train_loss": -26.04011344909668, "global_step": 375123, "epoch": 4519} {"train_loss": -25.952880859375, "global_step": 375124, "epoch": 4519} {"train_loss": -26.75140953063965, "global_step": 375125, "epoch": 4519} {"train_loss": -26.412494659423828, "global_step": 375126, "epoch": 4519} {"train_loss": -26.75813865661621, "global_step": 375127, "epoch": 4519} {"train_loss": -26.4573974609375, "global_step": 375128, "epoch": 4519} {"train_loss": -26.189788818359375, "global_step": 375129, "epoch": 4519} {"train_loss": -26.486103057861328, "global_step": 375130, "epoch": 4519} {"train_loss": -26.927265167236328, "global_step": 375131, "epoch": 4519} {"train_loss": -26.383337020874023, "global_step": 375132, "epoch": 4519} {"train_loss": -26.516193389892578, "global_step": 375133, "epoch": 4519} {"train_loss": -26.466278076171875, "global_step": 375134, "epoch": 4519} {"train_loss": -26.526716232299805, "global_step": 375135, "epoch": 4519} {"train_loss": -26.095502853393555, "global_step": 375136, "epoch": 4519} {"train_loss": -26.551435470581055, "global_step": 375137, "epoch": 4519} {"train_loss": -26.6132755279541, "global_step": 375138, "epoch": 4519} {"train_loss": -26.22492027282715, "global_step": 375139, "epoch": 4519} {"train_loss": -26.13495445251465, "global_step": 375140, "epoch": 4519} {"train_loss": -26.056507110595703, "global_step": 375141, "epoch": 4519} {"train_loss": -26.369495391845703, "global_step": 375142, "epoch": 4519} {"train_loss": -26.01331901550293, "global_step": 375143, "epoch": 4519} {"train_loss": -26.3359432220459, "global_step": 375144, "epoch": 4519} {"train_loss": -26.220050811767578, "global_step": 375145, "epoch": 4519} {"train_loss": -25.9549617767334, "global_step": 375146, "epoch": 4519} {"train_loss": -26.305042266845703, "global_step": 375147, "epoch": 4519} {"train_loss": -26.559240341186523, "global_step": 375148, "epoch": 4519} {"train_loss": -26.132333755493164, "global_step": 375149, "epoch": 4519} {"train_loss": -25.94038200378418, "global_step": 375150, "epoch": 4519} {"train_loss": -26.544092178344727, "global_step": 375151, "epoch": 4519} {"train_loss": -26.622034072875977, "global_step": 375152, "epoch": 4519} {"train_loss": -26.435529708862305, "global_step": 375153, "epoch": 4519} {"train_loss": -26.51984977722168, "global_step": 375154, "epoch": 4519} {"train_loss": -26.41322135925293, "global_step": 375155, "epoch": 4519} {"train_loss": -26.148151397705078, "global_step": 375156, "epoch": 4519} {"train_loss": -26.457685470581055, "global_step": 375157, "epoch": 4519} {"train_loss": -26.654977798461914, "global_step": 375158, "epoch": 4519} {"train_loss": -26.36886886228998, "global_step": 375159, "epoch": 4519, "val_loss": 6617351.5} {"train_loss": -26.098432540893555, "global_step": 375160, "epoch": 4520} {"train_loss": -25.500173568725586, "global_step": 375161, "epoch": 4520} {"train_loss": -25.76263427734375, "global_step": 375162, "epoch": 4520} {"train_loss": -26.017614364624023, "global_step": 375163, "epoch": 4520} {"train_loss": -25.485641479492188, "global_step": 375164, "epoch": 4520} {"train_loss": -25.49567413330078, "global_step": 375165, "epoch": 4520} {"train_loss": -26.103708267211914, "global_step": 375166, "epoch": 4520} {"train_loss": -25.73394775390625, "global_step": 375167, "epoch": 4520} {"train_loss": -25.892017364501953, "global_step": 375168, "epoch": 4520} {"train_loss": -25.672775268554688, "global_step": 375169, "epoch": 4520} {"train_loss": -25.997528076171875, "global_step": 375170, "epoch": 4520} {"train_loss": -25.800098419189453, "global_step": 375171, "epoch": 4520} {"train_loss": -26.158666610717773, "global_step": 375172, "epoch": 4520} {"train_loss": -25.975479125976562, "global_step": 375173, "epoch": 4520} {"train_loss": -26.1534423828125, "global_step": 375174, "epoch": 4520} {"train_loss": -26.52439308166504, "global_step": 375175, "epoch": 4520} {"train_loss": -26.386091232299805, "global_step": 375176, "epoch": 4520} {"train_loss": -25.975202560424805, "global_step": 375177, "epoch": 4520} {"train_loss": -26.128698348999023, "global_step": 375178, "epoch": 4520} {"train_loss": -26.216489791870117, "global_step": 375179, "epoch": 4520} {"train_loss": -26.149621963500977, "global_step": 375180, "epoch": 4520} {"train_loss": -26.2889347076416, "global_step": 375181, "epoch": 4520} {"train_loss": -26.359058380126953, "global_step": 375182, "epoch": 4520} {"train_loss": -26.15886878967285, "global_step": 375183, "epoch": 4520} {"train_loss": -26.23728370666504, "global_step": 375184, "epoch": 4520} {"train_loss": -26.225238800048828, "global_step": 375185, "epoch": 4520} {"train_loss": -26.347217559814453, "global_step": 375186, "epoch": 4520} {"train_loss": -26.167383193969727, "global_step": 375187, "epoch": 4520} {"train_loss": -26.481287002563477, "global_step": 375188, "epoch": 4520} {"train_loss": -26.276403427124023, "global_step": 375189, "epoch": 4520} {"train_loss": -26.34296226501465, "global_step": 375190, "epoch": 4520} {"train_loss": -26.70870018005371, "global_step": 375191, "epoch": 4520} {"train_loss": -26.680530548095703, "global_step": 375192, "epoch": 4520} {"train_loss": -26.23076820373535, "global_step": 375193, "epoch": 4520} {"train_loss": -26.18732261657715, "global_step": 375194, "epoch": 4520} {"train_loss": -26.388879776000977, "global_step": 375195, "epoch": 4520} {"train_loss": -26.527002334594727, "global_step": 375196, "epoch": 4520} {"train_loss": -26.32197380065918, "global_step": 375197, "epoch": 4520} {"train_loss": -26.059982299804688, "global_step": 375198, "epoch": 4520} {"train_loss": -26.445165634155273, "global_step": 375199, "epoch": 4520} {"train_loss": -26.525609970092773, "global_step": 375200, "epoch": 4520} {"train_loss": -26.262235641479492, "global_step": 375201, "epoch": 4520} {"train_loss": -26.374902725219727, "global_step": 375202, "epoch": 4520} {"train_loss": -26.570819854736328, "global_step": 375203, "epoch": 4520} {"train_loss": -26.703771591186523, "global_step": 375204, "epoch": 4520} {"train_loss": -26.614898681640625, "global_step": 375205, "epoch": 4520} {"train_loss": -26.60593032836914, "global_step": 375206, "epoch": 4520} {"train_loss": -26.34235191345215, "global_step": 375207, "epoch": 4520} {"train_loss": -26.472070693969727, "global_step": 375208, "epoch": 4520} {"train_loss": -26.46396255493164, "global_step": 375209, "epoch": 4520} {"train_loss": -26.414831161499023, "global_step": 375210, "epoch": 4520} {"train_loss": -26.25520133972168, "global_step": 375211, "epoch": 4520} {"train_loss": -26.57562255859375, "global_step": 375212, "epoch": 4520} {"train_loss": -26.463598251342773, "global_step": 375213, "epoch": 4520} {"train_loss": -26.220251083374023, "global_step": 375214, "epoch": 4520} {"train_loss": -26.344968795776367, "global_step": 375215, "epoch": 4520} {"train_loss": -26.051395416259766, "global_step": 375216, "epoch": 4520} {"train_loss": -26.10487937927246, "global_step": 375217, "epoch": 4520} {"train_loss": -26.314990997314453, "global_step": 375218, "epoch": 4520} {"train_loss": -26.293054580688477, "global_step": 375219, "epoch": 4520} {"train_loss": -26.133193969726562, "global_step": 375220, "epoch": 4520} {"train_loss": -26.21428871154785, "global_step": 375221, "epoch": 4520} {"train_loss": -26.6159610748291, "global_step": 375222, "epoch": 4520} {"train_loss": -26.147932052612305, "global_step": 375223, "epoch": 4520} {"train_loss": -26.514707565307617, "global_step": 375224, "epoch": 4520} {"train_loss": -26.056650161743164, "global_step": 375225, "epoch": 4520} {"train_loss": -25.648157119750977, "global_step": 375226, "epoch": 4520} {"train_loss": -25.509361267089844, "global_step": 375227, "epoch": 4520} {"train_loss": -25.904815673828125, "global_step": 375228, "epoch": 4520} {"train_loss": -26.0830078125, "global_step": 375229, "epoch": 4520} {"train_loss": -26.51123046875, "global_step": 375230, "epoch": 4520} {"train_loss": -26.275304794311523, "global_step": 375231, "epoch": 4520} {"train_loss": -26.18505859375, "global_step": 375232, "epoch": 4520} {"train_loss": -26.36054801940918, "global_step": 375233, "epoch": 4520} {"train_loss": -26.46003532409668, "global_step": 375234, "epoch": 4520} {"train_loss": -26.196882247924805, "global_step": 375235, "epoch": 4520} {"train_loss": -26.16977882385254, "global_step": 375236, "epoch": 4520} {"train_loss": -26.493701934814453, "global_step": 375237, "epoch": 4520} {"train_loss": -26.23762321472168, "global_step": 375238, "epoch": 4520} {"train_loss": -26.44895362854004, "global_step": 375239, "epoch": 4520} {"train_loss": -26.585798263549805, "global_step": 375240, "epoch": 4520} {"train_loss": -26.50318717956543, "global_step": 375241, "epoch": 4520} {"train_loss": -26.241278177284332, "global_step": 375242, "epoch": 4520, "val_loss": 6631050.5} {"train_loss": -26.049610137939453, "global_step": 375243, "epoch": 4521} {"train_loss": -25.874719619750977, "global_step": 375244, "epoch": 4521} {"train_loss": -26.17840576171875, "global_step": 375245, "epoch": 4521} {"train_loss": -26.484304428100586, "global_step": 375246, "epoch": 4521} {"train_loss": -26.095483779907227, "global_step": 375247, "epoch": 4521} {"train_loss": -26.181732177734375, "global_step": 375248, "epoch": 4521} {"train_loss": -26.20123863220215, "global_step": 375249, "epoch": 4521} {"train_loss": -26.128759384155273, "global_step": 375250, "epoch": 4521} {"train_loss": -26.328466415405273, "global_step": 375251, "epoch": 4521} {"train_loss": -26.37723159790039, "global_step": 375252, "epoch": 4521} {"train_loss": -26.18482780456543, "global_step": 375253, "epoch": 4521} {"train_loss": -26.16035270690918, "global_step": 375254, "epoch": 4521} {"train_loss": -26.209461212158203, "global_step": 375255, "epoch": 4521} {"train_loss": -26.549396514892578, "global_step": 375256, "epoch": 4521} {"train_loss": -26.42719841003418, "global_step": 375257, "epoch": 4521} {"train_loss": -26.4476261138916, "global_step": 375258, "epoch": 4521} {"train_loss": -26.67909049987793, "global_step": 375259, "epoch": 4521} {"train_loss": -26.46882438659668, "global_step": 375260, "epoch": 4521} {"train_loss": -26.460254669189453, "global_step": 375261, "epoch": 4521} {"train_loss": -26.491987228393555, "global_step": 375262, "epoch": 4521} {"train_loss": -26.024816513061523, "global_step": 375263, "epoch": 4521} {"train_loss": -26.642953872680664, "global_step": 375264, "epoch": 4521} {"train_loss": -26.792978286743164, "global_step": 375265, "epoch": 4521} {"train_loss": -26.269485473632812, "global_step": 375266, "epoch": 4521} {"train_loss": -26.44073486328125, "global_step": 375267, "epoch": 4521} {"train_loss": -26.427289962768555, "global_step": 375268, "epoch": 4521} {"train_loss": -26.372961044311523, "global_step": 375269, "epoch": 4521} {"train_loss": -26.54631996154785, "global_step": 375270, "epoch": 4521} {"train_loss": -26.605661392211914, "global_step": 375271, "epoch": 4521} {"train_loss": -26.411535263061523, "global_step": 375272, "epoch": 4521} {"train_loss": -26.220596313476562, "global_step": 375273, "epoch": 4521} {"train_loss": -26.763519287109375, "global_step": 375274, "epoch": 4521} {"train_loss": -26.5856876373291, "global_step": 375275, "epoch": 4521} {"train_loss": -26.737451553344727, "global_step": 375276, "epoch": 4521} {"train_loss": -26.36872673034668, "global_step": 375277, "epoch": 4521} {"train_loss": -26.435504913330078, "global_step": 375278, "epoch": 4521} {"train_loss": -26.519643783569336, "global_step": 375279, "epoch": 4521} {"train_loss": -26.463224411010742, "global_step": 375280, "epoch": 4521} {"train_loss": -26.40851402282715, "global_step": 375281, "epoch": 4521} {"train_loss": -26.51702880859375, "global_step": 375282, "epoch": 4521} {"train_loss": -26.1306095123291, "global_step": 375283, "epoch": 4521} {"train_loss": -26.890905380249023, "global_step": 375284, "epoch": 4521} {"train_loss": -26.10860252380371, "global_step": 375285, "epoch": 4521} {"train_loss": -26.130578994750977, "global_step": 375286, "epoch": 4521} {"train_loss": -26.815099716186523, "global_step": 375287, "epoch": 4521} {"train_loss": -26.588727951049805, "global_step": 375288, "epoch": 4521} {"train_loss": -26.13336753845215, "global_step": 375289, "epoch": 4521} {"train_loss": -26.259387969970703, "global_step": 375290, "epoch": 4521} {"train_loss": -26.471967697143555, "global_step": 375291, "epoch": 4521} {"train_loss": -26.468048095703125, "global_step": 375292, "epoch": 4521} {"train_loss": -26.798437118530273, "global_step": 375293, "epoch": 4521} {"train_loss": -26.245065689086914, "global_step": 375294, "epoch": 4521} {"train_loss": -26.6531925201416, "global_step": 375295, "epoch": 4521} {"train_loss": -26.141036987304688, "global_step": 375296, "epoch": 4521} {"train_loss": -26.23042869567871, "global_step": 375297, "epoch": 4521} {"train_loss": -26.64394187927246, "global_step": 375298, "epoch": 4521} {"train_loss": -26.04072380065918, "global_step": 375299, "epoch": 4521} {"train_loss": -26.053335189819336, "global_step": 375300, "epoch": 4521} {"train_loss": -25.7025089263916, "global_step": 375301, "epoch": 4521} {"train_loss": -26.016775131225586, "global_step": 375302, "epoch": 4521} {"train_loss": -26.462711334228516, "global_step": 375303, "epoch": 4521} {"train_loss": -26.0956974029541, "global_step": 375304, "epoch": 4521} {"train_loss": -26.325483322143555, "global_step": 375305, "epoch": 4521} {"train_loss": -26.341144561767578, "global_step": 375306, "epoch": 4521} {"train_loss": -26.521371841430664, "global_step": 375307, "epoch": 4521} {"train_loss": -25.934762954711914, "global_step": 375308, "epoch": 4521} {"train_loss": -26.29143714904785, "global_step": 375309, "epoch": 4521} {"train_loss": -26.2551212310791, "global_step": 375310, "epoch": 4521} {"train_loss": -26.228513717651367, "global_step": 375311, "epoch": 4521} {"train_loss": -26.0367374420166, "global_step": 375312, "epoch": 4521} {"train_loss": -26.22706413269043, "global_step": 375313, "epoch": 4521} {"train_loss": -26.27533531188965, "global_step": 375314, "epoch": 4521} {"train_loss": -26.348745346069336, "global_step": 375315, "epoch": 4521} {"train_loss": -26.056732177734375, "global_step": 375316, "epoch": 4521} {"train_loss": -26.488080978393555, "global_step": 375317, "epoch": 4521} {"train_loss": -26.499433517456055, "global_step": 375318, "epoch": 4521} {"train_loss": -26.19736671447754, "global_step": 375319, "epoch": 4521} {"train_loss": -26.48648452758789, "global_step": 375320, "epoch": 4521} {"train_loss": -26.397146224975586, "global_step": 375321, "epoch": 4521} {"train_loss": -26.548294067382812, "global_step": 375322, "epoch": 4521} {"train_loss": -26.47724723815918, "global_step": 375323, "epoch": 4521} {"train_loss": -26.52836036682129, "global_step": 375324, "epoch": 4521} {"train_loss": -26.358822167637836, "global_step": 375325, "epoch": 4521, "val_loss": 6703443.0} {"train_loss": -25.14301300048828, "global_step": 375326, "epoch": 4522} {"train_loss": -26.603302001953125, "global_step": 375327, "epoch": 4522} {"train_loss": -25.553897857666016, "global_step": 375328, "epoch": 4522} {"train_loss": -25.919219970703125, "global_step": 375329, "epoch": 4522} {"train_loss": -26.037372589111328, "global_step": 375330, "epoch": 4522} {"train_loss": -25.7602481842041, "global_step": 375331, "epoch": 4522} {"train_loss": -26.515424728393555, "global_step": 375332, "epoch": 4522} {"train_loss": -25.67972183227539, "global_step": 375333, "epoch": 4522} {"train_loss": -26.231359481811523, "global_step": 375334, "epoch": 4522} {"train_loss": -26.23113441467285, "global_step": 375335, "epoch": 4522} {"train_loss": -26.034671783447266, "global_step": 375336, "epoch": 4522} {"train_loss": -26.10120964050293, "global_step": 375337, "epoch": 4522} {"train_loss": -26.2440128326416, "global_step": 375338, "epoch": 4522} {"train_loss": -26.14813232421875, "global_step": 375339, "epoch": 4522} {"train_loss": -26.187768936157227, "global_step": 375340, "epoch": 4522} {"train_loss": -26.073957443237305, "global_step": 375341, "epoch": 4522} {"train_loss": -26.26790428161621, "global_step": 375342, "epoch": 4522} {"train_loss": -26.371816635131836, "global_step": 375343, "epoch": 4522} {"train_loss": -26.660383224487305, "global_step": 375344, "epoch": 4522} {"train_loss": -26.197370529174805, "global_step": 375345, "epoch": 4522} {"train_loss": -26.352521896362305, "global_step": 375346, "epoch": 4522} {"train_loss": -26.414459228515625, "global_step": 375347, "epoch": 4522} {"train_loss": -26.359312057495117, "global_step": 375348, "epoch": 4522} {"train_loss": -26.545129776000977, "global_step": 375349, "epoch": 4522} {"train_loss": -26.73146629333496, "global_step": 375350, "epoch": 4522} {"train_loss": -26.3383846282959, "global_step": 375351, "epoch": 4522} {"train_loss": -26.239063262939453, "global_step": 375352, "epoch": 4522} {"train_loss": -26.328125, "global_step": 375353, "epoch": 4522} {"train_loss": -26.170734405517578, "global_step": 375354, "epoch": 4522} {"train_loss": -26.050048828125, "global_step": 375355, "epoch": 4522} {"train_loss": -26.482152938842773, "global_step": 375356, "epoch": 4522} {"train_loss": -26.603864669799805, "global_step": 375357, "epoch": 4522} {"train_loss": -26.5477237701416, "global_step": 375358, "epoch": 4522} {"train_loss": -26.316974639892578, "global_step": 375359, "epoch": 4522} {"train_loss": -26.435110092163086, "global_step": 375360, "epoch": 4522} {"train_loss": -26.52808952331543, "global_step": 375361, "epoch": 4522} {"train_loss": -26.593496322631836, "global_step": 375362, "epoch": 4522} {"train_loss": -26.4232177734375, "global_step": 375363, "epoch": 4522} {"train_loss": -25.90643310546875, "global_step": 375364, "epoch": 4522} {"train_loss": -26.45220375061035, "global_step": 375365, "epoch": 4522} {"train_loss": -26.604291915893555, "global_step": 375366, "epoch": 4522} {"train_loss": -26.38922691345215, "global_step": 375367, "epoch": 4522} {"train_loss": -26.2325439453125, "global_step": 375368, "epoch": 4522} {"train_loss": -26.86224937438965, "global_step": 375369, "epoch": 4522} {"train_loss": -26.488876342773438, "global_step": 375370, "epoch": 4522} {"train_loss": -26.265378952026367, "global_step": 375371, "epoch": 4522} {"train_loss": -26.52951431274414, "global_step": 375372, "epoch": 4522} {"train_loss": -26.16641616821289, "global_step": 375373, "epoch": 4522} {"train_loss": -26.600217819213867, "global_step": 375374, "epoch": 4522} {"train_loss": -26.312686920166016, "global_step": 375375, "epoch": 4522} {"train_loss": -25.960966110229492, "global_step": 375376, "epoch": 4522} {"train_loss": -26.304426193237305, "global_step": 375377, "epoch": 4522} {"train_loss": -26.114831924438477, "global_step": 375378, "epoch": 4522} {"train_loss": -26.211286544799805, "global_step": 375379, "epoch": 4522} {"train_loss": -26.273853302001953, "global_step": 375380, "epoch": 4522} {"train_loss": -26.1412296295166, "global_step": 375381, "epoch": 4522} {"train_loss": -26.493356704711914, "global_step": 375382, "epoch": 4522} {"train_loss": -25.974506378173828, "global_step": 375383, "epoch": 4522} {"train_loss": -26.516651153564453, "global_step": 375384, "epoch": 4522} {"train_loss": -26.45355796813965, "global_step": 375385, "epoch": 4522} {"train_loss": -26.457311630249023, "global_step": 375386, "epoch": 4522} {"train_loss": -26.36113929748535, "global_step": 375387, "epoch": 4522} {"train_loss": -26.7890625, "global_step": 375388, "epoch": 4522} {"train_loss": -26.128759384155273, "global_step": 375389, "epoch": 4522} {"train_loss": -26.605863571166992, "global_step": 375390, "epoch": 4522} {"train_loss": -26.359159469604492, "global_step": 375391, "epoch": 4522} {"train_loss": -26.610944747924805, "global_step": 375392, "epoch": 4522} {"train_loss": -26.43964195251465, "global_step": 375393, "epoch": 4522} {"train_loss": -26.362579345703125, "global_step": 375394, "epoch": 4522} {"train_loss": -26.387388229370117, "global_step": 375395, "epoch": 4522} {"train_loss": -26.802982330322266, "global_step": 375396, "epoch": 4522} {"train_loss": -26.81752586364746, "global_step": 375397, "epoch": 4522} {"train_loss": -26.498167037963867, "global_step": 375398, "epoch": 4522} {"train_loss": -26.515655517578125, "global_step": 375399, "epoch": 4522} {"train_loss": -26.87774658203125, "global_step": 375400, "epoch": 4522} {"train_loss": -26.272109985351562, "global_step": 375401, "epoch": 4522} {"train_loss": -26.72842788696289, "global_step": 375402, "epoch": 4522} {"train_loss": -26.32010269165039, "global_step": 375403, "epoch": 4522} {"train_loss": -27.097442626953125, "global_step": 375404, "epoch": 4522} {"train_loss": -26.233301162719727, "global_step": 375405, "epoch": 4522} {"train_loss": -26.873992919921875, "global_step": 375406, "epoch": 4522} {"train_loss": -26.620351791381836, "global_step": 375407, "epoch": 4522} {"train_loss": -26.350270811333715, "global_step": 375408, "epoch": 4522, "val_loss": 6580939.0} {"train_loss": -25.739282608032227, "global_step": 375409, "epoch": 4523} {"train_loss": -26.068517684936523, "global_step": 375410, "epoch": 4523} {"train_loss": -26.085248947143555, "global_step": 375411, "epoch": 4523} {"train_loss": -26.19144630432129, "global_step": 375412, "epoch": 4523} {"train_loss": -25.996356964111328, "global_step": 375413, "epoch": 4523} {"train_loss": -26.36138343811035, "global_step": 375414, "epoch": 4523} {"train_loss": -25.902973175048828, "global_step": 375415, "epoch": 4523} {"train_loss": -26.077314376831055, "global_step": 375416, "epoch": 4523} {"train_loss": -25.9306640625, "global_step": 375417, "epoch": 4523} {"train_loss": -26.287626266479492, "global_step": 375418, "epoch": 4523} {"train_loss": -26.283578872680664, "global_step": 375419, "epoch": 4523} {"train_loss": -25.659656524658203, "global_step": 375420, "epoch": 4523} {"train_loss": -25.207944869995117, "global_step": 375421, "epoch": 4523} {"train_loss": -26.228479385375977, "global_step": 375422, "epoch": 4523} {"train_loss": -26.202590942382812, "global_step": 375423, "epoch": 4523} {"train_loss": -25.7425479888916, "global_step": 375424, "epoch": 4523} {"train_loss": -25.871341705322266, "global_step": 375425, "epoch": 4523} {"train_loss": -26.354145050048828, "global_step": 375426, "epoch": 4523} {"train_loss": -25.562040328979492, "global_step": 375427, "epoch": 4523} {"train_loss": -26.13062858581543, "global_step": 375428, "epoch": 4523} {"train_loss": -26.00732421875, "global_step": 375429, "epoch": 4523} {"train_loss": -25.914337158203125, "global_step": 375430, "epoch": 4523} {"train_loss": -26.136341094970703, "global_step": 375431, "epoch": 4523} {"train_loss": -26.341541290283203, "global_step": 375432, "epoch": 4523} {"train_loss": -26.340564727783203, "global_step": 375433, "epoch": 4523} {"train_loss": -26.13446617126465, "global_step": 375434, "epoch": 4523} {"train_loss": -26.081256866455078, "global_step": 375435, "epoch": 4523} {"train_loss": -26.0809383392334, "global_step": 375436, "epoch": 4523} {"train_loss": -26.376312255859375, "global_step": 375437, "epoch": 4523} {"train_loss": -26.282567977905273, "global_step": 375438, "epoch": 4523} {"train_loss": -26.152801513671875, "global_step": 375439, "epoch": 4523} {"train_loss": -26.499042510986328, "global_step": 375440, "epoch": 4523} {"train_loss": -26.097126007080078, "global_step": 375441, "epoch": 4523} {"train_loss": -26.500919342041016, "global_step": 375442, "epoch": 4523} {"train_loss": -26.5155086517334, "global_step": 375443, "epoch": 4523} {"train_loss": -26.325183868408203, "global_step": 375444, "epoch": 4523} {"train_loss": -26.29645347595215, "global_step": 375445, "epoch": 4523} {"train_loss": -26.10426139831543, "global_step": 375446, "epoch": 4523} {"train_loss": -26.45819664001465, "global_step": 375447, "epoch": 4523} {"train_loss": -26.892072677612305, "global_step": 375448, "epoch": 4523} {"train_loss": -26.21967887878418, "global_step": 375449, "epoch": 4523} {"train_loss": -26.4434757232666, "global_step": 375450, "epoch": 4523} {"train_loss": -26.710599899291992, "global_step": 375451, "epoch": 4523} {"train_loss": -26.29204750061035, "global_step": 375452, "epoch": 4523} {"train_loss": -26.602283477783203, "global_step": 375453, "epoch": 4523} {"train_loss": -26.456754684448242, "global_step": 375454, "epoch": 4523} {"train_loss": -26.379728317260742, "global_step": 375455, "epoch": 4523} {"train_loss": -26.298791885375977, "global_step": 375456, "epoch": 4523} {"train_loss": -26.406818389892578, "global_step": 375457, "epoch": 4523} {"train_loss": -26.325613021850586, "global_step": 375458, "epoch": 4523} {"train_loss": -26.468603134155273, "global_step": 375459, "epoch": 4523} {"train_loss": -26.272907257080078, "global_step": 375460, "epoch": 4523} {"train_loss": -26.14227867126465, "global_step": 375461, "epoch": 4523} {"train_loss": -26.51189613342285, "global_step": 375462, "epoch": 4523} {"train_loss": -26.28862953186035, "global_step": 375463, "epoch": 4523} {"train_loss": -26.59686851501465, "global_step": 375464, "epoch": 4523} {"train_loss": -26.409082412719727, "global_step": 375465, "epoch": 4523} {"train_loss": -26.450550079345703, "global_step": 375466, "epoch": 4523} {"train_loss": -26.280851364135742, "global_step": 375467, "epoch": 4523} {"train_loss": -26.7867431640625, "global_step": 375468, "epoch": 4523} {"train_loss": -26.486108779907227, "global_step": 375469, "epoch": 4523} {"train_loss": -26.788227081298828, "global_step": 375470, "epoch": 4523} {"train_loss": -26.49456214904785, "global_step": 375471, "epoch": 4523} {"train_loss": -26.321308135986328, "global_step": 375472, "epoch": 4523} {"train_loss": -26.50274085998535, "global_step": 375473, "epoch": 4523} {"train_loss": -26.462873458862305, "global_step": 375474, "epoch": 4523} {"train_loss": -26.84553337097168, "global_step": 375475, "epoch": 4523} {"train_loss": -26.666095733642578, "global_step": 375476, "epoch": 4523} {"train_loss": -26.78702735900879, "global_step": 375477, "epoch": 4523} {"train_loss": -26.64645767211914, "global_step": 375478, "epoch": 4523} {"train_loss": -26.49770164489746, "global_step": 375479, "epoch": 4523} {"train_loss": -26.983808517456055, "global_step": 375480, "epoch": 4523} {"train_loss": -26.579898834228516, "global_step": 375481, "epoch": 4523} {"train_loss": -26.680896759033203, "global_step": 375482, "epoch": 4523} {"train_loss": -26.5162353515625, "global_step": 375483, "epoch": 4523} {"train_loss": -26.904239654541016, "global_step": 375484, "epoch": 4523} {"train_loss": -27.048837661743164, "global_step": 375485, "epoch": 4523} {"train_loss": -26.778533935546875, "global_step": 375486, "epoch": 4523} {"train_loss": -26.620563507080078, "global_step": 375487, "epoch": 4523} {"train_loss": -26.648273468017578, "global_step": 375488, "epoch": 4523} {"train_loss": -26.212549209594727, "global_step": 375489, "epoch": 4523} {"train_loss": -26.02444839477539, "global_step": 375490, "epoch": 4523} {"train_loss": -26.334575744996588, "global_step": 375491, "epoch": 4523, "val_loss": 6644910.0} {"train_loss": -25.705907821655273, "global_step": 375492, "epoch": 4524} {"train_loss": -25.62761878967285, "global_step": 375493, "epoch": 4524} {"train_loss": -25.826929092407227, "global_step": 375494, "epoch": 4524} {"train_loss": -25.64143943786621, "global_step": 375495, "epoch": 4524} {"train_loss": -26.445072174072266, "global_step": 375496, "epoch": 4524} {"train_loss": -25.196653366088867, "global_step": 375497, "epoch": 4524} {"train_loss": -25.58072280883789, "global_step": 375498, "epoch": 4524} {"train_loss": -25.90940284729004, "global_step": 375499, "epoch": 4524} {"train_loss": -25.957962036132812, "global_step": 375500, "epoch": 4524} {"train_loss": -26.008153915405273, "global_step": 375501, "epoch": 4524} {"train_loss": -25.61333656311035, "global_step": 375502, "epoch": 4524} {"train_loss": -25.276382446289062, "global_step": 375503, "epoch": 4524} {"train_loss": -25.758771896362305, "global_step": 375504, "epoch": 4524} {"train_loss": -26.02935791015625, "global_step": 375505, "epoch": 4524} {"train_loss": -25.592140197753906, "global_step": 375506, "epoch": 4524} {"train_loss": -25.937042236328125, "global_step": 375507, "epoch": 4524} {"train_loss": -25.548503875732422, "global_step": 375508, "epoch": 4524} {"train_loss": -25.915430068969727, "global_step": 375509, "epoch": 4524} {"train_loss": -25.9066162109375, "global_step": 375510, "epoch": 4524} {"train_loss": -25.8055419921875, "global_step": 375511, "epoch": 4524} {"train_loss": -26.160114288330078, "global_step": 375512, "epoch": 4524} {"train_loss": -26.084543228149414, "global_step": 375513, "epoch": 4524} {"train_loss": -26.52918815612793, "global_step": 375514, "epoch": 4524} {"train_loss": -25.62175941467285, "global_step": 375515, "epoch": 4524} {"train_loss": -26.16839027404785, "global_step": 375516, "epoch": 4524} {"train_loss": -25.839223861694336, "global_step": 375517, "epoch": 4524} {"train_loss": -26.089033126831055, "global_step": 375518, "epoch": 4524} {"train_loss": -26.147846221923828, "global_step": 375519, "epoch": 4524} {"train_loss": -26.075544357299805, "global_step": 375520, "epoch": 4524} {"train_loss": -26.47572135925293, "global_step": 375521, "epoch": 4524} {"train_loss": -26.456079483032227, "global_step": 375522, "epoch": 4524} {"train_loss": -26.517141342163086, "global_step": 375523, "epoch": 4524} {"train_loss": -26.297260284423828, "global_step": 375524, "epoch": 4524} {"train_loss": -26.292871475219727, "global_step": 375525, "epoch": 4524} {"train_loss": -26.252302169799805, "global_step": 375526, "epoch": 4524} {"train_loss": -26.05824089050293, "global_step": 375527, "epoch": 4524} {"train_loss": -25.998432159423828, "global_step": 375528, "epoch": 4524} {"train_loss": -26.401010513305664, "global_step": 375529, "epoch": 4524} {"train_loss": -26.718109130859375, "global_step": 375530, "epoch": 4524} {"train_loss": -26.2529239654541, "global_step": 375531, "epoch": 4524} {"train_loss": -26.5899715423584, "global_step": 375532, "epoch": 4524} {"train_loss": -26.441038131713867, "global_step": 375533, "epoch": 4524} {"train_loss": -26.385717391967773, "global_step": 375534, "epoch": 4524} {"train_loss": -26.39007568359375, "global_step": 375535, "epoch": 4524} {"train_loss": -26.637094497680664, "global_step": 375536, "epoch": 4524} {"train_loss": -26.495132446289062, "global_step": 375537, "epoch": 4524} {"train_loss": -26.485015869140625, "global_step": 375538, "epoch": 4524} {"train_loss": -26.900678634643555, "global_step": 375539, "epoch": 4524} {"train_loss": -26.504322052001953, "global_step": 375540, "epoch": 4524} {"train_loss": -26.56890869140625, "global_step": 375541, "epoch": 4524} {"train_loss": -26.74799919128418, "global_step": 375542, "epoch": 4524} {"train_loss": -26.5179386138916, "global_step": 375543, "epoch": 4524} {"train_loss": -26.303510665893555, "global_step": 375544, "epoch": 4524} {"train_loss": -27.035537719726562, "global_step": 375545, "epoch": 4524} {"train_loss": -26.382028579711914, "global_step": 375546, "epoch": 4524} {"train_loss": -26.597864151000977, "global_step": 375547, "epoch": 4524} {"train_loss": -26.46013832092285, "global_step": 375548, "epoch": 4524} {"train_loss": -26.76373863220215, "global_step": 375549, "epoch": 4524} {"train_loss": -26.82411766052246, "global_step": 375550, "epoch": 4524} {"train_loss": -26.450082778930664, "global_step": 375551, "epoch": 4524} {"train_loss": -26.571826934814453, "global_step": 375552, "epoch": 4524} {"train_loss": -26.224058151245117, "global_step": 375553, "epoch": 4524} {"train_loss": -26.459918975830078, "global_step": 375554, "epoch": 4524} {"train_loss": -26.561071395874023, "global_step": 375555, "epoch": 4524} {"train_loss": -26.35906982421875, "global_step": 375556, "epoch": 4524} {"train_loss": -26.786914825439453, "global_step": 375557, "epoch": 4524} {"train_loss": -26.185422897338867, "global_step": 375558, "epoch": 4524} {"train_loss": -26.01728630065918, "global_step": 375559, "epoch": 4524} {"train_loss": -26.25579833984375, "global_step": 375560, "epoch": 4524} {"train_loss": -26.35084342956543, "global_step": 375561, "epoch": 4524} {"train_loss": -26.70807456970215, "global_step": 375562, "epoch": 4524} {"train_loss": -26.221057891845703, "global_step": 375563, "epoch": 4524} {"train_loss": -25.923933029174805, "global_step": 375564, "epoch": 4524} {"train_loss": -26.5899600982666, "global_step": 375565, "epoch": 4524} {"train_loss": -26.495227813720703, "global_step": 375566, "epoch": 4524} {"train_loss": -26.19003677368164, "global_step": 375567, "epoch": 4524} {"train_loss": -26.22999382019043, "global_step": 375568, "epoch": 4524} {"train_loss": -25.560623168945312, "global_step": 375569, "epoch": 4524} {"train_loss": -26.47511100769043, "global_step": 375570, "epoch": 4524} {"train_loss": -25.854053497314453, "global_step": 375571, "epoch": 4524} {"train_loss": -25.964059829711914, "global_step": 375572, "epoch": 4524} {"train_loss": -26.527912139892578, "global_step": 375573, "epoch": 4524} {"train_loss": -26.2228969436094, "global_step": 375574, "epoch": 4524, "val_loss": 6577279.0} {"train_loss": -24.390918731689453, "global_step": 375575, "epoch": 4525} {"train_loss": -24.33827018737793, "global_step": 375576, "epoch": 4525} {"train_loss": -25.043106079101562, "global_step": 375577, "epoch": 4525} {"train_loss": -24.73102569580078, "global_step": 375578, "epoch": 4525} {"train_loss": -25.44289207458496, "global_step": 375579, "epoch": 4525} {"train_loss": -25.297531127929688, "global_step": 375580, "epoch": 4525} {"train_loss": -25.389301300048828, "global_step": 375581, "epoch": 4525} {"train_loss": -25.421796798706055, "global_step": 375582, "epoch": 4525} {"train_loss": -25.356897354125977, "global_step": 375583, "epoch": 4525} {"train_loss": -25.80586051940918, "global_step": 375584, "epoch": 4525} {"train_loss": -25.891845703125, "global_step": 375585, "epoch": 4525} {"train_loss": -25.62526512145996, "global_step": 375586, "epoch": 4525} {"train_loss": -25.944995880126953, "global_step": 375587, "epoch": 4525} {"train_loss": -25.920883178710938, "global_step": 375588, "epoch": 4525} {"train_loss": -25.71744728088379, "global_step": 375589, "epoch": 4525} {"train_loss": -25.850473403930664, "global_step": 375590, "epoch": 4525} {"train_loss": -25.830474853515625, "global_step": 375591, "epoch": 4525} {"train_loss": -26.059995651245117, "global_step": 375592, "epoch": 4525} {"train_loss": -25.797143936157227, "global_step": 375593, "epoch": 4525} {"train_loss": -26.1107177734375, "global_step": 375594, "epoch": 4525} {"train_loss": -26.208425521850586, "global_step": 375595, "epoch": 4525} {"train_loss": -25.875043869018555, "global_step": 375596, "epoch": 4525} {"train_loss": -26.283645629882812, "global_step": 375597, "epoch": 4525} {"train_loss": -26.1002254486084, "global_step": 375598, "epoch": 4525} {"train_loss": -26.164941787719727, "global_step": 375599, "epoch": 4525} {"train_loss": -26.030487060546875, "global_step": 375600, "epoch": 4525} {"train_loss": -26.175756454467773, "global_step": 375601, "epoch": 4525} {"train_loss": -26.428327560424805, "global_step": 375602, "epoch": 4525} {"train_loss": -25.797500610351562, "global_step": 375603, "epoch": 4525} {"train_loss": -26.2808780670166, "global_step": 375604, "epoch": 4525} {"train_loss": -26.08576774597168, "global_step": 375605, "epoch": 4525} {"train_loss": -26.352264404296875, "global_step": 375606, "epoch": 4525} {"train_loss": -26.21527671813965, "global_step": 375607, "epoch": 4525} {"train_loss": -26.381498336791992, "global_step": 375608, "epoch": 4525} {"train_loss": -26.095062255859375, "global_step": 375609, "epoch": 4525} {"train_loss": -26.25152015686035, "global_step": 375610, "epoch": 4525} {"train_loss": -26.525196075439453, "global_step": 375611, "epoch": 4525} {"train_loss": -26.439844131469727, "global_step": 375612, "epoch": 4525} {"train_loss": -26.643049240112305, "global_step": 375613, "epoch": 4525} {"train_loss": -26.444305419921875, "global_step": 375614, "epoch": 4525} {"train_loss": -26.53923988342285, "global_step": 375615, "epoch": 4525} {"train_loss": -26.42170524597168, "global_step": 375616, "epoch": 4525} {"train_loss": -26.66473388671875, "global_step": 375617, "epoch": 4525} {"train_loss": -26.740116119384766, "global_step": 375618, "epoch": 4525} {"train_loss": -26.43824577331543, "global_step": 375619, "epoch": 4525} {"train_loss": -26.274600982666016, "global_step": 375620, "epoch": 4525} {"train_loss": -26.620025634765625, "global_step": 375621, "epoch": 4525} {"train_loss": -26.69428062438965, "global_step": 375622, "epoch": 4525} {"train_loss": -26.28407096862793, "global_step": 375623, "epoch": 4525} {"train_loss": -26.39188575744629, "global_step": 375624, "epoch": 4525} {"train_loss": -26.330204010009766, "global_step": 375625, "epoch": 4525} {"train_loss": -26.4257869720459, "global_step": 375626, "epoch": 4525} {"train_loss": -26.451934814453125, "global_step": 375627, "epoch": 4525} {"train_loss": -26.670568466186523, "global_step": 375628, "epoch": 4525} {"train_loss": -26.58203125, "global_step": 375629, "epoch": 4525} {"train_loss": -26.455520629882812, "global_step": 375630, "epoch": 4525} {"train_loss": -26.600996017456055, "global_step": 375631, "epoch": 4525} {"train_loss": -26.8156795501709, "global_step": 375632, "epoch": 4525} {"train_loss": -26.515417098999023, "global_step": 375633, "epoch": 4525} {"train_loss": -26.5970401763916, "global_step": 375634, "epoch": 4525} {"train_loss": -26.528722763061523, "global_step": 375635, "epoch": 4525} {"train_loss": -26.33241844177246, "global_step": 375636, "epoch": 4525} {"train_loss": -26.519895553588867, "global_step": 375637, "epoch": 4525} {"train_loss": -26.665796279907227, "global_step": 375638, "epoch": 4525} {"train_loss": -26.546415328979492, "global_step": 375639, "epoch": 4525} {"train_loss": -26.64227294921875, "global_step": 375640, "epoch": 4525} {"train_loss": -26.52069664001465, "global_step": 375641, "epoch": 4525} {"train_loss": -26.99027442932129, "global_step": 375642, "epoch": 4525} {"train_loss": -26.732410430908203, "global_step": 375643, "epoch": 4525} {"train_loss": -26.415546417236328, "global_step": 375644, "epoch": 4525} {"train_loss": -26.520538330078125, "global_step": 375645, "epoch": 4525} {"train_loss": -26.590559005737305, "global_step": 375646, "epoch": 4525} {"train_loss": -26.326541900634766, "global_step": 375647, "epoch": 4525} {"train_loss": -26.11311149597168, "global_step": 375648, "epoch": 4525} {"train_loss": -26.549657821655273, "global_step": 375649, "epoch": 4525} {"train_loss": -26.73188591003418, "global_step": 375650, "epoch": 4525} {"train_loss": -26.068750381469727, "global_step": 375651, "epoch": 4525} {"train_loss": -26.220067977905273, "global_step": 375652, "epoch": 4525} {"train_loss": -26.359167098999023, "global_step": 375653, "epoch": 4525} {"train_loss": -26.301319122314453, "global_step": 375654, "epoch": 4525} {"train_loss": -26.120481491088867, "global_step": 375655, "epoch": 4525} {"train_loss": -26.370580673217773, "global_step": 375656, "epoch": 4525} {"train_loss": -26.209412264536663, "global_step": 375657, "epoch": 4525, "val_loss": 6576749.5} {"train_loss": -26.50105857849121, "global_step": 375658, "epoch": 4526} {"train_loss": -26.253997802734375, "global_step": 375659, "epoch": 4526} {"train_loss": -25.838003158569336, "global_step": 375660, "epoch": 4526} {"train_loss": -26.554624557495117, "global_step": 375661, "epoch": 4526} {"train_loss": -26.197168350219727, "global_step": 375662, "epoch": 4526} {"train_loss": -26.040302276611328, "global_step": 375663, "epoch": 4526} {"train_loss": -26.425352096557617, "global_step": 375664, "epoch": 4526} {"train_loss": -26.10023307800293, "global_step": 375665, "epoch": 4526} {"train_loss": -26.396753311157227, "global_step": 375666, "epoch": 4526} {"train_loss": -26.355642318725586, "global_step": 375667, "epoch": 4526} {"train_loss": -26.356714248657227, "global_step": 375668, "epoch": 4526} {"train_loss": -26.015644073486328, "global_step": 375669, "epoch": 4526} {"train_loss": -26.39887046813965, "global_step": 375670, "epoch": 4526} {"train_loss": -26.13325309753418, "global_step": 375671, "epoch": 4526} {"train_loss": -26.43950843811035, "global_step": 375672, "epoch": 4526} {"train_loss": -26.335235595703125, "global_step": 375673, "epoch": 4526} {"train_loss": -26.408411026000977, "global_step": 375674, "epoch": 4526} {"train_loss": -26.594501495361328, "global_step": 375675, "epoch": 4526} {"train_loss": -26.55022621154785, "global_step": 375676, "epoch": 4526} {"train_loss": -26.281030654907227, "global_step": 375677, "epoch": 4526} {"train_loss": -26.26517677307129, "global_step": 375678, "epoch": 4526} {"train_loss": -25.922449111938477, "global_step": 375679, "epoch": 4526} {"train_loss": -26.39413833618164, "global_step": 375680, "epoch": 4526} {"train_loss": -26.464826583862305, "global_step": 375681, "epoch": 4526} {"train_loss": -26.387042999267578, "global_step": 375682, "epoch": 4526} {"train_loss": -26.593164443969727, "global_step": 375683, "epoch": 4526} {"train_loss": -26.4561767578125, "global_step": 375684, "epoch": 4526} {"train_loss": -26.314208984375, "global_step": 375685, "epoch": 4526} {"train_loss": -26.549177169799805, "global_step": 375686, "epoch": 4526} {"train_loss": -26.370588302612305, "global_step": 375687, "epoch": 4526} {"train_loss": -26.46744728088379, "global_step": 375688, "epoch": 4526} {"train_loss": -26.4345760345459, "global_step": 375689, "epoch": 4526} {"train_loss": -26.25716209411621, "global_step": 375690, "epoch": 4526} {"train_loss": -26.5670223236084, "global_step": 375691, "epoch": 4526} {"train_loss": -26.3236141204834, "global_step": 375692, "epoch": 4526} {"train_loss": -26.554075241088867, "global_step": 375693, "epoch": 4526} {"train_loss": -26.362873077392578, "global_step": 375694, "epoch": 4526} {"train_loss": -26.063587188720703, "global_step": 375695, "epoch": 4526} {"train_loss": -26.886877059936523, "global_step": 375696, "epoch": 4526} {"train_loss": -26.573877334594727, "global_step": 375697, "epoch": 4526} {"train_loss": -26.417526245117188, "global_step": 375698, "epoch": 4526} {"train_loss": -26.49686050415039, "global_step": 375699, "epoch": 4526} {"train_loss": -26.474639892578125, "global_step": 375700, "epoch": 4526} {"train_loss": -26.698078155517578, "global_step": 375701, "epoch": 4526} {"train_loss": -26.371185302734375, "global_step": 375702, "epoch": 4526} {"train_loss": -26.577306747436523, "global_step": 375703, "epoch": 4526} {"train_loss": -26.313644409179688, "global_step": 375704, "epoch": 4526} {"train_loss": -26.48870849609375, "global_step": 375705, "epoch": 4526} {"train_loss": -26.487964630126953, "global_step": 375706, "epoch": 4526} {"train_loss": -26.46405029296875, "global_step": 375707, "epoch": 4526} {"train_loss": -26.31034278869629, "global_step": 375708, "epoch": 4526} {"train_loss": -26.357654571533203, "global_step": 375709, "epoch": 4526} {"train_loss": -26.106916427612305, "global_step": 375710, "epoch": 4526} {"train_loss": -26.587919235229492, "global_step": 375711, "epoch": 4526} {"train_loss": -26.464324951171875, "global_step": 375712, "epoch": 4526} {"train_loss": -26.3773250579834, "global_step": 375713, "epoch": 4526} {"train_loss": -26.511560440063477, "global_step": 375714, "epoch": 4526} {"train_loss": -26.62468910217285, "global_step": 375715, "epoch": 4526} {"train_loss": -26.70849609375, "global_step": 375716, "epoch": 4526} {"train_loss": -26.290924072265625, "global_step": 375717, "epoch": 4526} {"train_loss": -26.45979881286621, "global_step": 375718, "epoch": 4526} {"train_loss": -26.104406356811523, "global_step": 375719, "epoch": 4526} {"train_loss": -26.347021102905273, "global_step": 375720, "epoch": 4526} {"train_loss": -26.540124893188477, "global_step": 375721, "epoch": 4526} {"train_loss": -26.262006759643555, "global_step": 375722, "epoch": 4526} {"train_loss": -26.275358200073242, "global_step": 375723, "epoch": 4526} {"train_loss": -26.385242462158203, "global_step": 375724, "epoch": 4526} {"train_loss": -26.370853424072266, "global_step": 375725, "epoch": 4526} {"train_loss": -26.50653648376465, "global_step": 375726, "epoch": 4526} {"train_loss": -26.019140243530273, "global_step": 375727, "epoch": 4526} {"train_loss": -26.45772361755371, "global_step": 375728, "epoch": 4526} {"train_loss": -26.460357666015625, "global_step": 375729, "epoch": 4526} {"train_loss": -26.374860763549805, "global_step": 375730, "epoch": 4526} {"train_loss": -26.285354614257812, "global_step": 375731, "epoch": 4526} {"train_loss": -25.92778968811035, "global_step": 375732, "epoch": 4526} {"train_loss": -26.32428550720215, "global_step": 375733, "epoch": 4526} {"train_loss": -26.359210968017578, "global_step": 375734, "epoch": 4526} {"train_loss": -26.27277946472168, "global_step": 375735, "epoch": 4526} {"train_loss": -26.3301944732666, "global_step": 375736, "epoch": 4526} {"train_loss": -26.75946044921875, "global_step": 375737, "epoch": 4526} {"train_loss": -26.329608917236328, "global_step": 375738, "epoch": 4526} {"train_loss": -25.9156436920166, "global_step": 375739, "epoch": 4526} {"train_loss": -26.37325806215585, "global_step": 375740, "epoch": 4526, "val_loss": 6628565.5} {"train_loss": -25.345251083374023, "global_step": 375741, "epoch": 4527} {"train_loss": -24.586368560791016, "global_step": 375742, "epoch": 4527} {"train_loss": -24.876195907592773, "global_step": 375743, "epoch": 4527} {"train_loss": -24.735321044921875, "global_step": 375744, "epoch": 4527} {"train_loss": -25.17059898376465, "global_step": 375745, "epoch": 4527} {"train_loss": -24.72956657409668, "global_step": 375746, "epoch": 4527} {"train_loss": -25.835493087768555, "global_step": 375747, "epoch": 4527} {"train_loss": -25.500417709350586, "global_step": 375748, "epoch": 4527} {"train_loss": -25.58407974243164, "global_step": 375749, "epoch": 4527} {"train_loss": -25.495670318603516, "global_step": 375750, "epoch": 4527} {"train_loss": -25.569133758544922, "global_step": 375751, "epoch": 4527} {"train_loss": -25.719396591186523, "global_step": 375752, "epoch": 4527} {"train_loss": -26.094818115234375, "global_step": 375753, "epoch": 4527} {"train_loss": -25.477317810058594, "global_step": 375754, "epoch": 4527} {"train_loss": -25.7531681060791, "global_step": 375755, "epoch": 4527} {"train_loss": -25.772388458251953, "global_step": 375756, "epoch": 4527} {"train_loss": -25.610157012939453, "global_step": 375757, "epoch": 4527} {"train_loss": -25.773466110229492, "global_step": 375758, "epoch": 4527} {"train_loss": -26.127700805664062, "global_step": 375759, "epoch": 4527} {"train_loss": -26.157087326049805, "global_step": 375760, "epoch": 4527} {"train_loss": -25.960615158081055, "global_step": 375761, "epoch": 4527} {"train_loss": -25.768329620361328, "global_step": 375762, "epoch": 4527} {"train_loss": -26.1198673248291, "global_step": 375763, "epoch": 4527} {"train_loss": -25.916675567626953, "global_step": 375764, "epoch": 4527} {"train_loss": -26.518478393554688, "global_step": 375765, "epoch": 4527} {"train_loss": -26.23878288269043, "global_step": 375766, "epoch": 4527} {"train_loss": -26.291479110717773, "global_step": 375767, "epoch": 4527} {"train_loss": -26.54666519165039, "global_step": 375768, "epoch": 4527} {"train_loss": -25.974573135375977, "global_step": 375769, "epoch": 4527} {"train_loss": -26.473464965820312, "global_step": 375770, "epoch": 4527} {"train_loss": -26.105987548828125, "global_step": 375771, "epoch": 4527} {"train_loss": -25.931055068969727, "global_step": 375772, "epoch": 4527} {"train_loss": -26.28712272644043, "global_step": 375773, "epoch": 4527} {"train_loss": -26.12336540222168, "global_step": 375774, "epoch": 4527} {"train_loss": -26.291349411010742, "global_step": 375775, "epoch": 4527} {"train_loss": -26.512266159057617, "global_step": 375776, "epoch": 4527} {"train_loss": -26.470029830932617, "global_step": 375777, "epoch": 4527} {"train_loss": -26.33829689025879, "global_step": 375778, "epoch": 4527} {"train_loss": -26.679065704345703, "global_step": 375779, "epoch": 4527} {"train_loss": -26.63483238220215, "global_step": 375780, "epoch": 4527} {"train_loss": -26.46044921875, "global_step": 375781, "epoch": 4527} {"train_loss": -26.151050567626953, "global_step": 375782, "epoch": 4527} {"train_loss": -26.33349609375, "global_step": 375783, "epoch": 4527} {"train_loss": -26.2562313079834, "global_step": 375784, "epoch": 4527} {"train_loss": -26.354337692260742, "global_step": 375785, "epoch": 4527} {"train_loss": -26.752256393432617, "global_step": 375786, "epoch": 4527} {"train_loss": -26.531768798828125, "global_step": 375787, "epoch": 4527} {"train_loss": -26.453039169311523, "global_step": 375788, "epoch": 4527} {"train_loss": -26.27142333984375, "global_step": 375789, "epoch": 4527} {"train_loss": -26.567752838134766, "global_step": 375790, "epoch": 4527} {"train_loss": -26.587997436523438, "global_step": 375791, "epoch": 4527} {"train_loss": -26.217222213745117, "global_step": 375792, "epoch": 4527} {"train_loss": -26.41266441345215, "global_step": 375793, "epoch": 4527} {"train_loss": -26.639326095581055, "global_step": 375794, "epoch": 4527} {"train_loss": -25.974109649658203, "global_step": 375795, "epoch": 4527} {"train_loss": -26.215015411376953, "global_step": 375796, "epoch": 4527} {"train_loss": -26.450702667236328, "global_step": 375797, "epoch": 4527} {"train_loss": -26.160968780517578, "global_step": 375798, "epoch": 4527} {"train_loss": -26.012847900390625, "global_step": 375799, "epoch": 4527} {"train_loss": -26.596282958984375, "global_step": 375800, "epoch": 4527} {"train_loss": -26.570053100585938, "global_step": 375801, "epoch": 4527} {"train_loss": -26.590179443359375, "global_step": 375802, "epoch": 4527} {"train_loss": -26.599817276000977, "global_step": 375803, "epoch": 4527} {"train_loss": -26.441736221313477, "global_step": 375804, "epoch": 4527} {"train_loss": -26.43732261657715, "global_step": 375805, "epoch": 4527} {"train_loss": -26.84098243713379, "global_step": 375806, "epoch": 4527} {"train_loss": -26.69654655456543, "global_step": 375807, "epoch": 4527} {"train_loss": -26.416839599609375, "global_step": 375808, "epoch": 4527} {"train_loss": -26.595808029174805, "global_step": 375809, "epoch": 4527} {"train_loss": -26.326175689697266, "global_step": 375810, "epoch": 4527} {"train_loss": -26.680578231811523, "global_step": 375811, "epoch": 4527} {"train_loss": -26.548297882080078, "global_step": 375812, "epoch": 4527} {"train_loss": -25.953588485717773, "global_step": 375813, "epoch": 4527} {"train_loss": -26.718994140625, "global_step": 375814, "epoch": 4527} {"train_loss": -26.11374855041504, "global_step": 375815, "epoch": 4527} {"train_loss": -26.294219970703125, "global_step": 375816, "epoch": 4527} {"train_loss": -26.397306442260742, "global_step": 375817, "epoch": 4527} {"train_loss": -26.40534782409668, "global_step": 375818, "epoch": 4527} {"train_loss": -26.488752365112305, "global_step": 375819, "epoch": 4527} {"train_loss": -26.72039794921875, "global_step": 375820, "epoch": 4527} {"train_loss": -26.21938133239746, "global_step": 375821, "epoch": 4527} {"train_loss": -26.464202880859375, "global_step": 375822, "epoch": 4527} {"train_loss": -26.155081829392767, "global_step": 375823, "epoch": 4527, "val_loss": 6669957.5} {"train_loss": -26.084369659423828, "global_step": 375824, "epoch": 4528} {"train_loss": -25.99592399597168, "global_step": 375825, "epoch": 4528} {"train_loss": -26.32331657409668, "global_step": 375826, "epoch": 4528} {"train_loss": -26.197397232055664, "global_step": 375827, "epoch": 4528} {"train_loss": -25.913496017456055, "global_step": 375828, "epoch": 4528} {"train_loss": -26.154306411743164, "global_step": 375829, "epoch": 4528} {"train_loss": -26.04878044128418, "global_step": 375830, "epoch": 4528} {"train_loss": -26.19597816467285, "global_step": 375831, "epoch": 4528} {"train_loss": -26.00739860534668, "global_step": 375832, "epoch": 4528} {"train_loss": -26.027673721313477, "global_step": 375833, "epoch": 4528} {"train_loss": -26.202381134033203, "global_step": 375834, "epoch": 4528} {"train_loss": -26.303781509399414, "global_step": 375835, "epoch": 4528} {"train_loss": -26.567808151245117, "global_step": 375836, "epoch": 4528} {"train_loss": -26.00714111328125, "global_step": 375837, "epoch": 4528} {"train_loss": -26.542999267578125, "global_step": 375838, "epoch": 4528} {"train_loss": -26.6920223236084, "global_step": 375839, "epoch": 4528} {"train_loss": -26.307233810424805, "global_step": 375840, "epoch": 4528} {"train_loss": -26.479894638061523, "global_step": 375841, "epoch": 4528} {"train_loss": -26.274255752563477, "global_step": 375842, "epoch": 4528} {"train_loss": -26.157352447509766, "global_step": 375843, "epoch": 4528} {"train_loss": -26.18782615661621, "global_step": 375844, "epoch": 4528} {"train_loss": -26.210081100463867, "global_step": 375845, "epoch": 4528} {"train_loss": -26.0162296295166, "global_step": 375846, "epoch": 4528} {"train_loss": -25.82343101501465, "global_step": 375847, "epoch": 4528} {"train_loss": -26.213048934936523, "global_step": 375848, "epoch": 4528} {"train_loss": -26.30409049987793, "global_step": 375849, "epoch": 4528} {"train_loss": -26.435882568359375, "global_step": 375850, "epoch": 4528} {"train_loss": -26.306289672851562, "global_step": 375851, "epoch": 4528} {"train_loss": -25.916900634765625, "global_step": 375852, "epoch": 4528} {"train_loss": -26.49147605895996, "global_step": 375853, "epoch": 4528} {"train_loss": -26.28977394104004, "global_step": 375854, "epoch": 4528} {"train_loss": -26.376249313354492, "global_step": 375855, "epoch": 4528} {"train_loss": -26.116455078125, "global_step": 375856, "epoch": 4528} {"train_loss": -26.352405548095703, "global_step": 375857, "epoch": 4528} {"train_loss": -26.372602462768555, "global_step": 375858, "epoch": 4528} {"train_loss": -26.468891143798828, "global_step": 375859, "epoch": 4528} {"train_loss": -26.352848052978516, "global_step": 375860, "epoch": 4528} {"train_loss": -26.58662223815918, "global_step": 375861, "epoch": 4528} {"train_loss": -26.50043296813965, "global_step": 375862, "epoch": 4528} {"train_loss": -26.562610626220703, "global_step": 375863, "epoch": 4528} {"train_loss": -26.66135597229004, "global_step": 375864, "epoch": 4528} {"train_loss": -26.09539794921875, "global_step": 375865, "epoch": 4528} {"train_loss": -26.33247184753418, "global_step": 375866, "epoch": 4528} {"train_loss": -26.769739151000977, "global_step": 375867, "epoch": 4528} {"train_loss": -26.33785057067871, "global_step": 375868, "epoch": 4528} {"train_loss": -26.586111068725586, "global_step": 375869, "epoch": 4528} {"train_loss": -26.744348526000977, "global_step": 375870, "epoch": 4528} {"train_loss": -26.60640525817871, "global_step": 375871, "epoch": 4528} {"train_loss": -26.357709884643555, "global_step": 375872, "epoch": 4528} {"train_loss": -26.387128829956055, "global_step": 375873, "epoch": 4528} {"train_loss": -26.5823974609375, "global_step": 375874, "epoch": 4528} {"train_loss": -26.59998893737793, "global_step": 375875, "epoch": 4528} {"train_loss": -26.63425064086914, "global_step": 375876, "epoch": 4528} {"train_loss": -26.243993759155273, "global_step": 375877, "epoch": 4528} {"train_loss": -26.398426055908203, "global_step": 375878, "epoch": 4528} {"train_loss": -26.370361328125, "global_step": 375879, "epoch": 4528} {"train_loss": -26.290380477905273, "global_step": 375880, "epoch": 4528} {"train_loss": -26.74151611328125, "global_step": 375881, "epoch": 4528} {"train_loss": -26.314655303955078, "global_step": 375882, "epoch": 4528} {"train_loss": -26.193363189697266, "global_step": 375883, "epoch": 4528} {"train_loss": -26.179462432861328, "global_step": 375884, "epoch": 4528} {"train_loss": -26.067697525024414, "global_step": 375885, "epoch": 4528} {"train_loss": -26.511463165283203, "global_step": 375886, "epoch": 4528} {"train_loss": -26.25447654724121, "global_step": 375887, "epoch": 4528} {"train_loss": -26.277570724487305, "global_step": 375888, "epoch": 4528} {"train_loss": -26.46860122680664, "global_step": 375889, "epoch": 4528} {"train_loss": -26.314132690429688, "global_step": 375890, "epoch": 4528} {"train_loss": -26.068683624267578, "global_step": 375891, "epoch": 4528} {"train_loss": -25.9874324798584, "global_step": 375892, "epoch": 4528} {"train_loss": -26.38532066345215, "global_step": 375893, "epoch": 4528} {"train_loss": -26.46428871154785, "global_step": 375894, "epoch": 4528} {"train_loss": -26.395721435546875, "global_step": 375895, "epoch": 4528} {"train_loss": -26.643030166625977, "global_step": 375896, "epoch": 4528} {"train_loss": -26.294330596923828, "global_step": 375897, "epoch": 4528} {"train_loss": -26.8674373626709, "global_step": 375898, "epoch": 4528} {"train_loss": -26.552560806274414, "global_step": 375899, "epoch": 4528} {"train_loss": -26.7503719329834, "global_step": 375900, "epoch": 4528} {"train_loss": -26.2655086517334, "global_step": 375901, "epoch": 4528} {"train_loss": -26.75604248046875, "global_step": 375902, "epoch": 4528} {"train_loss": -26.094884872436523, "global_step": 375903, "epoch": 4528} {"train_loss": -26.4910945892334, "global_step": 375904, "epoch": 4528} {"train_loss": -26.33407974243164, "global_step": 375905, "epoch": 4528} {"train_loss": -26.344171822789203, "global_step": 375906, "epoch": 4528, "val_loss": 6590875.5} {"train_loss": -26.015167236328125, "global_step": 375907, "epoch": 4529} {"train_loss": -25.334989547729492, "global_step": 375908, "epoch": 4529} {"train_loss": -25.570556640625, "global_step": 375909, "epoch": 4529} {"train_loss": -26.20210838317871, "global_step": 375910, "epoch": 4529} {"train_loss": -25.4012393951416, "global_step": 375911, "epoch": 4529} {"train_loss": -25.547204971313477, "global_step": 375912, "epoch": 4529} {"train_loss": -25.402799606323242, "global_step": 375913, "epoch": 4529} {"train_loss": -26.337377548217773, "global_step": 375914, "epoch": 4529} {"train_loss": -25.36960792541504, "global_step": 375915, "epoch": 4529} {"train_loss": -25.911376953125, "global_step": 375916, "epoch": 4529} {"train_loss": -25.633573532104492, "global_step": 375917, "epoch": 4529} {"train_loss": -25.312992095947266, "global_step": 375918, "epoch": 4529} {"train_loss": -26.108999252319336, "global_step": 375919, "epoch": 4529} {"train_loss": -25.985082626342773, "global_step": 375920, "epoch": 4529} {"train_loss": -26.03586769104004, "global_step": 375921, "epoch": 4529} {"train_loss": -26.056049346923828, "global_step": 375922, "epoch": 4529} {"train_loss": -25.98048973083496, "global_step": 375923, "epoch": 4529} {"train_loss": -26.042194366455078, "global_step": 375924, "epoch": 4529} {"train_loss": -26.290563583374023, "global_step": 375925, "epoch": 4529} {"train_loss": -26.26072120666504, "global_step": 375926, "epoch": 4529} {"train_loss": -26.241342544555664, "global_step": 375927, "epoch": 4529} {"train_loss": -26.138519287109375, "global_step": 375928, "epoch": 4529} {"train_loss": -26.028345108032227, "global_step": 375929, "epoch": 4529} {"train_loss": -25.945730209350586, "global_step": 375930, "epoch": 4529} {"train_loss": -26.166797637939453, "global_step": 375931, "epoch": 4529} {"train_loss": -26.26006507873535, "global_step": 375932, "epoch": 4529} {"train_loss": -26.11081314086914, "global_step": 375933, "epoch": 4529} {"train_loss": -26.569990158081055, "global_step": 375934, "epoch": 4529} {"train_loss": -26.180688858032227, "global_step": 375935, "epoch": 4529} {"train_loss": -26.172937393188477, "global_step": 375936, "epoch": 4529} {"train_loss": -26.6785945892334, "global_step": 375937, "epoch": 4529} {"train_loss": -26.194660186767578, "global_step": 375938, "epoch": 4529} {"train_loss": -26.5279598236084, "global_step": 375939, "epoch": 4529} {"train_loss": -26.50241470336914, "global_step": 375940, "epoch": 4529} {"train_loss": -26.377721786499023, "global_step": 375941, "epoch": 4529} {"train_loss": -26.338796615600586, "global_step": 375942, "epoch": 4529} {"train_loss": -26.121063232421875, "global_step": 375943, "epoch": 4529} {"train_loss": -26.5126953125, "global_step": 375944, "epoch": 4529} {"train_loss": -26.811426162719727, "global_step": 375945, "epoch": 4529} {"train_loss": -26.69414710998535, "global_step": 375946, "epoch": 4529} {"train_loss": -26.811416625976562, "global_step": 375947, "epoch": 4529} {"train_loss": -26.596033096313477, "global_step": 375948, "epoch": 4529} {"train_loss": -26.396240234375, "global_step": 375949, "epoch": 4529} {"train_loss": -26.536657333374023, "global_step": 375950, "epoch": 4529} {"train_loss": -26.49774742126465, "global_step": 375951, "epoch": 4529} {"train_loss": -26.461536407470703, "global_step": 375952, "epoch": 4529} {"train_loss": -26.18988037109375, "global_step": 375953, "epoch": 4529} {"train_loss": -26.710193634033203, "global_step": 375954, "epoch": 4529} {"train_loss": -26.913639068603516, "global_step": 375955, "epoch": 4529} {"train_loss": -26.727209091186523, "global_step": 375956, "epoch": 4529} {"train_loss": -26.822589874267578, "global_step": 375957, "epoch": 4529} {"train_loss": -26.647632598876953, "global_step": 375958, "epoch": 4529} {"train_loss": -26.63223648071289, "global_step": 375959, "epoch": 4529} {"train_loss": -26.4481143951416, "global_step": 375960, "epoch": 4529} {"train_loss": -26.526350021362305, "global_step": 375961, "epoch": 4529} {"train_loss": -26.51483154296875, "global_step": 375962, "epoch": 4529} {"train_loss": -26.528528213500977, "global_step": 375963, "epoch": 4529} {"train_loss": -26.206317901611328, "global_step": 375964, "epoch": 4529} {"train_loss": -25.80474853515625, "global_step": 375965, "epoch": 4529} {"train_loss": -25.805953979492188, "global_step": 375966, "epoch": 4529} {"train_loss": -26.06525993347168, "global_step": 375967, "epoch": 4529} {"train_loss": -26.07355308532715, "global_step": 375968, "epoch": 4529} {"train_loss": -26.417139053344727, "global_step": 375969, "epoch": 4529} {"train_loss": -26.55191421508789, "global_step": 375970, "epoch": 4529} {"train_loss": -26.071924209594727, "global_step": 375971, "epoch": 4529} {"train_loss": -25.981048583984375, "global_step": 375972, "epoch": 4529} {"train_loss": -26.51665687561035, "global_step": 375973, "epoch": 4529} {"train_loss": -26.42820167541504, "global_step": 375974, "epoch": 4529} {"train_loss": -25.989028930664062, "global_step": 375975, "epoch": 4529} {"train_loss": -26.40996742248535, "global_step": 375976, "epoch": 4529} {"train_loss": -26.199752807617188, "global_step": 375977, "epoch": 4529} {"train_loss": -25.661497116088867, "global_step": 375978, "epoch": 4529} {"train_loss": -26.226911544799805, "global_step": 375979, "epoch": 4529} {"train_loss": -25.859603881835938, "global_step": 375980, "epoch": 4529} {"train_loss": -26.327489852905273, "global_step": 375981, "epoch": 4529} {"train_loss": -26.540159225463867, "global_step": 375982, "epoch": 4529} {"train_loss": -26.035451889038086, "global_step": 375983, "epoch": 4529} {"train_loss": -26.6372013092041, "global_step": 375984, "epoch": 4529} {"train_loss": -26.013050079345703, "global_step": 375985, "epoch": 4529} {"train_loss": -26.18695640563965, "global_step": 375986, "epoch": 4529} {"train_loss": -26.090925216674805, "global_step": 375987, "epoch": 4529} {"train_loss": -26.43415641784668, "global_step": 375988, "epoch": 4529} {"train_loss": -26.208701283098705, "global_step": 375989, "epoch": 4529, "val_loss": 6613857.0} {"train_loss": -25.132080078125, "global_step": 375990, "epoch": 4530} {"train_loss": -24.942169189453125, "global_step": 375991, "epoch": 4530} {"train_loss": -25.309890747070312, "global_step": 375992, "epoch": 4530} {"train_loss": -25.374685287475586, "global_step": 375993, "epoch": 4530} {"train_loss": -25.57002067565918, "global_step": 375994, "epoch": 4530} {"train_loss": -26.1016902923584, "global_step": 375995, "epoch": 4530} {"train_loss": -25.35045051574707, "global_step": 375996, "epoch": 4530} {"train_loss": -26.1289119720459, "global_step": 375997, "epoch": 4530} {"train_loss": -25.7871036529541, "global_step": 375998, "epoch": 4530} {"train_loss": -25.890249252319336, "global_step": 375999, "epoch": 4530} {"train_loss": -25.84255027770996, "global_step": 376000, "epoch": 4530} {"train_loss": -25.831823348999023, "global_step": 376001, "epoch": 4530} {"train_loss": -26.1121768951416, "global_step": 376002, "epoch": 4530} {"train_loss": -26.08246421813965, "global_step": 376003, "epoch": 4530} {"train_loss": -26.1673583984375, "global_step": 376004, "epoch": 4530} {"train_loss": -26.22530174255371, "global_step": 376005, "epoch": 4530} {"train_loss": -26.056005477905273, "global_step": 376006, "epoch": 4530} {"train_loss": -26.367639541625977, "global_step": 376007, "epoch": 4530} {"train_loss": -26.05812644958496, "global_step": 376008, "epoch": 4530} {"train_loss": -26.169164657592773, "global_step": 376009, "epoch": 4530} {"train_loss": -26.471097946166992, "global_step": 376010, "epoch": 4530} {"train_loss": -26.390018463134766, "global_step": 376011, "epoch": 4530} {"train_loss": -26.678770065307617, "global_step": 376012, "epoch": 4530} {"train_loss": -26.712162017822266, "global_step": 376013, "epoch": 4530} {"train_loss": -26.359790802001953, "global_step": 376014, "epoch": 4530} {"train_loss": -26.181303024291992, "global_step": 376015, "epoch": 4530} {"train_loss": -26.28610610961914, "global_step": 376016, "epoch": 4530} {"train_loss": -26.14773941040039, "global_step": 376017, "epoch": 4530} {"train_loss": -26.38205909729004, "global_step": 376018, "epoch": 4530} {"train_loss": -26.29090690612793, "global_step": 376019, "epoch": 4530} {"train_loss": -26.22285270690918, "global_step": 376020, "epoch": 4530} {"train_loss": -25.987695693969727, "global_step": 376021, "epoch": 4530} {"train_loss": -26.277130126953125, "global_step": 376022, "epoch": 4530} {"train_loss": -26.593992233276367, "global_step": 376023, "epoch": 4530} {"train_loss": -26.591861724853516, "global_step": 376024, "epoch": 4530} {"train_loss": -26.877593994140625, "global_step": 376025, "epoch": 4530} {"train_loss": -26.502973556518555, "global_step": 376026, "epoch": 4530} {"train_loss": -26.53818702697754, "global_step": 376027, "epoch": 4530} {"train_loss": -26.596454620361328, "global_step": 376028, "epoch": 4530} {"train_loss": -26.736501693725586, "global_step": 376029, "epoch": 4530} {"train_loss": -26.312854766845703, "global_step": 376030, "epoch": 4530} {"train_loss": -26.984785079956055, "global_step": 376031, "epoch": 4530} {"train_loss": -26.637914657592773, "global_step": 376032, "epoch": 4530} {"train_loss": -26.082355499267578, "global_step": 376033, "epoch": 4530} {"train_loss": -26.23712158203125, "global_step": 376034, "epoch": 4530} {"train_loss": -26.404678344726562, "global_step": 376035, "epoch": 4530} {"train_loss": -26.39413833618164, "global_step": 376036, "epoch": 4530} {"train_loss": -26.62255859375, "global_step": 376037, "epoch": 4530} {"train_loss": -26.445947647094727, "global_step": 376038, "epoch": 4530} {"train_loss": -25.964099884033203, "global_step": 376039, "epoch": 4530} {"train_loss": -26.299604415893555, "global_step": 376040, "epoch": 4530} {"train_loss": -26.832916259765625, "global_step": 376041, "epoch": 4530} {"train_loss": -26.503934860229492, "global_step": 376042, "epoch": 4530} {"train_loss": -26.448657989501953, "global_step": 376043, "epoch": 4530} {"train_loss": -26.056909561157227, "global_step": 376044, "epoch": 4530} {"train_loss": -26.500234603881836, "global_step": 376045, "epoch": 4530} {"train_loss": -26.603769302368164, "global_step": 376046, "epoch": 4530} {"train_loss": -26.29585075378418, "global_step": 376047, "epoch": 4530} {"train_loss": -26.007009506225586, "global_step": 376048, "epoch": 4530} {"train_loss": -26.849090576171875, "global_step": 376049, "epoch": 4530} {"train_loss": -26.315229415893555, "global_step": 376050, "epoch": 4530} {"train_loss": -26.328937530517578, "global_step": 376051, "epoch": 4530} {"train_loss": -25.71856117248535, "global_step": 376052, "epoch": 4530} {"train_loss": -25.6003475189209, "global_step": 376053, "epoch": 4530} {"train_loss": -26.407703399658203, "global_step": 376054, "epoch": 4530} {"train_loss": -26.392135620117188, "global_step": 376055, "epoch": 4530} {"train_loss": -26.2426815032959, "global_step": 376056, "epoch": 4530} {"train_loss": -26.53742790222168, "global_step": 376057, "epoch": 4530} {"train_loss": -26.49509620666504, "global_step": 376058, "epoch": 4530} {"train_loss": -26.121374130249023, "global_step": 376059, "epoch": 4530} {"train_loss": -26.40372657775879, "global_step": 376060, "epoch": 4530} {"train_loss": -26.135055541992188, "global_step": 376061, "epoch": 4530} {"train_loss": -26.633228302001953, "global_step": 376062, "epoch": 4530} {"train_loss": -26.262598037719727, "global_step": 376063, "epoch": 4530} {"train_loss": -26.603479385375977, "global_step": 376064, "epoch": 4530} {"train_loss": -26.5241641998291, "global_step": 376065, "epoch": 4530} {"train_loss": -26.736745834350586, "global_step": 376066, "epoch": 4530} {"train_loss": -26.6653995513916, "global_step": 376067, "epoch": 4530} {"train_loss": -26.472381591796875, "global_step": 376068, "epoch": 4530} {"train_loss": -26.790658950805664, "global_step": 376069, "epoch": 4530} {"train_loss": -26.207910537719727, "global_step": 376070, "epoch": 4530} {"train_loss": -26.58028221130371, "global_step": 376071, "epoch": 4530} {"train_loss": -26.258713205176665, "global_step": 376072, "epoch": 4530, "val_loss": 6661967.0} {"train_loss": -26.151050567626953, "global_step": 376073, "epoch": 4531} {"train_loss": -25.907758712768555, "global_step": 376074, "epoch": 4531} {"train_loss": -26.636341094970703, "global_step": 376075, "epoch": 4531} {"train_loss": -26.387943267822266, "global_step": 376076, "epoch": 4531} {"train_loss": -26.06292152404785, "global_step": 376077, "epoch": 4531} {"train_loss": -26.519947052001953, "global_step": 376078, "epoch": 4531} {"train_loss": -26.22157096862793, "global_step": 376079, "epoch": 4531} {"train_loss": -26.46884536743164, "global_step": 376080, "epoch": 4531} {"train_loss": -26.127477645874023, "global_step": 376081, "epoch": 4531} {"train_loss": -26.4592227935791, "global_step": 376082, "epoch": 4531} {"train_loss": -26.09527587890625, "global_step": 376083, "epoch": 4531} {"train_loss": -26.3959903717041, "global_step": 376084, "epoch": 4531} {"train_loss": -26.246829986572266, "global_step": 376085, "epoch": 4531} {"train_loss": -26.497058868408203, "global_step": 376086, "epoch": 4531} {"train_loss": -26.504194259643555, "global_step": 376087, "epoch": 4531} {"train_loss": -26.309558868408203, "global_step": 376088, "epoch": 4531} {"train_loss": -26.199796676635742, "global_step": 376089, "epoch": 4531} {"train_loss": -26.835851669311523, "global_step": 376090, "epoch": 4531} {"train_loss": -25.919641494750977, "global_step": 376091, "epoch": 4531} {"train_loss": -26.092147827148438, "global_step": 376092, "epoch": 4531} {"train_loss": -26.25092124938965, "global_step": 376093, "epoch": 4531} {"train_loss": -26.305118560791016, "global_step": 376094, "epoch": 4531} {"train_loss": -26.268213272094727, "global_step": 376095, "epoch": 4531} {"train_loss": -25.977920532226562, "global_step": 376096, "epoch": 4531} {"train_loss": -26.43792724609375, "global_step": 376097, "epoch": 4531} {"train_loss": -26.529800415039062, "global_step": 376098, "epoch": 4531} {"train_loss": -26.121301651000977, "global_step": 376099, "epoch": 4531} {"train_loss": -26.12322425842285, "global_step": 376100, "epoch": 4531} {"train_loss": -26.40313720703125, "global_step": 376101, "epoch": 4531} {"train_loss": -26.370670318603516, "global_step": 376102, "epoch": 4531} {"train_loss": -26.102375030517578, "global_step": 376103, "epoch": 4531} {"train_loss": -26.218225479125977, "global_step": 376104, "epoch": 4531} {"train_loss": -25.884906768798828, "global_step": 376105, "epoch": 4531} {"train_loss": -26.615299224853516, "global_step": 376106, "epoch": 4531} {"train_loss": -25.662755966186523, "global_step": 376107, "epoch": 4531} {"train_loss": -26.07428550720215, "global_step": 376108, "epoch": 4531} {"train_loss": -25.87799072265625, "global_step": 376109, "epoch": 4531} {"train_loss": -26.154850006103516, "global_step": 376110, "epoch": 4531} {"train_loss": -26.030242919921875, "global_step": 376111, "epoch": 4531} {"train_loss": -26.065099716186523, "global_step": 376112, "epoch": 4531} {"train_loss": -26.15705680847168, "global_step": 376113, "epoch": 4531} {"train_loss": -26.53419303894043, "global_step": 376114, "epoch": 4531} {"train_loss": -26.06475830078125, "global_step": 376115, "epoch": 4531} {"train_loss": -26.338544845581055, "global_step": 376116, "epoch": 4531} {"train_loss": -26.099197387695312, "global_step": 376117, "epoch": 4531} {"train_loss": -26.22705078125, "global_step": 376118, "epoch": 4531} {"train_loss": -26.45098876953125, "global_step": 376119, "epoch": 4531} {"train_loss": -26.10524559020996, "global_step": 376120, "epoch": 4531} {"train_loss": -26.474069595336914, "global_step": 376121, "epoch": 4531} {"train_loss": -26.581327438354492, "global_step": 376122, "epoch": 4531} {"train_loss": -26.259292602539062, "global_step": 376123, "epoch": 4531} {"train_loss": -26.13640785217285, "global_step": 376124, "epoch": 4531} {"train_loss": -26.142425537109375, "global_step": 376125, "epoch": 4531} {"train_loss": -26.1458683013916, "global_step": 376126, "epoch": 4531} {"train_loss": -26.50310707092285, "global_step": 376127, "epoch": 4531} {"train_loss": -26.360265731811523, "global_step": 376128, "epoch": 4531} {"train_loss": -26.760351181030273, "global_step": 376129, "epoch": 4531} {"train_loss": -26.64692497253418, "global_step": 376130, "epoch": 4531} {"train_loss": -26.340097427368164, "global_step": 376131, "epoch": 4531} {"train_loss": -26.451589584350586, "global_step": 376132, "epoch": 4531} {"train_loss": -26.4345645904541, "global_step": 376133, "epoch": 4531} {"train_loss": -27.18977928161621, "global_step": 376134, "epoch": 4531} {"train_loss": -26.62860107421875, "global_step": 376135, "epoch": 4531} {"train_loss": -26.38800048828125, "global_step": 376136, "epoch": 4531} {"train_loss": -26.106510162353516, "global_step": 376137, "epoch": 4531} {"train_loss": -26.185699462890625, "global_step": 376138, "epoch": 4531} {"train_loss": -26.58540916442871, "global_step": 376139, "epoch": 4531} {"train_loss": -26.490909576416016, "global_step": 376140, "epoch": 4531} {"train_loss": -26.73453140258789, "global_step": 376141, "epoch": 4531} {"train_loss": -26.368270874023438, "global_step": 376142, "epoch": 4531} {"train_loss": -26.640127182006836, "global_step": 376143, "epoch": 4531} {"train_loss": -26.097003936767578, "global_step": 376144, "epoch": 4531} {"train_loss": -26.794248580932617, "global_step": 376145, "epoch": 4531} {"train_loss": -26.878461837768555, "global_step": 376146, "epoch": 4531} {"train_loss": -26.329015731811523, "global_step": 376147, "epoch": 4531} {"train_loss": -26.510400772094727, "global_step": 376148, "epoch": 4531} {"train_loss": -26.294952392578125, "global_step": 376149, "epoch": 4531} {"train_loss": -26.21991539001465, "global_step": 376150, "epoch": 4531} {"train_loss": -26.5750789642334, "global_step": 376151, "epoch": 4531} {"train_loss": -26.643741607666016, "global_step": 376152, "epoch": 4531} {"train_loss": -26.75592613220215, "global_step": 376153, "epoch": 4531} {"train_loss": -26.3731632232666, "global_step": 376154, "epoch": 4531} {"train_loss": -26.329519662512354, "global_step": 376155, "epoch": 4531, "val_loss": 6591827.5} {"train_loss": -22.827299118041992, "global_step": 376156, "epoch": 4532} {"train_loss": -24.3973388671875, "global_step": 376157, "epoch": 4532} {"train_loss": -25.740026473999023, "global_step": 376158, "epoch": 4532} {"train_loss": -25.386768341064453, "global_step": 376159, "epoch": 4532} {"train_loss": -25.110883712768555, "global_step": 376160, "epoch": 4532} {"train_loss": -25.417861938476562, "global_step": 376161, "epoch": 4532} {"train_loss": -25.643583297729492, "global_step": 376162, "epoch": 4532} {"train_loss": -25.265316009521484, "global_step": 376163, "epoch": 4532} {"train_loss": -25.250446319580078, "global_step": 376164, "epoch": 4532} {"train_loss": -25.58150291442871, "global_step": 376165, "epoch": 4532} {"train_loss": -25.7794189453125, "global_step": 376166, "epoch": 4532} {"train_loss": -25.69610595703125, "global_step": 376167, "epoch": 4532} {"train_loss": -25.712060928344727, "global_step": 376168, "epoch": 4532} {"train_loss": -25.7266845703125, "global_step": 376169, "epoch": 4532} {"train_loss": -25.519926071166992, "global_step": 376170, "epoch": 4532} {"train_loss": -26.190753936767578, "global_step": 376171, "epoch": 4532} {"train_loss": -25.7596492767334, "global_step": 376172, "epoch": 4532} {"train_loss": -26.104398727416992, "global_step": 376173, "epoch": 4532} {"train_loss": -25.5869197845459, "global_step": 376174, "epoch": 4532} {"train_loss": -25.880895614624023, "global_step": 376175, "epoch": 4532} {"train_loss": -26.153226852416992, "global_step": 376176, "epoch": 4532} {"train_loss": -25.716266632080078, "global_step": 376177, "epoch": 4532} {"train_loss": -26.077497482299805, "global_step": 376178, "epoch": 4532} {"train_loss": -26.156723022460938, "global_step": 376179, "epoch": 4532} {"train_loss": -26.28474235534668, "global_step": 376180, "epoch": 4532} {"train_loss": -25.8203182220459, "global_step": 376181, "epoch": 4532} {"train_loss": -26.074085235595703, "global_step": 376182, "epoch": 4532} {"train_loss": -26.026636123657227, "global_step": 376183, "epoch": 4532} {"train_loss": -26.269445419311523, "global_step": 376184, "epoch": 4532} {"train_loss": -26.493274688720703, "global_step": 376185, "epoch": 4532} {"train_loss": -26.257246017456055, "global_step": 376186, "epoch": 4532} {"train_loss": -26.091388702392578, "global_step": 376187, "epoch": 4532} {"train_loss": -26.42270278930664, "global_step": 376188, "epoch": 4532} {"train_loss": -26.28204917907715, "global_step": 376189, "epoch": 4532} {"train_loss": -26.447006225585938, "global_step": 376190, "epoch": 4532} {"train_loss": -26.392431259155273, "global_step": 376191, "epoch": 4532} {"train_loss": -26.323627471923828, "global_step": 376192, "epoch": 4532} {"train_loss": -26.329065322875977, "global_step": 376193, "epoch": 4532} {"train_loss": -26.636648178100586, "global_step": 376194, "epoch": 4532} {"train_loss": -25.99757194519043, "global_step": 376195, "epoch": 4532} {"train_loss": -26.2410831451416, "global_step": 376196, "epoch": 4532} {"train_loss": -26.354307174682617, "global_step": 376197, "epoch": 4532} {"train_loss": -26.378767013549805, "global_step": 376198, "epoch": 4532} {"train_loss": -26.166791915893555, "global_step": 376199, "epoch": 4532} {"train_loss": -26.64332389831543, "global_step": 376200, "epoch": 4532} {"train_loss": -26.570693969726562, "global_step": 376201, "epoch": 4532} {"train_loss": -26.587539672851562, "global_step": 376202, "epoch": 4532} {"train_loss": -26.616851806640625, "global_step": 376203, "epoch": 4532} {"train_loss": -26.4783935546875, "global_step": 376204, "epoch": 4532} {"train_loss": -26.543176651000977, "global_step": 376205, "epoch": 4532} {"train_loss": -26.9210205078125, "global_step": 376206, "epoch": 4532} {"train_loss": -26.443525314331055, "global_step": 376207, "epoch": 4532} {"train_loss": -26.476179122924805, "global_step": 376208, "epoch": 4532} {"train_loss": -26.46622657775879, "global_step": 376209, "epoch": 4532} {"train_loss": -26.317209243774414, "global_step": 376210, "epoch": 4532} {"train_loss": -26.24380874633789, "global_step": 376211, "epoch": 4532} {"train_loss": -26.253204345703125, "global_step": 376212, "epoch": 4532} {"train_loss": -26.6021785736084, "global_step": 376213, "epoch": 4532} {"train_loss": -26.446548461914062, "global_step": 376214, "epoch": 4532} {"train_loss": -26.302173614501953, "global_step": 376215, "epoch": 4532} {"train_loss": -26.4318904876709, "global_step": 376216, "epoch": 4532} {"train_loss": -26.454458236694336, "global_step": 376217, "epoch": 4532} {"train_loss": -26.180938720703125, "global_step": 376218, "epoch": 4532} {"train_loss": -26.553085327148438, "global_step": 376219, "epoch": 4532} {"train_loss": -26.226099014282227, "global_step": 376220, "epoch": 4532} {"train_loss": -26.509723663330078, "global_step": 376221, "epoch": 4532} {"train_loss": -26.095754623413086, "global_step": 376222, "epoch": 4532} {"train_loss": -25.35645866394043, "global_step": 376223, "epoch": 4532} {"train_loss": -25.980453491210938, "global_step": 376224, "epoch": 4532} {"train_loss": -26.310705184936523, "global_step": 376225, "epoch": 4532} {"train_loss": -26.191354751586914, "global_step": 376226, "epoch": 4532} {"train_loss": -26.44573402404785, "global_step": 376227, "epoch": 4532} {"train_loss": -26.369653701782227, "global_step": 376228, "epoch": 4532} {"train_loss": -26.204511642456055, "global_step": 376229, "epoch": 4532} {"train_loss": -26.485082626342773, "global_step": 376230, "epoch": 4532} {"train_loss": -26.535419464111328, "global_step": 376231, "epoch": 4532} {"train_loss": -26.618621826171875, "global_step": 376232, "epoch": 4532} {"train_loss": -26.3927059173584, "global_step": 376233, "epoch": 4532} {"train_loss": -26.31134033203125, "global_step": 376234, "epoch": 4532} {"train_loss": -26.4754638671875, "global_step": 376235, "epoch": 4532} {"train_loss": -26.41383934020996, "global_step": 376236, "epoch": 4532} {"train_loss": -26.335315704345703, "global_step": 376237, "epoch": 4532} {"train_loss": -26.10769471777491, "global_step": 376238, "epoch": 4532, "val_loss": 6715011.0} {"train_loss": -26.083932876586914, "global_step": 376239, "epoch": 4533} {"train_loss": -26.10096549987793, "global_step": 376240, "epoch": 4533} {"train_loss": -25.672693252563477, "global_step": 376241, "epoch": 4533} {"train_loss": -26.371231079101562, "global_step": 376242, "epoch": 4533} {"train_loss": -26.04741859436035, "global_step": 376243, "epoch": 4533} {"train_loss": -25.806882858276367, "global_step": 376244, "epoch": 4533} {"train_loss": -26.036945343017578, "global_step": 376245, "epoch": 4533} {"train_loss": -26.2553768157959, "global_step": 376246, "epoch": 4533} {"train_loss": -25.60284996032715, "global_step": 376247, "epoch": 4533} {"train_loss": -25.723196029663086, "global_step": 376248, "epoch": 4533} {"train_loss": -25.85504722595215, "global_step": 376249, "epoch": 4533} {"train_loss": -26.252140045166016, "global_step": 376250, "epoch": 4533} {"train_loss": -25.945575714111328, "global_step": 376251, "epoch": 4533} {"train_loss": -25.7973690032959, "global_step": 376252, "epoch": 4533} {"train_loss": -26.414411544799805, "global_step": 376253, "epoch": 4533} {"train_loss": -26.06830406188965, "global_step": 376254, "epoch": 4533} {"train_loss": -25.785520553588867, "global_step": 376255, "epoch": 4533} {"train_loss": -26.322675704956055, "global_step": 376256, "epoch": 4533} {"train_loss": -26.25245475769043, "global_step": 376257, "epoch": 4533} {"train_loss": -26.3991641998291, "global_step": 376258, "epoch": 4533} {"train_loss": -26.363412857055664, "global_step": 376259, "epoch": 4533} {"train_loss": -26.491622924804688, "global_step": 376260, "epoch": 4533} {"train_loss": -26.381153106689453, "global_step": 376261, "epoch": 4533} {"train_loss": -26.323694229125977, "global_step": 376262, "epoch": 4533} {"train_loss": -26.785751342773438, "global_step": 376263, "epoch": 4533} {"train_loss": -26.333932876586914, "global_step": 376264, "epoch": 4533} {"train_loss": -26.1422119140625, "global_step": 376265, "epoch": 4533} {"train_loss": -26.294309616088867, "global_step": 376266, "epoch": 4533} {"train_loss": -26.27479362487793, "global_step": 376267, "epoch": 4533} {"train_loss": -26.093658447265625, "global_step": 376268, "epoch": 4533} {"train_loss": -26.49932861328125, "global_step": 376269, "epoch": 4533} {"train_loss": -26.10959815979004, "global_step": 376270, "epoch": 4533} {"train_loss": -26.565046310424805, "global_step": 376271, "epoch": 4533} {"train_loss": -26.40484619140625, "global_step": 376272, "epoch": 4533} {"train_loss": -26.517948150634766, "global_step": 376273, "epoch": 4533} {"train_loss": -26.363727569580078, "global_step": 376274, "epoch": 4533} {"train_loss": -26.818387985229492, "global_step": 376275, "epoch": 4533} {"train_loss": -26.834518432617188, "global_step": 376276, "epoch": 4533} {"train_loss": -26.44639015197754, "global_step": 376277, "epoch": 4533} {"train_loss": -26.391651153564453, "global_step": 376278, "epoch": 4533} {"train_loss": -26.3984317779541, "global_step": 376279, "epoch": 4533} {"train_loss": -26.90443229675293, "global_step": 376280, "epoch": 4533} {"train_loss": -26.626096725463867, "global_step": 376281, "epoch": 4533} {"train_loss": -26.515344619750977, "global_step": 376282, "epoch": 4533} {"train_loss": -26.276342391967773, "global_step": 376283, "epoch": 4533} {"train_loss": -26.15887451171875, "global_step": 376284, "epoch": 4533} {"train_loss": -26.299121856689453, "global_step": 376285, "epoch": 4533} {"train_loss": -26.77707290649414, "global_step": 376286, "epoch": 4533} {"train_loss": -26.31929588317871, "global_step": 376287, "epoch": 4533} {"train_loss": -25.967304229736328, "global_step": 376288, "epoch": 4533} {"train_loss": -26.066608428955078, "global_step": 376289, "epoch": 4533} {"train_loss": -26.0263614654541, "global_step": 376290, "epoch": 4533} {"train_loss": -26.4869441986084, "global_step": 376291, "epoch": 4533} {"train_loss": -26.284687042236328, "global_step": 376292, "epoch": 4533} {"train_loss": -26.100433349609375, "global_step": 376293, "epoch": 4533} {"train_loss": -26.572525024414062, "global_step": 376294, "epoch": 4533} {"train_loss": -26.192224502563477, "global_step": 376295, "epoch": 4533} {"train_loss": -26.296283721923828, "global_step": 376296, "epoch": 4533} {"train_loss": -26.89088249206543, "global_step": 376297, "epoch": 4533} {"train_loss": -26.556921005249023, "global_step": 376298, "epoch": 4533} {"train_loss": -26.98369789123535, "global_step": 376299, "epoch": 4533} {"train_loss": -26.152179718017578, "global_step": 376300, "epoch": 4533} {"train_loss": -26.38758659362793, "global_step": 376301, "epoch": 4533} {"train_loss": -26.86492347717285, "global_step": 376302, "epoch": 4533} {"train_loss": -26.435226440429688, "global_step": 376303, "epoch": 4533} {"train_loss": -26.21602439880371, "global_step": 376304, "epoch": 4533} {"train_loss": -26.37860107421875, "global_step": 376305, "epoch": 4533} {"train_loss": -26.22616958618164, "global_step": 376306, "epoch": 4533} {"train_loss": -26.44968032836914, "global_step": 376307, "epoch": 4533} {"train_loss": -26.54033851623535, "global_step": 376308, "epoch": 4533} {"train_loss": -26.5226993560791, "global_step": 376309, "epoch": 4533} {"train_loss": -26.20527458190918, "global_step": 376310, "epoch": 4533} {"train_loss": -26.649625778198242, "global_step": 376311, "epoch": 4533} {"train_loss": -26.480777740478516, "global_step": 376312, "epoch": 4533} {"train_loss": -26.525915145874023, "global_step": 376313, "epoch": 4533} {"train_loss": -26.1939640045166, "global_step": 376314, "epoch": 4533} {"train_loss": -26.584253311157227, "global_step": 376315, "epoch": 4533} {"train_loss": -26.5262508392334, "global_step": 376316, "epoch": 4533} {"train_loss": -26.40983009338379, "global_step": 376317, "epoch": 4533} {"train_loss": -26.892993927001953, "global_step": 376318, "epoch": 4533} {"train_loss": -26.468915939331055, "global_step": 376319, "epoch": 4533} {"train_loss": -26.3776798248291, "global_step": 376320, "epoch": 4533} {"train_loss": -26.34579591865999, "global_step": 376321, "epoch": 4533, "val_loss": 6594882.0} {"train_loss": -25.842395782470703, "global_step": 376322, "epoch": 4534} {"train_loss": -25.229564666748047, "global_step": 376323, "epoch": 4534} {"train_loss": -26.154653549194336, "global_step": 376324, "epoch": 4534} {"train_loss": -26.116247177124023, "global_step": 376325, "epoch": 4534} {"train_loss": -25.391250610351562, "global_step": 376326, "epoch": 4534} {"train_loss": -25.692480087280273, "global_step": 376327, "epoch": 4534} {"train_loss": -26.17513084411621, "global_step": 376328, "epoch": 4534} {"train_loss": -25.888273239135742, "global_step": 376329, "epoch": 4534} {"train_loss": -26.143232345581055, "global_step": 376330, "epoch": 4534} {"train_loss": -25.545679092407227, "global_step": 376331, "epoch": 4534} {"train_loss": -26.139495849609375, "global_step": 376332, "epoch": 4534} {"train_loss": -25.77144432067871, "global_step": 376333, "epoch": 4534} {"train_loss": -25.474782943725586, "global_step": 376334, "epoch": 4534} {"train_loss": -26.049253463745117, "global_step": 376335, "epoch": 4534} {"train_loss": -26.010461807250977, "global_step": 376336, "epoch": 4534} {"train_loss": -26.193750381469727, "global_step": 376337, "epoch": 4534} {"train_loss": -25.651472091674805, "global_step": 376338, "epoch": 4534} {"train_loss": -25.8574161529541, "global_step": 376339, "epoch": 4534} {"train_loss": -26.324249267578125, "global_step": 376340, "epoch": 4534} {"train_loss": -26.168127059936523, "global_step": 376341, "epoch": 4534} {"train_loss": -25.69708251953125, "global_step": 376342, "epoch": 4534} {"train_loss": -26.317426681518555, "global_step": 376343, "epoch": 4534} {"train_loss": -26.105695724487305, "global_step": 376344, "epoch": 4534} {"train_loss": -25.925756454467773, "global_step": 376345, "epoch": 4534} {"train_loss": -26.267078399658203, "global_step": 376346, "epoch": 4534} {"train_loss": -26.393857955932617, "global_step": 376347, "epoch": 4534} {"train_loss": -26.151411056518555, "global_step": 376348, "epoch": 4534} {"train_loss": -26.126867294311523, "global_step": 376349, "epoch": 4534} {"train_loss": -26.013681411743164, "global_step": 376350, "epoch": 4534} {"train_loss": -26.284931182861328, "global_step": 376351, "epoch": 4534} {"train_loss": -26.495452880859375, "global_step": 376352, "epoch": 4534} {"train_loss": -26.429853439331055, "global_step": 376353, "epoch": 4534} {"train_loss": -26.51104736328125, "global_step": 376354, "epoch": 4534} {"train_loss": -26.5980281829834, "global_step": 376355, "epoch": 4534} {"train_loss": -26.47613525390625, "global_step": 376356, "epoch": 4534} {"train_loss": -26.57655143737793, "global_step": 376357, "epoch": 4534} {"train_loss": -26.567218780517578, "global_step": 376358, "epoch": 4534} {"train_loss": -26.561933517456055, "global_step": 376359, "epoch": 4534} {"train_loss": -26.663238525390625, "global_step": 376360, "epoch": 4534} {"train_loss": -26.71257972717285, "global_step": 376361, "epoch": 4534} {"train_loss": -26.624591827392578, "global_step": 376362, "epoch": 4534} {"train_loss": -26.564191818237305, "global_step": 376363, "epoch": 4534} {"train_loss": -26.662689208984375, "global_step": 376364, "epoch": 4534} {"train_loss": -26.381925582885742, "global_step": 376365, "epoch": 4534} {"train_loss": -26.59492301940918, "global_step": 376366, "epoch": 4534} {"train_loss": -26.5369815826416, "global_step": 376367, "epoch": 4534} {"train_loss": -26.602155685424805, "global_step": 376368, "epoch": 4534} {"train_loss": -26.349714279174805, "global_step": 376369, "epoch": 4534} {"train_loss": -26.367521286010742, "global_step": 376370, "epoch": 4534} {"train_loss": -26.425947189331055, "global_step": 376371, "epoch": 4534} {"train_loss": -26.16363525390625, "global_step": 376372, "epoch": 4534} {"train_loss": -26.583478927612305, "global_step": 376373, "epoch": 4534} {"train_loss": -26.15003776550293, "global_step": 376374, "epoch": 4534} {"train_loss": -26.675119400024414, "global_step": 376375, "epoch": 4534} {"train_loss": -26.587610244750977, "global_step": 376376, "epoch": 4534} {"train_loss": -26.70289421081543, "global_step": 376377, "epoch": 4534} {"train_loss": -26.835248947143555, "global_step": 376378, "epoch": 4534} {"train_loss": -26.6306095123291, "global_step": 376379, "epoch": 4534} {"train_loss": -26.483301162719727, "global_step": 376380, "epoch": 4534} {"train_loss": -26.80936622619629, "global_step": 376381, "epoch": 4534} {"train_loss": -26.4348087310791, "global_step": 376382, "epoch": 4534} {"train_loss": -26.637054443359375, "global_step": 376383, "epoch": 4534} {"train_loss": -26.535303115844727, "global_step": 376384, "epoch": 4534} {"train_loss": -26.707651138305664, "global_step": 376385, "epoch": 4534} {"train_loss": -26.4814510345459, "global_step": 376386, "epoch": 4534} {"train_loss": -26.341156005859375, "global_step": 376387, "epoch": 4534} {"train_loss": -26.539127349853516, "global_step": 376388, "epoch": 4534} {"train_loss": -26.55217933654785, "global_step": 376389, "epoch": 4534} {"train_loss": -26.6019229888916, "global_step": 376390, "epoch": 4534} {"train_loss": -26.547229766845703, "global_step": 376391, "epoch": 4534} {"train_loss": -26.575300216674805, "global_step": 376392, "epoch": 4534} {"train_loss": -26.76820945739746, "global_step": 376393, "epoch": 4534} {"train_loss": -26.588422775268555, "global_step": 376394, "epoch": 4534} {"train_loss": -26.24344253540039, "global_step": 376395, "epoch": 4534} {"train_loss": -26.148120880126953, "global_step": 376396, "epoch": 4534} {"train_loss": -25.965356826782227, "global_step": 376397, "epoch": 4534} {"train_loss": -25.97898292541504, "global_step": 376398, "epoch": 4534} {"train_loss": -26.3466854095459, "global_step": 376399, "epoch": 4534} {"train_loss": -26.4473819732666, "global_step": 376400, "epoch": 4534} {"train_loss": -26.60833168029785, "global_step": 376401, "epoch": 4534} {"train_loss": -26.4559268951416, "global_step": 376402, "epoch": 4534} {"train_loss": -26.15863609313965, "global_step": 376403, "epoch": 4534} {"train_loss": -26.299405385212726, "global_step": 376404, "epoch": 4534, "val_loss": 6562321.0} {"train_loss": -25.912567138671875, "global_step": 376405, "epoch": 4535} {"train_loss": -25.932239532470703, "global_step": 376406, "epoch": 4535} {"train_loss": -26.208303451538086, "global_step": 376407, "epoch": 4535} {"train_loss": -26.168119430541992, "global_step": 376408, "epoch": 4535} {"train_loss": -25.53986930847168, "global_step": 376409, "epoch": 4535} {"train_loss": -26.062210083007812, "global_step": 376410, "epoch": 4535} {"train_loss": -25.71662712097168, "global_step": 376411, "epoch": 4535} {"train_loss": -26.043964385986328, "global_step": 376412, "epoch": 4535} {"train_loss": -25.837690353393555, "global_step": 376413, "epoch": 4535} {"train_loss": -26.304418563842773, "global_step": 376414, "epoch": 4535} {"train_loss": -25.919647216796875, "global_step": 376415, "epoch": 4535} {"train_loss": -25.587112426757812, "global_step": 376416, "epoch": 4535} {"train_loss": -25.819915771484375, "global_step": 376417, "epoch": 4535} {"train_loss": -26.078144073486328, "global_step": 376418, "epoch": 4535} {"train_loss": -26.253509521484375, "global_step": 376419, "epoch": 4535} {"train_loss": -25.588315963745117, "global_step": 376420, "epoch": 4535} {"train_loss": -26.217466354370117, "global_step": 376421, "epoch": 4535} {"train_loss": -25.969696044921875, "global_step": 376422, "epoch": 4535} {"train_loss": -25.73695182800293, "global_step": 376423, "epoch": 4535} {"train_loss": -26.020923614501953, "global_step": 376424, "epoch": 4535} {"train_loss": -26.541656494140625, "global_step": 376425, "epoch": 4535} {"train_loss": -26.07366943359375, "global_step": 376426, "epoch": 4535} {"train_loss": -26.364633560180664, "global_step": 376427, "epoch": 4535} {"train_loss": -26.307950973510742, "global_step": 376428, "epoch": 4535} {"train_loss": -26.065305709838867, "global_step": 376429, "epoch": 4535} {"train_loss": -26.199888229370117, "global_step": 376430, "epoch": 4535} {"train_loss": -26.66322898864746, "global_step": 376431, "epoch": 4535} {"train_loss": -26.309967041015625, "global_step": 376432, "epoch": 4535} {"train_loss": -26.56089210510254, "global_step": 376433, "epoch": 4535} {"train_loss": -26.774295806884766, "global_step": 376434, "epoch": 4535} {"train_loss": -26.348230361938477, "global_step": 376435, "epoch": 4535} {"train_loss": -26.238149642944336, "global_step": 376436, "epoch": 4535} {"train_loss": -26.828125, "global_step": 376437, "epoch": 4535} {"train_loss": -26.678159713745117, "global_step": 376438, "epoch": 4535} {"train_loss": -26.111347198486328, "global_step": 376439, "epoch": 4535} {"train_loss": -26.602659225463867, "global_step": 376440, "epoch": 4535} {"train_loss": -26.5826358795166, "global_step": 376441, "epoch": 4535} {"train_loss": -26.287683486938477, "global_step": 376442, "epoch": 4535} {"train_loss": -26.482654571533203, "global_step": 376443, "epoch": 4535} {"train_loss": -26.205087661743164, "global_step": 376444, "epoch": 4535} {"train_loss": -26.51197624206543, "global_step": 376445, "epoch": 4535} {"train_loss": -26.048505783081055, "global_step": 376446, "epoch": 4535} {"train_loss": -26.578500747680664, "global_step": 376447, "epoch": 4535} {"train_loss": -26.525144577026367, "global_step": 376448, "epoch": 4535} {"train_loss": -26.16342544555664, "global_step": 376449, "epoch": 4535} {"train_loss": -26.36142921447754, "global_step": 376450, "epoch": 4535} {"train_loss": -26.166412353515625, "global_step": 376451, "epoch": 4535} {"train_loss": -26.19037437438965, "global_step": 376452, "epoch": 4535} {"train_loss": -26.525583267211914, "global_step": 376453, "epoch": 4535} {"train_loss": -26.626270294189453, "global_step": 376454, "epoch": 4535} {"train_loss": -26.466827392578125, "global_step": 376455, "epoch": 4535} {"train_loss": -26.259979248046875, "global_step": 376456, "epoch": 4535} {"train_loss": -26.46912956237793, "global_step": 376457, "epoch": 4535} {"train_loss": -26.129657745361328, "global_step": 376458, "epoch": 4535} {"train_loss": -26.3787841796875, "global_step": 376459, "epoch": 4535} {"train_loss": -26.35015296936035, "global_step": 376460, "epoch": 4535} {"train_loss": -26.381591796875, "global_step": 376461, "epoch": 4535} {"train_loss": -26.77524757385254, "global_step": 376462, "epoch": 4535} {"train_loss": -26.173053741455078, "global_step": 376463, "epoch": 4535} {"train_loss": -26.2052059173584, "global_step": 376464, "epoch": 4535} {"train_loss": -26.51727294921875, "global_step": 376465, "epoch": 4535} {"train_loss": -27.000446319580078, "global_step": 376466, "epoch": 4535} {"train_loss": -26.544036865234375, "global_step": 376467, "epoch": 4535} {"train_loss": -26.3720703125, "global_step": 376468, "epoch": 4535} {"train_loss": -26.378583908081055, "global_step": 376469, "epoch": 4535} {"train_loss": -26.55256462097168, "global_step": 376470, "epoch": 4535} {"train_loss": -26.670713424682617, "global_step": 376471, "epoch": 4535} {"train_loss": -26.336551666259766, "global_step": 376472, "epoch": 4535} {"train_loss": -26.337650299072266, "global_step": 376473, "epoch": 4535} {"train_loss": -26.435565948486328, "global_step": 376474, "epoch": 4535} {"train_loss": -26.805084228515625, "global_step": 376475, "epoch": 4535} {"train_loss": -26.56446647644043, "global_step": 376476, "epoch": 4535} {"train_loss": -26.40858268737793, "global_step": 376477, "epoch": 4535} {"train_loss": -26.2623233795166, "global_step": 376478, "epoch": 4535} {"train_loss": -26.352340698242188, "global_step": 376479, "epoch": 4535} {"train_loss": -26.637815475463867, "global_step": 376480, "epoch": 4535} {"train_loss": -26.70147132873535, "global_step": 376481, "epoch": 4535} {"train_loss": -26.707061767578125, "global_step": 376482, "epoch": 4535} {"train_loss": -26.620569229125977, "global_step": 376483, "epoch": 4535} {"train_loss": -26.6439151763916, "global_step": 376484, "epoch": 4535} {"train_loss": -26.61185646057129, "global_step": 376485, "epoch": 4535} {"train_loss": -26.57240867614746, "global_step": 376486, "epoch": 4535} {"train_loss": -26.319019110806018, "global_step": 376487, "epoch": 4535, "val_loss": 6575049.0} {"train_loss": -26.357666015625, "global_step": 376488, "epoch": 4536} {"train_loss": -25.822256088256836, "global_step": 376489, "epoch": 4536} {"train_loss": -25.9619083404541, "global_step": 376490, "epoch": 4536} {"train_loss": -25.910297393798828, "global_step": 376491, "epoch": 4536} {"train_loss": -25.84375, "global_step": 376492, "epoch": 4536} {"train_loss": -26.424427032470703, "global_step": 376493, "epoch": 4536} {"train_loss": -26.273193359375, "global_step": 376494, "epoch": 4536} {"train_loss": -26.00806999206543, "global_step": 376495, "epoch": 4536} {"train_loss": -26.307727813720703, "global_step": 376496, "epoch": 4536} {"train_loss": -26.20428466796875, "global_step": 376497, "epoch": 4536} {"train_loss": -25.794361114501953, "global_step": 376498, "epoch": 4536} {"train_loss": -26.2996883392334, "global_step": 376499, "epoch": 4536} {"train_loss": -26.093463897705078, "global_step": 376500, "epoch": 4536} {"train_loss": -25.9819278717041, "global_step": 376501, "epoch": 4536} {"train_loss": -26.19818115234375, "global_step": 376502, "epoch": 4536} {"train_loss": -26.400894165039062, "global_step": 376503, "epoch": 4536} {"train_loss": -26.04044532775879, "global_step": 376504, "epoch": 4536} {"train_loss": -25.974817276000977, "global_step": 376505, "epoch": 4536} {"train_loss": -26.435653686523438, "global_step": 376506, "epoch": 4536} {"train_loss": -25.994171142578125, "global_step": 376507, "epoch": 4536} {"train_loss": -26.628971099853516, "global_step": 376508, "epoch": 4536} {"train_loss": -26.589527130126953, "global_step": 376509, "epoch": 4536} {"train_loss": -26.3807430267334, "global_step": 376510, "epoch": 4536} {"train_loss": -26.63799476623535, "global_step": 376511, "epoch": 4536} {"train_loss": -26.38673973083496, "global_step": 376512, "epoch": 4536} {"train_loss": -26.331165313720703, "global_step": 376513, "epoch": 4536} {"train_loss": -26.832172393798828, "global_step": 376514, "epoch": 4536} {"train_loss": -26.622671127319336, "global_step": 376515, "epoch": 4536} {"train_loss": -26.328351974487305, "global_step": 376516, "epoch": 4536} {"train_loss": -26.43832778930664, "global_step": 376517, "epoch": 4536} {"train_loss": -26.595075607299805, "global_step": 376518, "epoch": 4536} {"train_loss": -26.53997230529785, "global_step": 376519, "epoch": 4536} {"train_loss": -26.25630760192871, "global_step": 376520, "epoch": 4536} {"train_loss": -26.48890495300293, "global_step": 376521, "epoch": 4536} {"train_loss": -26.537647247314453, "global_step": 376522, "epoch": 4536} {"train_loss": -26.522802352905273, "global_step": 376523, "epoch": 4536} {"train_loss": -26.656158447265625, "global_step": 376524, "epoch": 4536} {"train_loss": -26.338226318359375, "global_step": 376525, "epoch": 4536} {"train_loss": -26.498815536499023, "global_step": 376526, "epoch": 4536} {"train_loss": -26.480072021484375, "global_step": 376527, "epoch": 4536} {"train_loss": -26.074737548828125, "global_step": 376528, "epoch": 4536} {"train_loss": -26.32370376586914, "global_step": 376529, "epoch": 4536} {"train_loss": -26.290510177612305, "global_step": 376530, "epoch": 4536} {"train_loss": -26.393157958984375, "global_step": 376531, "epoch": 4536} {"train_loss": -26.51056480407715, "global_step": 376532, "epoch": 4536} {"train_loss": -26.279804229736328, "global_step": 376533, "epoch": 4536} {"train_loss": -26.397146224975586, "global_step": 376534, "epoch": 4536} {"train_loss": -26.20318031311035, "global_step": 376535, "epoch": 4536} {"train_loss": -26.042226791381836, "global_step": 376536, "epoch": 4536} {"train_loss": -26.153736114501953, "global_step": 376537, "epoch": 4536} {"train_loss": -25.812427520751953, "global_step": 376538, "epoch": 4536} {"train_loss": -26.26114845275879, "global_step": 376539, "epoch": 4536} {"train_loss": -26.38356590270996, "global_step": 376540, "epoch": 4536} {"train_loss": -26.1767578125, "global_step": 376541, "epoch": 4536} {"train_loss": -25.997297286987305, "global_step": 376542, "epoch": 4536} {"train_loss": -26.282367706298828, "global_step": 376543, "epoch": 4536} {"train_loss": -26.151708602905273, "global_step": 376544, "epoch": 4536} {"train_loss": -26.280826568603516, "global_step": 376545, "epoch": 4536} {"train_loss": -26.367267608642578, "global_step": 376546, "epoch": 4536} {"train_loss": -26.420995712280273, "global_step": 376547, "epoch": 4536} {"train_loss": -26.542333602905273, "global_step": 376548, "epoch": 4536} {"train_loss": -26.66956901550293, "global_step": 376549, "epoch": 4536} {"train_loss": -26.566909790039062, "global_step": 376550, "epoch": 4536} {"train_loss": -26.52577018737793, "global_step": 376551, "epoch": 4536} {"train_loss": -26.7503719329834, "global_step": 376552, "epoch": 4536} {"train_loss": -26.40594482421875, "global_step": 376553, "epoch": 4536} {"train_loss": -26.4172420501709, "global_step": 376554, "epoch": 4536} {"train_loss": -26.7482967376709, "global_step": 376555, "epoch": 4536} {"train_loss": -26.149673461914062, "global_step": 376556, "epoch": 4536} {"train_loss": -26.910367965698242, "global_step": 376557, "epoch": 4536} {"train_loss": -26.4787654876709, "global_step": 376558, "epoch": 4536} {"train_loss": -26.775745391845703, "global_step": 376559, "epoch": 4536} {"train_loss": -26.4270076751709, "global_step": 376560, "epoch": 4536} {"train_loss": -26.296167373657227, "global_step": 376561, "epoch": 4536} {"train_loss": -26.838586807250977, "global_step": 376562, "epoch": 4536} {"train_loss": -26.4503173828125, "global_step": 376563, "epoch": 4536} {"train_loss": -26.260522842407227, "global_step": 376564, "epoch": 4536} {"train_loss": -26.561681747436523, "global_step": 376565, "epoch": 4536} {"train_loss": -26.501022338867188, "global_step": 376566, "epoch": 4536} {"train_loss": -26.514734268188477, "global_step": 376567, "epoch": 4536} {"train_loss": -26.363489151000977, "global_step": 376568, "epoch": 4536} {"train_loss": -26.769824981689453, "global_step": 376569, "epoch": 4536} {"train_loss": -26.35316138669669, "global_step": 376570, "epoch": 4536, "val_loss": 6620400.0} {"train_loss": -25.233007431030273, "global_step": 376571, "epoch": 4537} {"train_loss": -25.380701065063477, "global_step": 376572, "epoch": 4537} {"train_loss": -25.842422485351562, "global_step": 376573, "epoch": 4537} {"train_loss": -25.482969284057617, "global_step": 376574, "epoch": 4537} {"train_loss": -25.565113067626953, "global_step": 376575, "epoch": 4537} {"train_loss": -25.096250534057617, "global_step": 376576, "epoch": 4537} {"train_loss": -25.758909225463867, "global_step": 376577, "epoch": 4537} {"train_loss": -25.7037353515625, "global_step": 376578, "epoch": 4537} {"train_loss": -25.72890281677246, "global_step": 376579, "epoch": 4537} {"train_loss": -25.469268798828125, "global_step": 376580, "epoch": 4537} {"train_loss": -25.731698989868164, "global_step": 376581, "epoch": 4537} {"train_loss": -25.559871673583984, "global_step": 376582, "epoch": 4537} {"train_loss": -25.496152877807617, "global_step": 376583, "epoch": 4537} {"train_loss": -25.985986709594727, "global_step": 376584, "epoch": 4537} {"train_loss": -25.85127067565918, "global_step": 376585, "epoch": 4537} {"train_loss": -25.62977409362793, "global_step": 376586, "epoch": 4537} {"train_loss": -26.07523536682129, "global_step": 376587, "epoch": 4537} {"train_loss": -25.7562198638916, "global_step": 376588, "epoch": 4537} {"train_loss": -26.1490478515625, "global_step": 376589, "epoch": 4537} {"train_loss": -26.122528076171875, "global_step": 376590, "epoch": 4537} {"train_loss": -25.95139503479004, "global_step": 376591, "epoch": 4537} {"train_loss": -26.05838966369629, "global_step": 376592, "epoch": 4537} {"train_loss": -26.047765731811523, "global_step": 376593, "epoch": 4537} {"train_loss": -26.112890243530273, "global_step": 376594, "epoch": 4537} {"train_loss": -26.096435546875, "global_step": 376595, "epoch": 4537} {"train_loss": -26.225910186767578, "global_step": 376596, "epoch": 4537} {"train_loss": -26.1845645904541, "global_step": 376597, "epoch": 4537} {"train_loss": -25.87774658203125, "global_step": 376598, "epoch": 4537} {"train_loss": -26.175037384033203, "global_step": 376599, "epoch": 4537} {"train_loss": -26.199554443359375, "global_step": 376600, "epoch": 4537} {"train_loss": -26.231555938720703, "global_step": 376601, "epoch": 4537} {"train_loss": -26.117267608642578, "global_step": 376602, "epoch": 4537} {"train_loss": -26.8165340423584, "global_step": 376603, "epoch": 4537} {"train_loss": -26.526838302612305, "global_step": 376604, "epoch": 4537} {"train_loss": -26.171201705932617, "global_step": 376605, "epoch": 4537} {"train_loss": -26.49360466003418, "global_step": 376606, "epoch": 4537} {"train_loss": -26.280942916870117, "global_step": 376607, "epoch": 4537} {"train_loss": -26.666156768798828, "global_step": 376608, "epoch": 4537} {"train_loss": -26.672882080078125, "global_step": 376609, "epoch": 4537} {"train_loss": -26.003305435180664, "global_step": 376610, "epoch": 4537} {"train_loss": -26.630796432495117, "global_step": 376611, "epoch": 4537} {"train_loss": -26.30449867248535, "global_step": 376612, "epoch": 4537} {"train_loss": -26.210880279541016, "global_step": 376613, "epoch": 4537} {"train_loss": -26.260181427001953, "global_step": 376614, "epoch": 4537} {"train_loss": -26.91633415222168, "global_step": 376615, "epoch": 4537} {"train_loss": -26.357168197631836, "global_step": 376616, "epoch": 4537} {"train_loss": -26.776533126831055, "global_step": 376617, "epoch": 4537} {"train_loss": -26.65839958190918, "global_step": 376618, "epoch": 4537} {"train_loss": -26.329511642456055, "global_step": 376619, "epoch": 4537} {"train_loss": -26.333423614501953, "global_step": 376620, "epoch": 4537} {"train_loss": -26.377416610717773, "global_step": 376621, "epoch": 4537} {"train_loss": -26.134801864624023, "global_step": 376622, "epoch": 4537} {"train_loss": -26.21988296508789, "global_step": 376623, "epoch": 4537} {"train_loss": -26.513940811157227, "global_step": 376624, "epoch": 4537} {"train_loss": -26.49480628967285, "global_step": 376625, "epoch": 4537} {"train_loss": -26.24893569946289, "global_step": 376626, "epoch": 4537} {"train_loss": -26.422582626342773, "global_step": 376627, "epoch": 4537} {"train_loss": -26.52937889099121, "global_step": 376628, "epoch": 4537} {"train_loss": -26.366357803344727, "global_step": 376629, "epoch": 4537} {"train_loss": -26.587051391601562, "global_step": 376630, "epoch": 4537} {"train_loss": -26.41436195373535, "global_step": 376631, "epoch": 4537} {"train_loss": -26.51310157775879, "global_step": 376632, "epoch": 4537} {"train_loss": -26.372821807861328, "global_step": 376633, "epoch": 4537} {"train_loss": -26.618066787719727, "global_step": 376634, "epoch": 4537} {"train_loss": -26.150487899780273, "global_step": 376635, "epoch": 4537} {"train_loss": -26.006208419799805, "global_step": 376636, "epoch": 4537} {"train_loss": -26.115995407104492, "global_step": 376637, "epoch": 4537} {"train_loss": -26.509302139282227, "global_step": 376638, "epoch": 4537} {"train_loss": -26.647598266601562, "global_step": 376639, "epoch": 4537} {"train_loss": -25.986352920532227, "global_step": 376640, "epoch": 4537} {"train_loss": -26.119491577148438, "global_step": 376641, "epoch": 4537} {"train_loss": -26.3021240234375, "global_step": 376642, "epoch": 4537} {"train_loss": -26.413572311401367, "global_step": 376643, "epoch": 4537} {"train_loss": -25.985559463500977, "global_step": 376644, "epoch": 4537} {"train_loss": -26.344482421875, "global_step": 376645, "epoch": 4537} {"train_loss": -26.435455322265625, "global_step": 376646, "epoch": 4537} {"train_loss": -26.274076461791992, "global_step": 376647, "epoch": 4537} {"train_loss": -26.337263107299805, "global_step": 376648, "epoch": 4537} {"train_loss": -26.843215942382812, "global_step": 376649, "epoch": 4537} {"train_loss": -26.322912216186523, "global_step": 376650, "epoch": 4537} {"train_loss": -26.27985191345215, "global_step": 376651, "epoch": 4537} {"train_loss": -26.10467529296875, "global_step": 376652, "epoch": 4537} {"train_loss": -26.17892637597509, "global_step": 376653, "epoch": 4537, "val_loss": 6627980.0} {"train_loss": -26.49607276916504, "global_step": 376654, "epoch": 4538} {"train_loss": -26.13313865661621, "global_step": 376655, "epoch": 4538} {"train_loss": -26.143762588500977, "global_step": 376656, "epoch": 4538} {"train_loss": -26.37531852722168, "global_step": 376657, "epoch": 4538} {"train_loss": -26.47086524963379, "global_step": 376658, "epoch": 4538} {"train_loss": -26.2717227935791, "global_step": 376659, "epoch": 4538} {"train_loss": -26.594175338745117, "global_step": 376660, "epoch": 4538} {"train_loss": -26.485748291015625, "global_step": 376661, "epoch": 4538} {"train_loss": -26.424631118774414, "global_step": 376662, "epoch": 4538} {"train_loss": -26.411670684814453, "global_step": 376663, "epoch": 4538} {"train_loss": -26.2667293548584, "global_step": 376664, "epoch": 4538} {"train_loss": -26.623437881469727, "global_step": 376665, "epoch": 4538} {"train_loss": -26.277118682861328, "global_step": 376666, "epoch": 4538} {"train_loss": -26.495264053344727, "global_step": 376667, "epoch": 4538} {"train_loss": -26.306711196899414, "global_step": 376668, "epoch": 4538} {"train_loss": -26.65781593322754, "global_step": 376669, "epoch": 4538} {"train_loss": -26.408445358276367, "global_step": 376670, "epoch": 4538} {"train_loss": -26.607633590698242, "global_step": 376671, "epoch": 4538} {"train_loss": -26.44217872619629, "global_step": 376672, "epoch": 4538} {"train_loss": -26.374570846557617, "global_step": 376673, "epoch": 4538} {"train_loss": -26.291187286376953, "global_step": 376674, "epoch": 4538} {"train_loss": -26.03168296813965, "global_step": 376675, "epoch": 4538} {"train_loss": -26.23370933532715, "global_step": 376676, "epoch": 4538} {"train_loss": -26.461652755737305, "global_step": 376677, "epoch": 4538} {"train_loss": -26.7171688079834, "global_step": 376678, "epoch": 4538} {"train_loss": -26.614282608032227, "global_step": 376679, "epoch": 4538} {"train_loss": -26.449758529663086, "global_step": 376680, "epoch": 4538} {"train_loss": -26.621692657470703, "global_step": 376681, "epoch": 4538} {"train_loss": -26.507709503173828, "global_step": 376682, "epoch": 4538} {"train_loss": -26.434717178344727, "global_step": 376683, "epoch": 4538} {"train_loss": -26.66607666015625, "global_step": 376684, "epoch": 4538} {"train_loss": -26.486963272094727, "global_step": 376685, "epoch": 4538} {"train_loss": -26.27469825744629, "global_step": 376686, "epoch": 4538} {"train_loss": -26.52178382873535, "global_step": 376687, "epoch": 4538} {"train_loss": -26.242273330688477, "global_step": 376688, "epoch": 4538} {"train_loss": -26.576766967773438, "global_step": 376689, "epoch": 4538} {"train_loss": -26.36427116394043, "global_step": 376690, "epoch": 4538} {"train_loss": -26.768354415893555, "global_step": 376691, "epoch": 4538} {"train_loss": -26.528852462768555, "global_step": 376692, "epoch": 4538} {"train_loss": -26.50347900390625, "global_step": 376693, "epoch": 4538} {"train_loss": -26.610986709594727, "global_step": 376694, "epoch": 4538} {"train_loss": -26.3565616607666, "global_step": 376695, "epoch": 4538} {"train_loss": -26.399337768554688, "global_step": 376696, "epoch": 4538} {"train_loss": -26.57200050354004, "global_step": 376697, "epoch": 4538} {"train_loss": -26.281097412109375, "global_step": 376698, "epoch": 4538} {"train_loss": -26.195890426635742, "global_step": 376699, "epoch": 4538} {"train_loss": -26.877737045288086, "global_step": 376700, "epoch": 4538} {"train_loss": -26.20648193359375, "global_step": 376701, "epoch": 4538} {"train_loss": -25.983768463134766, "global_step": 376702, "epoch": 4538} {"train_loss": -26.281721115112305, "global_step": 376703, "epoch": 4538} {"train_loss": -26.549224853515625, "global_step": 376704, "epoch": 4538} {"train_loss": -26.46478271484375, "global_step": 376705, "epoch": 4538} {"train_loss": -26.338239669799805, "global_step": 376706, "epoch": 4538} {"train_loss": -26.48781394958496, "global_step": 376707, "epoch": 4538} {"train_loss": -26.282230377197266, "global_step": 376708, "epoch": 4538} {"train_loss": -26.345489501953125, "global_step": 376709, "epoch": 4538} {"train_loss": -26.44586181640625, "global_step": 376710, "epoch": 4538} {"train_loss": -26.080961227416992, "global_step": 376711, "epoch": 4538} {"train_loss": -26.07602882385254, "global_step": 376712, "epoch": 4538} {"train_loss": -26.218549728393555, "global_step": 376713, "epoch": 4538} {"train_loss": -26.40680503845215, "global_step": 376714, "epoch": 4538} {"train_loss": -26.477819442749023, "global_step": 376715, "epoch": 4538} {"train_loss": -26.402219772338867, "global_step": 376716, "epoch": 4538} {"train_loss": -26.30694580078125, "global_step": 376717, "epoch": 4538} {"train_loss": -26.360685348510742, "global_step": 376718, "epoch": 4538} {"train_loss": -26.224185943603516, "global_step": 376719, "epoch": 4538} {"train_loss": -27.0101318359375, "global_step": 376720, "epoch": 4538} {"train_loss": -26.458093643188477, "global_step": 376721, "epoch": 4538} {"train_loss": -26.30057716369629, "global_step": 376722, "epoch": 4538} {"train_loss": -26.282703399658203, "global_step": 376723, "epoch": 4538} {"train_loss": -26.433629989624023, "global_step": 376724, "epoch": 4538} {"train_loss": -26.40764808654785, "global_step": 376725, "epoch": 4538} {"train_loss": -26.23605728149414, "global_step": 376726, "epoch": 4538} {"train_loss": -25.76612663269043, "global_step": 376727, "epoch": 4538} {"train_loss": -26.47144889831543, "global_step": 376728, "epoch": 4538} {"train_loss": -26.249679565429688, "global_step": 376729, "epoch": 4538} {"train_loss": -26.278827667236328, "global_step": 376730, "epoch": 4538} {"train_loss": -26.2922420501709, "global_step": 376731, "epoch": 4538} {"train_loss": -26.6152400970459, "global_step": 376732, "epoch": 4538} {"train_loss": -26.4195613861084, "global_step": 376733, "epoch": 4538} {"train_loss": -26.9105281829834, "global_step": 376734, "epoch": 4538} {"train_loss": -26.202259063720703, "global_step": 376735, "epoch": 4538} {"train_loss": -26.40292321630271, "global_step": 376736, "epoch": 4538, "val_loss": 6592429.5} {"train_loss": -25.95270347595215, "global_step": 376737, "epoch": 4539} {"train_loss": -25.640287399291992, "global_step": 376738, "epoch": 4539} {"train_loss": -25.702489852905273, "global_step": 376739, "epoch": 4539} {"train_loss": -26.547666549682617, "global_step": 376740, "epoch": 4539} {"train_loss": -25.52593231201172, "global_step": 376741, "epoch": 4539} {"train_loss": -25.952184677124023, "global_step": 376742, "epoch": 4539} {"train_loss": -26.28977394104004, "global_step": 376743, "epoch": 4539} {"train_loss": -26.377614974975586, "global_step": 376744, "epoch": 4539} {"train_loss": -26.110998153686523, "global_step": 376745, "epoch": 4539} {"train_loss": -26.09305191040039, "global_step": 376746, "epoch": 4539} {"train_loss": -26.280776977539062, "global_step": 376747, "epoch": 4539} {"train_loss": -26.1174259185791, "global_step": 376748, "epoch": 4539} {"train_loss": -26.535634994506836, "global_step": 376749, "epoch": 4539} {"train_loss": -26.489410400390625, "global_step": 376750, "epoch": 4539} {"train_loss": -26.1054744720459, "global_step": 376751, "epoch": 4539} {"train_loss": -26.18779945373535, "global_step": 376752, "epoch": 4539} {"train_loss": -26.527685165405273, "global_step": 376753, "epoch": 4539} {"train_loss": -26.23809242248535, "global_step": 376754, "epoch": 4539} {"train_loss": -26.155492782592773, "global_step": 376755, "epoch": 4539} {"train_loss": -26.77593421936035, "global_step": 376756, "epoch": 4539} {"train_loss": -26.465612411499023, "global_step": 376757, "epoch": 4539} {"train_loss": -26.896900177001953, "global_step": 376758, "epoch": 4539} {"train_loss": -26.428319931030273, "global_step": 376759, "epoch": 4539} {"train_loss": -26.337156295776367, "global_step": 376760, "epoch": 4539} {"train_loss": -26.052331924438477, "global_step": 376761, "epoch": 4539} {"train_loss": -25.99468421936035, "global_step": 376762, "epoch": 4539} {"train_loss": -26.382177352905273, "global_step": 376763, "epoch": 4539} {"train_loss": -26.459766387939453, "global_step": 376764, "epoch": 4539} {"train_loss": -26.605304718017578, "global_step": 376765, "epoch": 4539} {"train_loss": -26.34370994567871, "global_step": 376766, "epoch": 4539} {"train_loss": -26.092670440673828, "global_step": 376767, "epoch": 4539} {"train_loss": -26.690418243408203, "global_step": 376768, "epoch": 4539} {"train_loss": -26.510822296142578, "global_step": 376769, "epoch": 4539} {"train_loss": -26.31842041015625, "global_step": 376770, "epoch": 4539} {"train_loss": -26.586807250976562, "global_step": 376771, "epoch": 4539} {"train_loss": -26.615005493164062, "global_step": 376772, "epoch": 4539} {"train_loss": -26.386154174804688, "global_step": 376773, "epoch": 4539} {"train_loss": -26.172748565673828, "global_step": 376774, "epoch": 4539} {"train_loss": -26.73299217224121, "global_step": 376775, "epoch": 4539} {"train_loss": -26.481653213500977, "global_step": 376776, "epoch": 4539} {"train_loss": -26.570276260375977, "global_step": 376777, "epoch": 4539} {"train_loss": -26.078964233398438, "global_step": 376778, "epoch": 4539} {"train_loss": -26.5346622467041, "global_step": 376779, "epoch": 4539} {"train_loss": -26.352502822875977, "global_step": 376780, "epoch": 4539} {"train_loss": -26.26856803894043, "global_step": 376781, "epoch": 4539} {"train_loss": -26.228042602539062, "global_step": 376782, "epoch": 4539} {"train_loss": -26.275766372680664, "global_step": 376783, "epoch": 4539} {"train_loss": -26.249128341674805, "global_step": 376784, "epoch": 4539} {"train_loss": -26.791425704956055, "global_step": 376785, "epoch": 4539} {"train_loss": -26.364307403564453, "global_step": 376786, "epoch": 4539} {"train_loss": -26.680068969726562, "global_step": 376787, "epoch": 4539} {"train_loss": -26.190351486206055, "global_step": 376788, "epoch": 4539} {"train_loss": -26.28570556640625, "global_step": 376789, "epoch": 4539} {"train_loss": -26.37701988220215, "global_step": 376790, "epoch": 4539} {"train_loss": -26.68952751159668, "global_step": 376791, "epoch": 4539} {"train_loss": -26.507495880126953, "global_step": 376792, "epoch": 4539} {"train_loss": -26.422119140625, "global_step": 376793, "epoch": 4539} {"train_loss": -26.925886154174805, "global_step": 376794, "epoch": 4539} {"train_loss": -26.37619400024414, "global_step": 376795, "epoch": 4539} {"train_loss": -26.27247428894043, "global_step": 376796, "epoch": 4539} {"train_loss": -27.003437042236328, "global_step": 376797, "epoch": 4539} {"train_loss": -26.477380752563477, "global_step": 376798, "epoch": 4539} {"train_loss": -26.18136978149414, "global_step": 376799, "epoch": 4539} {"train_loss": -26.138486862182617, "global_step": 376800, "epoch": 4539} {"train_loss": -26.75493812561035, "global_step": 376801, "epoch": 4539} {"train_loss": -26.143787384033203, "global_step": 376802, "epoch": 4539} {"train_loss": -26.04620933532715, "global_step": 376803, "epoch": 4539} {"train_loss": -26.05402183532715, "global_step": 376804, "epoch": 4539} {"train_loss": -26.366174697875977, "global_step": 376805, "epoch": 4539} {"train_loss": -26.433385848999023, "global_step": 376806, "epoch": 4539} {"train_loss": -26.660364151000977, "global_step": 376807, "epoch": 4539} {"train_loss": -26.776037216186523, "global_step": 376808, "epoch": 4539} {"train_loss": -26.476774215698242, "global_step": 376809, "epoch": 4539} {"train_loss": -26.284164428710938, "global_step": 376810, "epoch": 4539} {"train_loss": -26.258453369140625, "global_step": 376811, "epoch": 4539} {"train_loss": -26.208484649658203, "global_step": 376812, "epoch": 4539} {"train_loss": -25.93755531311035, "global_step": 376813, "epoch": 4539} {"train_loss": -26.158859252929688, "global_step": 376814, "epoch": 4539} {"train_loss": -26.626667022705078, "global_step": 376815, "epoch": 4539} {"train_loss": -26.586408615112305, "global_step": 376816, "epoch": 4539} {"train_loss": -26.371292114257812, "global_step": 376817, "epoch": 4539} {"train_loss": -26.404438018798828, "global_step": 376818, "epoch": 4539} {"train_loss": -26.352272906935358, "global_step": 376819, "epoch": 4539, "val_loss": 6698999.0} {"train_loss": -25.583555221557617, "global_step": 376820, "epoch": 4540} {"train_loss": -25.69053077697754, "global_step": 376821, "epoch": 4540} {"train_loss": -25.700109481811523, "global_step": 376822, "epoch": 4540} {"train_loss": -25.825607299804688, "global_step": 376823, "epoch": 4540} {"train_loss": -26.183353424072266, "global_step": 376824, "epoch": 4540} {"train_loss": -25.90399742126465, "global_step": 376825, "epoch": 4540} {"train_loss": -26.133703231811523, "global_step": 376826, "epoch": 4540} {"train_loss": -26.02338981628418, "global_step": 376827, "epoch": 4540} {"train_loss": -26.3076229095459, "global_step": 376828, "epoch": 4540} {"train_loss": -26.333911895751953, "global_step": 376829, "epoch": 4540} {"train_loss": -26.1208553314209, "global_step": 376830, "epoch": 4540} {"train_loss": -26.271448135375977, "global_step": 376831, "epoch": 4540} {"train_loss": -26.428674697875977, "global_step": 376832, "epoch": 4540} {"train_loss": -26.101736068725586, "global_step": 376833, "epoch": 4540} {"train_loss": -26.332489013671875, "global_step": 376834, "epoch": 4540} {"train_loss": -26.42732048034668, "global_step": 376835, "epoch": 4540} {"train_loss": -26.26824951171875, "global_step": 376836, "epoch": 4540} {"train_loss": -26.127548217773438, "global_step": 376837, "epoch": 4540} {"train_loss": -26.460895538330078, "global_step": 376838, "epoch": 4540} {"train_loss": -25.957538604736328, "global_step": 376839, "epoch": 4540} {"train_loss": -26.264591217041016, "global_step": 376840, "epoch": 4540} {"train_loss": -26.444753646850586, "global_step": 376841, "epoch": 4540} {"train_loss": -26.394668579101562, "global_step": 376842, "epoch": 4540} {"train_loss": -26.308197021484375, "global_step": 376843, "epoch": 4540} {"train_loss": -26.54705810546875, "global_step": 376844, "epoch": 4540} {"train_loss": -26.571125030517578, "global_step": 376845, "epoch": 4540} {"train_loss": -26.199481964111328, "global_step": 376846, "epoch": 4540} {"train_loss": -26.719022750854492, "global_step": 376847, "epoch": 4540} {"train_loss": -26.65228271484375, "global_step": 376848, "epoch": 4540} {"train_loss": -26.46416664123535, "global_step": 376849, "epoch": 4540} {"train_loss": -26.817113876342773, "global_step": 376850, "epoch": 4540} {"train_loss": -26.426025390625, "global_step": 376851, "epoch": 4540} {"train_loss": -26.77631187438965, "global_step": 376852, "epoch": 4540} {"train_loss": -26.801061630249023, "global_step": 376853, "epoch": 4540} {"train_loss": -26.36317253112793, "global_step": 376854, "epoch": 4540} {"train_loss": -26.607275009155273, "global_step": 376855, "epoch": 4540} {"train_loss": -26.697711944580078, "global_step": 376856, "epoch": 4540} {"train_loss": -26.87982177734375, "global_step": 376857, "epoch": 4540} {"train_loss": -26.67396354675293, "global_step": 376858, "epoch": 4540} {"train_loss": -26.905790328979492, "global_step": 376859, "epoch": 4540} {"train_loss": -26.952787399291992, "global_step": 376860, "epoch": 4540} {"train_loss": -26.70366859436035, "global_step": 376861, "epoch": 4540} {"train_loss": -26.63909339904785, "global_step": 376862, "epoch": 4540} {"train_loss": -26.579345703125, "global_step": 376863, "epoch": 4540} {"train_loss": -26.65681266784668, "global_step": 376864, "epoch": 4540} {"train_loss": -26.63502311706543, "global_step": 376865, "epoch": 4540} {"train_loss": -26.091211318969727, "global_step": 376866, "epoch": 4540} {"train_loss": -26.33961296081543, "global_step": 376867, "epoch": 4540} {"train_loss": -26.640066146850586, "global_step": 376868, "epoch": 4540} {"train_loss": -26.4288330078125, "global_step": 376869, "epoch": 4540} {"train_loss": -26.411151885986328, "global_step": 376870, "epoch": 4540} {"train_loss": -26.43638038635254, "global_step": 376871, "epoch": 4540} {"train_loss": -25.946542739868164, "global_step": 376872, "epoch": 4540} {"train_loss": -25.438058853149414, "global_step": 376873, "epoch": 4540} {"train_loss": -26.392099380493164, "global_step": 376874, "epoch": 4540} {"train_loss": -26.841144561767578, "global_step": 376875, "epoch": 4540} {"train_loss": -26.44400978088379, "global_step": 376876, "epoch": 4540} {"train_loss": -26.428329467773438, "global_step": 376877, "epoch": 4540} {"train_loss": -25.816797256469727, "global_step": 376878, "epoch": 4540} {"train_loss": -26.05470085144043, "global_step": 376879, "epoch": 4540} {"train_loss": -25.492929458618164, "global_step": 376880, "epoch": 4540} {"train_loss": -25.81412696838379, "global_step": 376881, "epoch": 4540} {"train_loss": -26.446069717407227, "global_step": 376882, "epoch": 4540} {"train_loss": -26.134124755859375, "global_step": 376883, "epoch": 4540} {"train_loss": -26.1124210357666, "global_step": 376884, "epoch": 4540} {"train_loss": -26.174457550048828, "global_step": 376885, "epoch": 4540} {"train_loss": -26.154525756835938, "global_step": 376886, "epoch": 4540} {"train_loss": -26.069766998291016, "global_step": 376887, "epoch": 4540} {"train_loss": -26.1989688873291, "global_step": 376888, "epoch": 4540} {"train_loss": -26.0123348236084, "global_step": 376889, "epoch": 4540} {"train_loss": -26.606740951538086, "global_step": 376890, "epoch": 4540} {"train_loss": -26.548986434936523, "global_step": 376891, "epoch": 4540} {"train_loss": -26.20778465270996, "global_step": 376892, "epoch": 4540} {"train_loss": -26.467090606689453, "global_step": 376893, "epoch": 4540} {"train_loss": -26.400409698486328, "global_step": 376894, "epoch": 4540} {"train_loss": -26.307342529296875, "global_step": 376895, "epoch": 4540} {"train_loss": -26.1912899017334, "global_step": 376896, "epoch": 4540} {"train_loss": -26.735260009765625, "global_step": 376897, "epoch": 4540} {"train_loss": -26.295068740844727, "global_step": 376898, "epoch": 4540} {"train_loss": -26.675168991088867, "global_step": 376899, "epoch": 4540} {"train_loss": -26.195819854736328, "global_step": 376900, "epoch": 4540} {"train_loss": -26.57891273498535, "global_step": 376901, "epoch": 4540} {"train_loss": -26.334770754159216, "global_step": 376902, "epoch": 4540, "val_loss": 6620314.0} {"train_loss": -26.285327911376953, "global_step": 376903, "epoch": 4541} {"train_loss": -26.15437126159668, "global_step": 376904, "epoch": 4541} {"train_loss": -25.95502281188965, "global_step": 376905, "epoch": 4541} {"train_loss": -26.324787139892578, "global_step": 376906, "epoch": 4541} {"train_loss": -25.800525665283203, "global_step": 376907, "epoch": 4541} {"train_loss": -25.824726104736328, "global_step": 376908, "epoch": 4541} {"train_loss": -25.8290958404541, "global_step": 376909, "epoch": 4541} {"train_loss": -26.556293487548828, "global_step": 376910, "epoch": 4541} {"train_loss": -26.38735008239746, "global_step": 376911, "epoch": 4541} {"train_loss": -26.187149047851562, "global_step": 376912, "epoch": 4541} {"train_loss": -26.13295555114746, "global_step": 376913, "epoch": 4541} {"train_loss": -26.150999069213867, "global_step": 376914, "epoch": 4541} {"train_loss": -26.0137882232666, "global_step": 376915, "epoch": 4541} {"train_loss": -26.141586303710938, "global_step": 376916, "epoch": 4541} {"train_loss": -26.345800399780273, "global_step": 376917, "epoch": 4541} {"train_loss": -26.43580436706543, "global_step": 376918, "epoch": 4541} {"train_loss": -26.28814125061035, "global_step": 376919, "epoch": 4541} {"train_loss": -26.61273193359375, "global_step": 376920, "epoch": 4541} {"train_loss": -26.1806697845459, "global_step": 376921, "epoch": 4541} {"train_loss": -26.39896011352539, "global_step": 376922, "epoch": 4541} {"train_loss": -26.4881591796875, "global_step": 376923, "epoch": 4541} {"train_loss": -26.2723445892334, "global_step": 376924, "epoch": 4541} {"train_loss": -26.328479766845703, "global_step": 376925, "epoch": 4541} {"train_loss": -26.1859073638916, "global_step": 376926, "epoch": 4541} {"train_loss": -26.703510284423828, "global_step": 376927, "epoch": 4541} {"train_loss": -26.5334529876709, "global_step": 376928, "epoch": 4541} {"train_loss": -26.412906646728516, "global_step": 376929, "epoch": 4541} {"train_loss": -26.740320205688477, "global_step": 376930, "epoch": 4541} {"train_loss": -26.66497802734375, "global_step": 376931, "epoch": 4541} {"train_loss": -26.780088424682617, "global_step": 376932, "epoch": 4541} {"train_loss": -26.398061752319336, "global_step": 376933, "epoch": 4541} {"train_loss": -26.641986846923828, "global_step": 376934, "epoch": 4541} {"train_loss": -26.232929229736328, "global_step": 376935, "epoch": 4541} {"train_loss": -26.737812042236328, "global_step": 376936, "epoch": 4541} {"train_loss": -26.195697784423828, "global_step": 376937, "epoch": 4541} {"train_loss": -26.307966232299805, "global_step": 376938, "epoch": 4541} {"train_loss": -26.179443359375, "global_step": 376939, "epoch": 4541} {"train_loss": -26.7005672454834, "global_step": 376940, "epoch": 4541} {"train_loss": -26.661701202392578, "global_step": 376941, "epoch": 4541} {"train_loss": -26.287891387939453, "global_step": 376942, "epoch": 4541} {"train_loss": -26.245527267456055, "global_step": 376943, "epoch": 4541} {"train_loss": -26.2893123626709, "global_step": 376944, "epoch": 4541} {"train_loss": -26.26995277404785, "global_step": 376945, "epoch": 4541} {"train_loss": -26.6331844329834, "global_step": 376946, "epoch": 4541} {"train_loss": -26.282575607299805, "global_step": 376947, "epoch": 4541} {"train_loss": -26.431232452392578, "global_step": 376948, "epoch": 4541} {"train_loss": -26.56043815612793, "global_step": 376949, "epoch": 4541} {"train_loss": -26.249738693237305, "global_step": 376950, "epoch": 4541} {"train_loss": -26.435871124267578, "global_step": 376951, "epoch": 4541} {"train_loss": -26.42780113220215, "global_step": 376952, "epoch": 4541} {"train_loss": -26.291040420532227, "global_step": 376953, "epoch": 4541} {"train_loss": -26.460205078125, "global_step": 376954, "epoch": 4541} {"train_loss": -26.23495864868164, "global_step": 376955, "epoch": 4541} {"train_loss": -26.453153610229492, "global_step": 376956, "epoch": 4541} {"train_loss": -26.13380241394043, "global_step": 376957, "epoch": 4541} {"train_loss": -26.49057388305664, "global_step": 376958, "epoch": 4541} {"train_loss": -26.187137603759766, "global_step": 376959, "epoch": 4541} {"train_loss": -26.13258171081543, "global_step": 376960, "epoch": 4541} {"train_loss": -26.47205924987793, "global_step": 376961, "epoch": 4541} {"train_loss": -26.06500816345215, "global_step": 376962, "epoch": 4541} {"train_loss": -26.104740142822266, "global_step": 376963, "epoch": 4541} {"train_loss": -26.411788940429688, "global_step": 376964, "epoch": 4541} {"train_loss": -26.307819366455078, "global_step": 376965, "epoch": 4541} {"train_loss": -26.20680046081543, "global_step": 376966, "epoch": 4541} {"train_loss": -26.3326358795166, "global_step": 376967, "epoch": 4541} {"train_loss": -26.35251235961914, "global_step": 376968, "epoch": 4541} {"train_loss": -26.460309982299805, "global_step": 376969, "epoch": 4541} {"train_loss": -25.849340438842773, "global_step": 376970, "epoch": 4541} {"train_loss": -26.3095645904541, "global_step": 376971, "epoch": 4541} {"train_loss": -26.05417823791504, "global_step": 376972, "epoch": 4541} {"train_loss": -26.34029197692871, "global_step": 376973, "epoch": 4541} {"train_loss": -26.731143951416016, "global_step": 376974, "epoch": 4541} {"train_loss": -26.049345016479492, "global_step": 376975, "epoch": 4541} {"train_loss": -26.39215087890625, "global_step": 376976, "epoch": 4541} {"train_loss": -26.26093864440918, "global_step": 376977, "epoch": 4541} {"train_loss": -26.710742950439453, "global_step": 376978, "epoch": 4541} {"train_loss": -26.33810806274414, "global_step": 376979, "epoch": 4541} {"train_loss": -26.214818954467773, "global_step": 376980, "epoch": 4541} {"train_loss": -26.639371871948242, "global_step": 376981, "epoch": 4541} {"train_loss": -26.191909790039062, "global_step": 376982, "epoch": 4541} {"train_loss": -26.408395767211914, "global_step": 376983, "epoch": 4541} {"train_loss": -26.404767990112305, "global_step": 376984, "epoch": 4541} {"train_loss": -26.344065769609198, "global_step": 376985, "epoch": 4541, "val_loss": 6540408.0} {"train_loss": -25.92138671875, "global_step": 376986, "epoch": 4542} {"train_loss": -24.94074058532715, "global_step": 376987, "epoch": 4542} {"train_loss": -25.646076202392578, "global_step": 376988, "epoch": 4542} {"train_loss": -25.5711669921875, "global_step": 376989, "epoch": 4542} {"train_loss": -25.534027099609375, "global_step": 376990, "epoch": 4542} {"train_loss": -25.71755027770996, "global_step": 376991, "epoch": 4542} {"train_loss": -26.166004180908203, "global_step": 376992, "epoch": 4542} {"train_loss": -25.410842895507812, "global_step": 376993, "epoch": 4542} {"train_loss": -25.902379989624023, "global_step": 376994, "epoch": 4542} {"train_loss": -26.01569938659668, "global_step": 376995, "epoch": 4542} {"train_loss": -25.9979190826416, "global_step": 376996, "epoch": 4542} {"train_loss": -25.94816017150879, "global_step": 376997, "epoch": 4542} {"train_loss": -25.973119735717773, "global_step": 376998, "epoch": 4542} {"train_loss": -26.045129776000977, "global_step": 376999, "epoch": 4542} {"train_loss": -26.15895652770996, "global_step": 377000, "epoch": 4542} {"train_loss": -26.44569206237793, "global_step": 377001, "epoch": 4542} {"train_loss": -26.24942398071289, "global_step": 377002, "epoch": 4542} {"train_loss": -25.868289947509766, "global_step": 377003, "epoch": 4542} {"train_loss": -26.26104164123535, "global_step": 377004, "epoch": 4542} {"train_loss": -25.482385635375977, "global_step": 377005, "epoch": 4542} {"train_loss": -26.1721134185791, "global_step": 377006, "epoch": 4542} {"train_loss": -26.288015365600586, "global_step": 377007, "epoch": 4542} {"train_loss": -26.457014083862305, "global_step": 377008, "epoch": 4542} {"train_loss": -25.900625228881836, "global_step": 377009, "epoch": 4542} {"train_loss": -25.917516708374023, "global_step": 377010, "epoch": 4542} {"train_loss": -26.509870529174805, "global_step": 377011, "epoch": 4542} {"train_loss": -26.310850143432617, "global_step": 377012, "epoch": 4542} {"train_loss": -26.34766960144043, "global_step": 377013, "epoch": 4542} {"train_loss": -26.21608543395996, "global_step": 377014, "epoch": 4542} {"train_loss": -26.371103286743164, "global_step": 377015, "epoch": 4542} {"train_loss": -26.453031539916992, "global_step": 377016, "epoch": 4542} {"train_loss": -26.48711585998535, "global_step": 377017, "epoch": 4542} {"train_loss": -26.48079490661621, "global_step": 377018, "epoch": 4542} {"train_loss": -26.328872680664062, "global_step": 377019, "epoch": 4542} {"train_loss": -26.58211326599121, "global_step": 377020, "epoch": 4542} {"train_loss": -26.494281768798828, "global_step": 377021, "epoch": 4542} {"train_loss": -26.572269439697266, "global_step": 377022, "epoch": 4542} {"train_loss": -26.339832305908203, "global_step": 377023, "epoch": 4542} {"train_loss": -26.329233169555664, "global_step": 377024, "epoch": 4542} {"train_loss": -26.389684677124023, "global_step": 377025, "epoch": 4542} {"train_loss": -26.772174835205078, "global_step": 377026, "epoch": 4542} {"train_loss": -26.722177505493164, "global_step": 377027, "epoch": 4542} {"train_loss": -26.405216217041016, "global_step": 377028, "epoch": 4542} {"train_loss": -26.706317901611328, "global_step": 377029, "epoch": 4542} {"train_loss": -26.77396583557129, "global_step": 377030, "epoch": 4542} {"train_loss": -26.7792911529541, "global_step": 377031, "epoch": 4542} {"train_loss": -26.804101943969727, "global_step": 377032, "epoch": 4542} {"train_loss": -26.590124130249023, "global_step": 377033, "epoch": 4542} {"train_loss": -26.62471580505371, "global_step": 377034, "epoch": 4542} {"train_loss": -26.561206817626953, "global_step": 377035, "epoch": 4542} {"train_loss": -26.662107467651367, "global_step": 377036, "epoch": 4542} {"train_loss": -26.5616512298584, "global_step": 377037, "epoch": 4542} {"train_loss": -26.686262130737305, "global_step": 377038, "epoch": 4542} {"train_loss": -26.545751571655273, "global_step": 377039, "epoch": 4542} {"train_loss": -26.849994659423828, "global_step": 377040, "epoch": 4542} {"train_loss": -26.153717041015625, "global_step": 377041, "epoch": 4542} {"train_loss": -26.442508697509766, "global_step": 377042, "epoch": 4542} {"train_loss": -26.627185821533203, "global_step": 377043, "epoch": 4542} {"train_loss": -26.352109909057617, "global_step": 377044, "epoch": 4542} {"train_loss": -26.692153930664062, "global_step": 377045, "epoch": 4542} {"train_loss": -26.71693229675293, "global_step": 377046, "epoch": 4542} {"train_loss": -26.44289207458496, "global_step": 377047, "epoch": 4542} {"train_loss": -26.49054527282715, "global_step": 377048, "epoch": 4542} {"train_loss": -26.456052780151367, "global_step": 377049, "epoch": 4542} {"train_loss": -26.61151695251465, "global_step": 377050, "epoch": 4542} {"train_loss": -26.36427879333496, "global_step": 377051, "epoch": 4542} {"train_loss": -25.926969528198242, "global_step": 377052, "epoch": 4542} {"train_loss": -25.632360458374023, "global_step": 377053, "epoch": 4542} {"train_loss": -25.471881866455078, "global_step": 377054, "epoch": 4542} {"train_loss": -25.87158203125, "global_step": 377055, "epoch": 4542} {"train_loss": -26.022104263305664, "global_step": 377056, "epoch": 4542} {"train_loss": -25.793371200561523, "global_step": 377057, "epoch": 4542} {"train_loss": -25.868377685546875, "global_step": 377058, "epoch": 4542} {"train_loss": -26.37628173828125, "global_step": 377059, "epoch": 4542} {"train_loss": -26.242868423461914, "global_step": 377060, "epoch": 4542} {"train_loss": -26.12794303894043, "global_step": 377061, "epoch": 4542} {"train_loss": -26.284101486206055, "global_step": 377062, "epoch": 4542} {"train_loss": -26.23193359375, "global_step": 377063, "epoch": 4542} {"train_loss": -26.581069946289062, "global_step": 377064, "epoch": 4542} {"train_loss": -26.22553062438965, "global_step": 377065, "epoch": 4542} {"train_loss": -26.274463653564453, "global_step": 377066, "epoch": 4542} {"train_loss": -26.41499137878418, "global_step": 377067, "epoch": 4542} {"train_loss": -26.253389059779156, "global_step": 377068, "epoch": 4542, "val_loss": 6670267.5} {"train_loss": -25.854028701782227, "global_step": 377069, "epoch": 4543} {"train_loss": -25.50836753845215, "global_step": 377070, "epoch": 4543} {"train_loss": -26.0588321685791, "global_step": 377071, "epoch": 4543} {"train_loss": -25.7427978515625, "global_step": 377072, "epoch": 4543} {"train_loss": -25.870046615600586, "global_step": 377073, "epoch": 4543} {"train_loss": -25.884252548217773, "global_step": 377074, "epoch": 4543} {"train_loss": -25.816442489624023, "global_step": 377075, "epoch": 4543} {"train_loss": -26.129011154174805, "global_step": 377076, "epoch": 4543} {"train_loss": -25.7995662689209, "global_step": 377077, "epoch": 4543} {"train_loss": -25.6671085357666, "global_step": 377078, "epoch": 4543} {"train_loss": -26.30521583557129, "global_step": 377079, "epoch": 4543} {"train_loss": -25.831878662109375, "global_step": 377080, "epoch": 4543} {"train_loss": -25.511892318725586, "global_step": 377081, "epoch": 4543} {"train_loss": -26.306640625, "global_step": 377082, "epoch": 4543} {"train_loss": -26.205663681030273, "global_step": 377083, "epoch": 4543} {"train_loss": -25.95196533203125, "global_step": 377084, "epoch": 4543} {"train_loss": -26.003894805908203, "global_step": 377085, "epoch": 4543} {"train_loss": -26.31580924987793, "global_step": 377086, "epoch": 4543} {"train_loss": -26.037933349609375, "global_step": 377087, "epoch": 4543} {"train_loss": -25.944257736206055, "global_step": 377088, "epoch": 4543} {"train_loss": -26.33989906311035, "global_step": 377089, "epoch": 4543} {"train_loss": -25.714155197143555, "global_step": 377090, "epoch": 4543} {"train_loss": -26.131210327148438, "global_step": 377091, "epoch": 4543} {"train_loss": -26.124792098999023, "global_step": 377092, "epoch": 4543} {"train_loss": -26.17652702331543, "global_step": 377093, "epoch": 4543} {"train_loss": -26.040449142456055, "global_step": 377094, "epoch": 4543} {"train_loss": -26.41843032836914, "global_step": 377095, "epoch": 4543} {"train_loss": -26.0677490234375, "global_step": 377096, "epoch": 4543} {"train_loss": -26.032758712768555, "global_step": 377097, "epoch": 4543} {"train_loss": -26.307880401611328, "global_step": 377098, "epoch": 4543} {"train_loss": -26.5147762298584, "global_step": 377099, "epoch": 4543} {"train_loss": -26.475177764892578, "global_step": 377100, "epoch": 4543} {"train_loss": -26.4164981842041, "global_step": 377101, "epoch": 4543} {"train_loss": -26.12335777282715, "global_step": 377102, "epoch": 4543} {"train_loss": -26.338943481445312, "global_step": 377103, "epoch": 4543} {"train_loss": -26.367795944213867, "global_step": 377104, "epoch": 4543} {"train_loss": -26.113142013549805, "global_step": 377105, "epoch": 4543} {"train_loss": -26.420669555664062, "global_step": 377106, "epoch": 4543} {"train_loss": -26.3558406829834, "global_step": 377107, "epoch": 4543} {"train_loss": -26.56934928894043, "global_step": 377108, "epoch": 4543} {"train_loss": -26.62062644958496, "global_step": 377109, "epoch": 4543} {"train_loss": -26.540449142456055, "global_step": 377110, "epoch": 4543} {"train_loss": -26.37790298461914, "global_step": 377111, "epoch": 4543} {"train_loss": -26.56062889099121, "global_step": 377112, "epoch": 4543} {"train_loss": -26.765594482421875, "global_step": 377113, "epoch": 4543} {"train_loss": -26.554243087768555, "global_step": 377114, "epoch": 4543} {"train_loss": -26.774396896362305, "global_step": 377115, "epoch": 4543} {"train_loss": -26.659748077392578, "global_step": 377116, "epoch": 4543} {"train_loss": -26.331647872924805, "global_step": 377117, "epoch": 4543} {"train_loss": -26.305835723876953, "global_step": 377118, "epoch": 4543} {"train_loss": -26.803518295288086, "global_step": 377119, "epoch": 4543} {"train_loss": -26.50941276550293, "global_step": 377120, "epoch": 4543} {"train_loss": -26.144800186157227, "global_step": 377121, "epoch": 4543} {"train_loss": -26.487457275390625, "global_step": 377122, "epoch": 4543} {"train_loss": -26.80567741394043, "global_step": 377123, "epoch": 4543} {"train_loss": -26.560495376586914, "global_step": 377124, "epoch": 4543} {"train_loss": -26.660425186157227, "global_step": 377125, "epoch": 4543} {"train_loss": -26.35236930847168, "global_step": 377126, "epoch": 4543} {"train_loss": -26.4509334564209, "global_step": 377127, "epoch": 4543} {"train_loss": -26.5153751373291, "global_step": 377128, "epoch": 4543} {"train_loss": -26.390527725219727, "global_step": 377129, "epoch": 4543} {"train_loss": -26.76015281677246, "global_step": 377130, "epoch": 4543} {"train_loss": -26.254592895507812, "global_step": 377131, "epoch": 4543} {"train_loss": -26.02813720703125, "global_step": 377132, "epoch": 4543} {"train_loss": -25.946273803710938, "global_step": 377133, "epoch": 4543} {"train_loss": -25.962827682495117, "global_step": 377134, "epoch": 4543} {"train_loss": -25.705671310424805, "global_step": 377135, "epoch": 4543} {"train_loss": -26.099380493164062, "global_step": 377136, "epoch": 4543} {"train_loss": -26.403974533081055, "global_step": 377137, "epoch": 4543} {"train_loss": -26.245004653930664, "global_step": 377138, "epoch": 4543} {"train_loss": -25.5546932220459, "global_step": 377139, "epoch": 4543} {"train_loss": -26.455469131469727, "global_step": 377140, "epoch": 4543} {"train_loss": -26.300251007080078, "global_step": 377141, "epoch": 4543} {"train_loss": -25.824304580688477, "global_step": 377142, "epoch": 4543} {"train_loss": -26.337560653686523, "global_step": 377143, "epoch": 4543} {"train_loss": -26.411962509155273, "global_step": 377144, "epoch": 4543} {"train_loss": -26.259723663330078, "global_step": 377145, "epoch": 4543} {"train_loss": -26.464111328125, "global_step": 377146, "epoch": 4543} {"train_loss": -26.38298988342285, "global_step": 377147, "epoch": 4543} {"train_loss": -25.99576759338379, "global_step": 377148, "epoch": 4543} {"train_loss": -26.317523956298828, "global_step": 377149, "epoch": 4543} {"train_loss": -26.410505294799805, "global_step": 377150, "epoch": 4543} {"train_loss": -26.22653618778091, "global_step": 377151, "epoch": 4543, "val_loss": 6506900.5} {"train_loss": -25.60013771057129, "global_step": 377152, "epoch": 4544} {"train_loss": -25.929004669189453, "global_step": 377153, "epoch": 4544} {"train_loss": -25.7999210357666, "global_step": 377154, "epoch": 4544} {"train_loss": -26.2568416595459, "global_step": 377155, "epoch": 4544} {"train_loss": -26.044824600219727, "global_step": 377156, "epoch": 4544} {"train_loss": -26.175018310546875, "global_step": 377157, "epoch": 4544} {"train_loss": -25.959325790405273, "global_step": 377158, "epoch": 4544} {"train_loss": -26.243396759033203, "global_step": 377159, "epoch": 4544} {"train_loss": -26.32343864440918, "global_step": 377160, "epoch": 4544} {"train_loss": -25.93840980529785, "global_step": 377161, "epoch": 4544} {"train_loss": -26.41552734375, "global_step": 377162, "epoch": 4544} {"train_loss": -26.18098258972168, "global_step": 377163, "epoch": 4544} {"train_loss": -26.411590576171875, "global_step": 377164, "epoch": 4544} {"train_loss": -26.197900772094727, "global_step": 377165, "epoch": 4544} {"train_loss": -26.2865047454834, "global_step": 377166, "epoch": 4544} {"train_loss": -26.219501495361328, "global_step": 377167, "epoch": 4544} {"train_loss": -26.196401596069336, "global_step": 377168, "epoch": 4544} {"train_loss": -26.272031784057617, "global_step": 377169, "epoch": 4544} {"train_loss": -26.408435821533203, "global_step": 377170, "epoch": 4544} {"train_loss": -26.51348304748535, "global_step": 377171, "epoch": 4544} {"train_loss": -26.238508224487305, "global_step": 377172, "epoch": 4544} {"train_loss": -26.152292251586914, "global_step": 377173, "epoch": 4544} {"train_loss": -26.215673446655273, "global_step": 377174, "epoch": 4544} {"train_loss": -26.578657150268555, "global_step": 377175, "epoch": 4544} {"train_loss": -26.344318389892578, "global_step": 377176, "epoch": 4544} {"train_loss": -26.577138900756836, "global_step": 377177, "epoch": 4544} {"train_loss": -26.2818603515625, "global_step": 377178, "epoch": 4544} {"train_loss": -26.112457275390625, "global_step": 377179, "epoch": 4544} {"train_loss": -26.633573532104492, "global_step": 377180, "epoch": 4544} {"train_loss": -26.516897201538086, "global_step": 377181, "epoch": 4544} {"train_loss": -26.364709854125977, "global_step": 377182, "epoch": 4544} {"train_loss": -26.107343673706055, "global_step": 377183, "epoch": 4544} {"train_loss": -26.4410343170166, "global_step": 377184, "epoch": 4544} {"train_loss": -26.35544776916504, "global_step": 377185, "epoch": 4544} {"train_loss": -26.413970947265625, "global_step": 377186, "epoch": 4544} {"train_loss": -26.502716064453125, "global_step": 377187, "epoch": 4544} {"train_loss": -26.316370010375977, "global_step": 377188, "epoch": 4544} {"train_loss": -26.369354248046875, "global_step": 377189, "epoch": 4544} {"train_loss": -26.372400283813477, "global_step": 377190, "epoch": 4544} {"train_loss": -26.368921279907227, "global_step": 377191, "epoch": 4544} {"train_loss": -26.222431182861328, "global_step": 377192, "epoch": 4544} {"train_loss": -26.352643966674805, "global_step": 377193, "epoch": 4544} {"train_loss": -26.126428604125977, "global_step": 377194, "epoch": 4544} {"train_loss": -26.402942657470703, "global_step": 377195, "epoch": 4544} {"train_loss": -25.87342643737793, "global_step": 377196, "epoch": 4544} {"train_loss": -26.426572799682617, "global_step": 377197, "epoch": 4544} {"train_loss": -26.541522979736328, "global_step": 377198, "epoch": 4544} {"train_loss": -26.16202735900879, "global_step": 377199, "epoch": 4544} {"train_loss": -26.312891006469727, "global_step": 377200, "epoch": 4544} {"train_loss": -26.59229850769043, "global_step": 377201, "epoch": 4544} {"train_loss": -26.565847396850586, "global_step": 377202, "epoch": 4544} {"train_loss": -26.437580108642578, "global_step": 377203, "epoch": 4544} {"train_loss": -26.60511589050293, "global_step": 377204, "epoch": 4544} {"train_loss": -26.7371768951416, "global_step": 377205, "epoch": 4544} {"train_loss": -26.5399112701416, "global_step": 377206, "epoch": 4544} {"train_loss": -26.590362548828125, "global_step": 377207, "epoch": 4544} {"train_loss": -26.48792839050293, "global_step": 377208, "epoch": 4544} {"train_loss": -26.509321212768555, "global_step": 377209, "epoch": 4544} {"train_loss": -26.52231788635254, "global_step": 377210, "epoch": 4544} {"train_loss": -26.713544845581055, "global_step": 377211, "epoch": 4544} {"train_loss": -26.691064834594727, "global_step": 377212, "epoch": 4544} {"train_loss": -26.603857040405273, "global_step": 377213, "epoch": 4544} {"train_loss": -26.7236385345459, "global_step": 377214, "epoch": 4544} {"train_loss": -26.77585792541504, "global_step": 377215, "epoch": 4544} {"train_loss": -26.55988883972168, "global_step": 377216, "epoch": 4544} {"train_loss": -26.67220115661621, "global_step": 377217, "epoch": 4544} {"train_loss": -26.555973052978516, "global_step": 377218, "epoch": 4544} {"train_loss": -26.130186080932617, "global_step": 377219, "epoch": 4544} {"train_loss": -26.418333053588867, "global_step": 377220, "epoch": 4544} {"train_loss": -26.113508224487305, "global_step": 377221, "epoch": 4544} {"train_loss": -25.696533203125, "global_step": 377222, "epoch": 4544} {"train_loss": -25.776569366455078, "global_step": 377223, "epoch": 4544} {"train_loss": -26.33683204650879, "global_step": 377224, "epoch": 4544} {"train_loss": -26.269561767578125, "global_step": 377225, "epoch": 4544} {"train_loss": -26.231992721557617, "global_step": 377226, "epoch": 4544} {"train_loss": -26.61712074279785, "global_step": 377227, "epoch": 4544} {"train_loss": -25.862548828125, "global_step": 377228, "epoch": 4544} {"train_loss": -26.318119049072266, "global_step": 377229, "epoch": 4544} {"train_loss": -26.08734130859375, "global_step": 377230, "epoch": 4544} {"train_loss": -25.76312255859375, "global_step": 377231, "epoch": 4544} {"train_loss": -26.610198974609375, "global_step": 377232, "epoch": 4544} {"train_loss": -26.64302635192871, "global_step": 377233, "epoch": 4544} {"train_loss": -26.334031461233117, "global_step": 377234, "epoch": 4544, "val_loss": 6621580.5} {"train_loss": -26.019474029541016, "global_step": 377235, "epoch": 4545} {"train_loss": -25.97662925720215, "global_step": 377236, "epoch": 4545} {"train_loss": -26.058368682861328, "global_step": 377237, "epoch": 4545} {"train_loss": -25.516586303710938, "global_step": 377238, "epoch": 4545} {"train_loss": -26.16904067993164, "global_step": 377239, "epoch": 4545} {"train_loss": -25.864316940307617, "global_step": 377240, "epoch": 4545} {"train_loss": -25.9531307220459, "global_step": 377241, "epoch": 4545} {"train_loss": -25.58058738708496, "global_step": 377242, "epoch": 4545} {"train_loss": -25.78449058532715, "global_step": 377243, "epoch": 4545} {"train_loss": -26.08670997619629, "global_step": 377244, "epoch": 4545} {"train_loss": -26.147953033447266, "global_step": 377245, "epoch": 4545} {"train_loss": -25.886953353881836, "global_step": 377246, "epoch": 4545} {"train_loss": -26.09932518005371, "global_step": 377247, "epoch": 4545} {"train_loss": -26.3493709564209, "global_step": 377248, "epoch": 4545} {"train_loss": -26.31085777282715, "global_step": 377249, "epoch": 4545} {"train_loss": -26.05558204650879, "global_step": 377250, "epoch": 4545} {"train_loss": -25.886554718017578, "global_step": 377251, "epoch": 4545} {"train_loss": -25.735876083374023, "global_step": 377252, "epoch": 4545} {"train_loss": -26.033597946166992, "global_step": 377253, "epoch": 4545} {"train_loss": -26.257917404174805, "global_step": 377254, "epoch": 4545} {"train_loss": -26.19940757751465, "global_step": 377255, "epoch": 4545} {"train_loss": -26.112808227539062, "global_step": 377256, "epoch": 4545} {"train_loss": -26.605371475219727, "global_step": 377257, "epoch": 4545} {"train_loss": -26.134235382080078, "global_step": 377258, "epoch": 4545} {"train_loss": -26.456607818603516, "global_step": 377259, "epoch": 4545} {"train_loss": -26.25379753112793, "global_step": 377260, "epoch": 4545} {"train_loss": -26.529111862182617, "global_step": 377261, "epoch": 4545} {"train_loss": -26.53485107421875, "global_step": 377262, "epoch": 4545} {"train_loss": -26.342676162719727, "global_step": 377263, "epoch": 4545} {"train_loss": -26.462793350219727, "global_step": 377264, "epoch": 4545} {"train_loss": -26.200040817260742, "global_step": 377265, "epoch": 4545} {"train_loss": -26.841367721557617, "global_step": 377266, "epoch": 4545} {"train_loss": -26.177520751953125, "global_step": 377267, "epoch": 4545} {"train_loss": -26.94351577758789, "global_step": 377268, "epoch": 4545} {"train_loss": -26.724029541015625, "global_step": 377269, "epoch": 4545} {"train_loss": -26.617233276367188, "global_step": 377270, "epoch": 4545} {"train_loss": -26.68141746520996, "global_step": 377271, "epoch": 4545} {"train_loss": -26.705942153930664, "global_step": 377272, "epoch": 4545} {"train_loss": -26.46533203125, "global_step": 377273, "epoch": 4545} {"train_loss": -26.406768798828125, "global_step": 377274, "epoch": 4545} {"train_loss": -26.573041915893555, "global_step": 377275, "epoch": 4545} {"train_loss": -26.468713760375977, "global_step": 377276, "epoch": 4545} {"train_loss": -26.685989379882812, "global_step": 377277, "epoch": 4545} {"train_loss": -26.502704620361328, "global_step": 377278, "epoch": 4545} {"train_loss": -26.631555557250977, "global_step": 377279, "epoch": 4545} {"train_loss": -26.471105575561523, "global_step": 377280, "epoch": 4545} {"train_loss": -26.47979736328125, "global_step": 377281, "epoch": 4545} {"train_loss": -26.4356746673584, "global_step": 377282, "epoch": 4545} {"train_loss": -26.642841339111328, "global_step": 377283, "epoch": 4545} {"train_loss": -26.713592529296875, "global_step": 377284, "epoch": 4545} {"train_loss": -26.8022518157959, "global_step": 377285, "epoch": 4545} {"train_loss": -26.345630645751953, "global_step": 377286, "epoch": 4545} {"train_loss": -26.75732421875, "global_step": 377287, "epoch": 4545} {"train_loss": -26.236133575439453, "global_step": 377288, "epoch": 4545} {"train_loss": -26.74005699157715, "global_step": 377289, "epoch": 4545} {"train_loss": -26.501813888549805, "global_step": 377290, "epoch": 4545} {"train_loss": -26.262781143188477, "global_step": 377291, "epoch": 4545} {"train_loss": -26.238910675048828, "global_step": 377292, "epoch": 4545} {"train_loss": -26.326017379760742, "global_step": 377293, "epoch": 4545} {"train_loss": -26.625036239624023, "global_step": 377294, "epoch": 4545} {"train_loss": -26.396753311157227, "global_step": 377295, "epoch": 4545} {"train_loss": -26.37155532836914, "global_step": 377296, "epoch": 4545} {"train_loss": -26.362157821655273, "global_step": 377297, "epoch": 4545} {"train_loss": -26.290246963500977, "global_step": 377298, "epoch": 4545} {"train_loss": -26.346731185913086, "global_step": 377299, "epoch": 4545} {"train_loss": -26.483861923217773, "global_step": 377300, "epoch": 4545} {"train_loss": -26.71381950378418, "global_step": 377301, "epoch": 4545} {"train_loss": -26.092466354370117, "global_step": 377302, "epoch": 4545} {"train_loss": -26.530942916870117, "global_step": 377303, "epoch": 4545} {"train_loss": -26.681228637695312, "global_step": 377304, "epoch": 4545} {"train_loss": -26.452239990234375, "global_step": 377305, "epoch": 4545} {"train_loss": -26.239429473876953, "global_step": 377306, "epoch": 4545} {"train_loss": -26.022424697875977, "global_step": 377307, "epoch": 4545} {"train_loss": -26.493371963500977, "global_step": 377308, "epoch": 4545} {"train_loss": -26.70835304260254, "global_step": 377309, "epoch": 4545} {"train_loss": -26.168737411499023, "global_step": 377310, "epoch": 4545} {"train_loss": -26.32393455505371, "global_step": 377311, "epoch": 4545} {"train_loss": -26.23223304748535, "global_step": 377312, "epoch": 4545} {"train_loss": -26.7416934967041, "global_step": 377313, "epoch": 4545} {"train_loss": -26.566862106323242, "global_step": 377314, "epoch": 4545} {"train_loss": -26.84649658203125, "global_step": 377315, "epoch": 4545} {"train_loss": -26.39583396911621, "global_step": 377316, "epoch": 4545} {"train_loss": -26.36045580025179, "global_step": 377317, "epoch": 4545, "val_loss": 6579018.5} {"train_loss": -25.7602481842041, "global_step": 377318, "epoch": 4546} {"train_loss": -24.72681999206543, "global_step": 377319, "epoch": 4546} {"train_loss": -25.47859001159668, "global_step": 377320, "epoch": 4546} {"train_loss": -24.95360565185547, "global_step": 377321, "epoch": 4546} {"train_loss": -25.6304988861084, "global_step": 377322, "epoch": 4546} {"train_loss": -25.597814559936523, "global_step": 377323, "epoch": 4546} {"train_loss": -25.649280548095703, "global_step": 377324, "epoch": 4546} {"train_loss": -26.255538940429688, "global_step": 377325, "epoch": 4546} {"train_loss": -26.04646110534668, "global_step": 377326, "epoch": 4546} {"train_loss": -26.19404411315918, "global_step": 377327, "epoch": 4546} {"train_loss": -26.446353912353516, "global_step": 377328, "epoch": 4546} {"train_loss": -26.241159439086914, "global_step": 377329, "epoch": 4546} {"train_loss": -26.233774185180664, "global_step": 377330, "epoch": 4546} {"train_loss": -26.44744873046875, "global_step": 377331, "epoch": 4546} {"train_loss": -26.493066787719727, "global_step": 377332, "epoch": 4546} {"train_loss": -26.449071884155273, "global_step": 377333, "epoch": 4546} {"train_loss": -26.534391403198242, "global_step": 377334, "epoch": 4546} {"train_loss": -26.492712020874023, "global_step": 377335, "epoch": 4546} {"train_loss": -26.18808937072754, "global_step": 377336, "epoch": 4546} {"train_loss": -26.047021865844727, "global_step": 377337, "epoch": 4546} {"train_loss": -26.200498580932617, "global_step": 377338, "epoch": 4546} {"train_loss": -26.420774459838867, "global_step": 377339, "epoch": 4546} {"train_loss": -26.307809829711914, "global_step": 377340, "epoch": 4546} {"train_loss": -26.382070541381836, "global_step": 377341, "epoch": 4546} {"train_loss": -26.293439865112305, "global_step": 377342, "epoch": 4546} {"train_loss": -26.110095977783203, "global_step": 377343, "epoch": 4546} {"train_loss": -26.222131729125977, "global_step": 377344, "epoch": 4546} {"train_loss": -26.312925338745117, "global_step": 377345, "epoch": 4546} {"train_loss": -26.369028091430664, "global_step": 377346, "epoch": 4546} {"train_loss": -26.252899169921875, "global_step": 377347, "epoch": 4546} {"train_loss": -26.564489364624023, "global_step": 377348, "epoch": 4546} {"train_loss": -26.07619285583496, "global_step": 377349, "epoch": 4546} {"train_loss": -26.756887435913086, "global_step": 377350, "epoch": 4546} {"train_loss": -26.369352340698242, "global_step": 377351, "epoch": 4546} {"train_loss": -26.216222763061523, "global_step": 377352, "epoch": 4546} {"train_loss": -27.04218101501465, "global_step": 377353, "epoch": 4546} {"train_loss": -26.444746017456055, "global_step": 377354, "epoch": 4546} {"train_loss": -26.294111251831055, "global_step": 377355, "epoch": 4546} {"train_loss": -26.79463005065918, "global_step": 377356, "epoch": 4546} {"train_loss": -26.48505973815918, "global_step": 377357, "epoch": 4546} {"train_loss": -26.455463409423828, "global_step": 377358, "epoch": 4546} {"train_loss": -26.68120765686035, "global_step": 377359, "epoch": 4546} {"train_loss": -26.291996002197266, "global_step": 377360, "epoch": 4546} {"train_loss": -26.2694149017334, "global_step": 377361, "epoch": 4546} {"train_loss": -26.14434814453125, "global_step": 377362, "epoch": 4546} {"train_loss": -26.362207412719727, "global_step": 377363, "epoch": 4546} {"train_loss": -26.583112716674805, "global_step": 377364, "epoch": 4546} {"train_loss": -26.90946388244629, "global_step": 377365, "epoch": 4546} {"train_loss": -26.318359375, "global_step": 377366, "epoch": 4546} {"train_loss": -26.097122192382812, "global_step": 377367, "epoch": 4546} {"train_loss": -26.41358757019043, "global_step": 377368, "epoch": 4546} {"train_loss": -26.603445053100586, "global_step": 377369, "epoch": 4546} {"train_loss": -26.717655181884766, "global_step": 377370, "epoch": 4546} {"train_loss": -26.239124298095703, "global_step": 377371, "epoch": 4546} {"train_loss": -27.01055908203125, "global_step": 377372, "epoch": 4546} {"train_loss": -26.67181396484375, "global_step": 377373, "epoch": 4546} {"train_loss": -26.495574951171875, "global_step": 377374, "epoch": 4546} {"train_loss": -26.34807777404785, "global_step": 377375, "epoch": 4546} {"train_loss": -26.604068756103516, "global_step": 377376, "epoch": 4546} {"train_loss": -26.61958122253418, "global_step": 377377, "epoch": 4546} {"train_loss": -26.7750301361084, "global_step": 377378, "epoch": 4546} {"train_loss": -26.375995635986328, "global_step": 377379, "epoch": 4546} {"train_loss": -26.614782333374023, "global_step": 377380, "epoch": 4546} {"train_loss": -26.740758895874023, "global_step": 377381, "epoch": 4546} {"train_loss": -26.33955192565918, "global_step": 377382, "epoch": 4546} {"train_loss": -26.25177574157715, "global_step": 377383, "epoch": 4546} {"train_loss": -26.827239990234375, "global_step": 377384, "epoch": 4546} {"train_loss": -26.768518447875977, "global_step": 377385, "epoch": 4546} {"train_loss": -26.52545166015625, "global_step": 377386, "epoch": 4546} {"train_loss": -26.01629638671875, "global_step": 377387, "epoch": 4546} {"train_loss": -25.7529354095459, "global_step": 377388, "epoch": 4546} {"train_loss": -26.04115867614746, "global_step": 377389, "epoch": 4546} {"train_loss": -26.413028717041016, "global_step": 377390, "epoch": 4546} {"train_loss": -26.294675827026367, "global_step": 377391, "epoch": 4546} {"train_loss": -25.95760154724121, "global_step": 377392, "epoch": 4546} {"train_loss": -26.418167114257812, "global_step": 377393, "epoch": 4546} {"train_loss": -25.739465713500977, "global_step": 377394, "epoch": 4546} {"train_loss": -26.411306381225586, "global_step": 377395, "epoch": 4546} {"train_loss": -25.862302780151367, "global_step": 377396, "epoch": 4546} {"train_loss": -26.36279296875, "global_step": 377397, "epoch": 4546} {"train_loss": -26.07942008972168, "global_step": 377398, "epoch": 4546} {"train_loss": -26.30047035217285, "global_step": 377399, "epoch": 4546} {"train_loss": -26.315673437463232, "global_step": 377400, "epoch": 4546, "val_loss": 6483369.0} {"train_loss": -25.587055206298828, "global_step": 377401, "epoch": 4547} {"train_loss": -26.18890380859375, "global_step": 377402, "epoch": 4547} {"train_loss": -25.68572425842285, "global_step": 377403, "epoch": 4547} {"train_loss": -26.120370864868164, "global_step": 377404, "epoch": 4547} {"train_loss": -25.817462921142578, "global_step": 377405, "epoch": 4547} {"train_loss": -26.2061767578125, "global_step": 377406, "epoch": 4547} {"train_loss": -25.902795791625977, "global_step": 377407, "epoch": 4547} {"train_loss": -26.026254653930664, "global_step": 377408, "epoch": 4547} {"train_loss": -26.150815963745117, "global_step": 377409, "epoch": 4547} {"train_loss": -25.819616317749023, "global_step": 377410, "epoch": 4547} {"train_loss": -26.25599479675293, "global_step": 377411, "epoch": 4547} {"train_loss": -26.258596420288086, "global_step": 377412, "epoch": 4547} {"train_loss": -26.09650993347168, "global_step": 377413, "epoch": 4547} {"train_loss": -26.400602340698242, "global_step": 377414, "epoch": 4547} {"train_loss": -26.295337677001953, "global_step": 377415, "epoch": 4547} {"train_loss": -26.199737548828125, "global_step": 377416, "epoch": 4547} {"train_loss": -26.496688842773438, "global_step": 377417, "epoch": 4547} {"train_loss": -26.454696655273438, "global_step": 377418, "epoch": 4547} {"train_loss": -26.71455192565918, "global_step": 377419, "epoch": 4547} {"train_loss": -26.457136154174805, "global_step": 377420, "epoch": 4547} {"train_loss": -26.176105499267578, "global_step": 377421, "epoch": 4547} {"train_loss": -26.395719528198242, "global_step": 377422, "epoch": 4547} {"train_loss": -26.393041610717773, "global_step": 377423, "epoch": 4547} {"train_loss": -26.815771102905273, "global_step": 377424, "epoch": 4547} {"train_loss": -26.18622398376465, "global_step": 377425, "epoch": 4547} {"train_loss": -26.31739616394043, "global_step": 377426, "epoch": 4547} {"train_loss": -26.35420799255371, "global_step": 377427, "epoch": 4547} {"train_loss": -26.381671905517578, "global_step": 377428, "epoch": 4547} {"train_loss": -26.707733154296875, "global_step": 377429, "epoch": 4547} {"train_loss": -26.199071884155273, "global_step": 377430, "epoch": 4547} {"train_loss": -26.423816680908203, "global_step": 377431, "epoch": 4547} {"train_loss": -26.33780860900879, "global_step": 377432, "epoch": 4547} {"train_loss": -26.612985610961914, "global_step": 377433, "epoch": 4547} {"train_loss": -26.36964225769043, "global_step": 377434, "epoch": 4547} {"train_loss": -26.45794105529785, "global_step": 377435, "epoch": 4547} {"train_loss": -26.316308975219727, "global_step": 377436, "epoch": 4547} {"train_loss": -26.529205322265625, "global_step": 377437, "epoch": 4547} {"train_loss": -26.309431076049805, "global_step": 377438, "epoch": 4547} {"train_loss": -26.591663360595703, "global_step": 377439, "epoch": 4547} {"train_loss": -26.380491256713867, "global_step": 377440, "epoch": 4547} {"train_loss": -26.6054630279541, "global_step": 377441, "epoch": 4547} {"train_loss": -26.443517684936523, "global_step": 377442, "epoch": 4547} {"train_loss": -26.17557144165039, "global_step": 377443, "epoch": 4547} {"train_loss": -26.14153480529785, "global_step": 377444, "epoch": 4547} {"train_loss": -26.075225830078125, "global_step": 377445, "epoch": 4547} {"train_loss": -26.641315460205078, "global_step": 377446, "epoch": 4547} {"train_loss": -26.293500900268555, "global_step": 377447, "epoch": 4547} {"train_loss": -26.23776626586914, "global_step": 377448, "epoch": 4547} {"train_loss": -26.37481689453125, "global_step": 377449, "epoch": 4547} {"train_loss": -25.988880157470703, "global_step": 377450, "epoch": 4547} {"train_loss": -26.555341720581055, "global_step": 377451, "epoch": 4547} {"train_loss": -25.881473541259766, "global_step": 377452, "epoch": 4547} {"train_loss": -25.861719131469727, "global_step": 377453, "epoch": 4547} {"train_loss": -26.523468017578125, "global_step": 377454, "epoch": 4547} {"train_loss": -25.879642486572266, "global_step": 377455, "epoch": 4547} {"train_loss": -26.05606460571289, "global_step": 377456, "epoch": 4547} {"train_loss": -26.0826416015625, "global_step": 377457, "epoch": 4547} {"train_loss": -26.069080352783203, "global_step": 377458, "epoch": 4547} {"train_loss": -26.51361083984375, "global_step": 377459, "epoch": 4547} {"train_loss": -26.256494522094727, "global_step": 377460, "epoch": 4547} {"train_loss": -26.707550048828125, "global_step": 377461, "epoch": 4547} {"train_loss": -26.418060302734375, "global_step": 377462, "epoch": 4547} {"train_loss": -26.19318199157715, "global_step": 377463, "epoch": 4547} {"train_loss": -26.334379196166992, "global_step": 377464, "epoch": 4547} {"train_loss": -26.079059600830078, "global_step": 377465, "epoch": 4547} {"train_loss": -26.724088668823242, "global_step": 377466, "epoch": 4547} {"train_loss": -26.22089958190918, "global_step": 377467, "epoch": 4547} {"train_loss": -26.196020126342773, "global_step": 377468, "epoch": 4547} {"train_loss": -26.418426513671875, "global_step": 377469, "epoch": 4547} {"train_loss": -26.15028190612793, "global_step": 377470, "epoch": 4547} {"train_loss": -26.303674697875977, "global_step": 377471, "epoch": 4547} {"train_loss": -26.607213973999023, "global_step": 377472, "epoch": 4547} {"train_loss": -26.560327529907227, "global_step": 377473, "epoch": 4547} {"train_loss": -26.28655433654785, "global_step": 377474, "epoch": 4547} {"train_loss": -26.633020401000977, "global_step": 377475, "epoch": 4547} {"train_loss": -26.291784286499023, "global_step": 377476, "epoch": 4547} {"train_loss": -26.385908126831055, "global_step": 377477, "epoch": 4547} {"train_loss": -26.545759201049805, "global_step": 377478, "epoch": 4547} {"train_loss": -26.033817291259766, "global_step": 377479, "epoch": 4547} {"train_loss": -26.687484741210938, "global_step": 377480, "epoch": 4547} {"train_loss": -26.55396842956543, "global_step": 377481, "epoch": 4547} {"train_loss": -26.419300079345703, "global_step": 377482, "epoch": 4547} {"train_loss": -26.31662122887301, "global_step": 377483, "epoch": 4547, "val_loss": 6632838.0} {"train_loss": -25.926755905151367, "global_step": 377484, "epoch": 4548} {"train_loss": -25.867218017578125, "global_step": 377485, "epoch": 4548} {"train_loss": -26.382999420166016, "global_step": 377486, "epoch": 4548} {"train_loss": -25.81223487854004, "global_step": 377487, "epoch": 4548} {"train_loss": -25.75812339782715, "global_step": 377488, "epoch": 4548} {"train_loss": -26.412389755249023, "global_step": 377489, "epoch": 4548} {"train_loss": -26.173614501953125, "global_step": 377490, "epoch": 4548} {"train_loss": -25.7856388092041, "global_step": 377491, "epoch": 4548} {"train_loss": -26.33955955505371, "global_step": 377492, "epoch": 4548} {"train_loss": -26.0557861328125, "global_step": 377493, "epoch": 4548} {"train_loss": -26.311248779296875, "global_step": 377494, "epoch": 4548} {"train_loss": -26.185834884643555, "global_step": 377495, "epoch": 4548} {"train_loss": -25.7197322845459, "global_step": 377496, "epoch": 4548} {"train_loss": -26.085630416870117, "global_step": 377497, "epoch": 4548} {"train_loss": -25.86212730407715, "global_step": 377498, "epoch": 4548} {"train_loss": -26.328216552734375, "global_step": 377499, "epoch": 4548} {"train_loss": -26.01714515686035, "global_step": 377500, "epoch": 4548} {"train_loss": -25.89208984375, "global_step": 377501, "epoch": 4548} {"train_loss": -26.054733276367188, "global_step": 377502, "epoch": 4548} {"train_loss": -26.404571533203125, "global_step": 377503, "epoch": 4548} {"train_loss": -25.931283950805664, "global_step": 377504, "epoch": 4548} {"train_loss": -26.522937774658203, "global_step": 377505, "epoch": 4548} {"train_loss": -26.010351181030273, "global_step": 377506, "epoch": 4548} {"train_loss": -26.26234245300293, "global_step": 377507, "epoch": 4548} {"train_loss": -26.19463539123535, "global_step": 377508, "epoch": 4548} {"train_loss": -26.018224716186523, "global_step": 377509, "epoch": 4548} {"train_loss": -26.095157623291016, "global_step": 377510, "epoch": 4548} {"train_loss": -26.114612579345703, "global_step": 377511, "epoch": 4548} {"train_loss": -26.220800399780273, "global_step": 377512, "epoch": 4548} {"train_loss": -26.34064292907715, "global_step": 377513, "epoch": 4548} {"train_loss": -26.53693962097168, "global_step": 377514, "epoch": 4548} {"train_loss": -26.368886947631836, "global_step": 377515, "epoch": 4548} {"train_loss": -26.516407012939453, "global_step": 377516, "epoch": 4548} {"train_loss": -26.583221435546875, "global_step": 377517, "epoch": 4548} {"train_loss": -26.391498565673828, "global_step": 377518, "epoch": 4548} {"train_loss": -26.37098503112793, "global_step": 377519, "epoch": 4548} {"train_loss": -26.525678634643555, "global_step": 377520, "epoch": 4548} {"train_loss": -26.39499282836914, "global_step": 377521, "epoch": 4548} {"train_loss": -26.251361846923828, "global_step": 377522, "epoch": 4548} {"train_loss": -26.686920166015625, "global_step": 377523, "epoch": 4548} {"train_loss": -26.23267936706543, "global_step": 377524, "epoch": 4548} {"train_loss": -26.673877716064453, "global_step": 377525, "epoch": 4548} {"train_loss": -26.402219772338867, "global_step": 377526, "epoch": 4548} {"train_loss": -26.48537254333496, "global_step": 377527, "epoch": 4548} {"train_loss": -26.45438003540039, "global_step": 377528, "epoch": 4548} {"train_loss": -26.8389835357666, "global_step": 377529, "epoch": 4548} {"train_loss": -26.680505752563477, "global_step": 377530, "epoch": 4548} {"train_loss": -26.639596939086914, "global_step": 377531, "epoch": 4548} {"train_loss": -26.661834716796875, "global_step": 377532, "epoch": 4548} {"train_loss": -26.71088218688965, "global_step": 377533, "epoch": 4548} {"train_loss": -26.620824813842773, "global_step": 377534, "epoch": 4548} {"train_loss": -26.741453170776367, "global_step": 377535, "epoch": 4548} {"train_loss": -26.504812240600586, "global_step": 377536, "epoch": 4548} {"train_loss": -26.62811851501465, "global_step": 377537, "epoch": 4548} {"train_loss": -26.592985153198242, "global_step": 377538, "epoch": 4548} {"train_loss": -26.63160514831543, "global_step": 377539, "epoch": 4548} {"train_loss": -26.417743682861328, "global_step": 377540, "epoch": 4548} {"train_loss": -26.908700942993164, "global_step": 377541, "epoch": 4548} {"train_loss": -26.484668731689453, "global_step": 377542, "epoch": 4548} {"train_loss": -26.863073348999023, "global_step": 377543, "epoch": 4548} {"train_loss": -26.74530029296875, "global_step": 377544, "epoch": 4548} {"train_loss": -26.757556915283203, "global_step": 377545, "epoch": 4548} {"train_loss": -26.78950309753418, "global_step": 377546, "epoch": 4548} {"train_loss": -26.832483291625977, "global_step": 377547, "epoch": 4548} {"train_loss": -26.36338233947754, "global_step": 377548, "epoch": 4548} {"train_loss": -26.106313705444336, "global_step": 377549, "epoch": 4548} {"train_loss": -25.938459396362305, "global_step": 377550, "epoch": 4548} {"train_loss": -25.60750389099121, "global_step": 377551, "epoch": 4548} {"train_loss": -24.16975212097168, "global_step": 377552, "epoch": 4548} {"train_loss": -23.43507194519043, "global_step": 377553, "epoch": 4548} {"train_loss": -25.032840728759766, "global_step": 377554, "epoch": 4548} {"train_loss": -25.768774032592773, "global_step": 377555, "epoch": 4548} {"train_loss": -25.513416290283203, "global_step": 377556, "epoch": 4548} {"train_loss": -26.002134323120117, "global_step": 377557, "epoch": 4548} {"train_loss": -25.705686569213867, "global_step": 377558, "epoch": 4548} {"train_loss": -25.943115234375, "global_step": 377559, "epoch": 4548} {"train_loss": -25.7857608795166, "global_step": 377560, "epoch": 4548} {"train_loss": -25.774030685424805, "global_step": 377561, "epoch": 4548} {"train_loss": -26.28982925415039, "global_step": 377562, "epoch": 4548} {"train_loss": -25.867572784423828, "global_step": 377563, "epoch": 4548} {"train_loss": -25.671232223510742, "global_step": 377564, "epoch": 4548} {"train_loss": -25.954694747924805, "global_step": 377565, "epoch": 4548} {"train_loss": -26.19680331126753, "global_step": 377566, "epoch": 4548, "val_loss": 6637563.0} {"train_loss": -25.535057067871094, "global_step": 377567, "epoch": 4549} {"train_loss": -26.035736083984375, "global_step": 377568, "epoch": 4549} {"train_loss": -25.560354232788086, "global_step": 377569, "epoch": 4549} {"train_loss": -25.724456787109375, "global_step": 377570, "epoch": 4549} {"train_loss": -25.47639274597168, "global_step": 377571, "epoch": 4549} {"train_loss": -25.597824096679688, "global_step": 377572, "epoch": 4549} {"train_loss": -25.960294723510742, "global_step": 377573, "epoch": 4549} {"train_loss": -25.98225212097168, "global_step": 377574, "epoch": 4549} {"train_loss": -25.95346450805664, "global_step": 377575, "epoch": 4549} {"train_loss": -25.8853759765625, "global_step": 377576, "epoch": 4549} {"train_loss": -25.970382690429688, "global_step": 377577, "epoch": 4549} {"train_loss": -26.218809127807617, "global_step": 377578, "epoch": 4549} {"train_loss": -25.970001220703125, "global_step": 377579, "epoch": 4549} {"train_loss": -26.1442928314209, "global_step": 377580, "epoch": 4549} {"train_loss": -25.932607650756836, "global_step": 377581, "epoch": 4549} {"train_loss": -26.253881454467773, "global_step": 377582, "epoch": 4549} {"train_loss": -26.54034423828125, "global_step": 377583, "epoch": 4549} {"train_loss": -26.359106063842773, "global_step": 377584, "epoch": 4549} {"train_loss": -26.214218139648438, "global_step": 377585, "epoch": 4549} {"train_loss": -26.239398956298828, "global_step": 377586, "epoch": 4549} {"train_loss": -26.118986129760742, "global_step": 377587, "epoch": 4549} {"train_loss": -26.1998348236084, "global_step": 377588, "epoch": 4549} {"train_loss": -26.236825942993164, "global_step": 377589, "epoch": 4549} {"train_loss": -26.59200096130371, "global_step": 377590, "epoch": 4549} {"train_loss": -26.426025390625, "global_step": 377591, "epoch": 4549} {"train_loss": -26.3802433013916, "global_step": 377592, "epoch": 4549} {"train_loss": -26.23102378845215, "global_step": 377593, "epoch": 4549} {"train_loss": -26.279926300048828, "global_step": 377594, "epoch": 4549} {"train_loss": -26.30879020690918, "global_step": 377595, "epoch": 4549} {"train_loss": -26.62884521484375, "global_step": 377596, "epoch": 4549} {"train_loss": -26.630451202392578, "global_step": 377597, "epoch": 4549} {"train_loss": -26.31256103515625, "global_step": 377598, "epoch": 4549} {"train_loss": -26.71759033203125, "global_step": 377599, "epoch": 4549} {"train_loss": -26.77240562438965, "global_step": 377600, "epoch": 4549} {"train_loss": -27.04445457458496, "global_step": 377601, "epoch": 4549} {"train_loss": -26.72562599182129, "global_step": 377602, "epoch": 4549} {"train_loss": -26.640155792236328, "global_step": 377603, "epoch": 4549} {"train_loss": -26.649972915649414, "global_step": 377604, "epoch": 4549} {"train_loss": -26.91437339782715, "global_step": 377605, "epoch": 4549} {"train_loss": -26.523305892944336, "global_step": 377606, "epoch": 4549} {"train_loss": -26.5715389251709, "global_step": 377607, "epoch": 4549} {"train_loss": -26.528472900390625, "global_step": 377608, "epoch": 4549} {"train_loss": -26.714202880859375, "global_step": 377609, "epoch": 4549} {"train_loss": -26.17707633972168, "global_step": 377610, "epoch": 4549} {"train_loss": -26.663053512573242, "global_step": 377611, "epoch": 4549} {"train_loss": -26.648609161376953, "global_step": 377612, "epoch": 4549} {"train_loss": -26.54804801940918, "global_step": 377613, "epoch": 4549} {"train_loss": -26.601993560791016, "global_step": 377614, "epoch": 4549} {"train_loss": -26.17351722717285, "global_step": 377615, "epoch": 4549} {"train_loss": -25.89149284362793, "global_step": 377616, "epoch": 4549} {"train_loss": -25.526123046875, "global_step": 377617, "epoch": 4549} {"train_loss": -25.181842803955078, "global_step": 377618, "epoch": 4549} {"train_loss": -24.99318504333496, "global_step": 377619, "epoch": 4549} {"train_loss": -26.6235408782959, "global_step": 377620, "epoch": 4549} {"train_loss": -26.13728141784668, "global_step": 377621, "epoch": 4549} {"train_loss": -26.50385856628418, "global_step": 377622, "epoch": 4549} {"train_loss": -25.884159088134766, "global_step": 377623, "epoch": 4549} {"train_loss": -26.2030029296875, "global_step": 377624, "epoch": 4549} {"train_loss": -26.145666122436523, "global_step": 377625, "epoch": 4549} {"train_loss": -26.2701358795166, "global_step": 377626, "epoch": 4549} {"train_loss": -26.29987144470215, "global_step": 377627, "epoch": 4549} {"train_loss": -26.00679588317871, "global_step": 377628, "epoch": 4549} {"train_loss": -26.279056549072266, "global_step": 377629, "epoch": 4549} {"train_loss": -26.061445236206055, "global_step": 377630, "epoch": 4549} {"train_loss": -26.314254760742188, "global_step": 377631, "epoch": 4549} {"train_loss": -26.073862075805664, "global_step": 377632, "epoch": 4549} {"train_loss": -25.87678337097168, "global_step": 377633, "epoch": 4549} {"train_loss": -26.139062881469727, "global_step": 377634, "epoch": 4549} {"train_loss": -25.816431045532227, "global_step": 377635, "epoch": 4549} {"train_loss": -26.247364044189453, "global_step": 377636, "epoch": 4549} {"train_loss": -26.2828311920166, "global_step": 377637, "epoch": 4549} {"train_loss": -26.260528564453125, "global_step": 377638, "epoch": 4549} {"train_loss": -26.463287353515625, "global_step": 377639, "epoch": 4549} {"train_loss": -26.050073623657227, "global_step": 377640, "epoch": 4549} {"train_loss": -26.29536247253418, "global_step": 377641, "epoch": 4549} {"train_loss": -26.114904403686523, "global_step": 377642, "epoch": 4549} {"train_loss": -26.04932975769043, "global_step": 377643, "epoch": 4549} {"train_loss": -26.693164825439453, "global_step": 377644, "epoch": 4549} {"train_loss": -26.153844833374023, "global_step": 377645, "epoch": 4549} {"train_loss": -25.98712158203125, "global_step": 377646, "epoch": 4549} {"train_loss": -26.1765193939209, "global_step": 377647, "epoch": 4549} {"train_loss": -26.052637100219727, "global_step": 377648, "epoch": 4549} {"train_loss": -26.21272172123553, "global_step": 377649, "epoch": 4549, "val_loss": 6584804.0} {"train_loss": -25.356908798217773, "global_step": 377650, "epoch": 4550} {"train_loss": -25.835052490234375, "global_step": 377651, "epoch": 4550} {"train_loss": -26.0551815032959, "global_step": 377652, "epoch": 4550} {"train_loss": -25.906641006469727, "global_step": 377653, "epoch": 4550} {"train_loss": -26.0213565826416, "global_step": 377654, "epoch": 4550} {"train_loss": -25.8596134185791, "global_step": 377655, "epoch": 4550} {"train_loss": -25.399011611938477, "global_step": 377656, "epoch": 4550} {"train_loss": -26.147388458251953, "global_step": 377657, "epoch": 4550} {"train_loss": -26.154998779296875, "global_step": 377658, "epoch": 4550} {"train_loss": -25.992633819580078, "global_step": 377659, "epoch": 4550} {"train_loss": -26.35556411743164, "global_step": 377660, "epoch": 4550} {"train_loss": -26.12774658203125, "global_step": 377661, "epoch": 4550} {"train_loss": -26.009790420532227, "global_step": 377662, "epoch": 4550} {"train_loss": -26.371957778930664, "global_step": 377663, "epoch": 4550} {"train_loss": -25.84433937072754, "global_step": 377664, "epoch": 4550} {"train_loss": -25.950794219970703, "global_step": 377665, "epoch": 4550} {"train_loss": -26.283430099487305, "global_step": 377666, "epoch": 4550} {"train_loss": -26.379987716674805, "global_step": 377667, "epoch": 4550} {"train_loss": -26.217687606811523, "global_step": 377668, "epoch": 4550} {"train_loss": -26.338247299194336, "global_step": 377669, "epoch": 4550} {"train_loss": -26.164264678955078, "global_step": 377670, "epoch": 4550} {"train_loss": -26.519012451171875, "global_step": 377671, "epoch": 4550} {"train_loss": -26.679067611694336, "global_step": 377672, "epoch": 4550} {"train_loss": -26.34504508972168, "global_step": 377673, "epoch": 4550} {"train_loss": -26.320581436157227, "global_step": 377674, "epoch": 4550} {"train_loss": -26.4365234375, "global_step": 377675, "epoch": 4550} {"train_loss": -26.712141036987305, "global_step": 377676, "epoch": 4550} {"train_loss": -26.42848014831543, "global_step": 377677, "epoch": 4550} {"train_loss": -26.6958065032959, "global_step": 377678, "epoch": 4550} {"train_loss": -26.559621810913086, "global_step": 377679, "epoch": 4550} {"train_loss": -26.47345542907715, "global_step": 377680, "epoch": 4550} {"train_loss": -26.52088737487793, "global_step": 377681, "epoch": 4550} {"train_loss": -26.171735763549805, "global_step": 377682, "epoch": 4550} {"train_loss": -26.272689819335938, "global_step": 377683, "epoch": 4550} {"train_loss": -26.434003829956055, "global_step": 377684, "epoch": 4550} {"train_loss": -26.37371253967285, "global_step": 377685, "epoch": 4550} {"train_loss": -26.421598434448242, "global_step": 377686, "epoch": 4550} {"train_loss": -26.161218643188477, "global_step": 377687, "epoch": 4550} {"train_loss": -26.4397029876709, "global_step": 377688, "epoch": 4550} {"train_loss": -26.479278564453125, "global_step": 377689, "epoch": 4550} {"train_loss": -26.48101806640625, "global_step": 377690, "epoch": 4550} {"train_loss": -26.44325828552246, "global_step": 377691, "epoch": 4550} {"train_loss": -26.757394790649414, "global_step": 377692, "epoch": 4550} {"train_loss": -26.592029571533203, "global_step": 377693, "epoch": 4550} {"train_loss": -26.5781192779541, "global_step": 377694, "epoch": 4550} {"train_loss": -26.84943199157715, "global_step": 377695, "epoch": 4550} {"train_loss": -26.68342399597168, "global_step": 377696, "epoch": 4550} {"train_loss": -26.778669357299805, "global_step": 377697, "epoch": 4550} {"train_loss": -26.32388687133789, "global_step": 377698, "epoch": 4550} {"train_loss": -26.307031631469727, "global_step": 377699, "epoch": 4550} {"train_loss": -26.573211669921875, "global_step": 377700, "epoch": 4550} {"train_loss": -26.370380401611328, "global_step": 377701, "epoch": 4550} {"train_loss": -26.724822998046875, "global_step": 377702, "epoch": 4550} {"train_loss": -26.813007354736328, "global_step": 377703, "epoch": 4550} {"train_loss": -26.7705020904541, "global_step": 377704, "epoch": 4550} {"train_loss": -26.66535758972168, "global_step": 377705, "epoch": 4550} {"train_loss": -26.504505157470703, "global_step": 377706, "epoch": 4550} {"train_loss": -26.53546714782715, "global_step": 377707, "epoch": 4550} {"train_loss": -26.47920036315918, "global_step": 377708, "epoch": 4550} {"train_loss": -26.865386962890625, "global_step": 377709, "epoch": 4550} {"train_loss": -26.678709030151367, "global_step": 377710, "epoch": 4550} {"train_loss": -26.711822509765625, "global_step": 377711, "epoch": 4550} {"train_loss": -26.85369300842285, "global_step": 377712, "epoch": 4550} {"train_loss": -26.499774932861328, "global_step": 377713, "epoch": 4550} {"train_loss": -26.370227813720703, "global_step": 377714, "epoch": 4550} {"train_loss": -26.554779052734375, "global_step": 377715, "epoch": 4550} {"train_loss": -26.392343521118164, "global_step": 377716, "epoch": 4550} {"train_loss": -26.065641403198242, "global_step": 377717, "epoch": 4550} {"train_loss": -26.05720329284668, "global_step": 377718, "epoch": 4550} {"train_loss": -26.719329833984375, "global_step": 377719, "epoch": 4550} {"train_loss": -26.53466796875, "global_step": 377720, "epoch": 4550} {"train_loss": -26.3767147064209, "global_step": 377721, "epoch": 4550} {"train_loss": -26.266870498657227, "global_step": 377722, "epoch": 4550} {"train_loss": -26.485776901245117, "global_step": 377723, "epoch": 4550} {"train_loss": -26.11903190612793, "global_step": 377724, "epoch": 4550} {"train_loss": -26.280126571655273, "global_step": 377725, "epoch": 4550} {"train_loss": -26.588367462158203, "global_step": 377726, "epoch": 4550} {"train_loss": -26.451807022094727, "global_step": 377727, "epoch": 4550} {"train_loss": -26.43006706237793, "global_step": 377728, "epoch": 4550} {"train_loss": -26.102216720581055, "global_step": 377729, "epoch": 4550} {"train_loss": -26.00745964050293, "global_step": 377730, "epoch": 4550} {"train_loss": -26.648550033569336, "global_step": 377731, "epoch": 4550} {"train_loss": -26.35432374333761, "global_step": 377732, "epoch": 4550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6530221.0} {"train_loss": -25.96247673034668, "global_step": 377733, "epoch": 4551} {"train_loss": -26.23797607421875, "global_step": 377734, "epoch": 4551} {"train_loss": -26.131855010986328, "global_step": 377735, "epoch": 4551} {"train_loss": -25.86124038696289, "global_step": 377736, "epoch": 4551} {"train_loss": -25.870710372924805, "global_step": 377737, "epoch": 4551} {"train_loss": -26.28549575805664, "global_step": 377738, "epoch": 4551} {"train_loss": -26.23322105407715, "global_step": 377739, "epoch": 4551} {"train_loss": -25.84391212463379, "global_step": 377740, "epoch": 4551} {"train_loss": -25.747343063354492, "global_step": 377741, "epoch": 4551} {"train_loss": -26.43524742126465, "global_step": 377742, "epoch": 4551} {"train_loss": -26.21198081970215, "global_step": 377743, "epoch": 4551} {"train_loss": -25.87615966796875, "global_step": 377744, "epoch": 4551} {"train_loss": -26.48067283630371, "global_step": 377745, "epoch": 4551} {"train_loss": -26.106103897094727, "global_step": 377746, "epoch": 4551} {"train_loss": -26.1373233795166, "global_step": 377747, "epoch": 4551} {"train_loss": -26.067346572875977, "global_step": 377748, "epoch": 4551} {"train_loss": -26.371448516845703, "global_step": 377749, "epoch": 4551} {"train_loss": -26.106969833374023, "global_step": 377750, "epoch": 4551} {"train_loss": -26.243757247924805, "global_step": 377751, "epoch": 4551} {"train_loss": -25.991992950439453, "global_step": 377752, "epoch": 4551} {"train_loss": -26.38498878479004, "global_step": 377753, "epoch": 4551} {"train_loss": -26.41080093383789, "global_step": 377754, "epoch": 4551} {"train_loss": -26.182907104492188, "global_step": 377755, "epoch": 4551} {"train_loss": -26.222471237182617, "global_step": 377756, "epoch": 4551} {"train_loss": -26.304534912109375, "global_step": 377757, "epoch": 4551} {"train_loss": -26.558990478515625, "global_step": 377758, "epoch": 4551} {"train_loss": -26.449783325195312, "global_step": 377759, "epoch": 4551} {"train_loss": -26.171142578125, "global_step": 377760, "epoch": 4551} {"train_loss": -26.442920684814453, "global_step": 377761, "epoch": 4551} {"train_loss": -26.420801162719727, "global_step": 377762, "epoch": 4551} {"train_loss": -26.4400691986084, "global_step": 377763, "epoch": 4551} {"train_loss": -26.424711227416992, "global_step": 377764, "epoch": 4551} {"train_loss": -26.608076095581055, "global_step": 377765, "epoch": 4551} {"train_loss": -25.946561813354492, "global_step": 377766, "epoch": 4551} {"train_loss": -26.284032821655273, "global_step": 377767, "epoch": 4551} {"train_loss": -26.44172477722168, "global_step": 377768, "epoch": 4551} {"train_loss": -26.737340927124023, "global_step": 377769, "epoch": 4551} {"train_loss": -26.825040817260742, "global_step": 377770, "epoch": 4551} {"train_loss": -26.269367218017578, "global_step": 377771, "epoch": 4551} {"train_loss": -26.35051918029785, "global_step": 377772, "epoch": 4551} {"train_loss": -26.75551414489746, "global_step": 377773, "epoch": 4551} {"train_loss": -26.363540649414062, "global_step": 377774, "epoch": 4551} {"train_loss": -26.09514808654785, "global_step": 377775, "epoch": 4551} {"train_loss": -26.098041534423828, "global_step": 377776, "epoch": 4551} {"train_loss": -26.395856857299805, "global_step": 377777, "epoch": 4551} {"train_loss": -26.45376968383789, "global_step": 377778, "epoch": 4551} {"train_loss": -26.435537338256836, "global_step": 377779, "epoch": 4551} {"train_loss": -26.14599609375, "global_step": 377780, "epoch": 4551} {"train_loss": -26.115400314331055, "global_step": 377781, "epoch": 4551} {"train_loss": -26.04291343688965, "global_step": 377782, "epoch": 4551} {"train_loss": -26.230077743530273, "global_step": 377783, "epoch": 4551} {"train_loss": -26.26616859436035, "global_step": 377784, "epoch": 4551} {"train_loss": -26.60870933532715, "global_step": 377785, "epoch": 4551} {"train_loss": -26.091388702392578, "global_step": 377786, "epoch": 4551} {"train_loss": -26.321807861328125, "global_step": 377787, "epoch": 4551} {"train_loss": -26.586578369140625, "global_step": 377788, "epoch": 4551} {"train_loss": -26.184234619140625, "global_step": 377789, "epoch": 4551} {"train_loss": -26.02850914001465, "global_step": 377790, "epoch": 4551} {"train_loss": -26.167083740234375, "global_step": 377791, "epoch": 4551} {"train_loss": -26.27594566345215, "global_step": 377792, "epoch": 4551} {"train_loss": -26.106531143188477, "global_step": 377793, "epoch": 4551} {"train_loss": -26.27764892578125, "global_step": 377794, "epoch": 4551} {"train_loss": -26.231775283813477, "global_step": 377795, "epoch": 4551} {"train_loss": -26.068893432617188, "global_step": 377796, "epoch": 4551} {"train_loss": -26.212400436401367, "global_step": 377797, "epoch": 4551} {"train_loss": -26.330921173095703, "global_step": 377798, "epoch": 4551} {"train_loss": -26.541336059570312, "global_step": 377799, "epoch": 4551} {"train_loss": -26.391523361206055, "global_step": 377800, "epoch": 4551} {"train_loss": -26.565576553344727, "global_step": 377801, "epoch": 4551} {"train_loss": -25.97842788696289, "global_step": 377802, "epoch": 4551} {"train_loss": -26.191736221313477, "global_step": 377803, "epoch": 4551} {"train_loss": -25.90997314453125, "global_step": 377804, "epoch": 4551} {"train_loss": -26.241422653198242, "global_step": 377805, "epoch": 4551} {"train_loss": -26.041410446166992, "global_step": 377806, "epoch": 4551} {"train_loss": -26.19687843322754, "global_step": 377807, "epoch": 4551} {"train_loss": -26.409799575805664, "global_step": 377808, "epoch": 4551} {"train_loss": -26.103046417236328, "global_step": 377809, "epoch": 4551} {"train_loss": -25.77834129333496, "global_step": 377810, "epoch": 4551} {"train_loss": -26.00738525390625, "global_step": 377811, "epoch": 4551} {"train_loss": -26.342132568359375, "global_step": 377812, "epoch": 4551} {"train_loss": -26.402814865112305, "global_step": 377813, "epoch": 4551} {"train_loss": -26.44870376586914, "global_step": 377814, "epoch": 4551} {"train_loss": -26.26102020079831, "global_step": 377815, "epoch": 4551, "val_loss": 6579487.5} {"train_loss": -25.701772689819336, "global_step": 377816, "epoch": 4552} {"train_loss": -25.883899688720703, "global_step": 377817, "epoch": 4552} {"train_loss": -26.291107177734375, "global_step": 377818, "epoch": 4552} {"train_loss": -25.724445343017578, "global_step": 377819, "epoch": 4552} {"train_loss": -26.039892196655273, "global_step": 377820, "epoch": 4552} {"train_loss": -26.053991317749023, "global_step": 377821, "epoch": 4552} {"train_loss": -26.345508575439453, "global_step": 377822, "epoch": 4552} {"train_loss": -26.3205509185791, "global_step": 377823, "epoch": 4552} {"train_loss": -26.59394645690918, "global_step": 377824, "epoch": 4552} {"train_loss": -26.270288467407227, "global_step": 377825, "epoch": 4552} {"train_loss": -26.396808624267578, "global_step": 377826, "epoch": 4552} {"train_loss": -26.560504913330078, "global_step": 377827, "epoch": 4552} {"train_loss": -26.154560089111328, "global_step": 377828, "epoch": 4552} {"train_loss": -26.424482345581055, "global_step": 377829, "epoch": 4552} {"train_loss": -26.19093894958496, "global_step": 377830, "epoch": 4552} {"train_loss": -26.234968185424805, "global_step": 377831, "epoch": 4552} {"train_loss": -26.328876495361328, "global_step": 377832, "epoch": 4552} {"train_loss": -26.50921630859375, "global_step": 377833, "epoch": 4552} {"train_loss": -26.60491371154785, "global_step": 377834, "epoch": 4552} {"train_loss": -26.409574508666992, "global_step": 377835, "epoch": 4552} {"train_loss": -26.220569610595703, "global_step": 377836, "epoch": 4552} {"train_loss": -26.708160400390625, "global_step": 377837, "epoch": 4552} {"train_loss": -26.292972564697266, "global_step": 377838, "epoch": 4552} {"train_loss": -26.43597412109375, "global_step": 377839, "epoch": 4552} {"train_loss": -26.557525634765625, "global_step": 377840, "epoch": 4552} {"train_loss": -26.774169921875, "global_step": 377841, "epoch": 4552} {"train_loss": -26.8872013092041, "global_step": 377842, "epoch": 4552} {"train_loss": -26.482519149780273, "global_step": 377843, "epoch": 4552} {"train_loss": -26.66691017150879, "global_step": 377844, "epoch": 4552} {"train_loss": -26.60694694519043, "global_step": 377845, "epoch": 4552} {"train_loss": -26.472009658813477, "global_step": 377846, "epoch": 4552} {"train_loss": -26.671560287475586, "global_step": 377847, "epoch": 4552} {"train_loss": -26.58111572265625, "global_step": 377848, "epoch": 4552} {"train_loss": -26.585346221923828, "global_step": 377849, "epoch": 4552} {"train_loss": -26.36750602722168, "global_step": 377850, "epoch": 4552} {"train_loss": -26.15949058532715, "global_step": 377851, "epoch": 4552} {"train_loss": -26.799625396728516, "global_step": 377852, "epoch": 4552} {"train_loss": -26.800764083862305, "global_step": 377853, "epoch": 4552} {"train_loss": -26.249496459960938, "global_step": 377854, "epoch": 4552} {"train_loss": -26.572214126586914, "global_step": 377855, "epoch": 4552} {"train_loss": -26.774301528930664, "global_step": 377856, "epoch": 4552} {"train_loss": -26.34403419494629, "global_step": 377857, "epoch": 4552} {"train_loss": -26.048547744750977, "global_step": 377858, "epoch": 4552} {"train_loss": -26.325910568237305, "global_step": 377859, "epoch": 4552} {"train_loss": -26.18596839904785, "global_step": 377860, "epoch": 4552} {"train_loss": -26.661386489868164, "global_step": 377861, "epoch": 4552} {"train_loss": -26.429996490478516, "global_step": 377862, "epoch": 4552} {"train_loss": -26.387653350830078, "global_step": 377863, "epoch": 4552} {"train_loss": -25.834875106811523, "global_step": 377864, "epoch": 4552} {"train_loss": -26.424671173095703, "global_step": 377865, "epoch": 4552} {"train_loss": -26.4586181640625, "global_step": 377866, "epoch": 4552} {"train_loss": -26.039142608642578, "global_step": 377867, "epoch": 4552} {"train_loss": -25.98733901977539, "global_step": 377868, "epoch": 4552} {"train_loss": -26.0714111328125, "global_step": 377869, "epoch": 4552} {"train_loss": -26.34295082092285, "global_step": 377870, "epoch": 4552} {"train_loss": -26.299530029296875, "global_step": 377871, "epoch": 4552} {"train_loss": -26.67474365234375, "global_step": 377872, "epoch": 4552} {"train_loss": -26.548791885375977, "global_step": 377873, "epoch": 4552} {"train_loss": -26.116962432861328, "global_step": 377874, "epoch": 4552} {"train_loss": -25.96573257446289, "global_step": 377875, "epoch": 4552} {"train_loss": -26.261127471923828, "global_step": 377876, "epoch": 4552} {"train_loss": -26.310699462890625, "global_step": 377877, "epoch": 4552} {"train_loss": -26.3216495513916, "global_step": 377878, "epoch": 4552} {"train_loss": -25.98810386657715, "global_step": 377879, "epoch": 4552} {"train_loss": -26.252822875976562, "global_step": 377880, "epoch": 4552} {"train_loss": -26.408849716186523, "global_step": 377881, "epoch": 4552} {"train_loss": -26.378955841064453, "global_step": 377882, "epoch": 4552} {"train_loss": -26.320648193359375, "global_step": 377883, "epoch": 4552} {"train_loss": -26.333784103393555, "global_step": 377884, "epoch": 4552} {"train_loss": -26.232879638671875, "global_step": 377885, "epoch": 4552} {"train_loss": -26.386703491210938, "global_step": 377886, "epoch": 4552} {"train_loss": -26.170883178710938, "global_step": 377887, "epoch": 4552} {"train_loss": -26.480945587158203, "global_step": 377888, "epoch": 4552} {"train_loss": -26.175384521484375, "global_step": 377889, "epoch": 4552} {"train_loss": -26.36591911315918, "global_step": 377890, "epoch": 4552} {"train_loss": -27.038312911987305, "global_step": 377891, "epoch": 4552} {"train_loss": -26.6528377532959, "global_step": 377892, "epoch": 4552} {"train_loss": -26.62979507446289, "global_step": 377893, "epoch": 4552} {"train_loss": -26.60086441040039, "global_step": 377894, "epoch": 4552} {"train_loss": -26.473251342773438, "global_step": 377895, "epoch": 4552} {"train_loss": -26.586267471313477, "global_step": 377896, "epoch": 4552} {"train_loss": -26.257892608642578, "global_step": 377897, "epoch": 4552} {"train_loss": -26.364343482327747, "global_step": 377898, "epoch": 4552, "val_loss": 6552349.0} {"train_loss": -26.04733657836914, "global_step": 377899, "epoch": 4553} {"train_loss": -26.061262130737305, "global_step": 377900, "epoch": 4553} {"train_loss": -25.865819931030273, "global_step": 377901, "epoch": 4553} {"train_loss": -25.77253532409668, "global_step": 377902, "epoch": 4553} {"train_loss": -26.517200469970703, "global_step": 377903, "epoch": 4553} {"train_loss": -25.76533317565918, "global_step": 377904, "epoch": 4553} {"train_loss": -25.444814682006836, "global_step": 377905, "epoch": 4553} {"train_loss": -25.730060577392578, "global_step": 377906, "epoch": 4553} {"train_loss": -25.966827392578125, "global_step": 377907, "epoch": 4553} {"train_loss": -25.794952392578125, "global_step": 377908, "epoch": 4553} {"train_loss": -26.057788848876953, "global_step": 377909, "epoch": 4553} {"train_loss": -26.121984481811523, "global_step": 377910, "epoch": 4553} {"train_loss": -26.2760066986084, "global_step": 377911, "epoch": 4553} {"train_loss": -25.84897804260254, "global_step": 377912, "epoch": 4553} {"train_loss": -26.388586044311523, "global_step": 377913, "epoch": 4553} {"train_loss": -26.115280151367188, "global_step": 377914, "epoch": 4553} {"train_loss": -26.572065353393555, "global_step": 377915, "epoch": 4553} {"train_loss": -26.050323486328125, "global_step": 377916, "epoch": 4553} {"train_loss": -26.44780921936035, "global_step": 377917, "epoch": 4553} {"train_loss": -25.9077205657959, "global_step": 377918, "epoch": 4553} {"train_loss": -26.31793785095215, "global_step": 377919, "epoch": 4553} {"train_loss": -26.193744659423828, "global_step": 377920, "epoch": 4553} {"train_loss": -26.4617919921875, "global_step": 377921, "epoch": 4553} {"train_loss": -26.222875595092773, "global_step": 377922, "epoch": 4553} {"train_loss": -26.082534790039062, "global_step": 377923, "epoch": 4553} {"train_loss": -26.438373565673828, "global_step": 377924, "epoch": 4553} {"train_loss": -25.97745132446289, "global_step": 377925, "epoch": 4553} {"train_loss": -26.2768611907959, "global_step": 377926, "epoch": 4553} {"train_loss": -26.479516983032227, "global_step": 377927, "epoch": 4553} {"train_loss": -26.57024574279785, "global_step": 377928, "epoch": 4553} {"train_loss": -26.173349380493164, "global_step": 377929, "epoch": 4553} {"train_loss": -26.766281127929688, "global_step": 377930, "epoch": 4553} {"train_loss": -26.40899658203125, "global_step": 377931, "epoch": 4553} {"train_loss": -26.496601104736328, "global_step": 377932, "epoch": 4553} {"train_loss": -26.69378662109375, "global_step": 377933, "epoch": 4553} {"train_loss": -26.30982780456543, "global_step": 377934, "epoch": 4553} {"train_loss": -26.533422470092773, "global_step": 377935, "epoch": 4553} {"train_loss": -26.57842445373535, "global_step": 377936, "epoch": 4553} {"train_loss": -26.643033981323242, "global_step": 377937, "epoch": 4553} {"train_loss": -26.691455841064453, "global_step": 377938, "epoch": 4553} {"train_loss": -26.6251163482666, "global_step": 377939, "epoch": 4553} {"train_loss": -26.597082138061523, "global_step": 377940, "epoch": 4553} {"train_loss": -26.72568130493164, "global_step": 377941, "epoch": 4553} {"train_loss": -26.643606185913086, "global_step": 377942, "epoch": 4553} {"train_loss": -26.51188087463379, "global_step": 377943, "epoch": 4553} {"train_loss": -26.734756469726562, "global_step": 377944, "epoch": 4553} {"train_loss": -26.695789337158203, "global_step": 377945, "epoch": 4553} {"train_loss": -26.043182373046875, "global_step": 377946, "epoch": 4553} {"train_loss": -26.60823631286621, "global_step": 377947, "epoch": 4553} {"train_loss": -25.970678329467773, "global_step": 377948, "epoch": 4553} {"train_loss": -24.55533790588379, "global_step": 377949, "epoch": 4553} {"train_loss": -23.887483596801758, "global_step": 377950, "epoch": 4553} {"train_loss": -24.94793701171875, "global_step": 377951, "epoch": 4553} {"train_loss": -25.562702178955078, "global_step": 377952, "epoch": 4553} {"train_loss": -24.450284957885742, "global_step": 377953, "epoch": 4553} {"train_loss": -24.72853660583496, "global_step": 377954, "epoch": 4553} {"train_loss": -25.103702545166016, "global_step": 377955, "epoch": 4553} {"train_loss": -25.401552200317383, "global_step": 377956, "epoch": 4553} {"train_loss": -25.712522506713867, "global_step": 377957, "epoch": 4553} {"train_loss": -25.59918785095215, "global_step": 377958, "epoch": 4553} {"train_loss": -25.373769760131836, "global_step": 377959, "epoch": 4553} {"train_loss": -25.6551570892334, "global_step": 377960, "epoch": 4553} {"train_loss": -25.500732421875, "global_step": 377961, "epoch": 4553} {"train_loss": -25.53371238708496, "global_step": 377962, "epoch": 4553} {"train_loss": -25.818723678588867, "global_step": 377963, "epoch": 4553} {"train_loss": -25.47735023498535, "global_step": 377964, "epoch": 4553} {"train_loss": -25.7901611328125, "global_step": 377965, "epoch": 4553} {"train_loss": -25.547033309936523, "global_step": 377966, "epoch": 4553} {"train_loss": -25.4824161529541, "global_step": 377967, "epoch": 4553} {"train_loss": -25.856115341186523, "global_step": 377968, "epoch": 4553} {"train_loss": -25.818578720092773, "global_step": 377969, "epoch": 4553} {"train_loss": -26.2271671295166, "global_step": 377970, "epoch": 4553} {"train_loss": -25.82905387878418, "global_step": 377971, "epoch": 4553} {"train_loss": -25.825275421142578, "global_step": 377972, "epoch": 4553} {"train_loss": -25.808002471923828, "global_step": 377973, "epoch": 4553} {"train_loss": -26.159271240234375, "global_step": 377974, "epoch": 4553} {"train_loss": -25.621490478515625, "global_step": 377975, "epoch": 4553} {"train_loss": -26.192367553710938, "global_step": 377976, "epoch": 4553} {"train_loss": -25.941913604736328, "global_step": 377977, "epoch": 4553} {"train_loss": -26.195545196533203, "global_step": 377978, "epoch": 4553} {"train_loss": -26.311437606811523, "global_step": 377979, "epoch": 4553} {"train_loss": -26.213790893554688, "global_step": 377980, "epoch": 4553} {"train_loss": -26.00917494440653, "global_step": 377981, "epoch": 4553, "val_loss": 6603632.5} {"train_loss": -26.146764755249023, "global_step": 377982, "epoch": 4554} {"train_loss": -26.23193359375, "global_step": 377983, "epoch": 4554} {"train_loss": -26.170429229736328, "global_step": 377984, "epoch": 4554} {"train_loss": -25.88075065612793, "global_step": 377985, "epoch": 4554} {"train_loss": -26.54925537109375, "global_step": 377986, "epoch": 4554} {"train_loss": -26.03204345703125, "global_step": 377987, "epoch": 4554} {"train_loss": -26.034595489501953, "global_step": 377988, "epoch": 4554} {"train_loss": -26.433496475219727, "global_step": 377989, "epoch": 4554} {"train_loss": -26.065643310546875, "global_step": 377990, "epoch": 4554} {"train_loss": -26.19877052307129, "global_step": 377991, "epoch": 4554} {"train_loss": -25.914539337158203, "global_step": 377992, "epoch": 4554} {"train_loss": -25.78460121154785, "global_step": 377993, "epoch": 4554} {"train_loss": -26.163360595703125, "global_step": 377994, "epoch": 4554} {"train_loss": -25.978015899658203, "global_step": 377995, "epoch": 4554} {"train_loss": -26.218652725219727, "global_step": 377996, "epoch": 4554} {"train_loss": -26.25092124938965, "global_step": 377997, "epoch": 4554} {"train_loss": -26.114032745361328, "global_step": 377998, "epoch": 4554} {"train_loss": -26.417078018188477, "global_step": 377999, "epoch": 4554} {"train_loss": -26.49753189086914, "global_step": 378000, "epoch": 4554} {"train_loss": -26.505319595336914, "global_step": 378001, "epoch": 4554} {"train_loss": -26.587732315063477, "global_step": 378002, "epoch": 4554} {"train_loss": -26.312265396118164, "global_step": 378003, "epoch": 4554} {"train_loss": -26.081573486328125, "global_step": 378004, "epoch": 4554} {"train_loss": -26.15134048461914, "global_step": 378005, "epoch": 4554} {"train_loss": -26.385290145874023, "global_step": 378006, "epoch": 4554} {"train_loss": -25.866376876831055, "global_step": 378007, "epoch": 4554} {"train_loss": -26.557260513305664, "global_step": 378008, "epoch": 4554} {"train_loss": -26.42209815979004, "global_step": 378009, "epoch": 4554} {"train_loss": -26.35601234436035, "global_step": 378010, "epoch": 4554} {"train_loss": -26.42129898071289, "global_step": 378011, "epoch": 4554} {"train_loss": -26.481658935546875, "global_step": 378012, "epoch": 4554} {"train_loss": -26.324827194213867, "global_step": 378013, "epoch": 4554} {"train_loss": -26.253904342651367, "global_step": 378014, "epoch": 4554} {"train_loss": -26.4436092376709, "global_step": 378015, "epoch": 4554} {"train_loss": -26.036056518554688, "global_step": 378016, "epoch": 4554} {"train_loss": -26.256071090698242, "global_step": 378017, "epoch": 4554} {"train_loss": -26.65091323852539, "global_step": 378018, "epoch": 4554} {"train_loss": -26.884153366088867, "global_step": 378019, "epoch": 4554} {"train_loss": -26.403844833374023, "global_step": 378020, "epoch": 4554} {"train_loss": -26.409894943237305, "global_step": 378021, "epoch": 4554} {"train_loss": -26.453414916992188, "global_step": 378022, "epoch": 4554} {"train_loss": -26.467527389526367, "global_step": 378023, "epoch": 4554} {"train_loss": -26.33271598815918, "global_step": 378024, "epoch": 4554} {"train_loss": -26.715940475463867, "global_step": 378025, "epoch": 4554} {"train_loss": -26.34266471862793, "global_step": 378026, "epoch": 4554} {"train_loss": -26.4820499420166, "global_step": 378027, "epoch": 4554} {"train_loss": -26.359785079956055, "global_step": 378028, "epoch": 4554} {"train_loss": -26.325332641601562, "global_step": 378029, "epoch": 4554} {"train_loss": -26.138696670532227, "global_step": 378030, "epoch": 4554} {"train_loss": -26.42646598815918, "global_step": 378031, "epoch": 4554} {"train_loss": -26.553430557250977, "global_step": 378032, "epoch": 4554} {"train_loss": -26.461095809936523, "global_step": 378033, "epoch": 4554} {"train_loss": -26.4581241607666, "global_step": 378034, "epoch": 4554} {"train_loss": -26.65154457092285, "global_step": 378035, "epoch": 4554} {"train_loss": -26.326004028320312, "global_step": 378036, "epoch": 4554} {"train_loss": -26.468372344970703, "global_step": 378037, "epoch": 4554} {"train_loss": -26.559799194335938, "global_step": 378038, "epoch": 4554} {"train_loss": -26.36823844909668, "global_step": 378039, "epoch": 4554} {"train_loss": -26.51946449279785, "global_step": 378040, "epoch": 4554} {"train_loss": -26.6317195892334, "global_step": 378041, "epoch": 4554} {"train_loss": -26.222333908081055, "global_step": 378042, "epoch": 4554} {"train_loss": -26.489551544189453, "global_step": 378043, "epoch": 4554} {"train_loss": -26.82080078125, "global_step": 378044, "epoch": 4554} {"train_loss": -26.427541732788086, "global_step": 378045, "epoch": 4554} {"train_loss": -26.317914962768555, "global_step": 378046, "epoch": 4554} {"train_loss": -26.766942977905273, "global_step": 378047, "epoch": 4554} {"train_loss": -26.595609664916992, "global_step": 378048, "epoch": 4554} {"train_loss": -26.451171875, "global_step": 378049, "epoch": 4554} {"train_loss": -26.629236221313477, "global_step": 378050, "epoch": 4554} {"train_loss": -26.327224731445312, "global_step": 378051, "epoch": 4554} {"train_loss": -26.54888916015625, "global_step": 378052, "epoch": 4554} {"train_loss": -26.732746124267578, "global_step": 378053, "epoch": 4554} {"train_loss": -26.5090389251709, "global_step": 378054, "epoch": 4554} {"train_loss": -26.837879180908203, "global_step": 378055, "epoch": 4554} {"train_loss": -26.433195114135742, "global_step": 378056, "epoch": 4554} {"train_loss": -26.512113571166992, "global_step": 378057, "epoch": 4554} {"train_loss": -26.4680233001709, "global_step": 378058, "epoch": 4554} {"train_loss": -26.78486442565918, "global_step": 378059, "epoch": 4554} {"train_loss": -26.45121192932129, "global_step": 378060, "epoch": 4554} {"train_loss": -26.967267990112305, "global_step": 378061, "epoch": 4554} {"train_loss": -26.476903915405273, "global_step": 378062, "epoch": 4554} {"train_loss": -26.90185546875, "global_step": 378063, "epoch": 4554} {"train_loss": -26.4057628677552, "global_step": 378064, "epoch": 4554, "val_loss": 6637311.0} {"train_loss": -25.648468017578125, "global_step": 378065, "epoch": 4555} {"train_loss": -26.183002471923828, "global_step": 378066, "epoch": 4555} {"train_loss": -25.54426383972168, "global_step": 378067, "epoch": 4555} {"train_loss": -25.545263290405273, "global_step": 378068, "epoch": 4555} {"train_loss": -26.01698875427246, "global_step": 378069, "epoch": 4555} {"train_loss": -25.63142967224121, "global_step": 378070, "epoch": 4555} {"train_loss": -26.05999755859375, "global_step": 378071, "epoch": 4555} {"train_loss": -25.419252395629883, "global_step": 378072, "epoch": 4555} {"train_loss": -26.402271270751953, "global_step": 378073, "epoch": 4555} {"train_loss": -25.788776397705078, "global_step": 378074, "epoch": 4555} {"train_loss": -26.349151611328125, "global_step": 378075, "epoch": 4555} {"train_loss": -26.530176162719727, "global_step": 378076, "epoch": 4555} {"train_loss": -26.15357780456543, "global_step": 378077, "epoch": 4555} {"train_loss": -25.936994552612305, "global_step": 378078, "epoch": 4555} {"train_loss": -25.834613800048828, "global_step": 378079, "epoch": 4555} {"train_loss": -26.0876522064209, "global_step": 378080, "epoch": 4555} {"train_loss": -26.194665908813477, "global_step": 378081, "epoch": 4555} {"train_loss": -26.368322372436523, "global_step": 378082, "epoch": 4555} {"train_loss": -26.49921226501465, "global_step": 378083, "epoch": 4555} {"train_loss": -26.146747589111328, "global_step": 378084, "epoch": 4555} {"train_loss": -26.060443878173828, "global_step": 378085, "epoch": 4555} {"train_loss": -25.896387100219727, "global_step": 378086, "epoch": 4555} {"train_loss": -26.5296688079834, "global_step": 378087, "epoch": 4555} {"train_loss": -26.311344146728516, "global_step": 378088, "epoch": 4555} {"train_loss": -26.190296173095703, "global_step": 378089, "epoch": 4555} {"train_loss": -26.23530387878418, "global_step": 378090, "epoch": 4555} {"train_loss": -25.93633460998535, "global_step": 378091, "epoch": 4555} {"train_loss": -26.28314781188965, "global_step": 378092, "epoch": 4555} {"train_loss": -26.22625160217285, "global_step": 378093, "epoch": 4555} {"train_loss": -26.093053817749023, "global_step": 378094, "epoch": 4555} {"train_loss": -26.2661190032959, "global_step": 378095, "epoch": 4555} {"train_loss": -26.529022216796875, "global_step": 378096, "epoch": 4555} {"train_loss": -26.844913482666016, "global_step": 378097, "epoch": 4555} {"train_loss": -26.205799102783203, "global_step": 378098, "epoch": 4555} {"train_loss": -26.133014678955078, "global_step": 378099, "epoch": 4555} {"train_loss": -26.40470314025879, "global_step": 378100, "epoch": 4555} {"train_loss": -26.063873291015625, "global_step": 378101, "epoch": 4555} {"train_loss": -26.517602920532227, "global_step": 378102, "epoch": 4555} {"train_loss": -26.280561447143555, "global_step": 378103, "epoch": 4555} {"train_loss": -26.59419059753418, "global_step": 378104, "epoch": 4555} {"train_loss": -26.608198165893555, "global_step": 378105, "epoch": 4555} {"train_loss": -25.836811065673828, "global_step": 378106, "epoch": 4555} {"train_loss": -26.332284927368164, "global_step": 378107, "epoch": 4555} {"train_loss": -26.43918228149414, "global_step": 378108, "epoch": 4555} {"train_loss": -26.64242935180664, "global_step": 378109, "epoch": 4555} {"train_loss": -26.007293701171875, "global_step": 378110, "epoch": 4555} {"train_loss": -26.305906295776367, "global_step": 378111, "epoch": 4555} {"train_loss": -26.393646240234375, "global_step": 378112, "epoch": 4555} {"train_loss": -26.491992950439453, "global_step": 378113, "epoch": 4555} {"train_loss": -26.90266990661621, "global_step": 378114, "epoch": 4555} {"train_loss": -26.579065322875977, "global_step": 378115, "epoch": 4555} {"train_loss": -26.683929443359375, "global_step": 378116, "epoch": 4555} {"train_loss": -26.416494369506836, "global_step": 378117, "epoch": 4555} {"train_loss": -26.38385581970215, "global_step": 378118, "epoch": 4555} {"train_loss": -26.509521484375, "global_step": 378119, "epoch": 4555} {"train_loss": -26.5914306640625, "global_step": 378120, "epoch": 4555} {"train_loss": -26.649921417236328, "global_step": 378121, "epoch": 4555} {"train_loss": -26.305038452148438, "global_step": 378122, "epoch": 4555} {"train_loss": -26.277719497680664, "global_step": 378123, "epoch": 4555} {"train_loss": -26.540740966796875, "global_step": 378124, "epoch": 4555} {"train_loss": -26.660877227783203, "global_step": 378125, "epoch": 4555} {"train_loss": -26.46640968322754, "global_step": 378126, "epoch": 4555} {"train_loss": -26.59320640563965, "global_step": 378127, "epoch": 4555} {"train_loss": -26.3118896484375, "global_step": 378128, "epoch": 4555} {"train_loss": -26.47578239440918, "global_step": 378129, "epoch": 4555} {"train_loss": -26.642126083374023, "global_step": 378130, "epoch": 4555} {"train_loss": -26.482629776000977, "global_step": 378131, "epoch": 4555} {"train_loss": -26.34272575378418, "global_step": 378132, "epoch": 4555} {"train_loss": -26.52656364440918, "global_step": 378133, "epoch": 4555} {"train_loss": -26.545154571533203, "global_step": 378134, "epoch": 4555} {"train_loss": -26.607959747314453, "global_step": 378135, "epoch": 4555} {"train_loss": -26.21161460876465, "global_step": 378136, "epoch": 4555} {"train_loss": -26.642852783203125, "global_step": 378137, "epoch": 4555} {"train_loss": -26.64569664001465, "global_step": 378138, "epoch": 4555} {"train_loss": -26.639118194580078, "global_step": 378139, "epoch": 4555} {"train_loss": -26.299911499023438, "global_step": 378140, "epoch": 4555} {"train_loss": -26.52113151550293, "global_step": 378141, "epoch": 4555} {"train_loss": -26.705175399780273, "global_step": 378142, "epoch": 4555} {"train_loss": -26.40195655822754, "global_step": 378143, "epoch": 4555} {"train_loss": -26.763818740844727, "global_step": 378144, "epoch": 4555} {"train_loss": -26.23833656311035, "global_step": 378145, "epoch": 4555} {"train_loss": -26.601003646850586, "global_step": 378146, "epoch": 4555} {"train_loss": -26.333648245018647, "global_step": 378147, "epoch": 4555, "val_loss": 6662364.0} {"train_loss": -26.357858657836914, "global_step": 378148, "epoch": 4556} {"train_loss": -25.81569480895996, "global_step": 378149, "epoch": 4556} {"train_loss": -26.488290786743164, "global_step": 378150, "epoch": 4556} {"train_loss": -26.007843017578125, "global_step": 378151, "epoch": 4556} {"train_loss": -25.843170166015625, "global_step": 378152, "epoch": 4556} {"train_loss": -26.3360538482666, "global_step": 378153, "epoch": 4556} {"train_loss": -26.49224853515625, "global_step": 378154, "epoch": 4556} {"train_loss": -26.39899253845215, "global_step": 378155, "epoch": 4556} {"train_loss": -26.128326416015625, "global_step": 378156, "epoch": 4556} {"train_loss": -26.328107833862305, "global_step": 378157, "epoch": 4556} {"train_loss": -26.397857666015625, "global_step": 378158, "epoch": 4556} {"train_loss": -26.09441566467285, "global_step": 378159, "epoch": 4556} {"train_loss": -26.3587646484375, "global_step": 378160, "epoch": 4556} {"train_loss": -26.3698673248291, "global_step": 378161, "epoch": 4556} {"train_loss": -26.54196548461914, "global_step": 378162, "epoch": 4556} {"train_loss": -26.35601806640625, "global_step": 378163, "epoch": 4556} {"train_loss": -26.518484115600586, "global_step": 378164, "epoch": 4556} {"train_loss": -26.53858757019043, "global_step": 378165, "epoch": 4556} {"train_loss": -26.57916831970215, "global_step": 378166, "epoch": 4556} {"train_loss": -26.101028442382812, "global_step": 378167, "epoch": 4556} {"train_loss": -26.629003524780273, "global_step": 378168, "epoch": 4556} {"train_loss": -26.558643341064453, "global_step": 378169, "epoch": 4556} {"train_loss": -26.323623657226562, "global_step": 378170, "epoch": 4556} {"train_loss": -26.25593376159668, "global_step": 378171, "epoch": 4556} {"train_loss": -26.346515655517578, "global_step": 378172, "epoch": 4556} {"train_loss": -26.374765396118164, "global_step": 378173, "epoch": 4556} {"train_loss": -26.273212432861328, "global_step": 378174, "epoch": 4556} {"train_loss": -26.461252212524414, "global_step": 378175, "epoch": 4556} {"train_loss": -26.500608444213867, "global_step": 378176, "epoch": 4556} {"train_loss": -26.2347354888916, "global_step": 378177, "epoch": 4556} {"train_loss": -26.44302749633789, "global_step": 378178, "epoch": 4556} {"train_loss": -25.77375602722168, "global_step": 378179, "epoch": 4556} {"train_loss": -25.8157901763916, "global_step": 378180, "epoch": 4556} {"train_loss": -25.735692977905273, "global_step": 378181, "epoch": 4556} {"train_loss": -26.017902374267578, "global_step": 378182, "epoch": 4556} {"train_loss": -26.489700317382812, "global_step": 378183, "epoch": 4556} {"train_loss": -25.047739028930664, "global_step": 378184, "epoch": 4556} {"train_loss": -26.014942169189453, "global_step": 378185, "epoch": 4556} {"train_loss": -25.960784912109375, "global_step": 378186, "epoch": 4556} {"train_loss": -25.789682388305664, "global_step": 378187, "epoch": 4556} {"train_loss": -25.927261352539062, "global_step": 378188, "epoch": 4556} {"train_loss": -26.113752365112305, "global_step": 378189, "epoch": 4556} {"train_loss": -25.94278907775879, "global_step": 378190, "epoch": 4556} {"train_loss": -26.511510848999023, "global_step": 378191, "epoch": 4556} {"train_loss": -25.965320587158203, "global_step": 378192, "epoch": 4556} {"train_loss": -26.430618286132812, "global_step": 378193, "epoch": 4556} {"train_loss": -26.21711540222168, "global_step": 378194, "epoch": 4556} {"train_loss": -26.161970138549805, "global_step": 378195, "epoch": 4556} {"train_loss": -26.244220733642578, "global_step": 378196, "epoch": 4556} {"train_loss": -26.337799072265625, "global_step": 378197, "epoch": 4556} {"train_loss": -26.244003295898438, "global_step": 378198, "epoch": 4556} {"train_loss": -26.18527603149414, "global_step": 378199, "epoch": 4556} {"train_loss": -26.245101928710938, "global_step": 378200, "epoch": 4556} {"train_loss": -26.58735466003418, "global_step": 378201, "epoch": 4556} {"train_loss": -26.4438533782959, "global_step": 378202, "epoch": 4556} {"train_loss": -26.071725845336914, "global_step": 378203, "epoch": 4556} {"train_loss": -26.151403427124023, "global_step": 378204, "epoch": 4556} {"train_loss": -26.537296295166016, "global_step": 378205, "epoch": 4556} {"train_loss": -26.14240074157715, "global_step": 378206, "epoch": 4556} {"train_loss": -26.66131019592285, "global_step": 378207, "epoch": 4556} {"train_loss": -26.2414493560791, "global_step": 378208, "epoch": 4556} {"train_loss": -26.175016403198242, "global_step": 378209, "epoch": 4556} {"train_loss": -26.198856353759766, "global_step": 378210, "epoch": 4556} {"train_loss": -26.184850692749023, "global_step": 378211, "epoch": 4556} {"train_loss": -26.2755069732666, "global_step": 378212, "epoch": 4556} {"train_loss": -26.42487144470215, "global_step": 378213, "epoch": 4556} {"train_loss": -26.517724990844727, "global_step": 378214, "epoch": 4556} {"train_loss": -26.552417755126953, "global_step": 378215, "epoch": 4556} {"train_loss": -26.261077880859375, "global_step": 378216, "epoch": 4556} {"train_loss": -26.60992431640625, "global_step": 378217, "epoch": 4556} {"train_loss": -26.546894073486328, "global_step": 378218, "epoch": 4556} {"train_loss": -26.33210563659668, "global_step": 378219, "epoch": 4556} {"train_loss": -26.36371421813965, "global_step": 378220, "epoch": 4556} {"train_loss": -26.263629913330078, "global_step": 378221, "epoch": 4556} {"train_loss": -26.365280151367188, "global_step": 378222, "epoch": 4556} {"train_loss": -26.52680778503418, "global_step": 378223, "epoch": 4556} {"train_loss": -26.43250846862793, "global_step": 378224, "epoch": 4556} {"train_loss": -26.633258819580078, "global_step": 378225, "epoch": 4556} {"train_loss": -26.548025131225586, "global_step": 378226, "epoch": 4556} {"train_loss": -26.47865104675293, "global_step": 378227, "epoch": 4556} {"train_loss": -26.417932510375977, "global_step": 378228, "epoch": 4556} {"train_loss": -26.348590850830078, "global_step": 378229, "epoch": 4556} {"train_loss": -26.27037873325578, "global_step": 378230, "epoch": 4556, "val_loss": 6536197.0} {"train_loss": -26.025266647338867, "global_step": 378231, "epoch": 4557} {"train_loss": -26.164270401000977, "global_step": 378232, "epoch": 4557} {"train_loss": -25.27193832397461, "global_step": 378233, "epoch": 4557} {"train_loss": -25.997455596923828, "global_step": 378234, "epoch": 4557} {"train_loss": -26.269433975219727, "global_step": 378235, "epoch": 4557} {"train_loss": -26.3234920501709, "global_step": 378236, "epoch": 4557} {"train_loss": -26.14100456237793, "global_step": 378237, "epoch": 4557} {"train_loss": -26.1627254486084, "global_step": 378238, "epoch": 4557} {"train_loss": -26.275848388671875, "global_step": 378239, "epoch": 4557} {"train_loss": -26.46198081970215, "global_step": 378240, "epoch": 4557} {"train_loss": -26.53679847717285, "global_step": 378241, "epoch": 4557} {"train_loss": -26.526111602783203, "global_step": 378242, "epoch": 4557} {"train_loss": -26.255701065063477, "global_step": 378243, "epoch": 4557} {"train_loss": -26.395593643188477, "global_step": 378244, "epoch": 4557} {"train_loss": -26.412555694580078, "global_step": 378245, "epoch": 4557} {"train_loss": -26.019269943237305, "global_step": 378246, "epoch": 4557} {"train_loss": -26.44019889831543, "global_step": 378247, "epoch": 4557} {"train_loss": -26.232934951782227, "global_step": 378248, "epoch": 4557} {"train_loss": -26.64336585998535, "global_step": 378249, "epoch": 4557} {"train_loss": -26.460590362548828, "global_step": 378250, "epoch": 4557} {"train_loss": -26.191404342651367, "global_step": 378251, "epoch": 4557} {"train_loss": -26.49110221862793, "global_step": 378252, "epoch": 4557} {"train_loss": -26.276264190673828, "global_step": 378253, "epoch": 4557} {"train_loss": -26.6622257232666, "global_step": 378254, "epoch": 4557} {"train_loss": -26.488300323486328, "global_step": 378255, "epoch": 4557} {"train_loss": -26.45722007751465, "global_step": 378256, "epoch": 4557} {"train_loss": -26.7222843170166, "global_step": 378257, "epoch": 4557} {"train_loss": -26.517175674438477, "global_step": 378258, "epoch": 4557} {"train_loss": -26.277551651000977, "global_step": 378259, "epoch": 4557} {"train_loss": -26.535654067993164, "global_step": 378260, "epoch": 4557} {"train_loss": -26.4581241607666, "global_step": 378261, "epoch": 4557} {"train_loss": -26.70413589477539, "global_step": 378262, "epoch": 4557} {"train_loss": -26.400014877319336, "global_step": 378263, "epoch": 4557} {"train_loss": -26.448163986206055, "global_step": 378264, "epoch": 4557} {"train_loss": -26.596296310424805, "global_step": 378265, "epoch": 4557} {"train_loss": -26.744949340820312, "global_step": 378266, "epoch": 4557} {"train_loss": -26.408716201782227, "global_step": 378267, "epoch": 4557} {"train_loss": -26.75197410583496, "global_step": 378268, "epoch": 4557} {"train_loss": -26.343006134033203, "global_step": 378269, "epoch": 4557} {"train_loss": -26.2305850982666, "global_step": 378270, "epoch": 4557} {"train_loss": -26.153461456298828, "global_step": 378271, "epoch": 4557} {"train_loss": -26.53809928894043, "global_step": 378272, "epoch": 4557} {"train_loss": -26.074182510375977, "global_step": 378273, "epoch": 4557} {"train_loss": -26.230899810791016, "global_step": 378274, "epoch": 4557} {"train_loss": -26.381742477416992, "global_step": 378275, "epoch": 4557} {"train_loss": -26.034759521484375, "global_step": 378276, "epoch": 4557} {"train_loss": -26.338659286499023, "global_step": 378277, "epoch": 4557} {"train_loss": -26.588977813720703, "global_step": 378278, "epoch": 4557} {"train_loss": -26.374094009399414, "global_step": 378279, "epoch": 4557} {"train_loss": -26.101613998413086, "global_step": 378280, "epoch": 4557} {"train_loss": -25.50288963317871, "global_step": 378281, "epoch": 4557} {"train_loss": -26.102170944213867, "global_step": 378282, "epoch": 4557} {"train_loss": -26.946191787719727, "global_step": 378283, "epoch": 4557} {"train_loss": -26.155319213867188, "global_step": 378284, "epoch": 4557} {"train_loss": -25.800933837890625, "global_step": 378285, "epoch": 4557} {"train_loss": -26.79163932800293, "global_step": 378286, "epoch": 4557} {"train_loss": -25.760726928710938, "global_step": 378287, "epoch": 4557} {"train_loss": -25.77545166015625, "global_step": 378288, "epoch": 4557} {"train_loss": -26.373260498046875, "global_step": 378289, "epoch": 4557} {"train_loss": -26.349292755126953, "global_step": 378290, "epoch": 4557} {"train_loss": -26.2747745513916, "global_step": 378291, "epoch": 4557} {"train_loss": -26.148420333862305, "global_step": 378292, "epoch": 4557} {"train_loss": -26.69459342956543, "global_step": 378293, "epoch": 4557} {"train_loss": -26.30792236328125, "global_step": 378294, "epoch": 4557} {"train_loss": -26.4704532623291, "global_step": 378295, "epoch": 4557} {"train_loss": -26.47075843811035, "global_step": 378296, "epoch": 4557} {"train_loss": -26.301227569580078, "global_step": 378297, "epoch": 4557} {"train_loss": -26.250513076782227, "global_step": 378298, "epoch": 4557} {"train_loss": -26.456329345703125, "global_step": 378299, "epoch": 4557} {"train_loss": -26.1791934967041, "global_step": 378300, "epoch": 4557} {"train_loss": -26.332181930541992, "global_step": 378301, "epoch": 4557} {"train_loss": -26.336902618408203, "global_step": 378302, "epoch": 4557} {"train_loss": -26.67236328125, "global_step": 378303, "epoch": 4557} {"train_loss": -26.398900985717773, "global_step": 378304, "epoch": 4557} {"train_loss": -26.149173736572266, "global_step": 378305, "epoch": 4557} {"train_loss": -26.386396408081055, "global_step": 378306, "epoch": 4557} {"train_loss": -26.584640502929688, "global_step": 378307, "epoch": 4557} {"train_loss": -26.061355590820312, "global_step": 378308, "epoch": 4557} {"train_loss": -26.536243438720703, "global_step": 378309, "epoch": 4557} {"train_loss": -26.038549423217773, "global_step": 378310, "epoch": 4557} {"train_loss": -26.035003662109375, "global_step": 378311, "epoch": 4557} {"train_loss": -26.417993545532227, "global_step": 378312, "epoch": 4557} {"train_loss": -26.30979043891631, "global_step": 378313, "epoch": 4557, "val_loss": 6528349.5} {"train_loss": -24.159778594970703, "global_step": 378314, "epoch": 4558} {"train_loss": -25.345279693603516, "global_step": 378315, "epoch": 4558} {"train_loss": -24.987775802612305, "global_step": 378316, "epoch": 4558} {"train_loss": -24.742467880249023, "global_step": 378317, "epoch": 4558} {"train_loss": -25.534202575683594, "global_step": 378318, "epoch": 4558} {"train_loss": -25.31641960144043, "global_step": 378319, "epoch": 4558} {"train_loss": -25.477262496948242, "global_step": 378320, "epoch": 4558} {"train_loss": -25.61049461364746, "global_step": 378321, "epoch": 4558} {"train_loss": -25.445220947265625, "global_step": 378322, "epoch": 4558} {"train_loss": -25.983274459838867, "global_step": 378323, "epoch": 4558} {"train_loss": -25.7105655670166, "global_step": 378324, "epoch": 4558} {"train_loss": -25.647871017456055, "global_step": 378325, "epoch": 4558} {"train_loss": -25.579782485961914, "global_step": 378326, "epoch": 4558} {"train_loss": -25.91595458984375, "global_step": 378327, "epoch": 4558} {"train_loss": -25.3090877532959, "global_step": 378328, "epoch": 4558} {"train_loss": -25.866931915283203, "global_step": 378329, "epoch": 4558} {"train_loss": -25.56618309020996, "global_step": 378330, "epoch": 4558} {"train_loss": -25.736913681030273, "global_step": 378331, "epoch": 4558} {"train_loss": -25.769514083862305, "global_step": 378332, "epoch": 4558} {"train_loss": -26.2663631439209, "global_step": 378333, "epoch": 4558} {"train_loss": -26.28571128845215, "global_step": 378334, "epoch": 4558} {"train_loss": -26.201648712158203, "global_step": 378335, "epoch": 4558} {"train_loss": -25.940927505493164, "global_step": 378336, "epoch": 4558} {"train_loss": -26.064767837524414, "global_step": 378337, "epoch": 4558} {"train_loss": -26.104644775390625, "global_step": 378338, "epoch": 4558} {"train_loss": -26.096227645874023, "global_step": 378339, "epoch": 4558} {"train_loss": -25.828372955322266, "global_step": 378340, "epoch": 4558} {"train_loss": -26.14397621154785, "global_step": 378341, "epoch": 4558} {"train_loss": -26.047061920166016, "global_step": 378342, "epoch": 4558} {"train_loss": -26.493932723999023, "global_step": 378343, "epoch": 4558} {"train_loss": -26.506153106689453, "global_step": 378344, "epoch": 4558} {"train_loss": -26.065876007080078, "global_step": 378345, "epoch": 4558} {"train_loss": -26.174020767211914, "global_step": 378346, "epoch": 4558} {"train_loss": -26.385955810546875, "global_step": 378347, "epoch": 4558} {"train_loss": -26.184967041015625, "global_step": 378348, "epoch": 4558} {"train_loss": -26.23433494567871, "global_step": 378349, "epoch": 4558} {"train_loss": -26.223052978515625, "global_step": 378350, "epoch": 4558} {"train_loss": -26.587543487548828, "global_step": 378351, "epoch": 4558} {"train_loss": -26.507604598999023, "global_step": 378352, "epoch": 4558} {"train_loss": -26.506948471069336, "global_step": 378353, "epoch": 4558} {"train_loss": -26.671661376953125, "global_step": 378354, "epoch": 4558} {"train_loss": -26.63588523864746, "global_step": 378355, "epoch": 4558} {"train_loss": -26.715478897094727, "global_step": 378356, "epoch": 4558} {"train_loss": -26.40923500061035, "global_step": 378357, "epoch": 4558} {"train_loss": -26.172897338867188, "global_step": 378358, "epoch": 4558} {"train_loss": -26.73378562927246, "global_step": 378359, "epoch": 4558} {"train_loss": -26.134485244750977, "global_step": 378360, "epoch": 4558} {"train_loss": -26.67776870727539, "global_step": 378361, "epoch": 4558} {"train_loss": -26.54729652404785, "global_step": 378362, "epoch": 4558} {"train_loss": -26.722883224487305, "global_step": 378363, "epoch": 4558} {"train_loss": -26.615631103515625, "global_step": 378364, "epoch": 4558} {"train_loss": -26.7521915435791, "global_step": 378365, "epoch": 4558} {"train_loss": -26.5784854888916, "global_step": 378366, "epoch": 4558} {"train_loss": -26.680694580078125, "global_step": 378367, "epoch": 4558} {"train_loss": -26.5964298248291, "global_step": 378368, "epoch": 4558} {"train_loss": -26.686254501342773, "global_step": 378369, "epoch": 4558} {"train_loss": -26.417200088500977, "global_step": 378370, "epoch": 4558} {"train_loss": -26.55816650390625, "global_step": 378371, "epoch": 4558} {"train_loss": -26.812870025634766, "global_step": 378372, "epoch": 4558} {"train_loss": -26.373144149780273, "global_step": 378373, "epoch": 4558} {"train_loss": -26.599191665649414, "global_step": 378374, "epoch": 4558} {"train_loss": -26.326536178588867, "global_step": 378375, "epoch": 4558} {"train_loss": -26.57234001159668, "global_step": 378376, "epoch": 4558} {"train_loss": -26.0775146484375, "global_step": 378377, "epoch": 4558} {"train_loss": -25.522602081298828, "global_step": 378378, "epoch": 4558} {"train_loss": -24.61860466003418, "global_step": 378379, "epoch": 4558} {"train_loss": -25.428922653198242, "global_step": 378380, "epoch": 4558} {"train_loss": -26.444238662719727, "global_step": 378381, "epoch": 4558} {"train_loss": -26.131397247314453, "global_step": 378382, "epoch": 4558} {"train_loss": -25.464033126831055, "global_step": 378383, "epoch": 4558} {"train_loss": -26.0498046875, "global_step": 378384, "epoch": 4558} {"train_loss": -26.249784469604492, "global_step": 378385, "epoch": 4558} {"train_loss": -25.32386016845703, "global_step": 378386, "epoch": 4558} {"train_loss": -26.090137481689453, "global_step": 378387, "epoch": 4558} {"train_loss": -26.403614044189453, "global_step": 378388, "epoch": 4558} {"train_loss": -26.02546501159668, "global_step": 378389, "epoch": 4558} {"train_loss": -26.52728843688965, "global_step": 378390, "epoch": 4558} {"train_loss": -26.12714958190918, "global_step": 378391, "epoch": 4558} {"train_loss": -26.190458297729492, "global_step": 378392, "epoch": 4558} {"train_loss": -26.53191566467285, "global_step": 378393, "epoch": 4558} {"train_loss": -26.149429321289062, "global_step": 378394, "epoch": 4558} {"train_loss": -26.062910079956055, "global_step": 378395, "epoch": 4558} {"train_loss": -26.10397513515978, "global_step": 378396, "epoch": 4558, "val_loss": 6565244.0} {"train_loss": -25.519224166870117, "global_step": 378397, "epoch": 4559} {"train_loss": -25.931781768798828, "global_step": 378398, "epoch": 4559} {"train_loss": -25.817541122436523, "global_step": 378399, "epoch": 4559} {"train_loss": -25.82028579711914, "global_step": 378400, "epoch": 4559} {"train_loss": -25.663816452026367, "global_step": 378401, "epoch": 4559} {"train_loss": -25.82244873046875, "global_step": 378402, "epoch": 4559} {"train_loss": -26.070270538330078, "global_step": 378403, "epoch": 4559} {"train_loss": -26.095945358276367, "global_step": 378404, "epoch": 4559} {"train_loss": -25.849811553955078, "global_step": 378405, "epoch": 4559} {"train_loss": -26.099811553955078, "global_step": 378406, "epoch": 4559} {"train_loss": -25.92496681213379, "global_step": 378407, "epoch": 4559} {"train_loss": -26.048236846923828, "global_step": 378408, "epoch": 4559} {"train_loss": -26.192487716674805, "global_step": 378409, "epoch": 4559} {"train_loss": -26.076379776000977, "global_step": 378410, "epoch": 4559} {"train_loss": -26.267230987548828, "global_step": 378411, "epoch": 4559} {"train_loss": -26.442102432250977, "global_step": 378412, "epoch": 4559} {"train_loss": -26.610809326171875, "global_step": 378413, "epoch": 4559} {"train_loss": -26.858678817749023, "global_step": 378414, "epoch": 4559} {"train_loss": -26.501081466674805, "global_step": 378415, "epoch": 4559} {"train_loss": -26.4377384185791, "global_step": 378416, "epoch": 4559} {"train_loss": -26.399784088134766, "global_step": 378417, "epoch": 4559} {"train_loss": -26.343097686767578, "global_step": 378418, "epoch": 4559} {"train_loss": -26.34872817993164, "global_step": 378419, "epoch": 4559} {"train_loss": -25.958454132080078, "global_step": 378420, "epoch": 4559} {"train_loss": -26.285886764526367, "global_step": 378421, "epoch": 4559} {"train_loss": -26.615137100219727, "global_step": 378422, "epoch": 4559} {"train_loss": -26.796552658081055, "global_step": 378423, "epoch": 4559} {"train_loss": -26.357715606689453, "global_step": 378424, "epoch": 4559} {"train_loss": -26.321979522705078, "global_step": 378425, "epoch": 4559} {"train_loss": -26.675464630126953, "global_step": 378426, "epoch": 4559} {"train_loss": -26.673044204711914, "global_step": 378427, "epoch": 4559} {"train_loss": -26.259845733642578, "global_step": 378428, "epoch": 4559} {"train_loss": -26.465930938720703, "global_step": 378429, "epoch": 4559} {"train_loss": -26.547998428344727, "global_step": 378430, "epoch": 4559} {"train_loss": -26.62543296813965, "global_step": 378431, "epoch": 4559} {"train_loss": -26.72309684753418, "global_step": 378432, "epoch": 4559} {"train_loss": -26.401655197143555, "global_step": 378433, "epoch": 4559} {"train_loss": -26.653736114501953, "global_step": 378434, "epoch": 4559} {"train_loss": -26.795974731445312, "global_step": 378435, "epoch": 4559} {"train_loss": -26.520246505737305, "global_step": 378436, "epoch": 4559} {"train_loss": -26.565155029296875, "global_step": 378437, "epoch": 4559} {"train_loss": -26.383508682250977, "global_step": 378438, "epoch": 4559} {"train_loss": -26.403100967407227, "global_step": 378439, "epoch": 4559} {"train_loss": -26.612573623657227, "global_step": 378440, "epoch": 4559} {"train_loss": -26.60984230041504, "global_step": 378441, "epoch": 4559} {"train_loss": -26.69463539123535, "global_step": 378442, "epoch": 4559} {"train_loss": -26.885135650634766, "global_step": 378443, "epoch": 4559} {"train_loss": -26.635894775390625, "global_step": 378444, "epoch": 4559} {"train_loss": -26.821496963500977, "global_step": 378445, "epoch": 4559} {"train_loss": -26.506513595581055, "global_step": 378446, "epoch": 4559} {"train_loss": -26.6781063079834, "global_step": 378447, "epoch": 4559} {"train_loss": -26.328262329101562, "global_step": 378448, "epoch": 4559} {"train_loss": -26.573455810546875, "global_step": 378449, "epoch": 4559} {"train_loss": -26.658735275268555, "global_step": 378450, "epoch": 4559} {"train_loss": -26.5771541595459, "global_step": 378451, "epoch": 4559} {"train_loss": -26.669055938720703, "global_step": 378452, "epoch": 4559} {"train_loss": -26.457250595092773, "global_step": 378453, "epoch": 4559} {"train_loss": -26.385761260986328, "global_step": 378454, "epoch": 4559} {"train_loss": -26.549976348876953, "global_step": 378455, "epoch": 4559} {"train_loss": -26.52304458618164, "global_step": 378456, "epoch": 4559} {"train_loss": -26.74647331237793, "global_step": 378457, "epoch": 4559} {"train_loss": -26.843000411987305, "global_step": 378458, "epoch": 4559} {"train_loss": -26.309621810913086, "global_step": 378459, "epoch": 4559} {"train_loss": -26.170324325561523, "global_step": 378460, "epoch": 4559} {"train_loss": -26.419836044311523, "global_step": 378461, "epoch": 4559} {"train_loss": -26.731489181518555, "global_step": 378462, "epoch": 4559} {"train_loss": -26.733978271484375, "global_step": 378463, "epoch": 4559} {"train_loss": -26.539560317993164, "global_step": 378464, "epoch": 4559} {"train_loss": -26.367353439331055, "global_step": 378465, "epoch": 4559} {"train_loss": -26.461088180541992, "global_step": 378466, "epoch": 4559} {"train_loss": -26.508289337158203, "global_step": 378467, "epoch": 4559} {"train_loss": -26.40431022644043, "global_step": 378468, "epoch": 4559} {"train_loss": -26.311071395874023, "global_step": 378469, "epoch": 4559} {"train_loss": -26.25080680847168, "global_step": 378470, "epoch": 4559} {"train_loss": -26.161895751953125, "global_step": 378471, "epoch": 4559} {"train_loss": -26.71563148498535, "global_step": 378472, "epoch": 4559} {"train_loss": -26.586719512939453, "global_step": 378473, "epoch": 4559} {"train_loss": -26.402942657470703, "global_step": 378474, "epoch": 4559} {"train_loss": -25.93342399597168, "global_step": 378475, "epoch": 4559} {"train_loss": -26.10275650024414, "global_step": 378476, "epoch": 4559} {"train_loss": -26.6715087890625, "global_step": 378477, "epoch": 4559} {"train_loss": -26.3485050201416, "global_step": 378478, "epoch": 4559} {"train_loss": -26.405199395604882, "global_step": 378479, "epoch": 4559, "val_loss": 6616696.0} {"train_loss": -25.94636344909668, "global_step": 378480, "epoch": 4560} {"train_loss": -25.468313217163086, "global_step": 378481, "epoch": 4560} {"train_loss": -25.855031967163086, "global_step": 378482, "epoch": 4560} {"train_loss": -25.98398780822754, "global_step": 378483, "epoch": 4560} {"train_loss": -25.627670288085938, "global_step": 378484, "epoch": 4560} {"train_loss": -25.635116577148438, "global_step": 378485, "epoch": 4560} {"train_loss": -26.515653610229492, "global_step": 378486, "epoch": 4560} {"train_loss": -25.871109008789062, "global_step": 378487, "epoch": 4560} {"train_loss": -26.02764320373535, "global_step": 378488, "epoch": 4560} {"train_loss": -26.055967330932617, "global_step": 378489, "epoch": 4560} {"train_loss": -25.980249404907227, "global_step": 378490, "epoch": 4560} {"train_loss": -26.12461280822754, "global_step": 378491, "epoch": 4560} {"train_loss": -26.528860092163086, "global_step": 378492, "epoch": 4560} {"train_loss": -25.9483585357666, "global_step": 378493, "epoch": 4560} {"train_loss": -26.347089767456055, "global_step": 378494, "epoch": 4560} {"train_loss": -26.257612228393555, "global_step": 378495, "epoch": 4560} {"train_loss": -26.22443962097168, "global_step": 378496, "epoch": 4560} {"train_loss": -26.29901695251465, "global_step": 378497, "epoch": 4560} {"train_loss": -26.16366958618164, "global_step": 378498, "epoch": 4560} {"train_loss": -26.23663902282715, "global_step": 378499, "epoch": 4560} {"train_loss": -26.3499755859375, "global_step": 378500, "epoch": 4560} {"train_loss": -26.1640567779541, "global_step": 378501, "epoch": 4560} {"train_loss": -25.97108268737793, "global_step": 378502, "epoch": 4560} {"train_loss": -26.498870849609375, "global_step": 378503, "epoch": 4560} {"train_loss": -26.108856201171875, "global_step": 378504, "epoch": 4560} {"train_loss": -26.1675968170166, "global_step": 378505, "epoch": 4560} {"train_loss": -26.449487686157227, "global_step": 378506, "epoch": 4560} {"train_loss": -26.092243194580078, "global_step": 378507, "epoch": 4560} {"train_loss": -26.756046295166016, "global_step": 378508, "epoch": 4560} {"train_loss": -26.3477725982666, "global_step": 378509, "epoch": 4560} {"train_loss": -26.256336212158203, "global_step": 378510, "epoch": 4560} {"train_loss": -26.5949764251709, "global_step": 378511, "epoch": 4560} {"train_loss": -26.707990646362305, "global_step": 378512, "epoch": 4560} {"train_loss": -26.30971336364746, "global_step": 378513, "epoch": 4560} {"train_loss": -26.318708419799805, "global_step": 378514, "epoch": 4560} {"train_loss": -26.280014038085938, "global_step": 378515, "epoch": 4560} {"train_loss": -26.76252555847168, "global_step": 378516, "epoch": 4560} {"train_loss": -26.554828643798828, "global_step": 378517, "epoch": 4560} {"train_loss": -26.345197677612305, "global_step": 378518, "epoch": 4560} {"train_loss": -26.41497802734375, "global_step": 378519, "epoch": 4560} {"train_loss": -26.56776237487793, "global_step": 378520, "epoch": 4560} {"train_loss": -26.46734046936035, "global_step": 378521, "epoch": 4560} {"train_loss": -26.945133209228516, "global_step": 378522, "epoch": 4560} {"train_loss": -26.6588077545166, "global_step": 378523, "epoch": 4560} {"train_loss": -26.206714630126953, "global_step": 378524, "epoch": 4560} {"train_loss": -26.680505752563477, "global_step": 378525, "epoch": 4560} {"train_loss": -26.247961044311523, "global_step": 378526, "epoch": 4560} {"train_loss": -26.289203643798828, "global_step": 378527, "epoch": 4560} {"train_loss": -26.595844268798828, "global_step": 378528, "epoch": 4560} {"train_loss": -26.091449737548828, "global_step": 378529, "epoch": 4560} {"train_loss": -26.286893844604492, "global_step": 378530, "epoch": 4560} {"train_loss": -26.655170440673828, "global_step": 378531, "epoch": 4560} {"train_loss": -26.235502243041992, "global_step": 378532, "epoch": 4560} {"train_loss": -26.71759605407715, "global_step": 378533, "epoch": 4560} {"train_loss": -26.3554630279541, "global_step": 378534, "epoch": 4560} {"train_loss": -26.259016036987305, "global_step": 378535, "epoch": 4560} {"train_loss": -26.257919311523438, "global_step": 378536, "epoch": 4560} {"train_loss": -26.364660263061523, "global_step": 378537, "epoch": 4560} {"train_loss": -26.36471939086914, "global_step": 378538, "epoch": 4560} {"train_loss": -25.91155433654785, "global_step": 378539, "epoch": 4560} {"train_loss": -26.58771324157715, "global_step": 378540, "epoch": 4560} {"train_loss": -25.968366622924805, "global_step": 378541, "epoch": 4560} {"train_loss": -26.81802749633789, "global_step": 378542, "epoch": 4560} {"train_loss": -26.526472091674805, "global_step": 378543, "epoch": 4560} {"train_loss": -26.635168075561523, "global_step": 378544, "epoch": 4560} {"train_loss": -26.57734489440918, "global_step": 378545, "epoch": 4560} {"train_loss": -26.54327964782715, "global_step": 378546, "epoch": 4560} {"train_loss": -26.46595573425293, "global_step": 378547, "epoch": 4560} {"train_loss": -26.551910400390625, "global_step": 378548, "epoch": 4560} {"train_loss": -26.38779640197754, "global_step": 378549, "epoch": 4560} {"train_loss": -26.496320724487305, "global_step": 378550, "epoch": 4560} {"train_loss": -26.514057159423828, "global_step": 378551, "epoch": 4560} {"train_loss": -26.185461044311523, "global_step": 378552, "epoch": 4560} {"train_loss": -26.735584259033203, "global_step": 378553, "epoch": 4560} {"train_loss": -26.7305850982666, "global_step": 378554, "epoch": 4560} {"train_loss": -26.329666137695312, "global_step": 378555, "epoch": 4560} {"train_loss": -26.385995864868164, "global_step": 378556, "epoch": 4560} {"train_loss": -26.248580932617188, "global_step": 378557, "epoch": 4560} {"train_loss": -26.552783966064453, "global_step": 378558, "epoch": 4560} {"train_loss": -26.30020523071289, "global_step": 378559, "epoch": 4560} {"train_loss": -26.246295928955078, "global_step": 378560, "epoch": 4560} {"train_loss": -26.36054039001465, "global_step": 378561, "epoch": 4560} {"train_loss": -26.33111243650138, "global_step": 378562, "epoch": 4560, "val_loss": 6656195.0} {"train_loss": -25.25558853149414, "global_step": 378563, "epoch": 4561} {"train_loss": -25.20783805847168, "global_step": 378564, "epoch": 4561} {"train_loss": -24.380603790283203, "global_step": 378565, "epoch": 4561} {"train_loss": -24.979536056518555, "global_step": 378566, "epoch": 4561} {"train_loss": -25.648839950561523, "global_step": 378567, "epoch": 4561} {"train_loss": -24.46649742126465, "global_step": 378568, "epoch": 4561} {"train_loss": -25.615802764892578, "global_step": 378569, "epoch": 4561} {"train_loss": -25.00676918029785, "global_step": 378570, "epoch": 4561} {"train_loss": -25.562028884887695, "global_step": 378571, "epoch": 4561} {"train_loss": -25.79915428161621, "global_step": 378572, "epoch": 4561} {"train_loss": -26.243127822875977, "global_step": 378573, "epoch": 4561} {"train_loss": -25.536680221557617, "global_step": 378574, "epoch": 4561} {"train_loss": -26.098562240600586, "global_step": 378575, "epoch": 4561} {"train_loss": -25.608661651611328, "global_step": 378576, "epoch": 4561} {"train_loss": -25.829511642456055, "global_step": 378577, "epoch": 4561} {"train_loss": -25.68348503112793, "global_step": 378578, "epoch": 4561} {"train_loss": -25.71748924255371, "global_step": 378579, "epoch": 4561} {"train_loss": -25.64533042907715, "global_step": 378580, "epoch": 4561} {"train_loss": -25.6948299407959, "global_step": 378581, "epoch": 4561} {"train_loss": -25.565378189086914, "global_step": 378582, "epoch": 4561} {"train_loss": -25.38539695739746, "global_step": 378583, "epoch": 4561} {"train_loss": -25.694799423217773, "global_step": 378584, "epoch": 4561} {"train_loss": -25.593191146850586, "global_step": 378585, "epoch": 4561} {"train_loss": -25.81024742126465, "global_step": 378586, "epoch": 4561} {"train_loss": -25.973285675048828, "global_step": 378587, "epoch": 4561} {"train_loss": -26.255430221557617, "global_step": 378588, "epoch": 4561} {"train_loss": -26.567163467407227, "global_step": 378589, "epoch": 4561} {"train_loss": -25.66069984436035, "global_step": 378590, "epoch": 4561} {"train_loss": -25.934045791625977, "global_step": 378591, "epoch": 4561} {"train_loss": -25.859867095947266, "global_step": 378592, "epoch": 4561} {"train_loss": -26.277902603149414, "global_step": 378593, "epoch": 4561} {"train_loss": -26.363407135009766, "global_step": 378594, "epoch": 4561} {"train_loss": -26.243505477905273, "global_step": 378595, "epoch": 4561} {"train_loss": -26.55780029296875, "global_step": 378596, "epoch": 4561} {"train_loss": -26.346311569213867, "global_step": 378597, "epoch": 4561} {"train_loss": -26.05387306213379, "global_step": 378598, "epoch": 4561} {"train_loss": -26.336217880249023, "global_step": 378599, "epoch": 4561} {"train_loss": -26.182947158813477, "global_step": 378600, "epoch": 4561} {"train_loss": -26.12912940979004, "global_step": 378601, "epoch": 4561} {"train_loss": -26.553525924682617, "global_step": 378602, "epoch": 4561} {"train_loss": -26.45002555847168, "global_step": 378603, "epoch": 4561} {"train_loss": -26.66437339782715, "global_step": 378604, "epoch": 4561} {"train_loss": -26.661115646362305, "global_step": 378605, "epoch": 4561} {"train_loss": -26.246679306030273, "global_step": 378606, "epoch": 4561} {"train_loss": -26.57184410095215, "global_step": 378607, "epoch": 4561} {"train_loss": -26.31683349609375, "global_step": 378608, "epoch": 4561} {"train_loss": -26.329547882080078, "global_step": 378609, "epoch": 4561} {"train_loss": -26.260135650634766, "global_step": 378610, "epoch": 4561} {"train_loss": -26.50225257873535, "global_step": 378611, "epoch": 4561} {"train_loss": -26.464807510375977, "global_step": 378612, "epoch": 4561} {"train_loss": -26.550933837890625, "global_step": 378613, "epoch": 4561} {"train_loss": -26.25983238220215, "global_step": 378614, "epoch": 4561} {"train_loss": -26.855655670166016, "global_step": 378615, "epoch": 4561} {"train_loss": -26.4036865234375, "global_step": 378616, "epoch": 4561} {"train_loss": -26.188486099243164, "global_step": 378617, "epoch": 4561} {"train_loss": -26.799072265625, "global_step": 378618, "epoch": 4561} {"train_loss": -26.109973907470703, "global_step": 378619, "epoch": 4561} {"train_loss": -26.531248092651367, "global_step": 378620, "epoch": 4561} {"train_loss": -26.53717041015625, "global_step": 378621, "epoch": 4561} {"train_loss": -26.47039222717285, "global_step": 378622, "epoch": 4561} {"train_loss": -26.443639755249023, "global_step": 378623, "epoch": 4561} {"train_loss": -26.417444229125977, "global_step": 378624, "epoch": 4561} {"train_loss": -26.866491317749023, "global_step": 378625, "epoch": 4561} {"train_loss": -26.781970977783203, "global_step": 378626, "epoch": 4561} {"train_loss": -26.70966911315918, "global_step": 378627, "epoch": 4561} {"train_loss": -26.668638229370117, "global_step": 378628, "epoch": 4561} {"train_loss": -26.669189453125, "global_step": 378629, "epoch": 4561} {"train_loss": -26.488454818725586, "global_step": 378630, "epoch": 4561} {"train_loss": -26.738691329956055, "global_step": 378631, "epoch": 4561} {"train_loss": -26.687381744384766, "global_step": 378632, "epoch": 4561} {"train_loss": -26.796833038330078, "global_step": 378633, "epoch": 4561} {"train_loss": -26.717884063720703, "global_step": 378634, "epoch": 4561} {"train_loss": -26.337635040283203, "global_step": 378635, "epoch": 4561} {"train_loss": -26.438817977905273, "global_step": 378636, "epoch": 4561} {"train_loss": -26.388397216796875, "global_step": 378637, "epoch": 4561} {"train_loss": -26.344482421875, "global_step": 378638, "epoch": 4561} {"train_loss": -26.65753173828125, "global_step": 378639, "epoch": 4561} {"train_loss": -26.506275177001953, "global_step": 378640, "epoch": 4561} {"train_loss": -26.58057975769043, "global_step": 378641, "epoch": 4561} {"train_loss": -26.539743423461914, "global_step": 378642, "epoch": 4561} {"train_loss": -26.849451065063477, "global_step": 378643, "epoch": 4561} {"train_loss": -26.463361740112305, "global_step": 378644, "epoch": 4561} {"train_loss": -26.1805557572698, "global_step": 378645, "epoch": 4561, "val_loss": 6578644.0} {"train_loss": -26.406936645507812, "global_step": 378646, "epoch": 4562} {"train_loss": -25.966339111328125, "global_step": 378647, "epoch": 4562} {"train_loss": -26.0189208984375, "global_step": 378648, "epoch": 4562} {"train_loss": -25.699905395507812, "global_step": 378649, "epoch": 4562} {"train_loss": -25.154422760009766, "global_step": 378650, "epoch": 4562} {"train_loss": -25.93695640563965, "global_step": 378651, "epoch": 4562} {"train_loss": -25.884790420532227, "global_step": 378652, "epoch": 4562} {"train_loss": -25.72259521484375, "global_step": 378653, "epoch": 4562} {"train_loss": -26.218286514282227, "global_step": 378654, "epoch": 4562} {"train_loss": -25.82791519165039, "global_step": 378655, "epoch": 4562} {"train_loss": -25.31840705871582, "global_step": 378656, "epoch": 4562} {"train_loss": -25.908212661743164, "global_step": 378657, "epoch": 4562} {"train_loss": -26.187030792236328, "global_step": 378658, "epoch": 4562} {"train_loss": -25.805593490600586, "global_step": 378659, "epoch": 4562} {"train_loss": -25.935644149780273, "global_step": 378660, "epoch": 4562} {"train_loss": -26.095121383666992, "global_step": 378661, "epoch": 4562} {"train_loss": -26.246564865112305, "global_step": 378662, "epoch": 4562} {"train_loss": -26.2099609375, "global_step": 378663, "epoch": 4562} {"train_loss": -26.103757858276367, "global_step": 378664, "epoch": 4562} {"train_loss": -26.145566940307617, "global_step": 378665, "epoch": 4562} {"train_loss": -26.363061904907227, "global_step": 378666, "epoch": 4562} {"train_loss": -26.18802261352539, "global_step": 378667, "epoch": 4562} {"train_loss": -26.06464958190918, "global_step": 378668, "epoch": 4562} {"train_loss": -25.915821075439453, "global_step": 378669, "epoch": 4562} {"train_loss": -26.14011001586914, "global_step": 378670, "epoch": 4562} {"train_loss": -26.15411949157715, "global_step": 378671, "epoch": 4562} {"train_loss": -26.247547149658203, "global_step": 378672, "epoch": 4562} {"train_loss": -26.048864364624023, "global_step": 378673, "epoch": 4562} {"train_loss": -26.20073890686035, "global_step": 378674, "epoch": 4562} {"train_loss": -25.864471435546875, "global_step": 378675, "epoch": 4562} {"train_loss": -26.374555587768555, "global_step": 378676, "epoch": 4562} {"train_loss": -26.198572158813477, "global_step": 378677, "epoch": 4562} {"train_loss": -26.034448623657227, "global_step": 378678, "epoch": 4562} {"train_loss": -26.514129638671875, "global_step": 378679, "epoch": 4562} {"train_loss": -26.013397216796875, "global_step": 378680, "epoch": 4562} {"train_loss": -26.502817153930664, "global_step": 378681, "epoch": 4562} {"train_loss": -26.323057174682617, "global_step": 378682, "epoch": 4562} {"train_loss": -26.65748405456543, "global_step": 378683, "epoch": 4562} {"train_loss": -26.443265914916992, "global_step": 378684, "epoch": 4562} {"train_loss": -26.619293212890625, "global_step": 378685, "epoch": 4562} {"train_loss": -26.2038516998291, "global_step": 378686, "epoch": 4562} {"train_loss": -26.22494888305664, "global_step": 378687, "epoch": 4562} {"train_loss": -26.340620040893555, "global_step": 378688, "epoch": 4562} {"train_loss": -26.26746940612793, "global_step": 378689, "epoch": 4562} {"train_loss": -26.382699966430664, "global_step": 378690, "epoch": 4562} {"train_loss": -26.37601089477539, "global_step": 378691, "epoch": 4562} {"train_loss": -26.347198486328125, "global_step": 378692, "epoch": 4562} {"train_loss": -26.408069610595703, "global_step": 378693, "epoch": 4562} {"train_loss": -26.397689819335938, "global_step": 378694, "epoch": 4562} {"train_loss": -26.63762855529785, "global_step": 378695, "epoch": 4562} {"train_loss": -26.5383358001709, "global_step": 378696, "epoch": 4562} {"train_loss": -26.230966567993164, "global_step": 378697, "epoch": 4562} {"train_loss": -26.54669761657715, "global_step": 378698, "epoch": 4562} {"train_loss": -26.336822509765625, "global_step": 378699, "epoch": 4562} {"train_loss": -27.042938232421875, "global_step": 378700, "epoch": 4562} {"train_loss": -26.3016414642334, "global_step": 378701, "epoch": 4562} {"train_loss": -26.846094131469727, "global_step": 378702, "epoch": 4562} {"train_loss": -26.157840728759766, "global_step": 378703, "epoch": 4562} {"train_loss": -26.763031005859375, "global_step": 378704, "epoch": 4562} {"train_loss": -26.451486587524414, "global_step": 378705, "epoch": 4562} {"train_loss": -26.504186630249023, "global_step": 378706, "epoch": 4562} {"train_loss": -26.98626708984375, "global_step": 378707, "epoch": 4562} {"train_loss": -26.632144927978516, "global_step": 378708, "epoch": 4562} {"train_loss": -27.1075439453125, "global_step": 378709, "epoch": 4562} {"train_loss": -26.312902450561523, "global_step": 378710, "epoch": 4562} {"train_loss": -26.583728790283203, "global_step": 378711, "epoch": 4562} {"train_loss": -26.58698844909668, "global_step": 378712, "epoch": 4562} {"train_loss": -26.348203659057617, "global_step": 378713, "epoch": 4562} {"train_loss": -26.99739646911621, "global_step": 378714, "epoch": 4562} {"train_loss": -26.36482810974121, "global_step": 378715, "epoch": 4562} {"train_loss": -26.50900650024414, "global_step": 378716, "epoch": 4562} {"train_loss": -26.41414451599121, "global_step": 378717, "epoch": 4562} {"train_loss": -26.56196403503418, "global_step": 378718, "epoch": 4562} {"train_loss": -26.326902389526367, "global_step": 378719, "epoch": 4562} {"train_loss": -26.29555320739746, "global_step": 378720, "epoch": 4562} {"train_loss": -26.4801025390625, "global_step": 378721, "epoch": 4562} {"train_loss": -26.20265769958496, "global_step": 378722, "epoch": 4562} {"train_loss": -25.701812744140625, "global_step": 378723, "epoch": 4562} {"train_loss": -26.674108505249023, "global_step": 378724, "epoch": 4562} {"train_loss": -26.413639068603516, "global_step": 378725, "epoch": 4562} {"train_loss": -26.469345092773438, "global_step": 378726, "epoch": 4562} {"train_loss": -26.191015243530273, "global_step": 378727, "epoch": 4562} {"train_loss": -26.288313141788343, "global_step": 378728, "epoch": 4562, "val_loss": 6527767.0} {"train_loss": -24.76227378845215, "global_step": 378729, "epoch": 4563} {"train_loss": -25.524696350097656, "global_step": 378730, "epoch": 4563} {"train_loss": -25.176177978515625, "global_step": 378731, "epoch": 4563} {"train_loss": -25.487646102905273, "global_step": 378732, "epoch": 4563} {"train_loss": -24.867109298706055, "global_step": 378733, "epoch": 4563} {"train_loss": -24.92609405517578, "global_step": 378734, "epoch": 4563} {"train_loss": -25.22151756286621, "global_step": 378735, "epoch": 4563} {"train_loss": -25.467079162597656, "global_step": 378736, "epoch": 4563} {"train_loss": -25.730640411376953, "global_step": 378737, "epoch": 4563} {"train_loss": -25.708532333374023, "global_step": 378738, "epoch": 4563} {"train_loss": -25.631826400756836, "global_step": 378739, "epoch": 4563} {"train_loss": -25.88118553161621, "global_step": 378740, "epoch": 4563} {"train_loss": -25.753936767578125, "global_step": 378741, "epoch": 4563} {"train_loss": -25.903676986694336, "global_step": 378742, "epoch": 4563} {"train_loss": -26.105316162109375, "global_step": 378743, "epoch": 4563} {"train_loss": -26.041257858276367, "global_step": 378744, "epoch": 4563} {"train_loss": -25.751977920532227, "global_step": 378745, "epoch": 4563} {"train_loss": -26.049835205078125, "global_step": 378746, "epoch": 4563} {"train_loss": -26.277027130126953, "global_step": 378747, "epoch": 4563} {"train_loss": -25.807897567749023, "global_step": 378748, "epoch": 4563} {"train_loss": -26.041339874267578, "global_step": 378749, "epoch": 4563} {"train_loss": -26.193944931030273, "global_step": 378750, "epoch": 4563} {"train_loss": -26.387775421142578, "global_step": 378751, "epoch": 4563} {"train_loss": -26.2891845703125, "global_step": 378752, "epoch": 4563} {"train_loss": -26.486495971679688, "global_step": 378753, "epoch": 4563} {"train_loss": -26.255929946899414, "global_step": 378754, "epoch": 4563} {"train_loss": -26.293920516967773, "global_step": 378755, "epoch": 4563} {"train_loss": -26.13263511657715, "global_step": 378756, "epoch": 4563} {"train_loss": -26.388324737548828, "global_step": 378757, "epoch": 4563} {"train_loss": -26.344940185546875, "global_step": 378758, "epoch": 4563} {"train_loss": -26.01581382751465, "global_step": 378759, "epoch": 4563} {"train_loss": -26.518781661987305, "global_step": 378760, "epoch": 4563} {"train_loss": -26.39374351501465, "global_step": 378761, "epoch": 4563} {"train_loss": -26.267805099487305, "global_step": 378762, "epoch": 4563} {"train_loss": -26.673612594604492, "global_step": 378763, "epoch": 4563} {"train_loss": -26.3229923248291, "global_step": 378764, "epoch": 4563} {"train_loss": -26.6560115814209, "global_step": 378765, "epoch": 4563} {"train_loss": -26.469675064086914, "global_step": 378766, "epoch": 4563} {"train_loss": -26.287134170532227, "global_step": 378767, "epoch": 4563} {"train_loss": -26.428791046142578, "global_step": 378768, "epoch": 4563} {"train_loss": -26.75933265686035, "global_step": 378769, "epoch": 4563} {"train_loss": -26.441669464111328, "global_step": 378770, "epoch": 4563} {"train_loss": -26.62062644958496, "global_step": 378771, "epoch": 4563} {"train_loss": -26.652759552001953, "global_step": 378772, "epoch": 4563} {"train_loss": -26.86861228942871, "global_step": 378773, "epoch": 4563} {"train_loss": -26.37422752380371, "global_step": 378774, "epoch": 4563} {"train_loss": -26.52235221862793, "global_step": 378775, "epoch": 4563} {"train_loss": -26.616352081298828, "global_step": 378776, "epoch": 4563} {"train_loss": -26.622289657592773, "global_step": 378777, "epoch": 4563} {"train_loss": -26.319543838500977, "global_step": 378778, "epoch": 4563} {"train_loss": -26.4200439453125, "global_step": 378779, "epoch": 4563} {"train_loss": -26.0312442779541, "global_step": 378780, "epoch": 4563} {"train_loss": -26.219141006469727, "global_step": 378781, "epoch": 4563} {"train_loss": -26.155506134033203, "global_step": 378782, "epoch": 4563} {"train_loss": -26.40749168395996, "global_step": 378783, "epoch": 4563} {"train_loss": -26.233381271362305, "global_step": 378784, "epoch": 4563} {"train_loss": -26.557727813720703, "global_step": 378785, "epoch": 4563} {"train_loss": -26.326282501220703, "global_step": 378786, "epoch": 4563} {"train_loss": -26.705747604370117, "global_step": 378787, "epoch": 4563} {"train_loss": -26.255796432495117, "global_step": 378788, "epoch": 4563} {"train_loss": -26.49000358581543, "global_step": 378789, "epoch": 4563} {"train_loss": -26.246667861938477, "global_step": 378790, "epoch": 4563} {"train_loss": -26.75397300720215, "global_step": 378791, "epoch": 4563} {"train_loss": -27.004587173461914, "global_step": 378792, "epoch": 4563} {"train_loss": -26.50979995727539, "global_step": 378793, "epoch": 4563} {"train_loss": -26.319055557250977, "global_step": 378794, "epoch": 4563} {"train_loss": -26.662939071655273, "global_step": 378795, "epoch": 4563} {"train_loss": -26.442495346069336, "global_step": 378796, "epoch": 4563} {"train_loss": -26.451507568359375, "global_step": 378797, "epoch": 4563} {"train_loss": -26.501569747924805, "global_step": 378798, "epoch": 4563} {"train_loss": -26.4591064453125, "global_step": 378799, "epoch": 4563} {"train_loss": -26.071313858032227, "global_step": 378800, "epoch": 4563} {"train_loss": -26.237714767456055, "global_step": 378801, "epoch": 4563} {"train_loss": -26.409839630126953, "global_step": 378802, "epoch": 4563} {"train_loss": -26.21632194519043, "global_step": 378803, "epoch": 4563} {"train_loss": -26.238866806030273, "global_step": 378804, "epoch": 4563} {"train_loss": -26.621686935424805, "global_step": 378805, "epoch": 4563} {"train_loss": -26.30548095703125, "global_step": 378806, "epoch": 4563} {"train_loss": -26.21125602722168, "global_step": 378807, "epoch": 4563} {"train_loss": -26.98853874206543, "global_step": 378808, "epoch": 4563} {"train_loss": -26.842151641845703, "global_step": 378809, "epoch": 4563} {"train_loss": -26.884449005126953, "global_step": 378810, "epoch": 4563} {"train_loss": -26.229949721370836, "global_step": 378811, "epoch": 4563, "val_loss": 6552882.0} {"train_loss": -24.79477882385254, "global_step": 378812, "epoch": 4564} {"train_loss": -24.076833724975586, "global_step": 378813, "epoch": 4564} {"train_loss": -24.671520233154297, "global_step": 378814, "epoch": 4564} {"train_loss": -25.305038452148438, "global_step": 378815, "epoch": 4564} {"train_loss": -24.367780685424805, "global_step": 378816, "epoch": 4564} {"train_loss": -25.920530319213867, "global_step": 378817, "epoch": 4564} {"train_loss": -25.193479537963867, "global_step": 378818, "epoch": 4564} {"train_loss": -25.488508224487305, "global_step": 378819, "epoch": 4564} {"train_loss": -25.8112735748291, "global_step": 378820, "epoch": 4564} {"train_loss": -25.56449317932129, "global_step": 378821, "epoch": 4564} {"train_loss": -25.93289566040039, "global_step": 378822, "epoch": 4564} {"train_loss": -25.73014259338379, "global_step": 378823, "epoch": 4564} {"train_loss": -26.004291534423828, "global_step": 378824, "epoch": 4564} {"train_loss": -25.741989135742188, "global_step": 378825, "epoch": 4564} {"train_loss": -25.730615615844727, "global_step": 378826, "epoch": 4564} {"train_loss": -25.748804092407227, "global_step": 378827, "epoch": 4564} {"train_loss": -25.74300193786621, "global_step": 378828, "epoch": 4564} {"train_loss": -25.842077255249023, "global_step": 378829, "epoch": 4564} {"train_loss": -26.029525756835938, "global_step": 378830, "epoch": 4564} {"train_loss": -26.15815544128418, "global_step": 378831, "epoch": 4564} {"train_loss": -26.049829483032227, "global_step": 378832, "epoch": 4564} {"train_loss": -26.14771842956543, "global_step": 378833, "epoch": 4564} {"train_loss": -25.612167358398438, "global_step": 378834, "epoch": 4564} {"train_loss": -25.767200469970703, "global_step": 378835, "epoch": 4564} {"train_loss": -26.013431549072266, "global_step": 378836, "epoch": 4564} {"train_loss": -26.352035522460938, "global_step": 378837, "epoch": 4564} {"train_loss": -25.97040367126465, "global_step": 378838, "epoch": 4564} {"train_loss": -26.358814239501953, "global_step": 378839, "epoch": 4564} {"train_loss": -25.790212631225586, "global_step": 378840, "epoch": 4564} {"train_loss": -26.362878799438477, "global_step": 378841, "epoch": 4564} {"train_loss": -26.425769805908203, "global_step": 378842, "epoch": 4564} {"train_loss": -26.278461456298828, "global_step": 378843, "epoch": 4564} {"train_loss": -26.267541885375977, "global_step": 378844, "epoch": 4564} {"train_loss": -26.980249404907227, "global_step": 378845, "epoch": 4564} {"train_loss": -26.8443546295166, "global_step": 378846, "epoch": 4564} {"train_loss": -26.467300415039062, "global_step": 378847, "epoch": 4564} {"train_loss": -26.518842697143555, "global_step": 378848, "epoch": 4564} {"train_loss": -26.175968170166016, "global_step": 378849, "epoch": 4564} {"train_loss": -26.53924560546875, "global_step": 378850, "epoch": 4564} {"train_loss": -26.28887939453125, "global_step": 378851, "epoch": 4564} {"train_loss": -26.42299461364746, "global_step": 378852, "epoch": 4564} {"train_loss": -26.45444107055664, "global_step": 378853, "epoch": 4564} {"train_loss": -26.72286033630371, "global_step": 378854, "epoch": 4564} {"train_loss": -26.7509822845459, "global_step": 378855, "epoch": 4564} {"train_loss": -26.393102645874023, "global_step": 378856, "epoch": 4564} {"train_loss": -26.439990997314453, "global_step": 378857, "epoch": 4564} {"train_loss": -26.343358993530273, "global_step": 378858, "epoch": 4564} {"train_loss": -26.29231071472168, "global_step": 378859, "epoch": 4564} {"train_loss": -26.45916748046875, "global_step": 378860, "epoch": 4564} {"train_loss": -26.62845802307129, "global_step": 378861, "epoch": 4564} {"train_loss": -26.476200103759766, "global_step": 378862, "epoch": 4564} {"train_loss": -26.457242965698242, "global_step": 378863, "epoch": 4564} {"train_loss": -26.241514205932617, "global_step": 378864, "epoch": 4564} {"train_loss": -26.836145401000977, "global_step": 378865, "epoch": 4564} {"train_loss": -26.6827335357666, "global_step": 378866, "epoch": 4564} {"train_loss": -26.62726402282715, "global_step": 378867, "epoch": 4564} {"train_loss": -26.516199111938477, "global_step": 378868, "epoch": 4564} {"train_loss": -26.664403915405273, "global_step": 378869, "epoch": 4564} {"train_loss": -26.5664119720459, "global_step": 378870, "epoch": 4564} {"train_loss": -26.315969467163086, "global_step": 378871, "epoch": 4564} {"train_loss": -26.32111167907715, "global_step": 378872, "epoch": 4564} {"train_loss": -26.255203247070312, "global_step": 378873, "epoch": 4564} {"train_loss": -26.49072265625, "global_step": 378874, "epoch": 4564} {"train_loss": -26.59108543395996, "global_step": 378875, "epoch": 4564} {"train_loss": -26.46872329711914, "global_step": 378876, "epoch": 4564} {"train_loss": -26.6429443359375, "global_step": 378877, "epoch": 4564} {"train_loss": -26.686126708984375, "global_step": 378878, "epoch": 4564} {"train_loss": -26.619897842407227, "global_step": 378879, "epoch": 4564} {"train_loss": -26.485366821289062, "global_step": 378880, "epoch": 4564} {"train_loss": -26.581018447875977, "global_step": 378881, "epoch": 4564} {"train_loss": -26.85272789001465, "global_step": 378882, "epoch": 4564} {"train_loss": -26.57891273498535, "global_step": 378883, "epoch": 4564} {"train_loss": -26.759918212890625, "global_step": 378884, "epoch": 4564} {"train_loss": -26.732572555541992, "global_step": 378885, "epoch": 4564} {"train_loss": -26.752948760986328, "global_step": 378886, "epoch": 4564} {"train_loss": -26.551471710205078, "global_step": 378887, "epoch": 4564} {"train_loss": -26.465591430664062, "global_step": 378888, "epoch": 4564} {"train_loss": -26.33401870727539, "global_step": 378889, "epoch": 4564} {"train_loss": -26.560321807861328, "global_step": 378890, "epoch": 4564} {"train_loss": -26.60636329650879, "global_step": 378891, "epoch": 4564} {"train_loss": -26.582763671875, "global_step": 378892, "epoch": 4564} {"train_loss": -26.45556640625, "global_step": 378893, "epoch": 4564} {"train_loss": -26.215313831007624, "global_step": 378894, "epoch": 4564, "val_loss": 6636497.0} {"train_loss": -25.206411361694336, "global_step": 378895, "epoch": 4565} {"train_loss": -25.510465621948242, "global_step": 378896, "epoch": 4565} {"train_loss": -26.10902214050293, "global_step": 378897, "epoch": 4565} {"train_loss": -26.108701705932617, "global_step": 378898, "epoch": 4565} {"train_loss": -26.00958251953125, "global_step": 378899, "epoch": 4565} {"train_loss": -26.729406356811523, "global_step": 378900, "epoch": 4565} {"train_loss": -25.923675537109375, "global_step": 378901, "epoch": 4565} {"train_loss": -26.28045082092285, "global_step": 378902, "epoch": 4565} {"train_loss": -25.92445945739746, "global_step": 378903, "epoch": 4565} {"train_loss": -26.167346954345703, "global_step": 378904, "epoch": 4565} {"train_loss": -25.823169708251953, "global_step": 378905, "epoch": 4565} {"train_loss": -26.054447174072266, "global_step": 378906, "epoch": 4565} {"train_loss": -25.611730575561523, "global_step": 378907, "epoch": 4565} {"train_loss": -26.571273803710938, "global_step": 378908, "epoch": 4565} {"train_loss": -25.7916202545166, "global_step": 378909, "epoch": 4565} {"train_loss": -26.31492042541504, "global_step": 378910, "epoch": 4565} {"train_loss": -26.14078140258789, "global_step": 378911, "epoch": 4565} {"train_loss": -26.114736557006836, "global_step": 378912, "epoch": 4565} {"train_loss": -25.810110092163086, "global_step": 378913, "epoch": 4565} {"train_loss": -26.22852897644043, "global_step": 378914, "epoch": 4565} {"train_loss": -26.363733291625977, "global_step": 378915, "epoch": 4565} {"train_loss": -26.112812042236328, "global_step": 378916, "epoch": 4565} {"train_loss": -26.503589630126953, "global_step": 378917, "epoch": 4565} {"train_loss": -26.589435577392578, "global_step": 378918, "epoch": 4565} {"train_loss": -26.408111572265625, "global_step": 378919, "epoch": 4565} {"train_loss": -26.437829971313477, "global_step": 378920, "epoch": 4565} {"train_loss": -26.301015853881836, "global_step": 378921, "epoch": 4565} {"train_loss": -26.508481979370117, "global_step": 378922, "epoch": 4565} {"train_loss": -26.742685317993164, "global_step": 378923, "epoch": 4565} {"train_loss": -26.48697853088379, "global_step": 378924, "epoch": 4565} {"train_loss": -26.304319381713867, "global_step": 378925, "epoch": 4565} {"train_loss": -26.440689086914062, "global_step": 378926, "epoch": 4565} {"train_loss": -26.209115982055664, "global_step": 378927, "epoch": 4565} {"train_loss": -26.57343101501465, "global_step": 378928, "epoch": 4565} {"train_loss": -26.61675453186035, "global_step": 378929, "epoch": 4565} {"train_loss": -26.665868759155273, "global_step": 378930, "epoch": 4565} {"train_loss": -26.502185821533203, "global_step": 378931, "epoch": 4565} {"train_loss": -26.2917537689209, "global_step": 378932, "epoch": 4565} {"train_loss": -26.8494815826416, "global_step": 378933, "epoch": 4565} {"train_loss": -26.664236068725586, "global_step": 378934, "epoch": 4565} {"train_loss": -26.683307647705078, "global_step": 378935, "epoch": 4565} {"train_loss": -26.18168067932129, "global_step": 378936, "epoch": 4565} {"train_loss": -26.687686920166016, "global_step": 378937, "epoch": 4565} {"train_loss": -26.34163475036621, "global_step": 378938, "epoch": 4565} {"train_loss": -26.383655548095703, "global_step": 378939, "epoch": 4565} {"train_loss": -26.437238693237305, "global_step": 378940, "epoch": 4565} {"train_loss": -26.6152286529541, "global_step": 378941, "epoch": 4565} {"train_loss": -26.353300094604492, "global_step": 378942, "epoch": 4565} {"train_loss": -26.651123046875, "global_step": 378943, "epoch": 4565} {"train_loss": -26.44246482849121, "global_step": 378944, "epoch": 4565} {"train_loss": -26.53411865234375, "global_step": 378945, "epoch": 4565} {"train_loss": -26.761449813842773, "global_step": 378946, "epoch": 4565} {"train_loss": -26.4989070892334, "global_step": 378947, "epoch": 4565} {"train_loss": -26.823434829711914, "global_step": 378948, "epoch": 4565} {"train_loss": -26.305383682250977, "global_step": 378949, "epoch": 4565} {"train_loss": -26.373828887939453, "global_step": 378950, "epoch": 4565} {"train_loss": -26.520959854125977, "global_step": 378951, "epoch": 4565} {"train_loss": -26.350605010986328, "global_step": 378952, "epoch": 4565} {"train_loss": -26.796239852905273, "global_step": 378953, "epoch": 4565} {"train_loss": -26.345136642456055, "global_step": 378954, "epoch": 4565} {"train_loss": -26.4085750579834, "global_step": 378955, "epoch": 4565} {"train_loss": -26.58906364440918, "global_step": 378956, "epoch": 4565} {"train_loss": -26.55933952331543, "global_step": 378957, "epoch": 4565} {"train_loss": -26.65097427368164, "global_step": 378958, "epoch": 4565} {"train_loss": -26.20355796813965, "global_step": 378959, "epoch": 4565} {"train_loss": -26.85140037536621, "global_step": 378960, "epoch": 4565} {"train_loss": -26.220722198486328, "global_step": 378961, "epoch": 4565} {"train_loss": -26.740549087524414, "global_step": 378962, "epoch": 4565} {"train_loss": -26.29617691040039, "global_step": 378963, "epoch": 4565} {"train_loss": -26.288740158081055, "global_step": 378964, "epoch": 4565} {"train_loss": -26.289154052734375, "global_step": 378965, "epoch": 4565} {"train_loss": -26.635282516479492, "global_step": 378966, "epoch": 4565} {"train_loss": -26.962493896484375, "global_step": 378967, "epoch": 4565} {"train_loss": -26.797454833984375, "global_step": 378968, "epoch": 4565} {"train_loss": -26.590927124023438, "global_step": 378969, "epoch": 4565} {"train_loss": -26.741077423095703, "global_step": 378970, "epoch": 4565} {"train_loss": -26.220966339111328, "global_step": 378971, "epoch": 4565} {"train_loss": -26.295246124267578, "global_step": 378972, "epoch": 4565} {"train_loss": -26.35248374938965, "global_step": 378973, "epoch": 4565} {"train_loss": -26.723041534423828, "global_step": 378974, "epoch": 4565} {"train_loss": -26.68183708190918, "global_step": 378975, "epoch": 4565} {"train_loss": -26.36810302734375, "global_step": 378976, "epoch": 4565} {"train_loss": -26.386991018272308, "global_step": 378977, "epoch": 4565, "val_loss": 6542453.0} {"train_loss": -25.723981857299805, "global_step": 378978, "epoch": 4566} {"train_loss": -25.169424057006836, "global_step": 378979, "epoch": 4566} {"train_loss": -25.905364990234375, "global_step": 378980, "epoch": 4566} {"train_loss": -25.409576416015625, "global_step": 378981, "epoch": 4566} {"train_loss": -25.10737419128418, "global_step": 378982, "epoch": 4566} {"train_loss": -24.891115188598633, "global_step": 378983, "epoch": 4566} {"train_loss": -25.094812393188477, "global_step": 378984, "epoch": 4566} {"train_loss": -25.317646026611328, "global_step": 378985, "epoch": 4566} {"train_loss": -25.383045196533203, "global_step": 378986, "epoch": 4566} {"train_loss": -25.14054298400879, "global_step": 378987, "epoch": 4566} {"train_loss": -25.42413902282715, "global_step": 378988, "epoch": 4566} {"train_loss": -25.591176986694336, "global_step": 378989, "epoch": 4566} {"train_loss": -25.89642333984375, "global_step": 378990, "epoch": 4566} {"train_loss": -25.76655387878418, "global_step": 378991, "epoch": 4566} {"train_loss": -25.892324447631836, "global_step": 378992, "epoch": 4566} {"train_loss": -26.17827796936035, "global_step": 378993, "epoch": 4566} {"train_loss": -25.668838500976562, "global_step": 378994, "epoch": 4566} {"train_loss": -26.16008949279785, "global_step": 378995, "epoch": 4566} {"train_loss": -26.160612106323242, "global_step": 378996, "epoch": 4566} {"train_loss": -26.048969268798828, "global_step": 378997, "epoch": 4566} {"train_loss": -26.059850692749023, "global_step": 378998, "epoch": 4566} {"train_loss": -26.475072860717773, "global_step": 378999, "epoch": 4566} {"train_loss": -26.06690788269043, "global_step": 379000, "epoch": 4566} {"train_loss": -26.429779052734375, "global_step": 379001, "epoch": 4566} {"train_loss": -26.1668701171875, "global_step": 379002, "epoch": 4566} {"train_loss": -26.231830596923828, "global_step": 379003, "epoch": 4566} {"train_loss": -26.216337203979492, "global_step": 379004, "epoch": 4566} {"train_loss": -26.10525894165039, "global_step": 379005, "epoch": 4566} {"train_loss": -25.966938018798828, "global_step": 379006, "epoch": 4566} {"train_loss": -26.533517837524414, "global_step": 379007, "epoch": 4566} {"train_loss": -26.31403160095215, "global_step": 379008, "epoch": 4566} {"train_loss": -26.144845962524414, "global_step": 379009, "epoch": 4566} {"train_loss": -26.686643600463867, "global_step": 379010, "epoch": 4566} {"train_loss": -26.813451766967773, "global_step": 379011, "epoch": 4566} {"train_loss": -26.186105728149414, "global_step": 379012, "epoch": 4566} {"train_loss": -26.36380386352539, "global_step": 379013, "epoch": 4566} {"train_loss": -26.324106216430664, "global_step": 379014, "epoch": 4566} {"train_loss": -26.608488082885742, "global_step": 379015, "epoch": 4566} {"train_loss": -26.55634117126465, "global_step": 379016, "epoch": 4566} {"train_loss": -26.479705810546875, "global_step": 379017, "epoch": 4566} {"train_loss": -26.6453857421875, "global_step": 379018, "epoch": 4566} {"train_loss": -26.8192195892334, "global_step": 379019, "epoch": 4566} {"train_loss": -26.788410186767578, "global_step": 379020, "epoch": 4566} {"train_loss": -26.44858741760254, "global_step": 379021, "epoch": 4566} {"train_loss": -26.5729923248291, "global_step": 379022, "epoch": 4566} {"train_loss": -26.8082275390625, "global_step": 379023, "epoch": 4566} {"train_loss": -26.520410537719727, "global_step": 379024, "epoch": 4566} {"train_loss": -26.404035568237305, "global_step": 379025, "epoch": 4566} {"train_loss": -26.385305404663086, "global_step": 379026, "epoch": 4566} {"train_loss": -26.41643714904785, "global_step": 379027, "epoch": 4566} {"train_loss": -26.5388240814209, "global_step": 379028, "epoch": 4566} {"train_loss": -26.58237075805664, "global_step": 379029, "epoch": 4566} {"train_loss": -26.623981475830078, "global_step": 379030, "epoch": 4566} {"train_loss": -26.45553970336914, "global_step": 379031, "epoch": 4566} {"train_loss": -26.60413932800293, "global_step": 379032, "epoch": 4566} {"train_loss": -26.804845809936523, "global_step": 379033, "epoch": 4566} {"train_loss": -26.43780517578125, "global_step": 379034, "epoch": 4566} {"train_loss": -26.4405460357666, "global_step": 379035, "epoch": 4566} {"train_loss": -26.2503719329834, "global_step": 379036, "epoch": 4566} {"train_loss": -25.703556060791016, "global_step": 379037, "epoch": 4566} {"train_loss": -26.2755126953125, "global_step": 379038, "epoch": 4566} {"train_loss": -26.106021881103516, "global_step": 379039, "epoch": 4566} {"train_loss": -26.269123077392578, "global_step": 379040, "epoch": 4566} {"train_loss": -26.166040420532227, "global_step": 379041, "epoch": 4566} {"train_loss": -26.3608341217041, "global_step": 379042, "epoch": 4566} {"train_loss": -26.49859046936035, "global_step": 379043, "epoch": 4566} {"train_loss": -26.6690731048584, "global_step": 379044, "epoch": 4566} {"train_loss": -26.295454025268555, "global_step": 379045, "epoch": 4566} {"train_loss": -25.693912506103516, "global_step": 379046, "epoch": 4566} {"train_loss": -25.96587562561035, "global_step": 379047, "epoch": 4566} {"train_loss": -26.42341423034668, "global_step": 379048, "epoch": 4566} {"train_loss": -26.49114418029785, "global_step": 379049, "epoch": 4566} {"train_loss": -26.258502960205078, "global_step": 379050, "epoch": 4566} {"train_loss": -25.933460235595703, "global_step": 379051, "epoch": 4566} {"train_loss": -26.39731216430664, "global_step": 379052, "epoch": 4566} {"train_loss": -26.307086944580078, "global_step": 379053, "epoch": 4566} {"train_loss": -25.965360641479492, "global_step": 379054, "epoch": 4566} {"train_loss": -26.249902725219727, "global_step": 379055, "epoch": 4566} {"train_loss": -26.22568702697754, "global_step": 379056, "epoch": 4566} {"train_loss": -26.112218856811523, "global_step": 379057, "epoch": 4566} {"train_loss": -26.255136489868164, "global_step": 379058, "epoch": 4566} {"train_loss": -26.427875518798828, "global_step": 379059, "epoch": 4566} {"train_loss": -26.175352487219385, "global_step": 379060, "epoch": 4566, "val_loss": 6652571.0} {"train_loss": -26.0958309173584, "global_step": 379061, "epoch": 4567} {"train_loss": -26.482421875, "global_step": 379062, "epoch": 4567} {"train_loss": -26.153162002563477, "global_step": 379063, "epoch": 4567} {"train_loss": -26.227588653564453, "global_step": 379064, "epoch": 4567} {"train_loss": -26.529767990112305, "global_step": 379065, "epoch": 4567} {"train_loss": -26.132434844970703, "global_step": 379066, "epoch": 4567} {"train_loss": -26.11481285095215, "global_step": 379067, "epoch": 4567} {"train_loss": -25.878503799438477, "global_step": 379068, "epoch": 4567} {"train_loss": -26.587753295898438, "global_step": 379069, "epoch": 4567} {"train_loss": -26.17449951171875, "global_step": 379070, "epoch": 4567} {"train_loss": -25.8360538482666, "global_step": 379071, "epoch": 4567} {"train_loss": -25.81256103515625, "global_step": 379072, "epoch": 4567} {"train_loss": -26.375015258789062, "global_step": 379073, "epoch": 4567} {"train_loss": -26.0827579498291, "global_step": 379074, "epoch": 4567} {"train_loss": -26.20047950744629, "global_step": 379075, "epoch": 4567} {"train_loss": -26.353235244750977, "global_step": 379076, "epoch": 4567} {"train_loss": -26.465423583984375, "global_step": 379077, "epoch": 4567} {"train_loss": -26.167312622070312, "global_step": 379078, "epoch": 4567} {"train_loss": -26.322986602783203, "global_step": 379079, "epoch": 4567} {"train_loss": -26.28193473815918, "global_step": 379080, "epoch": 4567} {"train_loss": -26.3586483001709, "global_step": 379081, "epoch": 4567} {"train_loss": -25.77508544921875, "global_step": 379082, "epoch": 4567} {"train_loss": -26.601301193237305, "global_step": 379083, "epoch": 4567} {"train_loss": -26.586896896362305, "global_step": 379084, "epoch": 4567} {"train_loss": -26.17251968383789, "global_step": 379085, "epoch": 4567} {"train_loss": -26.080341339111328, "global_step": 379086, "epoch": 4567} {"train_loss": -26.322528839111328, "global_step": 379087, "epoch": 4567} {"train_loss": -26.2018985748291, "global_step": 379088, "epoch": 4567} {"train_loss": -26.26698112487793, "global_step": 379089, "epoch": 4567} {"train_loss": -26.169172286987305, "global_step": 379090, "epoch": 4567} {"train_loss": -26.52056884765625, "global_step": 379091, "epoch": 4567} {"train_loss": -26.566980361938477, "global_step": 379092, "epoch": 4567} {"train_loss": -26.16316032409668, "global_step": 379093, "epoch": 4567} {"train_loss": -26.29547691345215, "global_step": 379094, "epoch": 4567} {"train_loss": -26.578662872314453, "global_step": 379095, "epoch": 4567} {"train_loss": -25.9642333984375, "global_step": 379096, "epoch": 4567} {"train_loss": -26.21451759338379, "global_step": 379097, "epoch": 4567} {"train_loss": -26.198637008666992, "global_step": 379098, "epoch": 4567} {"train_loss": -26.778217315673828, "global_step": 379099, "epoch": 4567} {"train_loss": -26.2889461517334, "global_step": 379100, "epoch": 4567} {"train_loss": -26.574872970581055, "global_step": 379101, "epoch": 4567} {"train_loss": -26.298681259155273, "global_step": 379102, "epoch": 4567} {"train_loss": -26.584197998046875, "global_step": 379103, "epoch": 4567} {"train_loss": -26.685068130493164, "global_step": 379104, "epoch": 4567} {"train_loss": -26.5754337310791, "global_step": 379105, "epoch": 4567} {"train_loss": -26.07442283630371, "global_step": 379106, "epoch": 4567} {"train_loss": -26.750471115112305, "global_step": 379107, "epoch": 4567} {"train_loss": -26.471250534057617, "global_step": 379108, "epoch": 4567} {"train_loss": -26.080419540405273, "global_step": 379109, "epoch": 4567} {"train_loss": -26.287967681884766, "global_step": 379110, "epoch": 4567} {"train_loss": -26.78216552734375, "global_step": 379111, "epoch": 4567} {"train_loss": -26.1503963470459, "global_step": 379112, "epoch": 4567} {"train_loss": -26.304950714111328, "global_step": 379113, "epoch": 4567} {"train_loss": -26.832965850830078, "global_step": 379114, "epoch": 4567} {"train_loss": -26.229185104370117, "global_step": 379115, "epoch": 4567} {"train_loss": -26.1845760345459, "global_step": 379116, "epoch": 4567} {"train_loss": -26.69866943359375, "global_step": 379117, "epoch": 4567} {"train_loss": -26.551481246948242, "global_step": 379118, "epoch": 4567} {"train_loss": -26.746856689453125, "global_step": 379119, "epoch": 4567} {"train_loss": -26.243101119995117, "global_step": 379120, "epoch": 4567} {"train_loss": -26.240985870361328, "global_step": 379121, "epoch": 4567} {"train_loss": -26.8597354888916, "global_step": 379122, "epoch": 4567} {"train_loss": -26.665729522705078, "global_step": 379123, "epoch": 4567} {"train_loss": -26.667530059814453, "global_step": 379124, "epoch": 4567} {"train_loss": -26.680145263671875, "global_step": 379125, "epoch": 4567} {"train_loss": -26.55048179626465, "global_step": 379126, "epoch": 4567} {"train_loss": -26.45814323425293, "global_step": 379127, "epoch": 4567} {"train_loss": -26.480207443237305, "global_step": 379128, "epoch": 4567} {"train_loss": -26.5484561920166, "global_step": 379129, "epoch": 4567} {"train_loss": -26.542011260986328, "global_step": 379130, "epoch": 4567} {"train_loss": -26.63210105895996, "global_step": 379131, "epoch": 4567} {"train_loss": -26.934728622436523, "global_step": 379132, "epoch": 4567} {"train_loss": -26.529150009155273, "global_step": 379133, "epoch": 4567} {"train_loss": -26.365203857421875, "global_step": 379134, "epoch": 4567} {"train_loss": -26.657522201538086, "global_step": 379135, "epoch": 4567} {"train_loss": -26.799951553344727, "global_step": 379136, "epoch": 4567} {"train_loss": -26.39511489868164, "global_step": 379137, "epoch": 4567} {"train_loss": -26.796680450439453, "global_step": 379138, "epoch": 4567} {"train_loss": -26.587177276611328, "global_step": 379139, "epoch": 4567} {"train_loss": -26.802326202392578, "global_step": 379140, "epoch": 4567} {"train_loss": -26.101184844970703, "global_step": 379141, "epoch": 4567} {"train_loss": -26.31171226501465, "global_step": 379142, "epoch": 4567} {"train_loss": -26.39531691677599, "global_step": 379143, "epoch": 4567, "val_loss": 6594713.0} {"train_loss": -25.779088973999023, "global_step": 379144, "epoch": 4568} {"train_loss": -24.714862823486328, "global_step": 379145, "epoch": 4568} {"train_loss": -24.90976333618164, "global_step": 379146, "epoch": 4568} {"train_loss": -25.583219528198242, "global_step": 379147, "epoch": 4568} {"train_loss": -25.81614112854004, "global_step": 379148, "epoch": 4568} {"train_loss": -24.939292907714844, "global_step": 379149, "epoch": 4568} {"train_loss": -25.46307373046875, "global_step": 379150, "epoch": 4568} {"train_loss": -25.757932662963867, "global_step": 379151, "epoch": 4568} {"train_loss": -25.76995849609375, "global_step": 379152, "epoch": 4568} {"train_loss": -26.024810791015625, "global_step": 379153, "epoch": 4568} {"train_loss": -26.181781768798828, "global_step": 379154, "epoch": 4568} {"train_loss": -26.333810806274414, "global_step": 379155, "epoch": 4568} {"train_loss": -26.02726173400879, "global_step": 379156, "epoch": 4568} {"train_loss": -25.687429428100586, "global_step": 379157, "epoch": 4568} {"train_loss": -25.852039337158203, "global_step": 379158, "epoch": 4568} {"train_loss": -26.088972091674805, "global_step": 379159, "epoch": 4568} {"train_loss": -26.207609176635742, "global_step": 379160, "epoch": 4568} {"train_loss": -26.082929611206055, "global_step": 379161, "epoch": 4568} {"train_loss": -25.975255966186523, "global_step": 379162, "epoch": 4568} {"train_loss": -26.0471134185791, "global_step": 379163, "epoch": 4568} {"train_loss": -26.181116104125977, "global_step": 379164, "epoch": 4568} {"train_loss": -26.29312515258789, "global_step": 379165, "epoch": 4568} {"train_loss": -26.195951461791992, "global_step": 379166, "epoch": 4568} {"train_loss": -26.251813888549805, "global_step": 379167, "epoch": 4568} {"train_loss": -26.444543838500977, "global_step": 379168, "epoch": 4568} {"train_loss": -26.308591842651367, "global_step": 379169, "epoch": 4568} {"train_loss": -26.3621768951416, "global_step": 379170, "epoch": 4568} {"train_loss": -26.53911781311035, "global_step": 379171, "epoch": 4568} {"train_loss": -26.533727645874023, "global_step": 379172, "epoch": 4568} {"train_loss": -26.348352432250977, "global_step": 379173, "epoch": 4568} {"train_loss": -26.639972686767578, "global_step": 379174, "epoch": 4568} {"train_loss": -26.30315589904785, "global_step": 379175, "epoch": 4568} {"train_loss": -26.620758056640625, "global_step": 379176, "epoch": 4568} {"train_loss": -26.41301918029785, "global_step": 379177, "epoch": 4568} {"train_loss": -26.503931045532227, "global_step": 379178, "epoch": 4568} {"train_loss": -26.45188331604004, "global_step": 379179, "epoch": 4568} {"train_loss": -26.4220027923584, "global_step": 379180, "epoch": 4568} {"train_loss": -26.282800674438477, "global_step": 379181, "epoch": 4568} {"train_loss": -26.305978775024414, "global_step": 379182, "epoch": 4568} {"train_loss": -26.1319580078125, "global_step": 379183, "epoch": 4568} {"train_loss": -26.358800888061523, "global_step": 379184, "epoch": 4568} {"train_loss": -26.854511260986328, "global_step": 379185, "epoch": 4568} {"train_loss": -26.41238784790039, "global_step": 379186, "epoch": 4568} {"train_loss": -26.590818405151367, "global_step": 379187, "epoch": 4568} {"train_loss": -26.32958984375, "global_step": 379188, "epoch": 4568} {"train_loss": -26.418310165405273, "global_step": 379189, "epoch": 4568} {"train_loss": -26.542871475219727, "global_step": 379190, "epoch": 4568} {"train_loss": -26.95045280456543, "global_step": 379191, "epoch": 4568} {"train_loss": -26.6612606048584, "global_step": 379192, "epoch": 4568} {"train_loss": -26.700468063354492, "global_step": 379193, "epoch": 4568} {"train_loss": -26.64491081237793, "global_step": 379194, "epoch": 4568} {"train_loss": -26.524084091186523, "global_step": 379195, "epoch": 4568} {"train_loss": -26.651166915893555, "global_step": 379196, "epoch": 4568} {"train_loss": -26.677488327026367, "global_step": 379197, "epoch": 4568} {"train_loss": -26.520673751831055, "global_step": 379198, "epoch": 4568} {"train_loss": -26.665241241455078, "global_step": 379199, "epoch": 4568} {"train_loss": -26.376331329345703, "global_step": 379200, "epoch": 4568} {"train_loss": -26.736042022705078, "global_step": 379201, "epoch": 4568} {"train_loss": -26.354339599609375, "global_step": 379202, "epoch": 4568} {"train_loss": -26.269372940063477, "global_step": 379203, "epoch": 4568} {"train_loss": -25.983142852783203, "global_step": 379204, "epoch": 4568} {"train_loss": -26.101255416870117, "global_step": 379205, "epoch": 4568} {"train_loss": -26.017820358276367, "global_step": 379206, "epoch": 4568} {"train_loss": -26.59881591796875, "global_step": 379207, "epoch": 4568} {"train_loss": -26.15668296813965, "global_step": 379208, "epoch": 4568} {"train_loss": -26.595258712768555, "global_step": 379209, "epoch": 4568} {"train_loss": -25.778121948242188, "global_step": 379210, "epoch": 4568} {"train_loss": -25.5336971282959, "global_step": 379211, "epoch": 4568} {"train_loss": -25.54087257385254, "global_step": 379212, "epoch": 4568} {"train_loss": -26.264490127563477, "global_step": 379213, "epoch": 4568} {"train_loss": -26.469236373901367, "global_step": 379214, "epoch": 4568} {"train_loss": -26.17888832092285, "global_step": 379215, "epoch": 4568} {"train_loss": -25.967914581298828, "global_step": 379216, "epoch": 4568} {"train_loss": -26.5925350189209, "global_step": 379217, "epoch": 4568} {"train_loss": -25.989643096923828, "global_step": 379218, "epoch": 4568} {"train_loss": -26.209890365600586, "global_step": 379219, "epoch": 4568} {"train_loss": -26.215112686157227, "global_step": 379220, "epoch": 4568} {"train_loss": -26.719085693359375, "global_step": 379221, "epoch": 4568} {"train_loss": -26.276493072509766, "global_step": 379222, "epoch": 4568} {"train_loss": -25.9954833984375, "global_step": 379223, "epoch": 4568} {"train_loss": -26.637451171875, "global_step": 379224, "epoch": 4568} {"train_loss": -26.66680335998535, "global_step": 379225, "epoch": 4568} {"train_loss": -26.225968050669476, "global_step": 379226, "epoch": 4568, "val_loss": 6634162.0} {"train_loss": -25.784255981445312, "global_step": 379227, "epoch": 4569} {"train_loss": -26.336206436157227, "global_step": 379228, "epoch": 4569} {"train_loss": -26.157541275024414, "global_step": 379229, "epoch": 4569} {"train_loss": -26.15460777282715, "global_step": 379230, "epoch": 4569} {"train_loss": -26.13140869140625, "global_step": 379231, "epoch": 4569} {"train_loss": -25.852313995361328, "global_step": 379232, "epoch": 4569} {"train_loss": -26.336166381835938, "global_step": 379233, "epoch": 4569} {"train_loss": -26.2778263092041, "global_step": 379234, "epoch": 4569} {"train_loss": -26.27198600769043, "global_step": 379235, "epoch": 4569} {"train_loss": -26.24700927734375, "global_step": 379236, "epoch": 4569} {"train_loss": -26.083362579345703, "global_step": 379237, "epoch": 4569} {"train_loss": -26.2913761138916, "global_step": 379238, "epoch": 4569} {"train_loss": -26.326435089111328, "global_step": 379239, "epoch": 4569} {"train_loss": -26.276443481445312, "global_step": 379240, "epoch": 4569} {"train_loss": -26.326446533203125, "global_step": 379241, "epoch": 4569} {"train_loss": -26.487279891967773, "global_step": 379242, "epoch": 4569} {"train_loss": -26.5004825592041, "global_step": 379243, "epoch": 4569} {"train_loss": -26.68158531188965, "global_step": 379244, "epoch": 4569} {"train_loss": -26.383283615112305, "global_step": 379245, "epoch": 4569} {"train_loss": -26.4075870513916, "global_step": 379246, "epoch": 4569} {"train_loss": -26.568098068237305, "global_step": 379247, "epoch": 4569} {"train_loss": -26.24057388305664, "global_step": 379248, "epoch": 4569} {"train_loss": -26.500452041625977, "global_step": 379249, "epoch": 4569} {"train_loss": -26.680871963500977, "global_step": 379250, "epoch": 4569} {"train_loss": -26.498804092407227, "global_step": 379251, "epoch": 4569} {"train_loss": -26.732385635375977, "global_step": 379252, "epoch": 4569} {"train_loss": -26.480255126953125, "global_step": 379253, "epoch": 4569} {"train_loss": -26.578466415405273, "global_step": 379254, "epoch": 4569} {"train_loss": -26.9599609375, "global_step": 379255, "epoch": 4569} {"train_loss": -26.776111602783203, "global_step": 379256, "epoch": 4569} {"train_loss": -26.749784469604492, "global_step": 379257, "epoch": 4569} {"train_loss": -26.715646743774414, "global_step": 379258, "epoch": 4569} {"train_loss": -26.517822265625, "global_step": 379259, "epoch": 4569} {"train_loss": -26.57608985900879, "global_step": 379260, "epoch": 4569} {"train_loss": -26.51630210876465, "global_step": 379261, "epoch": 4569} {"train_loss": -26.17888832092285, "global_step": 379262, "epoch": 4569} {"train_loss": -26.246906280517578, "global_step": 379263, "epoch": 4569} {"train_loss": -26.39157485961914, "global_step": 379264, "epoch": 4569} {"train_loss": -26.496667861938477, "global_step": 379265, "epoch": 4569} {"train_loss": -26.367847442626953, "global_step": 379266, "epoch": 4569} {"train_loss": -26.290510177612305, "global_step": 379267, "epoch": 4569} {"train_loss": -26.3385066986084, "global_step": 379268, "epoch": 4569} {"train_loss": -26.433164596557617, "global_step": 379269, "epoch": 4569} {"train_loss": -26.540943145751953, "global_step": 379270, "epoch": 4569} {"train_loss": -26.456058502197266, "global_step": 379271, "epoch": 4569} {"train_loss": -26.439929962158203, "global_step": 379272, "epoch": 4569} {"train_loss": -26.44032859802246, "global_step": 379273, "epoch": 4569} {"train_loss": -26.249303817749023, "global_step": 379274, "epoch": 4569} {"train_loss": -26.348175048828125, "global_step": 379275, "epoch": 4569} {"train_loss": -26.417938232421875, "global_step": 379276, "epoch": 4569} {"train_loss": -26.365568161010742, "global_step": 379277, "epoch": 4569} {"train_loss": -26.545745849609375, "global_step": 379278, "epoch": 4569} {"train_loss": -26.0914306640625, "global_step": 379279, "epoch": 4569} {"train_loss": -26.705554962158203, "global_step": 379280, "epoch": 4569} {"train_loss": -26.575550079345703, "global_step": 379281, "epoch": 4569} {"train_loss": -26.594745635986328, "global_step": 379282, "epoch": 4569} {"train_loss": -26.636493682861328, "global_step": 379283, "epoch": 4569} {"train_loss": -26.6641845703125, "global_step": 379284, "epoch": 4569} {"train_loss": -26.4348087310791, "global_step": 379285, "epoch": 4569} {"train_loss": -26.483291625976562, "global_step": 379286, "epoch": 4569} {"train_loss": -26.215585708618164, "global_step": 379287, "epoch": 4569} {"train_loss": -26.567493438720703, "global_step": 379288, "epoch": 4569} {"train_loss": -26.385974884033203, "global_step": 379289, "epoch": 4569} {"train_loss": -26.858259201049805, "global_step": 379290, "epoch": 4569} {"train_loss": -26.649656295776367, "global_step": 379291, "epoch": 4569} {"train_loss": -27.033130645751953, "global_step": 379292, "epoch": 4569} {"train_loss": -26.59565544128418, "global_step": 379293, "epoch": 4569} {"train_loss": -26.432205200195312, "global_step": 379294, "epoch": 4569} {"train_loss": -26.109006881713867, "global_step": 379295, "epoch": 4569} {"train_loss": -26.787506103515625, "global_step": 379296, "epoch": 4569} {"train_loss": -26.549503326416016, "global_step": 379297, "epoch": 4569} {"train_loss": -26.906782150268555, "global_step": 379298, "epoch": 4569} {"train_loss": -26.340133666992188, "global_step": 379299, "epoch": 4569} {"train_loss": -26.591760635375977, "global_step": 379300, "epoch": 4569} {"train_loss": -26.5692081451416, "global_step": 379301, "epoch": 4569} {"train_loss": -26.68379020690918, "global_step": 379302, "epoch": 4569} {"train_loss": -26.5467472076416, "global_step": 379303, "epoch": 4569} {"train_loss": -26.3099308013916, "global_step": 379304, "epoch": 4569} {"train_loss": -26.596540451049805, "global_step": 379305, "epoch": 4569} {"train_loss": -26.651824951171875, "global_step": 379306, "epoch": 4569} {"train_loss": -26.606664657592773, "global_step": 379307, "epoch": 4569} {"train_loss": -26.910863876342773, "global_step": 379308, "epoch": 4569} {"train_loss": -26.455389068787355, "global_step": 379309, "epoch": 4569, "val_loss": 6618123.5} {"train_loss": -22.197607040405273, "global_step": 379310, "epoch": 4570} {"train_loss": -19.620214462280273, "global_step": 379311, "epoch": 4570} {"train_loss": -22.563369750976562, "global_step": 379312, "epoch": 4570} {"train_loss": -25.087928771972656, "global_step": 379313, "epoch": 4570} {"train_loss": -24.096637725830078, "global_step": 379314, "epoch": 4570} {"train_loss": -24.37244987487793, "global_step": 379315, "epoch": 4570} {"train_loss": -23.991455078125, "global_step": 379316, "epoch": 4570} {"train_loss": -25.214183807373047, "global_step": 379317, "epoch": 4570} {"train_loss": -24.606094360351562, "global_step": 379318, "epoch": 4570} {"train_loss": -24.699277877807617, "global_step": 379319, "epoch": 4570} {"train_loss": -24.957645416259766, "global_step": 379320, "epoch": 4570} {"train_loss": -25.1291446685791, "global_step": 379321, "epoch": 4570} {"train_loss": -24.759946823120117, "global_step": 379322, "epoch": 4570} {"train_loss": -24.942604064941406, "global_step": 379323, "epoch": 4570} {"train_loss": -25.183408737182617, "global_step": 379324, "epoch": 4570} {"train_loss": -25.59077262878418, "global_step": 379325, "epoch": 4570} {"train_loss": -25.086637496948242, "global_step": 379326, "epoch": 4570} {"train_loss": -25.236310958862305, "global_step": 379327, "epoch": 4570} {"train_loss": -25.522581100463867, "global_step": 379328, "epoch": 4570} {"train_loss": -25.323917388916016, "global_step": 379329, "epoch": 4570} {"train_loss": -25.262128829956055, "global_step": 379330, "epoch": 4570} {"train_loss": -25.48676872253418, "global_step": 379331, "epoch": 4570} {"train_loss": -25.54851722717285, "global_step": 379332, "epoch": 4570} {"train_loss": -25.924585342407227, "global_step": 379333, "epoch": 4570} {"train_loss": -25.975488662719727, "global_step": 379334, "epoch": 4570} {"train_loss": -25.55918312072754, "global_step": 379335, "epoch": 4570} {"train_loss": -25.886367797851562, "global_step": 379336, "epoch": 4570} {"train_loss": -25.7934513092041, "global_step": 379337, "epoch": 4570} {"train_loss": -25.60202407836914, "global_step": 379338, "epoch": 4570} {"train_loss": -25.71717643737793, "global_step": 379339, "epoch": 4570} {"train_loss": -26.337934494018555, "global_step": 379340, "epoch": 4570} {"train_loss": -25.797107696533203, "global_step": 379341, "epoch": 4570} {"train_loss": -25.854022979736328, "global_step": 379342, "epoch": 4570} {"train_loss": -26.149261474609375, "global_step": 379343, "epoch": 4570} {"train_loss": -25.989700317382812, "global_step": 379344, "epoch": 4570} {"train_loss": -25.781143188476562, "global_step": 379345, "epoch": 4570} {"train_loss": -26.200668334960938, "global_step": 379346, "epoch": 4570} {"train_loss": -26.00245475769043, "global_step": 379347, "epoch": 4570} {"train_loss": -26.18853759765625, "global_step": 379348, "epoch": 4570} {"train_loss": -26.148365020751953, "global_step": 379349, "epoch": 4570} {"train_loss": -26.566205978393555, "global_step": 379350, "epoch": 4570} {"train_loss": -26.335737228393555, "global_step": 379351, "epoch": 4570} {"train_loss": -26.694467544555664, "global_step": 379352, "epoch": 4570} {"train_loss": -26.422697067260742, "global_step": 379353, "epoch": 4570} {"train_loss": -26.5673885345459, "global_step": 379354, "epoch": 4570} {"train_loss": -26.38248634338379, "global_step": 379355, "epoch": 4570} {"train_loss": -26.298810958862305, "global_step": 379356, "epoch": 4570} {"train_loss": -26.535669326782227, "global_step": 379357, "epoch": 4570} {"train_loss": -26.673887252807617, "global_step": 379358, "epoch": 4570} {"train_loss": -26.52857780456543, "global_step": 379359, "epoch": 4570} {"train_loss": -26.673114776611328, "global_step": 379360, "epoch": 4570} {"train_loss": -26.510150909423828, "global_step": 379361, "epoch": 4570} {"train_loss": -26.543155670166016, "global_step": 379362, "epoch": 4570} {"train_loss": -26.713459014892578, "global_step": 379363, "epoch": 4570} {"train_loss": -26.843225479125977, "global_step": 379364, "epoch": 4570} {"train_loss": -26.8452091217041, "global_step": 379365, "epoch": 4570} {"train_loss": -26.6649112701416, "global_step": 379366, "epoch": 4570} {"train_loss": -26.42439079284668, "global_step": 379367, "epoch": 4570} {"train_loss": -26.962146759033203, "global_step": 379368, "epoch": 4570} {"train_loss": -26.725751876831055, "global_step": 379369, "epoch": 4570} {"train_loss": -26.756162643432617, "global_step": 379370, "epoch": 4570} {"train_loss": -26.389577865600586, "global_step": 379371, "epoch": 4570} {"train_loss": -26.777118682861328, "global_step": 379372, "epoch": 4570} {"train_loss": -26.598386764526367, "global_step": 379373, "epoch": 4570} {"train_loss": -26.3194580078125, "global_step": 379374, "epoch": 4570} {"train_loss": -26.344884872436523, "global_step": 379375, "epoch": 4570} {"train_loss": -26.71991539001465, "global_step": 379376, "epoch": 4570} {"train_loss": -26.369049072265625, "global_step": 379377, "epoch": 4570} {"train_loss": -26.888513565063477, "global_step": 379378, "epoch": 4570} {"train_loss": -26.647069931030273, "global_step": 379379, "epoch": 4570} {"train_loss": -26.6126766204834, "global_step": 379380, "epoch": 4570} {"train_loss": -26.5093994140625, "global_step": 379381, "epoch": 4570} {"train_loss": -26.8106746673584, "global_step": 379382, "epoch": 4570} {"train_loss": -26.728002548217773, "global_step": 379383, "epoch": 4570} {"train_loss": -26.60633659362793, "global_step": 379384, "epoch": 4570} {"train_loss": -26.7459774017334, "global_step": 379385, "epoch": 4570} {"train_loss": -26.665390014648438, "global_step": 379386, "epoch": 4570} {"train_loss": -26.63020133972168, "global_step": 379387, "epoch": 4570} {"train_loss": -26.6458683013916, "global_step": 379388, "epoch": 4570} {"train_loss": -26.45148277282715, "global_step": 379389, "epoch": 4570} {"train_loss": -26.312429428100586, "global_step": 379390, "epoch": 4570} {"train_loss": -26.798492431640625, "global_step": 379391, "epoch": 4570} {"train_loss": -25.88478614623288, "global_step": 379392, "epoch": 4570, "val_loss": 6560915.5} {"train_loss": -25.24956703186035, "global_step": 379393, "epoch": 4571} {"train_loss": -24.153881072998047, "global_step": 379394, "epoch": 4571} {"train_loss": -25.54549789428711, "global_step": 379395, "epoch": 4571} {"train_loss": -25.786441802978516, "global_step": 379396, "epoch": 4571} {"train_loss": -25.564695358276367, "global_step": 379397, "epoch": 4571} {"train_loss": -25.34701156616211, "global_step": 379398, "epoch": 4571} {"train_loss": -26.2280216217041, "global_step": 379399, "epoch": 4571} {"train_loss": -25.812833786010742, "global_step": 379400, "epoch": 4571} {"train_loss": -26.12067985534668, "global_step": 379401, "epoch": 4571} {"train_loss": -25.992706298828125, "global_step": 379402, "epoch": 4571} {"train_loss": -26.285165786743164, "global_step": 379403, "epoch": 4571} {"train_loss": -26.27178955078125, "global_step": 379404, "epoch": 4571} {"train_loss": -26.186756134033203, "global_step": 379405, "epoch": 4571} {"train_loss": -26.185632705688477, "global_step": 379406, "epoch": 4571} {"train_loss": -26.383392333984375, "global_step": 379407, "epoch": 4571} {"train_loss": -26.450225830078125, "global_step": 379408, "epoch": 4571} {"train_loss": -26.488956451416016, "global_step": 379409, "epoch": 4571} {"train_loss": -26.0003604888916, "global_step": 379410, "epoch": 4571} {"train_loss": -26.427072525024414, "global_step": 379411, "epoch": 4571} {"train_loss": -26.051380157470703, "global_step": 379412, "epoch": 4571} {"train_loss": -26.182531356811523, "global_step": 379413, "epoch": 4571} {"train_loss": -26.549951553344727, "global_step": 379414, "epoch": 4571} {"train_loss": -26.687524795532227, "global_step": 379415, "epoch": 4571} {"train_loss": -26.35529136657715, "global_step": 379416, "epoch": 4571} {"train_loss": -26.529226303100586, "global_step": 379417, "epoch": 4571} {"train_loss": -26.2221622467041, "global_step": 379418, "epoch": 4571} {"train_loss": -26.536298751831055, "global_step": 379419, "epoch": 4571} {"train_loss": -26.464447021484375, "global_step": 379420, "epoch": 4571} {"train_loss": -26.521814346313477, "global_step": 379421, "epoch": 4571} {"train_loss": -26.52497673034668, "global_step": 379422, "epoch": 4571} {"train_loss": -26.36860466003418, "global_step": 379423, "epoch": 4571} {"train_loss": -26.483051300048828, "global_step": 379424, "epoch": 4571} {"train_loss": -26.502099990844727, "global_step": 379425, "epoch": 4571} {"train_loss": -26.87006950378418, "global_step": 379426, "epoch": 4571} {"train_loss": -26.58255386352539, "global_step": 379427, "epoch": 4571} {"train_loss": -26.621503829956055, "global_step": 379428, "epoch": 4571} {"train_loss": -26.79999351501465, "global_step": 379429, "epoch": 4571} {"train_loss": -26.637426376342773, "global_step": 379430, "epoch": 4571} {"train_loss": -26.83613395690918, "global_step": 379431, "epoch": 4571} {"train_loss": -26.744470596313477, "global_step": 379432, "epoch": 4571} {"train_loss": -27.009008407592773, "global_step": 379433, "epoch": 4571} {"train_loss": -26.8896484375, "global_step": 379434, "epoch": 4571} {"train_loss": -26.797224044799805, "global_step": 379435, "epoch": 4571} {"train_loss": -26.52385902404785, "global_step": 379436, "epoch": 4571} {"train_loss": -26.633222579956055, "global_step": 379437, "epoch": 4571} {"train_loss": -26.66244888305664, "global_step": 379438, "epoch": 4571} {"train_loss": -26.21298599243164, "global_step": 379439, "epoch": 4571} {"train_loss": -26.5695858001709, "global_step": 379440, "epoch": 4571} {"train_loss": -26.490888595581055, "global_step": 379441, "epoch": 4571} {"train_loss": -26.56658363342285, "global_step": 379442, "epoch": 4571} {"train_loss": -26.382862091064453, "global_step": 379443, "epoch": 4571} {"train_loss": -26.503173828125, "global_step": 379444, "epoch": 4571} {"train_loss": -26.564138412475586, "global_step": 379445, "epoch": 4571} {"train_loss": -27.065265655517578, "global_step": 379446, "epoch": 4571} {"train_loss": -26.552143096923828, "global_step": 379447, "epoch": 4571} {"train_loss": -26.45977210998535, "global_step": 379448, "epoch": 4571} {"train_loss": -26.43256187438965, "global_step": 379449, "epoch": 4571} {"train_loss": -26.449735641479492, "global_step": 379450, "epoch": 4571} {"train_loss": -26.385038375854492, "global_step": 379451, "epoch": 4571} {"train_loss": -26.07594108581543, "global_step": 379452, "epoch": 4571} {"train_loss": -26.015888214111328, "global_step": 379453, "epoch": 4571} {"train_loss": -26.174062728881836, "global_step": 379454, "epoch": 4571} {"train_loss": -26.434926986694336, "global_step": 379455, "epoch": 4571} {"train_loss": -26.254791259765625, "global_step": 379456, "epoch": 4571} {"train_loss": -26.5041446685791, "global_step": 379457, "epoch": 4571} {"train_loss": -26.854022979736328, "global_step": 379458, "epoch": 4571} {"train_loss": -26.458026885986328, "global_step": 379459, "epoch": 4571} {"train_loss": -26.366840362548828, "global_step": 379460, "epoch": 4571} {"train_loss": -26.30879020690918, "global_step": 379461, "epoch": 4571} {"train_loss": -26.220651626586914, "global_step": 379462, "epoch": 4571} {"train_loss": -26.84797477722168, "global_step": 379463, "epoch": 4571} {"train_loss": -26.595014572143555, "global_step": 379464, "epoch": 4571} {"train_loss": -26.52919578552246, "global_step": 379465, "epoch": 4571} {"train_loss": -26.456396102905273, "global_step": 379466, "epoch": 4571} {"train_loss": -26.394550323486328, "global_step": 379467, "epoch": 4571} {"train_loss": -26.469778060913086, "global_step": 379468, "epoch": 4571} {"train_loss": -26.321008682250977, "global_step": 379469, "epoch": 4571} {"train_loss": -26.36223793029785, "global_step": 379470, "epoch": 4571} {"train_loss": -26.490949630737305, "global_step": 379471, "epoch": 4571} {"train_loss": -26.741418838500977, "global_step": 379472, "epoch": 4571} {"train_loss": -26.46524429321289, "global_step": 379473, "epoch": 4571} {"train_loss": -26.477888107299805, "global_step": 379474, "epoch": 4571} {"train_loss": -26.368643381509436, "global_step": 379475, "epoch": 4571, "val_loss": 6683076.0} {"train_loss": -26.133947372436523, "global_step": 379476, "epoch": 4572} {"train_loss": -25.577104568481445, "global_step": 379477, "epoch": 4572} {"train_loss": -25.85621452331543, "global_step": 379478, "epoch": 4572} {"train_loss": -26.102313995361328, "global_step": 379479, "epoch": 4572} {"train_loss": -25.92431640625, "global_step": 379480, "epoch": 4572} {"train_loss": -25.804279327392578, "global_step": 379481, "epoch": 4572} {"train_loss": -26.392621994018555, "global_step": 379482, "epoch": 4572} {"train_loss": -25.86883544921875, "global_step": 379483, "epoch": 4572} {"train_loss": -25.8511962890625, "global_step": 379484, "epoch": 4572} {"train_loss": -25.99884605407715, "global_step": 379485, "epoch": 4572} {"train_loss": -25.95878028869629, "global_step": 379486, "epoch": 4572} {"train_loss": -26.230560302734375, "global_step": 379487, "epoch": 4572} {"train_loss": -25.624378204345703, "global_step": 379488, "epoch": 4572} {"train_loss": -26.41444969177246, "global_step": 379489, "epoch": 4572} {"train_loss": -26.309743881225586, "global_step": 379490, "epoch": 4572} {"train_loss": -26.633716583251953, "global_step": 379491, "epoch": 4572} {"train_loss": -26.01079750061035, "global_step": 379492, "epoch": 4572} {"train_loss": -26.058374404907227, "global_step": 379493, "epoch": 4572} {"train_loss": -26.24032974243164, "global_step": 379494, "epoch": 4572} {"train_loss": -26.527149200439453, "global_step": 379495, "epoch": 4572} {"train_loss": -26.46843910217285, "global_step": 379496, "epoch": 4572} {"train_loss": -26.2957820892334, "global_step": 379497, "epoch": 4572} {"train_loss": -26.216550827026367, "global_step": 379498, "epoch": 4572} {"train_loss": -26.270172119140625, "global_step": 379499, "epoch": 4572} {"train_loss": -26.62921714782715, "global_step": 379500, "epoch": 4572} {"train_loss": -26.217260360717773, "global_step": 379501, "epoch": 4572} {"train_loss": -26.6364688873291, "global_step": 379502, "epoch": 4572} {"train_loss": -26.2471866607666, "global_step": 379503, "epoch": 4572} {"train_loss": -26.4598445892334, "global_step": 379504, "epoch": 4572} {"train_loss": -26.450525283813477, "global_step": 379505, "epoch": 4572} {"train_loss": -26.473388671875, "global_step": 379506, "epoch": 4572} {"train_loss": -26.366626739501953, "global_step": 379507, "epoch": 4572} {"train_loss": -26.477802276611328, "global_step": 379508, "epoch": 4572} {"train_loss": -26.561323165893555, "global_step": 379509, "epoch": 4572} {"train_loss": -26.594074249267578, "global_step": 379510, "epoch": 4572} {"train_loss": -26.758045196533203, "global_step": 379511, "epoch": 4572} {"train_loss": -26.400466918945312, "global_step": 379512, "epoch": 4572} {"train_loss": -26.497241973876953, "global_step": 379513, "epoch": 4572} {"train_loss": -26.45684242248535, "global_step": 379514, "epoch": 4572} {"train_loss": -26.73552894592285, "global_step": 379515, "epoch": 4572} {"train_loss": -26.495187759399414, "global_step": 379516, "epoch": 4572} {"train_loss": -26.658416748046875, "global_step": 379517, "epoch": 4572} {"train_loss": -26.75654411315918, "global_step": 379518, "epoch": 4572} {"train_loss": -26.450109481811523, "global_step": 379519, "epoch": 4572} {"train_loss": -26.661396026611328, "global_step": 379520, "epoch": 4572} {"train_loss": -26.522705078125, "global_step": 379521, "epoch": 4572} {"train_loss": -27.107824325561523, "global_step": 379522, "epoch": 4572} {"train_loss": -26.827051162719727, "global_step": 379523, "epoch": 4572} {"train_loss": -26.654027938842773, "global_step": 379524, "epoch": 4572} {"train_loss": -26.516149520874023, "global_step": 379525, "epoch": 4572} {"train_loss": -26.18729019165039, "global_step": 379526, "epoch": 4572} {"train_loss": -26.727909088134766, "global_step": 379527, "epoch": 4572} {"train_loss": -26.18598747253418, "global_step": 379528, "epoch": 4572} {"train_loss": -26.598773956298828, "global_step": 379529, "epoch": 4572} {"train_loss": -26.553068161010742, "global_step": 379530, "epoch": 4572} {"train_loss": -26.98042106628418, "global_step": 379531, "epoch": 4572} {"train_loss": -26.720935821533203, "global_step": 379532, "epoch": 4572} {"train_loss": -26.697248458862305, "global_step": 379533, "epoch": 4572} {"train_loss": -26.941211700439453, "global_step": 379534, "epoch": 4572} {"train_loss": -26.47181510925293, "global_step": 379535, "epoch": 4572} {"train_loss": -26.81635856628418, "global_step": 379536, "epoch": 4572} {"train_loss": -26.580066680908203, "global_step": 379537, "epoch": 4572} {"train_loss": -26.66517448425293, "global_step": 379538, "epoch": 4572} {"train_loss": -26.67142677307129, "global_step": 379539, "epoch": 4572} {"train_loss": -26.734210968017578, "global_step": 379540, "epoch": 4572} {"train_loss": -26.476831436157227, "global_step": 379541, "epoch": 4572} {"train_loss": -26.818435668945312, "global_step": 379542, "epoch": 4572} {"train_loss": -26.5642147064209, "global_step": 379543, "epoch": 4572} {"train_loss": -26.887332916259766, "global_step": 379544, "epoch": 4572} {"train_loss": -26.5367488861084, "global_step": 379545, "epoch": 4572} {"train_loss": -26.783109664916992, "global_step": 379546, "epoch": 4572} {"train_loss": -26.172712326049805, "global_step": 379547, "epoch": 4572} {"train_loss": -26.591764450073242, "global_step": 379548, "epoch": 4572} {"train_loss": -26.782026290893555, "global_step": 379549, "epoch": 4572} {"train_loss": -26.29485511779785, "global_step": 379550, "epoch": 4572} {"train_loss": -26.27052879333496, "global_step": 379551, "epoch": 4572} {"train_loss": -26.794702529907227, "global_step": 379552, "epoch": 4572} {"train_loss": -26.533145904541016, "global_step": 379553, "epoch": 4572} {"train_loss": -26.24323844909668, "global_step": 379554, "epoch": 4572} {"train_loss": -25.836023330688477, "global_step": 379555, "epoch": 4572} {"train_loss": -25.993566513061523, "global_step": 379556, "epoch": 4572} {"train_loss": -25.91219139099121, "global_step": 379557, "epoch": 4572} {"train_loss": -26.402705410876905, "global_step": 379558, "epoch": 4572, "val_loss": 6528998.0} {"train_loss": -24.50876808166504, "global_step": 379559, "epoch": 4573} {"train_loss": -22.586360931396484, "global_step": 379560, "epoch": 4573} {"train_loss": -23.636016845703125, "global_step": 379561, "epoch": 4573} {"train_loss": -24.15163230895996, "global_step": 379562, "epoch": 4573} {"train_loss": -25.27215576171875, "global_step": 379563, "epoch": 4573} {"train_loss": -24.50004005432129, "global_step": 379564, "epoch": 4573} {"train_loss": -25.072120666503906, "global_step": 379565, "epoch": 4573} {"train_loss": -25.12775993347168, "global_step": 379566, "epoch": 4573} {"train_loss": -25.09551429748535, "global_step": 379567, "epoch": 4573} {"train_loss": -25.503154754638672, "global_step": 379568, "epoch": 4573} {"train_loss": -25.25655174255371, "global_step": 379569, "epoch": 4573} {"train_loss": -25.828588485717773, "global_step": 379570, "epoch": 4573} {"train_loss": -25.410812377929688, "global_step": 379571, "epoch": 4573} {"train_loss": -25.48015594482422, "global_step": 379572, "epoch": 4573} {"train_loss": -25.67133140563965, "global_step": 379573, "epoch": 4573} {"train_loss": -25.825775146484375, "global_step": 379574, "epoch": 4573} {"train_loss": -25.65040397644043, "global_step": 379575, "epoch": 4573} {"train_loss": -25.566905975341797, "global_step": 379576, "epoch": 4573} {"train_loss": -25.6492862701416, "global_step": 379577, "epoch": 4573} {"train_loss": -25.721332550048828, "global_step": 379578, "epoch": 4573} {"train_loss": -25.31987953186035, "global_step": 379579, "epoch": 4573} {"train_loss": -25.882953643798828, "global_step": 379580, "epoch": 4573} {"train_loss": -25.6112003326416, "global_step": 379581, "epoch": 4573} {"train_loss": -25.656417846679688, "global_step": 379582, "epoch": 4573} {"train_loss": -26.261884689331055, "global_step": 379583, "epoch": 4573} {"train_loss": -25.70851707458496, "global_step": 379584, "epoch": 4573} {"train_loss": -26.044340133666992, "global_step": 379585, "epoch": 4573} {"train_loss": -25.984121322631836, "global_step": 379586, "epoch": 4573} {"train_loss": -26.0538330078125, "global_step": 379587, "epoch": 4573} {"train_loss": -25.91694450378418, "global_step": 379588, "epoch": 4573} {"train_loss": -26.207197189331055, "global_step": 379589, "epoch": 4573} {"train_loss": -25.956298828125, "global_step": 379590, "epoch": 4573} {"train_loss": -26.08298683166504, "global_step": 379591, "epoch": 4573} {"train_loss": -25.886682510375977, "global_step": 379592, "epoch": 4573} {"train_loss": -26.181299209594727, "global_step": 379593, "epoch": 4573} {"train_loss": -26.10150146484375, "global_step": 379594, "epoch": 4573} {"train_loss": -25.93732261657715, "global_step": 379595, "epoch": 4573} {"train_loss": -26.021656036376953, "global_step": 379596, "epoch": 4573} {"train_loss": -26.326704025268555, "global_step": 379597, "epoch": 4573} {"train_loss": -26.39569091796875, "global_step": 379598, "epoch": 4573} {"train_loss": -26.11151695251465, "global_step": 379599, "epoch": 4573} {"train_loss": -26.565093994140625, "global_step": 379600, "epoch": 4573} {"train_loss": -26.201337814331055, "global_step": 379601, "epoch": 4573} {"train_loss": -26.335052490234375, "global_step": 379602, "epoch": 4573} {"train_loss": -26.560495376586914, "global_step": 379603, "epoch": 4573} {"train_loss": -26.497053146362305, "global_step": 379604, "epoch": 4573} {"train_loss": -26.4732666015625, "global_step": 379605, "epoch": 4573} {"train_loss": -26.453510284423828, "global_step": 379606, "epoch": 4573} {"train_loss": -26.28351402282715, "global_step": 379607, "epoch": 4573} {"train_loss": -26.939029693603516, "global_step": 379608, "epoch": 4573} {"train_loss": -26.544553756713867, "global_step": 379609, "epoch": 4573} {"train_loss": -26.53285026550293, "global_step": 379610, "epoch": 4573} {"train_loss": -26.444067001342773, "global_step": 379611, "epoch": 4573} {"train_loss": -26.653905868530273, "global_step": 379612, "epoch": 4573} {"train_loss": -26.39298439025879, "global_step": 379613, "epoch": 4573} {"train_loss": -26.137495040893555, "global_step": 379614, "epoch": 4573} {"train_loss": -26.433460235595703, "global_step": 379615, "epoch": 4573} {"train_loss": -26.700239181518555, "global_step": 379616, "epoch": 4573} {"train_loss": -26.588281631469727, "global_step": 379617, "epoch": 4573} {"train_loss": -26.75575828552246, "global_step": 379618, "epoch": 4573} {"train_loss": -26.883747100830078, "global_step": 379619, "epoch": 4573} {"train_loss": -26.51485252380371, "global_step": 379620, "epoch": 4573} {"train_loss": -26.909128189086914, "global_step": 379621, "epoch": 4573} {"train_loss": -27.242374420166016, "global_step": 379622, "epoch": 4573} {"train_loss": -26.309864044189453, "global_step": 379623, "epoch": 4573} {"train_loss": -26.504413604736328, "global_step": 379624, "epoch": 4573} {"train_loss": -26.383031845092773, "global_step": 379625, "epoch": 4573} {"train_loss": -26.50251579284668, "global_step": 379626, "epoch": 4573} {"train_loss": -26.29485511779785, "global_step": 379627, "epoch": 4573} {"train_loss": -26.967954635620117, "global_step": 379628, "epoch": 4573} {"train_loss": -26.6221866607666, "global_step": 379629, "epoch": 4573} {"train_loss": -26.636316299438477, "global_step": 379630, "epoch": 4573} {"train_loss": -26.30512046813965, "global_step": 379631, "epoch": 4573} {"train_loss": -26.747934341430664, "global_step": 379632, "epoch": 4573} {"train_loss": -26.5919246673584, "global_step": 379633, "epoch": 4573} {"train_loss": -26.204010009765625, "global_step": 379634, "epoch": 4573} {"train_loss": -26.432270050048828, "global_step": 379635, "epoch": 4573} {"train_loss": -26.491174697875977, "global_step": 379636, "epoch": 4573} {"train_loss": -26.769712448120117, "global_step": 379637, "epoch": 4573} {"train_loss": -26.580631256103516, "global_step": 379638, "epoch": 4573} {"train_loss": -26.4486026763916, "global_step": 379639, "epoch": 4573} {"train_loss": -26.278018951416016, "global_step": 379640, "epoch": 4573} {"train_loss": -26.029195004198925, "global_step": 379641, "epoch": 4573, "val_loss": 6657220.5} {"train_loss": -25.969335556030273, "global_step": 379642, "epoch": 4574} {"train_loss": -25.993566513061523, "global_step": 379643, "epoch": 4574} {"train_loss": -25.746061325073242, "global_step": 379644, "epoch": 4574} {"train_loss": -26.007953643798828, "global_step": 379645, "epoch": 4574} {"train_loss": -26.249588012695312, "global_step": 379646, "epoch": 4574} {"train_loss": -26.20953369140625, "global_step": 379647, "epoch": 4574} {"train_loss": -26.2230281829834, "global_step": 379648, "epoch": 4574} {"train_loss": -26.163496017456055, "global_step": 379649, "epoch": 4574} {"train_loss": -26.332477569580078, "global_step": 379650, "epoch": 4574} {"train_loss": -26.097158432006836, "global_step": 379651, "epoch": 4574} {"train_loss": -26.45123863220215, "global_step": 379652, "epoch": 4574} {"train_loss": -26.036649703979492, "global_step": 379653, "epoch": 4574} {"train_loss": -26.62175941467285, "global_step": 379654, "epoch": 4574} {"train_loss": -26.55124282836914, "global_step": 379655, "epoch": 4574} {"train_loss": -26.122888565063477, "global_step": 379656, "epoch": 4574} {"train_loss": -26.479406356811523, "global_step": 379657, "epoch": 4574} {"train_loss": -25.78852653503418, "global_step": 379658, "epoch": 4574} {"train_loss": -26.767969131469727, "global_step": 379659, "epoch": 4574} {"train_loss": -26.446191787719727, "global_step": 379660, "epoch": 4574} {"train_loss": -25.971078872680664, "global_step": 379661, "epoch": 4574} {"train_loss": -26.35209083557129, "global_step": 379662, "epoch": 4574} {"train_loss": -26.31745719909668, "global_step": 379663, "epoch": 4574} {"train_loss": -25.759119033813477, "global_step": 379664, "epoch": 4574} {"train_loss": -26.27004051208496, "global_step": 379665, "epoch": 4574} {"train_loss": -26.252975463867188, "global_step": 379666, "epoch": 4574} {"train_loss": -26.271926879882812, "global_step": 379667, "epoch": 4574} {"train_loss": -26.270069122314453, "global_step": 379668, "epoch": 4574} {"train_loss": -26.082204818725586, "global_step": 379669, "epoch": 4574} {"train_loss": -26.178577423095703, "global_step": 379670, "epoch": 4574} {"train_loss": -26.522287368774414, "global_step": 379671, "epoch": 4574} {"train_loss": -26.72711753845215, "global_step": 379672, "epoch": 4574} {"train_loss": -26.60816764831543, "global_step": 379673, "epoch": 4574} {"train_loss": -26.57394790649414, "global_step": 379674, "epoch": 4574} {"train_loss": -26.582401275634766, "global_step": 379675, "epoch": 4574} {"train_loss": -26.644351959228516, "global_step": 379676, "epoch": 4574} {"train_loss": -26.38779640197754, "global_step": 379677, "epoch": 4574} {"train_loss": -26.840030670166016, "global_step": 379678, "epoch": 4574} {"train_loss": -26.268239974975586, "global_step": 379679, "epoch": 4574} {"train_loss": -26.115234375, "global_step": 379680, "epoch": 4574} {"train_loss": -26.388431549072266, "global_step": 379681, "epoch": 4574} {"train_loss": -26.57721519470215, "global_step": 379682, "epoch": 4574} {"train_loss": -26.15066909790039, "global_step": 379683, "epoch": 4574} {"train_loss": -26.190235137939453, "global_step": 379684, "epoch": 4574} {"train_loss": -26.11763572692871, "global_step": 379685, "epoch": 4574} {"train_loss": -26.330982208251953, "global_step": 379686, "epoch": 4574} {"train_loss": -26.800947189331055, "global_step": 379687, "epoch": 4574} {"train_loss": -26.384754180908203, "global_step": 379688, "epoch": 4574} {"train_loss": -26.31812858581543, "global_step": 379689, "epoch": 4574} {"train_loss": -26.375263214111328, "global_step": 379690, "epoch": 4574} {"train_loss": -26.694156646728516, "global_step": 379691, "epoch": 4574} {"train_loss": -25.786115646362305, "global_step": 379692, "epoch": 4574} {"train_loss": -26.5867862701416, "global_step": 379693, "epoch": 4574} {"train_loss": -27.028289794921875, "global_step": 379694, "epoch": 4574} {"train_loss": -26.277210235595703, "global_step": 379695, "epoch": 4574} {"train_loss": -26.82996940612793, "global_step": 379696, "epoch": 4574} {"train_loss": -26.757858276367188, "global_step": 379697, "epoch": 4574} {"train_loss": -26.1772403717041, "global_step": 379698, "epoch": 4574} {"train_loss": -26.535619735717773, "global_step": 379699, "epoch": 4574} {"train_loss": -26.159225463867188, "global_step": 379700, "epoch": 4574} {"train_loss": -26.13191032409668, "global_step": 379701, "epoch": 4574} {"train_loss": -26.61439323425293, "global_step": 379702, "epoch": 4574} {"train_loss": -26.548513412475586, "global_step": 379703, "epoch": 4574} {"train_loss": -26.690540313720703, "global_step": 379704, "epoch": 4574} {"train_loss": -26.45954704284668, "global_step": 379705, "epoch": 4574} {"train_loss": -26.239057540893555, "global_step": 379706, "epoch": 4574} {"train_loss": -26.672155380249023, "global_step": 379707, "epoch": 4574} {"train_loss": -25.98854637145996, "global_step": 379708, "epoch": 4574} {"train_loss": -25.849960327148438, "global_step": 379709, "epoch": 4574} {"train_loss": -25.949268341064453, "global_step": 379710, "epoch": 4574} {"train_loss": -25.81226921081543, "global_step": 379711, "epoch": 4574} {"train_loss": -26.058399200439453, "global_step": 379712, "epoch": 4574} {"train_loss": -26.34295654296875, "global_step": 379713, "epoch": 4574} {"train_loss": -26.17970085144043, "global_step": 379714, "epoch": 4574} {"train_loss": -26.530664443969727, "global_step": 379715, "epoch": 4574} {"train_loss": -26.412633895874023, "global_step": 379716, "epoch": 4574} {"train_loss": -26.528656005859375, "global_step": 379717, "epoch": 4574} {"train_loss": -26.4040584564209, "global_step": 379718, "epoch": 4574} {"train_loss": -26.480764389038086, "global_step": 379719, "epoch": 4574} {"train_loss": -26.592239379882812, "global_step": 379720, "epoch": 4574} {"train_loss": -26.36604881286621, "global_step": 379721, "epoch": 4574} {"train_loss": -26.31186294555664, "global_step": 379722, "epoch": 4574} {"train_loss": -26.2706298828125, "global_step": 379723, "epoch": 4574} {"train_loss": -26.326377087328808, "global_step": 379724, "epoch": 4574, "val_loss": 6535624.0} {"train_loss": -26.02187156677246, "global_step": 379725, "epoch": 4575} {"train_loss": -25.74941062927246, "global_step": 379726, "epoch": 4575} {"train_loss": -25.92743492126465, "global_step": 379727, "epoch": 4575} {"train_loss": -25.76090431213379, "global_step": 379728, "epoch": 4575} {"train_loss": -25.9243106842041, "global_step": 379729, "epoch": 4575} {"train_loss": -25.494054794311523, "global_step": 379730, "epoch": 4575} {"train_loss": -26.0273494720459, "global_step": 379731, "epoch": 4575} {"train_loss": -25.559175491333008, "global_step": 379732, "epoch": 4575} {"train_loss": -25.871936798095703, "global_step": 379733, "epoch": 4575} {"train_loss": -26.006921768188477, "global_step": 379734, "epoch": 4575} {"train_loss": -25.8605899810791, "global_step": 379735, "epoch": 4575} {"train_loss": -26.307912826538086, "global_step": 379736, "epoch": 4575} {"train_loss": -26.06597328186035, "global_step": 379737, "epoch": 4575} {"train_loss": -26.436059951782227, "global_step": 379738, "epoch": 4575} {"train_loss": -26.402664184570312, "global_step": 379739, "epoch": 4575} {"train_loss": -26.131134033203125, "global_step": 379740, "epoch": 4575} {"train_loss": -26.515869140625, "global_step": 379741, "epoch": 4575} {"train_loss": -26.409210205078125, "global_step": 379742, "epoch": 4575} {"train_loss": -26.2147216796875, "global_step": 379743, "epoch": 4575} {"train_loss": -26.360563278198242, "global_step": 379744, "epoch": 4575} {"train_loss": -26.31361198425293, "global_step": 379745, "epoch": 4575} {"train_loss": -26.062116622924805, "global_step": 379746, "epoch": 4575} {"train_loss": -26.316089630126953, "global_step": 379747, "epoch": 4575} {"train_loss": -26.139856338500977, "global_step": 379748, "epoch": 4575} {"train_loss": -26.236072540283203, "global_step": 379749, "epoch": 4575} {"train_loss": -26.37448501586914, "global_step": 379750, "epoch": 4575} {"train_loss": -26.189138412475586, "global_step": 379751, "epoch": 4575} {"train_loss": -26.335630416870117, "global_step": 379752, "epoch": 4575} {"train_loss": -26.463382720947266, "global_step": 379753, "epoch": 4575} {"train_loss": -26.101648330688477, "global_step": 379754, "epoch": 4575} {"train_loss": -26.8449764251709, "global_step": 379755, "epoch": 4575} {"train_loss": -26.464176177978516, "global_step": 379756, "epoch": 4575} {"train_loss": -26.519861221313477, "global_step": 379757, "epoch": 4575} {"train_loss": -26.552509307861328, "global_step": 379758, "epoch": 4575} {"train_loss": -26.447458267211914, "global_step": 379759, "epoch": 4575} {"train_loss": -26.400543212890625, "global_step": 379760, "epoch": 4575} {"train_loss": -26.468236923217773, "global_step": 379761, "epoch": 4575} {"train_loss": -26.77274513244629, "global_step": 379762, "epoch": 4575} {"train_loss": -26.74773597717285, "global_step": 379763, "epoch": 4575} {"train_loss": -26.65578269958496, "global_step": 379764, "epoch": 4575} {"train_loss": -26.510086059570312, "global_step": 379765, "epoch": 4575} {"train_loss": -26.8962459564209, "global_step": 379766, "epoch": 4575} {"train_loss": -26.641340255737305, "global_step": 379767, "epoch": 4575} {"train_loss": -26.3743839263916, "global_step": 379768, "epoch": 4575} {"train_loss": -26.508834838867188, "global_step": 379769, "epoch": 4575} {"train_loss": -26.36480712890625, "global_step": 379770, "epoch": 4575} {"train_loss": -26.542760848999023, "global_step": 379771, "epoch": 4575} {"train_loss": -26.556974411010742, "global_step": 379772, "epoch": 4575} {"train_loss": -26.811399459838867, "global_step": 379773, "epoch": 4575} {"train_loss": -26.47012710571289, "global_step": 379774, "epoch": 4575} {"train_loss": -26.286285400390625, "global_step": 379775, "epoch": 4575} {"train_loss": -27.19488525390625, "global_step": 379776, "epoch": 4575} {"train_loss": -26.61910057067871, "global_step": 379777, "epoch": 4575} {"train_loss": -26.324838638305664, "global_step": 379778, "epoch": 4575} {"train_loss": -26.456405639648438, "global_step": 379779, "epoch": 4575} {"train_loss": -26.447446823120117, "global_step": 379780, "epoch": 4575} {"train_loss": -26.34016227722168, "global_step": 379781, "epoch": 4575} {"train_loss": -26.622610092163086, "global_step": 379782, "epoch": 4575} {"train_loss": -26.56758689880371, "global_step": 379783, "epoch": 4575} {"train_loss": -26.17716407775879, "global_step": 379784, "epoch": 4575} {"train_loss": -26.2435359954834, "global_step": 379785, "epoch": 4575} {"train_loss": -26.710739135742188, "global_step": 379786, "epoch": 4575} {"train_loss": -26.669723510742188, "global_step": 379787, "epoch": 4575} {"train_loss": -26.519306182861328, "global_step": 379788, "epoch": 4575} {"train_loss": -26.217634201049805, "global_step": 379789, "epoch": 4575} {"train_loss": -26.127426147460938, "global_step": 379790, "epoch": 4575} {"train_loss": -26.514936447143555, "global_step": 379791, "epoch": 4575} {"train_loss": -26.025243759155273, "global_step": 379792, "epoch": 4575} {"train_loss": -25.8985595703125, "global_step": 379793, "epoch": 4575} {"train_loss": -26.509557723999023, "global_step": 379794, "epoch": 4575} {"train_loss": -26.738134384155273, "global_step": 379795, "epoch": 4575} {"train_loss": -26.485509872436523, "global_step": 379796, "epoch": 4575} {"train_loss": -26.32051658630371, "global_step": 379797, "epoch": 4575} {"train_loss": -26.657840728759766, "global_step": 379798, "epoch": 4575} {"train_loss": -26.69681167602539, "global_step": 379799, "epoch": 4575} {"train_loss": -26.335248947143555, "global_step": 379800, "epoch": 4575} {"train_loss": -26.764474868774414, "global_step": 379801, "epoch": 4575} {"train_loss": -25.65789794921875, "global_step": 379802, "epoch": 4575} {"train_loss": -25.8604679107666, "global_step": 379803, "epoch": 4575} {"train_loss": -26.51715660095215, "global_step": 379804, "epoch": 4575} {"train_loss": -26.45313835144043, "global_step": 379805, "epoch": 4575} {"train_loss": -26.45655632019043, "global_step": 379806, "epoch": 4575} {"train_loss": -26.349307025771544, "global_step": 379807, "epoch": 4575, "val_loss": 6615625.5} {"train_loss": -26.2905330657959, "global_step": 379808, "epoch": 4576} {"train_loss": -25.972681045532227, "global_step": 379809, "epoch": 4576} {"train_loss": -26.690475463867188, "global_step": 379810, "epoch": 4576} {"train_loss": -25.944299697875977, "global_step": 379811, "epoch": 4576} {"train_loss": -26.202539443969727, "global_step": 379812, "epoch": 4576} {"train_loss": -25.883386611938477, "global_step": 379813, "epoch": 4576} {"train_loss": -26.21319580078125, "global_step": 379814, "epoch": 4576} {"train_loss": -26.168127059936523, "global_step": 379815, "epoch": 4576} {"train_loss": -26.0942440032959, "global_step": 379816, "epoch": 4576} {"train_loss": -26.033802032470703, "global_step": 379817, "epoch": 4576} {"train_loss": -25.928159713745117, "global_step": 379818, "epoch": 4576} {"train_loss": -26.326711654663086, "global_step": 379819, "epoch": 4576} {"train_loss": -26.173053741455078, "global_step": 379820, "epoch": 4576} {"train_loss": -26.396230697631836, "global_step": 379821, "epoch": 4576} {"train_loss": -26.244693756103516, "global_step": 379822, "epoch": 4576} {"train_loss": -26.15342140197754, "global_step": 379823, "epoch": 4576} {"train_loss": -26.3588924407959, "global_step": 379824, "epoch": 4576} {"train_loss": -26.387365341186523, "global_step": 379825, "epoch": 4576} {"train_loss": -26.7675724029541, "global_step": 379826, "epoch": 4576} {"train_loss": -26.170804977416992, "global_step": 379827, "epoch": 4576} {"train_loss": -26.44183921813965, "global_step": 379828, "epoch": 4576} {"train_loss": -26.415693283081055, "global_step": 379829, "epoch": 4576} {"train_loss": -26.287378311157227, "global_step": 379830, "epoch": 4576} {"train_loss": -26.293781280517578, "global_step": 379831, "epoch": 4576} {"train_loss": -26.452478408813477, "global_step": 379832, "epoch": 4576} {"train_loss": -26.335205078125, "global_step": 379833, "epoch": 4576} {"train_loss": -26.92876625061035, "global_step": 379834, "epoch": 4576} {"train_loss": -26.356088638305664, "global_step": 379835, "epoch": 4576} {"train_loss": -26.25995445251465, "global_step": 379836, "epoch": 4576} {"train_loss": -26.66593360900879, "global_step": 379837, "epoch": 4576} {"train_loss": -26.505008697509766, "global_step": 379838, "epoch": 4576} {"train_loss": -26.824604034423828, "global_step": 379839, "epoch": 4576} {"train_loss": -26.406238555908203, "global_step": 379840, "epoch": 4576} {"train_loss": -26.667530059814453, "global_step": 379841, "epoch": 4576} {"train_loss": -26.485919952392578, "global_step": 379842, "epoch": 4576} {"train_loss": -26.35177993774414, "global_step": 379843, "epoch": 4576} {"train_loss": -26.567890167236328, "global_step": 379844, "epoch": 4576} {"train_loss": -27.029584884643555, "global_step": 379845, "epoch": 4576} {"train_loss": -26.345849990844727, "global_step": 379846, "epoch": 4576} {"train_loss": -26.403059005737305, "global_step": 379847, "epoch": 4576} {"train_loss": -26.432544708251953, "global_step": 379848, "epoch": 4576} {"train_loss": -26.6070556640625, "global_step": 379849, "epoch": 4576} {"train_loss": -26.764148712158203, "global_step": 379850, "epoch": 4576} {"train_loss": -26.466053009033203, "global_step": 379851, "epoch": 4576} {"train_loss": -26.618499755859375, "global_step": 379852, "epoch": 4576} {"train_loss": -26.660694122314453, "global_step": 379853, "epoch": 4576} {"train_loss": -26.37434959411621, "global_step": 379854, "epoch": 4576} {"train_loss": -26.686920166015625, "global_step": 379855, "epoch": 4576} {"train_loss": -26.55805015563965, "global_step": 379856, "epoch": 4576} {"train_loss": -26.52191734313965, "global_step": 379857, "epoch": 4576} {"train_loss": -26.13348388671875, "global_step": 379858, "epoch": 4576} {"train_loss": -26.027429580688477, "global_step": 379859, "epoch": 4576} {"train_loss": -25.913206100463867, "global_step": 379860, "epoch": 4576} {"train_loss": -26.5963077545166, "global_step": 379861, "epoch": 4576} {"train_loss": -26.691177368164062, "global_step": 379862, "epoch": 4576} {"train_loss": -26.537195205688477, "global_step": 379863, "epoch": 4576} {"train_loss": -26.414276123046875, "global_step": 379864, "epoch": 4576} {"train_loss": -26.498876571655273, "global_step": 379865, "epoch": 4576} {"train_loss": -26.445180892944336, "global_step": 379866, "epoch": 4576} {"train_loss": -26.686010360717773, "global_step": 379867, "epoch": 4576} {"train_loss": -26.709766387939453, "global_step": 379868, "epoch": 4576} {"train_loss": -26.624042510986328, "global_step": 379869, "epoch": 4576} {"train_loss": -26.627416610717773, "global_step": 379870, "epoch": 4576} {"train_loss": -26.809051513671875, "global_step": 379871, "epoch": 4576} {"train_loss": -26.633310317993164, "global_step": 379872, "epoch": 4576} {"train_loss": -26.670682907104492, "global_step": 379873, "epoch": 4576} {"train_loss": -26.698720932006836, "global_step": 379874, "epoch": 4576} {"train_loss": -26.686954498291016, "global_step": 379875, "epoch": 4576} {"train_loss": -26.573102951049805, "global_step": 379876, "epoch": 4576} {"train_loss": -26.57587242126465, "global_step": 379877, "epoch": 4576} {"train_loss": -26.388248443603516, "global_step": 379878, "epoch": 4576} {"train_loss": -26.7213077545166, "global_step": 379879, "epoch": 4576} {"train_loss": -26.338794708251953, "global_step": 379880, "epoch": 4576} {"train_loss": -25.313800811767578, "global_step": 379881, "epoch": 4576} {"train_loss": -25.23482894897461, "global_step": 379882, "epoch": 4576} {"train_loss": -25.494897842407227, "global_step": 379883, "epoch": 4576} {"train_loss": -25.60495948791504, "global_step": 379884, "epoch": 4576} {"train_loss": -26.315771102905273, "global_step": 379885, "epoch": 4576} {"train_loss": -25.70701026916504, "global_step": 379886, "epoch": 4576} {"train_loss": -25.745773315429688, "global_step": 379887, "epoch": 4576} {"train_loss": -26.045751571655273, "global_step": 379888, "epoch": 4576} {"train_loss": -26.498809814453125, "global_step": 379889, "epoch": 4576} {"train_loss": -26.362628017563416, "global_step": 379890, "epoch": 4576, "val_loss": 6693734.0} {"train_loss": -25.628387451171875, "global_step": 379891, "epoch": 4577} {"train_loss": -25.533475875854492, "global_step": 379892, "epoch": 4577} {"train_loss": -25.853723526000977, "global_step": 379893, "epoch": 4577} {"train_loss": -25.29969596862793, "global_step": 379894, "epoch": 4577} {"train_loss": -25.87171745300293, "global_step": 379895, "epoch": 4577} {"train_loss": -25.888904571533203, "global_step": 379896, "epoch": 4577} {"train_loss": -26.261938095092773, "global_step": 379897, "epoch": 4577} {"train_loss": -26.1551570892334, "global_step": 379898, "epoch": 4577} {"train_loss": -26.26923179626465, "global_step": 379899, "epoch": 4577} {"train_loss": -25.68659019470215, "global_step": 379900, "epoch": 4577} {"train_loss": -25.868335723876953, "global_step": 379901, "epoch": 4577} {"train_loss": -26.27671241760254, "global_step": 379902, "epoch": 4577} {"train_loss": -25.86737060546875, "global_step": 379903, "epoch": 4577} {"train_loss": -26.07355308532715, "global_step": 379904, "epoch": 4577} {"train_loss": -26.202289581298828, "global_step": 379905, "epoch": 4577} {"train_loss": -26.27241325378418, "global_step": 379906, "epoch": 4577} {"train_loss": -26.185302734375, "global_step": 379907, "epoch": 4577} {"train_loss": -26.28597068786621, "global_step": 379908, "epoch": 4577} {"train_loss": -26.2141170501709, "global_step": 379909, "epoch": 4577} {"train_loss": -25.978464126586914, "global_step": 379910, "epoch": 4577} {"train_loss": -26.571104049682617, "global_step": 379911, "epoch": 4577} {"train_loss": -26.2628231048584, "global_step": 379912, "epoch": 4577} {"train_loss": -26.415143966674805, "global_step": 379913, "epoch": 4577} {"train_loss": -26.349775314331055, "global_step": 379914, "epoch": 4577} {"train_loss": -26.654638290405273, "global_step": 379915, "epoch": 4577} {"train_loss": -26.343536376953125, "global_step": 379916, "epoch": 4577} {"train_loss": -26.220495223999023, "global_step": 379917, "epoch": 4577} {"train_loss": -26.504255294799805, "global_step": 379918, "epoch": 4577} {"train_loss": -26.286575317382812, "global_step": 379919, "epoch": 4577} {"train_loss": -26.305112838745117, "global_step": 379920, "epoch": 4577} {"train_loss": -26.885074615478516, "global_step": 379921, "epoch": 4577} {"train_loss": -26.422393798828125, "global_step": 379922, "epoch": 4577} {"train_loss": -26.08308982849121, "global_step": 379923, "epoch": 4577} {"train_loss": -26.41098976135254, "global_step": 379924, "epoch": 4577} {"train_loss": -26.22797966003418, "global_step": 379925, "epoch": 4577} {"train_loss": -26.971729278564453, "global_step": 379926, "epoch": 4577} {"train_loss": -26.93195152282715, "global_step": 379927, "epoch": 4577} {"train_loss": -26.284534454345703, "global_step": 379928, "epoch": 4577} {"train_loss": -26.3055477142334, "global_step": 379929, "epoch": 4577} {"train_loss": -26.649982452392578, "global_step": 379930, "epoch": 4577} {"train_loss": -26.521427154541016, "global_step": 379931, "epoch": 4577} {"train_loss": -26.578107833862305, "global_step": 379932, "epoch": 4577} {"train_loss": -26.762130737304688, "global_step": 379933, "epoch": 4577} {"train_loss": -26.66046714782715, "global_step": 379934, "epoch": 4577} {"train_loss": -26.3431396484375, "global_step": 379935, "epoch": 4577} {"train_loss": -26.841245651245117, "global_step": 379936, "epoch": 4577} {"train_loss": -26.599332809448242, "global_step": 379937, "epoch": 4577} {"train_loss": -26.498945236206055, "global_step": 379938, "epoch": 4577} {"train_loss": -26.646757125854492, "global_step": 379939, "epoch": 4577} {"train_loss": -26.9859676361084, "global_step": 379940, "epoch": 4577} {"train_loss": -26.45442008972168, "global_step": 379941, "epoch": 4577} {"train_loss": -26.62471580505371, "global_step": 379942, "epoch": 4577} {"train_loss": -26.538013458251953, "global_step": 379943, "epoch": 4577} {"train_loss": -26.540496826171875, "global_step": 379944, "epoch": 4577} {"train_loss": -26.5439510345459, "global_step": 379945, "epoch": 4577} {"train_loss": -26.284317016601562, "global_step": 379946, "epoch": 4577} {"train_loss": -26.67994499206543, "global_step": 379947, "epoch": 4577} {"train_loss": -26.420013427734375, "global_step": 379948, "epoch": 4577} {"train_loss": -26.4334716796875, "global_step": 379949, "epoch": 4577} {"train_loss": -26.295398712158203, "global_step": 379950, "epoch": 4577} {"train_loss": -26.385883331298828, "global_step": 379951, "epoch": 4577} {"train_loss": -26.52615737915039, "global_step": 379952, "epoch": 4577} {"train_loss": -26.24366569519043, "global_step": 379953, "epoch": 4577} {"train_loss": -26.14545249938965, "global_step": 379954, "epoch": 4577} {"train_loss": -26.744842529296875, "global_step": 379955, "epoch": 4577} {"train_loss": -26.349308013916016, "global_step": 379956, "epoch": 4577} {"train_loss": -26.08198356628418, "global_step": 379957, "epoch": 4577} {"train_loss": -26.235437393188477, "global_step": 379958, "epoch": 4577} {"train_loss": -26.78065299987793, "global_step": 379959, "epoch": 4577} {"train_loss": -27.003875732421875, "global_step": 379960, "epoch": 4577} {"train_loss": -26.0288028717041, "global_step": 379961, "epoch": 4577} {"train_loss": -26.110376358032227, "global_step": 379962, "epoch": 4577} {"train_loss": -25.912921905517578, "global_step": 379963, "epoch": 4577} {"train_loss": -26.067358016967773, "global_step": 379964, "epoch": 4577} {"train_loss": -26.412857055664062, "global_step": 379965, "epoch": 4577} {"train_loss": -26.075475692749023, "global_step": 379966, "epoch": 4577} {"train_loss": -26.628881454467773, "global_step": 379967, "epoch": 4577} {"train_loss": -26.259368896484375, "global_step": 379968, "epoch": 4577} {"train_loss": -26.220224380493164, "global_step": 379969, "epoch": 4577} {"train_loss": -26.502721786499023, "global_step": 379970, "epoch": 4577} {"train_loss": -26.1509952545166, "global_step": 379971, "epoch": 4577} {"train_loss": -26.319660186767578, "global_step": 379972, "epoch": 4577} {"train_loss": -26.33958104145096, "global_step": 379973, "epoch": 4577, "val_loss": 6566266.0} {"train_loss": -26.012571334838867, "global_step": 379974, "epoch": 4578} {"train_loss": -25.969877243041992, "global_step": 379975, "epoch": 4578} {"train_loss": -26.02972984313965, "global_step": 379976, "epoch": 4578} {"train_loss": -25.733306884765625, "global_step": 379977, "epoch": 4578} {"train_loss": -25.843658447265625, "global_step": 379978, "epoch": 4578} {"train_loss": -25.957412719726562, "global_step": 379979, "epoch": 4578} {"train_loss": -26.36311912536621, "global_step": 379980, "epoch": 4578} {"train_loss": -25.818998336791992, "global_step": 379981, "epoch": 4578} {"train_loss": -26.184492111206055, "global_step": 379982, "epoch": 4578} {"train_loss": -25.9559383392334, "global_step": 379983, "epoch": 4578} {"train_loss": -26.5726375579834, "global_step": 379984, "epoch": 4578} {"train_loss": -26.084558486938477, "global_step": 379985, "epoch": 4578} {"train_loss": -26.100772857666016, "global_step": 379986, "epoch": 4578} {"train_loss": -26.09453773498535, "global_step": 379987, "epoch": 4578} {"train_loss": -26.42037010192871, "global_step": 379988, "epoch": 4578} {"train_loss": -26.0106258392334, "global_step": 379989, "epoch": 4578} {"train_loss": -26.181928634643555, "global_step": 379990, "epoch": 4578} {"train_loss": -26.273584365844727, "global_step": 379991, "epoch": 4578} {"train_loss": -26.224775314331055, "global_step": 379992, "epoch": 4578} {"train_loss": -26.389806747436523, "global_step": 379993, "epoch": 4578} {"train_loss": -26.34527015686035, "global_step": 379994, "epoch": 4578} {"train_loss": -26.435022354125977, "global_step": 379995, "epoch": 4578} {"train_loss": -26.77577018737793, "global_step": 379996, "epoch": 4578} {"train_loss": -26.373926162719727, "global_step": 379997, "epoch": 4578} {"train_loss": -26.449512481689453, "global_step": 379998, "epoch": 4578} {"train_loss": -26.448835372924805, "global_step": 379999, "epoch": 4578} {"train_loss": -26.205183029174805, "global_step": 380000, "epoch": 4578} {"train_loss": -26.595422744750977, "global_step": 380001, "epoch": 4578} {"train_loss": -26.26010513305664, "global_step": 380002, "epoch": 4578} {"train_loss": -26.127607345581055, "global_step": 380003, "epoch": 4578} {"train_loss": -26.447498321533203, "global_step": 380004, "epoch": 4578} {"train_loss": -26.979263305664062, "global_step": 380005, "epoch": 4578} {"train_loss": -26.7542781829834, "global_step": 380006, "epoch": 4578} {"train_loss": -26.395038604736328, "global_step": 380007, "epoch": 4578} {"train_loss": -26.484411239624023, "global_step": 380008, "epoch": 4578} {"train_loss": -26.649566650390625, "global_step": 380009, "epoch": 4578} {"train_loss": -26.420654296875, "global_step": 380010, "epoch": 4578} {"train_loss": -26.617429733276367, "global_step": 380011, "epoch": 4578} {"train_loss": -26.610870361328125, "global_step": 380012, "epoch": 4578} {"train_loss": -26.4915828704834, "global_step": 380013, "epoch": 4578} {"train_loss": -26.8321475982666, "global_step": 380014, "epoch": 4578} {"train_loss": -26.849634170532227, "global_step": 380015, "epoch": 4578} {"train_loss": -26.420270919799805, "global_step": 380016, "epoch": 4578} {"train_loss": -26.80160903930664, "global_step": 380017, "epoch": 4578} {"train_loss": -26.618085861206055, "global_step": 380018, "epoch": 4578} {"train_loss": -26.482919692993164, "global_step": 380019, "epoch": 4578} {"train_loss": -26.431177139282227, "global_step": 380020, "epoch": 4578} {"train_loss": -26.633649826049805, "global_step": 380021, "epoch": 4578} {"train_loss": -26.09493064880371, "global_step": 380022, "epoch": 4578} {"train_loss": -26.563724517822266, "global_step": 380023, "epoch": 4578} {"train_loss": -26.710424423217773, "global_step": 380024, "epoch": 4578} {"train_loss": -26.869497299194336, "global_step": 380025, "epoch": 4578} {"train_loss": -26.4725284576416, "global_step": 380026, "epoch": 4578} {"train_loss": -26.25349235534668, "global_step": 380027, "epoch": 4578} {"train_loss": -26.309141159057617, "global_step": 380028, "epoch": 4578} {"train_loss": -26.3271427154541, "global_step": 380029, "epoch": 4578} {"train_loss": -26.40262222290039, "global_step": 380030, "epoch": 4578} {"train_loss": -26.388574600219727, "global_step": 380031, "epoch": 4578} {"train_loss": -26.60784912109375, "global_step": 380032, "epoch": 4578} {"train_loss": -26.376968383789062, "global_step": 380033, "epoch": 4578} {"train_loss": -26.224414825439453, "global_step": 380034, "epoch": 4578} {"train_loss": -26.353757858276367, "global_step": 380035, "epoch": 4578} {"train_loss": -26.236099243164062, "global_step": 380036, "epoch": 4578} {"train_loss": -26.525304794311523, "global_step": 380037, "epoch": 4578} {"train_loss": -26.443395614624023, "global_step": 380038, "epoch": 4578} {"train_loss": -26.6054630279541, "global_step": 380039, "epoch": 4578} {"train_loss": -26.481637954711914, "global_step": 380040, "epoch": 4578} {"train_loss": -26.46821403503418, "global_step": 380041, "epoch": 4578} {"train_loss": -26.572416305541992, "global_step": 380042, "epoch": 4578} {"train_loss": -26.765228271484375, "global_step": 380043, "epoch": 4578} {"train_loss": -26.65448570251465, "global_step": 380044, "epoch": 4578} {"train_loss": -26.516698837280273, "global_step": 380045, "epoch": 4578} {"train_loss": -26.249134063720703, "global_step": 380046, "epoch": 4578} {"train_loss": -26.623571395874023, "global_step": 380047, "epoch": 4578} {"train_loss": -26.513757705688477, "global_step": 380048, "epoch": 4578} {"train_loss": -26.88373374938965, "global_step": 380049, "epoch": 4578} {"train_loss": -26.653091430664062, "global_step": 380050, "epoch": 4578} {"train_loss": -27.111419677734375, "global_step": 380051, "epoch": 4578} {"train_loss": -26.52178955078125, "global_step": 380052, "epoch": 4578} {"train_loss": -26.718820571899414, "global_step": 380053, "epoch": 4578} {"train_loss": -26.43497657775879, "global_step": 380054, "epoch": 4578} {"train_loss": -26.465621948242188, "global_step": 380055, "epoch": 4578} {"train_loss": -26.43769707737199, "global_step": 380056, "epoch": 4578, "val_loss": 6564667.5} {"train_loss": -25.9466495513916, "global_step": 380057, "epoch": 4579} {"train_loss": -26.09514808654785, "global_step": 380058, "epoch": 4579} {"train_loss": -26.710824966430664, "global_step": 380059, "epoch": 4579} {"train_loss": -26.171630859375, "global_step": 380060, "epoch": 4579} {"train_loss": -25.963748931884766, "global_step": 380061, "epoch": 4579} {"train_loss": -26.10345458984375, "global_step": 380062, "epoch": 4579} {"train_loss": -26.474149703979492, "global_step": 380063, "epoch": 4579} {"train_loss": -26.412662506103516, "global_step": 380064, "epoch": 4579} {"train_loss": -26.115835189819336, "global_step": 380065, "epoch": 4579} {"train_loss": -26.1549015045166, "global_step": 380066, "epoch": 4579} {"train_loss": -26.92683219909668, "global_step": 380067, "epoch": 4579} {"train_loss": -25.85433006286621, "global_step": 380068, "epoch": 4579} {"train_loss": -25.718534469604492, "global_step": 380069, "epoch": 4579} {"train_loss": -25.69598960876465, "global_step": 380070, "epoch": 4579} {"train_loss": -25.65152359008789, "global_step": 380071, "epoch": 4579} {"train_loss": -26.33516502380371, "global_step": 380072, "epoch": 4579} {"train_loss": -26.385629653930664, "global_step": 380073, "epoch": 4579} {"train_loss": -26.519397735595703, "global_step": 380074, "epoch": 4579} {"train_loss": -25.9932918548584, "global_step": 380075, "epoch": 4579} {"train_loss": -26.068714141845703, "global_step": 380076, "epoch": 4579} {"train_loss": -26.10930824279785, "global_step": 380077, "epoch": 4579} {"train_loss": -26.22757339477539, "global_step": 380078, "epoch": 4579} {"train_loss": -26.381988525390625, "global_step": 380079, "epoch": 4579} {"train_loss": -26.233600616455078, "global_step": 380080, "epoch": 4579} {"train_loss": -25.877796173095703, "global_step": 380081, "epoch": 4579} {"train_loss": -26.168609619140625, "global_step": 380082, "epoch": 4579} {"train_loss": -26.419727325439453, "global_step": 380083, "epoch": 4579} {"train_loss": -26.183801651000977, "global_step": 380084, "epoch": 4579} {"train_loss": -25.923147201538086, "global_step": 380085, "epoch": 4579} {"train_loss": -26.343311309814453, "global_step": 380086, "epoch": 4579} {"train_loss": -26.677066802978516, "global_step": 380087, "epoch": 4579} {"train_loss": -26.1268310546875, "global_step": 380088, "epoch": 4579} {"train_loss": -26.343210220336914, "global_step": 380089, "epoch": 4579} {"train_loss": -26.37678337097168, "global_step": 380090, "epoch": 4579} {"train_loss": -26.56900978088379, "global_step": 380091, "epoch": 4579} {"train_loss": -26.448205947875977, "global_step": 380092, "epoch": 4579} {"train_loss": -26.190393447875977, "global_step": 380093, "epoch": 4579} {"train_loss": -26.554889678955078, "global_step": 380094, "epoch": 4579} {"train_loss": -26.303586959838867, "global_step": 380095, "epoch": 4579} {"train_loss": -26.516067504882812, "global_step": 380096, "epoch": 4579} {"train_loss": -26.33892250061035, "global_step": 380097, "epoch": 4579} {"train_loss": -26.532501220703125, "global_step": 380098, "epoch": 4579} {"train_loss": -26.165063858032227, "global_step": 380099, "epoch": 4579} {"train_loss": -26.565061569213867, "global_step": 380100, "epoch": 4579} {"train_loss": -26.622039794921875, "global_step": 380101, "epoch": 4579} {"train_loss": -26.4596004486084, "global_step": 380102, "epoch": 4579} {"train_loss": -26.832258224487305, "global_step": 380103, "epoch": 4579} {"train_loss": -26.444929122924805, "global_step": 380104, "epoch": 4579} {"train_loss": -26.645923614501953, "global_step": 380105, "epoch": 4579} {"train_loss": -26.563695907592773, "global_step": 380106, "epoch": 4579} {"train_loss": -26.724393844604492, "global_step": 380107, "epoch": 4579} {"train_loss": -26.450180053710938, "global_step": 380108, "epoch": 4579} {"train_loss": -26.890771865844727, "global_step": 380109, "epoch": 4579} {"train_loss": -26.595773696899414, "global_step": 380110, "epoch": 4579} {"train_loss": -26.692005157470703, "global_step": 380111, "epoch": 4579} {"train_loss": -26.670093536376953, "global_step": 380112, "epoch": 4579} {"train_loss": -26.608488082885742, "global_step": 380113, "epoch": 4579} {"train_loss": -26.696714401245117, "global_step": 380114, "epoch": 4579} {"train_loss": -26.823740005493164, "global_step": 380115, "epoch": 4579} {"train_loss": -26.617572784423828, "global_step": 380116, "epoch": 4579} {"train_loss": -26.645572662353516, "global_step": 380117, "epoch": 4579} {"train_loss": -26.757917404174805, "global_step": 380118, "epoch": 4579} {"train_loss": -26.869293212890625, "global_step": 380119, "epoch": 4579} {"train_loss": -26.857330322265625, "global_step": 380120, "epoch": 4579} {"train_loss": -26.513830184936523, "global_step": 380121, "epoch": 4579} {"train_loss": -26.56398582458496, "global_step": 380122, "epoch": 4579} {"train_loss": -26.032590866088867, "global_step": 380123, "epoch": 4579} {"train_loss": -26.479522705078125, "global_step": 380124, "epoch": 4579} {"train_loss": -25.7589168548584, "global_step": 380125, "epoch": 4579} {"train_loss": -25.492721557617188, "global_step": 380126, "epoch": 4579} {"train_loss": -25.19513702392578, "global_step": 380127, "epoch": 4579} {"train_loss": -25.72181510925293, "global_step": 380128, "epoch": 4579} {"train_loss": -25.715564727783203, "global_step": 380129, "epoch": 4579} {"train_loss": -26.44231605529785, "global_step": 380130, "epoch": 4579} {"train_loss": -26.155353546142578, "global_step": 380131, "epoch": 4579} {"train_loss": -25.3289852142334, "global_step": 380132, "epoch": 4579} {"train_loss": -26.030054092407227, "global_step": 380133, "epoch": 4579} {"train_loss": -26.253910064697266, "global_step": 380134, "epoch": 4579} {"train_loss": -26.19125747680664, "global_step": 380135, "epoch": 4579} {"train_loss": -26.0856990814209, "global_step": 380136, "epoch": 4579} {"train_loss": -25.94398307800293, "global_step": 380137, "epoch": 4579} {"train_loss": -26.708526611328125, "global_step": 380138, "epoch": 4579} {"train_loss": -26.302704845566346, "global_step": 380139, "epoch": 4579, "val_loss": 6498663.0} {"train_loss": -25.588041305541992, "global_step": 380140, "epoch": 4580} {"train_loss": -26.106847763061523, "global_step": 380141, "epoch": 4580} {"train_loss": -25.511962890625, "global_step": 380142, "epoch": 4580} {"train_loss": -25.500125885009766, "global_step": 380143, "epoch": 4580} {"train_loss": -25.13157081604004, "global_step": 380144, "epoch": 4580} {"train_loss": -26.18121910095215, "global_step": 380145, "epoch": 4580} {"train_loss": -25.610427856445312, "global_step": 380146, "epoch": 4580} {"train_loss": -25.858251571655273, "global_step": 380147, "epoch": 4580} {"train_loss": -25.528146743774414, "global_step": 380148, "epoch": 4580} {"train_loss": -25.92325210571289, "global_step": 380149, "epoch": 4580} {"train_loss": -25.479562759399414, "global_step": 380150, "epoch": 4580} {"train_loss": -25.335153579711914, "global_step": 380151, "epoch": 4580} {"train_loss": -25.58809471130371, "global_step": 380152, "epoch": 4580} {"train_loss": -25.314680099487305, "global_step": 380153, "epoch": 4580} {"train_loss": -25.600095748901367, "global_step": 380154, "epoch": 4580} {"train_loss": -25.963581085205078, "global_step": 380155, "epoch": 4580} {"train_loss": -25.96746253967285, "global_step": 380156, "epoch": 4580} {"train_loss": -26.220006942749023, "global_step": 380157, "epoch": 4580} {"train_loss": -25.804061889648438, "global_step": 380158, "epoch": 4580} {"train_loss": -26.384159088134766, "global_step": 380159, "epoch": 4580} {"train_loss": -26.35959815979004, "global_step": 380160, "epoch": 4580} {"train_loss": -26.422718048095703, "global_step": 380161, "epoch": 4580} {"train_loss": -26.410797119140625, "global_step": 380162, "epoch": 4580} {"train_loss": -26.63062858581543, "global_step": 380163, "epoch": 4580} {"train_loss": -25.92600440979004, "global_step": 380164, "epoch": 4580} {"train_loss": -26.207386016845703, "global_step": 380165, "epoch": 4580} {"train_loss": -26.154376983642578, "global_step": 380166, "epoch": 4580} {"train_loss": -26.350906372070312, "global_step": 380167, "epoch": 4580} {"train_loss": -26.38031005859375, "global_step": 380168, "epoch": 4580} {"train_loss": -26.75833511352539, "global_step": 380169, "epoch": 4580} {"train_loss": -26.7174072265625, "global_step": 380170, "epoch": 4580} {"train_loss": -26.59824562072754, "global_step": 380171, "epoch": 4580} {"train_loss": -26.73212242126465, "global_step": 380172, "epoch": 4580} {"train_loss": -26.530466079711914, "global_step": 380173, "epoch": 4580} {"train_loss": -26.1638240814209, "global_step": 380174, "epoch": 4580} {"train_loss": -26.600906372070312, "global_step": 380175, "epoch": 4580} {"train_loss": -26.781085968017578, "global_step": 380176, "epoch": 4580} {"train_loss": -26.349740982055664, "global_step": 380177, "epoch": 4580} {"train_loss": -26.36236000061035, "global_step": 380178, "epoch": 4580} {"train_loss": -26.85687828063965, "global_step": 380179, "epoch": 4580} {"train_loss": -26.712753295898438, "global_step": 380180, "epoch": 4580} {"train_loss": -26.736419677734375, "global_step": 380181, "epoch": 4580} {"train_loss": -26.763885498046875, "global_step": 380182, "epoch": 4580} {"train_loss": -26.518930435180664, "global_step": 380183, "epoch": 4580} {"train_loss": -26.702497482299805, "global_step": 380184, "epoch": 4580} {"train_loss": -26.447376251220703, "global_step": 380185, "epoch": 4580} {"train_loss": -26.838224411010742, "global_step": 380186, "epoch": 4580} {"train_loss": -26.59476661682129, "global_step": 380187, "epoch": 4580} {"train_loss": -26.667943954467773, "global_step": 380188, "epoch": 4580} {"train_loss": -26.775293350219727, "global_step": 380189, "epoch": 4580} {"train_loss": -26.609888076782227, "global_step": 380190, "epoch": 4580} {"train_loss": -26.198261260986328, "global_step": 380191, "epoch": 4580} {"train_loss": -26.658288955688477, "global_step": 380192, "epoch": 4580} {"train_loss": -26.913808822631836, "global_step": 380193, "epoch": 4580} {"train_loss": -26.54511833190918, "global_step": 380194, "epoch": 4580} {"train_loss": -26.449813842773438, "global_step": 380195, "epoch": 4580} {"train_loss": -26.441986083984375, "global_step": 380196, "epoch": 4580} {"train_loss": -26.583852767944336, "global_step": 380197, "epoch": 4580} {"train_loss": -26.7418212890625, "global_step": 380198, "epoch": 4580} {"train_loss": -26.62871742248535, "global_step": 380199, "epoch": 4580} {"train_loss": -26.47247314453125, "global_step": 380200, "epoch": 4580} {"train_loss": -26.1535587310791, "global_step": 380201, "epoch": 4580} {"train_loss": -26.083993911743164, "global_step": 380202, "epoch": 4580} {"train_loss": -26.552072525024414, "global_step": 380203, "epoch": 4580} {"train_loss": -26.644367218017578, "global_step": 380204, "epoch": 4580} {"train_loss": -26.53898048400879, "global_step": 380205, "epoch": 4580} {"train_loss": -26.454694747924805, "global_step": 380206, "epoch": 4580} {"train_loss": -26.42462158203125, "global_step": 380207, "epoch": 4580} {"train_loss": -26.473047256469727, "global_step": 380208, "epoch": 4580} {"train_loss": -26.428319931030273, "global_step": 380209, "epoch": 4580} {"train_loss": -26.745771408081055, "global_step": 380210, "epoch": 4580} {"train_loss": -26.549219131469727, "global_step": 380211, "epoch": 4580} {"train_loss": -26.324743270874023, "global_step": 380212, "epoch": 4580} {"train_loss": -26.411895751953125, "global_step": 380213, "epoch": 4580} {"train_loss": -26.6450252532959, "global_step": 380214, "epoch": 4580} {"train_loss": -26.654199600219727, "global_step": 380215, "epoch": 4580} {"train_loss": -26.517337799072266, "global_step": 380216, "epoch": 4580} {"train_loss": -26.232038497924805, "global_step": 380217, "epoch": 4580} {"train_loss": -26.81007194519043, "global_step": 380218, "epoch": 4580} {"train_loss": -26.185998916625977, "global_step": 380219, "epoch": 4580} {"train_loss": -26.636417388916016, "global_step": 380220, "epoch": 4580} {"train_loss": -26.555652618408203, "global_step": 380221, "epoch": 4580} {"train_loss": -26.33665284765772, "global_step": 380222, "epoch": 4580, "val_loss": 6662797.0} {"train_loss": -26.139923095703125, "global_step": 380223, "epoch": 4581} {"train_loss": -26.099884033203125, "global_step": 380224, "epoch": 4581} {"train_loss": -26.16986083984375, "global_step": 380225, "epoch": 4581} {"train_loss": -26.377233505249023, "global_step": 380226, "epoch": 4581} {"train_loss": -26.206640243530273, "global_step": 380227, "epoch": 4581} {"train_loss": -26.39358901977539, "global_step": 380228, "epoch": 4581} {"train_loss": -26.152387619018555, "global_step": 380229, "epoch": 4581} {"train_loss": -26.48060417175293, "global_step": 380230, "epoch": 4581} {"train_loss": -25.99769401550293, "global_step": 380231, "epoch": 4581} {"train_loss": -26.331268310546875, "global_step": 380232, "epoch": 4581} {"train_loss": -26.215620040893555, "global_step": 380233, "epoch": 4581} {"train_loss": -26.059188842773438, "global_step": 380234, "epoch": 4581} {"train_loss": -26.032690048217773, "global_step": 380235, "epoch": 4581} {"train_loss": -25.97724723815918, "global_step": 380236, "epoch": 4581} {"train_loss": -26.281402587890625, "global_step": 380237, "epoch": 4581} {"train_loss": -26.30059242248535, "global_step": 380238, "epoch": 4581} {"train_loss": -26.140085220336914, "global_step": 380239, "epoch": 4581} {"train_loss": -26.497955322265625, "global_step": 380240, "epoch": 4581} {"train_loss": -26.25733757019043, "global_step": 380241, "epoch": 4581} {"train_loss": -26.63559913635254, "global_step": 380242, "epoch": 4581} {"train_loss": -26.37455177307129, "global_step": 380243, "epoch": 4581} {"train_loss": -25.80503273010254, "global_step": 380244, "epoch": 4581} {"train_loss": -26.2541561126709, "global_step": 380245, "epoch": 4581} {"train_loss": -26.282690048217773, "global_step": 380246, "epoch": 4581} {"train_loss": -26.451526641845703, "global_step": 380247, "epoch": 4581} {"train_loss": -26.211822509765625, "global_step": 380248, "epoch": 4581} {"train_loss": -26.156753540039062, "global_step": 380249, "epoch": 4581} {"train_loss": -26.242237091064453, "global_step": 380250, "epoch": 4581} {"train_loss": -26.275907516479492, "global_step": 380251, "epoch": 4581} {"train_loss": -26.341629028320312, "global_step": 380252, "epoch": 4581} {"train_loss": -26.435720443725586, "global_step": 380253, "epoch": 4581} {"train_loss": -26.148462295532227, "global_step": 380254, "epoch": 4581} {"train_loss": -26.284021377563477, "global_step": 380255, "epoch": 4581} {"train_loss": -26.788782119750977, "global_step": 380256, "epoch": 4581} {"train_loss": -26.23349380493164, "global_step": 380257, "epoch": 4581} {"train_loss": -26.749313354492188, "global_step": 380258, "epoch": 4581} {"train_loss": -26.385908126831055, "global_step": 380259, "epoch": 4581} {"train_loss": -26.62527847290039, "global_step": 380260, "epoch": 4581} {"train_loss": -26.202863693237305, "global_step": 380261, "epoch": 4581} {"train_loss": -26.559118270874023, "global_step": 380262, "epoch": 4581} {"train_loss": -26.394453048706055, "global_step": 380263, "epoch": 4581} {"train_loss": -26.334604263305664, "global_step": 380264, "epoch": 4581} {"train_loss": -26.555530548095703, "global_step": 380265, "epoch": 4581} {"train_loss": -26.942035675048828, "global_step": 380266, "epoch": 4581} {"train_loss": -26.565122604370117, "global_step": 380267, "epoch": 4581} {"train_loss": -26.26490592956543, "global_step": 380268, "epoch": 4581} {"train_loss": -26.622060775756836, "global_step": 380269, "epoch": 4581} {"train_loss": -26.595966339111328, "global_step": 380270, "epoch": 4581} {"train_loss": -26.24176597595215, "global_step": 380271, "epoch": 4581} {"train_loss": -26.813323974609375, "global_step": 380272, "epoch": 4581} {"train_loss": -26.870594024658203, "global_step": 380273, "epoch": 4581} {"train_loss": -26.5457820892334, "global_step": 380274, "epoch": 4581} {"train_loss": -26.91680908203125, "global_step": 380275, "epoch": 4581} {"train_loss": -26.500701904296875, "global_step": 380276, "epoch": 4581} {"train_loss": -26.69886589050293, "global_step": 380277, "epoch": 4581} {"train_loss": -26.906469345092773, "global_step": 380278, "epoch": 4581} {"train_loss": -26.65570068359375, "global_step": 380279, "epoch": 4581} {"train_loss": -26.25765037536621, "global_step": 380280, "epoch": 4581} {"train_loss": -26.484460830688477, "global_step": 380281, "epoch": 4581} {"train_loss": -26.394922256469727, "global_step": 380282, "epoch": 4581} {"train_loss": -26.707178115844727, "global_step": 380283, "epoch": 4581} {"train_loss": -26.994840621948242, "global_step": 380284, "epoch": 4581} {"train_loss": -26.543874740600586, "global_step": 380285, "epoch": 4581} {"train_loss": -26.087329864501953, "global_step": 380286, "epoch": 4581} {"train_loss": -26.413217544555664, "global_step": 380287, "epoch": 4581} {"train_loss": -26.609634399414062, "global_step": 380288, "epoch": 4581} {"train_loss": -26.991901397705078, "global_step": 380289, "epoch": 4581} {"train_loss": -26.6931209564209, "global_step": 380290, "epoch": 4581} {"train_loss": -26.643970489501953, "global_step": 380291, "epoch": 4581} {"train_loss": -26.64307975769043, "global_step": 380292, "epoch": 4581} {"train_loss": -26.492284774780273, "global_step": 380293, "epoch": 4581} {"train_loss": -26.701007843017578, "global_step": 380294, "epoch": 4581} {"train_loss": -26.4654598236084, "global_step": 380295, "epoch": 4581} {"train_loss": -26.580677032470703, "global_step": 380296, "epoch": 4581} {"train_loss": -26.230911254882812, "global_step": 380297, "epoch": 4581} {"train_loss": -26.267621994018555, "global_step": 380298, "epoch": 4581} {"train_loss": -26.15949821472168, "global_step": 380299, "epoch": 4581} {"train_loss": -27.0670166015625, "global_step": 380300, "epoch": 4581} {"train_loss": -26.77872085571289, "global_step": 380301, "epoch": 4581} {"train_loss": -26.742725372314453, "global_step": 380302, "epoch": 4581} {"train_loss": -26.941198348999023, "global_step": 380303, "epoch": 4581} {"train_loss": -26.479217529296875, "global_step": 380304, "epoch": 4581} {"train_loss": -26.43700523836067, "global_step": 380305, "epoch": 4581, "val_loss": 6673650.0} {"train_loss": -25.1283016204834, "global_step": 380306, "epoch": 4582} {"train_loss": -25.554105758666992, "global_step": 380307, "epoch": 4582} {"train_loss": -24.920320510864258, "global_step": 380308, "epoch": 4582} {"train_loss": -25.54259490966797, "global_step": 380309, "epoch": 4582} {"train_loss": -24.64179801940918, "global_step": 380310, "epoch": 4582} {"train_loss": -24.95157814025879, "global_step": 380311, "epoch": 4582} {"train_loss": -25.95710563659668, "global_step": 380312, "epoch": 4582} {"train_loss": -25.526212692260742, "global_step": 380313, "epoch": 4582} {"train_loss": -25.510499954223633, "global_step": 380314, "epoch": 4582} {"train_loss": -25.750314712524414, "global_step": 380315, "epoch": 4582} {"train_loss": -25.45372200012207, "global_step": 380316, "epoch": 4582} {"train_loss": -26.236356735229492, "global_step": 380317, "epoch": 4582} {"train_loss": -25.4821834564209, "global_step": 380318, "epoch": 4582} {"train_loss": -26.326980590820312, "global_step": 380319, "epoch": 4582} {"train_loss": -25.94581413269043, "global_step": 380320, "epoch": 4582} {"train_loss": -25.988080978393555, "global_step": 380321, "epoch": 4582} {"train_loss": -25.95587730407715, "global_step": 380322, "epoch": 4582} {"train_loss": -25.77167320251465, "global_step": 380323, "epoch": 4582} {"train_loss": -26.06196403503418, "global_step": 380324, "epoch": 4582} {"train_loss": -25.89325523376465, "global_step": 380325, "epoch": 4582} {"train_loss": -26.187057495117188, "global_step": 380326, "epoch": 4582} {"train_loss": -25.770767211914062, "global_step": 380327, "epoch": 4582} {"train_loss": -26.410261154174805, "global_step": 380328, "epoch": 4582} {"train_loss": -26.06610107421875, "global_step": 380329, "epoch": 4582} {"train_loss": -26.031024932861328, "global_step": 380330, "epoch": 4582} {"train_loss": -26.358951568603516, "global_step": 380331, "epoch": 4582} {"train_loss": -26.18855094909668, "global_step": 380332, "epoch": 4582} {"train_loss": -26.299701690673828, "global_step": 380333, "epoch": 4582} {"train_loss": -26.30086326599121, "global_step": 380334, "epoch": 4582} {"train_loss": -26.452558517456055, "global_step": 380335, "epoch": 4582} {"train_loss": -26.60294532775879, "global_step": 380336, "epoch": 4582} {"train_loss": -26.11147117614746, "global_step": 380337, "epoch": 4582} {"train_loss": -26.467029571533203, "global_step": 380338, "epoch": 4582} {"train_loss": -26.308917999267578, "global_step": 380339, "epoch": 4582} {"train_loss": -26.220014572143555, "global_step": 380340, "epoch": 4582} {"train_loss": -26.460309982299805, "global_step": 380341, "epoch": 4582} {"train_loss": -26.557693481445312, "global_step": 380342, "epoch": 4582} {"train_loss": -27.109790802001953, "global_step": 380343, "epoch": 4582} {"train_loss": -26.58349609375, "global_step": 380344, "epoch": 4582} {"train_loss": -26.19258689880371, "global_step": 380345, "epoch": 4582} {"train_loss": -26.764240264892578, "global_step": 380346, "epoch": 4582} {"train_loss": -26.17304039001465, "global_step": 380347, "epoch": 4582} {"train_loss": -26.46365737915039, "global_step": 380348, "epoch": 4582} {"train_loss": -26.264270782470703, "global_step": 380349, "epoch": 4582} {"train_loss": -26.663476943969727, "global_step": 380350, "epoch": 4582} {"train_loss": -26.815168380737305, "global_step": 380351, "epoch": 4582} {"train_loss": -26.723295211791992, "global_step": 380352, "epoch": 4582} {"train_loss": -26.69329833984375, "global_step": 380353, "epoch": 4582} {"train_loss": -26.47532081604004, "global_step": 380354, "epoch": 4582} {"train_loss": -26.567914962768555, "global_step": 380355, "epoch": 4582} {"train_loss": -26.441091537475586, "global_step": 380356, "epoch": 4582} {"train_loss": -26.335248947143555, "global_step": 380357, "epoch": 4582} {"train_loss": -26.411283493041992, "global_step": 380358, "epoch": 4582} {"train_loss": -26.358129501342773, "global_step": 380359, "epoch": 4582} {"train_loss": -26.77046012878418, "global_step": 380360, "epoch": 4582} {"train_loss": -26.628881454467773, "global_step": 380361, "epoch": 4582} {"train_loss": -26.349567413330078, "global_step": 380362, "epoch": 4582} {"train_loss": -26.297101974487305, "global_step": 380363, "epoch": 4582} {"train_loss": -26.25165367126465, "global_step": 380364, "epoch": 4582} {"train_loss": -25.9349422454834, "global_step": 380365, "epoch": 4582} {"train_loss": -25.916135787963867, "global_step": 380366, "epoch": 4582} {"train_loss": -25.821508407592773, "global_step": 380367, "epoch": 4582} {"train_loss": -26.232685089111328, "global_step": 380368, "epoch": 4582} {"train_loss": -26.07159996032715, "global_step": 380369, "epoch": 4582} {"train_loss": -26.11421775817871, "global_step": 380370, "epoch": 4582} {"train_loss": -25.842945098876953, "global_step": 380371, "epoch": 4582} {"train_loss": -26.62255859375, "global_step": 380372, "epoch": 4582} {"train_loss": -26.295379638671875, "global_step": 380373, "epoch": 4582} {"train_loss": -25.804595947265625, "global_step": 380374, "epoch": 4582} {"train_loss": -25.843854904174805, "global_step": 380375, "epoch": 4582} {"train_loss": -25.764402389526367, "global_step": 380376, "epoch": 4582} {"train_loss": -25.34014892578125, "global_step": 380377, "epoch": 4582} {"train_loss": -26.6561279296875, "global_step": 380378, "epoch": 4582} {"train_loss": -26.072046279907227, "global_step": 380379, "epoch": 4582} {"train_loss": -26.595335006713867, "global_step": 380380, "epoch": 4582} {"train_loss": -26.41008949279785, "global_step": 380381, "epoch": 4582} {"train_loss": -26.407255172729492, "global_step": 380382, "epoch": 4582} {"train_loss": -26.055627822875977, "global_step": 380383, "epoch": 4582} {"train_loss": -26.551441192626953, "global_step": 380384, "epoch": 4582} {"train_loss": -26.36757469177246, "global_step": 380385, "epoch": 4582} {"train_loss": -26.462268829345703, "global_step": 380386, "epoch": 4582} {"train_loss": -26.411359786987305, "global_step": 380387, "epoch": 4582} {"train_loss": -26.14129615691771, "global_step": 380388, "epoch": 4582, "val_loss": 6597953.0} {"train_loss": -25.825408935546875, "global_step": 380389, "epoch": 4583} {"train_loss": -25.304906845092773, "global_step": 380390, "epoch": 4583} {"train_loss": -25.54979705810547, "global_step": 380391, "epoch": 4583} {"train_loss": -25.8963623046875, "global_step": 380392, "epoch": 4583} {"train_loss": -25.342435836791992, "global_step": 380393, "epoch": 4583} {"train_loss": -26.083637237548828, "global_step": 380394, "epoch": 4583} {"train_loss": -25.821548461914062, "global_step": 380395, "epoch": 4583} {"train_loss": -26.040647506713867, "global_step": 380396, "epoch": 4583} {"train_loss": -26.18902015686035, "global_step": 380397, "epoch": 4583} {"train_loss": -26.20654296875, "global_step": 380398, "epoch": 4583} {"train_loss": -25.902902603149414, "global_step": 380399, "epoch": 4583} {"train_loss": -25.717893600463867, "global_step": 380400, "epoch": 4583} {"train_loss": -26.12074089050293, "global_step": 380401, "epoch": 4583} {"train_loss": -26.150836944580078, "global_step": 380402, "epoch": 4583} {"train_loss": -26.232030868530273, "global_step": 380403, "epoch": 4583} {"train_loss": -25.87152671813965, "global_step": 380404, "epoch": 4583} {"train_loss": -26.319320678710938, "global_step": 380405, "epoch": 4583} {"train_loss": -26.589557647705078, "global_step": 380406, "epoch": 4583} {"train_loss": -26.26154136657715, "global_step": 380407, "epoch": 4583} {"train_loss": -26.302921295166016, "global_step": 380408, "epoch": 4583} {"train_loss": -26.113317489624023, "global_step": 380409, "epoch": 4583} {"train_loss": -26.430896759033203, "global_step": 380410, "epoch": 4583} {"train_loss": -26.14461326599121, "global_step": 380411, "epoch": 4583} {"train_loss": -26.03718376159668, "global_step": 380412, "epoch": 4583} {"train_loss": -26.495513916015625, "global_step": 380413, "epoch": 4583} {"train_loss": -26.488943099975586, "global_step": 380414, "epoch": 4583} {"train_loss": -26.527448654174805, "global_step": 380415, "epoch": 4583} {"train_loss": -26.278417587280273, "global_step": 380416, "epoch": 4583} {"train_loss": -26.501632690429688, "global_step": 380417, "epoch": 4583} {"train_loss": -26.54816246032715, "global_step": 380418, "epoch": 4583} {"train_loss": -26.347009658813477, "global_step": 380419, "epoch": 4583} {"train_loss": -26.503759384155273, "global_step": 380420, "epoch": 4583} {"train_loss": -26.3131103515625, "global_step": 380421, "epoch": 4583} {"train_loss": -26.54163932800293, "global_step": 380422, "epoch": 4583} {"train_loss": -26.728322982788086, "global_step": 380423, "epoch": 4583} {"train_loss": -26.35552978515625, "global_step": 380424, "epoch": 4583} {"train_loss": -26.749570846557617, "global_step": 380425, "epoch": 4583} {"train_loss": -26.55864906311035, "global_step": 380426, "epoch": 4583} {"train_loss": -26.73028564453125, "global_step": 380427, "epoch": 4583} {"train_loss": -26.997589111328125, "global_step": 380428, "epoch": 4583} {"train_loss": -26.558551788330078, "global_step": 380429, "epoch": 4583} {"train_loss": -26.803302764892578, "global_step": 380430, "epoch": 4583} {"train_loss": -26.321805953979492, "global_step": 380431, "epoch": 4583} {"train_loss": -26.58930015563965, "global_step": 380432, "epoch": 4583} {"train_loss": -26.576147079467773, "global_step": 380433, "epoch": 4583} {"train_loss": -26.4741153717041, "global_step": 380434, "epoch": 4583} {"train_loss": -26.297739028930664, "global_step": 380435, "epoch": 4583} {"train_loss": -26.643726348876953, "global_step": 380436, "epoch": 4583} {"train_loss": -26.87391471862793, "global_step": 380437, "epoch": 4583} {"train_loss": -26.794721603393555, "global_step": 380438, "epoch": 4583} {"train_loss": -26.750030517578125, "global_step": 380439, "epoch": 4583} {"train_loss": -26.45181655883789, "global_step": 380440, "epoch": 4583} {"train_loss": -26.697179794311523, "global_step": 380441, "epoch": 4583} {"train_loss": -26.89763832092285, "global_step": 380442, "epoch": 4583} {"train_loss": -26.807233810424805, "global_step": 380443, "epoch": 4583} {"train_loss": -26.429962158203125, "global_step": 380444, "epoch": 4583} {"train_loss": -26.452320098876953, "global_step": 380445, "epoch": 4583} {"train_loss": -26.647510528564453, "global_step": 380446, "epoch": 4583} {"train_loss": -26.20502281188965, "global_step": 380447, "epoch": 4583} {"train_loss": -25.995697021484375, "global_step": 380448, "epoch": 4583} {"train_loss": -24.921995162963867, "global_step": 380449, "epoch": 4583} {"train_loss": -24.435110092163086, "global_step": 380450, "epoch": 4583} {"train_loss": -25.652511596679688, "global_step": 380451, "epoch": 4583} {"train_loss": -25.84994888305664, "global_step": 380452, "epoch": 4583} {"train_loss": -25.24553108215332, "global_step": 380453, "epoch": 4583} {"train_loss": -25.358264923095703, "global_step": 380454, "epoch": 4583} {"train_loss": -26.0706729888916, "global_step": 380455, "epoch": 4583} {"train_loss": -25.827436447143555, "global_step": 380456, "epoch": 4583} {"train_loss": -25.832660675048828, "global_step": 380457, "epoch": 4583} {"train_loss": -26.14039421081543, "global_step": 380458, "epoch": 4583} {"train_loss": -25.61181640625, "global_step": 380459, "epoch": 4583} {"train_loss": -26.00058364868164, "global_step": 380460, "epoch": 4583} {"train_loss": -25.926755905151367, "global_step": 380461, "epoch": 4583} {"train_loss": -26.20389747619629, "global_step": 380462, "epoch": 4583} {"train_loss": -26.0261287689209, "global_step": 380463, "epoch": 4583} {"train_loss": -26.067956924438477, "global_step": 380464, "epoch": 4583} {"train_loss": -25.84946060180664, "global_step": 380465, "epoch": 4583} {"train_loss": -26.19915771484375, "global_step": 380466, "epoch": 4583} {"train_loss": -26.120386123657227, "global_step": 380467, "epoch": 4583} {"train_loss": -26.09734535217285, "global_step": 380468, "epoch": 4583} {"train_loss": -26.20355796813965, "global_step": 380469, "epoch": 4583} {"train_loss": -26.150278091430664, "global_step": 380470, "epoch": 4583} {"train_loss": -26.191723858017518, "global_step": 380471, "epoch": 4583, "val_loss": 6548666.0} {"train_loss": -26.293582916259766, "global_step": 380472, "epoch": 4584} {"train_loss": -26.394067764282227, "global_step": 380473, "epoch": 4584} {"train_loss": -26.17801284790039, "global_step": 380474, "epoch": 4584} {"train_loss": -26.33783531188965, "global_step": 380475, "epoch": 4584} {"train_loss": -25.98451042175293, "global_step": 380476, "epoch": 4584} {"train_loss": -26.254016876220703, "global_step": 380477, "epoch": 4584} {"train_loss": -26.101083755493164, "global_step": 380478, "epoch": 4584} {"train_loss": -26.25897216796875, "global_step": 380479, "epoch": 4584} {"train_loss": -26.0626277923584, "global_step": 380480, "epoch": 4584} {"train_loss": -26.10334587097168, "global_step": 380481, "epoch": 4584} {"train_loss": -26.278371810913086, "global_step": 380482, "epoch": 4584} {"train_loss": -26.286603927612305, "global_step": 380483, "epoch": 4584} {"train_loss": -26.109663009643555, "global_step": 380484, "epoch": 4584} {"train_loss": -26.074777603149414, "global_step": 380485, "epoch": 4584} {"train_loss": -26.4307861328125, "global_step": 380486, "epoch": 4584} {"train_loss": -26.210981369018555, "global_step": 380487, "epoch": 4584} {"train_loss": -26.237258911132812, "global_step": 380488, "epoch": 4584} {"train_loss": -26.52479362487793, "global_step": 380489, "epoch": 4584} {"train_loss": -26.499380111694336, "global_step": 380490, "epoch": 4584} {"train_loss": -26.358190536499023, "global_step": 380491, "epoch": 4584} {"train_loss": -26.72858238220215, "global_step": 380492, "epoch": 4584} {"train_loss": -26.42658042907715, "global_step": 380493, "epoch": 4584} {"train_loss": -26.450220108032227, "global_step": 380494, "epoch": 4584} {"train_loss": -26.614816665649414, "global_step": 380495, "epoch": 4584} {"train_loss": -26.86968421936035, "global_step": 380496, "epoch": 4584} {"train_loss": -26.60367774963379, "global_step": 380497, "epoch": 4584} {"train_loss": -26.990222930908203, "global_step": 380498, "epoch": 4584} {"train_loss": -26.69776725769043, "global_step": 380499, "epoch": 4584} {"train_loss": -26.454864501953125, "global_step": 380500, "epoch": 4584} {"train_loss": -26.5238094329834, "global_step": 380501, "epoch": 4584} {"train_loss": -26.71355628967285, "global_step": 380502, "epoch": 4584} {"train_loss": -26.619848251342773, "global_step": 380503, "epoch": 4584} {"train_loss": -26.293283462524414, "global_step": 380504, "epoch": 4584} {"train_loss": -26.34723472595215, "global_step": 380505, "epoch": 4584} {"train_loss": -26.220951080322266, "global_step": 380506, "epoch": 4584} {"train_loss": -26.528039932250977, "global_step": 380507, "epoch": 4584} {"train_loss": -26.723419189453125, "global_step": 380508, "epoch": 4584} {"train_loss": -26.693851470947266, "global_step": 380509, "epoch": 4584} {"train_loss": -26.634424209594727, "global_step": 380510, "epoch": 4584} {"train_loss": -26.0168514251709, "global_step": 380511, "epoch": 4584} {"train_loss": -26.571918487548828, "global_step": 380512, "epoch": 4584} {"train_loss": -26.881505966186523, "global_step": 380513, "epoch": 4584} {"train_loss": -26.1474666595459, "global_step": 380514, "epoch": 4584} {"train_loss": -26.38616371154785, "global_step": 380515, "epoch": 4584} {"train_loss": -26.54725456237793, "global_step": 380516, "epoch": 4584} {"train_loss": -26.477039337158203, "global_step": 380517, "epoch": 4584} {"train_loss": -26.113449096679688, "global_step": 380518, "epoch": 4584} {"train_loss": -26.324848175048828, "global_step": 380519, "epoch": 4584} {"train_loss": -26.498794555664062, "global_step": 380520, "epoch": 4584} {"train_loss": -26.353891372680664, "global_step": 380521, "epoch": 4584} {"train_loss": -26.101709365844727, "global_step": 380522, "epoch": 4584} {"train_loss": -26.432952880859375, "global_step": 380523, "epoch": 4584} {"train_loss": -26.159473419189453, "global_step": 380524, "epoch": 4584} {"train_loss": -26.44464111328125, "global_step": 380525, "epoch": 4584} {"train_loss": -26.596607208251953, "global_step": 380526, "epoch": 4584} {"train_loss": -26.515588760375977, "global_step": 380527, "epoch": 4584} {"train_loss": -26.67056655883789, "global_step": 380528, "epoch": 4584} {"train_loss": -25.868295669555664, "global_step": 380529, "epoch": 4584} {"train_loss": -26.26218605041504, "global_step": 380530, "epoch": 4584} {"train_loss": -26.407764434814453, "global_step": 380531, "epoch": 4584} {"train_loss": -26.446502685546875, "global_step": 380532, "epoch": 4584} {"train_loss": -26.375463485717773, "global_step": 380533, "epoch": 4584} {"train_loss": -26.565387725830078, "global_step": 380534, "epoch": 4584} {"train_loss": -26.243133544921875, "global_step": 380535, "epoch": 4584} {"train_loss": -26.438928604125977, "global_step": 380536, "epoch": 4584} {"train_loss": -25.95856285095215, "global_step": 380537, "epoch": 4584} {"train_loss": -26.1044921875, "global_step": 380538, "epoch": 4584} {"train_loss": -26.2733097076416, "global_step": 380539, "epoch": 4584} {"train_loss": -26.933258056640625, "global_step": 380540, "epoch": 4584} {"train_loss": -26.6639347076416, "global_step": 380541, "epoch": 4584} {"train_loss": -26.288541793823242, "global_step": 380542, "epoch": 4584} {"train_loss": -26.61404800415039, "global_step": 380543, "epoch": 4584} {"train_loss": -26.37799644470215, "global_step": 380544, "epoch": 4584} {"train_loss": -26.62685203552246, "global_step": 380545, "epoch": 4584} {"train_loss": -26.312458038330078, "global_step": 380546, "epoch": 4584} {"train_loss": -26.372507095336914, "global_step": 380547, "epoch": 4584} {"train_loss": -26.485891342163086, "global_step": 380548, "epoch": 4584} {"train_loss": -26.651779174804688, "global_step": 380549, "epoch": 4584} {"train_loss": -26.344663619995117, "global_step": 380550, "epoch": 4584} {"train_loss": -26.101165771484375, "global_step": 380551, "epoch": 4584} {"train_loss": -26.778417587280273, "global_step": 380552, "epoch": 4584} {"train_loss": -26.08721923828125, "global_step": 380553, "epoch": 4584} {"train_loss": -26.40569110089038, "global_step": 380554, "epoch": 4584, "val_loss": 6679926.0} {"train_loss": -25.826374053955078, "global_step": 380555, "epoch": 4585} {"train_loss": -25.392309188842773, "global_step": 380556, "epoch": 4585} {"train_loss": -25.859006881713867, "global_step": 380557, "epoch": 4585} {"train_loss": -26.0264892578125, "global_step": 380558, "epoch": 4585} {"train_loss": -25.60747718811035, "global_step": 380559, "epoch": 4585} {"train_loss": -26.026235580444336, "global_step": 380560, "epoch": 4585} {"train_loss": -26.07583999633789, "global_step": 380561, "epoch": 4585} {"train_loss": -25.63492774963379, "global_step": 380562, "epoch": 4585} {"train_loss": -26.44194984436035, "global_step": 380563, "epoch": 4585} {"train_loss": -25.707117080688477, "global_step": 380564, "epoch": 4585} {"train_loss": -26.40407371520996, "global_step": 380565, "epoch": 4585} {"train_loss": -26.182998657226562, "global_step": 380566, "epoch": 4585} {"train_loss": -26.429306030273438, "global_step": 380567, "epoch": 4585} {"train_loss": -26.00591468811035, "global_step": 380568, "epoch": 4585} {"train_loss": -25.898696899414062, "global_step": 380569, "epoch": 4585} {"train_loss": -25.97486686706543, "global_step": 380570, "epoch": 4585} {"train_loss": -26.55964469909668, "global_step": 380571, "epoch": 4585} {"train_loss": -25.690444946289062, "global_step": 380572, "epoch": 4585} {"train_loss": -26.092016220092773, "global_step": 380573, "epoch": 4585} {"train_loss": -26.055341720581055, "global_step": 380574, "epoch": 4585} {"train_loss": -26.46647071838379, "global_step": 380575, "epoch": 4585} {"train_loss": -26.20733642578125, "global_step": 380576, "epoch": 4585} {"train_loss": -25.967212677001953, "global_step": 380577, "epoch": 4585} {"train_loss": -26.28803062438965, "global_step": 380578, "epoch": 4585} {"train_loss": -26.181543350219727, "global_step": 380579, "epoch": 4585} {"train_loss": -26.07267189025879, "global_step": 380580, "epoch": 4585} {"train_loss": -26.25274658203125, "global_step": 380581, "epoch": 4585} {"train_loss": -26.186664581298828, "global_step": 380582, "epoch": 4585} {"train_loss": -26.471323013305664, "global_step": 380583, "epoch": 4585} {"train_loss": -25.907052993774414, "global_step": 380584, "epoch": 4585} {"train_loss": -26.038244247436523, "global_step": 380585, "epoch": 4585} {"train_loss": -26.408187866210938, "global_step": 380586, "epoch": 4585} {"train_loss": -26.209735870361328, "global_step": 380587, "epoch": 4585} {"train_loss": -26.318119049072266, "global_step": 380588, "epoch": 4585} {"train_loss": -26.250534057617188, "global_step": 380589, "epoch": 4585} {"train_loss": -26.67536735534668, "global_step": 380590, "epoch": 4585} {"train_loss": -26.388229370117188, "global_step": 380591, "epoch": 4585} {"train_loss": -26.407373428344727, "global_step": 380592, "epoch": 4585} {"train_loss": -26.356481552124023, "global_step": 380593, "epoch": 4585} {"train_loss": -26.36712074279785, "global_step": 380594, "epoch": 4585} {"train_loss": -26.43269157409668, "global_step": 380595, "epoch": 4585} {"train_loss": -26.072952270507812, "global_step": 380596, "epoch": 4585} {"train_loss": -26.169347763061523, "global_step": 380597, "epoch": 4585} {"train_loss": -26.42567253112793, "global_step": 380598, "epoch": 4585} {"train_loss": -26.612247467041016, "global_step": 380599, "epoch": 4585} {"train_loss": -26.37409782409668, "global_step": 380600, "epoch": 4585} {"train_loss": -26.41587257385254, "global_step": 380601, "epoch": 4585} {"train_loss": -26.43536376953125, "global_step": 380602, "epoch": 4585} {"train_loss": -26.517332077026367, "global_step": 380603, "epoch": 4585} {"train_loss": -26.895849227905273, "global_step": 380604, "epoch": 4585} {"train_loss": -26.533599853515625, "global_step": 380605, "epoch": 4585} {"train_loss": -26.290536880493164, "global_step": 380606, "epoch": 4585} {"train_loss": -26.640771865844727, "global_step": 380607, "epoch": 4585} {"train_loss": -26.7365779876709, "global_step": 380608, "epoch": 4585} {"train_loss": -26.506183624267578, "global_step": 380609, "epoch": 4585} {"train_loss": -26.670133590698242, "global_step": 380610, "epoch": 4585} {"train_loss": -26.609960556030273, "global_step": 380611, "epoch": 4585} {"train_loss": -26.53420066833496, "global_step": 380612, "epoch": 4585} {"train_loss": -26.62652587890625, "global_step": 380613, "epoch": 4585} {"train_loss": -26.32985496520996, "global_step": 380614, "epoch": 4585} {"train_loss": -26.529417037963867, "global_step": 380615, "epoch": 4585} {"train_loss": -26.65744400024414, "global_step": 380616, "epoch": 4585} {"train_loss": -26.946393966674805, "global_step": 380617, "epoch": 4585} {"train_loss": -26.561399459838867, "global_step": 380618, "epoch": 4585} {"train_loss": -26.857603073120117, "global_step": 380619, "epoch": 4585} {"train_loss": -26.285993576049805, "global_step": 380620, "epoch": 4585} {"train_loss": -26.749393463134766, "global_step": 380621, "epoch": 4585} {"train_loss": -26.749357223510742, "global_step": 380622, "epoch": 4585} {"train_loss": -26.266767501831055, "global_step": 380623, "epoch": 4585} {"train_loss": -26.736225128173828, "global_step": 380624, "epoch": 4585} {"train_loss": -26.226947784423828, "global_step": 380625, "epoch": 4585} {"train_loss": -26.246137619018555, "global_step": 380626, "epoch": 4585} {"train_loss": -26.7252254486084, "global_step": 380627, "epoch": 4585} {"train_loss": -26.4310359954834, "global_step": 380628, "epoch": 4585} {"train_loss": -26.353626251220703, "global_step": 380629, "epoch": 4585} {"train_loss": -26.428186416625977, "global_step": 380630, "epoch": 4585} {"train_loss": -26.636478424072266, "global_step": 380631, "epoch": 4585} {"train_loss": -26.682722091674805, "global_step": 380632, "epoch": 4585} {"train_loss": -26.9127197265625, "global_step": 380633, "epoch": 4585} {"train_loss": -26.549306869506836, "global_step": 380634, "epoch": 4585} {"train_loss": -26.230396270751953, "global_step": 380635, "epoch": 4585} {"train_loss": -26.466327667236328, "global_step": 380636, "epoch": 4585} {"train_loss": -26.325457423566334, "global_step": 380637, "epoch": 4585, "val_loss": 6617318.0} {"train_loss": -25.452062606811523, "global_step": 380638, "epoch": 4586} {"train_loss": -24.959278106689453, "global_step": 380639, "epoch": 4586} {"train_loss": -26.029220581054688, "global_step": 380640, "epoch": 4586} {"train_loss": -25.668365478515625, "global_step": 380641, "epoch": 4586} {"train_loss": -25.94173240661621, "global_step": 380642, "epoch": 4586} {"train_loss": -25.410558700561523, "global_step": 380643, "epoch": 4586} {"train_loss": -26.00042724609375, "global_step": 380644, "epoch": 4586} {"train_loss": -26.02666664123535, "global_step": 380645, "epoch": 4586} {"train_loss": -26.15679931640625, "global_step": 380646, "epoch": 4586} {"train_loss": -25.89850425720215, "global_step": 380647, "epoch": 4586} {"train_loss": -26.135236740112305, "global_step": 380648, "epoch": 4586} {"train_loss": -26.054370880126953, "global_step": 380649, "epoch": 4586} {"train_loss": -26.266263961791992, "global_step": 380650, "epoch": 4586} {"train_loss": -26.25031089782715, "global_step": 380651, "epoch": 4586} {"train_loss": -25.851825714111328, "global_step": 380652, "epoch": 4586} {"train_loss": -25.911611557006836, "global_step": 380653, "epoch": 4586} {"train_loss": -26.1030330657959, "global_step": 380654, "epoch": 4586} {"train_loss": -26.207611083984375, "global_step": 380655, "epoch": 4586} {"train_loss": -26.300546646118164, "global_step": 380656, "epoch": 4586} {"train_loss": -26.037099838256836, "global_step": 380657, "epoch": 4586} {"train_loss": -26.29815673828125, "global_step": 380658, "epoch": 4586} {"train_loss": -26.163854598999023, "global_step": 380659, "epoch": 4586} {"train_loss": -26.28533935546875, "global_step": 380660, "epoch": 4586} {"train_loss": -26.223831176757812, "global_step": 380661, "epoch": 4586} {"train_loss": -26.566059112548828, "global_step": 380662, "epoch": 4586} {"train_loss": -26.26096534729004, "global_step": 380663, "epoch": 4586} {"train_loss": -26.55531883239746, "global_step": 380664, "epoch": 4586} {"train_loss": -26.372655868530273, "global_step": 380665, "epoch": 4586} {"train_loss": -26.47357177734375, "global_step": 380666, "epoch": 4586} {"train_loss": -26.521549224853516, "global_step": 380667, "epoch": 4586} {"train_loss": -26.628564834594727, "global_step": 380668, "epoch": 4586} {"train_loss": -26.37442398071289, "global_step": 380669, "epoch": 4586} {"train_loss": -26.596704483032227, "global_step": 380670, "epoch": 4586} {"train_loss": -26.566761016845703, "global_step": 380671, "epoch": 4586} {"train_loss": -26.324234008789062, "global_step": 380672, "epoch": 4586} {"train_loss": -26.34284019470215, "global_step": 380673, "epoch": 4586} {"train_loss": -26.849462509155273, "global_step": 380674, "epoch": 4586} {"train_loss": -26.54896354675293, "global_step": 380675, "epoch": 4586} {"train_loss": -26.281906127929688, "global_step": 380676, "epoch": 4586} {"train_loss": -26.529556274414062, "global_step": 380677, "epoch": 4586} {"train_loss": -26.81031608581543, "global_step": 380678, "epoch": 4586} {"train_loss": -26.86067008972168, "global_step": 380679, "epoch": 4586} {"train_loss": -26.451520919799805, "global_step": 380680, "epoch": 4586} {"train_loss": -26.53986930847168, "global_step": 380681, "epoch": 4586} {"train_loss": -26.774810791015625, "global_step": 380682, "epoch": 4586} {"train_loss": -26.567291259765625, "global_step": 380683, "epoch": 4586} {"train_loss": -26.558847427368164, "global_step": 380684, "epoch": 4586} {"train_loss": -26.566547393798828, "global_step": 380685, "epoch": 4586} {"train_loss": -26.42486572265625, "global_step": 380686, "epoch": 4586} {"train_loss": -26.41607666015625, "global_step": 380687, "epoch": 4586} {"train_loss": -26.16755485534668, "global_step": 380688, "epoch": 4586} {"train_loss": -26.567975997924805, "global_step": 380689, "epoch": 4586} {"train_loss": -26.31662940979004, "global_step": 380690, "epoch": 4586} {"train_loss": -26.17901039123535, "global_step": 380691, "epoch": 4586} {"train_loss": -26.284467697143555, "global_step": 380692, "epoch": 4586} {"train_loss": -26.82757568359375, "global_step": 380693, "epoch": 4586} {"train_loss": -26.645193099975586, "global_step": 380694, "epoch": 4586} {"train_loss": -26.27741813659668, "global_step": 380695, "epoch": 4586} {"train_loss": -26.34990882873535, "global_step": 380696, "epoch": 4586} {"train_loss": -26.452573776245117, "global_step": 380697, "epoch": 4586} {"train_loss": -26.19522476196289, "global_step": 380698, "epoch": 4586} {"train_loss": -26.4870662689209, "global_step": 380699, "epoch": 4586} {"train_loss": -27.004362106323242, "global_step": 380700, "epoch": 4586} {"train_loss": -26.3424129486084, "global_step": 380701, "epoch": 4586} {"train_loss": -26.2637882232666, "global_step": 380702, "epoch": 4586} {"train_loss": -26.316083908081055, "global_step": 380703, "epoch": 4586} {"train_loss": -26.498004913330078, "global_step": 380704, "epoch": 4586} {"train_loss": -26.5805606842041, "global_step": 380705, "epoch": 4586} {"train_loss": -26.293359756469727, "global_step": 380706, "epoch": 4586} {"train_loss": -26.21478271484375, "global_step": 380707, "epoch": 4586} {"train_loss": -26.305078506469727, "global_step": 380708, "epoch": 4586} {"train_loss": -26.887502670288086, "global_step": 380709, "epoch": 4586} {"train_loss": -26.500051498413086, "global_step": 380710, "epoch": 4586} {"train_loss": -26.460596084594727, "global_step": 380711, "epoch": 4586} {"train_loss": -26.552448272705078, "global_step": 380712, "epoch": 4586} {"train_loss": -26.6169376373291, "global_step": 380713, "epoch": 4586} {"train_loss": -26.547531127929688, "global_step": 380714, "epoch": 4586} {"train_loss": -26.383289337158203, "global_step": 380715, "epoch": 4586} {"train_loss": -26.474145889282227, "global_step": 380716, "epoch": 4586} {"train_loss": -25.894214630126953, "global_step": 380717, "epoch": 4586} {"train_loss": -26.297870635986328, "global_step": 380718, "epoch": 4586} {"train_loss": -26.657913208007812, "global_step": 380719, "epoch": 4586} {"train_loss": -26.345732217811676, "global_step": 380720, "epoch": 4586, "val_loss": 6553501.0} {"train_loss": -25.22498893737793, "global_step": 380721, "epoch": 4587} {"train_loss": -24.449487686157227, "global_step": 380722, "epoch": 4587} {"train_loss": -26.389684677124023, "global_step": 380723, "epoch": 4587} {"train_loss": -24.68768882751465, "global_step": 380724, "epoch": 4587} {"train_loss": -25.374666213989258, "global_step": 380725, "epoch": 4587} {"train_loss": -25.518939971923828, "global_step": 380726, "epoch": 4587} {"train_loss": -25.831830978393555, "global_step": 380727, "epoch": 4587} {"train_loss": -25.560199737548828, "global_step": 380728, "epoch": 4587} {"train_loss": -25.88983154296875, "global_step": 380729, "epoch": 4587} {"train_loss": -25.75906753540039, "global_step": 380730, "epoch": 4587} {"train_loss": -25.804840087890625, "global_step": 380731, "epoch": 4587} {"train_loss": -25.935138702392578, "global_step": 380732, "epoch": 4587} {"train_loss": -25.846261978149414, "global_step": 380733, "epoch": 4587} {"train_loss": -25.66291618347168, "global_step": 380734, "epoch": 4587} {"train_loss": -25.679244995117188, "global_step": 380735, "epoch": 4587} {"train_loss": -25.45261001586914, "global_step": 380736, "epoch": 4587} {"train_loss": -26.40704917907715, "global_step": 380737, "epoch": 4587} {"train_loss": -25.537076950073242, "global_step": 380738, "epoch": 4587} {"train_loss": -25.933856964111328, "global_step": 380739, "epoch": 4587} {"train_loss": -25.981616973876953, "global_step": 380740, "epoch": 4587} {"train_loss": -25.556915283203125, "global_step": 380741, "epoch": 4587} {"train_loss": -25.742197036743164, "global_step": 380742, "epoch": 4587} {"train_loss": -25.87821388244629, "global_step": 380743, "epoch": 4587} {"train_loss": -26.111358642578125, "global_step": 380744, "epoch": 4587} {"train_loss": -25.807861328125, "global_step": 380745, "epoch": 4587} {"train_loss": -26.290578842163086, "global_step": 380746, "epoch": 4587} {"train_loss": -26.090290069580078, "global_step": 380747, "epoch": 4587} {"train_loss": -26.65717887878418, "global_step": 380748, "epoch": 4587} {"train_loss": -26.33625602722168, "global_step": 380749, "epoch": 4587} {"train_loss": -26.39656639099121, "global_step": 380750, "epoch": 4587} {"train_loss": -26.504562377929688, "global_step": 380751, "epoch": 4587} {"train_loss": -26.314865112304688, "global_step": 380752, "epoch": 4587} {"train_loss": -26.41998291015625, "global_step": 380753, "epoch": 4587} {"train_loss": -26.342344284057617, "global_step": 380754, "epoch": 4587} {"train_loss": -26.284067153930664, "global_step": 380755, "epoch": 4587} {"train_loss": -26.174829483032227, "global_step": 380756, "epoch": 4587} {"train_loss": -26.646930694580078, "global_step": 380757, "epoch": 4587} {"train_loss": -26.420995712280273, "global_step": 380758, "epoch": 4587} {"train_loss": -26.566593170166016, "global_step": 380759, "epoch": 4587} {"train_loss": -26.27734375, "global_step": 380760, "epoch": 4587} {"train_loss": -26.248823165893555, "global_step": 380761, "epoch": 4587} {"train_loss": -26.445554733276367, "global_step": 380762, "epoch": 4587} {"train_loss": -26.22296714782715, "global_step": 380763, "epoch": 4587} {"train_loss": -26.550519943237305, "global_step": 380764, "epoch": 4587} {"train_loss": -26.673343658447266, "global_step": 380765, "epoch": 4587} {"train_loss": -26.733386993408203, "global_step": 380766, "epoch": 4587} {"train_loss": -26.5752010345459, "global_step": 380767, "epoch": 4587} {"train_loss": -26.411945343017578, "global_step": 380768, "epoch": 4587} {"train_loss": -26.804859161376953, "global_step": 380769, "epoch": 4587} {"train_loss": -26.0279483795166, "global_step": 380770, "epoch": 4587} {"train_loss": -26.367355346679688, "global_step": 380771, "epoch": 4587} {"train_loss": -26.45562171936035, "global_step": 380772, "epoch": 4587} {"train_loss": -26.651885986328125, "global_step": 380773, "epoch": 4587} {"train_loss": -26.480436325073242, "global_step": 380774, "epoch": 4587} {"train_loss": -26.22089958190918, "global_step": 380775, "epoch": 4587} {"train_loss": -26.222015380859375, "global_step": 380776, "epoch": 4587} {"train_loss": -26.069671630859375, "global_step": 380777, "epoch": 4587} {"train_loss": -26.459787368774414, "global_step": 380778, "epoch": 4587} {"train_loss": -26.328296661376953, "global_step": 380779, "epoch": 4587} {"train_loss": -26.152755737304688, "global_step": 380780, "epoch": 4587} {"train_loss": -26.206518173217773, "global_step": 380781, "epoch": 4587} {"train_loss": -26.51112937927246, "global_step": 380782, "epoch": 4587} {"train_loss": -26.668989181518555, "global_step": 380783, "epoch": 4587} {"train_loss": -26.342987060546875, "global_step": 380784, "epoch": 4587} {"train_loss": -26.186538696289062, "global_step": 380785, "epoch": 4587} {"train_loss": -25.880895614624023, "global_step": 380786, "epoch": 4587} {"train_loss": -26.075376510620117, "global_step": 380787, "epoch": 4587} {"train_loss": -26.881200790405273, "global_step": 380788, "epoch": 4587} {"train_loss": -26.65467643737793, "global_step": 380789, "epoch": 4587} {"train_loss": -26.766935348510742, "global_step": 380790, "epoch": 4587} {"train_loss": -26.33452796936035, "global_step": 380791, "epoch": 4587} {"train_loss": -26.234500885009766, "global_step": 380792, "epoch": 4587} {"train_loss": -26.4741153717041, "global_step": 380793, "epoch": 4587} {"train_loss": -26.571924209594727, "global_step": 380794, "epoch": 4587} {"train_loss": -26.61026954650879, "global_step": 380795, "epoch": 4587} {"train_loss": -26.088743209838867, "global_step": 380796, "epoch": 4587} {"train_loss": -26.5766544342041, "global_step": 380797, "epoch": 4587} {"train_loss": -26.28816795349121, "global_step": 380798, "epoch": 4587} {"train_loss": -26.46973991394043, "global_step": 380799, "epoch": 4587} {"train_loss": -26.231359481811523, "global_step": 380800, "epoch": 4587} {"train_loss": -26.43499755859375, "global_step": 380801, "epoch": 4587} {"train_loss": -26.191259384155273, "global_step": 380802, "epoch": 4587} {"train_loss": -26.168574367661073, "global_step": 380803, "epoch": 4587, "val_loss": 6600801.0} {"train_loss": -24.20479393005371, "global_step": 380804, "epoch": 4588} {"train_loss": -25.139684677124023, "global_step": 380805, "epoch": 4588} {"train_loss": -25.222423553466797, "global_step": 380806, "epoch": 4588} {"train_loss": -24.707754135131836, "global_step": 380807, "epoch": 4588} {"train_loss": -25.970935821533203, "global_step": 380808, "epoch": 4588} {"train_loss": -24.7872314453125, "global_step": 380809, "epoch": 4588} {"train_loss": -26.425474166870117, "global_step": 380810, "epoch": 4588} {"train_loss": -25.410675048828125, "global_step": 380811, "epoch": 4588} {"train_loss": -25.9645938873291, "global_step": 380812, "epoch": 4588} {"train_loss": -26.110305786132812, "global_step": 380813, "epoch": 4588} {"train_loss": -25.885578155517578, "global_step": 380814, "epoch": 4588} {"train_loss": -26.000173568725586, "global_step": 380815, "epoch": 4588} {"train_loss": -25.8132381439209, "global_step": 380816, "epoch": 4588} {"train_loss": -26.097631454467773, "global_step": 380817, "epoch": 4588} {"train_loss": -25.85055923461914, "global_step": 380818, "epoch": 4588} {"train_loss": -26.235815048217773, "global_step": 380819, "epoch": 4588} {"train_loss": -25.85003662109375, "global_step": 380820, "epoch": 4588} {"train_loss": -26.169931411743164, "global_step": 380821, "epoch": 4588} {"train_loss": -26.109745025634766, "global_step": 380822, "epoch": 4588} {"train_loss": -26.0029239654541, "global_step": 380823, "epoch": 4588} {"train_loss": -25.903228759765625, "global_step": 380824, "epoch": 4588} {"train_loss": -25.90296745300293, "global_step": 380825, "epoch": 4588} {"train_loss": -26.094945907592773, "global_step": 380826, "epoch": 4588} {"train_loss": -25.834253311157227, "global_step": 380827, "epoch": 4588} {"train_loss": -26.194110870361328, "global_step": 380828, "epoch": 4588} {"train_loss": -26.021276473999023, "global_step": 380829, "epoch": 4588} {"train_loss": -26.45216178894043, "global_step": 380830, "epoch": 4588} {"train_loss": -26.141996383666992, "global_step": 380831, "epoch": 4588} {"train_loss": -25.936166763305664, "global_step": 380832, "epoch": 4588} {"train_loss": -26.371702194213867, "global_step": 380833, "epoch": 4588} {"train_loss": -26.205371856689453, "global_step": 380834, "epoch": 4588} {"train_loss": -25.955976486206055, "global_step": 380835, "epoch": 4588} {"train_loss": -26.31354331970215, "global_step": 380836, "epoch": 4588} {"train_loss": -26.378437042236328, "global_step": 380837, "epoch": 4588} {"train_loss": -26.07560157775879, "global_step": 380838, "epoch": 4588} {"train_loss": -26.029584884643555, "global_step": 380839, "epoch": 4588} {"train_loss": -26.003454208374023, "global_step": 380840, "epoch": 4588} {"train_loss": -26.686559677124023, "global_step": 380841, "epoch": 4588} {"train_loss": -26.379165649414062, "global_step": 380842, "epoch": 4588} {"train_loss": -26.406478881835938, "global_step": 380843, "epoch": 4588} {"train_loss": -26.571704864501953, "global_step": 380844, "epoch": 4588} {"train_loss": -26.292388916015625, "global_step": 380845, "epoch": 4588} {"train_loss": -26.30929946899414, "global_step": 380846, "epoch": 4588} {"train_loss": -26.199481964111328, "global_step": 380847, "epoch": 4588} {"train_loss": -26.23419189453125, "global_step": 380848, "epoch": 4588} {"train_loss": -26.363683700561523, "global_step": 380849, "epoch": 4588} {"train_loss": -26.77166175842285, "global_step": 380850, "epoch": 4588} {"train_loss": -26.76272964477539, "global_step": 380851, "epoch": 4588} {"train_loss": -26.52937126159668, "global_step": 380852, "epoch": 4588} {"train_loss": -26.23993492126465, "global_step": 380853, "epoch": 4588} {"train_loss": -26.149173736572266, "global_step": 380854, "epoch": 4588} {"train_loss": -26.2218017578125, "global_step": 380855, "epoch": 4588} {"train_loss": -26.14459228515625, "global_step": 380856, "epoch": 4588} {"train_loss": -26.28118324279785, "global_step": 380857, "epoch": 4588} {"train_loss": -26.525381088256836, "global_step": 380858, "epoch": 4588} {"train_loss": -26.347875595092773, "global_step": 380859, "epoch": 4588} {"train_loss": -26.693578720092773, "global_step": 380860, "epoch": 4588} {"train_loss": -26.491535186767578, "global_step": 380861, "epoch": 4588} {"train_loss": -26.235254287719727, "global_step": 380862, "epoch": 4588} {"train_loss": -26.4035701751709, "global_step": 380863, "epoch": 4588} {"train_loss": -26.40999412536621, "global_step": 380864, "epoch": 4588} {"train_loss": -26.70191764831543, "global_step": 380865, "epoch": 4588} {"train_loss": -26.639957427978516, "global_step": 380866, "epoch": 4588} {"train_loss": -26.296314239501953, "global_step": 380867, "epoch": 4588} {"train_loss": -26.335987091064453, "global_step": 380868, "epoch": 4588} {"train_loss": -26.3743839263916, "global_step": 380869, "epoch": 4588} {"train_loss": -26.8796329498291, "global_step": 380870, "epoch": 4588} {"train_loss": -26.892812728881836, "global_step": 380871, "epoch": 4588} {"train_loss": -26.290979385375977, "global_step": 380872, "epoch": 4588} {"train_loss": -26.72620964050293, "global_step": 380873, "epoch": 4588} {"train_loss": -26.850967407226562, "global_step": 380874, "epoch": 4588} {"train_loss": -26.62603187561035, "global_step": 380875, "epoch": 4588} {"train_loss": -26.90656089782715, "global_step": 380876, "epoch": 4588} {"train_loss": -26.368688583374023, "global_step": 380877, "epoch": 4588} {"train_loss": -27.034116744995117, "global_step": 380878, "epoch": 4588} {"train_loss": -26.664358139038086, "global_step": 380879, "epoch": 4588} {"train_loss": -26.413501739501953, "global_step": 380880, "epoch": 4588} {"train_loss": -26.446401596069336, "global_step": 380881, "epoch": 4588} {"train_loss": -26.586688995361328, "global_step": 380882, "epoch": 4588} {"train_loss": -26.805212020874023, "global_step": 380883, "epoch": 4588} {"train_loss": -26.269678115844727, "global_step": 380884, "epoch": 4588} {"train_loss": -26.4295711517334, "global_step": 380885, "epoch": 4588} {"train_loss": -26.227680734841222, "global_step": 380886, "epoch": 4588, "val_loss": 6596399.0} {"train_loss": -26.057098388671875, "global_step": 380887, "epoch": 4589} {"train_loss": -25.936872482299805, "global_step": 380888, "epoch": 4589} {"train_loss": -25.779916763305664, "global_step": 380889, "epoch": 4589} {"train_loss": -25.6950626373291, "global_step": 380890, "epoch": 4589} {"train_loss": -25.945362091064453, "global_step": 380891, "epoch": 4589} {"train_loss": -26.003721237182617, "global_step": 380892, "epoch": 4589} {"train_loss": -26.103418350219727, "global_step": 380893, "epoch": 4589} {"train_loss": -25.759531021118164, "global_step": 380894, "epoch": 4589} {"train_loss": -26.32366943359375, "global_step": 380895, "epoch": 4589} {"train_loss": -25.9554443359375, "global_step": 380896, "epoch": 4589} {"train_loss": -25.898426055908203, "global_step": 380897, "epoch": 4589} {"train_loss": -26.417633056640625, "global_step": 380898, "epoch": 4589} {"train_loss": -26.279376983642578, "global_step": 380899, "epoch": 4589} {"train_loss": -26.423023223876953, "global_step": 380900, "epoch": 4589} {"train_loss": -26.45892906188965, "global_step": 380901, "epoch": 4589} {"train_loss": -26.70796012878418, "global_step": 380902, "epoch": 4589} {"train_loss": -26.245656967163086, "global_step": 380903, "epoch": 4589} {"train_loss": -26.55950927734375, "global_step": 380904, "epoch": 4589} {"train_loss": -26.516199111938477, "global_step": 380905, "epoch": 4589} {"train_loss": -26.458240509033203, "global_step": 380906, "epoch": 4589} {"train_loss": -26.073476791381836, "global_step": 380907, "epoch": 4589} {"train_loss": -26.38605308532715, "global_step": 380908, "epoch": 4589} {"train_loss": -26.118188858032227, "global_step": 380909, "epoch": 4589} {"train_loss": -26.174579620361328, "global_step": 380910, "epoch": 4589} {"train_loss": -26.596399307250977, "global_step": 380911, "epoch": 4589} {"train_loss": -26.563709259033203, "global_step": 380912, "epoch": 4589} {"train_loss": -26.594898223876953, "global_step": 380913, "epoch": 4589} {"train_loss": -26.7952938079834, "global_step": 380914, "epoch": 4589} {"train_loss": -26.453357696533203, "global_step": 380915, "epoch": 4589} {"train_loss": -26.42218589782715, "global_step": 380916, "epoch": 4589} {"train_loss": -26.5502986907959, "global_step": 380917, "epoch": 4589} {"train_loss": -26.3580322265625, "global_step": 380918, "epoch": 4589} {"train_loss": -26.282978057861328, "global_step": 380919, "epoch": 4589} {"train_loss": -26.37909507751465, "global_step": 380920, "epoch": 4589} {"train_loss": -26.636260986328125, "global_step": 380921, "epoch": 4589} {"train_loss": -26.72431755065918, "global_step": 380922, "epoch": 4589} {"train_loss": -26.703657150268555, "global_step": 380923, "epoch": 4589} {"train_loss": -26.66290855407715, "global_step": 380924, "epoch": 4589} {"train_loss": -27.107715606689453, "global_step": 380925, "epoch": 4589} {"train_loss": -26.620594024658203, "global_step": 380926, "epoch": 4589} {"train_loss": -26.663410186767578, "global_step": 380927, "epoch": 4589} {"train_loss": -26.272485733032227, "global_step": 380928, "epoch": 4589} {"train_loss": -26.79266357421875, "global_step": 380929, "epoch": 4589} {"train_loss": -26.5461483001709, "global_step": 380930, "epoch": 4589} {"train_loss": -26.390905380249023, "global_step": 380931, "epoch": 4589} {"train_loss": -25.922876358032227, "global_step": 380932, "epoch": 4589} {"train_loss": -25.97456169128418, "global_step": 380933, "epoch": 4589} {"train_loss": -25.403474807739258, "global_step": 380934, "epoch": 4589} {"train_loss": -25.832096099853516, "global_step": 380935, "epoch": 4589} {"train_loss": -26.003299713134766, "global_step": 380936, "epoch": 4589} {"train_loss": -25.993940353393555, "global_step": 380937, "epoch": 4589} {"train_loss": -26.71424674987793, "global_step": 380938, "epoch": 4589} {"train_loss": -26.03370475769043, "global_step": 380939, "epoch": 4589} {"train_loss": -26.4250545501709, "global_step": 380940, "epoch": 4589} {"train_loss": -26.267377853393555, "global_step": 380941, "epoch": 4589} {"train_loss": -26.474746704101562, "global_step": 380942, "epoch": 4589} {"train_loss": -26.569944381713867, "global_step": 380943, "epoch": 4589} {"train_loss": -26.450653076171875, "global_step": 380944, "epoch": 4589} {"train_loss": -26.171051025390625, "global_step": 380945, "epoch": 4589} {"train_loss": -26.528762817382812, "global_step": 380946, "epoch": 4589} {"train_loss": -26.410919189453125, "global_step": 380947, "epoch": 4589} {"train_loss": -26.163633346557617, "global_step": 380948, "epoch": 4589} {"train_loss": -26.08133316040039, "global_step": 380949, "epoch": 4589} {"train_loss": -26.164691925048828, "global_step": 380950, "epoch": 4589} {"train_loss": -26.10487174987793, "global_step": 380951, "epoch": 4589} {"train_loss": -26.403945922851562, "global_step": 380952, "epoch": 4589} {"train_loss": -26.40015983581543, "global_step": 380953, "epoch": 4589} {"train_loss": -26.645721435546875, "global_step": 380954, "epoch": 4589} {"train_loss": -26.282764434814453, "global_step": 380955, "epoch": 4589} {"train_loss": -26.183563232421875, "global_step": 380956, "epoch": 4589} {"train_loss": -26.398908615112305, "global_step": 380957, "epoch": 4589} {"train_loss": -26.1055965423584, "global_step": 380958, "epoch": 4589} {"train_loss": -26.299413681030273, "global_step": 380959, "epoch": 4589} {"train_loss": -26.323225021362305, "global_step": 380960, "epoch": 4589} {"train_loss": -26.6317081451416, "global_step": 380961, "epoch": 4589} {"train_loss": -26.695697784423828, "global_step": 380962, "epoch": 4589} {"train_loss": -26.479780197143555, "global_step": 380963, "epoch": 4589} {"train_loss": -26.60733985900879, "global_step": 380964, "epoch": 4589} {"train_loss": -26.864282608032227, "global_step": 380965, "epoch": 4589} {"train_loss": -26.604022979736328, "global_step": 380966, "epoch": 4589} {"train_loss": -26.95948600769043, "global_step": 380967, "epoch": 4589} {"train_loss": -26.616107940673828, "global_step": 380968, "epoch": 4589} {"train_loss": -26.360595565244378, "global_step": 380969, "epoch": 4589, "val_loss": 6603288.0} {"train_loss": -26.58670997619629, "global_step": 380970, "epoch": 4590} {"train_loss": -26.499536514282227, "global_step": 380971, "epoch": 4590} {"train_loss": -26.53466796875, "global_step": 380972, "epoch": 4590} {"train_loss": -26.167078018188477, "global_step": 380973, "epoch": 4590} {"train_loss": -26.620193481445312, "global_step": 380974, "epoch": 4590} {"train_loss": -26.425626754760742, "global_step": 380975, "epoch": 4590} {"train_loss": -26.519323348999023, "global_step": 380976, "epoch": 4590} {"train_loss": -26.223337173461914, "global_step": 380977, "epoch": 4590} {"train_loss": -26.246335983276367, "global_step": 380978, "epoch": 4590} {"train_loss": -26.20668601989746, "global_step": 380979, "epoch": 4590} {"train_loss": -26.34619140625, "global_step": 380980, "epoch": 4590} {"train_loss": -26.737035751342773, "global_step": 380981, "epoch": 4590} {"train_loss": -26.494001388549805, "global_step": 380982, "epoch": 4590} {"train_loss": -26.342519760131836, "global_step": 380983, "epoch": 4590} {"train_loss": -26.58992576599121, "global_step": 380984, "epoch": 4590} {"train_loss": -26.5474910736084, "global_step": 380985, "epoch": 4590} {"train_loss": -26.544952392578125, "global_step": 380986, "epoch": 4590} {"train_loss": -26.454099655151367, "global_step": 380987, "epoch": 4590} {"train_loss": -26.640548706054688, "global_step": 380988, "epoch": 4590} {"train_loss": -26.366455078125, "global_step": 380989, "epoch": 4590} {"train_loss": -26.66631507873535, "global_step": 380990, "epoch": 4590} {"train_loss": -26.6097354888916, "global_step": 380991, "epoch": 4590} {"train_loss": -26.354827880859375, "global_step": 380992, "epoch": 4590} {"train_loss": -26.7558650970459, "global_step": 380993, "epoch": 4590} {"train_loss": -26.54743766784668, "global_step": 380994, "epoch": 4590} {"train_loss": -26.53834342956543, "global_step": 380995, "epoch": 4590} {"train_loss": -26.57382583618164, "global_step": 380996, "epoch": 4590} {"train_loss": -26.527128219604492, "global_step": 380997, "epoch": 4590} {"train_loss": -26.6844482421875, "global_step": 380998, "epoch": 4590} {"train_loss": -26.111852645874023, "global_step": 380999, "epoch": 4590} {"train_loss": -26.523839950561523, "global_step": 381000, "epoch": 4590} {"train_loss": -26.585798263549805, "global_step": 381001, "epoch": 4590} {"train_loss": -26.573017120361328, "global_step": 381002, "epoch": 4590} {"train_loss": -26.204809188842773, "global_step": 381003, "epoch": 4590} {"train_loss": -26.38079833984375, "global_step": 381004, "epoch": 4590} {"train_loss": -26.1297607421875, "global_step": 381005, "epoch": 4590} {"train_loss": -25.992664337158203, "global_step": 381006, "epoch": 4590} {"train_loss": -26.433486938476562, "global_step": 381007, "epoch": 4590} {"train_loss": -26.78605079650879, "global_step": 381008, "epoch": 4590} {"train_loss": -26.441970825195312, "global_step": 381009, "epoch": 4590} {"train_loss": -26.796649932861328, "global_step": 381010, "epoch": 4590} {"train_loss": -26.142431259155273, "global_step": 381011, "epoch": 4590} {"train_loss": -26.44256019592285, "global_step": 381012, "epoch": 4590} {"train_loss": -26.400299072265625, "global_step": 381013, "epoch": 4590} {"train_loss": -26.485198974609375, "global_step": 381014, "epoch": 4590} {"train_loss": -26.617431640625, "global_step": 381015, "epoch": 4590} {"train_loss": -26.270898818969727, "global_step": 381016, "epoch": 4590} {"train_loss": -26.620441436767578, "global_step": 381017, "epoch": 4590} {"train_loss": -26.67706298828125, "global_step": 381018, "epoch": 4590} {"train_loss": -26.334857940673828, "global_step": 381019, "epoch": 4590} {"train_loss": -26.682968139648438, "global_step": 381020, "epoch": 4590} {"train_loss": -26.40081787109375, "global_step": 381021, "epoch": 4590} {"train_loss": -26.567312240600586, "global_step": 381022, "epoch": 4590} {"train_loss": -26.236276626586914, "global_step": 381023, "epoch": 4590} {"train_loss": -26.79681396484375, "global_step": 381024, "epoch": 4590} {"train_loss": -26.5955753326416, "global_step": 381025, "epoch": 4590} {"train_loss": -26.588773727416992, "global_step": 381026, "epoch": 4590} {"train_loss": -26.288043975830078, "global_step": 381027, "epoch": 4590} {"train_loss": -26.7970027923584, "global_step": 381028, "epoch": 4590} {"train_loss": -26.54432487487793, "global_step": 381029, "epoch": 4590} {"train_loss": -26.197477340698242, "global_step": 381030, "epoch": 4590} {"train_loss": -26.11212730407715, "global_step": 381031, "epoch": 4590} {"train_loss": -26.253925323486328, "global_step": 381032, "epoch": 4590} {"train_loss": -26.36958885192871, "global_step": 381033, "epoch": 4590} {"train_loss": -26.862287521362305, "global_step": 381034, "epoch": 4590} {"train_loss": -26.85662269592285, "global_step": 381035, "epoch": 4590} {"train_loss": -26.71245765686035, "global_step": 381036, "epoch": 4590} {"train_loss": -26.671249389648438, "global_step": 381037, "epoch": 4590} {"train_loss": -26.904682159423828, "global_step": 381038, "epoch": 4590} {"train_loss": -26.156869888305664, "global_step": 381039, "epoch": 4590} {"train_loss": -26.167097091674805, "global_step": 381040, "epoch": 4590} {"train_loss": -25.730993270874023, "global_step": 381041, "epoch": 4590} {"train_loss": -25.794111251831055, "global_step": 381042, "epoch": 4590} {"train_loss": -25.591955184936523, "global_step": 381043, "epoch": 4590} {"train_loss": -25.682849884033203, "global_step": 381044, "epoch": 4590} {"train_loss": -26.331628799438477, "global_step": 381045, "epoch": 4590} {"train_loss": -26.132587432861328, "global_step": 381046, "epoch": 4590} {"train_loss": -26.10149574279785, "global_step": 381047, "epoch": 4590} {"train_loss": -26.405231475830078, "global_step": 381048, "epoch": 4590} {"train_loss": -26.354883193969727, "global_step": 381049, "epoch": 4590} {"train_loss": -26.0177059173584, "global_step": 381050, "epoch": 4590} {"train_loss": -26.364709854125977, "global_step": 381051, "epoch": 4590} {"train_loss": -26.41275635684829, "global_step": 381052, "epoch": 4590, "val_loss": 6554075.5} {"train_loss": -26.097217559814453, "global_step": 381053, "epoch": 4591} {"train_loss": -25.87873649597168, "global_step": 381054, "epoch": 4591} {"train_loss": -26.137113571166992, "global_step": 381055, "epoch": 4591} {"train_loss": -26.3651065826416, "global_step": 381056, "epoch": 4591} {"train_loss": -25.8959903717041, "global_step": 381057, "epoch": 4591} {"train_loss": -26.058042526245117, "global_step": 381058, "epoch": 4591} {"train_loss": -26.070646286010742, "global_step": 381059, "epoch": 4591} {"train_loss": -26.422948837280273, "global_step": 381060, "epoch": 4591} {"train_loss": -26.37177848815918, "global_step": 381061, "epoch": 4591} {"train_loss": -26.30198097229004, "global_step": 381062, "epoch": 4591} {"train_loss": -26.450469970703125, "global_step": 381063, "epoch": 4591} {"train_loss": -26.33394432067871, "global_step": 381064, "epoch": 4591} {"train_loss": -26.480295181274414, "global_step": 381065, "epoch": 4591} {"train_loss": -26.430356979370117, "global_step": 381066, "epoch": 4591} {"train_loss": -26.545684814453125, "global_step": 381067, "epoch": 4591} {"train_loss": -26.45380210876465, "global_step": 381068, "epoch": 4591} {"train_loss": -26.363325119018555, "global_step": 381069, "epoch": 4591} {"train_loss": -26.530668258666992, "global_step": 381070, "epoch": 4591} {"train_loss": -26.511371612548828, "global_step": 381071, "epoch": 4591} {"train_loss": -26.5332088470459, "global_step": 381072, "epoch": 4591} {"train_loss": -26.384618759155273, "global_step": 381073, "epoch": 4591} {"train_loss": -26.590225219726562, "global_step": 381074, "epoch": 4591} {"train_loss": -26.39983558654785, "global_step": 381075, "epoch": 4591} {"train_loss": -26.02850341796875, "global_step": 381076, "epoch": 4591} {"train_loss": -26.508726119995117, "global_step": 381077, "epoch": 4591} {"train_loss": -26.416980743408203, "global_step": 381078, "epoch": 4591} {"train_loss": -26.542627334594727, "global_step": 381079, "epoch": 4591} {"train_loss": -26.467578887939453, "global_step": 381080, "epoch": 4591} {"train_loss": -26.241046905517578, "global_step": 381081, "epoch": 4591} {"train_loss": -26.588499069213867, "global_step": 381082, "epoch": 4591} {"train_loss": -26.364404678344727, "global_step": 381083, "epoch": 4591} {"train_loss": -26.669906616210938, "global_step": 381084, "epoch": 4591} {"train_loss": -26.570425033569336, "global_step": 381085, "epoch": 4591} {"train_loss": -26.718658447265625, "global_step": 381086, "epoch": 4591} {"train_loss": -26.727426528930664, "global_step": 381087, "epoch": 4591} {"train_loss": -26.238637924194336, "global_step": 381088, "epoch": 4591} {"train_loss": -26.797260284423828, "global_step": 381089, "epoch": 4591} {"train_loss": -26.625675201416016, "global_step": 381090, "epoch": 4591} {"train_loss": -26.620655059814453, "global_step": 381091, "epoch": 4591} {"train_loss": -26.479475021362305, "global_step": 381092, "epoch": 4591} {"train_loss": -26.33660888671875, "global_step": 381093, "epoch": 4591} {"train_loss": -26.36175537109375, "global_step": 381094, "epoch": 4591} {"train_loss": -26.33819007873535, "global_step": 381095, "epoch": 4591} {"train_loss": -26.548599243164062, "global_step": 381096, "epoch": 4591} {"train_loss": -26.7130184173584, "global_step": 381097, "epoch": 4591} {"train_loss": -26.658166885375977, "global_step": 381098, "epoch": 4591} {"train_loss": -26.53791618347168, "global_step": 381099, "epoch": 4591} {"train_loss": -26.425458908081055, "global_step": 381100, "epoch": 4591} {"train_loss": -26.710046768188477, "global_step": 381101, "epoch": 4591} {"train_loss": -26.618040084838867, "global_step": 381102, "epoch": 4591} {"train_loss": -26.488012313842773, "global_step": 381103, "epoch": 4591} {"train_loss": -26.695173263549805, "global_step": 381104, "epoch": 4591} {"train_loss": -26.629796981811523, "global_step": 381105, "epoch": 4591} {"train_loss": -26.965539932250977, "global_step": 381106, "epoch": 4591} {"train_loss": -26.531665802001953, "global_step": 381107, "epoch": 4591} {"train_loss": -26.458959579467773, "global_step": 381108, "epoch": 4591} {"train_loss": -26.61515235900879, "global_step": 381109, "epoch": 4591} {"train_loss": -26.63831901550293, "global_step": 381110, "epoch": 4591} {"train_loss": -26.19099235534668, "global_step": 381111, "epoch": 4591} {"train_loss": -26.4193115234375, "global_step": 381112, "epoch": 4591} {"train_loss": -26.25080680847168, "global_step": 381113, "epoch": 4591} {"train_loss": -26.063007354736328, "global_step": 381114, "epoch": 4591} {"train_loss": -26.54833984375, "global_step": 381115, "epoch": 4591} {"train_loss": -27.01038932800293, "global_step": 381116, "epoch": 4591} {"train_loss": -26.100072860717773, "global_step": 381117, "epoch": 4591} {"train_loss": -26.55047035217285, "global_step": 381118, "epoch": 4591} {"train_loss": -26.4782657623291, "global_step": 381119, "epoch": 4591} {"train_loss": -26.441564559936523, "global_step": 381120, "epoch": 4591} {"train_loss": -26.588064193725586, "global_step": 381121, "epoch": 4591} {"train_loss": -26.205236434936523, "global_step": 381122, "epoch": 4591} {"train_loss": -26.359710693359375, "global_step": 381123, "epoch": 4591} {"train_loss": -26.53348731994629, "global_step": 381124, "epoch": 4591} {"train_loss": -26.562055587768555, "global_step": 381125, "epoch": 4591} {"train_loss": -26.527313232421875, "global_step": 381126, "epoch": 4591} {"train_loss": -26.446319580078125, "global_step": 381127, "epoch": 4591} {"train_loss": -26.432621002197266, "global_step": 381128, "epoch": 4591} {"train_loss": -26.5292911529541, "global_step": 381129, "epoch": 4591} {"train_loss": -26.481861114501953, "global_step": 381130, "epoch": 4591} {"train_loss": -26.571033477783203, "global_step": 381131, "epoch": 4591} {"train_loss": -26.627750396728516, "global_step": 381132, "epoch": 4591} {"train_loss": -26.7110652923584, "global_step": 381133, "epoch": 4591} {"train_loss": -26.568710327148438, "global_step": 381134, "epoch": 4591} {"train_loss": -26.458552854606904, "global_step": 381135, "epoch": 4591, "val_loss": 6651581.0} {"train_loss": -24.956241607666016, "global_step": 381136, "epoch": 4592} {"train_loss": -25.36514663696289, "global_step": 381137, "epoch": 4592} {"train_loss": -25.30830955505371, "global_step": 381138, "epoch": 4592} {"train_loss": -25.650476455688477, "global_step": 381139, "epoch": 4592} {"train_loss": -25.592695236206055, "global_step": 381140, "epoch": 4592} {"train_loss": -25.537038803100586, "global_step": 381141, "epoch": 4592} {"train_loss": -25.215408325195312, "global_step": 381142, "epoch": 4592} {"train_loss": -26.058942794799805, "global_step": 381143, "epoch": 4592} {"train_loss": -25.541616439819336, "global_step": 381144, "epoch": 4592} {"train_loss": -25.738306045532227, "global_step": 381145, "epoch": 4592} {"train_loss": -26.288455963134766, "global_step": 381146, "epoch": 4592} {"train_loss": -25.78266716003418, "global_step": 381147, "epoch": 4592} {"train_loss": -26.11984634399414, "global_step": 381148, "epoch": 4592} {"train_loss": -25.94280433654785, "global_step": 381149, "epoch": 4592} {"train_loss": -26.002573013305664, "global_step": 381150, "epoch": 4592} {"train_loss": -25.73371696472168, "global_step": 381151, "epoch": 4592} {"train_loss": -25.895715713500977, "global_step": 381152, "epoch": 4592} {"train_loss": -26.07477378845215, "global_step": 381153, "epoch": 4592} {"train_loss": -25.86909294128418, "global_step": 381154, "epoch": 4592} {"train_loss": -25.719120025634766, "global_step": 381155, "epoch": 4592} {"train_loss": -25.845413208007812, "global_step": 381156, "epoch": 4592} {"train_loss": -26.106306076049805, "global_step": 381157, "epoch": 4592} {"train_loss": -26.085275650024414, "global_step": 381158, "epoch": 4592} {"train_loss": -25.837499618530273, "global_step": 381159, "epoch": 4592} {"train_loss": -26.380268096923828, "global_step": 381160, "epoch": 4592} {"train_loss": -26.039752960205078, "global_step": 381161, "epoch": 4592} {"train_loss": -26.41753578186035, "global_step": 381162, "epoch": 4592} {"train_loss": -26.13722038269043, "global_step": 381163, "epoch": 4592} {"train_loss": -26.302030563354492, "global_step": 381164, "epoch": 4592} {"train_loss": -26.215717315673828, "global_step": 381165, "epoch": 4592} {"train_loss": -25.954065322875977, "global_step": 381166, "epoch": 4592} {"train_loss": -26.305042266845703, "global_step": 381167, "epoch": 4592} {"train_loss": -26.1297607421875, "global_step": 381168, "epoch": 4592} {"train_loss": -26.290119171142578, "global_step": 381169, "epoch": 4592} {"train_loss": -26.455541610717773, "global_step": 381170, "epoch": 4592} {"train_loss": -26.42996597290039, "global_step": 381171, "epoch": 4592} {"train_loss": -26.52288246154785, "global_step": 381172, "epoch": 4592} {"train_loss": -26.114776611328125, "global_step": 381173, "epoch": 4592} {"train_loss": -26.841272354125977, "global_step": 381174, "epoch": 4592} {"train_loss": -26.291189193725586, "global_step": 381175, "epoch": 4592} {"train_loss": -26.486984252929688, "global_step": 381176, "epoch": 4592} {"train_loss": -26.4833984375, "global_step": 381177, "epoch": 4592} {"train_loss": -26.1953182220459, "global_step": 381178, "epoch": 4592} {"train_loss": -26.51468849182129, "global_step": 381179, "epoch": 4592} {"train_loss": -26.350894927978516, "global_step": 381180, "epoch": 4592} {"train_loss": -27.125690460205078, "global_step": 381181, "epoch": 4592} {"train_loss": -26.732452392578125, "global_step": 381182, "epoch": 4592} {"train_loss": -26.79632568359375, "global_step": 381183, "epoch": 4592} {"train_loss": -26.58576011657715, "global_step": 381184, "epoch": 4592} {"train_loss": -26.720291137695312, "global_step": 381185, "epoch": 4592} {"train_loss": -26.41993522644043, "global_step": 381186, "epoch": 4592} {"train_loss": -26.724380493164062, "global_step": 381187, "epoch": 4592} {"train_loss": -26.293842315673828, "global_step": 381188, "epoch": 4592} {"train_loss": -26.558670043945312, "global_step": 381189, "epoch": 4592} {"train_loss": -26.5004940032959, "global_step": 381190, "epoch": 4592} {"train_loss": -26.900426864624023, "global_step": 381191, "epoch": 4592} {"train_loss": -26.731964111328125, "global_step": 381192, "epoch": 4592} {"train_loss": -26.21881103515625, "global_step": 381193, "epoch": 4592} {"train_loss": -26.308521270751953, "global_step": 381194, "epoch": 4592} {"train_loss": -26.65044593811035, "global_step": 381195, "epoch": 4592} {"train_loss": -26.519926071166992, "global_step": 381196, "epoch": 4592} {"train_loss": -26.662704467773438, "global_step": 381197, "epoch": 4592} {"train_loss": -26.325490951538086, "global_step": 381198, "epoch": 4592} {"train_loss": -26.2750244140625, "global_step": 381199, "epoch": 4592} {"train_loss": -26.581192016601562, "global_step": 381200, "epoch": 4592} {"train_loss": -26.2830867767334, "global_step": 381201, "epoch": 4592} {"train_loss": -26.544015884399414, "global_step": 381202, "epoch": 4592} {"train_loss": -26.69715690612793, "global_step": 381203, "epoch": 4592} {"train_loss": -26.597402572631836, "global_step": 381204, "epoch": 4592} {"train_loss": -26.497684478759766, "global_step": 381205, "epoch": 4592} {"train_loss": -25.615142822265625, "global_step": 381206, "epoch": 4592} {"train_loss": -25.021146774291992, "global_step": 381207, "epoch": 4592} {"train_loss": -25.890533447265625, "global_step": 381208, "epoch": 4592} {"train_loss": -25.912738800048828, "global_step": 381209, "epoch": 4592} {"train_loss": -25.55029296875, "global_step": 381210, "epoch": 4592} {"train_loss": -26.1084041595459, "global_step": 381211, "epoch": 4592} {"train_loss": -25.841114044189453, "global_step": 381212, "epoch": 4592} {"train_loss": -25.645654678344727, "global_step": 381213, "epoch": 4592} {"train_loss": -26.05902671813965, "global_step": 381214, "epoch": 4592} {"train_loss": -25.854751586914062, "global_step": 381215, "epoch": 4592} {"train_loss": -26.09991455078125, "global_step": 381216, "epoch": 4592} {"train_loss": -26.40138053894043, "global_step": 381217, "epoch": 4592} {"train_loss": -26.180682722344457, "global_step": 381218, "epoch": 4592, "val_loss": 6528860.0} {"train_loss": -25.928424835205078, "global_step": 381219, "epoch": 4593} {"train_loss": -26.224775314331055, "global_step": 381220, "epoch": 4593} {"train_loss": -25.836090087890625, "global_step": 381221, "epoch": 4593} {"train_loss": -26.00113296508789, "global_step": 381222, "epoch": 4593} {"train_loss": -25.9158935546875, "global_step": 381223, "epoch": 4593} {"train_loss": -26.14353370666504, "global_step": 381224, "epoch": 4593} {"train_loss": -26.20574378967285, "global_step": 381225, "epoch": 4593} {"train_loss": -25.636981964111328, "global_step": 381226, "epoch": 4593} {"train_loss": -26.29532814025879, "global_step": 381227, "epoch": 4593} {"train_loss": -26.211261749267578, "global_step": 381228, "epoch": 4593} {"train_loss": -25.99301528930664, "global_step": 381229, "epoch": 4593} {"train_loss": -26.162504196166992, "global_step": 381230, "epoch": 4593} {"train_loss": -26.129743576049805, "global_step": 381231, "epoch": 4593} {"train_loss": -26.05744743347168, "global_step": 381232, "epoch": 4593} {"train_loss": -26.054859161376953, "global_step": 381233, "epoch": 4593} {"train_loss": -26.394861221313477, "global_step": 381234, "epoch": 4593} {"train_loss": -26.229175567626953, "global_step": 381235, "epoch": 4593} {"train_loss": -26.210468292236328, "global_step": 381236, "epoch": 4593} {"train_loss": -26.134479522705078, "global_step": 381237, "epoch": 4593} {"train_loss": -26.2066650390625, "global_step": 381238, "epoch": 4593} {"train_loss": -26.663305282592773, "global_step": 381239, "epoch": 4593} {"train_loss": -26.338998794555664, "global_step": 381240, "epoch": 4593} {"train_loss": -26.079925537109375, "global_step": 381241, "epoch": 4593} {"train_loss": -26.632909774780273, "global_step": 381242, "epoch": 4593} {"train_loss": -26.214231491088867, "global_step": 381243, "epoch": 4593} {"train_loss": -26.030099868774414, "global_step": 381244, "epoch": 4593} {"train_loss": -26.298282623291016, "global_step": 381245, "epoch": 4593} {"train_loss": -26.34893798828125, "global_step": 381246, "epoch": 4593} {"train_loss": -26.556598663330078, "global_step": 381247, "epoch": 4593} {"train_loss": -26.352264404296875, "global_step": 381248, "epoch": 4593} {"train_loss": -26.144641876220703, "global_step": 381249, "epoch": 4593} {"train_loss": -26.100799560546875, "global_step": 381250, "epoch": 4593} {"train_loss": -26.26801109313965, "global_step": 381251, "epoch": 4593} {"train_loss": -26.32606315612793, "global_step": 381252, "epoch": 4593} {"train_loss": -26.058103561401367, "global_step": 381253, "epoch": 4593} {"train_loss": -26.286909103393555, "global_step": 381254, "epoch": 4593} {"train_loss": -26.582290649414062, "global_step": 381255, "epoch": 4593} {"train_loss": -26.523773193359375, "global_step": 381256, "epoch": 4593} {"train_loss": -26.15030860900879, "global_step": 381257, "epoch": 4593} {"train_loss": -26.626453399658203, "global_step": 381258, "epoch": 4593} {"train_loss": -26.38360023498535, "global_step": 381259, "epoch": 4593} {"train_loss": -26.62360191345215, "global_step": 381260, "epoch": 4593} {"train_loss": -26.20119285583496, "global_step": 381261, "epoch": 4593} {"train_loss": -26.7109375, "global_step": 381262, "epoch": 4593} {"train_loss": -26.375471115112305, "global_step": 381263, "epoch": 4593} {"train_loss": -26.507980346679688, "global_step": 381264, "epoch": 4593} {"train_loss": -26.32514762878418, "global_step": 381265, "epoch": 4593} {"train_loss": -26.694015502929688, "global_step": 381266, "epoch": 4593} {"train_loss": -26.577497482299805, "global_step": 381267, "epoch": 4593} {"train_loss": -26.201520919799805, "global_step": 381268, "epoch": 4593} {"train_loss": -27.018091201782227, "global_step": 381269, "epoch": 4593} {"train_loss": -26.633386611938477, "global_step": 381270, "epoch": 4593} {"train_loss": -26.582563400268555, "global_step": 381271, "epoch": 4593} {"train_loss": -26.25520896911621, "global_step": 381272, "epoch": 4593} {"train_loss": -26.8522891998291, "global_step": 381273, "epoch": 4593} {"train_loss": -26.703744888305664, "global_step": 381274, "epoch": 4593} {"train_loss": -26.34234046936035, "global_step": 381275, "epoch": 4593} {"train_loss": -26.383359909057617, "global_step": 381276, "epoch": 4593} {"train_loss": -26.22003173828125, "global_step": 381277, "epoch": 4593} {"train_loss": -26.675195693969727, "global_step": 381278, "epoch": 4593} {"train_loss": -26.382415771484375, "global_step": 381279, "epoch": 4593} {"train_loss": -26.55120849609375, "global_step": 381280, "epoch": 4593} {"train_loss": -26.062726974487305, "global_step": 381281, "epoch": 4593} {"train_loss": -26.489294052124023, "global_step": 381282, "epoch": 4593} {"train_loss": -26.854034423828125, "global_step": 381283, "epoch": 4593} {"train_loss": -26.522180557250977, "global_step": 381284, "epoch": 4593} {"train_loss": -26.259374618530273, "global_step": 381285, "epoch": 4593} {"train_loss": -26.395263671875, "global_step": 381286, "epoch": 4593} {"train_loss": -26.36333656311035, "global_step": 381287, "epoch": 4593} {"train_loss": -26.333616256713867, "global_step": 381288, "epoch": 4593} {"train_loss": -26.338825225830078, "global_step": 381289, "epoch": 4593} {"train_loss": -26.321012496948242, "global_step": 381290, "epoch": 4593} {"train_loss": -26.615631103515625, "global_step": 381291, "epoch": 4593} {"train_loss": -26.480823516845703, "global_step": 381292, "epoch": 4593} {"train_loss": -26.3259220123291, "global_step": 381293, "epoch": 4593} {"train_loss": -26.488651275634766, "global_step": 381294, "epoch": 4593} {"train_loss": -26.697189331054688, "global_step": 381295, "epoch": 4593} {"train_loss": -26.27699089050293, "global_step": 381296, "epoch": 4593} {"train_loss": -26.573047637939453, "global_step": 381297, "epoch": 4593} {"train_loss": -26.403676986694336, "global_step": 381298, "epoch": 4593} {"train_loss": -26.6209774017334, "global_step": 381299, "epoch": 4593} {"train_loss": -26.348175048828125, "global_step": 381300, "epoch": 4593} {"train_loss": -26.35425349315965, "global_step": 381301, "epoch": 4593, "val_loss": 6547774.0} {"train_loss": -25.162736892700195, "global_step": 381302, "epoch": 4594} {"train_loss": -25.315340042114258, "global_step": 381303, "epoch": 4594} {"train_loss": -26.161916732788086, "global_step": 381304, "epoch": 4594} {"train_loss": -25.95233154296875, "global_step": 381305, "epoch": 4594} {"train_loss": -25.8690242767334, "global_step": 381306, "epoch": 4594} {"train_loss": -25.797582626342773, "global_step": 381307, "epoch": 4594} {"train_loss": -26.20534324645996, "global_step": 381308, "epoch": 4594} {"train_loss": -25.842975616455078, "global_step": 381309, "epoch": 4594} {"train_loss": -26.327320098876953, "global_step": 381310, "epoch": 4594} {"train_loss": -26.253833770751953, "global_step": 381311, "epoch": 4594} {"train_loss": -26.123275756835938, "global_step": 381312, "epoch": 4594} {"train_loss": -26.63214111328125, "global_step": 381313, "epoch": 4594} {"train_loss": -25.671606063842773, "global_step": 381314, "epoch": 4594} {"train_loss": -26.30506706237793, "global_step": 381315, "epoch": 4594} {"train_loss": -26.10772705078125, "global_step": 381316, "epoch": 4594} {"train_loss": -26.300460815429688, "global_step": 381317, "epoch": 4594} {"train_loss": -26.51739501953125, "global_step": 381318, "epoch": 4594} {"train_loss": -26.410572052001953, "global_step": 381319, "epoch": 4594} {"train_loss": -26.617279052734375, "global_step": 381320, "epoch": 4594} {"train_loss": -26.26959800720215, "global_step": 381321, "epoch": 4594} {"train_loss": -26.286767959594727, "global_step": 381322, "epoch": 4594} {"train_loss": -26.262771606445312, "global_step": 381323, "epoch": 4594} {"train_loss": -26.217687606811523, "global_step": 381324, "epoch": 4594} {"train_loss": -26.600101470947266, "global_step": 381325, "epoch": 4594} {"train_loss": -26.444660186767578, "global_step": 381326, "epoch": 4594} {"train_loss": -26.254125595092773, "global_step": 381327, "epoch": 4594} {"train_loss": -26.51723289489746, "global_step": 381328, "epoch": 4594} {"train_loss": -26.52256202697754, "global_step": 381329, "epoch": 4594} {"train_loss": -26.306684494018555, "global_step": 381330, "epoch": 4594} {"train_loss": -26.644208908081055, "global_step": 381331, "epoch": 4594} {"train_loss": -26.216611862182617, "global_step": 381332, "epoch": 4594} {"train_loss": -26.48395347595215, "global_step": 381333, "epoch": 4594} {"train_loss": -26.486637115478516, "global_step": 381334, "epoch": 4594} {"train_loss": -26.515365600585938, "global_step": 381335, "epoch": 4594} {"train_loss": -26.354095458984375, "global_step": 381336, "epoch": 4594} {"train_loss": -26.460668563842773, "global_step": 381337, "epoch": 4594} {"train_loss": -25.98833656311035, "global_step": 381338, "epoch": 4594} {"train_loss": -26.5839786529541, "global_step": 381339, "epoch": 4594} {"train_loss": -26.154499053955078, "global_step": 381340, "epoch": 4594} {"train_loss": -26.751453399658203, "global_step": 381341, "epoch": 4594} {"train_loss": -26.62558937072754, "global_step": 381342, "epoch": 4594} {"train_loss": -26.69171142578125, "global_step": 381343, "epoch": 4594} {"train_loss": -26.3323917388916, "global_step": 381344, "epoch": 4594} {"train_loss": -26.769132614135742, "global_step": 381345, "epoch": 4594} {"train_loss": -26.5794734954834, "global_step": 381346, "epoch": 4594} {"train_loss": -26.448034286499023, "global_step": 381347, "epoch": 4594} {"train_loss": -26.65960121154785, "global_step": 381348, "epoch": 4594} {"train_loss": -26.54473304748535, "global_step": 381349, "epoch": 4594} {"train_loss": -26.68755531311035, "global_step": 381350, "epoch": 4594} {"train_loss": -26.58784294128418, "global_step": 381351, "epoch": 4594} {"train_loss": -26.620941162109375, "global_step": 381352, "epoch": 4594} {"train_loss": -26.396596908569336, "global_step": 381353, "epoch": 4594} {"train_loss": -26.318395614624023, "global_step": 381354, "epoch": 4594} {"train_loss": -26.737592697143555, "global_step": 381355, "epoch": 4594} {"train_loss": -26.646650314331055, "global_step": 381356, "epoch": 4594} {"train_loss": -26.503049850463867, "global_step": 381357, "epoch": 4594} {"train_loss": -26.4979190826416, "global_step": 381358, "epoch": 4594} {"train_loss": -26.133275985717773, "global_step": 381359, "epoch": 4594} {"train_loss": -26.4649715423584, "global_step": 381360, "epoch": 4594} {"train_loss": -25.583675384521484, "global_step": 381361, "epoch": 4594} {"train_loss": -25.660242080688477, "global_step": 381362, "epoch": 4594} {"train_loss": -25.83307456970215, "global_step": 381363, "epoch": 4594} {"train_loss": -25.74152183532715, "global_step": 381364, "epoch": 4594} {"train_loss": -26.50439453125, "global_step": 381365, "epoch": 4594} {"train_loss": -26.357877731323242, "global_step": 381366, "epoch": 4594} {"train_loss": -26.05323600769043, "global_step": 381367, "epoch": 4594} {"train_loss": -26.206457138061523, "global_step": 381368, "epoch": 4594} {"train_loss": -26.39275550842285, "global_step": 381369, "epoch": 4594} {"train_loss": -26.34821128845215, "global_step": 381370, "epoch": 4594} {"train_loss": -26.29764175415039, "global_step": 381371, "epoch": 4594} {"train_loss": -26.24917984008789, "global_step": 381372, "epoch": 4594} {"train_loss": -26.1517276763916, "global_step": 381373, "epoch": 4594} {"train_loss": -26.72625732421875, "global_step": 381374, "epoch": 4594} {"train_loss": -26.014219284057617, "global_step": 381375, "epoch": 4594} {"train_loss": -26.39681053161621, "global_step": 381376, "epoch": 4594} {"train_loss": -26.47443962097168, "global_step": 381377, "epoch": 4594} {"train_loss": -26.149206161499023, "global_step": 381378, "epoch": 4594} {"train_loss": -26.445531845092773, "global_step": 381379, "epoch": 4594} {"train_loss": -26.151620864868164, "global_step": 381380, "epoch": 4594} {"train_loss": -26.542306900024414, "global_step": 381381, "epoch": 4594} {"train_loss": -26.54282569885254, "global_step": 381382, "epoch": 4594} {"train_loss": -25.90064811706543, "global_step": 381383, "epoch": 4594} {"train_loss": -26.324256046708808, "global_step": 381384, "epoch": 4594, "val_loss": 6573893.0} {"train_loss": -25.316125869750977, "global_step": 381385, "epoch": 4595} {"train_loss": -24.864212036132812, "global_step": 381386, "epoch": 4595} {"train_loss": -26.113265991210938, "global_step": 381387, "epoch": 4595} {"train_loss": -25.685651779174805, "global_step": 381388, "epoch": 4595} {"train_loss": -26.058292388916016, "global_step": 381389, "epoch": 4595} {"train_loss": -25.68305778503418, "global_step": 381390, "epoch": 4595} {"train_loss": -25.836469650268555, "global_step": 381391, "epoch": 4595} {"train_loss": -26.103551864624023, "global_step": 381392, "epoch": 4595} {"train_loss": -25.91117286682129, "global_step": 381393, "epoch": 4595} {"train_loss": -26.529150009155273, "global_step": 381394, "epoch": 4595} {"train_loss": -25.88102149963379, "global_step": 381395, "epoch": 4595} {"train_loss": -26.4459285736084, "global_step": 381396, "epoch": 4595} {"train_loss": -25.91162109375, "global_step": 381397, "epoch": 4595} {"train_loss": -26.17152214050293, "global_step": 381398, "epoch": 4595} {"train_loss": -26.085346221923828, "global_step": 381399, "epoch": 4595} {"train_loss": -26.1567440032959, "global_step": 381400, "epoch": 4595} {"train_loss": -26.267053604125977, "global_step": 381401, "epoch": 4595} {"train_loss": -25.95355796813965, "global_step": 381402, "epoch": 4595} {"train_loss": -25.916122436523438, "global_step": 381403, "epoch": 4595} {"train_loss": -26.16827964782715, "global_step": 381404, "epoch": 4595} {"train_loss": -26.327672958374023, "global_step": 381405, "epoch": 4595} {"train_loss": -26.400314331054688, "global_step": 381406, "epoch": 4595} {"train_loss": -26.518909454345703, "global_step": 381407, "epoch": 4595} {"train_loss": -26.480268478393555, "global_step": 381408, "epoch": 4595} {"train_loss": -26.440393447875977, "global_step": 381409, "epoch": 4595} {"train_loss": -26.509185791015625, "global_step": 381410, "epoch": 4595} {"train_loss": -26.73345947265625, "global_step": 381411, "epoch": 4595} {"train_loss": -26.473630905151367, "global_step": 381412, "epoch": 4595} {"train_loss": -26.85393714904785, "global_step": 381413, "epoch": 4595} {"train_loss": -26.585926055908203, "global_step": 381414, "epoch": 4595} {"train_loss": -26.466236114501953, "global_step": 381415, "epoch": 4595} {"train_loss": -26.618497848510742, "global_step": 381416, "epoch": 4595} {"train_loss": -26.652368545532227, "global_step": 381417, "epoch": 4595} {"train_loss": -26.19880485534668, "global_step": 381418, "epoch": 4595} {"train_loss": -26.3372745513916, "global_step": 381419, "epoch": 4595} {"train_loss": -26.16251564025879, "global_step": 381420, "epoch": 4595} {"train_loss": -26.714435577392578, "global_step": 381421, "epoch": 4595} {"train_loss": -26.72181510925293, "global_step": 381422, "epoch": 4595} {"train_loss": -26.354907989501953, "global_step": 381423, "epoch": 4595} {"train_loss": -26.61849021911621, "global_step": 381424, "epoch": 4595} {"train_loss": -26.417402267456055, "global_step": 381425, "epoch": 4595} {"train_loss": -26.671850204467773, "global_step": 381426, "epoch": 4595} {"train_loss": -26.8088436126709, "global_step": 381427, "epoch": 4595} {"train_loss": -26.44231605529785, "global_step": 381428, "epoch": 4595} {"train_loss": -26.897857666015625, "global_step": 381429, "epoch": 4595} {"train_loss": -26.66676902770996, "global_step": 381430, "epoch": 4595} {"train_loss": -26.683624267578125, "global_step": 381431, "epoch": 4595} {"train_loss": -26.7490177154541, "global_step": 381432, "epoch": 4595} {"train_loss": -26.8699893951416, "global_step": 381433, "epoch": 4595} {"train_loss": -26.748172760009766, "global_step": 381434, "epoch": 4595} {"train_loss": -26.845136642456055, "global_step": 381435, "epoch": 4595} {"train_loss": -26.590356826782227, "global_step": 381436, "epoch": 4595} {"train_loss": -26.31556510925293, "global_step": 381437, "epoch": 4595} {"train_loss": -27.127704620361328, "global_step": 381438, "epoch": 4595} {"train_loss": -26.57685661315918, "global_step": 381439, "epoch": 4595} {"train_loss": -26.557828903198242, "global_step": 381440, "epoch": 4595} {"train_loss": -26.621877670288086, "global_step": 381441, "epoch": 4595} {"train_loss": -26.730976104736328, "global_step": 381442, "epoch": 4595} {"train_loss": -26.611331939697266, "global_step": 381443, "epoch": 4595} {"train_loss": -26.34442138671875, "global_step": 381444, "epoch": 4595} {"train_loss": -26.442737579345703, "global_step": 381445, "epoch": 4595} {"train_loss": -25.570484161376953, "global_step": 381446, "epoch": 4595} {"train_loss": -24.82967758178711, "global_step": 381447, "epoch": 4595} {"train_loss": -24.31852149963379, "global_step": 381448, "epoch": 4595} {"train_loss": -25.03482437133789, "global_step": 381449, "epoch": 4595} {"train_loss": -26.019012451171875, "global_step": 381450, "epoch": 4595} {"train_loss": -25.534509658813477, "global_step": 381451, "epoch": 4595} {"train_loss": -25.268692016601562, "global_step": 381452, "epoch": 4595} {"train_loss": -25.819807052612305, "global_step": 381453, "epoch": 4595} {"train_loss": -25.795434951782227, "global_step": 381454, "epoch": 4595} {"train_loss": -26.093252182006836, "global_step": 381455, "epoch": 4595} {"train_loss": -25.269067764282227, "global_step": 381456, "epoch": 4595} {"train_loss": -26.224811553955078, "global_step": 381457, "epoch": 4595} {"train_loss": -25.9843692779541, "global_step": 381458, "epoch": 4595} {"train_loss": -25.86090087890625, "global_step": 381459, "epoch": 4595} {"train_loss": -26.181543350219727, "global_step": 381460, "epoch": 4595} {"train_loss": -26.31646156311035, "global_step": 381461, "epoch": 4595} {"train_loss": -26.01523208618164, "global_step": 381462, "epoch": 4595} {"train_loss": -25.898544311523438, "global_step": 381463, "epoch": 4595} {"train_loss": -26.340322494506836, "global_step": 381464, "epoch": 4595} {"train_loss": -26.40870475769043, "global_step": 381465, "epoch": 4595} {"train_loss": -26.269006729125977, "global_step": 381466, "epoch": 4595} {"train_loss": -26.208465599151978, "global_step": 381467, "epoch": 4595, "val_loss": 6581811.0} {"train_loss": -26.09775161743164, "global_step": 381468, "epoch": 4596} {"train_loss": -25.81195068359375, "global_step": 381469, "epoch": 4596} {"train_loss": -25.61101722717285, "global_step": 381470, "epoch": 4596} {"train_loss": -25.84480094909668, "global_step": 381471, "epoch": 4596} {"train_loss": -25.70560073852539, "global_step": 381472, "epoch": 4596} {"train_loss": -26.606958389282227, "global_step": 381473, "epoch": 4596} {"train_loss": -26.1759090423584, "global_step": 381474, "epoch": 4596} {"train_loss": -26.281721115112305, "global_step": 381475, "epoch": 4596} {"train_loss": -26.17656898498535, "global_step": 381476, "epoch": 4596} {"train_loss": -26.06496238708496, "global_step": 381477, "epoch": 4596} {"train_loss": -26.14725685119629, "global_step": 381478, "epoch": 4596} {"train_loss": -26.251758575439453, "global_step": 381479, "epoch": 4596} {"train_loss": -26.3697509765625, "global_step": 381480, "epoch": 4596} {"train_loss": -26.179702758789062, "global_step": 381481, "epoch": 4596} {"train_loss": -26.40619468688965, "global_step": 381482, "epoch": 4596} {"train_loss": -25.931365966796875, "global_step": 381483, "epoch": 4596} {"train_loss": -26.616138458251953, "global_step": 381484, "epoch": 4596} {"train_loss": -26.439496994018555, "global_step": 381485, "epoch": 4596} {"train_loss": -26.571298599243164, "global_step": 381486, "epoch": 4596} {"train_loss": -26.15089225769043, "global_step": 381487, "epoch": 4596} {"train_loss": -26.234100341796875, "global_step": 381488, "epoch": 4596} {"train_loss": -26.03339195251465, "global_step": 381489, "epoch": 4596} {"train_loss": -26.338592529296875, "global_step": 381490, "epoch": 4596} {"train_loss": -26.2689266204834, "global_step": 381491, "epoch": 4596} {"train_loss": -26.221349716186523, "global_step": 381492, "epoch": 4596} {"train_loss": -26.249067306518555, "global_step": 381493, "epoch": 4596} {"train_loss": -26.2992000579834, "global_step": 381494, "epoch": 4596} {"train_loss": -26.718358993530273, "global_step": 381495, "epoch": 4596} {"train_loss": -26.088544845581055, "global_step": 381496, "epoch": 4596} {"train_loss": -26.76020622253418, "global_step": 381497, "epoch": 4596} {"train_loss": -26.445127487182617, "global_step": 381498, "epoch": 4596} {"train_loss": -26.740060806274414, "global_step": 381499, "epoch": 4596} {"train_loss": -26.589155197143555, "global_step": 381500, "epoch": 4596} {"train_loss": -26.42927360534668, "global_step": 381501, "epoch": 4596} {"train_loss": -26.353620529174805, "global_step": 381502, "epoch": 4596} {"train_loss": -26.458913803100586, "global_step": 381503, "epoch": 4596} {"train_loss": -26.503726959228516, "global_step": 381504, "epoch": 4596} {"train_loss": -26.740955352783203, "global_step": 381505, "epoch": 4596} {"train_loss": -26.343793869018555, "global_step": 381506, "epoch": 4596} {"train_loss": -26.875244140625, "global_step": 381507, "epoch": 4596} {"train_loss": -26.27703285217285, "global_step": 381508, "epoch": 4596} {"train_loss": -26.845251083374023, "global_step": 381509, "epoch": 4596} {"train_loss": -26.4069881439209, "global_step": 381510, "epoch": 4596} {"train_loss": -26.377233505249023, "global_step": 381511, "epoch": 4596} {"train_loss": -26.178009033203125, "global_step": 381512, "epoch": 4596} {"train_loss": -26.32805824279785, "global_step": 381513, "epoch": 4596} {"train_loss": -26.432209014892578, "global_step": 381514, "epoch": 4596} {"train_loss": -26.922454833984375, "global_step": 381515, "epoch": 4596} {"train_loss": -26.757429122924805, "global_step": 381516, "epoch": 4596} {"train_loss": -26.71607780456543, "global_step": 381517, "epoch": 4596} {"train_loss": -26.248743057250977, "global_step": 381518, "epoch": 4596} {"train_loss": -26.640100479125977, "global_step": 381519, "epoch": 4596} {"train_loss": -26.292041778564453, "global_step": 381520, "epoch": 4596} {"train_loss": -26.842838287353516, "global_step": 381521, "epoch": 4596} {"train_loss": -26.185199737548828, "global_step": 381522, "epoch": 4596} {"train_loss": -26.03822135925293, "global_step": 381523, "epoch": 4596} {"train_loss": -25.878164291381836, "global_step": 381524, "epoch": 4596} {"train_loss": -25.13681983947754, "global_step": 381525, "epoch": 4596} {"train_loss": -25.53057861328125, "global_step": 381526, "epoch": 4596} {"train_loss": -26.168893814086914, "global_step": 381527, "epoch": 4596} {"train_loss": -26.503616333007812, "global_step": 381528, "epoch": 4596} {"train_loss": -25.87542152404785, "global_step": 381529, "epoch": 4596} {"train_loss": -26.320234298706055, "global_step": 381530, "epoch": 4596} {"train_loss": -26.834278106689453, "global_step": 381531, "epoch": 4596} {"train_loss": -26.256591796875, "global_step": 381532, "epoch": 4596} {"train_loss": -26.399627685546875, "global_step": 381533, "epoch": 4596} {"train_loss": -26.287738800048828, "global_step": 381534, "epoch": 4596} {"train_loss": -26.433263778686523, "global_step": 381535, "epoch": 4596} {"train_loss": -26.393728256225586, "global_step": 381536, "epoch": 4596} {"train_loss": -26.9075984954834, "global_step": 381537, "epoch": 4596} {"train_loss": -26.34099769592285, "global_step": 381538, "epoch": 4596} {"train_loss": -26.69071388244629, "global_step": 381539, "epoch": 4596} {"train_loss": -26.477563858032227, "global_step": 381540, "epoch": 4596} {"train_loss": -26.53021240234375, "global_step": 381541, "epoch": 4596} {"train_loss": -26.231428146362305, "global_step": 381542, "epoch": 4596} {"train_loss": -26.395313262939453, "global_step": 381543, "epoch": 4596} {"train_loss": -26.475427627563477, "global_step": 381544, "epoch": 4596} {"train_loss": -26.723358154296875, "global_step": 381545, "epoch": 4596} {"train_loss": -26.521957397460938, "global_step": 381546, "epoch": 4596} {"train_loss": -26.601964950561523, "global_step": 381547, "epoch": 4596} {"train_loss": -26.316604614257812, "global_step": 381548, "epoch": 4596} {"train_loss": -26.819076538085938, "global_step": 381549, "epoch": 4596} {"train_loss": -26.348377825265906, "global_step": 381550, "epoch": 4596, "val_loss": 6502724.5} {"train_loss": -25.54286003112793, "global_step": 381551, "epoch": 4597} {"train_loss": -26.31332778930664, "global_step": 381552, "epoch": 4597} {"train_loss": -26.066015243530273, "global_step": 381553, "epoch": 4597} {"train_loss": -25.787628173828125, "global_step": 381554, "epoch": 4597} {"train_loss": -25.661483764648438, "global_step": 381555, "epoch": 4597} {"train_loss": -26.208984375, "global_step": 381556, "epoch": 4597} {"train_loss": -25.801923751831055, "global_step": 381557, "epoch": 4597} {"train_loss": -25.920377731323242, "global_step": 381558, "epoch": 4597} {"train_loss": -26.53181266784668, "global_step": 381559, "epoch": 4597} {"train_loss": -26.29804801940918, "global_step": 381560, "epoch": 4597} {"train_loss": -26.361621856689453, "global_step": 381561, "epoch": 4597} {"train_loss": -26.065759658813477, "global_step": 381562, "epoch": 4597} {"train_loss": -26.514236450195312, "global_step": 381563, "epoch": 4597} {"train_loss": -26.143299102783203, "global_step": 381564, "epoch": 4597} {"train_loss": -26.459259033203125, "global_step": 381565, "epoch": 4597} {"train_loss": -26.31133460998535, "global_step": 381566, "epoch": 4597} {"train_loss": -26.285247802734375, "global_step": 381567, "epoch": 4597} {"train_loss": -26.287139892578125, "global_step": 381568, "epoch": 4597} {"train_loss": -26.177724838256836, "global_step": 381569, "epoch": 4597} {"train_loss": -26.33001136779785, "global_step": 381570, "epoch": 4597} {"train_loss": -26.4517822265625, "global_step": 381571, "epoch": 4597} {"train_loss": -26.674793243408203, "global_step": 381572, "epoch": 4597} {"train_loss": -26.60712242126465, "global_step": 381573, "epoch": 4597} {"train_loss": -26.2263126373291, "global_step": 381574, "epoch": 4597} {"train_loss": -26.616134643554688, "global_step": 381575, "epoch": 4597} {"train_loss": -26.656757354736328, "global_step": 381576, "epoch": 4597} {"train_loss": -26.70438575744629, "global_step": 381577, "epoch": 4597} {"train_loss": -26.54682731628418, "global_step": 381578, "epoch": 4597} {"train_loss": -26.551471710205078, "global_step": 381579, "epoch": 4597} {"train_loss": -26.409778594970703, "global_step": 381580, "epoch": 4597} {"train_loss": -26.378360748291016, "global_step": 381581, "epoch": 4597} {"train_loss": -26.4276065826416, "global_step": 381582, "epoch": 4597} {"train_loss": -26.534814834594727, "global_step": 381583, "epoch": 4597} {"train_loss": -26.348651885986328, "global_step": 381584, "epoch": 4597} {"train_loss": -26.577350616455078, "global_step": 381585, "epoch": 4597} {"train_loss": -26.503204345703125, "global_step": 381586, "epoch": 4597} {"train_loss": -26.210203170776367, "global_step": 381587, "epoch": 4597} {"train_loss": -26.12455177307129, "global_step": 381588, "epoch": 4597} {"train_loss": -26.264938354492188, "global_step": 381589, "epoch": 4597} {"train_loss": -26.696348190307617, "global_step": 381590, "epoch": 4597} {"train_loss": -26.441959381103516, "global_step": 381591, "epoch": 4597} {"train_loss": -26.571802139282227, "global_step": 381592, "epoch": 4597} {"train_loss": -26.69862937927246, "global_step": 381593, "epoch": 4597} {"train_loss": -26.524463653564453, "global_step": 381594, "epoch": 4597} {"train_loss": -26.26288414001465, "global_step": 381595, "epoch": 4597} {"train_loss": -26.36978530883789, "global_step": 381596, "epoch": 4597} {"train_loss": -26.40448570251465, "global_step": 381597, "epoch": 4597} {"train_loss": -26.346708297729492, "global_step": 381598, "epoch": 4597} {"train_loss": -26.338666915893555, "global_step": 381599, "epoch": 4597} {"train_loss": -26.67999267578125, "global_step": 381600, "epoch": 4597} {"train_loss": -26.604650497436523, "global_step": 381601, "epoch": 4597} {"train_loss": -26.59783363342285, "global_step": 381602, "epoch": 4597} {"train_loss": -26.520065307617188, "global_step": 381603, "epoch": 4597} {"train_loss": -26.680017471313477, "global_step": 381604, "epoch": 4597} {"train_loss": -26.475341796875, "global_step": 381605, "epoch": 4597} {"train_loss": -26.365463256835938, "global_step": 381606, "epoch": 4597} {"train_loss": -26.411422729492188, "global_step": 381607, "epoch": 4597} {"train_loss": -26.5041561126709, "global_step": 381608, "epoch": 4597} {"train_loss": -26.532394409179688, "global_step": 381609, "epoch": 4597} {"train_loss": -26.474050521850586, "global_step": 381610, "epoch": 4597} {"train_loss": -26.435461044311523, "global_step": 381611, "epoch": 4597} {"train_loss": -26.232580184936523, "global_step": 381612, "epoch": 4597} {"train_loss": -26.448535919189453, "global_step": 381613, "epoch": 4597} {"train_loss": -26.778533935546875, "global_step": 381614, "epoch": 4597} {"train_loss": -26.250757217407227, "global_step": 381615, "epoch": 4597} {"train_loss": -26.36997413635254, "global_step": 381616, "epoch": 4597} {"train_loss": -26.515735626220703, "global_step": 381617, "epoch": 4597} {"train_loss": -26.516393661499023, "global_step": 381618, "epoch": 4597} {"train_loss": -26.25583267211914, "global_step": 381619, "epoch": 4597} {"train_loss": -26.551013946533203, "global_step": 381620, "epoch": 4597} {"train_loss": -26.68611717224121, "global_step": 381621, "epoch": 4597} {"train_loss": -25.915328979492188, "global_step": 381622, "epoch": 4597} {"train_loss": -26.596296310424805, "global_step": 381623, "epoch": 4597} {"train_loss": -26.491498947143555, "global_step": 381624, "epoch": 4597} {"train_loss": -26.580097198486328, "global_step": 381625, "epoch": 4597} {"train_loss": -26.521839141845703, "global_step": 381626, "epoch": 4597} {"train_loss": -26.393112182617188, "global_step": 381627, "epoch": 4597} {"train_loss": -26.32573890686035, "global_step": 381628, "epoch": 4597} {"train_loss": -26.544519424438477, "global_step": 381629, "epoch": 4597} {"train_loss": -26.034488677978516, "global_step": 381630, "epoch": 4597} {"train_loss": -26.348499298095703, "global_step": 381631, "epoch": 4597} {"train_loss": -26.422067642211914, "global_step": 381632, "epoch": 4597} {"train_loss": -26.40093782723668, "global_step": 381633, "epoch": 4597, "val_loss": 6613991.0} {"train_loss": -25.674346923828125, "global_step": 381634, "epoch": 4598} {"train_loss": -25.777597427368164, "global_step": 381635, "epoch": 4598} {"train_loss": -25.281782150268555, "global_step": 381636, "epoch": 4598} {"train_loss": -25.884374618530273, "global_step": 381637, "epoch": 4598} {"train_loss": -25.8582820892334, "global_step": 381638, "epoch": 4598} {"train_loss": -25.959577560424805, "global_step": 381639, "epoch": 4598} {"train_loss": -25.6248836517334, "global_step": 381640, "epoch": 4598} {"train_loss": -25.7148380279541, "global_step": 381641, "epoch": 4598} {"train_loss": -25.200971603393555, "global_step": 381642, "epoch": 4598} {"train_loss": -25.723764419555664, "global_step": 381643, "epoch": 4598} {"train_loss": -25.81500244140625, "global_step": 381644, "epoch": 4598} {"train_loss": -26.073190689086914, "global_step": 381645, "epoch": 4598} {"train_loss": -25.836746215820312, "global_step": 381646, "epoch": 4598} {"train_loss": -26.0439395904541, "global_step": 381647, "epoch": 4598} {"train_loss": -26.26140785217285, "global_step": 381648, "epoch": 4598} {"train_loss": -25.7918758392334, "global_step": 381649, "epoch": 4598} {"train_loss": -26.283329010009766, "global_step": 381650, "epoch": 4598} {"train_loss": -26.2005558013916, "global_step": 381651, "epoch": 4598} {"train_loss": -25.957494735717773, "global_step": 381652, "epoch": 4598} {"train_loss": -26.463510513305664, "global_step": 381653, "epoch": 4598} {"train_loss": -26.390592575073242, "global_step": 381654, "epoch": 4598} {"train_loss": -26.20244789123535, "global_step": 381655, "epoch": 4598} {"train_loss": -26.072834014892578, "global_step": 381656, "epoch": 4598} {"train_loss": -26.2757568359375, "global_step": 381657, "epoch": 4598} {"train_loss": -26.42115592956543, "global_step": 381658, "epoch": 4598} {"train_loss": -26.251148223876953, "global_step": 381659, "epoch": 4598} {"train_loss": -26.828567504882812, "global_step": 381660, "epoch": 4598} {"train_loss": -26.431344985961914, "global_step": 381661, "epoch": 4598} {"train_loss": -26.424545288085938, "global_step": 381662, "epoch": 4598} {"train_loss": -26.839202880859375, "global_step": 381663, "epoch": 4598} {"train_loss": -26.4668025970459, "global_step": 381664, "epoch": 4598} {"train_loss": -26.428848266601562, "global_step": 381665, "epoch": 4598} {"train_loss": -26.61358642578125, "global_step": 381666, "epoch": 4598} {"train_loss": -26.505603790283203, "global_step": 381667, "epoch": 4598} {"train_loss": -26.708471298217773, "global_step": 381668, "epoch": 4598} {"train_loss": -26.625473022460938, "global_step": 381669, "epoch": 4598} {"train_loss": -26.801267623901367, "global_step": 381670, "epoch": 4598} {"train_loss": -26.7674617767334, "global_step": 381671, "epoch": 4598} {"train_loss": -26.189294815063477, "global_step": 381672, "epoch": 4598} {"train_loss": -26.09132194519043, "global_step": 381673, "epoch": 4598} {"train_loss": -26.444812774658203, "global_step": 381674, "epoch": 4598} {"train_loss": -26.643238067626953, "global_step": 381675, "epoch": 4598} {"train_loss": -26.685998916625977, "global_step": 381676, "epoch": 4598} {"train_loss": -26.33377456665039, "global_step": 381677, "epoch": 4598} {"train_loss": -26.709028244018555, "global_step": 381678, "epoch": 4598} {"train_loss": -26.435514450073242, "global_step": 381679, "epoch": 4598} {"train_loss": -26.408933639526367, "global_step": 381680, "epoch": 4598} {"train_loss": -26.451147079467773, "global_step": 381681, "epoch": 4598} {"train_loss": -26.488134384155273, "global_step": 381682, "epoch": 4598} {"train_loss": -26.752777099609375, "global_step": 381683, "epoch": 4598} {"train_loss": -26.39851951599121, "global_step": 381684, "epoch": 4598} {"train_loss": -26.411834716796875, "global_step": 381685, "epoch": 4598} {"train_loss": -27.000707626342773, "global_step": 381686, "epoch": 4598} {"train_loss": -26.47651481628418, "global_step": 381687, "epoch": 4598} {"train_loss": -26.509275436401367, "global_step": 381688, "epoch": 4598} {"train_loss": -26.47528648376465, "global_step": 381689, "epoch": 4598} {"train_loss": -26.45619010925293, "global_step": 381690, "epoch": 4598} {"train_loss": -26.595035552978516, "global_step": 381691, "epoch": 4598} {"train_loss": -26.8840389251709, "global_step": 381692, "epoch": 4598} {"train_loss": -26.64530372619629, "global_step": 381693, "epoch": 4598} {"train_loss": -26.499094009399414, "global_step": 381694, "epoch": 4598} {"train_loss": -26.68572998046875, "global_step": 381695, "epoch": 4598} {"train_loss": -26.663619995117188, "global_step": 381696, "epoch": 4598} {"train_loss": -26.6954288482666, "global_step": 381697, "epoch": 4598} {"train_loss": -26.51728630065918, "global_step": 381698, "epoch": 4598} {"train_loss": -26.725126266479492, "global_step": 381699, "epoch": 4598} {"train_loss": -26.465545654296875, "global_step": 381700, "epoch": 4598} {"train_loss": -26.65848731994629, "global_step": 381701, "epoch": 4598} {"train_loss": -26.62513542175293, "global_step": 381702, "epoch": 4598} {"train_loss": -26.129199981689453, "global_step": 381703, "epoch": 4598} {"train_loss": -26.30517578125, "global_step": 381704, "epoch": 4598} {"train_loss": -26.916248321533203, "global_step": 381705, "epoch": 4598} {"train_loss": -26.493513107299805, "global_step": 381706, "epoch": 4598} {"train_loss": -26.62408447265625, "global_step": 381707, "epoch": 4598} {"train_loss": -26.58064079284668, "global_step": 381708, "epoch": 4598} {"train_loss": -26.90715980529785, "global_step": 381709, "epoch": 4598} {"train_loss": -26.41556739807129, "global_step": 381710, "epoch": 4598} {"train_loss": -26.4475154876709, "global_step": 381711, "epoch": 4598} {"train_loss": -26.708765029907227, "global_step": 381712, "epoch": 4598} {"train_loss": -26.780683517456055, "global_step": 381713, "epoch": 4598} {"train_loss": -26.678430557250977, "global_step": 381714, "epoch": 4598} {"train_loss": -26.997211456298828, "global_step": 381715, "epoch": 4598} {"train_loss": -26.410776299166393, "global_step": 381716, "epoch": 4598, "val_loss": 6544713.0} {"train_loss": -25.871795654296875, "global_step": 381717, "epoch": 4599} {"train_loss": -25.822998046875, "global_step": 381718, "epoch": 4599} {"train_loss": -25.205760955810547, "global_step": 381719, "epoch": 4599} {"train_loss": -25.046979904174805, "global_step": 381720, "epoch": 4599} {"train_loss": -25.1187744140625, "global_step": 381721, "epoch": 4599} {"train_loss": -24.6517391204834, "global_step": 381722, "epoch": 4599} {"train_loss": -25.333463668823242, "global_step": 381723, "epoch": 4599} {"train_loss": -25.96677017211914, "global_step": 381724, "epoch": 4599} {"train_loss": -25.60462760925293, "global_step": 381725, "epoch": 4599} {"train_loss": -25.862424850463867, "global_step": 381726, "epoch": 4599} {"train_loss": -25.79523277282715, "global_step": 381727, "epoch": 4599} {"train_loss": -25.409221649169922, "global_step": 381728, "epoch": 4599} {"train_loss": -25.97477149963379, "global_step": 381729, "epoch": 4599} {"train_loss": -25.01436424255371, "global_step": 381730, "epoch": 4599} {"train_loss": -25.5159854888916, "global_step": 381731, "epoch": 4599} {"train_loss": -25.687780380249023, "global_step": 381732, "epoch": 4599} {"train_loss": -25.659753799438477, "global_step": 381733, "epoch": 4599} {"train_loss": -26.04706382751465, "global_step": 381734, "epoch": 4599} {"train_loss": -25.540287017822266, "global_step": 381735, "epoch": 4599} {"train_loss": -25.62360191345215, "global_step": 381736, "epoch": 4599} {"train_loss": -26.1505184173584, "global_step": 381737, "epoch": 4599} {"train_loss": -25.676441192626953, "global_step": 381738, "epoch": 4599} {"train_loss": -26.125690460205078, "global_step": 381739, "epoch": 4599} {"train_loss": -25.751413345336914, "global_step": 381740, "epoch": 4599} {"train_loss": -26.24433708190918, "global_step": 381741, "epoch": 4599} {"train_loss": -25.527828216552734, "global_step": 381742, "epoch": 4599} {"train_loss": -25.7989444732666, "global_step": 381743, "epoch": 4599} {"train_loss": -26.013538360595703, "global_step": 381744, "epoch": 4599} {"train_loss": -26.066913604736328, "global_step": 381745, "epoch": 4599} {"train_loss": -25.986547470092773, "global_step": 381746, "epoch": 4599} {"train_loss": -26.14615249633789, "global_step": 381747, "epoch": 4599} {"train_loss": -25.953113555908203, "global_step": 381748, "epoch": 4599} {"train_loss": -25.888742446899414, "global_step": 381749, "epoch": 4599} {"train_loss": -26.101316452026367, "global_step": 381750, "epoch": 4599} {"train_loss": -26.21018409729004, "global_step": 381751, "epoch": 4599} {"train_loss": -26.279388427734375, "global_step": 381752, "epoch": 4599} {"train_loss": -26.07581901550293, "global_step": 381753, "epoch": 4599} {"train_loss": -26.639440536499023, "global_step": 381754, "epoch": 4599} {"train_loss": -26.56803321838379, "global_step": 381755, "epoch": 4599} {"train_loss": -26.166208267211914, "global_step": 381756, "epoch": 4599} {"train_loss": -26.659423828125, "global_step": 381757, "epoch": 4599} {"train_loss": -26.75079917907715, "global_step": 381758, "epoch": 4599} {"train_loss": -26.481647491455078, "global_step": 381759, "epoch": 4599} {"train_loss": -26.6357479095459, "global_step": 381760, "epoch": 4599} {"train_loss": -26.583959579467773, "global_step": 381761, "epoch": 4599} {"train_loss": -26.689075469970703, "global_step": 381762, "epoch": 4599} {"train_loss": -26.432861328125, "global_step": 381763, "epoch": 4599} {"train_loss": -26.637205123901367, "global_step": 381764, "epoch": 4599} {"train_loss": -26.507429122924805, "global_step": 381765, "epoch": 4599} {"train_loss": -26.263227462768555, "global_step": 381766, "epoch": 4599} {"train_loss": -26.631330490112305, "global_step": 381767, "epoch": 4599} {"train_loss": -25.92425537109375, "global_step": 381768, "epoch": 4599} {"train_loss": -26.52630615234375, "global_step": 381769, "epoch": 4599} {"train_loss": -26.59443473815918, "global_step": 381770, "epoch": 4599} {"train_loss": -26.84088134765625, "global_step": 381771, "epoch": 4599} {"train_loss": -26.380523681640625, "global_step": 381772, "epoch": 4599} {"train_loss": -26.71772575378418, "global_step": 381773, "epoch": 4599} {"train_loss": -26.2559814453125, "global_step": 381774, "epoch": 4599} {"train_loss": -26.471561431884766, "global_step": 381775, "epoch": 4599} {"train_loss": -26.444421768188477, "global_step": 381776, "epoch": 4599} {"train_loss": -26.546003341674805, "global_step": 381777, "epoch": 4599} {"train_loss": -26.17995262145996, "global_step": 381778, "epoch": 4599} {"train_loss": -26.784025192260742, "global_step": 381779, "epoch": 4599} {"train_loss": -26.66229820251465, "global_step": 381780, "epoch": 4599} {"train_loss": -26.491180419921875, "global_step": 381781, "epoch": 4599} {"train_loss": -26.83063316345215, "global_step": 381782, "epoch": 4599} {"train_loss": -26.42864990234375, "global_step": 381783, "epoch": 4599} {"train_loss": -26.5753173828125, "global_step": 381784, "epoch": 4599} {"train_loss": -26.491241455078125, "global_step": 381785, "epoch": 4599} {"train_loss": -26.726028442382812, "global_step": 381786, "epoch": 4599} {"train_loss": -26.38690757751465, "global_step": 381787, "epoch": 4599} {"train_loss": -26.455108642578125, "global_step": 381788, "epoch": 4599} {"train_loss": -26.482318878173828, "global_step": 381789, "epoch": 4599} {"train_loss": -26.680938720703125, "global_step": 381790, "epoch": 4599} {"train_loss": -26.150938034057617, "global_step": 381791, "epoch": 4599} {"train_loss": -26.142786026000977, "global_step": 381792, "epoch": 4599} {"train_loss": -26.392230987548828, "global_step": 381793, "epoch": 4599} {"train_loss": -26.627634048461914, "global_step": 381794, "epoch": 4599} {"train_loss": -26.639789581298828, "global_step": 381795, "epoch": 4599} {"train_loss": -26.64240074157715, "global_step": 381796, "epoch": 4599} {"train_loss": -26.420934677124023, "global_step": 381797, "epoch": 4599} {"train_loss": -26.386045455932617, "global_step": 381798, "epoch": 4599} {"train_loss": -26.171467723616633, "global_step": 381799, "epoch": 4599, "val_loss": 6536757.0} {"train_loss": -25.7374324798584, "global_step": 381800, "epoch": 4600} {"train_loss": -24.91239356994629, "global_step": 381801, "epoch": 4600} {"train_loss": -25.456323623657227, "global_step": 381802, "epoch": 4600} {"train_loss": -25.2197265625, "global_step": 381803, "epoch": 4600} {"train_loss": -25.9697322845459, "global_step": 381804, "epoch": 4600} {"train_loss": -25.6159725189209, "global_step": 381805, "epoch": 4600} {"train_loss": -25.336509704589844, "global_step": 381806, "epoch": 4600} {"train_loss": -24.971052169799805, "global_step": 381807, "epoch": 4600} {"train_loss": -25.99395179748535, "global_step": 381808, "epoch": 4600} {"train_loss": -25.31177520751953, "global_step": 381809, "epoch": 4600} {"train_loss": -25.7999267578125, "global_step": 381810, "epoch": 4600} {"train_loss": -25.717649459838867, "global_step": 381811, "epoch": 4600} {"train_loss": -25.751300811767578, "global_step": 381812, "epoch": 4600} {"train_loss": -25.743330001831055, "global_step": 381813, "epoch": 4600} {"train_loss": -25.81281852722168, "global_step": 381814, "epoch": 4600} {"train_loss": -25.722070693969727, "global_step": 381815, "epoch": 4600} {"train_loss": -25.789325714111328, "global_step": 381816, "epoch": 4600} {"train_loss": -25.89591407775879, "global_step": 381817, "epoch": 4600} {"train_loss": -26.256366729736328, "global_step": 381818, "epoch": 4600} {"train_loss": -25.9107723236084, "global_step": 381819, "epoch": 4600} {"train_loss": -26.093414306640625, "global_step": 381820, "epoch": 4600} {"train_loss": -25.87327003479004, "global_step": 381821, "epoch": 4600} {"train_loss": -26.425867080688477, "global_step": 381822, "epoch": 4600} {"train_loss": -26.118833541870117, "global_step": 381823, "epoch": 4600} {"train_loss": -26.16713523864746, "global_step": 381824, "epoch": 4600} {"train_loss": -26.4427433013916, "global_step": 381825, "epoch": 4600} {"train_loss": -26.706226348876953, "global_step": 381826, "epoch": 4600} {"train_loss": -26.551237106323242, "global_step": 381827, "epoch": 4600} {"train_loss": -26.198774337768555, "global_step": 381828, "epoch": 4600} {"train_loss": -26.744184494018555, "global_step": 381829, "epoch": 4600} {"train_loss": -26.546905517578125, "global_step": 381830, "epoch": 4600} {"train_loss": -26.494848251342773, "global_step": 381831, "epoch": 4600} {"train_loss": -26.372156143188477, "global_step": 381832, "epoch": 4600} {"train_loss": -26.48679542541504, "global_step": 381833, "epoch": 4600} {"train_loss": -26.34405517578125, "global_step": 381834, "epoch": 4600} {"train_loss": -26.831378936767578, "global_step": 381835, "epoch": 4600} {"train_loss": -26.558349609375, "global_step": 381836, "epoch": 4600} {"train_loss": -26.660024642944336, "global_step": 381837, "epoch": 4600} {"train_loss": -26.370222091674805, "global_step": 381838, "epoch": 4600} {"train_loss": -26.376806259155273, "global_step": 381839, "epoch": 4600} {"train_loss": -26.50042724609375, "global_step": 381840, "epoch": 4600} {"train_loss": -26.798908233642578, "global_step": 381841, "epoch": 4600} {"train_loss": -26.489545822143555, "global_step": 381842, "epoch": 4600} {"train_loss": -26.478723526000977, "global_step": 381843, "epoch": 4600} {"train_loss": -26.8072452545166, "global_step": 381844, "epoch": 4600} {"train_loss": -26.72458839416504, "global_step": 381845, "epoch": 4600} {"train_loss": -26.265783309936523, "global_step": 381846, "epoch": 4600} {"train_loss": -26.659809112548828, "global_step": 381847, "epoch": 4600} {"train_loss": -26.52353286743164, "global_step": 381848, "epoch": 4600} {"train_loss": -26.77166748046875, "global_step": 381849, "epoch": 4600} {"train_loss": -26.62494468688965, "global_step": 381850, "epoch": 4600} {"train_loss": -26.857126235961914, "global_step": 381851, "epoch": 4600} {"train_loss": -26.956104278564453, "global_step": 381852, "epoch": 4600} {"train_loss": -26.414709091186523, "global_step": 381853, "epoch": 4600} {"train_loss": -26.889413833618164, "global_step": 381854, "epoch": 4600} {"train_loss": -26.575042724609375, "global_step": 381855, "epoch": 4600} {"train_loss": -26.673547744750977, "global_step": 381856, "epoch": 4600} {"train_loss": -26.37127685546875, "global_step": 381857, "epoch": 4600} {"train_loss": -26.14055824279785, "global_step": 381858, "epoch": 4600} {"train_loss": -26.344467163085938, "global_step": 381859, "epoch": 4600} {"train_loss": -26.687591552734375, "global_step": 381860, "epoch": 4600} {"train_loss": -26.663776397705078, "global_step": 381861, "epoch": 4600} {"train_loss": -26.55732536315918, "global_step": 381862, "epoch": 4600} {"train_loss": -26.50335121154785, "global_step": 381863, "epoch": 4600} {"train_loss": -26.5719051361084, "global_step": 381864, "epoch": 4600} {"train_loss": -26.5626163482666, "global_step": 381865, "epoch": 4600} {"train_loss": -26.576892852783203, "global_step": 381866, "epoch": 4600} {"train_loss": -26.856948852539062, "global_step": 381867, "epoch": 4600} {"train_loss": -26.6009464263916, "global_step": 381868, "epoch": 4600} {"train_loss": -26.511322021484375, "global_step": 381869, "epoch": 4600} {"train_loss": -26.715957641601562, "global_step": 381870, "epoch": 4600} {"train_loss": -26.673664093017578, "global_step": 381871, "epoch": 4600} {"train_loss": -26.562246322631836, "global_step": 381872, "epoch": 4600} {"train_loss": -26.737075805664062, "global_step": 381873, "epoch": 4600} {"train_loss": -26.450000762939453, "global_step": 381874, "epoch": 4600} {"train_loss": -26.887807846069336, "global_step": 381875, "epoch": 4600} {"train_loss": -26.626855850219727, "global_step": 381876, "epoch": 4600} {"train_loss": -26.16326904296875, "global_step": 381877, "epoch": 4600} {"train_loss": -26.82430076599121, "global_step": 381878, "epoch": 4600} {"train_loss": -26.53940773010254, "global_step": 381879, "epoch": 4600} {"train_loss": -26.567968368530273, "global_step": 381880, "epoch": 4600} {"train_loss": -26.863988876342773, "global_step": 381881, "epoch": 4600} {"train_loss": -26.330824794539485, "global_step": 381882, "epoch": 4600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6595006.0} {"train_loss": -25.951583862304688, "global_step": 381883, "epoch": 4601} {"train_loss": -25.86565589904785, "global_step": 381884, "epoch": 4601} {"train_loss": -26.50754737854004, "global_step": 381885, "epoch": 4601} {"train_loss": -25.978271484375, "global_step": 381886, "epoch": 4601} {"train_loss": -25.029190063476562, "global_step": 381887, "epoch": 4601} {"train_loss": -25.492984771728516, "global_step": 381888, "epoch": 4601} {"train_loss": -25.408620834350586, "global_step": 381889, "epoch": 4601} {"train_loss": -25.895923614501953, "global_step": 381890, "epoch": 4601} {"train_loss": -25.785602569580078, "global_step": 381891, "epoch": 4601} {"train_loss": -25.857152938842773, "global_step": 381892, "epoch": 4601} {"train_loss": -25.743408203125, "global_step": 381893, "epoch": 4601} {"train_loss": -26.272977828979492, "global_step": 381894, "epoch": 4601} {"train_loss": -25.70815086364746, "global_step": 381895, "epoch": 4601} {"train_loss": -26.21331787109375, "global_step": 381896, "epoch": 4601} {"train_loss": -26.276945114135742, "global_step": 381897, "epoch": 4601} {"train_loss": -26.04546546936035, "global_step": 381898, "epoch": 4601} {"train_loss": -25.93128776550293, "global_step": 381899, "epoch": 4601} {"train_loss": -26.076919555664062, "global_step": 381900, "epoch": 4601} {"train_loss": -26.3911075592041, "global_step": 381901, "epoch": 4601} {"train_loss": -26.049758911132812, "global_step": 381902, "epoch": 4601} {"train_loss": -26.221227645874023, "global_step": 381903, "epoch": 4601} {"train_loss": -26.383344650268555, "global_step": 381904, "epoch": 4601} {"train_loss": -26.6342830657959, "global_step": 381905, "epoch": 4601} {"train_loss": -26.141199111938477, "global_step": 381906, "epoch": 4601} {"train_loss": -25.97946548461914, "global_step": 381907, "epoch": 4601} {"train_loss": -26.731000900268555, "global_step": 381908, "epoch": 4601} {"train_loss": -25.99886131286621, "global_step": 381909, "epoch": 4601} {"train_loss": -26.63330078125, "global_step": 381910, "epoch": 4601} {"train_loss": -26.736902236938477, "global_step": 381911, "epoch": 4601} {"train_loss": -26.32771110534668, "global_step": 381912, "epoch": 4601} {"train_loss": -26.331018447875977, "global_step": 381913, "epoch": 4601} {"train_loss": -26.881216049194336, "global_step": 381914, "epoch": 4601} {"train_loss": -26.48688316345215, "global_step": 381915, "epoch": 4601} {"train_loss": -26.591663360595703, "global_step": 381916, "epoch": 4601} {"train_loss": -26.12533950805664, "global_step": 381917, "epoch": 4601} {"train_loss": -26.57612419128418, "global_step": 381918, "epoch": 4601} {"train_loss": -26.332874298095703, "global_step": 381919, "epoch": 4601} {"train_loss": -26.08098793029785, "global_step": 381920, "epoch": 4601} {"train_loss": -26.750165939331055, "global_step": 381921, "epoch": 4601} {"train_loss": -26.91889762878418, "global_step": 381922, "epoch": 4601} {"train_loss": -26.443912506103516, "global_step": 381923, "epoch": 4601} {"train_loss": -26.477075576782227, "global_step": 381924, "epoch": 4601} {"train_loss": -26.658838272094727, "global_step": 381925, "epoch": 4601} {"train_loss": -26.4224853515625, "global_step": 381926, "epoch": 4601} {"train_loss": -26.520177841186523, "global_step": 381927, "epoch": 4601} {"train_loss": -26.584814071655273, "global_step": 381928, "epoch": 4601} {"train_loss": -26.618335723876953, "global_step": 381929, "epoch": 4601} {"train_loss": -27.01296043395996, "global_step": 381930, "epoch": 4601} {"train_loss": -26.342300415039062, "global_step": 381931, "epoch": 4601} {"train_loss": -26.614837646484375, "global_step": 381932, "epoch": 4601} {"train_loss": -26.346654891967773, "global_step": 381933, "epoch": 4601} {"train_loss": -26.36777114868164, "global_step": 381934, "epoch": 4601} {"train_loss": -26.47052574157715, "global_step": 381935, "epoch": 4601} {"train_loss": -26.54006004333496, "global_step": 381936, "epoch": 4601} {"train_loss": -26.819168090820312, "global_step": 381937, "epoch": 4601} {"train_loss": -26.710651397705078, "global_step": 381938, "epoch": 4601} {"train_loss": -26.59640884399414, "global_step": 381939, "epoch": 4601} {"train_loss": -26.756505966186523, "global_step": 381940, "epoch": 4601} {"train_loss": -26.290374755859375, "global_step": 381941, "epoch": 4601} {"train_loss": -26.676654815673828, "global_step": 381942, "epoch": 4601} {"train_loss": -26.26885986328125, "global_step": 381943, "epoch": 4601} {"train_loss": -26.753767013549805, "global_step": 381944, "epoch": 4601} {"train_loss": -26.57252311706543, "global_step": 381945, "epoch": 4601} {"train_loss": -26.17770767211914, "global_step": 381946, "epoch": 4601} {"train_loss": -25.982519149780273, "global_step": 381947, "epoch": 4601} {"train_loss": -26.699125289916992, "global_step": 381948, "epoch": 4601} {"train_loss": -26.843961715698242, "global_step": 381949, "epoch": 4601} {"train_loss": -25.9364070892334, "global_step": 381950, "epoch": 4601} {"train_loss": -26.633291244506836, "global_step": 381951, "epoch": 4601} {"train_loss": -26.63702392578125, "global_step": 381952, "epoch": 4601} {"train_loss": -26.560251235961914, "global_step": 381953, "epoch": 4601} {"train_loss": -26.284765243530273, "global_step": 381954, "epoch": 4601} {"train_loss": -26.606473922729492, "global_step": 381955, "epoch": 4601} {"train_loss": -26.080230712890625, "global_step": 381956, "epoch": 4601} {"train_loss": -26.576618194580078, "global_step": 381957, "epoch": 4601} {"train_loss": -26.513219833374023, "global_step": 381958, "epoch": 4601} {"train_loss": -26.30486488342285, "global_step": 381959, "epoch": 4601} {"train_loss": -26.4134521484375, "global_step": 381960, "epoch": 4601} {"train_loss": -26.161046981811523, "global_step": 381961, "epoch": 4601} {"train_loss": -26.328039169311523, "global_step": 381962, "epoch": 4601} {"train_loss": -26.23016357421875, "global_step": 381963, "epoch": 4601} {"train_loss": -26.466480255126953, "global_step": 381964, "epoch": 4601} {"train_loss": -26.34503173828125, "global_step": 381965, "epoch": 4601, "val_loss": 6699189.0} {"train_loss": -24.868640899658203, "global_step": 381966, "epoch": 4602} {"train_loss": -25.07172966003418, "global_step": 381967, "epoch": 4602} {"train_loss": -25.266233444213867, "global_step": 381968, "epoch": 4602} {"train_loss": -25.171232223510742, "global_step": 381969, "epoch": 4602} {"train_loss": -25.480819702148438, "global_step": 381970, "epoch": 4602} {"train_loss": -25.67817497253418, "global_step": 381971, "epoch": 4602} {"train_loss": -25.681076049804688, "global_step": 381972, "epoch": 4602} {"train_loss": -25.78139305114746, "global_step": 381973, "epoch": 4602} {"train_loss": -25.736631393432617, "global_step": 381974, "epoch": 4602} {"train_loss": -25.95001792907715, "global_step": 381975, "epoch": 4602} {"train_loss": -25.8066349029541, "global_step": 381976, "epoch": 4602} {"train_loss": -26.209732055664062, "global_step": 381977, "epoch": 4602} {"train_loss": -26.1221866607666, "global_step": 381978, "epoch": 4602} {"train_loss": -26.048511505126953, "global_step": 381979, "epoch": 4602} {"train_loss": -25.931827545166016, "global_step": 381980, "epoch": 4602} {"train_loss": -25.875646591186523, "global_step": 381981, "epoch": 4602} {"train_loss": -25.647125244140625, "global_step": 381982, "epoch": 4602} {"train_loss": -26.28449058532715, "global_step": 381983, "epoch": 4602} {"train_loss": -26.161230087280273, "global_step": 381984, "epoch": 4602} {"train_loss": -26.099191665649414, "global_step": 381985, "epoch": 4602} {"train_loss": -26.14063835144043, "global_step": 381986, "epoch": 4602} {"train_loss": -26.088708877563477, "global_step": 381987, "epoch": 4602} {"train_loss": -26.15192222595215, "global_step": 381988, "epoch": 4602} {"train_loss": -26.119626998901367, "global_step": 381989, "epoch": 4602} {"train_loss": -26.155750274658203, "global_step": 381990, "epoch": 4602} {"train_loss": -26.329992294311523, "global_step": 381991, "epoch": 4602} {"train_loss": -26.39969253540039, "global_step": 381992, "epoch": 4602} {"train_loss": -26.30672264099121, "global_step": 381993, "epoch": 4602} {"train_loss": -26.082813262939453, "global_step": 381994, "epoch": 4602} {"train_loss": -26.4541072845459, "global_step": 381995, "epoch": 4602} {"train_loss": -26.180057525634766, "global_step": 381996, "epoch": 4602} {"train_loss": -26.149072647094727, "global_step": 381997, "epoch": 4602} {"train_loss": -26.7226619720459, "global_step": 381998, "epoch": 4602} {"train_loss": -26.666845321655273, "global_step": 381999, "epoch": 4602} {"train_loss": -26.682098388671875, "global_step": 382000, "epoch": 4602} {"train_loss": -26.59063148498535, "global_step": 382001, "epoch": 4602} {"train_loss": -26.509613037109375, "global_step": 382002, "epoch": 4602} {"train_loss": -25.99932289123535, "global_step": 382003, "epoch": 4602} {"train_loss": -26.415502548217773, "global_step": 382004, "epoch": 4602} {"train_loss": -26.59161376953125, "global_step": 382005, "epoch": 4602} {"train_loss": -26.261655807495117, "global_step": 382006, "epoch": 4602} {"train_loss": -25.880767822265625, "global_step": 382007, "epoch": 4602} {"train_loss": -25.948291778564453, "global_step": 382008, "epoch": 4602} {"train_loss": -26.46823501586914, "global_step": 382009, "epoch": 4602} {"train_loss": -26.356008529663086, "global_step": 382010, "epoch": 4602} {"train_loss": -26.12156105041504, "global_step": 382011, "epoch": 4602} {"train_loss": -26.29678726196289, "global_step": 382012, "epoch": 4602} {"train_loss": -26.517261505126953, "global_step": 382013, "epoch": 4602} {"train_loss": -25.951663970947266, "global_step": 382014, "epoch": 4602} {"train_loss": -26.545278549194336, "global_step": 382015, "epoch": 4602} {"train_loss": -26.412216186523438, "global_step": 382016, "epoch": 4602} {"train_loss": -26.446401596069336, "global_step": 382017, "epoch": 4602} {"train_loss": -26.750843048095703, "global_step": 382018, "epoch": 4602} {"train_loss": -25.983808517456055, "global_step": 382019, "epoch": 4602} {"train_loss": -26.320133209228516, "global_step": 382020, "epoch": 4602} {"train_loss": -26.460540771484375, "global_step": 382021, "epoch": 4602} {"train_loss": -26.466522216796875, "global_step": 382022, "epoch": 4602} {"train_loss": -26.6925048828125, "global_step": 382023, "epoch": 4602} {"train_loss": -26.25714111328125, "global_step": 382024, "epoch": 4602} {"train_loss": -26.30470085144043, "global_step": 382025, "epoch": 4602} {"train_loss": -26.596158981323242, "global_step": 382026, "epoch": 4602} {"train_loss": -26.57879066467285, "global_step": 382027, "epoch": 4602} {"train_loss": -26.26443862915039, "global_step": 382028, "epoch": 4602} {"train_loss": -26.30694580078125, "global_step": 382029, "epoch": 4602} {"train_loss": -26.3702449798584, "global_step": 382030, "epoch": 4602} {"train_loss": -26.411909103393555, "global_step": 382031, "epoch": 4602} {"train_loss": -26.421926498413086, "global_step": 382032, "epoch": 4602} {"train_loss": -26.684782028198242, "global_step": 382033, "epoch": 4602} {"train_loss": -26.677886962890625, "global_step": 382034, "epoch": 4602} {"train_loss": -26.35979652404785, "global_step": 382035, "epoch": 4602} {"train_loss": -26.916900634765625, "global_step": 382036, "epoch": 4602} {"train_loss": -26.827051162719727, "global_step": 382037, "epoch": 4602} {"train_loss": -26.588897705078125, "global_step": 382038, "epoch": 4602} {"train_loss": -26.838825225830078, "global_step": 382039, "epoch": 4602} {"train_loss": -26.667844772338867, "global_step": 382040, "epoch": 4602} {"train_loss": -26.484838485717773, "global_step": 382041, "epoch": 4602} {"train_loss": -26.454303741455078, "global_step": 382042, "epoch": 4602} {"train_loss": -26.29843521118164, "global_step": 382043, "epoch": 4602} {"train_loss": -26.8026065826416, "global_step": 382044, "epoch": 4602} {"train_loss": -26.964126586914062, "global_step": 382045, "epoch": 4602} {"train_loss": -26.72330093383789, "global_step": 382046, "epoch": 4602} {"train_loss": -26.670331954956055, "global_step": 382047, "epoch": 4602} {"train_loss": -26.2540781641581, "global_step": 382048, "epoch": 4602, "val_loss": 6646716.0} {"train_loss": -25.793487548828125, "global_step": 382049, "epoch": 4603} {"train_loss": -25.7388858795166, "global_step": 382050, "epoch": 4603} {"train_loss": -25.952484130859375, "global_step": 382051, "epoch": 4603} {"train_loss": -25.483497619628906, "global_step": 382052, "epoch": 4603} {"train_loss": -25.809492111206055, "global_step": 382053, "epoch": 4603} {"train_loss": -25.890411376953125, "global_step": 382054, "epoch": 4603} {"train_loss": -26.129499435424805, "global_step": 382055, "epoch": 4603} {"train_loss": -25.683765411376953, "global_step": 382056, "epoch": 4603} {"train_loss": -26.247838973999023, "global_step": 382057, "epoch": 4603} {"train_loss": -26.00644302368164, "global_step": 382058, "epoch": 4603} {"train_loss": -26.038537979125977, "global_step": 382059, "epoch": 4603} {"train_loss": -25.978656768798828, "global_step": 382060, "epoch": 4603} {"train_loss": -26.383955001831055, "global_step": 382061, "epoch": 4603} {"train_loss": -26.174484252929688, "global_step": 382062, "epoch": 4603} {"train_loss": -26.43275260925293, "global_step": 382063, "epoch": 4603} {"train_loss": -25.972431182861328, "global_step": 382064, "epoch": 4603} {"train_loss": -26.0140438079834, "global_step": 382065, "epoch": 4603} {"train_loss": -26.46915054321289, "global_step": 382066, "epoch": 4603} {"train_loss": -26.171606063842773, "global_step": 382067, "epoch": 4603} {"train_loss": -26.47907066345215, "global_step": 382068, "epoch": 4603} {"train_loss": -26.164220809936523, "global_step": 382069, "epoch": 4603} {"train_loss": -26.51763916015625, "global_step": 382070, "epoch": 4603} {"train_loss": -26.221616744995117, "global_step": 382071, "epoch": 4603} {"train_loss": -26.188161849975586, "global_step": 382072, "epoch": 4603} {"train_loss": -26.5327091217041, "global_step": 382073, "epoch": 4603} {"train_loss": -26.336835861206055, "global_step": 382074, "epoch": 4603} {"train_loss": -26.367822647094727, "global_step": 382075, "epoch": 4603} {"train_loss": -26.28199577331543, "global_step": 382076, "epoch": 4603} {"train_loss": -26.714475631713867, "global_step": 382077, "epoch": 4603} {"train_loss": -26.592512130737305, "global_step": 382078, "epoch": 4603} {"train_loss": -26.396875381469727, "global_step": 382079, "epoch": 4603} {"train_loss": -26.347192764282227, "global_step": 382080, "epoch": 4603} {"train_loss": -26.57916259765625, "global_step": 382081, "epoch": 4603} {"train_loss": -26.441516876220703, "global_step": 382082, "epoch": 4603} {"train_loss": -26.26228904724121, "global_step": 382083, "epoch": 4603} {"train_loss": -26.281286239624023, "global_step": 382084, "epoch": 4603} {"train_loss": -26.605756759643555, "global_step": 382085, "epoch": 4603} {"train_loss": -26.572040557861328, "global_step": 382086, "epoch": 4603} {"train_loss": -26.356653213500977, "global_step": 382087, "epoch": 4603} {"train_loss": -26.492115020751953, "global_step": 382088, "epoch": 4603} {"train_loss": -26.316186904907227, "global_step": 382089, "epoch": 4603} {"train_loss": -26.63747215270996, "global_step": 382090, "epoch": 4603} {"train_loss": -26.398046493530273, "global_step": 382091, "epoch": 4603} {"train_loss": -26.173690795898438, "global_step": 382092, "epoch": 4603} {"train_loss": -26.115371704101562, "global_step": 382093, "epoch": 4603} {"train_loss": -25.865354537963867, "global_step": 382094, "epoch": 4603} {"train_loss": -25.7296142578125, "global_step": 382095, "epoch": 4603} {"train_loss": -26.1667537689209, "global_step": 382096, "epoch": 4603} {"train_loss": -26.244754791259766, "global_step": 382097, "epoch": 4603} {"train_loss": -26.250080108642578, "global_step": 382098, "epoch": 4603} {"train_loss": -26.563190460205078, "global_step": 382099, "epoch": 4603} {"train_loss": -25.9136962890625, "global_step": 382100, "epoch": 4603} {"train_loss": -26.594709396362305, "global_step": 382101, "epoch": 4603} {"train_loss": -26.43979263305664, "global_step": 382102, "epoch": 4603} {"train_loss": -26.42716407775879, "global_step": 382103, "epoch": 4603} {"train_loss": -26.251434326171875, "global_step": 382104, "epoch": 4603} {"train_loss": -26.77606773376465, "global_step": 382105, "epoch": 4603} {"train_loss": -26.6754207611084, "global_step": 382106, "epoch": 4603} {"train_loss": -26.46235466003418, "global_step": 382107, "epoch": 4603} {"train_loss": -26.692285537719727, "global_step": 382108, "epoch": 4603} {"train_loss": -26.902875900268555, "global_step": 382109, "epoch": 4603} {"train_loss": -26.661670684814453, "global_step": 382110, "epoch": 4603} {"train_loss": -26.177825927734375, "global_step": 382111, "epoch": 4603} {"train_loss": -26.043554306030273, "global_step": 382112, "epoch": 4603} {"train_loss": -26.590768814086914, "global_step": 382113, "epoch": 4603} {"train_loss": -26.36781120300293, "global_step": 382114, "epoch": 4603} {"train_loss": -26.645008087158203, "global_step": 382115, "epoch": 4603} {"train_loss": -26.65138053894043, "global_step": 382116, "epoch": 4603} {"train_loss": -26.397024154663086, "global_step": 382117, "epoch": 4603} {"train_loss": -26.400012969970703, "global_step": 382118, "epoch": 4603} {"train_loss": -26.200183868408203, "global_step": 382119, "epoch": 4603} {"train_loss": -26.193801879882812, "global_step": 382120, "epoch": 4603} {"train_loss": -26.24897575378418, "global_step": 382121, "epoch": 4603} {"train_loss": -26.231857299804688, "global_step": 382122, "epoch": 4603} {"train_loss": -26.51521873474121, "global_step": 382123, "epoch": 4603} {"train_loss": -26.19241714477539, "global_step": 382124, "epoch": 4603} {"train_loss": -26.50470542907715, "global_step": 382125, "epoch": 4603} {"train_loss": -26.459278106689453, "global_step": 382126, "epoch": 4603} {"train_loss": -26.511402130126953, "global_step": 382127, "epoch": 4603} {"train_loss": -26.622772216796875, "global_step": 382128, "epoch": 4603} {"train_loss": -26.71209716796875, "global_step": 382129, "epoch": 4603} {"train_loss": -26.494556427001953, "global_step": 382130, "epoch": 4603} {"train_loss": -26.316429207123907, "global_step": 382131, "epoch": 4603, "val_loss": 6591883.0} {"train_loss": -25.894346237182617, "global_step": 382132, "epoch": 4604} {"train_loss": -25.16547393798828, "global_step": 382133, "epoch": 4604} {"train_loss": -25.69142723083496, "global_step": 382134, "epoch": 4604} {"train_loss": -25.614221572875977, "global_step": 382135, "epoch": 4604} {"train_loss": -26.02365493774414, "global_step": 382136, "epoch": 4604} {"train_loss": -26.304357528686523, "global_step": 382137, "epoch": 4604} {"train_loss": -26.181848526000977, "global_step": 382138, "epoch": 4604} {"train_loss": -26.33444595336914, "global_step": 382139, "epoch": 4604} {"train_loss": -26.512487411499023, "global_step": 382140, "epoch": 4604} {"train_loss": -26.520044326782227, "global_step": 382141, "epoch": 4604} {"train_loss": -26.301956176757812, "global_step": 382142, "epoch": 4604} {"train_loss": -26.27695655822754, "global_step": 382143, "epoch": 4604} {"train_loss": -26.612146377563477, "global_step": 382144, "epoch": 4604} {"train_loss": -26.226980209350586, "global_step": 382145, "epoch": 4604} {"train_loss": -26.741178512573242, "global_step": 382146, "epoch": 4604} {"train_loss": -26.022003173828125, "global_step": 382147, "epoch": 4604} {"train_loss": -26.11830711364746, "global_step": 382148, "epoch": 4604} {"train_loss": -26.43069839477539, "global_step": 382149, "epoch": 4604} {"train_loss": -26.52619743347168, "global_step": 382150, "epoch": 4604} {"train_loss": -26.604360580444336, "global_step": 382151, "epoch": 4604} {"train_loss": -26.461654663085938, "global_step": 382152, "epoch": 4604} {"train_loss": -26.7625675201416, "global_step": 382153, "epoch": 4604} {"train_loss": -26.233749389648438, "global_step": 382154, "epoch": 4604} {"train_loss": -26.390859603881836, "global_step": 382155, "epoch": 4604} {"train_loss": -26.1101131439209, "global_step": 382156, "epoch": 4604} {"train_loss": -26.416807174682617, "global_step": 382157, "epoch": 4604} {"train_loss": -26.404611587524414, "global_step": 382158, "epoch": 4604} {"train_loss": -26.632614135742188, "global_step": 382159, "epoch": 4604} {"train_loss": -26.317581176757812, "global_step": 382160, "epoch": 4604} {"train_loss": -26.710458755493164, "global_step": 382161, "epoch": 4604} {"train_loss": -26.37562370300293, "global_step": 382162, "epoch": 4604} {"train_loss": -26.497726440429688, "global_step": 382163, "epoch": 4604} {"train_loss": -26.514814376831055, "global_step": 382164, "epoch": 4604} {"train_loss": -26.842309951782227, "global_step": 382165, "epoch": 4604} {"train_loss": -26.770111083984375, "global_step": 382166, "epoch": 4604} {"train_loss": -26.328922271728516, "global_step": 382167, "epoch": 4604} {"train_loss": -26.342334747314453, "global_step": 382168, "epoch": 4604} {"train_loss": -26.248380661010742, "global_step": 382169, "epoch": 4604} {"train_loss": -26.52265739440918, "global_step": 382170, "epoch": 4604} {"train_loss": -26.4725341796875, "global_step": 382171, "epoch": 4604} {"train_loss": -26.769058227539062, "global_step": 382172, "epoch": 4604} {"train_loss": -26.854480743408203, "global_step": 382173, "epoch": 4604} {"train_loss": -26.652929306030273, "global_step": 382174, "epoch": 4604} {"train_loss": -26.531652450561523, "global_step": 382175, "epoch": 4604} {"train_loss": -26.722761154174805, "global_step": 382176, "epoch": 4604} {"train_loss": -26.513614654541016, "global_step": 382177, "epoch": 4604} {"train_loss": -26.516326904296875, "global_step": 382178, "epoch": 4604} {"train_loss": -26.356836318969727, "global_step": 382179, "epoch": 4604} {"train_loss": -26.988361358642578, "global_step": 382180, "epoch": 4604} {"train_loss": -26.513715744018555, "global_step": 382181, "epoch": 4604} {"train_loss": -26.626638412475586, "global_step": 382182, "epoch": 4604} {"train_loss": -26.379613876342773, "global_step": 382183, "epoch": 4604} {"train_loss": -26.748136520385742, "global_step": 382184, "epoch": 4604} {"train_loss": -26.433338165283203, "global_step": 382185, "epoch": 4604} {"train_loss": -26.44891357421875, "global_step": 382186, "epoch": 4604} {"train_loss": -26.80141258239746, "global_step": 382187, "epoch": 4604} {"train_loss": -27.003681182861328, "global_step": 382188, "epoch": 4604} {"train_loss": -26.583953857421875, "global_step": 382189, "epoch": 4604} {"train_loss": -26.717100143432617, "global_step": 382190, "epoch": 4604} {"train_loss": -26.393783569335938, "global_step": 382191, "epoch": 4604} {"train_loss": -26.617090225219727, "global_step": 382192, "epoch": 4604} {"train_loss": -26.421777725219727, "global_step": 382193, "epoch": 4604} {"train_loss": -26.357879638671875, "global_step": 382194, "epoch": 4604} {"train_loss": -26.87590980529785, "global_step": 382195, "epoch": 4604} {"train_loss": -26.734594345092773, "global_step": 382196, "epoch": 4604} {"train_loss": -26.60645866394043, "global_step": 382197, "epoch": 4604} {"train_loss": -26.836957931518555, "global_step": 382198, "epoch": 4604} {"train_loss": -26.7377986907959, "global_step": 382199, "epoch": 4604} {"train_loss": -26.420385360717773, "global_step": 382200, "epoch": 4604} {"train_loss": -26.725622177124023, "global_step": 382201, "epoch": 4604} {"train_loss": -26.36919593811035, "global_step": 382202, "epoch": 4604} {"train_loss": -26.831634521484375, "global_step": 382203, "epoch": 4604} {"train_loss": -26.440210342407227, "global_step": 382204, "epoch": 4604} {"train_loss": -26.590234756469727, "global_step": 382205, "epoch": 4604} {"train_loss": -26.76116943359375, "global_step": 382206, "epoch": 4604} {"train_loss": -26.410980224609375, "global_step": 382207, "epoch": 4604} {"train_loss": -26.546857833862305, "global_step": 382208, "epoch": 4604} {"train_loss": -26.412750244140625, "global_step": 382209, "epoch": 4604} {"train_loss": -26.120031356811523, "global_step": 382210, "epoch": 4604} {"train_loss": -26.130090713500977, "global_step": 382211, "epoch": 4604} {"train_loss": -24.542264938354492, "global_step": 382212, "epoch": 4604} {"train_loss": -23.0471248626709, "global_step": 382213, "epoch": 4604} {"train_loss": -26.36535743345697, "global_step": 382214, "epoch": 4604, "val_loss": 6650651.5} {"train_loss": -20.670591354370117, "global_step": 382215, "epoch": 4605} {"train_loss": -23.39937973022461, "global_step": 382216, "epoch": 4605} {"train_loss": -21.667226791381836, "global_step": 382217, "epoch": 4605} {"train_loss": -23.281593322753906, "global_step": 382218, "epoch": 4605} {"train_loss": -23.398651123046875, "global_step": 382219, "epoch": 4605} {"train_loss": -23.41360092163086, "global_step": 382220, "epoch": 4605} {"train_loss": -23.867719650268555, "global_step": 382221, "epoch": 4605} {"train_loss": -23.46908950805664, "global_step": 382222, "epoch": 4605} {"train_loss": -24.002197265625, "global_step": 382223, "epoch": 4605} {"train_loss": -24.571258544921875, "global_step": 382224, "epoch": 4605} {"train_loss": -24.006078720092773, "global_step": 382225, "epoch": 4605} {"train_loss": -23.70807456970215, "global_step": 382226, "epoch": 4605} {"train_loss": -24.52266502380371, "global_step": 382227, "epoch": 4605} {"train_loss": -24.461830139160156, "global_step": 382228, "epoch": 4605} {"train_loss": -24.242294311523438, "global_step": 382229, "epoch": 4605} {"train_loss": -24.015789031982422, "global_step": 382230, "epoch": 4605} {"train_loss": -24.229665756225586, "global_step": 382231, "epoch": 4605} {"train_loss": -24.46816635131836, "global_step": 382232, "epoch": 4605} {"train_loss": -24.527725219726562, "global_step": 382233, "epoch": 4605} {"train_loss": -24.716970443725586, "global_step": 382234, "epoch": 4605} {"train_loss": -24.4682559967041, "global_step": 382235, "epoch": 4605} {"train_loss": -24.510940551757812, "global_step": 382236, "epoch": 4605} {"train_loss": -24.730667114257812, "global_step": 382237, "epoch": 4605} {"train_loss": -24.92253875732422, "global_step": 382238, "epoch": 4605} {"train_loss": -24.964994430541992, "global_step": 382239, "epoch": 4605} {"train_loss": -24.841333389282227, "global_step": 382240, "epoch": 4605} {"train_loss": -24.466825485229492, "global_step": 382241, "epoch": 4605} {"train_loss": -25.295948028564453, "global_step": 382242, "epoch": 4605} {"train_loss": -24.99435806274414, "global_step": 382243, "epoch": 4605} {"train_loss": -24.898130416870117, "global_step": 382244, "epoch": 4605} {"train_loss": -25.341520309448242, "global_step": 382245, "epoch": 4605} {"train_loss": -25.33286476135254, "global_step": 382246, "epoch": 4605} {"train_loss": -25.486642837524414, "global_step": 382247, "epoch": 4605} {"train_loss": -25.19085121154785, "global_step": 382248, "epoch": 4605} {"train_loss": -25.521081924438477, "global_step": 382249, "epoch": 4605} {"train_loss": -25.548093795776367, "global_step": 382250, "epoch": 4605} {"train_loss": -25.52936363220215, "global_step": 382251, "epoch": 4605} {"train_loss": -25.239900588989258, "global_step": 382252, "epoch": 4605} {"train_loss": -25.727060317993164, "global_step": 382253, "epoch": 4605} {"train_loss": -25.46124839782715, "global_step": 382254, "epoch": 4605} {"train_loss": -25.557376861572266, "global_step": 382255, "epoch": 4605} {"train_loss": -25.54192543029785, "global_step": 382256, "epoch": 4605} {"train_loss": -25.822341918945312, "global_step": 382257, "epoch": 4605} {"train_loss": -25.901514053344727, "global_step": 382258, "epoch": 4605} {"train_loss": -25.834075927734375, "global_step": 382259, "epoch": 4605} {"train_loss": -26.022451400756836, "global_step": 382260, "epoch": 4605} {"train_loss": -25.88998794555664, "global_step": 382261, "epoch": 4605} {"train_loss": -26.04570960998535, "global_step": 382262, "epoch": 4605} {"train_loss": -25.930524826049805, "global_step": 382263, "epoch": 4605} {"train_loss": -25.94624137878418, "global_step": 382264, "epoch": 4605} {"train_loss": -26.205915451049805, "global_step": 382265, "epoch": 4605} {"train_loss": -25.601545333862305, "global_step": 382266, "epoch": 4605} {"train_loss": -26.295124053955078, "global_step": 382267, "epoch": 4605} {"train_loss": -25.908279418945312, "global_step": 382268, "epoch": 4605} {"train_loss": -25.763824462890625, "global_step": 382269, "epoch": 4605} {"train_loss": -26.328445434570312, "global_step": 382270, "epoch": 4605} {"train_loss": -26.38588523864746, "global_step": 382271, "epoch": 4605} {"train_loss": -26.14751625061035, "global_step": 382272, "epoch": 4605} {"train_loss": -26.420698165893555, "global_step": 382273, "epoch": 4605} {"train_loss": -26.566190719604492, "global_step": 382274, "epoch": 4605} {"train_loss": -26.2950382232666, "global_step": 382275, "epoch": 4605} {"train_loss": -26.19001579284668, "global_step": 382276, "epoch": 4605} {"train_loss": -26.3494930267334, "global_step": 382277, "epoch": 4605} {"train_loss": -26.209836959838867, "global_step": 382278, "epoch": 4605} {"train_loss": -26.427398681640625, "global_step": 382279, "epoch": 4605} {"train_loss": -25.93310546875, "global_step": 382280, "epoch": 4605} {"train_loss": -26.771692276000977, "global_step": 382281, "epoch": 4605} {"train_loss": -26.137786865234375, "global_step": 382282, "epoch": 4605} {"train_loss": -26.267993927001953, "global_step": 382283, "epoch": 4605} {"train_loss": -26.504119873046875, "global_step": 382284, "epoch": 4605} {"train_loss": -26.585363388061523, "global_step": 382285, "epoch": 4605} {"train_loss": -26.41541862487793, "global_step": 382286, "epoch": 4605} {"train_loss": -26.15241050720215, "global_step": 382287, "epoch": 4605} {"train_loss": -26.500410079956055, "global_step": 382288, "epoch": 4605} {"train_loss": -26.388168334960938, "global_step": 382289, "epoch": 4605} {"train_loss": -26.652210235595703, "global_step": 382290, "epoch": 4605} {"train_loss": -26.439788818359375, "global_step": 382291, "epoch": 4605} {"train_loss": -26.839826583862305, "global_step": 382292, "epoch": 4605} {"train_loss": -26.45058250427246, "global_step": 382293, "epoch": 4605} {"train_loss": -26.24614906311035, "global_step": 382294, "epoch": 4605} {"train_loss": -26.346647262573242, "global_step": 382295, "epoch": 4605} {"train_loss": -26.300296783447266, "global_step": 382296, "epoch": 4605} {"train_loss": -25.356358217905804, "global_step": 382297, "epoch": 4605, "val_loss": 6599245.0} {"train_loss": -26.060302734375, "global_step": 382298, "epoch": 4606} {"train_loss": -25.810230255126953, "global_step": 382299, "epoch": 4606} {"train_loss": -26.223569869995117, "global_step": 382300, "epoch": 4606} {"train_loss": -26.645893096923828, "global_step": 382301, "epoch": 4606} {"train_loss": -25.882898330688477, "global_step": 382302, "epoch": 4606} {"train_loss": -26.202184677124023, "global_step": 382303, "epoch": 4606} {"train_loss": -26.403961181640625, "global_step": 382304, "epoch": 4606} {"train_loss": -26.5823917388916, "global_step": 382305, "epoch": 4606} {"train_loss": -26.476720809936523, "global_step": 382306, "epoch": 4606} {"train_loss": -26.327804565429688, "global_step": 382307, "epoch": 4606} {"train_loss": -26.574939727783203, "global_step": 382308, "epoch": 4606} {"train_loss": -26.236921310424805, "global_step": 382309, "epoch": 4606} {"train_loss": -26.708240509033203, "global_step": 382310, "epoch": 4606} {"train_loss": -26.32929801940918, "global_step": 382311, "epoch": 4606} {"train_loss": -26.437946319580078, "global_step": 382312, "epoch": 4606} {"train_loss": -26.50323486328125, "global_step": 382313, "epoch": 4606} {"train_loss": -26.312646865844727, "global_step": 382314, "epoch": 4606} {"train_loss": -25.893157958984375, "global_step": 382315, "epoch": 4606} {"train_loss": -25.7800235748291, "global_step": 382316, "epoch": 4606} {"train_loss": -26.081226348876953, "global_step": 382317, "epoch": 4606} {"train_loss": -26.441272735595703, "global_step": 382318, "epoch": 4606} {"train_loss": -26.34478759765625, "global_step": 382319, "epoch": 4606} {"train_loss": -26.26169776916504, "global_step": 382320, "epoch": 4606} {"train_loss": -26.7970027923584, "global_step": 382321, "epoch": 4606} {"train_loss": -26.277084350585938, "global_step": 382322, "epoch": 4606} {"train_loss": -26.248748779296875, "global_step": 382323, "epoch": 4606} {"train_loss": -26.8887882232666, "global_step": 382324, "epoch": 4606} {"train_loss": -26.522724151611328, "global_step": 382325, "epoch": 4606} {"train_loss": -26.958948135375977, "global_step": 382326, "epoch": 4606} {"train_loss": -26.533674240112305, "global_step": 382327, "epoch": 4606} {"train_loss": -26.49567985534668, "global_step": 382328, "epoch": 4606} {"train_loss": -26.260221481323242, "global_step": 382329, "epoch": 4606} {"train_loss": -26.675724029541016, "global_step": 382330, "epoch": 4606} {"train_loss": -26.39851951599121, "global_step": 382331, "epoch": 4606} {"train_loss": -26.254526138305664, "global_step": 382332, "epoch": 4606} {"train_loss": -26.51999282836914, "global_step": 382333, "epoch": 4606} {"train_loss": -26.61014175415039, "global_step": 382334, "epoch": 4606} {"train_loss": -26.55824089050293, "global_step": 382335, "epoch": 4606} {"train_loss": -26.57919692993164, "global_step": 382336, "epoch": 4606} {"train_loss": -26.62372398376465, "global_step": 382337, "epoch": 4606} {"train_loss": -26.286865234375, "global_step": 382338, "epoch": 4606} {"train_loss": -26.763776779174805, "global_step": 382339, "epoch": 4606} {"train_loss": -26.523168563842773, "global_step": 382340, "epoch": 4606} {"train_loss": -26.537588119506836, "global_step": 382341, "epoch": 4606} {"train_loss": -26.2865047454834, "global_step": 382342, "epoch": 4606} {"train_loss": -26.6182861328125, "global_step": 382343, "epoch": 4606} {"train_loss": -26.4811954498291, "global_step": 382344, "epoch": 4606} {"train_loss": -26.623031616210938, "global_step": 382345, "epoch": 4606} {"train_loss": -26.35906982421875, "global_step": 382346, "epoch": 4606} {"train_loss": -26.59271812438965, "global_step": 382347, "epoch": 4606} {"train_loss": -26.583288192749023, "global_step": 382348, "epoch": 4606} {"train_loss": -26.53425407409668, "global_step": 382349, "epoch": 4606} {"train_loss": -26.423994064331055, "global_step": 382350, "epoch": 4606} {"train_loss": -26.55365562438965, "global_step": 382351, "epoch": 4606} {"train_loss": -26.88427734375, "global_step": 382352, "epoch": 4606} {"train_loss": -26.608911514282227, "global_step": 382353, "epoch": 4606} {"train_loss": -26.72125816345215, "global_step": 382354, "epoch": 4606} {"train_loss": -26.531890869140625, "global_step": 382355, "epoch": 4606} {"train_loss": -26.514062881469727, "global_step": 382356, "epoch": 4606} {"train_loss": -26.52212905883789, "global_step": 382357, "epoch": 4606} {"train_loss": -26.37189292907715, "global_step": 382358, "epoch": 4606} {"train_loss": -26.50811195373535, "global_step": 382359, "epoch": 4606} {"train_loss": -26.634113311767578, "global_step": 382360, "epoch": 4606} {"train_loss": -26.691343307495117, "global_step": 382361, "epoch": 4606} {"train_loss": -26.504140853881836, "global_step": 382362, "epoch": 4606} {"train_loss": -26.427005767822266, "global_step": 382363, "epoch": 4606} {"train_loss": -26.632917404174805, "global_step": 382364, "epoch": 4606} {"train_loss": -26.60499382019043, "global_step": 382365, "epoch": 4606} {"train_loss": -26.695051193237305, "global_step": 382366, "epoch": 4606} {"train_loss": -26.5065860748291, "global_step": 382367, "epoch": 4606} {"train_loss": -26.060531616210938, "global_step": 382368, "epoch": 4606} {"train_loss": -26.2331600189209, "global_step": 382369, "epoch": 4606} {"train_loss": -26.50144386291504, "global_step": 382370, "epoch": 4606} {"train_loss": -26.458511352539062, "global_step": 382371, "epoch": 4606} {"train_loss": -26.198286056518555, "global_step": 382372, "epoch": 4606} {"train_loss": -25.895313262939453, "global_step": 382373, "epoch": 4606} {"train_loss": -25.39408302307129, "global_step": 382374, "epoch": 4606} {"train_loss": -26.08164405822754, "global_step": 382375, "epoch": 4606} {"train_loss": -26.04633903503418, "global_step": 382376, "epoch": 4606} {"train_loss": -26.517065048217773, "global_step": 382377, "epoch": 4606} {"train_loss": -26.310352325439453, "global_step": 382378, "epoch": 4606} {"train_loss": -26.443151473999023, "global_step": 382379, "epoch": 4606} {"train_loss": -26.411471217511647, "global_step": 382380, "epoch": 4606, "val_loss": 6574070.5} {"train_loss": -25.456899642944336, "global_step": 382381, "epoch": 4607} {"train_loss": -26.205793380737305, "global_step": 382382, "epoch": 4607} {"train_loss": -26.224567413330078, "global_step": 382383, "epoch": 4607} {"train_loss": -25.830921173095703, "global_step": 382384, "epoch": 4607} {"train_loss": -25.7694091796875, "global_step": 382385, "epoch": 4607} {"train_loss": -25.853986740112305, "global_step": 382386, "epoch": 4607} {"train_loss": -25.85951805114746, "global_step": 382387, "epoch": 4607} {"train_loss": -25.886442184448242, "global_step": 382388, "epoch": 4607} {"train_loss": -26.028783798217773, "global_step": 382389, "epoch": 4607} {"train_loss": -25.969568252563477, "global_step": 382390, "epoch": 4607} {"train_loss": -25.56709861755371, "global_step": 382391, "epoch": 4607} {"train_loss": -25.754308700561523, "global_step": 382392, "epoch": 4607} {"train_loss": -26.01995849609375, "global_step": 382393, "epoch": 4607} {"train_loss": -26.306568145751953, "global_step": 382394, "epoch": 4607} {"train_loss": -26.536209106445312, "global_step": 382395, "epoch": 4607} {"train_loss": -26.135034561157227, "global_step": 382396, "epoch": 4607} {"train_loss": -26.156097412109375, "global_step": 382397, "epoch": 4607} {"train_loss": -26.265274047851562, "global_step": 382398, "epoch": 4607} {"train_loss": -25.981550216674805, "global_step": 382399, "epoch": 4607} {"train_loss": -25.973785400390625, "global_step": 382400, "epoch": 4607} {"train_loss": -26.439472198486328, "global_step": 382401, "epoch": 4607} {"train_loss": -26.326812744140625, "global_step": 382402, "epoch": 4607} {"train_loss": -25.970325469970703, "global_step": 382403, "epoch": 4607} {"train_loss": -26.71323013305664, "global_step": 382404, "epoch": 4607} {"train_loss": -26.103485107421875, "global_step": 382405, "epoch": 4607} {"train_loss": -26.1856746673584, "global_step": 382406, "epoch": 4607} {"train_loss": -26.496601104736328, "global_step": 382407, "epoch": 4607} {"train_loss": -26.154438018798828, "global_step": 382408, "epoch": 4607} {"train_loss": -26.068220138549805, "global_step": 382409, "epoch": 4607} {"train_loss": -26.607877731323242, "global_step": 382410, "epoch": 4607} {"train_loss": -26.3343563079834, "global_step": 382411, "epoch": 4607} {"train_loss": -26.6142520904541, "global_step": 382412, "epoch": 4607} {"train_loss": -26.862409591674805, "global_step": 382413, "epoch": 4607} {"train_loss": -26.839832305908203, "global_step": 382414, "epoch": 4607} {"train_loss": -26.772130966186523, "global_step": 382415, "epoch": 4607} {"train_loss": -26.555377960205078, "global_step": 382416, "epoch": 4607} {"train_loss": -26.601764678955078, "global_step": 382417, "epoch": 4607} {"train_loss": -26.792150497436523, "global_step": 382418, "epoch": 4607} {"train_loss": -26.431171417236328, "global_step": 382419, "epoch": 4607} {"train_loss": -26.232946395874023, "global_step": 382420, "epoch": 4607} {"train_loss": -26.96282386779785, "global_step": 382421, "epoch": 4607} {"train_loss": -26.58192253112793, "global_step": 382422, "epoch": 4607} {"train_loss": -26.495283126831055, "global_step": 382423, "epoch": 4607} {"train_loss": -26.031585693359375, "global_step": 382424, "epoch": 4607} {"train_loss": -25.955259323120117, "global_step": 382425, "epoch": 4607} {"train_loss": -26.21978187561035, "global_step": 382426, "epoch": 4607} {"train_loss": -26.55836296081543, "global_step": 382427, "epoch": 4607} {"train_loss": -26.607379913330078, "global_step": 382428, "epoch": 4607} {"train_loss": -26.321741104125977, "global_step": 382429, "epoch": 4607} {"train_loss": -26.46001625061035, "global_step": 382430, "epoch": 4607} {"train_loss": -26.346532821655273, "global_step": 382431, "epoch": 4607} {"train_loss": -26.887556076049805, "global_step": 382432, "epoch": 4607} {"train_loss": -26.154560089111328, "global_step": 382433, "epoch": 4607} {"train_loss": -26.325647354125977, "global_step": 382434, "epoch": 4607} {"train_loss": -26.859882354736328, "global_step": 382435, "epoch": 4607} {"train_loss": -25.85917091369629, "global_step": 382436, "epoch": 4607} {"train_loss": -26.451391220092773, "global_step": 382437, "epoch": 4607} {"train_loss": -26.224905014038086, "global_step": 382438, "epoch": 4607} {"train_loss": -26.403564453125, "global_step": 382439, "epoch": 4607} {"train_loss": -26.097639083862305, "global_step": 382440, "epoch": 4607} {"train_loss": -26.686899185180664, "global_step": 382441, "epoch": 4607} {"train_loss": -26.435791015625, "global_step": 382442, "epoch": 4607} {"train_loss": -26.465063095092773, "global_step": 382443, "epoch": 4607} {"train_loss": -26.15833854675293, "global_step": 382444, "epoch": 4607} {"train_loss": -26.736581802368164, "global_step": 382445, "epoch": 4607} {"train_loss": -26.83002281188965, "global_step": 382446, "epoch": 4607} {"train_loss": -26.74016761779785, "global_step": 382447, "epoch": 4607} {"train_loss": -26.20737075805664, "global_step": 382448, "epoch": 4607} {"train_loss": -26.700117111206055, "global_step": 382449, "epoch": 4607} {"train_loss": -26.829538345336914, "global_step": 382450, "epoch": 4607} {"train_loss": -26.516218185424805, "global_step": 382451, "epoch": 4607} {"train_loss": -26.50542640686035, "global_step": 382452, "epoch": 4607} {"train_loss": -26.487104415893555, "global_step": 382453, "epoch": 4607} {"train_loss": -26.809659957885742, "global_step": 382454, "epoch": 4607} {"train_loss": -26.507856369018555, "global_step": 382455, "epoch": 4607} {"train_loss": -26.76519775390625, "global_step": 382456, "epoch": 4607} {"train_loss": -26.430740356445312, "global_step": 382457, "epoch": 4607} {"train_loss": -26.566328048706055, "global_step": 382458, "epoch": 4607} {"train_loss": -26.589160919189453, "global_step": 382459, "epoch": 4607} {"train_loss": -26.288787841796875, "global_step": 382460, "epoch": 4607} {"train_loss": -26.70344352722168, "global_step": 382461, "epoch": 4607} {"train_loss": -26.174848556518555, "global_step": 382462, "epoch": 4607} {"train_loss": -26.345535117459583, "global_step": 382463, "epoch": 4607, "val_loss": 6654125.5} {"train_loss": -26.04505729675293, "global_step": 382464, "epoch": 4608} {"train_loss": -26.034027099609375, "global_step": 382465, "epoch": 4608} {"train_loss": -25.94687271118164, "global_step": 382466, "epoch": 4608} {"train_loss": -26.248319625854492, "global_step": 382467, "epoch": 4608} {"train_loss": -25.898880004882812, "global_step": 382468, "epoch": 4608} {"train_loss": -25.691450119018555, "global_step": 382469, "epoch": 4608} {"train_loss": -26.067596435546875, "global_step": 382470, "epoch": 4608} {"train_loss": -25.964282989501953, "global_step": 382471, "epoch": 4608} {"train_loss": -26.191572189331055, "global_step": 382472, "epoch": 4608} {"train_loss": -25.97565269470215, "global_step": 382473, "epoch": 4608} {"train_loss": -26.0230655670166, "global_step": 382474, "epoch": 4608} {"train_loss": -25.921201705932617, "global_step": 382475, "epoch": 4608} {"train_loss": -26.329259872436523, "global_step": 382476, "epoch": 4608} {"train_loss": -26.069183349609375, "global_step": 382477, "epoch": 4608} {"train_loss": -26.1540470123291, "global_step": 382478, "epoch": 4608} {"train_loss": -26.000410079956055, "global_step": 382479, "epoch": 4608} {"train_loss": -26.09331703186035, "global_step": 382480, "epoch": 4608} {"train_loss": -26.3308048248291, "global_step": 382481, "epoch": 4608} {"train_loss": -26.23811912536621, "global_step": 382482, "epoch": 4608} {"train_loss": -26.214330673217773, "global_step": 382483, "epoch": 4608} {"train_loss": -26.261688232421875, "global_step": 382484, "epoch": 4608} {"train_loss": -26.38815689086914, "global_step": 382485, "epoch": 4608} {"train_loss": -26.691959381103516, "global_step": 382486, "epoch": 4608} {"train_loss": -26.19394302368164, "global_step": 382487, "epoch": 4608} {"train_loss": -26.1827392578125, "global_step": 382488, "epoch": 4608} {"train_loss": -26.596765518188477, "global_step": 382489, "epoch": 4608} {"train_loss": -26.43511390686035, "global_step": 382490, "epoch": 4608} {"train_loss": -26.220693588256836, "global_step": 382491, "epoch": 4608} {"train_loss": -26.297536849975586, "global_step": 382492, "epoch": 4608} {"train_loss": -27.05718421936035, "global_step": 382493, "epoch": 4608} {"train_loss": -26.0949764251709, "global_step": 382494, "epoch": 4608} {"train_loss": -26.22035026550293, "global_step": 382495, "epoch": 4608} {"train_loss": -26.496179580688477, "global_step": 382496, "epoch": 4608} {"train_loss": -26.63298988342285, "global_step": 382497, "epoch": 4608} {"train_loss": -26.51006507873535, "global_step": 382498, "epoch": 4608} {"train_loss": -26.47901725769043, "global_step": 382499, "epoch": 4608} {"train_loss": -26.385297775268555, "global_step": 382500, "epoch": 4608} {"train_loss": -26.562658309936523, "global_step": 382501, "epoch": 4608} {"train_loss": -26.376239776611328, "global_step": 382502, "epoch": 4608} {"train_loss": -26.688161849975586, "global_step": 382503, "epoch": 4608} {"train_loss": -26.987232208251953, "global_step": 382504, "epoch": 4608} {"train_loss": -26.56752586364746, "global_step": 382505, "epoch": 4608} {"train_loss": -26.487268447875977, "global_step": 382506, "epoch": 4608} {"train_loss": -26.56394386291504, "global_step": 382507, "epoch": 4608} {"train_loss": -26.789533615112305, "global_step": 382508, "epoch": 4608} {"train_loss": -26.062463760375977, "global_step": 382509, "epoch": 4608} {"train_loss": -26.840030670166016, "global_step": 382510, "epoch": 4608} {"train_loss": -26.81206703186035, "global_step": 382511, "epoch": 4608} {"train_loss": -26.599903106689453, "global_step": 382512, "epoch": 4608} {"train_loss": -26.904150009155273, "global_step": 382513, "epoch": 4608} {"train_loss": -26.224109649658203, "global_step": 382514, "epoch": 4608} {"train_loss": -26.26691246032715, "global_step": 382515, "epoch": 4608} {"train_loss": -25.683948516845703, "global_step": 382516, "epoch": 4608} {"train_loss": -26.060026168823242, "global_step": 382517, "epoch": 4608} {"train_loss": -26.73612403869629, "global_step": 382518, "epoch": 4608} {"train_loss": -26.0969295501709, "global_step": 382519, "epoch": 4608} {"train_loss": -26.117101669311523, "global_step": 382520, "epoch": 4608} {"train_loss": -26.278339385986328, "global_step": 382521, "epoch": 4608} {"train_loss": -26.31367301940918, "global_step": 382522, "epoch": 4608} {"train_loss": -25.749530792236328, "global_step": 382523, "epoch": 4608} {"train_loss": -25.7541561126709, "global_step": 382524, "epoch": 4608} {"train_loss": -26.340620040893555, "global_step": 382525, "epoch": 4608} {"train_loss": -26.017566680908203, "global_step": 382526, "epoch": 4608} {"train_loss": -25.968647003173828, "global_step": 382527, "epoch": 4608} {"train_loss": -26.191781997680664, "global_step": 382528, "epoch": 4608} {"train_loss": -25.767187118530273, "global_step": 382529, "epoch": 4608} {"train_loss": -26.057907104492188, "global_step": 382530, "epoch": 4608} {"train_loss": -26.496442794799805, "global_step": 382531, "epoch": 4608} {"train_loss": -26.03938865661621, "global_step": 382532, "epoch": 4608} {"train_loss": -25.85003662109375, "global_step": 382533, "epoch": 4608} {"train_loss": -25.75953483581543, "global_step": 382534, "epoch": 4608} {"train_loss": -26.305068969726562, "global_step": 382535, "epoch": 4608} {"train_loss": -26.3941593170166, "global_step": 382536, "epoch": 4608} {"train_loss": -26.13629150390625, "global_step": 382537, "epoch": 4608} {"train_loss": -26.082300186157227, "global_step": 382538, "epoch": 4608} {"train_loss": -26.359699249267578, "global_step": 382539, "epoch": 4608} {"train_loss": -26.41178321838379, "global_step": 382540, "epoch": 4608} {"train_loss": -26.61232566833496, "global_step": 382541, "epoch": 4608} {"train_loss": -26.51235008239746, "global_step": 382542, "epoch": 4608} {"train_loss": -26.271820068359375, "global_step": 382543, "epoch": 4608} {"train_loss": -26.102863311767578, "global_step": 382544, "epoch": 4608} {"train_loss": -26.573102951049805, "global_step": 382545, "epoch": 4608} {"train_loss": -26.281198386686395, "global_step": 382546, "epoch": 4608, "val_loss": 6565631.0} {"train_loss": -26.74896240234375, "global_step": 382547, "epoch": 4609} {"train_loss": -26.354278564453125, "global_step": 382548, "epoch": 4609} {"train_loss": -26.060522079467773, "global_step": 382549, "epoch": 4609} {"train_loss": -26.186609268188477, "global_step": 382550, "epoch": 4609} {"train_loss": -26.462818145751953, "global_step": 382551, "epoch": 4609} {"train_loss": -26.407276153564453, "global_step": 382552, "epoch": 4609} {"train_loss": -26.294309616088867, "global_step": 382553, "epoch": 4609} {"train_loss": -26.482746124267578, "global_step": 382554, "epoch": 4609} {"train_loss": -26.17987060546875, "global_step": 382555, "epoch": 4609} {"train_loss": -26.564889907836914, "global_step": 382556, "epoch": 4609} {"train_loss": -26.22845458984375, "global_step": 382557, "epoch": 4609} {"train_loss": -26.279508590698242, "global_step": 382558, "epoch": 4609} {"train_loss": -26.052637100219727, "global_step": 382559, "epoch": 4609} {"train_loss": -26.496429443359375, "global_step": 382560, "epoch": 4609} {"train_loss": -26.325841903686523, "global_step": 382561, "epoch": 4609} {"train_loss": -26.36971092224121, "global_step": 382562, "epoch": 4609} {"train_loss": -26.492328643798828, "global_step": 382563, "epoch": 4609} {"train_loss": -26.48381996154785, "global_step": 382564, "epoch": 4609} {"train_loss": -26.372777938842773, "global_step": 382565, "epoch": 4609} {"train_loss": -26.62135124206543, "global_step": 382566, "epoch": 4609} {"train_loss": -26.55999183654785, "global_step": 382567, "epoch": 4609} {"train_loss": -26.420530319213867, "global_step": 382568, "epoch": 4609} {"train_loss": -26.455488204956055, "global_step": 382569, "epoch": 4609} {"train_loss": -26.569278717041016, "global_step": 382570, "epoch": 4609} {"train_loss": -26.85279655456543, "global_step": 382571, "epoch": 4609} {"train_loss": -26.386754989624023, "global_step": 382572, "epoch": 4609} {"train_loss": -26.611907958984375, "global_step": 382573, "epoch": 4609} {"train_loss": -26.811208724975586, "global_step": 382574, "epoch": 4609} {"train_loss": -26.569509506225586, "global_step": 382575, "epoch": 4609} {"train_loss": -26.62958335876465, "global_step": 382576, "epoch": 4609} {"train_loss": -26.64063835144043, "global_step": 382577, "epoch": 4609} {"train_loss": -26.829450607299805, "global_step": 382578, "epoch": 4609} {"train_loss": -26.598407745361328, "global_step": 382579, "epoch": 4609} {"train_loss": -26.572370529174805, "global_step": 382580, "epoch": 4609} {"train_loss": -26.802230834960938, "global_step": 382581, "epoch": 4609} {"train_loss": -26.73175048828125, "global_step": 382582, "epoch": 4609} {"train_loss": -26.682580947875977, "global_step": 382583, "epoch": 4609} {"train_loss": -26.421445846557617, "global_step": 382584, "epoch": 4609} {"train_loss": -26.543079376220703, "global_step": 382585, "epoch": 4609} {"train_loss": -26.517629623413086, "global_step": 382586, "epoch": 4609} {"train_loss": -26.963565826416016, "global_step": 382587, "epoch": 4609} {"train_loss": -26.619434356689453, "global_step": 382588, "epoch": 4609} {"train_loss": -26.63038444519043, "global_step": 382589, "epoch": 4609} {"train_loss": -26.815515518188477, "global_step": 382590, "epoch": 4609} {"train_loss": -26.500516891479492, "global_step": 382591, "epoch": 4609} {"train_loss": -26.694509506225586, "global_step": 382592, "epoch": 4609} {"train_loss": -26.996732711791992, "global_step": 382593, "epoch": 4609} {"train_loss": -26.71759605407715, "global_step": 382594, "epoch": 4609} {"train_loss": -26.507038116455078, "global_step": 382595, "epoch": 4609} {"train_loss": -26.722150802612305, "global_step": 382596, "epoch": 4609} {"train_loss": -25.764719009399414, "global_step": 382597, "epoch": 4609} {"train_loss": -26.185827255249023, "global_step": 382598, "epoch": 4609} {"train_loss": -26.643421173095703, "global_step": 382599, "epoch": 4609} {"train_loss": -26.730560302734375, "global_step": 382600, "epoch": 4609} {"train_loss": -26.679981231689453, "global_step": 382601, "epoch": 4609} {"train_loss": -26.721881866455078, "global_step": 382602, "epoch": 4609} {"train_loss": -26.273773193359375, "global_step": 382603, "epoch": 4609} {"train_loss": -26.52223014831543, "global_step": 382604, "epoch": 4609} {"train_loss": -26.451337814331055, "global_step": 382605, "epoch": 4609} {"train_loss": -26.108652114868164, "global_step": 382606, "epoch": 4609} {"train_loss": -26.622629165649414, "global_step": 382607, "epoch": 4609} {"train_loss": -26.196292877197266, "global_step": 382608, "epoch": 4609} {"train_loss": -25.9046688079834, "global_step": 382609, "epoch": 4609} {"train_loss": -25.086803436279297, "global_step": 382610, "epoch": 4609} {"train_loss": -25.788965225219727, "global_step": 382611, "epoch": 4609} {"train_loss": -26.191389083862305, "global_step": 382612, "epoch": 4609} {"train_loss": -26.106372833251953, "global_step": 382613, "epoch": 4609} {"train_loss": -26.157062530517578, "global_step": 382614, "epoch": 4609} {"train_loss": -25.934131622314453, "global_step": 382615, "epoch": 4609} {"train_loss": -26.387365341186523, "global_step": 382616, "epoch": 4609} {"train_loss": -25.87514305114746, "global_step": 382617, "epoch": 4609} {"train_loss": -26.33917808532715, "global_step": 382618, "epoch": 4609} {"train_loss": -26.4454402923584, "global_step": 382619, "epoch": 4609} {"train_loss": -26.418909072875977, "global_step": 382620, "epoch": 4609} {"train_loss": -26.435993194580078, "global_step": 382621, "epoch": 4609} {"train_loss": -26.25593376159668, "global_step": 382622, "epoch": 4609} {"train_loss": -26.38301658630371, "global_step": 382623, "epoch": 4609} {"train_loss": -26.282245635986328, "global_step": 382624, "epoch": 4609} {"train_loss": -26.456491470336914, "global_step": 382625, "epoch": 4609} {"train_loss": -26.551727294921875, "global_step": 382626, "epoch": 4609} {"train_loss": -26.302087783813477, "global_step": 382627, "epoch": 4609} {"train_loss": -26.48673439025879, "global_step": 382628, "epoch": 4609} {"train_loss": -26.43468121448195, "global_step": 382629, "epoch": 4609, "val_loss": 6597438.0} {"train_loss": -25.76847267150879, "global_step": 382630, "epoch": 4610} {"train_loss": -26.39800453186035, "global_step": 382631, "epoch": 4610} {"train_loss": -25.67679214477539, "global_step": 382632, "epoch": 4610} {"train_loss": -25.619953155517578, "global_step": 382633, "epoch": 4610} {"train_loss": -25.92205238342285, "global_step": 382634, "epoch": 4610} {"train_loss": -25.897985458374023, "global_step": 382635, "epoch": 4610} {"train_loss": -26.19565773010254, "global_step": 382636, "epoch": 4610} {"train_loss": -26.589563369750977, "global_step": 382637, "epoch": 4610} {"train_loss": -26.130041122436523, "global_step": 382638, "epoch": 4610} {"train_loss": -26.31587028503418, "global_step": 382639, "epoch": 4610} {"train_loss": -26.170074462890625, "global_step": 382640, "epoch": 4610} {"train_loss": -25.8612003326416, "global_step": 382641, "epoch": 4610} {"train_loss": -25.70503044128418, "global_step": 382642, "epoch": 4610} {"train_loss": -25.680402755737305, "global_step": 382643, "epoch": 4610} {"train_loss": -26.18134117126465, "global_step": 382644, "epoch": 4610} {"train_loss": -26.324121475219727, "global_step": 382645, "epoch": 4610} {"train_loss": -26.312665939331055, "global_step": 382646, "epoch": 4610} {"train_loss": -26.3496150970459, "global_step": 382647, "epoch": 4610} {"train_loss": -26.500598907470703, "global_step": 382648, "epoch": 4610} {"train_loss": -26.183103561401367, "global_step": 382649, "epoch": 4610} {"train_loss": -26.1978816986084, "global_step": 382650, "epoch": 4610} {"train_loss": -26.34035301208496, "global_step": 382651, "epoch": 4610} {"train_loss": -26.455188751220703, "global_step": 382652, "epoch": 4610} {"train_loss": -26.343809127807617, "global_step": 382653, "epoch": 4610} {"train_loss": -26.534290313720703, "global_step": 382654, "epoch": 4610} {"train_loss": -26.559253692626953, "global_step": 382655, "epoch": 4610} {"train_loss": -26.273635864257812, "global_step": 382656, "epoch": 4610} {"train_loss": -26.477375030517578, "global_step": 382657, "epoch": 4610} {"train_loss": -26.5539493560791, "global_step": 382658, "epoch": 4610} {"train_loss": -26.2581787109375, "global_step": 382659, "epoch": 4610} {"train_loss": -26.72454833984375, "global_step": 382660, "epoch": 4610} {"train_loss": -26.53057289123535, "global_step": 382661, "epoch": 4610} {"train_loss": -26.648160934448242, "global_step": 382662, "epoch": 4610} {"train_loss": -26.38949966430664, "global_step": 382663, "epoch": 4610} {"train_loss": -26.657224655151367, "global_step": 382664, "epoch": 4610} {"train_loss": -26.2500057220459, "global_step": 382665, "epoch": 4610} {"train_loss": -26.501550674438477, "global_step": 382666, "epoch": 4610} {"train_loss": -26.662546157836914, "global_step": 382667, "epoch": 4610} {"train_loss": -26.390531539916992, "global_step": 382668, "epoch": 4610} {"train_loss": -26.596820831298828, "global_step": 382669, "epoch": 4610} {"train_loss": -26.63299560546875, "global_step": 382670, "epoch": 4610} {"train_loss": -26.282928466796875, "global_step": 382671, "epoch": 4610} {"train_loss": -26.361658096313477, "global_step": 382672, "epoch": 4610} {"train_loss": -26.598419189453125, "global_step": 382673, "epoch": 4610} {"train_loss": -26.411657333374023, "global_step": 382674, "epoch": 4610} {"train_loss": -26.715208053588867, "global_step": 382675, "epoch": 4610} {"train_loss": -26.685949325561523, "global_step": 382676, "epoch": 4610} {"train_loss": -26.222309112548828, "global_step": 382677, "epoch": 4610} {"train_loss": -26.42498779296875, "global_step": 382678, "epoch": 4610} {"train_loss": -26.524396896362305, "global_step": 382679, "epoch": 4610} {"train_loss": -26.266620635986328, "global_step": 382680, "epoch": 4610} {"train_loss": -26.415332794189453, "global_step": 382681, "epoch": 4610} {"train_loss": -26.752023696899414, "global_step": 382682, "epoch": 4610} {"train_loss": -26.614545822143555, "global_step": 382683, "epoch": 4610} {"train_loss": -26.6739559173584, "global_step": 382684, "epoch": 4610} {"train_loss": -26.3790225982666, "global_step": 382685, "epoch": 4610} {"train_loss": -26.857975006103516, "global_step": 382686, "epoch": 4610} {"train_loss": -26.611469268798828, "global_step": 382687, "epoch": 4610} {"train_loss": -26.328039169311523, "global_step": 382688, "epoch": 4610} {"train_loss": -26.673566818237305, "global_step": 382689, "epoch": 4610} {"train_loss": -26.57807731628418, "global_step": 382690, "epoch": 4610} {"train_loss": -26.602386474609375, "global_step": 382691, "epoch": 4610} {"train_loss": -26.268850326538086, "global_step": 382692, "epoch": 4610} {"train_loss": -26.142805099487305, "global_step": 382693, "epoch": 4610} {"train_loss": -26.362075805664062, "global_step": 382694, "epoch": 4610} {"train_loss": -26.37224769592285, "global_step": 382695, "epoch": 4610} {"train_loss": -26.75444984436035, "global_step": 382696, "epoch": 4610} {"train_loss": -26.75431251525879, "global_step": 382697, "epoch": 4610} {"train_loss": -27.025390625, "global_step": 382698, "epoch": 4610} {"train_loss": -26.37220573425293, "global_step": 382699, "epoch": 4610} {"train_loss": -26.543500900268555, "global_step": 382700, "epoch": 4610} {"train_loss": -26.245718002319336, "global_step": 382701, "epoch": 4610} {"train_loss": -26.120786666870117, "global_step": 382702, "epoch": 4610} {"train_loss": -26.06694984436035, "global_step": 382703, "epoch": 4610} {"train_loss": -25.977874755859375, "global_step": 382704, "epoch": 4610} {"train_loss": -26.385061264038086, "global_step": 382705, "epoch": 4610} {"train_loss": -26.250701904296875, "global_step": 382706, "epoch": 4610} {"train_loss": -26.744531631469727, "global_step": 382707, "epoch": 4610} {"train_loss": -26.66779899597168, "global_step": 382708, "epoch": 4610} {"train_loss": -26.642333984375, "global_step": 382709, "epoch": 4610} {"train_loss": -26.855070114135742, "global_step": 382710, "epoch": 4610} {"train_loss": -26.436431884765625, "global_step": 382711, "epoch": 4610} {"train_loss": -26.36839758631695, "global_step": 382712, "epoch": 4610, "val_loss": 6523913.5} {"train_loss": -25.97806167602539, "global_step": 382713, "epoch": 4611} {"train_loss": -25.76409912109375, "global_step": 382714, "epoch": 4611} {"train_loss": -25.52638816833496, "global_step": 382715, "epoch": 4611} {"train_loss": -25.854272842407227, "global_step": 382716, "epoch": 4611} {"train_loss": -26.2817325592041, "global_step": 382717, "epoch": 4611} {"train_loss": -25.732290267944336, "global_step": 382718, "epoch": 4611} {"train_loss": -26.35810661315918, "global_step": 382719, "epoch": 4611} {"train_loss": -25.846704483032227, "global_step": 382720, "epoch": 4611} {"train_loss": -26.00557518005371, "global_step": 382721, "epoch": 4611} {"train_loss": -25.706695556640625, "global_step": 382722, "epoch": 4611} {"train_loss": -25.994598388671875, "global_step": 382723, "epoch": 4611} {"train_loss": -25.778430938720703, "global_step": 382724, "epoch": 4611} {"train_loss": -26.179889678955078, "global_step": 382725, "epoch": 4611} {"train_loss": -26.298654556274414, "global_step": 382726, "epoch": 4611} {"train_loss": -26.34720230102539, "global_step": 382727, "epoch": 4611} {"train_loss": -26.272510528564453, "global_step": 382728, "epoch": 4611} {"train_loss": -26.35410499572754, "global_step": 382729, "epoch": 4611} {"train_loss": -26.10178565979004, "global_step": 382730, "epoch": 4611} {"train_loss": -26.484989166259766, "global_step": 382731, "epoch": 4611} {"train_loss": -26.132816314697266, "global_step": 382732, "epoch": 4611} {"train_loss": -26.613452911376953, "global_step": 382733, "epoch": 4611} {"train_loss": -26.19459342956543, "global_step": 382734, "epoch": 4611} {"train_loss": -26.325021743774414, "global_step": 382735, "epoch": 4611} {"train_loss": -26.328357696533203, "global_step": 382736, "epoch": 4611} {"train_loss": -26.680011749267578, "global_step": 382737, "epoch": 4611} {"train_loss": -26.373708724975586, "global_step": 382738, "epoch": 4611} {"train_loss": -26.458826065063477, "global_step": 382739, "epoch": 4611} {"train_loss": -26.67236328125, "global_step": 382740, "epoch": 4611} {"train_loss": -26.471027374267578, "global_step": 382741, "epoch": 4611} {"train_loss": -26.539020538330078, "global_step": 382742, "epoch": 4611} {"train_loss": -26.33711814880371, "global_step": 382743, "epoch": 4611} {"train_loss": -26.70418357849121, "global_step": 382744, "epoch": 4611} {"train_loss": -26.242456436157227, "global_step": 382745, "epoch": 4611} {"train_loss": -26.420902252197266, "global_step": 382746, "epoch": 4611} {"train_loss": -26.92286491394043, "global_step": 382747, "epoch": 4611} {"train_loss": -26.337970733642578, "global_step": 382748, "epoch": 4611} {"train_loss": -26.51626968383789, "global_step": 382749, "epoch": 4611} {"train_loss": -26.707406997680664, "global_step": 382750, "epoch": 4611} {"train_loss": -26.220624923706055, "global_step": 382751, "epoch": 4611} {"train_loss": -26.299673080444336, "global_step": 382752, "epoch": 4611} {"train_loss": -26.1052188873291, "global_step": 382753, "epoch": 4611} {"train_loss": -26.549224853515625, "global_step": 382754, "epoch": 4611} {"train_loss": -26.842374801635742, "global_step": 382755, "epoch": 4611} {"train_loss": -26.828649520874023, "global_step": 382756, "epoch": 4611} {"train_loss": -26.71780776977539, "global_step": 382757, "epoch": 4611} {"train_loss": -26.52469253540039, "global_step": 382758, "epoch": 4611} {"train_loss": -26.4622859954834, "global_step": 382759, "epoch": 4611} {"train_loss": -26.55167579650879, "global_step": 382760, "epoch": 4611} {"train_loss": -26.37627601623535, "global_step": 382761, "epoch": 4611} {"train_loss": -26.80951499938965, "global_step": 382762, "epoch": 4611} {"train_loss": -26.585004806518555, "global_step": 382763, "epoch": 4611} {"train_loss": -26.575504302978516, "global_step": 382764, "epoch": 4611} {"train_loss": -26.425867080688477, "global_step": 382765, "epoch": 4611} {"train_loss": -26.424163818359375, "global_step": 382766, "epoch": 4611} {"train_loss": -26.3236026763916, "global_step": 382767, "epoch": 4611} {"train_loss": -26.30338478088379, "global_step": 382768, "epoch": 4611} {"train_loss": -26.5318660736084, "global_step": 382769, "epoch": 4611} {"train_loss": -26.470905303955078, "global_step": 382770, "epoch": 4611} {"train_loss": -26.636402130126953, "global_step": 382771, "epoch": 4611} {"train_loss": -26.5461483001709, "global_step": 382772, "epoch": 4611} {"train_loss": -26.879552841186523, "global_step": 382773, "epoch": 4611} {"train_loss": -26.859272003173828, "global_step": 382774, "epoch": 4611} {"train_loss": -26.59760856628418, "global_step": 382775, "epoch": 4611} {"train_loss": -27.134435653686523, "global_step": 382776, "epoch": 4611} {"train_loss": -26.52032470703125, "global_step": 382777, "epoch": 4611} {"train_loss": -26.565587997436523, "global_step": 382778, "epoch": 4611} {"train_loss": -26.79509925842285, "global_step": 382779, "epoch": 4611} {"train_loss": -26.576467514038086, "global_step": 382780, "epoch": 4611} {"train_loss": -26.769323348999023, "global_step": 382781, "epoch": 4611} {"train_loss": -26.867233276367188, "global_step": 382782, "epoch": 4611} {"train_loss": -26.5154972076416, "global_step": 382783, "epoch": 4611} {"train_loss": -26.324996948242188, "global_step": 382784, "epoch": 4611} {"train_loss": -26.404157638549805, "global_step": 382785, "epoch": 4611} {"train_loss": -26.144515991210938, "global_step": 382786, "epoch": 4611} {"train_loss": -26.5862979888916, "global_step": 382787, "epoch": 4611} {"train_loss": -26.545923233032227, "global_step": 382788, "epoch": 4611} {"train_loss": -26.6514835357666, "global_step": 382789, "epoch": 4611} {"train_loss": -26.400365829467773, "global_step": 382790, "epoch": 4611} {"train_loss": -26.621112823486328, "global_step": 382791, "epoch": 4611} {"train_loss": -26.29248046875, "global_step": 382792, "epoch": 4611} {"train_loss": -26.387176513671875, "global_step": 382793, "epoch": 4611} {"train_loss": -26.482961654663086, "global_step": 382794, "epoch": 4611} {"train_loss": -26.388950278960078, "global_step": 382795, "epoch": 4611, "val_loss": 6716973.0} {"train_loss": -25.88761329650879, "global_step": 382796, "epoch": 4612} {"train_loss": -23.471527099609375, "global_step": 382797, "epoch": 4612} {"train_loss": -22.26714324951172, "global_step": 382798, "epoch": 4612} {"train_loss": -24.78156089782715, "global_step": 382799, "epoch": 4612} {"train_loss": -25.37502670288086, "global_step": 382800, "epoch": 4612} {"train_loss": -24.24943733215332, "global_step": 382801, "epoch": 4612} {"train_loss": -25.54689598083496, "global_step": 382802, "epoch": 4612} {"train_loss": -25.010053634643555, "global_step": 382803, "epoch": 4612} {"train_loss": -25.43316078186035, "global_step": 382804, "epoch": 4612} {"train_loss": -26.060123443603516, "global_step": 382805, "epoch": 4612} {"train_loss": -25.194074630737305, "global_step": 382806, "epoch": 4612} {"train_loss": -25.315601348876953, "global_step": 382807, "epoch": 4612} {"train_loss": -25.91975975036621, "global_step": 382808, "epoch": 4612} {"train_loss": -25.715909957885742, "global_step": 382809, "epoch": 4612} {"train_loss": -25.602676391601562, "global_step": 382810, "epoch": 4612} {"train_loss": -25.867685317993164, "global_step": 382811, "epoch": 4612} {"train_loss": -25.751306533813477, "global_step": 382812, "epoch": 4612} {"train_loss": -25.562788009643555, "global_step": 382813, "epoch": 4612} {"train_loss": -25.3804874420166, "global_step": 382814, "epoch": 4612} {"train_loss": -25.538291931152344, "global_step": 382815, "epoch": 4612} {"train_loss": -25.59143829345703, "global_step": 382816, "epoch": 4612} {"train_loss": -25.869531631469727, "global_step": 382817, "epoch": 4612} {"train_loss": -25.741790771484375, "global_step": 382818, "epoch": 4612} {"train_loss": -25.928003311157227, "global_step": 382819, "epoch": 4612} {"train_loss": -25.77739906311035, "global_step": 382820, "epoch": 4612} {"train_loss": -25.784772872924805, "global_step": 382821, "epoch": 4612} {"train_loss": -26.217432022094727, "global_step": 382822, "epoch": 4612} {"train_loss": -25.983625411987305, "global_step": 382823, "epoch": 4612} {"train_loss": -26.150604248046875, "global_step": 382824, "epoch": 4612} {"train_loss": -26.097753524780273, "global_step": 382825, "epoch": 4612} {"train_loss": -25.995569229125977, "global_step": 382826, "epoch": 4612} {"train_loss": -26.199848175048828, "global_step": 382827, "epoch": 4612} {"train_loss": -26.079803466796875, "global_step": 382828, "epoch": 4612} {"train_loss": -26.0469913482666, "global_step": 382829, "epoch": 4612} {"train_loss": -26.226232528686523, "global_step": 382830, "epoch": 4612} {"train_loss": -26.472497940063477, "global_step": 382831, "epoch": 4612} {"train_loss": -26.158878326416016, "global_step": 382832, "epoch": 4612} {"train_loss": -26.1978702545166, "global_step": 382833, "epoch": 4612} {"train_loss": -26.774316787719727, "global_step": 382834, "epoch": 4612} {"train_loss": -26.652780532836914, "global_step": 382835, "epoch": 4612} {"train_loss": -26.570524215698242, "global_step": 382836, "epoch": 4612} {"train_loss": -26.194082260131836, "global_step": 382837, "epoch": 4612} {"train_loss": -26.694189071655273, "global_step": 382838, "epoch": 4612} {"train_loss": -26.478321075439453, "global_step": 382839, "epoch": 4612} {"train_loss": -26.24603843688965, "global_step": 382840, "epoch": 4612} {"train_loss": -26.68115234375, "global_step": 382841, "epoch": 4612} {"train_loss": -26.65797233581543, "global_step": 382842, "epoch": 4612} {"train_loss": -26.425622940063477, "global_step": 382843, "epoch": 4612} {"train_loss": -26.599781036376953, "global_step": 382844, "epoch": 4612} {"train_loss": -26.614850997924805, "global_step": 382845, "epoch": 4612} {"train_loss": -26.828969955444336, "global_step": 382846, "epoch": 4612} {"train_loss": -26.786802291870117, "global_step": 382847, "epoch": 4612} {"train_loss": -26.555700302124023, "global_step": 382848, "epoch": 4612} {"train_loss": -26.36689567565918, "global_step": 382849, "epoch": 4612} {"train_loss": -26.737445831298828, "global_step": 382850, "epoch": 4612} {"train_loss": -26.539081573486328, "global_step": 382851, "epoch": 4612} {"train_loss": -26.64401626586914, "global_step": 382852, "epoch": 4612} {"train_loss": -26.725622177124023, "global_step": 382853, "epoch": 4612} {"train_loss": -26.655094146728516, "global_step": 382854, "epoch": 4612} {"train_loss": -26.5882625579834, "global_step": 382855, "epoch": 4612} {"train_loss": -26.578954696655273, "global_step": 382856, "epoch": 4612} {"train_loss": -26.548664093017578, "global_step": 382857, "epoch": 4612} {"train_loss": -26.766895294189453, "global_step": 382858, "epoch": 4612} {"train_loss": -26.697431564331055, "global_step": 382859, "epoch": 4612} {"train_loss": -25.9985294342041, "global_step": 382860, "epoch": 4612} {"train_loss": -26.245288848876953, "global_step": 382861, "epoch": 4612} {"train_loss": -26.443729400634766, "global_step": 382862, "epoch": 4612} {"train_loss": -26.03436279296875, "global_step": 382863, "epoch": 4612} {"train_loss": -26.484846115112305, "global_step": 382864, "epoch": 4612} {"train_loss": -25.907764434814453, "global_step": 382865, "epoch": 4612} {"train_loss": -26.112060546875, "global_step": 382866, "epoch": 4612} {"train_loss": -26.06207275390625, "global_step": 382867, "epoch": 4612} {"train_loss": -25.6303768157959, "global_step": 382868, "epoch": 4612} {"train_loss": -25.98944091796875, "global_step": 382869, "epoch": 4612} {"train_loss": -26.249277114868164, "global_step": 382870, "epoch": 4612} {"train_loss": -26.008136749267578, "global_step": 382871, "epoch": 4612} {"train_loss": -26.43814468383789, "global_step": 382872, "epoch": 4612} {"train_loss": -25.96183204650879, "global_step": 382873, "epoch": 4612} {"train_loss": -26.506250381469727, "global_step": 382874, "epoch": 4612} {"train_loss": -26.5416202545166, "global_step": 382875, "epoch": 4612} {"train_loss": -26.19158935546875, "global_step": 382876, "epoch": 4612} {"train_loss": -26.6137752532959, "global_step": 382877, "epoch": 4612} {"train_loss": -26.031921455659063, "global_step": 382878, "epoch": 4612, "val_loss": 6639352.0} {"train_loss": -25.95425796508789, "global_step": 382879, "epoch": 4613} {"train_loss": -26.212894439697266, "global_step": 382880, "epoch": 4613} {"train_loss": -26.028913497924805, "global_step": 382881, "epoch": 4613} {"train_loss": -26.30023193359375, "global_step": 382882, "epoch": 4613} {"train_loss": -25.7846736907959, "global_step": 382883, "epoch": 4613} {"train_loss": -25.974836349487305, "global_step": 382884, "epoch": 4613} {"train_loss": -25.54836082458496, "global_step": 382885, "epoch": 4613} {"train_loss": -26.58170509338379, "global_step": 382886, "epoch": 4613} {"train_loss": -26.27890968322754, "global_step": 382887, "epoch": 4613} {"train_loss": -26.20149040222168, "global_step": 382888, "epoch": 4613} {"train_loss": -26.50483512878418, "global_step": 382889, "epoch": 4613} {"train_loss": -26.03839111328125, "global_step": 382890, "epoch": 4613} {"train_loss": -26.189422607421875, "global_step": 382891, "epoch": 4613} {"train_loss": -26.48508644104004, "global_step": 382892, "epoch": 4613} {"train_loss": -26.252851486206055, "global_step": 382893, "epoch": 4613} {"train_loss": -26.22614860534668, "global_step": 382894, "epoch": 4613} {"train_loss": -26.32813835144043, "global_step": 382895, "epoch": 4613} {"train_loss": -26.342456817626953, "global_step": 382896, "epoch": 4613} {"train_loss": -26.061792373657227, "global_step": 382897, "epoch": 4613} {"train_loss": -26.530471801757812, "global_step": 382898, "epoch": 4613} {"train_loss": -26.39080238342285, "global_step": 382899, "epoch": 4613} {"train_loss": -26.650882720947266, "global_step": 382900, "epoch": 4613} {"train_loss": -26.393842697143555, "global_step": 382901, "epoch": 4613} {"train_loss": -26.74481201171875, "global_step": 382902, "epoch": 4613} {"train_loss": -26.456933975219727, "global_step": 382903, "epoch": 4613} {"train_loss": -26.36528968811035, "global_step": 382904, "epoch": 4613} {"train_loss": -25.890216827392578, "global_step": 382905, "epoch": 4613} {"train_loss": -26.670032501220703, "global_step": 382906, "epoch": 4613} {"train_loss": -26.649677276611328, "global_step": 382907, "epoch": 4613} {"train_loss": -26.607023239135742, "global_step": 382908, "epoch": 4613} {"train_loss": -26.37162208557129, "global_step": 382909, "epoch": 4613} {"train_loss": -26.268796920776367, "global_step": 382910, "epoch": 4613} {"train_loss": -26.48444938659668, "global_step": 382911, "epoch": 4613} {"train_loss": -25.926319122314453, "global_step": 382912, "epoch": 4613} {"train_loss": -26.16128921508789, "global_step": 382913, "epoch": 4613} {"train_loss": -25.705921173095703, "global_step": 382914, "epoch": 4613} {"train_loss": -26.38686180114746, "global_step": 382915, "epoch": 4613} {"train_loss": -26.459836959838867, "global_step": 382916, "epoch": 4613} {"train_loss": -26.951810836791992, "global_step": 382917, "epoch": 4613} {"train_loss": -26.660253524780273, "global_step": 382918, "epoch": 4613} {"train_loss": -26.299102783203125, "global_step": 382919, "epoch": 4613} {"train_loss": -26.234582901000977, "global_step": 382920, "epoch": 4613} {"train_loss": -26.21341323852539, "global_step": 382921, "epoch": 4613} {"train_loss": -26.4759521484375, "global_step": 382922, "epoch": 4613} {"train_loss": -26.57307243347168, "global_step": 382923, "epoch": 4613} {"train_loss": -26.288801193237305, "global_step": 382924, "epoch": 4613} {"train_loss": -26.438180923461914, "global_step": 382925, "epoch": 4613} {"train_loss": -26.149194717407227, "global_step": 382926, "epoch": 4613} {"train_loss": -26.192697525024414, "global_step": 382927, "epoch": 4613} {"train_loss": -26.374181747436523, "global_step": 382928, "epoch": 4613} {"train_loss": -26.38818359375, "global_step": 382929, "epoch": 4613} {"train_loss": -26.550811767578125, "global_step": 382930, "epoch": 4613} {"train_loss": -26.396032333374023, "global_step": 382931, "epoch": 4613} {"train_loss": -26.896270751953125, "global_step": 382932, "epoch": 4613} {"train_loss": -26.625730514526367, "global_step": 382933, "epoch": 4613} {"train_loss": -26.78675651550293, "global_step": 382934, "epoch": 4613} {"train_loss": -26.712512969970703, "global_step": 382935, "epoch": 4613} {"train_loss": -26.520017623901367, "global_step": 382936, "epoch": 4613} {"train_loss": -26.35420799255371, "global_step": 382937, "epoch": 4613} {"train_loss": -26.402917861938477, "global_step": 382938, "epoch": 4613} {"train_loss": -26.434436798095703, "global_step": 382939, "epoch": 4613} {"train_loss": -26.702350616455078, "global_step": 382940, "epoch": 4613} {"train_loss": -26.350147247314453, "global_step": 382941, "epoch": 4613} {"train_loss": -26.4271183013916, "global_step": 382942, "epoch": 4613} {"train_loss": -26.571622848510742, "global_step": 382943, "epoch": 4613} {"train_loss": -26.68002700805664, "global_step": 382944, "epoch": 4613} {"train_loss": -26.40903091430664, "global_step": 382945, "epoch": 4613} {"train_loss": -26.511585235595703, "global_step": 382946, "epoch": 4613} {"train_loss": -26.199554443359375, "global_step": 382947, "epoch": 4613} {"train_loss": -26.620031356811523, "global_step": 382948, "epoch": 4613} {"train_loss": -26.480133056640625, "global_step": 382949, "epoch": 4613} {"train_loss": -26.6995792388916, "global_step": 382950, "epoch": 4613} {"train_loss": -26.258779525756836, "global_step": 382951, "epoch": 4613} {"train_loss": -26.663583755493164, "global_step": 382952, "epoch": 4613} {"train_loss": -26.24008560180664, "global_step": 382953, "epoch": 4613} {"train_loss": -27.138269424438477, "global_step": 382954, "epoch": 4613} {"train_loss": -26.490442276000977, "global_step": 382955, "epoch": 4613} {"train_loss": -26.948328018188477, "global_step": 382956, "epoch": 4613} {"train_loss": -26.506210327148438, "global_step": 382957, "epoch": 4613} {"train_loss": -26.36140251159668, "global_step": 382958, "epoch": 4613} {"train_loss": -26.97865867614746, "global_step": 382959, "epoch": 4613} {"train_loss": -26.29386329650879, "global_step": 382960, "epoch": 4613} {"train_loss": -26.38186149137566, "global_step": 382961, "epoch": 4613, "val_loss": 6606918.0} {"train_loss": -25.053319931030273, "global_step": 382962, "epoch": 4614} {"train_loss": -25.60590934753418, "global_step": 382963, "epoch": 4614} {"train_loss": -25.98724937438965, "global_step": 382964, "epoch": 4614} {"train_loss": -26.012548446655273, "global_step": 382965, "epoch": 4614} {"train_loss": -26.15280532836914, "global_step": 382966, "epoch": 4614} {"train_loss": -25.835296630859375, "global_step": 382967, "epoch": 4614} {"train_loss": -25.893102645874023, "global_step": 382968, "epoch": 4614} {"train_loss": -25.86751365661621, "global_step": 382969, "epoch": 4614} {"train_loss": -25.806196212768555, "global_step": 382970, "epoch": 4614} {"train_loss": -26.017017364501953, "global_step": 382971, "epoch": 4614} {"train_loss": -26.1811580657959, "global_step": 382972, "epoch": 4614} {"train_loss": -25.901782989501953, "global_step": 382973, "epoch": 4614} {"train_loss": -26.12955093383789, "global_step": 382974, "epoch": 4614} {"train_loss": -26.27482032775879, "global_step": 382975, "epoch": 4614} {"train_loss": -26.128324508666992, "global_step": 382976, "epoch": 4614} {"train_loss": -26.4613094329834, "global_step": 382977, "epoch": 4614} {"train_loss": -26.066736221313477, "global_step": 382978, "epoch": 4614} {"train_loss": -26.42624855041504, "global_step": 382979, "epoch": 4614} {"train_loss": -26.33279800415039, "global_step": 382980, "epoch": 4614} {"train_loss": -26.351001739501953, "global_step": 382981, "epoch": 4614} {"train_loss": -26.39520263671875, "global_step": 382982, "epoch": 4614} {"train_loss": -26.486499786376953, "global_step": 382983, "epoch": 4614} {"train_loss": -26.392353057861328, "global_step": 382984, "epoch": 4614} {"train_loss": -26.551733016967773, "global_step": 382985, "epoch": 4614} {"train_loss": -26.1826114654541, "global_step": 382986, "epoch": 4614} {"train_loss": -26.435277938842773, "global_step": 382987, "epoch": 4614} {"train_loss": -26.2940673828125, "global_step": 382988, "epoch": 4614} {"train_loss": -26.75306510925293, "global_step": 382989, "epoch": 4614} {"train_loss": -26.545303344726562, "global_step": 382990, "epoch": 4614} {"train_loss": -26.531030654907227, "global_step": 382991, "epoch": 4614} {"train_loss": -26.334930419921875, "global_step": 382992, "epoch": 4614} {"train_loss": -26.460901260375977, "global_step": 382993, "epoch": 4614} {"train_loss": -26.682737350463867, "global_step": 382994, "epoch": 4614} {"train_loss": -26.485870361328125, "global_step": 382995, "epoch": 4614} {"train_loss": -26.414630889892578, "global_step": 382996, "epoch": 4614} {"train_loss": -26.382902145385742, "global_step": 382997, "epoch": 4614} {"train_loss": -26.587995529174805, "global_step": 382998, "epoch": 4614} {"train_loss": -26.62598991394043, "global_step": 382999, "epoch": 4614} {"train_loss": -26.145233154296875, "global_step": 383000, "epoch": 4614} {"train_loss": -26.620655059814453, "global_step": 383001, "epoch": 4614} {"train_loss": -26.625595092773438, "global_step": 383002, "epoch": 4614} {"train_loss": -26.236618041992188, "global_step": 383003, "epoch": 4614} {"train_loss": -26.544565200805664, "global_step": 383004, "epoch": 4614} {"train_loss": -26.73382568359375, "global_step": 383005, "epoch": 4614} {"train_loss": -26.423154830932617, "global_step": 383006, "epoch": 4614} {"train_loss": -26.321624755859375, "global_step": 383007, "epoch": 4614} {"train_loss": -26.331268310546875, "global_step": 383008, "epoch": 4614} {"train_loss": -26.63720703125, "global_step": 383009, "epoch": 4614} {"train_loss": -26.60926628112793, "global_step": 383010, "epoch": 4614} {"train_loss": -26.759546279907227, "global_step": 383011, "epoch": 4614} {"train_loss": -26.754003524780273, "global_step": 383012, "epoch": 4614} {"train_loss": -26.383625030517578, "global_step": 383013, "epoch": 4614} {"train_loss": -26.384313583374023, "global_step": 383014, "epoch": 4614} {"train_loss": -26.550931930541992, "global_step": 383015, "epoch": 4614} {"train_loss": -26.3837947845459, "global_step": 383016, "epoch": 4614} {"train_loss": -26.62383460998535, "global_step": 383017, "epoch": 4614} {"train_loss": -26.72017478942871, "global_step": 383018, "epoch": 4614} {"train_loss": -26.333906173706055, "global_step": 383019, "epoch": 4614} {"train_loss": -26.708166122436523, "global_step": 383020, "epoch": 4614} {"train_loss": -27.0308895111084, "global_step": 383021, "epoch": 4614} {"train_loss": -26.27520751953125, "global_step": 383022, "epoch": 4614} {"train_loss": -26.699874877929688, "global_step": 383023, "epoch": 4614} {"train_loss": -26.238859176635742, "global_step": 383024, "epoch": 4614} {"train_loss": -26.365009307861328, "global_step": 383025, "epoch": 4614} {"train_loss": -26.684467315673828, "global_step": 383026, "epoch": 4614} {"train_loss": -26.868194580078125, "global_step": 383027, "epoch": 4614} {"train_loss": -26.489959716796875, "global_step": 383028, "epoch": 4614} {"train_loss": -26.354867935180664, "global_step": 383029, "epoch": 4614} {"train_loss": -26.46659278869629, "global_step": 383030, "epoch": 4614} {"train_loss": -26.80987548828125, "global_step": 383031, "epoch": 4614} {"train_loss": -26.50946617126465, "global_step": 383032, "epoch": 4614} {"train_loss": -26.266279220581055, "global_step": 383033, "epoch": 4614} {"train_loss": -26.53619956970215, "global_step": 383034, "epoch": 4614} {"train_loss": -26.078189849853516, "global_step": 383035, "epoch": 4614} {"train_loss": -26.362594604492188, "global_step": 383036, "epoch": 4614} {"train_loss": -26.51447105407715, "global_step": 383037, "epoch": 4614} {"train_loss": -26.73603630065918, "global_step": 383038, "epoch": 4614} {"train_loss": -25.91156578063965, "global_step": 383039, "epoch": 4614} {"train_loss": -25.769418716430664, "global_step": 383040, "epoch": 4614} {"train_loss": -26.395212173461914, "global_step": 383041, "epoch": 4614} {"train_loss": -26.772369384765625, "global_step": 383042, "epoch": 4614} {"train_loss": -26.100366592407227, "global_step": 383043, "epoch": 4614} {"train_loss": -26.36317917237799, "global_step": 383044, "epoch": 4614, "val_loss": 6550032.0} {"train_loss": -26.03670310974121, "global_step": 383045, "epoch": 4615} {"train_loss": -25.94097328186035, "global_step": 383046, "epoch": 4615} {"train_loss": -25.993885040283203, "global_step": 383047, "epoch": 4615} {"train_loss": -26.043725967407227, "global_step": 383048, "epoch": 4615} {"train_loss": -25.754892349243164, "global_step": 383049, "epoch": 4615} {"train_loss": -26.25459098815918, "global_step": 383050, "epoch": 4615} {"train_loss": -26.209030151367188, "global_step": 383051, "epoch": 4615} {"train_loss": -26.346118927001953, "global_step": 383052, "epoch": 4615} {"train_loss": -26.366147994995117, "global_step": 383053, "epoch": 4615} {"train_loss": -26.556976318359375, "global_step": 383054, "epoch": 4615} {"train_loss": -25.792348861694336, "global_step": 383055, "epoch": 4615} {"train_loss": -25.974348068237305, "global_step": 383056, "epoch": 4615} {"train_loss": -25.83782386779785, "global_step": 383057, "epoch": 4615} {"train_loss": -26.3043155670166, "global_step": 383058, "epoch": 4615} {"train_loss": -25.99745750427246, "global_step": 383059, "epoch": 4615} {"train_loss": -26.07110023498535, "global_step": 383060, "epoch": 4615} {"train_loss": -26.263538360595703, "global_step": 383061, "epoch": 4615} {"train_loss": -26.278583526611328, "global_step": 383062, "epoch": 4615} {"train_loss": -26.19806480407715, "global_step": 383063, "epoch": 4615} {"train_loss": -26.1384220123291, "global_step": 383064, "epoch": 4615} {"train_loss": -26.3177547454834, "global_step": 383065, "epoch": 4615} {"train_loss": -26.43878746032715, "global_step": 383066, "epoch": 4615} {"train_loss": -26.22260093688965, "global_step": 383067, "epoch": 4615} {"train_loss": -26.484710693359375, "global_step": 383068, "epoch": 4615} {"train_loss": -26.477432250976562, "global_step": 383069, "epoch": 4615} {"train_loss": -26.23736000061035, "global_step": 383070, "epoch": 4615} {"train_loss": -26.4066104888916, "global_step": 383071, "epoch": 4615} {"train_loss": -26.205652236938477, "global_step": 383072, "epoch": 4615} {"train_loss": -26.77587890625, "global_step": 383073, "epoch": 4615} {"train_loss": -26.023212432861328, "global_step": 383074, "epoch": 4615} {"train_loss": -26.399051666259766, "global_step": 383075, "epoch": 4615} {"train_loss": -26.20635986328125, "global_step": 383076, "epoch": 4615} {"train_loss": -26.4085636138916, "global_step": 383077, "epoch": 4615} {"train_loss": -26.513696670532227, "global_step": 383078, "epoch": 4615} {"train_loss": -26.70975685119629, "global_step": 383079, "epoch": 4615} {"train_loss": -26.49648094177246, "global_step": 383080, "epoch": 4615} {"train_loss": -26.441625595092773, "global_step": 383081, "epoch": 4615} {"train_loss": -26.6649169921875, "global_step": 383082, "epoch": 4615} {"train_loss": -26.674097061157227, "global_step": 383083, "epoch": 4615} {"train_loss": -26.526700973510742, "global_step": 383084, "epoch": 4615} {"train_loss": -26.09351921081543, "global_step": 383085, "epoch": 4615} {"train_loss": -26.51358413696289, "global_step": 383086, "epoch": 4615} {"train_loss": -26.738210678100586, "global_step": 383087, "epoch": 4615} {"train_loss": -26.38483238220215, "global_step": 383088, "epoch": 4615} {"train_loss": -26.593204498291016, "global_step": 383089, "epoch": 4615} {"train_loss": -26.65571403503418, "global_step": 383090, "epoch": 4615} {"train_loss": -26.717817306518555, "global_step": 383091, "epoch": 4615} {"train_loss": -26.464736938476562, "global_step": 383092, "epoch": 4615} {"train_loss": -26.903844833374023, "global_step": 383093, "epoch": 4615} {"train_loss": -26.4666805267334, "global_step": 383094, "epoch": 4615} {"train_loss": -26.66510009765625, "global_step": 383095, "epoch": 4615} {"train_loss": -27.004745483398438, "global_step": 383096, "epoch": 4615} {"train_loss": -26.631574630737305, "global_step": 383097, "epoch": 4615} {"train_loss": -26.259048461914062, "global_step": 383098, "epoch": 4615} {"train_loss": -26.411773681640625, "global_step": 383099, "epoch": 4615} {"train_loss": -26.20926856994629, "global_step": 383100, "epoch": 4615} {"train_loss": -26.671817779541016, "global_step": 383101, "epoch": 4615} {"train_loss": -26.5938777923584, "global_step": 383102, "epoch": 4615} {"train_loss": -26.569751739501953, "global_step": 383103, "epoch": 4615} {"train_loss": -26.623868942260742, "global_step": 383104, "epoch": 4615} {"train_loss": -26.588851928710938, "global_step": 383105, "epoch": 4615} {"train_loss": -26.7793025970459, "global_step": 383106, "epoch": 4615} {"train_loss": -26.595504760742188, "global_step": 383107, "epoch": 4615} {"train_loss": -26.570775985717773, "global_step": 383108, "epoch": 4615} {"train_loss": -26.381366729736328, "global_step": 383109, "epoch": 4615} {"train_loss": -26.616647720336914, "global_step": 383110, "epoch": 4615} {"train_loss": -26.72564697265625, "global_step": 383111, "epoch": 4615} {"train_loss": -26.616363525390625, "global_step": 383112, "epoch": 4615} {"train_loss": -27.005523681640625, "global_step": 383113, "epoch": 4615} {"train_loss": -26.644855499267578, "global_step": 383114, "epoch": 4615} {"train_loss": -26.557605743408203, "global_step": 383115, "epoch": 4615} {"train_loss": -26.57832908630371, "global_step": 383116, "epoch": 4615} {"train_loss": -26.52130699157715, "global_step": 383117, "epoch": 4615} {"train_loss": -26.377161026000977, "global_step": 383118, "epoch": 4615} {"train_loss": -26.554962158203125, "global_step": 383119, "epoch": 4615} {"train_loss": -26.52141761779785, "global_step": 383120, "epoch": 4615} {"train_loss": -26.3438663482666, "global_step": 383121, "epoch": 4615} {"train_loss": -26.366724014282227, "global_step": 383122, "epoch": 4615} {"train_loss": -26.575897216796875, "global_step": 383123, "epoch": 4615} {"train_loss": -26.451642990112305, "global_step": 383124, "epoch": 4615} {"train_loss": -26.48284339904785, "global_step": 383125, "epoch": 4615} {"train_loss": -26.77543067932129, "global_step": 383126, "epoch": 4615} {"train_loss": -26.430738632937512, "global_step": 383127, "epoch": 4615, "val_loss": 6668960.0} {"train_loss": -26.2330265045166, "global_step": 383128, "epoch": 4616} {"train_loss": -26.430450439453125, "global_step": 383129, "epoch": 4616} {"train_loss": -26.278196334838867, "global_step": 383130, "epoch": 4616} {"train_loss": -26.516021728515625, "global_step": 383131, "epoch": 4616} {"train_loss": -26.52436637878418, "global_step": 383132, "epoch": 4616} {"train_loss": -25.99295425415039, "global_step": 383133, "epoch": 4616} {"train_loss": -26.58551025390625, "global_step": 383134, "epoch": 4616} {"train_loss": -26.5372257232666, "global_step": 383135, "epoch": 4616} {"train_loss": -26.636571884155273, "global_step": 383136, "epoch": 4616} {"train_loss": -26.408950805664062, "global_step": 383137, "epoch": 4616} {"train_loss": -26.459671020507812, "global_step": 383138, "epoch": 4616} {"train_loss": -26.66815757751465, "global_step": 383139, "epoch": 4616} {"train_loss": -26.423114776611328, "global_step": 383140, "epoch": 4616} {"train_loss": -26.2757511138916, "global_step": 383141, "epoch": 4616} {"train_loss": -26.83935546875, "global_step": 383142, "epoch": 4616} {"train_loss": -26.7437801361084, "global_step": 383143, "epoch": 4616} {"train_loss": -26.594715118408203, "global_step": 383144, "epoch": 4616} {"train_loss": -26.263349533081055, "global_step": 383145, "epoch": 4616} {"train_loss": -26.641199111938477, "global_step": 383146, "epoch": 4616} {"train_loss": -26.531415939331055, "global_step": 383147, "epoch": 4616} {"train_loss": -26.308032989501953, "global_step": 383148, "epoch": 4616} {"train_loss": -26.652647018432617, "global_step": 383149, "epoch": 4616} {"train_loss": -26.587926864624023, "global_step": 383150, "epoch": 4616} {"train_loss": -26.625930786132812, "global_step": 383151, "epoch": 4616} {"train_loss": -26.653162002563477, "global_step": 383152, "epoch": 4616} {"train_loss": -26.478107452392578, "global_step": 383153, "epoch": 4616} {"train_loss": -26.546005249023438, "global_step": 383154, "epoch": 4616} {"train_loss": -26.7849178314209, "global_step": 383155, "epoch": 4616} {"train_loss": -26.557382583618164, "global_step": 383156, "epoch": 4616} {"train_loss": -26.71533203125, "global_step": 383157, "epoch": 4616} {"train_loss": -26.70734977722168, "global_step": 383158, "epoch": 4616} {"train_loss": -26.474212646484375, "global_step": 383159, "epoch": 4616} {"train_loss": -26.417011260986328, "global_step": 383160, "epoch": 4616} {"train_loss": -26.267108917236328, "global_step": 383161, "epoch": 4616} {"train_loss": -26.237939834594727, "global_step": 383162, "epoch": 4616} {"train_loss": -26.44671630859375, "global_step": 383163, "epoch": 4616} {"train_loss": -26.424671173095703, "global_step": 383164, "epoch": 4616} {"train_loss": -26.857074737548828, "global_step": 383165, "epoch": 4616} {"train_loss": -26.752338409423828, "global_step": 383166, "epoch": 4616} {"train_loss": -26.75971794128418, "global_step": 383167, "epoch": 4616} {"train_loss": -26.751001358032227, "global_step": 383168, "epoch": 4616} {"train_loss": -26.385257720947266, "global_step": 383169, "epoch": 4616} {"train_loss": -26.652542114257812, "global_step": 383170, "epoch": 4616} {"train_loss": -26.338214874267578, "global_step": 383171, "epoch": 4616} {"train_loss": -26.70929527282715, "global_step": 383172, "epoch": 4616} {"train_loss": -26.607192993164062, "global_step": 383173, "epoch": 4616} {"train_loss": -26.66865348815918, "global_step": 383174, "epoch": 4616} {"train_loss": -26.824430465698242, "global_step": 383175, "epoch": 4616} {"train_loss": -26.47537612915039, "global_step": 383176, "epoch": 4616} {"train_loss": -26.72507095336914, "global_step": 383177, "epoch": 4616} {"train_loss": -26.409696578979492, "global_step": 383178, "epoch": 4616} {"train_loss": -26.477161407470703, "global_step": 383179, "epoch": 4616} {"train_loss": -26.530170440673828, "global_step": 383180, "epoch": 4616} {"train_loss": -26.76826286315918, "global_step": 383181, "epoch": 4616} {"train_loss": -26.618518829345703, "global_step": 383182, "epoch": 4616} {"train_loss": -26.856077194213867, "global_step": 383183, "epoch": 4616} {"train_loss": -26.620574951171875, "global_step": 383184, "epoch": 4616} {"train_loss": -26.41236686706543, "global_step": 383185, "epoch": 4616} {"train_loss": -26.493589401245117, "global_step": 383186, "epoch": 4616} {"train_loss": -26.3622989654541, "global_step": 383187, "epoch": 4616} {"train_loss": -26.187047958374023, "global_step": 383188, "epoch": 4616} {"train_loss": -26.38510513305664, "global_step": 383189, "epoch": 4616} {"train_loss": -26.592105865478516, "global_step": 383190, "epoch": 4616} {"train_loss": -26.711811065673828, "global_step": 383191, "epoch": 4616} {"train_loss": -26.33185386657715, "global_step": 383192, "epoch": 4616} {"train_loss": -26.44309425354004, "global_step": 383193, "epoch": 4616} {"train_loss": -26.72723388671875, "global_step": 383194, "epoch": 4616} {"train_loss": -26.46674156188965, "global_step": 383195, "epoch": 4616} {"train_loss": -26.425146102905273, "global_step": 383196, "epoch": 4616} {"train_loss": -26.321969985961914, "global_step": 383197, "epoch": 4616} {"train_loss": -26.675390243530273, "global_step": 383198, "epoch": 4616} {"train_loss": -26.53128433227539, "global_step": 383199, "epoch": 4616} {"train_loss": -26.594924926757812, "global_step": 383200, "epoch": 4616} {"train_loss": -26.406179428100586, "global_step": 383201, "epoch": 4616} {"train_loss": -26.59454917907715, "global_step": 383202, "epoch": 4616} {"train_loss": -26.651859283447266, "global_step": 383203, "epoch": 4616} {"train_loss": -26.35906982421875, "global_step": 383204, "epoch": 4616} {"train_loss": -26.328039169311523, "global_step": 383205, "epoch": 4616} {"train_loss": -26.20868492126465, "global_step": 383206, "epoch": 4616} {"train_loss": -25.699920654296875, "global_step": 383207, "epoch": 4616} {"train_loss": -26.177661895751953, "global_step": 383208, "epoch": 4616} {"train_loss": -26.38577651977539, "global_step": 383209, "epoch": 4616} {"train_loss": -26.493397126714868, "global_step": 383210, "epoch": 4616, "val_loss": 6631458.0} {"train_loss": -24.97334861755371, "global_step": 383211, "epoch": 4617} {"train_loss": -24.41155242919922, "global_step": 383212, "epoch": 4617} {"train_loss": -25.87067985534668, "global_step": 383213, "epoch": 4617} {"train_loss": -24.541471481323242, "global_step": 383214, "epoch": 4617} {"train_loss": -25.228275299072266, "global_step": 383215, "epoch": 4617} {"train_loss": -25.11555290222168, "global_step": 383216, "epoch": 4617} {"train_loss": -25.098310470581055, "global_step": 383217, "epoch": 4617} {"train_loss": -24.753286361694336, "global_step": 383218, "epoch": 4617} {"train_loss": -25.772369384765625, "global_step": 383219, "epoch": 4617} {"train_loss": -25.671655654907227, "global_step": 383220, "epoch": 4617} {"train_loss": -25.714313507080078, "global_step": 383221, "epoch": 4617} {"train_loss": -26.146528244018555, "global_step": 383222, "epoch": 4617} {"train_loss": -25.821699142456055, "global_step": 383223, "epoch": 4617} {"train_loss": -26.09429931640625, "global_step": 383224, "epoch": 4617} {"train_loss": -25.977991104125977, "global_step": 383225, "epoch": 4617} {"train_loss": -25.973020553588867, "global_step": 383226, "epoch": 4617} {"train_loss": -25.59247398376465, "global_step": 383227, "epoch": 4617} {"train_loss": -26.0743408203125, "global_step": 383228, "epoch": 4617} {"train_loss": -26.16044044494629, "global_step": 383229, "epoch": 4617} {"train_loss": -25.936573028564453, "global_step": 383230, "epoch": 4617} {"train_loss": -26.350378036499023, "global_step": 383231, "epoch": 4617} {"train_loss": -26.26595115661621, "global_step": 383232, "epoch": 4617} {"train_loss": -26.010053634643555, "global_step": 383233, "epoch": 4617} {"train_loss": -25.869903564453125, "global_step": 383234, "epoch": 4617} {"train_loss": -25.991317749023438, "global_step": 383235, "epoch": 4617} {"train_loss": -26.443586349487305, "global_step": 383236, "epoch": 4617} {"train_loss": -26.115680694580078, "global_step": 383237, "epoch": 4617} {"train_loss": -26.085662841796875, "global_step": 383238, "epoch": 4617} {"train_loss": -26.03656578063965, "global_step": 383239, "epoch": 4617} {"train_loss": -26.153104782104492, "global_step": 383240, "epoch": 4617} {"train_loss": -26.364072799682617, "global_step": 383241, "epoch": 4617} {"train_loss": -26.659841537475586, "global_step": 383242, "epoch": 4617} {"train_loss": -26.345386505126953, "global_step": 383243, "epoch": 4617} {"train_loss": -25.7330265045166, "global_step": 383244, "epoch": 4617} {"train_loss": -26.61695671081543, "global_step": 383245, "epoch": 4617} {"train_loss": -26.078994750976562, "global_step": 383246, "epoch": 4617} {"train_loss": -26.380578994750977, "global_step": 383247, "epoch": 4617} {"train_loss": -26.523880004882812, "global_step": 383248, "epoch": 4617} {"train_loss": -26.169958114624023, "global_step": 383249, "epoch": 4617} {"train_loss": -26.902313232421875, "global_step": 383250, "epoch": 4617} {"train_loss": -26.714025497436523, "global_step": 383251, "epoch": 4617} {"train_loss": -26.432708740234375, "global_step": 383252, "epoch": 4617} {"train_loss": -26.941059112548828, "global_step": 383253, "epoch": 4617} {"train_loss": -26.60866355895996, "global_step": 383254, "epoch": 4617} {"train_loss": -26.795507431030273, "global_step": 383255, "epoch": 4617} {"train_loss": -26.607070922851562, "global_step": 383256, "epoch": 4617} {"train_loss": -26.692707061767578, "global_step": 383257, "epoch": 4617} {"train_loss": -26.895116806030273, "global_step": 383258, "epoch": 4617} {"train_loss": -26.374317169189453, "global_step": 383259, "epoch": 4617} {"train_loss": -26.39570426940918, "global_step": 383260, "epoch": 4617} {"train_loss": -26.604597091674805, "global_step": 383261, "epoch": 4617} {"train_loss": -26.68694496154785, "global_step": 383262, "epoch": 4617} {"train_loss": -26.352115631103516, "global_step": 383263, "epoch": 4617} {"train_loss": -27.002145767211914, "global_step": 383264, "epoch": 4617} {"train_loss": -26.64735984802246, "global_step": 383265, "epoch": 4617} {"train_loss": -26.62603187561035, "global_step": 383266, "epoch": 4617} {"train_loss": -26.641366958618164, "global_step": 383267, "epoch": 4617} {"train_loss": -26.687185287475586, "global_step": 383268, "epoch": 4617} {"train_loss": -26.18084716796875, "global_step": 383269, "epoch": 4617} {"train_loss": -26.626190185546875, "global_step": 383270, "epoch": 4617} {"train_loss": -26.723203659057617, "global_step": 383271, "epoch": 4617} {"train_loss": -26.0333251953125, "global_step": 383272, "epoch": 4617} {"train_loss": -25.35666847229004, "global_step": 383273, "epoch": 4617} {"train_loss": -26.1228084564209, "global_step": 383274, "epoch": 4617} {"train_loss": -26.09894371032715, "global_step": 383275, "epoch": 4617} {"train_loss": -26.365177154541016, "global_step": 383276, "epoch": 4617} {"train_loss": -26.345184326171875, "global_step": 383277, "epoch": 4617} {"train_loss": -26.497587203979492, "global_step": 383278, "epoch": 4617} {"train_loss": -26.237157821655273, "global_step": 383279, "epoch": 4617} {"train_loss": -26.192541122436523, "global_step": 383280, "epoch": 4617} {"train_loss": -26.315372467041016, "global_step": 383281, "epoch": 4617} {"train_loss": -26.394184112548828, "global_step": 383282, "epoch": 4617} {"train_loss": -26.394384384155273, "global_step": 383283, "epoch": 4617} {"train_loss": -26.648284912109375, "global_step": 383284, "epoch": 4617} {"train_loss": -26.73126220703125, "global_step": 383285, "epoch": 4617} {"train_loss": -26.529722213745117, "global_step": 383286, "epoch": 4617} {"train_loss": -26.07563591003418, "global_step": 383287, "epoch": 4617} {"train_loss": -26.182905197143555, "global_step": 383288, "epoch": 4617} {"train_loss": -26.473386764526367, "global_step": 383289, "epoch": 4617} {"train_loss": -26.021488189697266, "global_step": 383290, "epoch": 4617} {"train_loss": -25.877622604370117, "global_step": 383291, "epoch": 4617} {"train_loss": -26.5412654876709, "global_step": 383292, "epoch": 4617} {"train_loss": -26.189175318522626, "global_step": 383293, "epoch": 4617, "val_loss": 6616942.5} {"train_loss": -26.196531295776367, "global_step": 383294, "epoch": 4618} {"train_loss": -26.25420570373535, "global_step": 383295, "epoch": 4618} {"train_loss": -26.156782150268555, "global_step": 383296, "epoch": 4618} {"train_loss": -26.17416763305664, "global_step": 383297, "epoch": 4618} {"train_loss": -26.103195190429688, "global_step": 383298, "epoch": 4618} {"train_loss": -26.107574462890625, "global_step": 383299, "epoch": 4618} {"train_loss": -26.1546630859375, "global_step": 383300, "epoch": 4618} {"train_loss": -25.853559494018555, "global_step": 383301, "epoch": 4618} {"train_loss": -26.071674346923828, "global_step": 383302, "epoch": 4618} {"train_loss": -25.96732521057129, "global_step": 383303, "epoch": 4618} {"train_loss": -26.076459884643555, "global_step": 383304, "epoch": 4618} {"train_loss": -26.458723068237305, "global_step": 383305, "epoch": 4618} {"train_loss": -26.319543838500977, "global_step": 383306, "epoch": 4618} {"train_loss": -26.579980850219727, "global_step": 383307, "epoch": 4618} {"train_loss": -26.249372482299805, "global_step": 383308, "epoch": 4618} {"train_loss": -26.165441513061523, "global_step": 383309, "epoch": 4618} {"train_loss": -26.228519439697266, "global_step": 383310, "epoch": 4618} {"train_loss": -26.428754806518555, "global_step": 383311, "epoch": 4618} {"train_loss": -26.534503936767578, "global_step": 383312, "epoch": 4618} {"train_loss": -26.55962562561035, "global_step": 383313, "epoch": 4618} {"train_loss": -26.184162139892578, "global_step": 383314, "epoch": 4618} {"train_loss": -26.283477783203125, "global_step": 383315, "epoch": 4618} {"train_loss": -26.3525447845459, "global_step": 383316, "epoch": 4618} {"train_loss": -26.23612403869629, "global_step": 383317, "epoch": 4618} {"train_loss": -26.451007843017578, "global_step": 383318, "epoch": 4618} {"train_loss": -26.62566566467285, "global_step": 383319, "epoch": 4618} {"train_loss": -26.752628326416016, "global_step": 383320, "epoch": 4618} {"train_loss": -26.4954891204834, "global_step": 383321, "epoch": 4618} {"train_loss": -26.28509521484375, "global_step": 383322, "epoch": 4618} {"train_loss": -26.48240089416504, "global_step": 383323, "epoch": 4618} {"train_loss": -26.300220489501953, "global_step": 383324, "epoch": 4618} {"train_loss": -26.654645919799805, "global_step": 383325, "epoch": 4618} {"train_loss": -26.71250343322754, "global_step": 383326, "epoch": 4618} {"train_loss": -26.3150634765625, "global_step": 383327, "epoch": 4618} {"train_loss": -26.339609146118164, "global_step": 383328, "epoch": 4618} {"train_loss": -26.400278091430664, "global_step": 383329, "epoch": 4618} {"train_loss": -26.227252960205078, "global_step": 383330, "epoch": 4618} {"train_loss": -26.38531494140625, "global_step": 383331, "epoch": 4618} {"train_loss": -26.363386154174805, "global_step": 383332, "epoch": 4618} {"train_loss": -26.509140014648438, "global_step": 383333, "epoch": 4618} {"train_loss": -26.392980575561523, "global_step": 383334, "epoch": 4618} {"train_loss": -26.513336181640625, "global_step": 383335, "epoch": 4618} {"train_loss": -26.9957275390625, "global_step": 383336, "epoch": 4618} {"train_loss": -26.745100021362305, "global_step": 383337, "epoch": 4618} {"train_loss": -26.526121139526367, "global_step": 383338, "epoch": 4618} {"train_loss": -26.59943199157715, "global_step": 383339, "epoch": 4618} {"train_loss": -26.36931800842285, "global_step": 383340, "epoch": 4618} {"train_loss": -26.361846923828125, "global_step": 383341, "epoch": 4618} {"train_loss": -26.695621490478516, "global_step": 383342, "epoch": 4618} {"train_loss": -26.923690795898438, "global_step": 383343, "epoch": 4618} {"train_loss": -26.8442440032959, "global_step": 383344, "epoch": 4618} {"train_loss": -26.623193740844727, "global_step": 383345, "epoch": 4618} {"train_loss": -26.686634063720703, "global_step": 383346, "epoch": 4618} {"train_loss": -26.67119789123535, "global_step": 383347, "epoch": 4618} {"train_loss": -26.418975830078125, "global_step": 383348, "epoch": 4618} {"train_loss": -27.1367244720459, "global_step": 383349, "epoch": 4618} {"train_loss": -26.307361602783203, "global_step": 383350, "epoch": 4618} {"train_loss": -26.630075454711914, "global_step": 383351, "epoch": 4618} {"train_loss": -26.36591148376465, "global_step": 383352, "epoch": 4618} {"train_loss": -26.601123809814453, "global_step": 383353, "epoch": 4618} {"train_loss": -26.541950225830078, "global_step": 383354, "epoch": 4618} {"train_loss": -26.369373321533203, "global_step": 383355, "epoch": 4618} {"train_loss": -26.624502182006836, "global_step": 383356, "epoch": 4618} {"train_loss": -26.347028732299805, "global_step": 383357, "epoch": 4618} {"train_loss": -26.47823143005371, "global_step": 383358, "epoch": 4618} {"train_loss": -26.260793685913086, "global_step": 383359, "epoch": 4618} {"train_loss": -26.228662490844727, "global_step": 383360, "epoch": 4618} {"train_loss": -26.325925827026367, "global_step": 383361, "epoch": 4618} {"train_loss": -26.00079917907715, "global_step": 383362, "epoch": 4618} {"train_loss": -26.06337547302246, "global_step": 383363, "epoch": 4618} {"train_loss": -26.314847946166992, "global_step": 383364, "epoch": 4618} {"train_loss": -26.38179588317871, "global_step": 383365, "epoch": 4618} {"train_loss": -26.80277442932129, "global_step": 383366, "epoch": 4618} {"train_loss": -26.5156192779541, "global_step": 383367, "epoch": 4618} {"train_loss": -26.628366470336914, "global_step": 383368, "epoch": 4618} {"train_loss": -26.60394287109375, "global_step": 383369, "epoch": 4618} {"train_loss": -26.45697021484375, "global_step": 383370, "epoch": 4618} {"train_loss": -26.349807739257812, "global_step": 383371, "epoch": 4618} {"train_loss": -26.46234130859375, "global_step": 383372, "epoch": 4618} {"train_loss": -26.82294273376465, "global_step": 383373, "epoch": 4618} {"train_loss": -26.212432861328125, "global_step": 383374, "epoch": 4618} {"train_loss": -26.732959747314453, "global_step": 383375, "epoch": 4618} {"train_loss": -26.42409009818571, "global_step": 383376, "epoch": 4618, "val_loss": 6579932.0} {"train_loss": -25.487051010131836, "global_step": 383377, "epoch": 4619} {"train_loss": -25.538000106811523, "global_step": 383378, "epoch": 4619} {"train_loss": -26.176773071289062, "global_step": 383379, "epoch": 4619} {"train_loss": -25.7841796875, "global_step": 383380, "epoch": 4619} {"train_loss": -26.30523109436035, "global_step": 383381, "epoch": 4619} {"train_loss": -26.37506103515625, "global_step": 383382, "epoch": 4619} {"train_loss": -26.33306312561035, "global_step": 383383, "epoch": 4619} {"train_loss": -26.415374755859375, "global_step": 383384, "epoch": 4619} {"train_loss": -26.2965145111084, "global_step": 383385, "epoch": 4619} {"train_loss": -26.128522872924805, "global_step": 383386, "epoch": 4619} {"train_loss": -26.10104751586914, "global_step": 383387, "epoch": 4619} {"train_loss": -26.186737060546875, "global_step": 383388, "epoch": 4619} {"train_loss": -26.19370460510254, "global_step": 383389, "epoch": 4619} {"train_loss": -26.225818634033203, "global_step": 383390, "epoch": 4619} {"train_loss": -26.12476921081543, "global_step": 383391, "epoch": 4619} {"train_loss": -26.251148223876953, "global_step": 383392, "epoch": 4619} {"train_loss": -26.054290771484375, "global_step": 383393, "epoch": 4619} {"train_loss": -26.1874942779541, "global_step": 383394, "epoch": 4619} {"train_loss": -26.509275436401367, "global_step": 383395, "epoch": 4619} {"train_loss": -26.290746688842773, "global_step": 383396, "epoch": 4619} {"train_loss": -26.465805053710938, "global_step": 383397, "epoch": 4619} {"train_loss": -26.173505783081055, "global_step": 383398, "epoch": 4619} {"train_loss": -26.373092651367188, "global_step": 383399, "epoch": 4619} {"train_loss": -26.187164306640625, "global_step": 383400, "epoch": 4619} {"train_loss": -26.596948623657227, "global_step": 383401, "epoch": 4619} {"train_loss": -26.397348403930664, "global_step": 383402, "epoch": 4619} {"train_loss": -26.47623634338379, "global_step": 383403, "epoch": 4619} {"train_loss": -26.322851181030273, "global_step": 383404, "epoch": 4619} {"train_loss": -26.695236206054688, "global_step": 383405, "epoch": 4619} {"train_loss": -26.735675811767578, "global_step": 383406, "epoch": 4619} {"train_loss": -26.322315216064453, "global_step": 383407, "epoch": 4619} {"train_loss": -26.745756149291992, "global_step": 383408, "epoch": 4619} {"train_loss": -26.536035537719727, "global_step": 383409, "epoch": 4619} {"train_loss": -26.46363639831543, "global_step": 383410, "epoch": 4619} {"train_loss": -26.590986251831055, "global_step": 383411, "epoch": 4619} {"train_loss": -26.758359909057617, "global_step": 383412, "epoch": 4619} {"train_loss": -26.869876861572266, "global_step": 383413, "epoch": 4619} {"train_loss": -26.9573917388916, "global_step": 383414, "epoch": 4619} {"train_loss": -26.67158317565918, "global_step": 383415, "epoch": 4619} {"train_loss": -26.687255859375, "global_step": 383416, "epoch": 4619} {"train_loss": -26.401397705078125, "global_step": 383417, "epoch": 4619} {"train_loss": -26.5196533203125, "global_step": 383418, "epoch": 4619} {"train_loss": -26.741586685180664, "global_step": 383419, "epoch": 4619} {"train_loss": -26.672210693359375, "global_step": 383420, "epoch": 4619} {"train_loss": -26.341440200805664, "global_step": 383421, "epoch": 4619} {"train_loss": -26.202392578125, "global_step": 383422, "epoch": 4619} {"train_loss": -26.286108016967773, "global_step": 383423, "epoch": 4619} {"train_loss": -25.87323570251465, "global_step": 383424, "epoch": 4619} {"train_loss": -25.89115333557129, "global_step": 383425, "epoch": 4619} {"train_loss": -26.322168350219727, "global_step": 383426, "epoch": 4619} {"train_loss": -26.193647384643555, "global_step": 383427, "epoch": 4619} {"train_loss": -26.634735107421875, "global_step": 383428, "epoch": 4619} {"train_loss": -26.311460494995117, "global_step": 383429, "epoch": 4619} {"train_loss": -26.45760154724121, "global_step": 383430, "epoch": 4619} {"train_loss": -26.436786651611328, "global_step": 383431, "epoch": 4619} {"train_loss": -26.458703994750977, "global_step": 383432, "epoch": 4619} {"train_loss": -26.424291610717773, "global_step": 383433, "epoch": 4619} {"train_loss": -26.35281753540039, "global_step": 383434, "epoch": 4619} {"train_loss": -26.68043327331543, "global_step": 383435, "epoch": 4619} {"train_loss": -26.28669548034668, "global_step": 383436, "epoch": 4619} {"train_loss": -26.511999130249023, "global_step": 383437, "epoch": 4619} {"train_loss": -26.339460372924805, "global_step": 383438, "epoch": 4619} {"train_loss": -26.528573989868164, "global_step": 383439, "epoch": 4619} {"train_loss": -26.364486694335938, "global_step": 383440, "epoch": 4619} {"train_loss": -25.7587833404541, "global_step": 383441, "epoch": 4619} {"train_loss": -26.540149688720703, "global_step": 383442, "epoch": 4619} {"train_loss": -26.581647872924805, "global_step": 383443, "epoch": 4619} {"train_loss": -26.372644424438477, "global_step": 383444, "epoch": 4619} {"train_loss": -25.7276668548584, "global_step": 383445, "epoch": 4619} {"train_loss": -26.086034774780273, "global_step": 383446, "epoch": 4619} {"train_loss": -26.214313507080078, "global_step": 383447, "epoch": 4619} {"train_loss": -26.336380004882812, "global_step": 383448, "epoch": 4619} {"train_loss": -26.49190330505371, "global_step": 383449, "epoch": 4619} {"train_loss": -26.301239013671875, "global_step": 383450, "epoch": 4619} {"train_loss": -26.891651153564453, "global_step": 383451, "epoch": 4619} {"train_loss": -26.66849136352539, "global_step": 383452, "epoch": 4619} {"train_loss": -26.563928604125977, "global_step": 383453, "epoch": 4619} {"train_loss": -26.2254581451416, "global_step": 383454, "epoch": 4619} {"train_loss": -26.352994918823242, "global_step": 383455, "epoch": 4619} {"train_loss": -26.357324600219727, "global_step": 383456, "epoch": 4619} {"train_loss": -26.738483428955078, "global_step": 383457, "epoch": 4619} {"train_loss": -26.348102569580078, "global_step": 383458, "epoch": 4619} {"train_loss": -26.36154011645949, "global_step": 383459, "epoch": 4619, "val_loss": 6654962.0} {"train_loss": -25.525869369506836, "global_step": 383460, "epoch": 4620} {"train_loss": -25.578744888305664, "global_step": 383461, "epoch": 4620} {"train_loss": -25.842681884765625, "global_step": 383462, "epoch": 4620} {"train_loss": -26.4595890045166, "global_step": 383463, "epoch": 4620} {"train_loss": -26.228290557861328, "global_step": 383464, "epoch": 4620} {"train_loss": -26.114294052124023, "global_step": 383465, "epoch": 4620} {"train_loss": -26.2519588470459, "global_step": 383466, "epoch": 4620} {"train_loss": -26.146671295166016, "global_step": 383467, "epoch": 4620} {"train_loss": -25.756927490234375, "global_step": 383468, "epoch": 4620} {"train_loss": -26.185352325439453, "global_step": 383469, "epoch": 4620} {"train_loss": -26.11359977722168, "global_step": 383470, "epoch": 4620} {"train_loss": -25.8227481842041, "global_step": 383471, "epoch": 4620} {"train_loss": -26.362396240234375, "global_step": 383472, "epoch": 4620} {"train_loss": -26.040924072265625, "global_step": 383473, "epoch": 4620} {"train_loss": -26.370685577392578, "global_step": 383474, "epoch": 4620} {"train_loss": -25.94190788269043, "global_step": 383475, "epoch": 4620} {"train_loss": -26.14461326599121, "global_step": 383476, "epoch": 4620} {"train_loss": -25.903823852539062, "global_step": 383477, "epoch": 4620} {"train_loss": -26.1368465423584, "global_step": 383478, "epoch": 4620} {"train_loss": -26.4926700592041, "global_step": 383479, "epoch": 4620} {"train_loss": -26.33149528503418, "global_step": 383480, "epoch": 4620} {"train_loss": -25.76136589050293, "global_step": 383481, "epoch": 4620} {"train_loss": -26.203353881835938, "global_step": 383482, "epoch": 4620} {"train_loss": -26.296024322509766, "global_step": 383483, "epoch": 4620} {"train_loss": -26.06070899963379, "global_step": 383484, "epoch": 4620} {"train_loss": -26.1969051361084, "global_step": 383485, "epoch": 4620} {"train_loss": -26.470081329345703, "global_step": 383486, "epoch": 4620} {"train_loss": -26.389923095703125, "global_step": 383487, "epoch": 4620} {"train_loss": -26.250457763671875, "global_step": 383488, "epoch": 4620} {"train_loss": -26.515975952148438, "global_step": 383489, "epoch": 4620} {"train_loss": -26.14678382873535, "global_step": 383490, "epoch": 4620} {"train_loss": -26.53376579284668, "global_step": 383491, "epoch": 4620} {"train_loss": -26.322635650634766, "global_step": 383492, "epoch": 4620} {"train_loss": -26.61237907409668, "global_step": 383493, "epoch": 4620} {"train_loss": -26.431921005249023, "global_step": 383494, "epoch": 4620} {"train_loss": -26.75410270690918, "global_step": 383495, "epoch": 4620} {"train_loss": -26.48372459411621, "global_step": 383496, "epoch": 4620} {"train_loss": -26.475988388061523, "global_step": 383497, "epoch": 4620} {"train_loss": -26.803424835205078, "global_step": 383498, "epoch": 4620} {"train_loss": -26.408376693725586, "global_step": 383499, "epoch": 4620} {"train_loss": -26.58441734313965, "global_step": 383500, "epoch": 4620} {"train_loss": -26.78022575378418, "global_step": 383501, "epoch": 4620} {"train_loss": -26.459409713745117, "global_step": 383502, "epoch": 4620} {"train_loss": -26.95052146911621, "global_step": 383503, "epoch": 4620} {"train_loss": -26.442291259765625, "global_step": 383504, "epoch": 4620} {"train_loss": -26.8472957611084, "global_step": 383505, "epoch": 4620} {"train_loss": -26.548730850219727, "global_step": 383506, "epoch": 4620} {"train_loss": -26.357629776000977, "global_step": 383507, "epoch": 4620} {"train_loss": -26.597492218017578, "global_step": 383508, "epoch": 4620} {"train_loss": -26.406896591186523, "global_step": 383509, "epoch": 4620} {"train_loss": -26.52198600769043, "global_step": 383510, "epoch": 4620} {"train_loss": -26.42416763305664, "global_step": 383511, "epoch": 4620} {"train_loss": -26.370691299438477, "global_step": 383512, "epoch": 4620} {"train_loss": -26.668121337890625, "global_step": 383513, "epoch": 4620} {"train_loss": -26.558212280273438, "global_step": 383514, "epoch": 4620} {"train_loss": -26.562707901000977, "global_step": 383515, "epoch": 4620} {"train_loss": -27.03203773498535, "global_step": 383516, "epoch": 4620} {"train_loss": -26.393325805664062, "global_step": 383517, "epoch": 4620} {"train_loss": -26.975311279296875, "global_step": 383518, "epoch": 4620} {"train_loss": -26.601770401000977, "global_step": 383519, "epoch": 4620} {"train_loss": -26.545379638671875, "global_step": 383520, "epoch": 4620} {"train_loss": -26.719974517822266, "global_step": 383521, "epoch": 4620} {"train_loss": -26.44406509399414, "global_step": 383522, "epoch": 4620} {"train_loss": -26.9689884185791, "global_step": 383523, "epoch": 4620} {"train_loss": -26.732074737548828, "global_step": 383524, "epoch": 4620} {"train_loss": -26.524621963500977, "global_step": 383525, "epoch": 4620} {"train_loss": -26.764806747436523, "global_step": 383526, "epoch": 4620} {"train_loss": -26.820486068725586, "global_step": 383527, "epoch": 4620} {"train_loss": -26.734500885009766, "global_step": 383528, "epoch": 4620} {"train_loss": -26.359922409057617, "global_step": 383529, "epoch": 4620} {"train_loss": -26.03863525390625, "global_step": 383530, "epoch": 4620} {"train_loss": -25.331275939941406, "global_step": 383531, "epoch": 4620} {"train_loss": -25.45854377746582, "global_step": 383532, "epoch": 4620} {"train_loss": -26.366247177124023, "global_step": 383533, "epoch": 4620} {"train_loss": -25.863916397094727, "global_step": 383534, "epoch": 4620} {"train_loss": -25.52977752685547, "global_step": 383535, "epoch": 4620} {"train_loss": -25.609663009643555, "global_step": 383536, "epoch": 4620} {"train_loss": -25.73811912536621, "global_step": 383537, "epoch": 4620} {"train_loss": -26.26380729675293, "global_step": 383538, "epoch": 4620} {"train_loss": -25.529020309448242, "global_step": 383539, "epoch": 4620} {"train_loss": -26.0101375579834, "global_step": 383540, "epoch": 4620} {"train_loss": -25.597412109375, "global_step": 383541, "epoch": 4620} {"train_loss": -26.302813817219562, "global_step": 383542, "epoch": 4620, "val_loss": 6596270.0} {"train_loss": -25.687667846679688, "global_step": 383543, "epoch": 4621} {"train_loss": -25.406564712524414, "global_step": 383544, "epoch": 4621} {"train_loss": -25.908008575439453, "global_step": 383545, "epoch": 4621} {"train_loss": -25.55057716369629, "global_step": 383546, "epoch": 4621} {"train_loss": -25.873706817626953, "global_step": 383547, "epoch": 4621} {"train_loss": -25.516345977783203, "global_step": 383548, "epoch": 4621} {"train_loss": -25.548603057861328, "global_step": 383549, "epoch": 4621} {"train_loss": -25.903762817382812, "global_step": 383550, "epoch": 4621} {"train_loss": -26.1121883392334, "global_step": 383551, "epoch": 4621} {"train_loss": -26.19288444519043, "global_step": 383552, "epoch": 4621} {"train_loss": -26.224689483642578, "global_step": 383553, "epoch": 4621} {"train_loss": -26.1331787109375, "global_step": 383554, "epoch": 4621} {"train_loss": -26.12137794494629, "global_step": 383555, "epoch": 4621} {"train_loss": -25.904767990112305, "global_step": 383556, "epoch": 4621} {"train_loss": -26.093978881835938, "global_step": 383557, "epoch": 4621} {"train_loss": -26.17376708984375, "global_step": 383558, "epoch": 4621} {"train_loss": -26.2236270904541, "global_step": 383559, "epoch": 4621} {"train_loss": -26.515289306640625, "global_step": 383560, "epoch": 4621} {"train_loss": -26.00227928161621, "global_step": 383561, "epoch": 4621} {"train_loss": -26.11004066467285, "global_step": 383562, "epoch": 4621} {"train_loss": -26.46274185180664, "global_step": 383563, "epoch": 4621} {"train_loss": -26.270048141479492, "global_step": 383564, "epoch": 4621} {"train_loss": -26.039154052734375, "global_step": 383565, "epoch": 4621} {"train_loss": -26.387149810791016, "global_step": 383566, "epoch": 4621} {"train_loss": -26.36764907836914, "global_step": 383567, "epoch": 4621} {"train_loss": -26.341962814331055, "global_step": 383568, "epoch": 4621} {"train_loss": -26.61661720275879, "global_step": 383569, "epoch": 4621} {"train_loss": -26.459304809570312, "global_step": 383570, "epoch": 4621} {"train_loss": -26.489892959594727, "global_step": 383571, "epoch": 4621} {"train_loss": -26.304309844970703, "global_step": 383572, "epoch": 4621} {"train_loss": -26.375944137573242, "global_step": 383573, "epoch": 4621} {"train_loss": -26.163320541381836, "global_step": 383574, "epoch": 4621} {"train_loss": -26.35841178894043, "global_step": 383575, "epoch": 4621} {"train_loss": -26.5591983795166, "global_step": 383576, "epoch": 4621} {"train_loss": -26.3935546875, "global_step": 383577, "epoch": 4621} {"train_loss": -26.48459243774414, "global_step": 383578, "epoch": 4621} {"train_loss": -26.504150390625, "global_step": 383579, "epoch": 4621} {"train_loss": -26.667877197265625, "global_step": 383580, "epoch": 4621} {"train_loss": -26.7031307220459, "global_step": 383581, "epoch": 4621} {"train_loss": -26.580738067626953, "global_step": 383582, "epoch": 4621} {"train_loss": -26.6817684173584, "global_step": 383583, "epoch": 4621} {"train_loss": -26.600955963134766, "global_step": 383584, "epoch": 4621} {"train_loss": -26.529890060424805, "global_step": 383585, "epoch": 4621} {"train_loss": -26.65223503112793, "global_step": 383586, "epoch": 4621} {"train_loss": -26.558454513549805, "global_step": 383587, "epoch": 4621} {"train_loss": -26.459320068359375, "global_step": 383588, "epoch": 4621} {"train_loss": -26.689960479736328, "global_step": 383589, "epoch": 4621} {"train_loss": -26.842914581298828, "global_step": 383590, "epoch": 4621} {"train_loss": -26.77970314025879, "global_step": 383591, "epoch": 4621} {"train_loss": -26.1570987701416, "global_step": 383592, "epoch": 4621} {"train_loss": -26.060163497924805, "global_step": 383593, "epoch": 4621} {"train_loss": -26.390050888061523, "global_step": 383594, "epoch": 4621} {"train_loss": -26.59968376159668, "global_step": 383595, "epoch": 4621} {"train_loss": -26.346576690673828, "global_step": 383596, "epoch": 4621} {"train_loss": -26.160669326782227, "global_step": 383597, "epoch": 4621} {"train_loss": -26.559192657470703, "global_step": 383598, "epoch": 4621} {"train_loss": -26.24607276916504, "global_step": 383599, "epoch": 4621} {"train_loss": -26.457387924194336, "global_step": 383600, "epoch": 4621} {"train_loss": -26.613088607788086, "global_step": 383601, "epoch": 4621} {"train_loss": -26.057897567749023, "global_step": 383602, "epoch": 4621} {"train_loss": -26.648578643798828, "global_step": 383603, "epoch": 4621} {"train_loss": -26.03857421875, "global_step": 383604, "epoch": 4621} {"train_loss": -26.26100730895996, "global_step": 383605, "epoch": 4621} {"train_loss": -26.229063034057617, "global_step": 383606, "epoch": 4621} {"train_loss": -26.188398361206055, "global_step": 383607, "epoch": 4621} {"train_loss": -26.55466079711914, "global_step": 383608, "epoch": 4621} {"train_loss": -26.136926651000977, "global_step": 383609, "epoch": 4621} {"train_loss": -26.2489070892334, "global_step": 383610, "epoch": 4621} {"train_loss": -26.0937557220459, "global_step": 383611, "epoch": 4621} {"train_loss": -26.033689498901367, "global_step": 383612, "epoch": 4621} {"train_loss": -25.963560104370117, "global_step": 383613, "epoch": 4621} {"train_loss": -26.23365592956543, "global_step": 383614, "epoch": 4621} {"train_loss": -25.920019149780273, "global_step": 383615, "epoch": 4621} {"train_loss": -26.269092559814453, "global_step": 383616, "epoch": 4621} {"train_loss": -26.516422271728516, "global_step": 383617, "epoch": 4621} {"train_loss": -26.483184814453125, "global_step": 383618, "epoch": 4621} {"train_loss": -26.227436065673828, "global_step": 383619, "epoch": 4621} {"train_loss": -26.321502685546875, "global_step": 383620, "epoch": 4621} {"train_loss": -26.43568229675293, "global_step": 383621, "epoch": 4621} {"train_loss": -26.4285831451416, "global_step": 383622, "epoch": 4621} {"train_loss": -26.363067626953125, "global_step": 383623, "epoch": 4621} {"train_loss": -26.52849769592285, "global_step": 383624, "epoch": 4621} {"train_loss": -26.28871136401073, "global_step": 383625, "epoch": 4621, "val_loss": 6664250.0} {"train_loss": -26.298078536987305, "global_step": 383626, "epoch": 4622} {"train_loss": -25.801599502563477, "global_step": 383627, "epoch": 4622} {"train_loss": -25.809812545776367, "global_step": 383628, "epoch": 4622} {"train_loss": -25.742877960205078, "global_step": 383629, "epoch": 4622} {"train_loss": -26.254058837890625, "global_step": 383630, "epoch": 4622} {"train_loss": -25.642364501953125, "global_step": 383631, "epoch": 4622} {"train_loss": -26.1962833404541, "global_step": 383632, "epoch": 4622} {"train_loss": -26.01143455505371, "global_step": 383633, "epoch": 4622} {"train_loss": -25.878101348876953, "global_step": 383634, "epoch": 4622} {"train_loss": -26.33207130432129, "global_step": 383635, "epoch": 4622} {"train_loss": -26.035287857055664, "global_step": 383636, "epoch": 4622} {"train_loss": -26.0628604888916, "global_step": 383637, "epoch": 4622} {"train_loss": -25.882421493530273, "global_step": 383638, "epoch": 4622} {"train_loss": -26.225149154663086, "global_step": 383639, "epoch": 4622} {"train_loss": -26.2425537109375, "global_step": 383640, "epoch": 4622} {"train_loss": -26.0811710357666, "global_step": 383641, "epoch": 4622} {"train_loss": -26.11335563659668, "global_step": 383642, "epoch": 4622} {"train_loss": -26.49460792541504, "global_step": 383643, "epoch": 4622} {"train_loss": -26.396499633789062, "global_step": 383644, "epoch": 4622} {"train_loss": -26.405994415283203, "global_step": 383645, "epoch": 4622} {"train_loss": -26.499155044555664, "global_step": 383646, "epoch": 4622} {"train_loss": -26.126245498657227, "global_step": 383647, "epoch": 4622} {"train_loss": -25.836669921875, "global_step": 383648, "epoch": 4622} {"train_loss": -26.513233184814453, "global_step": 383649, "epoch": 4622} {"train_loss": -26.2089786529541, "global_step": 383650, "epoch": 4622} {"train_loss": -26.309940338134766, "global_step": 383651, "epoch": 4622} {"train_loss": -26.599746704101562, "global_step": 383652, "epoch": 4622} {"train_loss": -26.159509658813477, "global_step": 383653, "epoch": 4622} {"train_loss": -26.487125396728516, "global_step": 383654, "epoch": 4622} {"train_loss": -26.79352378845215, "global_step": 383655, "epoch": 4622} {"train_loss": -26.781696319580078, "global_step": 383656, "epoch": 4622} {"train_loss": -26.32244300842285, "global_step": 383657, "epoch": 4622} {"train_loss": -26.79176139831543, "global_step": 383658, "epoch": 4622} {"train_loss": -26.523542404174805, "global_step": 383659, "epoch": 4622} {"train_loss": -26.339101791381836, "global_step": 383660, "epoch": 4622} {"train_loss": -26.49869155883789, "global_step": 383661, "epoch": 4622} {"train_loss": -26.721179962158203, "global_step": 383662, "epoch": 4622} {"train_loss": -26.630237579345703, "global_step": 383663, "epoch": 4622} {"train_loss": -26.411529541015625, "global_step": 383664, "epoch": 4622} {"train_loss": -26.56980323791504, "global_step": 383665, "epoch": 4622} {"train_loss": -26.319320678710938, "global_step": 383666, "epoch": 4622} {"train_loss": -26.407861709594727, "global_step": 383667, "epoch": 4622} {"train_loss": -26.54969596862793, "global_step": 383668, "epoch": 4622} {"train_loss": -26.68410301208496, "global_step": 383669, "epoch": 4622} {"train_loss": -26.548248291015625, "global_step": 383670, "epoch": 4622} {"train_loss": -26.40937614440918, "global_step": 383671, "epoch": 4622} {"train_loss": -26.897232055664062, "global_step": 383672, "epoch": 4622} {"train_loss": -26.774717330932617, "global_step": 383673, "epoch": 4622} {"train_loss": -26.416629791259766, "global_step": 383674, "epoch": 4622} {"train_loss": -26.386154174804688, "global_step": 383675, "epoch": 4622} {"train_loss": -26.515859603881836, "global_step": 383676, "epoch": 4622} {"train_loss": -26.71120262145996, "global_step": 383677, "epoch": 4622} {"train_loss": -26.845325469970703, "global_step": 383678, "epoch": 4622} {"train_loss": -26.6014404296875, "global_step": 383679, "epoch": 4622} {"train_loss": -26.998077392578125, "global_step": 383680, "epoch": 4622} {"train_loss": -26.812963485717773, "global_step": 383681, "epoch": 4622} {"train_loss": -26.820051193237305, "global_step": 383682, "epoch": 4622} {"train_loss": -26.244184494018555, "global_step": 383683, "epoch": 4622} {"train_loss": -26.506732940673828, "global_step": 383684, "epoch": 4622} {"train_loss": -26.63789939880371, "global_step": 383685, "epoch": 4622} {"train_loss": -26.31560707092285, "global_step": 383686, "epoch": 4622} {"train_loss": -26.11305046081543, "global_step": 383687, "epoch": 4622} {"train_loss": -26.27308464050293, "global_step": 383688, "epoch": 4622} {"train_loss": -26.443883895874023, "global_step": 383689, "epoch": 4622} {"train_loss": -26.43515968322754, "global_step": 383690, "epoch": 4622} {"train_loss": -26.41225242614746, "global_step": 383691, "epoch": 4622} {"train_loss": -25.48590087890625, "global_step": 383692, "epoch": 4622} {"train_loss": -26.151769638061523, "global_step": 383693, "epoch": 4622} {"train_loss": -26.715002059936523, "global_step": 383694, "epoch": 4622} {"train_loss": -25.563098907470703, "global_step": 383695, "epoch": 4622} {"train_loss": -26.531164169311523, "global_step": 383696, "epoch": 4622} {"train_loss": -26.53663444519043, "global_step": 383697, "epoch": 4622} {"train_loss": -26.344745635986328, "global_step": 383698, "epoch": 4622} {"train_loss": -25.721776962280273, "global_step": 383699, "epoch": 4622} {"train_loss": -26.040014266967773, "global_step": 383700, "epoch": 4622} {"train_loss": -26.037521362304688, "global_step": 383701, "epoch": 4622} {"train_loss": -26.279340744018555, "global_step": 383702, "epoch": 4622} {"train_loss": -26.314743041992188, "global_step": 383703, "epoch": 4622} {"train_loss": -25.82256507873535, "global_step": 383704, "epoch": 4622} {"train_loss": -26.267993927001953, "global_step": 383705, "epoch": 4622} {"train_loss": -26.079309463500977, "global_step": 383706, "epoch": 4622} {"train_loss": -26.365787506103516, "global_step": 383707, "epoch": 4622} {"train_loss": -26.327947570616942, "global_step": 383708, "epoch": 4622, "val_loss": 6541843.0} {"train_loss": -25.22344207763672, "global_step": 383709, "epoch": 4623} {"train_loss": -24.775249481201172, "global_step": 383710, "epoch": 4623} {"train_loss": -24.639631271362305, "global_step": 383711, "epoch": 4623} {"train_loss": -25.57493019104004, "global_step": 383712, "epoch": 4623} {"train_loss": -25.310955047607422, "global_step": 383713, "epoch": 4623} {"train_loss": -24.83760643005371, "global_step": 383714, "epoch": 4623} {"train_loss": -24.857406616210938, "global_step": 383715, "epoch": 4623} {"train_loss": -25.305845260620117, "global_step": 383716, "epoch": 4623} {"train_loss": -25.57948112487793, "global_step": 383717, "epoch": 4623} {"train_loss": -25.661108016967773, "global_step": 383718, "epoch": 4623} {"train_loss": -25.319015502929688, "global_step": 383719, "epoch": 4623} {"train_loss": -25.365074157714844, "global_step": 383720, "epoch": 4623} {"train_loss": -25.422027587890625, "global_step": 383721, "epoch": 4623} {"train_loss": -25.365501403808594, "global_step": 383722, "epoch": 4623} {"train_loss": -25.712656021118164, "global_step": 383723, "epoch": 4623} {"train_loss": -25.8612117767334, "global_step": 383724, "epoch": 4623} {"train_loss": -25.848127365112305, "global_step": 383725, "epoch": 4623} {"train_loss": -25.804853439331055, "global_step": 383726, "epoch": 4623} {"train_loss": -25.817975997924805, "global_step": 383727, "epoch": 4623} {"train_loss": -25.631895065307617, "global_step": 383728, "epoch": 4623} {"train_loss": -25.516769409179688, "global_step": 383729, "epoch": 4623} {"train_loss": -26.14229393005371, "global_step": 383730, "epoch": 4623} {"train_loss": -26.17145347595215, "global_step": 383731, "epoch": 4623} {"train_loss": -26.058591842651367, "global_step": 383732, "epoch": 4623} {"train_loss": -26.328155517578125, "global_step": 383733, "epoch": 4623} {"train_loss": -26.239212036132812, "global_step": 383734, "epoch": 4623} {"train_loss": -26.408239364624023, "global_step": 383735, "epoch": 4623} {"train_loss": -26.135868072509766, "global_step": 383736, "epoch": 4623} {"train_loss": -25.945728302001953, "global_step": 383737, "epoch": 4623} {"train_loss": -26.054468154907227, "global_step": 383738, "epoch": 4623} {"train_loss": -26.348447799682617, "global_step": 383739, "epoch": 4623} {"train_loss": -25.78937339782715, "global_step": 383740, "epoch": 4623} {"train_loss": -26.756803512573242, "global_step": 383741, "epoch": 4623} {"train_loss": -26.251272201538086, "global_step": 383742, "epoch": 4623} {"train_loss": -26.63758659362793, "global_step": 383743, "epoch": 4623} {"train_loss": -26.544376373291016, "global_step": 383744, "epoch": 4623} {"train_loss": -26.210519790649414, "global_step": 383745, "epoch": 4623} {"train_loss": -26.3719539642334, "global_step": 383746, "epoch": 4623} {"train_loss": -26.337265014648438, "global_step": 383747, "epoch": 4623} {"train_loss": -26.66070556640625, "global_step": 383748, "epoch": 4623} {"train_loss": -26.460264205932617, "global_step": 383749, "epoch": 4623} {"train_loss": -26.46473503112793, "global_step": 383750, "epoch": 4623} {"train_loss": -26.6190128326416, "global_step": 383751, "epoch": 4623} {"train_loss": -26.818037033081055, "global_step": 383752, "epoch": 4623} {"train_loss": -26.34063720703125, "global_step": 383753, "epoch": 4623} {"train_loss": -26.191043853759766, "global_step": 383754, "epoch": 4623} {"train_loss": -26.55329704284668, "global_step": 383755, "epoch": 4623} {"train_loss": -26.742446899414062, "global_step": 383756, "epoch": 4623} {"train_loss": -26.8436279296875, "global_step": 383757, "epoch": 4623} {"train_loss": -26.947784423828125, "global_step": 383758, "epoch": 4623} {"train_loss": -26.765180587768555, "global_step": 383759, "epoch": 4623} {"train_loss": -26.822406768798828, "global_step": 383760, "epoch": 4623} {"train_loss": -26.660024642944336, "global_step": 383761, "epoch": 4623} {"train_loss": -26.5777530670166, "global_step": 383762, "epoch": 4623} {"train_loss": -26.778095245361328, "global_step": 383763, "epoch": 4623} {"train_loss": -26.754377365112305, "global_step": 383764, "epoch": 4623} {"train_loss": -26.989370346069336, "global_step": 383765, "epoch": 4623} {"train_loss": -26.407751083374023, "global_step": 383766, "epoch": 4623} {"train_loss": -26.581104278564453, "global_step": 383767, "epoch": 4623} {"train_loss": -26.1535701751709, "global_step": 383768, "epoch": 4623} {"train_loss": -26.637466430664062, "global_step": 383769, "epoch": 4623} {"train_loss": -26.481714248657227, "global_step": 383770, "epoch": 4623} {"train_loss": -26.485193252563477, "global_step": 383771, "epoch": 4623} {"train_loss": -26.95916748046875, "global_step": 383772, "epoch": 4623} {"train_loss": -27.12367057800293, "global_step": 383773, "epoch": 4623} {"train_loss": -26.623489379882812, "global_step": 383774, "epoch": 4623} {"train_loss": -26.410358428955078, "global_step": 383775, "epoch": 4623} {"train_loss": -26.667987823486328, "global_step": 383776, "epoch": 4623} {"train_loss": -26.7210750579834, "global_step": 383777, "epoch": 4623} {"train_loss": -26.66534423828125, "global_step": 383778, "epoch": 4623} {"train_loss": -26.641706466674805, "global_step": 383779, "epoch": 4623} {"train_loss": -26.572874069213867, "global_step": 383780, "epoch": 4623} {"train_loss": -26.409765243530273, "global_step": 383781, "epoch": 4623} {"train_loss": -26.60125732421875, "global_step": 383782, "epoch": 4623} {"train_loss": -26.24983787536621, "global_step": 383783, "epoch": 4623} {"train_loss": -26.560155868530273, "global_step": 383784, "epoch": 4623} {"train_loss": -26.877599716186523, "global_step": 383785, "epoch": 4623} {"train_loss": -26.38739013671875, "global_step": 383786, "epoch": 4623} {"train_loss": -26.990034103393555, "global_step": 383787, "epoch": 4623} {"train_loss": -26.698209762573242, "global_step": 383788, "epoch": 4623} {"train_loss": -26.676746368408203, "global_step": 383789, "epoch": 4623} {"train_loss": -26.2174072265625, "global_step": 383790, "epoch": 4623} {"train_loss": -26.2519422324307, "global_step": 383791, "epoch": 4623, "val_loss": 6637960.5} {"train_loss": -25.324758529663086, "global_step": 383792, "epoch": 4624} {"train_loss": -24.225385665893555, "global_step": 383793, "epoch": 4624} {"train_loss": -24.680124282836914, "global_step": 383794, "epoch": 4624} {"train_loss": -25.87298011779785, "global_step": 383795, "epoch": 4624} {"train_loss": -24.78546905517578, "global_step": 383796, "epoch": 4624} {"train_loss": -25.34729766845703, "global_step": 383797, "epoch": 4624} {"train_loss": -25.473745346069336, "global_step": 383798, "epoch": 4624} {"train_loss": -25.15810203552246, "global_step": 383799, "epoch": 4624} {"train_loss": -25.804357528686523, "global_step": 383800, "epoch": 4624} {"train_loss": -25.6099853515625, "global_step": 383801, "epoch": 4624} {"train_loss": -25.449520111083984, "global_step": 383802, "epoch": 4624} {"train_loss": -25.72950553894043, "global_step": 383803, "epoch": 4624} {"train_loss": -25.472997665405273, "global_step": 383804, "epoch": 4624} {"train_loss": -25.585365295410156, "global_step": 383805, "epoch": 4624} {"train_loss": -25.873870849609375, "global_step": 383806, "epoch": 4624} {"train_loss": -26.166494369506836, "global_step": 383807, "epoch": 4624} {"train_loss": -25.893096923828125, "global_step": 383808, "epoch": 4624} {"train_loss": -25.943866729736328, "global_step": 383809, "epoch": 4624} {"train_loss": -26.123388290405273, "global_step": 383810, "epoch": 4624} {"train_loss": -25.9439640045166, "global_step": 383811, "epoch": 4624} {"train_loss": -25.830564498901367, "global_step": 383812, "epoch": 4624} {"train_loss": -26.27791404724121, "global_step": 383813, "epoch": 4624} {"train_loss": -26.16158103942871, "global_step": 383814, "epoch": 4624} {"train_loss": -26.222684860229492, "global_step": 383815, "epoch": 4624} {"train_loss": -25.864965438842773, "global_step": 383816, "epoch": 4624} {"train_loss": -26.346424102783203, "global_step": 383817, "epoch": 4624} {"train_loss": -26.736867904663086, "global_step": 383818, "epoch": 4624} {"train_loss": -26.04062843322754, "global_step": 383819, "epoch": 4624} {"train_loss": -26.44873046875, "global_step": 383820, "epoch": 4624} {"train_loss": -26.44562339782715, "global_step": 383821, "epoch": 4624} {"train_loss": -26.627948760986328, "global_step": 383822, "epoch": 4624} {"train_loss": -26.4068603515625, "global_step": 383823, "epoch": 4624} {"train_loss": -26.314136505126953, "global_step": 383824, "epoch": 4624} {"train_loss": -26.146728515625, "global_step": 383825, "epoch": 4624} {"train_loss": -26.254474639892578, "global_step": 383826, "epoch": 4624} {"train_loss": -26.24724769592285, "global_step": 383827, "epoch": 4624} {"train_loss": -26.425622940063477, "global_step": 383828, "epoch": 4624} {"train_loss": -26.379724502563477, "global_step": 383829, "epoch": 4624} {"train_loss": -26.451520919799805, "global_step": 383830, "epoch": 4624} {"train_loss": -26.8466796875, "global_step": 383831, "epoch": 4624} {"train_loss": -26.59634780883789, "global_step": 383832, "epoch": 4624} {"train_loss": -26.558761596679688, "global_step": 383833, "epoch": 4624} {"train_loss": -26.648609161376953, "global_step": 383834, "epoch": 4624} {"train_loss": -26.734460830688477, "global_step": 383835, "epoch": 4624} {"train_loss": -26.15365982055664, "global_step": 383836, "epoch": 4624} {"train_loss": -26.399991989135742, "global_step": 383837, "epoch": 4624} {"train_loss": -26.529693603515625, "global_step": 383838, "epoch": 4624} {"train_loss": -26.91692543029785, "global_step": 383839, "epoch": 4624} {"train_loss": -26.3585205078125, "global_step": 383840, "epoch": 4624} {"train_loss": -26.303937911987305, "global_step": 383841, "epoch": 4624} {"train_loss": -26.359619140625, "global_step": 383842, "epoch": 4624} {"train_loss": -26.345335006713867, "global_step": 383843, "epoch": 4624} {"train_loss": -26.786090850830078, "global_step": 383844, "epoch": 4624} {"train_loss": -26.545886993408203, "global_step": 383845, "epoch": 4624} {"train_loss": -26.491413116455078, "global_step": 383846, "epoch": 4624} {"train_loss": -26.4853515625, "global_step": 383847, "epoch": 4624} {"train_loss": -26.501087188720703, "global_step": 383848, "epoch": 4624} {"train_loss": -26.44598388671875, "global_step": 383849, "epoch": 4624} {"train_loss": -26.783658981323242, "global_step": 383850, "epoch": 4624} {"train_loss": -26.631118774414062, "global_step": 383851, "epoch": 4624} {"train_loss": -26.620349884033203, "global_step": 383852, "epoch": 4624} {"train_loss": -26.531707763671875, "global_step": 383853, "epoch": 4624} {"train_loss": -26.665430068969727, "global_step": 383854, "epoch": 4624} {"train_loss": -26.810409545898438, "global_step": 383855, "epoch": 4624} {"train_loss": -26.492380142211914, "global_step": 383856, "epoch": 4624} {"train_loss": -26.540729522705078, "global_step": 383857, "epoch": 4624} {"train_loss": -26.477176666259766, "global_step": 383858, "epoch": 4624} {"train_loss": -26.75148582458496, "global_step": 383859, "epoch": 4624} {"train_loss": -26.75882339477539, "global_step": 383860, "epoch": 4624} {"train_loss": -26.52046012878418, "global_step": 383861, "epoch": 4624} {"train_loss": -26.670856475830078, "global_step": 383862, "epoch": 4624} {"train_loss": -26.579544067382812, "global_step": 383863, "epoch": 4624} {"train_loss": -26.562353134155273, "global_step": 383864, "epoch": 4624} {"train_loss": -26.856460571289062, "global_step": 383865, "epoch": 4624} {"train_loss": -26.45928382873535, "global_step": 383866, "epoch": 4624} {"train_loss": -26.668975830078125, "global_step": 383867, "epoch": 4624} {"train_loss": -26.668058395385742, "global_step": 383868, "epoch": 4624} {"train_loss": -26.5983943939209, "global_step": 383869, "epoch": 4624} {"train_loss": -26.438007354736328, "global_step": 383870, "epoch": 4624} {"train_loss": -26.43634033203125, "global_step": 383871, "epoch": 4624} {"train_loss": -26.33738136291504, "global_step": 383872, "epoch": 4624} {"train_loss": -26.385202407836914, "global_step": 383873, "epoch": 4624} {"train_loss": -26.23474509457508, "global_step": 383874, "epoch": 4624, "val_loss": 6786899.0} {"train_loss": -19.344074249267578, "global_step": 383875, "epoch": 4625} {"train_loss": -22.785757064819336, "global_step": 383876, "epoch": 4625} {"train_loss": -24.42896842956543, "global_step": 383877, "epoch": 4625} {"train_loss": -23.18149185180664, "global_step": 383878, "epoch": 4625} {"train_loss": -24.303510665893555, "global_step": 383879, "epoch": 4625} {"train_loss": -24.110593795776367, "global_step": 383880, "epoch": 4625} {"train_loss": -24.0695858001709, "global_step": 383881, "epoch": 4625} {"train_loss": -24.98578453063965, "global_step": 383882, "epoch": 4625} {"train_loss": -24.780805587768555, "global_step": 383883, "epoch": 4625} {"train_loss": -24.794963836669922, "global_step": 383884, "epoch": 4625} {"train_loss": -25.162738800048828, "global_step": 383885, "epoch": 4625} {"train_loss": -25.45269012451172, "global_step": 383886, "epoch": 4625} {"train_loss": -25.040098190307617, "global_step": 383887, "epoch": 4625} {"train_loss": -24.665250778198242, "global_step": 383888, "epoch": 4625} {"train_loss": -25.34465217590332, "global_step": 383889, "epoch": 4625} {"train_loss": -25.100177764892578, "global_step": 383890, "epoch": 4625} {"train_loss": -25.519319534301758, "global_step": 383891, "epoch": 4625} {"train_loss": -25.635915756225586, "global_step": 383892, "epoch": 4625} {"train_loss": -25.391971588134766, "global_step": 383893, "epoch": 4625} {"train_loss": -25.410512924194336, "global_step": 383894, "epoch": 4625} {"train_loss": -25.578290939331055, "global_step": 383895, "epoch": 4625} {"train_loss": -25.546537399291992, "global_step": 383896, "epoch": 4625} {"train_loss": -25.60544204711914, "global_step": 383897, "epoch": 4625} {"train_loss": -25.449453353881836, "global_step": 383898, "epoch": 4625} {"train_loss": -25.720901489257812, "global_step": 383899, "epoch": 4625} {"train_loss": -25.740131378173828, "global_step": 383900, "epoch": 4625} {"train_loss": -25.38681983947754, "global_step": 383901, "epoch": 4625} {"train_loss": -25.60794448852539, "global_step": 383902, "epoch": 4625} {"train_loss": -26.250577926635742, "global_step": 383903, "epoch": 4625} {"train_loss": -25.909687042236328, "global_step": 383904, "epoch": 4625} {"train_loss": -25.65787124633789, "global_step": 383905, "epoch": 4625} {"train_loss": -25.698495864868164, "global_step": 383906, "epoch": 4625} {"train_loss": -25.620227813720703, "global_step": 383907, "epoch": 4625} {"train_loss": -26.412220001220703, "global_step": 383908, "epoch": 4625} {"train_loss": -25.704492568969727, "global_step": 383909, "epoch": 4625} {"train_loss": -25.90593910217285, "global_step": 383910, "epoch": 4625} {"train_loss": -25.756261825561523, "global_step": 383911, "epoch": 4625} {"train_loss": -26.119842529296875, "global_step": 383912, "epoch": 4625} {"train_loss": -26.032251358032227, "global_step": 383913, "epoch": 4625} {"train_loss": -26.190027236938477, "global_step": 383914, "epoch": 4625} {"train_loss": -26.036991119384766, "global_step": 383915, "epoch": 4625} {"train_loss": -25.924575805664062, "global_step": 383916, "epoch": 4625} {"train_loss": -25.996835708618164, "global_step": 383917, "epoch": 4625} {"train_loss": -26.07940673828125, "global_step": 383918, "epoch": 4625} {"train_loss": -26.299030303955078, "global_step": 383919, "epoch": 4625} {"train_loss": -26.646093368530273, "global_step": 383920, "epoch": 4625} {"train_loss": -26.11177635192871, "global_step": 383921, "epoch": 4625} {"train_loss": -26.647811889648438, "global_step": 383922, "epoch": 4625} {"train_loss": -25.940900802612305, "global_step": 383923, "epoch": 4625} {"train_loss": -26.51099967956543, "global_step": 383924, "epoch": 4625} {"train_loss": -25.963193893432617, "global_step": 383925, "epoch": 4625} {"train_loss": -26.21884536743164, "global_step": 383926, "epoch": 4625} {"train_loss": -26.245513916015625, "global_step": 383927, "epoch": 4625} {"train_loss": -26.118635177612305, "global_step": 383928, "epoch": 4625} {"train_loss": -26.6487979888916, "global_step": 383929, "epoch": 4625} {"train_loss": -26.388090133666992, "global_step": 383930, "epoch": 4625} {"train_loss": -26.374670028686523, "global_step": 383931, "epoch": 4625} {"train_loss": -26.402841567993164, "global_step": 383932, "epoch": 4625} {"train_loss": -26.447052001953125, "global_step": 383933, "epoch": 4625} {"train_loss": -26.62152671813965, "global_step": 383934, "epoch": 4625} {"train_loss": -26.656152725219727, "global_step": 383935, "epoch": 4625} {"train_loss": -26.714832305908203, "global_step": 383936, "epoch": 4625} {"train_loss": -26.623029708862305, "global_step": 383937, "epoch": 4625} {"train_loss": -26.45658302307129, "global_step": 383938, "epoch": 4625} {"train_loss": -26.646411895751953, "global_step": 383939, "epoch": 4625} {"train_loss": -26.6507568359375, "global_step": 383940, "epoch": 4625} {"train_loss": -26.502042770385742, "global_step": 383941, "epoch": 4625} {"train_loss": -25.962482452392578, "global_step": 383942, "epoch": 4625} {"train_loss": -24.841718673706055, "global_step": 383943, "epoch": 4625} {"train_loss": -24.073488235473633, "global_step": 383944, "epoch": 4625} {"train_loss": -25.01129913330078, "global_step": 383945, "epoch": 4625} {"train_loss": -26.2280216217041, "global_step": 383946, "epoch": 4625} {"train_loss": -25.90546226501465, "global_step": 383947, "epoch": 4625} {"train_loss": -26.194843292236328, "global_step": 383948, "epoch": 4625} {"train_loss": -25.638940811157227, "global_step": 383949, "epoch": 4625} {"train_loss": -26.1460018157959, "global_step": 383950, "epoch": 4625} {"train_loss": -25.84417724609375, "global_step": 383951, "epoch": 4625} {"train_loss": -26.248676300048828, "global_step": 383952, "epoch": 4625} {"train_loss": -25.9946231842041, "global_step": 383953, "epoch": 4625} {"train_loss": -26.306379318237305, "global_step": 383954, "epoch": 4625} {"train_loss": -26.187891006469727, "global_step": 383955, "epoch": 4625} {"train_loss": -26.50300407409668, "global_step": 383956, "epoch": 4625} {"train_loss": -25.67684796344803, "global_step": 383957, "epoch": 4625, "val_loss": 6591042.0} {"train_loss": -26.4786434173584, "global_step": 383958, "epoch": 4626} {"train_loss": -26.092824935913086, "global_step": 383959, "epoch": 4626} {"train_loss": -26.481616973876953, "global_step": 383960, "epoch": 4626} {"train_loss": -25.931140899658203, "global_step": 383961, "epoch": 4626} {"train_loss": -25.88587760925293, "global_step": 383962, "epoch": 4626} {"train_loss": -26.236631393432617, "global_step": 383963, "epoch": 4626} {"train_loss": -26.241491317749023, "global_step": 383964, "epoch": 4626} {"train_loss": -26.126188278198242, "global_step": 383965, "epoch": 4626} {"train_loss": -26.013553619384766, "global_step": 383966, "epoch": 4626} {"train_loss": -26.27472496032715, "global_step": 383967, "epoch": 4626} {"train_loss": -26.057519912719727, "global_step": 383968, "epoch": 4626} {"train_loss": -26.185888290405273, "global_step": 383969, "epoch": 4626} {"train_loss": -26.093481063842773, "global_step": 383970, "epoch": 4626} {"train_loss": -26.315927505493164, "global_step": 383971, "epoch": 4626} {"train_loss": -26.268390655517578, "global_step": 383972, "epoch": 4626} {"train_loss": -26.7992000579834, "global_step": 383973, "epoch": 4626} {"train_loss": -26.351001739501953, "global_step": 383974, "epoch": 4626} {"train_loss": -26.788089752197266, "global_step": 383975, "epoch": 4626} {"train_loss": -26.502185821533203, "global_step": 383976, "epoch": 4626} {"train_loss": -26.267797470092773, "global_step": 383977, "epoch": 4626} {"train_loss": -26.1435489654541, "global_step": 383978, "epoch": 4626} {"train_loss": -26.733219146728516, "global_step": 383979, "epoch": 4626} {"train_loss": -25.7607421875, "global_step": 383980, "epoch": 4626} {"train_loss": -26.628583908081055, "global_step": 383981, "epoch": 4626} {"train_loss": -26.575286865234375, "global_step": 383982, "epoch": 4626} {"train_loss": -26.69135856628418, "global_step": 383983, "epoch": 4626} {"train_loss": -26.419849395751953, "global_step": 383984, "epoch": 4626} {"train_loss": -26.843433380126953, "global_step": 383985, "epoch": 4626} {"train_loss": -26.749561309814453, "global_step": 383986, "epoch": 4626} {"train_loss": -26.547840118408203, "global_step": 383987, "epoch": 4626} {"train_loss": -26.623260498046875, "global_step": 383988, "epoch": 4626} {"train_loss": -26.47958755493164, "global_step": 383989, "epoch": 4626} {"train_loss": -26.059350967407227, "global_step": 383990, "epoch": 4626} {"train_loss": -26.57712173461914, "global_step": 383991, "epoch": 4626} {"train_loss": -26.05586814880371, "global_step": 383992, "epoch": 4626} {"train_loss": -26.4848575592041, "global_step": 383993, "epoch": 4626} {"train_loss": -26.490589141845703, "global_step": 383994, "epoch": 4626} {"train_loss": -26.618642807006836, "global_step": 383995, "epoch": 4626} {"train_loss": -26.741979598999023, "global_step": 383996, "epoch": 4626} {"train_loss": -26.696781158447266, "global_step": 383997, "epoch": 4626} {"train_loss": -26.312015533447266, "global_step": 383998, "epoch": 4626} {"train_loss": -26.723840713500977, "global_step": 383999, "epoch": 4626} {"train_loss": -26.534439086914062, "global_step": 384000, "epoch": 4626} {"train_loss": -26.247907638549805, "global_step": 384001, "epoch": 4626} {"train_loss": -26.521467208862305, "global_step": 384002, "epoch": 4626} {"train_loss": -26.475759506225586, "global_step": 384003, "epoch": 4626} {"train_loss": -26.283935546875, "global_step": 384004, "epoch": 4626} {"train_loss": -26.65827751159668, "global_step": 384005, "epoch": 4626} {"train_loss": -26.576629638671875, "global_step": 384006, "epoch": 4626} {"train_loss": -26.471908569335938, "global_step": 384007, "epoch": 4626} {"train_loss": -26.673141479492188, "global_step": 384008, "epoch": 4626} {"train_loss": -26.580341339111328, "global_step": 384009, "epoch": 4626} {"train_loss": -26.8952693939209, "global_step": 384010, "epoch": 4626} {"train_loss": -26.62054443359375, "global_step": 384011, "epoch": 4626} {"train_loss": -26.600549697875977, "global_step": 384012, "epoch": 4626} {"train_loss": -26.865209579467773, "global_step": 384013, "epoch": 4626} {"train_loss": -26.633041381835938, "global_step": 384014, "epoch": 4626} {"train_loss": -26.664457321166992, "global_step": 384015, "epoch": 4626} {"train_loss": -26.75310707092285, "global_step": 384016, "epoch": 4626} {"train_loss": -26.562870025634766, "global_step": 384017, "epoch": 4626} {"train_loss": -26.76008415222168, "global_step": 384018, "epoch": 4626} {"train_loss": -26.402822494506836, "global_step": 384019, "epoch": 4626} {"train_loss": -26.701379776000977, "global_step": 384020, "epoch": 4626} {"train_loss": -26.904983520507812, "global_step": 384021, "epoch": 4626} {"train_loss": -26.46534538269043, "global_step": 384022, "epoch": 4626} {"train_loss": -26.305618286132812, "global_step": 384023, "epoch": 4626} {"train_loss": -26.586135864257812, "global_step": 384024, "epoch": 4626} {"train_loss": -26.7856502532959, "global_step": 384025, "epoch": 4626} {"train_loss": -26.603179931640625, "global_step": 384026, "epoch": 4626} {"train_loss": -26.687789916992188, "global_step": 384027, "epoch": 4626} {"train_loss": -26.212650299072266, "global_step": 384028, "epoch": 4626} {"train_loss": -26.924823760986328, "global_step": 384029, "epoch": 4626} {"train_loss": -26.69696617126465, "global_step": 384030, "epoch": 4626} {"train_loss": -26.550745010375977, "global_step": 384031, "epoch": 4626} {"train_loss": -26.36284828186035, "global_step": 384032, "epoch": 4626} {"train_loss": -26.56721305847168, "global_step": 384033, "epoch": 4626} {"train_loss": -26.3301944732666, "global_step": 384034, "epoch": 4626} {"train_loss": -26.243331909179688, "global_step": 384035, "epoch": 4626} {"train_loss": -25.911977767944336, "global_step": 384036, "epoch": 4626} {"train_loss": -26.650793075561523, "global_step": 384037, "epoch": 4626} {"train_loss": -26.600637435913086, "global_step": 384038, "epoch": 4626} {"train_loss": -26.850019454956055, "global_step": 384039, "epoch": 4626} {"train_loss": -26.48737392655338, "global_step": 384040, "epoch": 4626, "val_loss": 6641796.0} {"train_loss": -24.266895294189453, "global_step": 384041, "epoch": 4627} {"train_loss": -23.982160568237305, "global_step": 384042, "epoch": 4627} {"train_loss": -24.890226364135742, "global_step": 384043, "epoch": 4627} {"train_loss": -24.349802017211914, "global_step": 384044, "epoch": 4627} {"train_loss": -24.956912994384766, "global_step": 384045, "epoch": 4627} {"train_loss": -24.85154151916504, "global_step": 384046, "epoch": 4627} {"train_loss": -25.07002067565918, "global_step": 384047, "epoch": 4627} {"train_loss": -24.871070861816406, "global_step": 384048, "epoch": 4627} {"train_loss": -25.387109756469727, "global_step": 384049, "epoch": 4627} {"train_loss": -24.98831558227539, "global_step": 384050, "epoch": 4627} {"train_loss": -25.182483673095703, "global_step": 384051, "epoch": 4627} {"train_loss": -25.6779842376709, "global_step": 384052, "epoch": 4627} {"train_loss": -25.603239059448242, "global_step": 384053, "epoch": 4627} {"train_loss": -25.569501876831055, "global_step": 384054, "epoch": 4627} {"train_loss": -25.62371253967285, "global_step": 384055, "epoch": 4627} {"train_loss": -25.680246353149414, "global_step": 384056, "epoch": 4627} {"train_loss": -25.564884185791016, "global_step": 384057, "epoch": 4627} {"train_loss": -25.865341186523438, "global_step": 384058, "epoch": 4627} {"train_loss": -25.637725830078125, "global_step": 384059, "epoch": 4627} {"train_loss": -25.894763946533203, "global_step": 384060, "epoch": 4627} {"train_loss": -25.872303009033203, "global_step": 384061, "epoch": 4627} {"train_loss": -25.865610122680664, "global_step": 384062, "epoch": 4627} {"train_loss": -25.71077537536621, "global_step": 384063, "epoch": 4627} {"train_loss": -25.62677574157715, "global_step": 384064, "epoch": 4627} {"train_loss": -25.974430084228516, "global_step": 384065, "epoch": 4627} {"train_loss": -25.693893432617188, "global_step": 384066, "epoch": 4627} {"train_loss": -25.874784469604492, "global_step": 384067, "epoch": 4627} {"train_loss": -26.085126876831055, "global_step": 384068, "epoch": 4627} {"train_loss": -25.949888229370117, "global_step": 384069, "epoch": 4627} {"train_loss": -26.030221939086914, "global_step": 384070, "epoch": 4627} {"train_loss": -26.26398277282715, "global_step": 384071, "epoch": 4627} {"train_loss": -25.991601943969727, "global_step": 384072, "epoch": 4627} {"train_loss": -26.018198013305664, "global_step": 384073, "epoch": 4627} {"train_loss": -26.232898712158203, "global_step": 384074, "epoch": 4627} {"train_loss": -26.43886375427246, "global_step": 384075, "epoch": 4627} {"train_loss": -25.8776798248291, "global_step": 384076, "epoch": 4627} {"train_loss": -26.458759307861328, "global_step": 384077, "epoch": 4627} {"train_loss": -26.089187622070312, "global_step": 384078, "epoch": 4627} {"train_loss": -26.20423698425293, "global_step": 384079, "epoch": 4627} {"train_loss": -26.498998641967773, "global_step": 384080, "epoch": 4627} {"train_loss": -26.916006088256836, "global_step": 384081, "epoch": 4627} {"train_loss": -26.524686813354492, "global_step": 384082, "epoch": 4627} {"train_loss": -26.377599716186523, "global_step": 384083, "epoch": 4627} {"train_loss": -26.478662490844727, "global_step": 384084, "epoch": 4627} {"train_loss": -26.517475128173828, "global_step": 384085, "epoch": 4627} {"train_loss": -26.171850204467773, "global_step": 384086, "epoch": 4627} {"train_loss": -26.41045570373535, "global_step": 384087, "epoch": 4627} {"train_loss": -26.75862693786621, "global_step": 384088, "epoch": 4627} {"train_loss": -26.61446189880371, "global_step": 384089, "epoch": 4627} {"train_loss": -26.817819595336914, "global_step": 384090, "epoch": 4627} {"train_loss": -26.51944923400879, "global_step": 384091, "epoch": 4627} {"train_loss": -26.724454879760742, "global_step": 384092, "epoch": 4627} {"train_loss": -26.56292152404785, "global_step": 384093, "epoch": 4627} {"train_loss": -26.84053611755371, "global_step": 384094, "epoch": 4627} {"train_loss": -26.149951934814453, "global_step": 384095, "epoch": 4627} {"train_loss": -26.74945068359375, "global_step": 384096, "epoch": 4627} {"train_loss": -26.556507110595703, "global_step": 384097, "epoch": 4627} {"train_loss": -26.56689453125, "global_step": 384098, "epoch": 4627} {"train_loss": -26.95199966430664, "global_step": 384099, "epoch": 4627} {"train_loss": -26.912933349609375, "global_step": 384100, "epoch": 4627} {"train_loss": -26.777063369750977, "global_step": 384101, "epoch": 4627} {"train_loss": -26.71747398376465, "global_step": 384102, "epoch": 4627} {"train_loss": -26.3115291595459, "global_step": 384103, "epoch": 4627} {"train_loss": -26.53376579284668, "global_step": 384104, "epoch": 4627} {"train_loss": -26.79115867614746, "global_step": 384105, "epoch": 4627} {"train_loss": -26.530420303344727, "global_step": 384106, "epoch": 4627} {"train_loss": -26.7904109954834, "global_step": 384107, "epoch": 4627} {"train_loss": -26.558889389038086, "global_step": 384108, "epoch": 4627} {"train_loss": -26.83100700378418, "global_step": 384109, "epoch": 4627} {"train_loss": -26.8437442779541, "global_step": 384110, "epoch": 4627} {"train_loss": -26.940799713134766, "global_step": 384111, "epoch": 4627} {"train_loss": -26.329666137695312, "global_step": 384112, "epoch": 4627} {"train_loss": -26.89124870300293, "global_step": 384113, "epoch": 4627} {"train_loss": -27.052167892456055, "global_step": 384114, "epoch": 4627} {"train_loss": -26.5837345123291, "global_step": 384115, "epoch": 4627} {"train_loss": -26.429479598999023, "global_step": 384116, "epoch": 4627} {"train_loss": -26.390207290649414, "global_step": 384117, "epoch": 4627} {"train_loss": -26.38916015625, "global_step": 384118, "epoch": 4627} {"train_loss": -26.456525802612305, "global_step": 384119, "epoch": 4627} {"train_loss": -26.124114990234375, "global_step": 384120, "epoch": 4627} {"train_loss": -26.308948516845703, "global_step": 384121, "epoch": 4627} {"train_loss": -26.432580947875977, "global_step": 384122, "epoch": 4627} {"train_loss": -26.115088887961512, "global_step": 384123, "epoch": 4627, "val_loss": 6685276.0} {"train_loss": -24.641660690307617, "global_step": 384124, "epoch": 4628} {"train_loss": -24.320289611816406, "global_step": 384125, "epoch": 4628} {"train_loss": -25.362905502319336, "global_step": 384126, "epoch": 4628} {"train_loss": -25.581939697265625, "global_step": 384127, "epoch": 4628} {"train_loss": -25.4401912689209, "global_step": 384128, "epoch": 4628} {"train_loss": -25.49002456665039, "global_step": 384129, "epoch": 4628} {"train_loss": -25.878799438476562, "global_step": 384130, "epoch": 4628} {"train_loss": -25.386859893798828, "global_step": 384131, "epoch": 4628} {"train_loss": -26.034032821655273, "global_step": 384132, "epoch": 4628} {"train_loss": -25.431318283081055, "global_step": 384133, "epoch": 4628} {"train_loss": -25.719785690307617, "global_step": 384134, "epoch": 4628} {"train_loss": -25.44202423095703, "global_step": 384135, "epoch": 4628} {"train_loss": -25.304182052612305, "global_step": 384136, "epoch": 4628} {"train_loss": -25.8094482421875, "global_step": 384137, "epoch": 4628} {"train_loss": -25.517595291137695, "global_step": 384138, "epoch": 4628} {"train_loss": -25.88720703125, "global_step": 384139, "epoch": 4628} {"train_loss": -25.761371612548828, "global_step": 384140, "epoch": 4628} {"train_loss": -25.96824073791504, "global_step": 384141, "epoch": 4628} {"train_loss": -25.96759605407715, "global_step": 384142, "epoch": 4628} {"train_loss": -26.093799591064453, "global_step": 384143, "epoch": 4628} {"train_loss": -25.9544620513916, "global_step": 384144, "epoch": 4628} {"train_loss": -26.212182998657227, "global_step": 384145, "epoch": 4628} {"train_loss": -25.693084716796875, "global_step": 384146, "epoch": 4628} {"train_loss": -26.040679931640625, "global_step": 384147, "epoch": 4628} {"train_loss": -25.9532413482666, "global_step": 384148, "epoch": 4628} {"train_loss": -26.10611915588379, "global_step": 384149, "epoch": 4628} {"train_loss": -26.554224014282227, "global_step": 384150, "epoch": 4628} {"train_loss": -26.520471572875977, "global_step": 384151, "epoch": 4628} {"train_loss": -26.269826889038086, "global_step": 384152, "epoch": 4628} {"train_loss": -26.06450843811035, "global_step": 384153, "epoch": 4628} {"train_loss": -26.00738525390625, "global_step": 384154, "epoch": 4628} {"train_loss": -26.17949867248535, "global_step": 384155, "epoch": 4628} {"train_loss": -26.00689125061035, "global_step": 384156, "epoch": 4628} {"train_loss": -26.23016929626465, "global_step": 384157, "epoch": 4628} {"train_loss": -26.645477294921875, "global_step": 384158, "epoch": 4628} {"train_loss": -26.133764266967773, "global_step": 384159, "epoch": 4628} {"train_loss": -26.46449089050293, "global_step": 384160, "epoch": 4628} {"train_loss": -26.2834415435791, "global_step": 384161, "epoch": 4628} {"train_loss": -26.359251022338867, "global_step": 384162, "epoch": 4628} {"train_loss": -26.600006103515625, "global_step": 384163, "epoch": 4628} {"train_loss": -26.669677734375, "global_step": 384164, "epoch": 4628} {"train_loss": -26.2219181060791, "global_step": 384165, "epoch": 4628} {"train_loss": -26.553909301757812, "global_step": 384166, "epoch": 4628} {"train_loss": -26.61758804321289, "global_step": 384167, "epoch": 4628} {"train_loss": -26.563404083251953, "global_step": 384168, "epoch": 4628} {"train_loss": -26.318872451782227, "global_step": 384169, "epoch": 4628} {"train_loss": -26.20680809020996, "global_step": 384170, "epoch": 4628} {"train_loss": -26.57733726501465, "global_step": 384171, "epoch": 4628} {"train_loss": -26.742719650268555, "global_step": 384172, "epoch": 4628} {"train_loss": -26.826932907104492, "global_step": 384173, "epoch": 4628} {"train_loss": -26.627063751220703, "global_step": 384174, "epoch": 4628} {"train_loss": -26.92315101623535, "global_step": 384175, "epoch": 4628} {"train_loss": -26.589624404907227, "global_step": 384176, "epoch": 4628} {"train_loss": -26.864110946655273, "global_step": 384177, "epoch": 4628} {"train_loss": -26.63160514831543, "global_step": 384178, "epoch": 4628} {"train_loss": -26.874082565307617, "global_step": 384179, "epoch": 4628} {"train_loss": -26.72113609313965, "global_step": 384180, "epoch": 4628} {"train_loss": -26.536779403686523, "global_step": 384181, "epoch": 4628} {"train_loss": -26.319604873657227, "global_step": 384182, "epoch": 4628} {"train_loss": -26.54694938659668, "global_step": 384183, "epoch": 4628} {"train_loss": -26.829755783081055, "global_step": 384184, "epoch": 4628} {"train_loss": -26.60980224609375, "global_step": 384185, "epoch": 4628} {"train_loss": -26.5688533782959, "global_step": 384186, "epoch": 4628} {"train_loss": -26.945117950439453, "global_step": 384187, "epoch": 4628} {"train_loss": -26.5667667388916, "global_step": 384188, "epoch": 4628} {"train_loss": -26.742048263549805, "global_step": 384189, "epoch": 4628} {"train_loss": -26.68084144592285, "global_step": 384190, "epoch": 4628} {"train_loss": -26.480545043945312, "global_step": 384191, "epoch": 4628} {"train_loss": -26.44169044494629, "global_step": 384192, "epoch": 4628} {"train_loss": -26.497821807861328, "global_step": 384193, "epoch": 4628} {"train_loss": -26.3836612701416, "global_step": 384194, "epoch": 4628} {"train_loss": -26.69879150390625, "global_step": 384195, "epoch": 4628} {"train_loss": -26.520618438720703, "global_step": 384196, "epoch": 4628} {"train_loss": -26.41318702697754, "global_step": 384197, "epoch": 4628} {"train_loss": -26.639602661132812, "global_step": 384198, "epoch": 4628} {"train_loss": -26.888996124267578, "global_step": 384199, "epoch": 4628} {"train_loss": -26.593994140625, "global_step": 384200, "epoch": 4628} {"train_loss": -26.639179229736328, "global_step": 384201, "epoch": 4628} {"train_loss": -26.81742286682129, "global_step": 384202, "epoch": 4628} {"train_loss": -26.5537166595459, "global_step": 384203, "epoch": 4628} {"train_loss": -26.79962730407715, "global_step": 384204, "epoch": 4628} {"train_loss": -26.36909294128418, "global_step": 384205, "epoch": 4628} {"train_loss": -26.250423385436278, "global_step": 384206, "epoch": 4628, "val_loss": 6712016.0} {"train_loss": -25.4345645904541, "global_step": 384207, "epoch": 4629} {"train_loss": -24.504140853881836, "global_step": 384208, "epoch": 4629} {"train_loss": -25.044286727905273, "global_step": 384209, "epoch": 4629} {"train_loss": -24.35063362121582, "global_step": 384210, "epoch": 4629} {"train_loss": -25.92225456237793, "global_step": 384211, "epoch": 4629} {"train_loss": -24.99237632751465, "global_step": 384212, "epoch": 4629} {"train_loss": -24.603857040405273, "global_step": 384213, "epoch": 4629} {"train_loss": -25.707334518432617, "global_step": 384214, "epoch": 4629} {"train_loss": -25.477746963500977, "global_step": 384215, "epoch": 4629} {"train_loss": -25.71880531311035, "global_step": 384216, "epoch": 4629} {"train_loss": -25.38027000427246, "global_step": 384217, "epoch": 4629} {"train_loss": -26.115232467651367, "global_step": 384218, "epoch": 4629} {"train_loss": -25.710163116455078, "global_step": 384219, "epoch": 4629} {"train_loss": -26.440475463867188, "global_step": 384220, "epoch": 4629} {"train_loss": -25.873701095581055, "global_step": 384221, "epoch": 4629} {"train_loss": -25.666889190673828, "global_step": 384222, "epoch": 4629} {"train_loss": -26.199201583862305, "global_step": 384223, "epoch": 4629} {"train_loss": -26.09465980529785, "global_step": 384224, "epoch": 4629} {"train_loss": -25.88362693786621, "global_step": 384225, "epoch": 4629} {"train_loss": -26.27434730529785, "global_step": 384226, "epoch": 4629} {"train_loss": -25.96150016784668, "global_step": 384227, "epoch": 4629} {"train_loss": -25.781896591186523, "global_step": 384228, "epoch": 4629} {"train_loss": -26.326343536376953, "global_step": 384229, "epoch": 4629} {"train_loss": -26.0926513671875, "global_step": 384230, "epoch": 4629} {"train_loss": -26.25018310546875, "global_step": 384231, "epoch": 4629} {"train_loss": -26.2388916015625, "global_step": 384232, "epoch": 4629} {"train_loss": -26.066720962524414, "global_step": 384233, "epoch": 4629} {"train_loss": -26.166431427001953, "global_step": 384234, "epoch": 4629} {"train_loss": -26.202533721923828, "global_step": 384235, "epoch": 4629} {"train_loss": -26.4625186920166, "global_step": 384236, "epoch": 4629} {"train_loss": -26.2491512298584, "global_step": 384237, "epoch": 4629} {"train_loss": -26.53375244140625, "global_step": 384238, "epoch": 4629} {"train_loss": -26.70868492126465, "global_step": 384239, "epoch": 4629} {"train_loss": -26.341663360595703, "global_step": 384240, "epoch": 4629} {"train_loss": -26.418615341186523, "global_step": 384241, "epoch": 4629} {"train_loss": -26.496183395385742, "global_step": 384242, "epoch": 4629} {"train_loss": -26.307392120361328, "global_step": 384243, "epoch": 4629} {"train_loss": -26.84628677368164, "global_step": 384244, "epoch": 4629} {"train_loss": -26.608762741088867, "global_step": 384245, "epoch": 4629} {"train_loss": -26.396472930908203, "global_step": 384246, "epoch": 4629} {"train_loss": -26.348098754882812, "global_step": 384247, "epoch": 4629} {"train_loss": -26.26997184753418, "global_step": 384248, "epoch": 4629} {"train_loss": -26.48475456237793, "global_step": 384249, "epoch": 4629} {"train_loss": -26.745025634765625, "global_step": 384250, "epoch": 4629} {"train_loss": -26.62495231628418, "global_step": 384251, "epoch": 4629} {"train_loss": -26.63514518737793, "global_step": 384252, "epoch": 4629} {"train_loss": -26.8167781829834, "global_step": 384253, "epoch": 4629} {"train_loss": -26.557586669921875, "global_step": 384254, "epoch": 4629} {"train_loss": -26.488550186157227, "global_step": 384255, "epoch": 4629} {"train_loss": -26.88077163696289, "global_step": 384256, "epoch": 4629} {"train_loss": -26.68647575378418, "global_step": 384257, "epoch": 4629} {"train_loss": -26.76580810546875, "global_step": 384258, "epoch": 4629} {"train_loss": -26.59076499938965, "global_step": 384259, "epoch": 4629} {"train_loss": -26.54632568359375, "global_step": 384260, "epoch": 4629} {"train_loss": -26.6488037109375, "global_step": 384261, "epoch": 4629} {"train_loss": -26.831823348999023, "global_step": 384262, "epoch": 4629} {"train_loss": -26.527997970581055, "global_step": 384263, "epoch": 4629} {"train_loss": -27.041522979736328, "global_step": 384264, "epoch": 4629} {"train_loss": -26.782846450805664, "global_step": 384265, "epoch": 4629} {"train_loss": -26.464807510375977, "global_step": 384266, "epoch": 4629} {"train_loss": -26.7652645111084, "global_step": 384267, "epoch": 4629} {"train_loss": -26.327167510986328, "global_step": 384268, "epoch": 4629} {"train_loss": -26.81964683532715, "global_step": 384269, "epoch": 4629} {"train_loss": -26.02008056640625, "global_step": 384270, "epoch": 4629} {"train_loss": -26.50605583190918, "global_step": 384271, "epoch": 4629} {"train_loss": -26.48737907409668, "global_step": 384272, "epoch": 4629} {"train_loss": -26.779376983642578, "global_step": 384273, "epoch": 4629} {"train_loss": -26.549352645874023, "global_step": 384274, "epoch": 4629} {"train_loss": -26.4510440826416, "global_step": 384275, "epoch": 4629} {"train_loss": -26.398427963256836, "global_step": 384276, "epoch": 4629} {"train_loss": -26.579370498657227, "global_step": 384277, "epoch": 4629} {"train_loss": -26.46550941467285, "global_step": 384278, "epoch": 4629} {"train_loss": -26.140033721923828, "global_step": 384279, "epoch": 4629} {"train_loss": -26.471820831298828, "global_step": 384280, "epoch": 4629} {"train_loss": -26.344593048095703, "global_step": 384281, "epoch": 4629} {"train_loss": -26.318328857421875, "global_step": 384282, "epoch": 4629} {"train_loss": -26.145605087280273, "global_step": 384283, "epoch": 4629} {"train_loss": -26.7813777923584, "global_step": 384284, "epoch": 4629} {"train_loss": -25.886178970336914, "global_step": 384285, "epoch": 4629} {"train_loss": -26.084959030151367, "global_step": 384286, "epoch": 4629} {"train_loss": -26.359846115112305, "global_step": 384287, "epoch": 4629} {"train_loss": -26.244461059570312, "global_step": 384288, "epoch": 4629} {"train_loss": -26.23678395834314, "global_step": 384289, "epoch": 4629, "val_loss": 6623302.0} {"train_loss": -25.48760414123535, "global_step": 384290, "epoch": 4630} {"train_loss": -24.02554702758789, "global_step": 384291, "epoch": 4630} {"train_loss": -25.378450393676758, "global_step": 384292, "epoch": 4630} {"train_loss": -24.174379348754883, "global_step": 384293, "epoch": 4630} {"train_loss": -23.535354614257812, "global_step": 384294, "epoch": 4630} {"train_loss": -25.634418487548828, "global_step": 384295, "epoch": 4630} {"train_loss": -24.68739128112793, "global_step": 384296, "epoch": 4630} {"train_loss": -24.89937400817871, "global_step": 384297, "epoch": 4630} {"train_loss": -24.972412109375, "global_step": 384298, "epoch": 4630} {"train_loss": -25.167633056640625, "global_step": 384299, "epoch": 4630} {"train_loss": -25.304107666015625, "global_step": 384300, "epoch": 4630} {"train_loss": -25.655847549438477, "global_step": 384301, "epoch": 4630} {"train_loss": -25.005449295043945, "global_step": 384302, "epoch": 4630} {"train_loss": -25.136362075805664, "global_step": 384303, "epoch": 4630} {"train_loss": -25.72041893005371, "global_step": 384304, "epoch": 4630} {"train_loss": -25.6301326751709, "global_step": 384305, "epoch": 4630} {"train_loss": -25.894712448120117, "global_step": 384306, "epoch": 4630} {"train_loss": -25.778528213500977, "global_step": 384307, "epoch": 4630} {"train_loss": -25.819700241088867, "global_step": 384308, "epoch": 4630} {"train_loss": -25.635602951049805, "global_step": 384309, "epoch": 4630} {"train_loss": -25.528095245361328, "global_step": 384310, "epoch": 4630} {"train_loss": -25.793615341186523, "global_step": 384311, "epoch": 4630} {"train_loss": -25.565942764282227, "global_step": 384312, "epoch": 4630} {"train_loss": -25.8166446685791, "global_step": 384313, "epoch": 4630} {"train_loss": -26.121557235717773, "global_step": 384314, "epoch": 4630} {"train_loss": -25.64814567565918, "global_step": 384315, "epoch": 4630} {"train_loss": -25.96889305114746, "global_step": 384316, "epoch": 4630} {"train_loss": -26.129165649414062, "global_step": 384317, "epoch": 4630} {"train_loss": -26.202850341796875, "global_step": 384318, "epoch": 4630} {"train_loss": -25.85297203063965, "global_step": 384319, "epoch": 4630} {"train_loss": -26.163572311401367, "global_step": 384320, "epoch": 4630} {"train_loss": -25.799840927124023, "global_step": 384321, "epoch": 4630} {"train_loss": -25.663427352905273, "global_step": 384322, "epoch": 4630} {"train_loss": -25.95016860961914, "global_step": 384323, "epoch": 4630} {"train_loss": -25.773487091064453, "global_step": 384324, "epoch": 4630} {"train_loss": -26.5376033782959, "global_step": 384325, "epoch": 4630} {"train_loss": -26.109548568725586, "global_step": 384326, "epoch": 4630} {"train_loss": -26.28000831604004, "global_step": 384327, "epoch": 4630} {"train_loss": -25.934057235717773, "global_step": 384328, "epoch": 4630} {"train_loss": -26.32999610900879, "global_step": 384329, "epoch": 4630} {"train_loss": -25.99104118347168, "global_step": 384330, "epoch": 4630} {"train_loss": -26.436511993408203, "global_step": 384331, "epoch": 4630} {"train_loss": -26.44150733947754, "global_step": 384332, "epoch": 4630} {"train_loss": -26.17122459411621, "global_step": 384333, "epoch": 4630} {"train_loss": -26.433502197265625, "global_step": 384334, "epoch": 4630} {"train_loss": -26.067590713500977, "global_step": 384335, "epoch": 4630} {"train_loss": -26.17901039123535, "global_step": 384336, "epoch": 4630} {"train_loss": -26.720062255859375, "global_step": 384337, "epoch": 4630} {"train_loss": -26.448835372924805, "global_step": 384338, "epoch": 4630} {"train_loss": -26.141042709350586, "global_step": 384339, "epoch": 4630} {"train_loss": -26.425867080688477, "global_step": 384340, "epoch": 4630} {"train_loss": -26.379465103149414, "global_step": 384341, "epoch": 4630} {"train_loss": -26.497568130493164, "global_step": 384342, "epoch": 4630} {"train_loss": -26.839040756225586, "global_step": 384343, "epoch": 4630} {"train_loss": -26.65077018737793, "global_step": 384344, "epoch": 4630} {"train_loss": -26.496992111206055, "global_step": 384345, "epoch": 4630} {"train_loss": -26.701623916625977, "global_step": 384346, "epoch": 4630} {"train_loss": -26.428192138671875, "global_step": 384347, "epoch": 4630} {"train_loss": -26.445728302001953, "global_step": 384348, "epoch": 4630} {"train_loss": -26.722070693969727, "global_step": 384349, "epoch": 4630} {"train_loss": -26.721393585205078, "global_step": 384350, "epoch": 4630} {"train_loss": -26.611173629760742, "global_step": 384351, "epoch": 4630} {"train_loss": -26.517263412475586, "global_step": 384352, "epoch": 4630} {"train_loss": -26.31552505493164, "global_step": 384353, "epoch": 4630} {"train_loss": -26.293012619018555, "global_step": 384354, "epoch": 4630} {"train_loss": -26.755905151367188, "global_step": 384355, "epoch": 4630} {"train_loss": -26.2272891998291, "global_step": 384356, "epoch": 4630} {"train_loss": -25.6196346282959, "global_step": 384357, "epoch": 4630} {"train_loss": -25.941848754882812, "global_step": 384358, "epoch": 4630} {"train_loss": -26.17206382751465, "global_step": 384359, "epoch": 4630} {"train_loss": -25.629932403564453, "global_step": 384360, "epoch": 4630} {"train_loss": -25.995450973510742, "global_step": 384361, "epoch": 4630} {"train_loss": -25.566726684570312, "global_step": 384362, "epoch": 4630} {"train_loss": -25.787734985351562, "global_step": 384363, "epoch": 4630} {"train_loss": -26.00678825378418, "global_step": 384364, "epoch": 4630} {"train_loss": -26.00318717956543, "global_step": 384365, "epoch": 4630} {"train_loss": -25.986005783081055, "global_step": 384366, "epoch": 4630} {"train_loss": -25.97706413269043, "global_step": 384367, "epoch": 4630} {"train_loss": -26.530364990234375, "global_step": 384368, "epoch": 4630} {"train_loss": -26.211164474487305, "global_step": 384369, "epoch": 4630} {"train_loss": -25.863636016845703, "global_step": 384370, "epoch": 4630} {"train_loss": -26.562026977539062, "global_step": 384371, "epoch": 4630} {"train_loss": -25.94825680284615, "global_step": 384372, "epoch": 4630, "val_loss": 6589285.0} {"train_loss": -25.873117446899414, "global_step": 384373, "epoch": 4631} {"train_loss": -25.769983291625977, "global_step": 384374, "epoch": 4631} {"train_loss": -26.02753257751465, "global_step": 384375, "epoch": 4631} {"train_loss": -25.155960083007812, "global_step": 384376, "epoch": 4631} {"train_loss": -25.8621826171875, "global_step": 384377, "epoch": 4631} {"train_loss": -26.11907386779785, "global_step": 384378, "epoch": 4631} {"train_loss": -25.82916831970215, "global_step": 384379, "epoch": 4631} {"train_loss": -26.197317123413086, "global_step": 384380, "epoch": 4631} {"train_loss": -25.71217155456543, "global_step": 384381, "epoch": 4631} {"train_loss": -26.1065673828125, "global_step": 384382, "epoch": 4631} {"train_loss": -26.08570671081543, "global_step": 384383, "epoch": 4631} {"train_loss": -25.9694881439209, "global_step": 384384, "epoch": 4631} {"train_loss": -25.748443603515625, "global_step": 384385, "epoch": 4631} {"train_loss": -25.948705673217773, "global_step": 384386, "epoch": 4631} {"train_loss": -25.7156982421875, "global_step": 384387, "epoch": 4631} {"train_loss": -26.39765739440918, "global_step": 384388, "epoch": 4631} {"train_loss": -26.102914810180664, "global_step": 384389, "epoch": 4631} {"train_loss": -26.117645263671875, "global_step": 384390, "epoch": 4631} {"train_loss": -25.987226486206055, "global_step": 384391, "epoch": 4631} {"train_loss": -26.326068878173828, "global_step": 384392, "epoch": 4631} {"train_loss": -26.44296646118164, "global_step": 384393, "epoch": 4631} {"train_loss": -26.172651290893555, "global_step": 384394, "epoch": 4631} {"train_loss": -25.844247817993164, "global_step": 384395, "epoch": 4631} {"train_loss": -26.196990966796875, "global_step": 384396, "epoch": 4631} {"train_loss": -26.103199005126953, "global_step": 384397, "epoch": 4631} {"train_loss": -26.434406280517578, "global_step": 384398, "epoch": 4631} {"train_loss": -26.431262969970703, "global_step": 384399, "epoch": 4631} {"train_loss": -26.149946212768555, "global_step": 384400, "epoch": 4631} {"train_loss": -26.57090187072754, "global_step": 384401, "epoch": 4631} {"train_loss": -26.511072158813477, "global_step": 384402, "epoch": 4631} {"train_loss": -26.398550033569336, "global_step": 384403, "epoch": 4631} {"train_loss": -26.32550048828125, "global_step": 384404, "epoch": 4631} {"train_loss": -26.521589279174805, "global_step": 384405, "epoch": 4631} {"train_loss": -26.48734474182129, "global_step": 384406, "epoch": 4631} {"train_loss": -26.966617584228516, "global_step": 384407, "epoch": 4631} {"train_loss": -26.665924072265625, "global_step": 384408, "epoch": 4631} {"train_loss": -26.597822189331055, "global_step": 384409, "epoch": 4631} {"train_loss": -26.694232940673828, "global_step": 384410, "epoch": 4631} {"train_loss": -27.057538986206055, "global_step": 384411, "epoch": 4631} {"train_loss": -26.767663955688477, "global_step": 384412, "epoch": 4631} {"train_loss": -26.368192672729492, "global_step": 384413, "epoch": 4631} {"train_loss": -26.553258895874023, "global_step": 384414, "epoch": 4631} {"train_loss": -26.9110164642334, "global_step": 384415, "epoch": 4631} {"train_loss": -26.59486198425293, "global_step": 384416, "epoch": 4631} {"train_loss": -26.74688148498535, "global_step": 384417, "epoch": 4631} {"train_loss": -26.760419845581055, "global_step": 384418, "epoch": 4631} {"train_loss": -26.314172744750977, "global_step": 384419, "epoch": 4631} {"train_loss": -26.522907257080078, "global_step": 384420, "epoch": 4631} {"train_loss": -26.149478912353516, "global_step": 384421, "epoch": 4631} {"train_loss": -26.274490356445312, "global_step": 384422, "epoch": 4631} {"train_loss": -26.38071060180664, "global_step": 384423, "epoch": 4631} {"train_loss": -26.426939010620117, "global_step": 384424, "epoch": 4631} {"train_loss": -26.367828369140625, "global_step": 384425, "epoch": 4631} {"train_loss": -27.1651611328125, "global_step": 384426, "epoch": 4631} {"train_loss": -26.392627716064453, "global_step": 384427, "epoch": 4631} {"train_loss": -26.505130767822266, "global_step": 384428, "epoch": 4631} {"train_loss": -26.6105899810791, "global_step": 384429, "epoch": 4631} {"train_loss": -26.75657081604004, "global_step": 384430, "epoch": 4631} {"train_loss": -26.424245834350586, "global_step": 384431, "epoch": 4631} {"train_loss": -26.73780632019043, "global_step": 384432, "epoch": 4631} {"train_loss": -26.91958999633789, "global_step": 384433, "epoch": 4631} {"train_loss": -26.859634399414062, "global_step": 384434, "epoch": 4631} {"train_loss": -26.51862907409668, "global_step": 384435, "epoch": 4631} {"train_loss": -26.566593170166016, "global_step": 384436, "epoch": 4631} {"train_loss": -26.367633819580078, "global_step": 384437, "epoch": 4631} {"train_loss": -27.060895919799805, "global_step": 384438, "epoch": 4631} {"train_loss": -26.6047306060791, "global_step": 384439, "epoch": 4631} {"train_loss": -26.83829116821289, "global_step": 384440, "epoch": 4631} {"train_loss": -26.740005493164062, "global_step": 384441, "epoch": 4631} {"train_loss": -26.715803146362305, "global_step": 384442, "epoch": 4631} {"train_loss": -26.452054977416992, "global_step": 384443, "epoch": 4631} {"train_loss": -26.519826889038086, "global_step": 384444, "epoch": 4631} {"train_loss": -26.652097702026367, "global_step": 384445, "epoch": 4631} {"train_loss": -26.76080322265625, "global_step": 384446, "epoch": 4631} {"train_loss": -26.6430721282959, "global_step": 384447, "epoch": 4631} {"train_loss": -26.60479736328125, "global_step": 384448, "epoch": 4631} {"train_loss": -26.175764083862305, "global_step": 384449, "epoch": 4631} {"train_loss": -26.757593154907227, "global_step": 384450, "epoch": 4631} {"train_loss": -26.37074089050293, "global_step": 384451, "epoch": 4631} {"train_loss": -26.528564453125, "global_step": 384452, "epoch": 4631} {"train_loss": -27.078857421875, "global_step": 384453, "epoch": 4631} {"train_loss": -26.269739151000977, "global_step": 384454, "epoch": 4631} {"train_loss": -26.403445002544355, "global_step": 384455, "epoch": 4631, "val_loss": 6592833.0} {"train_loss": -26.008319854736328, "global_step": 384456, "epoch": 4632} {"train_loss": -26.35757827758789, "global_step": 384457, "epoch": 4632} {"train_loss": -26.078857421875, "global_step": 384458, "epoch": 4632} {"train_loss": -26.028705596923828, "global_step": 384459, "epoch": 4632} {"train_loss": -26.19122314453125, "global_step": 384460, "epoch": 4632} {"train_loss": -25.684049606323242, "global_step": 384461, "epoch": 4632} {"train_loss": -25.714719772338867, "global_step": 384462, "epoch": 4632} {"train_loss": -26.131872177124023, "global_step": 384463, "epoch": 4632} {"train_loss": -25.20930290222168, "global_step": 384464, "epoch": 4632} {"train_loss": -25.623504638671875, "global_step": 384465, "epoch": 4632} {"train_loss": -25.915542602539062, "global_step": 384466, "epoch": 4632} {"train_loss": -25.802021026611328, "global_step": 384467, "epoch": 4632} {"train_loss": -25.943960189819336, "global_step": 384468, "epoch": 4632} {"train_loss": -26.04736328125, "global_step": 384469, "epoch": 4632} {"train_loss": -25.79387855529785, "global_step": 384470, "epoch": 4632} {"train_loss": -25.902246475219727, "global_step": 384471, "epoch": 4632} {"train_loss": -25.815088272094727, "global_step": 384472, "epoch": 4632} {"train_loss": -26.316455841064453, "global_step": 384473, "epoch": 4632} {"train_loss": -26.13974952697754, "global_step": 384474, "epoch": 4632} {"train_loss": -26.10761833190918, "global_step": 384475, "epoch": 4632} {"train_loss": -25.94366455078125, "global_step": 384476, "epoch": 4632} {"train_loss": -26.388952255249023, "global_step": 384477, "epoch": 4632} {"train_loss": -26.09234046936035, "global_step": 384478, "epoch": 4632} {"train_loss": -26.139989852905273, "global_step": 384479, "epoch": 4632} {"train_loss": -26.435819625854492, "global_step": 384480, "epoch": 4632} {"train_loss": -26.419422149658203, "global_step": 384481, "epoch": 4632} {"train_loss": -26.1932315826416, "global_step": 384482, "epoch": 4632} {"train_loss": -26.162124633789062, "global_step": 384483, "epoch": 4632} {"train_loss": -26.418121337890625, "global_step": 384484, "epoch": 4632} {"train_loss": -26.286863327026367, "global_step": 384485, "epoch": 4632} {"train_loss": -26.106534957885742, "global_step": 384486, "epoch": 4632} {"train_loss": -26.673933029174805, "global_step": 384487, "epoch": 4632} {"train_loss": -26.162118911743164, "global_step": 384488, "epoch": 4632} {"train_loss": -26.340167999267578, "global_step": 384489, "epoch": 4632} {"train_loss": -26.170642852783203, "global_step": 384490, "epoch": 4632} {"train_loss": -26.198429107666016, "global_step": 384491, "epoch": 4632} {"train_loss": -26.788833618164062, "global_step": 384492, "epoch": 4632} {"train_loss": -26.5561580657959, "global_step": 384493, "epoch": 4632} {"train_loss": -26.775720596313477, "global_step": 384494, "epoch": 4632} {"train_loss": -26.5465087890625, "global_step": 384495, "epoch": 4632} {"train_loss": -26.61716079711914, "global_step": 384496, "epoch": 4632} {"train_loss": -26.745376586914062, "global_step": 384497, "epoch": 4632} {"train_loss": -26.435504913330078, "global_step": 384498, "epoch": 4632} {"train_loss": -26.877822875976562, "global_step": 384499, "epoch": 4632} {"train_loss": -26.989953994750977, "global_step": 384500, "epoch": 4632} {"train_loss": -26.495100021362305, "global_step": 384501, "epoch": 4632} {"train_loss": -26.6190128326416, "global_step": 384502, "epoch": 4632} {"train_loss": -26.405115127563477, "global_step": 384503, "epoch": 4632} {"train_loss": -26.370132446289062, "global_step": 384504, "epoch": 4632} {"train_loss": -26.64271354675293, "global_step": 384505, "epoch": 4632} {"train_loss": -26.867170333862305, "global_step": 384506, "epoch": 4632} {"train_loss": -26.716955184936523, "global_step": 384507, "epoch": 4632} {"train_loss": -26.745777130126953, "global_step": 384508, "epoch": 4632} {"train_loss": -26.59503746032715, "global_step": 384509, "epoch": 4632} {"train_loss": -26.60845947265625, "global_step": 384510, "epoch": 4632} {"train_loss": -26.330575942993164, "global_step": 384511, "epoch": 4632} {"train_loss": -26.374670028686523, "global_step": 384512, "epoch": 4632} {"train_loss": -25.934843063354492, "global_step": 384513, "epoch": 4632} {"train_loss": -26.35867691040039, "global_step": 384514, "epoch": 4632} {"train_loss": -26.444751739501953, "global_step": 384515, "epoch": 4632} {"train_loss": -26.713056564331055, "global_step": 384516, "epoch": 4632} {"train_loss": -26.34339714050293, "global_step": 384517, "epoch": 4632} {"train_loss": -26.18899917602539, "global_step": 384518, "epoch": 4632} {"train_loss": -26.49867820739746, "global_step": 384519, "epoch": 4632} {"train_loss": -26.6070613861084, "global_step": 384520, "epoch": 4632} {"train_loss": -26.4639835357666, "global_step": 384521, "epoch": 4632} {"train_loss": -26.4810733795166, "global_step": 384522, "epoch": 4632} {"train_loss": -26.26800537109375, "global_step": 384523, "epoch": 4632} {"train_loss": -26.6960506439209, "global_step": 384524, "epoch": 4632} {"train_loss": -26.514890670776367, "global_step": 384525, "epoch": 4632} {"train_loss": -26.23359489440918, "global_step": 384526, "epoch": 4632} {"train_loss": -26.56171989440918, "global_step": 384527, "epoch": 4632} {"train_loss": -26.346820831298828, "global_step": 384528, "epoch": 4632} {"train_loss": -26.61872673034668, "global_step": 384529, "epoch": 4632} {"train_loss": -26.586380004882812, "global_step": 384530, "epoch": 4632} {"train_loss": -26.10386085510254, "global_step": 384531, "epoch": 4632} {"train_loss": -26.2681827545166, "global_step": 384532, "epoch": 4632} {"train_loss": -27.080951690673828, "global_step": 384533, "epoch": 4632} {"train_loss": -26.52192497253418, "global_step": 384534, "epoch": 4632} {"train_loss": -26.697423934936523, "global_step": 384535, "epoch": 4632} {"train_loss": -26.506269454956055, "global_step": 384536, "epoch": 4632} {"train_loss": -26.471113204956055, "global_step": 384537, "epoch": 4632} {"train_loss": -26.36228009878871, "global_step": 384538, "epoch": 4632, "val_loss": 6565714.0} {"train_loss": -25.770116806030273, "global_step": 384539, "epoch": 4633} {"train_loss": -25.971174240112305, "global_step": 384540, "epoch": 4633} {"train_loss": -25.73383140563965, "global_step": 384541, "epoch": 4633} {"train_loss": -26.0430965423584, "global_step": 384542, "epoch": 4633} {"train_loss": -26.18476676940918, "global_step": 384543, "epoch": 4633} {"train_loss": -26.359638214111328, "global_step": 384544, "epoch": 4633} {"train_loss": -25.938308715820312, "global_step": 384545, "epoch": 4633} {"train_loss": -26.23565101623535, "global_step": 384546, "epoch": 4633} {"train_loss": -26.174299240112305, "global_step": 384547, "epoch": 4633} {"train_loss": -25.73517417907715, "global_step": 384548, "epoch": 4633} {"train_loss": -26.255563735961914, "global_step": 384549, "epoch": 4633} {"train_loss": -26.002197265625, "global_step": 384550, "epoch": 4633} {"train_loss": -26.227758407592773, "global_step": 384551, "epoch": 4633} {"train_loss": -26.151594161987305, "global_step": 384552, "epoch": 4633} {"train_loss": -26.3066349029541, "global_step": 384553, "epoch": 4633} {"train_loss": -25.9549560546875, "global_step": 384554, "epoch": 4633} {"train_loss": -26.587705612182617, "global_step": 384555, "epoch": 4633} {"train_loss": -26.279821395874023, "global_step": 384556, "epoch": 4633} {"train_loss": -26.338642120361328, "global_step": 384557, "epoch": 4633} {"train_loss": -26.369924545288086, "global_step": 384558, "epoch": 4633} {"train_loss": -26.6519775390625, "global_step": 384559, "epoch": 4633} {"train_loss": -26.640790939331055, "global_step": 384560, "epoch": 4633} {"train_loss": -26.256284713745117, "global_step": 384561, "epoch": 4633} {"train_loss": -26.205244064331055, "global_step": 384562, "epoch": 4633} {"train_loss": -26.234134674072266, "global_step": 384563, "epoch": 4633} {"train_loss": -26.1387882232666, "global_step": 384564, "epoch": 4633} {"train_loss": -26.16697120666504, "global_step": 384565, "epoch": 4633} {"train_loss": -26.503803253173828, "global_step": 384566, "epoch": 4633} {"train_loss": -26.45963478088379, "global_step": 384567, "epoch": 4633} {"train_loss": -26.347036361694336, "global_step": 384568, "epoch": 4633} {"train_loss": -26.469497680664062, "global_step": 384569, "epoch": 4633} {"train_loss": -26.468713760375977, "global_step": 384570, "epoch": 4633} {"train_loss": -26.334278106689453, "global_step": 384571, "epoch": 4633} {"train_loss": -26.20490837097168, "global_step": 384572, "epoch": 4633} {"train_loss": -26.292184829711914, "global_step": 384573, "epoch": 4633} {"train_loss": -26.393644332885742, "global_step": 384574, "epoch": 4633} {"train_loss": -26.303668975830078, "global_step": 384575, "epoch": 4633} {"train_loss": -26.28497886657715, "global_step": 384576, "epoch": 4633} {"train_loss": -26.550344467163086, "global_step": 384577, "epoch": 4633} {"train_loss": -26.378650665283203, "global_step": 384578, "epoch": 4633} {"train_loss": -26.613431930541992, "global_step": 384579, "epoch": 4633} {"train_loss": -26.566226959228516, "global_step": 384580, "epoch": 4633} {"train_loss": -26.562976837158203, "global_step": 384581, "epoch": 4633} {"train_loss": -26.650104522705078, "global_step": 384582, "epoch": 4633} {"train_loss": -26.526819229125977, "global_step": 384583, "epoch": 4633} {"train_loss": -26.656217575073242, "global_step": 384584, "epoch": 4633} {"train_loss": -26.61822509765625, "global_step": 384585, "epoch": 4633} {"train_loss": -26.318185806274414, "global_step": 384586, "epoch": 4633} {"train_loss": -26.444711685180664, "global_step": 384587, "epoch": 4633} {"train_loss": -26.64344596862793, "global_step": 384588, "epoch": 4633} {"train_loss": -26.876432418823242, "global_step": 384589, "epoch": 4633} {"train_loss": -26.394628524780273, "global_step": 384590, "epoch": 4633} {"train_loss": -26.615442276000977, "global_step": 384591, "epoch": 4633} {"train_loss": -26.938888549804688, "global_step": 384592, "epoch": 4633} {"train_loss": -26.779998779296875, "global_step": 384593, "epoch": 4633} {"train_loss": -26.52239418029785, "global_step": 384594, "epoch": 4633} {"train_loss": -26.047765731811523, "global_step": 384595, "epoch": 4633} {"train_loss": -26.423627853393555, "global_step": 384596, "epoch": 4633} {"train_loss": -26.5631103515625, "global_step": 384597, "epoch": 4633} {"train_loss": -26.486469268798828, "global_step": 384598, "epoch": 4633} {"train_loss": -26.562719345092773, "global_step": 384599, "epoch": 4633} {"train_loss": -26.833820343017578, "global_step": 384600, "epoch": 4633} {"train_loss": -26.561206817626953, "global_step": 384601, "epoch": 4633} {"train_loss": -26.37799644470215, "global_step": 384602, "epoch": 4633} {"train_loss": -26.54961585998535, "global_step": 384603, "epoch": 4633} {"train_loss": -26.512475967407227, "global_step": 384604, "epoch": 4633} {"train_loss": -26.871570587158203, "global_step": 384605, "epoch": 4633} {"train_loss": -26.94453239440918, "global_step": 384606, "epoch": 4633} {"train_loss": -26.699262619018555, "global_step": 384607, "epoch": 4633} {"train_loss": -26.75433921813965, "global_step": 384608, "epoch": 4633} {"train_loss": -26.72127342224121, "global_step": 384609, "epoch": 4633} {"train_loss": -26.10761833190918, "global_step": 384610, "epoch": 4633} {"train_loss": -27.125762939453125, "global_step": 384611, "epoch": 4633} {"train_loss": -26.02857780456543, "global_step": 384612, "epoch": 4633} {"train_loss": -26.4782657623291, "global_step": 384613, "epoch": 4633} {"train_loss": -26.686574935913086, "global_step": 384614, "epoch": 4633} {"train_loss": -26.467199325561523, "global_step": 384615, "epoch": 4633} {"train_loss": -26.73650550842285, "global_step": 384616, "epoch": 4633} {"train_loss": -26.472293853759766, "global_step": 384617, "epoch": 4633} {"train_loss": -26.378524780273438, "global_step": 384618, "epoch": 4633} {"train_loss": -26.475391387939453, "global_step": 384619, "epoch": 4633} {"train_loss": -26.667591094970703, "global_step": 384620, "epoch": 4633} {"train_loss": -26.396931200142365, "global_step": 384621, "epoch": 4633, "val_loss": 6566826.5} {"train_loss": -25.393003463745117, "global_step": 384622, "epoch": 4634} {"train_loss": -25.475522994995117, "global_step": 384623, "epoch": 4634} {"train_loss": -25.98304557800293, "global_step": 384624, "epoch": 4634} {"train_loss": -25.422019958496094, "global_step": 384625, "epoch": 4634} {"train_loss": -25.75543785095215, "global_step": 384626, "epoch": 4634} {"train_loss": -25.882476806640625, "global_step": 384627, "epoch": 4634} {"train_loss": -25.40859031677246, "global_step": 384628, "epoch": 4634} {"train_loss": -25.477130889892578, "global_step": 384629, "epoch": 4634} {"train_loss": -25.715055465698242, "global_step": 384630, "epoch": 4634} {"train_loss": -25.39198112487793, "global_step": 384631, "epoch": 4634} {"train_loss": -26.146625518798828, "global_step": 384632, "epoch": 4634} {"train_loss": -25.719879150390625, "global_step": 384633, "epoch": 4634} {"train_loss": -26.31525230407715, "global_step": 384634, "epoch": 4634} {"train_loss": -26.377796173095703, "global_step": 384635, "epoch": 4634} {"train_loss": -26.310285568237305, "global_step": 384636, "epoch": 4634} {"train_loss": -26.251279830932617, "global_step": 384637, "epoch": 4634} {"train_loss": -26.138975143432617, "global_step": 384638, "epoch": 4634} {"train_loss": -26.037694931030273, "global_step": 384639, "epoch": 4634} {"train_loss": -26.50493812561035, "global_step": 384640, "epoch": 4634} {"train_loss": -25.984466552734375, "global_step": 384641, "epoch": 4634} {"train_loss": -26.380401611328125, "global_step": 384642, "epoch": 4634} {"train_loss": -26.113983154296875, "global_step": 384643, "epoch": 4634} {"train_loss": -26.159820556640625, "global_step": 384644, "epoch": 4634} {"train_loss": -26.399097442626953, "global_step": 384645, "epoch": 4634} {"train_loss": -26.302560806274414, "global_step": 384646, "epoch": 4634} {"train_loss": -26.358901977539062, "global_step": 384647, "epoch": 4634} {"train_loss": -26.699438095092773, "global_step": 384648, "epoch": 4634} {"train_loss": -26.559711456298828, "global_step": 384649, "epoch": 4634} {"train_loss": -26.59490394592285, "global_step": 384650, "epoch": 4634} {"train_loss": -26.24118995666504, "global_step": 384651, "epoch": 4634} {"train_loss": -26.066421508789062, "global_step": 384652, "epoch": 4634} {"train_loss": -26.532819747924805, "global_step": 384653, "epoch": 4634} {"train_loss": -26.269683837890625, "global_step": 384654, "epoch": 4634} {"train_loss": -26.6037654876709, "global_step": 384655, "epoch": 4634} {"train_loss": -26.843097686767578, "global_step": 384656, "epoch": 4634} {"train_loss": -26.125839233398438, "global_step": 384657, "epoch": 4634} {"train_loss": -26.533475875854492, "global_step": 384658, "epoch": 4634} {"train_loss": -26.279571533203125, "global_step": 384659, "epoch": 4634} {"train_loss": -26.88802146911621, "global_step": 384660, "epoch": 4634} {"train_loss": -26.96388053894043, "global_step": 384661, "epoch": 4634} {"train_loss": -26.3695068359375, "global_step": 384662, "epoch": 4634} {"train_loss": -26.837512969970703, "global_step": 384663, "epoch": 4634} {"train_loss": -26.607526779174805, "global_step": 384664, "epoch": 4634} {"train_loss": -26.557758331298828, "global_step": 384665, "epoch": 4634} {"train_loss": -26.798694610595703, "global_step": 384666, "epoch": 4634} {"train_loss": -26.702001571655273, "global_step": 384667, "epoch": 4634} {"train_loss": -26.63129997253418, "global_step": 384668, "epoch": 4634} {"train_loss": -26.586566925048828, "global_step": 384669, "epoch": 4634} {"train_loss": -26.43680763244629, "global_step": 384670, "epoch": 4634} {"train_loss": -26.681798934936523, "global_step": 384671, "epoch": 4634} {"train_loss": -26.6386661529541, "global_step": 384672, "epoch": 4634} {"train_loss": -26.563425064086914, "global_step": 384673, "epoch": 4634} {"train_loss": -27.04242515563965, "global_step": 384674, "epoch": 4634} {"train_loss": -26.998767852783203, "global_step": 384675, "epoch": 4634} {"train_loss": -26.54587173461914, "global_step": 384676, "epoch": 4634} {"train_loss": -26.624683380126953, "global_step": 384677, "epoch": 4634} {"train_loss": -26.36686134338379, "global_step": 384678, "epoch": 4634} {"train_loss": -26.894739151000977, "global_step": 384679, "epoch": 4634} {"train_loss": -26.664188385009766, "global_step": 384680, "epoch": 4634} {"train_loss": -26.28708839416504, "global_step": 384681, "epoch": 4634} {"train_loss": -26.890491485595703, "global_step": 384682, "epoch": 4634} {"train_loss": -26.948240280151367, "global_step": 384683, "epoch": 4634} {"train_loss": -26.7673282623291, "global_step": 384684, "epoch": 4634} {"train_loss": -26.541889190673828, "global_step": 384685, "epoch": 4634} {"train_loss": -26.660846710205078, "global_step": 384686, "epoch": 4634} {"train_loss": -26.910205841064453, "global_step": 384687, "epoch": 4634} {"train_loss": -26.960086822509766, "global_step": 384688, "epoch": 4634} {"train_loss": -26.8291072845459, "global_step": 384689, "epoch": 4634} {"train_loss": -26.852819442749023, "global_step": 384690, "epoch": 4634} {"train_loss": -26.580646514892578, "global_step": 384691, "epoch": 4634} {"train_loss": -26.874053955078125, "global_step": 384692, "epoch": 4634} {"train_loss": -25.85993003845215, "global_step": 384693, "epoch": 4634} {"train_loss": -26.14702796936035, "global_step": 384694, "epoch": 4634} {"train_loss": -25.82917594909668, "global_step": 384695, "epoch": 4634} {"train_loss": -26.244504928588867, "global_step": 384696, "epoch": 4634} {"train_loss": -26.484893798828125, "global_step": 384697, "epoch": 4634} {"train_loss": -26.43385887145996, "global_step": 384698, "epoch": 4634} {"train_loss": -26.391250610351562, "global_step": 384699, "epoch": 4634} {"train_loss": -26.28264808654785, "global_step": 384700, "epoch": 4634} {"train_loss": -26.64314079284668, "global_step": 384701, "epoch": 4634} {"train_loss": -26.148426055908203, "global_step": 384702, "epoch": 4634} {"train_loss": -26.163333892822266, "global_step": 384703, "epoch": 4634} {"train_loss": -26.379418292677546, "global_step": 384704, "epoch": 4634, "val_loss": 6639529.0} {"train_loss": -24.847087860107422, "global_step": 384705, "epoch": 4635} {"train_loss": -25.71660804748535, "global_step": 384706, "epoch": 4635} {"train_loss": -25.456188201904297, "global_step": 384707, "epoch": 4635} {"train_loss": -23.915786743164062, "global_step": 384708, "epoch": 4635} {"train_loss": -23.958526611328125, "global_step": 384709, "epoch": 4635} {"train_loss": -25.384660720825195, "global_step": 384710, "epoch": 4635} {"train_loss": -24.796005249023438, "global_step": 384711, "epoch": 4635} {"train_loss": -25.039762496948242, "global_step": 384712, "epoch": 4635} {"train_loss": -25.264474868774414, "global_step": 384713, "epoch": 4635} {"train_loss": -25.153295516967773, "global_step": 384714, "epoch": 4635} {"train_loss": -25.46135711669922, "global_step": 384715, "epoch": 4635} {"train_loss": -25.329092025756836, "global_step": 384716, "epoch": 4635} {"train_loss": -25.541749954223633, "global_step": 384717, "epoch": 4635} {"train_loss": -25.823583602905273, "global_step": 384718, "epoch": 4635} {"train_loss": -25.38694190979004, "global_step": 384719, "epoch": 4635} {"train_loss": -25.317901611328125, "global_step": 384720, "epoch": 4635} {"train_loss": -26.055212020874023, "global_step": 384721, "epoch": 4635} {"train_loss": -25.863269805908203, "global_step": 384722, "epoch": 4635} {"train_loss": -25.939273834228516, "global_step": 384723, "epoch": 4635} {"train_loss": -26.15338134765625, "global_step": 384724, "epoch": 4635} {"train_loss": -25.71392250061035, "global_step": 384725, "epoch": 4635} {"train_loss": -26.00812339782715, "global_step": 384726, "epoch": 4635} {"train_loss": -25.924407958984375, "global_step": 384727, "epoch": 4635} {"train_loss": -25.925037384033203, "global_step": 384728, "epoch": 4635} {"train_loss": -26.09678077697754, "global_step": 384729, "epoch": 4635} {"train_loss": -26.021808624267578, "global_step": 384730, "epoch": 4635} {"train_loss": -26.118793487548828, "global_step": 384731, "epoch": 4635} {"train_loss": -26.14460563659668, "global_step": 384732, "epoch": 4635} {"train_loss": -26.39674186706543, "global_step": 384733, "epoch": 4635} {"train_loss": -26.49653434753418, "global_step": 384734, "epoch": 4635} {"train_loss": -25.846405029296875, "global_step": 384735, "epoch": 4635} {"train_loss": -26.474689483642578, "global_step": 384736, "epoch": 4635} {"train_loss": -26.433332443237305, "global_step": 384737, "epoch": 4635} {"train_loss": -26.2495174407959, "global_step": 384738, "epoch": 4635} {"train_loss": -26.291519165039062, "global_step": 384739, "epoch": 4635} {"train_loss": -26.09220314025879, "global_step": 384740, "epoch": 4635} {"train_loss": -26.464502334594727, "global_step": 384741, "epoch": 4635} {"train_loss": -26.814422607421875, "global_step": 384742, "epoch": 4635} {"train_loss": -26.319326400756836, "global_step": 384743, "epoch": 4635} {"train_loss": -26.1585750579834, "global_step": 384744, "epoch": 4635} {"train_loss": -26.481189727783203, "global_step": 384745, "epoch": 4635} {"train_loss": -26.282209396362305, "global_step": 384746, "epoch": 4635} {"train_loss": -26.23064613342285, "global_step": 384747, "epoch": 4635} {"train_loss": -26.68659019470215, "global_step": 384748, "epoch": 4635} {"train_loss": -26.567291259765625, "global_step": 384749, "epoch": 4635} {"train_loss": -26.30751609802246, "global_step": 384750, "epoch": 4635} {"train_loss": -26.483203887939453, "global_step": 384751, "epoch": 4635} {"train_loss": -26.564899444580078, "global_step": 384752, "epoch": 4635} {"train_loss": -26.75287437438965, "global_step": 384753, "epoch": 4635} {"train_loss": -26.659637451171875, "global_step": 384754, "epoch": 4635} {"train_loss": -26.4263916015625, "global_step": 384755, "epoch": 4635} {"train_loss": -26.25482749938965, "global_step": 384756, "epoch": 4635} {"train_loss": -26.48797035217285, "global_step": 384757, "epoch": 4635} {"train_loss": -26.598188400268555, "global_step": 384758, "epoch": 4635} {"train_loss": -26.920072555541992, "global_step": 384759, "epoch": 4635} {"train_loss": -26.8037109375, "global_step": 384760, "epoch": 4635} {"train_loss": -26.74118995666504, "global_step": 384761, "epoch": 4635} {"train_loss": -26.564014434814453, "global_step": 384762, "epoch": 4635} {"train_loss": -26.334951400756836, "global_step": 384763, "epoch": 4635} {"train_loss": -26.82435417175293, "global_step": 384764, "epoch": 4635} {"train_loss": -26.769643783569336, "global_step": 384765, "epoch": 4635} {"train_loss": -26.710371017456055, "global_step": 384766, "epoch": 4635} {"train_loss": -26.795927047729492, "global_step": 384767, "epoch": 4635} {"train_loss": -26.7325382232666, "global_step": 384768, "epoch": 4635} {"train_loss": -26.79791259765625, "global_step": 384769, "epoch": 4635} {"train_loss": -26.80482292175293, "global_step": 384770, "epoch": 4635} {"train_loss": -26.64797019958496, "global_step": 384771, "epoch": 4635} {"train_loss": -26.404861450195312, "global_step": 384772, "epoch": 4635} {"train_loss": -26.668933868408203, "global_step": 384773, "epoch": 4635} {"train_loss": -26.528827667236328, "global_step": 384774, "epoch": 4635} {"train_loss": -26.645811080932617, "global_step": 384775, "epoch": 4635} {"train_loss": -26.96708106994629, "global_step": 384776, "epoch": 4635} {"train_loss": -26.46283531188965, "global_step": 384777, "epoch": 4635} {"train_loss": -26.8192081451416, "global_step": 384778, "epoch": 4635} {"train_loss": -26.62250328063965, "global_step": 384779, "epoch": 4635} {"train_loss": -26.50543785095215, "global_step": 384780, "epoch": 4635} {"train_loss": -26.49908447265625, "global_step": 384781, "epoch": 4635} {"train_loss": -26.691293716430664, "global_step": 384782, "epoch": 4635} {"train_loss": -26.793731689453125, "global_step": 384783, "epoch": 4635} {"train_loss": -26.913116455078125, "global_step": 384784, "epoch": 4635} {"train_loss": -26.108251571655273, "global_step": 384785, "epoch": 4635} {"train_loss": -26.983190536499023, "global_step": 384786, "epoch": 4635} {"train_loss": -26.219625564942877, "global_step": 384787, "epoch": 4635, "val_loss": 6593632.0} {"train_loss": -26.004974365234375, "global_step": 384788, "epoch": 4636} {"train_loss": -26.011457443237305, "global_step": 384789, "epoch": 4636} {"train_loss": -26.22564697265625, "global_step": 384790, "epoch": 4636} {"train_loss": -26.118955612182617, "global_step": 384791, "epoch": 4636} {"train_loss": -26.29782485961914, "global_step": 384792, "epoch": 4636} {"train_loss": -26.35711097717285, "global_step": 384793, "epoch": 4636} {"train_loss": -26.00027847290039, "global_step": 384794, "epoch": 4636} {"train_loss": -26.0362491607666, "global_step": 384795, "epoch": 4636} {"train_loss": -26.145029067993164, "global_step": 384796, "epoch": 4636} {"train_loss": -26.310483932495117, "global_step": 384797, "epoch": 4636} {"train_loss": -26.22007179260254, "global_step": 384798, "epoch": 4636} {"train_loss": -26.17939567565918, "global_step": 384799, "epoch": 4636} {"train_loss": -26.44441032409668, "global_step": 384800, "epoch": 4636} {"train_loss": -26.158660888671875, "global_step": 384801, "epoch": 4636} {"train_loss": -26.533843994140625, "global_step": 384802, "epoch": 4636} {"train_loss": -26.191247940063477, "global_step": 384803, "epoch": 4636} {"train_loss": -26.464401245117188, "global_step": 384804, "epoch": 4636} {"train_loss": -26.42836570739746, "global_step": 384805, "epoch": 4636} {"train_loss": -26.355880737304688, "global_step": 384806, "epoch": 4636} {"train_loss": -26.604949951171875, "global_step": 384807, "epoch": 4636} {"train_loss": -26.401716232299805, "global_step": 384808, "epoch": 4636} {"train_loss": -26.1356201171875, "global_step": 384809, "epoch": 4636} {"train_loss": -26.54359245300293, "global_step": 384810, "epoch": 4636} {"train_loss": -26.23138999938965, "global_step": 384811, "epoch": 4636} {"train_loss": -26.32541275024414, "global_step": 384812, "epoch": 4636} {"train_loss": -26.494388580322266, "global_step": 384813, "epoch": 4636} {"train_loss": -26.66019630432129, "global_step": 384814, "epoch": 4636} {"train_loss": -26.779281616210938, "global_step": 384815, "epoch": 4636} {"train_loss": -26.609289169311523, "global_step": 384816, "epoch": 4636} {"train_loss": -26.65665626525879, "global_step": 384817, "epoch": 4636} {"train_loss": -26.173629760742188, "global_step": 384818, "epoch": 4636} {"train_loss": -26.542724609375, "global_step": 384819, "epoch": 4636} {"train_loss": -26.741178512573242, "global_step": 384820, "epoch": 4636} {"train_loss": -26.728992462158203, "global_step": 384821, "epoch": 4636} {"train_loss": -26.8701229095459, "global_step": 384822, "epoch": 4636} {"train_loss": -26.702726364135742, "global_step": 384823, "epoch": 4636} {"train_loss": -26.746673583984375, "global_step": 384824, "epoch": 4636} {"train_loss": -26.890491485595703, "global_step": 384825, "epoch": 4636} {"train_loss": -26.49197769165039, "global_step": 384826, "epoch": 4636} {"train_loss": -26.91064453125, "global_step": 384827, "epoch": 4636} {"train_loss": -26.812366485595703, "global_step": 384828, "epoch": 4636} {"train_loss": -26.650049209594727, "global_step": 384829, "epoch": 4636} {"train_loss": -26.552942276000977, "global_step": 384830, "epoch": 4636} {"train_loss": -26.3322696685791, "global_step": 384831, "epoch": 4636} {"train_loss": -26.513654708862305, "global_step": 384832, "epoch": 4636} {"train_loss": -26.405920028686523, "global_step": 384833, "epoch": 4636} {"train_loss": -26.59425163269043, "global_step": 384834, "epoch": 4636} {"train_loss": -26.8060245513916, "global_step": 384835, "epoch": 4636} {"train_loss": -26.371206283569336, "global_step": 384836, "epoch": 4636} {"train_loss": -27.042993545532227, "global_step": 384837, "epoch": 4636} {"train_loss": -26.708988189697266, "global_step": 384838, "epoch": 4636} {"train_loss": -26.483129501342773, "global_step": 384839, "epoch": 4636} {"train_loss": -26.468015670776367, "global_step": 384840, "epoch": 4636} {"train_loss": -26.46500015258789, "global_step": 384841, "epoch": 4636} {"train_loss": -26.423002243041992, "global_step": 384842, "epoch": 4636} {"train_loss": -26.875951766967773, "global_step": 384843, "epoch": 4636} {"train_loss": -27.109729766845703, "global_step": 384844, "epoch": 4636} {"train_loss": -25.904266357421875, "global_step": 384845, "epoch": 4636} {"train_loss": -26.559438705444336, "global_step": 384846, "epoch": 4636} {"train_loss": -25.970874786376953, "global_step": 384847, "epoch": 4636} {"train_loss": -26.244009017944336, "global_step": 384848, "epoch": 4636} {"train_loss": -26.3490047454834, "global_step": 384849, "epoch": 4636} {"train_loss": -26.496402740478516, "global_step": 384850, "epoch": 4636} {"train_loss": -26.33185386657715, "global_step": 384851, "epoch": 4636} {"train_loss": -25.80933952331543, "global_step": 384852, "epoch": 4636} {"train_loss": -26.038162231445312, "global_step": 384853, "epoch": 4636} {"train_loss": -26.531591415405273, "global_step": 384854, "epoch": 4636} {"train_loss": -26.394804000854492, "global_step": 384855, "epoch": 4636} {"train_loss": -26.520742416381836, "global_step": 384856, "epoch": 4636} {"train_loss": -26.29872703552246, "global_step": 384857, "epoch": 4636} {"train_loss": -26.072988510131836, "global_step": 384858, "epoch": 4636} {"train_loss": -26.46729850769043, "global_step": 384859, "epoch": 4636} {"train_loss": -26.56974220275879, "global_step": 384860, "epoch": 4636} {"train_loss": -26.7490177154541, "global_step": 384861, "epoch": 4636} {"train_loss": -26.523778915405273, "global_step": 384862, "epoch": 4636} {"train_loss": -25.937231063842773, "global_step": 384863, "epoch": 4636} {"train_loss": -26.381179809570312, "global_step": 384864, "epoch": 4636} {"train_loss": -26.13945960998535, "global_step": 384865, "epoch": 4636} {"train_loss": -26.365304946899414, "global_step": 384866, "epoch": 4636} {"train_loss": -26.338132858276367, "global_step": 384867, "epoch": 4636} {"train_loss": -26.38138771057129, "global_step": 384868, "epoch": 4636} {"train_loss": -26.714279174804688, "global_step": 384869, "epoch": 4636} {"train_loss": -26.425928690347327, "global_step": 384870, "epoch": 4636, "val_loss": 6659727.0} {"train_loss": -25.753223419189453, "global_step": 384871, "epoch": 4637} {"train_loss": -26.286945343017578, "global_step": 384872, "epoch": 4637} {"train_loss": -26.22715187072754, "global_step": 384873, "epoch": 4637} {"train_loss": -25.638822555541992, "global_step": 384874, "epoch": 4637} {"train_loss": -26.311370849609375, "global_step": 384875, "epoch": 4637} {"train_loss": -25.87298583984375, "global_step": 384876, "epoch": 4637} {"train_loss": -26.1972713470459, "global_step": 384877, "epoch": 4637} {"train_loss": -26.258438110351562, "global_step": 384878, "epoch": 4637} {"train_loss": -26.255292892456055, "global_step": 384879, "epoch": 4637} {"train_loss": -25.824262619018555, "global_step": 384880, "epoch": 4637} {"train_loss": -26.19234275817871, "global_step": 384881, "epoch": 4637} {"train_loss": -26.345163345336914, "global_step": 384882, "epoch": 4637} {"train_loss": -26.2877197265625, "global_step": 384883, "epoch": 4637} {"train_loss": -26.123077392578125, "global_step": 384884, "epoch": 4637} {"train_loss": -26.378507614135742, "global_step": 384885, "epoch": 4637} {"train_loss": -26.3554744720459, "global_step": 384886, "epoch": 4637} {"train_loss": -26.449499130249023, "global_step": 384887, "epoch": 4637} {"train_loss": -26.628589630126953, "global_step": 384888, "epoch": 4637} {"train_loss": -26.541799545288086, "global_step": 384889, "epoch": 4637} {"train_loss": -26.41786766052246, "global_step": 384890, "epoch": 4637} {"train_loss": -26.4853458404541, "global_step": 384891, "epoch": 4637} {"train_loss": -26.122915267944336, "global_step": 384892, "epoch": 4637} {"train_loss": -26.351587295532227, "global_step": 384893, "epoch": 4637} {"train_loss": -26.472654342651367, "global_step": 384894, "epoch": 4637} {"train_loss": -26.43524742126465, "global_step": 384895, "epoch": 4637} {"train_loss": -26.52869987487793, "global_step": 384896, "epoch": 4637} {"train_loss": -26.490453720092773, "global_step": 384897, "epoch": 4637} {"train_loss": -26.882923126220703, "global_step": 384898, "epoch": 4637} {"train_loss": -26.722553253173828, "global_step": 384899, "epoch": 4637} {"train_loss": -26.46003532409668, "global_step": 384900, "epoch": 4637} {"train_loss": -26.6345157623291, "global_step": 384901, "epoch": 4637} {"train_loss": -26.917865753173828, "global_step": 384902, "epoch": 4637} {"train_loss": -26.432098388671875, "global_step": 384903, "epoch": 4637} {"train_loss": -26.567541122436523, "global_step": 384904, "epoch": 4637} {"train_loss": -26.456546783447266, "global_step": 384905, "epoch": 4637} {"train_loss": -26.498397827148438, "global_step": 384906, "epoch": 4637} {"train_loss": -27.23880958557129, "global_step": 384907, "epoch": 4637} {"train_loss": -26.433069229125977, "global_step": 384908, "epoch": 4637} {"train_loss": -26.826007843017578, "global_step": 384909, "epoch": 4637} {"train_loss": -26.380603790283203, "global_step": 384910, "epoch": 4637} {"train_loss": -26.626453399658203, "global_step": 384911, "epoch": 4637} {"train_loss": -26.702726364135742, "global_step": 384912, "epoch": 4637} {"train_loss": -26.75166130065918, "global_step": 384913, "epoch": 4637} {"train_loss": -26.320423126220703, "global_step": 384914, "epoch": 4637} {"train_loss": -26.611621856689453, "global_step": 384915, "epoch": 4637} {"train_loss": -27.11151695251465, "global_step": 384916, "epoch": 4637} {"train_loss": -26.483373641967773, "global_step": 384917, "epoch": 4637} {"train_loss": -26.711938858032227, "global_step": 384918, "epoch": 4637} {"train_loss": -26.693878173828125, "global_step": 384919, "epoch": 4637} {"train_loss": -26.711994171142578, "global_step": 384920, "epoch": 4637} {"train_loss": -26.679401397705078, "global_step": 384921, "epoch": 4637} {"train_loss": -26.6523380279541, "global_step": 384922, "epoch": 4637} {"train_loss": -26.612791061401367, "global_step": 384923, "epoch": 4637} {"train_loss": -26.539426803588867, "global_step": 384924, "epoch": 4637} {"train_loss": -26.501794815063477, "global_step": 384925, "epoch": 4637} {"train_loss": -26.548431396484375, "global_step": 384926, "epoch": 4637} {"train_loss": -26.58906364440918, "global_step": 384927, "epoch": 4637} {"train_loss": -26.5685977935791, "global_step": 384928, "epoch": 4637} {"train_loss": -26.698760986328125, "global_step": 384929, "epoch": 4637} {"train_loss": -27.108203887939453, "global_step": 384930, "epoch": 4637} {"train_loss": -26.45233726501465, "global_step": 384931, "epoch": 4637} {"train_loss": -26.76972770690918, "global_step": 384932, "epoch": 4637} {"train_loss": -26.945266723632812, "global_step": 384933, "epoch": 4637} {"train_loss": -26.62546730041504, "global_step": 384934, "epoch": 4637} {"train_loss": -26.308996200561523, "global_step": 384935, "epoch": 4637} {"train_loss": -26.186975479125977, "global_step": 384936, "epoch": 4637} {"train_loss": -25.72530174255371, "global_step": 384937, "epoch": 4637} {"train_loss": -25.165746688842773, "global_step": 384938, "epoch": 4637} {"train_loss": -26.04445457458496, "global_step": 384939, "epoch": 4637} {"train_loss": -26.11903190612793, "global_step": 384940, "epoch": 4637} {"train_loss": -25.91777992248535, "global_step": 384941, "epoch": 4637} {"train_loss": -25.29380226135254, "global_step": 384942, "epoch": 4637} {"train_loss": -25.780807495117188, "global_step": 384943, "epoch": 4637} {"train_loss": -26.086278915405273, "global_step": 384944, "epoch": 4637} {"train_loss": -25.922983169555664, "global_step": 384945, "epoch": 4637} {"train_loss": -26.3035945892334, "global_step": 384946, "epoch": 4637} {"train_loss": -25.814468383789062, "global_step": 384947, "epoch": 4637} {"train_loss": -26.28557777404785, "global_step": 384948, "epoch": 4637} {"train_loss": -26.013742446899414, "global_step": 384949, "epoch": 4637} {"train_loss": -26.385955810546875, "global_step": 384950, "epoch": 4637} {"train_loss": -25.899829864501953, "global_step": 384951, "epoch": 4637} {"train_loss": -26.417648315429688, "global_step": 384952, "epoch": 4637} {"train_loss": -26.38819338327431, "global_step": 384953, "epoch": 4637, "val_loss": 6693078.5} {"train_loss": -25.422639846801758, "global_step": 384954, "epoch": 4638} {"train_loss": -26.105798721313477, "global_step": 384955, "epoch": 4638} {"train_loss": -26.2884521484375, "global_step": 384956, "epoch": 4638} {"train_loss": -25.2111873626709, "global_step": 384957, "epoch": 4638} {"train_loss": -25.386499404907227, "global_step": 384958, "epoch": 4638} {"train_loss": -25.616926193237305, "global_step": 384959, "epoch": 4638} {"train_loss": -26.22279930114746, "global_step": 384960, "epoch": 4638} {"train_loss": -25.913482666015625, "global_step": 384961, "epoch": 4638} {"train_loss": -25.99222755432129, "global_step": 384962, "epoch": 4638} {"train_loss": -26.123571395874023, "global_step": 384963, "epoch": 4638} {"train_loss": -25.895587921142578, "global_step": 384964, "epoch": 4638} {"train_loss": -26.36223793029785, "global_step": 384965, "epoch": 4638} {"train_loss": -25.820707321166992, "global_step": 384966, "epoch": 4638} {"train_loss": -26.36460304260254, "global_step": 384967, "epoch": 4638} {"train_loss": -26.052640914916992, "global_step": 384968, "epoch": 4638} {"train_loss": -26.17945671081543, "global_step": 384969, "epoch": 4638} {"train_loss": -26.0261173248291, "global_step": 384970, "epoch": 4638} {"train_loss": -26.376392364501953, "global_step": 384971, "epoch": 4638} {"train_loss": -26.186914443969727, "global_step": 384972, "epoch": 4638} {"train_loss": -26.16924476623535, "global_step": 384973, "epoch": 4638} {"train_loss": -26.05803871154785, "global_step": 384974, "epoch": 4638} {"train_loss": -26.27467155456543, "global_step": 384975, "epoch": 4638} {"train_loss": -26.42317008972168, "global_step": 384976, "epoch": 4638} {"train_loss": -26.54104995727539, "global_step": 384977, "epoch": 4638} {"train_loss": -26.67645835876465, "global_step": 384978, "epoch": 4638} {"train_loss": -26.42905616760254, "global_step": 384979, "epoch": 4638} {"train_loss": -26.19870376586914, "global_step": 384980, "epoch": 4638} {"train_loss": -26.835586547851562, "global_step": 384981, "epoch": 4638} {"train_loss": -26.4970703125, "global_step": 384982, "epoch": 4638} {"train_loss": -26.716659545898438, "global_step": 384983, "epoch": 4638} {"train_loss": -26.286420822143555, "global_step": 384984, "epoch": 4638} {"train_loss": -26.234174728393555, "global_step": 384985, "epoch": 4638} {"train_loss": -26.35938835144043, "global_step": 384986, "epoch": 4638} {"train_loss": -26.547956466674805, "global_step": 384987, "epoch": 4638} {"train_loss": -26.319232940673828, "global_step": 384988, "epoch": 4638} {"train_loss": -26.627750396728516, "global_step": 384989, "epoch": 4638} {"train_loss": -26.835163116455078, "global_step": 384990, "epoch": 4638} {"train_loss": -26.732685089111328, "global_step": 384991, "epoch": 4638} {"train_loss": -26.667179107666016, "global_step": 384992, "epoch": 4638} {"train_loss": -26.525739669799805, "global_step": 384993, "epoch": 4638} {"train_loss": -26.55047035217285, "global_step": 384994, "epoch": 4638} {"train_loss": -26.80582618713379, "global_step": 384995, "epoch": 4638} {"train_loss": -26.948017120361328, "global_step": 384996, "epoch": 4638} {"train_loss": -26.801223754882812, "global_step": 384997, "epoch": 4638} {"train_loss": -26.594085693359375, "global_step": 384998, "epoch": 4638} {"train_loss": -26.677112579345703, "global_step": 384999, "epoch": 4638} {"train_loss": -26.658185958862305, "global_step": 385000, "epoch": 4638} {"train_loss": -26.829517364501953, "global_step": 385001, "epoch": 4638} {"train_loss": -26.846113204956055, "global_step": 385002, "epoch": 4638} {"train_loss": -26.651792526245117, "global_step": 385003, "epoch": 4638} {"train_loss": -26.37055778503418, "global_step": 385004, "epoch": 4638} {"train_loss": -26.83709716796875, "global_step": 385005, "epoch": 4638} {"train_loss": -26.905231475830078, "global_step": 385006, "epoch": 4638} {"train_loss": -26.88191795349121, "global_step": 385007, "epoch": 4638} {"train_loss": -26.944477081298828, "global_step": 385008, "epoch": 4638} {"train_loss": -27.10181999206543, "global_step": 385009, "epoch": 4638} {"train_loss": -26.38118553161621, "global_step": 385010, "epoch": 4638} {"train_loss": -26.335712432861328, "global_step": 385011, "epoch": 4638} {"train_loss": -26.427404403686523, "global_step": 385012, "epoch": 4638} {"train_loss": -26.851144790649414, "global_step": 385013, "epoch": 4638} {"train_loss": -26.5898380279541, "global_step": 385014, "epoch": 4638} {"train_loss": -26.393518447875977, "global_step": 385015, "epoch": 4638} {"train_loss": -25.7503662109375, "global_step": 385016, "epoch": 4638} {"train_loss": -26.39215660095215, "global_step": 385017, "epoch": 4638} {"train_loss": -26.266088485717773, "global_step": 385018, "epoch": 4638} {"train_loss": -26.000492095947266, "global_step": 385019, "epoch": 4638} {"train_loss": -25.96075439453125, "global_step": 385020, "epoch": 4638} {"train_loss": -26.278162002563477, "global_step": 385021, "epoch": 4638} {"train_loss": -26.232318878173828, "global_step": 385022, "epoch": 4638} {"train_loss": -25.812036514282227, "global_step": 385023, "epoch": 4638} {"train_loss": -26.560016632080078, "global_step": 385024, "epoch": 4638} {"train_loss": -26.179609298706055, "global_step": 385025, "epoch": 4638} {"train_loss": -26.142690658569336, "global_step": 385026, "epoch": 4638} {"train_loss": -26.243698120117188, "global_step": 385027, "epoch": 4638} {"train_loss": -25.882495880126953, "global_step": 385028, "epoch": 4638} {"train_loss": -26.26826286315918, "global_step": 385029, "epoch": 4638} {"train_loss": -26.208337783813477, "global_step": 385030, "epoch": 4638} {"train_loss": -26.425113677978516, "global_step": 385031, "epoch": 4638} {"train_loss": -26.436376571655273, "global_step": 385032, "epoch": 4638} {"train_loss": -26.19131851196289, "global_step": 385033, "epoch": 4638} {"train_loss": -26.62434196472168, "global_step": 385034, "epoch": 4638} {"train_loss": -26.254789352416992, "global_step": 385035, "epoch": 4638} {"train_loss": -26.353524817041603, "global_step": 385036, "epoch": 4638, "val_loss": 6572029.0} {"train_loss": -26.2844295501709, "global_step": 385037, "epoch": 4639} {"train_loss": -25.826406478881836, "global_step": 385038, "epoch": 4639} {"train_loss": -26.105688095092773, "global_step": 385039, "epoch": 4639} {"train_loss": -25.78952980041504, "global_step": 385040, "epoch": 4639} {"train_loss": -26.34149169921875, "global_step": 385041, "epoch": 4639} {"train_loss": -25.793848037719727, "global_step": 385042, "epoch": 4639} {"train_loss": -26.194501876831055, "global_step": 385043, "epoch": 4639} {"train_loss": -25.616870880126953, "global_step": 385044, "epoch": 4639} {"train_loss": -25.909940719604492, "global_step": 385045, "epoch": 4639} {"train_loss": -26.160430908203125, "global_step": 385046, "epoch": 4639} {"train_loss": -25.95118522644043, "global_step": 385047, "epoch": 4639} {"train_loss": -26.106998443603516, "global_step": 385048, "epoch": 4639} {"train_loss": -25.912389755249023, "global_step": 385049, "epoch": 4639} {"train_loss": -26.109134674072266, "global_step": 385050, "epoch": 4639} {"train_loss": -26.4512996673584, "global_step": 385051, "epoch": 4639} {"train_loss": -26.592626571655273, "global_step": 385052, "epoch": 4639} {"train_loss": -26.228254318237305, "global_step": 385053, "epoch": 4639} {"train_loss": -26.306381225585938, "global_step": 385054, "epoch": 4639} {"train_loss": -26.265771865844727, "global_step": 385055, "epoch": 4639} {"train_loss": -26.703495025634766, "global_step": 385056, "epoch": 4639} {"train_loss": -26.253698348999023, "global_step": 385057, "epoch": 4639} {"train_loss": -26.345966339111328, "global_step": 385058, "epoch": 4639} {"train_loss": -26.570037841796875, "global_step": 385059, "epoch": 4639} {"train_loss": -26.45087242126465, "global_step": 385060, "epoch": 4639} {"train_loss": -26.37701416015625, "global_step": 385061, "epoch": 4639} {"train_loss": -26.644559860229492, "global_step": 385062, "epoch": 4639} {"train_loss": -26.75422477722168, "global_step": 385063, "epoch": 4639} {"train_loss": -26.367929458618164, "global_step": 385064, "epoch": 4639} {"train_loss": -26.512821197509766, "global_step": 385065, "epoch": 4639} {"train_loss": -26.775766372680664, "global_step": 385066, "epoch": 4639} {"train_loss": -26.5666561126709, "global_step": 385067, "epoch": 4639} {"train_loss": -27.129287719726562, "global_step": 385068, "epoch": 4639} {"train_loss": -26.42340087890625, "global_step": 385069, "epoch": 4639} {"train_loss": -26.308349609375, "global_step": 385070, "epoch": 4639} {"train_loss": -26.43145751953125, "global_step": 385071, "epoch": 4639} {"train_loss": -26.397241592407227, "global_step": 385072, "epoch": 4639} {"train_loss": -26.494638442993164, "global_step": 385073, "epoch": 4639} {"train_loss": -26.75491714477539, "global_step": 385074, "epoch": 4639} {"train_loss": -26.38677978515625, "global_step": 385075, "epoch": 4639} {"train_loss": -26.479339599609375, "global_step": 385076, "epoch": 4639} {"train_loss": -26.31903648376465, "global_step": 385077, "epoch": 4639} {"train_loss": -26.7733154296875, "global_step": 385078, "epoch": 4639} {"train_loss": -26.670156478881836, "global_step": 385079, "epoch": 4639} {"train_loss": -26.605060577392578, "global_step": 385080, "epoch": 4639} {"train_loss": -26.5672550201416, "global_step": 385081, "epoch": 4639} {"train_loss": -26.52570915222168, "global_step": 385082, "epoch": 4639} {"train_loss": -26.485919952392578, "global_step": 385083, "epoch": 4639} {"train_loss": -26.417755126953125, "global_step": 385084, "epoch": 4639} {"train_loss": -26.96254539489746, "global_step": 385085, "epoch": 4639} {"train_loss": -26.173437118530273, "global_step": 385086, "epoch": 4639} {"train_loss": -26.31988525390625, "global_step": 385087, "epoch": 4639} {"train_loss": -26.491941452026367, "global_step": 385088, "epoch": 4639} {"train_loss": -26.499103546142578, "global_step": 385089, "epoch": 4639} {"train_loss": -26.64076042175293, "global_step": 385090, "epoch": 4639} {"train_loss": -26.50099754333496, "global_step": 385091, "epoch": 4639} {"train_loss": -26.433740615844727, "global_step": 385092, "epoch": 4639} {"train_loss": -26.458189010620117, "global_step": 385093, "epoch": 4639} {"train_loss": -26.40570068359375, "global_step": 385094, "epoch": 4639} {"train_loss": -26.544422149658203, "global_step": 385095, "epoch": 4639} {"train_loss": -26.853607177734375, "global_step": 385096, "epoch": 4639} {"train_loss": -26.691680908203125, "global_step": 385097, "epoch": 4639} {"train_loss": -26.36419105529785, "global_step": 385098, "epoch": 4639} {"train_loss": -26.0107421875, "global_step": 385099, "epoch": 4639} {"train_loss": -26.26580810546875, "global_step": 385100, "epoch": 4639} {"train_loss": -26.565893173217773, "global_step": 385101, "epoch": 4639} {"train_loss": -26.458059310913086, "global_step": 385102, "epoch": 4639} {"train_loss": -26.329486846923828, "global_step": 385103, "epoch": 4639} {"train_loss": -26.4771671295166, "global_step": 385104, "epoch": 4639} {"train_loss": -26.136550903320312, "global_step": 385105, "epoch": 4639} {"train_loss": -26.513254165649414, "global_step": 385106, "epoch": 4639} {"train_loss": -26.580976486206055, "global_step": 385107, "epoch": 4639} {"train_loss": -26.65712547302246, "global_step": 385108, "epoch": 4639} {"train_loss": -26.643604278564453, "global_step": 385109, "epoch": 4639} {"train_loss": -26.75737953186035, "global_step": 385110, "epoch": 4639} {"train_loss": -26.8041934967041, "global_step": 385111, "epoch": 4639} {"train_loss": -26.459196090698242, "global_step": 385112, "epoch": 4639} {"train_loss": -26.55116081237793, "global_step": 385113, "epoch": 4639} {"train_loss": -26.60139274597168, "global_step": 385114, "epoch": 4639} {"train_loss": -26.639387130737305, "global_step": 385115, "epoch": 4639} {"train_loss": -26.67372703552246, "global_step": 385116, "epoch": 4639} {"train_loss": -26.491119384765625, "global_step": 385117, "epoch": 4639} {"train_loss": -26.702680587768555, "global_step": 385118, "epoch": 4639} {"train_loss": -26.434384426438665, "global_step": 385119, "epoch": 4639, "val_loss": 6590482.5} {"train_loss": -26.299768447875977, "global_step": 385120, "epoch": 4640} {"train_loss": -25.868488311767578, "global_step": 385121, "epoch": 4640} {"train_loss": -25.6452693939209, "global_step": 385122, "epoch": 4640} {"train_loss": -26.062793731689453, "global_step": 385123, "epoch": 4640} {"train_loss": -25.832305908203125, "global_step": 385124, "epoch": 4640} {"train_loss": -25.206398010253906, "global_step": 385125, "epoch": 4640} {"train_loss": -25.837127685546875, "global_step": 385126, "epoch": 4640} {"train_loss": -25.864959716796875, "global_step": 385127, "epoch": 4640} {"train_loss": -25.542465209960938, "global_step": 385128, "epoch": 4640} {"train_loss": -25.890893936157227, "global_step": 385129, "epoch": 4640} {"train_loss": -26.100751876831055, "global_step": 385130, "epoch": 4640} {"train_loss": -25.889068603515625, "global_step": 385131, "epoch": 4640} {"train_loss": -25.9715518951416, "global_step": 385132, "epoch": 4640} {"train_loss": -26.052114486694336, "global_step": 385133, "epoch": 4640} {"train_loss": -25.84238052368164, "global_step": 385134, "epoch": 4640} {"train_loss": -25.673568725585938, "global_step": 385135, "epoch": 4640} {"train_loss": -26.158971786499023, "global_step": 385136, "epoch": 4640} {"train_loss": -25.812652587890625, "global_step": 385137, "epoch": 4640} {"train_loss": -26.187902450561523, "global_step": 385138, "epoch": 4640} {"train_loss": -26.291650772094727, "global_step": 385139, "epoch": 4640} {"train_loss": -25.870685577392578, "global_step": 385140, "epoch": 4640} {"train_loss": -26.317291259765625, "global_step": 385141, "epoch": 4640} {"train_loss": -26.636999130249023, "global_step": 385142, "epoch": 4640} {"train_loss": -26.071247100830078, "global_step": 385143, "epoch": 4640} {"train_loss": -26.124204635620117, "global_step": 385144, "epoch": 4640} {"train_loss": -26.052143096923828, "global_step": 385145, "epoch": 4640} {"train_loss": -26.083444595336914, "global_step": 385146, "epoch": 4640} {"train_loss": -25.930683135986328, "global_step": 385147, "epoch": 4640} {"train_loss": -26.52556800842285, "global_step": 385148, "epoch": 4640} {"train_loss": -26.699426651000977, "global_step": 385149, "epoch": 4640} {"train_loss": -26.644775390625, "global_step": 385150, "epoch": 4640} {"train_loss": -26.4195613861084, "global_step": 385151, "epoch": 4640} {"train_loss": -26.429243087768555, "global_step": 385152, "epoch": 4640} {"train_loss": -26.307920455932617, "global_step": 385153, "epoch": 4640} {"train_loss": -26.397382736206055, "global_step": 385154, "epoch": 4640} {"train_loss": -26.08368492126465, "global_step": 385155, "epoch": 4640} {"train_loss": -26.189041137695312, "global_step": 385156, "epoch": 4640} {"train_loss": -26.652753829956055, "global_step": 385157, "epoch": 4640} {"train_loss": -26.586267471313477, "global_step": 385158, "epoch": 4640} {"train_loss": -27.16950798034668, "global_step": 385159, "epoch": 4640} {"train_loss": -26.574270248413086, "global_step": 385160, "epoch": 4640} {"train_loss": -26.441394805908203, "global_step": 385161, "epoch": 4640} {"train_loss": -26.52324867248535, "global_step": 385162, "epoch": 4640} {"train_loss": -27.00697135925293, "global_step": 385163, "epoch": 4640} {"train_loss": -26.565587997436523, "global_step": 385164, "epoch": 4640} {"train_loss": -26.571401596069336, "global_step": 385165, "epoch": 4640} {"train_loss": -26.371023178100586, "global_step": 385166, "epoch": 4640} {"train_loss": -26.660940170288086, "global_step": 385167, "epoch": 4640} {"train_loss": -26.700708389282227, "global_step": 385168, "epoch": 4640} {"train_loss": -27.003662109375, "global_step": 385169, "epoch": 4640} {"train_loss": -26.617090225219727, "global_step": 385170, "epoch": 4640} {"train_loss": -26.629169464111328, "global_step": 385171, "epoch": 4640} {"train_loss": -26.603342056274414, "global_step": 385172, "epoch": 4640} {"train_loss": -26.81764793395996, "global_step": 385173, "epoch": 4640} {"train_loss": -26.50296401977539, "global_step": 385174, "epoch": 4640} {"train_loss": -26.366378784179688, "global_step": 385175, "epoch": 4640} {"train_loss": -26.553022384643555, "global_step": 385176, "epoch": 4640} {"train_loss": -26.428451538085938, "global_step": 385177, "epoch": 4640} {"train_loss": -26.633081436157227, "global_step": 385178, "epoch": 4640} {"train_loss": -26.582849502563477, "global_step": 385179, "epoch": 4640} {"train_loss": -26.757537841796875, "global_step": 385180, "epoch": 4640} {"train_loss": -26.961517333984375, "global_step": 385181, "epoch": 4640} {"train_loss": -26.185550689697266, "global_step": 385182, "epoch": 4640} {"train_loss": -26.767322540283203, "global_step": 385183, "epoch": 4640} {"train_loss": -26.877389907836914, "global_step": 385184, "epoch": 4640} {"train_loss": -26.378421783447266, "global_step": 385185, "epoch": 4640} {"train_loss": -26.131793975830078, "global_step": 385186, "epoch": 4640} {"train_loss": -26.5292911529541, "global_step": 385187, "epoch": 4640} {"train_loss": -26.431379318237305, "global_step": 385188, "epoch": 4640} {"train_loss": -26.633054733276367, "global_step": 385189, "epoch": 4640} {"train_loss": -26.61024284362793, "global_step": 385190, "epoch": 4640} {"train_loss": -26.402362823486328, "global_step": 385191, "epoch": 4640} {"train_loss": -26.450931549072266, "global_step": 385192, "epoch": 4640} {"train_loss": -26.616140365600586, "global_step": 385193, "epoch": 4640} {"train_loss": -26.33957290649414, "global_step": 385194, "epoch": 4640} {"train_loss": -26.634531021118164, "global_step": 385195, "epoch": 4640} {"train_loss": -26.19647789001465, "global_step": 385196, "epoch": 4640} {"train_loss": -26.462766647338867, "global_step": 385197, "epoch": 4640} {"train_loss": -26.667312622070312, "global_step": 385198, "epoch": 4640} {"train_loss": -26.641752243041992, "global_step": 385199, "epoch": 4640} {"train_loss": -26.421417236328125, "global_step": 385200, "epoch": 4640} {"train_loss": -26.391651153564453, "global_step": 385201, "epoch": 4640} {"train_loss": -26.35014676473227, "global_step": 385202, "epoch": 4640, "val_loss": 6607074.0} {"train_loss": -25.89681053161621, "global_step": 385203, "epoch": 4641} {"train_loss": -26.05718421936035, "global_step": 385204, "epoch": 4641} {"train_loss": -25.88580322265625, "global_step": 385205, "epoch": 4641} {"train_loss": -25.349288940429688, "global_step": 385206, "epoch": 4641} {"train_loss": -26.042333602905273, "global_step": 385207, "epoch": 4641} {"train_loss": -25.344938278198242, "global_step": 385208, "epoch": 4641} {"train_loss": -26.12162208557129, "global_step": 385209, "epoch": 4641} {"train_loss": -25.538427352905273, "global_step": 385210, "epoch": 4641} {"train_loss": -25.53191375732422, "global_step": 385211, "epoch": 4641} {"train_loss": -25.544858932495117, "global_step": 385212, "epoch": 4641} {"train_loss": -25.85589599609375, "global_step": 385213, "epoch": 4641} {"train_loss": -25.974822998046875, "global_step": 385214, "epoch": 4641} {"train_loss": -26.16229820251465, "global_step": 385215, "epoch": 4641} {"train_loss": -26.188018798828125, "global_step": 385216, "epoch": 4641} {"train_loss": -26.3242244720459, "global_step": 385217, "epoch": 4641} {"train_loss": -25.97674560546875, "global_step": 385218, "epoch": 4641} {"train_loss": -26.242856979370117, "global_step": 385219, "epoch": 4641} {"train_loss": -26.529052734375, "global_step": 385220, "epoch": 4641} {"train_loss": -26.163043975830078, "global_step": 385221, "epoch": 4641} {"train_loss": -25.789901733398438, "global_step": 385222, "epoch": 4641} {"train_loss": -26.071456909179688, "global_step": 385223, "epoch": 4641} {"train_loss": -26.287214279174805, "global_step": 385224, "epoch": 4641} {"train_loss": -26.131330490112305, "global_step": 385225, "epoch": 4641} {"train_loss": -26.327985763549805, "global_step": 385226, "epoch": 4641} {"train_loss": -26.066619873046875, "global_step": 385227, "epoch": 4641} {"train_loss": -26.270832061767578, "global_step": 385228, "epoch": 4641} {"train_loss": -26.407001495361328, "global_step": 385229, "epoch": 4641} {"train_loss": -26.175825119018555, "global_step": 385230, "epoch": 4641} {"train_loss": -26.46668815612793, "global_step": 385231, "epoch": 4641} {"train_loss": -25.809249877929688, "global_step": 385232, "epoch": 4641} {"train_loss": -26.3395938873291, "global_step": 385233, "epoch": 4641} {"train_loss": -26.4514102935791, "global_step": 385234, "epoch": 4641} {"train_loss": -26.491199493408203, "global_step": 385235, "epoch": 4641} {"train_loss": -26.3533878326416, "global_step": 385236, "epoch": 4641} {"train_loss": -26.468557357788086, "global_step": 385237, "epoch": 4641} {"train_loss": -26.466047286987305, "global_step": 385238, "epoch": 4641} {"train_loss": -26.863269805908203, "global_step": 385239, "epoch": 4641} {"train_loss": -26.0722599029541, "global_step": 385240, "epoch": 4641} {"train_loss": -26.78397560119629, "global_step": 385241, "epoch": 4641} {"train_loss": -26.276187896728516, "global_step": 385242, "epoch": 4641} {"train_loss": -26.884031295776367, "global_step": 385243, "epoch": 4641} {"train_loss": -26.674732208251953, "global_step": 385244, "epoch": 4641} {"train_loss": -26.324975967407227, "global_step": 385245, "epoch": 4641} {"train_loss": -26.806028366088867, "global_step": 385246, "epoch": 4641} {"train_loss": -26.61408042907715, "global_step": 385247, "epoch": 4641} {"train_loss": -26.490524291992188, "global_step": 385248, "epoch": 4641} {"train_loss": -26.544523239135742, "global_step": 385249, "epoch": 4641} {"train_loss": -26.418914794921875, "global_step": 385250, "epoch": 4641} {"train_loss": -26.481176376342773, "global_step": 385251, "epoch": 4641} {"train_loss": -26.266672134399414, "global_step": 385252, "epoch": 4641} {"train_loss": -26.542234420776367, "global_step": 385253, "epoch": 4641} {"train_loss": -26.772504806518555, "global_step": 385254, "epoch": 4641} {"train_loss": -26.18894386291504, "global_step": 385255, "epoch": 4641} {"train_loss": -26.613788604736328, "global_step": 385256, "epoch": 4641} {"train_loss": -26.55121421813965, "global_step": 385257, "epoch": 4641} {"train_loss": -26.2686767578125, "global_step": 385258, "epoch": 4641} {"train_loss": -26.3583984375, "global_step": 385259, "epoch": 4641} {"train_loss": -26.88228416442871, "global_step": 385260, "epoch": 4641} {"train_loss": -26.413089752197266, "global_step": 385261, "epoch": 4641} {"train_loss": -26.70850944519043, "global_step": 385262, "epoch": 4641} {"train_loss": -26.81563377380371, "global_step": 385263, "epoch": 4641} {"train_loss": -26.5584774017334, "global_step": 385264, "epoch": 4641} {"train_loss": -26.6434383392334, "global_step": 385265, "epoch": 4641} {"train_loss": -26.773168563842773, "global_step": 385266, "epoch": 4641} {"train_loss": -26.6351375579834, "global_step": 385267, "epoch": 4641} {"train_loss": -26.4508113861084, "global_step": 385268, "epoch": 4641} {"train_loss": -27.030614852905273, "global_step": 385269, "epoch": 4641} {"train_loss": -26.6533260345459, "global_step": 385270, "epoch": 4641} {"train_loss": -26.649572372436523, "global_step": 385271, "epoch": 4641} {"train_loss": -26.81689453125, "global_step": 385272, "epoch": 4641} {"train_loss": -26.610300064086914, "global_step": 385273, "epoch": 4641} {"train_loss": -26.884357452392578, "global_step": 385274, "epoch": 4641} {"train_loss": -26.64013671875, "global_step": 385275, "epoch": 4641} {"train_loss": -26.318862915039062, "global_step": 385276, "epoch": 4641} {"train_loss": -26.67213249206543, "global_step": 385277, "epoch": 4641} {"train_loss": -26.679187774658203, "global_step": 385278, "epoch": 4641} {"train_loss": -26.788345336914062, "global_step": 385279, "epoch": 4641} {"train_loss": -26.907087326049805, "global_step": 385280, "epoch": 4641} {"train_loss": -26.673803329467773, "global_step": 385281, "epoch": 4641} {"train_loss": -26.827417373657227, "global_step": 385282, "epoch": 4641} {"train_loss": -26.540185928344727, "global_step": 385283, "epoch": 4641} {"train_loss": -26.492185592651367, "global_step": 385284, "epoch": 4641} {"train_loss": -26.369600502841443, "global_step": 385285, "epoch": 4641, "val_loss": 6618045.0} {"train_loss": -26.04802894592285, "global_step": 385286, "epoch": 4642} {"train_loss": -26.12110710144043, "global_step": 385287, "epoch": 4642} {"train_loss": -26.461658477783203, "global_step": 385288, "epoch": 4642} {"train_loss": -25.694629669189453, "global_step": 385289, "epoch": 4642} {"train_loss": -26.244098663330078, "global_step": 385290, "epoch": 4642} {"train_loss": -26.038095474243164, "global_step": 385291, "epoch": 4642} {"train_loss": -26.16741371154785, "global_step": 385292, "epoch": 4642} {"train_loss": -25.953998565673828, "global_step": 385293, "epoch": 4642} {"train_loss": -26.073932647705078, "global_step": 385294, "epoch": 4642} {"train_loss": -26.132749557495117, "global_step": 385295, "epoch": 4642} {"train_loss": -26.268497467041016, "global_step": 385296, "epoch": 4642} {"train_loss": -26.25921058654785, "global_step": 385297, "epoch": 4642} {"train_loss": -26.307565689086914, "global_step": 385298, "epoch": 4642} {"train_loss": -26.398487091064453, "global_step": 385299, "epoch": 4642} {"train_loss": -26.054367065429688, "global_step": 385300, "epoch": 4642} {"train_loss": -26.265914916992188, "global_step": 385301, "epoch": 4642} {"train_loss": -26.214277267456055, "global_step": 385302, "epoch": 4642} {"train_loss": -26.473188400268555, "global_step": 385303, "epoch": 4642} {"train_loss": -26.62330436706543, "global_step": 385304, "epoch": 4642} {"train_loss": -26.611358642578125, "global_step": 385305, "epoch": 4642} {"train_loss": -26.40903091430664, "global_step": 385306, "epoch": 4642} {"train_loss": -26.318267822265625, "global_step": 385307, "epoch": 4642} {"train_loss": -26.537023544311523, "global_step": 385308, "epoch": 4642} {"train_loss": -26.24479103088379, "global_step": 385309, "epoch": 4642} {"train_loss": -26.640783309936523, "global_step": 385310, "epoch": 4642} {"train_loss": -26.940784454345703, "global_step": 385311, "epoch": 4642} {"train_loss": -26.61163902282715, "global_step": 385312, "epoch": 4642} {"train_loss": -26.757068634033203, "global_step": 385313, "epoch": 4642} {"train_loss": -26.604019165039062, "global_step": 385314, "epoch": 4642} {"train_loss": -26.592243194580078, "global_step": 385315, "epoch": 4642} {"train_loss": -26.815998077392578, "global_step": 385316, "epoch": 4642} {"train_loss": -26.59931755065918, "global_step": 385317, "epoch": 4642} {"train_loss": -26.689661026000977, "global_step": 385318, "epoch": 4642} {"train_loss": -26.483667373657227, "global_step": 385319, "epoch": 4642} {"train_loss": -26.6413631439209, "global_step": 385320, "epoch": 4642} {"train_loss": -26.64472007751465, "global_step": 385321, "epoch": 4642} {"train_loss": -26.43611717224121, "global_step": 385322, "epoch": 4642} {"train_loss": -26.685148239135742, "global_step": 385323, "epoch": 4642} {"train_loss": -26.340463638305664, "global_step": 385324, "epoch": 4642} {"train_loss": -26.481983184814453, "global_step": 385325, "epoch": 4642} {"train_loss": -26.60288429260254, "global_step": 385326, "epoch": 4642} {"train_loss": -26.689870834350586, "global_step": 385327, "epoch": 4642} {"train_loss": -26.956695556640625, "global_step": 385328, "epoch": 4642} {"train_loss": -26.40566062927246, "global_step": 385329, "epoch": 4642} {"train_loss": -26.468915939331055, "global_step": 385330, "epoch": 4642} {"train_loss": -26.60182762145996, "global_step": 385331, "epoch": 4642} {"train_loss": -26.49346923828125, "global_step": 385332, "epoch": 4642} {"train_loss": -26.618911743164062, "global_step": 385333, "epoch": 4642} {"train_loss": -26.53407096862793, "global_step": 385334, "epoch": 4642} {"train_loss": -26.1951847076416, "global_step": 385335, "epoch": 4642} {"train_loss": -26.076648712158203, "global_step": 385336, "epoch": 4642} {"train_loss": -26.20371437072754, "global_step": 385337, "epoch": 4642} {"train_loss": -25.65773582458496, "global_step": 385338, "epoch": 4642} {"train_loss": -25.74365234375, "global_step": 385339, "epoch": 4642} {"train_loss": -26.43393898010254, "global_step": 385340, "epoch": 4642} {"train_loss": -26.32209587097168, "global_step": 385341, "epoch": 4642} {"train_loss": -25.78903579711914, "global_step": 385342, "epoch": 4642} {"train_loss": -25.38454818725586, "global_step": 385343, "epoch": 4642} {"train_loss": -26.545621871948242, "global_step": 385344, "epoch": 4642} {"train_loss": -26.06024169921875, "global_step": 385345, "epoch": 4642} {"train_loss": -26.069440841674805, "global_step": 385346, "epoch": 4642} {"train_loss": -25.96377944946289, "global_step": 385347, "epoch": 4642} {"train_loss": -26.12420654296875, "global_step": 385348, "epoch": 4642} {"train_loss": -26.389551162719727, "global_step": 385349, "epoch": 4642} {"train_loss": -26.513410568237305, "global_step": 385350, "epoch": 4642} {"train_loss": -26.141021728515625, "global_step": 385351, "epoch": 4642} {"train_loss": -26.275354385375977, "global_step": 385352, "epoch": 4642} {"train_loss": -26.233722686767578, "global_step": 385353, "epoch": 4642} {"train_loss": -26.385854721069336, "global_step": 385354, "epoch": 4642} {"train_loss": -26.323957443237305, "global_step": 385355, "epoch": 4642} {"train_loss": -26.234516143798828, "global_step": 385356, "epoch": 4642} {"train_loss": -26.040884017944336, "global_step": 385357, "epoch": 4642} {"train_loss": -26.769811630249023, "global_step": 385358, "epoch": 4642} {"train_loss": -26.58565330505371, "global_step": 385359, "epoch": 4642} {"train_loss": -26.165796279907227, "global_step": 385360, "epoch": 4642} {"train_loss": -26.377033233642578, "global_step": 385361, "epoch": 4642} {"train_loss": -26.373804092407227, "global_step": 385362, "epoch": 4642} {"train_loss": -26.509876251220703, "global_step": 385363, "epoch": 4642} {"train_loss": -26.414838790893555, "global_step": 385364, "epoch": 4642} {"train_loss": -26.75612449645996, "global_step": 385365, "epoch": 4642} {"train_loss": -26.486164093017578, "global_step": 385366, "epoch": 4642} {"train_loss": -26.416913986206055, "global_step": 385367, "epoch": 4642} {"train_loss": -26.33763094982469, "global_step": 385368, "epoch": 4642, "val_loss": 6625158.0} {"train_loss": -26.016998291015625, "global_step": 385369, "epoch": 4643} {"train_loss": -26.21323585510254, "global_step": 385370, "epoch": 4643} {"train_loss": -26.067052841186523, "global_step": 385371, "epoch": 4643} {"train_loss": -26.084848403930664, "global_step": 385372, "epoch": 4643} {"train_loss": -25.985315322875977, "global_step": 385373, "epoch": 4643} {"train_loss": -26.243438720703125, "global_step": 385374, "epoch": 4643} {"train_loss": -26.1451358795166, "global_step": 385375, "epoch": 4643} {"train_loss": -26.256803512573242, "global_step": 385376, "epoch": 4643} {"train_loss": -26.162073135375977, "global_step": 385377, "epoch": 4643} {"train_loss": -26.655120849609375, "global_step": 385378, "epoch": 4643} {"train_loss": -26.331695556640625, "global_step": 385379, "epoch": 4643} {"train_loss": -25.991968154907227, "global_step": 385380, "epoch": 4643} {"train_loss": -26.412351608276367, "global_step": 385381, "epoch": 4643} {"train_loss": -26.26315689086914, "global_step": 385382, "epoch": 4643} {"train_loss": -26.399433135986328, "global_step": 385383, "epoch": 4643} {"train_loss": -26.363866806030273, "global_step": 385384, "epoch": 4643} {"train_loss": -26.4060115814209, "global_step": 385385, "epoch": 4643} {"train_loss": -26.14582633972168, "global_step": 385386, "epoch": 4643} {"train_loss": -26.338232040405273, "global_step": 385387, "epoch": 4643} {"train_loss": -26.412626266479492, "global_step": 385388, "epoch": 4643} {"train_loss": -26.55710220336914, "global_step": 385389, "epoch": 4643} {"train_loss": -26.1856746673584, "global_step": 385390, "epoch": 4643} {"train_loss": -26.63124656677246, "global_step": 385391, "epoch": 4643} {"train_loss": -26.43939208984375, "global_step": 385392, "epoch": 4643} {"train_loss": -26.63818359375, "global_step": 385393, "epoch": 4643} {"train_loss": -26.360265731811523, "global_step": 385394, "epoch": 4643} {"train_loss": -26.43231201171875, "global_step": 385395, "epoch": 4643} {"train_loss": -26.3917293548584, "global_step": 385396, "epoch": 4643} {"train_loss": -26.74871826171875, "global_step": 385397, "epoch": 4643} {"train_loss": -26.615732192993164, "global_step": 385398, "epoch": 4643} {"train_loss": -26.94892692565918, "global_step": 385399, "epoch": 4643} {"train_loss": -26.71628189086914, "global_step": 385400, "epoch": 4643} {"train_loss": -26.518030166625977, "global_step": 385401, "epoch": 4643} {"train_loss": -26.518207550048828, "global_step": 385402, "epoch": 4643} {"train_loss": -26.6965389251709, "global_step": 385403, "epoch": 4643} {"train_loss": -26.52842140197754, "global_step": 385404, "epoch": 4643} {"train_loss": -26.224023818969727, "global_step": 385405, "epoch": 4643} {"train_loss": -26.637109756469727, "global_step": 385406, "epoch": 4643} {"train_loss": -26.434738159179688, "global_step": 385407, "epoch": 4643} {"train_loss": -26.61615562438965, "global_step": 385408, "epoch": 4643} {"train_loss": -26.58588981628418, "global_step": 385409, "epoch": 4643} {"train_loss": -26.895843505859375, "global_step": 385410, "epoch": 4643} {"train_loss": -26.574670791625977, "global_step": 385411, "epoch": 4643} {"train_loss": -26.898040771484375, "global_step": 385412, "epoch": 4643} {"train_loss": -26.090503692626953, "global_step": 385413, "epoch": 4643} {"train_loss": -26.53104591369629, "global_step": 385414, "epoch": 4643} {"train_loss": -26.51315689086914, "global_step": 385415, "epoch": 4643} {"train_loss": -26.832483291625977, "global_step": 385416, "epoch": 4643} {"train_loss": -26.5091552734375, "global_step": 385417, "epoch": 4643} {"train_loss": -26.631261825561523, "global_step": 385418, "epoch": 4643} {"train_loss": -26.002347946166992, "global_step": 385419, "epoch": 4643} {"train_loss": -26.567047119140625, "global_step": 385420, "epoch": 4643} {"train_loss": -26.624013900756836, "global_step": 385421, "epoch": 4643} {"train_loss": -26.685546875, "global_step": 385422, "epoch": 4643} {"train_loss": -26.91156578063965, "global_step": 385423, "epoch": 4643} {"train_loss": -26.02522087097168, "global_step": 385424, "epoch": 4643} {"train_loss": -26.718570709228516, "global_step": 385425, "epoch": 4643} {"train_loss": -26.8459529876709, "global_step": 385426, "epoch": 4643} {"train_loss": -26.468448638916016, "global_step": 385427, "epoch": 4643} {"train_loss": -26.8950252532959, "global_step": 385428, "epoch": 4643} {"train_loss": -26.578754425048828, "global_step": 385429, "epoch": 4643} {"train_loss": -26.338302612304688, "global_step": 385430, "epoch": 4643} {"train_loss": -26.68630027770996, "global_step": 385431, "epoch": 4643} {"train_loss": -26.84604835510254, "global_step": 385432, "epoch": 4643} {"train_loss": -26.778949737548828, "global_step": 385433, "epoch": 4643} {"train_loss": -26.61439323425293, "global_step": 385434, "epoch": 4643} {"train_loss": -26.608978271484375, "global_step": 385435, "epoch": 4643} {"train_loss": -26.449583053588867, "global_step": 385436, "epoch": 4643} {"train_loss": -26.548236846923828, "global_step": 385437, "epoch": 4643} {"train_loss": -26.811573028564453, "global_step": 385438, "epoch": 4643} {"train_loss": -26.697824478149414, "global_step": 385439, "epoch": 4643} {"train_loss": -26.28495216369629, "global_step": 385440, "epoch": 4643} {"train_loss": -26.545394897460938, "global_step": 385441, "epoch": 4643} {"train_loss": -26.1126766204834, "global_step": 385442, "epoch": 4643} {"train_loss": -26.67401695251465, "global_step": 385443, "epoch": 4643} {"train_loss": -26.170169830322266, "global_step": 385444, "epoch": 4643} {"train_loss": -25.7799072265625, "global_step": 385445, "epoch": 4643} {"train_loss": -26.38582420349121, "global_step": 385446, "epoch": 4643} {"train_loss": -26.57916259765625, "global_step": 385447, "epoch": 4643} {"train_loss": -26.53106117248535, "global_step": 385448, "epoch": 4643} {"train_loss": -26.12445068359375, "global_step": 385449, "epoch": 4643} {"train_loss": -26.0864315032959, "global_step": 385450, "epoch": 4643} {"train_loss": -26.441274045461633, "global_step": 385451, "epoch": 4643, "val_loss": 6599222.0} {"train_loss": -25.31805992126465, "global_step": 385452, "epoch": 4644} {"train_loss": -25.804141998291016, "global_step": 385453, "epoch": 4644} {"train_loss": -25.44256019592285, "global_step": 385454, "epoch": 4644} {"train_loss": -25.799041748046875, "global_step": 385455, "epoch": 4644} {"train_loss": -25.506793975830078, "global_step": 385456, "epoch": 4644} {"train_loss": -25.767175674438477, "global_step": 385457, "epoch": 4644} {"train_loss": -25.717273712158203, "global_step": 385458, "epoch": 4644} {"train_loss": -26.21816062927246, "global_step": 385459, "epoch": 4644} {"train_loss": -25.811908721923828, "global_step": 385460, "epoch": 4644} {"train_loss": -26.022846221923828, "global_step": 385461, "epoch": 4644} {"train_loss": -25.61305046081543, "global_step": 385462, "epoch": 4644} {"train_loss": -26.05712890625, "global_step": 385463, "epoch": 4644} {"train_loss": -25.765701293945312, "global_step": 385464, "epoch": 4644} {"train_loss": -25.851856231689453, "global_step": 385465, "epoch": 4644} {"train_loss": -26.205265045166016, "global_step": 385466, "epoch": 4644} {"train_loss": -26.213171005249023, "global_step": 385467, "epoch": 4644} {"train_loss": -26.27564811706543, "global_step": 385468, "epoch": 4644} {"train_loss": -26.09454917907715, "global_step": 385469, "epoch": 4644} {"train_loss": -26.383420944213867, "global_step": 385470, "epoch": 4644} {"train_loss": -26.114837646484375, "global_step": 385471, "epoch": 4644} {"train_loss": -26.625165939331055, "global_step": 385472, "epoch": 4644} {"train_loss": -26.081579208374023, "global_step": 385473, "epoch": 4644} {"train_loss": -26.36738395690918, "global_step": 385474, "epoch": 4644} {"train_loss": -25.952777862548828, "global_step": 385475, "epoch": 4644} {"train_loss": -26.06915283203125, "global_step": 385476, "epoch": 4644} {"train_loss": -26.396087646484375, "global_step": 385477, "epoch": 4644} {"train_loss": -26.1014461517334, "global_step": 385478, "epoch": 4644} {"train_loss": -26.6689395904541, "global_step": 385479, "epoch": 4644} {"train_loss": -26.53070068359375, "global_step": 385480, "epoch": 4644} {"train_loss": -26.509748458862305, "global_step": 385481, "epoch": 4644} {"train_loss": -26.36958885192871, "global_step": 385482, "epoch": 4644} {"train_loss": -26.273752212524414, "global_step": 385483, "epoch": 4644} {"train_loss": -26.724048614501953, "global_step": 385484, "epoch": 4644} {"train_loss": -26.160383224487305, "global_step": 385485, "epoch": 4644} {"train_loss": -26.352502822875977, "global_step": 385486, "epoch": 4644} {"train_loss": -26.472089767456055, "global_step": 385487, "epoch": 4644} {"train_loss": -26.481998443603516, "global_step": 385488, "epoch": 4644} {"train_loss": -26.73111343383789, "global_step": 385489, "epoch": 4644} {"train_loss": -26.726898193359375, "global_step": 385490, "epoch": 4644} {"train_loss": -26.406829833984375, "global_step": 385491, "epoch": 4644} {"train_loss": -26.494054794311523, "global_step": 385492, "epoch": 4644} {"train_loss": -26.25732421875, "global_step": 385493, "epoch": 4644} {"train_loss": -26.657690048217773, "global_step": 385494, "epoch": 4644} {"train_loss": -26.262195587158203, "global_step": 385495, "epoch": 4644} {"train_loss": -26.50286865234375, "global_step": 385496, "epoch": 4644} {"train_loss": -26.19644546508789, "global_step": 385497, "epoch": 4644} {"train_loss": -26.363540649414062, "global_step": 385498, "epoch": 4644} {"train_loss": -26.274438858032227, "global_step": 385499, "epoch": 4644} {"train_loss": -26.61834716796875, "global_step": 385500, "epoch": 4644} {"train_loss": -26.109670639038086, "global_step": 385501, "epoch": 4644} {"train_loss": -26.844717025756836, "global_step": 385502, "epoch": 4644} {"train_loss": -26.617284774780273, "global_step": 385503, "epoch": 4644} {"train_loss": -26.528478622436523, "global_step": 385504, "epoch": 4644} {"train_loss": -26.601404190063477, "global_step": 385505, "epoch": 4644} {"train_loss": -26.455656051635742, "global_step": 385506, "epoch": 4644} {"train_loss": -26.795557022094727, "global_step": 385507, "epoch": 4644} {"train_loss": -26.8344783782959, "global_step": 385508, "epoch": 4644} {"train_loss": -26.496732711791992, "global_step": 385509, "epoch": 4644} {"train_loss": -26.556884765625, "global_step": 385510, "epoch": 4644} {"train_loss": -26.548315048217773, "global_step": 385511, "epoch": 4644} {"train_loss": -26.50679588317871, "global_step": 385512, "epoch": 4644} {"train_loss": -26.72627067565918, "global_step": 385513, "epoch": 4644} {"train_loss": -26.463407516479492, "global_step": 385514, "epoch": 4644} {"train_loss": -26.621591567993164, "global_step": 385515, "epoch": 4644} {"train_loss": -26.766897201538086, "global_step": 385516, "epoch": 4644} {"train_loss": -26.7567195892334, "global_step": 385517, "epoch": 4644} {"train_loss": -26.508319854736328, "global_step": 385518, "epoch": 4644} {"train_loss": -26.66898536682129, "global_step": 385519, "epoch": 4644} {"train_loss": -26.377704620361328, "global_step": 385520, "epoch": 4644} {"train_loss": -26.334821701049805, "global_step": 385521, "epoch": 4644} {"train_loss": -26.133453369140625, "global_step": 385522, "epoch": 4644} {"train_loss": -26.3791446685791, "global_step": 385523, "epoch": 4644} {"train_loss": -26.391010284423828, "global_step": 385524, "epoch": 4644} {"train_loss": -26.183683395385742, "global_step": 385525, "epoch": 4644} {"train_loss": -26.519235610961914, "global_step": 385526, "epoch": 4644} {"train_loss": -26.90846061706543, "global_step": 385527, "epoch": 4644} {"train_loss": -26.856765747070312, "global_step": 385528, "epoch": 4644} {"train_loss": -26.55266761779785, "global_step": 385529, "epoch": 4644} {"train_loss": -26.8748722076416, "global_step": 385530, "epoch": 4644} {"train_loss": -26.450010299682617, "global_step": 385531, "epoch": 4644} {"train_loss": -26.582809448242188, "global_step": 385532, "epoch": 4644} {"train_loss": -26.820877075195312, "global_step": 385533, "epoch": 4644} {"train_loss": -26.355643582631306, "global_step": 385534, "epoch": 4644, "val_loss": 6631582.0} {"train_loss": -26.193323135375977, "global_step": 385535, "epoch": 4645} {"train_loss": -25.840961456298828, "global_step": 385536, "epoch": 4645} {"train_loss": -26.437915802001953, "global_step": 385537, "epoch": 4645} {"train_loss": -26.246198654174805, "global_step": 385538, "epoch": 4645} {"train_loss": -25.95878028869629, "global_step": 385539, "epoch": 4645} {"train_loss": -26.113393783569336, "global_step": 385540, "epoch": 4645} {"train_loss": -26.559614181518555, "global_step": 385541, "epoch": 4645} {"train_loss": -26.0841064453125, "global_step": 385542, "epoch": 4645} {"train_loss": -26.319074630737305, "global_step": 385543, "epoch": 4645} {"train_loss": -26.55072593688965, "global_step": 385544, "epoch": 4645} {"train_loss": -25.644763946533203, "global_step": 385545, "epoch": 4645} {"train_loss": -26.114057540893555, "global_step": 385546, "epoch": 4645} {"train_loss": -26.382770538330078, "global_step": 385547, "epoch": 4645} {"train_loss": -26.086811065673828, "global_step": 385548, "epoch": 4645} {"train_loss": -26.308319091796875, "global_step": 385549, "epoch": 4645} {"train_loss": -26.268756866455078, "global_step": 385550, "epoch": 4645} {"train_loss": -26.020355224609375, "global_step": 385551, "epoch": 4645} {"train_loss": -26.349897384643555, "global_step": 385552, "epoch": 4645} {"train_loss": -26.301605224609375, "global_step": 385553, "epoch": 4645} {"train_loss": -26.42483901977539, "global_step": 385554, "epoch": 4645} {"train_loss": -26.4141902923584, "global_step": 385555, "epoch": 4645} {"train_loss": -26.40131187438965, "global_step": 385556, "epoch": 4645} {"train_loss": -26.527755737304688, "global_step": 385557, "epoch": 4645} {"train_loss": -26.32343864440918, "global_step": 385558, "epoch": 4645} {"train_loss": -26.363447189331055, "global_step": 385559, "epoch": 4645} {"train_loss": -26.21161460876465, "global_step": 385560, "epoch": 4645} {"train_loss": -26.301788330078125, "global_step": 385561, "epoch": 4645} {"train_loss": -26.433679580688477, "global_step": 385562, "epoch": 4645} {"train_loss": -26.709869384765625, "global_step": 385563, "epoch": 4645} {"train_loss": -26.294286727905273, "global_step": 385564, "epoch": 4645} {"train_loss": -26.177579879760742, "global_step": 385565, "epoch": 4645} {"train_loss": -26.39141273498535, "global_step": 385566, "epoch": 4645} {"train_loss": -26.594573974609375, "global_step": 385567, "epoch": 4645} {"train_loss": -26.495981216430664, "global_step": 385568, "epoch": 4645} {"train_loss": -26.242801666259766, "global_step": 385569, "epoch": 4645} {"train_loss": -26.064733505249023, "global_step": 385570, "epoch": 4645} {"train_loss": -26.650848388671875, "global_step": 385571, "epoch": 4645} {"train_loss": -26.28742027282715, "global_step": 385572, "epoch": 4645} {"train_loss": -26.3747615814209, "global_step": 385573, "epoch": 4645} {"train_loss": -26.728986740112305, "global_step": 385574, "epoch": 4645} {"train_loss": -26.4938907623291, "global_step": 385575, "epoch": 4645} {"train_loss": -26.71954917907715, "global_step": 385576, "epoch": 4645} {"train_loss": -26.192230224609375, "global_step": 385577, "epoch": 4645} {"train_loss": -26.603870391845703, "global_step": 385578, "epoch": 4645} {"train_loss": -26.560810089111328, "global_step": 385579, "epoch": 4645} {"train_loss": -26.082128524780273, "global_step": 385580, "epoch": 4645} {"train_loss": -26.394943237304688, "global_step": 385581, "epoch": 4645} {"train_loss": -26.039875030517578, "global_step": 385582, "epoch": 4645} {"train_loss": -26.6306095123291, "global_step": 385583, "epoch": 4645} {"train_loss": -26.500396728515625, "global_step": 385584, "epoch": 4645} {"train_loss": -26.489761352539062, "global_step": 385585, "epoch": 4645} {"train_loss": -26.72089195251465, "global_step": 385586, "epoch": 4645} {"train_loss": -26.50665283203125, "global_step": 385587, "epoch": 4645} {"train_loss": -26.612470626831055, "global_step": 385588, "epoch": 4645} {"train_loss": -26.579687118530273, "global_step": 385589, "epoch": 4645} {"train_loss": -26.98215103149414, "global_step": 385590, "epoch": 4645} {"train_loss": -26.618473052978516, "global_step": 385591, "epoch": 4645} {"train_loss": -26.88614273071289, "global_step": 385592, "epoch": 4645} {"train_loss": -26.604116439819336, "global_step": 385593, "epoch": 4645} {"train_loss": -26.350744247436523, "global_step": 385594, "epoch": 4645} {"train_loss": -26.338993072509766, "global_step": 385595, "epoch": 4645} {"train_loss": -25.983076095581055, "global_step": 385596, "epoch": 4645} {"train_loss": -26.557416915893555, "global_step": 385597, "epoch": 4645} {"train_loss": -26.482885360717773, "global_step": 385598, "epoch": 4645} {"train_loss": -26.1219539642334, "global_step": 385599, "epoch": 4645} {"train_loss": -26.352155685424805, "global_step": 385600, "epoch": 4645} {"train_loss": -26.684955596923828, "global_step": 385601, "epoch": 4645} {"train_loss": -26.315610885620117, "global_step": 385602, "epoch": 4645} {"train_loss": -26.583744049072266, "global_step": 385603, "epoch": 4645} {"train_loss": -26.402807235717773, "global_step": 385604, "epoch": 4645} {"train_loss": -26.551025390625, "global_step": 385605, "epoch": 4645} {"train_loss": -26.496713638305664, "global_step": 385606, "epoch": 4645} {"train_loss": -26.29915428161621, "global_step": 385607, "epoch": 4645} {"train_loss": -26.412322998046875, "global_step": 385608, "epoch": 4645} {"train_loss": -26.391828536987305, "global_step": 385609, "epoch": 4645} {"train_loss": -26.570775985717773, "global_step": 385610, "epoch": 4645} {"train_loss": -26.434234619140625, "global_step": 385611, "epoch": 4645} {"train_loss": -26.414106369018555, "global_step": 385612, "epoch": 4645} {"train_loss": -26.414045333862305, "global_step": 385613, "epoch": 4645} {"train_loss": -26.81271743774414, "global_step": 385614, "epoch": 4645} {"train_loss": -26.375965118408203, "global_step": 385615, "epoch": 4645} {"train_loss": -27.145832061767578, "global_step": 385616, "epoch": 4645} {"train_loss": -26.397230401096575, "global_step": 385617, "epoch": 4645, "val_loss": 6578437.0} {"train_loss": -26.21003532409668, "global_step": 385618, "epoch": 4646} {"train_loss": -26.531097412109375, "global_step": 385619, "epoch": 4646} {"train_loss": -26.44698143005371, "global_step": 385620, "epoch": 4646} {"train_loss": -26.64528465270996, "global_step": 385621, "epoch": 4646} {"train_loss": -26.532581329345703, "global_step": 385622, "epoch": 4646} {"train_loss": -26.25419044494629, "global_step": 385623, "epoch": 4646} {"train_loss": -26.184614181518555, "global_step": 385624, "epoch": 4646} {"train_loss": -26.094867706298828, "global_step": 385625, "epoch": 4646} {"train_loss": -26.3126163482666, "global_step": 385626, "epoch": 4646} {"train_loss": -26.60867691040039, "global_step": 385627, "epoch": 4646} {"train_loss": -26.727277755737305, "global_step": 385628, "epoch": 4646} {"train_loss": -26.71210289001465, "global_step": 385629, "epoch": 4646} {"train_loss": -26.75591468811035, "global_step": 385630, "epoch": 4646} {"train_loss": -26.305755615234375, "global_step": 385631, "epoch": 4646} {"train_loss": -26.5648136138916, "global_step": 385632, "epoch": 4646} {"train_loss": -26.355487823486328, "global_step": 385633, "epoch": 4646} {"train_loss": -26.501249313354492, "global_step": 385634, "epoch": 4646} {"train_loss": -26.4332332611084, "global_step": 385635, "epoch": 4646} {"train_loss": -26.700668334960938, "global_step": 385636, "epoch": 4646} {"train_loss": -26.343713760375977, "global_step": 385637, "epoch": 4646} {"train_loss": -26.48846435546875, "global_step": 385638, "epoch": 4646} {"train_loss": -26.662078857421875, "global_step": 385639, "epoch": 4646} {"train_loss": -26.18610954284668, "global_step": 385640, "epoch": 4646} {"train_loss": -26.54096031188965, "global_step": 385641, "epoch": 4646} {"train_loss": -26.656055450439453, "global_step": 385642, "epoch": 4646} {"train_loss": -26.247587203979492, "global_step": 385643, "epoch": 4646} {"train_loss": -26.713632583618164, "global_step": 385644, "epoch": 4646} {"train_loss": -26.480701446533203, "global_step": 385645, "epoch": 4646} {"train_loss": -26.58151626586914, "global_step": 385646, "epoch": 4646} {"train_loss": -26.448577880859375, "global_step": 385647, "epoch": 4646} {"train_loss": -26.63372230529785, "global_step": 385648, "epoch": 4646} {"train_loss": -26.419330596923828, "global_step": 385649, "epoch": 4646} {"train_loss": -26.490814208984375, "global_step": 385650, "epoch": 4646} {"train_loss": -26.505395889282227, "global_step": 385651, "epoch": 4646} {"train_loss": -26.632038116455078, "global_step": 385652, "epoch": 4646} {"train_loss": -26.523298263549805, "global_step": 385653, "epoch": 4646} {"train_loss": -26.46901512145996, "global_step": 385654, "epoch": 4646} {"train_loss": -26.397008895874023, "global_step": 385655, "epoch": 4646} {"train_loss": -26.566837310791016, "global_step": 385656, "epoch": 4646} {"train_loss": -26.71930503845215, "global_step": 385657, "epoch": 4646} {"train_loss": -26.4254093170166, "global_step": 385658, "epoch": 4646} {"train_loss": -26.395395278930664, "global_step": 385659, "epoch": 4646} {"train_loss": -26.49171257019043, "global_step": 385660, "epoch": 4646} {"train_loss": -26.641584396362305, "global_step": 385661, "epoch": 4646} {"train_loss": -26.785886764526367, "global_step": 385662, "epoch": 4646} {"train_loss": -26.813308715820312, "global_step": 385663, "epoch": 4646} {"train_loss": -26.124780654907227, "global_step": 385664, "epoch": 4646} {"train_loss": -26.571470260620117, "global_step": 385665, "epoch": 4646} {"train_loss": -26.214038848876953, "global_step": 385666, "epoch": 4646} {"train_loss": -26.542531967163086, "global_step": 385667, "epoch": 4646} {"train_loss": -26.63283348083496, "global_step": 385668, "epoch": 4646} {"train_loss": -26.37393569946289, "global_step": 385669, "epoch": 4646} {"train_loss": -26.636404037475586, "global_step": 385670, "epoch": 4646} {"train_loss": -26.498437881469727, "global_step": 385671, "epoch": 4646} {"train_loss": -26.527612686157227, "global_step": 385672, "epoch": 4646} {"train_loss": -26.586612701416016, "global_step": 385673, "epoch": 4646} {"train_loss": -26.268573760986328, "global_step": 385674, "epoch": 4646} {"train_loss": -26.720184326171875, "global_step": 385675, "epoch": 4646} {"train_loss": -26.433969497680664, "global_step": 385676, "epoch": 4646} {"train_loss": -26.27924919128418, "global_step": 385677, "epoch": 4646} {"train_loss": -26.391759872436523, "global_step": 385678, "epoch": 4646} {"train_loss": -26.5507869720459, "global_step": 385679, "epoch": 4646} {"train_loss": -26.67970848083496, "global_step": 385680, "epoch": 4646} {"train_loss": -26.27126121520996, "global_step": 385681, "epoch": 4646} {"train_loss": -26.4144287109375, "global_step": 385682, "epoch": 4646} {"train_loss": -26.738229751586914, "global_step": 385683, "epoch": 4646} {"train_loss": -26.874176025390625, "global_step": 385684, "epoch": 4646} {"train_loss": -26.998579025268555, "global_step": 385685, "epoch": 4646} {"train_loss": -26.693115234375, "global_step": 385686, "epoch": 4646} {"train_loss": -26.54205894470215, "global_step": 385687, "epoch": 4646} {"train_loss": -26.299158096313477, "global_step": 385688, "epoch": 4646} {"train_loss": -26.564163208007812, "global_step": 385689, "epoch": 4646} {"train_loss": -26.590131759643555, "global_step": 385690, "epoch": 4646} {"train_loss": -26.609037399291992, "global_step": 385691, "epoch": 4646} {"train_loss": -26.467031478881836, "global_step": 385692, "epoch": 4646} {"train_loss": -26.510046005249023, "global_step": 385693, "epoch": 4646} {"train_loss": -26.398218154907227, "global_step": 385694, "epoch": 4646} {"train_loss": -26.377744674682617, "global_step": 385695, "epoch": 4646} {"train_loss": -26.335681915283203, "global_step": 385696, "epoch": 4646} {"train_loss": -26.5793399810791, "global_step": 385697, "epoch": 4646} {"train_loss": -26.67999839782715, "global_step": 385698, "epoch": 4646} {"train_loss": -26.54047203063965, "global_step": 385699, "epoch": 4646} {"train_loss": -26.517763091857177, "global_step": 385700, "epoch": 4646, "val_loss": 6605594.0} {"train_loss": -26.488910675048828, "global_step": 385701, "epoch": 4647} {"train_loss": -26.43924903869629, "global_step": 385702, "epoch": 4647} {"train_loss": -25.942920684814453, "global_step": 385703, "epoch": 4647} {"train_loss": -26.342111587524414, "global_step": 385704, "epoch": 4647} {"train_loss": -26.61528968811035, "global_step": 385705, "epoch": 4647} {"train_loss": -26.192779541015625, "global_step": 385706, "epoch": 4647} {"train_loss": -26.367170333862305, "global_step": 385707, "epoch": 4647} {"train_loss": -26.158166885375977, "global_step": 385708, "epoch": 4647} {"train_loss": -26.12965965270996, "global_step": 385709, "epoch": 4647} {"train_loss": -26.346033096313477, "global_step": 385710, "epoch": 4647} {"train_loss": -26.548986434936523, "global_step": 385711, "epoch": 4647} {"train_loss": -26.541980743408203, "global_step": 385712, "epoch": 4647} {"train_loss": -26.4493350982666, "global_step": 385713, "epoch": 4647} {"train_loss": -26.584997177124023, "global_step": 385714, "epoch": 4647} {"train_loss": -26.354816436767578, "global_step": 385715, "epoch": 4647} {"train_loss": -26.271692276000977, "global_step": 385716, "epoch": 4647} {"train_loss": -26.489267349243164, "global_step": 385717, "epoch": 4647} {"train_loss": -26.45765495300293, "global_step": 385718, "epoch": 4647} {"train_loss": -26.407032012939453, "global_step": 385719, "epoch": 4647} {"train_loss": -26.137399673461914, "global_step": 385720, "epoch": 4647} {"train_loss": -26.24051856994629, "global_step": 385721, "epoch": 4647} {"train_loss": -26.165668487548828, "global_step": 385722, "epoch": 4647} {"train_loss": -26.31342887878418, "global_step": 385723, "epoch": 4647} {"train_loss": -26.550357818603516, "global_step": 385724, "epoch": 4647} {"train_loss": -26.378515243530273, "global_step": 385725, "epoch": 4647} {"train_loss": -26.6742000579834, "global_step": 385726, "epoch": 4647} {"train_loss": -26.307279586791992, "global_step": 385727, "epoch": 4647} {"train_loss": -26.715208053588867, "global_step": 385728, "epoch": 4647} {"train_loss": -26.2033634185791, "global_step": 385729, "epoch": 4647} {"train_loss": -26.456098556518555, "global_step": 385730, "epoch": 4647} {"train_loss": -26.320966720581055, "global_step": 385731, "epoch": 4647} {"train_loss": -26.44318962097168, "global_step": 385732, "epoch": 4647} {"train_loss": -26.264780044555664, "global_step": 385733, "epoch": 4647} {"train_loss": -26.879724502563477, "global_step": 385734, "epoch": 4647} {"train_loss": -26.600433349609375, "global_step": 385735, "epoch": 4647} {"train_loss": -26.329137802124023, "global_step": 385736, "epoch": 4647} {"train_loss": -26.790037155151367, "global_step": 385737, "epoch": 4647} {"train_loss": -26.22946548461914, "global_step": 385738, "epoch": 4647} {"train_loss": -26.31377601623535, "global_step": 385739, "epoch": 4647} {"train_loss": -26.266803741455078, "global_step": 385740, "epoch": 4647} {"train_loss": -26.619043350219727, "global_step": 385741, "epoch": 4647} {"train_loss": -26.09759521484375, "global_step": 385742, "epoch": 4647} {"train_loss": -26.7196102142334, "global_step": 385743, "epoch": 4647} {"train_loss": -26.8549861907959, "global_step": 385744, "epoch": 4647} {"train_loss": -26.36829948425293, "global_step": 385745, "epoch": 4647} {"train_loss": -26.919818878173828, "global_step": 385746, "epoch": 4647} {"train_loss": -26.509069442749023, "global_step": 385747, "epoch": 4647} {"train_loss": -26.62384033203125, "global_step": 385748, "epoch": 4647} {"train_loss": -26.890836715698242, "global_step": 385749, "epoch": 4647} {"train_loss": -26.684335708618164, "global_step": 385750, "epoch": 4647} {"train_loss": -26.61931800842285, "global_step": 385751, "epoch": 4647} {"train_loss": -26.785425186157227, "global_step": 385752, "epoch": 4647} {"train_loss": -26.983810424804688, "global_step": 385753, "epoch": 4647} {"train_loss": -26.356983184814453, "global_step": 385754, "epoch": 4647} {"train_loss": -26.490381240844727, "global_step": 385755, "epoch": 4647} {"train_loss": -26.67872428894043, "global_step": 385756, "epoch": 4647} {"train_loss": -26.258441925048828, "global_step": 385757, "epoch": 4647} {"train_loss": -26.37879753112793, "global_step": 385758, "epoch": 4647} {"train_loss": -26.278467178344727, "global_step": 385759, "epoch": 4647} {"train_loss": -26.116724014282227, "global_step": 385760, "epoch": 4647} {"train_loss": -26.188495635986328, "global_step": 385761, "epoch": 4647} {"train_loss": -26.282445907592773, "global_step": 385762, "epoch": 4647} {"train_loss": -26.5745849609375, "global_step": 385763, "epoch": 4647} {"train_loss": -26.556415557861328, "global_step": 385764, "epoch": 4647} {"train_loss": -26.644256591796875, "global_step": 385765, "epoch": 4647} {"train_loss": -26.76276969909668, "global_step": 385766, "epoch": 4647} {"train_loss": -26.44013786315918, "global_step": 385767, "epoch": 4647} {"train_loss": -26.4066104888916, "global_step": 385768, "epoch": 4647} {"train_loss": -26.318267822265625, "global_step": 385769, "epoch": 4647} {"train_loss": -26.57331657409668, "global_step": 385770, "epoch": 4647} {"train_loss": -26.296234130859375, "global_step": 385771, "epoch": 4647} {"train_loss": -26.173627853393555, "global_step": 385772, "epoch": 4647} {"train_loss": -26.403135299682617, "global_step": 385773, "epoch": 4647} {"train_loss": -26.4249267578125, "global_step": 385774, "epoch": 4647} {"train_loss": -26.251708984375, "global_step": 385775, "epoch": 4647} {"train_loss": -26.60288429260254, "global_step": 385776, "epoch": 4647} {"train_loss": -26.734912872314453, "global_step": 385777, "epoch": 4647} {"train_loss": -26.471771240234375, "global_step": 385778, "epoch": 4647} {"train_loss": -26.634418487548828, "global_step": 385779, "epoch": 4647} {"train_loss": -26.72519874572754, "global_step": 385780, "epoch": 4647} {"train_loss": -26.5430850982666, "global_step": 385781, "epoch": 4647} {"train_loss": -26.86634635925293, "global_step": 385782, "epoch": 4647} {"train_loss": -26.459389698074524, "global_step": 385783, "epoch": 4647, "val_loss": 6503341.0} {"train_loss": -26.29213523864746, "global_step": 385784, "epoch": 4648} {"train_loss": -25.785388946533203, "global_step": 385785, "epoch": 4648} {"train_loss": -25.56957244873047, "global_step": 385786, "epoch": 4648} {"train_loss": -26.300458908081055, "global_step": 385787, "epoch": 4648} {"train_loss": -25.962549209594727, "global_step": 385788, "epoch": 4648} {"train_loss": -26.41499900817871, "global_step": 385789, "epoch": 4648} {"train_loss": -26.49334716796875, "global_step": 385790, "epoch": 4648} {"train_loss": -25.958099365234375, "global_step": 385791, "epoch": 4648} {"train_loss": -26.114526748657227, "global_step": 385792, "epoch": 4648} {"train_loss": -26.020002365112305, "global_step": 385793, "epoch": 4648} {"train_loss": -26.03168296813965, "global_step": 385794, "epoch": 4648} {"train_loss": -26.078201293945312, "global_step": 385795, "epoch": 4648} {"train_loss": -26.2069091796875, "global_step": 385796, "epoch": 4648} {"train_loss": -26.458362579345703, "global_step": 385797, "epoch": 4648} {"train_loss": -26.09583854675293, "global_step": 385798, "epoch": 4648} {"train_loss": -26.321455001831055, "global_step": 385799, "epoch": 4648} {"train_loss": -26.033172607421875, "global_step": 385800, "epoch": 4648} {"train_loss": -26.4611759185791, "global_step": 385801, "epoch": 4648} {"train_loss": -26.20708656311035, "global_step": 385802, "epoch": 4648} {"train_loss": -26.151397705078125, "global_step": 385803, "epoch": 4648} {"train_loss": -26.153005599975586, "global_step": 385804, "epoch": 4648} {"train_loss": -26.28580665588379, "global_step": 385805, "epoch": 4648} {"train_loss": -26.52716636657715, "global_step": 385806, "epoch": 4648} {"train_loss": -26.202539443969727, "global_step": 385807, "epoch": 4648} {"train_loss": -26.61524772644043, "global_step": 385808, "epoch": 4648} {"train_loss": -26.023880004882812, "global_step": 385809, "epoch": 4648} {"train_loss": -26.364431381225586, "global_step": 385810, "epoch": 4648} {"train_loss": -26.20893669128418, "global_step": 385811, "epoch": 4648} {"train_loss": -26.342823028564453, "global_step": 385812, "epoch": 4648} {"train_loss": -26.376544952392578, "global_step": 385813, "epoch": 4648} {"train_loss": -25.985376358032227, "global_step": 385814, "epoch": 4648} {"train_loss": -26.447620391845703, "global_step": 385815, "epoch": 4648} {"train_loss": -26.635284423828125, "global_step": 385816, "epoch": 4648} {"train_loss": -26.566190719604492, "global_step": 385817, "epoch": 4648} {"train_loss": -25.862823486328125, "global_step": 385818, "epoch": 4648} {"train_loss": -26.019744873046875, "global_step": 385819, "epoch": 4648} {"train_loss": -26.7711124420166, "global_step": 385820, "epoch": 4648} {"train_loss": -26.361845016479492, "global_step": 385821, "epoch": 4648} {"train_loss": -26.420785903930664, "global_step": 385822, "epoch": 4648} {"train_loss": -26.79768180847168, "global_step": 385823, "epoch": 4648} {"train_loss": -26.471601486206055, "global_step": 385824, "epoch": 4648} {"train_loss": -26.704193115234375, "global_step": 385825, "epoch": 4648} {"train_loss": -26.67371940612793, "global_step": 385826, "epoch": 4648} {"train_loss": -26.283170700073242, "global_step": 385827, "epoch": 4648} {"train_loss": -26.36927604675293, "global_step": 385828, "epoch": 4648} {"train_loss": -26.97378921508789, "global_step": 385829, "epoch": 4648} {"train_loss": -26.677871704101562, "global_step": 385830, "epoch": 4648} {"train_loss": -26.93562126159668, "global_step": 385831, "epoch": 4648} {"train_loss": -26.57126808166504, "global_step": 385832, "epoch": 4648} {"train_loss": -26.8233585357666, "global_step": 385833, "epoch": 4648} {"train_loss": -26.8623046875, "global_step": 385834, "epoch": 4648} {"train_loss": -26.803241729736328, "global_step": 385835, "epoch": 4648} {"train_loss": -26.782657623291016, "global_step": 385836, "epoch": 4648} {"train_loss": -26.500747680664062, "global_step": 385837, "epoch": 4648} {"train_loss": -26.506826400756836, "global_step": 385838, "epoch": 4648} {"train_loss": -26.58551597595215, "global_step": 385839, "epoch": 4648} {"train_loss": -26.671884536743164, "global_step": 385840, "epoch": 4648} {"train_loss": -26.529813766479492, "global_step": 385841, "epoch": 4648} {"train_loss": -26.937652587890625, "global_step": 385842, "epoch": 4648} {"train_loss": -26.966642379760742, "global_step": 385843, "epoch": 4648} {"train_loss": -26.53047752380371, "global_step": 385844, "epoch": 4648} {"train_loss": -26.564130783081055, "global_step": 385845, "epoch": 4648} {"train_loss": -26.838613510131836, "global_step": 385846, "epoch": 4648} {"train_loss": -26.694448471069336, "global_step": 385847, "epoch": 4648} {"train_loss": -26.61171531677246, "global_step": 385848, "epoch": 4648} {"train_loss": -26.482080459594727, "global_step": 385849, "epoch": 4648} {"train_loss": -26.180326461791992, "global_step": 385850, "epoch": 4648} {"train_loss": -24.90060806274414, "global_step": 385851, "epoch": 4648} {"train_loss": -23.350217819213867, "global_step": 385852, "epoch": 4648} {"train_loss": -23.657855987548828, "global_step": 385853, "epoch": 4648} {"train_loss": -24.978029251098633, "global_step": 385854, "epoch": 4648} {"train_loss": -25.803665161132812, "global_step": 385855, "epoch": 4648} {"train_loss": -25.627765655517578, "global_step": 385856, "epoch": 4648} {"train_loss": -25.185178756713867, "global_step": 385857, "epoch": 4648} {"train_loss": -25.752771377563477, "global_step": 385858, "epoch": 4648} {"train_loss": -25.752334594726562, "global_step": 385859, "epoch": 4648} {"train_loss": -25.4526309967041, "global_step": 385860, "epoch": 4648} {"train_loss": -26.250782012939453, "global_step": 385861, "epoch": 4648} {"train_loss": -26.096410751342773, "global_step": 385862, "epoch": 4648} {"train_loss": -26.046707153320312, "global_step": 385863, "epoch": 4648} {"train_loss": -25.65680503845215, "global_step": 385864, "epoch": 4648} {"train_loss": -26.006223678588867, "global_step": 385865, "epoch": 4648} {"train_loss": -26.221172057002423, "global_step": 385866, "epoch": 4648, "val_loss": 6597199.0} {"train_loss": -25.891698837280273, "global_step": 385867, "epoch": 4649} {"train_loss": -25.682586669921875, "global_step": 385868, "epoch": 4649} {"train_loss": -25.75376319885254, "global_step": 385869, "epoch": 4649} {"train_loss": -26.04888343811035, "global_step": 385870, "epoch": 4649} {"train_loss": -26.081823348999023, "global_step": 385871, "epoch": 4649} {"train_loss": -25.641162872314453, "global_step": 385872, "epoch": 4649} {"train_loss": -26.09234619140625, "global_step": 385873, "epoch": 4649} {"train_loss": -26.3459415435791, "global_step": 385874, "epoch": 4649} {"train_loss": -26.31009864807129, "global_step": 385875, "epoch": 4649} {"train_loss": -26.0670223236084, "global_step": 385876, "epoch": 4649} {"train_loss": -26.48573112487793, "global_step": 385877, "epoch": 4649} {"train_loss": -26.228235244750977, "global_step": 385878, "epoch": 4649} {"train_loss": -26.219640731811523, "global_step": 385879, "epoch": 4649} {"train_loss": -26.064817428588867, "global_step": 385880, "epoch": 4649} {"train_loss": -26.311132431030273, "global_step": 385881, "epoch": 4649} {"train_loss": -26.448566436767578, "global_step": 385882, "epoch": 4649} {"train_loss": -26.0860595703125, "global_step": 385883, "epoch": 4649} {"train_loss": -26.352752685546875, "global_step": 385884, "epoch": 4649} {"train_loss": -26.41485023498535, "global_step": 385885, "epoch": 4649} {"train_loss": -26.35508155822754, "global_step": 385886, "epoch": 4649} {"train_loss": -26.368982315063477, "global_step": 385887, "epoch": 4649} {"train_loss": -26.328195571899414, "global_step": 385888, "epoch": 4649} {"train_loss": -26.623044967651367, "global_step": 385889, "epoch": 4649} {"train_loss": -26.358734130859375, "global_step": 385890, "epoch": 4649} {"train_loss": -26.790760040283203, "global_step": 385891, "epoch": 4649} {"train_loss": -26.273773193359375, "global_step": 385892, "epoch": 4649} {"train_loss": -26.47865104675293, "global_step": 385893, "epoch": 4649} {"train_loss": -26.475025177001953, "global_step": 385894, "epoch": 4649} {"train_loss": -26.615915298461914, "global_step": 385895, "epoch": 4649} {"train_loss": -26.362619400024414, "global_step": 385896, "epoch": 4649} {"train_loss": -26.634052276611328, "global_step": 385897, "epoch": 4649} {"train_loss": -26.6729793548584, "global_step": 385898, "epoch": 4649} {"train_loss": -26.647083282470703, "global_step": 385899, "epoch": 4649} {"train_loss": -26.358911514282227, "global_step": 385900, "epoch": 4649} {"train_loss": -26.886926651000977, "global_step": 385901, "epoch": 4649} {"train_loss": -26.81965446472168, "global_step": 385902, "epoch": 4649} {"train_loss": -26.7453556060791, "global_step": 385903, "epoch": 4649} {"train_loss": -26.265522003173828, "global_step": 385904, "epoch": 4649} {"train_loss": -26.42655372619629, "global_step": 385905, "epoch": 4649} {"train_loss": -26.520832061767578, "global_step": 385906, "epoch": 4649} {"train_loss": -26.81220817565918, "global_step": 385907, "epoch": 4649} {"train_loss": -27.08806800842285, "global_step": 385908, "epoch": 4649} {"train_loss": -26.620405197143555, "global_step": 385909, "epoch": 4649} {"train_loss": -26.4510440826416, "global_step": 385910, "epoch": 4649} {"train_loss": -26.82366943359375, "global_step": 385911, "epoch": 4649} {"train_loss": -26.51413345336914, "global_step": 385912, "epoch": 4649} {"train_loss": -27.051193237304688, "global_step": 385913, "epoch": 4649} {"train_loss": -26.60871696472168, "global_step": 385914, "epoch": 4649} {"train_loss": -26.918493270874023, "global_step": 385915, "epoch": 4649} {"train_loss": -26.523290634155273, "global_step": 385916, "epoch": 4649} {"train_loss": -26.18086814880371, "global_step": 385917, "epoch": 4649} {"train_loss": -26.420501708984375, "global_step": 385918, "epoch": 4649} {"train_loss": -26.54254722595215, "global_step": 385919, "epoch": 4649} {"train_loss": -26.287933349609375, "global_step": 385920, "epoch": 4649} {"train_loss": -26.628820419311523, "global_step": 385921, "epoch": 4649} {"train_loss": -26.774438858032227, "global_step": 385922, "epoch": 4649} {"train_loss": -26.97298240661621, "global_step": 385923, "epoch": 4649} {"train_loss": -26.57576560974121, "global_step": 385924, "epoch": 4649} {"train_loss": -26.523300170898438, "global_step": 385925, "epoch": 4649} {"train_loss": -26.502429962158203, "global_step": 385926, "epoch": 4649} {"train_loss": -26.747827529907227, "global_step": 385927, "epoch": 4649} {"train_loss": -26.351226806640625, "global_step": 385928, "epoch": 4649} {"train_loss": -26.404510498046875, "global_step": 385929, "epoch": 4649} {"train_loss": -26.66766929626465, "global_step": 385930, "epoch": 4649} {"train_loss": -26.545166015625, "global_step": 385931, "epoch": 4649} {"train_loss": -26.311735153198242, "global_step": 385932, "epoch": 4649} {"train_loss": -26.27837562561035, "global_step": 385933, "epoch": 4649} {"train_loss": -26.272851943969727, "global_step": 385934, "epoch": 4649} {"train_loss": -26.254806518554688, "global_step": 385935, "epoch": 4649} {"train_loss": -26.5623779296875, "global_step": 385936, "epoch": 4649} {"train_loss": -26.422317504882812, "global_step": 385937, "epoch": 4649} {"train_loss": -26.58180046081543, "global_step": 385938, "epoch": 4649} {"train_loss": -26.476165771484375, "global_step": 385939, "epoch": 4649} {"train_loss": -26.498437881469727, "global_step": 385940, "epoch": 4649} {"train_loss": -26.38306999206543, "global_step": 385941, "epoch": 4649} {"train_loss": -26.468475341796875, "global_step": 385942, "epoch": 4649} {"train_loss": -26.446924209594727, "global_step": 385943, "epoch": 4649} {"train_loss": -26.67548942565918, "global_step": 385944, "epoch": 4649} {"train_loss": -26.110464096069336, "global_step": 385945, "epoch": 4649} {"train_loss": -26.199054718017578, "global_step": 385946, "epoch": 4649} {"train_loss": -26.58005142211914, "global_step": 385947, "epoch": 4649} {"train_loss": -26.432348251342773, "global_step": 385948, "epoch": 4649} {"train_loss": -26.420062651117163, "global_step": 385949, "epoch": 4649, "val_loss": 6557622.0} {"train_loss": -26.189361572265625, "global_step": 385950, "epoch": 4650} {"train_loss": -25.526418685913086, "global_step": 385951, "epoch": 4650} {"train_loss": -25.720733642578125, "global_step": 385952, "epoch": 4650} {"train_loss": -25.848546981811523, "global_step": 385953, "epoch": 4650} {"train_loss": -25.81524658203125, "global_step": 385954, "epoch": 4650} {"train_loss": -26.129993438720703, "global_step": 385955, "epoch": 4650} {"train_loss": -26.272369384765625, "global_step": 385956, "epoch": 4650} {"train_loss": -26.264114379882812, "global_step": 385957, "epoch": 4650} {"train_loss": -25.735498428344727, "global_step": 385958, "epoch": 4650} {"train_loss": -26.369464874267578, "global_step": 385959, "epoch": 4650} {"train_loss": -26.331546783447266, "global_step": 385960, "epoch": 4650} {"train_loss": -26.293554306030273, "global_step": 385961, "epoch": 4650} {"train_loss": -26.190082550048828, "global_step": 385962, "epoch": 4650} {"train_loss": -26.2349910736084, "global_step": 385963, "epoch": 4650} {"train_loss": -26.29896354675293, "global_step": 385964, "epoch": 4650} {"train_loss": -26.599023818969727, "global_step": 385965, "epoch": 4650} {"train_loss": -26.708267211914062, "global_step": 385966, "epoch": 4650} {"train_loss": -26.38337516784668, "global_step": 385967, "epoch": 4650} {"train_loss": -26.175519943237305, "global_step": 385968, "epoch": 4650} {"train_loss": -26.32756996154785, "global_step": 385969, "epoch": 4650} {"train_loss": -26.233251571655273, "global_step": 385970, "epoch": 4650} {"train_loss": -26.631559371948242, "global_step": 385971, "epoch": 4650} {"train_loss": -26.874725341796875, "global_step": 385972, "epoch": 4650} {"train_loss": -26.593952178955078, "global_step": 385973, "epoch": 4650} {"train_loss": -26.51629066467285, "global_step": 385974, "epoch": 4650} {"train_loss": -26.834775924682617, "global_step": 385975, "epoch": 4650} {"train_loss": -26.51531982421875, "global_step": 385976, "epoch": 4650} {"train_loss": -26.662927627563477, "global_step": 385977, "epoch": 4650} {"train_loss": -26.643787384033203, "global_step": 385978, "epoch": 4650} {"train_loss": -26.40437126159668, "global_step": 385979, "epoch": 4650} {"train_loss": -26.48029136657715, "global_step": 385980, "epoch": 4650} {"train_loss": -26.837839126586914, "global_step": 385981, "epoch": 4650} {"train_loss": -26.4803524017334, "global_step": 385982, "epoch": 4650} {"train_loss": -26.557174682617188, "global_step": 385983, "epoch": 4650} {"train_loss": -26.129779815673828, "global_step": 385984, "epoch": 4650} {"train_loss": -26.29241943359375, "global_step": 385985, "epoch": 4650} {"train_loss": -26.597919464111328, "global_step": 385986, "epoch": 4650} {"train_loss": -26.833728790283203, "global_step": 385987, "epoch": 4650} {"train_loss": -26.144285202026367, "global_step": 385988, "epoch": 4650} {"train_loss": -26.176544189453125, "global_step": 385989, "epoch": 4650} {"train_loss": -26.641454696655273, "global_step": 385990, "epoch": 4650} {"train_loss": -26.401281356811523, "global_step": 385991, "epoch": 4650} {"train_loss": -26.515405654907227, "global_step": 385992, "epoch": 4650} {"train_loss": -26.57468605041504, "global_step": 385993, "epoch": 4650} {"train_loss": -26.558258056640625, "global_step": 385994, "epoch": 4650} {"train_loss": -26.403945922851562, "global_step": 385995, "epoch": 4650} {"train_loss": -26.368310928344727, "global_step": 385996, "epoch": 4650} {"train_loss": -26.334360122680664, "global_step": 385997, "epoch": 4650} {"train_loss": -26.165983200073242, "global_step": 385998, "epoch": 4650} {"train_loss": -26.40740966796875, "global_step": 385999, "epoch": 4650} {"train_loss": -26.4725284576416, "global_step": 386000, "epoch": 4650} {"train_loss": -26.241809844970703, "global_step": 386001, "epoch": 4650} {"train_loss": -26.490741729736328, "global_step": 386002, "epoch": 4650} {"train_loss": -26.238632202148438, "global_step": 386003, "epoch": 4650} {"train_loss": -25.703083038330078, "global_step": 386004, "epoch": 4650} {"train_loss": -26.06613540649414, "global_step": 386005, "epoch": 4650} {"train_loss": -26.211181640625, "global_step": 386006, "epoch": 4650} {"train_loss": -26.134845733642578, "global_step": 386007, "epoch": 4650} {"train_loss": -25.192567825317383, "global_step": 386008, "epoch": 4650} {"train_loss": -26.189619064331055, "global_step": 386009, "epoch": 4650} {"train_loss": -25.97137451171875, "global_step": 386010, "epoch": 4650} {"train_loss": -26.544021606445312, "global_step": 386011, "epoch": 4650} {"train_loss": -25.862939834594727, "global_step": 386012, "epoch": 4650} {"train_loss": -25.850112915039062, "global_step": 386013, "epoch": 4650} {"train_loss": -26.24116325378418, "global_step": 386014, "epoch": 4650} {"train_loss": -26.160688400268555, "global_step": 386015, "epoch": 4650} {"train_loss": -26.15443229675293, "global_step": 386016, "epoch": 4650} {"train_loss": -26.03549575805664, "global_step": 386017, "epoch": 4650} {"train_loss": -26.4699764251709, "global_step": 386018, "epoch": 4650} {"train_loss": -26.53476333618164, "global_step": 386019, "epoch": 4650} {"train_loss": -26.13982582092285, "global_step": 386020, "epoch": 4650} {"train_loss": -26.200332641601562, "global_step": 386021, "epoch": 4650} {"train_loss": -26.258039474487305, "global_step": 386022, "epoch": 4650} {"train_loss": -26.252838134765625, "global_step": 386023, "epoch": 4650} {"train_loss": -26.511545181274414, "global_step": 386024, "epoch": 4650} {"train_loss": -26.235736846923828, "global_step": 386025, "epoch": 4650} {"train_loss": -26.707406997680664, "global_step": 386026, "epoch": 4650} {"train_loss": -26.466978073120117, "global_step": 386027, "epoch": 4650} {"train_loss": -26.15766716003418, "global_step": 386028, "epoch": 4650} {"train_loss": -25.9548397064209, "global_step": 386029, "epoch": 4650} {"train_loss": -26.503376007080078, "global_step": 386030, "epoch": 4650} {"train_loss": -26.67548942565918, "global_step": 386031, "epoch": 4650} {"train_loss": -26.295617252947338, "global_step": 386032, "epoch": 4650, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6685948.0} {"train_loss": -25.866077423095703, "global_step": 386033, "epoch": 4651} {"train_loss": -26.108200073242188, "global_step": 386034, "epoch": 4651} {"train_loss": -25.83538818359375, "global_step": 386035, "epoch": 4651} {"train_loss": -25.877195358276367, "global_step": 386036, "epoch": 4651} {"train_loss": -26.163406372070312, "global_step": 386037, "epoch": 4651} {"train_loss": -26.107690811157227, "global_step": 386038, "epoch": 4651} {"train_loss": -26.225255966186523, "global_step": 386039, "epoch": 4651} {"train_loss": -25.999109268188477, "global_step": 386040, "epoch": 4651} {"train_loss": -26.255462646484375, "global_step": 386041, "epoch": 4651} {"train_loss": -25.89884376525879, "global_step": 386042, "epoch": 4651} {"train_loss": -26.658361434936523, "global_step": 386043, "epoch": 4651} {"train_loss": -26.01869010925293, "global_step": 386044, "epoch": 4651} {"train_loss": -26.560714721679688, "global_step": 386045, "epoch": 4651} {"train_loss": -26.21189308166504, "global_step": 386046, "epoch": 4651} {"train_loss": -26.138565063476562, "global_step": 386047, "epoch": 4651} {"train_loss": -26.45221519470215, "global_step": 386048, "epoch": 4651} {"train_loss": -26.311023712158203, "global_step": 386049, "epoch": 4651} {"train_loss": -26.64316177368164, "global_step": 386050, "epoch": 4651} {"train_loss": -26.422210693359375, "global_step": 386051, "epoch": 4651} {"train_loss": -26.618154525756836, "global_step": 386052, "epoch": 4651} {"train_loss": -26.4433650970459, "global_step": 386053, "epoch": 4651} {"train_loss": -26.350793838500977, "global_step": 386054, "epoch": 4651} {"train_loss": -26.368371963500977, "global_step": 386055, "epoch": 4651} {"train_loss": -26.140222549438477, "global_step": 386056, "epoch": 4651} {"train_loss": -26.870899200439453, "global_step": 386057, "epoch": 4651} {"train_loss": -26.498632431030273, "global_step": 386058, "epoch": 4651} {"train_loss": -26.672443389892578, "global_step": 386059, "epoch": 4651} {"train_loss": -26.466093063354492, "global_step": 386060, "epoch": 4651} {"train_loss": -26.450830459594727, "global_step": 386061, "epoch": 4651} {"train_loss": -26.73841667175293, "global_step": 386062, "epoch": 4651} {"train_loss": -26.54823112487793, "global_step": 386063, "epoch": 4651} {"train_loss": -27.039508819580078, "global_step": 386064, "epoch": 4651} {"train_loss": -26.724552154541016, "global_step": 386065, "epoch": 4651} {"train_loss": -26.29611587524414, "global_step": 386066, "epoch": 4651} {"train_loss": -26.6536808013916, "global_step": 386067, "epoch": 4651} {"train_loss": -26.508743286132812, "global_step": 386068, "epoch": 4651} {"train_loss": -26.388158798217773, "global_step": 386069, "epoch": 4651} {"train_loss": -26.538288116455078, "global_step": 386070, "epoch": 4651} {"train_loss": -26.4959659576416, "global_step": 386071, "epoch": 4651} {"train_loss": -26.57342529296875, "global_step": 386072, "epoch": 4651} {"train_loss": -26.4102840423584, "global_step": 386073, "epoch": 4651} {"train_loss": -26.649206161499023, "global_step": 386074, "epoch": 4651} {"train_loss": -26.626195907592773, "global_step": 386075, "epoch": 4651} {"train_loss": -26.337112426757812, "global_step": 386076, "epoch": 4651} {"train_loss": -26.691160202026367, "global_step": 386077, "epoch": 4651} {"train_loss": -26.86567497253418, "global_step": 386078, "epoch": 4651} {"train_loss": -26.556812286376953, "global_step": 386079, "epoch": 4651} {"train_loss": -26.91499137878418, "global_step": 386080, "epoch": 4651} {"train_loss": -26.506855010986328, "global_step": 386081, "epoch": 4651} {"train_loss": -26.721668243408203, "global_step": 386082, "epoch": 4651} {"train_loss": -26.857391357421875, "global_step": 386083, "epoch": 4651} {"train_loss": -26.688404083251953, "global_step": 386084, "epoch": 4651} {"train_loss": -26.598058700561523, "global_step": 386085, "epoch": 4651} {"train_loss": -26.791852951049805, "global_step": 386086, "epoch": 4651} {"train_loss": -26.982147216796875, "global_step": 386087, "epoch": 4651} {"train_loss": -26.364126205444336, "global_step": 386088, "epoch": 4651} {"train_loss": -26.5153865814209, "global_step": 386089, "epoch": 4651} {"train_loss": -26.436054229736328, "global_step": 386090, "epoch": 4651} {"train_loss": -26.747156143188477, "global_step": 386091, "epoch": 4651} {"train_loss": -26.697513580322266, "global_step": 386092, "epoch": 4651} {"train_loss": -26.775806427001953, "global_step": 386093, "epoch": 4651} {"train_loss": -26.79596519470215, "global_step": 386094, "epoch": 4651} {"train_loss": -26.646804809570312, "global_step": 386095, "epoch": 4651} {"train_loss": -26.42902183532715, "global_step": 386096, "epoch": 4651} {"train_loss": -27.044858932495117, "global_step": 386097, "epoch": 4651} {"train_loss": -26.731998443603516, "global_step": 386098, "epoch": 4651} {"train_loss": -26.364423751831055, "global_step": 386099, "epoch": 4651} {"train_loss": -26.547657012939453, "global_step": 386100, "epoch": 4651} {"train_loss": -26.491071701049805, "global_step": 386101, "epoch": 4651} {"train_loss": -26.546911239624023, "global_step": 386102, "epoch": 4651} {"train_loss": -26.3577823638916, "global_step": 386103, "epoch": 4651} {"train_loss": -26.272348403930664, "global_step": 386104, "epoch": 4651} {"train_loss": -26.43583106994629, "global_step": 386105, "epoch": 4651} {"train_loss": -25.95369529724121, "global_step": 386106, "epoch": 4651} {"train_loss": -26.60053062438965, "global_step": 386107, "epoch": 4651} {"train_loss": -26.798261642456055, "global_step": 386108, "epoch": 4651} {"train_loss": -26.657672882080078, "global_step": 386109, "epoch": 4651} {"train_loss": -26.346948623657227, "global_step": 386110, "epoch": 4651} {"train_loss": -26.417627334594727, "global_step": 386111, "epoch": 4651} {"train_loss": -26.41975212097168, "global_step": 386112, "epoch": 4651} {"train_loss": -26.26778221130371, "global_step": 386113, "epoch": 4651} {"train_loss": -26.318769454956055, "global_step": 386114, "epoch": 4651} {"train_loss": -26.47714580398008, "global_step": 386115, "epoch": 4651, "val_loss": 6532795.5} {"train_loss": -25.97933006286621, "global_step": 386116, "epoch": 4652} {"train_loss": -25.581592559814453, "global_step": 386117, "epoch": 4652} {"train_loss": -25.807785034179688, "global_step": 386118, "epoch": 4652} {"train_loss": -26.036911010742188, "global_step": 386119, "epoch": 4652} {"train_loss": -25.677825927734375, "global_step": 386120, "epoch": 4652} {"train_loss": -26.030576705932617, "global_step": 386121, "epoch": 4652} {"train_loss": -25.919607162475586, "global_step": 386122, "epoch": 4652} {"train_loss": -25.25504493713379, "global_step": 386123, "epoch": 4652} {"train_loss": -25.667539596557617, "global_step": 386124, "epoch": 4652} {"train_loss": -26.153661727905273, "global_step": 386125, "epoch": 4652} {"train_loss": -26.299243927001953, "global_step": 386126, "epoch": 4652} {"train_loss": -26.151275634765625, "global_step": 386127, "epoch": 4652} {"train_loss": -26.186355590820312, "global_step": 386128, "epoch": 4652} {"train_loss": -26.027318954467773, "global_step": 386129, "epoch": 4652} {"train_loss": -26.118738174438477, "global_step": 386130, "epoch": 4652} {"train_loss": -26.198719024658203, "global_step": 386131, "epoch": 4652} {"train_loss": -26.4006290435791, "global_step": 386132, "epoch": 4652} {"train_loss": -26.340063095092773, "global_step": 386133, "epoch": 4652} {"train_loss": -25.900365829467773, "global_step": 386134, "epoch": 4652} {"train_loss": -25.978219985961914, "global_step": 386135, "epoch": 4652} {"train_loss": -26.22950553894043, "global_step": 386136, "epoch": 4652} {"train_loss": -26.37714195251465, "global_step": 386137, "epoch": 4652} {"train_loss": -26.282567977905273, "global_step": 386138, "epoch": 4652} {"train_loss": -26.117446899414062, "global_step": 386139, "epoch": 4652} {"train_loss": -26.3956241607666, "global_step": 386140, "epoch": 4652} {"train_loss": -26.143524169921875, "global_step": 386141, "epoch": 4652} {"train_loss": -25.755294799804688, "global_step": 386142, "epoch": 4652} {"train_loss": -26.296142578125, "global_step": 386143, "epoch": 4652} {"train_loss": -26.338727951049805, "global_step": 386144, "epoch": 4652} {"train_loss": -26.434080123901367, "global_step": 386145, "epoch": 4652} {"train_loss": -26.14457130432129, "global_step": 386146, "epoch": 4652} {"train_loss": -26.384449005126953, "global_step": 386147, "epoch": 4652} {"train_loss": -26.193592071533203, "global_step": 386148, "epoch": 4652} {"train_loss": -26.501266479492188, "global_step": 386149, "epoch": 4652} {"train_loss": -26.267126083374023, "global_step": 386150, "epoch": 4652} {"train_loss": -26.5871639251709, "global_step": 386151, "epoch": 4652} {"train_loss": -26.277053833007812, "global_step": 386152, "epoch": 4652} {"train_loss": -26.695865631103516, "global_step": 386153, "epoch": 4652} {"train_loss": -26.17766761779785, "global_step": 386154, "epoch": 4652} {"train_loss": -26.5899658203125, "global_step": 386155, "epoch": 4652} {"train_loss": -26.51584815979004, "global_step": 386156, "epoch": 4652} {"train_loss": -26.276611328125, "global_step": 386157, "epoch": 4652} {"train_loss": -26.17340660095215, "global_step": 386158, "epoch": 4652} {"train_loss": -26.57309341430664, "global_step": 386159, "epoch": 4652} {"train_loss": -26.152725219726562, "global_step": 386160, "epoch": 4652} {"train_loss": -26.388574600219727, "global_step": 386161, "epoch": 4652} {"train_loss": -26.445301055908203, "global_step": 386162, "epoch": 4652} {"train_loss": -26.620656967163086, "global_step": 386163, "epoch": 4652} {"train_loss": -26.541202545166016, "global_step": 386164, "epoch": 4652} {"train_loss": -26.353656768798828, "global_step": 386165, "epoch": 4652} {"train_loss": -26.527692794799805, "global_step": 386166, "epoch": 4652} {"train_loss": -26.607162475585938, "global_step": 386167, "epoch": 4652} {"train_loss": -26.377853393554688, "global_step": 386168, "epoch": 4652} {"train_loss": -26.53254508972168, "global_step": 386169, "epoch": 4652} {"train_loss": -25.72908592224121, "global_step": 386170, "epoch": 4652} {"train_loss": -26.19550895690918, "global_step": 386171, "epoch": 4652} {"train_loss": -26.612049102783203, "global_step": 386172, "epoch": 4652} {"train_loss": -26.591400146484375, "global_step": 386173, "epoch": 4652} {"train_loss": -26.68820571899414, "global_step": 386174, "epoch": 4652} {"train_loss": -26.390134811401367, "global_step": 386175, "epoch": 4652} {"train_loss": -26.627368927001953, "global_step": 386176, "epoch": 4652} {"train_loss": -26.59505271911621, "global_step": 386177, "epoch": 4652} {"train_loss": -26.491180419921875, "global_step": 386178, "epoch": 4652} {"train_loss": -26.73000144958496, "global_step": 386179, "epoch": 4652} {"train_loss": -26.685321807861328, "global_step": 386180, "epoch": 4652} {"train_loss": -26.441015243530273, "global_step": 386181, "epoch": 4652} {"train_loss": -26.948535919189453, "global_step": 386182, "epoch": 4652} {"train_loss": -26.883649826049805, "global_step": 386183, "epoch": 4652} {"train_loss": -26.657745361328125, "global_step": 386184, "epoch": 4652} {"train_loss": -26.4796199798584, "global_step": 386185, "epoch": 4652} {"train_loss": -26.529312133789062, "global_step": 386186, "epoch": 4652} {"train_loss": -26.82219886779785, "global_step": 386187, "epoch": 4652} {"train_loss": -26.691015243530273, "global_step": 386188, "epoch": 4652} {"train_loss": -26.44532585144043, "global_step": 386189, "epoch": 4652} {"train_loss": -26.855539321899414, "global_step": 386190, "epoch": 4652} {"train_loss": -26.635162353515625, "global_step": 386191, "epoch": 4652} {"train_loss": -26.46628761291504, "global_step": 386192, "epoch": 4652} {"train_loss": -26.874847412109375, "global_step": 386193, "epoch": 4652} {"train_loss": -26.93340492248535, "global_step": 386194, "epoch": 4652} {"train_loss": -27.051542282104492, "global_step": 386195, "epoch": 4652} {"train_loss": -26.625349044799805, "global_step": 386196, "epoch": 4652} {"train_loss": -26.648645401000977, "global_step": 386197, "epoch": 4652} {"train_loss": -26.363700981599738, "global_step": 386198, "epoch": 4652, "val_loss": 6587649.0} {"train_loss": -26.0849666595459, "global_step": 386199, "epoch": 4653} {"train_loss": -26.0093936920166, "global_step": 386200, "epoch": 4653} {"train_loss": -26.008176803588867, "global_step": 386201, "epoch": 4653} {"train_loss": -26.5339298248291, "global_step": 386202, "epoch": 4653} {"train_loss": -25.961944580078125, "global_step": 386203, "epoch": 4653} {"train_loss": -25.99722671508789, "global_step": 386204, "epoch": 4653} {"train_loss": -25.938404083251953, "global_step": 386205, "epoch": 4653} {"train_loss": -25.90369987487793, "global_step": 386206, "epoch": 4653} {"train_loss": -26.23822021484375, "global_step": 386207, "epoch": 4653} {"train_loss": -26.145538330078125, "global_step": 386208, "epoch": 4653} {"train_loss": -26.2514591217041, "global_step": 386209, "epoch": 4653} {"train_loss": -26.259326934814453, "global_step": 386210, "epoch": 4653} {"train_loss": -26.549169540405273, "global_step": 386211, "epoch": 4653} {"train_loss": -26.736658096313477, "global_step": 386212, "epoch": 4653} {"train_loss": -26.44461441040039, "global_step": 386213, "epoch": 4653} {"train_loss": -26.05881690979004, "global_step": 386214, "epoch": 4653} {"train_loss": -26.064167022705078, "global_step": 386215, "epoch": 4653} {"train_loss": -26.59388542175293, "global_step": 386216, "epoch": 4653} {"train_loss": -26.28082847595215, "global_step": 386217, "epoch": 4653} {"train_loss": -26.58086585998535, "global_step": 386218, "epoch": 4653} {"train_loss": -26.222192764282227, "global_step": 386219, "epoch": 4653} {"train_loss": -26.905546188354492, "global_step": 386220, "epoch": 4653} {"train_loss": -26.061599731445312, "global_step": 386221, "epoch": 4653} {"train_loss": -26.18377113342285, "global_step": 386222, "epoch": 4653} {"train_loss": -26.312610626220703, "global_step": 386223, "epoch": 4653} {"train_loss": -26.469314575195312, "global_step": 386224, "epoch": 4653} {"train_loss": -26.151458740234375, "global_step": 386225, "epoch": 4653} {"train_loss": -26.300146102905273, "global_step": 386226, "epoch": 4653} {"train_loss": -26.568021774291992, "global_step": 386227, "epoch": 4653} {"train_loss": -26.28927993774414, "global_step": 386228, "epoch": 4653} {"train_loss": -26.381027221679688, "global_step": 386229, "epoch": 4653} {"train_loss": -26.253015518188477, "global_step": 386230, "epoch": 4653} {"train_loss": -26.4659423828125, "global_step": 386231, "epoch": 4653} {"train_loss": -26.376724243164062, "global_step": 386232, "epoch": 4653} {"train_loss": -26.62030601501465, "global_step": 386233, "epoch": 4653} {"train_loss": -26.672595977783203, "global_step": 386234, "epoch": 4653} {"train_loss": -26.819721221923828, "global_step": 386235, "epoch": 4653} {"train_loss": -26.36569595336914, "global_step": 386236, "epoch": 4653} {"train_loss": -26.99757194519043, "global_step": 386237, "epoch": 4653} {"train_loss": -26.38490867614746, "global_step": 386238, "epoch": 4653} {"train_loss": -26.63437843322754, "global_step": 386239, "epoch": 4653} {"train_loss": -26.737934112548828, "global_step": 386240, "epoch": 4653} {"train_loss": -26.7468204498291, "global_step": 386241, "epoch": 4653} {"train_loss": -26.424701690673828, "global_step": 386242, "epoch": 4653} {"train_loss": -26.562265396118164, "global_step": 386243, "epoch": 4653} {"train_loss": -26.578771591186523, "global_step": 386244, "epoch": 4653} {"train_loss": -26.966699600219727, "global_step": 386245, "epoch": 4653} {"train_loss": -26.775928497314453, "global_step": 386246, "epoch": 4653} {"train_loss": -26.6184139251709, "global_step": 386247, "epoch": 4653} {"train_loss": -26.279544830322266, "global_step": 386248, "epoch": 4653} {"train_loss": -26.313501358032227, "global_step": 386249, "epoch": 4653} {"train_loss": -26.607486724853516, "global_step": 386250, "epoch": 4653} {"train_loss": -26.831928253173828, "global_step": 386251, "epoch": 4653} {"train_loss": -27.047719955444336, "global_step": 386252, "epoch": 4653} {"train_loss": -26.262964248657227, "global_step": 386253, "epoch": 4653} {"train_loss": -26.665735244750977, "global_step": 386254, "epoch": 4653} {"train_loss": -26.34766960144043, "global_step": 386255, "epoch": 4653} {"train_loss": -26.678913116455078, "global_step": 386256, "epoch": 4653} {"train_loss": -26.787067413330078, "global_step": 386257, "epoch": 4653} {"train_loss": -26.90089225769043, "global_step": 386258, "epoch": 4653} {"train_loss": -26.61555290222168, "global_step": 386259, "epoch": 4653} {"train_loss": -26.501859664916992, "global_step": 386260, "epoch": 4653} {"train_loss": -26.69077491760254, "global_step": 386261, "epoch": 4653} {"train_loss": -26.325448989868164, "global_step": 386262, "epoch": 4653} {"train_loss": -26.591156005859375, "global_step": 386263, "epoch": 4653} {"train_loss": -26.2923583984375, "global_step": 386264, "epoch": 4653} {"train_loss": -26.680768966674805, "global_step": 386265, "epoch": 4653} {"train_loss": -26.270795822143555, "global_step": 386266, "epoch": 4653} {"train_loss": -26.768661499023438, "global_step": 386267, "epoch": 4653} {"train_loss": -26.596668243408203, "global_step": 386268, "epoch": 4653} {"train_loss": -26.804441452026367, "global_step": 386269, "epoch": 4653} {"train_loss": -27.128814697265625, "global_step": 386270, "epoch": 4653} {"train_loss": -26.33359718322754, "global_step": 386271, "epoch": 4653} {"train_loss": -26.204456329345703, "global_step": 386272, "epoch": 4653} {"train_loss": -25.703100204467773, "global_step": 386273, "epoch": 4653} {"train_loss": -25.975622177124023, "global_step": 386274, "epoch": 4653} {"train_loss": -26.362125396728516, "global_step": 386275, "epoch": 4653} {"train_loss": -26.173263549804688, "global_step": 386276, "epoch": 4653} {"train_loss": -26.814077377319336, "global_step": 386277, "epoch": 4653} {"train_loss": -26.57718849182129, "global_step": 386278, "epoch": 4653} {"train_loss": -26.188495635986328, "global_step": 386279, "epoch": 4653} {"train_loss": -26.411996841430664, "global_step": 386280, "epoch": 4653} {"train_loss": -26.44011299868664, "global_step": 386281, "epoch": 4653, "val_loss": 6586131.0} {"train_loss": -25.840545654296875, "global_step": 386282, "epoch": 4654} {"train_loss": -25.539703369140625, "global_step": 386283, "epoch": 4654} {"train_loss": -25.11408042907715, "global_step": 386284, "epoch": 4654} {"train_loss": -25.556427001953125, "global_step": 386285, "epoch": 4654} {"train_loss": -25.772428512573242, "global_step": 386286, "epoch": 4654} {"train_loss": -25.872419357299805, "global_step": 386287, "epoch": 4654} {"train_loss": -25.798934936523438, "global_step": 386288, "epoch": 4654} {"train_loss": -25.978544235229492, "global_step": 386289, "epoch": 4654} {"train_loss": -25.649465560913086, "global_step": 386290, "epoch": 4654} {"train_loss": -26.377851486206055, "global_step": 386291, "epoch": 4654} {"train_loss": -25.680097579956055, "global_step": 386292, "epoch": 4654} {"train_loss": -25.837873458862305, "global_step": 386293, "epoch": 4654} {"train_loss": -26.05328369140625, "global_step": 386294, "epoch": 4654} {"train_loss": -25.786579132080078, "global_step": 386295, "epoch": 4654} {"train_loss": -25.685216903686523, "global_step": 386296, "epoch": 4654} {"train_loss": -26.065454483032227, "global_step": 386297, "epoch": 4654} {"train_loss": -25.92608070373535, "global_step": 386298, "epoch": 4654} {"train_loss": -26.076889038085938, "global_step": 386299, "epoch": 4654} {"train_loss": -25.866296768188477, "global_step": 386300, "epoch": 4654} {"train_loss": -25.912582397460938, "global_step": 386301, "epoch": 4654} {"train_loss": -26.149099349975586, "global_step": 386302, "epoch": 4654} {"train_loss": -26.192365646362305, "global_step": 386303, "epoch": 4654} {"train_loss": -25.955148696899414, "global_step": 386304, "epoch": 4654} {"train_loss": -26.2402400970459, "global_step": 386305, "epoch": 4654} {"train_loss": -26.513782501220703, "global_step": 386306, "epoch": 4654} {"train_loss": -26.548969268798828, "global_step": 386307, "epoch": 4654} {"train_loss": -26.2253360748291, "global_step": 386308, "epoch": 4654} {"train_loss": -26.345853805541992, "global_step": 386309, "epoch": 4654} {"train_loss": -26.20047950744629, "global_step": 386310, "epoch": 4654} {"train_loss": -26.320486068725586, "global_step": 386311, "epoch": 4654} {"train_loss": -26.659738540649414, "global_step": 386312, "epoch": 4654} {"train_loss": -26.57735252380371, "global_step": 386313, "epoch": 4654} {"train_loss": -26.7011661529541, "global_step": 386314, "epoch": 4654} {"train_loss": -26.42054557800293, "global_step": 386315, "epoch": 4654} {"train_loss": -26.772512435913086, "global_step": 386316, "epoch": 4654} {"train_loss": -26.598554611206055, "global_step": 386317, "epoch": 4654} {"train_loss": -26.867141723632812, "global_step": 386318, "epoch": 4654} {"train_loss": -26.44775390625, "global_step": 386319, "epoch": 4654} {"train_loss": -26.718536376953125, "global_step": 386320, "epoch": 4654} {"train_loss": -26.765905380249023, "global_step": 386321, "epoch": 4654} {"train_loss": -26.54047966003418, "global_step": 386322, "epoch": 4654} {"train_loss": -26.895273208618164, "global_step": 386323, "epoch": 4654} {"train_loss": -26.499969482421875, "global_step": 386324, "epoch": 4654} {"train_loss": -26.798574447631836, "global_step": 386325, "epoch": 4654} {"train_loss": -26.6446475982666, "global_step": 386326, "epoch": 4654} {"train_loss": -26.67355728149414, "global_step": 386327, "epoch": 4654} {"train_loss": -26.742719650268555, "global_step": 386328, "epoch": 4654} {"train_loss": -26.6695499420166, "global_step": 386329, "epoch": 4654} {"train_loss": -26.490966796875, "global_step": 386330, "epoch": 4654} {"train_loss": -26.553638458251953, "global_step": 386331, "epoch": 4654} {"train_loss": -26.881696701049805, "global_step": 386332, "epoch": 4654} {"train_loss": -27.12827491760254, "global_step": 386333, "epoch": 4654} {"train_loss": -26.7512264251709, "global_step": 386334, "epoch": 4654} {"train_loss": -26.35865592956543, "global_step": 386335, "epoch": 4654} {"train_loss": -26.73712730407715, "global_step": 386336, "epoch": 4654} {"train_loss": -26.467451095581055, "global_step": 386337, "epoch": 4654} {"train_loss": -26.423730850219727, "global_step": 386338, "epoch": 4654} {"train_loss": -26.667200088500977, "global_step": 386339, "epoch": 4654} {"train_loss": -25.540555953979492, "global_step": 386340, "epoch": 4654} {"train_loss": -24.714710235595703, "global_step": 386341, "epoch": 4654} {"train_loss": -25.53458023071289, "global_step": 386342, "epoch": 4654} {"train_loss": -25.961292266845703, "global_step": 386343, "epoch": 4654} {"train_loss": -25.52789306640625, "global_step": 386344, "epoch": 4654} {"train_loss": -26.234811782836914, "global_step": 386345, "epoch": 4654} {"train_loss": -26.16449546813965, "global_step": 386346, "epoch": 4654} {"train_loss": -26.23341178894043, "global_step": 386347, "epoch": 4654} {"train_loss": -26.096790313720703, "global_step": 386348, "epoch": 4654} {"train_loss": -26.321027755737305, "global_step": 386349, "epoch": 4654} {"train_loss": -26.530969619750977, "global_step": 386350, "epoch": 4654} {"train_loss": -26.277698516845703, "global_step": 386351, "epoch": 4654} {"train_loss": -25.968931198120117, "global_step": 386352, "epoch": 4654} {"train_loss": -26.416040420532227, "global_step": 386353, "epoch": 4654} {"train_loss": -25.73834228515625, "global_step": 386354, "epoch": 4654} {"train_loss": -26.38157081604004, "global_step": 386355, "epoch": 4654} {"train_loss": -26.24617576599121, "global_step": 386356, "epoch": 4654} {"train_loss": -26.556196212768555, "global_step": 386357, "epoch": 4654} {"train_loss": -26.169330596923828, "global_step": 386358, "epoch": 4654} {"train_loss": -25.67453956604004, "global_step": 386359, "epoch": 4654} {"train_loss": -26.740461349487305, "global_step": 386360, "epoch": 4654} {"train_loss": -26.2437686920166, "global_step": 386361, "epoch": 4654} {"train_loss": -26.378644943237305, "global_step": 386362, "epoch": 4654} {"train_loss": -26.16790199279785, "global_step": 386363, "epoch": 4654} {"train_loss": -26.243864243289075, "global_step": 386364, "epoch": 4654, "val_loss": 6543945.0} {"train_loss": -25.75543785095215, "global_step": 386365, "epoch": 4655} {"train_loss": -25.586618423461914, "global_step": 386366, "epoch": 4655} {"train_loss": -25.774738311767578, "global_step": 386367, "epoch": 4655} {"train_loss": -26.204328536987305, "global_step": 386368, "epoch": 4655} {"train_loss": -26.0669002532959, "global_step": 386369, "epoch": 4655} {"train_loss": -26.18111228942871, "global_step": 386370, "epoch": 4655} {"train_loss": -26.29913330078125, "global_step": 386371, "epoch": 4655} {"train_loss": -26.001001358032227, "global_step": 386372, "epoch": 4655} {"train_loss": -26.2888240814209, "global_step": 386373, "epoch": 4655} {"train_loss": -26.071996688842773, "global_step": 386374, "epoch": 4655} {"train_loss": -26.270401000976562, "global_step": 386375, "epoch": 4655} {"train_loss": -26.24287986755371, "global_step": 386376, "epoch": 4655} {"train_loss": -26.1979923248291, "global_step": 386377, "epoch": 4655} {"train_loss": -26.255355834960938, "global_step": 386378, "epoch": 4655} {"train_loss": -26.395172119140625, "global_step": 386379, "epoch": 4655} {"train_loss": -26.369604110717773, "global_step": 386380, "epoch": 4655} {"train_loss": -26.490234375, "global_step": 386381, "epoch": 4655} {"train_loss": -26.584396362304688, "global_step": 386382, "epoch": 4655} {"train_loss": -26.4810733795166, "global_step": 386383, "epoch": 4655} {"train_loss": -26.424823760986328, "global_step": 386384, "epoch": 4655} {"train_loss": -26.516498565673828, "global_step": 386385, "epoch": 4655} {"train_loss": -26.628400802612305, "global_step": 386386, "epoch": 4655} {"train_loss": -26.288537979125977, "global_step": 386387, "epoch": 4655} {"train_loss": -26.551422119140625, "global_step": 386388, "epoch": 4655} {"train_loss": -26.676660537719727, "global_step": 386389, "epoch": 4655} {"train_loss": -26.25299072265625, "global_step": 386390, "epoch": 4655} {"train_loss": -26.7132511138916, "global_step": 386391, "epoch": 4655} {"train_loss": -26.3560848236084, "global_step": 386392, "epoch": 4655} {"train_loss": -26.67561912536621, "global_step": 386393, "epoch": 4655} {"train_loss": -26.790084838867188, "global_step": 386394, "epoch": 4655} {"train_loss": -26.319976806640625, "global_step": 386395, "epoch": 4655} {"train_loss": -26.627248764038086, "global_step": 386396, "epoch": 4655} {"train_loss": -26.548593521118164, "global_step": 386397, "epoch": 4655} {"train_loss": -26.405317306518555, "global_step": 386398, "epoch": 4655} {"train_loss": -26.544897079467773, "global_step": 386399, "epoch": 4655} {"train_loss": -26.953876495361328, "global_step": 386400, "epoch": 4655} {"train_loss": -26.7960147857666, "global_step": 386401, "epoch": 4655} {"train_loss": -26.60346794128418, "global_step": 386402, "epoch": 4655} {"train_loss": -26.896493911743164, "global_step": 386403, "epoch": 4655} {"train_loss": -26.426050186157227, "global_step": 386404, "epoch": 4655} {"train_loss": -26.627233505249023, "global_step": 386405, "epoch": 4655} {"train_loss": -27.168197631835938, "global_step": 386406, "epoch": 4655} {"train_loss": -26.98360252380371, "global_step": 386407, "epoch": 4655} {"train_loss": -26.77776527404785, "global_step": 386408, "epoch": 4655} {"train_loss": -26.753955841064453, "global_step": 386409, "epoch": 4655} {"train_loss": -26.664209365844727, "global_step": 386410, "epoch": 4655} {"train_loss": -26.860034942626953, "global_step": 386411, "epoch": 4655} {"train_loss": -26.974628448486328, "global_step": 386412, "epoch": 4655} {"train_loss": -26.477069854736328, "global_step": 386413, "epoch": 4655} {"train_loss": -26.961267471313477, "global_step": 386414, "epoch": 4655} {"train_loss": -26.7109432220459, "global_step": 386415, "epoch": 4655} {"train_loss": -27.076658248901367, "global_step": 386416, "epoch": 4655} {"train_loss": -26.23525047302246, "global_step": 386417, "epoch": 4655} {"train_loss": -25.819910049438477, "global_step": 386418, "epoch": 4655} {"train_loss": -25.454675674438477, "global_step": 386419, "epoch": 4655} {"train_loss": -24.63215446472168, "global_step": 386420, "epoch": 4655} {"train_loss": -24.461923599243164, "global_step": 386421, "epoch": 4655} {"train_loss": -24.57472801208496, "global_step": 386422, "epoch": 4655} {"train_loss": -25.8114013671875, "global_step": 386423, "epoch": 4655} {"train_loss": -26.34986686706543, "global_step": 386424, "epoch": 4655} {"train_loss": -25.406757354736328, "global_step": 386425, "epoch": 4655} {"train_loss": -25.940876007080078, "global_step": 386426, "epoch": 4655} {"train_loss": -26.259445190429688, "global_step": 386427, "epoch": 4655} {"train_loss": -26.154386520385742, "global_step": 386428, "epoch": 4655} {"train_loss": -25.723865509033203, "global_step": 386429, "epoch": 4655} {"train_loss": -25.786283493041992, "global_step": 386430, "epoch": 4655} {"train_loss": -25.899188995361328, "global_step": 386431, "epoch": 4655} {"train_loss": -25.84842872619629, "global_step": 386432, "epoch": 4655} {"train_loss": -25.739505767822266, "global_step": 386433, "epoch": 4655} {"train_loss": -26.007726669311523, "global_step": 386434, "epoch": 4655} {"train_loss": -26.105377197265625, "global_step": 386435, "epoch": 4655} {"train_loss": -26.24704360961914, "global_step": 386436, "epoch": 4655} {"train_loss": -26.203601837158203, "global_step": 386437, "epoch": 4655} {"train_loss": -26.147979736328125, "global_step": 386438, "epoch": 4655} {"train_loss": -26.157901763916016, "global_step": 386439, "epoch": 4655} {"train_loss": -26.303958892822266, "global_step": 386440, "epoch": 4655} {"train_loss": -26.11275291442871, "global_step": 386441, "epoch": 4655} {"train_loss": -26.342071533203125, "global_step": 386442, "epoch": 4655} {"train_loss": -26.321796417236328, "global_step": 386443, "epoch": 4655} {"train_loss": -26.343835830688477, "global_step": 386444, "epoch": 4655} {"train_loss": -26.19537353515625, "global_step": 386445, "epoch": 4655} {"train_loss": -26.026721954345703, "global_step": 386446, "epoch": 4655} {"train_loss": -26.288662324468774, "global_step": 386447, "epoch": 4655, "val_loss": 6596473.0} {"train_loss": -26.1313419342041, "global_step": 386448, "epoch": 4656} {"train_loss": -25.83577537536621, "global_step": 386449, "epoch": 4656} {"train_loss": -25.904621124267578, "global_step": 386450, "epoch": 4656} {"train_loss": -26.287649154663086, "global_step": 386451, "epoch": 4656} {"train_loss": -26.22926139831543, "global_step": 386452, "epoch": 4656} {"train_loss": -26.344818115234375, "global_step": 386453, "epoch": 4656} {"train_loss": -26.40693473815918, "global_step": 386454, "epoch": 4656} {"train_loss": -26.082334518432617, "global_step": 386455, "epoch": 4656} {"train_loss": -26.2423095703125, "global_step": 386456, "epoch": 4656} {"train_loss": -26.49732780456543, "global_step": 386457, "epoch": 4656} {"train_loss": -26.246557235717773, "global_step": 386458, "epoch": 4656} {"train_loss": -26.313434600830078, "global_step": 386459, "epoch": 4656} {"train_loss": -26.0692138671875, "global_step": 386460, "epoch": 4656} {"train_loss": -26.426992416381836, "global_step": 386461, "epoch": 4656} {"train_loss": -26.30559730529785, "global_step": 386462, "epoch": 4656} {"train_loss": -26.47368812561035, "global_step": 386463, "epoch": 4656} {"train_loss": -26.258264541625977, "global_step": 386464, "epoch": 4656} {"train_loss": -26.505807876586914, "global_step": 386465, "epoch": 4656} {"train_loss": -26.14703369140625, "global_step": 386466, "epoch": 4656} {"train_loss": -26.324878692626953, "global_step": 386467, "epoch": 4656} {"train_loss": -26.541540145874023, "global_step": 386468, "epoch": 4656} {"train_loss": -26.1881160736084, "global_step": 386469, "epoch": 4656} {"train_loss": -26.365314483642578, "global_step": 386470, "epoch": 4656} {"train_loss": -26.418994903564453, "global_step": 386471, "epoch": 4656} {"train_loss": -26.644454956054688, "global_step": 386472, "epoch": 4656} {"train_loss": -26.51010513305664, "global_step": 386473, "epoch": 4656} {"train_loss": -26.452621459960938, "global_step": 386474, "epoch": 4656} {"train_loss": -26.685094833374023, "global_step": 386475, "epoch": 4656} {"train_loss": -26.517333984375, "global_step": 386476, "epoch": 4656} {"train_loss": -26.575170516967773, "global_step": 386477, "epoch": 4656} {"train_loss": -26.45465660095215, "global_step": 386478, "epoch": 4656} {"train_loss": -26.68808937072754, "global_step": 386479, "epoch": 4656} {"train_loss": -26.45218849182129, "global_step": 386480, "epoch": 4656} {"train_loss": -26.90522575378418, "global_step": 386481, "epoch": 4656} {"train_loss": -26.854352951049805, "global_step": 386482, "epoch": 4656} {"train_loss": -27.198339462280273, "global_step": 386483, "epoch": 4656} {"train_loss": -26.527063369750977, "global_step": 386484, "epoch": 4656} {"train_loss": -26.669504165649414, "global_step": 386485, "epoch": 4656} {"train_loss": -26.45411491394043, "global_step": 386486, "epoch": 4656} {"train_loss": -26.8374080657959, "global_step": 386487, "epoch": 4656} {"train_loss": -26.6304931640625, "global_step": 386488, "epoch": 4656} {"train_loss": -26.935688018798828, "global_step": 386489, "epoch": 4656} {"train_loss": -26.51641845703125, "global_step": 386490, "epoch": 4656} {"train_loss": -26.66340446472168, "global_step": 386491, "epoch": 4656} {"train_loss": -26.545459747314453, "global_step": 386492, "epoch": 4656} {"train_loss": -26.45499610900879, "global_step": 386493, "epoch": 4656} {"train_loss": -26.54640007019043, "global_step": 386494, "epoch": 4656} {"train_loss": -26.404172897338867, "global_step": 386495, "epoch": 4656} {"train_loss": -26.467817306518555, "global_step": 386496, "epoch": 4656} {"train_loss": -26.088834762573242, "global_step": 386497, "epoch": 4656} {"train_loss": -25.797317504882812, "global_step": 386498, "epoch": 4656} {"train_loss": -25.07769775390625, "global_step": 386499, "epoch": 4656} {"train_loss": -25.651208877563477, "global_step": 386500, "epoch": 4656} {"train_loss": -25.482833862304688, "global_step": 386501, "epoch": 4656} {"train_loss": -26.324087142944336, "global_step": 386502, "epoch": 4656} {"train_loss": -26.666248321533203, "global_step": 386503, "epoch": 4656} {"train_loss": -26.26502799987793, "global_step": 386504, "epoch": 4656} {"train_loss": -26.319700241088867, "global_step": 386505, "epoch": 4656} {"train_loss": -25.875898361206055, "global_step": 386506, "epoch": 4656} {"train_loss": -26.343189239501953, "global_step": 386507, "epoch": 4656} {"train_loss": -26.285449981689453, "global_step": 386508, "epoch": 4656} {"train_loss": -26.057209014892578, "global_step": 386509, "epoch": 4656} {"train_loss": -26.786865234375, "global_step": 386510, "epoch": 4656} {"train_loss": -26.303333282470703, "global_step": 386511, "epoch": 4656} {"train_loss": -26.34916114807129, "global_step": 386512, "epoch": 4656} {"train_loss": -26.45188331604004, "global_step": 386513, "epoch": 4656} {"train_loss": -26.361425399780273, "global_step": 386514, "epoch": 4656} {"train_loss": -26.712207794189453, "global_step": 386515, "epoch": 4656} {"train_loss": -26.48004722595215, "global_step": 386516, "epoch": 4656} {"train_loss": -26.489608764648438, "global_step": 386517, "epoch": 4656} {"train_loss": -26.906753540039062, "global_step": 386518, "epoch": 4656} {"train_loss": -26.80352210998535, "global_step": 386519, "epoch": 4656} {"train_loss": -26.460657119750977, "global_step": 386520, "epoch": 4656} {"train_loss": -26.283466339111328, "global_step": 386521, "epoch": 4656} {"train_loss": -26.5988826751709, "global_step": 386522, "epoch": 4656} {"train_loss": -26.44294548034668, "global_step": 386523, "epoch": 4656} {"train_loss": -26.573486328125, "global_step": 386524, "epoch": 4656} {"train_loss": -26.806903839111328, "global_step": 386525, "epoch": 4656} {"train_loss": -26.70086097717285, "global_step": 386526, "epoch": 4656} {"train_loss": -26.777753829956055, "global_step": 386527, "epoch": 4656} {"train_loss": -26.68403434753418, "global_step": 386528, "epoch": 4656} {"train_loss": -26.712665557861328, "global_step": 386529, "epoch": 4656} {"train_loss": -26.409140161721105, "global_step": 386530, "epoch": 4656, "val_loss": 6502315.0} {"train_loss": -25.740299224853516, "global_step": 386531, "epoch": 4657} {"train_loss": -24.382217407226562, "global_step": 386532, "epoch": 4657} {"train_loss": -23.972658157348633, "global_step": 386533, "epoch": 4657} {"train_loss": -25.969161987304688, "global_step": 386534, "epoch": 4657} {"train_loss": -25.077253341674805, "global_step": 386535, "epoch": 4657} {"train_loss": -24.93168067932129, "global_step": 386536, "epoch": 4657} {"train_loss": -25.00920867919922, "global_step": 386537, "epoch": 4657} {"train_loss": -25.547069549560547, "global_step": 386538, "epoch": 4657} {"train_loss": -24.764453887939453, "global_step": 386539, "epoch": 4657} {"train_loss": -26.176923751831055, "global_step": 386540, "epoch": 4657} {"train_loss": -25.970932006835938, "global_step": 386541, "epoch": 4657} {"train_loss": -25.73834800720215, "global_step": 386542, "epoch": 4657} {"train_loss": -25.997089385986328, "global_step": 386543, "epoch": 4657} {"train_loss": -25.7912540435791, "global_step": 386544, "epoch": 4657} {"train_loss": -25.711307525634766, "global_step": 386545, "epoch": 4657} {"train_loss": -26.087533950805664, "global_step": 386546, "epoch": 4657} {"train_loss": -26.08164405822754, "global_step": 386547, "epoch": 4657} {"train_loss": -25.878482818603516, "global_step": 386548, "epoch": 4657} {"train_loss": -25.87822914123535, "global_step": 386549, "epoch": 4657} {"train_loss": -26.020660400390625, "global_step": 386550, "epoch": 4657} {"train_loss": -26.21906852722168, "global_step": 386551, "epoch": 4657} {"train_loss": -25.8735294342041, "global_step": 386552, "epoch": 4657} {"train_loss": -26.21529197692871, "global_step": 386553, "epoch": 4657} {"train_loss": -25.7841854095459, "global_step": 386554, "epoch": 4657} {"train_loss": -26.05598258972168, "global_step": 386555, "epoch": 4657} {"train_loss": -25.947179794311523, "global_step": 386556, "epoch": 4657} {"train_loss": -26.4710750579834, "global_step": 386557, "epoch": 4657} {"train_loss": -26.550317764282227, "global_step": 386558, "epoch": 4657} {"train_loss": -26.371856689453125, "global_step": 386559, "epoch": 4657} {"train_loss": -26.294189453125, "global_step": 386560, "epoch": 4657} {"train_loss": -26.184106826782227, "global_step": 386561, "epoch": 4657} {"train_loss": -26.636327743530273, "global_step": 386562, "epoch": 4657} {"train_loss": -26.344396591186523, "global_step": 386563, "epoch": 4657} {"train_loss": -26.469348907470703, "global_step": 386564, "epoch": 4657} {"train_loss": -26.40911865234375, "global_step": 386565, "epoch": 4657} {"train_loss": -26.575820922851562, "global_step": 386566, "epoch": 4657} {"train_loss": -26.405105590820312, "global_step": 386567, "epoch": 4657} {"train_loss": -26.37178611755371, "global_step": 386568, "epoch": 4657} {"train_loss": -26.5313777923584, "global_step": 386569, "epoch": 4657} {"train_loss": -26.642475128173828, "global_step": 386570, "epoch": 4657} {"train_loss": -26.565185546875, "global_step": 386571, "epoch": 4657} {"train_loss": -26.608015060424805, "global_step": 386572, "epoch": 4657} {"train_loss": -26.6239070892334, "global_step": 386573, "epoch": 4657} {"train_loss": -26.371795654296875, "global_step": 386574, "epoch": 4657} {"train_loss": -26.492345809936523, "global_step": 386575, "epoch": 4657} {"train_loss": -26.271469116210938, "global_step": 386576, "epoch": 4657} {"train_loss": -26.631122589111328, "global_step": 386577, "epoch": 4657} {"train_loss": -26.859699249267578, "global_step": 386578, "epoch": 4657} {"train_loss": -26.447385787963867, "global_step": 386579, "epoch": 4657} {"train_loss": -26.4074764251709, "global_step": 386580, "epoch": 4657} {"train_loss": -26.78394889831543, "global_step": 386581, "epoch": 4657} {"train_loss": -26.563459396362305, "global_step": 386582, "epoch": 4657} {"train_loss": -26.526350021362305, "global_step": 386583, "epoch": 4657} {"train_loss": -26.577163696289062, "global_step": 386584, "epoch": 4657} {"train_loss": -26.728124618530273, "global_step": 386585, "epoch": 4657} {"train_loss": -26.761062622070312, "global_step": 386586, "epoch": 4657} {"train_loss": -26.519506454467773, "global_step": 386587, "epoch": 4657} {"train_loss": -26.55327796936035, "global_step": 386588, "epoch": 4657} {"train_loss": -26.30594825744629, "global_step": 386589, "epoch": 4657} {"train_loss": -26.77448844909668, "global_step": 386590, "epoch": 4657} {"train_loss": -26.533166885375977, "global_step": 386591, "epoch": 4657} {"train_loss": -26.856103897094727, "global_step": 386592, "epoch": 4657} {"train_loss": -26.678495407104492, "global_step": 386593, "epoch": 4657} {"train_loss": -26.602197647094727, "global_step": 386594, "epoch": 4657} {"train_loss": -26.89020347595215, "global_step": 386595, "epoch": 4657} {"train_loss": -26.875446319580078, "global_step": 386596, "epoch": 4657} {"train_loss": -26.979291915893555, "global_step": 386597, "epoch": 4657} {"train_loss": -26.675336837768555, "global_step": 386598, "epoch": 4657} {"train_loss": -26.353595733642578, "global_step": 386599, "epoch": 4657} {"train_loss": -26.205673217773438, "global_step": 386600, "epoch": 4657} {"train_loss": -26.500568389892578, "global_step": 386601, "epoch": 4657} {"train_loss": -26.31182289123535, "global_step": 386602, "epoch": 4657} {"train_loss": -26.395822525024414, "global_step": 386603, "epoch": 4657} {"train_loss": -26.622314453125, "global_step": 386604, "epoch": 4657} {"train_loss": -26.490997314453125, "global_step": 386605, "epoch": 4657} {"train_loss": -26.777578353881836, "global_step": 386606, "epoch": 4657} {"train_loss": -26.3491153717041, "global_step": 386607, "epoch": 4657} {"train_loss": -27.004159927368164, "global_step": 386608, "epoch": 4657} {"train_loss": -26.209552764892578, "global_step": 386609, "epoch": 4657} {"train_loss": -26.320037841796875, "global_step": 386610, "epoch": 4657} {"train_loss": -26.717649459838867, "global_step": 386611, "epoch": 4657} {"train_loss": -27.06032371520996, "global_step": 386612, "epoch": 4657} {"train_loss": -26.25745265455131, "global_step": 386613, "epoch": 4657, "val_loss": 6585615.0} {"train_loss": -26.09111976623535, "global_step": 386614, "epoch": 4658} {"train_loss": -25.48880386352539, "global_step": 386615, "epoch": 4658} {"train_loss": -25.893924713134766, "global_step": 386616, "epoch": 4658} {"train_loss": -25.849958419799805, "global_step": 386617, "epoch": 4658} {"train_loss": -26.400663375854492, "global_step": 386618, "epoch": 4658} {"train_loss": -25.890472412109375, "global_step": 386619, "epoch": 4658} {"train_loss": -26.129682540893555, "global_step": 386620, "epoch": 4658} {"train_loss": -26.10564613342285, "global_step": 386621, "epoch": 4658} {"train_loss": -26.209228515625, "global_step": 386622, "epoch": 4658} {"train_loss": -26.4609375, "global_step": 386623, "epoch": 4658} {"train_loss": -26.319355010986328, "global_step": 386624, "epoch": 4658} {"train_loss": -26.360702514648438, "global_step": 386625, "epoch": 4658} {"train_loss": -26.492124557495117, "global_step": 386626, "epoch": 4658} {"train_loss": -26.216400146484375, "global_step": 386627, "epoch": 4658} {"train_loss": -26.1408748626709, "global_step": 386628, "epoch": 4658} {"train_loss": -26.364933013916016, "global_step": 386629, "epoch": 4658} {"train_loss": -26.111352920532227, "global_step": 386630, "epoch": 4658} {"train_loss": -26.39808464050293, "global_step": 386631, "epoch": 4658} {"train_loss": -26.443838119506836, "global_step": 386632, "epoch": 4658} {"train_loss": -26.66845703125, "global_step": 386633, "epoch": 4658} {"train_loss": -26.613248825073242, "global_step": 386634, "epoch": 4658} {"train_loss": -26.5010986328125, "global_step": 386635, "epoch": 4658} {"train_loss": -26.33399772644043, "global_step": 386636, "epoch": 4658} {"train_loss": -26.246143341064453, "global_step": 386637, "epoch": 4658} {"train_loss": -26.770954132080078, "global_step": 386638, "epoch": 4658} {"train_loss": -26.59980583190918, "global_step": 386639, "epoch": 4658} {"train_loss": -26.37641716003418, "global_step": 386640, "epoch": 4658} {"train_loss": -26.11174964904785, "global_step": 386641, "epoch": 4658} {"train_loss": -26.55506706237793, "global_step": 386642, "epoch": 4658} {"train_loss": -26.605316162109375, "global_step": 386643, "epoch": 4658} {"train_loss": -26.610355377197266, "global_step": 386644, "epoch": 4658} {"train_loss": -26.5360164642334, "global_step": 386645, "epoch": 4658} {"train_loss": -26.561603546142578, "global_step": 386646, "epoch": 4658} {"train_loss": -26.363203048706055, "global_step": 386647, "epoch": 4658} {"train_loss": -27.064558029174805, "global_step": 386648, "epoch": 4658} {"train_loss": -26.396148681640625, "global_step": 386649, "epoch": 4658} {"train_loss": -26.621667861938477, "global_step": 386650, "epoch": 4658} {"train_loss": -26.461851119995117, "global_step": 386651, "epoch": 4658} {"train_loss": -26.528589248657227, "global_step": 386652, "epoch": 4658} {"train_loss": -26.361677169799805, "global_step": 386653, "epoch": 4658} {"train_loss": -26.81512451171875, "global_step": 386654, "epoch": 4658} {"train_loss": -26.643665313720703, "global_step": 386655, "epoch": 4658} {"train_loss": -26.7611026763916, "global_step": 386656, "epoch": 4658} {"train_loss": -26.17316246032715, "global_step": 386657, "epoch": 4658} {"train_loss": -26.542804718017578, "global_step": 386658, "epoch": 4658} {"train_loss": -26.345489501953125, "global_step": 386659, "epoch": 4658} {"train_loss": -26.069473266601562, "global_step": 386660, "epoch": 4658} {"train_loss": -26.497846603393555, "global_step": 386661, "epoch": 4658} {"train_loss": -25.832738876342773, "global_step": 386662, "epoch": 4658} {"train_loss": -26.544137954711914, "global_step": 386663, "epoch": 4658} {"train_loss": -26.6258487701416, "global_step": 386664, "epoch": 4658} {"train_loss": -26.055286407470703, "global_step": 386665, "epoch": 4658} {"train_loss": -26.585851669311523, "global_step": 386666, "epoch": 4658} {"train_loss": -26.629602432250977, "global_step": 386667, "epoch": 4658} {"train_loss": -26.312408447265625, "global_step": 386668, "epoch": 4658} {"train_loss": -26.431640625, "global_step": 386669, "epoch": 4658} {"train_loss": -26.624774932861328, "global_step": 386670, "epoch": 4658} {"train_loss": -26.19080924987793, "global_step": 386671, "epoch": 4658} {"train_loss": -26.838659286499023, "global_step": 386672, "epoch": 4658} {"train_loss": -26.772729873657227, "global_step": 386673, "epoch": 4658} {"train_loss": -26.2602596282959, "global_step": 386674, "epoch": 4658} {"train_loss": -26.996305465698242, "global_step": 386675, "epoch": 4658} {"train_loss": -26.529443740844727, "global_step": 386676, "epoch": 4658} {"train_loss": -26.090742111206055, "global_step": 386677, "epoch": 4658} {"train_loss": -26.46713638305664, "global_step": 386678, "epoch": 4658} {"train_loss": -26.352630615234375, "global_step": 386679, "epoch": 4658} {"train_loss": -26.45401954650879, "global_step": 386680, "epoch": 4658} {"train_loss": -26.274988174438477, "global_step": 386681, "epoch": 4658} {"train_loss": -27.003376007080078, "global_step": 386682, "epoch": 4658} {"train_loss": -26.40215492248535, "global_step": 386683, "epoch": 4658} {"train_loss": -26.699934005737305, "global_step": 386684, "epoch": 4658} {"train_loss": -26.719928741455078, "global_step": 386685, "epoch": 4658} {"train_loss": -26.5128116607666, "global_step": 386686, "epoch": 4658} {"train_loss": -26.887603759765625, "global_step": 386687, "epoch": 4658} {"train_loss": -26.894433975219727, "global_step": 386688, "epoch": 4658} {"train_loss": -26.77284049987793, "global_step": 386689, "epoch": 4658} {"train_loss": -26.856687545776367, "global_step": 386690, "epoch": 4658} {"train_loss": -26.81904411315918, "global_step": 386691, "epoch": 4658} {"train_loss": -26.766889572143555, "global_step": 386692, "epoch": 4658} {"train_loss": -26.775165557861328, "global_step": 386693, "epoch": 4658} {"train_loss": -26.543676376342773, "global_step": 386694, "epoch": 4658} {"train_loss": -26.63746452331543, "global_step": 386695, "epoch": 4658} {"train_loss": -26.47912305808929, "global_step": 386696, "epoch": 4658, "val_loss": 6615010.5} {"train_loss": -25.788476943969727, "global_step": 386697, "epoch": 4659} {"train_loss": -25.985254287719727, "global_step": 386698, "epoch": 4659} {"train_loss": -26.108816146850586, "global_step": 386699, "epoch": 4659} {"train_loss": -26.398822784423828, "global_step": 386700, "epoch": 4659} {"train_loss": -26.21724510192871, "global_step": 386701, "epoch": 4659} {"train_loss": -26.430438995361328, "global_step": 386702, "epoch": 4659} {"train_loss": -26.26318359375, "global_step": 386703, "epoch": 4659} {"train_loss": -25.766925811767578, "global_step": 386704, "epoch": 4659} {"train_loss": -26.310388565063477, "global_step": 386705, "epoch": 4659} {"train_loss": -26.50360679626465, "global_step": 386706, "epoch": 4659} {"train_loss": -25.47947120666504, "global_step": 386707, "epoch": 4659} {"train_loss": -25.64035987854004, "global_step": 386708, "epoch": 4659} {"train_loss": -25.848142623901367, "global_step": 386709, "epoch": 4659} {"train_loss": -26.233068466186523, "global_step": 386710, "epoch": 4659} {"train_loss": -25.66517448425293, "global_step": 386711, "epoch": 4659} {"train_loss": -26.047611236572266, "global_step": 386712, "epoch": 4659} {"train_loss": -26.04791831970215, "global_step": 386713, "epoch": 4659} {"train_loss": -26.2255859375, "global_step": 386714, "epoch": 4659} {"train_loss": -26.304168701171875, "global_step": 386715, "epoch": 4659} {"train_loss": -26.011337280273438, "global_step": 386716, "epoch": 4659} {"train_loss": -26.177173614501953, "global_step": 386717, "epoch": 4659} {"train_loss": -26.17107582092285, "global_step": 386718, "epoch": 4659} {"train_loss": -25.85605239868164, "global_step": 386719, "epoch": 4659} {"train_loss": -25.80742835998535, "global_step": 386720, "epoch": 4659} {"train_loss": -26.58644676208496, "global_step": 386721, "epoch": 4659} {"train_loss": -26.314208984375, "global_step": 386722, "epoch": 4659} {"train_loss": -26.261518478393555, "global_step": 386723, "epoch": 4659} {"train_loss": -26.51423454284668, "global_step": 386724, "epoch": 4659} {"train_loss": -26.124969482421875, "global_step": 386725, "epoch": 4659} {"train_loss": -26.26093101501465, "global_step": 386726, "epoch": 4659} {"train_loss": -26.519433975219727, "global_step": 386727, "epoch": 4659} {"train_loss": -26.322742462158203, "global_step": 386728, "epoch": 4659} {"train_loss": -26.917272567749023, "global_step": 386729, "epoch": 4659} {"train_loss": -26.413467407226562, "global_step": 386730, "epoch": 4659} {"train_loss": -26.834156036376953, "global_step": 386731, "epoch": 4659} {"train_loss": -26.469465255737305, "global_step": 386732, "epoch": 4659} {"train_loss": -26.732349395751953, "global_step": 386733, "epoch": 4659} {"train_loss": -26.589399337768555, "global_step": 386734, "epoch": 4659} {"train_loss": -26.403949737548828, "global_step": 386735, "epoch": 4659} {"train_loss": -26.291675567626953, "global_step": 386736, "epoch": 4659} {"train_loss": -26.95830726623535, "global_step": 386737, "epoch": 4659} {"train_loss": -26.81464195251465, "global_step": 386738, "epoch": 4659} {"train_loss": -26.497312545776367, "global_step": 386739, "epoch": 4659} {"train_loss": -26.664722442626953, "global_step": 386740, "epoch": 4659} {"train_loss": -26.279327392578125, "global_step": 386741, "epoch": 4659} {"train_loss": -26.62652587890625, "global_step": 386742, "epoch": 4659} {"train_loss": -26.567829132080078, "global_step": 386743, "epoch": 4659} {"train_loss": -27.07209587097168, "global_step": 386744, "epoch": 4659} {"train_loss": -26.58808708190918, "global_step": 386745, "epoch": 4659} {"train_loss": -26.631620407104492, "global_step": 386746, "epoch": 4659} {"train_loss": -26.787128448486328, "global_step": 386747, "epoch": 4659} {"train_loss": -26.503034591674805, "global_step": 386748, "epoch": 4659} {"train_loss": -26.5257568359375, "global_step": 386749, "epoch": 4659} {"train_loss": -26.846942901611328, "global_step": 386750, "epoch": 4659} {"train_loss": -26.869205474853516, "global_step": 386751, "epoch": 4659} {"train_loss": -26.467039108276367, "global_step": 386752, "epoch": 4659} {"train_loss": -26.51881980895996, "global_step": 386753, "epoch": 4659} {"train_loss": -26.470502853393555, "global_step": 386754, "epoch": 4659} {"train_loss": -26.740219116210938, "global_step": 386755, "epoch": 4659} {"train_loss": -26.85645866394043, "global_step": 386756, "epoch": 4659} {"train_loss": -26.427265167236328, "global_step": 386757, "epoch": 4659} {"train_loss": -26.4768009185791, "global_step": 386758, "epoch": 4659} {"train_loss": -26.172048568725586, "global_step": 386759, "epoch": 4659} {"train_loss": -26.5721435546875, "global_step": 386760, "epoch": 4659} {"train_loss": -26.371509552001953, "global_step": 386761, "epoch": 4659} {"train_loss": -26.66082191467285, "global_step": 386762, "epoch": 4659} {"train_loss": -26.495328903198242, "global_step": 386763, "epoch": 4659} {"train_loss": -26.613311767578125, "global_step": 386764, "epoch": 4659} {"train_loss": -26.56103515625, "global_step": 386765, "epoch": 4659} {"train_loss": -26.460529327392578, "global_step": 386766, "epoch": 4659} {"train_loss": -26.88675880432129, "global_step": 386767, "epoch": 4659} {"train_loss": -26.372922897338867, "global_step": 386768, "epoch": 4659} {"train_loss": -26.598718643188477, "global_step": 386769, "epoch": 4659} {"train_loss": -26.405426025390625, "global_step": 386770, "epoch": 4659} {"train_loss": -26.129568099975586, "global_step": 386771, "epoch": 4659} {"train_loss": -26.6115779876709, "global_step": 386772, "epoch": 4659} {"train_loss": -26.740467071533203, "global_step": 386773, "epoch": 4659} {"train_loss": -26.961536407470703, "global_step": 386774, "epoch": 4659} {"train_loss": -26.74553871154785, "global_step": 386775, "epoch": 4659} {"train_loss": -26.635595321655273, "global_step": 386776, "epoch": 4659} {"train_loss": -26.6376895904541, "global_step": 386777, "epoch": 4659} {"train_loss": -26.24812126159668, "global_step": 386778, "epoch": 4659} {"train_loss": -26.41606657189059, "global_step": 386779, "epoch": 4659, "val_loss": 6589608.0} {"train_loss": -26.025299072265625, "global_step": 386780, "epoch": 4660} {"train_loss": -26.23151969909668, "global_step": 386781, "epoch": 4660} {"train_loss": -25.676334381103516, "global_step": 386782, "epoch": 4660} {"train_loss": -26.16143226623535, "global_step": 386783, "epoch": 4660} {"train_loss": -25.528512954711914, "global_step": 386784, "epoch": 4660} {"train_loss": -25.85816764831543, "global_step": 386785, "epoch": 4660} {"train_loss": -26.2360782623291, "global_step": 386786, "epoch": 4660} {"train_loss": -26.237293243408203, "global_step": 386787, "epoch": 4660} {"train_loss": -26.166650772094727, "global_step": 386788, "epoch": 4660} {"train_loss": -26.004352569580078, "global_step": 386789, "epoch": 4660} {"train_loss": -26.03118324279785, "global_step": 386790, "epoch": 4660} {"train_loss": -25.862756729125977, "global_step": 386791, "epoch": 4660} {"train_loss": -26.18352699279785, "global_step": 386792, "epoch": 4660} {"train_loss": -26.2666015625, "global_step": 386793, "epoch": 4660} {"train_loss": -26.4592227935791, "global_step": 386794, "epoch": 4660} {"train_loss": -26.42579460144043, "global_step": 386795, "epoch": 4660} {"train_loss": -26.158313751220703, "global_step": 386796, "epoch": 4660} {"train_loss": -26.01944351196289, "global_step": 386797, "epoch": 4660} {"train_loss": -26.329919815063477, "global_step": 386798, "epoch": 4660} {"train_loss": -26.16912269592285, "global_step": 386799, "epoch": 4660} {"train_loss": -26.362890243530273, "global_step": 386800, "epoch": 4660} {"train_loss": -26.549026489257812, "global_step": 386801, "epoch": 4660} {"train_loss": -25.9627685546875, "global_step": 386802, "epoch": 4660} {"train_loss": -26.74505615234375, "global_step": 386803, "epoch": 4660} {"train_loss": -26.491077423095703, "global_step": 386804, "epoch": 4660} {"train_loss": -26.13701820373535, "global_step": 386805, "epoch": 4660} {"train_loss": -26.6031436920166, "global_step": 386806, "epoch": 4660} {"train_loss": -26.454572677612305, "global_step": 386807, "epoch": 4660} {"train_loss": -26.11566162109375, "global_step": 386808, "epoch": 4660} {"train_loss": -26.633832931518555, "global_step": 386809, "epoch": 4660} {"train_loss": -26.49802589416504, "global_step": 386810, "epoch": 4660} {"train_loss": -26.264978408813477, "global_step": 386811, "epoch": 4660} {"train_loss": -26.543476104736328, "global_step": 386812, "epoch": 4660} {"train_loss": -26.6040096282959, "global_step": 386813, "epoch": 4660} {"train_loss": -26.26386833190918, "global_step": 386814, "epoch": 4660} {"train_loss": -26.368467330932617, "global_step": 386815, "epoch": 4660} {"train_loss": -26.90350341796875, "global_step": 386816, "epoch": 4660} {"train_loss": -26.782209396362305, "global_step": 386817, "epoch": 4660} {"train_loss": -26.32706069946289, "global_step": 386818, "epoch": 4660} {"train_loss": -26.632568359375, "global_step": 386819, "epoch": 4660} {"train_loss": -26.64645767211914, "global_step": 386820, "epoch": 4660} {"train_loss": -26.52972984313965, "global_step": 386821, "epoch": 4660} {"train_loss": -26.611379623413086, "global_step": 386822, "epoch": 4660} {"train_loss": -27.121740341186523, "global_step": 386823, "epoch": 4660} {"train_loss": -26.658727645874023, "global_step": 386824, "epoch": 4660} {"train_loss": -26.66547966003418, "global_step": 386825, "epoch": 4660} {"train_loss": -26.758569717407227, "global_step": 386826, "epoch": 4660} {"train_loss": -26.656890869140625, "global_step": 386827, "epoch": 4660} {"train_loss": -26.775344848632812, "global_step": 386828, "epoch": 4660} {"train_loss": -26.653467178344727, "global_step": 386829, "epoch": 4660} {"train_loss": -26.481037139892578, "global_step": 386830, "epoch": 4660} {"train_loss": -26.406768798828125, "global_step": 386831, "epoch": 4660} {"train_loss": -27.036184310913086, "global_step": 386832, "epoch": 4660} {"train_loss": -26.58710289001465, "global_step": 386833, "epoch": 4660} {"train_loss": -26.53253173828125, "global_step": 386834, "epoch": 4660} {"train_loss": -26.763961791992188, "global_step": 386835, "epoch": 4660} {"train_loss": -26.770856857299805, "global_step": 386836, "epoch": 4660} {"train_loss": -26.2922420501709, "global_step": 386837, "epoch": 4660} {"train_loss": -26.6367244720459, "global_step": 386838, "epoch": 4660} {"train_loss": -26.44707679748535, "global_step": 386839, "epoch": 4660} {"train_loss": -26.409006118774414, "global_step": 386840, "epoch": 4660} {"train_loss": -26.3826961517334, "global_step": 386841, "epoch": 4660} {"train_loss": -26.491580963134766, "global_step": 386842, "epoch": 4660} {"train_loss": -26.554931640625, "global_step": 386843, "epoch": 4660} {"train_loss": -26.602399826049805, "global_step": 386844, "epoch": 4660} {"train_loss": -26.455106735229492, "global_step": 386845, "epoch": 4660} {"train_loss": -26.6722412109375, "global_step": 386846, "epoch": 4660} {"train_loss": -26.205982208251953, "global_step": 386847, "epoch": 4660} {"train_loss": -26.069782257080078, "global_step": 386848, "epoch": 4660} {"train_loss": -26.384368896484375, "global_step": 386849, "epoch": 4660} {"train_loss": -26.208145141601562, "global_step": 386850, "epoch": 4660} {"train_loss": -26.44959831237793, "global_step": 386851, "epoch": 4660} {"train_loss": -26.320941925048828, "global_step": 386852, "epoch": 4660} {"train_loss": -26.350875854492188, "global_step": 386853, "epoch": 4660} {"train_loss": -26.75800132751465, "global_step": 386854, "epoch": 4660} {"train_loss": -26.6130313873291, "global_step": 386855, "epoch": 4660} {"train_loss": -26.645071029663086, "global_step": 386856, "epoch": 4660} {"train_loss": -26.376638412475586, "global_step": 386857, "epoch": 4660} {"train_loss": -26.9537353515625, "global_step": 386858, "epoch": 4660} {"train_loss": -26.36258316040039, "global_step": 386859, "epoch": 4660} {"train_loss": -26.374374389648438, "global_step": 386860, "epoch": 4660} {"train_loss": -26.544281005859375, "global_step": 386861, "epoch": 4660} {"train_loss": -26.42104194824954, "global_step": 386862, "epoch": 4660, "val_loss": 6572031.0} {"train_loss": -25.758798599243164, "global_step": 386863, "epoch": 4661} {"train_loss": -25.890064239501953, "global_step": 386864, "epoch": 4661} {"train_loss": -26.28936195373535, "global_step": 386865, "epoch": 4661} {"train_loss": -26.000513076782227, "global_step": 386866, "epoch": 4661} {"train_loss": -26.174060821533203, "global_step": 386867, "epoch": 4661} {"train_loss": -26.187467575073242, "global_step": 386868, "epoch": 4661} {"train_loss": -25.873184204101562, "global_step": 386869, "epoch": 4661} {"train_loss": -26.239973068237305, "global_step": 386870, "epoch": 4661} {"train_loss": -26.091833114624023, "global_step": 386871, "epoch": 4661} {"train_loss": -26.072233200073242, "global_step": 386872, "epoch": 4661} {"train_loss": -25.99042320251465, "global_step": 386873, "epoch": 4661} {"train_loss": -25.944257736206055, "global_step": 386874, "epoch": 4661} {"train_loss": -26.269977569580078, "global_step": 386875, "epoch": 4661} {"train_loss": -26.241546630859375, "global_step": 386876, "epoch": 4661} {"train_loss": -26.42172622680664, "global_step": 386877, "epoch": 4661} {"train_loss": -26.57845115661621, "global_step": 386878, "epoch": 4661} {"train_loss": -26.723596572875977, "global_step": 386879, "epoch": 4661} {"train_loss": -26.293867111206055, "global_step": 386880, "epoch": 4661} {"train_loss": -26.405088424682617, "global_step": 386881, "epoch": 4661} {"train_loss": -26.578336715698242, "global_step": 386882, "epoch": 4661} {"train_loss": -26.53255271911621, "global_step": 386883, "epoch": 4661} {"train_loss": -26.350584030151367, "global_step": 386884, "epoch": 4661} {"train_loss": -26.343292236328125, "global_step": 386885, "epoch": 4661} {"train_loss": -26.710702896118164, "global_step": 386886, "epoch": 4661} {"train_loss": -26.758615493774414, "global_step": 386887, "epoch": 4661} {"train_loss": -26.65234375, "global_step": 386888, "epoch": 4661} {"train_loss": -26.696714401245117, "global_step": 386889, "epoch": 4661} {"train_loss": -26.834440231323242, "global_step": 386890, "epoch": 4661} {"train_loss": -26.75449562072754, "global_step": 386891, "epoch": 4661} {"train_loss": -26.736328125, "global_step": 386892, "epoch": 4661} {"train_loss": -26.74903678894043, "global_step": 386893, "epoch": 4661} {"train_loss": -26.703292846679688, "global_step": 386894, "epoch": 4661} {"train_loss": -26.67279624938965, "global_step": 386895, "epoch": 4661} {"train_loss": -26.280719757080078, "global_step": 386896, "epoch": 4661} {"train_loss": -26.51055908203125, "global_step": 386897, "epoch": 4661} {"train_loss": -26.317020416259766, "global_step": 386898, "epoch": 4661} {"train_loss": -26.834802627563477, "global_step": 386899, "epoch": 4661} {"train_loss": -26.5699405670166, "global_step": 386900, "epoch": 4661} {"train_loss": -26.9975528717041, "global_step": 386901, "epoch": 4661} {"train_loss": -26.624317169189453, "global_step": 386902, "epoch": 4661} {"train_loss": -26.493017196655273, "global_step": 386903, "epoch": 4661} {"train_loss": -26.658771514892578, "global_step": 386904, "epoch": 4661} {"train_loss": -26.939224243164062, "global_step": 386905, "epoch": 4661} {"train_loss": -26.88788414001465, "global_step": 386906, "epoch": 4661} {"train_loss": -27.063879013061523, "global_step": 386907, "epoch": 4661} {"train_loss": -26.6823673248291, "global_step": 386908, "epoch": 4661} {"train_loss": -26.8002872467041, "global_step": 386909, "epoch": 4661} {"train_loss": -26.17799949645996, "global_step": 386910, "epoch": 4661} {"train_loss": -25.6546573638916, "global_step": 386911, "epoch": 4661} {"train_loss": -25.697412490844727, "global_step": 386912, "epoch": 4661} {"train_loss": -25.81259536743164, "global_step": 386913, "epoch": 4661} {"train_loss": -26.21196937561035, "global_step": 386914, "epoch": 4661} {"train_loss": -25.642980575561523, "global_step": 386915, "epoch": 4661} {"train_loss": -25.51512908935547, "global_step": 386916, "epoch": 4661} {"train_loss": -24.894697189331055, "global_step": 386917, "epoch": 4661} {"train_loss": -25.632177352905273, "global_step": 386918, "epoch": 4661} {"train_loss": -25.967370986938477, "global_step": 386919, "epoch": 4661} {"train_loss": -25.876501083374023, "global_step": 386920, "epoch": 4661} {"train_loss": -26.20918083190918, "global_step": 386921, "epoch": 4661} {"train_loss": -25.7130069732666, "global_step": 386922, "epoch": 4661} {"train_loss": -25.670312881469727, "global_step": 386923, "epoch": 4661} {"train_loss": -25.762922286987305, "global_step": 386924, "epoch": 4661} {"train_loss": -26.09147071838379, "global_step": 386925, "epoch": 4661} {"train_loss": -26.058950424194336, "global_step": 386926, "epoch": 4661} {"train_loss": -26.390766143798828, "global_step": 386927, "epoch": 4661} {"train_loss": -26.43867301940918, "global_step": 386928, "epoch": 4661} {"train_loss": -26.4377498626709, "global_step": 386929, "epoch": 4661} {"train_loss": -26.416889190673828, "global_step": 386930, "epoch": 4661} {"train_loss": -26.542957305908203, "global_step": 386931, "epoch": 4661} {"train_loss": -26.154306411743164, "global_step": 386932, "epoch": 4661} {"train_loss": -26.068838119506836, "global_step": 386933, "epoch": 4661} {"train_loss": -26.342870712280273, "global_step": 386934, "epoch": 4661} {"train_loss": -26.36187744140625, "global_step": 386935, "epoch": 4661} {"train_loss": -26.312997817993164, "global_step": 386936, "epoch": 4661} {"train_loss": -26.393991470336914, "global_step": 386937, "epoch": 4661} {"train_loss": -26.824432373046875, "global_step": 386938, "epoch": 4661} {"train_loss": -26.466796875, "global_step": 386939, "epoch": 4661} {"train_loss": -26.781423568725586, "global_step": 386940, "epoch": 4661} {"train_loss": -26.70230484008789, "global_step": 386941, "epoch": 4661} {"train_loss": -26.375951766967773, "global_step": 386942, "epoch": 4661} {"train_loss": -26.754926681518555, "global_step": 386943, "epoch": 4661} {"train_loss": -26.24671745300293, "global_step": 386944, "epoch": 4661} {"train_loss": -26.306646714727563, "global_step": 386945, "epoch": 4661, "val_loss": 6587710.0} {"train_loss": -26.32427406311035, "global_step": 386946, "epoch": 4662} {"train_loss": -26.0662841796875, "global_step": 386947, "epoch": 4662} {"train_loss": -26.324899673461914, "global_step": 386948, "epoch": 4662} {"train_loss": -26.166915893554688, "global_step": 386949, "epoch": 4662} {"train_loss": -26.254867553710938, "global_step": 386950, "epoch": 4662} {"train_loss": -26.31800651550293, "global_step": 386951, "epoch": 4662} {"train_loss": -25.899927139282227, "global_step": 386952, "epoch": 4662} {"train_loss": -26.27509117126465, "global_step": 386953, "epoch": 4662} {"train_loss": -26.454313278198242, "global_step": 386954, "epoch": 4662} {"train_loss": -26.507598876953125, "global_step": 386955, "epoch": 4662} {"train_loss": -26.415409088134766, "global_step": 386956, "epoch": 4662} {"train_loss": -26.538650512695312, "global_step": 386957, "epoch": 4662} {"train_loss": -26.2442684173584, "global_step": 386958, "epoch": 4662} {"train_loss": -26.254852294921875, "global_step": 386959, "epoch": 4662} {"train_loss": -26.366003036499023, "global_step": 386960, "epoch": 4662} {"train_loss": -26.3928279876709, "global_step": 386961, "epoch": 4662} {"train_loss": -26.418630599975586, "global_step": 386962, "epoch": 4662} {"train_loss": -26.46827507019043, "global_step": 386963, "epoch": 4662} {"train_loss": -26.59711265563965, "global_step": 386964, "epoch": 4662} {"train_loss": -26.50300407409668, "global_step": 386965, "epoch": 4662} {"train_loss": -26.553281784057617, "global_step": 386966, "epoch": 4662} {"train_loss": -26.131378173828125, "global_step": 386967, "epoch": 4662} {"train_loss": -26.312671661376953, "global_step": 386968, "epoch": 4662} {"train_loss": -26.813446044921875, "global_step": 386969, "epoch": 4662} {"train_loss": -26.511816024780273, "global_step": 386970, "epoch": 4662} {"train_loss": -26.68155288696289, "global_step": 386971, "epoch": 4662} {"train_loss": -26.741544723510742, "global_step": 386972, "epoch": 4662} {"train_loss": -26.663366317749023, "global_step": 386973, "epoch": 4662} {"train_loss": -26.660888671875, "global_step": 386974, "epoch": 4662} {"train_loss": -26.82830810546875, "global_step": 386975, "epoch": 4662} {"train_loss": -26.2324161529541, "global_step": 386976, "epoch": 4662} {"train_loss": -26.655181884765625, "global_step": 386977, "epoch": 4662} {"train_loss": -26.5242862701416, "global_step": 386978, "epoch": 4662} {"train_loss": -26.931116104125977, "global_step": 386979, "epoch": 4662} {"train_loss": -26.694625854492188, "global_step": 386980, "epoch": 4662} {"train_loss": -26.36835289001465, "global_step": 386981, "epoch": 4662} {"train_loss": -26.707962036132812, "global_step": 386982, "epoch": 4662} {"train_loss": -26.5942325592041, "global_step": 386983, "epoch": 4662} {"train_loss": -26.728546142578125, "global_step": 386984, "epoch": 4662} {"train_loss": -26.92424964904785, "global_step": 386985, "epoch": 4662} {"train_loss": -26.685407638549805, "global_step": 386986, "epoch": 4662} {"train_loss": -26.38850212097168, "global_step": 386987, "epoch": 4662} {"train_loss": -26.43366813659668, "global_step": 386988, "epoch": 4662} {"train_loss": -26.268085479736328, "global_step": 386989, "epoch": 4662} {"train_loss": -26.713077545166016, "global_step": 386990, "epoch": 4662} {"train_loss": -26.117597579956055, "global_step": 386991, "epoch": 4662} {"train_loss": -26.44331169128418, "global_step": 386992, "epoch": 4662} {"train_loss": -26.1534481048584, "global_step": 386993, "epoch": 4662} {"train_loss": -25.76730728149414, "global_step": 386994, "epoch": 4662} {"train_loss": -26.231225967407227, "global_step": 386995, "epoch": 4662} {"train_loss": -26.558826446533203, "global_step": 386996, "epoch": 4662} {"train_loss": -26.149768829345703, "global_step": 386997, "epoch": 4662} {"train_loss": -26.19293785095215, "global_step": 386998, "epoch": 4662} {"train_loss": -26.211896896362305, "global_step": 386999, "epoch": 4662} {"train_loss": -26.648839950561523, "global_step": 387000, "epoch": 4662} {"train_loss": -26.360807418823242, "global_step": 387001, "epoch": 4662} {"train_loss": -25.962268829345703, "global_step": 387002, "epoch": 4662} {"train_loss": -26.434253692626953, "global_step": 387003, "epoch": 4662} {"train_loss": -26.024744033813477, "global_step": 387004, "epoch": 4662} {"train_loss": -26.288345336914062, "global_step": 387005, "epoch": 4662} {"train_loss": -26.532886505126953, "global_step": 387006, "epoch": 4662} {"train_loss": -26.622961044311523, "global_step": 387007, "epoch": 4662} {"train_loss": -26.02031898498535, "global_step": 387008, "epoch": 4662} {"train_loss": -26.263290405273438, "global_step": 387009, "epoch": 4662} {"train_loss": -26.544879913330078, "global_step": 387010, "epoch": 4662} {"train_loss": -26.097522735595703, "global_step": 387011, "epoch": 4662} {"train_loss": -26.475080490112305, "global_step": 387012, "epoch": 4662} {"train_loss": -26.469629287719727, "global_step": 387013, "epoch": 4662} {"train_loss": -26.528554916381836, "global_step": 387014, "epoch": 4662} {"train_loss": -26.007492065429688, "global_step": 387015, "epoch": 4662} {"train_loss": -26.459280014038086, "global_step": 387016, "epoch": 4662} {"train_loss": -26.77310562133789, "global_step": 387017, "epoch": 4662} {"train_loss": -27.00381851196289, "global_step": 387018, "epoch": 4662} {"train_loss": -27.008625030517578, "global_step": 387019, "epoch": 4662} {"train_loss": -26.419172286987305, "global_step": 387020, "epoch": 4662} {"train_loss": -26.412763595581055, "global_step": 387021, "epoch": 4662} {"train_loss": -26.841129302978516, "global_step": 387022, "epoch": 4662} {"train_loss": -26.571857452392578, "global_step": 387023, "epoch": 4662} {"train_loss": -26.526819229125977, "global_step": 387024, "epoch": 4662} {"train_loss": -26.3271541595459, "global_step": 387025, "epoch": 4662} {"train_loss": -26.512149810791016, "global_step": 387026, "epoch": 4662} {"train_loss": -26.627700805664062, "global_step": 387027, "epoch": 4662} {"train_loss": -26.445389092686664, "global_step": 387028, "epoch": 4662, "val_loss": 6574877.0} {"train_loss": -26.158599853515625, "global_step": 387029, "epoch": 4663} {"train_loss": -25.776721954345703, "global_step": 387030, "epoch": 4663} {"train_loss": -26.129230499267578, "global_step": 387031, "epoch": 4663} {"train_loss": -25.332794189453125, "global_step": 387032, "epoch": 4663} {"train_loss": -25.585723876953125, "global_step": 387033, "epoch": 4663} {"train_loss": -26.14802360534668, "global_step": 387034, "epoch": 4663} {"train_loss": -26.300582885742188, "global_step": 387035, "epoch": 4663} {"train_loss": -26.26665687561035, "global_step": 387036, "epoch": 4663} {"train_loss": -26.444339752197266, "global_step": 387037, "epoch": 4663} {"train_loss": -26.393177032470703, "global_step": 387038, "epoch": 4663} {"train_loss": -26.193302154541016, "global_step": 387039, "epoch": 4663} {"train_loss": -26.205184936523438, "global_step": 387040, "epoch": 4663} {"train_loss": -26.29278564453125, "global_step": 387041, "epoch": 4663} {"train_loss": -26.39780616760254, "global_step": 387042, "epoch": 4663} {"train_loss": -26.17939567565918, "global_step": 387043, "epoch": 4663} {"train_loss": -26.29022216796875, "global_step": 387044, "epoch": 4663} {"train_loss": -26.248672485351562, "global_step": 387045, "epoch": 4663} {"train_loss": -26.15447998046875, "global_step": 387046, "epoch": 4663} {"train_loss": -26.074853897094727, "global_step": 387047, "epoch": 4663} {"train_loss": -26.00492286682129, "global_step": 387048, "epoch": 4663} {"train_loss": -26.343637466430664, "global_step": 387049, "epoch": 4663} {"train_loss": -26.2431583404541, "global_step": 387050, "epoch": 4663} {"train_loss": -26.41635513305664, "global_step": 387051, "epoch": 4663} {"train_loss": -26.30720329284668, "global_step": 387052, "epoch": 4663} {"train_loss": -26.40131950378418, "global_step": 387053, "epoch": 4663} {"train_loss": -26.388418197631836, "global_step": 387054, "epoch": 4663} {"train_loss": -26.72882652282715, "global_step": 387055, "epoch": 4663} {"train_loss": -26.942243576049805, "global_step": 387056, "epoch": 4663} {"train_loss": -26.519678115844727, "global_step": 387057, "epoch": 4663} {"train_loss": -26.41156005859375, "global_step": 387058, "epoch": 4663} {"train_loss": -26.656818389892578, "global_step": 387059, "epoch": 4663} {"train_loss": -26.31746482849121, "global_step": 387060, "epoch": 4663} {"train_loss": -26.588476181030273, "global_step": 387061, "epoch": 4663} {"train_loss": -26.68678092956543, "global_step": 387062, "epoch": 4663} {"train_loss": -26.727767944335938, "global_step": 387063, "epoch": 4663} {"train_loss": -26.557172775268555, "global_step": 387064, "epoch": 4663} {"train_loss": -26.54816246032715, "global_step": 387065, "epoch": 4663} {"train_loss": -26.360498428344727, "global_step": 387066, "epoch": 4663} {"train_loss": -26.488996505737305, "global_step": 387067, "epoch": 4663} {"train_loss": -26.61638832092285, "global_step": 387068, "epoch": 4663} {"train_loss": -26.8098201751709, "global_step": 387069, "epoch": 4663} {"train_loss": -26.6347713470459, "global_step": 387070, "epoch": 4663} {"train_loss": -26.400848388671875, "global_step": 387071, "epoch": 4663} {"train_loss": -26.40854835510254, "global_step": 387072, "epoch": 4663} {"train_loss": -26.580854415893555, "global_step": 387073, "epoch": 4663} {"train_loss": -26.395994186401367, "global_step": 387074, "epoch": 4663} {"train_loss": -26.455307006835938, "global_step": 387075, "epoch": 4663} {"train_loss": -26.411136627197266, "global_step": 387076, "epoch": 4663} {"train_loss": -26.459980010986328, "global_step": 387077, "epoch": 4663} {"train_loss": -26.628732681274414, "global_step": 387078, "epoch": 4663} {"train_loss": -26.52068519592285, "global_step": 387079, "epoch": 4663} {"train_loss": -26.768386840820312, "global_step": 387080, "epoch": 4663} {"train_loss": -26.8941650390625, "global_step": 387081, "epoch": 4663} {"train_loss": -26.688129425048828, "global_step": 387082, "epoch": 4663} {"train_loss": -26.83658218383789, "global_step": 387083, "epoch": 4663} {"train_loss": -27.0891170501709, "global_step": 387084, "epoch": 4663} {"train_loss": -26.27668571472168, "global_step": 387085, "epoch": 4663} {"train_loss": -26.554641723632812, "global_step": 387086, "epoch": 4663} {"train_loss": -26.391489028930664, "global_step": 387087, "epoch": 4663} {"train_loss": -26.59894371032715, "global_step": 387088, "epoch": 4663} {"train_loss": -26.933332443237305, "global_step": 387089, "epoch": 4663} {"train_loss": -26.30134391784668, "global_step": 387090, "epoch": 4663} {"train_loss": -26.55328941345215, "global_step": 387091, "epoch": 4663} {"train_loss": -26.713367462158203, "global_step": 387092, "epoch": 4663} {"train_loss": -26.62459373474121, "global_step": 387093, "epoch": 4663} {"train_loss": -26.291410446166992, "global_step": 387094, "epoch": 4663} {"train_loss": -26.41021728515625, "global_step": 387095, "epoch": 4663} {"train_loss": -26.854446411132812, "global_step": 387096, "epoch": 4663} {"train_loss": -26.204370498657227, "global_step": 387097, "epoch": 4663} {"train_loss": -26.514835357666016, "global_step": 387098, "epoch": 4663} {"train_loss": -26.782026290893555, "global_step": 387099, "epoch": 4663} {"train_loss": -26.443220138549805, "global_step": 387100, "epoch": 4663} {"train_loss": -26.6661434173584, "global_step": 387101, "epoch": 4663} {"train_loss": -26.53759765625, "global_step": 387102, "epoch": 4663} {"train_loss": -26.604877471923828, "global_step": 387103, "epoch": 4663} {"train_loss": -26.619327545166016, "global_step": 387104, "epoch": 4663} {"train_loss": -26.652612686157227, "global_step": 387105, "epoch": 4663} {"train_loss": -26.424856185913086, "global_step": 387106, "epoch": 4663} {"train_loss": -26.507925033569336, "global_step": 387107, "epoch": 4663} {"train_loss": -26.736265182495117, "global_step": 387108, "epoch": 4663} {"train_loss": -26.665098190307617, "global_step": 387109, "epoch": 4663} {"train_loss": -26.38214683532715, "global_step": 387110, "epoch": 4663} {"train_loss": -26.454128977764082, "global_step": 387111, "epoch": 4663, "val_loss": 6625498.0} {"train_loss": -25.6851749420166, "global_step": 387112, "epoch": 4664} {"train_loss": -25.61200523376465, "global_step": 387113, "epoch": 4664} {"train_loss": -25.80902671813965, "global_step": 387114, "epoch": 4664} {"train_loss": -25.851926803588867, "global_step": 387115, "epoch": 4664} {"train_loss": -26.28131675720215, "global_step": 387116, "epoch": 4664} {"train_loss": -25.94141960144043, "global_step": 387117, "epoch": 4664} {"train_loss": -26.083669662475586, "global_step": 387118, "epoch": 4664} {"train_loss": -25.871973037719727, "global_step": 387119, "epoch": 4664} {"train_loss": -25.63956642150879, "global_step": 387120, "epoch": 4664} {"train_loss": -26.182050704956055, "global_step": 387121, "epoch": 4664} {"train_loss": -26.41352653503418, "global_step": 387122, "epoch": 4664} {"train_loss": -26.218046188354492, "global_step": 387123, "epoch": 4664} {"train_loss": -26.048187255859375, "global_step": 387124, "epoch": 4664} {"train_loss": -25.69733238220215, "global_step": 387125, "epoch": 4664} {"train_loss": -26.118261337280273, "global_step": 387126, "epoch": 4664} {"train_loss": -26.5559024810791, "global_step": 387127, "epoch": 4664} {"train_loss": -26.030780792236328, "global_step": 387128, "epoch": 4664} {"train_loss": -26.153451919555664, "global_step": 387129, "epoch": 4664} {"train_loss": -26.48016357421875, "global_step": 387130, "epoch": 4664} {"train_loss": -26.3657283782959, "global_step": 387131, "epoch": 4664} {"train_loss": -26.125476837158203, "global_step": 387132, "epoch": 4664} {"train_loss": -26.542877197265625, "global_step": 387133, "epoch": 4664} {"train_loss": -26.53382682800293, "global_step": 387134, "epoch": 4664} {"train_loss": -26.482227325439453, "global_step": 387135, "epoch": 4664} {"train_loss": -26.487030029296875, "global_step": 387136, "epoch": 4664} {"train_loss": -26.706445693969727, "global_step": 387137, "epoch": 4664} {"train_loss": -26.19708824157715, "global_step": 387138, "epoch": 4664} {"train_loss": -26.2976016998291, "global_step": 387139, "epoch": 4664} {"train_loss": -26.41700553894043, "global_step": 387140, "epoch": 4664} {"train_loss": -26.527603149414062, "global_step": 387141, "epoch": 4664} {"train_loss": -26.4167537689209, "global_step": 387142, "epoch": 4664} {"train_loss": -26.415241241455078, "global_step": 387143, "epoch": 4664} {"train_loss": -26.406660079956055, "global_step": 387144, "epoch": 4664} {"train_loss": -26.254932403564453, "global_step": 387145, "epoch": 4664} {"train_loss": -26.32661247253418, "global_step": 387146, "epoch": 4664} {"train_loss": -26.56251335144043, "global_step": 387147, "epoch": 4664} {"train_loss": -26.773895263671875, "global_step": 387148, "epoch": 4664} {"train_loss": -26.357086181640625, "global_step": 387149, "epoch": 4664} {"train_loss": -26.503585815429688, "global_step": 387150, "epoch": 4664} {"train_loss": -26.80829429626465, "global_step": 387151, "epoch": 4664} {"train_loss": -26.525177001953125, "global_step": 387152, "epoch": 4664} {"train_loss": -26.971166610717773, "global_step": 387153, "epoch": 4664} {"train_loss": -26.915515899658203, "global_step": 387154, "epoch": 4664} {"train_loss": -26.20900535583496, "global_step": 387155, "epoch": 4664} {"train_loss": -26.6881046295166, "global_step": 387156, "epoch": 4664} {"train_loss": -26.204648971557617, "global_step": 387157, "epoch": 4664} {"train_loss": -26.602554321289062, "global_step": 387158, "epoch": 4664} {"train_loss": -26.364013671875, "global_step": 387159, "epoch": 4664} {"train_loss": -26.44545555114746, "global_step": 387160, "epoch": 4664} {"train_loss": -25.96345329284668, "global_step": 387161, "epoch": 4664} {"train_loss": -26.187591552734375, "global_step": 387162, "epoch": 4664} {"train_loss": -26.4448299407959, "global_step": 387163, "epoch": 4664} {"train_loss": -26.841699600219727, "global_step": 387164, "epoch": 4664} {"train_loss": -26.742633819580078, "global_step": 387165, "epoch": 4664} {"train_loss": -26.260009765625, "global_step": 387166, "epoch": 4664} {"train_loss": -26.117368698120117, "global_step": 387167, "epoch": 4664} {"train_loss": -26.299854278564453, "global_step": 387168, "epoch": 4664} {"train_loss": -26.675525665283203, "global_step": 387169, "epoch": 4664} {"train_loss": -26.419036865234375, "global_step": 387170, "epoch": 4664} {"train_loss": -26.356800079345703, "global_step": 387171, "epoch": 4664} {"train_loss": -26.18442153930664, "global_step": 387172, "epoch": 4664} {"train_loss": -26.460241317749023, "global_step": 387173, "epoch": 4664} {"train_loss": -26.498870849609375, "global_step": 387174, "epoch": 4664} {"train_loss": -26.51702880859375, "global_step": 387175, "epoch": 4664} {"train_loss": -26.330509185791016, "global_step": 387176, "epoch": 4664} {"train_loss": -26.23642349243164, "global_step": 387177, "epoch": 4664} {"train_loss": -26.6269474029541, "global_step": 387178, "epoch": 4664} {"train_loss": -26.01356315612793, "global_step": 387179, "epoch": 4664} {"train_loss": -26.5583438873291, "global_step": 387180, "epoch": 4664} {"train_loss": -26.5928955078125, "global_step": 387181, "epoch": 4664} {"train_loss": -26.51302146911621, "global_step": 387182, "epoch": 4664} {"train_loss": -26.194910049438477, "global_step": 387183, "epoch": 4664} {"train_loss": -26.23023796081543, "global_step": 387184, "epoch": 4664} {"train_loss": -26.599210739135742, "global_step": 387185, "epoch": 4664} {"train_loss": -26.135656356811523, "global_step": 387186, "epoch": 4664} {"train_loss": -26.54182243347168, "global_step": 387187, "epoch": 4664} {"train_loss": -26.54876708984375, "global_step": 387188, "epoch": 4664} {"train_loss": -26.400739669799805, "global_step": 387189, "epoch": 4664} {"train_loss": -26.73858642578125, "global_step": 387190, "epoch": 4664} {"train_loss": -26.5534610748291, "global_step": 387191, "epoch": 4664} {"train_loss": -26.46646499633789, "global_step": 387192, "epoch": 4664} {"train_loss": -26.523578643798828, "global_step": 387193, "epoch": 4664} {"train_loss": -26.335685316338598, "global_step": 387194, "epoch": 4664, "val_loss": 6579472.5} {"train_loss": -25.722867965698242, "global_step": 387195, "epoch": 4665} {"train_loss": -26.33757972717285, "global_step": 387196, "epoch": 4665} {"train_loss": -26.484262466430664, "global_step": 387197, "epoch": 4665} {"train_loss": -25.883289337158203, "global_step": 387198, "epoch": 4665} {"train_loss": -25.5855712890625, "global_step": 387199, "epoch": 4665} {"train_loss": -26.20770263671875, "global_step": 387200, "epoch": 4665} {"train_loss": -26.101398468017578, "global_step": 387201, "epoch": 4665} {"train_loss": -26.36249351501465, "global_step": 387202, "epoch": 4665} {"train_loss": -26.258575439453125, "global_step": 387203, "epoch": 4665} {"train_loss": -26.134521484375, "global_step": 387204, "epoch": 4665} {"train_loss": -26.59173011779785, "global_step": 387205, "epoch": 4665} {"train_loss": -26.575855255126953, "global_step": 387206, "epoch": 4665} {"train_loss": -26.112390518188477, "global_step": 387207, "epoch": 4665} {"train_loss": -26.19862174987793, "global_step": 387208, "epoch": 4665} {"train_loss": -25.976715087890625, "global_step": 387209, "epoch": 4665} {"train_loss": -26.390233993530273, "global_step": 387210, "epoch": 4665} {"train_loss": -26.868494033813477, "global_step": 387211, "epoch": 4665} {"train_loss": -26.073200225830078, "global_step": 387212, "epoch": 4665} {"train_loss": -26.565723419189453, "global_step": 387213, "epoch": 4665} {"train_loss": -26.30490493774414, "global_step": 387214, "epoch": 4665} {"train_loss": -26.599109649658203, "global_step": 387215, "epoch": 4665} {"train_loss": -26.411041259765625, "global_step": 387216, "epoch": 4665} {"train_loss": -26.2707576751709, "global_step": 387217, "epoch": 4665} {"train_loss": -26.80440330505371, "global_step": 387218, "epoch": 4665} {"train_loss": -26.8092098236084, "global_step": 387219, "epoch": 4665} {"train_loss": -26.637226104736328, "global_step": 387220, "epoch": 4665} {"train_loss": -26.47576332092285, "global_step": 387221, "epoch": 4665} {"train_loss": -26.67011070251465, "global_step": 387222, "epoch": 4665} {"train_loss": -26.2208251953125, "global_step": 387223, "epoch": 4665} {"train_loss": -26.246362686157227, "global_step": 387224, "epoch": 4665} {"train_loss": -26.350305557250977, "global_step": 387225, "epoch": 4665} {"train_loss": -26.429920196533203, "global_step": 387226, "epoch": 4665} {"train_loss": -26.333236694335938, "global_step": 387227, "epoch": 4665} {"train_loss": -26.8330020904541, "global_step": 387228, "epoch": 4665} {"train_loss": -26.68169593811035, "global_step": 387229, "epoch": 4665} {"train_loss": -26.4117431640625, "global_step": 387230, "epoch": 4665} {"train_loss": -26.08107566833496, "global_step": 387231, "epoch": 4665} {"train_loss": -26.441099166870117, "global_step": 387232, "epoch": 4665} {"train_loss": -26.6812686920166, "global_step": 387233, "epoch": 4665} {"train_loss": -26.492521286010742, "global_step": 387234, "epoch": 4665} {"train_loss": -26.359922409057617, "global_step": 387235, "epoch": 4665} {"train_loss": -26.125579833984375, "global_step": 387236, "epoch": 4665} {"train_loss": -26.243330001831055, "global_step": 387237, "epoch": 4665} {"train_loss": -26.561304092407227, "global_step": 387238, "epoch": 4665} {"train_loss": -26.291418075561523, "global_step": 387239, "epoch": 4665} {"train_loss": -26.361486434936523, "global_step": 387240, "epoch": 4665} {"train_loss": -26.6151180267334, "global_step": 387241, "epoch": 4665} {"train_loss": -26.442081451416016, "global_step": 387242, "epoch": 4665} {"train_loss": -26.67510414123535, "global_step": 387243, "epoch": 4665} {"train_loss": -26.574188232421875, "global_step": 387244, "epoch": 4665} {"train_loss": -26.516433715820312, "global_step": 387245, "epoch": 4665} {"train_loss": -26.203168869018555, "global_step": 387246, "epoch": 4665} {"train_loss": -26.37007713317871, "global_step": 387247, "epoch": 4665} {"train_loss": -26.55616569519043, "global_step": 387248, "epoch": 4665} {"train_loss": -26.298376083374023, "global_step": 387249, "epoch": 4665} {"train_loss": -26.39792823791504, "global_step": 387250, "epoch": 4665} {"train_loss": -26.576873779296875, "global_step": 387251, "epoch": 4665} {"train_loss": -26.34217643737793, "global_step": 387252, "epoch": 4665} {"train_loss": -26.6857967376709, "global_step": 387253, "epoch": 4665} {"train_loss": -26.471906661987305, "global_step": 387254, "epoch": 4665} {"train_loss": -26.5794620513916, "global_step": 387255, "epoch": 4665} {"train_loss": -26.3320369720459, "global_step": 387256, "epoch": 4665} {"train_loss": -25.8710994720459, "global_step": 387257, "epoch": 4665} {"train_loss": -26.52796745300293, "global_step": 387258, "epoch": 4665} {"train_loss": -26.414453506469727, "global_step": 387259, "epoch": 4665} {"train_loss": -26.6036319732666, "global_step": 387260, "epoch": 4665} {"train_loss": -26.236486434936523, "global_step": 387261, "epoch": 4665} {"train_loss": -25.626874923706055, "global_step": 387262, "epoch": 4665} {"train_loss": -25.497102737426758, "global_step": 387263, "epoch": 4665} {"train_loss": -25.70122718811035, "global_step": 387264, "epoch": 4665} {"train_loss": -25.9365177154541, "global_step": 387265, "epoch": 4665} {"train_loss": -26.37714195251465, "global_step": 387266, "epoch": 4665} {"train_loss": -25.905670166015625, "global_step": 387267, "epoch": 4665} {"train_loss": -26.348596572875977, "global_step": 387268, "epoch": 4665} {"train_loss": -25.953012466430664, "global_step": 387269, "epoch": 4665} {"train_loss": -26.841474533081055, "global_step": 387270, "epoch": 4665} {"train_loss": -26.324743270874023, "global_step": 387271, "epoch": 4665} {"train_loss": -26.32512855529785, "global_step": 387272, "epoch": 4665} {"train_loss": -26.5550537109375, "global_step": 387273, "epoch": 4665} {"train_loss": -26.2734432220459, "global_step": 387274, "epoch": 4665} {"train_loss": -26.503263473510742, "global_step": 387275, "epoch": 4665} {"train_loss": -26.155780792236328, "global_step": 387276, "epoch": 4665} {"train_loss": -26.338144072567125, "global_step": 387277, "epoch": 4665, "val_loss": 6629767.0} {"train_loss": -24.921646118164062, "global_step": 387278, "epoch": 4666} {"train_loss": -25.079309463500977, "global_step": 387279, "epoch": 4666} {"train_loss": -25.549137115478516, "global_step": 387280, "epoch": 4666} {"train_loss": -25.938039779663086, "global_step": 387281, "epoch": 4666} {"train_loss": -24.391468048095703, "global_step": 387282, "epoch": 4666} {"train_loss": -25.581878662109375, "global_step": 387283, "epoch": 4666} {"train_loss": -25.68341064453125, "global_step": 387284, "epoch": 4666} {"train_loss": -25.956069946289062, "global_step": 387285, "epoch": 4666} {"train_loss": -26.1118221282959, "global_step": 387286, "epoch": 4666} {"train_loss": -25.7264404296875, "global_step": 387287, "epoch": 4666} {"train_loss": -25.826828002929688, "global_step": 387288, "epoch": 4666} {"train_loss": -25.9583683013916, "global_step": 387289, "epoch": 4666} {"train_loss": -26.23714256286621, "global_step": 387290, "epoch": 4666} {"train_loss": -26.105636596679688, "global_step": 387291, "epoch": 4666} {"train_loss": -26.19036293029785, "global_step": 387292, "epoch": 4666} {"train_loss": -26.12445640563965, "global_step": 387293, "epoch": 4666} {"train_loss": -26.024383544921875, "global_step": 387294, "epoch": 4666} {"train_loss": -25.841781616210938, "global_step": 387295, "epoch": 4666} {"train_loss": -26.139209747314453, "global_step": 387296, "epoch": 4666} {"train_loss": -26.481115341186523, "global_step": 387297, "epoch": 4666} {"train_loss": -26.127649307250977, "global_step": 387298, "epoch": 4666} {"train_loss": -26.171106338500977, "global_step": 387299, "epoch": 4666} {"train_loss": -26.839513778686523, "global_step": 387300, "epoch": 4666} {"train_loss": -26.394723892211914, "global_step": 387301, "epoch": 4666} {"train_loss": -26.242944717407227, "global_step": 387302, "epoch": 4666} {"train_loss": -26.1444149017334, "global_step": 387303, "epoch": 4666} {"train_loss": -26.394287109375, "global_step": 387304, "epoch": 4666} {"train_loss": -26.182661056518555, "global_step": 387305, "epoch": 4666} {"train_loss": -26.737104415893555, "global_step": 387306, "epoch": 4666} {"train_loss": -26.2800350189209, "global_step": 387307, "epoch": 4666} {"train_loss": -26.54610252380371, "global_step": 387308, "epoch": 4666} {"train_loss": -26.534896850585938, "global_step": 387309, "epoch": 4666} {"train_loss": -26.519775390625, "global_step": 387310, "epoch": 4666} {"train_loss": -26.72040367126465, "global_step": 387311, "epoch": 4666} {"train_loss": -26.488065719604492, "global_step": 387312, "epoch": 4666} {"train_loss": -26.81989097595215, "global_step": 387313, "epoch": 4666} {"train_loss": -26.21270179748535, "global_step": 387314, "epoch": 4666} {"train_loss": -26.925214767456055, "global_step": 387315, "epoch": 4666} {"train_loss": -26.499120712280273, "global_step": 387316, "epoch": 4666} {"train_loss": -26.468976974487305, "global_step": 387317, "epoch": 4666} {"train_loss": -26.410043716430664, "global_step": 387318, "epoch": 4666} {"train_loss": -26.37605094909668, "global_step": 387319, "epoch": 4666} {"train_loss": -27.00949478149414, "global_step": 387320, "epoch": 4666} {"train_loss": -26.221954345703125, "global_step": 387321, "epoch": 4666} {"train_loss": -26.632192611694336, "global_step": 387322, "epoch": 4666} {"train_loss": -26.739273071289062, "global_step": 387323, "epoch": 4666} {"train_loss": -26.67764663696289, "global_step": 387324, "epoch": 4666} {"train_loss": -26.32271385192871, "global_step": 387325, "epoch": 4666} {"train_loss": -26.6340274810791, "global_step": 387326, "epoch": 4666} {"train_loss": -26.580957412719727, "global_step": 387327, "epoch": 4666} {"train_loss": -26.604724884033203, "global_step": 387328, "epoch": 4666} {"train_loss": -26.771728515625, "global_step": 387329, "epoch": 4666} {"train_loss": -26.640899658203125, "global_step": 387330, "epoch": 4666} {"train_loss": -26.11298179626465, "global_step": 387331, "epoch": 4666} {"train_loss": -26.246585845947266, "global_step": 387332, "epoch": 4666} {"train_loss": -26.22272300720215, "global_step": 387333, "epoch": 4666} {"train_loss": -26.029287338256836, "global_step": 387334, "epoch": 4666} {"train_loss": -26.150781631469727, "global_step": 387335, "epoch": 4666} {"train_loss": -26.3173828125, "global_step": 387336, "epoch": 4666} {"train_loss": -26.717334747314453, "global_step": 387337, "epoch": 4666} {"train_loss": -26.92207145690918, "global_step": 387338, "epoch": 4666} {"train_loss": -26.825897216796875, "global_step": 387339, "epoch": 4666} {"train_loss": -26.449085235595703, "global_step": 387340, "epoch": 4666} {"train_loss": -26.33060646057129, "global_step": 387341, "epoch": 4666} {"train_loss": -26.827783584594727, "global_step": 387342, "epoch": 4666} {"train_loss": -26.43194007873535, "global_step": 387343, "epoch": 4666} {"train_loss": -26.591796875, "global_step": 387344, "epoch": 4666} {"train_loss": -26.64967155456543, "global_step": 387345, "epoch": 4666} {"train_loss": -26.399499893188477, "global_step": 387346, "epoch": 4666} {"train_loss": -26.38694190979004, "global_step": 387347, "epoch": 4666} {"train_loss": -26.479278564453125, "global_step": 387348, "epoch": 4666} {"train_loss": -26.2171573638916, "global_step": 387349, "epoch": 4666} {"train_loss": -26.79890251159668, "global_step": 387350, "epoch": 4666} {"train_loss": -26.7987117767334, "global_step": 387351, "epoch": 4666} {"train_loss": -26.412994384765625, "global_step": 387352, "epoch": 4666} {"train_loss": -26.499597549438477, "global_step": 387353, "epoch": 4666} {"train_loss": -26.678192138671875, "global_step": 387354, "epoch": 4666} {"train_loss": -26.554508209228516, "global_step": 387355, "epoch": 4666} {"train_loss": -26.236804962158203, "global_step": 387356, "epoch": 4666} {"train_loss": -26.706134796142578, "global_step": 387357, "epoch": 4666} {"train_loss": -26.640859603881836, "global_step": 387358, "epoch": 4666} {"train_loss": -26.613473892211914, "global_step": 387359, "epoch": 4666} {"train_loss": -26.333501631955066, "global_step": 387360, "epoch": 4666, "val_loss": 6607243.0} {"train_loss": -25.8217716217041, "global_step": 387361, "epoch": 4667} {"train_loss": -25.20370864868164, "global_step": 387362, "epoch": 4667} {"train_loss": -25.218732833862305, "global_step": 387363, "epoch": 4667} {"train_loss": -25.248077392578125, "global_step": 387364, "epoch": 4667} {"train_loss": -25.562211990356445, "global_step": 387365, "epoch": 4667} {"train_loss": -26.21320152282715, "global_step": 387366, "epoch": 4667} {"train_loss": -26.190725326538086, "global_step": 387367, "epoch": 4667} {"train_loss": -25.976184844970703, "global_step": 387368, "epoch": 4667} {"train_loss": -25.51495933532715, "global_step": 387369, "epoch": 4667} {"train_loss": -26.563282012939453, "global_step": 387370, "epoch": 4667} {"train_loss": -25.804105758666992, "global_step": 387371, "epoch": 4667} {"train_loss": -26.523529052734375, "global_step": 387372, "epoch": 4667} {"train_loss": -25.840864181518555, "global_step": 387373, "epoch": 4667} {"train_loss": -26.126737594604492, "global_step": 387374, "epoch": 4667} {"train_loss": -26.045446395874023, "global_step": 387375, "epoch": 4667} {"train_loss": -25.957782745361328, "global_step": 387376, "epoch": 4667} {"train_loss": -26.317264556884766, "global_step": 387377, "epoch": 4667} {"train_loss": -26.118289947509766, "global_step": 387378, "epoch": 4667} {"train_loss": -25.972198486328125, "global_step": 387379, "epoch": 4667} {"train_loss": -26.098773956298828, "global_step": 387380, "epoch": 4667} {"train_loss": -26.084455490112305, "global_step": 387381, "epoch": 4667} {"train_loss": -26.33546257019043, "global_step": 387382, "epoch": 4667} {"train_loss": -26.021291732788086, "global_step": 387383, "epoch": 4667} {"train_loss": -26.242216110229492, "global_step": 387384, "epoch": 4667} {"train_loss": -26.35495948791504, "global_step": 387385, "epoch": 4667} {"train_loss": -26.271268844604492, "global_step": 387386, "epoch": 4667} {"train_loss": -26.154760360717773, "global_step": 387387, "epoch": 4667} {"train_loss": -26.569486618041992, "global_step": 387388, "epoch": 4667} {"train_loss": -26.434621810913086, "global_step": 387389, "epoch": 4667} {"train_loss": -26.415573120117188, "global_step": 387390, "epoch": 4667} {"train_loss": -26.386432647705078, "global_step": 387391, "epoch": 4667} {"train_loss": -26.565271377563477, "global_step": 387392, "epoch": 4667} {"train_loss": -26.533056259155273, "global_step": 387393, "epoch": 4667} {"train_loss": -26.446928024291992, "global_step": 387394, "epoch": 4667} {"train_loss": -26.24881362915039, "global_step": 387395, "epoch": 4667} {"train_loss": -26.54534339904785, "global_step": 387396, "epoch": 4667} {"train_loss": -26.333560943603516, "global_step": 387397, "epoch": 4667} {"train_loss": -26.56453514099121, "global_step": 387398, "epoch": 4667} {"train_loss": -26.42632484436035, "global_step": 387399, "epoch": 4667} {"train_loss": -26.626544952392578, "global_step": 387400, "epoch": 4667} {"train_loss": -26.615713119506836, "global_step": 387401, "epoch": 4667} {"train_loss": -26.447174072265625, "global_step": 387402, "epoch": 4667} {"train_loss": -26.62355613708496, "global_step": 387403, "epoch": 4667} {"train_loss": -26.386554718017578, "global_step": 387404, "epoch": 4667} {"train_loss": -26.930805206298828, "global_step": 387405, "epoch": 4667} {"train_loss": -26.454843521118164, "global_step": 387406, "epoch": 4667} {"train_loss": -26.813770294189453, "global_step": 387407, "epoch": 4667} {"train_loss": -26.6531925201416, "global_step": 387408, "epoch": 4667} {"train_loss": -26.818256378173828, "global_step": 387409, "epoch": 4667} {"train_loss": -26.46552085876465, "global_step": 387410, "epoch": 4667} {"train_loss": -26.744062423706055, "global_step": 387411, "epoch": 4667} {"train_loss": -26.39231300354004, "global_step": 387412, "epoch": 4667} {"train_loss": -26.767919540405273, "global_step": 387413, "epoch": 4667} {"train_loss": -26.31906509399414, "global_step": 387414, "epoch": 4667} {"train_loss": -26.784406661987305, "global_step": 387415, "epoch": 4667} {"train_loss": -26.676488876342773, "global_step": 387416, "epoch": 4667} {"train_loss": -26.225996017456055, "global_step": 387417, "epoch": 4667} {"train_loss": -26.717519760131836, "global_step": 387418, "epoch": 4667} {"train_loss": -25.979185104370117, "global_step": 387419, "epoch": 4667} {"train_loss": -26.02772331237793, "global_step": 387420, "epoch": 4667} {"train_loss": -26.595596313476562, "global_step": 387421, "epoch": 4667} {"train_loss": -26.46466064453125, "global_step": 387422, "epoch": 4667} {"train_loss": -26.235891342163086, "global_step": 387423, "epoch": 4667} {"train_loss": -25.295209884643555, "global_step": 387424, "epoch": 4667} {"train_loss": -25.71150016784668, "global_step": 387425, "epoch": 4667} {"train_loss": -26.255767822265625, "global_step": 387426, "epoch": 4667} {"train_loss": -26.355331420898438, "global_step": 387427, "epoch": 4667} {"train_loss": -25.836780548095703, "global_step": 387428, "epoch": 4667} {"train_loss": -26.21363639831543, "global_step": 387429, "epoch": 4667} {"train_loss": -26.328771591186523, "global_step": 387430, "epoch": 4667} {"train_loss": -26.02097511291504, "global_step": 387431, "epoch": 4667} {"train_loss": -25.98243522644043, "global_step": 387432, "epoch": 4667} {"train_loss": -26.6212100982666, "global_step": 387433, "epoch": 4667} {"train_loss": -26.554086685180664, "global_step": 387434, "epoch": 4667} {"train_loss": -26.104923248291016, "global_step": 387435, "epoch": 4667} {"train_loss": -26.309778213500977, "global_step": 387436, "epoch": 4667} {"train_loss": -26.397022247314453, "global_step": 387437, "epoch": 4667} {"train_loss": -26.62298011779785, "global_step": 387438, "epoch": 4667} {"train_loss": -26.508939743041992, "global_step": 387439, "epoch": 4667} {"train_loss": -26.549062728881836, "global_step": 387440, "epoch": 4667} {"train_loss": -26.63836097717285, "global_step": 387441, "epoch": 4667} {"train_loss": -26.522785186767578, "global_step": 387442, "epoch": 4667} {"train_loss": -26.281334681683276, "global_step": 387443, "epoch": 4667, "val_loss": 6591374.0} {"train_loss": -25.941165924072266, "global_step": 387444, "epoch": 4668} {"train_loss": -26.17768669128418, "global_step": 387445, "epoch": 4668} {"train_loss": -26.33794593811035, "global_step": 387446, "epoch": 4668} {"train_loss": -25.989057540893555, "global_step": 387447, "epoch": 4668} {"train_loss": -26.50857925415039, "global_step": 387448, "epoch": 4668} {"train_loss": -26.197248458862305, "global_step": 387449, "epoch": 4668} {"train_loss": -26.549962997436523, "global_step": 387450, "epoch": 4668} {"train_loss": -26.383337020874023, "global_step": 387451, "epoch": 4668} {"train_loss": -26.121368408203125, "global_step": 387452, "epoch": 4668} {"train_loss": -26.564697265625, "global_step": 387453, "epoch": 4668} {"train_loss": -26.374799728393555, "global_step": 387454, "epoch": 4668} {"train_loss": -26.61382484436035, "global_step": 387455, "epoch": 4668} {"train_loss": -26.87286949157715, "global_step": 387456, "epoch": 4668} {"train_loss": -26.15869140625, "global_step": 387457, "epoch": 4668} {"train_loss": -26.41813087463379, "global_step": 387458, "epoch": 4668} {"train_loss": -26.579923629760742, "global_step": 387459, "epoch": 4668} {"train_loss": -26.149755477905273, "global_step": 387460, "epoch": 4668} {"train_loss": -26.57520866394043, "global_step": 387461, "epoch": 4668} {"train_loss": -26.191450119018555, "global_step": 387462, "epoch": 4668} {"train_loss": -26.435504913330078, "global_step": 387463, "epoch": 4668} {"train_loss": -26.6793155670166, "global_step": 387464, "epoch": 4668} {"train_loss": -26.85407066345215, "global_step": 387465, "epoch": 4668} {"train_loss": -26.393552780151367, "global_step": 387466, "epoch": 4668} {"train_loss": -26.22517204284668, "global_step": 387467, "epoch": 4668} {"train_loss": -26.29935073852539, "global_step": 387468, "epoch": 4668} {"train_loss": -26.6717529296875, "global_step": 387469, "epoch": 4668} {"train_loss": -26.40252113342285, "global_step": 387470, "epoch": 4668} {"train_loss": -26.689960479736328, "global_step": 387471, "epoch": 4668} {"train_loss": -26.7027645111084, "global_step": 387472, "epoch": 4668} {"train_loss": -26.287158966064453, "global_step": 387473, "epoch": 4668} {"train_loss": -26.611846923828125, "global_step": 387474, "epoch": 4668} {"train_loss": -26.218250274658203, "global_step": 387475, "epoch": 4668} {"train_loss": -26.458093643188477, "global_step": 387476, "epoch": 4668} {"train_loss": -26.529983520507812, "global_step": 387477, "epoch": 4668} {"train_loss": -26.425155639648438, "global_step": 387478, "epoch": 4668} {"train_loss": -26.21851921081543, "global_step": 387479, "epoch": 4668} {"train_loss": -26.576154708862305, "global_step": 387480, "epoch": 4668} {"train_loss": -26.918310165405273, "global_step": 387481, "epoch": 4668} {"train_loss": -26.47580337524414, "global_step": 387482, "epoch": 4668} {"train_loss": -26.865543365478516, "global_step": 387483, "epoch": 4668} {"train_loss": -26.459136962890625, "global_step": 387484, "epoch": 4668} {"train_loss": -26.27897071838379, "global_step": 387485, "epoch": 4668} {"train_loss": -26.98785400390625, "global_step": 387486, "epoch": 4668} {"train_loss": -26.867578506469727, "global_step": 387487, "epoch": 4668} {"train_loss": -26.634601593017578, "global_step": 387488, "epoch": 4668} {"train_loss": -26.732162475585938, "global_step": 387489, "epoch": 4668} {"train_loss": -26.304285049438477, "global_step": 387490, "epoch": 4668} {"train_loss": -26.295928955078125, "global_step": 387491, "epoch": 4668} {"train_loss": -26.3618221282959, "global_step": 387492, "epoch": 4668} {"train_loss": -26.372995376586914, "global_step": 387493, "epoch": 4668} {"train_loss": -26.413888931274414, "global_step": 387494, "epoch": 4668} {"train_loss": -26.395811080932617, "global_step": 387495, "epoch": 4668} {"train_loss": -26.4178409576416, "global_step": 387496, "epoch": 4668} {"train_loss": -26.077014923095703, "global_step": 387497, "epoch": 4668} {"train_loss": -26.637624740600586, "global_step": 387498, "epoch": 4668} {"train_loss": -26.533552169799805, "global_step": 387499, "epoch": 4668} {"train_loss": -26.52520179748535, "global_step": 387500, "epoch": 4668} {"train_loss": -26.11690330505371, "global_step": 387501, "epoch": 4668} {"train_loss": -26.685956954956055, "global_step": 387502, "epoch": 4668} {"train_loss": -27.13917350769043, "global_step": 387503, "epoch": 4668} {"train_loss": -26.598224639892578, "global_step": 387504, "epoch": 4668} {"train_loss": -26.710479736328125, "global_step": 387505, "epoch": 4668} {"train_loss": -26.24153709411621, "global_step": 387506, "epoch": 4668} {"train_loss": -26.7957763671875, "global_step": 387507, "epoch": 4668} {"train_loss": -26.27399253845215, "global_step": 387508, "epoch": 4668} {"train_loss": -26.672163009643555, "global_step": 387509, "epoch": 4668} {"train_loss": -26.515899658203125, "global_step": 387510, "epoch": 4668} {"train_loss": -26.843597412109375, "global_step": 387511, "epoch": 4668} {"train_loss": -26.54866600036621, "global_step": 387512, "epoch": 4668} {"train_loss": -26.1925106048584, "global_step": 387513, "epoch": 4668} {"train_loss": -26.65704917907715, "global_step": 387514, "epoch": 4668} {"train_loss": -26.365554809570312, "global_step": 387515, "epoch": 4668} {"train_loss": -27.033926010131836, "global_step": 387516, "epoch": 4668} {"train_loss": -27.0252685546875, "global_step": 387517, "epoch": 4668} {"train_loss": -26.250839233398438, "global_step": 387518, "epoch": 4668} {"train_loss": -26.633249282836914, "global_step": 387519, "epoch": 4668} {"train_loss": -26.6038818359375, "global_step": 387520, "epoch": 4668} {"train_loss": -26.83707046508789, "global_step": 387521, "epoch": 4668} {"train_loss": -26.27467155456543, "global_step": 387522, "epoch": 4668} {"train_loss": -26.576313018798828, "global_step": 387523, "epoch": 4668} {"train_loss": -26.507177352905273, "global_step": 387524, "epoch": 4668} {"train_loss": -26.245344161987305, "global_step": 387525, "epoch": 4668} {"train_loss": -26.50143526835614, "global_step": 387526, "epoch": 4668, "val_loss": 6629898.0} {"train_loss": -26.151844024658203, "global_step": 387527, "epoch": 4669} {"train_loss": -25.71213150024414, "global_step": 387528, "epoch": 4669} {"train_loss": -26.1324405670166, "global_step": 387529, "epoch": 4669} {"train_loss": -25.565946578979492, "global_step": 387530, "epoch": 4669} {"train_loss": -26.450119018554688, "global_step": 387531, "epoch": 4669} {"train_loss": -25.988454818725586, "global_step": 387532, "epoch": 4669} {"train_loss": -26.147846221923828, "global_step": 387533, "epoch": 4669} {"train_loss": -26.398420333862305, "global_step": 387534, "epoch": 4669} {"train_loss": -25.894912719726562, "global_step": 387535, "epoch": 4669} {"train_loss": -25.870725631713867, "global_step": 387536, "epoch": 4669} {"train_loss": -26.12196922302246, "global_step": 387537, "epoch": 4669} {"train_loss": -25.629602432250977, "global_step": 387538, "epoch": 4669} {"train_loss": -26.2828426361084, "global_step": 387539, "epoch": 4669} {"train_loss": -26.051025390625, "global_step": 387540, "epoch": 4669} {"train_loss": -26.149137496948242, "global_step": 387541, "epoch": 4669} {"train_loss": -26.544879913330078, "global_step": 387542, "epoch": 4669} {"train_loss": -26.403003692626953, "global_step": 387543, "epoch": 4669} {"train_loss": -26.44174575805664, "global_step": 387544, "epoch": 4669} {"train_loss": -26.600194931030273, "global_step": 387545, "epoch": 4669} {"train_loss": -26.645339965820312, "global_step": 387546, "epoch": 4669} {"train_loss": -26.26144790649414, "global_step": 387547, "epoch": 4669} {"train_loss": -26.388891220092773, "global_step": 387548, "epoch": 4669} {"train_loss": -26.229812622070312, "global_step": 387549, "epoch": 4669} {"train_loss": -26.313098907470703, "global_step": 387550, "epoch": 4669} {"train_loss": -26.280561447143555, "global_step": 387551, "epoch": 4669} {"train_loss": -26.242883682250977, "global_step": 387552, "epoch": 4669} {"train_loss": -26.27589988708496, "global_step": 387553, "epoch": 4669} {"train_loss": -26.122730255126953, "global_step": 387554, "epoch": 4669} {"train_loss": -26.463708877563477, "global_step": 387555, "epoch": 4669} {"train_loss": -26.440759658813477, "global_step": 387556, "epoch": 4669} {"train_loss": -26.446802139282227, "global_step": 387557, "epoch": 4669} {"train_loss": -26.422719955444336, "global_step": 387558, "epoch": 4669} {"train_loss": -26.526975631713867, "global_step": 387559, "epoch": 4669} {"train_loss": -26.526142120361328, "global_step": 387560, "epoch": 4669} {"train_loss": -26.683979034423828, "global_step": 387561, "epoch": 4669} {"train_loss": -26.621992111206055, "global_step": 387562, "epoch": 4669} {"train_loss": -26.4322509765625, "global_step": 387563, "epoch": 4669} {"train_loss": -26.7285099029541, "global_step": 387564, "epoch": 4669} {"train_loss": -26.391040802001953, "global_step": 387565, "epoch": 4669} {"train_loss": -26.26787757873535, "global_step": 387566, "epoch": 4669} {"train_loss": -26.280324935913086, "global_step": 387567, "epoch": 4669} {"train_loss": -26.156356811523438, "global_step": 387568, "epoch": 4669} {"train_loss": -26.659021377563477, "global_step": 387569, "epoch": 4669} {"train_loss": -26.551233291625977, "global_step": 387570, "epoch": 4669} {"train_loss": -26.443265914916992, "global_step": 387571, "epoch": 4669} {"train_loss": -26.750019073486328, "global_step": 387572, "epoch": 4669} {"train_loss": -26.715810775756836, "global_step": 387573, "epoch": 4669} {"train_loss": -26.63433265686035, "global_step": 387574, "epoch": 4669} {"train_loss": -26.700658798217773, "global_step": 387575, "epoch": 4669} {"train_loss": -26.7037353515625, "global_step": 387576, "epoch": 4669} {"train_loss": -26.43100357055664, "global_step": 387577, "epoch": 4669} {"train_loss": -26.3302001953125, "global_step": 387578, "epoch": 4669} {"train_loss": -26.873794555664062, "global_step": 387579, "epoch": 4669} {"train_loss": -26.44722557067871, "global_step": 387580, "epoch": 4669} {"train_loss": -26.438573837280273, "global_step": 387581, "epoch": 4669} {"train_loss": -26.932294845581055, "global_step": 387582, "epoch": 4669} {"train_loss": -26.65791130065918, "global_step": 387583, "epoch": 4669} {"train_loss": -26.73196792602539, "global_step": 387584, "epoch": 4669} {"train_loss": -27.050537109375, "global_step": 387585, "epoch": 4669} {"train_loss": -26.957534790039062, "global_step": 387586, "epoch": 4669} {"train_loss": -26.771228790283203, "global_step": 387587, "epoch": 4669} {"train_loss": -26.354581832885742, "global_step": 387588, "epoch": 4669} {"train_loss": -26.790143966674805, "global_step": 387589, "epoch": 4669} {"train_loss": -26.612518310546875, "global_step": 387590, "epoch": 4669} {"train_loss": -26.603525161743164, "global_step": 387591, "epoch": 4669} {"train_loss": -26.544050216674805, "global_step": 387592, "epoch": 4669} {"train_loss": -26.02130699157715, "global_step": 387593, "epoch": 4669} {"train_loss": -26.771976470947266, "global_step": 387594, "epoch": 4669} {"train_loss": -26.81501579284668, "global_step": 387595, "epoch": 4669} {"train_loss": -26.468664169311523, "global_step": 387596, "epoch": 4669} {"train_loss": -26.164752960205078, "global_step": 387597, "epoch": 4669} {"train_loss": -26.253875732421875, "global_step": 387598, "epoch": 4669} {"train_loss": -26.070554733276367, "global_step": 387599, "epoch": 4669} {"train_loss": -25.43465232849121, "global_step": 387600, "epoch": 4669} {"train_loss": -25.308809280395508, "global_step": 387601, "epoch": 4669} {"train_loss": -25.93037223815918, "global_step": 387602, "epoch": 4669} {"train_loss": -26.4514217376709, "global_step": 387603, "epoch": 4669} {"train_loss": -26.291370391845703, "global_step": 387604, "epoch": 4669} {"train_loss": -25.812536239624023, "global_step": 387605, "epoch": 4669} {"train_loss": -26.2380428314209, "global_step": 387606, "epoch": 4669} {"train_loss": -25.638059616088867, "global_step": 387607, "epoch": 4669} {"train_loss": -26.14605712890625, "global_step": 387608, "epoch": 4669} {"train_loss": -26.35419709998441, "global_step": 387609, "epoch": 4669, "val_loss": 6549226.0} {"train_loss": -24.90520668029785, "global_step": 387610, "epoch": 4670} {"train_loss": -26.023365020751953, "global_step": 387611, "epoch": 4670} {"train_loss": -25.528318405151367, "global_step": 387612, "epoch": 4670} {"train_loss": -25.470172882080078, "global_step": 387613, "epoch": 4670} {"train_loss": -25.50294303894043, "global_step": 387614, "epoch": 4670} {"train_loss": -25.59236717224121, "global_step": 387615, "epoch": 4670} {"train_loss": -26.260107040405273, "global_step": 387616, "epoch": 4670} {"train_loss": -26.250228881835938, "global_step": 387617, "epoch": 4670} {"train_loss": -25.69972038269043, "global_step": 387618, "epoch": 4670} {"train_loss": -26.230712890625, "global_step": 387619, "epoch": 4670} {"train_loss": -26.07501220703125, "global_step": 387620, "epoch": 4670} {"train_loss": -26.065292358398438, "global_step": 387621, "epoch": 4670} {"train_loss": -26.136716842651367, "global_step": 387622, "epoch": 4670} {"train_loss": -26.164154052734375, "global_step": 387623, "epoch": 4670} {"train_loss": -25.918806076049805, "global_step": 387624, "epoch": 4670} {"train_loss": -26.35373878479004, "global_step": 387625, "epoch": 4670} {"train_loss": -26.06959342956543, "global_step": 387626, "epoch": 4670} {"train_loss": -26.0937442779541, "global_step": 387627, "epoch": 4670} {"train_loss": -25.952228546142578, "global_step": 387628, "epoch": 4670} {"train_loss": -26.338699340820312, "global_step": 387629, "epoch": 4670} {"train_loss": -26.319894790649414, "global_step": 387630, "epoch": 4670} {"train_loss": -26.457029342651367, "global_step": 387631, "epoch": 4670} {"train_loss": -26.18157386779785, "global_step": 387632, "epoch": 4670} {"train_loss": -26.792572021484375, "global_step": 387633, "epoch": 4670} {"train_loss": -26.519611358642578, "global_step": 387634, "epoch": 4670} {"train_loss": -26.061920166015625, "global_step": 387635, "epoch": 4670} {"train_loss": -26.253570556640625, "global_step": 387636, "epoch": 4670} {"train_loss": -26.716522216796875, "global_step": 387637, "epoch": 4670} {"train_loss": -26.425031661987305, "global_step": 387638, "epoch": 4670} {"train_loss": -26.451801300048828, "global_step": 387639, "epoch": 4670} {"train_loss": -26.549367904663086, "global_step": 387640, "epoch": 4670} {"train_loss": -26.846948623657227, "global_step": 387641, "epoch": 4670} {"train_loss": -26.741132736206055, "global_step": 387642, "epoch": 4670} {"train_loss": -26.79465675354004, "global_step": 387643, "epoch": 4670} {"train_loss": -26.93893814086914, "global_step": 387644, "epoch": 4670} {"train_loss": -26.61958885192871, "global_step": 387645, "epoch": 4670} {"train_loss": -26.580060958862305, "global_step": 387646, "epoch": 4670} {"train_loss": -26.585113525390625, "global_step": 387647, "epoch": 4670} {"train_loss": -26.785507202148438, "global_step": 387648, "epoch": 4670} {"train_loss": -26.833282470703125, "global_step": 387649, "epoch": 4670} {"train_loss": -26.491424560546875, "global_step": 387650, "epoch": 4670} {"train_loss": -26.686798095703125, "global_step": 387651, "epoch": 4670} {"train_loss": -26.5891170501709, "global_step": 387652, "epoch": 4670} {"train_loss": -26.781991958618164, "global_step": 387653, "epoch": 4670} {"train_loss": -26.657251358032227, "global_step": 387654, "epoch": 4670} {"train_loss": -26.867441177368164, "global_step": 387655, "epoch": 4670} {"train_loss": -26.819339752197266, "global_step": 387656, "epoch": 4670} {"train_loss": -26.5030460357666, "global_step": 387657, "epoch": 4670} {"train_loss": -27.017919540405273, "global_step": 387658, "epoch": 4670} {"train_loss": -26.289508819580078, "global_step": 387659, "epoch": 4670} {"train_loss": -26.718326568603516, "global_step": 387660, "epoch": 4670} {"train_loss": -26.372589111328125, "global_step": 387661, "epoch": 4670} {"train_loss": -26.2987003326416, "global_step": 387662, "epoch": 4670} {"train_loss": -26.543567657470703, "global_step": 387663, "epoch": 4670} {"train_loss": -26.134923934936523, "global_step": 387664, "epoch": 4670} {"train_loss": -25.56807518005371, "global_step": 387665, "epoch": 4670} {"train_loss": -25.708118438720703, "global_step": 387666, "epoch": 4670} {"train_loss": -25.35652732849121, "global_step": 387667, "epoch": 4670} {"train_loss": -26.287683486938477, "global_step": 387668, "epoch": 4670} {"train_loss": -26.395978927612305, "global_step": 387669, "epoch": 4670} {"train_loss": -26.154407501220703, "global_step": 387670, "epoch": 4670} {"train_loss": -26.942895889282227, "global_step": 387671, "epoch": 4670} {"train_loss": -26.14279556274414, "global_step": 387672, "epoch": 4670} {"train_loss": -26.109806060791016, "global_step": 387673, "epoch": 4670} {"train_loss": -26.280912399291992, "global_step": 387674, "epoch": 4670} {"train_loss": -26.589582443237305, "global_step": 387675, "epoch": 4670} {"train_loss": -26.726171493530273, "global_step": 387676, "epoch": 4670} {"train_loss": -26.395544052124023, "global_step": 387677, "epoch": 4670} {"train_loss": -26.6190128326416, "global_step": 387678, "epoch": 4670} {"train_loss": -26.189050674438477, "global_step": 387679, "epoch": 4670} {"train_loss": -26.680713653564453, "global_step": 387680, "epoch": 4670} {"train_loss": -26.2425537109375, "global_step": 387681, "epoch": 4670} {"train_loss": -26.78192710876465, "global_step": 387682, "epoch": 4670} {"train_loss": -26.050949096679688, "global_step": 387683, "epoch": 4670} {"train_loss": -26.727554321289062, "global_step": 387684, "epoch": 4670} {"train_loss": -26.598907470703125, "global_step": 387685, "epoch": 4670} {"train_loss": -26.440107345581055, "global_step": 387686, "epoch": 4670} {"train_loss": -26.612577438354492, "global_step": 387687, "epoch": 4670} {"train_loss": -26.141494750976562, "global_step": 387688, "epoch": 4670} {"train_loss": -26.100080490112305, "global_step": 387689, "epoch": 4670} {"train_loss": -26.45350456237793, "global_step": 387690, "epoch": 4670} {"train_loss": -26.759674072265625, "global_step": 387691, "epoch": 4670} {"train_loss": -26.32927538400673, "global_step": 387692, "epoch": 4670, "val_loss": 6560063.5} {"train_loss": -26.462909698486328, "global_step": 387693, "epoch": 4671} {"train_loss": -26.193323135375977, "global_step": 387694, "epoch": 4671} {"train_loss": -26.4244384765625, "global_step": 387695, "epoch": 4671} {"train_loss": -26.018512725830078, "global_step": 387696, "epoch": 4671} {"train_loss": -26.546722412109375, "global_step": 387697, "epoch": 4671} {"train_loss": -26.62447166442871, "global_step": 387698, "epoch": 4671} {"train_loss": -26.679296493530273, "global_step": 387699, "epoch": 4671} {"train_loss": -26.71124839782715, "global_step": 387700, "epoch": 4671} {"train_loss": -26.195920944213867, "global_step": 387701, "epoch": 4671} {"train_loss": -26.375324249267578, "global_step": 387702, "epoch": 4671} {"train_loss": -26.103118896484375, "global_step": 387703, "epoch": 4671} {"train_loss": -26.424823760986328, "global_step": 387704, "epoch": 4671} {"train_loss": -26.081518173217773, "global_step": 387705, "epoch": 4671} {"train_loss": -26.40296745300293, "global_step": 387706, "epoch": 4671} {"train_loss": -26.786727905273438, "global_step": 387707, "epoch": 4671} {"train_loss": -26.38507080078125, "global_step": 387708, "epoch": 4671} {"train_loss": -26.488971710205078, "global_step": 387709, "epoch": 4671} {"train_loss": -26.55231285095215, "global_step": 387710, "epoch": 4671} {"train_loss": -26.714826583862305, "global_step": 387711, "epoch": 4671} {"train_loss": -26.78204917907715, "global_step": 387712, "epoch": 4671} {"train_loss": -26.57735252380371, "global_step": 387713, "epoch": 4671} {"train_loss": -26.7286319732666, "global_step": 387714, "epoch": 4671} {"train_loss": -26.35930824279785, "global_step": 387715, "epoch": 4671} {"train_loss": -26.303075790405273, "global_step": 387716, "epoch": 4671} {"train_loss": -26.76504898071289, "global_step": 387717, "epoch": 4671} {"train_loss": -26.7108097076416, "global_step": 387718, "epoch": 4671} {"train_loss": -26.886505126953125, "global_step": 387719, "epoch": 4671} {"train_loss": -26.737409591674805, "global_step": 387720, "epoch": 4671} {"train_loss": -26.45806884765625, "global_step": 387721, "epoch": 4671} {"train_loss": -26.355880737304688, "global_step": 387722, "epoch": 4671} {"train_loss": -26.5775146484375, "global_step": 387723, "epoch": 4671} {"train_loss": -26.969762802124023, "global_step": 387724, "epoch": 4671} {"train_loss": -26.446313858032227, "global_step": 387725, "epoch": 4671} {"train_loss": -26.546875, "global_step": 387726, "epoch": 4671} {"train_loss": -26.725507736206055, "global_step": 387727, "epoch": 4671} {"train_loss": -26.510351181030273, "global_step": 387728, "epoch": 4671} {"train_loss": -26.767892837524414, "global_step": 387729, "epoch": 4671} {"train_loss": -26.490234375, "global_step": 387730, "epoch": 4671} {"train_loss": -26.75504493713379, "global_step": 387731, "epoch": 4671} {"train_loss": -25.942590713500977, "global_step": 387732, "epoch": 4671} {"train_loss": -26.76030921936035, "global_step": 387733, "epoch": 4671} {"train_loss": -26.804410934448242, "global_step": 387734, "epoch": 4671} {"train_loss": -26.633438110351562, "global_step": 387735, "epoch": 4671} {"train_loss": -26.82765007019043, "global_step": 387736, "epoch": 4671} {"train_loss": -26.360187530517578, "global_step": 387737, "epoch": 4671} {"train_loss": -26.72358512878418, "global_step": 387738, "epoch": 4671} {"train_loss": -26.557571411132812, "global_step": 387739, "epoch": 4671} {"train_loss": -26.613073348999023, "global_step": 387740, "epoch": 4671} {"train_loss": -26.210290908813477, "global_step": 387741, "epoch": 4671} {"train_loss": -26.28202247619629, "global_step": 387742, "epoch": 4671} {"train_loss": -26.26908302307129, "global_step": 387743, "epoch": 4671} {"train_loss": -26.216571807861328, "global_step": 387744, "epoch": 4671} {"train_loss": -26.804960250854492, "global_step": 387745, "epoch": 4671} {"train_loss": -26.454166412353516, "global_step": 387746, "epoch": 4671} {"train_loss": -26.471927642822266, "global_step": 387747, "epoch": 4671} {"train_loss": -26.06666374206543, "global_step": 387748, "epoch": 4671} {"train_loss": -26.129606246948242, "global_step": 387749, "epoch": 4671} {"train_loss": -25.97348403930664, "global_step": 387750, "epoch": 4671} {"train_loss": -26.417993545532227, "global_step": 387751, "epoch": 4671} {"train_loss": -26.644367218017578, "global_step": 387752, "epoch": 4671} {"train_loss": -26.706436157226562, "global_step": 387753, "epoch": 4671} {"train_loss": -26.518604278564453, "global_step": 387754, "epoch": 4671} {"train_loss": -26.73296546936035, "global_step": 387755, "epoch": 4671} {"train_loss": -26.70688247680664, "global_step": 387756, "epoch": 4671} {"train_loss": -26.315967559814453, "global_step": 387757, "epoch": 4671} {"train_loss": -26.58782958984375, "global_step": 387758, "epoch": 4671} {"train_loss": -26.68631935119629, "global_step": 387759, "epoch": 4671} {"train_loss": -26.4482421875, "global_step": 387760, "epoch": 4671} {"train_loss": -26.8525333404541, "global_step": 387761, "epoch": 4671} {"train_loss": -26.737567901611328, "global_step": 387762, "epoch": 4671} {"train_loss": -26.873945236206055, "global_step": 387763, "epoch": 4671} {"train_loss": -26.61594009399414, "global_step": 387764, "epoch": 4671} {"train_loss": -26.806528091430664, "global_step": 387765, "epoch": 4671} {"train_loss": -26.428075790405273, "global_step": 387766, "epoch": 4671} {"train_loss": -26.47296714782715, "global_step": 387767, "epoch": 4671} {"train_loss": -26.7331600189209, "global_step": 387768, "epoch": 4671} {"train_loss": -26.306903839111328, "global_step": 387769, "epoch": 4671} {"train_loss": -26.278425216674805, "global_step": 387770, "epoch": 4671} {"train_loss": -26.43665885925293, "global_step": 387771, "epoch": 4671} {"train_loss": -26.56971549987793, "global_step": 387772, "epoch": 4671} {"train_loss": -26.794830322265625, "global_step": 387773, "epoch": 4671} {"train_loss": -26.801319122314453, "global_step": 387774, "epoch": 4671} {"train_loss": -26.52391339497394, "global_step": 387775, "epoch": 4671, "val_loss": 6554739.5} {"train_loss": -25.951934814453125, "global_step": 387776, "epoch": 4672} {"train_loss": -25.9103946685791, "global_step": 387777, "epoch": 4672} {"train_loss": -26.221160888671875, "global_step": 387778, "epoch": 4672} {"train_loss": -25.976606369018555, "global_step": 387779, "epoch": 4672} {"train_loss": -25.8181095123291, "global_step": 387780, "epoch": 4672} {"train_loss": -26.267480850219727, "global_step": 387781, "epoch": 4672} {"train_loss": -25.35223388671875, "global_step": 387782, "epoch": 4672} {"train_loss": -26.114538192749023, "global_step": 387783, "epoch": 4672} {"train_loss": -27.0128231048584, "global_step": 387784, "epoch": 4672} {"train_loss": -25.644275665283203, "global_step": 387785, "epoch": 4672} {"train_loss": -26.226240158081055, "global_step": 387786, "epoch": 4672} {"train_loss": -25.597604751586914, "global_step": 387787, "epoch": 4672} {"train_loss": -26.124425888061523, "global_step": 387788, "epoch": 4672} {"train_loss": -26.0350341796875, "global_step": 387789, "epoch": 4672} {"train_loss": -26.53619384765625, "global_step": 387790, "epoch": 4672} {"train_loss": -25.70792007446289, "global_step": 387791, "epoch": 4672} {"train_loss": -26.087732315063477, "global_step": 387792, "epoch": 4672} {"train_loss": -26.096298217773438, "global_step": 387793, "epoch": 4672} {"train_loss": -26.26742935180664, "global_step": 387794, "epoch": 4672} {"train_loss": -25.95379066467285, "global_step": 387795, "epoch": 4672} {"train_loss": -26.163501739501953, "global_step": 387796, "epoch": 4672} {"train_loss": -26.564023971557617, "global_step": 387797, "epoch": 4672} {"train_loss": -26.367267608642578, "global_step": 387798, "epoch": 4672} {"train_loss": -26.38999366760254, "global_step": 387799, "epoch": 4672} {"train_loss": -26.054174423217773, "global_step": 387800, "epoch": 4672} {"train_loss": -26.480854034423828, "global_step": 387801, "epoch": 4672} {"train_loss": -26.433881759643555, "global_step": 387802, "epoch": 4672} {"train_loss": -26.196542739868164, "global_step": 387803, "epoch": 4672} {"train_loss": -26.6298885345459, "global_step": 387804, "epoch": 4672} {"train_loss": -26.446136474609375, "global_step": 387805, "epoch": 4672} {"train_loss": -26.417510986328125, "global_step": 387806, "epoch": 4672} {"train_loss": -26.2340030670166, "global_step": 387807, "epoch": 4672} {"train_loss": -26.06941032409668, "global_step": 387808, "epoch": 4672} {"train_loss": -26.416996002197266, "global_step": 387809, "epoch": 4672} {"train_loss": -26.257490158081055, "global_step": 387810, "epoch": 4672} {"train_loss": -26.522357940673828, "global_step": 387811, "epoch": 4672} {"train_loss": -26.413366317749023, "global_step": 387812, "epoch": 4672} {"train_loss": -26.363195419311523, "global_step": 387813, "epoch": 4672} {"train_loss": -26.656930923461914, "global_step": 387814, "epoch": 4672} {"train_loss": -26.319360733032227, "global_step": 387815, "epoch": 4672} {"train_loss": -26.82618522644043, "global_step": 387816, "epoch": 4672} {"train_loss": -26.14914321899414, "global_step": 387817, "epoch": 4672} {"train_loss": -26.683521270751953, "global_step": 387818, "epoch": 4672} {"train_loss": -26.51826286315918, "global_step": 387819, "epoch": 4672} {"train_loss": -26.911895751953125, "global_step": 387820, "epoch": 4672} {"train_loss": -26.4356689453125, "global_step": 387821, "epoch": 4672} {"train_loss": -26.48369789123535, "global_step": 387822, "epoch": 4672} {"train_loss": -26.18949317932129, "global_step": 387823, "epoch": 4672} {"train_loss": -26.285741806030273, "global_step": 387824, "epoch": 4672} {"train_loss": -26.576475143432617, "global_step": 387825, "epoch": 4672} {"train_loss": -26.414453506469727, "global_step": 387826, "epoch": 4672} {"train_loss": -26.236364364624023, "global_step": 387827, "epoch": 4672} {"train_loss": -26.505207061767578, "global_step": 387828, "epoch": 4672} {"train_loss": -26.44898796081543, "global_step": 387829, "epoch": 4672} {"train_loss": -26.117279052734375, "global_step": 387830, "epoch": 4672} {"train_loss": -26.735727310180664, "global_step": 387831, "epoch": 4672} {"train_loss": -26.347869873046875, "global_step": 387832, "epoch": 4672} {"train_loss": -26.604230880737305, "global_step": 387833, "epoch": 4672} {"train_loss": -26.954593658447266, "global_step": 387834, "epoch": 4672} {"train_loss": -26.470258712768555, "global_step": 387835, "epoch": 4672} {"train_loss": -26.617956161499023, "global_step": 387836, "epoch": 4672} {"train_loss": -26.603717803955078, "global_step": 387837, "epoch": 4672} {"train_loss": -26.727508544921875, "global_step": 387838, "epoch": 4672} {"train_loss": -26.28046226501465, "global_step": 387839, "epoch": 4672} {"train_loss": -26.282392501831055, "global_step": 387840, "epoch": 4672} {"train_loss": -26.69114112854004, "global_step": 387841, "epoch": 4672} {"train_loss": -26.544342041015625, "global_step": 387842, "epoch": 4672} {"train_loss": -26.591962814331055, "global_step": 387843, "epoch": 4672} {"train_loss": -26.474014282226562, "global_step": 387844, "epoch": 4672} {"train_loss": -26.428058624267578, "global_step": 387845, "epoch": 4672} {"train_loss": -26.545612335205078, "global_step": 387846, "epoch": 4672} {"train_loss": -26.273710250854492, "global_step": 387847, "epoch": 4672} {"train_loss": -26.48788833618164, "global_step": 387848, "epoch": 4672} {"train_loss": -26.691801071166992, "global_step": 387849, "epoch": 4672} {"train_loss": -26.619665145874023, "global_step": 387850, "epoch": 4672} {"train_loss": -26.626779556274414, "global_step": 387851, "epoch": 4672} {"train_loss": -26.513477325439453, "global_step": 387852, "epoch": 4672} {"train_loss": -26.750986099243164, "global_step": 387853, "epoch": 4672} {"train_loss": -26.357797622680664, "global_step": 387854, "epoch": 4672} {"train_loss": -26.983259201049805, "global_step": 387855, "epoch": 4672} {"train_loss": -26.452884674072266, "global_step": 387856, "epoch": 4672} {"train_loss": -26.455657958984375, "global_step": 387857, "epoch": 4672} {"train_loss": -26.385067721447314, "global_step": 387858, "epoch": 4672, "val_loss": 6561769.0} {"train_loss": -25.92022132873535, "global_step": 387859, "epoch": 4673} {"train_loss": -26.239505767822266, "global_step": 387860, "epoch": 4673} {"train_loss": -25.781034469604492, "global_step": 387861, "epoch": 4673} {"train_loss": -25.66473960876465, "global_step": 387862, "epoch": 4673} {"train_loss": -25.886960983276367, "global_step": 387863, "epoch": 4673} {"train_loss": -25.883939743041992, "global_step": 387864, "epoch": 4673} {"train_loss": -25.51676368713379, "global_step": 387865, "epoch": 4673} {"train_loss": -26.14302635192871, "global_step": 387866, "epoch": 4673} {"train_loss": -25.70134925842285, "global_step": 387867, "epoch": 4673} {"train_loss": -25.959808349609375, "global_step": 387868, "epoch": 4673} {"train_loss": -25.60831069946289, "global_step": 387869, "epoch": 4673} {"train_loss": -25.98560905456543, "global_step": 387870, "epoch": 4673} {"train_loss": -25.86697769165039, "global_step": 387871, "epoch": 4673} {"train_loss": -26.408782958984375, "global_step": 387872, "epoch": 4673} {"train_loss": -26.304855346679688, "global_step": 387873, "epoch": 4673} {"train_loss": -26.48536491394043, "global_step": 387874, "epoch": 4673} {"train_loss": -26.064746856689453, "global_step": 387875, "epoch": 4673} {"train_loss": -26.016904830932617, "global_step": 387876, "epoch": 4673} {"train_loss": -26.29718589782715, "global_step": 387877, "epoch": 4673} {"train_loss": -26.31593132019043, "global_step": 387878, "epoch": 4673} {"train_loss": -26.80034828186035, "global_step": 387879, "epoch": 4673} {"train_loss": -26.26924705505371, "global_step": 387880, "epoch": 4673} {"train_loss": -26.1180477142334, "global_step": 387881, "epoch": 4673} {"train_loss": -26.830902099609375, "global_step": 387882, "epoch": 4673} {"train_loss": -26.5174617767334, "global_step": 387883, "epoch": 4673} {"train_loss": -25.922704696655273, "global_step": 387884, "epoch": 4673} {"train_loss": -26.17146110534668, "global_step": 387885, "epoch": 4673} {"train_loss": -26.219104766845703, "global_step": 387886, "epoch": 4673} {"train_loss": -26.494281768798828, "global_step": 387887, "epoch": 4673} {"train_loss": -26.425048828125, "global_step": 387888, "epoch": 4673} {"train_loss": -26.204572677612305, "global_step": 387889, "epoch": 4673} {"train_loss": -26.367385864257812, "global_step": 387890, "epoch": 4673} {"train_loss": -26.404586791992188, "global_step": 387891, "epoch": 4673} {"train_loss": -26.532556533813477, "global_step": 387892, "epoch": 4673} {"train_loss": -26.286670684814453, "global_step": 387893, "epoch": 4673} {"train_loss": -26.800683975219727, "global_step": 387894, "epoch": 4673} {"train_loss": -26.701282501220703, "global_step": 387895, "epoch": 4673} {"train_loss": -26.238317489624023, "global_step": 387896, "epoch": 4673} {"train_loss": -26.620752334594727, "global_step": 387897, "epoch": 4673} {"train_loss": -26.980451583862305, "global_step": 387898, "epoch": 4673} {"train_loss": -26.10346031188965, "global_step": 387899, "epoch": 4673} {"train_loss": -26.926868438720703, "global_step": 387900, "epoch": 4673} {"train_loss": -26.693008422851562, "global_step": 387901, "epoch": 4673} {"train_loss": -26.737775802612305, "global_step": 387902, "epoch": 4673} {"train_loss": -26.762027740478516, "global_step": 387903, "epoch": 4673} {"train_loss": -26.67441177368164, "global_step": 387904, "epoch": 4673} {"train_loss": -26.39373207092285, "global_step": 387905, "epoch": 4673} {"train_loss": -26.813390731811523, "global_step": 387906, "epoch": 4673} {"train_loss": -27.041990280151367, "global_step": 387907, "epoch": 4673} {"train_loss": -26.390567779541016, "global_step": 387908, "epoch": 4673} {"train_loss": -26.350088119506836, "global_step": 387909, "epoch": 4673} {"train_loss": -26.616443634033203, "global_step": 387910, "epoch": 4673} {"train_loss": -26.522449493408203, "global_step": 387911, "epoch": 4673} {"train_loss": -26.490034103393555, "global_step": 387912, "epoch": 4673} {"train_loss": -26.1271915435791, "global_step": 387913, "epoch": 4673} {"train_loss": -26.950712203979492, "global_step": 387914, "epoch": 4673} {"train_loss": -26.4708194732666, "global_step": 387915, "epoch": 4673} {"train_loss": -26.854084014892578, "global_step": 387916, "epoch": 4673} {"train_loss": -26.420988082885742, "global_step": 387917, "epoch": 4673} {"train_loss": -26.809934616088867, "global_step": 387918, "epoch": 4673} {"train_loss": -26.388071060180664, "global_step": 387919, "epoch": 4673} {"train_loss": -26.36957359313965, "global_step": 387920, "epoch": 4673} {"train_loss": -26.284042358398438, "global_step": 387921, "epoch": 4673} {"train_loss": -26.595169067382812, "global_step": 387922, "epoch": 4673} {"train_loss": -26.42376136779785, "global_step": 387923, "epoch": 4673} {"train_loss": -26.422101974487305, "global_step": 387924, "epoch": 4673} {"train_loss": -26.47201919555664, "global_step": 387925, "epoch": 4673} {"train_loss": -26.622175216674805, "global_step": 387926, "epoch": 4673} {"train_loss": -26.527379989624023, "global_step": 387927, "epoch": 4673} {"train_loss": -26.397388458251953, "global_step": 387928, "epoch": 4673} {"train_loss": -26.578649520874023, "global_step": 387929, "epoch": 4673} {"train_loss": -26.66983985900879, "global_step": 387930, "epoch": 4673} {"train_loss": -26.537282943725586, "global_step": 387931, "epoch": 4673} {"train_loss": -26.45777702331543, "global_step": 387932, "epoch": 4673} {"train_loss": -26.681440353393555, "global_step": 387933, "epoch": 4673} {"train_loss": -26.8019962310791, "global_step": 387934, "epoch": 4673} {"train_loss": -26.85459327697754, "global_step": 387935, "epoch": 4673} {"train_loss": -26.507909774780273, "global_step": 387936, "epoch": 4673} {"train_loss": -26.662464141845703, "global_step": 387937, "epoch": 4673} {"train_loss": -26.68617057800293, "global_step": 387938, "epoch": 4673} {"train_loss": -26.967145919799805, "global_step": 387939, "epoch": 4673} {"train_loss": -26.82122230529785, "global_step": 387940, "epoch": 4673} {"train_loss": -26.421220503657697, "global_step": 387941, "epoch": 4673, "val_loss": 6595035.0} {"train_loss": -26.327123641967773, "global_step": 387942, "epoch": 4674} {"train_loss": -26.325292587280273, "global_step": 387943, "epoch": 4674} {"train_loss": -26.09488296508789, "global_step": 387944, "epoch": 4674} {"train_loss": -25.86146354675293, "global_step": 387945, "epoch": 4674} {"train_loss": -25.772968292236328, "global_step": 387946, "epoch": 4674} {"train_loss": -26.6317195892334, "global_step": 387947, "epoch": 4674} {"train_loss": -26.241748809814453, "global_step": 387948, "epoch": 4674} {"train_loss": -26.228076934814453, "global_step": 387949, "epoch": 4674} {"train_loss": -26.1162166595459, "global_step": 387950, "epoch": 4674} {"train_loss": -25.94740104675293, "global_step": 387951, "epoch": 4674} {"train_loss": -26.50099754333496, "global_step": 387952, "epoch": 4674} {"train_loss": -26.023117065429688, "global_step": 387953, "epoch": 4674} {"train_loss": -26.333118438720703, "global_step": 387954, "epoch": 4674} {"train_loss": -26.228199005126953, "global_step": 387955, "epoch": 4674} {"train_loss": -26.3032283782959, "global_step": 387956, "epoch": 4674} {"train_loss": -25.918231964111328, "global_step": 387957, "epoch": 4674} {"train_loss": -26.559125900268555, "global_step": 387958, "epoch": 4674} {"train_loss": -26.535825729370117, "global_step": 387959, "epoch": 4674} {"train_loss": -26.329126358032227, "global_step": 387960, "epoch": 4674} {"train_loss": -26.195266723632812, "global_step": 387961, "epoch": 4674} {"train_loss": -25.857440948486328, "global_step": 387962, "epoch": 4674} {"train_loss": -26.2628116607666, "global_step": 387963, "epoch": 4674} {"train_loss": -26.157012939453125, "global_step": 387964, "epoch": 4674} {"train_loss": -26.49165153503418, "global_step": 387965, "epoch": 4674} {"train_loss": -26.223920822143555, "global_step": 387966, "epoch": 4674} {"train_loss": -26.219263076782227, "global_step": 387967, "epoch": 4674} {"train_loss": -26.50679588317871, "global_step": 387968, "epoch": 4674} {"train_loss": -26.441436767578125, "global_step": 387969, "epoch": 4674} {"train_loss": -26.494800567626953, "global_step": 387970, "epoch": 4674} {"train_loss": -26.210590362548828, "global_step": 387971, "epoch": 4674} {"train_loss": -26.57962989807129, "global_step": 387972, "epoch": 4674} {"train_loss": -26.55439567565918, "global_step": 387973, "epoch": 4674} {"train_loss": -26.623498916625977, "global_step": 387974, "epoch": 4674} {"train_loss": -26.342008590698242, "global_step": 387975, "epoch": 4674} {"train_loss": -26.37615394592285, "global_step": 387976, "epoch": 4674} {"train_loss": -26.408288955688477, "global_step": 387977, "epoch": 4674} {"train_loss": -26.272214889526367, "global_step": 387978, "epoch": 4674} {"train_loss": -26.500885009765625, "global_step": 387979, "epoch": 4674} {"train_loss": -26.733661651611328, "global_step": 387980, "epoch": 4674} {"train_loss": -26.911489486694336, "global_step": 387981, "epoch": 4674} {"train_loss": -26.624929428100586, "global_step": 387982, "epoch": 4674} {"train_loss": -26.628753662109375, "global_step": 387983, "epoch": 4674} {"train_loss": -26.486343383789062, "global_step": 387984, "epoch": 4674} {"train_loss": -27.156442642211914, "global_step": 387985, "epoch": 4674} {"train_loss": -26.315631866455078, "global_step": 387986, "epoch": 4674} {"train_loss": -26.512720108032227, "global_step": 387987, "epoch": 4674} {"train_loss": -26.643049240112305, "global_step": 387988, "epoch": 4674} {"train_loss": -26.128660202026367, "global_step": 387989, "epoch": 4674} {"train_loss": -26.27276611328125, "global_step": 387990, "epoch": 4674} {"train_loss": -26.393537521362305, "global_step": 387991, "epoch": 4674} {"train_loss": -26.6373233795166, "global_step": 387992, "epoch": 4674} {"train_loss": -26.701587677001953, "global_step": 387993, "epoch": 4674} {"train_loss": -26.876251220703125, "global_step": 387994, "epoch": 4674} {"train_loss": -26.649890899658203, "global_step": 387995, "epoch": 4674} {"train_loss": -26.374547958374023, "global_step": 387996, "epoch": 4674} {"train_loss": -26.155506134033203, "global_step": 387997, "epoch": 4674} {"train_loss": -26.589277267456055, "global_step": 387998, "epoch": 4674} {"train_loss": -26.548276901245117, "global_step": 387999, "epoch": 4674} {"train_loss": -26.375579833984375, "global_step": 388000, "epoch": 4674} {"train_loss": -26.371902465820312, "global_step": 388001, "epoch": 4674} {"train_loss": -26.272424697875977, "global_step": 388002, "epoch": 4674} {"train_loss": -26.62152671813965, "global_step": 388003, "epoch": 4674} {"train_loss": -26.23440933227539, "global_step": 388004, "epoch": 4674} {"train_loss": -26.737539291381836, "global_step": 388005, "epoch": 4674} {"train_loss": -26.50979995727539, "global_step": 388006, "epoch": 4674} {"train_loss": -26.417621612548828, "global_step": 388007, "epoch": 4674} {"train_loss": -26.583642959594727, "global_step": 388008, "epoch": 4674} {"train_loss": -26.66705894470215, "global_step": 388009, "epoch": 4674} {"train_loss": -26.740203857421875, "global_step": 388010, "epoch": 4674} {"train_loss": -26.490365982055664, "global_step": 388011, "epoch": 4674} {"train_loss": -26.560577392578125, "global_step": 388012, "epoch": 4674} {"train_loss": -26.692626953125, "global_step": 388013, "epoch": 4674} {"train_loss": -26.507160186767578, "global_step": 388014, "epoch": 4674} {"train_loss": -26.599517822265625, "global_step": 388015, "epoch": 4674} {"train_loss": -26.420087814331055, "global_step": 388016, "epoch": 4674} {"train_loss": -26.304702758789062, "global_step": 388017, "epoch": 4674} {"train_loss": -26.89630699157715, "global_step": 388018, "epoch": 4674} {"train_loss": -26.571531295776367, "global_step": 388019, "epoch": 4674} {"train_loss": -26.663715362548828, "global_step": 388020, "epoch": 4674} {"train_loss": -27.086292266845703, "global_step": 388021, "epoch": 4674} {"train_loss": -26.692747116088867, "global_step": 388022, "epoch": 4674} {"train_loss": -26.661081314086914, "global_step": 388023, "epoch": 4674} {"train_loss": -26.44028429238193, "global_step": 388024, "epoch": 4674, "val_loss": 6634340.0} {"train_loss": -26.2394962310791, "global_step": 388025, "epoch": 4675} {"train_loss": -25.445024490356445, "global_step": 388026, "epoch": 4675} {"train_loss": -25.673681259155273, "global_step": 388027, "epoch": 4675} {"train_loss": -25.864944458007812, "global_step": 388028, "epoch": 4675} {"train_loss": -26.14584732055664, "global_step": 388029, "epoch": 4675} {"train_loss": -26.357318878173828, "global_step": 388030, "epoch": 4675} {"train_loss": -26.1469783782959, "global_step": 388031, "epoch": 4675} {"train_loss": -26.361495971679688, "global_step": 388032, "epoch": 4675} {"train_loss": -26.211780548095703, "global_step": 388033, "epoch": 4675} {"train_loss": -26.3958740234375, "global_step": 388034, "epoch": 4675} {"train_loss": -26.095548629760742, "global_step": 388035, "epoch": 4675} {"train_loss": -26.735340118408203, "global_step": 388036, "epoch": 4675} {"train_loss": -26.639495849609375, "global_step": 388037, "epoch": 4675} {"train_loss": -26.345569610595703, "global_step": 388038, "epoch": 4675} {"train_loss": -26.29387855529785, "global_step": 388039, "epoch": 4675} {"train_loss": -26.452117919921875, "global_step": 388040, "epoch": 4675} {"train_loss": -26.33167839050293, "global_step": 388041, "epoch": 4675} {"train_loss": -26.3837833404541, "global_step": 388042, "epoch": 4675} {"train_loss": -26.283292770385742, "global_step": 388043, "epoch": 4675} {"train_loss": -26.3216609954834, "global_step": 388044, "epoch": 4675} {"train_loss": -26.560094833374023, "global_step": 388045, "epoch": 4675} {"train_loss": -26.442296981811523, "global_step": 388046, "epoch": 4675} {"train_loss": -26.377607345581055, "global_step": 388047, "epoch": 4675} {"train_loss": -26.287763595581055, "global_step": 388048, "epoch": 4675} {"train_loss": -26.843250274658203, "global_step": 388049, "epoch": 4675} {"train_loss": -26.284109115600586, "global_step": 388050, "epoch": 4675} {"train_loss": -26.595962524414062, "global_step": 388051, "epoch": 4675} {"train_loss": -26.69978904724121, "global_step": 388052, "epoch": 4675} {"train_loss": -26.73060417175293, "global_step": 388053, "epoch": 4675} {"train_loss": -26.592920303344727, "global_step": 388054, "epoch": 4675} {"train_loss": -26.805097579956055, "global_step": 388055, "epoch": 4675} {"train_loss": -26.660491943359375, "global_step": 388056, "epoch": 4675} {"train_loss": -26.4869441986084, "global_step": 388057, "epoch": 4675} {"train_loss": -26.47596549987793, "global_step": 388058, "epoch": 4675} {"train_loss": -26.37970542907715, "global_step": 388059, "epoch": 4675} {"train_loss": -26.595233917236328, "global_step": 388060, "epoch": 4675} {"train_loss": -26.447113037109375, "global_step": 388061, "epoch": 4675} {"train_loss": -26.934865951538086, "global_step": 388062, "epoch": 4675} {"train_loss": -26.635162353515625, "global_step": 388063, "epoch": 4675} {"train_loss": -26.541309356689453, "global_step": 388064, "epoch": 4675} {"train_loss": -25.90057945251465, "global_step": 388065, "epoch": 4675} {"train_loss": -25.435319900512695, "global_step": 388066, "epoch": 4675} {"train_loss": -25.68463706970215, "global_step": 388067, "epoch": 4675} {"train_loss": -26.515729904174805, "global_step": 388068, "epoch": 4675} {"train_loss": -26.694610595703125, "global_step": 388069, "epoch": 4675} {"train_loss": -25.810611724853516, "global_step": 388070, "epoch": 4675} {"train_loss": -26.406850814819336, "global_step": 388071, "epoch": 4675} {"train_loss": -26.316381454467773, "global_step": 388072, "epoch": 4675} {"train_loss": -26.172224044799805, "global_step": 388073, "epoch": 4675} {"train_loss": -26.85405921936035, "global_step": 388074, "epoch": 4675} {"train_loss": -26.466657638549805, "global_step": 388075, "epoch": 4675} {"train_loss": -26.692890167236328, "global_step": 388076, "epoch": 4675} {"train_loss": -26.880386352539062, "global_step": 388077, "epoch": 4675} {"train_loss": -26.472126007080078, "global_step": 388078, "epoch": 4675} {"train_loss": -26.508285522460938, "global_step": 388079, "epoch": 4675} {"train_loss": -26.117267608642578, "global_step": 388080, "epoch": 4675} {"train_loss": -25.942554473876953, "global_step": 388081, "epoch": 4675} {"train_loss": -26.112201690673828, "global_step": 388082, "epoch": 4675} {"train_loss": -26.40437126159668, "global_step": 388083, "epoch": 4675} {"train_loss": -26.3153133392334, "global_step": 388084, "epoch": 4675} {"train_loss": -25.929624557495117, "global_step": 388085, "epoch": 4675} {"train_loss": -25.920745849609375, "global_step": 388086, "epoch": 4675} {"train_loss": -26.079391479492188, "global_step": 388087, "epoch": 4675} {"train_loss": -26.112897872924805, "global_step": 388088, "epoch": 4675} {"train_loss": -26.267820358276367, "global_step": 388089, "epoch": 4675} {"train_loss": -25.981443405151367, "global_step": 388090, "epoch": 4675} {"train_loss": -26.468463897705078, "global_step": 388091, "epoch": 4675} {"train_loss": -26.652618408203125, "global_step": 388092, "epoch": 4675} {"train_loss": -26.53740882873535, "global_step": 388093, "epoch": 4675} {"train_loss": -26.347915649414062, "global_step": 388094, "epoch": 4675} {"train_loss": -26.011686325073242, "global_step": 388095, "epoch": 4675} {"train_loss": -26.573974609375, "global_step": 388096, "epoch": 4675} {"train_loss": -26.17131996154785, "global_step": 388097, "epoch": 4675} {"train_loss": -26.846607208251953, "global_step": 388098, "epoch": 4675} {"train_loss": -26.474853515625, "global_step": 388099, "epoch": 4675} {"train_loss": -26.712011337280273, "global_step": 388100, "epoch": 4675} {"train_loss": -26.31194496154785, "global_step": 388101, "epoch": 4675} {"train_loss": -26.587533950805664, "global_step": 388102, "epoch": 4675} {"train_loss": -26.31318473815918, "global_step": 388103, "epoch": 4675} {"train_loss": -26.763614654541016, "global_step": 388104, "epoch": 4675} {"train_loss": -26.608091354370117, "global_step": 388105, "epoch": 4675} {"train_loss": -26.686674118041992, "global_step": 388106, "epoch": 4675} {"train_loss": -26.38764631891825, "global_step": 388107, "epoch": 4675, "val_loss": 6628906.0} {"train_loss": -26.379682540893555, "global_step": 388108, "epoch": 4676} {"train_loss": -26.097925186157227, "global_step": 388109, "epoch": 4676} {"train_loss": -26.603378295898438, "global_step": 388110, "epoch": 4676} {"train_loss": -26.630773544311523, "global_step": 388111, "epoch": 4676} {"train_loss": -26.176382064819336, "global_step": 388112, "epoch": 4676} {"train_loss": -26.3460636138916, "global_step": 388113, "epoch": 4676} {"train_loss": -26.270923614501953, "global_step": 388114, "epoch": 4676} {"train_loss": -26.619089126586914, "global_step": 388115, "epoch": 4676} {"train_loss": -26.364782333374023, "global_step": 388116, "epoch": 4676} {"train_loss": -26.396265029907227, "global_step": 388117, "epoch": 4676} {"train_loss": -26.148956298828125, "global_step": 388118, "epoch": 4676} {"train_loss": -26.374231338500977, "global_step": 388119, "epoch": 4676} {"train_loss": -26.543115615844727, "global_step": 388120, "epoch": 4676} {"train_loss": -26.915510177612305, "global_step": 388121, "epoch": 4676} {"train_loss": -26.82554054260254, "global_step": 388122, "epoch": 4676} {"train_loss": -26.443830490112305, "global_step": 388123, "epoch": 4676} {"train_loss": -26.552734375, "global_step": 388124, "epoch": 4676} {"train_loss": -26.46982765197754, "global_step": 388125, "epoch": 4676} {"train_loss": -26.9199275970459, "global_step": 388126, "epoch": 4676} {"train_loss": -26.275440216064453, "global_step": 388127, "epoch": 4676} {"train_loss": -26.630529403686523, "global_step": 388128, "epoch": 4676} {"train_loss": -26.600378036499023, "global_step": 388129, "epoch": 4676} {"train_loss": -26.28598403930664, "global_step": 388130, "epoch": 4676} {"train_loss": -26.840299606323242, "global_step": 388131, "epoch": 4676} {"train_loss": -26.377050399780273, "global_step": 388132, "epoch": 4676} {"train_loss": -26.522546768188477, "global_step": 388133, "epoch": 4676} {"train_loss": -25.79449462890625, "global_step": 388134, "epoch": 4676} {"train_loss": -26.4166316986084, "global_step": 388135, "epoch": 4676} {"train_loss": -26.387067794799805, "global_step": 388136, "epoch": 4676} {"train_loss": -26.82155418395996, "global_step": 388137, "epoch": 4676} {"train_loss": -25.963544845581055, "global_step": 388138, "epoch": 4676} {"train_loss": -26.52686882019043, "global_step": 388139, "epoch": 4676} {"train_loss": -26.63559341430664, "global_step": 388140, "epoch": 4676} {"train_loss": -26.916418075561523, "global_step": 388141, "epoch": 4676} {"train_loss": -26.870908737182617, "global_step": 388142, "epoch": 4676} {"train_loss": -26.85378074645996, "global_step": 388143, "epoch": 4676} {"train_loss": -26.9114933013916, "global_step": 388144, "epoch": 4676} {"train_loss": -26.512765884399414, "global_step": 388145, "epoch": 4676} {"train_loss": -25.956876754760742, "global_step": 388146, "epoch": 4676} {"train_loss": -26.651752471923828, "global_step": 388147, "epoch": 4676} {"train_loss": -26.87639808654785, "global_step": 388148, "epoch": 4676} {"train_loss": -26.4505558013916, "global_step": 388149, "epoch": 4676} {"train_loss": -26.401432037353516, "global_step": 388150, "epoch": 4676} {"train_loss": -26.079483032226562, "global_step": 388151, "epoch": 4676} {"train_loss": -26.171506881713867, "global_step": 388152, "epoch": 4676} {"train_loss": -26.317346572875977, "global_step": 388153, "epoch": 4676} {"train_loss": -26.616697311401367, "global_step": 388154, "epoch": 4676} {"train_loss": -26.442768096923828, "global_step": 388155, "epoch": 4676} {"train_loss": -26.563074111938477, "global_step": 388156, "epoch": 4676} {"train_loss": -26.310754776000977, "global_step": 388157, "epoch": 4676} {"train_loss": -26.476057052612305, "global_step": 388158, "epoch": 4676} {"train_loss": -26.141996383666992, "global_step": 388159, "epoch": 4676} {"train_loss": -26.5006046295166, "global_step": 388160, "epoch": 4676} {"train_loss": -26.3795223236084, "global_step": 388161, "epoch": 4676} {"train_loss": -26.484405517578125, "global_step": 388162, "epoch": 4676} {"train_loss": -26.714441299438477, "global_step": 388163, "epoch": 4676} {"train_loss": -26.6496524810791, "global_step": 388164, "epoch": 4676} {"train_loss": -26.552846908569336, "global_step": 388165, "epoch": 4676} {"train_loss": -26.547330856323242, "global_step": 388166, "epoch": 4676} {"train_loss": -26.674177169799805, "global_step": 388167, "epoch": 4676} {"train_loss": -26.452184677124023, "global_step": 388168, "epoch": 4676} {"train_loss": -26.469675064086914, "global_step": 388169, "epoch": 4676} {"train_loss": -26.722427368164062, "global_step": 388170, "epoch": 4676} {"train_loss": -26.814664840698242, "global_step": 388171, "epoch": 4676} {"train_loss": -26.925928115844727, "global_step": 388172, "epoch": 4676} {"train_loss": -26.42437171936035, "global_step": 388173, "epoch": 4676} {"train_loss": -26.658838272094727, "global_step": 388174, "epoch": 4676} {"train_loss": -27.032175064086914, "global_step": 388175, "epoch": 4676} {"train_loss": -26.361902236938477, "global_step": 388176, "epoch": 4676} {"train_loss": -26.80059814453125, "global_step": 388177, "epoch": 4676} {"train_loss": -26.601917266845703, "global_step": 388178, "epoch": 4676} {"train_loss": -26.336029052734375, "global_step": 388179, "epoch": 4676} {"train_loss": -26.8613224029541, "global_step": 388180, "epoch": 4676} {"train_loss": -26.674131393432617, "global_step": 388181, "epoch": 4676} {"train_loss": -26.776351928710938, "global_step": 388182, "epoch": 4676} {"train_loss": -26.80866050720215, "global_step": 388183, "epoch": 4676} {"train_loss": -26.504159927368164, "global_step": 388184, "epoch": 4676} {"train_loss": -26.751148223876953, "global_step": 388185, "epoch": 4676} {"train_loss": -26.86112403869629, "global_step": 388186, "epoch": 4676} {"train_loss": -26.64508056640625, "global_step": 388187, "epoch": 4676} {"train_loss": -26.637165069580078, "global_step": 388188, "epoch": 4676} {"train_loss": -26.508386611938477, "global_step": 388189, "epoch": 4676} {"train_loss": -26.5231647031853, "global_step": 388190, "epoch": 4676, "val_loss": 6589781.0} {"train_loss": -25.3580322265625, "global_step": 388191, "epoch": 4677} {"train_loss": -25.35902214050293, "global_step": 388192, "epoch": 4677} {"train_loss": -24.954805374145508, "global_step": 388193, "epoch": 4677} {"train_loss": -25.822580337524414, "global_step": 388194, "epoch": 4677} {"train_loss": -25.69635581970215, "global_step": 388195, "epoch": 4677} {"train_loss": -25.51708221435547, "global_step": 388196, "epoch": 4677} {"train_loss": -25.789764404296875, "global_step": 388197, "epoch": 4677} {"train_loss": -25.37232780456543, "global_step": 388198, "epoch": 4677} {"train_loss": -26.222997665405273, "global_step": 388199, "epoch": 4677} {"train_loss": -25.43632698059082, "global_step": 388200, "epoch": 4677} {"train_loss": -25.85434341430664, "global_step": 388201, "epoch": 4677} {"train_loss": -25.849170684814453, "global_step": 388202, "epoch": 4677} {"train_loss": -26.04184913635254, "global_step": 388203, "epoch": 4677} {"train_loss": -25.972457885742188, "global_step": 388204, "epoch": 4677} {"train_loss": -26.083393096923828, "global_step": 388205, "epoch": 4677} {"train_loss": -26.328893661499023, "global_step": 388206, "epoch": 4677} {"train_loss": -25.906869888305664, "global_step": 388207, "epoch": 4677} {"train_loss": -26.13715934753418, "global_step": 388208, "epoch": 4677} {"train_loss": -26.148221969604492, "global_step": 388209, "epoch": 4677} {"train_loss": -26.393518447875977, "global_step": 388210, "epoch": 4677} {"train_loss": -25.998926162719727, "global_step": 388211, "epoch": 4677} {"train_loss": -26.117612838745117, "global_step": 388212, "epoch": 4677} {"train_loss": -26.20081901550293, "global_step": 388213, "epoch": 4677} {"train_loss": -26.200088500976562, "global_step": 388214, "epoch": 4677} {"train_loss": -26.366653442382812, "global_step": 388215, "epoch": 4677} {"train_loss": -26.569660186767578, "global_step": 388216, "epoch": 4677} {"train_loss": -26.2054386138916, "global_step": 388217, "epoch": 4677} {"train_loss": -26.081653594970703, "global_step": 388218, "epoch": 4677} {"train_loss": -26.359699249267578, "global_step": 388219, "epoch": 4677} {"train_loss": -26.2939453125, "global_step": 388220, "epoch": 4677} {"train_loss": -25.93985939025879, "global_step": 388221, "epoch": 4677} {"train_loss": -26.680419921875, "global_step": 388222, "epoch": 4677} {"train_loss": -26.747116088867188, "global_step": 388223, "epoch": 4677} {"train_loss": -26.308307647705078, "global_step": 388224, "epoch": 4677} {"train_loss": -26.4951171875, "global_step": 388225, "epoch": 4677} {"train_loss": -26.66998291015625, "global_step": 388226, "epoch": 4677} {"train_loss": -26.551294326782227, "global_step": 388227, "epoch": 4677} {"train_loss": -26.678558349609375, "global_step": 388228, "epoch": 4677} {"train_loss": -26.718412399291992, "global_step": 388229, "epoch": 4677} {"train_loss": -26.53228187561035, "global_step": 388230, "epoch": 4677} {"train_loss": -26.572439193725586, "global_step": 388231, "epoch": 4677} {"train_loss": -26.766523361206055, "global_step": 388232, "epoch": 4677} {"train_loss": -26.63429832458496, "global_step": 388233, "epoch": 4677} {"train_loss": -26.51445960998535, "global_step": 388234, "epoch": 4677} {"train_loss": -26.3577938079834, "global_step": 388235, "epoch": 4677} {"train_loss": -26.55243492126465, "global_step": 388236, "epoch": 4677} {"train_loss": -26.774200439453125, "global_step": 388237, "epoch": 4677} {"train_loss": -26.52992820739746, "global_step": 388238, "epoch": 4677} {"train_loss": -26.431787490844727, "global_step": 388239, "epoch": 4677} {"train_loss": -26.671741485595703, "global_step": 388240, "epoch": 4677} {"train_loss": -26.15559196472168, "global_step": 388241, "epoch": 4677} {"train_loss": -26.519519805908203, "global_step": 388242, "epoch": 4677} {"train_loss": -26.30126953125, "global_step": 388243, "epoch": 4677} {"train_loss": -26.8154296875, "global_step": 388244, "epoch": 4677} {"train_loss": -25.77176856994629, "global_step": 388245, "epoch": 4677} {"train_loss": -26.6229305267334, "global_step": 388246, "epoch": 4677} {"train_loss": -26.338958740234375, "global_step": 388247, "epoch": 4677} {"train_loss": -26.062788009643555, "global_step": 388248, "epoch": 4677} {"train_loss": -26.23020362854004, "global_step": 388249, "epoch": 4677} {"train_loss": -25.977741241455078, "global_step": 388250, "epoch": 4677} {"train_loss": -25.793445587158203, "global_step": 388251, "epoch": 4677} {"train_loss": -24.892765045166016, "global_step": 388252, "epoch": 4677} {"train_loss": -25.541616439819336, "global_step": 388253, "epoch": 4677} {"train_loss": -25.24041175842285, "global_step": 388254, "epoch": 4677} {"train_loss": -25.52911949157715, "global_step": 388255, "epoch": 4677} {"train_loss": -26.096166610717773, "global_step": 388256, "epoch": 4677} {"train_loss": -25.238401412963867, "global_step": 388257, "epoch": 4677} {"train_loss": -25.79585838317871, "global_step": 388258, "epoch": 4677} {"train_loss": -25.699792861938477, "global_step": 388259, "epoch": 4677} {"train_loss": -25.891271591186523, "global_step": 388260, "epoch": 4677} {"train_loss": -26.034332275390625, "global_step": 388261, "epoch": 4677} {"train_loss": -25.850605010986328, "global_step": 388262, "epoch": 4677} {"train_loss": -25.932249069213867, "global_step": 388263, "epoch": 4677} {"train_loss": -26.102039337158203, "global_step": 388264, "epoch": 4677} {"train_loss": -26.083555221557617, "global_step": 388265, "epoch": 4677} {"train_loss": -26.19080924987793, "global_step": 388266, "epoch": 4677} {"train_loss": -26.05303955078125, "global_step": 388267, "epoch": 4677} {"train_loss": -26.143768310546875, "global_step": 388268, "epoch": 4677} {"train_loss": -26.416162490844727, "global_step": 388269, "epoch": 4677} {"train_loss": -26.561120986938477, "global_step": 388270, "epoch": 4677} {"train_loss": -25.9851016998291, "global_step": 388271, "epoch": 4677} {"train_loss": -26.31439781188965, "global_step": 388272, "epoch": 4677} {"train_loss": -26.122884796326417, "global_step": 388273, "epoch": 4677, "val_loss": 6555959.0} {"train_loss": -26.342512130737305, "global_step": 388274, "epoch": 4678} {"train_loss": -25.962804794311523, "global_step": 388275, "epoch": 4678} {"train_loss": -26.0146427154541, "global_step": 388276, "epoch": 4678} {"train_loss": -26.018890380859375, "global_step": 388277, "epoch": 4678} {"train_loss": -26.17056655883789, "global_step": 388278, "epoch": 4678} {"train_loss": -26.4274959564209, "global_step": 388279, "epoch": 4678} {"train_loss": -26.672088623046875, "global_step": 388280, "epoch": 4678} {"train_loss": -26.367938995361328, "global_step": 388281, "epoch": 4678} {"train_loss": -26.183685302734375, "global_step": 388282, "epoch": 4678} {"train_loss": -26.33485221862793, "global_step": 388283, "epoch": 4678} {"train_loss": -26.286191940307617, "global_step": 388284, "epoch": 4678} {"train_loss": -25.9731502532959, "global_step": 388285, "epoch": 4678} {"train_loss": -26.219465255737305, "global_step": 388286, "epoch": 4678} {"train_loss": -26.370397567749023, "global_step": 388287, "epoch": 4678} {"train_loss": -26.279083251953125, "global_step": 388288, "epoch": 4678} {"train_loss": -26.402318954467773, "global_step": 388289, "epoch": 4678} {"train_loss": -26.68484878540039, "global_step": 388290, "epoch": 4678} {"train_loss": -26.514179229736328, "global_step": 388291, "epoch": 4678} {"train_loss": -26.451284408569336, "global_step": 388292, "epoch": 4678} {"train_loss": -26.696014404296875, "global_step": 388293, "epoch": 4678} {"train_loss": -26.27097511291504, "global_step": 388294, "epoch": 4678} {"train_loss": -26.593353271484375, "global_step": 388295, "epoch": 4678} {"train_loss": -26.584320068359375, "global_step": 388296, "epoch": 4678} {"train_loss": -26.52968406677246, "global_step": 388297, "epoch": 4678} {"train_loss": -26.456811904907227, "global_step": 388298, "epoch": 4678} {"train_loss": -26.896081924438477, "global_step": 388299, "epoch": 4678} {"train_loss": -26.85996437072754, "global_step": 388300, "epoch": 4678} {"train_loss": -26.689533233642578, "global_step": 388301, "epoch": 4678} {"train_loss": -26.219099044799805, "global_step": 388302, "epoch": 4678} {"train_loss": -26.377939224243164, "global_step": 388303, "epoch": 4678} {"train_loss": -26.584259033203125, "global_step": 388304, "epoch": 4678} {"train_loss": -26.641067504882812, "global_step": 388305, "epoch": 4678} {"train_loss": -26.91204261779785, "global_step": 388306, "epoch": 4678} {"train_loss": -26.65620231628418, "global_step": 388307, "epoch": 4678} {"train_loss": -26.863391876220703, "global_step": 388308, "epoch": 4678} {"train_loss": -26.700489044189453, "global_step": 388309, "epoch": 4678} {"train_loss": -26.8260440826416, "global_step": 388310, "epoch": 4678} {"train_loss": -26.794973373413086, "global_step": 388311, "epoch": 4678} {"train_loss": -26.804723739624023, "global_step": 388312, "epoch": 4678} {"train_loss": -26.787734985351562, "global_step": 388313, "epoch": 4678} {"train_loss": -26.6826114654541, "global_step": 388314, "epoch": 4678} {"train_loss": -26.095678329467773, "global_step": 388315, "epoch": 4678} {"train_loss": -26.409093856811523, "global_step": 388316, "epoch": 4678} {"train_loss": -26.841535568237305, "global_step": 388317, "epoch": 4678} {"train_loss": -26.828222274780273, "global_step": 388318, "epoch": 4678} {"train_loss": -26.708356857299805, "global_step": 388319, "epoch": 4678} {"train_loss": -26.552154541015625, "global_step": 388320, "epoch": 4678} {"train_loss": -26.72541618347168, "global_step": 388321, "epoch": 4678} {"train_loss": -26.319610595703125, "global_step": 388322, "epoch": 4678} {"train_loss": -26.62848472595215, "global_step": 388323, "epoch": 4678} {"train_loss": -26.42371940612793, "global_step": 388324, "epoch": 4678} {"train_loss": -26.319049835205078, "global_step": 388325, "epoch": 4678} {"train_loss": -26.308252334594727, "global_step": 388326, "epoch": 4678} {"train_loss": -26.650976181030273, "global_step": 388327, "epoch": 4678} {"train_loss": -26.54302406311035, "global_step": 388328, "epoch": 4678} {"train_loss": -26.351667404174805, "global_step": 388329, "epoch": 4678} {"train_loss": -26.478071212768555, "global_step": 388330, "epoch": 4678} {"train_loss": -27.22977066040039, "global_step": 388331, "epoch": 4678} {"train_loss": -26.286701202392578, "global_step": 388332, "epoch": 4678} {"train_loss": -26.547164916992188, "global_step": 388333, "epoch": 4678} {"train_loss": -26.402563095092773, "global_step": 388334, "epoch": 4678} {"train_loss": -26.348196029663086, "global_step": 388335, "epoch": 4678} {"train_loss": -26.6715087890625, "global_step": 388336, "epoch": 4678} {"train_loss": -26.848730087280273, "global_step": 388337, "epoch": 4678} {"train_loss": -26.49798583984375, "global_step": 388338, "epoch": 4678} {"train_loss": -26.471094131469727, "global_step": 388339, "epoch": 4678} {"train_loss": -26.8071346282959, "global_step": 388340, "epoch": 4678} {"train_loss": -26.75201416015625, "global_step": 388341, "epoch": 4678} {"train_loss": -26.806018829345703, "global_step": 388342, "epoch": 4678} {"train_loss": -26.654027938842773, "global_step": 388343, "epoch": 4678} {"train_loss": -26.32952308654785, "global_step": 388344, "epoch": 4678} {"train_loss": -27.053485870361328, "global_step": 388345, "epoch": 4678} {"train_loss": -26.819250106811523, "global_step": 388346, "epoch": 4678} {"train_loss": -26.41385841369629, "global_step": 388347, "epoch": 4678} {"train_loss": -26.460556030273438, "global_step": 388348, "epoch": 4678} {"train_loss": -26.681066513061523, "global_step": 388349, "epoch": 4678} {"train_loss": -26.927804946899414, "global_step": 388350, "epoch": 4678} {"train_loss": -26.559656143188477, "global_step": 388351, "epoch": 4678} {"train_loss": -26.417905807495117, "global_step": 388352, "epoch": 4678} {"train_loss": -26.33723258972168, "global_step": 388353, "epoch": 4678} {"train_loss": -26.380578994750977, "global_step": 388354, "epoch": 4678} {"train_loss": -26.581344604492188, "global_step": 388355, "epoch": 4678} {"train_loss": -26.5258038302502, "global_step": 388356, "epoch": 4678, "val_loss": 6638117.0} {"train_loss": -25.671161651611328, "global_step": 388357, "epoch": 4679} {"train_loss": -25.620532989501953, "global_step": 388358, "epoch": 4679} {"train_loss": -26.223114013671875, "global_step": 388359, "epoch": 4679} {"train_loss": -26.0042724609375, "global_step": 388360, "epoch": 4679} {"train_loss": -26.037267684936523, "global_step": 388361, "epoch": 4679} {"train_loss": -25.93817138671875, "global_step": 388362, "epoch": 4679} {"train_loss": -26.166345596313477, "global_step": 388363, "epoch": 4679} {"train_loss": -26.161853790283203, "global_step": 388364, "epoch": 4679} {"train_loss": -25.83161735534668, "global_step": 388365, "epoch": 4679} {"train_loss": -26.502777099609375, "global_step": 388366, "epoch": 4679} {"train_loss": -26.128488540649414, "global_step": 388367, "epoch": 4679} {"train_loss": -26.295949935913086, "global_step": 388368, "epoch": 4679} {"train_loss": -26.2005558013916, "global_step": 388369, "epoch": 4679} {"train_loss": -26.00797462463379, "global_step": 388370, "epoch": 4679} {"train_loss": -26.519657135009766, "global_step": 388371, "epoch": 4679} {"train_loss": -26.504064559936523, "global_step": 388372, "epoch": 4679} {"train_loss": -26.408313751220703, "global_step": 388373, "epoch": 4679} {"train_loss": -26.49346923828125, "global_step": 388374, "epoch": 4679} {"train_loss": -26.458072662353516, "global_step": 388375, "epoch": 4679} {"train_loss": -26.267913818359375, "global_step": 388376, "epoch": 4679} {"train_loss": -26.136205673217773, "global_step": 388377, "epoch": 4679} {"train_loss": -26.82953453063965, "global_step": 388378, "epoch": 4679} {"train_loss": -26.570331573486328, "global_step": 388379, "epoch": 4679} {"train_loss": -26.598257064819336, "global_step": 388380, "epoch": 4679} {"train_loss": -26.1578311920166, "global_step": 388381, "epoch": 4679} {"train_loss": -26.2473087310791, "global_step": 388382, "epoch": 4679} {"train_loss": -26.471338272094727, "global_step": 388383, "epoch": 4679} {"train_loss": -26.43157958984375, "global_step": 388384, "epoch": 4679} {"train_loss": -26.64118766784668, "global_step": 388385, "epoch": 4679} {"train_loss": -26.483545303344727, "global_step": 388386, "epoch": 4679} {"train_loss": -26.773212432861328, "global_step": 388387, "epoch": 4679} {"train_loss": -26.88495445251465, "global_step": 388388, "epoch": 4679} {"train_loss": -26.522424697875977, "global_step": 388389, "epoch": 4679} {"train_loss": -26.263391494750977, "global_step": 388390, "epoch": 4679} {"train_loss": -26.8082275390625, "global_step": 388391, "epoch": 4679} {"train_loss": -27.017919540405273, "global_step": 388392, "epoch": 4679} {"train_loss": -26.71870994567871, "global_step": 388393, "epoch": 4679} {"train_loss": -26.7457218170166, "global_step": 388394, "epoch": 4679} {"train_loss": -26.3038272857666, "global_step": 388395, "epoch": 4679} {"train_loss": -26.070581436157227, "global_step": 388396, "epoch": 4679} {"train_loss": -25.788358688354492, "global_step": 388397, "epoch": 4679} {"train_loss": -25.569950103759766, "global_step": 388398, "epoch": 4679} {"train_loss": -26.339811325073242, "global_step": 388399, "epoch": 4679} {"train_loss": -25.970138549804688, "global_step": 388400, "epoch": 4679} {"train_loss": -26.391895294189453, "global_step": 388401, "epoch": 4679} {"train_loss": -26.49102783203125, "global_step": 388402, "epoch": 4679} {"train_loss": -26.245838165283203, "global_step": 388403, "epoch": 4679} {"train_loss": -26.518259048461914, "global_step": 388404, "epoch": 4679} {"train_loss": -26.25117301940918, "global_step": 388405, "epoch": 4679} {"train_loss": -26.243314743041992, "global_step": 388406, "epoch": 4679} {"train_loss": -26.0565128326416, "global_step": 388407, "epoch": 4679} {"train_loss": -26.65199089050293, "global_step": 388408, "epoch": 4679} {"train_loss": -26.5557861328125, "global_step": 388409, "epoch": 4679} {"train_loss": -26.475378036499023, "global_step": 388410, "epoch": 4679} {"train_loss": -26.21747398376465, "global_step": 388411, "epoch": 4679} {"train_loss": -26.06361198425293, "global_step": 388412, "epoch": 4679} {"train_loss": -26.248825073242188, "global_step": 388413, "epoch": 4679} {"train_loss": -26.65778160095215, "global_step": 388414, "epoch": 4679} {"train_loss": -26.507604598999023, "global_step": 388415, "epoch": 4679} {"train_loss": -26.202672958374023, "global_step": 388416, "epoch": 4679} {"train_loss": -25.904800415039062, "global_step": 388417, "epoch": 4679} {"train_loss": -26.220441818237305, "global_step": 388418, "epoch": 4679} {"train_loss": -26.358722686767578, "global_step": 388419, "epoch": 4679} {"train_loss": -26.1838436126709, "global_step": 388420, "epoch": 4679} {"train_loss": -26.249006271362305, "global_step": 388421, "epoch": 4679} {"train_loss": -26.446298599243164, "global_step": 388422, "epoch": 4679} {"train_loss": -26.606718063354492, "global_step": 388423, "epoch": 4679} {"train_loss": -26.59413719177246, "global_step": 388424, "epoch": 4679} {"train_loss": -26.612207412719727, "global_step": 388425, "epoch": 4679} {"train_loss": -26.378646850585938, "global_step": 388426, "epoch": 4679} {"train_loss": -26.552045822143555, "global_step": 388427, "epoch": 4679} {"train_loss": -26.36819839477539, "global_step": 388428, "epoch": 4679} {"train_loss": -26.614561080932617, "global_step": 388429, "epoch": 4679} {"train_loss": -26.54422378540039, "global_step": 388430, "epoch": 4679} {"train_loss": -26.651391983032227, "global_step": 388431, "epoch": 4679} {"train_loss": -26.5932559967041, "global_step": 388432, "epoch": 4679} {"train_loss": -26.47028160095215, "global_step": 388433, "epoch": 4679} {"train_loss": -27.070219039916992, "global_step": 388434, "epoch": 4679} {"train_loss": -27.107202529907227, "global_step": 388435, "epoch": 4679} {"train_loss": -26.63397789001465, "global_step": 388436, "epoch": 4679} {"train_loss": -27.109113693237305, "global_step": 388437, "epoch": 4679} {"train_loss": -26.571081161499023, "global_step": 388438, "epoch": 4679} {"train_loss": -26.387955608138117, "global_step": 388439, "epoch": 4679, "val_loss": 6567200.0} {"train_loss": -26.614044189453125, "global_step": 388440, "epoch": 4680} {"train_loss": -26.335418701171875, "global_step": 388441, "epoch": 4680} {"train_loss": -26.2441349029541, "global_step": 388442, "epoch": 4680} {"train_loss": -26.57063102722168, "global_step": 388443, "epoch": 4680} {"train_loss": -26.330188751220703, "global_step": 388444, "epoch": 4680} {"train_loss": -26.344907760620117, "global_step": 388445, "epoch": 4680} {"train_loss": -25.94170570373535, "global_step": 388446, "epoch": 4680} {"train_loss": -26.30181312561035, "global_step": 388447, "epoch": 4680} {"train_loss": -26.744699478149414, "global_step": 388448, "epoch": 4680} {"train_loss": -26.42825698852539, "global_step": 388449, "epoch": 4680} {"train_loss": -26.190900802612305, "global_step": 388450, "epoch": 4680} {"train_loss": -26.27691650390625, "global_step": 388451, "epoch": 4680} {"train_loss": -26.313739776611328, "global_step": 388452, "epoch": 4680} {"train_loss": -26.345306396484375, "global_step": 388453, "epoch": 4680} {"train_loss": -26.200241088867188, "global_step": 388454, "epoch": 4680} {"train_loss": -26.34891700744629, "global_step": 388455, "epoch": 4680} {"train_loss": -26.526824951171875, "global_step": 388456, "epoch": 4680} {"train_loss": -26.1079044342041, "global_step": 388457, "epoch": 4680} {"train_loss": -26.14936637878418, "global_step": 388458, "epoch": 4680} {"train_loss": -26.556928634643555, "global_step": 388459, "epoch": 4680} {"train_loss": -26.360883712768555, "global_step": 388460, "epoch": 4680} {"train_loss": -26.600290298461914, "global_step": 388461, "epoch": 4680} {"train_loss": -26.455554962158203, "global_step": 388462, "epoch": 4680} {"train_loss": -26.4462890625, "global_step": 388463, "epoch": 4680} {"train_loss": -26.211557388305664, "global_step": 388464, "epoch": 4680} {"train_loss": -26.2159423828125, "global_step": 388465, "epoch": 4680} {"train_loss": -26.751218795776367, "global_step": 388466, "epoch": 4680} {"train_loss": -26.294635772705078, "global_step": 388467, "epoch": 4680} {"train_loss": -26.2778377532959, "global_step": 388468, "epoch": 4680} {"train_loss": -26.121206283569336, "global_step": 388469, "epoch": 4680} {"train_loss": -26.145109176635742, "global_step": 388470, "epoch": 4680} {"train_loss": -26.727025985717773, "global_step": 388471, "epoch": 4680} {"train_loss": -26.247150421142578, "global_step": 388472, "epoch": 4680} {"train_loss": -26.698392868041992, "global_step": 388473, "epoch": 4680} {"train_loss": -26.445087432861328, "global_step": 388474, "epoch": 4680} {"train_loss": -26.675500869750977, "global_step": 388475, "epoch": 4680} {"train_loss": -26.548925399780273, "global_step": 388476, "epoch": 4680} {"train_loss": -26.458654403686523, "global_step": 388477, "epoch": 4680} {"train_loss": -26.481794357299805, "global_step": 388478, "epoch": 4680} {"train_loss": -26.414093017578125, "global_step": 388479, "epoch": 4680} {"train_loss": -26.6983642578125, "global_step": 388480, "epoch": 4680} {"train_loss": -26.74570083618164, "global_step": 388481, "epoch": 4680} {"train_loss": -26.353260040283203, "global_step": 388482, "epoch": 4680} {"train_loss": -26.163715362548828, "global_step": 388483, "epoch": 4680} {"train_loss": -26.31218910217285, "global_step": 388484, "epoch": 4680} {"train_loss": -26.341781616210938, "global_step": 388485, "epoch": 4680} {"train_loss": -25.718420028686523, "global_step": 388486, "epoch": 4680} {"train_loss": -26.00946617126465, "global_step": 388487, "epoch": 4680} {"train_loss": -26.513940811157227, "global_step": 388488, "epoch": 4680} {"train_loss": -25.92717933654785, "global_step": 388489, "epoch": 4680} {"train_loss": -25.95967674255371, "global_step": 388490, "epoch": 4680} {"train_loss": -26.060468673706055, "global_step": 388491, "epoch": 4680} {"train_loss": -26.308324813842773, "global_step": 388492, "epoch": 4680} {"train_loss": -25.880661010742188, "global_step": 388493, "epoch": 4680} {"train_loss": -26.011127471923828, "global_step": 388494, "epoch": 4680} {"train_loss": -26.06036949157715, "global_step": 388495, "epoch": 4680} {"train_loss": -26.590972900390625, "global_step": 388496, "epoch": 4680} {"train_loss": -26.19190788269043, "global_step": 388497, "epoch": 4680} {"train_loss": -26.31886863708496, "global_step": 388498, "epoch": 4680} {"train_loss": -26.07771110534668, "global_step": 388499, "epoch": 4680} {"train_loss": -26.2047061920166, "global_step": 388500, "epoch": 4680} {"train_loss": -26.62981605529785, "global_step": 388501, "epoch": 4680} {"train_loss": -26.49554443359375, "global_step": 388502, "epoch": 4680} {"train_loss": -26.67648696899414, "global_step": 388503, "epoch": 4680} {"train_loss": -26.5677547454834, "global_step": 388504, "epoch": 4680} {"train_loss": -26.632680892944336, "global_step": 388505, "epoch": 4680} {"train_loss": -26.610334396362305, "global_step": 388506, "epoch": 4680} {"train_loss": -26.09600830078125, "global_step": 388507, "epoch": 4680} {"train_loss": -26.552886962890625, "global_step": 388508, "epoch": 4680} {"train_loss": -26.503992080688477, "global_step": 388509, "epoch": 4680} {"train_loss": -26.594526290893555, "global_step": 388510, "epoch": 4680} {"train_loss": -26.33771324157715, "global_step": 388511, "epoch": 4680} {"train_loss": -26.399667739868164, "global_step": 388512, "epoch": 4680} {"train_loss": -26.33692741394043, "global_step": 388513, "epoch": 4680} {"train_loss": -26.72662925720215, "global_step": 388514, "epoch": 4680} {"train_loss": -26.535207748413086, "global_step": 388515, "epoch": 4680} {"train_loss": -26.501117706298828, "global_step": 388516, "epoch": 4680} {"train_loss": -26.598712921142578, "global_step": 388517, "epoch": 4680} {"train_loss": -26.734907150268555, "global_step": 388518, "epoch": 4680} {"train_loss": -27.007892608642578, "global_step": 388519, "epoch": 4680} {"train_loss": -26.421186447143555, "global_step": 388520, "epoch": 4680} {"train_loss": -26.486616134643555, "global_step": 388521, "epoch": 4680} {"train_loss": -26.388908937752966, "global_step": 388522, "epoch": 4680, "val_loss": 6534572.5} {"train_loss": -25.853805541992188, "global_step": 388523, "epoch": 4681} {"train_loss": -25.614927291870117, "global_step": 388524, "epoch": 4681} {"train_loss": -26.034564971923828, "global_step": 388525, "epoch": 4681} {"train_loss": -26.623083114624023, "global_step": 388526, "epoch": 4681} {"train_loss": -26.241153717041016, "global_step": 388527, "epoch": 4681} {"train_loss": -26.161298751831055, "global_step": 388528, "epoch": 4681} {"train_loss": -26.242399215698242, "global_step": 388529, "epoch": 4681} {"train_loss": -26.22265625, "global_step": 388530, "epoch": 4681} {"train_loss": -26.430334091186523, "global_step": 388531, "epoch": 4681} {"train_loss": -26.511981964111328, "global_step": 388532, "epoch": 4681} {"train_loss": -26.3314208984375, "global_step": 388533, "epoch": 4681} {"train_loss": -26.487598419189453, "global_step": 388534, "epoch": 4681} {"train_loss": -26.516721725463867, "global_step": 388535, "epoch": 4681} {"train_loss": -26.295270919799805, "global_step": 388536, "epoch": 4681} {"train_loss": -25.494281768798828, "global_step": 388537, "epoch": 4681} {"train_loss": -25.931243896484375, "global_step": 388538, "epoch": 4681} {"train_loss": -26.62946891784668, "global_step": 388539, "epoch": 4681} {"train_loss": -26.207239151000977, "global_step": 388540, "epoch": 4681} {"train_loss": -26.105802536010742, "global_step": 388541, "epoch": 4681} {"train_loss": -26.1530704498291, "global_step": 388542, "epoch": 4681} {"train_loss": -26.58100700378418, "global_step": 388543, "epoch": 4681} {"train_loss": -26.026758193969727, "global_step": 388544, "epoch": 4681} {"train_loss": -26.49896240234375, "global_step": 388545, "epoch": 4681} {"train_loss": -26.278797149658203, "global_step": 388546, "epoch": 4681} {"train_loss": -26.673978805541992, "global_step": 388547, "epoch": 4681} {"train_loss": -26.051496505737305, "global_step": 388548, "epoch": 4681} {"train_loss": -26.49074363708496, "global_step": 388549, "epoch": 4681} {"train_loss": -26.775421142578125, "global_step": 388550, "epoch": 4681} {"train_loss": -26.699987411499023, "global_step": 388551, "epoch": 4681} {"train_loss": -26.39423179626465, "global_step": 388552, "epoch": 4681} {"train_loss": -26.692413330078125, "global_step": 388553, "epoch": 4681} {"train_loss": -26.385122299194336, "global_step": 388554, "epoch": 4681} {"train_loss": -26.639225006103516, "global_step": 388555, "epoch": 4681} {"train_loss": -26.751022338867188, "global_step": 388556, "epoch": 4681} {"train_loss": -26.58138084411621, "global_step": 388557, "epoch": 4681} {"train_loss": -26.6502742767334, "global_step": 388558, "epoch": 4681} {"train_loss": -26.828088760375977, "global_step": 388559, "epoch": 4681} {"train_loss": -26.648269653320312, "global_step": 388560, "epoch": 4681} {"train_loss": -26.743391036987305, "global_step": 388561, "epoch": 4681} {"train_loss": -26.399442672729492, "global_step": 388562, "epoch": 4681} {"train_loss": -26.93300437927246, "global_step": 388563, "epoch": 4681} {"train_loss": -26.419103622436523, "global_step": 388564, "epoch": 4681} {"train_loss": -26.3950138092041, "global_step": 388565, "epoch": 4681} {"train_loss": -26.5964298248291, "global_step": 388566, "epoch": 4681} {"train_loss": -26.771764755249023, "global_step": 388567, "epoch": 4681} {"train_loss": -26.66306495666504, "global_step": 388568, "epoch": 4681} {"train_loss": -26.6154842376709, "global_step": 388569, "epoch": 4681} {"train_loss": -26.53675651550293, "global_step": 388570, "epoch": 4681} {"train_loss": -26.77716636657715, "global_step": 388571, "epoch": 4681} {"train_loss": -26.454252243041992, "global_step": 388572, "epoch": 4681} {"train_loss": -26.480234146118164, "global_step": 388573, "epoch": 4681} {"train_loss": -26.8651065826416, "global_step": 388574, "epoch": 4681} {"train_loss": -26.487091064453125, "global_step": 388575, "epoch": 4681} {"train_loss": -26.9451961517334, "global_step": 388576, "epoch": 4681} {"train_loss": -27.203046798706055, "global_step": 388577, "epoch": 4681} {"train_loss": -26.2843017578125, "global_step": 388578, "epoch": 4681} {"train_loss": -26.270404815673828, "global_step": 388579, "epoch": 4681} {"train_loss": -25.759342193603516, "global_step": 388580, "epoch": 4681} {"train_loss": -26.329694747924805, "global_step": 388581, "epoch": 4681} {"train_loss": -26.461843490600586, "global_step": 388582, "epoch": 4681} {"train_loss": -26.575712203979492, "global_step": 388583, "epoch": 4681} {"train_loss": -25.821765899658203, "global_step": 388584, "epoch": 4681} {"train_loss": -25.85009765625, "global_step": 388585, "epoch": 4681} {"train_loss": -25.782535552978516, "global_step": 388586, "epoch": 4681} {"train_loss": -26.17087173461914, "global_step": 388587, "epoch": 4681} {"train_loss": -26.244733810424805, "global_step": 388588, "epoch": 4681} {"train_loss": -26.11469841003418, "global_step": 388589, "epoch": 4681} {"train_loss": -26.32282066345215, "global_step": 388590, "epoch": 4681} {"train_loss": -26.374591827392578, "global_step": 388591, "epoch": 4681} {"train_loss": -26.069456100463867, "global_step": 388592, "epoch": 4681} {"train_loss": -26.136343002319336, "global_step": 388593, "epoch": 4681} {"train_loss": -26.351974487304688, "global_step": 388594, "epoch": 4681} {"train_loss": -26.49427604675293, "global_step": 388595, "epoch": 4681} {"train_loss": -26.62739372253418, "global_step": 388596, "epoch": 4681} {"train_loss": -26.52716064453125, "global_step": 388597, "epoch": 4681} {"train_loss": -26.24956703186035, "global_step": 388598, "epoch": 4681} {"train_loss": -26.407794952392578, "global_step": 388599, "epoch": 4681} {"train_loss": -25.96232032775879, "global_step": 388600, "epoch": 4681} {"train_loss": -26.11881446838379, "global_step": 388601, "epoch": 4681} {"train_loss": -26.577991485595703, "global_step": 388602, "epoch": 4681} {"train_loss": -26.258773803710938, "global_step": 388603, "epoch": 4681} {"train_loss": -26.666471481323242, "global_step": 388604, "epoch": 4681} {"train_loss": -26.370635273944902, "global_step": 388605, "epoch": 4681, "val_loss": 6508481.0} {"train_loss": -26.28285026550293, "global_step": 388606, "epoch": 4682} {"train_loss": -25.916967391967773, "global_step": 388607, "epoch": 4682} {"train_loss": -26.237075805664062, "global_step": 388608, "epoch": 4682} {"train_loss": -25.753217697143555, "global_step": 388609, "epoch": 4682} {"train_loss": -26.32472038269043, "global_step": 388610, "epoch": 4682} {"train_loss": -25.69012451171875, "global_step": 388611, "epoch": 4682} {"train_loss": -26.167856216430664, "global_step": 388612, "epoch": 4682} {"train_loss": -26.636417388916016, "global_step": 388613, "epoch": 4682} {"train_loss": -26.282323837280273, "global_step": 388614, "epoch": 4682} {"train_loss": -26.167028427124023, "global_step": 388615, "epoch": 4682} {"train_loss": -26.185583114624023, "global_step": 388616, "epoch": 4682} {"train_loss": -26.305349349975586, "global_step": 388617, "epoch": 4682} {"train_loss": -26.35088539123535, "global_step": 388618, "epoch": 4682} {"train_loss": -26.00095558166504, "global_step": 388619, "epoch": 4682} {"train_loss": -26.310277938842773, "global_step": 388620, "epoch": 4682} {"train_loss": -26.380691528320312, "global_step": 388621, "epoch": 4682} {"train_loss": -26.240741729736328, "global_step": 388622, "epoch": 4682} {"train_loss": -26.15345573425293, "global_step": 388623, "epoch": 4682} {"train_loss": -26.21479606628418, "global_step": 388624, "epoch": 4682} {"train_loss": -26.417205810546875, "global_step": 388625, "epoch": 4682} {"train_loss": -26.666120529174805, "global_step": 388626, "epoch": 4682} {"train_loss": -26.463830947875977, "global_step": 388627, "epoch": 4682} {"train_loss": -26.282535552978516, "global_step": 388628, "epoch": 4682} {"train_loss": -26.516637802124023, "global_step": 388629, "epoch": 4682} {"train_loss": -26.622465133666992, "global_step": 388630, "epoch": 4682} {"train_loss": -26.307971954345703, "global_step": 388631, "epoch": 4682} {"train_loss": -26.54054832458496, "global_step": 388632, "epoch": 4682} {"train_loss": -26.737897872924805, "global_step": 388633, "epoch": 4682} {"train_loss": -26.49785804748535, "global_step": 388634, "epoch": 4682} {"train_loss": -26.58587074279785, "global_step": 388635, "epoch": 4682} {"train_loss": -26.533838272094727, "global_step": 388636, "epoch": 4682} {"train_loss": -26.517053604125977, "global_step": 388637, "epoch": 4682} {"train_loss": -26.3974552154541, "global_step": 388638, "epoch": 4682} {"train_loss": -26.9813175201416, "global_step": 388639, "epoch": 4682} {"train_loss": -26.610309600830078, "global_step": 388640, "epoch": 4682} {"train_loss": -26.817829132080078, "global_step": 388641, "epoch": 4682} {"train_loss": -26.54497718811035, "global_step": 388642, "epoch": 4682} {"train_loss": -26.499408721923828, "global_step": 388643, "epoch": 4682} {"train_loss": -26.599878311157227, "global_step": 388644, "epoch": 4682} {"train_loss": -26.719507217407227, "global_step": 388645, "epoch": 4682} {"train_loss": -26.527368545532227, "global_step": 388646, "epoch": 4682} {"train_loss": -26.341140747070312, "global_step": 388647, "epoch": 4682} {"train_loss": -26.37190818786621, "global_step": 388648, "epoch": 4682} {"train_loss": -26.846887588500977, "global_step": 388649, "epoch": 4682} {"train_loss": -26.857709884643555, "global_step": 388650, "epoch": 4682} {"train_loss": -26.271528244018555, "global_step": 388651, "epoch": 4682} {"train_loss": -26.43670082092285, "global_step": 388652, "epoch": 4682} {"train_loss": -26.89934730529785, "global_step": 388653, "epoch": 4682} {"train_loss": -26.783620834350586, "global_step": 388654, "epoch": 4682} {"train_loss": -26.951757431030273, "global_step": 388655, "epoch": 4682} {"train_loss": -26.98067283630371, "global_step": 388656, "epoch": 4682} {"train_loss": -26.603439331054688, "global_step": 388657, "epoch": 4682} {"train_loss": -26.68861961364746, "global_step": 388658, "epoch": 4682} {"train_loss": -26.914661407470703, "global_step": 388659, "epoch": 4682} {"train_loss": -26.59620475769043, "global_step": 388660, "epoch": 4682} {"train_loss": -26.68166160583496, "global_step": 388661, "epoch": 4682} {"train_loss": -26.11073112487793, "global_step": 388662, "epoch": 4682} {"train_loss": -26.40634536743164, "global_step": 388663, "epoch": 4682} {"train_loss": -26.706151962280273, "global_step": 388664, "epoch": 4682} {"train_loss": -26.33609962463379, "global_step": 388665, "epoch": 4682} {"train_loss": -26.819074630737305, "global_step": 388666, "epoch": 4682} {"train_loss": -26.689279556274414, "global_step": 388667, "epoch": 4682} {"train_loss": -27.061582565307617, "global_step": 388668, "epoch": 4682} {"train_loss": -26.6833553314209, "global_step": 388669, "epoch": 4682} {"train_loss": -26.719989776611328, "global_step": 388670, "epoch": 4682} {"train_loss": -26.497303009033203, "global_step": 388671, "epoch": 4682} {"train_loss": -26.41878318786621, "global_step": 388672, "epoch": 4682} {"train_loss": -27.266143798828125, "global_step": 388673, "epoch": 4682} {"train_loss": -26.474706649780273, "global_step": 388674, "epoch": 4682} {"train_loss": -26.587997436523438, "global_step": 388675, "epoch": 4682} {"train_loss": -26.549041748046875, "global_step": 388676, "epoch": 4682} {"train_loss": -26.567785263061523, "global_step": 388677, "epoch": 4682} {"train_loss": -26.6136531829834, "global_step": 388678, "epoch": 4682} {"train_loss": -26.237079620361328, "global_step": 388679, "epoch": 4682} {"train_loss": -26.67389488220215, "global_step": 388680, "epoch": 4682} {"train_loss": -26.42095375061035, "global_step": 388681, "epoch": 4682} {"train_loss": -26.511520385742188, "global_step": 388682, "epoch": 4682} {"train_loss": -26.593860626220703, "global_step": 388683, "epoch": 4682} {"train_loss": -26.985910415649414, "global_step": 388684, "epoch": 4682} {"train_loss": -26.549060821533203, "global_step": 388685, "epoch": 4682} {"train_loss": -26.764835357666016, "global_step": 388686, "epoch": 4682} {"train_loss": -26.948841094970703, "global_step": 388687, "epoch": 4682} {"train_loss": -26.5170909927552, "global_step": 388688, "epoch": 4682, "val_loss": 6586049.5} {"train_loss": -24.96626091003418, "global_step": 388689, "epoch": 4683} {"train_loss": -24.2535457611084, "global_step": 388690, "epoch": 4683} {"train_loss": -24.179479598999023, "global_step": 388691, "epoch": 4683} {"train_loss": -24.822153091430664, "global_step": 388692, "epoch": 4683} {"train_loss": -24.68229103088379, "global_step": 388693, "epoch": 4683} {"train_loss": -25.6164493560791, "global_step": 388694, "epoch": 4683} {"train_loss": -24.881053924560547, "global_step": 388695, "epoch": 4683} {"train_loss": -25.942956924438477, "global_step": 388696, "epoch": 4683} {"train_loss": -25.059778213500977, "global_step": 388697, "epoch": 4683} {"train_loss": -24.45347023010254, "global_step": 388698, "epoch": 4683} {"train_loss": -26.11366081237793, "global_step": 388699, "epoch": 4683} {"train_loss": -25.154712677001953, "global_step": 388700, "epoch": 4683} {"train_loss": -25.618427276611328, "global_step": 388701, "epoch": 4683} {"train_loss": -25.898324966430664, "global_step": 388702, "epoch": 4683} {"train_loss": -25.250686645507812, "global_step": 388703, "epoch": 4683} {"train_loss": -25.692035675048828, "global_step": 388704, "epoch": 4683} {"train_loss": -25.447803497314453, "global_step": 388705, "epoch": 4683} {"train_loss": -25.648534774780273, "global_step": 388706, "epoch": 4683} {"train_loss": -25.680999755859375, "global_step": 388707, "epoch": 4683} {"train_loss": -25.653583526611328, "global_step": 388708, "epoch": 4683} {"train_loss": -25.815860748291016, "global_step": 388709, "epoch": 4683} {"train_loss": -26.233366012573242, "global_step": 388710, "epoch": 4683} {"train_loss": -25.825361251831055, "global_step": 388711, "epoch": 4683} {"train_loss": -25.925806045532227, "global_step": 388712, "epoch": 4683} {"train_loss": -26.24287223815918, "global_step": 388713, "epoch": 4683} {"train_loss": -26.087926864624023, "global_step": 388714, "epoch": 4683} {"train_loss": -26.073877334594727, "global_step": 388715, "epoch": 4683} {"train_loss": -26.05824851989746, "global_step": 388716, "epoch": 4683} {"train_loss": -26.113025665283203, "global_step": 388717, "epoch": 4683} {"train_loss": -26.438262939453125, "global_step": 388718, "epoch": 4683} {"train_loss": -26.36406898498535, "global_step": 388719, "epoch": 4683} {"train_loss": -26.534452438354492, "global_step": 388720, "epoch": 4683} {"train_loss": -26.4356746673584, "global_step": 388721, "epoch": 4683} {"train_loss": -26.4054012298584, "global_step": 388722, "epoch": 4683} {"train_loss": -25.89544677734375, "global_step": 388723, "epoch": 4683} {"train_loss": -26.278717041015625, "global_step": 388724, "epoch": 4683} {"train_loss": -26.209884643554688, "global_step": 388725, "epoch": 4683} {"train_loss": -26.48052406311035, "global_step": 388726, "epoch": 4683} {"train_loss": -26.625391006469727, "global_step": 388727, "epoch": 4683} {"train_loss": -26.514209747314453, "global_step": 388728, "epoch": 4683} {"train_loss": -26.58203125, "global_step": 388729, "epoch": 4683} {"train_loss": -26.39011573791504, "global_step": 388730, "epoch": 4683} {"train_loss": -26.792829513549805, "global_step": 388731, "epoch": 4683} {"train_loss": -26.6286678314209, "global_step": 388732, "epoch": 4683} {"train_loss": -26.748945236206055, "global_step": 388733, "epoch": 4683} {"train_loss": -26.344202041625977, "global_step": 388734, "epoch": 4683} {"train_loss": -26.428476333618164, "global_step": 388735, "epoch": 4683} {"train_loss": -27.075132369995117, "global_step": 388736, "epoch": 4683} {"train_loss": -26.6320858001709, "global_step": 388737, "epoch": 4683} {"train_loss": -26.486129760742188, "global_step": 388738, "epoch": 4683} {"train_loss": -26.498823165893555, "global_step": 388739, "epoch": 4683} {"train_loss": -27.026159286499023, "global_step": 388740, "epoch": 4683} {"train_loss": -26.456989288330078, "global_step": 388741, "epoch": 4683} {"train_loss": -26.3907413482666, "global_step": 388742, "epoch": 4683} {"train_loss": -26.579660415649414, "global_step": 388743, "epoch": 4683} {"train_loss": -26.65348243713379, "global_step": 388744, "epoch": 4683} {"train_loss": -26.22003173828125, "global_step": 388745, "epoch": 4683} {"train_loss": -26.558252334594727, "global_step": 388746, "epoch": 4683} {"train_loss": -26.091114044189453, "global_step": 388747, "epoch": 4683} {"train_loss": -26.100595474243164, "global_step": 388748, "epoch": 4683} {"train_loss": -26.095993041992188, "global_step": 388749, "epoch": 4683} {"train_loss": -26.446456909179688, "global_step": 388750, "epoch": 4683} {"train_loss": -26.61163902282715, "global_step": 388751, "epoch": 4683} {"train_loss": -26.313873291015625, "global_step": 388752, "epoch": 4683} {"train_loss": -26.416257858276367, "global_step": 388753, "epoch": 4683} {"train_loss": -26.575719833374023, "global_step": 388754, "epoch": 4683} {"train_loss": -26.362207412719727, "global_step": 388755, "epoch": 4683} {"train_loss": -26.580036163330078, "global_step": 388756, "epoch": 4683} {"train_loss": -26.394155502319336, "global_step": 388757, "epoch": 4683} {"train_loss": -26.696613311767578, "global_step": 388758, "epoch": 4683} {"train_loss": -26.2288875579834, "global_step": 388759, "epoch": 4683} {"train_loss": -26.39214515686035, "global_step": 388760, "epoch": 4683} {"train_loss": -26.53497314453125, "global_step": 388761, "epoch": 4683} {"train_loss": -26.364948272705078, "global_step": 388762, "epoch": 4683} {"train_loss": -26.449865341186523, "global_step": 388763, "epoch": 4683} {"train_loss": -26.540979385375977, "global_step": 388764, "epoch": 4683} {"train_loss": -26.514774322509766, "global_step": 388765, "epoch": 4683} {"train_loss": -26.48538589477539, "global_step": 388766, "epoch": 4683} {"train_loss": -26.144458770751953, "global_step": 388767, "epoch": 4683} {"train_loss": -26.28534507751465, "global_step": 388768, "epoch": 4683} {"train_loss": -26.738210678100586, "global_step": 388769, "epoch": 4683} {"train_loss": -26.831745147705078, "global_step": 388770, "epoch": 4683} {"train_loss": -26.13464178521949, "global_step": 388771, "epoch": 4683, "val_loss": 6495864.0} {"train_loss": -25.953460693359375, "global_step": 388772, "epoch": 4684} {"train_loss": -26.04450035095215, "global_step": 388773, "epoch": 4684} {"train_loss": -25.740253448486328, "global_step": 388774, "epoch": 4684} {"train_loss": -26.227218627929688, "global_step": 388775, "epoch": 4684} {"train_loss": -26.056060791015625, "global_step": 388776, "epoch": 4684} {"train_loss": -26.178075790405273, "global_step": 388777, "epoch": 4684} {"train_loss": -26.60654640197754, "global_step": 388778, "epoch": 4684} {"train_loss": -25.833276748657227, "global_step": 388779, "epoch": 4684} {"train_loss": -26.183740615844727, "global_step": 388780, "epoch": 4684} {"train_loss": -26.22553825378418, "global_step": 388781, "epoch": 4684} {"train_loss": -26.32769775390625, "global_step": 388782, "epoch": 4684} {"train_loss": -26.32673454284668, "global_step": 388783, "epoch": 4684} {"train_loss": -26.411518096923828, "global_step": 388784, "epoch": 4684} {"train_loss": -26.136503219604492, "global_step": 388785, "epoch": 4684} {"train_loss": -26.26077651977539, "global_step": 388786, "epoch": 4684} {"train_loss": -26.239364624023438, "global_step": 388787, "epoch": 4684} {"train_loss": -26.400842666625977, "global_step": 388788, "epoch": 4684} {"train_loss": -26.23182487487793, "global_step": 388789, "epoch": 4684} {"train_loss": -26.42236328125, "global_step": 388790, "epoch": 4684} {"train_loss": -26.797962188720703, "global_step": 388791, "epoch": 4684} {"train_loss": -26.666946411132812, "global_step": 388792, "epoch": 4684} {"train_loss": -26.559179306030273, "global_step": 388793, "epoch": 4684} {"train_loss": -26.510391235351562, "global_step": 388794, "epoch": 4684} {"train_loss": -26.29193115234375, "global_step": 388795, "epoch": 4684} {"train_loss": -26.179672241210938, "global_step": 388796, "epoch": 4684} {"train_loss": -26.413610458374023, "global_step": 388797, "epoch": 4684} {"train_loss": -26.491498947143555, "global_step": 388798, "epoch": 4684} {"train_loss": -26.57706069946289, "global_step": 388799, "epoch": 4684} {"train_loss": -26.635303497314453, "global_step": 388800, "epoch": 4684} {"train_loss": -26.474225997924805, "global_step": 388801, "epoch": 4684} {"train_loss": -26.539173126220703, "global_step": 388802, "epoch": 4684} {"train_loss": -26.44855308532715, "global_step": 388803, "epoch": 4684} {"train_loss": -26.489343643188477, "global_step": 388804, "epoch": 4684} {"train_loss": -26.683889389038086, "global_step": 388805, "epoch": 4684} {"train_loss": -26.34111976623535, "global_step": 388806, "epoch": 4684} {"train_loss": -26.840702056884766, "global_step": 388807, "epoch": 4684} {"train_loss": -26.804824829101562, "global_step": 388808, "epoch": 4684} {"train_loss": -26.21213150024414, "global_step": 388809, "epoch": 4684} {"train_loss": -26.545618057250977, "global_step": 388810, "epoch": 4684} {"train_loss": -26.4197998046875, "global_step": 388811, "epoch": 4684} {"train_loss": -26.502201080322266, "global_step": 388812, "epoch": 4684} {"train_loss": -26.716161727905273, "global_step": 388813, "epoch": 4684} {"train_loss": -26.5620174407959, "global_step": 388814, "epoch": 4684} {"train_loss": -27.015966415405273, "global_step": 388815, "epoch": 4684} {"train_loss": -26.591999053955078, "global_step": 388816, "epoch": 4684} {"train_loss": -26.5693416595459, "global_step": 388817, "epoch": 4684} {"train_loss": -26.814477920532227, "global_step": 388818, "epoch": 4684} {"train_loss": -26.644672393798828, "global_step": 388819, "epoch": 4684} {"train_loss": -26.434728622436523, "global_step": 388820, "epoch": 4684} {"train_loss": -26.664289474487305, "global_step": 388821, "epoch": 4684} {"train_loss": -26.80303382873535, "global_step": 388822, "epoch": 4684} {"train_loss": -26.984954833984375, "global_step": 388823, "epoch": 4684} {"train_loss": -26.89155387878418, "global_step": 388824, "epoch": 4684} {"train_loss": -26.754552841186523, "global_step": 388825, "epoch": 4684} {"train_loss": -26.678430557250977, "global_step": 388826, "epoch": 4684} {"train_loss": -26.564645767211914, "global_step": 388827, "epoch": 4684} {"train_loss": -26.36905288696289, "global_step": 388828, "epoch": 4684} {"train_loss": -26.521284103393555, "global_step": 388829, "epoch": 4684} {"train_loss": -26.52081298828125, "global_step": 388830, "epoch": 4684} {"train_loss": -26.29774284362793, "global_step": 388831, "epoch": 4684} {"train_loss": -26.363250732421875, "global_step": 388832, "epoch": 4684} {"train_loss": -26.37294578552246, "global_step": 388833, "epoch": 4684} {"train_loss": -26.370960235595703, "global_step": 388834, "epoch": 4684} {"train_loss": -26.623117446899414, "global_step": 388835, "epoch": 4684} {"train_loss": -26.53223991394043, "global_step": 388836, "epoch": 4684} {"train_loss": -26.38260841369629, "global_step": 388837, "epoch": 4684} {"train_loss": -26.50013542175293, "global_step": 388838, "epoch": 4684} {"train_loss": -26.78435707092285, "global_step": 388839, "epoch": 4684} {"train_loss": -26.738630294799805, "global_step": 388840, "epoch": 4684} {"train_loss": -26.49457359313965, "global_step": 388841, "epoch": 4684} {"train_loss": -26.613744735717773, "global_step": 388842, "epoch": 4684} {"train_loss": -26.9824275970459, "global_step": 388843, "epoch": 4684} {"train_loss": -26.530960083007812, "global_step": 388844, "epoch": 4684} {"train_loss": -26.78205680847168, "global_step": 388845, "epoch": 4684} {"train_loss": -26.871850967407227, "global_step": 388846, "epoch": 4684} {"train_loss": -26.681787490844727, "global_step": 388847, "epoch": 4684} {"train_loss": -26.55145835876465, "global_step": 388848, "epoch": 4684} {"train_loss": -26.978961944580078, "global_step": 388849, "epoch": 4684} {"train_loss": -27.103662490844727, "global_step": 388850, "epoch": 4684} {"train_loss": -26.60761070251465, "global_step": 388851, "epoch": 4684} {"train_loss": -26.21709632873535, "global_step": 388852, "epoch": 4684} {"train_loss": -26.764429092407227, "global_step": 388853, "epoch": 4684} {"train_loss": -26.5197398633842, "global_step": 388854, "epoch": 4684, "val_loss": 6614687.0} {"train_loss": -26.507177352905273, "global_step": 388855, "epoch": 4685} {"train_loss": -26.474084854125977, "global_step": 388856, "epoch": 4685} {"train_loss": -25.723133087158203, "global_step": 388857, "epoch": 4685} {"train_loss": -25.825300216674805, "global_step": 388858, "epoch": 4685} {"train_loss": -25.722763061523438, "global_step": 388859, "epoch": 4685} {"train_loss": -26.43024253845215, "global_step": 388860, "epoch": 4685} {"train_loss": -26.147138595581055, "global_step": 388861, "epoch": 4685} {"train_loss": -26.06476402282715, "global_step": 388862, "epoch": 4685} {"train_loss": -26.026031494140625, "global_step": 388863, "epoch": 4685} {"train_loss": -26.213150024414062, "global_step": 388864, "epoch": 4685} {"train_loss": -26.469350814819336, "global_step": 388865, "epoch": 4685} {"train_loss": -26.385421752929688, "global_step": 388866, "epoch": 4685} {"train_loss": -26.517194747924805, "global_step": 388867, "epoch": 4685} {"train_loss": -26.268604278564453, "global_step": 388868, "epoch": 4685} {"train_loss": -26.393171310424805, "global_step": 388869, "epoch": 4685} {"train_loss": -26.465707778930664, "global_step": 388870, "epoch": 4685} {"train_loss": -26.5694637298584, "global_step": 388871, "epoch": 4685} {"train_loss": -26.74374771118164, "global_step": 388872, "epoch": 4685} {"train_loss": -26.095731735229492, "global_step": 388873, "epoch": 4685} {"train_loss": -26.230981826782227, "global_step": 388874, "epoch": 4685} {"train_loss": -26.282943725585938, "global_step": 388875, "epoch": 4685} {"train_loss": -26.306110382080078, "global_step": 388876, "epoch": 4685} {"train_loss": -26.745996475219727, "global_step": 388877, "epoch": 4685} {"train_loss": -26.845178604125977, "global_step": 388878, "epoch": 4685} {"train_loss": -26.672260284423828, "global_step": 388879, "epoch": 4685} {"train_loss": -26.598520278930664, "global_step": 388880, "epoch": 4685} {"train_loss": -26.462976455688477, "global_step": 388881, "epoch": 4685} {"train_loss": -26.417163848876953, "global_step": 388882, "epoch": 4685} {"train_loss": -26.21856689453125, "global_step": 388883, "epoch": 4685} {"train_loss": -26.383237838745117, "global_step": 388884, "epoch": 4685} {"train_loss": -25.922229766845703, "global_step": 388885, "epoch": 4685} {"train_loss": -26.116392135620117, "global_step": 388886, "epoch": 4685} {"train_loss": -26.338850021362305, "global_step": 388887, "epoch": 4685} {"train_loss": -26.713336944580078, "global_step": 388888, "epoch": 4685} {"train_loss": -26.530614852905273, "global_step": 388889, "epoch": 4685} {"train_loss": -26.440229415893555, "global_step": 388890, "epoch": 4685} {"train_loss": -26.4299259185791, "global_step": 388891, "epoch": 4685} {"train_loss": -26.73023796081543, "global_step": 388892, "epoch": 4685} {"train_loss": -26.739709854125977, "global_step": 388893, "epoch": 4685} {"train_loss": -26.442615509033203, "global_step": 388894, "epoch": 4685} {"train_loss": -26.64751625061035, "global_step": 388895, "epoch": 4685} {"train_loss": -26.597986221313477, "global_step": 388896, "epoch": 4685} {"train_loss": -26.8337345123291, "global_step": 388897, "epoch": 4685} {"train_loss": -26.447010040283203, "global_step": 388898, "epoch": 4685} {"train_loss": -26.663379669189453, "global_step": 388899, "epoch": 4685} {"train_loss": -26.585294723510742, "global_step": 388900, "epoch": 4685} {"train_loss": -26.613428115844727, "global_step": 388901, "epoch": 4685} {"train_loss": -26.745100021362305, "global_step": 388902, "epoch": 4685} {"train_loss": -26.396915435791016, "global_step": 388903, "epoch": 4685} {"train_loss": -26.609277725219727, "global_step": 388904, "epoch": 4685} {"train_loss": -26.67568016052246, "global_step": 388905, "epoch": 4685} {"train_loss": -26.80965232849121, "global_step": 388906, "epoch": 4685} {"train_loss": -26.882810592651367, "global_step": 388907, "epoch": 4685} {"train_loss": -26.960248947143555, "global_step": 388908, "epoch": 4685} {"train_loss": -26.728178024291992, "global_step": 388909, "epoch": 4685} {"train_loss": -26.517593383789062, "global_step": 388910, "epoch": 4685} {"train_loss": -26.647918701171875, "global_step": 388911, "epoch": 4685} {"train_loss": -26.781513214111328, "global_step": 388912, "epoch": 4685} {"train_loss": -26.468786239624023, "global_step": 388913, "epoch": 4685} {"train_loss": -26.3891658782959, "global_step": 388914, "epoch": 4685} {"train_loss": -26.89592933654785, "global_step": 388915, "epoch": 4685} {"train_loss": -26.60700798034668, "global_step": 388916, "epoch": 4685} {"train_loss": -26.868566513061523, "global_step": 388917, "epoch": 4685} {"train_loss": -27.04908561706543, "global_step": 388918, "epoch": 4685} {"train_loss": -26.666778564453125, "global_step": 388919, "epoch": 4685} {"train_loss": -26.4948787689209, "global_step": 388920, "epoch": 4685} {"train_loss": -26.49906349182129, "global_step": 388921, "epoch": 4685} {"train_loss": -26.391464233398438, "global_step": 388922, "epoch": 4685} {"train_loss": -25.838470458984375, "global_step": 388923, "epoch": 4685} {"train_loss": -26.05364418029785, "global_step": 388924, "epoch": 4685} {"train_loss": -26.589628219604492, "global_step": 388925, "epoch": 4685} {"train_loss": -26.604736328125, "global_step": 388926, "epoch": 4685} {"train_loss": -26.335159301757812, "global_step": 388927, "epoch": 4685} {"train_loss": -26.5521240234375, "global_step": 388928, "epoch": 4685} {"train_loss": -26.37471580505371, "global_step": 388929, "epoch": 4685} {"train_loss": -25.743621826171875, "global_step": 388930, "epoch": 4685} {"train_loss": -25.714462280273438, "global_step": 388931, "epoch": 4685} {"train_loss": -25.50594139099121, "global_step": 388932, "epoch": 4685} {"train_loss": -26.575637817382812, "global_step": 388933, "epoch": 4685} {"train_loss": -26.012378692626953, "global_step": 388934, "epoch": 4685} {"train_loss": -25.55621337890625, "global_step": 388935, "epoch": 4685} {"train_loss": -26.068984985351562, "global_step": 388936, "epoch": 4685} {"train_loss": -26.420713424682617, "global_step": 388937, "epoch": 4685, "val_loss": 6635185.0} {"train_loss": -24.984189987182617, "global_step": 388938, "epoch": 4686} {"train_loss": -25.351282119750977, "global_step": 388939, "epoch": 4686} {"train_loss": -25.153234481811523, "global_step": 388940, "epoch": 4686} {"train_loss": -25.979297637939453, "global_step": 388941, "epoch": 4686} {"train_loss": -25.207685470581055, "global_step": 388942, "epoch": 4686} {"train_loss": -25.353952407836914, "global_step": 388943, "epoch": 4686} {"train_loss": -25.913715362548828, "global_step": 388944, "epoch": 4686} {"train_loss": -25.696969985961914, "global_step": 388945, "epoch": 4686} {"train_loss": -25.976953506469727, "global_step": 388946, "epoch": 4686} {"train_loss": -25.78888511657715, "global_step": 388947, "epoch": 4686} {"train_loss": -26.11212730407715, "global_step": 388948, "epoch": 4686} {"train_loss": -25.870136260986328, "global_step": 388949, "epoch": 4686} {"train_loss": -26.22124671936035, "global_step": 388950, "epoch": 4686} {"train_loss": -25.598684310913086, "global_step": 388951, "epoch": 4686} {"train_loss": -26.450366973876953, "global_step": 388952, "epoch": 4686} {"train_loss": -26.236303329467773, "global_step": 388953, "epoch": 4686} {"train_loss": -26.2313175201416, "global_step": 388954, "epoch": 4686} {"train_loss": -26.045703887939453, "global_step": 388955, "epoch": 4686} {"train_loss": -26.299062728881836, "global_step": 388956, "epoch": 4686} {"train_loss": -26.121671676635742, "global_step": 388957, "epoch": 4686} {"train_loss": -26.23813819885254, "global_step": 388958, "epoch": 4686} {"train_loss": -26.280441284179688, "global_step": 388959, "epoch": 4686} {"train_loss": -26.012847900390625, "global_step": 388960, "epoch": 4686} {"train_loss": -26.342077255249023, "global_step": 388961, "epoch": 4686} {"train_loss": -26.51643943786621, "global_step": 388962, "epoch": 4686} {"train_loss": -26.181516647338867, "global_step": 388963, "epoch": 4686} {"train_loss": -25.808197021484375, "global_step": 388964, "epoch": 4686} {"train_loss": -26.72077751159668, "global_step": 388965, "epoch": 4686} {"train_loss": -26.27504539489746, "global_step": 388966, "epoch": 4686} {"train_loss": -26.68775749206543, "global_step": 388967, "epoch": 4686} {"train_loss": -26.205596923828125, "global_step": 388968, "epoch": 4686} {"train_loss": -26.366363525390625, "global_step": 388969, "epoch": 4686} {"train_loss": -26.992874145507812, "global_step": 388970, "epoch": 4686} {"train_loss": -26.361438751220703, "global_step": 388971, "epoch": 4686} {"train_loss": -26.536334991455078, "global_step": 388972, "epoch": 4686} {"train_loss": -26.650482177734375, "global_step": 388973, "epoch": 4686} {"train_loss": -26.460248947143555, "global_step": 388974, "epoch": 4686} {"train_loss": -26.751962661743164, "global_step": 388975, "epoch": 4686} {"train_loss": -26.44795799255371, "global_step": 388976, "epoch": 4686} {"train_loss": -26.896289825439453, "global_step": 388977, "epoch": 4686} {"train_loss": -26.803125381469727, "global_step": 388978, "epoch": 4686} {"train_loss": -26.788171768188477, "global_step": 388979, "epoch": 4686} {"train_loss": -26.609521865844727, "global_step": 388980, "epoch": 4686} {"train_loss": -26.78036880493164, "global_step": 388981, "epoch": 4686} {"train_loss": -26.74212646484375, "global_step": 388982, "epoch": 4686} {"train_loss": -26.550283432006836, "global_step": 388983, "epoch": 4686} {"train_loss": -26.615386962890625, "global_step": 388984, "epoch": 4686} {"train_loss": -26.525556564331055, "global_step": 388985, "epoch": 4686} {"train_loss": -26.739160537719727, "global_step": 388986, "epoch": 4686} {"train_loss": -26.602081298828125, "global_step": 388987, "epoch": 4686} {"train_loss": -26.941131591796875, "global_step": 388988, "epoch": 4686} {"train_loss": -26.3964900970459, "global_step": 388989, "epoch": 4686} {"train_loss": -26.769880294799805, "global_step": 388990, "epoch": 4686} {"train_loss": -26.635955810546875, "global_step": 388991, "epoch": 4686} {"train_loss": -26.31269645690918, "global_step": 388992, "epoch": 4686} {"train_loss": -26.2451229095459, "global_step": 388993, "epoch": 4686} {"train_loss": -26.197174072265625, "global_step": 388994, "epoch": 4686} {"train_loss": -26.451175689697266, "global_step": 388995, "epoch": 4686} {"train_loss": -26.35519790649414, "global_step": 388996, "epoch": 4686} {"train_loss": -26.536619186401367, "global_step": 388997, "epoch": 4686} {"train_loss": -26.610029220581055, "global_step": 388998, "epoch": 4686} {"train_loss": -26.512115478515625, "global_step": 388999, "epoch": 4686} {"train_loss": -26.44325065612793, "global_step": 389000, "epoch": 4686} {"train_loss": -26.657297134399414, "global_step": 389001, "epoch": 4686} {"train_loss": -26.45244789123535, "global_step": 389002, "epoch": 4686} {"train_loss": -26.49836540222168, "global_step": 389003, "epoch": 4686} {"train_loss": -25.74886131286621, "global_step": 389004, "epoch": 4686} {"train_loss": -26.049062728881836, "global_step": 389005, "epoch": 4686} {"train_loss": -26.48505210876465, "global_step": 389006, "epoch": 4686} {"train_loss": -26.543441772460938, "global_step": 389007, "epoch": 4686} {"train_loss": -26.521574020385742, "global_step": 389008, "epoch": 4686} {"train_loss": -26.77247428894043, "global_step": 389009, "epoch": 4686} {"train_loss": -26.158639907836914, "global_step": 389010, "epoch": 4686} {"train_loss": -26.50970458984375, "global_step": 389011, "epoch": 4686} {"train_loss": -26.269092559814453, "global_step": 389012, "epoch": 4686} {"train_loss": -26.497119903564453, "global_step": 389013, "epoch": 4686} {"train_loss": -26.374555587768555, "global_step": 389014, "epoch": 4686} {"train_loss": -26.217153549194336, "global_step": 389015, "epoch": 4686} {"train_loss": -26.879871368408203, "global_step": 389016, "epoch": 4686} {"train_loss": -26.413745880126953, "global_step": 389017, "epoch": 4686} {"train_loss": -26.834426879882812, "global_step": 389018, "epoch": 4686} {"train_loss": -26.5593318939209, "global_step": 389019, "epoch": 4686} {"train_loss": -26.312834682234797, "global_step": 389020, "epoch": 4686, "val_loss": 6478016.5} {"train_loss": -25.788068771362305, "global_step": 389021, "epoch": 4687} {"train_loss": -26.60696792602539, "global_step": 389022, "epoch": 4687} {"train_loss": -25.94266128540039, "global_step": 389023, "epoch": 4687} {"train_loss": -26.256977081298828, "global_step": 389024, "epoch": 4687} {"train_loss": -26.033935546875, "global_step": 389025, "epoch": 4687} {"train_loss": -25.571569442749023, "global_step": 389026, "epoch": 4687} {"train_loss": -26.49720573425293, "global_step": 389027, "epoch": 4687} {"train_loss": -25.947647094726562, "global_step": 389028, "epoch": 4687} {"train_loss": -26.592748641967773, "global_step": 389029, "epoch": 4687} {"train_loss": -26.171842575073242, "global_step": 389030, "epoch": 4687} {"train_loss": -26.32624626159668, "global_step": 389031, "epoch": 4687} {"train_loss": -25.806598663330078, "global_step": 389032, "epoch": 4687} {"train_loss": -25.942102432250977, "global_step": 389033, "epoch": 4687} {"train_loss": -26.354190826416016, "global_step": 389034, "epoch": 4687} {"train_loss": -26.06679344177246, "global_step": 389035, "epoch": 4687} {"train_loss": -26.429401397705078, "global_step": 389036, "epoch": 4687} {"train_loss": -26.024921417236328, "global_step": 389037, "epoch": 4687} {"train_loss": -26.37554359436035, "global_step": 389038, "epoch": 4687} {"train_loss": -26.35077476501465, "global_step": 389039, "epoch": 4687} {"train_loss": -26.44813346862793, "global_step": 389040, "epoch": 4687} {"train_loss": -26.673181533813477, "global_step": 389041, "epoch": 4687} {"train_loss": -26.24281120300293, "global_step": 389042, "epoch": 4687} {"train_loss": -26.757522583007812, "global_step": 389043, "epoch": 4687} {"train_loss": -26.114301681518555, "global_step": 389044, "epoch": 4687} {"train_loss": -26.306304931640625, "global_step": 389045, "epoch": 4687} {"train_loss": -26.248395919799805, "global_step": 389046, "epoch": 4687} {"train_loss": -27.091541290283203, "global_step": 389047, "epoch": 4687} {"train_loss": -26.403583526611328, "global_step": 389048, "epoch": 4687} {"train_loss": -26.286588668823242, "global_step": 389049, "epoch": 4687} {"train_loss": -26.291547775268555, "global_step": 389050, "epoch": 4687} {"train_loss": -26.528324127197266, "global_step": 389051, "epoch": 4687} {"train_loss": -26.371063232421875, "global_step": 389052, "epoch": 4687} {"train_loss": -26.509260177612305, "global_step": 389053, "epoch": 4687} {"train_loss": -26.57569694519043, "global_step": 389054, "epoch": 4687} {"train_loss": -26.579065322875977, "global_step": 389055, "epoch": 4687} {"train_loss": -26.693342208862305, "global_step": 389056, "epoch": 4687} {"train_loss": -26.2356014251709, "global_step": 389057, "epoch": 4687} {"train_loss": -26.686124801635742, "global_step": 389058, "epoch": 4687} {"train_loss": -26.545928955078125, "global_step": 389059, "epoch": 4687} {"train_loss": -26.75335693359375, "global_step": 389060, "epoch": 4687} {"train_loss": -26.4670467376709, "global_step": 389061, "epoch": 4687} {"train_loss": -26.401968002319336, "global_step": 389062, "epoch": 4687} {"train_loss": -26.570249557495117, "global_step": 389063, "epoch": 4687} {"train_loss": -26.6535587310791, "global_step": 389064, "epoch": 4687} {"train_loss": -26.672712326049805, "global_step": 389065, "epoch": 4687} {"train_loss": -26.76848793029785, "global_step": 389066, "epoch": 4687} {"train_loss": -26.716922760009766, "global_step": 389067, "epoch": 4687} {"train_loss": -26.556838989257812, "global_step": 389068, "epoch": 4687} {"train_loss": -26.737295150756836, "global_step": 389069, "epoch": 4687} {"train_loss": -26.4349365234375, "global_step": 389070, "epoch": 4687} {"train_loss": -26.65528678894043, "global_step": 389071, "epoch": 4687} {"train_loss": -26.091657638549805, "global_step": 389072, "epoch": 4687} {"train_loss": -26.533588409423828, "global_step": 389073, "epoch": 4687} {"train_loss": -26.727148056030273, "global_step": 389074, "epoch": 4687} {"train_loss": -26.55539894104004, "global_step": 389075, "epoch": 4687} {"train_loss": -26.54461097717285, "global_step": 389076, "epoch": 4687} {"train_loss": -25.92058753967285, "global_step": 389077, "epoch": 4687} {"train_loss": -25.923933029174805, "global_step": 389078, "epoch": 4687} {"train_loss": -25.091026306152344, "global_step": 389079, "epoch": 4687} {"train_loss": -25.32466697692871, "global_step": 389080, "epoch": 4687} {"train_loss": -26.37604331970215, "global_step": 389081, "epoch": 4687} {"train_loss": -25.613300323486328, "global_step": 389082, "epoch": 4687} {"train_loss": -26.25497817993164, "global_step": 389083, "epoch": 4687} {"train_loss": -25.545408248901367, "global_step": 389084, "epoch": 4687} {"train_loss": -26.543615341186523, "global_step": 389085, "epoch": 4687} {"train_loss": -25.821142196655273, "global_step": 389086, "epoch": 4687} {"train_loss": -26.17156982421875, "global_step": 389087, "epoch": 4687} {"train_loss": -26.052047729492188, "global_step": 389088, "epoch": 4687} {"train_loss": -26.115890502929688, "global_step": 389089, "epoch": 4687} {"train_loss": -25.99165153503418, "global_step": 389090, "epoch": 4687} {"train_loss": -26.33009147644043, "global_step": 389091, "epoch": 4687} {"train_loss": -26.53020668029785, "global_step": 389092, "epoch": 4687} {"train_loss": -26.34466552734375, "global_step": 389093, "epoch": 4687} {"train_loss": -26.1623477935791, "global_step": 389094, "epoch": 4687} {"train_loss": -26.384876251220703, "global_step": 389095, "epoch": 4687} {"train_loss": -26.264789581298828, "global_step": 389096, "epoch": 4687} {"train_loss": -26.664541244506836, "global_step": 389097, "epoch": 4687} {"train_loss": -26.218097686767578, "global_step": 389098, "epoch": 4687} {"train_loss": -26.499109268188477, "global_step": 389099, "epoch": 4687} {"train_loss": -26.735000610351562, "global_step": 389100, "epoch": 4687} {"train_loss": -26.42091178894043, "global_step": 389101, "epoch": 4687} {"train_loss": -26.64546012878418, "global_step": 389102, "epoch": 4687} {"train_loss": -26.31947312872094, "global_step": 389103, "epoch": 4687, "val_loss": 6547424.5} {"train_loss": -25.920080184936523, "global_step": 389104, "epoch": 4688} {"train_loss": -24.470083236694336, "global_step": 389105, "epoch": 4688} {"train_loss": -24.64620590209961, "global_step": 389106, "epoch": 4688} {"train_loss": -25.50592803955078, "global_step": 389107, "epoch": 4688} {"train_loss": -25.642410278320312, "global_step": 389108, "epoch": 4688} {"train_loss": -26.245641708374023, "global_step": 389109, "epoch": 4688} {"train_loss": -25.971023559570312, "global_step": 389110, "epoch": 4688} {"train_loss": -26.301803588867188, "global_step": 389111, "epoch": 4688} {"train_loss": -25.85023307800293, "global_step": 389112, "epoch": 4688} {"train_loss": -26.568540573120117, "global_step": 389113, "epoch": 4688} {"train_loss": -25.689233779907227, "global_step": 389114, "epoch": 4688} {"train_loss": -26.467254638671875, "global_step": 389115, "epoch": 4688} {"train_loss": -26.060266494750977, "global_step": 389116, "epoch": 4688} {"train_loss": -26.161014556884766, "global_step": 389117, "epoch": 4688} {"train_loss": -26.077077865600586, "global_step": 389118, "epoch": 4688} {"train_loss": -26.481931686401367, "global_step": 389119, "epoch": 4688} {"train_loss": -26.084381103515625, "global_step": 389120, "epoch": 4688} {"train_loss": -26.32411003112793, "global_step": 389121, "epoch": 4688} {"train_loss": -26.19992446899414, "global_step": 389122, "epoch": 4688} {"train_loss": -26.373083114624023, "global_step": 389123, "epoch": 4688} {"train_loss": -26.30291175842285, "global_step": 389124, "epoch": 4688} {"train_loss": -26.122116088867188, "global_step": 389125, "epoch": 4688} {"train_loss": -26.456457138061523, "global_step": 389126, "epoch": 4688} {"train_loss": -26.3757381439209, "global_step": 389127, "epoch": 4688} {"train_loss": -26.65801429748535, "global_step": 389128, "epoch": 4688} {"train_loss": -26.30901527404785, "global_step": 389129, "epoch": 4688} {"train_loss": -26.285022735595703, "global_step": 389130, "epoch": 4688} {"train_loss": -26.504379272460938, "global_step": 389131, "epoch": 4688} {"train_loss": -26.25214958190918, "global_step": 389132, "epoch": 4688} {"train_loss": -26.59158706665039, "global_step": 389133, "epoch": 4688} {"train_loss": -26.558399200439453, "global_step": 389134, "epoch": 4688} {"train_loss": -26.56943702697754, "global_step": 389135, "epoch": 4688} {"train_loss": -26.18265151977539, "global_step": 389136, "epoch": 4688} {"train_loss": -26.44235610961914, "global_step": 389137, "epoch": 4688} {"train_loss": -26.633691787719727, "global_step": 389138, "epoch": 4688} {"train_loss": -26.15424156188965, "global_step": 389139, "epoch": 4688} {"train_loss": -26.868879318237305, "global_step": 389140, "epoch": 4688} {"train_loss": -26.34049415588379, "global_step": 389141, "epoch": 4688} {"train_loss": -26.87635612487793, "global_step": 389142, "epoch": 4688} {"train_loss": -26.67636489868164, "global_step": 389143, "epoch": 4688} {"train_loss": -26.413848876953125, "global_step": 389144, "epoch": 4688} {"train_loss": -26.612897872924805, "global_step": 389145, "epoch": 4688} {"train_loss": -26.813709259033203, "global_step": 389146, "epoch": 4688} {"train_loss": -26.4833984375, "global_step": 389147, "epoch": 4688} {"train_loss": -26.485340118408203, "global_step": 389148, "epoch": 4688} {"train_loss": -26.702972412109375, "global_step": 389149, "epoch": 4688} {"train_loss": -26.907455444335938, "global_step": 389150, "epoch": 4688} {"train_loss": -26.854373931884766, "global_step": 389151, "epoch": 4688} {"train_loss": -26.651227951049805, "global_step": 389152, "epoch": 4688} {"train_loss": -26.35173988342285, "global_step": 389153, "epoch": 4688} {"train_loss": -26.024473190307617, "global_step": 389154, "epoch": 4688} {"train_loss": -25.959674835205078, "global_step": 389155, "epoch": 4688} {"train_loss": -25.45627212524414, "global_step": 389156, "epoch": 4688} {"train_loss": -25.86492919921875, "global_step": 389157, "epoch": 4688} {"train_loss": -25.496280670166016, "global_step": 389158, "epoch": 4688} {"train_loss": -26.2657413482666, "global_step": 389159, "epoch": 4688} {"train_loss": -26.32368278503418, "global_step": 389160, "epoch": 4688} {"train_loss": -26.224756240844727, "global_step": 389161, "epoch": 4688} {"train_loss": -25.39789390563965, "global_step": 389162, "epoch": 4688} {"train_loss": -26.731613159179688, "global_step": 389163, "epoch": 4688} {"train_loss": -26.260786056518555, "global_step": 389164, "epoch": 4688} {"train_loss": -26.180448532104492, "global_step": 389165, "epoch": 4688} {"train_loss": -26.262006759643555, "global_step": 389166, "epoch": 4688} {"train_loss": -26.169458389282227, "global_step": 389167, "epoch": 4688} {"train_loss": -26.067951202392578, "global_step": 389168, "epoch": 4688} {"train_loss": -26.266218185424805, "global_step": 389169, "epoch": 4688} {"train_loss": -26.40484046936035, "global_step": 389170, "epoch": 4688} {"train_loss": -25.93141746520996, "global_step": 389171, "epoch": 4688} {"train_loss": -26.4982852935791, "global_step": 389172, "epoch": 4688} {"train_loss": -26.630823135375977, "global_step": 389173, "epoch": 4688} {"train_loss": -26.55096435546875, "global_step": 389174, "epoch": 4688} {"train_loss": -26.269256591796875, "global_step": 389175, "epoch": 4688} {"train_loss": -26.30512809753418, "global_step": 389176, "epoch": 4688} {"train_loss": -26.275503158569336, "global_step": 389177, "epoch": 4688} {"train_loss": -26.359683990478516, "global_step": 389178, "epoch": 4688} {"train_loss": -26.065536499023438, "global_step": 389179, "epoch": 4688} {"train_loss": -26.462390899658203, "global_step": 389180, "epoch": 4688} {"train_loss": -26.206579208374023, "global_step": 389181, "epoch": 4688} {"train_loss": -26.39751625061035, "global_step": 389182, "epoch": 4688} {"train_loss": -26.597747802734375, "global_step": 389183, "epoch": 4688} {"train_loss": -26.671112060546875, "global_step": 389184, "epoch": 4688} {"train_loss": -26.97397804260254, "global_step": 389185, "epoch": 4688} {"train_loss": -26.277192242174262, "global_step": 389186, "epoch": 4688, "val_loss": 6612636.0} {"train_loss": -26.299890518188477, "global_step": 389187, "epoch": 4689} {"train_loss": -26.001157760620117, "global_step": 389188, "epoch": 4689} {"train_loss": -26.469762802124023, "global_step": 389189, "epoch": 4689} {"train_loss": -26.714344024658203, "global_step": 389190, "epoch": 4689} {"train_loss": -26.571552276611328, "global_step": 389191, "epoch": 4689} {"train_loss": -26.124170303344727, "global_step": 389192, "epoch": 4689} {"train_loss": -26.768707275390625, "global_step": 389193, "epoch": 4689} {"train_loss": -26.237232208251953, "global_step": 389194, "epoch": 4689} {"train_loss": -26.122543334960938, "global_step": 389195, "epoch": 4689} {"train_loss": -26.2358455657959, "global_step": 389196, "epoch": 4689} {"train_loss": -26.31513023376465, "global_step": 389197, "epoch": 4689} {"train_loss": -26.7077579498291, "global_step": 389198, "epoch": 4689} {"train_loss": -25.8192138671875, "global_step": 389199, "epoch": 4689} {"train_loss": -26.260099411010742, "global_step": 389200, "epoch": 4689} {"train_loss": -26.291828155517578, "global_step": 389201, "epoch": 4689} {"train_loss": -26.681615829467773, "global_step": 389202, "epoch": 4689} {"train_loss": -26.00214195251465, "global_step": 389203, "epoch": 4689} {"train_loss": -26.42119789123535, "global_step": 389204, "epoch": 4689} {"train_loss": -26.26460838317871, "global_step": 389205, "epoch": 4689} {"train_loss": -26.447885513305664, "global_step": 389206, "epoch": 4689} {"train_loss": -26.762420654296875, "global_step": 389207, "epoch": 4689} {"train_loss": -26.37799072265625, "global_step": 389208, "epoch": 4689} {"train_loss": -26.797576904296875, "global_step": 389209, "epoch": 4689} {"train_loss": -26.235624313354492, "global_step": 389210, "epoch": 4689} {"train_loss": -26.2744140625, "global_step": 389211, "epoch": 4689} {"train_loss": -26.26030921936035, "global_step": 389212, "epoch": 4689} {"train_loss": -26.346607208251953, "global_step": 389213, "epoch": 4689} {"train_loss": -26.136194229125977, "global_step": 389214, "epoch": 4689} {"train_loss": -26.7633056640625, "global_step": 389215, "epoch": 4689} {"train_loss": -26.115400314331055, "global_step": 389216, "epoch": 4689} {"train_loss": -26.530546188354492, "global_step": 389217, "epoch": 4689} {"train_loss": -26.183141708374023, "global_step": 389218, "epoch": 4689} {"train_loss": -26.5153751373291, "global_step": 389219, "epoch": 4689} {"train_loss": -26.530195236206055, "global_step": 389220, "epoch": 4689} {"train_loss": -26.130176544189453, "global_step": 389221, "epoch": 4689} {"train_loss": -26.375234603881836, "global_step": 389222, "epoch": 4689} {"train_loss": -26.544973373413086, "global_step": 389223, "epoch": 4689} {"train_loss": -26.93549919128418, "global_step": 389224, "epoch": 4689} {"train_loss": -26.581457138061523, "global_step": 389225, "epoch": 4689} {"train_loss": -26.452329635620117, "global_step": 389226, "epoch": 4689} {"train_loss": -26.733051300048828, "global_step": 389227, "epoch": 4689} {"train_loss": -26.139545440673828, "global_step": 389228, "epoch": 4689} {"train_loss": -26.49629783630371, "global_step": 389229, "epoch": 4689} {"train_loss": -26.564987182617188, "global_step": 389230, "epoch": 4689} {"train_loss": -26.5237979888916, "global_step": 389231, "epoch": 4689} {"train_loss": -26.645849227905273, "global_step": 389232, "epoch": 4689} {"train_loss": -26.593061447143555, "global_step": 389233, "epoch": 4689} {"train_loss": -26.547870635986328, "global_step": 389234, "epoch": 4689} {"train_loss": -26.54444694519043, "global_step": 389235, "epoch": 4689} {"train_loss": -26.478620529174805, "global_step": 389236, "epoch": 4689} {"train_loss": -26.537372589111328, "global_step": 389237, "epoch": 4689} {"train_loss": -26.898284912109375, "global_step": 389238, "epoch": 4689} {"train_loss": -26.269439697265625, "global_step": 389239, "epoch": 4689} {"train_loss": -26.373632431030273, "global_step": 389240, "epoch": 4689} {"train_loss": -26.079730987548828, "global_step": 389241, "epoch": 4689} {"train_loss": -26.506153106689453, "global_step": 389242, "epoch": 4689} {"train_loss": -26.271753311157227, "global_step": 389243, "epoch": 4689} {"train_loss": -26.415088653564453, "global_step": 389244, "epoch": 4689} {"train_loss": -25.88699722290039, "global_step": 389245, "epoch": 4689} {"train_loss": -25.243467330932617, "global_step": 389246, "epoch": 4689} {"train_loss": -26.48941421508789, "global_step": 389247, "epoch": 4689} {"train_loss": -26.265127182006836, "global_step": 389248, "epoch": 4689} {"train_loss": -25.76421546936035, "global_step": 389249, "epoch": 4689} {"train_loss": -26.503110885620117, "global_step": 389250, "epoch": 4689} {"train_loss": -26.424264907836914, "global_step": 389251, "epoch": 4689} {"train_loss": -26.402374267578125, "global_step": 389252, "epoch": 4689} {"train_loss": -26.40700340270996, "global_step": 389253, "epoch": 4689} {"train_loss": -26.192890167236328, "global_step": 389254, "epoch": 4689} {"train_loss": -26.323999404907227, "global_step": 389255, "epoch": 4689} {"train_loss": -26.34492301940918, "global_step": 389256, "epoch": 4689} {"train_loss": -26.57234001159668, "global_step": 389257, "epoch": 4689} {"train_loss": -26.645227432250977, "global_step": 389258, "epoch": 4689} {"train_loss": -26.26227378845215, "global_step": 389259, "epoch": 4689} {"train_loss": -26.711694717407227, "global_step": 389260, "epoch": 4689} {"train_loss": -26.56597900390625, "global_step": 389261, "epoch": 4689} {"train_loss": -26.504430770874023, "global_step": 389262, "epoch": 4689} {"train_loss": -26.763813018798828, "global_step": 389263, "epoch": 4689} {"train_loss": -26.49126625061035, "global_step": 389264, "epoch": 4689} {"train_loss": -26.298852920532227, "global_step": 389265, "epoch": 4689} {"train_loss": -26.710596084594727, "global_step": 389266, "epoch": 4689} {"train_loss": -26.68017578125, "global_step": 389267, "epoch": 4689} {"train_loss": -26.661340713500977, "global_step": 389268, "epoch": 4689} {"train_loss": -26.398273146296123, "global_step": 389269, "epoch": 4689, "val_loss": 6576632.0} {"train_loss": -25.881610870361328, "global_step": 389270, "epoch": 4690} {"train_loss": -25.806324005126953, "global_step": 389271, "epoch": 4690} {"train_loss": -26.13150978088379, "global_step": 389272, "epoch": 4690} {"train_loss": -25.748838424682617, "global_step": 389273, "epoch": 4690} {"train_loss": -25.609628677368164, "global_step": 389274, "epoch": 4690} {"train_loss": -26.14678382873535, "global_step": 389275, "epoch": 4690} {"train_loss": -25.9374942779541, "global_step": 389276, "epoch": 4690} {"train_loss": -26.16876220703125, "global_step": 389277, "epoch": 4690} {"train_loss": -26.185089111328125, "global_step": 389278, "epoch": 4690} {"train_loss": -25.48634910583496, "global_step": 389279, "epoch": 4690} {"train_loss": -26.26740074157715, "global_step": 389280, "epoch": 4690} {"train_loss": -25.831201553344727, "global_step": 389281, "epoch": 4690} {"train_loss": -26.354801177978516, "global_step": 389282, "epoch": 4690} {"train_loss": -26.15627098083496, "global_step": 389283, "epoch": 4690} {"train_loss": -26.15348243713379, "global_step": 389284, "epoch": 4690} {"train_loss": -26.174713134765625, "global_step": 389285, "epoch": 4690} {"train_loss": -26.21909523010254, "global_step": 389286, "epoch": 4690} {"train_loss": -25.756290435791016, "global_step": 389287, "epoch": 4690} {"train_loss": -26.4644718170166, "global_step": 389288, "epoch": 4690} {"train_loss": -26.100528717041016, "global_step": 389289, "epoch": 4690} {"train_loss": -26.40573501586914, "global_step": 389290, "epoch": 4690} {"train_loss": -26.327295303344727, "global_step": 389291, "epoch": 4690} {"train_loss": -26.461145401000977, "global_step": 389292, "epoch": 4690} {"train_loss": -26.182920455932617, "global_step": 389293, "epoch": 4690} {"train_loss": -26.25984001159668, "global_step": 389294, "epoch": 4690} {"train_loss": -26.38175392150879, "global_step": 389295, "epoch": 4690} {"train_loss": -26.608264923095703, "global_step": 389296, "epoch": 4690} {"train_loss": -26.309051513671875, "global_step": 389297, "epoch": 4690} {"train_loss": -26.681303024291992, "global_step": 389298, "epoch": 4690} {"train_loss": -26.814544677734375, "global_step": 389299, "epoch": 4690} {"train_loss": -26.90830421447754, "global_step": 389300, "epoch": 4690} {"train_loss": -26.535602569580078, "global_step": 389301, "epoch": 4690} {"train_loss": -26.410009384155273, "global_step": 389302, "epoch": 4690} {"train_loss": -26.5344295501709, "global_step": 389303, "epoch": 4690} {"train_loss": -26.75104331970215, "global_step": 389304, "epoch": 4690} {"train_loss": -26.554468154907227, "global_step": 389305, "epoch": 4690} {"train_loss": -26.891254425048828, "global_step": 389306, "epoch": 4690} {"train_loss": -26.629175186157227, "global_step": 389307, "epoch": 4690} {"train_loss": -26.56586265563965, "global_step": 389308, "epoch": 4690} {"train_loss": -26.715925216674805, "global_step": 389309, "epoch": 4690} {"train_loss": -26.3619441986084, "global_step": 389310, "epoch": 4690} {"train_loss": -26.82728385925293, "global_step": 389311, "epoch": 4690} {"train_loss": -27.044132232666016, "global_step": 389312, "epoch": 4690} {"train_loss": -26.59499168395996, "global_step": 389313, "epoch": 4690} {"train_loss": -26.69959831237793, "global_step": 389314, "epoch": 4690} {"train_loss": -26.943323135375977, "global_step": 389315, "epoch": 4690} {"train_loss": -26.63028335571289, "global_step": 389316, "epoch": 4690} {"train_loss": -26.83820152282715, "global_step": 389317, "epoch": 4690} {"train_loss": -26.460187911987305, "global_step": 389318, "epoch": 4690} {"train_loss": -26.462499618530273, "global_step": 389319, "epoch": 4690} {"train_loss": -26.220117568969727, "global_step": 389320, "epoch": 4690} {"train_loss": -26.54487419128418, "global_step": 389321, "epoch": 4690} {"train_loss": -26.566679000854492, "global_step": 389322, "epoch": 4690} {"train_loss": -26.302091598510742, "global_step": 389323, "epoch": 4690} {"train_loss": -26.661985397338867, "global_step": 389324, "epoch": 4690} {"train_loss": -26.337177276611328, "global_step": 389325, "epoch": 4690} {"train_loss": -26.898487091064453, "global_step": 389326, "epoch": 4690} {"train_loss": -26.920501708984375, "global_step": 389327, "epoch": 4690} {"train_loss": -26.364171981811523, "global_step": 389328, "epoch": 4690} {"train_loss": -26.266178131103516, "global_step": 389329, "epoch": 4690} {"train_loss": -26.385940551757812, "global_step": 389330, "epoch": 4690} {"train_loss": -26.52923011779785, "global_step": 389331, "epoch": 4690} {"train_loss": -26.70180320739746, "global_step": 389332, "epoch": 4690} {"train_loss": -26.5811710357666, "global_step": 389333, "epoch": 4690} {"train_loss": -26.417743682861328, "global_step": 389334, "epoch": 4690} {"train_loss": -26.654626846313477, "global_step": 389335, "epoch": 4690} {"train_loss": -26.600177764892578, "global_step": 389336, "epoch": 4690} {"train_loss": -26.609272003173828, "global_step": 389337, "epoch": 4690} {"train_loss": -26.60076904296875, "global_step": 389338, "epoch": 4690} {"train_loss": -26.559350967407227, "global_step": 389339, "epoch": 4690} {"train_loss": -26.1444149017334, "global_step": 389340, "epoch": 4690} {"train_loss": -26.6488037109375, "global_step": 389341, "epoch": 4690} {"train_loss": -26.357593536376953, "global_step": 389342, "epoch": 4690} {"train_loss": -26.3682804107666, "global_step": 389343, "epoch": 4690} {"train_loss": -26.63337516784668, "global_step": 389344, "epoch": 4690} {"train_loss": -26.649744033813477, "global_step": 389345, "epoch": 4690} {"train_loss": -25.916019439697266, "global_step": 389346, "epoch": 4690} {"train_loss": -26.189605712890625, "global_step": 389347, "epoch": 4690} {"train_loss": -26.023391723632812, "global_step": 389348, "epoch": 4690} {"train_loss": -26.12158203125, "global_step": 389349, "epoch": 4690} {"train_loss": -26.27898597717285, "global_step": 389350, "epoch": 4690} {"train_loss": -26.328815460205078, "global_step": 389351, "epoch": 4690} {"train_loss": -26.392814107688075, "global_step": 389352, "epoch": 4690, "val_loss": 6652553.0} {"train_loss": -25.713830947875977, "global_step": 389353, "epoch": 4691} {"train_loss": -26.208526611328125, "global_step": 389354, "epoch": 4691} {"train_loss": -25.690710067749023, "global_step": 389355, "epoch": 4691} {"train_loss": -26.108524322509766, "global_step": 389356, "epoch": 4691} {"train_loss": -26.007394790649414, "global_step": 389357, "epoch": 4691} {"train_loss": -25.752744674682617, "global_step": 389358, "epoch": 4691} {"train_loss": -26.2891902923584, "global_step": 389359, "epoch": 4691} {"train_loss": -26.08306884765625, "global_step": 389360, "epoch": 4691} {"train_loss": -26.188547134399414, "global_step": 389361, "epoch": 4691} {"train_loss": -26.309436798095703, "global_step": 389362, "epoch": 4691} {"train_loss": -26.108877182006836, "global_step": 389363, "epoch": 4691} {"train_loss": -26.487335205078125, "global_step": 389364, "epoch": 4691} {"train_loss": -26.320348739624023, "global_step": 389365, "epoch": 4691} {"train_loss": -25.982421875, "global_step": 389366, "epoch": 4691} {"train_loss": -26.23455810546875, "global_step": 389367, "epoch": 4691} {"train_loss": -26.235614776611328, "global_step": 389368, "epoch": 4691} {"train_loss": -26.680845260620117, "global_step": 389369, "epoch": 4691} {"train_loss": -26.28913688659668, "global_step": 389370, "epoch": 4691} {"train_loss": -26.45952796936035, "global_step": 389371, "epoch": 4691} {"train_loss": -26.349756240844727, "global_step": 389372, "epoch": 4691} {"train_loss": -26.134307861328125, "global_step": 389373, "epoch": 4691} {"train_loss": -26.574630737304688, "global_step": 389374, "epoch": 4691} {"train_loss": -26.34212303161621, "global_step": 389375, "epoch": 4691} {"train_loss": -26.577123641967773, "global_step": 389376, "epoch": 4691} {"train_loss": -26.368078231811523, "global_step": 389377, "epoch": 4691} {"train_loss": -26.278644561767578, "global_step": 389378, "epoch": 4691} {"train_loss": -26.630414962768555, "global_step": 389379, "epoch": 4691} {"train_loss": -26.31361198425293, "global_step": 389380, "epoch": 4691} {"train_loss": -26.515165328979492, "global_step": 389381, "epoch": 4691} {"train_loss": -26.864587783813477, "global_step": 389382, "epoch": 4691} {"train_loss": -26.70977210998535, "global_step": 389383, "epoch": 4691} {"train_loss": -26.88014030456543, "global_step": 389384, "epoch": 4691} {"train_loss": -26.797576904296875, "global_step": 389385, "epoch": 4691} {"train_loss": -26.70380973815918, "global_step": 389386, "epoch": 4691} {"train_loss": -26.74066734313965, "global_step": 389387, "epoch": 4691} {"train_loss": -26.829090118408203, "global_step": 389388, "epoch": 4691} {"train_loss": -26.3294620513916, "global_step": 389389, "epoch": 4691} {"train_loss": -26.62320899963379, "global_step": 389390, "epoch": 4691} {"train_loss": -26.628076553344727, "global_step": 389391, "epoch": 4691} {"train_loss": -26.544095993041992, "global_step": 389392, "epoch": 4691} {"train_loss": -26.231616973876953, "global_step": 389393, "epoch": 4691} {"train_loss": -26.588916778564453, "global_step": 389394, "epoch": 4691} {"train_loss": -26.934646606445312, "global_step": 389395, "epoch": 4691} {"train_loss": -26.92994499206543, "global_step": 389396, "epoch": 4691} {"train_loss": -26.53989028930664, "global_step": 389397, "epoch": 4691} {"train_loss": -26.7147274017334, "global_step": 389398, "epoch": 4691} {"train_loss": -26.74323844909668, "global_step": 389399, "epoch": 4691} {"train_loss": -26.517087936401367, "global_step": 389400, "epoch": 4691} {"train_loss": -26.855533599853516, "global_step": 389401, "epoch": 4691} {"train_loss": -26.67561149597168, "global_step": 389402, "epoch": 4691} {"train_loss": -27.056507110595703, "global_step": 389403, "epoch": 4691} {"train_loss": -27.0395450592041, "global_step": 389404, "epoch": 4691} {"train_loss": -26.753589630126953, "global_step": 389405, "epoch": 4691} {"train_loss": -26.577924728393555, "global_step": 389406, "epoch": 4691} {"train_loss": -26.559173583984375, "global_step": 389407, "epoch": 4691} {"train_loss": -26.5970401763916, "global_step": 389408, "epoch": 4691} {"train_loss": -26.54556655883789, "global_step": 389409, "epoch": 4691} {"train_loss": -26.834985733032227, "global_step": 389410, "epoch": 4691} {"train_loss": -26.987903594970703, "global_step": 389411, "epoch": 4691} {"train_loss": -26.429065704345703, "global_step": 389412, "epoch": 4691} {"train_loss": -26.845050811767578, "global_step": 389413, "epoch": 4691} {"train_loss": -26.52669334411621, "global_step": 389414, "epoch": 4691} {"train_loss": -26.532751083374023, "global_step": 389415, "epoch": 4691} {"train_loss": -26.772785186767578, "global_step": 389416, "epoch": 4691} {"train_loss": -26.670560836791992, "global_step": 389417, "epoch": 4691} {"train_loss": -26.525766372680664, "global_step": 389418, "epoch": 4691} {"train_loss": -26.688379287719727, "global_step": 389419, "epoch": 4691} {"train_loss": -26.596555709838867, "global_step": 389420, "epoch": 4691} {"train_loss": -26.448261260986328, "global_step": 389421, "epoch": 4691} {"train_loss": -26.404449462890625, "global_step": 389422, "epoch": 4691} {"train_loss": -26.587411880493164, "global_step": 389423, "epoch": 4691} {"train_loss": -26.491668701171875, "global_step": 389424, "epoch": 4691} {"train_loss": -26.66316795349121, "global_step": 389425, "epoch": 4691} {"train_loss": -26.189462661743164, "global_step": 389426, "epoch": 4691} {"train_loss": -25.96234703063965, "global_step": 389427, "epoch": 4691} {"train_loss": -25.828662872314453, "global_step": 389428, "epoch": 4691} {"train_loss": -26.057470321655273, "global_step": 389429, "epoch": 4691} {"train_loss": -26.423925399780273, "global_step": 389430, "epoch": 4691} {"train_loss": -26.275131225585938, "global_step": 389431, "epoch": 4691} {"train_loss": -25.9149227142334, "global_step": 389432, "epoch": 4691} {"train_loss": -25.918537139892578, "global_step": 389433, "epoch": 4691} {"train_loss": -26.30682945251465, "global_step": 389434, "epoch": 4691} {"train_loss": -26.44093894958496, "global_step": 389435, "epoch": 4691, "val_loss": 6519252.0} {"train_loss": -25.3990421295166, "global_step": 389436, "epoch": 4692} {"train_loss": -25.760528564453125, "global_step": 389437, "epoch": 4692} {"train_loss": -25.364625930786133, "global_step": 389438, "epoch": 4692} {"train_loss": -25.434558868408203, "global_step": 389439, "epoch": 4692} {"train_loss": -25.47715950012207, "global_step": 389440, "epoch": 4692} {"train_loss": -25.302946090698242, "global_step": 389441, "epoch": 4692} {"train_loss": -25.365697860717773, "global_step": 389442, "epoch": 4692} {"train_loss": -25.6761474609375, "global_step": 389443, "epoch": 4692} {"train_loss": -25.30953025817871, "global_step": 389444, "epoch": 4692} {"train_loss": -26.20644187927246, "global_step": 389445, "epoch": 4692} {"train_loss": -25.877212524414062, "global_step": 389446, "epoch": 4692} {"train_loss": -26.013280868530273, "global_step": 389447, "epoch": 4692} {"train_loss": -25.96082878112793, "global_step": 389448, "epoch": 4692} {"train_loss": -26.16597557067871, "global_step": 389449, "epoch": 4692} {"train_loss": -25.61508560180664, "global_step": 389450, "epoch": 4692} {"train_loss": -26.57996940612793, "global_step": 389451, "epoch": 4692} {"train_loss": -26.163854598999023, "global_step": 389452, "epoch": 4692} {"train_loss": -26.205810546875, "global_step": 389453, "epoch": 4692} {"train_loss": -26.2165584564209, "global_step": 389454, "epoch": 4692} {"train_loss": -25.872608184814453, "global_step": 389455, "epoch": 4692} {"train_loss": -25.928098678588867, "global_step": 389456, "epoch": 4692} {"train_loss": -26.365808486938477, "global_step": 389457, "epoch": 4692} {"train_loss": -26.33389663696289, "global_step": 389458, "epoch": 4692} {"train_loss": -26.095905303955078, "global_step": 389459, "epoch": 4692} {"train_loss": -26.312442779541016, "global_step": 389460, "epoch": 4692} {"train_loss": -26.2999267578125, "global_step": 389461, "epoch": 4692} {"train_loss": -26.65193748474121, "global_step": 389462, "epoch": 4692} {"train_loss": -26.390100479125977, "global_step": 389463, "epoch": 4692} {"train_loss": -26.315826416015625, "global_step": 389464, "epoch": 4692} {"train_loss": -26.429426193237305, "global_step": 389465, "epoch": 4692} {"train_loss": -26.742828369140625, "global_step": 389466, "epoch": 4692} {"train_loss": -26.08258056640625, "global_step": 389467, "epoch": 4692} {"train_loss": -26.494735717773438, "global_step": 389468, "epoch": 4692} {"train_loss": -26.844253540039062, "global_step": 389469, "epoch": 4692} {"train_loss": -26.58392333984375, "global_step": 389470, "epoch": 4692} {"train_loss": -26.481210708618164, "global_step": 389471, "epoch": 4692} {"train_loss": -26.42694664001465, "global_step": 389472, "epoch": 4692} {"train_loss": -26.641565322875977, "global_step": 389473, "epoch": 4692} {"train_loss": -26.38337516784668, "global_step": 389474, "epoch": 4692} {"train_loss": -26.475000381469727, "global_step": 389475, "epoch": 4692} {"train_loss": -26.753406524658203, "global_step": 389476, "epoch": 4692} {"train_loss": -26.871124267578125, "global_step": 389477, "epoch": 4692} {"train_loss": -26.26900291442871, "global_step": 389478, "epoch": 4692} {"train_loss": -26.542932510375977, "global_step": 389479, "epoch": 4692} {"train_loss": -26.827381134033203, "global_step": 389480, "epoch": 4692} {"train_loss": -26.69476890563965, "global_step": 389481, "epoch": 4692} {"train_loss": -26.793237686157227, "global_step": 389482, "epoch": 4692} {"train_loss": -26.69154930114746, "global_step": 389483, "epoch": 4692} {"train_loss": -26.583026885986328, "global_step": 389484, "epoch": 4692} {"train_loss": -26.507099151611328, "global_step": 389485, "epoch": 4692} {"train_loss": -26.7970027923584, "global_step": 389486, "epoch": 4692} {"train_loss": -26.8513126373291, "global_step": 389487, "epoch": 4692} {"train_loss": -26.910017013549805, "global_step": 389488, "epoch": 4692} {"train_loss": -26.194171905517578, "global_step": 389489, "epoch": 4692} {"train_loss": -26.76100730895996, "global_step": 389490, "epoch": 4692} {"train_loss": -26.816452026367188, "global_step": 389491, "epoch": 4692} {"train_loss": -26.575443267822266, "global_step": 389492, "epoch": 4692} {"train_loss": -26.540653228759766, "global_step": 389493, "epoch": 4692} {"train_loss": -26.623960494995117, "global_step": 389494, "epoch": 4692} {"train_loss": -26.849475860595703, "global_step": 389495, "epoch": 4692} {"train_loss": -26.840566635131836, "global_step": 389496, "epoch": 4692} {"train_loss": -26.6827449798584, "global_step": 389497, "epoch": 4692} {"train_loss": -26.715320587158203, "global_step": 389498, "epoch": 4692} {"train_loss": -26.563135147094727, "global_step": 389499, "epoch": 4692} {"train_loss": -26.862573623657227, "global_step": 389500, "epoch": 4692} {"train_loss": -26.392993927001953, "global_step": 389501, "epoch": 4692} {"train_loss": -26.375410079956055, "global_step": 389502, "epoch": 4692} {"train_loss": -26.473770141601562, "global_step": 389503, "epoch": 4692} {"train_loss": -27.051111221313477, "global_step": 389504, "epoch": 4692} {"train_loss": -26.65520668029785, "global_step": 389505, "epoch": 4692} {"train_loss": -26.494077682495117, "global_step": 389506, "epoch": 4692} {"train_loss": -26.259733200073242, "global_step": 389507, "epoch": 4692} {"train_loss": -25.8541202545166, "global_step": 389508, "epoch": 4692} {"train_loss": -26.197723388671875, "global_step": 389509, "epoch": 4692} {"train_loss": -26.106168746948242, "global_step": 389510, "epoch": 4692} {"train_loss": -26.301639556884766, "global_step": 389511, "epoch": 4692} {"train_loss": -26.003705978393555, "global_step": 389512, "epoch": 4692} {"train_loss": -26.474218368530273, "global_step": 389513, "epoch": 4692} {"train_loss": -26.385969161987305, "global_step": 389514, "epoch": 4692} {"train_loss": -26.3609561920166, "global_step": 389515, "epoch": 4692} {"train_loss": -26.22379493713379, "global_step": 389516, "epoch": 4692} {"train_loss": -26.454992294311523, "global_step": 389517, "epoch": 4692} {"train_loss": -26.358230223138648, "global_step": 389518, "epoch": 4692, "val_loss": 6683652.0} {"train_loss": -26.368743896484375, "global_step": 389519, "epoch": 4693} {"train_loss": -26.314233779907227, "global_step": 389520, "epoch": 4693} {"train_loss": -25.89410400390625, "global_step": 389521, "epoch": 4693} {"train_loss": -25.787128448486328, "global_step": 389522, "epoch": 4693} {"train_loss": -25.842132568359375, "global_step": 389523, "epoch": 4693} {"train_loss": -25.72321128845215, "global_step": 389524, "epoch": 4693} {"train_loss": -26.027240753173828, "global_step": 389525, "epoch": 4693} {"train_loss": -26.0935115814209, "global_step": 389526, "epoch": 4693} {"train_loss": -26.32265281677246, "global_step": 389527, "epoch": 4693} {"train_loss": -26.079050064086914, "global_step": 389528, "epoch": 4693} {"train_loss": -26.102447509765625, "global_step": 389529, "epoch": 4693} {"train_loss": -25.866226196289062, "global_step": 389530, "epoch": 4693} {"train_loss": -26.44098472595215, "global_step": 389531, "epoch": 4693} {"train_loss": -26.392044067382812, "global_step": 389532, "epoch": 4693} {"train_loss": -26.287290573120117, "global_step": 389533, "epoch": 4693} {"train_loss": -26.229001998901367, "global_step": 389534, "epoch": 4693} {"train_loss": -26.094327926635742, "global_step": 389535, "epoch": 4693} {"train_loss": -26.37575340270996, "global_step": 389536, "epoch": 4693} {"train_loss": -26.368635177612305, "global_step": 389537, "epoch": 4693} {"train_loss": -26.267475128173828, "global_step": 389538, "epoch": 4693} {"train_loss": -26.764535903930664, "global_step": 389539, "epoch": 4693} {"train_loss": -25.9278621673584, "global_step": 389540, "epoch": 4693} {"train_loss": -26.50037956237793, "global_step": 389541, "epoch": 4693} {"train_loss": -26.254430770874023, "global_step": 389542, "epoch": 4693} {"train_loss": -26.400177001953125, "global_step": 389543, "epoch": 4693} {"train_loss": -26.386075973510742, "global_step": 389544, "epoch": 4693} {"train_loss": -26.531641006469727, "global_step": 389545, "epoch": 4693} {"train_loss": -26.514057159423828, "global_step": 389546, "epoch": 4693} {"train_loss": -26.84018898010254, "global_step": 389547, "epoch": 4693} {"train_loss": -26.186471939086914, "global_step": 389548, "epoch": 4693} {"train_loss": -26.882312774658203, "global_step": 389549, "epoch": 4693} {"train_loss": -26.985565185546875, "global_step": 389550, "epoch": 4693} {"train_loss": -26.47201919555664, "global_step": 389551, "epoch": 4693} {"train_loss": -26.5892333984375, "global_step": 389552, "epoch": 4693} {"train_loss": -26.676116943359375, "global_step": 389553, "epoch": 4693} {"train_loss": -26.5821533203125, "global_step": 389554, "epoch": 4693} {"train_loss": -26.67779541015625, "global_step": 389555, "epoch": 4693} {"train_loss": -26.474689483642578, "global_step": 389556, "epoch": 4693} {"train_loss": -26.893545150756836, "global_step": 389557, "epoch": 4693} {"train_loss": -26.690332412719727, "global_step": 389558, "epoch": 4693} {"train_loss": -26.97743034362793, "global_step": 389559, "epoch": 4693} {"train_loss": -26.687366485595703, "global_step": 389560, "epoch": 4693} {"train_loss": -26.658447265625, "global_step": 389561, "epoch": 4693} {"train_loss": -26.862445831298828, "global_step": 389562, "epoch": 4693} {"train_loss": -26.74323844909668, "global_step": 389563, "epoch": 4693} {"train_loss": -26.9442138671875, "global_step": 389564, "epoch": 4693} {"train_loss": -26.480850219726562, "global_step": 389565, "epoch": 4693} {"train_loss": -26.48139762878418, "global_step": 389566, "epoch": 4693} {"train_loss": -26.28956413269043, "global_step": 389567, "epoch": 4693} {"train_loss": -26.469409942626953, "global_step": 389568, "epoch": 4693} {"train_loss": -26.559289932250977, "global_step": 389569, "epoch": 4693} {"train_loss": -26.36964225769043, "global_step": 389570, "epoch": 4693} {"train_loss": -26.685422897338867, "global_step": 389571, "epoch": 4693} {"train_loss": -26.327722549438477, "global_step": 389572, "epoch": 4693} {"train_loss": -26.29144859313965, "global_step": 389573, "epoch": 4693} {"train_loss": -26.598346710205078, "global_step": 389574, "epoch": 4693} {"train_loss": -26.336029052734375, "global_step": 389575, "epoch": 4693} {"train_loss": -26.549591064453125, "global_step": 389576, "epoch": 4693} {"train_loss": -26.164154052734375, "global_step": 389577, "epoch": 4693} {"train_loss": -25.700315475463867, "global_step": 389578, "epoch": 4693} {"train_loss": -25.636274337768555, "global_step": 389579, "epoch": 4693} {"train_loss": -26.314794540405273, "global_step": 389580, "epoch": 4693} {"train_loss": -25.737192153930664, "global_step": 389581, "epoch": 4693} {"train_loss": -25.763946533203125, "global_step": 389582, "epoch": 4693} {"train_loss": -25.766088485717773, "global_step": 389583, "epoch": 4693} {"train_loss": -26.147748947143555, "global_step": 389584, "epoch": 4693} {"train_loss": -26.084747314453125, "global_step": 389585, "epoch": 4693} {"train_loss": -26.180221557617188, "global_step": 389586, "epoch": 4693} {"train_loss": -26.249176025390625, "global_step": 389587, "epoch": 4693} {"train_loss": -26.441221237182617, "global_step": 389588, "epoch": 4693} {"train_loss": -26.59050941467285, "global_step": 389589, "epoch": 4693} {"train_loss": -26.165740966796875, "global_step": 389590, "epoch": 4693} {"train_loss": -26.08976173400879, "global_step": 389591, "epoch": 4693} {"train_loss": -26.30936050415039, "global_step": 389592, "epoch": 4693} {"train_loss": -26.157377243041992, "global_step": 389593, "epoch": 4693} {"train_loss": -26.73101234436035, "global_step": 389594, "epoch": 4693} {"train_loss": -26.20911979675293, "global_step": 389595, "epoch": 4693} {"train_loss": -26.6090145111084, "global_step": 389596, "epoch": 4693} {"train_loss": -26.176782608032227, "global_step": 389597, "epoch": 4693} {"train_loss": -26.41181755065918, "global_step": 389598, "epoch": 4693} {"train_loss": -26.225378036499023, "global_step": 389599, "epoch": 4693} {"train_loss": -26.271198272705078, "global_step": 389600, "epoch": 4693} {"train_loss": -26.366562119449476, "global_step": 389601, "epoch": 4693, "val_loss": 6563167.0} {"train_loss": -26.327131271362305, "global_step": 389602, "epoch": 4694} {"train_loss": -25.152868270874023, "global_step": 389603, "epoch": 4694} {"train_loss": -25.358501434326172, "global_step": 389604, "epoch": 4694} {"train_loss": -26.059833526611328, "global_step": 389605, "epoch": 4694} {"train_loss": -26.01435661315918, "global_step": 389606, "epoch": 4694} {"train_loss": -26.163476943969727, "global_step": 389607, "epoch": 4694} {"train_loss": -26.40683937072754, "global_step": 389608, "epoch": 4694} {"train_loss": -26.20123863220215, "global_step": 389609, "epoch": 4694} {"train_loss": -26.514150619506836, "global_step": 389610, "epoch": 4694} {"train_loss": -25.8383731842041, "global_step": 389611, "epoch": 4694} {"train_loss": -26.109655380249023, "global_step": 389612, "epoch": 4694} {"train_loss": -25.928558349609375, "global_step": 389613, "epoch": 4694} {"train_loss": -26.03706932067871, "global_step": 389614, "epoch": 4694} {"train_loss": -26.28960609436035, "global_step": 389615, "epoch": 4694} {"train_loss": -26.3355712890625, "global_step": 389616, "epoch": 4694} {"train_loss": -26.409753799438477, "global_step": 389617, "epoch": 4694} {"train_loss": -26.649625778198242, "global_step": 389618, "epoch": 4694} {"train_loss": -26.021677017211914, "global_step": 389619, "epoch": 4694} {"train_loss": -26.4346866607666, "global_step": 389620, "epoch": 4694} {"train_loss": -26.40521240234375, "global_step": 389621, "epoch": 4694} {"train_loss": -26.187591552734375, "global_step": 389622, "epoch": 4694} {"train_loss": -26.34228515625, "global_step": 389623, "epoch": 4694} {"train_loss": -26.62159538269043, "global_step": 389624, "epoch": 4694} {"train_loss": -26.320032119750977, "global_step": 389625, "epoch": 4694} {"train_loss": -26.307083129882812, "global_step": 389626, "epoch": 4694} {"train_loss": -26.758270263671875, "global_step": 389627, "epoch": 4694} {"train_loss": -26.52552604675293, "global_step": 389628, "epoch": 4694} {"train_loss": -26.506399154663086, "global_step": 389629, "epoch": 4694} {"train_loss": -26.6466121673584, "global_step": 389630, "epoch": 4694} {"train_loss": -26.46525001525879, "global_step": 389631, "epoch": 4694} {"train_loss": -26.785282135009766, "global_step": 389632, "epoch": 4694} {"train_loss": -26.62715721130371, "global_step": 389633, "epoch": 4694} {"train_loss": -26.494287490844727, "global_step": 389634, "epoch": 4694} {"train_loss": -26.559223175048828, "global_step": 389635, "epoch": 4694} {"train_loss": -26.520788192749023, "global_step": 389636, "epoch": 4694} {"train_loss": -26.373493194580078, "global_step": 389637, "epoch": 4694} {"train_loss": -26.568445205688477, "global_step": 389638, "epoch": 4694} {"train_loss": -26.8963565826416, "global_step": 389639, "epoch": 4694} {"train_loss": -26.552770614624023, "global_step": 389640, "epoch": 4694} {"train_loss": -26.432783126831055, "global_step": 389641, "epoch": 4694} {"train_loss": -26.76544189453125, "global_step": 389642, "epoch": 4694} {"train_loss": -26.520971298217773, "global_step": 389643, "epoch": 4694} {"train_loss": -26.4251651763916, "global_step": 389644, "epoch": 4694} {"train_loss": -26.59491539001465, "global_step": 389645, "epoch": 4694} {"train_loss": -26.573474884033203, "global_step": 389646, "epoch": 4694} {"train_loss": -26.639928817749023, "global_step": 389647, "epoch": 4694} {"train_loss": -26.05999755859375, "global_step": 389648, "epoch": 4694} {"train_loss": -26.2514591217041, "global_step": 389649, "epoch": 4694} {"train_loss": -26.095624923706055, "global_step": 389650, "epoch": 4694} {"train_loss": -26.55574607849121, "global_step": 389651, "epoch": 4694} {"train_loss": -26.416223526000977, "global_step": 389652, "epoch": 4694} {"train_loss": -26.447162628173828, "global_step": 389653, "epoch": 4694} {"train_loss": -26.4512939453125, "global_step": 389654, "epoch": 4694} {"train_loss": -26.24799156188965, "global_step": 389655, "epoch": 4694} {"train_loss": -26.4620361328125, "global_step": 389656, "epoch": 4694} {"train_loss": -26.26466178894043, "global_step": 389657, "epoch": 4694} {"train_loss": -26.865543365478516, "global_step": 389658, "epoch": 4694} {"train_loss": -26.447757720947266, "global_step": 389659, "epoch": 4694} {"train_loss": -26.598478317260742, "global_step": 389660, "epoch": 4694} {"train_loss": -26.42069435119629, "global_step": 389661, "epoch": 4694} {"train_loss": -26.681137084960938, "global_step": 389662, "epoch": 4694} {"train_loss": -26.463537216186523, "global_step": 389663, "epoch": 4694} {"train_loss": -26.6149845123291, "global_step": 389664, "epoch": 4694} {"train_loss": -26.536413192749023, "global_step": 389665, "epoch": 4694} {"train_loss": -26.628698348999023, "global_step": 389666, "epoch": 4694} {"train_loss": -26.461591720581055, "global_step": 389667, "epoch": 4694} {"train_loss": -26.398080825805664, "global_step": 389668, "epoch": 4694} {"train_loss": -26.761743545532227, "global_step": 389669, "epoch": 4694} {"train_loss": -26.84404945373535, "global_step": 389670, "epoch": 4694} {"train_loss": -26.370222091674805, "global_step": 389671, "epoch": 4694} {"train_loss": -26.524335861206055, "global_step": 389672, "epoch": 4694} {"train_loss": -26.764928817749023, "global_step": 389673, "epoch": 4694} {"train_loss": -26.822912216186523, "global_step": 389674, "epoch": 4694} {"train_loss": -26.589080810546875, "global_step": 389675, "epoch": 4694} {"train_loss": -26.62822914123535, "global_step": 389676, "epoch": 4694} {"train_loss": -26.971668243408203, "global_step": 389677, "epoch": 4694} {"train_loss": -26.406604766845703, "global_step": 389678, "epoch": 4694} {"train_loss": -26.699920654296875, "global_step": 389679, "epoch": 4694} {"train_loss": -26.89179801940918, "global_step": 389680, "epoch": 4694} {"train_loss": -26.39728355407715, "global_step": 389681, "epoch": 4694} {"train_loss": -26.603357315063477, "global_step": 389682, "epoch": 4694} {"train_loss": -26.312458038330078, "global_step": 389683, "epoch": 4694} {"train_loss": -26.432049096348774, "global_step": 389684, "epoch": 4694, "val_loss": 6642790.0} {"train_loss": -25.93659019470215, "global_step": 389685, "epoch": 4695} {"train_loss": -25.452667236328125, "global_step": 389686, "epoch": 4695} {"train_loss": -25.82843017578125, "global_step": 389687, "epoch": 4695} {"train_loss": -26.51025390625, "global_step": 389688, "epoch": 4695} {"train_loss": -26.2710018157959, "global_step": 389689, "epoch": 4695} {"train_loss": -26.0737247467041, "global_step": 389690, "epoch": 4695} {"train_loss": -26.2916316986084, "global_step": 389691, "epoch": 4695} {"train_loss": -26.203018188476562, "global_step": 389692, "epoch": 4695} {"train_loss": -26.4743595123291, "global_step": 389693, "epoch": 4695} {"train_loss": -26.300800323486328, "global_step": 389694, "epoch": 4695} {"train_loss": -26.2108097076416, "global_step": 389695, "epoch": 4695} {"train_loss": -26.155298233032227, "global_step": 389696, "epoch": 4695} {"train_loss": -26.54461669921875, "global_step": 389697, "epoch": 4695} {"train_loss": -26.330575942993164, "global_step": 389698, "epoch": 4695} {"train_loss": -25.976703643798828, "global_step": 389699, "epoch": 4695} {"train_loss": -26.21963882446289, "global_step": 389700, "epoch": 4695} {"train_loss": -26.15667724609375, "global_step": 389701, "epoch": 4695} {"train_loss": -26.33560562133789, "global_step": 389702, "epoch": 4695} {"train_loss": -26.4355525970459, "global_step": 389703, "epoch": 4695} {"train_loss": -26.451379776000977, "global_step": 389704, "epoch": 4695} {"train_loss": -26.310775756835938, "global_step": 389705, "epoch": 4695} {"train_loss": -26.481367111206055, "global_step": 389706, "epoch": 4695} {"train_loss": -26.50269889831543, "global_step": 389707, "epoch": 4695} {"train_loss": -26.694091796875, "global_step": 389708, "epoch": 4695} {"train_loss": -26.547590255737305, "global_step": 389709, "epoch": 4695} {"train_loss": -26.344823837280273, "global_step": 389710, "epoch": 4695} {"train_loss": -26.67341423034668, "global_step": 389711, "epoch": 4695} {"train_loss": -26.616504669189453, "global_step": 389712, "epoch": 4695} {"train_loss": -26.40162467956543, "global_step": 389713, "epoch": 4695} {"train_loss": -26.358306884765625, "global_step": 389714, "epoch": 4695} {"train_loss": -26.5562686920166, "global_step": 389715, "epoch": 4695} {"train_loss": -26.72834587097168, "global_step": 389716, "epoch": 4695} {"train_loss": -26.456329345703125, "global_step": 389717, "epoch": 4695} {"train_loss": -26.505903244018555, "global_step": 389718, "epoch": 4695} {"train_loss": -26.618671417236328, "global_step": 389719, "epoch": 4695} {"train_loss": -26.477880477905273, "global_step": 389720, "epoch": 4695} {"train_loss": -26.110315322875977, "global_step": 389721, "epoch": 4695} {"train_loss": -26.79156494140625, "global_step": 389722, "epoch": 4695} {"train_loss": -26.59394645690918, "global_step": 389723, "epoch": 4695} {"train_loss": -26.588016510009766, "global_step": 389724, "epoch": 4695} {"train_loss": -26.142805099487305, "global_step": 389725, "epoch": 4695} {"train_loss": -26.536340713500977, "global_step": 389726, "epoch": 4695} {"train_loss": -26.110050201416016, "global_step": 389727, "epoch": 4695} {"train_loss": -26.641773223876953, "global_step": 389728, "epoch": 4695} {"train_loss": -26.74774169921875, "global_step": 389729, "epoch": 4695} {"train_loss": -26.62505531311035, "global_step": 389730, "epoch": 4695} {"train_loss": -26.594205856323242, "global_step": 389731, "epoch": 4695} {"train_loss": -26.73475456237793, "global_step": 389732, "epoch": 4695} {"train_loss": -26.238744735717773, "global_step": 389733, "epoch": 4695} {"train_loss": -26.92529296875, "global_step": 389734, "epoch": 4695} {"train_loss": -26.86384391784668, "global_step": 389735, "epoch": 4695} {"train_loss": -27.223920822143555, "global_step": 389736, "epoch": 4695} {"train_loss": -26.574771881103516, "global_step": 389737, "epoch": 4695} {"train_loss": -26.524566650390625, "global_step": 389738, "epoch": 4695} {"train_loss": -26.816726684570312, "global_step": 389739, "epoch": 4695} {"train_loss": -26.80527114868164, "global_step": 389740, "epoch": 4695} {"train_loss": -26.54034423828125, "global_step": 389741, "epoch": 4695} {"train_loss": -26.58345603942871, "global_step": 389742, "epoch": 4695} {"train_loss": -26.5698299407959, "global_step": 389743, "epoch": 4695} {"train_loss": -26.73944664001465, "global_step": 389744, "epoch": 4695} {"train_loss": -26.443439483642578, "global_step": 389745, "epoch": 4695} {"train_loss": -26.81385612487793, "global_step": 389746, "epoch": 4695} {"train_loss": -26.461450576782227, "global_step": 389747, "epoch": 4695} {"train_loss": -26.21639060974121, "global_step": 389748, "epoch": 4695} {"train_loss": -26.152042388916016, "global_step": 389749, "epoch": 4695} {"train_loss": -25.717727661132812, "global_step": 389750, "epoch": 4695} {"train_loss": -26.051834106445312, "global_step": 389751, "epoch": 4695} {"train_loss": -26.5032958984375, "global_step": 389752, "epoch": 4695} {"train_loss": -26.088605880737305, "global_step": 389753, "epoch": 4695} {"train_loss": -25.997406005859375, "global_step": 389754, "epoch": 4695} {"train_loss": -25.834009170532227, "global_step": 389755, "epoch": 4695} {"train_loss": -26.193174362182617, "global_step": 389756, "epoch": 4695} {"train_loss": -26.110660552978516, "global_step": 389757, "epoch": 4695} {"train_loss": -25.80830192565918, "global_step": 389758, "epoch": 4695} {"train_loss": -26.351404190063477, "global_step": 389759, "epoch": 4695} {"train_loss": -26.162565231323242, "global_step": 389760, "epoch": 4695} {"train_loss": -26.168079376220703, "global_step": 389761, "epoch": 4695} {"train_loss": -25.943342208862305, "global_step": 389762, "epoch": 4695} {"train_loss": -26.078582763671875, "global_step": 389763, "epoch": 4695} {"train_loss": -25.94080924987793, "global_step": 389764, "epoch": 4695} {"train_loss": -26.554061889648438, "global_step": 389765, "epoch": 4695} {"train_loss": -26.10163688659668, "global_step": 389766, "epoch": 4695} {"train_loss": -26.35899773563247, "global_step": 389767, "epoch": 4695, "val_loss": 6569613.0} {"train_loss": -25.862085342407227, "global_step": 389768, "epoch": 4696} {"train_loss": -25.9091854095459, "global_step": 389769, "epoch": 4696} {"train_loss": -26.04495620727539, "global_step": 389770, "epoch": 4696} {"train_loss": -25.544147491455078, "global_step": 389771, "epoch": 4696} {"train_loss": -25.56243324279785, "global_step": 389772, "epoch": 4696} {"train_loss": -25.633268356323242, "global_step": 389773, "epoch": 4696} {"train_loss": -26.027734756469727, "global_step": 389774, "epoch": 4696} {"train_loss": -25.729795455932617, "global_step": 389775, "epoch": 4696} {"train_loss": -25.953094482421875, "global_step": 389776, "epoch": 4696} {"train_loss": -26.192096710205078, "global_step": 389777, "epoch": 4696} {"train_loss": -26.284061431884766, "global_step": 389778, "epoch": 4696} {"train_loss": -26.463056564331055, "global_step": 389779, "epoch": 4696} {"train_loss": -26.278736114501953, "global_step": 389780, "epoch": 4696} {"train_loss": -26.139591217041016, "global_step": 389781, "epoch": 4696} {"train_loss": -26.3486270904541, "global_step": 389782, "epoch": 4696} {"train_loss": -26.10236167907715, "global_step": 389783, "epoch": 4696} {"train_loss": -26.218830108642578, "global_step": 389784, "epoch": 4696} {"train_loss": -26.463876724243164, "global_step": 389785, "epoch": 4696} {"train_loss": -26.350934982299805, "global_step": 389786, "epoch": 4696} {"train_loss": -25.969030380249023, "global_step": 389787, "epoch": 4696} {"train_loss": -26.665557861328125, "global_step": 389788, "epoch": 4696} {"train_loss": -26.679386138916016, "global_step": 389789, "epoch": 4696} {"train_loss": -26.802549362182617, "global_step": 389790, "epoch": 4696} {"train_loss": -26.217819213867188, "global_step": 389791, "epoch": 4696} {"train_loss": -26.555570602416992, "global_step": 389792, "epoch": 4696} {"train_loss": -26.238088607788086, "global_step": 389793, "epoch": 4696} {"train_loss": -26.899267196655273, "global_step": 389794, "epoch": 4696} {"train_loss": -26.79456901550293, "global_step": 389795, "epoch": 4696} {"train_loss": -26.485143661499023, "global_step": 389796, "epoch": 4696} {"train_loss": -26.778629302978516, "global_step": 389797, "epoch": 4696} {"train_loss": -26.676877975463867, "global_step": 389798, "epoch": 4696} {"train_loss": -26.47014808654785, "global_step": 389799, "epoch": 4696} {"train_loss": -26.559497833251953, "global_step": 389800, "epoch": 4696} {"train_loss": -26.779821395874023, "global_step": 389801, "epoch": 4696} {"train_loss": -26.366825103759766, "global_step": 389802, "epoch": 4696} {"train_loss": -26.666229248046875, "global_step": 389803, "epoch": 4696} {"train_loss": -26.53913688659668, "global_step": 389804, "epoch": 4696} {"train_loss": -26.837818145751953, "global_step": 389805, "epoch": 4696} {"train_loss": -26.927759170532227, "global_step": 389806, "epoch": 4696} {"train_loss": -26.68033790588379, "global_step": 389807, "epoch": 4696} {"train_loss": -26.93507194519043, "global_step": 389808, "epoch": 4696} {"train_loss": -26.58038902282715, "global_step": 389809, "epoch": 4696} {"train_loss": -26.976154327392578, "global_step": 389810, "epoch": 4696} {"train_loss": -27.133865356445312, "global_step": 389811, "epoch": 4696} {"train_loss": -26.74729347229004, "global_step": 389812, "epoch": 4696} {"train_loss": -26.68701171875, "global_step": 389813, "epoch": 4696} {"train_loss": -26.7097110748291, "global_step": 389814, "epoch": 4696} {"train_loss": -26.8271541595459, "global_step": 389815, "epoch": 4696} {"train_loss": -26.95941734313965, "global_step": 389816, "epoch": 4696} {"train_loss": -26.735448837280273, "global_step": 389817, "epoch": 4696} {"train_loss": -26.359182357788086, "global_step": 389818, "epoch": 4696} {"train_loss": -25.994619369506836, "global_step": 389819, "epoch": 4696} {"train_loss": -26.57025718688965, "global_step": 389820, "epoch": 4696} {"train_loss": -26.145450592041016, "global_step": 389821, "epoch": 4696} {"train_loss": -26.229883193969727, "global_step": 389822, "epoch": 4696} {"train_loss": -26.170490264892578, "global_step": 389823, "epoch": 4696} {"train_loss": -26.162755966186523, "global_step": 389824, "epoch": 4696} {"train_loss": -26.495243072509766, "global_step": 389825, "epoch": 4696} {"train_loss": -26.644184112548828, "global_step": 389826, "epoch": 4696} {"train_loss": -26.654804229736328, "global_step": 389827, "epoch": 4696} {"train_loss": -26.723739624023438, "global_step": 389828, "epoch": 4696} {"train_loss": -26.54652976989746, "global_step": 389829, "epoch": 4696} {"train_loss": -26.418323516845703, "global_step": 389830, "epoch": 4696} {"train_loss": -26.69900894165039, "global_step": 389831, "epoch": 4696} {"train_loss": -26.32320213317871, "global_step": 389832, "epoch": 4696} {"train_loss": -26.253427505493164, "global_step": 389833, "epoch": 4696} {"train_loss": -26.570886611938477, "global_step": 389834, "epoch": 4696} {"train_loss": -27.127857208251953, "global_step": 389835, "epoch": 4696} {"train_loss": -26.460752487182617, "global_step": 389836, "epoch": 4696} {"train_loss": -26.532201766967773, "global_step": 389837, "epoch": 4696} {"train_loss": -26.33780860900879, "global_step": 389838, "epoch": 4696} {"train_loss": -26.405536651611328, "global_step": 389839, "epoch": 4696} {"train_loss": -26.344205856323242, "global_step": 389840, "epoch": 4696} {"train_loss": -26.0876407623291, "global_step": 389841, "epoch": 4696} {"train_loss": -26.496536254882812, "global_step": 389842, "epoch": 4696} {"train_loss": -26.25679588317871, "global_step": 389843, "epoch": 4696} {"train_loss": -26.44327163696289, "global_step": 389844, "epoch": 4696} {"train_loss": -26.59002113342285, "global_step": 389845, "epoch": 4696} {"train_loss": -26.530170440673828, "global_step": 389846, "epoch": 4696} {"train_loss": -26.532880783081055, "global_step": 389847, "epoch": 4696} {"train_loss": -26.618179321289062, "global_step": 389848, "epoch": 4696} {"train_loss": -26.665815353393555, "global_step": 389849, "epoch": 4696} {"train_loss": -26.452264739806395, "global_step": 389850, "epoch": 4696, "val_loss": 6605455.5} {"train_loss": -26.819721221923828, "global_step": 389851, "epoch": 4697} {"train_loss": -26.06313133239746, "global_step": 389852, "epoch": 4697} {"train_loss": -26.116138458251953, "global_step": 389853, "epoch": 4697} {"train_loss": -26.217145919799805, "global_step": 389854, "epoch": 4697} {"train_loss": -26.84889030456543, "global_step": 389855, "epoch": 4697} {"train_loss": -26.501407623291016, "global_step": 389856, "epoch": 4697} {"train_loss": -26.13837242126465, "global_step": 389857, "epoch": 4697} {"train_loss": -25.86697769165039, "global_step": 389858, "epoch": 4697} {"train_loss": -26.40044593811035, "global_step": 389859, "epoch": 4697} {"train_loss": -26.30960464477539, "global_step": 389860, "epoch": 4697} {"train_loss": -26.78395652770996, "global_step": 389861, "epoch": 4697} {"train_loss": -26.54310417175293, "global_step": 389862, "epoch": 4697} {"train_loss": -26.357715606689453, "global_step": 389863, "epoch": 4697} {"train_loss": -26.838607788085938, "global_step": 389864, "epoch": 4697} {"train_loss": -26.54764175415039, "global_step": 389865, "epoch": 4697} {"train_loss": -26.372333526611328, "global_step": 389866, "epoch": 4697} {"train_loss": -26.468008041381836, "global_step": 389867, "epoch": 4697} {"train_loss": -26.224843978881836, "global_step": 389868, "epoch": 4697} {"train_loss": -26.3330020904541, "global_step": 389869, "epoch": 4697} {"train_loss": -26.566726684570312, "global_step": 389870, "epoch": 4697} {"train_loss": -26.01692008972168, "global_step": 389871, "epoch": 4697} {"train_loss": -25.934783935546875, "global_step": 389872, "epoch": 4697} {"train_loss": -26.667896270751953, "global_step": 389873, "epoch": 4697} {"train_loss": -26.268253326416016, "global_step": 389874, "epoch": 4697} {"train_loss": -26.244338989257812, "global_step": 389875, "epoch": 4697} {"train_loss": -26.67461585998535, "global_step": 389876, "epoch": 4697} {"train_loss": -26.204364776611328, "global_step": 389877, "epoch": 4697} {"train_loss": -26.12483787536621, "global_step": 389878, "epoch": 4697} {"train_loss": -26.527746200561523, "global_step": 389879, "epoch": 4697} {"train_loss": -26.335865020751953, "global_step": 389880, "epoch": 4697} {"train_loss": -26.3970947265625, "global_step": 389881, "epoch": 4697} {"train_loss": -26.346845626831055, "global_step": 389882, "epoch": 4697} {"train_loss": -26.443042755126953, "global_step": 389883, "epoch": 4697} {"train_loss": -26.297094345092773, "global_step": 389884, "epoch": 4697} {"train_loss": -25.841215133666992, "global_step": 389885, "epoch": 4697} {"train_loss": -26.261474609375, "global_step": 389886, "epoch": 4697} {"train_loss": -26.240665435791016, "global_step": 389887, "epoch": 4697} {"train_loss": -26.60809326171875, "global_step": 389888, "epoch": 4697} {"train_loss": -26.684106826782227, "global_step": 389889, "epoch": 4697} {"train_loss": -26.30496597290039, "global_step": 389890, "epoch": 4697} {"train_loss": -26.4312686920166, "global_step": 389891, "epoch": 4697} {"train_loss": -26.46607780456543, "global_step": 389892, "epoch": 4697} {"train_loss": -26.571277618408203, "global_step": 389893, "epoch": 4697} {"train_loss": -26.47089195251465, "global_step": 389894, "epoch": 4697} {"train_loss": -26.559818267822266, "global_step": 389895, "epoch": 4697} {"train_loss": -26.677936553955078, "global_step": 389896, "epoch": 4697} {"train_loss": -26.701223373413086, "global_step": 389897, "epoch": 4697} {"train_loss": -26.7407169342041, "global_step": 389898, "epoch": 4697} {"train_loss": -26.56618309020996, "global_step": 389899, "epoch": 4697} {"train_loss": -26.674331665039062, "global_step": 389900, "epoch": 4697} {"train_loss": -26.623382568359375, "global_step": 389901, "epoch": 4697} {"train_loss": -26.5732364654541, "global_step": 389902, "epoch": 4697} {"train_loss": -26.44756507873535, "global_step": 389903, "epoch": 4697} {"train_loss": -26.789560317993164, "global_step": 389904, "epoch": 4697} {"train_loss": -27.07610511779785, "global_step": 389905, "epoch": 4697} {"train_loss": -26.82672691345215, "global_step": 389906, "epoch": 4697} {"train_loss": -26.386554718017578, "global_step": 389907, "epoch": 4697} {"train_loss": -26.784448623657227, "global_step": 389908, "epoch": 4697} {"train_loss": -27.1935977935791, "global_step": 389909, "epoch": 4697} {"train_loss": -26.49161148071289, "global_step": 389910, "epoch": 4697} {"train_loss": -26.383955001831055, "global_step": 389911, "epoch": 4697} {"train_loss": -26.396728515625, "global_step": 389912, "epoch": 4697} {"train_loss": -26.40131950378418, "global_step": 389913, "epoch": 4697} {"train_loss": -25.95371437072754, "global_step": 389914, "epoch": 4697} {"train_loss": -26.218311309814453, "global_step": 389915, "epoch": 4697} {"train_loss": -26.384811401367188, "global_step": 389916, "epoch": 4697} {"train_loss": -26.41951560974121, "global_step": 389917, "epoch": 4697} {"train_loss": -26.526859283447266, "global_step": 389918, "epoch": 4697} {"train_loss": -26.61468505859375, "global_step": 389919, "epoch": 4697} {"train_loss": -26.51688575744629, "global_step": 389920, "epoch": 4697} {"train_loss": -26.869054794311523, "global_step": 389921, "epoch": 4697} {"train_loss": -26.37526512145996, "global_step": 389922, "epoch": 4697} {"train_loss": -26.776716232299805, "global_step": 389923, "epoch": 4697} {"train_loss": -26.62517738342285, "global_step": 389924, "epoch": 4697} {"train_loss": -26.721494674682617, "global_step": 389925, "epoch": 4697} {"train_loss": -26.489038467407227, "global_step": 389926, "epoch": 4697} {"train_loss": -26.563573837280273, "global_step": 389927, "epoch": 4697} {"train_loss": -26.429718017578125, "global_step": 389928, "epoch": 4697} {"train_loss": -26.6182918548584, "global_step": 389929, "epoch": 4697} {"train_loss": -26.572874069213867, "global_step": 389930, "epoch": 4697} {"train_loss": -26.704669952392578, "global_step": 389931, "epoch": 4697} {"train_loss": -26.28938102722168, "global_step": 389932, "epoch": 4697} {"train_loss": -26.47618682125965, "global_step": 389933, "epoch": 4697, "val_loss": 6611686.0} {"train_loss": -24.893091201782227, "global_step": 389934, "epoch": 4698} {"train_loss": -24.90239906311035, "global_step": 389935, "epoch": 4698} {"train_loss": -25.629053115844727, "global_step": 389936, "epoch": 4698} {"train_loss": -25.40626335144043, "global_step": 389937, "epoch": 4698} {"train_loss": -24.9110164642334, "global_step": 389938, "epoch": 4698} {"train_loss": -26.11453628540039, "global_step": 389939, "epoch": 4698} {"train_loss": -25.341421127319336, "global_step": 389940, "epoch": 4698} {"train_loss": -25.837133407592773, "global_step": 389941, "epoch": 4698} {"train_loss": -25.569189071655273, "global_step": 389942, "epoch": 4698} {"train_loss": -25.8304443359375, "global_step": 389943, "epoch": 4698} {"train_loss": -25.85365104675293, "global_step": 389944, "epoch": 4698} {"train_loss": -25.91901969909668, "global_step": 389945, "epoch": 4698} {"train_loss": -26.04071617126465, "global_step": 389946, "epoch": 4698} {"train_loss": -25.85935401916504, "global_step": 389947, "epoch": 4698} {"train_loss": -26.15301513671875, "global_step": 389948, "epoch": 4698} {"train_loss": -25.908864974975586, "global_step": 389949, "epoch": 4698} {"train_loss": -26.268787384033203, "global_step": 389950, "epoch": 4698} {"train_loss": -25.70393180847168, "global_step": 389951, "epoch": 4698} {"train_loss": -26.163721084594727, "global_step": 389952, "epoch": 4698} {"train_loss": -26.35272216796875, "global_step": 389953, "epoch": 4698} {"train_loss": -26.363452911376953, "global_step": 389954, "epoch": 4698} {"train_loss": -26.085773468017578, "global_step": 389955, "epoch": 4698} {"train_loss": -26.3265438079834, "global_step": 389956, "epoch": 4698} {"train_loss": -26.480701446533203, "global_step": 389957, "epoch": 4698} {"train_loss": -26.25308609008789, "global_step": 389958, "epoch": 4698} {"train_loss": -26.43122673034668, "global_step": 389959, "epoch": 4698} {"train_loss": -26.448261260986328, "global_step": 389960, "epoch": 4698} {"train_loss": -26.269001007080078, "global_step": 389961, "epoch": 4698} {"train_loss": -26.076452255249023, "global_step": 389962, "epoch": 4698} {"train_loss": -26.063108444213867, "global_step": 389963, "epoch": 4698} {"train_loss": -26.70038414001465, "global_step": 389964, "epoch": 4698} {"train_loss": -26.183990478515625, "global_step": 389965, "epoch": 4698} {"train_loss": -26.41632652282715, "global_step": 389966, "epoch": 4698} {"train_loss": -26.255414962768555, "global_step": 389967, "epoch": 4698} {"train_loss": -26.433700561523438, "global_step": 389968, "epoch": 4698} {"train_loss": -26.4123477935791, "global_step": 389969, "epoch": 4698} {"train_loss": -26.91440773010254, "global_step": 389970, "epoch": 4698} {"train_loss": -26.512609481811523, "global_step": 389971, "epoch": 4698} {"train_loss": -26.862356185913086, "global_step": 389972, "epoch": 4698} {"train_loss": -26.544607162475586, "global_step": 389973, "epoch": 4698} {"train_loss": -26.443695068359375, "global_step": 389974, "epoch": 4698} {"train_loss": -26.587738037109375, "global_step": 389975, "epoch": 4698} {"train_loss": -26.83906364440918, "global_step": 389976, "epoch": 4698} {"train_loss": -26.882938385009766, "global_step": 389977, "epoch": 4698} {"train_loss": -26.28095054626465, "global_step": 389978, "epoch": 4698} {"train_loss": -26.548095703125, "global_step": 389979, "epoch": 4698} {"train_loss": -26.40886878967285, "global_step": 389980, "epoch": 4698} {"train_loss": -26.52488136291504, "global_step": 389981, "epoch": 4698} {"train_loss": -26.81438636779785, "global_step": 389982, "epoch": 4698} {"train_loss": -26.833221435546875, "global_step": 389983, "epoch": 4698} {"train_loss": -26.6002254486084, "global_step": 389984, "epoch": 4698} {"train_loss": -26.70082664489746, "global_step": 389985, "epoch": 4698} {"train_loss": -26.77827262878418, "global_step": 389986, "epoch": 4698} {"train_loss": -26.580204010009766, "global_step": 389987, "epoch": 4698} {"train_loss": -26.386886596679688, "global_step": 389988, "epoch": 4698} {"train_loss": -26.33709144592285, "global_step": 389989, "epoch": 4698} {"train_loss": -26.612817764282227, "global_step": 389990, "epoch": 4698} {"train_loss": -26.785537719726562, "global_step": 389991, "epoch": 4698} {"train_loss": -26.793272018432617, "global_step": 389992, "epoch": 4698} {"train_loss": -26.254669189453125, "global_step": 389993, "epoch": 4698} {"train_loss": -26.135910034179688, "global_step": 389994, "epoch": 4698} {"train_loss": -25.972442626953125, "global_step": 389995, "epoch": 4698} {"train_loss": -26.558624267578125, "global_step": 389996, "epoch": 4698} {"train_loss": -26.31941795349121, "global_step": 389997, "epoch": 4698} {"train_loss": -26.594451904296875, "global_step": 389998, "epoch": 4698} {"train_loss": -26.136926651000977, "global_step": 389999, "epoch": 4698} {"train_loss": -26.17229652404785, "global_step": 390000, "epoch": 4698} {"train_loss": -26.309919357299805, "global_step": 390001, "epoch": 4698} {"train_loss": -26.527347564697266, "global_step": 390002, "epoch": 4698} {"train_loss": -26.506601333618164, "global_step": 390003, "epoch": 4698} {"train_loss": -26.281574249267578, "global_step": 390004, "epoch": 4698} {"train_loss": -26.791717529296875, "global_step": 390005, "epoch": 4698} {"train_loss": -26.608688354492188, "global_step": 390006, "epoch": 4698} {"train_loss": -26.76478385925293, "global_step": 390007, "epoch": 4698} {"train_loss": -26.411930084228516, "global_step": 390008, "epoch": 4698} {"train_loss": -26.456497192382812, "global_step": 390009, "epoch": 4698} {"train_loss": -26.813745498657227, "global_step": 390010, "epoch": 4698} {"train_loss": -26.02423667907715, "global_step": 390011, "epoch": 4698} {"train_loss": -26.62373161315918, "global_step": 390012, "epoch": 4698} {"train_loss": -26.47979736328125, "global_step": 390013, "epoch": 4698} {"train_loss": -26.72900390625, "global_step": 390014, "epoch": 4698} {"train_loss": -26.153364181518555, "global_step": 390015, "epoch": 4698} {"train_loss": -26.30700522733022, "global_step": 390016, "epoch": 4698, "val_loss": 6556062.0} {"train_loss": -26.393756866455078, "global_step": 390017, "epoch": 4699} {"train_loss": -26.32395362854004, "global_step": 390018, "epoch": 4699} {"train_loss": -26.349014282226562, "global_step": 390019, "epoch": 4699} {"train_loss": -26.277591705322266, "global_step": 390020, "epoch": 4699} {"train_loss": -26.172840118408203, "global_step": 390021, "epoch": 4699} {"train_loss": -26.1458797454834, "global_step": 390022, "epoch": 4699} {"train_loss": -26.269317626953125, "global_step": 390023, "epoch": 4699} {"train_loss": -26.323026657104492, "global_step": 390024, "epoch": 4699} {"train_loss": -26.43073081970215, "global_step": 390025, "epoch": 4699} {"train_loss": -25.954071044921875, "global_step": 390026, "epoch": 4699} {"train_loss": -26.090988159179688, "global_step": 390027, "epoch": 4699} {"train_loss": -26.53033447265625, "global_step": 390028, "epoch": 4699} {"train_loss": -26.878293991088867, "global_step": 390029, "epoch": 4699} {"train_loss": -26.448474884033203, "global_step": 390030, "epoch": 4699} {"train_loss": -26.171833038330078, "global_step": 390031, "epoch": 4699} {"train_loss": -26.504779815673828, "global_step": 390032, "epoch": 4699} {"train_loss": -26.673370361328125, "global_step": 390033, "epoch": 4699} {"train_loss": -26.651716232299805, "global_step": 390034, "epoch": 4699} {"train_loss": -26.620386123657227, "global_step": 390035, "epoch": 4699} {"train_loss": -26.749786376953125, "global_step": 390036, "epoch": 4699} {"train_loss": -26.523298263549805, "global_step": 390037, "epoch": 4699} {"train_loss": -26.82893943786621, "global_step": 390038, "epoch": 4699} {"train_loss": -26.447309494018555, "global_step": 390039, "epoch": 4699} {"train_loss": -26.415403366088867, "global_step": 390040, "epoch": 4699} {"train_loss": -26.41950035095215, "global_step": 390041, "epoch": 4699} {"train_loss": -26.62788963317871, "global_step": 390042, "epoch": 4699} {"train_loss": -26.666940689086914, "global_step": 390043, "epoch": 4699} {"train_loss": -26.642370223999023, "global_step": 390044, "epoch": 4699} {"train_loss": -26.707050323486328, "global_step": 390045, "epoch": 4699} {"train_loss": -26.546405792236328, "global_step": 390046, "epoch": 4699} {"train_loss": -26.212326049804688, "global_step": 390047, "epoch": 4699} {"train_loss": -26.227060317993164, "global_step": 390048, "epoch": 4699} {"train_loss": -26.52566909790039, "global_step": 390049, "epoch": 4699} {"train_loss": -26.633447647094727, "global_step": 390050, "epoch": 4699} {"train_loss": -26.86297607421875, "global_step": 390051, "epoch": 4699} {"train_loss": -26.503711700439453, "global_step": 390052, "epoch": 4699} {"train_loss": -26.31208610534668, "global_step": 390053, "epoch": 4699} {"train_loss": -25.93283462524414, "global_step": 390054, "epoch": 4699} {"train_loss": -26.07916831970215, "global_step": 390055, "epoch": 4699} {"train_loss": -25.915327072143555, "global_step": 390056, "epoch": 4699} {"train_loss": -26.4027042388916, "global_step": 390057, "epoch": 4699} {"train_loss": -26.413537979125977, "global_step": 390058, "epoch": 4699} {"train_loss": -26.503143310546875, "global_step": 390059, "epoch": 4699} {"train_loss": -26.45562744140625, "global_step": 390060, "epoch": 4699} {"train_loss": -26.44234275817871, "global_step": 390061, "epoch": 4699} {"train_loss": -26.750904083251953, "global_step": 390062, "epoch": 4699} {"train_loss": -26.029096603393555, "global_step": 390063, "epoch": 4699} {"train_loss": -26.6978759765625, "global_step": 390064, "epoch": 4699} {"train_loss": -26.722681045532227, "global_step": 390065, "epoch": 4699} {"train_loss": -26.673181533813477, "global_step": 390066, "epoch": 4699} {"train_loss": -26.618921279907227, "global_step": 390067, "epoch": 4699} {"train_loss": -26.377729415893555, "global_step": 390068, "epoch": 4699} {"train_loss": -26.68341064453125, "global_step": 390069, "epoch": 4699} {"train_loss": -26.448957443237305, "global_step": 390070, "epoch": 4699} {"train_loss": -26.448328018188477, "global_step": 390071, "epoch": 4699} {"train_loss": -26.39918327331543, "global_step": 390072, "epoch": 4699} {"train_loss": -26.618146896362305, "global_step": 390073, "epoch": 4699} {"train_loss": -26.561452865600586, "global_step": 390074, "epoch": 4699} {"train_loss": -26.68450355529785, "global_step": 390075, "epoch": 4699} {"train_loss": -26.64472770690918, "global_step": 390076, "epoch": 4699} {"train_loss": -26.622974395751953, "global_step": 390077, "epoch": 4699} {"train_loss": -26.841230392456055, "global_step": 390078, "epoch": 4699} {"train_loss": -26.516864776611328, "global_step": 390079, "epoch": 4699} {"train_loss": -26.78204917907715, "global_step": 390080, "epoch": 4699} {"train_loss": -26.875471115112305, "global_step": 390081, "epoch": 4699} {"train_loss": -26.505102157592773, "global_step": 390082, "epoch": 4699} {"train_loss": -26.524433135986328, "global_step": 390083, "epoch": 4699} {"train_loss": -26.458972930908203, "global_step": 390084, "epoch": 4699} {"train_loss": -26.9677677154541, "global_step": 390085, "epoch": 4699} {"train_loss": -26.74686622619629, "global_step": 390086, "epoch": 4699} {"train_loss": -26.74515151977539, "global_step": 390087, "epoch": 4699} {"train_loss": -26.598501205444336, "global_step": 390088, "epoch": 4699} {"train_loss": -26.502838134765625, "global_step": 390089, "epoch": 4699} {"train_loss": -26.895227432250977, "global_step": 390090, "epoch": 4699} {"train_loss": -26.874805450439453, "global_step": 390091, "epoch": 4699} {"train_loss": -26.5078182220459, "global_step": 390092, "epoch": 4699} {"train_loss": -26.820173263549805, "global_step": 390093, "epoch": 4699} {"train_loss": -26.4747371673584, "global_step": 390094, "epoch": 4699} {"train_loss": -26.714019775390625, "global_step": 390095, "epoch": 4699} {"train_loss": -26.444976806640625, "global_step": 390096, "epoch": 4699} {"train_loss": -26.911340713500977, "global_step": 390097, "epoch": 4699} {"train_loss": -26.534259796142578, "global_step": 390098, "epoch": 4699} {"train_loss": -26.52165934551193, "global_step": 390099, "epoch": 4699, "val_loss": 6496515.0} {"train_loss": -26.27864646911621, "global_step": 390100, "epoch": 4700} {"train_loss": -25.69025230407715, "global_step": 390101, "epoch": 4700} {"train_loss": -25.27248191833496, "global_step": 390102, "epoch": 4700} {"train_loss": -25.904632568359375, "global_step": 390103, "epoch": 4700} {"train_loss": -25.862207412719727, "global_step": 390104, "epoch": 4700} {"train_loss": -26.144323348999023, "global_step": 390105, "epoch": 4700} {"train_loss": -25.682905197143555, "global_step": 390106, "epoch": 4700} {"train_loss": -26.307422637939453, "global_step": 390107, "epoch": 4700} {"train_loss": -25.655120849609375, "global_step": 390108, "epoch": 4700} {"train_loss": -26.012556076049805, "global_step": 390109, "epoch": 4700} {"train_loss": -26.276655197143555, "global_step": 390110, "epoch": 4700} {"train_loss": -26.04371452331543, "global_step": 390111, "epoch": 4700} {"train_loss": -26.239688873291016, "global_step": 390112, "epoch": 4700} {"train_loss": -26.51340675354004, "global_step": 390113, "epoch": 4700} {"train_loss": -26.637060165405273, "global_step": 390114, "epoch": 4700} {"train_loss": -26.2560977935791, "global_step": 390115, "epoch": 4700} {"train_loss": -26.46671485900879, "global_step": 390116, "epoch": 4700} {"train_loss": -26.598783493041992, "global_step": 390117, "epoch": 4700} {"train_loss": -26.31387710571289, "global_step": 390118, "epoch": 4700} {"train_loss": -26.66291618347168, "global_step": 390119, "epoch": 4700} {"train_loss": -26.31686782836914, "global_step": 390120, "epoch": 4700} {"train_loss": -26.409788131713867, "global_step": 390121, "epoch": 4700} {"train_loss": -26.27555274963379, "global_step": 390122, "epoch": 4700} {"train_loss": -26.5006103515625, "global_step": 390123, "epoch": 4700} {"train_loss": -26.42160415649414, "global_step": 390124, "epoch": 4700} {"train_loss": -26.348011016845703, "global_step": 390125, "epoch": 4700} {"train_loss": -26.34307289123535, "global_step": 390126, "epoch": 4700} {"train_loss": -26.424015045166016, "global_step": 390127, "epoch": 4700} {"train_loss": -26.556262969970703, "global_step": 390128, "epoch": 4700} {"train_loss": -26.5553035736084, "global_step": 390129, "epoch": 4700} {"train_loss": -26.25465202331543, "global_step": 390130, "epoch": 4700} {"train_loss": -26.592580795288086, "global_step": 390131, "epoch": 4700} {"train_loss": -26.73980140686035, "global_step": 390132, "epoch": 4700} {"train_loss": -26.76002311706543, "global_step": 390133, "epoch": 4700} {"train_loss": -26.84421730041504, "global_step": 390134, "epoch": 4700} {"train_loss": -26.262195587158203, "global_step": 390135, "epoch": 4700} {"train_loss": -26.631702423095703, "global_step": 390136, "epoch": 4700} {"train_loss": -26.813373565673828, "global_step": 390137, "epoch": 4700} {"train_loss": -26.886554718017578, "global_step": 390138, "epoch": 4700} {"train_loss": -26.55106544494629, "global_step": 390139, "epoch": 4700} {"train_loss": -26.264108657836914, "global_step": 390140, "epoch": 4700} {"train_loss": -26.86482048034668, "global_step": 390141, "epoch": 4700} {"train_loss": -26.373178482055664, "global_step": 390142, "epoch": 4700} {"train_loss": -26.701398849487305, "global_step": 390143, "epoch": 4700} {"train_loss": -26.5566463470459, "global_step": 390144, "epoch": 4700} {"train_loss": -26.7242431640625, "global_step": 390145, "epoch": 4700} {"train_loss": -26.529071807861328, "global_step": 390146, "epoch": 4700} {"train_loss": -26.654434204101562, "global_step": 390147, "epoch": 4700} {"train_loss": -26.8356876373291, "global_step": 390148, "epoch": 4700} {"train_loss": -26.350168228149414, "global_step": 390149, "epoch": 4700} {"train_loss": -26.56275749206543, "global_step": 390150, "epoch": 4700} {"train_loss": -26.532751083374023, "global_step": 390151, "epoch": 4700} {"train_loss": -26.467529296875, "global_step": 390152, "epoch": 4700} {"train_loss": -26.425153732299805, "global_step": 390153, "epoch": 4700} {"train_loss": -26.199819564819336, "global_step": 390154, "epoch": 4700} {"train_loss": -26.7224063873291, "global_step": 390155, "epoch": 4700} {"train_loss": -26.103933334350586, "global_step": 390156, "epoch": 4700} {"train_loss": -26.350284576416016, "global_step": 390157, "epoch": 4700} {"train_loss": -26.419635772705078, "global_step": 390158, "epoch": 4700} {"train_loss": -26.781864166259766, "global_step": 390159, "epoch": 4700} {"train_loss": -27.048864364624023, "global_step": 390160, "epoch": 4700} {"train_loss": -26.553747177124023, "global_step": 390161, "epoch": 4700} {"train_loss": -26.623321533203125, "global_step": 390162, "epoch": 4700} {"train_loss": -26.644128799438477, "global_step": 390163, "epoch": 4700} {"train_loss": -26.511564254760742, "global_step": 390164, "epoch": 4700} {"train_loss": -26.407180786132812, "global_step": 390165, "epoch": 4700} {"train_loss": -26.380294799804688, "global_step": 390166, "epoch": 4700} {"train_loss": -26.706201553344727, "global_step": 390167, "epoch": 4700} {"train_loss": -26.667219161987305, "global_step": 390168, "epoch": 4700} {"train_loss": -26.93936538696289, "global_step": 390169, "epoch": 4700} {"train_loss": -26.671850204467773, "global_step": 390170, "epoch": 4700} {"train_loss": -26.605331420898438, "global_step": 390171, "epoch": 4700} {"train_loss": -26.413232803344727, "global_step": 390172, "epoch": 4700} {"train_loss": -26.55665397644043, "global_step": 390173, "epoch": 4700} {"train_loss": -26.48489761352539, "global_step": 390174, "epoch": 4700} {"train_loss": -26.453765869140625, "global_step": 390175, "epoch": 4700} {"train_loss": -26.588926315307617, "global_step": 390176, "epoch": 4700} {"train_loss": -26.768207550048828, "global_step": 390177, "epoch": 4700} {"train_loss": -26.9031982421875, "global_step": 390178, "epoch": 4700} {"train_loss": -26.363956451416016, "global_step": 390179, "epoch": 4700} {"train_loss": -26.3261661529541, "global_step": 390180, "epoch": 4700} {"train_loss": -26.60321044921875, "global_step": 390181, "epoch": 4700} {"train_loss": -26.436618414269873, "global_step": 390182, "epoch": 4700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6544572.0} {"train_loss": -25.96549415588379, "global_step": 390183, "epoch": 4701} {"train_loss": -25.107542037963867, "global_step": 390184, "epoch": 4701} {"train_loss": -25.58940315246582, "global_step": 390185, "epoch": 4701} {"train_loss": -25.430458068847656, "global_step": 390186, "epoch": 4701} {"train_loss": -25.957792282104492, "global_step": 390187, "epoch": 4701} {"train_loss": -25.809789657592773, "global_step": 390188, "epoch": 4701} {"train_loss": -24.910057067871094, "global_step": 390189, "epoch": 4701} {"train_loss": -25.910863876342773, "global_step": 390190, "epoch": 4701} {"train_loss": -26.068937301635742, "global_step": 390191, "epoch": 4701} {"train_loss": -25.8656063079834, "global_step": 390192, "epoch": 4701} {"train_loss": -26.39642333984375, "global_step": 390193, "epoch": 4701} {"train_loss": -25.9929141998291, "global_step": 390194, "epoch": 4701} {"train_loss": -26.3551082611084, "global_step": 390195, "epoch": 4701} {"train_loss": -25.922534942626953, "global_step": 390196, "epoch": 4701} {"train_loss": -26.616260528564453, "global_step": 390197, "epoch": 4701} {"train_loss": -26.81171989440918, "global_step": 390198, "epoch": 4701} {"train_loss": -26.530399322509766, "global_step": 390199, "epoch": 4701} {"train_loss": -26.64031982421875, "global_step": 390200, "epoch": 4701} {"train_loss": -26.03119468688965, "global_step": 390201, "epoch": 4701} {"train_loss": -26.77949333190918, "global_step": 390202, "epoch": 4701} {"train_loss": -26.353498458862305, "global_step": 390203, "epoch": 4701} {"train_loss": -26.085861206054688, "global_step": 390204, "epoch": 4701} {"train_loss": -26.675745010375977, "global_step": 390205, "epoch": 4701} {"train_loss": -26.406076431274414, "global_step": 390206, "epoch": 4701} {"train_loss": -26.50762939453125, "global_step": 390207, "epoch": 4701} {"train_loss": -26.55866050720215, "global_step": 390208, "epoch": 4701} {"train_loss": -26.330480575561523, "global_step": 390209, "epoch": 4701} {"train_loss": -26.0091552734375, "global_step": 390210, "epoch": 4701} {"train_loss": -26.355310440063477, "global_step": 390211, "epoch": 4701} {"train_loss": -26.162073135375977, "global_step": 390212, "epoch": 4701} {"train_loss": -26.31178855895996, "global_step": 390213, "epoch": 4701} {"train_loss": -26.28126335144043, "global_step": 390214, "epoch": 4701} {"train_loss": -26.1008358001709, "global_step": 390215, "epoch": 4701} {"train_loss": -26.519086837768555, "global_step": 390216, "epoch": 4701} {"train_loss": -26.807361602783203, "global_step": 390217, "epoch": 4701} {"train_loss": -26.37624168395996, "global_step": 390218, "epoch": 4701} {"train_loss": -26.59869384765625, "global_step": 390219, "epoch": 4701} {"train_loss": -26.655393600463867, "global_step": 390220, "epoch": 4701} {"train_loss": -26.644987106323242, "global_step": 390221, "epoch": 4701} {"train_loss": -26.467260360717773, "global_step": 390222, "epoch": 4701} {"train_loss": -26.620685577392578, "global_step": 390223, "epoch": 4701} {"train_loss": -26.181974411010742, "global_step": 390224, "epoch": 4701} {"train_loss": -26.378284454345703, "global_step": 390225, "epoch": 4701} {"train_loss": -26.61850357055664, "global_step": 390226, "epoch": 4701} {"train_loss": -26.615522384643555, "global_step": 390227, "epoch": 4701} {"train_loss": -27.098020553588867, "global_step": 390228, "epoch": 4701} {"train_loss": -26.713623046875, "global_step": 390229, "epoch": 4701} {"train_loss": -26.45121192932129, "global_step": 390230, "epoch": 4701} {"train_loss": -26.63368034362793, "global_step": 390231, "epoch": 4701} {"train_loss": -26.41668128967285, "global_step": 390232, "epoch": 4701} {"train_loss": -26.764013290405273, "global_step": 390233, "epoch": 4701} {"train_loss": -26.411102294921875, "global_step": 390234, "epoch": 4701} {"train_loss": -26.796655654907227, "global_step": 390235, "epoch": 4701} {"train_loss": -26.71637535095215, "global_step": 390236, "epoch": 4701} {"train_loss": -26.716144561767578, "global_step": 390237, "epoch": 4701} {"train_loss": -26.3236026763916, "global_step": 390238, "epoch": 4701} {"train_loss": -27.127197265625, "global_step": 390239, "epoch": 4701} {"train_loss": -26.136510848999023, "global_step": 390240, "epoch": 4701} {"train_loss": -26.320056915283203, "global_step": 390241, "epoch": 4701} {"train_loss": -26.320043563842773, "global_step": 390242, "epoch": 4701} {"train_loss": -26.866376876831055, "global_step": 390243, "epoch": 4701} {"train_loss": -26.4522647857666, "global_step": 390244, "epoch": 4701} {"train_loss": -26.035192489624023, "global_step": 390245, "epoch": 4701} {"train_loss": -26.642602920532227, "global_step": 390246, "epoch": 4701} {"train_loss": -26.19721031188965, "global_step": 390247, "epoch": 4701} {"train_loss": -26.270618438720703, "global_step": 390248, "epoch": 4701} {"train_loss": -26.084470748901367, "global_step": 390249, "epoch": 4701} {"train_loss": -26.628705978393555, "global_step": 390250, "epoch": 4701} {"train_loss": -26.697973251342773, "global_step": 390251, "epoch": 4701} {"train_loss": -26.527984619140625, "global_step": 390252, "epoch": 4701} {"train_loss": -26.4899959564209, "global_step": 390253, "epoch": 4701} {"train_loss": -26.652206420898438, "global_step": 390254, "epoch": 4701} {"train_loss": -26.135663986206055, "global_step": 390255, "epoch": 4701} {"train_loss": -26.552473068237305, "global_step": 390256, "epoch": 4701} {"train_loss": -26.594995498657227, "global_step": 390257, "epoch": 4701} {"train_loss": -26.876745223999023, "global_step": 390258, "epoch": 4701} {"train_loss": -26.490381240844727, "global_step": 390259, "epoch": 4701} {"train_loss": -26.408010482788086, "global_step": 390260, "epoch": 4701} {"train_loss": -26.568021774291992, "global_step": 390261, "epoch": 4701} {"train_loss": -26.63465690612793, "global_step": 390262, "epoch": 4701} {"train_loss": -26.79459571838379, "global_step": 390263, "epoch": 4701} {"train_loss": -26.300458908081055, "global_step": 390264, "epoch": 4701} {"train_loss": -26.387571219938348, "global_step": 390265, "epoch": 4701, "val_loss": 6627081.0} {"train_loss": -24.79388999938965, "global_step": 390266, "epoch": 4702} {"train_loss": -25.781085968017578, "global_step": 390267, "epoch": 4702} {"train_loss": -25.02385711669922, "global_step": 390268, "epoch": 4702} {"train_loss": -25.229480743408203, "global_step": 390269, "epoch": 4702} {"train_loss": -25.77277183532715, "global_step": 390270, "epoch": 4702} {"train_loss": -25.535236358642578, "global_step": 390271, "epoch": 4702} {"train_loss": -25.709598541259766, "global_step": 390272, "epoch": 4702} {"train_loss": -25.830387115478516, "global_step": 390273, "epoch": 4702} {"train_loss": -25.896448135375977, "global_step": 390274, "epoch": 4702} {"train_loss": -25.761505126953125, "global_step": 390275, "epoch": 4702} {"train_loss": -26.1829833984375, "global_step": 390276, "epoch": 4702} {"train_loss": -26.01996421813965, "global_step": 390277, "epoch": 4702} {"train_loss": -26.33585548400879, "global_step": 390278, "epoch": 4702} {"train_loss": -25.79762077331543, "global_step": 390279, "epoch": 4702} {"train_loss": -26.1213321685791, "global_step": 390280, "epoch": 4702} {"train_loss": -26.42030143737793, "global_step": 390281, "epoch": 4702} {"train_loss": -26.161273956298828, "global_step": 390282, "epoch": 4702} {"train_loss": -25.99098014831543, "global_step": 390283, "epoch": 4702} {"train_loss": -25.967016220092773, "global_step": 390284, "epoch": 4702} {"train_loss": -26.10049819946289, "global_step": 390285, "epoch": 4702} {"train_loss": -26.003583908081055, "global_step": 390286, "epoch": 4702} {"train_loss": -26.318134307861328, "global_step": 390287, "epoch": 4702} {"train_loss": -26.01241111755371, "global_step": 390288, "epoch": 4702} {"train_loss": -26.520248413085938, "global_step": 390289, "epoch": 4702} {"train_loss": -26.279203414916992, "global_step": 390290, "epoch": 4702} {"train_loss": -26.39837074279785, "global_step": 390291, "epoch": 4702} {"train_loss": -26.3154354095459, "global_step": 390292, "epoch": 4702} {"train_loss": -26.220294952392578, "global_step": 390293, "epoch": 4702} {"train_loss": -26.538084030151367, "global_step": 390294, "epoch": 4702} {"train_loss": -26.28338050842285, "global_step": 390295, "epoch": 4702} {"train_loss": -26.801013946533203, "global_step": 390296, "epoch": 4702} {"train_loss": -26.30694007873535, "global_step": 390297, "epoch": 4702} {"train_loss": -26.435697555541992, "global_step": 390298, "epoch": 4702} {"train_loss": -26.632160186767578, "global_step": 390299, "epoch": 4702} {"train_loss": -26.555362701416016, "global_step": 390300, "epoch": 4702} {"train_loss": -26.620756149291992, "global_step": 390301, "epoch": 4702} {"train_loss": -26.698139190673828, "global_step": 390302, "epoch": 4702} {"train_loss": -26.633651733398438, "global_step": 390303, "epoch": 4702} {"train_loss": -26.615827560424805, "global_step": 390304, "epoch": 4702} {"train_loss": -26.298370361328125, "global_step": 390305, "epoch": 4702} {"train_loss": -26.581668853759766, "global_step": 390306, "epoch": 4702} {"train_loss": -26.9185791015625, "global_step": 390307, "epoch": 4702} {"train_loss": -26.727375030517578, "global_step": 390308, "epoch": 4702} {"train_loss": -26.77703857421875, "global_step": 390309, "epoch": 4702} {"train_loss": -26.707914352416992, "global_step": 390310, "epoch": 4702} {"train_loss": -26.63006019592285, "global_step": 390311, "epoch": 4702} {"train_loss": -26.84868812561035, "global_step": 390312, "epoch": 4702} {"train_loss": -26.42140769958496, "global_step": 390313, "epoch": 4702} {"train_loss": -26.49616813659668, "global_step": 390314, "epoch": 4702} {"train_loss": -26.454004287719727, "global_step": 390315, "epoch": 4702} {"train_loss": -26.639928817749023, "global_step": 390316, "epoch": 4702} {"train_loss": -26.93219566345215, "global_step": 390317, "epoch": 4702} {"train_loss": -27.063739776611328, "global_step": 390318, "epoch": 4702} {"train_loss": -26.491506576538086, "global_step": 390319, "epoch": 4702} {"train_loss": -26.827423095703125, "global_step": 390320, "epoch": 4702} {"train_loss": -26.712284088134766, "global_step": 390321, "epoch": 4702} {"train_loss": -26.13203239440918, "global_step": 390322, "epoch": 4702} {"train_loss": -26.01425552368164, "global_step": 390323, "epoch": 4702} {"train_loss": -26.379276275634766, "global_step": 390324, "epoch": 4702} {"train_loss": -26.711210250854492, "global_step": 390325, "epoch": 4702} {"train_loss": -26.500598907470703, "global_step": 390326, "epoch": 4702} {"train_loss": -26.6041316986084, "global_step": 390327, "epoch": 4702} {"train_loss": -26.72861671447754, "global_step": 390328, "epoch": 4702} {"train_loss": -26.69732666015625, "global_step": 390329, "epoch": 4702} {"train_loss": -26.40315055847168, "global_step": 390330, "epoch": 4702} {"train_loss": -26.852025985717773, "global_step": 390331, "epoch": 4702} {"train_loss": -26.855825424194336, "global_step": 390332, "epoch": 4702} {"train_loss": -26.582794189453125, "global_step": 390333, "epoch": 4702} {"train_loss": -26.85389518737793, "global_step": 390334, "epoch": 4702} {"train_loss": -26.66888999938965, "global_step": 390335, "epoch": 4702} {"train_loss": -26.402755737304688, "global_step": 390336, "epoch": 4702} {"train_loss": -26.292638778686523, "global_step": 390337, "epoch": 4702} {"train_loss": -26.232242584228516, "global_step": 390338, "epoch": 4702} {"train_loss": -26.429357528686523, "global_step": 390339, "epoch": 4702} {"train_loss": -26.668781280517578, "global_step": 390340, "epoch": 4702} {"train_loss": -26.703388214111328, "global_step": 390341, "epoch": 4702} {"train_loss": -26.495588302612305, "global_step": 390342, "epoch": 4702} {"train_loss": -26.45712661743164, "global_step": 390343, "epoch": 4702} {"train_loss": -26.927465438842773, "global_step": 390344, "epoch": 4702} {"train_loss": -26.997411727905273, "global_step": 390345, "epoch": 4702} {"train_loss": -26.885351181030273, "global_step": 390346, "epoch": 4702} {"train_loss": -26.66359519958496, "global_step": 390347, "epoch": 4702} {"train_loss": -26.3872047332396, "global_step": 390348, "epoch": 4702, "val_loss": 6537267.0} {"train_loss": -26.194904327392578, "global_step": 390349, "epoch": 4703} {"train_loss": -26.288330078125, "global_step": 390350, "epoch": 4703} {"train_loss": -26.24860191345215, "global_step": 390351, "epoch": 4703} {"train_loss": -25.939926147460938, "global_step": 390352, "epoch": 4703} {"train_loss": -26.122732162475586, "global_step": 390353, "epoch": 4703} {"train_loss": -25.849023818969727, "global_step": 390354, "epoch": 4703} {"train_loss": -26.510818481445312, "global_step": 390355, "epoch": 4703} {"train_loss": -26.293598175048828, "global_step": 390356, "epoch": 4703} {"train_loss": -26.273818969726562, "global_step": 390357, "epoch": 4703} {"train_loss": -25.909509658813477, "global_step": 390358, "epoch": 4703} {"train_loss": -25.935504913330078, "global_step": 390359, "epoch": 4703} {"train_loss": -25.786306381225586, "global_step": 390360, "epoch": 4703} {"train_loss": -26.412500381469727, "global_step": 390361, "epoch": 4703} {"train_loss": -26.128080368041992, "global_step": 390362, "epoch": 4703} {"train_loss": -25.805866241455078, "global_step": 390363, "epoch": 4703} {"train_loss": -26.346878051757812, "global_step": 390364, "epoch": 4703} {"train_loss": -26.259769439697266, "global_step": 390365, "epoch": 4703} {"train_loss": -25.71603775024414, "global_step": 390366, "epoch": 4703} {"train_loss": -26.253692626953125, "global_step": 390367, "epoch": 4703} {"train_loss": -26.083765029907227, "global_step": 390368, "epoch": 4703} {"train_loss": -26.15114402770996, "global_step": 390369, "epoch": 4703} {"train_loss": -26.23902702331543, "global_step": 390370, "epoch": 4703} {"train_loss": -26.07954216003418, "global_step": 390371, "epoch": 4703} {"train_loss": -26.722143173217773, "global_step": 390372, "epoch": 4703} {"train_loss": -26.369098663330078, "global_step": 390373, "epoch": 4703} {"train_loss": -26.598529815673828, "global_step": 390374, "epoch": 4703} {"train_loss": -26.4450740814209, "global_step": 390375, "epoch": 4703} {"train_loss": -26.290847778320312, "global_step": 390376, "epoch": 4703} {"train_loss": -26.642370223999023, "global_step": 390377, "epoch": 4703} {"train_loss": -26.07637596130371, "global_step": 390378, "epoch": 4703} {"train_loss": -26.76102638244629, "global_step": 390379, "epoch": 4703} {"train_loss": -26.15264892578125, "global_step": 390380, "epoch": 4703} {"train_loss": -26.263874053955078, "global_step": 390381, "epoch": 4703} {"train_loss": -26.125049591064453, "global_step": 390382, "epoch": 4703} {"train_loss": -26.139362335205078, "global_step": 390383, "epoch": 4703} {"train_loss": -26.611209869384766, "global_step": 390384, "epoch": 4703} {"train_loss": -26.57765769958496, "global_step": 390385, "epoch": 4703} {"train_loss": -26.434635162353516, "global_step": 390386, "epoch": 4703} {"train_loss": -26.6790771484375, "global_step": 390387, "epoch": 4703} {"train_loss": -26.30926513671875, "global_step": 390388, "epoch": 4703} {"train_loss": -26.691009521484375, "global_step": 390389, "epoch": 4703} {"train_loss": -26.45261001586914, "global_step": 390390, "epoch": 4703} {"train_loss": -26.72768211364746, "global_step": 390391, "epoch": 4703} {"train_loss": -26.390161514282227, "global_step": 390392, "epoch": 4703} {"train_loss": -26.845632553100586, "global_step": 390393, "epoch": 4703} {"train_loss": -26.264190673828125, "global_step": 390394, "epoch": 4703} {"train_loss": -26.70904541015625, "global_step": 390395, "epoch": 4703} {"train_loss": -26.882022857666016, "global_step": 390396, "epoch": 4703} {"train_loss": -26.7469539642334, "global_step": 390397, "epoch": 4703} {"train_loss": -26.862659454345703, "global_step": 390398, "epoch": 4703} {"train_loss": -26.958332061767578, "global_step": 390399, "epoch": 4703} {"train_loss": -26.562469482421875, "global_step": 390400, "epoch": 4703} {"train_loss": -26.534387588500977, "global_step": 390401, "epoch": 4703} {"train_loss": -26.739206314086914, "global_step": 390402, "epoch": 4703} {"train_loss": -26.399621963500977, "global_step": 390403, "epoch": 4703} {"train_loss": -26.795368194580078, "global_step": 390404, "epoch": 4703} {"train_loss": -26.350473403930664, "global_step": 390405, "epoch": 4703} {"train_loss": -26.406539916992188, "global_step": 390406, "epoch": 4703} {"train_loss": -26.85308265686035, "global_step": 390407, "epoch": 4703} {"train_loss": -26.598730087280273, "global_step": 390408, "epoch": 4703} {"train_loss": -26.877798080444336, "global_step": 390409, "epoch": 4703} {"train_loss": -26.4293155670166, "global_step": 390410, "epoch": 4703} {"train_loss": -26.379674911499023, "global_step": 390411, "epoch": 4703} {"train_loss": -26.445423126220703, "global_step": 390412, "epoch": 4703} {"train_loss": -26.771026611328125, "global_step": 390413, "epoch": 4703} {"train_loss": -26.8839111328125, "global_step": 390414, "epoch": 4703} {"train_loss": -26.78916358947754, "global_step": 390415, "epoch": 4703} {"train_loss": -26.58074951171875, "global_step": 390416, "epoch": 4703} {"train_loss": -26.332687377929688, "global_step": 390417, "epoch": 4703} {"train_loss": -26.531940460205078, "global_step": 390418, "epoch": 4703} {"train_loss": -26.826730728149414, "global_step": 390419, "epoch": 4703} {"train_loss": -26.612634658813477, "global_step": 390420, "epoch": 4703} {"train_loss": -26.612695693969727, "global_step": 390421, "epoch": 4703} {"train_loss": -26.4252872467041, "global_step": 390422, "epoch": 4703} {"train_loss": -26.173202514648438, "global_step": 390423, "epoch": 4703} {"train_loss": -26.57257652282715, "global_step": 390424, "epoch": 4703} {"train_loss": -26.45989990234375, "global_step": 390425, "epoch": 4703} {"train_loss": -26.5654354095459, "global_step": 390426, "epoch": 4703} {"train_loss": -26.631635665893555, "global_step": 390427, "epoch": 4703} {"train_loss": -26.457916259765625, "global_step": 390428, "epoch": 4703} {"train_loss": -26.760339736938477, "global_step": 390429, "epoch": 4703} {"train_loss": -26.530536651611328, "global_step": 390430, "epoch": 4703} {"train_loss": -26.449845049754682, "global_step": 390431, "epoch": 4703, "val_loss": 6483848.5} {"train_loss": -26.27119255065918, "global_step": 390432, "epoch": 4704} {"train_loss": -25.83713150024414, "global_step": 390433, "epoch": 4704} {"train_loss": -25.69583511352539, "global_step": 390434, "epoch": 4704} {"train_loss": -25.99690818786621, "global_step": 390435, "epoch": 4704} {"train_loss": -26.113107681274414, "global_step": 390436, "epoch": 4704} {"train_loss": -26.0700626373291, "global_step": 390437, "epoch": 4704} {"train_loss": -25.611852645874023, "global_step": 390438, "epoch": 4704} {"train_loss": -25.631683349609375, "global_step": 390439, "epoch": 4704} {"train_loss": -26.169797897338867, "global_step": 390440, "epoch": 4704} {"train_loss": -25.950834274291992, "global_step": 390441, "epoch": 4704} {"train_loss": -26.17633628845215, "global_step": 390442, "epoch": 4704} {"train_loss": -26.188024520874023, "global_step": 390443, "epoch": 4704} {"train_loss": -26.12494468688965, "global_step": 390444, "epoch": 4704} {"train_loss": -26.0324764251709, "global_step": 390445, "epoch": 4704} {"train_loss": -26.027448654174805, "global_step": 390446, "epoch": 4704} {"train_loss": -26.739105224609375, "global_step": 390447, "epoch": 4704} {"train_loss": -25.99985122680664, "global_step": 390448, "epoch": 4704} {"train_loss": -26.248571395874023, "global_step": 390449, "epoch": 4704} {"train_loss": -26.412097930908203, "global_step": 390450, "epoch": 4704} {"train_loss": -26.38593101501465, "global_step": 390451, "epoch": 4704} {"train_loss": -26.6203556060791, "global_step": 390452, "epoch": 4704} {"train_loss": -26.2790470123291, "global_step": 390453, "epoch": 4704} {"train_loss": -26.44343376159668, "global_step": 390454, "epoch": 4704} {"train_loss": -26.366748809814453, "global_step": 390455, "epoch": 4704} {"train_loss": -26.359350204467773, "global_step": 390456, "epoch": 4704} {"train_loss": -26.226694107055664, "global_step": 390457, "epoch": 4704} {"train_loss": -26.125381469726562, "global_step": 390458, "epoch": 4704} {"train_loss": -26.3819580078125, "global_step": 390459, "epoch": 4704} {"train_loss": -26.677082061767578, "global_step": 390460, "epoch": 4704} {"train_loss": -26.18220329284668, "global_step": 390461, "epoch": 4704} {"train_loss": -26.24837303161621, "global_step": 390462, "epoch": 4704} {"train_loss": -26.110071182250977, "global_step": 390463, "epoch": 4704} {"train_loss": -26.66497802734375, "global_step": 390464, "epoch": 4704} {"train_loss": -26.783971786499023, "global_step": 390465, "epoch": 4704} {"train_loss": -26.685876846313477, "global_step": 390466, "epoch": 4704} {"train_loss": -26.53407859802246, "global_step": 390467, "epoch": 4704} {"train_loss": -26.653467178344727, "global_step": 390468, "epoch": 4704} {"train_loss": -26.565631866455078, "global_step": 390469, "epoch": 4704} {"train_loss": -26.56511878967285, "global_step": 390470, "epoch": 4704} {"train_loss": -26.866247177124023, "global_step": 390471, "epoch": 4704} {"train_loss": -26.9208984375, "global_step": 390472, "epoch": 4704} {"train_loss": -26.52320671081543, "global_step": 390473, "epoch": 4704} {"train_loss": -26.488128662109375, "global_step": 390474, "epoch": 4704} {"train_loss": -26.710798263549805, "global_step": 390475, "epoch": 4704} {"train_loss": -26.70462989807129, "global_step": 390476, "epoch": 4704} {"train_loss": -26.36627769470215, "global_step": 390477, "epoch": 4704} {"train_loss": -26.62074089050293, "global_step": 390478, "epoch": 4704} {"train_loss": -26.459854125976562, "global_step": 390479, "epoch": 4704} {"train_loss": -26.511505126953125, "global_step": 390480, "epoch": 4704} {"train_loss": -26.614505767822266, "global_step": 390481, "epoch": 4704} {"train_loss": -26.68206214904785, "global_step": 390482, "epoch": 4704} {"train_loss": -26.839263916015625, "global_step": 390483, "epoch": 4704} {"train_loss": -26.43902587890625, "global_step": 390484, "epoch": 4704} {"train_loss": -26.954071044921875, "global_step": 390485, "epoch": 4704} {"train_loss": -26.876981735229492, "global_step": 390486, "epoch": 4704} {"train_loss": -26.475330352783203, "global_step": 390487, "epoch": 4704} {"train_loss": -26.360258102416992, "global_step": 390488, "epoch": 4704} {"train_loss": -26.453954696655273, "global_step": 390489, "epoch": 4704} {"train_loss": -26.761682510375977, "global_step": 390490, "epoch": 4704} {"train_loss": -26.69171142578125, "global_step": 390491, "epoch": 4704} {"train_loss": -26.77716064453125, "global_step": 390492, "epoch": 4704} {"train_loss": -26.7688045501709, "global_step": 390493, "epoch": 4704} {"train_loss": -26.191730499267578, "global_step": 390494, "epoch": 4704} {"train_loss": -26.445066452026367, "global_step": 390495, "epoch": 4704} {"train_loss": -26.53377342224121, "global_step": 390496, "epoch": 4704} {"train_loss": -26.50642204284668, "global_step": 390497, "epoch": 4704} {"train_loss": -26.4831485748291, "global_step": 390498, "epoch": 4704} {"train_loss": -26.745410919189453, "global_step": 390499, "epoch": 4704} {"train_loss": -27.01795768737793, "global_step": 390500, "epoch": 4704} {"train_loss": -26.74640464782715, "global_step": 390501, "epoch": 4704} {"train_loss": -26.590381622314453, "global_step": 390502, "epoch": 4704} {"train_loss": -26.544340133666992, "global_step": 390503, "epoch": 4704} {"train_loss": -26.563568115234375, "global_step": 390504, "epoch": 4704} {"train_loss": -26.8184757232666, "global_step": 390505, "epoch": 4704} {"train_loss": -26.802343368530273, "global_step": 390506, "epoch": 4704} {"train_loss": -26.634815216064453, "global_step": 390507, "epoch": 4704} {"train_loss": -26.476856231689453, "global_step": 390508, "epoch": 4704} {"train_loss": -26.549116134643555, "global_step": 390509, "epoch": 4704} {"train_loss": -26.358402252197266, "global_step": 390510, "epoch": 4704} {"train_loss": -26.4769287109375, "global_step": 390511, "epoch": 4704} {"train_loss": -26.5199031829834, "global_step": 390512, "epoch": 4704} {"train_loss": -26.633798599243164, "global_step": 390513, "epoch": 4704} {"train_loss": -26.443174063441266, "global_step": 390514, "epoch": 4704, "val_loss": 6472347.0} {"train_loss": -26.46817398071289, "global_step": 390515, "epoch": 4705} {"train_loss": -26.043060302734375, "global_step": 390516, "epoch": 4705} {"train_loss": -26.157835006713867, "global_step": 390517, "epoch": 4705} {"train_loss": -26.137680053710938, "global_step": 390518, "epoch": 4705} {"train_loss": -26.24072265625, "global_step": 390519, "epoch": 4705} {"train_loss": -26.170801162719727, "global_step": 390520, "epoch": 4705} {"train_loss": -26.203296661376953, "global_step": 390521, "epoch": 4705} {"train_loss": -26.307193756103516, "global_step": 390522, "epoch": 4705} {"train_loss": -25.888639450073242, "global_step": 390523, "epoch": 4705} {"train_loss": -26.3505916595459, "global_step": 390524, "epoch": 4705} {"train_loss": -26.34375, "global_step": 390525, "epoch": 4705} {"train_loss": -26.76959800720215, "global_step": 390526, "epoch": 4705} {"train_loss": -26.172399520874023, "global_step": 390527, "epoch": 4705} {"train_loss": -26.38619041442871, "global_step": 390528, "epoch": 4705} {"train_loss": -26.770389556884766, "global_step": 390529, "epoch": 4705} {"train_loss": -26.40827751159668, "global_step": 390530, "epoch": 4705} {"train_loss": -26.55116081237793, "global_step": 390531, "epoch": 4705} {"train_loss": -26.653738021850586, "global_step": 390532, "epoch": 4705} {"train_loss": -26.316574096679688, "global_step": 390533, "epoch": 4705} {"train_loss": -26.856689453125, "global_step": 390534, "epoch": 4705} {"train_loss": -26.4857120513916, "global_step": 390535, "epoch": 4705} {"train_loss": -26.82655143737793, "global_step": 390536, "epoch": 4705} {"train_loss": -26.426456451416016, "global_step": 390537, "epoch": 4705} {"train_loss": -26.623151779174805, "global_step": 390538, "epoch": 4705} {"train_loss": -26.569738388061523, "global_step": 390539, "epoch": 4705} {"train_loss": -26.60023307800293, "global_step": 390540, "epoch": 4705} {"train_loss": -26.758228302001953, "global_step": 390541, "epoch": 4705} {"train_loss": -26.771682739257812, "global_step": 390542, "epoch": 4705} {"train_loss": -26.639978408813477, "global_step": 390543, "epoch": 4705} {"train_loss": -26.628986358642578, "global_step": 390544, "epoch": 4705} {"train_loss": -26.670373916625977, "global_step": 390545, "epoch": 4705} {"train_loss": -26.744735717773438, "global_step": 390546, "epoch": 4705} {"train_loss": -26.665002822875977, "global_step": 390547, "epoch": 4705} {"train_loss": -26.972183227539062, "global_step": 390548, "epoch": 4705} {"train_loss": -26.656116485595703, "global_step": 390549, "epoch": 4705} {"train_loss": -26.591236114501953, "global_step": 390550, "epoch": 4705} {"train_loss": -26.743133544921875, "global_step": 390551, "epoch": 4705} {"train_loss": -26.748178482055664, "global_step": 390552, "epoch": 4705} {"train_loss": -26.6201114654541, "global_step": 390553, "epoch": 4705} {"train_loss": -26.747344970703125, "global_step": 390554, "epoch": 4705} {"train_loss": -26.56495475769043, "global_step": 390555, "epoch": 4705} {"train_loss": -26.194385528564453, "global_step": 390556, "epoch": 4705} {"train_loss": -26.8704833984375, "global_step": 390557, "epoch": 4705} {"train_loss": -26.366973876953125, "global_step": 390558, "epoch": 4705} {"train_loss": -26.59927749633789, "global_step": 390559, "epoch": 4705} {"train_loss": -26.87518882751465, "global_step": 390560, "epoch": 4705} {"train_loss": -26.696264266967773, "global_step": 390561, "epoch": 4705} {"train_loss": -26.809186935424805, "global_step": 390562, "epoch": 4705} {"train_loss": -26.68232536315918, "global_step": 390563, "epoch": 4705} {"train_loss": -26.932910919189453, "global_step": 390564, "epoch": 4705} {"train_loss": -26.925344467163086, "global_step": 390565, "epoch": 4705} {"train_loss": -26.61142921447754, "global_step": 390566, "epoch": 4705} {"train_loss": -26.234725952148438, "global_step": 390567, "epoch": 4705} {"train_loss": -26.232120513916016, "global_step": 390568, "epoch": 4705} {"train_loss": -26.227659225463867, "global_step": 390569, "epoch": 4705} {"train_loss": -26.4964599609375, "global_step": 390570, "epoch": 4705} {"train_loss": -26.920562744140625, "global_step": 390571, "epoch": 4705} {"train_loss": -26.76474380493164, "global_step": 390572, "epoch": 4705} {"train_loss": -26.31524658203125, "global_step": 390573, "epoch": 4705} {"train_loss": -26.31148338317871, "global_step": 390574, "epoch": 4705} {"train_loss": -26.198455810546875, "global_step": 390575, "epoch": 4705} {"train_loss": -26.7841796875, "global_step": 390576, "epoch": 4705} {"train_loss": -26.24759292602539, "global_step": 390577, "epoch": 4705} {"train_loss": -26.470239639282227, "global_step": 390578, "epoch": 4705} {"train_loss": -26.620899200439453, "global_step": 390579, "epoch": 4705} {"train_loss": -26.602319717407227, "global_step": 390580, "epoch": 4705} {"train_loss": -26.724943161010742, "global_step": 390581, "epoch": 4705} {"train_loss": -26.588953018188477, "global_step": 390582, "epoch": 4705} {"train_loss": -26.572158813476562, "global_step": 390583, "epoch": 4705} {"train_loss": -26.14069938659668, "global_step": 390584, "epoch": 4705} {"train_loss": -26.4395751953125, "global_step": 390585, "epoch": 4705} {"train_loss": -26.70380973815918, "global_step": 390586, "epoch": 4705} {"train_loss": -26.670581817626953, "global_step": 390587, "epoch": 4705} {"train_loss": -26.413360595703125, "global_step": 390588, "epoch": 4705} {"train_loss": -26.2974853515625, "global_step": 390589, "epoch": 4705} {"train_loss": -26.618789672851562, "global_step": 390590, "epoch": 4705} {"train_loss": -26.317686080932617, "global_step": 390591, "epoch": 4705} {"train_loss": -26.601200103759766, "global_step": 390592, "epoch": 4705} {"train_loss": -26.708759307861328, "global_step": 390593, "epoch": 4705} {"train_loss": -26.634450912475586, "global_step": 390594, "epoch": 4705} {"train_loss": -26.796817779541016, "global_step": 390595, "epoch": 4705} {"train_loss": -26.899890899658203, "global_step": 390596, "epoch": 4705} {"train_loss": -26.546601146100514, "global_step": 390597, "epoch": 4705, "val_loss": 6500392.0} {"train_loss": -25.76761245727539, "global_step": 390598, "epoch": 4706} {"train_loss": -26.20380210876465, "global_step": 390599, "epoch": 4706} {"train_loss": -25.657377243041992, "global_step": 390600, "epoch": 4706} {"train_loss": -25.6964168548584, "global_step": 390601, "epoch": 4706} {"train_loss": -26.09559440612793, "global_step": 390602, "epoch": 4706} {"train_loss": -25.81157875061035, "global_step": 390603, "epoch": 4706} {"train_loss": -25.78564453125, "global_step": 390604, "epoch": 4706} {"train_loss": -26.053863525390625, "global_step": 390605, "epoch": 4706} {"train_loss": -25.917236328125, "global_step": 390606, "epoch": 4706} {"train_loss": -25.260589599609375, "global_step": 390607, "epoch": 4706} {"train_loss": -26.237079620361328, "global_step": 390608, "epoch": 4706} {"train_loss": -26.3342227935791, "global_step": 390609, "epoch": 4706} {"train_loss": -25.930418014526367, "global_step": 390610, "epoch": 4706} {"train_loss": -26.010412216186523, "global_step": 390611, "epoch": 4706} {"train_loss": -25.992544174194336, "global_step": 390612, "epoch": 4706} {"train_loss": -26.028860092163086, "global_step": 390613, "epoch": 4706} {"train_loss": -26.318817138671875, "global_step": 390614, "epoch": 4706} {"train_loss": -26.1182804107666, "global_step": 390615, "epoch": 4706} {"train_loss": -26.194904327392578, "global_step": 390616, "epoch": 4706} {"train_loss": -25.653411865234375, "global_step": 390617, "epoch": 4706} {"train_loss": -26.320423126220703, "global_step": 390618, "epoch": 4706} {"train_loss": -26.203283309936523, "global_step": 390619, "epoch": 4706} {"train_loss": -26.084430694580078, "global_step": 390620, "epoch": 4706} {"train_loss": -26.390338897705078, "global_step": 390621, "epoch": 4706} {"train_loss": -25.96333122253418, "global_step": 390622, "epoch": 4706} {"train_loss": -26.282581329345703, "global_step": 390623, "epoch": 4706} {"train_loss": -26.109540939331055, "global_step": 390624, "epoch": 4706} {"train_loss": -26.31898307800293, "global_step": 390625, "epoch": 4706} {"train_loss": -26.168914794921875, "global_step": 390626, "epoch": 4706} {"train_loss": -26.149744033813477, "global_step": 390627, "epoch": 4706} {"train_loss": -26.417591094970703, "global_step": 390628, "epoch": 4706} {"train_loss": -26.06146812438965, "global_step": 390629, "epoch": 4706} {"train_loss": -26.268701553344727, "global_step": 390630, "epoch": 4706} {"train_loss": -26.3204288482666, "global_step": 390631, "epoch": 4706} {"train_loss": -26.343109130859375, "global_step": 390632, "epoch": 4706} {"train_loss": -26.343997955322266, "global_step": 390633, "epoch": 4706} {"train_loss": -26.3477725982666, "global_step": 390634, "epoch": 4706} {"train_loss": -26.220800399780273, "global_step": 390635, "epoch": 4706} {"train_loss": -26.608545303344727, "global_step": 390636, "epoch": 4706} {"train_loss": -26.738086700439453, "global_step": 390637, "epoch": 4706} {"train_loss": -26.346542358398438, "global_step": 390638, "epoch": 4706} {"train_loss": -26.474706649780273, "global_step": 390639, "epoch": 4706} {"train_loss": -26.30109977722168, "global_step": 390640, "epoch": 4706} {"train_loss": -26.840377807617188, "global_step": 390641, "epoch": 4706} {"train_loss": -26.27936363220215, "global_step": 390642, "epoch": 4706} {"train_loss": -26.41851234436035, "global_step": 390643, "epoch": 4706} {"train_loss": -26.408313751220703, "global_step": 390644, "epoch": 4706} {"train_loss": -26.4259090423584, "global_step": 390645, "epoch": 4706} {"train_loss": -26.473779678344727, "global_step": 390646, "epoch": 4706} {"train_loss": -26.24246597290039, "global_step": 390647, "epoch": 4706} {"train_loss": -26.20049476623535, "global_step": 390648, "epoch": 4706} {"train_loss": -26.57546043395996, "global_step": 390649, "epoch": 4706} {"train_loss": -26.518524169921875, "global_step": 390650, "epoch": 4706} {"train_loss": -26.70918083190918, "global_step": 390651, "epoch": 4706} {"train_loss": -26.238264083862305, "global_step": 390652, "epoch": 4706} {"train_loss": -26.300506591796875, "global_step": 390653, "epoch": 4706} {"train_loss": -26.99198341369629, "global_step": 390654, "epoch": 4706} {"train_loss": -26.547128677368164, "global_step": 390655, "epoch": 4706} {"train_loss": -26.460241317749023, "global_step": 390656, "epoch": 4706} {"train_loss": -26.343481063842773, "global_step": 390657, "epoch": 4706} {"train_loss": -26.811222076416016, "global_step": 390658, "epoch": 4706} {"train_loss": -26.748462677001953, "global_step": 390659, "epoch": 4706} {"train_loss": -26.55674171447754, "global_step": 390660, "epoch": 4706} {"train_loss": -26.363977432250977, "global_step": 390661, "epoch": 4706} {"train_loss": -26.53816795349121, "global_step": 390662, "epoch": 4706} {"train_loss": -26.820459365844727, "global_step": 390663, "epoch": 4706} {"train_loss": -26.945587158203125, "global_step": 390664, "epoch": 4706} {"train_loss": -26.636505126953125, "global_step": 390665, "epoch": 4706} {"train_loss": -26.781726837158203, "global_step": 390666, "epoch": 4706} {"train_loss": -26.724653244018555, "global_step": 390667, "epoch": 4706} {"train_loss": -26.6085262298584, "global_step": 390668, "epoch": 4706} {"train_loss": -26.475305557250977, "global_step": 390669, "epoch": 4706} {"train_loss": -26.7006778717041, "global_step": 390670, "epoch": 4706} {"train_loss": -26.610050201416016, "global_step": 390671, "epoch": 4706} {"train_loss": -27.021595001220703, "global_step": 390672, "epoch": 4706} {"train_loss": -26.727188110351562, "global_step": 390673, "epoch": 4706} {"train_loss": -26.354766845703125, "global_step": 390674, "epoch": 4706} {"train_loss": -26.989225387573242, "global_step": 390675, "epoch": 4706} {"train_loss": -26.690908432006836, "global_step": 390676, "epoch": 4706} {"train_loss": -26.751327514648438, "global_step": 390677, "epoch": 4706} {"train_loss": -26.554731369018555, "global_step": 390678, "epoch": 4706} {"train_loss": -27.11181640625, "global_step": 390679, "epoch": 4706} {"train_loss": -26.358262004622492, "global_step": 390680, "epoch": 4706, "val_loss": 6628746.0} {"train_loss": -24.446304321289062, "global_step": 390681, "epoch": 4707} {"train_loss": -22.51033592224121, "global_step": 390682, "epoch": 4707} {"train_loss": -24.530845642089844, "global_step": 390683, "epoch": 4707} {"train_loss": -25.303815841674805, "global_step": 390684, "epoch": 4707} {"train_loss": -24.575687408447266, "global_step": 390685, "epoch": 4707} {"train_loss": -25.549606323242188, "global_step": 390686, "epoch": 4707} {"train_loss": -25.118741989135742, "global_step": 390687, "epoch": 4707} {"train_loss": -25.898427963256836, "global_step": 390688, "epoch": 4707} {"train_loss": -25.12930679321289, "global_step": 390689, "epoch": 4707} {"train_loss": -25.988449096679688, "global_step": 390690, "epoch": 4707} {"train_loss": -25.4171142578125, "global_step": 390691, "epoch": 4707} {"train_loss": -25.74224281311035, "global_step": 390692, "epoch": 4707} {"train_loss": -25.82340431213379, "global_step": 390693, "epoch": 4707} {"train_loss": -25.661352157592773, "global_step": 390694, "epoch": 4707} {"train_loss": -26.0443172454834, "global_step": 390695, "epoch": 4707} {"train_loss": -25.7275390625, "global_step": 390696, "epoch": 4707} {"train_loss": -25.90899085998535, "global_step": 390697, "epoch": 4707} {"train_loss": -25.741546630859375, "global_step": 390698, "epoch": 4707} {"train_loss": -25.90132713317871, "global_step": 390699, "epoch": 4707} {"train_loss": -25.60627555847168, "global_step": 390700, "epoch": 4707} {"train_loss": -25.53780174255371, "global_step": 390701, "epoch": 4707} {"train_loss": -26.125091552734375, "global_step": 390702, "epoch": 4707} {"train_loss": -25.824237823486328, "global_step": 390703, "epoch": 4707} {"train_loss": -26.265487670898438, "global_step": 390704, "epoch": 4707} {"train_loss": -26.184619903564453, "global_step": 390705, "epoch": 4707} {"train_loss": -26.042022705078125, "global_step": 390706, "epoch": 4707} {"train_loss": -26.39432144165039, "global_step": 390707, "epoch": 4707} {"train_loss": -26.630084991455078, "global_step": 390708, "epoch": 4707} {"train_loss": -26.3586483001709, "global_step": 390709, "epoch": 4707} {"train_loss": -26.20598793029785, "global_step": 390710, "epoch": 4707} {"train_loss": -26.182249069213867, "global_step": 390711, "epoch": 4707} {"train_loss": -26.28925132751465, "global_step": 390712, "epoch": 4707} {"train_loss": -26.030248641967773, "global_step": 390713, "epoch": 4707} {"train_loss": -26.641889572143555, "global_step": 390714, "epoch": 4707} {"train_loss": -26.200414657592773, "global_step": 390715, "epoch": 4707} {"train_loss": -26.319873809814453, "global_step": 390716, "epoch": 4707} {"train_loss": -26.650726318359375, "global_step": 390717, "epoch": 4707} {"train_loss": -26.730321884155273, "global_step": 390718, "epoch": 4707} {"train_loss": -26.67165184020996, "global_step": 390719, "epoch": 4707} {"train_loss": -26.94099998474121, "global_step": 390720, "epoch": 4707} {"train_loss": -26.693567276000977, "global_step": 390721, "epoch": 4707} {"train_loss": -26.63776969909668, "global_step": 390722, "epoch": 4707} {"train_loss": -26.57931900024414, "global_step": 390723, "epoch": 4707} {"train_loss": -26.142547607421875, "global_step": 390724, "epoch": 4707} {"train_loss": -26.374332427978516, "global_step": 390725, "epoch": 4707} {"train_loss": -26.802404403686523, "global_step": 390726, "epoch": 4707} {"train_loss": -26.282093048095703, "global_step": 390727, "epoch": 4707} {"train_loss": -26.49367332458496, "global_step": 390728, "epoch": 4707} {"train_loss": -27.105548858642578, "global_step": 390729, "epoch": 4707} {"train_loss": -26.43756675720215, "global_step": 390730, "epoch": 4707} {"train_loss": -26.590391159057617, "global_step": 390731, "epoch": 4707} {"train_loss": -27.1507511138916, "global_step": 390732, "epoch": 4707} {"train_loss": -27.017587661743164, "global_step": 390733, "epoch": 4707} {"train_loss": -26.53899574279785, "global_step": 390734, "epoch": 4707} {"train_loss": -26.77216148376465, "global_step": 390735, "epoch": 4707} {"train_loss": -27.100263595581055, "global_step": 390736, "epoch": 4707} {"train_loss": -26.450109481811523, "global_step": 390737, "epoch": 4707} {"train_loss": -26.964242935180664, "global_step": 390738, "epoch": 4707} {"train_loss": -26.495468139648438, "global_step": 390739, "epoch": 4707} {"train_loss": -26.96209144592285, "global_step": 390740, "epoch": 4707} {"train_loss": -26.827966690063477, "global_step": 390741, "epoch": 4707} {"train_loss": -26.688385009765625, "global_step": 390742, "epoch": 4707} {"train_loss": -26.849225997924805, "global_step": 390743, "epoch": 4707} {"train_loss": -26.4766845703125, "global_step": 390744, "epoch": 4707} {"train_loss": -26.70363426208496, "global_step": 390745, "epoch": 4707} {"train_loss": -26.581649780273438, "global_step": 390746, "epoch": 4707} {"train_loss": -26.757898330688477, "global_step": 390747, "epoch": 4707} {"train_loss": -26.610395431518555, "global_step": 390748, "epoch": 4707} {"train_loss": -26.537067413330078, "global_step": 390749, "epoch": 4707} {"train_loss": -26.7567081451416, "global_step": 390750, "epoch": 4707} {"train_loss": -26.79920768737793, "global_step": 390751, "epoch": 4707} {"train_loss": -26.432971954345703, "global_step": 390752, "epoch": 4707} {"train_loss": -26.750181198120117, "global_step": 390753, "epoch": 4707} {"train_loss": -26.46518325805664, "global_step": 390754, "epoch": 4707} {"train_loss": -26.158788681030273, "global_step": 390755, "epoch": 4707} {"train_loss": -26.387475967407227, "global_step": 390756, "epoch": 4707} {"train_loss": -26.583524703979492, "global_step": 390757, "epoch": 4707} {"train_loss": -26.68706703186035, "global_step": 390758, "epoch": 4707} {"train_loss": -26.386686325073242, "global_step": 390759, "epoch": 4707} {"train_loss": -26.79290199279785, "global_step": 390760, "epoch": 4707} {"train_loss": -26.73063087463379, "global_step": 390761, "epoch": 4707} {"train_loss": -26.413665771484375, "global_step": 390762, "epoch": 4707} {"train_loss": -26.2420172863696, "global_step": 390763, "epoch": 4707, "val_loss": 6681148.0} {"train_loss": -26.21462059020996, "global_step": 390764, "epoch": 4708} {"train_loss": -26.17500114440918, "global_step": 390765, "epoch": 4708} {"train_loss": -26.324613571166992, "global_step": 390766, "epoch": 4708} {"train_loss": -26.4897518157959, "global_step": 390767, "epoch": 4708} {"train_loss": -26.533782958984375, "global_step": 390768, "epoch": 4708} {"train_loss": -26.401264190673828, "global_step": 390769, "epoch": 4708} {"train_loss": -26.166547775268555, "global_step": 390770, "epoch": 4708} {"train_loss": -26.23211669921875, "global_step": 390771, "epoch": 4708} {"train_loss": -26.494909286499023, "global_step": 390772, "epoch": 4708} {"train_loss": -26.428510665893555, "global_step": 390773, "epoch": 4708} {"train_loss": -26.71282386779785, "global_step": 390774, "epoch": 4708} {"train_loss": -26.962188720703125, "global_step": 390775, "epoch": 4708} {"train_loss": -26.388364791870117, "global_step": 390776, "epoch": 4708} {"train_loss": -26.30643653869629, "global_step": 390777, "epoch": 4708} {"train_loss": -26.330175399780273, "global_step": 390778, "epoch": 4708} {"train_loss": -26.2950382232666, "global_step": 390779, "epoch": 4708} {"train_loss": -26.723501205444336, "global_step": 390780, "epoch": 4708} {"train_loss": -26.077035903930664, "global_step": 390781, "epoch": 4708} {"train_loss": -26.656021118164062, "global_step": 390782, "epoch": 4708} {"train_loss": -26.09986686706543, "global_step": 390783, "epoch": 4708} {"train_loss": -26.249542236328125, "global_step": 390784, "epoch": 4708} {"train_loss": -26.4654598236084, "global_step": 390785, "epoch": 4708} {"train_loss": -26.747251510620117, "global_step": 390786, "epoch": 4708} {"train_loss": -26.824493408203125, "global_step": 390787, "epoch": 4708} {"train_loss": -26.56597900390625, "global_step": 390788, "epoch": 4708} {"train_loss": -26.87646484375, "global_step": 390789, "epoch": 4708} {"train_loss": -26.408655166625977, "global_step": 390790, "epoch": 4708} {"train_loss": -26.339862823486328, "global_step": 390791, "epoch": 4708} {"train_loss": -26.41535758972168, "global_step": 390792, "epoch": 4708} {"train_loss": -26.4260311126709, "global_step": 390793, "epoch": 4708} {"train_loss": -26.630386352539062, "global_step": 390794, "epoch": 4708} {"train_loss": -26.289688110351562, "global_step": 390795, "epoch": 4708} {"train_loss": -26.691003799438477, "global_step": 390796, "epoch": 4708} {"train_loss": -26.433359146118164, "global_step": 390797, "epoch": 4708} {"train_loss": -26.9217586517334, "global_step": 390798, "epoch": 4708} {"train_loss": -26.882612228393555, "global_step": 390799, "epoch": 4708} {"train_loss": -26.75729751586914, "global_step": 390800, "epoch": 4708} {"train_loss": -26.81385612487793, "global_step": 390801, "epoch": 4708} {"train_loss": -26.504150390625, "global_step": 390802, "epoch": 4708} {"train_loss": -26.362018585205078, "global_step": 390803, "epoch": 4708} {"train_loss": -26.925519943237305, "global_step": 390804, "epoch": 4708} {"train_loss": -26.419340133666992, "global_step": 390805, "epoch": 4708} {"train_loss": -26.482099533081055, "global_step": 390806, "epoch": 4708} {"train_loss": -26.95814323425293, "global_step": 390807, "epoch": 4708} {"train_loss": -26.647695541381836, "global_step": 390808, "epoch": 4708} {"train_loss": -26.823266983032227, "global_step": 390809, "epoch": 4708} {"train_loss": -26.664264678955078, "global_step": 390810, "epoch": 4708} {"train_loss": -26.928466796875, "global_step": 390811, "epoch": 4708} {"train_loss": -26.598709106445312, "global_step": 390812, "epoch": 4708} {"train_loss": -26.542036056518555, "global_step": 390813, "epoch": 4708} {"train_loss": -26.50357437133789, "global_step": 390814, "epoch": 4708} {"train_loss": -26.282962799072266, "global_step": 390815, "epoch": 4708} {"train_loss": -26.445234298706055, "global_step": 390816, "epoch": 4708} {"train_loss": -26.00227165222168, "global_step": 390817, "epoch": 4708} {"train_loss": -26.290668487548828, "global_step": 390818, "epoch": 4708} {"train_loss": -26.32989501953125, "global_step": 390819, "epoch": 4708} {"train_loss": -26.3346004486084, "global_step": 390820, "epoch": 4708} {"train_loss": -25.899688720703125, "global_step": 390821, "epoch": 4708} {"train_loss": -25.225589752197266, "global_step": 390822, "epoch": 4708} {"train_loss": -25.94614601135254, "global_step": 390823, "epoch": 4708} {"train_loss": -26.531396865844727, "global_step": 390824, "epoch": 4708} {"train_loss": -26.59224510192871, "global_step": 390825, "epoch": 4708} {"train_loss": -26.179834365844727, "global_step": 390826, "epoch": 4708} {"train_loss": -26.463842391967773, "global_step": 390827, "epoch": 4708} {"train_loss": -26.521728515625, "global_step": 390828, "epoch": 4708} {"train_loss": -26.341907501220703, "global_step": 390829, "epoch": 4708} {"train_loss": -26.228504180908203, "global_step": 390830, "epoch": 4708} {"train_loss": -26.343246459960938, "global_step": 390831, "epoch": 4708} {"train_loss": -26.541418075561523, "global_step": 390832, "epoch": 4708} {"train_loss": -26.179889678955078, "global_step": 390833, "epoch": 4708} {"train_loss": -26.424352645874023, "global_step": 390834, "epoch": 4708} {"train_loss": -26.34628677368164, "global_step": 390835, "epoch": 4708} {"train_loss": -26.615705490112305, "global_step": 390836, "epoch": 4708} {"train_loss": -26.326223373413086, "global_step": 390837, "epoch": 4708} {"train_loss": -26.347944259643555, "global_step": 390838, "epoch": 4708} {"train_loss": -26.373401641845703, "global_step": 390839, "epoch": 4708} {"train_loss": -26.287094116210938, "global_step": 390840, "epoch": 4708} {"train_loss": -26.26651954650879, "global_step": 390841, "epoch": 4708} {"train_loss": -26.25760841369629, "global_step": 390842, "epoch": 4708} {"train_loss": -26.708515167236328, "global_step": 390843, "epoch": 4708} {"train_loss": -26.53204917907715, "global_step": 390844, "epoch": 4708} {"train_loss": -25.997547149658203, "global_step": 390845, "epoch": 4708} {"train_loss": -26.459238672830974, "global_step": 390846, "epoch": 4708, "val_loss": 6723661.0} {"train_loss": -26.29656982421875, "global_step": 390847, "epoch": 4709} {"train_loss": -26.080251693725586, "global_step": 390848, "epoch": 4709} {"train_loss": -25.8990478515625, "global_step": 390849, "epoch": 4709} {"train_loss": -26.416296005249023, "global_step": 390850, "epoch": 4709} {"train_loss": -26.189926147460938, "global_step": 390851, "epoch": 4709} {"train_loss": -26.19928550720215, "global_step": 390852, "epoch": 4709} {"train_loss": -25.859128952026367, "global_step": 390853, "epoch": 4709} {"train_loss": -25.904010772705078, "global_step": 390854, "epoch": 4709} {"train_loss": -25.936758041381836, "global_step": 390855, "epoch": 4709} {"train_loss": -25.801233291625977, "global_step": 390856, "epoch": 4709} {"train_loss": -25.7357120513916, "global_step": 390857, "epoch": 4709} {"train_loss": -26.47125244140625, "global_step": 390858, "epoch": 4709} {"train_loss": -25.852575302124023, "global_step": 390859, "epoch": 4709} {"train_loss": -26.685657501220703, "global_step": 390860, "epoch": 4709} {"train_loss": -26.058624267578125, "global_step": 390861, "epoch": 4709} {"train_loss": -26.322336196899414, "global_step": 390862, "epoch": 4709} {"train_loss": -26.154706954956055, "global_step": 390863, "epoch": 4709} {"train_loss": -26.436599731445312, "global_step": 390864, "epoch": 4709} {"train_loss": -26.33843994140625, "global_step": 390865, "epoch": 4709} {"train_loss": -26.084402084350586, "global_step": 390866, "epoch": 4709} {"train_loss": -26.173465728759766, "global_step": 390867, "epoch": 4709} {"train_loss": -26.373083114624023, "global_step": 390868, "epoch": 4709} {"train_loss": -26.11094093322754, "global_step": 390869, "epoch": 4709} {"train_loss": -26.330841064453125, "global_step": 390870, "epoch": 4709} {"train_loss": -26.279525756835938, "global_step": 390871, "epoch": 4709} {"train_loss": -26.56117057800293, "global_step": 390872, "epoch": 4709} {"train_loss": -26.107343673706055, "global_step": 390873, "epoch": 4709} {"train_loss": -26.56502342224121, "global_step": 390874, "epoch": 4709} {"train_loss": -26.226715087890625, "global_step": 390875, "epoch": 4709} {"train_loss": -26.43902015686035, "global_step": 390876, "epoch": 4709} {"train_loss": -26.216100692749023, "global_step": 390877, "epoch": 4709} {"train_loss": -26.40638542175293, "global_step": 390878, "epoch": 4709} {"train_loss": -26.3244686126709, "global_step": 390879, "epoch": 4709} {"train_loss": -26.087636947631836, "global_step": 390880, "epoch": 4709} {"train_loss": -26.690753936767578, "global_step": 390881, "epoch": 4709} {"train_loss": -26.356414794921875, "global_step": 390882, "epoch": 4709} {"train_loss": -26.655588150024414, "global_step": 390883, "epoch": 4709} {"train_loss": -26.5018310546875, "global_step": 390884, "epoch": 4709} {"train_loss": -26.780136108398438, "global_step": 390885, "epoch": 4709} {"train_loss": -26.264814376831055, "global_step": 390886, "epoch": 4709} {"train_loss": -26.5451717376709, "global_step": 390887, "epoch": 4709} {"train_loss": -26.370817184448242, "global_step": 390888, "epoch": 4709} {"train_loss": -26.488025665283203, "global_step": 390889, "epoch": 4709} {"train_loss": -26.42523193359375, "global_step": 390890, "epoch": 4709} {"train_loss": -26.80474853515625, "global_step": 390891, "epoch": 4709} {"train_loss": -26.783588409423828, "global_step": 390892, "epoch": 4709} {"train_loss": -26.432422637939453, "global_step": 390893, "epoch": 4709} {"train_loss": -26.425537109375, "global_step": 390894, "epoch": 4709} {"train_loss": -26.807096481323242, "global_step": 390895, "epoch": 4709} {"train_loss": -26.38783073425293, "global_step": 390896, "epoch": 4709} {"train_loss": -26.391698837280273, "global_step": 390897, "epoch": 4709} {"train_loss": -26.299701690673828, "global_step": 390898, "epoch": 4709} {"train_loss": -26.52861976623535, "global_step": 390899, "epoch": 4709} {"train_loss": -26.673160552978516, "global_step": 390900, "epoch": 4709} {"train_loss": -26.584415435791016, "global_step": 390901, "epoch": 4709} {"train_loss": -26.837289810180664, "global_step": 390902, "epoch": 4709} {"train_loss": -26.382797241210938, "global_step": 390903, "epoch": 4709} {"train_loss": -26.726850509643555, "global_step": 390904, "epoch": 4709} {"train_loss": -26.961902618408203, "global_step": 390905, "epoch": 4709} {"train_loss": -27.154529571533203, "global_step": 390906, "epoch": 4709} {"train_loss": -26.302764892578125, "global_step": 390907, "epoch": 4709} {"train_loss": -26.423192977905273, "global_step": 390908, "epoch": 4709} {"train_loss": -26.318204879760742, "global_step": 390909, "epoch": 4709} {"train_loss": -25.99238395690918, "global_step": 390910, "epoch": 4709} {"train_loss": -26.016199111938477, "global_step": 390911, "epoch": 4709} {"train_loss": -25.3958797454834, "global_step": 390912, "epoch": 4709} {"train_loss": -26.505640029907227, "global_step": 390913, "epoch": 4709} {"train_loss": -26.60617446899414, "global_step": 390914, "epoch": 4709} {"train_loss": -26.740270614624023, "global_step": 390915, "epoch": 4709} {"train_loss": -26.19215202331543, "global_step": 390916, "epoch": 4709} {"train_loss": -25.98682975769043, "global_step": 390917, "epoch": 4709} {"train_loss": -26.653120040893555, "global_step": 390918, "epoch": 4709} {"train_loss": -26.698461532592773, "global_step": 390919, "epoch": 4709} {"train_loss": -26.546411514282227, "global_step": 390920, "epoch": 4709} {"train_loss": -26.76392936706543, "global_step": 390921, "epoch": 4709} {"train_loss": -26.621301651000977, "global_step": 390922, "epoch": 4709} {"train_loss": -26.6202335357666, "global_step": 390923, "epoch": 4709} {"train_loss": -26.459827423095703, "global_step": 390924, "epoch": 4709} {"train_loss": -26.351362228393555, "global_step": 390925, "epoch": 4709} {"train_loss": -26.540151596069336, "global_step": 390926, "epoch": 4709} {"train_loss": -26.533309936523438, "global_step": 390927, "epoch": 4709} {"train_loss": -26.842864990234375, "global_step": 390928, "epoch": 4709} {"train_loss": -26.378336228520038, "global_step": 390929, "epoch": 4709, "val_loss": 6662279.0} {"train_loss": -25.450387954711914, "global_step": 390930, "epoch": 4710} {"train_loss": -25.55208396911621, "global_step": 390931, "epoch": 4710} {"train_loss": -25.899627685546875, "global_step": 390932, "epoch": 4710} {"train_loss": -26.201696395874023, "global_step": 390933, "epoch": 4710} {"train_loss": -25.38763999938965, "global_step": 390934, "epoch": 4710} {"train_loss": -25.93158531188965, "global_step": 390935, "epoch": 4710} {"train_loss": -25.545822143554688, "global_step": 390936, "epoch": 4710} {"train_loss": -26.276269912719727, "global_step": 390937, "epoch": 4710} {"train_loss": -26.069700241088867, "global_step": 390938, "epoch": 4710} {"train_loss": -25.778797149658203, "global_step": 390939, "epoch": 4710} {"train_loss": -26.05779457092285, "global_step": 390940, "epoch": 4710} {"train_loss": -25.96257972717285, "global_step": 390941, "epoch": 4710} {"train_loss": -26.016653060913086, "global_step": 390942, "epoch": 4710} {"train_loss": -25.97650146484375, "global_step": 390943, "epoch": 4710} {"train_loss": -26.134693145751953, "global_step": 390944, "epoch": 4710} {"train_loss": -26.197885513305664, "global_step": 390945, "epoch": 4710} {"train_loss": -25.999908447265625, "global_step": 390946, "epoch": 4710} {"train_loss": -26.63705825805664, "global_step": 390947, "epoch": 4710} {"train_loss": -26.25412368774414, "global_step": 390948, "epoch": 4710} {"train_loss": -26.156702041625977, "global_step": 390949, "epoch": 4710} {"train_loss": -26.266483306884766, "global_step": 390950, "epoch": 4710} {"train_loss": -26.10585594177246, "global_step": 390951, "epoch": 4710} {"train_loss": -26.505401611328125, "global_step": 390952, "epoch": 4710} {"train_loss": -26.627033233642578, "global_step": 390953, "epoch": 4710} {"train_loss": -26.522886276245117, "global_step": 390954, "epoch": 4710} {"train_loss": -26.721176147460938, "global_step": 390955, "epoch": 4710} {"train_loss": -26.169599533081055, "global_step": 390956, "epoch": 4710} {"train_loss": -26.54243278503418, "global_step": 390957, "epoch": 4710} {"train_loss": -26.84031105041504, "global_step": 390958, "epoch": 4710} {"train_loss": -26.261383056640625, "global_step": 390959, "epoch": 4710} {"train_loss": -26.450361251831055, "global_step": 390960, "epoch": 4710} {"train_loss": -26.458707809448242, "global_step": 390961, "epoch": 4710} {"train_loss": -26.76201820373535, "global_step": 390962, "epoch": 4710} {"train_loss": -26.676218032836914, "global_step": 390963, "epoch": 4710} {"train_loss": -26.761051177978516, "global_step": 390964, "epoch": 4710} {"train_loss": -26.267288208007812, "global_step": 390965, "epoch": 4710} {"train_loss": -26.228551864624023, "global_step": 390966, "epoch": 4710} {"train_loss": -26.39518165588379, "global_step": 390967, "epoch": 4710} {"train_loss": -26.634841918945312, "global_step": 390968, "epoch": 4710} {"train_loss": -26.352758407592773, "global_step": 390969, "epoch": 4710} {"train_loss": -26.925872802734375, "global_step": 390970, "epoch": 4710} {"train_loss": -26.193761825561523, "global_step": 390971, "epoch": 4710} {"train_loss": -26.98431396484375, "global_step": 390972, "epoch": 4710} {"train_loss": -26.6668758392334, "global_step": 390973, "epoch": 4710} {"train_loss": -26.526294708251953, "global_step": 390974, "epoch": 4710} {"train_loss": -26.86406898498535, "global_step": 390975, "epoch": 4710} {"train_loss": -26.7778263092041, "global_step": 390976, "epoch": 4710} {"train_loss": -26.82195472717285, "global_step": 390977, "epoch": 4710} {"train_loss": -26.621856689453125, "global_step": 390978, "epoch": 4710} {"train_loss": -26.674646377563477, "global_step": 390979, "epoch": 4710} {"train_loss": -26.76629638671875, "global_step": 390980, "epoch": 4710} {"train_loss": -27.01377296447754, "global_step": 390981, "epoch": 4710} {"train_loss": -26.76263999938965, "global_step": 390982, "epoch": 4710} {"train_loss": -26.396093368530273, "global_step": 390983, "epoch": 4710} {"train_loss": -26.848724365234375, "global_step": 390984, "epoch": 4710} {"train_loss": -26.768644332885742, "global_step": 390985, "epoch": 4710} {"train_loss": -26.366613388061523, "global_step": 390986, "epoch": 4710} {"train_loss": -26.17374610900879, "global_step": 390987, "epoch": 4710} {"train_loss": -26.42902183532715, "global_step": 390988, "epoch": 4710} {"train_loss": -26.649860382080078, "global_step": 390989, "epoch": 4710} {"train_loss": -26.758747100830078, "global_step": 390990, "epoch": 4710} {"train_loss": -26.60422706604004, "global_step": 390991, "epoch": 4710} {"train_loss": -26.63715934753418, "global_step": 390992, "epoch": 4710} {"train_loss": -26.32468605041504, "global_step": 390993, "epoch": 4710} {"train_loss": -26.86726188659668, "global_step": 390994, "epoch": 4710} {"train_loss": -26.499774932861328, "global_step": 390995, "epoch": 4710} {"train_loss": -26.18482780456543, "global_step": 390996, "epoch": 4710} {"train_loss": -25.785781860351562, "global_step": 390997, "epoch": 4710} {"train_loss": -26.04790687561035, "global_step": 390998, "epoch": 4710} {"train_loss": -26.512393951416016, "global_step": 390999, "epoch": 4710} {"train_loss": -26.3371639251709, "global_step": 391000, "epoch": 4710} {"train_loss": -25.997467041015625, "global_step": 391001, "epoch": 4710} {"train_loss": -26.242338180541992, "global_step": 391002, "epoch": 4710} {"train_loss": -26.557647705078125, "global_step": 391003, "epoch": 4710} {"train_loss": -26.192779541015625, "global_step": 391004, "epoch": 4710} {"train_loss": -26.02957534790039, "global_step": 391005, "epoch": 4710} {"train_loss": -26.79947280883789, "global_step": 391006, "epoch": 4710} {"train_loss": -26.24252700805664, "global_step": 391007, "epoch": 4710} {"train_loss": -26.164199829101562, "global_step": 391008, "epoch": 4710} {"train_loss": -25.843597412109375, "global_step": 391009, "epoch": 4710} {"train_loss": -26.23494529724121, "global_step": 391010, "epoch": 4710} {"train_loss": -26.50322914123535, "global_step": 391011, "epoch": 4710} {"train_loss": -26.357085836939063, "global_step": 391012, "epoch": 4710, "val_loss": 6477304.5} {"train_loss": -26.255224227905273, "global_step": 391013, "epoch": 4711} {"train_loss": -25.817182540893555, "global_step": 391014, "epoch": 4711} {"train_loss": -25.50376319885254, "global_step": 391015, "epoch": 4711} {"train_loss": -25.455204010009766, "global_step": 391016, "epoch": 4711} {"train_loss": -25.93572998046875, "global_step": 391017, "epoch": 4711} {"train_loss": -25.76771354675293, "global_step": 391018, "epoch": 4711} {"train_loss": -25.849170684814453, "global_step": 391019, "epoch": 4711} {"train_loss": -26.015302658081055, "global_step": 391020, "epoch": 4711} {"train_loss": -25.74307632446289, "global_step": 391021, "epoch": 4711} {"train_loss": -25.632822036743164, "global_step": 391022, "epoch": 4711} {"train_loss": -25.63538932800293, "global_step": 391023, "epoch": 4711} {"train_loss": -25.761550903320312, "global_step": 391024, "epoch": 4711} {"train_loss": -26.170705795288086, "global_step": 391025, "epoch": 4711} {"train_loss": -26.2066707611084, "global_step": 391026, "epoch": 4711} {"train_loss": -26.180606842041016, "global_step": 391027, "epoch": 4711} {"train_loss": -26.2323055267334, "global_step": 391028, "epoch": 4711} {"train_loss": -25.887985229492188, "global_step": 391029, "epoch": 4711} {"train_loss": -26.44085693359375, "global_step": 391030, "epoch": 4711} {"train_loss": -26.570287704467773, "global_step": 391031, "epoch": 4711} {"train_loss": -26.441699981689453, "global_step": 391032, "epoch": 4711} {"train_loss": -26.605009078979492, "global_step": 391033, "epoch": 4711} {"train_loss": -25.959217071533203, "global_step": 391034, "epoch": 4711} {"train_loss": -26.64798927307129, "global_step": 391035, "epoch": 4711} {"train_loss": -26.588134765625, "global_step": 391036, "epoch": 4711} {"train_loss": -26.550867080688477, "global_step": 391037, "epoch": 4711} {"train_loss": -26.437719345092773, "global_step": 391038, "epoch": 4711} {"train_loss": -26.484207153320312, "global_step": 391039, "epoch": 4711} {"train_loss": -26.39995765686035, "global_step": 391040, "epoch": 4711} {"train_loss": -26.671253204345703, "global_step": 391041, "epoch": 4711} {"train_loss": -26.307453155517578, "global_step": 391042, "epoch": 4711} {"train_loss": -26.688146591186523, "global_step": 391043, "epoch": 4711} {"train_loss": -26.725433349609375, "global_step": 391044, "epoch": 4711} {"train_loss": -26.738845825195312, "global_step": 391045, "epoch": 4711} {"train_loss": -26.743927001953125, "global_step": 391046, "epoch": 4711} {"train_loss": -26.623340606689453, "global_step": 391047, "epoch": 4711} {"train_loss": -26.608434677124023, "global_step": 391048, "epoch": 4711} {"train_loss": -26.65724754333496, "global_step": 391049, "epoch": 4711} {"train_loss": -26.687612533569336, "global_step": 391050, "epoch": 4711} {"train_loss": -26.665481567382812, "global_step": 391051, "epoch": 4711} {"train_loss": -26.6323184967041, "global_step": 391052, "epoch": 4711} {"train_loss": -27.181812286376953, "global_step": 391053, "epoch": 4711} {"train_loss": -26.830463409423828, "global_step": 391054, "epoch": 4711} {"train_loss": -26.548322677612305, "global_step": 391055, "epoch": 4711} {"train_loss": -27.17982292175293, "global_step": 391056, "epoch": 4711} {"train_loss": -26.5930118560791, "global_step": 391057, "epoch": 4711} {"train_loss": -26.834821701049805, "global_step": 391058, "epoch": 4711} {"train_loss": -26.765979766845703, "global_step": 391059, "epoch": 4711} {"train_loss": -26.765796661376953, "global_step": 391060, "epoch": 4711} {"train_loss": -26.947248458862305, "global_step": 391061, "epoch": 4711} {"train_loss": -26.537145614624023, "global_step": 391062, "epoch": 4711} {"train_loss": -26.782520294189453, "global_step": 391063, "epoch": 4711} {"train_loss": -26.594160079956055, "global_step": 391064, "epoch": 4711} {"train_loss": -26.78179931640625, "global_step": 391065, "epoch": 4711} {"train_loss": -26.5686092376709, "global_step": 391066, "epoch": 4711} {"train_loss": -26.612043380737305, "global_step": 391067, "epoch": 4711} {"train_loss": -25.969274520874023, "global_step": 391068, "epoch": 4711} {"train_loss": -25.856037139892578, "global_step": 391069, "epoch": 4711} {"train_loss": -26.62940788269043, "global_step": 391070, "epoch": 4711} {"train_loss": -26.275903701782227, "global_step": 391071, "epoch": 4711} {"train_loss": -26.413354873657227, "global_step": 391072, "epoch": 4711} {"train_loss": -26.184234619140625, "global_step": 391073, "epoch": 4711} {"train_loss": -26.0345401763916, "global_step": 391074, "epoch": 4711} {"train_loss": -26.426055908203125, "global_step": 391075, "epoch": 4711} {"train_loss": -26.140356063842773, "global_step": 391076, "epoch": 4711} {"train_loss": -26.34552001953125, "global_step": 391077, "epoch": 4711} {"train_loss": -26.01639747619629, "global_step": 391078, "epoch": 4711} {"train_loss": -26.62774658203125, "global_step": 391079, "epoch": 4711} {"train_loss": -26.19927978515625, "global_step": 391080, "epoch": 4711} {"train_loss": -26.36091423034668, "global_step": 391081, "epoch": 4711} {"train_loss": -26.59663963317871, "global_step": 391082, "epoch": 4711} {"train_loss": -26.71536636352539, "global_step": 391083, "epoch": 4711} {"train_loss": -26.345203399658203, "global_step": 391084, "epoch": 4711} {"train_loss": -26.62497901916504, "global_step": 391085, "epoch": 4711} {"train_loss": -26.451215744018555, "global_step": 391086, "epoch": 4711} {"train_loss": -26.39857292175293, "global_step": 391087, "epoch": 4711} {"train_loss": -26.579248428344727, "global_step": 391088, "epoch": 4711} {"train_loss": -26.416351318359375, "global_step": 391089, "epoch": 4711} {"train_loss": -26.384275436401367, "global_step": 391090, "epoch": 4711} {"train_loss": -26.45180320739746, "global_step": 391091, "epoch": 4711} {"train_loss": -26.153711318969727, "global_step": 391092, "epoch": 4711} {"train_loss": -26.32672691345215, "global_step": 391093, "epoch": 4711} {"train_loss": -26.208484649658203, "global_step": 391094, "epoch": 4711} {"train_loss": -26.373194706009095, "global_step": 391095, "epoch": 4711, "val_loss": 6537505.0} {"train_loss": -25.087249755859375, "global_step": 391096, "epoch": 4712} {"train_loss": -24.845413208007812, "global_step": 391097, "epoch": 4712} {"train_loss": -26.257720947265625, "global_step": 391098, "epoch": 4712} {"train_loss": -26.022541046142578, "global_step": 391099, "epoch": 4712} {"train_loss": -25.438491821289062, "global_step": 391100, "epoch": 4712} {"train_loss": -26.613061904907227, "global_step": 391101, "epoch": 4712} {"train_loss": -26.10603141784668, "global_step": 391102, "epoch": 4712} {"train_loss": -26.030466079711914, "global_step": 391103, "epoch": 4712} {"train_loss": -26.263227462768555, "global_step": 391104, "epoch": 4712} {"train_loss": -25.988386154174805, "global_step": 391105, "epoch": 4712} {"train_loss": -26.080087661743164, "global_step": 391106, "epoch": 4712} {"train_loss": -26.11355972290039, "global_step": 391107, "epoch": 4712} {"train_loss": -26.409748077392578, "global_step": 391108, "epoch": 4712} {"train_loss": -25.734296798706055, "global_step": 391109, "epoch": 4712} {"train_loss": -26.546537399291992, "global_step": 391110, "epoch": 4712} {"train_loss": -26.473485946655273, "global_step": 391111, "epoch": 4712} {"train_loss": -26.53888511657715, "global_step": 391112, "epoch": 4712} {"train_loss": -26.147125244140625, "global_step": 391113, "epoch": 4712} {"train_loss": -26.439443588256836, "global_step": 391114, "epoch": 4712} {"train_loss": -26.303396224975586, "global_step": 391115, "epoch": 4712} {"train_loss": -26.56060218811035, "global_step": 391116, "epoch": 4712} {"train_loss": -26.4744815826416, "global_step": 391117, "epoch": 4712} {"train_loss": -26.1850643157959, "global_step": 391118, "epoch": 4712} {"train_loss": -25.936939239501953, "global_step": 391119, "epoch": 4712} {"train_loss": -26.9747257232666, "global_step": 391120, "epoch": 4712} {"train_loss": -26.307416915893555, "global_step": 391121, "epoch": 4712} {"train_loss": -26.764114379882812, "global_step": 391122, "epoch": 4712} {"train_loss": -26.2994384765625, "global_step": 391123, "epoch": 4712} {"train_loss": -26.77430534362793, "global_step": 391124, "epoch": 4712} {"train_loss": -26.46259117126465, "global_step": 391125, "epoch": 4712} {"train_loss": -26.4703426361084, "global_step": 391126, "epoch": 4712} {"train_loss": -26.611907958984375, "global_step": 391127, "epoch": 4712} {"train_loss": -26.151519775390625, "global_step": 391128, "epoch": 4712} {"train_loss": -26.596479415893555, "global_step": 391129, "epoch": 4712} {"train_loss": -26.512434005737305, "global_step": 391130, "epoch": 4712} {"train_loss": -26.5794620513916, "global_step": 391131, "epoch": 4712} {"train_loss": -26.78460693359375, "global_step": 391132, "epoch": 4712} {"train_loss": -26.72768211364746, "global_step": 391133, "epoch": 4712} {"train_loss": -26.130075454711914, "global_step": 391134, "epoch": 4712} {"train_loss": -26.7186279296875, "global_step": 391135, "epoch": 4712} {"train_loss": -26.127079010009766, "global_step": 391136, "epoch": 4712} {"train_loss": -26.046039581298828, "global_step": 391137, "epoch": 4712} {"train_loss": -26.640090942382812, "global_step": 391138, "epoch": 4712} {"train_loss": -26.566389083862305, "global_step": 391139, "epoch": 4712} {"train_loss": -26.568653106689453, "global_step": 391140, "epoch": 4712} {"train_loss": -26.235248565673828, "global_step": 391141, "epoch": 4712} {"train_loss": -26.343250274658203, "global_step": 391142, "epoch": 4712} {"train_loss": -26.371524810791016, "global_step": 391143, "epoch": 4712} {"train_loss": -26.40229606628418, "global_step": 391144, "epoch": 4712} {"train_loss": -26.381683349609375, "global_step": 391145, "epoch": 4712} {"train_loss": -26.628559112548828, "global_step": 391146, "epoch": 4712} {"train_loss": -26.403100967407227, "global_step": 391147, "epoch": 4712} {"train_loss": -25.789472579956055, "global_step": 391148, "epoch": 4712} {"train_loss": -26.299848556518555, "global_step": 391149, "epoch": 4712} {"train_loss": -26.127004623413086, "global_step": 391150, "epoch": 4712} {"train_loss": -26.293109893798828, "global_step": 391151, "epoch": 4712} {"train_loss": -26.21087646484375, "global_step": 391152, "epoch": 4712} {"train_loss": -26.32366371154785, "global_step": 391153, "epoch": 4712} {"train_loss": -26.323694229125977, "global_step": 391154, "epoch": 4712} {"train_loss": -26.620344161987305, "global_step": 391155, "epoch": 4712} {"train_loss": -26.820215225219727, "global_step": 391156, "epoch": 4712} {"train_loss": -26.709705352783203, "global_step": 391157, "epoch": 4712} {"train_loss": -26.734027862548828, "global_step": 391158, "epoch": 4712} {"train_loss": -26.41371726989746, "global_step": 391159, "epoch": 4712} {"train_loss": -26.35178565979004, "global_step": 391160, "epoch": 4712} {"train_loss": -26.45760154724121, "global_step": 391161, "epoch": 4712} {"train_loss": -26.315906524658203, "global_step": 391162, "epoch": 4712} {"train_loss": -26.347888946533203, "global_step": 391163, "epoch": 4712} {"train_loss": -26.163330078125, "global_step": 391164, "epoch": 4712} {"train_loss": -25.798477172851562, "global_step": 391165, "epoch": 4712} {"train_loss": -26.488264083862305, "global_step": 391166, "epoch": 4712} {"train_loss": -26.642728805541992, "global_step": 391167, "epoch": 4712} {"train_loss": -25.669010162353516, "global_step": 391168, "epoch": 4712} {"train_loss": -26.263219833374023, "global_step": 391169, "epoch": 4712} {"train_loss": -26.340627670288086, "global_step": 391170, "epoch": 4712} {"train_loss": -26.29816246032715, "global_step": 391171, "epoch": 4712} {"train_loss": -26.38984489440918, "global_step": 391172, "epoch": 4712} {"train_loss": -26.5432186126709, "global_step": 391173, "epoch": 4712} {"train_loss": -26.410146713256836, "global_step": 391174, "epoch": 4712} {"train_loss": -26.620868682861328, "global_step": 391175, "epoch": 4712} {"train_loss": -26.181753158569336, "global_step": 391176, "epoch": 4712} {"train_loss": -26.590063095092773, "global_step": 391177, "epoch": 4712} {"train_loss": -26.330270100788898, "global_step": 391178, "epoch": 4712, "val_loss": 6609245.5} {"train_loss": -25.689178466796875, "global_step": 391179, "epoch": 4713} {"train_loss": -26.191457748413086, "global_step": 391180, "epoch": 4713} {"train_loss": -26.02276039123535, "global_step": 391181, "epoch": 4713} {"train_loss": -26.742279052734375, "global_step": 391182, "epoch": 4713} {"train_loss": -26.311838150024414, "global_step": 391183, "epoch": 4713} {"train_loss": -26.96388053894043, "global_step": 391184, "epoch": 4713} {"train_loss": -26.251087188720703, "global_step": 391185, "epoch": 4713} {"train_loss": -26.495513916015625, "global_step": 391186, "epoch": 4713} {"train_loss": -26.649890899658203, "global_step": 391187, "epoch": 4713} {"train_loss": -26.411985397338867, "global_step": 391188, "epoch": 4713} {"train_loss": -26.691028594970703, "global_step": 391189, "epoch": 4713} {"train_loss": -26.723764419555664, "global_step": 391190, "epoch": 4713} {"train_loss": -26.083740234375, "global_step": 391191, "epoch": 4713} {"train_loss": -26.631946563720703, "global_step": 391192, "epoch": 4713} {"train_loss": -26.55317497253418, "global_step": 391193, "epoch": 4713} {"train_loss": -26.554718017578125, "global_step": 391194, "epoch": 4713} {"train_loss": -26.536725997924805, "global_step": 391195, "epoch": 4713} {"train_loss": -26.7091064453125, "global_step": 391196, "epoch": 4713} {"train_loss": -26.527502059936523, "global_step": 391197, "epoch": 4713} {"train_loss": -26.514631271362305, "global_step": 391198, "epoch": 4713} {"train_loss": -26.493024826049805, "global_step": 391199, "epoch": 4713} {"train_loss": -26.905414581298828, "global_step": 391200, "epoch": 4713} {"train_loss": -26.5720157623291, "global_step": 391201, "epoch": 4713} {"train_loss": -26.637928009033203, "global_step": 391202, "epoch": 4713} {"train_loss": -26.857227325439453, "global_step": 391203, "epoch": 4713} {"train_loss": -26.7883358001709, "global_step": 391204, "epoch": 4713} {"train_loss": -26.257526397705078, "global_step": 391205, "epoch": 4713} {"train_loss": -26.64837646484375, "global_step": 391206, "epoch": 4713} {"train_loss": -26.607513427734375, "global_step": 391207, "epoch": 4713} {"train_loss": -26.324148178100586, "global_step": 391208, "epoch": 4713} {"train_loss": -26.411884307861328, "global_step": 391209, "epoch": 4713} {"train_loss": -26.560880661010742, "global_step": 391210, "epoch": 4713} {"train_loss": -26.388818740844727, "global_step": 391211, "epoch": 4713} {"train_loss": -26.015167236328125, "global_step": 391212, "epoch": 4713} {"train_loss": -26.43344497680664, "global_step": 391213, "epoch": 4713} {"train_loss": -26.243005752563477, "global_step": 391214, "epoch": 4713} {"train_loss": -26.14181900024414, "global_step": 391215, "epoch": 4713} {"train_loss": -26.26163101196289, "global_step": 391216, "epoch": 4713} {"train_loss": -25.856842041015625, "global_step": 391217, "epoch": 4713} {"train_loss": -26.6483097076416, "global_step": 391218, "epoch": 4713} {"train_loss": -26.042499542236328, "global_step": 391219, "epoch": 4713} {"train_loss": -26.126571655273438, "global_step": 391220, "epoch": 4713} {"train_loss": -26.282562255859375, "global_step": 391221, "epoch": 4713} {"train_loss": -26.171110153198242, "global_step": 391222, "epoch": 4713} {"train_loss": -25.947011947631836, "global_step": 391223, "epoch": 4713} {"train_loss": -26.434070587158203, "global_step": 391224, "epoch": 4713} {"train_loss": -26.654993057250977, "global_step": 391225, "epoch": 4713} {"train_loss": -26.327421188354492, "global_step": 391226, "epoch": 4713} {"train_loss": -26.207971572875977, "global_step": 391227, "epoch": 4713} {"train_loss": -26.051502227783203, "global_step": 391228, "epoch": 4713} {"train_loss": -26.339590072631836, "global_step": 391229, "epoch": 4713} {"train_loss": -26.72272300720215, "global_step": 391230, "epoch": 4713} {"train_loss": -26.167449951171875, "global_step": 391231, "epoch": 4713} {"train_loss": -26.5184383392334, "global_step": 391232, "epoch": 4713} {"train_loss": -26.47629165649414, "global_step": 391233, "epoch": 4713} {"train_loss": -26.56229019165039, "global_step": 391234, "epoch": 4713} {"train_loss": -26.098464965820312, "global_step": 391235, "epoch": 4713} {"train_loss": -26.565906524658203, "global_step": 391236, "epoch": 4713} {"train_loss": -26.49091911315918, "global_step": 391237, "epoch": 4713} {"train_loss": -26.848651885986328, "global_step": 391238, "epoch": 4713} {"train_loss": -26.72256851196289, "global_step": 391239, "epoch": 4713} {"train_loss": -26.37945556640625, "global_step": 391240, "epoch": 4713} {"train_loss": -26.973901748657227, "global_step": 391241, "epoch": 4713} {"train_loss": -26.237812042236328, "global_step": 391242, "epoch": 4713} {"train_loss": -26.46152114868164, "global_step": 391243, "epoch": 4713} {"train_loss": -26.50615882873535, "global_step": 391244, "epoch": 4713} {"train_loss": -26.662755966186523, "global_step": 391245, "epoch": 4713} {"train_loss": -26.747480392456055, "global_step": 391246, "epoch": 4713} {"train_loss": -26.142200469970703, "global_step": 391247, "epoch": 4713} {"train_loss": -26.5073299407959, "global_step": 391248, "epoch": 4713} {"train_loss": -26.641876220703125, "global_step": 391249, "epoch": 4713} {"train_loss": -26.65252113342285, "global_step": 391250, "epoch": 4713} {"train_loss": -26.88730239868164, "global_step": 391251, "epoch": 4713} {"train_loss": -26.657629013061523, "global_step": 391252, "epoch": 4713} {"train_loss": -26.150470733642578, "global_step": 391253, "epoch": 4713} {"train_loss": -26.8142032623291, "global_step": 391254, "epoch": 4713} {"train_loss": -26.428796768188477, "global_step": 391255, "epoch": 4713} {"train_loss": -26.784738540649414, "global_step": 391256, "epoch": 4713} {"train_loss": -26.748077392578125, "global_step": 391257, "epoch": 4713} {"train_loss": -26.791873931884766, "global_step": 391258, "epoch": 4713} {"train_loss": -26.668500900268555, "global_step": 391259, "epoch": 4713} {"train_loss": -26.81697654724121, "global_step": 391260, "epoch": 4713} {"train_loss": -26.442273909787097, "global_step": 391261, "epoch": 4713, "val_loss": 6588589.0} {"train_loss": -26.496129989624023, "global_step": 391262, "epoch": 4714} {"train_loss": -25.533952713012695, "global_step": 391263, "epoch": 4714} {"train_loss": -25.753442764282227, "global_step": 391264, "epoch": 4714} {"train_loss": -25.8221492767334, "global_step": 391265, "epoch": 4714} {"train_loss": -25.828460693359375, "global_step": 391266, "epoch": 4714} {"train_loss": -25.5411319732666, "global_step": 391267, "epoch": 4714} {"train_loss": -25.380002975463867, "global_step": 391268, "epoch": 4714} {"train_loss": -25.331541061401367, "global_step": 391269, "epoch": 4714} {"train_loss": -25.945545196533203, "global_step": 391270, "epoch": 4714} {"train_loss": -25.93198013305664, "global_step": 391271, "epoch": 4714} {"train_loss": -25.901203155517578, "global_step": 391272, "epoch": 4714} {"train_loss": -25.899337768554688, "global_step": 391273, "epoch": 4714} {"train_loss": -26.0205078125, "global_step": 391274, "epoch": 4714} {"train_loss": -25.787677764892578, "global_step": 391275, "epoch": 4714} {"train_loss": -26.356637954711914, "global_step": 391276, "epoch": 4714} {"train_loss": -25.858020782470703, "global_step": 391277, "epoch": 4714} {"train_loss": -26.011449813842773, "global_step": 391278, "epoch": 4714} {"train_loss": -26.279905319213867, "global_step": 391279, "epoch": 4714} {"train_loss": -26.149572372436523, "global_step": 391280, "epoch": 4714} {"train_loss": -26.16705322265625, "global_step": 391281, "epoch": 4714} {"train_loss": -26.273725509643555, "global_step": 391282, "epoch": 4714} {"train_loss": -26.341352462768555, "global_step": 391283, "epoch": 4714} {"train_loss": -26.2974796295166, "global_step": 391284, "epoch": 4714} {"train_loss": -26.309661865234375, "global_step": 391285, "epoch": 4714} {"train_loss": -26.40715980529785, "global_step": 391286, "epoch": 4714} {"train_loss": -26.308364868164062, "global_step": 391287, "epoch": 4714} {"train_loss": -26.332366943359375, "global_step": 391288, "epoch": 4714} {"train_loss": -26.454547882080078, "global_step": 391289, "epoch": 4714} {"train_loss": -26.564884185791016, "global_step": 391290, "epoch": 4714} {"train_loss": -26.953475952148438, "global_step": 391291, "epoch": 4714} {"train_loss": -26.73089027404785, "global_step": 391292, "epoch": 4714} {"train_loss": -26.630233764648438, "global_step": 391293, "epoch": 4714} {"train_loss": -26.789031982421875, "global_step": 391294, "epoch": 4714} {"train_loss": -26.337888717651367, "global_step": 391295, "epoch": 4714} {"train_loss": -26.770776748657227, "global_step": 391296, "epoch": 4714} {"train_loss": -26.25153160095215, "global_step": 391297, "epoch": 4714} {"train_loss": -26.786725997924805, "global_step": 391298, "epoch": 4714} {"train_loss": -26.627344131469727, "global_step": 391299, "epoch": 4714} {"train_loss": -26.82618522644043, "global_step": 391300, "epoch": 4714} {"train_loss": -26.135059356689453, "global_step": 391301, "epoch": 4714} {"train_loss": -26.553028106689453, "global_step": 391302, "epoch": 4714} {"train_loss": -26.845874786376953, "global_step": 391303, "epoch": 4714} {"train_loss": -26.87039566040039, "global_step": 391304, "epoch": 4714} {"train_loss": -26.891082763671875, "global_step": 391305, "epoch": 4714} {"train_loss": -26.443017959594727, "global_step": 391306, "epoch": 4714} {"train_loss": -26.790063858032227, "global_step": 391307, "epoch": 4714} {"train_loss": -26.48225975036621, "global_step": 391308, "epoch": 4714} {"train_loss": -26.474023818969727, "global_step": 391309, "epoch": 4714} {"train_loss": -26.896493911743164, "global_step": 391310, "epoch": 4714} {"train_loss": -26.718017578125, "global_step": 391311, "epoch": 4714} {"train_loss": -26.836124420166016, "global_step": 391312, "epoch": 4714} {"train_loss": -26.684162139892578, "global_step": 391313, "epoch": 4714} {"train_loss": -26.9970760345459, "global_step": 391314, "epoch": 4714} {"train_loss": -26.908430099487305, "global_step": 391315, "epoch": 4714} {"train_loss": -26.899072647094727, "global_step": 391316, "epoch": 4714} {"train_loss": -26.938352584838867, "global_step": 391317, "epoch": 4714} {"train_loss": -26.902448654174805, "global_step": 391318, "epoch": 4714} {"train_loss": -26.77597999572754, "global_step": 391319, "epoch": 4714} {"train_loss": -26.633056640625, "global_step": 391320, "epoch": 4714} {"train_loss": -26.260833740234375, "global_step": 391321, "epoch": 4714} {"train_loss": -26.54184913635254, "global_step": 391322, "epoch": 4714} {"train_loss": -26.781217575073242, "global_step": 391323, "epoch": 4714} {"train_loss": -26.530317306518555, "global_step": 391324, "epoch": 4714} {"train_loss": -26.402509689331055, "global_step": 391325, "epoch": 4714} {"train_loss": -26.829877853393555, "global_step": 391326, "epoch": 4714} {"train_loss": -26.477191925048828, "global_step": 391327, "epoch": 4714} {"train_loss": -26.687896728515625, "global_step": 391328, "epoch": 4714} {"train_loss": -26.001874923706055, "global_step": 391329, "epoch": 4714} {"train_loss": -25.80682373046875, "global_step": 391330, "epoch": 4714} {"train_loss": -25.624975204467773, "global_step": 391331, "epoch": 4714} {"train_loss": -26.35224723815918, "global_step": 391332, "epoch": 4714} {"train_loss": -26.167160034179688, "global_step": 391333, "epoch": 4714} {"train_loss": -26.354049682617188, "global_step": 391334, "epoch": 4714} {"train_loss": -26.011341094970703, "global_step": 391335, "epoch": 4714} {"train_loss": -26.007062911987305, "global_step": 391336, "epoch": 4714} {"train_loss": -26.297239303588867, "global_step": 391337, "epoch": 4714} {"train_loss": -26.31570816040039, "global_step": 391338, "epoch": 4714} {"train_loss": -26.44911003112793, "global_step": 391339, "epoch": 4714} {"train_loss": -26.36322021484375, "global_step": 391340, "epoch": 4714} {"train_loss": -26.771747589111328, "global_step": 391341, "epoch": 4714} {"train_loss": -26.35009765625, "global_step": 391342, "epoch": 4714} {"train_loss": -26.296283721923828, "global_step": 391343, "epoch": 4714} {"train_loss": -26.36559881646949, "global_step": 391344, "epoch": 4714, "val_loss": 6537091.0} {"train_loss": -26.027679443359375, "global_step": 391345, "epoch": 4715} {"train_loss": -25.95197868347168, "global_step": 391346, "epoch": 4715} {"train_loss": -25.971582412719727, "global_step": 391347, "epoch": 4715} {"train_loss": -26.14032554626465, "global_step": 391348, "epoch": 4715} {"train_loss": -26.331787109375, "global_step": 391349, "epoch": 4715} {"train_loss": -25.8250789642334, "global_step": 391350, "epoch": 4715} {"train_loss": -26.157428741455078, "global_step": 391351, "epoch": 4715} {"train_loss": -26.3431339263916, "global_step": 391352, "epoch": 4715} {"train_loss": -26.333337783813477, "global_step": 391353, "epoch": 4715} {"train_loss": -26.5640811920166, "global_step": 391354, "epoch": 4715} {"train_loss": -26.449817657470703, "global_step": 391355, "epoch": 4715} {"train_loss": -25.92283058166504, "global_step": 391356, "epoch": 4715} {"train_loss": -26.13355827331543, "global_step": 391357, "epoch": 4715} {"train_loss": -26.179288864135742, "global_step": 391358, "epoch": 4715} {"train_loss": -25.869003295898438, "global_step": 391359, "epoch": 4715} {"train_loss": -26.129837036132812, "global_step": 391360, "epoch": 4715} {"train_loss": -26.3436279296875, "global_step": 391361, "epoch": 4715} {"train_loss": -26.56900978088379, "global_step": 391362, "epoch": 4715} {"train_loss": -25.980487823486328, "global_step": 391363, "epoch": 4715} {"train_loss": -26.485605239868164, "global_step": 391364, "epoch": 4715} {"train_loss": -26.32435417175293, "global_step": 391365, "epoch": 4715} {"train_loss": -26.39475440979004, "global_step": 391366, "epoch": 4715} {"train_loss": -26.599756240844727, "global_step": 391367, "epoch": 4715} {"train_loss": -26.333337783813477, "global_step": 391368, "epoch": 4715} {"train_loss": -26.63576316833496, "global_step": 391369, "epoch": 4715} {"train_loss": -26.564777374267578, "global_step": 391370, "epoch": 4715} {"train_loss": -26.31159019470215, "global_step": 391371, "epoch": 4715} {"train_loss": -26.2712345123291, "global_step": 391372, "epoch": 4715} {"train_loss": -26.458845138549805, "global_step": 391373, "epoch": 4715} {"train_loss": -26.577301025390625, "global_step": 391374, "epoch": 4715} {"train_loss": -26.5699462890625, "global_step": 391375, "epoch": 4715} {"train_loss": -26.6785831451416, "global_step": 391376, "epoch": 4715} {"train_loss": -26.68768882751465, "global_step": 391377, "epoch": 4715} {"train_loss": -26.813413619995117, "global_step": 391378, "epoch": 4715} {"train_loss": -26.39948081970215, "global_step": 391379, "epoch": 4715} {"train_loss": -26.81633949279785, "global_step": 391380, "epoch": 4715} {"train_loss": -26.201330184936523, "global_step": 391381, "epoch": 4715} {"train_loss": -26.703454971313477, "global_step": 391382, "epoch": 4715} {"train_loss": -26.513813018798828, "global_step": 391383, "epoch": 4715} {"train_loss": -26.405195236206055, "global_step": 391384, "epoch": 4715} {"train_loss": -26.874876022338867, "global_step": 391385, "epoch": 4715} {"train_loss": -26.602319717407227, "global_step": 391386, "epoch": 4715} {"train_loss": -26.397109985351562, "global_step": 391387, "epoch": 4715} {"train_loss": -26.67473793029785, "global_step": 391388, "epoch": 4715} {"train_loss": -26.672088623046875, "global_step": 391389, "epoch": 4715} {"train_loss": -26.50992774963379, "global_step": 391390, "epoch": 4715} {"train_loss": -26.47637939453125, "global_step": 391391, "epoch": 4715} {"train_loss": -26.868000030517578, "global_step": 391392, "epoch": 4715} {"train_loss": -26.835874557495117, "global_step": 391393, "epoch": 4715} {"train_loss": -27.132184982299805, "global_step": 391394, "epoch": 4715} {"train_loss": -26.57421875, "global_step": 391395, "epoch": 4715} {"train_loss": -26.540006637573242, "global_step": 391396, "epoch": 4715} {"train_loss": -26.508569717407227, "global_step": 391397, "epoch": 4715} {"train_loss": -26.720518112182617, "global_step": 391398, "epoch": 4715} {"train_loss": -26.554290771484375, "global_step": 391399, "epoch": 4715} {"train_loss": -26.558332443237305, "global_step": 391400, "epoch": 4715} {"train_loss": -27.113040924072266, "global_step": 391401, "epoch": 4715} {"train_loss": -26.987552642822266, "global_step": 391402, "epoch": 4715} {"train_loss": -26.5841007232666, "global_step": 391403, "epoch": 4715} {"train_loss": -26.770526885986328, "global_step": 391404, "epoch": 4715} {"train_loss": -26.75874137878418, "global_step": 391405, "epoch": 4715} {"train_loss": -26.58121681213379, "global_step": 391406, "epoch": 4715} {"train_loss": -26.874719619750977, "global_step": 391407, "epoch": 4715} {"train_loss": -26.77678871154785, "global_step": 391408, "epoch": 4715} {"train_loss": -26.490142822265625, "global_step": 391409, "epoch": 4715} {"train_loss": -26.59088134765625, "global_step": 391410, "epoch": 4715} {"train_loss": -26.510236740112305, "global_step": 391411, "epoch": 4715} {"train_loss": -26.71009635925293, "global_step": 391412, "epoch": 4715} {"train_loss": -26.40421485900879, "global_step": 391413, "epoch": 4715} {"train_loss": -26.489139556884766, "global_step": 391414, "epoch": 4715} {"train_loss": -26.2581787109375, "global_step": 391415, "epoch": 4715} {"train_loss": -26.394392013549805, "global_step": 391416, "epoch": 4715} {"train_loss": -26.64666748046875, "global_step": 391417, "epoch": 4715} {"train_loss": -26.52985954284668, "global_step": 391418, "epoch": 4715} {"train_loss": -26.261474609375, "global_step": 391419, "epoch": 4715} {"train_loss": -26.537555694580078, "global_step": 391420, "epoch": 4715} {"train_loss": -26.62359619140625, "global_step": 391421, "epoch": 4715} {"train_loss": -26.526248931884766, "global_step": 391422, "epoch": 4715} {"train_loss": -26.4691162109375, "global_step": 391423, "epoch": 4715} {"train_loss": -26.62196159362793, "global_step": 391424, "epoch": 4715} {"train_loss": -26.447004318237305, "global_step": 391425, "epoch": 4715} {"train_loss": -26.62775993347168, "global_step": 391426, "epoch": 4715} {"train_loss": -26.498148033417852, "global_step": 391427, "epoch": 4715, "val_loss": 6596400.0} {"train_loss": -25.00306510925293, "global_step": 391428, "epoch": 4716} {"train_loss": -23.729047775268555, "global_step": 391429, "epoch": 4716} {"train_loss": -25.3597412109375, "global_step": 391430, "epoch": 4716} {"train_loss": -25.083328247070312, "global_step": 391431, "epoch": 4716} {"train_loss": -23.894458770751953, "global_step": 391432, "epoch": 4716} {"train_loss": -25.612104415893555, "global_step": 391433, "epoch": 4716} {"train_loss": -23.84030532836914, "global_step": 391434, "epoch": 4716} {"train_loss": -25.654699325561523, "global_step": 391435, "epoch": 4716} {"train_loss": -25.091474533081055, "global_step": 391436, "epoch": 4716} {"train_loss": -25.880334854125977, "global_step": 391437, "epoch": 4716} {"train_loss": -25.57236671447754, "global_step": 391438, "epoch": 4716} {"train_loss": -25.443832397460938, "global_step": 391439, "epoch": 4716} {"train_loss": -25.975629806518555, "global_step": 391440, "epoch": 4716} {"train_loss": -25.690778732299805, "global_step": 391441, "epoch": 4716} {"train_loss": -25.92255210876465, "global_step": 391442, "epoch": 4716} {"train_loss": -25.65182876586914, "global_step": 391443, "epoch": 4716} {"train_loss": -25.710412979125977, "global_step": 391444, "epoch": 4716} {"train_loss": -25.985254287719727, "global_step": 391445, "epoch": 4716} {"train_loss": -25.613449096679688, "global_step": 391446, "epoch": 4716} {"train_loss": -26.040990829467773, "global_step": 391447, "epoch": 4716} {"train_loss": -26.003341674804688, "global_step": 391448, "epoch": 4716} {"train_loss": -25.980133056640625, "global_step": 391449, "epoch": 4716} {"train_loss": -25.932050704956055, "global_step": 391450, "epoch": 4716} {"train_loss": -26.22639274597168, "global_step": 391451, "epoch": 4716} {"train_loss": -26.18049430847168, "global_step": 391452, "epoch": 4716} {"train_loss": -26.1014347076416, "global_step": 391453, "epoch": 4716} {"train_loss": -25.914011001586914, "global_step": 391454, "epoch": 4716} {"train_loss": -25.881061553955078, "global_step": 391455, "epoch": 4716} {"train_loss": -26.56159782409668, "global_step": 391456, "epoch": 4716} {"train_loss": -26.508066177368164, "global_step": 391457, "epoch": 4716} {"train_loss": -25.52461051940918, "global_step": 391458, "epoch": 4716} {"train_loss": -25.95758056640625, "global_step": 391459, "epoch": 4716} {"train_loss": -26.531152725219727, "global_step": 391460, "epoch": 4716} {"train_loss": -26.566421508789062, "global_step": 391461, "epoch": 4716} {"train_loss": -26.420698165893555, "global_step": 391462, "epoch": 4716} {"train_loss": -26.3828067779541, "global_step": 391463, "epoch": 4716} {"train_loss": -26.21295166015625, "global_step": 391464, "epoch": 4716} {"train_loss": -26.18829917907715, "global_step": 391465, "epoch": 4716} {"train_loss": -26.656543731689453, "global_step": 391466, "epoch": 4716} {"train_loss": -26.320911407470703, "global_step": 391467, "epoch": 4716} {"train_loss": -26.456268310546875, "global_step": 391468, "epoch": 4716} {"train_loss": -26.23015785217285, "global_step": 391469, "epoch": 4716} {"train_loss": -26.14863395690918, "global_step": 391470, "epoch": 4716} {"train_loss": -26.5809326171875, "global_step": 391471, "epoch": 4716} {"train_loss": -26.774463653564453, "global_step": 391472, "epoch": 4716} {"train_loss": -26.886877059936523, "global_step": 391473, "epoch": 4716} {"train_loss": -26.351715087890625, "global_step": 391474, "epoch": 4716} {"train_loss": -26.70977210998535, "global_step": 391475, "epoch": 4716} {"train_loss": -26.63466453552246, "global_step": 391476, "epoch": 4716} {"train_loss": -26.708677291870117, "global_step": 391477, "epoch": 4716} {"train_loss": -26.840118408203125, "global_step": 391478, "epoch": 4716} {"train_loss": -26.50885009765625, "global_step": 391479, "epoch": 4716} {"train_loss": -26.43930435180664, "global_step": 391480, "epoch": 4716} {"train_loss": -26.526243209838867, "global_step": 391481, "epoch": 4716} {"train_loss": -26.701627731323242, "global_step": 391482, "epoch": 4716} {"train_loss": -26.529220581054688, "global_step": 391483, "epoch": 4716} {"train_loss": -26.95256996154785, "global_step": 391484, "epoch": 4716} {"train_loss": -26.49226188659668, "global_step": 391485, "epoch": 4716} {"train_loss": -26.7622127532959, "global_step": 391486, "epoch": 4716} {"train_loss": -27.017690658569336, "global_step": 391487, "epoch": 4716} {"train_loss": -26.84946060180664, "global_step": 391488, "epoch": 4716} {"train_loss": -26.97757339477539, "global_step": 391489, "epoch": 4716} {"train_loss": -27.122465133666992, "global_step": 391490, "epoch": 4716} {"train_loss": -26.833189010620117, "global_step": 391491, "epoch": 4716} {"train_loss": -26.652780532836914, "global_step": 391492, "epoch": 4716} {"train_loss": -26.404129028320312, "global_step": 391493, "epoch": 4716} {"train_loss": -26.74725341796875, "global_step": 391494, "epoch": 4716} {"train_loss": -26.909006118774414, "global_step": 391495, "epoch": 4716} {"train_loss": -26.44610023498535, "global_step": 391496, "epoch": 4716} {"train_loss": -26.353662490844727, "global_step": 391497, "epoch": 4716} {"train_loss": -26.55970573425293, "global_step": 391498, "epoch": 4716} {"train_loss": -26.921823501586914, "global_step": 391499, "epoch": 4716} {"train_loss": -26.526731491088867, "global_step": 391500, "epoch": 4716} {"train_loss": -26.77461051940918, "global_step": 391501, "epoch": 4716} {"train_loss": -26.674362182617188, "global_step": 391502, "epoch": 4716} {"train_loss": -26.400842666625977, "global_step": 391503, "epoch": 4716} {"train_loss": -26.62531089782715, "global_step": 391504, "epoch": 4716} {"train_loss": -26.641040802001953, "global_step": 391505, "epoch": 4716} {"train_loss": -26.463830947875977, "global_step": 391506, "epoch": 4716} {"train_loss": -26.708906173706055, "global_step": 391507, "epoch": 4716} {"train_loss": -26.893375396728516, "global_step": 391508, "epoch": 4716} {"train_loss": -26.349414825439453, "global_step": 391509, "epoch": 4716} {"train_loss": -26.238040280629352, "global_step": 391510, "epoch": 4716, "val_loss": 6457753.0} {"train_loss": -26.349027633666992, "global_step": 391511, "epoch": 4717} {"train_loss": -26.305057525634766, "global_step": 391512, "epoch": 4717} {"train_loss": -26.123960494995117, "global_step": 391513, "epoch": 4717} {"train_loss": -26.131011962890625, "global_step": 391514, "epoch": 4717} {"train_loss": -25.866256713867188, "global_step": 391515, "epoch": 4717} {"train_loss": -26.027606964111328, "global_step": 391516, "epoch": 4717} {"train_loss": -26.486764907836914, "global_step": 391517, "epoch": 4717} {"train_loss": -26.48394775390625, "global_step": 391518, "epoch": 4717} {"train_loss": -26.73334312438965, "global_step": 391519, "epoch": 4717} {"train_loss": -26.82916259765625, "global_step": 391520, "epoch": 4717} {"train_loss": -26.463647842407227, "global_step": 391521, "epoch": 4717} {"train_loss": -26.44040298461914, "global_step": 391522, "epoch": 4717} {"train_loss": -26.486038208007812, "global_step": 391523, "epoch": 4717} {"train_loss": -26.760730743408203, "global_step": 391524, "epoch": 4717} {"train_loss": -26.6466007232666, "global_step": 391525, "epoch": 4717} {"train_loss": -26.527618408203125, "global_step": 391526, "epoch": 4717} {"train_loss": -26.723764419555664, "global_step": 391527, "epoch": 4717} {"train_loss": -26.73139762878418, "global_step": 391528, "epoch": 4717} {"train_loss": -26.77271842956543, "global_step": 391529, "epoch": 4717} {"train_loss": -26.75052261352539, "global_step": 391530, "epoch": 4717} {"train_loss": -26.3885440826416, "global_step": 391531, "epoch": 4717} {"train_loss": -26.748340606689453, "global_step": 391532, "epoch": 4717} {"train_loss": -26.42616081237793, "global_step": 391533, "epoch": 4717} {"train_loss": -26.675657272338867, "global_step": 391534, "epoch": 4717} {"train_loss": -26.667890548706055, "global_step": 391535, "epoch": 4717} {"train_loss": -26.3926944732666, "global_step": 391536, "epoch": 4717} {"train_loss": -26.5794620513916, "global_step": 391537, "epoch": 4717} {"train_loss": -26.60441017150879, "global_step": 391538, "epoch": 4717} {"train_loss": -26.51189613342285, "global_step": 391539, "epoch": 4717} {"train_loss": -26.7991943359375, "global_step": 391540, "epoch": 4717} {"train_loss": -26.630115509033203, "global_step": 391541, "epoch": 4717} {"train_loss": -26.726119995117188, "global_step": 391542, "epoch": 4717} {"train_loss": -26.735645294189453, "global_step": 391543, "epoch": 4717} {"train_loss": -26.7740535736084, "global_step": 391544, "epoch": 4717} {"train_loss": -26.890405654907227, "global_step": 391545, "epoch": 4717} {"train_loss": -26.26677894592285, "global_step": 391546, "epoch": 4717} {"train_loss": -26.512720108032227, "global_step": 391547, "epoch": 4717} {"train_loss": -26.562164306640625, "global_step": 391548, "epoch": 4717} {"train_loss": -26.61749267578125, "global_step": 391549, "epoch": 4717} {"train_loss": -26.87922477722168, "global_step": 391550, "epoch": 4717} {"train_loss": -26.4569149017334, "global_step": 391551, "epoch": 4717} {"train_loss": -26.6085205078125, "global_step": 391552, "epoch": 4717} {"train_loss": -26.679555892944336, "global_step": 391553, "epoch": 4717} {"train_loss": -26.4000186920166, "global_step": 391554, "epoch": 4717} {"train_loss": -26.397937774658203, "global_step": 391555, "epoch": 4717} {"train_loss": -26.5915584564209, "global_step": 391556, "epoch": 4717} {"train_loss": -26.923002243041992, "global_step": 391557, "epoch": 4717} {"train_loss": -26.38016700744629, "global_step": 391558, "epoch": 4717} {"train_loss": -26.78914451599121, "global_step": 391559, "epoch": 4717} {"train_loss": -26.898584365844727, "global_step": 391560, "epoch": 4717} {"train_loss": -26.51056480407715, "global_step": 391561, "epoch": 4717} {"train_loss": -26.423131942749023, "global_step": 391562, "epoch": 4717} {"train_loss": -26.890989303588867, "global_step": 391563, "epoch": 4717} {"train_loss": -26.557416915893555, "global_step": 391564, "epoch": 4717} {"train_loss": -26.681921005249023, "global_step": 391565, "epoch": 4717} {"train_loss": -26.78084373474121, "global_step": 391566, "epoch": 4717} {"train_loss": -26.558225631713867, "global_step": 391567, "epoch": 4717} {"train_loss": -26.605539321899414, "global_step": 391568, "epoch": 4717} {"train_loss": -26.809438705444336, "global_step": 391569, "epoch": 4717} {"train_loss": -26.244970321655273, "global_step": 391570, "epoch": 4717} {"train_loss": -26.522245407104492, "global_step": 391571, "epoch": 4717} {"train_loss": -25.951745986938477, "global_step": 391572, "epoch": 4717} {"train_loss": -25.328594207763672, "global_step": 391573, "epoch": 4717} {"train_loss": -25.595279693603516, "global_step": 391574, "epoch": 4717} {"train_loss": -26.122400283813477, "global_step": 391575, "epoch": 4717} {"train_loss": -26.28444480895996, "global_step": 391576, "epoch": 4717} {"train_loss": -25.832809448242188, "global_step": 391577, "epoch": 4717} {"train_loss": -25.49558448791504, "global_step": 391578, "epoch": 4717} {"train_loss": -26.2788028717041, "global_step": 391579, "epoch": 4717} {"train_loss": -26.558984756469727, "global_step": 391580, "epoch": 4717} {"train_loss": -25.922321319580078, "global_step": 391581, "epoch": 4717} {"train_loss": -26.501569747924805, "global_step": 391582, "epoch": 4717} {"train_loss": -26.201963424682617, "global_step": 391583, "epoch": 4717} {"train_loss": -26.164838790893555, "global_step": 391584, "epoch": 4717} {"train_loss": -25.855377197265625, "global_step": 391585, "epoch": 4717} {"train_loss": -26.38530921936035, "global_step": 391586, "epoch": 4717} {"train_loss": -26.32850456237793, "global_step": 391587, "epoch": 4717} {"train_loss": -26.193872451782227, "global_step": 391588, "epoch": 4717} {"train_loss": -26.43186378479004, "global_step": 391589, "epoch": 4717} {"train_loss": -26.09635353088379, "global_step": 391590, "epoch": 4717} {"train_loss": -26.30010414123535, "global_step": 391591, "epoch": 4717} {"train_loss": -26.682910919189453, "global_step": 391592, "epoch": 4717} {"train_loss": -26.450866492397815, "global_step": 391593, "epoch": 4717, "val_loss": 6596691.0} {"train_loss": -25.598360061645508, "global_step": 391594, "epoch": 4718} {"train_loss": -25.890335083007812, "global_step": 391595, "epoch": 4718} {"train_loss": -25.487234115600586, "global_step": 391596, "epoch": 4718} {"train_loss": -25.96404457092285, "global_step": 391597, "epoch": 4718} {"train_loss": -25.84527015686035, "global_step": 391598, "epoch": 4718} {"train_loss": -25.8957462310791, "global_step": 391599, "epoch": 4718} {"train_loss": -25.74689292907715, "global_step": 391600, "epoch": 4718} {"train_loss": -25.83430290222168, "global_step": 391601, "epoch": 4718} {"train_loss": -25.831146240234375, "global_step": 391602, "epoch": 4718} {"train_loss": -25.96998405456543, "global_step": 391603, "epoch": 4718} {"train_loss": -26.34585952758789, "global_step": 391604, "epoch": 4718} {"train_loss": -25.97999382019043, "global_step": 391605, "epoch": 4718} {"train_loss": -26.31214714050293, "global_step": 391606, "epoch": 4718} {"train_loss": -26.29681396484375, "global_step": 391607, "epoch": 4718} {"train_loss": -26.329328536987305, "global_step": 391608, "epoch": 4718} {"train_loss": -26.2005672454834, "global_step": 391609, "epoch": 4718} {"train_loss": -26.259607315063477, "global_step": 391610, "epoch": 4718} {"train_loss": -26.225269317626953, "global_step": 391611, "epoch": 4718} {"train_loss": -26.331525802612305, "global_step": 391612, "epoch": 4718} {"train_loss": -26.597253799438477, "global_step": 391613, "epoch": 4718} {"train_loss": -26.041784286499023, "global_step": 391614, "epoch": 4718} {"train_loss": -26.175251007080078, "global_step": 391615, "epoch": 4718} {"train_loss": -26.800729751586914, "global_step": 391616, "epoch": 4718} {"train_loss": -26.424285888671875, "global_step": 391617, "epoch": 4718} {"train_loss": -26.432092666625977, "global_step": 391618, "epoch": 4718} {"train_loss": -26.367704391479492, "global_step": 391619, "epoch": 4718} {"train_loss": -26.5335750579834, "global_step": 391620, "epoch": 4718} {"train_loss": -26.634687423706055, "global_step": 391621, "epoch": 4718} {"train_loss": -26.535364151000977, "global_step": 391622, "epoch": 4718} {"train_loss": -26.29852867126465, "global_step": 391623, "epoch": 4718} {"train_loss": -26.60995864868164, "global_step": 391624, "epoch": 4718} {"train_loss": -26.898792266845703, "global_step": 391625, "epoch": 4718} {"train_loss": -26.45488929748535, "global_step": 391626, "epoch": 4718} {"train_loss": -26.464099884033203, "global_step": 391627, "epoch": 4718} {"train_loss": -26.45684242248535, "global_step": 391628, "epoch": 4718} {"train_loss": -26.585540771484375, "global_step": 391629, "epoch": 4718} {"train_loss": -26.571720123291016, "global_step": 391630, "epoch": 4718} {"train_loss": -26.743040084838867, "global_step": 391631, "epoch": 4718} {"train_loss": -26.630523681640625, "global_step": 391632, "epoch": 4718} {"train_loss": -26.828113555908203, "global_step": 391633, "epoch": 4718} {"train_loss": -26.453174591064453, "global_step": 391634, "epoch": 4718} {"train_loss": -26.38263511657715, "global_step": 391635, "epoch": 4718} {"train_loss": -26.78791618347168, "global_step": 391636, "epoch": 4718} {"train_loss": -27.099353790283203, "global_step": 391637, "epoch": 4718} {"train_loss": -26.49222755432129, "global_step": 391638, "epoch": 4718} {"train_loss": -26.755847930908203, "global_step": 391639, "epoch": 4718} {"train_loss": -27.028656005859375, "global_step": 391640, "epoch": 4718} {"train_loss": -26.61094093322754, "global_step": 391641, "epoch": 4718} {"train_loss": -26.87949562072754, "global_step": 391642, "epoch": 4718} {"train_loss": -26.9324951171875, "global_step": 391643, "epoch": 4718} {"train_loss": -26.463895797729492, "global_step": 391644, "epoch": 4718} {"train_loss": -26.564355850219727, "global_step": 391645, "epoch": 4718} {"train_loss": -26.723438262939453, "global_step": 391646, "epoch": 4718} {"train_loss": -26.834003448486328, "global_step": 391647, "epoch": 4718} {"train_loss": -26.799030303955078, "global_step": 391648, "epoch": 4718} {"train_loss": -26.3731746673584, "global_step": 391649, "epoch": 4718} {"train_loss": -26.825002670288086, "global_step": 391650, "epoch": 4718} {"train_loss": -26.57478904724121, "global_step": 391651, "epoch": 4718} {"train_loss": -26.5388240814209, "global_step": 391652, "epoch": 4718} {"train_loss": -27.054845809936523, "global_step": 391653, "epoch": 4718} {"train_loss": -26.3664493560791, "global_step": 391654, "epoch": 4718} {"train_loss": -26.242767333984375, "global_step": 391655, "epoch": 4718} {"train_loss": -26.798450469970703, "global_step": 391656, "epoch": 4718} {"train_loss": -26.60845375061035, "global_step": 391657, "epoch": 4718} {"train_loss": -26.506244659423828, "global_step": 391658, "epoch": 4718} {"train_loss": -26.14723014831543, "global_step": 391659, "epoch": 4718} {"train_loss": -26.615949630737305, "global_step": 391660, "epoch": 4718} {"train_loss": -26.37952995300293, "global_step": 391661, "epoch": 4718} {"train_loss": -26.101659774780273, "global_step": 391662, "epoch": 4718} {"train_loss": -26.4576416015625, "global_step": 391663, "epoch": 4718} {"train_loss": -26.25348472595215, "global_step": 391664, "epoch": 4718} {"train_loss": -26.59034538269043, "global_step": 391665, "epoch": 4718} {"train_loss": -26.642475128173828, "global_step": 391666, "epoch": 4718} {"train_loss": -26.592498779296875, "global_step": 391667, "epoch": 4718} {"train_loss": -26.766550064086914, "global_step": 391668, "epoch": 4718} {"train_loss": -26.542163848876953, "global_step": 391669, "epoch": 4718} {"train_loss": -26.476593017578125, "global_step": 391670, "epoch": 4718} {"train_loss": -25.98240089416504, "global_step": 391671, "epoch": 4718} {"train_loss": -26.534748077392578, "global_step": 391672, "epoch": 4718} {"train_loss": -26.552001953125, "global_step": 391673, "epoch": 4718} {"train_loss": -26.552473068237305, "global_step": 391674, "epoch": 4718} {"train_loss": -26.628881454467773, "global_step": 391675, "epoch": 4718} {"train_loss": -26.442383524883223, "global_step": 391676, "epoch": 4718, "val_loss": 6604845.0} {"train_loss": -26.253305435180664, "global_step": 391677, "epoch": 4719} {"train_loss": -26.46918296813965, "global_step": 391678, "epoch": 4719} {"train_loss": -26.7219295501709, "global_step": 391679, "epoch": 4719} {"train_loss": -25.816516876220703, "global_step": 391680, "epoch": 4719} {"train_loss": -26.141250610351562, "global_step": 391681, "epoch": 4719} {"train_loss": -26.30108642578125, "global_step": 391682, "epoch": 4719} {"train_loss": -26.347309112548828, "global_step": 391683, "epoch": 4719} {"train_loss": -26.58473014831543, "global_step": 391684, "epoch": 4719} {"train_loss": -26.489347457885742, "global_step": 391685, "epoch": 4719} {"train_loss": -26.28019142150879, "global_step": 391686, "epoch": 4719} {"train_loss": -26.086084365844727, "global_step": 391687, "epoch": 4719} {"train_loss": -26.217477798461914, "global_step": 391688, "epoch": 4719} {"train_loss": -26.419897079467773, "global_step": 391689, "epoch": 4719} {"train_loss": -26.386707305908203, "global_step": 391690, "epoch": 4719} {"train_loss": -26.57258415222168, "global_step": 391691, "epoch": 4719} {"train_loss": -26.147918701171875, "global_step": 391692, "epoch": 4719} {"train_loss": -26.716894149780273, "global_step": 391693, "epoch": 4719} {"train_loss": -26.40357780456543, "global_step": 391694, "epoch": 4719} {"train_loss": -26.375476837158203, "global_step": 391695, "epoch": 4719} {"train_loss": -26.4063720703125, "global_step": 391696, "epoch": 4719} {"train_loss": -26.592182159423828, "global_step": 391697, "epoch": 4719} {"train_loss": -26.18940544128418, "global_step": 391698, "epoch": 4719} {"train_loss": -26.024328231811523, "global_step": 391699, "epoch": 4719} {"train_loss": -26.585773468017578, "global_step": 391700, "epoch": 4719} {"train_loss": -26.298236846923828, "global_step": 391701, "epoch": 4719} {"train_loss": -26.192380905151367, "global_step": 391702, "epoch": 4719} {"train_loss": -26.27634048461914, "global_step": 391703, "epoch": 4719} {"train_loss": -26.427738189697266, "global_step": 391704, "epoch": 4719} {"train_loss": -26.376846313476562, "global_step": 391705, "epoch": 4719} {"train_loss": -26.349807739257812, "global_step": 391706, "epoch": 4719} {"train_loss": -26.335693359375, "global_step": 391707, "epoch": 4719} {"train_loss": -26.418439865112305, "global_step": 391708, "epoch": 4719} {"train_loss": -25.97177505493164, "global_step": 391709, "epoch": 4719} {"train_loss": -26.189579010009766, "global_step": 391710, "epoch": 4719} {"train_loss": -26.340423583984375, "global_step": 391711, "epoch": 4719} {"train_loss": -26.73017692565918, "global_step": 391712, "epoch": 4719} {"train_loss": -26.50223159790039, "global_step": 391713, "epoch": 4719} {"train_loss": -26.910079956054688, "global_step": 391714, "epoch": 4719} {"train_loss": -26.455631256103516, "global_step": 391715, "epoch": 4719} {"train_loss": -26.565235137939453, "global_step": 391716, "epoch": 4719} {"train_loss": -26.639795303344727, "global_step": 391717, "epoch": 4719} {"train_loss": -26.958454132080078, "global_step": 391718, "epoch": 4719} {"train_loss": -26.737157821655273, "global_step": 391719, "epoch": 4719} {"train_loss": -26.6917781829834, "global_step": 391720, "epoch": 4719} {"train_loss": -26.890920639038086, "global_step": 391721, "epoch": 4719} {"train_loss": -26.898513793945312, "global_step": 391722, "epoch": 4719} {"train_loss": -26.849288940429688, "global_step": 391723, "epoch": 4719} {"train_loss": -26.942907333374023, "global_step": 391724, "epoch": 4719} {"train_loss": -26.685232162475586, "global_step": 391725, "epoch": 4719} {"train_loss": -26.95098304748535, "global_step": 391726, "epoch": 4719} {"train_loss": -27.005584716796875, "global_step": 391727, "epoch": 4719} {"train_loss": -26.91523551940918, "global_step": 391728, "epoch": 4719} {"train_loss": -26.772693634033203, "global_step": 391729, "epoch": 4719} {"train_loss": -26.7971134185791, "global_step": 391730, "epoch": 4719} {"train_loss": -26.4467716217041, "global_step": 391731, "epoch": 4719} {"train_loss": -26.67424964904785, "global_step": 391732, "epoch": 4719} {"train_loss": -26.797882080078125, "global_step": 391733, "epoch": 4719} {"train_loss": -26.456668853759766, "global_step": 391734, "epoch": 4719} {"train_loss": -26.438276290893555, "global_step": 391735, "epoch": 4719} {"train_loss": -26.483123779296875, "global_step": 391736, "epoch": 4719} {"train_loss": -26.73089599609375, "global_step": 391737, "epoch": 4719} {"train_loss": -26.798980712890625, "global_step": 391738, "epoch": 4719} {"train_loss": -26.859750747680664, "global_step": 391739, "epoch": 4719} {"train_loss": -26.2208251953125, "global_step": 391740, "epoch": 4719} {"train_loss": -26.293699264526367, "global_step": 391741, "epoch": 4719} {"train_loss": -26.63779640197754, "global_step": 391742, "epoch": 4719} {"train_loss": -26.642431259155273, "global_step": 391743, "epoch": 4719} {"train_loss": -26.581928253173828, "global_step": 391744, "epoch": 4719} {"train_loss": -26.537811279296875, "global_step": 391745, "epoch": 4719} {"train_loss": -26.708118438720703, "global_step": 391746, "epoch": 4719} {"train_loss": -26.473031997680664, "global_step": 391747, "epoch": 4719} {"train_loss": -26.500524520874023, "global_step": 391748, "epoch": 4719} {"train_loss": -26.649429321289062, "global_step": 391749, "epoch": 4719} {"train_loss": -26.374103546142578, "global_step": 391750, "epoch": 4719} {"train_loss": -26.43438720703125, "global_step": 391751, "epoch": 4719} {"train_loss": -26.698591232299805, "global_step": 391752, "epoch": 4719} {"train_loss": -26.55362319946289, "global_step": 391753, "epoch": 4719} {"train_loss": -26.341968536376953, "global_step": 391754, "epoch": 4719} {"train_loss": -26.434919357299805, "global_step": 391755, "epoch": 4719} {"train_loss": -26.211938858032227, "global_step": 391756, "epoch": 4719} {"train_loss": -26.33387565612793, "global_step": 391757, "epoch": 4719} {"train_loss": -26.13264274597168, "global_step": 391758, "epoch": 4719} {"train_loss": -26.502376947058252, "global_step": 391759, "epoch": 4719, "val_loss": 6637164.0} {"train_loss": -26.38250732421875, "global_step": 391760, "epoch": 4720} {"train_loss": -26.0350284576416, "global_step": 391761, "epoch": 4720} {"train_loss": -26.370908737182617, "global_step": 391762, "epoch": 4720} {"train_loss": -26.1224365234375, "global_step": 391763, "epoch": 4720} {"train_loss": -26.5697021484375, "global_step": 391764, "epoch": 4720} {"train_loss": -25.768041610717773, "global_step": 391765, "epoch": 4720} {"train_loss": -26.174732208251953, "global_step": 391766, "epoch": 4720} {"train_loss": -26.056745529174805, "global_step": 391767, "epoch": 4720} {"train_loss": -26.10378074645996, "global_step": 391768, "epoch": 4720} {"train_loss": -26.343759536743164, "global_step": 391769, "epoch": 4720} {"train_loss": -26.545530319213867, "global_step": 391770, "epoch": 4720} {"train_loss": -26.144397735595703, "global_step": 391771, "epoch": 4720} {"train_loss": -26.228015899658203, "global_step": 391772, "epoch": 4720} {"train_loss": -26.54874038696289, "global_step": 391773, "epoch": 4720} {"train_loss": -26.614185333251953, "global_step": 391774, "epoch": 4720} {"train_loss": -26.55120277404785, "global_step": 391775, "epoch": 4720} {"train_loss": -26.296674728393555, "global_step": 391776, "epoch": 4720} {"train_loss": -26.188674926757812, "global_step": 391777, "epoch": 4720} {"train_loss": -26.525541305541992, "global_step": 391778, "epoch": 4720} {"train_loss": -26.17081642150879, "global_step": 391779, "epoch": 4720} {"train_loss": -26.51385498046875, "global_step": 391780, "epoch": 4720} {"train_loss": -26.53447914123535, "global_step": 391781, "epoch": 4720} {"train_loss": -26.585790634155273, "global_step": 391782, "epoch": 4720} {"train_loss": -26.287490844726562, "global_step": 391783, "epoch": 4720} {"train_loss": -26.694547653198242, "global_step": 391784, "epoch": 4720} {"train_loss": -26.09432029724121, "global_step": 391785, "epoch": 4720} {"train_loss": -26.926420211791992, "global_step": 391786, "epoch": 4720} {"train_loss": -26.51971435546875, "global_step": 391787, "epoch": 4720} {"train_loss": -26.316822052001953, "global_step": 391788, "epoch": 4720} {"train_loss": -26.502302169799805, "global_step": 391789, "epoch": 4720} {"train_loss": -26.60169792175293, "global_step": 391790, "epoch": 4720} {"train_loss": -26.64991569519043, "global_step": 391791, "epoch": 4720} {"train_loss": -26.760793685913086, "global_step": 391792, "epoch": 4720} {"train_loss": -26.536767959594727, "global_step": 391793, "epoch": 4720} {"train_loss": -26.53965187072754, "global_step": 391794, "epoch": 4720} {"train_loss": -26.397857666015625, "global_step": 391795, "epoch": 4720} {"train_loss": -26.639822006225586, "global_step": 391796, "epoch": 4720} {"train_loss": -26.442096710205078, "global_step": 391797, "epoch": 4720} {"train_loss": -26.758834838867188, "global_step": 391798, "epoch": 4720} {"train_loss": -26.500991821289062, "global_step": 391799, "epoch": 4720} {"train_loss": -26.61248779296875, "global_step": 391800, "epoch": 4720} {"train_loss": -26.99200439453125, "global_step": 391801, "epoch": 4720} {"train_loss": -26.515262603759766, "global_step": 391802, "epoch": 4720} {"train_loss": -26.627368927001953, "global_step": 391803, "epoch": 4720} {"train_loss": -26.278583526611328, "global_step": 391804, "epoch": 4720} {"train_loss": -26.726593017578125, "global_step": 391805, "epoch": 4720} {"train_loss": -26.96796989440918, "global_step": 391806, "epoch": 4720} {"train_loss": -26.43072509765625, "global_step": 391807, "epoch": 4720} {"train_loss": -26.620853424072266, "global_step": 391808, "epoch": 4720} {"train_loss": -26.559940338134766, "global_step": 391809, "epoch": 4720} {"train_loss": -26.51055908203125, "global_step": 391810, "epoch": 4720} {"train_loss": -26.517181396484375, "global_step": 391811, "epoch": 4720} {"train_loss": -26.605392456054688, "global_step": 391812, "epoch": 4720} {"train_loss": -26.28643798828125, "global_step": 391813, "epoch": 4720} {"train_loss": -26.0779972076416, "global_step": 391814, "epoch": 4720} {"train_loss": -26.552759170532227, "global_step": 391815, "epoch": 4720} {"train_loss": -26.453012466430664, "global_step": 391816, "epoch": 4720} {"train_loss": -26.290868759155273, "global_step": 391817, "epoch": 4720} {"train_loss": -26.440876007080078, "global_step": 391818, "epoch": 4720} {"train_loss": -26.756261825561523, "global_step": 391819, "epoch": 4720} {"train_loss": -26.59451675415039, "global_step": 391820, "epoch": 4720} {"train_loss": -26.30917739868164, "global_step": 391821, "epoch": 4720} {"train_loss": -26.929121017456055, "global_step": 391822, "epoch": 4720} {"train_loss": -26.58930778503418, "global_step": 391823, "epoch": 4720} {"train_loss": -26.287656784057617, "global_step": 391824, "epoch": 4720} {"train_loss": -26.62635612487793, "global_step": 391825, "epoch": 4720} {"train_loss": -26.625782012939453, "global_step": 391826, "epoch": 4720} {"train_loss": -26.74659538269043, "global_step": 391827, "epoch": 4720} {"train_loss": -26.439502716064453, "global_step": 391828, "epoch": 4720} {"train_loss": -26.497289657592773, "global_step": 391829, "epoch": 4720} {"train_loss": -26.546995162963867, "global_step": 391830, "epoch": 4720} {"train_loss": -26.431318283081055, "global_step": 391831, "epoch": 4720} {"train_loss": -26.60042381286621, "global_step": 391832, "epoch": 4720} {"train_loss": -26.348928451538086, "global_step": 391833, "epoch": 4720} {"train_loss": -26.14515495300293, "global_step": 391834, "epoch": 4720} {"train_loss": -26.329267501831055, "global_step": 391835, "epoch": 4720} {"train_loss": -26.47566032409668, "global_step": 391836, "epoch": 4720} {"train_loss": -26.13690757751465, "global_step": 391837, "epoch": 4720} {"train_loss": -25.35565757751465, "global_step": 391838, "epoch": 4720} {"train_loss": -25.39918327331543, "global_step": 391839, "epoch": 4720} {"train_loss": -25.9858455657959, "global_step": 391840, "epoch": 4720} {"train_loss": -26.50592041015625, "global_step": 391841, "epoch": 4720} {"train_loss": -26.444996247808618, "global_step": 391842, "epoch": 4720, "val_loss": 6759156.0} {"train_loss": -25.82056999206543, "global_step": 391843, "epoch": 4721} {"train_loss": -25.18874168395996, "global_step": 391844, "epoch": 4721} {"train_loss": -25.9062442779541, "global_step": 391845, "epoch": 4721} {"train_loss": -25.317846298217773, "global_step": 391846, "epoch": 4721} {"train_loss": -25.852432250976562, "global_step": 391847, "epoch": 4721} {"train_loss": -25.724027633666992, "global_step": 391848, "epoch": 4721} {"train_loss": -25.551090240478516, "global_step": 391849, "epoch": 4721} {"train_loss": -25.677459716796875, "global_step": 391850, "epoch": 4721} {"train_loss": -25.723590850830078, "global_step": 391851, "epoch": 4721} {"train_loss": -25.861616134643555, "global_step": 391852, "epoch": 4721} {"train_loss": -25.90009880065918, "global_step": 391853, "epoch": 4721} {"train_loss": -25.641748428344727, "global_step": 391854, "epoch": 4721} {"train_loss": -25.83306312561035, "global_step": 391855, "epoch": 4721} {"train_loss": -26.1761417388916, "global_step": 391856, "epoch": 4721} {"train_loss": -26.31110191345215, "global_step": 391857, "epoch": 4721} {"train_loss": -26.16390037536621, "global_step": 391858, "epoch": 4721} {"train_loss": -26.155078887939453, "global_step": 391859, "epoch": 4721} {"train_loss": -25.715286254882812, "global_step": 391860, "epoch": 4721} {"train_loss": -26.265844345092773, "global_step": 391861, "epoch": 4721} {"train_loss": -25.86432456970215, "global_step": 391862, "epoch": 4721} {"train_loss": -26.2445011138916, "global_step": 391863, "epoch": 4721} {"train_loss": -26.3720760345459, "global_step": 391864, "epoch": 4721} {"train_loss": -25.897375106811523, "global_step": 391865, "epoch": 4721} {"train_loss": -26.0371036529541, "global_step": 391866, "epoch": 4721} {"train_loss": -26.358606338500977, "global_step": 391867, "epoch": 4721} {"train_loss": -26.306859970092773, "global_step": 391868, "epoch": 4721} {"train_loss": -26.27170753479004, "global_step": 391869, "epoch": 4721} {"train_loss": -26.474231719970703, "global_step": 391870, "epoch": 4721} {"train_loss": -26.263599395751953, "global_step": 391871, "epoch": 4721} {"train_loss": -26.236936569213867, "global_step": 391872, "epoch": 4721} {"train_loss": -26.464868545532227, "global_step": 391873, "epoch": 4721} {"train_loss": -26.551294326782227, "global_step": 391874, "epoch": 4721} {"train_loss": -26.273609161376953, "global_step": 391875, "epoch": 4721} {"train_loss": -26.32978630065918, "global_step": 391876, "epoch": 4721} {"train_loss": -26.589496612548828, "global_step": 391877, "epoch": 4721} {"train_loss": -26.53020668029785, "global_step": 391878, "epoch": 4721} {"train_loss": -26.45747184753418, "global_step": 391879, "epoch": 4721} {"train_loss": -26.59708595275879, "global_step": 391880, "epoch": 4721} {"train_loss": -26.908430099487305, "global_step": 391881, "epoch": 4721} {"train_loss": -26.554443359375, "global_step": 391882, "epoch": 4721} {"train_loss": -26.49068260192871, "global_step": 391883, "epoch": 4721} {"train_loss": -26.7005615234375, "global_step": 391884, "epoch": 4721} {"train_loss": -26.489410400390625, "global_step": 391885, "epoch": 4721} {"train_loss": -26.58088493347168, "global_step": 391886, "epoch": 4721} {"train_loss": -26.58515739440918, "global_step": 391887, "epoch": 4721} {"train_loss": -27.09842300415039, "global_step": 391888, "epoch": 4721} {"train_loss": -26.3170223236084, "global_step": 391889, "epoch": 4721} {"train_loss": -26.841754913330078, "global_step": 391890, "epoch": 4721} {"train_loss": -26.745885848999023, "global_step": 391891, "epoch": 4721} {"train_loss": -26.839948654174805, "global_step": 391892, "epoch": 4721} {"train_loss": -26.1456298828125, "global_step": 391893, "epoch": 4721} {"train_loss": -26.51702880859375, "global_step": 391894, "epoch": 4721} {"train_loss": -26.753021240234375, "global_step": 391895, "epoch": 4721} {"train_loss": -26.466413497924805, "global_step": 391896, "epoch": 4721} {"train_loss": -26.29334831237793, "global_step": 391897, "epoch": 4721} {"train_loss": -26.185169219970703, "global_step": 391898, "epoch": 4721} {"train_loss": -26.81858253479004, "global_step": 391899, "epoch": 4721} {"train_loss": -26.6297664642334, "global_step": 391900, "epoch": 4721} {"train_loss": -26.53431510925293, "global_step": 391901, "epoch": 4721} {"train_loss": -26.5324764251709, "global_step": 391902, "epoch": 4721} {"train_loss": -26.559534072875977, "global_step": 391903, "epoch": 4721} {"train_loss": -26.610382080078125, "global_step": 391904, "epoch": 4721} {"train_loss": -26.297882080078125, "global_step": 391905, "epoch": 4721} {"train_loss": -26.702890396118164, "global_step": 391906, "epoch": 4721} {"train_loss": -26.646820068359375, "global_step": 391907, "epoch": 4721} {"train_loss": -26.521350860595703, "global_step": 391908, "epoch": 4721} {"train_loss": -26.794004440307617, "global_step": 391909, "epoch": 4721} {"train_loss": -26.461395263671875, "global_step": 391910, "epoch": 4721} {"train_loss": -26.771865844726562, "global_step": 391911, "epoch": 4721} {"train_loss": -26.6616153717041, "global_step": 391912, "epoch": 4721} {"train_loss": -26.401052474975586, "global_step": 391913, "epoch": 4721} {"train_loss": -26.138463973999023, "global_step": 391914, "epoch": 4721} {"train_loss": -26.65390968322754, "global_step": 391915, "epoch": 4721} {"train_loss": -26.701828002929688, "global_step": 391916, "epoch": 4721} {"train_loss": -26.4094295501709, "global_step": 391917, "epoch": 4721} {"train_loss": -26.73121452331543, "global_step": 391918, "epoch": 4721} {"train_loss": -26.5018367767334, "global_step": 391919, "epoch": 4721} {"train_loss": -26.265338897705078, "global_step": 391920, "epoch": 4721} {"train_loss": -26.222890853881836, "global_step": 391921, "epoch": 4721} {"train_loss": -25.803796768188477, "global_step": 391922, "epoch": 4721} {"train_loss": -26.457624435424805, "global_step": 391923, "epoch": 4721} {"train_loss": -26.769262313842773, "global_step": 391924, "epoch": 4721} {"train_loss": -26.333531712911213, "global_step": 391925, "epoch": 4721, "val_loss": 6478105.0} {"train_loss": -24.526203155517578, "global_step": 391926, "epoch": 4722} {"train_loss": -23.79804039001465, "global_step": 391927, "epoch": 4722} {"train_loss": -25.13771629333496, "global_step": 391928, "epoch": 4722} {"train_loss": -24.673490524291992, "global_step": 391929, "epoch": 4722} {"train_loss": -25.41870880126953, "global_step": 391930, "epoch": 4722} {"train_loss": -24.66055679321289, "global_step": 391931, "epoch": 4722} {"train_loss": -25.627521514892578, "global_step": 391932, "epoch": 4722} {"train_loss": -25.231618881225586, "global_step": 391933, "epoch": 4722} {"train_loss": -25.845508575439453, "global_step": 391934, "epoch": 4722} {"train_loss": -25.270526885986328, "global_step": 391935, "epoch": 4722} {"train_loss": -25.348724365234375, "global_step": 391936, "epoch": 4722} {"train_loss": -25.44213104248047, "global_step": 391937, "epoch": 4722} {"train_loss": -25.77288246154785, "global_step": 391938, "epoch": 4722} {"train_loss": -25.598867416381836, "global_step": 391939, "epoch": 4722} {"train_loss": -25.33497428894043, "global_step": 391940, "epoch": 4722} {"train_loss": -25.788354873657227, "global_step": 391941, "epoch": 4722} {"train_loss": -26.009897232055664, "global_step": 391942, "epoch": 4722} {"train_loss": -25.93400001525879, "global_step": 391943, "epoch": 4722} {"train_loss": -25.742889404296875, "global_step": 391944, "epoch": 4722} {"train_loss": -26.029184341430664, "global_step": 391945, "epoch": 4722} {"train_loss": -26.131010055541992, "global_step": 391946, "epoch": 4722} {"train_loss": -26.311010360717773, "global_step": 391947, "epoch": 4722} {"train_loss": -25.894092559814453, "global_step": 391948, "epoch": 4722} {"train_loss": -25.769968032836914, "global_step": 391949, "epoch": 4722} {"train_loss": -26.16864013671875, "global_step": 391950, "epoch": 4722} {"train_loss": -26.005767822265625, "global_step": 391951, "epoch": 4722} {"train_loss": -25.92045021057129, "global_step": 391952, "epoch": 4722} {"train_loss": -26.01840591430664, "global_step": 391953, "epoch": 4722} {"train_loss": -26.287525177001953, "global_step": 391954, "epoch": 4722} {"train_loss": -26.291440963745117, "global_step": 391955, "epoch": 4722} {"train_loss": -26.419178009033203, "global_step": 391956, "epoch": 4722} {"train_loss": -26.580320358276367, "global_step": 391957, "epoch": 4722} {"train_loss": -26.685626983642578, "global_step": 391958, "epoch": 4722} {"train_loss": -26.73091697692871, "global_step": 391959, "epoch": 4722} {"train_loss": -26.441152572631836, "global_step": 391960, "epoch": 4722} {"train_loss": -26.43818473815918, "global_step": 391961, "epoch": 4722} {"train_loss": -26.78272819519043, "global_step": 391962, "epoch": 4722} {"train_loss": -26.439233779907227, "global_step": 391963, "epoch": 4722} {"train_loss": -26.240896224975586, "global_step": 391964, "epoch": 4722} {"train_loss": -26.7270450592041, "global_step": 391965, "epoch": 4722} {"train_loss": -26.3685359954834, "global_step": 391966, "epoch": 4722} {"train_loss": -26.560224533081055, "global_step": 391967, "epoch": 4722} {"train_loss": -26.533893585205078, "global_step": 391968, "epoch": 4722} {"train_loss": -26.62127685546875, "global_step": 391969, "epoch": 4722} {"train_loss": -26.56879234313965, "global_step": 391970, "epoch": 4722} {"train_loss": -26.587621688842773, "global_step": 391971, "epoch": 4722} {"train_loss": -26.63557243347168, "global_step": 391972, "epoch": 4722} {"train_loss": -26.538360595703125, "global_step": 391973, "epoch": 4722} {"train_loss": -26.652923583984375, "global_step": 391974, "epoch": 4722} {"train_loss": -26.510297775268555, "global_step": 391975, "epoch": 4722} {"train_loss": -26.459009170532227, "global_step": 391976, "epoch": 4722} {"train_loss": -26.737829208374023, "global_step": 391977, "epoch": 4722} {"train_loss": -26.388824462890625, "global_step": 391978, "epoch": 4722} {"train_loss": -26.607404708862305, "global_step": 391979, "epoch": 4722} {"train_loss": -26.99176025390625, "global_step": 391980, "epoch": 4722} {"train_loss": -26.98658561706543, "global_step": 391981, "epoch": 4722} {"train_loss": -26.7290096282959, "global_step": 391982, "epoch": 4722} {"train_loss": -26.761762619018555, "global_step": 391983, "epoch": 4722} {"train_loss": -26.841461181640625, "global_step": 391984, "epoch": 4722} {"train_loss": -26.741226196289062, "global_step": 391985, "epoch": 4722} {"train_loss": -26.369367599487305, "global_step": 391986, "epoch": 4722} {"train_loss": -26.7010498046875, "global_step": 391987, "epoch": 4722} {"train_loss": -26.986684799194336, "global_step": 391988, "epoch": 4722} {"train_loss": -26.501819610595703, "global_step": 391989, "epoch": 4722} {"train_loss": -26.543615341186523, "global_step": 391990, "epoch": 4722} {"train_loss": -26.59228515625, "global_step": 391991, "epoch": 4722} {"train_loss": -26.605676651000977, "global_step": 391992, "epoch": 4722} {"train_loss": -26.424524307250977, "global_step": 391993, "epoch": 4722} {"train_loss": -26.679182052612305, "global_step": 391994, "epoch": 4722} {"train_loss": -26.221715927124023, "global_step": 391995, "epoch": 4722} {"train_loss": -26.387731552124023, "global_step": 391996, "epoch": 4722} {"train_loss": -26.589380264282227, "global_step": 391997, "epoch": 4722} {"train_loss": -26.496856689453125, "global_step": 391998, "epoch": 4722} {"train_loss": -26.356367111206055, "global_step": 391999, "epoch": 4722} {"train_loss": -26.161481857299805, "global_step": 392000, "epoch": 4722} {"train_loss": -26.233285903930664, "global_step": 392001, "epoch": 4722} {"train_loss": -26.380695343017578, "global_step": 392002, "epoch": 4722} {"train_loss": -26.708206176757812, "global_step": 392003, "epoch": 4722} {"train_loss": -26.385446548461914, "global_step": 392004, "epoch": 4722} {"train_loss": -26.535694122314453, "global_step": 392005, "epoch": 4722} {"train_loss": -26.151880264282227, "global_step": 392006, "epoch": 4722} {"train_loss": -26.420251846313477, "global_step": 392007, "epoch": 4722} {"train_loss": -26.208254848618104, "global_step": 392008, "epoch": 4722, "val_loss": 6706789.0} {"train_loss": -26.038654327392578, "global_step": 392009, "epoch": 4723} {"train_loss": -26.185489654541016, "global_step": 392010, "epoch": 4723} {"train_loss": -26.1591796875, "global_step": 392011, "epoch": 4723} {"train_loss": -26.391347885131836, "global_step": 392012, "epoch": 4723} {"train_loss": -26.247406005859375, "global_step": 392013, "epoch": 4723} {"train_loss": -26.159543991088867, "global_step": 392014, "epoch": 4723} {"train_loss": -26.44598388671875, "global_step": 392015, "epoch": 4723} {"train_loss": -26.18659782409668, "global_step": 392016, "epoch": 4723} {"train_loss": -26.52280044555664, "global_step": 392017, "epoch": 4723} {"train_loss": -26.149078369140625, "global_step": 392018, "epoch": 4723} {"train_loss": -26.112207412719727, "global_step": 392019, "epoch": 4723} {"train_loss": -26.432031631469727, "global_step": 392020, "epoch": 4723} {"train_loss": -25.999088287353516, "global_step": 392021, "epoch": 4723} {"train_loss": -26.361608505249023, "global_step": 392022, "epoch": 4723} {"train_loss": -26.634159088134766, "global_step": 392023, "epoch": 4723} {"train_loss": -26.167007446289062, "global_step": 392024, "epoch": 4723} {"train_loss": -26.402633666992188, "global_step": 392025, "epoch": 4723} {"train_loss": -26.45546531677246, "global_step": 392026, "epoch": 4723} {"train_loss": -26.62457847595215, "global_step": 392027, "epoch": 4723} {"train_loss": -26.782052993774414, "global_step": 392028, "epoch": 4723} {"train_loss": -26.6591854095459, "global_step": 392029, "epoch": 4723} {"train_loss": -26.348928451538086, "global_step": 392030, "epoch": 4723} {"train_loss": -26.325302124023438, "global_step": 392031, "epoch": 4723} {"train_loss": -26.666431427001953, "global_step": 392032, "epoch": 4723} {"train_loss": -26.463560104370117, "global_step": 392033, "epoch": 4723} {"train_loss": -26.516454696655273, "global_step": 392034, "epoch": 4723} {"train_loss": -26.2903995513916, "global_step": 392035, "epoch": 4723} {"train_loss": -26.532062530517578, "global_step": 392036, "epoch": 4723} {"train_loss": -26.88187026977539, "global_step": 392037, "epoch": 4723} {"train_loss": -26.351377487182617, "global_step": 392038, "epoch": 4723} {"train_loss": -26.93536376953125, "global_step": 392039, "epoch": 4723} {"train_loss": -26.572071075439453, "global_step": 392040, "epoch": 4723} {"train_loss": -26.3275089263916, "global_step": 392041, "epoch": 4723} {"train_loss": -26.3040714263916, "global_step": 392042, "epoch": 4723} {"train_loss": -25.43918800354004, "global_step": 392043, "epoch": 4723} {"train_loss": -26.092731475830078, "global_step": 392044, "epoch": 4723} {"train_loss": -26.42658805847168, "global_step": 392045, "epoch": 4723} {"train_loss": -26.032522201538086, "global_step": 392046, "epoch": 4723} {"train_loss": -26.34136962890625, "global_step": 392047, "epoch": 4723} {"train_loss": -26.123870849609375, "global_step": 392048, "epoch": 4723} {"train_loss": -26.076955795288086, "global_step": 392049, "epoch": 4723} {"train_loss": -26.45777702331543, "global_step": 392050, "epoch": 4723} {"train_loss": -26.213058471679688, "global_step": 392051, "epoch": 4723} {"train_loss": -26.214099884033203, "global_step": 392052, "epoch": 4723} {"train_loss": -26.32297706604004, "global_step": 392053, "epoch": 4723} {"train_loss": -26.42176628112793, "global_step": 392054, "epoch": 4723} {"train_loss": -26.183441162109375, "global_step": 392055, "epoch": 4723} {"train_loss": -26.82246208190918, "global_step": 392056, "epoch": 4723} {"train_loss": -26.583600997924805, "global_step": 392057, "epoch": 4723} {"train_loss": -26.333087921142578, "global_step": 392058, "epoch": 4723} {"train_loss": -26.536222457885742, "global_step": 392059, "epoch": 4723} {"train_loss": -25.9649715423584, "global_step": 392060, "epoch": 4723} {"train_loss": -26.19146728515625, "global_step": 392061, "epoch": 4723} {"train_loss": -26.37160301208496, "global_step": 392062, "epoch": 4723} {"train_loss": -26.258230209350586, "global_step": 392063, "epoch": 4723} {"train_loss": -26.44294548034668, "global_step": 392064, "epoch": 4723} {"train_loss": -26.760730743408203, "global_step": 392065, "epoch": 4723} {"train_loss": -26.222864151000977, "global_step": 392066, "epoch": 4723} {"train_loss": -26.521305084228516, "global_step": 392067, "epoch": 4723} {"train_loss": -26.38678550720215, "global_step": 392068, "epoch": 4723} {"train_loss": -26.394454956054688, "global_step": 392069, "epoch": 4723} {"train_loss": -26.313756942749023, "global_step": 392070, "epoch": 4723} {"train_loss": -26.55438804626465, "global_step": 392071, "epoch": 4723} {"train_loss": -26.635786056518555, "global_step": 392072, "epoch": 4723} {"train_loss": -26.291004180908203, "global_step": 392073, "epoch": 4723} {"train_loss": -26.21337890625, "global_step": 392074, "epoch": 4723} {"train_loss": -26.663686752319336, "global_step": 392075, "epoch": 4723} {"train_loss": -26.65595817565918, "global_step": 392076, "epoch": 4723} {"train_loss": -26.269445419311523, "global_step": 392077, "epoch": 4723} {"train_loss": -26.601409912109375, "global_step": 392078, "epoch": 4723} {"train_loss": -26.7347354888916, "global_step": 392079, "epoch": 4723} {"train_loss": -26.85196876525879, "global_step": 392080, "epoch": 4723} {"train_loss": -26.462905883789062, "global_step": 392081, "epoch": 4723} {"train_loss": -26.323974609375, "global_step": 392082, "epoch": 4723} {"train_loss": -26.64426612854004, "global_step": 392083, "epoch": 4723} {"train_loss": -26.426589965820312, "global_step": 392084, "epoch": 4723} {"train_loss": -27.054840087890625, "global_step": 392085, "epoch": 4723} {"train_loss": -26.844898223876953, "global_step": 392086, "epoch": 4723} {"train_loss": -27.135623931884766, "global_step": 392087, "epoch": 4723} {"train_loss": -26.78948402404785, "global_step": 392088, "epoch": 4723} {"train_loss": -26.437854766845703, "global_step": 392089, "epoch": 4723} {"train_loss": -26.872156143188477, "global_step": 392090, "epoch": 4723} {"train_loss": -26.424585204526604, "global_step": 392091, "epoch": 4723, "val_loss": 6764947.5} {"train_loss": -26.339563369750977, "global_step": 392092, "epoch": 4724} {"train_loss": -26.246173858642578, "global_step": 392093, "epoch": 4724} {"train_loss": -26.44611167907715, "global_step": 392094, "epoch": 4724} {"train_loss": -26.530841827392578, "global_step": 392095, "epoch": 4724} {"train_loss": -26.309051513671875, "global_step": 392096, "epoch": 4724} {"train_loss": -26.301176071166992, "global_step": 392097, "epoch": 4724} {"train_loss": -26.5982723236084, "global_step": 392098, "epoch": 4724} {"train_loss": -26.447660446166992, "global_step": 392099, "epoch": 4724} {"train_loss": -26.207265853881836, "global_step": 392100, "epoch": 4724} {"train_loss": -26.389806747436523, "global_step": 392101, "epoch": 4724} {"train_loss": -26.456327438354492, "global_step": 392102, "epoch": 4724} {"train_loss": -26.29825782775879, "global_step": 392103, "epoch": 4724} {"train_loss": -26.406238555908203, "global_step": 392104, "epoch": 4724} {"train_loss": -26.34126091003418, "global_step": 392105, "epoch": 4724} {"train_loss": -26.742624282836914, "global_step": 392106, "epoch": 4724} {"train_loss": -26.270811080932617, "global_step": 392107, "epoch": 4724} {"train_loss": -26.366418838500977, "global_step": 392108, "epoch": 4724} {"train_loss": -25.9751033782959, "global_step": 392109, "epoch": 4724} {"train_loss": -26.58669090270996, "global_step": 392110, "epoch": 4724} {"train_loss": -26.390060424804688, "global_step": 392111, "epoch": 4724} {"train_loss": -26.302114486694336, "global_step": 392112, "epoch": 4724} {"train_loss": -26.330875396728516, "global_step": 392113, "epoch": 4724} {"train_loss": -26.035608291625977, "global_step": 392114, "epoch": 4724} {"train_loss": -26.174680709838867, "global_step": 392115, "epoch": 4724} {"train_loss": -26.582218170166016, "global_step": 392116, "epoch": 4724} {"train_loss": -26.35321044921875, "global_step": 392117, "epoch": 4724} {"train_loss": -26.429885864257812, "global_step": 392118, "epoch": 4724} {"train_loss": -26.566251754760742, "global_step": 392119, "epoch": 4724} {"train_loss": -26.541767120361328, "global_step": 392120, "epoch": 4724} {"train_loss": -26.85686683654785, "global_step": 392121, "epoch": 4724} {"train_loss": -26.306360244750977, "global_step": 392122, "epoch": 4724} {"train_loss": -26.773630142211914, "global_step": 392123, "epoch": 4724} {"train_loss": -26.470441818237305, "global_step": 392124, "epoch": 4724} {"train_loss": -26.96417808532715, "global_step": 392125, "epoch": 4724} {"train_loss": -26.36736488342285, "global_step": 392126, "epoch": 4724} {"train_loss": -26.7487735748291, "global_step": 392127, "epoch": 4724} {"train_loss": -26.5765323638916, "global_step": 392128, "epoch": 4724} {"train_loss": -26.62470054626465, "global_step": 392129, "epoch": 4724} {"train_loss": -26.27984619140625, "global_step": 392130, "epoch": 4724} {"train_loss": -26.088281631469727, "global_step": 392131, "epoch": 4724} {"train_loss": -26.63772964477539, "global_step": 392132, "epoch": 4724} {"train_loss": -26.758304595947266, "global_step": 392133, "epoch": 4724} {"train_loss": -26.236234664916992, "global_step": 392134, "epoch": 4724} {"train_loss": -26.73628807067871, "global_step": 392135, "epoch": 4724} {"train_loss": -26.64253044128418, "global_step": 392136, "epoch": 4724} {"train_loss": -26.457990646362305, "global_step": 392137, "epoch": 4724} {"train_loss": -26.775075912475586, "global_step": 392138, "epoch": 4724} {"train_loss": -26.570459365844727, "global_step": 392139, "epoch": 4724} {"train_loss": -26.33782958984375, "global_step": 392140, "epoch": 4724} {"train_loss": -26.808399200439453, "global_step": 392141, "epoch": 4724} {"train_loss": -26.08863639831543, "global_step": 392142, "epoch": 4724} {"train_loss": -26.78321647644043, "global_step": 392143, "epoch": 4724} {"train_loss": -26.560327529907227, "global_step": 392144, "epoch": 4724} {"train_loss": -26.02814292907715, "global_step": 392145, "epoch": 4724} {"train_loss": -26.23552894592285, "global_step": 392146, "epoch": 4724} {"train_loss": -25.8835391998291, "global_step": 392147, "epoch": 4724} {"train_loss": -26.314029693603516, "global_step": 392148, "epoch": 4724} {"train_loss": -26.712621688842773, "global_step": 392149, "epoch": 4724} {"train_loss": -26.357868194580078, "global_step": 392150, "epoch": 4724} {"train_loss": -26.466205596923828, "global_step": 392151, "epoch": 4724} {"train_loss": -26.47528648376465, "global_step": 392152, "epoch": 4724} {"train_loss": -26.52308464050293, "global_step": 392153, "epoch": 4724} {"train_loss": -26.460418701171875, "global_step": 392154, "epoch": 4724} {"train_loss": -26.514280319213867, "global_step": 392155, "epoch": 4724} {"train_loss": -26.404621124267578, "global_step": 392156, "epoch": 4724} {"train_loss": -26.26715660095215, "global_step": 392157, "epoch": 4724} {"train_loss": -26.551828384399414, "global_step": 392158, "epoch": 4724} {"train_loss": -26.42279052734375, "global_step": 392159, "epoch": 4724} {"train_loss": -26.325971603393555, "global_step": 392160, "epoch": 4724} {"train_loss": -26.3939151763916, "global_step": 392161, "epoch": 4724} {"train_loss": -26.442060470581055, "global_step": 392162, "epoch": 4724} {"train_loss": -26.365924835205078, "global_step": 392163, "epoch": 4724} {"train_loss": -26.478443145751953, "global_step": 392164, "epoch": 4724} {"train_loss": -26.212249755859375, "global_step": 392165, "epoch": 4724} {"train_loss": -26.673002243041992, "global_step": 392166, "epoch": 4724} {"train_loss": -26.473386764526367, "global_step": 392167, "epoch": 4724} {"train_loss": -25.938251495361328, "global_step": 392168, "epoch": 4724} {"train_loss": -26.79937171936035, "global_step": 392169, "epoch": 4724} {"train_loss": -26.2929630279541, "global_step": 392170, "epoch": 4724} {"train_loss": -26.283334732055664, "global_step": 392171, "epoch": 4724} {"train_loss": -26.2174072265625, "global_step": 392172, "epoch": 4724} {"train_loss": -26.767332077026367, "global_step": 392173, "epoch": 4724} {"train_loss": -26.43779033063406, "global_step": 392174, "epoch": 4724, "val_loss": 6701990.5} {"train_loss": -26.083816528320312, "global_step": 392175, "epoch": 4725} {"train_loss": -26.604223251342773, "global_step": 392176, "epoch": 4725} {"train_loss": -26.677534103393555, "global_step": 392177, "epoch": 4725} {"train_loss": -26.369314193725586, "global_step": 392178, "epoch": 4725} {"train_loss": -26.254791259765625, "global_step": 392179, "epoch": 4725} {"train_loss": -26.23860740661621, "global_step": 392180, "epoch": 4725} {"train_loss": -26.234907150268555, "global_step": 392181, "epoch": 4725} {"train_loss": -26.479318618774414, "global_step": 392182, "epoch": 4725} {"train_loss": -26.390966415405273, "global_step": 392183, "epoch": 4725} {"train_loss": -26.258106231689453, "global_step": 392184, "epoch": 4725} {"train_loss": -26.6057071685791, "global_step": 392185, "epoch": 4725} {"train_loss": -26.2557373046875, "global_step": 392186, "epoch": 4725} {"train_loss": -26.266345977783203, "global_step": 392187, "epoch": 4725} {"train_loss": -26.24966812133789, "global_step": 392188, "epoch": 4725} {"train_loss": -26.391143798828125, "global_step": 392189, "epoch": 4725} {"train_loss": -26.82461929321289, "global_step": 392190, "epoch": 4725} {"train_loss": -26.664880752563477, "global_step": 392191, "epoch": 4725} {"train_loss": -26.791051864624023, "global_step": 392192, "epoch": 4725} {"train_loss": -26.35459327697754, "global_step": 392193, "epoch": 4725} {"train_loss": -26.554174423217773, "global_step": 392194, "epoch": 4725} {"train_loss": -26.720218658447266, "global_step": 392195, "epoch": 4725} {"train_loss": -26.546918869018555, "global_step": 392196, "epoch": 4725} {"train_loss": -27.059783935546875, "global_step": 392197, "epoch": 4725} {"train_loss": -26.56073570251465, "global_step": 392198, "epoch": 4725} {"train_loss": -26.359710693359375, "global_step": 392199, "epoch": 4725} {"train_loss": -26.684167861938477, "global_step": 392200, "epoch": 4725} {"train_loss": -26.47089195251465, "global_step": 392201, "epoch": 4725} {"train_loss": -26.441425323486328, "global_step": 392202, "epoch": 4725} {"train_loss": -26.672330856323242, "global_step": 392203, "epoch": 4725} {"train_loss": -26.81293296813965, "global_step": 392204, "epoch": 4725} {"train_loss": -26.465591430664062, "global_step": 392205, "epoch": 4725} {"train_loss": -26.49213218688965, "global_step": 392206, "epoch": 4725} {"train_loss": -26.80011558532715, "global_step": 392207, "epoch": 4725} {"train_loss": -26.646284103393555, "global_step": 392208, "epoch": 4725} {"train_loss": -26.8115291595459, "global_step": 392209, "epoch": 4725} {"train_loss": -26.870349884033203, "global_step": 392210, "epoch": 4725} {"train_loss": -26.3745174407959, "global_step": 392211, "epoch": 4725} {"train_loss": -26.517446517944336, "global_step": 392212, "epoch": 4725} {"train_loss": -26.653024673461914, "global_step": 392213, "epoch": 4725} {"train_loss": -26.573740005493164, "global_step": 392214, "epoch": 4725} {"train_loss": -26.947126388549805, "global_step": 392215, "epoch": 4725} {"train_loss": -26.240097045898438, "global_step": 392216, "epoch": 4725} {"train_loss": -26.35550308227539, "global_step": 392217, "epoch": 4725} {"train_loss": -26.695249557495117, "global_step": 392218, "epoch": 4725} {"train_loss": -26.33806800842285, "global_step": 392219, "epoch": 4725} {"train_loss": -26.31015968322754, "global_step": 392220, "epoch": 4725} {"train_loss": -26.206769943237305, "global_step": 392221, "epoch": 4725} {"train_loss": -26.123310089111328, "global_step": 392222, "epoch": 4725} {"train_loss": -26.862686157226562, "global_step": 392223, "epoch": 4725} {"train_loss": -26.35527992248535, "global_step": 392224, "epoch": 4725} {"train_loss": -26.21512794494629, "global_step": 392225, "epoch": 4725} {"train_loss": -26.3250732421875, "global_step": 392226, "epoch": 4725} {"train_loss": -26.368488311767578, "global_step": 392227, "epoch": 4725} {"train_loss": -26.118560791015625, "global_step": 392228, "epoch": 4725} {"train_loss": -26.29109001159668, "global_step": 392229, "epoch": 4725} {"train_loss": -26.450927734375, "global_step": 392230, "epoch": 4725} {"train_loss": -26.3812198638916, "global_step": 392231, "epoch": 4725} {"train_loss": -26.2475528717041, "global_step": 392232, "epoch": 4725} {"train_loss": -26.46473503112793, "global_step": 392233, "epoch": 4725} {"train_loss": -26.335966110229492, "global_step": 392234, "epoch": 4725} {"train_loss": -26.244062423706055, "global_step": 392235, "epoch": 4725} {"train_loss": -26.232913970947266, "global_step": 392236, "epoch": 4725} {"train_loss": -26.3994140625, "global_step": 392237, "epoch": 4725} {"train_loss": -26.437870025634766, "global_step": 392238, "epoch": 4725} {"train_loss": -26.110153198242188, "global_step": 392239, "epoch": 4725} {"train_loss": -26.354434967041016, "global_step": 392240, "epoch": 4725} {"train_loss": -26.270709991455078, "global_step": 392241, "epoch": 4725} {"train_loss": -26.048383712768555, "global_step": 392242, "epoch": 4725} {"train_loss": -26.034042358398438, "global_step": 392243, "epoch": 4725} {"train_loss": -26.487333297729492, "global_step": 392244, "epoch": 4725} {"train_loss": -26.396223068237305, "global_step": 392245, "epoch": 4725} {"train_loss": -26.753711700439453, "global_step": 392246, "epoch": 4725} {"train_loss": -26.685916900634766, "global_step": 392247, "epoch": 4725} {"train_loss": -26.34454917907715, "global_step": 392248, "epoch": 4725} {"train_loss": -26.621896743774414, "global_step": 392249, "epoch": 4725} {"train_loss": -26.3808536529541, "global_step": 392250, "epoch": 4725} {"train_loss": -26.513639450073242, "global_step": 392251, "epoch": 4725} {"train_loss": -25.982717514038086, "global_step": 392252, "epoch": 4725} {"train_loss": -26.2217960357666, "global_step": 392253, "epoch": 4725} {"train_loss": -26.780736923217773, "global_step": 392254, "epoch": 4725} {"train_loss": -26.382558822631836, "global_step": 392255, "epoch": 4725} {"train_loss": -26.591583251953125, "global_step": 392256, "epoch": 4725} {"train_loss": -26.458330705941442, "global_step": 392257, "epoch": 4725, "val_loss": 6640491.0} {"train_loss": -25.7110538482666, "global_step": 392258, "epoch": 4726} {"train_loss": -24.66033935546875, "global_step": 392259, "epoch": 4726} {"train_loss": -25.43690299987793, "global_step": 392260, "epoch": 4726} {"train_loss": -26.41324234008789, "global_step": 392261, "epoch": 4726} {"train_loss": -26.0064697265625, "global_step": 392262, "epoch": 4726} {"train_loss": -26.46076774597168, "global_step": 392263, "epoch": 4726} {"train_loss": -26.2112979888916, "global_step": 392264, "epoch": 4726} {"train_loss": -25.763696670532227, "global_step": 392265, "epoch": 4726} {"train_loss": -26.121856689453125, "global_step": 392266, "epoch": 4726} {"train_loss": -25.915206909179688, "global_step": 392267, "epoch": 4726} {"train_loss": -26.213794708251953, "global_step": 392268, "epoch": 4726} {"train_loss": -26.65936279296875, "global_step": 392269, "epoch": 4726} {"train_loss": -26.080625534057617, "global_step": 392270, "epoch": 4726} {"train_loss": -26.42010498046875, "global_step": 392271, "epoch": 4726} {"train_loss": -26.226734161376953, "global_step": 392272, "epoch": 4726} {"train_loss": -26.2237548828125, "global_step": 392273, "epoch": 4726} {"train_loss": -26.298770904541016, "global_step": 392274, "epoch": 4726} {"train_loss": -26.2286434173584, "global_step": 392275, "epoch": 4726} {"train_loss": -26.658899307250977, "global_step": 392276, "epoch": 4726} {"train_loss": -26.26862144470215, "global_step": 392277, "epoch": 4726} {"train_loss": -26.34804344177246, "global_step": 392278, "epoch": 4726} {"train_loss": -26.509435653686523, "global_step": 392279, "epoch": 4726} {"train_loss": -26.38724708557129, "global_step": 392280, "epoch": 4726} {"train_loss": -26.482526779174805, "global_step": 392281, "epoch": 4726} {"train_loss": -26.137903213500977, "global_step": 392282, "epoch": 4726} {"train_loss": -26.4349308013916, "global_step": 392283, "epoch": 4726} {"train_loss": -26.6054630279541, "global_step": 392284, "epoch": 4726} {"train_loss": -26.381763458251953, "global_step": 392285, "epoch": 4726} {"train_loss": -26.69215202331543, "global_step": 392286, "epoch": 4726} {"train_loss": -26.916046142578125, "global_step": 392287, "epoch": 4726} {"train_loss": -26.3566951751709, "global_step": 392288, "epoch": 4726} {"train_loss": -26.45648193359375, "global_step": 392289, "epoch": 4726} {"train_loss": -26.653369903564453, "global_step": 392290, "epoch": 4726} {"train_loss": -26.63576316833496, "global_step": 392291, "epoch": 4726} {"train_loss": -26.16644859313965, "global_step": 392292, "epoch": 4726} {"train_loss": -26.592065811157227, "global_step": 392293, "epoch": 4726} {"train_loss": -26.591400146484375, "global_step": 392294, "epoch": 4726} {"train_loss": -26.8898983001709, "global_step": 392295, "epoch": 4726} {"train_loss": -26.5352840423584, "global_step": 392296, "epoch": 4726} {"train_loss": -26.374914169311523, "global_step": 392297, "epoch": 4726} {"train_loss": -26.480854034423828, "global_step": 392298, "epoch": 4726} {"train_loss": -26.29495620727539, "global_step": 392299, "epoch": 4726} {"train_loss": -26.38643455505371, "global_step": 392300, "epoch": 4726} {"train_loss": -26.30930519104004, "global_step": 392301, "epoch": 4726} {"train_loss": -26.589492797851562, "global_step": 392302, "epoch": 4726} {"train_loss": -26.585317611694336, "global_step": 392303, "epoch": 4726} {"train_loss": -26.72857666015625, "global_step": 392304, "epoch": 4726} {"train_loss": -26.598825454711914, "global_step": 392305, "epoch": 4726} {"train_loss": -26.69244956970215, "global_step": 392306, "epoch": 4726} {"train_loss": -26.730255126953125, "global_step": 392307, "epoch": 4726} {"train_loss": -26.649255752563477, "global_step": 392308, "epoch": 4726} {"train_loss": -26.183521270751953, "global_step": 392309, "epoch": 4726} {"train_loss": -26.99368667602539, "global_step": 392310, "epoch": 4726} {"train_loss": -26.528818130493164, "global_step": 392311, "epoch": 4726} {"train_loss": -26.700592041015625, "global_step": 392312, "epoch": 4726} {"train_loss": -26.72308349609375, "global_step": 392313, "epoch": 4726} {"train_loss": -26.522327423095703, "global_step": 392314, "epoch": 4726} {"train_loss": -27.101911544799805, "global_step": 392315, "epoch": 4726} {"train_loss": -26.509973526000977, "global_step": 392316, "epoch": 4726} {"train_loss": -27.011117935180664, "global_step": 392317, "epoch": 4726} {"train_loss": -26.60121726989746, "global_step": 392318, "epoch": 4726} {"train_loss": -26.516437530517578, "global_step": 392319, "epoch": 4726} {"train_loss": -27.185901641845703, "global_step": 392320, "epoch": 4726} {"train_loss": -26.8773250579834, "global_step": 392321, "epoch": 4726} {"train_loss": -26.593978881835938, "global_step": 392322, "epoch": 4726} {"train_loss": -26.251220703125, "global_step": 392323, "epoch": 4726} {"train_loss": -26.649951934814453, "global_step": 392324, "epoch": 4726} {"train_loss": -26.550241470336914, "global_step": 392325, "epoch": 4726} {"train_loss": -26.37640953063965, "global_step": 392326, "epoch": 4726} {"train_loss": -26.246728897094727, "global_step": 392327, "epoch": 4726} {"train_loss": -26.821868896484375, "global_step": 392328, "epoch": 4726} {"train_loss": -26.16497230529785, "global_step": 392329, "epoch": 4726} {"train_loss": -26.392263412475586, "global_step": 392330, "epoch": 4726} {"train_loss": -26.079206466674805, "global_step": 392331, "epoch": 4726} {"train_loss": -26.33268165588379, "global_step": 392332, "epoch": 4726} {"train_loss": -26.260229110717773, "global_step": 392333, "epoch": 4726} {"train_loss": -26.406721115112305, "global_step": 392334, "epoch": 4726} {"train_loss": -26.33633804321289, "global_step": 392335, "epoch": 4726} {"train_loss": -26.3342342376709, "global_step": 392336, "epoch": 4726} {"train_loss": -26.395910263061523, "global_step": 392337, "epoch": 4726} {"train_loss": -26.634496688842773, "global_step": 392338, "epoch": 4726} {"train_loss": -26.7725887298584, "global_step": 392339, "epoch": 4726} {"train_loss": -26.427161687827972, "global_step": 392340, "epoch": 4726, "val_loss": 6646490.0} {"train_loss": -25.338144302368164, "global_step": 392341, "epoch": 4727} {"train_loss": -24.95327377319336, "global_step": 392342, "epoch": 4727} {"train_loss": -26.01826286315918, "global_step": 392343, "epoch": 4727} {"train_loss": -24.946680068969727, "global_step": 392344, "epoch": 4727} {"train_loss": -26.05714988708496, "global_step": 392345, "epoch": 4727} {"train_loss": -25.579191207885742, "global_step": 392346, "epoch": 4727} {"train_loss": -25.692480087280273, "global_step": 392347, "epoch": 4727} {"train_loss": -25.91290283203125, "global_step": 392348, "epoch": 4727} {"train_loss": -25.207456588745117, "global_step": 392349, "epoch": 4727} {"train_loss": -26.094135284423828, "global_step": 392350, "epoch": 4727} {"train_loss": -25.375940322875977, "global_step": 392351, "epoch": 4727} {"train_loss": -25.854589462280273, "global_step": 392352, "epoch": 4727} {"train_loss": -26.103300094604492, "global_step": 392353, "epoch": 4727} {"train_loss": -25.402700424194336, "global_step": 392354, "epoch": 4727} {"train_loss": -25.823001861572266, "global_step": 392355, "epoch": 4727} {"train_loss": -25.635976791381836, "global_step": 392356, "epoch": 4727} {"train_loss": -25.568662643432617, "global_step": 392357, "epoch": 4727} {"train_loss": -26.290857315063477, "global_step": 392358, "epoch": 4727} {"train_loss": -26.22878074645996, "global_step": 392359, "epoch": 4727} {"train_loss": -25.74199867248535, "global_step": 392360, "epoch": 4727} {"train_loss": -26.24470329284668, "global_step": 392361, "epoch": 4727} {"train_loss": -26.123748779296875, "global_step": 392362, "epoch": 4727} {"train_loss": -26.42603874206543, "global_step": 392363, "epoch": 4727} {"train_loss": -26.10433006286621, "global_step": 392364, "epoch": 4727} {"train_loss": -26.541608810424805, "global_step": 392365, "epoch": 4727} {"train_loss": -26.106565475463867, "global_step": 392366, "epoch": 4727} {"train_loss": -26.447803497314453, "global_step": 392367, "epoch": 4727} {"train_loss": -26.3449764251709, "global_step": 392368, "epoch": 4727} {"train_loss": -26.20759391784668, "global_step": 392369, "epoch": 4727} {"train_loss": -26.50604248046875, "global_step": 392370, "epoch": 4727} {"train_loss": -26.47757911682129, "global_step": 392371, "epoch": 4727} {"train_loss": -26.495458602905273, "global_step": 392372, "epoch": 4727} {"train_loss": -26.347671508789062, "global_step": 392373, "epoch": 4727} {"train_loss": -26.57935905456543, "global_step": 392374, "epoch": 4727} {"train_loss": -26.383407592773438, "global_step": 392375, "epoch": 4727} {"train_loss": -26.420883178710938, "global_step": 392376, "epoch": 4727} {"train_loss": -26.749799728393555, "global_step": 392377, "epoch": 4727} {"train_loss": -26.275297164916992, "global_step": 392378, "epoch": 4727} {"train_loss": -26.954776763916016, "global_step": 392379, "epoch": 4727} {"train_loss": -26.239179611206055, "global_step": 392380, "epoch": 4727} {"train_loss": -26.6560001373291, "global_step": 392381, "epoch": 4727} {"train_loss": -26.42548942565918, "global_step": 392382, "epoch": 4727} {"train_loss": -26.492328643798828, "global_step": 392383, "epoch": 4727} {"train_loss": -26.712024688720703, "global_step": 392384, "epoch": 4727} {"train_loss": -26.464567184448242, "global_step": 392385, "epoch": 4727} {"train_loss": -26.426137924194336, "global_step": 392386, "epoch": 4727} {"train_loss": -26.98151206970215, "global_step": 392387, "epoch": 4727} {"train_loss": -26.601659774780273, "global_step": 392388, "epoch": 4727} {"train_loss": -26.466171264648438, "global_step": 392389, "epoch": 4727} {"train_loss": -26.591825485229492, "global_step": 392390, "epoch": 4727} {"train_loss": -26.47553062438965, "global_step": 392391, "epoch": 4727} {"train_loss": -26.49395751953125, "global_step": 392392, "epoch": 4727} {"train_loss": -26.613683700561523, "global_step": 392393, "epoch": 4727} {"train_loss": -26.7163028717041, "global_step": 392394, "epoch": 4727} {"train_loss": -26.8384952545166, "global_step": 392395, "epoch": 4727} {"train_loss": -26.664941787719727, "global_step": 392396, "epoch": 4727} {"train_loss": -26.57002830505371, "global_step": 392397, "epoch": 4727} {"train_loss": -26.469772338867188, "global_step": 392398, "epoch": 4727} {"train_loss": -26.46487808227539, "global_step": 392399, "epoch": 4727} {"train_loss": -26.660566329956055, "global_step": 392400, "epoch": 4727} {"train_loss": -26.43133544921875, "global_step": 392401, "epoch": 4727} {"train_loss": -26.594196319580078, "global_step": 392402, "epoch": 4727} {"train_loss": -26.55071449279785, "global_step": 392403, "epoch": 4727} {"train_loss": -26.603918075561523, "global_step": 392404, "epoch": 4727} {"train_loss": -26.62872314453125, "global_step": 392405, "epoch": 4727} {"train_loss": -26.69025993347168, "global_step": 392406, "epoch": 4727} {"train_loss": -26.719989776611328, "global_step": 392407, "epoch": 4727} {"train_loss": -26.425399780273438, "global_step": 392408, "epoch": 4727} {"train_loss": -26.482431411743164, "global_step": 392409, "epoch": 4727} {"train_loss": -26.86883544921875, "global_step": 392410, "epoch": 4727} {"train_loss": -26.547103881835938, "global_step": 392411, "epoch": 4727} {"train_loss": -26.590993881225586, "global_step": 392412, "epoch": 4727} {"train_loss": -26.79817008972168, "global_step": 392413, "epoch": 4727} {"train_loss": -26.855487823486328, "global_step": 392414, "epoch": 4727} {"train_loss": -26.534992218017578, "global_step": 392415, "epoch": 4727} {"train_loss": -26.4758243560791, "global_step": 392416, "epoch": 4727} {"train_loss": -26.406787872314453, "global_step": 392417, "epoch": 4727} {"train_loss": -26.181432723999023, "global_step": 392418, "epoch": 4727} {"train_loss": -25.950342178344727, "global_step": 392419, "epoch": 4727} {"train_loss": -26.45751953125, "global_step": 392420, "epoch": 4727} {"train_loss": -26.509418487548828, "global_step": 392421, "epoch": 4727} {"train_loss": -26.13276481628418, "global_step": 392422, "epoch": 4727} {"train_loss": -26.303312370576055, "global_step": 392423, "epoch": 4727, "val_loss": 6652953.0} {"train_loss": -25.49704360961914, "global_step": 392424, "epoch": 4728} {"train_loss": -25.894079208374023, "global_step": 392425, "epoch": 4728} {"train_loss": -25.515771865844727, "global_step": 392426, "epoch": 4728} {"train_loss": -25.094282150268555, "global_step": 392427, "epoch": 4728} {"train_loss": -25.724151611328125, "global_step": 392428, "epoch": 4728} {"train_loss": -25.673471450805664, "global_step": 392429, "epoch": 4728} {"train_loss": -25.730213165283203, "global_step": 392430, "epoch": 4728} {"train_loss": -25.72304344177246, "global_step": 392431, "epoch": 4728} {"train_loss": -26.01250648498535, "global_step": 392432, "epoch": 4728} {"train_loss": -26.034717559814453, "global_step": 392433, "epoch": 4728} {"train_loss": -26.505353927612305, "global_step": 392434, "epoch": 4728} {"train_loss": -26.114713668823242, "global_step": 392435, "epoch": 4728} {"train_loss": -25.76177978515625, "global_step": 392436, "epoch": 4728} {"train_loss": -25.931921005249023, "global_step": 392437, "epoch": 4728} {"train_loss": -25.81037712097168, "global_step": 392438, "epoch": 4728} {"train_loss": -26.084714889526367, "global_step": 392439, "epoch": 4728} {"train_loss": -26.07661247253418, "global_step": 392440, "epoch": 4728} {"train_loss": -26.07193374633789, "global_step": 392441, "epoch": 4728} {"train_loss": -26.28631591796875, "global_step": 392442, "epoch": 4728} {"train_loss": -26.025556564331055, "global_step": 392443, "epoch": 4728} {"train_loss": -26.181787490844727, "global_step": 392444, "epoch": 4728} {"train_loss": -26.170881271362305, "global_step": 392445, "epoch": 4728} {"train_loss": -26.517154693603516, "global_step": 392446, "epoch": 4728} {"train_loss": -26.404569625854492, "global_step": 392447, "epoch": 4728} {"train_loss": -26.26251792907715, "global_step": 392448, "epoch": 4728} {"train_loss": -26.15418815612793, "global_step": 392449, "epoch": 4728} {"train_loss": -26.311023712158203, "global_step": 392450, "epoch": 4728} {"train_loss": -26.635639190673828, "global_step": 392451, "epoch": 4728} {"train_loss": -26.100610733032227, "global_step": 392452, "epoch": 4728} {"train_loss": -26.858814239501953, "global_step": 392453, "epoch": 4728} {"train_loss": -26.41182518005371, "global_step": 392454, "epoch": 4728} {"train_loss": -26.351404190063477, "global_step": 392455, "epoch": 4728} {"train_loss": -26.425018310546875, "global_step": 392456, "epoch": 4728} {"train_loss": -26.79862403869629, "global_step": 392457, "epoch": 4728} {"train_loss": -26.290380477905273, "global_step": 392458, "epoch": 4728} {"train_loss": -26.193500518798828, "global_step": 392459, "epoch": 4728} {"train_loss": -26.62477684020996, "global_step": 392460, "epoch": 4728} {"train_loss": -26.715747833251953, "global_step": 392461, "epoch": 4728} {"train_loss": -26.623443603515625, "global_step": 392462, "epoch": 4728} {"train_loss": -26.323760986328125, "global_step": 392463, "epoch": 4728} {"train_loss": -26.644254684448242, "global_step": 392464, "epoch": 4728} {"train_loss": -26.37276268005371, "global_step": 392465, "epoch": 4728} {"train_loss": -26.908063888549805, "global_step": 392466, "epoch": 4728} {"train_loss": -26.687591552734375, "global_step": 392467, "epoch": 4728} {"train_loss": -26.718170166015625, "global_step": 392468, "epoch": 4728} {"train_loss": -26.45672607421875, "global_step": 392469, "epoch": 4728} {"train_loss": -26.709577560424805, "global_step": 392470, "epoch": 4728} {"train_loss": -26.71725845336914, "global_step": 392471, "epoch": 4728} {"train_loss": -26.972280502319336, "global_step": 392472, "epoch": 4728} {"train_loss": -26.44288444519043, "global_step": 392473, "epoch": 4728} {"train_loss": -26.866941452026367, "global_step": 392474, "epoch": 4728} {"train_loss": -26.616378784179688, "global_step": 392475, "epoch": 4728} {"train_loss": -26.76714515686035, "global_step": 392476, "epoch": 4728} {"train_loss": -26.6921329498291, "global_step": 392477, "epoch": 4728} {"train_loss": -26.999393463134766, "global_step": 392478, "epoch": 4728} {"train_loss": -26.930850982666016, "global_step": 392479, "epoch": 4728} {"train_loss": -26.912891387939453, "global_step": 392480, "epoch": 4728} {"train_loss": -26.8830623626709, "global_step": 392481, "epoch": 4728} {"train_loss": -26.670629501342773, "global_step": 392482, "epoch": 4728} {"train_loss": -26.760391235351562, "global_step": 392483, "epoch": 4728} {"train_loss": -27.004297256469727, "global_step": 392484, "epoch": 4728} {"train_loss": -26.765064239501953, "global_step": 392485, "epoch": 4728} {"train_loss": -26.300098419189453, "global_step": 392486, "epoch": 4728} {"train_loss": -25.848922729492188, "global_step": 392487, "epoch": 4728} {"train_loss": -26.265073776245117, "global_step": 392488, "epoch": 4728} {"train_loss": -26.5636043548584, "global_step": 392489, "epoch": 4728} {"train_loss": -26.13335609436035, "global_step": 392490, "epoch": 4728} {"train_loss": -26.61176872253418, "global_step": 392491, "epoch": 4728} {"train_loss": -26.16895866394043, "global_step": 392492, "epoch": 4728} {"train_loss": -26.09498405456543, "global_step": 392493, "epoch": 4728} {"train_loss": -25.702686309814453, "global_step": 392494, "epoch": 4728} {"train_loss": -26.036970138549805, "global_step": 392495, "epoch": 4728} {"train_loss": -26.535348892211914, "global_step": 392496, "epoch": 4728} {"train_loss": -26.171279907226562, "global_step": 392497, "epoch": 4728} {"train_loss": -26.277002334594727, "global_step": 392498, "epoch": 4728} {"train_loss": -26.229785919189453, "global_step": 392499, "epoch": 4728} {"train_loss": -26.588438034057617, "global_step": 392500, "epoch": 4728} {"train_loss": -26.227252960205078, "global_step": 392501, "epoch": 4728} {"train_loss": -26.356678009033203, "global_step": 392502, "epoch": 4728} {"train_loss": -26.275344848632812, "global_step": 392503, "epoch": 4728} {"train_loss": -26.1098690032959, "global_step": 392504, "epoch": 4728} {"train_loss": -26.24538230895996, "global_step": 392505, "epoch": 4728} {"train_loss": -26.334476333066643, "global_step": 392506, "epoch": 4728, "val_loss": 6617116.0} {"train_loss": -26.27459716796875, "global_step": 392507, "epoch": 4729} {"train_loss": -25.856176376342773, "global_step": 392508, "epoch": 4729} {"train_loss": -26.00446128845215, "global_step": 392509, "epoch": 4729} {"train_loss": -26.22242546081543, "global_step": 392510, "epoch": 4729} {"train_loss": -25.83736228942871, "global_step": 392511, "epoch": 4729} {"train_loss": -26.070947647094727, "global_step": 392512, "epoch": 4729} {"train_loss": -26.334348678588867, "global_step": 392513, "epoch": 4729} {"train_loss": -26.17230796813965, "global_step": 392514, "epoch": 4729} {"train_loss": -26.319067001342773, "global_step": 392515, "epoch": 4729} {"train_loss": -26.1060848236084, "global_step": 392516, "epoch": 4729} {"train_loss": -26.502365112304688, "global_step": 392517, "epoch": 4729} {"train_loss": -26.27898597717285, "global_step": 392518, "epoch": 4729} {"train_loss": -25.988096237182617, "global_step": 392519, "epoch": 4729} {"train_loss": -26.14800453186035, "global_step": 392520, "epoch": 4729} {"train_loss": -26.406564712524414, "global_step": 392521, "epoch": 4729} {"train_loss": -26.690723419189453, "global_step": 392522, "epoch": 4729} {"train_loss": -26.16267967224121, "global_step": 392523, "epoch": 4729} {"train_loss": -26.365203857421875, "global_step": 392524, "epoch": 4729} {"train_loss": -26.460485458374023, "global_step": 392525, "epoch": 4729} {"train_loss": -26.44290542602539, "global_step": 392526, "epoch": 4729} {"train_loss": -26.608579635620117, "global_step": 392527, "epoch": 4729} {"train_loss": -26.770156860351562, "global_step": 392528, "epoch": 4729} {"train_loss": -26.2622013092041, "global_step": 392529, "epoch": 4729} {"train_loss": -26.71270179748535, "global_step": 392530, "epoch": 4729} {"train_loss": -26.544677734375, "global_step": 392531, "epoch": 4729} {"train_loss": -26.717294692993164, "global_step": 392532, "epoch": 4729} {"train_loss": -26.116846084594727, "global_step": 392533, "epoch": 4729} {"train_loss": -26.322540283203125, "global_step": 392534, "epoch": 4729} {"train_loss": -26.483240127563477, "global_step": 392535, "epoch": 4729} {"train_loss": -26.179096221923828, "global_step": 392536, "epoch": 4729} {"train_loss": -26.671606063842773, "global_step": 392537, "epoch": 4729} {"train_loss": -26.638214111328125, "global_step": 392538, "epoch": 4729} {"train_loss": -26.833093643188477, "global_step": 392539, "epoch": 4729} {"train_loss": -26.56989097595215, "global_step": 392540, "epoch": 4729} {"train_loss": -26.612104415893555, "global_step": 392541, "epoch": 4729} {"train_loss": -26.468358993530273, "global_step": 392542, "epoch": 4729} {"train_loss": -26.486743927001953, "global_step": 392543, "epoch": 4729} {"train_loss": -26.641538619995117, "global_step": 392544, "epoch": 4729} {"train_loss": -26.470905303955078, "global_step": 392545, "epoch": 4729} {"train_loss": -27.047056198120117, "global_step": 392546, "epoch": 4729} {"train_loss": -26.73067283630371, "global_step": 392547, "epoch": 4729} {"train_loss": -26.538818359375, "global_step": 392548, "epoch": 4729} {"train_loss": -26.788578033447266, "global_step": 392549, "epoch": 4729} {"train_loss": -26.547061920166016, "global_step": 392550, "epoch": 4729} {"train_loss": -26.90694236755371, "global_step": 392551, "epoch": 4729} {"train_loss": -26.65827751159668, "global_step": 392552, "epoch": 4729} {"train_loss": -27.063919067382812, "global_step": 392553, "epoch": 4729} {"train_loss": -26.641437530517578, "global_step": 392554, "epoch": 4729} {"train_loss": -26.615217208862305, "global_step": 392555, "epoch": 4729} {"train_loss": -26.3260440826416, "global_step": 392556, "epoch": 4729} {"train_loss": -26.722665786743164, "global_step": 392557, "epoch": 4729} {"train_loss": -26.773481369018555, "global_step": 392558, "epoch": 4729} {"train_loss": -27.07771110534668, "global_step": 392559, "epoch": 4729} {"train_loss": -26.652313232421875, "global_step": 392560, "epoch": 4729} {"train_loss": -26.692916870117188, "global_step": 392561, "epoch": 4729} {"train_loss": -26.628463745117188, "global_step": 392562, "epoch": 4729} {"train_loss": -26.55966567993164, "global_step": 392563, "epoch": 4729} {"train_loss": -26.767099380493164, "global_step": 392564, "epoch": 4729} {"train_loss": -26.588979721069336, "global_step": 392565, "epoch": 4729} {"train_loss": -26.643110275268555, "global_step": 392566, "epoch": 4729} {"train_loss": -26.287994384765625, "global_step": 392567, "epoch": 4729} {"train_loss": -26.652664184570312, "global_step": 392568, "epoch": 4729} {"train_loss": -26.4670352935791, "global_step": 392569, "epoch": 4729} {"train_loss": -26.60651969909668, "global_step": 392570, "epoch": 4729} {"train_loss": -26.2054500579834, "global_step": 392571, "epoch": 4729} {"train_loss": -27.026281356811523, "global_step": 392572, "epoch": 4729} {"train_loss": -26.597522735595703, "global_step": 392573, "epoch": 4729} {"train_loss": -26.21298599243164, "global_step": 392574, "epoch": 4729} {"train_loss": -26.454191207885742, "global_step": 392575, "epoch": 4729} {"train_loss": -26.7954044342041, "global_step": 392576, "epoch": 4729} {"train_loss": -26.805408477783203, "global_step": 392577, "epoch": 4729} {"train_loss": -26.502344131469727, "global_step": 392578, "epoch": 4729} {"train_loss": -26.65618324279785, "global_step": 392579, "epoch": 4729} {"train_loss": -26.646703720092773, "global_step": 392580, "epoch": 4729} {"train_loss": -26.979572296142578, "global_step": 392581, "epoch": 4729} {"train_loss": -26.8974552154541, "global_step": 392582, "epoch": 4729} {"train_loss": -26.633380889892578, "global_step": 392583, "epoch": 4729} {"train_loss": -26.501861572265625, "global_step": 392584, "epoch": 4729} {"train_loss": -26.786466598510742, "global_step": 392585, "epoch": 4729} {"train_loss": -26.889719009399414, "global_step": 392586, "epoch": 4729} {"train_loss": -26.47861671447754, "global_step": 392587, "epoch": 4729} {"train_loss": -26.700952529907227, "global_step": 392588, "epoch": 4729} {"train_loss": -26.523699771927063, "global_step": 392589, "epoch": 4729, "val_loss": 6667175.0} {"train_loss": -25.285343170166016, "global_step": 392590, "epoch": 4730} {"train_loss": -25.0289363861084, "global_step": 392591, "epoch": 4730} {"train_loss": -25.98809814453125, "global_step": 392592, "epoch": 4730} {"train_loss": -25.63221549987793, "global_step": 392593, "epoch": 4730} {"train_loss": -25.824420928955078, "global_step": 392594, "epoch": 4730} {"train_loss": -26.535619735717773, "global_step": 392595, "epoch": 4730} {"train_loss": -25.314468383789062, "global_step": 392596, "epoch": 4730} {"train_loss": -26.266855239868164, "global_step": 392597, "epoch": 4730} {"train_loss": -25.841663360595703, "global_step": 392598, "epoch": 4730} {"train_loss": -25.875202178955078, "global_step": 392599, "epoch": 4730} {"train_loss": -26.064273834228516, "global_step": 392600, "epoch": 4730} {"train_loss": -25.8413028717041, "global_step": 392601, "epoch": 4730} {"train_loss": -26.33675193786621, "global_step": 392602, "epoch": 4730} {"train_loss": -25.84712791442871, "global_step": 392603, "epoch": 4730} {"train_loss": -26.3427734375, "global_step": 392604, "epoch": 4730} {"train_loss": -26.435199737548828, "global_step": 392605, "epoch": 4730} {"train_loss": -26.245685577392578, "global_step": 392606, "epoch": 4730} {"train_loss": -26.1173152923584, "global_step": 392607, "epoch": 4730} {"train_loss": -26.222583770751953, "global_step": 392608, "epoch": 4730} {"train_loss": -26.62244987487793, "global_step": 392609, "epoch": 4730} {"train_loss": -26.42622184753418, "global_step": 392610, "epoch": 4730} {"train_loss": -26.710529327392578, "global_step": 392611, "epoch": 4730} {"train_loss": -26.568796157836914, "global_step": 392612, "epoch": 4730} {"train_loss": -26.564407348632812, "global_step": 392613, "epoch": 4730} {"train_loss": -26.35212516784668, "global_step": 392614, "epoch": 4730} {"train_loss": -26.5736026763916, "global_step": 392615, "epoch": 4730} {"train_loss": -26.545761108398438, "global_step": 392616, "epoch": 4730} {"train_loss": -26.518909454345703, "global_step": 392617, "epoch": 4730} {"train_loss": -26.2364444732666, "global_step": 392618, "epoch": 4730} {"train_loss": -26.871387481689453, "global_step": 392619, "epoch": 4730} {"train_loss": -26.786970138549805, "global_step": 392620, "epoch": 4730} {"train_loss": -26.58661460876465, "global_step": 392621, "epoch": 4730} {"train_loss": -26.37558364868164, "global_step": 392622, "epoch": 4730} {"train_loss": -26.648670196533203, "global_step": 392623, "epoch": 4730} {"train_loss": -26.395872116088867, "global_step": 392624, "epoch": 4730} {"train_loss": -26.8609619140625, "global_step": 392625, "epoch": 4730} {"train_loss": -26.580703735351562, "global_step": 392626, "epoch": 4730} {"train_loss": -26.73004150390625, "global_step": 392627, "epoch": 4730} {"train_loss": -26.83687400817871, "global_step": 392628, "epoch": 4730} {"train_loss": -26.492223739624023, "global_step": 392629, "epoch": 4730} {"train_loss": -26.83704948425293, "global_step": 392630, "epoch": 4730} {"train_loss": -26.916059494018555, "global_step": 392631, "epoch": 4730} {"train_loss": -26.692901611328125, "global_step": 392632, "epoch": 4730} {"train_loss": -26.767932891845703, "global_step": 392633, "epoch": 4730} {"train_loss": -26.50843620300293, "global_step": 392634, "epoch": 4730} {"train_loss": -26.463613510131836, "global_step": 392635, "epoch": 4730} {"train_loss": -27.067590713500977, "global_step": 392636, "epoch": 4730} {"train_loss": -26.901281356811523, "global_step": 392637, "epoch": 4730} {"train_loss": -26.711322784423828, "global_step": 392638, "epoch": 4730} {"train_loss": -26.734567642211914, "global_step": 392639, "epoch": 4730} {"train_loss": -26.99314308166504, "global_step": 392640, "epoch": 4730} {"train_loss": -26.500524520874023, "global_step": 392641, "epoch": 4730} {"train_loss": -26.433551788330078, "global_step": 392642, "epoch": 4730} {"train_loss": -26.578413009643555, "global_step": 392643, "epoch": 4730} {"train_loss": -26.503347396850586, "global_step": 392644, "epoch": 4730} {"train_loss": -26.876615524291992, "global_step": 392645, "epoch": 4730} {"train_loss": -26.868011474609375, "global_step": 392646, "epoch": 4730} {"train_loss": -26.794214248657227, "global_step": 392647, "epoch": 4730} {"train_loss": -26.4206600189209, "global_step": 392648, "epoch": 4730} {"train_loss": -26.577402114868164, "global_step": 392649, "epoch": 4730} {"train_loss": -26.59895133972168, "global_step": 392650, "epoch": 4730} {"train_loss": -26.137561798095703, "global_step": 392651, "epoch": 4730} {"train_loss": -25.46327781677246, "global_step": 392652, "epoch": 4730} {"train_loss": -26.118005752563477, "global_step": 392653, "epoch": 4730} {"train_loss": -26.660648345947266, "global_step": 392654, "epoch": 4730} {"train_loss": -25.947851181030273, "global_step": 392655, "epoch": 4730} {"train_loss": -26.166046142578125, "global_step": 392656, "epoch": 4730} {"train_loss": -26.652936935424805, "global_step": 392657, "epoch": 4730} {"train_loss": -26.2529296875, "global_step": 392658, "epoch": 4730} {"train_loss": -26.628889083862305, "global_step": 392659, "epoch": 4730} {"train_loss": -26.17203140258789, "global_step": 392660, "epoch": 4730} {"train_loss": -25.945703506469727, "global_step": 392661, "epoch": 4730} {"train_loss": -26.22373390197754, "global_step": 392662, "epoch": 4730} {"train_loss": -26.451313018798828, "global_step": 392663, "epoch": 4730} {"train_loss": -26.238080978393555, "global_step": 392664, "epoch": 4730} {"train_loss": -26.557981491088867, "global_step": 392665, "epoch": 4730} {"train_loss": -26.79347801208496, "global_step": 392666, "epoch": 4730} {"train_loss": -26.659753799438477, "global_step": 392667, "epoch": 4730} {"train_loss": -26.406116485595703, "global_step": 392668, "epoch": 4730} {"train_loss": -26.904632568359375, "global_step": 392669, "epoch": 4730} {"train_loss": -26.932540893554688, "global_step": 392670, "epoch": 4730} {"train_loss": -26.539648056030273, "global_step": 392671, "epoch": 4730} {"train_loss": -26.41877045688859, "global_step": 392672, "epoch": 4730, "val_loss": 6608909.0} {"train_loss": -26.20240592956543, "global_step": 392673, "epoch": 4731} {"train_loss": -26.665103912353516, "global_step": 392674, "epoch": 4731} {"train_loss": -26.272918701171875, "global_step": 392675, "epoch": 4731} {"train_loss": -26.393606185913086, "global_step": 392676, "epoch": 4731} {"train_loss": -26.454166412353516, "global_step": 392677, "epoch": 4731} {"train_loss": -26.277637481689453, "global_step": 392678, "epoch": 4731} {"train_loss": -26.472227096557617, "global_step": 392679, "epoch": 4731} {"train_loss": -26.511249542236328, "global_step": 392680, "epoch": 4731} {"train_loss": -26.448278427124023, "global_step": 392681, "epoch": 4731} {"train_loss": -26.451223373413086, "global_step": 392682, "epoch": 4731} {"train_loss": -26.2320613861084, "global_step": 392683, "epoch": 4731} {"train_loss": -26.4920654296875, "global_step": 392684, "epoch": 4731} {"train_loss": -26.132169723510742, "global_step": 392685, "epoch": 4731} {"train_loss": -26.69666862487793, "global_step": 392686, "epoch": 4731} {"train_loss": -26.137928009033203, "global_step": 392687, "epoch": 4731} {"train_loss": -26.243310928344727, "global_step": 392688, "epoch": 4731} {"train_loss": -26.545988082885742, "global_step": 392689, "epoch": 4731} {"train_loss": -26.176549911499023, "global_step": 392690, "epoch": 4731} {"train_loss": -26.38421058654785, "global_step": 392691, "epoch": 4731} {"train_loss": -26.851642608642578, "global_step": 392692, "epoch": 4731} {"train_loss": -26.51405143737793, "global_step": 392693, "epoch": 4731} {"train_loss": -26.111135482788086, "global_step": 392694, "epoch": 4731} {"train_loss": -26.541675567626953, "global_step": 392695, "epoch": 4731} {"train_loss": -26.51249122619629, "global_step": 392696, "epoch": 4731} {"train_loss": -26.625202178955078, "global_step": 392697, "epoch": 4731} {"train_loss": -26.516809463500977, "global_step": 392698, "epoch": 4731} {"train_loss": -26.6154842376709, "global_step": 392699, "epoch": 4731} {"train_loss": -26.610998153686523, "global_step": 392700, "epoch": 4731} {"train_loss": -26.282297134399414, "global_step": 392701, "epoch": 4731} {"train_loss": -26.790563583374023, "global_step": 392702, "epoch": 4731} {"train_loss": -26.455793380737305, "global_step": 392703, "epoch": 4731} {"train_loss": -26.93790054321289, "global_step": 392704, "epoch": 4731} {"train_loss": -26.770227432250977, "global_step": 392705, "epoch": 4731} {"train_loss": -26.871692657470703, "global_step": 392706, "epoch": 4731} {"train_loss": -26.78617286682129, "global_step": 392707, "epoch": 4731} {"train_loss": -26.801050186157227, "global_step": 392708, "epoch": 4731} {"train_loss": -26.837438583374023, "global_step": 392709, "epoch": 4731} {"train_loss": -26.85175895690918, "global_step": 392710, "epoch": 4731} {"train_loss": -26.752140045166016, "global_step": 392711, "epoch": 4731} {"train_loss": -26.475126266479492, "global_step": 392712, "epoch": 4731} {"train_loss": -26.690765380859375, "global_step": 392713, "epoch": 4731} {"train_loss": -26.628061294555664, "global_step": 392714, "epoch": 4731} {"train_loss": -26.97065544128418, "global_step": 392715, "epoch": 4731} {"train_loss": -26.81218910217285, "global_step": 392716, "epoch": 4731} {"train_loss": -26.489063262939453, "global_step": 392717, "epoch": 4731} {"train_loss": -26.260217666625977, "global_step": 392718, "epoch": 4731} {"train_loss": -26.294111251831055, "global_step": 392719, "epoch": 4731} {"train_loss": -26.00958251953125, "global_step": 392720, "epoch": 4731} {"train_loss": -26.028966903686523, "global_step": 392721, "epoch": 4731} {"train_loss": -25.826940536499023, "global_step": 392722, "epoch": 4731} {"train_loss": -26.755712509155273, "global_step": 392723, "epoch": 4731} {"train_loss": -26.217212677001953, "global_step": 392724, "epoch": 4731} {"train_loss": -26.198017120361328, "global_step": 392725, "epoch": 4731} {"train_loss": -26.712940216064453, "global_step": 392726, "epoch": 4731} {"train_loss": -26.265913009643555, "global_step": 392727, "epoch": 4731} {"train_loss": -26.627561569213867, "global_step": 392728, "epoch": 4731} {"train_loss": -26.31684684753418, "global_step": 392729, "epoch": 4731} {"train_loss": -26.549243927001953, "global_step": 392730, "epoch": 4731} {"train_loss": -26.448270797729492, "global_step": 392731, "epoch": 4731} {"train_loss": -26.44695472717285, "global_step": 392732, "epoch": 4731} {"train_loss": -26.122838973999023, "global_step": 392733, "epoch": 4731} {"train_loss": -26.322711944580078, "global_step": 392734, "epoch": 4731} {"train_loss": -26.5550479888916, "global_step": 392735, "epoch": 4731} {"train_loss": -26.49054527282715, "global_step": 392736, "epoch": 4731} {"train_loss": -26.65675163269043, "global_step": 392737, "epoch": 4731} {"train_loss": -26.689550399780273, "global_step": 392738, "epoch": 4731} {"train_loss": -26.549970626831055, "global_step": 392739, "epoch": 4731} {"train_loss": -26.502599716186523, "global_step": 392740, "epoch": 4731} {"train_loss": -26.695581436157227, "global_step": 392741, "epoch": 4731} {"train_loss": -26.609882354736328, "global_step": 392742, "epoch": 4731} {"train_loss": -26.561063766479492, "global_step": 392743, "epoch": 4731} {"train_loss": -26.793228149414062, "global_step": 392744, "epoch": 4731} {"train_loss": -26.659137725830078, "global_step": 392745, "epoch": 4731} {"train_loss": -26.589920043945312, "global_step": 392746, "epoch": 4731} {"train_loss": -26.473712921142578, "global_step": 392747, "epoch": 4731} {"train_loss": -26.78577995300293, "global_step": 392748, "epoch": 4731} {"train_loss": -26.890399932861328, "global_step": 392749, "epoch": 4731} {"train_loss": -26.685474395751953, "global_step": 392750, "epoch": 4731} {"train_loss": -26.685291290283203, "global_step": 392751, "epoch": 4731} {"train_loss": -26.619739532470703, "global_step": 392752, "epoch": 4731} {"train_loss": -26.63775062561035, "global_step": 392753, "epoch": 4731} {"train_loss": -26.940784454345703, "global_step": 392754, "epoch": 4731} {"train_loss": -26.539940408913488, "global_step": 392755, "epoch": 4731, "val_loss": 6616468.0} {"train_loss": -26.158361434936523, "global_step": 392756, "epoch": 4732} {"train_loss": -26.64613151550293, "global_step": 392757, "epoch": 4732} {"train_loss": -26.253705978393555, "global_step": 392758, "epoch": 4732} {"train_loss": -25.93048667907715, "global_step": 392759, "epoch": 4732} {"train_loss": -25.9873104095459, "global_step": 392760, "epoch": 4732} {"train_loss": -25.9956111907959, "global_step": 392761, "epoch": 4732} {"train_loss": -26.599365234375, "global_step": 392762, "epoch": 4732} {"train_loss": -26.624561309814453, "global_step": 392763, "epoch": 4732} {"train_loss": -26.6284236907959, "global_step": 392764, "epoch": 4732} {"train_loss": -26.480152130126953, "global_step": 392765, "epoch": 4732} {"train_loss": -26.62623405456543, "global_step": 392766, "epoch": 4732} {"train_loss": -26.55925941467285, "global_step": 392767, "epoch": 4732} {"train_loss": -26.35919761657715, "global_step": 392768, "epoch": 4732} {"train_loss": -26.059362411499023, "global_step": 392769, "epoch": 4732} {"train_loss": -26.363117218017578, "global_step": 392770, "epoch": 4732} {"train_loss": -26.59767723083496, "global_step": 392771, "epoch": 4732} {"train_loss": -26.157140731811523, "global_step": 392772, "epoch": 4732} {"train_loss": -26.206729888916016, "global_step": 392773, "epoch": 4732} {"train_loss": -26.18340492248535, "global_step": 392774, "epoch": 4732} {"train_loss": -26.361902236938477, "global_step": 392775, "epoch": 4732} {"train_loss": -26.05267333984375, "global_step": 392776, "epoch": 4732} {"train_loss": -26.298574447631836, "global_step": 392777, "epoch": 4732} {"train_loss": -26.461624145507812, "global_step": 392778, "epoch": 4732} {"train_loss": -26.692626953125, "global_step": 392779, "epoch": 4732} {"train_loss": -26.351276397705078, "global_step": 392780, "epoch": 4732} {"train_loss": -25.94451904296875, "global_step": 392781, "epoch": 4732} {"train_loss": -26.241455078125, "global_step": 392782, "epoch": 4732} {"train_loss": -26.428720474243164, "global_step": 392783, "epoch": 4732} {"train_loss": -26.121463775634766, "global_step": 392784, "epoch": 4732} {"train_loss": -26.393766403198242, "global_step": 392785, "epoch": 4732} {"train_loss": -26.775419235229492, "global_step": 392786, "epoch": 4732} {"train_loss": -26.607141494750977, "global_step": 392787, "epoch": 4732} {"train_loss": -26.520618438720703, "global_step": 392788, "epoch": 4732} {"train_loss": -26.38189697265625, "global_step": 392789, "epoch": 4732} {"train_loss": -26.5418701171875, "global_step": 392790, "epoch": 4732} {"train_loss": -26.556293487548828, "global_step": 392791, "epoch": 4732} {"train_loss": -26.861114501953125, "global_step": 392792, "epoch": 4732} {"train_loss": -26.27506446838379, "global_step": 392793, "epoch": 4732} {"train_loss": -26.56629753112793, "global_step": 392794, "epoch": 4732} {"train_loss": -26.25018310546875, "global_step": 392795, "epoch": 4732} {"train_loss": -26.658344268798828, "global_step": 392796, "epoch": 4732} {"train_loss": -26.501203536987305, "global_step": 392797, "epoch": 4732} {"train_loss": -26.289518356323242, "global_step": 392798, "epoch": 4732} {"train_loss": -26.166736602783203, "global_step": 392799, "epoch": 4732} {"train_loss": -26.482839584350586, "global_step": 392800, "epoch": 4732} {"train_loss": -26.231672286987305, "global_step": 392801, "epoch": 4732} {"train_loss": -26.4298038482666, "global_step": 392802, "epoch": 4732} {"train_loss": -26.790283203125, "global_step": 392803, "epoch": 4732} {"train_loss": -26.810657501220703, "global_step": 392804, "epoch": 4732} {"train_loss": -26.59244728088379, "global_step": 392805, "epoch": 4732} {"train_loss": -26.798004150390625, "global_step": 392806, "epoch": 4732} {"train_loss": -26.425321578979492, "global_step": 392807, "epoch": 4732} {"train_loss": -26.616687774658203, "global_step": 392808, "epoch": 4732} {"train_loss": -26.6082763671875, "global_step": 392809, "epoch": 4732} {"train_loss": -26.390796661376953, "global_step": 392810, "epoch": 4732} {"train_loss": -26.501789093017578, "global_step": 392811, "epoch": 4732} {"train_loss": -26.7620849609375, "global_step": 392812, "epoch": 4732} {"train_loss": -26.600568771362305, "global_step": 392813, "epoch": 4732} {"train_loss": -26.5894832611084, "global_step": 392814, "epoch": 4732} {"train_loss": -26.597925186157227, "global_step": 392815, "epoch": 4732} {"train_loss": -26.498584747314453, "global_step": 392816, "epoch": 4732} {"train_loss": -26.62113380432129, "global_step": 392817, "epoch": 4732} {"train_loss": -26.88832664489746, "global_step": 392818, "epoch": 4732} {"train_loss": -26.7417049407959, "global_step": 392819, "epoch": 4732} {"train_loss": -26.672138214111328, "global_step": 392820, "epoch": 4732} {"train_loss": -26.382299423217773, "global_step": 392821, "epoch": 4732} {"train_loss": -26.3364200592041, "global_step": 392822, "epoch": 4732} {"train_loss": -26.762426376342773, "global_step": 392823, "epoch": 4732} {"train_loss": -26.834043502807617, "global_step": 392824, "epoch": 4732} {"train_loss": -26.410314559936523, "global_step": 392825, "epoch": 4732} {"train_loss": -26.569067001342773, "global_step": 392826, "epoch": 4732} {"train_loss": -26.520862579345703, "global_step": 392827, "epoch": 4732} {"train_loss": -26.543354034423828, "global_step": 392828, "epoch": 4732} {"train_loss": -26.667322158813477, "global_step": 392829, "epoch": 4732} {"train_loss": -26.62346839904785, "global_step": 392830, "epoch": 4732} {"train_loss": -27.048486709594727, "global_step": 392831, "epoch": 4732} {"train_loss": -26.397586822509766, "global_step": 392832, "epoch": 4732} {"train_loss": -26.786794662475586, "global_step": 392833, "epoch": 4732} {"train_loss": -26.37623405456543, "global_step": 392834, "epoch": 4732} {"train_loss": -26.68698501586914, "global_step": 392835, "epoch": 4732} {"train_loss": -26.693740844726562, "global_step": 392836, "epoch": 4732} {"train_loss": -26.694284439086914, "global_step": 392837, "epoch": 4732} {"train_loss": -26.485142466533613, "global_step": 392838, "epoch": 4732, "val_loss": 6708821.5} {"train_loss": -26.325815200805664, "global_step": 392839, "epoch": 4733} {"train_loss": -24.015737533569336, "global_step": 392840, "epoch": 4733} {"train_loss": -25.388029098510742, "global_step": 392841, "epoch": 4733} {"train_loss": -25.335813522338867, "global_step": 392842, "epoch": 4733} {"train_loss": -25.776853561401367, "global_step": 392843, "epoch": 4733} {"train_loss": -25.999094009399414, "global_step": 392844, "epoch": 4733} {"train_loss": -25.70418357849121, "global_step": 392845, "epoch": 4733} {"train_loss": -24.863554000854492, "global_step": 392846, "epoch": 4733} {"train_loss": -25.437814712524414, "global_step": 392847, "epoch": 4733} {"train_loss": -25.63209342956543, "global_step": 392848, "epoch": 4733} {"train_loss": -25.691898345947266, "global_step": 392849, "epoch": 4733} {"train_loss": -26.216367721557617, "global_step": 392850, "epoch": 4733} {"train_loss": -26.21497917175293, "global_step": 392851, "epoch": 4733} {"train_loss": -26.201313018798828, "global_step": 392852, "epoch": 4733} {"train_loss": -25.972171783447266, "global_step": 392853, "epoch": 4733} {"train_loss": -26.22235679626465, "global_step": 392854, "epoch": 4733} {"train_loss": -26.197803497314453, "global_step": 392855, "epoch": 4733} {"train_loss": -25.81707191467285, "global_step": 392856, "epoch": 4733} {"train_loss": -25.93509864807129, "global_step": 392857, "epoch": 4733} {"train_loss": -26.18121337890625, "global_step": 392858, "epoch": 4733} {"train_loss": -26.241291046142578, "global_step": 392859, "epoch": 4733} {"train_loss": -26.346521377563477, "global_step": 392860, "epoch": 4733} {"train_loss": -26.219406127929688, "global_step": 392861, "epoch": 4733} {"train_loss": -25.950353622436523, "global_step": 392862, "epoch": 4733} {"train_loss": -26.019561767578125, "global_step": 392863, "epoch": 4733} {"train_loss": -26.011571884155273, "global_step": 392864, "epoch": 4733} {"train_loss": -26.387182235717773, "global_step": 392865, "epoch": 4733} {"train_loss": -26.40711784362793, "global_step": 392866, "epoch": 4733} {"train_loss": -26.003280639648438, "global_step": 392867, "epoch": 4733} {"train_loss": -26.435821533203125, "global_step": 392868, "epoch": 4733} {"train_loss": -26.575353622436523, "global_step": 392869, "epoch": 4733} {"train_loss": -26.190887451171875, "global_step": 392870, "epoch": 4733} {"train_loss": -26.70379066467285, "global_step": 392871, "epoch": 4733} {"train_loss": -26.45819091796875, "global_step": 392872, "epoch": 4733} {"train_loss": -26.753202438354492, "global_step": 392873, "epoch": 4733} {"train_loss": -26.846311569213867, "global_step": 392874, "epoch": 4733} {"train_loss": -26.63337516784668, "global_step": 392875, "epoch": 4733} {"train_loss": -26.691452026367188, "global_step": 392876, "epoch": 4733} {"train_loss": -26.475751876831055, "global_step": 392877, "epoch": 4733} {"train_loss": -26.442584991455078, "global_step": 392878, "epoch": 4733} {"train_loss": -26.673269271850586, "global_step": 392879, "epoch": 4733} {"train_loss": -26.158666610717773, "global_step": 392880, "epoch": 4733} {"train_loss": -26.646560668945312, "global_step": 392881, "epoch": 4733} {"train_loss": -26.396991729736328, "global_step": 392882, "epoch": 4733} {"train_loss": -26.494705200195312, "global_step": 392883, "epoch": 4733} {"train_loss": -26.79353141784668, "global_step": 392884, "epoch": 4733} {"train_loss": -26.744958877563477, "global_step": 392885, "epoch": 4733} {"train_loss": -26.798791885375977, "global_step": 392886, "epoch": 4733} {"train_loss": -26.389759063720703, "global_step": 392887, "epoch": 4733} {"train_loss": -26.547021865844727, "global_step": 392888, "epoch": 4733} {"train_loss": -26.4481201171875, "global_step": 392889, "epoch": 4733} {"train_loss": -26.74334716796875, "global_step": 392890, "epoch": 4733} {"train_loss": -26.502613067626953, "global_step": 392891, "epoch": 4733} {"train_loss": -26.687274932861328, "global_step": 392892, "epoch": 4733} {"train_loss": -27.0262393951416, "global_step": 392893, "epoch": 4733} {"train_loss": -26.666202545166016, "global_step": 392894, "epoch": 4733} {"train_loss": -26.618377685546875, "global_step": 392895, "epoch": 4733} {"train_loss": -26.90226173400879, "global_step": 392896, "epoch": 4733} {"train_loss": -26.897357940673828, "global_step": 392897, "epoch": 4733} {"train_loss": -26.685043334960938, "global_step": 392898, "epoch": 4733} {"train_loss": -26.9349365234375, "global_step": 392899, "epoch": 4733} {"train_loss": -26.685394287109375, "global_step": 392900, "epoch": 4733} {"train_loss": -27.022769927978516, "global_step": 392901, "epoch": 4733} {"train_loss": -26.005727767944336, "global_step": 392902, "epoch": 4733} {"train_loss": -26.308008193969727, "global_step": 392903, "epoch": 4733} {"train_loss": -25.28582191467285, "global_step": 392904, "epoch": 4733} {"train_loss": -25.37721824645996, "global_step": 392905, "epoch": 4733} {"train_loss": -25.63947105407715, "global_step": 392906, "epoch": 4733} {"train_loss": -26.25444984436035, "global_step": 392907, "epoch": 4733} {"train_loss": -26.443531036376953, "global_step": 392908, "epoch": 4733} {"train_loss": -26.236652374267578, "global_step": 392909, "epoch": 4733} {"train_loss": -26.698347091674805, "global_step": 392910, "epoch": 4733} {"train_loss": -26.77863121032715, "global_step": 392911, "epoch": 4733} {"train_loss": -26.42527198791504, "global_step": 392912, "epoch": 4733} {"train_loss": -26.45509147644043, "global_step": 392913, "epoch": 4733} {"train_loss": -25.974027633666992, "global_step": 392914, "epoch": 4733} {"train_loss": -26.54188346862793, "global_step": 392915, "epoch": 4733} {"train_loss": -26.13250160217285, "global_step": 392916, "epoch": 4733} {"train_loss": -26.711339950561523, "global_step": 392917, "epoch": 4733} {"train_loss": -26.517126083374023, "global_step": 392918, "epoch": 4733} {"train_loss": -26.555042266845703, "global_step": 392919, "epoch": 4733} {"train_loss": -26.57935905456543, "global_step": 392920, "epoch": 4733} {"train_loss": -26.28725511481963, "global_step": 392921, "epoch": 4733, "val_loss": 6667422.5} {"train_loss": -26.327306747436523, "global_step": 392922, "epoch": 4734} {"train_loss": -25.947296142578125, "global_step": 392923, "epoch": 4734} {"train_loss": -26.510900497436523, "global_step": 392924, "epoch": 4734} {"train_loss": -26.261037826538086, "global_step": 392925, "epoch": 4734} {"train_loss": -26.421972274780273, "global_step": 392926, "epoch": 4734} {"train_loss": -26.366535186767578, "global_step": 392927, "epoch": 4734} {"train_loss": -26.388748168945312, "global_step": 392928, "epoch": 4734} {"train_loss": -26.28267478942871, "global_step": 392929, "epoch": 4734} {"train_loss": -26.19904899597168, "global_step": 392930, "epoch": 4734} {"train_loss": -26.414274215698242, "global_step": 392931, "epoch": 4734} {"train_loss": -26.640583038330078, "global_step": 392932, "epoch": 4734} {"train_loss": -26.22284507751465, "global_step": 392933, "epoch": 4734} {"train_loss": -26.287267684936523, "global_step": 392934, "epoch": 4734} {"train_loss": -26.612775802612305, "global_step": 392935, "epoch": 4734} {"train_loss": -26.5003604888916, "global_step": 392936, "epoch": 4734} {"train_loss": -26.545225143432617, "global_step": 392937, "epoch": 4734} {"train_loss": -26.516721725463867, "global_step": 392938, "epoch": 4734} {"train_loss": -26.91729164123535, "global_step": 392939, "epoch": 4734} {"train_loss": -26.947248458862305, "global_step": 392940, "epoch": 4734} {"train_loss": -26.22462272644043, "global_step": 392941, "epoch": 4734} {"train_loss": -26.301725387573242, "global_step": 392942, "epoch": 4734} {"train_loss": -26.3485164642334, "global_step": 392943, "epoch": 4734} {"train_loss": -26.52876091003418, "global_step": 392944, "epoch": 4734} {"train_loss": -26.34177017211914, "global_step": 392945, "epoch": 4734} {"train_loss": -26.400848388671875, "global_step": 392946, "epoch": 4734} {"train_loss": -26.631067276000977, "global_step": 392947, "epoch": 4734} {"train_loss": -26.934906005859375, "global_step": 392948, "epoch": 4734} {"train_loss": -26.399572372436523, "global_step": 392949, "epoch": 4734} {"train_loss": -26.5397891998291, "global_step": 392950, "epoch": 4734} {"train_loss": -26.32196617126465, "global_step": 392951, "epoch": 4734} {"train_loss": -26.601825714111328, "global_step": 392952, "epoch": 4734} {"train_loss": -26.7217960357666, "global_step": 392953, "epoch": 4734} {"train_loss": -26.730321884155273, "global_step": 392954, "epoch": 4734} {"train_loss": -26.149066925048828, "global_step": 392955, "epoch": 4734} {"train_loss": -26.2695255279541, "global_step": 392956, "epoch": 4734} {"train_loss": -26.52338218688965, "global_step": 392957, "epoch": 4734} {"train_loss": -26.335285186767578, "global_step": 392958, "epoch": 4734} {"train_loss": -26.41836929321289, "global_step": 392959, "epoch": 4734} {"train_loss": -27.109317779541016, "global_step": 392960, "epoch": 4734} {"train_loss": -26.65094566345215, "global_step": 392961, "epoch": 4734} {"train_loss": -26.556232452392578, "global_step": 392962, "epoch": 4734} {"train_loss": -26.620527267456055, "global_step": 392963, "epoch": 4734} {"train_loss": -26.425642013549805, "global_step": 392964, "epoch": 4734} {"train_loss": -26.859968185424805, "global_step": 392965, "epoch": 4734} {"train_loss": -26.475269317626953, "global_step": 392966, "epoch": 4734} {"train_loss": -26.695999145507812, "global_step": 392967, "epoch": 4734} {"train_loss": -26.379663467407227, "global_step": 392968, "epoch": 4734} {"train_loss": -26.69514274597168, "global_step": 392969, "epoch": 4734} {"train_loss": -26.696073532104492, "global_step": 392970, "epoch": 4734} {"train_loss": -26.688190460205078, "global_step": 392971, "epoch": 4734} {"train_loss": -26.529165267944336, "global_step": 392972, "epoch": 4734} {"train_loss": -26.855548858642578, "global_step": 392973, "epoch": 4734} {"train_loss": -26.520811080932617, "global_step": 392974, "epoch": 4734} {"train_loss": -26.59004020690918, "global_step": 392975, "epoch": 4734} {"train_loss": -26.624387741088867, "global_step": 392976, "epoch": 4734} {"train_loss": -26.636816024780273, "global_step": 392977, "epoch": 4734} {"train_loss": -26.565168380737305, "global_step": 392978, "epoch": 4734} {"train_loss": -26.371984481811523, "global_step": 392979, "epoch": 4734} {"train_loss": -25.8260555267334, "global_step": 392980, "epoch": 4734} {"train_loss": -25.756134033203125, "global_step": 392981, "epoch": 4734} {"train_loss": -25.899677276611328, "global_step": 392982, "epoch": 4734} {"train_loss": -26.502185821533203, "global_step": 392983, "epoch": 4734} {"train_loss": -26.301740646362305, "global_step": 392984, "epoch": 4734} {"train_loss": -26.802753448486328, "global_step": 392985, "epoch": 4734} {"train_loss": -27.002761840820312, "global_step": 392986, "epoch": 4734} {"train_loss": -26.91798210144043, "global_step": 392987, "epoch": 4734} {"train_loss": -26.428335189819336, "global_step": 392988, "epoch": 4734} {"train_loss": -26.44059181213379, "global_step": 392989, "epoch": 4734} {"train_loss": -26.53253173828125, "global_step": 392990, "epoch": 4734} {"train_loss": -26.670461654663086, "global_step": 392991, "epoch": 4734} {"train_loss": -26.45022964477539, "global_step": 392992, "epoch": 4734} {"train_loss": -26.3445987701416, "global_step": 392993, "epoch": 4734} {"train_loss": -26.504926681518555, "global_step": 392994, "epoch": 4734} {"train_loss": -26.409040451049805, "global_step": 392995, "epoch": 4734} {"train_loss": -26.612268447875977, "global_step": 392996, "epoch": 4734} {"train_loss": -26.414587020874023, "global_step": 392997, "epoch": 4734} {"train_loss": -26.65537452697754, "global_step": 392998, "epoch": 4734} {"train_loss": -26.1372127532959, "global_step": 392999, "epoch": 4734} {"train_loss": -26.594202041625977, "global_step": 393000, "epoch": 4734} {"train_loss": -26.236862182617188, "global_step": 393001, "epoch": 4734} {"train_loss": -26.178930282592773, "global_step": 393002, "epoch": 4734} {"train_loss": -26.77219009399414, "global_step": 393003, "epoch": 4734} {"train_loss": -26.493402618959724, "global_step": 393004, "epoch": 4734, "val_loss": 6631223.0} {"train_loss": -25.619348526000977, "global_step": 393005, "epoch": 4735} {"train_loss": -25.550878524780273, "global_step": 393006, "epoch": 4735} {"train_loss": -24.933584213256836, "global_step": 393007, "epoch": 4735} {"train_loss": -25.303205490112305, "global_step": 393008, "epoch": 4735} {"train_loss": -25.517194747924805, "global_step": 393009, "epoch": 4735} {"train_loss": -26.40370750427246, "global_step": 393010, "epoch": 4735} {"train_loss": -25.795434951782227, "global_step": 393011, "epoch": 4735} {"train_loss": -26.212757110595703, "global_step": 393012, "epoch": 4735} {"train_loss": -25.54120635986328, "global_step": 393013, "epoch": 4735} {"train_loss": -26.26435661315918, "global_step": 393014, "epoch": 4735} {"train_loss": -25.66770362854004, "global_step": 393015, "epoch": 4735} {"train_loss": -26.158782958984375, "global_step": 393016, "epoch": 4735} {"train_loss": -26.154870986938477, "global_step": 393017, "epoch": 4735} {"train_loss": -26.23463249206543, "global_step": 393018, "epoch": 4735} {"train_loss": -26.016210556030273, "global_step": 393019, "epoch": 4735} {"train_loss": -26.11026382446289, "global_step": 393020, "epoch": 4735} {"train_loss": -25.771930694580078, "global_step": 393021, "epoch": 4735} {"train_loss": -26.076141357421875, "global_step": 393022, "epoch": 4735} {"train_loss": -26.405969619750977, "global_step": 393023, "epoch": 4735} {"train_loss": -25.98807144165039, "global_step": 393024, "epoch": 4735} {"train_loss": -26.34596824645996, "global_step": 393025, "epoch": 4735} {"train_loss": -26.354862213134766, "global_step": 393026, "epoch": 4735} {"train_loss": -26.244314193725586, "global_step": 393027, "epoch": 4735} {"train_loss": -26.21430015563965, "global_step": 393028, "epoch": 4735} {"train_loss": -25.920795440673828, "global_step": 393029, "epoch": 4735} {"train_loss": -26.089014053344727, "global_step": 393030, "epoch": 4735} {"train_loss": -26.2875919342041, "global_step": 393031, "epoch": 4735} {"train_loss": -26.297321319580078, "global_step": 393032, "epoch": 4735} {"train_loss": -26.254077911376953, "global_step": 393033, "epoch": 4735} {"train_loss": -26.69028663635254, "global_step": 393034, "epoch": 4735} {"train_loss": -26.485700607299805, "global_step": 393035, "epoch": 4735} {"train_loss": -26.375, "global_step": 393036, "epoch": 4735} {"train_loss": -26.21860122680664, "global_step": 393037, "epoch": 4735} {"train_loss": -26.602771759033203, "global_step": 393038, "epoch": 4735} {"train_loss": -26.86237144470215, "global_step": 393039, "epoch": 4735} {"train_loss": -26.6853084564209, "global_step": 393040, "epoch": 4735} {"train_loss": -26.692584991455078, "global_step": 393041, "epoch": 4735} {"train_loss": -26.644302368164062, "global_step": 393042, "epoch": 4735} {"train_loss": -26.554014205932617, "global_step": 393043, "epoch": 4735} {"train_loss": -26.581134796142578, "global_step": 393044, "epoch": 4735} {"train_loss": -26.915868759155273, "global_step": 393045, "epoch": 4735} {"train_loss": -26.713825225830078, "global_step": 393046, "epoch": 4735} {"train_loss": -26.662595748901367, "global_step": 393047, "epoch": 4735} {"train_loss": -26.651880264282227, "global_step": 393048, "epoch": 4735} {"train_loss": -26.808929443359375, "global_step": 393049, "epoch": 4735} {"train_loss": -26.957077026367188, "global_step": 393050, "epoch": 4735} {"train_loss": -26.67559242248535, "global_step": 393051, "epoch": 4735} {"train_loss": -26.92502212524414, "global_step": 393052, "epoch": 4735} {"train_loss": -26.770910263061523, "global_step": 393053, "epoch": 4735} {"train_loss": -26.353734970092773, "global_step": 393054, "epoch": 4735} {"train_loss": -26.683074951171875, "global_step": 393055, "epoch": 4735} {"train_loss": -26.781646728515625, "global_step": 393056, "epoch": 4735} {"train_loss": -26.853015899658203, "global_step": 393057, "epoch": 4735} {"train_loss": -26.729049682617188, "global_step": 393058, "epoch": 4735} {"train_loss": -26.813608169555664, "global_step": 393059, "epoch": 4735} {"train_loss": -26.9503173828125, "global_step": 393060, "epoch": 4735} {"train_loss": -26.9278621673584, "global_step": 393061, "epoch": 4735} {"train_loss": -26.799671173095703, "global_step": 393062, "epoch": 4735} {"train_loss": -26.674238204956055, "global_step": 393063, "epoch": 4735} {"train_loss": -26.652774810791016, "global_step": 393064, "epoch": 4735} {"train_loss": -26.464670181274414, "global_step": 393065, "epoch": 4735} {"train_loss": -25.935623168945312, "global_step": 393066, "epoch": 4735} {"train_loss": -25.80763053894043, "global_step": 393067, "epoch": 4735} {"train_loss": -25.172880172729492, "global_step": 393068, "epoch": 4735} {"train_loss": -26.400415420532227, "global_step": 393069, "epoch": 4735} {"train_loss": -26.297449111938477, "global_step": 393070, "epoch": 4735} {"train_loss": -26.101877212524414, "global_step": 393071, "epoch": 4735} {"train_loss": -25.868505477905273, "global_step": 393072, "epoch": 4735} {"train_loss": -26.016345977783203, "global_step": 393073, "epoch": 4735} {"train_loss": -26.244277954101562, "global_step": 393074, "epoch": 4735} {"train_loss": -26.4420223236084, "global_step": 393075, "epoch": 4735} {"train_loss": -26.3638916015625, "global_step": 393076, "epoch": 4735} {"train_loss": -25.871679306030273, "global_step": 393077, "epoch": 4735} {"train_loss": -26.30377197265625, "global_step": 393078, "epoch": 4735} {"train_loss": -26.4976749420166, "global_step": 393079, "epoch": 4735} {"train_loss": -26.497602462768555, "global_step": 393080, "epoch": 4735} {"train_loss": -26.393903732299805, "global_step": 393081, "epoch": 4735} {"train_loss": -26.49462890625, "global_step": 393082, "epoch": 4735} {"train_loss": -26.372522354125977, "global_step": 393083, "epoch": 4735} {"train_loss": -26.318603515625, "global_step": 393084, "epoch": 4735} {"train_loss": -26.752737045288086, "global_step": 393085, "epoch": 4735} {"train_loss": -26.442895889282227, "global_step": 393086, "epoch": 4735} {"train_loss": -26.31051456497376, "global_step": 393087, "epoch": 4735, "val_loss": 6644944.0} {"train_loss": -26.212799072265625, "global_step": 393088, "epoch": 4736} {"train_loss": -25.818830490112305, "global_step": 393089, "epoch": 4736} {"train_loss": -25.964862823486328, "global_step": 393090, "epoch": 4736} {"train_loss": -25.903051376342773, "global_step": 393091, "epoch": 4736} {"train_loss": -26.07099723815918, "global_step": 393092, "epoch": 4736} {"train_loss": -26.5013484954834, "global_step": 393093, "epoch": 4736} {"train_loss": -26.394224166870117, "global_step": 393094, "epoch": 4736} {"train_loss": -26.2756290435791, "global_step": 393095, "epoch": 4736} {"train_loss": -26.54208755493164, "global_step": 393096, "epoch": 4736} {"train_loss": -26.30206298828125, "global_step": 393097, "epoch": 4736} {"train_loss": -26.413381576538086, "global_step": 393098, "epoch": 4736} {"train_loss": -26.563528060913086, "global_step": 393099, "epoch": 4736} {"train_loss": -27.013397216796875, "global_step": 393100, "epoch": 4736} {"train_loss": -26.545461654663086, "global_step": 393101, "epoch": 4736} {"train_loss": -26.66943359375, "global_step": 393102, "epoch": 4736} {"train_loss": -26.457136154174805, "global_step": 393103, "epoch": 4736} {"train_loss": -26.816476821899414, "global_step": 393104, "epoch": 4736} {"train_loss": -26.778791427612305, "global_step": 393105, "epoch": 4736} {"train_loss": -26.59364891052246, "global_step": 393106, "epoch": 4736} {"train_loss": -26.352094650268555, "global_step": 393107, "epoch": 4736} {"train_loss": -26.293380737304688, "global_step": 393108, "epoch": 4736} {"train_loss": -26.69097328186035, "global_step": 393109, "epoch": 4736} {"train_loss": -26.343473434448242, "global_step": 393110, "epoch": 4736} {"train_loss": -26.493030548095703, "global_step": 393111, "epoch": 4736} {"train_loss": -26.32282829284668, "global_step": 393112, "epoch": 4736} {"train_loss": -26.555017471313477, "global_step": 393113, "epoch": 4736} {"train_loss": -26.492406845092773, "global_step": 393114, "epoch": 4736} {"train_loss": -26.771284103393555, "global_step": 393115, "epoch": 4736} {"train_loss": -26.432050704956055, "global_step": 393116, "epoch": 4736} {"train_loss": -26.64910316467285, "global_step": 393117, "epoch": 4736} {"train_loss": -26.802753448486328, "global_step": 393118, "epoch": 4736} {"train_loss": -26.739887237548828, "global_step": 393119, "epoch": 4736} {"train_loss": -27.159683227539062, "global_step": 393120, "epoch": 4736} {"train_loss": -26.47248649597168, "global_step": 393121, "epoch": 4736} {"train_loss": -26.776391983032227, "global_step": 393122, "epoch": 4736} {"train_loss": -26.606006622314453, "global_step": 393123, "epoch": 4736} {"train_loss": -27.0404052734375, "global_step": 393124, "epoch": 4736} {"train_loss": -26.9213924407959, "global_step": 393125, "epoch": 4736} {"train_loss": -26.76142692565918, "global_step": 393126, "epoch": 4736} {"train_loss": -26.73141860961914, "global_step": 393127, "epoch": 4736} {"train_loss": -26.48673439025879, "global_step": 393128, "epoch": 4736} {"train_loss": -26.635089874267578, "global_step": 393129, "epoch": 4736} {"train_loss": -26.134984970092773, "global_step": 393130, "epoch": 4736} {"train_loss": -26.23516273498535, "global_step": 393131, "epoch": 4736} {"train_loss": -26.02387046813965, "global_step": 393132, "epoch": 4736} {"train_loss": -26.49604606628418, "global_step": 393133, "epoch": 4736} {"train_loss": -26.54096794128418, "global_step": 393134, "epoch": 4736} {"train_loss": -26.09737205505371, "global_step": 393135, "epoch": 4736} {"train_loss": -26.056509017944336, "global_step": 393136, "epoch": 4736} {"train_loss": -26.44881248474121, "global_step": 393137, "epoch": 4736} {"train_loss": -26.418195724487305, "global_step": 393138, "epoch": 4736} {"train_loss": -26.18916130065918, "global_step": 393139, "epoch": 4736} {"train_loss": -26.2697696685791, "global_step": 393140, "epoch": 4736} {"train_loss": -25.988672256469727, "global_step": 393141, "epoch": 4736} {"train_loss": -26.19040298461914, "global_step": 393142, "epoch": 4736} {"train_loss": -26.1262149810791, "global_step": 393143, "epoch": 4736} {"train_loss": -26.560596466064453, "global_step": 393144, "epoch": 4736} {"train_loss": -26.639474868774414, "global_step": 393145, "epoch": 4736} {"train_loss": -26.4343318939209, "global_step": 393146, "epoch": 4736} {"train_loss": -26.56096839904785, "global_step": 393147, "epoch": 4736} {"train_loss": -26.5880126953125, "global_step": 393148, "epoch": 4736} {"train_loss": -26.552276611328125, "global_step": 393149, "epoch": 4736} {"train_loss": -26.541507720947266, "global_step": 393150, "epoch": 4736} {"train_loss": -26.702911376953125, "global_step": 393151, "epoch": 4736} {"train_loss": -26.438297271728516, "global_step": 393152, "epoch": 4736} {"train_loss": -26.67647361755371, "global_step": 393153, "epoch": 4736} {"train_loss": -26.671295166015625, "global_step": 393154, "epoch": 4736} {"train_loss": -26.569583892822266, "global_step": 393155, "epoch": 4736} {"train_loss": -26.35188102722168, "global_step": 393156, "epoch": 4736} {"train_loss": -26.519031524658203, "global_step": 393157, "epoch": 4736} {"train_loss": -26.449567794799805, "global_step": 393158, "epoch": 4736} {"train_loss": -26.68410301208496, "global_step": 393159, "epoch": 4736} {"train_loss": -26.453460693359375, "global_step": 393160, "epoch": 4736} {"train_loss": -26.85733413696289, "global_step": 393161, "epoch": 4736} {"train_loss": -26.695941925048828, "global_step": 393162, "epoch": 4736} {"train_loss": -26.63270378112793, "global_step": 393163, "epoch": 4736} {"train_loss": -26.80805778503418, "global_step": 393164, "epoch": 4736} {"train_loss": -26.448673248291016, "global_step": 393165, "epoch": 4736} {"train_loss": -26.70722770690918, "global_step": 393166, "epoch": 4736} {"train_loss": -26.92888832092285, "global_step": 393167, "epoch": 4736} {"train_loss": -26.53858757019043, "global_step": 393168, "epoch": 4736} {"train_loss": -26.806110382080078, "global_step": 393169, "epoch": 4736} {"train_loss": -26.51891733652138, "global_step": 393170, "epoch": 4736, "val_loss": 6601937.0} {"train_loss": -25.924036026000977, "global_step": 393171, "epoch": 4737} {"train_loss": -24.77512550354004, "global_step": 393172, "epoch": 4737} {"train_loss": -24.112693786621094, "global_step": 393173, "epoch": 4737} {"train_loss": -25.098535537719727, "global_step": 393174, "epoch": 4737} {"train_loss": -26.094879150390625, "global_step": 393175, "epoch": 4737} {"train_loss": -25.069854736328125, "global_step": 393176, "epoch": 4737} {"train_loss": -25.470468521118164, "global_step": 393177, "epoch": 4737} {"train_loss": -25.76810073852539, "global_step": 393178, "epoch": 4737} {"train_loss": -25.733911514282227, "global_step": 393179, "epoch": 4737} {"train_loss": -25.562475204467773, "global_step": 393180, "epoch": 4737} {"train_loss": -25.734882354736328, "global_step": 393181, "epoch": 4737} {"train_loss": -26.032751083374023, "global_step": 393182, "epoch": 4737} {"train_loss": -25.98615074157715, "global_step": 393183, "epoch": 4737} {"train_loss": -25.813817977905273, "global_step": 393184, "epoch": 4737} {"train_loss": -25.63972282409668, "global_step": 393185, "epoch": 4737} {"train_loss": -26.337203979492188, "global_step": 393186, "epoch": 4737} {"train_loss": -25.593305587768555, "global_step": 393187, "epoch": 4737} {"train_loss": -26.264053344726562, "global_step": 393188, "epoch": 4737} {"train_loss": -25.920446395874023, "global_step": 393189, "epoch": 4737} {"train_loss": -25.768884658813477, "global_step": 393190, "epoch": 4737} {"train_loss": -25.597232818603516, "global_step": 393191, "epoch": 4737} {"train_loss": -26.06231117248535, "global_step": 393192, "epoch": 4737} {"train_loss": -25.992767333984375, "global_step": 393193, "epoch": 4737} {"train_loss": -26.173297882080078, "global_step": 393194, "epoch": 4737} {"train_loss": -26.0515079498291, "global_step": 393195, "epoch": 4737} {"train_loss": -26.381017684936523, "global_step": 393196, "epoch": 4737} {"train_loss": -26.12005043029785, "global_step": 393197, "epoch": 4737} {"train_loss": -26.262800216674805, "global_step": 393198, "epoch": 4737} {"train_loss": -26.01959800720215, "global_step": 393199, "epoch": 4737} {"train_loss": -26.209613800048828, "global_step": 393200, "epoch": 4737} {"train_loss": -26.25127601623535, "global_step": 393201, "epoch": 4737} {"train_loss": -26.397937774658203, "global_step": 393202, "epoch": 4737} {"train_loss": -26.45454216003418, "global_step": 393203, "epoch": 4737} {"train_loss": -26.319318771362305, "global_step": 393204, "epoch": 4737} {"train_loss": -26.18212890625, "global_step": 393205, "epoch": 4737} {"train_loss": -26.514404296875, "global_step": 393206, "epoch": 4737} {"train_loss": -26.77870750427246, "global_step": 393207, "epoch": 4737} {"train_loss": -26.5699462890625, "global_step": 393208, "epoch": 4737} {"train_loss": -26.42997169494629, "global_step": 393209, "epoch": 4737} {"train_loss": -26.607229232788086, "global_step": 393210, "epoch": 4737} {"train_loss": -26.433012008666992, "global_step": 393211, "epoch": 4737} {"train_loss": -26.534687042236328, "global_step": 393212, "epoch": 4737} {"train_loss": -26.678730010986328, "global_step": 393213, "epoch": 4737} {"train_loss": -26.640226364135742, "global_step": 393214, "epoch": 4737} {"train_loss": -26.681516647338867, "global_step": 393215, "epoch": 4737} {"train_loss": -26.638784408569336, "global_step": 393216, "epoch": 4737} {"train_loss": -26.50433349609375, "global_step": 393217, "epoch": 4737} {"train_loss": -26.668140411376953, "global_step": 393218, "epoch": 4737} {"train_loss": -26.531646728515625, "global_step": 393219, "epoch": 4737} {"train_loss": -26.6160888671875, "global_step": 393220, "epoch": 4737} {"train_loss": -26.35748291015625, "global_step": 393221, "epoch": 4737} {"train_loss": -26.24336051940918, "global_step": 393222, "epoch": 4737} {"train_loss": -26.5506591796875, "global_step": 393223, "epoch": 4737} {"train_loss": -26.69166374206543, "global_step": 393224, "epoch": 4737} {"train_loss": -26.557214736938477, "global_step": 393225, "epoch": 4737} {"train_loss": -26.75732421875, "global_step": 393226, "epoch": 4737} {"train_loss": -26.6356143951416, "global_step": 393227, "epoch": 4737} {"train_loss": -26.561384201049805, "global_step": 393228, "epoch": 4737} {"train_loss": -26.2496337890625, "global_step": 393229, "epoch": 4737} {"train_loss": -26.367618560791016, "global_step": 393230, "epoch": 4737} {"train_loss": -26.7265567779541, "global_step": 393231, "epoch": 4737} {"train_loss": -26.828657150268555, "global_step": 393232, "epoch": 4737} {"train_loss": -26.664005279541016, "global_step": 393233, "epoch": 4737} {"train_loss": -26.624292373657227, "global_step": 393234, "epoch": 4737} {"train_loss": -26.706562042236328, "global_step": 393235, "epoch": 4737} {"train_loss": -26.43979835510254, "global_step": 393236, "epoch": 4737} {"train_loss": -26.551456451416016, "global_step": 393237, "epoch": 4737} {"train_loss": -26.678354263305664, "global_step": 393238, "epoch": 4737} {"train_loss": -26.584985733032227, "global_step": 393239, "epoch": 4737} {"train_loss": -27.202417373657227, "global_step": 393240, "epoch": 4737} {"train_loss": -27.006921768188477, "global_step": 393241, "epoch": 4737} {"train_loss": -26.757461547851562, "global_step": 393242, "epoch": 4737} {"train_loss": -26.971027374267578, "global_step": 393243, "epoch": 4737} {"train_loss": -26.978717803955078, "global_step": 393244, "epoch": 4737} {"train_loss": -26.638288497924805, "global_step": 393245, "epoch": 4737} {"train_loss": -26.512744903564453, "global_step": 393246, "epoch": 4737} {"train_loss": -26.895605087280273, "global_step": 393247, "epoch": 4737} {"train_loss": -26.620519638061523, "global_step": 393248, "epoch": 4737} {"train_loss": -26.597076416015625, "global_step": 393249, "epoch": 4737} {"train_loss": -26.326858520507812, "global_step": 393250, "epoch": 4737} {"train_loss": -26.647510528564453, "global_step": 393251, "epoch": 4737} {"train_loss": -26.001386642456055, "global_step": 393252, "epoch": 4737} {"train_loss": -26.274583839508423, "global_step": 393253, "epoch": 4737, "val_loss": 6628864.0} {"train_loss": -25.4014949798584, "global_step": 393254, "epoch": 4738} {"train_loss": -25.10114288330078, "global_step": 393255, "epoch": 4738} {"train_loss": -26.181781768798828, "global_step": 393256, "epoch": 4738} {"train_loss": -25.799829483032227, "global_step": 393257, "epoch": 4738} {"train_loss": -25.91904640197754, "global_step": 393258, "epoch": 4738} {"train_loss": -25.874292373657227, "global_step": 393259, "epoch": 4738} {"train_loss": -26.08770179748535, "global_step": 393260, "epoch": 4738} {"train_loss": -25.682058334350586, "global_step": 393261, "epoch": 4738} {"train_loss": -26.374853134155273, "global_step": 393262, "epoch": 4738} {"train_loss": -25.95169448852539, "global_step": 393263, "epoch": 4738} {"train_loss": -26.195280075073242, "global_step": 393264, "epoch": 4738} {"train_loss": -26.0135555267334, "global_step": 393265, "epoch": 4738} {"train_loss": -26.08148765563965, "global_step": 393266, "epoch": 4738} {"train_loss": -26.305036544799805, "global_step": 393267, "epoch": 4738} {"train_loss": -26.47878074645996, "global_step": 393268, "epoch": 4738} {"train_loss": -26.316431045532227, "global_step": 393269, "epoch": 4738} {"train_loss": -26.095670700073242, "global_step": 393270, "epoch": 4738} {"train_loss": -26.45759391784668, "global_step": 393271, "epoch": 4738} {"train_loss": -26.184675216674805, "global_step": 393272, "epoch": 4738} {"train_loss": -26.356496810913086, "global_step": 393273, "epoch": 4738} {"train_loss": -26.51824951171875, "global_step": 393274, "epoch": 4738} {"train_loss": -26.566457748413086, "global_step": 393275, "epoch": 4738} {"train_loss": -26.399580001831055, "global_step": 393276, "epoch": 4738} {"train_loss": -26.392358779907227, "global_step": 393277, "epoch": 4738} {"train_loss": -26.45111656188965, "global_step": 393278, "epoch": 4738} {"train_loss": -26.30719566345215, "global_step": 393279, "epoch": 4738} {"train_loss": -26.276874542236328, "global_step": 393280, "epoch": 4738} {"train_loss": -26.690078735351562, "global_step": 393281, "epoch": 4738} {"train_loss": -26.40650749206543, "global_step": 393282, "epoch": 4738} {"train_loss": -26.575082778930664, "global_step": 393283, "epoch": 4738} {"train_loss": -26.485034942626953, "global_step": 393284, "epoch": 4738} {"train_loss": -26.36789321899414, "global_step": 393285, "epoch": 4738} {"train_loss": -26.2849178314209, "global_step": 393286, "epoch": 4738} {"train_loss": -26.610349655151367, "global_step": 393287, "epoch": 4738} {"train_loss": -26.176786422729492, "global_step": 393288, "epoch": 4738} {"train_loss": -26.694843292236328, "global_step": 393289, "epoch": 4738} {"train_loss": -26.32563591003418, "global_step": 393290, "epoch": 4738} {"train_loss": -26.40236473083496, "global_step": 393291, "epoch": 4738} {"train_loss": -26.252124786376953, "global_step": 393292, "epoch": 4738} {"train_loss": -26.725309371948242, "global_step": 393293, "epoch": 4738} {"train_loss": -26.66615104675293, "global_step": 393294, "epoch": 4738} {"train_loss": -26.787464141845703, "global_step": 393295, "epoch": 4738} {"train_loss": -26.886066436767578, "global_step": 393296, "epoch": 4738} {"train_loss": -26.759119033813477, "global_step": 393297, "epoch": 4738} {"train_loss": -26.966894149780273, "global_step": 393298, "epoch": 4738} {"train_loss": -26.746122360229492, "global_step": 393299, "epoch": 4738} {"train_loss": -26.46405601501465, "global_step": 393300, "epoch": 4738} {"train_loss": -26.2889461517334, "global_step": 393301, "epoch": 4738} {"train_loss": -26.58013343811035, "global_step": 393302, "epoch": 4738} {"train_loss": -26.54837417602539, "global_step": 393303, "epoch": 4738} {"train_loss": -26.92116355895996, "global_step": 393304, "epoch": 4738} {"train_loss": -26.6521053314209, "global_step": 393305, "epoch": 4738} {"train_loss": -26.75604820251465, "global_step": 393306, "epoch": 4738} {"train_loss": -26.826486587524414, "global_step": 393307, "epoch": 4738} {"train_loss": -26.847732543945312, "global_step": 393308, "epoch": 4738} {"train_loss": -26.406726837158203, "global_step": 393309, "epoch": 4738} {"train_loss": -26.76889419555664, "global_step": 393310, "epoch": 4738} {"train_loss": -26.532400131225586, "global_step": 393311, "epoch": 4738} {"train_loss": -26.701507568359375, "global_step": 393312, "epoch": 4738} {"train_loss": -26.48626708984375, "global_step": 393313, "epoch": 4738} {"train_loss": -26.875411987304688, "global_step": 393314, "epoch": 4738} {"train_loss": -26.74972915649414, "global_step": 393315, "epoch": 4738} {"train_loss": -26.51336669921875, "global_step": 393316, "epoch": 4738} {"train_loss": -26.77143669128418, "global_step": 393317, "epoch": 4738} {"train_loss": -26.647083282470703, "global_step": 393318, "epoch": 4738} {"train_loss": -26.741317749023438, "global_step": 393319, "epoch": 4738} {"train_loss": -26.609039306640625, "global_step": 393320, "epoch": 4738} {"train_loss": -26.56516456604004, "global_step": 393321, "epoch": 4738} {"train_loss": -26.3375186920166, "global_step": 393322, "epoch": 4738} {"train_loss": -26.10286521911621, "global_step": 393323, "epoch": 4738} {"train_loss": -26.796844482421875, "global_step": 393324, "epoch": 4738} {"train_loss": -26.379926681518555, "global_step": 393325, "epoch": 4738} {"train_loss": -26.52665138244629, "global_step": 393326, "epoch": 4738} {"train_loss": -26.350616455078125, "global_step": 393327, "epoch": 4738} {"train_loss": -26.626758575439453, "global_step": 393328, "epoch": 4738} {"train_loss": -26.81646728515625, "global_step": 393329, "epoch": 4738} {"train_loss": -26.17203712463379, "global_step": 393330, "epoch": 4738} {"train_loss": -26.5085506439209, "global_step": 393331, "epoch": 4738} {"train_loss": -26.174896240234375, "global_step": 393332, "epoch": 4738} {"train_loss": -26.894947052001953, "global_step": 393333, "epoch": 4738} {"train_loss": -26.797651290893555, "global_step": 393334, "epoch": 4738} {"train_loss": -26.562421798706055, "global_step": 393335, "epoch": 4738} {"train_loss": -26.444668252784087, "global_step": 393336, "epoch": 4738, "val_loss": 6706522.0} {"train_loss": -26.065397262573242, "global_step": 393337, "epoch": 4739} {"train_loss": -26.72908592224121, "global_step": 393338, "epoch": 4739} {"train_loss": -26.382009506225586, "global_step": 393339, "epoch": 4739} {"train_loss": -25.838590621948242, "global_step": 393340, "epoch": 4739} {"train_loss": -25.760648727416992, "global_step": 393341, "epoch": 4739} {"train_loss": -26.058679580688477, "global_step": 393342, "epoch": 4739} {"train_loss": -25.598268508911133, "global_step": 393343, "epoch": 4739} {"train_loss": -26.190948486328125, "global_step": 393344, "epoch": 4739} {"train_loss": -26.051746368408203, "global_step": 393345, "epoch": 4739} {"train_loss": -26.0316104888916, "global_step": 393346, "epoch": 4739} {"train_loss": -25.741748809814453, "global_step": 393347, "epoch": 4739} {"train_loss": -25.760025024414062, "global_step": 393348, "epoch": 4739} {"train_loss": -26.130651473999023, "global_step": 393349, "epoch": 4739} {"train_loss": -26.549942016601562, "global_step": 393350, "epoch": 4739} {"train_loss": -25.6555233001709, "global_step": 393351, "epoch": 4739} {"train_loss": -26.02481460571289, "global_step": 393352, "epoch": 4739} {"train_loss": -26.38275146484375, "global_step": 393353, "epoch": 4739} {"train_loss": -26.28571891784668, "global_step": 393354, "epoch": 4739} {"train_loss": -26.639734268188477, "global_step": 393355, "epoch": 4739} {"train_loss": -26.52447509765625, "global_step": 393356, "epoch": 4739} {"train_loss": -26.399091720581055, "global_step": 393357, "epoch": 4739} {"train_loss": -26.48993492126465, "global_step": 393358, "epoch": 4739} {"train_loss": -26.45684814453125, "global_step": 393359, "epoch": 4739} {"train_loss": -26.336267471313477, "global_step": 393360, "epoch": 4739} {"train_loss": -26.567462921142578, "global_step": 393361, "epoch": 4739} {"train_loss": -26.41373062133789, "global_step": 393362, "epoch": 4739} {"train_loss": -26.418033599853516, "global_step": 393363, "epoch": 4739} {"train_loss": -26.479766845703125, "global_step": 393364, "epoch": 4739} {"train_loss": -26.262897491455078, "global_step": 393365, "epoch": 4739} {"train_loss": -26.643293380737305, "global_step": 393366, "epoch": 4739} {"train_loss": -26.258283615112305, "global_step": 393367, "epoch": 4739} {"train_loss": -26.524438858032227, "global_step": 393368, "epoch": 4739} {"train_loss": -26.620969772338867, "global_step": 393369, "epoch": 4739} {"train_loss": -26.525617599487305, "global_step": 393370, "epoch": 4739} {"train_loss": -26.705799102783203, "global_step": 393371, "epoch": 4739} {"train_loss": -26.222736358642578, "global_step": 393372, "epoch": 4739} {"train_loss": -26.497547149658203, "global_step": 393373, "epoch": 4739} {"train_loss": -26.645191192626953, "global_step": 393374, "epoch": 4739} {"train_loss": -26.349517822265625, "global_step": 393375, "epoch": 4739} {"train_loss": -26.737628936767578, "global_step": 393376, "epoch": 4739} {"train_loss": -26.712848663330078, "global_step": 393377, "epoch": 4739} {"train_loss": -26.465198516845703, "global_step": 393378, "epoch": 4739} {"train_loss": -26.488004684448242, "global_step": 393379, "epoch": 4739} {"train_loss": -26.431303024291992, "global_step": 393380, "epoch": 4739} {"train_loss": -26.381589889526367, "global_step": 393381, "epoch": 4739} {"train_loss": -26.462682723999023, "global_step": 393382, "epoch": 4739} {"train_loss": -26.540775299072266, "global_step": 393383, "epoch": 4739} {"train_loss": -27.03632164001465, "global_step": 393384, "epoch": 4739} {"train_loss": -26.537267684936523, "global_step": 393385, "epoch": 4739} {"train_loss": -26.6474666595459, "global_step": 393386, "epoch": 4739} {"train_loss": -26.726245880126953, "global_step": 393387, "epoch": 4739} {"train_loss": -26.91914939880371, "global_step": 393388, "epoch": 4739} {"train_loss": -26.9252872467041, "global_step": 393389, "epoch": 4739} {"train_loss": -27.02723503112793, "global_step": 393390, "epoch": 4739} {"train_loss": -27.050748825073242, "global_step": 393391, "epoch": 4739} {"train_loss": -26.732954025268555, "global_step": 393392, "epoch": 4739} {"train_loss": -27.13204002380371, "global_step": 393393, "epoch": 4739} {"train_loss": -26.63245964050293, "global_step": 393394, "epoch": 4739} {"train_loss": -26.655614852905273, "global_step": 393395, "epoch": 4739} {"train_loss": -26.861236572265625, "global_step": 393396, "epoch": 4739} {"train_loss": -26.638601303100586, "global_step": 393397, "epoch": 4739} {"train_loss": -27.01874351501465, "global_step": 393398, "epoch": 4739} {"train_loss": -26.567678451538086, "global_step": 393399, "epoch": 4739} {"train_loss": -26.914459228515625, "global_step": 393400, "epoch": 4739} {"train_loss": -26.75068473815918, "global_step": 393401, "epoch": 4739} {"train_loss": -26.5162410736084, "global_step": 393402, "epoch": 4739} {"train_loss": -26.876184463500977, "global_step": 393403, "epoch": 4739} {"train_loss": -26.79160499572754, "global_step": 393404, "epoch": 4739} {"train_loss": -26.618576049804688, "global_step": 393405, "epoch": 4739} {"train_loss": -26.495716094970703, "global_step": 393406, "epoch": 4739} {"train_loss": -26.174482345581055, "global_step": 393407, "epoch": 4739} {"train_loss": -26.5687198638916, "global_step": 393408, "epoch": 4739} {"train_loss": -26.7020320892334, "global_step": 393409, "epoch": 4739} {"train_loss": -26.402103424072266, "global_step": 393410, "epoch": 4739} {"train_loss": -25.951642990112305, "global_step": 393411, "epoch": 4739} {"train_loss": -26.324506759643555, "global_step": 393412, "epoch": 4739} {"train_loss": -27.095733642578125, "global_step": 393413, "epoch": 4739} {"train_loss": -26.473608016967773, "global_step": 393414, "epoch": 4739} {"train_loss": -26.579198837280273, "global_step": 393415, "epoch": 4739} {"train_loss": -26.41617202758789, "global_step": 393416, "epoch": 4739} {"train_loss": -26.69050407409668, "global_step": 393417, "epoch": 4739} {"train_loss": -26.7016544342041, "global_step": 393418, "epoch": 4739} {"train_loss": -26.490812623357197, "global_step": 393419, "epoch": 4739, "val_loss": 6722541.0} {"train_loss": -25.662067413330078, "global_step": 393420, "epoch": 4740} {"train_loss": -26.11795997619629, "global_step": 393421, "epoch": 4740} {"train_loss": -26.4295597076416, "global_step": 393422, "epoch": 4740} {"train_loss": -26.36189079284668, "global_step": 393423, "epoch": 4740} {"train_loss": -26.40723991394043, "global_step": 393424, "epoch": 4740} {"train_loss": -26.145658493041992, "global_step": 393425, "epoch": 4740} {"train_loss": -26.621801376342773, "global_step": 393426, "epoch": 4740} {"train_loss": -26.283817291259766, "global_step": 393427, "epoch": 4740} {"train_loss": -26.460834503173828, "global_step": 393428, "epoch": 4740} {"train_loss": -26.90451431274414, "global_step": 393429, "epoch": 4740} {"train_loss": -26.214635848999023, "global_step": 393430, "epoch": 4740} {"train_loss": -26.2595272064209, "global_step": 393431, "epoch": 4740} {"train_loss": -26.3762264251709, "global_step": 393432, "epoch": 4740} {"train_loss": -26.307348251342773, "global_step": 393433, "epoch": 4740} {"train_loss": -26.284006118774414, "global_step": 393434, "epoch": 4740} {"train_loss": -26.43769645690918, "global_step": 393435, "epoch": 4740} {"train_loss": -26.127771377563477, "global_step": 393436, "epoch": 4740} {"train_loss": -26.7138614654541, "global_step": 393437, "epoch": 4740} {"train_loss": -26.10481071472168, "global_step": 393438, "epoch": 4740} {"train_loss": -26.289539337158203, "global_step": 393439, "epoch": 4740} {"train_loss": -26.65504264831543, "global_step": 393440, "epoch": 4740} {"train_loss": -26.385522842407227, "global_step": 393441, "epoch": 4740} {"train_loss": -26.22056007385254, "global_step": 393442, "epoch": 4740} {"train_loss": -26.424835205078125, "global_step": 393443, "epoch": 4740} {"train_loss": -26.559253692626953, "global_step": 393444, "epoch": 4740} {"train_loss": -26.485675811767578, "global_step": 393445, "epoch": 4740} {"train_loss": -26.461170196533203, "global_step": 393446, "epoch": 4740} {"train_loss": -26.61702537536621, "global_step": 393447, "epoch": 4740} {"train_loss": -26.925262451171875, "global_step": 393448, "epoch": 4740} {"train_loss": -26.467945098876953, "global_step": 393449, "epoch": 4740} {"train_loss": -26.819547653198242, "global_step": 393450, "epoch": 4740} {"train_loss": -26.85379409790039, "global_step": 393451, "epoch": 4740} {"train_loss": -27.014753341674805, "global_step": 393452, "epoch": 4740} {"train_loss": -26.485815048217773, "global_step": 393453, "epoch": 4740} {"train_loss": -27.113927841186523, "global_step": 393454, "epoch": 4740} {"train_loss": -26.458881378173828, "global_step": 393455, "epoch": 4740} {"train_loss": -26.646711349487305, "global_step": 393456, "epoch": 4740} {"train_loss": -26.660062789916992, "global_step": 393457, "epoch": 4740} {"train_loss": -26.867013931274414, "global_step": 393458, "epoch": 4740} {"train_loss": -26.810531616210938, "global_step": 393459, "epoch": 4740} {"train_loss": -26.565271377563477, "global_step": 393460, "epoch": 4740} {"train_loss": -26.60896110534668, "global_step": 393461, "epoch": 4740} {"train_loss": -26.449111938476562, "global_step": 393462, "epoch": 4740} {"train_loss": -26.929828643798828, "global_step": 393463, "epoch": 4740} {"train_loss": -26.649616241455078, "global_step": 393464, "epoch": 4740} {"train_loss": -26.80718421936035, "global_step": 393465, "epoch": 4740} {"train_loss": -26.753387451171875, "global_step": 393466, "epoch": 4740} {"train_loss": -26.616880416870117, "global_step": 393467, "epoch": 4740} {"train_loss": -26.88703727722168, "global_step": 393468, "epoch": 4740} {"train_loss": -26.62727165222168, "global_step": 393469, "epoch": 4740} {"train_loss": -26.4868221282959, "global_step": 393470, "epoch": 4740} {"train_loss": -26.687824249267578, "global_step": 393471, "epoch": 4740} {"train_loss": -26.64188003540039, "global_step": 393472, "epoch": 4740} {"train_loss": -26.53240394592285, "global_step": 393473, "epoch": 4740} {"train_loss": -26.77655029296875, "global_step": 393474, "epoch": 4740} {"train_loss": -26.268381118774414, "global_step": 393475, "epoch": 4740} {"train_loss": -26.799808502197266, "global_step": 393476, "epoch": 4740} {"train_loss": -26.468114852905273, "global_step": 393477, "epoch": 4740} {"train_loss": -27.284337997436523, "global_step": 393478, "epoch": 4740} {"train_loss": -26.147199630737305, "global_step": 393479, "epoch": 4740} {"train_loss": -26.043100357055664, "global_step": 393480, "epoch": 4740} {"train_loss": -26.148147583007812, "global_step": 393481, "epoch": 4740} {"train_loss": -26.274534225463867, "global_step": 393482, "epoch": 4740} {"train_loss": -26.450286865234375, "global_step": 393483, "epoch": 4740} {"train_loss": -26.484399795532227, "global_step": 393484, "epoch": 4740} {"train_loss": -26.46152114868164, "global_step": 393485, "epoch": 4740} {"train_loss": -26.669675827026367, "global_step": 393486, "epoch": 4740} {"train_loss": -26.564823150634766, "global_step": 393487, "epoch": 4740} {"train_loss": -26.70393180847168, "global_step": 393488, "epoch": 4740} {"train_loss": -26.673980712890625, "global_step": 393489, "epoch": 4740} {"train_loss": -26.593835830688477, "global_step": 393490, "epoch": 4740} {"train_loss": -26.411487579345703, "global_step": 393491, "epoch": 4740} {"train_loss": -27.0118350982666, "global_step": 393492, "epoch": 4740} {"train_loss": -26.46843910217285, "global_step": 393493, "epoch": 4740} {"train_loss": -26.461774826049805, "global_step": 393494, "epoch": 4740} {"train_loss": -26.463972091674805, "global_step": 393495, "epoch": 4740} {"train_loss": -26.920629501342773, "global_step": 393496, "epoch": 4740} {"train_loss": -27.087066650390625, "global_step": 393497, "epoch": 4740} {"train_loss": -26.502655029296875, "global_step": 393498, "epoch": 4740} {"train_loss": -26.969589233398438, "global_step": 393499, "epoch": 4740} {"train_loss": -26.716413497924805, "global_step": 393500, "epoch": 4740} {"train_loss": -26.8345890045166, "global_step": 393501, "epoch": 4740} {"train_loss": -26.56150486957596, "global_step": 393502, "epoch": 4740, "val_loss": 6728117.0} {"train_loss": -26.74847984313965, "global_step": 393503, "epoch": 4741} {"train_loss": -26.29705810546875, "global_step": 393504, "epoch": 4741} {"train_loss": -25.40667152404785, "global_step": 393505, "epoch": 4741} {"train_loss": -25.555150985717773, "global_step": 393506, "epoch": 4741} {"train_loss": -25.937198638916016, "global_step": 393507, "epoch": 4741} {"train_loss": -25.07921028137207, "global_step": 393508, "epoch": 4741} {"train_loss": -25.905014038085938, "global_step": 393509, "epoch": 4741} {"train_loss": -25.452362060546875, "global_step": 393510, "epoch": 4741} {"train_loss": -25.907629013061523, "global_step": 393511, "epoch": 4741} {"train_loss": -25.872644424438477, "global_step": 393512, "epoch": 4741} {"train_loss": -26.26984214782715, "global_step": 393513, "epoch": 4741} {"train_loss": -25.821638107299805, "global_step": 393514, "epoch": 4741} {"train_loss": -26.33015251159668, "global_step": 393515, "epoch": 4741} {"train_loss": -26.33209228515625, "global_step": 393516, "epoch": 4741} {"train_loss": -26.195587158203125, "global_step": 393517, "epoch": 4741} {"train_loss": -25.9017391204834, "global_step": 393518, "epoch": 4741} {"train_loss": -25.919193267822266, "global_step": 393519, "epoch": 4741} {"train_loss": -25.95648765563965, "global_step": 393520, "epoch": 4741} {"train_loss": -26.05457878112793, "global_step": 393521, "epoch": 4741} {"train_loss": -26.231924057006836, "global_step": 393522, "epoch": 4741} {"train_loss": -26.06949234008789, "global_step": 393523, "epoch": 4741} {"train_loss": -25.858966827392578, "global_step": 393524, "epoch": 4741} {"train_loss": -26.334646224975586, "global_step": 393525, "epoch": 4741} {"train_loss": -26.186798095703125, "global_step": 393526, "epoch": 4741} {"train_loss": -26.21578025817871, "global_step": 393527, "epoch": 4741} {"train_loss": -26.496427536010742, "global_step": 393528, "epoch": 4741} {"train_loss": -26.63824462890625, "global_step": 393529, "epoch": 4741} {"train_loss": -26.32973289489746, "global_step": 393530, "epoch": 4741} {"train_loss": -26.514881134033203, "global_step": 393531, "epoch": 4741} {"train_loss": -26.4686336517334, "global_step": 393532, "epoch": 4741} {"train_loss": -26.244659423828125, "global_step": 393533, "epoch": 4741} {"train_loss": -26.414419174194336, "global_step": 393534, "epoch": 4741} {"train_loss": -26.46564292907715, "global_step": 393535, "epoch": 4741} {"train_loss": -26.47149085998535, "global_step": 393536, "epoch": 4741} {"train_loss": -26.492334365844727, "global_step": 393537, "epoch": 4741} {"train_loss": -26.571130752563477, "global_step": 393538, "epoch": 4741} {"train_loss": -26.296201705932617, "global_step": 393539, "epoch": 4741} {"train_loss": -26.60044288635254, "global_step": 393540, "epoch": 4741} {"train_loss": -26.7221736907959, "global_step": 393541, "epoch": 4741} {"train_loss": -26.708105087280273, "global_step": 393542, "epoch": 4741} {"train_loss": -26.8498592376709, "global_step": 393543, "epoch": 4741} {"train_loss": -26.81256103515625, "global_step": 393544, "epoch": 4741} {"train_loss": -26.891813278198242, "global_step": 393545, "epoch": 4741} {"train_loss": -26.749460220336914, "global_step": 393546, "epoch": 4741} {"train_loss": -26.898391723632812, "global_step": 393547, "epoch": 4741} {"train_loss": -26.573566436767578, "global_step": 393548, "epoch": 4741} {"train_loss": -26.949132919311523, "global_step": 393549, "epoch": 4741} {"train_loss": -26.717899322509766, "global_step": 393550, "epoch": 4741} {"train_loss": -26.506427764892578, "global_step": 393551, "epoch": 4741} {"train_loss": -26.218341827392578, "global_step": 393552, "epoch": 4741} {"train_loss": -26.911304473876953, "global_step": 393553, "epoch": 4741} {"train_loss": -26.812597274780273, "global_step": 393554, "epoch": 4741} {"train_loss": -26.717737197875977, "global_step": 393555, "epoch": 4741} {"train_loss": -26.485565185546875, "global_step": 393556, "epoch": 4741} {"train_loss": -26.58942985534668, "global_step": 393557, "epoch": 4741} {"train_loss": -26.592945098876953, "global_step": 393558, "epoch": 4741} {"train_loss": -26.369159698486328, "global_step": 393559, "epoch": 4741} {"train_loss": -26.590362548828125, "global_step": 393560, "epoch": 4741} {"train_loss": -26.8842716217041, "global_step": 393561, "epoch": 4741} {"train_loss": -26.309589385986328, "global_step": 393562, "epoch": 4741} {"train_loss": -26.473011016845703, "global_step": 393563, "epoch": 4741} {"train_loss": -26.83967399597168, "global_step": 393564, "epoch": 4741} {"train_loss": -26.033191680908203, "global_step": 393565, "epoch": 4741} {"train_loss": -25.8070125579834, "global_step": 393566, "epoch": 4741} {"train_loss": -24.748929977416992, "global_step": 393567, "epoch": 4741} {"train_loss": -24.183820724487305, "global_step": 393568, "epoch": 4741} {"train_loss": -25.588943481445312, "global_step": 393569, "epoch": 4741} {"train_loss": -25.339191436767578, "global_step": 393570, "epoch": 4741} {"train_loss": -25.031497955322266, "global_step": 393571, "epoch": 4741} {"train_loss": -25.67351722717285, "global_step": 393572, "epoch": 4741} {"train_loss": -25.299636840820312, "global_step": 393573, "epoch": 4741} {"train_loss": -25.948272705078125, "global_step": 393574, "epoch": 4741} {"train_loss": -25.86641502380371, "global_step": 393575, "epoch": 4741} {"train_loss": -25.807937622070312, "global_step": 393576, "epoch": 4741} {"train_loss": -26.49244499206543, "global_step": 393577, "epoch": 4741} {"train_loss": -25.89581298828125, "global_step": 393578, "epoch": 4741} {"train_loss": -26.395166397094727, "global_step": 393579, "epoch": 4741} {"train_loss": -25.582534790039062, "global_step": 393580, "epoch": 4741} {"train_loss": -25.817279815673828, "global_step": 393581, "epoch": 4741} {"train_loss": -25.976673126220703, "global_step": 393582, "epoch": 4741} {"train_loss": -26.378324508666992, "global_step": 393583, "epoch": 4741} {"train_loss": -25.8734130859375, "global_step": 393584, "epoch": 4741} {"train_loss": -26.19821031409574, "global_step": 393585, "epoch": 4741, "val_loss": 6656484.0} {"train_loss": -25.661151885986328, "global_step": 393586, "epoch": 4742} {"train_loss": -26.0433292388916, "global_step": 393587, "epoch": 4742} {"train_loss": -26.001483917236328, "global_step": 393588, "epoch": 4742} {"train_loss": -25.905536651611328, "global_step": 393589, "epoch": 4742} {"train_loss": -26.060871124267578, "global_step": 393590, "epoch": 4742} {"train_loss": -26.240842819213867, "global_step": 393591, "epoch": 4742} {"train_loss": -26.268463134765625, "global_step": 393592, "epoch": 4742} {"train_loss": -26.278961181640625, "global_step": 393593, "epoch": 4742} {"train_loss": -25.776844024658203, "global_step": 393594, "epoch": 4742} {"train_loss": -26.106449127197266, "global_step": 393595, "epoch": 4742} {"train_loss": -26.506025314331055, "global_step": 393596, "epoch": 4742} {"train_loss": -26.170902252197266, "global_step": 393597, "epoch": 4742} {"train_loss": -25.899816513061523, "global_step": 393598, "epoch": 4742} {"train_loss": -26.0419864654541, "global_step": 393599, "epoch": 4742} {"train_loss": -26.452423095703125, "global_step": 393600, "epoch": 4742} {"train_loss": -26.185333251953125, "global_step": 393601, "epoch": 4742} {"train_loss": -26.2708740234375, "global_step": 393602, "epoch": 4742} {"train_loss": -26.58295249938965, "global_step": 393603, "epoch": 4742} {"train_loss": -26.430017471313477, "global_step": 393604, "epoch": 4742} {"train_loss": -26.48148536682129, "global_step": 393605, "epoch": 4742} {"train_loss": -26.289127349853516, "global_step": 393606, "epoch": 4742} {"train_loss": -26.66206169128418, "global_step": 393607, "epoch": 4742} {"train_loss": -26.402196884155273, "global_step": 393608, "epoch": 4742} {"train_loss": -26.3198184967041, "global_step": 393609, "epoch": 4742} {"train_loss": -26.462961196899414, "global_step": 393610, "epoch": 4742} {"train_loss": -26.505462646484375, "global_step": 393611, "epoch": 4742} {"train_loss": -26.967222213745117, "global_step": 393612, "epoch": 4742} {"train_loss": -26.70904541015625, "global_step": 393613, "epoch": 4742} {"train_loss": -26.636672973632812, "global_step": 393614, "epoch": 4742} {"train_loss": -26.8023681640625, "global_step": 393615, "epoch": 4742} {"train_loss": -26.561437606811523, "global_step": 393616, "epoch": 4742} {"train_loss": -26.778329849243164, "global_step": 393617, "epoch": 4742} {"train_loss": -26.680150985717773, "global_step": 393618, "epoch": 4742} {"train_loss": -26.59617042541504, "global_step": 393619, "epoch": 4742} {"train_loss": -26.595666885375977, "global_step": 393620, "epoch": 4742} {"train_loss": -26.73163414001465, "global_step": 393621, "epoch": 4742} {"train_loss": -26.702056884765625, "global_step": 393622, "epoch": 4742} {"train_loss": -26.817468643188477, "global_step": 393623, "epoch": 4742} {"train_loss": -26.3568115234375, "global_step": 393624, "epoch": 4742} {"train_loss": -26.429187774658203, "global_step": 393625, "epoch": 4742} {"train_loss": -27.042972564697266, "global_step": 393626, "epoch": 4742} {"train_loss": -26.718433380126953, "global_step": 393627, "epoch": 4742} {"train_loss": -26.78895378112793, "global_step": 393628, "epoch": 4742} {"train_loss": -26.75140953063965, "global_step": 393629, "epoch": 4742} {"train_loss": -26.774356842041016, "global_step": 393630, "epoch": 4742} {"train_loss": -26.87420654296875, "global_step": 393631, "epoch": 4742} {"train_loss": -26.686908721923828, "global_step": 393632, "epoch": 4742} {"train_loss": -26.6809024810791, "global_step": 393633, "epoch": 4742} {"train_loss": -26.89304542541504, "global_step": 393634, "epoch": 4742} {"train_loss": -27.056415557861328, "global_step": 393635, "epoch": 4742} {"train_loss": -26.8040771484375, "global_step": 393636, "epoch": 4742} {"train_loss": -26.941604614257812, "global_step": 393637, "epoch": 4742} {"train_loss": -27.107568740844727, "global_step": 393638, "epoch": 4742} {"train_loss": -26.939172744750977, "global_step": 393639, "epoch": 4742} {"train_loss": -26.72637367248535, "global_step": 393640, "epoch": 4742} {"train_loss": -26.42453956604004, "global_step": 393641, "epoch": 4742} {"train_loss": -26.537647247314453, "global_step": 393642, "epoch": 4742} {"train_loss": -26.217687606811523, "global_step": 393643, "epoch": 4742} {"train_loss": -26.064411163330078, "global_step": 393644, "epoch": 4742} {"train_loss": -26.5739803314209, "global_step": 393645, "epoch": 4742} {"train_loss": -26.51189613342285, "global_step": 393646, "epoch": 4742} {"train_loss": -26.660755157470703, "global_step": 393647, "epoch": 4742} {"train_loss": -26.781360626220703, "global_step": 393648, "epoch": 4742} {"train_loss": -26.704608917236328, "global_step": 393649, "epoch": 4742} {"train_loss": -26.310937881469727, "global_step": 393650, "epoch": 4742} {"train_loss": -26.349863052368164, "global_step": 393651, "epoch": 4742} {"train_loss": -26.44576072692871, "global_step": 393652, "epoch": 4742} {"train_loss": -26.35849380493164, "global_step": 393653, "epoch": 4742} {"train_loss": -26.33987808227539, "global_step": 393654, "epoch": 4742} {"train_loss": -26.74183464050293, "global_step": 393655, "epoch": 4742} {"train_loss": -26.520709991455078, "global_step": 393656, "epoch": 4742} {"train_loss": -26.5607967376709, "global_step": 393657, "epoch": 4742} {"train_loss": -26.62454605102539, "global_step": 393658, "epoch": 4742} {"train_loss": -26.729345321655273, "global_step": 393659, "epoch": 4742} {"train_loss": -26.642553329467773, "global_step": 393660, "epoch": 4742} {"train_loss": -26.3480167388916, "global_step": 393661, "epoch": 4742} {"train_loss": -26.29435157775879, "global_step": 393662, "epoch": 4742} {"train_loss": -26.618305206298828, "global_step": 393663, "epoch": 4742} {"train_loss": -26.43171501159668, "global_step": 393664, "epoch": 4742} {"train_loss": -26.612445831298828, "global_step": 393665, "epoch": 4742} {"train_loss": -26.696516036987305, "global_step": 393666, "epoch": 4742} {"train_loss": -26.41095542907715, "global_step": 393667, "epoch": 4742} {"train_loss": -26.504586897700666, "global_step": 393668, "epoch": 4742, "val_loss": 6707309.0} {"train_loss": -25.754425048828125, "global_step": 393669, "epoch": 4743} {"train_loss": -25.698949813842773, "global_step": 393670, "epoch": 4743} {"train_loss": -25.8734188079834, "global_step": 393671, "epoch": 4743} {"train_loss": -25.98581314086914, "global_step": 393672, "epoch": 4743} {"train_loss": -25.732196807861328, "global_step": 393673, "epoch": 4743} {"train_loss": -25.858362197875977, "global_step": 393674, "epoch": 4743} {"train_loss": -25.979415893554688, "global_step": 393675, "epoch": 4743} {"train_loss": -26.01616859436035, "global_step": 393676, "epoch": 4743} {"train_loss": -26.375940322875977, "global_step": 393677, "epoch": 4743} {"train_loss": -26.524566650390625, "global_step": 393678, "epoch": 4743} {"train_loss": -26.003326416015625, "global_step": 393679, "epoch": 4743} {"train_loss": -26.27048683166504, "global_step": 393680, "epoch": 4743} {"train_loss": -26.458362579345703, "global_step": 393681, "epoch": 4743} {"train_loss": -26.555143356323242, "global_step": 393682, "epoch": 4743} {"train_loss": -26.18988609313965, "global_step": 393683, "epoch": 4743} {"train_loss": -26.36396598815918, "global_step": 393684, "epoch": 4743} {"train_loss": -25.795907974243164, "global_step": 393685, "epoch": 4743} {"train_loss": -26.359603881835938, "global_step": 393686, "epoch": 4743} {"train_loss": -26.285486221313477, "global_step": 393687, "epoch": 4743} {"train_loss": -26.579233169555664, "global_step": 393688, "epoch": 4743} {"train_loss": -26.245319366455078, "global_step": 393689, "epoch": 4743} {"train_loss": -26.3920955657959, "global_step": 393690, "epoch": 4743} {"train_loss": -26.2135066986084, "global_step": 393691, "epoch": 4743} {"train_loss": -25.98005485534668, "global_step": 393692, "epoch": 4743} {"train_loss": -26.4713134765625, "global_step": 393693, "epoch": 4743} {"train_loss": -26.02581214904785, "global_step": 393694, "epoch": 4743} {"train_loss": -26.29034423828125, "global_step": 393695, "epoch": 4743} {"train_loss": -26.627979278564453, "global_step": 393696, "epoch": 4743} {"train_loss": -26.5921688079834, "global_step": 393697, "epoch": 4743} {"train_loss": -26.78128433227539, "global_step": 393698, "epoch": 4743} {"train_loss": -26.462133407592773, "global_step": 393699, "epoch": 4743} {"train_loss": -26.420318603515625, "global_step": 393700, "epoch": 4743} {"train_loss": -26.51092529296875, "global_step": 393701, "epoch": 4743} {"train_loss": -26.337493896484375, "global_step": 393702, "epoch": 4743} {"train_loss": -26.552610397338867, "global_step": 393703, "epoch": 4743} {"train_loss": -26.3511962890625, "global_step": 393704, "epoch": 4743} {"train_loss": -26.61895179748535, "global_step": 393705, "epoch": 4743} {"train_loss": -26.57338523864746, "global_step": 393706, "epoch": 4743} {"train_loss": -26.766998291015625, "global_step": 393707, "epoch": 4743} {"train_loss": -26.67122459411621, "global_step": 393708, "epoch": 4743} {"train_loss": -26.42007827758789, "global_step": 393709, "epoch": 4743} {"train_loss": -26.121519088745117, "global_step": 393710, "epoch": 4743} {"train_loss": -26.60396385192871, "global_step": 393711, "epoch": 4743} {"train_loss": -26.373554229736328, "global_step": 393712, "epoch": 4743} {"train_loss": -26.47710609436035, "global_step": 393713, "epoch": 4743} {"train_loss": -26.859607696533203, "global_step": 393714, "epoch": 4743} {"train_loss": -26.567663192749023, "global_step": 393715, "epoch": 4743} {"train_loss": -26.76422119140625, "global_step": 393716, "epoch": 4743} {"train_loss": -26.628915786743164, "global_step": 393717, "epoch": 4743} {"train_loss": -26.478124618530273, "global_step": 393718, "epoch": 4743} {"train_loss": -26.397327423095703, "global_step": 393719, "epoch": 4743} {"train_loss": -26.77082633972168, "global_step": 393720, "epoch": 4743} {"train_loss": -26.3508358001709, "global_step": 393721, "epoch": 4743} {"train_loss": -26.365100860595703, "global_step": 393722, "epoch": 4743} {"train_loss": -26.466596603393555, "global_step": 393723, "epoch": 4743} {"train_loss": -26.56783103942871, "global_step": 393724, "epoch": 4743} {"train_loss": -26.889123916625977, "global_step": 393725, "epoch": 4743} {"train_loss": -26.6566104888916, "global_step": 393726, "epoch": 4743} {"train_loss": -26.84095573425293, "global_step": 393727, "epoch": 4743} {"train_loss": -26.526432037353516, "global_step": 393728, "epoch": 4743} {"train_loss": -26.800756454467773, "global_step": 393729, "epoch": 4743} {"train_loss": -26.482778549194336, "global_step": 393730, "epoch": 4743} {"train_loss": -26.70977210998535, "global_step": 393731, "epoch": 4743} {"train_loss": -26.737472534179688, "global_step": 393732, "epoch": 4743} {"train_loss": -26.239355087280273, "global_step": 393733, "epoch": 4743} {"train_loss": -25.96027183532715, "global_step": 393734, "epoch": 4743} {"train_loss": -26.26079750061035, "global_step": 393735, "epoch": 4743} {"train_loss": -26.73077964782715, "global_step": 393736, "epoch": 4743} {"train_loss": -26.475805282592773, "global_step": 393737, "epoch": 4743} {"train_loss": -26.600873947143555, "global_step": 393738, "epoch": 4743} {"train_loss": -26.395471572875977, "global_step": 393739, "epoch": 4743} {"train_loss": -26.511367797851562, "global_step": 393740, "epoch": 4743} {"train_loss": -26.65682029724121, "global_step": 393741, "epoch": 4743} {"train_loss": -26.689008712768555, "global_step": 393742, "epoch": 4743} {"train_loss": -26.864904403686523, "global_step": 393743, "epoch": 4743} {"train_loss": -26.603464126586914, "global_step": 393744, "epoch": 4743} {"train_loss": -26.568958282470703, "global_step": 393745, "epoch": 4743} {"train_loss": -26.64693260192871, "global_step": 393746, "epoch": 4743} {"train_loss": -26.150556564331055, "global_step": 393747, "epoch": 4743} {"train_loss": -26.071304321289062, "global_step": 393748, "epoch": 4743} {"train_loss": -26.549179077148438, "global_step": 393749, "epoch": 4743} {"train_loss": -26.72437858581543, "global_step": 393750, "epoch": 4743} {"train_loss": -26.388230748923426, "global_step": 393751, "epoch": 4743, "val_loss": 6821665.5} {"train_loss": -20.766357421875, "global_step": 393752, "epoch": 4744} {"train_loss": -21.30849838256836, "global_step": 393753, "epoch": 4744} {"train_loss": -24.461549758911133, "global_step": 393754, "epoch": 4744} {"train_loss": -23.802846908569336, "global_step": 393755, "epoch": 4744} {"train_loss": -23.17742347717285, "global_step": 393756, "epoch": 4744} {"train_loss": -24.75507926940918, "global_step": 393757, "epoch": 4744} {"train_loss": -24.422372817993164, "global_step": 393758, "epoch": 4744} {"train_loss": -24.484668731689453, "global_step": 393759, "epoch": 4744} {"train_loss": -24.83368492126465, "global_step": 393760, "epoch": 4744} {"train_loss": -25.229345321655273, "global_step": 393761, "epoch": 4744} {"train_loss": -24.751209259033203, "global_step": 393762, "epoch": 4744} {"train_loss": -25.4262752532959, "global_step": 393763, "epoch": 4744} {"train_loss": -25.010009765625, "global_step": 393764, "epoch": 4744} {"train_loss": -24.773550033569336, "global_step": 393765, "epoch": 4744} {"train_loss": -25.002901077270508, "global_step": 393766, "epoch": 4744} {"train_loss": -25.09479331970215, "global_step": 393767, "epoch": 4744} {"train_loss": -25.348691940307617, "global_step": 393768, "epoch": 4744} {"train_loss": -25.691946029663086, "global_step": 393769, "epoch": 4744} {"train_loss": -25.33299446105957, "global_step": 393770, "epoch": 4744} {"train_loss": -25.505800247192383, "global_step": 393771, "epoch": 4744} {"train_loss": -25.605138778686523, "global_step": 393772, "epoch": 4744} {"train_loss": -25.493894577026367, "global_step": 393773, "epoch": 4744} {"train_loss": -25.707477569580078, "global_step": 393774, "epoch": 4744} {"train_loss": -25.507516860961914, "global_step": 393775, "epoch": 4744} {"train_loss": -25.77866554260254, "global_step": 393776, "epoch": 4744} {"train_loss": -25.36810302734375, "global_step": 393777, "epoch": 4744} {"train_loss": -25.448774337768555, "global_step": 393778, "epoch": 4744} {"train_loss": -25.938602447509766, "global_step": 393779, "epoch": 4744} {"train_loss": -25.958545684814453, "global_step": 393780, "epoch": 4744} {"train_loss": -26.0450382232666, "global_step": 393781, "epoch": 4744} {"train_loss": -25.8136043548584, "global_step": 393782, "epoch": 4744} {"train_loss": -26.2557315826416, "global_step": 393783, "epoch": 4744} {"train_loss": -26.066579818725586, "global_step": 393784, "epoch": 4744} {"train_loss": -25.923627853393555, "global_step": 393785, "epoch": 4744} {"train_loss": -26.130727767944336, "global_step": 393786, "epoch": 4744} {"train_loss": -26.124364852905273, "global_step": 393787, "epoch": 4744} {"train_loss": -26.21951675415039, "global_step": 393788, "epoch": 4744} {"train_loss": -26.2382869720459, "global_step": 393789, "epoch": 4744} {"train_loss": -26.32716178894043, "global_step": 393790, "epoch": 4744} {"train_loss": -26.167530059814453, "global_step": 393791, "epoch": 4744} {"train_loss": -26.651611328125, "global_step": 393792, "epoch": 4744} {"train_loss": -26.702741622924805, "global_step": 393793, "epoch": 4744} {"train_loss": -26.0775146484375, "global_step": 393794, "epoch": 4744} {"train_loss": -26.656599044799805, "global_step": 393795, "epoch": 4744} {"train_loss": -26.403406143188477, "global_step": 393796, "epoch": 4744} {"train_loss": -26.448156356811523, "global_step": 393797, "epoch": 4744} {"train_loss": -26.648284912109375, "global_step": 393798, "epoch": 4744} {"train_loss": -26.0867862701416, "global_step": 393799, "epoch": 4744} {"train_loss": -26.626209259033203, "global_step": 393800, "epoch": 4744} {"train_loss": -26.898651123046875, "global_step": 393801, "epoch": 4744} {"train_loss": -26.44101905822754, "global_step": 393802, "epoch": 4744} {"train_loss": -26.45197105407715, "global_step": 393803, "epoch": 4744} {"train_loss": -26.714996337890625, "global_step": 393804, "epoch": 4744} {"train_loss": -26.16558265686035, "global_step": 393805, "epoch": 4744} {"train_loss": -26.6407527923584, "global_step": 393806, "epoch": 4744} {"train_loss": -26.63431739807129, "global_step": 393807, "epoch": 4744} {"train_loss": -26.905038833618164, "global_step": 393808, "epoch": 4744} {"train_loss": -26.474613189697266, "global_step": 393809, "epoch": 4744} {"train_loss": -26.688129425048828, "global_step": 393810, "epoch": 4744} {"train_loss": -26.561386108398438, "global_step": 393811, "epoch": 4744} {"train_loss": -26.54047203063965, "global_step": 393812, "epoch": 4744} {"train_loss": -26.637678146362305, "global_step": 393813, "epoch": 4744} {"train_loss": -26.79296875, "global_step": 393814, "epoch": 4744} {"train_loss": -26.798160552978516, "global_step": 393815, "epoch": 4744} {"train_loss": -26.779998779296875, "global_step": 393816, "epoch": 4744} {"train_loss": -26.655136108398438, "global_step": 393817, "epoch": 4744} {"train_loss": -26.63912010192871, "global_step": 393818, "epoch": 4744} {"train_loss": -26.612079620361328, "global_step": 393819, "epoch": 4744} {"train_loss": -26.981307983398438, "global_step": 393820, "epoch": 4744} {"train_loss": -26.87763786315918, "global_step": 393821, "epoch": 4744} {"train_loss": -26.699949264526367, "global_step": 393822, "epoch": 4744} {"train_loss": -26.78362464904785, "global_step": 393823, "epoch": 4744} {"train_loss": -26.745092391967773, "global_step": 393824, "epoch": 4744} {"train_loss": -26.4948673248291, "global_step": 393825, "epoch": 4744} {"train_loss": -26.667184829711914, "global_step": 393826, "epoch": 4744} {"train_loss": -26.27374839782715, "global_step": 393827, "epoch": 4744} {"train_loss": -27.145246505737305, "global_step": 393828, "epoch": 4744} {"train_loss": -26.97183609008789, "global_step": 393829, "epoch": 4744} {"train_loss": -27.015827178955078, "global_step": 393830, "epoch": 4744} {"train_loss": -27.08614158630371, "global_step": 393831, "epoch": 4744} {"train_loss": -26.56035804748535, "global_step": 393832, "epoch": 4744} {"train_loss": -26.7579345703125, "global_step": 393833, "epoch": 4744} {"train_loss": -25.9342149941318, "global_step": 393834, "epoch": 4744, "val_loss": 6665902.0} {"train_loss": -26.585193634033203, "global_step": 393835, "epoch": 4745} {"train_loss": -25.737218856811523, "global_step": 393836, "epoch": 4745} {"train_loss": -24.994766235351562, "global_step": 393837, "epoch": 4745} {"train_loss": -24.9500789642334, "global_step": 393838, "epoch": 4745} {"train_loss": -25.937210083007812, "global_step": 393839, "epoch": 4745} {"train_loss": -26.040624618530273, "global_step": 393840, "epoch": 4745} {"train_loss": -25.651514053344727, "global_step": 393841, "epoch": 4745} {"train_loss": -26.272375106811523, "global_step": 393842, "epoch": 4745} {"train_loss": -26.216299057006836, "global_step": 393843, "epoch": 4745} {"train_loss": -26.1755428314209, "global_step": 393844, "epoch": 4745} {"train_loss": -26.320714950561523, "global_step": 393845, "epoch": 4745} {"train_loss": -26.190475463867188, "global_step": 393846, "epoch": 4745} {"train_loss": -26.503366470336914, "global_step": 393847, "epoch": 4745} {"train_loss": -26.54134178161621, "global_step": 393848, "epoch": 4745} {"train_loss": -26.574935913085938, "global_step": 393849, "epoch": 4745} {"train_loss": -26.290939331054688, "global_step": 393850, "epoch": 4745} {"train_loss": -26.474517822265625, "global_step": 393851, "epoch": 4745} {"train_loss": -26.2783260345459, "global_step": 393852, "epoch": 4745} {"train_loss": -25.981473922729492, "global_step": 393853, "epoch": 4745} {"train_loss": -26.192829132080078, "global_step": 393854, "epoch": 4745} {"train_loss": -26.4176025390625, "global_step": 393855, "epoch": 4745} {"train_loss": -26.395727157592773, "global_step": 393856, "epoch": 4745} {"train_loss": -26.49493408203125, "global_step": 393857, "epoch": 4745} {"train_loss": -26.49542808532715, "global_step": 393858, "epoch": 4745} {"train_loss": -26.318159103393555, "global_step": 393859, "epoch": 4745} {"train_loss": -26.596460342407227, "global_step": 393860, "epoch": 4745} {"train_loss": -26.665205001831055, "global_step": 393861, "epoch": 4745} {"train_loss": -26.3445987701416, "global_step": 393862, "epoch": 4745} {"train_loss": -26.373046875, "global_step": 393863, "epoch": 4745} {"train_loss": -26.511474609375, "global_step": 393864, "epoch": 4745} {"train_loss": -26.533573150634766, "global_step": 393865, "epoch": 4745} {"train_loss": -26.51055335998535, "global_step": 393866, "epoch": 4745} {"train_loss": -26.614795684814453, "global_step": 393867, "epoch": 4745} {"train_loss": -26.55666160583496, "global_step": 393868, "epoch": 4745} {"train_loss": -26.99036979675293, "global_step": 393869, "epoch": 4745} {"train_loss": -26.86310386657715, "global_step": 393870, "epoch": 4745} {"train_loss": -26.63104248046875, "global_step": 393871, "epoch": 4745} {"train_loss": -26.7651309967041, "global_step": 393872, "epoch": 4745} {"train_loss": -26.651010513305664, "global_step": 393873, "epoch": 4745} {"train_loss": -26.708251953125, "global_step": 393874, "epoch": 4745} {"train_loss": -26.521589279174805, "global_step": 393875, "epoch": 4745} {"train_loss": -26.956655502319336, "global_step": 393876, "epoch": 4745} {"train_loss": -26.56648826599121, "global_step": 393877, "epoch": 4745} {"train_loss": -26.554162979125977, "global_step": 393878, "epoch": 4745} {"train_loss": -26.7456111907959, "global_step": 393879, "epoch": 4745} {"train_loss": -26.84857177734375, "global_step": 393880, "epoch": 4745} {"train_loss": -26.888996124267578, "global_step": 393881, "epoch": 4745} {"train_loss": -27.11573600769043, "global_step": 393882, "epoch": 4745} {"train_loss": -26.860620498657227, "global_step": 393883, "epoch": 4745} {"train_loss": -26.625890731811523, "global_step": 393884, "epoch": 4745} {"train_loss": -26.575897216796875, "global_step": 393885, "epoch": 4745} {"train_loss": -26.10343360900879, "global_step": 393886, "epoch": 4745} {"train_loss": -26.640689849853516, "global_step": 393887, "epoch": 4745} {"train_loss": -26.77252197265625, "global_step": 393888, "epoch": 4745} {"train_loss": -26.604520797729492, "global_step": 393889, "epoch": 4745} {"train_loss": -26.659011840820312, "global_step": 393890, "epoch": 4745} {"train_loss": -26.308841705322266, "global_step": 393891, "epoch": 4745} {"train_loss": -26.71845054626465, "global_step": 393892, "epoch": 4745} {"train_loss": -26.475055694580078, "global_step": 393893, "epoch": 4745} {"train_loss": -26.506345748901367, "global_step": 393894, "epoch": 4745} {"train_loss": -26.796293258666992, "global_step": 393895, "epoch": 4745} {"train_loss": -26.168048858642578, "global_step": 393896, "epoch": 4745} {"train_loss": -26.386274337768555, "global_step": 393897, "epoch": 4745} {"train_loss": -26.679611206054688, "global_step": 393898, "epoch": 4745} {"train_loss": -26.292526245117188, "global_step": 393899, "epoch": 4745} {"train_loss": -26.3526554107666, "global_step": 393900, "epoch": 4745} {"train_loss": -26.085418701171875, "global_step": 393901, "epoch": 4745} {"train_loss": -26.51618766784668, "global_step": 393902, "epoch": 4745} {"train_loss": -26.345111846923828, "global_step": 393903, "epoch": 4745} {"train_loss": -26.182785034179688, "global_step": 393904, "epoch": 4745} {"train_loss": -26.473526000976562, "global_step": 393905, "epoch": 4745} {"train_loss": -26.759016036987305, "global_step": 393906, "epoch": 4745} {"train_loss": -26.257123947143555, "global_step": 393907, "epoch": 4745} {"train_loss": -26.313886642456055, "global_step": 393908, "epoch": 4745} {"train_loss": -26.155744552612305, "global_step": 393909, "epoch": 4745} {"train_loss": -26.33112144470215, "global_step": 393910, "epoch": 4745} {"train_loss": -26.416303634643555, "global_step": 393911, "epoch": 4745} {"train_loss": -26.56227684020996, "global_step": 393912, "epoch": 4745} {"train_loss": -25.831899642944336, "global_step": 393913, "epoch": 4745} {"train_loss": -26.02764320373535, "global_step": 393914, "epoch": 4745} {"train_loss": -26.162158966064453, "global_step": 393915, "epoch": 4745} {"train_loss": -26.17902183532715, "global_step": 393916, "epoch": 4745} {"train_loss": -26.419002647859504, "global_step": 393917, "epoch": 4745, "val_loss": 6629958.0} {"train_loss": -24.82054901123047, "global_step": 393918, "epoch": 4746} {"train_loss": -26.025714874267578, "global_step": 393919, "epoch": 4746} {"train_loss": -25.550352096557617, "global_step": 393920, "epoch": 4746} {"train_loss": -25.731313705444336, "global_step": 393921, "epoch": 4746} {"train_loss": -25.7623233795166, "global_step": 393922, "epoch": 4746} {"train_loss": -25.490724563598633, "global_step": 393923, "epoch": 4746} {"train_loss": -25.808713912963867, "global_step": 393924, "epoch": 4746} {"train_loss": -25.152463912963867, "global_step": 393925, "epoch": 4746} {"train_loss": -26.47870445251465, "global_step": 393926, "epoch": 4746} {"train_loss": -26.059040069580078, "global_step": 393927, "epoch": 4746} {"train_loss": -26.1370906829834, "global_step": 393928, "epoch": 4746} {"train_loss": -26.086027145385742, "global_step": 393929, "epoch": 4746} {"train_loss": -25.791919708251953, "global_step": 393930, "epoch": 4746} {"train_loss": -26.205188751220703, "global_step": 393931, "epoch": 4746} {"train_loss": -26.336658477783203, "global_step": 393932, "epoch": 4746} {"train_loss": -26.453516006469727, "global_step": 393933, "epoch": 4746} {"train_loss": -26.394201278686523, "global_step": 393934, "epoch": 4746} {"train_loss": -25.862701416015625, "global_step": 393935, "epoch": 4746} {"train_loss": -26.405059814453125, "global_step": 393936, "epoch": 4746} {"train_loss": -26.23004722595215, "global_step": 393937, "epoch": 4746} {"train_loss": -26.418506622314453, "global_step": 393938, "epoch": 4746} {"train_loss": -26.369037628173828, "global_step": 393939, "epoch": 4746} {"train_loss": -26.5313663482666, "global_step": 393940, "epoch": 4746} {"train_loss": -26.363515853881836, "global_step": 393941, "epoch": 4746} {"train_loss": -26.4029541015625, "global_step": 393942, "epoch": 4746} {"train_loss": -26.464624404907227, "global_step": 393943, "epoch": 4746} {"train_loss": -26.393774032592773, "global_step": 393944, "epoch": 4746} {"train_loss": -26.61222267150879, "global_step": 393945, "epoch": 4746} {"train_loss": -26.149585723876953, "global_step": 393946, "epoch": 4746} {"train_loss": -26.353179931640625, "global_step": 393947, "epoch": 4746} {"train_loss": -26.30106544494629, "global_step": 393948, "epoch": 4746} {"train_loss": -26.429121017456055, "global_step": 393949, "epoch": 4746} {"train_loss": -26.6957950592041, "global_step": 393950, "epoch": 4746} {"train_loss": -26.54215431213379, "global_step": 393951, "epoch": 4746} {"train_loss": -26.677722930908203, "global_step": 393952, "epoch": 4746} {"train_loss": -26.802112579345703, "global_step": 393953, "epoch": 4746} {"train_loss": -26.333892822265625, "global_step": 393954, "epoch": 4746} {"train_loss": -26.3968448638916, "global_step": 393955, "epoch": 4746} {"train_loss": -26.93610191345215, "global_step": 393956, "epoch": 4746} {"train_loss": -26.63347816467285, "global_step": 393957, "epoch": 4746} {"train_loss": -26.644641876220703, "global_step": 393958, "epoch": 4746} {"train_loss": -26.57147789001465, "global_step": 393959, "epoch": 4746} {"train_loss": -26.200300216674805, "global_step": 393960, "epoch": 4746} {"train_loss": -26.62548828125, "global_step": 393961, "epoch": 4746} {"train_loss": -26.769372940063477, "global_step": 393962, "epoch": 4746} {"train_loss": -26.3311767578125, "global_step": 393963, "epoch": 4746} {"train_loss": -26.4869327545166, "global_step": 393964, "epoch": 4746} {"train_loss": -26.37397575378418, "global_step": 393965, "epoch": 4746} {"train_loss": -26.521875381469727, "global_step": 393966, "epoch": 4746} {"train_loss": -26.56451988220215, "global_step": 393967, "epoch": 4746} {"train_loss": -26.408985137939453, "global_step": 393968, "epoch": 4746} {"train_loss": -26.2789306640625, "global_step": 393969, "epoch": 4746} {"train_loss": -26.422842025756836, "global_step": 393970, "epoch": 4746} {"train_loss": -26.209293365478516, "global_step": 393971, "epoch": 4746} {"train_loss": -26.18218994140625, "global_step": 393972, "epoch": 4746} {"train_loss": -26.47077751159668, "global_step": 393973, "epoch": 4746} {"train_loss": -26.56044578552246, "global_step": 393974, "epoch": 4746} {"train_loss": -26.36506462097168, "global_step": 393975, "epoch": 4746} {"train_loss": -26.736499786376953, "global_step": 393976, "epoch": 4746} {"train_loss": -26.75641441345215, "global_step": 393977, "epoch": 4746} {"train_loss": -26.250112533569336, "global_step": 393978, "epoch": 4746} {"train_loss": -26.663776397705078, "global_step": 393979, "epoch": 4746} {"train_loss": -26.972578048706055, "global_step": 393980, "epoch": 4746} {"train_loss": -26.20722007751465, "global_step": 393981, "epoch": 4746} {"train_loss": -26.60785484313965, "global_step": 393982, "epoch": 4746} {"train_loss": -26.454345703125, "global_step": 393983, "epoch": 4746} {"train_loss": -26.34639549255371, "global_step": 393984, "epoch": 4746} {"train_loss": -26.49237060546875, "global_step": 393985, "epoch": 4746} {"train_loss": -26.0820369720459, "global_step": 393986, "epoch": 4746} {"train_loss": -26.982715606689453, "global_step": 393987, "epoch": 4746} {"train_loss": -26.453760147094727, "global_step": 393988, "epoch": 4746} {"train_loss": -26.3021297454834, "global_step": 393989, "epoch": 4746} {"train_loss": -25.86794090270996, "global_step": 393990, "epoch": 4746} {"train_loss": -26.34149742126465, "global_step": 393991, "epoch": 4746} {"train_loss": -26.57645606994629, "global_step": 393992, "epoch": 4746} {"train_loss": -26.248342514038086, "global_step": 393993, "epoch": 4746} {"train_loss": -26.449705123901367, "global_step": 393994, "epoch": 4746} {"train_loss": -26.7298641204834, "global_step": 393995, "epoch": 4746} {"train_loss": -26.746007919311523, "global_step": 393996, "epoch": 4746} {"train_loss": -26.44830894470215, "global_step": 393997, "epoch": 4746} {"train_loss": -26.44775390625, "global_step": 393998, "epoch": 4746} {"train_loss": -26.73194694519043, "global_step": 393999, "epoch": 4746} {"train_loss": -26.365389421761755, "global_step": 394000, "epoch": 4746, "val_loss": 6648031.0} {"train_loss": -26.069875717163086, "global_step": 394001, "epoch": 4747} {"train_loss": -26.098432540893555, "global_step": 394002, "epoch": 4747} {"train_loss": -25.829294204711914, "global_step": 394003, "epoch": 4747} {"train_loss": -25.914203643798828, "global_step": 394004, "epoch": 4747} {"train_loss": -26.257394790649414, "global_step": 394005, "epoch": 4747} {"train_loss": -26.201068878173828, "global_step": 394006, "epoch": 4747} {"train_loss": -26.0473575592041, "global_step": 394007, "epoch": 4747} {"train_loss": -25.88657569885254, "global_step": 394008, "epoch": 4747} {"train_loss": -26.87030029296875, "global_step": 394009, "epoch": 4747} {"train_loss": -26.00556755065918, "global_step": 394010, "epoch": 4747} {"train_loss": -26.433841705322266, "global_step": 394011, "epoch": 4747} {"train_loss": -26.121936798095703, "global_step": 394012, "epoch": 4747} {"train_loss": -26.269739151000977, "global_step": 394013, "epoch": 4747} {"train_loss": -26.05692481994629, "global_step": 394014, "epoch": 4747} {"train_loss": -26.3500919342041, "global_step": 394015, "epoch": 4747} {"train_loss": -26.428485870361328, "global_step": 394016, "epoch": 4747} {"train_loss": -26.707763671875, "global_step": 394017, "epoch": 4747} {"train_loss": -26.187463760375977, "global_step": 394018, "epoch": 4747} {"train_loss": -26.367420196533203, "global_step": 394019, "epoch": 4747} {"train_loss": -26.34619140625, "global_step": 394020, "epoch": 4747} {"train_loss": -26.148822784423828, "global_step": 394021, "epoch": 4747} {"train_loss": -26.286935806274414, "global_step": 394022, "epoch": 4747} {"train_loss": -26.182209014892578, "global_step": 394023, "epoch": 4747} {"train_loss": -26.708444595336914, "global_step": 394024, "epoch": 4747} {"train_loss": -26.691404342651367, "global_step": 394025, "epoch": 4747} {"train_loss": -26.512939453125, "global_step": 394026, "epoch": 4747} {"train_loss": -26.637598037719727, "global_step": 394027, "epoch": 4747} {"train_loss": -26.49267578125, "global_step": 394028, "epoch": 4747} {"train_loss": -26.938684463500977, "global_step": 394029, "epoch": 4747} {"train_loss": -26.617353439331055, "global_step": 394030, "epoch": 4747} {"train_loss": -26.665327072143555, "global_step": 394031, "epoch": 4747} {"train_loss": -26.750295639038086, "global_step": 394032, "epoch": 4747} {"train_loss": -26.485198974609375, "global_step": 394033, "epoch": 4747} {"train_loss": -26.60379409790039, "global_step": 394034, "epoch": 4747} {"train_loss": -26.886503219604492, "global_step": 394035, "epoch": 4747} {"train_loss": -26.80220603942871, "global_step": 394036, "epoch": 4747} {"train_loss": -26.793882369995117, "global_step": 394037, "epoch": 4747} {"train_loss": -26.9544677734375, "global_step": 394038, "epoch": 4747} {"train_loss": -26.586694717407227, "global_step": 394039, "epoch": 4747} {"train_loss": -27.125049591064453, "global_step": 394040, "epoch": 4747} {"train_loss": -26.75324821472168, "global_step": 394041, "epoch": 4747} {"train_loss": -26.924701690673828, "global_step": 394042, "epoch": 4747} {"train_loss": -26.914594650268555, "global_step": 394043, "epoch": 4747} {"train_loss": -27.026105880737305, "global_step": 394044, "epoch": 4747} {"train_loss": -26.855609893798828, "global_step": 394045, "epoch": 4747} {"train_loss": -26.907148361206055, "global_step": 394046, "epoch": 4747} {"train_loss": -26.693817138671875, "global_step": 394047, "epoch": 4747} {"train_loss": -26.81489372253418, "global_step": 394048, "epoch": 4747} {"train_loss": -26.96942710876465, "global_step": 394049, "epoch": 4747} {"train_loss": -27.032644271850586, "global_step": 394050, "epoch": 4747} {"train_loss": -26.57143211364746, "global_step": 394051, "epoch": 4747} {"train_loss": -26.894012451171875, "global_step": 394052, "epoch": 4747} {"train_loss": -26.342910766601562, "global_step": 394053, "epoch": 4747} {"train_loss": -26.39324378967285, "global_step": 394054, "epoch": 4747} {"train_loss": -27.203516006469727, "global_step": 394055, "epoch": 4747} {"train_loss": -26.87921714782715, "global_step": 394056, "epoch": 4747} {"train_loss": -26.60519790649414, "global_step": 394057, "epoch": 4747} {"train_loss": -26.2470703125, "global_step": 394058, "epoch": 4747} {"train_loss": -26.49082374572754, "global_step": 394059, "epoch": 4747} {"train_loss": -26.87867546081543, "global_step": 394060, "epoch": 4747} {"train_loss": -26.705371856689453, "global_step": 394061, "epoch": 4747} {"train_loss": -26.50489616394043, "global_step": 394062, "epoch": 4747} {"train_loss": -26.7945556640625, "global_step": 394063, "epoch": 4747} {"train_loss": -26.30933952331543, "global_step": 394064, "epoch": 4747} {"train_loss": -26.73294448852539, "global_step": 394065, "epoch": 4747} {"train_loss": -26.629281997680664, "global_step": 394066, "epoch": 4747} {"train_loss": -26.55889320373535, "global_step": 394067, "epoch": 4747} {"train_loss": -26.411224365234375, "global_step": 394068, "epoch": 4747} {"train_loss": -26.4721622467041, "global_step": 394069, "epoch": 4747} {"train_loss": -26.292621612548828, "global_step": 394070, "epoch": 4747} {"train_loss": -26.551908493041992, "global_step": 394071, "epoch": 4747} {"train_loss": -26.38738441467285, "global_step": 394072, "epoch": 4747} {"train_loss": -26.271459579467773, "global_step": 394073, "epoch": 4747} {"train_loss": -26.291000366210938, "global_step": 394074, "epoch": 4747} {"train_loss": -26.562646865844727, "global_step": 394075, "epoch": 4747} {"train_loss": -26.508228302001953, "global_step": 394076, "epoch": 4747} {"train_loss": -26.433795928955078, "global_step": 394077, "epoch": 4747} {"train_loss": -26.52069664001465, "global_step": 394078, "epoch": 4747} {"train_loss": -26.82527732849121, "global_step": 394079, "epoch": 4747} {"train_loss": -26.788822174072266, "global_step": 394080, "epoch": 4747} {"train_loss": -26.198440551757812, "global_step": 394081, "epoch": 4747} {"train_loss": -26.7803955078125, "global_step": 394082, "epoch": 4747} {"train_loss": -26.547708993934723, "global_step": 394083, "epoch": 4747, "val_loss": 6654836.0} {"train_loss": -25.597511291503906, "global_step": 394084, "epoch": 4748} {"train_loss": -25.514774322509766, "global_step": 394085, "epoch": 4748} {"train_loss": -25.807880401611328, "global_step": 394086, "epoch": 4748} {"train_loss": -26.136327743530273, "global_step": 394087, "epoch": 4748} {"train_loss": -26.057214736938477, "global_step": 394088, "epoch": 4748} {"train_loss": -26.40888023376465, "global_step": 394089, "epoch": 4748} {"train_loss": -25.995849609375, "global_step": 394090, "epoch": 4748} {"train_loss": -26.45786476135254, "global_step": 394091, "epoch": 4748} {"train_loss": -26.364892959594727, "global_step": 394092, "epoch": 4748} {"train_loss": -26.254072189331055, "global_step": 394093, "epoch": 4748} {"train_loss": -26.523481369018555, "global_step": 394094, "epoch": 4748} {"train_loss": -26.20843505859375, "global_step": 394095, "epoch": 4748} {"train_loss": -26.191974639892578, "global_step": 394096, "epoch": 4748} {"train_loss": -26.568973541259766, "global_step": 394097, "epoch": 4748} {"train_loss": -26.16554832458496, "global_step": 394098, "epoch": 4748} {"train_loss": -26.647903442382812, "global_step": 394099, "epoch": 4748} {"train_loss": -26.227670669555664, "global_step": 394100, "epoch": 4748} {"train_loss": -26.5948429107666, "global_step": 394101, "epoch": 4748} {"train_loss": -26.619165420532227, "global_step": 394102, "epoch": 4748} {"train_loss": -26.357624053955078, "global_step": 394103, "epoch": 4748} {"train_loss": -26.032733917236328, "global_step": 394104, "epoch": 4748} {"train_loss": -26.547164916992188, "global_step": 394105, "epoch": 4748} {"train_loss": -26.65899658203125, "global_step": 394106, "epoch": 4748} {"train_loss": -26.592914581298828, "global_step": 394107, "epoch": 4748} {"train_loss": -26.25665855407715, "global_step": 394108, "epoch": 4748} {"train_loss": -26.673419952392578, "global_step": 394109, "epoch": 4748} {"train_loss": -26.599416732788086, "global_step": 394110, "epoch": 4748} {"train_loss": -26.73215675354004, "global_step": 394111, "epoch": 4748} {"train_loss": -26.8347225189209, "global_step": 394112, "epoch": 4748} {"train_loss": -26.7891845703125, "global_step": 394113, "epoch": 4748} {"train_loss": -26.614322662353516, "global_step": 394114, "epoch": 4748} {"train_loss": -26.3677921295166, "global_step": 394115, "epoch": 4748} {"train_loss": -26.844358444213867, "global_step": 394116, "epoch": 4748} {"train_loss": -26.3830509185791, "global_step": 394117, "epoch": 4748} {"train_loss": -26.685876846313477, "global_step": 394118, "epoch": 4748} {"train_loss": -26.796588897705078, "global_step": 394119, "epoch": 4748} {"train_loss": -26.67266845703125, "global_step": 394120, "epoch": 4748} {"train_loss": -26.45892906188965, "global_step": 394121, "epoch": 4748} {"train_loss": -26.769880294799805, "global_step": 394122, "epoch": 4748} {"train_loss": -26.534963607788086, "global_step": 394123, "epoch": 4748} {"train_loss": -26.759069442749023, "global_step": 394124, "epoch": 4748} {"train_loss": -26.393457412719727, "global_step": 394125, "epoch": 4748} {"train_loss": -26.3320369720459, "global_step": 394126, "epoch": 4748} {"train_loss": -26.483556747436523, "global_step": 394127, "epoch": 4748} {"train_loss": -26.634397506713867, "global_step": 394128, "epoch": 4748} {"train_loss": -26.57843589782715, "global_step": 394129, "epoch": 4748} {"train_loss": -27.24161148071289, "global_step": 394130, "epoch": 4748} {"train_loss": -26.787817001342773, "global_step": 394131, "epoch": 4748} {"train_loss": -26.515106201171875, "global_step": 394132, "epoch": 4748} {"train_loss": -26.78968620300293, "global_step": 394133, "epoch": 4748} {"train_loss": -26.48077392578125, "global_step": 394134, "epoch": 4748} {"train_loss": -26.495849609375, "global_step": 394135, "epoch": 4748} {"train_loss": -26.530012130737305, "global_step": 394136, "epoch": 4748} {"train_loss": -26.438955307006836, "global_step": 394137, "epoch": 4748} {"train_loss": -26.545133590698242, "global_step": 394138, "epoch": 4748} {"train_loss": -26.51262855529785, "global_step": 394139, "epoch": 4748} {"train_loss": -26.704452514648438, "global_step": 394140, "epoch": 4748} {"train_loss": -26.484699249267578, "global_step": 394141, "epoch": 4748} {"train_loss": -26.938581466674805, "global_step": 394142, "epoch": 4748} {"train_loss": -26.809539794921875, "global_step": 394143, "epoch": 4748} {"train_loss": -26.919885635375977, "global_step": 394144, "epoch": 4748} {"train_loss": -26.70502281188965, "global_step": 394145, "epoch": 4748} {"train_loss": -26.944488525390625, "global_step": 394146, "epoch": 4748} {"train_loss": -26.648685455322266, "global_step": 394147, "epoch": 4748} {"train_loss": -27.084753036499023, "global_step": 394148, "epoch": 4748} {"train_loss": -26.970823287963867, "global_step": 394149, "epoch": 4748} {"train_loss": -26.874441146850586, "global_step": 394150, "epoch": 4748} {"train_loss": -27.28506851196289, "global_step": 394151, "epoch": 4748} {"train_loss": -26.599838256835938, "global_step": 394152, "epoch": 4748} {"train_loss": -26.816320419311523, "global_step": 394153, "epoch": 4748} {"train_loss": -26.719228744506836, "global_step": 394154, "epoch": 4748} {"train_loss": -26.620107650756836, "global_step": 394155, "epoch": 4748} {"train_loss": -26.743549346923828, "global_step": 394156, "epoch": 4748} {"train_loss": -26.611974716186523, "global_step": 394157, "epoch": 4748} {"train_loss": -26.683496475219727, "global_step": 394158, "epoch": 4748} {"train_loss": -26.965097427368164, "global_step": 394159, "epoch": 4748} {"train_loss": -26.64573097229004, "global_step": 394160, "epoch": 4748} {"train_loss": -26.644851684570312, "global_step": 394161, "epoch": 4748} {"train_loss": -27.05335807800293, "global_step": 394162, "epoch": 4748} {"train_loss": -26.78396987915039, "global_step": 394163, "epoch": 4748} {"train_loss": -26.210620880126953, "global_step": 394164, "epoch": 4748} {"train_loss": -27.025882720947266, "global_step": 394165, "epoch": 4748} {"train_loss": -26.567457451877825, "global_step": 394166, "epoch": 4748, "val_loss": 6538853.5} {"train_loss": -25.975406646728516, "global_step": 394167, "epoch": 4749} {"train_loss": -26.130247116088867, "global_step": 394168, "epoch": 4749} {"train_loss": -26.032886505126953, "global_step": 394169, "epoch": 4749} {"train_loss": -25.947900772094727, "global_step": 394170, "epoch": 4749} {"train_loss": -25.91291618347168, "global_step": 394171, "epoch": 4749} {"train_loss": -26.37190818786621, "global_step": 394172, "epoch": 4749} {"train_loss": -26.07212257385254, "global_step": 394173, "epoch": 4749} {"train_loss": -26.632404327392578, "global_step": 394174, "epoch": 4749} {"train_loss": -26.16316795349121, "global_step": 394175, "epoch": 4749} {"train_loss": -26.100080490112305, "global_step": 394176, "epoch": 4749} {"train_loss": -26.425317764282227, "global_step": 394177, "epoch": 4749} {"train_loss": -26.353317260742188, "global_step": 394178, "epoch": 4749} {"train_loss": -25.931995391845703, "global_step": 394179, "epoch": 4749} {"train_loss": -26.207605361938477, "global_step": 394180, "epoch": 4749} {"train_loss": -26.414520263671875, "global_step": 394181, "epoch": 4749} {"train_loss": -26.002674102783203, "global_step": 394182, "epoch": 4749} {"train_loss": -25.81001091003418, "global_step": 394183, "epoch": 4749} {"train_loss": -26.769062042236328, "global_step": 394184, "epoch": 4749} {"train_loss": -26.76187515258789, "global_step": 394185, "epoch": 4749} {"train_loss": -26.334156036376953, "global_step": 394186, "epoch": 4749} {"train_loss": -26.352386474609375, "global_step": 394187, "epoch": 4749} {"train_loss": -26.588403701782227, "global_step": 394188, "epoch": 4749} {"train_loss": -26.316808700561523, "global_step": 394189, "epoch": 4749} {"train_loss": -26.601659774780273, "global_step": 394190, "epoch": 4749} {"train_loss": -26.532285690307617, "global_step": 394191, "epoch": 4749} {"train_loss": -26.628774642944336, "global_step": 394192, "epoch": 4749} {"train_loss": -26.705188751220703, "global_step": 394193, "epoch": 4749} {"train_loss": -26.457101821899414, "global_step": 394194, "epoch": 4749} {"train_loss": -26.786828994750977, "global_step": 394195, "epoch": 4749} {"train_loss": -26.567508697509766, "global_step": 394196, "epoch": 4749} {"train_loss": -26.59852409362793, "global_step": 394197, "epoch": 4749} {"train_loss": -26.63270378112793, "global_step": 394198, "epoch": 4749} {"train_loss": -26.84077262878418, "global_step": 394199, "epoch": 4749} {"train_loss": -26.923898696899414, "global_step": 394200, "epoch": 4749} {"train_loss": -26.544431686401367, "global_step": 394201, "epoch": 4749} {"train_loss": -25.9124698638916, "global_step": 394202, "epoch": 4749} {"train_loss": -26.45172119140625, "global_step": 394203, "epoch": 4749} {"train_loss": -26.608850479125977, "global_step": 394204, "epoch": 4749} {"train_loss": -26.55890464782715, "global_step": 394205, "epoch": 4749} {"train_loss": -26.964221954345703, "global_step": 394206, "epoch": 4749} {"train_loss": -26.97895622253418, "global_step": 394207, "epoch": 4749} {"train_loss": -26.508718490600586, "global_step": 394208, "epoch": 4749} {"train_loss": -26.684207916259766, "global_step": 394209, "epoch": 4749} {"train_loss": -26.733356475830078, "global_step": 394210, "epoch": 4749} {"train_loss": -26.695011138916016, "global_step": 394211, "epoch": 4749} {"train_loss": -26.62685203552246, "global_step": 394212, "epoch": 4749} {"train_loss": -26.819257736206055, "global_step": 394213, "epoch": 4749} {"train_loss": -26.198774337768555, "global_step": 394214, "epoch": 4749} {"train_loss": -26.54656982421875, "global_step": 394215, "epoch": 4749} {"train_loss": -26.78009033203125, "global_step": 394216, "epoch": 4749} {"train_loss": -26.69483757019043, "global_step": 394217, "epoch": 4749} {"train_loss": -26.76447868347168, "global_step": 394218, "epoch": 4749} {"train_loss": -26.796646118164062, "global_step": 394219, "epoch": 4749} {"train_loss": -26.229700088500977, "global_step": 394220, "epoch": 4749} {"train_loss": -26.217105865478516, "global_step": 394221, "epoch": 4749} {"train_loss": -26.397705078125, "global_step": 394222, "epoch": 4749} {"train_loss": -26.373870849609375, "global_step": 394223, "epoch": 4749} {"train_loss": -26.5361385345459, "global_step": 394224, "epoch": 4749} {"train_loss": -26.356122970581055, "global_step": 394225, "epoch": 4749} {"train_loss": -26.35272216796875, "global_step": 394226, "epoch": 4749} {"train_loss": -26.30669593811035, "global_step": 394227, "epoch": 4749} {"train_loss": -26.89739418029785, "global_step": 394228, "epoch": 4749} {"train_loss": -26.47426414489746, "global_step": 394229, "epoch": 4749} {"train_loss": -26.80378532409668, "global_step": 394230, "epoch": 4749} {"train_loss": -26.85210609436035, "global_step": 394231, "epoch": 4749} {"train_loss": -26.33527183532715, "global_step": 394232, "epoch": 4749} {"train_loss": -26.722131729125977, "global_step": 394233, "epoch": 4749} {"train_loss": -26.518354415893555, "global_step": 394234, "epoch": 4749} {"train_loss": -25.864709854125977, "global_step": 394235, "epoch": 4749} {"train_loss": -26.04190444946289, "global_step": 394236, "epoch": 4749} {"train_loss": -26.59197998046875, "global_step": 394237, "epoch": 4749} {"train_loss": -26.020465850830078, "global_step": 394238, "epoch": 4749} {"train_loss": -26.04914665222168, "global_step": 394239, "epoch": 4749} {"train_loss": -26.488082885742188, "global_step": 394240, "epoch": 4749} {"train_loss": -26.43342399597168, "global_step": 394241, "epoch": 4749} {"train_loss": -25.626361846923828, "global_step": 394242, "epoch": 4749} {"train_loss": -26.063379287719727, "global_step": 394243, "epoch": 4749} {"train_loss": -26.506702423095703, "global_step": 394244, "epoch": 4749} {"train_loss": -26.067169189453125, "global_step": 394245, "epoch": 4749} {"train_loss": -26.43641471862793, "global_step": 394246, "epoch": 4749} {"train_loss": -26.322431564331055, "global_step": 394247, "epoch": 4749} {"train_loss": -26.764484405517578, "global_step": 394248, "epoch": 4749} {"train_loss": -26.43335059751947, "global_step": 394249, "epoch": 4749, "val_loss": 6550596.0} {"train_loss": -25.943044662475586, "global_step": 394250, "epoch": 4750} {"train_loss": -25.824487686157227, "global_step": 394251, "epoch": 4750} {"train_loss": -26.26316261291504, "global_step": 394252, "epoch": 4750} {"train_loss": -25.71046257019043, "global_step": 394253, "epoch": 4750} {"train_loss": -25.81769371032715, "global_step": 394254, "epoch": 4750} {"train_loss": -25.658018112182617, "global_step": 394255, "epoch": 4750} {"train_loss": -26.422571182250977, "global_step": 394256, "epoch": 4750} {"train_loss": -26.1192569732666, "global_step": 394257, "epoch": 4750} {"train_loss": -26.246564865112305, "global_step": 394258, "epoch": 4750} {"train_loss": -26.401086807250977, "global_step": 394259, "epoch": 4750} {"train_loss": -26.267953872680664, "global_step": 394260, "epoch": 4750} {"train_loss": -26.1649227142334, "global_step": 394261, "epoch": 4750} {"train_loss": -26.379552841186523, "global_step": 394262, "epoch": 4750} {"train_loss": -26.199176788330078, "global_step": 394263, "epoch": 4750} {"train_loss": -26.115833282470703, "global_step": 394264, "epoch": 4750} {"train_loss": -26.304101943969727, "global_step": 394265, "epoch": 4750} {"train_loss": -26.606176376342773, "global_step": 394266, "epoch": 4750} {"train_loss": -26.601892471313477, "global_step": 394267, "epoch": 4750} {"train_loss": -26.375049591064453, "global_step": 394268, "epoch": 4750} {"train_loss": -26.585458755493164, "global_step": 394269, "epoch": 4750} {"train_loss": -26.52570915222168, "global_step": 394270, "epoch": 4750} {"train_loss": -26.11039161682129, "global_step": 394271, "epoch": 4750} {"train_loss": -26.502552032470703, "global_step": 394272, "epoch": 4750} {"train_loss": -26.466171264648438, "global_step": 394273, "epoch": 4750} {"train_loss": -26.533782958984375, "global_step": 394274, "epoch": 4750} {"train_loss": -26.69873046875, "global_step": 394275, "epoch": 4750} {"train_loss": -26.48786735534668, "global_step": 394276, "epoch": 4750} {"train_loss": -26.48486328125, "global_step": 394277, "epoch": 4750} {"train_loss": -26.861440658569336, "global_step": 394278, "epoch": 4750} {"train_loss": -26.654251098632812, "global_step": 394279, "epoch": 4750} {"train_loss": -26.927093505859375, "global_step": 394280, "epoch": 4750} {"train_loss": -26.58521842956543, "global_step": 394281, "epoch": 4750} {"train_loss": -26.611740112304688, "global_step": 394282, "epoch": 4750} {"train_loss": -26.78303337097168, "global_step": 394283, "epoch": 4750} {"train_loss": -26.80095863342285, "global_step": 394284, "epoch": 4750} {"train_loss": -26.45380973815918, "global_step": 394285, "epoch": 4750} {"train_loss": -26.729644775390625, "global_step": 394286, "epoch": 4750} {"train_loss": -26.61249351501465, "global_step": 394287, "epoch": 4750} {"train_loss": -26.6584415435791, "global_step": 394288, "epoch": 4750} {"train_loss": -26.97904396057129, "global_step": 394289, "epoch": 4750} {"train_loss": -26.92799186706543, "global_step": 394290, "epoch": 4750} {"train_loss": -26.653528213500977, "global_step": 394291, "epoch": 4750} {"train_loss": -26.59058952331543, "global_step": 394292, "epoch": 4750} {"train_loss": -26.763751983642578, "global_step": 394293, "epoch": 4750} {"train_loss": -26.203475952148438, "global_step": 394294, "epoch": 4750} {"train_loss": -26.475255966186523, "global_step": 394295, "epoch": 4750} {"train_loss": -26.648452758789062, "global_step": 394296, "epoch": 4750} {"train_loss": -26.7424259185791, "global_step": 394297, "epoch": 4750} {"train_loss": -26.583423614501953, "global_step": 394298, "epoch": 4750} {"train_loss": -26.723127365112305, "global_step": 394299, "epoch": 4750} {"train_loss": -26.773029327392578, "global_step": 394300, "epoch": 4750} {"train_loss": -26.35943031311035, "global_step": 394301, "epoch": 4750} {"train_loss": -26.55356216430664, "global_step": 394302, "epoch": 4750} {"train_loss": -26.8355655670166, "global_step": 394303, "epoch": 4750} {"train_loss": -26.550689697265625, "global_step": 394304, "epoch": 4750} {"train_loss": -26.76932144165039, "global_step": 394305, "epoch": 4750} {"train_loss": -26.7984676361084, "global_step": 394306, "epoch": 4750} {"train_loss": -26.46502113342285, "global_step": 394307, "epoch": 4750} {"train_loss": -26.53285026550293, "global_step": 394308, "epoch": 4750} {"train_loss": -26.259418487548828, "global_step": 394309, "epoch": 4750} {"train_loss": -26.857385635375977, "global_step": 394310, "epoch": 4750} {"train_loss": -27.0019474029541, "global_step": 394311, "epoch": 4750} {"train_loss": -26.67805290222168, "global_step": 394312, "epoch": 4750} {"train_loss": -26.45221519470215, "global_step": 394313, "epoch": 4750} {"train_loss": -25.840442657470703, "global_step": 394314, "epoch": 4750} {"train_loss": -25.950458526611328, "global_step": 394315, "epoch": 4750} {"train_loss": -25.641162872314453, "global_step": 394316, "epoch": 4750} {"train_loss": -25.680496215820312, "global_step": 394317, "epoch": 4750} {"train_loss": -26.35945701599121, "global_step": 394318, "epoch": 4750} {"train_loss": -26.481002807617188, "global_step": 394319, "epoch": 4750} {"train_loss": -26.238983154296875, "global_step": 394320, "epoch": 4750} {"train_loss": -26.51690101623535, "global_step": 394321, "epoch": 4750} {"train_loss": -26.378568649291992, "global_step": 394322, "epoch": 4750} {"train_loss": -26.249835968017578, "global_step": 394323, "epoch": 4750} {"train_loss": -26.402359008789062, "global_step": 394324, "epoch": 4750} {"train_loss": -26.265775680541992, "global_step": 394325, "epoch": 4750} {"train_loss": -26.186725616455078, "global_step": 394326, "epoch": 4750} {"train_loss": -26.431015014648438, "global_step": 394327, "epoch": 4750} {"train_loss": -26.36474609375, "global_step": 394328, "epoch": 4750} {"train_loss": -26.4766788482666, "global_step": 394329, "epoch": 4750} {"train_loss": -26.981042861938477, "global_step": 394330, "epoch": 4750} {"train_loss": -26.548843383789062, "global_step": 394331, "epoch": 4750} {"train_loss": -26.446231106677686, "global_step": 394332, "epoch": 4750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6581793.0} {"train_loss": -25.903583526611328, "global_step": 394333, "epoch": 4751} {"train_loss": -26.465307235717773, "global_step": 394334, "epoch": 4751} {"train_loss": -26.2082576751709, "global_step": 394335, "epoch": 4751} {"train_loss": -26.13071060180664, "global_step": 394336, "epoch": 4751} {"train_loss": -26.00046730041504, "global_step": 394337, "epoch": 4751} {"train_loss": -26.50446128845215, "global_step": 394338, "epoch": 4751} {"train_loss": -26.405536651611328, "global_step": 394339, "epoch": 4751} {"train_loss": -25.92706298828125, "global_step": 394340, "epoch": 4751} {"train_loss": -26.438385009765625, "global_step": 394341, "epoch": 4751} {"train_loss": -26.043066024780273, "global_step": 394342, "epoch": 4751} {"train_loss": -26.482852935791016, "global_step": 394343, "epoch": 4751} {"train_loss": -26.363149642944336, "global_step": 394344, "epoch": 4751} {"train_loss": -26.512969970703125, "global_step": 394345, "epoch": 4751} {"train_loss": -26.417652130126953, "global_step": 394346, "epoch": 4751} {"train_loss": -26.245086669921875, "global_step": 394347, "epoch": 4751} {"train_loss": -26.67978858947754, "global_step": 394348, "epoch": 4751} {"train_loss": -26.771162033081055, "global_step": 394349, "epoch": 4751} {"train_loss": -26.38157081604004, "global_step": 394350, "epoch": 4751} {"train_loss": -26.69317054748535, "global_step": 394351, "epoch": 4751} {"train_loss": -26.43470573425293, "global_step": 394352, "epoch": 4751} {"train_loss": -26.28759765625, "global_step": 394353, "epoch": 4751} {"train_loss": -26.670438766479492, "global_step": 394354, "epoch": 4751} {"train_loss": -26.647693634033203, "global_step": 394355, "epoch": 4751} {"train_loss": -26.573217391967773, "global_step": 394356, "epoch": 4751} {"train_loss": -26.786823272705078, "global_step": 394357, "epoch": 4751} {"train_loss": -26.48995018005371, "global_step": 394358, "epoch": 4751} {"train_loss": -26.769317626953125, "global_step": 394359, "epoch": 4751} {"train_loss": -26.58701515197754, "global_step": 394360, "epoch": 4751} {"train_loss": -26.89841651916504, "global_step": 394361, "epoch": 4751} {"train_loss": -26.62794303894043, "global_step": 394362, "epoch": 4751} {"train_loss": -26.054357528686523, "global_step": 394363, "epoch": 4751} {"train_loss": -26.923416137695312, "global_step": 394364, "epoch": 4751} {"train_loss": -26.9461612701416, "global_step": 394365, "epoch": 4751} {"train_loss": -26.273649215698242, "global_step": 394366, "epoch": 4751} {"train_loss": -26.5327205657959, "global_step": 394367, "epoch": 4751} {"train_loss": -26.532672882080078, "global_step": 394368, "epoch": 4751} {"train_loss": -26.584768295288086, "global_step": 394369, "epoch": 4751} {"train_loss": -26.57745361328125, "global_step": 394370, "epoch": 4751} {"train_loss": -26.40960693359375, "global_step": 394371, "epoch": 4751} {"train_loss": -26.691726684570312, "global_step": 394372, "epoch": 4751} {"train_loss": -26.589710235595703, "global_step": 394373, "epoch": 4751} {"train_loss": -26.6505069732666, "global_step": 394374, "epoch": 4751} {"train_loss": -26.70328712463379, "global_step": 394375, "epoch": 4751} {"train_loss": -26.526166915893555, "global_step": 394376, "epoch": 4751} {"train_loss": -26.47002601623535, "global_step": 394377, "epoch": 4751} {"train_loss": -26.697406768798828, "global_step": 394378, "epoch": 4751} {"train_loss": -26.3554744720459, "global_step": 394379, "epoch": 4751} {"train_loss": -26.640485763549805, "global_step": 394380, "epoch": 4751} {"train_loss": -26.364145278930664, "global_step": 394381, "epoch": 4751} {"train_loss": -26.44819450378418, "global_step": 394382, "epoch": 4751} {"train_loss": -26.512948989868164, "global_step": 394383, "epoch": 4751} {"train_loss": -26.557077407836914, "global_step": 394384, "epoch": 4751} {"train_loss": -26.624013900756836, "global_step": 394385, "epoch": 4751} {"train_loss": -26.675220489501953, "global_step": 394386, "epoch": 4751} {"train_loss": -26.756000518798828, "global_step": 394387, "epoch": 4751} {"train_loss": -26.7901668548584, "global_step": 394388, "epoch": 4751} {"train_loss": -26.51043128967285, "global_step": 394389, "epoch": 4751} {"train_loss": -26.753692626953125, "global_step": 394390, "epoch": 4751} {"train_loss": -26.09602928161621, "global_step": 394391, "epoch": 4751} {"train_loss": -25.986135482788086, "global_step": 394392, "epoch": 4751} {"train_loss": -26.815088272094727, "global_step": 394393, "epoch": 4751} {"train_loss": -26.79776382446289, "global_step": 394394, "epoch": 4751} {"train_loss": -26.681304931640625, "global_step": 394395, "epoch": 4751} {"train_loss": -26.252933502197266, "global_step": 394396, "epoch": 4751} {"train_loss": -26.780059814453125, "global_step": 394397, "epoch": 4751} {"train_loss": -26.74399757385254, "global_step": 394398, "epoch": 4751} {"train_loss": -26.58984375, "global_step": 394399, "epoch": 4751} {"train_loss": -26.64851188659668, "global_step": 394400, "epoch": 4751} {"train_loss": -26.56019401550293, "global_step": 394401, "epoch": 4751} {"train_loss": -26.554174423217773, "global_step": 394402, "epoch": 4751} {"train_loss": -26.7138729095459, "global_step": 394403, "epoch": 4751} {"train_loss": -26.495925903320312, "global_step": 394404, "epoch": 4751} {"train_loss": -26.972497940063477, "global_step": 394405, "epoch": 4751} {"train_loss": -26.46917152404785, "global_step": 394406, "epoch": 4751} {"train_loss": -26.8207950592041, "global_step": 394407, "epoch": 4751} {"train_loss": -26.223737716674805, "global_step": 394408, "epoch": 4751} {"train_loss": -26.603784561157227, "global_step": 394409, "epoch": 4751} {"train_loss": -26.451154708862305, "global_step": 394410, "epoch": 4751} {"train_loss": -26.257856369018555, "global_step": 394411, "epoch": 4751} {"train_loss": -26.759496688842773, "global_step": 394412, "epoch": 4751} {"train_loss": -26.485126495361328, "global_step": 394413, "epoch": 4751} {"train_loss": -26.608591079711914, "global_step": 394414, "epoch": 4751} {"train_loss": -26.531415640589703, "global_step": 394415, "epoch": 4751, "val_loss": 6597709.0} {"train_loss": -26.19386100769043, "global_step": 394416, "epoch": 4752} {"train_loss": -25.87855339050293, "global_step": 394417, "epoch": 4752} {"train_loss": -26.249664306640625, "global_step": 394418, "epoch": 4752} {"train_loss": -25.97721290588379, "global_step": 394419, "epoch": 4752} {"train_loss": -26.845640182495117, "global_step": 394420, "epoch": 4752} {"train_loss": -25.98151969909668, "global_step": 394421, "epoch": 4752} {"train_loss": -26.394678115844727, "global_step": 394422, "epoch": 4752} {"train_loss": -26.35236167907715, "global_step": 394423, "epoch": 4752} {"train_loss": -26.596967697143555, "global_step": 394424, "epoch": 4752} {"train_loss": -26.188688278198242, "global_step": 394425, "epoch": 4752} {"train_loss": -26.3760986328125, "global_step": 394426, "epoch": 4752} {"train_loss": -26.219141006469727, "global_step": 394427, "epoch": 4752} {"train_loss": -26.133625030517578, "global_step": 394428, "epoch": 4752} {"train_loss": -26.7111873626709, "global_step": 394429, "epoch": 4752} {"train_loss": -25.965723037719727, "global_step": 394430, "epoch": 4752} {"train_loss": -26.31844139099121, "global_step": 394431, "epoch": 4752} {"train_loss": -26.17801856994629, "global_step": 394432, "epoch": 4752} {"train_loss": -26.417999267578125, "global_step": 394433, "epoch": 4752} {"train_loss": -26.134052276611328, "global_step": 394434, "epoch": 4752} {"train_loss": -26.732196807861328, "global_step": 394435, "epoch": 4752} {"train_loss": -26.5712947845459, "global_step": 394436, "epoch": 4752} {"train_loss": -26.205219268798828, "global_step": 394437, "epoch": 4752} {"train_loss": -26.3468017578125, "global_step": 394438, "epoch": 4752} {"train_loss": -26.420995712280273, "global_step": 394439, "epoch": 4752} {"train_loss": -26.632862091064453, "global_step": 394440, "epoch": 4752} {"train_loss": -26.569555282592773, "global_step": 394441, "epoch": 4752} {"train_loss": -26.27180290222168, "global_step": 394442, "epoch": 4752} {"train_loss": -26.581790924072266, "global_step": 394443, "epoch": 4752} {"train_loss": -26.686878204345703, "global_step": 394444, "epoch": 4752} {"train_loss": -26.769994735717773, "global_step": 394445, "epoch": 4752} {"train_loss": -26.387298583984375, "global_step": 394446, "epoch": 4752} {"train_loss": -26.55390739440918, "global_step": 394447, "epoch": 4752} {"train_loss": -26.49491310119629, "global_step": 394448, "epoch": 4752} {"train_loss": -26.7376651763916, "global_step": 394449, "epoch": 4752} {"train_loss": -26.727725982666016, "global_step": 394450, "epoch": 4752} {"train_loss": -27.032678604125977, "global_step": 394451, "epoch": 4752} {"train_loss": -26.401813507080078, "global_step": 394452, "epoch": 4752} {"train_loss": -26.5341854095459, "global_step": 394453, "epoch": 4752} {"train_loss": -26.618717193603516, "global_step": 394454, "epoch": 4752} {"train_loss": -26.655384063720703, "global_step": 394455, "epoch": 4752} {"train_loss": -26.625940322875977, "global_step": 394456, "epoch": 4752} {"train_loss": -26.790807723999023, "global_step": 394457, "epoch": 4752} {"train_loss": -26.79725456237793, "global_step": 394458, "epoch": 4752} {"train_loss": -27.155935287475586, "global_step": 394459, "epoch": 4752} {"train_loss": -26.828393936157227, "global_step": 394460, "epoch": 4752} {"train_loss": -26.7856388092041, "global_step": 394461, "epoch": 4752} {"train_loss": -26.806028366088867, "global_step": 394462, "epoch": 4752} {"train_loss": -26.89015007019043, "global_step": 394463, "epoch": 4752} {"train_loss": -27.096837997436523, "global_step": 394464, "epoch": 4752} {"train_loss": -26.945775985717773, "global_step": 394465, "epoch": 4752} {"train_loss": -26.655969619750977, "global_step": 394466, "epoch": 4752} {"train_loss": -26.840314865112305, "global_step": 394467, "epoch": 4752} {"train_loss": -27.175519943237305, "global_step": 394468, "epoch": 4752} {"train_loss": -26.652753829956055, "global_step": 394469, "epoch": 4752} {"train_loss": -25.883060455322266, "global_step": 394470, "epoch": 4752} {"train_loss": -25.778522491455078, "global_step": 394471, "epoch": 4752} {"train_loss": -25.47658348083496, "global_step": 394472, "epoch": 4752} {"train_loss": -26.00592041015625, "global_step": 394473, "epoch": 4752} {"train_loss": -26.52497673034668, "global_step": 394474, "epoch": 4752} {"train_loss": -25.45027732849121, "global_step": 394475, "epoch": 4752} {"train_loss": -26.213964462280273, "global_step": 394476, "epoch": 4752} {"train_loss": -25.8426456451416, "global_step": 394477, "epoch": 4752} {"train_loss": -26.46329116821289, "global_step": 394478, "epoch": 4752} {"train_loss": -26.556427001953125, "global_step": 394479, "epoch": 4752} {"train_loss": -26.584970474243164, "global_step": 394480, "epoch": 4752} {"train_loss": -26.822540283203125, "global_step": 394481, "epoch": 4752} {"train_loss": -26.201374053955078, "global_step": 394482, "epoch": 4752} {"train_loss": -26.262094497680664, "global_step": 394483, "epoch": 4752} {"train_loss": -26.255298614501953, "global_step": 394484, "epoch": 4752} {"train_loss": -26.075342178344727, "global_step": 394485, "epoch": 4752} {"train_loss": -26.37696647644043, "global_step": 394486, "epoch": 4752} {"train_loss": -26.05438232421875, "global_step": 394487, "epoch": 4752} {"train_loss": -26.419921875, "global_step": 394488, "epoch": 4752} {"train_loss": -26.5539493560791, "global_step": 394489, "epoch": 4752} {"train_loss": -26.034292221069336, "global_step": 394490, "epoch": 4752} {"train_loss": -25.7801456451416, "global_step": 394491, "epoch": 4752} {"train_loss": -26.367298126220703, "global_step": 394492, "epoch": 4752} {"train_loss": -26.29391860961914, "global_step": 394493, "epoch": 4752} {"train_loss": -25.785146713256836, "global_step": 394494, "epoch": 4752} {"train_loss": -25.678449630737305, "global_step": 394495, "epoch": 4752} {"train_loss": -25.907007217407227, "global_step": 394496, "epoch": 4752} {"train_loss": -26.1866512298584, "global_step": 394497, "epoch": 4752} {"train_loss": -26.412919193865307, "global_step": 394498, "epoch": 4752, "val_loss": 6657768.0} {"train_loss": -25.60052490234375, "global_step": 394499, "epoch": 4753} {"train_loss": -25.838708877563477, "global_step": 394500, "epoch": 4753} {"train_loss": -26.01051139831543, "global_step": 394501, "epoch": 4753} {"train_loss": -25.81756591796875, "global_step": 394502, "epoch": 4753} {"train_loss": -26.112903594970703, "global_step": 394503, "epoch": 4753} {"train_loss": -26.170270919799805, "global_step": 394504, "epoch": 4753} {"train_loss": -25.799657821655273, "global_step": 394505, "epoch": 4753} {"train_loss": -25.683765411376953, "global_step": 394506, "epoch": 4753} {"train_loss": -25.891016006469727, "global_step": 394507, "epoch": 4753} {"train_loss": -25.9716854095459, "global_step": 394508, "epoch": 4753} {"train_loss": -26.018552780151367, "global_step": 394509, "epoch": 4753} {"train_loss": -25.868209838867188, "global_step": 394510, "epoch": 4753} {"train_loss": -26.05031394958496, "global_step": 394511, "epoch": 4753} {"train_loss": -25.923721313476562, "global_step": 394512, "epoch": 4753} {"train_loss": -26.3216609954834, "global_step": 394513, "epoch": 4753} {"train_loss": -25.85682487487793, "global_step": 394514, "epoch": 4753} {"train_loss": -26.10245704650879, "global_step": 394515, "epoch": 4753} {"train_loss": -26.5318603515625, "global_step": 394516, "epoch": 4753} {"train_loss": -26.291839599609375, "global_step": 394517, "epoch": 4753} {"train_loss": -26.332128524780273, "global_step": 394518, "epoch": 4753} {"train_loss": -26.160497665405273, "global_step": 394519, "epoch": 4753} {"train_loss": -26.114490509033203, "global_step": 394520, "epoch": 4753} {"train_loss": -26.644495010375977, "global_step": 394521, "epoch": 4753} {"train_loss": -26.27203369140625, "global_step": 394522, "epoch": 4753} {"train_loss": -26.34286880493164, "global_step": 394523, "epoch": 4753} {"train_loss": -26.621625900268555, "global_step": 394524, "epoch": 4753} {"train_loss": -26.286901473999023, "global_step": 394525, "epoch": 4753} {"train_loss": -26.431934356689453, "global_step": 394526, "epoch": 4753} {"train_loss": -26.235244750976562, "global_step": 394527, "epoch": 4753} {"train_loss": -26.61866569519043, "global_step": 394528, "epoch": 4753} {"train_loss": -26.728927612304688, "global_step": 394529, "epoch": 4753} {"train_loss": -26.627344131469727, "global_step": 394530, "epoch": 4753} {"train_loss": -26.39312171936035, "global_step": 394531, "epoch": 4753} {"train_loss": -26.569982528686523, "global_step": 394532, "epoch": 4753} {"train_loss": -26.41054344177246, "global_step": 394533, "epoch": 4753} {"train_loss": -26.682844161987305, "global_step": 394534, "epoch": 4753} {"train_loss": -26.4520320892334, "global_step": 394535, "epoch": 4753} {"train_loss": -26.560571670532227, "global_step": 394536, "epoch": 4753} {"train_loss": -26.715225219726562, "global_step": 394537, "epoch": 4753} {"train_loss": -26.60679054260254, "global_step": 394538, "epoch": 4753} {"train_loss": -26.940168380737305, "global_step": 394539, "epoch": 4753} {"train_loss": -26.635730743408203, "global_step": 394540, "epoch": 4753} {"train_loss": -26.609699249267578, "global_step": 394541, "epoch": 4753} {"train_loss": -26.866291046142578, "global_step": 394542, "epoch": 4753} {"train_loss": -26.20564079284668, "global_step": 394543, "epoch": 4753} {"train_loss": -26.556066513061523, "global_step": 394544, "epoch": 4753} {"train_loss": -26.333837509155273, "global_step": 394545, "epoch": 4753} {"train_loss": -26.648895263671875, "global_step": 394546, "epoch": 4753} {"train_loss": -26.614023208618164, "global_step": 394547, "epoch": 4753} {"train_loss": -26.78753089904785, "global_step": 394548, "epoch": 4753} {"train_loss": -26.708154678344727, "global_step": 394549, "epoch": 4753} {"train_loss": -26.84524917602539, "global_step": 394550, "epoch": 4753} {"train_loss": -27.03814697265625, "global_step": 394551, "epoch": 4753} {"train_loss": -26.623159408569336, "global_step": 394552, "epoch": 4753} {"train_loss": -26.465978622436523, "global_step": 394553, "epoch": 4753} {"train_loss": -26.526336669921875, "global_step": 394554, "epoch": 4753} {"train_loss": -26.79142189025879, "global_step": 394555, "epoch": 4753} {"train_loss": -26.87619972229004, "global_step": 394556, "epoch": 4753} {"train_loss": -26.954837799072266, "global_step": 394557, "epoch": 4753} {"train_loss": -26.669147491455078, "global_step": 394558, "epoch": 4753} {"train_loss": -27.24237632751465, "global_step": 394559, "epoch": 4753} {"train_loss": -26.8978328704834, "global_step": 394560, "epoch": 4753} {"train_loss": -27.092737197875977, "global_step": 394561, "epoch": 4753} {"train_loss": -26.4637451171875, "global_step": 394562, "epoch": 4753} {"train_loss": -26.7177791595459, "global_step": 394563, "epoch": 4753} {"train_loss": -26.891132354736328, "global_step": 394564, "epoch": 4753} {"train_loss": -26.086957931518555, "global_step": 394565, "epoch": 4753} {"train_loss": -25.02350425720215, "global_step": 394566, "epoch": 4753} {"train_loss": -25.577096939086914, "global_step": 394567, "epoch": 4753} {"train_loss": -26.372882843017578, "global_step": 394568, "epoch": 4753} {"train_loss": -26.512903213500977, "global_step": 394569, "epoch": 4753} {"train_loss": -25.9606876373291, "global_step": 394570, "epoch": 4753} {"train_loss": -26.342731475830078, "global_step": 394571, "epoch": 4753} {"train_loss": -26.078527450561523, "global_step": 394572, "epoch": 4753} {"train_loss": -26.127079010009766, "global_step": 394573, "epoch": 4753} {"train_loss": -25.69732666015625, "global_step": 394574, "epoch": 4753} {"train_loss": -26.3894100189209, "global_step": 394575, "epoch": 4753} {"train_loss": -25.73805046081543, "global_step": 394576, "epoch": 4753} {"train_loss": -25.847335815429688, "global_step": 394577, "epoch": 4753} {"train_loss": -26.194854736328125, "global_step": 394578, "epoch": 4753} {"train_loss": -26.418670654296875, "global_step": 394579, "epoch": 4753} {"train_loss": -25.876174926757812, "global_step": 394580, "epoch": 4753} {"train_loss": -26.348668845303088, "global_step": 394581, "epoch": 4753, "val_loss": 6740831.0} {"train_loss": -25.633920669555664, "global_step": 394582, "epoch": 4754} {"train_loss": -25.900876998901367, "global_step": 394583, "epoch": 4754} {"train_loss": -25.791065216064453, "global_step": 394584, "epoch": 4754} {"train_loss": -26.018756866455078, "global_step": 394585, "epoch": 4754} {"train_loss": -26.19209861755371, "global_step": 394586, "epoch": 4754} {"train_loss": -25.934417724609375, "global_step": 394587, "epoch": 4754} {"train_loss": -26.521472930908203, "global_step": 394588, "epoch": 4754} {"train_loss": -25.876638412475586, "global_step": 394589, "epoch": 4754} {"train_loss": -26.287342071533203, "global_step": 394590, "epoch": 4754} {"train_loss": -26.16682243347168, "global_step": 394591, "epoch": 4754} {"train_loss": -26.2393856048584, "global_step": 394592, "epoch": 4754} {"train_loss": -26.363889694213867, "global_step": 394593, "epoch": 4754} {"train_loss": -26.178796768188477, "global_step": 394594, "epoch": 4754} {"train_loss": -26.291528701782227, "global_step": 394595, "epoch": 4754} {"train_loss": -26.569427490234375, "global_step": 394596, "epoch": 4754} {"train_loss": -26.16656494140625, "global_step": 394597, "epoch": 4754} {"train_loss": -26.61053466796875, "global_step": 394598, "epoch": 4754} {"train_loss": -26.62201499938965, "global_step": 394599, "epoch": 4754} {"train_loss": -26.588525772094727, "global_step": 394600, "epoch": 4754} {"train_loss": -26.57643699645996, "global_step": 394601, "epoch": 4754} {"train_loss": -26.250579833984375, "global_step": 394602, "epoch": 4754} {"train_loss": -26.585285186767578, "global_step": 394603, "epoch": 4754} {"train_loss": -26.259963989257812, "global_step": 394604, "epoch": 4754} {"train_loss": -26.821969985961914, "global_step": 394605, "epoch": 4754} {"train_loss": -26.45891761779785, "global_step": 394606, "epoch": 4754} {"train_loss": -26.5382137298584, "global_step": 394607, "epoch": 4754} {"train_loss": -26.71746826171875, "global_step": 394608, "epoch": 4754} {"train_loss": -26.764326095581055, "global_step": 394609, "epoch": 4754} {"train_loss": -26.592548370361328, "global_step": 394610, "epoch": 4754} {"train_loss": -26.84210205078125, "global_step": 394611, "epoch": 4754} {"train_loss": -26.964574813842773, "global_step": 394612, "epoch": 4754} {"train_loss": -26.99663734436035, "global_step": 394613, "epoch": 4754} {"train_loss": -26.66804313659668, "global_step": 394614, "epoch": 4754} {"train_loss": -26.68914222717285, "global_step": 394615, "epoch": 4754} {"train_loss": -26.361059188842773, "global_step": 394616, "epoch": 4754} {"train_loss": -26.72737693786621, "global_step": 394617, "epoch": 4754} {"train_loss": -26.711734771728516, "global_step": 394618, "epoch": 4754} {"train_loss": -26.87576675415039, "global_step": 394619, "epoch": 4754} {"train_loss": -26.27107810974121, "global_step": 394620, "epoch": 4754} {"train_loss": -26.58973503112793, "global_step": 394621, "epoch": 4754} {"train_loss": -26.478361129760742, "global_step": 394622, "epoch": 4754} {"train_loss": -26.713422775268555, "global_step": 394623, "epoch": 4754} {"train_loss": -26.43291664123535, "global_step": 394624, "epoch": 4754} {"train_loss": -26.659387588500977, "global_step": 394625, "epoch": 4754} {"train_loss": -26.306249618530273, "global_step": 394626, "epoch": 4754} {"train_loss": -26.160146713256836, "global_step": 394627, "epoch": 4754} {"train_loss": -26.299997329711914, "global_step": 394628, "epoch": 4754} {"train_loss": -26.8281307220459, "global_step": 394629, "epoch": 4754} {"train_loss": -26.629547119140625, "global_step": 394630, "epoch": 4754} {"train_loss": -26.389867782592773, "global_step": 394631, "epoch": 4754} {"train_loss": -26.52509880065918, "global_step": 394632, "epoch": 4754} {"train_loss": -26.695571899414062, "global_step": 394633, "epoch": 4754} {"train_loss": -26.68281364440918, "global_step": 394634, "epoch": 4754} {"train_loss": -26.58778190612793, "global_step": 394635, "epoch": 4754} {"train_loss": -26.794775009155273, "global_step": 394636, "epoch": 4754} {"train_loss": -27.002355575561523, "global_step": 394637, "epoch": 4754} {"train_loss": -26.53254508972168, "global_step": 394638, "epoch": 4754} {"train_loss": -26.716230392456055, "global_step": 394639, "epoch": 4754} {"train_loss": -26.47954750061035, "global_step": 394640, "epoch": 4754} {"train_loss": -26.747425079345703, "global_step": 394641, "epoch": 4754} {"train_loss": -26.79571533203125, "global_step": 394642, "epoch": 4754} {"train_loss": -26.83159828186035, "global_step": 394643, "epoch": 4754} {"train_loss": -26.529865264892578, "global_step": 394644, "epoch": 4754} {"train_loss": -26.862415313720703, "global_step": 394645, "epoch": 4754} {"train_loss": -26.5456600189209, "global_step": 394646, "epoch": 4754} {"train_loss": -26.55183219909668, "global_step": 394647, "epoch": 4754} {"train_loss": -26.909137725830078, "global_step": 394648, "epoch": 4754} {"train_loss": -26.895383834838867, "global_step": 394649, "epoch": 4754} {"train_loss": -26.942296981811523, "global_step": 394650, "epoch": 4754} {"train_loss": -26.81043815612793, "global_step": 394651, "epoch": 4754} {"train_loss": -26.900358200073242, "global_step": 394652, "epoch": 4754} {"train_loss": -26.910465240478516, "global_step": 394653, "epoch": 4754} {"train_loss": -26.6732177734375, "global_step": 394654, "epoch": 4754} {"train_loss": -26.809167861938477, "global_step": 394655, "epoch": 4754} {"train_loss": -26.62473487854004, "global_step": 394656, "epoch": 4754} {"train_loss": -26.647907257080078, "global_step": 394657, "epoch": 4754} {"train_loss": -26.7238826751709, "global_step": 394658, "epoch": 4754} {"train_loss": -26.7060546875, "global_step": 394659, "epoch": 4754} {"train_loss": -26.662389755249023, "global_step": 394660, "epoch": 4754} {"train_loss": -26.389434814453125, "global_step": 394661, "epoch": 4754} {"train_loss": -26.657001495361328, "global_step": 394662, "epoch": 4754} {"train_loss": -26.532318115234375, "global_step": 394663, "epoch": 4754} {"train_loss": -26.544545552816736, "global_step": 394664, "epoch": 4754, "val_loss": 6661885.0} {"train_loss": -26.2991943359375, "global_step": 394665, "epoch": 4755} {"train_loss": -25.630170822143555, "global_step": 394666, "epoch": 4755} {"train_loss": -26.02924919128418, "global_step": 394667, "epoch": 4755} {"train_loss": -25.564416885375977, "global_step": 394668, "epoch": 4755} {"train_loss": -24.90570640563965, "global_step": 394669, "epoch": 4755} {"train_loss": -24.531124114990234, "global_step": 394670, "epoch": 4755} {"train_loss": -25.261064529418945, "global_step": 394671, "epoch": 4755} {"train_loss": -26.133996963500977, "global_step": 394672, "epoch": 4755} {"train_loss": -25.694690704345703, "global_step": 394673, "epoch": 4755} {"train_loss": -26.647083282470703, "global_step": 394674, "epoch": 4755} {"train_loss": -26.302143096923828, "global_step": 394675, "epoch": 4755} {"train_loss": -26.33683204650879, "global_step": 394676, "epoch": 4755} {"train_loss": -26.2379207611084, "global_step": 394677, "epoch": 4755} {"train_loss": -25.7279052734375, "global_step": 394678, "epoch": 4755} {"train_loss": -25.73797035217285, "global_step": 394679, "epoch": 4755} {"train_loss": -26.01995277404785, "global_step": 394680, "epoch": 4755} {"train_loss": -26.175485610961914, "global_step": 394681, "epoch": 4755} {"train_loss": -25.963342666625977, "global_step": 394682, "epoch": 4755} {"train_loss": -26.1675968170166, "global_step": 394683, "epoch": 4755} {"train_loss": -26.287561416625977, "global_step": 394684, "epoch": 4755} {"train_loss": -26.439395904541016, "global_step": 394685, "epoch": 4755} {"train_loss": -26.36494255065918, "global_step": 394686, "epoch": 4755} {"train_loss": -26.28085708618164, "global_step": 394687, "epoch": 4755} {"train_loss": -26.23823356628418, "global_step": 394688, "epoch": 4755} {"train_loss": -26.303308486938477, "global_step": 394689, "epoch": 4755} {"train_loss": -26.280698776245117, "global_step": 394690, "epoch": 4755} {"train_loss": -26.038455963134766, "global_step": 394691, "epoch": 4755} {"train_loss": -26.61334228515625, "global_step": 394692, "epoch": 4755} {"train_loss": -25.97737693786621, "global_step": 394693, "epoch": 4755} {"train_loss": -26.43413734436035, "global_step": 394694, "epoch": 4755} {"train_loss": -26.72039222717285, "global_step": 394695, "epoch": 4755} {"train_loss": -26.605798721313477, "global_step": 394696, "epoch": 4755} {"train_loss": -26.45001792907715, "global_step": 394697, "epoch": 4755} {"train_loss": -26.3716983795166, "global_step": 394698, "epoch": 4755} {"train_loss": -26.90692138671875, "global_step": 394699, "epoch": 4755} {"train_loss": -26.45379066467285, "global_step": 394700, "epoch": 4755} {"train_loss": -26.31928825378418, "global_step": 394701, "epoch": 4755} {"train_loss": -25.9952335357666, "global_step": 394702, "epoch": 4755} {"train_loss": -26.777502059936523, "global_step": 394703, "epoch": 4755} {"train_loss": -26.803699493408203, "global_step": 394704, "epoch": 4755} {"train_loss": -26.571929931640625, "global_step": 394705, "epoch": 4755} {"train_loss": -26.801971435546875, "global_step": 394706, "epoch": 4755} {"train_loss": -26.694982528686523, "global_step": 394707, "epoch": 4755} {"train_loss": -26.356786727905273, "global_step": 394708, "epoch": 4755} {"train_loss": -26.661283493041992, "global_step": 394709, "epoch": 4755} {"train_loss": -26.7052001953125, "global_step": 394710, "epoch": 4755} {"train_loss": -26.841018676757812, "global_step": 394711, "epoch": 4755} {"train_loss": -26.190534591674805, "global_step": 394712, "epoch": 4755} {"train_loss": -26.490222930908203, "global_step": 394713, "epoch": 4755} {"train_loss": -26.556201934814453, "global_step": 394714, "epoch": 4755} {"train_loss": -26.4860782623291, "global_step": 394715, "epoch": 4755} {"train_loss": -26.65347671508789, "global_step": 394716, "epoch": 4755} {"train_loss": -26.69056510925293, "global_step": 394717, "epoch": 4755} {"train_loss": -26.830121994018555, "global_step": 394718, "epoch": 4755} {"train_loss": -26.525226593017578, "global_step": 394719, "epoch": 4755} {"train_loss": -26.86403465270996, "global_step": 394720, "epoch": 4755} {"train_loss": -26.42575454711914, "global_step": 394721, "epoch": 4755} {"train_loss": -26.67974853515625, "global_step": 394722, "epoch": 4755} {"train_loss": -26.49859046936035, "global_step": 394723, "epoch": 4755} {"train_loss": -26.718658447265625, "global_step": 394724, "epoch": 4755} {"train_loss": -26.951904296875, "global_step": 394725, "epoch": 4755} {"train_loss": -26.765857696533203, "global_step": 394726, "epoch": 4755} {"train_loss": -26.62920570373535, "global_step": 394727, "epoch": 4755} {"train_loss": -26.68548583984375, "global_step": 394728, "epoch": 4755} {"train_loss": -26.735742568969727, "global_step": 394729, "epoch": 4755} {"train_loss": -26.37807273864746, "global_step": 394730, "epoch": 4755} {"train_loss": -26.597721099853516, "global_step": 394731, "epoch": 4755} {"train_loss": -26.646055221557617, "global_step": 394732, "epoch": 4755} {"train_loss": -26.73993492126465, "global_step": 394733, "epoch": 4755} {"train_loss": -26.622922897338867, "global_step": 394734, "epoch": 4755} {"train_loss": -26.50567054748535, "global_step": 394735, "epoch": 4755} {"train_loss": -26.707275390625, "global_step": 394736, "epoch": 4755} {"train_loss": -26.66607093811035, "global_step": 394737, "epoch": 4755} {"train_loss": -26.85890007019043, "global_step": 394738, "epoch": 4755} {"train_loss": -26.683609008789062, "global_step": 394739, "epoch": 4755} {"train_loss": -26.630985260009766, "global_step": 394740, "epoch": 4755} {"train_loss": -26.827322006225586, "global_step": 394741, "epoch": 4755} {"train_loss": -26.773223876953125, "global_step": 394742, "epoch": 4755} {"train_loss": -26.45283317565918, "global_step": 394743, "epoch": 4755} {"train_loss": -26.5707950592041, "global_step": 394744, "epoch": 4755} {"train_loss": -26.79558753967285, "global_step": 394745, "epoch": 4755} {"train_loss": -26.791208267211914, "global_step": 394746, "epoch": 4755} {"train_loss": -26.409296518348786, "global_step": 394747, "epoch": 4755, "val_loss": 6580442.0} {"train_loss": -25.979358673095703, "global_step": 394748, "epoch": 4756} {"train_loss": -26.0609188079834, "global_step": 394749, "epoch": 4756} {"train_loss": -26.583539962768555, "global_step": 394750, "epoch": 4756} {"train_loss": -26.612497329711914, "global_step": 394751, "epoch": 4756} {"train_loss": -26.5527400970459, "global_step": 394752, "epoch": 4756} {"train_loss": -26.37592124938965, "global_step": 394753, "epoch": 4756} {"train_loss": -26.044544219970703, "global_step": 394754, "epoch": 4756} {"train_loss": -26.565540313720703, "global_step": 394755, "epoch": 4756} {"train_loss": -26.20049476623535, "global_step": 394756, "epoch": 4756} {"train_loss": -26.106298446655273, "global_step": 394757, "epoch": 4756} {"train_loss": -26.512121200561523, "global_step": 394758, "epoch": 4756} {"train_loss": -26.574899673461914, "global_step": 394759, "epoch": 4756} {"train_loss": -25.9576358795166, "global_step": 394760, "epoch": 4756} {"train_loss": -26.420501708984375, "global_step": 394761, "epoch": 4756} {"train_loss": -26.17115592956543, "global_step": 394762, "epoch": 4756} {"train_loss": -26.733312606811523, "global_step": 394763, "epoch": 4756} {"train_loss": -26.247333526611328, "global_step": 394764, "epoch": 4756} {"train_loss": -25.68316650390625, "global_step": 394765, "epoch": 4756} {"train_loss": -26.347721099853516, "global_step": 394766, "epoch": 4756} {"train_loss": -26.370275497436523, "global_step": 394767, "epoch": 4756} {"train_loss": -26.152515411376953, "global_step": 394768, "epoch": 4756} {"train_loss": -26.351245880126953, "global_step": 394769, "epoch": 4756} {"train_loss": -26.519433975219727, "global_step": 394770, "epoch": 4756} {"train_loss": -26.234039306640625, "global_step": 394771, "epoch": 4756} {"train_loss": -26.105987548828125, "global_step": 394772, "epoch": 4756} {"train_loss": -25.998022079467773, "global_step": 394773, "epoch": 4756} {"train_loss": -26.366193771362305, "global_step": 394774, "epoch": 4756} {"train_loss": -26.248945236206055, "global_step": 394775, "epoch": 4756} {"train_loss": -26.442670822143555, "global_step": 394776, "epoch": 4756} {"train_loss": -26.41290855407715, "global_step": 394777, "epoch": 4756} {"train_loss": -26.374887466430664, "global_step": 394778, "epoch": 4756} {"train_loss": -26.159454345703125, "global_step": 394779, "epoch": 4756} {"train_loss": -26.509458541870117, "global_step": 394780, "epoch": 4756} {"train_loss": -26.15410804748535, "global_step": 394781, "epoch": 4756} {"train_loss": -26.40680503845215, "global_step": 394782, "epoch": 4756} {"train_loss": -26.446460723876953, "global_step": 394783, "epoch": 4756} {"train_loss": -26.26307487487793, "global_step": 394784, "epoch": 4756} {"train_loss": -26.685317993164062, "global_step": 394785, "epoch": 4756} {"train_loss": -26.818592071533203, "global_step": 394786, "epoch": 4756} {"train_loss": -26.609601974487305, "global_step": 394787, "epoch": 4756} {"train_loss": -26.294010162353516, "global_step": 394788, "epoch": 4756} {"train_loss": -26.770490646362305, "global_step": 394789, "epoch": 4756} {"train_loss": -26.56681251525879, "global_step": 394790, "epoch": 4756} {"train_loss": -26.59071159362793, "global_step": 394791, "epoch": 4756} {"train_loss": -26.889179229736328, "global_step": 394792, "epoch": 4756} {"train_loss": -26.689191818237305, "global_step": 394793, "epoch": 4756} {"train_loss": -26.082300186157227, "global_step": 394794, "epoch": 4756} {"train_loss": -26.37311363220215, "global_step": 394795, "epoch": 4756} {"train_loss": -26.853382110595703, "global_step": 394796, "epoch": 4756} {"train_loss": -26.697052001953125, "global_step": 394797, "epoch": 4756} {"train_loss": -26.566869735717773, "global_step": 394798, "epoch": 4756} {"train_loss": -26.62554359436035, "global_step": 394799, "epoch": 4756} {"train_loss": -26.567785263061523, "global_step": 394800, "epoch": 4756} {"train_loss": -26.855390548706055, "global_step": 394801, "epoch": 4756} {"train_loss": -26.977502822875977, "global_step": 394802, "epoch": 4756} {"train_loss": -26.714487075805664, "global_step": 394803, "epoch": 4756} {"train_loss": -26.655298233032227, "global_step": 394804, "epoch": 4756} {"train_loss": -26.9506778717041, "global_step": 394805, "epoch": 4756} {"train_loss": -26.883014678955078, "global_step": 394806, "epoch": 4756} {"train_loss": -26.548145294189453, "global_step": 394807, "epoch": 4756} {"train_loss": -26.480484008789062, "global_step": 394808, "epoch": 4756} {"train_loss": -26.535907745361328, "global_step": 394809, "epoch": 4756} {"train_loss": -26.696563720703125, "global_step": 394810, "epoch": 4756} {"train_loss": -26.734241485595703, "global_step": 394811, "epoch": 4756} {"train_loss": -26.9121036529541, "global_step": 394812, "epoch": 4756} {"train_loss": -26.46160888671875, "global_step": 394813, "epoch": 4756} {"train_loss": -26.47028160095215, "global_step": 394814, "epoch": 4756} {"train_loss": -26.688730239868164, "global_step": 394815, "epoch": 4756} {"train_loss": -26.5593318939209, "global_step": 394816, "epoch": 4756} {"train_loss": -26.2935848236084, "global_step": 394817, "epoch": 4756} {"train_loss": -26.592945098876953, "global_step": 394818, "epoch": 4756} {"train_loss": -26.384103775024414, "global_step": 394819, "epoch": 4756} {"train_loss": -26.536001205444336, "global_step": 394820, "epoch": 4756} {"train_loss": -25.89374351501465, "global_step": 394821, "epoch": 4756} {"train_loss": -26.1386661529541, "global_step": 394822, "epoch": 4756} {"train_loss": -26.52900505065918, "global_step": 394823, "epoch": 4756} {"train_loss": -26.964435577392578, "global_step": 394824, "epoch": 4756} {"train_loss": -26.369464874267578, "global_step": 394825, "epoch": 4756} {"train_loss": -26.6011962890625, "global_step": 394826, "epoch": 4756} {"train_loss": -26.597631454467773, "global_step": 394827, "epoch": 4756} {"train_loss": -26.58428382873535, "global_step": 394828, "epoch": 4756} {"train_loss": -26.576623916625977, "global_step": 394829, "epoch": 4756} {"train_loss": -26.46451095213373, "global_step": 394830, "epoch": 4756, "val_loss": 6563364.0} {"train_loss": -25.8541316986084, "global_step": 394831, "epoch": 4757} {"train_loss": -25.584348678588867, "global_step": 394832, "epoch": 4757} {"train_loss": -26.752017974853516, "global_step": 394833, "epoch": 4757} {"train_loss": -25.83063316345215, "global_step": 394834, "epoch": 4757} {"train_loss": -25.9791202545166, "global_step": 394835, "epoch": 4757} {"train_loss": -25.78815269470215, "global_step": 394836, "epoch": 4757} {"train_loss": -26.021839141845703, "global_step": 394837, "epoch": 4757} {"train_loss": -26.21278190612793, "global_step": 394838, "epoch": 4757} {"train_loss": -25.852712631225586, "global_step": 394839, "epoch": 4757} {"train_loss": -25.77239990234375, "global_step": 394840, "epoch": 4757} {"train_loss": -26.066375732421875, "global_step": 394841, "epoch": 4757} {"train_loss": -26.18133544921875, "global_step": 394842, "epoch": 4757} {"train_loss": -26.204614639282227, "global_step": 394843, "epoch": 4757} {"train_loss": -26.316442489624023, "global_step": 394844, "epoch": 4757} {"train_loss": -26.119977951049805, "global_step": 394845, "epoch": 4757} {"train_loss": -26.495391845703125, "global_step": 394846, "epoch": 4757} {"train_loss": -26.36231803894043, "global_step": 394847, "epoch": 4757} {"train_loss": -26.468393325805664, "global_step": 394848, "epoch": 4757} {"train_loss": -26.491525650024414, "global_step": 394849, "epoch": 4757} {"train_loss": -26.454376220703125, "global_step": 394850, "epoch": 4757} {"train_loss": -26.674665451049805, "global_step": 394851, "epoch": 4757} {"train_loss": -26.2977237701416, "global_step": 394852, "epoch": 4757} {"train_loss": -26.45270347595215, "global_step": 394853, "epoch": 4757} {"train_loss": -26.23031997680664, "global_step": 394854, "epoch": 4757} {"train_loss": -26.205698013305664, "global_step": 394855, "epoch": 4757} {"train_loss": -26.362577438354492, "global_step": 394856, "epoch": 4757} {"train_loss": -26.282407760620117, "global_step": 394857, "epoch": 4757} {"train_loss": -26.686206817626953, "global_step": 394858, "epoch": 4757} {"train_loss": -26.509469985961914, "global_step": 394859, "epoch": 4757} {"train_loss": -26.52168083190918, "global_step": 394860, "epoch": 4757} {"train_loss": -26.315664291381836, "global_step": 394861, "epoch": 4757} {"train_loss": -26.50641441345215, "global_step": 394862, "epoch": 4757} {"train_loss": -26.452499389648438, "global_step": 394863, "epoch": 4757} {"train_loss": -26.249755859375, "global_step": 394864, "epoch": 4757} {"train_loss": -26.789648056030273, "global_step": 394865, "epoch": 4757} {"train_loss": -26.518964767456055, "global_step": 394866, "epoch": 4757} {"train_loss": -26.781030654907227, "global_step": 394867, "epoch": 4757} {"train_loss": -26.58212661743164, "global_step": 394868, "epoch": 4757} {"train_loss": -26.40540885925293, "global_step": 394869, "epoch": 4757} {"train_loss": -26.7058048248291, "global_step": 394870, "epoch": 4757} {"train_loss": -26.777448654174805, "global_step": 394871, "epoch": 4757} {"train_loss": -26.061115264892578, "global_step": 394872, "epoch": 4757} {"train_loss": -26.42997169494629, "global_step": 394873, "epoch": 4757} {"train_loss": -26.727643966674805, "global_step": 394874, "epoch": 4757} {"train_loss": -26.758649826049805, "global_step": 394875, "epoch": 4757} {"train_loss": -26.49191665649414, "global_step": 394876, "epoch": 4757} {"train_loss": -26.35188102722168, "global_step": 394877, "epoch": 4757} {"train_loss": -26.845869064331055, "global_step": 394878, "epoch": 4757} {"train_loss": -26.49855613708496, "global_step": 394879, "epoch": 4757} {"train_loss": -26.411380767822266, "global_step": 394880, "epoch": 4757} {"train_loss": -26.587549209594727, "global_step": 394881, "epoch": 4757} {"train_loss": -26.797962188720703, "global_step": 394882, "epoch": 4757} {"train_loss": -26.852807998657227, "global_step": 394883, "epoch": 4757} {"train_loss": -26.55634880065918, "global_step": 394884, "epoch": 4757} {"train_loss": -26.13644790649414, "global_step": 394885, "epoch": 4757} {"train_loss": -26.38421630859375, "global_step": 394886, "epoch": 4757} {"train_loss": -26.5371036529541, "global_step": 394887, "epoch": 4757} {"train_loss": -26.55975914001465, "global_step": 394888, "epoch": 4757} {"train_loss": -26.788755416870117, "global_step": 394889, "epoch": 4757} {"train_loss": -26.317535400390625, "global_step": 394890, "epoch": 4757} {"train_loss": -26.58506202697754, "global_step": 394891, "epoch": 4757} {"train_loss": -26.446741104125977, "global_step": 394892, "epoch": 4757} {"train_loss": -26.929584503173828, "global_step": 394893, "epoch": 4757} {"train_loss": -26.595666885375977, "global_step": 394894, "epoch": 4757} {"train_loss": -26.924896240234375, "global_step": 394895, "epoch": 4757} {"train_loss": -26.940723419189453, "global_step": 394896, "epoch": 4757} {"train_loss": -26.679819107055664, "global_step": 394897, "epoch": 4757} {"train_loss": -26.923233032226562, "global_step": 394898, "epoch": 4757} {"train_loss": -26.9866943359375, "global_step": 394899, "epoch": 4757} {"train_loss": -26.72987174987793, "global_step": 394900, "epoch": 4757} {"train_loss": -27.140888214111328, "global_step": 394901, "epoch": 4757} {"train_loss": -26.699771881103516, "global_step": 394902, "epoch": 4757} {"train_loss": -26.728025436401367, "global_step": 394903, "epoch": 4757} {"train_loss": -26.764312744140625, "global_step": 394904, "epoch": 4757} {"train_loss": -26.393173217773438, "global_step": 394905, "epoch": 4757} {"train_loss": -26.838693618774414, "global_step": 394906, "epoch": 4757} {"train_loss": -26.946775436401367, "global_step": 394907, "epoch": 4757} {"train_loss": -26.75355339050293, "global_step": 394908, "epoch": 4757} {"train_loss": -26.64328384399414, "global_step": 394909, "epoch": 4757} {"train_loss": -26.557477951049805, "global_step": 394910, "epoch": 4757} {"train_loss": -26.6121883392334, "global_step": 394911, "epoch": 4757} {"train_loss": -26.52019691467285, "global_step": 394912, "epoch": 4757} {"train_loss": -26.462060629603375, "global_step": 394913, "epoch": 4757, "val_loss": 6668314.0} {"train_loss": -24.854177474975586, "global_step": 394914, "epoch": 4758} {"train_loss": -23.476516723632812, "global_step": 394915, "epoch": 4758} {"train_loss": -25.222274780273438, "global_step": 394916, "epoch": 4758} {"train_loss": -24.893529891967773, "global_step": 394917, "epoch": 4758} {"train_loss": -24.314786911010742, "global_step": 394918, "epoch": 4758} {"train_loss": -25.24527931213379, "global_step": 394919, "epoch": 4758} {"train_loss": -25.168773651123047, "global_step": 394920, "epoch": 4758} {"train_loss": -25.230905532836914, "global_step": 394921, "epoch": 4758} {"train_loss": -25.655609130859375, "global_step": 394922, "epoch": 4758} {"train_loss": -25.533098220825195, "global_step": 394923, "epoch": 4758} {"train_loss": -25.561965942382812, "global_step": 394924, "epoch": 4758} {"train_loss": -25.10799789428711, "global_step": 394925, "epoch": 4758} {"train_loss": -25.904438018798828, "global_step": 394926, "epoch": 4758} {"train_loss": -25.49686050415039, "global_step": 394927, "epoch": 4758} {"train_loss": -25.90760612487793, "global_step": 394928, "epoch": 4758} {"train_loss": -25.931501388549805, "global_step": 394929, "epoch": 4758} {"train_loss": -25.8958683013916, "global_step": 394930, "epoch": 4758} {"train_loss": -25.86256217956543, "global_step": 394931, "epoch": 4758} {"train_loss": -25.567895889282227, "global_step": 394932, "epoch": 4758} {"train_loss": -25.728469848632812, "global_step": 394933, "epoch": 4758} {"train_loss": -25.769824981689453, "global_step": 394934, "epoch": 4758} {"train_loss": -25.991113662719727, "global_step": 394935, "epoch": 4758} {"train_loss": -25.481754302978516, "global_step": 394936, "epoch": 4758} {"train_loss": -25.96748161315918, "global_step": 394937, "epoch": 4758} {"train_loss": -25.858957290649414, "global_step": 394938, "epoch": 4758} {"train_loss": -26.125629425048828, "global_step": 394939, "epoch": 4758} {"train_loss": -25.964155197143555, "global_step": 394940, "epoch": 4758} {"train_loss": -26.172077178955078, "global_step": 394941, "epoch": 4758} {"train_loss": -26.44183349609375, "global_step": 394942, "epoch": 4758} {"train_loss": -26.279455184936523, "global_step": 394943, "epoch": 4758} {"train_loss": -26.3204345703125, "global_step": 394944, "epoch": 4758} {"train_loss": -26.233274459838867, "global_step": 394945, "epoch": 4758} {"train_loss": -26.365741729736328, "global_step": 394946, "epoch": 4758} {"train_loss": -26.393529891967773, "global_step": 394947, "epoch": 4758} {"train_loss": -26.524274826049805, "global_step": 394948, "epoch": 4758} {"train_loss": -26.34916114807129, "global_step": 394949, "epoch": 4758} {"train_loss": -26.202762603759766, "global_step": 394950, "epoch": 4758} {"train_loss": -26.342615127563477, "global_step": 394951, "epoch": 4758} {"train_loss": -26.287067413330078, "global_step": 394952, "epoch": 4758} {"train_loss": -26.248855590820312, "global_step": 394953, "epoch": 4758} {"train_loss": -26.532379150390625, "global_step": 394954, "epoch": 4758} {"train_loss": -26.4595890045166, "global_step": 394955, "epoch": 4758} {"train_loss": -26.53675651550293, "global_step": 394956, "epoch": 4758} {"train_loss": -26.299047470092773, "global_step": 394957, "epoch": 4758} {"train_loss": -26.888574600219727, "global_step": 394958, "epoch": 4758} {"train_loss": -26.674304962158203, "global_step": 394959, "epoch": 4758} {"train_loss": -26.978734970092773, "global_step": 394960, "epoch": 4758} {"train_loss": -26.505414962768555, "global_step": 394961, "epoch": 4758} {"train_loss": -26.862207412719727, "global_step": 394962, "epoch": 4758} {"train_loss": -26.594451904296875, "global_step": 394963, "epoch": 4758} {"train_loss": -26.42389488220215, "global_step": 394964, "epoch": 4758} {"train_loss": -26.751724243164062, "global_step": 394965, "epoch": 4758} {"train_loss": -26.864953994750977, "global_step": 394966, "epoch": 4758} {"train_loss": -26.573434829711914, "global_step": 394967, "epoch": 4758} {"train_loss": -26.49075698852539, "global_step": 394968, "epoch": 4758} {"train_loss": -26.809301376342773, "global_step": 394969, "epoch": 4758} {"train_loss": -26.132068634033203, "global_step": 394970, "epoch": 4758} {"train_loss": -26.787185668945312, "global_step": 394971, "epoch": 4758} {"train_loss": -26.92532730102539, "global_step": 394972, "epoch": 4758} {"train_loss": -26.90180778503418, "global_step": 394973, "epoch": 4758} {"train_loss": -26.385046005249023, "global_step": 394974, "epoch": 4758} {"train_loss": -26.375959396362305, "global_step": 394975, "epoch": 4758} {"train_loss": -26.989904403686523, "global_step": 394976, "epoch": 4758} {"train_loss": -26.71376609802246, "global_step": 394977, "epoch": 4758} {"train_loss": -26.765869140625, "global_step": 394978, "epoch": 4758} {"train_loss": -26.553258895874023, "global_step": 394979, "epoch": 4758} {"train_loss": -26.5572509765625, "global_step": 394980, "epoch": 4758} {"train_loss": -26.834699630737305, "global_step": 394981, "epoch": 4758} {"train_loss": -26.578027725219727, "global_step": 394982, "epoch": 4758} {"train_loss": -26.9507999420166, "global_step": 394983, "epoch": 4758} {"train_loss": -26.93528175354004, "global_step": 394984, "epoch": 4758} {"train_loss": -26.660572052001953, "global_step": 394985, "epoch": 4758} {"train_loss": -26.31519889831543, "global_step": 394986, "epoch": 4758} {"train_loss": -26.694385528564453, "global_step": 394987, "epoch": 4758} {"train_loss": -26.925785064697266, "global_step": 394988, "epoch": 4758} {"train_loss": -26.0211238861084, "global_step": 394989, "epoch": 4758} {"train_loss": -26.223987579345703, "global_step": 394990, "epoch": 4758} {"train_loss": -26.521162033081055, "global_step": 394991, "epoch": 4758} {"train_loss": -25.607934951782227, "global_step": 394992, "epoch": 4758} {"train_loss": -26.289514541625977, "global_step": 394993, "epoch": 4758} {"train_loss": -26.576608657836914, "global_step": 394994, "epoch": 4758} {"train_loss": -26.490619659423828, "global_step": 394995, "epoch": 4758} {"train_loss": -26.169912889779333, "global_step": 394996, "epoch": 4758, "val_loss": 6674275.0} {"train_loss": -26.35284996032715, "global_step": 394997, "epoch": 4759} {"train_loss": -25.56612777709961, "global_step": 394998, "epoch": 4759} {"train_loss": -25.501718521118164, "global_step": 394999, "epoch": 4759} {"train_loss": -25.224576950073242, "global_step": 395000, "epoch": 4759} {"train_loss": -26.197484970092773, "global_step": 395001, "epoch": 4759} {"train_loss": -25.893096923828125, "global_step": 395002, "epoch": 4759} {"train_loss": -25.88575553894043, "global_step": 395003, "epoch": 4759} {"train_loss": -26.104312896728516, "global_step": 395004, "epoch": 4759} {"train_loss": -26.161212921142578, "global_step": 395005, "epoch": 4759} {"train_loss": -26.486963272094727, "global_step": 395006, "epoch": 4759} {"train_loss": -26.267377853393555, "global_step": 395007, "epoch": 4759} {"train_loss": -26.34400749206543, "global_step": 395008, "epoch": 4759} {"train_loss": -26.028451919555664, "global_step": 395009, "epoch": 4759} {"train_loss": -26.219818115234375, "global_step": 395010, "epoch": 4759} {"train_loss": -26.431394577026367, "global_step": 395011, "epoch": 4759} {"train_loss": -26.680700302124023, "global_step": 395012, "epoch": 4759} {"train_loss": -26.714635848999023, "global_step": 395013, "epoch": 4759} {"train_loss": -26.2530574798584, "global_step": 395014, "epoch": 4759} {"train_loss": -25.9872989654541, "global_step": 395015, "epoch": 4759} {"train_loss": -26.41733169555664, "global_step": 395016, "epoch": 4759} {"train_loss": -26.302839279174805, "global_step": 395017, "epoch": 4759} {"train_loss": -26.549854278564453, "global_step": 395018, "epoch": 4759} {"train_loss": -26.316381454467773, "global_step": 395019, "epoch": 4759} {"train_loss": -26.709064483642578, "global_step": 395020, "epoch": 4759} {"train_loss": -26.66656494140625, "global_step": 395021, "epoch": 4759} {"train_loss": -26.656930923461914, "global_step": 395022, "epoch": 4759} {"train_loss": -26.65535545349121, "global_step": 395023, "epoch": 4759} {"train_loss": -26.762771606445312, "global_step": 395024, "epoch": 4759} {"train_loss": -26.953638076782227, "global_step": 395025, "epoch": 4759} {"train_loss": -26.49884033203125, "global_step": 395026, "epoch": 4759} {"train_loss": -26.73443603515625, "global_step": 395027, "epoch": 4759} {"train_loss": -26.758544921875, "global_step": 395028, "epoch": 4759} {"train_loss": -27.0268611907959, "global_step": 395029, "epoch": 4759} {"train_loss": -26.93218994140625, "global_step": 395030, "epoch": 4759} {"train_loss": -26.607751846313477, "global_step": 395031, "epoch": 4759} {"train_loss": -26.485004425048828, "global_step": 395032, "epoch": 4759} {"train_loss": -26.531705856323242, "global_step": 395033, "epoch": 4759} {"train_loss": -26.560964584350586, "global_step": 395034, "epoch": 4759} {"train_loss": -26.45161247253418, "global_step": 395035, "epoch": 4759} {"train_loss": -26.525171279907227, "global_step": 395036, "epoch": 4759} {"train_loss": -26.86329460144043, "global_step": 395037, "epoch": 4759} {"train_loss": -26.677976608276367, "global_step": 395038, "epoch": 4759} {"train_loss": -26.387792587280273, "global_step": 395039, "epoch": 4759} {"train_loss": -26.611982345581055, "global_step": 395040, "epoch": 4759} {"train_loss": -27.138959884643555, "global_step": 395041, "epoch": 4759} {"train_loss": -26.614057540893555, "global_step": 395042, "epoch": 4759} {"train_loss": -27.08497428894043, "global_step": 395043, "epoch": 4759} {"train_loss": -26.702726364135742, "global_step": 395044, "epoch": 4759} {"train_loss": -26.970197677612305, "global_step": 395045, "epoch": 4759} {"train_loss": -26.588403701782227, "global_step": 395046, "epoch": 4759} {"train_loss": -26.59576988220215, "global_step": 395047, "epoch": 4759} {"train_loss": -26.755081176757812, "global_step": 395048, "epoch": 4759} {"train_loss": -26.160024642944336, "global_step": 395049, "epoch": 4759} {"train_loss": -26.256315231323242, "global_step": 395050, "epoch": 4759} {"train_loss": -26.78407096862793, "global_step": 395051, "epoch": 4759} {"train_loss": -26.836135864257812, "global_step": 395052, "epoch": 4759} {"train_loss": -26.397741317749023, "global_step": 395053, "epoch": 4759} {"train_loss": -26.345624923706055, "global_step": 395054, "epoch": 4759} {"train_loss": -26.494749069213867, "global_step": 395055, "epoch": 4759} {"train_loss": -26.19907569885254, "global_step": 395056, "epoch": 4759} {"train_loss": -26.76936149597168, "global_step": 395057, "epoch": 4759} {"train_loss": -26.877485275268555, "global_step": 395058, "epoch": 4759} {"train_loss": -26.3165283203125, "global_step": 395059, "epoch": 4759} {"train_loss": -26.837121963500977, "global_step": 395060, "epoch": 4759} {"train_loss": -26.600412368774414, "global_step": 395061, "epoch": 4759} {"train_loss": -26.643728256225586, "global_step": 395062, "epoch": 4759} {"train_loss": -26.31842613220215, "global_step": 395063, "epoch": 4759} {"train_loss": -26.119665145874023, "global_step": 395064, "epoch": 4759} {"train_loss": -26.43743896484375, "global_step": 395065, "epoch": 4759} {"train_loss": -26.44186782836914, "global_step": 395066, "epoch": 4759} {"train_loss": -26.51618003845215, "global_step": 395067, "epoch": 4759} {"train_loss": -26.459394454956055, "global_step": 395068, "epoch": 4759} {"train_loss": -26.637054443359375, "global_step": 395069, "epoch": 4759} {"train_loss": -26.559818267822266, "global_step": 395070, "epoch": 4759} {"train_loss": -26.5281982421875, "global_step": 395071, "epoch": 4759} {"train_loss": -26.447998046875, "global_step": 395072, "epoch": 4759} {"train_loss": -26.481952667236328, "global_step": 395073, "epoch": 4759} {"train_loss": -26.742511749267578, "global_step": 395074, "epoch": 4759} {"train_loss": -26.16119956970215, "global_step": 395075, "epoch": 4759} {"train_loss": -26.574766159057617, "global_step": 395076, "epoch": 4759} {"train_loss": -26.639074325561523, "global_step": 395077, "epoch": 4759} {"train_loss": -26.12623405456543, "global_step": 395078, "epoch": 4759} {"train_loss": -26.4806469836867, "global_step": 395079, "epoch": 4759, "val_loss": 6671540.0} {"train_loss": -26.416044235229492, "global_step": 395080, "epoch": 4760} {"train_loss": -26.005218505859375, "global_step": 395081, "epoch": 4760} {"train_loss": -26.478925704956055, "global_step": 395082, "epoch": 4760} {"train_loss": -26.109790802001953, "global_step": 395083, "epoch": 4760} {"train_loss": -26.192901611328125, "global_step": 395084, "epoch": 4760} {"train_loss": -25.752012252807617, "global_step": 395085, "epoch": 4760} {"train_loss": -26.658559799194336, "global_step": 395086, "epoch": 4760} {"train_loss": -26.17189598083496, "global_step": 395087, "epoch": 4760} {"train_loss": -26.345245361328125, "global_step": 395088, "epoch": 4760} {"train_loss": -26.61297607421875, "global_step": 395089, "epoch": 4760} {"train_loss": -26.507770538330078, "global_step": 395090, "epoch": 4760} {"train_loss": -25.99030876159668, "global_step": 395091, "epoch": 4760} {"train_loss": -26.466405868530273, "global_step": 395092, "epoch": 4760} {"train_loss": -26.1195068359375, "global_step": 395093, "epoch": 4760} {"train_loss": -26.350366592407227, "global_step": 395094, "epoch": 4760} {"train_loss": -26.51239585876465, "global_step": 395095, "epoch": 4760} {"train_loss": -26.653106689453125, "global_step": 395096, "epoch": 4760} {"train_loss": -26.476892471313477, "global_step": 395097, "epoch": 4760} {"train_loss": -26.291837692260742, "global_step": 395098, "epoch": 4760} {"train_loss": -26.537561416625977, "global_step": 395099, "epoch": 4760} {"train_loss": -26.581893920898438, "global_step": 395100, "epoch": 4760} {"train_loss": -26.37373161315918, "global_step": 395101, "epoch": 4760} {"train_loss": -26.39535903930664, "global_step": 395102, "epoch": 4760} {"train_loss": -26.34039878845215, "global_step": 395103, "epoch": 4760} {"train_loss": -26.540266036987305, "global_step": 395104, "epoch": 4760} {"train_loss": -26.750507354736328, "global_step": 395105, "epoch": 4760} {"train_loss": -26.6657657623291, "global_step": 395106, "epoch": 4760} {"train_loss": -26.322153091430664, "global_step": 395107, "epoch": 4760} {"train_loss": -26.727340698242188, "global_step": 395108, "epoch": 4760} {"train_loss": -26.212982177734375, "global_step": 395109, "epoch": 4760} {"train_loss": -26.6688289642334, "global_step": 395110, "epoch": 4760} {"train_loss": -26.49342918395996, "global_step": 395111, "epoch": 4760} {"train_loss": -26.729480743408203, "global_step": 395112, "epoch": 4760} {"train_loss": -26.662015914916992, "global_step": 395113, "epoch": 4760} {"train_loss": -26.5282039642334, "global_step": 395114, "epoch": 4760} {"train_loss": -26.6527099609375, "global_step": 395115, "epoch": 4760} {"train_loss": -26.487207412719727, "global_step": 395116, "epoch": 4760} {"train_loss": -26.50132179260254, "global_step": 395117, "epoch": 4760} {"train_loss": -26.395742416381836, "global_step": 395118, "epoch": 4760} {"train_loss": -26.953298568725586, "global_step": 395119, "epoch": 4760} {"train_loss": -26.7546329498291, "global_step": 395120, "epoch": 4760} {"train_loss": -26.620895385742188, "global_step": 395121, "epoch": 4760} {"train_loss": -26.626361846923828, "global_step": 395122, "epoch": 4760} {"train_loss": -27.141361236572266, "global_step": 395123, "epoch": 4760} {"train_loss": -26.585935592651367, "global_step": 395124, "epoch": 4760} {"train_loss": -26.96734619140625, "global_step": 395125, "epoch": 4760} {"train_loss": -26.796070098876953, "global_step": 395126, "epoch": 4760} {"train_loss": -26.73188591003418, "global_step": 395127, "epoch": 4760} {"train_loss": -26.810998916625977, "global_step": 395128, "epoch": 4760} {"train_loss": -26.682580947875977, "global_step": 395129, "epoch": 4760} {"train_loss": -27.06744384765625, "global_step": 395130, "epoch": 4760} {"train_loss": -27.170019149780273, "global_step": 395131, "epoch": 4760} {"train_loss": -26.79429054260254, "global_step": 395132, "epoch": 4760} {"train_loss": -26.630075454711914, "global_step": 395133, "epoch": 4760} {"train_loss": -26.051877975463867, "global_step": 395134, "epoch": 4760} {"train_loss": -26.209964752197266, "global_step": 395135, "epoch": 4760} {"train_loss": -26.22981071472168, "global_step": 395136, "epoch": 4760} {"train_loss": -26.145038604736328, "global_step": 395137, "epoch": 4760} {"train_loss": -26.3444766998291, "global_step": 395138, "epoch": 4760} {"train_loss": -25.869840621948242, "global_step": 395139, "epoch": 4760} {"train_loss": -26.488332748413086, "global_step": 395140, "epoch": 4760} {"train_loss": -25.930572509765625, "global_step": 395141, "epoch": 4760} {"train_loss": -26.524118423461914, "global_step": 395142, "epoch": 4760} {"train_loss": -26.518598556518555, "global_step": 395143, "epoch": 4760} {"train_loss": -25.88503074645996, "global_step": 395144, "epoch": 4760} {"train_loss": -26.147235870361328, "global_step": 395145, "epoch": 4760} {"train_loss": -25.512842178344727, "global_step": 395146, "epoch": 4760} {"train_loss": -25.973876953125, "global_step": 395147, "epoch": 4760} {"train_loss": -25.815139770507812, "global_step": 395148, "epoch": 4760} {"train_loss": -25.993701934814453, "global_step": 395149, "epoch": 4760} {"train_loss": -26.3029842376709, "global_step": 395150, "epoch": 4760} {"train_loss": -25.528921127319336, "global_step": 395151, "epoch": 4760} {"train_loss": -25.626636505126953, "global_step": 395152, "epoch": 4760} {"train_loss": -26.136213302612305, "global_step": 395153, "epoch": 4760} {"train_loss": -26.204065322875977, "global_step": 395154, "epoch": 4760} {"train_loss": -26.149246215820312, "global_step": 395155, "epoch": 4760} {"train_loss": -25.901569366455078, "global_step": 395156, "epoch": 4760} {"train_loss": -26.094099044799805, "global_step": 395157, "epoch": 4760} {"train_loss": -26.13081169128418, "global_step": 395158, "epoch": 4760} {"train_loss": -25.87350845336914, "global_step": 395159, "epoch": 4760} {"train_loss": -26.357025146484375, "global_step": 395160, "epoch": 4760} {"train_loss": -26.550893783569336, "global_step": 395161, "epoch": 4760} {"train_loss": -26.384671038891895, "global_step": 395162, "epoch": 4760, "val_loss": 6591115.0} {"train_loss": -25.567686080932617, "global_step": 395163, "epoch": 4761} {"train_loss": -26.238574981689453, "global_step": 395164, "epoch": 4761} {"train_loss": -25.87811279296875, "global_step": 395165, "epoch": 4761} {"train_loss": -26.049909591674805, "global_step": 395166, "epoch": 4761} {"train_loss": -25.891910552978516, "global_step": 395167, "epoch": 4761} {"train_loss": -25.981964111328125, "global_step": 395168, "epoch": 4761} {"train_loss": -26.08050537109375, "global_step": 395169, "epoch": 4761} {"train_loss": -26.322010040283203, "global_step": 395170, "epoch": 4761} {"train_loss": -25.7208194732666, "global_step": 395171, "epoch": 4761} {"train_loss": -26.3699893951416, "global_step": 395172, "epoch": 4761} {"train_loss": -25.635608673095703, "global_step": 395173, "epoch": 4761} {"train_loss": -25.86078453063965, "global_step": 395174, "epoch": 4761} {"train_loss": -26.41521644592285, "global_step": 395175, "epoch": 4761} {"train_loss": -26.15740394592285, "global_step": 395176, "epoch": 4761} {"train_loss": -26.333173751831055, "global_step": 395177, "epoch": 4761} {"train_loss": -25.375213623046875, "global_step": 395178, "epoch": 4761} {"train_loss": -26.21390724182129, "global_step": 395179, "epoch": 4761} {"train_loss": -26.659460067749023, "global_step": 395180, "epoch": 4761} {"train_loss": -26.4222412109375, "global_step": 395181, "epoch": 4761} {"train_loss": -26.073163986206055, "global_step": 395182, "epoch": 4761} {"train_loss": -26.403472900390625, "global_step": 395183, "epoch": 4761} {"train_loss": -26.356586456298828, "global_step": 395184, "epoch": 4761} {"train_loss": -26.52821922302246, "global_step": 395185, "epoch": 4761} {"train_loss": -26.69339370727539, "global_step": 395186, "epoch": 4761} {"train_loss": -26.24336814880371, "global_step": 395187, "epoch": 4761} {"train_loss": -26.667560577392578, "global_step": 395188, "epoch": 4761} {"train_loss": -26.473600387573242, "global_step": 395189, "epoch": 4761} {"train_loss": -26.47556495666504, "global_step": 395190, "epoch": 4761} {"train_loss": -26.5949764251709, "global_step": 395191, "epoch": 4761} {"train_loss": -26.306196212768555, "global_step": 395192, "epoch": 4761} {"train_loss": -26.439868927001953, "global_step": 395193, "epoch": 4761} {"train_loss": -26.821264266967773, "global_step": 395194, "epoch": 4761} {"train_loss": -26.68659782409668, "global_step": 395195, "epoch": 4761} {"train_loss": -26.148778915405273, "global_step": 395196, "epoch": 4761} {"train_loss": -26.70526695251465, "global_step": 395197, "epoch": 4761} {"train_loss": -26.601308822631836, "global_step": 395198, "epoch": 4761} {"train_loss": -26.751632690429688, "global_step": 395199, "epoch": 4761} {"train_loss": -27.15804100036621, "global_step": 395200, "epoch": 4761} {"train_loss": -26.5615234375, "global_step": 395201, "epoch": 4761} {"train_loss": -26.755151748657227, "global_step": 395202, "epoch": 4761} {"train_loss": -26.7171688079834, "global_step": 395203, "epoch": 4761} {"train_loss": -26.828937530517578, "global_step": 395204, "epoch": 4761} {"train_loss": -26.929208755493164, "global_step": 395205, "epoch": 4761} {"train_loss": -26.36261558532715, "global_step": 395206, "epoch": 4761} {"train_loss": -26.515893936157227, "global_step": 395207, "epoch": 4761} {"train_loss": -26.70161247253418, "global_step": 395208, "epoch": 4761} {"train_loss": -26.7814884185791, "global_step": 395209, "epoch": 4761} {"train_loss": -26.623022079467773, "global_step": 395210, "epoch": 4761} {"train_loss": -27.0506649017334, "global_step": 395211, "epoch": 4761} {"train_loss": -26.50526237487793, "global_step": 395212, "epoch": 4761} {"train_loss": -26.86651611328125, "global_step": 395213, "epoch": 4761} {"train_loss": -26.481220245361328, "global_step": 395214, "epoch": 4761} {"train_loss": -26.743011474609375, "global_step": 395215, "epoch": 4761} {"train_loss": -27.33994483947754, "global_step": 395216, "epoch": 4761} {"train_loss": -26.671695709228516, "global_step": 395217, "epoch": 4761} {"train_loss": -26.855361938476562, "global_step": 395218, "epoch": 4761} {"train_loss": -26.83139419555664, "global_step": 395219, "epoch": 4761} {"train_loss": -26.75913429260254, "global_step": 395220, "epoch": 4761} {"train_loss": -26.740234375, "global_step": 395221, "epoch": 4761} {"train_loss": -26.633747100830078, "global_step": 395222, "epoch": 4761} {"train_loss": -26.611164093017578, "global_step": 395223, "epoch": 4761} {"train_loss": -26.374805450439453, "global_step": 395224, "epoch": 4761} {"train_loss": -26.610387802124023, "global_step": 395225, "epoch": 4761} {"train_loss": -27.139204025268555, "global_step": 395226, "epoch": 4761} {"train_loss": -27.075225830078125, "global_step": 395227, "epoch": 4761} {"train_loss": -26.67789649963379, "global_step": 395228, "epoch": 4761} {"train_loss": -26.720306396484375, "global_step": 395229, "epoch": 4761} {"train_loss": -26.943252563476562, "global_step": 395230, "epoch": 4761} {"train_loss": -26.921295166015625, "global_step": 395231, "epoch": 4761} {"train_loss": -26.997434616088867, "global_step": 395232, "epoch": 4761} {"train_loss": -26.597578048706055, "global_step": 395233, "epoch": 4761} {"train_loss": -26.881000518798828, "global_step": 395234, "epoch": 4761} {"train_loss": -26.87053871154785, "global_step": 395235, "epoch": 4761} {"train_loss": -27.007720947265625, "global_step": 395236, "epoch": 4761} {"train_loss": -26.81473731994629, "global_step": 395237, "epoch": 4761} {"train_loss": -26.932727813720703, "global_step": 395238, "epoch": 4761} {"train_loss": -26.522497177124023, "global_step": 395239, "epoch": 4761} {"train_loss": -26.322559356689453, "global_step": 395240, "epoch": 4761} {"train_loss": -26.74911880493164, "global_step": 395241, "epoch": 4761} {"train_loss": -26.795989990234375, "global_step": 395242, "epoch": 4761} {"train_loss": -26.55267333984375, "global_step": 395243, "epoch": 4761} {"train_loss": -26.223392486572266, "global_step": 395244, "epoch": 4761} {"train_loss": -26.539442269198865, "global_step": 395245, "epoch": 4761, "val_loss": 6596021.0} {"train_loss": -26.151182174682617, "global_step": 395246, "epoch": 4762} {"train_loss": -25.9327335357666, "global_step": 395247, "epoch": 4762} {"train_loss": -26.725238800048828, "global_step": 395248, "epoch": 4762} {"train_loss": -26.58843994140625, "global_step": 395249, "epoch": 4762} {"train_loss": -25.356552124023438, "global_step": 395250, "epoch": 4762} {"train_loss": -25.662500381469727, "global_step": 395251, "epoch": 4762} {"train_loss": -25.932147979736328, "global_step": 395252, "epoch": 4762} {"train_loss": -25.924596786499023, "global_step": 395253, "epoch": 4762} {"train_loss": -26.07478141784668, "global_step": 395254, "epoch": 4762} {"train_loss": -26.064544677734375, "global_step": 395255, "epoch": 4762} {"train_loss": -26.500051498413086, "global_step": 395256, "epoch": 4762} {"train_loss": -26.216638565063477, "global_step": 395257, "epoch": 4762} {"train_loss": -26.22663688659668, "global_step": 395258, "epoch": 4762} {"train_loss": -26.124744415283203, "global_step": 395259, "epoch": 4762} {"train_loss": -26.24896240234375, "global_step": 395260, "epoch": 4762} {"train_loss": -26.3326416015625, "global_step": 395261, "epoch": 4762} {"train_loss": -26.27882957458496, "global_step": 395262, "epoch": 4762} {"train_loss": -26.212610244750977, "global_step": 395263, "epoch": 4762} {"train_loss": -26.128808975219727, "global_step": 395264, "epoch": 4762} {"train_loss": -26.613697052001953, "global_step": 395265, "epoch": 4762} {"train_loss": -26.129230499267578, "global_step": 395266, "epoch": 4762} {"train_loss": -26.46604347229004, "global_step": 395267, "epoch": 4762} {"train_loss": -26.269865036010742, "global_step": 395268, "epoch": 4762} {"train_loss": -26.44879150390625, "global_step": 395269, "epoch": 4762} {"train_loss": -26.388059616088867, "global_step": 395270, "epoch": 4762} {"train_loss": -26.637495040893555, "global_step": 395271, "epoch": 4762} {"train_loss": -26.56043815612793, "global_step": 395272, "epoch": 4762} {"train_loss": -26.35455894470215, "global_step": 395273, "epoch": 4762} {"train_loss": -26.484729766845703, "global_step": 395274, "epoch": 4762} {"train_loss": -26.618024826049805, "global_step": 395275, "epoch": 4762} {"train_loss": -26.65151023864746, "global_step": 395276, "epoch": 4762} {"train_loss": -26.6989803314209, "global_step": 395277, "epoch": 4762} {"train_loss": -26.449878692626953, "global_step": 395278, "epoch": 4762} {"train_loss": -26.68043327331543, "global_step": 395279, "epoch": 4762} {"train_loss": -26.279844284057617, "global_step": 395280, "epoch": 4762} {"train_loss": -26.389480590820312, "global_step": 395281, "epoch": 4762} {"train_loss": -26.89068031311035, "global_step": 395282, "epoch": 4762} {"train_loss": -26.67852783203125, "global_step": 395283, "epoch": 4762} {"train_loss": -26.530054092407227, "global_step": 395284, "epoch": 4762} {"train_loss": -26.6533145904541, "global_step": 395285, "epoch": 4762} {"train_loss": -26.306411743164062, "global_step": 395286, "epoch": 4762} {"train_loss": -26.509387969970703, "global_step": 395287, "epoch": 4762} {"train_loss": -26.605880737304688, "global_step": 395288, "epoch": 4762} {"train_loss": -26.506927490234375, "global_step": 395289, "epoch": 4762} {"train_loss": -26.835494995117188, "global_step": 395290, "epoch": 4762} {"train_loss": -26.89851188659668, "global_step": 395291, "epoch": 4762} {"train_loss": -26.35224723815918, "global_step": 395292, "epoch": 4762} {"train_loss": -27.020221710205078, "global_step": 395293, "epoch": 4762} {"train_loss": -26.7747745513916, "global_step": 395294, "epoch": 4762} {"train_loss": -26.590417861938477, "global_step": 395295, "epoch": 4762} {"train_loss": -26.601348876953125, "global_step": 395296, "epoch": 4762} {"train_loss": -26.33843994140625, "global_step": 395297, "epoch": 4762} {"train_loss": -26.859373092651367, "global_step": 395298, "epoch": 4762} {"train_loss": -26.406940460205078, "global_step": 395299, "epoch": 4762} {"train_loss": -26.63092613220215, "global_step": 395300, "epoch": 4762} {"train_loss": -26.672521591186523, "global_step": 395301, "epoch": 4762} {"train_loss": -26.8404598236084, "global_step": 395302, "epoch": 4762} {"train_loss": -26.584095001220703, "global_step": 395303, "epoch": 4762} {"train_loss": -26.794870376586914, "global_step": 395304, "epoch": 4762} {"train_loss": -26.768970489501953, "global_step": 395305, "epoch": 4762} {"train_loss": -26.440738677978516, "global_step": 395306, "epoch": 4762} {"train_loss": -26.863758087158203, "global_step": 395307, "epoch": 4762} {"train_loss": -26.477676391601562, "global_step": 395308, "epoch": 4762} {"train_loss": -27.055927276611328, "global_step": 395309, "epoch": 4762} {"train_loss": -26.62775230407715, "global_step": 395310, "epoch": 4762} {"train_loss": -26.662668228149414, "global_step": 395311, "epoch": 4762} {"train_loss": -26.746915817260742, "global_step": 395312, "epoch": 4762} {"train_loss": -26.676074981689453, "global_step": 395313, "epoch": 4762} {"train_loss": -26.85267448425293, "global_step": 395314, "epoch": 4762} {"train_loss": -26.704721450805664, "global_step": 395315, "epoch": 4762} {"train_loss": -26.60344886779785, "global_step": 395316, "epoch": 4762} {"train_loss": -26.558246612548828, "global_step": 395317, "epoch": 4762} {"train_loss": -26.976926803588867, "global_step": 395318, "epoch": 4762} {"train_loss": -26.963476181030273, "global_step": 395319, "epoch": 4762} {"train_loss": -26.529666900634766, "global_step": 395320, "epoch": 4762} {"train_loss": -26.919986724853516, "global_step": 395321, "epoch": 4762} {"train_loss": -26.892560958862305, "global_step": 395322, "epoch": 4762} {"train_loss": -26.572479248046875, "global_step": 395323, "epoch": 4762} {"train_loss": -26.55950927734375, "global_step": 395324, "epoch": 4762} {"train_loss": -26.580371856689453, "global_step": 395325, "epoch": 4762} {"train_loss": -26.2088680267334, "global_step": 395326, "epoch": 4762} {"train_loss": -26.6240177154541, "global_step": 395327, "epoch": 4762} {"train_loss": -26.509844791458313, "global_step": 395328, "epoch": 4762, "val_loss": 6678656.0} {"train_loss": -26.153284072875977, "global_step": 395329, "epoch": 4763} {"train_loss": -25.898298263549805, "global_step": 395330, "epoch": 4763} {"train_loss": -25.964813232421875, "global_step": 395331, "epoch": 4763} {"train_loss": -25.825651168823242, "global_step": 395332, "epoch": 4763} {"train_loss": -26.134912490844727, "global_step": 395333, "epoch": 4763} {"train_loss": -26.173404693603516, "global_step": 395334, "epoch": 4763} {"train_loss": -26.2020206451416, "global_step": 395335, "epoch": 4763} {"train_loss": -25.754959106445312, "global_step": 395336, "epoch": 4763} {"train_loss": -26.02211570739746, "global_step": 395337, "epoch": 4763} {"train_loss": -26.551034927368164, "global_step": 395338, "epoch": 4763} {"train_loss": -26.25077247619629, "global_step": 395339, "epoch": 4763} {"train_loss": -26.167526245117188, "global_step": 395340, "epoch": 4763} {"train_loss": -26.477859497070312, "global_step": 395341, "epoch": 4763} {"train_loss": -25.76923942565918, "global_step": 395342, "epoch": 4763} {"train_loss": -26.4586181640625, "global_step": 395343, "epoch": 4763} {"train_loss": -26.13614273071289, "global_step": 395344, "epoch": 4763} {"train_loss": -26.579620361328125, "global_step": 395345, "epoch": 4763} {"train_loss": -26.059595108032227, "global_step": 395346, "epoch": 4763} {"train_loss": -26.89227867126465, "global_step": 395347, "epoch": 4763} {"train_loss": -26.549972534179688, "global_step": 395348, "epoch": 4763} {"train_loss": -26.380874633789062, "global_step": 395349, "epoch": 4763} {"train_loss": -26.44512367248535, "global_step": 395350, "epoch": 4763} {"train_loss": -26.335315704345703, "global_step": 395351, "epoch": 4763} {"train_loss": -26.424030303955078, "global_step": 395352, "epoch": 4763} {"train_loss": -26.35626792907715, "global_step": 395353, "epoch": 4763} {"train_loss": -26.718435287475586, "global_step": 395354, "epoch": 4763} {"train_loss": -26.335132598876953, "global_step": 395355, "epoch": 4763} {"train_loss": -26.70856285095215, "global_step": 395356, "epoch": 4763} {"train_loss": -26.07537269592285, "global_step": 395357, "epoch": 4763} {"train_loss": -27.13654136657715, "global_step": 395358, "epoch": 4763} {"train_loss": -26.591846466064453, "global_step": 395359, "epoch": 4763} {"train_loss": -26.510522842407227, "global_step": 395360, "epoch": 4763} {"train_loss": -26.26307487487793, "global_step": 395361, "epoch": 4763} {"train_loss": -26.78091812133789, "global_step": 395362, "epoch": 4763} {"train_loss": -26.736835479736328, "global_step": 395363, "epoch": 4763} {"train_loss": -26.69403076171875, "global_step": 395364, "epoch": 4763} {"train_loss": -27.33047866821289, "global_step": 395365, "epoch": 4763} {"train_loss": -26.483068466186523, "global_step": 395366, "epoch": 4763} {"train_loss": -26.54084587097168, "global_step": 395367, "epoch": 4763} {"train_loss": -26.88380241394043, "global_step": 395368, "epoch": 4763} {"train_loss": -26.678857803344727, "global_step": 395369, "epoch": 4763} {"train_loss": -26.588287353515625, "global_step": 395370, "epoch": 4763} {"train_loss": -26.495141983032227, "global_step": 395371, "epoch": 4763} {"train_loss": -26.656579971313477, "global_step": 395372, "epoch": 4763} {"train_loss": -26.682708740234375, "global_step": 395373, "epoch": 4763} {"train_loss": -26.841720581054688, "global_step": 395374, "epoch": 4763} {"train_loss": -27.010740280151367, "global_step": 395375, "epoch": 4763} {"train_loss": -26.56661033630371, "global_step": 395376, "epoch": 4763} {"train_loss": -26.5764217376709, "global_step": 395377, "epoch": 4763} {"train_loss": -26.412038803100586, "global_step": 395378, "epoch": 4763} {"train_loss": -26.702804565429688, "global_step": 395379, "epoch": 4763} {"train_loss": -26.7943172454834, "global_step": 395380, "epoch": 4763} {"train_loss": -26.669097900390625, "global_step": 395381, "epoch": 4763} {"train_loss": -27.125431060791016, "global_step": 395382, "epoch": 4763} {"train_loss": -27.116455078125, "global_step": 395383, "epoch": 4763} {"train_loss": -26.51972007751465, "global_step": 395384, "epoch": 4763} {"train_loss": -26.561609268188477, "global_step": 395385, "epoch": 4763} {"train_loss": -26.451221466064453, "global_step": 395386, "epoch": 4763} {"train_loss": -26.904312133789062, "global_step": 395387, "epoch": 4763} {"train_loss": -26.186567306518555, "global_step": 395388, "epoch": 4763} {"train_loss": -26.25967788696289, "global_step": 395389, "epoch": 4763} {"train_loss": -26.07673454284668, "global_step": 395390, "epoch": 4763} {"train_loss": -26.88370132446289, "global_step": 395391, "epoch": 4763} {"train_loss": -27.3184757232666, "global_step": 395392, "epoch": 4763} {"train_loss": -26.557661056518555, "global_step": 395393, "epoch": 4763} {"train_loss": -26.208951950073242, "global_step": 395394, "epoch": 4763} {"train_loss": -26.292951583862305, "global_step": 395395, "epoch": 4763} {"train_loss": -26.21088981628418, "global_step": 395396, "epoch": 4763} {"train_loss": -25.39676856994629, "global_step": 395397, "epoch": 4763} {"train_loss": -24.456052780151367, "global_step": 395398, "epoch": 4763} {"train_loss": -25.044748306274414, "global_step": 395399, "epoch": 4763} {"train_loss": -25.938556671142578, "global_step": 395400, "epoch": 4763} {"train_loss": -25.866641998291016, "global_step": 395401, "epoch": 4763} {"train_loss": -26.18438720703125, "global_step": 395402, "epoch": 4763} {"train_loss": -25.94354248046875, "global_step": 395403, "epoch": 4763} {"train_loss": -26.471038818359375, "global_step": 395404, "epoch": 4763} {"train_loss": -25.929859161376953, "global_step": 395405, "epoch": 4763} {"train_loss": -26.340845108032227, "global_step": 395406, "epoch": 4763} {"train_loss": -26.22210121154785, "global_step": 395407, "epoch": 4763} {"train_loss": -26.654287338256836, "global_step": 395408, "epoch": 4763} {"train_loss": -26.485986709594727, "global_step": 395409, "epoch": 4763} {"train_loss": -26.387250900268555, "global_step": 395410, "epoch": 4763} {"train_loss": -26.39791688574366, "global_step": 395411, "epoch": 4763, "val_loss": 6548451.0} {"train_loss": -25.48280143737793, "global_step": 395412, "epoch": 4764} {"train_loss": -25.896087646484375, "global_step": 395413, "epoch": 4764} {"train_loss": -25.975677490234375, "global_step": 395414, "epoch": 4764} {"train_loss": -25.802631378173828, "global_step": 395415, "epoch": 4764} {"train_loss": -25.803083419799805, "global_step": 395416, "epoch": 4764} {"train_loss": -25.79520034790039, "global_step": 395417, "epoch": 4764} {"train_loss": -26.02685546875, "global_step": 395418, "epoch": 4764} {"train_loss": -26.165861129760742, "global_step": 395419, "epoch": 4764} {"train_loss": -26.120267868041992, "global_step": 395420, "epoch": 4764} {"train_loss": -25.9722900390625, "global_step": 395421, "epoch": 4764} {"train_loss": -26.2990665435791, "global_step": 395422, "epoch": 4764} {"train_loss": -26.02393913269043, "global_step": 395423, "epoch": 4764} {"train_loss": -26.09814453125, "global_step": 395424, "epoch": 4764} {"train_loss": -26.50104331970215, "global_step": 395425, "epoch": 4764} {"train_loss": -26.15532875061035, "global_step": 395426, "epoch": 4764} {"train_loss": -26.304489135742188, "global_step": 395427, "epoch": 4764} {"train_loss": -26.33186149597168, "global_step": 395428, "epoch": 4764} {"train_loss": -25.98211669921875, "global_step": 395429, "epoch": 4764} {"train_loss": -26.500141143798828, "global_step": 395430, "epoch": 4764} {"train_loss": -26.421899795532227, "global_step": 395431, "epoch": 4764} {"train_loss": -26.51372718811035, "global_step": 395432, "epoch": 4764} {"train_loss": -26.20777702331543, "global_step": 395433, "epoch": 4764} {"train_loss": -26.614843368530273, "global_step": 395434, "epoch": 4764} {"train_loss": -26.367822647094727, "global_step": 395435, "epoch": 4764} {"train_loss": -26.264301300048828, "global_step": 395436, "epoch": 4764} {"train_loss": -26.410131454467773, "global_step": 395437, "epoch": 4764} {"train_loss": -26.514678955078125, "global_step": 395438, "epoch": 4764} {"train_loss": -26.403303146362305, "global_step": 395439, "epoch": 4764} {"train_loss": -26.5438232421875, "global_step": 395440, "epoch": 4764} {"train_loss": -26.253555297851562, "global_step": 395441, "epoch": 4764} {"train_loss": -26.607177734375, "global_step": 395442, "epoch": 4764} {"train_loss": -26.53329849243164, "global_step": 395443, "epoch": 4764} {"train_loss": -26.436737060546875, "global_step": 395444, "epoch": 4764} {"train_loss": -26.349395751953125, "global_step": 395445, "epoch": 4764} {"train_loss": -26.68763542175293, "global_step": 395446, "epoch": 4764} {"train_loss": -26.79302978515625, "global_step": 395447, "epoch": 4764} {"train_loss": -26.84681510925293, "global_step": 395448, "epoch": 4764} {"train_loss": -26.83462905883789, "global_step": 395449, "epoch": 4764} {"train_loss": -26.633764266967773, "global_step": 395450, "epoch": 4764} {"train_loss": -26.691116333007812, "global_step": 395451, "epoch": 4764} {"train_loss": -26.906600952148438, "global_step": 395452, "epoch": 4764} {"train_loss": -26.649112701416016, "global_step": 395453, "epoch": 4764} {"train_loss": -27.008569717407227, "global_step": 395454, "epoch": 4764} {"train_loss": -26.505578994750977, "global_step": 395455, "epoch": 4764} {"train_loss": -26.638019561767578, "global_step": 395456, "epoch": 4764} {"train_loss": -26.880542755126953, "global_step": 395457, "epoch": 4764} {"train_loss": -26.4461727142334, "global_step": 395458, "epoch": 4764} {"train_loss": -26.882043838500977, "global_step": 395459, "epoch": 4764} {"train_loss": -26.793603897094727, "global_step": 395460, "epoch": 4764} {"train_loss": -26.97220802307129, "global_step": 395461, "epoch": 4764} {"train_loss": -26.036056518554688, "global_step": 395462, "epoch": 4764} {"train_loss": -26.531042098999023, "global_step": 395463, "epoch": 4764} {"train_loss": -26.42276954650879, "global_step": 395464, "epoch": 4764} {"train_loss": -26.750463485717773, "global_step": 395465, "epoch": 4764} {"train_loss": -26.7069149017334, "global_step": 395466, "epoch": 4764} {"train_loss": -26.76736831665039, "global_step": 395467, "epoch": 4764} {"train_loss": -26.849950790405273, "global_step": 395468, "epoch": 4764} {"train_loss": -26.28350257873535, "global_step": 395469, "epoch": 4764} {"train_loss": -26.607421875, "global_step": 395470, "epoch": 4764} {"train_loss": -26.39668846130371, "global_step": 395471, "epoch": 4764} {"train_loss": -26.333770751953125, "global_step": 395472, "epoch": 4764} {"train_loss": -26.25372886657715, "global_step": 395473, "epoch": 4764} {"train_loss": -26.941253662109375, "global_step": 395474, "epoch": 4764} {"train_loss": -26.59247398376465, "global_step": 395475, "epoch": 4764} {"train_loss": -26.817502975463867, "global_step": 395476, "epoch": 4764} {"train_loss": -27.018110275268555, "global_step": 395477, "epoch": 4764} {"train_loss": -26.56656265258789, "global_step": 395478, "epoch": 4764} {"train_loss": -26.29583168029785, "global_step": 395479, "epoch": 4764} {"train_loss": -26.876020431518555, "global_step": 395480, "epoch": 4764} {"train_loss": -26.381574630737305, "global_step": 395481, "epoch": 4764} {"train_loss": -27.133222579956055, "global_step": 395482, "epoch": 4764} {"train_loss": -26.70612907409668, "global_step": 395483, "epoch": 4764} {"train_loss": -26.60125732421875, "global_step": 395484, "epoch": 4764} {"train_loss": -26.322433471679688, "global_step": 395485, "epoch": 4764} {"train_loss": -26.850061416625977, "global_step": 395486, "epoch": 4764} {"train_loss": -26.638702392578125, "global_step": 395487, "epoch": 4764} {"train_loss": -26.9830379486084, "global_step": 395488, "epoch": 4764} {"train_loss": -27.01483726501465, "global_step": 395489, "epoch": 4764} {"train_loss": -26.447662353515625, "global_step": 395490, "epoch": 4764} {"train_loss": -26.70981788635254, "global_step": 395491, "epoch": 4764} {"train_loss": -26.226776123046875, "global_step": 395492, "epoch": 4764} {"train_loss": -26.591947555541992, "global_step": 395493, "epoch": 4764} {"train_loss": -26.48435661591679, "global_step": 395494, "epoch": 4764, "val_loss": 6684680.5} {"train_loss": -26.63119888305664, "global_step": 395495, "epoch": 4765} {"train_loss": -26.061491012573242, "global_step": 395496, "epoch": 4765} {"train_loss": -26.55510902404785, "global_step": 395497, "epoch": 4765} {"train_loss": -26.819738388061523, "global_step": 395498, "epoch": 4765} {"train_loss": -26.58991050720215, "global_step": 395499, "epoch": 4765} {"train_loss": -26.487375259399414, "global_step": 395500, "epoch": 4765} {"train_loss": -26.755029678344727, "global_step": 395501, "epoch": 4765} {"train_loss": -26.495349884033203, "global_step": 395502, "epoch": 4765} {"train_loss": -26.889429092407227, "global_step": 395503, "epoch": 4765} {"train_loss": -26.4786376953125, "global_step": 395504, "epoch": 4765} {"train_loss": -26.85590171813965, "global_step": 395505, "epoch": 4765} {"train_loss": -26.409921646118164, "global_step": 395506, "epoch": 4765} {"train_loss": -26.193012237548828, "global_step": 395507, "epoch": 4765} {"train_loss": -26.722091674804688, "global_step": 395508, "epoch": 4765} {"train_loss": -26.519140243530273, "global_step": 395509, "epoch": 4765} {"train_loss": -25.766433715820312, "global_step": 395510, "epoch": 4765} {"train_loss": -25.96735191345215, "global_step": 395511, "epoch": 4765} {"train_loss": -26.761260986328125, "global_step": 395512, "epoch": 4765} {"train_loss": -26.570287704467773, "global_step": 395513, "epoch": 4765} {"train_loss": -26.151885986328125, "global_step": 395514, "epoch": 4765} {"train_loss": -26.323444366455078, "global_step": 395515, "epoch": 4765} {"train_loss": -26.2508487701416, "global_step": 395516, "epoch": 4765} {"train_loss": -26.54007911682129, "global_step": 395517, "epoch": 4765} {"train_loss": -26.212060928344727, "global_step": 395518, "epoch": 4765} {"train_loss": -26.345197677612305, "global_step": 395519, "epoch": 4765} {"train_loss": -26.492130279541016, "global_step": 395520, "epoch": 4765} {"train_loss": -26.5982723236084, "global_step": 395521, "epoch": 4765} {"train_loss": -26.493757247924805, "global_step": 395522, "epoch": 4765} {"train_loss": -26.60941505432129, "global_step": 395523, "epoch": 4765} {"train_loss": -26.72633171081543, "global_step": 395524, "epoch": 4765} {"train_loss": -26.76551628112793, "global_step": 395525, "epoch": 4765} {"train_loss": -26.527801513671875, "global_step": 395526, "epoch": 4765} {"train_loss": -26.977283477783203, "global_step": 395527, "epoch": 4765} {"train_loss": -26.443334579467773, "global_step": 395528, "epoch": 4765} {"train_loss": -26.66582679748535, "global_step": 395529, "epoch": 4765} {"train_loss": -26.604352951049805, "global_step": 395530, "epoch": 4765} {"train_loss": -26.68250846862793, "global_step": 395531, "epoch": 4765} {"train_loss": -26.842559814453125, "global_step": 395532, "epoch": 4765} {"train_loss": -26.434717178344727, "global_step": 395533, "epoch": 4765} {"train_loss": -26.654605865478516, "global_step": 395534, "epoch": 4765} {"train_loss": -26.616846084594727, "global_step": 395535, "epoch": 4765} {"train_loss": -26.7609806060791, "global_step": 395536, "epoch": 4765} {"train_loss": -26.81758689880371, "global_step": 395537, "epoch": 4765} {"train_loss": -26.53301429748535, "global_step": 395538, "epoch": 4765} {"train_loss": -26.516895294189453, "global_step": 395539, "epoch": 4765} {"train_loss": -26.662525177001953, "global_step": 395540, "epoch": 4765} {"train_loss": -26.57234764099121, "global_step": 395541, "epoch": 4765} {"train_loss": -26.738325119018555, "global_step": 395542, "epoch": 4765} {"train_loss": -26.39540672302246, "global_step": 395543, "epoch": 4765} {"train_loss": -26.5773983001709, "global_step": 395544, "epoch": 4765} {"train_loss": -26.60109519958496, "global_step": 395545, "epoch": 4765} {"train_loss": -26.59771156311035, "global_step": 395546, "epoch": 4765} {"train_loss": -26.639989852905273, "global_step": 395547, "epoch": 4765} {"train_loss": -26.882314682006836, "global_step": 395548, "epoch": 4765} {"train_loss": -26.422576904296875, "global_step": 395549, "epoch": 4765} {"train_loss": -26.387338638305664, "global_step": 395550, "epoch": 4765} {"train_loss": -26.3687801361084, "global_step": 395551, "epoch": 4765} {"train_loss": -26.814062118530273, "global_step": 395552, "epoch": 4765} {"train_loss": -26.520421981811523, "global_step": 395553, "epoch": 4765} {"train_loss": -26.472522735595703, "global_step": 395554, "epoch": 4765} {"train_loss": -26.6076717376709, "global_step": 395555, "epoch": 4765} {"train_loss": -26.601892471313477, "global_step": 395556, "epoch": 4765} {"train_loss": -26.44712257385254, "global_step": 395557, "epoch": 4765} {"train_loss": -26.21542739868164, "global_step": 395558, "epoch": 4765} {"train_loss": -26.10743522644043, "global_step": 395559, "epoch": 4765} {"train_loss": -26.543994903564453, "global_step": 395560, "epoch": 4765} {"train_loss": -26.508392333984375, "global_step": 395561, "epoch": 4765} {"train_loss": -26.631925582885742, "global_step": 395562, "epoch": 4765} {"train_loss": -25.867572784423828, "global_step": 395563, "epoch": 4765} {"train_loss": -26.184722900390625, "global_step": 395564, "epoch": 4765} {"train_loss": -26.80314064025879, "global_step": 395565, "epoch": 4765} {"train_loss": -26.620121002197266, "global_step": 395566, "epoch": 4765} {"train_loss": -26.947362899780273, "global_step": 395567, "epoch": 4765} {"train_loss": -26.722131729125977, "global_step": 395568, "epoch": 4765} {"train_loss": -26.940702438354492, "global_step": 395569, "epoch": 4765} {"train_loss": -26.408308029174805, "global_step": 395570, "epoch": 4765} {"train_loss": -26.763080596923828, "global_step": 395571, "epoch": 4765} {"train_loss": -26.676166534423828, "global_step": 395572, "epoch": 4765} {"train_loss": -26.832244873046875, "global_step": 395573, "epoch": 4765} {"train_loss": -26.762277603149414, "global_step": 395574, "epoch": 4765} {"train_loss": -26.65644645690918, "global_step": 395575, "epoch": 4765} {"train_loss": -26.472620010375977, "global_step": 395576, "epoch": 4765} {"train_loss": -26.556639177253448, "global_step": 395577, "epoch": 4765, "val_loss": 6736629.0} {"train_loss": -25.662261962890625, "global_step": 395578, "epoch": 4766} {"train_loss": -26.107717514038086, "global_step": 395579, "epoch": 4766} {"train_loss": -25.500944137573242, "global_step": 395580, "epoch": 4766} {"train_loss": -25.94710350036621, "global_step": 395581, "epoch": 4766} {"train_loss": -25.939733505249023, "global_step": 395582, "epoch": 4766} {"train_loss": -26.011648178100586, "global_step": 395583, "epoch": 4766} {"train_loss": -25.637678146362305, "global_step": 395584, "epoch": 4766} {"train_loss": -26.153783798217773, "global_step": 395585, "epoch": 4766} {"train_loss": -26.155109405517578, "global_step": 395586, "epoch": 4766} {"train_loss": -26.162729263305664, "global_step": 395587, "epoch": 4766} {"train_loss": -25.91548728942871, "global_step": 395588, "epoch": 4766} {"train_loss": -26.437387466430664, "global_step": 395589, "epoch": 4766} {"train_loss": -26.09331703186035, "global_step": 395590, "epoch": 4766} {"train_loss": -26.14228630065918, "global_step": 395591, "epoch": 4766} {"train_loss": -26.313465118408203, "global_step": 395592, "epoch": 4766} {"train_loss": -26.0692138671875, "global_step": 395593, "epoch": 4766} {"train_loss": -26.383264541625977, "global_step": 395594, "epoch": 4766} {"train_loss": -26.04291343688965, "global_step": 395595, "epoch": 4766} {"train_loss": -26.392316818237305, "global_step": 395596, "epoch": 4766} {"train_loss": -26.731237411499023, "global_step": 395597, "epoch": 4766} {"train_loss": -26.204303741455078, "global_step": 395598, "epoch": 4766} {"train_loss": -26.756006240844727, "global_step": 395599, "epoch": 4766} {"train_loss": -26.39456558227539, "global_step": 395600, "epoch": 4766} {"train_loss": -26.600574493408203, "global_step": 395601, "epoch": 4766} {"train_loss": -26.410785675048828, "global_step": 395602, "epoch": 4766} {"train_loss": -26.474624633789062, "global_step": 395603, "epoch": 4766} {"train_loss": -26.23967933654785, "global_step": 395604, "epoch": 4766} {"train_loss": -26.787137985229492, "global_step": 395605, "epoch": 4766} {"train_loss": -26.637958526611328, "global_step": 395606, "epoch": 4766} {"train_loss": -26.815332412719727, "global_step": 395607, "epoch": 4766} {"train_loss": -26.57847023010254, "global_step": 395608, "epoch": 4766} {"train_loss": -26.56061363220215, "global_step": 395609, "epoch": 4766} {"train_loss": -26.48052978515625, "global_step": 395610, "epoch": 4766} {"train_loss": -26.550430297851562, "global_step": 395611, "epoch": 4766} {"train_loss": -26.64487648010254, "global_step": 395612, "epoch": 4766} {"train_loss": -26.893625259399414, "global_step": 395613, "epoch": 4766} {"train_loss": -26.531713485717773, "global_step": 395614, "epoch": 4766} {"train_loss": -26.522932052612305, "global_step": 395615, "epoch": 4766} {"train_loss": -26.652246475219727, "global_step": 395616, "epoch": 4766} {"train_loss": -26.5789737701416, "global_step": 395617, "epoch": 4766} {"train_loss": -26.529138565063477, "global_step": 395618, "epoch": 4766} {"train_loss": -26.731281280517578, "global_step": 395619, "epoch": 4766} {"train_loss": -26.940765380859375, "global_step": 395620, "epoch": 4766} {"train_loss": -26.3929500579834, "global_step": 395621, "epoch": 4766} {"train_loss": -26.372821807861328, "global_step": 395622, "epoch": 4766} {"train_loss": -26.59186363220215, "global_step": 395623, "epoch": 4766} {"train_loss": -26.876667022705078, "global_step": 395624, "epoch": 4766} {"train_loss": -26.5030574798584, "global_step": 395625, "epoch": 4766} {"train_loss": -26.77345085144043, "global_step": 395626, "epoch": 4766} {"train_loss": -26.264196395874023, "global_step": 395627, "epoch": 4766} {"train_loss": -26.6895809173584, "global_step": 395628, "epoch": 4766} {"train_loss": -26.703983306884766, "global_step": 395629, "epoch": 4766} {"train_loss": -26.752695083618164, "global_step": 395630, "epoch": 4766} {"train_loss": -26.515583038330078, "global_step": 395631, "epoch": 4766} {"train_loss": -26.626428604125977, "global_step": 395632, "epoch": 4766} {"train_loss": -26.559783935546875, "global_step": 395633, "epoch": 4766} {"train_loss": -26.103851318359375, "global_step": 395634, "epoch": 4766} {"train_loss": -26.900197982788086, "global_step": 395635, "epoch": 4766} {"train_loss": -26.742101669311523, "global_step": 395636, "epoch": 4766} {"train_loss": -26.49733543395996, "global_step": 395637, "epoch": 4766} {"train_loss": -26.22749900817871, "global_step": 395638, "epoch": 4766} {"train_loss": -26.346174240112305, "global_step": 395639, "epoch": 4766} {"train_loss": -26.414554595947266, "global_step": 395640, "epoch": 4766} {"train_loss": -26.325559616088867, "global_step": 395641, "epoch": 4766} {"train_loss": -26.268346786499023, "global_step": 395642, "epoch": 4766} {"train_loss": -26.19845962524414, "global_step": 395643, "epoch": 4766} {"train_loss": -26.127899169921875, "global_step": 395644, "epoch": 4766} {"train_loss": -26.45725440979004, "global_step": 395645, "epoch": 4766} {"train_loss": -26.546512603759766, "global_step": 395646, "epoch": 4766} {"train_loss": -26.20172119140625, "global_step": 395647, "epoch": 4766} {"train_loss": -26.660120010375977, "global_step": 395648, "epoch": 4766} {"train_loss": -26.230100631713867, "global_step": 395649, "epoch": 4766} {"train_loss": -26.366806030273438, "global_step": 395650, "epoch": 4766} {"train_loss": -26.54499626159668, "global_step": 395651, "epoch": 4766} {"train_loss": -26.416257858276367, "global_step": 395652, "epoch": 4766} {"train_loss": -26.163114547729492, "global_step": 395653, "epoch": 4766} {"train_loss": -26.62691307067871, "global_step": 395654, "epoch": 4766} {"train_loss": -26.50994300842285, "global_step": 395655, "epoch": 4766} {"train_loss": -26.89666748046875, "global_step": 395656, "epoch": 4766} {"train_loss": -26.35988426208496, "global_step": 395657, "epoch": 4766} {"train_loss": -26.42171287536621, "global_step": 395658, "epoch": 4766} {"train_loss": -26.204370498657227, "global_step": 395659, "epoch": 4766} {"train_loss": -26.40317537698401, "global_step": 395660, "epoch": 4766, "val_loss": 6646124.5} {"train_loss": -26.4721622467041, "global_step": 395661, "epoch": 4767} {"train_loss": -25.65472412109375, "global_step": 395662, "epoch": 4767} {"train_loss": -25.618207931518555, "global_step": 395663, "epoch": 4767} {"train_loss": -24.4292049407959, "global_step": 395664, "epoch": 4767} {"train_loss": -25.164758682250977, "global_step": 395665, "epoch": 4767} {"train_loss": -25.11490821838379, "global_step": 395666, "epoch": 4767} {"train_loss": -25.765167236328125, "global_step": 395667, "epoch": 4767} {"train_loss": -25.89827537536621, "global_step": 395668, "epoch": 4767} {"train_loss": -26.19294548034668, "global_step": 395669, "epoch": 4767} {"train_loss": -26.07675552368164, "global_step": 395670, "epoch": 4767} {"train_loss": -25.661447525024414, "global_step": 395671, "epoch": 4767} {"train_loss": -26.14472007751465, "global_step": 395672, "epoch": 4767} {"train_loss": -26.084375381469727, "global_step": 395673, "epoch": 4767} {"train_loss": -25.957910537719727, "global_step": 395674, "epoch": 4767} {"train_loss": -26.3311710357666, "global_step": 395675, "epoch": 4767} {"train_loss": -26.352325439453125, "global_step": 395676, "epoch": 4767} {"train_loss": -26.253650665283203, "global_step": 395677, "epoch": 4767} {"train_loss": -26.38474464416504, "global_step": 395678, "epoch": 4767} {"train_loss": -26.30741310119629, "global_step": 395679, "epoch": 4767} {"train_loss": -26.28509521484375, "global_step": 395680, "epoch": 4767} {"train_loss": -26.297332763671875, "global_step": 395681, "epoch": 4767} {"train_loss": -26.430456161499023, "global_step": 395682, "epoch": 4767} {"train_loss": -26.06201171875, "global_step": 395683, "epoch": 4767} {"train_loss": -26.90338706970215, "global_step": 395684, "epoch": 4767} {"train_loss": -26.705663681030273, "global_step": 395685, "epoch": 4767} {"train_loss": -26.41389274597168, "global_step": 395686, "epoch": 4767} {"train_loss": -26.627548217773438, "global_step": 395687, "epoch": 4767} {"train_loss": -26.4429874420166, "global_step": 395688, "epoch": 4767} {"train_loss": -26.30604362487793, "global_step": 395689, "epoch": 4767} {"train_loss": -27.127099990844727, "global_step": 395690, "epoch": 4767} {"train_loss": -26.662250518798828, "global_step": 395691, "epoch": 4767} {"train_loss": -26.604724884033203, "global_step": 395692, "epoch": 4767} {"train_loss": -26.565717697143555, "global_step": 395693, "epoch": 4767} {"train_loss": -26.703872680664062, "global_step": 395694, "epoch": 4767} {"train_loss": -26.298131942749023, "global_step": 395695, "epoch": 4767} {"train_loss": -26.575794219970703, "global_step": 395696, "epoch": 4767} {"train_loss": -26.85284423828125, "global_step": 395697, "epoch": 4767} {"train_loss": -26.427490234375, "global_step": 395698, "epoch": 4767} {"train_loss": -26.455005645751953, "global_step": 395699, "epoch": 4767} {"train_loss": -26.6159610748291, "global_step": 395700, "epoch": 4767} {"train_loss": -26.51093101501465, "global_step": 395701, "epoch": 4767} {"train_loss": -26.27579116821289, "global_step": 395702, "epoch": 4767} {"train_loss": -26.44305419921875, "global_step": 395703, "epoch": 4767} {"train_loss": -26.211883544921875, "global_step": 395704, "epoch": 4767} {"train_loss": -26.61004638671875, "global_step": 395705, "epoch": 4767} {"train_loss": -26.422290802001953, "global_step": 395706, "epoch": 4767} {"train_loss": -26.338850021362305, "global_step": 395707, "epoch": 4767} {"train_loss": -26.525741577148438, "global_step": 395708, "epoch": 4767} {"train_loss": -26.5175724029541, "global_step": 395709, "epoch": 4767} {"train_loss": -26.33807373046875, "global_step": 395710, "epoch": 4767} {"train_loss": -26.331607818603516, "global_step": 395711, "epoch": 4767} {"train_loss": -26.51190757751465, "global_step": 395712, "epoch": 4767} {"train_loss": -26.693090438842773, "global_step": 395713, "epoch": 4767} {"train_loss": -26.270383834838867, "global_step": 395714, "epoch": 4767} {"train_loss": -26.371570587158203, "global_step": 395715, "epoch": 4767} {"train_loss": -26.107379913330078, "global_step": 395716, "epoch": 4767} {"train_loss": -26.701303482055664, "global_step": 395717, "epoch": 4767} {"train_loss": -26.44219970703125, "global_step": 395718, "epoch": 4767} {"train_loss": -26.03375816345215, "global_step": 395719, "epoch": 4767} {"train_loss": -26.45957374572754, "global_step": 395720, "epoch": 4767} {"train_loss": -26.41866111755371, "global_step": 395721, "epoch": 4767} {"train_loss": -26.084081649780273, "global_step": 395722, "epoch": 4767} {"train_loss": -26.19985008239746, "global_step": 395723, "epoch": 4767} {"train_loss": -26.647449493408203, "global_step": 395724, "epoch": 4767} {"train_loss": -26.465930938720703, "global_step": 395725, "epoch": 4767} {"train_loss": -26.186725616455078, "global_step": 395726, "epoch": 4767} {"train_loss": -26.225141525268555, "global_step": 395727, "epoch": 4767} {"train_loss": -26.042713165283203, "global_step": 395728, "epoch": 4767} {"train_loss": -26.1596622467041, "global_step": 395729, "epoch": 4767} {"train_loss": -25.939971923828125, "global_step": 395730, "epoch": 4767} {"train_loss": -26.361371994018555, "global_step": 395731, "epoch": 4767} {"train_loss": -26.209217071533203, "global_step": 395732, "epoch": 4767} {"train_loss": -25.570497512817383, "global_step": 395733, "epoch": 4767} {"train_loss": -25.91650390625, "global_step": 395734, "epoch": 4767} {"train_loss": -26.102462768554688, "global_step": 395735, "epoch": 4767} {"train_loss": -26.538503646850586, "global_step": 395736, "epoch": 4767} {"train_loss": -26.467390060424805, "global_step": 395737, "epoch": 4767} {"train_loss": -26.40203285217285, "global_step": 395738, "epoch": 4767} {"train_loss": -26.253284454345703, "global_step": 395739, "epoch": 4767} {"train_loss": -26.126224517822266, "global_step": 395740, "epoch": 4767} {"train_loss": -26.320859909057617, "global_step": 395741, "epoch": 4767} {"train_loss": -26.795751571655273, "global_step": 395742, "epoch": 4767} {"train_loss": -26.284883820866963, "global_step": 395743, "epoch": 4767, "val_loss": 6694589.0} {"train_loss": -26.526126861572266, "global_step": 395744, "epoch": 4768} {"train_loss": -26.214502334594727, "global_step": 395745, "epoch": 4768} {"train_loss": -26.10337257385254, "global_step": 395746, "epoch": 4768} {"train_loss": -26.5634765625, "global_step": 395747, "epoch": 4768} {"train_loss": -26.570083618164062, "global_step": 395748, "epoch": 4768} {"train_loss": -26.1495418548584, "global_step": 395749, "epoch": 4768} {"train_loss": -26.5025691986084, "global_step": 395750, "epoch": 4768} {"train_loss": -26.777204513549805, "global_step": 395751, "epoch": 4768} {"train_loss": -26.115568161010742, "global_step": 395752, "epoch": 4768} {"train_loss": -26.157073974609375, "global_step": 395753, "epoch": 4768} {"train_loss": -26.432966232299805, "global_step": 395754, "epoch": 4768} {"train_loss": -26.41558265686035, "global_step": 395755, "epoch": 4768} {"train_loss": -26.5565185546875, "global_step": 395756, "epoch": 4768} {"train_loss": -26.589645385742188, "global_step": 395757, "epoch": 4768} {"train_loss": -26.337682723999023, "global_step": 395758, "epoch": 4768} {"train_loss": -26.596282958984375, "global_step": 395759, "epoch": 4768} {"train_loss": -26.282684326171875, "global_step": 395760, "epoch": 4768} {"train_loss": -26.537824630737305, "global_step": 395761, "epoch": 4768} {"train_loss": -26.460065841674805, "global_step": 395762, "epoch": 4768} {"train_loss": -26.561725616455078, "global_step": 395763, "epoch": 4768} {"train_loss": -26.31671142578125, "global_step": 395764, "epoch": 4768} {"train_loss": -26.738798141479492, "global_step": 395765, "epoch": 4768} {"train_loss": -27.19611167907715, "global_step": 395766, "epoch": 4768} {"train_loss": -26.704519271850586, "global_step": 395767, "epoch": 4768} {"train_loss": -26.84564208984375, "global_step": 395768, "epoch": 4768} {"train_loss": -27.070892333984375, "global_step": 395769, "epoch": 4768} {"train_loss": -26.6705265045166, "global_step": 395770, "epoch": 4768} {"train_loss": -26.358983993530273, "global_step": 395771, "epoch": 4768} {"train_loss": -26.735355377197266, "global_step": 395772, "epoch": 4768} {"train_loss": -26.430316925048828, "global_step": 395773, "epoch": 4768} {"train_loss": -26.742700576782227, "global_step": 395774, "epoch": 4768} {"train_loss": -27.085601806640625, "global_step": 395775, "epoch": 4768} {"train_loss": -26.588409423828125, "global_step": 395776, "epoch": 4768} {"train_loss": -26.376789093017578, "global_step": 395777, "epoch": 4768} {"train_loss": -26.515920639038086, "global_step": 395778, "epoch": 4768} {"train_loss": -26.231653213500977, "global_step": 395779, "epoch": 4768} {"train_loss": -26.363285064697266, "global_step": 395780, "epoch": 4768} {"train_loss": -26.723730087280273, "global_step": 395781, "epoch": 4768} {"train_loss": -26.643774032592773, "global_step": 395782, "epoch": 4768} {"train_loss": -26.690200805664062, "global_step": 395783, "epoch": 4768} {"train_loss": -26.664447784423828, "global_step": 395784, "epoch": 4768} {"train_loss": -26.828832626342773, "global_step": 395785, "epoch": 4768} {"train_loss": -26.451513290405273, "global_step": 395786, "epoch": 4768} {"train_loss": -26.648000717163086, "global_step": 395787, "epoch": 4768} {"train_loss": -26.681396484375, "global_step": 395788, "epoch": 4768} {"train_loss": -27.100269317626953, "global_step": 395789, "epoch": 4768} {"train_loss": -26.944238662719727, "global_step": 395790, "epoch": 4768} {"train_loss": -26.627899169921875, "global_step": 395791, "epoch": 4768} {"train_loss": -26.5810604095459, "global_step": 395792, "epoch": 4768} {"train_loss": -26.564008712768555, "global_step": 395793, "epoch": 4768} {"train_loss": -26.849084854125977, "global_step": 395794, "epoch": 4768} {"train_loss": -26.536392211914062, "global_step": 395795, "epoch": 4768} {"train_loss": -26.4135684967041, "global_step": 395796, "epoch": 4768} {"train_loss": -25.907896041870117, "global_step": 395797, "epoch": 4768} {"train_loss": -26.093915939331055, "global_step": 395798, "epoch": 4768} {"train_loss": -26.078632354736328, "global_step": 395799, "epoch": 4768} {"train_loss": -26.713647842407227, "global_step": 395800, "epoch": 4768} {"train_loss": -26.566308975219727, "global_step": 395801, "epoch": 4768} {"train_loss": -25.841251373291016, "global_step": 395802, "epoch": 4768} {"train_loss": -26.602834701538086, "global_step": 395803, "epoch": 4768} {"train_loss": -26.769418716430664, "global_step": 395804, "epoch": 4768} {"train_loss": -26.5418643951416, "global_step": 395805, "epoch": 4768} {"train_loss": -26.140710830688477, "global_step": 395806, "epoch": 4768} {"train_loss": -26.435083389282227, "global_step": 395807, "epoch": 4768} {"train_loss": -26.44769287109375, "global_step": 395808, "epoch": 4768} {"train_loss": -26.917932510375977, "global_step": 395809, "epoch": 4768} {"train_loss": -26.683496475219727, "global_step": 395810, "epoch": 4768} {"train_loss": -26.213979721069336, "global_step": 395811, "epoch": 4768} {"train_loss": -26.388696670532227, "global_step": 395812, "epoch": 4768} {"train_loss": -26.548023223876953, "global_step": 395813, "epoch": 4768} {"train_loss": -26.3968505859375, "global_step": 395814, "epoch": 4768} {"train_loss": -26.699234008789062, "global_step": 395815, "epoch": 4768} {"train_loss": -26.848957061767578, "global_step": 395816, "epoch": 4768} {"train_loss": -26.37672233581543, "global_step": 395817, "epoch": 4768} {"train_loss": -26.63010597229004, "global_step": 395818, "epoch": 4768} {"train_loss": -26.464746475219727, "global_step": 395819, "epoch": 4768} {"train_loss": -26.701486587524414, "global_step": 395820, "epoch": 4768} {"train_loss": -26.666778564453125, "global_step": 395821, "epoch": 4768} {"train_loss": -26.439105987548828, "global_step": 395822, "epoch": 4768} {"train_loss": -26.082677841186523, "global_step": 395823, "epoch": 4768} {"train_loss": -25.9335994720459, "global_step": 395824, "epoch": 4768} {"train_loss": -26.231901168823242, "global_step": 395825, "epoch": 4768} {"train_loss": -26.50293904040233, "global_step": 395826, "epoch": 4768, "val_loss": 6616877.5} {"train_loss": -24.329753875732422, "global_step": 395827, "epoch": 4769} {"train_loss": -23.04273796081543, "global_step": 395828, "epoch": 4769} {"train_loss": -24.230304718017578, "global_step": 395829, "epoch": 4769} {"train_loss": -23.5665340423584, "global_step": 395830, "epoch": 4769} {"train_loss": -25.43692970275879, "global_step": 395831, "epoch": 4769} {"train_loss": -24.74959373474121, "global_step": 395832, "epoch": 4769} {"train_loss": -25.16755485534668, "global_step": 395833, "epoch": 4769} {"train_loss": -24.628835678100586, "global_step": 395834, "epoch": 4769} {"train_loss": -24.682544708251953, "global_step": 395835, "epoch": 4769} {"train_loss": -25.153162002563477, "global_step": 395836, "epoch": 4769} {"train_loss": -25.11882781982422, "global_step": 395837, "epoch": 4769} {"train_loss": -25.45039939880371, "global_step": 395838, "epoch": 4769} {"train_loss": -25.166820526123047, "global_step": 395839, "epoch": 4769} {"train_loss": -25.742767333984375, "global_step": 395840, "epoch": 4769} {"train_loss": -25.31336784362793, "global_step": 395841, "epoch": 4769} {"train_loss": -25.794971466064453, "global_step": 395842, "epoch": 4769} {"train_loss": -25.930871963500977, "global_step": 395843, "epoch": 4769} {"train_loss": -25.713598251342773, "global_step": 395844, "epoch": 4769} {"train_loss": -25.509403228759766, "global_step": 395845, "epoch": 4769} {"train_loss": -25.744709014892578, "global_step": 395846, "epoch": 4769} {"train_loss": -25.82853126525879, "global_step": 395847, "epoch": 4769} {"train_loss": -25.735525131225586, "global_step": 395848, "epoch": 4769} {"train_loss": -25.541664123535156, "global_step": 395849, "epoch": 4769} {"train_loss": -25.576982498168945, "global_step": 395850, "epoch": 4769} {"train_loss": -25.72492790222168, "global_step": 395851, "epoch": 4769} {"train_loss": -25.950590133666992, "global_step": 395852, "epoch": 4769} {"train_loss": -25.929931640625, "global_step": 395853, "epoch": 4769} {"train_loss": -26.177371978759766, "global_step": 395854, "epoch": 4769} {"train_loss": -26.26797866821289, "global_step": 395855, "epoch": 4769} {"train_loss": -26.01875114440918, "global_step": 395856, "epoch": 4769} {"train_loss": -26.486738204956055, "global_step": 395857, "epoch": 4769} {"train_loss": -25.92793083190918, "global_step": 395858, "epoch": 4769} {"train_loss": -25.937612533569336, "global_step": 395859, "epoch": 4769} {"train_loss": -26.24567222595215, "global_step": 395860, "epoch": 4769} {"train_loss": -26.13298988342285, "global_step": 395861, "epoch": 4769} {"train_loss": -26.24700927734375, "global_step": 395862, "epoch": 4769} {"train_loss": -26.587066650390625, "global_step": 395863, "epoch": 4769} {"train_loss": -26.261707305908203, "global_step": 395864, "epoch": 4769} {"train_loss": -26.2219295501709, "global_step": 395865, "epoch": 4769} {"train_loss": -26.497900009155273, "global_step": 395866, "epoch": 4769} {"train_loss": -26.811548233032227, "global_step": 395867, "epoch": 4769} {"train_loss": -26.530258178710938, "global_step": 395868, "epoch": 4769} {"train_loss": -26.276559829711914, "global_step": 395869, "epoch": 4769} {"train_loss": -26.43350601196289, "global_step": 395870, "epoch": 4769} {"train_loss": -26.660322189331055, "global_step": 395871, "epoch": 4769} {"train_loss": -26.506793975830078, "global_step": 395872, "epoch": 4769} {"train_loss": -26.487979888916016, "global_step": 395873, "epoch": 4769} {"train_loss": -26.5128231048584, "global_step": 395874, "epoch": 4769} {"train_loss": -26.609882354736328, "global_step": 395875, "epoch": 4769} {"train_loss": -26.70155906677246, "global_step": 395876, "epoch": 4769} {"train_loss": -26.258752822875977, "global_step": 395877, "epoch": 4769} {"train_loss": -26.6234130859375, "global_step": 395878, "epoch": 4769} {"train_loss": -26.648481369018555, "global_step": 395879, "epoch": 4769} {"train_loss": -26.61240577697754, "global_step": 395880, "epoch": 4769} {"train_loss": -26.89886474609375, "global_step": 395881, "epoch": 4769} {"train_loss": -26.408315658569336, "global_step": 395882, "epoch": 4769} {"train_loss": -26.660139083862305, "global_step": 395883, "epoch": 4769} {"train_loss": -26.627914428710938, "global_step": 395884, "epoch": 4769} {"train_loss": -26.954360961914062, "global_step": 395885, "epoch": 4769} {"train_loss": -26.52125358581543, "global_step": 395886, "epoch": 4769} {"train_loss": -26.572864532470703, "global_step": 395887, "epoch": 4769} {"train_loss": -27.192062377929688, "global_step": 395888, "epoch": 4769} {"train_loss": -26.630859375, "global_step": 395889, "epoch": 4769} {"train_loss": -26.52019691467285, "global_step": 395890, "epoch": 4769} {"train_loss": -26.568506240844727, "global_step": 395891, "epoch": 4769} {"train_loss": -26.780969619750977, "global_step": 395892, "epoch": 4769} {"train_loss": -26.787887573242188, "global_step": 395893, "epoch": 4769} {"train_loss": -26.774219512939453, "global_step": 395894, "epoch": 4769} {"train_loss": -26.64356803894043, "global_step": 395895, "epoch": 4769} {"train_loss": -26.73172950744629, "global_step": 395896, "epoch": 4769} {"train_loss": -26.731637954711914, "global_step": 395897, "epoch": 4769} {"train_loss": -26.80194664001465, "global_step": 395898, "epoch": 4769} {"train_loss": -26.5042724609375, "global_step": 395899, "epoch": 4769} {"train_loss": -26.4647216796875, "global_step": 395900, "epoch": 4769} {"train_loss": -26.755111694335938, "global_step": 395901, "epoch": 4769} {"train_loss": -26.663257598876953, "global_step": 395902, "epoch": 4769} {"train_loss": -26.490747451782227, "global_step": 395903, "epoch": 4769} {"train_loss": -26.751317977905273, "global_step": 395904, "epoch": 4769} {"train_loss": -26.671533584594727, "global_step": 395905, "epoch": 4769} {"train_loss": -26.89161491394043, "global_step": 395906, "epoch": 4769} {"train_loss": -26.72503662109375, "global_step": 395907, "epoch": 4769} {"train_loss": -26.491621017456055, "global_step": 395908, "epoch": 4769} {"train_loss": -26.123062133789062, "global_step": 395909, "epoch": 4769, "val_loss": 6641498.5} {"train_loss": -25.78926658630371, "global_step": 395910, "epoch": 4770} {"train_loss": -25.545522689819336, "global_step": 395911, "epoch": 4770} {"train_loss": -24.5233211517334, "global_step": 395912, "epoch": 4770} {"train_loss": -24.81105613708496, "global_step": 395913, "epoch": 4770} {"train_loss": -26.48345947265625, "global_step": 395914, "epoch": 4770} {"train_loss": -26.09085464477539, "global_step": 395915, "epoch": 4770} {"train_loss": -25.484683990478516, "global_step": 395916, "epoch": 4770} {"train_loss": -25.815534591674805, "global_step": 395917, "epoch": 4770} {"train_loss": -25.981433868408203, "global_step": 395918, "epoch": 4770} {"train_loss": -25.943313598632812, "global_step": 395919, "epoch": 4770} {"train_loss": -26.2268009185791, "global_step": 395920, "epoch": 4770} {"train_loss": -26.232105255126953, "global_step": 395921, "epoch": 4770} {"train_loss": -26.26993751525879, "global_step": 395922, "epoch": 4770} {"train_loss": -25.92278480529785, "global_step": 395923, "epoch": 4770} {"train_loss": -26.319372177124023, "global_step": 395924, "epoch": 4770} {"train_loss": -25.952259063720703, "global_step": 395925, "epoch": 4770} {"train_loss": -26.07305908203125, "global_step": 395926, "epoch": 4770} {"train_loss": -26.212787628173828, "global_step": 395927, "epoch": 4770} {"train_loss": -26.014663696289062, "global_step": 395928, "epoch": 4770} {"train_loss": -26.07586669921875, "global_step": 395929, "epoch": 4770} {"train_loss": -26.50481605529785, "global_step": 395930, "epoch": 4770} {"train_loss": -26.104816436767578, "global_step": 395931, "epoch": 4770} {"train_loss": -26.317142486572266, "global_step": 395932, "epoch": 4770} {"train_loss": -26.067676544189453, "global_step": 395933, "epoch": 4770} {"train_loss": -26.733570098876953, "global_step": 395934, "epoch": 4770} {"train_loss": -26.47486686706543, "global_step": 395935, "epoch": 4770} {"train_loss": -26.45037841796875, "global_step": 395936, "epoch": 4770} {"train_loss": -26.66144371032715, "global_step": 395937, "epoch": 4770} {"train_loss": -26.326635360717773, "global_step": 395938, "epoch": 4770} {"train_loss": -26.7072811126709, "global_step": 395939, "epoch": 4770} {"train_loss": -26.414154052734375, "global_step": 395940, "epoch": 4770} {"train_loss": -26.957937240600586, "global_step": 395941, "epoch": 4770} {"train_loss": -26.662506103515625, "global_step": 395942, "epoch": 4770} {"train_loss": -26.85430908203125, "global_step": 395943, "epoch": 4770} {"train_loss": -26.53192138671875, "global_step": 395944, "epoch": 4770} {"train_loss": -26.652753829956055, "global_step": 395945, "epoch": 4770} {"train_loss": -26.69400978088379, "global_step": 395946, "epoch": 4770} {"train_loss": -26.604949951171875, "global_step": 395947, "epoch": 4770} {"train_loss": -26.615751266479492, "global_step": 395948, "epoch": 4770} {"train_loss": -26.97600746154785, "global_step": 395949, "epoch": 4770} {"train_loss": -26.755802154541016, "global_step": 395950, "epoch": 4770} {"train_loss": -26.81928062438965, "global_step": 395951, "epoch": 4770} {"train_loss": -26.749982833862305, "global_step": 395952, "epoch": 4770} {"train_loss": -26.744049072265625, "global_step": 395953, "epoch": 4770} {"train_loss": -26.629846572875977, "global_step": 395954, "epoch": 4770} {"train_loss": -26.982254028320312, "global_step": 395955, "epoch": 4770} {"train_loss": -26.72206687927246, "global_step": 395956, "epoch": 4770} {"train_loss": -27.097400665283203, "global_step": 395957, "epoch": 4770} {"train_loss": -26.6879940032959, "global_step": 395958, "epoch": 4770} {"train_loss": -26.699420928955078, "global_step": 395959, "epoch": 4770} {"train_loss": -26.95247459411621, "global_step": 395960, "epoch": 4770} {"train_loss": -26.718420028686523, "global_step": 395961, "epoch": 4770} {"train_loss": -26.600330352783203, "global_step": 395962, "epoch": 4770} {"train_loss": -26.620330810546875, "global_step": 395963, "epoch": 4770} {"train_loss": -26.456134796142578, "global_step": 395964, "epoch": 4770} {"train_loss": -26.693119049072266, "global_step": 395965, "epoch": 4770} {"train_loss": -26.938520431518555, "global_step": 395966, "epoch": 4770} {"train_loss": -26.66794204711914, "global_step": 395967, "epoch": 4770} {"train_loss": -26.976037979125977, "global_step": 395968, "epoch": 4770} {"train_loss": -26.821674346923828, "global_step": 395969, "epoch": 4770} {"train_loss": -26.35170555114746, "global_step": 395970, "epoch": 4770} {"train_loss": -26.13153648376465, "global_step": 395971, "epoch": 4770} {"train_loss": -26.509857177734375, "global_step": 395972, "epoch": 4770} {"train_loss": -25.969785690307617, "global_step": 395973, "epoch": 4770} {"train_loss": -25.34882164001465, "global_step": 395974, "epoch": 4770} {"train_loss": -25.423404693603516, "global_step": 395975, "epoch": 4770} {"train_loss": -25.69795036315918, "global_step": 395976, "epoch": 4770} {"train_loss": -26.6285457611084, "global_step": 395977, "epoch": 4770} {"train_loss": -26.240278244018555, "global_step": 395978, "epoch": 4770} {"train_loss": -26.359882354736328, "global_step": 395979, "epoch": 4770} {"train_loss": -26.189844131469727, "global_step": 395980, "epoch": 4770} {"train_loss": -26.2835693359375, "global_step": 395981, "epoch": 4770} {"train_loss": -26.27394676208496, "global_step": 395982, "epoch": 4770} {"train_loss": -26.114410400390625, "global_step": 395983, "epoch": 4770} {"train_loss": -26.11323356628418, "global_step": 395984, "epoch": 4770} {"train_loss": -26.4625186920166, "global_step": 395985, "epoch": 4770} {"train_loss": -26.505512237548828, "global_step": 395986, "epoch": 4770} {"train_loss": -26.418989181518555, "global_step": 395987, "epoch": 4770} {"train_loss": -26.13525390625, "global_step": 395988, "epoch": 4770} {"train_loss": -26.586292266845703, "global_step": 395989, "epoch": 4770} {"train_loss": -26.020124435424805, "global_step": 395990, "epoch": 4770} {"train_loss": -26.733640670776367, "global_step": 395991, "epoch": 4770} {"train_loss": -26.35251263538039, "global_step": 395992, "epoch": 4770, "val_loss": 6445767.0} {"train_loss": -25.96613883972168, "global_step": 395993, "epoch": 4771} {"train_loss": -25.96296501159668, "global_step": 395994, "epoch": 4771} {"train_loss": -26.29204750061035, "global_step": 395995, "epoch": 4771} {"train_loss": -25.61578369140625, "global_step": 395996, "epoch": 4771} {"train_loss": -25.794767379760742, "global_step": 395997, "epoch": 4771} {"train_loss": -25.9478816986084, "global_step": 395998, "epoch": 4771} {"train_loss": -25.931476593017578, "global_step": 395999, "epoch": 4771} {"train_loss": -26.135019302368164, "global_step": 396000, "epoch": 4771} {"train_loss": -26.378238677978516, "global_step": 396001, "epoch": 4771} {"train_loss": -25.92323875427246, "global_step": 396002, "epoch": 4771} {"train_loss": -25.960193634033203, "global_step": 396003, "epoch": 4771} {"train_loss": -26.108551025390625, "global_step": 396004, "epoch": 4771} {"train_loss": -26.0482234954834, "global_step": 396005, "epoch": 4771} {"train_loss": -26.35599708557129, "global_step": 396006, "epoch": 4771} {"train_loss": -26.179325103759766, "global_step": 396007, "epoch": 4771} {"train_loss": -26.131467819213867, "global_step": 396008, "epoch": 4771} {"train_loss": -26.591079711914062, "global_step": 396009, "epoch": 4771} {"train_loss": -26.392194747924805, "global_step": 396010, "epoch": 4771} {"train_loss": -26.094226837158203, "global_step": 396011, "epoch": 4771} {"train_loss": -26.7947998046875, "global_step": 396012, "epoch": 4771} {"train_loss": -26.559814453125, "global_step": 396013, "epoch": 4771} {"train_loss": -26.514225006103516, "global_step": 396014, "epoch": 4771} {"train_loss": -26.53761100769043, "global_step": 396015, "epoch": 4771} {"train_loss": -26.5869083404541, "global_step": 396016, "epoch": 4771} {"train_loss": -26.837600708007812, "global_step": 396017, "epoch": 4771} {"train_loss": -26.4267578125, "global_step": 396018, "epoch": 4771} {"train_loss": -26.276086807250977, "global_step": 396019, "epoch": 4771} {"train_loss": -26.17339515686035, "global_step": 396020, "epoch": 4771} {"train_loss": -26.547439575195312, "global_step": 396021, "epoch": 4771} {"train_loss": -26.939884185791016, "global_step": 396022, "epoch": 4771} {"train_loss": -26.363849639892578, "global_step": 396023, "epoch": 4771} {"train_loss": -26.39666748046875, "global_step": 396024, "epoch": 4771} {"train_loss": -26.958953857421875, "global_step": 396025, "epoch": 4771} {"train_loss": -26.67744255065918, "global_step": 396026, "epoch": 4771} {"train_loss": -26.74775505065918, "global_step": 396027, "epoch": 4771} {"train_loss": -26.55731201171875, "global_step": 396028, "epoch": 4771} {"train_loss": -26.396459579467773, "global_step": 396029, "epoch": 4771} {"train_loss": -26.567596435546875, "global_step": 396030, "epoch": 4771} {"train_loss": -26.9676513671875, "global_step": 396031, "epoch": 4771} {"train_loss": -26.6380615234375, "global_step": 396032, "epoch": 4771} {"train_loss": -26.77899742126465, "global_step": 396033, "epoch": 4771} {"train_loss": -26.64649772644043, "global_step": 396034, "epoch": 4771} {"train_loss": -26.86136245727539, "global_step": 396035, "epoch": 4771} {"train_loss": -26.64215660095215, "global_step": 396036, "epoch": 4771} {"train_loss": -26.82391357421875, "global_step": 396037, "epoch": 4771} {"train_loss": -26.210651397705078, "global_step": 396038, "epoch": 4771} {"train_loss": -27.216054916381836, "global_step": 396039, "epoch": 4771} {"train_loss": -26.9775390625, "global_step": 396040, "epoch": 4771} {"train_loss": -26.65640640258789, "global_step": 396041, "epoch": 4771} {"train_loss": -26.528289794921875, "global_step": 396042, "epoch": 4771} {"train_loss": -26.489810943603516, "global_step": 396043, "epoch": 4771} {"train_loss": -26.246442794799805, "global_step": 396044, "epoch": 4771} {"train_loss": -27.01545524597168, "global_step": 396045, "epoch": 4771} {"train_loss": -26.821308135986328, "global_step": 396046, "epoch": 4771} {"train_loss": -26.54426383972168, "global_step": 396047, "epoch": 4771} {"train_loss": -27.000146865844727, "global_step": 396048, "epoch": 4771} {"train_loss": -26.52433204650879, "global_step": 396049, "epoch": 4771} {"train_loss": -26.686267852783203, "global_step": 396050, "epoch": 4771} {"train_loss": -26.520109176635742, "global_step": 396051, "epoch": 4771} {"train_loss": -26.647138595581055, "global_step": 396052, "epoch": 4771} {"train_loss": -26.45307731628418, "global_step": 396053, "epoch": 4771} {"train_loss": -26.529632568359375, "global_step": 396054, "epoch": 4771} {"train_loss": -26.310672760009766, "global_step": 396055, "epoch": 4771} {"train_loss": -26.431623458862305, "global_step": 396056, "epoch": 4771} {"train_loss": -26.4227237701416, "global_step": 396057, "epoch": 4771} {"train_loss": -26.490793228149414, "global_step": 396058, "epoch": 4771} {"train_loss": -26.4268856048584, "global_step": 396059, "epoch": 4771} {"train_loss": -26.756322860717773, "global_step": 396060, "epoch": 4771} {"train_loss": -26.722442626953125, "global_step": 396061, "epoch": 4771} {"train_loss": -26.38153648376465, "global_step": 396062, "epoch": 4771} {"train_loss": -26.349990844726562, "global_step": 396063, "epoch": 4771} {"train_loss": -26.428852081298828, "global_step": 396064, "epoch": 4771} {"train_loss": -26.60981559753418, "global_step": 396065, "epoch": 4771} {"train_loss": -26.312536239624023, "global_step": 396066, "epoch": 4771} {"train_loss": -26.65276527404785, "global_step": 396067, "epoch": 4771} {"train_loss": -26.731830596923828, "global_step": 396068, "epoch": 4771} {"train_loss": -26.915924072265625, "global_step": 396069, "epoch": 4771} {"train_loss": -26.697952270507812, "global_step": 396070, "epoch": 4771} {"train_loss": -26.668333053588867, "global_step": 396071, "epoch": 4771} {"train_loss": -26.556396484375, "global_step": 396072, "epoch": 4771} {"train_loss": -26.887231826782227, "global_step": 396073, "epoch": 4771} {"train_loss": -26.125131607055664, "global_step": 396074, "epoch": 4771} {"train_loss": -26.484046131731517, "global_step": 396075, "epoch": 4771, "val_loss": 6681910.5} {"train_loss": -26.619226455688477, "global_step": 396076, "epoch": 4772} {"train_loss": -26.007965087890625, "global_step": 396077, "epoch": 4772} {"train_loss": -26.124326705932617, "global_step": 396078, "epoch": 4772} {"train_loss": -26.272851943969727, "global_step": 396079, "epoch": 4772} {"train_loss": -26.319326400756836, "global_step": 396080, "epoch": 4772} {"train_loss": -26.341283798217773, "global_step": 396081, "epoch": 4772} {"train_loss": -26.199207305908203, "global_step": 396082, "epoch": 4772} {"train_loss": -25.6910400390625, "global_step": 396083, "epoch": 4772} {"train_loss": -26.07790184020996, "global_step": 396084, "epoch": 4772} {"train_loss": -26.2971248626709, "global_step": 396085, "epoch": 4772} {"train_loss": -25.951507568359375, "global_step": 396086, "epoch": 4772} {"train_loss": -26.067590713500977, "global_step": 396087, "epoch": 4772} {"train_loss": -26.42561912536621, "global_step": 396088, "epoch": 4772} {"train_loss": -26.150068283081055, "global_step": 396089, "epoch": 4772} {"train_loss": -26.31658935546875, "global_step": 396090, "epoch": 4772} {"train_loss": -26.196243286132812, "global_step": 396091, "epoch": 4772} {"train_loss": -26.310571670532227, "global_step": 396092, "epoch": 4772} {"train_loss": -26.29827308654785, "global_step": 396093, "epoch": 4772} {"train_loss": -26.321752548217773, "global_step": 396094, "epoch": 4772} {"train_loss": -26.357213973999023, "global_step": 396095, "epoch": 4772} {"train_loss": -26.41530418395996, "global_step": 396096, "epoch": 4772} {"train_loss": -26.468814849853516, "global_step": 396097, "epoch": 4772} {"train_loss": -26.626773834228516, "global_step": 396098, "epoch": 4772} {"train_loss": -26.570514678955078, "global_step": 396099, "epoch": 4772} {"train_loss": -26.80372428894043, "global_step": 396100, "epoch": 4772} {"train_loss": -26.982526779174805, "global_step": 396101, "epoch": 4772} {"train_loss": -26.512662887573242, "global_step": 396102, "epoch": 4772} {"train_loss": -26.634260177612305, "global_step": 396103, "epoch": 4772} {"train_loss": -26.590076446533203, "global_step": 396104, "epoch": 4772} {"train_loss": -26.639368057250977, "global_step": 396105, "epoch": 4772} {"train_loss": -26.454486846923828, "global_step": 396106, "epoch": 4772} {"train_loss": -26.59937858581543, "global_step": 396107, "epoch": 4772} {"train_loss": -26.779088973999023, "global_step": 396108, "epoch": 4772} {"train_loss": -26.717945098876953, "global_step": 396109, "epoch": 4772} {"train_loss": -26.497106552124023, "global_step": 396110, "epoch": 4772} {"train_loss": -26.615177154541016, "global_step": 396111, "epoch": 4772} {"train_loss": -26.24732780456543, "global_step": 396112, "epoch": 4772} {"train_loss": -26.260547637939453, "global_step": 396113, "epoch": 4772} {"train_loss": -26.309925079345703, "global_step": 396114, "epoch": 4772} {"train_loss": -26.677356719970703, "global_step": 396115, "epoch": 4772} {"train_loss": -26.452594757080078, "global_step": 396116, "epoch": 4772} {"train_loss": -26.521289825439453, "global_step": 396117, "epoch": 4772} {"train_loss": -26.271366119384766, "global_step": 396118, "epoch": 4772} {"train_loss": -26.567890167236328, "global_step": 396119, "epoch": 4772} {"train_loss": -26.53921890258789, "global_step": 396120, "epoch": 4772} {"train_loss": -26.550418853759766, "global_step": 396121, "epoch": 4772} {"train_loss": -26.576459884643555, "global_step": 396122, "epoch": 4772} {"train_loss": -26.400659561157227, "global_step": 396123, "epoch": 4772} {"train_loss": -26.513647079467773, "global_step": 396124, "epoch": 4772} {"train_loss": -26.54353141784668, "global_step": 396125, "epoch": 4772} {"train_loss": -26.464218139648438, "global_step": 396126, "epoch": 4772} {"train_loss": -26.821027755737305, "global_step": 396127, "epoch": 4772} {"train_loss": -26.780460357666016, "global_step": 396128, "epoch": 4772} {"train_loss": -26.47327995300293, "global_step": 396129, "epoch": 4772} {"train_loss": -26.63667106628418, "global_step": 396130, "epoch": 4772} {"train_loss": -27.442068099975586, "global_step": 396131, "epoch": 4772} {"train_loss": -26.742191314697266, "global_step": 396132, "epoch": 4772} {"train_loss": -26.366168975830078, "global_step": 396133, "epoch": 4772} {"train_loss": -27.042882919311523, "global_step": 396134, "epoch": 4772} {"train_loss": -26.4849910736084, "global_step": 396135, "epoch": 4772} {"train_loss": -26.83038902282715, "global_step": 396136, "epoch": 4772} {"train_loss": -26.460559844970703, "global_step": 396137, "epoch": 4772} {"train_loss": -26.831655502319336, "global_step": 396138, "epoch": 4772} {"train_loss": -26.90496826171875, "global_step": 396139, "epoch": 4772} {"train_loss": -26.89008140563965, "global_step": 396140, "epoch": 4772} {"train_loss": -27.191816329956055, "global_step": 396141, "epoch": 4772} {"train_loss": -26.803442001342773, "global_step": 396142, "epoch": 4772} {"train_loss": -26.71796226501465, "global_step": 396143, "epoch": 4772} {"train_loss": -26.832660675048828, "global_step": 396144, "epoch": 4772} {"train_loss": -26.661834716796875, "global_step": 396145, "epoch": 4772} {"train_loss": -26.403913497924805, "global_step": 396146, "epoch": 4772} {"train_loss": -26.527029037475586, "global_step": 396147, "epoch": 4772} {"train_loss": -26.93486976623535, "global_step": 396148, "epoch": 4772} {"train_loss": -26.72706413269043, "global_step": 396149, "epoch": 4772} {"train_loss": -26.606489181518555, "global_step": 396150, "epoch": 4772} {"train_loss": -26.810409545898438, "global_step": 396151, "epoch": 4772} {"train_loss": -26.785985946655273, "global_step": 396152, "epoch": 4772} {"train_loss": -26.9424991607666, "global_step": 396153, "epoch": 4772} {"train_loss": -26.806610107421875, "global_step": 396154, "epoch": 4772} {"train_loss": -26.56878662109375, "global_step": 396155, "epoch": 4772} {"train_loss": -26.780094146728516, "global_step": 396156, "epoch": 4772} {"train_loss": -26.700586318969727, "global_step": 396157, "epoch": 4772} {"train_loss": -26.544849395751953, "global_step": 396158, "epoch": 4772, "val_loss": 6660945.0} {"train_loss": -25.79937744140625, "global_step": 396159, "epoch": 4773} {"train_loss": -25.098468780517578, "global_step": 396160, "epoch": 4773} {"train_loss": -25.286745071411133, "global_step": 396161, "epoch": 4773} {"train_loss": -25.76725196838379, "global_step": 396162, "epoch": 4773} {"train_loss": -25.3125057220459, "global_step": 396163, "epoch": 4773} {"train_loss": -25.491418838500977, "global_step": 396164, "epoch": 4773} {"train_loss": -25.58270263671875, "global_step": 396165, "epoch": 4773} {"train_loss": -25.759265899658203, "global_step": 396166, "epoch": 4773} {"train_loss": -25.9542293548584, "global_step": 396167, "epoch": 4773} {"train_loss": -25.8619327545166, "global_step": 396168, "epoch": 4773} {"train_loss": -26.014196395874023, "global_step": 396169, "epoch": 4773} {"train_loss": -26.50055503845215, "global_step": 396170, "epoch": 4773} {"train_loss": -25.974323272705078, "global_step": 396171, "epoch": 4773} {"train_loss": -26.364301681518555, "global_step": 396172, "epoch": 4773} {"train_loss": -25.913000106811523, "global_step": 396173, "epoch": 4773} {"train_loss": -26.032987594604492, "global_step": 396174, "epoch": 4773} {"train_loss": -26.0472354888916, "global_step": 396175, "epoch": 4773} {"train_loss": -26.23443031311035, "global_step": 396176, "epoch": 4773} {"train_loss": -26.289960861206055, "global_step": 396177, "epoch": 4773} {"train_loss": -26.721288681030273, "global_step": 396178, "epoch": 4773} {"train_loss": -26.56328773498535, "global_step": 396179, "epoch": 4773} {"train_loss": -26.575056076049805, "global_step": 396180, "epoch": 4773} {"train_loss": -26.487503051757812, "global_step": 396181, "epoch": 4773} {"train_loss": -26.64306640625, "global_step": 396182, "epoch": 4773} {"train_loss": -26.571374893188477, "global_step": 396183, "epoch": 4773} {"train_loss": -26.315397262573242, "global_step": 396184, "epoch": 4773} {"train_loss": -26.720783233642578, "global_step": 396185, "epoch": 4773} {"train_loss": -26.663415908813477, "global_step": 396186, "epoch": 4773} {"train_loss": -26.764373779296875, "global_step": 396187, "epoch": 4773} {"train_loss": -26.80231285095215, "global_step": 396188, "epoch": 4773} {"train_loss": -26.745161056518555, "global_step": 396189, "epoch": 4773} {"train_loss": -26.907852172851562, "global_step": 396190, "epoch": 4773} {"train_loss": -26.799468994140625, "global_step": 396191, "epoch": 4773} {"train_loss": -26.47861671447754, "global_step": 396192, "epoch": 4773} {"train_loss": -26.299549102783203, "global_step": 396193, "epoch": 4773} {"train_loss": -26.28367042541504, "global_step": 396194, "epoch": 4773} {"train_loss": -26.92681312561035, "global_step": 396195, "epoch": 4773} {"train_loss": -26.616361618041992, "global_step": 396196, "epoch": 4773} {"train_loss": -26.82333755493164, "global_step": 396197, "epoch": 4773} {"train_loss": -26.781696319580078, "global_step": 396198, "epoch": 4773} {"train_loss": -26.777769088745117, "global_step": 396199, "epoch": 4773} {"train_loss": -26.512939453125, "global_step": 396200, "epoch": 4773} {"train_loss": -26.615100860595703, "global_step": 396201, "epoch": 4773} {"train_loss": -26.815942764282227, "global_step": 396202, "epoch": 4773} {"train_loss": -26.7672176361084, "global_step": 396203, "epoch": 4773} {"train_loss": -26.856298446655273, "global_step": 396204, "epoch": 4773} {"train_loss": -27.004642486572266, "global_step": 396205, "epoch": 4773} {"train_loss": -26.674213409423828, "global_step": 396206, "epoch": 4773} {"train_loss": -26.846799850463867, "global_step": 396207, "epoch": 4773} {"train_loss": -26.8436222076416, "global_step": 396208, "epoch": 4773} {"train_loss": -26.598840713500977, "global_step": 396209, "epoch": 4773} {"train_loss": -26.853551864624023, "global_step": 396210, "epoch": 4773} {"train_loss": -26.770334243774414, "global_step": 396211, "epoch": 4773} {"train_loss": -26.198841094970703, "global_step": 396212, "epoch": 4773} {"train_loss": -26.980365753173828, "global_step": 396213, "epoch": 4773} {"train_loss": -26.391218185424805, "global_step": 396214, "epoch": 4773} {"train_loss": -26.56174087524414, "global_step": 396215, "epoch": 4773} {"train_loss": -26.708087921142578, "global_step": 396216, "epoch": 4773} {"train_loss": -26.71144676208496, "global_step": 396217, "epoch": 4773} {"train_loss": -26.6683349609375, "global_step": 396218, "epoch": 4773} {"train_loss": -26.779178619384766, "global_step": 396219, "epoch": 4773} {"train_loss": -26.715368270874023, "global_step": 396220, "epoch": 4773} {"train_loss": -26.6812744140625, "global_step": 396221, "epoch": 4773} {"train_loss": -26.357391357421875, "global_step": 396222, "epoch": 4773} {"train_loss": -26.84577751159668, "global_step": 396223, "epoch": 4773} {"train_loss": -26.679752349853516, "global_step": 396224, "epoch": 4773} {"train_loss": -26.232934951782227, "global_step": 396225, "epoch": 4773} {"train_loss": -26.998594284057617, "global_step": 396226, "epoch": 4773} {"train_loss": -26.869115829467773, "global_step": 396227, "epoch": 4773} {"train_loss": -26.57611083984375, "global_step": 396228, "epoch": 4773} {"train_loss": -26.395370483398438, "global_step": 396229, "epoch": 4773} {"train_loss": -26.67591667175293, "global_step": 396230, "epoch": 4773} {"train_loss": -26.514667510986328, "global_step": 396231, "epoch": 4773} {"train_loss": -26.523218154907227, "global_step": 396232, "epoch": 4773} {"train_loss": -26.727392196655273, "global_step": 396233, "epoch": 4773} {"train_loss": -26.572067260742188, "global_step": 396234, "epoch": 4773} {"train_loss": -26.705520629882812, "global_step": 396235, "epoch": 4773} {"train_loss": -26.522491455078125, "global_step": 396236, "epoch": 4773} {"train_loss": -26.645055770874023, "global_step": 396237, "epoch": 4773} {"train_loss": -26.64198112487793, "global_step": 396238, "epoch": 4773} {"train_loss": -26.626361846923828, "global_step": 396239, "epoch": 4773} {"train_loss": -26.645771026611328, "global_step": 396240, "epoch": 4773} {"train_loss": -26.489371931696514, "global_step": 396241, "epoch": 4773, "val_loss": 6636363.0} {"train_loss": -25.695348739624023, "global_step": 396242, "epoch": 4774} {"train_loss": -26.151081085205078, "global_step": 396243, "epoch": 4774} {"train_loss": -25.769994735717773, "global_step": 396244, "epoch": 4774} {"train_loss": -25.993249893188477, "global_step": 396245, "epoch": 4774} {"train_loss": -26.13795280456543, "global_step": 396246, "epoch": 4774} {"train_loss": -25.894214630126953, "global_step": 396247, "epoch": 4774} {"train_loss": -25.919111251831055, "global_step": 396248, "epoch": 4774} {"train_loss": -26.009763717651367, "global_step": 396249, "epoch": 4774} {"train_loss": -26.012720108032227, "global_step": 396250, "epoch": 4774} {"train_loss": -26.27198600769043, "global_step": 396251, "epoch": 4774} {"train_loss": -26.570825576782227, "global_step": 396252, "epoch": 4774} {"train_loss": -26.38368034362793, "global_step": 396253, "epoch": 4774} {"train_loss": -26.289960861206055, "global_step": 396254, "epoch": 4774} {"train_loss": -26.146488189697266, "global_step": 396255, "epoch": 4774} {"train_loss": -26.335041046142578, "global_step": 396256, "epoch": 4774} {"train_loss": -25.866836547851562, "global_step": 396257, "epoch": 4774} {"train_loss": -26.270462036132812, "global_step": 396258, "epoch": 4774} {"train_loss": -26.665897369384766, "global_step": 396259, "epoch": 4774} {"train_loss": -26.718793869018555, "global_step": 396260, "epoch": 4774} {"train_loss": -26.567041397094727, "global_step": 396261, "epoch": 4774} {"train_loss": -26.64887809753418, "global_step": 396262, "epoch": 4774} {"train_loss": -26.792896270751953, "global_step": 396263, "epoch": 4774} {"train_loss": -26.266386032104492, "global_step": 396264, "epoch": 4774} {"train_loss": -26.43267250061035, "global_step": 396265, "epoch": 4774} {"train_loss": -26.747053146362305, "global_step": 396266, "epoch": 4774} {"train_loss": -26.81561851501465, "global_step": 396267, "epoch": 4774} {"train_loss": -26.60262107849121, "global_step": 396268, "epoch": 4774} {"train_loss": -26.741315841674805, "global_step": 396269, "epoch": 4774} {"train_loss": -26.86871910095215, "global_step": 396270, "epoch": 4774} {"train_loss": -26.573633193969727, "global_step": 396271, "epoch": 4774} {"train_loss": -26.48893165588379, "global_step": 396272, "epoch": 4774} {"train_loss": -26.804121017456055, "global_step": 396273, "epoch": 4774} {"train_loss": -26.8363094329834, "global_step": 396274, "epoch": 4774} {"train_loss": -26.596221923828125, "global_step": 396275, "epoch": 4774} {"train_loss": -26.366498947143555, "global_step": 396276, "epoch": 4774} {"train_loss": -26.612390518188477, "global_step": 396277, "epoch": 4774} {"train_loss": -26.45086097717285, "global_step": 396278, "epoch": 4774} {"train_loss": -26.760807037353516, "global_step": 396279, "epoch": 4774} {"train_loss": -26.621740341186523, "global_step": 396280, "epoch": 4774} {"train_loss": -26.818883895874023, "global_step": 396281, "epoch": 4774} {"train_loss": -26.437061309814453, "global_step": 396282, "epoch": 4774} {"train_loss": -26.542444229125977, "global_step": 396283, "epoch": 4774} {"train_loss": -26.748859405517578, "global_step": 396284, "epoch": 4774} {"train_loss": -26.5697078704834, "global_step": 396285, "epoch": 4774} {"train_loss": -27.04754638671875, "global_step": 396286, "epoch": 4774} {"train_loss": -26.841413497924805, "global_step": 396287, "epoch": 4774} {"train_loss": -26.631322860717773, "global_step": 396288, "epoch": 4774} {"train_loss": -26.663578033447266, "global_step": 396289, "epoch": 4774} {"train_loss": -26.308935165405273, "global_step": 396290, "epoch": 4774} {"train_loss": -27.152124404907227, "global_step": 396291, "epoch": 4774} {"train_loss": -26.97149085998535, "global_step": 396292, "epoch": 4774} {"train_loss": -26.606725692749023, "global_step": 396293, "epoch": 4774} {"train_loss": -26.737659454345703, "global_step": 396294, "epoch": 4774} {"train_loss": -26.525571823120117, "global_step": 396295, "epoch": 4774} {"train_loss": -26.695547103881836, "global_step": 396296, "epoch": 4774} {"train_loss": -26.233163833618164, "global_step": 396297, "epoch": 4774} {"train_loss": -26.52212905883789, "global_step": 396298, "epoch": 4774} {"train_loss": -27.068708419799805, "global_step": 396299, "epoch": 4774} {"train_loss": -26.715351104736328, "global_step": 396300, "epoch": 4774} {"train_loss": -26.621814727783203, "global_step": 396301, "epoch": 4774} {"train_loss": -26.684354782104492, "global_step": 396302, "epoch": 4774} {"train_loss": -26.92889976501465, "global_step": 396303, "epoch": 4774} {"train_loss": -27.010406494140625, "global_step": 396304, "epoch": 4774} {"train_loss": -26.668188095092773, "global_step": 396305, "epoch": 4774} {"train_loss": -26.116382598876953, "global_step": 396306, "epoch": 4774} {"train_loss": -25.663007736206055, "global_step": 396307, "epoch": 4774} {"train_loss": -25.040929794311523, "global_step": 396308, "epoch": 4774} {"train_loss": -25.62678337097168, "global_step": 396309, "epoch": 4774} {"train_loss": -25.815872192382812, "global_step": 396310, "epoch": 4774} {"train_loss": -25.56255531311035, "global_step": 396311, "epoch": 4774} {"train_loss": -25.994184494018555, "global_step": 396312, "epoch": 4774} {"train_loss": -26.165246963500977, "global_step": 396313, "epoch": 4774} {"train_loss": -26.12373924255371, "global_step": 396314, "epoch": 4774} {"train_loss": -26.21137046813965, "global_step": 396315, "epoch": 4774} {"train_loss": -26.3199520111084, "global_step": 396316, "epoch": 4774} {"train_loss": -25.869672775268555, "global_step": 396317, "epoch": 4774} {"train_loss": -26.506555557250977, "global_step": 396318, "epoch": 4774} {"train_loss": -26.52099609375, "global_step": 396319, "epoch": 4774} {"train_loss": -26.1873836517334, "global_step": 396320, "epoch": 4774} {"train_loss": -26.29900550842285, "global_step": 396321, "epoch": 4774} {"train_loss": -26.263341903686523, "global_step": 396322, "epoch": 4774} {"train_loss": -25.9226016998291, "global_step": 396323, "epoch": 4774} {"train_loss": -26.42176414397826, "global_step": 396324, "epoch": 4774, "val_loss": 6709278.0} {"train_loss": -26.20297622680664, "global_step": 396325, "epoch": 4775} {"train_loss": -26.336820602416992, "global_step": 396326, "epoch": 4775} {"train_loss": -25.87644386291504, "global_step": 396327, "epoch": 4775} {"train_loss": -26.396020889282227, "global_step": 396328, "epoch": 4775} {"train_loss": -26.47736930847168, "global_step": 396329, "epoch": 4775} {"train_loss": -26.237918853759766, "global_step": 396330, "epoch": 4775} {"train_loss": -26.258249282836914, "global_step": 396331, "epoch": 4775} {"train_loss": -26.32635498046875, "global_step": 396332, "epoch": 4775} {"train_loss": -26.231367111206055, "global_step": 396333, "epoch": 4775} {"train_loss": -26.184844970703125, "global_step": 396334, "epoch": 4775} {"train_loss": -26.799020767211914, "global_step": 396335, "epoch": 4775} {"train_loss": -26.173725128173828, "global_step": 396336, "epoch": 4775} {"train_loss": -26.412214279174805, "global_step": 396337, "epoch": 4775} {"train_loss": -26.03092384338379, "global_step": 396338, "epoch": 4775} {"train_loss": -26.160064697265625, "global_step": 396339, "epoch": 4775} {"train_loss": -26.57171058654785, "global_step": 396340, "epoch": 4775} {"train_loss": -26.461572647094727, "global_step": 396341, "epoch": 4775} {"train_loss": -26.499713897705078, "global_step": 396342, "epoch": 4775} {"train_loss": -26.36576271057129, "global_step": 396343, "epoch": 4775} {"train_loss": -26.217222213745117, "global_step": 396344, "epoch": 4775} {"train_loss": -26.50714111328125, "global_step": 396345, "epoch": 4775} {"train_loss": -26.420181274414062, "global_step": 396346, "epoch": 4775} {"train_loss": -26.553089141845703, "global_step": 396347, "epoch": 4775} {"train_loss": -26.666217803955078, "global_step": 396348, "epoch": 4775} {"train_loss": -26.49140739440918, "global_step": 396349, "epoch": 4775} {"train_loss": -26.731494903564453, "global_step": 396350, "epoch": 4775} {"train_loss": -26.765625, "global_step": 396351, "epoch": 4775} {"train_loss": -26.656539916992188, "global_step": 396352, "epoch": 4775} {"train_loss": -26.8800106048584, "global_step": 396353, "epoch": 4775} {"train_loss": -26.923654556274414, "global_step": 396354, "epoch": 4775} {"train_loss": -26.833984375, "global_step": 396355, "epoch": 4775} {"train_loss": -26.59613609313965, "global_step": 396356, "epoch": 4775} {"train_loss": -26.679174423217773, "global_step": 396357, "epoch": 4775} {"train_loss": -26.7148494720459, "global_step": 396358, "epoch": 4775} {"train_loss": -26.610361099243164, "global_step": 396359, "epoch": 4775} {"train_loss": -26.4515438079834, "global_step": 396360, "epoch": 4775} {"train_loss": -26.9801082611084, "global_step": 396361, "epoch": 4775} {"train_loss": -26.97092056274414, "global_step": 396362, "epoch": 4775} {"train_loss": -26.48624038696289, "global_step": 396363, "epoch": 4775} {"train_loss": -26.451892852783203, "global_step": 396364, "epoch": 4775} {"train_loss": -26.924640655517578, "global_step": 396365, "epoch": 4775} {"train_loss": -26.721744537353516, "global_step": 396366, "epoch": 4775} {"train_loss": -26.482376098632812, "global_step": 396367, "epoch": 4775} {"train_loss": -26.633808135986328, "global_step": 396368, "epoch": 4775} {"train_loss": -26.774188995361328, "global_step": 396369, "epoch": 4775} {"train_loss": -26.533798217773438, "global_step": 396370, "epoch": 4775} {"train_loss": -26.81153678894043, "global_step": 396371, "epoch": 4775} {"train_loss": -26.75227165222168, "global_step": 396372, "epoch": 4775} {"train_loss": -26.64170265197754, "global_step": 396373, "epoch": 4775} {"train_loss": -26.78694725036621, "global_step": 396374, "epoch": 4775} {"train_loss": -26.353391647338867, "global_step": 396375, "epoch": 4775} {"train_loss": -26.173507690429688, "global_step": 396376, "epoch": 4775} {"train_loss": -26.52680778503418, "global_step": 396377, "epoch": 4775} {"train_loss": -26.646223068237305, "global_step": 396378, "epoch": 4775} {"train_loss": -26.345508575439453, "global_step": 396379, "epoch": 4775} {"train_loss": -26.198806762695312, "global_step": 396380, "epoch": 4775} {"train_loss": -26.337970733642578, "global_step": 396381, "epoch": 4775} {"train_loss": -26.722509384155273, "global_step": 396382, "epoch": 4775} {"train_loss": -26.390329360961914, "global_step": 396383, "epoch": 4775} {"train_loss": -26.53614616394043, "global_step": 396384, "epoch": 4775} {"train_loss": -26.439136505126953, "global_step": 396385, "epoch": 4775} {"train_loss": -26.930261611938477, "global_step": 396386, "epoch": 4775} {"train_loss": -27.00310707092285, "global_step": 396387, "epoch": 4775} {"train_loss": -26.463850021362305, "global_step": 396388, "epoch": 4775} {"train_loss": -26.8070011138916, "global_step": 396389, "epoch": 4775} {"train_loss": -26.641569137573242, "global_step": 396390, "epoch": 4775} {"train_loss": -26.668354034423828, "global_step": 396391, "epoch": 4775} {"train_loss": -27.091211318969727, "global_step": 396392, "epoch": 4775} {"train_loss": -26.647724151611328, "global_step": 396393, "epoch": 4775} {"train_loss": -26.448043823242188, "global_step": 396394, "epoch": 4775} {"train_loss": -26.59075355529785, "global_step": 396395, "epoch": 4775} {"train_loss": -26.630521774291992, "global_step": 396396, "epoch": 4775} {"train_loss": -26.70476722717285, "global_step": 396397, "epoch": 4775} {"train_loss": -26.53955078125, "global_step": 396398, "epoch": 4775} {"train_loss": -25.959760665893555, "global_step": 396399, "epoch": 4775} {"train_loss": -26.34360694885254, "global_step": 396400, "epoch": 4775} {"train_loss": -26.309850692749023, "global_step": 396401, "epoch": 4775} {"train_loss": -26.400150299072266, "global_step": 396402, "epoch": 4775} {"train_loss": -26.408597946166992, "global_step": 396403, "epoch": 4775} {"train_loss": -26.018451690673828, "global_step": 396404, "epoch": 4775} {"train_loss": -26.617963790893555, "global_step": 396405, "epoch": 4775} {"train_loss": -26.305225372314453, "global_step": 396406, "epoch": 4775} {"train_loss": -26.548344003148827, "global_step": 396407, "epoch": 4775, "val_loss": 6698446.5} {"train_loss": -25.445938110351562, "global_step": 396408, "epoch": 4776} {"train_loss": -25.262479782104492, "global_step": 396409, "epoch": 4776} {"train_loss": -26.105554580688477, "global_step": 396410, "epoch": 4776} {"train_loss": -25.91305923461914, "global_step": 396411, "epoch": 4776} {"train_loss": -25.499317169189453, "global_step": 396412, "epoch": 4776} {"train_loss": -25.85209083557129, "global_step": 396413, "epoch": 4776} {"train_loss": -25.02606964111328, "global_step": 396414, "epoch": 4776} {"train_loss": -25.426530838012695, "global_step": 396415, "epoch": 4776} {"train_loss": -25.74357032775879, "global_step": 396416, "epoch": 4776} {"train_loss": -25.422033309936523, "global_step": 396417, "epoch": 4776} {"train_loss": -26.00909423828125, "global_step": 396418, "epoch": 4776} {"train_loss": -25.730695724487305, "global_step": 396419, "epoch": 4776} {"train_loss": -26.208852767944336, "global_step": 396420, "epoch": 4776} {"train_loss": -26.32748794555664, "global_step": 396421, "epoch": 4776} {"train_loss": -26.24598503112793, "global_step": 396422, "epoch": 4776} {"train_loss": -26.302743911743164, "global_step": 396423, "epoch": 4776} {"train_loss": -26.311431884765625, "global_step": 396424, "epoch": 4776} {"train_loss": -26.35173988342285, "global_step": 396425, "epoch": 4776} {"train_loss": -26.22108268737793, "global_step": 396426, "epoch": 4776} {"train_loss": -26.431501388549805, "global_step": 396427, "epoch": 4776} {"train_loss": -26.203561782836914, "global_step": 396428, "epoch": 4776} {"train_loss": -26.2984676361084, "global_step": 396429, "epoch": 4776} {"train_loss": -26.547636032104492, "global_step": 396430, "epoch": 4776} {"train_loss": -26.1309814453125, "global_step": 396431, "epoch": 4776} {"train_loss": -26.29591178894043, "global_step": 396432, "epoch": 4776} {"train_loss": -26.448196411132812, "global_step": 396433, "epoch": 4776} {"train_loss": -26.455158233642578, "global_step": 396434, "epoch": 4776} {"train_loss": -26.55596923828125, "global_step": 396435, "epoch": 4776} {"train_loss": -26.246191024780273, "global_step": 396436, "epoch": 4776} {"train_loss": -26.370086669921875, "global_step": 396437, "epoch": 4776} {"train_loss": -26.537933349609375, "global_step": 396438, "epoch": 4776} {"train_loss": -26.552209854125977, "global_step": 396439, "epoch": 4776} {"train_loss": -26.566190719604492, "global_step": 396440, "epoch": 4776} {"train_loss": -26.760465621948242, "global_step": 396441, "epoch": 4776} {"train_loss": -26.771472930908203, "global_step": 396442, "epoch": 4776} {"train_loss": -26.37812614440918, "global_step": 396443, "epoch": 4776} {"train_loss": -26.834497451782227, "global_step": 396444, "epoch": 4776} {"train_loss": -26.8327579498291, "global_step": 396445, "epoch": 4776} {"train_loss": -26.982709884643555, "global_step": 396446, "epoch": 4776} {"train_loss": -26.673145294189453, "global_step": 396447, "epoch": 4776} {"train_loss": -26.742725372314453, "global_step": 396448, "epoch": 4776} {"train_loss": -26.66596794128418, "global_step": 396449, "epoch": 4776} {"train_loss": -26.89588737487793, "global_step": 396450, "epoch": 4776} {"train_loss": -26.908374786376953, "global_step": 396451, "epoch": 4776} {"train_loss": -26.3730411529541, "global_step": 396452, "epoch": 4776} {"train_loss": -26.62890625, "global_step": 396453, "epoch": 4776} {"train_loss": -26.812259674072266, "global_step": 396454, "epoch": 4776} {"train_loss": -26.961896896362305, "global_step": 396455, "epoch": 4776} {"train_loss": -26.97181510925293, "global_step": 396456, "epoch": 4776} {"train_loss": -26.320276260375977, "global_step": 396457, "epoch": 4776} {"train_loss": -26.61250877380371, "global_step": 396458, "epoch": 4776} {"train_loss": -26.694372177124023, "global_step": 396459, "epoch": 4776} {"train_loss": -25.85630226135254, "global_step": 396460, "epoch": 4776} {"train_loss": -26.796966552734375, "global_step": 396461, "epoch": 4776} {"train_loss": -26.826034545898438, "global_step": 396462, "epoch": 4776} {"train_loss": -26.410409927368164, "global_step": 396463, "epoch": 4776} {"train_loss": -26.679401397705078, "global_step": 396464, "epoch": 4776} {"train_loss": -26.810535430908203, "global_step": 396465, "epoch": 4776} {"train_loss": -26.63437271118164, "global_step": 396466, "epoch": 4776} {"train_loss": -26.441852569580078, "global_step": 396467, "epoch": 4776} {"train_loss": -26.392271041870117, "global_step": 396468, "epoch": 4776} {"train_loss": -26.746198654174805, "global_step": 396469, "epoch": 4776} {"train_loss": -26.551244735717773, "global_step": 396470, "epoch": 4776} {"train_loss": -26.59553337097168, "global_step": 396471, "epoch": 4776} {"train_loss": -26.456470489501953, "global_step": 396472, "epoch": 4776} {"train_loss": -26.70184898376465, "global_step": 396473, "epoch": 4776} {"train_loss": -26.427602767944336, "global_step": 396474, "epoch": 4776} {"train_loss": -26.652311325073242, "global_step": 396475, "epoch": 4776} {"train_loss": -26.430089950561523, "global_step": 396476, "epoch": 4776} {"train_loss": -26.893314361572266, "global_step": 396477, "epoch": 4776} {"train_loss": -26.801496505737305, "global_step": 396478, "epoch": 4776} {"train_loss": -26.119964599609375, "global_step": 396479, "epoch": 4776} {"train_loss": -26.042804718017578, "global_step": 396480, "epoch": 4776} {"train_loss": -26.324792861938477, "global_step": 396481, "epoch": 4776} {"train_loss": -26.534399032592773, "global_step": 396482, "epoch": 4776} {"train_loss": -26.3826961517334, "global_step": 396483, "epoch": 4776} {"train_loss": -26.582416534423828, "global_step": 396484, "epoch": 4776} {"train_loss": -26.44019889831543, "global_step": 396485, "epoch": 4776} {"train_loss": -26.246198654174805, "global_step": 396486, "epoch": 4776} {"train_loss": -26.36041831970215, "global_step": 396487, "epoch": 4776} {"train_loss": -26.21860694885254, "global_step": 396488, "epoch": 4776} {"train_loss": -26.4702091217041, "global_step": 396489, "epoch": 4776} {"train_loss": -26.38059602300805, "global_step": 396490, "epoch": 4776, "val_loss": 6714578.0} {"train_loss": -24.197866439819336, "global_step": 396491, "epoch": 4777} {"train_loss": -21.459585189819336, "global_step": 396492, "epoch": 4777} {"train_loss": -24.333454132080078, "global_step": 396493, "epoch": 4777} {"train_loss": -24.957494735717773, "global_step": 396494, "epoch": 4777} {"train_loss": -24.859338760375977, "global_step": 396495, "epoch": 4777} {"train_loss": -25.759191513061523, "global_step": 396496, "epoch": 4777} {"train_loss": -24.74256706237793, "global_step": 396497, "epoch": 4777} {"train_loss": -25.74199867248535, "global_step": 396498, "epoch": 4777} {"train_loss": -25.25874137878418, "global_step": 396499, "epoch": 4777} {"train_loss": -25.399656295776367, "global_step": 396500, "epoch": 4777} {"train_loss": -25.859750747680664, "global_step": 396501, "epoch": 4777} {"train_loss": -25.17445182800293, "global_step": 396502, "epoch": 4777} {"train_loss": -25.5664119720459, "global_step": 396503, "epoch": 4777} {"train_loss": -25.81305503845215, "global_step": 396504, "epoch": 4777} {"train_loss": -25.539979934692383, "global_step": 396505, "epoch": 4777} {"train_loss": -25.49618911743164, "global_step": 396506, "epoch": 4777} {"train_loss": -25.53441047668457, "global_step": 396507, "epoch": 4777} {"train_loss": -25.903955459594727, "global_step": 396508, "epoch": 4777} {"train_loss": -26.050107955932617, "global_step": 396509, "epoch": 4777} {"train_loss": -25.943267822265625, "global_step": 396510, "epoch": 4777} {"train_loss": -26.155866622924805, "global_step": 396511, "epoch": 4777} {"train_loss": -26.15167236328125, "global_step": 396512, "epoch": 4777} {"train_loss": -26.040939331054688, "global_step": 396513, "epoch": 4777} {"train_loss": -25.939855575561523, "global_step": 396514, "epoch": 4777} {"train_loss": -25.881210327148438, "global_step": 396515, "epoch": 4777} {"train_loss": -26.167016983032227, "global_step": 396516, "epoch": 4777} {"train_loss": -26.212284088134766, "global_step": 396517, "epoch": 4777} {"train_loss": -26.055435180664062, "global_step": 396518, "epoch": 4777} {"train_loss": -25.74561882019043, "global_step": 396519, "epoch": 4777} {"train_loss": -26.114185333251953, "global_step": 396520, "epoch": 4777} {"train_loss": -26.430505752563477, "global_step": 396521, "epoch": 4777} {"train_loss": -26.104068756103516, "global_step": 396522, "epoch": 4777} {"train_loss": -26.276996612548828, "global_step": 396523, "epoch": 4777} {"train_loss": -26.381078720092773, "global_step": 396524, "epoch": 4777} {"train_loss": -26.1401309967041, "global_step": 396525, "epoch": 4777} {"train_loss": -26.80401611328125, "global_step": 396526, "epoch": 4777} {"train_loss": -26.19977378845215, "global_step": 396527, "epoch": 4777} {"train_loss": -26.5677547454834, "global_step": 396528, "epoch": 4777} {"train_loss": -26.3801326751709, "global_step": 396529, "epoch": 4777} {"train_loss": -26.508996963500977, "global_step": 396530, "epoch": 4777} {"train_loss": -26.258529663085938, "global_step": 396531, "epoch": 4777} {"train_loss": -26.142202377319336, "global_step": 396532, "epoch": 4777} {"train_loss": -26.7121524810791, "global_step": 396533, "epoch": 4777} {"train_loss": -26.609237670898438, "global_step": 396534, "epoch": 4777} {"train_loss": -26.307376861572266, "global_step": 396535, "epoch": 4777} {"train_loss": -26.347156524658203, "global_step": 396536, "epoch": 4777} {"train_loss": -26.564306259155273, "global_step": 396537, "epoch": 4777} {"train_loss": -26.662267684936523, "global_step": 396538, "epoch": 4777} {"train_loss": -26.777063369750977, "global_step": 396539, "epoch": 4777} {"train_loss": -26.48370361328125, "global_step": 396540, "epoch": 4777} {"train_loss": -26.523853302001953, "global_step": 396541, "epoch": 4777} {"train_loss": -26.49664878845215, "global_step": 396542, "epoch": 4777} {"train_loss": -26.63494300842285, "global_step": 396543, "epoch": 4777} {"train_loss": -26.80670166015625, "global_step": 396544, "epoch": 4777} {"train_loss": -26.812482833862305, "global_step": 396545, "epoch": 4777} {"train_loss": -26.192808151245117, "global_step": 396546, "epoch": 4777} {"train_loss": -26.5238094329834, "global_step": 396547, "epoch": 4777} {"train_loss": -26.53264808654785, "global_step": 396548, "epoch": 4777} {"train_loss": -26.7878475189209, "global_step": 396549, "epoch": 4777} {"train_loss": -26.36443519592285, "global_step": 396550, "epoch": 4777} {"train_loss": -26.66358757019043, "global_step": 396551, "epoch": 4777} {"train_loss": -26.813247680664062, "global_step": 396552, "epoch": 4777} {"train_loss": -26.6567440032959, "global_step": 396553, "epoch": 4777} {"train_loss": -26.8528995513916, "global_step": 396554, "epoch": 4777} {"train_loss": -26.3153018951416, "global_step": 396555, "epoch": 4777} {"train_loss": -26.228195190429688, "global_step": 396556, "epoch": 4777} {"train_loss": -26.17044448852539, "global_step": 396557, "epoch": 4777} {"train_loss": -26.651708602905273, "global_step": 396558, "epoch": 4777} {"train_loss": -26.718427658081055, "global_step": 396559, "epoch": 4777} {"train_loss": -26.853885650634766, "global_step": 396560, "epoch": 4777} {"train_loss": -26.25201988220215, "global_step": 396561, "epoch": 4777} {"train_loss": -26.7463321685791, "global_step": 396562, "epoch": 4777} {"train_loss": -26.7884521484375, "global_step": 396563, "epoch": 4777} {"train_loss": -26.873517990112305, "global_step": 396564, "epoch": 4777} {"train_loss": -26.875150680541992, "global_step": 396565, "epoch": 4777} {"train_loss": -26.906265258789062, "global_step": 396566, "epoch": 4777} {"train_loss": -26.48028564453125, "global_step": 396567, "epoch": 4777} {"train_loss": -26.632328033447266, "global_step": 396568, "epoch": 4777} {"train_loss": -26.884122848510742, "global_step": 396569, "epoch": 4777} {"train_loss": -26.829288482666016, "global_step": 396570, "epoch": 4777} {"train_loss": -26.731855392456055, "global_step": 396571, "epoch": 4777} {"train_loss": -26.28057289123535, "global_step": 396572, "epoch": 4777} {"train_loss": -26.172111051628388, "global_step": 396573, "epoch": 4777, "val_loss": 6705862.0} {"train_loss": -26.021488189697266, "global_step": 396574, "epoch": 4778} {"train_loss": -25.54261589050293, "global_step": 396575, "epoch": 4778} {"train_loss": -26.38785171508789, "global_step": 396576, "epoch": 4778} {"train_loss": -25.958908081054688, "global_step": 396577, "epoch": 4778} {"train_loss": -25.87411880493164, "global_step": 396578, "epoch": 4778} {"train_loss": -25.68622398376465, "global_step": 396579, "epoch": 4778} {"train_loss": -25.548675537109375, "global_step": 396580, "epoch": 4778} {"train_loss": -26.240751266479492, "global_step": 396581, "epoch": 4778} {"train_loss": -26.157739639282227, "global_step": 396582, "epoch": 4778} {"train_loss": -25.522342681884766, "global_step": 396583, "epoch": 4778} {"train_loss": -26.150800704956055, "global_step": 396584, "epoch": 4778} {"train_loss": -25.92681884765625, "global_step": 396585, "epoch": 4778} {"train_loss": -26.124500274658203, "global_step": 396586, "epoch": 4778} {"train_loss": -26.33087158203125, "global_step": 396587, "epoch": 4778} {"train_loss": -25.996484756469727, "global_step": 396588, "epoch": 4778} {"train_loss": -26.077878952026367, "global_step": 396589, "epoch": 4778} {"train_loss": -26.1619930267334, "global_step": 396590, "epoch": 4778} {"train_loss": -26.247772216796875, "global_step": 396591, "epoch": 4778} {"train_loss": -26.518512725830078, "global_step": 396592, "epoch": 4778} {"train_loss": -26.37225341796875, "global_step": 396593, "epoch": 4778} {"train_loss": -26.544973373413086, "global_step": 396594, "epoch": 4778} {"train_loss": -26.57159996032715, "global_step": 396595, "epoch": 4778} {"train_loss": -26.6707706451416, "global_step": 396596, "epoch": 4778} {"train_loss": -26.192365646362305, "global_step": 396597, "epoch": 4778} {"train_loss": -26.700973510742188, "global_step": 396598, "epoch": 4778} {"train_loss": -26.79207420349121, "global_step": 396599, "epoch": 4778} {"train_loss": -26.634445190429688, "global_step": 396600, "epoch": 4778} {"train_loss": -26.571142196655273, "global_step": 396601, "epoch": 4778} {"train_loss": -26.405126571655273, "global_step": 396602, "epoch": 4778} {"train_loss": -26.451414108276367, "global_step": 396603, "epoch": 4778} {"train_loss": -26.684370040893555, "global_step": 396604, "epoch": 4778} {"train_loss": -26.829511642456055, "global_step": 396605, "epoch": 4778} {"train_loss": -26.67963218688965, "global_step": 396606, "epoch": 4778} {"train_loss": -26.880359649658203, "global_step": 396607, "epoch": 4778} {"train_loss": -26.41939353942871, "global_step": 396608, "epoch": 4778} {"train_loss": -27.04469108581543, "global_step": 396609, "epoch": 4778} {"train_loss": -26.84047508239746, "global_step": 396610, "epoch": 4778} {"train_loss": -26.716943740844727, "global_step": 396611, "epoch": 4778} {"train_loss": -26.89053726196289, "global_step": 396612, "epoch": 4778} {"train_loss": -26.78058433532715, "global_step": 396613, "epoch": 4778} {"train_loss": -26.807861328125, "global_step": 396614, "epoch": 4778} {"train_loss": -26.11823844909668, "global_step": 396615, "epoch": 4778} {"train_loss": -26.7251033782959, "global_step": 396616, "epoch": 4778} {"train_loss": -26.189416885375977, "global_step": 396617, "epoch": 4778} {"train_loss": -26.681310653686523, "global_step": 396618, "epoch": 4778} {"train_loss": -26.77766990661621, "global_step": 396619, "epoch": 4778} {"train_loss": -26.77069664001465, "global_step": 396620, "epoch": 4778} {"train_loss": -26.35467529296875, "global_step": 396621, "epoch": 4778} {"train_loss": -26.84759521484375, "global_step": 396622, "epoch": 4778} {"train_loss": -26.285974502563477, "global_step": 396623, "epoch": 4778} {"train_loss": -26.528858184814453, "global_step": 396624, "epoch": 4778} {"train_loss": -26.88103675842285, "global_step": 396625, "epoch": 4778} {"train_loss": -26.798505783081055, "global_step": 396626, "epoch": 4778} {"train_loss": -26.77791404724121, "global_step": 396627, "epoch": 4778} {"train_loss": -26.728124618530273, "global_step": 396628, "epoch": 4778} {"train_loss": -26.706823348999023, "global_step": 396629, "epoch": 4778} {"train_loss": -26.904287338256836, "global_step": 396630, "epoch": 4778} {"train_loss": -26.4616641998291, "global_step": 396631, "epoch": 4778} {"train_loss": -26.87908935546875, "global_step": 396632, "epoch": 4778} {"train_loss": -26.631866455078125, "global_step": 396633, "epoch": 4778} {"train_loss": -26.710229873657227, "global_step": 396634, "epoch": 4778} {"train_loss": -26.805082321166992, "global_step": 396635, "epoch": 4778} {"train_loss": -26.661075592041016, "global_step": 396636, "epoch": 4778} {"train_loss": -26.832616806030273, "global_step": 396637, "epoch": 4778} {"train_loss": -26.567672729492188, "global_step": 396638, "epoch": 4778} {"train_loss": -26.559619903564453, "global_step": 396639, "epoch": 4778} {"train_loss": -26.820587158203125, "global_step": 396640, "epoch": 4778} {"train_loss": -26.886926651000977, "global_step": 396641, "epoch": 4778} {"train_loss": -26.757299423217773, "global_step": 396642, "epoch": 4778} {"train_loss": -26.7298526763916, "global_step": 396643, "epoch": 4778} {"train_loss": -26.352706909179688, "global_step": 396644, "epoch": 4778} {"train_loss": -26.586013793945312, "global_step": 396645, "epoch": 4778} {"train_loss": -26.34568214416504, "global_step": 396646, "epoch": 4778} {"train_loss": -26.8934383392334, "global_step": 396647, "epoch": 4778} {"train_loss": -26.770414352416992, "global_step": 396648, "epoch": 4778} {"train_loss": -26.85468864440918, "global_step": 396649, "epoch": 4778} {"train_loss": -26.384082794189453, "global_step": 396650, "epoch": 4778} {"train_loss": -27.044967651367188, "global_step": 396651, "epoch": 4778} {"train_loss": -26.87775993347168, "global_step": 396652, "epoch": 4778} {"train_loss": -26.96624755859375, "global_step": 396653, "epoch": 4778} {"train_loss": -26.662555694580078, "global_step": 396654, "epoch": 4778} {"train_loss": -26.55731201171875, "global_step": 396655, "epoch": 4778} {"train_loss": -26.528947117816973, "global_step": 396656, "epoch": 4778, "val_loss": 6638079.0} {"train_loss": -26.713489532470703, "global_step": 396657, "epoch": 4779} {"train_loss": -26.4184627532959, "global_step": 396658, "epoch": 4779} {"train_loss": -26.012104034423828, "global_step": 396659, "epoch": 4779} {"train_loss": -25.291942596435547, "global_step": 396660, "epoch": 4779} {"train_loss": -25.74256706237793, "global_step": 396661, "epoch": 4779} {"train_loss": -26.449182510375977, "global_step": 396662, "epoch": 4779} {"train_loss": -26.43561363220215, "global_step": 396663, "epoch": 4779} {"train_loss": -26.3319034576416, "global_step": 396664, "epoch": 4779} {"train_loss": -26.43119239807129, "global_step": 396665, "epoch": 4779} {"train_loss": -26.331113815307617, "global_step": 396666, "epoch": 4779} {"train_loss": -26.530054092407227, "global_step": 396667, "epoch": 4779} {"train_loss": -26.470722198486328, "global_step": 396668, "epoch": 4779} {"train_loss": -26.492151260375977, "global_step": 396669, "epoch": 4779} {"train_loss": -26.609289169311523, "global_step": 396670, "epoch": 4779} {"train_loss": -26.335886001586914, "global_step": 396671, "epoch": 4779} {"train_loss": -26.39801597595215, "global_step": 396672, "epoch": 4779} {"train_loss": -26.753026962280273, "global_step": 396673, "epoch": 4779} {"train_loss": -27.00086784362793, "global_step": 396674, "epoch": 4779} {"train_loss": -26.750402450561523, "global_step": 396675, "epoch": 4779} {"train_loss": -26.771652221679688, "global_step": 396676, "epoch": 4779} {"train_loss": -26.70553970336914, "global_step": 396677, "epoch": 4779} {"train_loss": -26.1506404876709, "global_step": 396678, "epoch": 4779} {"train_loss": -26.4360408782959, "global_step": 396679, "epoch": 4779} {"train_loss": -26.52442741394043, "global_step": 396680, "epoch": 4779} {"train_loss": -26.230539321899414, "global_step": 396681, "epoch": 4779} {"train_loss": -26.536563873291016, "global_step": 396682, "epoch": 4779} {"train_loss": -26.160415649414062, "global_step": 396683, "epoch": 4779} {"train_loss": -26.53120231628418, "global_step": 396684, "epoch": 4779} {"train_loss": -26.59381675720215, "global_step": 396685, "epoch": 4779} {"train_loss": -26.554479598999023, "global_step": 396686, "epoch": 4779} {"train_loss": -26.883047103881836, "global_step": 396687, "epoch": 4779} {"train_loss": -26.716068267822266, "global_step": 396688, "epoch": 4779} {"train_loss": -26.793638229370117, "global_step": 396689, "epoch": 4779} {"train_loss": -26.361841201782227, "global_step": 396690, "epoch": 4779} {"train_loss": -26.687707901000977, "global_step": 396691, "epoch": 4779} {"train_loss": -26.4787654876709, "global_step": 396692, "epoch": 4779} {"train_loss": -26.56787109375, "global_step": 396693, "epoch": 4779} {"train_loss": -26.89800453186035, "global_step": 396694, "epoch": 4779} {"train_loss": -26.700275421142578, "global_step": 396695, "epoch": 4779} {"train_loss": -26.6834774017334, "global_step": 396696, "epoch": 4779} {"train_loss": -26.515430450439453, "global_step": 396697, "epoch": 4779} {"train_loss": -26.66339683532715, "global_step": 396698, "epoch": 4779} {"train_loss": -26.697362899780273, "global_step": 396699, "epoch": 4779} {"train_loss": -26.41863441467285, "global_step": 396700, "epoch": 4779} {"train_loss": -26.643524169921875, "global_step": 396701, "epoch": 4779} {"train_loss": -26.824140548706055, "global_step": 396702, "epoch": 4779} {"train_loss": -26.627288818359375, "global_step": 396703, "epoch": 4779} {"train_loss": -26.519229888916016, "global_step": 396704, "epoch": 4779} {"train_loss": -26.586078643798828, "global_step": 396705, "epoch": 4779} {"train_loss": -26.676727294921875, "global_step": 396706, "epoch": 4779} {"train_loss": -26.714221954345703, "global_step": 396707, "epoch": 4779} {"train_loss": -26.802265167236328, "global_step": 396708, "epoch": 4779} {"train_loss": -26.510412216186523, "global_step": 396709, "epoch": 4779} {"train_loss": -26.29786491394043, "global_step": 396710, "epoch": 4779} {"train_loss": -26.561084747314453, "global_step": 396711, "epoch": 4779} {"train_loss": -26.893585205078125, "global_step": 396712, "epoch": 4779} {"train_loss": -26.689666748046875, "global_step": 396713, "epoch": 4779} {"train_loss": -26.559797286987305, "global_step": 396714, "epoch": 4779} {"train_loss": -26.748090744018555, "global_step": 396715, "epoch": 4779} {"train_loss": -26.523778915405273, "global_step": 396716, "epoch": 4779} {"train_loss": -27.144636154174805, "global_step": 396717, "epoch": 4779} {"train_loss": -26.744312286376953, "global_step": 396718, "epoch": 4779} {"train_loss": -26.776824951171875, "global_step": 396719, "epoch": 4779} {"train_loss": -26.38507080078125, "global_step": 396720, "epoch": 4779} {"train_loss": -26.471206665039062, "global_step": 396721, "epoch": 4779} {"train_loss": -26.430587768554688, "global_step": 396722, "epoch": 4779} {"train_loss": -26.434919357299805, "global_step": 396723, "epoch": 4779} {"train_loss": -26.376798629760742, "global_step": 396724, "epoch": 4779} {"train_loss": -26.609039306640625, "global_step": 396725, "epoch": 4779} {"train_loss": -26.75811767578125, "global_step": 396726, "epoch": 4779} {"train_loss": -26.857166290283203, "global_step": 396727, "epoch": 4779} {"train_loss": -26.301074981689453, "global_step": 396728, "epoch": 4779} {"train_loss": -26.395721435546875, "global_step": 396729, "epoch": 4779} {"train_loss": -26.262598037719727, "global_step": 396730, "epoch": 4779} {"train_loss": -26.137775421142578, "global_step": 396731, "epoch": 4779} {"train_loss": -26.77591896057129, "global_step": 396732, "epoch": 4779} {"train_loss": -26.26904296875, "global_step": 396733, "epoch": 4779} {"train_loss": -26.76375389099121, "global_step": 396734, "epoch": 4779} {"train_loss": -26.388275146484375, "global_step": 396735, "epoch": 4779} {"train_loss": -26.555709838867188, "global_step": 396736, "epoch": 4779} {"train_loss": -26.517602920532227, "global_step": 396737, "epoch": 4779} {"train_loss": -26.229639053344727, "global_step": 396738, "epoch": 4779} {"train_loss": -26.53102442729904, "global_step": 396739, "epoch": 4779, "val_loss": 6675047.0} {"train_loss": -26.240726470947266, "global_step": 396740, "epoch": 4780} {"train_loss": -25.52997589111328, "global_step": 396741, "epoch": 4780} {"train_loss": -25.894168853759766, "global_step": 396742, "epoch": 4780} {"train_loss": -25.846704483032227, "global_step": 396743, "epoch": 4780} {"train_loss": -26.2984561920166, "global_step": 396744, "epoch": 4780} {"train_loss": -26.313156127929688, "global_step": 396745, "epoch": 4780} {"train_loss": -26.012563705444336, "global_step": 396746, "epoch": 4780} {"train_loss": -26.214017868041992, "global_step": 396747, "epoch": 4780} {"train_loss": -26.341535568237305, "global_step": 396748, "epoch": 4780} {"train_loss": -26.126245498657227, "global_step": 396749, "epoch": 4780} {"train_loss": -26.167692184448242, "global_step": 396750, "epoch": 4780} {"train_loss": -26.143817901611328, "global_step": 396751, "epoch": 4780} {"train_loss": -26.090290069580078, "global_step": 396752, "epoch": 4780} {"train_loss": -26.130115509033203, "global_step": 396753, "epoch": 4780} {"train_loss": -26.053546905517578, "global_step": 396754, "epoch": 4780} {"train_loss": -26.342578887939453, "global_step": 396755, "epoch": 4780} {"train_loss": -26.631641387939453, "global_step": 396756, "epoch": 4780} {"train_loss": -26.22549819946289, "global_step": 396757, "epoch": 4780} {"train_loss": -26.507699966430664, "global_step": 396758, "epoch": 4780} {"train_loss": -26.384321212768555, "global_step": 396759, "epoch": 4780} {"train_loss": -26.15669059753418, "global_step": 396760, "epoch": 4780} {"train_loss": -26.143970489501953, "global_step": 396761, "epoch": 4780} {"train_loss": -26.295557022094727, "global_step": 396762, "epoch": 4780} {"train_loss": -26.51059341430664, "global_step": 396763, "epoch": 4780} {"train_loss": -26.139434814453125, "global_step": 396764, "epoch": 4780} {"train_loss": -26.595388412475586, "global_step": 396765, "epoch": 4780} {"train_loss": -26.5891170501709, "global_step": 396766, "epoch": 4780} {"train_loss": -26.356414794921875, "global_step": 396767, "epoch": 4780} {"train_loss": -26.557392120361328, "global_step": 396768, "epoch": 4780} {"train_loss": -26.4852352142334, "global_step": 396769, "epoch": 4780} {"train_loss": -26.534337997436523, "global_step": 396770, "epoch": 4780} {"train_loss": -26.628686904907227, "global_step": 396771, "epoch": 4780} {"train_loss": -26.646387100219727, "global_step": 396772, "epoch": 4780} {"train_loss": -26.231861114501953, "global_step": 396773, "epoch": 4780} {"train_loss": -26.297460556030273, "global_step": 396774, "epoch": 4780} {"train_loss": -26.830671310424805, "global_step": 396775, "epoch": 4780} {"train_loss": -26.25813102722168, "global_step": 396776, "epoch": 4780} {"train_loss": -26.81122398376465, "global_step": 396777, "epoch": 4780} {"train_loss": -26.991424560546875, "global_step": 396778, "epoch": 4780} {"train_loss": -26.006921768188477, "global_step": 396779, "epoch": 4780} {"train_loss": -26.373334884643555, "global_step": 396780, "epoch": 4780} {"train_loss": -26.80218505859375, "global_step": 396781, "epoch": 4780} {"train_loss": -26.302753448486328, "global_step": 396782, "epoch": 4780} {"train_loss": -26.772363662719727, "global_step": 396783, "epoch": 4780} {"train_loss": -26.46162223815918, "global_step": 396784, "epoch": 4780} {"train_loss": -26.84708595275879, "global_step": 396785, "epoch": 4780} {"train_loss": -26.686582565307617, "global_step": 396786, "epoch": 4780} {"train_loss": -26.374555587768555, "global_step": 396787, "epoch": 4780} {"train_loss": -26.68165397644043, "global_step": 396788, "epoch": 4780} {"train_loss": -26.48935890197754, "global_step": 396789, "epoch": 4780} {"train_loss": -26.59675407409668, "global_step": 396790, "epoch": 4780} {"train_loss": -26.534423828125, "global_step": 396791, "epoch": 4780} {"train_loss": -26.414052963256836, "global_step": 396792, "epoch": 4780} {"train_loss": -26.4238338470459, "global_step": 396793, "epoch": 4780} {"train_loss": -26.429792404174805, "global_step": 396794, "epoch": 4780} {"train_loss": -26.634668350219727, "global_step": 396795, "epoch": 4780} {"train_loss": -26.63992691040039, "global_step": 396796, "epoch": 4780} {"train_loss": -26.57992935180664, "global_step": 396797, "epoch": 4780} {"train_loss": -26.557260513305664, "global_step": 396798, "epoch": 4780} {"train_loss": -27.0421085357666, "global_step": 396799, "epoch": 4780} {"train_loss": -26.339340209960938, "global_step": 396800, "epoch": 4780} {"train_loss": -26.787479400634766, "global_step": 396801, "epoch": 4780} {"train_loss": -26.604984283447266, "global_step": 396802, "epoch": 4780} {"train_loss": -26.73798942565918, "global_step": 396803, "epoch": 4780} {"train_loss": -26.911701202392578, "global_step": 396804, "epoch": 4780} {"train_loss": -26.517444610595703, "global_step": 396805, "epoch": 4780} {"train_loss": -26.2345027923584, "global_step": 396806, "epoch": 4780} {"train_loss": -26.66108512878418, "global_step": 396807, "epoch": 4780} {"train_loss": -26.60617446899414, "global_step": 396808, "epoch": 4780} {"train_loss": -26.44769287109375, "global_step": 396809, "epoch": 4780} {"train_loss": -26.64389991760254, "global_step": 396810, "epoch": 4780} {"train_loss": -26.890722274780273, "global_step": 396811, "epoch": 4780} {"train_loss": -26.4450740814209, "global_step": 396812, "epoch": 4780} {"train_loss": -26.53622817993164, "global_step": 396813, "epoch": 4780} {"train_loss": -26.43829917907715, "global_step": 396814, "epoch": 4780} {"train_loss": -26.44942283630371, "global_step": 396815, "epoch": 4780} {"train_loss": -26.48244285583496, "global_step": 396816, "epoch": 4780} {"train_loss": -26.605987548828125, "global_step": 396817, "epoch": 4780} {"train_loss": -26.39887809753418, "global_step": 396818, "epoch": 4780} {"train_loss": -26.857797622680664, "global_step": 396819, "epoch": 4780} {"train_loss": -27.17984962463379, "global_step": 396820, "epoch": 4780} {"train_loss": -26.961719512939453, "global_step": 396821, "epoch": 4780} {"train_loss": -26.47188434830631, "global_step": 396822, "epoch": 4780, "val_loss": 6684084.0} {"train_loss": -26.418750762939453, "global_step": 396823, "epoch": 4781} {"train_loss": -26.105865478515625, "global_step": 396824, "epoch": 4781} {"train_loss": -26.376998901367188, "global_step": 396825, "epoch": 4781} {"train_loss": -26.648340225219727, "global_step": 396826, "epoch": 4781} {"train_loss": -26.29168701171875, "global_step": 396827, "epoch": 4781} {"train_loss": -25.925567626953125, "global_step": 396828, "epoch": 4781} {"train_loss": -26.449539184570312, "global_step": 396829, "epoch": 4781} {"train_loss": -26.42633628845215, "global_step": 396830, "epoch": 4781} {"train_loss": -26.486703872680664, "global_step": 396831, "epoch": 4781} {"train_loss": -26.576618194580078, "global_step": 396832, "epoch": 4781} {"train_loss": -26.705801010131836, "global_step": 396833, "epoch": 4781} {"train_loss": -26.688756942749023, "global_step": 396834, "epoch": 4781} {"train_loss": -26.066104888916016, "global_step": 396835, "epoch": 4781} {"train_loss": -26.46611976623535, "global_step": 396836, "epoch": 4781} {"train_loss": -26.7208309173584, "global_step": 396837, "epoch": 4781} {"train_loss": -26.285358428955078, "global_step": 396838, "epoch": 4781} {"train_loss": -26.381973266601562, "global_step": 396839, "epoch": 4781} {"train_loss": -26.4583683013916, "global_step": 396840, "epoch": 4781} {"train_loss": -26.59197425842285, "global_step": 396841, "epoch": 4781} {"train_loss": -26.588088989257812, "global_step": 396842, "epoch": 4781} {"train_loss": -26.236215591430664, "global_step": 396843, "epoch": 4781} {"train_loss": -26.7705020904541, "global_step": 396844, "epoch": 4781} {"train_loss": -26.389902114868164, "global_step": 396845, "epoch": 4781} {"train_loss": -26.89397621154785, "global_step": 396846, "epoch": 4781} {"train_loss": -26.361881256103516, "global_step": 396847, "epoch": 4781} {"train_loss": -26.813512802124023, "global_step": 396848, "epoch": 4781} {"train_loss": -26.68873405456543, "global_step": 396849, "epoch": 4781} {"train_loss": -26.72138023376465, "global_step": 396850, "epoch": 4781} {"train_loss": -26.58454704284668, "global_step": 396851, "epoch": 4781} {"train_loss": -26.656530380249023, "global_step": 396852, "epoch": 4781} {"train_loss": -26.7338809967041, "global_step": 396853, "epoch": 4781} {"train_loss": -27.07966423034668, "global_step": 396854, "epoch": 4781} {"train_loss": -26.665502548217773, "global_step": 396855, "epoch": 4781} {"train_loss": -26.644306182861328, "global_step": 396856, "epoch": 4781} {"train_loss": -26.51466178894043, "global_step": 396857, "epoch": 4781} {"train_loss": -26.792667388916016, "global_step": 396858, "epoch": 4781} {"train_loss": -26.54535484313965, "global_step": 396859, "epoch": 4781} {"train_loss": -26.552448272705078, "global_step": 396860, "epoch": 4781} {"train_loss": -26.551599502563477, "global_step": 396861, "epoch": 4781} {"train_loss": -26.636920928955078, "global_step": 396862, "epoch": 4781} {"train_loss": -26.99580192565918, "global_step": 396863, "epoch": 4781} {"train_loss": -26.737775802612305, "global_step": 396864, "epoch": 4781} {"train_loss": -26.561264038085938, "global_step": 396865, "epoch": 4781} {"train_loss": -26.298542022705078, "global_step": 396866, "epoch": 4781} {"train_loss": -26.956958770751953, "global_step": 396867, "epoch": 4781} {"train_loss": -26.593658447265625, "global_step": 396868, "epoch": 4781} {"train_loss": -26.90888786315918, "global_step": 396869, "epoch": 4781} {"train_loss": -26.4893856048584, "global_step": 396870, "epoch": 4781} {"train_loss": -26.82679557800293, "global_step": 396871, "epoch": 4781} {"train_loss": -26.281848907470703, "global_step": 396872, "epoch": 4781} {"train_loss": -26.29157066345215, "global_step": 396873, "epoch": 4781} {"train_loss": -26.435108184814453, "global_step": 396874, "epoch": 4781} {"train_loss": -26.325658798217773, "global_step": 396875, "epoch": 4781} {"train_loss": -26.743555068969727, "global_step": 396876, "epoch": 4781} {"train_loss": -26.63970947265625, "global_step": 396877, "epoch": 4781} {"train_loss": -26.42665672302246, "global_step": 396878, "epoch": 4781} {"train_loss": -26.467817306518555, "global_step": 396879, "epoch": 4781} {"train_loss": -26.666296005249023, "global_step": 396880, "epoch": 4781} {"train_loss": -26.479944229125977, "global_step": 396881, "epoch": 4781} {"train_loss": -26.713302612304688, "global_step": 396882, "epoch": 4781} {"train_loss": -26.34031105041504, "global_step": 396883, "epoch": 4781} {"train_loss": -26.727020263671875, "global_step": 396884, "epoch": 4781} {"train_loss": -26.855188369750977, "global_step": 396885, "epoch": 4781} {"train_loss": -26.523595809936523, "global_step": 396886, "epoch": 4781} {"train_loss": -26.697729110717773, "global_step": 396887, "epoch": 4781} {"train_loss": -26.8891544342041, "global_step": 396888, "epoch": 4781} {"train_loss": -26.79774284362793, "global_step": 396889, "epoch": 4781} {"train_loss": -26.695112228393555, "global_step": 396890, "epoch": 4781} {"train_loss": -27.08733558654785, "global_step": 396891, "epoch": 4781} {"train_loss": -27.008319854736328, "global_step": 396892, "epoch": 4781} {"train_loss": -26.983245849609375, "global_step": 396893, "epoch": 4781} {"train_loss": -26.50266456604004, "global_step": 396894, "epoch": 4781} {"train_loss": -26.909149169921875, "global_step": 396895, "epoch": 4781} {"train_loss": -26.90760612487793, "global_step": 396896, "epoch": 4781} {"train_loss": -26.923080444335938, "global_step": 396897, "epoch": 4781} {"train_loss": -26.5582332611084, "global_step": 396898, "epoch": 4781} {"train_loss": -26.76653480529785, "global_step": 396899, "epoch": 4781} {"train_loss": -26.539575576782227, "global_step": 396900, "epoch": 4781} {"train_loss": -26.6174259185791, "global_step": 396901, "epoch": 4781} {"train_loss": -26.744958877563477, "global_step": 396902, "epoch": 4781} {"train_loss": -26.80364418029785, "global_step": 396903, "epoch": 4781} {"train_loss": -26.578266143798828, "global_step": 396904, "epoch": 4781} {"train_loss": -26.642012331859174, "global_step": 396905, "epoch": 4781, "val_loss": 6707480.0} {"train_loss": -24.903949737548828, "global_step": 396906, "epoch": 4782} {"train_loss": -22.722875595092773, "global_step": 396907, "epoch": 4782} {"train_loss": -21.35580062866211, "global_step": 396908, "epoch": 4782} {"train_loss": -25.001750946044922, "global_step": 396909, "epoch": 4782} {"train_loss": -25.166440963745117, "global_step": 396910, "epoch": 4782} {"train_loss": -24.635387420654297, "global_step": 396911, "epoch": 4782} {"train_loss": -25.120765686035156, "global_step": 396912, "epoch": 4782} {"train_loss": -24.851526260375977, "global_step": 396913, "epoch": 4782} {"train_loss": -25.342952728271484, "global_step": 396914, "epoch": 4782} {"train_loss": -25.540451049804688, "global_step": 396915, "epoch": 4782} {"train_loss": -25.25651741027832, "global_step": 396916, "epoch": 4782} {"train_loss": -26.223962783813477, "global_step": 396917, "epoch": 4782} {"train_loss": -25.6865291595459, "global_step": 396918, "epoch": 4782} {"train_loss": -25.765491485595703, "global_step": 396919, "epoch": 4782} {"train_loss": -26.02174186706543, "global_step": 396920, "epoch": 4782} {"train_loss": -25.74201774597168, "global_step": 396921, "epoch": 4782} {"train_loss": -25.866910934448242, "global_step": 396922, "epoch": 4782} {"train_loss": -25.692920684814453, "global_step": 396923, "epoch": 4782} {"train_loss": -25.864416122436523, "global_step": 396924, "epoch": 4782} {"train_loss": -26.12916374206543, "global_step": 396925, "epoch": 4782} {"train_loss": -25.91413688659668, "global_step": 396926, "epoch": 4782} {"train_loss": -26.15484046936035, "global_step": 396927, "epoch": 4782} {"train_loss": -26.0111083984375, "global_step": 396928, "epoch": 4782} {"train_loss": -26.095264434814453, "global_step": 396929, "epoch": 4782} {"train_loss": -25.83534812927246, "global_step": 396930, "epoch": 4782} {"train_loss": -26.383380889892578, "global_step": 396931, "epoch": 4782} {"train_loss": -25.875532150268555, "global_step": 396932, "epoch": 4782} {"train_loss": -26.16501808166504, "global_step": 396933, "epoch": 4782} {"train_loss": -26.4136905670166, "global_step": 396934, "epoch": 4782} {"train_loss": -26.0997257232666, "global_step": 396935, "epoch": 4782} {"train_loss": -26.681833267211914, "global_step": 396936, "epoch": 4782} {"train_loss": -26.116535186767578, "global_step": 396937, "epoch": 4782} {"train_loss": -26.334699630737305, "global_step": 396938, "epoch": 4782} {"train_loss": -26.388696670532227, "global_step": 396939, "epoch": 4782} {"train_loss": -26.12006187438965, "global_step": 396940, "epoch": 4782} {"train_loss": -26.4637393951416, "global_step": 396941, "epoch": 4782} {"train_loss": -26.50276756286621, "global_step": 396942, "epoch": 4782} {"train_loss": -26.153711318969727, "global_step": 396943, "epoch": 4782} {"train_loss": -26.63800048828125, "global_step": 396944, "epoch": 4782} {"train_loss": -26.348676681518555, "global_step": 396945, "epoch": 4782} {"train_loss": -26.6700439453125, "global_step": 396946, "epoch": 4782} {"train_loss": -26.332782745361328, "global_step": 396947, "epoch": 4782} {"train_loss": -26.5535945892334, "global_step": 396948, "epoch": 4782} {"train_loss": -26.560903549194336, "global_step": 396949, "epoch": 4782} {"train_loss": -26.716445922851562, "global_step": 396950, "epoch": 4782} {"train_loss": -26.544071197509766, "global_step": 396951, "epoch": 4782} {"train_loss": -26.563495635986328, "global_step": 396952, "epoch": 4782} {"train_loss": -26.59710121154785, "global_step": 396953, "epoch": 4782} {"train_loss": -26.630722045898438, "global_step": 396954, "epoch": 4782} {"train_loss": -26.456470489501953, "global_step": 396955, "epoch": 4782} {"train_loss": -26.783288955688477, "global_step": 396956, "epoch": 4782} {"train_loss": -26.77848243713379, "global_step": 396957, "epoch": 4782} {"train_loss": -26.537113189697266, "global_step": 396958, "epoch": 4782} {"train_loss": -26.452850341796875, "global_step": 396959, "epoch": 4782} {"train_loss": -26.62687110900879, "global_step": 396960, "epoch": 4782} {"train_loss": -26.677093505859375, "global_step": 396961, "epoch": 4782} {"train_loss": -26.881017684936523, "global_step": 396962, "epoch": 4782} {"train_loss": -26.710500717163086, "global_step": 396963, "epoch": 4782} {"train_loss": -26.878320693969727, "global_step": 396964, "epoch": 4782} {"train_loss": -26.464679718017578, "global_step": 396965, "epoch": 4782} {"train_loss": -26.710294723510742, "global_step": 396966, "epoch": 4782} {"train_loss": -26.4023380279541, "global_step": 396967, "epoch": 4782} {"train_loss": -27.02899169921875, "global_step": 396968, "epoch": 4782} {"train_loss": -26.873218536376953, "global_step": 396969, "epoch": 4782} {"train_loss": -26.775211334228516, "global_step": 396970, "epoch": 4782} {"train_loss": -27.076589584350586, "global_step": 396971, "epoch": 4782} {"train_loss": -26.933094024658203, "global_step": 396972, "epoch": 4782} {"train_loss": -26.730512619018555, "global_step": 396973, "epoch": 4782} {"train_loss": -27.2258358001709, "global_step": 396974, "epoch": 4782} {"train_loss": -26.59144401550293, "global_step": 396975, "epoch": 4782} {"train_loss": -26.730844497680664, "global_step": 396976, "epoch": 4782} {"train_loss": -26.832061767578125, "global_step": 396977, "epoch": 4782} {"train_loss": -26.77326011657715, "global_step": 396978, "epoch": 4782} {"train_loss": -26.316425323486328, "global_step": 396979, "epoch": 4782} {"train_loss": -26.601043701171875, "global_step": 396980, "epoch": 4782} {"train_loss": -26.7947998046875, "global_step": 396981, "epoch": 4782} {"train_loss": -26.68698501586914, "global_step": 396982, "epoch": 4782} {"train_loss": -26.8551025390625, "global_step": 396983, "epoch": 4782} {"train_loss": -26.772146224975586, "global_step": 396984, "epoch": 4782} {"train_loss": -26.597061157226562, "global_step": 396985, "epoch": 4782} {"train_loss": -26.7987117767334, "global_step": 396986, "epoch": 4782} {"train_loss": -26.672086715698242, "global_step": 396987, "epoch": 4782} {"train_loss": -26.201709586453724, "global_step": 396988, "epoch": 4782, "val_loss": 6587580.0} {"train_loss": -26.303974151611328, "global_step": 396989, "epoch": 4783} {"train_loss": -25.936172485351562, "global_step": 396990, "epoch": 4783} {"train_loss": -25.656299591064453, "global_step": 396991, "epoch": 4783} {"train_loss": -25.994998931884766, "global_step": 396992, "epoch": 4783} {"train_loss": -26.440204620361328, "global_step": 396993, "epoch": 4783} {"train_loss": -26.139341354370117, "global_step": 396994, "epoch": 4783} {"train_loss": -25.325984954833984, "global_step": 396995, "epoch": 4783} {"train_loss": -25.878101348876953, "global_step": 396996, "epoch": 4783} {"train_loss": -26.337997436523438, "global_step": 396997, "epoch": 4783} {"train_loss": -26.220544815063477, "global_step": 396998, "epoch": 4783} {"train_loss": -26.131113052368164, "global_step": 396999, "epoch": 4783} {"train_loss": -26.407739639282227, "global_step": 397000, "epoch": 4783} {"train_loss": -26.243682861328125, "global_step": 397001, "epoch": 4783} {"train_loss": -26.34498405456543, "global_step": 397002, "epoch": 4783} {"train_loss": -26.403366088867188, "global_step": 397003, "epoch": 4783} {"train_loss": -26.19818687438965, "global_step": 397004, "epoch": 4783} {"train_loss": -26.606897354125977, "global_step": 397005, "epoch": 4783} {"train_loss": -26.453527450561523, "global_step": 397006, "epoch": 4783} {"train_loss": -26.610931396484375, "global_step": 397007, "epoch": 4783} {"train_loss": -26.323333740234375, "global_step": 397008, "epoch": 4783} {"train_loss": -26.740182876586914, "global_step": 397009, "epoch": 4783} {"train_loss": -26.687780380249023, "global_step": 397010, "epoch": 4783} {"train_loss": -26.451208114624023, "global_step": 397011, "epoch": 4783} {"train_loss": -26.5936222076416, "global_step": 397012, "epoch": 4783} {"train_loss": -26.5806941986084, "global_step": 397013, "epoch": 4783} {"train_loss": -26.342329025268555, "global_step": 397014, "epoch": 4783} {"train_loss": -26.456466674804688, "global_step": 397015, "epoch": 4783} {"train_loss": -26.55376625061035, "global_step": 397016, "epoch": 4783} {"train_loss": -26.508520126342773, "global_step": 397017, "epoch": 4783} {"train_loss": -26.819684982299805, "global_step": 397018, "epoch": 4783} {"train_loss": -26.53086280822754, "global_step": 397019, "epoch": 4783} {"train_loss": -26.808231353759766, "global_step": 397020, "epoch": 4783} {"train_loss": -26.44744873046875, "global_step": 397021, "epoch": 4783} {"train_loss": -26.601715087890625, "global_step": 397022, "epoch": 4783} {"train_loss": -26.528608322143555, "global_step": 397023, "epoch": 4783} {"train_loss": -26.76582908630371, "global_step": 397024, "epoch": 4783} {"train_loss": -26.660633087158203, "global_step": 397025, "epoch": 4783} {"train_loss": -26.546741485595703, "global_step": 397026, "epoch": 4783} {"train_loss": -26.797964096069336, "global_step": 397027, "epoch": 4783} {"train_loss": -26.384174346923828, "global_step": 397028, "epoch": 4783} {"train_loss": -26.545944213867188, "global_step": 397029, "epoch": 4783} {"train_loss": -26.9010009765625, "global_step": 397030, "epoch": 4783} {"train_loss": -26.465993881225586, "global_step": 397031, "epoch": 4783} {"train_loss": -26.4495849609375, "global_step": 397032, "epoch": 4783} {"train_loss": -26.660263061523438, "global_step": 397033, "epoch": 4783} {"train_loss": -26.206846237182617, "global_step": 397034, "epoch": 4783} {"train_loss": -26.620508193969727, "global_step": 397035, "epoch": 4783} {"train_loss": -26.7796630859375, "global_step": 397036, "epoch": 4783} {"train_loss": -26.58111572265625, "global_step": 397037, "epoch": 4783} {"train_loss": -26.99713706970215, "global_step": 397038, "epoch": 4783} {"train_loss": -26.46462059020996, "global_step": 397039, "epoch": 4783} {"train_loss": -27.197553634643555, "global_step": 397040, "epoch": 4783} {"train_loss": -26.8817081451416, "global_step": 397041, "epoch": 4783} {"train_loss": -27.032058715820312, "global_step": 397042, "epoch": 4783} {"train_loss": -26.965356826782227, "global_step": 397043, "epoch": 4783} {"train_loss": -27.14658546447754, "global_step": 397044, "epoch": 4783} {"train_loss": -26.707273483276367, "global_step": 397045, "epoch": 4783} {"train_loss": -26.670719146728516, "global_step": 397046, "epoch": 4783} {"train_loss": -26.78485679626465, "global_step": 397047, "epoch": 4783} {"train_loss": -26.737375259399414, "global_step": 397048, "epoch": 4783} {"train_loss": -26.795852661132812, "global_step": 397049, "epoch": 4783} {"train_loss": -26.600255966186523, "global_step": 397050, "epoch": 4783} {"train_loss": -26.952062606811523, "global_step": 397051, "epoch": 4783} {"train_loss": -26.81744384765625, "global_step": 397052, "epoch": 4783} {"train_loss": -26.75615882873535, "global_step": 397053, "epoch": 4783} {"train_loss": -26.812658309936523, "global_step": 397054, "epoch": 4783} {"train_loss": -26.84893798828125, "global_step": 397055, "epoch": 4783} {"train_loss": -26.8017635345459, "global_step": 397056, "epoch": 4783} {"train_loss": -26.86713218688965, "global_step": 397057, "epoch": 4783} {"train_loss": -26.643569946289062, "global_step": 397058, "epoch": 4783} {"train_loss": -26.501867294311523, "global_step": 397059, "epoch": 4783} {"train_loss": -25.761932373046875, "global_step": 397060, "epoch": 4783} {"train_loss": -25.50118064880371, "global_step": 397061, "epoch": 4783} {"train_loss": -25.511695861816406, "global_step": 397062, "epoch": 4783} {"train_loss": -26.578933715820312, "global_step": 397063, "epoch": 4783} {"train_loss": -26.644611358642578, "global_step": 397064, "epoch": 4783} {"train_loss": -25.886091232299805, "global_step": 397065, "epoch": 4783} {"train_loss": -26.2581729888916, "global_step": 397066, "epoch": 4783} {"train_loss": -26.466032028198242, "global_step": 397067, "epoch": 4783} {"train_loss": -26.58762550354004, "global_step": 397068, "epoch": 4783} {"train_loss": -26.370777130126953, "global_step": 397069, "epoch": 4783} {"train_loss": -26.287168502807617, "global_step": 397070, "epoch": 4783} {"train_loss": -26.506710121430547, "global_step": 397071, "epoch": 4783, "val_loss": 6663494.0} {"train_loss": -25.878116607666016, "global_step": 397072, "epoch": 4784} {"train_loss": -26.08111000061035, "global_step": 397073, "epoch": 4784} {"train_loss": -25.98487663269043, "global_step": 397074, "epoch": 4784} {"train_loss": -26.167938232421875, "global_step": 397075, "epoch": 4784} {"train_loss": -25.84358024597168, "global_step": 397076, "epoch": 4784} {"train_loss": -26.118118286132812, "global_step": 397077, "epoch": 4784} {"train_loss": -26.018146514892578, "global_step": 397078, "epoch": 4784} {"train_loss": -25.815174102783203, "global_step": 397079, "epoch": 4784} {"train_loss": -26.03248405456543, "global_step": 397080, "epoch": 4784} {"train_loss": -26.311838150024414, "global_step": 397081, "epoch": 4784} {"train_loss": -26.001129150390625, "global_step": 397082, "epoch": 4784} {"train_loss": -25.944583892822266, "global_step": 397083, "epoch": 4784} {"train_loss": -26.047826766967773, "global_step": 397084, "epoch": 4784} {"train_loss": -26.308496475219727, "global_step": 397085, "epoch": 4784} {"train_loss": -25.96685218811035, "global_step": 397086, "epoch": 4784} {"train_loss": -26.14630699157715, "global_step": 397087, "epoch": 4784} {"train_loss": -26.551361083984375, "global_step": 397088, "epoch": 4784} {"train_loss": -26.34381103515625, "global_step": 397089, "epoch": 4784} {"train_loss": -26.415897369384766, "global_step": 397090, "epoch": 4784} {"train_loss": -26.350269317626953, "global_step": 397091, "epoch": 4784} {"train_loss": -26.20511817932129, "global_step": 397092, "epoch": 4784} {"train_loss": -26.661413192749023, "global_step": 397093, "epoch": 4784} {"train_loss": -26.667821884155273, "global_step": 397094, "epoch": 4784} {"train_loss": -26.026037216186523, "global_step": 397095, "epoch": 4784} {"train_loss": -26.144184112548828, "global_step": 397096, "epoch": 4784} {"train_loss": -26.198766708374023, "global_step": 397097, "epoch": 4784} {"train_loss": -26.564279556274414, "global_step": 397098, "epoch": 4784} {"train_loss": -26.59882926940918, "global_step": 397099, "epoch": 4784} {"train_loss": -26.424182891845703, "global_step": 397100, "epoch": 4784} {"train_loss": -26.194488525390625, "global_step": 397101, "epoch": 4784} {"train_loss": -26.01331901550293, "global_step": 397102, "epoch": 4784} {"train_loss": -26.341703414916992, "global_step": 397103, "epoch": 4784} {"train_loss": -26.586645126342773, "global_step": 397104, "epoch": 4784} {"train_loss": -26.467426300048828, "global_step": 397105, "epoch": 4784} {"train_loss": -26.526899337768555, "global_step": 397106, "epoch": 4784} {"train_loss": -26.663742065429688, "global_step": 397107, "epoch": 4784} {"train_loss": -26.228612899780273, "global_step": 397108, "epoch": 4784} {"train_loss": -26.615692138671875, "global_step": 397109, "epoch": 4784} {"train_loss": -26.581769943237305, "global_step": 397110, "epoch": 4784} {"train_loss": -26.8353271484375, "global_step": 397111, "epoch": 4784} {"train_loss": -26.537439346313477, "global_step": 397112, "epoch": 4784} {"train_loss": -26.53944969177246, "global_step": 397113, "epoch": 4784} {"train_loss": -26.872121810913086, "global_step": 397114, "epoch": 4784} {"train_loss": -26.391286849975586, "global_step": 397115, "epoch": 4784} {"train_loss": -26.566329956054688, "global_step": 397116, "epoch": 4784} {"train_loss": -26.961984634399414, "global_step": 397117, "epoch": 4784} {"train_loss": -26.49175453186035, "global_step": 397118, "epoch": 4784} {"train_loss": -26.73697853088379, "global_step": 397119, "epoch": 4784} {"train_loss": -26.834409713745117, "global_step": 397120, "epoch": 4784} {"train_loss": -27.09963035583496, "global_step": 397121, "epoch": 4784} {"train_loss": -26.600866317749023, "global_step": 397122, "epoch": 4784} {"train_loss": -26.99708366394043, "global_step": 397123, "epoch": 4784} {"train_loss": -26.358631134033203, "global_step": 397124, "epoch": 4784} {"train_loss": -26.213544845581055, "global_step": 397125, "epoch": 4784} {"train_loss": -26.91158103942871, "global_step": 397126, "epoch": 4784} {"train_loss": -26.875091552734375, "global_step": 397127, "epoch": 4784} {"train_loss": -26.662220001220703, "global_step": 397128, "epoch": 4784} {"train_loss": -26.488269805908203, "global_step": 397129, "epoch": 4784} {"train_loss": -26.680139541625977, "global_step": 397130, "epoch": 4784} {"train_loss": -26.7178955078125, "global_step": 397131, "epoch": 4784} {"train_loss": -26.81915855407715, "global_step": 397132, "epoch": 4784} {"train_loss": -26.687713623046875, "global_step": 397133, "epoch": 4784} {"train_loss": -26.281417846679688, "global_step": 397134, "epoch": 4784} {"train_loss": -26.541351318359375, "global_step": 397135, "epoch": 4784} {"train_loss": -26.318267822265625, "global_step": 397136, "epoch": 4784} {"train_loss": -26.073633193969727, "global_step": 397137, "epoch": 4784} {"train_loss": -26.341215133666992, "global_step": 397138, "epoch": 4784} {"train_loss": -26.68916130065918, "global_step": 397139, "epoch": 4784} {"train_loss": -26.278812408447266, "global_step": 397140, "epoch": 4784} {"train_loss": -26.503143310546875, "global_step": 397141, "epoch": 4784} {"train_loss": -26.624866485595703, "global_step": 397142, "epoch": 4784} {"train_loss": -26.4376163482666, "global_step": 397143, "epoch": 4784} {"train_loss": -26.4896240234375, "global_step": 397144, "epoch": 4784} {"train_loss": -26.52850341796875, "global_step": 397145, "epoch": 4784} {"train_loss": -26.73610496520996, "global_step": 397146, "epoch": 4784} {"train_loss": -25.870397567749023, "global_step": 397147, "epoch": 4784} {"train_loss": -26.565454483032227, "global_step": 397148, "epoch": 4784} {"train_loss": -26.301898956298828, "global_step": 397149, "epoch": 4784} {"train_loss": -26.56083106994629, "global_step": 397150, "epoch": 4784} {"train_loss": -26.300811767578125, "global_step": 397151, "epoch": 4784} {"train_loss": -26.883747100830078, "global_step": 397152, "epoch": 4784} {"train_loss": -26.444604873657227, "global_step": 397153, "epoch": 4784} {"train_loss": -26.430932378194417, "global_step": 397154, "epoch": 4784, "val_loss": 6815908.5} {"train_loss": -26.177289962768555, "global_step": 397155, "epoch": 4785} {"train_loss": -25.500030517578125, "global_step": 397156, "epoch": 4785} {"train_loss": -26.054357528686523, "global_step": 397157, "epoch": 4785} {"train_loss": -25.891061782836914, "global_step": 397158, "epoch": 4785} {"train_loss": -26.46967887878418, "global_step": 397159, "epoch": 4785} {"train_loss": -26.1419620513916, "global_step": 397160, "epoch": 4785} {"train_loss": -26.58668327331543, "global_step": 397161, "epoch": 4785} {"train_loss": -26.112518310546875, "global_step": 397162, "epoch": 4785} {"train_loss": -26.14032554626465, "global_step": 397163, "epoch": 4785} {"train_loss": -26.277591705322266, "global_step": 397164, "epoch": 4785} {"train_loss": -25.938955307006836, "global_step": 397165, "epoch": 4785} {"train_loss": -26.02595329284668, "global_step": 397166, "epoch": 4785} {"train_loss": -26.514636993408203, "global_step": 397167, "epoch": 4785} {"train_loss": -26.21976661682129, "global_step": 397168, "epoch": 4785} {"train_loss": -26.040374755859375, "global_step": 397169, "epoch": 4785} {"train_loss": -26.388071060180664, "global_step": 397170, "epoch": 4785} {"train_loss": -26.40919303894043, "global_step": 397171, "epoch": 4785} {"train_loss": -26.147363662719727, "global_step": 397172, "epoch": 4785} {"train_loss": -26.650360107421875, "global_step": 397173, "epoch": 4785} {"train_loss": -26.4571475982666, "global_step": 397174, "epoch": 4785} {"train_loss": -26.456266403198242, "global_step": 397175, "epoch": 4785} {"train_loss": -26.751312255859375, "global_step": 397176, "epoch": 4785} {"train_loss": -26.379104614257812, "global_step": 397177, "epoch": 4785} {"train_loss": -26.700056076049805, "global_step": 397178, "epoch": 4785} {"train_loss": -26.33315086364746, "global_step": 397179, "epoch": 4785} {"train_loss": -26.501605987548828, "global_step": 397180, "epoch": 4785} {"train_loss": -26.372716903686523, "global_step": 397181, "epoch": 4785} {"train_loss": -26.524219512939453, "global_step": 397182, "epoch": 4785} {"train_loss": -26.711841583251953, "global_step": 397183, "epoch": 4785} {"train_loss": -26.85172462463379, "global_step": 397184, "epoch": 4785} {"train_loss": -26.554712295532227, "global_step": 397185, "epoch": 4785} {"train_loss": -26.76413345336914, "global_step": 397186, "epoch": 4785} {"train_loss": -26.878324508666992, "global_step": 397187, "epoch": 4785} {"train_loss": -26.706830978393555, "global_step": 397188, "epoch": 4785} {"train_loss": -26.709400177001953, "global_step": 397189, "epoch": 4785} {"train_loss": -26.849348068237305, "global_step": 397190, "epoch": 4785} {"train_loss": -26.777576446533203, "global_step": 397191, "epoch": 4785} {"train_loss": -26.701597213745117, "global_step": 397192, "epoch": 4785} {"train_loss": -26.7922420501709, "global_step": 397193, "epoch": 4785} {"train_loss": -26.445722579956055, "global_step": 397194, "epoch": 4785} {"train_loss": -26.720693588256836, "global_step": 397195, "epoch": 4785} {"train_loss": -26.6904296875, "global_step": 397196, "epoch": 4785} {"train_loss": -26.620895385742188, "global_step": 397197, "epoch": 4785} {"train_loss": -26.850971221923828, "global_step": 397198, "epoch": 4785} {"train_loss": -26.81509780883789, "global_step": 397199, "epoch": 4785} {"train_loss": -26.756254196166992, "global_step": 397200, "epoch": 4785} {"train_loss": -26.774799346923828, "global_step": 397201, "epoch": 4785} {"train_loss": -26.88477897644043, "global_step": 397202, "epoch": 4785} {"train_loss": -27.099340438842773, "global_step": 397203, "epoch": 4785} {"train_loss": -26.9263858795166, "global_step": 397204, "epoch": 4785} {"train_loss": -27.086288452148438, "global_step": 397205, "epoch": 4785} {"train_loss": -27.06031608581543, "global_step": 397206, "epoch": 4785} {"train_loss": -26.890546798706055, "global_step": 397207, "epoch": 4785} {"train_loss": -26.733325958251953, "global_step": 397208, "epoch": 4785} {"train_loss": -26.55232048034668, "global_step": 397209, "epoch": 4785} {"train_loss": -26.591583251953125, "global_step": 397210, "epoch": 4785} {"train_loss": -27.051624298095703, "global_step": 397211, "epoch": 4785} {"train_loss": -26.719221115112305, "global_step": 397212, "epoch": 4785} {"train_loss": -26.564239501953125, "global_step": 397213, "epoch": 4785} {"train_loss": -26.618030548095703, "global_step": 397214, "epoch": 4785} {"train_loss": -26.753751754760742, "global_step": 397215, "epoch": 4785} {"train_loss": -26.899063110351562, "global_step": 397216, "epoch": 4785} {"train_loss": -26.69447135925293, "global_step": 397217, "epoch": 4785} {"train_loss": -26.797119140625, "global_step": 397218, "epoch": 4785} {"train_loss": -26.479421615600586, "global_step": 397219, "epoch": 4785} {"train_loss": -26.74152946472168, "global_step": 397220, "epoch": 4785} {"train_loss": -26.662282943725586, "global_step": 397221, "epoch": 4785} {"train_loss": -26.540319442749023, "global_step": 397222, "epoch": 4785} {"train_loss": -26.658309936523438, "global_step": 397223, "epoch": 4785} {"train_loss": -25.954137802124023, "global_step": 397224, "epoch": 4785} {"train_loss": -26.62264060974121, "global_step": 397225, "epoch": 4785} {"train_loss": -26.81365394592285, "global_step": 397226, "epoch": 4785} {"train_loss": -26.338642120361328, "global_step": 397227, "epoch": 4785} {"train_loss": -25.57257652282715, "global_step": 397228, "epoch": 4785} {"train_loss": -26.318256378173828, "global_step": 397229, "epoch": 4785} {"train_loss": -26.823484420776367, "global_step": 397230, "epoch": 4785} {"train_loss": -26.242334365844727, "global_step": 397231, "epoch": 4785} {"train_loss": -26.096527099609375, "global_step": 397232, "epoch": 4785} {"train_loss": -26.537534713745117, "global_step": 397233, "epoch": 4785} {"train_loss": -26.0189208984375, "global_step": 397234, "epoch": 4785} {"train_loss": -25.7504940032959, "global_step": 397235, "epoch": 4785} {"train_loss": -26.410419464111328, "global_step": 397236, "epoch": 4785} {"train_loss": -26.529295817915216, "global_step": 397237, "epoch": 4785, "val_loss": 6771867.0} {"train_loss": -26.471364974975586, "global_step": 397238, "epoch": 4786} {"train_loss": -26.092132568359375, "global_step": 397239, "epoch": 4786} {"train_loss": -26.217975616455078, "global_step": 397240, "epoch": 4786} {"train_loss": -26.171743392944336, "global_step": 397241, "epoch": 4786} {"train_loss": -26.1683349609375, "global_step": 397242, "epoch": 4786} {"train_loss": -25.905670166015625, "global_step": 397243, "epoch": 4786} {"train_loss": -26.161712646484375, "global_step": 397244, "epoch": 4786} {"train_loss": -26.01093101501465, "global_step": 397245, "epoch": 4786} {"train_loss": -26.1578426361084, "global_step": 397246, "epoch": 4786} {"train_loss": -26.300058364868164, "global_step": 397247, "epoch": 4786} {"train_loss": -26.077774047851562, "global_step": 397248, "epoch": 4786} {"train_loss": -26.119964599609375, "global_step": 397249, "epoch": 4786} {"train_loss": -25.825138092041016, "global_step": 397250, "epoch": 4786} {"train_loss": -25.947769165039062, "global_step": 397251, "epoch": 4786} {"train_loss": -26.337244033813477, "global_step": 397252, "epoch": 4786} {"train_loss": -25.984655380249023, "global_step": 397253, "epoch": 4786} {"train_loss": -25.88449478149414, "global_step": 397254, "epoch": 4786} {"train_loss": -26.300012588500977, "global_step": 397255, "epoch": 4786} {"train_loss": -26.26551628112793, "global_step": 397256, "epoch": 4786} {"train_loss": -26.064085006713867, "global_step": 397257, "epoch": 4786} {"train_loss": -26.615814208984375, "global_step": 397258, "epoch": 4786} {"train_loss": -26.186756134033203, "global_step": 397259, "epoch": 4786} {"train_loss": -26.0289363861084, "global_step": 397260, "epoch": 4786} {"train_loss": -26.636579513549805, "global_step": 397261, "epoch": 4786} {"train_loss": -26.389997482299805, "global_step": 397262, "epoch": 4786} {"train_loss": -26.7218017578125, "global_step": 397263, "epoch": 4786} {"train_loss": -26.455204010009766, "global_step": 397264, "epoch": 4786} {"train_loss": -26.3746395111084, "global_step": 397265, "epoch": 4786} {"train_loss": -26.307910919189453, "global_step": 397266, "epoch": 4786} {"train_loss": -26.174936294555664, "global_step": 397267, "epoch": 4786} {"train_loss": -26.278181076049805, "global_step": 397268, "epoch": 4786} {"train_loss": -26.47104835510254, "global_step": 397269, "epoch": 4786} {"train_loss": -26.838266372680664, "global_step": 397270, "epoch": 4786} {"train_loss": -26.417285919189453, "global_step": 397271, "epoch": 4786} {"train_loss": -26.45699119567871, "global_step": 397272, "epoch": 4786} {"train_loss": -26.444665908813477, "global_step": 397273, "epoch": 4786} {"train_loss": -26.561614990234375, "global_step": 397274, "epoch": 4786} {"train_loss": -26.603363037109375, "global_step": 397275, "epoch": 4786} {"train_loss": -26.81598472595215, "global_step": 397276, "epoch": 4786} {"train_loss": -26.743371963500977, "global_step": 397277, "epoch": 4786} {"train_loss": -26.709707260131836, "global_step": 397278, "epoch": 4786} {"train_loss": -26.65289878845215, "global_step": 397279, "epoch": 4786} {"train_loss": -26.705224990844727, "global_step": 397280, "epoch": 4786} {"train_loss": -26.44866371154785, "global_step": 397281, "epoch": 4786} {"train_loss": -26.8327579498291, "global_step": 397282, "epoch": 4786} {"train_loss": -26.39226722717285, "global_step": 397283, "epoch": 4786} {"train_loss": -26.654661178588867, "global_step": 397284, "epoch": 4786} {"train_loss": -26.679113388061523, "global_step": 397285, "epoch": 4786} {"train_loss": -26.625873565673828, "global_step": 397286, "epoch": 4786} {"train_loss": -26.832075119018555, "global_step": 397287, "epoch": 4786} {"train_loss": -26.759063720703125, "global_step": 397288, "epoch": 4786} {"train_loss": -26.87080955505371, "global_step": 397289, "epoch": 4786} {"train_loss": -26.862913131713867, "global_step": 397290, "epoch": 4786} {"train_loss": -26.61310386657715, "global_step": 397291, "epoch": 4786} {"train_loss": -26.723291397094727, "global_step": 397292, "epoch": 4786} {"train_loss": -26.96076011657715, "global_step": 397293, "epoch": 4786} {"train_loss": -27.0120792388916, "global_step": 397294, "epoch": 4786} {"train_loss": -27.1500301361084, "global_step": 397295, "epoch": 4786} {"train_loss": -26.857837677001953, "global_step": 397296, "epoch": 4786} {"train_loss": -27.023447036743164, "global_step": 397297, "epoch": 4786} {"train_loss": -26.944318771362305, "global_step": 397298, "epoch": 4786} {"train_loss": -26.998682022094727, "global_step": 397299, "epoch": 4786} {"train_loss": -26.931976318359375, "global_step": 397300, "epoch": 4786} {"train_loss": -26.68182945251465, "global_step": 397301, "epoch": 4786} {"train_loss": -26.677228927612305, "global_step": 397302, "epoch": 4786} {"train_loss": -26.760242462158203, "global_step": 397303, "epoch": 4786} {"train_loss": -26.230422973632812, "global_step": 397304, "epoch": 4786} {"train_loss": -25.90662956237793, "global_step": 397305, "epoch": 4786} {"train_loss": -25.91914176940918, "global_step": 397306, "epoch": 4786} {"train_loss": -26.337888717651367, "global_step": 397307, "epoch": 4786} {"train_loss": -26.44978904724121, "global_step": 397308, "epoch": 4786} {"train_loss": -26.20527458190918, "global_step": 397309, "epoch": 4786} {"train_loss": -26.433008193969727, "global_step": 397310, "epoch": 4786} {"train_loss": -26.318378448486328, "global_step": 397311, "epoch": 4786} {"train_loss": -26.459325790405273, "global_step": 397312, "epoch": 4786} {"train_loss": -26.3635196685791, "global_step": 397313, "epoch": 4786} {"train_loss": -26.239994049072266, "global_step": 397314, "epoch": 4786} {"train_loss": -26.60650062561035, "global_step": 397315, "epoch": 4786} {"train_loss": -26.59834098815918, "global_step": 397316, "epoch": 4786} {"train_loss": -26.80006217956543, "global_step": 397317, "epoch": 4786} {"train_loss": -26.831436157226562, "global_step": 397318, "epoch": 4786} {"train_loss": -26.50394058227539, "global_step": 397319, "epoch": 4786} {"train_loss": -26.48332028216626, "global_step": 397320, "epoch": 4786, "val_loss": 6664804.0} {"train_loss": -25.86305809020996, "global_step": 397321, "epoch": 4787} {"train_loss": -25.674264907836914, "global_step": 397322, "epoch": 4787} {"train_loss": -26.0269832611084, "global_step": 397323, "epoch": 4787} {"train_loss": -26.235410690307617, "global_step": 397324, "epoch": 4787} {"train_loss": -25.55817222595215, "global_step": 397325, "epoch": 4787} {"train_loss": -26.635583877563477, "global_step": 397326, "epoch": 4787} {"train_loss": -25.98026466369629, "global_step": 397327, "epoch": 4787} {"train_loss": -25.791440963745117, "global_step": 397328, "epoch": 4787} {"train_loss": -25.870824813842773, "global_step": 397329, "epoch": 4787} {"train_loss": -26.052221298217773, "global_step": 397330, "epoch": 4787} {"train_loss": -26.347082138061523, "global_step": 397331, "epoch": 4787} {"train_loss": -26.2432861328125, "global_step": 397332, "epoch": 4787} {"train_loss": -26.044824600219727, "global_step": 397333, "epoch": 4787} {"train_loss": -26.06454849243164, "global_step": 397334, "epoch": 4787} {"train_loss": -26.87310791015625, "global_step": 397335, "epoch": 4787} {"train_loss": -26.348669052124023, "global_step": 397336, "epoch": 4787} {"train_loss": -26.084476470947266, "global_step": 397337, "epoch": 4787} {"train_loss": -26.226545333862305, "global_step": 397338, "epoch": 4787} {"train_loss": -26.440820693969727, "global_step": 397339, "epoch": 4787} {"train_loss": -26.133960723876953, "global_step": 397340, "epoch": 4787} {"train_loss": -26.37428092956543, "global_step": 397341, "epoch": 4787} {"train_loss": -26.6867618560791, "global_step": 397342, "epoch": 4787} {"train_loss": -26.29532241821289, "global_step": 397343, "epoch": 4787} {"train_loss": -26.568037033081055, "global_step": 397344, "epoch": 4787} {"train_loss": -26.48357582092285, "global_step": 397345, "epoch": 4787} {"train_loss": -26.41619300842285, "global_step": 397346, "epoch": 4787} {"train_loss": -26.84259033203125, "global_step": 397347, "epoch": 4787} {"train_loss": -26.060644149780273, "global_step": 397348, "epoch": 4787} {"train_loss": -26.235544204711914, "global_step": 397349, "epoch": 4787} {"train_loss": -26.56605339050293, "global_step": 397350, "epoch": 4787} {"train_loss": -26.263166427612305, "global_step": 397351, "epoch": 4787} {"train_loss": -26.888479232788086, "global_step": 397352, "epoch": 4787} {"train_loss": -26.8741512298584, "global_step": 397353, "epoch": 4787} {"train_loss": -26.465158462524414, "global_step": 397354, "epoch": 4787} {"train_loss": -26.654300689697266, "global_step": 397355, "epoch": 4787} {"train_loss": -26.6407527923584, "global_step": 397356, "epoch": 4787} {"train_loss": -26.373584747314453, "global_step": 397357, "epoch": 4787} {"train_loss": -26.8594970703125, "global_step": 397358, "epoch": 4787} {"train_loss": -26.610715866088867, "global_step": 397359, "epoch": 4787} {"train_loss": -26.82327651977539, "global_step": 397360, "epoch": 4787} {"train_loss": -26.330215454101562, "global_step": 397361, "epoch": 4787} {"train_loss": -26.856159210205078, "global_step": 397362, "epoch": 4787} {"train_loss": -26.934057235717773, "global_step": 397363, "epoch": 4787} {"train_loss": -26.653507232666016, "global_step": 397364, "epoch": 4787} {"train_loss": -26.945249557495117, "global_step": 397365, "epoch": 4787} {"train_loss": -26.834217071533203, "global_step": 397366, "epoch": 4787} {"train_loss": -26.779138565063477, "global_step": 397367, "epoch": 4787} {"train_loss": -27.129194259643555, "global_step": 397368, "epoch": 4787} {"train_loss": -26.845849990844727, "global_step": 397369, "epoch": 4787} {"train_loss": -26.413013458251953, "global_step": 397370, "epoch": 4787} {"train_loss": -27.018238067626953, "global_step": 397371, "epoch": 4787} {"train_loss": -26.74971580505371, "global_step": 397372, "epoch": 4787} {"train_loss": -26.81226921081543, "global_step": 397373, "epoch": 4787} {"train_loss": -26.744653701782227, "global_step": 397374, "epoch": 4787} {"train_loss": -26.832067489624023, "global_step": 397375, "epoch": 4787} {"train_loss": -26.700037002563477, "global_step": 397376, "epoch": 4787} {"train_loss": -26.68622398376465, "global_step": 397377, "epoch": 4787} {"train_loss": -26.05084228515625, "global_step": 397378, "epoch": 4787} {"train_loss": -26.330102920532227, "global_step": 397379, "epoch": 4787} {"train_loss": -26.39228630065918, "global_step": 397380, "epoch": 4787} {"train_loss": -26.54775047302246, "global_step": 397381, "epoch": 4787} {"train_loss": -27.032209396362305, "global_step": 397382, "epoch": 4787} {"train_loss": -26.526966094970703, "global_step": 397383, "epoch": 4787} {"train_loss": -26.32691764831543, "global_step": 397384, "epoch": 4787} {"train_loss": -26.46477699279785, "global_step": 397385, "epoch": 4787} {"train_loss": -26.44215202331543, "global_step": 397386, "epoch": 4787} {"train_loss": -26.80193519592285, "global_step": 397387, "epoch": 4787} {"train_loss": -26.43696403503418, "global_step": 397388, "epoch": 4787} {"train_loss": -26.172040939331055, "global_step": 397389, "epoch": 4787} {"train_loss": -26.351428985595703, "global_step": 397390, "epoch": 4787} {"train_loss": -26.8956298828125, "global_step": 397391, "epoch": 4787} {"train_loss": -26.374792098999023, "global_step": 397392, "epoch": 4787} {"train_loss": -26.470203399658203, "global_step": 397393, "epoch": 4787} {"train_loss": -26.570484161376953, "global_step": 397394, "epoch": 4787} {"train_loss": -26.808734893798828, "global_step": 397395, "epoch": 4787} {"train_loss": -26.569538116455078, "global_step": 397396, "epoch": 4787} {"train_loss": -26.438196182250977, "global_step": 397397, "epoch": 4787} {"train_loss": -26.004352569580078, "global_step": 397398, "epoch": 4787} {"train_loss": -26.814746856689453, "global_step": 397399, "epoch": 4787} {"train_loss": -26.674463272094727, "global_step": 397400, "epoch": 4787} {"train_loss": -26.08478355407715, "global_step": 397401, "epoch": 4787} {"train_loss": -26.692646026611328, "global_step": 397402, "epoch": 4787} {"train_loss": -26.462264141404486, "global_step": 397403, "epoch": 4787, "val_loss": 6697027.5} {"train_loss": -25.30904197692871, "global_step": 397404, "epoch": 4788} {"train_loss": -24.49134635925293, "global_step": 397405, "epoch": 4788} {"train_loss": -25.845624923706055, "global_step": 397406, "epoch": 4788} {"train_loss": -25.46238136291504, "global_step": 397407, "epoch": 4788} {"train_loss": -24.6795654296875, "global_step": 397408, "epoch": 4788} {"train_loss": -25.31153678894043, "global_step": 397409, "epoch": 4788} {"train_loss": -25.676681518554688, "global_step": 397410, "epoch": 4788} {"train_loss": -25.651580810546875, "global_step": 397411, "epoch": 4788} {"train_loss": -25.5187931060791, "global_step": 397412, "epoch": 4788} {"train_loss": -25.347909927368164, "global_step": 397413, "epoch": 4788} {"train_loss": -25.737958908081055, "global_step": 397414, "epoch": 4788} {"train_loss": -25.642484664916992, "global_step": 397415, "epoch": 4788} {"train_loss": -25.509132385253906, "global_step": 397416, "epoch": 4788} {"train_loss": -25.964338302612305, "global_step": 397417, "epoch": 4788} {"train_loss": -25.889179229736328, "global_step": 397418, "epoch": 4788} {"train_loss": -26.071552276611328, "global_step": 397419, "epoch": 4788} {"train_loss": -25.73382568359375, "global_step": 397420, "epoch": 4788} {"train_loss": -26.205026626586914, "global_step": 397421, "epoch": 4788} {"train_loss": -26.165008544921875, "global_step": 397422, "epoch": 4788} {"train_loss": -25.780393600463867, "global_step": 397423, "epoch": 4788} {"train_loss": -26.301069259643555, "global_step": 397424, "epoch": 4788} {"train_loss": -25.97368812561035, "global_step": 397425, "epoch": 4788} {"train_loss": -26.180572509765625, "global_step": 397426, "epoch": 4788} {"train_loss": -26.161834716796875, "global_step": 397427, "epoch": 4788} {"train_loss": -26.025129318237305, "global_step": 397428, "epoch": 4788} {"train_loss": -26.369184494018555, "global_step": 397429, "epoch": 4788} {"train_loss": -26.12555503845215, "global_step": 397430, "epoch": 4788} {"train_loss": -26.347375869750977, "global_step": 397431, "epoch": 4788} {"train_loss": -25.82861328125, "global_step": 397432, "epoch": 4788} {"train_loss": -26.441030502319336, "global_step": 397433, "epoch": 4788} {"train_loss": -26.548877716064453, "global_step": 397434, "epoch": 4788} {"train_loss": -26.0982723236084, "global_step": 397435, "epoch": 4788} {"train_loss": -26.387731552124023, "global_step": 397436, "epoch": 4788} {"train_loss": -26.571369171142578, "global_step": 397437, "epoch": 4788} {"train_loss": -26.50245475769043, "global_step": 397438, "epoch": 4788} {"train_loss": -26.572607040405273, "global_step": 397439, "epoch": 4788} {"train_loss": -26.2974796295166, "global_step": 397440, "epoch": 4788} {"train_loss": -26.470426559448242, "global_step": 397441, "epoch": 4788} {"train_loss": -26.32492446899414, "global_step": 397442, "epoch": 4788} {"train_loss": -26.906848907470703, "global_step": 397443, "epoch": 4788} {"train_loss": -26.567174911499023, "global_step": 397444, "epoch": 4788} {"train_loss": -26.52252197265625, "global_step": 397445, "epoch": 4788} {"train_loss": -26.54657554626465, "global_step": 397446, "epoch": 4788} {"train_loss": -26.457448959350586, "global_step": 397447, "epoch": 4788} {"train_loss": -26.817188262939453, "global_step": 397448, "epoch": 4788} {"train_loss": -26.508405685424805, "global_step": 397449, "epoch": 4788} {"train_loss": -26.66916275024414, "global_step": 397450, "epoch": 4788} {"train_loss": -26.73792839050293, "global_step": 397451, "epoch": 4788} {"train_loss": -26.59943199157715, "global_step": 397452, "epoch": 4788} {"train_loss": -26.4879150390625, "global_step": 397453, "epoch": 4788} {"train_loss": -26.27292251586914, "global_step": 397454, "epoch": 4788} {"train_loss": -26.16982078552246, "global_step": 397455, "epoch": 4788} {"train_loss": -26.711868286132812, "global_step": 397456, "epoch": 4788} {"train_loss": -26.72047233581543, "global_step": 397457, "epoch": 4788} {"train_loss": -26.617902755737305, "global_step": 397458, "epoch": 4788} {"train_loss": -26.402883529663086, "global_step": 397459, "epoch": 4788} {"train_loss": -26.58735466003418, "global_step": 397460, "epoch": 4788} {"train_loss": -26.73567771911621, "global_step": 397461, "epoch": 4788} {"train_loss": -26.74420166015625, "global_step": 397462, "epoch": 4788} {"train_loss": -26.708112716674805, "global_step": 397463, "epoch": 4788} {"train_loss": -26.667926788330078, "global_step": 397464, "epoch": 4788} {"train_loss": -26.669652938842773, "global_step": 397465, "epoch": 4788} {"train_loss": -25.810001373291016, "global_step": 397466, "epoch": 4788} {"train_loss": -26.637481689453125, "global_step": 397467, "epoch": 4788} {"train_loss": -26.29509925842285, "global_step": 397468, "epoch": 4788} {"train_loss": -26.4104061126709, "global_step": 397469, "epoch": 4788} {"train_loss": -26.571125030517578, "global_step": 397470, "epoch": 4788} {"train_loss": -26.752099990844727, "global_step": 397471, "epoch": 4788} {"train_loss": -26.604568481445312, "global_step": 397472, "epoch": 4788} {"train_loss": -26.554468154907227, "global_step": 397473, "epoch": 4788} {"train_loss": -26.75575065612793, "global_step": 397474, "epoch": 4788} {"train_loss": -26.693286895751953, "global_step": 397475, "epoch": 4788} {"train_loss": -26.250720977783203, "global_step": 397476, "epoch": 4788} {"train_loss": -26.197561264038086, "global_step": 397477, "epoch": 4788} {"train_loss": -26.62869644165039, "global_step": 397478, "epoch": 4788} {"train_loss": -26.341949462890625, "global_step": 397479, "epoch": 4788} {"train_loss": -26.52596092224121, "global_step": 397480, "epoch": 4788} {"train_loss": -26.08685874938965, "global_step": 397481, "epoch": 4788} {"train_loss": -25.6494083404541, "global_step": 397482, "epoch": 4788} {"train_loss": -26.59918212890625, "global_step": 397483, "epoch": 4788} {"train_loss": -25.931425094604492, "global_step": 397484, "epoch": 4788} {"train_loss": -26.195226669311523, "global_step": 397485, "epoch": 4788} {"train_loss": -26.22766747532121, "global_step": 397486, "epoch": 4788, "val_loss": 6693485.0} {"train_loss": -25.720487594604492, "global_step": 397487, "epoch": 4789} {"train_loss": -26.146100997924805, "global_step": 397488, "epoch": 4789} {"train_loss": -26.299606323242188, "global_step": 397489, "epoch": 4789} {"train_loss": -25.674835205078125, "global_step": 397490, "epoch": 4789} {"train_loss": -25.975866317749023, "global_step": 397491, "epoch": 4789} {"train_loss": -25.788009643554688, "global_step": 397492, "epoch": 4789} {"train_loss": -26.07382583618164, "global_step": 397493, "epoch": 4789} {"train_loss": -25.423757553100586, "global_step": 397494, "epoch": 4789} {"train_loss": -26.26759147644043, "global_step": 397495, "epoch": 4789} {"train_loss": -26.0340518951416, "global_step": 397496, "epoch": 4789} {"train_loss": -26.054763793945312, "global_step": 397497, "epoch": 4789} {"train_loss": -26.323270797729492, "global_step": 397498, "epoch": 4789} {"train_loss": -26.175537109375, "global_step": 397499, "epoch": 4789} {"train_loss": -26.411161422729492, "global_step": 397500, "epoch": 4789} {"train_loss": -26.422027587890625, "global_step": 397501, "epoch": 4789} {"train_loss": -26.177846908569336, "global_step": 397502, "epoch": 4789} {"train_loss": -26.25580406188965, "global_step": 397503, "epoch": 4789} {"train_loss": -26.4237117767334, "global_step": 397504, "epoch": 4789} {"train_loss": -26.611454010009766, "global_step": 397505, "epoch": 4789} {"train_loss": -26.407550811767578, "global_step": 397506, "epoch": 4789} {"train_loss": -26.034900665283203, "global_step": 397507, "epoch": 4789} {"train_loss": -26.445484161376953, "global_step": 397508, "epoch": 4789} {"train_loss": -26.8256778717041, "global_step": 397509, "epoch": 4789} {"train_loss": -26.072952270507812, "global_step": 397510, "epoch": 4789} {"train_loss": -26.567829132080078, "global_step": 397511, "epoch": 4789} {"train_loss": -26.588342666625977, "global_step": 397512, "epoch": 4789} {"train_loss": -26.35294532775879, "global_step": 397513, "epoch": 4789} {"train_loss": -26.155792236328125, "global_step": 397514, "epoch": 4789} {"train_loss": -26.393590927124023, "global_step": 397515, "epoch": 4789} {"train_loss": -26.42988395690918, "global_step": 397516, "epoch": 4789} {"train_loss": -26.43450927734375, "global_step": 397517, "epoch": 4789} {"train_loss": -26.18951416015625, "global_step": 397518, "epoch": 4789} {"train_loss": -26.688434600830078, "global_step": 397519, "epoch": 4789} {"train_loss": -26.500280380249023, "global_step": 397520, "epoch": 4789} {"train_loss": -26.621402740478516, "global_step": 397521, "epoch": 4789} {"train_loss": -26.769241333007812, "global_step": 397522, "epoch": 4789} {"train_loss": -26.349958419799805, "global_step": 397523, "epoch": 4789} {"train_loss": -26.906660079956055, "global_step": 397524, "epoch": 4789} {"train_loss": -26.252042770385742, "global_step": 397525, "epoch": 4789} {"train_loss": -26.592191696166992, "global_step": 397526, "epoch": 4789} {"train_loss": -26.898679733276367, "global_step": 397527, "epoch": 4789} {"train_loss": -26.26239013671875, "global_step": 397528, "epoch": 4789} {"train_loss": -27.045337677001953, "global_step": 397529, "epoch": 4789} {"train_loss": -26.623977661132812, "global_step": 397530, "epoch": 4789} {"train_loss": -26.85163688659668, "global_step": 397531, "epoch": 4789} {"train_loss": -26.678863525390625, "global_step": 397532, "epoch": 4789} {"train_loss": -26.556766510009766, "global_step": 397533, "epoch": 4789} {"train_loss": -27.00148582458496, "global_step": 397534, "epoch": 4789} {"train_loss": -26.39967918395996, "global_step": 397535, "epoch": 4789} {"train_loss": -26.222387313842773, "global_step": 397536, "epoch": 4789} {"train_loss": -26.404693603515625, "global_step": 397537, "epoch": 4789} {"train_loss": -26.46393394470215, "global_step": 397538, "epoch": 4789} {"train_loss": -26.34012794494629, "global_step": 397539, "epoch": 4789} {"train_loss": -26.504474639892578, "global_step": 397540, "epoch": 4789} {"train_loss": -26.721954345703125, "global_step": 397541, "epoch": 4789} {"train_loss": -26.30645179748535, "global_step": 397542, "epoch": 4789} {"train_loss": -26.60807228088379, "global_step": 397543, "epoch": 4789} {"train_loss": -26.846540451049805, "global_step": 397544, "epoch": 4789} {"train_loss": -26.410675048828125, "global_step": 397545, "epoch": 4789} {"train_loss": -26.4486083984375, "global_step": 397546, "epoch": 4789} {"train_loss": -26.882450103759766, "global_step": 397547, "epoch": 4789} {"train_loss": -26.753131866455078, "global_step": 397548, "epoch": 4789} {"train_loss": -26.77583122253418, "global_step": 397549, "epoch": 4789} {"train_loss": -26.785131454467773, "global_step": 397550, "epoch": 4789} {"train_loss": -26.402313232421875, "global_step": 397551, "epoch": 4789} {"train_loss": -26.41580581665039, "global_step": 397552, "epoch": 4789} {"train_loss": -26.555768966674805, "global_step": 397553, "epoch": 4789} {"train_loss": -26.86223793029785, "global_step": 397554, "epoch": 4789} {"train_loss": -26.58649253845215, "global_step": 397555, "epoch": 4789} {"train_loss": -26.750097274780273, "global_step": 397556, "epoch": 4789} {"train_loss": -26.6463680267334, "global_step": 397557, "epoch": 4789} {"train_loss": -26.57663917541504, "global_step": 397558, "epoch": 4789} {"train_loss": -26.423629760742188, "global_step": 397559, "epoch": 4789} {"train_loss": -26.477766036987305, "global_step": 397560, "epoch": 4789} {"train_loss": -26.420148849487305, "global_step": 397561, "epoch": 4789} {"train_loss": -26.473386764526367, "global_step": 397562, "epoch": 4789} {"train_loss": -26.525192260742188, "global_step": 397563, "epoch": 4789} {"train_loss": -26.456787109375, "global_step": 397564, "epoch": 4789} {"train_loss": -26.312763214111328, "global_step": 397565, "epoch": 4789} {"train_loss": -26.924285888671875, "global_step": 397566, "epoch": 4789} {"train_loss": -26.7232666015625, "global_step": 397567, "epoch": 4789} {"train_loss": -26.4537410736084, "global_step": 397568, "epoch": 4789} {"train_loss": -26.443786598113647, "global_step": 397569, "epoch": 4789, "val_loss": 6715271.5} {"train_loss": -25.739789962768555, "global_step": 397570, "epoch": 4790} {"train_loss": -25.8376522064209, "global_step": 397571, "epoch": 4790} {"train_loss": -24.566818237304688, "global_step": 397572, "epoch": 4790} {"train_loss": -25.078290939331055, "global_step": 397573, "epoch": 4790} {"train_loss": -25.098501205444336, "global_step": 397574, "epoch": 4790} {"train_loss": -25.978124618530273, "global_step": 397575, "epoch": 4790} {"train_loss": -25.47101402282715, "global_step": 397576, "epoch": 4790} {"train_loss": -25.587831497192383, "global_step": 397577, "epoch": 4790} {"train_loss": -25.789209365844727, "global_step": 397578, "epoch": 4790} {"train_loss": -26.007497787475586, "global_step": 397579, "epoch": 4790} {"train_loss": -25.55274772644043, "global_step": 397580, "epoch": 4790} {"train_loss": -26.178598403930664, "global_step": 397581, "epoch": 4790} {"train_loss": -25.787235260009766, "global_step": 397582, "epoch": 4790} {"train_loss": -26.2376708984375, "global_step": 397583, "epoch": 4790} {"train_loss": -26.063678741455078, "global_step": 397584, "epoch": 4790} {"train_loss": -25.954755783081055, "global_step": 397585, "epoch": 4790} {"train_loss": -26.192703247070312, "global_step": 397586, "epoch": 4790} {"train_loss": -25.7169246673584, "global_step": 397587, "epoch": 4790} {"train_loss": -26.077199935913086, "global_step": 397588, "epoch": 4790} {"train_loss": -25.898269653320312, "global_step": 397589, "epoch": 4790} {"train_loss": -26.09661865234375, "global_step": 397590, "epoch": 4790} {"train_loss": -26.48248291015625, "global_step": 397591, "epoch": 4790} {"train_loss": -26.349775314331055, "global_step": 397592, "epoch": 4790} {"train_loss": -26.090290069580078, "global_step": 397593, "epoch": 4790} {"train_loss": -26.586286544799805, "global_step": 397594, "epoch": 4790} {"train_loss": -26.201923370361328, "global_step": 397595, "epoch": 4790} {"train_loss": -26.2501220703125, "global_step": 397596, "epoch": 4790} {"train_loss": -26.85983657836914, "global_step": 397597, "epoch": 4790} {"train_loss": -26.72932243347168, "global_step": 397598, "epoch": 4790} {"train_loss": -26.806180953979492, "global_step": 397599, "epoch": 4790} {"train_loss": -26.334442138671875, "global_step": 397600, "epoch": 4790} {"train_loss": -26.250829696655273, "global_step": 397601, "epoch": 4790} {"train_loss": -26.83045768737793, "global_step": 397602, "epoch": 4790} {"train_loss": -26.710737228393555, "global_step": 397603, "epoch": 4790} {"train_loss": -26.49408531188965, "global_step": 397604, "epoch": 4790} {"train_loss": -26.844587326049805, "global_step": 397605, "epoch": 4790} {"train_loss": -26.6709041595459, "global_step": 397606, "epoch": 4790} {"train_loss": -26.6458797454834, "global_step": 397607, "epoch": 4790} {"train_loss": -26.52141761779785, "global_step": 397608, "epoch": 4790} {"train_loss": -26.455163955688477, "global_step": 397609, "epoch": 4790} {"train_loss": -26.68208122253418, "global_step": 397610, "epoch": 4790} {"train_loss": -26.71526527404785, "global_step": 397611, "epoch": 4790} {"train_loss": -26.617938995361328, "global_step": 397612, "epoch": 4790} {"train_loss": -26.439435958862305, "global_step": 397613, "epoch": 4790} {"train_loss": -26.526626586914062, "global_step": 397614, "epoch": 4790} {"train_loss": -26.725830078125, "global_step": 397615, "epoch": 4790} {"train_loss": -26.389673233032227, "global_step": 397616, "epoch": 4790} {"train_loss": -26.497854232788086, "global_step": 397617, "epoch": 4790} {"train_loss": -26.53989601135254, "global_step": 397618, "epoch": 4790} {"train_loss": -26.18304443359375, "global_step": 397619, "epoch": 4790} {"train_loss": -26.64371681213379, "global_step": 397620, "epoch": 4790} {"train_loss": -26.78680419921875, "global_step": 397621, "epoch": 4790} {"train_loss": -26.358261108398438, "global_step": 397622, "epoch": 4790} {"train_loss": -26.560571670532227, "global_step": 397623, "epoch": 4790} {"train_loss": -26.66351890563965, "global_step": 397624, "epoch": 4790} {"train_loss": -26.605682373046875, "global_step": 397625, "epoch": 4790} {"train_loss": -26.722705841064453, "global_step": 397626, "epoch": 4790} {"train_loss": -26.70002555847168, "global_step": 397627, "epoch": 4790} {"train_loss": -26.63477897644043, "global_step": 397628, "epoch": 4790} {"train_loss": -26.377323150634766, "global_step": 397629, "epoch": 4790} {"train_loss": -26.540241241455078, "global_step": 397630, "epoch": 4790} {"train_loss": -26.153440475463867, "global_step": 397631, "epoch": 4790} {"train_loss": -26.526906967163086, "global_step": 397632, "epoch": 4790} {"train_loss": -26.701019287109375, "global_step": 397633, "epoch": 4790} {"train_loss": -26.642837524414062, "global_step": 397634, "epoch": 4790} {"train_loss": -26.616376876831055, "global_step": 397635, "epoch": 4790} {"train_loss": -26.540027618408203, "global_step": 397636, "epoch": 4790} {"train_loss": -26.343097686767578, "global_step": 397637, "epoch": 4790} {"train_loss": -25.744230270385742, "global_step": 397638, "epoch": 4790} {"train_loss": -26.25984001159668, "global_step": 397639, "epoch": 4790} {"train_loss": -26.7976016998291, "global_step": 397640, "epoch": 4790} {"train_loss": -26.48024559020996, "global_step": 397641, "epoch": 4790} {"train_loss": -26.24268913269043, "global_step": 397642, "epoch": 4790} {"train_loss": -25.74262046813965, "global_step": 397643, "epoch": 4790} {"train_loss": -26.37940788269043, "global_step": 397644, "epoch": 4790} {"train_loss": -26.523151397705078, "global_step": 397645, "epoch": 4790} {"train_loss": -26.60103416442871, "global_step": 397646, "epoch": 4790} {"train_loss": -25.7230281829834, "global_step": 397647, "epoch": 4790} {"train_loss": -26.422399520874023, "global_step": 397648, "epoch": 4790} {"train_loss": -26.743478775024414, "global_step": 397649, "epoch": 4790} {"train_loss": -26.516006469726562, "global_step": 397650, "epoch": 4790} {"train_loss": -26.629322052001953, "global_step": 397651, "epoch": 4790} {"train_loss": -26.301113634224397, "global_step": 397652, "epoch": 4790, "val_loss": 6600223.0} {"train_loss": -25.224990844726562, "global_step": 397653, "epoch": 4791} {"train_loss": -25.886938095092773, "global_step": 397654, "epoch": 4791} {"train_loss": -26.43308448791504, "global_step": 397655, "epoch": 4791} {"train_loss": -25.493457794189453, "global_step": 397656, "epoch": 4791} {"train_loss": -24.94719886779785, "global_step": 397657, "epoch": 4791} {"train_loss": -26.293018341064453, "global_step": 397658, "epoch": 4791} {"train_loss": -25.805097579956055, "global_step": 397659, "epoch": 4791} {"train_loss": -26.18654441833496, "global_step": 397660, "epoch": 4791} {"train_loss": -26.283462524414062, "global_step": 397661, "epoch": 4791} {"train_loss": -25.9272518157959, "global_step": 397662, "epoch": 4791} {"train_loss": -26.3696346282959, "global_step": 397663, "epoch": 4791} {"train_loss": -26.500125885009766, "global_step": 397664, "epoch": 4791} {"train_loss": -26.615320205688477, "global_step": 397665, "epoch": 4791} {"train_loss": -26.03004264831543, "global_step": 397666, "epoch": 4791} {"train_loss": -26.33123779296875, "global_step": 397667, "epoch": 4791} {"train_loss": -26.124664306640625, "global_step": 397668, "epoch": 4791} {"train_loss": -26.414249420166016, "global_step": 397669, "epoch": 4791} {"train_loss": -26.382902145385742, "global_step": 397670, "epoch": 4791} {"train_loss": -26.323843002319336, "global_step": 397671, "epoch": 4791} {"train_loss": -26.34405517578125, "global_step": 397672, "epoch": 4791} {"train_loss": -26.353933334350586, "global_step": 397673, "epoch": 4791} {"train_loss": -26.52741050720215, "global_step": 397674, "epoch": 4791} {"train_loss": -26.802627563476562, "global_step": 397675, "epoch": 4791} {"train_loss": -26.17695426940918, "global_step": 397676, "epoch": 4791} {"train_loss": -26.563934326171875, "global_step": 397677, "epoch": 4791} {"train_loss": -26.675092697143555, "global_step": 397678, "epoch": 4791} {"train_loss": -26.482318878173828, "global_step": 397679, "epoch": 4791} {"train_loss": -26.57866859436035, "global_step": 397680, "epoch": 4791} {"train_loss": -26.860092163085938, "global_step": 397681, "epoch": 4791} {"train_loss": -26.593442916870117, "global_step": 397682, "epoch": 4791} {"train_loss": -26.630868911743164, "global_step": 397683, "epoch": 4791} {"train_loss": -26.674543380737305, "global_step": 397684, "epoch": 4791} {"train_loss": -26.513166427612305, "global_step": 397685, "epoch": 4791} {"train_loss": -26.633209228515625, "global_step": 397686, "epoch": 4791} {"train_loss": -26.52229118347168, "global_step": 397687, "epoch": 4791} {"train_loss": -26.305072784423828, "global_step": 397688, "epoch": 4791} {"train_loss": -26.6894474029541, "global_step": 397689, "epoch": 4791} {"train_loss": -26.32608413696289, "global_step": 397690, "epoch": 4791} {"train_loss": -26.551237106323242, "global_step": 397691, "epoch": 4791} {"train_loss": -26.574115753173828, "global_step": 397692, "epoch": 4791} {"train_loss": -26.426488876342773, "global_step": 397693, "epoch": 4791} {"train_loss": -26.544784545898438, "global_step": 397694, "epoch": 4791} {"train_loss": -26.956995010375977, "global_step": 397695, "epoch": 4791} {"train_loss": -26.384403228759766, "global_step": 397696, "epoch": 4791} {"train_loss": -26.78554344177246, "global_step": 397697, "epoch": 4791} {"train_loss": -26.573871612548828, "global_step": 397698, "epoch": 4791} {"train_loss": -26.553466796875, "global_step": 397699, "epoch": 4791} {"train_loss": -26.5200138092041, "global_step": 397700, "epoch": 4791} {"train_loss": -26.933490753173828, "global_step": 397701, "epoch": 4791} {"train_loss": -26.90870475769043, "global_step": 397702, "epoch": 4791} {"train_loss": -26.85480308532715, "global_step": 397703, "epoch": 4791} {"train_loss": -26.367624282836914, "global_step": 397704, "epoch": 4791} {"train_loss": -26.563861846923828, "global_step": 397705, "epoch": 4791} {"train_loss": -26.71575927734375, "global_step": 397706, "epoch": 4791} {"train_loss": -26.958826065063477, "global_step": 397707, "epoch": 4791} {"train_loss": -26.30728530883789, "global_step": 397708, "epoch": 4791} {"train_loss": -26.540241241455078, "global_step": 397709, "epoch": 4791} {"train_loss": -26.352752685546875, "global_step": 397710, "epoch": 4791} {"train_loss": -26.558332443237305, "global_step": 397711, "epoch": 4791} {"train_loss": -26.69610023498535, "global_step": 397712, "epoch": 4791} {"train_loss": -26.505781173706055, "global_step": 397713, "epoch": 4791} {"train_loss": -26.842756271362305, "global_step": 397714, "epoch": 4791} {"train_loss": -26.717365264892578, "global_step": 397715, "epoch": 4791} {"train_loss": -26.516407012939453, "global_step": 397716, "epoch": 4791} {"train_loss": -26.714893341064453, "global_step": 397717, "epoch": 4791} {"train_loss": -26.909292221069336, "global_step": 397718, "epoch": 4791} {"train_loss": -26.92925453186035, "global_step": 397719, "epoch": 4791} {"train_loss": -26.422887802124023, "global_step": 397720, "epoch": 4791} {"train_loss": -26.593505859375, "global_step": 397721, "epoch": 4791} {"train_loss": -26.518522262573242, "global_step": 397722, "epoch": 4791} {"train_loss": -26.6889705657959, "global_step": 397723, "epoch": 4791} {"train_loss": -27.107763290405273, "global_step": 397724, "epoch": 4791} {"train_loss": -26.80872917175293, "global_step": 397725, "epoch": 4791} {"train_loss": -26.896177291870117, "global_step": 397726, "epoch": 4791} {"train_loss": -26.51124382019043, "global_step": 397727, "epoch": 4791} {"train_loss": -26.578603744506836, "global_step": 397728, "epoch": 4791} {"train_loss": -26.776758193969727, "global_step": 397729, "epoch": 4791} {"train_loss": -27.055896759033203, "global_step": 397730, "epoch": 4791} {"train_loss": -26.7503604888916, "global_step": 397731, "epoch": 4791} {"train_loss": -26.742151260375977, "global_step": 397732, "epoch": 4791} {"train_loss": -26.880630493164062, "global_step": 397733, "epoch": 4791} {"train_loss": -26.896066665649414, "global_step": 397734, "epoch": 4791} {"train_loss": -26.514713126492786, "global_step": 397735, "epoch": 4791, "val_loss": 6697268.0} {"train_loss": -26.21026611328125, "global_step": 397736, "epoch": 4792} {"train_loss": -26.51771354675293, "global_step": 397737, "epoch": 4792} {"train_loss": -25.42829704284668, "global_step": 397738, "epoch": 4792} {"train_loss": -25.242794036865234, "global_step": 397739, "epoch": 4792} {"train_loss": -25.69219398498535, "global_step": 397740, "epoch": 4792} {"train_loss": -26.026403427124023, "global_step": 397741, "epoch": 4792} {"train_loss": -26.557575225830078, "global_step": 397742, "epoch": 4792} {"train_loss": -25.798627853393555, "global_step": 397743, "epoch": 4792} {"train_loss": -25.94077491760254, "global_step": 397744, "epoch": 4792} {"train_loss": -26.267608642578125, "global_step": 397745, "epoch": 4792} {"train_loss": -26.341623306274414, "global_step": 397746, "epoch": 4792} {"train_loss": -25.949262619018555, "global_step": 397747, "epoch": 4792} {"train_loss": -26.253583908081055, "global_step": 397748, "epoch": 4792} {"train_loss": -26.358545303344727, "global_step": 397749, "epoch": 4792} {"train_loss": -26.309370040893555, "global_step": 397750, "epoch": 4792} {"train_loss": -26.371353149414062, "global_step": 397751, "epoch": 4792} {"train_loss": -26.442468643188477, "global_step": 397752, "epoch": 4792} {"train_loss": -26.278966903686523, "global_step": 397753, "epoch": 4792} {"train_loss": -26.758283615112305, "global_step": 397754, "epoch": 4792} {"train_loss": -26.579151153564453, "global_step": 397755, "epoch": 4792} {"train_loss": -26.376203536987305, "global_step": 397756, "epoch": 4792} {"train_loss": -26.698108673095703, "global_step": 397757, "epoch": 4792} {"train_loss": -26.45633316040039, "global_step": 397758, "epoch": 4792} {"train_loss": -26.426990509033203, "global_step": 397759, "epoch": 4792} {"train_loss": -26.60420036315918, "global_step": 397760, "epoch": 4792} {"train_loss": -26.700592041015625, "global_step": 397761, "epoch": 4792} {"train_loss": -26.758132934570312, "global_step": 397762, "epoch": 4792} {"train_loss": -26.508132934570312, "global_step": 397763, "epoch": 4792} {"train_loss": -26.602075576782227, "global_step": 397764, "epoch": 4792} {"train_loss": -26.678552627563477, "global_step": 397765, "epoch": 4792} {"train_loss": -26.202390670776367, "global_step": 397766, "epoch": 4792} {"train_loss": -26.681995391845703, "global_step": 397767, "epoch": 4792} {"train_loss": -26.389575958251953, "global_step": 397768, "epoch": 4792} {"train_loss": -26.817840576171875, "global_step": 397769, "epoch": 4792} {"train_loss": -26.500585556030273, "global_step": 397770, "epoch": 4792} {"train_loss": -26.582111358642578, "global_step": 397771, "epoch": 4792} {"train_loss": -26.7862606048584, "global_step": 397772, "epoch": 4792} {"train_loss": -26.720502853393555, "global_step": 397773, "epoch": 4792} {"train_loss": -26.8550968170166, "global_step": 397774, "epoch": 4792} {"train_loss": -26.651519775390625, "global_step": 397775, "epoch": 4792} {"train_loss": -26.313764572143555, "global_step": 397776, "epoch": 4792} {"train_loss": -26.83734703063965, "global_step": 397777, "epoch": 4792} {"train_loss": -26.84525489807129, "global_step": 397778, "epoch": 4792} {"train_loss": -26.916275024414062, "global_step": 397779, "epoch": 4792} {"train_loss": -26.646228790283203, "global_step": 397780, "epoch": 4792} {"train_loss": -27.152563095092773, "global_step": 397781, "epoch": 4792} {"train_loss": -26.72804069519043, "global_step": 397782, "epoch": 4792} {"train_loss": -26.599945068359375, "global_step": 397783, "epoch": 4792} {"train_loss": -26.727819442749023, "global_step": 397784, "epoch": 4792} {"train_loss": -26.758209228515625, "global_step": 397785, "epoch": 4792} {"train_loss": -26.9068546295166, "global_step": 397786, "epoch": 4792} {"train_loss": -26.774396896362305, "global_step": 397787, "epoch": 4792} {"train_loss": -26.58642578125, "global_step": 397788, "epoch": 4792} {"train_loss": -26.907621383666992, "global_step": 397789, "epoch": 4792} {"train_loss": -26.69849967956543, "global_step": 397790, "epoch": 4792} {"train_loss": -27.168842315673828, "global_step": 397791, "epoch": 4792} {"train_loss": -26.749792098999023, "global_step": 397792, "epoch": 4792} {"train_loss": -26.843618392944336, "global_step": 397793, "epoch": 4792} {"train_loss": -26.982370376586914, "global_step": 397794, "epoch": 4792} {"train_loss": -26.723352432250977, "global_step": 397795, "epoch": 4792} {"train_loss": -26.667041778564453, "global_step": 397796, "epoch": 4792} {"train_loss": -26.930072784423828, "global_step": 397797, "epoch": 4792} {"train_loss": -27.05303382873535, "global_step": 397798, "epoch": 4792} {"train_loss": -26.843122482299805, "global_step": 397799, "epoch": 4792} {"train_loss": -26.668201446533203, "global_step": 397800, "epoch": 4792} {"train_loss": -26.57634925842285, "global_step": 397801, "epoch": 4792} {"train_loss": -26.5594425201416, "global_step": 397802, "epoch": 4792} {"train_loss": -26.739233016967773, "global_step": 397803, "epoch": 4792} {"train_loss": -26.556385040283203, "global_step": 397804, "epoch": 4792} {"train_loss": -26.50359535217285, "global_step": 397805, "epoch": 4792} {"train_loss": -26.415878295898438, "global_step": 397806, "epoch": 4792} {"train_loss": -26.94492530822754, "global_step": 397807, "epoch": 4792} {"train_loss": -26.333887100219727, "global_step": 397808, "epoch": 4792} {"train_loss": -26.4736270904541, "global_step": 397809, "epoch": 4792} {"train_loss": -26.510908126831055, "global_step": 397810, "epoch": 4792} {"train_loss": -26.236740112304688, "global_step": 397811, "epoch": 4792} {"train_loss": -25.437591552734375, "global_step": 397812, "epoch": 4792} {"train_loss": -25.19532585144043, "global_step": 397813, "epoch": 4792} {"train_loss": -25.565082550048828, "global_step": 397814, "epoch": 4792} {"train_loss": -25.800373077392578, "global_step": 397815, "epoch": 4792} {"train_loss": -26.69097900390625, "global_step": 397816, "epoch": 4792} {"train_loss": -26.4069881439209, "global_step": 397817, "epoch": 4792} {"train_loss": -26.476421402161378, "global_step": 397818, "epoch": 4792, "val_loss": 6729275.0} {"train_loss": -26.073633193969727, "global_step": 397819, "epoch": 4793} {"train_loss": -25.96552848815918, "global_step": 397820, "epoch": 4793} {"train_loss": -26.276840209960938, "global_step": 397821, "epoch": 4793} {"train_loss": -26.231006622314453, "global_step": 397822, "epoch": 4793} {"train_loss": -25.65872573852539, "global_step": 397823, "epoch": 4793} {"train_loss": -26.39899253845215, "global_step": 397824, "epoch": 4793} {"train_loss": -26.236791610717773, "global_step": 397825, "epoch": 4793} {"train_loss": -26.041290283203125, "global_step": 397826, "epoch": 4793} {"train_loss": -26.174179077148438, "global_step": 397827, "epoch": 4793} {"train_loss": -25.969369888305664, "global_step": 397828, "epoch": 4793} {"train_loss": -26.220504760742188, "global_step": 397829, "epoch": 4793} {"train_loss": -25.916919708251953, "global_step": 397830, "epoch": 4793} {"train_loss": -25.894163131713867, "global_step": 397831, "epoch": 4793} {"train_loss": -26.188220977783203, "global_step": 397832, "epoch": 4793} {"train_loss": -25.827783584594727, "global_step": 397833, "epoch": 4793} {"train_loss": -26.314664840698242, "global_step": 397834, "epoch": 4793} {"train_loss": -26.175128936767578, "global_step": 397835, "epoch": 4793} {"train_loss": -26.031726837158203, "global_step": 397836, "epoch": 4793} {"train_loss": -26.4219970703125, "global_step": 397837, "epoch": 4793} {"train_loss": -26.1943416595459, "global_step": 397838, "epoch": 4793} {"train_loss": -26.28314781188965, "global_step": 397839, "epoch": 4793} {"train_loss": -26.506946563720703, "global_step": 397840, "epoch": 4793} {"train_loss": -26.437082290649414, "global_step": 397841, "epoch": 4793} {"train_loss": -26.448888778686523, "global_step": 397842, "epoch": 4793} {"train_loss": -26.40962028503418, "global_step": 397843, "epoch": 4793} {"train_loss": -26.610361099243164, "global_step": 397844, "epoch": 4793} {"train_loss": -26.376264572143555, "global_step": 397845, "epoch": 4793} {"train_loss": -26.926055908203125, "global_step": 397846, "epoch": 4793} {"train_loss": -26.60528564453125, "global_step": 397847, "epoch": 4793} {"train_loss": -26.614709854125977, "global_step": 397848, "epoch": 4793} {"train_loss": -26.740060806274414, "global_step": 397849, "epoch": 4793} {"train_loss": -26.580005645751953, "global_step": 397850, "epoch": 4793} {"train_loss": -26.270898818969727, "global_step": 397851, "epoch": 4793} {"train_loss": -26.77924919128418, "global_step": 397852, "epoch": 4793} {"train_loss": -26.141403198242188, "global_step": 397853, "epoch": 4793} {"train_loss": -26.518762588500977, "global_step": 397854, "epoch": 4793} {"train_loss": -26.628875732421875, "global_step": 397855, "epoch": 4793} {"train_loss": -26.526966094970703, "global_step": 397856, "epoch": 4793} {"train_loss": -26.32986831665039, "global_step": 397857, "epoch": 4793} {"train_loss": -26.577600479125977, "global_step": 397858, "epoch": 4793} {"train_loss": -26.995458602905273, "global_step": 397859, "epoch": 4793} {"train_loss": -26.67214012145996, "global_step": 397860, "epoch": 4793} {"train_loss": -26.387659072875977, "global_step": 397861, "epoch": 4793} {"train_loss": -26.65517234802246, "global_step": 397862, "epoch": 4793} {"train_loss": -26.60514259338379, "global_step": 397863, "epoch": 4793} {"train_loss": -26.852148056030273, "global_step": 397864, "epoch": 4793} {"train_loss": -26.683298110961914, "global_step": 397865, "epoch": 4793} {"train_loss": -26.690786361694336, "global_step": 397866, "epoch": 4793} {"train_loss": -26.454181671142578, "global_step": 397867, "epoch": 4793} {"train_loss": -26.645856857299805, "global_step": 397868, "epoch": 4793} {"train_loss": -26.80171775817871, "global_step": 397869, "epoch": 4793} {"train_loss": -27.097009658813477, "global_step": 397870, "epoch": 4793} {"train_loss": -26.587539672851562, "global_step": 397871, "epoch": 4793} {"train_loss": -26.363269805908203, "global_step": 397872, "epoch": 4793} {"train_loss": -27.088150024414062, "global_step": 397873, "epoch": 4793} {"train_loss": -26.556066513061523, "global_step": 397874, "epoch": 4793} {"train_loss": -26.634754180908203, "global_step": 397875, "epoch": 4793} {"train_loss": -26.51783561706543, "global_step": 397876, "epoch": 4793} {"train_loss": -26.881866455078125, "global_step": 397877, "epoch": 4793} {"train_loss": -27.003890991210938, "global_step": 397878, "epoch": 4793} {"train_loss": -26.560455322265625, "global_step": 397879, "epoch": 4793} {"train_loss": -26.544416427612305, "global_step": 397880, "epoch": 4793} {"train_loss": -26.642383575439453, "global_step": 397881, "epoch": 4793} {"train_loss": -26.710180282592773, "global_step": 397882, "epoch": 4793} {"train_loss": -26.54871940612793, "global_step": 397883, "epoch": 4793} {"train_loss": -26.637039184570312, "global_step": 397884, "epoch": 4793} {"train_loss": -26.787866592407227, "global_step": 397885, "epoch": 4793} {"train_loss": -26.800474166870117, "global_step": 397886, "epoch": 4793} {"train_loss": -26.934839248657227, "global_step": 397887, "epoch": 4793} {"train_loss": -26.7513427734375, "global_step": 397888, "epoch": 4793} {"train_loss": -26.74677085876465, "global_step": 397889, "epoch": 4793} {"train_loss": -26.87188148498535, "global_step": 397890, "epoch": 4793} {"train_loss": -26.957504272460938, "global_step": 397891, "epoch": 4793} {"train_loss": -26.72686195373535, "global_step": 397892, "epoch": 4793} {"train_loss": -26.864459991455078, "global_step": 397893, "epoch": 4793} {"train_loss": -26.8418025970459, "global_step": 397894, "epoch": 4793} {"train_loss": -26.647329330444336, "global_step": 397895, "epoch": 4793} {"train_loss": -27.07374382019043, "global_step": 397896, "epoch": 4793} {"train_loss": -26.772418975830078, "global_step": 397897, "epoch": 4793} {"train_loss": -26.44400978088379, "global_step": 397898, "epoch": 4793} {"train_loss": -26.812646865844727, "global_step": 397899, "epoch": 4793} {"train_loss": -26.84844398498535, "global_step": 397900, "epoch": 4793} {"train_loss": -26.54715993030962, "global_step": 397901, "epoch": 4793, "val_loss": 6841108.0} {"train_loss": -26.17280387878418, "global_step": 397902, "epoch": 4794} {"train_loss": -25.69321632385254, "global_step": 397903, "epoch": 4794} {"train_loss": -25.387815475463867, "global_step": 397904, "epoch": 4794} {"train_loss": -25.832189559936523, "global_step": 397905, "epoch": 4794} {"train_loss": -25.752277374267578, "global_step": 397906, "epoch": 4794} {"train_loss": -25.868249893188477, "global_step": 397907, "epoch": 4794} {"train_loss": -25.560348510742188, "global_step": 397908, "epoch": 4794} {"train_loss": -25.903005599975586, "global_step": 397909, "epoch": 4794} {"train_loss": -26.22071647644043, "global_step": 397910, "epoch": 4794} {"train_loss": -25.914953231811523, "global_step": 397911, "epoch": 4794} {"train_loss": -26.27309226989746, "global_step": 397912, "epoch": 4794} {"train_loss": -25.95172691345215, "global_step": 397913, "epoch": 4794} {"train_loss": -26.5764217376709, "global_step": 397914, "epoch": 4794} {"train_loss": -26.280136108398438, "global_step": 397915, "epoch": 4794} {"train_loss": -26.216556549072266, "global_step": 397916, "epoch": 4794} {"train_loss": -25.912036895751953, "global_step": 397917, "epoch": 4794} {"train_loss": -26.430158615112305, "global_step": 397918, "epoch": 4794} {"train_loss": -26.070714950561523, "global_step": 397919, "epoch": 4794} {"train_loss": -26.444049835205078, "global_step": 397920, "epoch": 4794} {"train_loss": -26.188032150268555, "global_step": 397921, "epoch": 4794} {"train_loss": -26.174386978149414, "global_step": 397922, "epoch": 4794} {"train_loss": -26.659423828125, "global_step": 397923, "epoch": 4794} {"train_loss": -26.180500030517578, "global_step": 397924, "epoch": 4794} {"train_loss": -26.429162979125977, "global_step": 397925, "epoch": 4794} {"train_loss": -26.802213668823242, "global_step": 397926, "epoch": 4794} {"train_loss": -26.382709503173828, "global_step": 397927, "epoch": 4794} {"train_loss": -26.610595703125, "global_step": 397928, "epoch": 4794} {"train_loss": -26.66019058227539, "global_step": 397929, "epoch": 4794} {"train_loss": -26.889841079711914, "global_step": 397930, "epoch": 4794} {"train_loss": -26.719152450561523, "global_step": 397931, "epoch": 4794} {"train_loss": -26.640127182006836, "global_step": 397932, "epoch": 4794} {"train_loss": -26.55691909790039, "global_step": 397933, "epoch": 4794} {"train_loss": -26.77068519592285, "global_step": 397934, "epoch": 4794} {"train_loss": -26.937152862548828, "global_step": 397935, "epoch": 4794} {"train_loss": -26.651052474975586, "global_step": 397936, "epoch": 4794} {"train_loss": -26.71827507019043, "global_step": 397937, "epoch": 4794} {"train_loss": -26.898298263549805, "global_step": 397938, "epoch": 4794} {"train_loss": -26.469074249267578, "global_step": 397939, "epoch": 4794} {"train_loss": -26.60260009765625, "global_step": 397940, "epoch": 4794} {"train_loss": -26.786252975463867, "global_step": 397941, "epoch": 4794} {"train_loss": -26.600439071655273, "global_step": 397942, "epoch": 4794} {"train_loss": -26.765228271484375, "global_step": 397943, "epoch": 4794} {"train_loss": -26.412626266479492, "global_step": 397944, "epoch": 4794} {"train_loss": -26.775299072265625, "global_step": 397945, "epoch": 4794} {"train_loss": -26.564443588256836, "global_step": 397946, "epoch": 4794} {"train_loss": -26.869611740112305, "global_step": 397947, "epoch": 4794} {"train_loss": -26.64389419555664, "global_step": 397948, "epoch": 4794} {"train_loss": -26.766193389892578, "global_step": 397949, "epoch": 4794} {"train_loss": -26.75147819519043, "global_step": 397950, "epoch": 4794} {"train_loss": -26.838037490844727, "global_step": 397951, "epoch": 4794} {"train_loss": -26.889616012573242, "global_step": 397952, "epoch": 4794} {"train_loss": -26.83489418029785, "global_step": 397953, "epoch": 4794} {"train_loss": -26.636310577392578, "global_step": 397954, "epoch": 4794} {"train_loss": -26.792163848876953, "global_step": 397955, "epoch": 4794} {"train_loss": -26.985815048217773, "global_step": 397956, "epoch": 4794} {"train_loss": -26.859481811523438, "global_step": 397957, "epoch": 4794} {"train_loss": -26.6160888671875, "global_step": 397958, "epoch": 4794} {"train_loss": -27.004291534423828, "global_step": 397959, "epoch": 4794} {"train_loss": -26.523223876953125, "global_step": 397960, "epoch": 4794} {"train_loss": -26.522083282470703, "global_step": 397961, "epoch": 4794} {"train_loss": -26.565439224243164, "global_step": 397962, "epoch": 4794} {"train_loss": -26.592620849609375, "global_step": 397963, "epoch": 4794} {"train_loss": -26.600967407226562, "global_step": 397964, "epoch": 4794} {"train_loss": -26.592199325561523, "global_step": 397965, "epoch": 4794} {"train_loss": -26.734121322631836, "global_step": 397966, "epoch": 4794} {"train_loss": -26.636220932006836, "global_step": 397967, "epoch": 4794} {"train_loss": -26.473020553588867, "global_step": 397968, "epoch": 4794} {"train_loss": -26.975238800048828, "global_step": 397969, "epoch": 4794} {"train_loss": -26.753870010375977, "global_step": 397970, "epoch": 4794} {"train_loss": -26.746856689453125, "global_step": 397971, "epoch": 4794} {"train_loss": -26.707889556884766, "global_step": 397972, "epoch": 4794} {"train_loss": -26.71742820739746, "global_step": 397973, "epoch": 4794} {"train_loss": -26.590869903564453, "global_step": 397974, "epoch": 4794} {"train_loss": -26.80024528503418, "global_step": 397975, "epoch": 4794} {"train_loss": -26.34392738342285, "global_step": 397976, "epoch": 4794} {"train_loss": -26.53130531311035, "global_step": 397977, "epoch": 4794} {"train_loss": -26.100391387939453, "global_step": 397978, "epoch": 4794} {"train_loss": -25.883899688720703, "global_step": 397979, "epoch": 4794} {"train_loss": -25.166921615600586, "global_step": 397980, "epoch": 4794} {"train_loss": -23.39190673828125, "global_step": 397981, "epoch": 4794} {"train_loss": -24.1319522857666, "global_step": 397982, "epoch": 4794} {"train_loss": -25.893020629882812, "global_step": 397983, "epoch": 4794} {"train_loss": -26.388040473662226, "global_step": 397984, "epoch": 4794, "val_loss": 6591208.0} {"train_loss": -24.868120193481445, "global_step": 397985, "epoch": 4795} {"train_loss": -24.888402938842773, "global_step": 397986, "epoch": 4795} {"train_loss": -24.418609619140625, "global_step": 397987, "epoch": 4795} {"train_loss": -25.121891021728516, "global_step": 397988, "epoch": 4795} {"train_loss": -24.5590877532959, "global_step": 397989, "epoch": 4795} {"train_loss": -25.262100219726562, "global_step": 397990, "epoch": 4795} {"train_loss": -25.379533767700195, "global_step": 397991, "epoch": 4795} {"train_loss": -25.6097412109375, "global_step": 397992, "epoch": 4795} {"train_loss": -25.60024070739746, "global_step": 397993, "epoch": 4795} {"train_loss": -25.850927352905273, "global_step": 397994, "epoch": 4795} {"train_loss": -25.592248916625977, "global_step": 397995, "epoch": 4795} {"train_loss": -25.690982818603516, "global_step": 397996, "epoch": 4795} {"train_loss": -25.928762435913086, "global_step": 397997, "epoch": 4795} {"train_loss": -25.73919677734375, "global_step": 397998, "epoch": 4795} {"train_loss": -25.59480094909668, "global_step": 397999, "epoch": 4795} {"train_loss": -25.952194213867188, "global_step": 398000, "epoch": 4795} {"train_loss": -25.72586441040039, "global_step": 398001, "epoch": 4795} {"train_loss": -25.984289169311523, "global_step": 398002, "epoch": 4795} {"train_loss": -26.075510025024414, "global_step": 398003, "epoch": 4795} {"train_loss": -25.800573348999023, "global_step": 398004, "epoch": 4795} {"train_loss": -25.930484771728516, "global_step": 398005, "epoch": 4795} {"train_loss": -25.975244522094727, "global_step": 398006, "epoch": 4795} {"train_loss": -26.06928825378418, "global_step": 398007, "epoch": 4795} {"train_loss": -26.22089958190918, "global_step": 398008, "epoch": 4795} {"train_loss": -26.437849044799805, "global_step": 398009, "epoch": 4795} {"train_loss": -26.205785751342773, "global_step": 398010, "epoch": 4795} {"train_loss": -26.203113555908203, "global_step": 398011, "epoch": 4795} {"train_loss": -26.39466667175293, "global_step": 398012, "epoch": 4795} {"train_loss": -26.441755294799805, "global_step": 398013, "epoch": 4795} {"train_loss": -26.592121124267578, "global_step": 398014, "epoch": 4795} {"train_loss": -26.35702896118164, "global_step": 398015, "epoch": 4795} {"train_loss": -26.731367111206055, "global_step": 398016, "epoch": 4795} {"train_loss": -26.62457847595215, "global_step": 398017, "epoch": 4795} {"train_loss": -26.367725372314453, "global_step": 398018, "epoch": 4795} {"train_loss": -26.435388565063477, "global_step": 398019, "epoch": 4795} {"train_loss": -26.57887077331543, "global_step": 398020, "epoch": 4795} {"train_loss": -26.454391479492188, "global_step": 398021, "epoch": 4795} {"train_loss": -26.621479034423828, "global_step": 398022, "epoch": 4795} {"train_loss": -26.640064239501953, "global_step": 398023, "epoch": 4795} {"train_loss": -26.735273361206055, "global_step": 398024, "epoch": 4795} {"train_loss": -26.645124435424805, "global_step": 398025, "epoch": 4795} {"train_loss": -26.6672306060791, "global_step": 398026, "epoch": 4795} {"train_loss": -26.61993980407715, "global_step": 398027, "epoch": 4795} {"train_loss": -26.4553279876709, "global_step": 398028, "epoch": 4795} {"train_loss": -26.518171310424805, "global_step": 398029, "epoch": 4795} {"train_loss": -26.304168701171875, "global_step": 398030, "epoch": 4795} {"train_loss": -26.67030143737793, "global_step": 398031, "epoch": 4795} {"train_loss": -26.85310173034668, "global_step": 398032, "epoch": 4795} {"train_loss": -26.918594360351562, "global_step": 398033, "epoch": 4795} {"train_loss": -26.900089263916016, "global_step": 398034, "epoch": 4795} {"train_loss": -26.860748291015625, "global_step": 398035, "epoch": 4795} {"train_loss": -26.7703914642334, "global_step": 398036, "epoch": 4795} {"train_loss": -27.17213249206543, "global_step": 398037, "epoch": 4795} {"train_loss": -26.85664176940918, "global_step": 398038, "epoch": 4795} {"train_loss": -26.6921329498291, "global_step": 398039, "epoch": 4795} {"train_loss": -26.595014572143555, "global_step": 398040, "epoch": 4795} {"train_loss": -26.8852596282959, "global_step": 398041, "epoch": 4795} {"train_loss": -26.839935302734375, "global_step": 398042, "epoch": 4795} {"train_loss": -26.482065200805664, "global_step": 398043, "epoch": 4795} {"train_loss": -26.6899356842041, "global_step": 398044, "epoch": 4795} {"train_loss": -26.670108795166016, "global_step": 398045, "epoch": 4795} {"train_loss": -26.54421043395996, "global_step": 398046, "epoch": 4795} {"train_loss": -26.424814224243164, "global_step": 398047, "epoch": 4795} {"train_loss": -26.16095542907715, "global_step": 398048, "epoch": 4795} {"train_loss": -26.13532066345215, "global_step": 398049, "epoch": 4795} {"train_loss": -25.69236183166504, "global_step": 398050, "epoch": 4795} {"train_loss": -26.186634063720703, "global_step": 398051, "epoch": 4795} {"train_loss": -26.81524658203125, "global_step": 398052, "epoch": 4795} {"train_loss": -26.328205108642578, "global_step": 398053, "epoch": 4795} {"train_loss": -26.86063575744629, "global_step": 398054, "epoch": 4795} {"train_loss": -26.60845375061035, "global_step": 398055, "epoch": 4795} {"train_loss": -26.658960342407227, "global_step": 398056, "epoch": 4795} {"train_loss": -26.8449649810791, "global_step": 398057, "epoch": 4795} {"train_loss": -26.35821533203125, "global_step": 398058, "epoch": 4795} {"train_loss": -26.401691436767578, "global_step": 398059, "epoch": 4795} {"train_loss": -26.33148193359375, "global_step": 398060, "epoch": 4795} {"train_loss": -26.764623641967773, "global_step": 398061, "epoch": 4795} {"train_loss": -26.728260040283203, "global_step": 398062, "epoch": 4795} {"train_loss": -26.368579864501953, "global_step": 398063, "epoch": 4795} {"train_loss": -26.497751235961914, "global_step": 398064, "epoch": 4795} {"train_loss": -26.717529296875, "global_step": 398065, "epoch": 4795} {"train_loss": -26.782928466796875, "global_step": 398066, "epoch": 4795} {"train_loss": -26.28001295802105, "global_step": 398067, "epoch": 4795, "val_loss": 6627166.5} {"train_loss": -25.547361373901367, "global_step": 398068, "epoch": 4796} {"train_loss": -25.84621238708496, "global_step": 398069, "epoch": 4796} {"train_loss": -26.511215209960938, "global_step": 398070, "epoch": 4796} {"train_loss": -26.053791046142578, "global_step": 398071, "epoch": 4796} {"train_loss": -26.399139404296875, "global_step": 398072, "epoch": 4796} {"train_loss": -26.008535385131836, "global_step": 398073, "epoch": 4796} {"train_loss": -25.970930099487305, "global_step": 398074, "epoch": 4796} {"train_loss": -26.409015655517578, "global_step": 398075, "epoch": 4796} {"train_loss": -26.05025291442871, "global_step": 398076, "epoch": 4796} {"train_loss": -26.522558212280273, "global_step": 398077, "epoch": 4796} {"train_loss": -26.16949462890625, "global_step": 398078, "epoch": 4796} {"train_loss": -26.133743286132812, "global_step": 398079, "epoch": 4796} {"train_loss": -26.398359298706055, "global_step": 398080, "epoch": 4796} {"train_loss": -26.035669326782227, "global_step": 398081, "epoch": 4796} {"train_loss": -26.277210235595703, "global_step": 398082, "epoch": 4796} {"train_loss": -26.255308151245117, "global_step": 398083, "epoch": 4796} {"train_loss": -26.459863662719727, "global_step": 398084, "epoch": 4796} {"train_loss": -26.593109130859375, "global_step": 398085, "epoch": 4796} {"train_loss": -26.928363800048828, "global_step": 398086, "epoch": 4796} {"train_loss": -26.86219596862793, "global_step": 398087, "epoch": 4796} {"train_loss": -26.53938102722168, "global_step": 398088, "epoch": 4796} {"train_loss": -26.51093864440918, "global_step": 398089, "epoch": 4796} {"train_loss": -26.60515785217285, "global_step": 398090, "epoch": 4796} {"train_loss": -26.584394454956055, "global_step": 398091, "epoch": 4796} {"train_loss": -26.82732582092285, "global_step": 398092, "epoch": 4796} {"train_loss": -26.899377822875977, "global_step": 398093, "epoch": 4796} {"train_loss": -26.630783081054688, "global_step": 398094, "epoch": 4796} {"train_loss": -26.680578231811523, "global_step": 398095, "epoch": 4796} {"train_loss": -26.34535789489746, "global_step": 398096, "epoch": 4796} {"train_loss": -26.794652938842773, "global_step": 398097, "epoch": 4796} {"train_loss": -26.55936050415039, "global_step": 398098, "epoch": 4796} {"train_loss": -26.66132926940918, "global_step": 398099, "epoch": 4796} {"train_loss": -26.73587989807129, "global_step": 398100, "epoch": 4796} {"train_loss": -26.714319229125977, "global_step": 398101, "epoch": 4796} {"train_loss": -25.95704460144043, "global_step": 398102, "epoch": 4796} {"train_loss": -26.771133422851562, "global_step": 398103, "epoch": 4796} {"train_loss": -26.653339385986328, "global_step": 398104, "epoch": 4796} {"train_loss": -26.746402740478516, "global_step": 398105, "epoch": 4796} {"train_loss": -27.0832576751709, "global_step": 398106, "epoch": 4796} {"train_loss": -26.37360191345215, "global_step": 398107, "epoch": 4796} {"train_loss": -26.43780517578125, "global_step": 398108, "epoch": 4796} {"train_loss": -26.340652465820312, "global_step": 398109, "epoch": 4796} {"train_loss": -26.48297119140625, "global_step": 398110, "epoch": 4796} {"train_loss": -26.465909957885742, "global_step": 398111, "epoch": 4796} {"train_loss": -26.311237335205078, "global_step": 398112, "epoch": 4796} {"train_loss": -26.596643447875977, "global_step": 398113, "epoch": 4796} {"train_loss": -26.84757423400879, "global_step": 398114, "epoch": 4796} {"train_loss": -26.49786949157715, "global_step": 398115, "epoch": 4796} {"train_loss": -26.16684913635254, "global_step": 398116, "epoch": 4796} {"train_loss": -26.159881591796875, "global_step": 398117, "epoch": 4796} {"train_loss": -26.41890525817871, "global_step": 398118, "epoch": 4796} {"train_loss": -26.737232208251953, "global_step": 398119, "epoch": 4796} {"train_loss": -26.596601486206055, "global_step": 398120, "epoch": 4796} {"train_loss": -26.575971603393555, "global_step": 398121, "epoch": 4796} {"train_loss": -26.73703956604004, "global_step": 398122, "epoch": 4796} {"train_loss": -26.62245750427246, "global_step": 398123, "epoch": 4796} {"train_loss": -26.632776260375977, "global_step": 398124, "epoch": 4796} {"train_loss": -26.745182037353516, "global_step": 398125, "epoch": 4796} {"train_loss": -27.225269317626953, "global_step": 398126, "epoch": 4796} {"train_loss": -26.77205467224121, "global_step": 398127, "epoch": 4796} {"train_loss": -26.803754806518555, "global_step": 398128, "epoch": 4796} {"train_loss": -26.862791061401367, "global_step": 398129, "epoch": 4796} {"train_loss": -26.8729248046875, "global_step": 398130, "epoch": 4796} {"train_loss": -27.037267684936523, "global_step": 398131, "epoch": 4796} {"train_loss": -26.286283493041992, "global_step": 398132, "epoch": 4796} {"train_loss": -26.575992584228516, "global_step": 398133, "epoch": 4796} {"train_loss": -26.63055992126465, "global_step": 398134, "epoch": 4796} {"train_loss": -26.66996192932129, "global_step": 398135, "epoch": 4796} {"train_loss": -26.728445053100586, "global_step": 398136, "epoch": 4796} {"train_loss": -26.633544921875, "global_step": 398137, "epoch": 4796} {"train_loss": -26.92205810546875, "global_step": 398138, "epoch": 4796} {"train_loss": -26.847864151000977, "global_step": 398139, "epoch": 4796} {"train_loss": -27.002527236938477, "global_step": 398140, "epoch": 4796} {"train_loss": -26.543212890625, "global_step": 398141, "epoch": 4796} {"train_loss": -26.972003936767578, "global_step": 398142, "epoch": 4796} {"train_loss": -26.949356079101562, "global_step": 398143, "epoch": 4796} {"train_loss": -26.919519424438477, "global_step": 398144, "epoch": 4796} {"train_loss": -26.96375846862793, "global_step": 398145, "epoch": 4796} {"train_loss": -26.517669677734375, "global_step": 398146, "epoch": 4796} {"train_loss": -26.792133331298828, "global_step": 398147, "epoch": 4796} {"train_loss": -26.809799194335938, "global_step": 398148, "epoch": 4796} {"train_loss": -27.01900291442871, "global_step": 398149, "epoch": 4796} {"train_loss": -26.577278918530567, "global_step": 398150, "epoch": 4796, "val_loss": 6627304.0} {"train_loss": -25.6591796875, "global_step": 398151, "epoch": 4797} {"train_loss": -23.90021514892578, "global_step": 398152, "epoch": 4797} {"train_loss": -24.27190589904785, "global_step": 398153, "epoch": 4797} {"train_loss": -25.829065322875977, "global_step": 398154, "epoch": 4797} {"train_loss": -25.8346004486084, "global_step": 398155, "epoch": 4797} {"train_loss": -24.923748016357422, "global_step": 398156, "epoch": 4797} {"train_loss": -26.026870727539062, "global_step": 398157, "epoch": 4797} {"train_loss": -25.88331413269043, "global_step": 398158, "epoch": 4797} {"train_loss": -26.065948486328125, "global_step": 398159, "epoch": 4797} {"train_loss": -25.92677879333496, "global_step": 398160, "epoch": 4797} {"train_loss": -25.512548446655273, "global_step": 398161, "epoch": 4797} {"train_loss": -26.25275993347168, "global_step": 398162, "epoch": 4797} {"train_loss": -26.241315841674805, "global_step": 398163, "epoch": 4797} {"train_loss": -26.375757217407227, "global_step": 398164, "epoch": 4797} {"train_loss": -25.982257843017578, "global_step": 398165, "epoch": 4797} {"train_loss": -25.915929794311523, "global_step": 398166, "epoch": 4797} {"train_loss": -26.61537742614746, "global_step": 398167, "epoch": 4797} {"train_loss": -26.24446678161621, "global_step": 398168, "epoch": 4797} {"train_loss": -26.00434684753418, "global_step": 398169, "epoch": 4797} {"train_loss": -26.0986328125, "global_step": 398170, "epoch": 4797} {"train_loss": -26.026569366455078, "global_step": 398171, "epoch": 4797} {"train_loss": -25.914203643798828, "global_step": 398172, "epoch": 4797} {"train_loss": -26.649890899658203, "global_step": 398173, "epoch": 4797} {"train_loss": -26.572858810424805, "global_step": 398174, "epoch": 4797} {"train_loss": -26.264066696166992, "global_step": 398175, "epoch": 4797} {"train_loss": -26.40338706970215, "global_step": 398176, "epoch": 4797} {"train_loss": -26.110172271728516, "global_step": 398177, "epoch": 4797} {"train_loss": -26.260272979736328, "global_step": 398178, "epoch": 4797} {"train_loss": -26.256250381469727, "global_step": 398179, "epoch": 4797} {"train_loss": -26.350879669189453, "global_step": 398180, "epoch": 4797} {"train_loss": -26.6113224029541, "global_step": 398181, "epoch": 4797} {"train_loss": -26.453296661376953, "global_step": 398182, "epoch": 4797} {"train_loss": -26.1972599029541, "global_step": 398183, "epoch": 4797} {"train_loss": -26.497364044189453, "global_step": 398184, "epoch": 4797} {"train_loss": -26.5710391998291, "global_step": 398185, "epoch": 4797} {"train_loss": -26.46076774597168, "global_step": 398186, "epoch": 4797} {"train_loss": -26.968759536743164, "global_step": 398187, "epoch": 4797} {"train_loss": -26.44874382019043, "global_step": 398188, "epoch": 4797} {"train_loss": -26.722381591796875, "global_step": 398189, "epoch": 4797} {"train_loss": -26.790729522705078, "global_step": 398190, "epoch": 4797} {"train_loss": -26.556974411010742, "global_step": 398191, "epoch": 4797} {"train_loss": -26.227460861206055, "global_step": 398192, "epoch": 4797} {"train_loss": -26.667804718017578, "global_step": 398193, "epoch": 4797} {"train_loss": -26.610864639282227, "global_step": 398194, "epoch": 4797} {"train_loss": -26.27870750427246, "global_step": 398195, "epoch": 4797} {"train_loss": -26.552051544189453, "global_step": 398196, "epoch": 4797} {"train_loss": -26.428064346313477, "global_step": 398197, "epoch": 4797} {"train_loss": -26.532758712768555, "global_step": 398198, "epoch": 4797} {"train_loss": -26.451614379882812, "global_step": 398199, "epoch": 4797} {"train_loss": -26.383472442626953, "global_step": 398200, "epoch": 4797} {"train_loss": -26.579010009765625, "global_step": 398201, "epoch": 4797} {"train_loss": -26.985198974609375, "global_step": 398202, "epoch": 4797} {"train_loss": -26.762531280517578, "global_step": 398203, "epoch": 4797} {"train_loss": -26.621442794799805, "global_step": 398204, "epoch": 4797} {"train_loss": -26.711633682250977, "global_step": 398205, "epoch": 4797} {"train_loss": -26.798725128173828, "global_step": 398206, "epoch": 4797} {"train_loss": -26.555744171142578, "global_step": 398207, "epoch": 4797} {"train_loss": -26.74335289001465, "global_step": 398208, "epoch": 4797} {"train_loss": -26.642114639282227, "global_step": 398209, "epoch": 4797} {"train_loss": -26.72113609313965, "global_step": 398210, "epoch": 4797} {"train_loss": -26.53860855102539, "global_step": 398211, "epoch": 4797} {"train_loss": -26.64997673034668, "global_step": 398212, "epoch": 4797} {"train_loss": -26.711109161376953, "global_step": 398213, "epoch": 4797} {"train_loss": -26.6314754486084, "global_step": 398214, "epoch": 4797} {"train_loss": -26.62849998474121, "global_step": 398215, "epoch": 4797} {"train_loss": -26.86855125427246, "global_step": 398216, "epoch": 4797} {"train_loss": -26.805994033813477, "global_step": 398217, "epoch": 4797} {"train_loss": -26.71441078186035, "global_step": 398218, "epoch": 4797} {"train_loss": -26.775659561157227, "global_step": 398219, "epoch": 4797} {"train_loss": -26.43953514099121, "global_step": 398220, "epoch": 4797} {"train_loss": -26.866077423095703, "global_step": 398221, "epoch": 4797} {"train_loss": -26.721466064453125, "global_step": 398222, "epoch": 4797} {"train_loss": -26.94769859313965, "global_step": 398223, "epoch": 4797} {"train_loss": -26.82179069519043, "global_step": 398224, "epoch": 4797} {"train_loss": -26.903417587280273, "global_step": 398225, "epoch": 4797} {"train_loss": -26.736164093017578, "global_step": 398226, "epoch": 4797} {"train_loss": -26.96698570251465, "global_step": 398227, "epoch": 4797} {"train_loss": -26.632699966430664, "global_step": 398228, "epoch": 4797} {"train_loss": -26.65553092956543, "global_step": 398229, "epoch": 4797} {"train_loss": -26.829954147338867, "global_step": 398230, "epoch": 4797} {"train_loss": -26.474903106689453, "global_step": 398231, "epoch": 4797} {"train_loss": -26.63352394104004, "global_step": 398232, "epoch": 4797} {"train_loss": -26.381815806928888, "global_step": 398233, "epoch": 4797, "val_loss": 6652744.5} {"train_loss": -25.3692569732666, "global_step": 398234, "epoch": 4798} {"train_loss": -23.865522384643555, "global_step": 398235, "epoch": 4798} {"train_loss": -24.893192291259766, "global_step": 398236, "epoch": 4798} {"train_loss": -25.833209991455078, "global_step": 398237, "epoch": 4798} {"train_loss": -25.216053009033203, "global_step": 398238, "epoch": 4798} {"train_loss": -25.820301055908203, "global_step": 398239, "epoch": 4798} {"train_loss": -25.811689376831055, "global_step": 398240, "epoch": 4798} {"train_loss": -25.7248477935791, "global_step": 398241, "epoch": 4798} {"train_loss": -25.811277389526367, "global_step": 398242, "epoch": 4798} {"train_loss": -25.7431640625, "global_step": 398243, "epoch": 4798} {"train_loss": -25.49805450439453, "global_step": 398244, "epoch": 4798} {"train_loss": -25.90985679626465, "global_step": 398245, "epoch": 4798} {"train_loss": -25.456317901611328, "global_step": 398246, "epoch": 4798} {"train_loss": -25.702991485595703, "global_step": 398247, "epoch": 4798} {"train_loss": -25.731948852539062, "global_step": 398248, "epoch": 4798} {"train_loss": -25.733474731445312, "global_step": 398249, "epoch": 4798} {"train_loss": -25.637731552124023, "global_step": 398250, "epoch": 4798} {"train_loss": -26.079675674438477, "global_step": 398251, "epoch": 4798} {"train_loss": -25.83829689025879, "global_step": 398252, "epoch": 4798} {"train_loss": -25.592830657958984, "global_step": 398253, "epoch": 4798} {"train_loss": -26.050500869750977, "global_step": 398254, "epoch": 4798} {"train_loss": -26.056884765625, "global_step": 398255, "epoch": 4798} {"train_loss": -25.592121124267578, "global_step": 398256, "epoch": 4798} {"train_loss": -26.388797760009766, "global_step": 398257, "epoch": 4798} {"train_loss": -25.869781494140625, "global_step": 398258, "epoch": 4798} {"train_loss": -26.2401180267334, "global_step": 398259, "epoch": 4798} {"train_loss": -26.10297966003418, "global_step": 398260, "epoch": 4798} {"train_loss": -26.03705406188965, "global_step": 398261, "epoch": 4798} {"train_loss": -26.169218063354492, "global_step": 398262, "epoch": 4798} {"train_loss": -26.26434326171875, "global_step": 398263, "epoch": 4798} {"train_loss": -26.271223068237305, "global_step": 398264, "epoch": 4798} {"train_loss": -26.51996421813965, "global_step": 398265, "epoch": 4798} {"train_loss": -26.3698673248291, "global_step": 398266, "epoch": 4798} {"train_loss": -26.141803741455078, "global_step": 398267, "epoch": 4798} {"train_loss": -26.59124183654785, "global_step": 398268, "epoch": 4798} {"train_loss": -26.524423599243164, "global_step": 398269, "epoch": 4798} {"train_loss": -26.581518173217773, "global_step": 398270, "epoch": 4798} {"train_loss": -26.5894775390625, "global_step": 398271, "epoch": 4798} {"train_loss": -26.569461822509766, "global_step": 398272, "epoch": 4798} {"train_loss": -26.515851974487305, "global_step": 398273, "epoch": 4798} {"train_loss": -26.633020401000977, "global_step": 398274, "epoch": 4798} {"train_loss": -26.63114356994629, "global_step": 398275, "epoch": 4798} {"train_loss": -26.7252254486084, "global_step": 398276, "epoch": 4798} {"train_loss": -26.875019073486328, "global_step": 398277, "epoch": 4798} {"train_loss": -26.44821548461914, "global_step": 398278, "epoch": 4798} {"train_loss": -26.57282066345215, "global_step": 398279, "epoch": 4798} {"train_loss": -26.515838623046875, "global_step": 398280, "epoch": 4798} {"train_loss": -26.956335067749023, "global_step": 398281, "epoch": 4798} {"train_loss": -26.52739906311035, "global_step": 398282, "epoch": 4798} {"train_loss": -26.838544845581055, "global_step": 398283, "epoch": 4798} {"train_loss": -26.617664337158203, "global_step": 398284, "epoch": 4798} {"train_loss": -27.00860595703125, "global_step": 398285, "epoch": 4798} {"train_loss": -26.52552604675293, "global_step": 398286, "epoch": 4798} {"train_loss": -27.007360458374023, "global_step": 398287, "epoch": 4798} {"train_loss": -26.92405128479004, "global_step": 398288, "epoch": 4798} {"train_loss": -26.6710147857666, "global_step": 398289, "epoch": 4798} {"train_loss": -26.553503036499023, "global_step": 398290, "epoch": 4798} {"train_loss": -26.727155685424805, "global_step": 398291, "epoch": 4798} {"train_loss": -26.694055557250977, "global_step": 398292, "epoch": 4798} {"train_loss": -26.90690040588379, "global_step": 398293, "epoch": 4798} {"train_loss": -26.819059371948242, "global_step": 398294, "epoch": 4798} {"train_loss": -26.784000396728516, "global_step": 398295, "epoch": 4798} {"train_loss": -26.289350509643555, "global_step": 398296, "epoch": 4798} {"train_loss": -26.554813385009766, "global_step": 398297, "epoch": 4798} {"train_loss": -26.349409103393555, "global_step": 398298, "epoch": 4798} {"train_loss": -26.80307388305664, "global_step": 398299, "epoch": 4798} {"train_loss": -26.410154342651367, "global_step": 398300, "epoch": 4798} {"train_loss": -26.68024253845215, "global_step": 398301, "epoch": 4798} {"train_loss": -26.65938377380371, "global_step": 398302, "epoch": 4798} {"train_loss": -26.687335968017578, "global_step": 398303, "epoch": 4798} {"train_loss": -26.51236915588379, "global_step": 398304, "epoch": 4798} {"train_loss": -26.48428726196289, "global_step": 398305, "epoch": 4798} {"train_loss": -26.63935661315918, "global_step": 398306, "epoch": 4798} {"train_loss": -26.305646896362305, "global_step": 398307, "epoch": 4798} {"train_loss": -26.841094970703125, "global_step": 398308, "epoch": 4798} {"train_loss": -26.668439865112305, "global_step": 398309, "epoch": 4798} {"train_loss": -26.607004165649414, "global_step": 398310, "epoch": 4798} {"train_loss": -26.634490966796875, "global_step": 398311, "epoch": 4798} {"train_loss": -26.615921020507812, "global_step": 398312, "epoch": 4798} {"train_loss": -26.87745475769043, "global_step": 398313, "epoch": 4798} {"train_loss": -26.62005615234375, "global_step": 398314, "epoch": 4798} {"train_loss": -26.544540405273438, "global_step": 398315, "epoch": 4798} {"train_loss": -26.292672467519, "global_step": 398316, "epoch": 4798, "val_loss": 6624660.0} {"train_loss": -25.688085556030273, "global_step": 398317, "epoch": 4799} {"train_loss": -25.904748916625977, "global_step": 398318, "epoch": 4799} {"train_loss": -26.29619789123535, "global_step": 398319, "epoch": 4799} {"train_loss": -25.959325790405273, "global_step": 398320, "epoch": 4799} {"train_loss": -26.385068893432617, "global_step": 398321, "epoch": 4799} {"train_loss": -25.743408203125, "global_step": 398322, "epoch": 4799} {"train_loss": -25.869062423706055, "global_step": 398323, "epoch": 4799} {"train_loss": -25.742420196533203, "global_step": 398324, "epoch": 4799} {"train_loss": -25.908369064331055, "global_step": 398325, "epoch": 4799} {"train_loss": -25.83930778503418, "global_step": 398326, "epoch": 4799} {"train_loss": -25.923934936523438, "global_step": 398327, "epoch": 4799} {"train_loss": -26.069616317749023, "global_step": 398328, "epoch": 4799} {"train_loss": -26.077713012695312, "global_step": 398329, "epoch": 4799} {"train_loss": -26.127119064331055, "global_step": 398330, "epoch": 4799} {"train_loss": -26.2971248626709, "global_step": 398331, "epoch": 4799} {"train_loss": -26.356281280517578, "global_step": 398332, "epoch": 4799} {"train_loss": -25.889911651611328, "global_step": 398333, "epoch": 4799} {"train_loss": -26.451684951782227, "global_step": 398334, "epoch": 4799} {"train_loss": -26.14251136779785, "global_step": 398335, "epoch": 4799} {"train_loss": -26.45636558532715, "global_step": 398336, "epoch": 4799} {"train_loss": -26.717893600463867, "global_step": 398337, "epoch": 4799} {"train_loss": -25.95597267150879, "global_step": 398338, "epoch": 4799} {"train_loss": -26.64874267578125, "global_step": 398339, "epoch": 4799} {"train_loss": -26.405902862548828, "global_step": 398340, "epoch": 4799} {"train_loss": -26.4677791595459, "global_step": 398341, "epoch": 4799} {"train_loss": -26.290754318237305, "global_step": 398342, "epoch": 4799} {"train_loss": -26.867895126342773, "global_step": 398343, "epoch": 4799} {"train_loss": -26.492557525634766, "global_step": 398344, "epoch": 4799} {"train_loss": -26.696552276611328, "global_step": 398345, "epoch": 4799} {"train_loss": -26.742055892944336, "global_step": 398346, "epoch": 4799} {"train_loss": -26.186548233032227, "global_step": 398347, "epoch": 4799} {"train_loss": -26.5731201171875, "global_step": 398348, "epoch": 4799} {"train_loss": -26.699567794799805, "global_step": 398349, "epoch": 4799} {"train_loss": -26.425893783569336, "global_step": 398350, "epoch": 4799} {"train_loss": -26.717309951782227, "global_step": 398351, "epoch": 4799} {"train_loss": -26.724573135375977, "global_step": 398352, "epoch": 4799} {"train_loss": -26.542570114135742, "global_step": 398353, "epoch": 4799} {"train_loss": -26.41387367248535, "global_step": 398354, "epoch": 4799} {"train_loss": -26.55763053894043, "global_step": 398355, "epoch": 4799} {"train_loss": -26.92355728149414, "global_step": 398356, "epoch": 4799} {"train_loss": -26.5815486907959, "global_step": 398357, "epoch": 4799} {"train_loss": -26.70635414123535, "global_step": 398358, "epoch": 4799} {"train_loss": -26.555419921875, "global_step": 398359, "epoch": 4799} {"train_loss": -27.042936325073242, "global_step": 398360, "epoch": 4799} {"train_loss": -26.607690811157227, "global_step": 398361, "epoch": 4799} {"train_loss": -26.8581485748291, "global_step": 398362, "epoch": 4799} {"train_loss": -26.5488338470459, "global_step": 398363, "epoch": 4799} {"train_loss": -26.944843292236328, "global_step": 398364, "epoch": 4799} {"train_loss": -26.637643814086914, "global_step": 398365, "epoch": 4799} {"train_loss": -27.032800674438477, "global_step": 398366, "epoch": 4799} {"train_loss": -26.891101837158203, "global_step": 398367, "epoch": 4799} {"train_loss": -27.143402099609375, "global_step": 398368, "epoch": 4799} {"train_loss": -26.486616134643555, "global_step": 398369, "epoch": 4799} {"train_loss": -26.743698120117188, "global_step": 398370, "epoch": 4799} {"train_loss": -26.720706939697266, "global_step": 398371, "epoch": 4799} {"train_loss": -26.789722442626953, "global_step": 398372, "epoch": 4799} {"train_loss": -27.17559814453125, "global_step": 398373, "epoch": 4799} {"train_loss": -26.492910385131836, "global_step": 398374, "epoch": 4799} {"train_loss": -26.795166015625, "global_step": 398375, "epoch": 4799} {"train_loss": -26.910602569580078, "global_step": 398376, "epoch": 4799} {"train_loss": -26.496692657470703, "global_step": 398377, "epoch": 4799} {"train_loss": -26.722265243530273, "global_step": 398378, "epoch": 4799} {"train_loss": -26.031335830688477, "global_step": 398379, "epoch": 4799} {"train_loss": -25.98467445373535, "global_step": 398380, "epoch": 4799} {"train_loss": -26.660322189331055, "global_step": 398381, "epoch": 4799} {"train_loss": -26.593708038330078, "global_step": 398382, "epoch": 4799} {"train_loss": -26.775999069213867, "global_step": 398383, "epoch": 4799} {"train_loss": -26.245569229125977, "global_step": 398384, "epoch": 4799} {"train_loss": -26.23822021484375, "global_step": 398385, "epoch": 4799} {"train_loss": -26.186071395874023, "global_step": 398386, "epoch": 4799} {"train_loss": -26.343427658081055, "global_step": 398387, "epoch": 4799} {"train_loss": -26.335712432861328, "global_step": 398388, "epoch": 4799} {"train_loss": -26.700458526611328, "global_step": 398389, "epoch": 4799} {"train_loss": -26.358123779296875, "global_step": 398390, "epoch": 4799} {"train_loss": -26.52906608581543, "global_step": 398391, "epoch": 4799} {"train_loss": -26.165191650390625, "global_step": 398392, "epoch": 4799} {"train_loss": -26.5943546295166, "global_step": 398393, "epoch": 4799} {"train_loss": -26.66448402404785, "global_step": 398394, "epoch": 4799} {"train_loss": -26.724197387695312, "global_step": 398395, "epoch": 4799} {"train_loss": -26.664188385009766, "global_step": 398396, "epoch": 4799} {"train_loss": -26.661645889282227, "global_step": 398397, "epoch": 4799} {"train_loss": -26.71917152404785, "global_step": 398398, "epoch": 4799} {"train_loss": -26.467010153345313, "global_step": 398399, "epoch": 4799, "val_loss": 6825160.0} {"train_loss": -25.4035587310791, "global_step": 398400, "epoch": 4800} {"train_loss": -25.951679229736328, "global_step": 398401, "epoch": 4800} {"train_loss": -25.665449142456055, "global_step": 398402, "epoch": 4800} {"train_loss": -25.8725643157959, "global_step": 398403, "epoch": 4800} {"train_loss": -26.0211124420166, "global_step": 398404, "epoch": 4800} {"train_loss": -25.85064125061035, "global_step": 398405, "epoch": 4800} {"train_loss": -26.13301658630371, "global_step": 398406, "epoch": 4800} {"train_loss": -25.7413330078125, "global_step": 398407, "epoch": 4800} {"train_loss": -25.85755729675293, "global_step": 398408, "epoch": 4800} {"train_loss": -25.8315486907959, "global_step": 398409, "epoch": 4800} {"train_loss": -26.061370849609375, "global_step": 398410, "epoch": 4800} {"train_loss": -26.043664932250977, "global_step": 398411, "epoch": 4800} {"train_loss": -26.03122329711914, "global_step": 398412, "epoch": 4800} {"train_loss": -26.21173667907715, "global_step": 398413, "epoch": 4800} {"train_loss": -25.99933433532715, "global_step": 398414, "epoch": 4800} {"train_loss": -26.7549991607666, "global_step": 398415, "epoch": 4800} {"train_loss": -26.344228744506836, "global_step": 398416, "epoch": 4800} {"train_loss": -26.429418563842773, "global_step": 398417, "epoch": 4800} {"train_loss": -26.46573829650879, "global_step": 398418, "epoch": 4800} {"train_loss": -26.22124671936035, "global_step": 398419, "epoch": 4800} {"train_loss": -26.492734909057617, "global_step": 398420, "epoch": 4800} {"train_loss": -26.459125518798828, "global_step": 398421, "epoch": 4800} {"train_loss": -26.55781364440918, "global_step": 398422, "epoch": 4800} {"train_loss": -26.54608154296875, "global_step": 398423, "epoch": 4800} {"train_loss": -26.58341407775879, "global_step": 398424, "epoch": 4800} {"train_loss": -26.324277877807617, "global_step": 398425, "epoch": 4800} {"train_loss": -26.714914321899414, "global_step": 398426, "epoch": 4800} {"train_loss": -26.7180233001709, "global_step": 398427, "epoch": 4800} {"train_loss": -26.839466094970703, "global_step": 398428, "epoch": 4800} {"train_loss": -27.025787353515625, "global_step": 398429, "epoch": 4800} {"train_loss": -26.65586280822754, "global_step": 398430, "epoch": 4800} {"train_loss": -26.554685592651367, "global_step": 398431, "epoch": 4800} {"train_loss": -26.77910804748535, "global_step": 398432, "epoch": 4800} {"train_loss": -26.537626266479492, "global_step": 398433, "epoch": 4800} {"train_loss": -26.654478073120117, "global_step": 398434, "epoch": 4800} {"train_loss": -27.029687881469727, "global_step": 398435, "epoch": 4800} {"train_loss": -26.50345230102539, "global_step": 398436, "epoch": 4800} {"train_loss": -26.8391056060791, "global_step": 398437, "epoch": 4800} {"train_loss": -26.503507614135742, "global_step": 398438, "epoch": 4800} {"train_loss": -26.634033203125, "global_step": 398439, "epoch": 4800} {"train_loss": -27.272321701049805, "global_step": 398440, "epoch": 4800} {"train_loss": -26.509902954101562, "global_step": 398441, "epoch": 4800} {"train_loss": -26.2454891204834, "global_step": 398442, "epoch": 4800} {"train_loss": -26.439802169799805, "global_step": 398443, "epoch": 4800} {"train_loss": -26.938690185546875, "global_step": 398444, "epoch": 4800} {"train_loss": -27.115188598632812, "global_step": 398445, "epoch": 4800} {"train_loss": -26.867273330688477, "global_step": 398446, "epoch": 4800} {"train_loss": -26.67181396484375, "global_step": 398447, "epoch": 4800} {"train_loss": -26.6219539642334, "global_step": 398448, "epoch": 4800} {"train_loss": -26.58194351196289, "global_step": 398449, "epoch": 4800} {"train_loss": -26.101547241210938, "global_step": 398450, "epoch": 4800} {"train_loss": -25.981786727905273, "global_step": 398451, "epoch": 4800} {"train_loss": -26.48012351989746, "global_step": 398452, "epoch": 4800} {"train_loss": -26.74432945251465, "global_step": 398453, "epoch": 4800} {"train_loss": -26.191213607788086, "global_step": 398454, "epoch": 4800} {"train_loss": -26.60284996032715, "global_step": 398455, "epoch": 4800} {"train_loss": -26.273712158203125, "global_step": 398456, "epoch": 4800} {"train_loss": -26.63470458984375, "global_step": 398457, "epoch": 4800} {"train_loss": -26.63547706604004, "global_step": 398458, "epoch": 4800} {"train_loss": -26.720556259155273, "global_step": 398459, "epoch": 4800} {"train_loss": -26.4370059967041, "global_step": 398460, "epoch": 4800} {"train_loss": -26.43634605407715, "global_step": 398461, "epoch": 4800} {"train_loss": -26.167987823486328, "global_step": 398462, "epoch": 4800} {"train_loss": -26.7447452545166, "global_step": 398463, "epoch": 4800} {"train_loss": -26.35529899597168, "global_step": 398464, "epoch": 4800} {"train_loss": -26.239850997924805, "global_step": 398465, "epoch": 4800} {"train_loss": -26.700092315673828, "global_step": 398466, "epoch": 4800} {"train_loss": -26.57730484008789, "global_step": 398467, "epoch": 4800} {"train_loss": -26.933868408203125, "global_step": 398468, "epoch": 4800} {"train_loss": -26.561206817626953, "global_step": 398469, "epoch": 4800} {"train_loss": -26.769739151000977, "global_step": 398470, "epoch": 4800} {"train_loss": -26.465116500854492, "global_step": 398471, "epoch": 4800} {"train_loss": -26.811084747314453, "global_step": 398472, "epoch": 4800} {"train_loss": -26.478296279907227, "global_step": 398473, "epoch": 4800} {"train_loss": -26.847126007080078, "global_step": 398474, "epoch": 4800} {"train_loss": -26.60806655883789, "global_step": 398475, "epoch": 4800} {"train_loss": -27.083988189697266, "global_step": 398476, "epoch": 4800} {"train_loss": -26.436105728149414, "global_step": 398477, "epoch": 4800} {"train_loss": -26.774463653564453, "global_step": 398478, "epoch": 4800} {"train_loss": -26.779388427734375, "global_step": 398479, "epoch": 4800} {"train_loss": -26.521753311157227, "global_step": 398480, "epoch": 4800} {"train_loss": -26.740407943725586, "global_step": 398481, "epoch": 4800} {"train_loss": -26.481828229973114, "global_step": 398482, "epoch": 4800, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.7727272727272727, "val_loss": 6685710.0} {"train_loss": -26.434696197509766, "global_step": 398483, "epoch": 4801} {"train_loss": -26.249963760375977, "global_step": 398484, "epoch": 4801} {"train_loss": -26.27825355529785, "global_step": 398485, "epoch": 4801} {"train_loss": -26.540637969970703, "global_step": 398486, "epoch": 4801} {"train_loss": -26.40781593322754, "global_step": 398487, "epoch": 4801} {"train_loss": -26.6037540435791, "global_step": 398488, "epoch": 4801} {"train_loss": -26.03021240234375, "global_step": 398489, "epoch": 4801} {"train_loss": -26.507007598876953, "global_step": 398490, "epoch": 4801} {"train_loss": -26.44671058654785, "global_step": 398491, "epoch": 4801} {"train_loss": -26.392181396484375, "global_step": 398492, "epoch": 4801} {"train_loss": -26.30426025390625, "global_step": 398493, "epoch": 4801} {"train_loss": -26.398365020751953, "global_step": 398494, "epoch": 4801} {"train_loss": -26.338354110717773, "global_step": 398495, "epoch": 4801} {"train_loss": -26.374319076538086, "global_step": 398496, "epoch": 4801} {"train_loss": -26.5075626373291, "global_step": 398497, "epoch": 4801} {"train_loss": -26.587549209594727, "global_step": 398498, "epoch": 4801} {"train_loss": -26.578144073486328, "global_step": 398499, "epoch": 4801} {"train_loss": -26.742307662963867, "global_step": 398500, "epoch": 4801} {"train_loss": -26.60699462890625, "global_step": 398501, "epoch": 4801} {"train_loss": -26.645618438720703, "global_step": 398502, "epoch": 4801} {"train_loss": -26.458093643188477, "global_step": 398503, "epoch": 4801} {"train_loss": -26.183256149291992, "global_step": 398504, "epoch": 4801} {"train_loss": -26.28964614868164, "global_step": 398505, "epoch": 4801} {"train_loss": -26.75375747680664, "global_step": 398506, "epoch": 4801} {"train_loss": -26.989179611206055, "global_step": 398507, "epoch": 4801} {"train_loss": -26.56206703186035, "global_step": 398508, "epoch": 4801} {"train_loss": -26.964130401611328, "global_step": 398509, "epoch": 4801} {"train_loss": -26.84004783630371, "global_step": 398510, "epoch": 4801} {"train_loss": -26.415027618408203, "global_step": 398511, "epoch": 4801} {"train_loss": -26.56028175354004, "global_step": 398512, "epoch": 4801} {"train_loss": -26.383258819580078, "global_step": 398513, "epoch": 4801} {"train_loss": -26.9608211517334, "global_step": 398514, "epoch": 4801} {"train_loss": -26.723424911499023, "global_step": 398515, "epoch": 4801} {"train_loss": -26.659591674804688, "global_step": 398516, "epoch": 4801} {"train_loss": -26.589435577392578, "global_step": 398517, "epoch": 4801} {"train_loss": -27.071063995361328, "global_step": 398518, "epoch": 4801} {"train_loss": -26.795713424682617, "global_step": 398519, "epoch": 4801} {"train_loss": -26.65411949157715, "global_step": 398520, "epoch": 4801} {"train_loss": -26.2862491607666, "global_step": 398521, "epoch": 4801} {"train_loss": -26.601964950561523, "global_step": 398522, "epoch": 4801} {"train_loss": -26.028181076049805, "global_step": 398523, "epoch": 4801} {"train_loss": -26.45194435119629, "global_step": 398524, "epoch": 4801} {"train_loss": -26.05306053161621, "global_step": 398525, "epoch": 4801} {"train_loss": -26.381866455078125, "global_step": 398526, "epoch": 4801} {"train_loss": -26.367034912109375, "global_step": 398527, "epoch": 4801} {"train_loss": -26.800384521484375, "global_step": 398528, "epoch": 4801} {"train_loss": -26.331785202026367, "global_step": 398529, "epoch": 4801} {"train_loss": -26.7874755859375, "global_step": 398530, "epoch": 4801} {"train_loss": -26.365015029907227, "global_step": 398531, "epoch": 4801} {"train_loss": -27.077306747436523, "global_step": 398532, "epoch": 4801} {"train_loss": -26.49329948425293, "global_step": 398533, "epoch": 4801} {"train_loss": -26.7319278717041, "global_step": 398534, "epoch": 4801} {"train_loss": -26.88309097290039, "global_step": 398535, "epoch": 4801} {"train_loss": -26.417875289916992, "global_step": 398536, "epoch": 4801} {"train_loss": -26.408796310424805, "global_step": 398537, "epoch": 4801} {"train_loss": -26.798925399780273, "global_step": 398538, "epoch": 4801} {"train_loss": -26.44769287109375, "global_step": 398539, "epoch": 4801} {"train_loss": -26.325037002563477, "global_step": 398540, "epoch": 4801} {"train_loss": -26.611021041870117, "global_step": 398541, "epoch": 4801} {"train_loss": -26.326135635375977, "global_step": 398542, "epoch": 4801} {"train_loss": -26.574106216430664, "global_step": 398543, "epoch": 4801} {"train_loss": -26.730871200561523, "global_step": 398544, "epoch": 4801} {"train_loss": -27.07954978942871, "global_step": 398545, "epoch": 4801} {"train_loss": -26.453632354736328, "global_step": 398546, "epoch": 4801} {"train_loss": -26.65874671936035, "global_step": 398547, "epoch": 4801} {"train_loss": -26.753870010375977, "global_step": 398548, "epoch": 4801} {"train_loss": -26.532190322875977, "global_step": 398549, "epoch": 4801} {"train_loss": -26.9608154296875, "global_step": 398550, "epoch": 4801} {"train_loss": -26.72553062438965, "global_step": 398551, "epoch": 4801} {"train_loss": -26.63943862915039, "global_step": 398552, "epoch": 4801} {"train_loss": -27.103931427001953, "global_step": 398553, "epoch": 4801} {"train_loss": -26.85540771484375, "global_step": 398554, "epoch": 4801} {"train_loss": -26.522729873657227, "global_step": 398555, "epoch": 4801} {"train_loss": -26.557819366455078, "global_step": 398556, "epoch": 4801} {"train_loss": -26.743268966674805, "global_step": 398557, "epoch": 4801} {"train_loss": -26.674280166625977, "global_step": 398558, "epoch": 4801} {"train_loss": -26.6258602142334, "global_step": 398559, "epoch": 4801} {"train_loss": -26.798095703125, "global_step": 398560, "epoch": 4801} {"train_loss": -26.483373641967773, "global_step": 398561, "epoch": 4801} {"train_loss": -26.636640548706055, "global_step": 398562, "epoch": 4801} {"train_loss": -27.08711051940918, "global_step": 398563, "epoch": 4801} {"train_loss": -27.385089874267578, "global_step": 398564, "epoch": 4801} {"train_loss": -26.58966036877, "global_step": 398565, "epoch": 4801, "val_loss": 6666618.0} {"train_loss": -26.61899757385254, "global_step": 398566, "epoch": 4802} {"train_loss": -26.069860458374023, "global_step": 398567, "epoch": 4802} {"train_loss": -26.460529327392578, "global_step": 398568, "epoch": 4802} {"train_loss": -25.889820098876953, "global_step": 398569, "epoch": 4802} {"train_loss": -26.405780792236328, "global_step": 398570, "epoch": 4802} {"train_loss": -26.545724868774414, "global_step": 398571, "epoch": 4802} {"train_loss": -26.343259811401367, "global_step": 398572, "epoch": 4802} {"train_loss": -26.485082626342773, "global_step": 398573, "epoch": 4802} {"train_loss": -26.42734718322754, "global_step": 398574, "epoch": 4802} {"train_loss": -26.58180046081543, "global_step": 398575, "epoch": 4802} {"train_loss": -26.55462074279785, "global_step": 398576, "epoch": 4802} {"train_loss": -26.461252212524414, "global_step": 398577, "epoch": 4802} {"train_loss": -26.378759384155273, "global_step": 398578, "epoch": 4802} {"train_loss": -26.329565048217773, "global_step": 398579, "epoch": 4802} {"train_loss": -26.2620849609375, "global_step": 398580, "epoch": 4802} {"train_loss": -25.894140243530273, "global_step": 398581, "epoch": 4802} {"train_loss": -26.675012588500977, "global_step": 398582, "epoch": 4802} {"train_loss": -26.358875274658203, "global_step": 398583, "epoch": 4802} {"train_loss": -26.6048583984375, "global_step": 398584, "epoch": 4802} {"train_loss": -26.657428741455078, "global_step": 398585, "epoch": 4802} {"train_loss": -26.469654083251953, "global_step": 398586, "epoch": 4802} {"train_loss": -26.313562393188477, "global_step": 398587, "epoch": 4802} {"train_loss": -26.494916915893555, "global_step": 398588, "epoch": 4802} {"train_loss": -26.19974708557129, "global_step": 398589, "epoch": 4802} {"train_loss": -26.302038192749023, "global_step": 398590, "epoch": 4802} {"train_loss": -26.408222198486328, "global_step": 398591, "epoch": 4802} {"train_loss": -26.62354850769043, "global_step": 398592, "epoch": 4802} {"train_loss": -26.138919830322266, "global_step": 398593, "epoch": 4802} {"train_loss": -26.658435821533203, "global_step": 398594, "epoch": 4802} {"train_loss": -26.853002548217773, "global_step": 398595, "epoch": 4802} {"train_loss": -26.49794578552246, "global_step": 398596, "epoch": 4802} {"train_loss": -26.60151481628418, "global_step": 398597, "epoch": 4802} {"train_loss": -26.9663143157959, "global_step": 398598, "epoch": 4802} {"train_loss": -26.3698673248291, "global_step": 398599, "epoch": 4802} {"train_loss": -26.637609481811523, "global_step": 398600, "epoch": 4802} {"train_loss": -26.773473739624023, "global_step": 398601, "epoch": 4802} {"train_loss": -26.81965446472168, "global_step": 398602, "epoch": 4802} {"train_loss": -26.519376754760742, "global_step": 398603, "epoch": 4802} {"train_loss": -26.72566032409668, "global_step": 398604, "epoch": 4802} {"train_loss": -26.586400985717773, "global_step": 398605, "epoch": 4802} {"train_loss": -26.60540771484375, "global_step": 398606, "epoch": 4802} {"train_loss": -26.5181884765625, "global_step": 398607, "epoch": 4802} {"train_loss": -26.935382843017578, "global_step": 398608, "epoch": 4802} {"train_loss": -26.885730743408203, "global_step": 398609, "epoch": 4802} {"train_loss": -26.908063888549805, "global_step": 398610, "epoch": 4802} {"train_loss": -26.87489128112793, "global_step": 398611, "epoch": 4802} {"train_loss": -26.66187858581543, "global_step": 398612, "epoch": 4802} {"train_loss": -26.745101928710938, "global_step": 398613, "epoch": 4802} {"train_loss": -26.3677921295166, "global_step": 398614, "epoch": 4802} {"train_loss": -26.961206436157227, "global_step": 398615, "epoch": 4802} {"train_loss": -26.41095542907715, "global_step": 398616, "epoch": 4802} {"train_loss": -26.82062339782715, "global_step": 398617, "epoch": 4802} {"train_loss": -27.092304229736328, "global_step": 398618, "epoch": 4802} {"train_loss": -26.617895126342773, "global_step": 398619, "epoch": 4802} {"train_loss": -26.520187377929688, "global_step": 398620, "epoch": 4802} {"train_loss": -26.672443389892578, "global_step": 398621, "epoch": 4802} {"train_loss": -26.85626792907715, "global_step": 398622, "epoch": 4802} {"train_loss": -27.190475463867188, "global_step": 398623, "epoch": 4802} {"train_loss": -26.819843292236328, "global_step": 398624, "epoch": 4802} {"train_loss": -26.628570556640625, "global_step": 398625, "epoch": 4802} {"train_loss": -26.617233276367188, "global_step": 398626, "epoch": 4802} {"train_loss": -26.649124145507812, "global_step": 398627, "epoch": 4802} {"train_loss": -26.745038986206055, "global_step": 398628, "epoch": 4802} {"train_loss": -26.573949813842773, "global_step": 398629, "epoch": 4802} {"train_loss": -26.65764808654785, "global_step": 398630, "epoch": 4802} {"train_loss": -26.597211837768555, "global_step": 398631, "epoch": 4802} {"train_loss": -26.62444496154785, "global_step": 398632, "epoch": 4802} {"train_loss": -26.984018325805664, "global_step": 398633, "epoch": 4802} {"train_loss": -26.568927764892578, "global_step": 398634, "epoch": 4802} {"train_loss": -26.379138946533203, "global_step": 398635, "epoch": 4802} {"train_loss": -26.45102882385254, "global_step": 398636, "epoch": 4802} {"train_loss": -26.17096519470215, "global_step": 398637, "epoch": 4802} {"train_loss": -26.276147842407227, "global_step": 398638, "epoch": 4802} {"train_loss": -26.848102569580078, "global_step": 398639, "epoch": 4802} {"train_loss": -26.782108306884766, "global_step": 398640, "epoch": 4802} {"train_loss": -26.539230346679688, "global_step": 398641, "epoch": 4802} {"train_loss": -26.255603790283203, "global_step": 398642, "epoch": 4802} {"train_loss": -26.644495010375977, "global_step": 398643, "epoch": 4802} {"train_loss": -26.424579620361328, "global_step": 398644, "epoch": 4802} {"train_loss": -26.526153564453125, "global_step": 398645, "epoch": 4802} {"train_loss": -26.808164596557617, "global_step": 398646, "epoch": 4802} {"train_loss": -26.821935653686523, "global_step": 398647, "epoch": 4802} {"train_loss": -26.576391013271838, "global_step": 398648, "epoch": 4802, "val_loss": 6698426.5} {"train_loss": -26.677398681640625, "global_step": 398649, "epoch": 4803} {"train_loss": -26.390350341796875, "global_step": 398650, "epoch": 4803} {"train_loss": -26.460050582885742, "global_step": 398651, "epoch": 4803} {"train_loss": -25.99672508239746, "global_step": 398652, "epoch": 4803} {"train_loss": -26.560016632080078, "global_step": 398653, "epoch": 4803} {"train_loss": -26.22262954711914, "global_step": 398654, "epoch": 4803} {"train_loss": -26.175870895385742, "global_step": 398655, "epoch": 4803} {"train_loss": -26.719327926635742, "global_step": 398656, "epoch": 4803} {"train_loss": -26.215368270874023, "global_step": 398657, "epoch": 4803} {"train_loss": -26.639188766479492, "global_step": 398658, "epoch": 4803} {"train_loss": -26.004987716674805, "global_step": 398659, "epoch": 4803} {"train_loss": -26.690969467163086, "global_step": 398660, "epoch": 4803} {"train_loss": -26.298810958862305, "global_step": 398661, "epoch": 4803} {"train_loss": -25.968915939331055, "global_step": 398662, "epoch": 4803} {"train_loss": -26.613927841186523, "global_step": 398663, "epoch": 4803} {"train_loss": -26.415510177612305, "global_step": 398664, "epoch": 4803} {"train_loss": -26.730283737182617, "global_step": 398665, "epoch": 4803} {"train_loss": -26.460697174072266, "global_step": 398666, "epoch": 4803} {"train_loss": -26.400959014892578, "global_step": 398667, "epoch": 4803} {"train_loss": -26.541967391967773, "global_step": 398668, "epoch": 4803} {"train_loss": -26.3852481842041, "global_step": 398669, "epoch": 4803} {"train_loss": -26.57851219177246, "global_step": 398670, "epoch": 4803} {"train_loss": -26.645557403564453, "global_step": 398671, "epoch": 4803} {"train_loss": -26.485858917236328, "global_step": 398672, "epoch": 4803} {"train_loss": -26.903717041015625, "global_step": 398673, "epoch": 4803} {"train_loss": -26.890735626220703, "global_step": 398674, "epoch": 4803} {"train_loss": -26.523962020874023, "global_step": 398675, "epoch": 4803} {"train_loss": -26.624540328979492, "global_step": 398676, "epoch": 4803} {"train_loss": -26.944910049438477, "global_step": 398677, "epoch": 4803} {"train_loss": -26.455402374267578, "global_step": 398678, "epoch": 4803} {"train_loss": -26.564838409423828, "global_step": 398679, "epoch": 4803} {"train_loss": -27.085357666015625, "global_step": 398680, "epoch": 4803} {"train_loss": -26.379541397094727, "global_step": 398681, "epoch": 4803} {"train_loss": -26.66481590270996, "global_step": 398682, "epoch": 4803} {"train_loss": -26.474002838134766, "global_step": 398683, "epoch": 4803} {"train_loss": -26.56894874572754, "global_step": 398684, "epoch": 4803} {"train_loss": -26.575178146362305, "global_step": 398685, "epoch": 4803} {"train_loss": -26.688644409179688, "global_step": 398686, "epoch": 4803} {"train_loss": -26.72946548461914, "global_step": 398687, "epoch": 4803} {"train_loss": -26.665632247924805, "global_step": 398688, "epoch": 4803} {"train_loss": -26.74348258972168, "global_step": 398689, "epoch": 4803} {"train_loss": -26.664413452148438, "global_step": 398690, "epoch": 4803} {"train_loss": -26.555646896362305, "global_step": 398691, "epoch": 4803} {"train_loss": -26.99867057800293, "global_step": 398692, "epoch": 4803} {"train_loss": -26.59162712097168, "global_step": 398693, "epoch": 4803} {"train_loss": -26.93067741394043, "global_step": 398694, "epoch": 4803} {"train_loss": -26.6793270111084, "global_step": 398695, "epoch": 4803} {"train_loss": -27.013879776000977, "global_step": 398696, "epoch": 4803} {"train_loss": -26.576745986938477, "global_step": 398697, "epoch": 4803} {"train_loss": -26.70951271057129, "global_step": 398698, "epoch": 4803} {"train_loss": -26.49214744567871, "global_step": 398699, "epoch": 4803} {"train_loss": -26.8593692779541, "global_step": 398700, "epoch": 4803} {"train_loss": -27.049970626831055, "global_step": 398701, "epoch": 4803} {"train_loss": -26.8497371673584, "global_step": 398702, "epoch": 4803} {"train_loss": -26.294342041015625, "global_step": 398703, "epoch": 4803} {"train_loss": -25.874862670898438, "global_step": 398704, "epoch": 4803} {"train_loss": -25.784351348876953, "global_step": 398705, "epoch": 4803} {"train_loss": -26.2591495513916, "global_step": 398706, "epoch": 4803} {"train_loss": -26.628341674804688, "global_step": 398707, "epoch": 4803} {"train_loss": -25.755573272705078, "global_step": 398708, "epoch": 4803} {"train_loss": -26.36016273498535, "global_step": 398709, "epoch": 4803} {"train_loss": -26.1510066986084, "global_step": 398710, "epoch": 4803} {"train_loss": -25.978961944580078, "global_step": 398711, "epoch": 4803} {"train_loss": -26.335458755493164, "global_step": 398712, "epoch": 4803} {"train_loss": -25.985986709594727, "global_step": 398713, "epoch": 4803} {"train_loss": -26.483327865600586, "global_step": 398714, "epoch": 4803} {"train_loss": -26.523019790649414, "global_step": 398715, "epoch": 4803} {"train_loss": -26.50333023071289, "global_step": 398716, "epoch": 4803} {"train_loss": -26.104883193969727, "global_step": 398717, "epoch": 4803} {"train_loss": -26.244647979736328, "global_step": 398718, "epoch": 4803} {"train_loss": -26.572589874267578, "global_step": 398719, "epoch": 4803} {"train_loss": -26.540952682495117, "global_step": 398720, "epoch": 4803} {"train_loss": -26.440359115600586, "global_step": 398721, "epoch": 4803} {"train_loss": -26.418766021728516, "global_step": 398722, "epoch": 4803} {"train_loss": -26.4929141998291, "global_step": 398723, "epoch": 4803} {"train_loss": -26.60255241394043, "global_step": 398724, "epoch": 4803} {"train_loss": -26.54268455505371, "global_step": 398725, "epoch": 4803} {"train_loss": -26.651870727539062, "global_step": 398726, "epoch": 4803} {"train_loss": -26.595233917236328, "global_step": 398727, "epoch": 4803} {"train_loss": -26.46583366394043, "global_step": 398728, "epoch": 4803} {"train_loss": -26.5157470703125, "global_step": 398729, "epoch": 4803} {"train_loss": -26.472217559814453, "global_step": 398730, "epoch": 4803} {"train_loss": -26.505408620259846, "global_step": 398731, "epoch": 4803, "val_loss": 6603473.0} {"train_loss": -25.764001846313477, "global_step": 398732, "epoch": 4804} {"train_loss": -24.991289138793945, "global_step": 398733, "epoch": 4804} {"train_loss": -24.958097457885742, "global_step": 398734, "epoch": 4804} {"train_loss": -25.98321533203125, "global_step": 398735, "epoch": 4804} {"train_loss": -25.46157455444336, "global_step": 398736, "epoch": 4804} {"train_loss": -25.513532638549805, "global_step": 398737, "epoch": 4804} {"train_loss": -26.018354415893555, "global_step": 398738, "epoch": 4804} {"train_loss": -25.8900089263916, "global_step": 398739, "epoch": 4804} {"train_loss": -26.03602409362793, "global_step": 398740, "epoch": 4804} {"train_loss": -26.249103546142578, "global_step": 398741, "epoch": 4804} {"train_loss": -26.180139541625977, "global_step": 398742, "epoch": 4804} {"train_loss": -26.247833251953125, "global_step": 398743, "epoch": 4804} {"train_loss": -25.790861129760742, "global_step": 398744, "epoch": 4804} {"train_loss": -26.310413360595703, "global_step": 398745, "epoch": 4804} {"train_loss": -26.117740631103516, "global_step": 398746, "epoch": 4804} {"train_loss": -26.4736385345459, "global_step": 398747, "epoch": 4804} {"train_loss": -26.335683822631836, "global_step": 398748, "epoch": 4804} {"train_loss": -26.362762451171875, "global_step": 398749, "epoch": 4804} {"train_loss": -26.48200035095215, "global_step": 398750, "epoch": 4804} {"train_loss": -26.0701847076416, "global_step": 398751, "epoch": 4804} {"train_loss": -26.388025283813477, "global_step": 398752, "epoch": 4804} {"train_loss": -26.29743766784668, "global_step": 398753, "epoch": 4804} {"train_loss": -26.646020889282227, "global_step": 398754, "epoch": 4804} {"train_loss": -26.25327491760254, "global_step": 398755, "epoch": 4804} {"train_loss": -26.539670944213867, "global_step": 398756, "epoch": 4804} {"train_loss": -26.421796798706055, "global_step": 398757, "epoch": 4804} {"train_loss": -26.606977462768555, "global_step": 398758, "epoch": 4804} {"train_loss": -26.496118545532227, "global_step": 398759, "epoch": 4804} {"train_loss": -26.925451278686523, "global_step": 398760, "epoch": 4804} {"train_loss": -26.4431209564209, "global_step": 398761, "epoch": 4804} {"train_loss": -26.735570907592773, "global_step": 398762, "epoch": 4804} {"train_loss": -26.770978927612305, "global_step": 398763, "epoch": 4804} {"train_loss": -26.31406021118164, "global_step": 398764, "epoch": 4804} {"train_loss": -26.74505043029785, "global_step": 398765, "epoch": 4804} {"train_loss": -26.69060707092285, "global_step": 398766, "epoch": 4804} {"train_loss": -26.452741622924805, "global_step": 398767, "epoch": 4804} {"train_loss": -26.7300968170166, "global_step": 398768, "epoch": 4804} {"train_loss": -26.56683349609375, "global_step": 398769, "epoch": 4804} {"train_loss": -26.483734130859375, "global_step": 398770, "epoch": 4804} {"train_loss": -26.896930694580078, "global_step": 398771, "epoch": 4804} {"train_loss": -26.890295028686523, "global_step": 398772, "epoch": 4804} {"train_loss": -26.85373878479004, "global_step": 398773, "epoch": 4804} {"train_loss": -26.882822036743164, "global_step": 398774, "epoch": 4804} {"train_loss": -26.790714263916016, "global_step": 398775, "epoch": 4804} {"train_loss": -26.514251708984375, "global_step": 398776, "epoch": 4804} {"train_loss": -26.91729736328125, "global_step": 398777, "epoch": 4804} {"train_loss": -26.735448837280273, "global_step": 398778, "epoch": 4804} {"train_loss": -26.77829933166504, "global_step": 398779, "epoch": 4804} {"train_loss": -26.922632217407227, "global_step": 398780, "epoch": 4804} {"train_loss": -26.81377601623535, "global_step": 398781, "epoch": 4804} {"train_loss": -26.65994644165039, "global_step": 398782, "epoch": 4804} {"train_loss": -27.048965454101562, "global_step": 398783, "epoch": 4804} {"train_loss": -26.422271728515625, "global_step": 398784, "epoch": 4804} {"train_loss": -26.980701446533203, "global_step": 398785, "epoch": 4804} {"train_loss": -26.871877670288086, "global_step": 398786, "epoch": 4804} {"train_loss": -26.62074089050293, "global_step": 398787, "epoch": 4804} {"train_loss": -26.487735748291016, "global_step": 398788, "epoch": 4804} {"train_loss": -25.81879997253418, "global_step": 398789, "epoch": 4804} {"train_loss": -26.4251766204834, "global_step": 398790, "epoch": 4804} {"train_loss": -26.978422164916992, "global_step": 398791, "epoch": 4804} {"train_loss": -26.72901725769043, "global_step": 398792, "epoch": 4804} {"train_loss": -26.352191925048828, "global_step": 398793, "epoch": 4804} {"train_loss": -26.677114486694336, "global_step": 398794, "epoch": 4804} {"train_loss": -26.78826332092285, "global_step": 398795, "epoch": 4804} {"train_loss": -26.737295150756836, "global_step": 398796, "epoch": 4804} {"train_loss": -26.86561393737793, "global_step": 398797, "epoch": 4804} {"train_loss": -26.45171546936035, "global_step": 398798, "epoch": 4804} {"train_loss": -26.5212345123291, "global_step": 398799, "epoch": 4804} {"train_loss": -26.475324630737305, "global_step": 398800, "epoch": 4804} {"train_loss": -26.624414443969727, "global_step": 398801, "epoch": 4804} {"train_loss": -26.2340030670166, "global_step": 398802, "epoch": 4804} {"train_loss": -26.6285343170166, "global_step": 398803, "epoch": 4804} {"train_loss": -26.53187370300293, "global_step": 398804, "epoch": 4804} {"train_loss": -26.858356475830078, "global_step": 398805, "epoch": 4804} {"train_loss": -26.548791885375977, "global_step": 398806, "epoch": 4804} {"train_loss": -26.695404052734375, "global_step": 398807, "epoch": 4804} {"train_loss": -26.946216583251953, "global_step": 398808, "epoch": 4804} {"train_loss": -26.64300537109375, "global_step": 398809, "epoch": 4804} {"train_loss": -26.755407333374023, "global_step": 398810, "epoch": 4804} {"train_loss": -26.508764266967773, "global_step": 398811, "epoch": 4804} {"train_loss": -26.707843780517578, "global_step": 398812, "epoch": 4804} {"train_loss": -26.458688735961914, "global_step": 398813, "epoch": 4804} {"train_loss": -26.47374732235828, "global_step": 398814, "epoch": 4804, "val_loss": 6651649.0} {"train_loss": -26.025985717773438, "global_step": 398815, "epoch": 4805} {"train_loss": -25.943286895751953, "global_step": 398816, "epoch": 4805} {"train_loss": -25.612619400024414, "global_step": 398817, "epoch": 4805} {"train_loss": -25.75140953063965, "global_step": 398818, "epoch": 4805} {"train_loss": -26.359350204467773, "global_step": 398819, "epoch": 4805} {"train_loss": -25.708948135375977, "global_step": 398820, "epoch": 4805} {"train_loss": -26.292219161987305, "global_step": 398821, "epoch": 4805} {"train_loss": -26.259424209594727, "global_step": 398822, "epoch": 4805} {"train_loss": -25.57002830505371, "global_step": 398823, "epoch": 4805} {"train_loss": -26.289417266845703, "global_step": 398824, "epoch": 4805} {"train_loss": -26.25654411315918, "global_step": 398825, "epoch": 4805} {"train_loss": -26.253942489624023, "global_step": 398826, "epoch": 4805} {"train_loss": -26.48190689086914, "global_step": 398827, "epoch": 4805} {"train_loss": -26.2374267578125, "global_step": 398828, "epoch": 4805} {"train_loss": -26.426877975463867, "global_step": 398829, "epoch": 4805} {"train_loss": -26.5450382232666, "global_step": 398830, "epoch": 4805} {"train_loss": -26.575010299682617, "global_step": 398831, "epoch": 4805} {"train_loss": -26.62054443359375, "global_step": 398832, "epoch": 4805} {"train_loss": -26.24114418029785, "global_step": 398833, "epoch": 4805} {"train_loss": -26.3138484954834, "global_step": 398834, "epoch": 4805} {"train_loss": -26.807870864868164, "global_step": 398835, "epoch": 4805} {"train_loss": -26.009244918823242, "global_step": 398836, "epoch": 4805} {"train_loss": -26.186567306518555, "global_step": 398837, "epoch": 4805} {"train_loss": -26.439233779907227, "global_step": 398838, "epoch": 4805} {"train_loss": -26.26007080078125, "global_step": 398839, "epoch": 4805} {"train_loss": -26.370771408081055, "global_step": 398840, "epoch": 4805} {"train_loss": -26.72150230407715, "global_step": 398841, "epoch": 4805} {"train_loss": -26.30719566345215, "global_step": 398842, "epoch": 4805} {"train_loss": -26.646564483642578, "global_step": 398843, "epoch": 4805} {"train_loss": -26.54994010925293, "global_step": 398844, "epoch": 4805} {"train_loss": -26.446619033813477, "global_step": 398845, "epoch": 4805} {"train_loss": -26.748748779296875, "global_step": 398846, "epoch": 4805} {"train_loss": -26.933944702148438, "global_step": 398847, "epoch": 4805} {"train_loss": -26.680017471313477, "global_step": 398848, "epoch": 4805} {"train_loss": -26.4274959564209, "global_step": 398849, "epoch": 4805} {"train_loss": -26.5029239654541, "global_step": 398850, "epoch": 4805} {"train_loss": -26.673261642456055, "global_step": 398851, "epoch": 4805} {"train_loss": -26.495466232299805, "global_step": 398852, "epoch": 4805} {"train_loss": -26.66786003112793, "global_step": 398853, "epoch": 4805} {"train_loss": -26.713520050048828, "global_step": 398854, "epoch": 4805} {"train_loss": -26.72748374938965, "global_step": 398855, "epoch": 4805} {"train_loss": -26.805078506469727, "global_step": 398856, "epoch": 4805} {"train_loss": -26.507190704345703, "global_step": 398857, "epoch": 4805} {"train_loss": -26.56296157836914, "global_step": 398858, "epoch": 4805} {"train_loss": -26.659992218017578, "global_step": 398859, "epoch": 4805} {"train_loss": -26.668066024780273, "global_step": 398860, "epoch": 4805} {"train_loss": -26.934438705444336, "global_step": 398861, "epoch": 4805} {"train_loss": -26.616180419921875, "global_step": 398862, "epoch": 4805} {"train_loss": -26.6242733001709, "global_step": 398863, "epoch": 4805} {"train_loss": -27.005319595336914, "global_step": 398864, "epoch": 4805} {"train_loss": -26.39249610900879, "global_step": 398865, "epoch": 4805} {"train_loss": -26.826385498046875, "global_step": 398866, "epoch": 4805} {"train_loss": -26.727197647094727, "global_step": 398867, "epoch": 4805} {"train_loss": -26.630720138549805, "global_step": 398868, "epoch": 4805} {"train_loss": -26.82563591003418, "global_step": 398869, "epoch": 4805} {"train_loss": -26.88385009765625, "global_step": 398870, "epoch": 4805} {"train_loss": -26.44135093688965, "global_step": 398871, "epoch": 4805} {"train_loss": -26.67055320739746, "global_step": 398872, "epoch": 4805} {"train_loss": -26.68609619140625, "global_step": 398873, "epoch": 4805} {"train_loss": -26.789316177368164, "global_step": 398874, "epoch": 4805} {"train_loss": -26.535724639892578, "global_step": 398875, "epoch": 4805} {"train_loss": -26.80586051940918, "global_step": 398876, "epoch": 4805} {"train_loss": -26.18818473815918, "global_step": 398877, "epoch": 4805} {"train_loss": -26.671751022338867, "global_step": 398878, "epoch": 4805} {"train_loss": -26.728656768798828, "global_step": 398879, "epoch": 4805} {"train_loss": -26.79347038269043, "global_step": 398880, "epoch": 4805} {"train_loss": -26.6640682220459, "global_step": 398881, "epoch": 4805} {"train_loss": -26.78627586364746, "global_step": 398882, "epoch": 4805} {"train_loss": -26.177505493164062, "global_step": 398883, "epoch": 4805} {"train_loss": -26.575719833374023, "global_step": 398884, "epoch": 4805} {"train_loss": -26.76734733581543, "global_step": 398885, "epoch": 4805} {"train_loss": -26.455419540405273, "global_step": 398886, "epoch": 4805} {"train_loss": -26.624868392944336, "global_step": 398887, "epoch": 4805} {"train_loss": -26.822040557861328, "global_step": 398888, "epoch": 4805} {"train_loss": -26.511816024780273, "global_step": 398889, "epoch": 4805} {"train_loss": -26.0699405670166, "global_step": 398890, "epoch": 4805} {"train_loss": -26.142017364501953, "global_step": 398891, "epoch": 4805} {"train_loss": -26.17413330078125, "global_step": 398892, "epoch": 4805} {"train_loss": -26.405263900756836, "global_step": 398893, "epoch": 4805} {"train_loss": -26.37428092956543, "global_step": 398894, "epoch": 4805} {"train_loss": -26.360565185546875, "global_step": 398895, "epoch": 4805} {"train_loss": -26.46944236755371, "global_step": 398896, "epoch": 4805} {"train_loss": -26.478963622127672, "global_step": 398897, "epoch": 4805, "val_loss": 6694663.0} {"train_loss": -25.60413932800293, "global_step": 398898, "epoch": 4806} {"train_loss": -25.94936180114746, "global_step": 398899, "epoch": 4806} {"train_loss": -26.1162052154541, "global_step": 398900, "epoch": 4806} {"train_loss": -25.67703628540039, "global_step": 398901, "epoch": 4806} {"train_loss": -25.881072998046875, "global_step": 398902, "epoch": 4806} {"train_loss": -25.588947296142578, "global_step": 398903, "epoch": 4806} {"train_loss": -26.473752975463867, "global_step": 398904, "epoch": 4806} {"train_loss": -26.18665885925293, "global_step": 398905, "epoch": 4806} {"train_loss": -26.061574935913086, "global_step": 398906, "epoch": 4806} {"train_loss": -26.058990478515625, "global_step": 398907, "epoch": 4806} {"train_loss": -26.395587921142578, "global_step": 398908, "epoch": 4806} {"train_loss": -26.47211265563965, "global_step": 398909, "epoch": 4806} {"train_loss": -26.23223304748535, "global_step": 398910, "epoch": 4806} {"train_loss": -26.588010787963867, "global_step": 398911, "epoch": 4806} {"train_loss": -26.2299747467041, "global_step": 398912, "epoch": 4806} {"train_loss": -26.499256134033203, "global_step": 398913, "epoch": 4806} {"train_loss": -26.116470336914062, "global_step": 398914, "epoch": 4806} {"train_loss": -26.1578311920166, "global_step": 398915, "epoch": 4806} {"train_loss": -26.17327308654785, "global_step": 398916, "epoch": 4806} {"train_loss": -26.41571044921875, "global_step": 398917, "epoch": 4806} {"train_loss": -26.28419303894043, "global_step": 398918, "epoch": 4806} {"train_loss": -26.12890625, "global_step": 398919, "epoch": 4806} {"train_loss": -26.682966232299805, "global_step": 398920, "epoch": 4806} {"train_loss": -26.66896629333496, "global_step": 398921, "epoch": 4806} {"train_loss": -26.7803897857666, "global_step": 398922, "epoch": 4806} {"train_loss": -26.85230827331543, "global_step": 398923, "epoch": 4806} {"train_loss": -26.287281036376953, "global_step": 398924, "epoch": 4806} {"train_loss": -26.653182983398438, "global_step": 398925, "epoch": 4806} {"train_loss": -26.6464786529541, "global_step": 398926, "epoch": 4806} {"train_loss": -26.29891014099121, "global_step": 398927, "epoch": 4806} {"train_loss": -27.10133171081543, "global_step": 398928, "epoch": 4806} {"train_loss": -26.514835357666016, "global_step": 398929, "epoch": 4806} {"train_loss": -26.369298934936523, "global_step": 398930, "epoch": 4806} {"train_loss": -26.51178550720215, "global_step": 398931, "epoch": 4806} {"train_loss": -26.698688507080078, "global_step": 398932, "epoch": 4806} {"train_loss": -26.6029052734375, "global_step": 398933, "epoch": 4806} {"train_loss": -26.644031524658203, "global_step": 398934, "epoch": 4806} {"train_loss": -26.875837326049805, "global_step": 398935, "epoch": 4806} {"train_loss": -26.65130615234375, "global_step": 398936, "epoch": 4806} {"train_loss": -25.923389434814453, "global_step": 398937, "epoch": 4806} {"train_loss": -25.565799713134766, "global_step": 398938, "epoch": 4806} {"train_loss": -26.45920181274414, "global_step": 398939, "epoch": 4806} {"train_loss": -26.289093017578125, "global_step": 398940, "epoch": 4806} {"train_loss": -26.4371337890625, "global_step": 398941, "epoch": 4806} {"train_loss": -26.778018951416016, "global_step": 398942, "epoch": 4806} {"train_loss": -25.8012752532959, "global_step": 398943, "epoch": 4806} {"train_loss": -26.428699493408203, "global_step": 398944, "epoch": 4806} {"train_loss": -26.366867065429688, "global_step": 398945, "epoch": 4806} {"train_loss": -26.54595947265625, "global_step": 398946, "epoch": 4806} {"train_loss": -26.599578857421875, "global_step": 398947, "epoch": 4806} {"train_loss": -26.383451461791992, "global_step": 398948, "epoch": 4806} {"train_loss": -26.18328857421875, "global_step": 398949, "epoch": 4806} {"train_loss": -26.814605712890625, "global_step": 398950, "epoch": 4806} {"train_loss": -26.607519149780273, "global_step": 398951, "epoch": 4806} {"train_loss": -26.490015029907227, "global_step": 398952, "epoch": 4806} {"train_loss": -26.51630973815918, "global_step": 398953, "epoch": 4806} {"train_loss": -26.088483810424805, "global_step": 398954, "epoch": 4806} {"train_loss": -26.443485260009766, "global_step": 398955, "epoch": 4806} {"train_loss": -27.078454971313477, "global_step": 398956, "epoch": 4806} {"train_loss": -26.015417098999023, "global_step": 398957, "epoch": 4806} {"train_loss": -26.492273330688477, "global_step": 398958, "epoch": 4806} {"train_loss": -26.60431480407715, "global_step": 398959, "epoch": 4806} {"train_loss": -25.80889320373535, "global_step": 398960, "epoch": 4806} {"train_loss": -26.420307159423828, "global_step": 398961, "epoch": 4806} {"train_loss": -26.606555938720703, "global_step": 398962, "epoch": 4806} {"train_loss": -26.444976806640625, "global_step": 398963, "epoch": 4806} {"train_loss": -26.27484130859375, "global_step": 398964, "epoch": 4806} {"train_loss": -26.843067169189453, "global_step": 398965, "epoch": 4806} {"train_loss": -26.524932861328125, "global_step": 398966, "epoch": 4806} {"train_loss": -26.304059982299805, "global_step": 398967, "epoch": 4806} {"train_loss": -26.162778854370117, "global_step": 398968, "epoch": 4806} {"train_loss": -26.429279327392578, "global_step": 398969, "epoch": 4806} {"train_loss": -26.572446823120117, "global_step": 398970, "epoch": 4806} {"train_loss": -26.292388916015625, "global_step": 398971, "epoch": 4806} {"train_loss": -26.46839714050293, "global_step": 398972, "epoch": 4806} {"train_loss": -26.818317413330078, "global_step": 398973, "epoch": 4806} {"train_loss": -26.33283805847168, "global_step": 398974, "epoch": 4806} {"train_loss": -26.950180053710938, "global_step": 398975, "epoch": 4806} {"train_loss": -26.738056182861328, "global_step": 398976, "epoch": 4806} {"train_loss": -26.616674423217773, "global_step": 398977, "epoch": 4806} {"train_loss": -26.41047477722168, "global_step": 398978, "epoch": 4806} {"train_loss": -26.553802490234375, "global_step": 398979, "epoch": 4806} {"train_loss": -26.379602845892848, "global_step": 398980, "epoch": 4806, "val_loss": 6648706.0} {"train_loss": -25.393518447875977, "global_step": 398981, "epoch": 4807} {"train_loss": -26.19818687438965, "global_step": 398982, "epoch": 4807} {"train_loss": -26.311437606811523, "global_step": 398983, "epoch": 4807} {"train_loss": -26.383026123046875, "global_step": 398984, "epoch": 4807} {"train_loss": -25.774869918823242, "global_step": 398985, "epoch": 4807} {"train_loss": -26.328588485717773, "global_step": 398986, "epoch": 4807} {"train_loss": -26.121063232421875, "global_step": 398987, "epoch": 4807} {"train_loss": -26.334487915039062, "global_step": 398988, "epoch": 4807} {"train_loss": -26.580066680908203, "global_step": 398989, "epoch": 4807} {"train_loss": -26.043054580688477, "global_step": 398990, "epoch": 4807} {"train_loss": -26.22439956665039, "global_step": 398991, "epoch": 4807} {"train_loss": -26.125120162963867, "global_step": 398992, "epoch": 4807} {"train_loss": -26.082799911499023, "global_step": 398993, "epoch": 4807} {"train_loss": -26.262908935546875, "global_step": 398994, "epoch": 4807} {"train_loss": -26.5394287109375, "global_step": 398995, "epoch": 4807} {"train_loss": -26.395620346069336, "global_step": 398996, "epoch": 4807} {"train_loss": -26.569091796875, "global_step": 398997, "epoch": 4807} {"train_loss": -26.31135368347168, "global_step": 398998, "epoch": 4807} {"train_loss": -26.78500747680664, "global_step": 398999, "epoch": 4807} {"train_loss": -26.447118759155273, "global_step": 399000, "epoch": 4807} {"train_loss": -26.637693405151367, "global_step": 399001, "epoch": 4807} {"train_loss": -26.862585067749023, "global_step": 399002, "epoch": 4807} {"train_loss": -26.312362670898438, "global_step": 399003, "epoch": 4807} {"train_loss": -26.337350845336914, "global_step": 399004, "epoch": 4807} {"train_loss": -26.518218994140625, "global_step": 399005, "epoch": 4807} {"train_loss": -26.710412979125977, "global_step": 399006, "epoch": 4807} {"train_loss": -26.200571060180664, "global_step": 399007, "epoch": 4807} {"train_loss": -26.351255416870117, "global_step": 399008, "epoch": 4807} {"train_loss": -26.5976619720459, "global_step": 399009, "epoch": 4807} {"train_loss": -26.594221115112305, "global_step": 399010, "epoch": 4807} {"train_loss": -26.6550350189209, "global_step": 399011, "epoch": 4807} {"train_loss": -26.109466552734375, "global_step": 399012, "epoch": 4807} {"train_loss": -26.523962020874023, "global_step": 399013, "epoch": 4807} {"train_loss": -26.391599655151367, "global_step": 399014, "epoch": 4807} {"train_loss": -26.589948654174805, "global_step": 399015, "epoch": 4807} {"train_loss": -26.37544059753418, "global_step": 399016, "epoch": 4807} {"train_loss": -26.311019897460938, "global_step": 399017, "epoch": 4807} {"train_loss": -25.999469757080078, "global_step": 399018, "epoch": 4807} {"train_loss": -26.007490158081055, "global_step": 399019, "epoch": 4807} {"train_loss": -26.53223991394043, "global_step": 399020, "epoch": 4807} {"train_loss": -26.50310707092285, "global_step": 399021, "epoch": 4807} {"train_loss": -26.912811279296875, "global_step": 399022, "epoch": 4807} {"train_loss": -26.803735733032227, "global_step": 399023, "epoch": 4807} {"train_loss": -26.860015869140625, "global_step": 399024, "epoch": 4807} {"train_loss": -26.833478927612305, "global_step": 399025, "epoch": 4807} {"train_loss": -26.455549240112305, "global_step": 399026, "epoch": 4807} {"train_loss": -26.6983642578125, "global_step": 399027, "epoch": 4807} {"train_loss": -26.87115478515625, "global_step": 399028, "epoch": 4807} {"train_loss": -26.571369171142578, "global_step": 399029, "epoch": 4807} {"train_loss": -26.669464111328125, "global_step": 399030, "epoch": 4807} {"train_loss": -26.725461959838867, "global_step": 399031, "epoch": 4807} {"train_loss": -26.62079429626465, "global_step": 399032, "epoch": 4807} {"train_loss": -26.453327178955078, "global_step": 399033, "epoch": 4807} {"train_loss": -26.6680965423584, "global_step": 399034, "epoch": 4807} {"train_loss": -26.34815788269043, "global_step": 399035, "epoch": 4807} {"train_loss": -26.454883575439453, "global_step": 399036, "epoch": 4807} {"train_loss": -26.9078311920166, "global_step": 399037, "epoch": 4807} {"train_loss": -26.6353702545166, "global_step": 399038, "epoch": 4807} {"train_loss": -26.431854248046875, "global_step": 399039, "epoch": 4807} {"train_loss": -26.31739616394043, "global_step": 399040, "epoch": 4807} {"train_loss": -26.761831283569336, "global_step": 399041, "epoch": 4807} {"train_loss": -26.5205020904541, "global_step": 399042, "epoch": 4807} {"train_loss": -26.92305564880371, "global_step": 399043, "epoch": 4807} {"train_loss": -26.642576217651367, "global_step": 399044, "epoch": 4807} {"train_loss": -26.969253540039062, "global_step": 399045, "epoch": 4807} {"train_loss": -26.487035751342773, "global_step": 399046, "epoch": 4807} {"train_loss": -27.024229049682617, "global_step": 399047, "epoch": 4807} {"train_loss": -26.495508193969727, "global_step": 399048, "epoch": 4807} {"train_loss": -26.748046875, "global_step": 399049, "epoch": 4807} {"train_loss": -26.865894317626953, "global_step": 399050, "epoch": 4807} {"train_loss": -27.128742218017578, "global_step": 399051, "epoch": 4807} {"train_loss": -26.7322940826416, "global_step": 399052, "epoch": 4807} {"train_loss": -26.846479415893555, "global_step": 399053, "epoch": 4807} {"train_loss": -26.776596069335938, "global_step": 399054, "epoch": 4807} {"train_loss": -26.549665451049805, "global_step": 399055, "epoch": 4807} {"train_loss": -26.53766441345215, "global_step": 399056, "epoch": 4807} {"train_loss": -25.878005981445312, "global_step": 399057, "epoch": 4807} {"train_loss": -25.989282608032227, "global_step": 399058, "epoch": 4807} {"train_loss": -26.736356735229492, "global_step": 399059, "epoch": 4807} {"train_loss": -26.71405601501465, "global_step": 399060, "epoch": 4807} {"train_loss": -26.1507625579834, "global_step": 399061, "epoch": 4807} {"train_loss": -26.0109920501709, "global_step": 399062, "epoch": 4807} {"train_loss": -26.47856932950307, "global_step": 399063, "epoch": 4807, "val_loss": 6748361.0} {"train_loss": -25.48024559020996, "global_step": 399064, "epoch": 4808} {"train_loss": -25.120359420776367, "global_step": 399065, "epoch": 4808} {"train_loss": -25.068382263183594, "global_step": 399066, "epoch": 4808} {"train_loss": -25.078462600708008, "global_step": 399067, "epoch": 4808} {"train_loss": -25.76724624633789, "global_step": 399068, "epoch": 4808} {"train_loss": -25.762556076049805, "global_step": 399069, "epoch": 4808} {"train_loss": -25.54275894165039, "global_step": 399070, "epoch": 4808} {"train_loss": -25.358251571655273, "global_step": 399071, "epoch": 4808} {"train_loss": -25.960098266601562, "global_step": 399072, "epoch": 4808} {"train_loss": -25.65188980102539, "global_step": 399073, "epoch": 4808} {"train_loss": -25.466115951538086, "global_step": 399074, "epoch": 4808} {"train_loss": -25.31573486328125, "global_step": 399075, "epoch": 4808} {"train_loss": -25.460224151611328, "global_step": 399076, "epoch": 4808} {"train_loss": -25.7346248626709, "global_step": 399077, "epoch": 4808} {"train_loss": -25.875463485717773, "global_step": 399078, "epoch": 4808} {"train_loss": -25.98356056213379, "global_step": 399079, "epoch": 4808} {"train_loss": -26.01120376586914, "global_step": 399080, "epoch": 4808} {"train_loss": -26.36931800842285, "global_step": 399081, "epoch": 4808} {"train_loss": -25.856592178344727, "global_step": 399082, "epoch": 4808} {"train_loss": -26.14969825744629, "global_step": 399083, "epoch": 4808} {"train_loss": -26.183313369750977, "global_step": 399084, "epoch": 4808} {"train_loss": -25.91128921508789, "global_step": 399085, "epoch": 4808} {"train_loss": -26.316009521484375, "global_step": 399086, "epoch": 4808} {"train_loss": -26.181182861328125, "global_step": 399087, "epoch": 4808} {"train_loss": -26.19131851196289, "global_step": 399088, "epoch": 4808} {"train_loss": -26.317792892456055, "global_step": 399089, "epoch": 4808} {"train_loss": -26.174535751342773, "global_step": 399090, "epoch": 4808} {"train_loss": -26.66815185546875, "global_step": 399091, "epoch": 4808} {"train_loss": -26.488330841064453, "global_step": 399092, "epoch": 4808} {"train_loss": -26.63837242126465, "global_step": 399093, "epoch": 4808} {"train_loss": -26.624347686767578, "global_step": 399094, "epoch": 4808} {"train_loss": -26.49753761291504, "global_step": 399095, "epoch": 4808} {"train_loss": -26.61543083190918, "global_step": 399096, "epoch": 4808} {"train_loss": -26.4085636138916, "global_step": 399097, "epoch": 4808} {"train_loss": -26.441213607788086, "global_step": 399098, "epoch": 4808} {"train_loss": -26.394758224487305, "global_step": 399099, "epoch": 4808} {"train_loss": -26.310205459594727, "global_step": 399100, "epoch": 4808} {"train_loss": -26.6404972076416, "global_step": 399101, "epoch": 4808} {"train_loss": -26.774831771850586, "global_step": 399102, "epoch": 4808} {"train_loss": -26.26479148864746, "global_step": 399103, "epoch": 4808} {"train_loss": -26.751102447509766, "global_step": 399104, "epoch": 4808} {"train_loss": -26.510663986206055, "global_step": 399105, "epoch": 4808} {"train_loss": -26.499853134155273, "global_step": 399106, "epoch": 4808} {"train_loss": -26.057498931884766, "global_step": 399107, "epoch": 4808} {"train_loss": -26.4682559967041, "global_step": 399108, "epoch": 4808} {"train_loss": -26.631591796875, "global_step": 399109, "epoch": 4808} {"train_loss": -26.427072525024414, "global_step": 399110, "epoch": 4808} {"train_loss": -26.42844009399414, "global_step": 399111, "epoch": 4808} {"train_loss": -26.251434326171875, "global_step": 399112, "epoch": 4808} {"train_loss": -26.84735107421875, "global_step": 399113, "epoch": 4808} {"train_loss": -26.93851661682129, "global_step": 399114, "epoch": 4808} {"train_loss": -26.6295223236084, "global_step": 399115, "epoch": 4808} {"train_loss": -26.622900009155273, "global_step": 399116, "epoch": 4808} {"train_loss": -26.611881256103516, "global_step": 399117, "epoch": 4808} {"train_loss": -26.783416748046875, "global_step": 399118, "epoch": 4808} {"train_loss": -26.513763427734375, "global_step": 399119, "epoch": 4808} {"train_loss": -26.99778175354004, "global_step": 399120, "epoch": 4808} {"train_loss": -26.821584701538086, "global_step": 399121, "epoch": 4808} {"train_loss": -26.62714958190918, "global_step": 399122, "epoch": 4808} {"train_loss": -26.600061416625977, "global_step": 399123, "epoch": 4808} {"train_loss": -26.325607299804688, "global_step": 399124, "epoch": 4808} {"train_loss": -26.21662712097168, "global_step": 399125, "epoch": 4808} {"train_loss": -26.80622673034668, "global_step": 399126, "epoch": 4808} {"train_loss": -26.942310333251953, "global_step": 399127, "epoch": 4808} {"train_loss": -26.502424240112305, "global_step": 399128, "epoch": 4808} {"train_loss": -26.600149154663086, "global_step": 399129, "epoch": 4808} {"train_loss": -26.6415958404541, "global_step": 399130, "epoch": 4808} {"train_loss": -26.376773834228516, "global_step": 399131, "epoch": 4808} {"train_loss": -26.262653350830078, "global_step": 399132, "epoch": 4808} {"train_loss": -26.817121505737305, "global_step": 399133, "epoch": 4808} {"train_loss": -26.94037437438965, "global_step": 399134, "epoch": 4808} {"train_loss": -26.81878662109375, "global_step": 399135, "epoch": 4808} {"train_loss": -26.520116806030273, "global_step": 399136, "epoch": 4808} {"train_loss": -26.944868087768555, "global_step": 399137, "epoch": 4808} {"train_loss": -26.461048126220703, "global_step": 399138, "epoch": 4808} {"train_loss": -26.673349380493164, "global_step": 399139, "epoch": 4808} {"train_loss": -26.518356323242188, "global_step": 399140, "epoch": 4808} {"train_loss": -26.8677921295166, "global_step": 399141, "epoch": 4808} {"train_loss": -26.7802677154541, "global_step": 399142, "epoch": 4808} {"train_loss": -26.610076904296875, "global_step": 399143, "epoch": 4808} {"train_loss": -26.503040313720703, "global_step": 399144, "epoch": 4808} {"train_loss": -26.540664672851562, "global_step": 399145, "epoch": 4808} {"train_loss": -26.335211052952044, "global_step": 399146, "epoch": 4808, "val_loss": 6772751.0} {"train_loss": -24.703227996826172, "global_step": 399147, "epoch": 4809} {"train_loss": -25.100690841674805, "global_step": 399148, "epoch": 4809} {"train_loss": -24.912141799926758, "global_step": 399149, "epoch": 4809} {"train_loss": -25.347824096679688, "global_step": 399150, "epoch": 4809} {"train_loss": -25.83613395690918, "global_step": 399151, "epoch": 4809} {"train_loss": -25.104684829711914, "global_step": 399152, "epoch": 4809} {"train_loss": -25.827268600463867, "global_step": 399153, "epoch": 4809} {"train_loss": -25.45650291442871, "global_step": 399154, "epoch": 4809} {"train_loss": -25.824665069580078, "global_step": 399155, "epoch": 4809} {"train_loss": -25.460988998413086, "global_step": 399156, "epoch": 4809} {"train_loss": -25.827573776245117, "global_step": 399157, "epoch": 4809} {"train_loss": -25.80201530456543, "global_step": 399158, "epoch": 4809} {"train_loss": -26.003692626953125, "global_step": 399159, "epoch": 4809} {"train_loss": -26.14946937561035, "global_step": 399160, "epoch": 4809} {"train_loss": -26.253889083862305, "global_step": 399161, "epoch": 4809} {"train_loss": -25.91900062561035, "global_step": 399162, "epoch": 4809} {"train_loss": -26.105985641479492, "global_step": 399163, "epoch": 4809} {"train_loss": -25.95576286315918, "global_step": 399164, "epoch": 4809} {"train_loss": -25.88100242614746, "global_step": 399165, "epoch": 4809} {"train_loss": -26.640050888061523, "global_step": 399166, "epoch": 4809} {"train_loss": -26.244535446166992, "global_step": 399167, "epoch": 4809} {"train_loss": -26.20954704284668, "global_step": 399168, "epoch": 4809} {"train_loss": -26.322601318359375, "global_step": 399169, "epoch": 4809} {"train_loss": -26.169342041015625, "global_step": 399170, "epoch": 4809} {"train_loss": -26.240055084228516, "global_step": 399171, "epoch": 4809} {"train_loss": -26.500608444213867, "global_step": 399172, "epoch": 4809} {"train_loss": -26.216482162475586, "global_step": 399173, "epoch": 4809} {"train_loss": -26.58723258972168, "global_step": 399174, "epoch": 4809} {"train_loss": -26.57557487487793, "global_step": 399175, "epoch": 4809} {"train_loss": -26.682788848876953, "global_step": 399176, "epoch": 4809} {"train_loss": -26.60553550720215, "global_step": 399177, "epoch": 4809} {"train_loss": -26.40178871154785, "global_step": 399178, "epoch": 4809} {"train_loss": -26.349018096923828, "global_step": 399179, "epoch": 4809} {"train_loss": -26.3897647857666, "global_step": 399180, "epoch": 4809} {"train_loss": -26.734699249267578, "global_step": 399181, "epoch": 4809} {"train_loss": -26.89316749572754, "global_step": 399182, "epoch": 4809} {"train_loss": -26.5443115234375, "global_step": 399183, "epoch": 4809} {"train_loss": -26.52229881286621, "global_step": 399184, "epoch": 4809} {"train_loss": -26.327880859375, "global_step": 399185, "epoch": 4809} {"train_loss": -26.459381103515625, "global_step": 399186, "epoch": 4809} {"train_loss": -26.711618423461914, "global_step": 399187, "epoch": 4809} {"train_loss": -26.703603744506836, "global_step": 399188, "epoch": 4809} {"train_loss": -26.57940673828125, "global_step": 399189, "epoch": 4809} {"train_loss": -26.448551177978516, "global_step": 399190, "epoch": 4809} {"train_loss": -25.646625518798828, "global_step": 399191, "epoch": 4809} {"train_loss": -25.853708267211914, "global_step": 399192, "epoch": 4809} {"train_loss": -26.68244743347168, "global_step": 399193, "epoch": 4809} {"train_loss": -26.26322364807129, "global_step": 399194, "epoch": 4809} {"train_loss": -25.502174377441406, "global_step": 399195, "epoch": 4809} {"train_loss": -26.4675350189209, "global_step": 399196, "epoch": 4809} {"train_loss": -26.04047203063965, "global_step": 399197, "epoch": 4809} {"train_loss": -26.3160343170166, "global_step": 399198, "epoch": 4809} {"train_loss": -26.27410316467285, "global_step": 399199, "epoch": 4809} {"train_loss": -26.379785537719727, "global_step": 399200, "epoch": 4809} {"train_loss": -26.660932540893555, "global_step": 399201, "epoch": 4809} {"train_loss": -26.529199600219727, "global_step": 399202, "epoch": 4809} {"train_loss": -26.619659423828125, "global_step": 399203, "epoch": 4809} {"train_loss": -26.901611328125, "global_step": 399204, "epoch": 4809} {"train_loss": -26.37537956237793, "global_step": 399205, "epoch": 4809} {"train_loss": -26.472631454467773, "global_step": 399206, "epoch": 4809} {"train_loss": -26.21486473083496, "global_step": 399207, "epoch": 4809} {"train_loss": -26.564395904541016, "global_step": 399208, "epoch": 4809} {"train_loss": -26.66022300720215, "global_step": 399209, "epoch": 4809} {"train_loss": -26.382251739501953, "global_step": 399210, "epoch": 4809} {"train_loss": -26.424036026000977, "global_step": 399211, "epoch": 4809} {"train_loss": -26.8843994140625, "global_step": 399212, "epoch": 4809} {"train_loss": -26.60749626159668, "global_step": 399213, "epoch": 4809} {"train_loss": -26.483997344970703, "global_step": 399214, "epoch": 4809} {"train_loss": -26.781675338745117, "global_step": 399215, "epoch": 4809} {"train_loss": -26.610620498657227, "global_step": 399216, "epoch": 4809} {"train_loss": -26.384387969970703, "global_step": 399217, "epoch": 4809} {"train_loss": -26.489526748657227, "global_step": 399218, "epoch": 4809} {"train_loss": -26.472003936767578, "global_step": 399219, "epoch": 4809} {"train_loss": -26.571430206298828, "global_step": 399220, "epoch": 4809} {"train_loss": -26.80695915222168, "global_step": 399221, "epoch": 4809} {"train_loss": -26.00105094909668, "global_step": 399222, "epoch": 4809} {"train_loss": -26.90716552734375, "global_step": 399223, "epoch": 4809} {"train_loss": -26.440351486206055, "global_step": 399224, "epoch": 4809} {"train_loss": -27.291275024414062, "global_step": 399225, "epoch": 4809} {"train_loss": -26.567174911499023, "global_step": 399226, "epoch": 4809} {"train_loss": -26.38612937927246, "global_step": 399227, "epoch": 4809} {"train_loss": -26.146764755249023, "global_step": 399228, "epoch": 4809} {"train_loss": -26.279402399637615, "global_step": 399229, "epoch": 4809, "val_loss": 6627000.5} {"train_loss": -25.333642959594727, "global_step": 399230, "epoch": 4810} {"train_loss": -25.928308486938477, "global_step": 399231, "epoch": 4810} {"train_loss": -25.660419464111328, "global_step": 399232, "epoch": 4810} {"train_loss": -25.948705673217773, "global_step": 399233, "epoch": 4810} {"train_loss": -26.312788009643555, "global_step": 399234, "epoch": 4810} {"train_loss": -26.006607055664062, "global_step": 399235, "epoch": 4810} {"train_loss": -26.5064754486084, "global_step": 399236, "epoch": 4810} {"train_loss": -26.02515983581543, "global_step": 399237, "epoch": 4810} {"train_loss": -26.38516616821289, "global_step": 399238, "epoch": 4810} {"train_loss": -26.140029907226562, "global_step": 399239, "epoch": 4810} {"train_loss": -25.949438095092773, "global_step": 399240, "epoch": 4810} {"train_loss": -26.3870849609375, "global_step": 399241, "epoch": 4810} {"train_loss": -26.464435577392578, "global_step": 399242, "epoch": 4810} {"train_loss": -26.5892276763916, "global_step": 399243, "epoch": 4810} {"train_loss": -26.6276798248291, "global_step": 399244, "epoch": 4810} {"train_loss": -26.671844482421875, "global_step": 399245, "epoch": 4810} {"train_loss": -26.65349769592285, "global_step": 399246, "epoch": 4810} {"train_loss": -26.389358520507812, "global_step": 399247, "epoch": 4810} {"train_loss": -26.67305564880371, "global_step": 399248, "epoch": 4810} {"train_loss": -26.389657974243164, "global_step": 399249, "epoch": 4810} {"train_loss": -26.283802032470703, "global_step": 399250, "epoch": 4810} {"train_loss": -26.568273544311523, "global_step": 399251, "epoch": 4810} {"train_loss": -26.41636085510254, "global_step": 399252, "epoch": 4810} {"train_loss": -26.742359161376953, "global_step": 399253, "epoch": 4810} {"train_loss": -26.476911544799805, "global_step": 399254, "epoch": 4810} {"train_loss": -26.863391876220703, "global_step": 399255, "epoch": 4810} {"train_loss": -26.905542373657227, "global_step": 399256, "epoch": 4810} {"train_loss": -26.541242599487305, "global_step": 399257, "epoch": 4810} {"train_loss": -26.956562042236328, "global_step": 399258, "epoch": 4810} {"train_loss": -26.665090560913086, "global_step": 399259, "epoch": 4810} {"train_loss": -26.513891220092773, "global_step": 399260, "epoch": 4810} {"train_loss": -26.582616806030273, "global_step": 399261, "epoch": 4810} {"train_loss": -26.7343807220459, "global_step": 399262, "epoch": 4810} {"train_loss": -26.502609252929688, "global_step": 399263, "epoch": 4810} {"train_loss": -26.791479110717773, "global_step": 399264, "epoch": 4810} {"train_loss": -26.635934829711914, "global_step": 399265, "epoch": 4810} {"train_loss": -27.022626876831055, "global_step": 399266, "epoch": 4810} {"train_loss": -26.871479034423828, "global_step": 399267, "epoch": 4810} {"train_loss": -26.77155876159668, "global_step": 399268, "epoch": 4810} {"train_loss": -26.62837791442871, "global_step": 399269, "epoch": 4810} {"train_loss": -25.933319091796875, "global_step": 399270, "epoch": 4810} {"train_loss": -25.517797470092773, "global_step": 399271, "epoch": 4810} {"train_loss": -25.69209098815918, "global_step": 399272, "epoch": 4810} {"train_loss": -26.212636947631836, "global_step": 399273, "epoch": 4810} {"train_loss": -26.1395263671875, "global_step": 399274, "epoch": 4810} {"train_loss": -26.60654067993164, "global_step": 399275, "epoch": 4810} {"train_loss": -26.441511154174805, "global_step": 399276, "epoch": 4810} {"train_loss": -26.69414710998535, "global_step": 399277, "epoch": 4810} {"train_loss": -26.692840576171875, "global_step": 399278, "epoch": 4810} {"train_loss": -26.596405029296875, "global_step": 399279, "epoch": 4810} {"train_loss": -26.72983741760254, "global_step": 399280, "epoch": 4810} {"train_loss": -26.39361572265625, "global_step": 399281, "epoch": 4810} {"train_loss": -26.561553955078125, "global_step": 399282, "epoch": 4810} {"train_loss": -26.55170249938965, "global_step": 399283, "epoch": 4810} {"train_loss": -26.967315673828125, "global_step": 399284, "epoch": 4810} {"train_loss": -26.155872344970703, "global_step": 399285, "epoch": 4810} {"train_loss": -26.9383487701416, "global_step": 399286, "epoch": 4810} {"train_loss": -26.879255294799805, "global_step": 399287, "epoch": 4810} {"train_loss": -26.339853286743164, "global_step": 399288, "epoch": 4810} {"train_loss": -26.66438865661621, "global_step": 399289, "epoch": 4810} {"train_loss": -26.573644638061523, "global_step": 399290, "epoch": 4810} {"train_loss": -26.482589721679688, "global_step": 399291, "epoch": 4810} {"train_loss": -26.13218116760254, "global_step": 399292, "epoch": 4810} {"train_loss": -25.966527938842773, "global_step": 399293, "epoch": 4810} {"train_loss": -26.466278076171875, "global_step": 399294, "epoch": 4810} {"train_loss": -26.7620906829834, "global_step": 399295, "epoch": 4810} {"train_loss": -26.602643966674805, "global_step": 399296, "epoch": 4810} {"train_loss": -26.842199325561523, "global_step": 399297, "epoch": 4810} {"train_loss": -26.496183395385742, "global_step": 399298, "epoch": 4810} {"train_loss": -26.740859985351562, "global_step": 399299, "epoch": 4810} {"train_loss": -26.293481826782227, "global_step": 399300, "epoch": 4810} {"train_loss": -26.455448150634766, "global_step": 399301, "epoch": 4810} {"train_loss": -26.706695556640625, "global_step": 399302, "epoch": 4810} {"train_loss": -27.062793731689453, "global_step": 399303, "epoch": 4810} {"train_loss": -26.527368545532227, "global_step": 399304, "epoch": 4810} {"train_loss": -26.979511260986328, "global_step": 399305, "epoch": 4810} {"train_loss": -26.858936309814453, "global_step": 399306, "epoch": 4810} {"train_loss": -26.77225685119629, "global_step": 399307, "epoch": 4810} {"train_loss": -26.646020889282227, "global_step": 399308, "epoch": 4810} {"train_loss": -26.950653076171875, "global_step": 399309, "epoch": 4810} {"train_loss": -26.843189239501953, "global_step": 399310, "epoch": 4810} {"train_loss": -26.496057510375977, "global_step": 399311, "epoch": 4810} {"train_loss": -26.51444864847574, "global_step": 399312, "epoch": 4810, "val_loss": 6686446.5} {"train_loss": -23.1903076171875, "global_step": 399313, "epoch": 4811} {"train_loss": -24.773731231689453, "global_step": 399314, "epoch": 4811} {"train_loss": -24.441913604736328, "global_step": 399315, "epoch": 4811} {"train_loss": -24.96673011779785, "global_step": 399316, "epoch": 4811} {"train_loss": -24.361711502075195, "global_step": 399317, "epoch": 4811} {"train_loss": -25.345436096191406, "global_step": 399318, "epoch": 4811} {"train_loss": -25.10614585876465, "global_step": 399319, "epoch": 4811} {"train_loss": -25.093963623046875, "global_step": 399320, "epoch": 4811} {"train_loss": -25.50214195251465, "global_step": 399321, "epoch": 4811} {"train_loss": -25.580373764038086, "global_step": 399322, "epoch": 4811} {"train_loss": -25.4715518951416, "global_step": 399323, "epoch": 4811} {"train_loss": -25.759428024291992, "global_step": 399324, "epoch": 4811} {"train_loss": -25.996362686157227, "global_step": 399325, "epoch": 4811} {"train_loss": -25.58155059814453, "global_step": 399326, "epoch": 4811} {"train_loss": -25.213117599487305, "global_step": 399327, "epoch": 4811} {"train_loss": -25.646169662475586, "global_step": 399328, "epoch": 4811} {"train_loss": -26.09441566467285, "global_step": 399329, "epoch": 4811} {"train_loss": -26.09974479675293, "global_step": 399330, "epoch": 4811} {"train_loss": -26.122655868530273, "global_step": 399331, "epoch": 4811} {"train_loss": -25.8715877532959, "global_step": 399332, "epoch": 4811} {"train_loss": -25.851144790649414, "global_step": 399333, "epoch": 4811} {"train_loss": -26.01373863220215, "global_step": 399334, "epoch": 4811} {"train_loss": -26.080026626586914, "global_step": 399335, "epoch": 4811} {"train_loss": -25.74564552307129, "global_step": 399336, "epoch": 4811} {"train_loss": -26.417936325073242, "global_step": 399337, "epoch": 4811} {"train_loss": -26.239206314086914, "global_step": 399338, "epoch": 4811} {"train_loss": -26.03120231628418, "global_step": 399339, "epoch": 4811} {"train_loss": -26.14804458618164, "global_step": 399340, "epoch": 4811} {"train_loss": -26.14824867248535, "global_step": 399341, "epoch": 4811} {"train_loss": -26.3024959564209, "global_step": 399342, "epoch": 4811} {"train_loss": -26.133319854736328, "global_step": 399343, "epoch": 4811} {"train_loss": -26.0009822845459, "global_step": 399344, "epoch": 4811} {"train_loss": -26.27790641784668, "global_step": 399345, "epoch": 4811} {"train_loss": -26.109745025634766, "global_step": 399346, "epoch": 4811} {"train_loss": -26.477109909057617, "global_step": 399347, "epoch": 4811} {"train_loss": -26.239017486572266, "global_step": 399348, "epoch": 4811} {"train_loss": -26.24308204650879, "global_step": 399349, "epoch": 4811} {"train_loss": -26.08746910095215, "global_step": 399350, "epoch": 4811} {"train_loss": -26.4200439453125, "global_step": 399351, "epoch": 4811} {"train_loss": -26.43812370300293, "global_step": 399352, "epoch": 4811} {"train_loss": -26.799072265625, "global_step": 399353, "epoch": 4811} {"train_loss": -26.780954360961914, "global_step": 399354, "epoch": 4811} {"train_loss": -26.580121994018555, "global_step": 399355, "epoch": 4811} {"train_loss": -26.174942016601562, "global_step": 399356, "epoch": 4811} {"train_loss": -26.359272003173828, "global_step": 399357, "epoch": 4811} {"train_loss": -26.3031005859375, "global_step": 399358, "epoch": 4811} {"train_loss": -26.426868438720703, "global_step": 399359, "epoch": 4811} {"train_loss": -26.592029571533203, "global_step": 399360, "epoch": 4811} {"train_loss": -26.43878746032715, "global_step": 399361, "epoch": 4811} {"train_loss": -26.76226806640625, "global_step": 399362, "epoch": 4811} {"train_loss": -26.5682373046875, "global_step": 399363, "epoch": 4811} {"train_loss": -26.262617111206055, "global_step": 399364, "epoch": 4811} {"train_loss": -26.62259864807129, "global_step": 399365, "epoch": 4811} {"train_loss": -26.43250846862793, "global_step": 399366, "epoch": 4811} {"train_loss": -26.63738441467285, "global_step": 399367, "epoch": 4811} {"train_loss": -26.535736083984375, "global_step": 399368, "epoch": 4811} {"train_loss": -26.46005630493164, "global_step": 399369, "epoch": 4811} {"train_loss": -26.383594512939453, "global_step": 399370, "epoch": 4811} {"train_loss": -26.438018798828125, "global_step": 399371, "epoch": 4811} {"train_loss": -26.845102310180664, "global_step": 399372, "epoch": 4811} {"train_loss": -26.405975341796875, "global_step": 399373, "epoch": 4811} {"train_loss": -26.532922744750977, "global_step": 399374, "epoch": 4811} {"train_loss": -26.657190322875977, "global_step": 399375, "epoch": 4811} {"train_loss": -26.785715103149414, "global_step": 399376, "epoch": 4811} {"train_loss": -26.566761016845703, "global_step": 399377, "epoch": 4811} {"train_loss": -26.4837703704834, "global_step": 399378, "epoch": 4811} {"train_loss": -26.779489517211914, "global_step": 399379, "epoch": 4811} {"train_loss": -26.886337280273438, "global_step": 399380, "epoch": 4811} {"train_loss": -26.68739891052246, "global_step": 399381, "epoch": 4811} {"train_loss": -26.911041259765625, "global_step": 399382, "epoch": 4811} {"train_loss": -26.801410675048828, "global_step": 399383, "epoch": 4811} {"train_loss": -26.56989860534668, "global_step": 399384, "epoch": 4811} {"train_loss": -26.71742820739746, "global_step": 399385, "epoch": 4811} {"train_loss": -27.277881622314453, "global_step": 399386, "epoch": 4811} {"train_loss": -26.467199325561523, "global_step": 399387, "epoch": 4811} {"train_loss": -26.129932403564453, "global_step": 399388, "epoch": 4811} {"train_loss": -26.51953125, "global_step": 399389, "epoch": 4811} {"train_loss": -26.2423152923584, "global_step": 399390, "epoch": 4811} {"train_loss": -26.4565372467041, "global_step": 399391, "epoch": 4811} {"train_loss": -26.754491806030273, "global_step": 399392, "epoch": 4811} {"train_loss": -26.567914962768555, "global_step": 399393, "epoch": 4811} {"train_loss": -26.665008544921875, "global_step": 399394, "epoch": 4811} {"train_loss": -26.189028774399354, "global_step": 399395, "epoch": 4811, "val_loss": 6838596.5} {"train_loss": -26.189062118530273, "global_step": 399396, "epoch": 4812} {"train_loss": -26.170440673828125, "global_step": 399397, "epoch": 4812} {"train_loss": -26.0368709564209, "global_step": 399398, "epoch": 4812} {"train_loss": -26.141544342041016, "global_step": 399399, "epoch": 4812} {"train_loss": -26.63080406188965, "global_step": 399400, "epoch": 4812} {"train_loss": -26.32374382019043, "global_step": 399401, "epoch": 4812} {"train_loss": -26.345783233642578, "global_step": 399402, "epoch": 4812} {"train_loss": -26.38454246520996, "global_step": 399403, "epoch": 4812} {"train_loss": -26.80543327331543, "global_step": 399404, "epoch": 4812} {"train_loss": -26.410837173461914, "global_step": 399405, "epoch": 4812} {"train_loss": -26.843881607055664, "global_step": 399406, "epoch": 4812} {"train_loss": -26.48005485534668, "global_step": 399407, "epoch": 4812} {"train_loss": -26.617528915405273, "global_step": 399408, "epoch": 4812} {"train_loss": -26.25101089477539, "global_step": 399409, "epoch": 4812} {"train_loss": -26.8161678314209, "global_step": 399410, "epoch": 4812} {"train_loss": -26.677541732788086, "global_step": 399411, "epoch": 4812} {"train_loss": -26.51385498046875, "global_step": 399412, "epoch": 4812} {"train_loss": -26.502857208251953, "global_step": 399413, "epoch": 4812} {"train_loss": -26.501209259033203, "global_step": 399414, "epoch": 4812} {"train_loss": -26.47637367248535, "global_step": 399415, "epoch": 4812} {"train_loss": -26.733991622924805, "global_step": 399416, "epoch": 4812} {"train_loss": -26.639509201049805, "global_step": 399417, "epoch": 4812} {"train_loss": -26.49114418029785, "global_step": 399418, "epoch": 4812} {"train_loss": -26.5350284576416, "global_step": 399419, "epoch": 4812} {"train_loss": -26.5406494140625, "global_step": 399420, "epoch": 4812} {"train_loss": -26.449705123901367, "global_step": 399421, "epoch": 4812} {"train_loss": -26.247467041015625, "global_step": 399422, "epoch": 4812} {"train_loss": -26.986989974975586, "global_step": 399423, "epoch": 4812} {"train_loss": -26.68511962890625, "global_step": 399424, "epoch": 4812} {"train_loss": -26.96131706237793, "global_step": 399425, "epoch": 4812} {"train_loss": -26.78428077697754, "global_step": 399426, "epoch": 4812} {"train_loss": -26.714879989624023, "global_step": 399427, "epoch": 4812} {"train_loss": -26.67352867126465, "global_step": 399428, "epoch": 4812} {"train_loss": -26.805204391479492, "global_step": 399429, "epoch": 4812} {"train_loss": -26.576618194580078, "global_step": 399430, "epoch": 4812} {"train_loss": -26.770471572875977, "global_step": 399431, "epoch": 4812} {"train_loss": -26.419458389282227, "global_step": 399432, "epoch": 4812} {"train_loss": -26.58558464050293, "global_step": 399433, "epoch": 4812} {"train_loss": -26.919696807861328, "global_step": 399434, "epoch": 4812} {"train_loss": -26.83481788635254, "global_step": 399435, "epoch": 4812} {"train_loss": -26.42854881286621, "global_step": 399436, "epoch": 4812} {"train_loss": -26.474042892456055, "global_step": 399437, "epoch": 4812} {"train_loss": -26.6390380859375, "global_step": 399438, "epoch": 4812} {"train_loss": -26.550954818725586, "global_step": 399439, "epoch": 4812} {"train_loss": -26.752857208251953, "global_step": 399440, "epoch": 4812} {"train_loss": -26.622451782226562, "global_step": 399441, "epoch": 4812} {"train_loss": -26.978071212768555, "global_step": 399442, "epoch": 4812} {"train_loss": -26.785324096679688, "global_step": 399443, "epoch": 4812} {"train_loss": -26.955890655517578, "global_step": 399444, "epoch": 4812} {"train_loss": -26.671178817749023, "global_step": 399445, "epoch": 4812} {"train_loss": -26.770923614501953, "global_step": 399446, "epoch": 4812} {"train_loss": -26.208316802978516, "global_step": 399447, "epoch": 4812} {"train_loss": -26.70576286315918, "global_step": 399448, "epoch": 4812} {"train_loss": -26.394744873046875, "global_step": 399449, "epoch": 4812} {"train_loss": -26.92012596130371, "global_step": 399450, "epoch": 4812} {"train_loss": -26.193695068359375, "global_step": 399451, "epoch": 4812} {"train_loss": -26.553251266479492, "global_step": 399452, "epoch": 4812} {"train_loss": -26.029834747314453, "global_step": 399453, "epoch": 4812} {"train_loss": -26.265867233276367, "global_step": 399454, "epoch": 4812} {"train_loss": -26.777545928955078, "global_step": 399455, "epoch": 4812} {"train_loss": -26.74213981628418, "global_step": 399456, "epoch": 4812} {"train_loss": -26.77406120300293, "global_step": 399457, "epoch": 4812} {"train_loss": -26.819639205932617, "global_step": 399458, "epoch": 4812} {"train_loss": -26.290441513061523, "global_step": 399459, "epoch": 4812} {"train_loss": -26.46420669555664, "global_step": 399460, "epoch": 4812} {"train_loss": -27.1746883392334, "global_step": 399461, "epoch": 4812} {"train_loss": -26.760242462158203, "global_step": 399462, "epoch": 4812} {"train_loss": -26.62543296813965, "global_step": 399463, "epoch": 4812} {"train_loss": -26.61746597290039, "global_step": 399464, "epoch": 4812} {"train_loss": -26.43938636779785, "global_step": 399465, "epoch": 4812} {"train_loss": -26.756433486938477, "global_step": 399466, "epoch": 4812} {"train_loss": -26.789899826049805, "global_step": 399467, "epoch": 4812} {"train_loss": -26.7277774810791, "global_step": 399468, "epoch": 4812} {"train_loss": -26.39837646484375, "global_step": 399469, "epoch": 4812} {"train_loss": -26.6395263671875, "global_step": 399470, "epoch": 4812} {"train_loss": -26.5943603515625, "global_step": 399471, "epoch": 4812} {"train_loss": -26.495635986328125, "global_step": 399472, "epoch": 4812} {"train_loss": -26.5657958984375, "global_step": 399473, "epoch": 4812} {"train_loss": -26.855758666992188, "global_step": 399474, "epoch": 4812} {"train_loss": -26.414661407470703, "global_step": 399475, "epoch": 4812} {"train_loss": -26.785842895507812, "global_step": 399476, "epoch": 4812} {"train_loss": -26.70624351501465, "global_step": 399477, "epoch": 4812} {"train_loss": -26.58327217561653, "global_step": 399478, "epoch": 4812, "val_loss": 6737600.0} {"train_loss": -26.124267578125, "global_step": 399479, "epoch": 4813} {"train_loss": -26.068098068237305, "global_step": 399480, "epoch": 4813} {"train_loss": -25.830896377563477, "global_step": 399481, "epoch": 4813} {"train_loss": -25.98072624206543, "global_step": 399482, "epoch": 4813} {"train_loss": -25.741687774658203, "global_step": 399483, "epoch": 4813} {"train_loss": -26.3616943359375, "global_step": 399484, "epoch": 4813} {"train_loss": -25.602262496948242, "global_step": 399485, "epoch": 4813} {"train_loss": -26.3328800201416, "global_step": 399486, "epoch": 4813} {"train_loss": -26.640552520751953, "global_step": 399487, "epoch": 4813} {"train_loss": -26.236602783203125, "global_step": 399488, "epoch": 4813} {"train_loss": -26.32501792907715, "global_step": 399489, "epoch": 4813} {"train_loss": -26.438024520874023, "global_step": 399490, "epoch": 4813} {"train_loss": -26.514209747314453, "global_step": 399491, "epoch": 4813} {"train_loss": -26.271066665649414, "global_step": 399492, "epoch": 4813} {"train_loss": -26.262502670288086, "global_step": 399493, "epoch": 4813} {"train_loss": -26.630125045776367, "global_step": 399494, "epoch": 4813} {"train_loss": -26.15170669555664, "global_step": 399495, "epoch": 4813} {"train_loss": -26.07822036743164, "global_step": 399496, "epoch": 4813} {"train_loss": -26.456817626953125, "global_step": 399497, "epoch": 4813} {"train_loss": -26.899290084838867, "global_step": 399498, "epoch": 4813} {"train_loss": -26.178424835205078, "global_step": 399499, "epoch": 4813} {"train_loss": -26.440587997436523, "global_step": 399500, "epoch": 4813} {"train_loss": -26.39823341369629, "global_step": 399501, "epoch": 4813} {"train_loss": -26.554960250854492, "global_step": 399502, "epoch": 4813} {"train_loss": -26.443273544311523, "global_step": 399503, "epoch": 4813} {"train_loss": -26.606008529663086, "global_step": 399504, "epoch": 4813} {"train_loss": -26.352636337280273, "global_step": 399505, "epoch": 4813} {"train_loss": -26.730010986328125, "global_step": 399506, "epoch": 4813} {"train_loss": -26.9018497467041, "global_step": 399507, "epoch": 4813} {"train_loss": -26.900049209594727, "global_step": 399508, "epoch": 4813} {"train_loss": -26.93631935119629, "global_step": 399509, "epoch": 4813} {"train_loss": -26.728601455688477, "global_step": 399510, "epoch": 4813} {"train_loss": -26.501007080078125, "global_step": 399511, "epoch": 4813} {"train_loss": -26.701892852783203, "global_step": 399512, "epoch": 4813} {"train_loss": -26.78455924987793, "global_step": 399513, "epoch": 4813} {"train_loss": -26.61051368713379, "global_step": 399514, "epoch": 4813} {"train_loss": -26.92449378967285, "global_step": 399515, "epoch": 4813} {"train_loss": -27.191837310791016, "global_step": 399516, "epoch": 4813} {"train_loss": -26.717077255249023, "global_step": 399517, "epoch": 4813} {"train_loss": -26.961688995361328, "global_step": 399518, "epoch": 4813} {"train_loss": -26.928802490234375, "global_step": 399519, "epoch": 4813} {"train_loss": -26.806371688842773, "global_step": 399520, "epoch": 4813} {"train_loss": -26.317596435546875, "global_step": 399521, "epoch": 4813} {"train_loss": -26.38504981994629, "global_step": 399522, "epoch": 4813} {"train_loss": -26.428552627563477, "global_step": 399523, "epoch": 4813} {"train_loss": -26.896448135375977, "global_step": 399524, "epoch": 4813} {"train_loss": -26.5653133392334, "global_step": 399525, "epoch": 4813} {"train_loss": -26.291259765625, "global_step": 399526, "epoch": 4813} {"train_loss": -26.98105239868164, "global_step": 399527, "epoch": 4813} {"train_loss": -26.59528923034668, "global_step": 399528, "epoch": 4813} {"train_loss": -26.3696231842041, "global_step": 399529, "epoch": 4813} {"train_loss": -26.742650985717773, "global_step": 399530, "epoch": 4813} {"train_loss": -26.320648193359375, "global_step": 399531, "epoch": 4813} {"train_loss": -26.508081436157227, "global_step": 399532, "epoch": 4813} {"train_loss": -26.70863151550293, "global_step": 399533, "epoch": 4813} {"train_loss": -26.05010414123535, "global_step": 399534, "epoch": 4813} {"train_loss": -26.943017959594727, "global_step": 399535, "epoch": 4813} {"train_loss": -26.514596939086914, "global_step": 399536, "epoch": 4813} {"train_loss": -26.690786361694336, "global_step": 399537, "epoch": 4813} {"train_loss": -26.46584129333496, "global_step": 399538, "epoch": 4813} {"train_loss": -26.66507339477539, "global_step": 399539, "epoch": 4813} {"train_loss": -26.554548263549805, "global_step": 399540, "epoch": 4813} {"train_loss": -26.791961669921875, "global_step": 399541, "epoch": 4813} {"train_loss": -26.579809188842773, "global_step": 399542, "epoch": 4813} {"train_loss": -26.415613174438477, "global_step": 399543, "epoch": 4813} {"train_loss": -26.1468563079834, "global_step": 399544, "epoch": 4813} {"train_loss": -26.398977279663086, "global_step": 399545, "epoch": 4813} {"train_loss": -26.80286979675293, "global_step": 399546, "epoch": 4813} {"train_loss": -26.86494255065918, "global_step": 399547, "epoch": 4813} {"train_loss": -26.542612075805664, "global_step": 399548, "epoch": 4813} {"train_loss": -26.78731346130371, "global_step": 399549, "epoch": 4813} {"train_loss": -26.845788955688477, "global_step": 399550, "epoch": 4813} {"train_loss": -26.91236686706543, "global_step": 399551, "epoch": 4813} {"train_loss": -26.645986557006836, "global_step": 399552, "epoch": 4813} {"train_loss": -26.652099609375, "global_step": 399553, "epoch": 4813} {"train_loss": -26.996204376220703, "global_step": 399554, "epoch": 4813} {"train_loss": -26.614593505859375, "global_step": 399555, "epoch": 4813} {"train_loss": -26.901342391967773, "global_step": 399556, "epoch": 4813} {"train_loss": -26.419843673706055, "global_step": 399557, "epoch": 4813} {"train_loss": -26.907514572143555, "global_step": 399558, "epoch": 4813} {"train_loss": -26.655927658081055, "global_step": 399559, "epoch": 4813} {"train_loss": -26.799299240112305, "global_step": 399560, "epoch": 4813} {"train_loss": -26.57048248382936, "global_step": 399561, "epoch": 4813, "val_loss": 6748324.0} {"train_loss": -26.10595703125, "global_step": 399562, "epoch": 4814} {"train_loss": -26.300687789916992, "global_step": 399563, "epoch": 4814} {"train_loss": -26.691930770874023, "global_step": 399564, "epoch": 4814} {"train_loss": -26.4888858795166, "global_step": 399565, "epoch": 4814} {"train_loss": -26.005207061767578, "global_step": 399566, "epoch": 4814} {"train_loss": -26.274744033813477, "global_step": 399567, "epoch": 4814} {"train_loss": -25.999868392944336, "global_step": 399568, "epoch": 4814} {"train_loss": -25.926633834838867, "global_step": 399569, "epoch": 4814} {"train_loss": -25.990354537963867, "global_step": 399570, "epoch": 4814} {"train_loss": -26.3275203704834, "global_step": 399571, "epoch": 4814} {"train_loss": -26.655637741088867, "global_step": 399572, "epoch": 4814} {"train_loss": -26.344623565673828, "global_step": 399573, "epoch": 4814} {"train_loss": -26.062549591064453, "global_step": 399574, "epoch": 4814} {"train_loss": -25.82244300842285, "global_step": 399575, "epoch": 4814} {"train_loss": -26.38041114807129, "global_step": 399576, "epoch": 4814} {"train_loss": -26.3125, "global_step": 399577, "epoch": 4814} {"train_loss": -26.30958366394043, "global_step": 399578, "epoch": 4814} {"train_loss": -26.12761878967285, "global_step": 399579, "epoch": 4814} {"train_loss": -26.194751739501953, "global_step": 399580, "epoch": 4814} {"train_loss": -26.47120475769043, "global_step": 399581, "epoch": 4814} {"train_loss": -26.236780166625977, "global_step": 399582, "epoch": 4814} {"train_loss": -26.303564071655273, "global_step": 399583, "epoch": 4814} {"train_loss": -26.355443954467773, "global_step": 399584, "epoch": 4814} {"train_loss": -26.60455894470215, "global_step": 399585, "epoch": 4814} {"train_loss": -26.60699462890625, "global_step": 399586, "epoch": 4814} {"train_loss": -26.59228515625, "global_step": 399587, "epoch": 4814} {"train_loss": -26.632410049438477, "global_step": 399588, "epoch": 4814} {"train_loss": -26.2475528717041, "global_step": 399589, "epoch": 4814} {"train_loss": -26.696319580078125, "global_step": 399590, "epoch": 4814} {"train_loss": -26.343795776367188, "global_step": 399591, "epoch": 4814} {"train_loss": -26.337493896484375, "global_step": 399592, "epoch": 4814} {"train_loss": -26.50961685180664, "global_step": 399593, "epoch": 4814} {"train_loss": -26.429153442382812, "global_step": 399594, "epoch": 4814} {"train_loss": -26.848501205444336, "global_step": 399595, "epoch": 4814} {"train_loss": -26.777441024780273, "global_step": 399596, "epoch": 4814} {"train_loss": -26.631505966186523, "global_step": 399597, "epoch": 4814} {"train_loss": -26.491540908813477, "global_step": 399598, "epoch": 4814} {"train_loss": -27.399444580078125, "global_step": 399599, "epoch": 4814} {"train_loss": -26.70400047302246, "global_step": 399600, "epoch": 4814} {"train_loss": -26.528491973876953, "global_step": 399601, "epoch": 4814} {"train_loss": -26.04294776916504, "global_step": 399602, "epoch": 4814} {"train_loss": -25.734891891479492, "global_step": 399603, "epoch": 4814} {"train_loss": -26.124832153320312, "global_step": 399604, "epoch": 4814} {"train_loss": -26.417236328125, "global_step": 399605, "epoch": 4814} {"train_loss": -26.388416290283203, "global_step": 399606, "epoch": 4814} {"train_loss": -26.08791160583496, "global_step": 399607, "epoch": 4814} {"train_loss": -26.59259605407715, "global_step": 399608, "epoch": 4814} {"train_loss": -26.45263671875, "global_step": 399609, "epoch": 4814} {"train_loss": -26.853961944580078, "global_step": 399610, "epoch": 4814} {"train_loss": -26.53985595703125, "global_step": 399611, "epoch": 4814} {"train_loss": -26.3775691986084, "global_step": 399612, "epoch": 4814} {"train_loss": -26.626331329345703, "global_step": 399613, "epoch": 4814} {"train_loss": -26.7628173828125, "global_step": 399614, "epoch": 4814} {"train_loss": -26.750873565673828, "global_step": 399615, "epoch": 4814} {"train_loss": -26.474103927612305, "global_step": 399616, "epoch": 4814} {"train_loss": -26.551807403564453, "global_step": 399617, "epoch": 4814} {"train_loss": -26.360193252563477, "global_step": 399618, "epoch": 4814} {"train_loss": -26.45343017578125, "global_step": 399619, "epoch": 4814} {"train_loss": -26.468505859375, "global_step": 399620, "epoch": 4814} {"train_loss": -26.898151397705078, "global_step": 399621, "epoch": 4814} {"train_loss": -25.92703628540039, "global_step": 399622, "epoch": 4814} {"train_loss": -26.1859188079834, "global_step": 399623, "epoch": 4814} {"train_loss": -26.417966842651367, "global_step": 399624, "epoch": 4814} {"train_loss": -26.366621017456055, "global_step": 399625, "epoch": 4814} {"train_loss": -26.695478439331055, "global_step": 399626, "epoch": 4814} {"train_loss": -26.395071029663086, "global_step": 399627, "epoch": 4814} {"train_loss": -26.214324951171875, "global_step": 399628, "epoch": 4814} {"train_loss": -26.251880645751953, "global_step": 399629, "epoch": 4814} {"train_loss": -26.469009399414062, "global_step": 399630, "epoch": 4814} {"train_loss": -26.666595458984375, "global_step": 399631, "epoch": 4814} {"train_loss": -26.467077255249023, "global_step": 399632, "epoch": 4814} {"train_loss": -26.113691329956055, "global_step": 399633, "epoch": 4814} {"train_loss": -26.456436157226562, "global_step": 399634, "epoch": 4814} {"train_loss": -26.3865909576416, "global_step": 399635, "epoch": 4814} {"train_loss": -26.484485626220703, "global_step": 399636, "epoch": 4814} {"train_loss": -26.21023941040039, "global_step": 399637, "epoch": 4814} {"train_loss": -26.81497573852539, "global_step": 399638, "epoch": 4814} {"train_loss": -26.299304962158203, "global_step": 399639, "epoch": 4814} {"train_loss": -26.1114559173584, "global_step": 399640, "epoch": 4814} {"train_loss": -26.488967895507812, "global_step": 399641, "epoch": 4814} {"train_loss": -26.710397720336914, "global_step": 399642, "epoch": 4814} {"train_loss": -26.374181747436523, "global_step": 399643, "epoch": 4814} {"train_loss": -26.414466329367762, "global_step": 399644, "epoch": 4814, "val_loss": 6804421.0} {"train_loss": -26.466489791870117, "global_step": 399645, "epoch": 4815} {"train_loss": -26.46482276916504, "global_step": 399646, "epoch": 4815} {"train_loss": -26.19870376586914, "global_step": 399647, "epoch": 4815} {"train_loss": -26.130126953125, "global_step": 399648, "epoch": 4815} {"train_loss": -26.153696060180664, "global_step": 399649, "epoch": 4815} {"train_loss": -26.319360733032227, "global_step": 399650, "epoch": 4815} {"train_loss": -26.430089950561523, "global_step": 399651, "epoch": 4815} {"train_loss": -25.754796981811523, "global_step": 399652, "epoch": 4815} {"train_loss": -26.188568115234375, "global_step": 399653, "epoch": 4815} {"train_loss": -26.682525634765625, "global_step": 399654, "epoch": 4815} {"train_loss": -25.987829208374023, "global_step": 399655, "epoch": 4815} {"train_loss": -26.513166427612305, "global_step": 399656, "epoch": 4815} {"train_loss": -26.130712509155273, "global_step": 399657, "epoch": 4815} {"train_loss": -26.25789451599121, "global_step": 399658, "epoch": 4815} {"train_loss": -26.489980697631836, "global_step": 399659, "epoch": 4815} {"train_loss": -26.194807052612305, "global_step": 399660, "epoch": 4815} {"train_loss": -26.148645401000977, "global_step": 399661, "epoch": 4815} {"train_loss": -26.406152725219727, "global_step": 399662, "epoch": 4815} {"train_loss": -26.573287963867188, "global_step": 399663, "epoch": 4815} {"train_loss": -26.292144775390625, "global_step": 399664, "epoch": 4815} {"train_loss": -26.46870231628418, "global_step": 399665, "epoch": 4815} {"train_loss": -26.07887077331543, "global_step": 399666, "epoch": 4815} {"train_loss": -26.67363929748535, "global_step": 399667, "epoch": 4815} {"train_loss": -26.15897560119629, "global_step": 399668, "epoch": 4815} {"train_loss": -26.894086837768555, "global_step": 399669, "epoch": 4815} {"train_loss": -26.15689468383789, "global_step": 399670, "epoch": 4815} {"train_loss": -26.271778106689453, "global_step": 399671, "epoch": 4815} {"train_loss": -26.524627685546875, "global_step": 399672, "epoch": 4815} {"train_loss": -26.8262939453125, "global_step": 399673, "epoch": 4815} {"train_loss": -26.297712326049805, "global_step": 399674, "epoch": 4815} {"train_loss": -26.82856559753418, "global_step": 399675, "epoch": 4815} {"train_loss": -26.59478759765625, "global_step": 399676, "epoch": 4815} {"train_loss": -26.568195343017578, "global_step": 399677, "epoch": 4815} {"train_loss": -26.738025665283203, "global_step": 399678, "epoch": 4815} {"train_loss": -26.243804931640625, "global_step": 399679, "epoch": 4815} {"train_loss": -26.406814575195312, "global_step": 399680, "epoch": 4815} {"train_loss": -26.471036911010742, "global_step": 399681, "epoch": 4815} {"train_loss": -26.472522735595703, "global_step": 399682, "epoch": 4815} {"train_loss": -26.45795249938965, "global_step": 399683, "epoch": 4815} {"train_loss": -26.406681060791016, "global_step": 399684, "epoch": 4815} {"train_loss": -26.717565536499023, "global_step": 399685, "epoch": 4815} {"train_loss": -26.583087921142578, "global_step": 399686, "epoch": 4815} {"train_loss": -26.69245719909668, "global_step": 399687, "epoch": 4815} {"train_loss": -26.52557373046875, "global_step": 399688, "epoch": 4815} {"train_loss": -26.49740982055664, "global_step": 399689, "epoch": 4815} {"train_loss": -26.553197860717773, "global_step": 399690, "epoch": 4815} {"train_loss": -26.96903419494629, "global_step": 399691, "epoch": 4815} {"train_loss": -26.214635848999023, "global_step": 399692, "epoch": 4815} {"train_loss": -26.656518936157227, "global_step": 399693, "epoch": 4815} {"train_loss": -26.160200119018555, "global_step": 399694, "epoch": 4815} {"train_loss": -26.93360710144043, "global_step": 399695, "epoch": 4815} {"train_loss": -26.484817504882812, "global_step": 399696, "epoch": 4815} {"train_loss": -26.954395294189453, "global_step": 399697, "epoch": 4815} {"train_loss": -26.332197189331055, "global_step": 399698, "epoch": 4815} {"train_loss": -26.552387237548828, "global_step": 399699, "epoch": 4815} {"train_loss": -26.562347412109375, "global_step": 399700, "epoch": 4815} {"train_loss": -26.404937744140625, "global_step": 399701, "epoch": 4815} {"train_loss": -26.5513916015625, "global_step": 399702, "epoch": 4815} {"train_loss": -26.607152938842773, "global_step": 399703, "epoch": 4815} {"train_loss": -26.673919677734375, "global_step": 399704, "epoch": 4815} {"train_loss": -26.2691593170166, "global_step": 399705, "epoch": 4815} {"train_loss": -26.417118072509766, "global_step": 399706, "epoch": 4815} {"train_loss": -26.943662643432617, "global_step": 399707, "epoch": 4815} {"train_loss": -26.51372718811035, "global_step": 399708, "epoch": 4815} {"train_loss": -26.463184356689453, "global_step": 399709, "epoch": 4815} {"train_loss": -26.719375610351562, "global_step": 399710, "epoch": 4815} {"train_loss": -27.0990047454834, "global_step": 399711, "epoch": 4815} {"train_loss": -26.743627548217773, "global_step": 399712, "epoch": 4815} {"train_loss": -26.80988883972168, "global_step": 399713, "epoch": 4815} {"train_loss": -27.037458419799805, "global_step": 399714, "epoch": 4815} {"train_loss": -26.440954208374023, "global_step": 399715, "epoch": 4815} {"train_loss": -26.71854019165039, "global_step": 399716, "epoch": 4815} {"train_loss": -26.57993507385254, "global_step": 399717, "epoch": 4815} {"train_loss": -27.079370498657227, "global_step": 399718, "epoch": 4815} {"train_loss": -26.677526473999023, "global_step": 399719, "epoch": 4815} {"train_loss": -26.919782638549805, "global_step": 399720, "epoch": 4815} {"train_loss": -26.899810791015625, "global_step": 399721, "epoch": 4815} {"train_loss": -27.041234970092773, "global_step": 399722, "epoch": 4815} {"train_loss": -26.578948974609375, "global_step": 399723, "epoch": 4815} {"train_loss": -26.721586227416992, "global_step": 399724, "epoch": 4815} {"train_loss": -26.863971710205078, "global_step": 399725, "epoch": 4815} {"train_loss": -26.99952507019043, "global_step": 399726, "epoch": 4815} {"train_loss": -26.539759233773474, "global_step": 399727, "epoch": 4815, "val_loss": 6684043.5} {"train_loss": -26.689062118530273, "global_step": 399728, "epoch": 4816} {"train_loss": -26.41534996032715, "global_step": 399729, "epoch": 4816} {"train_loss": -26.126623153686523, "global_step": 399730, "epoch": 4816} {"train_loss": -26.798816680908203, "global_step": 399731, "epoch": 4816} {"train_loss": -26.680683135986328, "global_step": 399732, "epoch": 4816} {"train_loss": -26.254974365234375, "global_step": 399733, "epoch": 4816} {"train_loss": -26.767675399780273, "global_step": 399734, "epoch": 4816} {"train_loss": -26.470077514648438, "global_step": 399735, "epoch": 4816} {"train_loss": -25.957000732421875, "global_step": 399736, "epoch": 4816} {"train_loss": -26.026214599609375, "global_step": 399737, "epoch": 4816} {"train_loss": -26.48182487487793, "global_step": 399738, "epoch": 4816} {"train_loss": -26.482542037963867, "global_step": 399739, "epoch": 4816} {"train_loss": -26.689496994018555, "global_step": 399740, "epoch": 4816} {"train_loss": -26.044042587280273, "global_step": 399741, "epoch": 4816} {"train_loss": -26.69632911682129, "global_step": 399742, "epoch": 4816} {"train_loss": -26.04839515686035, "global_step": 399743, "epoch": 4816} {"train_loss": -26.30080223083496, "global_step": 399744, "epoch": 4816} {"train_loss": -26.41840171813965, "global_step": 399745, "epoch": 4816} {"train_loss": -26.923887252807617, "global_step": 399746, "epoch": 4816} {"train_loss": -26.397537231445312, "global_step": 399747, "epoch": 4816} {"train_loss": -26.358524322509766, "global_step": 399748, "epoch": 4816} {"train_loss": -26.757247924804688, "global_step": 399749, "epoch": 4816} {"train_loss": -26.614444732666016, "global_step": 399750, "epoch": 4816} {"train_loss": -26.703458786010742, "global_step": 399751, "epoch": 4816} {"train_loss": -26.513702392578125, "global_step": 399752, "epoch": 4816} {"train_loss": -26.631732940673828, "global_step": 399753, "epoch": 4816} {"train_loss": -26.65020179748535, "global_step": 399754, "epoch": 4816} {"train_loss": -26.56589698791504, "global_step": 399755, "epoch": 4816} {"train_loss": -26.74004554748535, "global_step": 399756, "epoch": 4816} {"train_loss": -26.6964111328125, "global_step": 399757, "epoch": 4816} {"train_loss": -26.777807235717773, "global_step": 399758, "epoch": 4816} {"train_loss": -26.9038028717041, "global_step": 399759, "epoch": 4816} {"train_loss": -26.76258659362793, "global_step": 399760, "epoch": 4816} {"train_loss": -26.608911514282227, "global_step": 399761, "epoch": 4816} {"train_loss": -26.638446807861328, "global_step": 399762, "epoch": 4816} {"train_loss": -26.81990623474121, "global_step": 399763, "epoch": 4816} {"train_loss": -26.584577560424805, "global_step": 399764, "epoch": 4816} {"train_loss": -26.82269287109375, "global_step": 399765, "epoch": 4816} {"train_loss": -26.557703018188477, "global_step": 399766, "epoch": 4816} {"train_loss": -27.00933265686035, "global_step": 399767, "epoch": 4816} {"train_loss": -26.796735763549805, "global_step": 399768, "epoch": 4816} {"train_loss": -26.535736083984375, "global_step": 399769, "epoch": 4816} {"train_loss": -26.62932777404785, "global_step": 399770, "epoch": 4816} {"train_loss": -27.035154342651367, "global_step": 399771, "epoch": 4816} {"train_loss": -27.033939361572266, "global_step": 399772, "epoch": 4816} {"train_loss": -26.80976676940918, "global_step": 399773, "epoch": 4816} {"train_loss": -26.55914878845215, "global_step": 399774, "epoch": 4816} {"train_loss": -26.653745651245117, "global_step": 399775, "epoch": 4816} {"train_loss": -26.635541915893555, "global_step": 399776, "epoch": 4816} {"train_loss": -26.5672664642334, "global_step": 399777, "epoch": 4816} {"train_loss": -26.12863540649414, "global_step": 399778, "epoch": 4816} {"train_loss": -26.889972686767578, "global_step": 399779, "epoch": 4816} {"train_loss": -26.199665069580078, "global_step": 399780, "epoch": 4816} {"train_loss": -26.91204261779785, "global_step": 399781, "epoch": 4816} {"train_loss": -26.881261825561523, "global_step": 399782, "epoch": 4816} {"train_loss": -26.736303329467773, "global_step": 399783, "epoch": 4816} {"train_loss": -27.003463745117188, "global_step": 399784, "epoch": 4816} {"train_loss": -26.7347469329834, "global_step": 399785, "epoch": 4816} {"train_loss": -26.605688095092773, "global_step": 399786, "epoch": 4816} {"train_loss": -26.006546020507812, "global_step": 399787, "epoch": 4816} {"train_loss": -26.127294540405273, "global_step": 399788, "epoch": 4816} {"train_loss": -26.378381729125977, "global_step": 399789, "epoch": 4816} {"train_loss": -26.4074764251709, "global_step": 399790, "epoch": 4816} {"train_loss": -26.06524658203125, "global_step": 399791, "epoch": 4816} {"train_loss": -26.19977378845215, "global_step": 399792, "epoch": 4816} {"train_loss": -26.400808334350586, "global_step": 399793, "epoch": 4816} {"train_loss": -26.190481185913086, "global_step": 399794, "epoch": 4816} {"train_loss": -26.51094627380371, "global_step": 399795, "epoch": 4816} {"train_loss": -26.667387008666992, "global_step": 399796, "epoch": 4816} {"train_loss": -26.6544189453125, "global_step": 399797, "epoch": 4816} {"train_loss": -26.489805221557617, "global_step": 399798, "epoch": 4816} {"train_loss": -26.505590438842773, "global_step": 399799, "epoch": 4816} {"train_loss": -26.87131118774414, "global_step": 399800, "epoch": 4816} {"train_loss": -26.63117790222168, "global_step": 399801, "epoch": 4816} {"train_loss": -27.002180099487305, "global_step": 399802, "epoch": 4816} {"train_loss": -26.84455680847168, "global_step": 399803, "epoch": 4816} {"train_loss": -26.468534469604492, "global_step": 399804, "epoch": 4816} {"train_loss": -26.969989776611328, "global_step": 399805, "epoch": 4816} {"train_loss": -26.56402015686035, "global_step": 399806, "epoch": 4816} {"train_loss": -26.77003288269043, "global_step": 399807, "epoch": 4816} {"train_loss": -26.761335372924805, "global_step": 399808, "epoch": 4816} {"train_loss": -26.677865982055664, "global_step": 399809, "epoch": 4816} {"train_loss": -26.59517954631024, "global_step": 399810, "epoch": 4816, "val_loss": 6703626.5} {"train_loss": -26.375640869140625, "global_step": 399811, "epoch": 4817} {"train_loss": -26.7966365814209, "global_step": 399812, "epoch": 4817} {"train_loss": -25.94040298461914, "global_step": 399813, "epoch": 4817} {"train_loss": -26.2027530670166, "global_step": 399814, "epoch": 4817} {"train_loss": -26.3197021484375, "global_step": 399815, "epoch": 4817} {"train_loss": -26.434595108032227, "global_step": 399816, "epoch": 4817} {"train_loss": -26.399206161499023, "global_step": 399817, "epoch": 4817} {"train_loss": -26.28403663635254, "global_step": 399818, "epoch": 4817} {"train_loss": -26.5401611328125, "global_step": 399819, "epoch": 4817} {"train_loss": -26.173803329467773, "global_step": 399820, "epoch": 4817} {"train_loss": -26.184301376342773, "global_step": 399821, "epoch": 4817} {"train_loss": -26.49488639831543, "global_step": 399822, "epoch": 4817} {"train_loss": -26.0751895904541, "global_step": 399823, "epoch": 4817} {"train_loss": -26.690433502197266, "global_step": 399824, "epoch": 4817} {"train_loss": -26.427417755126953, "global_step": 399825, "epoch": 4817} {"train_loss": -26.614797592163086, "global_step": 399826, "epoch": 4817} {"train_loss": -26.082447052001953, "global_step": 399827, "epoch": 4817} {"train_loss": -26.32208824157715, "global_step": 399828, "epoch": 4817} {"train_loss": -26.188159942626953, "global_step": 399829, "epoch": 4817} {"train_loss": -27.043201446533203, "global_step": 399830, "epoch": 4817} {"train_loss": -26.475830078125, "global_step": 399831, "epoch": 4817} {"train_loss": -26.6883487701416, "global_step": 399832, "epoch": 4817} {"train_loss": -26.711017608642578, "global_step": 399833, "epoch": 4817} {"train_loss": -26.474700927734375, "global_step": 399834, "epoch": 4817} {"train_loss": -26.596073150634766, "global_step": 399835, "epoch": 4817} {"train_loss": -26.583654403686523, "global_step": 399836, "epoch": 4817} {"train_loss": -26.369504928588867, "global_step": 399837, "epoch": 4817} {"train_loss": -26.560754776000977, "global_step": 399838, "epoch": 4817} {"train_loss": -26.6137638092041, "global_step": 399839, "epoch": 4817} {"train_loss": -26.611902236938477, "global_step": 399840, "epoch": 4817} {"train_loss": -26.35245132446289, "global_step": 399841, "epoch": 4817} {"train_loss": -26.465662002563477, "global_step": 399842, "epoch": 4817} {"train_loss": -26.3966064453125, "global_step": 399843, "epoch": 4817} {"train_loss": -26.475677490234375, "global_step": 399844, "epoch": 4817} {"train_loss": -26.711820602416992, "global_step": 399845, "epoch": 4817} {"train_loss": -26.416366577148438, "global_step": 399846, "epoch": 4817} {"train_loss": -26.689123153686523, "global_step": 399847, "epoch": 4817} {"train_loss": -26.75900650024414, "global_step": 399848, "epoch": 4817} {"train_loss": -26.721654891967773, "global_step": 399849, "epoch": 4817} {"train_loss": -26.9066162109375, "global_step": 399850, "epoch": 4817} {"train_loss": -26.827823638916016, "global_step": 399851, "epoch": 4817} {"train_loss": -26.39404296875, "global_step": 399852, "epoch": 4817} {"train_loss": -26.044605255126953, "global_step": 399853, "epoch": 4817} {"train_loss": -26.991342544555664, "global_step": 399854, "epoch": 4817} {"train_loss": -26.709110260009766, "global_step": 399855, "epoch": 4817} {"train_loss": -26.604190826416016, "global_step": 399856, "epoch": 4817} {"train_loss": -26.66530418395996, "global_step": 399857, "epoch": 4817} {"train_loss": -26.65398597717285, "global_step": 399858, "epoch": 4817} {"train_loss": -26.622879028320312, "global_step": 399859, "epoch": 4817} {"train_loss": -26.3913631439209, "global_step": 399860, "epoch": 4817} {"train_loss": -26.246906280517578, "global_step": 399861, "epoch": 4817} {"train_loss": -26.686368942260742, "global_step": 399862, "epoch": 4817} {"train_loss": -26.61260986328125, "global_step": 399863, "epoch": 4817} {"train_loss": -26.510480880737305, "global_step": 399864, "epoch": 4817} {"train_loss": -26.59699821472168, "global_step": 399865, "epoch": 4817} {"train_loss": -26.33642578125, "global_step": 399866, "epoch": 4817} {"train_loss": -26.92853355407715, "global_step": 399867, "epoch": 4817} {"train_loss": -26.177337646484375, "global_step": 399868, "epoch": 4817} {"train_loss": -26.238433837890625, "global_step": 399869, "epoch": 4817} {"train_loss": -26.393945693969727, "global_step": 399870, "epoch": 4817} {"train_loss": -26.395679473876953, "global_step": 399871, "epoch": 4817} {"train_loss": -26.67447280883789, "global_step": 399872, "epoch": 4817} {"train_loss": -26.677490234375, "global_step": 399873, "epoch": 4817} {"train_loss": -26.6820011138916, "global_step": 399874, "epoch": 4817} {"train_loss": -26.840423583984375, "global_step": 399875, "epoch": 4817} {"train_loss": -26.544431686401367, "global_step": 399876, "epoch": 4817} {"train_loss": -26.733671188354492, "global_step": 399877, "epoch": 4817} {"train_loss": -26.84309196472168, "global_step": 399878, "epoch": 4817} {"train_loss": -26.62391471862793, "global_step": 399879, "epoch": 4817} {"train_loss": -26.7000675201416, "global_step": 399880, "epoch": 4817} {"train_loss": -26.6552791595459, "global_step": 399881, "epoch": 4817} {"train_loss": -26.742481231689453, "global_step": 399882, "epoch": 4817} {"train_loss": -26.636457443237305, "global_step": 399883, "epoch": 4817} {"train_loss": -26.932580947875977, "global_step": 399884, "epoch": 4817} {"train_loss": -26.78889274597168, "global_step": 399885, "epoch": 4817} {"train_loss": -26.686920166015625, "global_step": 399886, "epoch": 4817} {"train_loss": -26.815366744995117, "global_step": 399887, "epoch": 4817} {"train_loss": -26.589441299438477, "global_step": 399888, "epoch": 4817} {"train_loss": -27.101022720336914, "global_step": 399889, "epoch": 4817} {"train_loss": -26.49993324279785, "global_step": 399890, "epoch": 4817} {"train_loss": -26.967451095581055, "global_step": 399891, "epoch": 4817} {"train_loss": -26.66506004333496, "global_step": 399892, "epoch": 4817} {"train_loss": -26.56589115096862, "global_step": 399893, "epoch": 4817, "val_loss": 6620963.0} {"train_loss": -26.242963790893555, "global_step": 399894, "epoch": 4818} {"train_loss": -25.931257247924805, "global_step": 399895, "epoch": 4818} {"train_loss": -26.117889404296875, "global_step": 399896, "epoch": 4818} {"train_loss": -26.67119789123535, "global_step": 399897, "epoch": 4818} {"train_loss": -26.577640533447266, "global_step": 399898, "epoch": 4818} {"train_loss": -26.32404899597168, "global_step": 399899, "epoch": 4818} {"train_loss": -26.461027145385742, "global_step": 399900, "epoch": 4818} {"train_loss": -26.822772979736328, "global_step": 399901, "epoch": 4818} {"train_loss": -26.457239151000977, "global_step": 399902, "epoch": 4818} {"train_loss": -26.176664352416992, "global_step": 399903, "epoch": 4818} {"train_loss": -26.331762313842773, "global_step": 399904, "epoch": 4818} {"train_loss": -26.491413116455078, "global_step": 399905, "epoch": 4818} {"train_loss": -26.31355094909668, "global_step": 399906, "epoch": 4818} {"train_loss": -26.616790771484375, "global_step": 399907, "epoch": 4818} {"train_loss": -26.5406551361084, "global_step": 399908, "epoch": 4818} {"train_loss": -26.491186141967773, "global_step": 399909, "epoch": 4818} {"train_loss": -26.30609130859375, "global_step": 399910, "epoch": 4818} {"train_loss": -26.683231353759766, "global_step": 399911, "epoch": 4818} {"train_loss": -26.491125106811523, "global_step": 399912, "epoch": 4818} {"train_loss": -26.604223251342773, "global_step": 399913, "epoch": 4818} {"train_loss": -26.471837997436523, "global_step": 399914, "epoch": 4818} {"train_loss": -27.065460205078125, "global_step": 399915, "epoch": 4818} {"train_loss": -26.51235008239746, "global_step": 399916, "epoch": 4818} {"train_loss": -26.676944732666016, "global_step": 399917, "epoch": 4818} {"train_loss": -27.106245040893555, "global_step": 399918, "epoch": 4818} {"train_loss": -26.551801681518555, "global_step": 399919, "epoch": 4818} {"train_loss": -26.78333854675293, "global_step": 399920, "epoch": 4818} {"train_loss": -26.691679000854492, "global_step": 399921, "epoch": 4818} {"train_loss": -26.886823654174805, "global_step": 399922, "epoch": 4818} {"train_loss": -26.619985580444336, "global_step": 399923, "epoch": 4818} {"train_loss": -27.129858016967773, "global_step": 399924, "epoch": 4818} {"train_loss": -26.910093307495117, "global_step": 399925, "epoch": 4818} {"train_loss": -26.678525924682617, "global_step": 399926, "epoch": 4818} {"train_loss": -26.65418815612793, "global_step": 399927, "epoch": 4818} {"train_loss": -26.555044174194336, "global_step": 399928, "epoch": 4818} {"train_loss": -26.47605323791504, "global_step": 399929, "epoch": 4818} {"train_loss": -26.5191707611084, "global_step": 399930, "epoch": 4818} {"train_loss": -26.843069076538086, "global_step": 399931, "epoch": 4818} {"train_loss": -26.62367057800293, "global_step": 399932, "epoch": 4818} {"train_loss": -26.906946182250977, "global_step": 399933, "epoch": 4818} {"train_loss": -26.548877716064453, "global_step": 399934, "epoch": 4818} {"train_loss": -26.3961124420166, "global_step": 399935, "epoch": 4818} {"train_loss": -26.64316749572754, "global_step": 399936, "epoch": 4818} {"train_loss": -26.55375099182129, "global_step": 399937, "epoch": 4818} {"train_loss": -26.4078426361084, "global_step": 399938, "epoch": 4818} {"train_loss": -26.506000518798828, "global_step": 399939, "epoch": 4818} {"train_loss": -26.600156784057617, "global_step": 399940, "epoch": 4818} {"train_loss": -26.98661231994629, "global_step": 399941, "epoch": 4818} {"train_loss": -26.55791664123535, "global_step": 399942, "epoch": 4818} {"train_loss": -26.82769775390625, "global_step": 399943, "epoch": 4818} {"train_loss": -26.51032066345215, "global_step": 399944, "epoch": 4818} {"train_loss": -26.751667022705078, "global_step": 399945, "epoch": 4818} {"train_loss": -26.995046615600586, "global_step": 399946, "epoch": 4818} {"train_loss": -26.865436553955078, "global_step": 399947, "epoch": 4818} {"train_loss": -26.971036911010742, "global_step": 399948, "epoch": 4818} {"train_loss": -26.588043212890625, "global_step": 399949, "epoch": 4818} {"train_loss": -26.530292510986328, "global_step": 399950, "epoch": 4818} {"train_loss": -26.73198890686035, "global_step": 399951, "epoch": 4818} {"train_loss": -26.704620361328125, "global_step": 399952, "epoch": 4818} {"train_loss": -26.75684928894043, "global_step": 399953, "epoch": 4818} {"train_loss": -26.861373901367188, "global_step": 399954, "epoch": 4818} {"train_loss": -26.96213722229004, "global_step": 399955, "epoch": 4818} {"train_loss": -26.777475357055664, "global_step": 399956, "epoch": 4818} {"train_loss": -26.784021377563477, "global_step": 399957, "epoch": 4818} {"train_loss": -26.887537002563477, "global_step": 399958, "epoch": 4818} {"train_loss": -26.63907241821289, "global_step": 399959, "epoch": 4818} {"train_loss": -26.617109298706055, "global_step": 399960, "epoch": 4818} {"train_loss": -26.81589126586914, "global_step": 399961, "epoch": 4818} {"train_loss": -26.767560958862305, "global_step": 399962, "epoch": 4818} {"train_loss": -26.683425903320312, "global_step": 399963, "epoch": 4818} {"train_loss": -26.66316795349121, "global_step": 399964, "epoch": 4818} {"train_loss": -26.916025161743164, "global_step": 399965, "epoch": 4818} {"train_loss": -26.82110595703125, "global_step": 399966, "epoch": 4818} {"train_loss": -26.28936195373535, "global_step": 399967, "epoch": 4818} {"train_loss": -26.731775283813477, "global_step": 399968, "epoch": 4818} {"train_loss": -26.804004669189453, "global_step": 399969, "epoch": 4818} {"train_loss": -27.03607177734375, "global_step": 399970, "epoch": 4818} {"train_loss": -26.721105575561523, "global_step": 399971, "epoch": 4818} {"train_loss": -26.850204467773438, "global_step": 399972, "epoch": 4818} {"train_loss": -26.645994186401367, "global_step": 399973, "epoch": 4818} {"train_loss": -26.152860641479492, "global_step": 399974, "epoch": 4818} {"train_loss": -25.790616989135742, "global_step": 399975, "epoch": 4818} {"train_loss": -26.619541811655804, "global_step": 399976, "epoch": 4818, "val_loss": 6759696.0} {"train_loss": -24.904708862304688, "global_step": 399977, "epoch": 4819} {"train_loss": -23.91005516052246, "global_step": 399978, "epoch": 4819} {"train_loss": -23.717702865600586, "global_step": 399979, "epoch": 4819} {"train_loss": -25.11409568786621, "global_step": 399980, "epoch": 4819} {"train_loss": -25.132429122924805, "global_step": 399981, "epoch": 4819} {"train_loss": -25.198471069335938, "global_step": 399982, "epoch": 4819} {"train_loss": -24.54119873046875, "global_step": 399983, "epoch": 4819} {"train_loss": -24.858346939086914, "global_step": 399984, "epoch": 4819} {"train_loss": -25.582181930541992, "global_step": 399985, "epoch": 4819} {"train_loss": -25.844099044799805, "global_step": 399986, "epoch": 4819} {"train_loss": -25.711755752563477, "global_step": 399987, "epoch": 4819} {"train_loss": -25.326812744140625, "global_step": 399988, "epoch": 4819} {"train_loss": -25.50031852722168, "global_step": 399989, "epoch": 4819} {"train_loss": -25.888288497924805, "global_step": 399990, "epoch": 4819} {"train_loss": -25.80059814453125, "global_step": 399991, "epoch": 4819} {"train_loss": -25.729629516601562, "global_step": 399992, "epoch": 4819} {"train_loss": -25.595075607299805, "global_step": 399993, "epoch": 4819} {"train_loss": -25.760892868041992, "global_step": 399994, "epoch": 4819} {"train_loss": -25.925138473510742, "global_step": 399995, "epoch": 4819} {"train_loss": -25.925662994384766, "global_step": 399996, "epoch": 4819} {"train_loss": -25.69839859008789, "global_step": 399997, "epoch": 4819} {"train_loss": -25.814035415649414, "global_step": 399998, "epoch": 4819} {"train_loss": -26.404987335205078, "global_step": 399999, "epoch": 4819} {"train_loss": -26.211156845092773, "global_step": 400000, "epoch": 4819} {"train_loss": -26.300769805908203, "global_step": 400001, "epoch": 4819} {"train_loss": -26.425235748291016, "global_step": 400002, "epoch": 4819} {"train_loss": -26.301443099975586, "global_step": 400003, "epoch": 4819} {"train_loss": -26.229589462280273, "global_step": 400004, "epoch": 4819} {"train_loss": -26.755807876586914, "global_step": 400005, "epoch": 4819} {"train_loss": -25.901086807250977, "global_step": 400006, "epoch": 4819} {"train_loss": -26.259374618530273, "global_step": 400007, "epoch": 4819} {"train_loss": -26.319534301757812, "global_step": 400008, "epoch": 4819} {"train_loss": -26.508459091186523, "global_step": 400009, "epoch": 4819} {"train_loss": -26.53914451599121, "global_step": 400010, "epoch": 4819} {"train_loss": -26.34266471862793, "global_step": 400011, "epoch": 4819} {"train_loss": -26.472732543945312, "global_step": 400012, "epoch": 4819} {"train_loss": -26.484729766845703, "global_step": 400013, "epoch": 4819} {"train_loss": -26.30267906188965, "global_step": 400014, "epoch": 4819} {"train_loss": -26.693342208862305, "global_step": 400015, "epoch": 4819} {"train_loss": -26.545307159423828, "global_step": 400016, "epoch": 4819} {"train_loss": -26.596235275268555, "global_step": 400017, "epoch": 4819} {"train_loss": -26.75153160095215, "global_step": 400018, "epoch": 4819} {"train_loss": -26.471933364868164, "global_step": 400019, "epoch": 4819} {"train_loss": -26.738067626953125, "global_step": 400020, "epoch": 4819} {"train_loss": -26.82096290588379, "global_step": 400021, "epoch": 4819} {"train_loss": -26.295812606811523, "global_step": 400022, "epoch": 4819} {"train_loss": -26.285358428955078, "global_step": 400023, "epoch": 4819} {"train_loss": -26.711200714111328, "global_step": 400024, "epoch": 4819} {"train_loss": -26.674070358276367, "global_step": 400025, "epoch": 4819} {"train_loss": -26.778425216674805, "global_step": 400026, "epoch": 4819} {"train_loss": -26.803531646728516, "global_step": 400027, "epoch": 4819} {"train_loss": -26.79241371154785, "global_step": 400028, "epoch": 4819} {"train_loss": -26.73700523376465, "global_step": 400029, "epoch": 4819} {"train_loss": -26.741806030273438, "global_step": 400030, "epoch": 4819} {"train_loss": -26.620849609375, "global_step": 400031, "epoch": 4819} {"train_loss": -26.731693267822266, "global_step": 400032, "epoch": 4819} {"train_loss": -26.71308708190918, "global_step": 400033, "epoch": 4819} {"train_loss": -26.7937068939209, "global_step": 400034, "epoch": 4819} {"train_loss": -27.087228775024414, "global_step": 400035, "epoch": 4819} {"train_loss": -26.961889266967773, "global_step": 400036, "epoch": 4819} {"train_loss": -27.01018714904785, "global_step": 400037, "epoch": 4819} {"train_loss": -26.5809383392334, "global_step": 400038, "epoch": 4819} {"train_loss": -26.82500648498535, "global_step": 400039, "epoch": 4819} {"train_loss": -26.70173454284668, "global_step": 400040, "epoch": 4819} {"train_loss": -26.751026153564453, "global_step": 400041, "epoch": 4819} {"train_loss": -26.799530029296875, "global_step": 400042, "epoch": 4819} {"train_loss": -26.897552490234375, "global_step": 400043, "epoch": 4819} {"train_loss": -26.970752716064453, "global_step": 400044, "epoch": 4819} {"train_loss": -26.63067054748535, "global_step": 400045, "epoch": 4819} {"train_loss": -26.9132080078125, "global_step": 400046, "epoch": 4819} {"train_loss": -26.617090225219727, "global_step": 400047, "epoch": 4819} {"train_loss": -26.7127628326416, "global_step": 400048, "epoch": 4819} {"train_loss": -26.3945255279541, "global_step": 400049, "epoch": 4819} {"train_loss": -26.375354766845703, "global_step": 400050, "epoch": 4819} {"train_loss": -26.448087692260742, "global_step": 400051, "epoch": 4819} {"train_loss": -26.395437240600586, "global_step": 400052, "epoch": 4819} {"train_loss": -25.92584800720215, "global_step": 400053, "epoch": 4819} {"train_loss": -26.363981246948242, "global_step": 400054, "epoch": 4819} {"train_loss": -26.004667282104492, "global_step": 400055, "epoch": 4819} {"train_loss": -26.531835556030273, "global_step": 400056, "epoch": 4819} {"train_loss": -25.732929229736328, "global_step": 400057, "epoch": 4819} {"train_loss": -24.751140594482422, "global_step": 400058, "epoch": 4819} {"train_loss": -26.199427340404096, "global_step": 400059, "epoch": 4819, "val_loss": 6758620.0} {"train_loss": -23.480030059814453, "global_step": 400060, "epoch": 4820} {"train_loss": -21.106449127197266, "global_step": 400061, "epoch": 4820} {"train_loss": -23.752286911010742, "global_step": 400062, "epoch": 4820} {"train_loss": -24.161867141723633, "global_step": 400063, "epoch": 4820} {"train_loss": -24.365005493164062, "global_step": 400064, "epoch": 4820} {"train_loss": -23.640827178955078, "global_step": 400065, "epoch": 4820} {"train_loss": -24.49299430847168, "global_step": 400066, "epoch": 4820} {"train_loss": -24.714908599853516, "global_step": 400067, "epoch": 4820} {"train_loss": -25.245349884033203, "global_step": 400068, "epoch": 4820} {"train_loss": -24.333158493041992, "global_step": 400069, "epoch": 4820} {"train_loss": -24.78660774230957, "global_step": 400070, "epoch": 4820} {"train_loss": -24.87331199645996, "global_step": 400071, "epoch": 4820} {"train_loss": -25.48908042907715, "global_step": 400072, "epoch": 4820} {"train_loss": -25.183034896850586, "global_step": 400073, "epoch": 4820} {"train_loss": -24.94660758972168, "global_step": 400074, "epoch": 4820} {"train_loss": -25.10167121887207, "global_step": 400075, "epoch": 4820} {"train_loss": -25.241418838500977, "global_step": 400076, "epoch": 4820} {"train_loss": -25.128129959106445, "global_step": 400077, "epoch": 4820} {"train_loss": -25.185504913330078, "global_step": 400078, "epoch": 4820} {"train_loss": -25.060937881469727, "global_step": 400079, "epoch": 4820} {"train_loss": -25.325687408447266, "global_step": 400080, "epoch": 4820} {"train_loss": -25.483396530151367, "global_step": 400081, "epoch": 4820} {"train_loss": -25.44282341003418, "global_step": 400082, "epoch": 4820} {"train_loss": -25.470273971557617, "global_step": 400083, "epoch": 4820} {"train_loss": -25.635122299194336, "global_step": 400084, "epoch": 4820} {"train_loss": -25.63079833984375, "global_step": 400085, "epoch": 4820} {"train_loss": -25.975351333618164, "global_step": 400086, "epoch": 4820} {"train_loss": -25.655231475830078, "global_step": 400087, "epoch": 4820} {"train_loss": -25.503393173217773, "global_step": 400088, "epoch": 4820} {"train_loss": -25.7796630859375, "global_step": 400089, "epoch": 4820} {"train_loss": -25.8279972076416, "global_step": 400090, "epoch": 4820} {"train_loss": -26.14373779296875, "global_step": 400091, "epoch": 4820} {"train_loss": -26.093862533569336, "global_step": 400092, "epoch": 4820} {"train_loss": -25.811017990112305, "global_step": 400093, "epoch": 4820} {"train_loss": -26.0789737701416, "global_step": 400094, "epoch": 4820} {"train_loss": -26.37922477722168, "global_step": 400095, "epoch": 4820} {"train_loss": -26.282094955444336, "global_step": 400096, "epoch": 4820} {"train_loss": -26.284276962280273, "global_step": 400097, "epoch": 4820} {"train_loss": -25.787281036376953, "global_step": 400098, "epoch": 4820} {"train_loss": -26.31679344177246, "global_step": 400099, "epoch": 4820} {"train_loss": -25.76296043395996, "global_step": 400100, "epoch": 4820} {"train_loss": -26.363697052001953, "global_step": 400101, "epoch": 4820} {"train_loss": -26.367956161499023, "global_step": 400102, "epoch": 4820} {"train_loss": -25.988386154174805, "global_step": 400103, "epoch": 4820} {"train_loss": -26.18512535095215, "global_step": 400104, "epoch": 4820} {"train_loss": -26.202428817749023, "global_step": 400105, "epoch": 4820} {"train_loss": -26.897369384765625, "global_step": 400106, "epoch": 4820} {"train_loss": -26.354785919189453, "global_step": 400107, "epoch": 4820} {"train_loss": -26.277334213256836, "global_step": 400108, "epoch": 4820} {"train_loss": -26.517210006713867, "global_step": 400109, "epoch": 4820} {"train_loss": -26.553115844726562, "global_step": 400110, "epoch": 4820} {"train_loss": -26.264780044555664, "global_step": 400111, "epoch": 4820} {"train_loss": -26.535612106323242, "global_step": 400112, "epoch": 4820} {"train_loss": -26.708662033081055, "global_step": 400113, "epoch": 4820} {"train_loss": -27.00733757019043, "global_step": 400114, "epoch": 4820} {"train_loss": -26.157190322875977, "global_step": 400115, "epoch": 4820} {"train_loss": -25.928205490112305, "global_step": 400116, "epoch": 4820} {"train_loss": -26.05837059020996, "global_step": 400117, "epoch": 4820} {"train_loss": -26.150983810424805, "global_step": 400118, "epoch": 4820} {"train_loss": -26.620025634765625, "global_step": 400119, "epoch": 4820} {"train_loss": -26.626678466796875, "global_step": 400120, "epoch": 4820} {"train_loss": -26.31723976135254, "global_step": 400121, "epoch": 4820} {"train_loss": -26.180402755737305, "global_step": 400122, "epoch": 4820} {"train_loss": -26.515913009643555, "global_step": 400123, "epoch": 4820} {"train_loss": -26.914352416992188, "global_step": 400124, "epoch": 4820} {"train_loss": -26.739368438720703, "global_step": 400125, "epoch": 4820} {"train_loss": -26.354612350463867, "global_step": 400126, "epoch": 4820} {"train_loss": -26.441320419311523, "global_step": 400127, "epoch": 4820} {"train_loss": -26.251434326171875, "global_step": 400128, "epoch": 4820} {"train_loss": -26.84453773498535, "global_step": 400129, "epoch": 4820} {"train_loss": -26.345905303955078, "global_step": 400130, "epoch": 4820} {"train_loss": -26.119171142578125, "global_step": 400131, "epoch": 4820} {"train_loss": -26.527286529541016, "global_step": 400132, "epoch": 4820} {"train_loss": -26.39088249206543, "global_step": 400133, "epoch": 4820} {"train_loss": -26.605148315429688, "global_step": 400134, "epoch": 4820} {"train_loss": -26.428207397460938, "global_step": 400135, "epoch": 4820} {"train_loss": -26.42243766784668, "global_step": 400136, "epoch": 4820} {"train_loss": -26.57303810119629, "global_step": 400137, "epoch": 4820} {"train_loss": -26.602163314819336, "global_step": 400138, "epoch": 4820} {"train_loss": -26.553293228149414, "global_step": 400139, "epoch": 4820} {"train_loss": -26.814069747924805, "global_step": 400140, "epoch": 4820} {"train_loss": -26.855960845947266, "global_step": 400141, "epoch": 4820} {"train_loss": -25.839009687124964, "global_step": 400142, "epoch": 4820, "val_loss": 6566575.0} {"train_loss": -25.971776962280273, "global_step": 400143, "epoch": 4821} {"train_loss": -26.222692489624023, "global_step": 400144, "epoch": 4821} {"train_loss": -26.044803619384766, "global_step": 400145, "epoch": 4821} {"train_loss": -26.025537490844727, "global_step": 400146, "epoch": 4821} {"train_loss": -26.204986572265625, "global_step": 400147, "epoch": 4821} {"train_loss": -26.2634220123291, "global_step": 400148, "epoch": 4821} {"train_loss": -26.320144653320312, "global_step": 400149, "epoch": 4821} {"train_loss": -26.40277671813965, "global_step": 400150, "epoch": 4821} {"train_loss": -26.2718563079834, "global_step": 400151, "epoch": 4821} {"train_loss": -26.563831329345703, "global_step": 400152, "epoch": 4821} {"train_loss": -26.42127799987793, "global_step": 400153, "epoch": 4821} {"train_loss": -26.230594635009766, "global_step": 400154, "epoch": 4821} {"train_loss": -26.686742782592773, "global_step": 400155, "epoch": 4821} {"train_loss": -26.246810913085938, "global_step": 400156, "epoch": 4821} {"train_loss": -26.365177154541016, "global_step": 400157, "epoch": 4821} {"train_loss": -26.534988403320312, "global_step": 400158, "epoch": 4821} {"train_loss": -26.548627853393555, "global_step": 400159, "epoch": 4821} {"train_loss": -26.544357299804688, "global_step": 400160, "epoch": 4821} {"train_loss": -26.832258224487305, "global_step": 400161, "epoch": 4821} {"train_loss": -26.297388076782227, "global_step": 400162, "epoch": 4821} {"train_loss": -26.755712509155273, "global_step": 400163, "epoch": 4821} {"train_loss": -26.468046188354492, "global_step": 400164, "epoch": 4821} {"train_loss": -26.380151748657227, "global_step": 400165, "epoch": 4821} {"train_loss": -26.558944702148438, "global_step": 400166, "epoch": 4821} {"train_loss": -26.3786678314209, "global_step": 400167, "epoch": 4821} {"train_loss": -26.398746490478516, "global_step": 400168, "epoch": 4821} {"train_loss": -26.665754318237305, "global_step": 400169, "epoch": 4821} {"train_loss": -26.615278244018555, "global_step": 400170, "epoch": 4821} {"train_loss": -26.32130241394043, "global_step": 400171, "epoch": 4821} {"train_loss": -26.6716365814209, "global_step": 400172, "epoch": 4821} {"train_loss": -26.80878257751465, "global_step": 400173, "epoch": 4821} {"train_loss": -26.4560489654541, "global_step": 400174, "epoch": 4821} {"train_loss": -26.79326820373535, "global_step": 400175, "epoch": 4821} {"train_loss": -27.00977897644043, "global_step": 400176, "epoch": 4821} {"train_loss": -26.872989654541016, "global_step": 400177, "epoch": 4821} {"train_loss": -26.500577926635742, "global_step": 400178, "epoch": 4821} {"train_loss": -26.7490234375, "global_step": 400179, "epoch": 4821} {"train_loss": -26.918424606323242, "global_step": 400180, "epoch": 4821} {"train_loss": -26.846044540405273, "global_step": 400181, "epoch": 4821} {"train_loss": -26.650842666625977, "global_step": 400182, "epoch": 4821} {"train_loss": -25.980390548706055, "global_step": 400183, "epoch": 4821} {"train_loss": -26.78375244140625, "global_step": 400184, "epoch": 4821} {"train_loss": -26.5677547454834, "global_step": 400185, "epoch": 4821} {"train_loss": -26.500003814697266, "global_step": 400186, "epoch": 4821} {"train_loss": -26.71929359436035, "global_step": 400187, "epoch": 4821} {"train_loss": -26.5377254486084, "global_step": 400188, "epoch": 4821} {"train_loss": -26.834646224975586, "global_step": 400189, "epoch": 4821} {"train_loss": -26.632349014282227, "global_step": 400190, "epoch": 4821} {"train_loss": -26.53093910217285, "global_step": 400191, "epoch": 4821} {"train_loss": -26.73203468322754, "global_step": 400192, "epoch": 4821} {"train_loss": -26.878782272338867, "global_step": 400193, "epoch": 4821} {"train_loss": -26.750232696533203, "global_step": 400194, "epoch": 4821} {"train_loss": -26.695280075073242, "global_step": 400195, "epoch": 4821} {"train_loss": -26.6643123626709, "global_step": 400196, "epoch": 4821} {"train_loss": -26.953723907470703, "global_step": 400197, "epoch": 4821} {"train_loss": -26.623754501342773, "global_step": 400198, "epoch": 4821} {"train_loss": -26.772062301635742, "global_step": 400199, "epoch": 4821} {"train_loss": -26.42732048034668, "global_step": 400200, "epoch": 4821} {"train_loss": -27.107385635375977, "global_step": 400201, "epoch": 4821} {"train_loss": -26.392431259155273, "global_step": 400202, "epoch": 4821} {"train_loss": -26.739919662475586, "global_step": 400203, "epoch": 4821} {"train_loss": -26.773406982421875, "global_step": 400204, "epoch": 4821} {"train_loss": -26.744857788085938, "global_step": 400205, "epoch": 4821} {"train_loss": -26.700525283813477, "global_step": 400206, "epoch": 4821} {"train_loss": -27.23273277282715, "global_step": 400207, "epoch": 4821} {"train_loss": -26.741622924804688, "global_step": 400208, "epoch": 4821} {"train_loss": -26.82392692565918, "global_step": 400209, "epoch": 4821} {"train_loss": -26.890399932861328, "global_step": 400210, "epoch": 4821} {"train_loss": -27.062305450439453, "global_step": 400211, "epoch": 4821} {"train_loss": -26.581552505493164, "global_step": 400212, "epoch": 4821} {"train_loss": -26.600143432617188, "global_step": 400213, "epoch": 4821} {"train_loss": -25.99028968811035, "global_step": 400214, "epoch": 4821} {"train_loss": -25.89497947692871, "global_step": 400215, "epoch": 4821} {"train_loss": -26.272306442260742, "global_step": 400216, "epoch": 4821} {"train_loss": -26.58233642578125, "global_step": 400217, "epoch": 4821} {"train_loss": -26.860166549682617, "global_step": 400218, "epoch": 4821} {"train_loss": -26.3908634185791, "global_step": 400219, "epoch": 4821} {"train_loss": -26.311548233032227, "global_step": 400220, "epoch": 4821} {"train_loss": -26.866193771362305, "global_step": 400221, "epoch": 4821} {"train_loss": -26.25083351135254, "global_step": 400222, "epoch": 4821} {"train_loss": -26.339588165283203, "global_step": 400223, "epoch": 4821} {"train_loss": -26.631488800048828, "global_step": 400224, "epoch": 4821} {"train_loss": -26.570965111973774, "global_step": 400225, "epoch": 4821, "val_loss": 6721725.0} {"train_loss": -24.513349533081055, "global_step": 400226, "epoch": 4822} {"train_loss": -24.01304817199707, "global_step": 400227, "epoch": 4822} {"train_loss": -23.231582641601562, "global_step": 400228, "epoch": 4822} {"train_loss": -25.20058822631836, "global_step": 400229, "epoch": 4822} {"train_loss": -25.166351318359375, "global_step": 400230, "epoch": 4822} {"train_loss": -24.864835739135742, "global_step": 400231, "epoch": 4822} {"train_loss": -25.574562072753906, "global_step": 400232, "epoch": 4822} {"train_loss": -25.69990348815918, "global_step": 400233, "epoch": 4822} {"train_loss": -25.31802749633789, "global_step": 400234, "epoch": 4822} {"train_loss": -25.431428909301758, "global_step": 400235, "epoch": 4822} {"train_loss": -25.17311668395996, "global_step": 400236, "epoch": 4822} {"train_loss": -25.572967529296875, "global_step": 400237, "epoch": 4822} {"train_loss": -25.799097061157227, "global_step": 400238, "epoch": 4822} {"train_loss": -25.870344161987305, "global_step": 400239, "epoch": 4822} {"train_loss": -25.959280014038086, "global_step": 400240, "epoch": 4822} {"train_loss": -25.855823516845703, "global_step": 400241, "epoch": 4822} {"train_loss": -25.909351348876953, "global_step": 400242, "epoch": 4822} {"train_loss": -25.647541046142578, "global_step": 400243, "epoch": 4822} {"train_loss": -26.040388107299805, "global_step": 400244, "epoch": 4822} {"train_loss": -26.342161178588867, "global_step": 400245, "epoch": 4822} {"train_loss": -26.516738891601562, "global_step": 400246, "epoch": 4822} {"train_loss": -26.226337432861328, "global_step": 400247, "epoch": 4822} {"train_loss": -26.186203002929688, "global_step": 400248, "epoch": 4822} {"train_loss": -25.917861938476562, "global_step": 400249, "epoch": 4822} {"train_loss": -26.146350860595703, "global_step": 400250, "epoch": 4822} {"train_loss": -26.32026481628418, "global_step": 400251, "epoch": 4822} {"train_loss": -26.21369743347168, "global_step": 400252, "epoch": 4822} {"train_loss": -26.067670822143555, "global_step": 400253, "epoch": 4822} {"train_loss": -26.3045654296875, "global_step": 400254, "epoch": 4822} {"train_loss": -26.160058975219727, "global_step": 400255, "epoch": 4822} {"train_loss": -26.253259658813477, "global_step": 400256, "epoch": 4822} {"train_loss": -26.550073623657227, "global_step": 400257, "epoch": 4822} {"train_loss": -26.81061363220215, "global_step": 400258, "epoch": 4822} {"train_loss": -26.7517032623291, "global_step": 400259, "epoch": 4822} {"train_loss": -26.41936683654785, "global_step": 400260, "epoch": 4822} {"train_loss": -27.003772735595703, "global_step": 400261, "epoch": 4822} {"train_loss": -26.46461296081543, "global_step": 400262, "epoch": 4822} {"train_loss": -26.5189151763916, "global_step": 400263, "epoch": 4822} {"train_loss": -26.425251007080078, "global_step": 400264, "epoch": 4822} {"train_loss": -26.849075317382812, "global_step": 400265, "epoch": 4822} {"train_loss": -26.45733070373535, "global_step": 400266, "epoch": 4822} {"train_loss": -26.761564254760742, "global_step": 400267, "epoch": 4822} {"train_loss": -26.579511642456055, "global_step": 400268, "epoch": 4822} {"train_loss": -26.490110397338867, "global_step": 400269, "epoch": 4822} {"train_loss": -26.746023178100586, "global_step": 400270, "epoch": 4822} {"train_loss": -27.053207397460938, "global_step": 400271, "epoch": 4822} {"train_loss": -27.088254928588867, "global_step": 400272, "epoch": 4822} {"train_loss": -26.897064208984375, "global_step": 400273, "epoch": 4822} {"train_loss": -26.48880958557129, "global_step": 400274, "epoch": 4822} {"train_loss": -26.508207321166992, "global_step": 400275, "epoch": 4822} {"train_loss": -26.87483024597168, "global_step": 400276, "epoch": 4822} {"train_loss": -26.472803115844727, "global_step": 400277, "epoch": 4822} {"train_loss": -26.510915756225586, "global_step": 400278, "epoch": 4822} {"train_loss": -26.503339767456055, "global_step": 400279, "epoch": 4822} {"train_loss": -26.761274337768555, "global_step": 400280, "epoch": 4822} {"train_loss": -26.80251121520996, "global_step": 400281, "epoch": 4822} {"train_loss": -26.775014877319336, "global_step": 400282, "epoch": 4822} {"train_loss": -26.760419845581055, "global_step": 400283, "epoch": 4822} {"train_loss": -26.648847579956055, "global_step": 400284, "epoch": 4822} {"train_loss": -26.619232177734375, "global_step": 400285, "epoch": 4822} {"train_loss": -26.87734031677246, "global_step": 400286, "epoch": 4822} {"train_loss": -26.699323654174805, "global_step": 400287, "epoch": 4822} {"train_loss": -26.986968994140625, "global_step": 400288, "epoch": 4822} {"train_loss": -26.7711124420166, "global_step": 400289, "epoch": 4822} {"train_loss": -26.58037757873535, "global_step": 400290, "epoch": 4822} {"train_loss": -26.58709144592285, "global_step": 400291, "epoch": 4822} {"train_loss": -26.747106552124023, "global_step": 400292, "epoch": 4822} {"train_loss": -26.957300186157227, "global_step": 400293, "epoch": 4822} {"train_loss": -27.07435417175293, "global_step": 400294, "epoch": 4822} {"train_loss": -26.814451217651367, "global_step": 400295, "epoch": 4822} {"train_loss": -26.961353302001953, "global_step": 400296, "epoch": 4822} {"train_loss": -26.92010498046875, "global_step": 400297, "epoch": 4822} {"train_loss": -26.77829360961914, "global_step": 400298, "epoch": 4822} {"train_loss": -26.805225372314453, "global_step": 400299, "epoch": 4822} {"train_loss": -26.607406616210938, "global_step": 400300, "epoch": 4822} {"train_loss": -26.912199020385742, "global_step": 400301, "epoch": 4822} {"train_loss": -27.1894588470459, "global_step": 400302, "epoch": 4822} {"train_loss": -27.221288681030273, "global_step": 400303, "epoch": 4822} {"train_loss": -27.12093162536621, "global_step": 400304, "epoch": 4822} {"train_loss": -26.985198974609375, "global_step": 400305, "epoch": 4822} {"train_loss": -26.506616592407227, "global_step": 400306, "epoch": 4822} {"train_loss": -26.23273277282715, "global_step": 400307, "epoch": 4822} {"train_loss": -26.341734254216572, "global_step": 400308, "epoch": 4822, "val_loss": 6678774.0} {"train_loss": -26.6610107421875, "global_step": 400309, "epoch": 4823} {"train_loss": -26.388952255249023, "global_step": 400310, "epoch": 4823} {"train_loss": -26.597122192382812, "global_step": 400311, "epoch": 4823} {"train_loss": -26.502216339111328, "global_step": 400312, "epoch": 4823} {"train_loss": -26.3583984375, "global_step": 400313, "epoch": 4823} {"train_loss": -26.736127853393555, "global_step": 400314, "epoch": 4823} {"train_loss": -26.76409912109375, "global_step": 400315, "epoch": 4823} {"train_loss": -26.867170333862305, "global_step": 400316, "epoch": 4823} {"train_loss": -26.78229331970215, "global_step": 400317, "epoch": 4823} {"train_loss": -26.57745933532715, "global_step": 400318, "epoch": 4823} {"train_loss": -26.475324630737305, "global_step": 400319, "epoch": 4823} {"train_loss": -26.692480087280273, "global_step": 400320, "epoch": 4823} {"train_loss": -26.643014907836914, "global_step": 400321, "epoch": 4823} {"train_loss": -26.774127960205078, "global_step": 400322, "epoch": 4823} {"train_loss": -26.689716339111328, "global_step": 400323, "epoch": 4823} {"train_loss": -27.093671798706055, "global_step": 400324, "epoch": 4823} {"train_loss": -26.656219482421875, "global_step": 400325, "epoch": 4823} {"train_loss": -26.577817916870117, "global_step": 400326, "epoch": 4823} {"train_loss": -26.666217803955078, "global_step": 400327, "epoch": 4823} {"train_loss": -26.781539916992188, "global_step": 400328, "epoch": 4823} {"train_loss": -26.8994083404541, "global_step": 400329, "epoch": 4823} {"train_loss": -26.740209579467773, "global_step": 400330, "epoch": 4823} {"train_loss": -26.8204288482666, "global_step": 400331, "epoch": 4823} {"train_loss": -26.720748901367188, "global_step": 400332, "epoch": 4823} {"train_loss": -26.69624137878418, "global_step": 400333, "epoch": 4823} {"train_loss": -26.549299240112305, "global_step": 400334, "epoch": 4823} {"train_loss": -26.367176055908203, "global_step": 400335, "epoch": 4823} {"train_loss": -26.419891357421875, "global_step": 400336, "epoch": 4823} {"train_loss": -26.227609634399414, "global_step": 400337, "epoch": 4823} {"train_loss": -26.25669288635254, "global_step": 400338, "epoch": 4823} {"train_loss": -26.1688289642334, "global_step": 400339, "epoch": 4823} {"train_loss": -26.3682918548584, "global_step": 400340, "epoch": 4823} {"train_loss": -26.007123947143555, "global_step": 400341, "epoch": 4823} {"train_loss": -26.5838680267334, "global_step": 400342, "epoch": 4823} {"train_loss": -26.73583984375, "global_step": 400343, "epoch": 4823} {"train_loss": -26.371673583984375, "global_step": 400344, "epoch": 4823} {"train_loss": -26.64288330078125, "global_step": 400345, "epoch": 4823} {"train_loss": -26.3763427734375, "global_step": 400346, "epoch": 4823} {"train_loss": -26.545602798461914, "global_step": 400347, "epoch": 4823} {"train_loss": -26.822589874267578, "global_step": 400348, "epoch": 4823} {"train_loss": -26.591943740844727, "global_step": 400349, "epoch": 4823} {"train_loss": -26.686492919921875, "global_step": 400350, "epoch": 4823} {"train_loss": -26.831802368164062, "global_step": 400351, "epoch": 4823} {"train_loss": -26.689701080322266, "global_step": 400352, "epoch": 4823} {"train_loss": -26.8866024017334, "global_step": 400353, "epoch": 4823} {"train_loss": -26.409225463867188, "global_step": 400354, "epoch": 4823} {"train_loss": -26.791263580322266, "global_step": 400355, "epoch": 4823} {"train_loss": -26.607995986938477, "global_step": 400356, "epoch": 4823} {"train_loss": -26.816980361938477, "global_step": 400357, "epoch": 4823} {"train_loss": -26.640100479125977, "global_step": 400358, "epoch": 4823} {"train_loss": -26.82712745666504, "global_step": 400359, "epoch": 4823} {"train_loss": -26.527820587158203, "global_step": 400360, "epoch": 4823} {"train_loss": -26.36476707458496, "global_step": 400361, "epoch": 4823} {"train_loss": -26.777830123901367, "global_step": 400362, "epoch": 4823} {"train_loss": -26.7093505859375, "global_step": 400363, "epoch": 4823} {"train_loss": -27.1247501373291, "global_step": 400364, "epoch": 4823} {"train_loss": -26.657947540283203, "global_step": 400365, "epoch": 4823} {"train_loss": -26.472442626953125, "global_step": 400366, "epoch": 4823} {"train_loss": -26.374841690063477, "global_step": 400367, "epoch": 4823} {"train_loss": -26.612180709838867, "global_step": 400368, "epoch": 4823} {"train_loss": -26.742155075073242, "global_step": 400369, "epoch": 4823} {"train_loss": -26.587711334228516, "global_step": 400370, "epoch": 4823} {"train_loss": -26.988550186157227, "global_step": 400371, "epoch": 4823} {"train_loss": -26.7365779876709, "global_step": 400372, "epoch": 4823} {"train_loss": -26.39845085144043, "global_step": 400373, "epoch": 4823} {"train_loss": -26.498411178588867, "global_step": 400374, "epoch": 4823} {"train_loss": -26.422391891479492, "global_step": 400375, "epoch": 4823} {"train_loss": -26.528217315673828, "global_step": 400376, "epoch": 4823} {"train_loss": -26.97214126586914, "global_step": 400377, "epoch": 4823} {"train_loss": -26.80280876159668, "global_step": 400378, "epoch": 4823} {"train_loss": -26.560476303100586, "global_step": 400379, "epoch": 4823} {"train_loss": -26.64985466003418, "global_step": 400380, "epoch": 4823} {"train_loss": -26.745222091674805, "global_step": 400381, "epoch": 4823} {"train_loss": -26.583709716796875, "global_step": 400382, "epoch": 4823} {"train_loss": -26.724639892578125, "global_step": 400383, "epoch": 4823} {"train_loss": -26.57368278503418, "global_step": 400384, "epoch": 4823} {"train_loss": -26.765899658203125, "global_step": 400385, "epoch": 4823} {"train_loss": -26.654706954956055, "global_step": 400386, "epoch": 4823} {"train_loss": -26.45564079284668, "global_step": 400387, "epoch": 4823} {"train_loss": -26.749317169189453, "global_step": 400388, "epoch": 4823} {"train_loss": -26.525609970092773, "global_step": 400389, "epoch": 4823} {"train_loss": -26.636905670166016, "global_step": 400390, "epoch": 4823} {"train_loss": -26.621693025152368, "global_step": 400391, "epoch": 4823, "val_loss": 6567229.5} {"train_loss": -26.46283531188965, "global_step": 400392, "epoch": 4824} {"train_loss": -26.507526397705078, "global_step": 400393, "epoch": 4824} {"train_loss": -26.293066024780273, "global_step": 400394, "epoch": 4824} {"train_loss": -26.57935905456543, "global_step": 400395, "epoch": 4824} {"train_loss": -25.449676513671875, "global_step": 400396, "epoch": 4824} {"train_loss": -25.918170928955078, "global_step": 400397, "epoch": 4824} {"train_loss": -25.595956802368164, "global_step": 400398, "epoch": 4824} {"train_loss": -25.551481246948242, "global_step": 400399, "epoch": 4824} {"train_loss": -26.286956787109375, "global_step": 400400, "epoch": 4824} {"train_loss": -25.994775772094727, "global_step": 400401, "epoch": 4824} {"train_loss": -26.046173095703125, "global_step": 400402, "epoch": 4824} {"train_loss": -26.26128578186035, "global_step": 400403, "epoch": 4824} {"train_loss": -26.04131507873535, "global_step": 400404, "epoch": 4824} {"train_loss": -26.198291778564453, "global_step": 400405, "epoch": 4824} {"train_loss": -26.372312545776367, "global_step": 400406, "epoch": 4824} {"train_loss": -26.349164962768555, "global_step": 400407, "epoch": 4824} {"train_loss": -26.65546226501465, "global_step": 400408, "epoch": 4824} {"train_loss": -26.571884155273438, "global_step": 400409, "epoch": 4824} {"train_loss": -26.521289825439453, "global_step": 400410, "epoch": 4824} {"train_loss": -26.20814323425293, "global_step": 400411, "epoch": 4824} {"train_loss": -26.67510986328125, "global_step": 400412, "epoch": 4824} {"train_loss": -26.121051788330078, "global_step": 400413, "epoch": 4824} {"train_loss": -26.755298614501953, "global_step": 400414, "epoch": 4824} {"train_loss": -26.706205368041992, "global_step": 400415, "epoch": 4824} {"train_loss": -26.824939727783203, "global_step": 400416, "epoch": 4824} {"train_loss": -26.71466636657715, "global_step": 400417, "epoch": 4824} {"train_loss": -26.7962646484375, "global_step": 400418, "epoch": 4824} {"train_loss": -26.56344985961914, "global_step": 400419, "epoch": 4824} {"train_loss": -26.40724754333496, "global_step": 400420, "epoch": 4824} {"train_loss": -26.817035675048828, "global_step": 400421, "epoch": 4824} {"train_loss": -26.762531280517578, "global_step": 400422, "epoch": 4824} {"train_loss": -26.630640029907227, "global_step": 400423, "epoch": 4824} {"train_loss": -26.781875610351562, "global_step": 400424, "epoch": 4824} {"train_loss": -26.73711585998535, "global_step": 400425, "epoch": 4824} {"train_loss": -26.776105880737305, "global_step": 400426, "epoch": 4824} {"train_loss": -26.798675537109375, "global_step": 400427, "epoch": 4824} {"train_loss": -26.657224655151367, "global_step": 400428, "epoch": 4824} {"train_loss": -26.71052360534668, "global_step": 400429, "epoch": 4824} {"train_loss": -26.84209632873535, "global_step": 400430, "epoch": 4824} {"train_loss": -26.446191787719727, "global_step": 400431, "epoch": 4824} {"train_loss": -26.846792221069336, "global_step": 400432, "epoch": 4824} {"train_loss": -26.52215003967285, "global_step": 400433, "epoch": 4824} {"train_loss": -26.441919326782227, "global_step": 400434, "epoch": 4824} {"train_loss": -26.7320556640625, "global_step": 400435, "epoch": 4824} {"train_loss": -26.53510093688965, "global_step": 400436, "epoch": 4824} {"train_loss": -26.876745223999023, "global_step": 400437, "epoch": 4824} {"train_loss": -26.855833053588867, "global_step": 400438, "epoch": 4824} {"train_loss": -26.800556182861328, "global_step": 400439, "epoch": 4824} {"train_loss": -26.884613037109375, "global_step": 400440, "epoch": 4824} {"train_loss": -26.68110466003418, "global_step": 400441, "epoch": 4824} {"train_loss": -27.04877281188965, "global_step": 400442, "epoch": 4824} {"train_loss": -26.870635986328125, "global_step": 400443, "epoch": 4824} {"train_loss": -26.367883682250977, "global_step": 400444, "epoch": 4824} {"train_loss": -26.64972496032715, "global_step": 400445, "epoch": 4824} {"train_loss": -26.268339157104492, "global_step": 400446, "epoch": 4824} {"train_loss": -26.20170021057129, "global_step": 400447, "epoch": 4824} {"train_loss": -26.189111709594727, "global_step": 400448, "epoch": 4824} {"train_loss": -26.56538200378418, "global_step": 400449, "epoch": 4824} {"train_loss": -26.74591636657715, "global_step": 400450, "epoch": 4824} {"train_loss": -25.76505470275879, "global_step": 400451, "epoch": 4824} {"train_loss": -26.333831787109375, "global_step": 400452, "epoch": 4824} {"train_loss": -26.489837646484375, "global_step": 400453, "epoch": 4824} {"train_loss": -26.738880157470703, "global_step": 400454, "epoch": 4824} {"train_loss": -26.418121337890625, "global_step": 400455, "epoch": 4824} {"train_loss": -26.455535888671875, "global_step": 400456, "epoch": 4824} {"train_loss": -26.249847412109375, "global_step": 400457, "epoch": 4824} {"train_loss": -26.704214096069336, "global_step": 400458, "epoch": 4824} {"train_loss": -26.758344650268555, "global_step": 400459, "epoch": 4824} {"train_loss": -26.785314559936523, "global_step": 400460, "epoch": 4824} {"train_loss": -26.230070114135742, "global_step": 400461, "epoch": 4824} {"train_loss": -26.3380184173584, "global_step": 400462, "epoch": 4824} {"train_loss": -26.882165908813477, "global_step": 400463, "epoch": 4824} {"train_loss": -26.513349533081055, "global_step": 400464, "epoch": 4824} {"train_loss": -26.352407455444336, "global_step": 400465, "epoch": 4824} {"train_loss": -26.33796501159668, "global_step": 400466, "epoch": 4824} {"train_loss": -26.793323516845703, "global_step": 400467, "epoch": 4824} {"train_loss": -26.07373046875, "global_step": 400468, "epoch": 4824} {"train_loss": -26.50298500061035, "global_step": 400469, "epoch": 4824} {"train_loss": -26.59201431274414, "global_step": 400470, "epoch": 4824} {"train_loss": -26.589752197265625, "global_step": 400471, "epoch": 4824} {"train_loss": -26.55413818359375, "global_step": 400472, "epoch": 4824} {"train_loss": -26.687162399291992, "global_step": 400473, "epoch": 4824} {"train_loss": -26.496578331453254, "global_step": 400474, "epoch": 4824, "val_loss": 6671349.0} {"train_loss": -26.28158950805664, "global_step": 400475, "epoch": 4825} {"train_loss": -26.535755157470703, "global_step": 400476, "epoch": 4825} {"train_loss": -26.40994644165039, "global_step": 400477, "epoch": 4825} {"train_loss": -26.1817626953125, "global_step": 400478, "epoch": 4825} {"train_loss": -26.317243576049805, "global_step": 400479, "epoch": 4825} {"train_loss": -26.43779945373535, "global_step": 400480, "epoch": 4825} {"train_loss": -26.06231689453125, "global_step": 400481, "epoch": 4825} {"train_loss": -26.038623809814453, "global_step": 400482, "epoch": 4825} {"train_loss": -26.083654403686523, "global_step": 400483, "epoch": 4825} {"train_loss": -26.482166290283203, "global_step": 400484, "epoch": 4825} {"train_loss": -26.51655387878418, "global_step": 400485, "epoch": 4825} {"train_loss": -25.828107833862305, "global_step": 400486, "epoch": 4825} {"train_loss": -26.668272018432617, "global_step": 400487, "epoch": 4825} {"train_loss": -26.033987045288086, "global_step": 400488, "epoch": 4825} {"train_loss": -26.6821346282959, "global_step": 400489, "epoch": 4825} {"train_loss": -26.319005966186523, "global_step": 400490, "epoch": 4825} {"train_loss": -26.116424560546875, "global_step": 400491, "epoch": 4825} {"train_loss": -26.152881622314453, "global_step": 400492, "epoch": 4825} {"train_loss": -26.42350196838379, "global_step": 400493, "epoch": 4825} {"train_loss": -26.27362632751465, "global_step": 400494, "epoch": 4825} {"train_loss": -25.823904037475586, "global_step": 400495, "epoch": 4825} {"train_loss": -26.391834259033203, "global_step": 400496, "epoch": 4825} {"train_loss": -26.023279190063477, "global_step": 400497, "epoch": 4825} {"train_loss": -26.380542755126953, "global_step": 400498, "epoch": 4825} {"train_loss": -26.682950973510742, "global_step": 400499, "epoch": 4825} {"train_loss": -26.23237419128418, "global_step": 400500, "epoch": 4825} {"train_loss": -26.448766708374023, "global_step": 400501, "epoch": 4825} {"train_loss": -26.377843856811523, "global_step": 400502, "epoch": 4825} {"train_loss": -26.389097213745117, "global_step": 400503, "epoch": 4825} {"train_loss": -26.946447372436523, "global_step": 400504, "epoch": 4825} {"train_loss": -26.657806396484375, "global_step": 400505, "epoch": 4825} {"train_loss": -26.420928955078125, "global_step": 400506, "epoch": 4825} {"train_loss": -26.572595596313477, "global_step": 400507, "epoch": 4825} {"train_loss": -26.956806182861328, "global_step": 400508, "epoch": 4825} {"train_loss": -26.437292098999023, "global_step": 400509, "epoch": 4825} {"train_loss": -26.577722549438477, "global_step": 400510, "epoch": 4825} {"train_loss": -26.71571159362793, "global_step": 400511, "epoch": 4825} {"train_loss": -26.847700119018555, "global_step": 400512, "epoch": 4825} {"train_loss": -26.62916374206543, "global_step": 400513, "epoch": 4825} {"train_loss": -27.148681640625, "global_step": 400514, "epoch": 4825} {"train_loss": -26.70918083190918, "global_step": 400515, "epoch": 4825} {"train_loss": -26.86838150024414, "global_step": 400516, "epoch": 4825} {"train_loss": -26.708810806274414, "global_step": 400517, "epoch": 4825} {"train_loss": -26.6701717376709, "global_step": 400518, "epoch": 4825} {"train_loss": -26.34950065612793, "global_step": 400519, "epoch": 4825} {"train_loss": -26.753421783447266, "global_step": 400520, "epoch": 4825} {"train_loss": -26.62916374206543, "global_step": 400521, "epoch": 4825} {"train_loss": -26.78595542907715, "global_step": 400522, "epoch": 4825} {"train_loss": -26.71907615661621, "global_step": 400523, "epoch": 4825} {"train_loss": -26.5703125, "global_step": 400524, "epoch": 4825} {"train_loss": -26.722888946533203, "global_step": 400525, "epoch": 4825} {"train_loss": -26.73622703552246, "global_step": 400526, "epoch": 4825} {"train_loss": -26.480548858642578, "global_step": 400527, "epoch": 4825} {"train_loss": -26.670175552368164, "global_step": 400528, "epoch": 4825} {"train_loss": -26.61922264099121, "global_step": 400529, "epoch": 4825} {"train_loss": -26.665842056274414, "global_step": 400530, "epoch": 4825} {"train_loss": -26.798810958862305, "global_step": 400531, "epoch": 4825} {"train_loss": -26.645965576171875, "global_step": 400532, "epoch": 4825} {"train_loss": -26.624109268188477, "global_step": 400533, "epoch": 4825} {"train_loss": -26.598623275756836, "global_step": 400534, "epoch": 4825} {"train_loss": -26.6735782623291, "global_step": 400535, "epoch": 4825} {"train_loss": -26.918853759765625, "global_step": 400536, "epoch": 4825} {"train_loss": -26.707294464111328, "global_step": 400537, "epoch": 4825} {"train_loss": -26.676523208618164, "global_step": 400538, "epoch": 4825} {"train_loss": -26.67119789123535, "global_step": 400539, "epoch": 4825} {"train_loss": -26.59677505493164, "global_step": 400540, "epoch": 4825} {"train_loss": -26.54585075378418, "global_step": 400541, "epoch": 4825} {"train_loss": -26.662616729736328, "global_step": 400542, "epoch": 4825} {"train_loss": -26.6320858001709, "global_step": 400543, "epoch": 4825} {"train_loss": -27.140155792236328, "global_step": 400544, "epoch": 4825} {"train_loss": -26.46781349182129, "global_step": 400545, "epoch": 4825} {"train_loss": -26.756261825561523, "global_step": 400546, "epoch": 4825} {"train_loss": -26.7032527923584, "global_step": 400547, "epoch": 4825} {"train_loss": -27.06316566467285, "global_step": 400548, "epoch": 4825} {"train_loss": -26.73392105102539, "global_step": 400549, "epoch": 4825} {"train_loss": -27.027311325073242, "global_step": 400550, "epoch": 4825} {"train_loss": -26.581708908081055, "global_step": 400551, "epoch": 4825} {"train_loss": -26.750085830688477, "global_step": 400552, "epoch": 4825} {"train_loss": -26.84758949279785, "global_step": 400553, "epoch": 4825} {"train_loss": -26.437658309936523, "global_step": 400554, "epoch": 4825} {"train_loss": -26.510135650634766, "global_step": 400555, "epoch": 4825} {"train_loss": -26.565597534179688, "global_step": 400556, "epoch": 4825} {"train_loss": -26.549724073295135, "global_step": 400557, "epoch": 4825, "val_loss": 6674345.0} {"train_loss": -25.39906883239746, "global_step": 400558, "epoch": 4826} {"train_loss": -24.745328903198242, "global_step": 400559, "epoch": 4826} {"train_loss": -25.10080909729004, "global_step": 400560, "epoch": 4826} {"train_loss": -24.72222900390625, "global_step": 400561, "epoch": 4826} {"train_loss": -25.866357803344727, "global_step": 400562, "epoch": 4826} {"train_loss": -25.08083724975586, "global_step": 400563, "epoch": 4826} {"train_loss": -25.98029136657715, "global_step": 400564, "epoch": 4826} {"train_loss": -25.581165313720703, "global_step": 400565, "epoch": 4826} {"train_loss": -25.937414169311523, "global_step": 400566, "epoch": 4826} {"train_loss": -25.976465225219727, "global_step": 400567, "epoch": 4826} {"train_loss": -25.585582733154297, "global_step": 400568, "epoch": 4826} {"train_loss": -25.897552490234375, "global_step": 400569, "epoch": 4826} {"train_loss": -26.0770206451416, "global_step": 400570, "epoch": 4826} {"train_loss": -26.24207878112793, "global_step": 400571, "epoch": 4826} {"train_loss": -25.731739044189453, "global_step": 400572, "epoch": 4826} {"train_loss": -26.080398559570312, "global_step": 400573, "epoch": 4826} {"train_loss": -26.341638565063477, "global_step": 400574, "epoch": 4826} {"train_loss": -25.987003326416016, "global_step": 400575, "epoch": 4826} {"train_loss": -26.212751388549805, "global_step": 400576, "epoch": 4826} {"train_loss": -26.521520614624023, "global_step": 400577, "epoch": 4826} {"train_loss": -26.20175552368164, "global_step": 400578, "epoch": 4826} {"train_loss": -26.361536026000977, "global_step": 400579, "epoch": 4826} {"train_loss": -26.13443946838379, "global_step": 400580, "epoch": 4826} {"train_loss": -26.617395401000977, "global_step": 400581, "epoch": 4826} {"train_loss": -26.3903751373291, "global_step": 400582, "epoch": 4826} {"train_loss": -26.764902114868164, "global_step": 400583, "epoch": 4826} {"train_loss": -26.6337833404541, "global_step": 400584, "epoch": 4826} {"train_loss": -26.219030380249023, "global_step": 400585, "epoch": 4826} {"train_loss": -26.35286521911621, "global_step": 400586, "epoch": 4826} {"train_loss": -26.557849884033203, "global_step": 400587, "epoch": 4826} {"train_loss": -26.37141227722168, "global_step": 400588, "epoch": 4826} {"train_loss": -26.50067710876465, "global_step": 400589, "epoch": 4826} {"train_loss": -26.332813262939453, "global_step": 400590, "epoch": 4826} {"train_loss": -26.804052352905273, "global_step": 400591, "epoch": 4826} {"train_loss": -26.328298568725586, "global_step": 400592, "epoch": 4826} {"train_loss": -26.722797393798828, "global_step": 400593, "epoch": 4826} {"train_loss": -26.17889404296875, "global_step": 400594, "epoch": 4826} {"train_loss": -26.66914176940918, "global_step": 400595, "epoch": 4826} {"train_loss": -26.50604248046875, "global_step": 400596, "epoch": 4826} {"train_loss": -26.46929931640625, "global_step": 400597, "epoch": 4826} {"train_loss": -26.310529708862305, "global_step": 400598, "epoch": 4826} {"train_loss": -26.803098678588867, "global_step": 400599, "epoch": 4826} {"train_loss": -26.358240127563477, "global_step": 400600, "epoch": 4826} {"train_loss": -26.700225830078125, "global_step": 400601, "epoch": 4826} {"train_loss": -26.06852149963379, "global_step": 400602, "epoch": 4826} {"train_loss": -26.227685928344727, "global_step": 400603, "epoch": 4826} {"train_loss": -26.24045181274414, "global_step": 400604, "epoch": 4826} {"train_loss": -26.800628662109375, "global_step": 400605, "epoch": 4826} {"train_loss": -26.237165451049805, "global_step": 400606, "epoch": 4826} {"train_loss": -26.724353790283203, "global_step": 400607, "epoch": 4826} {"train_loss": -26.58344078063965, "global_step": 400608, "epoch": 4826} {"train_loss": -26.831090927124023, "global_step": 400609, "epoch": 4826} {"train_loss": -26.493513107299805, "global_step": 400610, "epoch": 4826} {"train_loss": -26.758176803588867, "global_step": 400611, "epoch": 4826} {"train_loss": -26.609708786010742, "global_step": 400612, "epoch": 4826} {"train_loss": -26.929059982299805, "global_step": 400613, "epoch": 4826} {"train_loss": -26.675146102905273, "global_step": 400614, "epoch": 4826} {"train_loss": -26.730777740478516, "global_step": 400615, "epoch": 4826} {"train_loss": -27.235021591186523, "global_step": 400616, "epoch": 4826} {"train_loss": -26.794706344604492, "global_step": 400617, "epoch": 4826} {"train_loss": -26.738256454467773, "global_step": 400618, "epoch": 4826} {"train_loss": -26.48874282836914, "global_step": 400619, "epoch": 4826} {"train_loss": -26.607099533081055, "global_step": 400620, "epoch": 4826} {"train_loss": -26.7772216796875, "global_step": 400621, "epoch": 4826} {"train_loss": -26.756103515625, "global_step": 400622, "epoch": 4826} {"train_loss": -26.812646865844727, "global_step": 400623, "epoch": 4826} {"train_loss": -27.041105270385742, "global_step": 400624, "epoch": 4826} {"train_loss": -26.620635986328125, "global_step": 400625, "epoch": 4826} {"train_loss": -26.97486686706543, "global_step": 400626, "epoch": 4826} {"train_loss": -26.56312370300293, "global_step": 400627, "epoch": 4826} {"train_loss": -27.120649337768555, "global_step": 400628, "epoch": 4826} {"train_loss": -26.96586036682129, "global_step": 400629, "epoch": 4826} {"train_loss": -26.932205200195312, "global_step": 400630, "epoch": 4826} {"train_loss": -26.895832061767578, "global_step": 400631, "epoch": 4826} {"train_loss": -26.999494552612305, "global_step": 400632, "epoch": 4826} {"train_loss": -26.732559204101562, "global_step": 400633, "epoch": 4826} {"train_loss": -26.493261337280273, "global_step": 400634, "epoch": 4826} {"train_loss": -26.5089168548584, "global_step": 400635, "epoch": 4826} {"train_loss": -26.890914916992188, "global_step": 400636, "epoch": 4826} {"train_loss": -26.99846839904785, "global_step": 400637, "epoch": 4826} {"train_loss": -26.698352813720703, "global_step": 400638, "epoch": 4826} {"train_loss": -26.95577049255371, "global_step": 400639, "epoch": 4826} {"train_loss": -26.41892594027232, "global_step": 400640, "epoch": 4826, "val_loss": 6702976.0} {"train_loss": -26.431034088134766, "global_step": 400641, "epoch": 4827} {"train_loss": -26.21210289001465, "global_step": 400642, "epoch": 4827} {"train_loss": -26.20399284362793, "global_step": 400643, "epoch": 4827} {"train_loss": -26.13309097290039, "global_step": 400644, "epoch": 4827} {"train_loss": -25.8568172454834, "global_step": 400645, "epoch": 4827} {"train_loss": -26.72015380859375, "global_step": 400646, "epoch": 4827} {"train_loss": -26.38750648498535, "global_step": 400647, "epoch": 4827} {"train_loss": -26.3287296295166, "global_step": 400648, "epoch": 4827} {"train_loss": -26.440616607666016, "global_step": 400649, "epoch": 4827} {"train_loss": -26.584522247314453, "global_step": 400650, "epoch": 4827} {"train_loss": -26.537567138671875, "global_step": 400651, "epoch": 4827} {"train_loss": -26.416614532470703, "global_step": 400652, "epoch": 4827} {"train_loss": -26.465152740478516, "global_step": 400653, "epoch": 4827} {"train_loss": -26.591373443603516, "global_step": 400654, "epoch": 4827} {"train_loss": -26.7540283203125, "global_step": 400655, "epoch": 4827} {"train_loss": -26.36505126953125, "global_step": 400656, "epoch": 4827} {"train_loss": -26.689695358276367, "global_step": 400657, "epoch": 4827} {"train_loss": -26.5162353515625, "global_step": 400658, "epoch": 4827} {"train_loss": -26.578153610229492, "global_step": 400659, "epoch": 4827} {"train_loss": -26.54425048828125, "global_step": 400660, "epoch": 4827} {"train_loss": -26.994556427001953, "global_step": 400661, "epoch": 4827} {"train_loss": -26.524280548095703, "global_step": 400662, "epoch": 4827} {"train_loss": -26.501346588134766, "global_step": 400663, "epoch": 4827} {"train_loss": -26.674245834350586, "global_step": 400664, "epoch": 4827} {"train_loss": -26.81544303894043, "global_step": 400665, "epoch": 4827} {"train_loss": -26.31365394592285, "global_step": 400666, "epoch": 4827} {"train_loss": -26.95050621032715, "global_step": 400667, "epoch": 4827} {"train_loss": -26.422163009643555, "global_step": 400668, "epoch": 4827} {"train_loss": -26.221384048461914, "global_step": 400669, "epoch": 4827} {"train_loss": -26.438302993774414, "global_step": 400670, "epoch": 4827} {"train_loss": -26.552946090698242, "global_step": 400671, "epoch": 4827} {"train_loss": -26.84246253967285, "global_step": 400672, "epoch": 4827} {"train_loss": -26.582868576049805, "global_step": 400673, "epoch": 4827} {"train_loss": -26.480810165405273, "global_step": 400674, "epoch": 4827} {"train_loss": -26.83961296081543, "global_step": 400675, "epoch": 4827} {"train_loss": -26.656896591186523, "global_step": 400676, "epoch": 4827} {"train_loss": -26.693586349487305, "global_step": 400677, "epoch": 4827} {"train_loss": -26.816925048828125, "global_step": 400678, "epoch": 4827} {"train_loss": -26.770681381225586, "global_step": 400679, "epoch": 4827} {"train_loss": -26.852773666381836, "global_step": 400680, "epoch": 4827} {"train_loss": -26.86958885192871, "global_step": 400681, "epoch": 4827} {"train_loss": -26.462615966796875, "global_step": 400682, "epoch": 4827} {"train_loss": -26.687707901000977, "global_step": 400683, "epoch": 4827} {"train_loss": -26.479536056518555, "global_step": 400684, "epoch": 4827} {"train_loss": -26.24591636657715, "global_step": 400685, "epoch": 4827} {"train_loss": -26.4771785736084, "global_step": 400686, "epoch": 4827} {"train_loss": -26.519933700561523, "global_step": 400687, "epoch": 4827} {"train_loss": -26.326459884643555, "global_step": 400688, "epoch": 4827} {"train_loss": -26.435636520385742, "global_step": 400689, "epoch": 4827} {"train_loss": -26.583499908447266, "global_step": 400690, "epoch": 4827} {"train_loss": -26.88669204711914, "global_step": 400691, "epoch": 4827} {"train_loss": -26.223129272460938, "global_step": 400692, "epoch": 4827} {"train_loss": -26.759429931640625, "global_step": 400693, "epoch": 4827} {"train_loss": -26.672687530517578, "global_step": 400694, "epoch": 4827} {"train_loss": -27.112646102905273, "global_step": 400695, "epoch": 4827} {"train_loss": -27.01016616821289, "global_step": 400696, "epoch": 4827} {"train_loss": -26.887176513671875, "global_step": 400697, "epoch": 4827} {"train_loss": -26.55555534362793, "global_step": 400698, "epoch": 4827} {"train_loss": -26.938642501831055, "global_step": 400699, "epoch": 4827} {"train_loss": -26.65558433532715, "global_step": 400700, "epoch": 4827} {"train_loss": -26.6005802154541, "global_step": 400701, "epoch": 4827} {"train_loss": -27.014209747314453, "global_step": 400702, "epoch": 4827} {"train_loss": -27.192529678344727, "global_step": 400703, "epoch": 4827} {"train_loss": -26.6124210357666, "global_step": 400704, "epoch": 4827} {"train_loss": -26.47568130493164, "global_step": 400705, "epoch": 4827} {"train_loss": -26.66213035583496, "global_step": 400706, "epoch": 4827} {"train_loss": -26.311384201049805, "global_step": 400707, "epoch": 4827} {"train_loss": -26.731704711914062, "global_step": 400708, "epoch": 4827} {"train_loss": -26.788894653320312, "global_step": 400709, "epoch": 4827} {"train_loss": -26.770523071289062, "global_step": 400710, "epoch": 4827} {"train_loss": -26.8147029876709, "global_step": 400711, "epoch": 4827} {"train_loss": -26.461002349853516, "global_step": 400712, "epoch": 4827} {"train_loss": -26.225919723510742, "global_step": 400713, "epoch": 4827} {"train_loss": -26.853830337524414, "global_step": 400714, "epoch": 4827} {"train_loss": -26.7790470123291, "global_step": 400715, "epoch": 4827} {"train_loss": -26.6506290435791, "global_step": 400716, "epoch": 4827} {"train_loss": -26.22926139831543, "global_step": 400717, "epoch": 4827} {"train_loss": -26.570737838745117, "global_step": 400718, "epoch": 4827} {"train_loss": -26.704833984375, "global_step": 400719, "epoch": 4827} {"train_loss": -26.237455368041992, "global_step": 400720, "epoch": 4827} {"train_loss": -26.93994140625, "global_step": 400721, "epoch": 4827} {"train_loss": -26.808795928955078, "global_step": 400722, "epoch": 4827} {"train_loss": -26.606962732521886, "global_step": 400723, "epoch": 4827, "val_loss": 6659227.0} {"train_loss": -25.460355758666992, "global_step": 400724, "epoch": 4828} {"train_loss": -25.359954833984375, "global_step": 400725, "epoch": 4828} {"train_loss": -25.34214973449707, "global_step": 400726, "epoch": 4828} {"train_loss": -25.697101593017578, "global_step": 400727, "epoch": 4828} {"train_loss": -25.49317741394043, "global_step": 400728, "epoch": 4828} {"train_loss": -25.938501358032227, "global_step": 400729, "epoch": 4828} {"train_loss": -25.913970947265625, "global_step": 400730, "epoch": 4828} {"train_loss": -25.790821075439453, "global_step": 400731, "epoch": 4828} {"train_loss": -25.8911190032959, "global_step": 400732, "epoch": 4828} {"train_loss": -26.052581787109375, "global_step": 400733, "epoch": 4828} {"train_loss": -25.18088722229004, "global_step": 400734, "epoch": 4828} {"train_loss": -25.946563720703125, "global_step": 400735, "epoch": 4828} {"train_loss": -25.85861587524414, "global_step": 400736, "epoch": 4828} {"train_loss": -26.3082332611084, "global_step": 400737, "epoch": 4828} {"train_loss": -26.09404945373535, "global_step": 400738, "epoch": 4828} {"train_loss": -26.164108276367188, "global_step": 400739, "epoch": 4828} {"train_loss": -26.288175582885742, "global_step": 400740, "epoch": 4828} {"train_loss": -25.91423988342285, "global_step": 400741, "epoch": 4828} {"train_loss": -26.653730392456055, "global_step": 400742, "epoch": 4828} {"train_loss": -26.397266387939453, "global_step": 400743, "epoch": 4828} {"train_loss": -26.176929473876953, "global_step": 400744, "epoch": 4828} {"train_loss": -26.7758731842041, "global_step": 400745, "epoch": 4828} {"train_loss": -26.52277946472168, "global_step": 400746, "epoch": 4828} {"train_loss": -26.609472274780273, "global_step": 400747, "epoch": 4828} {"train_loss": -26.553180694580078, "global_step": 400748, "epoch": 4828} {"train_loss": -26.45757484436035, "global_step": 400749, "epoch": 4828} {"train_loss": -26.503583908081055, "global_step": 400750, "epoch": 4828} {"train_loss": -26.42140007019043, "global_step": 400751, "epoch": 4828} {"train_loss": -26.395788192749023, "global_step": 400752, "epoch": 4828} {"train_loss": -26.848363876342773, "global_step": 400753, "epoch": 4828} {"train_loss": -26.720773696899414, "global_step": 400754, "epoch": 4828} {"train_loss": -26.334369659423828, "global_step": 400755, "epoch": 4828} {"train_loss": -26.49932289123535, "global_step": 400756, "epoch": 4828} {"train_loss": -26.76545524597168, "global_step": 400757, "epoch": 4828} {"train_loss": -26.7273006439209, "global_step": 400758, "epoch": 4828} {"train_loss": -26.709211349487305, "global_step": 400759, "epoch": 4828} {"train_loss": -26.430408477783203, "global_step": 400760, "epoch": 4828} {"train_loss": -26.7893123626709, "global_step": 400761, "epoch": 4828} {"train_loss": -26.54206657409668, "global_step": 400762, "epoch": 4828} {"train_loss": -26.66973876953125, "global_step": 400763, "epoch": 4828} {"train_loss": -26.77617835998535, "global_step": 400764, "epoch": 4828} {"train_loss": -26.70354652404785, "global_step": 400765, "epoch": 4828} {"train_loss": -26.607664108276367, "global_step": 400766, "epoch": 4828} {"train_loss": -26.84686851501465, "global_step": 400767, "epoch": 4828} {"train_loss": -26.735279083251953, "global_step": 400768, "epoch": 4828} {"train_loss": -26.756620407104492, "global_step": 400769, "epoch": 4828} {"train_loss": -26.82508659362793, "global_step": 400770, "epoch": 4828} {"train_loss": -27.082080841064453, "global_step": 400771, "epoch": 4828} {"train_loss": -26.449865341186523, "global_step": 400772, "epoch": 4828} {"train_loss": -26.94222068786621, "global_step": 400773, "epoch": 4828} {"train_loss": -26.519550323486328, "global_step": 400774, "epoch": 4828} {"train_loss": -27.050031661987305, "global_step": 400775, "epoch": 4828} {"train_loss": -26.814111709594727, "global_step": 400776, "epoch": 4828} {"train_loss": -27.042280197143555, "global_step": 400777, "epoch": 4828} {"train_loss": -27.019132614135742, "global_step": 400778, "epoch": 4828} {"train_loss": -26.807815551757812, "global_step": 400779, "epoch": 4828} {"train_loss": -26.89453125, "global_step": 400780, "epoch": 4828} {"train_loss": -26.92331886291504, "global_step": 400781, "epoch": 4828} {"train_loss": -26.92951774597168, "global_step": 400782, "epoch": 4828} {"train_loss": -26.910253524780273, "global_step": 400783, "epoch": 4828} {"train_loss": -26.89020347595215, "global_step": 400784, "epoch": 4828} {"train_loss": -26.883432388305664, "global_step": 400785, "epoch": 4828} {"train_loss": -26.42632484436035, "global_step": 400786, "epoch": 4828} {"train_loss": -26.592466354370117, "global_step": 400787, "epoch": 4828} {"train_loss": -27.1126708984375, "global_step": 400788, "epoch": 4828} {"train_loss": -26.654285430908203, "global_step": 400789, "epoch": 4828} {"train_loss": -26.366674423217773, "global_step": 400790, "epoch": 4828} {"train_loss": -26.477888107299805, "global_step": 400791, "epoch": 4828} {"train_loss": -26.696598052978516, "global_step": 400792, "epoch": 4828} {"train_loss": -26.861846923828125, "global_step": 400793, "epoch": 4828} {"train_loss": -26.67618179321289, "global_step": 400794, "epoch": 4828} {"train_loss": -26.6248779296875, "global_step": 400795, "epoch": 4828} {"train_loss": -26.865875244140625, "global_step": 400796, "epoch": 4828} {"train_loss": -26.569690704345703, "global_step": 400797, "epoch": 4828} {"train_loss": -26.751150131225586, "global_step": 400798, "epoch": 4828} {"train_loss": -26.697467803955078, "global_step": 400799, "epoch": 4828} {"train_loss": -26.753454208374023, "global_step": 400800, "epoch": 4828} {"train_loss": -26.202545166015625, "global_step": 400801, "epoch": 4828} {"train_loss": -26.47879981994629, "global_step": 400802, "epoch": 4828} {"train_loss": -26.856796264648438, "global_step": 400803, "epoch": 4828} {"train_loss": -26.3291072845459, "global_step": 400804, "epoch": 4828} {"train_loss": -26.669565200805664, "global_step": 400805, "epoch": 4828} {"train_loss": -26.494869829660438, "global_step": 400806, "epoch": 4828, "val_loss": 6779534.0} {"train_loss": -25.64483070373535, "global_step": 400807, "epoch": 4829} {"train_loss": -24.837827682495117, "global_step": 400808, "epoch": 4829} {"train_loss": -25.049123764038086, "global_step": 400809, "epoch": 4829} {"train_loss": -24.799402236938477, "global_step": 400810, "epoch": 4829} {"train_loss": -25.95705223083496, "global_step": 400811, "epoch": 4829} {"train_loss": -25.5800838470459, "global_step": 400812, "epoch": 4829} {"train_loss": -25.7120361328125, "global_step": 400813, "epoch": 4829} {"train_loss": -26.213623046875, "global_step": 400814, "epoch": 4829} {"train_loss": -25.794265747070312, "global_step": 400815, "epoch": 4829} {"train_loss": -25.83294677734375, "global_step": 400816, "epoch": 4829} {"train_loss": -26.069936752319336, "global_step": 400817, "epoch": 4829} {"train_loss": -25.84181785583496, "global_step": 400818, "epoch": 4829} {"train_loss": -26.09576988220215, "global_step": 400819, "epoch": 4829} {"train_loss": -25.834287643432617, "global_step": 400820, "epoch": 4829} {"train_loss": -26.1823673248291, "global_step": 400821, "epoch": 4829} {"train_loss": -26.309528350830078, "global_step": 400822, "epoch": 4829} {"train_loss": -26.275653839111328, "global_step": 400823, "epoch": 4829} {"train_loss": -26.376264572143555, "global_step": 400824, "epoch": 4829} {"train_loss": -26.285938262939453, "global_step": 400825, "epoch": 4829} {"train_loss": -26.194055557250977, "global_step": 400826, "epoch": 4829} {"train_loss": -26.297531127929688, "global_step": 400827, "epoch": 4829} {"train_loss": -26.32965087890625, "global_step": 400828, "epoch": 4829} {"train_loss": -26.402973175048828, "global_step": 400829, "epoch": 4829} {"train_loss": -26.58353042602539, "global_step": 400830, "epoch": 4829} {"train_loss": -26.314786911010742, "global_step": 400831, "epoch": 4829} {"train_loss": -26.547931671142578, "global_step": 400832, "epoch": 4829} {"train_loss": -26.344409942626953, "global_step": 400833, "epoch": 4829} {"train_loss": -26.4464054107666, "global_step": 400834, "epoch": 4829} {"train_loss": -26.989431381225586, "global_step": 400835, "epoch": 4829} {"train_loss": -26.38577651977539, "global_step": 400836, "epoch": 4829} {"train_loss": -26.268024444580078, "global_step": 400837, "epoch": 4829} {"train_loss": -26.609485626220703, "global_step": 400838, "epoch": 4829} {"train_loss": -26.22587013244629, "global_step": 400839, "epoch": 4829} {"train_loss": -26.901630401611328, "global_step": 400840, "epoch": 4829} {"train_loss": -26.487552642822266, "global_step": 400841, "epoch": 4829} {"train_loss": -26.59968376159668, "global_step": 400842, "epoch": 4829} {"train_loss": -26.770238876342773, "global_step": 400843, "epoch": 4829} {"train_loss": -27.03681755065918, "global_step": 400844, "epoch": 4829} {"train_loss": -26.733001708984375, "global_step": 400845, "epoch": 4829} {"train_loss": -26.651899337768555, "global_step": 400846, "epoch": 4829} {"train_loss": -26.847461700439453, "global_step": 400847, "epoch": 4829} {"train_loss": -26.883764266967773, "global_step": 400848, "epoch": 4829} {"train_loss": -26.712060928344727, "global_step": 400849, "epoch": 4829} {"train_loss": -26.636152267456055, "global_step": 400850, "epoch": 4829} {"train_loss": -26.871337890625, "global_step": 400851, "epoch": 4829} {"train_loss": -26.549224853515625, "global_step": 400852, "epoch": 4829} {"train_loss": -26.725723266601562, "global_step": 400853, "epoch": 4829} {"train_loss": -26.84335708618164, "global_step": 400854, "epoch": 4829} {"train_loss": -26.9533634185791, "global_step": 400855, "epoch": 4829} {"train_loss": -26.53901481628418, "global_step": 400856, "epoch": 4829} {"train_loss": -26.564716339111328, "global_step": 400857, "epoch": 4829} {"train_loss": -26.458524703979492, "global_step": 400858, "epoch": 4829} {"train_loss": -26.3273868560791, "global_step": 400859, "epoch": 4829} {"train_loss": -26.605121612548828, "global_step": 400860, "epoch": 4829} {"train_loss": -26.49004554748535, "global_step": 400861, "epoch": 4829} {"train_loss": -26.577489852905273, "global_step": 400862, "epoch": 4829} {"train_loss": -26.352270126342773, "global_step": 400863, "epoch": 4829} {"train_loss": -26.731088638305664, "global_step": 400864, "epoch": 4829} {"train_loss": -27.082080841064453, "global_step": 400865, "epoch": 4829} {"train_loss": -26.8680362701416, "global_step": 400866, "epoch": 4829} {"train_loss": -27.023746490478516, "global_step": 400867, "epoch": 4829} {"train_loss": -26.586111068725586, "global_step": 400868, "epoch": 4829} {"train_loss": -26.96493911743164, "global_step": 400869, "epoch": 4829} {"train_loss": -26.488052368164062, "global_step": 400870, "epoch": 4829} {"train_loss": -26.866443634033203, "global_step": 400871, "epoch": 4829} {"train_loss": -26.07908058166504, "global_step": 400872, "epoch": 4829} {"train_loss": -26.28230094909668, "global_step": 400873, "epoch": 4829} {"train_loss": -26.780826568603516, "global_step": 400874, "epoch": 4829} {"train_loss": -27.015180587768555, "global_step": 400875, "epoch": 4829} {"train_loss": -26.648298263549805, "global_step": 400876, "epoch": 4829} {"train_loss": -26.723981857299805, "global_step": 400877, "epoch": 4829} {"train_loss": -26.551923751831055, "global_step": 400878, "epoch": 4829} {"train_loss": -26.893741607666016, "global_step": 400879, "epoch": 4829} {"train_loss": -26.423175811767578, "global_step": 400880, "epoch": 4829} {"train_loss": -26.83180809020996, "global_step": 400881, "epoch": 4829} {"train_loss": -26.605016708374023, "global_step": 400882, "epoch": 4829} {"train_loss": -26.6342716217041, "global_step": 400883, "epoch": 4829} {"train_loss": -27.129779815673828, "global_step": 400884, "epoch": 4829} {"train_loss": -26.66229820251465, "global_step": 400885, "epoch": 4829} {"train_loss": -26.96773338317871, "global_step": 400886, "epoch": 4829} {"train_loss": -26.416540145874023, "global_step": 400887, "epoch": 4829} {"train_loss": -26.483083724975586, "global_step": 400888, "epoch": 4829} {"train_loss": -26.451539211962597, "global_step": 400889, "epoch": 4829, "val_loss": 6794143.0} {"train_loss": -26.12587547302246, "global_step": 400890, "epoch": 4830} {"train_loss": -25.836353302001953, "global_step": 400891, "epoch": 4830} {"train_loss": -26.297529220581055, "global_step": 400892, "epoch": 4830} {"train_loss": -25.861713409423828, "global_step": 400893, "epoch": 4830} {"train_loss": -26.196741104125977, "global_step": 400894, "epoch": 4830} {"train_loss": -26.63984489440918, "global_step": 400895, "epoch": 4830} {"train_loss": -26.067840576171875, "global_step": 400896, "epoch": 4830} {"train_loss": -26.18378257751465, "global_step": 400897, "epoch": 4830} {"train_loss": -26.25689697265625, "global_step": 400898, "epoch": 4830} {"train_loss": -26.190549850463867, "global_step": 400899, "epoch": 4830} {"train_loss": -26.221006393432617, "global_step": 400900, "epoch": 4830} {"train_loss": -26.410444259643555, "global_step": 400901, "epoch": 4830} {"train_loss": -26.644132614135742, "global_step": 400902, "epoch": 4830} {"train_loss": -26.473413467407227, "global_step": 400903, "epoch": 4830} {"train_loss": -26.574752807617188, "global_step": 400904, "epoch": 4830} {"train_loss": -26.79010581970215, "global_step": 400905, "epoch": 4830} {"train_loss": -26.717010498046875, "global_step": 400906, "epoch": 4830} {"train_loss": -26.301776885986328, "global_step": 400907, "epoch": 4830} {"train_loss": -26.455280303955078, "global_step": 400908, "epoch": 4830} {"train_loss": -26.484893798828125, "global_step": 400909, "epoch": 4830} {"train_loss": -26.74945068359375, "global_step": 400910, "epoch": 4830} {"train_loss": -26.33441162109375, "global_step": 400911, "epoch": 4830} {"train_loss": -26.804895401000977, "global_step": 400912, "epoch": 4830} {"train_loss": -26.47052001953125, "global_step": 400913, "epoch": 4830} {"train_loss": -26.622329711914062, "global_step": 400914, "epoch": 4830} {"train_loss": -26.27734375, "global_step": 400915, "epoch": 4830} {"train_loss": -26.706073760986328, "global_step": 400916, "epoch": 4830} {"train_loss": -26.708927154541016, "global_step": 400917, "epoch": 4830} {"train_loss": -27.014379501342773, "global_step": 400918, "epoch": 4830} {"train_loss": -26.26544189453125, "global_step": 400919, "epoch": 4830} {"train_loss": -26.802576065063477, "global_step": 400920, "epoch": 4830} {"train_loss": -26.824323654174805, "global_step": 400921, "epoch": 4830} {"train_loss": -26.8815860748291, "global_step": 400922, "epoch": 4830} {"train_loss": -26.760915756225586, "global_step": 400923, "epoch": 4830} {"train_loss": -26.75813865661621, "global_step": 400924, "epoch": 4830} {"train_loss": -26.79364013671875, "global_step": 400925, "epoch": 4830} {"train_loss": -26.518024444580078, "global_step": 400926, "epoch": 4830} {"train_loss": -26.441486358642578, "global_step": 400927, "epoch": 4830} {"train_loss": -27.04973793029785, "global_step": 400928, "epoch": 4830} {"train_loss": -27.043975830078125, "global_step": 400929, "epoch": 4830} {"train_loss": -26.5341854095459, "global_step": 400930, "epoch": 4830} {"train_loss": -26.67133140563965, "global_step": 400931, "epoch": 4830} {"train_loss": -26.841672897338867, "global_step": 400932, "epoch": 4830} {"train_loss": -26.93252944946289, "global_step": 400933, "epoch": 4830} {"train_loss": -26.964996337890625, "global_step": 400934, "epoch": 4830} {"train_loss": -26.78101921081543, "global_step": 400935, "epoch": 4830} {"train_loss": -26.686691284179688, "global_step": 400936, "epoch": 4830} {"train_loss": -26.767438888549805, "global_step": 400937, "epoch": 4830} {"train_loss": -26.450626373291016, "global_step": 400938, "epoch": 4830} {"train_loss": -26.401580810546875, "global_step": 400939, "epoch": 4830} {"train_loss": -26.56369972229004, "global_step": 400940, "epoch": 4830} {"train_loss": -26.561742782592773, "global_step": 400941, "epoch": 4830} {"train_loss": -26.881729125976562, "global_step": 400942, "epoch": 4830} {"train_loss": -26.17803955078125, "global_step": 400943, "epoch": 4830} {"train_loss": -26.694400787353516, "global_step": 400944, "epoch": 4830} {"train_loss": -26.491220474243164, "global_step": 400945, "epoch": 4830} {"train_loss": -26.5258846282959, "global_step": 400946, "epoch": 4830} {"train_loss": -26.08173942565918, "global_step": 400947, "epoch": 4830} {"train_loss": -26.450613021850586, "global_step": 400948, "epoch": 4830} {"train_loss": -26.800262451171875, "global_step": 400949, "epoch": 4830} {"train_loss": -26.560871124267578, "global_step": 400950, "epoch": 4830} {"train_loss": -26.443326950073242, "global_step": 400951, "epoch": 4830} {"train_loss": -26.544025421142578, "global_step": 400952, "epoch": 4830} {"train_loss": -26.845014572143555, "global_step": 400953, "epoch": 4830} {"train_loss": -26.898193359375, "global_step": 400954, "epoch": 4830} {"train_loss": -26.76449966430664, "global_step": 400955, "epoch": 4830} {"train_loss": -26.556211471557617, "global_step": 400956, "epoch": 4830} {"train_loss": -26.965173721313477, "global_step": 400957, "epoch": 4830} {"train_loss": -26.885791778564453, "global_step": 400958, "epoch": 4830} {"train_loss": -26.401432037353516, "global_step": 400959, "epoch": 4830} {"train_loss": -27.021997451782227, "global_step": 400960, "epoch": 4830} {"train_loss": -26.3707218170166, "global_step": 400961, "epoch": 4830} {"train_loss": -26.547887802124023, "global_step": 400962, "epoch": 4830} {"train_loss": -26.70037269592285, "global_step": 400963, "epoch": 4830} {"train_loss": -26.87738037109375, "global_step": 400964, "epoch": 4830} {"train_loss": -26.6583194732666, "global_step": 400965, "epoch": 4830} {"train_loss": -26.72454833984375, "global_step": 400966, "epoch": 4830} {"train_loss": -26.654376983642578, "global_step": 400967, "epoch": 4830} {"train_loss": -27.084274291992188, "global_step": 400968, "epoch": 4830} {"train_loss": -26.66941261291504, "global_step": 400969, "epoch": 4830} {"train_loss": -26.67990493774414, "global_step": 400970, "epoch": 4830} {"train_loss": -26.589874267578125, "global_step": 400971, "epoch": 4830} {"train_loss": -26.59472867666957, "global_step": 400972, "epoch": 4830, "val_loss": 6795078.0} {"train_loss": -26.19793128967285, "global_step": 400973, "epoch": 4831} {"train_loss": -26.057775497436523, "global_step": 400974, "epoch": 4831} {"train_loss": -26.242599487304688, "global_step": 400975, "epoch": 4831} {"train_loss": -26.226598739624023, "global_step": 400976, "epoch": 4831} {"train_loss": -26.27788734436035, "global_step": 400977, "epoch": 4831} {"train_loss": -26.06844139099121, "global_step": 400978, "epoch": 4831} {"train_loss": -26.63077735900879, "global_step": 400979, "epoch": 4831} {"train_loss": -26.59437370300293, "global_step": 400980, "epoch": 4831} {"train_loss": -26.55177879333496, "global_step": 400981, "epoch": 4831} {"train_loss": -26.305551528930664, "global_step": 400982, "epoch": 4831} {"train_loss": -26.36142349243164, "global_step": 400983, "epoch": 4831} {"train_loss": -26.423084259033203, "global_step": 400984, "epoch": 4831} {"train_loss": -26.182849884033203, "global_step": 400985, "epoch": 4831} {"train_loss": -26.747039794921875, "global_step": 400986, "epoch": 4831} {"train_loss": -26.1318302154541, "global_step": 400987, "epoch": 4831} {"train_loss": -26.187122344970703, "global_step": 400988, "epoch": 4831} {"train_loss": -26.26065444946289, "global_step": 400989, "epoch": 4831} {"train_loss": -26.38248062133789, "global_step": 400990, "epoch": 4831} {"train_loss": -26.308664321899414, "global_step": 400991, "epoch": 4831} {"train_loss": -25.977630615234375, "global_step": 400992, "epoch": 4831} {"train_loss": -26.407358169555664, "global_step": 400993, "epoch": 4831} {"train_loss": -26.362930297851562, "global_step": 400994, "epoch": 4831} {"train_loss": -25.992795944213867, "global_step": 400995, "epoch": 4831} {"train_loss": -26.723190307617188, "global_step": 400996, "epoch": 4831} {"train_loss": -26.740070343017578, "global_step": 400997, "epoch": 4831} {"train_loss": -26.71870994567871, "global_step": 400998, "epoch": 4831} {"train_loss": -26.35088539123535, "global_step": 400999, "epoch": 4831} {"train_loss": -26.456043243408203, "global_step": 401000, "epoch": 4831} {"train_loss": -26.66611099243164, "global_step": 401001, "epoch": 4831} {"train_loss": -26.446142196655273, "global_step": 401002, "epoch": 4831} {"train_loss": -26.71986198425293, "global_step": 401003, "epoch": 4831} {"train_loss": -26.653242111206055, "global_step": 401004, "epoch": 4831} {"train_loss": -26.56878089904785, "global_step": 401005, "epoch": 4831} {"train_loss": -26.509613037109375, "global_step": 401006, "epoch": 4831} {"train_loss": -26.709253311157227, "global_step": 401007, "epoch": 4831} {"train_loss": -26.44927978515625, "global_step": 401008, "epoch": 4831} {"train_loss": -26.579858779907227, "global_step": 401009, "epoch": 4831} {"train_loss": -26.735260009765625, "global_step": 401010, "epoch": 4831} {"train_loss": -26.83526039123535, "global_step": 401011, "epoch": 4831} {"train_loss": -27.14324378967285, "global_step": 401012, "epoch": 4831} {"train_loss": -26.341123580932617, "global_step": 401013, "epoch": 4831} {"train_loss": -26.45564079284668, "global_step": 401014, "epoch": 4831} {"train_loss": -26.857501983642578, "global_step": 401015, "epoch": 4831} {"train_loss": -26.50762367248535, "global_step": 401016, "epoch": 4831} {"train_loss": -26.68404197692871, "global_step": 401017, "epoch": 4831} {"train_loss": -26.82502555847168, "global_step": 401018, "epoch": 4831} {"train_loss": -26.255956649780273, "global_step": 401019, "epoch": 4831} {"train_loss": -26.511920928955078, "global_step": 401020, "epoch": 4831} {"train_loss": -26.41704750061035, "global_step": 401021, "epoch": 4831} {"train_loss": -26.429492950439453, "global_step": 401022, "epoch": 4831} {"train_loss": -26.63568687438965, "global_step": 401023, "epoch": 4831} {"train_loss": -26.170560836791992, "global_step": 401024, "epoch": 4831} {"train_loss": -26.837858200073242, "global_step": 401025, "epoch": 4831} {"train_loss": -26.623655319213867, "global_step": 401026, "epoch": 4831} {"train_loss": -26.38483238220215, "global_step": 401027, "epoch": 4831} {"train_loss": -26.658588409423828, "global_step": 401028, "epoch": 4831} {"train_loss": -26.779932022094727, "global_step": 401029, "epoch": 4831} {"train_loss": -26.746078491210938, "global_step": 401030, "epoch": 4831} {"train_loss": -26.375030517578125, "global_step": 401031, "epoch": 4831} {"train_loss": -26.707935333251953, "global_step": 401032, "epoch": 4831} {"train_loss": -26.716943740844727, "global_step": 401033, "epoch": 4831} {"train_loss": -26.81037712097168, "global_step": 401034, "epoch": 4831} {"train_loss": -27.08326530456543, "global_step": 401035, "epoch": 4831} {"train_loss": -26.738962173461914, "global_step": 401036, "epoch": 4831} {"train_loss": -26.826202392578125, "global_step": 401037, "epoch": 4831} {"train_loss": -26.317914962768555, "global_step": 401038, "epoch": 4831} {"train_loss": -26.716886520385742, "global_step": 401039, "epoch": 4831} {"train_loss": -27.05365562438965, "global_step": 401040, "epoch": 4831} {"train_loss": -26.482940673828125, "global_step": 401041, "epoch": 4831} {"train_loss": -27.05885887145996, "global_step": 401042, "epoch": 4831} {"train_loss": -26.69231605529785, "global_step": 401043, "epoch": 4831} {"train_loss": -27.235675811767578, "global_step": 401044, "epoch": 4831} {"train_loss": -26.54132080078125, "global_step": 401045, "epoch": 4831} {"train_loss": -26.126256942749023, "global_step": 401046, "epoch": 4831} {"train_loss": -26.806142807006836, "global_step": 401047, "epoch": 4831} {"train_loss": -26.504831314086914, "global_step": 401048, "epoch": 4831} {"train_loss": -26.759124755859375, "global_step": 401049, "epoch": 4831} {"train_loss": -26.454761505126953, "global_step": 401050, "epoch": 4831} {"train_loss": -26.787250518798828, "global_step": 401051, "epoch": 4831} {"train_loss": -26.619821548461914, "global_step": 401052, "epoch": 4831} {"train_loss": -26.67647361755371, "global_step": 401053, "epoch": 4831} {"train_loss": -26.487329483032227, "global_step": 401054, "epoch": 4831} {"train_loss": -26.550239907689843, "global_step": 401055, "epoch": 4831, "val_loss": 6742735.0} {"train_loss": -26.97942543029785, "global_step": 401056, "epoch": 4832} {"train_loss": -26.061532974243164, "global_step": 401057, "epoch": 4832} {"train_loss": -26.217533111572266, "global_step": 401058, "epoch": 4832} {"train_loss": -26.524057388305664, "global_step": 401059, "epoch": 4832} {"train_loss": -26.311182022094727, "global_step": 401060, "epoch": 4832} {"train_loss": -25.68482780456543, "global_step": 401061, "epoch": 4832} {"train_loss": -25.92630958557129, "global_step": 401062, "epoch": 4832} {"train_loss": -25.840576171875, "global_step": 401063, "epoch": 4832} {"train_loss": -25.795398712158203, "global_step": 401064, "epoch": 4832} {"train_loss": -25.161819458007812, "global_step": 401065, "epoch": 4832} {"train_loss": -25.99860954284668, "global_step": 401066, "epoch": 4832} {"train_loss": -25.540252685546875, "global_step": 401067, "epoch": 4832} {"train_loss": -26.267871856689453, "global_step": 401068, "epoch": 4832} {"train_loss": -25.924701690673828, "global_step": 401069, "epoch": 4832} {"train_loss": -25.912206649780273, "global_step": 401070, "epoch": 4832} {"train_loss": -25.884008407592773, "global_step": 401071, "epoch": 4832} {"train_loss": -26.051013946533203, "global_step": 401072, "epoch": 4832} {"train_loss": -26.16119956970215, "global_step": 401073, "epoch": 4832} {"train_loss": -26.351449966430664, "global_step": 401074, "epoch": 4832} {"train_loss": -26.354740142822266, "global_step": 401075, "epoch": 4832} {"train_loss": -26.35114097595215, "global_step": 401076, "epoch": 4832} {"train_loss": -26.006454467773438, "global_step": 401077, "epoch": 4832} {"train_loss": -26.514245986938477, "global_step": 401078, "epoch": 4832} {"train_loss": -25.823816299438477, "global_step": 401079, "epoch": 4832} {"train_loss": -26.136571884155273, "global_step": 401080, "epoch": 4832} {"train_loss": -26.44081687927246, "global_step": 401081, "epoch": 4832} {"train_loss": -26.266666412353516, "global_step": 401082, "epoch": 4832} {"train_loss": -26.566638946533203, "global_step": 401083, "epoch": 4832} {"train_loss": -26.471832275390625, "global_step": 401084, "epoch": 4832} {"train_loss": -26.677722930908203, "global_step": 401085, "epoch": 4832} {"train_loss": -26.510541915893555, "global_step": 401086, "epoch": 4832} {"train_loss": -26.456037521362305, "global_step": 401087, "epoch": 4832} {"train_loss": -26.66560173034668, "global_step": 401088, "epoch": 4832} {"train_loss": -26.552871704101562, "global_step": 401089, "epoch": 4832} {"train_loss": -26.44700050354004, "global_step": 401090, "epoch": 4832} {"train_loss": -26.627735137939453, "global_step": 401091, "epoch": 4832} {"train_loss": -26.65732192993164, "global_step": 401092, "epoch": 4832} {"train_loss": -26.84293556213379, "global_step": 401093, "epoch": 4832} {"train_loss": -26.71962547302246, "global_step": 401094, "epoch": 4832} {"train_loss": -26.748977661132812, "global_step": 401095, "epoch": 4832} {"train_loss": -26.418561935424805, "global_step": 401096, "epoch": 4832} {"train_loss": -26.666601181030273, "global_step": 401097, "epoch": 4832} {"train_loss": -26.61490249633789, "global_step": 401098, "epoch": 4832} {"train_loss": -26.83772087097168, "global_step": 401099, "epoch": 4832} {"train_loss": -26.5147647857666, "global_step": 401100, "epoch": 4832} {"train_loss": -26.77410888671875, "global_step": 401101, "epoch": 4832} {"train_loss": -26.332611083984375, "global_step": 401102, "epoch": 4832} {"train_loss": -26.64887046813965, "global_step": 401103, "epoch": 4832} {"train_loss": -26.7371768951416, "global_step": 401104, "epoch": 4832} {"train_loss": -26.782751083374023, "global_step": 401105, "epoch": 4832} {"train_loss": -26.707876205444336, "global_step": 401106, "epoch": 4832} {"train_loss": -26.4731502532959, "global_step": 401107, "epoch": 4832} {"train_loss": -26.4183406829834, "global_step": 401108, "epoch": 4832} {"train_loss": -26.660430908203125, "global_step": 401109, "epoch": 4832} {"train_loss": -26.880878448486328, "global_step": 401110, "epoch": 4832} {"train_loss": -27.057767868041992, "global_step": 401111, "epoch": 4832} {"train_loss": -26.530088424682617, "global_step": 401112, "epoch": 4832} {"train_loss": -26.803735733032227, "global_step": 401113, "epoch": 4832} {"train_loss": -26.518468856811523, "global_step": 401114, "epoch": 4832} {"train_loss": -26.70122718811035, "global_step": 401115, "epoch": 4832} {"train_loss": -26.52031898498535, "global_step": 401116, "epoch": 4832} {"train_loss": -26.399057388305664, "global_step": 401117, "epoch": 4832} {"train_loss": -26.861297607421875, "global_step": 401118, "epoch": 4832} {"train_loss": -26.5447998046875, "global_step": 401119, "epoch": 4832} {"train_loss": -26.768402099609375, "global_step": 401120, "epoch": 4832} {"train_loss": -26.719221115112305, "global_step": 401121, "epoch": 4832} {"train_loss": -26.29327392578125, "global_step": 401122, "epoch": 4832} {"train_loss": -26.56879234313965, "global_step": 401123, "epoch": 4832} {"train_loss": -26.598224639892578, "global_step": 401124, "epoch": 4832} {"train_loss": -26.971588134765625, "global_step": 401125, "epoch": 4832} {"train_loss": -26.80769920349121, "global_step": 401126, "epoch": 4832} {"train_loss": -26.40485191345215, "global_step": 401127, "epoch": 4832} {"train_loss": -26.460102081298828, "global_step": 401128, "epoch": 4832} {"train_loss": -26.031057357788086, "global_step": 401129, "epoch": 4832} {"train_loss": -26.76738929748535, "global_step": 401130, "epoch": 4832} {"train_loss": -26.323566436767578, "global_step": 401131, "epoch": 4832} {"train_loss": -26.60751724243164, "global_step": 401132, "epoch": 4832} {"train_loss": -26.640430450439453, "global_step": 401133, "epoch": 4832} {"train_loss": -26.693029403686523, "global_step": 401134, "epoch": 4832} {"train_loss": -26.532758712768555, "global_step": 401135, "epoch": 4832} {"train_loss": -26.574787139892578, "global_step": 401136, "epoch": 4832} {"train_loss": -26.744291305541992, "global_step": 401137, "epoch": 4832} {"train_loss": -26.43869273633842, "global_step": 401138, "epoch": 4832, "val_loss": 6720220.5} {"train_loss": -26.449426651000977, "global_step": 401139, "epoch": 4833} {"train_loss": -26.702157974243164, "global_step": 401140, "epoch": 4833} {"train_loss": -26.504138946533203, "global_step": 401141, "epoch": 4833} {"train_loss": -26.42677879333496, "global_step": 401142, "epoch": 4833} {"train_loss": -26.2206974029541, "global_step": 401143, "epoch": 4833} {"train_loss": -26.311094284057617, "global_step": 401144, "epoch": 4833} {"train_loss": -26.36992835998535, "global_step": 401145, "epoch": 4833} {"train_loss": -26.94025993347168, "global_step": 401146, "epoch": 4833} {"train_loss": -26.54584312438965, "global_step": 401147, "epoch": 4833} {"train_loss": -26.87939453125, "global_step": 401148, "epoch": 4833} {"train_loss": -26.463125228881836, "global_step": 401149, "epoch": 4833} {"train_loss": -26.628198623657227, "global_step": 401150, "epoch": 4833} {"train_loss": -26.821044921875, "global_step": 401151, "epoch": 4833} {"train_loss": -26.414350509643555, "global_step": 401152, "epoch": 4833} {"train_loss": -26.655439376831055, "global_step": 401153, "epoch": 4833} {"train_loss": -26.353195190429688, "global_step": 401154, "epoch": 4833} {"train_loss": -26.383386611938477, "global_step": 401155, "epoch": 4833} {"train_loss": -26.494428634643555, "global_step": 401156, "epoch": 4833} {"train_loss": -26.742544174194336, "global_step": 401157, "epoch": 4833} {"train_loss": -26.296268463134766, "global_step": 401158, "epoch": 4833} {"train_loss": -27.024078369140625, "global_step": 401159, "epoch": 4833} {"train_loss": -26.256128311157227, "global_step": 401160, "epoch": 4833} {"train_loss": -26.684619903564453, "global_step": 401161, "epoch": 4833} {"train_loss": -26.723066329956055, "global_step": 401162, "epoch": 4833} {"train_loss": -26.508377075195312, "global_step": 401163, "epoch": 4833} {"train_loss": -26.636133193969727, "global_step": 401164, "epoch": 4833} {"train_loss": -26.458585739135742, "global_step": 401165, "epoch": 4833} {"train_loss": -26.8233585357666, "global_step": 401166, "epoch": 4833} {"train_loss": -26.72300148010254, "global_step": 401167, "epoch": 4833} {"train_loss": -26.1455135345459, "global_step": 401168, "epoch": 4833} {"train_loss": -26.2254695892334, "global_step": 401169, "epoch": 4833} {"train_loss": -26.45928382873535, "global_step": 401170, "epoch": 4833} {"train_loss": -26.682775497436523, "global_step": 401171, "epoch": 4833} {"train_loss": -26.3593692779541, "global_step": 401172, "epoch": 4833} {"train_loss": -26.54876708984375, "global_step": 401173, "epoch": 4833} {"train_loss": -26.62627601623535, "global_step": 401174, "epoch": 4833} {"train_loss": -26.51297378540039, "global_step": 401175, "epoch": 4833} {"train_loss": -26.999372482299805, "global_step": 401176, "epoch": 4833} {"train_loss": -26.688098907470703, "global_step": 401177, "epoch": 4833} {"train_loss": -26.793664932250977, "global_step": 401178, "epoch": 4833} {"train_loss": -26.6275577545166, "global_step": 401179, "epoch": 4833} {"train_loss": -26.822538375854492, "global_step": 401180, "epoch": 4833} {"train_loss": -26.255645751953125, "global_step": 401181, "epoch": 4833} {"train_loss": -26.855077743530273, "global_step": 401182, "epoch": 4833} {"train_loss": -26.8377742767334, "global_step": 401183, "epoch": 4833} {"train_loss": -26.630399703979492, "global_step": 401184, "epoch": 4833} {"train_loss": -26.809518814086914, "global_step": 401185, "epoch": 4833} {"train_loss": -26.573394775390625, "global_step": 401186, "epoch": 4833} {"train_loss": -27.042551040649414, "global_step": 401187, "epoch": 4833} {"train_loss": -26.566495895385742, "global_step": 401188, "epoch": 4833} {"train_loss": -26.73847770690918, "global_step": 401189, "epoch": 4833} {"train_loss": -26.99073600769043, "global_step": 401190, "epoch": 4833} {"train_loss": -26.501789093017578, "global_step": 401191, "epoch": 4833} {"train_loss": -26.442920684814453, "global_step": 401192, "epoch": 4833} {"train_loss": -26.89849281311035, "global_step": 401193, "epoch": 4833} {"train_loss": -26.756519317626953, "global_step": 401194, "epoch": 4833} {"train_loss": -26.80707359313965, "global_step": 401195, "epoch": 4833} {"train_loss": -26.452133178710938, "global_step": 401196, "epoch": 4833} {"train_loss": -26.523534774780273, "global_step": 401197, "epoch": 4833} {"train_loss": -26.4031982421875, "global_step": 401198, "epoch": 4833} {"train_loss": -26.29680824279785, "global_step": 401199, "epoch": 4833} {"train_loss": -26.30694007873535, "global_step": 401200, "epoch": 4833} {"train_loss": -26.673919677734375, "global_step": 401201, "epoch": 4833} {"train_loss": -26.556598663330078, "global_step": 401202, "epoch": 4833} {"train_loss": -26.5843448638916, "global_step": 401203, "epoch": 4833} {"train_loss": -26.17982292175293, "global_step": 401204, "epoch": 4833} {"train_loss": -26.0117244720459, "global_step": 401205, "epoch": 4833} {"train_loss": -26.2800235748291, "global_step": 401206, "epoch": 4833} {"train_loss": -26.882831573486328, "global_step": 401207, "epoch": 4833} {"train_loss": -25.9136905670166, "global_step": 401208, "epoch": 4833} {"train_loss": -26.010181427001953, "global_step": 401209, "epoch": 4833} {"train_loss": -26.263309478759766, "global_step": 401210, "epoch": 4833} {"train_loss": -26.6628360748291, "global_step": 401211, "epoch": 4833} {"train_loss": -26.32477378845215, "global_step": 401212, "epoch": 4833} {"train_loss": -26.459247589111328, "global_step": 401213, "epoch": 4833} {"train_loss": -26.695348739624023, "global_step": 401214, "epoch": 4833} {"train_loss": -26.532155990600586, "global_step": 401215, "epoch": 4833} {"train_loss": -26.54902458190918, "global_step": 401216, "epoch": 4833} {"train_loss": -26.503345489501953, "global_step": 401217, "epoch": 4833} {"train_loss": -27.02117347717285, "global_step": 401218, "epoch": 4833} {"train_loss": -26.46662712097168, "global_step": 401219, "epoch": 4833} {"train_loss": -26.646371841430664, "global_step": 401220, "epoch": 4833} {"train_loss": -26.54480729620141, "global_step": 401221, "epoch": 4833, "val_loss": 6781594.0} {"train_loss": -26.67756462097168, "global_step": 401222, "epoch": 4834} {"train_loss": -26.548154830932617, "global_step": 401223, "epoch": 4834} {"train_loss": -26.640918731689453, "global_step": 401224, "epoch": 4834} {"train_loss": -26.18000602722168, "global_step": 401225, "epoch": 4834} {"train_loss": -26.4292049407959, "global_step": 401226, "epoch": 4834} {"train_loss": -26.29937744140625, "global_step": 401227, "epoch": 4834} {"train_loss": -26.645660400390625, "global_step": 401228, "epoch": 4834} {"train_loss": -26.574132919311523, "global_step": 401229, "epoch": 4834} {"train_loss": -26.38251304626465, "global_step": 401230, "epoch": 4834} {"train_loss": -26.19581413269043, "global_step": 401231, "epoch": 4834} {"train_loss": -26.49212074279785, "global_step": 401232, "epoch": 4834} {"train_loss": -26.739938735961914, "global_step": 401233, "epoch": 4834} {"train_loss": -26.435089111328125, "global_step": 401234, "epoch": 4834} {"train_loss": -26.65009117126465, "global_step": 401235, "epoch": 4834} {"train_loss": -26.5767879486084, "global_step": 401236, "epoch": 4834} {"train_loss": -26.551069259643555, "global_step": 401237, "epoch": 4834} {"train_loss": -26.952924728393555, "global_step": 401238, "epoch": 4834} {"train_loss": -26.583471298217773, "global_step": 401239, "epoch": 4834} {"train_loss": -26.285633087158203, "global_step": 401240, "epoch": 4834} {"train_loss": -26.739578247070312, "global_step": 401241, "epoch": 4834} {"train_loss": -26.542743682861328, "global_step": 401242, "epoch": 4834} {"train_loss": -26.595266342163086, "global_step": 401243, "epoch": 4834} {"train_loss": -26.189664840698242, "global_step": 401244, "epoch": 4834} {"train_loss": -26.583154678344727, "global_step": 401245, "epoch": 4834} {"train_loss": -26.928695678710938, "global_step": 401246, "epoch": 4834} {"train_loss": -26.829938888549805, "global_step": 401247, "epoch": 4834} {"train_loss": -26.262426376342773, "global_step": 401248, "epoch": 4834} {"train_loss": -26.302473068237305, "global_step": 401249, "epoch": 4834} {"train_loss": -26.473114013671875, "global_step": 401250, "epoch": 4834} {"train_loss": -26.557693481445312, "global_step": 401251, "epoch": 4834} {"train_loss": -26.500385284423828, "global_step": 401252, "epoch": 4834} {"train_loss": -26.182416915893555, "global_step": 401253, "epoch": 4834} {"train_loss": -26.81654167175293, "global_step": 401254, "epoch": 4834} {"train_loss": -26.741743087768555, "global_step": 401255, "epoch": 4834} {"train_loss": -26.568517684936523, "global_step": 401256, "epoch": 4834} {"train_loss": -26.624481201171875, "global_step": 401257, "epoch": 4834} {"train_loss": -26.492053985595703, "global_step": 401258, "epoch": 4834} {"train_loss": -26.615741729736328, "global_step": 401259, "epoch": 4834} {"train_loss": -26.37750244140625, "global_step": 401260, "epoch": 4834} {"train_loss": -26.78925132751465, "global_step": 401261, "epoch": 4834} {"train_loss": -26.470006942749023, "global_step": 401262, "epoch": 4834} {"train_loss": -26.878164291381836, "global_step": 401263, "epoch": 4834} {"train_loss": -26.7615909576416, "global_step": 401264, "epoch": 4834} {"train_loss": -26.604516983032227, "global_step": 401265, "epoch": 4834} {"train_loss": -26.793628692626953, "global_step": 401266, "epoch": 4834} {"train_loss": -26.70570945739746, "global_step": 401267, "epoch": 4834} {"train_loss": -26.768156051635742, "global_step": 401268, "epoch": 4834} {"train_loss": -26.358566284179688, "global_step": 401269, "epoch": 4834} {"train_loss": -26.5562744140625, "global_step": 401270, "epoch": 4834} {"train_loss": -26.412012100219727, "global_step": 401271, "epoch": 4834} {"train_loss": -26.500076293945312, "global_step": 401272, "epoch": 4834} {"train_loss": -26.447118759155273, "global_step": 401273, "epoch": 4834} {"train_loss": -27.157318115234375, "global_step": 401274, "epoch": 4834} {"train_loss": -26.400836944580078, "global_step": 401275, "epoch": 4834} {"train_loss": -26.38751792907715, "global_step": 401276, "epoch": 4834} {"train_loss": -26.5458984375, "global_step": 401277, "epoch": 4834} {"train_loss": -26.700162887573242, "global_step": 401278, "epoch": 4834} {"train_loss": -26.206769943237305, "global_step": 401279, "epoch": 4834} {"train_loss": -26.413679122924805, "global_step": 401280, "epoch": 4834} {"train_loss": -26.579626083374023, "global_step": 401281, "epoch": 4834} {"train_loss": -26.525434494018555, "global_step": 401282, "epoch": 4834} {"train_loss": -26.913660049438477, "global_step": 401283, "epoch": 4834} {"train_loss": -26.2994384765625, "global_step": 401284, "epoch": 4834} {"train_loss": -26.838531494140625, "global_step": 401285, "epoch": 4834} {"train_loss": -26.651952743530273, "global_step": 401286, "epoch": 4834} {"train_loss": -26.762527465820312, "global_step": 401287, "epoch": 4834} {"train_loss": -26.73655128479004, "global_step": 401288, "epoch": 4834} {"train_loss": -26.594303131103516, "global_step": 401289, "epoch": 4834} {"train_loss": -26.595733642578125, "global_step": 401290, "epoch": 4834} {"train_loss": -26.891834259033203, "global_step": 401291, "epoch": 4834} {"train_loss": -25.971181869506836, "global_step": 401292, "epoch": 4834} {"train_loss": -26.5230712890625, "global_step": 401293, "epoch": 4834} {"train_loss": -26.392194747924805, "global_step": 401294, "epoch": 4834} {"train_loss": -26.545673370361328, "global_step": 401295, "epoch": 4834} {"train_loss": -26.2296199798584, "global_step": 401296, "epoch": 4834} {"train_loss": -26.707433700561523, "global_step": 401297, "epoch": 4834} {"train_loss": -27.018957138061523, "global_step": 401298, "epoch": 4834} {"train_loss": -26.293745040893555, "global_step": 401299, "epoch": 4834} {"train_loss": -26.498899459838867, "global_step": 401300, "epoch": 4834} {"train_loss": -26.69647789001465, "global_step": 401301, "epoch": 4834} {"train_loss": -26.7867431640625, "global_step": 401302, "epoch": 4834} {"train_loss": -26.84376335144043, "global_step": 401303, "epoch": 4834} {"train_loss": -26.565600889274872, "global_step": 401304, "epoch": 4834, "val_loss": 6748354.0} {"train_loss": -26.440601348876953, "global_step": 401305, "epoch": 4835} {"train_loss": -26.363178253173828, "global_step": 401306, "epoch": 4835} {"train_loss": -26.473468780517578, "global_step": 401307, "epoch": 4835} {"train_loss": -26.08209228515625, "global_step": 401308, "epoch": 4835} {"train_loss": -26.002506256103516, "global_step": 401309, "epoch": 4835} {"train_loss": -26.283533096313477, "global_step": 401310, "epoch": 4835} {"train_loss": -26.038894653320312, "global_step": 401311, "epoch": 4835} {"train_loss": -26.1878662109375, "global_step": 401312, "epoch": 4835} {"train_loss": -25.8089656829834, "global_step": 401313, "epoch": 4835} {"train_loss": -26.523548126220703, "global_step": 401314, "epoch": 4835} {"train_loss": -26.047107696533203, "global_step": 401315, "epoch": 4835} {"train_loss": -25.868635177612305, "global_step": 401316, "epoch": 4835} {"train_loss": -26.094446182250977, "global_step": 401317, "epoch": 4835} {"train_loss": -25.862335205078125, "global_step": 401318, "epoch": 4835} {"train_loss": -26.32634925842285, "global_step": 401319, "epoch": 4835} {"train_loss": -26.213651657104492, "global_step": 401320, "epoch": 4835} {"train_loss": -26.634443283081055, "global_step": 401321, "epoch": 4835} {"train_loss": -26.26814079284668, "global_step": 401322, "epoch": 4835} {"train_loss": -26.428485870361328, "global_step": 401323, "epoch": 4835} {"train_loss": -26.069915771484375, "global_step": 401324, "epoch": 4835} {"train_loss": -26.37030601501465, "global_step": 401325, "epoch": 4835} {"train_loss": -26.965320587158203, "global_step": 401326, "epoch": 4835} {"train_loss": -26.38093376159668, "global_step": 401327, "epoch": 4835} {"train_loss": -26.51405143737793, "global_step": 401328, "epoch": 4835} {"train_loss": -26.3702335357666, "global_step": 401329, "epoch": 4835} {"train_loss": -26.10247802734375, "global_step": 401330, "epoch": 4835} {"train_loss": -26.728534698486328, "global_step": 401331, "epoch": 4835} {"train_loss": -26.446380615234375, "global_step": 401332, "epoch": 4835} {"train_loss": -26.5638427734375, "global_step": 401333, "epoch": 4835} {"train_loss": -26.48103141784668, "global_step": 401334, "epoch": 4835} {"train_loss": -26.474597930908203, "global_step": 401335, "epoch": 4835} {"train_loss": -26.676197052001953, "global_step": 401336, "epoch": 4835} {"train_loss": -26.938058853149414, "global_step": 401337, "epoch": 4835} {"train_loss": -26.6522274017334, "global_step": 401338, "epoch": 4835} {"train_loss": -26.765806198120117, "global_step": 401339, "epoch": 4835} {"train_loss": -26.945356369018555, "global_step": 401340, "epoch": 4835} {"train_loss": -26.59901237487793, "global_step": 401341, "epoch": 4835} {"train_loss": -26.81756591796875, "global_step": 401342, "epoch": 4835} {"train_loss": -27.085285186767578, "global_step": 401343, "epoch": 4835} {"train_loss": -26.640954971313477, "global_step": 401344, "epoch": 4835} {"train_loss": -26.83717155456543, "global_step": 401345, "epoch": 4835} {"train_loss": -26.63758659362793, "global_step": 401346, "epoch": 4835} {"train_loss": -27.0211181640625, "global_step": 401347, "epoch": 4835} {"train_loss": -26.406469345092773, "global_step": 401348, "epoch": 4835} {"train_loss": -26.727209091186523, "global_step": 401349, "epoch": 4835} {"train_loss": -26.321640014648438, "global_step": 401350, "epoch": 4835} {"train_loss": -26.5992431640625, "global_step": 401351, "epoch": 4835} {"train_loss": -26.52728843688965, "global_step": 401352, "epoch": 4835} {"train_loss": -26.762060165405273, "global_step": 401353, "epoch": 4835} {"train_loss": -26.269062042236328, "global_step": 401354, "epoch": 4835} {"train_loss": -26.224018096923828, "global_step": 401355, "epoch": 4835} {"train_loss": -26.412525177001953, "global_step": 401356, "epoch": 4835} {"train_loss": -26.972814559936523, "global_step": 401357, "epoch": 4835} {"train_loss": -26.387510299682617, "global_step": 401358, "epoch": 4835} {"train_loss": -26.728124618530273, "global_step": 401359, "epoch": 4835} {"train_loss": -27.059955596923828, "global_step": 401360, "epoch": 4835} {"train_loss": -26.391332626342773, "global_step": 401361, "epoch": 4835} {"train_loss": -26.1856632232666, "global_step": 401362, "epoch": 4835} {"train_loss": -26.337656021118164, "global_step": 401363, "epoch": 4835} {"train_loss": -26.576099395751953, "global_step": 401364, "epoch": 4835} {"train_loss": -27.04288101196289, "global_step": 401365, "epoch": 4835} {"train_loss": -26.95908546447754, "global_step": 401366, "epoch": 4835} {"train_loss": -26.225677490234375, "global_step": 401367, "epoch": 4835} {"train_loss": -26.277875900268555, "global_step": 401368, "epoch": 4835} {"train_loss": -26.615570068359375, "global_step": 401369, "epoch": 4835} {"train_loss": -26.57295036315918, "global_step": 401370, "epoch": 4835} {"train_loss": -26.216033935546875, "global_step": 401371, "epoch": 4835} {"train_loss": -26.22870445251465, "global_step": 401372, "epoch": 4835} {"train_loss": -27.015100479125977, "global_step": 401373, "epoch": 4835} {"train_loss": -26.804962158203125, "global_step": 401374, "epoch": 4835} {"train_loss": -26.387714385986328, "global_step": 401375, "epoch": 4835} {"train_loss": -26.691022872924805, "global_step": 401376, "epoch": 4835} {"train_loss": -26.4537296295166, "global_step": 401377, "epoch": 4835} {"train_loss": -26.007307052612305, "global_step": 401378, "epoch": 4835} {"train_loss": -26.585180282592773, "global_step": 401379, "epoch": 4835} {"train_loss": -26.80750846862793, "global_step": 401380, "epoch": 4835} {"train_loss": -26.76893424987793, "global_step": 401381, "epoch": 4835} {"train_loss": -26.95220947265625, "global_step": 401382, "epoch": 4835} {"train_loss": -26.771076202392578, "global_step": 401383, "epoch": 4835} {"train_loss": -26.626068115234375, "global_step": 401384, "epoch": 4835} {"train_loss": -26.48642349243164, "global_step": 401385, "epoch": 4835} {"train_loss": -26.30983543395996, "global_step": 401386, "epoch": 4835} {"train_loss": -26.49188163481563, "global_step": 401387, "epoch": 4835, "val_loss": 6779937.0} {"train_loss": -26.082691192626953, "global_step": 401388, "epoch": 4836} {"train_loss": -25.903295516967773, "global_step": 401389, "epoch": 4836} {"train_loss": -26.317401885986328, "global_step": 401390, "epoch": 4836} {"train_loss": -26.754959106445312, "global_step": 401391, "epoch": 4836} {"train_loss": -26.40723991394043, "global_step": 401392, "epoch": 4836} {"train_loss": -26.372655868530273, "global_step": 401393, "epoch": 4836} {"train_loss": -26.108352661132812, "global_step": 401394, "epoch": 4836} {"train_loss": -26.752851486206055, "global_step": 401395, "epoch": 4836} {"train_loss": -26.649932861328125, "global_step": 401396, "epoch": 4836} {"train_loss": -26.222131729125977, "global_step": 401397, "epoch": 4836} {"train_loss": -26.597272872924805, "global_step": 401398, "epoch": 4836} {"train_loss": -26.660146713256836, "global_step": 401399, "epoch": 4836} {"train_loss": -26.6966609954834, "global_step": 401400, "epoch": 4836} {"train_loss": -26.71759033203125, "global_step": 401401, "epoch": 4836} {"train_loss": -26.446683883666992, "global_step": 401402, "epoch": 4836} {"train_loss": -26.60808753967285, "global_step": 401403, "epoch": 4836} {"train_loss": -26.729745864868164, "global_step": 401404, "epoch": 4836} {"train_loss": -26.691389083862305, "global_step": 401405, "epoch": 4836} {"train_loss": -26.5998477935791, "global_step": 401406, "epoch": 4836} {"train_loss": -25.9465389251709, "global_step": 401407, "epoch": 4836} {"train_loss": -26.368600845336914, "global_step": 401408, "epoch": 4836} {"train_loss": -26.539709091186523, "global_step": 401409, "epoch": 4836} {"train_loss": -26.469680786132812, "global_step": 401410, "epoch": 4836} {"train_loss": -26.37769889831543, "global_step": 401411, "epoch": 4836} {"train_loss": -26.351537704467773, "global_step": 401412, "epoch": 4836} {"train_loss": -26.5382080078125, "global_step": 401413, "epoch": 4836} {"train_loss": -26.266956329345703, "global_step": 401414, "epoch": 4836} {"train_loss": -26.599401473999023, "global_step": 401415, "epoch": 4836} {"train_loss": -26.713623046875, "global_step": 401416, "epoch": 4836} {"train_loss": -26.683441162109375, "global_step": 401417, "epoch": 4836} {"train_loss": -26.731372833251953, "global_step": 401418, "epoch": 4836} {"train_loss": -26.703962326049805, "global_step": 401419, "epoch": 4836} {"train_loss": -26.684995651245117, "global_step": 401420, "epoch": 4836} {"train_loss": -26.621707916259766, "global_step": 401421, "epoch": 4836} {"train_loss": -26.840635299682617, "global_step": 401422, "epoch": 4836} {"train_loss": -26.573535919189453, "global_step": 401423, "epoch": 4836} {"train_loss": -26.881757736206055, "global_step": 401424, "epoch": 4836} {"train_loss": -26.84100914001465, "global_step": 401425, "epoch": 4836} {"train_loss": -26.880125045776367, "global_step": 401426, "epoch": 4836} {"train_loss": -26.4211368560791, "global_step": 401427, "epoch": 4836} {"train_loss": -26.283430099487305, "global_step": 401428, "epoch": 4836} {"train_loss": -26.390527725219727, "global_step": 401429, "epoch": 4836} {"train_loss": -27.1586856842041, "global_step": 401430, "epoch": 4836} {"train_loss": -26.721471786499023, "global_step": 401431, "epoch": 4836} {"train_loss": -26.801191329956055, "global_step": 401432, "epoch": 4836} {"train_loss": -26.856983184814453, "global_step": 401433, "epoch": 4836} {"train_loss": -27.02199363708496, "global_step": 401434, "epoch": 4836} {"train_loss": -26.508716583251953, "global_step": 401435, "epoch": 4836} {"train_loss": -26.770307540893555, "global_step": 401436, "epoch": 4836} {"train_loss": -26.642133712768555, "global_step": 401437, "epoch": 4836} {"train_loss": -26.818191528320312, "global_step": 401438, "epoch": 4836} {"train_loss": -26.7392578125, "global_step": 401439, "epoch": 4836} {"train_loss": -26.545373916625977, "global_step": 401440, "epoch": 4836} {"train_loss": -26.3155517578125, "global_step": 401441, "epoch": 4836} {"train_loss": -24.9827880859375, "global_step": 401442, "epoch": 4836} {"train_loss": -23.0916690826416, "global_step": 401443, "epoch": 4836} {"train_loss": -25.402944564819336, "global_step": 401444, "epoch": 4836} {"train_loss": -26.48760414123535, "global_step": 401445, "epoch": 4836} {"train_loss": -25.686847686767578, "global_step": 401446, "epoch": 4836} {"train_loss": -26.183624267578125, "global_step": 401447, "epoch": 4836} {"train_loss": -26.205459594726562, "global_step": 401448, "epoch": 4836} {"train_loss": -26.0529727935791, "global_step": 401449, "epoch": 4836} {"train_loss": -26.09539794921875, "global_step": 401450, "epoch": 4836} {"train_loss": -25.76166343688965, "global_step": 401451, "epoch": 4836} {"train_loss": -26.5156192779541, "global_step": 401452, "epoch": 4836} {"train_loss": -26.473623275756836, "global_step": 401453, "epoch": 4836} {"train_loss": -25.99275779724121, "global_step": 401454, "epoch": 4836} {"train_loss": -26.763818740844727, "global_step": 401455, "epoch": 4836} {"train_loss": -26.460790634155273, "global_step": 401456, "epoch": 4836} {"train_loss": -26.0209903717041, "global_step": 401457, "epoch": 4836} {"train_loss": -26.467899322509766, "global_step": 401458, "epoch": 4836} {"train_loss": -26.171859741210938, "global_step": 401459, "epoch": 4836} {"train_loss": -26.505691528320312, "global_step": 401460, "epoch": 4836} {"train_loss": -26.3693904876709, "global_step": 401461, "epoch": 4836} {"train_loss": -26.227319717407227, "global_step": 401462, "epoch": 4836} {"train_loss": -25.99945068359375, "global_step": 401463, "epoch": 4836} {"train_loss": -26.636432647705078, "global_step": 401464, "epoch": 4836} {"train_loss": -26.495771408081055, "global_step": 401465, "epoch": 4836} {"train_loss": -26.223432540893555, "global_step": 401466, "epoch": 4836} {"train_loss": -26.82573890686035, "global_step": 401467, "epoch": 4836} {"train_loss": -26.567224502563477, "global_step": 401468, "epoch": 4836} {"train_loss": -26.4985294342041, "global_step": 401469, "epoch": 4836} {"train_loss": -26.420546543167298, "global_step": 401470, "epoch": 4836, "val_loss": 6722153.5} {"train_loss": -26.41098403930664, "global_step": 401471, "epoch": 4837} {"train_loss": -25.8353214263916, "global_step": 401472, "epoch": 4837} {"train_loss": -26.236312866210938, "global_step": 401473, "epoch": 4837} {"train_loss": -26.24456214904785, "global_step": 401474, "epoch": 4837} {"train_loss": -26.273117065429688, "global_step": 401475, "epoch": 4837} {"train_loss": -26.520099639892578, "global_step": 401476, "epoch": 4837} {"train_loss": -26.29184341430664, "global_step": 401477, "epoch": 4837} {"train_loss": -26.422910690307617, "global_step": 401478, "epoch": 4837} {"train_loss": -26.351449966430664, "global_step": 401479, "epoch": 4837} {"train_loss": -26.305978775024414, "global_step": 401480, "epoch": 4837} {"train_loss": -26.244190216064453, "global_step": 401481, "epoch": 4837} {"train_loss": -26.134876251220703, "global_step": 401482, "epoch": 4837} {"train_loss": -26.27541160583496, "global_step": 401483, "epoch": 4837} {"train_loss": -26.756362915039062, "global_step": 401484, "epoch": 4837} {"train_loss": -26.682912826538086, "global_step": 401485, "epoch": 4837} {"train_loss": -26.353321075439453, "global_step": 401486, "epoch": 4837} {"train_loss": -26.403955459594727, "global_step": 401487, "epoch": 4837} {"train_loss": -26.755874633789062, "global_step": 401488, "epoch": 4837} {"train_loss": -26.875873565673828, "global_step": 401489, "epoch": 4837} {"train_loss": -26.8617000579834, "global_step": 401490, "epoch": 4837} {"train_loss": -26.58329200744629, "global_step": 401491, "epoch": 4837} {"train_loss": -26.430402755737305, "global_step": 401492, "epoch": 4837} {"train_loss": -26.413171768188477, "global_step": 401493, "epoch": 4837} {"train_loss": -26.805557250976562, "global_step": 401494, "epoch": 4837} {"train_loss": -26.27033805847168, "global_step": 401495, "epoch": 4837} {"train_loss": -26.8558292388916, "global_step": 401496, "epoch": 4837} {"train_loss": -26.815168380737305, "global_step": 401497, "epoch": 4837} {"train_loss": -26.661914825439453, "global_step": 401498, "epoch": 4837} {"train_loss": -26.5259952545166, "global_step": 401499, "epoch": 4837} {"train_loss": -26.443744659423828, "global_step": 401500, "epoch": 4837} {"train_loss": -26.779220581054688, "global_step": 401501, "epoch": 4837} {"train_loss": -26.897695541381836, "global_step": 401502, "epoch": 4837} {"train_loss": -26.70121192932129, "global_step": 401503, "epoch": 4837} {"train_loss": -26.112939834594727, "global_step": 401504, "epoch": 4837} {"train_loss": -26.43536376953125, "global_step": 401505, "epoch": 4837} {"train_loss": -26.89588737487793, "global_step": 401506, "epoch": 4837} {"train_loss": -26.448165893554688, "global_step": 401507, "epoch": 4837} {"train_loss": -26.11798667907715, "global_step": 401508, "epoch": 4837} {"train_loss": -25.944854736328125, "global_step": 401509, "epoch": 4837} {"train_loss": -26.405319213867188, "global_step": 401510, "epoch": 4837} {"train_loss": -26.49729347229004, "global_step": 401511, "epoch": 4837} {"train_loss": -26.957382202148438, "global_step": 401512, "epoch": 4837} {"train_loss": -27.147428512573242, "global_step": 401513, "epoch": 4837} {"train_loss": -26.585763931274414, "global_step": 401514, "epoch": 4837} {"train_loss": -27.041152954101562, "global_step": 401515, "epoch": 4837} {"train_loss": -26.910663604736328, "global_step": 401516, "epoch": 4837} {"train_loss": -26.464588165283203, "global_step": 401517, "epoch": 4837} {"train_loss": -26.628339767456055, "global_step": 401518, "epoch": 4837} {"train_loss": -26.729883193969727, "global_step": 401519, "epoch": 4837} {"train_loss": -26.77573585510254, "global_step": 401520, "epoch": 4837} {"train_loss": -26.35940933227539, "global_step": 401521, "epoch": 4837} {"train_loss": -26.87738037109375, "global_step": 401522, "epoch": 4837} {"train_loss": -26.618183135986328, "global_step": 401523, "epoch": 4837} {"train_loss": -26.83552360534668, "global_step": 401524, "epoch": 4837} {"train_loss": -26.40559196472168, "global_step": 401525, "epoch": 4837} {"train_loss": -26.508703231811523, "global_step": 401526, "epoch": 4837} {"train_loss": -26.848682403564453, "global_step": 401527, "epoch": 4837} {"train_loss": -26.841611862182617, "global_step": 401528, "epoch": 4837} {"train_loss": -26.303632736206055, "global_step": 401529, "epoch": 4837} {"train_loss": -25.873632431030273, "global_step": 401530, "epoch": 4837} {"train_loss": -25.383697509765625, "global_step": 401531, "epoch": 4837} {"train_loss": -26.562280654907227, "global_step": 401532, "epoch": 4837} {"train_loss": -26.574499130249023, "global_step": 401533, "epoch": 4837} {"train_loss": -26.43459129333496, "global_step": 401534, "epoch": 4837} {"train_loss": -26.896631240844727, "global_step": 401535, "epoch": 4837} {"train_loss": -26.553781509399414, "global_step": 401536, "epoch": 4837} {"train_loss": -26.35847282409668, "global_step": 401537, "epoch": 4837} {"train_loss": -26.685394287109375, "global_step": 401538, "epoch": 4837} {"train_loss": -26.71201515197754, "global_step": 401539, "epoch": 4837} {"train_loss": -26.517993927001953, "global_step": 401540, "epoch": 4837} {"train_loss": -26.763349533081055, "global_step": 401541, "epoch": 4837} {"train_loss": -26.460790634155273, "global_step": 401542, "epoch": 4837} {"train_loss": -26.613317489624023, "global_step": 401543, "epoch": 4837} {"train_loss": -26.400312423706055, "global_step": 401544, "epoch": 4837} {"train_loss": -26.8039608001709, "global_step": 401545, "epoch": 4837} {"train_loss": -26.485218048095703, "global_step": 401546, "epoch": 4837} {"train_loss": -26.502063751220703, "global_step": 401547, "epoch": 4837} {"train_loss": -26.800891876220703, "global_step": 401548, "epoch": 4837} {"train_loss": -26.462141036987305, "global_step": 401549, "epoch": 4837} {"train_loss": -27.04132652282715, "global_step": 401550, "epoch": 4837} {"train_loss": -26.421483993530273, "global_step": 401551, "epoch": 4837} {"train_loss": -26.403440475463867, "global_step": 401552, "epoch": 4837} {"train_loss": -26.542048098093055, "global_step": 401553, "epoch": 4837, "val_loss": 6793187.5} {"train_loss": -26.074995040893555, "global_step": 401554, "epoch": 4838} {"train_loss": -26.677194595336914, "global_step": 401555, "epoch": 4838} {"train_loss": -26.84186363220215, "global_step": 401556, "epoch": 4838} {"train_loss": -26.125410079956055, "global_step": 401557, "epoch": 4838} {"train_loss": -26.00827407836914, "global_step": 401558, "epoch": 4838} {"train_loss": -26.405664443969727, "global_step": 401559, "epoch": 4838} {"train_loss": -26.393451690673828, "global_step": 401560, "epoch": 4838} {"train_loss": -26.139158248901367, "global_step": 401561, "epoch": 4838} {"train_loss": -26.5819034576416, "global_step": 401562, "epoch": 4838} {"train_loss": -26.362592697143555, "global_step": 401563, "epoch": 4838} {"train_loss": -26.603994369506836, "global_step": 401564, "epoch": 4838} {"train_loss": -26.473953247070312, "global_step": 401565, "epoch": 4838} {"train_loss": -26.559431076049805, "global_step": 401566, "epoch": 4838} {"train_loss": -26.93072509765625, "global_step": 401567, "epoch": 4838} {"train_loss": -26.832050323486328, "global_step": 401568, "epoch": 4838} {"train_loss": -26.78346824645996, "global_step": 401569, "epoch": 4838} {"train_loss": -27.001794815063477, "global_step": 401570, "epoch": 4838} {"train_loss": -26.744287490844727, "global_step": 401571, "epoch": 4838} {"train_loss": -26.797439575195312, "global_step": 401572, "epoch": 4838} {"train_loss": -26.329442977905273, "global_step": 401573, "epoch": 4838} {"train_loss": -26.685644149780273, "global_step": 401574, "epoch": 4838} {"train_loss": -26.8068904876709, "global_step": 401575, "epoch": 4838} {"train_loss": -26.745391845703125, "global_step": 401576, "epoch": 4838} {"train_loss": -26.517194747924805, "global_step": 401577, "epoch": 4838} {"train_loss": -26.8603458404541, "global_step": 401578, "epoch": 4838} {"train_loss": -26.77581214904785, "global_step": 401579, "epoch": 4838} {"train_loss": -26.819950103759766, "global_step": 401580, "epoch": 4838} {"train_loss": -26.752538681030273, "global_step": 401581, "epoch": 4838} {"train_loss": -26.730072021484375, "global_step": 401582, "epoch": 4838} {"train_loss": -26.66849136352539, "global_step": 401583, "epoch": 4838} {"train_loss": -27.07569694519043, "global_step": 401584, "epoch": 4838} {"train_loss": -26.608570098876953, "global_step": 401585, "epoch": 4838} {"train_loss": -26.691604614257812, "global_step": 401586, "epoch": 4838} {"train_loss": -26.99408531188965, "global_step": 401587, "epoch": 4838} {"train_loss": -26.586984634399414, "global_step": 401588, "epoch": 4838} {"train_loss": -26.342987060546875, "global_step": 401589, "epoch": 4838} {"train_loss": -26.5290584564209, "global_step": 401590, "epoch": 4838} {"train_loss": -26.47364616394043, "global_step": 401591, "epoch": 4838} {"train_loss": -25.76258659362793, "global_step": 401592, "epoch": 4838} {"train_loss": -24.707239151000977, "global_step": 401593, "epoch": 4838} {"train_loss": -22.741613388061523, "global_step": 401594, "epoch": 4838} {"train_loss": -25.393951416015625, "global_step": 401595, "epoch": 4838} {"train_loss": -25.728378295898438, "global_step": 401596, "epoch": 4838} {"train_loss": -25.826614379882812, "global_step": 401597, "epoch": 4838} {"train_loss": -25.70979118347168, "global_step": 401598, "epoch": 4838} {"train_loss": -26.005197525024414, "global_step": 401599, "epoch": 4838} {"train_loss": -26.221281051635742, "global_step": 401600, "epoch": 4838} {"train_loss": -26.30499839782715, "global_step": 401601, "epoch": 4838} {"train_loss": -26.243976593017578, "global_step": 401602, "epoch": 4838} {"train_loss": -26.144805908203125, "global_step": 401603, "epoch": 4838} {"train_loss": -26.167612075805664, "global_step": 401604, "epoch": 4838} {"train_loss": -26.538244247436523, "global_step": 401605, "epoch": 4838} {"train_loss": -26.062170028686523, "global_step": 401606, "epoch": 4838} {"train_loss": -26.464269638061523, "global_step": 401607, "epoch": 4838} {"train_loss": -26.374311447143555, "global_step": 401608, "epoch": 4838} {"train_loss": -26.30694580078125, "global_step": 401609, "epoch": 4838} {"train_loss": -26.261295318603516, "global_step": 401610, "epoch": 4838} {"train_loss": -26.152408599853516, "global_step": 401611, "epoch": 4838} {"train_loss": -26.700149536132812, "global_step": 401612, "epoch": 4838} {"train_loss": -26.442249298095703, "global_step": 401613, "epoch": 4838} {"train_loss": -26.482681274414062, "global_step": 401614, "epoch": 4838} {"train_loss": -26.937183380126953, "global_step": 401615, "epoch": 4838} {"train_loss": -26.521026611328125, "global_step": 401616, "epoch": 4838} {"train_loss": -26.6863956451416, "global_step": 401617, "epoch": 4838} {"train_loss": -26.42118263244629, "global_step": 401618, "epoch": 4838} {"train_loss": -26.665363311767578, "global_step": 401619, "epoch": 4838} {"train_loss": -26.365127563476562, "global_step": 401620, "epoch": 4838} {"train_loss": -26.821069717407227, "global_step": 401621, "epoch": 4838} {"train_loss": -26.51515007019043, "global_step": 401622, "epoch": 4838} {"train_loss": -26.7053279876709, "global_step": 401623, "epoch": 4838} {"train_loss": -26.4266300201416, "global_step": 401624, "epoch": 4838} {"train_loss": -26.646581649780273, "global_step": 401625, "epoch": 4838} {"train_loss": -26.330106735229492, "global_step": 401626, "epoch": 4838} {"train_loss": -26.541065216064453, "global_step": 401627, "epoch": 4838} {"train_loss": -26.34979820251465, "global_step": 401628, "epoch": 4838} {"train_loss": -26.681177139282227, "global_step": 401629, "epoch": 4838} {"train_loss": -26.79654884338379, "global_step": 401630, "epoch": 4838} {"train_loss": -26.71368980407715, "global_step": 401631, "epoch": 4838} {"train_loss": -26.634992599487305, "global_step": 401632, "epoch": 4838} {"train_loss": -26.64837074279785, "global_step": 401633, "epoch": 4838} {"train_loss": -26.568225860595703, "global_step": 401634, "epoch": 4838} {"train_loss": -26.6936092376709, "global_step": 401635, "epoch": 4838} {"train_loss": -26.429601784212043, "global_step": 401636, "epoch": 4838, "val_loss": 6769050.0} {"train_loss": -26.400348663330078, "global_step": 401637, "epoch": 4839} {"train_loss": -26.489368438720703, "global_step": 401638, "epoch": 4839} {"train_loss": -26.45049476623535, "global_step": 401639, "epoch": 4839} {"train_loss": -26.254352569580078, "global_step": 401640, "epoch": 4839} {"train_loss": -26.288976669311523, "global_step": 401641, "epoch": 4839} {"train_loss": -26.666616439819336, "global_step": 401642, "epoch": 4839} {"train_loss": -25.9671573638916, "global_step": 401643, "epoch": 4839} {"train_loss": -26.8866024017334, "global_step": 401644, "epoch": 4839} {"train_loss": -26.51149559020996, "global_step": 401645, "epoch": 4839} {"train_loss": -25.982467651367188, "global_step": 401646, "epoch": 4839} {"train_loss": -26.719629287719727, "global_step": 401647, "epoch": 4839} {"train_loss": -26.534711837768555, "global_step": 401648, "epoch": 4839} {"train_loss": -26.024587631225586, "global_step": 401649, "epoch": 4839} {"train_loss": -26.46760368347168, "global_step": 401650, "epoch": 4839} {"train_loss": -26.452917098999023, "global_step": 401651, "epoch": 4839} {"train_loss": -26.375202178955078, "global_step": 401652, "epoch": 4839} {"train_loss": -26.0788631439209, "global_step": 401653, "epoch": 4839} {"train_loss": -26.668737411499023, "global_step": 401654, "epoch": 4839} {"train_loss": -26.557371139526367, "global_step": 401655, "epoch": 4839} {"train_loss": -26.6774959564209, "global_step": 401656, "epoch": 4839} {"train_loss": -26.48012351989746, "global_step": 401657, "epoch": 4839} {"train_loss": -26.747053146362305, "global_step": 401658, "epoch": 4839} {"train_loss": -26.34518814086914, "global_step": 401659, "epoch": 4839} {"train_loss": -26.567800521850586, "global_step": 401660, "epoch": 4839} {"train_loss": -26.89823341369629, "global_step": 401661, "epoch": 4839} {"train_loss": -26.625226974487305, "global_step": 401662, "epoch": 4839} {"train_loss": -26.413837432861328, "global_step": 401663, "epoch": 4839} {"train_loss": -26.405715942382812, "global_step": 401664, "epoch": 4839} {"train_loss": -26.595932006835938, "global_step": 401665, "epoch": 4839} {"train_loss": -26.401718139648438, "global_step": 401666, "epoch": 4839} {"train_loss": -26.54252052307129, "global_step": 401667, "epoch": 4839} {"train_loss": -26.4205379486084, "global_step": 401668, "epoch": 4839} {"train_loss": -26.28965187072754, "global_step": 401669, "epoch": 4839} {"train_loss": -26.5009822845459, "global_step": 401670, "epoch": 4839} {"train_loss": -26.86427879333496, "global_step": 401671, "epoch": 4839} {"train_loss": -26.542285919189453, "global_step": 401672, "epoch": 4839} {"train_loss": -26.807498931884766, "global_step": 401673, "epoch": 4839} {"train_loss": -26.79913902282715, "global_step": 401674, "epoch": 4839} {"train_loss": -26.66511344909668, "global_step": 401675, "epoch": 4839} {"train_loss": -26.98834800720215, "global_step": 401676, "epoch": 4839} {"train_loss": -27.061283111572266, "global_step": 401677, "epoch": 4839} {"train_loss": -27.020017623901367, "global_step": 401678, "epoch": 4839} {"train_loss": -26.907140731811523, "global_step": 401679, "epoch": 4839} {"train_loss": -26.45115089416504, "global_step": 401680, "epoch": 4839} {"train_loss": -26.86602783203125, "global_step": 401681, "epoch": 4839} {"train_loss": -26.93645668029785, "global_step": 401682, "epoch": 4839} {"train_loss": -26.574142456054688, "global_step": 401683, "epoch": 4839} {"train_loss": -26.966644287109375, "global_step": 401684, "epoch": 4839} {"train_loss": -26.64597511291504, "global_step": 401685, "epoch": 4839} {"train_loss": -26.622344970703125, "global_step": 401686, "epoch": 4839} {"train_loss": -27.111371994018555, "global_step": 401687, "epoch": 4839} {"train_loss": -26.620834350585938, "global_step": 401688, "epoch": 4839} {"train_loss": -26.542282104492188, "global_step": 401689, "epoch": 4839} {"train_loss": -26.888341903686523, "global_step": 401690, "epoch": 4839} {"train_loss": -26.802392959594727, "global_step": 401691, "epoch": 4839} {"train_loss": -26.455347061157227, "global_step": 401692, "epoch": 4839} {"train_loss": -26.311359405517578, "global_step": 401693, "epoch": 4839} {"train_loss": -26.256519317626953, "global_step": 401694, "epoch": 4839} {"train_loss": -26.741147994995117, "global_step": 401695, "epoch": 4839} {"train_loss": -26.99411392211914, "global_step": 401696, "epoch": 4839} {"train_loss": -26.09415626525879, "global_step": 401697, "epoch": 4839} {"train_loss": -26.28071403503418, "global_step": 401698, "epoch": 4839} {"train_loss": -27.011518478393555, "global_step": 401699, "epoch": 4839} {"train_loss": -26.297672271728516, "global_step": 401700, "epoch": 4839} {"train_loss": -26.425506591796875, "global_step": 401701, "epoch": 4839} {"train_loss": -26.61930274963379, "global_step": 401702, "epoch": 4839} {"train_loss": -26.58975601196289, "global_step": 401703, "epoch": 4839} {"train_loss": -26.493066787719727, "global_step": 401704, "epoch": 4839} {"train_loss": -26.744903564453125, "global_step": 401705, "epoch": 4839} {"train_loss": -26.551416397094727, "global_step": 401706, "epoch": 4839} {"train_loss": -26.476850509643555, "global_step": 401707, "epoch": 4839} {"train_loss": -26.53541374206543, "global_step": 401708, "epoch": 4839} {"train_loss": -26.399555206298828, "global_step": 401709, "epoch": 4839} {"train_loss": -26.623676300048828, "global_step": 401710, "epoch": 4839} {"train_loss": -26.14204978942871, "global_step": 401711, "epoch": 4839} {"train_loss": -26.517810821533203, "global_step": 401712, "epoch": 4839} {"train_loss": -26.11981201171875, "global_step": 401713, "epoch": 4839} {"train_loss": -26.833526611328125, "global_step": 401714, "epoch": 4839} {"train_loss": -26.554275512695312, "global_step": 401715, "epoch": 4839} {"train_loss": -26.518970489501953, "global_step": 401716, "epoch": 4839} {"train_loss": -26.257577896118164, "global_step": 401717, "epoch": 4839} {"train_loss": -26.433984756469727, "global_step": 401718, "epoch": 4839} {"train_loss": -26.53847972456231, "global_step": 401719, "epoch": 4839, "val_loss": 6804726.0} {"train_loss": -25.595983505249023, "global_step": 401720, "epoch": 4840} {"train_loss": -24.455371856689453, "global_step": 401721, "epoch": 4840} {"train_loss": -25.183012008666992, "global_step": 401722, "epoch": 4840} {"train_loss": -26.331872940063477, "global_step": 401723, "epoch": 4840} {"train_loss": -24.86847496032715, "global_step": 401724, "epoch": 4840} {"train_loss": -26.211444854736328, "global_step": 401725, "epoch": 4840} {"train_loss": -25.52890968322754, "global_step": 401726, "epoch": 4840} {"train_loss": -26.025983810424805, "global_step": 401727, "epoch": 4840} {"train_loss": -25.91982078552246, "global_step": 401728, "epoch": 4840} {"train_loss": -26.1950740814209, "global_step": 401729, "epoch": 4840} {"train_loss": -25.983800888061523, "global_step": 401730, "epoch": 4840} {"train_loss": -26.032026290893555, "global_step": 401731, "epoch": 4840} {"train_loss": -26.470321655273438, "global_step": 401732, "epoch": 4840} {"train_loss": -26.370519638061523, "global_step": 401733, "epoch": 4840} {"train_loss": -26.257675170898438, "global_step": 401734, "epoch": 4840} {"train_loss": -26.348276138305664, "global_step": 401735, "epoch": 4840} {"train_loss": -26.313434600830078, "global_step": 401736, "epoch": 4840} {"train_loss": -26.138233184814453, "global_step": 401737, "epoch": 4840} {"train_loss": -26.44548988342285, "global_step": 401738, "epoch": 4840} {"train_loss": -26.481122970581055, "global_step": 401739, "epoch": 4840} {"train_loss": -26.108198165893555, "global_step": 401740, "epoch": 4840} {"train_loss": -26.27382469177246, "global_step": 401741, "epoch": 4840} {"train_loss": -26.25990104675293, "global_step": 401742, "epoch": 4840} {"train_loss": -26.13311767578125, "global_step": 401743, "epoch": 4840} {"train_loss": -26.02060317993164, "global_step": 401744, "epoch": 4840} {"train_loss": -26.449506759643555, "global_step": 401745, "epoch": 4840} {"train_loss": -26.414365768432617, "global_step": 401746, "epoch": 4840} {"train_loss": -26.69202995300293, "global_step": 401747, "epoch": 4840} {"train_loss": -26.37139892578125, "global_step": 401748, "epoch": 4840} {"train_loss": -26.31858253479004, "global_step": 401749, "epoch": 4840} {"train_loss": -26.67742919921875, "global_step": 401750, "epoch": 4840} {"train_loss": -26.41558837890625, "global_step": 401751, "epoch": 4840} {"train_loss": -26.666568756103516, "global_step": 401752, "epoch": 4840} {"train_loss": -26.461400985717773, "global_step": 401753, "epoch": 4840} {"train_loss": -26.617767333984375, "global_step": 401754, "epoch": 4840} {"train_loss": -26.35320472717285, "global_step": 401755, "epoch": 4840} {"train_loss": -26.418472290039062, "global_step": 401756, "epoch": 4840} {"train_loss": -26.576812744140625, "global_step": 401757, "epoch": 4840} {"train_loss": -26.70722007751465, "global_step": 401758, "epoch": 4840} {"train_loss": -26.3548583984375, "global_step": 401759, "epoch": 4840} {"train_loss": -26.726903915405273, "global_step": 401760, "epoch": 4840} {"train_loss": -26.82671546936035, "global_step": 401761, "epoch": 4840} {"train_loss": -26.612913131713867, "global_step": 401762, "epoch": 4840} {"train_loss": -26.62969398498535, "global_step": 401763, "epoch": 4840} {"train_loss": -26.571762084960938, "global_step": 401764, "epoch": 4840} {"train_loss": -26.78143882751465, "global_step": 401765, "epoch": 4840} {"train_loss": -26.6372013092041, "global_step": 401766, "epoch": 4840} {"train_loss": -26.601728439331055, "global_step": 401767, "epoch": 4840} {"train_loss": -26.546483993530273, "global_step": 401768, "epoch": 4840} {"train_loss": -26.685678482055664, "global_step": 401769, "epoch": 4840} {"train_loss": -26.8034725189209, "global_step": 401770, "epoch": 4840} {"train_loss": -26.663410186767578, "global_step": 401771, "epoch": 4840} {"train_loss": -26.62958335876465, "global_step": 401772, "epoch": 4840} {"train_loss": -26.640003204345703, "global_step": 401773, "epoch": 4840} {"train_loss": -26.961942672729492, "global_step": 401774, "epoch": 4840} {"train_loss": -26.558629989624023, "global_step": 401775, "epoch": 4840} {"train_loss": -27.154767990112305, "global_step": 401776, "epoch": 4840} {"train_loss": -26.603315353393555, "global_step": 401777, "epoch": 4840} {"train_loss": -26.41004753112793, "global_step": 401778, "epoch": 4840} {"train_loss": -26.24769401550293, "global_step": 401779, "epoch": 4840} {"train_loss": -26.80292320251465, "global_step": 401780, "epoch": 4840} {"train_loss": -26.395009994506836, "global_step": 401781, "epoch": 4840} {"train_loss": -26.6215877532959, "global_step": 401782, "epoch": 4840} {"train_loss": -26.828033447265625, "global_step": 401783, "epoch": 4840} {"train_loss": -26.622974395751953, "global_step": 401784, "epoch": 4840} {"train_loss": -26.86566162109375, "global_step": 401785, "epoch": 4840} {"train_loss": -26.685148239135742, "global_step": 401786, "epoch": 4840} {"train_loss": -27.050771713256836, "global_step": 401787, "epoch": 4840} {"train_loss": -26.530492782592773, "global_step": 401788, "epoch": 4840} {"train_loss": -26.791452407836914, "global_step": 401789, "epoch": 4840} {"train_loss": -26.958850860595703, "global_step": 401790, "epoch": 4840} {"train_loss": -26.62090492248535, "global_step": 401791, "epoch": 4840} {"train_loss": -26.485416412353516, "global_step": 401792, "epoch": 4840} {"train_loss": -26.66529655456543, "global_step": 401793, "epoch": 4840} {"train_loss": -26.62159538269043, "global_step": 401794, "epoch": 4840} {"train_loss": -26.451343536376953, "global_step": 401795, "epoch": 4840} {"train_loss": -26.896955490112305, "global_step": 401796, "epoch": 4840} {"train_loss": -26.683807373046875, "global_step": 401797, "epoch": 4840} {"train_loss": -26.85857582092285, "global_step": 401798, "epoch": 4840} {"train_loss": -26.402536392211914, "global_step": 401799, "epoch": 4840} {"train_loss": -26.55086326599121, "global_step": 401800, "epoch": 4840} {"train_loss": -25.997961044311523, "global_step": 401801, "epoch": 4840} {"train_loss": -26.426814918058465, "global_step": 401802, "epoch": 4840, "val_loss": 6812910.0} {"train_loss": -25.816883087158203, "global_step": 401803, "epoch": 4841} {"train_loss": -24.579845428466797, "global_step": 401804, "epoch": 4841} {"train_loss": -25.310434341430664, "global_step": 401805, "epoch": 4841} {"train_loss": -26.28623390197754, "global_step": 401806, "epoch": 4841} {"train_loss": -25.785497665405273, "global_step": 401807, "epoch": 4841} {"train_loss": -26.066686630249023, "global_step": 401808, "epoch": 4841} {"train_loss": -26.229141235351562, "global_step": 401809, "epoch": 4841} {"train_loss": -25.922962188720703, "global_step": 401810, "epoch": 4841} {"train_loss": -25.90704917907715, "global_step": 401811, "epoch": 4841} {"train_loss": -25.8880672454834, "global_step": 401812, "epoch": 4841} {"train_loss": -26.135801315307617, "global_step": 401813, "epoch": 4841} {"train_loss": -26.2669734954834, "global_step": 401814, "epoch": 4841} {"train_loss": -25.975305557250977, "global_step": 401815, "epoch": 4841} {"train_loss": -26.6776123046875, "global_step": 401816, "epoch": 4841} {"train_loss": -26.34235954284668, "global_step": 401817, "epoch": 4841} {"train_loss": -26.47003746032715, "global_step": 401818, "epoch": 4841} {"train_loss": -26.49652671813965, "global_step": 401819, "epoch": 4841} {"train_loss": -26.21720314025879, "global_step": 401820, "epoch": 4841} {"train_loss": -26.24200439453125, "global_step": 401821, "epoch": 4841} {"train_loss": -26.801115036010742, "global_step": 401822, "epoch": 4841} {"train_loss": -26.327966690063477, "global_step": 401823, "epoch": 4841} {"train_loss": -26.734052658081055, "global_step": 401824, "epoch": 4841} {"train_loss": -26.424909591674805, "global_step": 401825, "epoch": 4841} {"train_loss": -26.3343563079834, "global_step": 401826, "epoch": 4841} {"train_loss": -26.340612411499023, "global_step": 401827, "epoch": 4841} {"train_loss": -26.39790153503418, "global_step": 401828, "epoch": 4841} {"train_loss": -26.729639053344727, "global_step": 401829, "epoch": 4841} {"train_loss": -26.61600112915039, "global_step": 401830, "epoch": 4841} {"train_loss": -26.5461483001709, "global_step": 401831, "epoch": 4841} {"train_loss": -26.492328643798828, "global_step": 401832, "epoch": 4841} {"train_loss": -26.780181884765625, "global_step": 401833, "epoch": 4841} {"train_loss": -26.601444244384766, "global_step": 401834, "epoch": 4841} {"train_loss": -26.769378662109375, "global_step": 401835, "epoch": 4841} {"train_loss": -26.45380210876465, "global_step": 401836, "epoch": 4841} {"train_loss": -26.76508903503418, "global_step": 401837, "epoch": 4841} {"train_loss": -26.757619857788086, "global_step": 401838, "epoch": 4841} {"train_loss": -26.152545928955078, "global_step": 401839, "epoch": 4841} {"train_loss": -26.488882064819336, "global_step": 401840, "epoch": 4841} {"train_loss": -26.677322387695312, "global_step": 401841, "epoch": 4841} {"train_loss": -27.1234130859375, "global_step": 401842, "epoch": 4841} {"train_loss": -26.79996681213379, "global_step": 401843, "epoch": 4841} {"train_loss": -26.961231231689453, "global_step": 401844, "epoch": 4841} {"train_loss": -26.464399337768555, "global_step": 401845, "epoch": 4841} {"train_loss": -26.922040939331055, "global_step": 401846, "epoch": 4841} {"train_loss": -26.737674713134766, "global_step": 401847, "epoch": 4841} {"train_loss": -26.781522750854492, "global_step": 401848, "epoch": 4841} {"train_loss": -26.623733520507812, "global_step": 401849, "epoch": 4841} {"train_loss": -26.975126266479492, "global_step": 401850, "epoch": 4841} {"train_loss": -26.814477920532227, "global_step": 401851, "epoch": 4841} {"train_loss": -26.78986167907715, "global_step": 401852, "epoch": 4841} {"train_loss": -27.042499542236328, "global_step": 401853, "epoch": 4841} {"train_loss": -26.936065673828125, "global_step": 401854, "epoch": 4841} {"train_loss": -26.8040828704834, "global_step": 401855, "epoch": 4841} {"train_loss": -26.965808868408203, "global_step": 401856, "epoch": 4841} {"train_loss": -26.400903701782227, "global_step": 401857, "epoch": 4841} {"train_loss": -26.71711540222168, "global_step": 401858, "epoch": 4841} {"train_loss": -26.817136764526367, "global_step": 401859, "epoch": 4841} {"train_loss": -26.70147132873535, "global_step": 401860, "epoch": 4841} {"train_loss": -26.753828048706055, "global_step": 401861, "epoch": 4841} {"train_loss": -26.8079891204834, "global_step": 401862, "epoch": 4841} {"train_loss": -26.71546745300293, "global_step": 401863, "epoch": 4841} {"train_loss": -27.023162841796875, "global_step": 401864, "epoch": 4841} {"train_loss": -26.63666343688965, "global_step": 401865, "epoch": 4841} {"train_loss": -26.478235244750977, "global_step": 401866, "epoch": 4841} {"train_loss": -26.495203018188477, "global_step": 401867, "epoch": 4841} {"train_loss": -26.819580078125, "global_step": 401868, "epoch": 4841} {"train_loss": -26.807676315307617, "global_step": 401869, "epoch": 4841} {"train_loss": -26.69672203063965, "global_step": 401870, "epoch": 4841} {"train_loss": -26.5916805267334, "global_step": 401871, "epoch": 4841} {"train_loss": -26.710935592651367, "global_step": 401872, "epoch": 4841} {"train_loss": -27.18903923034668, "global_step": 401873, "epoch": 4841} {"train_loss": -26.65157127380371, "global_step": 401874, "epoch": 4841} {"train_loss": -26.82159996032715, "global_step": 401875, "epoch": 4841} {"train_loss": -26.45767593383789, "global_step": 401876, "epoch": 4841} {"train_loss": -26.25984001159668, "global_step": 401877, "epoch": 4841} {"train_loss": -26.56258201599121, "global_step": 401878, "epoch": 4841} {"train_loss": -26.797338485717773, "global_step": 401879, "epoch": 4841} {"train_loss": -27.107391357421875, "global_step": 401880, "epoch": 4841} {"train_loss": -26.968402862548828, "global_step": 401881, "epoch": 4841} {"train_loss": -27.0975399017334, "global_step": 401882, "epoch": 4841} {"train_loss": -26.66901969909668, "global_step": 401883, "epoch": 4841} {"train_loss": -26.69839859008789, "global_step": 401884, "epoch": 4841} {"train_loss": -26.552870440195843, "global_step": 401885, "epoch": 4841, "val_loss": 6768447.5} {"train_loss": -26.46036720275879, "global_step": 401886, "epoch": 4842} {"train_loss": -26.122541427612305, "global_step": 401887, "epoch": 4842} {"train_loss": -25.711578369140625, "global_step": 401888, "epoch": 4842} {"train_loss": -25.748260498046875, "global_step": 401889, "epoch": 4842} {"train_loss": -26.19671058654785, "global_step": 401890, "epoch": 4842} {"train_loss": -26.564197540283203, "global_step": 401891, "epoch": 4842} {"train_loss": -26.05842399597168, "global_step": 401892, "epoch": 4842} {"train_loss": -26.091638565063477, "global_step": 401893, "epoch": 4842} {"train_loss": -26.10105323791504, "global_step": 401894, "epoch": 4842} {"train_loss": -26.033981323242188, "global_step": 401895, "epoch": 4842} {"train_loss": -26.419843673706055, "global_step": 401896, "epoch": 4842} {"train_loss": -26.47308921813965, "global_step": 401897, "epoch": 4842} {"train_loss": -26.812925338745117, "global_step": 401898, "epoch": 4842} {"train_loss": -26.49383544921875, "global_step": 401899, "epoch": 4842} {"train_loss": -26.363880157470703, "global_step": 401900, "epoch": 4842} {"train_loss": -26.64019203186035, "global_step": 401901, "epoch": 4842} {"train_loss": -26.748090744018555, "global_step": 401902, "epoch": 4842} {"train_loss": -26.3084774017334, "global_step": 401903, "epoch": 4842} {"train_loss": -26.799848556518555, "global_step": 401904, "epoch": 4842} {"train_loss": -26.355356216430664, "global_step": 401905, "epoch": 4842} {"train_loss": -26.680688858032227, "global_step": 401906, "epoch": 4842} {"train_loss": -26.568103790283203, "global_step": 401907, "epoch": 4842} {"train_loss": -26.70011329650879, "global_step": 401908, "epoch": 4842} {"train_loss": -26.771081924438477, "global_step": 401909, "epoch": 4842} {"train_loss": -26.2979793548584, "global_step": 401910, "epoch": 4842} {"train_loss": -26.468076705932617, "global_step": 401911, "epoch": 4842} {"train_loss": -26.406631469726562, "global_step": 401912, "epoch": 4842} {"train_loss": -26.686954498291016, "global_step": 401913, "epoch": 4842} {"train_loss": -26.60498046875, "global_step": 401914, "epoch": 4842} {"train_loss": -26.801855087280273, "global_step": 401915, "epoch": 4842} {"train_loss": -26.65756607055664, "global_step": 401916, "epoch": 4842} {"train_loss": -26.880126953125, "global_step": 401917, "epoch": 4842} {"train_loss": -26.538557052612305, "global_step": 401918, "epoch": 4842} {"train_loss": -26.551679611206055, "global_step": 401919, "epoch": 4842} {"train_loss": -26.576574325561523, "global_step": 401920, "epoch": 4842} {"train_loss": -26.764108657836914, "global_step": 401921, "epoch": 4842} {"train_loss": -26.690906524658203, "global_step": 401922, "epoch": 4842} {"train_loss": -26.947607040405273, "global_step": 401923, "epoch": 4842} {"train_loss": -26.62543296813965, "global_step": 401924, "epoch": 4842} {"train_loss": -26.833984375, "global_step": 401925, "epoch": 4842} {"train_loss": -26.965290069580078, "global_step": 401926, "epoch": 4842} {"train_loss": -26.73335075378418, "global_step": 401927, "epoch": 4842} {"train_loss": -26.83216667175293, "global_step": 401928, "epoch": 4842} {"train_loss": -26.726511001586914, "global_step": 401929, "epoch": 4842} {"train_loss": -26.696353912353516, "global_step": 401930, "epoch": 4842} {"train_loss": -26.514875411987305, "global_step": 401931, "epoch": 4842} {"train_loss": -26.031522750854492, "global_step": 401932, "epoch": 4842} {"train_loss": -25.93536949157715, "global_step": 401933, "epoch": 4842} {"train_loss": -26.40174674987793, "global_step": 401934, "epoch": 4842} {"train_loss": -26.66632080078125, "global_step": 401935, "epoch": 4842} {"train_loss": -25.974609375, "global_step": 401936, "epoch": 4842} {"train_loss": -26.48560905456543, "global_step": 401937, "epoch": 4842} {"train_loss": -26.47258949279785, "global_step": 401938, "epoch": 4842} {"train_loss": -26.658782958984375, "global_step": 401939, "epoch": 4842} {"train_loss": -26.8024959564209, "global_step": 401940, "epoch": 4842} {"train_loss": -26.81830406188965, "global_step": 401941, "epoch": 4842} {"train_loss": -26.502172470092773, "global_step": 401942, "epoch": 4842} {"train_loss": -26.500839233398438, "global_step": 401943, "epoch": 4842} {"train_loss": -26.53065299987793, "global_step": 401944, "epoch": 4842} {"train_loss": -26.8051815032959, "global_step": 401945, "epoch": 4842} {"train_loss": -26.759702682495117, "global_step": 401946, "epoch": 4842} {"train_loss": -27.04095458984375, "global_step": 401947, "epoch": 4842} {"train_loss": -26.79302406311035, "global_step": 401948, "epoch": 4842} {"train_loss": -26.85854148864746, "global_step": 401949, "epoch": 4842} {"train_loss": -26.953659057617188, "global_step": 401950, "epoch": 4842} {"train_loss": -26.758087158203125, "global_step": 401951, "epoch": 4842} {"train_loss": -27.188879013061523, "global_step": 401952, "epoch": 4842} {"train_loss": -26.839523315429688, "global_step": 401953, "epoch": 4842} {"train_loss": -26.44880485534668, "global_step": 401954, "epoch": 4842} {"train_loss": -26.51981544494629, "global_step": 401955, "epoch": 4842} {"train_loss": -27.024999618530273, "global_step": 401956, "epoch": 4842} {"train_loss": -26.981821060180664, "global_step": 401957, "epoch": 4842} {"train_loss": -26.26641273498535, "global_step": 401958, "epoch": 4842} {"train_loss": -26.445465087890625, "global_step": 401959, "epoch": 4842} {"train_loss": -26.5068359375, "global_step": 401960, "epoch": 4842} {"train_loss": -26.78397560119629, "global_step": 401961, "epoch": 4842} {"train_loss": -26.698719024658203, "global_step": 401962, "epoch": 4842} {"train_loss": -26.41559410095215, "global_step": 401963, "epoch": 4842} {"train_loss": -26.8641300201416, "global_step": 401964, "epoch": 4842} {"train_loss": -26.837080001831055, "global_step": 401965, "epoch": 4842} {"train_loss": -26.4853515625, "global_step": 401966, "epoch": 4842} {"train_loss": -26.6888427734375, "global_step": 401967, "epoch": 4842} {"train_loss": -26.577981650111187, "global_step": 401968, "epoch": 4842, "val_loss": 6873824.0} {"train_loss": -26.492345809936523, "global_step": 401969, "epoch": 4843} {"train_loss": -26.3455867767334, "global_step": 401970, "epoch": 4843} {"train_loss": -26.467065811157227, "global_step": 401971, "epoch": 4843} {"train_loss": -26.19711685180664, "global_step": 401972, "epoch": 4843} {"train_loss": -26.044864654541016, "global_step": 401973, "epoch": 4843} {"train_loss": -26.282026290893555, "global_step": 401974, "epoch": 4843} {"train_loss": -26.097320556640625, "global_step": 401975, "epoch": 4843} {"train_loss": -26.614246368408203, "global_step": 401976, "epoch": 4843} {"train_loss": -26.311084747314453, "global_step": 401977, "epoch": 4843} {"train_loss": -26.449304580688477, "global_step": 401978, "epoch": 4843} {"train_loss": -26.1827335357666, "global_step": 401979, "epoch": 4843} {"train_loss": -26.0306396484375, "global_step": 401980, "epoch": 4843} {"train_loss": -26.31952476501465, "global_step": 401981, "epoch": 4843} {"train_loss": -26.379175186157227, "global_step": 401982, "epoch": 4843} {"train_loss": -26.593366622924805, "global_step": 401983, "epoch": 4843} {"train_loss": -26.493839263916016, "global_step": 401984, "epoch": 4843} {"train_loss": -26.496801376342773, "global_step": 401985, "epoch": 4843} {"train_loss": -26.5216007232666, "global_step": 401986, "epoch": 4843} {"train_loss": -26.89249038696289, "global_step": 401987, "epoch": 4843} {"train_loss": -26.920446395874023, "global_step": 401988, "epoch": 4843} {"train_loss": -26.464094161987305, "global_step": 401989, "epoch": 4843} {"train_loss": -26.5720157623291, "global_step": 401990, "epoch": 4843} {"train_loss": -26.48184585571289, "global_step": 401991, "epoch": 4843} {"train_loss": -26.62664222717285, "global_step": 401992, "epoch": 4843} {"train_loss": -26.578338623046875, "global_step": 401993, "epoch": 4843} {"train_loss": -26.585742950439453, "global_step": 401994, "epoch": 4843} {"train_loss": -26.57744789123535, "global_step": 401995, "epoch": 4843} {"train_loss": -26.716848373413086, "global_step": 401996, "epoch": 4843} {"train_loss": -27.133298873901367, "global_step": 401997, "epoch": 4843} {"train_loss": -26.752853393554688, "global_step": 401998, "epoch": 4843} {"train_loss": -26.795129776000977, "global_step": 401999, "epoch": 4843} {"train_loss": -26.6908016204834, "global_step": 402000, "epoch": 4843} {"train_loss": -26.86980628967285, "global_step": 402001, "epoch": 4843} {"train_loss": -26.687469482421875, "global_step": 402002, "epoch": 4843} {"train_loss": -26.8505916595459, "global_step": 402003, "epoch": 4843} {"train_loss": -26.34962272644043, "global_step": 402004, "epoch": 4843} {"train_loss": -26.808216094970703, "global_step": 402005, "epoch": 4843} {"train_loss": -26.591800689697266, "global_step": 402006, "epoch": 4843} {"train_loss": -26.748708724975586, "global_step": 402007, "epoch": 4843} {"train_loss": -26.718103408813477, "global_step": 402008, "epoch": 4843} {"train_loss": -26.834009170532227, "global_step": 402009, "epoch": 4843} {"train_loss": -26.900434494018555, "global_step": 402010, "epoch": 4843} {"train_loss": -26.875951766967773, "global_step": 402011, "epoch": 4843} {"train_loss": -26.83740234375, "global_step": 402012, "epoch": 4843} {"train_loss": -26.716690063476562, "global_step": 402013, "epoch": 4843} {"train_loss": -26.672300338745117, "global_step": 402014, "epoch": 4843} {"train_loss": -26.62623405456543, "global_step": 402015, "epoch": 4843} {"train_loss": -26.68145179748535, "global_step": 402016, "epoch": 4843} {"train_loss": -26.82900047302246, "global_step": 402017, "epoch": 4843} {"train_loss": -26.39674186706543, "global_step": 402018, "epoch": 4843} {"train_loss": -26.481908798217773, "global_step": 402019, "epoch": 4843} {"train_loss": -26.569929122924805, "global_step": 402020, "epoch": 4843} {"train_loss": -26.982685089111328, "global_step": 402021, "epoch": 4843} {"train_loss": -26.526391983032227, "global_step": 402022, "epoch": 4843} {"train_loss": -26.785924911499023, "global_step": 402023, "epoch": 4843} {"train_loss": -26.887531280517578, "global_step": 402024, "epoch": 4843} {"train_loss": -26.62153434753418, "global_step": 402025, "epoch": 4843} {"train_loss": -26.483068466186523, "global_step": 402026, "epoch": 4843} {"train_loss": -26.27691078186035, "global_step": 402027, "epoch": 4843} {"train_loss": -26.80598258972168, "global_step": 402028, "epoch": 4843} {"train_loss": -26.64004898071289, "global_step": 402029, "epoch": 4843} {"train_loss": -26.459552764892578, "global_step": 402030, "epoch": 4843} {"train_loss": -26.725393295288086, "global_step": 402031, "epoch": 4843} {"train_loss": -26.126239776611328, "global_step": 402032, "epoch": 4843} {"train_loss": -26.54949378967285, "global_step": 402033, "epoch": 4843} {"train_loss": -26.48663902282715, "global_step": 402034, "epoch": 4843} {"train_loss": -26.67978286743164, "global_step": 402035, "epoch": 4843} {"train_loss": -26.916950225830078, "global_step": 402036, "epoch": 4843} {"train_loss": -26.620336532592773, "global_step": 402037, "epoch": 4843} {"train_loss": -26.4831485748291, "global_step": 402038, "epoch": 4843} {"train_loss": -26.574392318725586, "global_step": 402039, "epoch": 4843} {"train_loss": -26.767654418945312, "global_step": 402040, "epoch": 4843} {"train_loss": -26.905588150024414, "global_step": 402041, "epoch": 4843} {"train_loss": -26.2971248626709, "global_step": 402042, "epoch": 4843} {"train_loss": -25.867841720581055, "global_step": 402043, "epoch": 4843} {"train_loss": -26.81801414489746, "global_step": 402044, "epoch": 4843} {"train_loss": -26.54839515686035, "global_step": 402045, "epoch": 4843} {"train_loss": -26.0777587890625, "global_step": 402046, "epoch": 4843} {"train_loss": -26.06546974182129, "global_step": 402047, "epoch": 4843} {"train_loss": -26.486478805541992, "global_step": 402048, "epoch": 4843} {"train_loss": -25.987478256225586, "global_step": 402049, "epoch": 4843} {"train_loss": -26.08542251586914, "global_step": 402050, "epoch": 4843} {"train_loss": -26.53800035959267, "global_step": 402051, "epoch": 4843, "val_loss": 6792541.0} {"train_loss": -25.87445068359375, "global_step": 402052, "epoch": 4844} {"train_loss": -26.146183013916016, "global_step": 402053, "epoch": 4844} {"train_loss": -26.293848037719727, "global_step": 402054, "epoch": 4844} {"train_loss": -25.96449089050293, "global_step": 402055, "epoch": 4844} {"train_loss": -25.981109619140625, "global_step": 402056, "epoch": 4844} {"train_loss": -25.590341567993164, "global_step": 402057, "epoch": 4844} {"train_loss": -26.283523559570312, "global_step": 402058, "epoch": 4844} {"train_loss": -26.26716423034668, "global_step": 402059, "epoch": 4844} {"train_loss": -26.170862197875977, "global_step": 402060, "epoch": 4844} {"train_loss": -25.650720596313477, "global_step": 402061, "epoch": 4844} {"train_loss": -26.244876861572266, "global_step": 402062, "epoch": 4844} {"train_loss": -25.87104606628418, "global_step": 402063, "epoch": 4844} {"train_loss": -26.265338897705078, "global_step": 402064, "epoch": 4844} {"train_loss": -26.621374130249023, "global_step": 402065, "epoch": 4844} {"train_loss": -26.387319564819336, "global_step": 402066, "epoch": 4844} {"train_loss": -25.982858657836914, "global_step": 402067, "epoch": 4844} {"train_loss": -26.42754554748535, "global_step": 402068, "epoch": 4844} {"train_loss": -26.347965240478516, "global_step": 402069, "epoch": 4844} {"train_loss": -26.236785888671875, "global_step": 402070, "epoch": 4844} {"train_loss": -26.32305908203125, "global_step": 402071, "epoch": 4844} {"train_loss": -26.570114135742188, "global_step": 402072, "epoch": 4844} {"train_loss": -26.77880859375, "global_step": 402073, "epoch": 4844} {"train_loss": -26.443845748901367, "global_step": 402074, "epoch": 4844} {"train_loss": -26.496183395385742, "global_step": 402075, "epoch": 4844} {"train_loss": -26.325775146484375, "global_step": 402076, "epoch": 4844} {"train_loss": -26.37721824645996, "global_step": 402077, "epoch": 4844} {"train_loss": -26.533918380737305, "global_step": 402078, "epoch": 4844} {"train_loss": -26.256656646728516, "global_step": 402079, "epoch": 4844} {"train_loss": -26.3588809967041, "global_step": 402080, "epoch": 4844} {"train_loss": -26.322980880737305, "global_step": 402081, "epoch": 4844} {"train_loss": -26.635595321655273, "global_step": 402082, "epoch": 4844} {"train_loss": -25.965932846069336, "global_step": 402083, "epoch": 4844} {"train_loss": -26.99814224243164, "global_step": 402084, "epoch": 4844} {"train_loss": -26.644384384155273, "global_step": 402085, "epoch": 4844} {"train_loss": -26.50849723815918, "global_step": 402086, "epoch": 4844} {"train_loss": -26.771316528320312, "global_step": 402087, "epoch": 4844} {"train_loss": -26.5026798248291, "global_step": 402088, "epoch": 4844} {"train_loss": -26.29596519470215, "global_step": 402089, "epoch": 4844} {"train_loss": -26.599958419799805, "global_step": 402090, "epoch": 4844} {"train_loss": -26.94508934020996, "global_step": 402091, "epoch": 4844} {"train_loss": -26.582754135131836, "global_step": 402092, "epoch": 4844} {"train_loss": -26.79705238342285, "global_step": 402093, "epoch": 4844} {"train_loss": -26.3494930267334, "global_step": 402094, "epoch": 4844} {"train_loss": -26.59516716003418, "global_step": 402095, "epoch": 4844} {"train_loss": -26.836822509765625, "global_step": 402096, "epoch": 4844} {"train_loss": -26.333805084228516, "global_step": 402097, "epoch": 4844} {"train_loss": -26.93475914001465, "global_step": 402098, "epoch": 4844} {"train_loss": -26.55951499938965, "global_step": 402099, "epoch": 4844} {"train_loss": -26.46272087097168, "global_step": 402100, "epoch": 4844} {"train_loss": -26.737958908081055, "global_step": 402101, "epoch": 4844} {"train_loss": -26.848373413085938, "global_step": 402102, "epoch": 4844} {"train_loss": -26.8104190826416, "global_step": 402103, "epoch": 4844} {"train_loss": -26.430761337280273, "global_step": 402104, "epoch": 4844} {"train_loss": -27.03981590270996, "global_step": 402105, "epoch": 4844} {"train_loss": -26.960529327392578, "global_step": 402106, "epoch": 4844} {"train_loss": -26.7041015625, "global_step": 402107, "epoch": 4844} {"train_loss": -26.9360294342041, "global_step": 402108, "epoch": 4844} {"train_loss": -26.58473014831543, "global_step": 402109, "epoch": 4844} {"train_loss": -26.79463005065918, "global_step": 402110, "epoch": 4844} {"train_loss": -26.513214111328125, "global_step": 402111, "epoch": 4844} {"train_loss": -26.644031524658203, "global_step": 402112, "epoch": 4844} {"train_loss": -26.243167877197266, "global_step": 402113, "epoch": 4844} {"train_loss": -25.89888572692871, "global_step": 402114, "epoch": 4844} {"train_loss": -26.35225486755371, "global_step": 402115, "epoch": 4844} {"train_loss": -26.0706844329834, "global_step": 402116, "epoch": 4844} {"train_loss": -26.648406982421875, "global_step": 402117, "epoch": 4844} {"train_loss": -26.472259521484375, "global_step": 402118, "epoch": 4844} {"train_loss": -26.545896530151367, "global_step": 402119, "epoch": 4844} {"train_loss": -26.511856079101562, "global_step": 402120, "epoch": 4844} {"train_loss": -26.53232192993164, "global_step": 402121, "epoch": 4844} {"train_loss": -26.816755294799805, "global_step": 402122, "epoch": 4844} {"train_loss": -26.591291427612305, "global_step": 402123, "epoch": 4844} {"train_loss": -26.806238174438477, "global_step": 402124, "epoch": 4844} {"train_loss": -26.305200576782227, "global_step": 402125, "epoch": 4844} {"train_loss": -26.450170516967773, "global_step": 402126, "epoch": 4844} {"train_loss": -26.77375602722168, "global_step": 402127, "epoch": 4844} {"train_loss": -26.69843101501465, "global_step": 402128, "epoch": 4844} {"train_loss": -26.865985870361328, "global_step": 402129, "epoch": 4844} {"train_loss": -26.297574996948242, "global_step": 402130, "epoch": 4844} {"train_loss": -26.07423210144043, "global_step": 402131, "epoch": 4844} {"train_loss": -26.479345321655273, "global_step": 402132, "epoch": 4844} {"train_loss": -26.756620407104492, "global_step": 402133, "epoch": 4844} {"train_loss": -26.457619747483587, "global_step": 402134, "epoch": 4844, "val_loss": 6738428.5} {"train_loss": -25.184091567993164, "global_step": 402135, "epoch": 4845} {"train_loss": -24.95423698425293, "global_step": 402136, "epoch": 4845} {"train_loss": -26.546178817749023, "global_step": 402137, "epoch": 4845} {"train_loss": -24.993494033813477, "global_step": 402138, "epoch": 4845} {"train_loss": -26.238245010375977, "global_step": 402139, "epoch": 4845} {"train_loss": -25.857837677001953, "global_step": 402140, "epoch": 4845} {"train_loss": -26.161579132080078, "global_step": 402141, "epoch": 4845} {"train_loss": -26.396926879882812, "global_step": 402142, "epoch": 4845} {"train_loss": -26.045568466186523, "global_step": 402143, "epoch": 4845} {"train_loss": -26.171710968017578, "global_step": 402144, "epoch": 4845} {"train_loss": -26.144784927368164, "global_step": 402145, "epoch": 4845} {"train_loss": -26.10349464416504, "global_step": 402146, "epoch": 4845} {"train_loss": -26.675092697143555, "global_step": 402147, "epoch": 4845} {"train_loss": -26.371809005737305, "global_step": 402148, "epoch": 4845} {"train_loss": -26.48237419128418, "global_step": 402149, "epoch": 4845} {"train_loss": -25.771488189697266, "global_step": 402150, "epoch": 4845} {"train_loss": -26.269128799438477, "global_step": 402151, "epoch": 4845} {"train_loss": -26.011310577392578, "global_step": 402152, "epoch": 4845} {"train_loss": -26.3503475189209, "global_step": 402153, "epoch": 4845} {"train_loss": -26.517383575439453, "global_step": 402154, "epoch": 4845} {"train_loss": -26.213836669921875, "global_step": 402155, "epoch": 4845} {"train_loss": -25.943822860717773, "global_step": 402156, "epoch": 4845} {"train_loss": -26.75709342956543, "global_step": 402157, "epoch": 4845} {"train_loss": -26.487524032592773, "global_step": 402158, "epoch": 4845} {"train_loss": -26.332204818725586, "global_step": 402159, "epoch": 4845} {"train_loss": -26.449161529541016, "global_step": 402160, "epoch": 4845} {"train_loss": -26.471200942993164, "global_step": 402161, "epoch": 4845} {"train_loss": -26.625818252563477, "global_step": 402162, "epoch": 4845} {"train_loss": -27.082883834838867, "global_step": 402163, "epoch": 4845} {"train_loss": -26.612335205078125, "global_step": 402164, "epoch": 4845} {"train_loss": -26.44721031188965, "global_step": 402165, "epoch": 4845} {"train_loss": -26.237442016601562, "global_step": 402166, "epoch": 4845} {"train_loss": -26.461105346679688, "global_step": 402167, "epoch": 4845} {"train_loss": -26.5269775390625, "global_step": 402168, "epoch": 4845} {"train_loss": -26.61273765563965, "global_step": 402169, "epoch": 4845} {"train_loss": -26.5496826171875, "global_step": 402170, "epoch": 4845} {"train_loss": -26.681272506713867, "global_step": 402171, "epoch": 4845} {"train_loss": -26.656009674072266, "global_step": 402172, "epoch": 4845} {"train_loss": -26.846210479736328, "global_step": 402173, "epoch": 4845} {"train_loss": -26.665414810180664, "global_step": 402174, "epoch": 4845} {"train_loss": -26.635278701782227, "global_step": 402175, "epoch": 4845} {"train_loss": -26.416913986206055, "global_step": 402176, "epoch": 4845} {"train_loss": -26.685949325561523, "global_step": 402177, "epoch": 4845} {"train_loss": -26.955352783203125, "global_step": 402178, "epoch": 4845} {"train_loss": -26.534713745117188, "global_step": 402179, "epoch": 4845} {"train_loss": -26.91389274597168, "global_step": 402180, "epoch": 4845} {"train_loss": -26.623754501342773, "global_step": 402181, "epoch": 4845} {"train_loss": -26.826181411743164, "global_step": 402182, "epoch": 4845} {"train_loss": -26.806974411010742, "global_step": 402183, "epoch": 4845} {"train_loss": -26.756994247436523, "global_step": 402184, "epoch": 4845} {"train_loss": -26.895292282104492, "global_step": 402185, "epoch": 4845} {"train_loss": -26.931371688842773, "global_step": 402186, "epoch": 4845} {"train_loss": -26.787229537963867, "global_step": 402187, "epoch": 4845} {"train_loss": -27.18960952758789, "global_step": 402188, "epoch": 4845} {"train_loss": -26.798908233642578, "global_step": 402189, "epoch": 4845} {"train_loss": -27.001617431640625, "global_step": 402190, "epoch": 4845} {"train_loss": -26.4904727935791, "global_step": 402191, "epoch": 4845} {"train_loss": -26.278120040893555, "global_step": 402192, "epoch": 4845} {"train_loss": -26.21929931640625, "global_step": 402193, "epoch": 4845} {"train_loss": -25.978055953979492, "global_step": 402194, "epoch": 4845} {"train_loss": -26.13026237487793, "global_step": 402195, "epoch": 4845} {"train_loss": -25.8646297454834, "global_step": 402196, "epoch": 4845} {"train_loss": -26.50325584411621, "global_step": 402197, "epoch": 4845} {"train_loss": -26.4574031829834, "global_step": 402198, "epoch": 4845} {"train_loss": -26.559911727905273, "global_step": 402199, "epoch": 4845} {"train_loss": -26.553237915039062, "global_step": 402200, "epoch": 4845} {"train_loss": -26.58854103088379, "global_step": 402201, "epoch": 4845} {"train_loss": -26.63741111755371, "global_step": 402202, "epoch": 4845} {"train_loss": -26.655200958251953, "global_step": 402203, "epoch": 4845} {"train_loss": -26.35273551940918, "global_step": 402204, "epoch": 4845} {"train_loss": -26.753204345703125, "global_step": 402205, "epoch": 4845} {"train_loss": -26.36382484436035, "global_step": 402206, "epoch": 4845} {"train_loss": -26.413244247436523, "global_step": 402207, "epoch": 4845} {"train_loss": -26.768827438354492, "global_step": 402208, "epoch": 4845} {"train_loss": -26.022851943969727, "global_step": 402209, "epoch": 4845} {"train_loss": -26.584745407104492, "global_step": 402210, "epoch": 4845} {"train_loss": -26.58941078186035, "global_step": 402211, "epoch": 4845} {"train_loss": -26.248966217041016, "global_step": 402212, "epoch": 4845} {"train_loss": -26.599578857421875, "global_step": 402213, "epoch": 4845} {"train_loss": -26.59272575378418, "global_step": 402214, "epoch": 4845} {"train_loss": -26.37347412109375, "global_step": 402215, "epoch": 4845} {"train_loss": -26.584177017211914, "global_step": 402216, "epoch": 4845} {"train_loss": -26.43981577402138, "global_step": 402217, "epoch": 4845, "val_loss": 6791810.5} {"train_loss": -26.2609920501709, "global_step": 402218, "epoch": 4846} {"train_loss": -26.53217124938965, "global_step": 402219, "epoch": 4846} {"train_loss": -26.253665924072266, "global_step": 402220, "epoch": 4846} {"train_loss": -26.657794952392578, "global_step": 402221, "epoch": 4846} {"train_loss": -26.383466720581055, "global_step": 402222, "epoch": 4846} {"train_loss": -26.68232536315918, "global_step": 402223, "epoch": 4846} {"train_loss": -26.802515029907227, "global_step": 402224, "epoch": 4846} {"train_loss": -25.973581314086914, "global_step": 402225, "epoch": 4846} {"train_loss": -26.66543960571289, "global_step": 402226, "epoch": 4846} {"train_loss": -26.416196823120117, "global_step": 402227, "epoch": 4846} {"train_loss": -26.44136619567871, "global_step": 402228, "epoch": 4846} {"train_loss": -26.583404541015625, "global_step": 402229, "epoch": 4846} {"train_loss": -26.348846435546875, "global_step": 402230, "epoch": 4846} {"train_loss": -26.738439559936523, "global_step": 402231, "epoch": 4846} {"train_loss": -26.345041275024414, "global_step": 402232, "epoch": 4846} {"train_loss": -26.607166290283203, "global_step": 402233, "epoch": 4846} {"train_loss": -26.586261749267578, "global_step": 402234, "epoch": 4846} {"train_loss": -26.31648063659668, "global_step": 402235, "epoch": 4846} {"train_loss": -26.862157821655273, "global_step": 402236, "epoch": 4846} {"train_loss": -26.70184326171875, "global_step": 402237, "epoch": 4846} {"train_loss": -26.328872680664062, "global_step": 402238, "epoch": 4846} {"train_loss": -26.6903018951416, "global_step": 402239, "epoch": 4846} {"train_loss": -26.85641860961914, "global_step": 402240, "epoch": 4846} {"train_loss": -26.522674560546875, "global_step": 402241, "epoch": 4846} {"train_loss": -26.9051456451416, "global_step": 402242, "epoch": 4846} {"train_loss": -26.623123168945312, "global_step": 402243, "epoch": 4846} {"train_loss": -26.4322452545166, "global_step": 402244, "epoch": 4846} {"train_loss": -26.852645874023438, "global_step": 402245, "epoch": 4846} {"train_loss": -26.4381046295166, "global_step": 402246, "epoch": 4846} {"train_loss": -26.62697410583496, "global_step": 402247, "epoch": 4846} {"train_loss": -26.208343505859375, "global_step": 402248, "epoch": 4846} {"train_loss": -26.826873779296875, "global_step": 402249, "epoch": 4846} {"train_loss": -26.539026260375977, "global_step": 402250, "epoch": 4846} {"train_loss": -26.597814559936523, "global_step": 402251, "epoch": 4846} {"train_loss": -26.809741973876953, "global_step": 402252, "epoch": 4846} {"train_loss": -26.439294815063477, "global_step": 402253, "epoch": 4846} {"train_loss": -26.77495765686035, "global_step": 402254, "epoch": 4846} {"train_loss": -26.83609962463379, "global_step": 402255, "epoch": 4846} {"train_loss": -26.999134063720703, "global_step": 402256, "epoch": 4846} {"train_loss": -27.053455352783203, "global_step": 402257, "epoch": 4846} {"train_loss": -26.689884185791016, "global_step": 402258, "epoch": 4846} {"train_loss": -26.743574142456055, "global_step": 402259, "epoch": 4846} {"train_loss": -26.95552635192871, "global_step": 402260, "epoch": 4846} {"train_loss": -26.766651153564453, "global_step": 402261, "epoch": 4846} {"train_loss": -26.689849853515625, "global_step": 402262, "epoch": 4846} {"train_loss": -26.95135498046875, "global_step": 402263, "epoch": 4846} {"train_loss": -26.8624210357666, "global_step": 402264, "epoch": 4846} {"train_loss": -26.685861587524414, "global_step": 402265, "epoch": 4846} {"train_loss": -26.649755477905273, "global_step": 402266, "epoch": 4846} {"train_loss": -26.858671188354492, "global_step": 402267, "epoch": 4846} {"train_loss": -27.075551986694336, "global_step": 402268, "epoch": 4846} {"train_loss": -27.010452270507812, "global_step": 402269, "epoch": 4846} {"train_loss": -26.765722274780273, "global_step": 402270, "epoch": 4846} {"train_loss": -26.566650390625, "global_step": 402271, "epoch": 4846} {"train_loss": -26.336593627929688, "global_step": 402272, "epoch": 4846} {"train_loss": -26.50018310546875, "global_step": 402273, "epoch": 4846} {"train_loss": -26.49173927307129, "global_step": 402274, "epoch": 4846} {"train_loss": -25.612173080444336, "global_step": 402275, "epoch": 4846} {"train_loss": -26.55974769592285, "global_step": 402276, "epoch": 4846} {"train_loss": -26.86128807067871, "global_step": 402277, "epoch": 4846} {"train_loss": -26.581701278686523, "global_step": 402278, "epoch": 4846} {"train_loss": -26.2762451171875, "global_step": 402279, "epoch": 4846} {"train_loss": -26.720340728759766, "global_step": 402280, "epoch": 4846} {"train_loss": -26.827499389648438, "global_step": 402281, "epoch": 4846} {"train_loss": -26.689056396484375, "global_step": 402282, "epoch": 4846} {"train_loss": -26.4842586517334, "global_step": 402283, "epoch": 4846} {"train_loss": -26.7393741607666, "global_step": 402284, "epoch": 4846} {"train_loss": -27.05396842956543, "global_step": 402285, "epoch": 4846} {"train_loss": -26.900136947631836, "global_step": 402286, "epoch": 4846} {"train_loss": -26.876129150390625, "global_step": 402287, "epoch": 4846} {"train_loss": -27.026525497436523, "global_step": 402288, "epoch": 4846} {"train_loss": -27.043582916259766, "global_step": 402289, "epoch": 4846} {"train_loss": -26.566495895385742, "global_step": 402290, "epoch": 4846} {"train_loss": -26.69424819946289, "global_step": 402291, "epoch": 4846} {"train_loss": -26.35637855529785, "global_step": 402292, "epoch": 4846} {"train_loss": -26.37708854675293, "global_step": 402293, "epoch": 4846} {"train_loss": -26.679723739624023, "global_step": 402294, "epoch": 4846} {"train_loss": -26.94217872619629, "global_step": 402295, "epoch": 4846} {"train_loss": -26.64973258972168, "global_step": 402296, "epoch": 4846} {"train_loss": -26.543859481811523, "global_step": 402297, "epoch": 4846} {"train_loss": -26.65772819519043, "global_step": 402298, "epoch": 4846} {"train_loss": -26.973987579345703, "global_step": 402299, "epoch": 4846} {"train_loss": -26.6429649720709, "global_step": 402300, "epoch": 4846, "val_loss": 6768773.5} {"train_loss": -26.279388427734375, "global_step": 402301, "epoch": 4847} {"train_loss": -25.152708053588867, "global_step": 402302, "epoch": 4847} {"train_loss": -26.165369033813477, "global_step": 402303, "epoch": 4847} {"train_loss": -26.558027267456055, "global_step": 402304, "epoch": 4847} {"train_loss": -26.551410675048828, "global_step": 402305, "epoch": 4847} {"train_loss": -26.306060791015625, "global_step": 402306, "epoch": 4847} {"train_loss": -25.612653732299805, "global_step": 402307, "epoch": 4847} {"train_loss": -25.74712562561035, "global_step": 402308, "epoch": 4847} {"train_loss": -25.9685115814209, "global_step": 402309, "epoch": 4847} {"train_loss": -26.3443603515625, "global_step": 402310, "epoch": 4847} {"train_loss": -25.869245529174805, "global_step": 402311, "epoch": 4847} {"train_loss": -25.814146041870117, "global_step": 402312, "epoch": 4847} {"train_loss": -26.232473373413086, "global_step": 402313, "epoch": 4847} {"train_loss": -26.13201332092285, "global_step": 402314, "epoch": 4847} {"train_loss": -26.329425811767578, "global_step": 402315, "epoch": 4847} {"train_loss": -26.693571090698242, "global_step": 402316, "epoch": 4847} {"train_loss": -26.25367546081543, "global_step": 402317, "epoch": 4847} {"train_loss": -26.245389938354492, "global_step": 402318, "epoch": 4847} {"train_loss": -26.152496337890625, "global_step": 402319, "epoch": 4847} {"train_loss": -26.476043701171875, "global_step": 402320, "epoch": 4847} {"train_loss": -26.491247177124023, "global_step": 402321, "epoch": 4847} {"train_loss": -26.540191650390625, "global_step": 402322, "epoch": 4847} {"train_loss": -26.57441520690918, "global_step": 402323, "epoch": 4847} {"train_loss": -26.409290313720703, "global_step": 402324, "epoch": 4847} {"train_loss": -26.39351463317871, "global_step": 402325, "epoch": 4847} {"train_loss": -26.495298385620117, "global_step": 402326, "epoch": 4847} {"train_loss": -26.546829223632812, "global_step": 402327, "epoch": 4847} {"train_loss": -26.90681266784668, "global_step": 402328, "epoch": 4847} {"train_loss": -26.2901554107666, "global_step": 402329, "epoch": 4847} {"train_loss": -26.513965606689453, "global_step": 402330, "epoch": 4847} {"train_loss": -26.588083267211914, "global_step": 402331, "epoch": 4847} {"train_loss": -26.6075496673584, "global_step": 402332, "epoch": 4847} {"train_loss": -26.67046546936035, "global_step": 402333, "epoch": 4847} {"train_loss": -26.8304443359375, "global_step": 402334, "epoch": 4847} {"train_loss": -26.6440486907959, "global_step": 402335, "epoch": 4847} {"train_loss": -26.5942440032959, "global_step": 402336, "epoch": 4847} {"train_loss": -26.439687728881836, "global_step": 402337, "epoch": 4847} {"train_loss": -26.456974029541016, "global_step": 402338, "epoch": 4847} {"train_loss": -26.5786190032959, "global_step": 402339, "epoch": 4847} {"train_loss": -26.761539459228516, "global_step": 402340, "epoch": 4847} {"train_loss": -26.809335708618164, "global_step": 402341, "epoch": 4847} {"train_loss": -26.834375381469727, "global_step": 402342, "epoch": 4847} {"train_loss": -26.946935653686523, "global_step": 402343, "epoch": 4847} {"train_loss": -26.694461822509766, "global_step": 402344, "epoch": 4847} {"train_loss": -26.31092643737793, "global_step": 402345, "epoch": 4847} {"train_loss": -26.968469619750977, "global_step": 402346, "epoch": 4847} {"train_loss": -26.334775924682617, "global_step": 402347, "epoch": 4847} {"train_loss": -27.115509033203125, "global_step": 402348, "epoch": 4847} {"train_loss": -25.913854598999023, "global_step": 402349, "epoch": 4847} {"train_loss": -26.192642211914062, "global_step": 402350, "epoch": 4847} {"train_loss": -26.37457275390625, "global_step": 402351, "epoch": 4847} {"train_loss": -26.5736083984375, "global_step": 402352, "epoch": 4847} {"train_loss": -26.384241104125977, "global_step": 402353, "epoch": 4847} {"train_loss": -26.217395782470703, "global_step": 402354, "epoch": 4847} {"train_loss": -26.2615966796875, "global_step": 402355, "epoch": 4847} {"train_loss": -26.676361083984375, "global_step": 402356, "epoch": 4847} {"train_loss": -26.511640548706055, "global_step": 402357, "epoch": 4847} {"train_loss": -26.310956954956055, "global_step": 402358, "epoch": 4847} {"train_loss": -26.65403175354004, "global_step": 402359, "epoch": 4847} {"train_loss": -26.56320571899414, "global_step": 402360, "epoch": 4847} {"train_loss": -26.644983291625977, "global_step": 402361, "epoch": 4847} {"train_loss": -26.15616798400879, "global_step": 402362, "epoch": 4847} {"train_loss": -26.787155151367188, "global_step": 402363, "epoch": 4847} {"train_loss": -26.669973373413086, "global_step": 402364, "epoch": 4847} {"train_loss": -26.460561752319336, "global_step": 402365, "epoch": 4847} {"train_loss": -26.849185943603516, "global_step": 402366, "epoch": 4847} {"train_loss": -26.500579833984375, "global_step": 402367, "epoch": 4847} {"train_loss": -26.618255615234375, "global_step": 402368, "epoch": 4847} {"train_loss": -26.669193267822266, "global_step": 402369, "epoch": 4847} {"train_loss": -26.658926010131836, "global_step": 402370, "epoch": 4847} {"train_loss": -26.35932731628418, "global_step": 402371, "epoch": 4847} {"train_loss": -26.421985626220703, "global_step": 402372, "epoch": 4847} {"train_loss": -26.615530014038086, "global_step": 402373, "epoch": 4847} {"train_loss": -26.38299560546875, "global_step": 402374, "epoch": 4847} {"train_loss": -26.342451095581055, "global_step": 402375, "epoch": 4847} {"train_loss": -27.0665340423584, "global_step": 402376, "epoch": 4847} {"train_loss": -26.8396053314209, "global_step": 402377, "epoch": 4847} {"train_loss": -26.574237823486328, "global_step": 402378, "epoch": 4847} {"train_loss": -26.490758895874023, "global_step": 402379, "epoch": 4847} {"train_loss": -26.8515682220459, "global_step": 402380, "epoch": 4847} {"train_loss": -26.752899169921875, "global_step": 402381, "epoch": 4847} {"train_loss": -26.827423095703125, "global_step": 402382, "epoch": 4847} {"train_loss": -26.47950039139713, "global_step": 402383, "epoch": 4847, "val_loss": 6733823.5} {"train_loss": -27.01263999938965, "global_step": 402384, "epoch": 4848} {"train_loss": -26.805561065673828, "global_step": 402385, "epoch": 4848} {"train_loss": -26.770605087280273, "global_step": 402386, "epoch": 4848} {"train_loss": -26.6308650970459, "global_step": 402387, "epoch": 4848} {"train_loss": -26.234777450561523, "global_step": 402388, "epoch": 4848} {"train_loss": -26.531631469726562, "global_step": 402389, "epoch": 4848} {"train_loss": -26.88081169128418, "global_step": 402390, "epoch": 4848} {"train_loss": -26.76045036315918, "global_step": 402391, "epoch": 4848} {"train_loss": -26.40220069885254, "global_step": 402392, "epoch": 4848} {"train_loss": -26.631845474243164, "global_step": 402393, "epoch": 4848} {"train_loss": -26.2791805267334, "global_step": 402394, "epoch": 4848} {"train_loss": -26.8868408203125, "global_step": 402395, "epoch": 4848} {"train_loss": -26.776723861694336, "global_step": 402396, "epoch": 4848} {"train_loss": -26.97639274597168, "global_step": 402397, "epoch": 4848} {"train_loss": -26.73346519470215, "global_step": 402398, "epoch": 4848} {"train_loss": -26.698226928710938, "global_step": 402399, "epoch": 4848} {"train_loss": -26.812305450439453, "global_step": 402400, "epoch": 4848} {"train_loss": -26.428924560546875, "global_step": 402401, "epoch": 4848} {"train_loss": -26.156042098999023, "global_step": 402402, "epoch": 4848} {"train_loss": -25.882017135620117, "global_step": 402403, "epoch": 4848} {"train_loss": -26.365514755249023, "global_step": 402404, "epoch": 4848} {"train_loss": -26.74593162536621, "global_step": 402405, "epoch": 4848} {"train_loss": -26.685897827148438, "global_step": 402406, "epoch": 4848} {"train_loss": -26.419851303100586, "global_step": 402407, "epoch": 4848} {"train_loss": -27.06354331970215, "global_step": 402408, "epoch": 4848} {"train_loss": -26.336767196655273, "global_step": 402409, "epoch": 4848} {"train_loss": -26.524890899658203, "global_step": 402410, "epoch": 4848} {"train_loss": -26.294525146484375, "global_step": 402411, "epoch": 4848} {"train_loss": -26.54532241821289, "global_step": 402412, "epoch": 4848} {"train_loss": -26.769174575805664, "global_step": 402413, "epoch": 4848} {"train_loss": -26.60418701171875, "global_step": 402414, "epoch": 4848} {"train_loss": -26.489551544189453, "global_step": 402415, "epoch": 4848} {"train_loss": -26.498205184936523, "global_step": 402416, "epoch": 4848} {"train_loss": -26.427576065063477, "global_step": 402417, "epoch": 4848} {"train_loss": -26.265127182006836, "global_step": 402418, "epoch": 4848} {"train_loss": -26.436132431030273, "global_step": 402419, "epoch": 4848} {"train_loss": -26.835901260375977, "global_step": 402420, "epoch": 4848} {"train_loss": -26.510190963745117, "global_step": 402421, "epoch": 4848} {"train_loss": -26.779163360595703, "global_step": 402422, "epoch": 4848} {"train_loss": -26.422286987304688, "global_step": 402423, "epoch": 4848} {"train_loss": -26.627212524414062, "global_step": 402424, "epoch": 4848} {"train_loss": -26.722360610961914, "global_step": 402425, "epoch": 4848} {"train_loss": -26.987751007080078, "global_step": 402426, "epoch": 4848} {"train_loss": -26.76191520690918, "global_step": 402427, "epoch": 4848} {"train_loss": -26.921466827392578, "global_step": 402428, "epoch": 4848} {"train_loss": -26.520614624023438, "global_step": 402429, "epoch": 4848} {"train_loss": -26.49468421936035, "global_step": 402430, "epoch": 4848} {"train_loss": -26.79545021057129, "global_step": 402431, "epoch": 4848} {"train_loss": -26.77374267578125, "global_step": 402432, "epoch": 4848} {"train_loss": -26.833337783813477, "global_step": 402433, "epoch": 4848} {"train_loss": -26.886611938476562, "global_step": 402434, "epoch": 4848} {"train_loss": -26.580636978149414, "global_step": 402435, "epoch": 4848} {"train_loss": -26.872602462768555, "global_step": 402436, "epoch": 4848} {"train_loss": -26.821706771850586, "global_step": 402437, "epoch": 4848} {"train_loss": -26.808324813842773, "global_step": 402438, "epoch": 4848} {"train_loss": -26.644855499267578, "global_step": 402439, "epoch": 4848} {"train_loss": -26.604248046875, "global_step": 402440, "epoch": 4848} {"train_loss": -26.473697662353516, "global_step": 402441, "epoch": 4848} {"train_loss": -26.62403678894043, "global_step": 402442, "epoch": 4848} {"train_loss": -26.144882202148438, "global_step": 402443, "epoch": 4848} {"train_loss": -25.576997756958008, "global_step": 402444, "epoch": 4848} {"train_loss": -25.70267677307129, "global_step": 402445, "epoch": 4848} {"train_loss": -26.30975341796875, "global_step": 402446, "epoch": 4848} {"train_loss": -26.44268226623535, "global_step": 402447, "epoch": 4848} {"train_loss": -26.474210739135742, "global_step": 402448, "epoch": 4848} {"train_loss": -26.1535587310791, "global_step": 402449, "epoch": 4848} {"train_loss": -26.70515251159668, "global_step": 402450, "epoch": 4848} {"train_loss": -26.39385414123535, "global_step": 402451, "epoch": 4848} {"train_loss": -26.569992065429688, "global_step": 402452, "epoch": 4848} {"train_loss": -26.6953067779541, "global_step": 402453, "epoch": 4848} {"train_loss": -26.575510025024414, "global_step": 402454, "epoch": 4848} {"train_loss": -26.75471305847168, "global_step": 402455, "epoch": 4848} {"train_loss": -26.619626998901367, "global_step": 402456, "epoch": 4848} {"train_loss": -26.682727813720703, "global_step": 402457, "epoch": 4848} {"train_loss": -27.273670196533203, "global_step": 402458, "epoch": 4848} {"train_loss": -26.7846622467041, "global_step": 402459, "epoch": 4848} {"train_loss": -26.557340621948242, "global_step": 402460, "epoch": 4848} {"train_loss": -26.62879753112793, "global_step": 402461, "epoch": 4848} {"train_loss": -26.91542625427246, "global_step": 402462, "epoch": 4848} {"train_loss": -26.695327758789062, "global_step": 402463, "epoch": 4848} {"train_loss": -26.143905639648438, "global_step": 402464, "epoch": 4848} {"train_loss": -26.41669273376465, "global_step": 402465, "epoch": 4848} {"train_loss": -26.593041155711713, "global_step": 402466, "epoch": 4848, "val_loss": 6727742.0} {"train_loss": -24.91768455505371, "global_step": 402467, "epoch": 4849} {"train_loss": -22.6929988861084, "global_step": 402468, "epoch": 4849} {"train_loss": -25.372732162475586, "global_step": 402469, "epoch": 4849} {"train_loss": -24.94375991821289, "global_step": 402470, "epoch": 4849} {"train_loss": -25.719043731689453, "global_step": 402471, "epoch": 4849} {"train_loss": -25.0006046295166, "global_step": 402472, "epoch": 4849} {"train_loss": -25.8945369720459, "global_step": 402473, "epoch": 4849} {"train_loss": -25.42990493774414, "global_step": 402474, "epoch": 4849} {"train_loss": -25.580032348632812, "global_step": 402475, "epoch": 4849} {"train_loss": -25.27425765991211, "global_step": 402476, "epoch": 4849} {"train_loss": -25.957183837890625, "global_step": 402477, "epoch": 4849} {"train_loss": -25.714094161987305, "global_step": 402478, "epoch": 4849} {"train_loss": -25.427127838134766, "global_step": 402479, "epoch": 4849} {"train_loss": -25.55918312072754, "global_step": 402480, "epoch": 4849} {"train_loss": -25.38363265991211, "global_step": 402481, "epoch": 4849} {"train_loss": -25.846338272094727, "global_step": 402482, "epoch": 4849} {"train_loss": -26.114730834960938, "global_step": 402483, "epoch": 4849} {"train_loss": -25.959386825561523, "global_step": 402484, "epoch": 4849} {"train_loss": -26.18287467956543, "global_step": 402485, "epoch": 4849} {"train_loss": -25.824438095092773, "global_step": 402486, "epoch": 4849} {"train_loss": -26.05030632019043, "global_step": 402487, "epoch": 4849} {"train_loss": -26.27363395690918, "global_step": 402488, "epoch": 4849} {"train_loss": -26.041034698486328, "global_step": 402489, "epoch": 4849} {"train_loss": -25.904203414916992, "global_step": 402490, "epoch": 4849} {"train_loss": -26.337888717651367, "global_step": 402491, "epoch": 4849} {"train_loss": -26.133380889892578, "global_step": 402492, "epoch": 4849} {"train_loss": -26.418933868408203, "global_step": 402493, "epoch": 4849} {"train_loss": -26.20082664489746, "global_step": 402494, "epoch": 4849} {"train_loss": -26.633270263671875, "global_step": 402495, "epoch": 4849} {"train_loss": -26.24897575378418, "global_step": 402496, "epoch": 4849} {"train_loss": -26.54412841796875, "global_step": 402497, "epoch": 4849} {"train_loss": -26.563018798828125, "global_step": 402498, "epoch": 4849} {"train_loss": -26.396060943603516, "global_step": 402499, "epoch": 4849} {"train_loss": -26.74762535095215, "global_step": 402500, "epoch": 4849} {"train_loss": -26.438983917236328, "global_step": 402501, "epoch": 4849} {"train_loss": -26.739171981811523, "global_step": 402502, "epoch": 4849} {"train_loss": -26.63325309753418, "global_step": 402503, "epoch": 4849} {"train_loss": -26.345205307006836, "global_step": 402504, "epoch": 4849} {"train_loss": -26.352548599243164, "global_step": 402505, "epoch": 4849} {"train_loss": -26.688674926757812, "global_step": 402506, "epoch": 4849} {"train_loss": -26.760168075561523, "global_step": 402507, "epoch": 4849} {"train_loss": -26.4525089263916, "global_step": 402508, "epoch": 4849} {"train_loss": -26.570587158203125, "global_step": 402509, "epoch": 4849} {"train_loss": -26.74444007873535, "global_step": 402510, "epoch": 4849} {"train_loss": -26.723346710205078, "global_step": 402511, "epoch": 4849} {"train_loss": -26.495519638061523, "global_step": 402512, "epoch": 4849} {"train_loss": -26.976709365844727, "global_step": 402513, "epoch": 4849} {"train_loss": -26.74896812438965, "global_step": 402514, "epoch": 4849} {"train_loss": -26.92670249938965, "global_step": 402515, "epoch": 4849} {"train_loss": -26.941669464111328, "global_step": 402516, "epoch": 4849} {"train_loss": -26.957382202148438, "global_step": 402517, "epoch": 4849} {"train_loss": -26.805627822875977, "global_step": 402518, "epoch": 4849} {"train_loss": -26.89214515686035, "global_step": 402519, "epoch": 4849} {"train_loss": -26.85369300842285, "global_step": 402520, "epoch": 4849} {"train_loss": -27.045820236206055, "global_step": 402521, "epoch": 4849} {"train_loss": -27.008710861206055, "global_step": 402522, "epoch": 4849} {"train_loss": -26.754003524780273, "global_step": 402523, "epoch": 4849} {"train_loss": -26.686254501342773, "global_step": 402524, "epoch": 4849} {"train_loss": -26.687707901000977, "global_step": 402525, "epoch": 4849} {"train_loss": -26.779861450195312, "global_step": 402526, "epoch": 4849} {"train_loss": -26.803863525390625, "global_step": 402527, "epoch": 4849} {"train_loss": -26.75494384765625, "global_step": 402528, "epoch": 4849} {"train_loss": -26.795169830322266, "global_step": 402529, "epoch": 4849} {"train_loss": -27.245685577392578, "global_step": 402530, "epoch": 4849} {"train_loss": -26.876882553100586, "global_step": 402531, "epoch": 4849} {"train_loss": -26.84038734436035, "global_step": 402532, "epoch": 4849} {"train_loss": -26.647327423095703, "global_step": 402533, "epoch": 4849} {"train_loss": -26.672698974609375, "global_step": 402534, "epoch": 4849} {"train_loss": -26.903900146484375, "global_step": 402535, "epoch": 4849} {"train_loss": -26.698694229125977, "global_step": 402536, "epoch": 4849} {"train_loss": -26.663984298706055, "global_step": 402537, "epoch": 4849} {"train_loss": -26.616907119750977, "global_step": 402538, "epoch": 4849} {"train_loss": -26.354093551635742, "global_step": 402539, "epoch": 4849} {"train_loss": -25.893354415893555, "global_step": 402540, "epoch": 4849} {"train_loss": -25.68683433532715, "global_step": 402541, "epoch": 4849} {"train_loss": -25.45819091796875, "global_step": 402542, "epoch": 4849} {"train_loss": -25.514705657958984, "global_step": 402543, "epoch": 4849} {"train_loss": -25.548816680908203, "global_step": 402544, "epoch": 4849} {"train_loss": -26.767004013061523, "global_step": 402545, "epoch": 4849} {"train_loss": -26.31072998046875, "global_step": 402546, "epoch": 4849} {"train_loss": -26.0174617767334, "global_step": 402547, "epoch": 4849} {"train_loss": -25.830350875854492, "global_step": 402548, "epoch": 4849} {"train_loss": -26.250284401767225, "global_step": 402549, "epoch": 4849, "val_loss": 6764444.0} {"train_loss": -24.969364166259766, "global_step": 402550, "epoch": 4850} {"train_loss": -25.791345596313477, "global_step": 402551, "epoch": 4850} {"train_loss": -25.680952072143555, "global_step": 402552, "epoch": 4850} {"train_loss": -24.93750762939453, "global_step": 402553, "epoch": 4850} {"train_loss": -25.273542404174805, "global_step": 402554, "epoch": 4850} {"train_loss": -25.314130783081055, "global_step": 402555, "epoch": 4850} {"train_loss": -25.35677146911621, "global_step": 402556, "epoch": 4850} {"train_loss": -25.06671142578125, "global_step": 402557, "epoch": 4850} {"train_loss": -25.543914794921875, "global_step": 402558, "epoch": 4850} {"train_loss": -26.168195724487305, "global_step": 402559, "epoch": 4850} {"train_loss": -25.555606842041016, "global_step": 402560, "epoch": 4850} {"train_loss": -25.627456665039062, "global_step": 402561, "epoch": 4850} {"train_loss": -25.9084529876709, "global_step": 402562, "epoch": 4850} {"train_loss": -25.75935935974121, "global_step": 402563, "epoch": 4850} {"train_loss": -25.97771644592285, "global_step": 402564, "epoch": 4850} {"train_loss": -25.84848403930664, "global_step": 402565, "epoch": 4850} {"train_loss": -26.056074142456055, "global_step": 402566, "epoch": 4850} {"train_loss": -26.014707565307617, "global_step": 402567, "epoch": 4850} {"train_loss": -25.895923614501953, "global_step": 402568, "epoch": 4850} {"train_loss": -25.929107666015625, "global_step": 402569, "epoch": 4850} {"train_loss": -25.756452560424805, "global_step": 402570, "epoch": 4850} {"train_loss": -26.069257736206055, "global_step": 402571, "epoch": 4850} {"train_loss": -26.24871826171875, "global_step": 402572, "epoch": 4850} {"train_loss": -26.0081844329834, "global_step": 402573, "epoch": 4850} {"train_loss": -26.22063636779785, "global_step": 402574, "epoch": 4850} {"train_loss": -26.568328857421875, "global_step": 402575, "epoch": 4850} {"train_loss": -25.92885398864746, "global_step": 402576, "epoch": 4850} {"train_loss": -25.9669246673584, "global_step": 402577, "epoch": 4850} {"train_loss": -26.492694854736328, "global_step": 402578, "epoch": 4850} {"train_loss": -26.502643585205078, "global_step": 402579, "epoch": 4850} {"train_loss": -26.409290313720703, "global_step": 402580, "epoch": 4850} {"train_loss": -26.475610733032227, "global_step": 402581, "epoch": 4850} {"train_loss": -26.577564239501953, "global_step": 402582, "epoch": 4850} {"train_loss": -26.541168212890625, "global_step": 402583, "epoch": 4850} {"train_loss": -26.530792236328125, "global_step": 402584, "epoch": 4850} {"train_loss": -26.456777572631836, "global_step": 402585, "epoch": 4850} {"train_loss": -26.516681671142578, "global_step": 402586, "epoch": 4850} {"train_loss": -26.626413345336914, "global_step": 402587, "epoch": 4850} {"train_loss": -26.411970138549805, "global_step": 402588, "epoch": 4850} {"train_loss": -26.183752059936523, "global_step": 402589, "epoch": 4850} {"train_loss": -26.636310577392578, "global_step": 402590, "epoch": 4850} {"train_loss": -26.803028106689453, "global_step": 402591, "epoch": 4850} {"train_loss": -26.632511138916016, "global_step": 402592, "epoch": 4850} {"train_loss": -26.696430206298828, "global_step": 402593, "epoch": 4850} {"train_loss": -26.85308265686035, "global_step": 402594, "epoch": 4850} {"train_loss": -26.817047119140625, "global_step": 402595, "epoch": 4850} {"train_loss": -26.686969757080078, "global_step": 402596, "epoch": 4850} {"train_loss": -26.772504806518555, "global_step": 402597, "epoch": 4850} {"train_loss": -26.9091739654541, "global_step": 402598, "epoch": 4850} {"train_loss": -26.148466110229492, "global_step": 402599, "epoch": 4850} {"train_loss": -26.665374755859375, "global_step": 402600, "epoch": 4850} {"train_loss": -26.781986236572266, "global_step": 402601, "epoch": 4850} {"train_loss": -26.637561798095703, "global_step": 402602, "epoch": 4850} {"train_loss": -26.50751304626465, "global_step": 402603, "epoch": 4850} {"train_loss": -26.16790199279785, "global_step": 402604, "epoch": 4850} {"train_loss": -26.828611373901367, "global_step": 402605, "epoch": 4850} {"train_loss": -26.729053497314453, "global_step": 402606, "epoch": 4850} {"train_loss": -26.67671012878418, "global_step": 402607, "epoch": 4850} {"train_loss": -26.4814395904541, "global_step": 402608, "epoch": 4850} {"train_loss": -26.30165672302246, "global_step": 402609, "epoch": 4850} {"train_loss": -26.813257217407227, "global_step": 402610, "epoch": 4850} {"train_loss": -26.770477294921875, "global_step": 402611, "epoch": 4850} {"train_loss": -26.559415817260742, "global_step": 402612, "epoch": 4850} {"train_loss": -26.84370231628418, "global_step": 402613, "epoch": 4850} {"train_loss": -26.714513778686523, "global_step": 402614, "epoch": 4850} {"train_loss": -26.772186279296875, "global_step": 402615, "epoch": 4850} {"train_loss": -26.772085189819336, "global_step": 402616, "epoch": 4850} {"train_loss": -26.85272789001465, "global_step": 402617, "epoch": 4850} {"train_loss": -26.985248565673828, "global_step": 402618, "epoch": 4850} {"train_loss": -26.92022705078125, "global_step": 402619, "epoch": 4850} {"train_loss": -26.401050567626953, "global_step": 402620, "epoch": 4850} {"train_loss": -26.623693466186523, "global_step": 402621, "epoch": 4850} {"train_loss": -27.171518325805664, "global_step": 402622, "epoch": 4850} {"train_loss": -26.697004318237305, "global_step": 402623, "epoch": 4850} {"train_loss": -26.4875545501709, "global_step": 402624, "epoch": 4850} {"train_loss": -26.66595458984375, "global_step": 402625, "epoch": 4850} {"train_loss": -26.85304069519043, "global_step": 402626, "epoch": 4850} {"train_loss": -27.1807918548584, "global_step": 402627, "epoch": 4850} {"train_loss": -26.7998046875, "global_step": 402628, "epoch": 4850} {"train_loss": -27.05671501159668, "global_step": 402629, "epoch": 4850} {"train_loss": -26.9066104888916, "global_step": 402630, "epoch": 4850} {"train_loss": -27.05222511291504, "global_step": 402631, "epoch": 4850} {"train_loss": -26.38308947919363, "global_step": 402632, "epoch": 4850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 6815270.5} {"train_loss": -26.0388126373291, "global_step": 402633, "epoch": 4851} {"train_loss": -26.047077178955078, "global_step": 402634, "epoch": 4851} {"train_loss": -26.0816650390625, "global_step": 402635, "epoch": 4851} {"train_loss": -26.525501251220703, "global_step": 402636, "epoch": 4851} {"train_loss": -26.345861434936523, "global_step": 402637, "epoch": 4851} {"train_loss": -26.231678009033203, "global_step": 402638, "epoch": 4851} {"train_loss": -26.141775131225586, "global_step": 402639, "epoch": 4851} {"train_loss": -26.318090438842773, "global_step": 402640, "epoch": 4851} {"train_loss": -26.30989646911621, "global_step": 402641, "epoch": 4851} {"train_loss": -26.27534294128418, "global_step": 402642, "epoch": 4851} {"train_loss": -26.538740158081055, "global_step": 402643, "epoch": 4851} {"train_loss": -26.490203857421875, "global_step": 402644, "epoch": 4851} {"train_loss": -26.36170768737793, "global_step": 402645, "epoch": 4851} {"train_loss": -26.67946434020996, "global_step": 402646, "epoch": 4851} {"train_loss": -26.697498321533203, "global_step": 402647, "epoch": 4851} {"train_loss": -26.526031494140625, "global_step": 402648, "epoch": 4851} {"train_loss": -26.349451065063477, "global_step": 402649, "epoch": 4851} {"train_loss": -26.644712448120117, "global_step": 402650, "epoch": 4851} {"train_loss": -26.65791893005371, "global_step": 402651, "epoch": 4851} {"train_loss": -26.623388290405273, "global_step": 402652, "epoch": 4851} {"train_loss": -26.655866622924805, "global_step": 402653, "epoch": 4851} {"train_loss": -26.555173873901367, "global_step": 402654, "epoch": 4851} {"train_loss": -26.61536979675293, "global_step": 402655, "epoch": 4851} {"train_loss": -26.587875366210938, "global_step": 402656, "epoch": 4851} {"train_loss": -27.059736251831055, "global_step": 402657, "epoch": 4851} {"train_loss": -26.727680206298828, "global_step": 402658, "epoch": 4851} {"train_loss": -27.19758415222168, "global_step": 402659, "epoch": 4851} {"train_loss": -26.716522216796875, "global_step": 402660, "epoch": 4851} {"train_loss": -26.552921295166016, "global_step": 402661, "epoch": 4851} {"train_loss": -26.761693954467773, "global_step": 402662, "epoch": 4851} {"train_loss": -26.74738121032715, "global_step": 402663, "epoch": 4851} {"train_loss": -26.595624923706055, "global_step": 402664, "epoch": 4851} {"train_loss": -26.3216495513916, "global_step": 402665, "epoch": 4851} {"train_loss": -26.825260162353516, "global_step": 402666, "epoch": 4851} {"train_loss": -26.890411376953125, "global_step": 402667, "epoch": 4851} {"train_loss": -26.77142906188965, "global_step": 402668, "epoch": 4851} {"train_loss": -26.66383171081543, "global_step": 402669, "epoch": 4851} {"train_loss": -26.64556312561035, "global_step": 402670, "epoch": 4851} {"train_loss": -26.689472198486328, "global_step": 402671, "epoch": 4851} {"train_loss": -26.57256507873535, "global_step": 402672, "epoch": 4851} {"train_loss": -26.37176513671875, "global_step": 402673, "epoch": 4851} {"train_loss": -26.628644943237305, "global_step": 402674, "epoch": 4851} {"train_loss": -26.806171417236328, "global_step": 402675, "epoch": 4851} {"train_loss": -26.906482696533203, "global_step": 402676, "epoch": 4851} {"train_loss": -26.843341827392578, "global_step": 402677, "epoch": 4851} {"train_loss": -26.7647705078125, "global_step": 402678, "epoch": 4851} {"train_loss": -26.563344955444336, "global_step": 402679, "epoch": 4851} {"train_loss": -26.48140525817871, "global_step": 402680, "epoch": 4851} {"train_loss": -26.827463150024414, "global_step": 402681, "epoch": 4851} {"train_loss": -26.755695343017578, "global_step": 402682, "epoch": 4851} {"train_loss": -26.64691734313965, "global_step": 402683, "epoch": 4851} {"train_loss": -26.653406143188477, "global_step": 402684, "epoch": 4851} {"train_loss": -26.13862419128418, "global_step": 402685, "epoch": 4851} {"train_loss": -26.75672721862793, "global_step": 402686, "epoch": 4851} {"train_loss": -26.3869686126709, "global_step": 402687, "epoch": 4851} {"train_loss": -26.366220474243164, "global_step": 402688, "epoch": 4851} {"train_loss": -26.590972900390625, "global_step": 402689, "epoch": 4851} {"train_loss": -26.82356071472168, "global_step": 402690, "epoch": 4851} {"train_loss": -26.783308029174805, "global_step": 402691, "epoch": 4851} {"train_loss": -26.924848556518555, "global_step": 402692, "epoch": 4851} {"train_loss": -26.963031768798828, "global_step": 402693, "epoch": 4851} {"train_loss": -26.4958438873291, "global_step": 402694, "epoch": 4851} {"train_loss": -27.02430534362793, "global_step": 402695, "epoch": 4851} {"train_loss": -26.875091552734375, "global_step": 402696, "epoch": 4851} {"train_loss": -26.807477951049805, "global_step": 402697, "epoch": 4851} {"train_loss": -26.818450927734375, "global_step": 402698, "epoch": 4851} {"train_loss": -27.06709098815918, "global_step": 402699, "epoch": 4851} {"train_loss": -26.681304931640625, "global_step": 402700, "epoch": 4851} {"train_loss": -26.909454345703125, "global_step": 402701, "epoch": 4851} {"train_loss": -26.7904109954834, "global_step": 402702, "epoch": 4851} {"train_loss": -26.82643699645996, "global_step": 402703, "epoch": 4851} {"train_loss": -26.609683990478516, "global_step": 402704, "epoch": 4851} {"train_loss": -27.278112411499023, "global_step": 402705, "epoch": 4851} {"train_loss": -26.879117965698242, "global_step": 402706, "epoch": 4851} {"train_loss": -26.725427627563477, "global_step": 402707, "epoch": 4851} {"train_loss": -26.9332218170166, "global_step": 402708, "epoch": 4851} {"train_loss": -26.481754302978516, "global_step": 402709, "epoch": 4851} {"train_loss": -26.4090576171875, "global_step": 402710, "epoch": 4851} {"train_loss": -26.923818588256836, "global_step": 402711, "epoch": 4851} {"train_loss": -26.662567138671875, "global_step": 402712, "epoch": 4851} {"train_loss": -26.749847412109375, "global_step": 402713, "epoch": 4851} {"train_loss": -26.906644821166992, "global_step": 402714, "epoch": 4851} {"train_loss": -26.656210727002247, "global_step": 402715, "epoch": 4851, "val_loss": 6578054.0} {"train_loss": -25.345458984375, "global_step": 402716, "epoch": 4852} {"train_loss": -25.596920013427734, "global_step": 402717, "epoch": 4852} {"train_loss": -25.53898048400879, "global_step": 402718, "epoch": 4852} {"train_loss": -24.723407745361328, "global_step": 402719, "epoch": 4852} {"train_loss": -25.35496711730957, "global_step": 402720, "epoch": 4852} {"train_loss": -25.275344848632812, "global_step": 402721, "epoch": 4852} {"train_loss": -25.587677001953125, "global_step": 402722, "epoch": 4852} {"train_loss": -25.58315086364746, "global_step": 402723, "epoch": 4852} {"train_loss": -25.4775390625, "global_step": 402724, "epoch": 4852} {"train_loss": -25.135211944580078, "global_step": 402725, "epoch": 4852} {"train_loss": -26.106107711791992, "global_step": 402726, "epoch": 4852} {"train_loss": -25.620468139648438, "global_step": 402727, "epoch": 4852} {"train_loss": -25.557353973388672, "global_step": 402728, "epoch": 4852} {"train_loss": -25.53851890563965, "global_step": 402729, "epoch": 4852} {"train_loss": -25.675928115844727, "global_step": 402730, "epoch": 4852} {"train_loss": -25.760297775268555, "global_step": 402731, "epoch": 4852} {"train_loss": -25.789457321166992, "global_step": 402732, "epoch": 4852} {"train_loss": -26.06781005859375, "global_step": 402733, "epoch": 4852} {"train_loss": -25.81658935546875, "global_step": 402734, "epoch": 4852} {"train_loss": -25.983983993530273, "global_step": 402735, "epoch": 4852} {"train_loss": -25.991809844970703, "global_step": 402736, "epoch": 4852} {"train_loss": -25.931827545166016, "global_step": 402737, "epoch": 4852} {"train_loss": -26.20220375061035, "global_step": 402738, "epoch": 4852} {"train_loss": -25.89578628540039, "global_step": 402739, "epoch": 4852} {"train_loss": -26.476675033569336, "global_step": 402740, "epoch": 4852} {"train_loss": -26.447525024414062, "global_step": 402741, "epoch": 4852} {"train_loss": -26.30008316040039, "global_step": 402742, "epoch": 4852} {"train_loss": -25.689254760742188, "global_step": 402743, "epoch": 4852} {"train_loss": -26.205371856689453, "global_step": 402744, "epoch": 4852} {"train_loss": -26.22493553161621, "global_step": 402745, "epoch": 4852} {"train_loss": -26.529499053955078, "global_step": 402746, "epoch": 4852} {"train_loss": -26.262182235717773, "global_step": 402747, "epoch": 4852} {"train_loss": -26.3537540435791, "global_step": 402748, "epoch": 4852} {"train_loss": -26.3193416595459, "global_step": 402749, "epoch": 4852} {"train_loss": -26.556543350219727, "global_step": 402750, "epoch": 4852} {"train_loss": -26.540725708007812, "global_step": 402751, "epoch": 4852} {"train_loss": -26.29034996032715, "global_step": 402752, "epoch": 4852} {"train_loss": -26.72637367248535, "global_step": 402753, "epoch": 4852} {"train_loss": -26.76958656311035, "global_step": 402754, "epoch": 4852} {"train_loss": -26.251428604125977, "global_step": 402755, "epoch": 4852} {"train_loss": -26.342731475830078, "global_step": 402756, "epoch": 4852} {"train_loss": -26.284042358398438, "global_step": 402757, "epoch": 4852} {"train_loss": -26.640844345092773, "global_step": 402758, "epoch": 4852} {"train_loss": -26.86504554748535, "global_step": 402759, "epoch": 4852} {"train_loss": -26.674640655517578, "global_step": 402760, "epoch": 4852} {"train_loss": -26.578079223632812, "global_step": 402761, "epoch": 4852} {"train_loss": -26.974103927612305, "global_step": 402762, "epoch": 4852} {"train_loss": -26.52099609375, "global_step": 402763, "epoch": 4852} {"train_loss": -26.633268356323242, "global_step": 402764, "epoch": 4852} {"train_loss": -26.48653221130371, "global_step": 402765, "epoch": 4852} {"train_loss": -27.113004684448242, "global_step": 402766, "epoch": 4852} {"train_loss": -26.604780197143555, "global_step": 402767, "epoch": 4852} {"train_loss": -26.96978759765625, "global_step": 402768, "epoch": 4852} {"train_loss": -26.537199020385742, "global_step": 402769, "epoch": 4852} {"train_loss": -26.649368286132812, "global_step": 402770, "epoch": 4852} {"train_loss": -26.964624404907227, "global_step": 402771, "epoch": 4852} {"train_loss": -26.74881362915039, "global_step": 402772, "epoch": 4852} {"train_loss": -26.67694664001465, "global_step": 402773, "epoch": 4852} {"train_loss": -26.49515151977539, "global_step": 402774, "epoch": 4852} {"train_loss": -26.2004451751709, "global_step": 402775, "epoch": 4852} {"train_loss": -26.66399574279785, "global_step": 402776, "epoch": 4852} {"train_loss": -26.585891723632812, "global_step": 402777, "epoch": 4852} {"train_loss": -26.0950870513916, "global_step": 402778, "epoch": 4852} {"train_loss": -26.59918212890625, "global_step": 402779, "epoch": 4852} {"train_loss": -26.897205352783203, "global_step": 402780, "epoch": 4852} {"train_loss": -26.675378799438477, "global_step": 402781, "epoch": 4852} {"train_loss": -26.446395874023438, "global_step": 402782, "epoch": 4852} {"train_loss": -26.810338973999023, "global_step": 402783, "epoch": 4852} {"train_loss": -26.8808536529541, "global_step": 402784, "epoch": 4852} {"train_loss": -26.72332763671875, "global_step": 402785, "epoch": 4852} {"train_loss": -26.847244262695312, "global_step": 402786, "epoch": 4852} {"train_loss": -26.760644912719727, "global_step": 402787, "epoch": 4852} {"train_loss": -26.869556427001953, "global_step": 402788, "epoch": 4852} {"train_loss": -26.648160934448242, "global_step": 402789, "epoch": 4852} {"train_loss": -26.66886329650879, "global_step": 402790, "epoch": 4852} {"train_loss": -26.662078857421875, "global_step": 402791, "epoch": 4852} {"train_loss": -26.962812423706055, "global_step": 402792, "epoch": 4852} {"train_loss": -26.64580726623535, "global_step": 402793, "epoch": 4852} {"train_loss": -26.677473068237305, "global_step": 402794, "epoch": 4852} {"train_loss": -26.940082550048828, "global_step": 402795, "epoch": 4852} {"train_loss": -26.631521224975586, "global_step": 402796, "epoch": 4852} {"train_loss": -26.774694442749023, "global_step": 402797, "epoch": 4852} {"train_loss": -26.33042606675481, "global_step": 402798, "epoch": 4852, "val_loss": 6617841.0} {"train_loss": -26.490644454956055, "global_step": 402799, "epoch": 4853} {"train_loss": -26.442188262939453, "global_step": 402800, "epoch": 4853} {"train_loss": -26.552234649658203, "global_step": 402801, "epoch": 4853} {"train_loss": -26.64246940612793, "global_step": 402802, "epoch": 4853} {"train_loss": -25.912878036499023, "global_step": 402803, "epoch": 4853} {"train_loss": -26.75800132751465, "global_step": 402804, "epoch": 4853} {"train_loss": -26.500720977783203, "global_step": 402805, "epoch": 4853} {"train_loss": -26.53594398498535, "global_step": 402806, "epoch": 4853} {"train_loss": -26.51799964904785, "global_step": 402807, "epoch": 4853} {"train_loss": -26.169620513916016, "global_step": 402808, "epoch": 4853} {"train_loss": -26.469343185424805, "global_step": 402809, "epoch": 4853} {"train_loss": -26.52583885192871, "global_step": 402810, "epoch": 4853} {"train_loss": -26.7071590423584, "global_step": 402811, "epoch": 4853} {"train_loss": -26.361297607421875, "global_step": 402812, "epoch": 4853} {"train_loss": -26.5727596282959, "global_step": 402813, "epoch": 4853} {"train_loss": -26.5963077545166, "global_step": 402814, "epoch": 4853} {"train_loss": -26.285776138305664, "global_step": 402815, "epoch": 4853} {"train_loss": -26.692060470581055, "global_step": 402816, "epoch": 4853} {"train_loss": -26.475082397460938, "global_step": 402817, "epoch": 4853} {"train_loss": -26.46791648864746, "global_step": 402818, "epoch": 4853} {"train_loss": -26.68767738342285, "global_step": 402819, "epoch": 4853} {"train_loss": -26.398969650268555, "global_step": 402820, "epoch": 4853} {"train_loss": -26.758100509643555, "global_step": 402821, "epoch": 4853} {"train_loss": -26.657682418823242, "global_step": 402822, "epoch": 4853} {"train_loss": -26.73818016052246, "global_step": 402823, "epoch": 4853} {"train_loss": -27.055566787719727, "global_step": 402824, "epoch": 4853} {"train_loss": -26.50299072265625, "global_step": 402825, "epoch": 4853} {"train_loss": -26.741758346557617, "global_step": 402826, "epoch": 4853} {"train_loss": -26.885467529296875, "global_step": 402827, "epoch": 4853} {"train_loss": -26.877614974975586, "global_step": 402828, "epoch": 4853} {"train_loss": -26.79143714904785, "global_step": 402829, "epoch": 4853} {"train_loss": -26.569250106811523, "global_step": 402830, "epoch": 4853} {"train_loss": -26.85932731628418, "global_step": 402831, "epoch": 4853} {"train_loss": -26.787878036499023, "global_step": 402832, "epoch": 4853} {"train_loss": -26.439483642578125, "global_step": 402833, "epoch": 4853} {"train_loss": -26.83176040649414, "global_step": 402834, "epoch": 4853} {"train_loss": -26.759784698486328, "global_step": 402835, "epoch": 4853} {"train_loss": -27.10491371154785, "global_step": 402836, "epoch": 4853} {"train_loss": -26.682727813720703, "global_step": 402837, "epoch": 4853} {"train_loss": -26.450153350830078, "global_step": 402838, "epoch": 4853} {"train_loss": -26.1523380279541, "global_step": 402839, "epoch": 4853} {"train_loss": -26.14883804321289, "global_step": 402840, "epoch": 4853} {"train_loss": -25.75788688659668, "global_step": 402841, "epoch": 4853} {"train_loss": -24.989917755126953, "global_step": 402842, "epoch": 4853} {"train_loss": -24.578794479370117, "global_step": 402843, "epoch": 4853} {"train_loss": -26.45855140686035, "global_step": 402844, "epoch": 4853} {"train_loss": -25.510595321655273, "global_step": 402845, "epoch": 4853} {"train_loss": -26.229724884033203, "global_step": 402846, "epoch": 4853} {"train_loss": -25.803319931030273, "global_step": 402847, "epoch": 4853} {"train_loss": -26.338220596313477, "global_step": 402848, "epoch": 4853} {"train_loss": -25.769994735717773, "global_step": 402849, "epoch": 4853} {"train_loss": -26.573705673217773, "global_step": 402850, "epoch": 4853} {"train_loss": -25.913984298706055, "global_step": 402851, "epoch": 4853} {"train_loss": -26.655420303344727, "global_step": 402852, "epoch": 4853} {"train_loss": -26.291528701782227, "global_step": 402853, "epoch": 4853} {"train_loss": -26.15773582458496, "global_step": 402854, "epoch": 4853} {"train_loss": -26.16135025024414, "global_step": 402855, "epoch": 4853} {"train_loss": -26.363279342651367, "global_step": 402856, "epoch": 4853} {"train_loss": -26.342863082885742, "global_step": 402857, "epoch": 4853} {"train_loss": -26.230886459350586, "global_step": 402858, "epoch": 4853} {"train_loss": -26.201642990112305, "global_step": 402859, "epoch": 4853} {"train_loss": -26.144372940063477, "global_step": 402860, "epoch": 4853} {"train_loss": -26.070587158203125, "global_step": 402861, "epoch": 4853} {"train_loss": -26.238910675048828, "global_step": 402862, "epoch": 4853} {"train_loss": -26.406274795532227, "global_step": 402863, "epoch": 4853} {"train_loss": -26.4685001373291, "global_step": 402864, "epoch": 4853} {"train_loss": -26.426328659057617, "global_step": 402865, "epoch": 4853} {"train_loss": -26.476526260375977, "global_step": 402866, "epoch": 4853} {"train_loss": -26.348379135131836, "global_step": 402867, "epoch": 4853} {"train_loss": -26.63758659362793, "global_step": 402868, "epoch": 4853} {"train_loss": -26.518268585205078, "global_step": 402869, "epoch": 4853} {"train_loss": -26.4287166595459, "global_step": 402870, "epoch": 4853} {"train_loss": -26.39985466003418, "global_step": 402871, "epoch": 4853} {"train_loss": -26.6865177154541, "global_step": 402872, "epoch": 4853} {"train_loss": -26.66510009765625, "global_step": 402873, "epoch": 4853} {"train_loss": -26.351526260375977, "global_step": 402874, "epoch": 4853} {"train_loss": -26.55946159362793, "global_step": 402875, "epoch": 4853} {"train_loss": -26.486602783203125, "global_step": 402876, "epoch": 4853} {"train_loss": -26.938650131225586, "global_step": 402877, "epoch": 4853} {"train_loss": -26.666513442993164, "global_step": 402878, "epoch": 4853} {"train_loss": -26.436681747436523, "global_step": 402879, "epoch": 4853} {"train_loss": -26.43109703063965, "global_step": 402880, "epoch": 4853} {"train_loss": -26.440575955862023, "global_step": 402881, "epoch": 4853, "val_loss": 6707548.0} {"train_loss": -25.69622230529785, "global_step": 402882, "epoch": 4854} {"train_loss": -24.279342651367188, "global_step": 402883, "epoch": 4854} {"train_loss": -24.234304428100586, "global_step": 402884, "epoch": 4854} {"train_loss": -25.831396102905273, "global_step": 402885, "epoch": 4854} {"train_loss": -26.477813720703125, "global_step": 402886, "epoch": 4854} {"train_loss": -25.63551902770996, "global_step": 402887, "epoch": 4854} {"train_loss": -26.055713653564453, "global_step": 402888, "epoch": 4854} {"train_loss": -25.71646499633789, "global_step": 402889, "epoch": 4854} {"train_loss": -26.04823112487793, "global_step": 402890, "epoch": 4854} {"train_loss": -26.04526138305664, "global_step": 402891, "epoch": 4854} {"train_loss": -25.871076583862305, "global_step": 402892, "epoch": 4854} {"train_loss": -25.7819881439209, "global_step": 402893, "epoch": 4854} {"train_loss": -26.027057647705078, "global_step": 402894, "epoch": 4854} {"train_loss": -26.2491397857666, "global_step": 402895, "epoch": 4854} {"train_loss": -26.057363510131836, "global_step": 402896, "epoch": 4854} {"train_loss": -26.483808517456055, "global_step": 402897, "epoch": 4854} {"train_loss": -26.602819442749023, "global_step": 402898, "epoch": 4854} {"train_loss": -26.320972442626953, "global_step": 402899, "epoch": 4854} {"train_loss": -26.32952880859375, "global_step": 402900, "epoch": 4854} {"train_loss": -25.79889488220215, "global_step": 402901, "epoch": 4854} {"train_loss": -26.40052604675293, "global_step": 402902, "epoch": 4854} {"train_loss": -26.545923233032227, "global_step": 402903, "epoch": 4854} {"train_loss": -26.603424072265625, "global_step": 402904, "epoch": 4854} {"train_loss": -26.80817985534668, "global_step": 402905, "epoch": 4854} {"train_loss": -26.2310848236084, "global_step": 402906, "epoch": 4854} {"train_loss": -26.167591094970703, "global_step": 402907, "epoch": 4854} {"train_loss": -26.279571533203125, "global_step": 402908, "epoch": 4854} {"train_loss": -26.737668991088867, "global_step": 402909, "epoch": 4854} {"train_loss": -26.513513565063477, "global_step": 402910, "epoch": 4854} {"train_loss": -26.579212188720703, "global_step": 402911, "epoch": 4854} {"train_loss": -26.67450523376465, "global_step": 402912, "epoch": 4854} {"train_loss": -26.702606201171875, "global_step": 402913, "epoch": 4854} {"train_loss": -26.259183883666992, "global_step": 402914, "epoch": 4854} {"train_loss": -26.437231063842773, "global_step": 402915, "epoch": 4854} {"train_loss": -26.734973907470703, "global_step": 402916, "epoch": 4854} {"train_loss": -26.590253829956055, "global_step": 402917, "epoch": 4854} {"train_loss": -26.519811630249023, "global_step": 402918, "epoch": 4854} {"train_loss": -26.57193374633789, "global_step": 402919, "epoch": 4854} {"train_loss": -26.80630874633789, "global_step": 402920, "epoch": 4854} {"train_loss": -26.620361328125, "global_step": 402921, "epoch": 4854} {"train_loss": -26.674320220947266, "global_step": 402922, "epoch": 4854} {"train_loss": -26.589826583862305, "global_step": 402923, "epoch": 4854} {"train_loss": -26.57269859313965, "global_step": 402924, "epoch": 4854} {"train_loss": -26.394668579101562, "global_step": 402925, "epoch": 4854} {"train_loss": -26.759326934814453, "global_step": 402926, "epoch": 4854} {"train_loss": -26.478103637695312, "global_step": 402927, "epoch": 4854} {"train_loss": -26.786640167236328, "global_step": 402928, "epoch": 4854} {"train_loss": -26.723007202148438, "global_step": 402929, "epoch": 4854} {"train_loss": -27.023096084594727, "global_step": 402930, "epoch": 4854} {"train_loss": -27.1566162109375, "global_step": 402931, "epoch": 4854} {"train_loss": -26.7899169921875, "global_step": 402932, "epoch": 4854} {"train_loss": -26.68597984313965, "global_step": 402933, "epoch": 4854} {"train_loss": -26.695425033569336, "global_step": 402934, "epoch": 4854} {"train_loss": -26.75885009765625, "global_step": 402935, "epoch": 4854} {"train_loss": -26.7446231842041, "global_step": 402936, "epoch": 4854} {"train_loss": -27.235763549804688, "global_step": 402937, "epoch": 4854} {"train_loss": -27.07027244567871, "global_step": 402938, "epoch": 4854} {"train_loss": -26.798385620117188, "global_step": 402939, "epoch": 4854} {"train_loss": -26.760400772094727, "global_step": 402940, "epoch": 4854} {"train_loss": -26.93879508972168, "global_step": 402941, "epoch": 4854} {"train_loss": -26.711301803588867, "global_step": 402942, "epoch": 4854} {"train_loss": -27.18536376953125, "global_step": 402943, "epoch": 4854} {"train_loss": -27.008390426635742, "global_step": 402944, "epoch": 4854} {"train_loss": -26.575092315673828, "global_step": 402945, "epoch": 4854} {"train_loss": -26.425134658813477, "global_step": 402946, "epoch": 4854} {"train_loss": -26.16143798828125, "global_step": 402947, "epoch": 4854} {"train_loss": -26.324249267578125, "global_step": 402948, "epoch": 4854} {"train_loss": -26.6743106842041, "global_step": 402949, "epoch": 4854} {"train_loss": -26.432342529296875, "global_step": 402950, "epoch": 4854} {"train_loss": -27.21230125427246, "global_step": 402951, "epoch": 4854} {"train_loss": -26.464496612548828, "global_step": 402952, "epoch": 4854} {"train_loss": -26.754785537719727, "global_step": 402953, "epoch": 4854} {"train_loss": -26.631567001342773, "global_step": 402954, "epoch": 4854} {"train_loss": -26.3555908203125, "global_step": 402955, "epoch": 4854} {"train_loss": -26.209991455078125, "global_step": 402956, "epoch": 4854} {"train_loss": -26.797998428344727, "global_step": 402957, "epoch": 4854} {"train_loss": -26.518939971923828, "global_step": 402958, "epoch": 4854} {"train_loss": -26.553268432617188, "global_step": 402959, "epoch": 4854} {"train_loss": -26.802392959594727, "global_step": 402960, "epoch": 4854} {"train_loss": -26.4726505279541, "global_step": 402961, "epoch": 4854} {"train_loss": -26.607690811157227, "global_step": 402962, "epoch": 4854} {"train_loss": -26.13856315612793, "global_step": 402963, "epoch": 4854} {"train_loss": -26.43498616046216, "global_step": 402964, "epoch": 4854, "val_loss": 6574933.0} {"train_loss": -25.93951988220215, "global_step": 402965, "epoch": 4855} {"train_loss": -25.259016036987305, "global_step": 402966, "epoch": 4855} {"train_loss": -25.8030948638916, "global_step": 402967, "epoch": 4855} {"train_loss": -25.63042640686035, "global_step": 402968, "epoch": 4855} {"train_loss": -25.203704833984375, "global_step": 402969, "epoch": 4855} {"train_loss": -25.628637313842773, "global_step": 402970, "epoch": 4855} {"train_loss": -25.645322799682617, "global_step": 402971, "epoch": 4855} {"train_loss": -26.01723289489746, "global_step": 402972, "epoch": 4855} {"train_loss": -25.785507202148438, "global_step": 402973, "epoch": 4855} {"train_loss": -25.835142135620117, "global_step": 402974, "epoch": 4855} {"train_loss": -25.949743270874023, "global_step": 402975, "epoch": 4855} {"train_loss": -25.666784286499023, "global_step": 402976, "epoch": 4855} {"train_loss": -26.00775146484375, "global_step": 402977, "epoch": 4855} {"train_loss": -26.028818130493164, "global_step": 402978, "epoch": 4855} {"train_loss": -26.297683715820312, "global_step": 402979, "epoch": 4855} {"train_loss": -26.089136123657227, "global_step": 402980, "epoch": 4855} {"train_loss": -26.06123924255371, "global_step": 402981, "epoch": 4855} {"train_loss": -25.982620239257812, "global_step": 402982, "epoch": 4855} {"train_loss": -26.144611358642578, "global_step": 402983, "epoch": 4855} {"train_loss": -25.965986251831055, "global_step": 402984, "epoch": 4855} {"train_loss": -26.003204345703125, "global_step": 402985, "epoch": 4855} {"train_loss": -25.978302001953125, "global_step": 402986, "epoch": 4855} {"train_loss": -25.90180778503418, "global_step": 402987, "epoch": 4855} {"train_loss": -26.140609741210938, "global_step": 402988, "epoch": 4855} {"train_loss": -26.21744155883789, "global_step": 402989, "epoch": 4855} {"train_loss": -26.404205322265625, "global_step": 402990, "epoch": 4855} {"train_loss": -26.199064254760742, "global_step": 402991, "epoch": 4855} {"train_loss": -26.651416778564453, "global_step": 402992, "epoch": 4855} {"train_loss": -26.398000717163086, "global_step": 402993, "epoch": 4855} {"train_loss": -26.728912353515625, "global_step": 402994, "epoch": 4855} {"train_loss": -26.6848087310791, "global_step": 402995, "epoch": 4855} {"train_loss": -26.68134117126465, "global_step": 402996, "epoch": 4855} {"train_loss": -26.587308883666992, "global_step": 402997, "epoch": 4855} {"train_loss": -26.401168823242188, "global_step": 402998, "epoch": 4855} {"train_loss": -26.624486923217773, "global_step": 402999, "epoch": 4855} {"train_loss": -26.64237403869629, "global_step": 403000, "epoch": 4855} {"train_loss": -26.867319107055664, "global_step": 403001, "epoch": 4855} {"train_loss": -26.23699951171875, "global_step": 403002, "epoch": 4855} {"train_loss": -26.331022262573242, "global_step": 403003, "epoch": 4855} {"train_loss": -26.84408950805664, "global_step": 403004, "epoch": 4855} {"train_loss": -26.758258819580078, "global_step": 403005, "epoch": 4855} {"train_loss": -26.66690444946289, "global_step": 403006, "epoch": 4855} {"train_loss": -26.810577392578125, "global_step": 403007, "epoch": 4855} {"train_loss": -26.396377563476562, "global_step": 403008, "epoch": 4855} {"train_loss": -26.554651260375977, "global_step": 403009, "epoch": 4855} {"train_loss": -26.481658935546875, "global_step": 403010, "epoch": 4855} {"train_loss": -26.668914794921875, "global_step": 403011, "epoch": 4855} {"train_loss": -26.369312286376953, "global_step": 403012, "epoch": 4855} {"train_loss": -26.683155059814453, "global_step": 403013, "epoch": 4855} {"train_loss": -26.177698135375977, "global_step": 403014, "epoch": 4855} {"train_loss": -26.52971839904785, "global_step": 403015, "epoch": 4855} {"train_loss": -26.70244789123535, "global_step": 403016, "epoch": 4855} {"train_loss": -26.9266414642334, "global_step": 403017, "epoch": 4855} {"train_loss": -26.491392135620117, "global_step": 403018, "epoch": 4855} {"train_loss": -26.43189811706543, "global_step": 403019, "epoch": 4855} {"train_loss": -26.62255859375, "global_step": 403020, "epoch": 4855} {"train_loss": -26.862167358398438, "global_step": 403021, "epoch": 4855} {"train_loss": -26.684356689453125, "global_step": 403022, "epoch": 4855} {"train_loss": -27.337682723999023, "global_step": 403023, "epoch": 4855} {"train_loss": -26.757003784179688, "global_step": 403024, "epoch": 4855} {"train_loss": -26.924238204956055, "global_step": 403025, "epoch": 4855} {"train_loss": -26.850086212158203, "global_step": 403026, "epoch": 4855} {"train_loss": -26.793079376220703, "global_step": 403027, "epoch": 4855} {"train_loss": -26.581281661987305, "global_step": 403028, "epoch": 4855} {"train_loss": -27.0878849029541, "global_step": 403029, "epoch": 4855} {"train_loss": -27.204498291015625, "global_step": 403030, "epoch": 4855} {"train_loss": -26.790273666381836, "global_step": 403031, "epoch": 4855} {"train_loss": -27.069433212280273, "global_step": 403032, "epoch": 4855} {"train_loss": -26.78773307800293, "global_step": 403033, "epoch": 4855} {"train_loss": -26.88821792602539, "global_step": 403034, "epoch": 4855} {"train_loss": -26.672260284423828, "global_step": 403035, "epoch": 4855} {"train_loss": -26.9090633392334, "global_step": 403036, "epoch": 4855} {"train_loss": -26.514867782592773, "global_step": 403037, "epoch": 4855} {"train_loss": -27.03655433654785, "global_step": 403038, "epoch": 4855} {"train_loss": -27.23406410217285, "global_step": 403039, "epoch": 4855} {"train_loss": -26.720975875854492, "global_step": 403040, "epoch": 4855} {"train_loss": -26.649188995361328, "global_step": 403041, "epoch": 4855} {"train_loss": -26.490283966064453, "global_step": 403042, "epoch": 4855} {"train_loss": -26.40806007385254, "global_step": 403043, "epoch": 4855} {"train_loss": -26.903928756713867, "global_step": 403044, "epoch": 4855} {"train_loss": -26.22271156311035, "global_step": 403045, "epoch": 4855} {"train_loss": -26.794845581054688, "global_step": 403046, "epoch": 4855} {"train_loss": -26.43762218521302, "global_step": 403047, "epoch": 4855, "val_loss": 6780312.0} {"train_loss": -26.27003288269043, "global_step": 403048, "epoch": 4856} {"train_loss": -26.139368057250977, "global_step": 403049, "epoch": 4856} {"train_loss": -26.029022216796875, "global_step": 403050, "epoch": 4856} {"train_loss": -26.103317260742188, "global_step": 403051, "epoch": 4856} {"train_loss": -26.317459106445312, "global_step": 403052, "epoch": 4856} {"train_loss": -25.914783477783203, "global_step": 403053, "epoch": 4856} {"train_loss": -25.979700088500977, "global_step": 403054, "epoch": 4856} {"train_loss": -26.8134765625, "global_step": 403055, "epoch": 4856} {"train_loss": -26.778339385986328, "global_step": 403056, "epoch": 4856} {"train_loss": -26.637067794799805, "global_step": 403057, "epoch": 4856} {"train_loss": -26.695154190063477, "global_step": 403058, "epoch": 4856} {"train_loss": -26.747394561767578, "global_step": 403059, "epoch": 4856} {"train_loss": -26.60686683654785, "global_step": 403060, "epoch": 4856} {"train_loss": -26.558202743530273, "global_step": 403061, "epoch": 4856} {"train_loss": -27.007978439331055, "global_step": 403062, "epoch": 4856} {"train_loss": -26.381261825561523, "global_step": 403063, "epoch": 4856} {"train_loss": -27.013193130493164, "global_step": 403064, "epoch": 4856} {"train_loss": -26.522235870361328, "global_step": 403065, "epoch": 4856} {"train_loss": -26.40414810180664, "global_step": 403066, "epoch": 4856} {"train_loss": -26.582799911499023, "global_step": 403067, "epoch": 4856} {"train_loss": -26.537988662719727, "global_step": 403068, "epoch": 4856} {"train_loss": -26.821531295776367, "global_step": 403069, "epoch": 4856} {"train_loss": -27.073095321655273, "global_step": 403070, "epoch": 4856} {"train_loss": -26.557830810546875, "global_step": 403071, "epoch": 4856} {"train_loss": -26.791982650756836, "global_step": 403072, "epoch": 4856} {"train_loss": -26.8753604888916, "global_step": 403073, "epoch": 4856} {"train_loss": -26.726348876953125, "global_step": 403074, "epoch": 4856} {"train_loss": -26.716978073120117, "global_step": 403075, "epoch": 4856} {"train_loss": -26.54620933532715, "global_step": 403076, "epoch": 4856} {"train_loss": -26.557546615600586, "global_step": 403077, "epoch": 4856} {"train_loss": -26.546466827392578, "global_step": 403078, "epoch": 4856} {"train_loss": -26.812320709228516, "global_step": 403079, "epoch": 4856} {"train_loss": -27.02191734313965, "global_step": 403080, "epoch": 4856} {"train_loss": -26.40010643005371, "global_step": 403081, "epoch": 4856} {"train_loss": -26.958845138549805, "global_step": 403082, "epoch": 4856} {"train_loss": -26.61836051940918, "global_step": 403083, "epoch": 4856} {"train_loss": -26.637847900390625, "global_step": 403084, "epoch": 4856} {"train_loss": -26.87164306640625, "global_step": 403085, "epoch": 4856} {"train_loss": -26.918384552001953, "global_step": 403086, "epoch": 4856} {"train_loss": -26.4499454498291, "global_step": 403087, "epoch": 4856} {"train_loss": -26.91070556640625, "global_step": 403088, "epoch": 4856} {"train_loss": -26.75568962097168, "global_step": 403089, "epoch": 4856} {"train_loss": -26.625036239624023, "global_step": 403090, "epoch": 4856} {"train_loss": -26.91217041015625, "global_step": 403091, "epoch": 4856} {"train_loss": -26.38753318786621, "global_step": 403092, "epoch": 4856} {"train_loss": -26.359516143798828, "global_step": 403093, "epoch": 4856} {"train_loss": -26.213211059570312, "global_step": 403094, "epoch": 4856} {"train_loss": -26.286218643188477, "global_step": 403095, "epoch": 4856} {"train_loss": -26.75530433654785, "global_step": 403096, "epoch": 4856} {"train_loss": -26.0935115814209, "global_step": 403097, "epoch": 4856} {"train_loss": -26.42014503479004, "global_step": 403098, "epoch": 4856} {"train_loss": -26.8541316986084, "global_step": 403099, "epoch": 4856} {"train_loss": -26.879077911376953, "global_step": 403100, "epoch": 4856} {"train_loss": -26.39802360534668, "global_step": 403101, "epoch": 4856} {"train_loss": -26.107147216796875, "global_step": 403102, "epoch": 4856} {"train_loss": -25.99057960510254, "global_step": 403103, "epoch": 4856} {"train_loss": -26.176166534423828, "global_step": 403104, "epoch": 4856} {"train_loss": -26.43280029296875, "global_step": 403105, "epoch": 4856} {"train_loss": -26.660526275634766, "global_step": 403106, "epoch": 4856} {"train_loss": -26.59876823425293, "global_step": 403107, "epoch": 4856} {"train_loss": -26.414859771728516, "global_step": 403108, "epoch": 4856} {"train_loss": -26.93453025817871, "global_step": 403109, "epoch": 4856} {"train_loss": -26.777002334594727, "global_step": 403110, "epoch": 4856} {"train_loss": -26.610065460205078, "global_step": 403111, "epoch": 4856} {"train_loss": -26.723968505859375, "global_step": 403112, "epoch": 4856} {"train_loss": -26.887542724609375, "global_step": 403113, "epoch": 4856} {"train_loss": -26.6496639251709, "global_step": 403114, "epoch": 4856} {"train_loss": -26.387155532836914, "global_step": 403115, "epoch": 4856} {"train_loss": -26.757434844970703, "global_step": 403116, "epoch": 4856} {"train_loss": -26.5566349029541, "global_step": 403117, "epoch": 4856} {"train_loss": -26.4967041015625, "global_step": 403118, "epoch": 4856} {"train_loss": -26.858015060424805, "global_step": 403119, "epoch": 4856} {"train_loss": -27.040454864501953, "global_step": 403120, "epoch": 4856} {"train_loss": -26.813556671142578, "global_step": 403121, "epoch": 4856} {"train_loss": -26.680402755737305, "global_step": 403122, "epoch": 4856} {"train_loss": -26.621511459350586, "global_step": 403123, "epoch": 4856} {"train_loss": -26.94068717956543, "global_step": 403124, "epoch": 4856} {"train_loss": -26.54874610900879, "global_step": 403125, "epoch": 4856} {"train_loss": -26.769428253173828, "global_step": 403126, "epoch": 4856} {"train_loss": -26.65110206604004, "global_step": 403127, "epoch": 4856} {"train_loss": -26.46537208557129, "global_step": 403128, "epoch": 4856} {"train_loss": -26.7976131439209, "global_step": 403129, "epoch": 4856} {"train_loss": -26.58890324328319, "global_step": 403130, "epoch": 4856, "val_loss": 6711584.0} {"train_loss": -26.629901885986328, "global_step": 403131, "epoch": 4857} {"train_loss": -26.233503341674805, "global_step": 403132, "epoch": 4857} {"train_loss": -26.499235153198242, "global_step": 403133, "epoch": 4857} {"train_loss": -26.012928009033203, "global_step": 403134, "epoch": 4857} {"train_loss": -26.20444679260254, "global_step": 403135, "epoch": 4857} {"train_loss": -26.641027450561523, "global_step": 403136, "epoch": 4857} {"train_loss": -26.392194747924805, "global_step": 403137, "epoch": 4857} {"train_loss": -26.261676788330078, "global_step": 403138, "epoch": 4857} {"train_loss": -26.385400772094727, "global_step": 403139, "epoch": 4857} {"train_loss": -26.437442779541016, "global_step": 403140, "epoch": 4857} {"train_loss": -26.624755859375, "global_step": 403141, "epoch": 4857} {"train_loss": -26.11212730407715, "global_step": 403142, "epoch": 4857} {"train_loss": -26.752655029296875, "global_step": 403143, "epoch": 4857} {"train_loss": -26.174589157104492, "global_step": 403144, "epoch": 4857} {"train_loss": -26.181921005249023, "global_step": 403145, "epoch": 4857} {"train_loss": -26.679691314697266, "global_step": 403146, "epoch": 4857} {"train_loss": -26.435394287109375, "global_step": 403147, "epoch": 4857} {"train_loss": -26.547992706298828, "global_step": 403148, "epoch": 4857} {"train_loss": -26.524356842041016, "global_step": 403149, "epoch": 4857} {"train_loss": -26.581806182861328, "global_step": 403150, "epoch": 4857} {"train_loss": -26.693944931030273, "global_step": 403151, "epoch": 4857} {"train_loss": -26.575836181640625, "global_step": 403152, "epoch": 4857} {"train_loss": -27.078948974609375, "global_step": 403153, "epoch": 4857} {"train_loss": -26.3610782623291, "global_step": 403154, "epoch": 4857} {"train_loss": -26.49799919128418, "global_step": 403155, "epoch": 4857} {"train_loss": -26.7032413482666, "global_step": 403156, "epoch": 4857} {"train_loss": -26.85664176940918, "global_step": 403157, "epoch": 4857} {"train_loss": -26.4566593170166, "global_step": 403158, "epoch": 4857} {"train_loss": -26.705419540405273, "global_step": 403159, "epoch": 4857} {"train_loss": -26.4927978515625, "global_step": 403160, "epoch": 4857} {"train_loss": -26.852628707885742, "global_step": 403161, "epoch": 4857} {"train_loss": -26.820098876953125, "global_step": 403162, "epoch": 4857} {"train_loss": -27.026464462280273, "global_step": 403163, "epoch": 4857} {"train_loss": -26.47773551940918, "global_step": 403164, "epoch": 4857} {"train_loss": -26.497861862182617, "global_step": 403165, "epoch": 4857} {"train_loss": -26.23046875, "global_step": 403166, "epoch": 4857} {"train_loss": -26.62871742248535, "global_step": 403167, "epoch": 4857} {"train_loss": -26.847259521484375, "global_step": 403168, "epoch": 4857} {"train_loss": -26.82234001159668, "global_step": 403169, "epoch": 4857} {"train_loss": -26.913436889648438, "global_step": 403170, "epoch": 4857} {"train_loss": -26.77911949157715, "global_step": 403171, "epoch": 4857} {"train_loss": -26.8690128326416, "global_step": 403172, "epoch": 4857} {"train_loss": -26.723251342773438, "global_step": 403173, "epoch": 4857} {"train_loss": -26.317920684814453, "global_step": 403174, "epoch": 4857} {"train_loss": -26.803125381469727, "global_step": 403175, "epoch": 4857} {"train_loss": -26.56195640563965, "global_step": 403176, "epoch": 4857} {"train_loss": -26.300617218017578, "global_step": 403177, "epoch": 4857} {"train_loss": -26.765851974487305, "global_step": 403178, "epoch": 4857} {"train_loss": -26.649351119995117, "global_step": 403179, "epoch": 4857} {"train_loss": -26.817319869995117, "global_step": 403180, "epoch": 4857} {"train_loss": -26.165525436401367, "global_step": 403181, "epoch": 4857} {"train_loss": -26.32380485534668, "global_step": 403182, "epoch": 4857} {"train_loss": -26.09711265563965, "global_step": 403183, "epoch": 4857} {"train_loss": -27.012500762939453, "global_step": 403184, "epoch": 4857} {"train_loss": -26.187280654907227, "global_step": 403185, "epoch": 4857} {"train_loss": -26.523717880249023, "global_step": 403186, "epoch": 4857} {"train_loss": -26.97779655456543, "global_step": 403187, "epoch": 4857} {"train_loss": -26.954639434814453, "global_step": 403188, "epoch": 4857} {"train_loss": -26.059036254882812, "global_step": 403189, "epoch": 4857} {"train_loss": -26.722919464111328, "global_step": 403190, "epoch": 4857} {"train_loss": -26.26019287109375, "global_step": 403191, "epoch": 4857} {"train_loss": -26.95000648498535, "global_step": 403192, "epoch": 4857} {"train_loss": -26.346281051635742, "global_step": 403193, "epoch": 4857} {"train_loss": -26.6285343170166, "global_step": 403194, "epoch": 4857} {"train_loss": -26.605260848999023, "global_step": 403195, "epoch": 4857} {"train_loss": -26.69744873046875, "global_step": 403196, "epoch": 4857} {"train_loss": -26.483118057250977, "global_step": 403197, "epoch": 4857} {"train_loss": -26.834735870361328, "global_step": 403198, "epoch": 4857} {"train_loss": -26.678293228149414, "global_step": 403199, "epoch": 4857} {"train_loss": -26.58027458190918, "global_step": 403200, "epoch": 4857} {"train_loss": -26.208084106445312, "global_step": 403201, "epoch": 4857} {"train_loss": -26.382415771484375, "global_step": 403202, "epoch": 4857} {"train_loss": -26.388784408569336, "global_step": 403203, "epoch": 4857} {"train_loss": -26.548358917236328, "global_step": 403204, "epoch": 4857} {"train_loss": -26.435842514038086, "global_step": 403205, "epoch": 4857} {"train_loss": -26.78030776977539, "global_step": 403206, "epoch": 4857} {"train_loss": -26.785383224487305, "global_step": 403207, "epoch": 4857} {"train_loss": -26.926477432250977, "global_step": 403208, "epoch": 4857} {"train_loss": -26.632339477539062, "global_step": 403209, "epoch": 4857} {"train_loss": -26.680744171142578, "global_step": 403210, "epoch": 4857} {"train_loss": -26.88983154296875, "global_step": 403211, "epoch": 4857} {"train_loss": -26.6960391998291, "global_step": 403212, "epoch": 4857} {"train_loss": -26.565250833350493, "global_step": 403213, "epoch": 4857, "val_loss": 6718925.0} {"train_loss": -26.118391036987305, "global_step": 403214, "epoch": 4858} {"train_loss": -25.75031852722168, "global_step": 403215, "epoch": 4858} {"train_loss": -26.191110610961914, "global_step": 403216, "epoch": 4858} {"train_loss": -26.700727462768555, "global_step": 403217, "epoch": 4858} {"train_loss": -26.171737670898438, "global_step": 403218, "epoch": 4858} {"train_loss": -26.100183486938477, "global_step": 403219, "epoch": 4858} {"train_loss": -26.635482788085938, "global_step": 403220, "epoch": 4858} {"train_loss": -26.689102172851562, "global_step": 403221, "epoch": 4858} {"train_loss": -26.671064376831055, "global_step": 403222, "epoch": 4858} {"train_loss": -26.358295440673828, "global_step": 403223, "epoch": 4858} {"train_loss": -26.2198486328125, "global_step": 403224, "epoch": 4858} {"train_loss": -26.62433433532715, "global_step": 403225, "epoch": 4858} {"train_loss": -26.386215209960938, "global_step": 403226, "epoch": 4858} {"train_loss": -26.167333602905273, "global_step": 403227, "epoch": 4858} {"train_loss": -26.474103927612305, "global_step": 403228, "epoch": 4858} {"train_loss": -26.306171417236328, "global_step": 403229, "epoch": 4858} {"train_loss": -26.68086814880371, "global_step": 403230, "epoch": 4858} {"train_loss": -26.364166259765625, "global_step": 403231, "epoch": 4858} {"train_loss": -26.641620635986328, "global_step": 403232, "epoch": 4858} {"train_loss": -26.202112197875977, "global_step": 403233, "epoch": 4858} {"train_loss": -26.41887855529785, "global_step": 403234, "epoch": 4858} {"train_loss": -26.535757064819336, "global_step": 403235, "epoch": 4858} {"train_loss": -26.840351104736328, "global_step": 403236, "epoch": 4858} {"train_loss": -26.152618408203125, "global_step": 403237, "epoch": 4858} {"train_loss": -26.738000869750977, "global_step": 403238, "epoch": 4858} {"train_loss": -26.44569969177246, "global_step": 403239, "epoch": 4858} {"train_loss": -26.87369728088379, "global_step": 403240, "epoch": 4858} {"train_loss": -26.897308349609375, "global_step": 403241, "epoch": 4858} {"train_loss": -26.165761947631836, "global_step": 403242, "epoch": 4858} {"train_loss": -26.800647735595703, "global_step": 403243, "epoch": 4858} {"train_loss": -26.534765243530273, "global_step": 403244, "epoch": 4858} {"train_loss": -26.504013061523438, "global_step": 403245, "epoch": 4858} {"train_loss": -26.41547203063965, "global_step": 403246, "epoch": 4858} {"train_loss": -26.913381576538086, "global_step": 403247, "epoch": 4858} {"train_loss": -26.282073974609375, "global_step": 403248, "epoch": 4858} {"train_loss": -26.54151725769043, "global_step": 403249, "epoch": 4858} {"train_loss": -26.41663932800293, "global_step": 403250, "epoch": 4858} {"train_loss": -26.6005859375, "global_step": 403251, "epoch": 4858} {"train_loss": -27.0352725982666, "global_step": 403252, "epoch": 4858} {"train_loss": -26.618743896484375, "global_step": 403253, "epoch": 4858} {"train_loss": -26.42363929748535, "global_step": 403254, "epoch": 4858} {"train_loss": -26.9782772064209, "global_step": 403255, "epoch": 4858} {"train_loss": -26.981555938720703, "global_step": 403256, "epoch": 4858} {"train_loss": -26.8239688873291, "global_step": 403257, "epoch": 4858} {"train_loss": -26.81463623046875, "global_step": 403258, "epoch": 4858} {"train_loss": -26.895355224609375, "global_step": 403259, "epoch": 4858} {"train_loss": -26.892499923706055, "global_step": 403260, "epoch": 4858} {"train_loss": -27.025720596313477, "global_step": 403261, "epoch": 4858} {"train_loss": -26.937524795532227, "global_step": 403262, "epoch": 4858} {"train_loss": -26.8586483001709, "global_step": 403263, "epoch": 4858} {"train_loss": -26.6766300201416, "global_step": 403264, "epoch": 4858} {"train_loss": -26.804243087768555, "global_step": 403265, "epoch": 4858} {"train_loss": -26.30293083190918, "global_step": 403266, "epoch": 4858} {"train_loss": -26.640380859375, "global_step": 403267, "epoch": 4858} {"train_loss": -26.836088180541992, "global_step": 403268, "epoch": 4858} {"train_loss": -26.947843551635742, "global_step": 403269, "epoch": 4858} {"train_loss": -26.782989501953125, "global_step": 403270, "epoch": 4858} {"train_loss": -26.691984176635742, "global_step": 403271, "epoch": 4858} {"train_loss": -26.78285026550293, "global_step": 403272, "epoch": 4858} {"train_loss": -26.76007652282715, "global_step": 403273, "epoch": 4858} {"train_loss": -26.720685958862305, "global_step": 403274, "epoch": 4858} {"train_loss": -27.192914962768555, "global_step": 403275, "epoch": 4858} {"train_loss": -26.908109664916992, "global_step": 403276, "epoch": 4858} {"train_loss": -26.52494239807129, "global_step": 403277, "epoch": 4858} {"train_loss": -27.026290893554688, "global_step": 403278, "epoch": 4858} {"train_loss": -26.727294921875, "global_step": 403279, "epoch": 4858} {"train_loss": -27.070648193359375, "global_step": 403280, "epoch": 4858} {"train_loss": -26.9439697265625, "global_step": 403281, "epoch": 4858} {"train_loss": -26.637948989868164, "global_step": 403282, "epoch": 4858} {"train_loss": -26.604461669921875, "global_step": 403283, "epoch": 4858} {"train_loss": -26.979827880859375, "global_step": 403284, "epoch": 4858} {"train_loss": -26.99374771118164, "global_step": 403285, "epoch": 4858} {"train_loss": -26.455764770507812, "global_step": 403286, "epoch": 4858} {"train_loss": -26.397781372070312, "global_step": 403287, "epoch": 4858} {"train_loss": -26.5441837310791, "global_step": 403288, "epoch": 4858} {"train_loss": -26.086807250976562, "global_step": 403289, "epoch": 4858} {"train_loss": -26.526355743408203, "global_step": 403290, "epoch": 4858} {"train_loss": -26.335803985595703, "global_step": 403291, "epoch": 4858} {"train_loss": -26.0347900390625, "global_step": 403292, "epoch": 4858} {"train_loss": -26.65582275390625, "global_step": 403293, "epoch": 4858} {"train_loss": -26.555713653564453, "global_step": 403294, "epoch": 4858} {"train_loss": -26.27821922302246, "global_step": 403295, "epoch": 4858} {"train_loss": -26.603940044540956, "global_step": 403296, "epoch": 4858, "val_loss": 6641173.0} {"train_loss": -24.917377471923828, "global_step": 403297, "epoch": 4859} {"train_loss": -23.9617919921875, "global_step": 403298, "epoch": 4859} {"train_loss": -25.230649948120117, "global_step": 403299, "epoch": 4859} {"train_loss": -25.425479888916016, "global_step": 403300, "epoch": 4859} {"train_loss": -25.01908302307129, "global_step": 403301, "epoch": 4859} {"train_loss": -25.591096878051758, "global_step": 403302, "epoch": 4859} {"train_loss": -25.38201332092285, "global_step": 403303, "epoch": 4859} {"train_loss": -25.603683471679688, "global_step": 403304, "epoch": 4859} {"train_loss": -25.7158203125, "global_step": 403305, "epoch": 4859} {"train_loss": -25.37886619567871, "global_step": 403306, "epoch": 4859} {"train_loss": -25.75372314453125, "global_step": 403307, "epoch": 4859} {"train_loss": -25.97833824157715, "global_step": 403308, "epoch": 4859} {"train_loss": -25.650373458862305, "global_step": 403309, "epoch": 4859} {"train_loss": -26.0960693359375, "global_step": 403310, "epoch": 4859} {"train_loss": -25.712594985961914, "global_step": 403311, "epoch": 4859} {"train_loss": -26.01093864440918, "global_step": 403312, "epoch": 4859} {"train_loss": -26.326623916625977, "global_step": 403313, "epoch": 4859} {"train_loss": -25.855411529541016, "global_step": 403314, "epoch": 4859} {"train_loss": -25.982391357421875, "global_step": 403315, "epoch": 4859} {"train_loss": -26.686920166015625, "global_step": 403316, "epoch": 4859} {"train_loss": -26.155588150024414, "global_step": 403317, "epoch": 4859} {"train_loss": -26.012954711914062, "global_step": 403318, "epoch": 4859} {"train_loss": -26.19170570373535, "global_step": 403319, "epoch": 4859} {"train_loss": -25.988636016845703, "global_step": 403320, "epoch": 4859} {"train_loss": -25.751239776611328, "global_step": 403321, "epoch": 4859} {"train_loss": -26.01059341430664, "global_step": 403322, "epoch": 4859} {"train_loss": -26.083393096923828, "global_step": 403323, "epoch": 4859} {"train_loss": -26.246362686157227, "global_step": 403324, "epoch": 4859} {"train_loss": -26.405059814453125, "global_step": 403325, "epoch": 4859} {"train_loss": -26.4478759765625, "global_step": 403326, "epoch": 4859} {"train_loss": -26.41566276550293, "global_step": 403327, "epoch": 4859} {"train_loss": -26.304412841796875, "global_step": 403328, "epoch": 4859} {"train_loss": -26.4958553314209, "global_step": 403329, "epoch": 4859} {"train_loss": -26.393844604492188, "global_step": 403330, "epoch": 4859} {"train_loss": -26.3802547454834, "global_step": 403331, "epoch": 4859} {"train_loss": -26.7316837310791, "global_step": 403332, "epoch": 4859} {"train_loss": -26.240652084350586, "global_step": 403333, "epoch": 4859} {"train_loss": -26.438690185546875, "global_step": 403334, "epoch": 4859} {"train_loss": -26.47357177734375, "global_step": 403335, "epoch": 4859} {"train_loss": -26.9440860748291, "global_step": 403336, "epoch": 4859} {"train_loss": -26.3034725189209, "global_step": 403337, "epoch": 4859} {"train_loss": -26.42848014831543, "global_step": 403338, "epoch": 4859} {"train_loss": -26.53266716003418, "global_step": 403339, "epoch": 4859} {"train_loss": -26.58356285095215, "global_step": 403340, "epoch": 4859} {"train_loss": -26.83985710144043, "global_step": 403341, "epoch": 4859} {"train_loss": -26.66815185546875, "global_step": 403342, "epoch": 4859} {"train_loss": -26.834997177124023, "global_step": 403343, "epoch": 4859} {"train_loss": -26.648941040039062, "global_step": 403344, "epoch": 4859} {"train_loss": -26.67156982421875, "global_step": 403345, "epoch": 4859} {"train_loss": -26.69968605041504, "global_step": 403346, "epoch": 4859} {"train_loss": -26.925512313842773, "global_step": 403347, "epoch": 4859} {"train_loss": -26.9661922454834, "global_step": 403348, "epoch": 4859} {"train_loss": -26.463953018188477, "global_step": 403349, "epoch": 4859} {"train_loss": -26.510284423828125, "global_step": 403350, "epoch": 4859} {"train_loss": -26.51934814453125, "global_step": 403351, "epoch": 4859} {"train_loss": -26.782032012939453, "global_step": 403352, "epoch": 4859} {"train_loss": -26.550519943237305, "global_step": 403353, "epoch": 4859} {"train_loss": -26.586896896362305, "global_step": 403354, "epoch": 4859} {"train_loss": -27.100238800048828, "global_step": 403355, "epoch": 4859} {"train_loss": -26.669208526611328, "global_step": 403356, "epoch": 4859} {"train_loss": -26.53162956237793, "global_step": 403357, "epoch": 4859} {"train_loss": -26.2249813079834, "global_step": 403358, "epoch": 4859} {"train_loss": -26.424779891967773, "global_step": 403359, "epoch": 4859} {"train_loss": -26.818862915039062, "global_step": 403360, "epoch": 4859} {"train_loss": -26.754865646362305, "global_step": 403361, "epoch": 4859} {"train_loss": -26.46953773498535, "global_step": 403362, "epoch": 4859} {"train_loss": -26.446332931518555, "global_step": 403363, "epoch": 4859} {"train_loss": -26.776620864868164, "global_step": 403364, "epoch": 4859} {"train_loss": -26.651891708374023, "global_step": 403365, "epoch": 4859} {"train_loss": -26.347021102905273, "global_step": 403366, "epoch": 4859} {"train_loss": -26.7691707611084, "global_step": 403367, "epoch": 4859} {"train_loss": -26.81886100769043, "global_step": 403368, "epoch": 4859} {"train_loss": -26.809232711791992, "global_step": 403369, "epoch": 4859} {"train_loss": -26.389759063720703, "global_step": 403370, "epoch": 4859} {"train_loss": -26.26166343688965, "global_step": 403371, "epoch": 4859} {"train_loss": -26.60650634765625, "global_step": 403372, "epoch": 4859} {"train_loss": -26.952733993530273, "global_step": 403373, "epoch": 4859} {"train_loss": -26.847919464111328, "global_step": 403374, "epoch": 4859} {"train_loss": -26.58002281188965, "global_step": 403375, "epoch": 4859} {"train_loss": -26.423688888549805, "global_step": 403376, "epoch": 4859} {"train_loss": -26.334814071655273, "global_step": 403377, "epoch": 4859} {"train_loss": -26.287805557250977, "global_step": 403378, "epoch": 4859} {"train_loss": -26.309813005378448, "global_step": 403379, "epoch": 4859, "val_loss": 6717383.0} {"train_loss": -25.9318904876709, "global_step": 403380, "epoch": 4860} {"train_loss": -26.147293090820312, "global_step": 403381, "epoch": 4860} {"train_loss": -26.1716365814209, "global_step": 403382, "epoch": 4860} {"train_loss": -26.063547134399414, "global_step": 403383, "epoch": 4860} {"train_loss": -26.386571884155273, "global_step": 403384, "epoch": 4860} {"train_loss": -26.09600830078125, "global_step": 403385, "epoch": 4860} {"train_loss": -26.549606323242188, "global_step": 403386, "epoch": 4860} {"train_loss": -26.064441680908203, "global_step": 403387, "epoch": 4860} {"train_loss": -26.474721908569336, "global_step": 403388, "epoch": 4860} {"train_loss": -26.169952392578125, "global_step": 403389, "epoch": 4860} {"train_loss": -26.314611434936523, "global_step": 403390, "epoch": 4860} {"train_loss": -26.06537437438965, "global_step": 403391, "epoch": 4860} {"train_loss": -26.68995475769043, "global_step": 403392, "epoch": 4860} {"train_loss": -26.34002113342285, "global_step": 403393, "epoch": 4860} {"train_loss": -26.301471710205078, "global_step": 403394, "epoch": 4860} {"train_loss": -26.62161636352539, "global_step": 403395, "epoch": 4860} {"train_loss": -26.820362091064453, "global_step": 403396, "epoch": 4860} {"train_loss": -26.527179718017578, "global_step": 403397, "epoch": 4860} {"train_loss": -26.514301300048828, "global_step": 403398, "epoch": 4860} {"train_loss": -26.370269775390625, "global_step": 403399, "epoch": 4860} {"train_loss": -26.384008407592773, "global_step": 403400, "epoch": 4860} {"train_loss": -26.27390480041504, "global_step": 403401, "epoch": 4860} {"train_loss": -26.444875717163086, "global_step": 403402, "epoch": 4860} {"train_loss": -26.398956298828125, "global_step": 403403, "epoch": 4860} {"train_loss": -26.579248428344727, "global_step": 403404, "epoch": 4860} {"train_loss": -26.9902400970459, "global_step": 403405, "epoch": 4860} {"train_loss": -26.899656295776367, "global_step": 403406, "epoch": 4860} {"train_loss": -26.96449089050293, "global_step": 403407, "epoch": 4860} {"train_loss": -26.678205490112305, "global_step": 403408, "epoch": 4860} {"train_loss": -26.8601131439209, "global_step": 403409, "epoch": 4860} {"train_loss": -26.468231201171875, "global_step": 403410, "epoch": 4860} {"train_loss": -26.77259635925293, "global_step": 403411, "epoch": 4860} {"train_loss": -26.742279052734375, "global_step": 403412, "epoch": 4860} {"train_loss": -26.76722526550293, "global_step": 403413, "epoch": 4860} {"train_loss": -26.571863174438477, "global_step": 403414, "epoch": 4860} {"train_loss": -26.867124557495117, "global_step": 403415, "epoch": 4860} {"train_loss": -26.751209259033203, "global_step": 403416, "epoch": 4860} {"train_loss": -26.915414810180664, "global_step": 403417, "epoch": 4860} {"train_loss": -26.815113067626953, "global_step": 403418, "epoch": 4860} {"train_loss": -26.470014572143555, "global_step": 403419, "epoch": 4860} {"train_loss": -26.59915542602539, "global_step": 403420, "epoch": 4860} {"train_loss": -26.932300567626953, "global_step": 403421, "epoch": 4860} {"train_loss": -26.857379913330078, "global_step": 403422, "epoch": 4860} {"train_loss": -26.76175880432129, "global_step": 403423, "epoch": 4860} {"train_loss": -26.7310848236084, "global_step": 403424, "epoch": 4860} {"train_loss": -26.694202423095703, "global_step": 403425, "epoch": 4860} {"train_loss": -26.855627059936523, "global_step": 403426, "epoch": 4860} {"train_loss": -26.740131378173828, "global_step": 403427, "epoch": 4860} {"train_loss": -26.56670570373535, "global_step": 403428, "epoch": 4860} {"train_loss": -26.747283935546875, "global_step": 403429, "epoch": 4860} {"train_loss": -27.048095703125, "global_step": 403430, "epoch": 4860} {"train_loss": -26.87038230895996, "global_step": 403431, "epoch": 4860} {"train_loss": -26.61773681640625, "global_step": 403432, "epoch": 4860} {"train_loss": -26.57373046875, "global_step": 403433, "epoch": 4860} {"train_loss": -26.17889976501465, "global_step": 403434, "epoch": 4860} {"train_loss": -26.139204025268555, "global_step": 403435, "epoch": 4860} {"train_loss": -26.496280670166016, "global_step": 403436, "epoch": 4860} {"train_loss": -26.82087516784668, "global_step": 403437, "epoch": 4860} {"train_loss": -26.057416915893555, "global_step": 403438, "epoch": 4860} {"train_loss": -26.25506019592285, "global_step": 403439, "epoch": 4860} {"train_loss": -26.91741943359375, "global_step": 403440, "epoch": 4860} {"train_loss": -26.41656494140625, "global_step": 403441, "epoch": 4860} {"train_loss": -26.485580444335938, "global_step": 403442, "epoch": 4860} {"train_loss": -26.418134689331055, "global_step": 403443, "epoch": 4860} {"train_loss": -26.625391006469727, "global_step": 403444, "epoch": 4860} {"train_loss": -26.72791862487793, "global_step": 403445, "epoch": 4860} {"train_loss": -26.86224365234375, "global_step": 403446, "epoch": 4860} {"train_loss": -26.45745849609375, "global_step": 403447, "epoch": 4860} {"train_loss": -26.673826217651367, "global_step": 403448, "epoch": 4860} {"train_loss": -26.78327751159668, "global_step": 403449, "epoch": 4860} {"train_loss": -26.49738883972168, "global_step": 403450, "epoch": 4860} {"train_loss": -26.701242446899414, "global_step": 403451, "epoch": 4860} {"train_loss": -26.669469833374023, "global_step": 403452, "epoch": 4860} {"train_loss": -26.652563095092773, "global_step": 403453, "epoch": 4860} {"train_loss": -26.777456283569336, "global_step": 403454, "epoch": 4860} {"train_loss": -26.56732177734375, "global_step": 403455, "epoch": 4860} {"train_loss": -26.844684600830078, "global_step": 403456, "epoch": 4860} {"train_loss": -26.73638343811035, "global_step": 403457, "epoch": 4860} {"train_loss": -27.141355514526367, "global_step": 403458, "epoch": 4860} {"train_loss": -26.735931396484375, "global_step": 403459, "epoch": 4860} {"train_loss": -26.582128524780273, "global_step": 403460, "epoch": 4860} {"train_loss": -26.45106315612793, "global_step": 403461, "epoch": 4860} {"train_loss": -26.572354443101997, "global_step": 403462, "epoch": 4860, "val_loss": 6721461.0} {"train_loss": -25.707275390625, "global_step": 403463, "epoch": 4861} {"train_loss": -25.723968505859375, "global_step": 403464, "epoch": 4861} {"train_loss": -25.929519653320312, "global_step": 403465, "epoch": 4861} {"train_loss": -25.419322967529297, "global_step": 403466, "epoch": 4861} {"train_loss": -26.580642700195312, "global_step": 403467, "epoch": 4861} {"train_loss": -25.465662002563477, "global_step": 403468, "epoch": 4861} {"train_loss": -26.421274185180664, "global_step": 403469, "epoch": 4861} {"train_loss": -25.85686683654785, "global_step": 403470, "epoch": 4861} {"train_loss": -26.32773208618164, "global_step": 403471, "epoch": 4861} {"train_loss": -25.526121139526367, "global_step": 403472, "epoch": 4861} {"train_loss": -26.015186309814453, "global_step": 403473, "epoch": 4861} {"train_loss": -25.86884117126465, "global_step": 403474, "epoch": 4861} {"train_loss": -25.7096004486084, "global_step": 403475, "epoch": 4861} {"train_loss": -25.983144760131836, "global_step": 403476, "epoch": 4861} {"train_loss": -25.656564712524414, "global_step": 403477, "epoch": 4861} {"train_loss": -26.31671714782715, "global_step": 403478, "epoch": 4861} {"train_loss": -25.992273330688477, "global_step": 403479, "epoch": 4861} {"train_loss": -25.931934356689453, "global_step": 403480, "epoch": 4861} {"train_loss": -26.336578369140625, "global_step": 403481, "epoch": 4861} {"train_loss": -26.324750900268555, "global_step": 403482, "epoch": 4861} {"train_loss": -26.424001693725586, "global_step": 403483, "epoch": 4861} {"train_loss": -26.346698760986328, "global_step": 403484, "epoch": 4861} {"train_loss": -26.551589965820312, "global_step": 403485, "epoch": 4861} {"train_loss": -26.151641845703125, "global_step": 403486, "epoch": 4861} {"train_loss": -26.530780792236328, "global_step": 403487, "epoch": 4861} {"train_loss": -26.60968017578125, "global_step": 403488, "epoch": 4861} {"train_loss": -26.781482696533203, "global_step": 403489, "epoch": 4861} {"train_loss": -26.603500366210938, "global_step": 403490, "epoch": 4861} {"train_loss": -26.80755043029785, "global_step": 403491, "epoch": 4861} {"train_loss": -26.522064208984375, "global_step": 403492, "epoch": 4861} {"train_loss": -26.478275299072266, "global_step": 403493, "epoch": 4861} {"train_loss": -26.755258560180664, "global_step": 403494, "epoch": 4861} {"train_loss": -26.552154541015625, "global_step": 403495, "epoch": 4861} {"train_loss": -26.61567497253418, "global_step": 403496, "epoch": 4861} {"train_loss": -26.83871841430664, "global_step": 403497, "epoch": 4861} {"train_loss": -26.724079132080078, "global_step": 403498, "epoch": 4861} {"train_loss": -26.96162223815918, "global_step": 403499, "epoch": 4861} {"train_loss": -26.898284912109375, "global_step": 403500, "epoch": 4861} {"train_loss": -26.679025650024414, "global_step": 403501, "epoch": 4861} {"train_loss": -26.253509521484375, "global_step": 403502, "epoch": 4861} {"train_loss": -26.783828735351562, "global_step": 403503, "epoch": 4861} {"train_loss": -26.870420455932617, "global_step": 403504, "epoch": 4861} {"train_loss": -26.851959228515625, "global_step": 403505, "epoch": 4861} {"train_loss": -26.72959327697754, "global_step": 403506, "epoch": 4861} {"train_loss": -26.598962783813477, "global_step": 403507, "epoch": 4861} {"train_loss": -26.347030639648438, "global_step": 403508, "epoch": 4861} {"train_loss": -26.41987419128418, "global_step": 403509, "epoch": 4861} {"train_loss": -26.751672744750977, "global_step": 403510, "epoch": 4861} {"train_loss": -26.677579879760742, "global_step": 403511, "epoch": 4861} {"train_loss": -26.778778076171875, "global_step": 403512, "epoch": 4861} {"train_loss": -26.797754287719727, "global_step": 403513, "epoch": 4861} {"train_loss": -26.859708786010742, "global_step": 403514, "epoch": 4861} {"train_loss": -26.771747589111328, "global_step": 403515, "epoch": 4861} {"train_loss": -26.743335723876953, "global_step": 403516, "epoch": 4861} {"train_loss": -26.738006591796875, "global_step": 403517, "epoch": 4861} {"train_loss": -26.43683433532715, "global_step": 403518, "epoch": 4861} {"train_loss": -26.57700538635254, "global_step": 403519, "epoch": 4861} {"train_loss": -27.31769371032715, "global_step": 403520, "epoch": 4861} {"train_loss": -27.108722686767578, "global_step": 403521, "epoch": 4861} {"train_loss": -26.72246742248535, "global_step": 403522, "epoch": 4861} {"train_loss": -26.969650268554688, "global_step": 403523, "epoch": 4861} {"train_loss": -26.582019805908203, "global_step": 403524, "epoch": 4861} {"train_loss": -26.46651268005371, "global_step": 403525, "epoch": 4861} {"train_loss": -26.615964889526367, "global_step": 403526, "epoch": 4861} {"train_loss": -26.422367095947266, "global_step": 403527, "epoch": 4861} {"train_loss": -26.937641143798828, "global_step": 403528, "epoch": 4861} {"train_loss": -26.855493545532227, "global_step": 403529, "epoch": 4861} {"train_loss": -27.08793067932129, "global_step": 403530, "epoch": 4861} {"train_loss": -26.539688110351562, "global_step": 403531, "epoch": 4861} {"train_loss": -26.7894229888916, "global_step": 403532, "epoch": 4861} {"train_loss": -26.77980613708496, "global_step": 403533, "epoch": 4861} {"train_loss": -26.7265567779541, "global_step": 403534, "epoch": 4861} {"train_loss": -26.7854061126709, "global_step": 403535, "epoch": 4861} {"train_loss": -26.82733726501465, "global_step": 403536, "epoch": 4861} {"train_loss": -27.00127601623535, "global_step": 403537, "epoch": 4861} {"train_loss": -26.74267578125, "global_step": 403538, "epoch": 4861} {"train_loss": -27.198047637939453, "global_step": 403539, "epoch": 4861} {"train_loss": -26.34791374206543, "global_step": 403540, "epoch": 4861} {"train_loss": -26.599225997924805, "global_step": 403541, "epoch": 4861} {"train_loss": -26.23023796081543, "global_step": 403542, "epoch": 4861} {"train_loss": -26.33552360534668, "global_step": 403543, "epoch": 4861} {"train_loss": -25.894052505493164, "global_step": 403544, "epoch": 4861} {"train_loss": -26.48878763957196, "global_step": 403545, "epoch": 4861, "val_loss": 6760527.0} {"train_loss": -24.581308364868164, "global_step": 403546, "epoch": 4862} {"train_loss": -24.84528923034668, "global_step": 403547, "epoch": 4862} {"train_loss": -25.670063018798828, "global_step": 403548, "epoch": 4862} {"train_loss": -24.963815689086914, "global_step": 403549, "epoch": 4862} {"train_loss": -26.292463302612305, "global_step": 403550, "epoch": 4862} {"train_loss": -25.37708854675293, "global_step": 403551, "epoch": 4862} {"train_loss": -26.13599967956543, "global_step": 403552, "epoch": 4862} {"train_loss": -25.720020294189453, "global_step": 403553, "epoch": 4862} {"train_loss": -25.974735260009766, "global_step": 403554, "epoch": 4862} {"train_loss": -25.801855087280273, "global_step": 403555, "epoch": 4862} {"train_loss": -26.328149795532227, "global_step": 403556, "epoch": 4862} {"train_loss": -25.944477081298828, "global_step": 403557, "epoch": 4862} {"train_loss": -26.213621139526367, "global_step": 403558, "epoch": 4862} {"train_loss": -26.271839141845703, "global_step": 403559, "epoch": 4862} {"train_loss": -26.579999923706055, "global_step": 403560, "epoch": 4862} {"train_loss": -26.030384063720703, "global_step": 403561, "epoch": 4862} {"train_loss": -26.50089454650879, "global_step": 403562, "epoch": 4862} {"train_loss": -26.234455108642578, "global_step": 403563, "epoch": 4862} {"train_loss": -26.163288116455078, "global_step": 403564, "epoch": 4862} {"train_loss": -26.293567657470703, "global_step": 403565, "epoch": 4862} {"train_loss": -26.379560470581055, "global_step": 403566, "epoch": 4862} {"train_loss": -26.26399040222168, "global_step": 403567, "epoch": 4862} {"train_loss": -26.4128475189209, "global_step": 403568, "epoch": 4862} {"train_loss": -26.4339542388916, "global_step": 403569, "epoch": 4862} {"train_loss": -26.73748207092285, "global_step": 403570, "epoch": 4862} {"train_loss": -26.49964714050293, "global_step": 403571, "epoch": 4862} {"train_loss": -26.74393081665039, "global_step": 403572, "epoch": 4862} {"train_loss": -26.553070068359375, "global_step": 403573, "epoch": 4862} {"train_loss": -26.557966232299805, "global_step": 403574, "epoch": 4862} {"train_loss": -26.586408615112305, "global_step": 403575, "epoch": 4862} {"train_loss": -26.802722930908203, "global_step": 403576, "epoch": 4862} {"train_loss": -26.447940826416016, "global_step": 403577, "epoch": 4862} {"train_loss": -26.607099533081055, "global_step": 403578, "epoch": 4862} {"train_loss": -26.74403190612793, "global_step": 403579, "epoch": 4862} {"train_loss": -26.681936264038086, "global_step": 403580, "epoch": 4862} {"train_loss": -26.843551635742188, "global_step": 403581, "epoch": 4862} {"train_loss": -26.40338134765625, "global_step": 403582, "epoch": 4862} {"train_loss": -26.647573471069336, "global_step": 403583, "epoch": 4862} {"train_loss": -26.722517013549805, "global_step": 403584, "epoch": 4862} {"train_loss": -26.958234786987305, "global_step": 403585, "epoch": 4862} {"train_loss": -26.76250648498535, "global_step": 403586, "epoch": 4862} {"train_loss": -26.655689239501953, "global_step": 403587, "epoch": 4862} {"train_loss": -26.691741943359375, "global_step": 403588, "epoch": 4862} {"train_loss": -26.9964542388916, "global_step": 403589, "epoch": 4862} {"train_loss": -26.861988067626953, "global_step": 403590, "epoch": 4862} {"train_loss": -26.740583419799805, "global_step": 403591, "epoch": 4862} {"train_loss": -26.677587509155273, "global_step": 403592, "epoch": 4862} {"train_loss": -26.83901023864746, "global_step": 403593, "epoch": 4862} {"train_loss": -26.843494415283203, "global_step": 403594, "epoch": 4862} {"train_loss": -26.57257652282715, "global_step": 403595, "epoch": 4862} {"train_loss": -26.674041748046875, "global_step": 403596, "epoch": 4862} {"train_loss": -26.833356857299805, "global_step": 403597, "epoch": 4862} {"train_loss": -26.964935302734375, "global_step": 403598, "epoch": 4862} {"train_loss": -26.83194923400879, "global_step": 403599, "epoch": 4862} {"train_loss": -26.93915367126465, "global_step": 403600, "epoch": 4862} {"train_loss": -26.516347885131836, "global_step": 403601, "epoch": 4862} {"train_loss": -26.696516036987305, "global_step": 403602, "epoch": 4862} {"train_loss": -26.813940048217773, "global_step": 403603, "epoch": 4862} {"train_loss": -27.06292724609375, "global_step": 403604, "epoch": 4862} {"train_loss": -27.032855987548828, "global_step": 403605, "epoch": 4862} {"train_loss": -26.8765811920166, "global_step": 403606, "epoch": 4862} {"train_loss": -26.854965209960938, "global_step": 403607, "epoch": 4862} {"train_loss": -26.497304916381836, "global_step": 403608, "epoch": 4862} {"train_loss": -26.635278701782227, "global_step": 403609, "epoch": 4862} {"train_loss": -26.029621124267578, "global_step": 403610, "epoch": 4862} {"train_loss": -26.35699462890625, "global_step": 403611, "epoch": 4862} {"train_loss": -26.65231704711914, "global_step": 403612, "epoch": 4862} {"train_loss": -26.80267906188965, "global_step": 403613, "epoch": 4862} {"train_loss": -26.716772079467773, "global_step": 403614, "epoch": 4862} {"train_loss": -26.653940200805664, "global_step": 403615, "epoch": 4862} {"train_loss": -26.632404327392578, "global_step": 403616, "epoch": 4862} {"train_loss": -26.645444869995117, "global_step": 403617, "epoch": 4862} {"train_loss": -26.77473258972168, "global_step": 403618, "epoch": 4862} {"train_loss": -26.9647159576416, "global_step": 403619, "epoch": 4862} {"train_loss": -26.67205810546875, "global_step": 403620, "epoch": 4862} {"train_loss": -26.811384201049805, "global_step": 403621, "epoch": 4862} {"train_loss": -26.775272369384766, "global_step": 403622, "epoch": 4862} {"train_loss": -26.737165451049805, "global_step": 403623, "epoch": 4862} {"train_loss": -26.782669067382812, "global_step": 403624, "epoch": 4862} {"train_loss": -26.696069717407227, "global_step": 403625, "epoch": 4862} {"train_loss": -26.431806564331055, "global_step": 403626, "epoch": 4862} {"train_loss": -26.619550704956055, "global_step": 403627, "epoch": 4862} {"train_loss": -26.491799389023377, "global_step": 403628, "epoch": 4862, "val_loss": 6694576.0} {"train_loss": -25.295988082885742, "global_step": 403629, "epoch": 4863} {"train_loss": -25.99783706665039, "global_step": 403630, "epoch": 4863} {"train_loss": -26.502460479736328, "global_step": 403631, "epoch": 4863} {"train_loss": -25.67917251586914, "global_step": 403632, "epoch": 4863} {"train_loss": -26.09370231628418, "global_step": 403633, "epoch": 4863} {"train_loss": -26.630950927734375, "global_step": 403634, "epoch": 4863} {"train_loss": -26.0736141204834, "global_step": 403635, "epoch": 4863} {"train_loss": -26.18329429626465, "global_step": 403636, "epoch": 4863} {"train_loss": -26.47877311706543, "global_step": 403637, "epoch": 4863} {"train_loss": -26.258466720581055, "global_step": 403638, "epoch": 4863} {"train_loss": -26.47654151916504, "global_step": 403639, "epoch": 4863} {"train_loss": -26.418359756469727, "global_step": 403640, "epoch": 4863} {"train_loss": -26.32209587097168, "global_step": 403641, "epoch": 4863} {"train_loss": -26.540725708007812, "global_step": 403642, "epoch": 4863} {"train_loss": -25.81085205078125, "global_step": 403643, "epoch": 4863} {"train_loss": -26.71173667907715, "global_step": 403644, "epoch": 4863} {"train_loss": -26.40997886657715, "global_step": 403645, "epoch": 4863} {"train_loss": -26.56757164001465, "global_step": 403646, "epoch": 4863} {"train_loss": -26.405044555664062, "global_step": 403647, "epoch": 4863} {"train_loss": -26.685047149658203, "global_step": 403648, "epoch": 4863} {"train_loss": -26.829870223999023, "global_step": 403649, "epoch": 4863} {"train_loss": -26.02931022644043, "global_step": 403650, "epoch": 4863} {"train_loss": -26.784170150756836, "global_step": 403651, "epoch": 4863} {"train_loss": -26.440916061401367, "global_step": 403652, "epoch": 4863} {"train_loss": -26.57171058654785, "global_step": 403653, "epoch": 4863} {"train_loss": -26.884567260742188, "global_step": 403654, "epoch": 4863} {"train_loss": -26.1341552734375, "global_step": 403655, "epoch": 4863} {"train_loss": -26.572711944580078, "global_step": 403656, "epoch": 4863} {"train_loss": -26.446441650390625, "global_step": 403657, "epoch": 4863} {"train_loss": -26.37103843688965, "global_step": 403658, "epoch": 4863} {"train_loss": -26.774560928344727, "global_step": 403659, "epoch": 4863} {"train_loss": -26.845767974853516, "global_step": 403660, "epoch": 4863} {"train_loss": -26.5690860748291, "global_step": 403661, "epoch": 4863} {"train_loss": -26.577375411987305, "global_step": 403662, "epoch": 4863} {"train_loss": -26.565404891967773, "global_step": 403663, "epoch": 4863} {"train_loss": -26.948999404907227, "global_step": 403664, "epoch": 4863} {"train_loss": -26.577131271362305, "global_step": 403665, "epoch": 4863} {"train_loss": -26.419687271118164, "global_step": 403666, "epoch": 4863} {"train_loss": -26.935138702392578, "global_step": 403667, "epoch": 4863} {"train_loss": -26.61826515197754, "global_step": 403668, "epoch": 4863} {"train_loss": -26.772430419921875, "global_step": 403669, "epoch": 4863} {"train_loss": -27.03619956970215, "global_step": 403670, "epoch": 4863} {"train_loss": -27.151792526245117, "global_step": 403671, "epoch": 4863} {"train_loss": -26.75250244140625, "global_step": 403672, "epoch": 4863} {"train_loss": -26.461462020874023, "global_step": 403673, "epoch": 4863} {"train_loss": -26.66547966003418, "global_step": 403674, "epoch": 4863} {"train_loss": -26.74677848815918, "global_step": 403675, "epoch": 4863} {"train_loss": -26.66741371154785, "global_step": 403676, "epoch": 4863} {"train_loss": -26.716278076171875, "global_step": 403677, "epoch": 4863} {"train_loss": -26.588897705078125, "global_step": 403678, "epoch": 4863} {"train_loss": -26.7828369140625, "global_step": 403679, "epoch": 4863} {"train_loss": -26.665861129760742, "global_step": 403680, "epoch": 4863} {"train_loss": -26.8298397064209, "global_step": 403681, "epoch": 4863} {"train_loss": -26.35895347595215, "global_step": 403682, "epoch": 4863} {"train_loss": -26.89969825744629, "global_step": 403683, "epoch": 4863} {"train_loss": -26.773731231689453, "global_step": 403684, "epoch": 4863} {"train_loss": -26.490829467773438, "global_step": 403685, "epoch": 4863} {"train_loss": -26.8544864654541, "global_step": 403686, "epoch": 4863} {"train_loss": -26.576374053955078, "global_step": 403687, "epoch": 4863} {"train_loss": -26.500091552734375, "global_step": 403688, "epoch": 4863} {"train_loss": -26.85302734375, "global_step": 403689, "epoch": 4863} {"train_loss": -26.448226928710938, "global_step": 403690, "epoch": 4863} {"train_loss": -26.537158966064453, "global_step": 403691, "epoch": 4863} {"train_loss": -26.55500602722168, "global_step": 403692, "epoch": 4863} {"train_loss": -26.326038360595703, "global_step": 403693, "epoch": 4863} {"train_loss": -26.670820236206055, "global_step": 403694, "epoch": 4863} {"train_loss": -26.758060455322266, "global_step": 403695, "epoch": 4863} {"train_loss": -26.372777938842773, "global_step": 403696, "epoch": 4863} {"train_loss": -26.586706161499023, "global_step": 403697, "epoch": 4863} {"train_loss": -26.705610275268555, "global_step": 403698, "epoch": 4863} {"train_loss": -26.506864547729492, "global_step": 403699, "epoch": 4863} {"train_loss": -26.4820499420166, "global_step": 403700, "epoch": 4863} {"train_loss": -26.4196834564209, "global_step": 403701, "epoch": 4863} {"train_loss": -26.997455596923828, "global_step": 403702, "epoch": 4863} {"train_loss": -26.606964111328125, "global_step": 403703, "epoch": 4863} {"train_loss": -26.776899337768555, "global_step": 403704, "epoch": 4863} {"train_loss": -26.25799560546875, "global_step": 403705, "epoch": 4863} {"train_loss": -26.719486236572266, "global_step": 403706, "epoch": 4863} {"train_loss": -26.513702392578125, "global_step": 403707, "epoch": 4863} {"train_loss": -26.611799240112305, "global_step": 403708, "epoch": 4863} {"train_loss": -26.86224937438965, "global_step": 403709, "epoch": 4863} {"train_loss": -26.830860137939453, "global_step": 403710, "epoch": 4863} {"train_loss": -26.545601557536298, "global_step": 403711, "epoch": 4863, "val_loss": 6722743.5} {"train_loss": -26.224756240844727, "global_step": 403712, "epoch": 4864} {"train_loss": -26.472198486328125, "global_step": 403713, "epoch": 4864} {"train_loss": -25.871240615844727, "global_step": 403714, "epoch": 4864} {"train_loss": -26.2563419342041, "global_step": 403715, "epoch": 4864} {"train_loss": -26.217605590820312, "global_step": 403716, "epoch": 4864} {"train_loss": -26.2210750579834, "global_step": 403717, "epoch": 4864} {"train_loss": -26.34908103942871, "global_step": 403718, "epoch": 4864} {"train_loss": -26.565526962280273, "global_step": 403719, "epoch": 4864} {"train_loss": -26.42629051208496, "global_step": 403720, "epoch": 4864} {"train_loss": -26.062849044799805, "global_step": 403721, "epoch": 4864} {"train_loss": -26.11347770690918, "global_step": 403722, "epoch": 4864} {"train_loss": -26.345441818237305, "global_step": 403723, "epoch": 4864} {"train_loss": -26.40228271484375, "global_step": 403724, "epoch": 4864} {"train_loss": -26.229135513305664, "global_step": 403725, "epoch": 4864} {"train_loss": -26.821619033813477, "global_step": 403726, "epoch": 4864} {"train_loss": -26.3620662689209, "global_step": 403727, "epoch": 4864} {"train_loss": -26.480573654174805, "global_step": 403728, "epoch": 4864} {"train_loss": -26.4869441986084, "global_step": 403729, "epoch": 4864} {"train_loss": -26.68646812438965, "global_step": 403730, "epoch": 4864} {"train_loss": -26.298486709594727, "global_step": 403731, "epoch": 4864} {"train_loss": -26.704015731811523, "global_step": 403732, "epoch": 4864} {"train_loss": -26.629810333251953, "global_step": 403733, "epoch": 4864} {"train_loss": -26.770254135131836, "global_step": 403734, "epoch": 4864} {"train_loss": -26.6227970123291, "global_step": 403735, "epoch": 4864} {"train_loss": -26.33744239807129, "global_step": 403736, "epoch": 4864} {"train_loss": -26.4965877532959, "global_step": 403737, "epoch": 4864} {"train_loss": -26.59967613220215, "global_step": 403738, "epoch": 4864} {"train_loss": -26.875946044921875, "global_step": 403739, "epoch": 4864} {"train_loss": -26.353723526000977, "global_step": 403740, "epoch": 4864} {"train_loss": -26.807409286499023, "global_step": 403741, "epoch": 4864} {"train_loss": -26.73972511291504, "global_step": 403742, "epoch": 4864} {"train_loss": -26.371000289916992, "global_step": 403743, "epoch": 4864} {"train_loss": -26.592243194580078, "global_step": 403744, "epoch": 4864} {"train_loss": -26.824146270751953, "global_step": 403745, "epoch": 4864} {"train_loss": -26.3865909576416, "global_step": 403746, "epoch": 4864} {"train_loss": -26.45354652404785, "global_step": 403747, "epoch": 4864} {"train_loss": -26.692480087280273, "global_step": 403748, "epoch": 4864} {"train_loss": -26.696313858032227, "global_step": 403749, "epoch": 4864} {"train_loss": -26.814496994018555, "global_step": 403750, "epoch": 4864} {"train_loss": -26.708499908447266, "global_step": 403751, "epoch": 4864} {"train_loss": -26.638044357299805, "global_step": 403752, "epoch": 4864} {"train_loss": -26.502737045288086, "global_step": 403753, "epoch": 4864} {"train_loss": -26.6839542388916, "global_step": 403754, "epoch": 4864} {"train_loss": -26.681806564331055, "global_step": 403755, "epoch": 4864} {"train_loss": -26.876821517944336, "global_step": 403756, "epoch": 4864} {"train_loss": -26.290693283081055, "global_step": 403757, "epoch": 4864} {"train_loss": -26.7685546875, "global_step": 403758, "epoch": 4864} {"train_loss": -26.159048080444336, "global_step": 403759, "epoch": 4864} {"train_loss": -26.79143714904785, "global_step": 403760, "epoch": 4864} {"train_loss": -26.864728927612305, "global_step": 403761, "epoch": 4864} {"train_loss": -27.07337760925293, "global_step": 403762, "epoch": 4864} {"train_loss": -26.572179794311523, "global_step": 403763, "epoch": 4864} {"train_loss": -26.652851104736328, "global_step": 403764, "epoch": 4864} {"train_loss": -26.75191307067871, "global_step": 403765, "epoch": 4864} {"train_loss": -27.306211471557617, "global_step": 403766, "epoch": 4864} {"train_loss": -26.821884155273438, "global_step": 403767, "epoch": 4864} {"train_loss": -27.10407066345215, "global_step": 403768, "epoch": 4864} {"train_loss": -26.89191246032715, "global_step": 403769, "epoch": 4864} {"train_loss": -26.73191261291504, "global_step": 403770, "epoch": 4864} {"train_loss": -26.49264907836914, "global_step": 403771, "epoch": 4864} {"train_loss": -27.001514434814453, "global_step": 403772, "epoch": 4864} {"train_loss": -26.142780303955078, "global_step": 403773, "epoch": 4864} {"train_loss": -26.46628189086914, "global_step": 403774, "epoch": 4864} {"train_loss": -26.60914421081543, "global_step": 403775, "epoch": 4864} {"train_loss": -26.4969425201416, "global_step": 403776, "epoch": 4864} {"train_loss": -26.0892276763916, "global_step": 403777, "epoch": 4864} {"train_loss": -26.25067138671875, "global_step": 403778, "epoch": 4864} {"train_loss": -26.691755294799805, "global_step": 403779, "epoch": 4864} {"train_loss": -26.56080436706543, "global_step": 403780, "epoch": 4864} {"train_loss": -26.5572452545166, "global_step": 403781, "epoch": 4864} {"train_loss": -26.37835121154785, "global_step": 403782, "epoch": 4864} {"train_loss": -26.569677352905273, "global_step": 403783, "epoch": 4864} {"train_loss": -26.39935874938965, "global_step": 403784, "epoch": 4864} {"train_loss": -26.324731826782227, "global_step": 403785, "epoch": 4864} {"train_loss": -26.535614013671875, "global_step": 403786, "epoch": 4864} {"train_loss": -26.402515411376953, "global_step": 403787, "epoch": 4864} {"train_loss": -26.435993194580078, "global_step": 403788, "epoch": 4864} {"train_loss": -26.576353073120117, "global_step": 403789, "epoch": 4864} {"train_loss": -26.464954376220703, "global_step": 403790, "epoch": 4864} {"train_loss": -26.630903244018555, "global_step": 403791, "epoch": 4864} {"train_loss": -26.756677627563477, "global_step": 403792, "epoch": 4864} {"train_loss": -26.56818199157715, "global_step": 403793, "epoch": 4864} {"train_loss": -26.55752657694989, "global_step": 403794, "epoch": 4864, "val_loss": 6643835.0} {"train_loss": -25.783771514892578, "global_step": 403795, "epoch": 4865} {"train_loss": -25.09052085876465, "global_step": 403796, "epoch": 4865} {"train_loss": -26.389379501342773, "global_step": 403797, "epoch": 4865} {"train_loss": -25.224958419799805, "global_step": 403798, "epoch": 4865} {"train_loss": -25.52439308166504, "global_step": 403799, "epoch": 4865} {"train_loss": -26.065338134765625, "global_step": 403800, "epoch": 4865} {"train_loss": -25.574546813964844, "global_step": 403801, "epoch": 4865} {"train_loss": -26.341693878173828, "global_step": 403802, "epoch": 4865} {"train_loss": -26.185474395751953, "global_step": 403803, "epoch": 4865} {"train_loss": -25.73287010192871, "global_step": 403804, "epoch": 4865} {"train_loss": -26.559415817260742, "global_step": 403805, "epoch": 4865} {"train_loss": -25.9830265045166, "global_step": 403806, "epoch": 4865} {"train_loss": -26.167835235595703, "global_step": 403807, "epoch": 4865} {"train_loss": -26.33560562133789, "global_step": 403808, "epoch": 4865} {"train_loss": -26.566797256469727, "global_step": 403809, "epoch": 4865} {"train_loss": -26.2736759185791, "global_step": 403810, "epoch": 4865} {"train_loss": -26.38154411315918, "global_step": 403811, "epoch": 4865} {"train_loss": -26.394214630126953, "global_step": 403812, "epoch": 4865} {"train_loss": -25.938199996948242, "global_step": 403813, "epoch": 4865} {"train_loss": -26.566755294799805, "global_step": 403814, "epoch": 4865} {"train_loss": -26.489126205444336, "global_step": 403815, "epoch": 4865} {"train_loss": -26.281564712524414, "global_step": 403816, "epoch": 4865} {"train_loss": -26.185697555541992, "global_step": 403817, "epoch": 4865} {"train_loss": -26.595361709594727, "global_step": 403818, "epoch": 4865} {"train_loss": -26.391128540039062, "global_step": 403819, "epoch": 4865} {"train_loss": -26.512990951538086, "global_step": 403820, "epoch": 4865} {"train_loss": -26.278217315673828, "global_step": 403821, "epoch": 4865} {"train_loss": -26.448963165283203, "global_step": 403822, "epoch": 4865} {"train_loss": -26.646947860717773, "global_step": 403823, "epoch": 4865} {"train_loss": -25.976438522338867, "global_step": 403824, "epoch": 4865} {"train_loss": -26.94988441467285, "global_step": 403825, "epoch": 4865} {"train_loss": -26.231037139892578, "global_step": 403826, "epoch": 4865} {"train_loss": -26.748645782470703, "global_step": 403827, "epoch": 4865} {"train_loss": -26.40900993347168, "global_step": 403828, "epoch": 4865} {"train_loss": -26.725744247436523, "global_step": 403829, "epoch": 4865} {"train_loss": -26.68196678161621, "global_step": 403830, "epoch": 4865} {"train_loss": -26.925006866455078, "global_step": 403831, "epoch": 4865} {"train_loss": -26.957000732421875, "global_step": 403832, "epoch": 4865} {"train_loss": -26.847244262695312, "global_step": 403833, "epoch": 4865} {"train_loss": -26.806562423706055, "global_step": 403834, "epoch": 4865} {"train_loss": -26.906641006469727, "global_step": 403835, "epoch": 4865} {"train_loss": -26.891889572143555, "global_step": 403836, "epoch": 4865} {"train_loss": -26.592763900756836, "global_step": 403837, "epoch": 4865} {"train_loss": -26.675046920776367, "global_step": 403838, "epoch": 4865} {"train_loss": -26.764978408813477, "global_step": 403839, "epoch": 4865} {"train_loss": -26.792301177978516, "global_step": 403840, "epoch": 4865} {"train_loss": -26.996973037719727, "global_step": 403841, "epoch": 4865} {"train_loss": -26.91629981994629, "global_step": 403842, "epoch": 4865} {"train_loss": -27.093236923217773, "global_step": 403843, "epoch": 4865} {"train_loss": -26.79620933532715, "global_step": 403844, "epoch": 4865} {"train_loss": -26.78187370300293, "global_step": 403845, "epoch": 4865} {"train_loss": -26.419586181640625, "global_step": 403846, "epoch": 4865} {"train_loss": -26.748035430908203, "global_step": 403847, "epoch": 4865} {"train_loss": -26.519622802734375, "global_step": 403848, "epoch": 4865} {"train_loss": -26.72501564025879, "global_step": 403849, "epoch": 4865} {"train_loss": -26.596256256103516, "global_step": 403850, "epoch": 4865} {"train_loss": -27.099365234375, "global_step": 403851, "epoch": 4865} {"train_loss": -26.478565216064453, "global_step": 403852, "epoch": 4865} {"train_loss": -26.44167137145996, "global_step": 403853, "epoch": 4865} {"train_loss": -26.6881160736084, "global_step": 403854, "epoch": 4865} {"train_loss": -26.633115768432617, "global_step": 403855, "epoch": 4865} {"train_loss": -27.36612319946289, "global_step": 403856, "epoch": 4865} {"train_loss": -26.826391220092773, "global_step": 403857, "epoch": 4865} {"train_loss": -26.650949478149414, "global_step": 403858, "epoch": 4865} {"train_loss": -26.2320556640625, "global_step": 403859, "epoch": 4865} {"train_loss": -26.802091598510742, "global_step": 403860, "epoch": 4865} {"train_loss": -26.5983829498291, "global_step": 403861, "epoch": 4865} {"train_loss": -26.61629295349121, "global_step": 403862, "epoch": 4865} {"train_loss": -26.655410766601562, "global_step": 403863, "epoch": 4865} {"train_loss": -26.7994441986084, "global_step": 403864, "epoch": 4865} {"train_loss": -26.74207878112793, "global_step": 403865, "epoch": 4865} {"train_loss": -26.856103897094727, "global_step": 403866, "epoch": 4865} {"train_loss": -26.855224609375, "global_step": 403867, "epoch": 4865} {"train_loss": -26.886953353881836, "global_step": 403868, "epoch": 4865} {"train_loss": -26.70246696472168, "global_step": 403869, "epoch": 4865} {"train_loss": -26.597232818603516, "global_step": 403870, "epoch": 4865} {"train_loss": -26.788076400756836, "global_step": 403871, "epoch": 4865} {"train_loss": -26.961563110351562, "global_step": 403872, "epoch": 4865} {"train_loss": -26.803319931030273, "global_step": 403873, "epoch": 4865} {"train_loss": -26.85894203186035, "global_step": 403874, "epoch": 4865} {"train_loss": -26.603727340698242, "global_step": 403875, "epoch": 4865} {"train_loss": -26.3810977935791, "global_step": 403876, "epoch": 4865} {"train_loss": -26.534766461475787, "global_step": 403877, "epoch": 4865, "val_loss": 6755954.0} {"train_loss": -26.47613525390625, "global_step": 403878, "epoch": 4866} {"train_loss": -25.815671920776367, "global_step": 403879, "epoch": 4866} {"train_loss": -25.8051700592041, "global_step": 403880, "epoch": 4866} {"train_loss": -25.831266403198242, "global_step": 403881, "epoch": 4866} {"train_loss": -26.205764770507812, "global_step": 403882, "epoch": 4866} {"train_loss": -26.194196701049805, "global_step": 403883, "epoch": 4866} {"train_loss": -25.877614974975586, "global_step": 403884, "epoch": 4866} {"train_loss": -26.183252334594727, "global_step": 403885, "epoch": 4866} {"train_loss": -26.095367431640625, "global_step": 403886, "epoch": 4866} {"train_loss": -25.754669189453125, "global_step": 403887, "epoch": 4866} {"train_loss": -26.66538429260254, "global_step": 403888, "epoch": 4866} {"train_loss": -26.332555770874023, "global_step": 403889, "epoch": 4866} {"train_loss": -25.891992568969727, "global_step": 403890, "epoch": 4866} {"train_loss": -26.292387008666992, "global_step": 403891, "epoch": 4866} {"train_loss": -26.44610595703125, "global_step": 403892, "epoch": 4866} {"train_loss": -26.28937339782715, "global_step": 403893, "epoch": 4866} {"train_loss": -25.965131759643555, "global_step": 403894, "epoch": 4866} {"train_loss": -26.475622177124023, "global_step": 403895, "epoch": 4866} {"train_loss": -26.280359268188477, "global_step": 403896, "epoch": 4866} {"train_loss": -26.358905792236328, "global_step": 403897, "epoch": 4866} {"train_loss": -26.415546417236328, "global_step": 403898, "epoch": 4866} {"train_loss": -26.423852920532227, "global_step": 403899, "epoch": 4866} {"train_loss": -26.459524154663086, "global_step": 403900, "epoch": 4866} {"train_loss": -26.075788497924805, "global_step": 403901, "epoch": 4866} {"train_loss": -26.335498809814453, "global_step": 403902, "epoch": 4866} {"train_loss": -26.731201171875, "global_step": 403903, "epoch": 4866} {"train_loss": -26.58725357055664, "global_step": 403904, "epoch": 4866} {"train_loss": -26.771352767944336, "global_step": 403905, "epoch": 4866} {"train_loss": -27.022165298461914, "global_step": 403906, "epoch": 4866} {"train_loss": -26.436416625976562, "global_step": 403907, "epoch": 4866} {"train_loss": -26.693456649780273, "global_step": 403908, "epoch": 4866} {"train_loss": -26.829004287719727, "global_step": 403909, "epoch": 4866} {"train_loss": -26.585926055908203, "global_step": 403910, "epoch": 4866} {"train_loss": -26.822668075561523, "global_step": 403911, "epoch": 4866} {"train_loss": -26.89805030822754, "global_step": 403912, "epoch": 4866} {"train_loss": -26.72102165222168, "global_step": 403913, "epoch": 4866} {"train_loss": -26.52130126953125, "global_step": 403914, "epoch": 4866} {"train_loss": -26.78816032409668, "global_step": 403915, "epoch": 4866} {"train_loss": -26.671375274658203, "global_step": 403916, "epoch": 4866} {"train_loss": -26.406238555908203, "global_step": 403917, "epoch": 4866} {"train_loss": -26.45403480529785, "global_step": 403918, "epoch": 4866} {"train_loss": -26.839487075805664, "global_step": 403919, "epoch": 4866} {"train_loss": -26.678329467773438, "global_step": 403920, "epoch": 4866} {"train_loss": -26.422529220581055, "global_step": 403921, "epoch": 4866} {"train_loss": -26.85405921936035, "global_step": 403922, "epoch": 4866} {"train_loss": -26.639310836791992, "global_step": 403923, "epoch": 4866} {"train_loss": -26.772308349609375, "global_step": 403924, "epoch": 4866} {"train_loss": -26.63149070739746, "global_step": 403925, "epoch": 4866} {"train_loss": -26.466796875, "global_step": 403926, "epoch": 4866} {"train_loss": -26.449493408203125, "global_step": 403927, "epoch": 4866} {"train_loss": -26.888355255126953, "global_step": 403928, "epoch": 4866} {"train_loss": -26.63544273376465, "global_step": 403929, "epoch": 4866} {"train_loss": -26.417224884033203, "global_step": 403930, "epoch": 4866} {"train_loss": -26.74222183227539, "global_step": 403931, "epoch": 4866} {"train_loss": -26.269214630126953, "global_step": 403932, "epoch": 4866} {"train_loss": -26.358016967773438, "global_step": 403933, "epoch": 4866} {"train_loss": -26.449914932250977, "global_step": 403934, "epoch": 4866} {"train_loss": -26.357160568237305, "global_step": 403935, "epoch": 4866} {"train_loss": -26.493478775024414, "global_step": 403936, "epoch": 4866} {"train_loss": -26.109201431274414, "global_step": 403937, "epoch": 4866} {"train_loss": -26.528900146484375, "global_step": 403938, "epoch": 4866} {"train_loss": -26.7965145111084, "global_step": 403939, "epoch": 4866} {"train_loss": -26.748083114624023, "global_step": 403940, "epoch": 4866} {"train_loss": -26.552961349487305, "global_step": 403941, "epoch": 4866} {"train_loss": -26.72524070739746, "global_step": 403942, "epoch": 4866} {"train_loss": -26.822162628173828, "global_step": 403943, "epoch": 4866} {"train_loss": -26.803268432617188, "global_step": 403944, "epoch": 4866} {"train_loss": -26.457441329956055, "global_step": 403945, "epoch": 4866} {"train_loss": -26.850549697875977, "global_step": 403946, "epoch": 4866} {"train_loss": -26.649871826171875, "global_step": 403947, "epoch": 4866} {"train_loss": -26.583845138549805, "global_step": 403948, "epoch": 4866} {"train_loss": -26.842870712280273, "global_step": 403949, "epoch": 4866} {"train_loss": -26.6503849029541, "global_step": 403950, "epoch": 4866} {"train_loss": -26.997385025024414, "global_step": 403951, "epoch": 4866} {"train_loss": -26.289234161376953, "global_step": 403952, "epoch": 4866} {"train_loss": -26.741384506225586, "global_step": 403953, "epoch": 4866} {"train_loss": -26.398157119750977, "global_step": 403954, "epoch": 4866} {"train_loss": -26.69718360900879, "global_step": 403955, "epoch": 4866} {"train_loss": -26.5754337310791, "global_step": 403956, "epoch": 4866} {"train_loss": -26.58563232421875, "global_step": 403957, "epoch": 4866} {"train_loss": -26.9212703704834, "global_step": 403958, "epoch": 4866} {"train_loss": -26.6312198638916, "global_step": 403959, "epoch": 4866} {"train_loss": -26.50992878373847, "global_step": 403960, "epoch": 4866, "val_loss": 6768932.0} {"train_loss": -25.7850341796875, "global_step": 403961, "epoch": 4867} {"train_loss": -26.500595092773438, "global_step": 403962, "epoch": 4867} {"train_loss": -26.290374755859375, "global_step": 403963, "epoch": 4867} {"train_loss": -25.732440948486328, "global_step": 403964, "epoch": 4867} {"train_loss": -26.388427734375, "global_step": 403965, "epoch": 4867} {"train_loss": -25.994476318359375, "global_step": 403966, "epoch": 4867} {"train_loss": -25.82879066467285, "global_step": 403967, "epoch": 4867} {"train_loss": -26.043371200561523, "global_step": 403968, "epoch": 4867} {"train_loss": -26.423547744750977, "global_step": 403969, "epoch": 4867} {"train_loss": -26.12763023376465, "global_step": 403970, "epoch": 4867} {"train_loss": -26.424224853515625, "global_step": 403971, "epoch": 4867} {"train_loss": -26.684659957885742, "global_step": 403972, "epoch": 4867} {"train_loss": -25.705047607421875, "global_step": 403973, "epoch": 4867} {"train_loss": -26.410120010375977, "global_step": 403974, "epoch": 4867} {"train_loss": -26.0269718170166, "global_step": 403975, "epoch": 4867} {"train_loss": -26.546783447265625, "global_step": 403976, "epoch": 4867} {"train_loss": -26.208484649658203, "global_step": 403977, "epoch": 4867} {"train_loss": -26.035400390625, "global_step": 403978, "epoch": 4867} {"train_loss": -26.528684616088867, "global_step": 403979, "epoch": 4867} {"train_loss": -26.472375869750977, "global_step": 403980, "epoch": 4867} {"train_loss": -26.693771362304688, "global_step": 403981, "epoch": 4867} {"train_loss": -26.75153160095215, "global_step": 403982, "epoch": 4867} {"train_loss": -26.601682662963867, "global_step": 403983, "epoch": 4867} {"train_loss": -26.60152244567871, "global_step": 403984, "epoch": 4867} {"train_loss": -26.45283317565918, "global_step": 403985, "epoch": 4867} {"train_loss": -26.409976959228516, "global_step": 403986, "epoch": 4867} {"train_loss": -26.428030014038086, "global_step": 403987, "epoch": 4867} {"train_loss": -25.876691818237305, "global_step": 403988, "epoch": 4867} {"train_loss": -26.968597412109375, "global_step": 403989, "epoch": 4867} {"train_loss": -26.41702651977539, "global_step": 403990, "epoch": 4867} {"train_loss": -26.2547664642334, "global_step": 403991, "epoch": 4867} {"train_loss": -26.230432510375977, "global_step": 403992, "epoch": 4867} {"train_loss": -26.488452911376953, "global_step": 403993, "epoch": 4867} {"train_loss": -26.53875732421875, "global_step": 403994, "epoch": 4867} {"train_loss": -26.072463989257812, "global_step": 403995, "epoch": 4867} {"train_loss": -26.731430053710938, "global_step": 403996, "epoch": 4867} {"train_loss": -26.214147567749023, "global_step": 403997, "epoch": 4867} {"train_loss": -26.415760040283203, "global_step": 403998, "epoch": 4867} {"train_loss": -25.932950973510742, "global_step": 403999, "epoch": 4867} {"train_loss": -26.18697166442871, "global_step": 404000, "epoch": 4867} {"train_loss": -26.3791561126709, "global_step": 404001, "epoch": 4867} {"train_loss": -26.052785873413086, "global_step": 404002, "epoch": 4867} {"train_loss": -27.11025047302246, "global_step": 404003, "epoch": 4867} {"train_loss": -26.61089515686035, "global_step": 404004, "epoch": 4867} {"train_loss": -26.81279945373535, "global_step": 404005, "epoch": 4867} {"train_loss": -26.230712890625, "global_step": 404006, "epoch": 4867} {"train_loss": -26.607812881469727, "global_step": 404007, "epoch": 4867} {"train_loss": -26.6702880859375, "global_step": 404008, "epoch": 4867} {"train_loss": -26.665435791015625, "global_step": 404009, "epoch": 4867} {"train_loss": -26.62100601196289, "global_step": 404010, "epoch": 4867} {"train_loss": -26.425378799438477, "global_step": 404011, "epoch": 4867} {"train_loss": -26.886205673217773, "global_step": 404012, "epoch": 4867} {"train_loss": -26.762414932250977, "global_step": 404013, "epoch": 4867} {"train_loss": -26.586164474487305, "global_step": 404014, "epoch": 4867} {"train_loss": -26.55191421508789, "global_step": 404015, "epoch": 4867} {"train_loss": -26.35542869567871, "global_step": 404016, "epoch": 4867} {"train_loss": -26.481388092041016, "global_step": 404017, "epoch": 4867} {"train_loss": -26.827829360961914, "global_step": 404018, "epoch": 4867} {"train_loss": -26.826416015625, "global_step": 404019, "epoch": 4867} {"train_loss": -26.83294105529785, "global_step": 404020, "epoch": 4867} {"train_loss": -26.92974281311035, "global_step": 404021, "epoch": 4867} {"train_loss": -26.85648536682129, "global_step": 404022, "epoch": 4867} {"train_loss": -26.583148956298828, "global_step": 404023, "epoch": 4867} {"train_loss": -26.54550552368164, "global_step": 404024, "epoch": 4867} {"train_loss": -26.64060401916504, "global_step": 404025, "epoch": 4867} {"train_loss": -26.766376495361328, "global_step": 404026, "epoch": 4867} {"train_loss": -26.860340118408203, "global_step": 404027, "epoch": 4867} {"train_loss": -26.650928497314453, "global_step": 404028, "epoch": 4867} {"train_loss": -26.81988525390625, "global_step": 404029, "epoch": 4867} {"train_loss": -26.68507194519043, "global_step": 404030, "epoch": 4867} {"train_loss": -26.17195701599121, "global_step": 404031, "epoch": 4867} {"train_loss": -26.773656845092773, "global_step": 404032, "epoch": 4867} {"train_loss": -26.860456466674805, "global_step": 404033, "epoch": 4867} {"train_loss": -26.94268798828125, "global_step": 404034, "epoch": 4867} {"train_loss": -26.80179214477539, "global_step": 404035, "epoch": 4867} {"train_loss": -26.1223201751709, "global_step": 404036, "epoch": 4867} {"train_loss": -26.367624282836914, "global_step": 404037, "epoch": 4867} {"train_loss": -26.079992294311523, "global_step": 404038, "epoch": 4867} {"train_loss": -26.9942684173584, "global_step": 404039, "epoch": 4867} {"train_loss": -26.062646865844727, "global_step": 404040, "epoch": 4867} {"train_loss": -26.632314682006836, "global_step": 404041, "epoch": 4867} {"train_loss": -26.4404354095459, "global_step": 404042, "epoch": 4867} {"train_loss": -26.463449937751495, "global_step": 404043, "epoch": 4867, "val_loss": 6733300.5} {"train_loss": -26.16167640686035, "global_step": 404044, "epoch": 4868} {"train_loss": -26.357742309570312, "global_step": 404045, "epoch": 4868} {"train_loss": -25.71589469909668, "global_step": 404046, "epoch": 4868} {"train_loss": -26.071203231811523, "global_step": 404047, "epoch": 4868} {"train_loss": -26.467554092407227, "global_step": 404048, "epoch": 4868} {"train_loss": -26.0096378326416, "global_step": 404049, "epoch": 4868} {"train_loss": -26.10174560546875, "global_step": 404050, "epoch": 4868} {"train_loss": -25.998062133789062, "global_step": 404051, "epoch": 4868} {"train_loss": -26.392475128173828, "global_step": 404052, "epoch": 4868} {"train_loss": -25.983203887939453, "global_step": 404053, "epoch": 4868} {"train_loss": -26.372434616088867, "global_step": 404054, "epoch": 4868} {"train_loss": -25.938047409057617, "global_step": 404055, "epoch": 4868} {"train_loss": -25.9034481048584, "global_step": 404056, "epoch": 4868} {"train_loss": -26.112735748291016, "global_step": 404057, "epoch": 4868} {"train_loss": -26.154455184936523, "global_step": 404058, "epoch": 4868} {"train_loss": -26.549360275268555, "global_step": 404059, "epoch": 4868} {"train_loss": -26.404006958007812, "global_step": 404060, "epoch": 4868} {"train_loss": -26.628721237182617, "global_step": 404061, "epoch": 4868} {"train_loss": -26.307392120361328, "global_step": 404062, "epoch": 4868} {"train_loss": -26.330472946166992, "global_step": 404063, "epoch": 4868} {"train_loss": -26.278522491455078, "global_step": 404064, "epoch": 4868} {"train_loss": -26.125518798828125, "global_step": 404065, "epoch": 4868} {"train_loss": -26.18259048461914, "global_step": 404066, "epoch": 4868} {"train_loss": -26.51344108581543, "global_step": 404067, "epoch": 4868} {"train_loss": -26.361225128173828, "global_step": 404068, "epoch": 4868} {"train_loss": -26.495594024658203, "global_step": 404069, "epoch": 4868} {"train_loss": -26.796106338500977, "global_step": 404070, "epoch": 4868} {"train_loss": -26.992773056030273, "global_step": 404071, "epoch": 4868} {"train_loss": -26.279211044311523, "global_step": 404072, "epoch": 4868} {"train_loss": -26.864917755126953, "global_step": 404073, "epoch": 4868} {"train_loss": -26.705480575561523, "global_step": 404074, "epoch": 4868} {"train_loss": -26.42193603515625, "global_step": 404075, "epoch": 4868} {"train_loss": -26.38117027282715, "global_step": 404076, "epoch": 4868} {"train_loss": -26.733570098876953, "global_step": 404077, "epoch": 4868} {"train_loss": -26.806806564331055, "global_step": 404078, "epoch": 4868} {"train_loss": -26.489736557006836, "global_step": 404079, "epoch": 4868} {"train_loss": -26.431934356689453, "global_step": 404080, "epoch": 4868} {"train_loss": -26.2557430267334, "global_step": 404081, "epoch": 4868} {"train_loss": -26.71613121032715, "global_step": 404082, "epoch": 4868} {"train_loss": -26.825408935546875, "global_step": 404083, "epoch": 4868} {"train_loss": -27.170969009399414, "global_step": 404084, "epoch": 4868} {"train_loss": -26.298505783081055, "global_step": 404085, "epoch": 4868} {"train_loss": -26.39093589782715, "global_step": 404086, "epoch": 4868} {"train_loss": -26.266876220703125, "global_step": 404087, "epoch": 4868} {"train_loss": -26.5048885345459, "global_step": 404088, "epoch": 4868} {"train_loss": -26.71784782409668, "global_step": 404089, "epoch": 4868} {"train_loss": -26.896448135375977, "global_step": 404090, "epoch": 4868} {"train_loss": -26.94272804260254, "global_step": 404091, "epoch": 4868} {"train_loss": -26.786895751953125, "global_step": 404092, "epoch": 4868} {"train_loss": -27.169981002807617, "global_step": 404093, "epoch": 4868} {"train_loss": -26.980392456054688, "global_step": 404094, "epoch": 4868} {"train_loss": -26.994359970092773, "global_step": 404095, "epoch": 4868} {"train_loss": -27.073715209960938, "global_step": 404096, "epoch": 4868} {"train_loss": -26.856840133666992, "global_step": 404097, "epoch": 4868} {"train_loss": -26.977163314819336, "global_step": 404098, "epoch": 4868} {"train_loss": -26.879154205322266, "global_step": 404099, "epoch": 4868} {"train_loss": -27.087194442749023, "global_step": 404100, "epoch": 4868} {"train_loss": -26.537220001220703, "global_step": 404101, "epoch": 4868} {"train_loss": -26.682849884033203, "global_step": 404102, "epoch": 4868} {"train_loss": -27.04694175720215, "global_step": 404103, "epoch": 4868} {"train_loss": -26.769947052001953, "global_step": 404104, "epoch": 4868} {"train_loss": -26.569854736328125, "global_step": 404105, "epoch": 4868} {"train_loss": -26.97072410583496, "global_step": 404106, "epoch": 4868} {"train_loss": -26.917224884033203, "global_step": 404107, "epoch": 4868} {"train_loss": -26.636035919189453, "global_step": 404108, "epoch": 4868} {"train_loss": -26.3680477142334, "global_step": 404109, "epoch": 4868} {"train_loss": -26.983463287353516, "global_step": 404110, "epoch": 4868} {"train_loss": -26.464292526245117, "global_step": 404111, "epoch": 4868} {"train_loss": -26.35257911682129, "global_step": 404112, "epoch": 4868} {"train_loss": -26.135828018188477, "global_step": 404113, "epoch": 4868} {"train_loss": -26.22504997253418, "global_step": 404114, "epoch": 4868} {"train_loss": -26.14576530456543, "global_step": 404115, "epoch": 4868} {"train_loss": -26.62114906311035, "global_step": 404116, "epoch": 4868} {"train_loss": -26.776824951171875, "global_step": 404117, "epoch": 4868} {"train_loss": -26.07693862915039, "global_step": 404118, "epoch": 4868} {"train_loss": -26.503530502319336, "global_step": 404119, "epoch": 4868} {"train_loss": -26.261859893798828, "global_step": 404120, "epoch": 4868} {"train_loss": -26.279926300048828, "global_step": 404121, "epoch": 4868} {"train_loss": -26.51604652404785, "global_step": 404122, "epoch": 4868} {"train_loss": -26.40813636779785, "global_step": 404123, "epoch": 4868} {"train_loss": -26.459369659423828, "global_step": 404124, "epoch": 4868} {"train_loss": -26.90532875061035, "global_step": 404125, "epoch": 4868} {"train_loss": -26.519724949296698, "global_step": 404126, "epoch": 4868, "val_loss": 6756185.0} {"train_loss": -25.956724166870117, "global_step": 404127, "epoch": 4869} {"train_loss": -25.642807006835938, "global_step": 404128, "epoch": 4869} {"train_loss": -25.50226402282715, "global_step": 404129, "epoch": 4869} {"train_loss": -25.7189884185791, "global_step": 404130, "epoch": 4869} {"train_loss": -26.0742130279541, "global_step": 404131, "epoch": 4869} {"train_loss": -26.11000633239746, "global_step": 404132, "epoch": 4869} {"train_loss": -25.950632095336914, "global_step": 404133, "epoch": 4869} {"train_loss": -26.120553970336914, "global_step": 404134, "epoch": 4869} {"train_loss": -25.863666534423828, "global_step": 404135, "epoch": 4869} {"train_loss": -26.396413803100586, "global_step": 404136, "epoch": 4869} {"train_loss": -26.109281539916992, "global_step": 404137, "epoch": 4869} {"train_loss": -26.22257423400879, "global_step": 404138, "epoch": 4869} {"train_loss": -25.953638076782227, "global_step": 404139, "epoch": 4869} {"train_loss": -26.024763107299805, "global_step": 404140, "epoch": 4869} {"train_loss": -26.485807418823242, "global_step": 404141, "epoch": 4869} {"train_loss": -26.655914306640625, "global_step": 404142, "epoch": 4869} {"train_loss": -26.313013076782227, "global_step": 404143, "epoch": 4869} {"train_loss": -26.80729103088379, "global_step": 404144, "epoch": 4869} {"train_loss": -26.37727165222168, "global_step": 404145, "epoch": 4869} {"train_loss": -26.464557647705078, "global_step": 404146, "epoch": 4869} {"train_loss": -26.238428115844727, "global_step": 404147, "epoch": 4869} {"train_loss": -26.436315536499023, "global_step": 404148, "epoch": 4869} {"train_loss": -26.345508575439453, "global_step": 404149, "epoch": 4869} {"train_loss": -26.266088485717773, "global_step": 404150, "epoch": 4869} {"train_loss": -26.33698844909668, "global_step": 404151, "epoch": 4869} {"train_loss": -26.648778915405273, "global_step": 404152, "epoch": 4869} {"train_loss": -25.937665939331055, "global_step": 404153, "epoch": 4869} {"train_loss": -26.629077911376953, "global_step": 404154, "epoch": 4869} {"train_loss": -26.65352439880371, "global_step": 404155, "epoch": 4869} {"train_loss": -26.79640007019043, "global_step": 404156, "epoch": 4869} {"train_loss": -27.025360107421875, "global_step": 404157, "epoch": 4869} {"train_loss": -26.798246383666992, "global_step": 404158, "epoch": 4869} {"train_loss": -26.54298973083496, "global_step": 404159, "epoch": 4869} {"train_loss": -26.662649154663086, "global_step": 404160, "epoch": 4869} {"train_loss": -26.798009872436523, "global_step": 404161, "epoch": 4869} {"train_loss": -26.287683486938477, "global_step": 404162, "epoch": 4869} {"train_loss": -26.57200050354004, "global_step": 404163, "epoch": 4869} {"train_loss": -26.429523468017578, "global_step": 404164, "epoch": 4869} {"train_loss": -26.95806312561035, "global_step": 404165, "epoch": 4869} {"train_loss": -26.838186264038086, "global_step": 404166, "epoch": 4869} {"train_loss": -27.365320205688477, "global_step": 404167, "epoch": 4869} {"train_loss": -26.954730987548828, "global_step": 404168, "epoch": 4869} {"train_loss": -26.918481826782227, "global_step": 404169, "epoch": 4869} {"train_loss": -26.86504554748535, "global_step": 404170, "epoch": 4869} {"train_loss": -26.621143341064453, "global_step": 404171, "epoch": 4869} {"train_loss": -26.20367431640625, "global_step": 404172, "epoch": 4869} {"train_loss": -26.109647750854492, "global_step": 404173, "epoch": 4869} {"train_loss": -26.4484806060791, "global_step": 404174, "epoch": 4869} {"train_loss": -26.7824764251709, "global_step": 404175, "epoch": 4869} {"train_loss": -26.44025993347168, "global_step": 404176, "epoch": 4869} {"train_loss": -26.764007568359375, "global_step": 404177, "epoch": 4869} {"train_loss": -26.640949249267578, "global_step": 404178, "epoch": 4869} {"train_loss": -26.60993003845215, "global_step": 404179, "epoch": 4869} {"train_loss": -26.84994888305664, "global_step": 404180, "epoch": 4869} {"train_loss": -26.46822166442871, "global_step": 404181, "epoch": 4869} {"train_loss": -26.6567440032959, "global_step": 404182, "epoch": 4869} {"train_loss": -26.92710304260254, "global_step": 404183, "epoch": 4869} {"train_loss": -26.616178512573242, "global_step": 404184, "epoch": 4869} {"train_loss": -27.195581436157227, "global_step": 404185, "epoch": 4869} {"train_loss": -26.386199951171875, "global_step": 404186, "epoch": 4869} {"train_loss": -26.85194206237793, "global_step": 404187, "epoch": 4869} {"train_loss": -26.961294174194336, "global_step": 404188, "epoch": 4869} {"train_loss": -26.590713500976562, "global_step": 404189, "epoch": 4869} {"train_loss": -27.01513671875, "global_step": 404190, "epoch": 4869} {"train_loss": -26.53545570373535, "global_step": 404191, "epoch": 4869} {"train_loss": -27.10660743713379, "global_step": 404192, "epoch": 4869} {"train_loss": -26.653213500976562, "global_step": 404193, "epoch": 4869} {"train_loss": -26.80559730529785, "global_step": 404194, "epoch": 4869} {"train_loss": -26.837024688720703, "global_step": 404195, "epoch": 4869} {"train_loss": -26.367685317993164, "global_step": 404196, "epoch": 4869} {"train_loss": -26.506528854370117, "global_step": 404197, "epoch": 4869} {"train_loss": -26.455158233642578, "global_step": 404198, "epoch": 4869} {"train_loss": -26.73232078552246, "global_step": 404199, "epoch": 4869} {"train_loss": -26.23822593688965, "global_step": 404200, "epoch": 4869} {"train_loss": -26.8321533203125, "global_step": 404201, "epoch": 4869} {"train_loss": -26.69606590270996, "global_step": 404202, "epoch": 4869} {"train_loss": -26.500219345092773, "global_step": 404203, "epoch": 4869} {"train_loss": -26.7731990814209, "global_step": 404204, "epoch": 4869} {"train_loss": -26.73834800720215, "global_step": 404205, "epoch": 4869} {"train_loss": -26.696704864501953, "global_step": 404206, "epoch": 4869} {"train_loss": -26.59395408630371, "global_step": 404207, "epoch": 4869} {"train_loss": -26.82257080078125, "global_step": 404208, "epoch": 4869} {"train_loss": -26.53965446747929, "global_step": 404209, "epoch": 4869, "val_loss": 6663838.5} {"train_loss": -26.255334854125977, "global_step": 404210, "epoch": 4870} {"train_loss": -26.580738067626953, "global_step": 404211, "epoch": 4870} {"train_loss": -26.463764190673828, "global_step": 404212, "epoch": 4870} {"train_loss": -26.554349899291992, "global_step": 404213, "epoch": 4870} {"train_loss": -25.944623947143555, "global_step": 404214, "epoch": 4870} {"train_loss": -26.616443634033203, "global_step": 404215, "epoch": 4870} {"train_loss": -26.4238224029541, "global_step": 404216, "epoch": 4870} {"train_loss": -26.36481285095215, "global_step": 404217, "epoch": 4870} {"train_loss": -26.466821670532227, "global_step": 404218, "epoch": 4870} {"train_loss": -26.21497917175293, "global_step": 404219, "epoch": 4870} {"train_loss": -26.133508682250977, "global_step": 404220, "epoch": 4870} {"train_loss": -26.11248779296875, "global_step": 404221, "epoch": 4870} {"train_loss": -26.692529678344727, "global_step": 404222, "epoch": 4870} {"train_loss": -26.66022300720215, "global_step": 404223, "epoch": 4870} {"train_loss": -26.553211212158203, "global_step": 404224, "epoch": 4870} {"train_loss": -26.439701080322266, "global_step": 404225, "epoch": 4870} {"train_loss": -26.8450927734375, "global_step": 404226, "epoch": 4870} {"train_loss": -26.976110458374023, "global_step": 404227, "epoch": 4870} {"train_loss": -26.540372848510742, "global_step": 404228, "epoch": 4870} {"train_loss": -26.45147705078125, "global_step": 404229, "epoch": 4870} {"train_loss": -26.4807071685791, "global_step": 404230, "epoch": 4870} {"train_loss": -26.216354370117188, "global_step": 404231, "epoch": 4870} {"train_loss": -26.60784339904785, "global_step": 404232, "epoch": 4870} {"train_loss": -26.505569458007812, "global_step": 404233, "epoch": 4870} {"train_loss": -26.684070587158203, "global_step": 404234, "epoch": 4870} {"train_loss": -26.313581466674805, "global_step": 404235, "epoch": 4870} {"train_loss": -26.382556915283203, "global_step": 404236, "epoch": 4870} {"train_loss": -26.34847068786621, "global_step": 404237, "epoch": 4870} {"train_loss": -26.484655380249023, "global_step": 404238, "epoch": 4870} {"train_loss": -26.47690200805664, "global_step": 404239, "epoch": 4870} {"train_loss": -26.31414794921875, "global_step": 404240, "epoch": 4870} {"train_loss": -26.76996421813965, "global_step": 404241, "epoch": 4870} {"train_loss": -26.765661239624023, "global_step": 404242, "epoch": 4870} {"train_loss": -26.7702693939209, "global_step": 404243, "epoch": 4870} {"train_loss": -26.66019058227539, "global_step": 404244, "epoch": 4870} {"train_loss": -26.441083908081055, "global_step": 404245, "epoch": 4870} {"train_loss": -26.260391235351562, "global_step": 404246, "epoch": 4870} {"train_loss": -26.903966903686523, "global_step": 404247, "epoch": 4870} {"train_loss": -26.762624740600586, "global_step": 404248, "epoch": 4870} {"train_loss": -26.731128692626953, "global_step": 404249, "epoch": 4870} {"train_loss": -26.395801544189453, "global_step": 404250, "epoch": 4870} {"train_loss": -26.838773727416992, "global_step": 404251, "epoch": 4870} {"train_loss": -26.250614166259766, "global_step": 404252, "epoch": 4870} {"train_loss": -26.61781120300293, "global_step": 404253, "epoch": 4870} {"train_loss": -26.850753784179688, "global_step": 404254, "epoch": 4870} {"train_loss": -26.851184844970703, "global_step": 404255, "epoch": 4870} {"train_loss": -26.74784278869629, "global_step": 404256, "epoch": 4870} {"train_loss": -26.41896629333496, "global_step": 404257, "epoch": 4870} {"train_loss": -26.7136173248291, "global_step": 404258, "epoch": 4870} {"train_loss": -26.646207809448242, "global_step": 404259, "epoch": 4870} {"train_loss": -26.858386993408203, "global_step": 404260, "epoch": 4870} {"train_loss": -26.650060653686523, "global_step": 404261, "epoch": 4870} {"train_loss": -26.645751953125, "global_step": 404262, "epoch": 4870} {"train_loss": -26.5905704498291, "global_step": 404263, "epoch": 4870} {"train_loss": -26.57428550720215, "global_step": 404264, "epoch": 4870} {"train_loss": -26.809728622436523, "global_step": 404265, "epoch": 4870} {"train_loss": -27.222869873046875, "global_step": 404266, "epoch": 4870} {"train_loss": -27.03753089904785, "global_step": 404267, "epoch": 4870} {"train_loss": -26.887348175048828, "global_step": 404268, "epoch": 4870} {"train_loss": -26.427539825439453, "global_step": 404269, "epoch": 4870} {"train_loss": -26.194013595581055, "global_step": 404270, "epoch": 4870} {"train_loss": -26.526309967041016, "global_step": 404271, "epoch": 4870} {"train_loss": -26.55242919921875, "global_step": 404272, "epoch": 4870} {"train_loss": -27.00787353515625, "global_step": 404273, "epoch": 4870} {"train_loss": -26.538232803344727, "global_step": 404274, "epoch": 4870} {"train_loss": -26.52095603942871, "global_step": 404275, "epoch": 4870} {"train_loss": -26.24140739440918, "global_step": 404276, "epoch": 4870} {"train_loss": -26.427030563354492, "global_step": 404277, "epoch": 4870} {"train_loss": -26.7703914642334, "global_step": 404278, "epoch": 4870} {"train_loss": -26.347097396850586, "global_step": 404279, "epoch": 4870} {"train_loss": -26.435962677001953, "global_step": 404280, "epoch": 4870} {"train_loss": -26.784210205078125, "global_step": 404281, "epoch": 4870} {"train_loss": -26.71687126159668, "global_step": 404282, "epoch": 4870} {"train_loss": -26.451929092407227, "global_step": 404283, "epoch": 4870} {"train_loss": -26.6605224609375, "global_step": 404284, "epoch": 4870} {"train_loss": -26.368316650390625, "global_step": 404285, "epoch": 4870} {"train_loss": -26.49359130859375, "global_step": 404286, "epoch": 4870} {"train_loss": -26.45416259765625, "global_step": 404287, "epoch": 4870} {"train_loss": -26.54689598083496, "global_step": 404288, "epoch": 4870} {"train_loss": -26.55013084411621, "global_step": 404289, "epoch": 4870} {"train_loss": -26.911117553710938, "global_step": 404290, "epoch": 4870} {"train_loss": -26.329065322875977, "global_step": 404291, "epoch": 4870} {"train_loss": -26.561603913824243, "global_step": 404292, "epoch": 4870, "val_loss": 6739034.0} {"train_loss": -26.102941513061523, "global_step": 404293, "epoch": 4871} {"train_loss": -25.471332550048828, "global_step": 404294, "epoch": 4871} {"train_loss": -26.314844131469727, "global_step": 404295, "epoch": 4871} {"train_loss": -26.21219253540039, "global_step": 404296, "epoch": 4871} {"train_loss": -26.365951538085938, "global_step": 404297, "epoch": 4871} {"train_loss": -26.63032341003418, "global_step": 404298, "epoch": 4871} {"train_loss": -26.147815704345703, "global_step": 404299, "epoch": 4871} {"train_loss": -25.962848663330078, "global_step": 404300, "epoch": 4871} {"train_loss": -26.382043838500977, "global_step": 404301, "epoch": 4871} {"train_loss": -26.43010902404785, "global_step": 404302, "epoch": 4871} {"train_loss": -26.299230575561523, "global_step": 404303, "epoch": 4871} {"train_loss": -26.138660430908203, "global_step": 404304, "epoch": 4871} {"train_loss": -26.584308624267578, "global_step": 404305, "epoch": 4871} {"train_loss": -26.39834976196289, "global_step": 404306, "epoch": 4871} {"train_loss": -26.42740821838379, "global_step": 404307, "epoch": 4871} {"train_loss": -26.34943199157715, "global_step": 404308, "epoch": 4871} {"train_loss": -26.642194747924805, "global_step": 404309, "epoch": 4871} {"train_loss": -26.564193725585938, "global_step": 404310, "epoch": 4871} {"train_loss": -26.469228744506836, "global_step": 404311, "epoch": 4871} {"train_loss": -26.559219360351562, "global_step": 404312, "epoch": 4871} {"train_loss": -26.64752197265625, "global_step": 404313, "epoch": 4871} {"train_loss": -26.695520401000977, "global_step": 404314, "epoch": 4871} {"train_loss": -26.571142196655273, "global_step": 404315, "epoch": 4871} {"train_loss": -26.23063087463379, "global_step": 404316, "epoch": 4871} {"train_loss": -27.01218032836914, "global_step": 404317, "epoch": 4871} {"train_loss": -26.362340927124023, "global_step": 404318, "epoch": 4871} {"train_loss": -26.47572898864746, "global_step": 404319, "epoch": 4871} {"train_loss": -26.466400146484375, "global_step": 404320, "epoch": 4871} {"train_loss": -26.924909591674805, "global_step": 404321, "epoch": 4871} {"train_loss": -26.782678604125977, "global_step": 404322, "epoch": 4871} {"train_loss": -27.090341567993164, "global_step": 404323, "epoch": 4871} {"train_loss": -26.407062530517578, "global_step": 404324, "epoch": 4871} {"train_loss": -27.116785049438477, "global_step": 404325, "epoch": 4871} {"train_loss": -26.70440673828125, "global_step": 404326, "epoch": 4871} {"train_loss": -26.417926788330078, "global_step": 404327, "epoch": 4871} {"train_loss": -26.652759552001953, "global_step": 404328, "epoch": 4871} {"train_loss": -26.181798934936523, "global_step": 404329, "epoch": 4871} {"train_loss": -26.82551383972168, "global_step": 404330, "epoch": 4871} {"train_loss": -26.02560806274414, "global_step": 404331, "epoch": 4871} {"train_loss": -26.41823387145996, "global_step": 404332, "epoch": 4871} {"train_loss": -26.52554702758789, "global_step": 404333, "epoch": 4871} {"train_loss": -26.538766860961914, "global_step": 404334, "epoch": 4871} {"train_loss": -26.58699607849121, "global_step": 404335, "epoch": 4871} {"train_loss": -26.64407730102539, "global_step": 404336, "epoch": 4871} {"train_loss": -26.260211944580078, "global_step": 404337, "epoch": 4871} {"train_loss": -26.709857940673828, "global_step": 404338, "epoch": 4871} {"train_loss": -26.324731826782227, "global_step": 404339, "epoch": 4871} {"train_loss": -26.929351806640625, "global_step": 404340, "epoch": 4871} {"train_loss": -26.758264541625977, "global_step": 404341, "epoch": 4871} {"train_loss": -26.970539093017578, "global_step": 404342, "epoch": 4871} {"train_loss": -26.394947052001953, "global_step": 404343, "epoch": 4871} {"train_loss": -26.368005752563477, "global_step": 404344, "epoch": 4871} {"train_loss": -26.966135025024414, "global_step": 404345, "epoch": 4871} {"train_loss": -26.555822372436523, "global_step": 404346, "epoch": 4871} {"train_loss": -26.928226470947266, "global_step": 404347, "epoch": 4871} {"train_loss": -26.60331153869629, "global_step": 404348, "epoch": 4871} {"train_loss": -26.50124168395996, "global_step": 404349, "epoch": 4871} {"train_loss": -27.054187774658203, "global_step": 404350, "epoch": 4871} {"train_loss": -26.428333282470703, "global_step": 404351, "epoch": 4871} {"train_loss": -26.6453857421875, "global_step": 404352, "epoch": 4871} {"train_loss": -27.168350219726562, "global_step": 404353, "epoch": 4871} {"train_loss": -26.718402862548828, "global_step": 404354, "epoch": 4871} {"train_loss": -26.656158447265625, "global_step": 404355, "epoch": 4871} {"train_loss": -26.633758544921875, "global_step": 404356, "epoch": 4871} {"train_loss": -26.54489517211914, "global_step": 404357, "epoch": 4871} {"train_loss": -26.126977920532227, "global_step": 404358, "epoch": 4871} {"train_loss": -26.105396270751953, "global_step": 404359, "epoch": 4871} {"train_loss": -26.366180419921875, "global_step": 404360, "epoch": 4871} {"train_loss": -26.677825927734375, "global_step": 404361, "epoch": 4871} {"train_loss": -26.931238174438477, "global_step": 404362, "epoch": 4871} {"train_loss": -26.48158836364746, "global_step": 404363, "epoch": 4871} {"train_loss": -26.433286666870117, "global_step": 404364, "epoch": 4871} {"train_loss": -26.73885154724121, "global_step": 404365, "epoch": 4871} {"train_loss": -26.5626220703125, "global_step": 404366, "epoch": 4871} {"train_loss": -26.55525779724121, "global_step": 404367, "epoch": 4871} {"train_loss": -26.434911727905273, "global_step": 404368, "epoch": 4871} {"train_loss": -26.606155395507812, "global_step": 404369, "epoch": 4871} {"train_loss": -26.537078857421875, "global_step": 404370, "epoch": 4871} {"train_loss": -26.475051879882812, "global_step": 404371, "epoch": 4871} {"train_loss": -26.970788955688477, "global_step": 404372, "epoch": 4871} {"train_loss": -26.5075626373291, "global_step": 404373, "epoch": 4871} {"train_loss": -26.53140640258789, "global_step": 404374, "epoch": 4871} {"train_loss": -26.528696450842432, "global_step": 404375, "epoch": 4871, "val_loss": 6808107.0} {"train_loss": -26.1638126373291, "global_step": 404376, "epoch": 4872} {"train_loss": -25.741098403930664, "global_step": 404377, "epoch": 4872} {"train_loss": -26.376859664916992, "global_step": 404378, "epoch": 4872} {"train_loss": -26.3700008392334, "global_step": 404379, "epoch": 4872} {"train_loss": -25.855859756469727, "global_step": 404380, "epoch": 4872} {"train_loss": -26.05925941467285, "global_step": 404381, "epoch": 4872} {"train_loss": -25.820098876953125, "global_step": 404382, "epoch": 4872} {"train_loss": -26.4292049407959, "global_step": 404383, "epoch": 4872} {"train_loss": -26.123889923095703, "global_step": 404384, "epoch": 4872} {"train_loss": -26.72418785095215, "global_step": 404385, "epoch": 4872} {"train_loss": -26.3846435546875, "global_step": 404386, "epoch": 4872} {"train_loss": -26.3004150390625, "global_step": 404387, "epoch": 4872} {"train_loss": -26.4738712310791, "global_step": 404388, "epoch": 4872} {"train_loss": -26.204364776611328, "global_step": 404389, "epoch": 4872} {"train_loss": -25.997333526611328, "global_step": 404390, "epoch": 4872} {"train_loss": -26.620580673217773, "global_step": 404391, "epoch": 4872} {"train_loss": -26.07684898376465, "global_step": 404392, "epoch": 4872} {"train_loss": -26.713953018188477, "global_step": 404393, "epoch": 4872} {"train_loss": -26.193838119506836, "global_step": 404394, "epoch": 4872} {"train_loss": -26.521387100219727, "global_step": 404395, "epoch": 4872} {"train_loss": -26.044330596923828, "global_step": 404396, "epoch": 4872} {"train_loss": -26.761951446533203, "global_step": 404397, "epoch": 4872} {"train_loss": -26.275754928588867, "global_step": 404398, "epoch": 4872} {"train_loss": -26.25821304321289, "global_step": 404399, "epoch": 4872} {"train_loss": -26.572513580322266, "global_step": 404400, "epoch": 4872} {"train_loss": -26.406070709228516, "global_step": 404401, "epoch": 4872} {"train_loss": -26.520599365234375, "global_step": 404402, "epoch": 4872} {"train_loss": -26.755023956298828, "global_step": 404403, "epoch": 4872} {"train_loss": -26.7219295501709, "global_step": 404404, "epoch": 4872} {"train_loss": -26.144521713256836, "global_step": 404405, "epoch": 4872} {"train_loss": -26.63673210144043, "global_step": 404406, "epoch": 4872} {"train_loss": -26.854154586791992, "global_step": 404407, "epoch": 4872} {"train_loss": -27.149805068969727, "global_step": 404408, "epoch": 4872} {"train_loss": -26.783966064453125, "global_step": 404409, "epoch": 4872} {"train_loss": -26.681446075439453, "global_step": 404410, "epoch": 4872} {"train_loss": -26.940540313720703, "global_step": 404411, "epoch": 4872} {"train_loss": -26.76032829284668, "global_step": 404412, "epoch": 4872} {"train_loss": -26.57850456237793, "global_step": 404413, "epoch": 4872} {"train_loss": -26.763473510742188, "global_step": 404414, "epoch": 4872} {"train_loss": -26.97039222717285, "global_step": 404415, "epoch": 4872} {"train_loss": -26.824411392211914, "global_step": 404416, "epoch": 4872} {"train_loss": -26.940393447875977, "global_step": 404417, "epoch": 4872} {"train_loss": -26.847314834594727, "global_step": 404418, "epoch": 4872} {"train_loss": -26.807764053344727, "global_step": 404419, "epoch": 4872} {"train_loss": -26.693466186523438, "global_step": 404420, "epoch": 4872} {"train_loss": -27.125045776367188, "global_step": 404421, "epoch": 4872} {"train_loss": -26.700925827026367, "global_step": 404422, "epoch": 4872} {"train_loss": -26.702844619750977, "global_step": 404423, "epoch": 4872} {"train_loss": -27.042083740234375, "global_step": 404424, "epoch": 4872} {"train_loss": -26.73615074157715, "global_step": 404425, "epoch": 4872} {"train_loss": -26.818403244018555, "global_step": 404426, "epoch": 4872} {"train_loss": -27.24557876586914, "global_step": 404427, "epoch": 4872} {"train_loss": -26.422000885009766, "global_step": 404428, "epoch": 4872} {"train_loss": -25.946805953979492, "global_step": 404429, "epoch": 4872} {"train_loss": -26.084997177124023, "global_step": 404430, "epoch": 4872} {"train_loss": -25.928396224975586, "global_step": 404431, "epoch": 4872} {"train_loss": -25.8392276763916, "global_step": 404432, "epoch": 4872} {"train_loss": -26.564258575439453, "global_step": 404433, "epoch": 4872} {"train_loss": -26.532657623291016, "global_step": 404434, "epoch": 4872} {"train_loss": -26.432941436767578, "global_step": 404435, "epoch": 4872} {"train_loss": -26.319305419921875, "global_step": 404436, "epoch": 4872} {"train_loss": -26.48370933532715, "global_step": 404437, "epoch": 4872} {"train_loss": -26.259286880493164, "global_step": 404438, "epoch": 4872} {"train_loss": -26.714208602905273, "global_step": 404439, "epoch": 4872} {"train_loss": -26.864126205444336, "global_step": 404440, "epoch": 4872} {"train_loss": -26.620441436767578, "global_step": 404441, "epoch": 4872} {"train_loss": -26.53873062133789, "global_step": 404442, "epoch": 4872} {"train_loss": -26.7113094329834, "global_step": 404443, "epoch": 4872} {"train_loss": -26.405139923095703, "global_step": 404444, "epoch": 4872} {"train_loss": -26.527311325073242, "global_step": 404445, "epoch": 4872} {"train_loss": -26.71270179748535, "global_step": 404446, "epoch": 4872} {"train_loss": -26.91316032409668, "global_step": 404447, "epoch": 4872} {"train_loss": -26.8613224029541, "global_step": 404448, "epoch": 4872} {"train_loss": -27.01848793029785, "global_step": 404449, "epoch": 4872} {"train_loss": -26.988821029663086, "global_step": 404450, "epoch": 4872} {"train_loss": -26.590408325195312, "global_step": 404451, "epoch": 4872} {"train_loss": -27.018033981323242, "global_step": 404452, "epoch": 4872} {"train_loss": -26.70749282836914, "global_step": 404453, "epoch": 4872} {"train_loss": -26.491226196289062, "global_step": 404454, "epoch": 4872} {"train_loss": -26.566574096679688, "global_step": 404455, "epoch": 4872} {"train_loss": -26.8807315826416, "global_step": 404456, "epoch": 4872} {"train_loss": -26.831079483032227, "global_step": 404457, "epoch": 4872} {"train_loss": -26.536589450146778, "global_step": 404458, "epoch": 4872, "val_loss": 6712058.0} {"train_loss": -25.6248722076416, "global_step": 404459, "epoch": 4873} {"train_loss": -25.745161056518555, "global_step": 404460, "epoch": 4873} {"train_loss": -26.52790641784668, "global_step": 404461, "epoch": 4873} {"train_loss": -25.585124969482422, "global_step": 404462, "epoch": 4873} {"train_loss": -26.24812126159668, "global_step": 404463, "epoch": 4873} {"train_loss": -26.176807403564453, "global_step": 404464, "epoch": 4873} {"train_loss": -25.59327507019043, "global_step": 404465, "epoch": 4873} {"train_loss": -26.594085693359375, "global_step": 404466, "epoch": 4873} {"train_loss": -25.76017189025879, "global_step": 404467, "epoch": 4873} {"train_loss": -26.096216201782227, "global_step": 404468, "epoch": 4873} {"train_loss": -26.367359161376953, "global_step": 404469, "epoch": 4873} {"train_loss": -26.730915069580078, "global_step": 404470, "epoch": 4873} {"train_loss": -26.490503311157227, "global_step": 404471, "epoch": 4873} {"train_loss": -26.7096004486084, "global_step": 404472, "epoch": 4873} {"train_loss": -26.313446044921875, "global_step": 404473, "epoch": 4873} {"train_loss": -26.653614044189453, "global_step": 404474, "epoch": 4873} {"train_loss": -26.31153678894043, "global_step": 404475, "epoch": 4873} {"train_loss": -26.526172637939453, "global_step": 404476, "epoch": 4873} {"train_loss": -26.659101486206055, "global_step": 404477, "epoch": 4873} {"train_loss": -26.635793685913086, "global_step": 404478, "epoch": 4873} {"train_loss": -26.545307159423828, "global_step": 404479, "epoch": 4873} {"train_loss": -26.475589752197266, "global_step": 404480, "epoch": 4873} {"train_loss": -26.43613624572754, "global_step": 404481, "epoch": 4873} {"train_loss": -26.551603317260742, "global_step": 404482, "epoch": 4873} {"train_loss": -26.805389404296875, "global_step": 404483, "epoch": 4873} {"train_loss": -26.648900985717773, "global_step": 404484, "epoch": 4873} {"train_loss": -26.55820655822754, "global_step": 404485, "epoch": 4873} {"train_loss": -26.66961097717285, "global_step": 404486, "epoch": 4873} {"train_loss": -26.280019760131836, "global_step": 404487, "epoch": 4873} {"train_loss": -26.43136978149414, "global_step": 404488, "epoch": 4873} {"train_loss": -26.939123153686523, "global_step": 404489, "epoch": 4873} {"train_loss": -26.625720977783203, "global_step": 404490, "epoch": 4873} {"train_loss": -26.481626510620117, "global_step": 404491, "epoch": 4873} {"train_loss": -26.80637550354004, "global_step": 404492, "epoch": 4873} {"train_loss": -26.525964736938477, "global_step": 404493, "epoch": 4873} {"train_loss": -26.94569206237793, "global_step": 404494, "epoch": 4873} {"train_loss": -26.734180450439453, "global_step": 404495, "epoch": 4873} {"train_loss": -26.926023483276367, "global_step": 404496, "epoch": 4873} {"train_loss": -26.453100204467773, "global_step": 404497, "epoch": 4873} {"train_loss": -26.774566650390625, "global_step": 404498, "epoch": 4873} {"train_loss": -26.321990966796875, "global_step": 404499, "epoch": 4873} {"train_loss": -26.57086753845215, "global_step": 404500, "epoch": 4873} {"train_loss": -27.08620262145996, "global_step": 404501, "epoch": 4873} {"train_loss": -26.33428955078125, "global_step": 404502, "epoch": 4873} {"train_loss": -25.9694881439209, "global_step": 404503, "epoch": 4873} {"train_loss": -25.710912704467773, "global_step": 404504, "epoch": 4873} {"train_loss": -25.81635093688965, "global_step": 404505, "epoch": 4873} {"train_loss": -26.3551082611084, "global_step": 404506, "epoch": 4873} {"train_loss": -26.613666534423828, "global_step": 404507, "epoch": 4873} {"train_loss": -25.83203125, "global_step": 404508, "epoch": 4873} {"train_loss": -26.4354248046875, "global_step": 404509, "epoch": 4873} {"train_loss": -26.860410690307617, "global_step": 404510, "epoch": 4873} {"train_loss": -26.60353660583496, "global_step": 404511, "epoch": 4873} {"train_loss": -26.176074981689453, "global_step": 404512, "epoch": 4873} {"train_loss": -26.642786026000977, "global_step": 404513, "epoch": 4873} {"train_loss": -26.500019073486328, "global_step": 404514, "epoch": 4873} {"train_loss": -26.569854736328125, "global_step": 404515, "epoch": 4873} {"train_loss": -26.873245239257812, "global_step": 404516, "epoch": 4873} {"train_loss": -26.69097900390625, "global_step": 404517, "epoch": 4873} {"train_loss": -26.491308212280273, "global_step": 404518, "epoch": 4873} {"train_loss": -26.6320858001709, "global_step": 404519, "epoch": 4873} {"train_loss": -26.39556884765625, "global_step": 404520, "epoch": 4873} {"train_loss": -26.758087158203125, "global_step": 404521, "epoch": 4873} {"train_loss": -26.38518714904785, "global_step": 404522, "epoch": 4873} {"train_loss": -26.66668701171875, "global_step": 404523, "epoch": 4873} {"train_loss": -26.734527587890625, "global_step": 404524, "epoch": 4873} {"train_loss": -26.539520263671875, "global_step": 404525, "epoch": 4873} {"train_loss": -26.397886276245117, "global_step": 404526, "epoch": 4873} {"train_loss": -26.906997680664062, "global_step": 404527, "epoch": 4873} {"train_loss": -26.38899040222168, "global_step": 404528, "epoch": 4873} {"train_loss": -26.338226318359375, "global_step": 404529, "epoch": 4873} {"train_loss": -26.257211685180664, "global_step": 404530, "epoch": 4873} {"train_loss": -26.52052116394043, "global_step": 404531, "epoch": 4873} {"train_loss": -26.67758560180664, "global_step": 404532, "epoch": 4873} {"train_loss": -26.882770538330078, "global_step": 404533, "epoch": 4873} {"train_loss": -26.60418128967285, "global_step": 404534, "epoch": 4873} {"train_loss": -26.758756637573242, "global_step": 404535, "epoch": 4873} {"train_loss": -26.63773536682129, "global_step": 404536, "epoch": 4873} {"train_loss": -26.857519149780273, "global_step": 404537, "epoch": 4873} {"train_loss": -26.52019691467285, "global_step": 404538, "epoch": 4873} {"train_loss": -26.63300895690918, "global_step": 404539, "epoch": 4873} {"train_loss": -26.84929847717285, "global_step": 404540, "epoch": 4873} {"train_loss": -26.490027048501624, "global_step": 404541, "epoch": 4873, "val_loss": 6712618.0} {"train_loss": -25.678714752197266, "global_step": 404542, "epoch": 4874} {"train_loss": -25.12717628479004, "global_step": 404543, "epoch": 4874} {"train_loss": -25.356969833374023, "global_step": 404544, "epoch": 4874} {"train_loss": -26.29010009765625, "global_step": 404545, "epoch": 4874} {"train_loss": -26.208097457885742, "global_step": 404546, "epoch": 4874} {"train_loss": -25.628889083862305, "global_step": 404547, "epoch": 4874} {"train_loss": -26.530536651611328, "global_step": 404548, "epoch": 4874} {"train_loss": -25.994199752807617, "global_step": 404549, "epoch": 4874} {"train_loss": -26.337499618530273, "global_step": 404550, "epoch": 4874} {"train_loss": -25.78529930114746, "global_step": 404551, "epoch": 4874} {"train_loss": -26.226316452026367, "global_step": 404552, "epoch": 4874} {"train_loss": -26.33758544921875, "global_step": 404553, "epoch": 4874} {"train_loss": -26.447248458862305, "global_step": 404554, "epoch": 4874} {"train_loss": -26.1676082611084, "global_step": 404555, "epoch": 4874} {"train_loss": -26.024921417236328, "global_step": 404556, "epoch": 4874} {"train_loss": -26.430944442749023, "global_step": 404557, "epoch": 4874} {"train_loss": -25.983678817749023, "global_step": 404558, "epoch": 4874} {"train_loss": -26.403913497924805, "global_step": 404559, "epoch": 4874} {"train_loss": -26.617490768432617, "global_step": 404560, "epoch": 4874} {"train_loss": -26.3095703125, "global_step": 404561, "epoch": 4874} {"train_loss": -26.20100212097168, "global_step": 404562, "epoch": 4874} {"train_loss": -26.636728286743164, "global_step": 404563, "epoch": 4874} {"train_loss": -26.75628089904785, "global_step": 404564, "epoch": 4874} {"train_loss": -26.564199447631836, "global_step": 404565, "epoch": 4874} {"train_loss": -26.40516471862793, "global_step": 404566, "epoch": 4874} {"train_loss": -26.528451919555664, "global_step": 404567, "epoch": 4874} {"train_loss": -26.495817184448242, "global_step": 404568, "epoch": 4874} {"train_loss": -26.628931045532227, "global_step": 404569, "epoch": 4874} {"train_loss": -27.084531784057617, "global_step": 404570, "epoch": 4874} {"train_loss": -26.468076705932617, "global_step": 404571, "epoch": 4874} {"train_loss": -26.4149169921875, "global_step": 404572, "epoch": 4874} {"train_loss": -26.82965660095215, "global_step": 404573, "epoch": 4874} {"train_loss": -26.788562774658203, "global_step": 404574, "epoch": 4874} {"train_loss": -26.400482177734375, "global_step": 404575, "epoch": 4874} {"train_loss": -26.354785919189453, "global_step": 404576, "epoch": 4874} {"train_loss": -26.7171573638916, "global_step": 404577, "epoch": 4874} {"train_loss": -26.53299331665039, "global_step": 404578, "epoch": 4874} {"train_loss": -26.7321720123291, "global_step": 404579, "epoch": 4874} {"train_loss": -26.468183517456055, "global_step": 404580, "epoch": 4874} {"train_loss": -26.750608444213867, "global_step": 404581, "epoch": 4874} {"train_loss": -26.338092803955078, "global_step": 404582, "epoch": 4874} {"train_loss": -26.598669052124023, "global_step": 404583, "epoch": 4874} {"train_loss": -26.42401695251465, "global_step": 404584, "epoch": 4874} {"train_loss": -27.102277755737305, "global_step": 404585, "epoch": 4874} {"train_loss": -26.299070358276367, "global_step": 404586, "epoch": 4874} {"train_loss": -26.484708786010742, "global_step": 404587, "epoch": 4874} {"train_loss": -26.633209228515625, "global_step": 404588, "epoch": 4874} {"train_loss": -26.819202423095703, "global_step": 404589, "epoch": 4874} {"train_loss": -26.679275512695312, "global_step": 404590, "epoch": 4874} {"train_loss": -26.565427780151367, "global_step": 404591, "epoch": 4874} {"train_loss": -26.621917724609375, "global_step": 404592, "epoch": 4874} {"train_loss": -26.80963706970215, "global_step": 404593, "epoch": 4874} {"train_loss": -26.84028434753418, "global_step": 404594, "epoch": 4874} {"train_loss": -26.638341903686523, "global_step": 404595, "epoch": 4874} {"train_loss": -26.677331924438477, "global_step": 404596, "epoch": 4874} {"train_loss": -26.811376571655273, "global_step": 404597, "epoch": 4874} {"train_loss": -26.96158790588379, "global_step": 404598, "epoch": 4874} {"train_loss": -26.866352081298828, "global_step": 404599, "epoch": 4874} {"train_loss": -26.899805068969727, "global_step": 404600, "epoch": 4874} {"train_loss": -26.777103424072266, "global_step": 404601, "epoch": 4874} {"train_loss": -26.72027015686035, "global_step": 404602, "epoch": 4874} {"train_loss": -26.758359909057617, "global_step": 404603, "epoch": 4874} {"train_loss": -26.78911781311035, "global_step": 404604, "epoch": 4874} {"train_loss": -26.574289321899414, "global_step": 404605, "epoch": 4874} {"train_loss": -26.673444747924805, "global_step": 404606, "epoch": 4874} {"train_loss": -26.179895401000977, "global_step": 404607, "epoch": 4874} {"train_loss": -27.259265899658203, "global_step": 404608, "epoch": 4874} {"train_loss": -26.416797637939453, "global_step": 404609, "epoch": 4874} {"train_loss": -26.76716423034668, "global_step": 404610, "epoch": 4874} {"train_loss": -26.53900718688965, "global_step": 404611, "epoch": 4874} {"train_loss": -26.839563369750977, "global_step": 404612, "epoch": 4874} {"train_loss": -26.77394676208496, "global_step": 404613, "epoch": 4874} {"train_loss": -26.552154541015625, "global_step": 404614, "epoch": 4874} {"train_loss": -27.303892135620117, "global_step": 404615, "epoch": 4874} {"train_loss": -26.580408096313477, "global_step": 404616, "epoch": 4874} {"train_loss": -26.465286254882812, "global_step": 404617, "epoch": 4874} {"train_loss": -26.920995712280273, "global_step": 404618, "epoch": 4874} {"train_loss": -26.770233154296875, "global_step": 404619, "epoch": 4874} {"train_loss": -26.45496940612793, "global_step": 404620, "epoch": 4874} {"train_loss": -26.723876953125, "global_step": 404621, "epoch": 4874} {"train_loss": -26.623395919799805, "global_step": 404622, "epoch": 4874} {"train_loss": -27.20587158203125, "global_step": 404623, "epoch": 4874} {"train_loss": -26.52179986884795, "global_step": 404624, "epoch": 4874, "val_loss": 6722500.0} {"train_loss": -25.958251953125, "global_step": 404625, "epoch": 4875} {"train_loss": -25.197101593017578, "global_step": 404626, "epoch": 4875} {"train_loss": -26.0866641998291, "global_step": 404627, "epoch": 4875} {"train_loss": -26.168853759765625, "global_step": 404628, "epoch": 4875} {"train_loss": -25.761157989501953, "global_step": 404629, "epoch": 4875} {"train_loss": -26.145374298095703, "global_step": 404630, "epoch": 4875} {"train_loss": -25.980932235717773, "global_step": 404631, "epoch": 4875} {"train_loss": -26.14204978942871, "global_step": 404632, "epoch": 4875} {"train_loss": -25.914663314819336, "global_step": 404633, "epoch": 4875} {"train_loss": -26.422983169555664, "global_step": 404634, "epoch": 4875} {"train_loss": -26.199798583984375, "global_step": 404635, "epoch": 4875} {"train_loss": -26.408557891845703, "global_step": 404636, "epoch": 4875} {"train_loss": -26.574853897094727, "global_step": 404637, "epoch": 4875} {"train_loss": -26.455636978149414, "global_step": 404638, "epoch": 4875} {"train_loss": -26.53169059753418, "global_step": 404639, "epoch": 4875} {"train_loss": -26.255035400390625, "global_step": 404640, "epoch": 4875} {"train_loss": -26.50208854675293, "global_step": 404641, "epoch": 4875} {"train_loss": -26.377180099487305, "global_step": 404642, "epoch": 4875} {"train_loss": -26.245574951171875, "global_step": 404643, "epoch": 4875} {"train_loss": -26.258285522460938, "global_step": 404644, "epoch": 4875} {"train_loss": -26.445287704467773, "global_step": 404645, "epoch": 4875} {"train_loss": -26.345489501953125, "global_step": 404646, "epoch": 4875} {"train_loss": -26.620655059814453, "global_step": 404647, "epoch": 4875} {"train_loss": -26.815282821655273, "global_step": 404648, "epoch": 4875} {"train_loss": -26.527999877929688, "global_step": 404649, "epoch": 4875} {"train_loss": -26.90535545349121, "global_step": 404650, "epoch": 4875} {"train_loss": -26.551273345947266, "global_step": 404651, "epoch": 4875} {"train_loss": -26.83735466003418, "global_step": 404652, "epoch": 4875} {"train_loss": -26.702539443969727, "global_step": 404653, "epoch": 4875} {"train_loss": -26.4558048248291, "global_step": 404654, "epoch": 4875} {"train_loss": -26.720407485961914, "global_step": 404655, "epoch": 4875} {"train_loss": -26.818662643432617, "global_step": 404656, "epoch": 4875} {"train_loss": -26.657995223999023, "global_step": 404657, "epoch": 4875} {"train_loss": -26.992816925048828, "global_step": 404658, "epoch": 4875} {"train_loss": -26.7177791595459, "global_step": 404659, "epoch": 4875} {"train_loss": -26.615819931030273, "global_step": 404660, "epoch": 4875} {"train_loss": -27.05048179626465, "global_step": 404661, "epoch": 4875} {"train_loss": -26.89618492126465, "global_step": 404662, "epoch": 4875} {"train_loss": -26.727670669555664, "global_step": 404663, "epoch": 4875} {"train_loss": -26.7235050201416, "global_step": 404664, "epoch": 4875} {"train_loss": -26.85846519470215, "global_step": 404665, "epoch": 4875} {"train_loss": -26.678930282592773, "global_step": 404666, "epoch": 4875} {"train_loss": -26.660612106323242, "global_step": 404667, "epoch": 4875} {"train_loss": -26.385950088500977, "global_step": 404668, "epoch": 4875} {"train_loss": -26.580322265625, "global_step": 404669, "epoch": 4875} {"train_loss": -26.689777374267578, "global_step": 404670, "epoch": 4875} {"train_loss": -26.70147705078125, "global_step": 404671, "epoch": 4875} {"train_loss": -26.628767013549805, "global_step": 404672, "epoch": 4875} {"train_loss": -26.957508087158203, "global_step": 404673, "epoch": 4875} {"train_loss": -26.755041122436523, "global_step": 404674, "epoch": 4875} {"train_loss": -26.26568603515625, "global_step": 404675, "epoch": 4875} {"train_loss": -27.022199630737305, "global_step": 404676, "epoch": 4875} {"train_loss": -26.093189239501953, "global_step": 404677, "epoch": 4875} {"train_loss": -26.33338737487793, "global_step": 404678, "epoch": 4875} {"train_loss": -26.4367733001709, "global_step": 404679, "epoch": 4875} {"train_loss": -26.62885856628418, "global_step": 404680, "epoch": 4875} {"train_loss": -26.69886589050293, "global_step": 404681, "epoch": 4875} {"train_loss": -26.09320640563965, "global_step": 404682, "epoch": 4875} {"train_loss": -26.402332305908203, "global_step": 404683, "epoch": 4875} {"train_loss": -26.88983154296875, "global_step": 404684, "epoch": 4875} {"train_loss": -26.391836166381836, "global_step": 404685, "epoch": 4875} {"train_loss": -26.41257095336914, "global_step": 404686, "epoch": 4875} {"train_loss": -26.447290420532227, "global_step": 404687, "epoch": 4875} {"train_loss": -26.34991455078125, "global_step": 404688, "epoch": 4875} {"train_loss": -26.709787368774414, "global_step": 404689, "epoch": 4875} {"train_loss": -26.682910919189453, "global_step": 404690, "epoch": 4875} {"train_loss": -26.763751983642578, "global_step": 404691, "epoch": 4875} {"train_loss": -26.465116500854492, "global_step": 404692, "epoch": 4875} {"train_loss": -26.47123146057129, "global_step": 404693, "epoch": 4875} {"train_loss": -26.90093994140625, "global_step": 404694, "epoch": 4875} {"train_loss": -26.466230392456055, "global_step": 404695, "epoch": 4875} {"train_loss": -26.58683204650879, "global_step": 404696, "epoch": 4875} {"train_loss": -26.540863037109375, "global_step": 404697, "epoch": 4875} {"train_loss": -26.7613525390625, "global_step": 404698, "epoch": 4875} {"train_loss": -26.418842315673828, "global_step": 404699, "epoch": 4875} {"train_loss": -26.809356689453125, "global_step": 404700, "epoch": 4875} {"train_loss": -26.530826568603516, "global_step": 404701, "epoch": 4875} {"train_loss": -26.699827194213867, "global_step": 404702, "epoch": 4875} {"train_loss": -26.480243682861328, "global_step": 404703, "epoch": 4875} {"train_loss": -26.497272491455078, "global_step": 404704, "epoch": 4875} {"train_loss": -26.628971099853516, "global_step": 404705, "epoch": 4875} {"train_loss": -26.76898765563965, "global_step": 404706, "epoch": 4875} {"train_loss": -26.531756757253625, "global_step": 404707, "epoch": 4875, "val_loss": 6599702.0} {"train_loss": -26.154699325561523, "global_step": 404708, "epoch": 4876} {"train_loss": -26.374380111694336, "global_step": 404709, "epoch": 4876} {"train_loss": -25.934879302978516, "global_step": 404710, "epoch": 4876} {"train_loss": -25.913328170776367, "global_step": 404711, "epoch": 4876} {"train_loss": -25.794103622436523, "global_step": 404712, "epoch": 4876} {"train_loss": -25.431201934814453, "global_step": 404713, "epoch": 4876} {"train_loss": -25.8767032623291, "global_step": 404714, "epoch": 4876} {"train_loss": -26.112207412719727, "global_step": 404715, "epoch": 4876} {"train_loss": -25.301971435546875, "global_step": 404716, "epoch": 4876} {"train_loss": -26.056737899780273, "global_step": 404717, "epoch": 4876} {"train_loss": -26.338916778564453, "global_step": 404718, "epoch": 4876} {"train_loss": -25.74342155456543, "global_step": 404719, "epoch": 4876} {"train_loss": -25.981739044189453, "global_step": 404720, "epoch": 4876} {"train_loss": -26.279462814331055, "global_step": 404721, "epoch": 4876} {"train_loss": -26.043577194213867, "global_step": 404722, "epoch": 4876} {"train_loss": -26.6136474609375, "global_step": 404723, "epoch": 4876} {"train_loss": -26.229047775268555, "global_step": 404724, "epoch": 4876} {"train_loss": -26.241758346557617, "global_step": 404725, "epoch": 4876} {"train_loss": -26.313318252563477, "global_step": 404726, "epoch": 4876} {"train_loss": -26.347631454467773, "global_step": 404727, "epoch": 4876} {"train_loss": -26.268646240234375, "global_step": 404728, "epoch": 4876} {"train_loss": -26.063879013061523, "global_step": 404729, "epoch": 4876} {"train_loss": -26.671186447143555, "global_step": 404730, "epoch": 4876} {"train_loss": -26.211578369140625, "global_step": 404731, "epoch": 4876} {"train_loss": -26.42145347595215, "global_step": 404732, "epoch": 4876} {"train_loss": -26.338092803955078, "global_step": 404733, "epoch": 4876} {"train_loss": -26.576574325561523, "global_step": 404734, "epoch": 4876} {"train_loss": -26.380399703979492, "global_step": 404735, "epoch": 4876} {"train_loss": -26.2938175201416, "global_step": 404736, "epoch": 4876} {"train_loss": -26.593515396118164, "global_step": 404737, "epoch": 4876} {"train_loss": -26.397642135620117, "global_step": 404738, "epoch": 4876} {"train_loss": -26.989776611328125, "global_step": 404739, "epoch": 4876} {"train_loss": -26.692462921142578, "global_step": 404740, "epoch": 4876} {"train_loss": -26.526264190673828, "global_step": 404741, "epoch": 4876} {"train_loss": -26.848600387573242, "global_step": 404742, "epoch": 4876} {"train_loss": -26.657888412475586, "global_step": 404743, "epoch": 4876} {"train_loss": -26.452991485595703, "global_step": 404744, "epoch": 4876} {"train_loss": -26.876996994018555, "global_step": 404745, "epoch": 4876} {"train_loss": -26.733091354370117, "global_step": 404746, "epoch": 4876} {"train_loss": -26.687332153320312, "global_step": 404747, "epoch": 4876} {"train_loss": -26.7960147857666, "global_step": 404748, "epoch": 4876} {"train_loss": -26.79913902282715, "global_step": 404749, "epoch": 4876} {"train_loss": -26.932662963867188, "global_step": 404750, "epoch": 4876} {"train_loss": -26.9355525970459, "global_step": 404751, "epoch": 4876} {"train_loss": -26.913925170898438, "global_step": 404752, "epoch": 4876} {"train_loss": -26.752164840698242, "global_step": 404753, "epoch": 4876} {"train_loss": -26.510190963745117, "global_step": 404754, "epoch": 4876} {"train_loss": -26.952442169189453, "global_step": 404755, "epoch": 4876} {"train_loss": -26.94068717956543, "global_step": 404756, "epoch": 4876} {"train_loss": -26.855316162109375, "global_step": 404757, "epoch": 4876} {"train_loss": -26.68080711364746, "global_step": 404758, "epoch": 4876} {"train_loss": -26.989883422851562, "global_step": 404759, "epoch": 4876} {"train_loss": -26.47600746154785, "global_step": 404760, "epoch": 4876} {"train_loss": -27.099700927734375, "global_step": 404761, "epoch": 4876} {"train_loss": -26.77308464050293, "global_step": 404762, "epoch": 4876} {"train_loss": -26.81084632873535, "global_step": 404763, "epoch": 4876} {"train_loss": -26.516199111938477, "global_step": 404764, "epoch": 4876} {"train_loss": -26.67099380493164, "global_step": 404765, "epoch": 4876} {"train_loss": -27.21766471862793, "global_step": 404766, "epoch": 4876} {"train_loss": -26.785572052001953, "global_step": 404767, "epoch": 4876} {"train_loss": -26.571792602539062, "global_step": 404768, "epoch": 4876} {"train_loss": -27.36139488220215, "global_step": 404769, "epoch": 4876} {"train_loss": -26.948719024658203, "global_step": 404770, "epoch": 4876} {"train_loss": -26.608823776245117, "global_step": 404771, "epoch": 4876} {"train_loss": -26.794763565063477, "global_step": 404772, "epoch": 4876} {"train_loss": -26.3937931060791, "global_step": 404773, "epoch": 4876} {"train_loss": -25.326526641845703, "global_step": 404774, "epoch": 4876} {"train_loss": -25.81961441040039, "global_step": 404775, "epoch": 4876} {"train_loss": -25.472034454345703, "global_step": 404776, "epoch": 4876} {"train_loss": -26.04500389099121, "global_step": 404777, "epoch": 4876} {"train_loss": -26.5765438079834, "global_step": 404778, "epoch": 4876} {"train_loss": -26.0084285736084, "global_step": 404779, "epoch": 4876} {"train_loss": -26.134510040283203, "global_step": 404780, "epoch": 4876} {"train_loss": -26.3564453125, "global_step": 404781, "epoch": 4876} {"train_loss": -26.320173263549805, "global_step": 404782, "epoch": 4876} {"train_loss": -26.409208297729492, "global_step": 404783, "epoch": 4876} {"train_loss": -26.073169708251953, "global_step": 404784, "epoch": 4876} {"train_loss": -26.55735206604004, "global_step": 404785, "epoch": 4876} {"train_loss": -26.639636993408203, "global_step": 404786, "epoch": 4876} {"train_loss": -26.291446685791016, "global_step": 404787, "epoch": 4876} {"train_loss": -26.402307510375977, "global_step": 404788, "epoch": 4876} {"train_loss": -26.827009201049805, "global_step": 404789, "epoch": 4876} {"train_loss": -26.435931010418628, "global_step": 404790, "epoch": 4876, "val_loss": 6676404.5} {"train_loss": -26.16592788696289, "global_step": 404791, "epoch": 4877} {"train_loss": -26.509668350219727, "global_step": 404792, "epoch": 4877} {"train_loss": -26.561120986938477, "global_step": 404793, "epoch": 4877} {"train_loss": -26.392841339111328, "global_step": 404794, "epoch": 4877} {"train_loss": -26.538330078125, "global_step": 404795, "epoch": 4877} {"train_loss": -26.406171798706055, "global_step": 404796, "epoch": 4877} {"train_loss": -26.533309936523438, "global_step": 404797, "epoch": 4877} {"train_loss": -26.302167892456055, "global_step": 404798, "epoch": 4877} {"train_loss": -26.43650245666504, "global_step": 404799, "epoch": 4877} {"train_loss": -26.668964385986328, "global_step": 404800, "epoch": 4877} {"train_loss": -26.645185470581055, "global_step": 404801, "epoch": 4877} {"train_loss": -26.41033935546875, "global_step": 404802, "epoch": 4877} {"train_loss": -26.02545166015625, "global_step": 404803, "epoch": 4877} {"train_loss": -26.51043701171875, "global_step": 404804, "epoch": 4877} {"train_loss": -26.7343692779541, "global_step": 404805, "epoch": 4877} {"train_loss": -26.82404899597168, "global_step": 404806, "epoch": 4877} {"train_loss": -26.50200843811035, "global_step": 404807, "epoch": 4877} {"train_loss": -26.57770347595215, "global_step": 404808, "epoch": 4877} {"train_loss": -26.753314971923828, "global_step": 404809, "epoch": 4877} {"train_loss": -26.66385841369629, "global_step": 404810, "epoch": 4877} {"train_loss": -26.757226943969727, "global_step": 404811, "epoch": 4877} {"train_loss": -26.544727325439453, "global_step": 404812, "epoch": 4877} {"train_loss": -26.623661041259766, "global_step": 404813, "epoch": 4877} {"train_loss": -26.86626625061035, "global_step": 404814, "epoch": 4877} {"train_loss": -26.97600746154785, "global_step": 404815, "epoch": 4877} {"train_loss": -26.92083168029785, "global_step": 404816, "epoch": 4877} {"train_loss": -26.655261993408203, "global_step": 404817, "epoch": 4877} {"train_loss": -26.70344352722168, "global_step": 404818, "epoch": 4877} {"train_loss": -26.93947410583496, "global_step": 404819, "epoch": 4877} {"train_loss": -26.9379940032959, "global_step": 404820, "epoch": 4877} {"train_loss": -26.71917724609375, "global_step": 404821, "epoch": 4877} {"train_loss": -26.569501876831055, "global_step": 404822, "epoch": 4877} {"train_loss": -26.9016056060791, "global_step": 404823, "epoch": 4877} {"train_loss": -26.81575584411621, "global_step": 404824, "epoch": 4877} {"train_loss": -27.031757354736328, "global_step": 404825, "epoch": 4877} {"train_loss": -26.415790557861328, "global_step": 404826, "epoch": 4877} {"train_loss": -26.723539352416992, "global_step": 404827, "epoch": 4877} {"train_loss": -26.99495506286621, "global_step": 404828, "epoch": 4877} {"train_loss": -26.772998809814453, "global_step": 404829, "epoch": 4877} {"train_loss": -26.71211051940918, "global_step": 404830, "epoch": 4877} {"train_loss": -26.13465690612793, "global_step": 404831, "epoch": 4877} {"train_loss": -26.224380493164062, "global_step": 404832, "epoch": 4877} {"train_loss": -26.584808349609375, "global_step": 404833, "epoch": 4877} {"train_loss": -26.392850875854492, "global_step": 404834, "epoch": 4877} {"train_loss": -26.636362075805664, "global_step": 404835, "epoch": 4877} {"train_loss": -26.334455490112305, "global_step": 404836, "epoch": 4877} {"train_loss": -26.391584396362305, "global_step": 404837, "epoch": 4877} {"train_loss": -26.75458335876465, "global_step": 404838, "epoch": 4877} {"train_loss": -26.7838191986084, "global_step": 404839, "epoch": 4877} {"train_loss": -26.445343017578125, "global_step": 404840, "epoch": 4877} {"train_loss": -26.78689956665039, "global_step": 404841, "epoch": 4877} {"train_loss": -26.572555541992188, "global_step": 404842, "epoch": 4877} {"train_loss": -27.004459381103516, "global_step": 404843, "epoch": 4877} {"train_loss": -26.691823959350586, "global_step": 404844, "epoch": 4877} {"train_loss": -26.9123592376709, "global_step": 404845, "epoch": 4877} {"train_loss": -26.979312896728516, "global_step": 404846, "epoch": 4877} {"train_loss": -26.968271255493164, "global_step": 404847, "epoch": 4877} {"train_loss": -26.9104061126709, "global_step": 404848, "epoch": 4877} {"train_loss": -26.966876983642578, "global_step": 404849, "epoch": 4877} {"train_loss": -26.613256454467773, "global_step": 404850, "epoch": 4877} {"train_loss": -26.568811416625977, "global_step": 404851, "epoch": 4877} {"train_loss": -26.656396865844727, "global_step": 404852, "epoch": 4877} {"train_loss": -26.975637435913086, "global_step": 404853, "epoch": 4877} {"train_loss": -26.581445693969727, "global_step": 404854, "epoch": 4877} {"train_loss": -26.827117919921875, "global_step": 404855, "epoch": 4877} {"train_loss": -26.9327449798584, "global_step": 404856, "epoch": 4877} {"train_loss": -26.9482421875, "global_step": 404857, "epoch": 4877} {"train_loss": -26.9116153717041, "global_step": 404858, "epoch": 4877} {"train_loss": -27.342329025268555, "global_step": 404859, "epoch": 4877} {"train_loss": -26.726301193237305, "global_step": 404860, "epoch": 4877} {"train_loss": -26.7103328704834, "global_step": 404861, "epoch": 4877} {"train_loss": -27.101911544799805, "global_step": 404862, "epoch": 4877} {"train_loss": -26.7617130279541, "global_step": 404863, "epoch": 4877} {"train_loss": -26.88850212097168, "global_step": 404864, "epoch": 4877} {"train_loss": -26.4571475982666, "global_step": 404865, "epoch": 4877} {"train_loss": -26.804407119750977, "global_step": 404866, "epoch": 4877} {"train_loss": -26.560068130493164, "global_step": 404867, "epoch": 4877} {"train_loss": -26.082380294799805, "global_step": 404868, "epoch": 4877} {"train_loss": -26.601959228515625, "global_step": 404869, "epoch": 4877} {"train_loss": -26.922582626342773, "global_step": 404870, "epoch": 4877} {"train_loss": -26.78545570373535, "global_step": 404871, "epoch": 4877} {"train_loss": -26.492929458618164, "global_step": 404872, "epoch": 4877} {"train_loss": -26.67167010939265, "global_step": 404873, "epoch": 4877, "val_loss": 6624711.0} {"train_loss": -26.0069522857666, "global_step": 404874, "epoch": 4878} {"train_loss": -25.164352416992188, "global_step": 404875, "epoch": 4878} {"train_loss": -23.928518295288086, "global_step": 404876, "epoch": 4878} {"train_loss": -24.51397132873535, "global_step": 404877, "epoch": 4878} {"train_loss": -26.270496368408203, "global_step": 404878, "epoch": 4878} {"train_loss": -25.08958625793457, "global_step": 404879, "epoch": 4878} {"train_loss": -26.316394805908203, "global_step": 404880, "epoch": 4878} {"train_loss": -25.608444213867188, "global_step": 404881, "epoch": 4878} {"train_loss": -26.233844757080078, "global_step": 404882, "epoch": 4878} {"train_loss": -25.654836654663086, "global_step": 404883, "epoch": 4878} {"train_loss": -25.98211669921875, "global_step": 404884, "epoch": 4878} {"train_loss": -25.919174194335938, "global_step": 404885, "epoch": 4878} {"train_loss": -26.12967872619629, "global_step": 404886, "epoch": 4878} {"train_loss": -25.876867294311523, "global_step": 404887, "epoch": 4878} {"train_loss": -26.19329833984375, "global_step": 404888, "epoch": 4878} {"train_loss": -26.2699031829834, "global_step": 404889, "epoch": 4878} {"train_loss": -26.052900314331055, "global_step": 404890, "epoch": 4878} {"train_loss": -26.317977905273438, "global_step": 404891, "epoch": 4878} {"train_loss": -26.457305908203125, "global_step": 404892, "epoch": 4878} {"train_loss": -26.281396865844727, "global_step": 404893, "epoch": 4878} {"train_loss": -26.032989501953125, "global_step": 404894, "epoch": 4878} {"train_loss": -26.57797622680664, "global_step": 404895, "epoch": 4878} {"train_loss": -26.330198287963867, "global_step": 404896, "epoch": 4878} {"train_loss": -26.471343994140625, "global_step": 404897, "epoch": 4878} {"train_loss": -26.55280876159668, "global_step": 404898, "epoch": 4878} {"train_loss": -26.375091552734375, "global_step": 404899, "epoch": 4878} {"train_loss": -25.987186431884766, "global_step": 404900, "epoch": 4878} {"train_loss": -26.638715744018555, "global_step": 404901, "epoch": 4878} {"train_loss": -26.171070098876953, "global_step": 404902, "epoch": 4878} {"train_loss": -26.4254207611084, "global_step": 404903, "epoch": 4878} {"train_loss": -26.5673770904541, "global_step": 404904, "epoch": 4878} {"train_loss": -26.212568283081055, "global_step": 404905, "epoch": 4878} {"train_loss": -26.36634635925293, "global_step": 404906, "epoch": 4878} {"train_loss": -26.58343505859375, "global_step": 404907, "epoch": 4878} {"train_loss": -26.591068267822266, "global_step": 404908, "epoch": 4878} {"train_loss": -26.23703384399414, "global_step": 404909, "epoch": 4878} {"train_loss": -26.520490646362305, "global_step": 404910, "epoch": 4878} {"train_loss": -26.374982833862305, "global_step": 404911, "epoch": 4878} {"train_loss": -26.809656143188477, "global_step": 404912, "epoch": 4878} {"train_loss": -26.65443992614746, "global_step": 404913, "epoch": 4878} {"train_loss": -26.44595718383789, "global_step": 404914, "epoch": 4878} {"train_loss": -26.606821060180664, "global_step": 404915, "epoch": 4878} {"train_loss": -26.680774688720703, "global_step": 404916, "epoch": 4878} {"train_loss": -26.190204620361328, "global_step": 404917, "epoch": 4878} {"train_loss": -26.5548152923584, "global_step": 404918, "epoch": 4878} {"train_loss": -26.590906143188477, "global_step": 404919, "epoch": 4878} {"train_loss": -26.638090133666992, "global_step": 404920, "epoch": 4878} {"train_loss": -26.446247100830078, "global_step": 404921, "epoch": 4878} {"train_loss": -26.60369300842285, "global_step": 404922, "epoch": 4878} {"train_loss": -26.60931968688965, "global_step": 404923, "epoch": 4878} {"train_loss": -26.40445899963379, "global_step": 404924, "epoch": 4878} {"train_loss": -25.885517120361328, "global_step": 404925, "epoch": 4878} {"train_loss": -25.905094146728516, "global_step": 404926, "epoch": 4878} {"train_loss": -26.1417236328125, "global_step": 404927, "epoch": 4878} {"train_loss": -26.38262939453125, "global_step": 404928, "epoch": 4878} {"train_loss": -26.604562759399414, "global_step": 404929, "epoch": 4878} {"train_loss": -26.654016494750977, "global_step": 404930, "epoch": 4878} {"train_loss": -26.33933448791504, "global_step": 404931, "epoch": 4878} {"train_loss": -26.49261474609375, "global_step": 404932, "epoch": 4878} {"train_loss": -26.641666412353516, "global_step": 404933, "epoch": 4878} {"train_loss": -26.236066818237305, "global_step": 404934, "epoch": 4878} {"train_loss": -26.7187557220459, "global_step": 404935, "epoch": 4878} {"train_loss": -26.516767501831055, "global_step": 404936, "epoch": 4878} {"train_loss": -26.77239418029785, "global_step": 404937, "epoch": 4878} {"train_loss": -26.49772071838379, "global_step": 404938, "epoch": 4878} {"train_loss": -26.573780059814453, "global_step": 404939, "epoch": 4878} {"train_loss": -27.04876136779785, "global_step": 404940, "epoch": 4878} {"train_loss": -26.65610694885254, "global_step": 404941, "epoch": 4878} {"train_loss": -26.772485733032227, "global_step": 404942, "epoch": 4878} {"train_loss": -26.81556510925293, "global_step": 404943, "epoch": 4878} {"train_loss": -26.869291305541992, "global_step": 404944, "epoch": 4878} {"train_loss": -26.55034828186035, "global_step": 404945, "epoch": 4878} {"train_loss": -26.521747589111328, "global_step": 404946, "epoch": 4878} {"train_loss": -26.9232177734375, "global_step": 404947, "epoch": 4878} {"train_loss": -26.34712028503418, "global_step": 404948, "epoch": 4878} {"train_loss": -26.487781524658203, "global_step": 404949, "epoch": 4878} {"train_loss": -26.53040885925293, "global_step": 404950, "epoch": 4878} {"train_loss": -26.385345458984375, "global_step": 404951, "epoch": 4878} {"train_loss": -26.746389389038086, "global_step": 404952, "epoch": 4878} {"train_loss": -26.370197296142578, "global_step": 404953, "epoch": 4878} {"train_loss": -25.829456329345703, "global_step": 404954, "epoch": 4878} {"train_loss": -26.530536651611328, "global_step": 404955, "epoch": 4878} {"train_loss": -26.308590808546686, "global_step": 404956, "epoch": 4878, "val_loss": 6713840.5} {"train_loss": -25.64835548400879, "global_step": 404957, "epoch": 4879} {"train_loss": -25.86330223083496, "global_step": 404958, "epoch": 4879} {"train_loss": -26.314863204956055, "global_step": 404959, "epoch": 4879} {"train_loss": -25.859628677368164, "global_step": 404960, "epoch": 4879} {"train_loss": -26.162261962890625, "global_step": 404961, "epoch": 4879} {"train_loss": -26.517263412475586, "global_step": 404962, "epoch": 4879} {"train_loss": -26.280349731445312, "global_step": 404963, "epoch": 4879} {"train_loss": -26.073179244995117, "global_step": 404964, "epoch": 4879} {"train_loss": -26.5827579498291, "global_step": 404965, "epoch": 4879} {"train_loss": -26.278156280517578, "global_step": 404966, "epoch": 4879} {"train_loss": -26.23298454284668, "global_step": 404967, "epoch": 4879} {"train_loss": -26.498151779174805, "global_step": 404968, "epoch": 4879} {"train_loss": -26.407922744750977, "global_step": 404969, "epoch": 4879} {"train_loss": -26.527713775634766, "global_step": 404970, "epoch": 4879} {"train_loss": -26.302892684936523, "global_step": 404971, "epoch": 4879} {"train_loss": -26.233016967773438, "global_step": 404972, "epoch": 4879} {"train_loss": -26.439550399780273, "global_step": 404973, "epoch": 4879} {"train_loss": -26.030704498291016, "global_step": 404974, "epoch": 4879} {"train_loss": -26.712982177734375, "global_step": 404975, "epoch": 4879} {"train_loss": -26.621877670288086, "global_step": 404976, "epoch": 4879} {"train_loss": -26.071430206298828, "global_step": 404977, "epoch": 4879} {"train_loss": -26.45383644104004, "global_step": 404978, "epoch": 4879} {"train_loss": -26.7027645111084, "global_step": 404979, "epoch": 4879} {"train_loss": -26.389612197875977, "global_step": 404980, "epoch": 4879} {"train_loss": -26.673147201538086, "global_step": 404981, "epoch": 4879} {"train_loss": -26.555103302001953, "global_step": 404982, "epoch": 4879} {"train_loss": -26.64424705505371, "global_step": 404983, "epoch": 4879} {"train_loss": -26.77277946472168, "global_step": 404984, "epoch": 4879} {"train_loss": -26.856800079345703, "global_step": 404985, "epoch": 4879} {"train_loss": -26.705652236938477, "global_step": 404986, "epoch": 4879} {"train_loss": -26.82008171081543, "global_step": 404987, "epoch": 4879} {"train_loss": -26.388229370117188, "global_step": 404988, "epoch": 4879} {"train_loss": -26.81675148010254, "global_step": 404989, "epoch": 4879} {"train_loss": -26.600433349609375, "global_step": 404990, "epoch": 4879} {"train_loss": -26.497243881225586, "global_step": 404991, "epoch": 4879} {"train_loss": -26.38178062438965, "global_step": 404992, "epoch": 4879} {"train_loss": -26.891077041625977, "global_step": 404993, "epoch": 4879} {"train_loss": -27.203384399414062, "global_step": 404994, "epoch": 4879} {"train_loss": -26.737476348876953, "global_step": 404995, "epoch": 4879} {"train_loss": -26.761219024658203, "global_step": 404996, "epoch": 4879} {"train_loss": -27.035398483276367, "global_step": 404997, "epoch": 4879} {"train_loss": -26.614389419555664, "global_step": 404998, "epoch": 4879} {"train_loss": -26.44293785095215, "global_step": 404999, "epoch": 4879} {"train_loss": -26.62986183166504, "global_step": 405000, "epoch": 4879} {"train_loss": -26.7390079498291, "global_step": 405001, "epoch": 4879} {"train_loss": -26.86753273010254, "global_step": 405002, "epoch": 4879} {"train_loss": -26.612518310546875, "global_step": 405003, "epoch": 4879} {"train_loss": -26.535614013671875, "global_step": 405004, "epoch": 4879} {"train_loss": -26.475461959838867, "global_step": 405005, "epoch": 4879} {"train_loss": -26.649097442626953, "global_step": 405006, "epoch": 4879} {"train_loss": -26.594614028930664, "global_step": 405007, "epoch": 4879} {"train_loss": -26.867965698242188, "global_step": 405008, "epoch": 4879} {"train_loss": -26.585189819335938, "global_step": 405009, "epoch": 4879} {"train_loss": -26.80149269104004, "global_step": 405010, "epoch": 4879} {"train_loss": -26.76299476623535, "global_step": 405011, "epoch": 4879} {"train_loss": -26.837295532226562, "global_step": 405012, "epoch": 4879} {"train_loss": -26.98976707458496, "global_step": 405013, "epoch": 4879} {"train_loss": -26.93576431274414, "global_step": 405014, "epoch": 4879} {"train_loss": -26.872201919555664, "global_step": 405015, "epoch": 4879} {"train_loss": -26.468109130859375, "global_step": 405016, "epoch": 4879} {"train_loss": -26.76649284362793, "global_step": 405017, "epoch": 4879} {"train_loss": -26.63677406311035, "global_step": 405018, "epoch": 4879} {"train_loss": -26.952564239501953, "global_step": 405019, "epoch": 4879} {"train_loss": -26.992979049682617, "global_step": 405020, "epoch": 4879} {"train_loss": -26.8632869720459, "global_step": 405021, "epoch": 4879} {"train_loss": -26.973886489868164, "global_step": 405022, "epoch": 4879} {"train_loss": -26.829788208007812, "global_step": 405023, "epoch": 4879} {"train_loss": -26.877676010131836, "global_step": 405024, "epoch": 4879} {"train_loss": -26.869674682617188, "global_step": 405025, "epoch": 4879} {"train_loss": -27.21114158630371, "global_step": 405026, "epoch": 4879} {"train_loss": -26.5657958984375, "global_step": 405027, "epoch": 4879} {"train_loss": -26.719806671142578, "global_step": 405028, "epoch": 4879} {"train_loss": -26.93792724609375, "global_step": 405029, "epoch": 4879} {"train_loss": -26.469867706298828, "global_step": 405030, "epoch": 4879} {"train_loss": -27.07891845703125, "global_step": 405031, "epoch": 4879} {"train_loss": -26.95564079284668, "global_step": 405032, "epoch": 4879} {"train_loss": -26.707138061523438, "global_step": 405033, "epoch": 4879} {"train_loss": -26.71658706665039, "global_step": 405034, "epoch": 4879} {"train_loss": -26.53803825378418, "global_step": 405035, "epoch": 4879} {"train_loss": -26.915525436401367, "global_step": 405036, "epoch": 4879} {"train_loss": -26.724130630493164, "global_step": 405037, "epoch": 4879} {"train_loss": -27.02790641784668, "global_step": 405038, "epoch": 4879} {"train_loss": -26.592794188533922, "global_step": 405039, "epoch": 4879, "val_loss": 6729547.0} {"train_loss": -26.44705581665039, "global_step": 405040, "epoch": 4880} {"train_loss": -26.6693115234375, "global_step": 405041, "epoch": 4880} {"train_loss": -26.141992568969727, "global_step": 405042, "epoch": 4880} {"train_loss": -26.80342674255371, "global_step": 405043, "epoch": 4880} {"train_loss": -26.266342163085938, "global_step": 405044, "epoch": 4880} {"train_loss": -26.545978546142578, "global_step": 405045, "epoch": 4880} {"train_loss": -26.603723526000977, "global_step": 405046, "epoch": 4880} {"train_loss": -26.463623046875, "global_step": 405047, "epoch": 4880} {"train_loss": -26.39027976989746, "global_step": 405048, "epoch": 4880} {"train_loss": -26.08527946472168, "global_step": 405049, "epoch": 4880} {"train_loss": -26.17716407775879, "global_step": 405050, "epoch": 4880} {"train_loss": -26.565631866455078, "global_step": 405051, "epoch": 4880} {"train_loss": -26.838438034057617, "global_step": 405052, "epoch": 4880} {"train_loss": -26.924030303955078, "global_step": 405053, "epoch": 4880} {"train_loss": -26.37127113342285, "global_step": 405054, "epoch": 4880} {"train_loss": -26.38800621032715, "global_step": 405055, "epoch": 4880} {"train_loss": -26.655874252319336, "global_step": 405056, "epoch": 4880} {"train_loss": -26.725650787353516, "global_step": 405057, "epoch": 4880} {"train_loss": -26.04852294921875, "global_step": 405058, "epoch": 4880} {"train_loss": -26.320316314697266, "global_step": 405059, "epoch": 4880} {"train_loss": -26.778905868530273, "global_step": 405060, "epoch": 4880} {"train_loss": -26.17207908630371, "global_step": 405061, "epoch": 4880} {"train_loss": -26.311140060424805, "global_step": 405062, "epoch": 4880} {"train_loss": -26.82537841796875, "global_step": 405063, "epoch": 4880} {"train_loss": -26.655603408813477, "global_step": 405064, "epoch": 4880} {"train_loss": -26.77585220336914, "global_step": 405065, "epoch": 4880} {"train_loss": -26.339447021484375, "global_step": 405066, "epoch": 4880} {"train_loss": -26.481887817382812, "global_step": 405067, "epoch": 4880} {"train_loss": -26.70692253112793, "global_step": 405068, "epoch": 4880} {"train_loss": -26.501371383666992, "global_step": 405069, "epoch": 4880} {"train_loss": -26.574447631835938, "global_step": 405070, "epoch": 4880} {"train_loss": -26.53011131286621, "global_step": 405071, "epoch": 4880} {"train_loss": -26.53138542175293, "global_step": 405072, "epoch": 4880} {"train_loss": -26.807632446289062, "global_step": 405073, "epoch": 4880} {"train_loss": -26.685394287109375, "global_step": 405074, "epoch": 4880} {"train_loss": -26.83074951171875, "global_step": 405075, "epoch": 4880} {"train_loss": -26.699298858642578, "global_step": 405076, "epoch": 4880} {"train_loss": -26.88228416442871, "global_step": 405077, "epoch": 4880} {"train_loss": -26.929357528686523, "global_step": 405078, "epoch": 4880} {"train_loss": -26.64314079284668, "global_step": 405079, "epoch": 4880} {"train_loss": -26.858091354370117, "global_step": 405080, "epoch": 4880} {"train_loss": -26.59882164001465, "global_step": 405081, "epoch": 4880} {"train_loss": -26.5181941986084, "global_step": 405082, "epoch": 4880} {"train_loss": -26.947265625, "global_step": 405083, "epoch": 4880} {"train_loss": -26.743383407592773, "global_step": 405084, "epoch": 4880} {"train_loss": -26.597213745117188, "global_step": 405085, "epoch": 4880} {"train_loss": -26.692487716674805, "global_step": 405086, "epoch": 4880} {"train_loss": -26.51236343383789, "global_step": 405087, "epoch": 4880} {"train_loss": -26.984399795532227, "global_step": 405088, "epoch": 4880} {"train_loss": -26.66458511352539, "global_step": 405089, "epoch": 4880} {"train_loss": -26.41155433654785, "global_step": 405090, "epoch": 4880} {"train_loss": -26.598005294799805, "global_step": 405091, "epoch": 4880} {"train_loss": -27.171110153198242, "global_step": 405092, "epoch": 4880} {"train_loss": -26.93964195251465, "global_step": 405093, "epoch": 4880} {"train_loss": -26.605634689331055, "global_step": 405094, "epoch": 4880} {"train_loss": -26.880407333374023, "global_step": 405095, "epoch": 4880} {"train_loss": -26.749958038330078, "global_step": 405096, "epoch": 4880} {"train_loss": -26.930328369140625, "global_step": 405097, "epoch": 4880} {"train_loss": -27.19915199279785, "global_step": 405098, "epoch": 4880} {"train_loss": -26.5892391204834, "global_step": 405099, "epoch": 4880} {"train_loss": -26.3057804107666, "global_step": 405100, "epoch": 4880} {"train_loss": -26.238794326782227, "global_step": 405101, "epoch": 4880} {"train_loss": -25.917261123657227, "global_step": 405102, "epoch": 4880} {"train_loss": -26.392385482788086, "global_step": 405103, "epoch": 4880} {"train_loss": -26.856786727905273, "global_step": 405104, "epoch": 4880} {"train_loss": -26.44475746154785, "global_step": 405105, "epoch": 4880} {"train_loss": -26.272674560546875, "global_step": 405106, "epoch": 4880} {"train_loss": -26.359724044799805, "global_step": 405107, "epoch": 4880} {"train_loss": -26.370010375976562, "global_step": 405108, "epoch": 4880} {"train_loss": -26.51801872253418, "global_step": 405109, "epoch": 4880} {"train_loss": -26.465368270874023, "global_step": 405110, "epoch": 4880} {"train_loss": -26.643186569213867, "global_step": 405111, "epoch": 4880} {"train_loss": -26.407318115234375, "global_step": 405112, "epoch": 4880} {"train_loss": -26.414831161499023, "global_step": 405113, "epoch": 4880} {"train_loss": -26.87156105041504, "global_step": 405114, "epoch": 4880} {"train_loss": -26.30146598815918, "global_step": 405115, "epoch": 4880} {"train_loss": -26.69940757751465, "global_step": 405116, "epoch": 4880} {"train_loss": -26.81305503845215, "global_step": 405117, "epoch": 4880} {"train_loss": -26.440359115600586, "global_step": 405118, "epoch": 4880} {"train_loss": -26.541189193725586, "global_step": 405119, "epoch": 4880} {"train_loss": -27.081134796142578, "global_step": 405120, "epoch": 4880} {"train_loss": -26.36512565612793, "global_step": 405121, "epoch": 4880} {"train_loss": -26.584901028368847, "global_step": 405122, "epoch": 4880, "val_loss": 6738483.0} {"train_loss": -25.623016357421875, "global_step": 405123, "epoch": 4881} {"train_loss": -25.509002685546875, "global_step": 405124, "epoch": 4881} {"train_loss": -25.28685188293457, "global_step": 405125, "epoch": 4881} {"train_loss": -26.181655883789062, "global_step": 405126, "epoch": 4881} {"train_loss": -25.666685104370117, "global_step": 405127, "epoch": 4881} {"train_loss": -25.816776275634766, "global_step": 405128, "epoch": 4881} {"train_loss": -26.194005966186523, "global_step": 405129, "epoch": 4881} {"train_loss": -26.17168617248535, "global_step": 405130, "epoch": 4881} {"train_loss": -26.155893325805664, "global_step": 405131, "epoch": 4881} {"train_loss": -26.350494384765625, "global_step": 405132, "epoch": 4881} {"train_loss": -25.889053344726562, "global_step": 405133, "epoch": 4881} {"train_loss": -26.06868553161621, "global_step": 405134, "epoch": 4881} {"train_loss": -25.960742950439453, "global_step": 405135, "epoch": 4881} {"train_loss": -26.338165283203125, "global_step": 405136, "epoch": 4881} {"train_loss": -26.314977645874023, "global_step": 405137, "epoch": 4881} {"train_loss": -26.34662437438965, "global_step": 405138, "epoch": 4881} {"train_loss": -26.686094284057617, "global_step": 405139, "epoch": 4881} {"train_loss": -25.988428115844727, "global_step": 405140, "epoch": 4881} {"train_loss": -26.22690773010254, "global_step": 405141, "epoch": 4881} {"train_loss": -26.61004066467285, "global_step": 405142, "epoch": 4881} {"train_loss": -26.437299728393555, "global_step": 405143, "epoch": 4881} {"train_loss": -26.209558486938477, "global_step": 405144, "epoch": 4881} {"train_loss": -26.3394775390625, "global_step": 405145, "epoch": 4881} {"train_loss": -26.18819236755371, "global_step": 405146, "epoch": 4881} {"train_loss": -26.76917839050293, "global_step": 405147, "epoch": 4881} {"train_loss": -26.15382194519043, "global_step": 405148, "epoch": 4881} {"train_loss": -26.389219284057617, "global_step": 405149, "epoch": 4881} {"train_loss": -26.513046264648438, "global_step": 405150, "epoch": 4881} {"train_loss": -26.85407066345215, "global_step": 405151, "epoch": 4881} {"train_loss": -26.557117462158203, "global_step": 405152, "epoch": 4881} {"train_loss": -27.02271842956543, "global_step": 405153, "epoch": 4881} {"train_loss": -26.9764404296875, "global_step": 405154, "epoch": 4881} {"train_loss": -26.42058753967285, "global_step": 405155, "epoch": 4881} {"train_loss": -26.635557174682617, "global_step": 405156, "epoch": 4881} {"train_loss": -27.045429229736328, "global_step": 405157, "epoch": 4881} {"train_loss": -26.578907012939453, "global_step": 405158, "epoch": 4881} {"train_loss": -26.540180206298828, "global_step": 405159, "epoch": 4881} {"train_loss": -26.747547149658203, "global_step": 405160, "epoch": 4881} {"train_loss": -26.958057403564453, "global_step": 405161, "epoch": 4881} {"train_loss": -26.90156364440918, "global_step": 405162, "epoch": 4881} {"train_loss": -26.576650619506836, "global_step": 405163, "epoch": 4881} {"train_loss": -26.657617568969727, "global_step": 405164, "epoch": 4881} {"train_loss": -26.3471622467041, "global_step": 405165, "epoch": 4881} {"train_loss": -26.485498428344727, "global_step": 405166, "epoch": 4881} {"train_loss": -26.790699005126953, "global_step": 405167, "epoch": 4881} {"train_loss": -26.637014389038086, "global_step": 405168, "epoch": 4881} {"train_loss": -26.693023681640625, "global_step": 405169, "epoch": 4881} {"train_loss": -26.471851348876953, "global_step": 405170, "epoch": 4881} {"train_loss": -26.324621200561523, "global_step": 405171, "epoch": 4881} {"train_loss": -27.002593994140625, "global_step": 405172, "epoch": 4881} {"train_loss": -26.5642147064209, "global_step": 405173, "epoch": 4881} {"train_loss": -26.295822143554688, "global_step": 405174, "epoch": 4881} {"train_loss": -26.448776245117188, "global_step": 405175, "epoch": 4881} {"train_loss": -27.0098876953125, "global_step": 405176, "epoch": 4881} {"train_loss": -26.578113555908203, "global_step": 405177, "epoch": 4881} {"train_loss": -26.6223087310791, "global_step": 405178, "epoch": 4881} {"train_loss": -26.610517501831055, "global_step": 405179, "epoch": 4881} {"train_loss": -26.701025009155273, "global_step": 405180, "epoch": 4881} {"train_loss": -26.470367431640625, "global_step": 405181, "epoch": 4881} {"train_loss": -26.36286735534668, "global_step": 405182, "epoch": 4881} {"train_loss": -26.895593643188477, "global_step": 405183, "epoch": 4881} {"train_loss": -26.744709014892578, "global_step": 405184, "epoch": 4881} {"train_loss": -26.844924926757812, "global_step": 405185, "epoch": 4881} {"train_loss": -26.738256454467773, "global_step": 405186, "epoch": 4881} {"train_loss": -26.301671981811523, "global_step": 405187, "epoch": 4881} {"train_loss": -26.578643798828125, "global_step": 405188, "epoch": 4881} {"train_loss": -26.073089599609375, "global_step": 405189, "epoch": 4881} {"train_loss": -26.653884887695312, "global_step": 405190, "epoch": 4881} {"train_loss": -26.871784210205078, "global_step": 405191, "epoch": 4881} {"train_loss": -26.642654418945312, "global_step": 405192, "epoch": 4881} {"train_loss": -26.092975616455078, "global_step": 405193, "epoch": 4881} {"train_loss": -26.730289459228516, "global_step": 405194, "epoch": 4881} {"train_loss": -26.610761642456055, "global_step": 405195, "epoch": 4881} {"train_loss": -26.33539390563965, "global_step": 405196, "epoch": 4881} {"train_loss": -26.889707565307617, "global_step": 405197, "epoch": 4881} {"train_loss": -26.873584747314453, "global_step": 405198, "epoch": 4881} {"train_loss": -26.882205963134766, "global_step": 405199, "epoch": 4881} {"train_loss": -26.906667709350586, "global_step": 405200, "epoch": 4881} {"train_loss": -26.521799087524414, "global_step": 405201, "epoch": 4881} {"train_loss": -27.0017032623291, "global_step": 405202, "epoch": 4881} {"train_loss": -26.398252487182617, "global_step": 405203, "epoch": 4881} {"train_loss": -26.547317504882812, "global_step": 405204, "epoch": 4881} {"train_loss": -26.488081851637507, "global_step": 405205, "epoch": 4881, "val_loss": 6697506.0} {"train_loss": -25.6934814453125, "global_step": 405206, "epoch": 4882} {"train_loss": -27.07448387145996, "global_step": 405207, "epoch": 4882} {"train_loss": -26.151884078979492, "global_step": 405208, "epoch": 4882} {"train_loss": -26.416259765625, "global_step": 405209, "epoch": 4882} {"train_loss": -26.00453758239746, "global_step": 405210, "epoch": 4882} {"train_loss": -26.478540420532227, "global_step": 405211, "epoch": 4882} {"train_loss": -26.254852294921875, "global_step": 405212, "epoch": 4882} {"train_loss": -26.537145614624023, "global_step": 405213, "epoch": 4882} {"train_loss": -26.14178466796875, "global_step": 405214, "epoch": 4882} {"train_loss": -26.568042755126953, "global_step": 405215, "epoch": 4882} {"train_loss": -26.67728614807129, "global_step": 405216, "epoch": 4882} {"train_loss": -26.647266387939453, "global_step": 405217, "epoch": 4882} {"train_loss": -26.503503799438477, "global_step": 405218, "epoch": 4882} {"train_loss": -26.704023361206055, "global_step": 405219, "epoch": 4882} {"train_loss": -26.595746994018555, "global_step": 405220, "epoch": 4882} {"train_loss": -26.738615036010742, "global_step": 405221, "epoch": 4882} {"train_loss": -26.429685592651367, "global_step": 405222, "epoch": 4882} {"train_loss": -26.668537139892578, "global_step": 405223, "epoch": 4882} {"train_loss": -26.679168701171875, "global_step": 405224, "epoch": 4882} {"train_loss": -26.225805282592773, "global_step": 405225, "epoch": 4882} {"train_loss": -26.71469497680664, "global_step": 405226, "epoch": 4882} {"train_loss": -27.099475860595703, "global_step": 405227, "epoch": 4882} {"train_loss": -26.90056800842285, "global_step": 405228, "epoch": 4882} {"train_loss": -26.593557357788086, "global_step": 405229, "epoch": 4882} {"train_loss": -26.43686294555664, "global_step": 405230, "epoch": 4882} {"train_loss": -26.52105140686035, "global_step": 405231, "epoch": 4882} {"train_loss": -27.003076553344727, "global_step": 405232, "epoch": 4882} {"train_loss": -26.491804122924805, "global_step": 405233, "epoch": 4882} {"train_loss": -26.617633819580078, "global_step": 405234, "epoch": 4882} {"train_loss": -26.584253311157227, "global_step": 405235, "epoch": 4882} {"train_loss": -26.80973243713379, "global_step": 405236, "epoch": 4882} {"train_loss": -26.669370651245117, "global_step": 405237, "epoch": 4882} {"train_loss": -26.533613204956055, "global_step": 405238, "epoch": 4882} {"train_loss": -26.522546768188477, "global_step": 405239, "epoch": 4882} {"train_loss": -26.776966094970703, "global_step": 405240, "epoch": 4882} {"train_loss": -26.571542739868164, "global_step": 405241, "epoch": 4882} {"train_loss": -26.711551666259766, "global_step": 405242, "epoch": 4882} {"train_loss": -26.7718563079834, "global_step": 405243, "epoch": 4882} {"train_loss": -26.674301147460938, "global_step": 405244, "epoch": 4882} {"train_loss": -26.43439292907715, "global_step": 405245, "epoch": 4882} {"train_loss": -26.814929962158203, "global_step": 405246, "epoch": 4882} {"train_loss": -26.835651397705078, "global_step": 405247, "epoch": 4882} {"train_loss": -26.6219482421875, "global_step": 405248, "epoch": 4882} {"train_loss": -26.225934982299805, "global_step": 405249, "epoch": 4882} {"train_loss": -26.918426513671875, "global_step": 405250, "epoch": 4882} {"train_loss": -26.634418487548828, "global_step": 405251, "epoch": 4882} {"train_loss": -27.00390625, "global_step": 405252, "epoch": 4882} {"train_loss": -26.919784545898438, "global_step": 405253, "epoch": 4882} {"train_loss": -26.642560958862305, "global_step": 405254, "epoch": 4882} {"train_loss": -26.729379653930664, "global_step": 405255, "epoch": 4882} {"train_loss": -26.67131996154785, "global_step": 405256, "epoch": 4882} {"train_loss": -26.974924087524414, "global_step": 405257, "epoch": 4882} {"train_loss": -26.827726364135742, "global_step": 405258, "epoch": 4882} {"train_loss": -26.732152938842773, "global_step": 405259, "epoch": 4882} {"train_loss": -26.48431968688965, "global_step": 405260, "epoch": 4882} {"train_loss": -26.707077026367188, "global_step": 405261, "epoch": 4882} {"train_loss": -26.373991012573242, "global_step": 405262, "epoch": 4882} {"train_loss": -27.01702308654785, "global_step": 405263, "epoch": 4882} {"train_loss": -26.61805534362793, "global_step": 405264, "epoch": 4882} {"train_loss": -26.453189849853516, "global_step": 405265, "epoch": 4882} {"train_loss": -26.949615478515625, "global_step": 405266, "epoch": 4882} {"train_loss": -26.6002254486084, "global_step": 405267, "epoch": 4882} {"train_loss": -26.412460327148438, "global_step": 405268, "epoch": 4882} {"train_loss": -26.830780029296875, "global_step": 405269, "epoch": 4882} {"train_loss": -26.415063858032227, "global_step": 405270, "epoch": 4882} {"train_loss": -26.40626335144043, "global_step": 405271, "epoch": 4882} {"train_loss": -26.351947784423828, "global_step": 405272, "epoch": 4882} {"train_loss": -27.053003311157227, "global_step": 405273, "epoch": 4882} {"train_loss": -26.488439559936523, "global_step": 405274, "epoch": 4882} {"train_loss": -26.766935348510742, "global_step": 405275, "epoch": 4882} {"train_loss": -27.03162956237793, "global_step": 405276, "epoch": 4882} {"train_loss": -26.397628784179688, "global_step": 405277, "epoch": 4882} {"train_loss": -26.59388542175293, "global_step": 405278, "epoch": 4882} {"train_loss": -26.391204833984375, "global_step": 405279, "epoch": 4882} {"train_loss": -26.849720001220703, "global_step": 405280, "epoch": 4882} {"train_loss": -26.546613693237305, "global_step": 405281, "epoch": 4882} {"train_loss": -27.096668243408203, "global_step": 405282, "epoch": 4882} {"train_loss": -27.091466903686523, "global_step": 405283, "epoch": 4882} {"train_loss": -26.57370376586914, "global_step": 405284, "epoch": 4882} {"train_loss": -27.02644157409668, "global_step": 405285, "epoch": 4882} {"train_loss": -26.55156898498535, "global_step": 405286, "epoch": 4882} {"train_loss": -26.031118392944336, "global_step": 405287, "epoch": 4882} {"train_loss": -26.63611253485622, "global_step": 405288, "epoch": 4882, "val_loss": 6681023.5} {"train_loss": -23.863927841186523, "global_step": 405289, "epoch": 4883} {"train_loss": -25.51154136657715, "global_step": 405290, "epoch": 4883} {"train_loss": -23.35327911376953, "global_step": 405291, "epoch": 4883} {"train_loss": -24.18802261352539, "global_step": 405292, "epoch": 4883} {"train_loss": -25.381607055664062, "global_step": 405293, "epoch": 4883} {"train_loss": -24.648099899291992, "global_step": 405294, "epoch": 4883} {"train_loss": -25.2000789642334, "global_step": 405295, "epoch": 4883} {"train_loss": -25.09990692138672, "global_step": 405296, "epoch": 4883} {"train_loss": -25.247631072998047, "global_step": 405297, "epoch": 4883} {"train_loss": -25.7469482421875, "global_step": 405298, "epoch": 4883} {"train_loss": -24.81492042541504, "global_step": 405299, "epoch": 4883} {"train_loss": -25.762887954711914, "global_step": 405300, "epoch": 4883} {"train_loss": -25.29248809814453, "global_step": 405301, "epoch": 4883} {"train_loss": -25.400304794311523, "global_step": 405302, "epoch": 4883} {"train_loss": -25.473163604736328, "global_step": 405303, "epoch": 4883} {"train_loss": -25.264493942260742, "global_step": 405304, "epoch": 4883} {"train_loss": -25.64505958557129, "global_step": 405305, "epoch": 4883} {"train_loss": -25.71832275390625, "global_step": 405306, "epoch": 4883} {"train_loss": -25.611059188842773, "global_step": 405307, "epoch": 4883} {"train_loss": -25.860946655273438, "global_step": 405308, "epoch": 4883} {"train_loss": -25.880207061767578, "global_step": 405309, "epoch": 4883} {"train_loss": -25.521635055541992, "global_step": 405310, "epoch": 4883} {"train_loss": -25.949188232421875, "global_step": 405311, "epoch": 4883} {"train_loss": -25.454256057739258, "global_step": 405312, "epoch": 4883} {"train_loss": -25.81882095336914, "global_step": 405313, "epoch": 4883} {"train_loss": -25.998371124267578, "global_step": 405314, "epoch": 4883} {"train_loss": -25.860153198242188, "global_step": 405315, "epoch": 4883} {"train_loss": -26.251117706298828, "global_step": 405316, "epoch": 4883} {"train_loss": -25.911405563354492, "global_step": 405317, "epoch": 4883} {"train_loss": -26.4140682220459, "global_step": 405318, "epoch": 4883} {"train_loss": -26.201257705688477, "global_step": 405319, "epoch": 4883} {"train_loss": -26.164600372314453, "global_step": 405320, "epoch": 4883} {"train_loss": -26.562347412109375, "global_step": 405321, "epoch": 4883} {"train_loss": -26.22663688659668, "global_step": 405322, "epoch": 4883} {"train_loss": -26.40423011779785, "global_step": 405323, "epoch": 4883} {"train_loss": -26.419233322143555, "global_step": 405324, "epoch": 4883} {"train_loss": -26.54475975036621, "global_step": 405325, "epoch": 4883} {"train_loss": -26.437528610229492, "global_step": 405326, "epoch": 4883} {"train_loss": -26.262121200561523, "global_step": 405327, "epoch": 4883} {"train_loss": -26.637388229370117, "global_step": 405328, "epoch": 4883} {"train_loss": -26.557714462280273, "global_step": 405329, "epoch": 4883} {"train_loss": -26.661619186401367, "global_step": 405330, "epoch": 4883} {"train_loss": -26.271581649780273, "global_step": 405331, "epoch": 4883} {"train_loss": -26.976104736328125, "global_step": 405332, "epoch": 4883} {"train_loss": -26.617633819580078, "global_step": 405333, "epoch": 4883} {"train_loss": -26.525999069213867, "global_step": 405334, "epoch": 4883} {"train_loss": -27.04144287109375, "global_step": 405335, "epoch": 4883} {"train_loss": -26.70464515686035, "global_step": 405336, "epoch": 4883} {"train_loss": -26.694955825805664, "global_step": 405337, "epoch": 4883} {"train_loss": -26.4697322845459, "global_step": 405338, "epoch": 4883} {"train_loss": -27.063079833984375, "global_step": 405339, "epoch": 4883} {"train_loss": -26.736316680908203, "global_step": 405340, "epoch": 4883} {"train_loss": -26.743255615234375, "global_step": 405341, "epoch": 4883} {"train_loss": -26.835302352905273, "global_step": 405342, "epoch": 4883} {"train_loss": -26.984827041625977, "global_step": 405343, "epoch": 4883} {"train_loss": -27.00628662109375, "global_step": 405344, "epoch": 4883} {"train_loss": -26.940662384033203, "global_step": 405345, "epoch": 4883} {"train_loss": -27.048715591430664, "global_step": 405346, "epoch": 4883} {"train_loss": -26.752195358276367, "global_step": 405347, "epoch": 4883} {"train_loss": -26.614294052124023, "global_step": 405348, "epoch": 4883} {"train_loss": -26.890533447265625, "global_step": 405349, "epoch": 4883} {"train_loss": -26.444122314453125, "global_step": 405350, "epoch": 4883} {"train_loss": -26.41840171813965, "global_step": 405351, "epoch": 4883} {"train_loss": -25.791706085205078, "global_step": 405352, "epoch": 4883} {"train_loss": -25.249069213867188, "global_step": 405353, "epoch": 4883} {"train_loss": -25.32985496520996, "global_step": 405354, "epoch": 4883} {"train_loss": -26.87837028503418, "global_step": 405355, "epoch": 4883} {"train_loss": -26.28375816345215, "global_step": 405356, "epoch": 4883} {"train_loss": -25.7535457611084, "global_step": 405357, "epoch": 4883} {"train_loss": -26.68886375427246, "global_step": 405358, "epoch": 4883} {"train_loss": -26.444448471069336, "global_step": 405359, "epoch": 4883} {"train_loss": -26.252660751342773, "global_step": 405360, "epoch": 4883} {"train_loss": -26.272886276245117, "global_step": 405361, "epoch": 4883} {"train_loss": -26.785154342651367, "global_step": 405362, "epoch": 4883} {"train_loss": -26.132862091064453, "global_step": 405363, "epoch": 4883} {"train_loss": -26.47909927368164, "global_step": 405364, "epoch": 4883} {"train_loss": -26.271081924438477, "global_step": 405365, "epoch": 4883} {"train_loss": -26.647790908813477, "global_step": 405366, "epoch": 4883} {"train_loss": -26.428876876831055, "global_step": 405367, "epoch": 4883} {"train_loss": -26.431354522705078, "global_step": 405368, "epoch": 4883} {"train_loss": -26.4835262298584, "global_step": 405369, "epoch": 4883} {"train_loss": -26.601911544799805, "global_step": 405370, "epoch": 4883} {"train_loss": -26.12834845393537, "global_step": 405371, "epoch": 4883, "val_loss": 6688986.5} {"train_loss": -25.645923614501953, "global_step": 405372, "epoch": 4884} {"train_loss": -26.06955909729004, "global_step": 405373, "epoch": 4884} {"train_loss": -25.581531524658203, "global_step": 405374, "epoch": 4884} {"train_loss": -25.706439971923828, "global_step": 405375, "epoch": 4884} {"train_loss": -26.011953353881836, "global_step": 405376, "epoch": 4884} {"train_loss": -26.094146728515625, "global_step": 405377, "epoch": 4884} {"train_loss": -26.472824096679688, "global_step": 405378, "epoch": 4884} {"train_loss": -26.53177833557129, "global_step": 405379, "epoch": 4884} {"train_loss": -26.68897819519043, "global_step": 405380, "epoch": 4884} {"train_loss": -26.58632469177246, "global_step": 405381, "epoch": 4884} {"train_loss": -26.544269561767578, "global_step": 405382, "epoch": 4884} {"train_loss": -26.4186954498291, "global_step": 405383, "epoch": 4884} {"train_loss": -26.392810821533203, "global_step": 405384, "epoch": 4884} {"train_loss": -26.584177017211914, "global_step": 405385, "epoch": 4884} {"train_loss": -26.849899291992188, "global_step": 405386, "epoch": 4884} {"train_loss": -26.623703002929688, "global_step": 405387, "epoch": 4884} {"train_loss": -26.539871215820312, "global_step": 405388, "epoch": 4884} {"train_loss": -26.29962730407715, "global_step": 405389, "epoch": 4884} {"train_loss": -26.71445083618164, "global_step": 405390, "epoch": 4884} {"train_loss": -26.373449325561523, "global_step": 405391, "epoch": 4884} {"train_loss": -27.047576904296875, "global_step": 405392, "epoch": 4884} {"train_loss": -26.589431762695312, "global_step": 405393, "epoch": 4884} {"train_loss": -26.87922477722168, "global_step": 405394, "epoch": 4884} {"train_loss": -27.057266235351562, "global_step": 405395, "epoch": 4884} {"train_loss": -26.895822525024414, "global_step": 405396, "epoch": 4884} {"train_loss": -26.67034912109375, "global_step": 405397, "epoch": 4884} {"train_loss": -26.51778221130371, "global_step": 405398, "epoch": 4884} {"train_loss": -26.7899169921875, "global_step": 405399, "epoch": 4884} {"train_loss": -26.57053565979004, "global_step": 405400, "epoch": 4884} {"train_loss": -26.79595947265625, "global_step": 405401, "epoch": 4884} {"train_loss": -26.407135009765625, "global_step": 405402, "epoch": 4884} {"train_loss": -26.419754028320312, "global_step": 405403, "epoch": 4884} {"train_loss": -26.609975814819336, "global_step": 405404, "epoch": 4884} {"train_loss": -26.432844161987305, "global_step": 405405, "epoch": 4884} {"train_loss": -26.85854148864746, "global_step": 405406, "epoch": 4884} {"train_loss": -26.976947784423828, "global_step": 405407, "epoch": 4884} {"train_loss": -26.8757381439209, "global_step": 405408, "epoch": 4884} {"train_loss": -26.525876998901367, "global_step": 405409, "epoch": 4884} {"train_loss": -26.888952255249023, "global_step": 405410, "epoch": 4884} {"train_loss": -27.088001251220703, "global_step": 405411, "epoch": 4884} {"train_loss": -26.7332763671875, "global_step": 405412, "epoch": 4884} {"train_loss": -27.163410186767578, "global_step": 405413, "epoch": 4884} {"train_loss": -26.6905574798584, "global_step": 405414, "epoch": 4884} {"train_loss": -27.01185417175293, "global_step": 405415, "epoch": 4884} {"train_loss": -26.609954833984375, "global_step": 405416, "epoch": 4884} {"train_loss": -26.555591583251953, "global_step": 405417, "epoch": 4884} {"train_loss": -26.40470314025879, "global_step": 405418, "epoch": 4884} {"train_loss": -26.069217681884766, "global_step": 405419, "epoch": 4884} {"train_loss": -25.677066802978516, "global_step": 405420, "epoch": 4884} {"train_loss": -25.69070816040039, "global_step": 405421, "epoch": 4884} {"train_loss": -26.578454971313477, "global_step": 405422, "epoch": 4884} {"train_loss": -26.997507095336914, "global_step": 405423, "epoch": 4884} {"train_loss": -26.26752281188965, "global_step": 405424, "epoch": 4884} {"train_loss": -26.534454345703125, "global_step": 405425, "epoch": 4884} {"train_loss": -26.7619571685791, "global_step": 405426, "epoch": 4884} {"train_loss": -26.943603515625, "global_step": 405427, "epoch": 4884} {"train_loss": -26.777692794799805, "global_step": 405428, "epoch": 4884} {"train_loss": -26.723407745361328, "global_step": 405429, "epoch": 4884} {"train_loss": -26.14105796813965, "global_step": 405430, "epoch": 4884} {"train_loss": -26.559324264526367, "global_step": 405431, "epoch": 4884} {"train_loss": -26.529388427734375, "global_step": 405432, "epoch": 4884} {"train_loss": -26.741193771362305, "global_step": 405433, "epoch": 4884} {"train_loss": -26.84902000427246, "global_step": 405434, "epoch": 4884} {"train_loss": -26.746850967407227, "global_step": 405435, "epoch": 4884} {"train_loss": -26.772674560546875, "global_step": 405436, "epoch": 4884} {"train_loss": -26.682294845581055, "global_step": 405437, "epoch": 4884} {"train_loss": -26.884008407592773, "global_step": 405438, "epoch": 4884} {"train_loss": -26.79559326171875, "global_step": 405439, "epoch": 4884} {"train_loss": -26.729047775268555, "global_step": 405440, "epoch": 4884} {"train_loss": -26.734088897705078, "global_step": 405441, "epoch": 4884} {"train_loss": -26.97901725769043, "global_step": 405442, "epoch": 4884} {"train_loss": -26.686559677124023, "global_step": 405443, "epoch": 4884} {"train_loss": -26.81805992126465, "global_step": 405444, "epoch": 4884} {"train_loss": -27.135229110717773, "global_step": 405445, "epoch": 4884} {"train_loss": -26.963109970092773, "global_step": 405446, "epoch": 4884} {"train_loss": -26.489099502563477, "global_step": 405447, "epoch": 4884} {"train_loss": -26.778833389282227, "global_step": 405448, "epoch": 4884} {"train_loss": -26.798437118530273, "global_step": 405449, "epoch": 4884} {"train_loss": -26.7131290435791, "global_step": 405450, "epoch": 4884} {"train_loss": -26.581756591796875, "global_step": 405451, "epoch": 4884} {"train_loss": -26.74490737915039, "global_step": 405452, "epoch": 4884} {"train_loss": -27.146087646484375, "global_step": 405453, "epoch": 4884} {"train_loss": -26.58996965798987, "global_step": 405454, "epoch": 4884, "val_loss": 6729238.5} {"train_loss": -26.331344604492188, "global_step": 405455, "epoch": 4885} {"train_loss": -25.664636611938477, "global_step": 405456, "epoch": 4885} {"train_loss": -26.960254669189453, "global_step": 405457, "epoch": 4885} {"train_loss": -26.422266006469727, "global_step": 405458, "epoch": 4885} {"train_loss": -25.978973388671875, "global_step": 405459, "epoch": 4885} {"train_loss": -26.5915470123291, "global_step": 405460, "epoch": 4885} {"train_loss": -25.7054500579834, "global_step": 405461, "epoch": 4885} {"train_loss": -26.231531143188477, "global_step": 405462, "epoch": 4885} {"train_loss": -26.07661247253418, "global_step": 405463, "epoch": 4885} {"train_loss": -25.955902099609375, "global_step": 405464, "epoch": 4885} {"train_loss": -26.235431671142578, "global_step": 405465, "epoch": 4885} {"train_loss": -26.302900314331055, "global_step": 405466, "epoch": 4885} {"train_loss": -26.47962760925293, "global_step": 405467, "epoch": 4885} {"train_loss": -26.354963302612305, "global_step": 405468, "epoch": 4885} {"train_loss": -26.542530059814453, "global_step": 405469, "epoch": 4885} {"train_loss": -26.817306518554688, "global_step": 405470, "epoch": 4885} {"train_loss": -26.230268478393555, "global_step": 405471, "epoch": 4885} {"train_loss": -26.87603187561035, "global_step": 405472, "epoch": 4885} {"train_loss": -26.936384201049805, "global_step": 405473, "epoch": 4885} {"train_loss": -26.444631576538086, "global_step": 405474, "epoch": 4885} {"train_loss": -26.556991577148438, "global_step": 405475, "epoch": 4885} {"train_loss": -26.7611141204834, "global_step": 405476, "epoch": 4885} {"train_loss": -26.41107177734375, "global_step": 405477, "epoch": 4885} {"train_loss": -26.789655685424805, "global_step": 405478, "epoch": 4885} {"train_loss": -26.80645751953125, "global_step": 405479, "epoch": 4885} {"train_loss": -26.4239501953125, "global_step": 405480, "epoch": 4885} {"train_loss": -26.829700469970703, "global_step": 405481, "epoch": 4885} {"train_loss": -26.46352195739746, "global_step": 405482, "epoch": 4885} {"train_loss": -26.758636474609375, "global_step": 405483, "epoch": 4885} {"train_loss": -26.639633178710938, "global_step": 405484, "epoch": 4885} {"train_loss": -26.777435302734375, "global_step": 405485, "epoch": 4885} {"train_loss": -26.799474716186523, "global_step": 405486, "epoch": 4885} {"train_loss": -26.696802139282227, "global_step": 405487, "epoch": 4885} {"train_loss": -26.635568618774414, "global_step": 405488, "epoch": 4885} {"train_loss": -26.702716827392578, "global_step": 405489, "epoch": 4885} {"train_loss": -26.656021118164062, "global_step": 405490, "epoch": 4885} {"train_loss": -26.56170654296875, "global_step": 405491, "epoch": 4885} {"train_loss": -27.012924194335938, "global_step": 405492, "epoch": 4885} {"train_loss": -26.583999633789062, "global_step": 405493, "epoch": 4885} {"train_loss": -27.050251007080078, "global_step": 405494, "epoch": 4885} {"train_loss": -26.430021286010742, "global_step": 405495, "epoch": 4885} {"train_loss": -26.6778621673584, "global_step": 405496, "epoch": 4885} {"train_loss": -26.566946029663086, "global_step": 405497, "epoch": 4885} {"train_loss": -26.793262481689453, "global_step": 405498, "epoch": 4885} {"train_loss": -27.047367095947266, "global_step": 405499, "epoch": 4885} {"train_loss": -26.44961929321289, "global_step": 405500, "epoch": 4885} {"train_loss": -26.527124404907227, "global_step": 405501, "epoch": 4885} {"train_loss": -26.448232650756836, "global_step": 405502, "epoch": 4885} {"train_loss": -26.5750675201416, "global_step": 405503, "epoch": 4885} {"train_loss": -26.207462310791016, "global_step": 405504, "epoch": 4885} {"train_loss": -26.41251564025879, "global_step": 405505, "epoch": 4885} {"train_loss": -25.991662979125977, "global_step": 405506, "epoch": 4885} {"train_loss": -25.80344009399414, "global_step": 405507, "epoch": 4885} {"train_loss": -25.758874893188477, "global_step": 405508, "epoch": 4885} {"train_loss": -26.55145263671875, "global_step": 405509, "epoch": 4885} {"train_loss": -26.435876846313477, "global_step": 405510, "epoch": 4885} {"train_loss": -26.25640296936035, "global_step": 405511, "epoch": 4885} {"train_loss": -26.2606143951416, "global_step": 405512, "epoch": 4885} {"train_loss": -26.3136043548584, "global_step": 405513, "epoch": 4885} {"train_loss": -26.45778465270996, "global_step": 405514, "epoch": 4885} {"train_loss": -26.314817428588867, "global_step": 405515, "epoch": 4885} {"train_loss": -26.254638671875, "global_step": 405516, "epoch": 4885} {"train_loss": -26.675817489624023, "global_step": 405517, "epoch": 4885} {"train_loss": -26.239765167236328, "global_step": 405518, "epoch": 4885} {"train_loss": -26.241941452026367, "global_step": 405519, "epoch": 4885} {"train_loss": -26.52596092224121, "global_step": 405520, "epoch": 4885} {"train_loss": -26.627307891845703, "global_step": 405521, "epoch": 4885} {"train_loss": -26.543787002563477, "global_step": 405522, "epoch": 4885} {"train_loss": -26.850439071655273, "global_step": 405523, "epoch": 4885} {"train_loss": -26.361066818237305, "global_step": 405524, "epoch": 4885} {"train_loss": -26.378644943237305, "global_step": 405525, "epoch": 4885} {"train_loss": -26.548053741455078, "global_step": 405526, "epoch": 4885} {"train_loss": -26.474607467651367, "global_step": 405527, "epoch": 4885} {"train_loss": -26.69317626953125, "global_step": 405528, "epoch": 4885} {"train_loss": -26.5637264251709, "global_step": 405529, "epoch": 4885} {"train_loss": -26.630390167236328, "global_step": 405530, "epoch": 4885} {"train_loss": -26.84967041015625, "global_step": 405531, "epoch": 4885} {"train_loss": -26.890928268432617, "global_step": 405532, "epoch": 4885} {"train_loss": -26.848920822143555, "global_step": 405533, "epoch": 4885} {"train_loss": -26.9489688873291, "global_step": 405534, "epoch": 4885} {"train_loss": -27.035430908203125, "global_step": 405535, "epoch": 4885} {"train_loss": -26.85991859436035, "global_step": 405536, "epoch": 4885} {"train_loss": -26.527794573680463, "global_step": 405537, "epoch": 4885, "val_loss": 6650690.0} {"train_loss": -26.737695693969727, "global_step": 405538, "epoch": 4886} {"train_loss": -26.853424072265625, "global_step": 405539, "epoch": 4886} {"train_loss": -26.6112003326416, "global_step": 405540, "epoch": 4886} {"train_loss": -26.48414421081543, "global_step": 405541, "epoch": 4886} {"train_loss": -26.715314865112305, "global_step": 405542, "epoch": 4886} {"train_loss": -26.4569149017334, "global_step": 405543, "epoch": 4886} {"train_loss": -26.693286895751953, "global_step": 405544, "epoch": 4886} {"train_loss": -26.7751407623291, "global_step": 405545, "epoch": 4886} {"train_loss": -26.32501792907715, "global_step": 405546, "epoch": 4886} {"train_loss": -26.426055908203125, "global_step": 405547, "epoch": 4886} {"train_loss": -26.485492706298828, "global_step": 405548, "epoch": 4886} {"train_loss": -26.589170455932617, "global_step": 405549, "epoch": 4886} {"train_loss": -26.308425903320312, "global_step": 405550, "epoch": 4886} {"train_loss": -26.863611221313477, "global_step": 405551, "epoch": 4886} {"train_loss": -26.908370971679688, "global_step": 405552, "epoch": 4886} {"train_loss": -26.953821182250977, "global_step": 405553, "epoch": 4886} {"train_loss": -26.477680206298828, "global_step": 405554, "epoch": 4886} {"train_loss": -26.61317253112793, "global_step": 405555, "epoch": 4886} {"train_loss": -26.70088005065918, "global_step": 405556, "epoch": 4886} {"train_loss": -26.387435913085938, "global_step": 405557, "epoch": 4886} {"train_loss": -26.691232681274414, "global_step": 405558, "epoch": 4886} {"train_loss": -26.625080108642578, "global_step": 405559, "epoch": 4886} {"train_loss": -27.040735244750977, "global_step": 405560, "epoch": 4886} {"train_loss": -26.714862823486328, "global_step": 405561, "epoch": 4886} {"train_loss": -26.762964248657227, "global_step": 405562, "epoch": 4886} {"train_loss": -26.294647216796875, "global_step": 405563, "epoch": 4886} {"train_loss": -26.7854061126709, "global_step": 405564, "epoch": 4886} {"train_loss": -26.611103057861328, "global_step": 405565, "epoch": 4886} {"train_loss": -26.782800674438477, "global_step": 405566, "epoch": 4886} {"train_loss": -26.902082443237305, "global_step": 405567, "epoch": 4886} {"train_loss": -26.714874267578125, "global_step": 405568, "epoch": 4886} {"train_loss": -26.77797508239746, "global_step": 405569, "epoch": 4886} {"train_loss": -26.552200317382812, "global_step": 405570, "epoch": 4886} {"train_loss": -26.679325103759766, "global_step": 405571, "epoch": 4886} {"train_loss": -26.772958755493164, "global_step": 405572, "epoch": 4886} {"train_loss": -26.801136016845703, "global_step": 405573, "epoch": 4886} {"train_loss": -26.60767936706543, "global_step": 405574, "epoch": 4886} {"train_loss": -26.98236656188965, "global_step": 405575, "epoch": 4886} {"train_loss": -26.566267013549805, "global_step": 405576, "epoch": 4886} {"train_loss": -26.80120849609375, "global_step": 405577, "epoch": 4886} {"train_loss": -26.285608291625977, "global_step": 405578, "epoch": 4886} {"train_loss": -26.714340209960938, "global_step": 405579, "epoch": 4886} {"train_loss": -26.85164451599121, "global_step": 405580, "epoch": 4886} {"train_loss": -27.04670524597168, "global_step": 405581, "epoch": 4886} {"train_loss": -26.886457443237305, "global_step": 405582, "epoch": 4886} {"train_loss": -26.96078872680664, "global_step": 405583, "epoch": 4886} {"train_loss": -27.020750045776367, "global_step": 405584, "epoch": 4886} {"train_loss": -26.6739501953125, "global_step": 405585, "epoch": 4886} {"train_loss": -26.656339645385742, "global_step": 405586, "epoch": 4886} {"train_loss": -26.673139572143555, "global_step": 405587, "epoch": 4886} {"train_loss": -26.90693473815918, "global_step": 405588, "epoch": 4886} {"train_loss": -26.96671485900879, "global_step": 405589, "epoch": 4886} {"train_loss": -26.615589141845703, "global_step": 405590, "epoch": 4886} {"train_loss": -27.334640502929688, "global_step": 405591, "epoch": 4886} {"train_loss": -26.597015380859375, "global_step": 405592, "epoch": 4886} {"train_loss": -26.601770401000977, "global_step": 405593, "epoch": 4886} {"train_loss": -26.84547233581543, "global_step": 405594, "epoch": 4886} {"train_loss": -26.735309600830078, "global_step": 405595, "epoch": 4886} {"train_loss": -27.272979736328125, "global_step": 405596, "epoch": 4886} {"train_loss": -26.8116512298584, "global_step": 405597, "epoch": 4886} {"train_loss": -26.705793380737305, "global_step": 405598, "epoch": 4886} {"train_loss": -26.64676284790039, "global_step": 405599, "epoch": 4886} {"train_loss": -26.5753116607666, "global_step": 405600, "epoch": 4886} {"train_loss": -26.53704833984375, "global_step": 405601, "epoch": 4886} {"train_loss": -27.27446937561035, "global_step": 405602, "epoch": 4886} {"train_loss": -27.120655059814453, "global_step": 405603, "epoch": 4886} {"train_loss": -26.904682159423828, "global_step": 405604, "epoch": 4886} {"train_loss": -26.764862060546875, "global_step": 405605, "epoch": 4886} {"train_loss": -26.90069580078125, "global_step": 405606, "epoch": 4886} {"train_loss": -26.51259422302246, "global_step": 405607, "epoch": 4886} {"train_loss": -26.667402267456055, "global_step": 405608, "epoch": 4886} {"train_loss": -26.462461471557617, "global_step": 405609, "epoch": 4886} {"train_loss": -26.724750518798828, "global_step": 405610, "epoch": 4886} {"train_loss": -26.928632736206055, "global_step": 405611, "epoch": 4886} {"train_loss": -26.984939575195312, "global_step": 405612, "epoch": 4886} {"train_loss": -26.917234420776367, "global_step": 405613, "epoch": 4886} {"train_loss": -26.698835372924805, "global_step": 405614, "epoch": 4886} {"train_loss": -27.027481079101562, "global_step": 405615, "epoch": 4886} {"train_loss": -26.373401641845703, "global_step": 405616, "epoch": 4886} {"train_loss": -26.352705001831055, "global_step": 405617, "epoch": 4886} {"train_loss": -26.13941764831543, "global_step": 405618, "epoch": 4886} {"train_loss": -25.74152183532715, "global_step": 405619, "epoch": 4886} {"train_loss": -26.675607014851398, "global_step": 405620, "epoch": 4886, "val_loss": 6719954.0} {"train_loss": -20.723535537719727, "global_step": 405621, "epoch": 4887} {"train_loss": -24.74104118347168, "global_step": 405622, "epoch": 4887} {"train_loss": -22.735658645629883, "global_step": 405623, "epoch": 4887} {"train_loss": -24.215734481811523, "global_step": 405624, "epoch": 4887} {"train_loss": -24.395902633666992, "global_step": 405625, "epoch": 4887} {"train_loss": -23.288015365600586, "global_step": 405626, "epoch": 4887} {"train_loss": -25.03449821472168, "global_step": 405627, "epoch": 4887} {"train_loss": -24.380216598510742, "global_step": 405628, "epoch": 4887} {"train_loss": -24.8460693359375, "global_step": 405629, "epoch": 4887} {"train_loss": -24.60333251953125, "global_step": 405630, "epoch": 4887} {"train_loss": -25.33522605895996, "global_step": 405631, "epoch": 4887} {"train_loss": -24.738494873046875, "global_step": 405632, "epoch": 4887} {"train_loss": -25.277124404907227, "global_step": 405633, "epoch": 4887} {"train_loss": -24.427061080932617, "global_step": 405634, "epoch": 4887} {"train_loss": -25.16091537475586, "global_step": 405635, "epoch": 4887} {"train_loss": -25.051572799682617, "global_step": 405636, "epoch": 4887} {"train_loss": -25.409873962402344, "global_step": 405637, "epoch": 4887} {"train_loss": -25.418819427490234, "global_step": 405638, "epoch": 4887} {"train_loss": -25.528522491455078, "global_step": 405639, "epoch": 4887} {"train_loss": -25.230958938598633, "global_step": 405640, "epoch": 4887} {"train_loss": -25.22371482849121, "global_step": 405641, "epoch": 4887} {"train_loss": -25.11356544494629, "global_step": 405642, "epoch": 4887} {"train_loss": -25.723819732666016, "global_step": 405643, "epoch": 4887} {"train_loss": -25.689611434936523, "global_step": 405644, "epoch": 4887} {"train_loss": -25.652667999267578, "global_step": 405645, "epoch": 4887} {"train_loss": -26.077463150024414, "global_step": 405646, "epoch": 4887} {"train_loss": -25.1220760345459, "global_step": 405647, "epoch": 4887} {"train_loss": -25.77640724182129, "global_step": 405648, "epoch": 4887} {"train_loss": -25.469051361083984, "global_step": 405649, "epoch": 4887} {"train_loss": -25.90998649597168, "global_step": 405650, "epoch": 4887} {"train_loss": -25.422834396362305, "global_step": 405651, "epoch": 4887} {"train_loss": -25.863712310791016, "global_step": 405652, "epoch": 4887} {"train_loss": -25.831424713134766, "global_step": 405653, "epoch": 4887} {"train_loss": -26.007644653320312, "global_step": 405654, "epoch": 4887} {"train_loss": -25.790634155273438, "global_step": 405655, "epoch": 4887} {"train_loss": -26.327219009399414, "global_step": 405656, "epoch": 4887} {"train_loss": -26.231061935424805, "global_step": 405657, "epoch": 4887} {"train_loss": -25.908538818359375, "global_step": 405658, "epoch": 4887} {"train_loss": -26.20181655883789, "global_step": 405659, "epoch": 4887} {"train_loss": -26.156238555908203, "global_step": 405660, "epoch": 4887} {"train_loss": -26.076948165893555, "global_step": 405661, "epoch": 4887} {"train_loss": -26.228713989257812, "global_step": 405662, "epoch": 4887} {"train_loss": -26.46074867248535, "global_step": 405663, "epoch": 4887} {"train_loss": -26.001087188720703, "global_step": 405664, "epoch": 4887} {"train_loss": -26.392822265625, "global_step": 405665, "epoch": 4887} {"train_loss": -26.291351318359375, "global_step": 405666, "epoch": 4887} {"train_loss": -26.44183349609375, "global_step": 405667, "epoch": 4887} {"train_loss": -26.655729293823242, "global_step": 405668, "epoch": 4887} {"train_loss": -26.050098419189453, "global_step": 405669, "epoch": 4887} {"train_loss": -26.370426177978516, "global_step": 405670, "epoch": 4887} {"train_loss": -26.554092407226562, "global_step": 405671, "epoch": 4887} {"train_loss": -26.15497398376465, "global_step": 405672, "epoch": 4887} {"train_loss": -26.355854034423828, "global_step": 405673, "epoch": 4887} {"train_loss": -26.087574005126953, "global_step": 405674, "epoch": 4887} {"train_loss": -26.68210792541504, "global_step": 405675, "epoch": 4887} {"train_loss": -26.56972312927246, "global_step": 405676, "epoch": 4887} {"train_loss": -26.539413452148438, "global_step": 405677, "epoch": 4887} {"train_loss": -26.626922607421875, "global_step": 405678, "epoch": 4887} {"train_loss": -25.85442543029785, "global_step": 405679, "epoch": 4887} {"train_loss": -26.372894287109375, "global_step": 405680, "epoch": 4887} {"train_loss": -26.6380615234375, "global_step": 405681, "epoch": 4887} {"train_loss": -26.346527099609375, "global_step": 405682, "epoch": 4887} {"train_loss": -25.96484375, "global_step": 405683, "epoch": 4887} {"train_loss": -26.447019577026367, "global_step": 405684, "epoch": 4887} {"train_loss": -25.843420028686523, "global_step": 405685, "epoch": 4887} {"train_loss": -26.57758140563965, "global_step": 405686, "epoch": 4887} {"train_loss": -26.141393661499023, "global_step": 405687, "epoch": 4887} {"train_loss": -25.91706657409668, "global_step": 405688, "epoch": 4887} {"train_loss": -26.116601943969727, "global_step": 405689, "epoch": 4887} {"train_loss": -26.12812614440918, "global_step": 405690, "epoch": 4887} {"train_loss": -26.51702880859375, "global_step": 405691, "epoch": 4887} {"train_loss": -26.261920928955078, "global_step": 405692, "epoch": 4887} {"train_loss": -26.143545150756836, "global_step": 405693, "epoch": 4887} {"train_loss": -26.67353630065918, "global_step": 405694, "epoch": 4887} {"train_loss": -26.2600040435791, "global_step": 405695, "epoch": 4887} {"train_loss": -26.370471954345703, "global_step": 405696, "epoch": 4887} {"train_loss": -26.445404052734375, "global_step": 405697, "epoch": 4887} {"train_loss": -26.440876007080078, "global_step": 405698, "epoch": 4887} {"train_loss": -26.465869903564453, "global_step": 405699, "epoch": 4887} {"train_loss": -26.4401798248291, "global_step": 405700, "epoch": 4887} {"train_loss": -26.389509201049805, "global_step": 405701, "epoch": 4887} {"train_loss": -26.59461784362793, "global_step": 405702, "epoch": 4887} {"train_loss": -25.756183095725184, "global_step": 405703, "epoch": 4887, "val_loss": 6565064.5} {"train_loss": -26.4160099029541, "global_step": 405704, "epoch": 4888} {"train_loss": -25.677953720092773, "global_step": 405705, "epoch": 4888} {"train_loss": -25.968942642211914, "global_step": 405706, "epoch": 4888} {"train_loss": -26.1580753326416, "global_step": 405707, "epoch": 4888} {"train_loss": -26.09638786315918, "global_step": 405708, "epoch": 4888} {"train_loss": -26.314664840698242, "global_step": 405709, "epoch": 4888} {"train_loss": -26.395734786987305, "global_step": 405710, "epoch": 4888} {"train_loss": -26.442768096923828, "global_step": 405711, "epoch": 4888} {"train_loss": -26.1734561920166, "global_step": 405712, "epoch": 4888} {"train_loss": -26.338727951049805, "global_step": 405713, "epoch": 4888} {"train_loss": -26.59235954284668, "global_step": 405714, "epoch": 4888} {"train_loss": -26.79335594177246, "global_step": 405715, "epoch": 4888} {"train_loss": -26.72113037109375, "global_step": 405716, "epoch": 4888} {"train_loss": -26.57496452331543, "global_step": 405717, "epoch": 4888} {"train_loss": -26.470640182495117, "global_step": 405718, "epoch": 4888} {"train_loss": -26.4921932220459, "global_step": 405719, "epoch": 4888} {"train_loss": -26.397855758666992, "global_step": 405720, "epoch": 4888} {"train_loss": -26.638166427612305, "global_step": 405721, "epoch": 4888} {"train_loss": -26.77736473083496, "global_step": 405722, "epoch": 4888} {"train_loss": -26.526350021362305, "global_step": 405723, "epoch": 4888} {"train_loss": -26.946094512939453, "global_step": 405724, "epoch": 4888} {"train_loss": -26.85407829284668, "global_step": 405725, "epoch": 4888} {"train_loss": -26.91900062561035, "global_step": 405726, "epoch": 4888} {"train_loss": -26.489927291870117, "global_step": 405727, "epoch": 4888} {"train_loss": -26.8679141998291, "global_step": 405728, "epoch": 4888} {"train_loss": -26.777225494384766, "global_step": 405729, "epoch": 4888} {"train_loss": -27.01435661315918, "global_step": 405730, "epoch": 4888} {"train_loss": -27.09235954284668, "global_step": 405731, "epoch": 4888} {"train_loss": -27.031503677368164, "global_step": 405732, "epoch": 4888} {"train_loss": -26.764907836914062, "global_step": 405733, "epoch": 4888} {"train_loss": -26.930164337158203, "global_step": 405734, "epoch": 4888} {"train_loss": -26.82209587097168, "global_step": 405735, "epoch": 4888} {"train_loss": -26.9074649810791, "global_step": 405736, "epoch": 4888} {"train_loss": -26.94791030883789, "global_step": 405737, "epoch": 4888} {"train_loss": -26.930255889892578, "global_step": 405738, "epoch": 4888} {"train_loss": -26.87420654296875, "global_step": 405739, "epoch": 4888} {"train_loss": -27.16877555847168, "global_step": 405740, "epoch": 4888} {"train_loss": -26.8533878326416, "global_step": 405741, "epoch": 4888} {"train_loss": -26.83542251586914, "global_step": 405742, "epoch": 4888} {"train_loss": -26.759307861328125, "global_step": 405743, "epoch": 4888} {"train_loss": -27.1760196685791, "global_step": 405744, "epoch": 4888} {"train_loss": -26.683765411376953, "global_step": 405745, "epoch": 4888} {"train_loss": -26.920568466186523, "global_step": 405746, "epoch": 4888} {"train_loss": -26.87747573852539, "global_step": 405747, "epoch": 4888} {"train_loss": -26.3772029876709, "global_step": 405748, "epoch": 4888} {"train_loss": -26.85706901550293, "global_step": 405749, "epoch": 4888} {"train_loss": -26.698444366455078, "global_step": 405750, "epoch": 4888} {"train_loss": -26.63422203063965, "global_step": 405751, "epoch": 4888} {"train_loss": -26.840957641601562, "global_step": 405752, "epoch": 4888} {"train_loss": -26.77735710144043, "global_step": 405753, "epoch": 4888} {"train_loss": -26.904224395751953, "global_step": 405754, "epoch": 4888} {"train_loss": -26.6328182220459, "global_step": 405755, "epoch": 4888} {"train_loss": -26.927997589111328, "global_step": 405756, "epoch": 4888} {"train_loss": -26.555023193359375, "global_step": 405757, "epoch": 4888} {"train_loss": -26.963794708251953, "global_step": 405758, "epoch": 4888} {"train_loss": -26.668493270874023, "global_step": 405759, "epoch": 4888} {"train_loss": -26.306936264038086, "global_step": 405760, "epoch": 4888} {"train_loss": -26.41145133972168, "global_step": 405761, "epoch": 4888} {"train_loss": -26.634443283081055, "global_step": 405762, "epoch": 4888} {"train_loss": -26.56491470336914, "global_step": 405763, "epoch": 4888} {"train_loss": -26.417861938476562, "global_step": 405764, "epoch": 4888} {"train_loss": -26.710783004760742, "global_step": 405765, "epoch": 4888} {"train_loss": -26.68226432800293, "global_step": 405766, "epoch": 4888} {"train_loss": -26.705808639526367, "global_step": 405767, "epoch": 4888} {"train_loss": -26.675275802612305, "global_step": 405768, "epoch": 4888} {"train_loss": -26.910680770874023, "global_step": 405769, "epoch": 4888} {"train_loss": -26.6635799407959, "global_step": 405770, "epoch": 4888} {"train_loss": -26.68790054321289, "global_step": 405771, "epoch": 4888} {"train_loss": -26.715988159179688, "global_step": 405772, "epoch": 4888} {"train_loss": -26.858423233032227, "global_step": 405773, "epoch": 4888} {"train_loss": -26.823217391967773, "global_step": 405774, "epoch": 4888} {"train_loss": -26.55518913269043, "global_step": 405775, "epoch": 4888} {"train_loss": -26.753515243530273, "global_step": 405776, "epoch": 4888} {"train_loss": -26.876306533813477, "global_step": 405777, "epoch": 4888} {"train_loss": -26.965682983398438, "global_step": 405778, "epoch": 4888} {"train_loss": -26.80745506286621, "global_step": 405779, "epoch": 4888} {"train_loss": -27.24875259399414, "global_step": 405780, "epoch": 4888} {"train_loss": -26.7104549407959, "global_step": 405781, "epoch": 4888} {"train_loss": -27.229032516479492, "global_step": 405782, "epoch": 4888} {"train_loss": -26.676244735717773, "global_step": 405783, "epoch": 4888} {"train_loss": -26.946619033813477, "global_step": 405784, "epoch": 4888} {"train_loss": -26.754674911499023, "global_step": 405785, "epoch": 4888} {"train_loss": -26.705547861306066, "global_step": 405786, "epoch": 4888, "val_loss": 6711899.0} {"train_loss": -26.976423263549805, "global_step": 405787, "epoch": 4889} {"train_loss": -26.527685165405273, "global_step": 405788, "epoch": 4889} {"train_loss": -27.18281364440918, "global_step": 405789, "epoch": 4889} {"train_loss": -26.866132736206055, "global_step": 405790, "epoch": 4889} {"train_loss": -26.75408935546875, "global_step": 405791, "epoch": 4889} {"train_loss": -26.8317813873291, "global_step": 405792, "epoch": 4889} {"train_loss": -26.51618766784668, "global_step": 405793, "epoch": 4889} {"train_loss": -26.485021591186523, "global_step": 405794, "epoch": 4889} {"train_loss": -26.588342666625977, "global_step": 405795, "epoch": 4889} {"train_loss": -26.659635543823242, "global_step": 405796, "epoch": 4889} {"train_loss": -26.27117919921875, "global_step": 405797, "epoch": 4889} {"train_loss": -27.034093856811523, "global_step": 405798, "epoch": 4889} {"train_loss": -26.31494140625, "global_step": 405799, "epoch": 4889} {"train_loss": -26.252643585205078, "global_step": 405800, "epoch": 4889} {"train_loss": -26.257970809936523, "global_step": 405801, "epoch": 4889} {"train_loss": -26.681726455688477, "global_step": 405802, "epoch": 4889} {"train_loss": -26.697986602783203, "global_step": 405803, "epoch": 4889} {"train_loss": -26.48710060119629, "global_step": 405804, "epoch": 4889} {"train_loss": -26.789159774780273, "global_step": 405805, "epoch": 4889} {"train_loss": -26.258848190307617, "global_step": 405806, "epoch": 4889} {"train_loss": -26.757720947265625, "global_step": 405807, "epoch": 4889} {"train_loss": -26.387042999267578, "global_step": 405808, "epoch": 4889} {"train_loss": -26.574569702148438, "global_step": 405809, "epoch": 4889} {"train_loss": -26.633899688720703, "global_step": 405810, "epoch": 4889} {"train_loss": -26.90699577331543, "global_step": 405811, "epoch": 4889} {"train_loss": -26.53830337524414, "global_step": 405812, "epoch": 4889} {"train_loss": -26.447681427001953, "global_step": 405813, "epoch": 4889} {"train_loss": -26.5841121673584, "global_step": 405814, "epoch": 4889} {"train_loss": -26.513357162475586, "global_step": 405815, "epoch": 4889} {"train_loss": -26.524667739868164, "global_step": 405816, "epoch": 4889} {"train_loss": -26.576038360595703, "global_step": 405817, "epoch": 4889} {"train_loss": -26.967681884765625, "global_step": 405818, "epoch": 4889} {"train_loss": -26.384729385375977, "global_step": 405819, "epoch": 4889} {"train_loss": -26.860937118530273, "global_step": 405820, "epoch": 4889} {"train_loss": -26.630502700805664, "global_step": 405821, "epoch": 4889} {"train_loss": -26.55372428894043, "global_step": 405822, "epoch": 4889} {"train_loss": -26.457916259765625, "global_step": 405823, "epoch": 4889} {"train_loss": -26.783843994140625, "global_step": 405824, "epoch": 4889} {"train_loss": -26.503347396850586, "global_step": 405825, "epoch": 4889} {"train_loss": -26.618865966796875, "global_step": 405826, "epoch": 4889} {"train_loss": -26.823261260986328, "global_step": 405827, "epoch": 4889} {"train_loss": -26.558074951171875, "global_step": 405828, "epoch": 4889} {"train_loss": -26.6402587890625, "global_step": 405829, "epoch": 4889} {"train_loss": -26.50345802307129, "global_step": 405830, "epoch": 4889} {"train_loss": -26.38680076599121, "global_step": 405831, "epoch": 4889} {"train_loss": -26.73318862915039, "global_step": 405832, "epoch": 4889} {"train_loss": -26.75758171081543, "global_step": 405833, "epoch": 4889} {"train_loss": -26.592121124267578, "global_step": 405834, "epoch": 4889} {"train_loss": -26.219146728515625, "global_step": 405835, "epoch": 4889} {"train_loss": -26.637760162353516, "global_step": 405836, "epoch": 4889} {"train_loss": -26.325178146362305, "global_step": 405837, "epoch": 4889} {"train_loss": -26.6532039642334, "global_step": 405838, "epoch": 4889} {"train_loss": -26.304956436157227, "global_step": 405839, "epoch": 4889} {"train_loss": -26.246383666992188, "global_step": 405840, "epoch": 4889} {"train_loss": -26.437946319580078, "global_step": 405841, "epoch": 4889} {"train_loss": -26.51535415649414, "global_step": 405842, "epoch": 4889} {"train_loss": -26.612409591674805, "global_step": 405843, "epoch": 4889} {"train_loss": -25.9327392578125, "global_step": 405844, "epoch": 4889} {"train_loss": -26.336450576782227, "global_step": 405845, "epoch": 4889} {"train_loss": -26.898298263549805, "global_step": 405846, "epoch": 4889} {"train_loss": -26.592599868774414, "global_step": 405847, "epoch": 4889} {"train_loss": -26.362823486328125, "global_step": 405848, "epoch": 4889} {"train_loss": -26.595306396484375, "global_step": 405849, "epoch": 4889} {"train_loss": -27.002660751342773, "global_step": 405850, "epoch": 4889} {"train_loss": -26.720539093017578, "global_step": 405851, "epoch": 4889} {"train_loss": -26.38264274597168, "global_step": 405852, "epoch": 4889} {"train_loss": -26.563079833984375, "global_step": 405853, "epoch": 4889} {"train_loss": -26.79984474182129, "global_step": 405854, "epoch": 4889} {"train_loss": -26.722455978393555, "global_step": 405855, "epoch": 4889} {"train_loss": -26.88568115234375, "global_step": 405856, "epoch": 4889} {"train_loss": -26.82293128967285, "global_step": 405857, "epoch": 4889} {"train_loss": -26.4864444732666, "global_step": 405858, "epoch": 4889} {"train_loss": -26.43805503845215, "global_step": 405859, "epoch": 4889} {"train_loss": -26.739423751831055, "global_step": 405860, "epoch": 4889} {"train_loss": -26.475500106811523, "global_step": 405861, "epoch": 4889} {"train_loss": -26.93438148498535, "global_step": 405862, "epoch": 4889} {"train_loss": -26.57533073425293, "global_step": 405863, "epoch": 4889} {"train_loss": -26.18074607849121, "global_step": 405864, "epoch": 4889} {"train_loss": -26.4694766998291, "global_step": 405865, "epoch": 4889} {"train_loss": -26.427978515625, "global_step": 405866, "epoch": 4889} {"train_loss": -26.993009567260742, "global_step": 405867, "epoch": 4889} {"train_loss": -26.55419921875, "global_step": 405868, "epoch": 4889} {"train_loss": -26.58841289382383, "global_step": 405869, "epoch": 4889, "val_loss": 6629875.5} {"train_loss": -26.084716796875, "global_step": 405870, "epoch": 4890} {"train_loss": -25.92078971862793, "global_step": 405871, "epoch": 4890} {"train_loss": -25.446487426757812, "global_step": 405872, "epoch": 4890} {"train_loss": -26.041486740112305, "global_step": 405873, "epoch": 4890} {"train_loss": -26.559207916259766, "global_step": 405874, "epoch": 4890} {"train_loss": -26.259275436401367, "global_step": 405875, "epoch": 4890} {"train_loss": -26.280393600463867, "global_step": 405876, "epoch": 4890} {"train_loss": -26.450376510620117, "global_step": 405877, "epoch": 4890} {"train_loss": -26.013427734375, "global_step": 405878, "epoch": 4890} {"train_loss": -26.055450439453125, "global_step": 405879, "epoch": 4890} {"train_loss": -26.321218490600586, "global_step": 405880, "epoch": 4890} {"train_loss": -26.10633659362793, "global_step": 405881, "epoch": 4890} {"train_loss": -25.894622802734375, "global_step": 405882, "epoch": 4890} {"train_loss": -26.349756240844727, "global_step": 405883, "epoch": 4890} {"train_loss": -26.302526473999023, "global_step": 405884, "epoch": 4890} {"train_loss": -26.375280380249023, "global_step": 405885, "epoch": 4890} {"train_loss": -25.998981475830078, "global_step": 405886, "epoch": 4890} {"train_loss": -26.64027214050293, "global_step": 405887, "epoch": 4890} {"train_loss": -26.382104873657227, "global_step": 405888, "epoch": 4890} {"train_loss": -26.45033073425293, "global_step": 405889, "epoch": 4890} {"train_loss": -26.443750381469727, "global_step": 405890, "epoch": 4890} {"train_loss": -26.575244903564453, "global_step": 405891, "epoch": 4890} {"train_loss": -26.684818267822266, "global_step": 405892, "epoch": 4890} {"train_loss": -26.861602783203125, "global_step": 405893, "epoch": 4890} {"train_loss": -26.680204391479492, "global_step": 405894, "epoch": 4890} {"train_loss": -26.325183868408203, "global_step": 405895, "epoch": 4890} {"train_loss": -26.496667861938477, "global_step": 405896, "epoch": 4890} {"train_loss": -26.5647029876709, "global_step": 405897, "epoch": 4890} {"train_loss": -26.472837448120117, "global_step": 405898, "epoch": 4890} {"train_loss": -26.71839714050293, "global_step": 405899, "epoch": 4890} {"train_loss": -26.72120475769043, "global_step": 405900, "epoch": 4890} {"train_loss": -26.55903434753418, "global_step": 405901, "epoch": 4890} {"train_loss": -26.386295318603516, "global_step": 405902, "epoch": 4890} {"train_loss": -26.439743041992188, "global_step": 405903, "epoch": 4890} {"train_loss": -26.115772247314453, "global_step": 405904, "epoch": 4890} {"train_loss": -26.874526977539062, "global_step": 405905, "epoch": 4890} {"train_loss": -26.334089279174805, "global_step": 405906, "epoch": 4890} {"train_loss": -26.6131534576416, "global_step": 405907, "epoch": 4890} {"train_loss": -26.579309463500977, "global_step": 405908, "epoch": 4890} {"train_loss": -26.77593994140625, "global_step": 405909, "epoch": 4890} {"train_loss": -26.597021102905273, "global_step": 405910, "epoch": 4890} {"train_loss": -26.530292510986328, "global_step": 405911, "epoch": 4890} {"train_loss": -26.069580078125, "global_step": 405912, "epoch": 4890} {"train_loss": -26.068552017211914, "global_step": 405913, "epoch": 4890} {"train_loss": -26.32160758972168, "global_step": 405914, "epoch": 4890} {"train_loss": -26.61333656311035, "global_step": 405915, "epoch": 4890} {"train_loss": -26.366804122924805, "global_step": 405916, "epoch": 4890} {"train_loss": -26.6158447265625, "global_step": 405917, "epoch": 4890} {"train_loss": -26.870166778564453, "global_step": 405918, "epoch": 4890} {"train_loss": -26.515167236328125, "global_step": 405919, "epoch": 4890} {"train_loss": -26.525135040283203, "global_step": 405920, "epoch": 4890} {"train_loss": -26.8636474609375, "global_step": 405921, "epoch": 4890} {"train_loss": -26.699689865112305, "global_step": 405922, "epoch": 4890} {"train_loss": -26.499719619750977, "global_step": 405923, "epoch": 4890} {"train_loss": -27.087305068969727, "global_step": 405924, "epoch": 4890} {"train_loss": -26.473058700561523, "global_step": 405925, "epoch": 4890} {"train_loss": -26.76021385192871, "global_step": 405926, "epoch": 4890} {"train_loss": -27.0146484375, "global_step": 405927, "epoch": 4890} {"train_loss": -26.11749267578125, "global_step": 405928, "epoch": 4890} {"train_loss": -26.27557373046875, "global_step": 405929, "epoch": 4890} {"train_loss": -26.699390411376953, "global_step": 405930, "epoch": 4890} {"train_loss": -26.503692626953125, "global_step": 405931, "epoch": 4890} {"train_loss": -26.466556549072266, "global_step": 405932, "epoch": 4890} {"train_loss": -27.0206298828125, "global_step": 405933, "epoch": 4890} {"train_loss": -26.992752075195312, "global_step": 405934, "epoch": 4890} {"train_loss": -26.786569595336914, "global_step": 405935, "epoch": 4890} {"train_loss": -26.63245964050293, "global_step": 405936, "epoch": 4890} {"train_loss": -26.602628707885742, "global_step": 405937, "epoch": 4890} {"train_loss": -26.933027267456055, "global_step": 405938, "epoch": 4890} {"train_loss": -26.795873641967773, "global_step": 405939, "epoch": 4890} {"train_loss": -26.6556339263916, "global_step": 405940, "epoch": 4890} {"train_loss": -26.964208602905273, "global_step": 405941, "epoch": 4890} {"train_loss": -26.700510025024414, "global_step": 405942, "epoch": 4890} {"train_loss": -26.706104278564453, "global_step": 405943, "epoch": 4890} {"train_loss": -26.944562911987305, "global_step": 405944, "epoch": 4890} {"train_loss": -26.91357421875, "global_step": 405945, "epoch": 4890} {"train_loss": -26.9460506439209, "global_step": 405946, "epoch": 4890} {"train_loss": -27.1617431640625, "global_step": 405947, "epoch": 4890} {"train_loss": -26.35944175720215, "global_step": 405948, "epoch": 4890} {"train_loss": -26.702722549438477, "global_step": 405949, "epoch": 4890} {"train_loss": -26.130414962768555, "global_step": 405950, "epoch": 4890} {"train_loss": -26.864307403564453, "global_step": 405951, "epoch": 4890} {"train_loss": -26.521965670298382, "global_step": 405952, "epoch": 4890, "val_loss": 6623515.0} {"train_loss": -26.26584243774414, "global_step": 405953, "epoch": 4891} {"train_loss": -25.997594833374023, "global_step": 405954, "epoch": 4891} {"train_loss": -26.603418350219727, "global_step": 405955, "epoch": 4891} {"train_loss": -26.05592155456543, "global_step": 405956, "epoch": 4891} {"train_loss": -26.085840225219727, "global_step": 405957, "epoch": 4891} {"train_loss": -25.997526168823242, "global_step": 405958, "epoch": 4891} {"train_loss": -26.278858184814453, "global_step": 405959, "epoch": 4891} {"train_loss": -26.299291610717773, "global_step": 405960, "epoch": 4891} {"train_loss": -26.593158721923828, "global_step": 405961, "epoch": 4891} {"train_loss": -26.087411880493164, "global_step": 405962, "epoch": 4891} {"train_loss": -26.130659103393555, "global_step": 405963, "epoch": 4891} {"train_loss": -26.529052734375, "global_step": 405964, "epoch": 4891} {"train_loss": -26.161962509155273, "global_step": 405965, "epoch": 4891} {"train_loss": -26.51139259338379, "global_step": 405966, "epoch": 4891} {"train_loss": -26.3640079498291, "global_step": 405967, "epoch": 4891} {"train_loss": -26.51323890686035, "global_step": 405968, "epoch": 4891} {"train_loss": -26.565942764282227, "global_step": 405969, "epoch": 4891} {"train_loss": -26.3760986328125, "global_step": 405970, "epoch": 4891} {"train_loss": -26.636035919189453, "global_step": 405971, "epoch": 4891} {"train_loss": -26.6065731048584, "global_step": 405972, "epoch": 4891} {"train_loss": -26.61653709411621, "global_step": 405973, "epoch": 4891} {"train_loss": -26.376449584960938, "global_step": 405974, "epoch": 4891} {"train_loss": -26.974145889282227, "global_step": 405975, "epoch": 4891} {"train_loss": -26.512609481811523, "global_step": 405976, "epoch": 4891} {"train_loss": -26.843652725219727, "global_step": 405977, "epoch": 4891} {"train_loss": -26.568571090698242, "global_step": 405978, "epoch": 4891} {"train_loss": -26.909833908081055, "global_step": 405979, "epoch": 4891} {"train_loss": -26.42679786682129, "global_step": 405980, "epoch": 4891} {"train_loss": -26.653173446655273, "global_step": 405981, "epoch": 4891} {"train_loss": -26.808155059814453, "global_step": 405982, "epoch": 4891} {"train_loss": -27.017499923706055, "global_step": 405983, "epoch": 4891} {"train_loss": -26.624765396118164, "global_step": 405984, "epoch": 4891} {"train_loss": -26.4578857421875, "global_step": 405985, "epoch": 4891} {"train_loss": -26.571430206298828, "global_step": 405986, "epoch": 4891} {"train_loss": -26.406103134155273, "global_step": 405987, "epoch": 4891} {"train_loss": -26.640478134155273, "global_step": 405988, "epoch": 4891} {"train_loss": -26.833532333374023, "global_step": 405989, "epoch": 4891} {"train_loss": -26.53676414489746, "global_step": 405990, "epoch": 4891} {"train_loss": -26.662073135375977, "global_step": 405991, "epoch": 4891} {"train_loss": -26.854589462280273, "global_step": 405992, "epoch": 4891} {"train_loss": -27.181232452392578, "global_step": 405993, "epoch": 4891} {"train_loss": -26.497129440307617, "global_step": 405994, "epoch": 4891} {"train_loss": -26.230985641479492, "global_step": 405995, "epoch": 4891} {"train_loss": -26.702665328979492, "global_step": 405996, "epoch": 4891} {"train_loss": -26.73598289489746, "global_step": 405997, "epoch": 4891} {"train_loss": -26.885501861572266, "global_step": 405998, "epoch": 4891} {"train_loss": -26.529966354370117, "global_step": 405999, "epoch": 4891} {"train_loss": -26.640439987182617, "global_step": 406000, "epoch": 4891} {"train_loss": -26.90460205078125, "global_step": 406001, "epoch": 4891} {"train_loss": -27.078933715820312, "global_step": 406002, "epoch": 4891} {"train_loss": -26.90015983581543, "global_step": 406003, "epoch": 4891} {"train_loss": -27.066884994506836, "global_step": 406004, "epoch": 4891} {"train_loss": -26.440235137939453, "global_step": 406005, "epoch": 4891} {"train_loss": -27.309167861938477, "global_step": 406006, "epoch": 4891} {"train_loss": -26.690753936767578, "global_step": 406007, "epoch": 4891} {"train_loss": -26.5716609954834, "global_step": 406008, "epoch": 4891} {"train_loss": -26.911840438842773, "global_step": 406009, "epoch": 4891} {"train_loss": -26.527790069580078, "global_step": 406010, "epoch": 4891} {"train_loss": -27.12286376953125, "global_step": 406011, "epoch": 4891} {"train_loss": -26.731836318969727, "global_step": 406012, "epoch": 4891} {"train_loss": -26.62418556213379, "global_step": 406013, "epoch": 4891} {"train_loss": -27.06031608581543, "global_step": 406014, "epoch": 4891} {"train_loss": -26.628681182861328, "global_step": 406015, "epoch": 4891} {"train_loss": -26.922006607055664, "global_step": 406016, "epoch": 4891} {"train_loss": -26.72262954711914, "global_step": 406017, "epoch": 4891} {"train_loss": -27.316009521484375, "global_step": 406018, "epoch": 4891} {"train_loss": -26.61089515686035, "global_step": 406019, "epoch": 4891} {"train_loss": -26.73261833190918, "global_step": 406020, "epoch": 4891} {"train_loss": -26.964130401611328, "global_step": 406021, "epoch": 4891} {"train_loss": -26.71728515625, "global_step": 406022, "epoch": 4891} {"train_loss": -26.58479118347168, "global_step": 406023, "epoch": 4891} {"train_loss": -26.76837158203125, "global_step": 406024, "epoch": 4891} {"train_loss": -26.460956573486328, "global_step": 406025, "epoch": 4891} {"train_loss": -26.59846305847168, "global_step": 406026, "epoch": 4891} {"train_loss": -26.5925350189209, "global_step": 406027, "epoch": 4891} {"train_loss": -26.754703521728516, "global_step": 406028, "epoch": 4891} {"train_loss": -26.675580978393555, "global_step": 406029, "epoch": 4891} {"train_loss": -26.678497314453125, "global_step": 406030, "epoch": 4891} {"train_loss": -26.69146728515625, "global_step": 406031, "epoch": 4891} {"train_loss": -26.902729034423828, "global_step": 406032, "epoch": 4891} {"train_loss": -26.4011173248291, "global_step": 406033, "epoch": 4891} {"train_loss": -26.598657608032227, "global_step": 406034, "epoch": 4891} {"train_loss": -26.613764268806182, "global_step": 406035, "epoch": 4891, "val_loss": 6725728.0} {"train_loss": -23.33062744140625, "global_step": 406036, "epoch": 4892} {"train_loss": -20.12436294555664, "global_step": 406037, "epoch": 4892} {"train_loss": -24.20366859436035, "global_step": 406038, "epoch": 4892} {"train_loss": -24.90371322631836, "global_step": 406039, "epoch": 4892} {"train_loss": -24.151723861694336, "global_step": 406040, "epoch": 4892} {"train_loss": -24.364002227783203, "global_step": 406041, "epoch": 4892} {"train_loss": -23.362485885620117, "global_step": 406042, "epoch": 4892} {"train_loss": -25.24072265625, "global_step": 406043, "epoch": 4892} {"train_loss": -24.645830154418945, "global_step": 406044, "epoch": 4892} {"train_loss": -24.670225143432617, "global_step": 406045, "epoch": 4892} {"train_loss": -25.54281997680664, "global_step": 406046, "epoch": 4892} {"train_loss": -25.1704044342041, "global_step": 406047, "epoch": 4892} {"train_loss": -25.320032119750977, "global_step": 406048, "epoch": 4892} {"train_loss": -25.508085250854492, "global_step": 406049, "epoch": 4892} {"train_loss": -25.38954734802246, "global_step": 406050, "epoch": 4892} {"train_loss": -25.886219024658203, "global_step": 406051, "epoch": 4892} {"train_loss": -25.614643096923828, "global_step": 406052, "epoch": 4892} {"train_loss": -25.5777587890625, "global_step": 406053, "epoch": 4892} {"train_loss": -25.87055015563965, "global_step": 406054, "epoch": 4892} {"train_loss": -25.393207550048828, "global_step": 406055, "epoch": 4892} {"train_loss": -25.62420082092285, "global_step": 406056, "epoch": 4892} {"train_loss": -25.868106842041016, "global_step": 406057, "epoch": 4892} {"train_loss": -26.038379669189453, "global_step": 406058, "epoch": 4892} {"train_loss": -26.070404052734375, "global_step": 406059, "epoch": 4892} {"train_loss": -25.628875732421875, "global_step": 406060, "epoch": 4892} {"train_loss": -25.84552574157715, "global_step": 406061, "epoch": 4892} {"train_loss": -26.1522274017334, "global_step": 406062, "epoch": 4892} {"train_loss": -26.143701553344727, "global_step": 406063, "epoch": 4892} {"train_loss": -25.83795738220215, "global_step": 406064, "epoch": 4892} {"train_loss": -26.05474281311035, "global_step": 406065, "epoch": 4892} {"train_loss": -26.2086238861084, "global_step": 406066, "epoch": 4892} {"train_loss": -26.206212997436523, "global_step": 406067, "epoch": 4892} {"train_loss": -26.20548439025879, "global_step": 406068, "epoch": 4892} {"train_loss": -26.05571937561035, "global_step": 406069, "epoch": 4892} {"train_loss": -26.229156494140625, "global_step": 406070, "epoch": 4892} {"train_loss": -26.49863052368164, "global_step": 406071, "epoch": 4892} {"train_loss": -26.53523826599121, "global_step": 406072, "epoch": 4892} {"train_loss": -26.56805419921875, "global_step": 406073, "epoch": 4892} {"train_loss": -26.184345245361328, "global_step": 406074, "epoch": 4892} {"train_loss": -26.37385368347168, "global_step": 406075, "epoch": 4892} {"train_loss": -26.329496383666992, "global_step": 406076, "epoch": 4892} {"train_loss": -26.416793823242188, "global_step": 406077, "epoch": 4892} {"train_loss": -26.403425216674805, "global_step": 406078, "epoch": 4892} {"train_loss": -26.529489517211914, "global_step": 406079, "epoch": 4892} {"train_loss": -26.45539665222168, "global_step": 406080, "epoch": 4892} {"train_loss": -26.78568458557129, "global_step": 406081, "epoch": 4892} {"train_loss": -26.674219131469727, "global_step": 406082, "epoch": 4892} {"train_loss": -26.67168617248535, "global_step": 406083, "epoch": 4892} {"train_loss": -26.736892700195312, "global_step": 406084, "epoch": 4892} {"train_loss": -26.94742774963379, "global_step": 406085, "epoch": 4892} {"train_loss": -26.38079833984375, "global_step": 406086, "epoch": 4892} {"train_loss": -26.481861114501953, "global_step": 406087, "epoch": 4892} {"train_loss": -26.32172966003418, "global_step": 406088, "epoch": 4892} {"train_loss": -26.703418731689453, "global_step": 406089, "epoch": 4892} {"train_loss": -26.645221710205078, "global_step": 406090, "epoch": 4892} {"train_loss": -26.661426544189453, "global_step": 406091, "epoch": 4892} {"train_loss": -26.712326049804688, "global_step": 406092, "epoch": 4892} {"train_loss": -26.62334632873535, "global_step": 406093, "epoch": 4892} {"train_loss": -26.63751792907715, "global_step": 406094, "epoch": 4892} {"train_loss": -26.720661163330078, "global_step": 406095, "epoch": 4892} {"train_loss": -26.745283126831055, "global_step": 406096, "epoch": 4892} {"train_loss": -26.1293888092041, "global_step": 406097, "epoch": 4892} {"train_loss": -26.32465934753418, "global_step": 406098, "epoch": 4892} {"train_loss": -26.291040420532227, "global_step": 406099, "epoch": 4892} {"train_loss": -26.1790771484375, "global_step": 406100, "epoch": 4892} {"train_loss": -26.299936294555664, "global_step": 406101, "epoch": 4892} {"train_loss": -26.779706954956055, "global_step": 406102, "epoch": 4892} {"train_loss": -26.534896850585938, "global_step": 406103, "epoch": 4892} {"train_loss": -26.621597290039062, "global_step": 406104, "epoch": 4892} {"train_loss": -26.752735137939453, "global_step": 406105, "epoch": 4892} {"train_loss": -26.245136260986328, "global_step": 406106, "epoch": 4892} {"train_loss": -26.79695701599121, "global_step": 406107, "epoch": 4892} {"train_loss": -26.532806396484375, "global_step": 406108, "epoch": 4892} {"train_loss": -26.73957633972168, "global_step": 406109, "epoch": 4892} {"train_loss": -26.557458877563477, "global_step": 406110, "epoch": 4892} {"train_loss": -26.73676109313965, "global_step": 406111, "epoch": 4892} {"train_loss": -26.69841957092285, "global_step": 406112, "epoch": 4892} {"train_loss": -26.87810707092285, "global_step": 406113, "epoch": 4892} {"train_loss": -26.65178871154785, "global_step": 406114, "epoch": 4892} {"train_loss": -26.59644889831543, "global_step": 406115, "epoch": 4892} {"train_loss": -26.90628433227539, "global_step": 406116, "epoch": 4892} {"train_loss": -26.63752555847168, "global_step": 406117, "epoch": 4892} {"train_loss": -26.035006189920818, "global_step": 406118, "epoch": 4892, "val_loss": 6711887.0} {"train_loss": -25.871246337890625, "global_step": 406119, "epoch": 4893} {"train_loss": -26.4982967376709, "global_step": 406120, "epoch": 4893} {"train_loss": -26.762836456298828, "global_step": 406121, "epoch": 4893} {"train_loss": -26.52739906311035, "global_step": 406122, "epoch": 4893} {"train_loss": -26.16473388671875, "global_step": 406123, "epoch": 4893} {"train_loss": -26.609378814697266, "global_step": 406124, "epoch": 4893} {"train_loss": -26.621078491210938, "global_step": 406125, "epoch": 4893} {"train_loss": -26.182586669921875, "global_step": 406126, "epoch": 4893} {"train_loss": -26.78900718688965, "global_step": 406127, "epoch": 4893} {"train_loss": -26.646411895751953, "global_step": 406128, "epoch": 4893} {"train_loss": -26.44803810119629, "global_step": 406129, "epoch": 4893} {"train_loss": -26.2022647857666, "global_step": 406130, "epoch": 4893} {"train_loss": -26.65888023376465, "global_step": 406131, "epoch": 4893} {"train_loss": -26.284955978393555, "global_step": 406132, "epoch": 4893} {"train_loss": -26.519943237304688, "global_step": 406133, "epoch": 4893} {"train_loss": -26.8854923248291, "global_step": 406134, "epoch": 4893} {"train_loss": -26.886999130249023, "global_step": 406135, "epoch": 4893} {"train_loss": -26.634307861328125, "global_step": 406136, "epoch": 4893} {"train_loss": -26.446826934814453, "global_step": 406137, "epoch": 4893} {"train_loss": -26.706708908081055, "global_step": 406138, "epoch": 4893} {"train_loss": -26.17832374572754, "global_step": 406139, "epoch": 4893} {"train_loss": -26.68885612487793, "global_step": 406140, "epoch": 4893} {"train_loss": -26.835559844970703, "global_step": 406141, "epoch": 4893} {"train_loss": -26.68851089477539, "global_step": 406142, "epoch": 4893} {"train_loss": -26.75226402282715, "global_step": 406143, "epoch": 4893} {"train_loss": -26.702484130859375, "global_step": 406144, "epoch": 4893} {"train_loss": -26.65057373046875, "global_step": 406145, "epoch": 4893} {"train_loss": -26.300458908081055, "global_step": 406146, "epoch": 4893} {"train_loss": -26.442480087280273, "global_step": 406147, "epoch": 4893} {"train_loss": -26.713653564453125, "global_step": 406148, "epoch": 4893} {"train_loss": -26.73638343811035, "global_step": 406149, "epoch": 4893} {"train_loss": -26.751935958862305, "global_step": 406150, "epoch": 4893} {"train_loss": -26.755176544189453, "global_step": 406151, "epoch": 4893} {"train_loss": -26.916259765625, "global_step": 406152, "epoch": 4893} {"train_loss": -26.396106719970703, "global_step": 406153, "epoch": 4893} {"train_loss": -26.80615234375, "global_step": 406154, "epoch": 4893} {"train_loss": -26.80604362487793, "global_step": 406155, "epoch": 4893} {"train_loss": -26.574975967407227, "global_step": 406156, "epoch": 4893} {"train_loss": -26.800256729125977, "global_step": 406157, "epoch": 4893} {"train_loss": -26.45602798461914, "global_step": 406158, "epoch": 4893} {"train_loss": -26.90313720703125, "global_step": 406159, "epoch": 4893} {"train_loss": -26.475339889526367, "global_step": 406160, "epoch": 4893} {"train_loss": -26.92176628112793, "global_step": 406161, "epoch": 4893} {"train_loss": -26.616613388061523, "global_step": 406162, "epoch": 4893} {"train_loss": -26.54656410217285, "global_step": 406163, "epoch": 4893} {"train_loss": -26.68824577331543, "global_step": 406164, "epoch": 4893} {"train_loss": -26.71162223815918, "global_step": 406165, "epoch": 4893} {"train_loss": -26.529403686523438, "global_step": 406166, "epoch": 4893} {"train_loss": -26.881805419921875, "global_step": 406167, "epoch": 4893} {"train_loss": -26.515073776245117, "global_step": 406168, "epoch": 4893} {"train_loss": -26.393310546875, "global_step": 406169, "epoch": 4893} {"train_loss": -26.662769317626953, "global_step": 406170, "epoch": 4893} {"train_loss": -26.652429580688477, "global_step": 406171, "epoch": 4893} {"train_loss": -27.002334594726562, "global_step": 406172, "epoch": 4893} {"train_loss": -26.57808494567871, "global_step": 406173, "epoch": 4893} {"train_loss": -26.527379989624023, "global_step": 406174, "epoch": 4893} {"train_loss": -26.53558349609375, "global_step": 406175, "epoch": 4893} {"train_loss": -26.836374282836914, "global_step": 406176, "epoch": 4893} {"train_loss": -26.797321319580078, "global_step": 406177, "epoch": 4893} {"train_loss": -26.711963653564453, "global_step": 406178, "epoch": 4893} {"train_loss": -26.397375106811523, "global_step": 406179, "epoch": 4893} {"train_loss": -26.62534523010254, "global_step": 406180, "epoch": 4893} {"train_loss": -26.570959091186523, "global_step": 406181, "epoch": 4893} {"train_loss": -26.745868682861328, "global_step": 406182, "epoch": 4893} {"train_loss": -26.560592651367188, "global_step": 406183, "epoch": 4893} {"train_loss": -26.709613800048828, "global_step": 406184, "epoch": 4893} {"train_loss": -27.26926612854004, "global_step": 406185, "epoch": 4893} {"train_loss": -26.561498641967773, "global_step": 406186, "epoch": 4893} {"train_loss": -26.770299911499023, "global_step": 406187, "epoch": 4893} {"train_loss": -26.11615562438965, "global_step": 406188, "epoch": 4893} {"train_loss": -26.373117446899414, "global_step": 406189, "epoch": 4893} {"train_loss": -26.396921157836914, "global_step": 406190, "epoch": 4893} {"train_loss": -26.585676193237305, "global_step": 406191, "epoch": 4893} {"train_loss": -26.74073600769043, "global_step": 406192, "epoch": 4893} {"train_loss": -26.982816696166992, "global_step": 406193, "epoch": 4893} {"train_loss": -27.0889949798584, "global_step": 406194, "epoch": 4893} {"train_loss": -26.575042724609375, "global_step": 406195, "epoch": 4893} {"train_loss": -26.791763305664062, "global_step": 406196, "epoch": 4893} {"train_loss": -26.965377807617188, "global_step": 406197, "epoch": 4893} {"train_loss": -26.862390518188477, "global_step": 406198, "epoch": 4893} {"train_loss": -26.9047794342041, "global_step": 406199, "epoch": 4893} {"train_loss": -26.760894775390625, "global_step": 406200, "epoch": 4893} {"train_loss": -26.63055923186153, "global_step": 406201, "epoch": 4893, "val_loss": 6665960.0} {"train_loss": -26.539081573486328, "global_step": 406202, "epoch": 4894} {"train_loss": -26.441511154174805, "global_step": 406203, "epoch": 4894} {"train_loss": -26.52308464050293, "global_step": 406204, "epoch": 4894} {"train_loss": -26.076879501342773, "global_step": 406205, "epoch": 4894} {"train_loss": -26.118453979492188, "global_step": 406206, "epoch": 4894} {"train_loss": -26.223302841186523, "global_step": 406207, "epoch": 4894} {"train_loss": -26.347700119018555, "global_step": 406208, "epoch": 4894} {"train_loss": -26.117395401000977, "global_step": 406209, "epoch": 4894} {"train_loss": -26.804147720336914, "global_step": 406210, "epoch": 4894} {"train_loss": -26.08951759338379, "global_step": 406211, "epoch": 4894} {"train_loss": -26.290027618408203, "global_step": 406212, "epoch": 4894} {"train_loss": -26.287031173706055, "global_step": 406213, "epoch": 4894} {"train_loss": -25.979894638061523, "global_step": 406214, "epoch": 4894} {"train_loss": -26.237741470336914, "global_step": 406215, "epoch": 4894} {"train_loss": -26.070409774780273, "global_step": 406216, "epoch": 4894} {"train_loss": -26.9085636138916, "global_step": 406217, "epoch": 4894} {"train_loss": -26.290695190429688, "global_step": 406218, "epoch": 4894} {"train_loss": -26.436559677124023, "global_step": 406219, "epoch": 4894} {"train_loss": -26.640356063842773, "global_step": 406220, "epoch": 4894} {"train_loss": -26.727563858032227, "global_step": 406221, "epoch": 4894} {"train_loss": -26.64253044128418, "global_step": 406222, "epoch": 4894} {"train_loss": -26.623472213745117, "global_step": 406223, "epoch": 4894} {"train_loss": -26.205121994018555, "global_step": 406224, "epoch": 4894} {"train_loss": -26.552371978759766, "global_step": 406225, "epoch": 4894} {"train_loss": -26.5880126953125, "global_step": 406226, "epoch": 4894} {"train_loss": -26.799869537353516, "global_step": 406227, "epoch": 4894} {"train_loss": -26.569448471069336, "global_step": 406228, "epoch": 4894} {"train_loss": -26.665393829345703, "global_step": 406229, "epoch": 4894} {"train_loss": -26.478351593017578, "global_step": 406230, "epoch": 4894} {"train_loss": -26.388853073120117, "global_step": 406231, "epoch": 4894} {"train_loss": -26.5410213470459, "global_step": 406232, "epoch": 4894} {"train_loss": -26.1982479095459, "global_step": 406233, "epoch": 4894} {"train_loss": -26.165576934814453, "global_step": 406234, "epoch": 4894} {"train_loss": -26.542081832885742, "global_step": 406235, "epoch": 4894} {"train_loss": -26.285192489624023, "global_step": 406236, "epoch": 4894} {"train_loss": -26.97176170349121, "global_step": 406237, "epoch": 4894} {"train_loss": -26.706708908081055, "global_step": 406238, "epoch": 4894} {"train_loss": -26.690351486206055, "global_step": 406239, "epoch": 4894} {"train_loss": -26.45493507385254, "global_step": 406240, "epoch": 4894} {"train_loss": -26.554906845092773, "global_step": 406241, "epoch": 4894} {"train_loss": -26.792104721069336, "global_step": 406242, "epoch": 4894} {"train_loss": -26.80482292175293, "global_step": 406243, "epoch": 4894} {"train_loss": -26.538888931274414, "global_step": 406244, "epoch": 4894} {"train_loss": -26.988271713256836, "global_step": 406245, "epoch": 4894} {"train_loss": -26.516407012939453, "global_step": 406246, "epoch": 4894} {"train_loss": -26.9342041015625, "global_step": 406247, "epoch": 4894} {"train_loss": -26.773406982421875, "global_step": 406248, "epoch": 4894} {"train_loss": -26.779525756835938, "global_step": 406249, "epoch": 4894} {"train_loss": -27.20819091796875, "global_step": 406250, "epoch": 4894} {"train_loss": -26.8802547454834, "global_step": 406251, "epoch": 4894} {"train_loss": -26.845502853393555, "global_step": 406252, "epoch": 4894} {"train_loss": -26.689130783081055, "global_step": 406253, "epoch": 4894} {"train_loss": -26.452672958374023, "global_step": 406254, "epoch": 4894} {"train_loss": -26.58492088317871, "global_step": 406255, "epoch": 4894} {"train_loss": -26.53981590270996, "global_step": 406256, "epoch": 4894} {"train_loss": -27.15242576599121, "global_step": 406257, "epoch": 4894} {"train_loss": -26.439245223999023, "global_step": 406258, "epoch": 4894} {"train_loss": -26.736108779907227, "global_step": 406259, "epoch": 4894} {"train_loss": -27.041913986206055, "global_step": 406260, "epoch": 4894} {"train_loss": -26.88407325744629, "global_step": 406261, "epoch": 4894} {"train_loss": -26.03486442565918, "global_step": 406262, "epoch": 4894} {"train_loss": -26.97507667541504, "global_step": 406263, "epoch": 4894} {"train_loss": -26.774688720703125, "global_step": 406264, "epoch": 4894} {"train_loss": -26.4268856048584, "global_step": 406265, "epoch": 4894} {"train_loss": -26.740543365478516, "global_step": 406266, "epoch": 4894} {"train_loss": -26.6803035736084, "global_step": 406267, "epoch": 4894} {"train_loss": -26.828540802001953, "global_step": 406268, "epoch": 4894} {"train_loss": -26.778472900390625, "global_step": 406269, "epoch": 4894} {"train_loss": -26.892499923706055, "global_step": 406270, "epoch": 4894} {"train_loss": -26.637481689453125, "global_step": 406271, "epoch": 4894} {"train_loss": -26.446393966674805, "global_step": 406272, "epoch": 4894} {"train_loss": -26.993505477905273, "global_step": 406273, "epoch": 4894} {"train_loss": -26.970808029174805, "global_step": 406274, "epoch": 4894} {"train_loss": -27.05561637878418, "global_step": 406275, "epoch": 4894} {"train_loss": -26.53779411315918, "global_step": 406276, "epoch": 4894} {"train_loss": -27.207752227783203, "global_step": 406277, "epoch": 4894} {"train_loss": -26.717639923095703, "global_step": 406278, "epoch": 4894} {"train_loss": -26.581289291381836, "global_step": 406279, "epoch": 4894} {"train_loss": -26.34168815612793, "global_step": 406280, "epoch": 4894} {"train_loss": -26.845428466796875, "global_step": 406281, "epoch": 4894} {"train_loss": -26.70224380493164, "global_step": 406282, "epoch": 4894} {"train_loss": -26.658655166625977, "global_step": 406283, "epoch": 4894} {"train_loss": -26.60192236842879, "global_step": 406284, "epoch": 4894, "val_loss": 6791356.5} {"train_loss": -26.617889404296875, "global_step": 406285, "epoch": 4895} {"train_loss": -26.455434799194336, "global_step": 406286, "epoch": 4895} {"train_loss": -26.414093017578125, "global_step": 406287, "epoch": 4895} {"train_loss": -26.29483413696289, "global_step": 406288, "epoch": 4895} {"train_loss": -26.55608558654785, "global_step": 406289, "epoch": 4895} {"train_loss": -26.537214279174805, "global_step": 406290, "epoch": 4895} {"train_loss": -26.565185546875, "global_step": 406291, "epoch": 4895} {"train_loss": -26.715412139892578, "global_step": 406292, "epoch": 4895} {"train_loss": -26.230695724487305, "global_step": 406293, "epoch": 4895} {"train_loss": -26.47730827331543, "global_step": 406294, "epoch": 4895} {"train_loss": -26.567163467407227, "global_step": 406295, "epoch": 4895} {"train_loss": -26.381916046142578, "global_step": 406296, "epoch": 4895} {"train_loss": -26.574743270874023, "global_step": 406297, "epoch": 4895} {"train_loss": -26.358814239501953, "global_step": 406298, "epoch": 4895} {"train_loss": -26.498987197875977, "global_step": 406299, "epoch": 4895} {"train_loss": -26.793323516845703, "global_step": 406300, "epoch": 4895} {"train_loss": -26.642602920532227, "global_step": 406301, "epoch": 4895} {"train_loss": -26.588581085205078, "global_step": 406302, "epoch": 4895} {"train_loss": -26.69196891784668, "global_step": 406303, "epoch": 4895} {"train_loss": -26.731037139892578, "global_step": 406304, "epoch": 4895} {"train_loss": -26.476659774780273, "global_step": 406305, "epoch": 4895} {"train_loss": -26.17534828186035, "global_step": 406306, "epoch": 4895} {"train_loss": -26.64313316345215, "global_step": 406307, "epoch": 4895} {"train_loss": -26.758121490478516, "global_step": 406308, "epoch": 4895} {"train_loss": -26.9077205657959, "global_step": 406309, "epoch": 4895} {"train_loss": -26.74321937561035, "global_step": 406310, "epoch": 4895} {"train_loss": -26.500574111938477, "global_step": 406311, "epoch": 4895} {"train_loss": -26.652624130249023, "global_step": 406312, "epoch": 4895} {"train_loss": -26.807336807250977, "global_step": 406313, "epoch": 4895} {"train_loss": -26.787424087524414, "global_step": 406314, "epoch": 4895} {"train_loss": -26.557958602905273, "global_step": 406315, "epoch": 4895} {"train_loss": -26.337499618530273, "global_step": 406316, "epoch": 4895} {"train_loss": -26.705163955688477, "global_step": 406317, "epoch": 4895} {"train_loss": -26.808988571166992, "global_step": 406318, "epoch": 4895} {"train_loss": -27.218250274658203, "global_step": 406319, "epoch": 4895} {"train_loss": -27.104333877563477, "global_step": 406320, "epoch": 4895} {"train_loss": -26.796844482421875, "global_step": 406321, "epoch": 4895} {"train_loss": -26.631925582885742, "global_step": 406322, "epoch": 4895} {"train_loss": -26.63043212890625, "global_step": 406323, "epoch": 4895} {"train_loss": -27.23187828063965, "global_step": 406324, "epoch": 4895} {"train_loss": -26.385419845581055, "global_step": 406325, "epoch": 4895} {"train_loss": -26.567840576171875, "global_step": 406326, "epoch": 4895} {"train_loss": -27.13751220703125, "global_step": 406327, "epoch": 4895} {"train_loss": -26.66900062561035, "global_step": 406328, "epoch": 4895} {"train_loss": -26.3746395111084, "global_step": 406329, "epoch": 4895} {"train_loss": -26.68568229675293, "global_step": 406330, "epoch": 4895} {"train_loss": -26.475921630859375, "global_step": 406331, "epoch": 4895} {"train_loss": -26.5456600189209, "global_step": 406332, "epoch": 4895} {"train_loss": -26.654150009155273, "global_step": 406333, "epoch": 4895} {"train_loss": -26.515201568603516, "global_step": 406334, "epoch": 4895} {"train_loss": -26.668310165405273, "global_step": 406335, "epoch": 4895} {"train_loss": -26.595050811767578, "global_step": 406336, "epoch": 4895} {"train_loss": -26.79230308532715, "global_step": 406337, "epoch": 4895} {"train_loss": -26.859546661376953, "global_step": 406338, "epoch": 4895} {"train_loss": -26.871984481811523, "global_step": 406339, "epoch": 4895} {"train_loss": -26.482351303100586, "global_step": 406340, "epoch": 4895} {"train_loss": -26.5201473236084, "global_step": 406341, "epoch": 4895} {"train_loss": -26.70960807800293, "global_step": 406342, "epoch": 4895} {"train_loss": -26.836673736572266, "global_step": 406343, "epoch": 4895} {"train_loss": -26.97784423828125, "global_step": 406344, "epoch": 4895} {"train_loss": -26.738996505737305, "global_step": 406345, "epoch": 4895} {"train_loss": -26.523733139038086, "global_step": 406346, "epoch": 4895} {"train_loss": -26.507261276245117, "global_step": 406347, "epoch": 4895} {"train_loss": -27.044025421142578, "global_step": 406348, "epoch": 4895} {"train_loss": -26.718814849853516, "global_step": 406349, "epoch": 4895} {"train_loss": -26.96101188659668, "global_step": 406350, "epoch": 4895} {"train_loss": -26.61382484436035, "global_step": 406351, "epoch": 4895} {"train_loss": -26.872604370117188, "global_step": 406352, "epoch": 4895} {"train_loss": -26.521106719970703, "global_step": 406353, "epoch": 4895} {"train_loss": -26.698028564453125, "global_step": 406354, "epoch": 4895} {"train_loss": -26.63221549987793, "global_step": 406355, "epoch": 4895} {"train_loss": -26.73829460144043, "global_step": 406356, "epoch": 4895} {"train_loss": -26.695653915405273, "global_step": 406357, "epoch": 4895} {"train_loss": -26.72100830078125, "global_step": 406358, "epoch": 4895} {"train_loss": -26.765539169311523, "global_step": 406359, "epoch": 4895} {"train_loss": -26.68816566467285, "global_step": 406360, "epoch": 4895} {"train_loss": -26.931583404541016, "global_step": 406361, "epoch": 4895} {"train_loss": -26.890928268432617, "global_step": 406362, "epoch": 4895} {"train_loss": -26.758987426757812, "global_step": 406363, "epoch": 4895} {"train_loss": -26.970874786376953, "global_step": 406364, "epoch": 4895} {"train_loss": -26.77396011352539, "global_step": 406365, "epoch": 4895} {"train_loss": -26.68863296508789, "global_step": 406366, "epoch": 4895} {"train_loss": -26.65839896144637, "global_step": 406367, "epoch": 4895, "val_loss": 6672104.0} {"train_loss": -26.32899284362793, "global_step": 406368, "epoch": 4896} {"train_loss": -26.833240509033203, "global_step": 406369, "epoch": 4896} {"train_loss": -26.24994468688965, "global_step": 406370, "epoch": 4896} {"train_loss": -26.560230255126953, "global_step": 406371, "epoch": 4896} {"train_loss": -26.189451217651367, "global_step": 406372, "epoch": 4896} {"train_loss": -26.286832809448242, "global_step": 406373, "epoch": 4896} {"train_loss": -26.2477970123291, "global_step": 406374, "epoch": 4896} {"train_loss": -26.248458862304688, "global_step": 406375, "epoch": 4896} {"train_loss": -26.84344482421875, "global_step": 406376, "epoch": 4896} {"train_loss": -26.569976806640625, "global_step": 406377, "epoch": 4896} {"train_loss": -26.570770263671875, "global_step": 406378, "epoch": 4896} {"train_loss": -26.366987228393555, "global_step": 406379, "epoch": 4896} {"train_loss": -26.42144203186035, "global_step": 406380, "epoch": 4896} {"train_loss": -26.318756103515625, "global_step": 406381, "epoch": 4896} {"train_loss": -26.510379791259766, "global_step": 406382, "epoch": 4896} {"train_loss": -26.48809242248535, "global_step": 406383, "epoch": 4896} {"train_loss": -26.787647247314453, "global_step": 406384, "epoch": 4896} {"train_loss": -26.5971736907959, "global_step": 406385, "epoch": 4896} {"train_loss": -26.660297393798828, "global_step": 406386, "epoch": 4896} {"train_loss": -26.52001953125, "global_step": 406387, "epoch": 4896} {"train_loss": -26.29262351989746, "global_step": 406388, "epoch": 4896} {"train_loss": -26.538406372070312, "global_step": 406389, "epoch": 4896} {"train_loss": -26.216184616088867, "global_step": 406390, "epoch": 4896} {"train_loss": -26.415485382080078, "global_step": 406391, "epoch": 4896} {"train_loss": -26.67085838317871, "global_step": 406392, "epoch": 4896} {"train_loss": -26.517969131469727, "global_step": 406393, "epoch": 4896} {"train_loss": -27.08320426940918, "global_step": 406394, "epoch": 4896} {"train_loss": -26.704675674438477, "global_step": 406395, "epoch": 4896} {"train_loss": -26.505634307861328, "global_step": 406396, "epoch": 4896} {"train_loss": -27.064233779907227, "global_step": 406397, "epoch": 4896} {"train_loss": -26.505102157592773, "global_step": 406398, "epoch": 4896} {"train_loss": -26.09122085571289, "global_step": 406399, "epoch": 4896} {"train_loss": -26.9058780670166, "global_step": 406400, "epoch": 4896} {"train_loss": -26.77373695373535, "global_step": 406401, "epoch": 4896} {"train_loss": -26.676624298095703, "global_step": 406402, "epoch": 4896} {"train_loss": -26.742847442626953, "global_step": 406403, "epoch": 4896} {"train_loss": -26.701467514038086, "global_step": 406404, "epoch": 4896} {"train_loss": -26.966068267822266, "global_step": 406405, "epoch": 4896} {"train_loss": -26.806249618530273, "global_step": 406406, "epoch": 4896} {"train_loss": -26.58403968811035, "global_step": 406407, "epoch": 4896} {"train_loss": -26.7642879486084, "global_step": 406408, "epoch": 4896} {"train_loss": -26.787500381469727, "global_step": 406409, "epoch": 4896} {"train_loss": -26.545429229736328, "global_step": 406410, "epoch": 4896} {"train_loss": -26.414167404174805, "global_step": 406411, "epoch": 4896} {"train_loss": -26.630903244018555, "global_step": 406412, "epoch": 4896} {"train_loss": -26.44330406188965, "global_step": 406413, "epoch": 4896} {"train_loss": -26.585729598999023, "global_step": 406414, "epoch": 4896} {"train_loss": -26.88994789123535, "global_step": 406415, "epoch": 4896} {"train_loss": -26.53293800354004, "global_step": 406416, "epoch": 4896} {"train_loss": -26.7768611907959, "global_step": 406417, "epoch": 4896} {"train_loss": -26.560394287109375, "global_step": 406418, "epoch": 4896} {"train_loss": -26.5393123626709, "global_step": 406419, "epoch": 4896} {"train_loss": -26.837427139282227, "global_step": 406420, "epoch": 4896} {"train_loss": -26.887104034423828, "global_step": 406421, "epoch": 4896} {"train_loss": -27.144195556640625, "global_step": 406422, "epoch": 4896} {"train_loss": -26.864517211914062, "global_step": 406423, "epoch": 4896} {"train_loss": -26.685583114624023, "global_step": 406424, "epoch": 4896} {"train_loss": -26.783613204956055, "global_step": 406425, "epoch": 4896} {"train_loss": -26.811309814453125, "global_step": 406426, "epoch": 4896} {"train_loss": -26.6427001953125, "global_step": 406427, "epoch": 4896} {"train_loss": -26.7785701751709, "global_step": 406428, "epoch": 4896} {"train_loss": -26.546247482299805, "global_step": 406429, "epoch": 4896} {"train_loss": -26.482858657836914, "global_step": 406430, "epoch": 4896} {"train_loss": -26.41485023498535, "global_step": 406431, "epoch": 4896} {"train_loss": -26.778940200805664, "global_step": 406432, "epoch": 4896} {"train_loss": -27.087671279907227, "global_step": 406433, "epoch": 4896} {"train_loss": -26.648244857788086, "global_step": 406434, "epoch": 4896} {"train_loss": -27.012104034423828, "global_step": 406435, "epoch": 4896} {"train_loss": -26.8245849609375, "global_step": 406436, "epoch": 4896} {"train_loss": -26.683591842651367, "global_step": 406437, "epoch": 4896} {"train_loss": -26.865619659423828, "global_step": 406438, "epoch": 4896} {"train_loss": -26.628406524658203, "global_step": 406439, "epoch": 4896} {"train_loss": -26.501996994018555, "global_step": 406440, "epoch": 4896} {"train_loss": -27.038293838500977, "global_step": 406441, "epoch": 4896} {"train_loss": -26.87116813659668, "global_step": 406442, "epoch": 4896} {"train_loss": -26.958887100219727, "global_step": 406443, "epoch": 4896} {"train_loss": -26.724409103393555, "global_step": 406444, "epoch": 4896} {"train_loss": -26.997650146484375, "global_step": 406445, "epoch": 4896} {"train_loss": -26.89820671081543, "global_step": 406446, "epoch": 4896} {"train_loss": -26.990802764892578, "global_step": 406447, "epoch": 4896} {"train_loss": -26.6302490234375, "global_step": 406448, "epoch": 4896} {"train_loss": -26.747648239135742, "global_step": 406449, "epoch": 4896} {"train_loss": -26.66181428748441, "global_step": 406450, "epoch": 4896, "val_loss": 6651234.0} {"train_loss": -25.783527374267578, "global_step": 406451, "epoch": 4897} {"train_loss": -25.400278091430664, "global_step": 406452, "epoch": 4897} {"train_loss": -25.823928833007812, "global_step": 406453, "epoch": 4897} {"train_loss": -25.881505966186523, "global_step": 406454, "epoch": 4897} {"train_loss": -26.492944717407227, "global_step": 406455, "epoch": 4897} {"train_loss": -25.951435089111328, "global_step": 406456, "epoch": 4897} {"train_loss": -25.70545768737793, "global_step": 406457, "epoch": 4897} {"train_loss": -25.77012062072754, "global_step": 406458, "epoch": 4897} {"train_loss": -26.623126983642578, "global_step": 406459, "epoch": 4897} {"train_loss": -26.2091121673584, "global_step": 406460, "epoch": 4897} {"train_loss": -26.518787384033203, "global_step": 406461, "epoch": 4897} {"train_loss": -26.474760055541992, "global_step": 406462, "epoch": 4897} {"train_loss": -26.424673080444336, "global_step": 406463, "epoch": 4897} {"train_loss": -26.71233558654785, "global_step": 406464, "epoch": 4897} {"train_loss": -26.22334098815918, "global_step": 406465, "epoch": 4897} {"train_loss": -26.245086669921875, "global_step": 406466, "epoch": 4897} {"train_loss": -26.607709884643555, "global_step": 406467, "epoch": 4897} {"train_loss": -26.084741592407227, "global_step": 406468, "epoch": 4897} {"train_loss": -26.85546875, "global_step": 406469, "epoch": 4897} {"train_loss": -26.470346450805664, "global_step": 406470, "epoch": 4897} {"train_loss": -26.49993896484375, "global_step": 406471, "epoch": 4897} {"train_loss": -26.738737106323242, "global_step": 406472, "epoch": 4897} {"train_loss": -27.172393798828125, "global_step": 406473, "epoch": 4897} {"train_loss": -26.95244789123535, "global_step": 406474, "epoch": 4897} {"train_loss": -26.746509552001953, "global_step": 406475, "epoch": 4897} {"train_loss": -26.6728572845459, "global_step": 406476, "epoch": 4897} {"train_loss": -26.624502182006836, "global_step": 406477, "epoch": 4897} {"train_loss": -26.588605880737305, "global_step": 406478, "epoch": 4897} {"train_loss": -26.594696044921875, "global_step": 406479, "epoch": 4897} {"train_loss": -26.353063583374023, "global_step": 406480, "epoch": 4897} {"train_loss": -26.837583541870117, "global_step": 406481, "epoch": 4897} {"train_loss": -26.68463134765625, "global_step": 406482, "epoch": 4897} {"train_loss": -26.7465877532959, "global_step": 406483, "epoch": 4897} {"train_loss": -26.20709800720215, "global_step": 406484, "epoch": 4897} {"train_loss": -26.81800651550293, "global_step": 406485, "epoch": 4897} {"train_loss": -27.012907028198242, "global_step": 406486, "epoch": 4897} {"train_loss": -26.817951202392578, "global_step": 406487, "epoch": 4897} {"train_loss": -26.950092315673828, "global_step": 406488, "epoch": 4897} {"train_loss": -26.660938262939453, "global_step": 406489, "epoch": 4897} {"train_loss": -26.539569854736328, "global_step": 406490, "epoch": 4897} {"train_loss": -26.57065200805664, "global_step": 406491, "epoch": 4897} {"train_loss": -26.696319580078125, "global_step": 406492, "epoch": 4897} {"train_loss": -26.380157470703125, "global_step": 406493, "epoch": 4897} {"train_loss": -26.26722526550293, "global_step": 406494, "epoch": 4897} {"train_loss": -26.845090866088867, "global_step": 406495, "epoch": 4897} {"train_loss": -26.776702880859375, "global_step": 406496, "epoch": 4897} {"train_loss": -26.90000343322754, "global_step": 406497, "epoch": 4897} {"train_loss": -27.171436309814453, "global_step": 406498, "epoch": 4897} {"train_loss": -26.981674194335938, "global_step": 406499, "epoch": 4897} {"train_loss": -26.688974380493164, "global_step": 406500, "epoch": 4897} {"train_loss": -26.91217041015625, "global_step": 406501, "epoch": 4897} {"train_loss": -26.440673828125, "global_step": 406502, "epoch": 4897} {"train_loss": -26.41117286682129, "global_step": 406503, "epoch": 4897} {"train_loss": -26.41596031188965, "global_step": 406504, "epoch": 4897} {"train_loss": -26.399667739868164, "global_step": 406505, "epoch": 4897} {"train_loss": -26.638574600219727, "global_step": 406506, "epoch": 4897} {"train_loss": -26.930831909179688, "global_step": 406507, "epoch": 4897} {"train_loss": -26.95172119140625, "global_step": 406508, "epoch": 4897} {"train_loss": -26.472946166992188, "global_step": 406509, "epoch": 4897} {"train_loss": -26.669584274291992, "global_step": 406510, "epoch": 4897} {"train_loss": -26.41837501525879, "global_step": 406511, "epoch": 4897} {"train_loss": -26.64778709411621, "global_step": 406512, "epoch": 4897} {"train_loss": -26.641555786132812, "global_step": 406513, "epoch": 4897} {"train_loss": -26.750213623046875, "global_step": 406514, "epoch": 4897} {"train_loss": -26.571088790893555, "global_step": 406515, "epoch": 4897} {"train_loss": -26.615583419799805, "global_step": 406516, "epoch": 4897} {"train_loss": -26.441614151000977, "global_step": 406517, "epoch": 4897} {"train_loss": -26.71270751953125, "global_step": 406518, "epoch": 4897} {"train_loss": -26.844709396362305, "global_step": 406519, "epoch": 4897} {"train_loss": -26.9752140045166, "global_step": 406520, "epoch": 4897} {"train_loss": -26.635345458984375, "global_step": 406521, "epoch": 4897} {"train_loss": -26.427865982055664, "global_step": 406522, "epoch": 4897} {"train_loss": -26.59295082092285, "global_step": 406523, "epoch": 4897} {"train_loss": -26.2244815826416, "global_step": 406524, "epoch": 4897} {"train_loss": -27.025007247924805, "global_step": 406525, "epoch": 4897} {"train_loss": -26.676488876342773, "global_step": 406526, "epoch": 4897} {"train_loss": -26.958288192749023, "global_step": 406527, "epoch": 4897} {"train_loss": -26.743799209594727, "global_step": 406528, "epoch": 4897} {"train_loss": -26.738727569580078, "global_step": 406529, "epoch": 4897} {"train_loss": -26.72486686706543, "global_step": 406530, "epoch": 4897} {"train_loss": -26.99017333984375, "global_step": 406531, "epoch": 4897} {"train_loss": -26.706762313842773, "global_step": 406532, "epoch": 4897} {"train_loss": -26.57497649594962, "global_step": 406533, "epoch": 4897, "val_loss": 6675882.0} {"train_loss": -25.947254180908203, "global_step": 406534, "epoch": 4898} {"train_loss": -26.429357528686523, "global_step": 406535, "epoch": 4898} {"train_loss": -26.47283363342285, "global_step": 406536, "epoch": 4898} {"train_loss": -26.356855392456055, "global_step": 406537, "epoch": 4898} {"train_loss": -26.414297103881836, "global_step": 406538, "epoch": 4898} {"train_loss": -26.58304214477539, "global_step": 406539, "epoch": 4898} {"train_loss": -26.144168853759766, "global_step": 406540, "epoch": 4898} {"train_loss": -26.00116539001465, "global_step": 406541, "epoch": 4898} {"train_loss": -26.31220054626465, "global_step": 406542, "epoch": 4898} {"train_loss": -26.364065170288086, "global_step": 406543, "epoch": 4898} {"train_loss": -26.645002365112305, "global_step": 406544, "epoch": 4898} {"train_loss": -26.837148666381836, "global_step": 406545, "epoch": 4898} {"train_loss": -26.552274703979492, "global_step": 406546, "epoch": 4898} {"train_loss": -26.519439697265625, "global_step": 406547, "epoch": 4898} {"train_loss": -26.45880126953125, "global_step": 406548, "epoch": 4898} {"train_loss": -26.16847038269043, "global_step": 406549, "epoch": 4898} {"train_loss": -26.50419044494629, "global_step": 406550, "epoch": 4898} {"train_loss": -26.338459014892578, "global_step": 406551, "epoch": 4898} {"train_loss": -26.765888214111328, "global_step": 406552, "epoch": 4898} {"train_loss": -26.727985382080078, "global_step": 406553, "epoch": 4898} {"train_loss": -26.465167999267578, "global_step": 406554, "epoch": 4898} {"train_loss": -26.515644073486328, "global_step": 406555, "epoch": 4898} {"train_loss": -26.6108341217041, "global_step": 406556, "epoch": 4898} {"train_loss": -26.61358070373535, "global_step": 406557, "epoch": 4898} {"train_loss": -26.6101016998291, "global_step": 406558, "epoch": 4898} {"train_loss": -26.717334747314453, "global_step": 406559, "epoch": 4898} {"train_loss": -26.717132568359375, "global_step": 406560, "epoch": 4898} {"train_loss": -26.698209762573242, "global_step": 406561, "epoch": 4898} {"train_loss": -26.493844985961914, "global_step": 406562, "epoch": 4898} {"train_loss": -26.580646514892578, "global_step": 406563, "epoch": 4898} {"train_loss": -26.8013858795166, "global_step": 406564, "epoch": 4898} {"train_loss": -26.48894691467285, "global_step": 406565, "epoch": 4898} {"train_loss": -26.874807357788086, "global_step": 406566, "epoch": 4898} {"train_loss": -27.045135498046875, "global_step": 406567, "epoch": 4898} {"train_loss": -26.793149948120117, "global_step": 406568, "epoch": 4898} {"train_loss": -26.729475021362305, "global_step": 406569, "epoch": 4898} {"train_loss": -26.795007705688477, "global_step": 406570, "epoch": 4898} {"train_loss": -26.668054580688477, "global_step": 406571, "epoch": 4898} {"train_loss": -26.677820205688477, "global_step": 406572, "epoch": 4898} {"train_loss": -26.697839736938477, "global_step": 406573, "epoch": 4898} {"train_loss": -26.851612091064453, "global_step": 406574, "epoch": 4898} {"train_loss": -26.809492111206055, "global_step": 406575, "epoch": 4898} {"train_loss": -26.583311080932617, "global_step": 406576, "epoch": 4898} {"train_loss": -26.853424072265625, "global_step": 406577, "epoch": 4898} {"train_loss": -26.7913818359375, "global_step": 406578, "epoch": 4898} {"train_loss": -26.57379150390625, "global_step": 406579, "epoch": 4898} {"train_loss": -26.69830894470215, "global_step": 406580, "epoch": 4898} {"train_loss": -26.840106964111328, "global_step": 406581, "epoch": 4898} {"train_loss": -26.725128173828125, "global_step": 406582, "epoch": 4898} {"train_loss": -27.047040939331055, "global_step": 406583, "epoch": 4898} {"train_loss": -27.038984298706055, "global_step": 406584, "epoch": 4898} {"train_loss": -26.610998153686523, "global_step": 406585, "epoch": 4898} {"train_loss": -26.188947677612305, "global_step": 406586, "epoch": 4898} {"train_loss": -26.283552169799805, "global_step": 406587, "epoch": 4898} {"train_loss": -26.381574630737305, "global_step": 406588, "epoch": 4898} {"train_loss": -26.834903717041016, "global_step": 406589, "epoch": 4898} {"train_loss": -26.658710479736328, "global_step": 406590, "epoch": 4898} {"train_loss": -26.41607666015625, "global_step": 406591, "epoch": 4898} {"train_loss": -26.632568359375, "global_step": 406592, "epoch": 4898} {"train_loss": -26.8553524017334, "global_step": 406593, "epoch": 4898} {"train_loss": -26.551395416259766, "global_step": 406594, "epoch": 4898} {"train_loss": -26.46124839782715, "global_step": 406595, "epoch": 4898} {"train_loss": -26.111989974975586, "global_step": 406596, "epoch": 4898} {"train_loss": -26.906408309936523, "global_step": 406597, "epoch": 4898} {"train_loss": -26.4915828704834, "global_step": 406598, "epoch": 4898} {"train_loss": -26.683643341064453, "global_step": 406599, "epoch": 4898} {"train_loss": -26.851011276245117, "global_step": 406600, "epoch": 4898} {"train_loss": -26.53620719909668, "global_step": 406601, "epoch": 4898} {"train_loss": -27.0632381439209, "global_step": 406602, "epoch": 4898} {"train_loss": -26.584442138671875, "global_step": 406603, "epoch": 4898} {"train_loss": -26.70770835876465, "global_step": 406604, "epoch": 4898} {"train_loss": -26.627527236938477, "global_step": 406605, "epoch": 4898} {"train_loss": -26.6153507232666, "global_step": 406606, "epoch": 4898} {"train_loss": -26.886844635009766, "global_step": 406607, "epoch": 4898} {"train_loss": -27.234302520751953, "global_step": 406608, "epoch": 4898} {"train_loss": -26.74432945251465, "global_step": 406609, "epoch": 4898} {"train_loss": -26.503543853759766, "global_step": 406610, "epoch": 4898} {"train_loss": -26.7907772064209, "global_step": 406611, "epoch": 4898} {"train_loss": -26.581619262695312, "global_step": 406612, "epoch": 4898} {"train_loss": -27.045520782470703, "global_step": 406613, "epoch": 4898} {"train_loss": -26.55506706237793, "global_step": 406614, "epoch": 4898} {"train_loss": -26.554258346557617, "global_step": 406615, "epoch": 4898} {"train_loss": -26.60992992355163, "global_step": 406616, "epoch": 4898, "val_loss": 6589823.0} {"train_loss": -25.21647834777832, "global_step": 406617, "epoch": 4899} {"train_loss": -25.00191307067871, "global_step": 406618, "epoch": 4899} {"train_loss": -25.496732711791992, "global_step": 406619, "epoch": 4899} {"train_loss": -25.4991397857666, "global_step": 406620, "epoch": 4899} {"train_loss": -25.0592098236084, "global_step": 406621, "epoch": 4899} {"train_loss": -25.676172256469727, "global_step": 406622, "epoch": 4899} {"train_loss": -25.879995346069336, "global_step": 406623, "epoch": 4899} {"train_loss": -25.478055953979492, "global_step": 406624, "epoch": 4899} {"train_loss": -25.389358520507812, "global_step": 406625, "epoch": 4899} {"train_loss": -25.231822967529297, "global_step": 406626, "epoch": 4899} {"train_loss": -25.572935104370117, "global_step": 406627, "epoch": 4899} {"train_loss": -25.225088119506836, "global_step": 406628, "epoch": 4899} {"train_loss": -25.489587783813477, "global_step": 406629, "epoch": 4899} {"train_loss": -25.64332389831543, "global_step": 406630, "epoch": 4899} {"train_loss": -25.792133331298828, "global_step": 406631, "epoch": 4899} {"train_loss": -25.809141159057617, "global_step": 406632, "epoch": 4899} {"train_loss": -25.59836769104004, "global_step": 406633, "epoch": 4899} {"train_loss": -26.122791290283203, "global_step": 406634, "epoch": 4899} {"train_loss": -25.984375, "global_step": 406635, "epoch": 4899} {"train_loss": -26.082666397094727, "global_step": 406636, "epoch": 4899} {"train_loss": -25.787458419799805, "global_step": 406637, "epoch": 4899} {"train_loss": -26.29349136352539, "global_step": 406638, "epoch": 4899} {"train_loss": -26.186969757080078, "global_step": 406639, "epoch": 4899} {"train_loss": -26.564462661743164, "global_step": 406640, "epoch": 4899} {"train_loss": -25.834152221679688, "global_step": 406641, "epoch": 4899} {"train_loss": -26.412378311157227, "global_step": 406642, "epoch": 4899} {"train_loss": -25.888717651367188, "global_step": 406643, "epoch": 4899} {"train_loss": -26.1602840423584, "global_step": 406644, "epoch": 4899} {"train_loss": -26.218780517578125, "global_step": 406645, "epoch": 4899} {"train_loss": -26.336668014526367, "global_step": 406646, "epoch": 4899} {"train_loss": -26.05841636657715, "global_step": 406647, "epoch": 4899} {"train_loss": -26.5081844329834, "global_step": 406648, "epoch": 4899} {"train_loss": -26.509733200073242, "global_step": 406649, "epoch": 4899} {"train_loss": -26.32093620300293, "global_step": 406650, "epoch": 4899} {"train_loss": -26.649169921875, "global_step": 406651, "epoch": 4899} {"train_loss": -26.110986709594727, "global_step": 406652, "epoch": 4899} {"train_loss": -26.40473747253418, "global_step": 406653, "epoch": 4899} {"train_loss": -26.423681259155273, "global_step": 406654, "epoch": 4899} {"train_loss": -26.596210479736328, "global_step": 406655, "epoch": 4899} {"train_loss": -26.60296630859375, "global_step": 406656, "epoch": 4899} {"train_loss": -26.748493194580078, "global_step": 406657, "epoch": 4899} {"train_loss": -26.712921142578125, "global_step": 406658, "epoch": 4899} {"train_loss": -26.54068946838379, "global_step": 406659, "epoch": 4899} {"train_loss": -26.749317169189453, "global_step": 406660, "epoch": 4899} {"train_loss": -26.44667625427246, "global_step": 406661, "epoch": 4899} {"train_loss": -26.793188095092773, "global_step": 406662, "epoch": 4899} {"train_loss": -26.64935302734375, "global_step": 406663, "epoch": 4899} {"train_loss": -27.379175186157227, "global_step": 406664, "epoch": 4899} {"train_loss": -26.653589248657227, "global_step": 406665, "epoch": 4899} {"train_loss": -26.88802146911621, "global_step": 406666, "epoch": 4899} {"train_loss": -26.817373275756836, "global_step": 406667, "epoch": 4899} {"train_loss": -26.756818771362305, "global_step": 406668, "epoch": 4899} {"train_loss": -27.113996505737305, "global_step": 406669, "epoch": 4899} {"train_loss": -26.545242309570312, "global_step": 406670, "epoch": 4899} {"train_loss": -26.8227596282959, "global_step": 406671, "epoch": 4899} {"train_loss": -26.256103515625, "global_step": 406672, "epoch": 4899} {"train_loss": -26.597700119018555, "global_step": 406673, "epoch": 4899} {"train_loss": -26.8331241607666, "global_step": 406674, "epoch": 4899} {"train_loss": -26.887710571289062, "global_step": 406675, "epoch": 4899} {"train_loss": -27.044591903686523, "global_step": 406676, "epoch": 4899} {"train_loss": -26.745214462280273, "global_step": 406677, "epoch": 4899} {"train_loss": -26.453031539916992, "global_step": 406678, "epoch": 4899} {"train_loss": -26.692737579345703, "global_step": 406679, "epoch": 4899} {"train_loss": -26.9343318939209, "global_step": 406680, "epoch": 4899} {"train_loss": -26.821386337280273, "global_step": 406681, "epoch": 4899} {"train_loss": -26.46941566467285, "global_step": 406682, "epoch": 4899} {"train_loss": -27.133214950561523, "global_step": 406683, "epoch": 4899} {"train_loss": -26.666540145874023, "global_step": 406684, "epoch": 4899} {"train_loss": -26.882831573486328, "global_step": 406685, "epoch": 4899} {"train_loss": -26.891916275024414, "global_step": 406686, "epoch": 4899} {"train_loss": -26.844913482666016, "global_step": 406687, "epoch": 4899} {"train_loss": -26.6751651763916, "global_step": 406688, "epoch": 4899} {"train_loss": -26.42866325378418, "global_step": 406689, "epoch": 4899} {"train_loss": -26.635778427124023, "global_step": 406690, "epoch": 4899} {"train_loss": -26.627538681030273, "global_step": 406691, "epoch": 4899} {"train_loss": -26.7730712890625, "global_step": 406692, "epoch": 4899} {"train_loss": -26.56312370300293, "global_step": 406693, "epoch": 4899} {"train_loss": -26.891403198242188, "global_step": 406694, "epoch": 4899} {"train_loss": -26.5076847076416, "global_step": 406695, "epoch": 4899} {"train_loss": -26.510757446289062, "global_step": 406696, "epoch": 4899} {"train_loss": -26.9613037109375, "global_step": 406697, "epoch": 4899} {"train_loss": -26.85433006286621, "global_step": 406698, "epoch": 4899} {"train_loss": -26.340499763029168, "global_step": 406699, "epoch": 4899, "val_loss": 6591273.0} {"train_loss": -26.330041885375977, "global_step": 406700, "epoch": 4900} {"train_loss": -26.297407150268555, "global_step": 406701, "epoch": 4900} {"train_loss": -26.69723892211914, "global_step": 406702, "epoch": 4900} {"train_loss": -26.316059112548828, "global_step": 406703, "epoch": 4900} {"train_loss": -25.703901290893555, "global_step": 406704, "epoch": 4900} {"train_loss": -26.17423439025879, "global_step": 406705, "epoch": 4900} {"train_loss": -26.295364379882812, "global_step": 406706, "epoch": 4900} {"train_loss": -26.431964874267578, "global_step": 406707, "epoch": 4900} {"train_loss": -25.883939743041992, "global_step": 406708, "epoch": 4900} {"train_loss": -26.23874855041504, "global_step": 406709, "epoch": 4900} {"train_loss": -26.392053604125977, "global_step": 406710, "epoch": 4900} {"train_loss": -26.385425567626953, "global_step": 406711, "epoch": 4900} {"train_loss": -26.29596519470215, "global_step": 406712, "epoch": 4900} {"train_loss": -26.644088745117188, "global_step": 406713, "epoch": 4900} {"train_loss": -26.563138961791992, "global_step": 406714, "epoch": 4900} {"train_loss": -26.89263916015625, "global_step": 406715, "epoch": 4900} {"train_loss": -26.400205612182617, "global_step": 406716, "epoch": 4900} {"train_loss": -26.599939346313477, "global_step": 406717, "epoch": 4900} {"train_loss": -26.328754425048828, "global_step": 406718, "epoch": 4900} {"train_loss": -26.850555419921875, "global_step": 406719, "epoch": 4900} {"train_loss": -26.58282470703125, "global_step": 406720, "epoch": 4900} {"train_loss": -26.64910888671875, "global_step": 406721, "epoch": 4900} {"train_loss": -26.722211837768555, "global_step": 406722, "epoch": 4900} {"train_loss": -26.548749923706055, "global_step": 406723, "epoch": 4900} {"train_loss": -26.59756851196289, "global_step": 406724, "epoch": 4900} {"train_loss": -26.73434829711914, "global_step": 406725, "epoch": 4900} {"train_loss": -26.877517700195312, "global_step": 406726, "epoch": 4900} {"train_loss": -26.763504028320312, "global_step": 406727, "epoch": 4900} {"train_loss": -26.827707290649414, "global_step": 406728, "epoch": 4900} {"train_loss": -26.87527847290039, "global_step": 406729, "epoch": 4900} {"train_loss": -26.599821090698242, "global_step": 406730, "epoch": 4900} {"train_loss": -26.611572265625, "global_step": 406731, "epoch": 4900} {"train_loss": -26.954761505126953, "global_step": 406732, "epoch": 4900} {"train_loss": -26.562971115112305, "global_step": 406733, "epoch": 4900} {"train_loss": -27.213239669799805, "global_step": 406734, "epoch": 4900} {"train_loss": -26.78850746154785, "global_step": 406735, "epoch": 4900} {"train_loss": -27.07389259338379, "global_step": 406736, "epoch": 4900} {"train_loss": -26.882490158081055, "global_step": 406737, "epoch": 4900} {"train_loss": -26.967878341674805, "global_step": 406738, "epoch": 4900} {"train_loss": -26.78644371032715, "global_step": 406739, "epoch": 4900} {"train_loss": -26.61993980407715, "global_step": 406740, "epoch": 4900} {"train_loss": -26.428693771362305, "global_step": 406741, "epoch": 4900} {"train_loss": -26.710540771484375, "global_step": 406742, "epoch": 4900} {"train_loss": -26.709522247314453, "global_step": 406743, "epoch": 4900} {"train_loss": -26.559463500976562, "global_step": 406744, "epoch": 4900} {"train_loss": -27.178258895874023, "global_step": 406745, "epoch": 4900} {"train_loss": -26.939115524291992, "global_step": 406746, "epoch": 4900} {"train_loss": -26.94080924987793, "global_step": 406747, "epoch": 4900} {"train_loss": -26.535200119018555, "global_step": 406748, "epoch": 4900} {"train_loss": -27.07856559753418, "global_step": 406749, "epoch": 4900} {"train_loss": -27.22586441040039, "global_step": 406750, "epoch": 4900} {"train_loss": -26.70462989807129, "global_step": 406751, "epoch": 4900} {"train_loss": -26.907400131225586, "global_step": 406752, "epoch": 4900} {"train_loss": -26.972265243530273, "global_step": 406753, "epoch": 4900} {"train_loss": -27.011157989501953, "global_step": 406754, "epoch": 4900} {"train_loss": -26.938129425048828, "global_step": 406755, "epoch": 4900} {"train_loss": -27.082361221313477, "global_step": 406756, "epoch": 4900} {"train_loss": -26.898740768432617, "global_step": 406757, "epoch": 4900} {"train_loss": -26.802902221679688, "global_step": 406758, "epoch": 4900} {"train_loss": -26.61695671081543, "global_step": 406759, "epoch": 4900} {"train_loss": -26.908527374267578, "global_step": 406760, "epoch": 4900} {"train_loss": -26.82879066467285, "global_step": 406761, "epoch": 4900} {"train_loss": -26.834314346313477, "global_step": 406762, "epoch": 4900} {"train_loss": -26.975727081298828, "global_step": 406763, "epoch": 4900} {"train_loss": -26.8870906829834, "global_step": 406764, "epoch": 4900} {"train_loss": -27.098285675048828, "global_step": 406765, "epoch": 4900} {"train_loss": -26.780126571655273, "global_step": 406766, "epoch": 4900} {"train_loss": -26.5406494140625, "global_step": 406767, "epoch": 4900} {"train_loss": -26.466455459594727, "global_step": 406768, "epoch": 4900} {"train_loss": -26.24932289123535, "global_step": 406769, "epoch": 4900} {"train_loss": -26.558252334594727, "global_step": 406770, "epoch": 4900} {"train_loss": -26.9088134765625, "global_step": 406771, "epoch": 4900} {"train_loss": -26.738910675048828, "global_step": 406772, "epoch": 4900} {"train_loss": -26.30303955078125, "global_step": 406773, "epoch": 4900} {"train_loss": -26.690322875976562, "global_step": 406774, "epoch": 4900} {"train_loss": -26.88312339782715, "global_step": 406775, "epoch": 4900} {"train_loss": -26.70574378967285, "global_step": 406776, "epoch": 4900} {"train_loss": -26.479251861572266, "global_step": 406777, "epoch": 4900} {"train_loss": -26.078927993774414, "global_step": 406778, "epoch": 4900} {"train_loss": -26.132944107055664, "global_step": 406779, "epoch": 4900} {"train_loss": -26.123350143432617, "global_step": 406780, "epoch": 4900} {"train_loss": -25.870397567749023, "global_step": 406781, "epoch": 4900} {"train_loss": -26.649630902761437, "global_step": 406782, "epoch": 4900, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8181818181818182, "val_loss": 6625089.5} {"train_loss": -26.23261070251465, "global_step": 406783, "epoch": 4901} {"train_loss": -26.188024520874023, "global_step": 406784, "epoch": 4901} {"train_loss": -26.421430587768555, "global_step": 406785, "epoch": 4901} {"train_loss": -26.300199508666992, "global_step": 406786, "epoch": 4901} {"train_loss": -26.427515029907227, "global_step": 406787, "epoch": 4901} {"train_loss": -26.293920516967773, "global_step": 406788, "epoch": 4901} {"train_loss": -26.391096115112305, "global_step": 406789, "epoch": 4901} {"train_loss": -26.367908477783203, "global_step": 406790, "epoch": 4901} {"train_loss": -26.134607315063477, "global_step": 406791, "epoch": 4901} {"train_loss": -26.443862915039062, "global_step": 406792, "epoch": 4901} {"train_loss": -26.518171310424805, "global_step": 406793, "epoch": 4901} {"train_loss": -26.53558921813965, "global_step": 406794, "epoch": 4901} {"train_loss": -26.674219131469727, "global_step": 406795, "epoch": 4901} {"train_loss": -26.359533309936523, "global_step": 406796, "epoch": 4901} {"train_loss": -26.661413192749023, "global_step": 406797, "epoch": 4901} {"train_loss": -26.374597549438477, "global_step": 406798, "epoch": 4901} {"train_loss": -26.211339950561523, "global_step": 406799, "epoch": 4901} {"train_loss": -26.78632164001465, "global_step": 406800, "epoch": 4901} {"train_loss": -26.56035804748535, "global_step": 406801, "epoch": 4901} {"train_loss": -26.391754150390625, "global_step": 406802, "epoch": 4901} {"train_loss": -26.591785430908203, "global_step": 406803, "epoch": 4901} {"train_loss": -26.439355850219727, "global_step": 406804, "epoch": 4901} {"train_loss": -26.642404556274414, "global_step": 406805, "epoch": 4901} {"train_loss": -26.442785263061523, "global_step": 406806, "epoch": 4901} {"train_loss": -26.944067001342773, "global_step": 406807, "epoch": 4901} {"train_loss": -26.227819442749023, "global_step": 406808, "epoch": 4901} {"train_loss": -26.77157974243164, "global_step": 406809, "epoch": 4901} {"train_loss": -26.724328994750977, "global_step": 406810, "epoch": 4901} {"train_loss": -26.8198299407959, "global_step": 406811, "epoch": 4901} {"train_loss": -26.774084091186523, "global_step": 406812, "epoch": 4901} {"train_loss": -26.796152114868164, "global_step": 406813, "epoch": 4901} {"train_loss": -26.768598556518555, "global_step": 406814, "epoch": 4901} {"train_loss": -27.070636749267578, "global_step": 406815, "epoch": 4901} {"train_loss": -26.54767417907715, "global_step": 406816, "epoch": 4901} {"train_loss": -26.5070743560791, "global_step": 406817, "epoch": 4901} {"train_loss": -26.808191299438477, "global_step": 406818, "epoch": 4901} {"train_loss": -26.55390739440918, "global_step": 406819, "epoch": 4901} {"train_loss": -26.972900390625, "global_step": 406820, "epoch": 4901} {"train_loss": -26.666458129882812, "global_step": 406821, "epoch": 4901} {"train_loss": -26.993322372436523, "global_step": 406822, "epoch": 4901} {"train_loss": -26.95990562438965, "global_step": 406823, "epoch": 4901} {"train_loss": -26.539472579956055, "global_step": 406824, "epoch": 4901} {"train_loss": -26.932172775268555, "global_step": 406825, "epoch": 4901} {"train_loss": -27.222829818725586, "global_step": 406826, "epoch": 4901} {"train_loss": -26.50361442565918, "global_step": 406827, "epoch": 4901} {"train_loss": -26.533674240112305, "global_step": 406828, "epoch": 4901} {"train_loss": -26.4058895111084, "global_step": 406829, "epoch": 4901} {"train_loss": -26.3135929107666, "global_step": 406830, "epoch": 4901} {"train_loss": -26.163013458251953, "global_step": 406831, "epoch": 4901} {"train_loss": -25.005847930908203, "global_step": 406832, "epoch": 4901} {"train_loss": -22.591154098510742, "global_step": 406833, "epoch": 4901} {"train_loss": -24.02315330505371, "global_step": 406834, "epoch": 4901} {"train_loss": -25.956043243408203, "global_step": 406835, "epoch": 4901} {"train_loss": -24.5137996673584, "global_step": 406836, "epoch": 4901} {"train_loss": -25.437332153320312, "global_step": 406837, "epoch": 4901} {"train_loss": -25.561630249023438, "global_step": 406838, "epoch": 4901} {"train_loss": -25.531286239624023, "global_step": 406839, "epoch": 4901} {"train_loss": -26.460973739624023, "global_step": 406840, "epoch": 4901} {"train_loss": -25.837186813354492, "global_step": 406841, "epoch": 4901} {"train_loss": -25.86884117126465, "global_step": 406842, "epoch": 4901} {"train_loss": -26.19550895690918, "global_step": 406843, "epoch": 4901} {"train_loss": -26.10914421081543, "global_step": 406844, "epoch": 4901} {"train_loss": -26.302448272705078, "global_step": 406845, "epoch": 4901} {"train_loss": -25.90728759765625, "global_step": 406846, "epoch": 4901} {"train_loss": -26.1735897064209, "global_step": 406847, "epoch": 4901} {"train_loss": -26.03705406188965, "global_step": 406848, "epoch": 4901} {"train_loss": -26.331342697143555, "global_step": 406849, "epoch": 4901} {"train_loss": -26.1208553314209, "global_step": 406850, "epoch": 4901} {"train_loss": -26.185022354125977, "global_step": 406851, "epoch": 4901} {"train_loss": -26.240442276000977, "global_step": 406852, "epoch": 4901} {"train_loss": -26.485570907592773, "global_step": 406853, "epoch": 4901} {"train_loss": -26.10334587097168, "global_step": 406854, "epoch": 4901} {"train_loss": -26.4357967376709, "global_step": 406855, "epoch": 4901} {"train_loss": -26.513708114624023, "global_step": 406856, "epoch": 4901} {"train_loss": -26.328107833862305, "global_step": 406857, "epoch": 4901} {"train_loss": -26.043333053588867, "global_step": 406858, "epoch": 4901} {"train_loss": -26.38469886779785, "global_step": 406859, "epoch": 4901} {"train_loss": -26.25373649597168, "global_step": 406860, "epoch": 4901} {"train_loss": -26.5163631439209, "global_step": 406861, "epoch": 4901} {"train_loss": -26.498279571533203, "global_step": 406862, "epoch": 4901} {"train_loss": -26.433032989501953, "global_step": 406863, "epoch": 4901} {"train_loss": -26.428354263305664, "global_step": 406864, "epoch": 4901} {"train_loss": -26.30632811856557, "global_step": 406865, "epoch": 4901, "val_loss": 6650070.0} {"train_loss": -26.072229385375977, "global_step": 406866, "epoch": 4902} {"train_loss": -25.54156494140625, "global_step": 406867, "epoch": 4902} {"train_loss": -26.000608444213867, "global_step": 406868, "epoch": 4902} {"train_loss": -25.932458877563477, "global_step": 406869, "epoch": 4902} {"train_loss": -26.05161476135254, "global_step": 406870, "epoch": 4902} {"train_loss": -26.106836318969727, "global_step": 406871, "epoch": 4902} {"train_loss": -26.174869537353516, "global_step": 406872, "epoch": 4902} {"train_loss": -26.50992202758789, "global_step": 406873, "epoch": 4902} {"train_loss": -26.020328521728516, "global_step": 406874, "epoch": 4902} {"train_loss": -25.843021392822266, "global_step": 406875, "epoch": 4902} {"train_loss": -26.821247100830078, "global_step": 406876, "epoch": 4902} {"train_loss": -26.348047256469727, "global_step": 406877, "epoch": 4902} {"train_loss": -26.02581214904785, "global_step": 406878, "epoch": 4902} {"train_loss": -26.133642196655273, "global_step": 406879, "epoch": 4902} {"train_loss": -26.047033309936523, "global_step": 406880, "epoch": 4902} {"train_loss": -26.07954216003418, "global_step": 406881, "epoch": 4902} {"train_loss": -25.882293701171875, "global_step": 406882, "epoch": 4902} {"train_loss": -26.115751266479492, "global_step": 406883, "epoch": 4902} {"train_loss": -26.224872589111328, "global_step": 406884, "epoch": 4902} {"train_loss": -26.38711929321289, "global_step": 406885, "epoch": 4902} {"train_loss": -26.385971069335938, "global_step": 406886, "epoch": 4902} {"train_loss": -26.330747604370117, "global_step": 406887, "epoch": 4902} {"train_loss": -26.42079734802246, "global_step": 406888, "epoch": 4902} {"train_loss": -26.48792839050293, "global_step": 406889, "epoch": 4902} {"train_loss": -25.963321685791016, "global_step": 406890, "epoch": 4902} {"train_loss": -26.724267959594727, "global_step": 406891, "epoch": 4902} {"train_loss": -26.66538429260254, "global_step": 406892, "epoch": 4902} {"train_loss": -26.34480094909668, "global_step": 406893, "epoch": 4902} {"train_loss": -26.55230140686035, "global_step": 406894, "epoch": 4902} {"train_loss": -26.610891342163086, "global_step": 406895, "epoch": 4902} {"train_loss": -26.628650665283203, "global_step": 406896, "epoch": 4902} {"train_loss": -26.65823745727539, "global_step": 406897, "epoch": 4902} {"train_loss": -26.957136154174805, "global_step": 406898, "epoch": 4902} {"train_loss": -26.465194702148438, "global_step": 406899, "epoch": 4902} {"train_loss": -26.663000106811523, "global_step": 406900, "epoch": 4902} {"train_loss": -26.88994789123535, "global_step": 406901, "epoch": 4902} {"train_loss": -26.843229293823242, "global_step": 406902, "epoch": 4902} {"train_loss": -27.096342086791992, "global_step": 406903, "epoch": 4902} {"train_loss": -26.73109245300293, "global_step": 406904, "epoch": 4902} {"train_loss": -27.345739364624023, "global_step": 406905, "epoch": 4902} {"train_loss": -26.742658615112305, "global_step": 406906, "epoch": 4902} {"train_loss": -26.9507999420166, "global_step": 406907, "epoch": 4902} {"train_loss": -26.299428939819336, "global_step": 406908, "epoch": 4902} {"train_loss": -26.97003173828125, "global_step": 406909, "epoch": 4902} {"train_loss": -26.952884674072266, "global_step": 406910, "epoch": 4902} {"train_loss": -26.7880802154541, "global_step": 406911, "epoch": 4902} {"train_loss": -25.982654571533203, "global_step": 406912, "epoch": 4902} {"train_loss": -26.813629150390625, "global_step": 406913, "epoch": 4902} {"train_loss": -26.356245040893555, "global_step": 406914, "epoch": 4902} {"train_loss": -25.801610946655273, "global_step": 406915, "epoch": 4902} {"train_loss": -26.146631240844727, "global_step": 406916, "epoch": 4902} {"train_loss": -26.391653060913086, "global_step": 406917, "epoch": 4902} {"train_loss": -26.188358306884766, "global_step": 406918, "epoch": 4902} {"train_loss": -26.484846115112305, "global_step": 406919, "epoch": 4902} {"train_loss": -26.3883056640625, "global_step": 406920, "epoch": 4902} {"train_loss": -26.671369552612305, "global_step": 406921, "epoch": 4902} {"train_loss": -26.56842041015625, "global_step": 406922, "epoch": 4902} {"train_loss": -26.08098793029785, "global_step": 406923, "epoch": 4902} {"train_loss": -26.462116241455078, "global_step": 406924, "epoch": 4902} {"train_loss": -26.44620704650879, "global_step": 406925, "epoch": 4902} {"train_loss": -26.06123161315918, "global_step": 406926, "epoch": 4902} {"train_loss": -26.25261878967285, "global_step": 406927, "epoch": 4902} {"train_loss": -26.546768188476562, "global_step": 406928, "epoch": 4902} {"train_loss": -25.91167640686035, "global_step": 406929, "epoch": 4902} {"train_loss": -26.31536865234375, "global_step": 406930, "epoch": 4902} {"train_loss": -26.71284294128418, "global_step": 406931, "epoch": 4902} {"train_loss": -26.482757568359375, "global_step": 406932, "epoch": 4902} {"train_loss": -27.002042770385742, "global_step": 406933, "epoch": 4902} {"train_loss": -26.43263053894043, "global_step": 406934, "epoch": 4902} {"train_loss": -26.338092803955078, "global_step": 406935, "epoch": 4902} {"train_loss": -26.446104049682617, "global_step": 406936, "epoch": 4902} {"train_loss": -26.385175704956055, "global_step": 406937, "epoch": 4902} {"train_loss": -27.156110763549805, "global_step": 406938, "epoch": 4902} {"train_loss": -26.7203369140625, "global_step": 406939, "epoch": 4902} {"train_loss": -26.390905380249023, "global_step": 406940, "epoch": 4902} {"train_loss": -26.61665916442871, "global_step": 406941, "epoch": 4902} {"train_loss": -26.543546676635742, "global_step": 406942, "epoch": 4902} {"train_loss": -26.790868759155273, "global_step": 406943, "epoch": 4902} {"train_loss": -26.655292510986328, "global_step": 406944, "epoch": 4902} {"train_loss": -26.6994686126709, "global_step": 406945, "epoch": 4902} {"train_loss": -26.699512481689453, "global_step": 406946, "epoch": 4902} {"train_loss": -26.838104248046875, "global_step": 406947, "epoch": 4902} {"train_loss": -26.442075039966998, "global_step": 406948, "epoch": 4902, "val_loss": 6572662.0} {"train_loss": -26.253009796142578, "global_step": 406949, "epoch": 4903} {"train_loss": -26.566638946533203, "global_step": 406950, "epoch": 4903} {"train_loss": -26.06780433654785, "global_step": 406951, "epoch": 4903} {"train_loss": -26.59796714782715, "global_step": 406952, "epoch": 4903} {"train_loss": -26.414356231689453, "global_step": 406953, "epoch": 4903} {"train_loss": -25.941486358642578, "global_step": 406954, "epoch": 4903} {"train_loss": -26.357803344726562, "global_step": 406955, "epoch": 4903} {"train_loss": -26.462488174438477, "global_step": 406956, "epoch": 4903} {"train_loss": -26.0415096282959, "global_step": 406957, "epoch": 4903} {"train_loss": -26.382553100585938, "global_step": 406958, "epoch": 4903} {"train_loss": -26.629934310913086, "global_step": 406959, "epoch": 4903} {"train_loss": -26.60566520690918, "global_step": 406960, "epoch": 4903} {"train_loss": -26.329965591430664, "global_step": 406961, "epoch": 4903} {"train_loss": -26.26022720336914, "global_step": 406962, "epoch": 4903} {"train_loss": -26.190954208374023, "global_step": 406963, "epoch": 4903} {"train_loss": -26.345060348510742, "global_step": 406964, "epoch": 4903} {"train_loss": -26.603540420532227, "global_step": 406965, "epoch": 4903} {"train_loss": -26.493764877319336, "global_step": 406966, "epoch": 4903} {"train_loss": -26.52019691467285, "global_step": 406967, "epoch": 4903} {"train_loss": -26.532888412475586, "global_step": 406968, "epoch": 4903} {"train_loss": -26.449542999267578, "global_step": 406969, "epoch": 4903} {"train_loss": -26.12961196899414, "global_step": 406970, "epoch": 4903} {"train_loss": -26.693622589111328, "global_step": 406971, "epoch": 4903} {"train_loss": -26.8759822845459, "global_step": 406972, "epoch": 4903} {"train_loss": -26.810998916625977, "global_step": 406973, "epoch": 4903} {"train_loss": -26.768247604370117, "global_step": 406974, "epoch": 4903} {"train_loss": -27.180978775024414, "global_step": 406975, "epoch": 4903} {"train_loss": -26.546201705932617, "global_step": 406976, "epoch": 4903} {"train_loss": -26.845203399658203, "global_step": 406977, "epoch": 4903} {"train_loss": -26.7561092376709, "global_step": 406978, "epoch": 4903} {"train_loss": -26.79668617248535, "global_step": 406979, "epoch": 4903} {"train_loss": -26.568586349487305, "global_step": 406980, "epoch": 4903} {"train_loss": -26.472339630126953, "global_step": 406981, "epoch": 4903} {"train_loss": -26.582651138305664, "global_step": 406982, "epoch": 4903} {"train_loss": -26.639429092407227, "global_step": 406983, "epoch": 4903} {"train_loss": -26.5998592376709, "global_step": 406984, "epoch": 4903} {"train_loss": -26.74769401550293, "global_step": 406985, "epoch": 4903} {"train_loss": -26.58466148376465, "global_step": 406986, "epoch": 4903} {"train_loss": -26.983484268188477, "global_step": 406987, "epoch": 4903} {"train_loss": -26.416717529296875, "global_step": 406988, "epoch": 4903} {"train_loss": -26.88482666015625, "global_step": 406989, "epoch": 4903} {"train_loss": -26.920026779174805, "global_step": 406990, "epoch": 4903} {"train_loss": -26.595844268798828, "global_step": 406991, "epoch": 4903} {"train_loss": -26.832807540893555, "global_step": 406992, "epoch": 4903} {"train_loss": -27.03498649597168, "global_step": 406993, "epoch": 4903} {"train_loss": -26.75001335144043, "global_step": 406994, "epoch": 4903} {"train_loss": -26.82777214050293, "global_step": 406995, "epoch": 4903} {"train_loss": -27.079166412353516, "global_step": 406996, "epoch": 4903} {"train_loss": -26.584863662719727, "global_step": 406997, "epoch": 4903} {"train_loss": -26.418670654296875, "global_step": 406998, "epoch": 4903} {"train_loss": -26.985624313354492, "global_step": 406999, "epoch": 4903} {"train_loss": -26.64900016784668, "global_step": 407000, "epoch": 4903} {"train_loss": -26.432897567749023, "global_step": 407001, "epoch": 4903} {"train_loss": -26.723623275756836, "global_step": 407002, "epoch": 4903} {"train_loss": -26.540464401245117, "global_step": 407003, "epoch": 4903} {"train_loss": -26.420682907104492, "global_step": 407004, "epoch": 4903} {"train_loss": -27.03840446472168, "global_step": 407005, "epoch": 4903} {"train_loss": -26.23573112487793, "global_step": 407006, "epoch": 4903} {"train_loss": -26.79591941833496, "global_step": 407007, "epoch": 4903} {"train_loss": -26.90692710876465, "global_step": 407008, "epoch": 4903} {"train_loss": -26.899564743041992, "global_step": 407009, "epoch": 4903} {"train_loss": -26.76995277404785, "global_step": 407010, "epoch": 4903} {"train_loss": -26.3087158203125, "global_step": 407011, "epoch": 4903} {"train_loss": -27.104578018188477, "global_step": 407012, "epoch": 4903} {"train_loss": -26.87884521484375, "global_step": 407013, "epoch": 4903} {"train_loss": -26.7696475982666, "global_step": 407014, "epoch": 4903} {"train_loss": -26.765888214111328, "global_step": 407015, "epoch": 4903} {"train_loss": -26.8787784576416, "global_step": 407016, "epoch": 4903} {"train_loss": -26.435382843017578, "global_step": 407017, "epoch": 4903} {"train_loss": -26.660480499267578, "global_step": 407018, "epoch": 4903} {"train_loss": -26.660388946533203, "global_step": 407019, "epoch": 4903} {"train_loss": -26.631671905517578, "global_step": 407020, "epoch": 4903} {"train_loss": -26.648473739624023, "global_step": 407021, "epoch": 4903} {"train_loss": -26.841537475585938, "global_step": 407022, "epoch": 4903} {"train_loss": -26.596349716186523, "global_step": 407023, "epoch": 4903} {"train_loss": -26.822885513305664, "global_step": 407024, "epoch": 4903} {"train_loss": -26.882858276367188, "global_step": 407025, "epoch": 4903} {"train_loss": -26.542097091674805, "global_step": 407026, "epoch": 4903} {"train_loss": -26.918628692626953, "global_step": 407027, "epoch": 4903} {"train_loss": -26.868305206298828, "global_step": 407028, "epoch": 4903} {"train_loss": -27.037336349487305, "global_step": 407029, "epoch": 4903} {"train_loss": -27.060104370117188, "global_step": 407030, "epoch": 4903} {"train_loss": -26.643953989787274, "global_step": 407031, "epoch": 4903, "val_loss": 6655565.5} {"train_loss": -26.53571128845215, "global_step": 407032, "epoch": 4904} {"train_loss": -26.38812828063965, "global_step": 407033, "epoch": 4904} {"train_loss": -25.987619400024414, "global_step": 407034, "epoch": 4904} {"train_loss": -26.482763290405273, "global_step": 407035, "epoch": 4904} {"train_loss": -25.99464225769043, "global_step": 407036, "epoch": 4904} {"train_loss": -26.261249542236328, "global_step": 407037, "epoch": 4904} {"train_loss": -26.04465103149414, "global_step": 407038, "epoch": 4904} {"train_loss": -26.408910751342773, "global_step": 407039, "epoch": 4904} {"train_loss": -26.22528648376465, "global_step": 407040, "epoch": 4904} {"train_loss": -26.5312557220459, "global_step": 407041, "epoch": 4904} {"train_loss": -26.00200843811035, "global_step": 407042, "epoch": 4904} {"train_loss": -26.1662654876709, "global_step": 407043, "epoch": 4904} {"train_loss": -26.580480575561523, "global_step": 407044, "epoch": 4904} {"train_loss": -26.370532989501953, "global_step": 407045, "epoch": 4904} {"train_loss": -25.81168556213379, "global_step": 407046, "epoch": 4904} {"train_loss": -26.407148361206055, "global_step": 407047, "epoch": 4904} {"train_loss": -26.361114501953125, "global_step": 407048, "epoch": 4904} {"train_loss": -26.607141494750977, "global_step": 407049, "epoch": 4904} {"train_loss": -26.30255126953125, "global_step": 407050, "epoch": 4904} {"train_loss": -26.8924503326416, "global_step": 407051, "epoch": 4904} {"train_loss": -26.23758888244629, "global_step": 407052, "epoch": 4904} {"train_loss": -26.339466094970703, "global_step": 407053, "epoch": 4904} {"train_loss": -26.43513298034668, "global_step": 407054, "epoch": 4904} {"train_loss": -26.535144805908203, "global_step": 407055, "epoch": 4904} {"train_loss": -26.667682647705078, "global_step": 407056, "epoch": 4904} {"train_loss": -26.516386032104492, "global_step": 407057, "epoch": 4904} {"train_loss": -26.256330490112305, "global_step": 407058, "epoch": 4904} {"train_loss": -26.60371971130371, "global_step": 407059, "epoch": 4904} {"train_loss": -26.6032657623291, "global_step": 407060, "epoch": 4904} {"train_loss": -26.796918869018555, "global_step": 407061, "epoch": 4904} {"train_loss": -26.838459014892578, "global_step": 407062, "epoch": 4904} {"train_loss": -26.69902992248535, "global_step": 407063, "epoch": 4904} {"train_loss": -26.607629776000977, "global_step": 407064, "epoch": 4904} {"train_loss": -26.688308715820312, "global_step": 407065, "epoch": 4904} {"train_loss": -26.604202270507812, "global_step": 407066, "epoch": 4904} {"train_loss": -26.807104110717773, "global_step": 407067, "epoch": 4904} {"train_loss": -26.65256118774414, "global_step": 407068, "epoch": 4904} {"train_loss": -26.350204467773438, "global_step": 407069, "epoch": 4904} {"train_loss": -27.237775802612305, "global_step": 407070, "epoch": 4904} {"train_loss": -26.737476348876953, "global_step": 407071, "epoch": 4904} {"train_loss": -26.67378044128418, "global_step": 407072, "epoch": 4904} {"train_loss": -26.42717933654785, "global_step": 407073, "epoch": 4904} {"train_loss": -26.405506134033203, "global_step": 407074, "epoch": 4904} {"train_loss": -27.133222579956055, "global_step": 407075, "epoch": 4904} {"train_loss": -26.73788833618164, "global_step": 407076, "epoch": 4904} {"train_loss": -26.75335693359375, "global_step": 407077, "epoch": 4904} {"train_loss": -26.926916122436523, "global_step": 407078, "epoch": 4904} {"train_loss": -26.56610107421875, "global_step": 407079, "epoch": 4904} {"train_loss": -27.130390167236328, "global_step": 407080, "epoch": 4904} {"train_loss": -26.552051544189453, "global_step": 407081, "epoch": 4904} {"train_loss": -26.921772003173828, "global_step": 407082, "epoch": 4904} {"train_loss": -26.598371505737305, "global_step": 407083, "epoch": 4904} {"train_loss": -26.387048721313477, "global_step": 407084, "epoch": 4904} {"train_loss": -27.120092391967773, "global_step": 407085, "epoch": 4904} {"train_loss": -26.7924861907959, "global_step": 407086, "epoch": 4904} {"train_loss": -26.721765518188477, "global_step": 407087, "epoch": 4904} {"train_loss": -26.857666015625, "global_step": 407088, "epoch": 4904} {"train_loss": -26.31363868713379, "global_step": 407089, "epoch": 4904} {"train_loss": -26.912002563476562, "global_step": 407090, "epoch": 4904} {"train_loss": -26.728748321533203, "global_step": 407091, "epoch": 4904} {"train_loss": -26.90736198425293, "global_step": 407092, "epoch": 4904} {"train_loss": -26.428516387939453, "global_step": 407093, "epoch": 4904} {"train_loss": -26.06001091003418, "global_step": 407094, "epoch": 4904} {"train_loss": -26.100656509399414, "global_step": 407095, "epoch": 4904} {"train_loss": -25.705713272094727, "global_step": 407096, "epoch": 4904} {"train_loss": -25.753889083862305, "global_step": 407097, "epoch": 4904} {"train_loss": -26.378705978393555, "global_step": 407098, "epoch": 4904} {"train_loss": -26.946502685546875, "global_step": 407099, "epoch": 4904} {"train_loss": -26.744958877563477, "global_step": 407100, "epoch": 4904} {"train_loss": -26.4363956451416, "global_step": 407101, "epoch": 4904} {"train_loss": -26.298852920532227, "global_step": 407102, "epoch": 4904} {"train_loss": -26.46856689453125, "global_step": 407103, "epoch": 4904} {"train_loss": -26.641891479492188, "global_step": 407104, "epoch": 4904} {"train_loss": -26.83969497680664, "global_step": 407105, "epoch": 4904} {"train_loss": -26.61958122253418, "global_step": 407106, "epoch": 4904} {"train_loss": -26.63703727722168, "global_step": 407107, "epoch": 4904} {"train_loss": -26.950485229492188, "global_step": 407108, "epoch": 4904} {"train_loss": -26.618650436401367, "global_step": 407109, "epoch": 4904} {"train_loss": -26.649169921875, "global_step": 407110, "epoch": 4904} {"train_loss": -26.845916748046875, "global_step": 407111, "epoch": 4904} {"train_loss": -26.63115882873535, "global_step": 407112, "epoch": 4904} {"train_loss": -26.52556800842285, "global_step": 407113, "epoch": 4904} {"train_loss": -26.540706657501588, "global_step": 407114, "epoch": 4904, "val_loss": 6684658.0} {"train_loss": -25.553874969482422, "global_step": 407115, "epoch": 4905} {"train_loss": -25.547555923461914, "global_step": 407116, "epoch": 4905} {"train_loss": -26.100543975830078, "global_step": 407117, "epoch": 4905} {"train_loss": -26.196826934814453, "global_step": 407118, "epoch": 4905} {"train_loss": -26.09807777404785, "global_step": 407119, "epoch": 4905} {"train_loss": -26.163482666015625, "global_step": 407120, "epoch": 4905} {"train_loss": -26.734272003173828, "global_step": 407121, "epoch": 4905} {"train_loss": -25.9328670501709, "global_step": 407122, "epoch": 4905} {"train_loss": -26.625757217407227, "global_step": 407123, "epoch": 4905} {"train_loss": -26.28602409362793, "global_step": 407124, "epoch": 4905} {"train_loss": -26.49932861328125, "global_step": 407125, "epoch": 4905} {"train_loss": -26.152612686157227, "global_step": 407126, "epoch": 4905} {"train_loss": -26.692035675048828, "global_step": 407127, "epoch": 4905} {"train_loss": -26.20002555847168, "global_step": 407128, "epoch": 4905} {"train_loss": -26.889509201049805, "global_step": 407129, "epoch": 4905} {"train_loss": -26.367111206054688, "global_step": 407130, "epoch": 4905} {"train_loss": -26.518051147460938, "global_step": 407131, "epoch": 4905} {"train_loss": -26.736059188842773, "global_step": 407132, "epoch": 4905} {"train_loss": -26.672765731811523, "global_step": 407133, "epoch": 4905} {"train_loss": -26.58542251586914, "global_step": 407134, "epoch": 4905} {"train_loss": -26.633237838745117, "global_step": 407135, "epoch": 4905} {"train_loss": -26.575464248657227, "global_step": 407136, "epoch": 4905} {"train_loss": -26.38947105407715, "global_step": 407137, "epoch": 4905} {"train_loss": -26.826587677001953, "global_step": 407138, "epoch": 4905} {"train_loss": -26.87946891784668, "global_step": 407139, "epoch": 4905} {"train_loss": -27.191797256469727, "global_step": 407140, "epoch": 4905} {"train_loss": -26.728519439697266, "global_step": 407141, "epoch": 4905} {"train_loss": -26.654434204101562, "global_step": 407142, "epoch": 4905} {"train_loss": -26.711328506469727, "global_step": 407143, "epoch": 4905} {"train_loss": -26.59791374206543, "global_step": 407144, "epoch": 4905} {"train_loss": -26.765933990478516, "global_step": 407145, "epoch": 4905} {"train_loss": -27.027313232421875, "global_step": 407146, "epoch": 4905} {"train_loss": -26.9047794342041, "global_step": 407147, "epoch": 4905} {"train_loss": -26.964120864868164, "global_step": 407148, "epoch": 4905} {"train_loss": -26.882953643798828, "global_step": 407149, "epoch": 4905} {"train_loss": -27.301029205322266, "global_step": 407150, "epoch": 4905} {"train_loss": -26.701379776000977, "global_step": 407151, "epoch": 4905} {"train_loss": -26.59393310546875, "global_step": 407152, "epoch": 4905} {"train_loss": -26.706226348876953, "global_step": 407153, "epoch": 4905} {"train_loss": -27.059295654296875, "global_step": 407154, "epoch": 4905} {"train_loss": -26.943281173706055, "global_step": 407155, "epoch": 4905} {"train_loss": -26.90654945373535, "global_step": 407156, "epoch": 4905} {"train_loss": -27.056894302368164, "global_step": 407157, "epoch": 4905} {"train_loss": -26.90839195251465, "global_step": 407158, "epoch": 4905} {"train_loss": -26.680530548095703, "global_step": 407159, "epoch": 4905} {"train_loss": -26.800189971923828, "global_step": 407160, "epoch": 4905} {"train_loss": -26.96668815612793, "global_step": 407161, "epoch": 4905} {"train_loss": -26.7767391204834, "global_step": 407162, "epoch": 4905} {"train_loss": -26.851810455322266, "global_step": 407163, "epoch": 4905} {"train_loss": -26.911701202392578, "global_step": 407164, "epoch": 4905} {"train_loss": -26.78104591369629, "global_step": 407165, "epoch": 4905} {"train_loss": -26.88618278503418, "global_step": 407166, "epoch": 4905} {"train_loss": -26.525360107421875, "global_step": 407167, "epoch": 4905} {"train_loss": -26.7565860748291, "global_step": 407168, "epoch": 4905} {"train_loss": -26.794818878173828, "global_step": 407169, "epoch": 4905} {"train_loss": -26.771642684936523, "global_step": 407170, "epoch": 4905} {"train_loss": -26.81318473815918, "global_step": 407171, "epoch": 4905} {"train_loss": -26.806344985961914, "global_step": 407172, "epoch": 4905} {"train_loss": -26.970489501953125, "global_step": 407173, "epoch": 4905} {"train_loss": -26.687042236328125, "global_step": 407174, "epoch": 4905} {"train_loss": -26.6317195892334, "global_step": 407175, "epoch": 4905} {"train_loss": -26.865598678588867, "global_step": 407176, "epoch": 4905} {"train_loss": -26.72907066345215, "global_step": 407177, "epoch": 4905} {"train_loss": -26.74811363220215, "global_step": 407178, "epoch": 4905} {"train_loss": -26.894094467163086, "global_step": 407179, "epoch": 4905} {"train_loss": -27.241043090820312, "global_step": 407180, "epoch": 4905} {"train_loss": -27.02796745300293, "global_step": 407181, "epoch": 4905} {"train_loss": -26.776044845581055, "global_step": 407182, "epoch": 4905} {"train_loss": -26.493635177612305, "global_step": 407183, "epoch": 4905} {"train_loss": -26.7448673248291, "global_step": 407184, "epoch": 4905} {"train_loss": -26.742202758789062, "global_step": 407185, "epoch": 4905} {"train_loss": -26.980823516845703, "global_step": 407186, "epoch": 4905} {"train_loss": -26.78907585144043, "global_step": 407187, "epoch": 4905} {"train_loss": -26.584753036499023, "global_step": 407188, "epoch": 4905} {"train_loss": -26.83271598815918, "global_step": 407189, "epoch": 4905} {"train_loss": -26.86103630065918, "global_step": 407190, "epoch": 4905} {"train_loss": -26.818777084350586, "global_step": 407191, "epoch": 4905} {"train_loss": -26.63624382019043, "global_step": 407192, "epoch": 4905} {"train_loss": -27.1124324798584, "global_step": 407193, "epoch": 4905} {"train_loss": -26.363752365112305, "global_step": 407194, "epoch": 4905} {"train_loss": -26.771467208862305, "global_step": 407195, "epoch": 4905} {"train_loss": -26.842411041259766, "global_step": 407196, "epoch": 4905} {"train_loss": -26.689957607223327, "global_step": 407197, "epoch": 4905, "val_loss": 6505209.0} {"train_loss": -25.04511070251465, "global_step": 407198, "epoch": 4906} {"train_loss": -26.003646850585938, "global_step": 407199, "epoch": 4906} {"train_loss": -25.321414947509766, "global_step": 407200, "epoch": 4906} {"train_loss": -24.040231704711914, "global_step": 407201, "epoch": 4906} {"train_loss": -25.440196990966797, "global_step": 407202, "epoch": 4906} {"train_loss": -25.047988891601562, "global_step": 407203, "epoch": 4906} {"train_loss": -24.625839233398438, "global_step": 407204, "epoch": 4906} {"train_loss": -24.234813690185547, "global_step": 407205, "epoch": 4906} {"train_loss": -25.54574966430664, "global_step": 407206, "epoch": 4906} {"train_loss": -25.20223045349121, "global_step": 407207, "epoch": 4906} {"train_loss": -24.89820671081543, "global_step": 407208, "epoch": 4906} {"train_loss": -24.95708656311035, "global_step": 407209, "epoch": 4906} {"train_loss": -24.534940719604492, "global_step": 407210, "epoch": 4906} {"train_loss": -25.81571388244629, "global_step": 407211, "epoch": 4906} {"train_loss": -25.446443557739258, "global_step": 407212, "epoch": 4906} {"train_loss": -25.49019432067871, "global_step": 407213, "epoch": 4906} {"train_loss": -25.5021915435791, "global_step": 407214, "epoch": 4906} {"train_loss": -26.113866806030273, "global_step": 407215, "epoch": 4906} {"train_loss": -25.659149169921875, "global_step": 407216, "epoch": 4906} {"train_loss": -25.622617721557617, "global_step": 407217, "epoch": 4906} {"train_loss": -26.12045669555664, "global_step": 407218, "epoch": 4906} {"train_loss": -25.6925048828125, "global_step": 407219, "epoch": 4906} {"train_loss": -26.027603149414062, "global_step": 407220, "epoch": 4906} {"train_loss": -26.07407569885254, "global_step": 407221, "epoch": 4906} {"train_loss": -25.93830680847168, "global_step": 407222, "epoch": 4906} {"train_loss": -26.236896514892578, "global_step": 407223, "epoch": 4906} {"train_loss": -25.79383659362793, "global_step": 407224, "epoch": 4906} {"train_loss": -25.820724487304688, "global_step": 407225, "epoch": 4906} {"train_loss": -25.911136627197266, "global_step": 407226, "epoch": 4906} {"train_loss": -25.940399169921875, "global_step": 407227, "epoch": 4906} {"train_loss": -26.271757125854492, "global_step": 407228, "epoch": 4906} {"train_loss": -26.263647079467773, "global_step": 407229, "epoch": 4906} {"train_loss": -25.908599853515625, "global_step": 407230, "epoch": 4906} {"train_loss": -26.305932998657227, "global_step": 407231, "epoch": 4906} {"train_loss": -26.309494018554688, "global_step": 407232, "epoch": 4906} {"train_loss": -26.379858016967773, "global_step": 407233, "epoch": 4906} {"train_loss": -26.430713653564453, "global_step": 407234, "epoch": 4906} {"train_loss": -26.499563217163086, "global_step": 407235, "epoch": 4906} {"train_loss": -26.712400436401367, "global_step": 407236, "epoch": 4906} {"train_loss": -26.299352645874023, "global_step": 407237, "epoch": 4906} {"train_loss": -26.22633934020996, "global_step": 407238, "epoch": 4906} {"train_loss": -26.830184936523438, "global_step": 407239, "epoch": 4906} {"train_loss": -26.762754440307617, "global_step": 407240, "epoch": 4906} {"train_loss": -26.379379272460938, "global_step": 407241, "epoch": 4906} {"train_loss": -26.74611473083496, "global_step": 407242, "epoch": 4906} {"train_loss": -26.63697624206543, "global_step": 407243, "epoch": 4906} {"train_loss": -26.745092391967773, "global_step": 407244, "epoch": 4906} {"train_loss": -26.46039390563965, "global_step": 407245, "epoch": 4906} {"train_loss": -26.676040649414062, "global_step": 407246, "epoch": 4906} {"train_loss": -26.914535522460938, "global_step": 407247, "epoch": 4906} {"train_loss": -26.899335861206055, "global_step": 407248, "epoch": 4906} {"train_loss": -26.48740005493164, "global_step": 407249, "epoch": 4906} {"train_loss": -26.962890625, "global_step": 407250, "epoch": 4906} {"train_loss": -26.599319458007812, "global_step": 407251, "epoch": 4906} {"train_loss": -26.64361572265625, "global_step": 407252, "epoch": 4906} {"train_loss": -26.694971084594727, "global_step": 407253, "epoch": 4906} {"train_loss": -26.923303604125977, "global_step": 407254, "epoch": 4906} {"train_loss": -26.801916122436523, "global_step": 407255, "epoch": 4906} {"train_loss": -26.88812828063965, "global_step": 407256, "epoch": 4906} {"train_loss": -26.704010009765625, "global_step": 407257, "epoch": 4906} {"train_loss": -26.401565551757812, "global_step": 407258, "epoch": 4906} {"train_loss": -27.004016876220703, "global_step": 407259, "epoch": 4906} {"train_loss": -26.7026309967041, "global_step": 407260, "epoch": 4906} {"train_loss": -26.831653594970703, "global_step": 407261, "epoch": 4906} {"train_loss": -26.497772216796875, "global_step": 407262, "epoch": 4906} {"train_loss": -25.914386749267578, "global_step": 407263, "epoch": 4906} {"train_loss": -25.767202377319336, "global_step": 407264, "epoch": 4906} {"train_loss": -25.804967880249023, "global_step": 407265, "epoch": 4906} {"train_loss": -26.865177154541016, "global_step": 407266, "epoch": 4906} {"train_loss": -26.684179306030273, "global_step": 407267, "epoch": 4906} {"train_loss": -26.372541427612305, "global_step": 407268, "epoch": 4906} {"train_loss": -26.851593017578125, "global_step": 407269, "epoch": 4906} {"train_loss": -26.461511611938477, "global_step": 407270, "epoch": 4906} {"train_loss": -26.662134170532227, "global_step": 407271, "epoch": 4906} {"train_loss": -26.49491310119629, "global_step": 407272, "epoch": 4906} {"train_loss": -26.59315299987793, "global_step": 407273, "epoch": 4906} {"train_loss": -26.589313507080078, "global_step": 407274, "epoch": 4906} {"train_loss": -26.130512237548828, "global_step": 407275, "epoch": 4906} {"train_loss": -26.394765853881836, "global_step": 407276, "epoch": 4906} {"train_loss": -26.655126571655273, "global_step": 407277, "epoch": 4906} {"train_loss": -26.41883659362793, "global_step": 407278, "epoch": 4906} {"train_loss": -25.82562828063965, "global_step": 407279, "epoch": 4906} {"train_loss": -26.11741279693971, "global_step": 407280, "epoch": 4906, "val_loss": 6766103.0} {"train_loss": -25.359756469726562, "global_step": 407281, "epoch": 4907} {"train_loss": -25.591815948486328, "global_step": 407282, "epoch": 4907} {"train_loss": -24.805809020996094, "global_step": 407283, "epoch": 4907} {"train_loss": -24.891263961791992, "global_step": 407284, "epoch": 4907} {"train_loss": -25.350528717041016, "global_step": 407285, "epoch": 4907} {"train_loss": -25.587356567382812, "global_step": 407286, "epoch": 4907} {"train_loss": -25.492605209350586, "global_step": 407287, "epoch": 4907} {"train_loss": -25.58054542541504, "global_step": 407288, "epoch": 4907} {"train_loss": -25.425992965698242, "global_step": 407289, "epoch": 4907} {"train_loss": -25.9842529296875, "global_step": 407290, "epoch": 4907} {"train_loss": -25.64900016784668, "global_step": 407291, "epoch": 4907} {"train_loss": -26.263525009155273, "global_step": 407292, "epoch": 4907} {"train_loss": -25.809778213500977, "global_step": 407293, "epoch": 4907} {"train_loss": -25.695653915405273, "global_step": 407294, "epoch": 4907} {"train_loss": -26.070575714111328, "global_step": 407295, "epoch": 4907} {"train_loss": -26.343753814697266, "global_step": 407296, "epoch": 4907} {"train_loss": -25.952213287353516, "global_step": 407297, "epoch": 4907} {"train_loss": -26.19471549987793, "global_step": 407298, "epoch": 4907} {"train_loss": -25.982839584350586, "global_step": 407299, "epoch": 4907} {"train_loss": -25.919483184814453, "global_step": 407300, "epoch": 4907} {"train_loss": -26.175390243530273, "global_step": 407301, "epoch": 4907} {"train_loss": -25.921613693237305, "global_step": 407302, "epoch": 4907} {"train_loss": -26.171091079711914, "global_step": 407303, "epoch": 4907} {"train_loss": -26.18250846862793, "global_step": 407304, "epoch": 4907} {"train_loss": -26.466760635375977, "global_step": 407305, "epoch": 4907} {"train_loss": -26.10762596130371, "global_step": 407306, "epoch": 4907} {"train_loss": -26.3233642578125, "global_step": 407307, "epoch": 4907} {"train_loss": -26.271631240844727, "global_step": 407308, "epoch": 4907} {"train_loss": -26.03961753845215, "global_step": 407309, "epoch": 4907} {"train_loss": -26.516080856323242, "global_step": 407310, "epoch": 4907} {"train_loss": -26.382291793823242, "global_step": 407311, "epoch": 4907} {"train_loss": -26.570871353149414, "global_step": 407312, "epoch": 4907} {"train_loss": -26.887985229492188, "global_step": 407313, "epoch": 4907} {"train_loss": -26.624027252197266, "global_step": 407314, "epoch": 4907} {"train_loss": -26.42551040649414, "global_step": 407315, "epoch": 4907} {"train_loss": -26.529006958007812, "global_step": 407316, "epoch": 4907} {"train_loss": -26.5151424407959, "global_step": 407317, "epoch": 4907} {"train_loss": -26.121259689331055, "global_step": 407318, "epoch": 4907} {"train_loss": -26.5518741607666, "global_step": 407319, "epoch": 4907} {"train_loss": -26.617895126342773, "global_step": 407320, "epoch": 4907} {"train_loss": -26.379690170288086, "global_step": 407321, "epoch": 4907} {"train_loss": -26.12347984313965, "global_step": 407322, "epoch": 4907} {"train_loss": -26.49542236328125, "global_step": 407323, "epoch": 4907} {"train_loss": -26.79151725769043, "global_step": 407324, "epoch": 4907} {"train_loss": -26.380048751831055, "global_step": 407325, "epoch": 4907} {"train_loss": -26.503950119018555, "global_step": 407326, "epoch": 4907} {"train_loss": -26.710935592651367, "global_step": 407327, "epoch": 4907} {"train_loss": -26.87396812438965, "global_step": 407328, "epoch": 4907} {"train_loss": -27.0107364654541, "global_step": 407329, "epoch": 4907} {"train_loss": -26.446487426757812, "global_step": 407330, "epoch": 4907} {"train_loss": -26.895353317260742, "global_step": 407331, "epoch": 4907} {"train_loss": -26.749027252197266, "global_step": 407332, "epoch": 4907} {"train_loss": -26.626203536987305, "global_step": 407333, "epoch": 4907} {"train_loss": -26.682348251342773, "global_step": 407334, "epoch": 4907} {"train_loss": -26.72230339050293, "global_step": 407335, "epoch": 4907} {"train_loss": -26.76726722717285, "global_step": 407336, "epoch": 4907} {"train_loss": -27.098968505859375, "global_step": 407337, "epoch": 4907} {"train_loss": -26.566425323486328, "global_step": 407338, "epoch": 4907} {"train_loss": -26.429670333862305, "global_step": 407339, "epoch": 4907} {"train_loss": -26.589563369750977, "global_step": 407340, "epoch": 4907} {"train_loss": -26.66762351989746, "global_step": 407341, "epoch": 4907} {"train_loss": -26.934799194335938, "global_step": 407342, "epoch": 4907} {"train_loss": -26.933252334594727, "global_step": 407343, "epoch": 4907} {"train_loss": -26.73719596862793, "global_step": 407344, "epoch": 4907} {"train_loss": -26.96368408203125, "global_step": 407345, "epoch": 4907} {"train_loss": -26.976898193359375, "global_step": 407346, "epoch": 4907} {"train_loss": -26.915771484375, "global_step": 407347, "epoch": 4907} {"train_loss": -26.833576202392578, "global_step": 407348, "epoch": 4907} {"train_loss": -26.765954971313477, "global_step": 407349, "epoch": 4907} {"train_loss": -26.987110137939453, "global_step": 407350, "epoch": 4907} {"train_loss": -26.885000228881836, "global_step": 407351, "epoch": 4907} {"train_loss": -26.917255401611328, "global_step": 407352, "epoch": 4907} {"train_loss": -27.1263484954834, "global_step": 407353, "epoch": 4907} {"train_loss": -26.868173599243164, "global_step": 407354, "epoch": 4907} {"train_loss": -27.203855514526367, "global_step": 407355, "epoch": 4907} {"train_loss": -26.430744171142578, "global_step": 407356, "epoch": 4907} {"train_loss": -26.62421989440918, "global_step": 407357, "epoch": 4907} {"train_loss": -26.99831199645996, "global_step": 407358, "epoch": 4907} {"train_loss": -26.78565788269043, "global_step": 407359, "epoch": 4907} {"train_loss": -26.881946563720703, "global_step": 407360, "epoch": 4907} {"train_loss": -26.66715431213379, "global_step": 407361, "epoch": 4907} {"train_loss": -26.837909698486328, "global_step": 407362, "epoch": 4907} {"train_loss": -26.402321597179736, "global_step": 407363, "epoch": 4907, "val_loss": 6824896.5} {"train_loss": -25.580629348754883, "global_step": 407364, "epoch": 4908} {"train_loss": -25.034391403198242, "global_step": 407365, "epoch": 4908} {"train_loss": -26.3049373626709, "global_step": 407366, "epoch": 4908} {"train_loss": -25.060258865356445, "global_step": 407367, "epoch": 4908} {"train_loss": -25.387069702148438, "global_step": 407368, "epoch": 4908} {"train_loss": -25.452289581298828, "global_step": 407369, "epoch": 4908} {"train_loss": -25.491714477539062, "global_step": 407370, "epoch": 4908} {"train_loss": -25.67682456970215, "global_step": 407371, "epoch": 4908} {"train_loss": -25.15545082092285, "global_step": 407372, "epoch": 4908} {"train_loss": -25.70277214050293, "global_step": 407373, "epoch": 4908} {"train_loss": -25.74493408203125, "global_step": 407374, "epoch": 4908} {"train_loss": -26.106985092163086, "global_step": 407375, "epoch": 4908} {"train_loss": -25.50581932067871, "global_step": 407376, "epoch": 4908} {"train_loss": -26.55533790588379, "global_step": 407377, "epoch": 4908} {"train_loss": -25.876951217651367, "global_step": 407378, "epoch": 4908} {"train_loss": -26.230783462524414, "global_step": 407379, "epoch": 4908} {"train_loss": -25.94007682800293, "global_step": 407380, "epoch": 4908} {"train_loss": -26.36855125427246, "global_step": 407381, "epoch": 4908} {"train_loss": -26.277219772338867, "global_step": 407382, "epoch": 4908} {"train_loss": -26.23089599609375, "global_step": 407383, "epoch": 4908} {"train_loss": -26.05267333984375, "global_step": 407384, "epoch": 4908} {"train_loss": -26.054853439331055, "global_step": 407385, "epoch": 4908} {"train_loss": -26.488998413085938, "global_step": 407386, "epoch": 4908} {"train_loss": -26.342260360717773, "global_step": 407387, "epoch": 4908} {"train_loss": -26.33951187133789, "global_step": 407388, "epoch": 4908} {"train_loss": -26.551618576049805, "global_step": 407389, "epoch": 4908} {"train_loss": -26.341434478759766, "global_step": 407390, "epoch": 4908} {"train_loss": -26.743207931518555, "global_step": 407391, "epoch": 4908} {"train_loss": -26.557361602783203, "global_step": 407392, "epoch": 4908} {"train_loss": -26.18375587463379, "global_step": 407393, "epoch": 4908} {"train_loss": -26.7428035736084, "global_step": 407394, "epoch": 4908} {"train_loss": -26.610258102416992, "global_step": 407395, "epoch": 4908} {"train_loss": -26.84136962890625, "global_step": 407396, "epoch": 4908} {"train_loss": -26.71870231628418, "global_step": 407397, "epoch": 4908} {"train_loss": -26.93794822692871, "global_step": 407398, "epoch": 4908} {"train_loss": -26.659271240234375, "global_step": 407399, "epoch": 4908} {"train_loss": -26.5274658203125, "global_step": 407400, "epoch": 4908} {"train_loss": -27.10479164123535, "global_step": 407401, "epoch": 4908} {"train_loss": -27.0604190826416, "global_step": 407402, "epoch": 4908} {"train_loss": -26.350006103515625, "global_step": 407403, "epoch": 4908} {"train_loss": -26.467390060424805, "global_step": 407404, "epoch": 4908} {"train_loss": -26.70087242126465, "global_step": 407405, "epoch": 4908} {"train_loss": -27.1676082611084, "global_step": 407406, "epoch": 4908} {"train_loss": -26.580411911010742, "global_step": 407407, "epoch": 4908} {"train_loss": -26.51422119140625, "global_step": 407408, "epoch": 4908} {"train_loss": -26.703811645507812, "global_step": 407409, "epoch": 4908} {"train_loss": -27.032621383666992, "global_step": 407410, "epoch": 4908} {"train_loss": -26.76102638244629, "global_step": 407411, "epoch": 4908} {"train_loss": -27.156553268432617, "global_step": 407412, "epoch": 4908} {"train_loss": -27.068450927734375, "global_step": 407413, "epoch": 4908} {"train_loss": -26.435272216796875, "global_step": 407414, "epoch": 4908} {"train_loss": -26.827009201049805, "global_step": 407415, "epoch": 4908} {"train_loss": -27.12493324279785, "global_step": 407416, "epoch": 4908} {"train_loss": -26.813901901245117, "global_step": 407417, "epoch": 4908} {"train_loss": -26.75055503845215, "global_step": 407418, "epoch": 4908} {"train_loss": -26.716222763061523, "global_step": 407419, "epoch": 4908} {"train_loss": -26.99647331237793, "global_step": 407420, "epoch": 4908} {"train_loss": -26.897180557250977, "global_step": 407421, "epoch": 4908} {"train_loss": -27.219608306884766, "global_step": 407422, "epoch": 4908} {"train_loss": -26.8914794921875, "global_step": 407423, "epoch": 4908} {"train_loss": -26.597003936767578, "global_step": 407424, "epoch": 4908} {"train_loss": -26.881254196166992, "global_step": 407425, "epoch": 4908} {"train_loss": -26.89484977722168, "global_step": 407426, "epoch": 4908} {"train_loss": -26.57305908203125, "global_step": 407427, "epoch": 4908} {"train_loss": -26.84144401550293, "global_step": 407428, "epoch": 4908} {"train_loss": -26.757476806640625, "global_step": 407429, "epoch": 4908} {"train_loss": -26.98137855529785, "global_step": 407430, "epoch": 4908} {"train_loss": -26.9034366607666, "global_step": 407431, "epoch": 4908} {"train_loss": -26.699491500854492, "global_step": 407432, "epoch": 4908} {"train_loss": -26.761205673217773, "global_step": 407433, "epoch": 4908} {"train_loss": -26.64657974243164, "global_step": 407434, "epoch": 4908} {"train_loss": -26.86191749572754, "global_step": 407435, "epoch": 4908} {"train_loss": -26.540210723876953, "global_step": 407436, "epoch": 4908} {"train_loss": -26.663450241088867, "global_step": 407437, "epoch": 4908} {"train_loss": -26.45180320739746, "global_step": 407438, "epoch": 4908} {"train_loss": -26.748249053955078, "global_step": 407439, "epoch": 4908} {"train_loss": -26.285207748413086, "global_step": 407440, "epoch": 4908} {"train_loss": -26.499746322631836, "global_step": 407441, "epoch": 4908} {"train_loss": -26.084365844726562, "global_step": 407442, "epoch": 4908} {"train_loss": -26.3297119140625, "global_step": 407443, "epoch": 4908} {"train_loss": -26.913990020751953, "global_step": 407444, "epoch": 4908} {"train_loss": -26.257953643798828, "global_step": 407445, "epoch": 4908} {"train_loss": -26.44589573503977, "global_step": 407446, "epoch": 4908, "val_loss": 6693327.5} {"train_loss": -24.34870719909668, "global_step": 407447, "epoch": 4909} {"train_loss": -25.548860549926758, "global_step": 407448, "epoch": 4909} {"train_loss": -24.139657974243164, "global_step": 407449, "epoch": 4909} {"train_loss": -25.00330924987793, "global_step": 407450, "epoch": 4909} {"train_loss": -25.58222770690918, "global_step": 407451, "epoch": 4909} {"train_loss": -24.866439819335938, "global_step": 407452, "epoch": 4909} {"train_loss": -25.88580322265625, "global_step": 407453, "epoch": 4909} {"train_loss": -26.002674102783203, "global_step": 407454, "epoch": 4909} {"train_loss": -25.457534790039062, "global_step": 407455, "epoch": 4909} {"train_loss": -25.78256607055664, "global_step": 407456, "epoch": 4909} {"train_loss": -25.258914947509766, "global_step": 407457, "epoch": 4909} {"train_loss": -25.829809188842773, "global_step": 407458, "epoch": 4909} {"train_loss": -25.804346084594727, "global_step": 407459, "epoch": 4909} {"train_loss": -25.66184425354004, "global_step": 407460, "epoch": 4909} {"train_loss": -25.9814395904541, "global_step": 407461, "epoch": 4909} {"train_loss": -25.6945858001709, "global_step": 407462, "epoch": 4909} {"train_loss": -26.21831703186035, "global_step": 407463, "epoch": 4909} {"train_loss": -25.84756851196289, "global_step": 407464, "epoch": 4909} {"train_loss": -26.020872116088867, "global_step": 407465, "epoch": 4909} {"train_loss": -26.394306182861328, "global_step": 407466, "epoch": 4909} {"train_loss": -26.19866943359375, "global_step": 407467, "epoch": 4909} {"train_loss": -26.26515769958496, "global_step": 407468, "epoch": 4909} {"train_loss": -25.984821319580078, "global_step": 407469, "epoch": 4909} {"train_loss": -26.076648712158203, "global_step": 407470, "epoch": 4909} {"train_loss": -26.374433517456055, "global_step": 407471, "epoch": 4909} {"train_loss": -26.262983322143555, "global_step": 407472, "epoch": 4909} {"train_loss": -26.20819664001465, "global_step": 407473, "epoch": 4909} {"train_loss": -26.067523956298828, "global_step": 407474, "epoch": 4909} {"train_loss": -26.475900650024414, "global_step": 407475, "epoch": 4909} {"train_loss": -26.095544815063477, "global_step": 407476, "epoch": 4909} {"train_loss": -26.112024307250977, "global_step": 407477, "epoch": 4909} {"train_loss": -26.6910343170166, "global_step": 407478, "epoch": 4909} {"train_loss": -26.043766021728516, "global_step": 407479, "epoch": 4909} {"train_loss": -26.28201675415039, "global_step": 407480, "epoch": 4909} {"train_loss": -26.63360023498535, "global_step": 407481, "epoch": 4909} {"train_loss": -26.536197662353516, "global_step": 407482, "epoch": 4909} {"train_loss": -26.715185165405273, "global_step": 407483, "epoch": 4909} {"train_loss": -26.330215454101562, "global_step": 407484, "epoch": 4909} {"train_loss": -26.455402374267578, "global_step": 407485, "epoch": 4909} {"train_loss": -27.034255981445312, "global_step": 407486, "epoch": 4909} {"train_loss": -26.336103439331055, "global_step": 407487, "epoch": 4909} {"train_loss": -26.04488182067871, "global_step": 407488, "epoch": 4909} {"train_loss": -26.57794189453125, "global_step": 407489, "epoch": 4909} {"train_loss": -26.34815788269043, "global_step": 407490, "epoch": 4909} {"train_loss": -26.52080726623535, "global_step": 407491, "epoch": 4909} {"train_loss": -26.229278564453125, "global_step": 407492, "epoch": 4909} {"train_loss": -26.91000747680664, "global_step": 407493, "epoch": 4909} {"train_loss": -26.533090591430664, "global_step": 407494, "epoch": 4909} {"train_loss": -26.48516273498535, "global_step": 407495, "epoch": 4909} {"train_loss": -26.760242462158203, "global_step": 407496, "epoch": 4909} {"train_loss": -26.77540397644043, "global_step": 407497, "epoch": 4909} {"train_loss": -26.6039981842041, "global_step": 407498, "epoch": 4909} {"train_loss": -26.4989070892334, "global_step": 407499, "epoch": 4909} {"train_loss": -27.15618324279785, "global_step": 407500, "epoch": 4909} {"train_loss": -26.37601661682129, "global_step": 407501, "epoch": 4909} {"train_loss": -27.065143585205078, "global_step": 407502, "epoch": 4909} {"train_loss": -26.593292236328125, "global_step": 407503, "epoch": 4909} {"train_loss": -26.55445671081543, "global_step": 407504, "epoch": 4909} {"train_loss": -26.913450241088867, "global_step": 407505, "epoch": 4909} {"train_loss": -26.850849151611328, "global_step": 407506, "epoch": 4909} {"train_loss": -26.403989791870117, "global_step": 407507, "epoch": 4909} {"train_loss": -26.7318115234375, "global_step": 407508, "epoch": 4909} {"train_loss": -26.948461532592773, "global_step": 407509, "epoch": 4909} {"train_loss": -26.932912826538086, "global_step": 407510, "epoch": 4909} {"train_loss": -26.90336036682129, "global_step": 407511, "epoch": 4909} {"train_loss": -26.4632511138916, "global_step": 407512, "epoch": 4909} {"train_loss": -26.845983505249023, "global_step": 407513, "epoch": 4909} {"train_loss": -26.468076705932617, "global_step": 407514, "epoch": 4909} {"train_loss": -26.7193660736084, "global_step": 407515, "epoch": 4909} {"train_loss": -26.401243209838867, "global_step": 407516, "epoch": 4909} {"train_loss": -26.5203857421875, "global_step": 407517, "epoch": 4909} {"train_loss": -26.83088493347168, "global_step": 407518, "epoch": 4909} {"train_loss": -26.8568115234375, "global_step": 407519, "epoch": 4909} {"train_loss": -26.763446807861328, "global_step": 407520, "epoch": 4909} {"train_loss": -26.76496696472168, "global_step": 407521, "epoch": 4909} {"train_loss": -26.877344131469727, "global_step": 407522, "epoch": 4909} {"train_loss": -26.902475357055664, "global_step": 407523, "epoch": 4909} {"train_loss": -27.119176864624023, "global_step": 407524, "epoch": 4909} {"train_loss": -26.86854362487793, "global_step": 407525, "epoch": 4909} {"train_loss": -27.057645797729492, "global_step": 407526, "epoch": 4909} {"train_loss": -27.291858673095703, "global_step": 407527, "epoch": 4909} {"train_loss": -27.2310733795166, "global_step": 407528, "epoch": 4909} {"train_loss": -26.348244150000884, "global_step": 407529, "epoch": 4909, "val_loss": 6713734.0} {"train_loss": -26.85418128967285, "global_step": 407530, "epoch": 4910} {"train_loss": -26.483930587768555, "global_step": 407531, "epoch": 4910} {"train_loss": -26.646167755126953, "global_step": 407532, "epoch": 4910} {"train_loss": -26.628326416015625, "global_step": 407533, "epoch": 4910} {"train_loss": -26.68535804748535, "global_step": 407534, "epoch": 4910} {"train_loss": -26.731815338134766, "global_step": 407535, "epoch": 4910} {"train_loss": -26.65228843688965, "global_step": 407536, "epoch": 4910} {"train_loss": -26.623395919799805, "global_step": 407537, "epoch": 4910} {"train_loss": -26.789966583251953, "global_step": 407538, "epoch": 4910} {"train_loss": -26.6362361907959, "global_step": 407539, "epoch": 4910} {"train_loss": -26.697467803955078, "global_step": 407540, "epoch": 4910} {"train_loss": -26.77662467956543, "global_step": 407541, "epoch": 4910} {"train_loss": -26.961572647094727, "global_step": 407542, "epoch": 4910} {"train_loss": -27.289350509643555, "global_step": 407543, "epoch": 4910} {"train_loss": -26.924673080444336, "global_step": 407544, "epoch": 4910} {"train_loss": -26.77412223815918, "global_step": 407545, "epoch": 4910} {"train_loss": -27.105772018432617, "global_step": 407546, "epoch": 4910} {"train_loss": -26.7476806640625, "global_step": 407547, "epoch": 4910} {"train_loss": -27.055334091186523, "global_step": 407548, "epoch": 4910} {"train_loss": -26.488845825195312, "global_step": 407549, "epoch": 4910} {"train_loss": -26.870685577392578, "global_step": 407550, "epoch": 4910} {"train_loss": -26.729572296142578, "global_step": 407551, "epoch": 4910} {"train_loss": -26.875446319580078, "global_step": 407552, "epoch": 4910} {"train_loss": -26.68405532836914, "global_step": 407553, "epoch": 4910} {"train_loss": -26.84050941467285, "global_step": 407554, "epoch": 4910} {"train_loss": -26.668317794799805, "global_step": 407555, "epoch": 4910} {"train_loss": -26.675739288330078, "global_step": 407556, "epoch": 4910} {"train_loss": -26.651386260986328, "global_step": 407557, "epoch": 4910} {"train_loss": -26.695261001586914, "global_step": 407558, "epoch": 4910} {"train_loss": -26.97517204284668, "global_step": 407559, "epoch": 4910} {"train_loss": -26.883222579956055, "global_step": 407560, "epoch": 4910} {"train_loss": -26.448932647705078, "global_step": 407561, "epoch": 4910} {"train_loss": -26.310277938842773, "global_step": 407562, "epoch": 4910} {"train_loss": -26.968524932861328, "global_step": 407563, "epoch": 4910} {"train_loss": -27.068134307861328, "global_step": 407564, "epoch": 4910} {"train_loss": -27.142608642578125, "global_step": 407565, "epoch": 4910} {"train_loss": -26.5028133392334, "global_step": 407566, "epoch": 4910} {"train_loss": -26.7545108795166, "global_step": 407567, "epoch": 4910} {"train_loss": -26.843358993530273, "global_step": 407568, "epoch": 4910} {"train_loss": -26.735065460205078, "global_step": 407569, "epoch": 4910} {"train_loss": -27.098791122436523, "global_step": 407570, "epoch": 4910} {"train_loss": -26.663074493408203, "global_step": 407571, "epoch": 4910} {"train_loss": -26.48067283630371, "global_step": 407572, "epoch": 4910} {"train_loss": -26.821813583374023, "global_step": 407573, "epoch": 4910} {"train_loss": -26.839614868164062, "global_step": 407574, "epoch": 4910} {"train_loss": -26.51325035095215, "global_step": 407575, "epoch": 4910} {"train_loss": -26.33342933654785, "global_step": 407576, "epoch": 4910} {"train_loss": -26.361499786376953, "global_step": 407577, "epoch": 4910} {"train_loss": -26.690771102905273, "global_step": 407578, "epoch": 4910} {"train_loss": -26.90130615234375, "global_step": 407579, "epoch": 4910} {"train_loss": -26.642419815063477, "global_step": 407580, "epoch": 4910} {"train_loss": -26.590051651000977, "global_step": 407581, "epoch": 4910} {"train_loss": -26.84052848815918, "global_step": 407582, "epoch": 4910} {"train_loss": -26.766000747680664, "global_step": 407583, "epoch": 4910} {"train_loss": -26.494245529174805, "global_step": 407584, "epoch": 4910} {"train_loss": -26.342004776000977, "global_step": 407585, "epoch": 4910} {"train_loss": -26.332990646362305, "global_step": 407586, "epoch": 4910} {"train_loss": -27.057188034057617, "global_step": 407587, "epoch": 4910} {"train_loss": -26.58869743347168, "global_step": 407588, "epoch": 4910} {"train_loss": -26.752460479736328, "global_step": 407589, "epoch": 4910} {"train_loss": -26.40662956237793, "global_step": 407590, "epoch": 4910} {"train_loss": -26.671268463134766, "global_step": 407591, "epoch": 4910} {"train_loss": -26.31534767150879, "global_step": 407592, "epoch": 4910} {"train_loss": -26.03619384765625, "global_step": 407593, "epoch": 4910} {"train_loss": -26.56598472595215, "global_step": 407594, "epoch": 4910} {"train_loss": -26.5234375, "global_step": 407595, "epoch": 4910} {"train_loss": -26.194217681884766, "global_step": 407596, "epoch": 4910} {"train_loss": -26.975662231445312, "global_step": 407597, "epoch": 4910} {"train_loss": -26.520282745361328, "global_step": 407598, "epoch": 4910} {"train_loss": -26.890466690063477, "global_step": 407599, "epoch": 4910} {"train_loss": -26.568761825561523, "global_step": 407600, "epoch": 4910} {"train_loss": -26.50537109375, "global_step": 407601, "epoch": 4910} {"train_loss": -27.063562393188477, "global_step": 407602, "epoch": 4910} {"train_loss": -26.651601791381836, "global_step": 407603, "epoch": 4910} {"train_loss": -26.586767196655273, "global_step": 407604, "epoch": 4910} {"train_loss": -26.45810890197754, "global_step": 407605, "epoch": 4910} {"train_loss": -26.405445098876953, "global_step": 407606, "epoch": 4910} {"train_loss": -26.551679611206055, "global_step": 407607, "epoch": 4910} {"train_loss": -27.047250747680664, "global_step": 407608, "epoch": 4910} {"train_loss": -26.576623916625977, "global_step": 407609, "epoch": 4910} {"train_loss": -26.653308868408203, "global_step": 407610, "epoch": 4910} {"train_loss": -26.74648094177246, "global_step": 407611, "epoch": 4910} {"train_loss": -26.68153769711414, "global_step": 407612, "epoch": 4910, "val_loss": 6752609.0} {"train_loss": -25.372236251831055, "global_step": 407613, "epoch": 4911} {"train_loss": -25.765399932861328, "global_step": 407614, "epoch": 4911} {"train_loss": -26.092350006103516, "global_step": 407615, "epoch": 4911} {"train_loss": -25.27825164794922, "global_step": 407616, "epoch": 4911} {"train_loss": -25.213808059692383, "global_step": 407617, "epoch": 4911} {"train_loss": -26.315155029296875, "global_step": 407618, "epoch": 4911} {"train_loss": -25.802106857299805, "global_step": 407619, "epoch": 4911} {"train_loss": -25.93531608581543, "global_step": 407620, "epoch": 4911} {"train_loss": -25.586912155151367, "global_step": 407621, "epoch": 4911} {"train_loss": -25.908233642578125, "global_step": 407622, "epoch": 4911} {"train_loss": -26.125741958618164, "global_step": 407623, "epoch": 4911} {"train_loss": -25.616308212280273, "global_step": 407624, "epoch": 4911} {"train_loss": -26.093708038330078, "global_step": 407625, "epoch": 4911} {"train_loss": -26.39888572692871, "global_step": 407626, "epoch": 4911} {"train_loss": -26.2072811126709, "global_step": 407627, "epoch": 4911} {"train_loss": -26.131717681884766, "global_step": 407628, "epoch": 4911} {"train_loss": -26.50897216796875, "global_step": 407629, "epoch": 4911} {"train_loss": -25.93238639831543, "global_step": 407630, "epoch": 4911} {"train_loss": -26.263975143432617, "global_step": 407631, "epoch": 4911} {"train_loss": -26.429553985595703, "global_step": 407632, "epoch": 4911} {"train_loss": -25.81964683532715, "global_step": 407633, "epoch": 4911} {"train_loss": -26.594297409057617, "global_step": 407634, "epoch": 4911} {"train_loss": -26.20574378967285, "global_step": 407635, "epoch": 4911} {"train_loss": -26.299243927001953, "global_step": 407636, "epoch": 4911} {"train_loss": -26.802656173706055, "global_step": 407637, "epoch": 4911} {"train_loss": -26.489166259765625, "global_step": 407638, "epoch": 4911} {"train_loss": -26.6426944732666, "global_step": 407639, "epoch": 4911} {"train_loss": -26.492589950561523, "global_step": 407640, "epoch": 4911} {"train_loss": -26.47016716003418, "global_step": 407641, "epoch": 4911} {"train_loss": -26.883142471313477, "global_step": 407642, "epoch": 4911} {"train_loss": -26.6668643951416, "global_step": 407643, "epoch": 4911} {"train_loss": -26.64739990234375, "global_step": 407644, "epoch": 4911} {"train_loss": -26.921133041381836, "global_step": 407645, "epoch": 4911} {"train_loss": -26.7435245513916, "global_step": 407646, "epoch": 4911} {"train_loss": -26.386770248413086, "global_step": 407647, "epoch": 4911} {"train_loss": -26.707468032836914, "global_step": 407648, "epoch": 4911} {"train_loss": -26.588682174682617, "global_step": 407649, "epoch": 4911} {"train_loss": -26.818531036376953, "global_step": 407650, "epoch": 4911} {"train_loss": -26.55731201171875, "global_step": 407651, "epoch": 4911} {"train_loss": -26.90610122680664, "global_step": 407652, "epoch": 4911} {"train_loss": -26.70087242126465, "global_step": 407653, "epoch": 4911} {"train_loss": -26.7100830078125, "global_step": 407654, "epoch": 4911} {"train_loss": -27.113183975219727, "global_step": 407655, "epoch": 4911} {"train_loss": -26.638586044311523, "global_step": 407656, "epoch": 4911} {"train_loss": -26.823944091796875, "global_step": 407657, "epoch": 4911} {"train_loss": -26.794031143188477, "global_step": 407658, "epoch": 4911} {"train_loss": -26.782079696655273, "global_step": 407659, "epoch": 4911} {"train_loss": -26.962255477905273, "global_step": 407660, "epoch": 4911} {"train_loss": -26.96742820739746, "global_step": 407661, "epoch": 4911} {"train_loss": -26.866073608398438, "global_step": 407662, "epoch": 4911} {"train_loss": -26.74617576599121, "global_step": 407663, "epoch": 4911} {"train_loss": -26.57071876525879, "global_step": 407664, "epoch": 4911} {"train_loss": -26.620532989501953, "global_step": 407665, "epoch": 4911} {"train_loss": -27.084985733032227, "global_step": 407666, "epoch": 4911} {"train_loss": -26.96729850769043, "global_step": 407667, "epoch": 4911} {"train_loss": -26.695392608642578, "global_step": 407668, "epoch": 4911} {"train_loss": -26.720800399780273, "global_step": 407669, "epoch": 4911} {"train_loss": -27.06853675842285, "global_step": 407670, "epoch": 4911} {"train_loss": -26.686115264892578, "global_step": 407671, "epoch": 4911} {"train_loss": -26.209192276000977, "global_step": 407672, "epoch": 4911} {"train_loss": -27.0980281829834, "global_step": 407673, "epoch": 4911} {"train_loss": -26.889240264892578, "global_step": 407674, "epoch": 4911} {"train_loss": -26.888538360595703, "global_step": 407675, "epoch": 4911} {"train_loss": -26.498798370361328, "global_step": 407676, "epoch": 4911} {"train_loss": -26.628936767578125, "global_step": 407677, "epoch": 4911} {"train_loss": -26.944934844970703, "global_step": 407678, "epoch": 4911} {"train_loss": -27.09528923034668, "global_step": 407679, "epoch": 4911} {"train_loss": -26.967395782470703, "global_step": 407680, "epoch": 4911} {"train_loss": -26.980518341064453, "global_step": 407681, "epoch": 4911} {"train_loss": -26.678730010986328, "global_step": 407682, "epoch": 4911} {"train_loss": -27.094472885131836, "global_step": 407683, "epoch": 4911} {"train_loss": -27.255117416381836, "global_step": 407684, "epoch": 4911} {"train_loss": -26.60544776916504, "global_step": 407685, "epoch": 4911} {"train_loss": -26.817819595336914, "global_step": 407686, "epoch": 4911} {"train_loss": -26.789525985717773, "global_step": 407687, "epoch": 4911} {"train_loss": -26.72263526916504, "global_step": 407688, "epoch": 4911} {"train_loss": -26.715917587280273, "global_step": 407689, "epoch": 4911} {"train_loss": -26.214553833007812, "global_step": 407690, "epoch": 4911} {"train_loss": -26.25966453552246, "global_step": 407691, "epoch": 4911} {"train_loss": -26.4262638092041, "global_step": 407692, "epoch": 4911} {"train_loss": -26.71668815612793, "global_step": 407693, "epoch": 4911} {"train_loss": -26.853559494018555, "global_step": 407694, "epoch": 4911} {"train_loss": -26.53155064870076, "global_step": 407695, "epoch": 4911, "val_loss": 6678963.0} {"train_loss": -24.080299377441406, "global_step": 407696, "epoch": 4912} {"train_loss": -24.482254028320312, "global_step": 407697, "epoch": 4912} {"train_loss": -25.650266647338867, "global_step": 407698, "epoch": 4912} {"train_loss": -25.166156768798828, "global_step": 407699, "epoch": 4912} {"train_loss": -26.03635025024414, "global_step": 407700, "epoch": 4912} {"train_loss": -24.844898223876953, "global_step": 407701, "epoch": 4912} {"train_loss": -25.211158752441406, "global_step": 407702, "epoch": 4912} {"train_loss": -25.33875846862793, "global_step": 407703, "epoch": 4912} {"train_loss": -26.035816192626953, "global_step": 407704, "epoch": 4912} {"train_loss": -25.828542709350586, "global_step": 407705, "epoch": 4912} {"train_loss": -25.83295249938965, "global_step": 407706, "epoch": 4912} {"train_loss": -25.879613876342773, "global_step": 407707, "epoch": 4912} {"train_loss": -25.966053009033203, "global_step": 407708, "epoch": 4912} {"train_loss": -25.8957576751709, "global_step": 407709, "epoch": 4912} {"train_loss": -26.153417587280273, "global_step": 407710, "epoch": 4912} {"train_loss": -25.8896541595459, "global_step": 407711, "epoch": 4912} {"train_loss": -26.204111099243164, "global_step": 407712, "epoch": 4912} {"train_loss": -26.189929962158203, "global_step": 407713, "epoch": 4912} {"train_loss": -26.00392723083496, "global_step": 407714, "epoch": 4912} {"train_loss": -25.832712173461914, "global_step": 407715, "epoch": 4912} {"train_loss": -26.099653244018555, "global_step": 407716, "epoch": 4912} {"train_loss": -26.04945182800293, "global_step": 407717, "epoch": 4912} {"train_loss": -25.601163864135742, "global_step": 407718, "epoch": 4912} {"train_loss": -25.786481857299805, "global_step": 407719, "epoch": 4912} {"train_loss": -26.00771141052246, "global_step": 407720, "epoch": 4912} {"train_loss": -25.860370635986328, "global_step": 407721, "epoch": 4912} {"train_loss": -26.039770126342773, "global_step": 407722, "epoch": 4912} {"train_loss": -26.26852798461914, "global_step": 407723, "epoch": 4912} {"train_loss": -25.829076766967773, "global_step": 407724, "epoch": 4912} {"train_loss": -26.427892684936523, "global_step": 407725, "epoch": 4912} {"train_loss": -26.30904197692871, "global_step": 407726, "epoch": 4912} {"train_loss": -26.29805564880371, "global_step": 407727, "epoch": 4912} {"train_loss": -26.505369186401367, "global_step": 407728, "epoch": 4912} {"train_loss": -26.31435203552246, "global_step": 407729, "epoch": 4912} {"train_loss": -26.142602920532227, "global_step": 407730, "epoch": 4912} {"train_loss": -26.881616592407227, "global_step": 407731, "epoch": 4912} {"train_loss": -26.483346939086914, "global_step": 407732, "epoch": 4912} {"train_loss": -26.54644203186035, "global_step": 407733, "epoch": 4912} {"train_loss": -26.241525650024414, "global_step": 407734, "epoch": 4912} {"train_loss": -26.747516632080078, "global_step": 407735, "epoch": 4912} {"train_loss": -26.703964233398438, "global_step": 407736, "epoch": 4912} {"train_loss": -26.445220947265625, "global_step": 407737, "epoch": 4912} {"train_loss": -26.782917022705078, "global_step": 407738, "epoch": 4912} {"train_loss": -26.17111587524414, "global_step": 407739, "epoch": 4912} {"train_loss": -27.080408096313477, "global_step": 407740, "epoch": 4912} {"train_loss": -26.15693473815918, "global_step": 407741, "epoch": 4912} {"train_loss": -26.75518226623535, "global_step": 407742, "epoch": 4912} {"train_loss": -26.804828643798828, "global_step": 407743, "epoch": 4912} {"train_loss": -26.85879898071289, "global_step": 407744, "epoch": 4912} {"train_loss": -26.817611694335938, "global_step": 407745, "epoch": 4912} {"train_loss": -26.60249137878418, "global_step": 407746, "epoch": 4912} {"train_loss": -26.80191993713379, "global_step": 407747, "epoch": 4912} {"train_loss": -26.687213897705078, "global_step": 407748, "epoch": 4912} {"train_loss": -26.398090362548828, "global_step": 407749, "epoch": 4912} {"train_loss": -26.507007598876953, "global_step": 407750, "epoch": 4912} {"train_loss": -26.802658081054688, "global_step": 407751, "epoch": 4912} {"train_loss": -26.510236740112305, "global_step": 407752, "epoch": 4912} {"train_loss": -26.607654571533203, "global_step": 407753, "epoch": 4912} {"train_loss": -26.98809814453125, "global_step": 407754, "epoch": 4912} {"train_loss": -26.551565170288086, "global_step": 407755, "epoch": 4912} {"train_loss": -26.77451515197754, "global_step": 407756, "epoch": 4912} {"train_loss": -27.12054443359375, "global_step": 407757, "epoch": 4912} {"train_loss": -26.200231552124023, "global_step": 407758, "epoch": 4912} {"train_loss": -26.69937515258789, "global_step": 407759, "epoch": 4912} {"train_loss": -26.759002685546875, "global_step": 407760, "epoch": 4912} {"train_loss": -26.588659286499023, "global_step": 407761, "epoch": 4912} {"train_loss": -26.992040634155273, "global_step": 407762, "epoch": 4912} {"train_loss": -26.729206085205078, "global_step": 407763, "epoch": 4912} {"train_loss": -26.84223747253418, "global_step": 407764, "epoch": 4912} {"train_loss": -26.789234161376953, "global_step": 407765, "epoch": 4912} {"train_loss": -26.596912384033203, "global_step": 407766, "epoch": 4912} {"train_loss": -27.0791072845459, "global_step": 407767, "epoch": 4912} {"train_loss": -26.37237548828125, "global_step": 407768, "epoch": 4912} {"train_loss": -27.26238441467285, "global_step": 407769, "epoch": 4912} {"train_loss": -26.509428024291992, "global_step": 407770, "epoch": 4912} {"train_loss": -27.00016212463379, "global_step": 407771, "epoch": 4912} {"train_loss": -26.520404815673828, "global_step": 407772, "epoch": 4912} {"train_loss": -26.662382125854492, "global_step": 407773, "epoch": 4912} {"train_loss": -26.433263778686523, "global_step": 407774, "epoch": 4912} {"train_loss": -27.101917266845703, "global_step": 407775, "epoch": 4912} {"train_loss": -26.79107666015625, "global_step": 407776, "epoch": 4912} {"train_loss": -26.60941505432129, "global_step": 407777, "epoch": 4912} {"train_loss": -26.335717580404626, "global_step": 407778, "epoch": 4912, "val_loss": 6690701.5} {"train_loss": -26.00750160217285, "global_step": 407779, "epoch": 4913} {"train_loss": -25.691024780273438, "global_step": 407780, "epoch": 4913} {"train_loss": -26.231245040893555, "global_step": 407781, "epoch": 4913} {"train_loss": -26.138553619384766, "global_step": 407782, "epoch": 4913} {"train_loss": -25.39786148071289, "global_step": 407783, "epoch": 4913} {"train_loss": -26.0457706451416, "global_step": 407784, "epoch": 4913} {"train_loss": -26.357437133789062, "global_step": 407785, "epoch": 4913} {"train_loss": -25.800983428955078, "global_step": 407786, "epoch": 4913} {"train_loss": -25.900775909423828, "global_step": 407787, "epoch": 4913} {"train_loss": -26.121536254882812, "global_step": 407788, "epoch": 4913} {"train_loss": -26.462921142578125, "global_step": 407789, "epoch": 4913} {"train_loss": -26.45871925354004, "global_step": 407790, "epoch": 4913} {"train_loss": -26.275732040405273, "global_step": 407791, "epoch": 4913} {"train_loss": -26.492889404296875, "global_step": 407792, "epoch": 4913} {"train_loss": -26.337671279907227, "global_step": 407793, "epoch": 4913} {"train_loss": -26.89151954650879, "global_step": 407794, "epoch": 4913} {"train_loss": -26.532764434814453, "global_step": 407795, "epoch": 4913} {"train_loss": -26.617233276367188, "global_step": 407796, "epoch": 4913} {"train_loss": -26.072546005249023, "global_step": 407797, "epoch": 4913} {"train_loss": -26.616724014282227, "global_step": 407798, "epoch": 4913} {"train_loss": -26.599609375, "global_step": 407799, "epoch": 4913} {"train_loss": -26.6107177734375, "global_step": 407800, "epoch": 4913} {"train_loss": -26.16282081604004, "global_step": 407801, "epoch": 4913} {"train_loss": -26.4813232421875, "global_step": 407802, "epoch": 4913} {"train_loss": -26.749439239501953, "global_step": 407803, "epoch": 4913} {"train_loss": -26.56487464904785, "global_step": 407804, "epoch": 4913} {"train_loss": -26.408721923828125, "global_step": 407805, "epoch": 4913} {"train_loss": -26.569305419921875, "global_step": 407806, "epoch": 4913} {"train_loss": -26.502918243408203, "global_step": 407807, "epoch": 4913} {"train_loss": -26.637130737304688, "global_step": 407808, "epoch": 4913} {"train_loss": -26.952411651611328, "global_step": 407809, "epoch": 4913} {"train_loss": -26.685535430908203, "global_step": 407810, "epoch": 4913} {"train_loss": -26.811216354370117, "global_step": 407811, "epoch": 4913} {"train_loss": -26.699384689331055, "global_step": 407812, "epoch": 4913} {"train_loss": -26.946252822875977, "global_step": 407813, "epoch": 4913} {"train_loss": -26.605560302734375, "global_step": 407814, "epoch": 4913} {"train_loss": -26.776803970336914, "global_step": 407815, "epoch": 4913} {"train_loss": -26.522382736206055, "global_step": 407816, "epoch": 4913} {"train_loss": -26.322967529296875, "global_step": 407817, "epoch": 4913} {"train_loss": -26.447284698486328, "global_step": 407818, "epoch": 4913} {"train_loss": -26.98890495300293, "global_step": 407819, "epoch": 4913} {"train_loss": -26.246984481811523, "global_step": 407820, "epoch": 4913} {"train_loss": -26.354665756225586, "global_step": 407821, "epoch": 4913} {"train_loss": -26.302570343017578, "global_step": 407822, "epoch": 4913} {"train_loss": -27.050769805908203, "global_step": 407823, "epoch": 4913} {"train_loss": -26.71466064453125, "global_step": 407824, "epoch": 4913} {"train_loss": -26.607080459594727, "global_step": 407825, "epoch": 4913} {"train_loss": -26.79109001159668, "global_step": 407826, "epoch": 4913} {"train_loss": -26.59394645690918, "global_step": 407827, "epoch": 4913} {"train_loss": -26.451501846313477, "global_step": 407828, "epoch": 4913} {"train_loss": -27.257810592651367, "global_step": 407829, "epoch": 4913} {"train_loss": -26.895959854125977, "global_step": 407830, "epoch": 4913} {"train_loss": -26.794437408447266, "global_step": 407831, "epoch": 4913} {"train_loss": -26.704374313354492, "global_step": 407832, "epoch": 4913} {"train_loss": -26.993961334228516, "global_step": 407833, "epoch": 4913} {"train_loss": -26.907052993774414, "global_step": 407834, "epoch": 4913} {"train_loss": -26.791614532470703, "global_step": 407835, "epoch": 4913} {"train_loss": -26.889738082885742, "global_step": 407836, "epoch": 4913} {"train_loss": -26.217615127563477, "global_step": 407837, "epoch": 4913} {"train_loss": -26.369403839111328, "global_step": 407838, "epoch": 4913} {"train_loss": -26.62391471862793, "global_step": 407839, "epoch": 4913} {"train_loss": -26.213605880737305, "global_step": 407840, "epoch": 4913} {"train_loss": -26.306650161743164, "global_step": 407841, "epoch": 4913} {"train_loss": -26.27975845336914, "global_step": 407842, "epoch": 4913} {"train_loss": -26.44814109802246, "global_step": 407843, "epoch": 4913} {"train_loss": -26.72525405883789, "global_step": 407844, "epoch": 4913} {"train_loss": -27.116012573242188, "global_step": 407845, "epoch": 4913} {"train_loss": -27.2027530670166, "global_step": 407846, "epoch": 4913} {"train_loss": -27.227283477783203, "global_step": 407847, "epoch": 4913} {"train_loss": -26.25123405456543, "global_step": 407848, "epoch": 4913} {"train_loss": -26.58499526977539, "global_step": 407849, "epoch": 4913} {"train_loss": -26.72527503967285, "global_step": 407850, "epoch": 4913} {"train_loss": -26.756397247314453, "global_step": 407851, "epoch": 4913} {"train_loss": -26.878955841064453, "global_step": 407852, "epoch": 4913} {"train_loss": -26.781049728393555, "global_step": 407853, "epoch": 4913} {"train_loss": -26.9002685546875, "global_step": 407854, "epoch": 4913} {"train_loss": -26.813390731811523, "global_step": 407855, "epoch": 4913} {"train_loss": -27.150110244750977, "global_step": 407856, "epoch": 4913} {"train_loss": -26.696802139282227, "global_step": 407857, "epoch": 4913} {"train_loss": -26.78728675842285, "global_step": 407858, "epoch": 4913} {"train_loss": -26.645299911499023, "global_step": 407859, "epoch": 4913} {"train_loss": -26.94891357421875, "global_step": 407860, "epoch": 4913} {"train_loss": -26.567158273903722, "global_step": 407861, "epoch": 4913, "val_loss": 7004892.0} {"train_loss": -23.6555233001709, "global_step": 407862, "epoch": 4914} {"train_loss": -23.245534896850586, "global_step": 407863, "epoch": 4914} {"train_loss": -24.267324447631836, "global_step": 407864, "epoch": 4914} {"train_loss": -24.11313819885254, "global_step": 407865, "epoch": 4914} {"train_loss": -24.03767967224121, "global_step": 407866, "epoch": 4914} {"train_loss": -25.52978515625, "global_step": 407867, "epoch": 4914} {"train_loss": -24.025672912597656, "global_step": 407868, "epoch": 4914} {"train_loss": -24.647109985351562, "global_step": 407869, "epoch": 4914} {"train_loss": -24.761693954467773, "global_step": 407870, "epoch": 4914} {"train_loss": -25.336393356323242, "global_step": 407871, "epoch": 4914} {"train_loss": -24.91724967956543, "global_step": 407872, "epoch": 4914} {"train_loss": -24.75193214416504, "global_step": 407873, "epoch": 4914} {"train_loss": -25.498252868652344, "global_step": 407874, "epoch": 4914} {"train_loss": -25.24018669128418, "global_step": 407875, "epoch": 4914} {"train_loss": -25.36756706237793, "global_step": 407876, "epoch": 4914} {"train_loss": -25.21672248840332, "global_step": 407877, "epoch": 4914} {"train_loss": -25.314985275268555, "global_step": 407878, "epoch": 4914} {"train_loss": -25.54306411743164, "global_step": 407879, "epoch": 4914} {"train_loss": -25.497756958007812, "global_step": 407880, "epoch": 4914} {"train_loss": -25.296823501586914, "global_step": 407881, "epoch": 4914} {"train_loss": -25.835050582885742, "global_step": 407882, "epoch": 4914} {"train_loss": -25.822294235229492, "global_step": 407883, "epoch": 4914} {"train_loss": -25.852872848510742, "global_step": 407884, "epoch": 4914} {"train_loss": -25.999420166015625, "global_step": 407885, "epoch": 4914} {"train_loss": -25.884124755859375, "global_step": 407886, "epoch": 4914} {"train_loss": -26.091760635375977, "global_step": 407887, "epoch": 4914} {"train_loss": -25.900604248046875, "global_step": 407888, "epoch": 4914} {"train_loss": -25.946455001831055, "global_step": 407889, "epoch": 4914} {"train_loss": -25.973037719726562, "global_step": 407890, "epoch": 4914} {"train_loss": -26.19675064086914, "global_step": 407891, "epoch": 4914} {"train_loss": -26.34193229675293, "global_step": 407892, "epoch": 4914} {"train_loss": -26.002979278564453, "global_step": 407893, "epoch": 4914} {"train_loss": -26.265356063842773, "global_step": 407894, "epoch": 4914} {"train_loss": -26.3671817779541, "global_step": 407895, "epoch": 4914} {"train_loss": -26.21393394470215, "global_step": 407896, "epoch": 4914} {"train_loss": -26.1818904876709, "global_step": 407897, "epoch": 4914} {"train_loss": -26.40095329284668, "global_step": 407898, "epoch": 4914} {"train_loss": -26.664411544799805, "global_step": 407899, "epoch": 4914} {"train_loss": -26.452716827392578, "global_step": 407900, "epoch": 4914} {"train_loss": -26.2951717376709, "global_step": 407901, "epoch": 4914} {"train_loss": -26.39175796508789, "global_step": 407902, "epoch": 4914} {"train_loss": -26.60040283203125, "global_step": 407903, "epoch": 4914} {"train_loss": -26.589466094970703, "global_step": 407904, "epoch": 4914} {"train_loss": -26.67475700378418, "global_step": 407905, "epoch": 4914} {"train_loss": -26.8971004486084, "global_step": 407906, "epoch": 4914} {"train_loss": -26.4946346282959, "global_step": 407907, "epoch": 4914} {"train_loss": -26.596277236938477, "global_step": 407908, "epoch": 4914} {"train_loss": -26.805755615234375, "global_step": 407909, "epoch": 4914} {"train_loss": -26.492502212524414, "global_step": 407910, "epoch": 4914} {"train_loss": -26.560754776000977, "global_step": 407911, "epoch": 4914} {"train_loss": -26.826215744018555, "global_step": 407912, "epoch": 4914} {"train_loss": -26.966520309448242, "global_step": 407913, "epoch": 4914} {"train_loss": -26.668109893798828, "global_step": 407914, "epoch": 4914} {"train_loss": -27.026752471923828, "global_step": 407915, "epoch": 4914} {"train_loss": -26.567169189453125, "global_step": 407916, "epoch": 4914} {"train_loss": -26.77203941345215, "global_step": 407917, "epoch": 4914} {"train_loss": -27.030126571655273, "global_step": 407918, "epoch": 4914} {"train_loss": -26.907123565673828, "global_step": 407919, "epoch": 4914} {"train_loss": -26.810688018798828, "global_step": 407920, "epoch": 4914} {"train_loss": -26.852874755859375, "global_step": 407921, "epoch": 4914} {"train_loss": -26.896459579467773, "global_step": 407922, "epoch": 4914} {"train_loss": -26.8156795501709, "global_step": 407923, "epoch": 4914} {"train_loss": -26.594833374023438, "global_step": 407924, "epoch": 4914} {"train_loss": -26.679019927978516, "global_step": 407925, "epoch": 4914} {"train_loss": -26.899084091186523, "global_step": 407926, "epoch": 4914} {"train_loss": -26.880537033081055, "global_step": 407927, "epoch": 4914} {"train_loss": -27.13517189025879, "global_step": 407928, "epoch": 4914} {"train_loss": -26.57259178161621, "global_step": 407929, "epoch": 4914} {"train_loss": -26.558530807495117, "global_step": 407930, "epoch": 4914} {"train_loss": -27.21076011657715, "global_step": 407931, "epoch": 4914} {"train_loss": -27.021474838256836, "global_step": 407932, "epoch": 4914} {"train_loss": -26.6353702545166, "global_step": 407933, "epoch": 4914} {"train_loss": -26.712039947509766, "global_step": 407934, "epoch": 4914} {"train_loss": -27.14108657836914, "global_step": 407935, "epoch": 4914} {"train_loss": -26.757247924804688, "global_step": 407936, "epoch": 4914} {"train_loss": -26.96689224243164, "global_step": 407937, "epoch": 4914} {"train_loss": -26.89996910095215, "global_step": 407938, "epoch": 4914} {"train_loss": -26.867597579956055, "global_step": 407939, "epoch": 4914} {"train_loss": -26.75098991394043, "global_step": 407940, "epoch": 4914} {"train_loss": -26.80682373046875, "global_step": 407941, "epoch": 4914} {"train_loss": -26.683090209960938, "global_step": 407942, "epoch": 4914} {"train_loss": -26.52052116394043, "global_step": 407943, "epoch": 4914} {"train_loss": -26.163633001856056, "global_step": 407944, "epoch": 4914, "val_loss": 6667202.0} {"train_loss": -25.4443302154541, "global_step": 407945, "epoch": 4915} {"train_loss": -25.547039031982422, "global_step": 407946, "epoch": 4915} {"train_loss": -25.0460205078125, "global_step": 407947, "epoch": 4915} {"train_loss": -25.60882568359375, "global_step": 407948, "epoch": 4915} {"train_loss": -25.876928329467773, "global_step": 407949, "epoch": 4915} {"train_loss": -25.729995727539062, "global_step": 407950, "epoch": 4915} {"train_loss": -25.9395694732666, "global_step": 407951, "epoch": 4915} {"train_loss": -25.928253173828125, "global_step": 407952, "epoch": 4915} {"train_loss": -25.807538986206055, "global_step": 407953, "epoch": 4915} {"train_loss": -25.987411499023438, "global_step": 407954, "epoch": 4915} {"train_loss": -25.95997428894043, "global_step": 407955, "epoch": 4915} {"train_loss": -25.906885147094727, "global_step": 407956, "epoch": 4915} {"train_loss": -25.802387237548828, "global_step": 407957, "epoch": 4915} {"train_loss": -26.398059844970703, "global_step": 407958, "epoch": 4915} {"train_loss": -26.2274169921875, "global_step": 407959, "epoch": 4915} {"train_loss": -26.402963638305664, "global_step": 407960, "epoch": 4915} {"train_loss": -26.17047691345215, "global_step": 407961, "epoch": 4915} {"train_loss": -25.995569229125977, "global_step": 407962, "epoch": 4915} {"train_loss": -26.418386459350586, "global_step": 407963, "epoch": 4915} {"train_loss": -26.364002227783203, "global_step": 407964, "epoch": 4915} {"train_loss": -26.265546798706055, "global_step": 407965, "epoch": 4915} {"train_loss": -26.27691650390625, "global_step": 407966, "epoch": 4915} {"train_loss": -26.325363159179688, "global_step": 407967, "epoch": 4915} {"train_loss": -26.566823959350586, "global_step": 407968, "epoch": 4915} {"train_loss": -26.740283966064453, "global_step": 407969, "epoch": 4915} {"train_loss": -26.240478515625, "global_step": 407970, "epoch": 4915} {"train_loss": -26.577909469604492, "global_step": 407971, "epoch": 4915} {"train_loss": -26.724164962768555, "global_step": 407972, "epoch": 4915} {"train_loss": -26.46394157409668, "global_step": 407973, "epoch": 4915} {"train_loss": -26.42658042907715, "global_step": 407974, "epoch": 4915} {"train_loss": -26.50531578063965, "global_step": 407975, "epoch": 4915} {"train_loss": -26.631427764892578, "global_step": 407976, "epoch": 4915} {"train_loss": -26.41880226135254, "global_step": 407977, "epoch": 4915} {"train_loss": -26.83056640625, "global_step": 407978, "epoch": 4915} {"train_loss": -26.55901527404785, "global_step": 407979, "epoch": 4915} {"train_loss": -26.55698585510254, "global_step": 407980, "epoch": 4915} {"train_loss": -26.70782470703125, "global_step": 407981, "epoch": 4915} {"train_loss": -26.676624298095703, "global_step": 407982, "epoch": 4915} {"train_loss": -26.635583877563477, "global_step": 407983, "epoch": 4915} {"train_loss": -26.726293563842773, "global_step": 407984, "epoch": 4915} {"train_loss": -26.664945602416992, "global_step": 407985, "epoch": 4915} {"train_loss": -26.759536743164062, "global_step": 407986, "epoch": 4915} {"train_loss": -26.68134117126465, "global_step": 407987, "epoch": 4915} {"train_loss": -26.59441566467285, "global_step": 407988, "epoch": 4915} {"train_loss": -26.778308868408203, "global_step": 407989, "epoch": 4915} {"train_loss": -27.106231689453125, "global_step": 407990, "epoch": 4915} {"train_loss": -26.90997886657715, "global_step": 407991, "epoch": 4915} {"train_loss": -26.67780113220215, "global_step": 407992, "epoch": 4915} {"train_loss": -27.355676651000977, "global_step": 407993, "epoch": 4915} {"train_loss": -26.947803497314453, "global_step": 407994, "epoch": 4915} {"train_loss": -26.989261627197266, "global_step": 407995, "epoch": 4915} {"train_loss": -27.2498722076416, "global_step": 407996, "epoch": 4915} {"train_loss": -27.0711727142334, "global_step": 407997, "epoch": 4915} {"train_loss": -26.498300552368164, "global_step": 407998, "epoch": 4915} {"train_loss": -27.239782333374023, "global_step": 407999, "epoch": 4915} {"train_loss": -26.92962074279785, "global_step": 408000, "epoch": 4915} {"train_loss": -27.329675674438477, "global_step": 408001, "epoch": 4915} {"train_loss": -27.095151901245117, "global_step": 408002, "epoch": 4915} {"train_loss": -26.890745162963867, "global_step": 408003, "epoch": 4915} {"train_loss": -26.926191329956055, "global_step": 408004, "epoch": 4915} {"train_loss": -27.014972686767578, "global_step": 408005, "epoch": 4915} {"train_loss": -26.967620849609375, "global_step": 408006, "epoch": 4915} {"train_loss": -26.303150177001953, "global_step": 408007, "epoch": 4915} {"train_loss": -26.36878776550293, "global_step": 408008, "epoch": 4915} {"train_loss": -26.744531631469727, "global_step": 408009, "epoch": 4915} {"train_loss": -26.59225845336914, "global_step": 408010, "epoch": 4915} {"train_loss": -26.726430892944336, "global_step": 408011, "epoch": 4915} {"train_loss": -26.478116989135742, "global_step": 408012, "epoch": 4915} {"train_loss": -26.737625122070312, "global_step": 408013, "epoch": 4915} {"train_loss": -26.994104385375977, "global_step": 408014, "epoch": 4915} {"train_loss": -27.244617462158203, "global_step": 408015, "epoch": 4915} {"train_loss": -26.596601486206055, "global_step": 408016, "epoch": 4915} {"train_loss": -26.67612075805664, "global_step": 408017, "epoch": 4915} {"train_loss": -26.7225399017334, "global_step": 408018, "epoch": 4915} {"train_loss": -26.647659301757812, "global_step": 408019, "epoch": 4915} {"train_loss": -26.64100456237793, "global_step": 408020, "epoch": 4915} {"train_loss": -26.690692901611328, "global_step": 408021, "epoch": 4915} {"train_loss": -26.984296798706055, "global_step": 408022, "epoch": 4915} {"train_loss": -26.514745712280273, "global_step": 408023, "epoch": 4915} {"train_loss": -26.715784072875977, "global_step": 408024, "epoch": 4915} {"train_loss": -26.65348243713379, "global_step": 408025, "epoch": 4915} {"train_loss": -26.793798446655273, "global_step": 408026, "epoch": 4915} {"train_loss": -26.55281007146261, "global_step": 408027, "epoch": 4915, "val_loss": 6613759.0} {"train_loss": -25.877872467041016, "global_step": 408028, "epoch": 4916} {"train_loss": -25.841047286987305, "global_step": 408029, "epoch": 4916} {"train_loss": -26.11993408203125, "global_step": 408030, "epoch": 4916} {"train_loss": -25.71575355529785, "global_step": 408031, "epoch": 4916} {"train_loss": -25.799001693725586, "global_step": 408032, "epoch": 4916} {"train_loss": -26.219701766967773, "global_step": 408033, "epoch": 4916} {"train_loss": -26.370410919189453, "global_step": 408034, "epoch": 4916} {"train_loss": -26.119775772094727, "global_step": 408035, "epoch": 4916} {"train_loss": -26.10255241394043, "global_step": 408036, "epoch": 4916} {"train_loss": -26.673559188842773, "global_step": 408037, "epoch": 4916} {"train_loss": -26.659015655517578, "global_step": 408038, "epoch": 4916} {"train_loss": -26.14042091369629, "global_step": 408039, "epoch": 4916} {"train_loss": -26.770904541015625, "global_step": 408040, "epoch": 4916} {"train_loss": -26.133625030517578, "global_step": 408041, "epoch": 4916} {"train_loss": -26.395004272460938, "global_step": 408042, "epoch": 4916} {"train_loss": -26.316877365112305, "global_step": 408043, "epoch": 4916} {"train_loss": -26.816781997680664, "global_step": 408044, "epoch": 4916} {"train_loss": -26.7048397064209, "global_step": 408045, "epoch": 4916} {"train_loss": -26.286767959594727, "global_step": 408046, "epoch": 4916} {"train_loss": -26.770368576049805, "global_step": 408047, "epoch": 4916} {"train_loss": -26.746164321899414, "global_step": 408048, "epoch": 4916} {"train_loss": -26.925033569335938, "global_step": 408049, "epoch": 4916} {"train_loss": -26.525354385375977, "global_step": 408050, "epoch": 4916} {"train_loss": -26.52130699157715, "global_step": 408051, "epoch": 4916} {"train_loss": -26.356489181518555, "global_step": 408052, "epoch": 4916} {"train_loss": -26.621444702148438, "global_step": 408053, "epoch": 4916} {"train_loss": -27.20869255065918, "global_step": 408054, "epoch": 4916} {"train_loss": -26.755643844604492, "global_step": 408055, "epoch": 4916} {"train_loss": -26.876630783081055, "global_step": 408056, "epoch": 4916} {"train_loss": -26.496850967407227, "global_step": 408057, "epoch": 4916} {"train_loss": -26.602243423461914, "global_step": 408058, "epoch": 4916} {"train_loss": -26.496326446533203, "global_step": 408059, "epoch": 4916} {"train_loss": -26.59076499938965, "global_step": 408060, "epoch": 4916} {"train_loss": -26.456317901611328, "global_step": 408061, "epoch": 4916} {"train_loss": -26.7067928314209, "global_step": 408062, "epoch": 4916} {"train_loss": -26.91145133972168, "global_step": 408063, "epoch": 4916} {"train_loss": -26.69684410095215, "global_step": 408064, "epoch": 4916} {"train_loss": -26.52945327758789, "global_step": 408065, "epoch": 4916} {"train_loss": -26.704761505126953, "global_step": 408066, "epoch": 4916} {"train_loss": -27.054067611694336, "global_step": 408067, "epoch": 4916} {"train_loss": -26.274763107299805, "global_step": 408068, "epoch": 4916} {"train_loss": -26.517078399658203, "global_step": 408069, "epoch": 4916} {"train_loss": -26.80460548400879, "global_step": 408070, "epoch": 4916} {"train_loss": -26.648706436157227, "global_step": 408071, "epoch": 4916} {"train_loss": -26.62066078186035, "global_step": 408072, "epoch": 4916} {"train_loss": -26.92170524597168, "global_step": 408073, "epoch": 4916} {"train_loss": -26.719388961791992, "global_step": 408074, "epoch": 4916} {"train_loss": -26.377410888671875, "global_step": 408075, "epoch": 4916} {"train_loss": -27.01776123046875, "global_step": 408076, "epoch": 4916} {"train_loss": -26.621984481811523, "global_step": 408077, "epoch": 4916} {"train_loss": -26.644147872924805, "global_step": 408078, "epoch": 4916} {"train_loss": -26.282196044921875, "global_step": 408079, "epoch": 4916} {"train_loss": -26.240497589111328, "global_step": 408080, "epoch": 4916} {"train_loss": -27.093469619750977, "global_step": 408081, "epoch": 4916} {"train_loss": -26.88059425354004, "global_step": 408082, "epoch": 4916} {"train_loss": -26.225177764892578, "global_step": 408083, "epoch": 4916} {"train_loss": -26.51262855529785, "global_step": 408084, "epoch": 4916} {"train_loss": -26.482275009155273, "global_step": 408085, "epoch": 4916} {"train_loss": -26.4929256439209, "global_step": 408086, "epoch": 4916} {"train_loss": -26.58949089050293, "global_step": 408087, "epoch": 4916} {"train_loss": -26.617237091064453, "global_step": 408088, "epoch": 4916} {"train_loss": -26.471372604370117, "global_step": 408089, "epoch": 4916} {"train_loss": -26.873615264892578, "global_step": 408090, "epoch": 4916} {"train_loss": -26.947309494018555, "global_step": 408091, "epoch": 4916} {"train_loss": -26.855268478393555, "global_step": 408092, "epoch": 4916} {"train_loss": -26.640485763549805, "global_step": 408093, "epoch": 4916} {"train_loss": -26.499103546142578, "global_step": 408094, "epoch": 4916} {"train_loss": -26.822973251342773, "global_step": 408095, "epoch": 4916} {"train_loss": -26.67278480529785, "global_step": 408096, "epoch": 4916} {"train_loss": -26.29193687438965, "global_step": 408097, "epoch": 4916} {"train_loss": -26.623212814331055, "global_step": 408098, "epoch": 4916} {"train_loss": -26.846710205078125, "global_step": 408099, "epoch": 4916} {"train_loss": -26.325464248657227, "global_step": 408100, "epoch": 4916} {"train_loss": -26.58391761779785, "global_step": 408101, "epoch": 4916} {"train_loss": -26.392593383789062, "global_step": 408102, "epoch": 4916} {"train_loss": -26.7750301361084, "global_step": 408103, "epoch": 4916} {"train_loss": -26.235824584960938, "global_step": 408104, "epoch": 4916} {"train_loss": -26.769865036010742, "global_step": 408105, "epoch": 4916} {"train_loss": -26.83765983581543, "global_step": 408106, "epoch": 4916} {"train_loss": -26.59916114807129, "global_step": 408107, "epoch": 4916} {"train_loss": -26.76381492614746, "global_step": 408108, "epoch": 4916} {"train_loss": -26.479108810424805, "global_step": 408109, "epoch": 4916} {"train_loss": -26.54709489661527, "global_step": 408110, "epoch": 4916, "val_loss": 6749442.5} {"train_loss": -26.071226119995117, "global_step": 408111, "epoch": 4917} {"train_loss": -26.00136375427246, "global_step": 408112, "epoch": 4917} {"train_loss": -26.20598793029785, "global_step": 408113, "epoch": 4917} {"train_loss": -26.278629302978516, "global_step": 408114, "epoch": 4917} {"train_loss": -26.01215934753418, "global_step": 408115, "epoch": 4917} {"train_loss": -26.378259658813477, "global_step": 408116, "epoch": 4917} {"train_loss": -25.82900047302246, "global_step": 408117, "epoch": 4917} {"train_loss": -26.14227294921875, "global_step": 408118, "epoch": 4917} {"train_loss": -25.690290451049805, "global_step": 408119, "epoch": 4917} {"train_loss": -26.06305503845215, "global_step": 408120, "epoch": 4917} {"train_loss": -26.060102462768555, "global_step": 408121, "epoch": 4917} {"train_loss": -25.868268966674805, "global_step": 408122, "epoch": 4917} {"train_loss": -26.418256759643555, "global_step": 408123, "epoch": 4917} {"train_loss": -26.574295043945312, "global_step": 408124, "epoch": 4917} {"train_loss": -26.009235382080078, "global_step": 408125, "epoch": 4917} {"train_loss": -26.317724227905273, "global_step": 408126, "epoch": 4917} {"train_loss": -25.989059448242188, "global_step": 408127, "epoch": 4917} {"train_loss": -26.20159912109375, "global_step": 408128, "epoch": 4917} {"train_loss": -26.750280380249023, "global_step": 408129, "epoch": 4917} {"train_loss": -26.450016021728516, "global_step": 408130, "epoch": 4917} {"train_loss": -26.540393829345703, "global_step": 408131, "epoch": 4917} {"train_loss": -26.897703170776367, "global_step": 408132, "epoch": 4917} {"train_loss": -26.605152130126953, "global_step": 408133, "epoch": 4917} {"train_loss": -26.75628089904785, "global_step": 408134, "epoch": 4917} {"train_loss": -26.502248764038086, "global_step": 408135, "epoch": 4917} {"train_loss": -26.646778106689453, "global_step": 408136, "epoch": 4917} {"train_loss": -26.468358993530273, "global_step": 408137, "epoch": 4917} {"train_loss": -26.676984786987305, "global_step": 408138, "epoch": 4917} {"train_loss": -26.35610008239746, "global_step": 408139, "epoch": 4917} {"train_loss": -26.56867027282715, "global_step": 408140, "epoch": 4917} {"train_loss": -26.651071548461914, "global_step": 408141, "epoch": 4917} {"train_loss": -26.772541046142578, "global_step": 408142, "epoch": 4917} {"train_loss": -26.502893447875977, "global_step": 408143, "epoch": 4917} {"train_loss": -26.741596221923828, "global_step": 408144, "epoch": 4917} {"train_loss": -26.44182777404785, "global_step": 408145, "epoch": 4917} {"train_loss": -27.09442710876465, "global_step": 408146, "epoch": 4917} {"train_loss": -26.93634033203125, "global_step": 408147, "epoch": 4917} {"train_loss": -26.593189239501953, "global_step": 408148, "epoch": 4917} {"train_loss": -26.941144943237305, "global_step": 408149, "epoch": 4917} {"train_loss": -27.01405143737793, "global_step": 408150, "epoch": 4917} {"train_loss": -26.855642318725586, "global_step": 408151, "epoch": 4917} {"train_loss": -27.151174545288086, "global_step": 408152, "epoch": 4917} {"train_loss": -26.972476959228516, "global_step": 408153, "epoch": 4917} {"train_loss": -26.97725486755371, "global_step": 408154, "epoch": 4917} {"train_loss": -26.600229263305664, "global_step": 408155, "epoch": 4917} {"train_loss": -27.036584854125977, "global_step": 408156, "epoch": 4917} {"train_loss": -26.812864303588867, "global_step": 408157, "epoch": 4917} {"train_loss": -26.963733673095703, "global_step": 408158, "epoch": 4917} {"train_loss": -26.626453399658203, "global_step": 408159, "epoch": 4917} {"train_loss": -26.365365982055664, "global_step": 408160, "epoch": 4917} {"train_loss": -26.688434600830078, "global_step": 408161, "epoch": 4917} {"train_loss": -26.821807861328125, "global_step": 408162, "epoch": 4917} {"train_loss": -26.523283004760742, "global_step": 408163, "epoch": 4917} {"train_loss": -26.369123458862305, "global_step": 408164, "epoch": 4917} {"train_loss": -26.34397315979004, "global_step": 408165, "epoch": 4917} {"train_loss": -27.07342529296875, "global_step": 408166, "epoch": 4917} {"train_loss": -26.711685180664062, "global_step": 408167, "epoch": 4917} {"train_loss": -26.4737491607666, "global_step": 408168, "epoch": 4917} {"train_loss": -26.79485511779785, "global_step": 408169, "epoch": 4917} {"train_loss": -26.639480590820312, "global_step": 408170, "epoch": 4917} {"train_loss": -26.480661392211914, "global_step": 408171, "epoch": 4917} {"train_loss": -26.34697914123535, "global_step": 408172, "epoch": 4917} {"train_loss": -26.456878662109375, "global_step": 408173, "epoch": 4917} {"train_loss": -26.7724609375, "global_step": 408174, "epoch": 4917} {"train_loss": -26.368732452392578, "global_step": 408175, "epoch": 4917} {"train_loss": -26.363183975219727, "global_step": 408176, "epoch": 4917} {"train_loss": -26.681299209594727, "global_step": 408177, "epoch": 4917} {"train_loss": -26.65045166015625, "global_step": 408178, "epoch": 4917} {"train_loss": -26.700551986694336, "global_step": 408179, "epoch": 4917} {"train_loss": -26.596220016479492, "global_step": 408180, "epoch": 4917} {"train_loss": -26.69833755493164, "global_step": 408181, "epoch": 4917} {"train_loss": -27.069177627563477, "global_step": 408182, "epoch": 4917} {"train_loss": -26.4126033782959, "global_step": 408183, "epoch": 4917} {"train_loss": -26.675342559814453, "global_step": 408184, "epoch": 4917} {"train_loss": -26.502866744995117, "global_step": 408185, "epoch": 4917} {"train_loss": -26.970911026000977, "global_step": 408186, "epoch": 4917} {"train_loss": -26.798355102539062, "global_step": 408187, "epoch": 4917} {"train_loss": -26.599973678588867, "global_step": 408188, "epoch": 4917} {"train_loss": -26.2307071685791, "global_step": 408189, "epoch": 4917} {"train_loss": -26.79802894592285, "global_step": 408190, "epoch": 4917} {"train_loss": -26.912006378173828, "global_step": 408191, "epoch": 4917} {"train_loss": -26.77442741394043, "global_step": 408192, "epoch": 4917} {"train_loss": -26.54724711682423, "global_step": 408193, "epoch": 4917, "val_loss": 6743150.0} {"train_loss": -26.45405387878418, "global_step": 408194, "epoch": 4918} {"train_loss": -26.261627197265625, "global_step": 408195, "epoch": 4918} {"train_loss": -26.307727813720703, "global_step": 408196, "epoch": 4918} {"train_loss": -26.005176544189453, "global_step": 408197, "epoch": 4918} {"train_loss": -26.31702995300293, "global_step": 408198, "epoch": 4918} {"train_loss": -26.1354923248291, "global_step": 408199, "epoch": 4918} {"train_loss": -26.642736434936523, "global_step": 408200, "epoch": 4918} {"train_loss": -26.4710636138916, "global_step": 408201, "epoch": 4918} {"train_loss": -26.427335739135742, "global_step": 408202, "epoch": 4918} {"train_loss": -26.634687423706055, "global_step": 408203, "epoch": 4918} {"train_loss": -26.632312774658203, "global_step": 408204, "epoch": 4918} {"train_loss": -26.642053604125977, "global_step": 408205, "epoch": 4918} {"train_loss": -26.537586212158203, "global_step": 408206, "epoch": 4918} {"train_loss": -26.338220596313477, "global_step": 408207, "epoch": 4918} {"train_loss": -26.504470825195312, "global_step": 408208, "epoch": 4918} {"train_loss": -26.709020614624023, "global_step": 408209, "epoch": 4918} {"train_loss": -26.812255859375, "global_step": 408210, "epoch": 4918} {"train_loss": -26.474531173706055, "global_step": 408211, "epoch": 4918} {"train_loss": -26.723346710205078, "global_step": 408212, "epoch": 4918} {"train_loss": -26.744409561157227, "global_step": 408213, "epoch": 4918} {"train_loss": -26.301105499267578, "global_step": 408214, "epoch": 4918} {"train_loss": -26.48347282409668, "global_step": 408215, "epoch": 4918} {"train_loss": -27.020360946655273, "global_step": 408216, "epoch": 4918} {"train_loss": -26.09446144104004, "global_step": 408217, "epoch": 4918} {"train_loss": -26.609601974487305, "global_step": 408218, "epoch": 4918} {"train_loss": -26.697370529174805, "global_step": 408219, "epoch": 4918} {"train_loss": -26.67164421081543, "global_step": 408220, "epoch": 4918} {"train_loss": -26.981369018554688, "global_step": 408221, "epoch": 4918} {"train_loss": -26.352344512939453, "global_step": 408222, "epoch": 4918} {"train_loss": -27.002073287963867, "global_step": 408223, "epoch": 4918} {"train_loss": -26.9251766204834, "global_step": 408224, "epoch": 4918} {"train_loss": -26.442121505737305, "global_step": 408225, "epoch": 4918} {"train_loss": -26.953323364257812, "global_step": 408226, "epoch": 4918} {"train_loss": -26.77894401550293, "global_step": 408227, "epoch": 4918} {"train_loss": -26.90106773376465, "global_step": 408228, "epoch": 4918} {"train_loss": -26.66534423828125, "global_step": 408229, "epoch": 4918} {"train_loss": -26.847339630126953, "global_step": 408230, "epoch": 4918} {"train_loss": -27.01056480407715, "global_step": 408231, "epoch": 4918} {"train_loss": -26.855817794799805, "global_step": 408232, "epoch": 4918} {"train_loss": -26.69540786743164, "global_step": 408233, "epoch": 4918} {"train_loss": -26.690893173217773, "global_step": 408234, "epoch": 4918} {"train_loss": -26.823719024658203, "global_step": 408235, "epoch": 4918} {"train_loss": -26.759918212890625, "global_step": 408236, "epoch": 4918} {"train_loss": -26.8475341796875, "global_step": 408237, "epoch": 4918} {"train_loss": -26.88534927368164, "global_step": 408238, "epoch": 4918} {"train_loss": -26.932010650634766, "global_step": 408239, "epoch": 4918} {"train_loss": -26.655109405517578, "global_step": 408240, "epoch": 4918} {"train_loss": -26.69083595275879, "global_step": 408241, "epoch": 4918} {"train_loss": -26.452733993530273, "global_step": 408242, "epoch": 4918} {"train_loss": -26.90223503112793, "global_step": 408243, "epoch": 4918} {"train_loss": -26.7031192779541, "global_step": 408244, "epoch": 4918} {"train_loss": -26.558841705322266, "global_step": 408245, "epoch": 4918} {"train_loss": -26.700048446655273, "global_step": 408246, "epoch": 4918} {"train_loss": -26.983373641967773, "global_step": 408247, "epoch": 4918} {"train_loss": -26.622983932495117, "global_step": 408248, "epoch": 4918} {"train_loss": -26.837072372436523, "global_step": 408249, "epoch": 4918} {"train_loss": -26.523883819580078, "global_step": 408250, "epoch": 4918} {"train_loss": -26.670608520507812, "global_step": 408251, "epoch": 4918} {"train_loss": -26.8333740234375, "global_step": 408252, "epoch": 4918} {"train_loss": -26.531354904174805, "global_step": 408253, "epoch": 4918} {"train_loss": -26.609159469604492, "global_step": 408254, "epoch": 4918} {"train_loss": -26.406888961791992, "global_step": 408255, "epoch": 4918} {"train_loss": -26.403966903686523, "global_step": 408256, "epoch": 4918} {"train_loss": -27.211435317993164, "global_step": 408257, "epoch": 4918} {"train_loss": -26.679492950439453, "global_step": 408258, "epoch": 4918} {"train_loss": -26.299718856811523, "global_step": 408259, "epoch": 4918} {"train_loss": -26.32050132751465, "global_step": 408260, "epoch": 4918} {"train_loss": -26.892791748046875, "global_step": 408261, "epoch": 4918} {"train_loss": -26.649417877197266, "global_step": 408262, "epoch": 4918} {"train_loss": -26.7315616607666, "global_step": 408263, "epoch": 4918} {"train_loss": -26.65020179748535, "global_step": 408264, "epoch": 4918} {"train_loss": -26.761194229125977, "global_step": 408265, "epoch": 4918} {"train_loss": -26.669095993041992, "global_step": 408266, "epoch": 4918} {"train_loss": -26.48809814453125, "global_step": 408267, "epoch": 4918} {"train_loss": -26.93723487854004, "global_step": 408268, "epoch": 4918} {"train_loss": -26.925268173217773, "global_step": 408269, "epoch": 4918} {"train_loss": -26.628324508666992, "global_step": 408270, "epoch": 4918} {"train_loss": -26.55742835998535, "global_step": 408271, "epoch": 4918} {"train_loss": -26.59461784362793, "global_step": 408272, "epoch": 4918} {"train_loss": -26.6911678314209, "global_step": 408273, "epoch": 4918} {"train_loss": -26.852237701416016, "global_step": 408274, "epoch": 4918} {"train_loss": -26.725692749023438, "global_step": 408275, "epoch": 4918} {"train_loss": -26.656552739890223, "global_step": 408276, "epoch": 4918, "val_loss": 6814311.0} {"train_loss": -25.766714096069336, "global_step": 408277, "epoch": 4919} {"train_loss": -25.362546920776367, "global_step": 408278, "epoch": 4919} {"train_loss": -26.194904327392578, "global_step": 408279, "epoch": 4919} {"train_loss": -25.920730590820312, "global_step": 408280, "epoch": 4919} {"train_loss": -25.7127628326416, "global_step": 408281, "epoch": 4919} {"train_loss": -25.990478515625, "global_step": 408282, "epoch": 4919} {"train_loss": -25.52347183227539, "global_step": 408283, "epoch": 4919} {"train_loss": -26.165918350219727, "global_step": 408284, "epoch": 4919} {"train_loss": -25.905364990234375, "global_step": 408285, "epoch": 4919} {"train_loss": -25.689163208007812, "global_step": 408286, "epoch": 4919} {"train_loss": -25.5037899017334, "global_step": 408287, "epoch": 4919} {"train_loss": -26.167505264282227, "global_step": 408288, "epoch": 4919} {"train_loss": -25.91275405883789, "global_step": 408289, "epoch": 4919} {"train_loss": -25.9307804107666, "global_step": 408290, "epoch": 4919} {"train_loss": -26.166799545288086, "global_step": 408291, "epoch": 4919} {"train_loss": -26.2766056060791, "global_step": 408292, "epoch": 4919} {"train_loss": -26.057043075561523, "global_step": 408293, "epoch": 4919} {"train_loss": -26.3212947845459, "global_step": 408294, "epoch": 4919} {"train_loss": -26.331418991088867, "global_step": 408295, "epoch": 4919} {"train_loss": -26.136327743530273, "global_step": 408296, "epoch": 4919} {"train_loss": -26.193700790405273, "global_step": 408297, "epoch": 4919} {"train_loss": -26.401281356811523, "global_step": 408298, "epoch": 4919} {"train_loss": -26.520954132080078, "global_step": 408299, "epoch": 4919} {"train_loss": -26.430145263671875, "global_step": 408300, "epoch": 4919} {"train_loss": -26.284780502319336, "global_step": 408301, "epoch": 4919} {"train_loss": -26.472187042236328, "global_step": 408302, "epoch": 4919} {"train_loss": -26.511564254760742, "global_step": 408303, "epoch": 4919} {"train_loss": -26.67999267578125, "global_step": 408304, "epoch": 4919} {"train_loss": -26.57746696472168, "global_step": 408305, "epoch": 4919} {"train_loss": -25.95931053161621, "global_step": 408306, "epoch": 4919} {"train_loss": -26.28498649597168, "global_step": 408307, "epoch": 4919} {"train_loss": -26.504255294799805, "global_step": 408308, "epoch": 4919} {"train_loss": -26.532684326171875, "global_step": 408309, "epoch": 4919} {"train_loss": -26.47736930847168, "global_step": 408310, "epoch": 4919} {"train_loss": -26.497486114501953, "global_step": 408311, "epoch": 4919} {"train_loss": -26.335790634155273, "global_step": 408312, "epoch": 4919} {"train_loss": -27.02613639831543, "global_step": 408313, "epoch": 4919} {"train_loss": -26.25762367248535, "global_step": 408314, "epoch": 4919} {"train_loss": -26.70718765258789, "global_step": 408315, "epoch": 4919} {"train_loss": -26.73933219909668, "global_step": 408316, "epoch": 4919} {"train_loss": -27.075956344604492, "global_step": 408317, "epoch": 4919} {"train_loss": -26.67164421081543, "global_step": 408318, "epoch": 4919} {"train_loss": -26.60260009765625, "global_step": 408319, "epoch": 4919} {"train_loss": -26.740110397338867, "global_step": 408320, "epoch": 4919} {"train_loss": -26.56817054748535, "global_step": 408321, "epoch": 4919} {"train_loss": -26.517881393432617, "global_step": 408322, "epoch": 4919} {"train_loss": -26.953989028930664, "global_step": 408323, "epoch": 4919} {"train_loss": -26.718286514282227, "global_step": 408324, "epoch": 4919} {"train_loss": -26.8195858001709, "global_step": 408325, "epoch": 4919} {"train_loss": -26.72040367126465, "global_step": 408326, "epoch": 4919} {"train_loss": -26.859689712524414, "global_step": 408327, "epoch": 4919} {"train_loss": -27.0469970703125, "global_step": 408328, "epoch": 4919} {"train_loss": -26.875940322875977, "global_step": 408329, "epoch": 4919} {"train_loss": -26.417951583862305, "global_step": 408330, "epoch": 4919} {"train_loss": -26.68426513671875, "global_step": 408331, "epoch": 4919} {"train_loss": -26.456012725830078, "global_step": 408332, "epoch": 4919} {"train_loss": -26.779443740844727, "global_step": 408333, "epoch": 4919} {"train_loss": -26.630802154541016, "global_step": 408334, "epoch": 4919} {"train_loss": -26.737812042236328, "global_step": 408335, "epoch": 4919} {"train_loss": -26.633291244506836, "global_step": 408336, "epoch": 4919} {"train_loss": -26.929128646850586, "global_step": 408337, "epoch": 4919} {"train_loss": -26.737171173095703, "global_step": 408338, "epoch": 4919} {"train_loss": -26.71462059020996, "global_step": 408339, "epoch": 4919} {"train_loss": -26.849597930908203, "global_step": 408340, "epoch": 4919} {"train_loss": -26.558639526367188, "global_step": 408341, "epoch": 4919} {"train_loss": -26.45282554626465, "global_step": 408342, "epoch": 4919} {"train_loss": -26.54190444946289, "global_step": 408343, "epoch": 4919} {"train_loss": -26.63446044921875, "global_step": 408344, "epoch": 4919} {"train_loss": -26.829761505126953, "global_step": 408345, "epoch": 4919} {"train_loss": -26.77669334411621, "global_step": 408346, "epoch": 4919} {"train_loss": -26.407245635986328, "global_step": 408347, "epoch": 4919} {"train_loss": -26.95926284790039, "global_step": 408348, "epoch": 4919} {"train_loss": -26.5353946685791, "global_step": 408349, "epoch": 4919} {"train_loss": -26.767257690429688, "global_step": 408350, "epoch": 4919} {"train_loss": -26.735370635986328, "global_step": 408351, "epoch": 4919} {"train_loss": -26.6340274810791, "global_step": 408352, "epoch": 4919} {"train_loss": -27.129230499267578, "global_step": 408353, "epoch": 4919} {"train_loss": -26.49674415588379, "global_step": 408354, "epoch": 4919} {"train_loss": -26.609289169311523, "global_step": 408355, "epoch": 4919} {"train_loss": -26.71803092956543, "global_step": 408356, "epoch": 4919} {"train_loss": -26.94333839416504, "global_step": 408357, "epoch": 4919} {"train_loss": -26.6551570892334, "global_step": 408358, "epoch": 4919} {"train_loss": -26.46997541404632, "global_step": 408359, "epoch": 4919, "val_loss": 6825665.0} {"train_loss": -26.22307777404785, "global_step": 408360, "epoch": 4920} {"train_loss": -26.033926010131836, "global_step": 408361, "epoch": 4920} {"train_loss": -26.333906173706055, "global_step": 408362, "epoch": 4920} {"train_loss": -26.17236328125, "global_step": 408363, "epoch": 4920} {"train_loss": -26.824054718017578, "global_step": 408364, "epoch": 4920} {"train_loss": -26.20533561706543, "global_step": 408365, "epoch": 4920} {"train_loss": -26.679067611694336, "global_step": 408366, "epoch": 4920} {"train_loss": -26.5294189453125, "global_step": 408367, "epoch": 4920} {"train_loss": -25.974506378173828, "global_step": 408368, "epoch": 4920} {"train_loss": -26.405324935913086, "global_step": 408369, "epoch": 4920} {"train_loss": -26.599348068237305, "global_step": 408370, "epoch": 4920} {"train_loss": -26.66291618347168, "global_step": 408371, "epoch": 4920} {"train_loss": -26.48988151550293, "global_step": 408372, "epoch": 4920} {"train_loss": -26.35210609436035, "global_step": 408373, "epoch": 4920} {"train_loss": -26.64948081970215, "global_step": 408374, "epoch": 4920} {"train_loss": -26.640417098999023, "global_step": 408375, "epoch": 4920} {"train_loss": -26.584638595581055, "global_step": 408376, "epoch": 4920} {"train_loss": -26.866962432861328, "global_step": 408377, "epoch": 4920} {"train_loss": -26.81463050842285, "global_step": 408378, "epoch": 4920} {"train_loss": -26.421354293823242, "global_step": 408379, "epoch": 4920} {"train_loss": -26.740955352783203, "global_step": 408380, "epoch": 4920} {"train_loss": -26.734323501586914, "global_step": 408381, "epoch": 4920} {"train_loss": -26.741992950439453, "global_step": 408382, "epoch": 4920} {"train_loss": -26.83405876159668, "global_step": 408383, "epoch": 4920} {"train_loss": -26.81959342956543, "global_step": 408384, "epoch": 4920} {"train_loss": -26.831262588500977, "global_step": 408385, "epoch": 4920} {"train_loss": -26.981725692749023, "global_step": 408386, "epoch": 4920} {"train_loss": -26.853134155273438, "global_step": 408387, "epoch": 4920} {"train_loss": -26.72638511657715, "global_step": 408388, "epoch": 4920} {"train_loss": -26.716840744018555, "global_step": 408389, "epoch": 4920} {"train_loss": -26.808629989624023, "global_step": 408390, "epoch": 4920} {"train_loss": -26.70088005065918, "global_step": 408391, "epoch": 4920} {"train_loss": -26.581424713134766, "global_step": 408392, "epoch": 4920} {"train_loss": -26.678918838500977, "global_step": 408393, "epoch": 4920} {"train_loss": -26.85627555847168, "global_step": 408394, "epoch": 4920} {"train_loss": -26.687576293945312, "global_step": 408395, "epoch": 4920} {"train_loss": -26.73970603942871, "global_step": 408396, "epoch": 4920} {"train_loss": -26.700895309448242, "global_step": 408397, "epoch": 4920} {"train_loss": -26.846149444580078, "global_step": 408398, "epoch": 4920} {"train_loss": -26.866979598999023, "global_step": 408399, "epoch": 4920} {"train_loss": -26.704431533813477, "global_step": 408400, "epoch": 4920} {"train_loss": -27.08194923400879, "global_step": 408401, "epoch": 4920} {"train_loss": -27.063114166259766, "global_step": 408402, "epoch": 4920} {"train_loss": -26.609731674194336, "global_step": 408403, "epoch": 4920} {"train_loss": -26.42213249206543, "global_step": 408404, "epoch": 4920} {"train_loss": -26.233381271362305, "global_step": 408405, "epoch": 4920} {"train_loss": -26.795576095581055, "global_step": 408406, "epoch": 4920} {"train_loss": -26.53021812438965, "global_step": 408407, "epoch": 4920} {"train_loss": -26.858407974243164, "global_step": 408408, "epoch": 4920} {"train_loss": -26.80499267578125, "global_step": 408409, "epoch": 4920} {"train_loss": -26.70853614807129, "global_step": 408410, "epoch": 4920} {"train_loss": -26.15522575378418, "global_step": 408411, "epoch": 4920} {"train_loss": -26.176956176757812, "global_step": 408412, "epoch": 4920} {"train_loss": -26.535720825195312, "global_step": 408413, "epoch": 4920} {"train_loss": -26.552722930908203, "global_step": 408414, "epoch": 4920} {"train_loss": -26.89898681640625, "global_step": 408415, "epoch": 4920} {"train_loss": -26.676288604736328, "global_step": 408416, "epoch": 4920} {"train_loss": -27.11762046813965, "global_step": 408417, "epoch": 4920} {"train_loss": -26.568334579467773, "global_step": 408418, "epoch": 4920} {"train_loss": -26.672149658203125, "global_step": 408419, "epoch": 4920} {"train_loss": -26.311222076416016, "global_step": 408420, "epoch": 4920} {"train_loss": -26.797910690307617, "global_step": 408421, "epoch": 4920} {"train_loss": -26.49818229675293, "global_step": 408422, "epoch": 4920} {"train_loss": -26.411279678344727, "global_step": 408423, "epoch": 4920} {"train_loss": -26.585296630859375, "global_step": 408424, "epoch": 4920} {"train_loss": -26.60711097717285, "global_step": 408425, "epoch": 4920} {"train_loss": -26.671432495117188, "global_step": 408426, "epoch": 4920} {"train_loss": -26.464221954345703, "global_step": 408427, "epoch": 4920} {"train_loss": -26.923383712768555, "global_step": 408428, "epoch": 4920} {"train_loss": -26.789499282836914, "global_step": 408429, "epoch": 4920} {"train_loss": -26.466827392578125, "global_step": 408430, "epoch": 4920} {"train_loss": -26.3956298828125, "global_step": 408431, "epoch": 4920} {"train_loss": -26.84649658203125, "global_step": 408432, "epoch": 4920} {"train_loss": -26.894317626953125, "global_step": 408433, "epoch": 4920} {"train_loss": -26.71441650390625, "global_step": 408434, "epoch": 4920} {"train_loss": -26.747699737548828, "global_step": 408435, "epoch": 4920} {"train_loss": -26.721649169921875, "global_step": 408436, "epoch": 4920} {"train_loss": -27.1116943359375, "global_step": 408437, "epoch": 4920} {"train_loss": -26.853973388671875, "global_step": 408438, "epoch": 4920} {"train_loss": -27.007638931274414, "global_step": 408439, "epoch": 4920} {"train_loss": -26.70245933532715, "global_step": 408440, "epoch": 4920} {"train_loss": -26.479084014892578, "global_step": 408441, "epoch": 4920} {"train_loss": -26.65566619045763, "global_step": 408442, "epoch": 4920, "val_loss": 6769004.0} {"train_loss": -26.439218521118164, "global_step": 408443, "epoch": 4921} {"train_loss": -25.98883056640625, "global_step": 408444, "epoch": 4921} {"train_loss": -26.05674171447754, "global_step": 408445, "epoch": 4921} {"train_loss": -25.985082626342773, "global_step": 408446, "epoch": 4921} {"train_loss": -26.677648544311523, "global_step": 408447, "epoch": 4921} {"train_loss": -26.32199478149414, "global_step": 408448, "epoch": 4921} {"train_loss": -26.473173141479492, "global_step": 408449, "epoch": 4921} {"train_loss": -26.049901962280273, "global_step": 408450, "epoch": 4921} {"train_loss": -26.332319259643555, "global_step": 408451, "epoch": 4921} {"train_loss": -26.514514923095703, "global_step": 408452, "epoch": 4921} {"train_loss": -26.2755184173584, "global_step": 408453, "epoch": 4921} {"train_loss": -26.5013484954834, "global_step": 408454, "epoch": 4921} {"train_loss": -26.244409561157227, "global_step": 408455, "epoch": 4921} {"train_loss": -26.643640518188477, "global_step": 408456, "epoch": 4921} {"train_loss": -26.167160034179688, "global_step": 408457, "epoch": 4921} {"train_loss": -26.60402488708496, "global_step": 408458, "epoch": 4921} {"train_loss": -26.346261978149414, "global_step": 408459, "epoch": 4921} {"train_loss": -26.44891929626465, "global_step": 408460, "epoch": 4921} {"train_loss": -26.67303466796875, "global_step": 408461, "epoch": 4921} {"train_loss": -26.574649810791016, "global_step": 408462, "epoch": 4921} {"train_loss": -26.651397705078125, "global_step": 408463, "epoch": 4921} {"train_loss": -26.449462890625, "global_step": 408464, "epoch": 4921} {"train_loss": -26.606536865234375, "global_step": 408465, "epoch": 4921} {"train_loss": -26.348419189453125, "global_step": 408466, "epoch": 4921} {"train_loss": -26.667724609375, "global_step": 408467, "epoch": 4921} {"train_loss": -26.431869506835938, "global_step": 408468, "epoch": 4921} {"train_loss": -26.8723087310791, "global_step": 408469, "epoch": 4921} {"train_loss": -26.426511764526367, "global_step": 408470, "epoch": 4921} {"train_loss": -27.119857788085938, "global_step": 408471, "epoch": 4921} {"train_loss": -26.897689819335938, "global_step": 408472, "epoch": 4921} {"train_loss": -26.356992721557617, "global_step": 408473, "epoch": 4921} {"train_loss": -26.7669620513916, "global_step": 408474, "epoch": 4921} {"train_loss": -26.64076805114746, "global_step": 408475, "epoch": 4921} {"train_loss": -26.645292282104492, "global_step": 408476, "epoch": 4921} {"train_loss": -26.755346298217773, "global_step": 408477, "epoch": 4921} {"train_loss": -27.16309928894043, "global_step": 408478, "epoch": 4921} {"train_loss": -26.675628662109375, "global_step": 408479, "epoch": 4921} {"train_loss": -26.51304054260254, "global_step": 408480, "epoch": 4921} {"train_loss": -26.258625030517578, "global_step": 408481, "epoch": 4921} {"train_loss": -26.390974044799805, "global_step": 408482, "epoch": 4921} {"train_loss": -26.62312126159668, "global_step": 408483, "epoch": 4921} {"train_loss": -26.68391227722168, "global_step": 408484, "epoch": 4921} {"train_loss": -26.928068161010742, "global_step": 408485, "epoch": 4921} {"train_loss": -26.599811553955078, "global_step": 408486, "epoch": 4921} {"train_loss": -26.6464786529541, "global_step": 408487, "epoch": 4921} {"train_loss": -26.296701431274414, "global_step": 408488, "epoch": 4921} {"train_loss": -26.663665771484375, "global_step": 408489, "epoch": 4921} {"train_loss": -26.498632431030273, "global_step": 408490, "epoch": 4921} {"train_loss": -26.491308212280273, "global_step": 408491, "epoch": 4921} {"train_loss": -26.493982315063477, "global_step": 408492, "epoch": 4921} {"train_loss": -26.44010353088379, "global_step": 408493, "epoch": 4921} {"train_loss": -26.635391235351562, "global_step": 408494, "epoch": 4921} {"train_loss": -26.175704956054688, "global_step": 408495, "epoch": 4921} {"train_loss": -26.750192642211914, "global_step": 408496, "epoch": 4921} {"train_loss": -26.810888290405273, "global_step": 408497, "epoch": 4921} {"train_loss": -26.723407745361328, "global_step": 408498, "epoch": 4921} {"train_loss": -26.47307777404785, "global_step": 408499, "epoch": 4921} {"train_loss": -26.7186279296875, "global_step": 408500, "epoch": 4921} {"train_loss": -26.596277236938477, "global_step": 408501, "epoch": 4921} {"train_loss": -26.7905330657959, "global_step": 408502, "epoch": 4921} {"train_loss": -26.949127197265625, "global_step": 408503, "epoch": 4921} {"train_loss": -26.916400909423828, "global_step": 408504, "epoch": 4921} {"train_loss": -26.80486488342285, "global_step": 408505, "epoch": 4921} {"train_loss": -27.02438735961914, "global_step": 408506, "epoch": 4921} {"train_loss": -26.55866813659668, "global_step": 408507, "epoch": 4921} {"train_loss": -26.769031524658203, "global_step": 408508, "epoch": 4921} {"train_loss": -27.046247482299805, "global_step": 408509, "epoch": 4921} {"train_loss": -26.623310089111328, "global_step": 408510, "epoch": 4921} {"train_loss": -26.542795181274414, "global_step": 408511, "epoch": 4921} {"train_loss": -26.808454513549805, "global_step": 408512, "epoch": 4921} {"train_loss": -26.7520751953125, "global_step": 408513, "epoch": 4921} {"train_loss": -26.887969970703125, "global_step": 408514, "epoch": 4921} {"train_loss": -26.445215225219727, "global_step": 408515, "epoch": 4921} {"train_loss": -26.321149826049805, "global_step": 408516, "epoch": 4921} {"train_loss": -26.848621368408203, "global_step": 408517, "epoch": 4921} {"train_loss": -26.5618896484375, "global_step": 408518, "epoch": 4921} {"train_loss": -26.375646591186523, "global_step": 408519, "epoch": 4921} {"train_loss": -26.87308120727539, "global_step": 408520, "epoch": 4921} {"train_loss": -26.695669174194336, "global_step": 408521, "epoch": 4921} {"train_loss": -26.573028564453125, "global_step": 408522, "epoch": 4921} {"train_loss": -26.716938018798828, "global_step": 408523, "epoch": 4921} {"train_loss": -26.87628173828125, "global_step": 408524, "epoch": 4921} {"train_loss": -26.587659077471997, "global_step": 408525, "epoch": 4921, "val_loss": 6700493.0} {"train_loss": -26.434415817260742, "global_step": 408526, "epoch": 4922} {"train_loss": -26.222003936767578, "global_step": 408527, "epoch": 4922} {"train_loss": -26.55319595336914, "global_step": 408528, "epoch": 4922} {"train_loss": -26.101917266845703, "global_step": 408529, "epoch": 4922} {"train_loss": -25.873823165893555, "global_step": 408530, "epoch": 4922} {"train_loss": -26.6782169342041, "global_step": 408531, "epoch": 4922} {"train_loss": -25.986738204956055, "global_step": 408532, "epoch": 4922} {"train_loss": -26.14369010925293, "global_step": 408533, "epoch": 4922} {"train_loss": -26.061370849609375, "global_step": 408534, "epoch": 4922} {"train_loss": -26.430078506469727, "global_step": 408535, "epoch": 4922} {"train_loss": -25.988439559936523, "global_step": 408536, "epoch": 4922} {"train_loss": -26.80280876159668, "global_step": 408537, "epoch": 4922} {"train_loss": -26.529224395751953, "global_step": 408538, "epoch": 4922} {"train_loss": -26.09407615661621, "global_step": 408539, "epoch": 4922} {"train_loss": -26.389310836791992, "global_step": 408540, "epoch": 4922} {"train_loss": -26.908422470092773, "global_step": 408541, "epoch": 4922} {"train_loss": -26.563711166381836, "global_step": 408542, "epoch": 4922} {"train_loss": -26.142553329467773, "global_step": 408543, "epoch": 4922} {"train_loss": -26.54572868347168, "global_step": 408544, "epoch": 4922} {"train_loss": -26.692407608032227, "global_step": 408545, "epoch": 4922} {"train_loss": -26.253753662109375, "global_step": 408546, "epoch": 4922} {"train_loss": -26.470624923706055, "global_step": 408547, "epoch": 4922} {"train_loss": -26.83668327331543, "global_step": 408548, "epoch": 4922} {"train_loss": -26.7320556640625, "global_step": 408549, "epoch": 4922} {"train_loss": -26.877592086791992, "global_step": 408550, "epoch": 4922} {"train_loss": -26.63266944885254, "global_step": 408551, "epoch": 4922} {"train_loss": -26.89922523498535, "global_step": 408552, "epoch": 4922} {"train_loss": -26.301740646362305, "global_step": 408553, "epoch": 4922} {"train_loss": -26.438989639282227, "global_step": 408554, "epoch": 4922} {"train_loss": -27.069421768188477, "global_step": 408555, "epoch": 4922} {"train_loss": -26.65402603149414, "global_step": 408556, "epoch": 4922} {"train_loss": -26.56940269470215, "global_step": 408557, "epoch": 4922} {"train_loss": -26.826765060424805, "global_step": 408558, "epoch": 4922} {"train_loss": -26.86578369140625, "global_step": 408559, "epoch": 4922} {"train_loss": -26.979084014892578, "global_step": 408560, "epoch": 4922} {"train_loss": -27.2167911529541, "global_step": 408561, "epoch": 4922} {"train_loss": -26.954614639282227, "global_step": 408562, "epoch": 4922} {"train_loss": -26.552061080932617, "global_step": 408563, "epoch": 4922} {"train_loss": -26.8143367767334, "global_step": 408564, "epoch": 4922} {"train_loss": -26.872119903564453, "global_step": 408565, "epoch": 4922} {"train_loss": -26.737396240234375, "global_step": 408566, "epoch": 4922} {"train_loss": -26.460458755493164, "global_step": 408567, "epoch": 4922} {"train_loss": -27.00835609436035, "global_step": 408568, "epoch": 4922} {"train_loss": -27.010435104370117, "global_step": 408569, "epoch": 4922} {"train_loss": -26.87843894958496, "global_step": 408570, "epoch": 4922} {"train_loss": -27.00840187072754, "global_step": 408571, "epoch": 4922} {"train_loss": -26.942859649658203, "global_step": 408572, "epoch": 4922} {"train_loss": -26.974395751953125, "global_step": 408573, "epoch": 4922} {"train_loss": -27.223403930664062, "global_step": 408574, "epoch": 4922} {"train_loss": -26.731006622314453, "global_step": 408575, "epoch": 4922} {"train_loss": -26.93011474609375, "global_step": 408576, "epoch": 4922} {"train_loss": -26.405832290649414, "global_step": 408577, "epoch": 4922} {"train_loss": -26.941003799438477, "global_step": 408578, "epoch": 4922} {"train_loss": -26.230066299438477, "global_step": 408579, "epoch": 4922} {"train_loss": -26.694671630859375, "global_step": 408580, "epoch": 4922} {"train_loss": -26.622222900390625, "global_step": 408581, "epoch": 4922} {"train_loss": -26.075347900390625, "global_step": 408582, "epoch": 4922} {"train_loss": -26.665668487548828, "global_step": 408583, "epoch": 4922} {"train_loss": -26.38172721862793, "global_step": 408584, "epoch": 4922} {"train_loss": -26.71402931213379, "global_step": 408585, "epoch": 4922} {"train_loss": -26.608306884765625, "global_step": 408586, "epoch": 4922} {"train_loss": -26.887100219726562, "global_step": 408587, "epoch": 4922} {"train_loss": -26.15308952331543, "global_step": 408588, "epoch": 4922} {"train_loss": -26.305191040039062, "global_step": 408589, "epoch": 4922} {"train_loss": -26.398544311523438, "global_step": 408590, "epoch": 4922} {"train_loss": -26.8104248046875, "global_step": 408591, "epoch": 4922} {"train_loss": -25.8199405670166, "global_step": 408592, "epoch": 4922} {"train_loss": -26.472076416015625, "global_step": 408593, "epoch": 4922} {"train_loss": -26.744037628173828, "global_step": 408594, "epoch": 4922} {"train_loss": -26.67218589782715, "global_step": 408595, "epoch": 4922} {"train_loss": -26.74136734008789, "global_step": 408596, "epoch": 4922} {"train_loss": -26.411039352416992, "global_step": 408597, "epoch": 4922} {"train_loss": -27.008337020874023, "global_step": 408598, "epoch": 4922} {"train_loss": -26.79931640625, "global_step": 408599, "epoch": 4922} {"train_loss": -26.5878849029541, "global_step": 408600, "epoch": 4922} {"train_loss": -26.46980094909668, "global_step": 408601, "epoch": 4922} {"train_loss": -26.498580932617188, "global_step": 408602, "epoch": 4922} {"train_loss": -27.0272274017334, "global_step": 408603, "epoch": 4922} {"train_loss": -26.683881759643555, "global_step": 408604, "epoch": 4922} {"train_loss": -26.50532341003418, "global_step": 408605, "epoch": 4922} {"train_loss": -26.851530075073242, "global_step": 408606, "epoch": 4922} {"train_loss": -26.836462020874023, "global_step": 408607, "epoch": 4922} {"train_loss": -26.608608452670545, "global_step": 408608, "epoch": 4922, "val_loss": 6638036.0} {"train_loss": -26.233367919921875, "global_step": 408609, "epoch": 4923} {"train_loss": -26.298023223876953, "global_step": 408610, "epoch": 4923} {"train_loss": -26.106775283813477, "global_step": 408611, "epoch": 4923} {"train_loss": -26.2432804107666, "global_step": 408612, "epoch": 4923} {"train_loss": -26.0780086517334, "global_step": 408613, "epoch": 4923} {"train_loss": -26.375478744506836, "global_step": 408614, "epoch": 4923} {"train_loss": -26.477453231811523, "global_step": 408615, "epoch": 4923} {"train_loss": -26.204450607299805, "global_step": 408616, "epoch": 4923} {"train_loss": -26.627634048461914, "global_step": 408617, "epoch": 4923} {"train_loss": -26.519086837768555, "global_step": 408618, "epoch": 4923} {"train_loss": -26.67453384399414, "global_step": 408619, "epoch": 4923} {"train_loss": -26.353132247924805, "global_step": 408620, "epoch": 4923} {"train_loss": -26.585407257080078, "global_step": 408621, "epoch": 4923} {"train_loss": -26.496845245361328, "global_step": 408622, "epoch": 4923} {"train_loss": -26.80087661743164, "global_step": 408623, "epoch": 4923} {"train_loss": -26.491943359375, "global_step": 408624, "epoch": 4923} {"train_loss": -26.490156173706055, "global_step": 408625, "epoch": 4923} {"train_loss": -26.571985244750977, "global_step": 408626, "epoch": 4923} {"train_loss": -26.489582061767578, "global_step": 408627, "epoch": 4923} {"train_loss": -26.50764274597168, "global_step": 408628, "epoch": 4923} {"train_loss": -26.29645347595215, "global_step": 408629, "epoch": 4923} {"train_loss": -26.4675350189209, "global_step": 408630, "epoch": 4923} {"train_loss": -26.842878341674805, "global_step": 408631, "epoch": 4923} {"train_loss": -26.556615829467773, "global_step": 408632, "epoch": 4923} {"train_loss": -26.672164916992188, "global_step": 408633, "epoch": 4923} {"train_loss": -26.41777992248535, "global_step": 408634, "epoch": 4923} {"train_loss": -26.543567657470703, "global_step": 408635, "epoch": 4923} {"train_loss": -26.42130470275879, "global_step": 408636, "epoch": 4923} {"train_loss": -26.935266494750977, "global_step": 408637, "epoch": 4923} {"train_loss": -26.579666137695312, "global_step": 408638, "epoch": 4923} {"train_loss": -26.736719131469727, "global_step": 408639, "epoch": 4923} {"train_loss": -26.4998779296875, "global_step": 408640, "epoch": 4923} {"train_loss": -26.6080265045166, "global_step": 408641, "epoch": 4923} {"train_loss": -26.7772159576416, "global_step": 408642, "epoch": 4923} {"train_loss": -26.692792892456055, "global_step": 408643, "epoch": 4923} {"train_loss": -26.666187286376953, "global_step": 408644, "epoch": 4923} {"train_loss": -27.06227684020996, "global_step": 408645, "epoch": 4923} {"train_loss": -26.757841110229492, "global_step": 408646, "epoch": 4923} {"train_loss": -26.925582885742188, "global_step": 408647, "epoch": 4923} {"train_loss": -27.044164657592773, "global_step": 408648, "epoch": 4923} {"train_loss": -26.684865951538086, "global_step": 408649, "epoch": 4923} {"train_loss": -26.856903076171875, "global_step": 408650, "epoch": 4923} {"train_loss": -26.474716186523438, "global_step": 408651, "epoch": 4923} {"train_loss": -26.775686264038086, "global_step": 408652, "epoch": 4923} {"train_loss": -26.903913497924805, "global_step": 408653, "epoch": 4923} {"train_loss": -26.854419708251953, "global_step": 408654, "epoch": 4923} {"train_loss": -26.886255264282227, "global_step": 408655, "epoch": 4923} {"train_loss": -26.54678726196289, "global_step": 408656, "epoch": 4923} {"train_loss": -27.147748947143555, "global_step": 408657, "epoch": 4923} {"train_loss": -26.96042251586914, "global_step": 408658, "epoch": 4923} {"train_loss": -26.862821578979492, "global_step": 408659, "epoch": 4923} {"train_loss": -26.990798950195312, "global_step": 408660, "epoch": 4923} {"train_loss": -26.82880210876465, "global_step": 408661, "epoch": 4923} {"train_loss": -26.77286148071289, "global_step": 408662, "epoch": 4923} {"train_loss": -26.789758682250977, "global_step": 408663, "epoch": 4923} {"train_loss": -26.78639030456543, "global_step": 408664, "epoch": 4923} {"train_loss": -26.464099884033203, "global_step": 408665, "epoch": 4923} {"train_loss": -26.97101402282715, "global_step": 408666, "epoch": 4923} {"train_loss": -26.8801212310791, "global_step": 408667, "epoch": 4923} {"train_loss": -26.64426040649414, "global_step": 408668, "epoch": 4923} {"train_loss": -26.81815528869629, "global_step": 408669, "epoch": 4923} {"train_loss": -26.31817054748535, "global_step": 408670, "epoch": 4923} {"train_loss": -25.89582633972168, "global_step": 408671, "epoch": 4923} {"train_loss": -26.009855270385742, "global_step": 408672, "epoch": 4923} {"train_loss": -26.57850456237793, "global_step": 408673, "epoch": 4923} {"train_loss": -26.860843658447266, "global_step": 408674, "epoch": 4923} {"train_loss": -26.618070602416992, "global_step": 408675, "epoch": 4923} {"train_loss": -26.615880966186523, "global_step": 408676, "epoch": 4923} {"train_loss": -26.965087890625, "global_step": 408677, "epoch": 4923} {"train_loss": -26.9155216217041, "global_step": 408678, "epoch": 4923} {"train_loss": -27.205270767211914, "global_step": 408679, "epoch": 4923} {"train_loss": -26.7215576171875, "global_step": 408680, "epoch": 4923} {"train_loss": -27.083173751831055, "global_step": 408681, "epoch": 4923} {"train_loss": -26.928857803344727, "global_step": 408682, "epoch": 4923} {"train_loss": -26.535858154296875, "global_step": 408683, "epoch": 4923} {"train_loss": -26.569486618041992, "global_step": 408684, "epoch": 4923} {"train_loss": -26.621679306030273, "global_step": 408685, "epoch": 4923} {"train_loss": -26.766372680664062, "global_step": 408686, "epoch": 4923} {"train_loss": -26.67157554626465, "global_step": 408687, "epoch": 4923} {"train_loss": -26.775293350219727, "global_step": 408688, "epoch": 4923} {"train_loss": -26.917890548706055, "global_step": 408689, "epoch": 4923} {"train_loss": -26.668231964111328, "global_step": 408690, "epoch": 4923} {"train_loss": -26.646371749510248, "global_step": 408691, "epoch": 4923, "val_loss": 6687319.0} {"train_loss": -25.537132263183594, "global_step": 408692, "epoch": 4924} {"train_loss": -26.081314086914062, "global_step": 408693, "epoch": 4924} {"train_loss": -26.012353897094727, "global_step": 408694, "epoch": 4924} {"train_loss": -26.08839225769043, "global_step": 408695, "epoch": 4924} {"train_loss": -26.20578956604004, "global_step": 408696, "epoch": 4924} {"train_loss": -26.029178619384766, "global_step": 408697, "epoch": 4924} {"train_loss": -26.118688583374023, "global_step": 408698, "epoch": 4924} {"train_loss": -26.518911361694336, "global_step": 408699, "epoch": 4924} {"train_loss": -26.07594108581543, "global_step": 408700, "epoch": 4924} {"train_loss": -26.059011459350586, "global_step": 408701, "epoch": 4924} {"train_loss": -26.3990535736084, "global_step": 408702, "epoch": 4924} {"train_loss": -26.422693252563477, "global_step": 408703, "epoch": 4924} {"train_loss": -26.432722091674805, "global_step": 408704, "epoch": 4924} {"train_loss": -26.161130905151367, "global_step": 408705, "epoch": 4924} {"train_loss": -26.43414878845215, "global_step": 408706, "epoch": 4924} {"train_loss": -26.52948570251465, "global_step": 408707, "epoch": 4924} {"train_loss": -26.503660202026367, "global_step": 408708, "epoch": 4924} {"train_loss": -26.394819259643555, "global_step": 408709, "epoch": 4924} {"train_loss": -26.47333335876465, "global_step": 408710, "epoch": 4924} {"train_loss": -26.475788116455078, "global_step": 408711, "epoch": 4924} {"train_loss": -26.604928970336914, "global_step": 408712, "epoch": 4924} {"train_loss": -26.137571334838867, "global_step": 408713, "epoch": 4924} {"train_loss": -26.244144439697266, "global_step": 408714, "epoch": 4924} {"train_loss": -26.31829261779785, "global_step": 408715, "epoch": 4924} {"train_loss": -26.403799057006836, "global_step": 408716, "epoch": 4924} {"train_loss": -26.490461349487305, "global_step": 408717, "epoch": 4924} {"train_loss": -26.764678955078125, "global_step": 408718, "epoch": 4924} {"train_loss": -26.651721954345703, "global_step": 408719, "epoch": 4924} {"train_loss": -26.437849044799805, "global_step": 408720, "epoch": 4924} {"train_loss": -26.630020141601562, "global_step": 408721, "epoch": 4924} {"train_loss": -26.773534774780273, "global_step": 408722, "epoch": 4924} {"train_loss": -26.348791122436523, "global_step": 408723, "epoch": 4924} {"train_loss": -26.68311882019043, "global_step": 408724, "epoch": 4924} {"train_loss": -26.5506649017334, "global_step": 408725, "epoch": 4924} {"train_loss": -26.675552368164062, "global_step": 408726, "epoch": 4924} {"train_loss": -26.729063034057617, "global_step": 408727, "epoch": 4924} {"train_loss": -26.857959747314453, "global_step": 408728, "epoch": 4924} {"train_loss": -26.851654052734375, "global_step": 408729, "epoch": 4924} {"train_loss": -26.670621871948242, "global_step": 408730, "epoch": 4924} {"train_loss": -26.415435791015625, "global_step": 408731, "epoch": 4924} {"train_loss": -26.549911499023438, "global_step": 408732, "epoch": 4924} {"train_loss": -26.851964950561523, "global_step": 408733, "epoch": 4924} {"train_loss": -26.822675704956055, "global_step": 408734, "epoch": 4924} {"train_loss": -26.734739303588867, "global_step": 408735, "epoch": 4924} {"train_loss": -27.183441162109375, "global_step": 408736, "epoch": 4924} {"train_loss": -26.52113151550293, "global_step": 408737, "epoch": 4924} {"train_loss": -26.7127628326416, "global_step": 408738, "epoch": 4924} {"train_loss": -26.803552627563477, "global_step": 408739, "epoch": 4924} {"train_loss": -26.7372989654541, "global_step": 408740, "epoch": 4924} {"train_loss": -26.68497085571289, "global_step": 408741, "epoch": 4924} {"train_loss": -26.329559326171875, "global_step": 408742, "epoch": 4924} {"train_loss": -26.377410888671875, "global_step": 408743, "epoch": 4924} {"train_loss": -26.266910552978516, "global_step": 408744, "epoch": 4924} {"train_loss": -25.89948081970215, "global_step": 408745, "epoch": 4924} {"train_loss": -26.120025634765625, "global_step": 408746, "epoch": 4924} {"train_loss": -25.8679256439209, "global_step": 408747, "epoch": 4924} {"train_loss": -26.219898223876953, "global_step": 408748, "epoch": 4924} {"train_loss": -26.352069854736328, "global_step": 408749, "epoch": 4924} {"train_loss": -26.351669311523438, "global_step": 408750, "epoch": 4924} {"train_loss": -26.661169052124023, "global_step": 408751, "epoch": 4924} {"train_loss": -26.3808536529541, "global_step": 408752, "epoch": 4924} {"train_loss": -26.618804931640625, "global_step": 408753, "epoch": 4924} {"train_loss": -26.235870361328125, "global_step": 408754, "epoch": 4924} {"train_loss": -26.757871627807617, "global_step": 408755, "epoch": 4924} {"train_loss": -26.823694229125977, "global_step": 408756, "epoch": 4924} {"train_loss": -26.469030380249023, "global_step": 408757, "epoch": 4924} {"train_loss": -27.090991973876953, "global_step": 408758, "epoch": 4924} {"train_loss": -26.64442253112793, "global_step": 408759, "epoch": 4924} {"train_loss": -26.774810791015625, "global_step": 408760, "epoch": 4924} {"train_loss": -26.600698471069336, "global_step": 408761, "epoch": 4924} {"train_loss": -26.586933135986328, "global_step": 408762, "epoch": 4924} {"train_loss": -26.694568634033203, "global_step": 408763, "epoch": 4924} {"train_loss": -26.66025733947754, "global_step": 408764, "epoch": 4924} {"train_loss": -27.026508331298828, "global_step": 408765, "epoch": 4924} {"train_loss": -26.481481552124023, "global_step": 408766, "epoch": 4924} {"train_loss": -26.641782760620117, "global_step": 408767, "epoch": 4924} {"train_loss": -26.591760635375977, "global_step": 408768, "epoch": 4924} {"train_loss": -26.4168701171875, "global_step": 408769, "epoch": 4924} {"train_loss": -26.899200439453125, "global_step": 408770, "epoch": 4924} {"train_loss": -26.477807998657227, "global_step": 408771, "epoch": 4924} {"train_loss": -26.389272689819336, "global_step": 408772, "epoch": 4924} {"train_loss": -26.883346557617188, "global_step": 408773, "epoch": 4924} {"train_loss": -26.49152808591544, "global_step": 408774, "epoch": 4924, "val_loss": 6680578.0} {"train_loss": -26.638900756835938, "global_step": 408775, "epoch": 4925} {"train_loss": -26.832077026367188, "global_step": 408776, "epoch": 4925} {"train_loss": -26.946081161499023, "global_step": 408777, "epoch": 4925} {"train_loss": -26.430301666259766, "global_step": 408778, "epoch": 4925} {"train_loss": -26.706775665283203, "global_step": 408779, "epoch": 4925} {"train_loss": -26.695356369018555, "global_step": 408780, "epoch": 4925} {"train_loss": -26.809326171875, "global_step": 408781, "epoch": 4925} {"train_loss": -26.79092788696289, "global_step": 408782, "epoch": 4925} {"train_loss": -26.853851318359375, "global_step": 408783, "epoch": 4925} {"train_loss": -26.78252601623535, "global_step": 408784, "epoch": 4925} {"train_loss": -26.701995849609375, "global_step": 408785, "epoch": 4925} {"train_loss": -26.701745986938477, "global_step": 408786, "epoch": 4925} {"train_loss": -26.64893913269043, "global_step": 408787, "epoch": 4925} {"train_loss": -26.24167823791504, "global_step": 408788, "epoch": 4925} {"train_loss": -26.843297958374023, "global_step": 408789, "epoch": 4925} {"train_loss": -26.848983764648438, "global_step": 408790, "epoch": 4925} {"train_loss": -27.365568161010742, "global_step": 408791, "epoch": 4925} {"train_loss": -27.034475326538086, "global_step": 408792, "epoch": 4925} {"train_loss": -26.761371612548828, "global_step": 408793, "epoch": 4925} {"train_loss": -26.7630672454834, "global_step": 408794, "epoch": 4925} {"train_loss": -26.70184898376465, "global_step": 408795, "epoch": 4925} {"train_loss": -26.6433162689209, "global_step": 408796, "epoch": 4925} {"train_loss": -26.83005714416504, "global_step": 408797, "epoch": 4925} {"train_loss": -26.617902755737305, "global_step": 408798, "epoch": 4925} {"train_loss": -26.464080810546875, "global_step": 408799, "epoch": 4925} {"train_loss": -27.010339736938477, "global_step": 408800, "epoch": 4925} {"train_loss": -26.537322998046875, "global_step": 408801, "epoch": 4925} {"train_loss": -26.9521484375, "global_step": 408802, "epoch": 4925} {"train_loss": -26.983657836914062, "global_step": 408803, "epoch": 4925} {"train_loss": -27.077716827392578, "global_step": 408804, "epoch": 4925} {"train_loss": -26.338993072509766, "global_step": 408805, "epoch": 4925} {"train_loss": -26.645187377929688, "global_step": 408806, "epoch": 4925} {"train_loss": -26.615814208984375, "global_step": 408807, "epoch": 4925} {"train_loss": -26.69580078125, "global_step": 408808, "epoch": 4925} {"train_loss": -26.790924072265625, "global_step": 408809, "epoch": 4925} {"train_loss": -26.416873931884766, "global_step": 408810, "epoch": 4925} {"train_loss": -26.228351593017578, "global_step": 408811, "epoch": 4925} {"train_loss": -25.904050827026367, "global_step": 408812, "epoch": 4925} {"train_loss": -26.5723934173584, "global_step": 408813, "epoch": 4925} {"train_loss": -26.944665908813477, "global_step": 408814, "epoch": 4925} {"train_loss": -26.50737953186035, "global_step": 408815, "epoch": 4925} {"train_loss": -26.96967887878418, "global_step": 408816, "epoch": 4925} {"train_loss": -26.966073989868164, "global_step": 408817, "epoch": 4925} {"train_loss": -26.980438232421875, "global_step": 408818, "epoch": 4925} {"train_loss": -26.848541259765625, "global_step": 408819, "epoch": 4925} {"train_loss": -26.276166915893555, "global_step": 408820, "epoch": 4925} {"train_loss": -26.57663917541504, "global_step": 408821, "epoch": 4925} {"train_loss": -26.577817916870117, "global_step": 408822, "epoch": 4925} {"train_loss": -26.31800651550293, "global_step": 408823, "epoch": 4925} {"train_loss": -26.451862335205078, "global_step": 408824, "epoch": 4925} {"train_loss": -26.646215438842773, "global_step": 408825, "epoch": 4925} {"train_loss": -26.456741333007812, "global_step": 408826, "epoch": 4925} {"train_loss": -26.707447052001953, "global_step": 408827, "epoch": 4925} {"train_loss": -26.846776962280273, "global_step": 408828, "epoch": 4925} {"train_loss": -26.388538360595703, "global_step": 408829, "epoch": 4925} {"train_loss": -26.9008846282959, "global_step": 408830, "epoch": 4925} {"train_loss": -26.56842613220215, "global_step": 408831, "epoch": 4925} {"train_loss": -26.535680770874023, "global_step": 408832, "epoch": 4925} {"train_loss": -26.955657958984375, "global_step": 408833, "epoch": 4925} {"train_loss": -26.85169792175293, "global_step": 408834, "epoch": 4925} {"train_loss": -26.905364990234375, "global_step": 408835, "epoch": 4925} {"train_loss": -26.63226890563965, "global_step": 408836, "epoch": 4925} {"train_loss": -26.550703048706055, "global_step": 408837, "epoch": 4925} {"train_loss": -26.535587310791016, "global_step": 408838, "epoch": 4925} {"train_loss": -26.748254776000977, "global_step": 408839, "epoch": 4925} {"train_loss": -26.745649337768555, "global_step": 408840, "epoch": 4925} {"train_loss": -26.632883071899414, "global_step": 408841, "epoch": 4925} {"train_loss": -27.227691650390625, "global_step": 408842, "epoch": 4925} {"train_loss": -26.75249671936035, "global_step": 408843, "epoch": 4925} {"train_loss": -26.720869064331055, "global_step": 408844, "epoch": 4925} {"train_loss": -26.688251495361328, "global_step": 408845, "epoch": 4925} {"train_loss": -26.970666885375977, "global_step": 408846, "epoch": 4925} {"train_loss": -26.8955020904541, "global_step": 408847, "epoch": 4925} {"train_loss": -26.589147567749023, "global_step": 408848, "epoch": 4925} {"train_loss": -26.89715003967285, "global_step": 408849, "epoch": 4925} {"train_loss": -26.668493270874023, "global_step": 408850, "epoch": 4925} {"train_loss": -26.543691635131836, "global_step": 408851, "epoch": 4925} {"train_loss": -27.12994956970215, "global_step": 408852, "epoch": 4925} {"train_loss": -26.75745964050293, "global_step": 408853, "epoch": 4925} {"train_loss": -26.88553810119629, "global_step": 408854, "epoch": 4925} {"train_loss": -26.59347915649414, "global_step": 408855, "epoch": 4925} {"train_loss": -27.27739906311035, "global_step": 408856, "epoch": 4925} {"train_loss": -26.733944582651898, "global_step": 408857, "epoch": 4925, "val_loss": 6795880.0} {"train_loss": -26.333749771118164, "global_step": 408858, "epoch": 4926} {"train_loss": -26.208600997924805, "global_step": 408859, "epoch": 4926} {"train_loss": -26.34840965270996, "global_step": 408860, "epoch": 4926} {"train_loss": -26.2924747467041, "global_step": 408861, "epoch": 4926} {"train_loss": -26.48648452758789, "global_step": 408862, "epoch": 4926} {"train_loss": -26.76336097717285, "global_step": 408863, "epoch": 4926} {"train_loss": -26.238529205322266, "global_step": 408864, "epoch": 4926} {"train_loss": -26.10109519958496, "global_step": 408865, "epoch": 4926} {"train_loss": -25.847553253173828, "global_step": 408866, "epoch": 4926} {"train_loss": -25.86724281311035, "global_step": 408867, "epoch": 4926} {"train_loss": -26.358322143554688, "global_step": 408868, "epoch": 4926} {"train_loss": -26.417245864868164, "global_step": 408869, "epoch": 4926} {"train_loss": -26.195337295532227, "global_step": 408870, "epoch": 4926} {"train_loss": -26.53627586364746, "global_step": 408871, "epoch": 4926} {"train_loss": -26.654935836791992, "global_step": 408872, "epoch": 4926} {"train_loss": -26.412317276000977, "global_step": 408873, "epoch": 4926} {"train_loss": -26.292083740234375, "global_step": 408874, "epoch": 4926} {"train_loss": -26.460153579711914, "global_step": 408875, "epoch": 4926} {"train_loss": -26.59967041015625, "global_step": 408876, "epoch": 4926} {"train_loss": -26.69074821472168, "global_step": 408877, "epoch": 4926} {"train_loss": -26.745901107788086, "global_step": 408878, "epoch": 4926} {"train_loss": -26.871978759765625, "global_step": 408879, "epoch": 4926} {"train_loss": -26.58490562438965, "global_step": 408880, "epoch": 4926} {"train_loss": -26.6627254486084, "global_step": 408881, "epoch": 4926} {"train_loss": -26.85040855407715, "global_step": 408882, "epoch": 4926} {"train_loss": -26.656415939331055, "global_step": 408883, "epoch": 4926} {"train_loss": -26.8223819732666, "global_step": 408884, "epoch": 4926} {"train_loss": -26.769697189331055, "global_step": 408885, "epoch": 4926} {"train_loss": -26.8394718170166, "global_step": 408886, "epoch": 4926} {"train_loss": -26.491689682006836, "global_step": 408887, "epoch": 4926} {"train_loss": -26.54926109313965, "global_step": 408888, "epoch": 4926} {"train_loss": -26.74853515625, "global_step": 408889, "epoch": 4926} {"train_loss": -26.77152442932129, "global_step": 408890, "epoch": 4926} {"train_loss": -27.02347755432129, "global_step": 408891, "epoch": 4926} {"train_loss": -26.641101837158203, "global_step": 408892, "epoch": 4926} {"train_loss": -26.438047409057617, "global_step": 408893, "epoch": 4926} {"train_loss": -26.461872100830078, "global_step": 408894, "epoch": 4926} {"train_loss": -26.652542114257812, "global_step": 408895, "epoch": 4926} {"train_loss": -26.943836212158203, "global_step": 408896, "epoch": 4926} {"train_loss": -26.819501876831055, "global_step": 408897, "epoch": 4926} {"train_loss": -26.975574493408203, "global_step": 408898, "epoch": 4926} {"train_loss": -26.77734375, "global_step": 408899, "epoch": 4926} {"train_loss": -26.6380615234375, "global_step": 408900, "epoch": 4926} {"train_loss": -26.493879318237305, "global_step": 408901, "epoch": 4926} {"train_loss": -26.47147560119629, "global_step": 408902, "epoch": 4926} {"train_loss": -26.91633415222168, "global_step": 408903, "epoch": 4926} {"train_loss": -26.83560562133789, "global_step": 408904, "epoch": 4926} {"train_loss": -26.84686279296875, "global_step": 408905, "epoch": 4926} {"train_loss": -26.889347076416016, "global_step": 408906, "epoch": 4926} {"train_loss": -26.600784301757812, "global_step": 408907, "epoch": 4926} {"train_loss": -26.793725967407227, "global_step": 408908, "epoch": 4926} {"train_loss": -26.58709144592285, "global_step": 408909, "epoch": 4926} {"train_loss": -27.072834014892578, "global_step": 408910, "epoch": 4926} {"train_loss": -26.542728424072266, "global_step": 408911, "epoch": 4926} {"train_loss": -26.643539428710938, "global_step": 408912, "epoch": 4926} {"train_loss": -26.871540069580078, "global_step": 408913, "epoch": 4926} {"train_loss": -26.45746421813965, "global_step": 408914, "epoch": 4926} {"train_loss": -26.33635902404785, "global_step": 408915, "epoch": 4926} {"train_loss": -26.65229606628418, "global_step": 408916, "epoch": 4926} {"train_loss": -26.635358810424805, "global_step": 408917, "epoch": 4926} {"train_loss": -26.60940933227539, "global_step": 408918, "epoch": 4926} {"train_loss": -26.2406005859375, "global_step": 408919, "epoch": 4926} {"train_loss": -26.827157974243164, "global_step": 408920, "epoch": 4926} {"train_loss": -27.105680465698242, "global_step": 408921, "epoch": 4926} {"train_loss": -26.691267013549805, "global_step": 408922, "epoch": 4926} {"train_loss": -26.293445587158203, "global_step": 408923, "epoch": 4926} {"train_loss": -26.641571044921875, "global_step": 408924, "epoch": 4926} {"train_loss": -26.77772331237793, "global_step": 408925, "epoch": 4926} {"train_loss": -27.06907081604004, "global_step": 408926, "epoch": 4926} {"train_loss": -26.744308471679688, "global_step": 408927, "epoch": 4926} {"train_loss": -27.122583389282227, "global_step": 408928, "epoch": 4926} {"train_loss": -26.522794723510742, "global_step": 408929, "epoch": 4926} {"train_loss": -26.61958122253418, "global_step": 408930, "epoch": 4926} {"train_loss": -26.76167869567871, "global_step": 408931, "epoch": 4926} {"train_loss": -26.881921768188477, "global_step": 408932, "epoch": 4926} {"train_loss": -26.978900909423828, "global_step": 408933, "epoch": 4926} {"train_loss": -26.55388832092285, "global_step": 408934, "epoch": 4926} {"train_loss": -26.52547264099121, "global_step": 408935, "epoch": 4926} {"train_loss": -27.1704158782959, "global_step": 408936, "epoch": 4926} {"train_loss": -26.54729652404785, "global_step": 408937, "epoch": 4926} {"train_loss": -26.464807510375977, "global_step": 408938, "epoch": 4926} {"train_loss": -26.821338653564453, "global_step": 408939, "epoch": 4926} {"train_loss": -26.619850733194006, "global_step": 408940, "epoch": 4926, "val_loss": 6682018.0} {"train_loss": -25.959156036376953, "global_step": 408941, "epoch": 4927} {"train_loss": -24.929174423217773, "global_step": 408942, "epoch": 4927} {"train_loss": -25.305326461791992, "global_step": 408943, "epoch": 4927} {"train_loss": -24.634624481201172, "global_step": 408944, "epoch": 4927} {"train_loss": -25.712549209594727, "global_step": 408945, "epoch": 4927} {"train_loss": -25.54918670654297, "global_step": 408946, "epoch": 4927} {"train_loss": -25.16904640197754, "global_step": 408947, "epoch": 4927} {"train_loss": -25.7050724029541, "global_step": 408948, "epoch": 4927} {"train_loss": -25.31781578063965, "global_step": 408949, "epoch": 4927} {"train_loss": -24.70877456665039, "global_step": 408950, "epoch": 4927} {"train_loss": -24.66111183166504, "global_step": 408951, "epoch": 4927} {"train_loss": -25.565317153930664, "global_step": 408952, "epoch": 4927} {"train_loss": -25.84235954284668, "global_step": 408953, "epoch": 4927} {"train_loss": -25.911117553710938, "global_step": 408954, "epoch": 4927} {"train_loss": -25.334238052368164, "global_step": 408955, "epoch": 4927} {"train_loss": -26.029117584228516, "global_step": 408956, "epoch": 4927} {"train_loss": -25.902973175048828, "global_step": 408957, "epoch": 4927} {"train_loss": -26.025482177734375, "global_step": 408958, "epoch": 4927} {"train_loss": -25.43309211730957, "global_step": 408959, "epoch": 4927} {"train_loss": -26.00782585144043, "global_step": 408960, "epoch": 4927} {"train_loss": -26.276748657226562, "global_step": 408961, "epoch": 4927} {"train_loss": -26.326984405517578, "global_step": 408962, "epoch": 4927} {"train_loss": -26.021886825561523, "global_step": 408963, "epoch": 4927} {"train_loss": -26.14983558654785, "global_step": 408964, "epoch": 4927} {"train_loss": -26.20196533203125, "global_step": 408965, "epoch": 4927} {"train_loss": -26.235754013061523, "global_step": 408966, "epoch": 4927} {"train_loss": -26.587799072265625, "global_step": 408967, "epoch": 4927} {"train_loss": -26.458974838256836, "global_step": 408968, "epoch": 4927} {"train_loss": -26.00238037109375, "global_step": 408969, "epoch": 4927} {"train_loss": -26.455209732055664, "global_step": 408970, "epoch": 4927} {"train_loss": -26.188140869140625, "global_step": 408971, "epoch": 4927} {"train_loss": -26.266061782836914, "global_step": 408972, "epoch": 4927} {"train_loss": -26.18415641784668, "global_step": 408973, "epoch": 4927} {"train_loss": -26.53960609436035, "global_step": 408974, "epoch": 4927} {"train_loss": -26.495527267456055, "global_step": 408975, "epoch": 4927} {"train_loss": -26.771732330322266, "global_step": 408976, "epoch": 4927} {"train_loss": -26.322372436523438, "global_step": 408977, "epoch": 4927} {"train_loss": -26.49640464782715, "global_step": 408978, "epoch": 4927} {"train_loss": -26.488134384155273, "global_step": 408979, "epoch": 4927} {"train_loss": -26.567541122436523, "global_step": 408980, "epoch": 4927} {"train_loss": -26.515623092651367, "global_step": 408981, "epoch": 4927} {"train_loss": -26.497711181640625, "global_step": 408982, "epoch": 4927} {"train_loss": -26.927759170532227, "global_step": 408983, "epoch": 4927} {"train_loss": -27.052412033081055, "global_step": 408984, "epoch": 4927} {"train_loss": -26.8823184967041, "global_step": 408985, "epoch": 4927} {"train_loss": -26.699066162109375, "global_step": 408986, "epoch": 4927} {"train_loss": -26.591161727905273, "global_step": 408987, "epoch": 4927} {"train_loss": -26.7293758392334, "global_step": 408988, "epoch": 4927} {"train_loss": -26.6296443939209, "global_step": 408989, "epoch": 4927} {"train_loss": -26.79532241821289, "global_step": 408990, "epoch": 4927} {"train_loss": -26.36614990234375, "global_step": 408991, "epoch": 4927} {"train_loss": -26.7308406829834, "global_step": 408992, "epoch": 4927} {"train_loss": -26.709003448486328, "global_step": 408993, "epoch": 4927} {"train_loss": -26.259063720703125, "global_step": 408994, "epoch": 4927} {"train_loss": -26.218551635742188, "global_step": 408995, "epoch": 4927} {"train_loss": -26.623376846313477, "global_step": 408996, "epoch": 4927} {"train_loss": -27.002456665039062, "global_step": 408997, "epoch": 4927} {"train_loss": -26.295135498046875, "global_step": 408998, "epoch": 4927} {"train_loss": -26.603513717651367, "global_step": 408999, "epoch": 4927} {"train_loss": -26.615598678588867, "global_step": 409000, "epoch": 4927} {"train_loss": -25.998464584350586, "global_step": 409001, "epoch": 4927} {"train_loss": -25.953372955322266, "global_step": 409002, "epoch": 4927} {"train_loss": -26.474706649780273, "global_step": 409003, "epoch": 4927} {"train_loss": -26.50495719909668, "global_step": 409004, "epoch": 4927} {"train_loss": -26.551929473876953, "global_step": 409005, "epoch": 4927} {"train_loss": -26.690229415893555, "global_step": 409006, "epoch": 4927} {"train_loss": -26.35236167907715, "global_step": 409007, "epoch": 4927} {"train_loss": -26.684656143188477, "global_step": 409008, "epoch": 4927} {"train_loss": -26.674158096313477, "global_step": 409009, "epoch": 4927} {"train_loss": -26.387723922729492, "global_step": 409010, "epoch": 4927} {"train_loss": -26.526142120361328, "global_step": 409011, "epoch": 4927} {"train_loss": -26.966785430908203, "global_step": 409012, "epoch": 4927} {"train_loss": -26.535022735595703, "global_step": 409013, "epoch": 4927} {"train_loss": -26.07004737854004, "global_step": 409014, "epoch": 4927} {"train_loss": -26.597137451171875, "global_step": 409015, "epoch": 4927} {"train_loss": -26.32716178894043, "global_step": 409016, "epoch": 4927} {"train_loss": -25.909162521362305, "global_step": 409017, "epoch": 4927} {"train_loss": -26.281970977783203, "global_step": 409018, "epoch": 4927} {"train_loss": -26.51177406311035, "global_step": 409019, "epoch": 4927} {"train_loss": -26.16328239440918, "global_step": 409020, "epoch": 4927} {"train_loss": -26.131078720092773, "global_step": 409021, "epoch": 4927} {"train_loss": -26.51010513305664, "global_step": 409022, "epoch": 4927} {"train_loss": -26.21733925141484, "global_step": 409023, "epoch": 4927, "val_loss": 6759552.0} {"train_loss": -25.34191131591797, "global_step": 409024, "epoch": 4928} {"train_loss": -25.985219955444336, "global_step": 409025, "epoch": 4928} {"train_loss": -25.05726432800293, "global_step": 409026, "epoch": 4928} {"train_loss": -26.1258487701416, "global_step": 409027, "epoch": 4928} {"train_loss": -25.447372436523438, "global_step": 409028, "epoch": 4928} {"train_loss": -25.748815536499023, "global_step": 409029, "epoch": 4928} {"train_loss": -25.636991500854492, "global_step": 409030, "epoch": 4928} {"train_loss": -25.366060256958008, "global_step": 409031, "epoch": 4928} {"train_loss": -26.052335739135742, "global_step": 409032, "epoch": 4928} {"train_loss": -26.12345314025879, "global_step": 409033, "epoch": 4928} {"train_loss": -25.975194931030273, "global_step": 409034, "epoch": 4928} {"train_loss": -26.2744197845459, "global_step": 409035, "epoch": 4928} {"train_loss": -26.168603897094727, "global_step": 409036, "epoch": 4928} {"train_loss": -26.33942222595215, "global_step": 409037, "epoch": 4928} {"train_loss": -26.398263931274414, "global_step": 409038, "epoch": 4928} {"train_loss": -26.313276290893555, "global_step": 409039, "epoch": 4928} {"train_loss": -26.349502563476562, "global_step": 409040, "epoch": 4928} {"train_loss": -26.47108268737793, "global_step": 409041, "epoch": 4928} {"train_loss": -26.2004337310791, "global_step": 409042, "epoch": 4928} {"train_loss": -26.35040855407715, "global_step": 409043, "epoch": 4928} {"train_loss": -26.45539665222168, "global_step": 409044, "epoch": 4928} {"train_loss": -26.3764591217041, "global_step": 409045, "epoch": 4928} {"train_loss": -26.607763290405273, "global_step": 409046, "epoch": 4928} {"train_loss": -26.38605308532715, "global_step": 409047, "epoch": 4928} {"train_loss": -26.48701286315918, "global_step": 409048, "epoch": 4928} {"train_loss": -26.878080368041992, "global_step": 409049, "epoch": 4928} {"train_loss": -26.275129318237305, "global_step": 409050, "epoch": 4928} {"train_loss": -26.53814125061035, "global_step": 409051, "epoch": 4928} {"train_loss": -26.561262130737305, "global_step": 409052, "epoch": 4928} {"train_loss": -26.907129287719727, "global_step": 409053, "epoch": 4928} {"train_loss": -26.599740982055664, "global_step": 409054, "epoch": 4928} {"train_loss": -26.7227840423584, "global_step": 409055, "epoch": 4928} {"train_loss": -26.663442611694336, "global_step": 409056, "epoch": 4928} {"train_loss": -26.50075340270996, "global_step": 409057, "epoch": 4928} {"train_loss": -26.7814884185791, "global_step": 409058, "epoch": 4928} {"train_loss": -26.754364013671875, "global_step": 409059, "epoch": 4928} {"train_loss": -26.728759765625, "global_step": 409060, "epoch": 4928} {"train_loss": -26.85858154296875, "global_step": 409061, "epoch": 4928} {"train_loss": -26.733274459838867, "global_step": 409062, "epoch": 4928} {"train_loss": -26.3582763671875, "global_step": 409063, "epoch": 4928} {"train_loss": -26.64973258972168, "global_step": 409064, "epoch": 4928} {"train_loss": -26.9075927734375, "global_step": 409065, "epoch": 4928} {"train_loss": -26.53523063659668, "global_step": 409066, "epoch": 4928} {"train_loss": -26.84567642211914, "global_step": 409067, "epoch": 4928} {"train_loss": -26.71796989440918, "global_step": 409068, "epoch": 4928} {"train_loss": -27.078094482421875, "global_step": 409069, "epoch": 4928} {"train_loss": -26.589426040649414, "global_step": 409070, "epoch": 4928} {"train_loss": -26.719406127929688, "global_step": 409071, "epoch": 4928} {"train_loss": -26.66925621032715, "global_step": 409072, "epoch": 4928} {"train_loss": -26.54391860961914, "global_step": 409073, "epoch": 4928} {"train_loss": -26.746814727783203, "global_step": 409074, "epoch": 4928} {"train_loss": -26.914960861206055, "global_step": 409075, "epoch": 4928} {"train_loss": -26.814172744750977, "global_step": 409076, "epoch": 4928} {"train_loss": -26.347461700439453, "global_step": 409077, "epoch": 4928} {"train_loss": -26.846052169799805, "global_step": 409078, "epoch": 4928} {"train_loss": -26.72906494140625, "global_step": 409079, "epoch": 4928} {"train_loss": -26.396198272705078, "global_step": 409080, "epoch": 4928} {"train_loss": -26.544843673706055, "global_step": 409081, "epoch": 4928} {"train_loss": -26.451522827148438, "global_step": 409082, "epoch": 4928} {"train_loss": -26.402551651000977, "global_step": 409083, "epoch": 4928} {"train_loss": -26.540878295898438, "global_step": 409084, "epoch": 4928} {"train_loss": -26.4150390625, "global_step": 409085, "epoch": 4928} {"train_loss": -26.84197425842285, "global_step": 409086, "epoch": 4928} {"train_loss": -27.218536376953125, "global_step": 409087, "epoch": 4928} {"train_loss": -26.6841983795166, "global_step": 409088, "epoch": 4928} {"train_loss": -26.686920166015625, "global_step": 409089, "epoch": 4928} {"train_loss": -26.878067016601562, "global_step": 409090, "epoch": 4928} {"train_loss": -26.736474990844727, "global_step": 409091, "epoch": 4928} {"train_loss": -26.320831298828125, "global_step": 409092, "epoch": 4928} {"train_loss": -26.95949363708496, "global_step": 409093, "epoch": 4928} {"train_loss": -26.901708602905273, "global_step": 409094, "epoch": 4928} {"train_loss": -26.6313419342041, "global_step": 409095, "epoch": 4928} {"train_loss": -26.40895652770996, "global_step": 409096, "epoch": 4928} {"train_loss": -26.92814064025879, "global_step": 409097, "epoch": 4928} {"train_loss": -26.721603393554688, "global_step": 409098, "epoch": 4928} {"train_loss": -26.516027450561523, "global_step": 409099, "epoch": 4928} {"train_loss": -26.897430419921875, "global_step": 409100, "epoch": 4928} {"train_loss": -26.40705680847168, "global_step": 409101, "epoch": 4928} {"train_loss": -26.413837432861328, "global_step": 409102, "epoch": 4928} {"train_loss": -26.576261520385742, "global_step": 409103, "epoch": 4928} {"train_loss": -26.935155868530273, "global_step": 409104, "epoch": 4928} {"train_loss": -26.88364028930664, "global_step": 409105, "epoch": 4928} {"train_loss": -26.498750962406756, "global_step": 409106, "epoch": 4928, "val_loss": 6669806.0} {"train_loss": -26.324148178100586, "global_step": 409107, "epoch": 4929} {"train_loss": -26.102930068969727, "global_step": 409108, "epoch": 4929} {"train_loss": -26.71880531311035, "global_step": 409109, "epoch": 4929} {"train_loss": -25.851404190063477, "global_step": 409110, "epoch": 4929} {"train_loss": -26.63408851623535, "global_step": 409111, "epoch": 4929} {"train_loss": -25.77315330505371, "global_step": 409112, "epoch": 4929} {"train_loss": -26.10530662536621, "global_step": 409113, "epoch": 4929} {"train_loss": -26.205469131469727, "global_step": 409114, "epoch": 4929} {"train_loss": -26.234521865844727, "global_step": 409115, "epoch": 4929} {"train_loss": -26.27345085144043, "global_step": 409116, "epoch": 4929} {"train_loss": -26.49441909790039, "global_step": 409117, "epoch": 4929} {"train_loss": -26.295608520507812, "global_step": 409118, "epoch": 4929} {"train_loss": -26.004404067993164, "global_step": 409119, "epoch": 4929} {"train_loss": -26.272098541259766, "global_step": 409120, "epoch": 4929} {"train_loss": -26.30721092224121, "global_step": 409121, "epoch": 4929} {"train_loss": -26.284454345703125, "global_step": 409122, "epoch": 4929} {"train_loss": -26.37422752380371, "global_step": 409123, "epoch": 4929} {"train_loss": -26.458242416381836, "global_step": 409124, "epoch": 4929} {"train_loss": -26.721607208251953, "global_step": 409125, "epoch": 4929} {"train_loss": -26.37617301940918, "global_step": 409126, "epoch": 4929} {"train_loss": -26.119342803955078, "global_step": 409127, "epoch": 4929} {"train_loss": -26.3104190826416, "global_step": 409128, "epoch": 4929} {"train_loss": -26.43265151977539, "global_step": 409129, "epoch": 4929} {"train_loss": -26.253128051757812, "global_step": 409130, "epoch": 4929} {"train_loss": -26.611225128173828, "global_step": 409131, "epoch": 4929} {"train_loss": -26.822189331054688, "global_step": 409132, "epoch": 4929} {"train_loss": -26.60284423828125, "global_step": 409133, "epoch": 4929} {"train_loss": -26.4869441986084, "global_step": 409134, "epoch": 4929} {"train_loss": -26.4605712890625, "global_step": 409135, "epoch": 4929} {"train_loss": -26.8198299407959, "global_step": 409136, "epoch": 4929} {"train_loss": -26.482336044311523, "global_step": 409137, "epoch": 4929} {"train_loss": -26.347244262695312, "global_step": 409138, "epoch": 4929} {"train_loss": -26.74749755859375, "global_step": 409139, "epoch": 4929} {"train_loss": -26.72977066040039, "global_step": 409140, "epoch": 4929} {"train_loss": -26.6363525390625, "global_step": 409141, "epoch": 4929} {"train_loss": -26.503522872924805, "global_step": 409142, "epoch": 4929} {"train_loss": -26.631336212158203, "global_step": 409143, "epoch": 4929} {"train_loss": -26.551910400390625, "global_step": 409144, "epoch": 4929} {"train_loss": -26.49468421936035, "global_step": 409145, "epoch": 4929} {"train_loss": -26.770465850830078, "global_step": 409146, "epoch": 4929} {"train_loss": -26.6175594329834, "global_step": 409147, "epoch": 4929} {"train_loss": -26.558408737182617, "global_step": 409148, "epoch": 4929} {"train_loss": -27.008625030517578, "global_step": 409149, "epoch": 4929} {"train_loss": -26.737192153930664, "global_step": 409150, "epoch": 4929} {"train_loss": -26.3525447845459, "global_step": 409151, "epoch": 4929} {"train_loss": -26.805511474609375, "global_step": 409152, "epoch": 4929} {"train_loss": -26.690876007080078, "global_step": 409153, "epoch": 4929} {"train_loss": -26.720239639282227, "global_step": 409154, "epoch": 4929} {"train_loss": -27.113269805908203, "global_step": 409155, "epoch": 4929} {"train_loss": -27.109180450439453, "global_step": 409156, "epoch": 4929} {"train_loss": -26.9401912689209, "global_step": 409157, "epoch": 4929} {"train_loss": -26.795618057250977, "global_step": 409158, "epoch": 4929} {"train_loss": -27.093358993530273, "global_step": 409159, "epoch": 4929} {"train_loss": -26.8818302154541, "global_step": 409160, "epoch": 4929} {"train_loss": -27.08492088317871, "global_step": 409161, "epoch": 4929} {"train_loss": -26.86139488220215, "global_step": 409162, "epoch": 4929} {"train_loss": -26.624231338500977, "global_step": 409163, "epoch": 4929} {"train_loss": -27.083423614501953, "global_step": 409164, "epoch": 4929} {"train_loss": -27.123050689697266, "global_step": 409165, "epoch": 4929} {"train_loss": -27.008686065673828, "global_step": 409166, "epoch": 4929} {"train_loss": -26.9542236328125, "global_step": 409167, "epoch": 4929} {"train_loss": -26.601057052612305, "global_step": 409168, "epoch": 4929} {"train_loss": -26.690521240234375, "global_step": 409169, "epoch": 4929} {"train_loss": -26.273975372314453, "global_step": 409170, "epoch": 4929} {"train_loss": -24.903715133666992, "global_step": 409171, "epoch": 4929} {"train_loss": -21.48549461364746, "global_step": 409172, "epoch": 4929} {"train_loss": -22.44349479675293, "global_step": 409173, "epoch": 4929} {"train_loss": -25.909589767456055, "global_step": 409174, "epoch": 4929} {"train_loss": -24.5607967376709, "global_step": 409175, "epoch": 4929} {"train_loss": -24.956571578979492, "global_step": 409176, "epoch": 4929} {"train_loss": -25.074411392211914, "global_step": 409177, "epoch": 4929} {"train_loss": -24.978492736816406, "global_step": 409178, "epoch": 4929} {"train_loss": -25.582456588745117, "global_step": 409179, "epoch": 4929} {"train_loss": -25.389774322509766, "global_step": 409180, "epoch": 4929} {"train_loss": -25.63665199279785, "global_step": 409181, "epoch": 4929} {"train_loss": -25.722930908203125, "global_step": 409182, "epoch": 4929} {"train_loss": -26.314855575561523, "global_step": 409183, "epoch": 4929} {"train_loss": -25.854278564453125, "global_step": 409184, "epoch": 4929} {"train_loss": -26.134647369384766, "global_step": 409185, "epoch": 4929} {"train_loss": -26.049726486206055, "global_step": 409186, "epoch": 4929} {"train_loss": -26.122709274291992, "global_step": 409187, "epoch": 4929} {"train_loss": -25.929412841796875, "global_step": 409188, "epoch": 4929} {"train_loss": -26.243616333927015, "global_step": 409189, "epoch": 4929, "val_loss": 6788208.5} {"train_loss": -25.762405395507812, "global_step": 409190, "epoch": 4930} {"train_loss": -25.562040328979492, "global_step": 409191, "epoch": 4930} {"train_loss": -25.770782470703125, "global_step": 409192, "epoch": 4930} {"train_loss": -25.239042282104492, "global_step": 409193, "epoch": 4930} {"train_loss": -25.158960342407227, "global_step": 409194, "epoch": 4930} {"train_loss": -25.84225845336914, "global_step": 409195, "epoch": 4930} {"train_loss": -25.885156631469727, "global_step": 409196, "epoch": 4930} {"train_loss": -25.582117080688477, "global_step": 409197, "epoch": 4930} {"train_loss": -26.3144474029541, "global_step": 409198, "epoch": 4930} {"train_loss": -25.433460235595703, "global_step": 409199, "epoch": 4930} {"train_loss": -25.78633689880371, "global_step": 409200, "epoch": 4930} {"train_loss": -25.7374267578125, "global_step": 409201, "epoch": 4930} {"train_loss": -26.072622299194336, "global_step": 409202, "epoch": 4930} {"train_loss": -25.810651779174805, "global_step": 409203, "epoch": 4930} {"train_loss": -26.36525535583496, "global_step": 409204, "epoch": 4930} {"train_loss": -26.0108699798584, "global_step": 409205, "epoch": 4930} {"train_loss": -26.112531661987305, "global_step": 409206, "epoch": 4930} {"train_loss": -26.29279136657715, "global_step": 409207, "epoch": 4930} {"train_loss": -26.719160079956055, "global_step": 409208, "epoch": 4930} {"train_loss": -26.16080665588379, "global_step": 409209, "epoch": 4930} {"train_loss": -26.34429931640625, "global_step": 409210, "epoch": 4930} {"train_loss": -26.219961166381836, "global_step": 409211, "epoch": 4930} {"train_loss": -26.3989315032959, "global_step": 409212, "epoch": 4930} {"train_loss": -26.313323974609375, "global_step": 409213, "epoch": 4930} {"train_loss": -26.490304946899414, "global_step": 409214, "epoch": 4930} {"train_loss": -26.346357345581055, "global_step": 409215, "epoch": 4930} {"train_loss": -26.159536361694336, "global_step": 409216, "epoch": 4930} {"train_loss": -26.526254653930664, "global_step": 409217, "epoch": 4930} {"train_loss": -26.1966552734375, "global_step": 409218, "epoch": 4930} {"train_loss": -26.499677658081055, "global_step": 409219, "epoch": 4930} {"train_loss": -26.983341217041016, "global_step": 409220, "epoch": 4930} {"train_loss": -26.46504020690918, "global_step": 409221, "epoch": 4930} {"train_loss": -26.442285537719727, "global_step": 409222, "epoch": 4930} {"train_loss": -26.33033561706543, "global_step": 409223, "epoch": 4930} {"train_loss": -26.823379516601562, "global_step": 409224, "epoch": 4930} {"train_loss": -26.476041793823242, "global_step": 409225, "epoch": 4930} {"train_loss": -26.67026138305664, "global_step": 409226, "epoch": 4930} {"train_loss": -26.704748153686523, "global_step": 409227, "epoch": 4930} {"train_loss": -26.747318267822266, "global_step": 409228, "epoch": 4930} {"train_loss": -26.502517700195312, "global_step": 409229, "epoch": 4930} {"train_loss": -26.15410804748535, "global_step": 409230, "epoch": 4930} {"train_loss": -26.481657028198242, "global_step": 409231, "epoch": 4930} {"train_loss": -26.77943229675293, "global_step": 409232, "epoch": 4930} {"train_loss": -26.109699249267578, "global_step": 409233, "epoch": 4930} {"train_loss": -26.718053817749023, "global_step": 409234, "epoch": 4930} {"train_loss": -26.409046173095703, "global_step": 409235, "epoch": 4930} {"train_loss": -26.500720977783203, "global_step": 409236, "epoch": 4930} {"train_loss": -26.739715576171875, "global_step": 409237, "epoch": 4930} {"train_loss": -26.519460678100586, "global_step": 409238, "epoch": 4930} {"train_loss": -26.793140411376953, "global_step": 409239, "epoch": 4930} {"train_loss": -26.560571670532227, "global_step": 409240, "epoch": 4930} {"train_loss": -26.40681266784668, "global_step": 409241, "epoch": 4930} {"train_loss": -26.806644439697266, "global_step": 409242, "epoch": 4930} {"train_loss": -26.511035919189453, "global_step": 409243, "epoch": 4930} {"train_loss": -26.89711570739746, "global_step": 409244, "epoch": 4930} {"train_loss": -26.54428482055664, "global_step": 409245, "epoch": 4930} {"train_loss": -26.49283790588379, "global_step": 409246, "epoch": 4930} {"train_loss": -26.266773223876953, "global_step": 409247, "epoch": 4930} {"train_loss": -26.63164710998535, "global_step": 409248, "epoch": 4930} {"train_loss": -26.61101722717285, "global_step": 409249, "epoch": 4930} {"train_loss": -26.781482696533203, "global_step": 409250, "epoch": 4930} {"train_loss": -26.980133056640625, "global_step": 409251, "epoch": 4930} {"train_loss": -26.310998916625977, "global_step": 409252, "epoch": 4930} {"train_loss": -26.85845947265625, "global_step": 409253, "epoch": 4930} {"train_loss": -27.085233688354492, "global_step": 409254, "epoch": 4930} {"train_loss": -26.492679595947266, "global_step": 409255, "epoch": 4930} {"train_loss": -26.50408363342285, "global_step": 409256, "epoch": 4930} {"train_loss": -26.4522647857666, "global_step": 409257, "epoch": 4930} {"train_loss": -26.541746139526367, "global_step": 409258, "epoch": 4930} {"train_loss": -26.930532455444336, "global_step": 409259, "epoch": 4930} {"train_loss": -26.66737937927246, "global_step": 409260, "epoch": 4930} {"train_loss": -27.120685577392578, "global_step": 409261, "epoch": 4930} {"train_loss": -26.535566329956055, "global_step": 409262, "epoch": 4930} {"train_loss": -26.76144790649414, "global_step": 409263, "epoch": 4930} {"train_loss": -27.15485954284668, "global_step": 409264, "epoch": 4930} {"train_loss": -26.344730377197266, "global_step": 409265, "epoch": 4930} {"train_loss": -27.010236740112305, "global_step": 409266, "epoch": 4930} {"train_loss": -26.97700309753418, "global_step": 409267, "epoch": 4930} {"train_loss": -26.768146514892578, "global_step": 409268, "epoch": 4930} {"train_loss": -26.81501579284668, "global_step": 409269, "epoch": 4930} {"train_loss": -26.639978408813477, "global_step": 409270, "epoch": 4930} {"train_loss": -26.791494369506836, "global_step": 409271, "epoch": 4930} {"train_loss": -26.430381384240576, "global_step": 409272, "epoch": 4930, "val_loss": 6705251.0} {"train_loss": -25.912490844726562, "global_step": 409273, "epoch": 4931} {"train_loss": -24.9761905670166, "global_step": 409274, "epoch": 4931} {"train_loss": -25.711856842041016, "global_step": 409275, "epoch": 4931} {"train_loss": -25.734556198120117, "global_step": 409276, "epoch": 4931} {"train_loss": -26.05862808227539, "global_step": 409277, "epoch": 4931} {"train_loss": -25.634382247924805, "global_step": 409278, "epoch": 4931} {"train_loss": -25.99175453186035, "global_step": 409279, "epoch": 4931} {"train_loss": -25.65118408203125, "global_step": 409280, "epoch": 4931} {"train_loss": -25.590660095214844, "global_step": 409281, "epoch": 4931} {"train_loss": -25.864755630493164, "global_step": 409282, "epoch": 4931} {"train_loss": -26.35637855529785, "global_step": 409283, "epoch": 4931} {"train_loss": -26.042348861694336, "global_step": 409284, "epoch": 4931} {"train_loss": -26.119873046875, "global_step": 409285, "epoch": 4931} {"train_loss": -26.322050094604492, "global_step": 409286, "epoch": 4931} {"train_loss": -25.870710372924805, "global_step": 409287, "epoch": 4931} {"train_loss": -26.147287368774414, "global_step": 409288, "epoch": 4931} {"train_loss": -26.435733795166016, "global_step": 409289, "epoch": 4931} {"train_loss": -26.472991943359375, "global_step": 409290, "epoch": 4931} {"train_loss": -26.24814796447754, "global_step": 409291, "epoch": 4931} {"train_loss": -26.33704948425293, "global_step": 409292, "epoch": 4931} {"train_loss": -26.659521102905273, "global_step": 409293, "epoch": 4931} {"train_loss": -26.202777862548828, "global_step": 409294, "epoch": 4931} {"train_loss": -26.640411376953125, "global_step": 409295, "epoch": 4931} {"train_loss": -26.452260971069336, "global_step": 409296, "epoch": 4931} {"train_loss": -26.790273666381836, "global_step": 409297, "epoch": 4931} {"train_loss": -26.81103515625, "global_step": 409298, "epoch": 4931} {"train_loss": -26.481306076049805, "global_step": 409299, "epoch": 4931} {"train_loss": -26.589252471923828, "global_step": 409300, "epoch": 4931} {"train_loss": -26.63884925842285, "global_step": 409301, "epoch": 4931} {"train_loss": -26.36017417907715, "global_step": 409302, "epoch": 4931} {"train_loss": -26.646677017211914, "global_step": 409303, "epoch": 4931} {"train_loss": -26.80873680114746, "global_step": 409304, "epoch": 4931} {"train_loss": -26.5816707611084, "global_step": 409305, "epoch": 4931} {"train_loss": -26.682188034057617, "global_step": 409306, "epoch": 4931} {"train_loss": -26.879810333251953, "global_step": 409307, "epoch": 4931} {"train_loss": -26.91119956970215, "global_step": 409308, "epoch": 4931} {"train_loss": -26.585895538330078, "global_step": 409309, "epoch": 4931} {"train_loss": -26.88823890686035, "global_step": 409310, "epoch": 4931} {"train_loss": -26.69105339050293, "global_step": 409311, "epoch": 4931} {"train_loss": -26.98762321472168, "global_step": 409312, "epoch": 4931} {"train_loss": -26.916595458984375, "global_step": 409313, "epoch": 4931} {"train_loss": -26.720813751220703, "global_step": 409314, "epoch": 4931} {"train_loss": -26.70539665222168, "global_step": 409315, "epoch": 4931} {"train_loss": -26.902250289916992, "global_step": 409316, "epoch": 4931} {"train_loss": -26.785486221313477, "global_step": 409317, "epoch": 4931} {"train_loss": -27.064172744750977, "global_step": 409318, "epoch": 4931} {"train_loss": -26.990365982055664, "global_step": 409319, "epoch": 4931} {"train_loss": -27.00038719177246, "global_step": 409320, "epoch": 4931} {"train_loss": -26.925275802612305, "global_step": 409321, "epoch": 4931} {"train_loss": -26.9771728515625, "global_step": 409322, "epoch": 4931} {"train_loss": -26.73031997680664, "global_step": 409323, "epoch": 4931} {"train_loss": -26.9837589263916, "global_step": 409324, "epoch": 4931} {"train_loss": -26.805286407470703, "global_step": 409325, "epoch": 4931} {"train_loss": -27.039587020874023, "global_step": 409326, "epoch": 4931} {"train_loss": -27.3863582611084, "global_step": 409327, "epoch": 4931} {"train_loss": -26.82537269592285, "global_step": 409328, "epoch": 4931} {"train_loss": -26.956567764282227, "global_step": 409329, "epoch": 4931} {"train_loss": -26.807254791259766, "global_step": 409330, "epoch": 4931} {"train_loss": -26.99869155883789, "global_step": 409331, "epoch": 4931} {"train_loss": -26.77121353149414, "global_step": 409332, "epoch": 4931} {"train_loss": -26.9893741607666, "global_step": 409333, "epoch": 4931} {"train_loss": -27.00764274597168, "global_step": 409334, "epoch": 4931} {"train_loss": -26.779626846313477, "global_step": 409335, "epoch": 4931} {"train_loss": -26.708959579467773, "global_step": 409336, "epoch": 4931} {"train_loss": -26.88104248046875, "global_step": 409337, "epoch": 4931} {"train_loss": -26.53339195251465, "global_step": 409338, "epoch": 4931} {"train_loss": -25.774133682250977, "global_step": 409339, "epoch": 4931} {"train_loss": -25.497774124145508, "global_step": 409340, "epoch": 4931} {"train_loss": -25.398191452026367, "global_step": 409341, "epoch": 4931} {"train_loss": -26.1291561126709, "global_step": 409342, "epoch": 4931} {"train_loss": -26.474044799804688, "global_step": 409343, "epoch": 4931} {"train_loss": -26.426916122436523, "global_step": 409344, "epoch": 4931} {"train_loss": -26.615320205688477, "global_step": 409345, "epoch": 4931} {"train_loss": -26.50371742248535, "global_step": 409346, "epoch": 4931} {"train_loss": -26.5152645111084, "global_step": 409347, "epoch": 4931} {"train_loss": -26.800302505493164, "global_step": 409348, "epoch": 4931} {"train_loss": -26.55544090270996, "global_step": 409349, "epoch": 4931} {"train_loss": -26.991485595703125, "global_step": 409350, "epoch": 4931} {"train_loss": -26.454389572143555, "global_step": 409351, "epoch": 4931} {"train_loss": -26.404150009155273, "global_step": 409352, "epoch": 4931} {"train_loss": -26.19440269470215, "global_step": 409353, "epoch": 4931} {"train_loss": -26.65386962890625, "global_step": 409354, "epoch": 4931} {"train_loss": -26.505288824977644, "global_step": 409355, "epoch": 4931, "val_loss": 6706795.0} {"train_loss": -26.7686767578125, "global_step": 409356, "epoch": 4932} {"train_loss": -26.14162254333496, "global_step": 409357, "epoch": 4932} {"train_loss": -26.290220260620117, "global_step": 409358, "epoch": 4932} {"train_loss": -26.201568603515625, "global_step": 409359, "epoch": 4932} {"train_loss": -26.583871841430664, "global_step": 409360, "epoch": 4932} {"train_loss": -26.09226417541504, "global_step": 409361, "epoch": 4932} {"train_loss": -26.33509635925293, "global_step": 409362, "epoch": 4932} {"train_loss": -26.3654727935791, "global_step": 409363, "epoch": 4932} {"train_loss": -26.299243927001953, "global_step": 409364, "epoch": 4932} {"train_loss": -26.714689254760742, "global_step": 409365, "epoch": 4932} {"train_loss": -26.60919761657715, "global_step": 409366, "epoch": 4932} {"train_loss": -26.518198013305664, "global_step": 409367, "epoch": 4932} {"train_loss": -26.69598388671875, "global_step": 409368, "epoch": 4932} {"train_loss": -26.351734161376953, "global_step": 409369, "epoch": 4932} {"train_loss": -26.661285400390625, "global_step": 409370, "epoch": 4932} {"train_loss": -26.56080436706543, "global_step": 409371, "epoch": 4932} {"train_loss": -26.710737228393555, "global_step": 409372, "epoch": 4932} {"train_loss": -26.863813400268555, "global_step": 409373, "epoch": 4932} {"train_loss": -26.980222702026367, "global_step": 409374, "epoch": 4932} {"train_loss": -26.835180282592773, "global_step": 409375, "epoch": 4932} {"train_loss": -26.39251136779785, "global_step": 409376, "epoch": 4932} {"train_loss": -26.407703399658203, "global_step": 409377, "epoch": 4932} {"train_loss": -26.597517013549805, "global_step": 409378, "epoch": 4932} {"train_loss": -26.938812255859375, "global_step": 409379, "epoch": 4932} {"train_loss": -26.757404327392578, "global_step": 409380, "epoch": 4932} {"train_loss": -26.6525821685791, "global_step": 409381, "epoch": 4932} {"train_loss": -26.631879806518555, "global_step": 409382, "epoch": 4932} {"train_loss": -26.870817184448242, "global_step": 409383, "epoch": 4932} {"train_loss": -26.60761833190918, "global_step": 409384, "epoch": 4932} {"train_loss": -26.765295028686523, "global_step": 409385, "epoch": 4932} {"train_loss": -26.770740509033203, "global_step": 409386, "epoch": 4932} {"train_loss": -26.769702911376953, "global_step": 409387, "epoch": 4932} {"train_loss": -26.349035263061523, "global_step": 409388, "epoch": 4932} {"train_loss": -26.66008949279785, "global_step": 409389, "epoch": 4932} {"train_loss": -26.786701202392578, "global_step": 409390, "epoch": 4932} {"train_loss": -26.074264526367188, "global_step": 409391, "epoch": 4932} {"train_loss": -26.05022621154785, "global_step": 409392, "epoch": 4932} {"train_loss": -27.055530548095703, "global_step": 409393, "epoch": 4932} {"train_loss": -26.7091121673584, "global_step": 409394, "epoch": 4932} {"train_loss": -26.65766716003418, "global_step": 409395, "epoch": 4932} {"train_loss": -26.40582847595215, "global_step": 409396, "epoch": 4932} {"train_loss": -26.96697998046875, "global_step": 409397, "epoch": 4932} {"train_loss": -26.605072021484375, "global_step": 409398, "epoch": 4932} {"train_loss": -26.64084815979004, "global_step": 409399, "epoch": 4932} {"train_loss": -26.564802169799805, "global_step": 409400, "epoch": 4932} {"train_loss": -26.59036636352539, "global_step": 409401, "epoch": 4932} {"train_loss": -26.5106201171875, "global_step": 409402, "epoch": 4932} {"train_loss": -26.851316452026367, "global_step": 409403, "epoch": 4932} {"train_loss": -26.52803611755371, "global_step": 409404, "epoch": 4932} {"train_loss": -26.900375366210938, "global_step": 409405, "epoch": 4932} {"train_loss": -26.569473266601562, "global_step": 409406, "epoch": 4932} {"train_loss": -26.638097763061523, "global_step": 409407, "epoch": 4932} {"train_loss": -26.4258975982666, "global_step": 409408, "epoch": 4932} {"train_loss": -27.132871627807617, "global_step": 409409, "epoch": 4932} {"train_loss": -26.489660263061523, "global_step": 409410, "epoch": 4932} {"train_loss": -27.07769203186035, "global_step": 409411, "epoch": 4932} {"train_loss": -26.644887924194336, "global_step": 409412, "epoch": 4932} {"train_loss": -26.81998062133789, "global_step": 409413, "epoch": 4932} {"train_loss": -26.89674186706543, "global_step": 409414, "epoch": 4932} {"train_loss": -26.676733016967773, "global_step": 409415, "epoch": 4932} {"train_loss": -26.473358154296875, "global_step": 409416, "epoch": 4932} {"train_loss": -26.314512252807617, "global_step": 409417, "epoch": 4932} {"train_loss": -26.411060333251953, "global_step": 409418, "epoch": 4932} {"train_loss": -27.18147850036621, "global_step": 409419, "epoch": 4932} {"train_loss": -26.666616439819336, "global_step": 409420, "epoch": 4932} {"train_loss": -26.18379020690918, "global_step": 409421, "epoch": 4932} {"train_loss": -26.760950088500977, "global_step": 409422, "epoch": 4932} {"train_loss": -26.7475643157959, "global_step": 409423, "epoch": 4932} {"train_loss": -26.4268798828125, "global_step": 409424, "epoch": 4932} {"train_loss": -27.10738182067871, "global_step": 409425, "epoch": 4932} {"train_loss": -26.661640167236328, "global_step": 409426, "epoch": 4932} {"train_loss": -26.602338790893555, "global_step": 409427, "epoch": 4932} {"train_loss": -26.897785186767578, "global_step": 409428, "epoch": 4932} {"train_loss": -26.847692489624023, "global_step": 409429, "epoch": 4932} {"train_loss": -26.530807495117188, "global_step": 409430, "epoch": 4932} {"train_loss": -26.750720977783203, "global_step": 409431, "epoch": 4932} {"train_loss": -26.604902267456055, "global_step": 409432, "epoch": 4932} {"train_loss": -26.757923126220703, "global_step": 409433, "epoch": 4932} {"train_loss": -26.89021110534668, "global_step": 409434, "epoch": 4932} {"train_loss": -26.60140037536621, "global_step": 409435, "epoch": 4932} {"train_loss": -26.582929611206055, "global_step": 409436, "epoch": 4932} {"train_loss": -26.842466354370117, "global_step": 409437, "epoch": 4932} {"train_loss": -26.632578953202948, "global_step": 409438, "epoch": 4932, "val_loss": 6706752.0} {"train_loss": -26.639591217041016, "global_step": 409439, "epoch": 4933} {"train_loss": -25.979822158813477, "global_step": 409440, "epoch": 4933} {"train_loss": -26.438018798828125, "global_step": 409441, "epoch": 4933} {"train_loss": -26.62617301940918, "global_step": 409442, "epoch": 4933} {"train_loss": -26.511533737182617, "global_step": 409443, "epoch": 4933} {"train_loss": -26.429574966430664, "global_step": 409444, "epoch": 4933} {"train_loss": -26.3219051361084, "global_step": 409445, "epoch": 4933} {"train_loss": -26.15703773498535, "global_step": 409446, "epoch": 4933} {"train_loss": -26.31220054626465, "global_step": 409447, "epoch": 4933} {"train_loss": -26.472692489624023, "global_step": 409448, "epoch": 4933} {"train_loss": -26.969013214111328, "global_step": 409449, "epoch": 4933} {"train_loss": -26.55458641052246, "global_step": 409450, "epoch": 4933} {"train_loss": -26.696447372436523, "global_step": 409451, "epoch": 4933} {"train_loss": -26.46265983581543, "global_step": 409452, "epoch": 4933} {"train_loss": -26.105377197265625, "global_step": 409453, "epoch": 4933} {"train_loss": -26.396835327148438, "global_step": 409454, "epoch": 4933} {"train_loss": -26.742822647094727, "global_step": 409455, "epoch": 4933} {"train_loss": -26.825347900390625, "global_step": 409456, "epoch": 4933} {"train_loss": -26.45185661315918, "global_step": 409457, "epoch": 4933} {"train_loss": -26.245466232299805, "global_step": 409458, "epoch": 4933} {"train_loss": -26.737634658813477, "global_step": 409459, "epoch": 4933} {"train_loss": -26.498367309570312, "global_step": 409460, "epoch": 4933} {"train_loss": -26.467639923095703, "global_step": 409461, "epoch": 4933} {"train_loss": -26.75445556640625, "global_step": 409462, "epoch": 4933} {"train_loss": -26.911733627319336, "global_step": 409463, "epoch": 4933} {"train_loss": -26.859121322631836, "global_step": 409464, "epoch": 4933} {"train_loss": -26.397363662719727, "global_step": 409465, "epoch": 4933} {"train_loss": -26.58392906188965, "global_step": 409466, "epoch": 4933} {"train_loss": -26.727651596069336, "global_step": 409467, "epoch": 4933} {"train_loss": -26.89215660095215, "global_step": 409468, "epoch": 4933} {"train_loss": -26.89277458190918, "global_step": 409469, "epoch": 4933} {"train_loss": -26.76700782775879, "global_step": 409470, "epoch": 4933} {"train_loss": -26.70318603515625, "global_step": 409471, "epoch": 4933} {"train_loss": -26.801172256469727, "global_step": 409472, "epoch": 4933} {"train_loss": -26.68049430847168, "global_step": 409473, "epoch": 4933} {"train_loss": -26.853195190429688, "global_step": 409474, "epoch": 4933} {"train_loss": -26.77985954284668, "global_step": 409475, "epoch": 4933} {"train_loss": -26.69854736328125, "global_step": 409476, "epoch": 4933} {"train_loss": -26.769596099853516, "global_step": 409477, "epoch": 4933} {"train_loss": -27.110910415649414, "global_step": 409478, "epoch": 4933} {"train_loss": -27.05315589904785, "global_step": 409479, "epoch": 4933} {"train_loss": -26.938215255737305, "global_step": 409480, "epoch": 4933} {"train_loss": -27.054288864135742, "global_step": 409481, "epoch": 4933} {"train_loss": -26.639892578125, "global_step": 409482, "epoch": 4933} {"train_loss": -26.906909942626953, "global_step": 409483, "epoch": 4933} {"train_loss": -26.55908203125, "global_step": 409484, "epoch": 4933} {"train_loss": -26.606250762939453, "global_step": 409485, "epoch": 4933} {"train_loss": -26.72108268737793, "global_step": 409486, "epoch": 4933} {"train_loss": -26.48223876953125, "global_step": 409487, "epoch": 4933} {"train_loss": -26.785741806030273, "global_step": 409488, "epoch": 4933} {"train_loss": -27.022729873657227, "global_step": 409489, "epoch": 4933} {"train_loss": -26.51881217956543, "global_step": 409490, "epoch": 4933} {"train_loss": -26.957538604736328, "global_step": 409491, "epoch": 4933} {"train_loss": -27.019763946533203, "global_step": 409492, "epoch": 4933} {"train_loss": -27.111133575439453, "global_step": 409493, "epoch": 4933} {"train_loss": -26.957630157470703, "global_step": 409494, "epoch": 4933} {"train_loss": -26.623737335205078, "global_step": 409495, "epoch": 4933} {"train_loss": -26.654767990112305, "global_step": 409496, "epoch": 4933} {"train_loss": -26.619115829467773, "global_step": 409497, "epoch": 4933} {"train_loss": -27.009496688842773, "global_step": 409498, "epoch": 4933} {"train_loss": -26.84382438659668, "global_step": 409499, "epoch": 4933} {"train_loss": -26.706201553344727, "global_step": 409500, "epoch": 4933} {"train_loss": -27.088048934936523, "global_step": 409501, "epoch": 4933} {"train_loss": -26.91707420349121, "global_step": 409502, "epoch": 4933} {"train_loss": -26.8492488861084, "global_step": 409503, "epoch": 4933} {"train_loss": -26.851476669311523, "global_step": 409504, "epoch": 4933} {"train_loss": -26.662185668945312, "global_step": 409505, "epoch": 4933} {"train_loss": -27.051313400268555, "global_step": 409506, "epoch": 4933} {"train_loss": -26.930028915405273, "global_step": 409507, "epoch": 4933} {"train_loss": -26.619001388549805, "global_step": 409508, "epoch": 4933} {"train_loss": -26.2589111328125, "global_step": 409509, "epoch": 4933} {"train_loss": -26.166479110717773, "global_step": 409510, "epoch": 4933} {"train_loss": -26.261734008789062, "global_step": 409511, "epoch": 4933} {"train_loss": -26.483036041259766, "global_step": 409512, "epoch": 4933} {"train_loss": -26.516647338867188, "global_step": 409513, "epoch": 4933} {"train_loss": -26.10713005065918, "global_step": 409514, "epoch": 4933} {"train_loss": -26.54144287109375, "global_step": 409515, "epoch": 4933} {"train_loss": -26.38331413269043, "global_step": 409516, "epoch": 4933} {"train_loss": -26.173816680908203, "global_step": 409517, "epoch": 4933} {"train_loss": -26.479238510131836, "global_step": 409518, "epoch": 4933} {"train_loss": -26.59222412109375, "global_step": 409519, "epoch": 4933} {"train_loss": -26.46600341796875, "global_step": 409520, "epoch": 4933} {"train_loss": -26.666237681745045, "global_step": 409521, "epoch": 4933, "val_loss": 6551062.0} {"train_loss": -23.456857681274414, "global_step": 409522, "epoch": 4934} {"train_loss": -24.700021743774414, "global_step": 409523, "epoch": 4934} {"train_loss": -24.530929565429688, "global_step": 409524, "epoch": 4934} {"train_loss": -25.22688102722168, "global_step": 409525, "epoch": 4934} {"train_loss": -24.39252281188965, "global_step": 409526, "epoch": 4934} {"train_loss": -24.670320510864258, "global_step": 409527, "epoch": 4934} {"train_loss": -24.727798461914062, "global_step": 409528, "epoch": 4934} {"train_loss": -25.27760124206543, "global_step": 409529, "epoch": 4934} {"train_loss": -24.81697654724121, "global_step": 409530, "epoch": 4934} {"train_loss": -25.832870483398438, "global_step": 409531, "epoch": 4934} {"train_loss": -24.90582847595215, "global_step": 409532, "epoch": 4934} {"train_loss": -25.7231502532959, "global_step": 409533, "epoch": 4934} {"train_loss": -25.85391616821289, "global_step": 409534, "epoch": 4934} {"train_loss": -25.8051815032959, "global_step": 409535, "epoch": 4934} {"train_loss": -25.702960968017578, "global_step": 409536, "epoch": 4934} {"train_loss": -25.37571907043457, "global_step": 409537, "epoch": 4934} {"train_loss": -25.86371421813965, "global_step": 409538, "epoch": 4934} {"train_loss": -25.8521728515625, "global_step": 409539, "epoch": 4934} {"train_loss": -25.739477157592773, "global_step": 409540, "epoch": 4934} {"train_loss": -25.46616554260254, "global_step": 409541, "epoch": 4934} {"train_loss": -26.006134033203125, "global_step": 409542, "epoch": 4934} {"train_loss": -25.94136619567871, "global_step": 409543, "epoch": 4934} {"train_loss": -26.005390167236328, "global_step": 409544, "epoch": 4934} {"train_loss": -26.40504264831543, "global_step": 409545, "epoch": 4934} {"train_loss": -26.405487060546875, "global_step": 409546, "epoch": 4934} {"train_loss": -26.02566909790039, "global_step": 409547, "epoch": 4934} {"train_loss": -26.45795249938965, "global_step": 409548, "epoch": 4934} {"train_loss": -26.134286880493164, "global_step": 409549, "epoch": 4934} {"train_loss": -26.353879928588867, "global_step": 409550, "epoch": 4934} {"train_loss": -26.065488815307617, "global_step": 409551, "epoch": 4934} {"train_loss": -25.898305892944336, "global_step": 409552, "epoch": 4934} {"train_loss": -26.242856979370117, "global_step": 409553, "epoch": 4934} {"train_loss": -26.488828659057617, "global_step": 409554, "epoch": 4934} {"train_loss": -26.58935546875, "global_step": 409555, "epoch": 4934} {"train_loss": -26.5489559173584, "global_step": 409556, "epoch": 4934} {"train_loss": -26.663549423217773, "global_step": 409557, "epoch": 4934} {"train_loss": -26.688276290893555, "global_step": 409558, "epoch": 4934} {"train_loss": -26.684757232666016, "global_step": 409559, "epoch": 4934} {"train_loss": -26.46404457092285, "global_step": 409560, "epoch": 4934} {"train_loss": -26.17949867248535, "global_step": 409561, "epoch": 4934} {"train_loss": -26.505582809448242, "global_step": 409562, "epoch": 4934} {"train_loss": -26.306440353393555, "global_step": 409563, "epoch": 4934} {"train_loss": -26.808866500854492, "global_step": 409564, "epoch": 4934} {"train_loss": -26.458499908447266, "global_step": 409565, "epoch": 4934} {"train_loss": -26.520654678344727, "global_step": 409566, "epoch": 4934} {"train_loss": -26.461240768432617, "global_step": 409567, "epoch": 4934} {"train_loss": -26.545324325561523, "global_step": 409568, "epoch": 4934} {"train_loss": -26.745908737182617, "global_step": 409569, "epoch": 4934} {"train_loss": -26.6684513092041, "global_step": 409570, "epoch": 4934} {"train_loss": -26.746335983276367, "global_step": 409571, "epoch": 4934} {"train_loss": -26.63027000427246, "global_step": 409572, "epoch": 4934} {"train_loss": -26.564680099487305, "global_step": 409573, "epoch": 4934} {"train_loss": -26.5274715423584, "global_step": 409574, "epoch": 4934} {"train_loss": -26.827009201049805, "global_step": 409575, "epoch": 4934} {"train_loss": -26.869064331054688, "global_step": 409576, "epoch": 4934} {"train_loss": -26.981985092163086, "global_step": 409577, "epoch": 4934} {"train_loss": -26.538421630859375, "global_step": 409578, "epoch": 4934} {"train_loss": -26.602949142456055, "global_step": 409579, "epoch": 4934} {"train_loss": -26.789350509643555, "global_step": 409580, "epoch": 4934} {"train_loss": -26.741714477539062, "global_step": 409581, "epoch": 4934} {"train_loss": -26.81904411315918, "global_step": 409582, "epoch": 4934} {"train_loss": -27.071069717407227, "global_step": 409583, "epoch": 4934} {"train_loss": -26.896320343017578, "global_step": 409584, "epoch": 4934} {"train_loss": -26.545679092407227, "global_step": 409585, "epoch": 4934} {"train_loss": -27.230695724487305, "global_step": 409586, "epoch": 4934} {"train_loss": -27.141620635986328, "global_step": 409587, "epoch": 4934} {"train_loss": -26.989744186401367, "global_step": 409588, "epoch": 4934} {"train_loss": -26.878721237182617, "global_step": 409589, "epoch": 4934} {"train_loss": -26.90911293029785, "global_step": 409590, "epoch": 4934} {"train_loss": -26.8282527923584, "global_step": 409591, "epoch": 4934} {"train_loss": -26.914962768554688, "global_step": 409592, "epoch": 4934} {"train_loss": -26.441024780273438, "global_step": 409593, "epoch": 4934} {"train_loss": -26.685333251953125, "global_step": 409594, "epoch": 4934} {"train_loss": -26.462011337280273, "global_step": 409595, "epoch": 4934} {"train_loss": -26.842618942260742, "global_step": 409596, "epoch": 4934} {"train_loss": -26.627735137939453, "global_step": 409597, "epoch": 4934} {"train_loss": -26.71514320373535, "global_step": 409598, "epoch": 4934} {"train_loss": -26.705108642578125, "global_step": 409599, "epoch": 4934} {"train_loss": -26.736963272094727, "global_step": 409600, "epoch": 4934} {"train_loss": -27.084386825561523, "global_step": 409601, "epoch": 4934} {"train_loss": -26.856542587280273, "global_step": 409602, "epoch": 4934} {"train_loss": -27.0955867767334, "global_step": 409603, "epoch": 4934} {"train_loss": -26.2511599667101, "global_step": 409604, "epoch": 4934, "val_loss": 6485594.0} {"train_loss": -25.601362228393555, "global_step": 409605, "epoch": 4935} {"train_loss": -24.66187858581543, "global_step": 409606, "epoch": 4935} {"train_loss": -26.1210994720459, "global_step": 409607, "epoch": 4935} {"train_loss": -25.767135620117188, "global_step": 409608, "epoch": 4935} {"train_loss": -25.353544235229492, "global_step": 409609, "epoch": 4935} {"train_loss": -25.955158233642578, "global_step": 409610, "epoch": 4935} {"train_loss": -25.736188888549805, "global_step": 409611, "epoch": 4935} {"train_loss": -25.933439254760742, "global_step": 409612, "epoch": 4935} {"train_loss": -25.37327766418457, "global_step": 409613, "epoch": 4935} {"train_loss": -26.047943115234375, "global_step": 409614, "epoch": 4935} {"train_loss": -25.74186134338379, "global_step": 409615, "epoch": 4935} {"train_loss": -26.524572372436523, "global_step": 409616, "epoch": 4935} {"train_loss": -25.709943771362305, "global_step": 409617, "epoch": 4935} {"train_loss": -26.367033004760742, "global_step": 409618, "epoch": 4935} {"train_loss": -26.0373477935791, "global_step": 409619, "epoch": 4935} {"train_loss": -25.871381759643555, "global_step": 409620, "epoch": 4935} {"train_loss": -25.86222267150879, "global_step": 409621, "epoch": 4935} {"train_loss": -26.205738067626953, "global_step": 409622, "epoch": 4935} {"train_loss": -25.9797420501709, "global_step": 409623, "epoch": 4935} {"train_loss": -25.94953727722168, "global_step": 409624, "epoch": 4935} {"train_loss": -26.281238555908203, "global_step": 409625, "epoch": 4935} {"train_loss": -26.548816680908203, "global_step": 409626, "epoch": 4935} {"train_loss": -26.545948028564453, "global_step": 409627, "epoch": 4935} {"train_loss": -26.347402572631836, "global_step": 409628, "epoch": 4935} {"train_loss": -26.5688419342041, "global_step": 409629, "epoch": 4935} {"train_loss": -26.325464248657227, "global_step": 409630, "epoch": 4935} {"train_loss": -26.5526065826416, "global_step": 409631, "epoch": 4935} {"train_loss": -26.389440536499023, "global_step": 409632, "epoch": 4935} {"train_loss": -26.62815284729004, "global_step": 409633, "epoch": 4935} {"train_loss": -26.436004638671875, "global_step": 409634, "epoch": 4935} {"train_loss": -26.167932510375977, "global_step": 409635, "epoch": 4935} {"train_loss": -26.55950355529785, "global_step": 409636, "epoch": 4935} {"train_loss": -26.519855499267578, "global_step": 409637, "epoch": 4935} {"train_loss": -26.477609634399414, "global_step": 409638, "epoch": 4935} {"train_loss": -26.959272384643555, "global_step": 409639, "epoch": 4935} {"train_loss": -26.55925941467285, "global_step": 409640, "epoch": 4935} {"train_loss": -26.759357452392578, "global_step": 409641, "epoch": 4935} {"train_loss": -26.384963989257812, "global_step": 409642, "epoch": 4935} {"train_loss": -26.509521484375, "global_step": 409643, "epoch": 4935} {"train_loss": -26.736780166625977, "global_step": 409644, "epoch": 4935} {"train_loss": -26.57051658630371, "global_step": 409645, "epoch": 4935} {"train_loss": -26.455921173095703, "global_step": 409646, "epoch": 4935} {"train_loss": -26.7698974609375, "global_step": 409647, "epoch": 4935} {"train_loss": -26.72076416015625, "global_step": 409648, "epoch": 4935} {"train_loss": -26.93183708190918, "global_step": 409649, "epoch": 4935} {"train_loss": -26.979602813720703, "global_step": 409650, "epoch": 4935} {"train_loss": -27.101764678955078, "global_step": 409651, "epoch": 4935} {"train_loss": -26.58560562133789, "global_step": 409652, "epoch": 4935} {"train_loss": -26.838638305664062, "global_step": 409653, "epoch": 4935} {"train_loss": -26.615371704101562, "global_step": 409654, "epoch": 4935} {"train_loss": -26.672082901000977, "global_step": 409655, "epoch": 4935} {"train_loss": -26.864028930664062, "global_step": 409656, "epoch": 4935} {"train_loss": -26.795042037963867, "global_step": 409657, "epoch": 4935} {"train_loss": -26.74454689025879, "global_step": 409658, "epoch": 4935} {"train_loss": -26.932453155517578, "global_step": 409659, "epoch": 4935} {"train_loss": -26.86817741394043, "global_step": 409660, "epoch": 4935} {"train_loss": -27.035104751586914, "global_step": 409661, "epoch": 4935} {"train_loss": -26.89141845703125, "global_step": 409662, "epoch": 4935} {"train_loss": -26.917346954345703, "global_step": 409663, "epoch": 4935} {"train_loss": -27.09903335571289, "global_step": 409664, "epoch": 4935} {"train_loss": -26.521726608276367, "global_step": 409665, "epoch": 4935} {"train_loss": -26.857885360717773, "global_step": 409666, "epoch": 4935} {"train_loss": -27.03944206237793, "global_step": 409667, "epoch": 4935} {"train_loss": -26.728195190429688, "global_step": 409668, "epoch": 4935} {"train_loss": -26.582670211791992, "global_step": 409669, "epoch": 4935} {"train_loss": -26.4704532623291, "global_step": 409670, "epoch": 4935} {"train_loss": -26.01807975769043, "global_step": 409671, "epoch": 4935} {"train_loss": -26.190710067749023, "global_step": 409672, "epoch": 4935} {"train_loss": -26.813705444335938, "global_step": 409673, "epoch": 4935} {"train_loss": -26.510868072509766, "global_step": 409674, "epoch": 4935} {"train_loss": -26.71864128112793, "global_step": 409675, "epoch": 4935} {"train_loss": -26.51324462890625, "global_step": 409676, "epoch": 4935} {"train_loss": -26.97016716003418, "global_step": 409677, "epoch": 4935} {"train_loss": -26.591684341430664, "global_step": 409678, "epoch": 4935} {"train_loss": -26.863279342651367, "global_step": 409679, "epoch": 4935} {"train_loss": -26.807287216186523, "global_step": 409680, "epoch": 4935} {"train_loss": -26.68824577331543, "global_step": 409681, "epoch": 4935} {"train_loss": -26.617658615112305, "global_step": 409682, "epoch": 4935} {"train_loss": -26.690000534057617, "global_step": 409683, "epoch": 4935} {"train_loss": -26.63690757751465, "global_step": 409684, "epoch": 4935} {"train_loss": -26.969745635986328, "global_step": 409685, "epoch": 4935} {"train_loss": -26.417943954467773, "global_step": 409686, "epoch": 4935} {"train_loss": -26.45471522319748, "global_step": 409687, "epoch": 4935, "val_loss": 6519622.0} {"train_loss": -26.22662925720215, "global_step": 409688, "epoch": 4936} {"train_loss": -26.429065704345703, "global_step": 409689, "epoch": 4936} {"train_loss": -26.38787269592285, "global_step": 409690, "epoch": 4936} {"train_loss": -26.306177139282227, "global_step": 409691, "epoch": 4936} {"train_loss": -26.0756778717041, "global_step": 409692, "epoch": 4936} {"train_loss": -26.658193588256836, "global_step": 409693, "epoch": 4936} {"train_loss": -26.159265518188477, "global_step": 409694, "epoch": 4936} {"train_loss": -26.674001693725586, "global_step": 409695, "epoch": 4936} {"train_loss": -26.64228630065918, "global_step": 409696, "epoch": 4936} {"train_loss": -26.40472412109375, "global_step": 409697, "epoch": 4936} {"train_loss": -26.534027099609375, "global_step": 409698, "epoch": 4936} {"train_loss": -26.14418601989746, "global_step": 409699, "epoch": 4936} {"train_loss": -25.982839584350586, "global_step": 409700, "epoch": 4936} {"train_loss": -26.383813858032227, "global_step": 409701, "epoch": 4936} {"train_loss": -26.4871826171875, "global_step": 409702, "epoch": 4936} {"train_loss": -25.881696701049805, "global_step": 409703, "epoch": 4936} {"train_loss": -26.505313873291016, "global_step": 409704, "epoch": 4936} {"train_loss": -26.594348907470703, "global_step": 409705, "epoch": 4936} {"train_loss": -26.485990524291992, "global_step": 409706, "epoch": 4936} {"train_loss": -26.291044235229492, "global_step": 409707, "epoch": 4936} {"train_loss": -26.560413360595703, "global_step": 409708, "epoch": 4936} {"train_loss": -26.511716842651367, "global_step": 409709, "epoch": 4936} {"train_loss": -26.4501953125, "global_step": 409710, "epoch": 4936} {"train_loss": -26.769092559814453, "global_step": 409711, "epoch": 4936} {"train_loss": -26.594675064086914, "global_step": 409712, "epoch": 4936} {"train_loss": -26.553913116455078, "global_step": 409713, "epoch": 4936} {"train_loss": -26.747228622436523, "global_step": 409714, "epoch": 4936} {"train_loss": -26.6845760345459, "global_step": 409715, "epoch": 4936} {"train_loss": -26.2613582611084, "global_step": 409716, "epoch": 4936} {"train_loss": -26.610395431518555, "global_step": 409717, "epoch": 4936} {"train_loss": -26.5162296295166, "global_step": 409718, "epoch": 4936} {"train_loss": -26.575515747070312, "global_step": 409719, "epoch": 4936} {"train_loss": -26.0992374420166, "global_step": 409720, "epoch": 4936} {"train_loss": -26.86297607421875, "global_step": 409721, "epoch": 4936} {"train_loss": -26.4661865234375, "global_step": 409722, "epoch": 4936} {"train_loss": -26.49835205078125, "global_step": 409723, "epoch": 4936} {"train_loss": -26.20452308654785, "global_step": 409724, "epoch": 4936} {"train_loss": -26.25282096862793, "global_step": 409725, "epoch": 4936} {"train_loss": -26.624664306640625, "global_step": 409726, "epoch": 4936} {"train_loss": -26.39984703063965, "global_step": 409727, "epoch": 4936} {"train_loss": -26.623571395874023, "global_step": 409728, "epoch": 4936} {"train_loss": -26.809064865112305, "global_step": 409729, "epoch": 4936} {"train_loss": -26.551233291625977, "global_step": 409730, "epoch": 4936} {"train_loss": -26.773786544799805, "global_step": 409731, "epoch": 4936} {"train_loss": -26.726037979125977, "global_step": 409732, "epoch": 4936} {"train_loss": -26.914514541625977, "global_step": 409733, "epoch": 4936} {"train_loss": -26.59844398498535, "global_step": 409734, "epoch": 4936} {"train_loss": -26.55450439453125, "global_step": 409735, "epoch": 4936} {"train_loss": -26.726682662963867, "global_step": 409736, "epoch": 4936} {"train_loss": -26.371686935424805, "global_step": 409737, "epoch": 4936} {"train_loss": -26.46344566345215, "global_step": 409738, "epoch": 4936} {"train_loss": -26.459232330322266, "global_step": 409739, "epoch": 4936} {"train_loss": -27.0899715423584, "global_step": 409740, "epoch": 4936} {"train_loss": -27.023700714111328, "global_step": 409741, "epoch": 4936} {"train_loss": -26.799299240112305, "global_step": 409742, "epoch": 4936} {"train_loss": -26.797607421875, "global_step": 409743, "epoch": 4936} {"train_loss": -26.848432540893555, "global_step": 409744, "epoch": 4936} {"train_loss": -26.742969512939453, "global_step": 409745, "epoch": 4936} {"train_loss": -26.892446517944336, "global_step": 409746, "epoch": 4936} {"train_loss": -26.5106143951416, "global_step": 409747, "epoch": 4936} {"train_loss": -26.995630264282227, "global_step": 409748, "epoch": 4936} {"train_loss": -26.894689559936523, "global_step": 409749, "epoch": 4936} {"train_loss": -26.867603302001953, "global_step": 409750, "epoch": 4936} {"train_loss": -27.041950225830078, "global_step": 409751, "epoch": 4936} {"train_loss": -26.871734619140625, "global_step": 409752, "epoch": 4936} {"train_loss": -26.69010353088379, "global_step": 409753, "epoch": 4936} {"train_loss": -26.7308292388916, "global_step": 409754, "epoch": 4936} {"train_loss": -27.06025505065918, "global_step": 409755, "epoch": 4936} {"train_loss": -26.753950119018555, "global_step": 409756, "epoch": 4936} {"train_loss": -26.736494064331055, "global_step": 409757, "epoch": 4936} {"train_loss": -27.0391845703125, "global_step": 409758, "epoch": 4936} {"train_loss": -27.090917587280273, "global_step": 409759, "epoch": 4936} {"train_loss": -27.107044219970703, "global_step": 409760, "epoch": 4936} {"train_loss": -26.7025203704834, "global_step": 409761, "epoch": 4936} {"train_loss": -26.799564361572266, "global_step": 409762, "epoch": 4936} {"train_loss": -26.779748916625977, "global_step": 409763, "epoch": 4936} {"train_loss": -26.81838035583496, "global_step": 409764, "epoch": 4936} {"train_loss": -27.019397735595703, "global_step": 409765, "epoch": 4936} {"train_loss": -26.865503311157227, "global_step": 409766, "epoch": 4936} {"train_loss": -26.874231338500977, "global_step": 409767, "epoch": 4936} {"train_loss": -26.580673217773438, "global_step": 409768, "epoch": 4936} {"train_loss": -26.593225479125977, "global_step": 409769, "epoch": 4936} {"train_loss": -26.64032255885113, "global_step": 409770, "epoch": 4936, "val_loss": 6541105.0} {"train_loss": -26.295846939086914, "global_step": 409771, "epoch": 4937} {"train_loss": -25.72455406188965, "global_step": 409772, "epoch": 4937} {"train_loss": -25.47742462158203, "global_step": 409773, "epoch": 4937} {"train_loss": -26.121809005737305, "global_step": 409774, "epoch": 4937} {"train_loss": -26.407501220703125, "global_step": 409775, "epoch": 4937} {"train_loss": -26.37603759765625, "global_step": 409776, "epoch": 4937} {"train_loss": -26.1812744140625, "global_step": 409777, "epoch": 4937} {"train_loss": -26.077951431274414, "global_step": 409778, "epoch": 4937} {"train_loss": -26.522985458374023, "global_step": 409779, "epoch": 4937} {"train_loss": -26.545560836791992, "global_step": 409780, "epoch": 4937} {"train_loss": -26.2010498046875, "global_step": 409781, "epoch": 4937} {"train_loss": -26.671369552612305, "global_step": 409782, "epoch": 4937} {"train_loss": -26.083112716674805, "global_step": 409783, "epoch": 4937} {"train_loss": -26.738691329956055, "global_step": 409784, "epoch": 4937} {"train_loss": -26.44134521484375, "global_step": 409785, "epoch": 4937} {"train_loss": -26.606765747070312, "global_step": 409786, "epoch": 4937} {"train_loss": -26.67714500427246, "global_step": 409787, "epoch": 4937} {"train_loss": -26.528806686401367, "global_step": 409788, "epoch": 4937} {"train_loss": -26.6843204498291, "global_step": 409789, "epoch": 4937} {"train_loss": -26.715627670288086, "global_step": 409790, "epoch": 4937} {"train_loss": -26.75660514831543, "global_step": 409791, "epoch": 4937} {"train_loss": -26.632587432861328, "global_step": 409792, "epoch": 4937} {"train_loss": -26.799474716186523, "global_step": 409793, "epoch": 4937} {"train_loss": -26.705530166625977, "global_step": 409794, "epoch": 4937} {"train_loss": -26.724714279174805, "global_step": 409795, "epoch": 4937} {"train_loss": -26.80994987487793, "global_step": 409796, "epoch": 4937} {"train_loss": -27.133869171142578, "global_step": 409797, "epoch": 4937} {"train_loss": -26.839496612548828, "global_step": 409798, "epoch": 4937} {"train_loss": -27.01216697692871, "global_step": 409799, "epoch": 4937} {"train_loss": -26.317432403564453, "global_step": 409800, "epoch": 4937} {"train_loss": -26.778234481811523, "global_step": 409801, "epoch": 4937} {"train_loss": -26.850269317626953, "global_step": 409802, "epoch": 4937} {"train_loss": -26.631214141845703, "global_step": 409803, "epoch": 4937} {"train_loss": -26.832380294799805, "global_step": 409804, "epoch": 4937} {"train_loss": -27.0653018951416, "global_step": 409805, "epoch": 4937} {"train_loss": -27.059598922729492, "global_step": 409806, "epoch": 4937} {"train_loss": -27.134984970092773, "global_step": 409807, "epoch": 4937} {"train_loss": -26.685943603515625, "global_step": 409808, "epoch": 4937} {"train_loss": -26.914947509765625, "global_step": 409809, "epoch": 4937} {"train_loss": -27.07866859436035, "global_step": 409810, "epoch": 4937} {"train_loss": -26.913171768188477, "global_step": 409811, "epoch": 4937} {"train_loss": -26.4056339263916, "global_step": 409812, "epoch": 4937} {"train_loss": -26.922534942626953, "global_step": 409813, "epoch": 4937} {"train_loss": -26.87952995300293, "global_step": 409814, "epoch": 4937} {"train_loss": -27.00104331970215, "global_step": 409815, "epoch": 4937} {"train_loss": -26.967496871948242, "global_step": 409816, "epoch": 4937} {"train_loss": -26.50445556640625, "global_step": 409817, "epoch": 4937} {"train_loss": -26.989734649658203, "global_step": 409818, "epoch": 4937} {"train_loss": -26.689172744750977, "global_step": 409819, "epoch": 4937} {"train_loss": -26.746686935424805, "global_step": 409820, "epoch": 4937} {"train_loss": -26.771259307861328, "global_step": 409821, "epoch": 4937} {"train_loss": -26.921340942382812, "global_step": 409822, "epoch": 4937} {"train_loss": -26.88213539123535, "global_step": 409823, "epoch": 4937} {"train_loss": -27.13136100769043, "global_step": 409824, "epoch": 4937} {"train_loss": -27.281116485595703, "global_step": 409825, "epoch": 4937} {"train_loss": -26.493249893188477, "global_step": 409826, "epoch": 4937} {"train_loss": -26.953718185424805, "global_step": 409827, "epoch": 4937} {"train_loss": -26.71271324157715, "global_step": 409828, "epoch": 4937} {"train_loss": -26.433975219726562, "global_step": 409829, "epoch": 4937} {"train_loss": -26.331480026245117, "global_step": 409830, "epoch": 4937} {"train_loss": -26.497241973876953, "global_step": 409831, "epoch": 4937} {"train_loss": -26.778654098510742, "global_step": 409832, "epoch": 4937} {"train_loss": -26.87040138244629, "global_step": 409833, "epoch": 4937} {"train_loss": -26.7302303314209, "global_step": 409834, "epoch": 4937} {"train_loss": -26.678136825561523, "global_step": 409835, "epoch": 4937} {"train_loss": -26.51936149597168, "global_step": 409836, "epoch": 4937} {"train_loss": -27.037017822265625, "global_step": 409837, "epoch": 4937} {"train_loss": -26.49237060546875, "global_step": 409838, "epoch": 4937} {"train_loss": -26.874053955078125, "global_step": 409839, "epoch": 4937} {"train_loss": -26.441858291625977, "global_step": 409840, "epoch": 4937} {"train_loss": -26.029132843017578, "global_step": 409841, "epoch": 4937} {"train_loss": -25.8375244140625, "global_step": 409842, "epoch": 4937} {"train_loss": -25.062255859375, "global_step": 409843, "epoch": 4937} {"train_loss": -26.108718872070312, "global_step": 409844, "epoch": 4937} {"train_loss": -26.714279174804688, "global_step": 409845, "epoch": 4937} {"train_loss": -25.95586585998535, "global_step": 409846, "epoch": 4937} {"train_loss": -25.437103271484375, "global_step": 409847, "epoch": 4937} {"train_loss": -26.720245361328125, "global_step": 409848, "epoch": 4937} {"train_loss": -26.020490646362305, "global_step": 409849, "epoch": 4937} {"train_loss": -26.49911880493164, "global_step": 409850, "epoch": 4937} {"train_loss": -26.337682723999023, "global_step": 409851, "epoch": 4937} {"train_loss": -26.46579933166504, "global_step": 409852, "epoch": 4937} {"train_loss": -26.57771758573601, "global_step": 409853, "epoch": 4937, "val_loss": 6518050.0} {"train_loss": -25.83917236328125, "global_step": 409854, "epoch": 4938} {"train_loss": -26.168603897094727, "global_step": 409855, "epoch": 4938} {"train_loss": -25.71152687072754, "global_step": 409856, "epoch": 4938} {"train_loss": -25.900732040405273, "global_step": 409857, "epoch": 4938} {"train_loss": -25.735746383666992, "global_step": 409858, "epoch": 4938} {"train_loss": -25.9392032623291, "global_step": 409859, "epoch": 4938} {"train_loss": -26.01348876953125, "global_step": 409860, "epoch": 4938} {"train_loss": -26.18726921081543, "global_step": 409861, "epoch": 4938} {"train_loss": -26.15522575378418, "global_step": 409862, "epoch": 4938} {"train_loss": -26.080469131469727, "global_step": 409863, "epoch": 4938} {"train_loss": -26.1243896484375, "global_step": 409864, "epoch": 4938} {"train_loss": -26.31622886657715, "global_step": 409865, "epoch": 4938} {"train_loss": -26.36158561706543, "global_step": 409866, "epoch": 4938} {"train_loss": -26.429275512695312, "global_step": 409867, "epoch": 4938} {"train_loss": -26.09734535217285, "global_step": 409868, "epoch": 4938} {"train_loss": -26.803937911987305, "global_step": 409869, "epoch": 4938} {"train_loss": -26.606489181518555, "global_step": 409870, "epoch": 4938} {"train_loss": -26.198896408081055, "global_step": 409871, "epoch": 4938} {"train_loss": -26.397485733032227, "global_step": 409872, "epoch": 4938} {"train_loss": -26.40138053894043, "global_step": 409873, "epoch": 4938} {"train_loss": -26.54326820373535, "global_step": 409874, "epoch": 4938} {"train_loss": -26.607831954956055, "global_step": 409875, "epoch": 4938} {"train_loss": -26.645116806030273, "global_step": 409876, "epoch": 4938} {"train_loss": -26.301862716674805, "global_step": 409877, "epoch": 4938} {"train_loss": -26.5949649810791, "global_step": 409878, "epoch": 4938} {"train_loss": -26.631580352783203, "global_step": 409879, "epoch": 4938} {"train_loss": -26.74921226501465, "global_step": 409880, "epoch": 4938} {"train_loss": -26.509313583374023, "global_step": 409881, "epoch": 4938} {"train_loss": -26.468732833862305, "global_step": 409882, "epoch": 4938} {"train_loss": -26.675907135009766, "global_step": 409883, "epoch": 4938} {"train_loss": -26.683639526367188, "global_step": 409884, "epoch": 4938} {"train_loss": -26.632604598999023, "global_step": 409885, "epoch": 4938} {"train_loss": -26.490793228149414, "global_step": 409886, "epoch": 4938} {"train_loss": -26.73687744140625, "global_step": 409887, "epoch": 4938} {"train_loss": -26.6920166015625, "global_step": 409888, "epoch": 4938} {"train_loss": -26.841360092163086, "global_step": 409889, "epoch": 4938} {"train_loss": -26.90728759765625, "global_step": 409890, "epoch": 4938} {"train_loss": -26.540775299072266, "global_step": 409891, "epoch": 4938} {"train_loss": -26.598175048828125, "global_step": 409892, "epoch": 4938} {"train_loss": -26.59751319885254, "global_step": 409893, "epoch": 4938} {"train_loss": -26.699003219604492, "global_step": 409894, "epoch": 4938} {"train_loss": -26.82645606994629, "global_step": 409895, "epoch": 4938} {"train_loss": -26.67075538635254, "global_step": 409896, "epoch": 4938} {"train_loss": -26.984710693359375, "global_step": 409897, "epoch": 4938} {"train_loss": -26.762958526611328, "global_step": 409898, "epoch": 4938} {"train_loss": -26.59967041015625, "global_step": 409899, "epoch": 4938} {"train_loss": -26.889606475830078, "global_step": 409900, "epoch": 4938} {"train_loss": -27.224985122680664, "global_step": 409901, "epoch": 4938} {"train_loss": -26.994037628173828, "global_step": 409902, "epoch": 4938} {"train_loss": -26.994787216186523, "global_step": 409903, "epoch": 4938} {"train_loss": -26.59278678894043, "global_step": 409904, "epoch": 4938} {"train_loss": -26.885690689086914, "global_step": 409905, "epoch": 4938} {"train_loss": -27.1302547454834, "global_step": 409906, "epoch": 4938} {"train_loss": -26.740365982055664, "global_step": 409907, "epoch": 4938} {"train_loss": -27.12471580505371, "global_step": 409908, "epoch": 4938} {"train_loss": -27.238561630249023, "global_step": 409909, "epoch": 4938} {"train_loss": -26.928869247436523, "global_step": 409910, "epoch": 4938} {"train_loss": -26.967069625854492, "global_step": 409911, "epoch": 4938} {"train_loss": -26.845767974853516, "global_step": 409912, "epoch": 4938} {"train_loss": -26.714385986328125, "global_step": 409913, "epoch": 4938} {"train_loss": -26.848957061767578, "global_step": 409914, "epoch": 4938} {"train_loss": -26.807851791381836, "global_step": 409915, "epoch": 4938} {"train_loss": -26.854726791381836, "global_step": 409916, "epoch": 4938} {"train_loss": -26.98465347290039, "global_step": 409917, "epoch": 4938} {"train_loss": -26.944843292236328, "global_step": 409918, "epoch": 4938} {"train_loss": -26.83694839477539, "global_step": 409919, "epoch": 4938} {"train_loss": -27.019027709960938, "global_step": 409920, "epoch": 4938} {"train_loss": -26.930103302001953, "global_step": 409921, "epoch": 4938} {"train_loss": -26.94344139099121, "global_step": 409922, "epoch": 4938} {"train_loss": -26.756772994995117, "global_step": 409923, "epoch": 4938} {"train_loss": -26.659713745117188, "global_step": 409924, "epoch": 4938} {"train_loss": -26.900466918945312, "global_step": 409925, "epoch": 4938} {"train_loss": -26.598379135131836, "global_step": 409926, "epoch": 4938} {"train_loss": -26.96601676940918, "global_step": 409927, "epoch": 4938} {"train_loss": -27.081405639648438, "global_step": 409928, "epoch": 4938} {"train_loss": -27.00675392150879, "global_step": 409929, "epoch": 4938} {"train_loss": -26.855976104736328, "global_step": 409930, "epoch": 4938} {"train_loss": -26.8721923828125, "global_step": 409931, "epoch": 4938} {"train_loss": -26.655649185180664, "global_step": 409932, "epoch": 4938} {"train_loss": -26.734113693237305, "global_step": 409933, "epoch": 4938} {"train_loss": -26.9222354888916, "global_step": 409934, "epoch": 4938} {"train_loss": -26.8188419342041, "global_step": 409935, "epoch": 4938} {"train_loss": -26.65072176829878, "global_step": 409936, "epoch": 4938, "val_loss": 6364584.0} {"train_loss": -24.465782165527344, "global_step": 409937, "epoch": 4939} {"train_loss": -23.644775390625, "global_step": 409938, "epoch": 4939} {"train_loss": -23.09300994873047, "global_step": 409939, "epoch": 4939} {"train_loss": -24.522979736328125, "global_step": 409940, "epoch": 4939} {"train_loss": -24.461877822875977, "global_step": 409941, "epoch": 4939} {"train_loss": -24.456050872802734, "global_step": 409942, "epoch": 4939} {"train_loss": -24.033784866333008, "global_step": 409943, "epoch": 4939} {"train_loss": -24.52981948852539, "global_step": 409944, "epoch": 4939} {"train_loss": -25.190404891967773, "global_step": 409945, "epoch": 4939} {"train_loss": -24.65921974182129, "global_step": 409946, "epoch": 4939} {"train_loss": -25.592435836791992, "global_step": 409947, "epoch": 4939} {"train_loss": -24.9231014251709, "global_step": 409948, "epoch": 4939} {"train_loss": -25.412199020385742, "global_step": 409949, "epoch": 4939} {"train_loss": -25.71565818786621, "global_step": 409950, "epoch": 4939} {"train_loss": -25.210561752319336, "global_step": 409951, "epoch": 4939} {"train_loss": -25.40125274658203, "global_step": 409952, "epoch": 4939} {"train_loss": -25.47333335876465, "global_step": 409953, "epoch": 4939} {"train_loss": -25.644224166870117, "global_step": 409954, "epoch": 4939} {"train_loss": -26.099014282226562, "global_step": 409955, "epoch": 4939} {"train_loss": -25.69049644470215, "global_step": 409956, "epoch": 4939} {"train_loss": -25.911779403686523, "global_step": 409957, "epoch": 4939} {"train_loss": -25.576658248901367, "global_step": 409958, "epoch": 4939} {"train_loss": -25.822589874267578, "global_step": 409959, "epoch": 4939} {"train_loss": -26.00931167602539, "global_step": 409960, "epoch": 4939} {"train_loss": -25.696792602539062, "global_step": 409961, "epoch": 4939} {"train_loss": -26.38413429260254, "global_step": 409962, "epoch": 4939} {"train_loss": -25.997528076171875, "global_step": 409963, "epoch": 4939} {"train_loss": -26.379638671875, "global_step": 409964, "epoch": 4939} {"train_loss": -26.32649040222168, "global_step": 409965, "epoch": 4939} {"train_loss": -26.008771896362305, "global_step": 409966, "epoch": 4939} {"train_loss": -25.95423698425293, "global_step": 409967, "epoch": 4939} {"train_loss": -26.152179718017578, "global_step": 409968, "epoch": 4939} {"train_loss": -26.241376876831055, "global_step": 409969, "epoch": 4939} {"train_loss": -26.291141510009766, "global_step": 409970, "epoch": 4939} {"train_loss": -26.654401779174805, "global_step": 409971, "epoch": 4939} {"train_loss": -26.09444236755371, "global_step": 409972, "epoch": 4939} {"train_loss": -26.389572143554688, "global_step": 409973, "epoch": 4939} {"train_loss": -26.359130859375, "global_step": 409974, "epoch": 4939} {"train_loss": -26.3810977935791, "global_step": 409975, "epoch": 4939} {"train_loss": -26.464685440063477, "global_step": 409976, "epoch": 4939} {"train_loss": -26.528005599975586, "global_step": 409977, "epoch": 4939} {"train_loss": -25.9904842376709, "global_step": 409978, "epoch": 4939} {"train_loss": -26.747299194335938, "global_step": 409979, "epoch": 4939} {"train_loss": -26.74506950378418, "global_step": 409980, "epoch": 4939} {"train_loss": -26.270666122436523, "global_step": 409981, "epoch": 4939} {"train_loss": -26.523603439331055, "global_step": 409982, "epoch": 4939} {"train_loss": -26.811288833618164, "global_step": 409983, "epoch": 4939} {"train_loss": -26.550573348999023, "global_step": 409984, "epoch": 4939} {"train_loss": -26.31940269470215, "global_step": 409985, "epoch": 4939} {"train_loss": -26.539840698242188, "global_step": 409986, "epoch": 4939} {"train_loss": -26.43927574157715, "global_step": 409987, "epoch": 4939} {"train_loss": -26.547744750976562, "global_step": 409988, "epoch": 4939} {"train_loss": -26.544422149658203, "global_step": 409989, "epoch": 4939} {"train_loss": -26.831878662109375, "global_step": 409990, "epoch": 4939} {"train_loss": -26.72739028930664, "global_step": 409991, "epoch": 4939} {"train_loss": -26.72804069519043, "global_step": 409992, "epoch": 4939} {"train_loss": -26.815465927124023, "global_step": 409993, "epoch": 4939} {"train_loss": -27.107574462890625, "global_step": 409994, "epoch": 4939} {"train_loss": -26.400354385375977, "global_step": 409995, "epoch": 4939} {"train_loss": -26.397705078125, "global_step": 409996, "epoch": 4939} {"train_loss": -26.9605712890625, "global_step": 409997, "epoch": 4939} {"train_loss": -27.012481689453125, "global_step": 409998, "epoch": 4939} {"train_loss": -26.761947631835938, "global_step": 409999, "epoch": 4939} {"train_loss": -26.805561065673828, "global_step": 410000, "epoch": 4939} {"train_loss": -27.072355270385742, "global_step": 410001, "epoch": 4939} {"train_loss": -26.5700626373291, "global_step": 410002, "epoch": 4939} {"train_loss": -26.831159591674805, "global_step": 410003, "epoch": 4939} {"train_loss": -26.609607696533203, "global_step": 410004, "epoch": 4939} {"train_loss": -26.877180099487305, "global_step": 410005, "epoch": 4939} {"train_loss": -27.16480827331543, "global_step": 410006, "epoch": 4939} {"train_loss": -27.092208862304688, "global_step": 410007, "epoch": 4939} {"train_loss": -26.890888214111328, "global_step": 410008, "epoch": 4939} {"train_loss": -26.749801635742188, "global_step": 410009, "epoch": 4939} {"train_loss": -26.79697608947754, "global_step": 410010, "epoch": 4939} {"train_loss": -26.979291915893555, "global_step": 410011, "epoch": 4939} {"train_loss": -26.72210121154785, "global_step": 410012, "epoch": 4939} {"train_loss": -26.83919334411621, "global_step": 410013, "epoch": 4939} {"train_loss": -26.951526641845703, "global_step": 410014, "epoch": 4939} {"train_loss": -26.60737419128418, "global_step": 410015, "epoch": 4939} {"train_loss": -26.827621459960938, "global_step": 410016, "epoch": 4939} {"train_loss": -26.620908737182617, "global_step": 410017, "epoch": 4939} {"train_loss": -26.717504501342773, "global_step": 410018, "epoch": 4939} {"train_loss": -26.153540117194854, "global_step": 410019, "epoch": 4939, "val_loss": 6525286.5} {"train_loss": -26.48313331604004, "global_step": 410020, "epoch": 4940} {"train_loss": -25.983503341674805, "global_step": 410021, "epoch": 4940} {"train_loss": -26.053653717041016, "global_step": 410022, "epoch": 4940} {"train_loss": -26.255802154541016, "global_step": 410023, "epoch": 4940} {"train_loss": -25.417510986328125, "global_step": 410024, "epoch": 4940} {"train_loss": -25.46820640563965, "global_step": 410025, "epoch": 4940} {"train_loss": -26.126617431640625, "global_step": 410026, "epoch": 4940} {"train_loss": -25.733495712280273, "global_step": 410027, "epoch": 4940} {"train_loss": -26.305999755859375, "global_step": 410028, "epoch": 4940} {"train_loss": -26.1418514251709, "global_step": 410029, "epoch": 4940} {"train_loss": -25.780725479125977, "global_step": 410030, "epoch": 4940} {"train_loss": -26.200727462768555, "global_step": 410031, "epoch": 4940} {"train_loss": -26.072803497314453, "global_step": 410032, "epoch": 4940} {"train_loss": -26.174230575561523, "global_step": 410033, "epoch": 4940} {"train_loss": -26.327716827392578, "global_step": 410034, "epoch": 4940} {"train_loss": -26.562543869018555, "global_step": 410035, "epoch": 4940} {"train_loss": -26.560270309448242, "global_step": 410036, "epoch": 4940} {"train_loss": -26.41168785095215, "global_step": 410037, "epoch": 4940} {"train_loss": -26.507287979125977, "global_step": 410038, "epoch": 4940} {"train_loss": -26.375171661376953, "global_step": 410039, "epoch": 4940} {"train_loss": -26.33302116394043, "global_step": 410040, "epoch": 4940} {"train_loss": -26.429834365844727, "global_step": 410041, "epoch": 4940} {"train_loss": -26.2268009185791, "global_step": 410042, "epoch": 4940} {"train_loss": -26.430341720581055, "global_step": 410043, "epoch": 4940} {"train_loss": -26.44288444519043, "global_step": 410044, "epoch": 4940} {"train_loss": -26.45990562438965, "global_step": 410045, "epoch": 4940} {"train_loss": -26.602890014648438, "global_step": 410046, "epoch": 4940} {"train_loss": -26.600385665893555, "global_step": 410047, "epoch": 4940} {"train_loss": -27.228864669799805, "global_step": 410048, "epoch": 4940} {"train_loss": -26.59515380859375, "global_step": 410049, "epoch": 4940} {"train_loss": -26.7851619720459, "global_step": 410050, "epoch": 4940} {"train_loss": -26.777912139892578, "global_step": 410051, "epoch": 4940} {"train_loss": -26.5269718170166, "global_step": 410052, "epoch": 4940} {"train_loss": -26.93255615234375, "global_step": 410053, "epoch": 4940} {"train_loss": -26.847387313842773, "global_step": 410054, "epoch": 4940} {"train_loss": -26.832172393798828, "global_step": 410055, "epoch": 4940} {"train_loss": -26.628070831298828, "global_step": 410056, "epoch": 4940} {"train_loss": -26.534259796142578, "global_step": 410057, "epoch": 4940} {"train_loss": -26.5788516998291, "global_step": 410058, "epoch": 4940} {"train_loss": -26.646320343017578, "global_step": 410059, "epoch": 4940} {"train_loss": -26.791589736938477, "global_step": 410060, "epoch": 4940} {"train_loss": -27.01641273498535, "global_step": 410061, "epoch": 4940} {"train_loss": -26.78147315979004, "global_step": 410062, "epoch": 4940} {"train_loss": -27.276044845581055, "global_step": 410063, "epoch": 4940} {"train_loss": -26.992420196533203, "global_step": 410064, "epoch": 4940} {"train_loss": -26.739118576049805, "global_step": 410065, "epoch": 4940} {"train_loss": -26.8276424407959, "global_step": 410066, "epoch": 4940} {"train_loss": -26.984878540039062, "global_step": 410067, "epoch": 4940} {"train_loss": -26.7943115234375, "global_step": 410068, "epoch": 4940} {"train_loss": -26.78303337097168, "global_step": 410069, "epoch": 4940} {"train_loss": -27.019445419311523, "global_step": 410070, "epoch": 4940} {"train_loss": -26.79203224182129, "global_step": 410071, "epoch": 4940} {"train_loss": -26.4799861907959, "global_step": 410072, "epoch": 4940} {"train_loss": -26.0770206451416, "global_step": 410073, "epoch": 4940} {"train_loss": -27.060407638549805, "global_step": 410074, "epoch": 4940} {"train_loss": -26.457101821899414, "global_step": 410075, "epoch": 4940} {"train_loss": -27.156234741210938, "global_step": 410076, "epoch": 4940} {"train_loss": -26.67048454284668, "global_step": 410077, "epoch": 4940} {"train_loss": -26.621912002563477, "global_step": 410078, "epoch": 4940} {"train_loss": -26.889602661132812, "global_step": 410079, "epoch": 4940} {"train_loss": -26.8326416015625, "global_step": 410080, "epoch": 4940} {"train_loss": -26.902679443359375, "global_step": 410081, "epoch": 4940} {"train_loss": -26.628280639648438, "global_step": 410082, "epoch": 4940} {"train_loss": -26.683135986328125, "global_step": 410083, "epoch": 4940} {"train_loss": -26.6142635345459, "global_step": 410084, "epoch": 4940} {"train_loss": -26.3964786529541, "global_step": 410085, "epoch": 4940} {"train_loss": -26.983861923217773, "global_step": 410086, "epoch": 4940} {"train_loss": -26.56400489807129, "global_step": 410087, "epoch": 4940} {"train_loss": -26.677494049072266, "global_step": 410088, "epoch": 4940} {"train_loss": -26.761075973510742, "global_step": 410089, "epoch": 4940} {"train_loss": -26.659284591674805, "global_step": 410090, "epoch": 4940} {"train_loss": -26.517759323120117, "global_step": 410091, "epoch": 4940} {"train_loss": -26.666736602783203, "global_step": 410092, "epoch": 4940} {"train_loss": -26.868637084960938, "global_step": 410093, "epoch": 4940} {"train_loss": -26.76027488708496, "global_step": 410094, "epoch": 4940} {"train_loss": -26.7592716217041, "global_step": 410095, "epoch": 4940} {"train_loss": -26.5499210357666, "global_step": 410096, "epoch": 4940} {"train_loss": -26.805133819580078, "global_step": 410097, "epoch": 4940} {"train_loss": -26.384424209594727, "global_step": 410098, "epoch": 4940} {"train_loss": -26.579608917236328, "global_step": 410099, "epoch": 4940} {"train_loss": -26.62237548828125, "global_step": 410100, "epoch": 4940} {"train_loss": -26.50495719909668, "global_step": 410101, "epoch": 4940} {"train_loss": -26.552000321537616, "global_step": 410102, "epoch": 4940, "val_loss": 6527096.5} {"train_loss": -25.93902015686035, "global_step": 410103, "epoch": 4941} {"train_loss": -25.37516975402832, "global_step": 410104, "epoch": 4941} {"train_loss": -26.042373657226562, "global_step": 410105, "epoch": 4941} {"train_loss": -26.710723876953125, "global_step": 410106, "epoch": 4941} {"train_loss": -26.439529418945312, "global_step": 410107, "epoch": 4941} {"train_loss": -26.410083770751953, "global_step": 410108, "epoch": 4941} {"train_loss": -26.383106231689453, "global_step": 410109, "epoch": 4941} {"train_loss": -26.329345703125, "global_step": 410110, "epoch": 4941} {"train_loss": -26.302026748657227, "global_step": 410111, "epoch": 4941} {"train_loss": -26.412403106689453, "global_step": 410112, "epoch": 4941} {"train_loss": -26.119049072265625, "global_step": 410113, "epoch": 4941} {"train_loss": -26.6747989654541, "global_step": 410114, "epoch": 4941} {"train_loss": -26.370824813842773, "global_step": 410115, "epoch": 4941} {"train_loss": -26.163976669311523, "global_step": 410116, "epoch": 4941} {"train_loss": -26.470754623413086, "global_step": 410117, "epoch": 4941} {"train_loss": -26.402587890625, "global_step": 410118, "epoch": 4941} {"train_loss": -26.52057456970215, "global_step": 410119, "epoch": 4941} {"train_loss": -26.268213272094727, "global_step": 410120, "epoch": 4941} {"train_loss": -26.26531982421875, "global_step": 410121, "epoch": 4941} {"train_loss": -26.550024032592773, "global_step": 410122, "epoch": 4941} {"train_loss": -26.903921127319336, "global_step": 410123, "epoch": 4941} {"train_loss": -26.613361358642578, "global_step": 410124, "epoch": 4941} {"train_loss": -26.542285919189453, "global_step": 410125, "epoch": 4941} {"train_loss": -26.81793212890625, "global_step": 410126, "epoch": 4941} {"train_loss": -26.63140869140625, "global_step": 410127, "epoch": 4941} {"train_loss": -26.21698570251465, "global_step": 410128, "epoch": 4941} {"train_loss": -26.554834365844727, "global_step": 410129, "epoch": 4941} {"train_loss": -26.691320419311523, "global_step": 410130, "epoch": 4941} {"train_loss": -26.62310218811035, "global_step": 410131, "epoch": 4941} {"train_loss": -26.885786056518555, "global_step": 410132, "epoch": 4941} {"train_loss": -26.84432029724121, "global_step": 410133, "epoch": 4941} {"train_loss": -26.646081924438477, "global_step": 410134, "epoch": 4941} {"train_loss": -26.818119049072266, "global_step": 410135, "epoch": 4941} {"train_loss": -27.13736343383789, "global_step": 410136, "epoch": 4941} {"train_loss": -26.79456901550293, "global_step": 410137, "epoch": 4941} {"train_loss": -26.70875358581543, "global_step": 410138, "epoch": 4941} {"train_loss": -26.814294815063477, "global_step": 410139, "epoch": 4941} {"train_loss": -26.9575138092041, "global_step": 410140, "epoch": 4941} {"train_loss": -26.98125648498535, "global_step": 410141, "epoch": 4941} {"train_loss": -26.896520614624023, "global_step": 410142, "epoch": 4941} {"train_loss": -26.888334274291992, "global_step": 410143, "epoch": 4941} {"train_loss": -27.237302780151367, "global_step": 410144, "epoch": 4941} {"train_loss": -26.82004165649414, "global_step": 410145, "epoch": 4941} {"train_loss": -26.858625411987305, "global_step": 410146, "epoch": 4941} {"train_loss": -26.80841064453125, "global_step": 410147, "epoch": 4941} {"train_loss": -27.047489166259766, "global_step": 410148, "epoch": 4941} {"train_loss": -26.65650749206543, "global_step": 410149, "epoch": 4941} {"train_loss": -27.046289443969727, "global_step": 410150, "epoch": 4941} {"train_loss": -27.134876251220703, "global_step": 410151, "epoch": 4941} {"train_loss": -26.62647819519043, "global_step": 410152, "epoch": 4941} {"train_loss": -26.820178985595703, "global_step": 410153, "epoch": 4941} {"train_loss": -26.898426055908203, "global_step": 410154, "epoch": 4941} {"train_loss": -27.222198486328125, "global_step": 410155, "epoch": 4941} {"train_loss": -27.156896591186523, "global_step": 410156, "epoch": 4941} {"train_loss": -27.112781524658203, "global_step": 410157, "epoch": 4941} {"train_loss": -26.606473922729492, "global_step": 410158, "epoch": 4941} {"train_loss": -26.890485763549805, "global_step": 410159, "epoch": 4941} {"train_loss": -26.837427139282227, "global_step": 410160, "epoch": 4941} {"train_loss": -26.97528648376465, "global_step": 410161, "epoch": 4941} {"train_loss": -26.8045711517334, "global_step": 410162, "epoch": 4941} {"train_loss": -26.95884132385254, "global_step": 410163, "epoch": 4941} {"train_loss": -26.524831771850586, "global_step": 410164, "epoch": 4941} {"train_loss": -25.769254684448242, "global_step": 410165, "epoch": 4941} {"train_loss": -24.21546173095703, "global_step": 410166, "epoch": 4941} {"train_loss": -24.150110244750977, "global_step": 410167, "epoch": 4941} {"train_loss": -24.538320541381836, "global_step": 410168, "epoch": 4941} {"train_loss": -25.31777000427246, "global_step": 410169, "epoch": 4941} {"train_loss": -25.83609962463379, "global_step": 410170, "epoch": 4941} {"train_loss": -25.544965744018555, "global_step": 410171, "epoch": 4941} {"train_loss": -25.711872100830078, "global_step": 410172, "epoch": 4941} {"train_loss": -26.825719833374023, "global_step": 410173, "epoch": 4941} {"train_loss": -25.76728630065918, "global_step": 410174, "epoch": 4941} {"train_loss": -26.5399227142334, "global_step": 410175, "epoch": 4941} {"train_loss": -26.091266632080078, "global_step": 410176, "epoch": 4941} {"train_loss": -26.30132484436035, "global_step": 410177, "epoch": 4941} {"train_loss": -25.918333053588867, "global_step": 410178, "epoch": 4941} {"train_loss": -26.13262939453125, "global_step": 410179, "epoch": 4941} {"train_loss": -26.382007598876953, "global_step": 410180, "epoch": 4941} {"train_loss": -26.344648361206055, "global_step": 410181, "epoch": 4941} {"train_loss": -26.397796630859375, "global_step": 410182, "epoch": 4941} {"train_loss": -26.471982955932617, "global_step": 410183, "epoch": 4941} {"train_loss": -26.312936782836914, "global_step": 410184, "epoch": 4941} {"train_loss": -26.45284549299493, "global_step": 410185, "epoch": 4941, "val_loss": 6539818.0} {"train_loss": -26.3179874420166, "global_step": 410186, "epoch": 4942} {"train_loss": -26.164749145507812, "global_step": 410187, "epoch": 4942} {"train_loss": -26.707199096679688, "global_step": 410188, "epoch": 4942} {"train_loss": -25.9034366607666, "global_step": 410189, "epoch": 4942} {"train_loss": -26.111597061157227, "global_step": 410190, "epoch": 4942} {"train_loss": -26.43204689025879, "global_step": 410191, "epoch": 4942} {"train_loss": -26.56070899963379, "global_step": 410192, "epoch": 4942} {"train_loss": -26.275915145874023, "global_step": 410193, "epoch": 4942} {"train_loss": -26.261987686157227, "global_step": 410194, "epoch": 4942} {"train_loss": -26.2784423828125, "global_step": 410195, "epoch": 4942} {"train_loss": -26.403905868530273, "global_step": 410196, "epoch": 4942} {"train_loss": -26.565916061401367, "global_step": 410197, "epoch": 4942} {"train_loss": -26.671106338500977, "global_step": 410198, "epoch": 4942} {"train_loss": -26.587966918945312, "global_step": 410199, "epoch": 4942} {"train_loss": -26.656036376953125, "global_step": 410200, "epoch": 4942} {"train_loss": -26.411605834960938, "global_step": 410201, "epoch": 4942} {"train_loss": -26.81365394592285, "global_step": 410202, "epoch": 4942} {"train_loss": -26.290374755859375, "global_step": 410203, "epoch": 4942} {"train_loss": -26.461755752563477, "global_step": 410204, "epoch": 4942} {"train_loss": -26.445560455322266, "global_step": 410205, "epoch": 4942} {"train_loss": -26.162506103515625, "global_step": 410206, "epoch": 4942} {"train_loss": -26.859018325805664, "global_step": 410207, "epoch": 4942} {"train_loss": -26.44733238220215, "global_step": 410208, "epoch": 4942} {"train_loss": -26.166624069213867, "global_step": 410209, "epoch": 4942} {"train_loss": -26.759138107299805, "global_step": 410210, "epoch": 4942} {"train_loss": -26.482152938842773, "global_step": 410211, "epoch": 4942} {"train_loss": -26.5327205657959, "global_step": 410212, "epoch": 4942} {"train_loss": -26.624242782592773, "global_step": 410213, "epoch": 4942} {"train_loss": -26.544513702392578, "global_step": 410214, "epoch": 4942} {"train_loss": -26.925382614135742, "global_step": 410215, "epoch": 4942} {"train_loss": -26.65826988220215, "global_step": 410216, "epoch": 4942} {"train_loss": -26.783065795898438, "global_step": 410217, "epoch": 4942} {"train_loss": -26.452686309814453, "global_step": 410218, "epoch": 4942} {"train_loss": -26.69715690612793, "global_step": 410219, "epoch": 4942} {"train_loss": -26.393665313720703, "global_step": 410220, "epoch": 4942} {"train_loss": -26.448001861572266, "global_step": 410221, "epoch": 4942} {"train_loss": -26.993896484375, "global_step": 410222, "epoch": 4942} {"train_loss": -26.9478702545166, "global_step": 410223, "epoch": 4942} {"train_loss": -26.74458122253418, "global_step": 410224, "epoch": 4942} {"train_loss": -26.81874656677246, "global_step": 410225, "epoch": 4942} {"train_loss": -27.0030574798584, "global_step": 410226, "epoch": 4942} {"train_loss": -26.705114364624023, "global_step": 410227, "epoch": 4942} {"train_loss": -26.879003524780273, "global_step": 410228, "epoch": 4942} {"train_loss": -27.169586181640625, "global_step": 410229, "epoch": 4942} {"train_loss": -26.664478302001953, "global_step": 410230, "epoch": 4942} {"train_loss": -26.9554386138916, "global_step": 410231, "epoch": 4942} {"train_loss": -27.257970809936523, "global_step": 410232, "epoch": 4942} {"train_loss": -26.821264266967773, "global_step": 410233, "epoch": 4942} {"train_loss": -27.259628295898438, "global_step": 410234, "epoch": 4942} {"train_loss": -27.023351669311523, "global_step": 410235, "epoch": 4942} {"train_loss": -26.71561050415039, "global_step": 410236, "epoch": 4942} {"train_loss": -26.868879318237305, "global_step": 410237, "epoch": 4942} {"train_loss": -26.679967880249023, "global_step": 410238, "epoch": 4942} {"train_loss": -26.930694580078125, "global_step": 410239, "epoch": 4942} {"train_loss": -26.9112606048584, "global_step": 410240, "epoch": 4942} {"train_loss": -26.744495391845703, "global_step": 410241, "epoch": 4942} {"train_loss": -26.80097007751465, "global_step": 410242, "epoch": 4942} {"train_loss": -26.821807861328125, "global_step": 410243, "epoch": 4942} {"train_loss": -27.159765243530273, "global_step": 410244, "epoch": 4942} {"train_loss": -26.77009391784668, "global_step": 410245, "epoch": 4942} {"train_loss": -26.831024169921875, "global_step": 410246, "epoch": 4942} {"train_loss": -26.784753799438477, "global_step": 410247, "epoch": 4942} {"train_loss": -27.069730758666992, "global_step": 410248, "epoch": 4942} {"train_loss": -26.747650146484375, "global_step": 410249, "epoch": 4942} {"train_loss": -26.6005802154541, "global_step": 410250, "epoch": 4942} {"train_loss": -26.729206085205078, "global_step": 410251, "epoch": 4942} {"train_loss": -26.755338668823242, "global_step": 410252, "epoch": 4942} {"train_loss": -26.361743927001953, "global_step": 410253, "epoch": 4942} {"train_loss": -26.930280685424805, "global_step": 410254, "epoch": 4942} {"train_loss": -26.89573097229004, "global_step": 410255, "epoch": 4942} {"train_loss": -26.76997184753418, "global_step": 410256, "epoch": 4942} {"train_loss": -26.134048461914062, "global_step": 410257, "epoch": 4942} {"train_loss": -26.515888214111328, "global_step": 410258, "epoch": 4942} {"train_loss": -27.008075714111328, "global_step": 410259, "epoch": 4942} {"train_loss": -26.559003829956055, "global_step": 410260, "epoch": 4942} {"train_loss": -26.187543869018555, "global_step": 410261, "epoch": 4942} {"train_loss": -26.923370361328125, "global_step": 410262, "epoch": 4942} {"train_loss": -26.75733757019043, "global_step": 410263, "epoch": 4942} {"train_loss": -26.29495620727539, "global_step": 410264, "epoch": 4942} {"train_loss": -27.03948402404785, "global_step": 410265, "epoch": 4942} {"train_loss": -26.35286521911621, "global_step": 410266, "epoch": 4942} {"train_loss": -26.706079483032227, "global_step": 410267, "epoch": 4942} {"train_loss": -26.645318456442958, "global_step": 410268, "epoch": 4942, "val_loss": 6632044.5} {"train_loss": -25.34644317626953, "global_step": 410269, "epoch": 4943} {"train_loss": -26.143604278564453, "global_step": 410270, "epoch": 4943} {"train_loss": -26.1278133392334, "global_step": 410271, "epoch": 4943} {"train_loss": -25.38587760925293, "global_step": 410272, "epoch": 4943} {"train_loss": -26.15863609313965, "global_step": 410273, "epoch": 4943} {"train_loss": -25.707050323486328, "global_step": 410274, "epoch": 4943} {"train_loss": -26.4886474609375, "global_step": 410275, "epoch": 4943} {"train_loss": -25.822509765625, "global_step": 410276, "epoch": 4943} {"train_loss": -26.231103897094727, "global_step": 410277, "epoch": 4943} {"train_loss": -26.39299964904785, "global_step": 410278, "epoch": 4943} {"train_loss": -26.10055923461914, "global_step": 410279, "epoch": 4943} {"train_loss": -26.23390007019043, "global_step": 410280, "epoch": 4943} {"train_loss": -25.95550537109375, "global_step": 410281, "epoch": 4943} {"train_loss": -26.321088790893555, "global_step": 410282, "epoch": 4943} {"train_loss": -26.571592330932617, "global_step": 410283, "epoch": 4943} {"train_loss": -26.201074600219727, "global_step": 410284, "epoch": 4943} {"train_loss": -26.315418243408203, "global_step": 410285, "epoch": 4943} {"train_loss": -26.406579971313477, "global_step": 410286, "epoch": 4943} {"train_loss": -26.587818145751953, "global_step": 410287, "epoch": 4943} {"train_loss": -26.729711532592773, "global_step": 410288, "epoch": 4943} {"train_loss": -26.533039093017578, "global_step": 410289, "epoch": 4943} {"train_loss": -26.80476188659668, "global_step": 410290, "epoch": 4943} {"train_loss": -26.202234268188477, "global_step": 410291, "epoch": 4943} {"train_loss": -26.26495361328125, "global_step": 410292, "epoch": 4943} {"train_loss": -27.000324249267578, "global_step": 410293, "epoch": 4943} {"train_loss": -26.88177490234375, "global_step": 410294, "epoch": 4943} {"train_loss": -26.413726806640625, "global_step": 410295, "epoch": 4943} {"train_loss": -26.842798233032227, "global_step": 410296, "epoch": 4943} {"train_loss": -26.662189483642578, "global_step": 410297, "epoch": 4943} {"train_loss": -26.743545532226562, "global_step": 410298, "epoch": 4943} {"train_loss": -26.66556739807129, "global_step": 410299, "epoch": 4943} {"train_loss": -26.687143325805664, "global_step": 410300, "epoch": 4943} {"train_loss": -26.911840438842773, "global_step": 410301, "epoch": 4943} {"train_loss": -26.982160568237305, "global_step": 410302, "epoch": 4943} {"train_loss": -26.879287719726562, "global_step": 410303, "epoch": 4943} {"train_loss": -26.6148681640625, "global_step": 410304, "epoch": 4943} {"train_loss": -26.916046142578125, "global_step": 410305, "epoch": 4943} {"train_loss": -26.71670913696289, "global_step": 410306, "epoch": 4943} {"train_loss": -26.434030532836914, "global_step": 410307, "epoch": 4943} {"train_loss": -26.794172286987305, "global_step": 410308, "epoch": 4943} {"train_loss": -26.791528701782227, "global_step": 410309, "epoch": 4943} {"train_loss": -27.185758590698242, "global_step": 410310, "epoch": 4943} {"train_loss": -26.403867721557617, "global_step": 410311, "epoch": 4943} {"train_loss": -26.652502059936523, "global_step": 410312, "epoch": 4943} {"train_loss": -27.015640258789062, "global_step": 410313, "epoch": 4943} {"train_loss": -27.10541343688965, "global_step": 410314, "epoch": 4943} {"train_loss": -27.053892135620117, "global_step": 410315, "epoch": 4943} {"train_loss": -26.70918083190918, "global_step": 410316, "epoch": 4943} {"train_loss": -26.23736000061035, "global_step": 410317, "epoch": 4943} {"train_loss": -26.70244789123535, "global_step": 410318, "epoch": 4943} {"train_loss": -26.7551212310791, "global_step": 410319, "epoch": 4943} {"train_loss": -26.69776725769043, "global_step": 410320, "epoch": 4943} {"train_loss": -26.38465690612793, "global_step": 410321, "epoch": 4943} {"train_loss": -27.025171279907227, "global_step": 410322, "epoch": 4943} {"train_loss": -26.514617919921875, "global_step": 410323, "epoch": 4943} {"train_loss": -26.703943252563477, "global_step": 410324, "epoch": 4943} {"train_loss": -26.523664474487305, "global_step": 410325, "epoch": 4943} {"train_loss": -26.865537643432617, "global_step": 410326, "epoch": 4943} {"train_loss": -27.07215690612793, "global_step": 410327, "epoch": 4943} {"train_loss": -26.669492721557617, "global_step": 410328, "epoch": 4943} {"train_loss": -27.076568603515625, "global_step": 410329, "epoch": 4943} {"train_loss": -26.674850463867188, "global_step": 410330, "epoch": 4943} {"train_loss": -26.929113388061523, "global_step": 410331, "epoch": 4943} {"train_loss": -26.848596572875977, "global_step": 410332, "epoch": 4943} {"train_loss": -26.8638973236084, "global_step": 410333, "epoch": 4943} {"train_loss": -27.057279586791992, "global_step": 410334, "epoch": 4943} {"train_loss": -26.903778076171875, "global_step": 410335, "epoch": 4943} {"train_loss": -26.819061279296875, "global_step": 410336, "epoch": 4943} {"train_loss": -27.012502670288086, "global_step": 410337, "epoch": 4943} {"train_loss": -26.651208877563477, "global_step": 410338, "epoch": 4943} {"train_loss": -26.761077880859375, "global_step": 410339, "epoch": 4943} {"train_loss": -26.816516876220703, "global_step": 410340, "epoch": 4943} {"train_loss": -26.768686294555664, "global_step": 410341, "epoch": 4943} {"train_loss": -26.866159439086914, "global_step": 410342, "epoch": 4943} {"train_loss": -27.501358032226562, "global_step": 410343, "epoch": 4943} {"train_loss": -26.976232528686523, "global_step": 410344, "epoch": 4943} {"train_loss": -26.69950294494629, "global_step": 410345, "epoch": 4943} {"train_loss": -26.36572265625, "global_step": 410346, "epoch": 4943} {"train_loss": -26.90265464782715, "global_step": 410347, "epoch": 4943} {"train_loss": -26.83805274963379, "global_step": 410348, "epoch": 4943} {"train_loss": -26.704614639282227, "global_step": 410349, "epoch": 4943} {"train_loss": -26.417463302612305, "global_step": 410350, "epoch": 4943} {"train_loss": -26.618858176541615, "global_step": 410351, "epoch": 4943, "val_loss": 6525125.0} {"train_loss": -23.205265045166016, "global_step": 410352, "epoch": 4944} {"train_loss": -24.28131103515625, "global_step": 410353, "epoch": 4944} {"train_loss": -25.704069137573242, "global_step": 410354, "epoch": 4944} {"train_loss": -25.06528091430664, "global_step": 410355, "epoch": 4944} {"train_loss": -25.6624813079834, "global_step": 410356, "epoch": 4944} {"train_loss": -24.538711547851562, "global_step": 410357, "epoch": 4944} {"train_loss": -25.931238174438477, "global_step": 410358, "epoch": 4944} {"train_loss": -25.132078170776367, "global_step": 410359, "epoch": 4944} {"train_loss": -24.948604583740234, "global_step": 410360, "epoch": 4944} {"train_loss": -26.029870986938477, "global_step": 410361, "epoch": 4944} {"train_loss": -25.233116149902344, "global_step": 410362, "epoch": 4944} {"train_loss": -25.662494659423828, "global_step": 410363, "epoch": 4944} {"train_loss": -25.3709774017334, "global_step": 410364, "epoch": 4944} {"train_loss": -25.70979118347168, "global_step": 410365, "epoch": 4944} {"train_loss": -25.690052032470703, "global_step": 410366, "epoch": 4944} {"train_loss": -25.547264099121094, "global_step": 410367, "epoch": 4944} {"train_loss": -26.05425453186035, "global_step": 410368, "epoch": 4944} {"train_loss": -25.56020164489746, "global_step": 410369, "epoch": 4944} {"train_loss": -25.911197662353516, "global_step": 410370, "epoch": 4944} {"train_loss": -25.916263580322266, "global_step": 410371, "epoch": 4944} {"train_loss": -26.17009925842285, "global_step": 410372, "epoch": 4944} {"train_loss": -25.878156661987305, "global_step": 410373, "epoch": 4944} {"train_loss": -25.950153350830078, "global_step": 410374, "epoch": 4944} {"train_loss": -26.48089027404785, "global_step": 410375, "epoch": 4944} {"train_loss": -26.330244064331055, "global_step": 410376, "epoch": 4944} {"train_loss": -25.985855102539062, "global_step": 410377, "epoch": 4944} {"train_loss": -26.00014305114746, "global_step": 410378, "epoch": 4944} {"train_loss": -26.633441925048828, "global_step": 410379, "epoch": 4944} {"train_loss": -26.346532821655273, "global_step": 410380, "epoch": 4944} {"train_loss": -25.92145347595215, "global_step": 410381, "epoch": 4944} {"train_loss": -26.374744415283203, "global_step": 410382, "epoch": 4944} {"train_loss": -25.895360946655273, "global_step": 410383, "epoch": 4944} {"train_loss": -25.99834632873535, "global_step": 410384, "epoch": 4944} {"train_loss": -26.3520450592041, "global_step": 410385, "epoch": 4944} {"train_loss": -26.400806427001953, "global_step": 410386, "epoch": 4944} {"train_loss": -26.8580265045166, "global_step": 410387, "epoch": 4944} {"train_loss": -26.270898818969727, "global_step": 410388, "epoch": 4944} {"train_loss": -26.614465713500977, "global_step": 410389, "epoch": 4944} {"train_loss": -27.004119873046875, "global_step": 410390, "epoch": 4944} {"train_loss": -26.423980712890625, "global_step": 410391, "epoch": 4944} {"train_loss": -26.65793800354004, "global_step": 410392, "epoch": 4944} {"train_loss": -26.473392486572266, "global_step": 410393, "epoch": 4944} {"train_loss": -26.9036922454834, "global_step": 410394, "epoch": 4944} {"train_loss": -26.75998306274414, "global_step": 410395, "epoch": 4944} {"train_loss": -26.914093017578125, "global_step": 410396, "epoch": 4944} {"train_loss": -26.849897384643555, "global_step": 410397, "epoch": 4944} {"train_loss": -26.770288467407227, "global_step": 410398, "epoch": 4944} {"train_loss": -26.53623390197754, "global_step": 410399, "epoch": 4944} {"train_loss": -26.555866241455078, "global_step": 410400, "epoch": 4944} {"train_loss": -27.047317504882812, "global_step": 410401, "epoch": 4944} {"train_loss": -27.132726669311523, "global_step": 410402, "epoch": 4944} {"train_loss": -26.986337661743164, "global_step": 410403, "epoch": 4944} {"train_loss": -26.565200805664062, "global_step": 410404, "epoch": 4944} {"train_loss": -26.504724502563477, "global_step": 410405, "epoch": 4944} {"train_loss": -26.729272842407227, "global_step": 410406, "epoch": 4944} {"train_loss": -26.60233497619629, "global_step": 410407, "epoch": 4944} {"train_loss": -26.662580490112305, "global_step": 410408, "epoch": 4944} {"train_loss": -26.719411849975586, "global_step": 410409, "epoch": 4944} {"train_loss": -27.14436149597168, "global_step": 410410, "epoch": 4944} {"train_loss": -26.94685173034668, "global_step": 410411, "epoch": 4944} {"train_loss": -26.771011352539062, "global_step": 410412, "epoch": 4944} {"train_loss": -26.78753662109375, "global_step": 410413, "epoch": 4944} {"train_loss": -26.495849609375, "global_step": 410414, "epoch": 4944} {"train_loss": -26.942792892456055, "global_step": 410415, "epoch": 4944} {"train_loss": -26.933191299438477, "global_step": 410416, "epoch": 4944} {"train_loss": -26.808374404907227, "global_step": 410417, "epoch": 4944} {"train_loss": -26.73468589782715, "global_step": 410418, "epoch": 4944} {"train_loss": -26.810632705688477, "global_step": 410419, "epoch": 4944} {"train_loss": -26.666311264038086, "global_step": 410420, "epoch": 4944} {"train_loss": -26.977514266967773, "global_step": 410421, "epoch": 4944} {"train_loss": -26.719532012939453, "global_step": 410422, "epoch": 4944} {"train_loss": -26.81648063659668, "global_step": 410423, "epoch": 4944} {"train_loss": -26.484012603759766, "global_step": 410424, "epoch": 4944} {"train_loss": -27.10707664489746, "global_step": 410425, "epoch": 4944} {"train_loss": -26.693424224853516, "global_step": 410426, "epoch": 4944} {"train_loss": -26.62652015686035, "global_step": 410427, "epoch": 4944} {"train_loss": -26.907291412353516, "global_step": 410428, "epoch": 4944} {"train_loss": -26.6267032623291, "global_step": 410429, "epoch": 4944} {"train_loss": -26.7833309173584, "global_step": 410430, "epoch": 4944} {"train_loss": -26.891788482666016, "global_step": 410431, "epoch": 4944} {"train_loss": -26.97149085998535, "global_step": 410432, "epoch": 4944} {"train_loss": -26.93631362915039, "global_step": 410433, "epoch": 4944} {"train_loss": -26.33342359152185, "global_step": 410434, "epoch": 4944, "val_loss": 6518076.5} {"train_loss": -26.20099449157715, "global_step": 410435, "epoch": 4945} {"train_loss": -26.53144645690918, "global_step": 410436, "epoch": 4945} {"train_loss": -26.71044921875, "global_step": 410437, "epoch": 4945} {"train_loss": -26.7415828704834, "global_step": 410438, "epoch": 4945} {"train_loss": -26.215381622314453, "global_step": 410439, "epoch": 4945} {"train_loss": -26.507373809814453, "global_step": 410440, "epoch": 4945} {"train_loss": -25.912769317626953, "global_step": 410441, "epoch": 4945} {"train_loss": -26.80078125, "global_step": 410442, "epoch": 4945} {"train_loss": -26.54184913635254, "global_step": 410443, "epoch": 4945} {"train_loss": -26.85621452331543, "global_step": 410444, "epoch": 4945} {"train_loss": -26.265233993530273, "global_step": 410445, "epoch": 4945} {"train_loss": -26.796140670776367, "global_step": 410446, "epoch": 4945} {"train_loss": -26.61368179321289, "global_step": 410447, "epoch": 4945} {"train_loss": -27.08949089050293, "global_step": 410448, "epoch": 4945} {"train_loss": -26.742563247680664, "global_step": 410449, "epoch": 4945} {"train_loss": -26.422138214111328, "global_step": 410450, "epoch": 4945} {"train_loss": -26.053863525390625, "global_step": 410451, "epoch": 4945} {"train_loss": -26.51152992248535, "global_step": 410452, "epoch": 4945} {"train_loss": -26.640222549438477, "global_step": 410453, "epoch": 4945} {"train_loss": -26.714147567749023, "global_step": 410454, "epoch": 4945} {"train_loss": -26.738981246948242, "global_step": 410455, "epoch": 4945} {"train_loss": -26.69302749633789, "global_step": 410456, "epoch": 4945} {"train_loss": -26.242816925048828, "global_step": 410457, "epoch": 4945} {"train_loss": -26.551965713500977, "global_step": 410458, "epoch": 4945} {"train_loss": -27.001667022705078, "global_step": 410459, "epoch": 4945} {"train_loss": -26.600828170776367, "global_step": 410460, "epoch": 4945} {"train_loss": -26.2905330657959, "global_step": 410461, "epoch": 4945} {"train_loss": -26.4351749420166, "global_step": 410462, "epoch": 4945} {"train_loss": -26.988571166992188, "global_step": 410463, "epoch": 4945} {"train_loss": -27.303808212280273, "global_step": 410464, "epoch": 4945} {"train_loss": -26.500452041625977, "global_step": 410465, "epoch": 4945} {"train_loss": -26.64251708984375, "global_step": 410466, "epoch": 4945} {"train_loss": -26.339319229125977, "global_step": 410467, "epoch": 4945} {"train_loss": -26.849279403686523, "global_step": 410468, "epoch": 4945} {"train_loss": -26.786855697631836, "global_step": 410469, "epoch": 4945} {"train_loss": -26.60806655883789, "global_step": 410470, "epoch": 4945} {"train_loss": -26.177331924438477, "global_step": 410471, "epoch": 4945} {"train_loss": -26.513837814331055, "global_step": 410472, "epoch": 4945} {"train_loss": -26.943408966064453, "global_step": 410473, "epoch": 4945} {"train_loss": -26.496265411376953, "global_step": 410474, "epoch": 4945} {"train_loss": -26.58454704284668, "global_step": 410475, "epoch": 4945} {"train_loss": -27.018207550048828, "global_step": 410476, "epoch": 4945} {"train_loss": -26.699588775634766, "global_step": 410477, "epoch": 4945} {"train_loss": -26.865690231323242, "global_step": 410478, "epoch": 4945} {"train_loss": -26.246871948242188, "global_step": 410479, "epoch": 4945} {"train_loss": -27.023107528686523, "global_step": 410480, "epoch": 4945} {"train_loss": -26.8093204498291, "global_step": 410481, "epoch": 4945} {"train_loss": -26.270166397094727, "global_step": 410482, "epoch": 4945} {"train_loss": -26.453876495361328, "global_step": 410483, "epoch": 4945} {"train_loss": -26.6448974609375, "global_step": 410484, "epoch": 4945} {"train_loss": -25.906652450561523, "global_step": 410485, "epoch": 4945} {"train_loss": -26.417633056640625, "global_step": 410486, "epoch": 4945} {"train_loss": -27.0094051361084, "global_step": 410487, "epoch": 4945} {"train_loss": -26.532407760620117, "global_step": 410488, "epoch": 4945} {"train_loss": -26.25331687927246, "global_step": 410489, "epoch": 4945} {"train_loss": -26.5998592376709, "global_step": 410490, "epoch": 4945} {"train_loss": -26.935209274291992, "global_step": 410491, "epoch": 4945} {"train_loss": -26.6126708984375, "global_step": 410492, "epoch": 4945} {"train_loss": -26.253828048706055, "global_step": 410493, "epoch": 4945} {"train_loss": -26.568206787109375, "global_step": 410494, "epoch": 4945} {"train_loss": -26.84966468811035, "global_step": 410495, "epoch": 4945} {"train_loss": -26.93479347229004, "global_step": 410496, "epoch": 4945} {"train_loss": -26.456457138061523, "global_step": 410497, "epoch": 4945} {"train_loss": -26.642484664916992, "global_step": 410498, "epoch": 4945} {"train_loss": -26.672794342041016, "global_step": 410499, "epoch": 4945} {"train_loss": -26.969289779663086, "global_step": 410500, "epoch": 4945} {"train_loss": -26.563730239868164, "global_step": 410501, "epoch": 4945} {"train_loss": -26.75540542602539, "global_step": 410502, "epoch": 4945} {"train_loss": -26.72012710571289, "global_step": 410503, "epoch": 4945} {"train_loss": -26.56197166442871, "global_step": 410504, "epoch": 4945} {"train_loss": -26.9669246673584, "global_step": 410505, "epoch": 4945} {"train_loss": -26.747333526611328, "global_step": 410506, "epoch": 4945} {"train_loss": -26.6822566986084, "global_step": 410507, "epoch": 4945} {"train_loss": -26.575937271118164, "global_step": 410508, "epoch": 4945} {"train_loss": -26.76422119140625, "global_step": 410509, "epoch": 4945} {"train_loss": -26.865278244018555, "global_step": 410510, "epoch": 4945} {"train_loss": -26.674121856689453, "global_step": 410511, "epoch": 4945} {"train_loss": -27.044767379760742, "global_step": 410512, "epoch": 4945} {"train_loss": -26.64661979675293, "global_step": 410513, "epoch": 4945} {"train_loss": -26.656442642211914, "global_step": 410514, "epoch": 4945} {"train_loss": -26.888837814331055, "global_step": 410515, "epoch": 4945} {"train_loss": -26.80543327331543, "global_step": 410516, "epoch": 4945} {"train_loss": -26.615415228418556, "global_step": 410517, "epoch": 4945, "val_loss": 6508126.0} {"train_loss": -25.31081771850586, "global_step": 410518, "epoch": 4946} {"train_loss": -24.8815860748291, "global_step": 410519, "epoch": 4946} {"train_loss": -26.0335750579834, "global_step": 410520, "epoch": 4946} {"train_loss": -24.911762237548828, "global_step": 410521, "epoch": 4946} {"train_loss": -25.338361740112305, "global_step": 410522, "epoch": 4946} {"train_loss": -25.742660522460938, "global_step": 410523, "epoch": 4946} {"train_loss": -26.153812408447266, "global_step": 410524, "epoch": 4946} {"train_loss": -26.07391929626465, "global_step": 410525, "epoch": 4946} {"train_loss": -25.740375518798828, "global_step": 410526, "epoch": 4946} {"train_loss": -26.141122817993164, "global_step": 410527, "epoch": 4946} {"train_loss": -25.767724990844727, "global_step": 410528, "epoch": 4946} {"train_loss": -25.936445236206055, "global_step": 410529, "epoch": 4946} {"train_loss": -26.43564796447754, "global_step": 410530, "epoch": 4946} {"train_loss": -26.30396842956543, "global_step": 410531, "epoch": 4946} {"train_loss": -26.07935905456543, "global_step": 410532, "epoch": 4946} {"train_loss": -26.29083824157715, "global_step": 410533, "epoch": 4946} {"train_loss": -25.993576049804688, "global_step": 410534, "epoch": 4946} {"train_loss": -26.215383529663086, "global_step": 410535, "epoch": 4946} {"train_loss": -26.442123413085938, "global_step": 410536, "epoch": 4946} {"train_loss": -26.450754165649414, "global_step": 410537, "epoch": 4946} {"train_loss": -26.172657012939453, "global_step": 410538, "epoch": 4946} {"train_loss": -26.32218360900879, "global_step": 410539, "epoch": 4946} {"train_loss": -26.00774574279785, "global_step": 410540, "epoch": 4946} {"train_loss": -26.26816749572754, "global_step": 410541, "epoch": 4946} {"train_loss": -26.87354850769043, "global_step": 410542, "epoch": 4946} {"train_loss": -26.1341552734375, "global_step": 410543, "epoch": 4946} {"train_loss": -26.018585205078125, "global_step": 410544, "epoch": 4946} {"train_loss": -26.334375381469727, "global_step": 410545, "epoch": 4946} {"train_loss": -26.1474552154541, "global_step": 410546, "epoch": 4946} {"train_loss": -26.180944442749023, "global_step": 410547, "epoch": 4946} {"train_loss": -26.494287490844727, "global_step": 410548, "epoch": 4946} {"train_loss": -26.680463790893555, "global_step": 410549, "epoch": 4946} {"train_loss": -26.547922134399414, "global_step": 410550, "epoch": 4946} {"train_loss": -26.6132869720459, "global_step": 410551, "epoch": 4946} {"train_loss": -26.28851890563965, "global_step": 410552, "epoch": 4946} {"train_loss": -26.702756881713867, "global_step": 410553, "epoch": 4946} {"train_loss": -26.575448989868164, "global_step": 410554, "epoch": 4946} {"train_loss": -26.388233184814453, "global_step": 410555, "epoch": 4946} {"train_loss": -26.554187774658203, "global_step": 410556, "epoch": 4946} {"train_loss": -26.4279842376709, "global_step": 410557, "epoch": 4946} {"train_loss": -26.7965087890625, "global_step": 410558, "epoch": 4946} {"train_loss": -26.722314834594727, "global_step": 410559, "epoch": 4946} {"train_loss": -26.573450088500977, "global_step": 410560, "epoch": 4946} {"train_loss": -26.914264678955078, "global_step": 410561, "epoch": 4946} {"train_loss": -26.749059677124023, "global_step": 410562, "epoch": 4946} {"train_loss": -26.6289119720459, "global_step": 410563, "epoch": 4946} {"train_loss": -26.830127716064453, "global_step": 410564, "epoch": 4946} {"train_loss": -26.509597778320312, "global_step": 410565, "epoch": 4946} {"train_loss": -26.77350425720215, "global_step": 410566, "epoch": 4946} {"train_loss": -26.431629180908203, "global_step": 410567, "epoch": 4946} {"train_loss": -26.884769439697266, "global_step": 410568, "epoch": 4946} {"train_loss": -27.0443058013916, "global_step": 410569, "epoch": 4946} {"train_loss": -27.027921676635742, "global_step": 410570, "epoch": 4946} {"train_loss": -27.002622604370117, "global_step": 410571, "epoch": 4946} {"train_loss": -26.55732536315918, "global_step": 410572, "epoch": 4946} {"train_loss": -26.282012939453125, "global_step": 410573, "epoch": 4946} {"train_loss": -26.813962936401367, "global_step": 410574, "epoch": 4946} {"train_loss": -26.8238582611084, "global_step": 410575, "epoch": 4946} {"train_loss": -26.890546798706055, "global_step": 410576, "epoch": 4946} {"train_loss": -27.219125747680664, "global_step": 410577, "epoch": 4946} {"train_loss": -26.758712768554688, "global_step": 410578, "epoch": 4946} {"train_loss": -26.457136154174805, "global_step": 410579, "epoch": 4946} {"train_loss": -26.881759643554688, "global_step": 410580, "epoch": 4946} {"train_loss": -27.180225372314453, "global_step": 410581, "epoch": 4946} {"train_loss": -27.029447555541992, "global_step": 410582, "epoch": 4946} {"train_loss": -26.877134323120117, "global_step": 410583, "epoch": 4946} {"train_loss": -27.23782730102539, "global_step": 410584, "epoch": 4946} {"train_loss": -26.962738037109375, "global_step": 410585, "epoch": 4946} {"train_loss": -27.07830810546875, "global_step": 410586, "epoch": 4946} {"train_loss": -26.901601791381836, "global_step": 410587, "epoch": 4946} {"train_loss": -26.885953903198242, "global_step": 410588, "epoch": 4946} {"train_loss": -27.063434600830078, "global_step": 410589, "epoch": 4946} {"train_loss": -26.9730281829834, "global_step": 410590, "epoch": 4946} {"train_loss": -26.509912490844727, "global_step": 410591, "epoch": 4946} {"train_loss": -27.138578414916992, "global_step": 410592, "epoch": 4946} {"train_loss": -27.218786239624023, "global_step": 410593, "epoch": 4946} {"train_loss": -26.945295333862305, "global_step": 410594, "epoch": 4946} {"train_loss": -26.30447769165039, "global_step": 410595, "epoch": 4946} {"train_loss": -26.13051414489746, "global_step": 410596, "epoch": 4946} {"train_loss": -25.113515853881836, "global_step": 410597, "epoch": 4946} {"train_loss": -23.914344787597656, "global_step": 410598, "epoch": 4946} {"train_loss": -23.835418701171875, "global_step": 410599, "epoch": 4946} {"train_loss": -26.389483808034875, "global_step": 410600, "epoch": 4946, "val_loss": 6610649.0} {"train_loss": -20.832258224487305, "global_step": 410601, "epoch": 4947} {"train_loss": -22.703481674194336, "global_step": 410602, "epoch": 4947} {"train_loss": -24.60931396484375, "global_step": 410603, "epoch": 4947} {"train_loss": -22.914011001586914, "global_step": 410604, "epoch": 4947} {"train_loss": -24.01702880859375, "global_step": 410605, "epoch": 4947} {"train_loss": -24.94148063659668, "global_step": 410606, "epoch": 4947} {"train_loss": -24.48500633239746, "global_step": 410607, "epoch": 4947} {"train_loss": -24.99908447265625, "global_step": 410608, "epoch": 4947} {"train_loss": -24.403005599975586, "global_step": 410609, "epoch": 4947} {"train_loss": -24.884119033813477, "global_step": 410610, "epoch": 4947} {"train_loss": -25.111082077026367, "global_step": 410611, "epoch": 4947} {"train_loss": -24.868345260620117, "global_step": 410612, "epoch": 4947} {"train_loss": -24.97010040283203, "global_step": 410613, "epoch": 4947} {"train_loss": -25.141332626342773, "global_step": 410614, "epoch": 4947} {"train_loss": -25.16006851196289, "global_step": 410615, "epoch": 4947} {"train_loss": -25.1390323638916, "global_step": 410616, "epoch": 4947} {"train_loss": -25.256380081176758, "global_step": 410617, "epoch": 4947} {"train_loss": -25.46588706970215, "global_step": 410618, "epoch": 4947} {"train_loss": -25.435245513916016, "global_step": 410619, "epoch": 4947} {"train_loss": -25.452133178710938, "global_step": 410620, "epoch": 4947} {"train_loss": -25.272506713867188, "global_step": 410621, "epoch": 4947} {"train_loss": -25.7336368560791, "global_step": 410622, "epoch": 4947} {"train_loss": -25.52931022644043, "global_step": 410623, "epoch": 4947} {"train_loss": -25.440641403198242, "global_step": 410624, "epoch": 4947} {"train_loss": -25.7593936920166, "global_step": 410625, "epoch": 4947} {"train_loss": -25.98171043395996, "global_step": 410626, "epoch": 4947} {"train_loss": -25.720661163330078, "global_step": 410627, "epoch": 4947} {"train_loss": -25.653696060180664, "global_step": 410628, "epoch": 4947} {"train_loss": -26.255573272705078, "global_step": 410629, "epoch": 4947} {"train_loss": -26.129358291625977, "global_step": 410630, "epoch": 4947} {"train_loss": -26.291345596313477, "global_step": 410631, "epoch": 4947} {"train_loss": -26.3469181060791, "global_step": 410632, "epoch": 4947} {"train_loss": -26.424726486206055, "global_step": 410633, "epoch": 4947} {"train_loss": -26.506885528564453, "global_step": 410634, "epoch": 4947} {"train_loss": -25.97772216796875, "global_step": 410635, "epoch": 4947} {"train_loss": -26.199100494384766, "global_step": 410636, "epoch": 4947} {"train_loss": -26.48097038269043, "global_step": 410637, "epoch": 4947} {"train_loss": -26.160221099853516, "global_step": 410638, "epoch": 4947} {"train_loss": -26.440479278564453, "global_step": 410639, "epoch": 4947} {"train_loss": -25.9946231842041, "global_step": 410640, "epoch": 4947} {"train_loss": -26.44439697265625, "global_step": 410641, "epoch": 4947} {"train_loss": -26.36969566345215, "global_step": 410642, "epoch": 4947} {"train_loss": -26.559955596923828, "global_step": 410643, "epoch": 4947} {"train_loss": -26.126508712768555, "global_step": 410644, "epoch": 4947} {"train_loss": -26.773115158081055, "global_step": 410645, "epoch": 4947} {"train_loss": -26.54903221130371, "global_step": 410646, "epoch": 4947} {"train_loss": -26.383758544921875, "global_step": 410647, "epoch": 4947} {"train_loss": -26.133520126342773, "global_step": 410648, "epoch": 4947} {"train_loss": -26.6583251953125, "global_step": 410649, "epoch": 4947} {"train_loss": -25.975208282470703, "global_step": 410650, "epoch": 4947} {"train_loss": -26.42219352722168, "global_step": 410651, "epoch": 4947} {"train_loss": -26.553495407104492, "global_step": 410652, "epoch": 4947} {"train_loss": -26.56245231628418, "global_step": 410653, "epoch": 4947} {"train_loss": -26.724639892578125, "global_step": 410654, "epoch": 4947} {"train_loss": -26.632741928100586, "global_step": 410655, "epoch": 4947} {"train_loss": -26.60700035095215, "global_step": 410656, "epoch": 4947} {"train_loss": -26.56023597717285, "global_step": 410657, "epoch": 4947} {"train_loss": -26.68153190612793, "global_step": 410658, "epoch": 4947} {"train_loss": -26.714780807495117, "global_step": 410659, "epoch": 4947} {"train_loss": -26.52115821838379, "global_step": 410660, "epoch": 4947} {"train_loss": -26.633380889892578, "global_step": 410661, "epoch": 4947} {"train_loss": -26.532093048095703, "global_step": 410662, "epoch": 4947} {"train_loss": -26.74313735961914, "global_step": 410663, "epoch": 4947} {"train_loss": -26.83534049987793, "global_step": 410664, "epoch": 4947} {"train_loss": -26.903905868530273, "global_step": 410665, "epoch": 4947} {"train_loss": -27.057538986206055, "global_step": 410666, "epoch": 4947} {"train_loss": -26.832746505737305, "global_step": 410667, "epoch": 4947} {"train_loss": -26.76666831970215, "global_step": 410668, "epoch": 4947} {"train_loss": -26.8712215423584, "global_step": 410669, "epoch": 4947} {"train_loss": -26.917383193969727, "global_step": 410670, "epoch": 4947} {"train_loss": -26.720184326171875, "global_step": 410671, "epoch": 4947} {"train_loss": -27.04890251159668, "global_step": 410672, "epoch": 4947} {"train_loss": -27.042083740234375, "global_step": 410673, "epoch": 4947} {"train_loss": -27.0400390625, "global_step": 410674, "epoch": 4947} {"train_loss": -26.818058013916016, "global_step": 410675, "epoch": 4947} {"train_loss": -26.861555099487305, "global_step": 410676, "epoch": 4947} {"train_loss": -26.71527671813965, "global_step": 410677, "epoch": 4947} {"train_loss": -27.137975692749023, "global_step": 410678, "epoch": 4947} {"train_loss": -26.7277889251709, "global_step": 410679, "epoch": 4947} {"train_loss": -26.605127334594727, "global_step": 410680, "epoch": 4947} {"train_loss": -26.551000595092773, "global_step": 410681, "epoch": 4947} {"train_loss": -26.72332191467285, "global_step": 410682, "epoch": 4947} {"train_loss": -25.994651518672345, "global_step": 410683, "epoch": 4947, "val_loss": 6566475.5} {"train_loss": -26.604589462280273, "global_step": 410684, "epoch": 4948} {"train_loss": -26.13797950744629, "global_step": 410685, "epoch": 4948} {"train_loss": -26.35625648498535, "global_step": 410686, "epoch": 4948} {"train_loss": -26.487791061401367, "global_step": 410687, "epoch": 4948} {"train_loss": -26.380956649780273, "global_step": 410688, "epoch": 4948} {"train_loss": -26.708887100219727, "global_step": 410689, "epoch": 4948} {"train_loss": -26.823728561401367, "global_step": 410690, "epoch": 4948} {"train_loss": -26.891271591186523, "global_step": 410691, "epoch": 4948} {"train_loss": -26.852386474609375, "global_step": 410692, "epoch": 4948} {"train_loss": -26.464008331298828, "global_step": 410693, "epoch": 4948} {"train_loss": -25.78962516784668, "global_step": 410694, "epoch": 4948} {"train_loss": -26.527069091796875, "global_step": 410695, "epoch": 4948} {"train_loss": -25.995222091674805, "global_step": 410696, "epoch": 4948} {"train_loss": -26.15894889831543, "global_step": 410697, "epoch": 4948} {"train_loss": -26.693801879882812, "global_step": 410698, "epoch": 4948} {"train_loss": -26.18243980407715, "global_step": 410699, "epoch": 4948} {"train_loss": -26.19938087463379, "global_step": 410700, "epoch": 4948} {"train_loss": -26.246475219726562, "global_step": 410701, "epoch": 4948} {"train_loss": -26.247833251953125, "global_step": 410702, "epoch": 4948} {"train_loss": -26.768075942993164, "global_step": 410703, "epoch": 4948} {"train_loss": -26.4052677154541, "global_step": 410704, "epoch": 4948} {"train_loss": -26.541662216186523, "global_step": 410705, "epoch": 4948} {"train_loss": -26.340839385986328, "global_step": 410706, "epoch": 4948} {"train_loss": -26.56976890563965, "global_step": 410707, "epoch": 4948} {"train_loss": -26.623632431030273, "global_step": 410708, "epoch": 4948} {"train_loss": -25.984830856323242, "global_step": 410709, "epoch": 4948} {"train_loss": -26.347156524658203, "global_step": 410710, "epoch": 4948} {"train_loss": -26.789630889892578, "global_step": 410711, "epoch": 4948} {"train_loss": -26.215030670166016, "global_step": 410712, "epoch": 4948} {"train_loss": -26.66773796081543, "global_step": 410713, "epoch": 4948} {"train_loss": -26.5086669921875, "global_step": 410714, "epoch": 4948} {"train_loss": -26.297582626342773, "global_step": 410715, "epoch": 4948} {"train_loss": -26.820871353149414, "global_step": 410716, "epoch": 4948} {"train_loss": -26.741987228393555, "global_step": 410717, "epoch": 4948} {"train_loss": -26.403268814086914, "global_step": 410718, "epoch": 4948} {"train_loss": -26.857751846313477, "global_step": 410719, "epoch": 4948} {"train_loss": -26.04286766052246, "global_step": 410720, "epoch": 4948} {"train_loss": -26.885669708251953, "global_step": 410721, "epoch": 4948} {"train_loss": -26.587329864501953, "global_step": 410722, "epoch": 4948} {"train_loss": -26.81109046936035, "global_step": 410723, "epoch": 4948} {"train_loss": -26.73491859436035, "global_step": 410724, "epoch": 4948} {"train_loss": -26.39139747619629, "global_step": 410725, "epoch": 4948} {"train_loss": -26.645063400268555, "global_step": 410726, "epoch": 4948} {"train_loss": -26.854755401611328, "global_step": 410727, "epoch": 4948} {"train_loss": -26.432071685791016, "global_step": 410728, "epoch": 4948} {"train_loss": -26.53264808654785, "global_step": 410729, "epoch": 4948} {"train_loss": -26.990976333618164, "global_step": 410730, "epoch": 4948} {"train_loss": -26.342065811157227, "global_step": 410731, "epoch": 4948} {"train_loss": -26.486555099487305, "global_step": 410732, "epoch": 4948} {"train_loss": -26.788888931274414, "global_step": 410733, "epoch": 4948} {"train_loss": -26.820524215698242, "global_step": 410734, "epoch": 4948} {"train_loss": -26.865201950073242, "global_step": 410735, "epoch": 4948} {"train_loss": -26.80213737487793, "global_step": 410736, "epoch": 4948} {"train_loss": -26.978015899658203, "global_step": 410737, "epoch": 4948} {"train_loss": -26.766849517822266, "global_step": 410738, "epoch": 4948} {"train_loss": -26.940597534179688, "global_step": 410739, "epoch": 4948} {"train_loss": -26.86054039001465, "global_step": 410740, "epoch": 4948} {"train_loss": -26.64301872253418, "global_step": 410741, "epoch": 4948} {"train_loss": -26.87360954284668, "global_step": 410742, "epoch": 4948} {"train_loss": -26.938846588134766, "global_step": 410743, "epoch": 4948} {"train_loss": -26.58961296081543, "global_step": 410744, "epoch": 4948} {"train_loss": -27.28679847717285, "global_step": 410745, "epoch": 4948} {"train_loss": -27.007465362548828, "global_step": 410746, "epoch": 4948} {"train_loss": -26.534826278686523, "global_step": 410747, "epoch": 4948} {"train_loss": -26.8287353515625, "global_step": 410748, "epoch": 4948} {"train_loss": -26.62725257873535, "global_step": 410749, "epoch": 4948} {"train_loss": -26.40851402282715, "global_step": 410750, "epoch": 4948} {"train_loss": -26.855833053588867, "global_step": 410751, "epoch": 4948} {"train_loss": -26.662805557250977, "global_step": 410752, "epoch": 4948} {"train_loss": -26.802032470703125, "global_step": 410753, "epoch": 4948} {"train_loss": -27.02524185180664, "global_step": 410754, "epoch": 4948} {"train_loss": -26.79224967956543, "global_step": 410755, "epoch": 4948} {"train_loss": -27.074569702148438, "global_step": 410756, "epoch": 4948} {"train_loss": -26.68701171875, "global_step": 410757, "epoch": 4948} {"train_loss": -26.51972770690918, "global_step": 410758, "epoch": 4948} {"train_loss": -26.456485748291016, "global_step": 410759, "epoch": 4948} {"train_loss": -26.860137939453125, "global_step": 410760, "epoch": 4948} {"train_loss": -26.81843376159668, "global_step": 410761, "epoch": 4948} {"train_loss": -26.90106201171875, "global_step": 410762, "epoch": 4948} {"train_loss": -26.959997177124023, "global_step": 410763, "epoch": 4948} {"train_loss": -26.6657772064209, "global_step": 410764, "epoch": 4948} {"train_loss": -27.0575008392334, "global_step": 410765, "epoch": 4948} {"train_loss": -26.634249859545605, "global_step": 410766, "epoch": 4948, "val_loss": 6600968.0} {"train_loss": -25.51792335510254, "global_step": 410767, "epoch": 4949} {"train_loss": -25.926305770874023, "global_step": 410768, "epoch": 4949} {"train_loss": -25.921472549438477, "global_step": 410769, "epoch": 4949} {"train_loss": -26.07720947265625, "global_step": 410770, "epoch": 4949} {"train_loss": -25.69060707092285, "global_step": 410771, "epoch": 4949} {"train_loss": -25.979833602905273, "global_step": 410772, "epoch": 4949} {"train_loss": -26.350866317749023, "global_step": 410773, "epoch": 4949} {"train_loss": -26.18720817565918, "global_step": 410774, "epoch": 4949} {"train_loss": -26.30792236328125, "global_step": 410775, "epoch": 4949} {"train_loss": -26.9506778717041, "global_step": 410776, "epoch": 4949} {"train_loss": -26.442285537719727, "global_step": 410777, "epoch": 4949} {"train_loss": -26.43837547302246, "global_step": 410778, "epoch": 4949} {"train_loss": -26.523813247680664, "global_step": 410779, "epoch": 4949} {"train_loss": -26.384933471679688, "global_step": 410780, "epoch": 4949} {"train_loss": -26.875080108642578, "global_step": 410781, "epoch": 4949} {"train_loss": -26.669605255126953, "global_step": 410782, "epoch": 4949} {"train_loss": -26.748762130737305, "global_step": 410783, "epoch": 4949} {"train_loss": -26.678800582885742, "global_step": 410784, "epoch": 4949} {"train_loss": -26.547561645507812, "global_step": 410785, "epoch": 4949} {"train_loss": -27.144540786743164, "global_step": 410786, "epoch": 4949} {"train_loss": -26.91621208190918, "global_step": 410787, "epoch": 4949} {"train_loss": -26.64866065979004, "global_step": 410788, "epoch": 4949} {"train_loss": -26.7210750579834, "global_step": 410789, "epoch": 4949} {"train_loss": -26.73007583618164, "global_step": 410790, "epoch": 4949} {"train_loss": -26.9721736907959, "global_step": 410791, "epoch": 4949} {"train_loss": -26.787033081054688, "global_step": 410792, "epoch": 4949} {"train_loss": -26.59685707092285, "global_step": 410793, "epoch": 4949} {"train_loss": -26.955358505249023, "global_step": 410794, "epoch": 4949} {"train_loss": -26.679977416992188, "global_step": 410795, "epoch": 4949} {"train_loss": -26.490930557250977, "global_step": 410796, "epoch": 4949} {"train_loss": -27.02176856994629, "global_step": 410797, "epoch": 4949} {"train_loss": -26.826154708862305, "global_step": 410798, "epoch": 4949} {"train_loss": -26.987531661987305, "global_step": 410799, "epoch": 4949} {"train_loss": -26.51435661315918, "global_step": 410800, "epoch": 4949} {"train_loss": -26.727994918823242, "global_step": 410801, "epoch": 4949} {"train_loss": -26.593250274658203, "global_step": 410802, "epoch": 4949} {"train_loss": -26.834369659423828, "global_step": 410803, "epoch": 4949} {"train_loss": -26.84162712097168, "global_step": 410804, "epoch": 4949} {"train_loss": -26.855138778686523, "global_step": 410805, "epoch": 4949} {"train_loss": -27.061315536499023, "global_step": 410806, "epoch": 4949} {"train_loss": -26.15673828125, "global_step": 410807, "epoch": 4949} {"train_loss": -26.256423950195312, "global_step": 410808, "epoch": 4949} {"train_loss": -26.800872802734375, "global_step": 410809, "epoch": 4949} {"train_loss": -26.840545654296875, "global_step": 410810, "epoch": 4949} {"train_loss": -26.616849899291992, "global_step": 410811, "epoch": 4949} {"train_loss": -27.158206939697266, "global_step": 410812, "epoch": 4949} {"train_loss": -27.002832412719727, "global_step": 410813, "epoch": 4949} {"train_loss": -26.813800811767578, "global_step": 410814, "epoch": 4949} {"train_loss": -26.8673038482666, "global_step": 410815, "epoch": 4949} {"train_loss": -26.895811080932617, "global_step": 410816, "epoch": 4949} {"train_loss": -26.7698917388916, "global_step": 410817, "epoch": 4949} {"train_loss": -26.731855392456055, "global_step": 410818, "epoch": 4949} {"train_loss": -26.92848777770996, "global_step": 410819, "epoch": 4949} {"train_loss": -27.04203224182129, "global_step": 410820, "epoch": 4949} {"train_loss": -27.348941802978516, "global_step": 410821, "epoch": 4949} {"train_loss": -26.58379554748535, "global_step": 410822, "epoch": 4949} {"train_loss": -26.972497940063477, "global_step": 410823, "epoch": 4949} {"train_loss": -27.2576961517334, "global_step": 410824, "epoch": 4949} {"train_loss": -26.64923095703125, "global_step": 410825, "epoch": 4949} {"train_loss": -27.028034210205078, "global_step": 410826, "epoch": 4949} {"train_loss": -27.136938095092773, "global_step": 410827, "epoch": 4949} {"train_loss": -26.8836669921875, "global_step": 410828, "epoch": 4949} {"train_loss": -27.191593170166016, "global_step": 410829, "epoch": 4949} {"train_loss": -26.76418113708496, "global_step": 410830, "epoch": 4949} {"train_loss": -26.749725341796875, "global_step": 410831, "epoch": 4949} {"train_loss": -26.910348892211914, "global_step": 410832, "epoch": 4949} {"train_loss": -26.848676681518555, "global_step": 410833, "epoch": 4949} {"train_loss": -26.5693416595459, "global_step": 410834, "epoch": 4949} {"train_loss": -26.610437393188477, "global_step": 410835, "epoch": 4949} {"train_loss": -26.52082633972168, "global_step": 410836, "epoch": 4949} {"train_loss": -25.917688369750977, "global_step": 410837, "epoch": 4949} {"train_loss": -26.5729923248291, "global_step": 410838, "epoch": 4949} {"train_loss": -26.35498046875, "global_step": 410839, "epoch": 4949} {"train_loss": -25.672443389892578, "global_step": 410840, "epoch": 4949} {"train_loss": -25.578636169433594, "global_step": 410841, "epoch": 4949} {"train_loss": -26.4823055267334, "global_step": 410842, "epoch": 4949} {"train_loss": -26.136188507080078, "global_step": 410843, "epoch": 4949} {"train_loss": -25.911352157592773, "global_step": 410844, "epoch": 4949} {"train_loss": -26.27911949157715, "global_step": 410845, "epoch": 4949} {"train_loss": -25.6284236907959, "global_step": 410846, "epoch": 4949} {"train_loss": -26.31085205078125, "global_step": 410847, "epoch": 4949} {"train_loss": -26.454395294189453, "global_step": 410848, "epoch": 4949} {"train_loss": -26.587358911353423, "global_step": 410849, "epoch": 4949, "val_loss": 6637640.0} {"train_loss": -25.2236385345459, "global_step": 410850, "epoch": 4950} {"train_loss": -25.020095825195312, "global_step": 410851, "epoch": 4950} {"train_loss": -24.704862594604492, "global_step": 410852, "epoch": 4950} {"train_loss": -26.046300888061523, "global_step": 410853, "epoch": 4950} {"train_loss": -24.902036666870117, "global_step": 410854, "epoch": 4950} {"train_loss": -25.10782814025879, "global_step": 410855, "epoch": 4950} {"train_loss": -25.57023048400879, "global_step": 410856, "epoch": 4950} {"train_loss": -25.789533615112305, "global_step": 410857, "epoch": 4950} {"train_loss": -25.6319637298584, "global_step": 410858, "epoch": 4950} {"train_loss": -25.837305068969727, "global_step": 410859, "epoch": 4950} {"train_loss": -25.90046501159668, "global_step": 410860, "epoch": 4950} {"train_loss": -25.703317642211914, "global_step": 410861, "epoch": 4950} {"train_loss": -25.891504287719727, "global_step": 410862, "epoch": 4950} {"train_loss": -25.512983322143555, "global_step": 410863, "epoch": 4950} {"train_loss": -26.287092208862305, "global_step": 410864, "epoch": 4950} {"train_loss": -25.86809730529785, "global_step": 410865, "epoch": 4950} {"train_loss": -26.107803344726562, "global_step": 410866, "epoch": 4950} {"train_loss": -26.35663414001465, "global_step": 410867, "epoch": 4950} {"train_loss": -26.228784561157227, "global_step": 410868, "epoch": 4950} {"train_loss": -26.17872428894043, "global_step": 410869, "epoch": 4950} {"train_loss": -26.154315948486328, "global_step": 410870, "epoch": 4950} {"train_loss": -26.42767333984375, "global_step": 410871, "epoch": 4950} {"train_loss": -26.269519805908203, "global_step": 410872, "epoch": 4950} {"train_loss": -26.357160568237305, "global_step": 410873, "epoch": 4950} {"train_loss": -26.18354606628418, "global_step": 410874, "epoch": 4950} {"train_loss": -26.364521026611328, "global_step": 410875, "epoch": 4950} {"train_loss": -26.77971839904785, "global_step": 410876, "epoch": 4950} {"train_loss": -26.7067813873291, "global_step": 410877, "epoch": 4950} {"train_loss": -26.501798629760742, "global_step": 410878, "epoch": 4950} {"train_loss": -26.141809463500977, "global_step": 410879, "epoch": 4950} {"train_loss": -26.4668025970459, "global_step": 410880, "epoch": 4950} {"train_loss": -26.704486846923828, "global_step": 410881, "epoch": 4950} {"train_loss": -26.373096466064453, "global_step": 410882, "epoch": 4950} {"train_loss": -26.575668334960938, "global_step": 410883, "epoch": 4950} {"train_loss": -26.70342445373535, "global_step": 410884, "epoch": 4950} {"train_loss": -26.656509399414062, "global_step": 410885, "epoch": 4950} {"train_loss": -26.683149337768555, "global_step": 410886, "epoch": 4950} {"train_loss": -25.86651611328125, "global_step": 410887, "epoch": 4950} {"train_loss": -26.609975814819336, "global_step": 410888, "epoch": 4950} {"train_loss": -26.76130485534668, "global_step": 410889, "epoch": 4950} {"train_loss": -26.723346710205078, "global_step": 410890, "epoch": 4950} {"train_loss": -26.8809814453125, "global_step": 410891, "epoch": 4950} {"train_loss": -26.66275405883789, "global_step": 410892, "epoch": 4950} {"train_loss": -26.824026107788086, "global_step": 410893, "epoch": 4950} {"train_loss": -26.738800048828125, "global_step": 410894, "epoch": 4950} {"train_loss": -26.780847549438477, "global_step": 410895, "epoch": 4950} {"train_loss": -26.7838134765625, "global_step": 410896, "epoch": 4950} {"train_loss": -26.532550811767578, "global_step": 410897, "epoch": 4950} {"train_loss": -26.771717071533203, "global_step": 410898, "epoch": 4950} {"train_loss": -26.878997802734375, "global_step": 410899, "epoch": 4950} {"train_loss": -26.528778076171875, "global_step": 410900, "epoch": 4950} {"train_loss": -26.9443359375, "global_step": 410901, "epoch": 4950} {"train_loss": -26.967086791992188, "global_step": 410902, "epoch": 4950} {"train_loss": -27.152490615844727, "global_step": 410903, "epoch": 4950} {"train_loss": -26.723974227905273, "global_step": 410904, "epoch": 4950} {"train_loss": -26.70252799987793, "global_step": 410905, "epoch": 4950} {"train_loss": -27.121109008789062, "global_step": 410906, "epoch": 4950} {"train_loss": -26.965208053588867, "global_step": 410907, "epoch": 4950} {"train_loss": -27.218358993530273, "global_step": 410908, "epoch": 4950} {"train_loss": -26.86211585998535, "global_step": 410909, "epoch": 4950} {"train_loss": -26.993621826171875, "global_step": 410910, "epoch": 4950} {"train_loss": -26.692411422729492, "global_step": 410911, "epoch": 4950} {"train_loss": -27.1124267578125, "global_step": 410912, "epoch": 4950} {"train_loss": -26.69209098815918, "global_step": 410913, "epoch": 4950} {"train_loss": -27.086780548095703, "global_step": 410914, "epoch": 4950} {"train_loss": -27.230167388916016, "global_step": 410915, "epoch": 4950} {"train_loss": -26.745487213134766, "global_step": 410916, "epoch": 4950} {"train_loss": -26.634326934814453, "global_step": 410917, "epoch": 4950} {"train_loss": -26.995197296142578, "global_step": 410918, "epoch": 4950} {"train_loss": -26.797338485717773, "global_step": 410919, "epoch": 4950} {"train_loss": -26.433399200439453, "global_step": 410920, "epoch": 4950} {"train_loss": -26.717548370361328, "global_step": 410921, "epoch": 4950} {"train_loss": -26.61298942565918, "global_step": 410922, "epoch": 4950} {"train_loss": -26.710493087768555, "global_step": 410923, "epoch": 4950} {"train_loss": -26.146142959594727, "global_step": 410924, "epoch": 4950} {"train_loss": -27.048078536987305, "global_step": 410925, "epoch": 4950} {"train_loss": -26.508432388305664, "global_step": 410926, "epoch": 4950} {"train_loss": -26.292682647705078, "global_step": 410927, "epoch": 4950} {"train_loss": -26.973529815673828, "global_step": 410928, "epoch": 4950} {"train_loss": -26.286970138549805, "global_step": 410929, "epoch": 4950} {"train_loss": -26.531147003173828, "global_step": 410930, "epoch": 4950} {"train_loss": -26.636077880859375, "global_step": 410931, "epoch": 4950} {"train_loss": -26.42830965892378, "global_step": 410932, "epoch": 4950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8181818181818182, "val_loss": 6624821.0} {"train_loss": -26.33112907409668, "global_step": 410933, "epoch": 4951} {"train_loss": -26.711469650268555, "global_step": 410934, "epoch": 4951} {"train_loss": -25.98866081237793, "global_step": 410935, "epoch": 4951} {"train_loss": -26.095930099487305, "global_step": 410936, "epoch": 4951} {"train_loss": -25.998132705688477, "global_step": 410937, "epoch": 4951} {"train_loss": -26.10561180114746, "global_step": 410938, "epoch": 4951} {"train_loss": -26.41010856628418, "global_step": 410939, "epoch": 4951} {"train_loss": -26.13998794555664, "global_step": 410940, "epoch": 4951} {"train_loss": -26.659948348999023, "global_step": 410941, "epoch": 4951} {"train_loss": -26.2911376953125, "global_step": 410942, "epoch": 4951} {"train_loss": -26.36297607421875, "global_step": 410943, "epoch": 4951} {"train_loss": -26.249984741210938, "global_step": 410944, "epoch": 4951} {"train_loss": -25.6522274017334, "global_step": 410945, "epoch": 4951} {"train_loss": -25.92987060546875, "global_step": 410946, "epoch": 4951} {"train_loss": -25.953283309936523, "global_step": 410947, "epoch": 4951} {"train_loss": -26.822895050048828, "global_step": 410948, "epoch": 4951} {"train_loss": -26.14509391784668, "global_step": 410949, "epoch": 4951} {"train_loss": -26.318878173828125, "global_step": 410950, "epoch": 4951} {"train_loss": -26.674121856689453, "global_step": 410951, "epoch": 4951} {"train_loss": -26.11793327331543, "global_step": 410952, "epoch": 4951} {"train_loss": -26.311450958251953, "global_step": 410953, "epoch": 4951} {"train_loss": -26.408597946166992, "global_step": 410954, "epoch": 4951} {"train_loss": -26.16659927368164, "global_step": 410955, "epoch": 4951} {"train_loss": -26.37766456604004, "global_step": 410956, "epoch": 4951} {"train_loss": -26.019906997680664, "global_step": 410957, "epoch": 4951} {"train_loss": -26.816213607788086, "global_step": 410958, "epoch": 4951} {"train_loss": -26.551239013671875, "global_step": 410959, "epoch": 4951} {"train_loss": -26.403888702392578, "global_step": 410960, "epoch": 4951} {"train_loss": -26.279905319213867, "global_step": 410961, "epoch": 4951} {"train_loss": -26.205402374267578, "global_step": 410962, "epoch": 4951} {"train_loss": -26.899494171142578, "global_step": 410963, "epoch": 4951} {"train_loss": -26.42128562927246, "global_step": 410964, "epoch": 4951} {"train_loss": -26.628055572509766, "global_step": 410965, "epoch": 4951} {"train_loss": -26.718534469604492, "global_step": 410966, "epoch": 4951} {"train_loss": -26.890228271484375, "global_step": 410967, "epoch": 4951} {"train_loss": -26.188451766967773, "global_step": 410968, "epoch": 4951} {"train_loss": -26.778478622436523, "global_step": 410969, "epoch": 4951} {"train_loss": -26.621768951416016, "global_step": 410970, "epoch": 4951} {"train_loss": -26.6579532623291, "global_step": 410971, "epoch": 4951} {"train_loss": -26.817462921142578, "global_step": 410972, "epoch": 4951} {"train_loss": -26.851972579956055, "global_step": 410973, "epoch": 4951} {"train_loss": -27.236557006835938, "global_step": 410974, "epoch": 4951} {"train_loss": -26.529834747314453, "global_step": 410975, "epoch": 4951} {"train_loss": -26.9644832611084, "global_step": 410976, "epoch": 4951} {"train_loss": -27.116607666015625, "global_step": 410977, "epoch": 4951} {"train_loss": -27.027877807617188, "global_step": 410978, "epoch": 4951} {"train_loss": -26.87196159362793, "global_step": 410979, "epoch": 4951} {"train_loss": -26.682104110717773, "global_step": 410980, "epoch": 4951} {"train_loss": -26.88077735900879, "global_step": 410981, "epoch": 4951} {"train_loss": -26.780603408813477, "global_step": 410982, "epoch": 4951} {"train_loss": -26.9332332611084, "global_step": 410983, "epoch": 4951} {"train_loss": -26.449716567993164, "global_step": 410984, "epoch": 4951} {"train_loss": -26.909744262695312, "global_step": 410985, "epoch": 4951} {"train_loss": -26.496850967407227, "global_step": 410986, "epoch": 4951} {"train_loss": -26.79192543029785, "global_step": 410987, "epoch": 4951} {"train_loss": -26.72218132019043, "global_step": 410988, "epoch": 4951} {"train_loss": -26.908246994018555, "global_step": 410989, "epoch": 4951} {"train_loss": -26.888931274414062, "global_step": 410990, "epoch": 4951} {"train_loss": -26.9003963470459, "global_step": 410991, "epoch": 4951} {"train_loss": -27.20429801940918, "global_step": 410992, "epoch": 4951} {"train_loss": -26.93511390686035, "global_step": 410993, "epoch": 4951} {"train_loss": -27.006744384765625, "global_step": 410994, "epoch": 4951} {"train_loss": -26.873798370361328, "global_step": 410995, "epoch": 4951} {"train_loss": -27.32710838317871, "global_step": 410996, "epoch": 4951} {"train_loss": -26.973779678344727, "global_step": 410997, "epoch": 4951} {"train_loss": -26.71038246154785, "global_step": 410998, "epoch": 4951} {"train_loss": -26.362302780151367, "global_step": 410999, "epoch": 4951} {"train_loss": -25.952646255493164, "global_step": 411000, "epoch": 4951} {"train_loss": -25.959354400634766, "global_step": 411001, "epoch": 4951} {"train_loss": -26.495803833007812, "global_step": 411002, "epoch": 4951} {"train_loss": -26.54157066345215, "global_step": 411003, "epoch": 4951} {"train_loss": -26.19350242614746, "global_step": 411004, "epoch": 4951} {"train_loss": -26.49521255493164, "global_step": 411005, "epoch": 4951} {"train_loss": -26.86713981628418, "global_step": 411006, "epoch": 4951} {"train_loss": -26.68865394592285, "global_step": 411007, "epoch": 4951} {"train_loss": -26.71400260925293, "global_step": 411008, "epoch": 4951} {"train_loss": -26.377552032470703, "global_step": 411009, "epoch": 4951} {"train_loss": -26.667999267578125, "global_step": 411010, "epoch": 4951} {"train_loss": -26.453845977783203, "global_step": 411011, "epoch": 4951} {"train_loss": -26.326019287109375, "global_step": 411012, "epoch": 4951} {"train_loss": -26.606786727905273, "global_step": 411013, "epoch": 4951} {"train_loss": -26.525922775268555, "global_step": 411014, "epoch": 4951} {"train_loss": -26.552141304475715, "global_step": 411015, "epoch": 4951, "val_loss": 6542195.0} {"train_loss": -25.969039916992188, "global_step": 411016, "epoch": 4952} {"train_loss": -26.458209991455078, "global_step": 411017, "epoch": 4952} {"train_loss": -26.58609390258789, "global_step": 411018, "epoch": 4952} {"train_loss": -26.341238021850586, "global_step": 411019, "epoch": 4952} {"train_loss": -26.26386070251465, "global_step": 411020, "epoch": 4952} {"train_loss": -26.695892333984375, "global_step": 411021, "epoch": 4952} {"train_loss": -26.193716049194336, "global_step": 411022, "epoch": 4952} {"train_loss": -26.502695083618164, "global_step": 411023, "epoch": 4952} {"train_loss": -26.525150299072266, "global_step": 411024, "epoch": 4952} {"train_loss": -26.628931045532227, "global_step": 411025, "epoch": 4952} {"train_loss": -26.55531120300293, "global_step": 411026, "epoch": 4952} {"train_loss": -26.26698112487793, "global_step": 411027, "epoch": 4952} {"train_loss": -26.047269821166992, "global_step": 411028, "epoch": 4952} {"train_loss": -26.045581817626953, "global_step": 411029, "epoch": 4952} {"train_loss": -26.139240264892578, "global_step": 411030, "epoch": 4952} {"train_loss": -26.542905807495117, "global_step": 411031, "epoch": 4952} {"train_loss": -26.677398681640625, "global_step": 411032, "epoch": 4952} {"train_loss": -26.251163482666016, "global_step": 411033, "epoch": 4952} {"train_loss": -26.462430953979492, "global_step": 411034, "epoch": 4952} {"train_loss": -26.834228515625, "global_step": 411035, "epoch": 4952} {"train_loss": -25.99021339416504, "global_step": 411036, "epoch": 4952} {"train_loss": -26.450042724609375, "global_step": 411037, "epoch": 4952} {"train_loss": -26.321252822875977, "global_step": 411038, "epoch": 4952} {"train_loss": -26.44705581665039, "global_step": 411039, "epoch": 4952} {"train_loss": -26.351343154907227, "global_step": 411040, "epoch": 4952} {"train_loss": -26.316884994506836, "global_step": 411041, "epoch": 4952} {"train_loss": -26.6946964263916, "global_step": 411042, "epoch": 4952} {"train_loss": -26.08621597290039, "global_step": 411043, "epoch": 4952} {"train_loss": -26.408130645751953, "global_step": 411044, "epoch": 4952} {"train_loss": -26.23749351501465, "global_step": 411045, "epoch": 4952} {"train_loss": -26.550580978393555, "global_step": 411046, "epoch": 4952} {"train_loss": -26.8149471282959, "global_step": 411047, "epoch": 4952} {"train_loss": -26.698888778686523, "global_step": 411048, "epoch": 4952} {"train_loss": -26.412500381469727, "global_step": 411049, "epoch": 4952} {"train_loss": -27.086767196655273, "global_step": 411050, "epoch": 4952} {"train_loss": -26.901586532592773, "global_step": 411051, "epoch": 4952} {"train_loss": -26.545007705688477, "global_step": 411052, "epoch": 4952} {"train_loss": -26.671106338500977, "global_step": 411053, "epoch": 4952} {"train_loss": -26.541213989257812, "global_step": 411054, "epoch": 4952} {"train_loss": -26.7741641998291, "global_step": 411055, "epoch": 4952} {"train_loss": -27.018692016601562, "global_step": 411056, "epoch": 4952} {"train_loss": -26.854604721069336, "global_step": 411057, "epoch": 4952} {"train_loss": -26.823291778564453, "global_step": 411058, "epoch": 4952} {"train_loss": -26.95850944519043, "global_step": 411059, "epoch": 4952} {"train_loss": -26.681421279907227, "global_step": 411060, "epoch": 4952} {"train_loss": -26.892902374267578, "global_step": 411061, "epoch": 4952} {"train_loss": -26.78339958190918, "global_step": 411062, "epoch": 4952} {"train_loss": -26.844654083251953, "global_step": 411063, "epoch": 4952} {"train_loss": -26.87074089050293, "global_step": 411064, "epoch": 4952} {"train_loss": -26.80661392211914, "global_step": 411065, "epoch": 4952} {"train_loss": -26.544498443603516, "global_step": 411066, "epoch": 4952} {"train_loss": -26.9539737701416, "global_step": 411067, "epoch": 4952} {"train_loss": -26.5832462310791, "global_step": 411068, "epoch": 4952} {"train_loss": -26.436996459960938, "global_step": 411069, "epoch": 4952} {"train_loss": -26.570484161376953, "global_step": 411070, "epoch": 4952} {"train_loss": -26.4633731842041, "global_step": 411071, "epoch": 4952} {"train_loss": -26.680017471313477, "global_step": 411072, "epoch": 4952} {"train_loss": -26.268163681030273, "global_step": 411073, "epoch": 4952} {"train_loss": -26.595991134643555, "global_step": 411074, "epoch": 4952} {"train_loss": -26.79254150390625, "global_step": 411075, "epoch": 4952} {"train_loss": -27.199954986572266, "global_step": 411076, "epoch": 4952} {"train_loss": -26.590375900268555, "global_step": 411077, "epoch": 4952} {"train_loss": -26.752546310424805, "global_step": 411078, "epoch": 4952} {"train_loss": -26.599872589111328, "global_step": 411079, "epoch": 4952} {"train_loss": -26.703495025634766, "global_step": 411080, "epoch": 4952} {"train_loss": -26.682586669921875, "global_step": 411081, "epoch": 4952} {"train_loss": -26.794605255126953, "global_step": 411082, "epoch": 4952} {"train_loss": -26.67451286315918, "global_step": 411083, "epoch": 4952} {"train_loss": -26.446487426757812, "global_step": 411084, "epoch": 4952} {"train_loss": -26.648136138916016, "global_step": 411085, "epoch": 4952} {"train_loss": -26.473407745361328, "global_step": 411086, "epoch": 4952} {"train_loss": -26.9688663482666, "global_step": 411087, "epoch": 4952} {"train_loss": -26.860864639282227, "global_step": 411088, "epoch": 4952} {"train_loss": -26.774860382080078, "global_step": 411089, "epoch": 4952} {"train_loss": -26.826093673706055, "global_step": 411090, "epoch": 4952} {"train_loss": -26.766326904296875, "global_step": 411091, "epoch": 4952} {"train_loss": -26.57972526550293, "global_step": 411092, "epoch": 4952} {"train_loss": -27.0760555267334, "global_step": 411093, "epoch": 4952} {"train_loss": -27.045103073120117, "global_step": 411094, "epoch": 4952} {"train_loss": -26.817718505859375, "global_step": 411095, "epoch": 4952} {"train_loss": -26.29546546936035, "global_step": 411096, "epoch": 4952} {"train_loss": -27.187414169311523, "global_step": 411097, "epoch": 4952} {"train_loss": -26.585599462670015, "global_step": 411098, "epoch": 4952, "val_loss": 6515695.0} {"train_loss": -25.40932846069336, "global_step": 411099, "epoch": 4953} {"train_loss": -24.405521392822266, "global_step": 411100, "epoch": 4953} {"train_loss": -25.055570602416992, "global_step": 411101, "epoch": 4953} {"train_loss": -25.91684913635254, "global_step": 411102, "epoch": 4953} {"train_loss": -25.83928871154785, "global_step": 411103, "epoch": 4953} {"train_loss": -25.984272003173828, "global_step": 411104, "epoch": 4953} {"train_loss": -25.58245277404785, "global_step": 411105, "epoch": 4953} {"train_loss": -25.96832275390625, "global_step": 411106, "epoch": 4953} {"train_loss": -25.32907485961914, "global_step": 411107, "epoch": 4953} {"train_loss": -26.001224517822266, "global_step": 411108, "epoch": 4953} {"train_loss": -25.748071670532227, "global_step": 411109, "epoch": 4953} {"train_loss": -26.04255485534668, "global_step": 411110, "epoch": 4953} {"train_loss": -25.689559936523438, "global_step": 411111, "epoch": 4953} {"train_loss": -26.102262496948242, "global_step": 411112, "epoch": 4953} {"train_loss": -26.29939079284668, "global_step": 411113, "epoch": 4953} {"train_loss": -26.218128204345703, "global_step": 411114, "epoch": 4953} {"train_loss": -26.101886749267578, "global_step": 411115, "epoch": 4953} {"train_loss": -26.07343864440918, "global_step": 411116, "epoch": 4953} {"train_loss": -26.338159561157227, "global_step": 411117, "epoch": 4953} {"train_loss": -26.161849975585938, "global_step": 411118, "epoch": 4953} {"train_loss": -26.34954261779785, "global_step": 411119, "epoch": 4953} {"train_loss": -26.318716049194336, "global_step": 411120, "epoch": 4953} {"train_loss": -26.300918579101562, "global_step": 411121, "epoch": 4953} {"train_loss": -26.25409507751465, "global_step": 411122, "epoch": 4953} {"train_loss": -26.264978408813477, "global_step": 411123, "epoch": 4953} {"train_loss": -26.3947696685791, "global_step": 411124, "epoch": 4953} {"train_loss": -26.36380958557129, "global_step": 411125, "epoch": 4953} {"train_loss": -26.264978408813477, "global_step": 411126, "epoch": 4953} {"train_loss": -26.159515380859375, "global_step": 411127, "epoch": 4953} {"train_loss": -26.313512802124023, "global_step": 411128, "epoch": 4953} {"train_loss": -26.477008819580078, "global_step": 411129, "epoch": 4953} {"train_loss": -26.497516632080078, "global_step": 411130, "epoch": 4953} {"train_loss": -26.443084716796875, "global_step": 411131, "epoch": 4953} {"train_loss": -26.452560424804688, "global_step": 411132, "epoch": 4953} {"train_loss": -26.480548858642578, "global_step": 411133, "epoch": 4953} {"train_loss": -26.760847091674805, "global_step": 411134, "epoch": 4953} {"train_loss": -26.50238037109375, "global_step": 411135, "epoch": 4953} {"train_loss": -26.462549209594727, "global_step": 411136, "epoch": 4953} {"train_loss": -26.59144401550293, "global_step": 411137, "epoch": 4953} {"train_loss": -26.43800163269043, "global_step": 411138, "epoch": 4953} {"train_loss": -26.616361618041992, "global_step": 411139, "epoch": 4953} {"train_loss": -26.774372100830078, "global_step": 411140, "epoch": 4953} {"train_loss": -26.706256866455078, "global_step": 411141, "epoch": 4953} {"train_loss": -26.65421485900879, "global_step": 411142, "epoch": 4953} {"train_loss": -26.818700790405273, "global_step": 411143, "epoch": 4953} {"train_loss": -26.898529052734375, "global_step": 411144, "epoch": 4953} {"train_loss": -26.620649337768555, "global_step": 411145, "epoch": 4953} {"train_loss": -26.944488525390625, "global_step": 411146, "epoch": 4953} {"train_loss": -27.003000259399414, "global_step": 411147, "epoch": 4953} {"train_loss": -27.183155059814453, "global_step": 411148, "epoch": 4953} {"train_loss": -26.9736328125, "global_step": 411149, "epoch": 4953} {"train_loss": -27.113134384155273, "global_step": 411150, "epoch": 4953} {"train_loss": -26.937604904174805, "global_step": 411151, "epoch": 4953} {"train_loss": -27.02471351623535, "global_step": 411152, "epoch": 4953} {"train_loss": -27.0692081451416, "global_step": 411153, "epoch": 4953} {"train_loss": -26.995054244995117, "global_step": 411154, "epoch": 4953} {"train_loss": -26.976465225219727, "global_step": 411155, "epoch": 4953} {"train_loss": -26.770767211914062, "global_step": 411156, "epoch": 4953} {"train_loss": -26.73764419555664, "global_step": 411157, "epoch": 4953} {"train_loss": -27.05681800842285, "global_step": 411158, "epoch": 4953} {"train_loss": -26.71976661682129, "global_step": 411159, "epoch": 4953} {"train_loss": -26.54496192932129, "global_step": 411160, "epoch": 4953} {"train_loss": -27.06357765197754, "global_step": 411161, "epoch": 4953} {"train_loss": -27.035388946533203, "global_step": 411162, "epoch": 4953} {"train_loss": -26.607440948486328, "global_step": 411163, "epoch": 4953} {"train_loss": -26.831317901611328, "global_step": 411164, "epoch": 4953} {"train_loss": -26.86353874206543, "global_step": 411165, "epoch": 4953} {"train_loss": -27.069616317749023, "global_step": 411166, "epoch": 4953} {"train_loss": -26.49970054626465, "global_step": 411167, "epoch": 4953} {"train_loss": -26.365060806274414, "global_step": 411168, "epoch": 4953} {"train_loss": -26.697744369506836, "global_step": 411169, "epoch": 4953} {"train_loss": -26.9431095123291, "global_step": 411170, "epoch": 4953} {"train_loss": -26.777265548706055, "global_step": 411171, "epoch": 4953} {"train_loss": -26.850021362304688, "global_step": 411172, "epoch": 4953} {"train_loss": -26.932363510131836, "global_step": 411173, "epoch": 4953} {"train_loss": -26.86663246154785, "global_step": 411174, "epoch": 4953} {"train_loss": -26.79231071472168, "global_step": 411175, "epoch": 4953} {"train_loss": -26.541791915893555, "global_step": 411176, "epoch": 4953} {"train_loss": -26.80719566345215, "global_step": 411177, "epoch": 4953} {"train_loss": -26.679187774658203, "global_step": 411178, "epoch": 4953} {"train_loss": -26.96724510192871, "global_step": 411179, "epoch": 4953} {"train_loss": -26.47220230102539, "global_step": 411180, "epoch": 4953} {"train_loss": -26.47927647326366, "global_step": 411181, "epoch": 4953, "val_loss": 6605210.0} {"train_loss": -24.245574951171875, "global_step": 411182, "epoch": 4954} {"train_loss": -25.061614990234375, "global_step": 411183, "epoch": 4954} {"train_loss": -25.178258895874023, "global_step": 411184, "epoch": 4954} {"train_loss": -24.05152702331543, "global_step": 411185, "epoch": 4954} {"train_loss": -24.731658935546875, "global_step": 411186, "epoch": 4954} {"train_loss": -25.57356071472168, "global_step": 411187, "epoch": 4954} {"train_loss": -25.062490463256836, "global_step": 411188, "epoch": 4954} {"train_loss": -25.28120994567871, "global_step": 411189, "epoch": 4954} {"train_loss": -26.076086044311523, "global_step": 411190, "epoch": 4954} {"train_loss": -25.350902557373047, "global_step": 411191, "epoch": 4954} {"train_loss": -25.459409713745117, "global_step": 411192, "epoch": 4954} {"train_loss": -26.141530990600586, "global_step": 411193, "epoch": 4954} {"train_loss": -25.57618522644043, "global_step": 411194, "epoch": 4954} {"train_loss": -25.600610733032227, "global_step": 411195, "epoch": 4954} {"train_loss": -25.973987579345703, "global_step": 411196, "epoch": 4954} {"train_loss": -25.883703231811523, "global_step": 411197, "epoch": 4954} {"train_loss": -25.948591232299805, "global_step": 411198, "epoch": 4954} {"train_loss": -26.1229190826416, "global_step": 411199, "epoch": 4954} {"train_loss": -26.160367965698242, "global_step": 411200, "epoch": 4954} {"train_loss": -26.00886344909668, "global_step": 411201, "epoch": 4954} {"train_loss": -25.95938491821289, "global_step": 411202, "epoch": 4954} {"train_loss": -26.14832878112793, "global_step": 411203, "epoch": 4954} {"train_loss": -25.954273223876953, "global_step": 411204, "epoch": 4954} {"train_loss": -26.336963653564453, "global_step": 411205, "epoch": 4954} {"train_loss": -26.388547897338867, "global_step": 411206, "epoch": 4954} {"train_loss": -26.27670669555664, "global_step": 411207, "epoch": 4954} {"train_loss": -26.419652938842773, "global_step": 411208, "epoch": 4954} {"train_loss": -26.615890502929688, "global_step": 411209, "epoch": 4954} {"train_loss": -26.418304443359375, "global_step": 411210, "epoch": 4954} {"train_loss": -26.390228271484375, "global_step": 411211, "epoch": 4954} {"train_loss": -26.485258102416992, "global_step": 411212, "epoch": 4954} {"train_loss": -26.375211715698242, "global_step": 411213, "epoch": 4954} {"train_loss": -26.663284301757812, "global_step": 411214, "epoch": 4954} {"train_loss": -26.727527618408203, "global_step": 411215, "epoch": 4954} {"train_loss": -26.511402130126953, "global_step": 411216, "epoch": 4954} {"train_loss": -26.692472457885742, "global_step": 411217, "epoch": 4954} {"train_loss": -26.317163467407227, "global_step": 411218, "epoch": 4954} {"train_loss": -26.851186752319336, "global_step": 411219, "epoch": 4954} {"train_loss": -26.6997127532959, "global_step": 411220, "epoch": 4954} {"train_loss": -26.289487838745117, "global_step": 411221, "epoch": 4954} {"train_loss": -26.681116104125977, "global_step": 411222, "epoch": 4954} {"train_loss": -26.735809326171875, "global_step": 411223, "epoch": 4954} {"train_loss": -26.413175582885742, "global_step": 411224, "epoch": 4954} {"train_loss": -26.568891525268555, "global_step": 411225, "epoch": 4954} {"train_loss": -26.748220443725586, "global_step": 411226, "epoch": 4954} {"train_loss": -26.399616241455078, "global_step": 411227, "epoch": 4954} {"train_loss": -26.618738174438477, "global_step": 411228, "epoch": 4954} {"train_loss": -27.180408477783203, "global_step": 411229, "epoch": 4954} {"train_loss": -26.607959747314453, "global_step": 411230, "epoch": 4954} {"train_loss": -26.728933334350586, "global_step": 411231, "epoch": 4954} {"train_loss": -26.656696319580078, "global_step": 411232, "epoch": 4954} {"train_loss": -26.45849609375, "global_step": 411233, "epoch": 4954} {"train_loss": -26.827880859375, "global_step": 411234, "epoch": 4954} {"train_loss": -26.531675338745117, "global_step": 411235, "epoch": 4954} {"train_loss": -26.790119171142578, "global_step": 411236, "epoch": 4954} {"train_loss": -27.05547523498535, "global_step": 411237, "epoch": 4954} {"train_loss": -26.7966365814209, "global_step": 411238, "epoch": 4954} {"train_loss": -26.827356338500977, "global_step": 411239, "epoch": 4954} {"train_loss": -26.658849716186523, "global_step": 411240, "epoch": 4954} {"train_loss": -26.737415313720703, "global_step": 411241, "epoch": 4954} {"train_loss": -26.350088119506836, "global_step": 411242, "epoch": 4954} {"train_loss": -26.742481231689453, "global_step": 411243, "epoch": 4954} {"train_loss": -26.757246017456055, "global_step": 411244, "epoch": 4954} {"train_loss": -26.784910202026367, "global_step": 411245, "epoch": 4954} {"train_loss": -26.749902725219727, "global_step": 411246, "epoch": 4954} {"train_loss": -26.967554092407227, "global_step": 411247, "epoch": 4954} {"train_loss": -26.782445907592773, "global_step": 411248, "epoch": 4954} {"train_loss": -26.93378257751465, "global_step": 411249, "epoch": 4954} {"train_loss": -26.662891387939453, "global_step": 411250, "epoch": 4954} {"train_loss": -26.95199966430664, "global_step": 411251, "epoch": 4954} {"train_loss": -26.838720321655273, "global_step": 411252, "epoch": 4954} {"train_loss": -27.06418800354004, "global_step": 411253, "epoch": 4954} {"train_loss": -26.984363555908203, "global_step": 411254, "epoch": 4954} {"train_loss": -26.9290771484375, "global_step": 411255, "epoch": 4954} {"train_loss": -26.941503524780273, "global_step": 411256, "epoch": 4954} {"train_loss": -26.731962203979492, "global_step": 411257, "epoch": 4954} {"train_loss": -27.089330673217773, "global_step": 411258, "epoch": 4954} {"train_loss": -26.930627822875977, "global_step": 411259, "epoch": 4954} {"train_loss": -27.04631996154785, "global_step": 411260, "epoch": 4954} {"train_loss": -26.69988441467285, "global_step": 411261, "epoch": 4954} {"train_loss": -26.628799438476562, "global_step": 411262, "epoch": 4954} {"train_loss": -27.15388298034668, "global_step": 411263, "epoch": 4954} {"train_loss": -26.38678380667445, "global_step": 411264, "epoch": 4954, "val_loss": 6551564.0} {"train_loss": -24.89607048034668, "global_step": 411265, "epoch": 4955} {"train_loss": -25.07045555114746, "global_step": 411266, "epoch": 4955} {"train_loss": -24.868534088134766, "global_step": 411267, "epoch": 4955} {"train_loss": -25.362533569335938, "global_step": 411268, "epoch": 4955} {"train_loss": -25.69637107849121, "global_step": 411269, "epoch": 4955} {"train_loss": -25.715612411499023, "global_step": 411270, "epoch": 4955} {"train_loss": -26.140302658081055, "global_step": 411271, "epoch": 4955} {"train_loss": -25.610837936401367, "global_step": 411272, "epoch": 4955} {"train_loss": -25.833515167236328, "global_step": 411273, "epoch": 4955} {"train_loss": -25.8642520904541, "global_step": 411274, "epoch": 4955} {"train_loss": -26.09600257873535, "global_step": 411275, "epoch": 4955} {"train_loss": -25.55940818786621, "global_step": 411276, "epoch": 4955} {"train_loss": -26.492034912109375, "global_step": 411277, "epoch": 4955} {"train_loss": -25.849872589111328, "global_step": 411278, "epoch": 4955} {"train_loss": -25.900894165039062, "global_step": 411279, "epoch": 4955} {"train_loss": -26.016626358032227, "global_step": 411280, "epoch": 4955} {"train_loss": -25.984546661376953, "global_step": 411281, "epoch": 4955} {"train_loss": -26.297046661376953, "global_step": 411282, "epoch": 4955} {"train_loss": -25.96817970275879, "global_step": 411283, "epoch": 4955} {"train_loss": -26.1801815032959, "global_step": 411284, "epoch": 4955} {"train_loss": -26.175687789916992, "global_step": 411285, "epoch": 4955} {"train_loss": -26.30224609375, "global_step": 411286, "epoch": 4955} {"train_loss": -25.9621639251709, "global_step": 411287, "epoch": 4955} {"train_loss": -26.25798988342285, "global_step": 411288, "epoch": 4955} {"train_loss": -26.50115966796875, "global_step": 411289, "epoch": 4955} {"train_loss": -26.2460994720459, "global_step": 411290, "epoch": 4955} {"train_loss": -26.181249618530273, "global_step": 411291, "epoch": 4955} {"train_loss": -26.46903419494629, "global_step": 411292, "epoch": 4955} {"train_loss": -26.737634658813477, "global_step": 411293, "epoch": 4955} {"train_loss": -26.579792022705078, "global_step": 411294, "epoch": 4955} {"train_loss": -26.560728073120117, "global_step": 411295, "epoch": 4955} {"train_loss": -26.25152587890625, "global_step": 411296, "epoch": 4955} {"train_loss": -26.552534103393555, "global_step": 411297, "epoch": 4955} {"train_loss": -26.74976921081543, "global_step": 411298, "epoch": 4955} {"train_loss": -26.736852645874023, "global_step": 411299, "epoch": 4955} {"train_loss": -26.47308349609375, "global_step": 411300, "epoch": 4955} {"train_loss": -26.690753936767578, "global_step": 411301, "epoch": 4955} {"train_loss": -26.57618522644043, "global_step": 411302, "epoch": 4955} {"train_loss": -26.815168380737305, "global_step": 411303, "epoch": 4955} {"train_loss": -26.605451583862305, "global_step": 411304, "epoch": 4955} {"train_loss": -26.53668785095215, "global_step": 411305, "epoch": 4955} {"train_loss": -26.825971603393555, "global_step": 411306, "epoch": 4955} {"train_loss": -26.99118423461914, "global_step": 411307, "epoch": 4955} {"train_loss": -26.60599708557129, "global_step": 411308, "epoch": 4955} {"train_loss": -26.3843994140625, "global_step": 411309, "epoch": 4955} {"train_loss": -26.741540908813477, "global_step": 411310, "epoch": 4955} {"train_loss": -26.937286376953125, "global_step": 411311, "epoch": 4955} {"train_loss": -26.953571319580078, "global_step": 411312, "epoch": 4955} {"train_loss": -26.545461654663086, "global_step": 411313, "epoch": 4955} {"train_loss": -26.404743194580078, "global_step": 411314, "epoch": 4955} {"train_loss": -26.574115753173828, "global_step": 411315, "epoch": 4955} {"train_loss": -26.886350631713867, "global_step": 411316, "epoch": 4955} {"train_loss": -26.730798721313477, "global_step": 411317, "epoch": 4955} {"train_loss": -26.768842697143555, "global_step": 411318, "epoch": 4955} {"train_loss": -26.914350509643555, "global_step": 411319, "epoch": 4955} {"train_loss": -26.907209396362305, "global_step": 411320, "epoch": 4955} {"train_loss": -27.0572452545166, "global_step": 411321, "epoch": 4955} {"train_loss": -26.82999610900879, "global_step": 411322, "epoch": 4955} {"train_loss": -26.994497299194336, "global_step": 411323, "epoch": 4955} {"train_loss": -27.10516929626465, "global_step": 411324, "epoch": 4955} {"train_loss": -26.84980583190918, "global_step": 411325, "epoch": 4955} {"train_loss": -27.0545654296875, "global_step": 411326, "epoch": 4955} {"train_loss": -26.704938888549805, "global_step": 411327, "epoch": 4955} {"train_loss": -27.154956817626953, "global_step": 411328, "epoch": 4955} {"train_loss": -26.778533935546875, "global_step": 411329, "epoch": 4955} {"train_loss": -27.01069450378418, "global_step": 411330, "epoch": 4955} {"train_loss": -26.83509635925293, "global_step": 411331, "epoch": 4955} {"train_loss": -27.204513549804688, "global_step": 411332, "epoch": 4955} {"train_loss": -27.084003448486328, "global_step": 411333, "epoch": 4955} {"train_loss": -26.997629165649414, "global_step": 411334, "epoch": 4955} {"train_loss": -26.54816246032715, "global_step": 411335, "epoch": 4955} {"train_loss": -26.751972198486328, "global_step": 411336, "epoch": 4955} {"train_loss": -26.4796199798584, "global_step": 411337, "epoch": 4955} {"train_loss": -26.91090202331543, "global_step": 411338, "epoch": 4955} {"train_loss": -26.783716201782227, "global_step": 411339, "epoch": 4955} {"train_loss": -26.0015811920166, "global_step": 411340, "epoch": 4955} {"train_loss": -26.448516845703125, "global_step": 411341, "epoch": 4955} {"train_loss": -26.336776733398438, "global_step": 411342, "epoch": 4955} {"train_loss": -27.237512588500977, "global_step": 411343, "epoch": 4955} {"train_loss": -26.45281982421875, "global_step": 411344, "epoch": 4955} {"train_loss": -26.396209716796875, "global_step": 411345, "epoch": 4955} {"train_loss": -26.81910514831543, "global_step": 411346, "epoch": 4955} {"train_loss": -26.459888619112682, "global_step": 411347, "epoch": 4955, "val_loss": 6586724.0} {"train_loss": -22.86539649963379, "global_step": 411348, "epoch": 4956} {"train_loss": -24.634105682373047, "global_step": 411349, "epoch": 4956} {"train_loss": -24.18904685974121, "global_step": 411350, "epoch": 4956} {"train_loss": -24.784387588500977, "global_step": 411351, "epoch": 4956} {"train_loss": -24.629398345947266, "global_step": 411352, "epoch": 4956} {"train_loss": -25.150592803955078, "global_step": 411353, "epoch": 4956} {"train_loss": -24.518369674682617, "global_step": 411354, "epoch": 4956} {"train_loss": -24.63703727722168, "global_step": 411355, "epoch": 4956} {"train_loss": -25.976194381713867, "global_step": 411356, "epoch": 4956} {"train_loss": -24.802490234375, "global_step": 411357, "epoch": 4956} {"train_loss": -25.024150848388672, "global_step": 411358, "epoch": 4956} {"train_loss": -25.37030029296875, "global_step": 411359, "epoch": 4956} {"train_loss": -25.206159591674805, "global_step": 411360, "epoch": 4956} {"train_loss": -25.529991149902344, "global_step": 411361, "epoch": 4956} {"train_loss": -25.535383224487305, "global_step": 411362, "epoch": 4956} {"train_loss": -25.78472900390625, "global_step": 411363, "epoch": 4956} {"train_loss": -25.778797149658203, "global_step": 411364, "epoch": 4956} {"train_loss": -25.696447372436523, "global_step": 411365, "epoch": 4956} {"train_loss": -25.41411781311035, "global_step": 411366, "epoch": 4956} {"train_loss": -25.808746337890625, "global_step": 411367, "epoch": 4956} {"train_loss": -25.528945922851562, "global_step": 411368, "epoch": 4956} {"train_loss": -26.22602653503418, "global_step": 411369, "epoch": 4956} {"train_loss": -25.4766788482666, "global_step": 411370, "epoch": 4956} {"train_loss": -26.03303337097168, "global_step": 411371, "epoch": 4956} {"train_loss": -25.94532585144043, "global_step": 411372, "epoch": 4956} {"train_loss": -25.913818359375, "global_step": 411373, "epoch": 4956} {"train_loss": -26.11962890625, "global_step": 411374, "epoch": 4956} {"train_loss": -26.153522491455078, "global_step": 411375, "epoch": 4956} {"train_loss": -25.990188598632812, "global_step": 411376, "epoch": 4956} {"train_loss": -26.582412719726562, "global_step": 411377, "epoch": 4956} {"train_loss": -26.4659481048584, "global_step": 411378, "epoch": 4956} {"train_loss": -26.24515151977539, "global_step": 411379, "epoch": 4956} {"train_loss": -26.450719833374023, "global_step": 411380, "epoch": 4956} {"train_loss": -26.319746017456055, "global_step": 411381, "epoch": 4956} {"train_loss": -26.198486328125, "global_step": 411382, "epoch": 4956} {"train_loss": -26.329437255859375, "global_step": 411383, "epoch": 4956} {"train_loss": -26.407133102416992, "global_step": 411384, "epoch": 4956} {"train_loss": -26.246631622314453, "global_step": 411385, "epoch": 4956} {"train_loss": -26.237272262573242, "global_step": 411386, "epoch": 4956} {"train_loss": -26.835906982421875, "global_step": 411387, "epoch": 4956} {"train_loss": -26.761615753173828, "global_step": 411388, "epoch": 4956} {"train_loss": -26.68752098083496, "global_step": 411389, "epoch": 4956} {"train_loss": -26.639434814453125, "global_step": 411390, "epoch": 4956} {"train_loss": -26.75446128845215, "global_step": 411391, "epoch": 4956} {"train_loss": -26.78257179260254, "global_step": 411392, "epoch": 4956} {"train_loss": -26.550159454345703, "global_step": 411393, "epoch": 4956} {"train_loss": -26.68592643737793, "global_step": 411394, "epoch": 4956} {"train_loss": -26.33341407775879, "global_step": 411395, "epoch": 4956} {"train_loss": -26.50904655456543, "global_step": 411396, "epoch": 4956} {"train_loss": -26.969043731689453, "global_step": 411397, "epoch": 4956} {"train_loss": -26.7011775970459, "global_step": 411398, "epoch": 4956} {"train_loss": -26.98972511291504, "global_step": 411399, "epoch": 4956} {"train_loss": -26.71793556213379, "global_step": 411400, "epoch": 4956} {"train_loss": -26.436864852905273, "global_step": 411401, "epoch": 4956} {"train_loss": -26.421863555908203, "global_step": 411402, "epoch": 4956} {"train_loss": -26.86572265625, "global_step": 411403, "epoch": 4956} {"train_loss": -26.68098258972168, "global_step": 411404, "epoch": 4956} {"train_loss": -26.783050537109375, "global_step": 411405, "epoch": 4956} {"train_loss": -26.745513916015625, "global_step": 411406, "epoch": 4956} {"train_loss": -26.64493179321289, "global_step": 411407, "epoch": 4956} {"train_loss": -27.0226993560791, "global_step": 411408, "epoch": 4956} {"train_loss": -27.12711524963379, "global_step": 411409, "epoch": 4956} {"train_loss": -26.604894638061523, "global_step": 411410, "epoch": 4956} {"train_loss": -26.65606689453125, "global_step": 411411, "epoch": 4956} {"train_loss": -26.832473754882812, "global_step": 411412, "epoch": 4956} {"train_loss": -26.88483238220215, "global_step": 411413, "epoch": 4956} {"train_loss": -26.9150333404541, "global_step": 411414, "epoch": 4956} {"train_loss": -26.591663360595703, "global_step": 411415, "epoch": 4956} {"train_loss": -27.010915756225586, "global_step": 411416, "epoch": 4956} {"train_loss": -26.667652130126953, "global_step": 411417, "epoch": 4956} {"train_loss": -27.029600143432617, "global_step": 411418, "epoch": 4956} {"train_loss": -26.805273056030273, "global_step": 411419, "epoch": 4956} {"train_loss": -26.763031005859375, "global_step": 411420, "epoch": 4956} {"train_loss": -26.840213775634766, "global_step": 411421, "epoch": 4956} {"train_loss": -26.820947647094727, "global_step": 411422, "epoch": 4956} {"train_loss": -26.926685333251953, "global_step": 411423, "epoch": 4956} {"train_loss": -26.743789672851562, "global_step": 411424, "epoch": 4956} {"train_loss": -26.685400009155273, "global_step": 411425, "epoch": 4956} {"train_loss": -27.04254150390625, "global_step": 411426, "epoch": 4956} {"train_loss": -27.0645809173584, "global_step": 411427, "epoch": 4956} {"train_loss": -26.622480392456055, "global_step": 411428, "epoch": 4956} {"train_loss": -26.6943416595459, "global_step": 411429, "epoch": 4956} {"train_loss": -26.212300587849445, "global_step": 411430, "epoch": 4956, "val_loss": 6492739.0} {"train_loss": -25.3125057220459, "global_step": 411431, "epoch": 4957} {"train_loss": -24.657573699951172, "global_step": 411432, "epoch": 4957} {"train_loss": -24.915578842163086, "global_step": 411433, "epoch": 4957} {"train_loss": -26.08601188659668, "global_step": 411434, "epoch": 4957} {"train_loss": -26.127912521362305, "global_step": 411435, "epoch": 4957} {"train_loss": -25.050251007080078, "global_step": 411436, "epoch": 4957} {"train_loss": -25.552230834960938, "global_step": 411437, "epoch": 4957} {"train_loss": -25.6286563873291, "global_step": 411438, "epoch": 4957} {"train_loss": -25.40994644165039, "global_step": 411439, "epoch": 4957} {"train_loss": -26.25555419921875, "global_step": 411440, "epoch": 4957} {"train_loss": -25.356674194335938, "global_step": 411441, "epoch": 4957} {"train_loss": -26.22403335571289, "global_step": 411442, "epoch": 4957} {"train_loss": -25.444272994995117, "global_step": 411443, "epoch": 4957} {"train_loss": -25.84803581237793, "global_step": 411444, "epoch": 4957} {"train_loss": -25.898212432861328, "global_step": 411445, "epoch": 4957} {"train_loss": -25.971176147460938, "global_step": 411446, "epoch": 4957} {"train_loss": -26.02931022644043, "global_step": 411447, "epoch": 4957} {"train_loss": -25.752695083618164, "global_step": 411448, "epoch": 4957} {"train_loss": -26.003477096557617, "global_step": 411449, "epoch": 4957} {"train_loss": -26.139556884765625, "global_step": 411450, "epoch": 4957} {"train_loss": -26.2043399810791, "global_step": 411451, "epoch": 4957} {"train_loss": -26.317474365234375, "global_step": 411452, "epoch": 4957} {"train_loss": -25.89606285095215, "global_step": 411453, "epoch": 4957} {"train_loss": -26.439741134643555, "global_step": 411454, "epoch": 4957} {"train_loss": -26.506683349609375, "global_step": 411455, "epoch": 4957} {"train_loss": -26.313232421875, "global_step": 411456, "epoch": 4957} {"train_loss": -26.635772705078125, "global_step": 411457, "epoch": 4957} {"train_loss": -26.4085636138916, "global_step": 411458, "epoch": 4957} {"train_loss": -26.11420249938965, "global_step": 411459, "epoch": 4957} {"train_loss": -26.395849227905273, "global_step": 411460, "epoch": 4957} {"train_loss": -26.15032958984375, "global_step": 411461, "epoch": 4957} {"train_loss": -26.724201202392578, "global_step": 411462, "epoch": 4957} {"train_loss": -26.506128311157227, "global_step": 411463, "epoch": 4957} {"train_loss": -26.280380249023438, "global_step": 411464, "epoch": 4957} {"train_loss": -26.69341468811035, "global_step": 411465, "epoch": 4957} {"train_loss": -26.299707412719727, "global_step": 411466, "epoch": 4957} {"train_loss": -26.639692306518555, "global_step": 411467, "epoch": 4957} {"train_loss": -26.8999080657959, "global_step": 411468, "epoch": 4957} {"train_loss": -26.81563377380371, "global_step": 411469, "epoch": 4957} {"train_loss": -26.8587589263916, "global_step": 411470, "epoch": 4957} {"train_loss": -26.645389556884766, "global_step": 411471, "epoch": 4957} {"train_loss": -26.81608009338379, "global_step": 411472, "epoch": 4957} {"train_loss": -27.0521240234375, "global_step": 411473, "epoch": 4957} {"train_loss": -26.884387969970703, "global_step": 411474, "epoch": 4957} {"train_loss": -26.782934188842773, "global_step": 411475, "epoch": 4957} {"train_loss": -26.48992347717285, "global_step": 411476, "epoch": 4957} {"train_loss": -26.835678100585938, "global_step": 411477, "epoch": 4957} {"train_loss": -26.765460968017578, "global_step": 411478, "epoch": 4957} {"train_loss": -26.832319259643555, "global_step": 411479, "epoch": 4957} {"train_loss": -26.759122848510742, "global_step": 411480, "epoch": 4957} {"train_loss": -26.838764190673828, "global_step": 411481, "epoch": 4957} {"train_loss": -27.042499542236328, "global_step": 411482, "epoch": 4957} {"train_loss": -26.761159896850586, "global_step": 411483, "epoch": 4957} {"train_loss": -27.077259063720703, "global_step": 411484, "epoch": 4957} {"train_loss": -26.8818416595459, "global_step": 411485, "epoch": 4957} {"train_loss": -26.513647079467773, "global_step": 411486, "epoch": 4957} {"train_loss": -26.588972091674805, "global_step": 411487, "epoch": 4957} {"train_loss": -26.563467025756836, "global_step": 411488, "epoch": 4957} {"train_loss": -26.951074600219727, "global_step": 411489, "epoch": 4957} {"train_loss": -26.91169548034668, "global_step": 411490, "epoch": 4957} {"train_loss": -26.866708755493164, "global_step": 411491, "epoch": 4957} {"train_loss": -26.6423282623291, "global_step": 411492, "epoch": 4957} {"train_loss": -26.96036720275879, "global_step": 411493, "epoch": 4957} {"train_loss": -26.530899047851562, "global_step": 411494, "epoch": 4957} {"train_loss": -26.58945083618164, "global_step": 411495, "epoch": 4957} {"train_loss": -26.52454948425293, "global_step": 411496, "epoch": 4957} {"train_loss": -26.697866439819336, "global_step": 411497, "epoch": 4957} {"train_loss": -26.669086456298828, "global_step": 411498, "epoch": 4957} {"train_loss": -26.72235107421875, "global_step": 411499, "epoch": 4957} {"train_loss": -26.373767852783203, "global_step": 411500, "epoch": 4957} {"train_loss": -26.7562198638916, "global_step": 411501, "epoch": 4957} {"train_loss": -26.84869956970215, "global_step": 411502, "epoch": 4957} {"train_loss": -26.93473243713379, "global_step": 411503, "epoch": 4957} {"train_loss": -27.049896240234375, "global_step": 411504, "epoch": 4957} {"train_loss": -26.890289306640625, "global_step": 411505, "epoch": 4957} {"train_loss": -26.6789608001709, "global_step": 411506, "epoch": 4957} {"train_loss": -26.742578506469727, "global_step": 411507, "epoch": 4957} {"train_loss": -26.569433212280273, "global_step": 411508, "epoch": 4957} {"train_loss": -26.351245880126953, "global_step": 411509, "epoch": 4957} {"train_loss": -26.6227970123291, "global_step": 411510, "epoch": 4957} {"train_loss": -26.831388473510742, "global_step": 411511, "epoch": 4957} {"train_loss": -26.46014404296875, "global_step": 411512, "epoch": 4957} {"train_loss": -26.426988693604986, "global_step": 411513, "epoch": 4957, "val_loss": 6531638.0} {"train_loss": -25.823652267456055, "global_step": 411514, "epoch": 4958} {"train_loss": -26.284719467163086, "global_step": 411515, "epoch": 4958} {"train_loss": -25.871566772460938, "global_step": 411516, "epoch": 4958} {"train_loss": -26.193639755249023, "global_step": 411517, "epoch": 4958} {"train_loss": -25.7257137298584, "global_step": 411518, "epoch": 4958} {"train_loss": -26.1870174407959, "global_step": 411519, "epoch": 4958} {"train_loss": -26.174158096313477, "global_step": 411520, "epoch": 4958} {"train_loss": -25.61176109313965, "global_step": 411521, "epoch": 4958} {"train_loss": -26.059621810913086, "global_step": 411522, "epoch": 4958} {"train_loss": -26.296344757080078, "global_step": 411523, "epoch": 4958} {"train_loss": -26.090314865112305, "global_step": 411524, "epoch": 4958} {"train_loss": -26.710193634033203, "global_step": 411525, "epoch": 4958} {"train_loss": -26.3319034576416, "global_step": 411526, "epoch": 4958} {"train_loss": -26.378881454467773, "global_step": 411527, "epoch": 4958} {"train_loss": -26.45243263244629, "global_step": 411528, "epoch": 4958} {"train_loss": -26.526371002197266, "global_step": 411529, "epoch": 4958} {"train_loss": -26.423614501953125, "global_step": 411530, "epoch": 4958} {"train_loss": -26.172088623046875, "global_step": 411531, "epoch": 4958} {"train_loss": -26.55830192565918, "global_step": 411532, "epoch": 4958} {"train_loss": -26.64847755432129, "global_step": 411533, "epoch": 4958} {"train_loss": -26.524616241455078, "global_step": 411534, "epoch": 4958} {"train_loss": -26.975849151611328, "global_step": 411535, "epoch": 4958} {"train_loss": -26.373533248901367, "global_step": 411536, "epoch": 4958} {"train_loss": -26.864450454711914, "global_step": 411537, "epoch": 4958} {"train_loss": -26.70474624633789, "global_step": 411538, "epoch": 4958} {"train_loss": -26.659265518188477, "global_step": 411539, "epoch": 4958} {"train_loss": -26.74129295349121, "global_step": 411540, "epoch": 4958} {"train_loss": -27.060794830322266, "global_step": 411541, "epoch": 4958} {"train_loss": -27.144149780273438, "global_step": 411542, "epoch": 4958} {"train_loss": -26.683441162109375, "global_step": 411543, "epoch": 4958} {"train_loss": -26.482410430908203, "global_step": 411544, "epoch": 4958} {"train_loss": -26.47076416015625, "global_step": 411545, "epoch": 4958} {"train_loss": -26.915430068969727, "global_step": 411546, "epoch": 4958} {"train_loss": -26.724506378173828, "global_step": 411547, "epoch": 4958} {"train_loss": -26.42408561706543, "global_step": 411548, "epoch": 4958} {"train_loss": -26.623992919921875, "global_step": 411549, "epoch": 4958} {"train_loss": -26.922597885131836, "global_step": 411550, "epoch": 4958} {"train_loss": -26.649673461914062, "global_step": 411551, "epoch": 4958} {"train_loss": -26.892148971557617, "global_step": 411552, "epoch": 4958} {"train_loss": -26.8817081451416, "global_step": 411553, "epoch": 4958} {"train_loss": -26.54094886779785, "global_step": 411554, "epoch": 4958} {"train_loss": -26.82388687133789, "global_step": 411555, "epoch": 4958} {"train_loss": -26.886585235595703, "global_step": 411556, "epoch": 4958} {"train_loss": -27.242517471313477, "global_step": 411557, "epoch": 4958} {"train_loss": -26.8709659576416, "global_step": 411558, "epoch": 4958} {"train_loss": -26.95203971862793, "global_step": 411559, "epoch": 4958} {"train_loss": -26.914220809936523, "global_step": 411560, "epoch": 4958} {"train_loss": -26.75861930847168, "global_step": 411561, "epoch": 4958} {"train_loss": -27.083770751953125, "global_step": 411562, "epoch": 4958} {"train_loss": -26.791547775268555, "global_step": 411563, "epoch": 4958} {"train_loss": -27.021743774414062, "global_step": 411564, "epoch": 4958} {"train_loss": -27.07333755493164, "global_step": 411565, "epoch": 4958} {"train_loss": -27.205158233642578, "global_step": 411566, "epoch": 4958} {"train_loss": -26.84889030456543, "global_step": 411567, "epoch": 4958} {"train_loss": -27.148269653320312, "global_step": 411568, "epoch": 4958} {"train_loss": -26.901371002197266, "global_step": 411569, "epoch": 4958} {"train_loss": -26.627065658569336, "global_step": 411570, "epoch": 4958} {"train_loss": -26.508352279663086, "global_step": 411571, "epoch": 4958} {"train_loss": -26.5164852142334, "global_step": 411572, "epoch": 4958} {"train_loss": -26.821165084838867, "global_step": 411573, "epoch": 4958} {"train_loss": -26.673995971679688, "global_step": 411574, "epoch": 4958} {"train_loss": -27.0830135345459, "global_step": 411575, "epoch": 4958} {"train_loss": -26.500518798828125, "global_step": 411576, "epoch": 4958} {"train_loss": -26.768590927124023, "global_step": 411577, "epoch": 4958} {"train_loss": -27.040241241455078, "global_step": 411578, "epoch": 4958} {"train_loss": -26.56736183166504, "global_step": 411579, "epoch": 4958} {"train_loss": -26.624120712280273, "global_step": 411580, "epoch": 4958} {"train_loss": -26.707412719726562, "global_step": 411581, "epoch": 4958} {"train_loss": -26.6323184967041, "global_step": 411582, "epoch": 4958} {"train_loss": -26.61048698425293, "global_step": 411583, "epoch": 4958} {"train_loss": -26.213764190673828, "global_step": 411584, "epoch": 4958} {"train_loss": -26.249536514282227, "global_step": 411585, "epoch": 4958} {"train_loss": -26.353891372680664, "global_step": 411586, "epoch": 4958} {"train_loss": -26.54168701171875, "global_step": 411587, "epoch": 4958} {"train_loss": -26.82508659362793, "global_step": 411588, "epoch": 4958} {"train_loss": -26.586273193359375, "global_step": 411589, "epoch": 4958} {"train_loss": -26.721410751342773, "global_step": 411590, "epoch": 4958} {"train_loss": -26.861352920532227, "global_step": 411591, "epoch": 4958} {"train_loss": -26.763757705688477, "global_step": 411592, "epoch": 4958} {"train_loss": -26.44635581970215, "global_step": 411593, "epoch": 4958} {"train_loss": -26.702728271484375, "global_step": 411594, "epoch": 4958} {"train_loss": -26.725290298461914, "global_step": 411595, "epoch": 4958} {"train_loss": -26.60649053734469, "global_step": 411596, "epoch": 4958, "val_loss": 6537050.0} {"train_loss": -26.439865112304688, "global_step": 411597, "epoch": 4959} {"train_loss": -26.279348373413086, "global_step": 411598, "epoch": 4959} {"train_loss": -26.35074806213379, "global_step": 411599, "epoch": 4959} {"train_loss": -26.56927490234375, "global_step": 411600, "epoch": 4959} {"train_loss": -26.416757583618164, "global_step": 411601, "epoch": 4959} {"train_loss": -26.15741539001465, "global_step": 411602, "epoch": 4959} {"train_loss": -25.880355834960938, "global_step": 411603, "epoch": 4959} {"train_loss": -26.64712905883789, "global_step": 411604, "epoch": 4959} {"train_loss": -26.4166202545166, "global_step": 411605, "epoch": 4959} {"train_loss": -26.347503662109375, "global_step": 411606, "epoch": 4959} {"train_loss": -26.548547744750977, "global_step": 411607, "epoch": 4959} {"train_loss": -26.417890548706055, "global_step": 411608, "epoch": 4959} {"train_loss": -26.328977584838867, "global_step": 411609, "epoch": 4959} {"train_loss": -26.324872970581055, "global_step": 411610, "epoch": 4959} {"train_loss": -26.45469093322754, "global_step": 411611, "epoch": 4959} {"train_loss": -26.872028350830078, "global_step": 411612, "epoch": 4959} {"train_loss": -26.865676879882812, "global_step": 411613, "epoch": 4959} {"train_loss": -26.641843795776367, "global_step": 411614, "epoch": 4959} {"train_loss": -26.767898559570312, "global_step": 411615, "epoch": 4959} {"train_loss": -26.6959228515625, "global_step": 411616, "epoch": 4959} {"train_loss": -26.531665802001953, "global_step": 411617, "epoch": 4959} {"train_loss": -26.535404205322266, "global_step": 411618, "epoch": 4959} {"train_loss": -26.442651748657227, "global_step": 411619, "epoch": 4959} {"train_loss": -26.973947525024414, "global_step": 411620, "epoch": 4959} {"train_loss": -26.470550537109375, "global_step": 411621, "epoch": 4959} {"train_loss": -27.105432510375977, "global_step": 411622, "epoch": 4959} {"train_loss": -26.575946807861328, "global_step": 411623, "epoch": 4959} {"train_loss": -26.52817726135254, "global_step": 411624, "epoch": 4959} {"train_loss": -26.893049240112305, "global_step": 411625, "epoch": 4959} {"train_loss": -26.919677734375, "global_step": 411626, "epoch": 4959} {"train_loss": -26.724517822265625, "global_step": 411627, "epoch": 4959} {"train_loss": -26.35623550415039, "global_step": 411628, "epoch": 4959} {"train_loss": -26.920129776000977, "global_step": 411629, "epoch": 4959} {"train_loss": -27.028461456298828, "global_step": 411630, "epoch": 4959} {"train_loss": -26.61128044128418, "global_step": 411631, "epoch": 4959} {"train_loss": -27.091638565063477, "global_step": 411632, "epoch": 4959} {"train_loss": -26.99258804321289, "global_step": 411633, "epoch": 4959} {"train_loss": -26.827600479125977, "global_step": 411634, "epoch": 4959} {"train_loss": -26.609832763671875, "global_step": 411635, "epoch": 4959} {"train_loss": -26.5330810546875, "global_step": 411636, "epoch": 4959} {"train_loss": -26.589935302734375, "global_step": 411637, "epoch": 4959} {"train_loss": -27.12788200378418, "global_step": 411638, "epoch": 4959} {"train_loss": -26.903791427612305, "global_step": 411639, "epoch": 4959} {"train_loss": -26.761157989501953, "global_step": 411640, "epoch": 4959} {"train_loss": -26.475601196289062, "global_step": 411641, "epoch": 4959} {"train_loss": -26.57421875, "global_step": 411642, "epoch": 4959} {"train_loss": -26.992361068725586, "global_step": 411643, "epoch": 4959} {"train_loss": -26.839502334594727, "global_step": 411644, "epoch": 4959} {"train_loss": -26.748538970947266, "global_step": 411645, "epoch": 4959} {"train_loss": -26.796667098999023, "global_step": 411646, "epoch": 4959} {"train_loss": -26.967029571533203, "global_step": 411647, "epoch": 4959} {"train_loss": -26.835346221923828, "global_step": 411648, "epoch": 4959} {"train_loss": -26.80173683166504, "global_step": 411649, "epoch": 4959} {"train_loss": -26.9744815826416, "global_step": 411650, "epoch": 4959} {"train_loss": -26.223356246948242, "global_step": 411651, "epoch": 4959} {"train_loss": -26.83099937438965, "global_step": 411652, "epoch": 4959} {"train_loss": -26.763341903686523, "global_step": 411653, "epoch": 4959} {"train_loss": -26.462860107421875, "global_step": 411654, "epoch": 4959} {"train_loss": -26.58650016784668, "global_step": 411655, "epoch": 4959} {"train_loss": -26.564489364624023, "global_step": 411656, "epoch": 4959} {"train_loss": -26.7606201171875, "global_step": 411657, "epoch": 4959} {"train_loss": -26.72063636779785, "global_step": 411658, "epoch": 4959} {"train_loss": -27.02935218811035, "global_step": 411659, "epoch": 4959} {"train_loss": -26.540693283081055, "global_step": 411660, "epoch": 4959} {"train_loss": -26.402149200439453, "global_step": 411661, "epoch": 4959} {"train_loss": -26.349145889282227, "global_step": 411662, "epoch": 4959} {"train_loss": -26.38763427734375, "global_step": 411663, "epoch": 4959} {"train_loss": -26.73468017578125, "global_step": 411664, "epoch": 4959} {"train_loss": -26.38277244567871, "global_step": 411665, "epoch": 4959} {"train_loss": -26.301801681518555, "global_step": 411666, "epoch": 4959} {"train_loss": -26.746540069580078, "global_step": 411667, "epoch": 4959} {"train_loss": -26.515295028686523, "global_step": 411668, "epoch": 4959} {"train_loss": -26.21758460998535, "global_step": 411669, "epoch": 4959} {"train_loss": -26.531721115112305, "global_step": 411670, "epoch": 4959} {"train_loss": -25.87158203125, "global_step": 411671, "epoch": 4959} {"train_loss": -26.013568878173828, "global_step": 411672, "epoch": 4959} {"train_loss": -26.429189682006836, "global_step": 411673, "epoch": 4959} {"train_loss": -26.894901275634766, "global_step": 411674, "epoch": 4959} {"train_loss": -26.562580108642578, "global_step": 411675, "epoch": 4959} {"train_loss": -26.805164337158203, "global_step": 411676, "epoch": 4959} {"train_loss": -26.555896759033203, "global_step": 411677, "epoch": 4959} {"train_loss": -26.792770385742188, "global_step": 411678, "epoch": 4959} {"train_loss": -26.599619141544203, "global_step": 411679, "epoch": 4959, "val_loss": 6471167.0} {"train_loss": -26.3212947845459, "global_step": 411680, "epoch": 4960} {"train_loss": -26.31534194946289, "global_step": 411681, "epoch": 4960} {"train_loss": -26.224822998046875, "global_step": 411682, "epoch": 4960} {"train_loss": -26.263086318969727, "global_step": 411683, "epoch": 4960} {"train_loss": -26.20244789123535, "global_step": 411684, "epoch": 4960} {"train_loss": -26.853178024291992, "global_step": 411685, "epoch": 4960} {"train_loss": -26.486536026000977, "global_step": 411686, "epoch": 4960} {"train_loss": -26.798315048217773, "global_step": 411687, "epoch": 4960} {"train_loss": -26.575361251831055, "global_step": 411688, "epoch": 4960} {"train_loss": -26.79817771911621, "global_step": 411689, "epoch": 4960} {"train_loss": -26.73834228515625, "global_step": 411690, "epoch": 4960} {"train_loss": -26.597763061523438, "global_step": 411691, "epoch": 4960} {"train_loss": -26.573339462280273, "global_step": 411692, "epoch": 4960} {"train_loss": -26.630041122436523, "global_step": 411693, "epoch": 4960} {"train_loss": -26.4682559967041, "global_step": 411694, "epoch": 4960} {"train_loss": -26.669193267822266, "global_step": 411695, "epoch": 4960} {"train_loss": -26.5986385345459, "global_step": 411696, "epoch": 4960} {"train_loss": -26.7352294921875, "global_step": 411697, "epoch": 4960} {"train_loss": -26.745105743408203, "global_step": 411698, "epoch": 4960} {"train_loss": -27.005186080932617, "global_step": 411699, "epoch": 4960} {"train_loss": -26.616559982299805, "global_step": 411700, "epoch": 4960} {"train_loss": -26.8327579498291, "global_step": 411701, "epoch": 4960} {"train_loss": -26.758758544921875, "global_step": 411702, "epoch": 4960} {"train_loss": -26.602792739868164, "global_step": 411703, "epoch": 4960} {"train_loss": -26.693897247314453, "global_step": 411704, "epoch": 4960} {"train_loss": -26.979068756103516, "global_step": 411705, "epoch": 4960} {"train_loss": -26.905500411987305, "global_step": 411706, "epoch": 4960} {"train_loss": -27.107629776000977, "global_step": 411707, "epoch": 4960} {"train_loss": -26.78215980529785, "global_step": 411708, "epoch": 4960} {"train_loss": -26.880985260009766, "global_step": 411709, "epoch": 4960} {"train_loss": -26.5331974029541, "global_step": 411710, "epoch": 4960} {"train_loss": -26.7639217376709, "global_step": 411711, "epoch": 4960} {"train_loss": -26.90093994140625, "global_step": 411712, "epoch": 4960} {"train_loss": -26.785688400268555, "global_step": 411713, "epoch": 4960} {"train_loss": -27.00946617126465, "global_step": 411714, "epoch": 4960} {"train_loss": -27.23026466369629, "global_step": 411715, "epoch": 4960} {"train_loss": -26.666967391967773, "global_step": 411716, "epoch": 4960} {"train_loss": -26.879074096679688, "global_step": 411717, "epoch": 4960} {"train_loss": -26.564559936523438, "global_step": 411718, "epoch": 4960} {"train_loss": -26.87428855895996, "global_step": 411719, "epoch": 4960} {"train_loss": -27.009775161743164, "global_step": 411720, "epoch": 4960} {"train_loss": -26.920654296875, "global_step": 411721, "epoch": 4960} {"train_loss": -27.30368995666504, "global_step": 411722, "epoch": 4960} {"train_loss": -26.7230224609375, "global_step": 411723, "epoch": 4960} {"train_loss": -27.035749435424805, "global_step": 411724, "epoch": 4960} {"train_loss": -27.12497329711914, "global_step": 411725, "epoch": 4960} {"train_loss": -26.8864803314209, "global_step": 411726, "epoch": 4960} {"train_loss": -26.88177490234375, "global_step": 411727, "epoch": 4960} {"train_loss": -26.963581085205078, "global_step": 411728, "epoch": 4960} {"train_loss": -26.547943115234375, "global_step": 411729, "epoch": 4960} {"train_loss": -26.628442764282227, "global_step": 411730, "epoch": 4960} {"train_loss": -27.06342887878418, "global_step": 411731, "epoch": 4960} {"train_loss": -26.762155532836914, "global_step": 411732, "epoch": 4960} {"train_loss": -26.98443031311035, "global_step": 411733, "epoch": 4960} {"train_loss": -26.611087799072266, "global_step": 411734, "epoch": 4960} {"train_loss": -26.574115753173828, "global_step": 411735, "epoch": 4960} {"train_loss": -26.51681900024414, "global_step": 411736, "epoch": 4960} {"train_loss": -26.61606216430664, "global_step": 411737, "epoch": 4960} {"train_loss": -26.93434715270996, "global_step": 411738, "epoch": 4960} {"train_loss": -27.042661666870117, "global_step": 411739, "epoch": 4960} {"train_loss": -26.82681655883789, "global_step": 411740, "epoch": 4960} {"train_loss": -26.70429801940918, "global_step": 411741, "epoch": 4960} {"train_loss": -26.376667022705078, "global_step": 411742, "epoch": 4960} {"train_loss": -26.482202529907227, "global_step": 411743, "epoch": 4960} {"train_loss": -26.589405059814453, "global_step": 411744, "epoch": 4960} {"train_loss": -26.54062271118164, "global_step": 411745, "epoch": 4960} {"train_loss": -27.0512752532959, "global_step": 411746, "epoch": 4960} {"train_loss": -26.98883628845215, "global_step": 411747, "epoch": 4960} {"train_loss": -26.820363998413086, "global_step": 411748, "epoch": 4960} {"train_loss": -27.238271713256836, "global_step": 411749, "epoch": 4960} {"train_loss": -26.890478134155273, "global_step": 411750, "epoch": 4960} {"train_loss": -26.7486572265625, "global_step": 411751, "epoch": 4960} {"train_loss": -26.725967407226562, "global_step": 411752, "epoch": 4960} {"train_loss": -26.952157974243164, "global_step": 411753, "epoch": 4960} {"train_loss": -26.556808471679688, "global_step": 411754, "epoch": 4960} {"train_loss": -26.680591583251953, "global_step": 411755, "epoch": 4960} {"train_loss": -26.860197067260742, "global_step": 411756, "epoch": 4960} {"train_loss": -26.339847564697266, "global_step": 411757, "epoch": 4960} {"train_loss": -26.19965934753418, "global_step": 411758, "epoch": 4960} {"train_loss": -26.665746688842773, "global_step": 411759, "epoch": 4960} {"train_loss": -26.7960262298584, "global_step": 411760, "epoch": 4960} {"train_loss": -26.806228637695312, "global_step": 411761, "epoch": 4960} {"train_loss": -26.7579872866711, "global_step": 411762, "epoch": 4960, "val_loss": 6487777.0} {"train_loss": -26.395475387573242, "global_step": 411763, "epoch": 4961} {"train_loss": -26.735153198242188, "global_step": 411764, "epoch": 4961} {"train_loss": -26.909774780273438, "global_step": 411765, "epoch": 4961} {"train_loss": -26.433507919311523, "global_step": 411766, "epoch": 4961} {"train_loss": -26.31879234313965, "global_step": 411767, "epoch": 4961} {"train_loss": -26.0794620513916, "global_step": 411768, "epoch": 4961} {"train_loss": -26.326740264892578, "global_step": 411769, "epoch": 4961} {"train_loss": -26.5247745513916, "global_step": 411770, "epoch": 4961} {"train_loss": -26.222431182861328, "global_step": 411771, "epoch": 4961} {"train_loss": -26.565317153930664, "global_step": 411772, "epoch": 4961} {"train_loss": -26.55665397644043, "global_step": 411773, "epoch": 4961} {"train_loss": -26.515338897705078, "global_step": 411774, "epoch": 4961} {"train_loss": -26.657459259033203, "global_step": 411775, "epoch": 4961} {"train_loss": -26.568601608276367, "global_step": 411776, "epoch": 4961} {"train_loss": -26.959217071533203, "global_step": 411777, "epoch": 4961} {"train_loss": -26.472579956054688, "global_step": 411778, "epoch": 4961} {"train_loss": -26.591236114501953, "global_step": 411779, "epoch": 4961} {"train_loss": -26.465055465698242, "global_step": 411780, "epoch": 4961} {"train_loss": -26.72492790222168, "global_step": 411781, "epoch": 4961} {"train_loss": -26.333881378173828, "global_step": 411782, "epoch": 4961} {"train_loss": -26.547256469726562, "global_step": 411783, "epoch": 4961} {"train_loss": -27.184112548828125, "global_step": 411784, "epoch": 4961} {"train_loss": -26.85235595703125, "global_step": 411785, "epoch": 4961} {"train_loss": -26.846633911132812, "global_step": 411786, "epoch": 4961} {"train_loss": -26.540109634399414, "global_step": 411787, "epoch": 4961} {"train_loss": -26.85566520690918, "global_step": 411788, "epoch": 4961} {"train_loss": -26.752338409423828, "global_step": 411789, "epoch": 4961} {"train_loss": -26.883710861206055, "global_step": 411790, "epoch": 4961} {"train_loss": -26.867734909057617, "global_step": 411791, "epoch": 4961} {"train_loss": -26.902374267578125, "global_step": 411792, "epoch": 4961} {"train_loss": -26.454946517944336, "global_step": 411793, "epoch": 4961} {"train_loss": -26.6439266204834, "global_step": 411794, "epoch": 4961} {"train_loss": -26.917224884033203, "global_step": 411795, "epoch": 4961} {"train_loss": -27.083587646484375, "global_step": 411796, "epoch": 4961} {"train_loss": -27.064773559570312, "global_step": 411797, "epoch": 4961} {"train_loss": -26.974149703979492, "global_step": 411798, "epoch": 4961} {"train_loss": -26.84124755859375, "global_step": 411799, "epoch": 4961} {"train_loss": -26.730361938476562, "global_step": 411800, "epoch": 4961} {"train_loss": -26.6246337890625, "global_step": 411801, "epoch": 4961} {"train_loss": -26.90028953552246, "global_step": 411802, "epoch": 4961} {"train_loss": -26.793659210205078, "global_step": 411803, "epoch": 4961} {"train_loss": -26.614038467407227, "global_step": 411804, "epoch": 4961} {"train_loss": -26.52835464477539, "global_step": 411805, "epoch": 4961} {"train_loss": -26.905664443969727, "global_step": 411806, "epoch": 4961} {"train_loss": -26.67401123046875, "global_step": 411807, "epoch": 4961} {"train_loss": -27.06526756286621, "global_step": 411808, "epoch": 4961} {"train_loss": -26.815969467163086, "global_step": 411809, "epoch": 4961} {"train_loss": -27.309070587158203, "global_step": 411810, "epoch": 4961} {"train_loss": -26.425302505493164, "global_step": 411811, "epoch": 4961} {"train_loss": -26.813329696655273, "global_step": 411812, "epoch": 4961} {"train_loss": -26.603063583374023, "global_step": 411813, "epoch": 4961} {"train_loss": -27.07866859436035, "global_step": 411814, "epoch": 4961} {"train_loss": -26.92066764831543, "global_step": 411815, "epoch": 4961} {"train_loss": -26.66803550720215, "global_step": 411816, "epoch": 4961} {"train_loss": -26.649906158447266, "global_step": 411817, "epoch": 4961} {"train_loss": -26.5224666595459, "global_step": 411818, "epoch": 4961} {"train_loss": -26.675983428955078, "global_step": 411819, "epoch": 4961} {"train_loss": -27.122119903564453, "global_step": 411820, "epoch": 4961} {"train_loss": -27.041913986206055, "global_step": 411821, "epoch": 4961} {"train_loss": -26.823644638061523, "global_step": 411822, "epoch": 4961} {"train_loss": -26.81705093383789, "global_step": 411823, "epoch": 4961} {"train_loss": -26.815326690673828, "global_step": 411824, "epoch": 4961} {"train_loss": -26.538732528686523, "global_step": 411825, "epoch": 4961} {"train_loss": -26.684850692749023, "global_step": 411826, "epoch": 4961} {"train_loss": -26.532562255859375, "global_step": 411827, "epoch": 4961} {"train_loss": -27.055130004882812, "global_step": 411828, "epoch": 4961} {"train_loss": -26.778717041015625, "global_step": 411829, "epoch": 4961} {"train_loss": -26.871753692626953, "global_step": 411830, "epoch": 4961} {"train_loss": -26.485015869140625, "global_step": 411831, "epoch": 4961} {"train_loss": -26.7294979095459, "global_step": 411832, "epoch": 4961} {"train_loss": -26.677026748657227, "global_step": 411833, "epoch": 4961} {"train_loss": -27.170103073120117, "global_step": 411834, "epoch": 4961} {"train_loss": -26.745040893554688, "global_step": 411835, "epoch": 4961} {"train_loss": -26.9372501373291, "global_step": 411836, "epoch": 4961} {"train_loss": -26.674711227416992, "global_step": 411837, "epoch": 4961} {"train_loss": -27.0095272064209, "global_step": 411838, "epoch": 4961} {"train_loss": -26.63397789001465, "global_step": 411839, "epoch": 4961} {"train_loss": -26.8074893951416, "global_step": 411840, "epoch": 4961} {"train_loss": -26.908370971679688, "global_step": 411841, "epoch": 4961} {"train_loss": -26.9686222076416, "global_step": 411842, "epoch": 4961} {"train_loss": -26.852096557617188, "global_step": 411843, "epoch": 4961} {"train_loss": -26.681243896484375, "global_step": 411844, "epoch": 4961} {"train_loss": -26.73778453505183, "global_step": 411845, "epoch": 4961, "val_loss": 6495106.5} {"train_loss": -26.412113189697266, "global_step": 411846, "epoch": 4962} {"train_loss": -26.24757957458496, "global_step": 411847, "epoch": 4962} {"train_loss": -26.850019454956055, "global_step": 411848, "epoch": 4962} {"train_loss": -26.465784072875977, "global_step": 411849, "epoch": 4962} {"train_loss": -25.938207626342773, "global_step": 411850, "epoch": 4962} {"train_loss": -26.179868698120117, "global_step": 411851, "epoch": 4962} {"train_loss": -26.493146896362305, "global_step": 411852, "epoch": 4962} {"train_loss": -25.798065185546875, "global_step": 411853, "epoch": 4962} {"train_loss": -26.25798988342285, "global_step": 411854, "epoch": 4962} {"train_loss": -25.882238388061523, "global_step": 411855, "epoch": 4962} {"train_loss": -26.8006534576416, "global_step": 411856, "epoch": 4962} {"train_loss": -26.53516960144043, "global_step": 411857, "epoch": 4962} {"train_loss": -26.312103271484375, "global_step": 411858, "epoch": 4962} {"train_loss": -26.388309478759766, "global_step": 411859, "epoch": 4962} {"train_loss": -26.079206466674805, "global_step": 411860, "epoch": 4962} {"train_loss": -25.958341598510742, "global_step": 411861, "epoch": 4962} {"train_loss": -26.702056884765625, "global_step": 411862, "epoch": 4962} {"train_loss": -26.862701416015625, "global_step": 411863, "epoch": 4962} {"train_loss": -26.61248779296875, "global_step": 411864, "epoch": 4962} {"train_loss": -26.3068790435791, "global_step": 411865, "epoch": 4962} {"train_loss": -26.68751335144043, "global_step": 411866, "epoch": 4962} {"train_loss": -26.38986587524414, "global_step": 411867, "epoch": 4962} {"train_loss": -26.967172622680664, "global_step": 411868, "epoch": 4962} {"train_loss": -26.545042037963867, "global_step": 411869, "epoch": 4962} {"train_loss": -26.55128288269043, "global_step": 411870, "epoch": 4962} {"train_loss": -26.5506591796875, "global_step": 411871, "epoch": 4962} {"train_loss": -26.693775177001953, "global_step": 411872, "epoch": 4962} {"train_loss": -26.628137588500977, "global_step": 411873, "epoch": 4962} {"train_loss": -26.52545738220215, "global_step": 411874, "epoch": 4962} {"train_loss": -26.878284454345703, "global_step": 411875, "epoch": 4962} {"train_loss": -26.646909713745117, "global_step": 411876, "epoch": 4962} {"train_loss": -26.641162872314453, "global_step": 411877, "epoch": 4962} {"train_loss": -26.846973419189453, "global_step": 411878, "epoch": 4962} {"train_loss": -26.55584716796875, "global_step": 411879, "epoch": 4962} {"train_loss": -26.74972915649414, "global_step": 411880, "epoch": 4962} {"train_loss": -26.793668746948242, "global_step": 411881, "epoch": 4962} {"train_loss": -26.936389923095703, "global_step": 411882, "epoch": 4962} {"train_loss": -26.860071182250977, "global_step": 411883, "epoch": 4962} {"train_loss": -26.868988037109375, "global_step": 411884, "epoch": 4962} {"train_loss": -26.727148056030273, "global_step": 411885, "epoch": 4962} {"train_loss": -26.828414916992188, "global_step": 411886, "epoch": 4962} {"train_loss": -26.74488639831543, "global_step": 411887, "epoch": 4962} {"train_loss": -26.545623779296875, "global_step": 411888, "epoch": 4962} {"train_loss": -26.864532470703125, "global_step": 411889, "epoch": 4962} {"train_loss": -26.89630126953125, "global_step": 411890, "epoch": 4962} {"train_loss": -26.972009658813477, "global_step": 411891, "epoch": 4962} {"train_loss": -26.894495010375977, "global_step": 411892, "epoch": 4962} {"train_loss": -27.045766830444336, "global_step": 411893, "epoch": 4962} {"train_loss": -26.748945236206055, "global_step": 411894, "epoch": 4962} {"train_loss": -26.91139793395996, "global_step": 411895, "epoch": 4962} {"train_loss": -26.592178344726562, "global_step": 411896, "epoch": 4962} {"train_loss": -26.88276481628418, "global_step": 411897, "epoch": 4962} {"train_loss": -27.029468536376953, "global_step": 411898, "epoch": 4962} {"train_loss": -26.594018936157227, "global_step": 411899, "epoch": 4962} {"train_loss": -26.895185470581055, "global_step": 411900, "epoch": 4962} {"train_loss": -26.33138084411621, "global_step": 411901, "epoch": 4962} {"train_loss": -25.865646362304688, "global_step": 411902, "epoch": 4962} {"train_loss": -26.56611442565918, "global_step": 411903, "epoch": 4962} {"train_loss": -26.340063095092773, "global_step": 411904, "epoch": 4962} {"train_loss": -26.94829750061035, "global_step": 411905, "epoch": 4962} {"train_loss": -26.947357177734375, "global_step": 411906, "epoch": 4962} {"train_loss": -26.859182357788086, "global_step": 411907, "epoch": 4962} {"train_loss": -26.439319610595703, "global_step": 411908, "epoch": 4962} {"train_loss": -26.537878036499023, "global_step": 411909, "epoch": 4962} {"train_loss": -26.847951889038086, "global_step": 411910, "epoch": 4962} {"train_loss": -26.88690757751465, "global_step": 411911, "epoch": 4962} {"train_loss": -26.467254638671875, "global_step": 411912, "epoch": 4962} {"train_loss": -26.62794303894043, "global_step": 411913, "epoch": 4962} {"train_loss": -26.641864776611328, "global_step": 411914, "epoch": 4962} {"train_loss": -26.86053466796875, "global_step": 411915, "epoch": 4962} {"train_loss": -27.045400619506836, "global_step": 411916, "epoch": 4962} {"train_loss": -26.832849502563477, "global_step": 411917, "epoch": 4962} {"train_loss": -26.871946334838867, "global_step": 411918, "epoch": 4962} {"train_loss": -26.52439308166504, "global_step": 411919, "epoch": 4962} {"train_loss": -27.160123825073242, "global_step": 411920, "epoch": 4962} {"train_loss": -26.84114646911621, "global_step": 411921, "epoch": 4962} {"train_loss": -26.67789649963379, "global_step": 411922, "epoch": 4962} {"train_loss": -26.707275390625, "global_step": 411923, "epoch": 4962} {"train_loss": -26.928930282592773, "global_step": 411924, "epoch": 4962} {"train_loss": -26.770755767822266, "global_step": 411925, "epoch": 4962} {"train_loss": -26.614355087280273, "global_step": 411926, "epoch": 4962} {"train_loss": -27.1538143157959, "global_step": 411927, "epoch": 4962} {"train_loss": -26.640100594026496, "global_step": 411928, "epoch": 4962, "val_loss": 6448932.0} {"train_loss": -25.45442771911621, "global_step": 411929, "epoch": 4963} {"train_loss": -25.06299591064453, "global_step": 411930, "epoch": 4963} {"train_loss": -25.980329513549805, "global_step": 411931, "epoch": 4963} {"train_loss": -25.656848907470703, "global_step": 411932, "epoch": 4963} {"train_loss": -25.91800308227539, "global_step": 411933, "epoch": 4963} {"train_loss": -25.9705867767334, "global_step": 411934, "epoch": 4963} {"train_loss": -26.010412216186523, "global_step": 411935, "epoch": 4963} {"train_loss": -26.610471725463867, "global_step": 411936, "epoch": 4963} {"train_loss": -25.98799705505371, "global_step": 411937, "epoch": 4963} {"train_loss": -26.368316650390625, "global_step": 411938, "epoch": 4963} {"train_loss": -26.60774040222168, "global_step": 411939, "epoch": 4963} {"train_loss": -26.55783462524414, "global_step": 411940, "epoch": 4963} {"train_loss": -26.691125869750977, "global_step": 411941, "epoch": 4963} {"train_loss": -26.65461540222168, "global_step": 411942, "epoch": 4963} {"train_loss": -26.3319034576416, "global_step": 411943, "epoch": 4963} {"train_loss": -26.73917579650879, "global_step": 411944, "epoch": 4963} {"train_loss": -26.46869468688965, "global_step": 411945, "epoch": 4963} {"train_loss": -26.384506225585938, "global_step": 411946, "epoch": 4963} {"train_loss": -26.542322158813477, "global_step": 411947, "epoch": 4963} {"train_loss": -26.74554443359375, "global_step": 411948, "epoch": 4963} {"train_loss": -26.599878311157227, "global_step": 411949, "epoch": 4963} {"train_loss": -26.603086471557617, "global_step": 411950, "epoch": 4963} {"train_loss": -26.683517456054688, "global_step": 411951, "epoch": 4963} {"train_loss": -26.74946403503418, "global_step": 411952, "epoch": 4963} {"train_loss": -26.52947998046875, "global_step": 411953, "epoch": 4963} {"train_loss": -26.616230010986328, "global_step": 411954, "epoch": 4963} {"train_loss": -26.95442771911621, "global_step": 411955, "epoch": 4963} {"train_loss": -26.600677490234375, "global_step": 411956, "epoch": 4963} {"train_loss": -26.748010635375977, "global_step": 411957, "epoch": 4963} {"train_loss": -26.69038200378418, "global_step": 411958, "epoch": 4963} {"train_loss": -26.878952026367188, "global_step": 411959, "epoch": 4963} {"train_loss": -26.664587020874023, "global_step": 411960, "epoch": 4963} {"train_loss": -26.970544815063477, "global_step": 411961, "epoch": 4963} {"train_loss": -27.015583038330078, "global_step": 411962, "epoch": 4963} {"train_loss": -26.5775089263916, "global_step": 411963, "epoch": 4963} {"train_loss": -27.032855987548828, "global_step": 411964, "epoch": 4963} {"train_loss": -27.017602920532227, "global_step": 411965, "epoch": 4963} {"train_loss": -26.906518936157227, "global_step": 411966, "epoch": 4963} {"train_loss": -27.288864135742188, "global_step": 411967, "epoch": 4963} {"train_loss": -26.766019821166992, "global_step": 411968, "epoch": 4963} {"train_loss": -26.5804443359375, "global_step": 411969, "epoch": 4963} {"train_loss": -26.920825958251953, "global_step": 411970, "epoch": 4963} {"train_loss": -26.84914207458496, "global_step": 411971, "epoch": 4963} {"train_loss": -26.450714111328125, "global_step": 411972, "epoch": 4963} {"train_loss": -26.628198623657227, "global_step": 411973, "epoch": 4963} {"train_loss": -26.428848266601562, "global_step": 411974, "epoch": 4963} {"train_loss": -26.67974853515625, "global_step": 411975, "epoch": 4963} {"train_loss": -26.84183692932129, "global_step": 411976, "epoch": 4963} {"train_loss": -26.912677764892578, "global_step": 411977, "epoch": 4963} {"train_loss": -27.060489654541016, "global_step": 411978, "epoch": 4963} {"train_loss": -26.8421688079834, "global_step": 411979, "epoch": 4963} {"train_loss": -26.866153717041016, "global_step": 411980, "epoch": 4963} {"train_loss": -26.74793815612793, "global_step": 411981, "epoch": 4963} {"train_loss": -26.793439865112305, "global_step": 411982, "epoch": 4963} {"train_loss": -27.328216552734375, "global_step": 411983, "epoch": 4963} {"train_loss": -26.93255615234375, "global_step": 411984, "epoch": 4963} {"train_loss": -26.679380416870117, "global_step": 411985, "epoch": 4963} {"train_loss": -26.770923614501953, "global_step": 411986, "epoch": 4963} {"train_loss": -26.716541290283203, "global_step": 411987, "epoch": 4963} {"train_loss": -26.696496963500977, "global_step": 411988, "epoch": 4963} {"train_loss": -26.740427017211914, "global_step": 411989, "epoch": 4963} {"train_loss": -26.835159301757812, "global_step": 411990, "epoch": 4963} {"train_loss": -27.113361358642578, "global_step": 411991, "epoch": 4963} {"train_loss": -26.909372329711914, "global_step": 411992, "epoch": 4963} {"train_loss": -26.753652572631836, "global_step": 411993, "epoch": 4963} {"train_loss": -26.74346923828125, "global_step": 411994, "epoch": 4963} {"train_loss": -26.92384147644043, "global_step": 411995, "epoch": 4963} {"train_loss": -26.704681396484375, "global_step": 411996, "epoch": 4963} {"train_loss": -26.903400421142578, "global_step": 411997, "epoch": 4963} {"train_loss": -27.072498321533203, "global_step": 411998, "epoch": 4963} {"train_loss": -27.025991439819336, "global_step": 411999, "epoch": 4963} {"train_loss": -26.631845474243164, "global_step": 412000, "epoch": 4963} {"train_loss": -26.53461265563965, "global_step": 412001, "epoch": 4963} {"train_loss": -26.798688888549805, "global_step": 412002, "epoch": 4963} {"train_loss": -26.6925048828125, "global_step": 412003, "epoch": 4963} {"train_loss": -26.346179962158203, "global_step": 412004, "epoch": 4963} {"train_loss": -26.6999568939209, "global_step": 412005, "epoch": 4963} {"train_loss": -26.62294578552246, "global_step": 412006, "epoch": 4963} {"train_loss": -26.78553581237793, "global_step": 412007, "epoch": 4963} {"train_loss": -26.549589157104492, "global_step": 412008, "epoch": 4963} {"train_loss": -26.818262100219727, "global_step": 412009, "epoch": 4963} {"train_loss": -27.123992919921875, "global_step": 412010, "epoch": 4963} {"train_loss": -26.641440150249434, "global_step": 412011, "epoch": 4963, "val_loss": 6435150.0} {"train_loss": -25.581087112426758, "global_step": 412012, "epoch": 4964} {"train_loss": -25.624378204345703, "global_step": 412013, "epoch": 4964} {"train_loss": -26.29262351989746, "global_step": 412014, "epoch": 4964} {"train_loss": -25.624526977539062, "global_step": 412015, "epoch": 4964} {"train_loss": -26.1153564453125, "global_step": 412016, "epoch": 4964} {"train_loss": -26.543996810913086, "global_step": 412017, "epoch": 4964} {"train_loss": -25.95660972595215, "global_step": 412018, "epoch": 4964} {"train_loss": -26.740909576416016, "global_step": 412019, "epoch": 4964} {"train_loss": -26.524078369140625, "global_step": 412020, "epoch": 4964} {"train_loss": -26.234846115112305, "global_step": 412021, "epoch": 4964} {"train_loss": -26.220319747924805, "global_step": 412022, "epoch": 4964} {"train_loss": -26.702733993530273, "global_step": 412023, "epoch": 4964} {"train_loss": -26.499603271484375, "global_step": 412024, "epoch": 4964} {"train_loss": -26.617938995361328, "global_step": 412025, "epoch": 4964} {"train_loss": -26.783918380737305, "global_step": 412026, "epoch": 4964} {"train_loss": -26.465097427368164, "global_step": 412027, "epoch": 4964} {"train_loss": -26.21897315979004, "global_step": 412028, "epoch": 4964} {"train_loss": -26.5972900390625, "global_step": 412029, "epoch": 4964} {"train_loss": -26.572376251220703, "global_step": 412030, "epoch": 4964} {"train_loss": -26.550695419311523, "global_step": 412031, "epoch": 4964} {"train_loss": -26.53519058227539, "global_step": 412032, "epoch": 4964} {"train_loss": -26.52765464782715, "global_step": 412033, "epoch": 4964} {"train_loss": -26.606231689453125, "global_step": 412034, "epoch": 4964} {"train_loss": -26.528308868408203, "global_step": 412035, "epoch": 4964} {"train_loss": -26.917316436767578, "global_step": 412036, "epoch": 4964} {"train_loss": -26.85527992248535, "global_step": 412037, "epoch": 4964} {"train_loss": -26.59528923034668, "global_step": 412038, "epoch": 4964} {"train_loss": -27.223712921142578, "global_step": 412039, "epoch": 4964} {"train_loss": -26.952672958374023, "global_step": 412040, "epoch": 4964} {"train_loss": -26.52460289001465, "global_step": 412041, "epoch": 4964} {"train_loss": -26.8524169921875, "global_step": 412042, "epoch": 4964} {"train_loss": -26.868234634399414, "global_step": 412043, "epoch": 4964} {"train_loss": -26.815561294555664, "global_step": 412044, "epoch": 4964} {"train_loss": -27.198511123657227, "global_step": 412045, "epoch": 4964} {"train_loss": -26.956357955932617, "global_step": 412046, "epoch": 4964} {"train_loss": -27.027103424072266, "global_step": 412047, "epoch": 4964} {"train_loss": -26.991418838500977, "global_step": 412048, "epoch": 4964} {"train_loss": -27.01651954650879, "global_step": 412049, "epoch": 4964} {"train_loss": -26.862863540649414, "global_step": 412050, "epoch": 4964} {"train_loss": -26.45657730102539, "global_step": 412051, "epoch": 4964} {"train_loss": -26.50373649597168, "global_step": 412052, "epoch": 4964} {"train_loss": -26.5654296875, "global_step": 412053, "epoch": 4964} {"train_loss": -26.55756187438965, "global_step": 412054, "epoch": 4964} {"train_loss": -27.027984619140625, "global_step": 412055, "epoch": 4964} {"train_loss": -26.6027774810791, "global_step": 412056, "epoch": 4964} {"train_loss": -27.171279907226562, "global_step": 412057, "epoch": 4964} {"train_loss": -26.90757179260254, "global_step": 412058, "epoch": 4964} {"train_loss": -26.67878532409668, "global_step": 412059, "epoch": 4964} {"train_loss": -26.34621238708496, "global_step": 412060, "epoch": 4964} {"train_loss": -26.758092880249023, "global_step": 412061, "epoch": 4964} {"train_loss": -26.414417266845703, "global_step": 412062, "epoch": 4964} {"train_loss": -26.524744033813477, "global_step": 412063, "epoch": 4964} {"train_loss": -26.5718994140625, "global_step": 412064, "epoch": 4964} {"train_loss": -27.0224666595459, "global_step": 412065, "epoch": 4964} {"train_loss": -26.954227447509766, "global_step": 412066, "epoch": 4964} {"train_loss": -26.923542022705078, "global_step": 412067, "epoch": 4964} {"train_loss": -26.997304916381836, "global_step": 412068, "epoch": 4964} {"train_loss": -26.938276290893555, "global_step": 412069, "epoch": 4964} {"train_loss": -26.867523193359375, "global_step": 412070, "epoch": 4964} {"train_loss": -26.66782569885254, "global_step": 412071, "epoch": 4964} {"train_loss": -26.679479598999023, "global_step": 412072, "epoch": 4964} {"train_loss": -26.878070831298828, "global_step": 412073, "epoch": 4964} {"train_loss": -26.626758575439453, "global_step": 412074, "epoch": 4964} {"train_loss": -26.7191104888916, "global_step": 412075, "epoch": 4964} {"train_loss": -26.858814239501953, "global_step": 412076, "epoch": 4964} {"train_loss": -26.635644912719727, "global_step": 412077, "epoch": 4964} {"train_loss": -26.50674819946289, "global_step": 412078, "epoch": 4964} {"train_loss": -26.858478546142578, "global_step": 412079, "epoch": 4964} {"train_loss": -26.70111656188965, "global_step": 412080, "epoch": 4964} {"train_loss": -26.55610466003418, "global_step": 412081, "epoch": 4964} {"train_loss": -26.935510635375977, "global_step": 412082, "epoch": 4964} {"train_loss": -27.124893188476562, "global_step": 412083, "epoch": 4964} {"train_loss": -27.022308349609375, "global_step": 412084, "epoch": 4964} {"train_loss": -26.74629020690918, "global_step": 412085, "epoch": 4964} {"train_loss": -26.914508819580078, "global_step": 412086, "epoch": 4964} {"train_loss": -26.951231002807617, "global_step": 412087, "epoch": 4964} {"train_loss": -26.8985652923584, "global_step": 412088, "epoch": 4964} {"train_loss": -26.4212589263916, "global_step": 412089, "epoch": 4964} {"train_loss": -27.020902633666992, "global_step": 412090, "epoch": 4964} {"train_loss": -27.0729923248291, "global_step": 412091, "epoch": 4964} {"train_loss": -26.9310245513916, "global_step": 412092, "epoch": 4964} {"train_loss": -26.801990509033203, "global_step": 412093, "epoch": 4964} {"train_loss": -26.682167742625776, "global_step": 412094, "epoch": 4964, "val_loss": 6494350.5} {"train_loss": -25.82337760925293, "global_step": 412095, "epoch": 4965} {"train_loss": -25.35997200012207, "global_step": 412096, "epoch": 4965} {"train_loss": -26.175024032592773, "global_step": 412097, "epoch": 4965} {"train_loss": -26.397602081298828, "global_step": 412098, "epoch": 4965} {"train_loss": -26.13471031188965, "global_step": 412099, "epoch": 4965} {"train_loss": -26.367643356323242, "global_step": 412100, "epoch": 4965} {"train_loss": -26.333759307861328, "global_step": 412101, "epoch": 4965} {"train_loss": -26.2692813873291, "global_step": 412102, "epoch": 4965} {"train_loss": -26.112146377563477, "global_step": 412103, "epoch": 4965} {"train_loss": -26.2691593170166, "global_step": 412104, "epoch": 4965} {"train_loss": -26.5400390625, "global_step": 412105, "epoch": 4965} {"train_loss": -26.540435791015625, "global_step": 412106, "epoch": 4965} {"train_loss": -26.53370475769043, "global_step": 412107, "epoch": 4965} {"train_loss": -26.28009605407715, "global_step": 412108, "epoch": 4965} {"train_loss": -26.599990844726562, "global_step": 412109, "epoch": 4965} {"train_loss": -26.43475914001465, "global_step": 412110, "epoch": 4965} {"train_loss": -26.619775772094727, "global_step": 412111, "epoch": 4965} {"train_loss": -26.824674606323242, "global_step": 412112, "epoch": 4965} {"train_loss": -26.38472557067871, "global_step": 412113, "epoch": 4965} {"train_loss": -26.81809425354004, "global_step": 412114, "epoch": 4965} {"train_loss": -27.030506134033203, "global_step": 412115, "epoch": 4965} {"train_loss": -26.597497940063477, "global_step": 412116, "epoch": 4965} {"train_loss": -26.88405418395996, "global_step": 412117, "epoch": 4965} {"train_loss": -26.718616485595703, "global_step": 412118, "epoch": 4965} {"train_loss": -26.548553466796875, "global_step": 412119, "epoch": 4965} {"train_loss": -26.62796401977539, "global_step": 412120, "epoch": 4965} {"train_loss": -26.34293556213379, "global_step": 412121, "epoch": 4965} {"train_loss": -26.217697143554688, "global_step": 412122, "epoch": 4965} {"train_loss": -26.655353546142578, "global_step": 412123, "epoch": 4965} {"train_loss": -26.653100967407227, "global_step": 412124, "epoch": 4965} {"train_loss": -26.528369903564453, "global_step": 412125, "epoch": 4965} {"train_loss": -26.517255783081055, "global_step": 412126, "epoch": 4965} {"train_loss": -26.742284774780273, "global_step": 412127, "epoch": 4965} {"train_loss": -26.415990829467773, "global_step": 412128, "epoch": 4965} {"train_loss": -26.476165771484375, "global_step": 412129, "epoch": 4965} {"train_loss": -26.20026969909668, "global_step": 412130, "epoch": 4965} {"train_loss": -26.7104434967041, "global_step": 412131, "epoch": 4965} {"train_loss": -26.635568618774414, "global_step": 412132, "epoch": 4965} {"train_loss": -27.08099365234375, "global_step": 412133, "epoch": 4965} {"train_loss": -26.543798446655273, "global_step": 412134, "epoch": 4965} {"train_loss": -26.631576538085938, "global_step": 412135, "epoch": 4965} {"train_loss": -26.9107666015625, "global_step": 412136, "epoch": 4965} {"train_loss": -26.905725479125977, "global_step": 412137, "epoch": 4965} {"train_loss": -26.873388290405273, "global_step": 412138, "epoch": 4965} {"train_loss": -26.847549438476562, "global_step": 412139, "epoch": 4965} {"train_loss": -26.654861450195312, "global_step": 412140, "epoch": 4965} {"train_loss": -27.00362205505371, "global_step": 412141, "epoch": 4965} {"train_loss": -26.876800537109375, "global_step": 412142, "epoch": 4965} {"train_loss": -26.89117431640625, "global_step": 412143, "epoch": 4965} {"train_loss": -26.98044776916504, "global_step": 412144, "epoch": 4965} {"train_loss": -26.60479164123535, "global_step": 412145, "epoch": 4965} {"train_loss": -27.019535064697266, "global_step": 412146, "epoch": 4965} {"train_loss": -27.070524215698242, "global_step": 412147, "epoch": 4965} {"train_loss": -26.459564208984375, "global_step": 412148, "epoch": 4965} {"train_loss": -26.78304100036621, "global_step": 412149, "epoch": 4965} {"train_loss": -26.7623291015625, "global_step": 412150, "epoch": 4965} {"train_loss": -26.9593563079834, "global_step": 412151, "epoch": 4965} {"train_loss": -26.439706802368164, "global_step": 412152, "epoch": 4965} {"train_loss": -26.60791015625, "global_step": 412153, "epoch": 4965} {"train_loss": -26.66083335876465, "global_step": 412154, "epoch": 4965} {"train_loss": -26.03177261352539, "global_step": 412155, "epoch": 4965} {"train_loss": -26.395816802978516, "global_step": 412156, "epoch": 4965} {"train_loss": -26.09490966796875, "global_step": 412157, "epoch": 4965} {"train_loss": -26.7857723236084, "global_step": 412158, "epoch": 4965} {"train_loss": -26.548248291015625, "global_step": 412159, "epoch": 4965} {"train_loss": -26.915903091430664, "global_step": 412160, "epoch": 4965} {"train_loss": -26.81538200378418, "global_step": 412161, "epoch": 4965} {"train_loss": -26.460912704467773, "global_step": 412162, "epoch": 4965} {"train_loss": -26.711050033569336, "global_step": 412163, "epoch": 4965} {"train_loss": -26.58282470703125, "global_step": 412164, "epoch": 4965} {"train_loss": -26.621540069580078, "global_step": 412165, "epoch": 4965} {"train_loss": -26.724157333374023, "global_step": 412166, "epoch": 4965} {"train_loss": -26.77860450744629, "global_step": 412167, "epoch": 4965} {"train_loss": -27.067697525024414, "global_step": 412168, "epoch": 4965} {"train_loss": -26.910322189331055, "global_step": 412169, "epoch": 4965} {"train_loss": -26.237287521362305, "global_step": 412170, "epoch": 4965} {"train_loss": -26.91952896118164, "global_step": 412171, "epoch": 4965} {"train_loss": -26.87127685546875, "global_step": 412172, "epoch": 4965} {"train_loss": -26.845991134643555, "global_step": 412173, "epoch": 4965} {"train_loss": -26.83174705505371, "global_step": 412174, "epoch": 4965} {"train_loss": -26.6789608001709, "global_step": 412175, "epoch": 4965} {"train_loss": -27.06073570251465, "global_step": 412176, "epoch": 4965} {"train_loss": -26.611983149884693, "global_step": 412177, "epoch": 4965, "val_loss": 6483246.0} {"train_loss": -25.48866844177246, "global_step": 412178, "epoch": 4966} {"train_loss": -26.091211318969727, "global_step": 412179, "epoch": 4966} {"train_loss": -25.683752059936523, "global_step": 412180, "epoch": 4966} {"train_loss": -25.01024627685547, "global_step": 412181, "epoch": 4966} {"train_loss": -25.4007568359375, "global_step": 412182, "epoch": 4966} {"train_loss": -25.8051815032959, "global_step": 412183, "epoch": 4966} {"train_loss": -26.284454345703125, "global_step": 412184, "epoch": 4966} {"train_loss": -25.32290267944336, "global_step": 412185, "epoch": 4966} {"train_loss": -26.244037628173828, "global_step": 412186, "epoch": 4966} {"train_loss": -25.800931930541992, "global_step": 412187, "epoch": 4966} {"train_loss": -25.549068450927734, "global_step": 412188, "epoch": 4966} {"train_loss": -25.777130126953125, "global_step": 412189, "epoch": 4966} {"train_loss": -26.398096084594727, "global_step": 412190, "epoch": 4966} {"train_loss": -25.955820083618164, "global_step": 412191, "epoch": 4966} {"train_loss": -26.1281795501709, "global_step": 412192, "epoch": 4966} {"train_loss": -26.09734535217285, "global_step": 412193, "epoch": 4966} {"train_loss": -26.452178955078125, "global_step": 412194, "epoch": 4966} {"train_loss": -26.122421264648438, "global_step": 412195, "epoch": 4966} {"train_loss": -26.66572380065918, "global_step": 412196, "epoch": 4966} {"train_loss": -26.318359375, "global_step": 412197, "epoch": 4966} {"train_loss": -26.375635147094727, "global_step": 412198, "epoch": 4966} {"train_loss": -26.15213966369629, "global_step": 412199, "epoch": 4966} {"train_loss": -26.148412704467773, "global_step": 412200, "epoch": 4966} {"train_loss": -26.222888946533203, "global_step": 412201, "epoch": 4966} {"train_loss": -26.48627281188965, "global_step": 412202, "epoch": 4966} {"train_loss": -26.03325843811035, "global_step": 412203, "epoch": 4966} {"train_loss": -26.463464736938477, "global_step": 412204, "epoch": 4966} {"train_loss": -26.5411434173584, "global_step": 412205, "epoch": 4966} {"train_loss": -26.515344619750977, "global_step": 412206, "epoch": 4966} {"train_loss": -26.55902099609375, "global_step": 412207, "epoch": 4966} {"train_loss": -26.639368057250977, "global_step": 412208, "epoch": 4966} {"train_loss": -26.61163330078125, "global_step": 412209, "epoch": 4966} {"train_loss": -26.636260986328125, "global_step": 412210, "epoch": 4966} {"train_loss": -26.526803970336914, "global_step": 412211, "epoch": 4966} {"train_loss": -26.705554962158203, "global_step": 412212, "epoch": 4966} {"train_loss": -26.575885772705078, "global_step": 412213, "epoch": 4966} {"train_loss": -26.723773956298828, "global_step": 412214, "epoch": 4966} {"train_loss": -26.643054962158203, "global_step": 412215, "epoch": 4966} {"train_loss": -27.064023971557617, "global_step": 412216, "epoch": 4966} {"train_loss": -26.756855010986328, "global_step": 412217, "epoch": 4966} {"train_loss": -26.815235137939453, "global_step": 412218, "epoch": 4966} {"train_loss": -27.14198112487793, "global_step": 412219, "epoch": 4966} {"train_loss": -27.03621482849121, "global_step": 412220, "epoch": 4966} {"train_loss": -26.87458610534668, "global_step": 412221, "epoch": 4966} {"train_loss": -26.73896598815918, "global_step": 412222, "epoch": 4966} {"train_loss": -26.9290828704834, "global_step": 412223, "epoch": 4966} {"train_loss": -26.7722225189209, "global_step": 412224, "epoch": 4966} {"train_loss": -26.90077018737793, "global_step": 412225, "epoch": 4966} {"train_loss": -26.8283748626709, "global_step": 412226, "epoch": 4966} {"train_loss": -26.759363174438477, "global_step": 412227, "epoch": 4966} {"train_loss": -27.188867568969727, "global_step": 412228, "epoch": 4966} {"train_loss": -26.995656967163086, "global_step": 412229, "epoch": 4966} {"train_loss": -26.67249870300293, "global_step": 412230, "epoch": 4966} {"train_loss": -27.061349868774414, "global_step": 412231, "epoch": 4966} {"train_loss": -26.727380752563477, "global_step": 412232, "epoch": 4966} {"train_loss": -26.773040771484375, "global_step": 412233, "epoch": 4966} {"train_loss": -26.454364776611328, "global_step": 412234, "epoch": 4966} {"train_loss": -26.75140380859375, "global_step": 412235, "epoch": 4966} {"train_loss": -26.885290145874023, "global_step": 412236, "epoch": 4966} {"train_loss": -26.681928634643555, "global_step": 412237, "epoch": 4966} {"train_loss": -26.656391143798828, "global_step": 412238, "epoch": 4966} {"train_loss": -26.76576042175293, "global_step": 412239, "epoch": 4966} {"train_loss": -26.52080726623535, "global_step": 412240, "epoch": 4966} {"train_loss": -26.814239501953125, "global_step": 412241, "epoch": 4966} {"train_loss": -26.1005916595459, "global_step": 412242, "epoch": 4966} {"train_loss": -26.576025009155273, "global_step": 412243, "epoch": 4966} {"train_loss": -26.756757736206055, "global_step": 412244, "epoch": 4966} {"train_loss": -26.58966636657715, "global_step": 412245, "epoch": 4966} {"train_loss": -26.73101234436035, "global_step": 412246, "epoch": 4966} {"train_loss": -26.482772827148438, "global_step": 412247, "epoch": 4966} {"train_loss": -26.338993072509766, "global_step": 412248, "epoch": 4966} {"train_loss": -26.644163131713867, "global_step": 412249, "epoch": 4966} {"train_loss": -26.65157127380371, "global_step": 412250, "epoch": 4966} {"train_loss": -26.6546688079834, "global_step": 412251, "epoch": 4966} {"train_loss": -26.495630264282227, "global_step": 412252, "epoch": 4966} {"train_loss": -26.533679962158203, "global_step": 412253, "epoch": 4966} {"train_loss": -26.4039249420166, "global_step": 412254, "epoch": 4966} {"train_loss": -26.660602569580078, "global_step": 412255, "epoch": 4966} {"train_loss": -26.63504409790039, "global_step": 412256, "epoch": 4966} {"train_loss": -26.795263290405273, "global_step": 412257, "epoch": 4966} {"train_loss": -26.745141983032227, "global_step": 412258, "epoch": 4966} {"train_loss": -26.77728271484375, "global_step": 412259, "epoch": 4966} {"train_loss": -26.503742149077265, "global_step": 412260, "epoch": 4966, "val_loss": 6394576.0} {"train_loss": -25.908832550048828, "global_step": 412261, "epoch": 4967} {"train_loss": -26.234149932861328, "global_step": 412262, "epoch": 4967} {"train_loss": -26.189069747924805, "global_step": 412263, "epoch": 4967} {"train_loss": -26.28557777404785, "global_step": 412264, "epoch": 4967} {"train_loss": -26.573230743408203, "global_step": 412265, "epoch": 4967} {"train_loss": -26.299177169799805, "global_step": 412266, "epoch": 4967} {"train_loss": -26.295612335205078, "global_step": 412267, "epoch": 4967} {"train_loss": -26.3931941986084, "global_step": 412268, "epoch": 4967} {"train_loss": -26.831531524658203, "global_step": 412269, "epoch": 4967} {"train_loss": -26.215530395507812, "global_step": 412270, "epoch": 4967} {"train_loss": -26.347259521484375, "global_step": 412271, "epoch": 4967} {"train_loss": -26.23163414001465, "global_step": 412272, "epoch": 4967} {"train_loss": -26.74688720703125, "global_step": 412273, "epoch": 4967} {"train_loss": -26.08265495300293, "global_step": 412274, "epoch": 4967} {"train_loss": -26.683563232421875, "global_step": 412275, "epoch": 4967} {"train_loss": -26.356863021850586, "global_step": 412276, "epoch": 4967} {"train_loss": -26.923486709594727, "global_step": 412277, "epoch": 4967} {"train_loss": -26.8529052734375, "global_step": 412278, "epoch": 4967} {"train_loss": -26.550567626953125, "global_step": 412279, "epoch": 4967} {"train_loss": -26.57075309753418, "global_step": 412280, "epoch": 4967} {"train_loss": -26.355396270751953, "global_step": 412281, "epoch": 4967} {"train_loss": -26.736011505126953, "global_step": 412282, "epoch": 4967} {"train_loss": -26.658777236938477, "global_step": 412283, "epoch": 4967} {"train_loss": -26.394880294799805, "global_step": 412284, "epoch": 4967} {"train_loss": -26.87249183654785, "global_step": 412285, "epoch": 4967} {"train_loss": -26.51148796081543, "global_step": 412286, "epoch": 4967} {"train_loss": -26.696063995361328, "global_step": 412287, "epoch": 4967} {"train_loss": -27.028669357299805, "global_step": 412288, "epoch": 4967} {"train_loss": -26.684900283813477, "global_step": 412289, "epoch": 4967} {"train_loss": -27.047765731811523, "global_step": 412290, "epoch": 4967} {"train_loss": -26.449026107788086, "global_step": 412291, "epoch": 4967} {"train_loss": -26.6999454498291, "global_step": 412292, "epoch": 4967} {"train_loss": -27.04871940612793, "global_step": 412293, "epoch": 4967} {"train_loss": -27.488935470581055, "global_step": 412294, "epoch": 4967} {"train_loss": -26.5130615234375, "global_step": 412295, "epoch": 4967} {"train_loss": -26.668787002563477, "global_step": 412296, "epoch": 4967} {"train_loss": -26.688196182250977, "global_step": 412297, "epoch": 4967} {"train_loss": -26.943838119506836, "global_step": 412298, "epoch": 4967} {"train_loss": -26.829132080078125, "global_step": 412299, "epoch": 4967} {"train_loss": -26.531599044799805, "global_step": 412300, "epoch": 4967} {"train_loss": -26.551969528198242, "global_step": 412301, "epoch": 4967} {"train_loss": -26.817764282226562, "global_step": 412302, "epoch": 4967} {"train_loss": -26.789304733276367, "global_step": 412303, "epoch": 4967} {"train_loss": -26.743244171142578, "global_step": 412304, "epoch": 4967} {"train_loss": -26.794876098632812, "global_step": 412305, "epoch": 4967} {"train_loss": -26.7404842376709, "global_step": 412306, "epoch": 4967} {"train_loss": -26.362722396850586, "global_step": 412307, "epoch": 4967} {"train_loss": -26.764942169189453, "global_step": 412308, "epoch": 4967} {"train_loss": -26.89885902404785, "global_step": 412309, "epoch": 4967} {"train_loss": -26.91745948791504, "global_step": 412310, "epoch": 4967} {"train_loss": -26.71473503112793, "global_step": 412311, "epoch": 4967} {"train_loss": -26.609411239624023, "global_step": 412312, "epoch": 4967} {"train_loss": -26.99582290649414, "global_step": 412313, "epoch": 4967} {"train_loss": -26.44476318359375, "global_step": 412314, "epoch": 4967} {"train_loss": -25.932958602905273, "global_step": 412315, "epoch": 4967} {"train_loss": -26.6409912109375, "global_step": 412316, "epoch": 4967} {"train_loss": -26.21332359313965, "global_step": 412317, "epoch": 4967} {"train_loss": -26.49395751953125, "global_step": 412318, "epoch": 4967} {"train_loss": -26.9385986328125, "global_step": 412319, "epoch": 4967} {"train_loss": -26.481678009033203, "global_step": 412320, "epoch": 4967} {"train_loss": -26.68787956237793, "global_step": 412321, "epoch": 4967} {"train_loss": -26.408935546875, "global_step": 412322, "epoch": 4967} {"train_loss": -26.773298263549805, "global_step": 412323, "epoch": 4967} {"train_loss": -26.815778732299805, "global_step": 412324, "epoch": 4967} {"train_loss": -26.739225387573242, "global_step": 412325, "epoch": 4967} {"train_loss": -27.079132080078125, "global_step": 412326, "epoch": 4967} {"train_loss": -26.510852813720703, "global_step": 412327, "epoch": 4967} {"train_loss": -26.8671875, "global_step": 412328, "epoch": 4967} {"train_loss": -26.48292350769043, "global_step": 412329, "epoch": 4967} {"train_loss": -27.0252685546875, "global_step": 412330, "epoch": 4967} {"train_loss": -26.427860260009766, "global_step": 412331, "epoch": 4967} {"train_loss": -26.916112899780273, "global_step": 412332, "epoch": 4967} {"train_loss": -26.95204734802246, "global_step": 412333, "epoch": 4967} {"train_loss": -26.87261390686035, "global_step": 412334, "epoch": 4967} {"train_loss": -26.63502311706543, "global_step": 412335, "epoch": 4967} {"train_loss": -26.74542236328125, "global_step": 412336, "epoch": 4967} {"train_loss": -26.688684463500977, "global_step": 412337, "epoch": 4967} {"train_loss": -26.6772518157959, "global_step": 412338, "epoch": 4967} {"train_loss": -26.8548583984375, "global_step": 412339, "epoch": 4967} {"train_loss": -26.919015884399414, "global_step": 412340, "epoch": 4967} {"train_loss": -26.865100860595703, "global_step": 412341, "epoch": 4967} {"train_loss": -26.4544734954834, "global_step": 412342, "epoch": 4967} {"train_loss": -26.640138970800194, "global_step": 412343, "epoch": 4967, "val_loss": 6582832.0} {"train_loss": -25.58851432800293, "global_step": 412344, "epoch": 4968} {"train_loss": -25.955493927001953, "global_step": 412345, "epoch": 4968} {"train_loss": -26.2700138092041, "global_step": 412346, "epoch": 4968} {"train_loss": -26.482391357421875, "global_step": 412347, "epoch": 4968} {"train_loss": -26.201520919799805, "global_step": 412348, "epoch": 4968} {"train_loss": -26.059051513671875, "global_step": 412349, "epoch": 4968} {"train_loss": -26.163110733032227, "global_step": 412350, "epoch": 4968} {"train_loss": -25.866458892822266, "global_step": 412351, "epoch": 4968} {"train_loss": -26.474660873413086, "global_step": 412352, "epoch": 4968} {"train_loss": -25.985116958618164, "global_step": 412353, "epoch": 4968} {"train_loss": -26.71759033203125, "global_step": 412354, "epoch": 4968} {"train_loss": -26.0238094329834, "global_step": 412355, "epoch": 4968} {"train_loss": -26.422134399414062, "global_step": 412356, "epoch": 4968} {"train_loss": -26.468414306640625, "global_step": 412357, "epoch": 4968} {"train_loss": -26.179107666015625, "global_step": 412358, "epoch": 4968} {"train_loss": -26.13168716430664, "global_step": 412359, "epoch": 4968} {"train_loss": -26.46961784362793, "global_step": 412360, "epoch": 4968} {"train_loss": -26.382282257080078, "global_step": 412361, "epoch": 4968} {"train_loss": -26.673215866088867, "global_step": 412362, "epoch": 4968} {"train_loss": -26.71463394165039, "global_step": 412363, "epoch": 4968} {"train_loss": -27.062946319580078, "global_step": 412364, "epoch": 4968} {"train_loss": -26.544477462768555, "global_step": 412365, "epoch": 4968} {"train_loss": -26.8765869140625, "global_step": 412366, "epoch": 4968} {"train_loss": -26.838226318359375, "global_step": 412367, "epoch": 4968} {"train_loss": -26.762128829956055, "global_step": 412368, "epoch": 4968} {"train_loss": -26.558019638061523, "global_step": 412369, "epoch": 4968} {"train_loss": -26.323816299438477, "global_step": 412370, "epoch": 4968} {"train_loss": -26.765714645385742, "global_step": 412371, "epoch": 4968} {"train_loss": -26.6939697265625, "global_step": 412372, "epoch": 4968} {"train_loss": -26.878173828125, "global_step": 412373, "epoch": 4968} {"train_loss": -26.804914474487305, "global_step": 412374, "epoch": 4968} {"train_loss": -26.520965576171875, "global_step": 412375, "epoch": 4968} {"train_loss": -26.788389205932617, "global_step": 412376, "epoch": 4968} {"train_loss": -26.375524520874023, "global_step": 412377, "epoch": 4968} {"train_loss": -26.594619750976562, "global_step": 412378, "epoch": 4968} {"train_loss": -26.832300186157227, "global_step": 412379, "epoch": 4968} {"train_loss": -26.79017448425293, "global_step": 412380, "epoch": 4968} {"train_loss": -26.528793334960938, "global_step": 412381, "epoch": 4968} {"train_loss": -26.429365158081055, "global_step": 412382, "epoch": 4968} {"train_loss": -26.52412223815918, "global_step": 412383, "epoch": 4968} {"train_loss": -26.899267196655273, "global_step": 412384, "epoch": 4968} {"train_loss": -26.744298934936523, "global_step": 412385, "epoch": 4968} {"train_loss": -26.38871192932129, "global_step": 412386, "epoch": 4968} {"train_loss": -26.457294464111328, "global_step": 412387, "epoch": 4968} {"train_loss": -26.569747924804688, "global_step": 412388, "epoch": 4968} {"train_loss": -26.584491729736328, "global_step": 412389, "epoch": 4968} {"train_loss": -26.24256706237793, "global_step": 412390, "epoch": 4968} {"train_loss": -26.5787353515625, "global_step": 412391, "epoch": 4968} {"train_loss": -26.442285537719727, "global_step": 412392, "epoch": 4968} {"train_loss": -26.731781005859375, "global_step": 412393, "epoch": 4968} {"train_loss": -26.245946884155273, "global_step": 412394, "epoch": 4968} {"train_loss": -26.496313095092773, "global_step": 412395, "epoch": 4968} {"train_loss": -26.724695205688477, "global_step": 412396, "epoch": 4968} {"train_loss": -26.488332748413086, "global_step": 412397, "epoch": 4968} {"train_loss": -26.503650665283203, "global_step": 412398, "epoch": 4968} {"train_loss": -26.763671875, "global_step": 412399, "epoch": 4968} {"train_loss": -26.742904663085938, "global_step": 412400, "epoch": 4968} {"train_loss": -26.727741241455078, "global_step": 412401, "epoch": 4968} {"train_loss": -26.867277145385742, "global_step": 412402, "epoch": 4968} {"train_loss": -26.736068725585938, "global_step": 412403, "epoch": 4968} {"train_loss": -26.939655303955078, "global_step": 412404, "epoch": 4968} {"train_loss": -26.8906307220459, "global_step": 412405, "epoch": 4968} {"train_loss": -26.655920028686523, "global_step": 412406, "epoch": 4968} {"train_loss": -26.620267868041992, "global_step": 412407, "epoch": 4968} {"train_loss": -26.86905288696289, "global_step": 412408, "epoch": 4968} {"train_loss": -26.70893669128418, "global_step": 412409, "epoch": 4968} {"train_loss": -26.666290283203125, "global_step": 412410, "epoch": 4968} {"train_loss": -26.867765426635742, "global_step": 412411, "epoch": 4968} {"train_loss": -26.96933937072754, "global_step": 412412, "epoch": 4968} {"train_loss": -26.6923828125, "global_step": 412413, "epoch": 4968} {"train_loss": -26.384490966796875, "global_step": 412414, "epoch": 4968} {"train_loss": -26.935110092163086, "global_step": 412415, "epoch": 4968} {"train_loss": -26.880407333374023, "global_step": 412416, "epoch": 4968} {"train_loss": -26.618696212768555, "global_step": 412417, "epoch": 4968} {"train_loss": -26.837921142578125, "global_step": 412418, "epoch": 4968} {"train_loss": -26.763608932495117, "global_step": 412419, "epoch": 4968} {"train_loss": -26.696386337280273, "global_step": 412420, "epoch": 4968} {"train_loss": -26.8643798828125, "global_step": 412421, "epoch": 4968} {"train_loss": -27.292194366455078, "global_step": 412422, "epoch": 4968} {"train_loss": -26.839868545532227, "global_step": 412423, "epoch": 4968} {"train_loss": -27.024921417236328, "global_step": 412424, "epoch": 4968} {"train_loss": -26.766876220703125, "global_step": 412425, "epoch": 4968} {"train_loss": -26.585134506225586, "global_step": 412426, "epoch": 4968, "val_loss": 6531361.0} {"train_loss": -25.00417137145996, "global_step": 412427, "epoch": 4969} {"train_loss": -24.115392684936523, "global_step": 412428, "epoch": 4969} {"train_loss": -26.08949089050293, "global_step": 412429, "epoch": 4969} {"train_loss": -25.821929931640625, "global_step": 412430, "epoch": 4969} {"train_loss": -25.63166618347168, "global_step": 412431, "epoch": 4969} {"train_loss": -25.696979522705078, "global_step": 412432, "epoch": 4969} {"train_loss": -25.672483444213867, "global_step": 412433, "epoch": 4969} {"train_loss": -26.032617568969727, "global_step": 412434, "epoch": 4969} {"train_loss": -26.12113380432129, "global_step": 412435, "epoch": 4969} {"train_loss": -25.854904174804688, "global_step": 412436, "epoch": 4969} {"train_loss": -26.196561813354492, "global_step": 412437, "epoch": 4969} {"train_loss": -25.936498641967773, "global_step": 412438, "epoch": 4969} {"train_loss": -26.084796905517578, "global_step": 412439, "epoch": 4969} {"train_loss": -25.974218368530273, "global_step": 412440, "epoch": 4969} {"train_loss": -26.389554977416992, "global_step": 412441, "epoch": 4969} {"train_loss": -25.785612106323242, "global_step": 412442, "epoch": 4969} {"train_loss": -26.307199478149414, "global_step": 412443, "epoch": 4969} {"train_loss": -26.02418327331543, "global_step": 412444, "epoch": 4969} {"train_loss": -26.137861251831055, "global_step": 412445, "epoch": 4969} {"train_loss": -26.36297607421875, "global_step": 412446, "epoch": 4969} {"train_loss": -26.540607452392578, "global_step": 412447, "epoch": 4969} {"train_loss": -25.858774185180664, "global_step": 412448, "epoch": 4969} {"train_loss": -26.558130264282227, "global_step": 412449, "epoch": 4969} {"train_loss": -26.383642196655273, "global_step": 412450, "epoch": 4969} {"train_loss": -26.56375503540039, "global_step": 412451, "epoch": 4969} {"train_loss": -26.49124526977539, "global_step": 412452, "epoch": 4969} {"train_loss": -26.62701988220215, "global_step": 412453, "epoch": 4969} {"train_loss": -26.862722396850586, "global_step": 412454, "epoch": 4969} {"train_loss": -26.835290908813477, "global_step": 412455, "epoch": 4969} {"train_loss": -26.651147842407227, "global_step": 412456, "epoch": 4969} {"train_loss": -26.512853622436523, "global_step": 412457, "epoch": 4969} {"train_loss": -26.828744888305664, "global_step": 412458, "epoch": 4969} {"train_loss": -26.987634658813477, "global_step": 412459, "epoch": 4969} {"train_loss": -26.782888412475586, "global_step": 412460, "epoch": 4969} {"train_loss": -26.73725700378418, "global_step": 412461, "epoch": 4969} {"train_loss": -26.88605308532715, "global_step": 412462, "epoch": 4969} {"train_loss": -26.836139678955078, "global_step": 412463, "epoch": 4969} {"train_loss": -26.50571632385254, "global_step": 412464, "epoch": 4969} {"train_loss": -26.886932373046875, "global_step": 412465, "epoch": 4969} {"train_loss": -26.989511489868164, "global_step": 412466, "epoch": 4969} {"train_loss": -26.934614181518555, "global_step": 412467, "epoch": 4969} {"train_loss": -26.9830322265625, "global_step": 412468, "epoch": 4969} {"train_loss": -26.918798446655273, "global_step": 412469, "epoch": 4969} {"train_loss": -27.135303497314453, "global_step": 412470, "epoch": 4969} {"train_loss": -26.933460235595703, "global_step": 412471, "epoch": 4969} {"train_loss": -27.093236923217773, "global_step": 412472, "epoch": 4969} {"train_loss": -27.258014678955078, "global_step": 412473, "epoch": 4969} {"train_loss": -26.923288345336914, "global_step": 412474, "epoch": 4969} {"train_loss": -26.58538246154785, "global_step": 412475, "epoch": 4969} {"train_loss": -26.827856063842773, "global_step": 412476, "epoch": 4969} {"train_loss": -26.995466232299805, "global_step": 412477, "epoch": 4969} {"train_loss": -26.9060001373291, "global_step": 412478, "epoch": 4969} {"train_loss": -26.744705200195312, "global_step": 412479, "epoch": 4969} {"train_loss": -27.114383697509766, "global_step": 412480, "epoch": 4969} {"train_loss": -26.694549560546875, "global_step": 412481, "epoch": 4969} {"train_loss": -26.874998092651367, "global_step": 412482, "epoch": 4969} {"train_loss": -27.010181427001953, "global_step": 412483, "epoch": 4969} {"train_loss": -26.678647994995117, "global_step": 412484, "epoch": 4969} {"train_loss": -27.107526779174805, "global_step": 412485, "epoch": 4969} {"train_loss": -27.0889949798584, "global_step": 412486, "epoch": 4969} {"train_loss": -26.8288516998291, "global_step": 412487, "epoch": 4969} {"train_loss": -26.6592960357666, "global_step": 412488, "epoch": 4969} {"train_loss": -26.541461944580078, "global_step": 412489, "epoch": 4969} {"train_loss": -26.5081729888916, "global_step": 412490, "epoch": 4969} {"train_loss": -26.199514389038086, "global_step": 412491, "epoch": 4969} {"train_loss": -26.46518898010254, "global_step": 412492, "epoch": 4969} {"train_loss": -26.532196044921875, "global_step": 412493, "epoch": 4969} {"train_loss": -26.59139060974121, "global_step": 412494, "epoch": 4969} {"train_loss": -26.6867618560791, "global_step": 412495, "epoch": 4969} {"train_loss": -27.200231552124023, "global_step": 412496, "epoch": 4969} {"train_loss": -26.814294815063477, "global_step": 412497, "epoch": 4969} {"train_loss": -26.582059860229492, "global_step": 412498, "epoch": 4969} {"train_loss": -27.145740509033203, "global_step": 412499, "epoch": 4969} {"train_loss": -26.66851234436035, "global_step": 412500, "epoch": 4969} {"train_loss": -26.746612548828125, "global_step": 412501, "epoch": 4969} {"train_loss": -26.019733428955078, "global_step": 412502, "epoch": 4969} {"train_loss": -26.745664596557617, "global_step": 412503, "epoch": 4969} {"train_loss": -26.476728439331055, "global_step": 412504, "epoch": 4969} {"train_loss": -26.846576690673828, "global_step": 412505, "epoch": 4969} {"train_loss": -26.8068904876709, "global_step": 412506, "epoch": 4969} {"train_loss": -26.771991729736328, "global_step": 412507, "epoch": 4969} {"train_loss": -26.902912139892578, "global_step": 412508, "epoch": 4969} {"train_loss": -26.534731508737586, "global_step": 412509, "epoch": 4969, "val_loss": 6525684.0} {"train_loss": -25.60747718811035, "global_step": 412510, "epoch": 4970} {"train_loss": -25.94502067565918, "global_step": 412511, "epoch": 4970} {"train_loss": -25.811676025390625, "global_step": 412512, "epoch": 4970} {"train_loss": -25.495731353759766, "global_step": 412513, "epoch": 4970} {"train_loss": -25.364116668701172, "global_step": 412514, "epoch": 4970} {"train_loss": -26.186986923217773, "global_step": 412515, "epoch": 4970} {"train_loss": -25.7528076171875, "global_step": 412516, "epoch": 4970} {"train_loss": -26.4176025390625, "global_step": 412517, "epoch": 4970} {"train_loss": -26.064329147338867, "global_step": 412518, "epoch": 4970} {"train_loss": -26.05844497680664, "global_step": 412519, "epoch": 4970} {"train_loss": -26.3905086517334, "global_step": 412520, "epoch": 4970} {"train_loss": -25.887042999267578, "global_step": 412521, "epoch": 4970} {"train_loss": -26.514789581298828, "global_step": 412522, "epoch": 4970} {"train_loss": -26.2912654876709, "global_step": 412523, "epoch": 4970} {"train_loss": -26.26263999938965, "global_step": 412524, "epoch": 4970} {"train_loss": -26.409921646118164, "global_step": 412525, "epoch": 4970} {"train_loss": -25.905120849609375, "global_step": 412526, "epoch": 4970} {"train_loss": -26.337879180908203, "global_step": 412527, "epoch": 4970} {"train_loss": -25.91645622253418, "global_step": 412528, "epoch": 4970} {"train_loss": -26.401830673217773, "global_step": 412529, "epoch": 4970} {"train_loss": -26.624967575073242, "global_step": 412530, "epoch": 4970} {"train_loss": -26.361703872680664, "global_step": 412531, "epoch": 4970} {"train_loss": -26.2968807220459, "global_step": 412532, "epoch": 4970} {"train_loss": -26.415754318237305, "global_step": 412533, "epoch": 4970} {"train_loss": -26.678131103515625, "global_step": 412534, "epoch": 4970} {"train_loss": -26.644811630249023, "global_step": 412535, "epoch": 4970} {"train_loss": -26.824970245361328, "global_step": 412536, "epoch": 4970} {"train_loss": -26.6668758392334, "global_step": 412537, "epoch": 4970} {"train_loss": -26.138235092163086, "global_step": 412538, "epoch": 4970} {"train_loss": -26.460163116455078, "global_step": 412539, "epoch": 4970} {"train_loss": -26.70187759399414, "global_step": 412540, "epoch": 4970} {"train_loss": -26.937957763671875, "global_step": 412541, "epoch": 4970} {"train_loss": -27.018590927124023, "global_step": 412542, "epoch": 4970} {"train_loss": -26.880163192749023, "global_step": 412543, "epoch": 4970} {"train_loss": -26.748966217041016, "global_step": 412544, "epoch": 4970} {"train_loss": -26.896259307861328, "global_step": 412545, "epoch": 4970} {"train_loss": -26.587018966674805, "global_step": 412546, "epoch": 4970} {"train_loss": -26.820714950561523, "global_step": 412547, "epoch": 4970} {"train_loss": -26.992414474487305, "global_step": 412548, "epoch": 4970} {"train_loss": -26.858753204345703, "global_step": 412549, "epoch": 4970} {"train_loss": -26.947967529296875, "global_step": 412550, "epoch": 4970} {"train_loss": -26.622817993164062, "global_step": 412551, "epoch": 4970} {"train_loss": -26.80354118347168, "global_step": 412552, "epoch": 4970} {"train_loss": -26.530866622924805, "global_step": 412553, "epoch": 4970} {"train_loss": -26.84309196472168, "global_step": 412554, "epoch": 4970} {"train_loss": -26.67392349243164, "global_step": 412555, "epoch": 4970} {"train_loss": -26.66523551940918, "global_step": 412556, "epoch": 4970} {"train_loss": -26.201154708862305, "global_step": 412557, "epoch": 4970} {"train_loss": -26.82582664489746, "global_step": 412558, "epoch": 4970} {"train_loss": -26.766372680664062, "global_step": 412559, "epoch": 4970} {"train_loss": -26.842151641845703, "global_step": 412560, "epoch": 4970} {"train_loss": -26.297826766967773, "global_step": 412561, "epoch": 4970} {"train_loss": -26.251605987548828, "global_step": 412562, "epoch": 4970} {"train_loss": -26.45263671875, "global_step": 412563, "epoch": 4970} {"train_loss": -26.930561065673828, "global_step": 412564, "epoch": 4970} {"train_loss": -26.626203536987305, "global_step": 412565, "epoch": 4970} {"train_loss": -26.708118438720703, "global_step": 412566, "epoch": 4970} {"train_loss": -26.867429733276367, "global_step": 412567, "epoch": 4970} {"train_loss": -27.15911865234375, "global_step": 412568, "epoch": 4970} {"train_loss": -26.611474990844727, "global_step": 412569, "epoch": 4970} {"train_loss": -27.110071182250977, "global_step": 412570, "epoch": 4970} {"train_loss": -26.987125396728516, "global_step": 412571, "epoch": 4970} {"train_loss": -26.987043380737305, "global_step": 412572, "epoch": 4970} {"train_loss": -26.7834415435791, "global_step": 412573, "epoch": 4970} {"train_loss": -26.68538475036621, "global_step": 412574, "epoch": 4970} {"train_loss": -26.86733055114746, "global_step": 412575, "epoch": 4970} {"train_loss": -26.81060791015625, "global_step": 412576, "epoch": 4970} {"train_loss": -26.73406410217285, "global_step": 412577, "epoch": 4970} {"train_loss": -26.99515724182129, "global_step": 412578, "epoch": 4970} {"train_loss": -27.154376983642578, "global_step": 412579, "epoch": 4970} {"train_loss": -26.952777862548828, "global_step": 412580, "epoch": 4970} {"train_loss": -26.92022705078125, "global_step": 412581, "epoch": 4970} {"train_loss": -26.940078735351562, "global_step": 412582, "epoch": 4970} {"train_loss": -26.92374038696289, "global_step": 412583, "epoch": 4970} {"train_loss": -26.929990768432617, "global_step": 412584, "epoch": 4970} {"train_loss": -26.866907119750977, "global_step": 412585, "epoch": 4970} {"train_loss": -26.676040649414062, "global_step": 412586, "epoch": 4970} {"train_loss": -27.126972198486328, "global_step": 412587, "epoch": 4970} {"train_loss": -26.798908233642578, "global_step": 412588, "epoch": 4970} {"train_loss": -26.718053817749023, "global_step": 412589, "epoch": 4970} {"train_loss": -26.787282943725586, "global_step": 412590, "epoch": 4970} {"train_loss": -26.90297508239746, "global_step": 412591, "epoch": 4970} {"train_loss": -26.601910786456372, "global_step": 412592, "epoch": 4970, "val_loss": 6776922.0} {"train_loss": -23.91429901123047, "global_step": 412593, "epoch": 4971} {"train_loss": -25.00118637084961, "global_step": 412594, "epoch": 4971} {"train_loss": -24.985490798950195, "global_step": 412595, "epoch": 4971} {"train_loss": -24.91670036315918, "global_step": 412596, "epoch": 4971} {"train_loss": -25.111974716186523, "global_step": 412597, "epoch": 4971} {"train_loss": -26.15091896057129, "global_step": 412598, "epoch": 4971} {"train_loss": -25.04663848876953, "global_step": 412599, "epoch": 4971} {"train_loss": -25.4001522064209, "global_step": 412600, "epoch": 4971} {"train_loss": -25.24225425720215, "global_step": 412601, "epoch": 4971} {"train_loss": -25.503568649291992, "global_step": 412602, "epoch": 4971} {"train_loss": -25.78705406188965, "global_step": 412603, "epoch": 4971} {"train_loss": -25.429452896118164, "global_step": 412604, "epoch": 4971} {"train_loss": -26.19606590270996, "global_step": 412605, "epoch": 4971} {"train_loss": -25.755752563476562, "global_step": 412606, "epoch": 4971} {"train_loss": -25.782678604125977, "global_step": 412607, "epoch": 4971} {"train_loss": -25.76736831665039, "global_step": 412608, "epoch": 4971} {"train_loss": -25.88995933532715, "global_step": 412609, "epoch": 4971} {"train_loss": -25.8294734954834, "global_step": 412610, "epoch": 4971} {"train_loss": -25.839075088500977, "global_step": 412611, "epoch": 4971} {"train_loss": -25.81538963317871, "global_step": 412612, "epoch": 4971} {"train_loss": -26.29563331604004, "global_step": 412613, "epoch": 4971} {"train_loss": -26.434783935546875, "global_step": 412614, "epoch": 4971} {"train_loss": -26.045730590820312, "global_step": 412615, "epoch": 4971} {"train_loss": -26.151220321655273, "global_step": 412616, "epoch": 4971} {"train_loss": -26.17339515686035, "global_step": 412617, "epoch": 4971} {"train_loss": -26.412235260009766, "global_step": 412618, "epoch": 4971} {"train_loss": -26.323841094970703, "global_step": 412619, "epoch": 4971} {"train_loss": -26.416522979736328, "global_step": 412620, "epoch": 4971} {"train_loss": -26.304590225219727, "global_step": 412621, "epoch": 4971} {"train_loss": -26.71425437927246, "global_step": 412622, "epoch": 4971} {"train_loss": -26.469297409057617, "global_step": 412623, "epoch": 4971} {"train_loss": -26.539020538330078, "global_step": 412624, "epoch": 4971} {"train_loss": -26.514890670776367, "global_step": 412625, "epoch": 4971} {"train_loss": -26.446481704711914, "global_step": 412626, "epoch": 4971} {"train_loss": -26.650602340698242, "global_step": 412627, "epoch": 4971} {"train_loss": -26.47832679748535, "global_step": 412628, "epoch": 4971} {"train_loss": -26.55376625061035, "global_step": 412629, "epoch": 4971} {"train_loss": -26.76401710510254, "global_step": 412630, "epoch": 4971} {"train_loss": -26.468420028686523, "global_step": 412631, "epoch": 4971} {"train_loss": -26.39922523498535, "global_step": 412632, "epoch": 4971} {"train_loss": -26.596282958984375, "global_step": 412633, "epoch": 4971} {"train_loss": -26.88583755493164, "global_step": 412634, "epoch": 4971} {"train_loss": -26.693897247314453, "global_step": 412635, "epoch": 4971} {"train_loss": -26.503662109375, "global_step": 412636, "epoch": 4971} {"train_loss": -26.69548988342285, "global_step": 412637, "epoch": 4971} {"train_loss": -26.475208282470703, "global_step": 412638, "epoch": 4971} {"train_loss": -26.64265251159668, "global_step": 412639, "epoch": 4971} {"train_loss": -26.663068771362305, "global_step": 412640, "epoch": 4971} {"train_loss": -26.618566513061523, "global_step": 412641, "epoch": 4971} {"train_loss": -26.435102462768555, "global_step": 412642, "epoch": 4971} {"train_loss": -27.127328872680664, "global_step": 412643, "epoch": 4971} {"train_loss": -26.66178321838379, "global_step": 412644, "epoch": 4971} {"train_loss": -26.793548583984375, "global_step": 412645, "epoch": 4971} {"train_loss": -26.689990997314453, "global_step": 412646, "epoch": 4971} {"train_loss": -26.83699607849121, "global_step": 412647, "epoch": 4971} {"train_loss": -26.58101463317871, "global_step": 412648, "epoch": 4971} {"train_loss": -26.63748550415039, "global_step": 412649, "epoch": 4971} {"train_loss": -26.645360946655273, "global_step": 412650, "epoch": 4971} {"train_loss": -26.641067504882812, "global_step": 412651, "epoch": 4971} {"train_loss": -26.894254684448242, "global_step": 412652, "epoch": 4971} {"train_loss": -26.456653594970703, "global_step": 412653, "epoch": 4971} {"train_loss": -26.7541561126709, "global_step": 412654, "epoch": 4971} {"train_loss": -27.14503288269043, "global_step": 412655, "epoch": 4971} {"train_loss": -27.014867782592773, "global_step": 412656, "epoch": 4971} {"train_loss": -27.0374755859375, "global_step": 412657, "epoch": 4971} {"train_loss": -26.957141876220703, "global_step": 412658, "epoch": 4971} {"train_loss": -26.690656661987305, "global_step": 412659, "epoch": 4971} {"train_loss": -26.89918327331543, "global_step": 412660, "epoch": 4971} {"train_loss": -27.38083267211914, "global_step": 412661, "epoch": 4971} {"train_loss": -26.84290885925293, "global_step": 412662, "epoch": 4971} {"train_loss": -26.91214942932129, "global_step": 412663, "epoch": 4971} {"train_loss": -26.467748641967773, "global_step": 412664, "epoch": 4971} {"train_loss": -26.52571678161621, "global_step": 412665, "epoch": 4971} {"train_loss": -27.07327651977539, "global_step": 412666, "epoch": 4971} {"train_loss": -26.8255615234375, "global_step": 412667, "epoch": 4971} {"train_loss": -26.353900909423828, "global_step": 412668, "epoch": 4971} {"train_loss": -26.591032028198242, "global_step": 412669, "epoch": 4971} {"train_loss": -26.814380645751953, "global_step": 412670, "epoch": 4971} {"train_loss": -26.969141006469727, "global_step": 412671, "epoch": 4971} {"train_loss": -26.877424240112305, "global_step": 412672, "epoch": 4971} {"train_loss": -26.68678092956543, "global_step": 412673, "epoch": 4971} {"train_loss": -26.86199951171875, "global_step": 412674, "epoch": 4971} {"train_loss": -26.370337061135167, "global_step": 412675, "epoch": 4971, "val_loss": 6499080.0} {"train_loss": -26.337488174438477, "global_step": 412676, "epoch": 4972} {"train_loss": -26.596521377563477, "global_step": 412677, "epoch": 4972} {"train_loss": -26.780975341796875, "global_step": 412678, "epoch": 4972} {"train_loss": -26.099445343017578, "global_step": 412679, "epoch": 4972} {"train_loss": -26.43282127380371, "global_step": 412680, "epoch": 4972} {"train_loss": -26.52752685546875, "global_step": 412681, "epoch": 4972} {"train_loss": -26.431699752807617, "global_step": 412682, "epoch": 4972} {"train_loss": -26.774738311767578, "global_step": 412683, "epoch": 4972} {"train_loss": -26.595584869384766, "global_step": 412684, "epoch": 4972} {"train_loss": -26.28150749206543, "global_step": 412685, "epoch": 4972} {"train_loss": -25.568899154663086, "global_step": 412686, "epoch": 4972} {"train_loss": -25.563047409057617, "global_step": 412687, "epoch": 4972} {"train_loss": -25.99567985534668, "global_step": 412688, "epoch": 4972} {"train_loss": -26.59050941467285, "global_step": 412689, "epoch": 4972} {"train_loss": -26.294300079345703, "global_step": 412690, "epoch": 4972} {"train_loss": -26.46881103515625, "global_step": 412691, "epoch": 4972} {"train_loss": -26.49041748046875, "global_step": 412692, "epoch": 4972} {"train_loss": -26.477436065673828, "global_step": 412693, "epoch": 4972} {"train_loss": -26.4401912689209, "global_step": 412694, "epoch": 4972} {"train_loss": -26.694440841674805, "global_step": 412695, "epoch": 4972} {"train_loss": -26.104780197143555, "global_step": 412696, "epoch": 4972} {"train_loss": -26.539031982421875, "global_step": 412697, "epoch": 4972} {"train_loss": -26.28272819519043, "global_step": 412698, "epoch": 4972} {"train_loss": -26.249303817749023, "global_step": 412699, "epoch": 4972} {"train_loss": -26.360639572143555, "global_step": 412700, "epoch": 4972} {"train_loss": -26.479337692260742, "global_step": 412701, "epoch": 4972} {"train_loss": -26.644702911376953, "global_step": 412702, "epoch": 4972} {"train_loss": -26.706790924072266, "global_step": 412703, "epoch": 4972} {"train_loss": -26.344396591186523, "global_step": 412704, "epoch": 4972} {"train_loss": -26.64113426208496, "global_step": 412705, "epoch": 4972} {"train_loss": -26.996625900268555, "global_step": 412706, "epoch": 4972} {"train_loss": -26.5185604095459, "global_step": 412707, "epoch": 4972} {"train_loss": -26.555395126342773, "global_step": 412708, "epoch": 4972} {"train_loss": -26.894285202026367, "global_step": 412709, "epoch": 4972} {"train_loss": -26.75160789489746, "global_step": 412710, "epoch": 4972} {"train_loss": -26.69319725036621, "global_step": 412711, "epoch": 4972} {"train_loss": -26.668848037719727, "global_step": 412712, "epoch": 4972} {"train_loss": -26.79310417175293, "global_step": 412713, "epoch": 4972} {"train_loss": -26.718341827392578, "global_step": 412714, "epoch": 4972} {"train_loss": -26.645984649658203, "global_step": 412715, "epoch": 4972} {"train_loss": -26.295913696289062, "global_step": 412716, "epoch": 4972} {"train_loss": -26.849353790283203, "global_step": 412717, "epoch": 4972} {"train_loss": -26.699304580688477, "global_step": 412718, "epoch": 4972} {"train_loss": -26.86299705505371, "global_step": 412719, "epoch": 4972} {"train_loss": -26.46302604675293, "global_step": 412720, "epoch": 4972} {"train_loss": -26.85153579711914, "global_step": 412721, "epoch": 4972} {"train_loss": -27.089147567749023, "global_step": 412722, "epoch": 4972} {"train_loss": -26.66770362854004, "global_step": 412723, "epoch": 4972} {"train_loss": -26.8383846282959, "global_step": 412724, "epoch": 4972} {"train_loss": -26.614166259765625, "global_step": 412725, "epoch": 4972} {"train_loss": -26.521533966064453, "global_step": 412726, "epoch": 4972} {"train_loss": -26.904327392578125, "global_step": 412727, "epoch": 4972} {"train_loss": -26.979572296142578, "global_step": 412728, "epoch": 4972} {"train_loss": -26.958616256713867, "global_step": 412729, "epoch": 4972} {"train_loss": -27.112319946289062, "global_step": 412730, "epoch": 4972} {"train_loss": -26.455890655517578, "global_step": 412731, "epoch": 4972} {"train_loss": -26.584951400756836, "global_step": 412732, "epoch": 4972} {"train_loss": -26.635934829711914, "global_step": 412733, "epoch": 4972} {"train_loss": -26.786291122436523, "global_step": 412734, "epoch": 4972} {"train_loss": -26.879281997680664, "global_step": 412735, "epoch": 4972} {"train_loss": -26.646326065063477, "global_step": 412736, "epoch": 4972} {"train_loss": -26.748876571655273, "global_step": 412737, "epoch": 4972} {"train_loss": -26.449583053588867, "global_step": 412738, "epoch": 4972} {"train_loss": -26.766210556030273, "global_step": 412739, "epoch": 4972} {"train_loss": -26.814306259155273, "global_step": 412740, "epoch": 4972} {"train_loss": -26.692829132080078, "global_step": 412741, "epoch": 4972} {"train_loss": -27.046945571899414, "global_step": 412742, "epoch": 4972} {"train_loss": -26.93781089782715, "global_step": 412743, "epoch": 4972} {"train_loss": -26.966535568237305, "global_step": 412744, "epoch": 4972} {"train_loss": -26.78533935546875, "global_step": 412745, "epoch": 4972} {"train_loss": -26.772382736206055, "global_step": 412746, "epoch": 4972} {"train_loss": -26.4028377532959, "global_step": 412747, "epoch": 4972} {"train_loss": -27.098371505737305, "global_step": 412748, "epoch": 4972} {"train_loss": -26.98309326171875, "global_step": 412749, "epoch": 4972} {"train_loss": -26.943490982055664, "global_step": 412750, "epoch": 4972} {"train_loss": -26.747486114501953, "global_step": 412751, "epoch": 4972} {"train_loss": -26.86988639831543, "global_step": 412752, "epoch": 4972} {"train_loss": -26.981704711914062, "global_step": 412753, "epoch": 4972} {"train_loss": -26.855188369750977, "global_step": 412754, "epoch": 4972} {"train_loss": -26.959936141967773, "global_step": 412755, "epoch": 4972} {"train_loss": -26.05609703063965, "global_step": 412756, "epoch": 4972} {"train_loss": -26.303119659423828, "global_step": 412757, "epoch": 4972} {"train_loss": -26.631318793239362, "global_step": 412758, "epoch": 4972, "val_loss": 6554870.5} {"train_loss": -25.494510650634766, "global_step": 412759, "epoch": 4973} {"train_loss": -25.36374855041504, "global_step": 412760, "epoch": 4973} {"train_loss": -26.00980567932129, "global_step": 412761, "epoch": 4973} {"train_loss": -25.192636489868164, "global_step": 412762, "epoch": 4973} {"train_loss": -25.94610023498535, "global_step": 412763, "epoch": 4973} {"train_loss": -25.588207244873047, "global_step": 412764, "epoch": 4973} {"train_loss": -25.34327507019043, "global_step": 412765, "epoch": 4973} {"train_loss": -25.71536636352539, "global_step": 412766, "epoch": 4973} {"train_loss": -26.134939193725586, "global_step": 412767, "epoch": 4973} {"train_loss": -25.547758102416992, "global_step": 412768, "epoch": 4973} {"train_loss": -25.585805892944336, "global_step": 412769, "epoch": 4973} {"train_loss": -26.335058212280273, "global_step": 412770, "epoch": 4973} {"train_loss": -25.836057662963867, "global_step": 412771, "epoch": 4973} {"train_loss": -26.00874137878418, "global_step": 412772, "epoch": 4973} {"train_loss": -25.951948165893555, "global_step": 412773, "epoch": 4973} {"train_loss": -25.994491577148438, "global_step": 412774, "epoch": 4973} {"train_loss": -25.849699020385742, "global_step": 412775, "epoch": 4973} {"train_loss": -26.08790397644043, "global_step": 412776, "epoch": 4973} {"train_loss": -26.006521224975586, "global_step": 412777, "epoch": 4973} {"train_loss": -25.896392822265625, "global_step": 412778, "epoch": 4973} {"train_loss": -26.207204818725586, "global_step": 412779, "epoch": 4973} {"train_loss": -26.1993350982666, "global_step": 412780, "epoch": 4973} {"train_loss": -26.596616744995117, "global_step": 412781, "epoch": 4973} {"train_loss": -26.393781661987305, "global_step": 412782, "epoch": 4973} {"train_loss": -26.261503219604492, "global_step": 412783, "epoch": 4973} {"train_loss": -26.166828155517578, "global_step": 412784, "epoch": 4973} {"train_loss": -26.357084274291992, "global_step": 412785, "epoch": 4973} {"train_loss": -26.325641632080078, "global_step": 412786, "epoch": 4973} {"train_loss": -26.27121925354004, "global_step": 412787, "epoch": 4973} {"train_loss": -26.433319091796875, "global_step": 412788, "epoch": 4973} {"train_loss": -26.469579696655273, "global_step": 412789, "epoch": 4973} {"train_loss": -26.39227867126465, "global_step": 412790, "epoch": 4973} {"train_loss": -26.49613380432129, "global_step": 412791, "epoch": 4973} {"train_loss": -26.379199981689453, "global_step": 412792, "epoch": 4973} {"train_loss": -26.61366081237793, "global_step": 412793, "epoch": 4973} {"train_loss": -26.257410049438477, "global_step": 412794, "epoch": 4973} {"train_loss": -26.62434196472168, "global_step": 412795, "epoch": 4973} {"train_loss": -26.605091094970703, "global_step": 412796, "epoch": 4973} {"train_loss": -26.632598876953125, "global_step": 412797, "epoch": 4973} {"train_loss": -26.5682373046875, "global_step": 412798, "epoch": 4973} {"train_loss": -26.814477920532227, "global_step": 412799, "epoch": 4973} {"train_loss": -26.673141479492188, "global_step": 412800, "epoch": 4973} {"train_loss": -27.0223388671875, "global_step": 412801, "epoch": 4973} {"train_loss": -26.8878231048584, "global_step": 412802, "epoch": 4973} {"train_loss": -26.825315475463867, "global_step": 412803, "epoch": 4973} {"train_loss": -27.080123901367188, "global_step": 412804, "epoch": 4973} {"train_loss": -26.8112850189209, "global_step": 412805, "epoch": 4973} {"train_loss": -26.8931884765625, "global_step": 412806, "epoch": 4973} {"train_loss": -26.646133422851562, "global_step": 412807, "epoch": 4973} {"train_loss": -26.680679321289062, "global_step": 412808, "epoch": 4973} {"train_loss": -26.901641845703125, "global_step": 412809, "epoch": 4973} {"train_loss": -26.809986114501953, "global_step": 412810, "epoch": 4973} {"train_loss": -26.856231689453125, "global_step": 412811, "epoch": 4973} {"train_loss": -26.5478458404541, "global_step": 412812, "epoch": 4973} {"train_loss": -26.866796493530273, "global_step": 412813, "epoch": 4973} {"train_loss": -27.105268478393555, "global_step": 412814, "epoch": 4973} {"train_loss": -26.61527442932129, "global_step": 412815, "epoch": 4973} {"train_loss": -26.961883544921875, "global_step": 412816, "epoch": 4973} {"train_loss": -26.79499626159668, "global_step": 412817, "epoch": 4973} {"train_loss": -26.581098556518555, "global_step": 412818, "epoch": 4973} {"train_loss": -26.843610763549805, "global_step": 412819, "epoch": 4973} {"train_loss": -26.556196212768555, "global_step": 412820, "epoch": 4973} {"train_loss": -26.67913246154785, "global_step": 412821, "epoch": 4973} {"train_loss": -26.85062026977539, "global_step": 412822, "epoch": 4973} {"train_loss": -26.716516494750977, "global_step": 412823, "epoch": 4973} {"train_loss": -26.757308959960938, "global_step": 412824, "epoch": 4973} {"train_loss": -26.345666885375977, "global_step": 412825, "epoch": 4973} {"train_loss": -26.529998779296875, "global_step": 412826, "epoch": 4973} {"train_loss": -27.03987693786621, "global_step": 412827, "epoch": 4973} {"train_loss": -26.705963134765625, "global_step": 412828, "epoch": 4973} {"train_loss": -26.623708724975586, "global_step": 412829, "epoch": 4973} {"train_loss": -26.5617618560791, "global_step": 412830, "epoch": 4973} {"train_loss": -27.00432777404785, "global_step": 412831, "epoch": 4973} {"train_loss": -26.895421981811523, "global_step": 412832, "epoch": 4973} {"train_loss": -26.574853897094727, "global_step": 412833, "epoch": 4973} {"train_loss": -26.72016716003418, "global_step": 412834, "epoch": 4973} {"train_loss": -26.855871200561523, "global_step": 412835, "epoch": 4973} {"train_loss": -26.865781784057617, "global_step": 412836, "epoch": 4973} {"train_loss": -26.947839736938477, "global_step": 412837, "epoch": 4973} {"train_loss": -27.176877975463867, "global_step": 412838, "epoch": 4973} {"train_loss": -27.11464500427246, "global_step": 412839, "epoch": 4973} {"train_loss": -26.711029052734375, "global_step": 412840, "epoch": 4973} {"train_loss": -26.44384090009942, "global_step": 412841, "epoch": 4973, "val_loss": 6622264.5} {"train_loss": -25.666086196899414, "global_step": 412842, "epoch": 4974} {"train_loss": -25.720539093017578, "global_step": 412843, "epoch": 4974} {"train_loss": -26.35906982421875, "global_step": 412844, "epoch": 4974} {"train_loss": -26.074996948242188, "global_step": 412845, "epoch": 4974} {"train_loss": -26.42826271057129, "global_step": 412846, "epoch": 4974} {"train_loss": -25.94422721862793, "global_step": 412847, "epoch": 4974} {"train_loss": -26.674896240234375, "global_step": 412848, "epoch": 4974} {"train_loss": -26.40511131286621, "global_step": 412849, "epoch": 4974} {"train_loss": -26.695547103881836, "global_step": 412850, "epoch": 4974} {"train_loss": -26.738245010375977, "global_step": 412851, "epoch": 4974} {"train_loss": -26.882766723632812, "global_step": 412852, "epoch": 4974} {"train_loss": -26.623212814331055, "global_step": 412853, "epoch": 4974} {"train_loss": -26.860748291015625, "global_step": 412854, "epoch": 4974} {"train_loss": -26.4578914642334, "global_step": 412855, "epoch": 4974} {"train_loss": -26.751922607421875, "global_step": 412856, "epoch": 4974} {"train_loss": -26.6175479888916, "global_step": 412857, "epoch": 4974} {"train_loss": -26.759946823120117, "global_step": 412858, "epoch": 4974} {"train_loss": -26.782276153564453, "global_step": 412859, "epoch": 4974} {"train_loss": -26.74521255493164, "global_step": 412860, "epoch": 4974} {"train_loss": -26.708837509155273, "global_step": 412861, "epoch": 4974} {"train_loss": -26.39510154724121, "global_step": 412862, "epoch": 4974} {"train_loss": -26.339990615844727, "global_step": 412863, "epoch": 4974} {"train_loss": -26.398412704467773, "global_step": 412864, "epoch": 4974} {"train_loss": -26.56446647644043, "global_step": 412865, "epoch": 4974} {"train_loss": -26.80042839050293, "global_step": 412866, "epoch": 4974} {"train_loss": -26.6883602142334, "global_step": 412867, "epoch": 4974} {"train_loss": -26.639623641967773, "global_step": 412868, "epoch": 4974} {"train_loss": -26.546377182006836, "global_step": 412869, "epoch": 4974} {"train_loss": -26.703474044799805, "global_step": 412870, "epoch": 4974} {"train_loss": -27.107696533203125, "global_step": 412871, "epoch": 4974} {"train_loss": -26.44045066833496, "global_step": 412872, "epoch": 4974} {"train_loss": -27.15399742126465, "global_step": 412873, "epoch": 4974} {"train_loss": -26.646198272705078, "global_step": 412874, "epoch": 4974} {"train_loss": -26.804401397705078, "global_step": 412875, "epoch": 4974} {"train_loss": -26.87127685546875, "global_step": 412876, "epoch": 4974} {"train_loss": -26.827817916870117, "global_step": 412877, "epoch": 4974} {"train_loss": -27.01056480407715, "global_step": 412878, "epoch": 4974} {"train_loss": -26.900976181030273, "global_step": 412879, "epoch": 4974} {"train_loss": -26.78030776977539, "global_step": 412880, "epoch": 4974} {"train_loss": -26.532470703125, "global_step": 412881, "epoch": 4974} {"train_loss": -26.690988540649414, "global_step": 412882, "epoch": 4974} {"train_loss": -26.999069213867188, "global_step": 412883, "epoch": 4974} {"train_loss": -26.681365966796875, "global_step": 412884, "epoch": 4974} {"train_loss": -26.65093421936035, "global_step": 412885, "epoch": 4974} {"train_loss": -26.84663963317871, "global_step": 412886, "epoch": 4974} {"train_loss": -26.901214599609375, "global_step": 412887, "epoch": 4974} {"train_loss": -26.515338897705078, "global_step": 412888, "epoch": 4974} {"train_loss": -26.51307487487793, "global_step": 412889, "epoch": 4974} {"train_loss": -26.795801162719727, "global_step": 412890, "epoch": 4974} {"train_loss": -27.085254669189453, "global_step": 412891, "epoch": 4974} {"train_loss": -26.93113136291504, "global_step": 412892, "epoch": 4974} {"train_loss": -26.783315658569336, "global_step": 412893, "epoch": 4974} {"train_loss": -26.673376083374023, "global_step": 412894, "epoch": 4974} {"train_loss": -26.741010665893555, "global_step": 412895, "epoch": 4974} {"train_loss": -26.3382625579834, "global_step": 412896, "epoch": 4974} {"train_loss": -26.8619327545166, "global_step": 412897, "epoch": 4974} {"train_loss": -26.87952995300293, "global_step": 412898, "epoch": 4974} {"train_loss": -26.828039169311523, "global_step": 412899, "epoch": 4974} {"train_loss": -26.704320907592773, "global_step": 412900, "epoch": 4974} {"train_loss": -26.605573654174805, "global_step": 412901, "epoch": 4974} {"train_loss": -26.953125, "global_step": 412902, "epoch": 4974} {"train_loss": -26.416807174682617, "global_step": 412903, "epoch": 4974} {"train_loss": -26.70326042175293, "global_step": 412904, "epoch": 4974} {"train_loss": -26.930500030517578, "global_step": 412905, "epoch": 4974} {"train_loss": -26.683963775634766, "global_step": 412906, "epoch": 4974} {"train_loss": -26.984872817993164, "global_step": 412907, "epoch": 4974} {"train_loss": -26.626434326171875, "global_step": 412908, "epoch": 4974} {"train_loss": -26.930463790893555, "global_step": 412909, "epoch": 4974} {"train_loss": -26.782941818237305, "global_step": 412910, "epoch": 4974} {"train_loss": -26.771413803100586, "global_step": 412911, "epoch": 4974} {"train_loss": -27.08123779296875, "global_step": 412912, "epoch": 4974} {"train_loss": -26.97041130065918, "global_step": 412913, "epoch": 4974} {"train_loss": -26.7740421295166, "global_step": 412914, "epoch": 4974} {"train_loss": -26.928247451782227, "global_step": 412915, "epoch": 4974} {"train_loss": -27.0374813079834, "global_step": 412916, "epoch": 4974} {"train_loss": -26.882171630859375, "global_step": 412917, "epoch": 4974} {"train_loss": -27.003711700439453, "global_step": 412918, "epoch": 4974} {"train_loss": -26.62384605407715, "global_step": 412919, "epoch": 4974} {"train_loss": -26.829730987548828, "global_step": 412920, "epoch": 4974} {"train_loss": -26.608869552612305, "global_step": 412921, "epoch": 4974} {"train_loss": -26.3428897857666, "global_step": 412922, "epoch": 4974} {"train_loss": -26.215463638305664, "global_step": 412923, "epoch": 4974} {"train_loss": -26.672787746751165, "global_step": 412924, "epoch": 4974, "val_loss": 6562273.0} {"train_loss": -26.401334762573242, "global_step": 412925, "epoch": 4975} {"train_loss": -26.16236686706543, "global_step": 412926, "epoch": 4975} {"train_loss": -25.8013858795166, "global_step": 412927, "epoch": 4975} {"train_loss": -26.512195587158203, "global_step": 412928, "epoch": 4975} {"train_loss": -26.49183464050293, "global_step": 412929, "epoch": 4975} {"train_loss": -25.459110260009766, "global_step": 412930, "epoch": 4975} {"train_loss": -26.55561637878418, "global_step": 412931, "epoch": 4975} {"train_loss": -26.37603187561035, "global_step": 412932, "epoch": 4975} {"train_loss": -26.078216552734375, "global_step": 412933, "epoch": 4975} {"train_loss": -26.58418083190918, "global_step": 412934, "epoch": 4975} {"train_loss": -26.348098754882812, "global_step": 412935, "epoch": 4975} {"train_loss": -26.011295318603516, "global_step": 412936, "epoch": 4975} {"train_loss": -26.21416664123535, "global_step": 412937, "epoch": 4975} {"train_loss": -26.250228881835938, "global_step": 412938, "epoch": 4975} {"train_loss": -26.767881393432617, "global_step": 412939, "epoch": 4975} {"train_loss": -26.532316207885742, "global_step": 412940, "epoch": 4975} {"train_loss": -26.458982467651367, "global_step": 412941, "epoch": 4975} {"train_loss": -26.634458541870117, "global_step": 412942, "epoch": 4975} {"train_loss": -26.409698486328125, "global_step": 412943, "epoch": 4975} {"train_loss": -26.802139282226562, "global_step": 412944, "epoch": 4975} {"train_loss": -26.721235275268555, "global_step": 412945, "epoch": 4975} {"train_loss": -26.544158935546875, "global_step": 412946, "epoch": 4975} {"train_loss": -26.647159576416016, "global_step": 412947, "epoch": 4975} {"train_loss": -26.7694034576416, "global_step": 412948, "epoch": 4975} {"train_loss": -26.336429595947266, "global_step": 412949, "epoch": 4975} {"train_loss": -26.732807159423828, "global_step": 412950, "epoch": 4975} {"train_loss": -26.704309463500977, "global_step": 412951, "epoch": 4975} {"train_loss": -26.941497802734375, "global_step": 412952, "epoch": 4975} {"train_loss": -26.586862564086914, "global_step": 412953, "epoch": 4975} {"train_loss": -26.369359970092773, "global_step": 412954, "epoch": 4975} {"train_loss": -26.802539825439453, "global_step": 412955, "epoch": 4975} {"train_loss": -26.44734001159668, "global_step": 412956, "epoch": 4975} {"train_loss": -26.919574737548828, "global_step": 412957, "epoch": 4975} {"train_loss": -26.508258819580078, "global_step": 412958, "epoch": 4975} {"train_loss": -26.6927490234375, "global_step": 412959, "epoch": 4975} {"train_loss": -26.86580467224121, "global_step": 412960, "epoch": 4975} {"train_loss": -26.632116317749023, "global_step": 412961, "epoch": 4975} {"train_loss": -26.819122314453125, "global_step": 412962, "epoch": 4975} {"train_loss": -27.18194007873535, "global_step": 412963, "epoch": 4975} {"train_loss": -26.80006217956543, "global_step": 412964, "epoch": 4975} {"train_loss": -26.555713653564453, "global_step": 412965, "epoch": 4975} {"train_loss": -26.682453155517578, "global_step": 412966, "epoch": 4975} {"train_loss": -26.789953231811523, "global_step": 412967, "epoch": 4975} {"train_loss": -26.543622970581055, "global_step": 412968, "epoch": 4975} {"train_loss": -26.914365768432617, "global_step": 412969, "epoch": 4975} {"train_loss": -26.894672393798828, "global_step": 412970, "epoch": 4975} {"train_loss": -26.9440975189209, "global_step": 412971, "epoch": 4975} {"train_loss": -27.21124839782715, "global_step": 412972, "epoch": 4975} {"train_loss": -26.984533309936523, "global_step": 412973, "epoch": 4975} {"train_loss": -26.78407859802246, "global_step": 412974, "epoch": 4975} {"train_loss": -26.468244552612305, "global_step": 412975, "epoch": 4975} {"train_loss": -27.102888107299805, "global_step": 412976, "epoch": 4975} {"train_loss": -26.294708251953125, "global_step": 412977, "epoch": 4975} {"train_loss": -27.035144805908203, "global_step": 412978, "epoch": 4975} {"train_loss": -26.471155166625977, "global_step": 412979, "epoch": 4975} {"train_loss": -26.451263427734375, "global_step": 412980, "epoch": 4975} {"train_loss": -26.328262329101562, "global_step": 412981, "epoch": 4975} {"train_loss": -26.1949405670166, "global_step": 412982, "epoch": 4975} {"train_loss": -26.666784286499023, "global_step": 412983, "epoch": 4975} {"train_loss": -26.72857093811035, "global_step": 412984, "epoch": 4975} {"train_loss": -26.417829513549805, "global_step": 412985, "epoch": 4975} {"train_loss": -26.153873443603516, "global_step": 412986, "epoch": 4975} {"train_loss": -26.056293487548828, "global_step": 412987, "epoch": 4975} {"train_loss": -26.459095001220703, "global_step": 412988, "epoch": 4975} {"train_loss": -26.51722526550293, "global_step": 412989, "epoch": 4975} {"train_loss": -26.15791130065918, "global_step": 412990, "epoch": 4975} {"train_loss": -26.373693466186523, "global_step": 412991, "epoch": 4975} {"train_loss": -26.886768341064453, "global_step": 412992, "epoch": 4975} {"train_loss": -26.34404945373535, "global_step": 412993, "epoch": 4975} {"train_loss": -26.626798629760742, "global_step": 412994, "epoch": 4975} {"train_loss": -26.48298454284668, "global_step": 412995, "epoch": 4975} {"train_loss": -26.543289184570312, "global_step": 412996, "epoch": 4975} {"train_loss": -26.70815086364746, "global_step": 412997, "epoch": 4975} {"train_loss": -26.5273494720459, "global_step": 412998, "epoch": 4975} {"train_loss": -26.67609214782715, "global_step": 412999, "epoch": 4975} {"train_loss": -26.797637939453125, "global_step": 413000, "epoch": 4975} {"train_loss": -26.761850357055664, "global_step": 413001, "epoch": 4975} {"train_loss": -26.997201919555664, "global_step": 413002, "epoch": 4975} {"train_loss": -26.87049674987793, "global_step": 413003, "epoch": 4975} {"train_loss": -26.551000595092773, "global_step": 413004, "epoch": 4975} {"train_loss": -26.49932289123535, "global_step": 413005, "epoch": 4975} {"train_loss": -26.75790786743164, "global_step": 413006, "epoch": 4975} {"train_loss": -26.589089749807336, "global_step": 413007, "epoch": 4975, "val_loss": 6482793.0} {"train_loss": -26.446334838867188, "global_step": 413008, "epoch": 4976} {"train_loss": -25.387121200561523, "global_step": 413009, "epoch": 4976} {"train_loss": -25.657804489135742, "global_step": 413010, "epoch": 4976} {"train_loss": -25.742420196533203, "global_step": 413011, "epoch": 4976} {"train_loss": -26.54766273498535, "global_step": 413012, "epoch": 4976} {"train_loss": -25.853897094726562, "global_step": 413013, "epoch": 4976} {"train_loss": -25.898120880126953, "global_step": 413014, "epoch": 4976} {"train_loss": -26.512470245361328, "global_step": 413015, "epoch": 4976} {"train_loss": -26.20001220703125, "global_step": 413016, "epoch": 4976} {"train_loss": -26.14704704284668, "global_step": 413017, "epoch": 4976} {"train_loss": -26.531457901000977, "global_step": 413018, "epoch": 4976} {"train_loss": -26.395919799804688, "global_step": 413019, "epoch": 4976} {"train_loss": -26.356748580932617, "global_step": 413020, "epoch": 4976} {"train_loss": -26.339599609375, "global_step": 413021, "epoch": 4976} {"train_loss": -26.490537643432617, "global_step": 413022, "epoch": 4976} {"train_loss": -26.482175827026367, "global_step": 413023, "epoch": 4976} {"train_loss": -26.208057403564453, "global_step": 413024, "epoch": 4976} {"train_loss": -26.313861846923828, "global_step": 413025, "epoch": 4976} {"train_loss": -26.21143913269043, "global_step": 413026, "epoch": 4976} {"train_loss": -26.396467208862305, "global_step": 413027, "epoch": 4976} {"train_loss": -26.2278995513916, "global_step": 413028, "epoch": 4976} {"train_loss": -26.167438507080078, "global_step": 413029, "epoch": 4976} {"train_loss": -26.380170822143555, "global_step": 413030, "epoch": 4976} {"train_loss": -26.66792869567871, "global_step": 413031, "epoch": 4976} {"train_loss": -26.050525665283203, "global_step": 413032, "epoch": 4976} {"train_loss": -26.195295333862305, "global_step": 413033, "epoch": 4976} {"train_loss": -26.952985763549805, "global_step": 413034, "epoch": 4976} {"train_loss": -26.251800537109375, "global_step": 413035, "epoch": 4976} {"train_loss": -26.312931060791016, "global_step": 413036, "epoch": 4976} {"train_loss": -26.30752944946289, "global_step": 413037, "epoch": 4976} {"train_loss": -27.029422760009766, "global_step": 413038, "epoch": 4976} {"train_loss": -26.844568252563477, "global_step": 413039, "epoch": 4976} {"train_loss": -26.757482528686523, "global_step": 413040, "epoch": 4976} {"train_loss": -26.73586082458496, "global_step": 413041, "epoch": 4976} {"train_loss": -26.606122970581055, "global_step": 413042, "epoch": 4976} {"train_loss": -26.80510902404785, "global_step": 413043, "epoch": 4976} {"train_loss": -26.659116744995117, "global_step": 413044, "epoch": 4976} {"train_loss": -27.08453369140625, "global_step": 413045, "epoch": 4976} {"train_loss": -26.6892147064209, "global_step": 413046, "epoch": 4976} {"train_loss": -27.026641845703125, "global_step": 413047, "epoch": 4976} {"train_loss": -27.0697078704834, "global_step": 413048, "epoch": 4976} {"train_loss": -26.9343204498291, "global_step": 413049, "epoch": 4976} {"train_loss": -26.77646827697754, "global_step": 413050, "epoch": 4976} {"train_loss": -26.504724502563477, "global_step": 413051, "epoch": 4976} {"train_loss": -27.13277244567871, "global_step": 413052, "epoch": 4976} {"train_loss": -26.581424713134766, "global_step": 413053, "epoch": 4976} {"train_loss": -26.360647201538086, "global_step": 413054, "epoch": 4976} {"train_loss": -27.23630714416504, "global_step": 413055, "epoch": 4976} {"train_loss": -26.770132064819336, "global_step": 413056, "epoch": 4976} {"train_loss": -26.80621337890625, "global_step": 413057, "epoch": 4976} {"train_loss": -26.836013793945312, "global_step": 413058, "epoch": 4976} {"train_loss": -26.956754684448242, "global_step": 413059, "epoch": 4976} {"train_loss": -26.72291374206543, "global_step": 413060, "epoch": 4976} {"train_loss": -26.494077682495117, "global_step": 413061, "epoch": 4976} {"train_loss": -26.5443172454834, "global_step": 413062, "epoch": 4976} {"train_loss": -26.77961540222168, "global_step": 413063, "epoch": 4976} {"train_loss": -26.78582763671875, "global_step": 413064, "epoch": 4976} {"train_loss": -26.64922523498535, "global_step": 413065, "epoch": 4976} {"train_loss": -26.873769760131836, "global_step": 413066, "epoch": 4976} {"train_loss": -27.106586456298828, "global_step": 413067, "epoch": 4976} {"train_loss": -26.9814395904541, "global_step": 413068, "epoch": 4976} {"train_loss": -27.249408721923828, "global_step": 413069, "epoch": 4976} {"train_loss": -26.678327560424805, "global_step": 413070, "epoch": 4976} {"train_loss": -26.865982055664062, "global_step": 413071, "epoch": 4976} {"train_loss": -27.106658935546875, "global_step": 413072, "epoch": 4976} {"train_loss": -26.89275550842285, "global_step": 413073, "epoch": 4976} {"train_loss": -26.897851943969727, "global_step": 413074, "epoch": 4976} {"train_loss": -26.227375030517578, "global_step": 413075, "epoch": 4976} {"train_loss": -26.223302841186523, "global_step": 413076, "epoch": 4976} {"train_loss": -26.205163955688477, "global_step": 413077, "epoch": 4976} {"train_loss": -26.757476806640625, "global_step": 413078, "epoch": 4976} {"train_loss": -26.810226440429688, "global_step": 413079, "epoch": 4976} {"train_loss": -26.821380615234375, "global_step": 413080, "epoch": 4976} {"train_loss": -26.812833786010742, "global_step": 413081, "epoch": 4976} {"train_loss": -27.027301788330078, "global_step": 413082, "epoch": 4976} {"train_loss": -26.813093185424805, "global_step": 413083, "epoch": 4976} {"train_loss": -27.019901275634766, "global_step": 413084, "epoch": 4976} {"train_loss": -26.60287857055664, "global_step": 413085, "epoch": 4976} {"train_loss": -26.315277099609375, "global_step": 413086, "epoch": 4976} {"train_loss": -26.497940063476562, "global_step": 413087, "epoch": 4976} {"train_loss": -27.44123649597168, "global_step": 413088, "epoch": 4976} {"train_loss": -26.8277645111084, "global_step": 413089, "epoch": 4976} {"train_loss": -26.579356549734094, "global_step": 413090, "epoch": 4976, "val_loss": 6513953.5} {"train_loss": -26.520620346069336, "global_step": 413091, "epoch": 4977} {"train_loss": -26.08136558532715, "global_step": 413092, "epoch": 4977} {"train_loss": -25.548843383789062, "global_step": 413093, "epoch": 4977} {"train_loss": -26.421401977539062, "global_step": 413094, "epoch": 4977} {"train_loss": -26.605222702026367, "global_step": 413095, "epoch": 4977} {"train_loss": -26.633512496948242, "global_step": 413096, "epoch": 4977} {"train_loss": -26.661645889282227, "global_step": 413097, "epoch": 4977} {"train_loss": -26.582304000854492, "global_step": 413098, "epoch": 4977} {"train_loss": -26.39990234375, "global_step": 413099, "epoch": 4977} {"train_loss": -26.910619735717773, "global_step": 413100, "epoch": 4977} {"train_loss": -26.426456451416016, "global_step": 413101, "epoch": 4977} {"train_loss": -26.766000747680664, "global_step": 413102, "epoch": 4977} {"train_loss": -26.73636817932129, "global_step": 413103, "epoch": 4977} {"train_loss": -26.840591430664062, "global_step": 413104, "epoch": 4977} {"train_loss": -26.692554473876953, "global_step": 413105, "epoch": 4977} {"train_loss": -26.629941940307617, "global_step": 413106, "epoch": 4977} {"train_loss": -27.022314071655273, "global_step": 413107, "epoch": 4977} {"train_loss": -26.28513526916504, "global_step": 413108, "epoch": 4977} {"train_loss": -26.97498893737793, "global_step": 413109, "epoch": 4977} {"train_loss": -26.780134201049805, "global_step": 413110, "epoch": 4977} {"train_loss": -26.447162628173828, "global_step": 413111, "epoch": 4977} {"train_loss": -26.61212730407715, "global_step": 413112, "epoch": 4977} {"train_loss": -26.82459831237793, "global_step": 413113, "epoch": 4977} {"train_loss": -26.969205856323242, "global_step": 413114, "epoch": 4977} {"train_loss": -26.745420455932617, "global_step": 413115, "epoch": 4977} {"train_loss": -26.583118438720703, "global_step": 413116, "epoch": 4977} {"train_loss": -26.56874656677246, "global_step": 413117, "epoch": 4977} {"train_loss": -26.703962326049805, "global_step": 413118, "epoch": 4977} {"train_loss": -26.674142837524414, "global_step": 413119, "epoch": 4977} {"train_loss": -26.75629234313965, "global_step": 413120, "epoch": 4977} {"train_loss": -26.75379753112793, "global_step": 413121, "epoch": 4977} {"train_loss": -26.641815185546875, "global_step": 413122, "epoch": 4977} {"train_loss": -26.545495986938477, "global_step": 413123, "epoch": 4977} {"train_loss": -26.551040649414062, "global_step": 413124, "epoch": 4977} {"train_loss": -26.9956111907959, "global_step": 413125, "epoch": 4977} {"train_loss": -26.626272201538086, "global_step": 413126, "epoch": 4977} {"train_loss": -26.777191162109375, "global_step": 413127, "epoch": 4977} {"train_loss": -26.96990394592285, "global_step": 413128, "epoch": 4977} {"train_loss": -26.703134536743164, "global_step": 413129, "epoch": 4977} {"train_loss": -26.810361862182617, "global_step": 413130, "epoch": 4977} {"train_loss": -26.749637603759766, "global_step": 413131, "epoch": 4977} {"train_loss": -27.10772132873535, "global_step": 413132, "epoch": 4977} {"train_loss": -27.21259880065918, "global_step": 413133, "epoch": 4977} {"train_loss": -26.631372451782227, "global_step": 413134, "epoch": 4977} {"train_loss": -26.65887451171875, "global_step": 413135, "epoch": 4977} {"train_loss": -27.137537002563477, "global_step": 413136, "epoch": 4977} {"train_loss": -26.8417911529541, "global_step": 413137, "epoch": 4977} {"train_loss": -26.747882843017578, "global_step": 413138, "epoch": 4977} {"train_loss": -26.77583122253418, "global_step": 413139, "epoch": 4977} {"train_loss": -26.56184959411621, "global_step": 413140, "epoch": 4977} {"train_loss": -26.856115341186523, "global_step": 413141, "epoch": 4977} {"train_loss": -27.036718368530273, "global_step": 413142, "epoch": 4977} {"train_loss": -27.113367080688477, "global_step": 413143, "epoch": 4977} {"train_loss": -26.60394859313965, "global_step": 413144, "epoch": 4977} {"train_loss": -26.659839630126953, "global_step": 413145, "epoch": 4977} {"train_loss": -26.6260986328125, "global_step": 413146, "epoch": 4977} {"train_loss": -26.462173461914062, "global_step": 413147, "epoch": 4977} {"train_loss": -26.59183692932129, "global_step": 413148, "epoch": 4977} {"train_loss": -26.723440170288086, "global_step": 413149, "epoch": 4977} {"train_loss": -26.763813018798828, "global_step": 413150, "epoch": 4977} {"train_loss": -26.885940551757812, "global_step": 413151, "epoch": 4977} {"train_loss": -26.90414810180664, "global_step": 413152, "epoch": 4977} {"train_loss": -26.371601104736328, "global_step": 413153, "epoch": 4977} {"train_loss": -26.815204620361328, "global_step": 413154, "epoch": 4977} {"train_loss": -26.934051513671875, "global_step": 413155, "epoch": 4977} {"train_loss": -27.075780868530273, "global_step": 413156, "epoch": 4977} {"train_loss": -26.94815444946289, "global_step": 413157, "epoch": 4977} {"train_loss": -26.972497940063477, "global_step": 413158, "epoch": 4977} {"train_loss": -27.029621124267578, "global_step": 413159, "epoch": 4977} {"train_loss": -26.877233505249023, "global_step": 413160, "epoch": 4977} {"train_loss": -26.80508804321289, "global_step": 413161, "epoch": 4977} {"train_loss": -26.940387725830078, "global_step": 413162, "epoch": 4977} {"train_loss": -26.693317413330078, "global_step": 413163, "epoch": 4977} {"train_loss": -27.142627716064453, "global_step": 413164, "epoch": 4977} {"train_loss": -26.877124786376953, "global_step": 413165, "epoch": 4977} {"train_loss": -26.733945846557617, "global_step": 413166, "epoch": 4977} {"train_loss": -26.531864166259766, "global_step": 413167, "epoch": 4977} {"train_loss": -26.301258087158203, "global_step": 413168, "epoch": 4977} {"train_loss": -26.683399200439453, "global_step": 413169, "epoch": 4977} {"train_loss": -26.68170166015625, "global_step": 413170, "epoch": 4977} {"train_loss": -26.275390625, "global_step": 413171, "epoch": 4977} {"train_loss": -26.4876708984375, "global_step": 413172, "epoch": 4977} {"train_loss": -26.70821091065924, "global_step": 413173, "epoch": 4977, "val_loss": 6596735.0} {"train_loss": -25.18271827697754, "global_step": 413174, "epoch": 4978} {"train_loss": -25.567785263061523, "global_step": 413175, "epoch": 4978} {"train_loss": -25.805994033813477, "global_step": 413176, "epoch": 4978} {"train_loss": -25.115278244018555, "global_step": 413177, "epoch": 4978} {"train_loss": -25.62093162536621, "global_step": 413178, "epoch": 4978} {"train_loss": -25.940326690673828, "global_step": 413179, "epoch": 4978} {"train_loss": -26.388513565063477, "global_step": 413180, "epoch": 4978} {"train_loss": -26.18548583984375, "global_step": 413181, "epoch": 4978} {"train_loss": -26.019046783447266, "global_step": 413182, "epoch": 4978} {"train_loss": -26.23731803894043, "global_step": 413183, "epoch": 4978} {"train_loss": -26.016098022460938, "global_step": 413184, "epoch": 4978} {"train_loss": -26.3179931640625, "global_step": 413185, "epoch": 4978} {"train_loss": -26.386770248413086, "global_step": 413186, "epoch": 4978} {"train_loss": -26.580902099609375, "global_step": 413187, "epoch": 4978} {"train_loss": -26.341588973999023, "global_step": 413188, "epoch": 4978} {"train_loss": -26.455841064453125, "global_step": 413189, "epoch": 4978} {"train_loss": -26.385818481445312, "global_step": 413190, "epoch": 4978} {"train_loss": -26.739490509033203, "global_step": 413191, "epoch": 4978} {"train_loss": -26.71857261657715, "global_step": 413192, "epoch": 4978} {"train_loss": -26.389633178710938, "global_step": 413193, "epoch": 4978} {"train_loss": -26.558752059936523, "global_step": 413194, "epoch": 4978} {"train_loss": -26.90738296508789, "global_step": 413195, "epoch": 4978} {"train_loss": -26.531431198120117, "global_step": 413196, "epoch": 4978} {"train_loss": -26.682540893554688, "global_step": 413197, "epoch": 4978} {"train_loss": -26.559070587158203, "global_step": 413198, "epoch": 4978} {"train_loss": -26.651687622070312, "global_step": 413199, "epoch": 4978} {"train_loss": -26.729145050048828, "global_step": 413200, "epoch": 4978} {"train_loss": -27.028045654296875, "global_step": 413201, "epoch": 4978} {"train_loss": -26.595190048217773, "global_step": 413202, "epoch": 4978} {"train_loss": -26.3692626953125, "global_step": 413203, "epoch": 4978} {"train_loss": -26.705814361572266, "global_step": 413204, "epoch": 4978} {"train_loss": -26.86122703552246, "global_step": 413205, "epoch": 4978} {"train_loss": -26.673009872436523, "global_step": 413206, "epoch": 4978} {"train_loss": -26.620243072509766, "global_step": 413207, "epoch": 4978} {"train_loss": -26.867345809936523, "global_step": 413208, "epoch": 4978} {"train_loss": -26.77998161315918, "global_step": 413209, "epoch": 4978} {"train_loss": -26.68195152282715, "global_step": 413210, "epoch": 4978} {"train_loss": -26.48563575744629, "global_step": 413211, "epoch": 4978} {"train_loss": -26.74506950378418, "global_step": 413212, "epoch": 4978} {"train_loss": -26.5937442779541, "global_step": 413213, "epoch": 4978} {"train_loss": -26.774694442749023, "global_step": 413214, "epoch": 4978} {"train_loss": -26.99037742614746, "global_step": 413215, "epoch": 4978} {"train_loss": -26.76373863220215, "global_step": 413216, "epoch": 4978} {"train_loss": -26.78461265563965, "global_step": 413217, "epoch": 4978} {"train_loss": -26.99698257446289, "global_step": 413218, "epoch": 4978} {"train_loss": -26.639799118041992, "global_step": 413219, "epoch": 4978} {"train_loss": -26.573429107666016, "global_step": 413220, "epoch": 4978} {"train_loss": -26.398916244506836, "global_step": 413221, "epoch": 4978} {"train_loss": -26.43073081970215, "global_step": 413222, "epoch": 4978} {"train_loss": -26.493606567382812, "global_step": 413223, "epoch": 4978} {"train_loss": -26.782846450805664, "global_step": 413224, "epoch": 4978} {"train_loss": -26.967761993408203, "global_step": 413225, "epoch": 4978} {"train_loss": -26.926776885986328, "global_step": 413226, "epoch": 4978} {"train_loss": -26.815784454345703, "global_step": 413227, "epoch": 4978} {"train_loss": -26.553741455078125, "global_step": 413228, "epoch": 4978} {"train_loss": -27.25886344909668, "global_step": 413229, "epoch": 4978} {"train_loss": -26.795093536376953, "global_step": 413230, "epoch": 4978} {"train_loss": -27.005359649658203, "global_step": 413231, "epoch": 4978} {"train_loss": -26.977216720581055, "global_step": 413232, "epoch": 4978} {"train_loss": -27.1468505859375, "global_step": 413233, "epoch": 4978} {"train_loss": -27.04770851135254, "global_step": 413234, "epoch": 4978} {"train_loss": -26.99175453186035, "global_step": 413235, "epoch": 4978} {"train_loss": -26.680158615112305, "global_step": 413236, "epoch": 4978} {"train_loss": -26.436674118041992, "global_step": 413237, "epoch": 4978} {"train_loss": -26.2191219329834, "global_step": 413238, "epoch": 4978} {"train_loss": -25.3211612701416, "global_step": 413239, "epoch": 4978} {"train_loss": -23.419580459594727, "global_step": 413240, "epoch": 4978} {"train_loss": -22.88282585144043, "global_step": 413241, "epoch": 4978} {"train_loss": -25.247894287109375, "global_step": 413242, "epoch": 4978} {"train_loss": -25.537216186523438, "global_step": 413243, "epoch": 4978} {"train_loss": -25.555252075195312, "global_step": 413244, "epoch": 4978} {"train_loss": -26.088058471679688, "global_step": 413245, "epoch": 4978} {"train_loss": -25.88299560546875, "global_step": 413246, "epoch": 4978} {"train_loss": -25.993331909179688, "global_step": 413247, "epoch": 4978} {"train_loss": -26.270788192749023, "global_step": 413248, "epoch": 4978} {"train_loss": -26.092077255249023, "global_step": 413249, "epoch": 4978} {"train_loss": -26.193984985351562, "global_step": 413250, "epoch": 4978} {"train_loss": -26.03822135925293, "global_step": 413251, "epoch": 4978} {"train_loss": -26.4018497467041, "global_step": 413252, "epoch": 4978} {"train_loss": -26.185943603515625, "global_step": 413253, "epoch": 4978} {"train_loss": -25.93829345703125, "global_step": 413254, "epoch": 4978} {"train_loss": -26.127389907836914, "global_step": 413255, "epoch": 4978} {"train_loss": -26.340213361992895, "global_step": 413256, "epoch": 4978, "val_loss": 6572291.0} {"train_loss": -25.984405517578125, "global_step": 413257, "epoch": 4979} {"train_loss": -26.097883224487305, "global_step": 413258, "epoch": 4979} {"train_loss": -26.020055770874023, "global_step": 413259, "epoch": 4979} {"train_loss": -26.19797706604004, "global_step": 413260, "epoch": 4979} {"train_loss": -25.769010543823242, "global_step": 413261, "epoch": 4979} {"train_loss": -26.115478515625, "global_step": 413262, "epoch": 4979} {"train_loss": -26.14167594909668, "global_step": 413263, "epoch": 4979} {"train_loss": -26.193740844726562, "global_step": 413264, "epoch": 4979} {"train_loss": -26.603168487548828, "global_step": 413265, "epoch": 4979} {"train_loss": -26.7432804107666, "global_step": 413266, "epoch": 4979} {"train_loss": -26.318395614624023, "global_step": 413267, "epoch": 4979} {"train_loss": -26.459272384643555, "global_step": 413268, "epoch": 4979} {"train_loss": -26.2229061126709, "global_step": 413269, "epoch": 4979} {"train_loss": -26.188995361328125, "global_step": 413270, "epoch": 4979} {"train_loss": -26.3178653717041, "global_step": 413271, "epoch": 4979} {"train_loss": -26.664636611938477, "global_step": 413272, "epoch": 4979} {"train_loss": -26.847492218017578, "global_step": 413273, "epoch": 4979} {"train_loss": -26.45197105407715, "global_step": 413274, "epoch": 4979} {"train_loss": -27.03108024597168, "global_step": 413275, "epoch": 4979} {"train_loss": -26.09693717956543, "global_step": 413276, "epoch": 4979} {"train_loss": -26.53995132446289, "global_step": 413277, "epoch": 4979} {"train_loss": -26.7661075592041, "global_step": 413278, "epoch": 4979} {"train_loss": -26.456897735595703, "global_step": 413279, "epoch": 4979} {"train_loss": -26.601276397705078, "global_step": 413280, "epoch": 4979} {"train_loss": -26.614166259765625, "global_step": 413281, "epoch": 4979} {"train_loss": -26.577667236328125, "global_step": 413282, "epoch": 4979} {"train_loss": -26.609710693359375, "global_step": 413283, "epoch": 4979} {"train_loss": -26.44234275817871, "global_step": 413284, "epoch": 4979} {"train_loss": -26.93722915649414, "global_step": 413285, "epoch": 4979} {"train_loss": -26.873273849487305, "global_step": 413286, "epoch": 4979} {"train_loss": -26.679931640625, "global_step": 413287, "epoch": 4979} {"train_loss": -26.616872787475586, "global_step": 413288, "epoch": 4979} {"train_loss": -26.3461971282959, "global_step": 413289, "epoch": 4979} {"train_loss": -26.707508087158203, "global_step": 413290, "epoch": 4979} {"train_loss": -26.51759147644043, "global_step": 413291, "epoch": 4979} {"train_loss": -27.025373458862305, "global_step": 413292, "epoch": 4979} {"train_loss": -26.80734634399414, "global_step": 413293, "epoch": 4979} {"train_loss": -26.86159324645996, "global_step": 413294, "epoch": 4979} {"train_loss": -26.716617584228516, "global_step": 413295, "epoch": 4979} {"train_loss": -26.685150146484375, "global_step": 413296, "epoch": 4979} {"train_loss": -26.85822105407715, "global_step": 413297, "epoch": 4979} {"train_loss": -26.964385986328125, "global_step": 413298, "epoch": 4979} {"train_loss": -26.785247802734375, "global_step": 413299, "epoch": 4979} {"train_loss": -26.968236923217773, "global_step": 413300, "epoch": 4979} {"train_loss": -27.180389404296875, "global_step": 413301, "epoch": 4979} {"train_loss": -26.89013671875, "global_step": 413302, "epoch": 4979} {"train_loss": -26.95745277404785, "global_step": 413303, "epoch": 4979} {"train_loss": -26.80816078186035, "global_step": 413304, "epoch": 4979} {"train_loss": -26.871549606323242, "global_step": 413305, "epoch": 4979} {"train_loss": -26.701826095581055, "global_step": 413306, "epoch": 4979} {"train_loss": -26.648481369018555, "global_step": 413307, "epoch": 4979} {"train_loss": -27.128952026367188, "global_step": 413308, "epoch": 4979} {"train_loss": -26.552661895751953, "global_step": 413309, "epoch": 4979} {"train_loss": -26.651920318603516, "global_step": 413310, "epoch": 4979} {"train_loss": -26.636112213134766, "global_step": 413311, "epoch": 4979} {"train_loss": -26.331832885742188, "global_step": 413312, "epoch": 4979} {"train_loss": -26.864877700805664, "global_step": 413313, "epoch": 4979} {"train_loss": -26.76215171813965, "global_step": 413314, "epoch": 4979} {"train_loss": -26.783533096313477, "global_step": 413315, "epoch": 4979} {"train_loss": -26.59765625, "global_step": 413316, "epoch": 4979} {"train_loss": -26.546173095703125, "global_step": 413317, "epoch": 4979} {"train_loss": -27.012659072875977, "global_step": 413318, "epoch": 4979} {"train_loss": -26.900787353515625, "global_step": 413319, "epoch": 4979} {"train_loss": -26.652679443359375, "global_step": 413320, "epoch": 4979} {"train_loss": -26.940601348876953, "global_step": 413321, "epoch": 4979} {"train_loss": -26.725696563720703, "global_step": 413322, "epoch": 4979} {"train_loss": -26.875446319580078, "global_step": 413323, "epoch": 4979} {"train_loss": -26.710330963134766, "global_step": 413324, "epoch": 4979} {"train_loss": -26.937448501586914, "global_step": 413325, "epoch": 4979} {"train_loss": -26.714086532592773, "global_step": 413326, "epoch": 4979} {"train_loss": -26.86029052734375, "global_step": 413327, "epoch": 4979} {"train_loss": -26.715063095092773, "global_step": 413328, "epoch": 4979} {"train_loss": -26.63276481628418, "global_step": 413329, "epoch": 4979} {"train_loss": -27.166156768798828, "global_step": 413330, "epoch": 4979} {"train_loss": -26.668996810913086, "global_step": 413331, "epoch": 4979} {"train_loss": -27.0555419921875, "global_step": 413332, "epoch": 4979} {"train_loss": -26.908008575439453, "global_step": 413333, "epoch": 4979} {"train_loss": -26.886444091796875, "global_step": 413334, "epoch": 4979} {"train_loss": -27.12550163269043, "global_step": 413335, "epoch": 4979} {"train_loss": -26.6795597076416, "global_step": 413336, "epoch": 4979} {"train_loss": -26.52449607849121, "global_step": 413337, "epoch": 4979} {"train_loss": -26.939619064331055, "global_step": 413338, "epoch": 4979} {"train_loss": -26.650986613997492, "global_step": 413339, "epoch": 4979, "val_loss": 6637526.0} {"train_loss": -26.776269912719727, "global_step": 413340, "epoch": 4980} {"train_loss": -26.157806396484375, "global_step": 413341, "epoch": 4980} {"train_loss": -26.25591468811035, "global_step": 413342, "epoch": 4980} {"train_loss": -26.022653579711914, "global_step": 413343, "epoch": 4980} {"train_loss": -26.4970645904541, "global_step": 413344, "epoch": 4980} {"train_loss": -26.1768798828125, "global_step": 413345, "epoch": 4980} {"train_loss": -26.6164493560791, "global_step": 413346, "epoch": 4980} {"train_loss": -26.107471466064453, "global_step": 413347, "epoch": 4980} {"train_loss": -26.082067489624023, "global_step": 413348, "epoch": 4980} {"train_loss": -25.960556030273438, "global_step": 413349, "epoch": 4980} {"train_loss": -26.66202735900879, "global_step": 413350, "epoch": 4980} {"train_loss": -26.314207077026367, "global_step": 413351, "epoch": 4980} {"train_loss": -26.507526397705078, "global_step": 413352, "epoch": 4980} {"train_loss": -26.6260986328125, "global_step": 413353, "epoch": 4980} {"train_loss": -26.781829833984375, "global_step": 413354, "epoch": 4980} {"train_loss": -26.505935668945312, "global_step": 413355, "epoch": 4980} {"train_loss": -26.6524715423584, "global_step": 413356, "epoch": 4980} {"train_loss": -26.45041275024414, "global_step": 413357, "epoch": 4980} {"train_loss": -26.783918380737305, "global_step": 413358, "epoch": 4980} {"train_loss": -26.4156494140625, "global_step": 413359, "epoch": 4980} {"train_loss": -26.42963218688965, "global_step": 413360, "epoch": 4980} {"train_loss": -26.834552764892578, "global_step": 413361, "epoch": 4980} {"train_loss": -26.87360954284668, "global_step": 413362, "epoch": 4980} {"train_loss": -27.045251846313477, "global_step": 413363, "epoch": 4980} {"train_loss": -26.642587661743164, "global_step": 413364, "epoch": 4980} {"train_loss": -26.832096099853516, "global_step": 413365, "epoch": 4980} {"train_loss": -26.4603271484375, "global_step": 413366, "epoch": 4980} {"train_loss": -27.013355255126953, "global_step": 413367, "epoch": 4980} {"train_loss": -26.6749210357666, "global_step": 413368, "epoch": 4980} {"train_loss": -26.502649307250977, "global_step": 413369, "epoch": 4980} {"train_loss": -26.79157066345215, "global_step": 413370, "epoch": 4980} {"train_loss": -26.98261833190918, "global_step": 413371, "epoch": 4980} {"train_loss": -26.750577926635742, "global_step": 413372, "epoch": 4980} {"train_loss": -27.019989013671875, "global_step": 413373, "epoch": 4980} {"train_loss": -26.962024688720703, "global_step": 413374, "epoch": 4980} {"train_loss": -26.82697868347168, "global_step": 413375, "epoch": 4980} {"train_loss": -27.0100154876709, "global_step": 413376, "epoch": 4980} {"train_loss": -26.774694442749023, "global_step": 413377, "epoch": 4980} {"train_loss": -27.07892417907715, "global_step": 413378, "epoch": 4980} {"train_loss": -27.131017684936523, "global_step": 413379, "epoch": 4980} {"train_loss": -26.60909080505371, "global_step": 413380, "epoch": 4980} {"train_loss": -26.86846351623535, "global_step": 413381, "epoch": 4980} {"train_loss": -26.799036026000977, "global_step": 413382, "epoch": 4980} {"train_loss": -26.705713272094727, "global_step": 413383, "epoch": 4980} {"train_loss": -26.760223388671875, "global_step": 413384, "epoch": 4980} {"train_loss": -27.3302001953125, "global_step": 413385, "epoch": 4980} {"train_loss": -26.808374404907227, "global_step": 413386, "epoch": 4980} {"train_loss": -26.971017837524414, "global_step": 413387, "epoch": 4980} {"train_loss": -26.85270118713379, "global_step": 413388, "epoch": 4980} {"train_loss": -27.01190757751465, "global_step": 413389, "epoch": 4980} {"train_loss": -26.83933448791504, "global_step": 413390, "epoch": 4980} {"train_loss": -26.82379722595215, "global_step": 413391, "epoch": 4980} {"train_loss": -26.831897735595703, "global_step": 413392, "epoch": 4980} {"train_loss": -26.753942489624023, "global_step": 413393, "epoch": 4980} {"train_loss": -26.682327270507812, "global_step": 413394, "epoch": 4980} {"train_loss": -26.79225730895996, "global_step": 413395, "epoch": 4980} {"train_loss": -26.778919219970703, "global_step": 413396, "epoch": 4980} {"train_loss": -27.015472412109375, "global_step": 413397, "epoch": 4980} {"train_loss": -26.4826717376709, "global_step": 413398, "epoch": 4980} {"train_loss": -26.959089279174805, "global_step": 413399, "epoch": 4980} {"train_loss": -27.049152374267578, "global_step": 413400, "epoch": 4980} {"train_loss": -26.616153717041016, "global_step": 413401, "epoch": 4980} {"train_loss": -26.5223445892334, "global_step": 413402, "epoch": 4980} {"train_loss": -26.43189811706543, "global_step": 413403, "epoch": 4980} {"train_loss": -26.798187255859375, "global_step": 413404, "epoch": 4980} {"train_loss": -26.659887313842773, "global_step": 413405, "epoch": 4980} {"train_loss": -26.24299430847168, "global_step": 413406, "epoch": 4980} {"train_loss": -26.649023056030273, "global_step": 413407, "epoch": 4980} {"train_loss": -26.477468490600586, "global_step": 413408, "epoch": 4980} {"train_loss": -26.470794677734375, "global_step": 413409, "epoch": 4980} {"train_loss": -26.820322036743164, "global_step": 413410, "epoch": 4980} {"train_loss": -26.279001235961914, "global_step": 413411, "epoch": 4980} {"train_loss": -26.148160934448242, "global_step": 413412, "epoch": 4980} {"train_loss": -26.495941162109375, "global_step": 413413, "epoch": 4980} {"train_loss": -26.25204849243164, "global_step": 413414, "epoch": 4980} {"train_loss": -26.15268325805664, "global_step": 413415, "epoch": 4980} {"train_loss": -26.495075225830078, "global_step": 413416, "epoch": 4980} {"train_loss": -26.69178581237793, "global_step": 413417, "epoch": 4980} {"train_loss": -26.2078914642334, "global_step": 413418, "epoch": 4980} {"train_loss": -26.43341064453125, "global_step": 413419, "epoch": 4980} {"train_loss": -25.940311431884766, "global_step": 413420, "epoch": 4980} {"train_loss": -26.543994903564453, "global_step": 413421, "epoch": 4980} {"train_loss": -26.619011040193488, "global_step": 413422, "epoch": 4980, "val_loss": 6565913.0} {"train_loss": -26.161407470703125, "global_step": 413423, "epoch": 4981} {"train_loss": -25.6643123626709, "global_step": 413424, "epoch": 4981} {"train_loss": -26.18182373046875, "global_step": 413425, "epoch": 4981} {"train_loss": -26.07074546813965, "global_step": 413426, "epoch": 4981} {"train_loss": -26.53143882751465, "global_step": 413427, "epoch": 4981} {"train_loss": -26.120771408081055, "global_step": 413428, "epoch": 4981} {"train_loss": -25.985326766967773, "global_step": 413429, "epoch": 4981} {"train_loss": -26.007904052734375, "global_step": 413430, "epoch": 4981} {"train_loss": -25.586191177368164, "global_step": 413431, "epoch": 4981} {"train_loss": -26.257251739501953, "global_step": 413432, "epoch": 4981} {"train_loss": -26.232553482055664, "global_step": 413433, "epoch": 4981} {"train_loss": -26.253376007080078, "global_step": 413434, "epoch": 4981} {"train_loss": -26.05096435546875, "global_step": 413435, "epoch": 4981} {"train_loss": -26.31702995300293, "global_step": 413436, "epoch": 4981} {"train_loss": -26.392181396484375, "global_step": 413437, "epoch": 4981} {"train_loss": -25.960046768188477, "global_step": 413438, "epoch": 4981} {"train_loss": -26.41259765625, "global_step": 413439, "epoch": 4981} {"train_loss": -26.562976837158203, "global_step": 413440, "epoch": 4981} {"train_loss": -26.655517578125, "global_step": 413441, "epoch": 4981} {"train_loss": -26.072458267211914, "global_step": 413442, "epoch": 4981} {"train_loss": -26.491369247436523, "global_step": 413443, "epoch": 4981} {"train_loss": -26.401443481445312, "global_step": 413444, "epoch": 4981} {"train_loss": -26.701812744140625, "global_step": 413445, "epoch": 4981} {"train_loss": -26.43653678894043, "global_step": 413446, "epoch": 4981} {"train_loss": -26.69611167907715, "global_step": 413447, "epoch": 4981} {"train_loss": -26.85651206970215, "global_step": 413448, "epoch": 4981} {"train_loss": -26.423688888549805, "global_step": 413449, "epoch": 4981} {"train_loss": -26.55524253845215, "global_step": 413450, "epoch": 4981} {"train_loss": -26.951269149780273, "global_step": 413451, "epoch": 4981} {"train_loss": -26.81818199157715, "global_step": 413452, "epoch": 4981} {"train_loss": -27.040571212768555, "global_step": 413453, "epoch": 4981} {"train_loss": -26.604455947875977, "global_step": 413454, "epoch": 4981} {"train_loss": -26.703454971313477, "global_step": 413455, "epoch": 4981} {"train_loss": -26.569934844970703, "global_step": 413456, "epoch": 4981} {"train_loss": -26.869354248046875, "global_step": 413457, "epoch": 4981} {"train_loss": -27.124149322509766, "global_step": 413458, "epoch": 4981} {"train_loss": -26.808338165283203, "global_step": 413459, "epoch": 4981} {"train_loss": -27.234655380249023, "global_step": 413460, "epoch": 4981} {"train_loss": -26.882938385009766, "global_step": 413461, "epoch": 4981} {"train_loss": -26.474964141845703, "global_step": 413462, "epoch": 4981} {"train_loss": -27.412799835205078, "global_step": 413463, "epoch": 4981} {"train_loss": -26.78132438659668, "global_step": 413464, "epoch": 4981} {"train_loss": -26.9310359954834, "global_step": 413465, "epoch": 4981} {"train_loss": -27.10359764099121, "global_step": 413466, "epoch": 4981} {"train_loss": -26.919965744018555, "global_step": 413467, "epoch": 4981} {"train_loss": -26.798954010009766, "global_step": 413468, "epoch": 4981} {"train_loss": -27.0334529876709, "global_step": 413469, "epoch": 4981} {"train_loss": -27.0518856048584, "global_step": 413470, "epoch": 4981} {"train_loss": -27.040876388549805, "global_step": 413471, "epoch": 4981} {"train_loss": -26.829381942749023, "global_step": 413472, "epoch": 4981} {"train_loss": -26.900074005126953, "global_step": 413473, "epoch": 4981} {"train_loss": -26.796161651611328, "global_step": 413474, "epoch": 4981} {"train_loss": -27.045490264892578, "global_step": 413475, "epoch": 4981} {"train_loss": -26.586429595947266, "global_step": 413476, "epoch": 4981} {"train_loss": -26.82098960876465, "global_step": 413477, "epoch": 4981} {"train_loss": -26.22190284729004, "global_step": 413478, "epoch": 4981} {"train_loss": -26.008825302124023, "global_step": 413479, "epoch": 4981} {"train_loss": -26.667877197265625, "global_step": 413480, "epoch": 4981} {"train_loss": -26.428842544555664, "global_step": 413481, "epoch": 4981} {"train_loss": -26.432035446166992, "global_step": 413482, "epoch": 4981} {"train_loss": -26.99420738220215, "global_step": 413483, "epoch": 4981} {"train_loss": -26.26028823852539, "global_step": 413484, "epoch": 4981} {"train_loss": -26.79937171936035, "global_step": 413485, "epoch": 4981} {"train_loss": -26.3804988861084, "global_step": 413486, "epoch": 4981} {"train_loss": -26.8216552734375, "global_step": 413487, "epoch": 4981} {"train_loss": -26.37654685974121, "global_step": 413488, "epoch": 4981} {"train_loss": -25.66023826599121, "global_step": 413489, "epoch": 4981} {"train_loss": -26.672901153564453, "global_step": 413490, "epoch": 4981} {"train_loss": -26.4180850982666, "global_step": 413491, "epoch": 4981} {"train_loss": -26.945348739624023, "global_step": 413492, "epoch": 4981} {"train_loss": -26.578290939331055, "global_step": 413493, "epoch": 4981} {"train_loss": -26.584455490112305, "global_step": 413494, "epoch": 4981} {"train_loss": -26.3956298828125, "global_step": 413495, "epoch": 4981} {"train_loss": -26.633045196533203, "global_step": 413496, "epoch": 4981} {"train_loss": -27.262887954711914, "global_step": 413497, "epoch": 4981} {"train_loss": -26.756818771362305, "global_step": 413498, "epoch": 4981} {"train_loss": -26.70979118347168, "global_step": 413499, "epoch": 4981} {"train_loss": -26.507917404174805, "global_step": 413500, "epoch": 4981} {"train_loss": -26.66840171813965, "global_step": 413501, "epoch": 4981} {"train_loss": -26.52445411682129, "global_step": 413502, "epoch": 4981} {"train_loss": -26.043725967407227, "global_step": 413503, "epoch": 4981} {"train_loss": -26.820470809936523, "global_step": 413504, "epoch": 4981} {"train_loss": -26.587754421923535, "global_step": 413505, "epoch": 4981, "val_loss": 6577298.0} {"train_loss": -25.54892349243164, "global_step": 413506, "epoch": 4982} {"train_loss": -26.11029624938965, "global_step": 413507, "epoch": 4982} {"train_loss": -26.111730575561523, "global_step": 413508, "epoch": 4982} {"train_loss": -25.77457618713379, "global_step": 413509, "epoch": 4982} {"train_loss": -26.106769561767578, "global_step": 413510, "epoch": 4982} {"train_loss": -26.00625991821289, "global_step": 413511, "epoch": 4982} {"train_loss": -26.306005477905273, "global_step": 413512, "epoch": 4982} {"train_loss": -26.087833404541016, "global_step": 413513, "epoch": 4982} {"train_loss": -26.61321449279785, "global_step": 413514, "epoch": 4982} {"train_loss": -25.842939376831055, "global_step": 413515, "epoch": 4982} {"train_loss": -26.188983917236328, "global_step": 413516, "epoch": 4982} {"train_loss": -25.93707275390625, "global_step": 413517, "epoch": 4982} {"train_loss": -26.46327018737793, "global_step": 413518, "epoch": 4982} {"train_loss": -26.172260284423828, "global_step": 413519, "epoch": 4982} {"train_loss": -26.267730712890625, "global_step": 413520, "epoch": 4982} {"train_loss": -26.568449020385742, "global_step": 413521, "epoch": 4982} {"train_loss": -26.54743003845215, "global_step": 413522, "epoch": 4982} {"train_loss": -26.6826171875, "global_step": 413523, "epoch": 4982} {"train_loss": -26.23224449157715, "global_step": 413524, "epoch": 4982} {"train_loss": -26.80926513671875, "global_step": 413525, "epoch": 4982} {"train_loss": -26.6468448638916, "global_step": 413526, "epoch": 4982} {"train_loss": -26.719745635986328, "global_step": 413527, "epoch": 4982} {"train_loss": -26.29306411743164, "global_step": 413528, "epoch": 4982} {"train_loss": -26.913150787353516, "global_step": 413529, "epoch": 4982} {"train_loss": -26.394351959228516, "global_step": 413530, "epoch": 4982} {"train_loss": -26.103559494018555, "global_step": 413531, "epoch": 4982} {"train_loss": -26.490747451782227, "global_step": 413532, "epoch": 4982} {"train_loss": -26.689512252807617, "global_step": 413533, "epoch": 4982} {"train_loss": -26.39837074279785, "global_step": 413534, "epoch": 4982} {"train_loss": -26.4774169921875, "global_step": 413535, "epoch": 4982} {"train_loss": -27.015661239624023, "global_step": 413536, "epoch": 4982} {"train_loss": -26.628467559814453, "global_step": 413537, "epoch": 4982} {"train_loss": -26.37912940979004, "global_step": 413538, "epoch": 4982} {"train_loss": -26.634931564331055, "global_step": 413539, "epoch": 4982} {"train_loss": -26.401473999023438, "global_step": 413540, "epoch": 4982} {"train_loss": -26.259809494018555, "global_step": 413541, "epoch": 4982} {"train_loss": -26.689990997314453, "global_step": 413542, "epoch": 4982} {"train_loss": -26.797657012939453, "global_step": 413543, "epoch": 4982} {"train_loss": -26.706119537353516, "global_step": 413544, "epoch": 4982} {"train_loss": -26.5770320892334, "global_step": 413545, "epoch": 4982} {"train_loss": -26.628498077392578, "global_step": 413546, "epoch": 4982} {"train_loss": -26.791040420532227, "global_step": 413547, "epoch": 4982} {"train_loss": -26.859088897705078, "global_step": 413548, "epoch": 4982} {"train_loss": -26.97419548034668, "global_step": 413549, "epoch": 4982} {"train_loss": -26.79330825805664, "global_step": 413550, "epoch": 4982} {"train_loss": -26.673877716064453, "global_step": 413551, "epoch": 4982} {"train_loss": -26.631460189819336, "global_step": 413552, "epoch": 4982} {"train_loss": -26.97413444519043, "global_step": 413553, "epoch": 4982} {"train_loss": -26.881927490234375, "global_step": 413554, "epoch": 4982} {"train_loss": -27.070219039916992, "global_step": 413555, "epoch": 4982} {"train_loss": -26.599960327148438, "global_step": 413556, "epoch": 4982} {"train_loss": -27.048383712768555, "global_step": 413557, "epoch": 4982} {"train_loss": -26.900251388549805, "global_step": 413558, "epoch": 4982} {"train_loss": -27.04819107055664, "global_step": 413559, "epoch": 4982} {"train_loss": -26.297582626342773, "global_step": 413560, "epoch": 4982} {"train_loss": -26.497976303100586, "global_step": 413561, "epoch": 4982} {"train_loss": -26.703744888305664, "global_step": 413562, "epoch": 4982} {"train_loss": -26.5816650390625, "global_step": 413563, "epoch": 4982} {"train_loss": -26.36115837097168, "global_step": 413564, "epoch": 4982} {"train_loss": -26.887243270874023, "global_step": 413565, "epoch": 4982} {"train_loss": -26.551898956298828, "global_step": 413566, "epoch": 4982} {"train_loss": -26.548986434936523, "global_step": 413567, "epoch": 4982} {"train_loss": -26.845172882080078, "global_step": 413568, "epoch": 4982} {"train_loss": -26.394699096679688, "global_step": 413569, "epoch": 4982} {"train_loss": -26.657312393188477, "global_step": 413570, "epoch": 4982} {"train_loss": -26.52931022644043, "global_step": 413571, "epoch": 4982} {"train_loss": -27.045581817626953, "global_step": 413572, "epoch": 4982} {"train_loss": -26.76506996154785, "global_step": 413573, "epoch": 4982} {"train_loss": -26.476001739501953, "global_step": 413574, "epoch": 4982} {"train_loss": -26.60346794128418, "global_step": 413575, "epoch": 4982} {"train_loss": -26.76117515563965, "global_step": 413576, "epoch": 4982} {"train_loss": -26.879087448120117, "global_step": 413577, "epoch": 4982} {"train_loss": -26.703832626342773, "global_step": 413578, "epoch": 4982} {"train_loss": -26.543249130249023, "global_step": 413579, "epoch": 4982} {"train_loss": -27.095687866210938, "global_step": 413580, "epoch": 4982} {"train_loss": -27.179590225219727, "global_step": 413581, "epoch": 4982} {"train_loss": -26.7037410736084, "global_step": 413582, "epoch": 4982} {"train_loss": -27.156818389892578, "global_step": 413583, "epoch": 4982} {"train_loss": -26.37677001953125, "global_step": 413584, "epoch": 4982} {"train_loss": -26.784582138061523, "global_step": 413585, "epoch": 4982} {"train_loss": -26.6016902923584, "global_step": 413586, "epoch": 4982} {"train_loss": -26.98566246032715, "global_step": 413587, "epoch": 4982} {"train_loss": -26.57926993772208, "global_step": 413588, "epoch": 4982, "val_loss": 6561659.0} {"train_loss": -25.49751091003418, "global_step": 413589, "epoch": 4983} {"train_loss": -25.565404891967773, "global_step": 413590, "epoch": 4983} {"train_loss": -25.928625106811523, "global_step": 413591, "epoch": 4983} {"train_loss": -26.612085342407227, "global_step": 413592, "epoch": 4983} {"train_loss": -26.042692184448242, "global_step": 413593, "epoch": 4983} {"train_loss": -26.55304527282715, "global_step": 413594, "epoch": 4983} {"train_loss": -26.628713607788086, "global_step": 413595, "epoch": 4983} {"train_loss": -26.093917846679688, "global_step": 413596, "epoch": 4983} {"train_loss": -26.374256134033203, "global_step": 413597, "epoch": 4983} {"train_loss": -26.803558349609375, "global_step": 413598, "epoch": 4983} {"train_loss": -26.60525894165039, "global_step": 413599, "epoch": 4983} {"train_loss": -26.431669235229492, "global_step": 413600, "epoch": 4983} {"train_loss": -26.568082809448242, "global_step": 413601, "epoch": 4983} {"train_loss": -26.50081443786621, "global_step": 413602, "epoch": 4983} {"train_loss": -26.25568962097168, "global_step": 413603, "epoch": 4983} {"train_loss": -26.358739852905273, "global_step": 413604, "epoch": 4983} {"train_loss": -26.305728912353516, "global_step": 413605, "epoch": 4983} {"train_loss": -26.656402587890625, "global_step": 413606, "epoch": 4983} {"train_loss": -26.725574493408203, "global_step": 413607, "epoch": 4983} {"train_loss": -26.738813400268555, "global_step": 413608, "epoch": 4983} {"train_loss": -26.983991622924805, "global_step": 413609, "epoch": 4983} {"train_loss": -26.63250160217285, "global_step": 413610, "epoch": 4983} {"train_loss": -26.89834976196289, "global_step": 413611, "epoch": 4983} {"train_loss": -26.38343620300293, "global_step": 413612, "epoch": 4983} {"train_loss": -26.995166778564453, "global_step": 413613, "epoch": 4983} {"train_loss": -26.516860961914062, "global_step": 413614, "epoch": 4983} {"train_loss": -26.822330474853516, "global_step": 413615, "epoch": 4983} {"train_loss": -26.637847900390625, "global_step": 413616, "epoch": 4983} {"train_loss": -26.931058883666992, "global_step": 413617, "epoch": 4983} {"train_loss": -26.919921875, "global_step": 413618, "epoch": 4983} {"train_loss": -26.659631729125977, "global_step": 413619, "epoch": 4983} {"train_loss": -26.426252365112305, "global_step": 413620, "epoch": 4983} {"train_loss": -26.824731826782227, "global_step": 413621, "epoch": 4983} {"train_loss": -26.8662166595459, "global_step": 413622, "epoch": 4983} {"train_loss": -26.63960075378418, "global_step": 413623, "epoch": 4983} {"train_loss": -26.682828903198242, "global_step": 413624, "epoch": 4983} {"train_loss": -26.68230628967285, "global_step": 413625, "epoch": 4983} {"train_loss": -26.84980583190918, "global_step": 413626, "epoch": 4983} {"train_loss": -26.92103385925293, "global_step": 413627, "epoch": 4983} {"train_loss": -26.916852951049805, "global_step": 413628, "epoch": 4983} {"train_loss": -26.858600616455078, "global_step": 413629, "epoch": 4983} {"train_loss": -26.687936782836914, "global_step": 413630, "epoch": 4983} {"train_loss": -26.892902374267578, "global_step": 413631, "epoch": 4983} {"train_loss": -26.639631271362305, "global_step": 413632, "epoch": 4983} {"train_loss": -27.045501708984375, "global_step": 413633, "epoch": 4983} {"train_loss": -27.301908493041992, "global_step": 413634, "epoch": 4983} {"train_loss": -27.06287956237793, "global_step": 413635, "epoch": 4983} {"train_loss": -26.93562889099121, "global_step": 413636, "epoch": 4983} {"train_loss": -26.83612060546875, "global_step": 413637, "epoch": 4983} {"train_loss": -26.892114639282227, "global_step": 413638, "epoch": 4983} {"train_loss": -27.139286041259766, "global_step": 413639, "epoch": 4983} {"train_loss": -26.677106857299805, "global_step": 413640, "epoch": 4983} {"train_loss": -26.675886154174805, "global_step": 413641, "epoch": 4983} {"train_loss": -26.51889991760254, "global_step": 413642, "epoch": 4983} {"train_loss": -26.80341148376465, "global_step": 413643, "epoch": 4983} {"train_loss": -27.065814971923828, "global_step": 413644, "epoch": 4983} {"train_loss": -26.800058364868164, "global_step": 413645, "epoch": 4983} {"train_loss": -26.525922775268555, "global_step": 413646, "epoch": 4983} {"train_loss": -26.1126766204834, "global_step": 413647, "epoch": 4983} {"train_loss": -25.722919464111328, "global_step": 413648, "epoch": 4983} {"train_loss": -26.200361251831055, "global_step": 413649, "epoch": 4983} {"train_loss": -26.58194923400879, "global_step": 413650, "epoch": 4983} {"train_loss": -26.465795516967773, "global_step": 413651, "epoch": 4983} {"train_loss": -26.682861328125, "global_step": 413652, "epoch": 4983} {"train_loss": -26.324438095092773, "global_step": 413653, "epoch": 4983} {"train_loss": -26.474802017211914, "global_step": 413654, "epoch": 4983} {"train_loss": -27.19379234313965, "global_step": 413655, "epoch": 4983} {"train_loss": -26.803617477416992, "global_step": 413656, "epoch": 4983} {"train_loss": -26.777236938476562, "global_step": 413657, "epoch": 4983} {"train_loss": -26.816162109375, "global_step": 413658, "epoch": 4983} {"train_loss": -26.703907012939453, "global_step": 413659, "epoch": 4983} {"train_loss": -26.882827758789062, "global_step": 413660, "epoch": 4983} {"train_loss": -26.330860137939453, "global_step": 413661, "epoch": 4983} {"train_loss": -26.82478141784668, "global_step": 413662, "epoch": 4983} {"train_loss": -26.672021865844727, "global_step": 413663, "epoch": 4983} {"train_loss": -26.825031280517578, "global_step": 413664, "epoch": 4983} {"train_loss": -26.508380889892578, "global_step": 413665, "epoch": 4983} {"train_loss": -26.787322998046875, "global_step": 413666, "epoch": 4983} {"train_loss": -26.747486114501953, "global_step": 413667, "epoch": 4983} {"train_loss": -26.411178588867188, "global_step": 413668, "epoch": 4983} {"train_loss": -26.89642333984375, "global_step": 413669, "epoch": 4983} {"train_loss": -26.906415939331055, "global_step": 413670, "epoch": 4983} {"train_loss": -26.64414566683482, "global_step": 413671, "epoch": 4983, "val_loss": 6505355.0} {"train_loss": -26.45916748046875, "global_step": 413672, "epoch": 4984} {"train_loss": -26.31298828125, "global_step": 413673, "epoch": 4984} {"train_loss": -26.39814567565918, "global_step": 413674, "epoch": 4984} {"train_loss": -26.701629638671875, "global_step": 413675, "epoch": 4984} {"train_loss": -26.796192169189453, "global_step": 413676, "epoch": 4984} {"train_loss": -26.74968910217285, "global_step": 413677, "epoch": 4984} {"train_loss": -26.710119247436523, "global_step": 413678, "epoch": 4984} {"train_loss": -26.49326515197754, "global_step": 413679, "epoch": 4984} {"train_loss": -27.14788246154785, "global_step": 413680, "epoch": 4984} {"train_loss": -26.875696182250977, "global_step": 413681, "epoch": 4984} {"train_loss": -26.597726821899414, "global_step": 413682, "epoch": 4984} {"train_loss": -26.42693519592285, "global_step": 413683, "epoch": 4984} {"train_loss": -26.977615356445312, "global_step": 413684, "epoch": 4984} {"train_loss": -26.478357315063477, "global_step": 413685, "epoch": 4984} {"train_loss": -26.563495635986328, "global_step": 413686, "epoch": 4984} {"train_loss": -26.480077743530273, "global_step": 413687, "epoch": 4984} {"train_loss": -27.209930419921875, "global_step": 413688, "epoch": 4984} {"train_loss": -27.013696670532227, "global_step": 413689, "epoch": 4984} {"train_loss": -26.972314834594727, "global_step": 413690, "epoch": 4984} {"train_loss": -26.679534912109375, "global_step": 413691, "epoch": 4984} {"train_loss": -26.736387252807617, "global_step": 413692, "epoch": 4984} {"train_loss": -26.48628044128418, "global_step": 413693, "epoch": 4984} {"train_loss": -26.815595626831055, "global_step": 413694, "epoch": 4984} {"train_loss": -27.0146427154541, "global_step": 413695, "epoch": 4984} {"train_loss": -27.04363441467285, "global_step": 413696, "epoch": 4984} {"train_loss": -26.71527671813965, "global_step": 413697, "epoch": 4984} {"train_loss": -26.900360107421875, "global_step": 413698, "epoch": 4984} {"train_loss": -26.88973045349121, "global_step": 413699, "epoch": 4984} {"train_loss": -26.9060115814209, "global_step": 413700, "epoch": 4984} {"train_loss": -26.448415756225586, "global_step": 413701, "epoch": 4984} {"train_loss": -26.386505126953125, "global_step": 413702, "epoch": 4984} {"train_loss": -26.29569435119629, "global_step": 413703, "epoch": 4984} {"train_loss": -26.19257164001465, "global_step": 413704, "epoch": 4984} {"train_loss": -26.428308486938477, "global_step": 413705, "epoch": 4984} {"train_loss": -26.785430908203125, "global_step": 413706, "epoch": 4984} {"train_loss": -26.931089401245117, "global_step": 413707, "epoch": 4984} {"train_loss": -26.601703643798828, "global_step": 413708, "epoch": 4984} {"train_loss": -26.047916412353516, "global_step": 413709, "epoch": 4984} {"train_loss": -26.421802520751953, "global_step": 413710, "epoch": 4984} {"train_loss": -26.186065673828125, "global_step": 413711, "epoch": 4984} {"train_loss": -26.663061141967773, "global_step": 413712, "epoch": 4984} {"train_loss": -26.858285903930664, "global_step": 413713, "epoch": 4984} {"train_loss": -26.896026611328125, "global_step": 413714, "epoch": 4984} {"train_loss": -26.653915405273438, "global_step": 413715, "epoch": 4984} {"train_loss": -26.617109298706055, "global_step": 413716, "epoch": 4984} {"train_loss": -26.713485717773438, "global_step": 413717, "epoch": 4984} {"train_loss": -26.46746253967285, "global_step": 413718, "epoch": 4984} {"train_loss": -26.705158233642578, "global_step": 413719, "epoch": 4984} {"train_loss": -26.696630477905273, "global_step": 413720, "epoch": 4984} {"train_loss": -26.70682716369629, "global_step": 413721, "epoch": 4984} {"train_loss": -26.589588165283203, "global_step": 413722, "epoch": 4984} {"train_loss": -27.010345458984375, "global_step": 413723, "epoch": 4984} {"train_loss": -26.962635040283203, "global_step": 413724, "epoch": 4984} {"train_loss": -26.9090633392334, "global_step": 413725, "epoch": 4984} {"train_loss": -26.824453353881836, "global_step": 413726, "epoch": 4984} {"train_loss": -26.606597900390625, "global_step": 413727, "epoch": 4984} {"train_loss": -27.008630752563477, "global_step": 413728, "epoch": 4984} {"train_loss": -26.693937301635742, "global_step": 413729, "epoch": 4984} {"train_loss": -26.45465660095215, "global_step": 413730, "epoch": 4984} {"train_loss": -26.65715980529785, "global_step": 413731, "epoch": 4984} {"train_loss": -26.833066940307617, "global_step": 413732, "epoch": 4984} {"train_loss": -26.832223892211914, "global_step": 413733, "epoch": 4984} {"train_loss": -26.673023223876953, "global_step": 413734, "epoch": 4984} {"train_loss": -26.24493980407715, "global_step": 413735, "epoch": 4984} {"train_loss": -26.819791793823242, "global_step": 413736, "epoch": 4984} {"train_loss": -26.68231773376465, "global_step": 413737, "epoch": 4984} {"train_loss": -26.820404052734375, "global_step": 413738, "epoch": 4984} {"train_loss": -26.815998077392578, "global_step": 413739, "epoch": 4984} {"train_loss": -26.727432250976562, "global_step": 413740, "epoch": 4984} {"train_loss": -26.64582633972168, "global_step": 413741, "epoch": 4984} {"train_loss": -26.499780654907227, "global_step": 413742, "epoch": 4984} {"train_loss": -26.797658920288086, "global_step": 413743, "epoch": 4984} {"train_loss": -26.81218910217285, "global_step": 413744, "epoch": 4984} {"train_loss": -26.645544052124023, "global_step": 413745, "epoch": 4984} {"train_loss": -26.77277946472168, "global_step": 413746, "epoch": 4984} {"train_loss": -26.809232711791992, "global_step": 413747, "epoch": 4984} {"train_loss": -26.95182228088379, "global_step": 413748, "epoch": 4984} {"train_loss": -26.585708618164062, "global_step": 413749, "epoch": 4984} {"train_loss": -27.013059616088867, "global_step": 413750, "epoch": 4984} {"train_loss": -26.70318031311035, "global_step": 413751, "epoch": 4984} {"train_loss": -26.894113540649414, "global_step": 413752, "epoch": 4984} {"train_loss": -26.978235244750977, "global_step": 413753, "epoch": 4984} {"train_loss": -26.697503262255566, "global_step": 413754, "epoch": 4984, "val_loss": 6510257.0} {"train_loss": -25.7021427154541, "global_step": 413755, "epoch": 4985} {"train_loss": -25.74738121032715, "global_step": 413756, "epoch": 4985} {"train_loss": -25.662336349487305, "global_step": 413757, "epoch": 4985} {"train_loss": -25.678665161132812, "global_step": 413758, "epoch": 4985} {"train_loss": -26.017786026000977, "global_step": 413759, "epoch": 4985} {"train_loss": -26.440908432006836, "global_step": 413760, "epoch": 4985} {"train_loss": -25.465816497802734, "global_step": 413761, "epoch": 4985} {"train_loss": -26.021570205688477, "global_step": 413762, "epoch": 4985} {"train_loss": -25.73355484008789, "global_step": 413763, "epoch": 4985} {"train_loss": -26.225561141967773, "global_step": 413764, "epoch": 4985} {"train_loss": -26.19972801208496, "global_step": 413765, "epoch": 4985} {"train_loss": -26.32025718688965, "global_step": 413766, "epoch": 4985} {"train_loss": -26.68284034729004, "global_step": 413767, "epoch": 4985} {"train_loss": -26.418432235717773, "global_step": 413768, "epoch": 4985} {"train_loss": -26.17051124572754, "global_step": 413769, "epoch": 4985} {"train_loss": -26.86374855041504, "global_step": 413770, "epoch": 4985} {"train_loss": -26.163440704345703, "global_step": 413771, "epoch": 4985} {"train_loss": -26.595224380493164, "global_step": 413772, "epoch": 4985} {"train_loss": -26.4639949798584, "global_step": 413773, "epoch": 4985} {"train_loss": -26.557348251342773, "global_step": 413774, "epoch": 4985} {"train_loss": -26.562341690063477, "global_step": 413775, "epoch": 4985} {"train_loss": -26.539331436157227, "global_step": 413776, "epoch": 4985} {"train_loss": -26.491987228393555, "global_step": 413777, "epoch": 4985} {"train_loss": -26.657257080078125, "global_step": 413778, "epoch": 4985} {"train_loss": -26.18671989440918, "global_step": 413779, "epoch": 4985} {"train_loss": -26.659317016601562, "global_step": 413780, "epoch": 4985} {"train_loss": -26.499958038330078, "global_step": 413781, "epoch": 4985} {"train_loss": -26.587646484375, "global_step": 413782, "epoch": 4985} {"train_loss": -26.84010887145996, "global_step": 413783, "epoch": 4985} {"train_loss": -26.713891983032227, "global_step": 413784, "epoch": 4985} {"train_loss": -26.615768432617188, "global_step": 413785, "epoch": 4985} {"train_loss": -26.859792709350586, "global_step": 413786, "epoch": 4985} {"train_loss": -26.769927978515625, "global_step": 413787, "epoch": 4985} {"train_loss": -26.733137130737305, "global_step": 413788, "epoch": 4985} {"train_loss": -26.631439208984375, "global_step": 413789, "epoch": 4985} {"train_loss": -27.06302833557129, "global_step": 413790, "epoch": 4985} {"train_loss": -26.667707443237305, "global_step": 413791, "epoch": 4985} {"train_loss": -26.612096786499023, "global_step": 413792, "epoch": 4985} {"train_loss": -26.843170166015625, "global_step": 413793, "epoch": 4985} {"train_loss": -26.55376625061035, "global_step": 413794, "epoch": 4985} {"train_loss": -26.807477951049805, "global_step": 413795, "epoch": 4985} {"train_loss": -27.016393661499023, "global_step": 413796, "epoch": 4985} {"train_loss": -26.747451782226562, "global_step": 413797, "epoch": 4985} {"train_loss": -26.860519409179688, "global_step": 413798, "epoch": 4985} {"train_loss": -26.76130485534668, "global_step": 413799, "epoch": 4985} {"train_loss": -26.904809951782227, "global_step": 413800, "epoch": 4985} {"train_loss": -27.037738800048828, "global_step": 413801, "epoch": 4985} {"train_loss": -27.090967178344727, "global_step": 413802, "epoch": 4985} {"train_loss": -26.684858322143555, "global_step": 413803, "epoch": 4985} {"train_loss": -26.73212242126465, "global_step": 413804, "epoch": 4985} {"train_loss": -27.143827438354492, "global_step": 413805, "epoch": 4985} {"train_loss": -27.1912784576416, "global_step": 413806, "epoch": 4985} {"train_loss": -27.0837459564209, "global_step": 413807, "epoch": 4985} {"train_loss": -27.024145126342773, "global_step": 413808, "epoch": 4985} {"train_loss": -26.83223533630371, "global_step": 413809, "epoch": 4985} {"train_loss": -26.703632354736328, "global_step": 413810, "epoch": 4985} {"train_loss": -26.782672882080078, "global_step": 413811, "epoch": 4985} {"train_loss": -26.3280029296875, "global_step": 413812, "epoch": 4985} {"train_loss": -26.63441276550293, "global_step": 413813, "epoch": 4985} {"train_loss": -26.81195640563965, "global_step": 413814, "epoch": 4985} {"train_loss": -26.9326229095459, "global_step": 413815, "epoch": 4985} {"train_loss": -26.658370971679688, "global_step": 413816, "epoch": 4985} {"train_loss": -26.8636417388916, "global_step": 413817, "epoch": 4985} {"train_loss": -26.5129337310791, "global_step": 413818, "epoch": 4985} {"train_loss": -26.5855770111084, "global_step": 413819, "epoch": 4985} {"train_loss": -26.63215446472168, "global_step": 413820, "epoch": 4985} {"train_loss": -26.897357940673828, "global_step": 413821, "epoch": 4985} {"train_loss": -26.8356876373291, "global_step": 413822, "epoch": 4985} {"train_loss": -26.92011070251465, "global_step": 413823, "epoch": 4985} {"train_loss": -26.595340728759766, "global_step": 413824, "epoch": 4985} {"train_loss": -26.67107582092285, "global_step": 413825, "epoch": 4985} {"train_loss": -26.390228271484375, "global_step": 413826, "epoch": 4985} {"train_loss": -26.54859733581543, "global_step": 413827, "epoch": 4985} {"train_loss": -26.549169540405273, "global_step": 413828, "epoch": 4985} {"train_loss": -26.554563522338867, "global_step": 413829, "epoch": 4985} {"train_loss": -26.775861740112305, "global_step": 413830, "epoch": 4985} {"train_loss": -26.71710777282715, "global_step": 413831, "epoch": 4985} {"train_loss": -26.88372802734375, "global_step": 413832, "epoch": 4985} {"train_loss": -26.87824821472168, "global_step": 413833, "epoch": 4985} {"train_loss": -27.01934242248535, "global_step": 413834, "epoch": 4985} {"train_loss": -26.988967895507812, "global_step": 413835, "epoch": 4985} {"train_loss": -26.787817001342773, "global_step": 413836, "epoch": 4985} {"train_loss": -26.60207518612046, "global_step": 413837, "epoch": 4985, "val_loss": 6530273.0} {"train_loss": -26.628610610961914, "global_step": 413838, "epoch": 4986} {"train_loss": -26.461286544799805, "global_step": 413839, "epoch": 4986} {"train_loss": -26.510705947875977, "global_step": 413840, "epoch": 4986} {"train_loss": -26.415119171142578, "global_step": 413841, "epoch": 4986} {"train_loss": -26.73639488220215, "global_step": 413842, "epoch": 4986} {"train_loss": -26.573110580444336, "global_step": 413843, "epoch": 4986} {"train_loss": -26.04261589050293, "global_step": 413844, "epoch": 4986} {"train_loss": -25.84659767150879, "global_step": 413845, "epoch": 4986} {"train_loss": -27.030536651611328, "global_step": 413846, "epoch": 4986} {"train_loss": -26.420684814453125, "global_step": 413847, "epoch": 4986} {"train_loss": -26.303558349609375, "global_step": 413848, "epoch": 4986} {"train_loss": -26.6516170501709, "global_step": 413849, "epoch": 4986} {"train_loss": -26.699560165405273, "global_step": 413850, "epoch": 4986} {"train_loss": -26.44038963317871, "global_step": 413851, "epoch": 4986} {"train_loss": -26.8085994720459, "global_step": 413852, "epoch": 4986} {"train_loss": -26.496423721313477, "global_step": 413853, "epoch": 4986} {"train_loss": -26.257949829101562, "global_step": 413854, "epoch": 4986} {"train_loss": -26.545886993408203, "global_step": 413855, "epoch": 4986} {"train_loss": -26.583417892456055, "global_step": 413856, "epoch": 4986} {"train_loss": -26.197946548461914, "global_step": 413857, "epoch": 4986} {"train_loss": -26.700727462768555, "global_step": 413858, "epoch": 4986} {"train_loss": -26.60089111328125, "global_step": 413859, "epoch": 4986} {"train_loss": -27.127187728881836, "global_step": 413860, "epoch": 4986} {"train_loss": -26.6461181640625, "global_step": 413861, "epoch": 4986} {"train_loss": -27.04732322692871, "global_step": 413862, "epoch": 4986} {"train_loss": -26.946659088134766, "global_step": 413863, "epoch": 4986} {"train_loss": -26.781747817993164, "global_step": 413864, "epoch": 4986} {"train_loss": -26.75691032409668, "global_step": 413865, "epoch": 4986} {"train_loss": -26.524789810180664, "global_step": 413866, "epoch": 4986} {"train_loss": -26.679101943969727, "global_step": 413867, "epoch": 4986} {"train_loss": -26.885046005249023, "global_step": 413868, "epoch": 4986} {"train_loss": -26.883319854736328, "global_step": 413869, "epoch": 4986} {"train_loss": -27.04068946838379, "global_step": 413870, "epoch": 4986} {"train_loss": -26.81513786315918, "global_step": 413871, "epoch": 4986} {"train_loss": -26.489843368530273, "global_step": 413872, "epoch": 4986} {"train_loss": -27.151281356811523, "global_step": 413873, "epoch": 4986} {"train_loss": -26.74714469909668, "global_step": 413874, "epoch": 4986} {"train_loss": -26.382421493530273, "global_step": 413875, "epoch": 4986} {"train_loss": -26.843250274658203, "global_step": 413876, "epoch": 4986} {"train_loss": -26.880258560180664, "global_step": 413877, "epoch": 4986} {"train_loss": -26.827157974243164, "global_step": 413878, "epoch": 4986} {"train_loss": -26.380847930908203, "global_step": 413879, "epoch": 4986} {"train_loss": -27.23870849609375, "global_step": 413880, "epoch": 4986} {"train_loss": -26.745288848876953, "global_step": 413881, "epoch": 4986} {"train_loss": -26.379932403564453, "global_step": 413882, "epoch": 4986} {"train_loss": -26.62273597717285, "global_step": 413883, "epoch": 4986} {"train_loss": -26.051626205444336, "global_step": 413884, "epoch": 4986} {"train_loss": -27.001556396484375, "global_step": 413885, "epoch": 4986} {"train_loss": -26.57635498046875, "global_step": 413886, "epoch": 4986} {"train_loss": -26.6124210357666, "global_step": 413887, "epoch": 4986} {"train_loss": -26.835535049438477, "global_step": 413888, "epoch": 4986} {"train_loss": -26.774311065673828, "global_step": 413889, "epoch": 4986} {"train_loss": -26.91229820251465, "global_step": 413890, "epoch": 4986} {"train_loss": -26.395008087158203, "global_step": 413891, "epoch": 4986} {"train_loss": -26.526264190673828, "global_step": 413892, "epoch": 4986} {"train_loss": -26.986478805541992, "global_step": 413893, "epoch": 4986} {"train_loss": -26.569793701171875, "global_step": 413894, "epoch": 4986} {"train_loss": -26.928741455078125, "global_step": 413895, "epoch": 4986} {"train_loss": -26.729482650756836, "global_step": 413896, "epoch": 4986} {"train_loss": -26.265207290649414, "global_step": 413897, "epoch": 4986} {"train_loss": -26.256635665893555, "global_step": 413898, "epoch": 4986} {"train_loss": -26.3527889251709, "global_step": 413899, "epoch": 4986} {"train_loss": -26.883127212524414, "global_step": 413900, "epoch": 4986} {"train_loss": -26.69333267211914, "global_step": 413901, "epoch": 4986} {"train_loss": -26.71063232421875, "global_step": 413902, "epoch": 4986} {"train_loss": -26.81162452697754, "global_step": 413903, "epoch": 4986} {"train_loss": -26.73833656311035, "global_step": 413904, "epoch": 4986} {"train_loss": -26.839828491210938, "global_step": 413905, "epoch": 4986} {"train_loss": -26.62522315979004, "global_step": 413906, "epoch": 4986} {"train_loss": -26.616119384765625, "global_step": 413907, "epoch": 4986} {"train_loss": -27.04278564453125, "global_step": 413908, "epoch": 4986} {"train_loss": -26.90925407409668, "global_step": 413909, "epoch": 4986} {"train_loss": -26.65751075744629, "global_step": 413910, "epoch": 4986} {"train_loss": -26.849185943603516, "global_step": 413911, "epoch": 4986} {"train_loss": -27.056310653686523, "global_step": 413912, "epoch": 4986} {"train_loss": -26.9443359375, "global_step": 413913, "epoch": 4986} {"train_loss": -26.74359703063965, "global_step": 413914, "epoch": 4986} {"train_loss": -26.629438400268555, "global_step": 413915, "epoch": 4986} {"train_loss": -26.529382705688477, "global_step": 413916, "epoch": 4986} {"train_loss": -26.7506103515625, "global_step": 413917, "epoch": 4986} {"train_loss": -26.73285484313965, "global_step": 413918, "epoch": 4986} {"train_loss": -26.535303115844727, "global_step": 413919, "epoch": 4986} {"train_loss": -26.686018380774073, "global_step": 413920, "epoch": 4986, "val_loss": 6581851.5} {"train_loss": -26.620548248291016, "global_step": 413921, "epoch": 4987} {"train_loss": -26.44538688659668, "global_step": 413922, "epoch": 4987} {"train_loss": -26.450658798217773, "global_step": 413923, "epoch": 4987} {"train_loss": -26.689462661743164, "global_step": 413924, "epoch": 4987} {"train_loss": -26.581884384155273, "global_step": 413925, "epoch": 4987} {"train_loss": -26.736576080322266, "global_step": 413926, "epoch": 4987} {"train_loss": -26.555496215820312, "global_step": 413927, "epoch": 4987} {"train_loss": -26.645063400268555, "global_step": 413928, "epoch": 4987} {"train_loss": -26.297077178955078, "global_step": 413929, "epoch": 4987} {"train_loss": -26.429044723510742, "global_step": 413930, "epoch": 4987} {"train_loss": -26.551258087158203, "global_step": 413931, "epoch": 4987} {"train_loss": -26.753400802612305, "global_step": 413932, "epoch": 4987} {"train_loss": -26.710660934448242, "global_step": 413933, "epoch": 4987} {"train_loss": -26.495702743530273, "global_step": 413934, "epoch": 4987} {"train_loss": -26.236255645751953, "global_step": 413935, "epoch": 4987} {"train_loss": -26.93048667907715, "global_step": 413936, "epoch": 4987} {"train_loss": -26.871551513671875, "global_step": 413937, "epoch": 4987} {"train_loss": -26.80341148376465, "global_step": 413938, "epoch": 4987} {"train_loss": -26.79473876953125, "global_step": 413939, "epoch": 4987} {"train_loss": -26.751935958862305, "global_step": 413940, "epoch": 4987} {"train_loss": -26.567291259765625, "global_step": 413941, "epoch": 4987} {"train_loss": -26.749191284179688, "global_step": 413942, "epoch": 4987} {"train_loss": -27.04758644104004, "global_step": 413943, "epoch": 4987} {"train_loss": -26.74900245666504, "global_step": 413944, "epoch": 4987} {"train_loss": -26.907470703125, "global_step": 413945, "epoch": 4987} {"train_loss": -26.762243270874023, "global_step": 413946, "epoch": 4987} {"train_loss": -26.909229278564453, "global_step": 413947, "epoch": 4987} {"train_loss": -26.718982696533203, "global_step": 413948, "epoch": 4987} {"train_loss": -26.80901527404785, "global_step": 413949, "epoch": 4987} {"train_loss": -26.893774032592773, "global_step": 413950, "epoch": 4987} {"train_loss": -26.60755729675293, "global_step": 413951, "epoch": 4987} {"train_loss": -26.370101928710938, "global_step": 413952, "epoch": 4987} {"train_loss": -26.47287368774414, "global_step": 413953, "epoch": 4987} {"train_loss": -26.818735122680664, "global_step": 413954, "epoch": 4987} {"train_loss": -26.942859649658203, "global_step": 413955, "epoch": 4987} {"train_loss": -26.923328399658203, "global_step": 413956, "epoch": 4987} {"train_loss": -26.63580894470215, "global_step": 413957, "epoch": 4987} {"train_loss": -26.812986373901367, "global_step": 413958, "epoch": 4987} {"train_loss": -26.820138931274414, "global_step": 413959, "epoch": 4987} {"train_loss": -26.991718292236328, "global_step": 413960, "epoch": 4987} {"train_loss": -26.015613555908203, "global_step": 413961, "epoch": 4987} {"train_loss": -26.836502075195312, "global_step": 413962, "epoch": 4987} {"train_loss": -26.747854232788086, "global_step": 413963, "epoch": 4987} {"train_loss": -26.611112594604492, "global_step": 413964, "epoch": 4987} {"train_loss": -27.289464950561523, "global_step": 413965, "epoch": 4987} {"train_loss": -26.923322677612305, "global_step": 413966, "epoch": 4987} {"train_loss": -26.453460693359375, "global_step": 413967, "epoch": 4987} {"train_loss": -27.068103790283203, "global_step": 413968, "epoch": 4987} {"train_loss": -26.40497398376465, "global_step": 413969, "epoch": 4987} {"train_loss": -26.67043113708496, "global_step": 413970, "epoch": 4987} {"train_loss": -26.461963653564453, "global_step": 413971, "epoch": 4987} {"train_loss": -26.69414710998535, "global_step": 413972, "epoch": 4987} {"train_loss": -26.858936309814453, "global_step": 413973, "epoch": 4987} {"train_loss": -26.77789878845215, "global_step": 413974, "epoch": 4987} {"train_loss": -27.060256958007812, "global_step": 413975, "epoch": 4987} {"train_loss": -26.603845596313477, "global_step": 413976, "epoch": 4987} {"train_loss": -26.713321685791016, "global_step": 413977, "epoch": 4987} {"train_loss": -26.66176414489746, "global_step": 413978, "epoch": 4987} {"train_loss": -26.525049209594727, "global_step": 413979, "epoch": 4987} {"train_loss": -26.52239418029785, "global_step": 413980, "epoch": 4987} {"train_loss": -26.369016647338867, "global_step": 413981, "epoch": 4987} {"train_loss": -26.787311553955078, "global_step": 413982, "epoch": 4987} {"train_loss": -26.568954467773438, "global_step": 413983, "epoch": 4987} {"train_loss": -26.802061080932617, "global_step": 413984, "epoch": 4987} {"train_loss": -26.74591636657715, "global_step": 413985, "epoch": 4987} {"train_loss": -26.6997013092041, "global_step": 413986, "epoch": 4987} {"train_loss": -26.606901168823242, "global_step": 413987, "epoch": 4987} {"train_loss": -26.583358764648438, "global_step": 413988, "epoch": 4987} {"train_loss": -26.871891021728516, "global_step": 413989, "epoch": 4987} {"train_loss": -26.915658950805664, "global_step": 413990, "epoch": 4987} {"train_loss": -26.64723014831543, "global_step": 413991, "epoch": 4987} {"train_loss": -26.349454879760742, "global_step": 413992, "epoch": 4987} {"train_loss": -26.7675724029541, "global_step": 413993, "epoch": 4987} {"train_loss": -26.488195419311523, "global_step": 413994, "epoch": 4987} {"train_loss": -26.814441680908203, "global_step": 413995, "epoch": 4987} {"train_loss": -26.705907821655273, "global_step": 413996, "epoch": 4987} {"train_loss": -27.03019142150879, "global_step": 413997, "epoch": 4987} {"train_loss": -26.973453521728516, "global_step": 413998, "epoch": 4987} {"train_loss": -26.925161361694336, "global_step": 413999, "epoch": 4987} {"train_loss": -27.196945190429688, "global_step": 414000, "epoch": 4987} {"train_loss": -26.5658016204834, "global_step": 414001, "epoch": 4987} {"train_loss": -26.746536254882812, "global_step": 414002, "epoch": 4987} {"train_loss": -26.71745576054217, "global_step": 414003, "epoch": 4987, "val_loss": 6458772.0} {"train_loss": -25.768817901611328, "global_step": 414004, "epoch": 4988} {"train_loss": -24.6269474029541, "global_step": 414005, "epoch": 4988} {"train_loss": -25.546720504760742, "global_step": 414006, "epoch": 4988} {"train_loss": -26.071802139282227, "global_step": 414007, "epoch": 4988} {"train_loss": -25.55304718017578, "global_step": 414008, "epoch": 4988} {"train_loss": -26.03382682800293, "global_step": 414009, "epoch": 4988} {"train_loss": -26.292139053344727, "global_step": 414010, "epoch": 4988} {"train_loss": -25.89874839782715, "global_step": 414011, "epoch": 4988} {"train_loss": -25.960102081298828, "global_step": 414012, "epoch": 4988} {"train_loss": -25.8532657623291, "global_step": 414013, "epoch": 4988} {"train_loss": -26.20734977722168, "global_step": 414014, "epoch": 4988} {"train_loss": -26.051471710205078, "global_step": 414015, "epoch": 4988} {"train_loss": -26.281497955322266, "global_step": 414016, "epoch": 4988} {"train_loss": -26.357166290283203, "global_step": 414017, "epoch": 4988} {"train_loss": -26.00800132751465, "global_step": 414018, "epoch": 4988} {"train_loss": -26.22185707092285, "global_step": 414019, "epoch": 4988} {"train_loss": -25.73723793029785, "global_step": 414020, "epoch": 4988} {"train_loss": -26.28516960144043, "global_step": 414021, "epoch": 4988} {"train_loss": -26.3560733795166, "global_step": 414022, "epoch": 4988} {"train_loss": -26.29717445373535, "global_step": 414023, "epoch": 4988} {"train_loss": -26.369421005249023, "global_step": 414024, "epoch": 4988} {"train_loss": -26.145496368408203, "global_step": 414025, "epoch": 4988} {"train_loss": -26.581384658813477, "global_step": 414026, "epoch": 4988} {"train_loss": -26.46630859375, "global_step": 414027, "epoch": 4988} {"train_loss": -26.42377281188965, "global_step": 414028, "epoch": 4988} {"train_loss": -26.76861000061035, "global_step": 414029, "epoch": 4988} {"train_loss": -26.59551429748535, "global_step": 414030, "epoch": 4988} {"train_loss": -26.7635440826416, "global_step": 414031, "epoch": 4988} {"train_loss": -26.263370513916016, "global_step": 414032, "epoch": 4988} {"train_loss": -26.764453887939453, "global_step": 414033, "epoch": 4988} {"train_loss": -26.620471954345703, "global_step": 414034, "epoch": 4988} {"train_loss": -26.220264434814453, "global_step": 414035, "epoch": 4988} {"train_loss": -26.407133102416992, "global_step": 414036, "epoch": 4988} {"train_loss": -26.61762046813965, "global_step": 414037, "epoch": 4988} {"train_loss": -26.3170223236084, "global_step": 414038, "epoch": 4988} {"train_loss": -26.567615509033203, "global_step": 414039, "epoch": 4988} {"train_loss": -26.800018310546875, "global_step": 414040, "epoch": 4988} {"train_loss": -26.544763565063477, "global_step": 414041, "epoch": 4988} {"train_loss": -26.602689743041992, "global_step": 414042, "epoch": 4988} {"train_loss": -26.633411407470703, "global_step": 414043, "epoch": 4988} {"train_loss": -27.0259952545166, "global_step": 414044, "epoch": 4988} {"train_loss": -26.757129669189453, "global_step": 414045, "epoch": 4988} {"train_loss": -27.12796974182129, "global_step": 414046, "epoch": 4988} {"train_loss": -26.616437911987305, "global_step": 414047, "epoch": 4988} {"train_loss": -26.832029342651367, "global_step": 414048, "epoch": 4988} {"train_loss": -26.65277671813965, "global_step": 414049, "epoch": 4988} {"train_loss": -26.771886825561523, "global_step": 414050, "epoch": 4988} {"train_loss": -26.91595458984375, "global_step": 414051, "epoch": 4988} {"train_loss": -26.959646224975586, "global_step": 414052, "epoch": 4988} {"train_loss": -26.527448654174805, "global_step": 414053, "epoch": 4988} {"train_loss": -26.762434005737305, "global_step": 414054, "epoch": 4988} {"train_loss": -27.1094913482666, "global_step": 414055, "epoch": 4988} {"train_loss": -26.849109649658203, "global_step": 414056, "epoch": 4988} {"train_loss": -26.781076431274414, "global_step": 414057, "epoch": 4988} {"train_loss": -26.787878036499023, "global_step": 414058, "epoch": 4988} {"train_loss": -26.74798583984375, "global_step": 414059, "epoch": 4988} {"train_loss": -26.406391143798828, "global_step": 414060, "epoch": 4988} {"train_loss": -26.926055908203125, "global_step": 414061, "epoch": 4988} {"train_loss": -26.728422164916992, "global_step": 414062, "epoch": 4988} {"train_loss": -26.836532592773438, "global_step": 414063, "epoch": 4988} {"train_loss": -26.555578231811523, "global_step": 414064, "epoch": 4988} {"train_loss": -26.750675201416016, "global_step": 414065, "epoch": 4988} {"train_loss": -27.228897094726562, "global_step": 414066, "epoch": 4988} {"train_loss": -26.99574089050293, "global_step": 414067, "epoch": 4988} {"train_loss": -26.833303451538086, "global_step": 414068, "epoch": 4988} {"train_loss": -26.938039779663086, "global_step": 414069, "epoch": 4988} {"train_loss": -26.596250534057617, "global_step": 414070, "epoch": 4988} {"train_loss": -26.70587730407715, "global_step": 414071, "epoch": 4988} {"train_loss": -26.83247184753418, "global_step": 414072, "epoch": 4988} {"train_loss": -26.945825576782227, "global_step": 414073, "epoch": 4988} {"train_loss": -26.672927856445312, "global_step": 414074, "epoch": 4988} {"train_loss": -26.809595108032227, "global_step": 414075, "epoch": 4988} {"train_loss": -26.8026180267334, "global_step": 414076, "epoch": 4988} {"train_loss": -26.185163497924805, "global_step": 414077, "epoch": 4988} {"train_loss": -26.64607048034668, "global_step": 414078, "epoch": 4988} {"train_loss": -26.488739013671875, "global_step": 414079, "epoch": 4988} {"train_loss": -26.418039321899414, "global_step": 414080, "epoch": 4988} {"train_loss": -26.486547470092773, "global_step": 414081, "epoch": 4988} {"train_loss": -26.752527236938477, "global_step": 414082, "epoch": 4988} {"train_loss": -25.794523239135742, "global_step": 414083, "epoch": 4988} {"train_loss": -25.84128189086914, "global_step": 414084, "epoch": 4988} {"train_loss": -26.47890281677246, "global_step": 414085, "epoch": 4988} {"train_loss": -26.48802690620882, "global_step": 414086, "epoch": 4988, "val_loss": 6544745.0} {"train_loss": -25.990808486938477, "global_step": 414087, "epoch": 4989} {"train_loss": -26.539350509643555, "global_step": 414088, "epoch": 4989} {"train_loss": -26.674457550048828, "global_step": 414089, "epoch": 4989} {"train_loss": -26.3756160736084, "global_step": 414090, "epoch": 4989} {"train_loss": -26.165435791015625, "global_step": 414091, "epoch": 4989} {"train_loss": -26.4111270904541, "global_step": 414092, "epoch": 4989} {"train_loss": -26.11054801940918, "global_step": 414093, "epoch": 4989} {"train_loss": -26.48681640625, "global_step": 414094, "epoch": 4989} {"train_loss": -26.4682559967041, "global_step": 414095, "epoch": 4989} {"train_loss": -26.558765411376953, "global_step": 414096, "epoch": 4989} {"train_loss": -26.441904067993164, "global_step": 414097, "epoch": 4989} {"train_loss": -26.449121475219727, "global_step": 414098, "epoch": 4989} {"train_loss": -26.475488662719727, "global_step": 414099, "epoch": 4989} {"train_loss": -26.730390548706055, "global_step": 414100, "epoch": 4989} {"train_loss": -26.5127010345459, "global_step": 414101, "epoch": 4989} {"train_loss": -26.295169830322266, "global_step": 414102, "epoch": 4989} {"train_loss": -26.47994041442871, "global_step": 414103, "epoch": 4989} {"train_loss": -26.5539608001709, "global_step": 414104, "epoch": 4989} {"train_loss": -26.811731338500977, "global_step": 414105, "epoch": 4989} {"train_loss": -26.830114364624023, "global_step": 414106, "epoch": 4989} {"train_loss": -26.81656265258789, "global_step": 414107, "epoch": 4989} {"train_loss": -26.873565673828125, "global_step": 414108, "epoch": 4989} {"train_loss": -26.45880699157715, "global_step": 414109, "epoch": 4989} {"train_loss": -26.711639404296875, "global_step": 414110, "epoch": 4989} {"train_loss": -26.811933517456055, "global_step": 414111, "epoch": 4989} {"train_loss": -26.581073760986328, "global_step": 414112, "epoch": 4989} {"train_loss": -26.2974796295166, "global_step": 414113, "epoch": 4989} {"train_loss": -26.329877853393555, "global_step": 414114, "epoch": 4989} {"train_loss": -26.715778350830078, "global_step": 414115, "epoch": 4989} {"train_loss": -26.965490341186523, "global_step": 414116, "epoch": 4989} {"train_loss": -26.675952911376953, "global_step": 414117, "epoch": 4989} {"train_loss": -26.596418380737305, "global_step": 414118, "epoch": 4989} {"train_loss": -26.707778930664062, "global_step": 414119, "epoch": 4989} {"train_loss": -27.2159366607666, "global_step": 414120, "epoch": 4989} {"train_loss": -26.5792236328125, "global_step": 414121, "epoch": 4989} {"train_loss": -26.639312744140625, "global_step": 414122, "epoch": 4989} {"train_loss": -26.83600425720215, "global_step": 414123, "epoch": 4989} {"train_loss": -26.744037628173828, "global_step": 414124, "epoch": 4989} {"train_loss": -26.88252830505371, "global_step": 414125, "epoch": 4989} {"train_loss": -26.6816463470459, "global_step": 414126, "epoch": 4989} {"train_loss": -26.8170108795166, "global_step": 414127, "epoch": 4989} {"train_loss": -26.771753311157227, "global_step": 414128, "epoch": 4989} {"train_loss": -26.389301300048828, "global_step": 414129, "epoch": 4989} {"train_loss": -26.8419132232666, "global_step": 414130, "epoch": 4989} {"train_loss": -27.215158462524414, "global_step": 414131, "epoch": 4989} {"train_loss": -27.352313995361328, "global_step": 414132, "epoch": 4989} {"train_loss": -26.3508243560791, "global_step": 414133, "epoch": 4989} {"train_loss": -26.889616012573242, "global_step": 414134, "epoch": 4989} {"train_loss": -26.581342697143555, "global_step": 414135, "epoch": 4989} {"train_loss": -26.770008087158203, "global_step": 414136, "epoch": 4989} {"train_loss": -27.17683982849121, "global_step": 414137, "epoch": 4989} {"train_loss": -26.496368408203125, "global_step": 414138, "epoch": 4989} {"train_loss": -27.163854598999023, "global_step": 414139, "epoch": 4989} {"train_loss": -26.80512046813965, "global_step": 414140, "epoch": 4989} {"train_loss": -26.820844650268555, "global_step": 414141, "epoch": 4989} {"train_loss": -26.773956298828125, "global_step": 414142, "epoch": 4989} {"train_loss": -27.044370651245117, "global_step": 414143, "epoch": 4989} {"train_loss": -26.905927658081055, "global_step": 414144, "epoch": 4989} {"train_loss": -27.00018310546875, "global_step": 414145, "epoch": 4989} {"train_loss": -26.59576988220215, "global_step": 414146, "epoch": 4989} {"train_loss": -27.154743194580078, "global_step": 414147, "epoch": 4989} {"train_loss": -27.000593185424805, "global_step": 414148, "epoch": 4989} {"train_loss": -26.7108097076416, "global_step": 414149, "epoch": 4989} {"train_loss": -26.974027633666992, "global_step": 414150, "epoch": 4989} {"train_loss": -26.721927642822266, "global_step": 414151, "epoch": 4989} {"train_loss": -26.716537475585938, "global_step": 414152, "epoch": 4989} {"train_loss": -26.69858741760254, "global_step": 414153, "epoch": 4989} {"train_loss": -26.730350494384766, "global_step": 414154, "epoch": 4989} {"train_loss": -26.612180709838867, "global_step": 414155, "epoch": 4989} {"train_loss": -27.052520751953125, "global_step": 414156, "epoch": 4989} {"train_loss": -26.937469482421875, "global_step": 414157, "epoch": 4989} {"train_loss": -26.927244186401367, "global_step": 414158, "epoch": 4989} {"train_loss": -26.799177169799805, "global_step": 414159, "epoch": 4989} {"train_loss": -26.9827938079834, "global_step": 414160, "epoch": 4989} {"train_loss": -27.126245498657227, "global_step": 414161, "epoch": 4989} {"train_loss": -26.872106552124023, "global_step": 414162, "epoch": 4989} {"train_loss": -26.290517807006836, "global_step": 414163, "epoch": 4989} {"train_loss": -25.802276611328125, "global_step": 414164, "epoch": 4989} {"train_loss": -25.209857940673828, "global_step": 414165, "epoch": 4989} {"train_loss": -26.183866500854492, "global_step": 414166, "epoch": 4989} {"train_loss": -26.637226104736328, "global_step": 414167, "epoch": 4989} {"train_loss": -26.155115127563477, "global_step": 414168, "epoch": 4989} {"train_loss": -26.655190088662756, "global_step": 414169, "epoch": 4989, "val_loss": 6612569.0} {"train_loss": -26.602643966674805, "global_step": 414170, "epoch": 4990} {"train_loss": -25.578256607055664, "global_step": 414171, "epoch": 4990} {"train_loss": -26.181365966796875, "global_step": 414172, "epoch": 4990} {"train_loss": -25.972797393798828, "global_step": 414173, "epoch": 4990} {"train_loss": -26.01972007751465, "global_step": 414174, "epoch": 4990} {"train_loss": -26.078872680664062, "global_step": 414175, "epoch": 4990} {"train_loss": -26.142597198486328, "global_step": 414176, "epoch": 4990} {"train_loss": -26.31028175354004, "global_step": 414177, "epoch": 4990} {"train_loss": -26.293004989624023, "global_step": 414178, "epoch": 4990} {"train_loss": -26.155487060546875, "global_step": 414179, "epoch": 4990} {"train_loss": -26.538028717041016, "global_step": 414180, "epoch": 4990} {"train_loss": -26.562585830688477, "global_step": 414181, "epoch": 4990} {"train_loss": -25.897119522094727, "global_step": 414182, "epoch": 4990} {"train_loss": -26.574085235595703, "global_step": 414183, "epoch": 4990} {"train_loss": -26.239551544189453, "global_step": 414184, "epoch": 4990} {"train_loss": -26.579938888549805, "global_step": 414185, "epoch": 4990} {"train_loss": -26.118261337280273, "global_step": 414186, "epoch": 4990} {"train_loss": -26.443439483642578, "global_step": 414187, "epoch": 4990} {"train_loss": -26.545557022094727, "global_step": 414188, "epoch": 4990} {"train_loss": -26.551965713500977, "global_step": 414189, "epoch": 4990} {"train_loss": -26.831830978393555, "global_step": 414190, "epoch": 4990} {"train_loss": -26.364532470703125, "global_step": 414191, "epoch": 4990} {"train_loss": -26.656408309936523, "global_step": 414192, "epoch": 4990} {"train_loss": -26.60125160217285, "global_step": 414193, "epoch": 4990} {"train_loss": -26.072118759155273, "global_step": 414194, "epoch": 4990} {"train_loss": -26.683246612548828, "global_step": 414195, "epoch": 4990} {"train_loss": -26.526611328125, "global_step": 414196, "epoch": 4990} {"train_loss": -26.549560546875, "global_step": 414197, "epoch": 4990} {"train_loss": -26.72336196899414, "global_step": 414198, "epoch": 4990} {"train_loss": -26.522932052612305, "global_step": 414199, "epoch": 4990} {"train_loss": -26.919153213500977, "global_step": 414200, "epoch": 4990} {"train_loss": -26.71551513671875, "global_step": 414201, "epoch": 4990} {"train_loss": -26.701093673706055, "global_step": 414202, "epoch": 4990} {"train_loss": -26.915388107299805, "global_step": 414203, "epoch": 4990} {"train_loss": -26.79816246032715, "global_step": 414204, "epoch": 4990} {"train_loss": -26.71502113342285, "global_step": 414205, "epoch": 4990} {"train_loss": -26.776517868041992, "global_step": 414206, "epoch": 4990} {"train_loss": -26.59881019592285, "global_step": 414207, "epoch": 4990} {"train_loss": -26.662256240844727, "global_step": 414208, "epoch": 4990} {"train_loss": -26.858856201171875, "global_step": 414209, "epoch": 4990} {"train_loss": -26.969013214111328, "global_step": 414210, "epoch": 4990} {"train_loss": -27.1516056060791, "global_step": 414211, "epoch": 4990} {"train_loss": -26.800256729125977, "global_step": 414212, "epoch": 4990} {"train_loss": -27.03289222717285, "global_step": 414213, "epoch": 4990} {"train_loss": -26.776670455932617, "global_step": 414214, "epoch": 4990} {"train_loss": -26.95466423034668, "global_step": 414215, "epoch": 4990} {"train_loss": -26.95210075378418, "global_step": 414216, "epoch": 4990} {"train_loss": -26.916717529296875, "global_step": 414217, "epoch": 4990} {"train_loss": -27.040685653686523, "global_step": 414218, "epoch": 4990} {"train_loss": -26.896154403686523, "global_step": 414219, "epoch": 4990} {"train_loss": -26.925739288330078, "global_step": 414220, "epoch": 4990} {"train_loss": -27.00119972229004, "global_step": 414221, "epoch": 4990} {"train_loss": -27.014957427978516, "global_step": 414222, "epoch": 4990} {"train_loss": -26.9145565032959, "global_step": 414223, "epoch": 4990} {"train_loss": -26.710092544555664, "global_step": 414224, "epoch": 4990} {"train_loss": -26.548871994018555, "global_step": 414225, "epoch": 4990} {"train_loss": -26.705875396728516, "global_step": 414226, "epoch": 4990} {"train_loss": -26.82522964477539, "global_step": 414227, "epoch": 4990} {"train_loss": -27.032880783081055, "global_step": 414228, "epoch": 4990} {"train_loss": -26.79496192932129, "global_step": 414229, "epoch": 4990} {"train_loss": -26.6848201751709, "global_step": 414230, "epoch": 4990} {"train_loss": -26.882184982299805, "global_step": 414231, "epoch": 4990} {"train_loss": -26.63936424255371, "global_step": 414232, "epoch": 4990} {"train_loss": -26.300424575805664, "global_step": 414233, "epoch": 4990} {"train_loss": -26.5986270904541, "global_step": 414234, "epoch": 4990} {"train_loss": -26.120941162109375, "global_step": 414235, "epoch": 4990} {"train_loss": -26.182758331298828, "global_step": 414236, "epoch": 4990} {"train_loss": -26.31313133239746, "global_step": 414237, "epoch": 4990} {"train_loss": -26.193212509155273, "global_step": 414238, "epoch": 4990} {"train_loss": -26.710447311401367, "global_step": 414239, "epoch": 4990} {"train_loss": -26.522430419921875, "global_step": 414240, "epoch": 4990} {"train_loss": -26.233137130737305, "global_step": 414241, "epoch": 4990} {"train_loss": -26.712228775024414, "global_step": 414242, "epoch": 4990} {"train_loss": -26.738147735595703, "global_step": 414243, "epoch": 4990} {"train_loss": -26.918867111206055, "global_step": 414244, "epoch": 4990} {"train_loss": -26.695974349975586, "global_step": 414245, "epoch": 4990} {"train_loss": -26.593183517456055, "global_step": 414246, "epoch": 4990} {"train_loss": -26.740615844726562, "global_step": 414247, "epoch": 4990} {"train_loss": -26.77878761291504, "global_step": 414248, "epoch": 4990} {"train_loss": -26.621158599853516, "global_step": 414249, "epoch": 4990} {"train_loss": -26.7869815826416, "global_step": 414250, "epoch": 4990} {"train_loss": -26.9348087310791, "global_step": 414251, "epoch": 4990} {"train_loss": -26.61874196615564, "global_step": 414252, "epoch": 4990, "val_loss": 6513221.0} {"train_loss": -25.607736587524414, "global_step": 414253, "epoch": 4991} {"train_loss": -26.165775299072266, "global_step": 414254, "epoch": 4991} {"train_loss": -26.17656898498535, "global_step": 414255, "epoch": 4991} {"train_loss": -25.73065757751465, "global_step": 414256, "epoch": 4991} {"train_loss": -26.331396102905273, "global_step": 414257, "epoch": 4991} {"train_loss": -26.1518497467041, "global_step": 414258, "epoch": 4991} {"train_loss": -26.277868270874023, "global_step": 414259, "epoch": 4991} {"train_loss": -26.174558639526367, "global_step": 414260, "epoch": 4991} {"train_loss": -25.9478759765625, "global_step": 414261, "epoch": 4991} {"train_loss": -26.24835205078125, "global_step": 414262, "epoch": 4991} {"train_loss": -26.737279891967773, "global_step": 414263, "epoch": 4991} {"train_loss": -26.388071060180664, "global_step": 414264, "epoch": 4991} {"train_loss": -25.930856704711914, "global_step": 414265, "epoch": 4991} {"train_loss": -26.487781524658203, "global_step": 414266, "epoch": 4991} {"train_loss": -26.31475830078125, "global_step": 414267, "epoch": 4991} {"train_loss": -26.338266372680664, "global_step": 414268, "epoch": 4991} {"train_loss": -26.00074577331543, "global_step": 414269, "epoch": 4991} {"train_loss": -26.755725860595703, "global_step": 414270, "epoch": 4991} {"train_loss": -26.44565773010254, "global_step": 414271, "epoch": 4991} {"train_loss": -26.50874137878418, "global_step": 414272, "epoch": 4991} {"train_loss": -26.520883560180664, "global_step": 414273, "epoch": 4991} {"train_loss": -26.856403350830078, "global_step": 414274, "epoch": 4991} {"train_loss": -26.608850479125977, "global_step": 414275, "epoch": 4991} {"train_loss": -26.5913028717041, "global_step": 414276, "epoch": 4991} {"train_loss": -26.600879669189453, "global_step": 414277, "epoch": 4991} {"train_loss": -26.582849502563477, "global_step": 414278, "epoch": 4991} {"train_loss": -26.7578067779541, "global_step": 414279, "epoch": 4991} {"train_loss": -26.632211685180664, "global_step": 414280, "epoch": 4991} {"train_loss": -26.231748580932617, "global_step": 414281, "epoch": 4991} {"train_loss": -26.522430419921875, "global_step": 414282, "epoch": 4991} {"train_loss": -26.62054443359375, "global_step": 414283, "epoch": 4991} {"train_loss": -26.607831954956055, "global_step": 414284, "epoch": 4991} {"train_loss": -27.074323654174805, "global_step": 414285, "epoch": 4991} {"train_loss": -26.800256729125977, "global_step": 414286, "epoch": 4991} {"train_loss": -26.6995849609375, "global_step": 414287, "epoch": 4991} {"train_loss": -27.10611915588379, "global_step": 414288, "epoch": 4991} {"train_loss": -26.52483558654785, "global_step": 414289, "epoch": 4991} {"train_loss": -26.752668380737305, "global_step": 414290, "epoch": 4991} {"train_loss": -26.66475486755371, "global_step": 414291, "epoch": 4991} {"train_loss": -26.881589889526367, "global_step": 414292, "epoch": 4991} {"train_loss": -26.84873390197754, "global_step": 414293, "epoch": 4991} {"train_loss": -26.672138214111328, "global_step": 414294, "epoch": 4991} {"train_loss": -27.295785903930664, "global_step": 414295, "epoch": 4991} {"train_loss": -26.56430435180664, "global_step": 414296, "epoch": 4991} {"train_loss": -27.04659080505371, "global_step": 414297, "epoch": 4991} {"train_loss": -26.655094146728516, "global_step": 414298, "epoch": 4991} {"train_loss": -26.776599884033203, "global_step": 414299, "epoch": 4991} {"train_loss": -26.65924072265625, "global_step": 414300, "epoch": 4991} {"train_loss": -26.800373077392578, "global_step": 414301, "epoch": 4991} {"train_loss": -26.5701904296875, "global_step": 414302, "epoch": 4991} {"train_loss": -26.920331954956055, "global_step": 414303, "epoch": 4991} {"train_loss": -27.0628604888916, "global_step": 414304, "epoch": 4991} {"train_loss": -27.093372344970703, "global_step": 414305, "epoch": 4991} {"train_loss": -26.79353141784668, "global_step": 414306, "epoch": 4991} {"train_loss": -27.166213989257812, "global_step": 414307, "epoch": 4991} {"train_loss": -26.701984405517578, "global_step": 414308, "epoch": 4991} {"train_loss": -26.915075302124023, "global_step": 414309, "epoch": 4991} {"train_loss": -27.077655792236328, "global_step": 414310, "epoch": 4991} {"train_loss": -26.947757720947266, "global_step": 414311, "epoch": 4991} {"train_loss": -26.981246948242188, "global_step": 414312, "epoch": 4991} {"train_loss": -27.098352432250977, "global_step": 414313, "epoch": 4991} {"train_loss": -26.92364501953125, "global_step": 414314, "epoch": 4991} {"train_loss": -26.87310791015625, "global_step": 414315, "epoch": 4991} {"train_loss": -26.630414962768555, "global_step": 414316, "epoch": 4991} {"train_loss": -26.85420036315918, "global_step": 414317, "epoch": 4991} {"train_loss": -26.874902725219727, "global_step": 414318, "epoch": 4991} {"train_loss": -27.003376007080078, "global_step": 414319, "epoch": 4991} {"train_loss": -27.1217098236084, "global_step": 414320, "epoch": 4991} {"train_loss": -26.829456329345703, "global_step": 414321, "epoch": 4991} {"train_loss": -26.75314712524414, "global_step": 414322, "epoch": 4991} {"train_loss": -26.719013214111328, "global_step": 414323, "epoch": 4991} {"train_loss": -26.7684383392334, "global_step": 414324, "epoch": 4991} {"train_loss": -27.017236709594727, "global_step": 414325, "epoch": 4991} {"train_loss": -26.549530029296875, "global_step": 414326, "epoch": 4991} {"train_loss": -27.119787216186523, "global_step": 414327, "epoch": 4991} {"train_loss": -26.95368766784668, "global_step": 414328, "epoch": 4991} {"train_loss": -26.56058120727539, "global_step": 414329, "epoch": 4991} {"train_loss": -27.011396408081055, "global_step": 414330, "epoch": 4991} {"train_loss": -27.040485382080078, "global_step": 414331, "epoch": 4991} {"train_loss": -26.899707794189453, "global_step": 414332, "epoch": 4991} {"train_loss": -27.0730037689209, "global_step": 414333, "epoch": 4991} {"train_loss": -26.39674186706543, "global_step": 414334, "epoch": 4991} {"train_loss": -26.68125715600439, "global_step": 414335, "epoch": 4991, "val_loss": 6562731.0} {"train_loss": -26.105712890625, "global_step": 414336, "epoch": 4992} {"train_loss": -25.294889450073242, "global_step": 414337, "epoch": 4992} {"train_loss": -25.820524215698242, "global_step": 414338, "epoch": 4992} {"train_loss": -26.040246963500977, "global_step": 414339, "epoch": 4992} {"train_loss": -26.1640625, "global_step": 414340, "epoch": 4992} {"train_loss": -26.12884521484375, "global_step": 414341, "epoch": 4992} {"train_loss": -25.766189575195312, "global_step": 414342, "epoch": 4992} {"train_loss": -26.203699111938477, "global_step": 414343, "epoch": 4992} {"train_loss": -25.72779655456543, "global_step": 414344, "epoch": 4992} {"train_loss": -25.85874366760254, "global_step": 414345, "epoch": 4992} {"train_loss": -26.1977481842041, "global_step": 414346, "epoch": 4992} {"train_loss": -26.07301139831543, "global_step": 414347, "epoch": 4992} {"train_loss": -26.422931671142578, "global_step": 414348, "epoch": 4992} {"train_loss": -26.355627059936523, "global_step": 414349, "epoch": 4992} {"train_loss": -26.40240478515625, "global_step": 414350, "epoch": 4992} {"train_loss": -26.077991485595703, "global_step": 414351, "epoch": 4992} {"train_loss": -26.1978702545166, "global_step": 414352, "epoch": 4992} {"train_loss": -26.313663482666016, "global_step": 414353, "epoch": 4992} {"train_loss": -26.684040069580078, "global_step": 414354, "epoch": 4992} {"train_loss": -26.39045524597168, "global_step": 414355, "epoch": 4992} {"train_loss": -26.6597900390625, "global_step": 414356, "epoch": 4992} {"train_loss": -26.59290885925293, "global_step": 414357, "epoch": 4992} {"train_loss": -26.54400634765625, "global_step": 414358, "epoch": 4992} {"train_loss": -26.27595329284668, "global_step": 414359, "epoch": 4992} {"train_loss": -26.689075469970703, "global_step": 414360, "epoch": 4992} {"train_loss": -26.636859893798828, "global_step": 414361, "epoch": 4992} {"train_loss": -26.369953155517578, "global_step": 414362, "epoch": 4992} {"train_loss": -26.715890884399414, "global_step": 414363, "epoch": 4992} {"train_loss": -26.570404052734375, "global_step": 414364, "epoch": 4992} {"train_loss": -26.702856063842773, "global_step": 414365, "epoch": 4992} {"train_loss": -26.5280818939209, "global_step": 414366, "epoch": 4992} {"train_loss": -26.817779541015625, "global_step": 414367, "epoch": 4992} {"train_loss": -26.66187858581543, "global_step": 414368, "epoch": 4992} {"train_loss": -27.03608512878418, "global_step": 414369, "epoch": 4992} {"train_loss": -26.455642700195312, "global_step": 414370, "epoch": 4992} {"train_loss": -26.69573402404785, "global_step": 414371, "epoch": 4992} {"train_loss": -26.810895919799805, "global_step": 414372, "epoch": 4992} {"train_loss": -26.524459838867188, "global_step": 414373, "epoch": 4992} {"train_loss": -26.81777000427246, "global_step": 414374, "epoch": 4992} {"train_loss": -26.897504806518555, "global_step": 414375, "epoch": 4992} {"train_loss": -26.9968318939209, "global_step": 414376, "epoch": 4992} {"train_loss": -26.79871940612793, "global_step": 414377, "epoch": 4992} {"train_loss": -26.95258140563965, "global_step": 414378, "epoch": 4992} {"train_loss": -26.280622482299805, "global_step": 414379, "epoch": 4992} {"train_loss": -26.672204971313477, "global_step": 414380, "epoch": 4992} {"train_loss": -26.850980758666992, "global_step": 414381, "epoch": 4992} {"train_loss": -26.89697265625, "global_step": 414382, "epoch": 4992} {"train_loss": -26.772314071655273, "global_step": 414383, "epoch": 4992} {"train_loss": -26.550100326538086, "global_step": 414384, "epoch": 4992} {"train_loss": -27.124603271484375, "global_step": 414385, "epoch": 4992} {"train_loss": -26.908849716186523, "global_step": 414386, "epoch": 4992} {"train_loss": -26.676538467407227, "global_step": 414387, "epoch": 4992} {"train_loss": -27.031946182250977, "global_step": 414388, "epoch": 4992} {"train_loss": -26.834991455078125, "global_step": 414389, "epoch": 4992} {"train_loss": -26.6285343170166, "global_step": 414390, "epoch": 4992} {"train_loss": -26.659637451171875, "global_step": 414391, "epoch": 4992} {"train_loss": -26.95059585571289, "global_step": 414392, "epoch": 4992} {"train_loss": -27.113935470581055, "global_step": 414393, "epoch": 4992} {"train_loss": -26.92420768737793, "global_step": 414394, "epoch": 4992} {"train_loss": -27.111194610595703, "global_step": 414395, "epoch": 4992} {"train_loss": -26.769872665405273, "global_step": 414396, "epoch": 4992} {"train_loss": -26.93621826171875, "global_step": 414397, "epoch": 4992} {"train_loss": -26.74677085876465, "global_step": 414398, "epoch": 4992} {"train_loss": -26.5967960357666, "global_step": 414399, "epoch": 4992} {"train_loss": -26.498838424682617, "global_step": 414400, "epoch": 4992} {"train_loss": -26.20401954650879, "global_step": 414401, "epoch": 4992} {"train_loss": -26.307531356811523, "global_step": 414402, "epoch": 4992} {"train_loss": -26.26967430114746, "global_step": 414403, "epoch": 4992} {"train_loss": -26.6483154296875, "global_step": 414404, "epoch": 4992} {"train_loss": -26.18808364868164, "global_step": 414405, "epoch": 4992} {"train_loss": -26.596303939819336, "global_step": 414406, "epoch": 4992} {"train_loss": -26.725378036499023, "global_step": 414407, "epoch": 4992} {"train_loss": -26.602054595947266, "global_step": 414408, "epoch": 4992} {"train_loss": -26.468036651611328, "global_step": 414409, "epoch": 4992} {"train_loss": -26.231489181518555, "global_step": 414410, "epoch": 4992} {"train_loss": -26.48341941833496, "global_step": 414411, "epoch": 4992} {"train_loss": -26.554031372070312, "global_step": 414412, "epoch": 4992} {"train_loss": -26.591291427612305, "global_step": 414413, "epoch": 4992} {"train_loss": -26.6722412109375, "global_step": 414414, "epoch": 4992} {"train_loss": -26.54462242126465, "global_step": 414415, "epoch": 4992} {"train_loss": -26.732473373413086, "global_step": 414416, "epoch": 4992} {"train_loss": -26.6761474609375, "global_step": 414417, "epoch": 4992} {"train_loss": -26.535177943218184, "global_step": 414418, "epoch": 4992, "val_loss": 6461043.0} {"train_loss": -25.825220108032227, "global_step": 414419, "epoch": 4993} {"train_loss": -26.51918601989746, "global_step": 414420, "epoch": 4993} {"train_loss": -26.423791885375977, "global_step": 414421, "epoch": 4993} {"train_loss": -25.900007247924805, "global_step": 414422, "epoch": 4993} {"train_loss": -25.913700103759766, "global_step": 414423, "epoch": 4993} {"train_loss": -26.45195960998535, "global_step": 414424, "epoch": 4993} {"train_loss": -26.398548126220703, "global_step": 414425, "epoch": 4993} {"train_loss": -25.982213973999023, "global_step": 414426, "epoch": 4993} {"train_loss": -26.505054473876953, "global_step": 414427, "epoch": 4993} {"train_loss": -26.231292724609375, "global_step": 414428, "epoch": 4993} {"train_loss": -26.716047286987305, "global_step": 414429, "epoch": 4993} {"train_loss": -26.271392822265625, "global_step": 414430, "epoch": 4993} {"train_loss": -26.07366371154785, "global_step": 414431, "epoch": 4993} {"train_loss": -26.774702072143555, "global_step": 414432, "epoch": 4993} {"train_loss": -26.1911678314209, "global_step": 414433, "epoch": 4993} {"train_loss": -26.797861099243164, "global_step": 414434, "epoch": 4993} {"train_loss": -26.34425163269043, "global_step": 414435, "epoch": 4993} {"train_loss": -26.620141983032227, "global_step": 414436, "epoch": 4993} {"train_loss": -26.85357093811035, "global_step": 414437, "epoch": 4993} {"train_loss": -26.4717960357666, "global_step": 414438, "epoch": 4993} {"train_loss": -26.710813522338867, "global_step": 414439, "epoch": 4993} {"train_loss": -26.901309967041016, "global_step": 414440, "epoch": 4993} {"train_loss": -26.903736114501953, "global_step": 414441, "epoch": 4993} {"train_loss": -26.4010066986084, "global_step": 414442, "epoch": 4993} {"train_loss": -26.8452205657959, "global_step": 414443, "epoch": 4993} {"train_loss": -26.5870418548584, "global_step": 414444, "epoch": 4993} {"train_loss": -27.06829833984375, "global_step": 414445, "epoch": 4993} {"train_loss": -26.489709854125977, "global_step": 414446, "epoch": 4993} {"train_loss": -26.8016300201416, "global_step": 414447, "epoch": 4993} {"train_loss": -26.964847564697266, "global_step": 414448, "epoch": 4993} {"train_loss": -26.65529441833496, "global_step": 414449, "epoch": 4993} {"train_loss": -26.583688735961914, "global_step": 414450, "epoch": 4993} {"train_loss": -26.538110733032227, "global_step": 414451, "epoch": 4993} {"train_loss": -26.8295841217041, "global_step": 414452, "epoch": 4993} {"train_loss": -26.896997451782227, "global_step": 414453, "epoch": 4993} {"train_loss": -26.653018951416016, "global_step": 414454, "epoch": 4993} {"train_loss": -27.156030654907227, "global_step": 414455, "epoch": 4993} {"train_loss": -26.56015968322754, "global_step": 414456, "epoch": 4993} {"train_loss": -26.13665771484375, "global_step": 414457, "epoch": 4993} {"train_loss": -26.21430015563965, "global_step": 414458, "epoch": 4993} {"train_loss": -26.467870712280273, "global_step": 414459, "epoch": 4993} {"train_loss": -27.15455436706543, "global_step": 414460, "epoch": 4993} {"train_loss": -26.70522117614746, "global_step": 414461, "epoch": 4993} {"train_loss": -26.67817497253418, "global_step": 414462, "epoch": 4993} {"train_loss": -26.747467041015625, "global_step": 414463, "epoch": 4993} {"train_loss": -26.67240333557129, "global_step": 414464, "epoch": 4993} {"train_loss": -26.505704879760742, "global_step": 414465, "epoch": 4993} {"train_loss": -26.15870475769043, "global_step": 414466, "epoch": 4993} {"train_loss": -26.744476318359375, "global_step": 414467, "epoch": 4993} {"train_loss": -26.55672264099121, "global_step": 414468, "epoch": 4993} {"train_loss": -26.45918083190918, "global_step": 414469, "epoch": 4993} {"train_loss": -26.806671142578125, "global_step": 414470, "epoch": 4993} {"train_loss": -26.822376251220703, "global_step": 414471, "epoch": 4993} {"train_loss": -26.422611236572266, "global_step": 414472, "epoch": 4993} {"train_loss": -26.9046630859375, "global_step": 414473, "epoch": 4993} {"train_loss": -26.786401748657227, "global_step": 414474, "epoch": 4993} {"train_loss": -26.783649444580078, "global_step": 414475, "epoch": 4993} {"train_loss": -26.544540405273438, "global_step": 414476, "epoch": 4993} {"train_loss": -26.320981979370117, "global_step": 414477, "epoch": 4993} {"train_loss": -26.77617835998535, "global_step": 414478, "epoch": 4993} {"train_loss": -26.58182144165039, "global_step": 414479, "epoch": 4993} {"train_loss": -26.826770782470703, "global_step": 414480, "epoch": 4993} {"train_loss": -26.792234420776367, "global_step": 414481, "epoch": 4993} {"train_loss": -26.389572143554688, "global_step": 414482, "epoch": 4993} {"train_loss": -26.377904891967773, "global_step": 414483, "epoch": 4993} {"train_loss": -26.54905128479004, "global_step": 414484, "epoch": 4993} {"train_loss": -26.391891479492188, "global_step": 414485, "epoch": 4993} {"train_loss": -26.778329849243164, "global_step": 414486, "epoch": 4993} {"train_loss": -26.527484893798828, "global_step": 414487, "epoch": 4993} {"train_loss": -26.684736251831055, "global_step": 414488, "epoch": 4993} {"train_loss": -26.709936141967773, "global_step": 414489, "epoch": 4993} {"train_loss": -26.79986572265625, "global_step": 414490, "epoch": 4993} {"train_loss": -26.765106201171875, "global_step": 414491, "epoch": 4993} {"train_loss": -26.714879989624023, "global_step": 414492, "epoch": 4993} {"train_loss": -26.681537628173828, "global_step": 414493, "epoch": 4993} {"train_loss": -26.31760025024414, "global_step": 414494, "epoch": 4993} {"train_loss": -26.694915771484375, "global_step": 414495, "epoch": 4993} {"train_loss": -26.62042808532715, "global_step": 414496, "epoch": 4993} {"train_loss": -26.896392822265625, "global_step": 414497, "epoch": 4993} {"train_loss": -26.67331886291504, "global_step": 414498, "epoch": 4993} {"train_loss": -26.615243911743164, "global_step": 414499, "epoch": 4993} {"train_loss": -26.70875358581543, "global_step": 414500, "epoch": 4993} {"train_loss": -26.618182216782166, "global_step": 414501, "epoch": 4993, "val_loss": 6546263.0} {"train_loss": -25.751569747924805, "global_step": 414502, "epoch": 4994} {"train_loss": -25.888410568237305, "global_step": 414503, "epoch": 4994} {"train_loss": -26.1962890625, "global_step": 414504, "epoch": 4994} {"train_loss": -25.95020866394043, "global_step": 414505, "epoch": 4994} {"train_loss": -25.96142578125, "global_step": 414506, "epoch": 4994} {"train_loss": -25.66094398498535, "global_step": 414507, "epoch": 4994} {"train_loss": -26.637914657592773, "global_step": 414508, "epoch": 4994} {"train_loss": -26.052488327026367, "global_step": 414509, "epoch": 4994} {"train_loss": -26.55838966369629, "global_step": 414510, "epoch": 4994} {"train_loss": -26.5081844329834, "global_step": 414511, "epoch": 4994} {"train_loss": -26.189008712768555, "global_step": 414512, "epoch": 4994} {"train_loss": -26.501697540283203, "global_step": 414513, "epoch": 4994} {"train_loss": -26.352060317993164, "global_step": 414514, "epoch": 4994} {"train_loss": -26.165754318237305, "global_step": 414515, "epoch": 4994} {"train_loss": -26.556716918945312, "global_step": 414516, "epoch": 4994} {"train_loss": -26.515186309814453, "global_step": 414517, "epoch": 4994} {"train_loss": -26.395856857299805, "global_step": 414518, "epoch": 4994} {"train_loss": -26.535125732421875, "global_step": 414519, "epoch": 4994} {"train_loss": -26.53629493713379, "global_step": 414520, "epoch": 4994} {"train_loss": -26.554792404174805, "global_step": 414521, "epoch": 4994} {"train_loss": -26.554548263549805, "global_step": 414522, "epoch": 4994} {"train_loss": -26.47480583190918, "global_step": 414523, "epoch": 4994} {"train_loss": -26.946212768554688, "global_step": 414524, "epoch": 4994} {"train_loss": -26.910968780517578, "global_step": 414525, "epoch": 4994} {"train_loss": -26.7768611907959, "global_step": 414526, "epoch": 4994} {"train_loss": -26.783557891845703, "global_step": 414527, "epoch": 4994} {"train_loss": -26.7781982421875, "global_step": 414528, "epoch": 4994} {"train_loss": -26.437484741210938, "global_step": 414529, "epoch": 4994} {"train_loss": -26.799091339111328, "global_step": 414530, "epoch": 4994} {"train_loss": -26.3819637298584, "global_step": 414531, "epoch": 4994} {"train_loss": -26.83154296875, "global_step": 414532, "epoch": 4994} {"train_loss": -26.822940826416016, "global_step": 414533, "epoch": 4994} {"train_loss": -27.3905086517334, "global_step": 414534, "epoch": 4994} {"train_loss": -26.846582412719727, "global_step": 414535, "epoch": 4994} {"train_loss": -26.882415771484375, "global_step": 414536, "epoch": 4994} {"train_loss": -26.8021240234375, "global_step": 414537, "epoch": 4994} {"train_loss": -26.898395538330078, "global_step": 414538, "epoch": 4994} {"train_loss": -27.15707778930664, "global_step": 414539, "epoch": 4994} {"train_loss": -26.649169921875, "global_step": 414540, "epoch": 4994} {"train_loss": -27.05561637878418, "global_step": 414541, "epoch": 4994} {"train_loss": -26.676319122314453, "global_step": 414542, "epoch": 4994} {"train_loss": -27.00201416015625, "global_step": 414543, "epoch": 4994} {"train_loss": -27.145776748657227, "global_step": 414544, "epoch": 4994} {"train_loss": -27.180570602416992, "global_step": 414545, "epoch": 4994} {"train_loss": -26.779296875, "global_step": 414546, "epoch": 4994} {"train_loss": -27.12714958190918, "global_step": 414547, "epoch": 4994} {"train_loss": -27.02256202697754, "global_step": 414548, "epoch": 4994} {"train_loss": -26.63718605041504, "global_step": 414549, "epoch": 4994} {"train_loss": -26.664417266845703, "global_step": 414550, "epoch": 4994} {"train_loss": -26.313425064086914, "global_step": 414551, "epoch": 4994} {"train_loss": -26.853256225585938, "global_step": 414552, "epoch": 4994} {"train_loss": -26.86767578125, "global_step": 414553, "epoch": 4994} {"train_loss": -26.177902221679688, "global_step": 414554, "epoch": 4994} {"train_loss": -26.340734481811523, "global_step": 414555, "epoch": 4994} {"train_loss": -27.12894630432129, "global_step": 414556, "epoch": 4994} {"train_loss": -26.565277099609375, "global_step": 414557, "epoch": 4994} {"train_loss": -26.665502548217773, "global_step": 414558, "epoch": 4994} {"train_loss": -26.458093643188477, "global_step": 414559, "epoch": 4994} {"train_loss": -26.758712768554688, "global_step": 414560, "epoch": 4994} {"train_loss": -26.895404815673828, "global_step": 414561, "epoch": 4994} {"train_loss": -26.659067153930664, "global_step": 414562, "epoch": 4994} {"train_loss": -26.677099227905273, "global_step": 414563, "epoch": 4994} {"train_loss": -26.751611709594727, "global_step": 414564, "epoch": 4994} {"train_loss": -26.726409912109375, "global_step": 414565, "epoch": 4994} {"train_loss": -27.258716583251953, "global_step": 414566, "epoch": 4994} {"train_loss": -26.461889266967773, "global_step": 414567, "epoch": 4994} {"train_loss": -26.69138526916504, "global_step": 414568, "epoch": 4994} {"train_loss": -26.849365234375, "global_step": 414569, "epoch": 4994} {"train_loss": -26.54925537109375, "global_step": 414570, "epoch": 4994} {"train_loss": -26.936309814453125, "global_step": 414571, "epoch": 4994} {"train_loss": -26.642614364624023, "global_step": 414572, "epoch": 4994} {"train_loss": -26.8973331451416, "global_step": 414573, "epoch": 4994} {"train_loss": -26.992338180541992, "global_step": 414574, "epoch": 4994} {"train_loss": -26.142866134643555, "global_step": 414575, "epoch": 4994} {"train_loss": -26.5366153717041, "global_step": 414576, "epoch": 4994} {"train_loss": -27.076099395751953, "global_step": 414577, "epoch": 4994} {"train_loss": -26.60795021057129, "global_step": 414578, "epoch": 4994} {"train_loss": -27.078704833984375, "global_step": 414579, "epoch": 4994} {"train_loss": -26.710220336914062, "global_step": 414580, "epoch": 4994} {"train_loss": -26.676944732666016, "global_step": 414581, "epoch": 4994} {"train_loss": -26.854206085205078, "global_step": 414582, "epoch": 4994} {"train_loss": -26.6184024810791, "global_step": 414583, "epoch": 4994} {"train_loss": -26.644245515386743, "global_step": 414584, "epoch": 4994, "val_loss": 6462225.0} {"train_loss": -26.00050926208496, "global_step": 414585, "epoch": 4995} {"train_loss": -26.500288009643555, "global_step": 414586, "epoch": 4995} {"train_loss": -26.507801055908203, "global_step": 414587, "epoch": 4995} {"train_loss": -26.739255905151367, "global_step": 414588, "epoch": 4995} {"train_loss": -26.44574546813965, "global_step": 414589, "epoch": 4995} {"train_loss": -26.512048721313477, "global_step": 414590, "epoch": 4995} {"train_loss": -26.712926864624023, "global_step": 414591, "epoch": 4995} {"train_loss": -27.06255531311035, "global_step": 414592, "epoch": 4995} {"train_loss": -26.92603874206543, "global_step": 414593, "epoch": 4995} {"train_loss": -26.693256378173828, "global_step": 414594, "epoch": 4995} {"train_loss": -26.75933837890625, "global_step": 414595, "epoch": 4995} {"train_loss": -26.75701332092285, "global_step": 414596, "epoch": 4995} {"train_loss": -26.813648223876953, "global_step": 414597, "epoch": 4995} {"train_loss": -26.52418327331543, "global_step": 414598, "epoch": 4995} {"train_loss": -26.568069458007812, "global_step": 414599, "epoch": 4995} {"train_loss": -26.56317710876465, "global_step": 414600, "epoch": 4995} {"train_loss": -26.534351348876953, "global_step": 414601, "epoch": 4995} {"train_loss": -26.644702911376953, "global_step": 414602, "epoch": 4995} {"train_loss": -26.449359893798828, "global_step": 414603, "epoch": 4995} {"train_loss": -26.341291427612305, "global_step": 414604, "epoch": 4995} {"train_loss": -26.686262130737305, "global_step": 414605, "epoch": 4995} {"train_loss": -26.878202438354492, "global_step": 414606, "epoch": 4995} {"train_loss": -26.705127716064453, "global_step": 414607, "epoch": 4995} {"train_loss": -26.783435821533203, "global_step": 414608, "epoch": 4995} {"train_loss": -27.040103912353516, "global_step": 414609, "epoch": 4995} {"train_loss": -26.74725914001465, "global_step": 414610, "epoch": 4995} {"train_loss": -27.052845001220703, "global_step": 414611, "epoch": 4995} {"train_loss": -26.677352905273438, "global_step": 414612, "epoch": 4995} {"train_loss": -26.73379898071289, "global_step": 414613, "epoch": 4995} {"train_loss": -26.717702865600586, "global_step": 414614, "epoch": 4995} {"train_loss": -26.590850830078125, "global_step": 414615, "epoch": 4995} {"train_loss": -26.606067657470703, "global_step": 414616, "epoch": 4995} {"train_loss": -27.079010009765625, "global_step": 414617, "epoch": 4995} {"train_loss": -26.8282470703125, "global_step": 414618, "epoch": 4995} {"train_loss": -26.820789337158203, "global_step": 414619, "epoch": 4995} {"train_loss": -26.77197265625, "global_step": 414620, "epoch": 4995} {"train_loss": -26.572101593017578, "global_step": 414621, "epoch": 4995} {"train_loss": -26.792499542236328, "global_step": 414622, "epoch": 4995} {"train_loss": -26.715412139892578, "global_step": 414623, "epoch": 4995} {"train_loss": -26.60943603515625, "global_step": 414624, "epoch": 4995} {"train_loss": -26.454025268554688, "global_step": 414625, "epoch": 4995} {"train_loss": -26.72797966003418, "global_step": 414626, "epoch": 4995} {"train_loss": -26.73274040222168, "global_step": 414627, "epoch": 4995} {"train_loss": -26.899188995361328, "global_step": 414628, "epoch": 4995} {"train_loss": -26.938583374023438, "global_step": 414629, "epoch": 4995} {"train_loss": -26.827972412109375, "global_step": 414630, "epoch": 4995} {"train_loss": -26.778671264648438, "global_step": 414631, "epoch": 4995} {"train_loss": -27.05769157409668, "global_step": 414632, "epoch": 4995} {"train_loss": -27.059492111206055, "global_step": 414633, "epoch": 4995} {"train_loss": -26.845800399780273, "global_step": 414634, "epoch": 4995} {"train_loss": -26.974323272705078, "global_step": 414635, "epoch": 4995} {"train_loss": -26.631744384765625, "global_step": 414636, "epoch": 4995} {"train_loss": -26.76655387878418, "global_step": 414637, "epoch": 4995} {"train_loss": -26.54597282409668, "global_step": 414638, "epoch": 4995} {"train_loss": -26.577411651611328, "global_step": 414639, "epoch": 4995} {"train_loss": -26.851520538330078, "global_step": 414640, "epoch": 4995} {"train_loss": -26.761106491088867, "global_step": 414641, "epoch": 4995} {"train_loss": -27.201223373413086, "global_step": 414642, "epoch": 4995} {"train_loss": -26.7902774810791, "global_step": 414643, "epoch": 4995} {"train_loss": -26.75257682800293, "global_step": 414644, "epoch": 4995} {"train_loss": -27.158781051635742, "global_step": 414645, "epoch": 4995} {"train_loss": -26.98101806640625, "global_step": 414646, "epoch": 4995} {"train_loss": -27.1267147064209, "global_step": 414647, "epoch": 4995} {"train_loss": -26.9615421295166, "global_step": 414648, "epoch": 4995} {"train_loss": -26.697418212890625, "global_step": 414649, "epoch": 4995} {"train_loss": -27.072345733642578, "global_step": 414650, "epoch": 4995} {"train_loss": -27.213916778564453, "global_step": 414651, "epoch": 4995} {"train_loss": -26.752410888671875, "global_step": 414652, "epoch": 4995} {"train_loss": -27.33806800842285, "global_step": 414653, "epoch": 4995} {"train_loss": -26.642908096313477, "global_step": 414654, "epoch": 4995} {"train_loss": -26.9682674407959, "global_step": 414655, "epoch": 4995} {"train_loss": -26.787139892578125, "global_step": 414656, "epoch": 4995} {"train_loss": -26.253253936767578, "global_step": 414657, "epoch": 4995} {"train_loss": -25.659748077392578, "global_step": 414658, "epoch": 4995} {"train_loss": -25.509435653686523, "global_step": 414659, "epoch": 4995} {"train_loss": -26.35968017578125, "global_step": 414660, "epoch": 4995} {"train_loss": -26.63654899597168, "global_step": 414661, "epoch": 4995} {"train_loss": -26.83643913269043, "global_step": 414662, "epoch": 4995} {"train_loss": -26.296939849853516, "global_step": 414663, "epoch": 4995} {"train_loss": -26.5413761138916, "global_step": 414664, "epoch": 4995} {"train_loss": -26.074970245361328, "global_step": 414665, "epoch": 4995} {"train_loss": -26.733057022094727, "global_step": 414666, "epoch": 4995} {"train_loss": -26.707143622708607, "global_step": 414667, "epoch": 4995, "val_loss": 6382059.0} {"train_loss": -26.287763595581055, "global_step": 414668, "epoch": 4996} {"train_loss": -25.802326202392578, "global_step": 414669, "epoch": 4996} {"train_loss": -26.385770797729492, "global_step": 414670, "epoch": 4996} {"train_loss": -26.00786781311035, "global_step": 414671, "epoch": 4996} {"train_loss": -25.876134872436523, "global_step": 414672, "epoch": 4996} {"train_loss": -26.358381271362305, "global_step": 414673, "epoch": 4996} {"train_loss": -26.2498836517334, "global_step": 414674, "epoch": 4996} {"train_loss": -26.228429794311523, "global_step": 414675, "epoch": 4996} {"train_loss": -26.108076095581055, "global_step": 414676, "epoch": 4996} {"train_loss": -26.468347549438477, "global_step": 414677, "epoch": 4996} {"train_loss": -26.489349365234375, "global_step": 414678, "epoch": 4996} {"train_loss": -26.513092041015625, "global_step": 414679, "epoch": 4996} {"train_loss": -25.993085861206055, "global_step": 414680, "epoch": 4996} {"train_loss": -26.302932739257812, "global_step": 414681, "epoch": 4996} {"train_loss": -26.612775802612305, "global_step": 414682, "epoch": 4996} {"train_loss": -26.31269645690918, "global_step": 414683, "epoch": 4996} {"train_loss": -26.592309951782227, "global_step": 414684, "epoch": 4996} {"train_loss": -26.319005966186523, "global_step": 414685, "epoch": 4996} {"train_loss": -26.504056930541992, "global_step": 414686, "epoch": 4996} {"train_loss": -26.5627384185791, "global_step": 414687, "epoch": 4996} {"train_loss": -26.507699966430664, "global_step": 414688, "epoch": 4996} {"train_loss": -26.3946475982666, "global_step": 414689, "epoch": 4996} {"train_loss": -26.50196647644043, "global_step": 414690, "epoch": 4996} {"train_loss": -26.8703670501709, "global_step": 414691, "epoch": 4996} {"train_loss": -26.675683975219727, "global_step": 414692, "epoch": 4996} {"train_loss": -26.337167739868164, "global_step": 414693, "epoch": 4996} {"train_loss": -26.861860275268555, "global_step": 414694, "epoch": 4996} {"train_loss": -26.824329376220703, "global_step": 414695, "epoch": 4996} {"train_loss": -26.615774154663086, "global_step": 414696, "epoch": 4996} {"train_loss": -26.78435707092285, "global_step": 414697, "epoch": 4996} {"train_loss": -26.906116485595703, "global_step": 414698, "epoch": 4996} {"train_loss": -26.505048751831055, "global_step": 414699, "epoch": 4996} {"train_loss": -26.500234603881836, "global_step": 414700, "epoch": 4996} {"train_loss": -26.7665958404541, "global_step": 414701, "epoch": 4996} {"train_loss": -26.328039169311523, "global_step": 414702, "epoch": 4996} {"train_loss": -26.844329833984375, "global_step": 414703, "epoch": 4996} {"train_loss": -27.043500900268555, "global_step": 414704, "epoch": 4996} {"train_loss": -26.748559951782227, "global_step": 414705, "epoch": 4996} {"train_loss": -26.80177116394043, "global_step": 414706, "epoch": 4996} {"train_loss": -27.183551788330078, "global_step": 414707, "epoch": 4996} {"train_loss": -26.69069480895996, "global_step": 414708, "epoch": 4996} {"train_loss": -27.013641357421875, "global_step": 414709, "epoch": 4996} {"train_loss": -27.140222549438477, "global_step": 414710, "epoch": 4996} {"train_loss": -27.07294273376465, "global_step": 414711, "epoch": 4996} {"train_loss": -26.551074981689453, "global_step": 414712, "epoch": 4996} {"train_loss": -26.773481369018555, "global_step": 414713, "epoch": 4996} {"train_loss": -26.542844772338867, "global_step": 414714, "epoch": 4996} {"train_loss": -26.441207885742188, "global_step": 414715, "epoch": 4996} {"train_loss": -26.883392333984375, "global_step": 414716, "epoch": 4996} {"train_loss": -27.400989532470703, "global_step": 414717, "epoch": 4996} {"train_loss": -27.032255172729492, "global_step": 414718, "epoch": 4996} {"train_loss": -26.584918975830078, "global_step": 414719, "epoch": 4996} {"train_loss": -26.64129638671875, "global_step": 414720, "epoch": 4996} {"train_loss": -26.903778076171875, "global_step": 414721, "epoch": 4996} {"train_loss": -26.533710479736328, "global_step": 414722, "epoch": 4996} {"train_loss": -26.349231719970703, "global_step": 414723, "epoch": 4996} {"train_loss": -26.665267944335938, "global_step": 414724, "epoch": 4996} {"train_loss": -26.77192497253418, "global_step": 414725, "epoch": 4996} {"train_loss": -26.18442153930664, "global_step": 414726, "epoch": 4996} {"train_loss": -26.779464721679688, "global_step": 414727, "epoch": 4996} {"train_loss": -26.9249210357666, "global_step": 414728, "epoch": 4996} {"train_loss": -26.602888107299805, "global_step": 414729, "epoch": 4996} {"train_loss": -26.53240394592285, "global_step": 414730, "epoch": 4996} {"train_loss": -26.352039337158203, "global_step": 414731, "epoch": 4996} {"train_loss": -27.036813735961914, "global_step": 414732, "epoch": 4996} {"train_loss": -26.676603317260742, "global_step": 414733, "epoch": 4996} {"train_loss": -26.59512710571289, "global_step": 414734, "epoch": 4996} {"train_loss": -26.637479782104492, "global_step": 414735, "epoch": 4996} {"train_loss": -26.635589599609375, "global_step": 414736, "epoch": 4996} {"train_loss": -26.82110023498535, "global_step": 414737, "epoch": 4996} {"train_loss": -26.49725914001465, "global_step": 414738, "epoch": 4996} {"train_loss": -26.268970489501953, "global_step": 414739, "epoch": 4996} {"train_loss": -26.567584991455078, "global_step": 414740, "epoch": 4996} {"train_loss": -26.842334747314453, "global_step": 414741, "epoch": 4996} {"train_loss": -26.63276481628418, "global_step": 414742, "epoch": 4996} {"train_loss": -26.688507080078125, "global_step": 414743, "epoch": 4996} {"train_loss": -26.4666690826416, "global_step": 414744, "epoch": 4996} {"train_loss": -26.897314071655273, "global_step": 414745, "epoch": 4996} {"train_loss": -26.658466339111328, "global_step": 414746, "epoch": 4996} {"train_loss": -26.702625274658203, "global_step": 414747, "epoch": 4996} {"train_loss": -26.861181259155273, "global_step": 414748, "epoch": 4996} {"train_loss": -26.570159912109375, "global_step": 414749, "epoch": 4996} {"train_loss": -26.614484557186266, "global_step": 414750, "epoch": 4996, "val_loss": 6513517.0} {"train_loss": -25.7375545501709, "global_step": 414751, "epoch": 4997} {"train_loss": -25.906766891479492, "global_step": 414752, "epoch": 4997} {"train_loss": -26.17725944519043, "global_step": 414753, "epoch": 4997} {"train_loss": -26.036834716796875, "global_step": 414754, "epoch": 4997} {"train_loss": -26.377033233642578, "global_step": 414755, "epoch": 4997} {"train_loss": -26.2565860748291, "global_step": 414756, "epoch": 4997} {"train_loss": -26.04608154296875, "global_step": 414757, "epoch": 4997} {"train_loss": -26.266454696655273, "global_step": 414758, "epoch": 4997} {"train_loss": -26.041828155517578, "global_step": 414759, "epoch": 4997} {"train_loss": -26.473608016967773, "global_step": 414760, "epoch": 4997} {"train_loss": -25.95538330078125, "global_step": 414761, "epoch": 4997} {"train_loss": -26.409204483032227, "global_step": 414762, "epoch": 4997} {"train_loss": -26.260400772094727, "global_step": 414763, "epoch": 4997} {"train_loss": -26.531396865844727, "global_step": 414764, "epoch": 4997} {"train_loss": -26.279626846313477, "global_step": 414765, "epoch": 4997} {"train_loss": -26.4107723236084, "global_step": 414766, "epoch": 4997} {"train_loss": -26.458051681518555, "global_step": 414767, "epoch": 4997} {"train_loss": -26.389387130737305, "global_step": 414768, "epoch": 4997} {"train_loss": -26.566730499267578, "global_step": 414769, "epoch": 4997} {"train_loss": -26.780170440673828, "global_step": 414770, "epoch": 4997} {"train_loss": -26.744840621948242, "global_step": 414771, "epoch": 4997} {"train_loss": -26.71908950805664, "global_step": 414772, "epoch": 4997} {"train_loss": -26.378332138061523, "global_step": 414773, "epoch": 4997} {"train_loss": -26.315475463867188, "global_step": 414774, "epoch": 4997} {"train_loss": -26.938440322875977, "global_step": 414775, "epoch": 4997} {"train_loss": -26.676013946533203, "global_step": 414776, "epoch": 4997} {"train_loss": -26.76771354675293, "global_step": 414777, "epoch": 4997} {"train_loss": -26.87996482849121, "global_step": 414778, "epoch": 4997} {"train_loss": -26.638935089111328, "global_step": 414779, "epoch": 4997} {"train_loss": -26.677932739257812, "global_step": 414780, "epoch": 4997} {"train_loss": -26.801427841186523, "global_step": 414781, "epoch": 4997} {"train_loss": -26.629270553588867, "global_step": 414782, "epoch": 4997} {"train_loss": -26.741666793823242, "global_step": 414783, "epoch": 4997} {"train_loss": -26.728271484375, "global_step": 414784, "epoch": 4997} {"train_loss": -26.37874412536621, "global_step": 414785, "epoch": 4997} {"train_loss": -26.452438354492188, "global_step": 414786, "epoch": 4997} {"train_loss": -26.84315299987793, "global_step": 414787, "epoch": 4997} {"train_loss": -26.0459041595459, "global_step": 414788, "epoch": 4997} {"train_loss": -26.56930923461914, "global_step": 414789, "epoch": 4997} {"train_loss": -26.9121150970459, "global_step": 414790, "epoch": 4997} {"train_loss": -27.038833618164062, "global_step": 414791, "epoch": 4997} {"train_loss": -26.752613067626953, "global_step": 414792, "epoch": 4997} {"train_loss": -27.222736358642578, "global_step": 414793, "epoch": 4997} {"train_loss": -26.919891357421875, "global_step": 414794, "epoch": 4997} {"train_loss": -27.033554077148438, "global_step": 414795, "epoch": 4997} {"train_loss": -26.693830490112305, "global_step": 414796, "epoch": 4997} {"train_loss": -26.419275283813477, "global_step": 414797, "epoch": 4997} {"train_loss": -26.890737533569336, "global_step": 414798, "epoch": 4997} {"train_loss": -26.525177001953125, "global_step": 414799, "epoch": 4997} {"train_loss": -26.902917861938477, "global_step": 414800, "epoch": 4997} {"train_loss": -26.628692626953125, "global_step": 414801, "epoch": 4997} {"train_loss": -26.444660186767578, "global_step": 414802, "epoch": 4997} {"train_loss": -27.038049697875977, "global_step": 414803, "epoch": 4997} {"train_loss": -26.935911178588867, "global_step": 414804, "epoch": 4997} {"train_loss": -26.781980514526367, "global_step": 414805, "epoch": 4997} {"train_loss": -26.565841674804688, "global_step": 414806, "epoch": 4997} {"train_loss": -26.901586532592773, "global_step": 414807, "epoch": 4997} {"train_loss": -26.812524795532227, "global_step": 414808, "epoch": 4997} {"train_loss": -27.0157470703125, "global_step": 414809, "epoch": 4997} {"train_loss": -26.5740966796875, "global_step": 414810, "epoch": 4997} {"train_loss": -26.96845817565918, "global_step": 414811, "epoch": 4997} {"train_loss": -26.785730361938477, "global_step": 414812, "epoch": 4997} {"train_loss": -26.468175888061523, "global_step": 414813, "epoch": 4997} {"train_loss": -27.12775993347168, "global_step": 414814, "epoch": 4997} {"train_loss": -26.58054542541504, "global_step": 414815, "epoch": 4997} {"train_loss": -26.810928344726562, "global_step": 414816, "epoch": 4997} {"train_loss": -26.819793701171875, "global_step": 414817, "epoch": 4997} {"train_loss": -27.135732650756836, "global_step": 414818, "epoch": 4997} {"train_loss": -26.69683837890625, "global_step": 414819, "epoch": 4997} {"train_loss": -26.7738094329834, "global_step": 414820, "epoch": 4997} {"train_loss": -26.830472946166992, "global_step": 414821, "epoch": 4997} {"train_loss": -26.62800407409668, "global_step": 414822, "epoch": 4997} {"train_loss": -26.966461181640625, "global_step": 414823, "epoch": 4997} {"train_loss": -27.064044952392578, "global_step": 414824, "epoch": 4997} {"train_loss": -26.947301864624023, "global_step": 414825, "epoch": 4997} {"train_loss": -26.883710861206055, "global_step": 414826, "epoch": 4997} {"train_loss": -27.037057876586914, "global_step": 414827, "epoch": 4997} {"train_loss": -26.75028419494629, "global_step": 414828, "epoch": 4997} {"train_loss": -27.2332706451416, "global_step": 414829, "epoch": 4997} {"train_loss": -27.27374267578125, "global_step": 414830, "epoch": 4997} {"train_loss": -26.691421508789062, "global_step": 414831, "epoch": 4997} {"train_loss": -26.468612670898438, "global_step": 414832, "epoch": 4997} {"train_loss": -26.662283518228186, "global_step": 414833, "epoch": 4997, "val_loss": 6473007.5} {"train_loss": -26.080541610717773, "global_step": 414834, "epoch": 4998} {"train_loss": -25.696521759033203, "global_step": 414835, "epoch": 4998} {"train_loss": -25.714269638061523, "global_step": 414836, "epoch": 4998} {"train_loss": -25.491392135620117, "global_step": 414837, "epoch": 4998} {"train_loss": -25.380918502807617, "global_step": 414838, "epoch": 4998} {"train_loss": -25.868701934814453, "global_step": 414839, "epoch": 4998} {"train_loss": -25.85373878479004, "global_step": 414840, "epoch": 4998} {"train_loss": -25.862070083618164, "global_step": 414841, "epoch": 4998} {"train_loss": -26.252838134765625, "global_step": 414842, "epoch": 4998} {"train_loss": -26.292694091796875, "global_step": 414843, "epoch": 4998} {"train_loss": -26.400238037109375, "global_step": 414844, "epoch": 4998} {"train_loss": -25.961475372314453, "global_step": 414845, "epoch": 4998} {"train_loss": -26.270132064819336, "global_step": 414846, "epoch": 4998} {"train_loss": -26.467029571533203, "global_step": 414847, "epoch": 4998} {"train_loss": -26.68512535095215, "global_step": 414848, "epoch": 4998} {"train_loss": -26.797348022460938, "global_step": 414849, "epoch": 4998} {"train_loss": -26.157928466796875, "global_step": 414850, "epoch": 4998} {"train_loss": -26.352590560913086, "global_step": 414851, "epoch": 4998} {"train_loss": -26.362741470336914, "global_step": 414852, "epoch": 4998} {"train_loss": -26.65467643737793, "global_step": 414853, "epoch": 4998} {"train_loss": -26.557483673095703, "global_step": 414854, "epoch": 4998} {"train_loss": -26.785465240478516, "global_step": 414855, "epoch": 4998} {"train_loss": -26.382877349853516, "global_step": 414856, "epoch": 4998} {"train_loss": -26.467666625976562, "global_step": 414857, "epoch": 4998} {"train_loss": -26.309717178344727, "global_step": 414858, "epoch": 4998} {"train_loss": -26.713489532470703, "global_step": 414859, "epoch": 4998} {"train_loss": -26.645349502563477, "global_step": 414860, "epoch": 4998} {"train_loss": -26.72039794921875, "global_step": 414861, "epoch": 4998} {"train_loss": -26.84992790222168, "global_step": 414862, "epoch": 4998} {"train_loss": -26.541173934936523, "global_step": 414863, "epoch": 4998} {"train_loss": -26.780195236206055, "global_step": 414864, "epoch": 4998} {"train_loss": -26.89569091796875, "global_step": 414865, "epoch": 4998} {"train_loss": -26.772674560546875, "global_step": 414866, "epoch": 4998} {"train_loss": -26.790237426757812, "global_step": 414867, "epoch": 4998} {"train_loss": -26.92486572265625, "global_step": 414868, "epoch": 4998} {"train_loss": -26.992212295532227, "global_step": 414869, "epoch": 4998} {"train_loss": -27.244892120361328, "global_step": 414870, "epoch": 4998} {"train_loss": -26.79877281188965, "global_step": 414871, "epoch": 4998} {"train_loss": -26.91265296936035, "global_step": 414872, "epoch": 4998} {"train_loss": -26.808401107788086, "global_step": 414873, "epoch": 4998} {"train_loss": -26.76045799255371, "global_step": 414874, "epoch": 4998} {"train_loss": -27.014066696166992, "global_step": 414875, "epoch": 4998} {"train_loss": -26.961729049682617, "global_step": 414876, "epoch": 4998} {"train_loss": -26.899641036987305, "global_step": 414877, "epoch": 4998} {"train_loss": -27.106611251831055, "global_step": 414878, "epoch": 4998} {"train_loss": -26.874338150024414, "global_step": 414879, "epoch": 4998} {"train_loss": -26.83473014831543, "global_step": 414880, "epoch": 4998} {"train_loss": -27.077234268188477, "global_step": 414881, "epoch": 4998} {"train_loss": -26.79566764831543, "global_step": 414882, "epoch": 4998} {"train_loss": -26.866397857666016, "global_step": 414883, "epoch": 4998} {"train_loss": -26.633420944213867, "global_step": 414884, "epoch": 4998} {"train_loss": -26.82377052307129, "global_step": 414885, "epoch": 4998} {"train_loss": -26.587390899658203, "global_step": 414886, "epoch": 4998} {"train_loss": -26.646652221679688, "global_step": 414887, "epoch": 4998} {"train_loss": -26.677331924438477, "global_step": 414888, "epoch": 4998} {"train_loss": -27.09320068359375, "global_step": 414889, "epoch": 4998} {"train_loss": -26.927526473999023, "global_step": 414890, "epoch": 4998} {"train_loss": -26.741241455078125, "global_step": 414891, "epoch": 4998} {"train_loss": -26.7470645904541, "global_step": 414892, "epoch": 4998} {"train_loss": -26.321517944335938, "global_step": 414893, "epoch": 4998} {"train_loss": -26.4393367767334, "global_step": 414894, "epoch": 4998} {"train_loss": -26.74976921081543, "global_step": 414895, "epoch": 4998} {"train_loss": -26.758359909057617, "global_step": 414896, "epoch": 4998} {"train_loss": -27.066152572631836, "global_step": 414897, "epoch": 4998} {"train_loss": -26.9537410736084, "global_step": 414898, "epoch": 4998} {"train_loss": -26.705915451049805, "global_step": 414899, "epoch": 4998} {"train_loss": -26.7930850982666, "global_step": 414900, "epoch": 4998} {"train_loss": -26.960477828979492, "global_step": 414901, "epoch": 4998} {"train_loss": -27.022916793823242, "global_step": 414902, "epoch": 4998} {"train_loss": -27.289350509643555, "global_step": 414903, "epoch": 4998} {"train_loss": -27.044330596923828, "global_step": 414904, "epoch": 4998} {"train_loss": -26.994129180908203, "global_step": 414905, "epoch": 4998} {"train_loss": -26.890066146850586, "global_step": 414906, "epoch": 4998} {"train_loss": -26.71278190612793, "global_step": 414907, "epoch": 4998} {"train_loss": -26.835920333862305, "global_step": 414908, "epoch": 4998} {"train_loss": -26.575916290283203, "global_step": 414909, "epoch": 4998} {"train_loss": -26.6511173248291, "global_step": 414910, "epoch": 4998} {"train_loss": -26.619211196899414, "global_step": 414911, "epoch": 4998} {"train_loss": -26.916601181030273, "global_step": 414912, "epoch": 4998} {"train_loss": -27.194110870361328, "global_step": 414913, "epoch": 4998} {"train_loss": -26.778583526611328, "global_step": 414914, "epoch": 4998} {"train_loss": -26.35943031311035, "global_step": 414915, "epoch": 4998} {"train_loss": -26.626457650977446, "global_step": 414916, "epoch": 4998, "val_loss": 6518126.0} {"train_loss": -25.83009147644043, "global_step": 414917, "epoch": 4999} {"train_loss": -24.153278350830078, "global_step": 414918, "epoch": 4999} {"train_loss": -24.620365142822266, "global_step": 414919, "epoch": 4999} {"train_loss": -24.536239624023438, "global_step": 414920, "epoch": 4999} {"train_loss": -25.284879684448242, "global_step": 414921, "epoch": 4999} {"train_loss": -25.068357467651367, "global_step": 414922, "epoch": 4999} {"train_loss": -25.514720916748047, "global_step": 414923, "epoch": 4999} {"train_loss": -25.67911148071289, "global_step": 414924, "epoch": 4999} {"train_loss": -24.9974308013916, "global_step": 414925, "epoch": 4999} {"train_loss": -26.07208824157715, "global_step": 414926, "epoch": 4999} {"train_loss": -25.744291305541992, "global_step": 414927, "epoch": 4999} {"train_loss": -25.221263885498047, "global_step": 414928, "epoch": 4999} {"train_loss": -25.934019088745117, "global_step": 414929, "epoch": 4999} {"train_loss": -26.196338653564453, "global_step": 414930, "epoch": 4999} {"train_loss": -25.80608558654785, "global_step": 414931, "epoch": 4999} {"train_loss": -26.61551856994629, "global_step": 414932, "epoch": 4999} {"train_loss": -25.89655876159668, "global_step": 414933, "epoch": 4999} {"train_loss": -26.25202751159668, "global_step": 414934, "epoch": 4999} {"train_loss": -26.20004653930664, "global_step": 414935, "epoch": 4999} {"train_loss": -25.9864559173584, "global_step": 414936, "epoch": 4999} {"train_loss": -26.218311309814453, "global_step": 414937, "epoch": 4999} {"train_loss": -26.55232048034668, "global_step": 414938, "epoch": 4999} {"train_loss": -26.345251083374023, "global_step": 414939, "epoch": 4999} {"train_loss": -26.29007339477539, "global_step": 414940, "epoch": 4999} {"train_loss": -26.390579223632812, "global_step": 414941, "epoch": 4999} {"train_loss": -26.16322135925293, "global_step": 414942, "epoch": 4999} {"train_loss": -26.291797637939453, "global_step": 414943, "epoch": 4999} {"train_loss": -26.333887100219727, "global_step": 414944, "epoch": 4999} {"train_loss": -26.49427604675293, "global_step": 414945, "epoch": 4999} {"train_loss": -26.406187057495117, "global_step": 414946, "epoch": 4999} {"train_loss": -26.533313751220703, "global_step": 414947, "epoch": 4999} {"train_loss": -26.103897094726562, "global_step": 414948, "epoch": 4999} {"train_loss": -26.332687377929688, "global_step": 414949, "epoch": 4999} {"train_loss": -26.815322875976562, "global_step": 414950, "epoch": 4999} {"train_loss": -26.392927169799805, "global_step": 414951, "epoch": 4999} {"train_loss": -26.53228759765625, "global_step": 414952, "epoch": 4999} {"train_loss": -26.339941024780273, "global_step": 414953, "epoch": 4999} {"train_loss": -26.23712730407715, "global_step": 414954, "epoch": 4999} {"train_loss": -26.586750030517578, "global_step": 414955, "epoch": 4999} {"train_loss": -26.473468780517578, "global_step": 414956, "epoch": 4999} {"train_loss": -26.271146774291992, "global_step": 414957, "epoch": 4999} {"train_loss": -26.34002113342285, "global_step": 414958, "epoch": 4999} {"train_loss": -26.464710235595703, "global_step": 414959, "epoch": 4999} {"train_loss": -26.209531784057617, "global_step": 414960, "epoch": 4999} {"train_loss": -26.478107452392578, "global_step": 414961, "epoch": 4999} {"train_loss": -26.46904945373535, "global_step": 414962, "epoch": 4999} {"train_loss": -26.792646408081055, "global_step": 414963, "epoch": 4999} {"train_loss": -26.351459503173828, "global_step": 414964, "epoch": 4999} {"train_loss": -26.689992904663086, "global_step": 414965, "epoch": 4999} {"train_loss": -26.634902954101562, "global_step": 414966, "epoch": 4999} {"train_loss": -26.656951904296875, "global_step": 414967, "epoch": 4999} {"train_loss": -26.835742950439453, "global_step": 414968, "epoch": 4999} {"train_loss": -26.761587142944336, "global_step": 414969, "epoch": 4999} {"train_loss": -26.744998931884766, "global_step": 414970, "epoch": 4999} {"train_loss": -26.635969161987305, "global_step": 414971, "epoch": 4999} {"train_loss": -26.68842124938965, "global_step": 414972, "epoch": 4999} {"train_loss": -26.979705810546875, "global_step": 414973, "epoch": 4999} {"train_loss": -26.82889175415039, "global_step": 414974, "epoch": 4999} {"train_loss": -26.636688232421875, "global_step": 414975, "epoch": 4999} {"train_loss": -26.818649291992188, "global_step": 414976, "epoch": 4999} {"train_loss": -26.95721435546875, "global_step": 414977, "epoch": 4999} {"train_loss": -26.7971248626709, "global_step": 414978, "epoch": 4999} {"train_loss": -26.5747013092041, "global_step": 414979, "epoch": 4999} {"train_loss": -27.197681427001953, "global_step": 414980, "epoch": 4999} {"train_loss": -27.0235652923584, "global_step": 414981, "epoch": 4999} {"train_loss": -26.741382598876953, "global_step": 414982, "epoch": 4999} {"train_loss": -27.187971115112305, "global_step": 414983, "epoch": 4999} {"train_loss": -27.327051162719727, "global_step": 414984, "epoch": 4999} {"train_loss": -26.75716209411621, "global_step": 414985, "epoch": 4999} {"train_loss": -26.740869522094727, "global_step": 414986, "epoch": 4999} {"train_loss": -26.593399047851562, "global_step": 414987, "epoch": 4999} {"train_loss": -26.973102569580078, "global_step": 414988, "epoch": 4999} {"train_loss": -26.693918228149414, "global_step": 414989, "epoch": 4999} {"train_loss": -26.549097061157227, "global_step": 414990, "epoch": 4999} {"train_loss": -26.92853355407715, "global_step": 414991, "epoch": 4999} {"train_loss": -27.190998077392578, "global_step": 414992, "epoch": 4999} {"train_loss": -26.560575485229492, "global_step": 414993, "epoch": 4999} {"train_loss": -26.76611328125, "global_step": 414994, "epoch": 4999} {"train_loss": -26.734683990478516, "global_step": 414995, "epoch": 4999} {"train_loss": -27.017728805541992, "global_step": 414996, "epoch": 4999} {"train_loss": -27.048192977905273, "global_step": 414997, "epoch": 4999} {"train_loss": -26.80364990234375, "global_step": 414998, "epoch": 4999} {"train_loss": -26.381589889526367, "global_step": 414999, "epoch": 4999, "val_loss": 6481289.0} {"train_loss": -25.48099136352539, "global_step": 415000, "epoch": 5000} {"train_loss": -25.228805541992188, "global_step": 415001, "epoch": 5000} {"train_loss": -25.67087745666504, "global_step": 415002, "epoch": 5000} {"train_loss": -25.825942993164062, "global_step": 415003, "epoch": 5000} {"train_loss": -25.29926872253418, "global_step": 415004, "epoch": 5000} {"train_loss": -26.443695068359375, "global_step": 415005, "epoch": 5000} {"train_loss": -26.125720977783203, "global_step": 415006, "epoch": 5000} {"train_loss": -26.00587272644043, "global_step": 415007, "epoch": 5000} {"train_loss": -25.9909610748291, "global_step": 415008, "epoch": 5000} {"train_loss": -26.09014892578125, "global_step": 415009, "epoch": 5000} {"train_loss": -26.25544548034668, "global_step": 415010, "epoch": 5000} {"train_loss": -26.169431686401367, "global_step": 415011, "epoch": 5000} {"train_loss": -26.13825035095215, "global_step": 415012, "epoch": 5000} {"train_loss": -26.375165939331055, "global_step": 415013, "epoch": 5000} {"train_loss": -26.858505249023438, "global_step": 415014, "epoch": 5000} {"train_loss": -26.15069007873535, "global_step": 415015, "epoch": 5000} {"train_loss": -26.436325073242188, "global_step": 415016, "epoch": 5000} {"train_loss": -26.446523666381836, "global_step": 415017, "epoch": 5000} {"train_loss": -26.32059097290039, "global_step": 415018, "epoch": 5000} {"train_loss": -26.522436141967773, "global_step": 415019, "epoch": 5000} {"train_loss": -26.3644962310791, "global_step": 415020, "epoch": 5000} {"train_loss": -26.361968994140625, "global_step": 415021, "epoch": 5000} {"train_loss": -26.710865020751953, "global_step": 415022, "epoch": 5000} {"train_loss": -26.67377281188965, "global_step": 415023, "epoch": 5000} {"train_loss": -26.45256996154785, "global_step": 415024, "epoch": 5000} {"train_loss": -26.310327529907227, "global_step": 415025, "epoch": 5000} {"train_loss": -26.76517105102539, "global_step": 415026, "epoch": 5000} {"train_loss": -26.597665786743164, "global_step": 415027, "epoch": 5000} {"train_loss": -26.731353759765625, "global_step": 415028, "epoch": 5000} {"train_loss": -26.549274444580078, "global_step": 415029, "epoch": 5000} {"train_loss": -26.635778427124023, "global_step": 415030, "epoch": 5000} {"train_loss": -26.927112579345703, "global_step": 415031, "epoch": 5000} {"train_loss": -26.808523178100586, "global_step": 415032, "epoch": 5000} {"train_loss": -26.38750648498535, "global_step": 415033, "epoch": 5000} {"train_loss": -26.50381851196289, "global_step": 415034, "epoch": 5000} {"train_loss": -26.838825225830078, "global_step": 415035, "epoch": 5000} {"train_loss": -26.951940536499023, "global_step": 415036, "epoch": 5000} {"train_loss": -26.69868278503418, "global_step": 415037, "epoch": 5000} {"train_loss": -26.692153930664062, "global_step": 415038, "epoch": 5000} {"train_loss": -27.177169799804688, "global_step": 415039, "epoch": 5000} {"train_loss": -26.93701171875, "global_step": 415040, "epoch": 5000} {"train_loss": -26.886505126953125, "global_step": 415041, "epoch": 5000} {"train_loss": -26.77243423461914, "global_step": 415042, "epoch": 5000} {"train_loss": -26.724323272705078, "global_step": 415043, "epoch": 5000} {"train_loss": -27.01901626586914, "global_step": 415044, "epoch": 5000} {"train_loss": -26.85642433166504, "global_step": 415045, "epoch": 5000} {"train_loss": -26.772993087768555, "global_step": 415046, "epoch": 5000} {"train_loss": -26.9034423828125, "global_step": 415047, "epoch": 5000} {"train_loss": -26.619464874267578, "global_step": 415048, "epoch": 5000} {"train_loss": -26.654027938842773, "global_step": 415049, "epoch": 5000} {"train_loss": -27.272207260131836, "global_step": 415050, "epoch": 5000} {"train_loss": -26.783105850219727, "global_step": 415051, "epoch": 5000} {"train_loss": -26.806812286376953, "global_step": 415052, "epoch": 5000} {"train_loss": -26.73467445373535, "global_step": 415053, "epoch": 5000} {"train_loss": -26.660558700561523, "global_step": 415054, "epoch": 5000} {"train_loss": -26.261260986328125, "global_step": 415055, "epoch": 5000} {"train_loss": -26.796789169311523, "global_step": 415056, "epoch": 5000} {"train_loss": -26.66924476623535, "global_step": 415057, "epoch": 5000} {"train_loss": -26.499807357788086, "global_step": 415058, "epoch": 5000} {"train_loss": -26.48357582092285, "global_step": 415059, "epoch": 5000} {"train_loss": -26.65764808654785, "global_step": 415060, "epoch": 5000} {"train_loss": -26.800058364868164, "global_step": 415061, "epoch": 5000} {"train_loss": -26.681020736694336, "global_step": 415062, "epoch": 5000} {"train_loss": -26.877470016479492, "global_step": 415063, "epoch": 5000} {"train_loss": -27.157577514648438, "global_step": 415064, "epoch": 5000} {"train_loss": -26.77789306640625, "global_step": 415065, "epoch": 5000} {"train_loss": -26.64858055114746, "global_step": 415066, "epoch": 5000} {"train_loss": -26.74749183654785, "global_step": 415067, "epoch": 5000} {"train_loss": -26.662006378173828, "global_step": 415068, "epoch": 5000} {"train_loss": -26.624242782592773, "global_step": 415069, "epoch": 5000} {"train_loss": -27.2548770904541, "global_step": 415070, "epoch": 5000} {"train_loss": -26.6755313873291, "global_step": 415071, "epoch": 5000} {"train_loss": -27.0520076751709, "global_step": 415072, "epoch": 5000} {"train_loss": -26.778024673461914, "global_step": 415073, "epoch": 5000} {"train_loss": -27.100299835205078, "global_step": 415074, "epoch": 5000} {"train_loss": -26.690725326538086, "global_step": 415075, "epoch": 5000} {"train_loss": -26.803180694580078, "global_step": 415076, "epoch": 5000} {"train_loss": -26.707111358642578, "global_step": 415077, "epoch": 5000} {"train_loss": -26.712020874023438, "global_step": 415078, "epoch": 5000} {"train_loss": -26.898767471313477, "global_step": 415079, "epoch": 5000} {"train_loss": -26.671308517456055, "global_step": 415080, "epoch": 5000} {"train_loss": -26.72307777404785, "global_step": 415081, "epoch": 5000} {"train_loss": -26.59512894412121, "global_step": 415082, "epoch": 5000, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6491888.0} {"train_loss": -25.72002601623535, "global_step": 415083, "epoch": 5001} {"train_loss": -25.43475341796875, "global_step": 415084, "epoch": 5001} {"train_loss": -25.404279708862305, "global_step": 415085, "epoch": 5001} {"train_loss": -25.99977684020996, "global_step": 415086, "epoch": 5001} {"train_loss": -26.211217880249023, "global_step": 415087, "epoch": 5001} {"train_loss": -26.138769149780273, "global_step": 415088, "epoch": 5001} {"train_loss": -26.23479652404785, "global_step": 415089, "epoch": 5001} {"train_loss": -26.15707778930664, "global_step": 415090, "epoch": 5001} {"train_loss": -26.071359634399414, "global_step": 415091, "epoch": 5001} {"train_loss": -26.432889938354492, "global_step": 415092, "epoch": 5001} {"train_loss": -26.036060333251953, "global_step": 415093, "epoch": 5001} {"train_loss": -26.404870986938477, "global_step": 415094, "epoch": 5001} {"train_loss": -26.349515914916992, "global_step": 415095, "epoch": 5001} {"train_loss": -26.443204879760742, "global_step": 415096, "epoch": 5001} {"train_loss": -25.95254898071289, "global_step": 415097, "epoch": 5001} {"train_loss": -26.70588493347168, "global_step": 415098, "epoch": 5001} {"train_loss": -26.15936279296875, "global_step": 415099, "epoch": 5001} {"train_loss": -26.667221069335938, "global_step": 415100, "epoch": 5001} {"train_loss": -26.68499755859375, "global_step": 415101, "epoch": 5001} {"train_loss": -26.570953369140625, "global_step": 415102, "epoch": 5001} {"train_loss": -26.56831169128418, "global_step": 415103, "epoch": 5001} {"train_loss": -26.442386627197266, "global_step": 415104, "epoch": 5001} {"train_loss": -26.49323844909668, "global_step": 415105, "epoch": 5001} {"train_loss": -26.67824363708496, "global_step": 415106, "epoch": 5001} {"train_loss": -26.6192569732666, "global_step": 415107, "epoch": 5001} {"train_loss": -26.53388023376465, "global_step": 415108, "epoch": 5001} {"train_loss": -26.784082412719727, "global_step": 415109, "epoch": 5001} {"train_loss": -26.509235382080078, "global_step": 415110, "epoch": 5001} {"train_loss": -26.386281967163086, "global_step": 415111, "epoch": 5001} {"train_loss": -26.830047607421875, "global_step": 415112, "epoch": 5001} {"train_loss": -26.97383689880371, "global_step": 415113, "epoch": 5001} {"train_loss": -26.661035537719727, "global_step": 415114, "epoch": 5001} {"train_loss": -26.457075119018555, "global_step": 415115, "epoch": 5001} {"train_loss": -26.56839370727539, "global_step": 415116, "epoch": 5001} {"train_loss": -26.95224952697754, "global_step": 415117, "epoch": 5001} {"train_loss": -26.636127471923828, "global_step": 415118, "epoch": 5001} {"train_loss": -26.902997970581055, "global_step": 415119, "epoch": 5001} {"train_loss": -26.8676700592041, "global_step": 415120, "epoch": 5001} {"train_loss": -26.808095932006836, "global_step": 415121, "epoch": 5001} {"train_loss": -26.696081161499023, "global_step": 415122, "epoch": 5001} {"train_loss": -26.817358016967773, "global_step": 415123, "epoch": 5001} {"train_loss": -27.24104881286621, "global_step": 415124, "epoch": 5001} {"train_loss": -26.85321617126465, "global_step": 415125, "epoch": 5001} {"train_loss": -26.501239776611328, "global_step": 415126, "epoch": 5001} {"train_loss": -26.6888427734375, "global_step": 415127, "epoch": 5001} {"train_loss": -26.812881469726562, "global_step": 415128, "epoch": 5001} {"train_loss": -26.7568416595459, "global_step": 415129, "epoch": 5001} {"train_loss": -26.7294864654541, "global_step": 415130, "epoch": 5001} {"train_loss": -26.779340744018555, "global_step": 415131, "epoch": 5001} {"train_loss": -27.071414947509766, "global_step": 415132, "epoch": 5001} {"train_loss": -27.222639083862305, "global_step": 415133, "epoch": 5001} {"train_loss": -26.43427848815918, "global_step": 415134, "epoch": 5001} {"train_loss": -26.744766235351562, "global_step": 415135, "epoch": 5001} {"train_loss": -26.7475643157959, "global_step": 415136, "epoch": 5001} {"train_loss": -26.787534713745117, "global_step": 415137, "epoch": 5001} {"train_loss": -26.687149047851562, "global_step": 415138, "epoch": 5001} {"train_loss": -26.670612335205078, "global_step": 415139, "epoch": 5001} {"train_loss": -26.658771514892578, "global_step": 415140, "epoch": 5001} {"train_loss": -26.808948516845703, "global_step": 415141, "epoch": 5001} {"train_loss": -26.609418869018555, "global_step": 415142, "epoch": 5001} {"train_loss": -26.694629669189453, "global_step": 415143, "epoch": 5001} {"train_loss": -26.561176300048828, "global_step": 415144, "epoch": 5001} {"train_loss": -26.438383102416992, "global_step": 415145, "epoch": 5001} {"train_loss": -26.641504287719727, "global_step": 415146, "epoch": 5001} {"train_loss": -26.425159454345703, "global_step": 415147, "epoch": 5001} {"train_loss": -26.756229400634766, "global_step": 415148, "epoch": 5001} {"train_loss": -26.69675636291504, "global_step": 415149, "epoch": 5001} {"train_loss": -26.800098419189453, "global_step": 415150, "epoch": 5001} {"train_loss": -26.67112159729004, "global_step": 415151, "epoch": 5001} {"train_loss": -26.462583541870117, "global_step": 415152, "epoch": 5001} {"train_loss": -26.70769691467285, "global_step": 415153, "epoch": 5001} {"train_loss": -26.616241455078125, "global_step": 415154, "epoch": 5001} {"train_loss": -26.528837203979492, "global_step": 415155, "epoch": 5001} {"train_loss": -26.94911766052246, "global_step": 415156, "epoch": 5001} {"train_loss": -26.75235939025879, "global_step": 415157, "epoch": 5001} {"train_loss": -26.745878219604492, "global_step": 415158, "epoch": 5001} {"train_loss": -26.707311630249023, "global_step": 415159, "epoch": 5001} {"train_loss": -26.77045249938965, "global_step": 415160, "epoch": 5001} {"train_loss": -26.902685165405273, "global_step": 415161, "epoch": 5001} {"train_loss": -26.925308227539062, "global_step": 415162, "epoch": 5001} {"train_loss": -26.45658302307129, "global_step": 415163, "epoch": 5001} {"train_loss": -27.030187606811523, "global_step": 415164, "epoch": 5001} {"train_loss": -26.596800264105738, "global_step": 415165, "epoch": 5001, "val_loss": 6490687.0} {"train_loss": -26.48923110961914, "global_step": 415166, "epoch": 5002} {"train_loss": -25.39867401123047, "global_step": 415167, "epoch": 5002} {"train_loss": -26.26593589782715, "global_step": 415168, "epoch": 5002} {"train_loss": -26.4428653717041, "global_step": 415169, "epoch": 5002} {"train_loss": -25.439697265625, "global_step": 415170, "epoch": 5002} {"train_loss": -26.16651725769043, "global_step": 415171, "epoch": 5002} {"train_loss": -25.758514404296875, "global_step": 415172, "epoch": 5002} {"train_loss": -26.438404083251953, "global_step": 415173, "epoch": 5002} {"train_loss": -26.111799240112305, "global_step": 415174, "epoch": 5002} {"train_loss": -26.350433349609375, "global_step": 415175, "epoch": 5002} {"train_loss": -26.363012313842773, "global_step": 415176, "epoch": 5002} {"train_loss": -26.73663330078125, "global_step": 415177, "epoch": 5002} {"train_loss": -26.659168243408203, "global_step": 415178, "epoch": 5002} {"train_loss": -26.434051513671875, "global_step": 415179, "epoch": 5002} {"train_loss": -26.170185089111328, "global_step": 415180, "epoch": 5002} {"train_loss": -25.949726104736328, "global_step": 415181, "epoch": 5002} {"train_loss": -26.19202995300293, "global_step": 415182, "epoch": 5002} {"train_loss": -26.570697784423828, "global_step": 415183, "epoch": 5002} {"train_loss": -26.521459579467773, "global_step": 415184, "epoch": 5002} {"train_loss": -26.441797256469727, "global_step": 415185, "epoch": 5002} {"train_loss": -26.287841796875, "global_step": 415186, "epoch": 5002} {"train_loss": -26.58260154724121, "global_step": 415187, "epoch": 5002} {"train_loss": -26.28871726989746, "global_step": 415188, "epoch": 5002} {"train_loss": -26.492639541625977, "global_step": 415189, "epoch": 5002} {"train_loss": -26.309125900268555, "global_step": 415190, "epoch": 5002} {"train_loss": -26.8629150390625, "global_step": 415191, "epoch": 5002} {"train_loss": -26.300006866455078, "global_step": 415192, "epoch": 5002} {"train_loss": -26.630298614501953, "global_step": 415193, "epoch": 5002} {"train_loss": -26.522550582885742, "global_step": 415194, "epoch": 5002} {"train_loss": -26.926965713500977, "global_step": 415195, "epoch": 5002} {"train_loss": -26.610937118530273, "global_step": 415196, "epoch": 5002} {"train_loss": -26.662006378173828, "global_step": 415197, "epoch": 5002} {"train_loss": -26.764570236206055, "global_step": 415198, "epoch": 5002} {"train_loss": -26.656524658203125, "global_step": 415199, "epoch": 5002} {"train_loss": -26.74897575378418, "global_step": 415200, "epoch": 5002} {"train_loss": -26.43486976623535, "global_step": 415201, "epoch": 5002} {"train_loss": -26.37517738342285, "global_step": 415202, "epoch": 5002} {"train_loss": -26.564620971679688, "global_step": 415203, "epoch": 5002} {"train_loss": -26.709014892578125, "global_step": 415204, "epoch": 5002} {"train_loss": -26.904220581054688, "global_step": 415205, "epoch": 5002} {"train_loss": -26.8421630859375, "global_step": 415206, "epoch": 5002} {"train_loss": -26.58827781677246, "global_step": 415207, "epoch": 5002} {"train_loss": -26.569799423217773, "global_step": 415208, "epoch": 5002} {"train_loss": -26.962631225585938, "global_step": 415209, "epoch": 5002} {"train_loss": -27.109968185424805, "global_step": 415210, "epoch": 5002} {"train_loss": -26.82257652282715, "global_step": 415211, "epoch": 5002} {"train_loss": -26.752582550048828, "global_step": 415212, "epoch": 5002} {"train_loss": -26.63142967224121, "global_step": 415213, "epoch": 5002} {"train_loss": -26.87287712097168, "global_step": 415214, "epoch": 5002} {"train_loss": -26.867389678955078, "global_step": 415215, "epoch": 5002} {"train_loss": -26.90180015563965, "global_step": 415216, "epoch": 5002} {"train_loss": -27.11936378479004, "global_step": 415217, "epoch": 5002} {"train_loss": -26.82771110534668, "global_step": 415218, "epoch": 5002} {"train_loss": -27.250579833984375, "global_step": 415219, "epoch": 5002} {"train_loss": -26.744043350219727, "global_step": 415220, "epoch": 5002} {"train_loss": -27.449493408203125, "global_step": 415221, "epoch": 5002} {"train_loss": -26.955488204956055, "global_step": 415222, "epoch": 5002} {"train_loss": -26.510986328125, "global_step": 415223, "epoch": 5002} {"train_loss": -26.643396377563477, "global_step": 415224, "epoch": 5002} {"train_loss": -26.771728515625, "global_step": 415225, "epoch": 5002} {"train_loss": -26.799549102783203, "global_step": 415226, "epoch": 5002} {"train_loss": -26.577844619750977, "global_step": 415227, "epoch": 5002} {"train_loss": -26.27802085876465, "global_step": 415228, "epoch": 5002} {"train_loss": -26.651208877563477, "global_step": 415229, "epoch": 5002} {"train_loss": -26.6340389251709, "global_step": 415230, "epoch": 5002} {"train_loss": -27.014551162719727, "global_step": 415231, "epoch": 5002} {"train_loss": -26.48565673828125, "global_step": 415232, "epoch": 5002} {"train_loss": -26.661823272705078, "global_step": 415233, "epoch": 5002} {"train_loss": -26.42315673828125, "global_step": 415234, "epoch": 5002} {"train_loss": -26.7749080657959, "global_step": 415235, "epoch": 5002} {"train_loss": -26.66998291015625, "global_step": 415236, "epoch": 5002} {"train_loss": -26.587316513061523, "global_step": 415237, "epoch": 5002} {"train_loss": -26.404651641845703, "global_step": 415238, "epoch": 5002} {"train_loss": -26.492605209350586, "global_step": 415239, "epoch": 5002} {"train_loss": -26.88056755065918, "global_step": 415240, "epoch": 5002} {"train_loss": -26.30952262878418, "global_step": 415241, "epoch": 5002} {"train_loss": -26.77011489868164, "global_step": 415242, "epoch": 5002} {"train_loss": -26.82586097717285, "global_step": 415243, "epoch": 5002} {"train_loss": -26.660375595092773, "global_step": 415244, "epoch": 5002} {"train_loss": -26.805646896362305, "global_step": 415245, "epoch": 5002} {"train_loss": -26.944355010986328, "global_step": 415246, "epoch": 5002} {"train_loss": -26.92901611328125, "global_step": 415247, "epoch": 5002} {"train_loss": -26.58307172016925, "global_step": 415248, "epoch": 5002, "val_loss": 6459306.5} {"train_loss": -26.523954391479492, "global_step": 415249, "epoch": 5003} {"train_loss": -25.731061935424805, "global_step": 415250, "epoch": 5003} {"train_loss": -26.51507568359375, "global_step": 415251, "epoch": 5003} {"train_loss": -26.1751766204834, "global_step": 415252, "epoch": 5003} {"train_loss": -26.387495040893555, "global_step": 415253, "epoch": 5003} {"train_loss": -26.19319725036621, "global_step": 415254, "epoch": 5003} {"train_loss": -26.178543090820312, "global_step": 415255, "epoch": 5003} {"train_loss": -26.482166290283203, "global_step": 415256, "epoch": 5003} {"train_loss": -26.167829513549805, "global_step": 415257, "epoch": 5003} {"train_loss": -26.417203903198242, "global_step": 415258, "epoch": 5003} {"train_loss": -26.143972396850586, "global_step": 415259, "epoch": 5003} {"train_loss": -26.31937599182129, "global_step": 415260, "epoch": 5003} {"train_loss": -26.162137985229492, "global_step": 415261, "epoch": 5003} {"train_loss": -26.42571449279785, "global_step": 415262, "epoch": 5003} {"train_loss": -26.312665939331055, "global_step": 415263, "epoch": 5003} {"train_loss": -26.521337509155273, "global_step": 415264, "epoch": 5003} {"train_loss": -26.52150535583496, "global_step": 415265, "epoch": 5003} {"train_loss": -26.2639217376709, "global_step": 415266, "epoch": 5003} {"train_loss": -26.78754234313965, "global_step": 415267, "epoch": 5003} {"train_loss": -26.4868221282959, "global_step": 415268, "epoch": 5003} {"train_loss": -26.96418571472168, "global_step": 415269, "epoch": 5003} {"train_loss": -26.746442794799805, "global_step": 415270, "epoch": 5003} {"train_loss": -26.5156307220459, "global_step": 415271, "epoch": 5003} {"train_loss": -26.629230499267578, "global_step": 415272, "epoch": 5003} {"train_loss": -26.54766845703125, "global_step": 415273, "epoch": 5003} {"train_loss": -26.60797691345215, "global_step": 415274, "epoch": 5003} {"train_loss": -26.643766403198242, "global_step": 415275, "epoch": 5003} {"train_loss": -26.547842025756836, "global_step": 415276, "epoch": 5003} {"train_loss": -26.82642936706543, "global_step": 415277, "epoch": 5003} {"train_loss": -26.83447265625, "global_step": 415278, "epoch": 5003} {"train_loss": -27.012012481689453, "global_step": 415279, "epoch": 5003} {"train_loss": -26.60249137878418, "global_step": 415280, "epoch": 5003} {"train_loss": -26.967212677001953, "global_step": 415281, "epoch": 5003} {"train_loss": -26.851919174194336, "global_step": 415282, "epoch": 5003} {"train_loss": -26.73603630065918, "global_step": 415283, "epoch": 5003} {"train_loss": -27.249563217163086, "global_step": 415284, "epoch": 5003} {"train_loss": -27.24024772644043, "global_step": 415285, "epoch": 5003} {"train_loss": -26.663373947143555, "global_step": 415286, "epoch": 5003} {"train_loss": -26.8566837310791, "global_step": 415287, "epoch": 5003} {"train_loss": -26.700910568237305, "global_step": 415288, "epoch": 5003} {"train_loss": -26.9613037109375, "global_step": 415289, "epoch": 5003} {"train_loss": -26.939208984375, "global_step": 415290, "epoch": 5003} {"train_loss": -26.691211700439453, "global_step": 415291, "epoch": 5003} {"train_loss": -26.990808486938477, "global_step": 415292, "epoch": 5003} {"train_loss": -26.64252281188965, "global_step": 415293, "epoch": 5003} {"train_loss": -26.53818130493164, "global_step": 415294, "epoch": 5003} {"train_loss": -26.44133949279785, "global_step": 415295, "epoch": 5003} {"train_loss": -26.578022003173828, "global_step": 415296, "epoch": 5003} {"train_loss": -26.63958168029785, "global_step": 415297, "epoch": 5003} {"train_loss": -26.754596710205078, "global_step": 415298, "epoch": 5003} {"train_loss": -26.612592697143555, "global_step": 415299, "epoch": 5003} {"train_loss": -26.505435943603516, "global_step": 415300, "epoch": 5003} {"train_loss": -26.68702507019043, "global_step": 415301, "epoch": 5003} {"train_loss": -26.9045467376709, "global_step": 415302, "epoch": 5003} {"train_loss": -27.117786407470703, "global_step": 415303, "epoch": 5003} {"train_loss": -26.659666061401367, "global_step": 415304, "epoch": 5003} {"train_loss": -26.677000045776367, "global_step": 415305, "epoch": 5003} {"train_loss": -26.358386993408203, "global_step": 415306, "epoch": 5003} {"train_loss": -26.518529891967773, "global_step": 415307, "epoch": 5003} {"train_loss": -26.73335075378418, "global_step": 415308, "epoch": 5003} {"train_loss": -26.8398380279541, "global_step": 415309, "epoch": 5003} {"train_loss": -26.434762954711914, "global_step": 415310, "epoch": 5003} {"train_loss": -26.521692276000977, "global_step": 415311, "epoch": 5003} {"train_loss": -26.899688720703125, "global_step": 415312, "epoch": 5003} {"train_loss": -26.791610717773438, "global_step": 415313, "epoch": 5003} {"train_loss": -26.469228744506836, "global_step": 415314, "epoch": 5003} {"train_loss": -26.5303897857666, "global_step": 415315, "epoch": 5003} {"train_loss": -26.58428382873535, "global_step": 415316, "epoch": 5003} {"train_loss": -27.14064598083496, "global_step": 415317, "epoch": 5003} {"train_loss": -26.77553367614746, "global_step": 415318, "epoch": 5003} {"train_loss": -26.08892822265625, "global_step": 415319, "epoch": 5003} {"train_loss": -26.246826171875, "global_step": 415320, "epoch": 5003} {"train_loss": -26.52131462097168, "global_step": 415321, "epoch": 5003} {"train_loss": -26.463531494140625, "global_step": 415322, "epoch": 5003} {"train_loss": -26.775232315063477, "global_step": 415323, "epoch": 5003} {"train_loss": -26.733503341674805, "global_step": 415324, "epoch": 5003} {"train_loss": -26.862150192260742, "global_step": 415325, "epoch": 5003} {"train_loss": -26.777158737182617, "global_step": 415326, "epoch": 5003} {"train_loss": -26.799758911132812, "global_step": 415327, "epoch": 5003} {"train_loss": -26.68844985961914, "global_step": 415328, "epoch": 5003} {"train_loss": -26.817401885986328, "global_step": 415329, "epoch": 5003} {"train_loss": -26.554113388061523, "global_step": 415330, "epoch": 5003} {"train_loss": -26.62493462160409, "global_step": 415331, "epoch": 5003, "val_loss": 6586263.0} {"train_loss": -26.05280113220215, "global_step": 415332, "epoch": 5004} {"train_loss": -25.82630729675293, "global_step": 415333, "epoch": 5004} {"train_loss": -26.184423446655273, "global_step": 415334, "epoch": 5004} {"train_loss": -25.991357803344727, "global_step": 415335, "epoch": 5004} {"train_loss": -25.69727897644043, "global_step": 415336, "epoch": 5004} {"train_loss": -26.108732223510742, "global_step": 415337, "epoch": 5004} {"train_loss": -26.300092697143555, "global_step": 415338, "epoch": 5004} {"train_loss": -25.517227172851562, "global_step": 415339, "epoch": 5004} {"train_loss": -26.029132843017578, "global_step": 415340, "epoch": 5004} {"train_loss": -26.796979904174805, "global_step": 415341, "epoch": 5004} {"train_loss": -26.176532745361328, "global_step": 415342, "epoch": 5004} {"train_loss": -26.531482696533203, "global_step": 415343, "epoch": 5004} {"train_loss": -26.13306999206543, "global_step": 415344, "epoch": 5004} {"train_loss": -26.245086669921875, "global_step": 415345, "epoch": 5004} {"train_loss": -26.666168212890625, "global_step": 415346, "epoch": 5004} {"train_loss": -26.35735511779785, "global_step": 415347, "epoch": 5004} {"train_loss": -26.341384887695312, "global_step": 415348, "epoch": 5004} {"train_loss": -26.159774780273438, "global_step": 415349, "epoch": 5004} {"train_loss": -26.65931510925293, "global_step": 415350, "epoch": 5004} {"train_loss": -26.484243392944336, "global_step": 415351, "epoch": 5004} {"train_loss": -26.484052658081055, "global_step": 415352, "epoch": 5004} {"train_loss": -26.674808502197266, "global_step": 415353, "epoch": 5004} {"train_loss": -26.397531509399414, "global_step": 415354, "epoch": 5004} {"train_loss": -26.211576461791992, "global_step": 415355, "epoch": 5004} {"train_loss": -26.805944442749023, "global_step": 415356, "epoch": 5004} {"train_loss": -26.31098747253418, "global_step": 415357, "epoch": 5004} {"train_loss": -26.743310928344727, "global_step": 415358, "epoch": 5004} {"train_loss": -26.86121940612793, "global_step": 415359, "epoch": 5004} {"train_loss": -26.498626708984375, "global_step": 415360, "epoch": 5004} {"train_loss": -26.86330223083496, "global_step": 415361, "epoch": 5004} {"train_loss": -26.515466690063477, "global_step": 415362, "epoch": 5004} {"train_loss": -26.44196128845215, "global_step": 415363, "epoch": 5004} {"train_loss": -26.878942489624023, "global_step": 415364, "epoch": 5004} {"train_loss": -26.950286865234375, "global_step": 415365, "epoch": 5004} {"train_loss": -26.76127052307129, "global_step": 415366, "epoch": 5004} {"train_loss": -27.199874877929688, "global_step": 415367, "epoch": 5004} {"train_loss": -27.158966064453125, "global_step": 415368, "epoch": 5004} {"train_loss": -27.27549171447754, "global_step": 415369, "epoch": 5004} {"train_loss": -26.861486434936523, "global_step": 415370, "epoch": 5004} {"train_loss": -27.201770782470703, "global_step": 415371, "epoch": 5004} {"train_loss": -27.080228805541992, "global_step": 415372, "epoch": 5004} {"train_loss": -26.969120025634766, "global_step": 415373, "epoch": 5004} {"train_loss": -26.90803337097168, "global_step": 415374, "epoch": 5004} {"train_loss": -26.6055908203125, "global_step": 415375, "epoch": 5004} {"train_loss": -26.865009307861328, "global_step": 415376, "epoch": 5004} {"train_loss": -26.8571834564209, "global_step": 415377, "epoch": 5004} {"train_loss": -26.737668991088867, "global_step": 415378, "epoch": 5004} {"train_loss": -26.837865829467773, "global_step": 415379, "epoch": 5004} {"train_loss": -27.065418243408203, "global_step": 415380, "epoch": 5004} {"train_loss": -27.026662826538086, "global_step": 415381, "epoch": 5004} {"train_loss": -26.711551666259766, "global_step": 415382, "epoch": 5004} {"train_loss": -26.992101669311523, "global_step": 415383, "epoch": 5004} {"train_loss": -26.765405654907227, "global_step": 415384, "epoch": 5004} {"train_loss": -26.747888565063477, "global_step": 415385, "epoch": 5004} {"train_loss": -27.458093643188477, "global_step": 415386, "epoch": 5004} {"train_loss": -27.065540313720703, "global_step": 415387, "epoch": 5004} {"train_loss": -27.086034774780273, "global_step": 415388, "epoch": 5004} {"train_loss": -27.072158813476562, "global_step": 415389, "epoch": 5004} {"train_loss": -27.032840728759766, "global_step": 415390, "epoch": 5004} {"train_loss": -27.20648765563965, "global_step": 415391, "epoch": 5004} {"train_loss": -26.700010299682617, "global_step": 415392, "epoch": 5004} {"train_loss": -27.273639678955078, "global_step": 415393, "epoch": 5004} {"train_loss": -26.5341796875, "global_step": 415394, "epoch": 5004} {"train_loss": -27.128097534179688, "global_step": 415395, "epoch": 5004} {"train_loss": -26.498559951782227, "global_step": 415396, "epoch": 5004} {"train_loss": -26.77796745300293, "global_step": 415397, "epoch": 5004} {"train_loss": -26.8148193359375, "global_step": 415398, "epoch": 5004} {"train_loss": -26.7990779876709, "global_step": 415399, "epoch": 5004} {"train_loss": -26.58734130859375, "global_step": 415400, "epoch": 5004} {"train_loss": -26.875818252563477, "global_step": 415401, "epoch": 5004} {"train_loss": -26.83930015563965, "global_step": 415402, "epoch": 5004} {"train_loss": -26.65642738342285, "global_step": 415403, "epoch": 5004} {"train_loss": -26.62630271911621, "global_step": 415404, "epoch": 5004} {"train_loss": -26.677703857421875, "global_step": 415405, "epoch": 5004} {"train_loss": -26.573694229125977, "global_step": 415406, "epoch": 5004} {"train_loss": -26.7191219329834, "global_step": 415407, "epoch": 5004} {"train_loss": -26.09515953063965, "global_step": 415408, "epoch": 5004} {"train_loss": -25.506610870361328, "global_step": 415409, "epoch": 5004} {"train_loss": -24.467357635498047, "global_step": 415410, "epoch": 5004} {"train_loss": -25.850797653198242, "global_step": 415411, "epoch": 5004} {"train_loss": -26.346271514892578, "global_step": 415412, "epoch": 5004} {"train_loss": -25.691913604736328, "global_step": 415413, "epoch": 5004} {"train_loss": -26.58028106229851, "global_step": 415414, "epoch": 5004, "val_loss": 6434968.0} {"train_loss": -25.777088165283203, "global_step": 415415, "epoch": 5005} {"train_loss": -25.917699813842773, "global_step": 415416, "epoch": 5005} {"train_loss": -25.85504722595215, "global_step": 415417, "epoch": 5005} {"train_loss": -25.477046966552734, "global_step": 415418, "epoch": 5005} {"train_loss": -26.18402671813965, "global_step": 415419, "epoch": 5005} {"train_loss": -25.951080322265625, "global_step": 415420, "epoch": 5005} {"train_loss": -25.6080379486084, "global_step": 415421, "epoch": 5005} {"train_loss": -26.2989559173584, "global_step": 415422, "epoch": 5005} {"train_loss": -25.965045928955078, "global_step": 415423, "epoch": 5005} {"train_loss": -25.635412216186523, "global_step": 415424, "epoch": 5005} {"train_loss": -26.25495719909668, "global_step": 415425, "epoch": 5005} {"train_loss": -26.045028686523438, "global_step": 415426, "epoch": 5005} {"train_loss": -26.15894889831543, "global_step": 415427, "epoch": 5005} {"train_loss": -26.136051177978516, "global_step": 415428, "epoch": 5005} {"train_loss": -26.299915313720703, "global_step": 415429, "epoch": 5005} {"train_loss": -26.32245445251465, "global_step": 415430, "epoch": 5005} {"train_loss": -26.576282501220703, "global_step": 415431, "epoch": 5005} {"train_loss": -26.817489624023438, "global_step": 415432, "epoch": 5005} {"train_loss": -26.591733932495117, "global_step": 415433, "epoch": 5005} {"train_loss": -26.735401153564453, "global_step": 415434, "epoch": 5005} {"train_loss": -26.732452392578125, "global_step": 415435, "epoch": 5005} {"train_loss": -26.337453842163086, "global_step": 415436, "epoch": 5005} {"train_loss": -26.75471305847168, "global_step": 415437, "epoch": 5005} {"train_loss": -26.44318962097168, "global_step": 415438, "epoch": 5005} {"train_loss": -26.8189697265625, "global_step": 415439, "epoch": 5005} {"train_loss": -26.445688247680664, "global_step": 415440, "epoch": 5005} {"train_loss": -26.8649845123291, "global_step": 415441, "epoch": 5005} {"train_loss": -26.841903686523438, "global_step": 415442, "epoch": 5005} {"train_loss": -26.9581356048584, "global_step": 415443, "epoch": 5005} {"train_loss": -26.673086166381836, "global_step": 415444, "epoch": 5005} {"train_loss": -27.189666748046875, "global_step": 415445, "epoch": 5005} {"train_loss": -26.96270751953125, "global_step": 415446, "epoch": 5005} {"train_loss": -26.841543197631836, "global_step": 415447, "epoch": 5005} {"train_loss": -26.8863582611084, "global_step": 415448, "epoch": 5005} {"train_loss": -26.91084098815918, "global_step": 415449, "epoch": 5005} {"train_loss": -26.42237663269043, "global_step": 415450, "epoch": 5005} {"train_loss": -27.08176040649414, "global_step": 415451, "epoch": 5005} {"train_loss": -27.28690528869629, "global_step": 415452, "epoch": 5005} {"train_loss": -26.539167404174805, "global_step": 415453, "epoch": 5005} {"train_loss": -26.906177520751953, "global_step": 415454, "epoch": 5005} {"train_loss": -26.926610946655273, "global_step": 415455, "epoch": 5005} {"train_loss": -27.171049118041992, "global_step": 415456, "epoch": 5005} {"train_loss": -27.105878829956055, "global_step": 415457, "epoch": 5005} {"train_loss": -26.4957332611084, "global_step": 415458, "epoch": 5005} {"train_loss": -26.599042892456055, "global_step": 415459, "epoch": 5005} {"train_loss": -26.95234489440918, "global_step": 415460, "epoch": 5005} {"train_loss": -26.850305557250977, "global_step": 415461, "epoch": 5005} {"train_loss": -26.839757919311523, "global_step": 415462, "epoch": 5005} {"train_loss": -27.056442260742188, "global_step": 415463, "epoch": 5005} {"train_loss": -26.694799423217773, "global_step": 415464, "epoch": 5005} {"train_loss": -26.34952163696289, "global_step": 415465, "epoch": 5005} {"train_loss": -27.36371421813965, "global_step": 415466, "epoch": 5005} {"train_loss": -26.667682647705078, "global_step": 415467, "epoch": 5005} {"train_loss": -26.849695205688477, "global_step": 415468, "epoch": 5005} {"train_loss": -26.107282638549805, "global_step": 415469, "epoch": 5005} {"train_loss": -26.484399795532227, "global_step": 415470, "epoch": 5005} {"train_loss": -25.999393463134766, "global_step": 415471, "epoch": 5005} {"train_loss": -26.437793731689453, "global_step": 415472, "epoch": 5005} {"train_loss": -26.80805015563965, "global_step": 415473, "epoch": 5005} {"train_loss": -26.8687801361084, "global_step": 415474, "epoch": 5005} {"train_loss": -26.42120361328125, "global_step": 415475, "epoch": 5005} {"train_loss": -27.097707748413086, "global_step": 415476, "epoch": 5005} {"train_loss": -26.620847702026367, "global_step": 415477, "epoch": 5005} {"train_loss": -26.98975944519043, "global_step": 415478, "epoch": 5005} {"train_loss": -26.452993392944336, "global_step": 415479, "epoch": 5005} {"train_loss": -26.8909854888916, "global_step": 415480, "epoch": 5005} {"train_loss": -26.7177677154541, "global_step": 415481, "epoch": 5005} {"train_loss": -26.860889434814453, "global_step": 415482, "epoch": 5005} {"train_loss": -26.891433715820312, "global_step": 415483, "epoch": 5005} {"train_loss": -26.89340591430664, "global_step": 415484, "epoch": 5005} {"train_loss": -26.53696632385254, "global_step": 415485, "epoch": 5005} {"train_loss": -26.684682846069336, "global_step": 415486, "epoch": 5005} {"train_loss": -26.91412925720215, "global_step": 415487, "epoch": 5005} {"train_loss": -26.74726676940918, "global_step": 415488, "epoch": 5005} {"train_loss": -26.773733139038086, "global_step": 415489, "epoch": 5005} {"train_loss": -26.92142105102539, "global_step": 415490, "epoch": 5005} {"train_loss": -26.89607048034668, "global_step": 415491, "epoch": 5005} {"train_loss": -27.03009033203125, "global_step": 415492, "epoch": 5005} {"train_loss": -27.212799072265625, "global_step": 415493, "epoch": 5005} {"train_loss": -26.619367599487305, "global_step": 415494, "epoch": 5005} {"train_loss": -26.81818962097168, "global_step": 415495, "epoch": 5005} {"train_loss": -27.0896053314209, "global_step": 415496, "epoch": 5005} {"train_loss": -26.628260072455348, "global_step": 415497, "epoch": 5005, "val_loss": 6536498.0} {"train_loss": -26.37091636657715, "global_step": 415498, "epoch": 5006} {"train_loss": -26.37346839904785, "global_step": 415499, "epoch": 5006} {"train_loss": -26.610870361328125, "global_step": 415500, "epoch": 5006} {"train_loss": -26.359821319580078, "global_step": 415501, "epoch": 5006} {"train_loss": -26.489154815673828, "global_step": 415502, "epoch": 5006} {"train_loss": -26.71600914001465, "global_step": 415503, "epoch": 5006} {"train_loss": -26.505023956298828, "global_step": 415504, "epoch": 5006} {"train_loss": -26.605239868164062, "global_step": 415505, "epoch": 5006} {"train_loss": -26.779626846313477, "global_step": 415506, "epoch": 5006} {"train_loss": -26.52009391784668, "global_step": 415507, "epoch": 5006} {"train_loss": -26.284988403320312, "global_step": 415508, "epoch": 5006} {"train_loss": -25.926685333251953, "global_step": 415509, "epoch": 5006} {"train_loss": -26.318485260009766, "global_step": 415510, "epoch": 5006} {"train_loss": -27.07240867614746, "global_step": 415511, "epoch": 5006} {"train_loss": -26.280378341674805, "global_step": 415512, "epoch": 5006} {"train_loss": -25.608200073242188, "global_step": 415513, "epoch": 5006} {"train_loss": -26.066556930541992, "global_step": 415514, "epoch": 5006} {"train_loss": -26.326486587524414, "global_step": 415515, "epoch": 5006} {"train_loss": -26.208433151245117, "global_step": 415516, "epoch": 5006} {"train_loss": -25.98529624938965, "global_step": 415517, "epoch": 5006} {"train_loss": -26.765172958374023, "global_step": 415518, "epoch": 5006} {"train_loss": -26.253183364868164, "global_step": 415519, "epoch": 5006} {"train_loss": -26.6842041015625, "global_step": 415520, "epoch": 5006} {"train_loss": -26.180316925048828, "global_step": 415521, "epoch": 5006} {"train_loss": -26.783050537109375, "global_step": 415522, "epoch": 5006} {"train_loss": -26.153348922729492, "global_step": 415523, "epoch": 5006} {"train_loss": -26.628467559814453, "global_step": 415524, "epoch": 5006} {"train_loss": -26.558063507080078, "global_step": 415525, "epoch": 5006} {"train_loss": -26.6094970703125, "global_step": 415526, "epoch": 5006} {"train_loss": -26.4554500579834, "global_step": 415527, "epoch": 5006} {"train_loss": -26.5260066986084, "global_step": 415528, "epoch": 5006} {"train_loss": -26.612964630126953, "global_step": 415529, "epoch": 5006} {"train_loss": -26.66916275024414, "global_step": 415530, "epoch": 5006} {"train_loss": -26.65234375, "global_step": 415531, "epoch": 5006} {"train_loss": -26.28861427307129, "global_step": 415532, "epoch": 5006} {"train_loss": -26.53607177734375, "global_step": 415533, "epoch": 5006} {"train_loss": -26.61164665222168, "global_step": 415534, "epoch": 5006} {"train_loss": -26.460773468017578, "global_step": 415535, "epoch": 5006} {"train_loss": -26.42718505859375, "global_step": 415536, "epoch": 5006} {"train_loss": -26.668180465698242, "global_step": 415537, "epoch": 5006} {"train_loss": -26.866540908813477, "global_step": 415538, "epoch": 5006} {"train_loss": -26.62616539001465, "global_step": 415539, "epoch": 5006} {"train_loss": -26.64765739440918, "global_step": 415540, "epoch": 5006} {"train_loss": -26.895999908447266, "global_step": 415541, "epoch": 5006} {"train_loss": -27.112951278686523, "global_step": 415542, "epoch": 5006} {"train_loss": -26.76546287536621, "global_step": 415543, "epoch": 5006} {"train_loss": -27.218414306640625, "global_step": 415544, "epoch": 5006} {"train_loss": -26.95542335510254, "global_step": 415545, "epoch": 5006} {"train_loss": -26.960479736328125, "global_step": 415546, "epoch": 5006} {"train_loss": -27.251474380493164, "global_step": 415547, "epoch": 5006} {"train_loss": -26.990253448486328, "global_step": 415548, "epoch": 5006} {"train_loss": -26.89143180847168, "global_step": 415549, "epoch": 5006} {"train_loss": -27.06094741821289, "global_step": 415550, "epoch": 5006} {"train_loss": -26.798070907592773, "global_step": 415551, "epoch": 5006} {"train_loss": -26.753341674804688, "global_step": 415552, "epoch": 5006} {"train_loss": -26.8740291595459, "global_step": 415553, "epoch": 5006} {"train_loss": -26.801502227783203, "global_step": 415554, "epoch": 5006} {"train_loss": -26.888051986694336, "global_step": 415555, "epoch": 5006} {"train_loss": -27.11882972717285, "global_step": 415556, "epoch": 5006} {"train_loss": -27.21746253967285, "global_step": 415557, "epoch": 5006} {"train_loss": -26.93353271484375, "global_step": 415558, "epoch": 5006} {"train_loss": -26.92333984375, "global_step": 415559, "epoch": 5006} {"train_loss": -26.944135665893555, "global_step": 415560, "epoch": 5006} {"train_loss": -26.749792098999023, "global_step": 415561, "epoch": 5006} {"train_loss": -26.941938400268555, "global_step": 415562, "epoch": 5006} {"train_loss": -26.646259307861328, "global_step": 415563, "epoch": 5006} {"train_loss": -26.49787712097168, "global_step": 415564, "epoch": 5006} {"train_loss": -26.687524795532227, "global_step": 415565, "epoch": 5006} {"train_loss": -26.73203468322754, "global_step": 415566, "epoch": 5006} {"train_loss": -26.620264053344727, "global_step": 415567, "epoch": 5006} {"train_loss": -26.502344131469727, "global_step": 415568, "epoch": 5006} {"train_loss": -26.801136016845703, "global_step": 415569, "epoch": 5006} {"train_loss": -26.82388687133789, "global_step": 415570, "epoch": 5006} {"train_loss": -26.59503173828125, "global_step": 415571, "epoch": 5006} {"train_loss": -26.533340454101562, "global_step": 415572, "epoch": 5006} {"train_loss": -26.88779067993164, "global_step": 415573, "epoch": 5006} {"train_loss": -26.796552658081055, "global_step": 415574, "epoch": 5006} {"train_loss": -26.98746109008789, "global_step": 415575, "epoch": 5006} {"train_loss": -26.97260856628418, "global_step": 415576, "epoch": 5006} {"train_loss": -26.644330978393555, "global_step": 415577, "epoch": 5006} {"train_loss": -26.604665756225586, "global_step": 415578, "epoch": 5006} {"train_loss": -26.814167022705078, "global_step": 415579, "epoch": 5006} {"train_loss": -26.656170948442206, "global_step": 415580, "epoch": 5006, "val_loss": 6467186.0} {"train_loss": -26.740137100219727, "global_step": 415581, "epoch": 5007} {"train_loss": -26.4476375579834, "global_step": 415582, "epoch": 5007} {"train_loss": -26.2875919342041, "global_step": 415583, "epoch": 5007} {"train_loss": -26.581939697265625, "global_step": 415584, "epoch": 5007} {"train_loss": -26.192007064819336, "global_step": 415585, "epoch": 5007} {"train_loss": -26.379484176635742, "global_step": 415586, "epoch": 5007} {"train_loss": -26.941822052001953, "global_step": 415587, "epoch": 5007} {"train_loss": -26.57513999938965, "global_step": 415588, "epoch": 5007} {"train_loss": -26.196378707885742, "global_step": 415589, "epoch": 5007} {"train_loss": -26.423904418945312, "global_step": 415590, "epoch": 5007} {"train_loss": -26.701501846313477, "global_step": 415591, "epoch": 5007} {"train_loss": -26.498456954956055, "global_step": 415592, "epoch": 5007} {"train_loss": -27.041614532470703, "global_step": 415593, "epoch": 5007} {"train_loss": -26.4591007232666, "global_step": 415594, "epoch": 5007} {"train_loss": -26.48418617248535, "global_step": 415595, "epoch": 5007} {"train_loss": -26.46027183532715, "global_step": 415596, "epoch": 5007} {"train_loss": -27.309131622314453, "global_step": 415597, "epoch": 5007} {"train_loss": -26.571908950805664, "global_step": 415598, "epoch": 5007} {"train_loss": -27.114912033081055, "global_step": 415599, "epoch": 5007} {"train_loss": -26.833820343017578, "global_step": 415600, "epoch": 5007} {"train_loss": -26.965085983276367, "global_step": 415601, "epoch": 5007} {"train_loss": -26.74383544921875, "global_step": 415602, "epoch": 5007} {"train_loss": -26.897573471069336, "global_step": 415603, "epoch": 5007} {"train_loss": -26.822265625, "global_step": 415604, "epoch": 5007} {"train_loss": -26.874399185180664, "global_step": 415605, "epoch": 5007} {"train_loss": -26.68372917175293, "global_step": 415606, "epoch": 5007} {"train_loss": -26.91310691833496, "global_step": 415607, "epoch": 5007} {"train_loss": -27.20130729675293, "global_step": 415608, "epoch": 5007} {"train_loss": -26.75482749938965, "global_step": 415609, "epoch": 5007} {"train_loss": -26.96182632446289, "global_step": 415610, "epoch": 5007} {"train_loss": -26.768110275268555, "global_step": 415611, "epoch": 5007} {"train_loss": -26.916467666625977, "global_step": 415612, "epoch": 5007} {"train_loss": -26.719091415405273, "global_step": 415613, "epoch": 5007} {"train_loss": -26.631357192993164, "global_step": 415614, "epoch": 5007} {"train_loss": -26.60157585144043, "global_step": 415615, "epoch": 5007} {"train_loss": -26.97458267211914, "global_step": 415616, "epoch": 5007} {"train_loss": -27.156721115112305, "global_step": 415617, "epoch": 5007} {"train_loss": -27.176794052124023, "global_step": 415618, "epoch": 5007} {"train_loss": -26.94646644592285, "global_step": 415619, "epoch": 5007} {"train_loss": -26.692291259765625, "global_step": 415620, "epoch": 5007} {"train_loss": -26.868335723876953, "global_step": 415621, "epoch": 5007} {"train_loss": -27.057209014892578, "global_step": 415622, "epoch": 5007} {"train_loss": -26.87525749206543, "global_step": 415623, "epoch": 5007} {"train_loss": -27.329166412353516, "global_step": 415624, "epoch": 5007} {"train_loss": -26.81561279296875, "global_step": 415625, "epoch": 5007} {"train_loss": -26.869104385375977, "global_step": 415626, "epoch": 5007} {"train_loss": -26.700048446655273, "global_step": 415627, "epoch": 5007} {"train_loss": -26.639738082885742, "global_step": 415628, "epoch": 5007} {"train_loss": -26.86993980407715, "global_step": 415629, "epoch": 5007} {"train_loss": -26.77484703063965, "global_step": 415630, "epoch": 5007} {"train_loss": -26.81451416015625, "global_step": 415631, "epoch": 5007} {"train_loss": -26.523300170898438, "global_step": 415632, "epoch": 5007} {"train_loss": -26.993316650390625, "global_step": 415633, "epoch": 5007} {"train_loss": -26.957548141479492, "global_step": 415634, "epoch": 5007} {"train_loss": -26.716373443603516, "global_step": 415635, "epoch": 5007} {"train_loss": -26.79170799255371, "global_step": 415636, "epoch": 5007} {"train_loss": -26.58650779724121, "global_step": 415637, "epoch": 5007} {"train_loss": -26.710107803344727, "global_step": 415638, "epoch": 5007} {"train_loss": -26.896835327148438, "global_step": 415639, "epoch": 5007} {"train_loss": -26.966535568237305, "global_step": 415640, "epoch": 5007} {"train_loss": -26.77764892578125, "global_step": 415641, "epoch": 5007} {"train_loss": -27.223560333251953, "global_step": 415642, "epoch": 5007} {"train_loss": -26.864892959594727, "global_step": 415643, "epoch": 5007} {"train_loss": -26.8294677734375, "global_step": 415644, "epoch": 5007} {"train_loss": -26.96443748474121, "global_step": 415645, "epoch": 5007} {"train_loss": -26.993558883666992, "global_step": 415646, "epoch": 5007} {"train_loss": -26.539478302001953, "global_step": 415647, "epoch": 5007} {"train_loss": -26.68521499633789, "global_step": 415648, "epoch": 5007} {"train_loss": -26.74551773071289, "global_step": 415649, "epoch": 5007} {"train_loss": -26.678197860717773, "global_step": 415650, "epoch": 5007} {"train_loss": -26.65510368347168, "global_step": 415651, "epoch": 5007} {"train_loss": -26.95302391052246, "global_step": 415652, "epoch": 5007} {"train_loss": -26.72416114807129, "global_step": 415653, "epoch": 5007} {"train_loss": -26.354108810424805, "global_step": 415654, "epoch": 5007} {"train_loss": -26.52107048034668, "global_step": 415655, "epoch": 5007} {"train_loss": -26.836713790893555, "global_step": 415656, "epoch": 5007} {"train_loss": -26.60235023498535, "global_step": 415657, "epoch": 5007} {"train_loss": -26.406667709350586, "global_step": 415658, "epoch": 5007} {"train_loss": -26.657135009765625, "global_step": 415659, "epoch": 5007} {"train_loss": -26.550922393798828, "global_step": 415660, "epoch": 5007} {"train_loss": -26.62689781188965, "global_step": 415661, "epoch": 5007} {"train_loss": -27.044626235961914, "global_step": 415662, "epoch": 5007} {"train_loss": -26.76672425327531, "global_step": 415663, "epoch": 5007, "val_loss": 6426317.0} {"train_loss": -26.253681182861328, "global_step": 415664, "epoch": 5008} {"train_loss": -25.114225387573242, "global_step": 415665, "epoch": 5008} {"train_loss": -26.3936767578125, "global_step": 415666, "epoch": 5008} {"train_loss": -25.70059585571289, "global_step": 415667, "epoch": 5008} {"train_loss": -26.591461181640625, "global_step": 415668, "epoch": 5008} {"train_loss": -25.926855087280273, "global_step": 415669, "epoch": 5008} {"train_loss": -26.024250030517578, "global_step": 415670, "epoch": 5008} {"train_loss": -25.61203956604004, "global_step": 415671, "epoch": 5008} {"train_loss": -26.294586181640625, "global_step": 415672, "epoch": 5008} {"train_loss": -26.099897384643555, "global_step": 415673, "epoch": 5008} {"train_loss": -26.155370712280273, "global_step": 415674, "epoch": 5008} {"train_loss": -26.480976104736328, "global_step": 415675, "epoch": 5008} {"train_loss": -25.984777450561523, "global_step": 415676, "epoch": 5008} {"train_loss": -26.38006591796875, "global_step": 415677, "epoch": 5008} {"train_loss": -26.452306747436523, "global_step": 415678, "epoch": 5008} {"train_loss": -26.65081214904785, "global_step": 415679, "epoch": 5008} {"train_loss": -26.64533042907715, "global_step": 415680, "epoch": 5008} {"train_loss": -26.493610382080078, "global_step": 415681, "epoch": 5008} {"train_loss": -26.752887725830078, "global_step": 415682, "epoch": 5008} {"train_loss": -26.317407608032227, "global_step": 415683, "epoch": 5008} {"train_loss": -26.73929214477539, "global_step": 415684, "epoch": 5008} {"train_loss": -26.4714298248291, "global_step": 415685, "epoch": 5008} {"train_loss": -26.6241455078125, "global_step": 415686, "epoch": 5008} {"train_loss": -26.72509765625, "global_step": 415687, "epoch": 5008} {"train_loss": -26.266210556030273, "global_step": 415688, "epoch": 5008} {"train_loss": -26.716726303100586, "global_step": 415689, "epoch": 5008} {"train_loss": -25.927047729492188, "global_step": 415690, "epoch": 5008} {"train_loss": -26.84364891052246, "global_step": 415691, "epoch": 5008} {"train_loss": -26.605670928955078, "global_step": 415692, "epoch": 5008} {"train_loss": -26.359933853149414, "global_step": 415693, "epoch": 5008} {"train_loss": -26.532377243041992, "global_step": 415694, "epoch": 5008} {"train_loss": -26.421728134155273, "global_step": 415695, "epoch": 5008} {"train_loss": -26.79802894592285, "global_step": 415696, "epoch": 5008} {"train_loss": -27.12127685546875, "global_step": 415697, "epoch": 5008} {"train_loss": -26.652353286743164, "global_step": 415698, "epoch": 5008} {"train_loss": -26.842432022094727, "global_step": 415699, "epoch": 5008} {"train_loss": -26.65227699279785, "global_step": 415700, "epoch": 5008} {"train_loss": -26.828458786010742, "global_step": 415701, "epoch": 5008} {"train_loss": -26.780004501342773, "global_step": 415702, "epoch": 5008} {"train_loss": -26.905832290649414, "global_step": 415703, "epoch": 5008} {"train_loss": -26.8142147064209, "global_step": 415704, "epoch": 5008} {"train_loss": -26.74586296081543, "global_step": 415705, "epoch": 5008} {"train_loss": -27.255285263061523, "global_step": 415706, "epoch": 5008} {"train_loss": -26.587438583374023, "global_step": 415707, "epoch": 5008} {"train_loss": -26.839508056640625, "global_step": 415708, "epoch": 5008} {"train_loss": -26.933191299438477, "global_step": 415709, "epoch": 5008} {"train_loss": -27.152973175048828, "global_step": 415710, "epoch": 5008} {"train_loss": -26.927854537963867, "global_step": 415711, "epoch": 5008} {"train_loss": -27.034839630126953, "global_step": 415712, "epoch": 5008} {"train_loss": -26.992475509643555, "global_step": 415713, "epoch": 5008} {"train_loss": -26.8781795501709, "global_step": 415714, "epoch": 5008} {"train_loss": -27.311553955078125, "global_step": 415715, "epoch": 5008} {"train_loss": -26.865591049194336, "global_step": 415716, "epoch": 5008} {"train_loss": -27.33363151550293, "global_step": 415717, "epoch": 5008} {"train_loss": -26.567846298217773, "global_step": 415718, "epoch": 5008} {"train_loss": -27.02031898498535, "global_step": 415719, "epoch": 5008} {"train_loss": -27.212865829467773, "global_step": 415720, "epoch": 5008} {"train_loss": -27.294830322265625, "global_step": 415721, "epoch": 5008} {"train_loss": -27.070337295532227, "global_step": 415722, "epoch": 5008} {"train_loss": -27.631637573242188, "global_step": 415723, "epoch": 5008} {"train_loss": -26.895498275756836, "global_step": 415724, "epoch": 5008} {"train_loss": -26.949750900268555, "global_step": 415725, "epoch": 5008} {"train_loss": -26.972610473632812, "global_step": 415726, "epoch": 5008} {"train_loss": -26.38047218322754, "global_step": 415727, "epoch": 5008} {"train_loss": -27.082996368408203, "global_step": 415728, "epoch": 5008} {"train_loss": -26.616037368774414, "global_step": 415729, "epoch": 5008} {"train_loss": -26.932397842407227, "global_step": 415730, "epoch": 5008} {"train_loss": -26.819005966186523, "global_step": 415731, "epoch": 5008} {"train_loss": -26.73079490661621, "global_step": 415732, "epoch": 5008} {"train_loss": -26.742507934570312, "global_step": 415733, "epoch": 5008} {"train_loss": -26.701025009155273, "global_step": 415734, "epoch": 5008} {"train_loss": -26.64667320251465, "global_step": 415735, "epoch": 5008} {"train_loss": -26.941547393798828, "global_step": 415736, "epoch": 5008} {"train_loss": -26.760150909423828, "global_step": 415737, "epoch": 5008} {"train_loss": -26.9022159576416, "global_step": 415738, "epoch": 5008} {"train_loss": -26.463031768798828, "global_step": 415739, "epoch": 5008} {"train_loss": -26.60725975036621, "global_step": 415740, "epoch": 5008} {"train_loss": -26.27076530456543, "global_step": 415741, "epoch": 5008} {"train_loss": -26.405237197875977, "global_step": 415742, "epoch": 5008} {"train_loss": -26.57196044921875, "global_step": 415743, "epoch": 5008} {"train_loss": -25.954147338867188, "global_step": 415744, "epoch": 5008} {"train_loss": -26.0580997467041, "global_step": 415745, "epoch": 5008} {"train_loss": -26.639223971998835, "global_step": 415746, "epoch": 5008, "val_loss": 6527670.5} {"train_loss": -23.91254997253418, "global_step": 415747, "epoch": 5009} {"train_loss": -21.38184928894043, "global_step": 415748, "epoch": 5009} {"train_loss": -25.503963470458984, "global_step": 415749, "epoch": 5009} {"train_loss": -23.718481063842773, "global_step": 415750, "epoch": 5009} {"train_loss": -24.537580490112305, "global_step": 415751, "epoch": 5009} {"train_loss": -25.016225814819336, "global_step": 415752, "epoch": 5009} {"train_loss": -25.209562301635742, "global_step": 415753, "epoch": 5009} {"train_loss": -24.690357208251953, "global_step": 415754, "epoch": 5009} {"train_loss": -24.88997459411621, "global_step": 415755, "epoch": 5009} {"train_loss": -25.29538345336914, "global_step": 415756, "epoch": 5009} {"train_loss": -25.49664878845215, "global_step": 415757, "epoch": 5009} {"train_loss": -25.62653160095215, "global_step": 415758, "epoch": 5009} {"train_loss": -25.897083282470703, "global_step": 415759, "epoch": 5009} {"train_loss": -25.99538230895996, "global_step": 415760, "epoch": 5009} {"train_loss": -25.38348388671875, "global_step": 415761, "epoch": 5009} {"train_loss": -25.829015731811523, "global_step": 415762, "epoch": 5009} {"train_loss": -25.794158935546875, "global_step": 415763, "epoch": 5009} {"train_loss": -26.219648361206055, "global_step": 415764, "epoch": 5009} {"train_loss": -25.906530380249023, "global_step": 415765, "epoch": 5009} {"train_loss": -25.511716842651367, "global_step": 415766, "epoch": 5009} {"train_loss": -25.90325927734375, "global_step": 415767, "epoch": 5009} {"train_loss": -25.545862197875977, "global_step": 415768, "epoch": 5009} {"train_loss": -26.222736358642578, "global_step": 415769, "epoch": 5009} {"train_loss": -26.308624267578125, "global_step": 415770, "epoch": 5009} {"train_loss": -25.931848526000977, "global_step": 415771, "epoch": 5009} {"train_loss": -25.955673217773438, "global_step": 415772, "epoch": 5009} {"train_loss": -26.27313804626465, "global_step": 415773, "epoch": 5009} {"train_loss": -26.472909927368164, "global_step": 415774, "epoch": 5009} {"train_loss": -26.571243286132812, "global_step": 415775, "epoch": 5009} {"train_loss": -26.456445693969727, "global_step": 415776, "epoch": 5009} {"train_loss": -26.296588897705078, "global_step": 415777, "epoch": 5009} {"train_loss": -26.149473190307617, "global_step": 415778, "epoch": 5009} {"train_loss": -26.37483787536621, "global_step": 415779, "epoch": 5009} {"train_loss": -26.2012996673584, "global_step": 415780, "epoch": 5009} {"train_loss": -26.31349754333496, "global_step": 415781, "epoch": 5009} {"train_loss": -26.23969078063965, "global_step": 415782, "epoch": 5009} {"train_loss": -26.813928604125977, "global_step": 415783, "epoch": 5009} {"train_loss": -26.484619140625, "global_step": 415784, "epoch": 5009} {"train_loss": -26.59144401550293, "global_step": 415785, "epoch": 5009} {"train_loss": -26.5609073638916, "global_step": 415786, "epoch": 5009} {"train_loss": -26.56647300720215, "global_step": 415787, "epoch": 5009} {"train_loss": -26.66259765625, "global_step": 415788, "epoch": 5009} {"train_loss": -26.758529663085938, "global_step": 415789, "epoch": 5009} {"train_loss": -26.776105880737305, "global_step": 415790, "epoch": 5009} {"train_loss": -26.75617790222168, "global_step": 415791, "epoch": 5009} {"train_loss": -26.92522621154785, "global_step": 415792, "epoch": 5009} {"train_loss": -26.71969985961914, "global_step": 415793, "epoch": 5009} {"train_loss": -26.884119033813477, "global_step": 415794, "epoch": 5009} {"train_loss": -26.654815673828125, "global_step": 415795, "epoch": 5009} {"train_loss": -26.7868709564209, "global_step": 415796, "epoch": 5009} {"train_loss": -26.861896514892578, "global_step": 415797, "epoch": 5009} {"train_loss": -26.68499755859375, "global_step": 415798, "epoch": 5009} {"train_loss": -27.19990348815918, "global_step": 415799, "epoch": 5009} {"train_loss": -26.790578842163086, "global_step": 415800, "epoch": 5009} {"train_loss": -26.907812118530273, "global_step": 415801, "epoch": 5009} {"train_loss": -26.7611083984375, "global_step": 415802, "epoch": 5009} {"train_loss": -27.20655632019043, "global_step": 415803, "epoch": 5009} {"train_loss": -26.8272762298584, "global_step": 415804, "epoch": 5009} {"train_loss": -26.859838485717773, "global_step": 415805, "epoch": 5009} {"train_loss": -26.959232330322266, "global_step": 415806, "epoch": 5009} {"train_loss": -26.896459579467773, "global_step": 415807, "epoch": 5009} {"train_loss": -26.818700790405273, "global_step": 415808, "epoch": 5009} {"train_loss": -26.614990234375, "global_step": 415809, "epoch": 5009} {"train_loss": -26.66852378845215, "global_step": 415810, "epoch": 5009} {"train_loss": -26.7879695892334, "global_step": 415811, "epoch": 5009} {"train_loss": -26.837087631225586, "global_step": 415812, "epoch": 5009} {"train_loss": -26.086536407470703, "global_step": 415813, "epoch": 5009} {"train_loss": -26.564300537109375, "global_step": 415814, "epoch": 5009} {"train_loss": -26.80792808532715, "global_step": 415815, "epoch": 5009} {"train_loss": -26.438983917236328, "global_step": 415816, "epoch": 5009} {"train_loss": -26.725055694580078, "global_step": 415817, "epoch": 5009} {"train_loss": -27.175825119018555, "global_step": 415818, "epoch": 5009} {"train_loss": -26.61435317993164, "global_step": 415819, "epoch": 5009} {"train_loss": -26.386505126953125, "global_step": 415820, "epoch": 5009} {"train_loss": -26.73591423034668, "global_step": 415821, "epoch": 5009} {"train_loss": -26.512603759765625, "global_step": 415822, "epoch": 5009} {"train_loss": -26.472869873046875, "global_step": 415823, "epoch": 5009} {"train_loss": -26.3094425201416, "global_step": 415824, "epoch": 5009} {"train_loss": -26.78515625, "global_step": 415825, "epoch": 5009} {"train_loss": -26.713193893432617, "global_step": 415826, "epoch": 5009} {"train_loss": -26.915197372436523, "global_step": 415827, "epoch": 5009} {"train_loss": -26.50025749206543, "global_step": 415828, "epoch": 5009} {"train_loss": -26.239838220986975, "global_step": 415829, "epoch": 5009, "val_loss": 6536565.0} {"train_loss": -26.543813705444336, "global_step": 415830, "epoch": 5010} {"train_loss": -25.009769439697266, "global_step": 415831, "epoch": 5010} {"train_loss": -25.56220054626465, "global_step": 415832, "epoch": 5010} {"train_loss": -26.468433380126953, "global_step": 415833, "epoch": 5010} {"train_loss": -26.164703369140625, "global_step": 415834, "epoch": 5010} {"train_loss": -26.207380294799805, "global_step": 415835, "epoch": 5010} {"train_loss": -25.975116729736328, "global_step": 415836, "epoch": 5010} {"train_loss": -26.1628360748291, "global_step": 415837, "epoch": 5010} {"train_loss": -25.979394912719727, "global_step": 415838, "epoch": 5010} {"train_loss": -25.8939151763916, "global_step": 415839, "epoch": 5010} {"train_loss": -26.303882598876953, "global_step": 415840, "epoch": 5010} {"train_loss": -25.924543380737305, "global_step": 415841, "epoch": 5010} {"train_loss": -25.756223678588867, "global_step": 415842, "epoch": 5010} {"train_loss": -25.8361759185791, "global_step": 415843, "epoch": 5010} {"train_loss": -26.535541534423828, "global_step": 415844, "epoch": 5010} {"train_loss": -26.446691513061523, "global_step": 415845, "epoch": 5010} {"train_loss": -26.87739372253418, "global_step": 415846, "epoch": 5010} {"train_loss": -26.480329513549805, "global_step": 415847, "epoch": 5010} {"train_loss": -26.01947593688965, "global_step": 415848, "epoch": 5010} {"train_loss": -26.427398681640625, "global_step": 415849, "epoch": 5010} {"train_loss": -26.405075073242188, "global_step": 415850, "epoch": 5010} {"train_loss": -26.755817413330078, "global_step": 415851, "epoch": 5010} {"train_loss": -26.732624053955078, "global_step": 415852, "epoch": 5010} {"train_loss": -26.60597038269043, "global_step": 415853, "epoch": 5010} {"train_loss": -26.434497833251953, "global_step": 415854, "epoch": 5010} {"train_loss": -26.328571319580078, "global_step": 415855, "epoch": 5010} {"train_loss": -26.82293128967285, "global_step": 415856, "epoch": 5010} {"train_loss": -26.47564125061035, "global_step": 415857, "epoch": 5010} {"train_loss": -26.846027374267578, "global_step": 415858, "epoch": 5010} {"train_loss": -26.877838134765625, "global_step": 415859, "epoch": 5010} {"train_loss": -26.98508071899414, "global_step": 415860, "epoch": 5010} {"train_loss": -27.051198959350586, "global_step": 415861, "epoch": 5010} {"train_loss": -26.8903751373291, "global_step": 415862, "epoch": 5010} {"train_loss": -26.717004776000977, "global_step": 415863, "epoch": 5010} {"train_loss": -26.937625885009766, "global_step": 415864, "epoch": 5010} {"train_loss": -26.945417404174805, "global_step": 415865, "epoch": 5010} {"train_loss": -26.587926864624023, "global_step": 415866, "epoch": 5010} {"train_loss": -26.742801666259766, "global_step": 415867, "epoch": 5010} {"train_loss": -26.71463966369629, "global_step": 415868, "epoch": 5010} {"train_loss": -27.059843063354492, "global_step": 415869, "epoch": 5010} {"train_loss": -27.077957153320312, "global_step": 415870, "epoch": 5010} {"train_loss": -26.90821647644043, "global_step": 415871, "epoch": 5010} {"train_loss": -26.651193618774414, "global_step": 415872, "epoch": 5010} {"train_loss": -26.9970760345459, "global_step": 415873, "epoch": 5010} {"train_loss": -27.1671199798584, "global_step": 415874, "epoch": 5010} {"train_loss": -27.39626121520996, "global_step": 415875, "epoch": 5010} {"train_loss": -27.007068634033203, "global_step": 415876, "epoch": 5010} {"train_loss": -26.59332275390625, "global_step": 415877, "epoch": 5010} {"train_loss": -26.362009048461914, "global_step": 415878, "epoch": 5010} {"train_loss": -26.8872013092041, "global_step": 415879, "epoch": 5010} {"train_loss": -27.032184600830078, "global_step": 415880, "epoch": 5010} {"train_loss": -27.054014205932617, "global_step": 415881, "epoch": 5010} {"train_loss": -27.11737060546875, "global_step": 415882, "epoch": 5010} {"train_loss": -26.90658950805664, "global_step": 415883, "epoch": 5010} {"train_loss": -26.521427154541016, "global_step": 415884, "epoch": 5010} {"train_loss": -26.473459243774414, "global_step": 415885, "epoch": 5010} {"train_loss": -26.35084342956543, "global_step": 415886, "epoch": 5010} {"train_loss": -26.809919357299805, "global_step": 415887, "epoch": 5010} {"train_loss": -26.84284019470215, "global_step": 415888, "epoch": 5010} {"train_loss": -26.652204513549805, "global_step": 415889, "epoch": 5010} {"train_loss": -26.90718650817871, "global_step": 415890, "epoch": 5010} {"train_loss": -26.436695098876953, "global_step": 415891, "epoch": 5010} {"train_loss": -26.567798614501953, "global_step": 415892, "epoch": 5010} {"train_loss": -26.3760929107666, "global_step": 415893, "epoch": 5010} {"train_loss": -26.648847579956055, "global_step": 415894, "epoch": 5010} {"train_loss": -27.136886596679688, "global_step": 415895, "epoch": 5010} {"train_loss": -26.66554069519043, "global_step": 415896, "epoch": 5010} {"train_loss": -26.608352661132812, "global_step": 415897, "epoch": 5010} {"train_loss": -26.597875595092773, "global_step": 415898, "epoch": 5010} {"train_loss": -26.95891761779785, "global_step": 415899, "epoch": 5010} {"train_loss": -26.879425048828125, "global_step": 415900, "epoch": 5010} {"train_loss": -26.791723251342773, "global_step": 415901, "epoch": 5010} {"train_loss": -26.76051902770996, "global_step": 415902, "epoch": 5010} {"train_loss": -26.29558753967285, "global_step": 415903, "epoch": 5010} {"train_loss": -26.71893310546875, "global_step": 415904, "epoch": 5010} {"train_loss": -26.690521240234375, "global_step": 415905, "epoch": 5010} {"train_loss": -27.001012802124023, "global_step": 415906, "epoch": 5010} {"train_loss": -26.526702880859375, "global_step": 415907, "epoch": 5010} {"train_loss": -26.51984977722168, "global_step": 415908, "epoch": 5010} {"train_loss": -26.81549072265625, "global_step": 415909, "epoch": 5010} {"train_loss": -27.092126846313477, "global_step": 415910, "epoch": 5010} {"train_loss": -26.841022491455078, "global_step": 415911, "epoch": 5010} {"train_loss": -26.617997502706135, "global_step": 415912, "epoch": 5010, "val_loss": 6505560.5} {"train_loss": -25.6898136138916, "global_step": 415913, "epoch": 5011} {"train_loss": -25.482791900634766, "global_step": 415914, "epoch": 5011} {"train_loss": -26.133386611938477, "global_step": 415915, "epoch": 5011} {"train_loss": -25.49336051940918, "global_step": 415916, "epoch": 5011} {"train_loss": -25.87444496154785, "global_step": 415917, "epoch": 5011} {"train_loss": -26.271865844726562, "global_step": 415918, "epoch": 5011} {"train_loss": -26.174646377563477, "global_step": 415919, "epoch": 5011} {"train_loss": -26.120656967163086, "global_step": 415920, "epoch": 5011} {"train_loss": -25.828580856323242, "global_step": 415921, "epoch": 5011} {"train_loss": -26.50201988220215, "global_step": 415922, "epoch": 5011} {"train_loss": -25.955402374267578, "global_step": 415923, "epoch": 5011} {"train_loss": -26.11020278930664, "global_step": 415924, "epoch": 5011} {"train_loss": -26.6445255279541, "global_step": 415925, "epoch": 5011} {"train_loss": -25.7451229095459, "global_step": 415926, "epoch": 5011} {"train_loss": -26.833587646484375, "global_step": 415927, "epoch": 5011} {"train_loss": -26.62647819519043, "global_step": 415928, "epoch": 5011} {"train_loss": -26.18109703063965, "global_step": 415929, "epoch": 5011} {"train_loss": -26.524389266967773, "global_step": 415930, "epoch": 5011} {"train_loss": -26.04230308532715, "global_step": 415931, "epoch": 5011} {"train_loss": -26.465742111206055, "global_step": 415932, "epoch": 5011} {"train_loss": -26.155853271484375, "global_step": 415933, "epoch": 5011} {"train_loss": -26.693506240844727, "global_step": 415934, "epoch": 5011} {"train_loss": -26.277921676635742, "global_step": 415935, "epoch": 5011} {"train_loss": -26.657363891601562, "global_step": 415936, "epoch": 5011} {"train_loss": -26.4487361907959, "global_step": 415937, "epoch": 5011} {"train_loss": -26.75856590270996, "global_step": 415938, "epoch": 5011} {"train_loss": -26.456958770751953, "global_step": 415939, "epoch": 5011} {"train_loss": -26.843061447143555, "global_step": 415940, "epoch": 5011} {"train_loss": -26.842559814453125, "global_step": 415941, "epoch": 5011} {"train_loss": -26.841222763061523, "global_step": 415942, "epoch": 5011} {"train_loss": -26.333974838256836, "global_step": 415943, "epoch": 5011} {"train_loss": -26.68328857421875, "global_step": 415944, "epoch": 5011} {"train_loss": -26.639007568359375, "global_step": 415945, "epoch": 5011} {"train_loss": -26.794713973999023, "global_step": 415946, "epoch": 5011} {"train_loss": -26.504377365112305, "global_step": 415947, "epoch": 5011} {"train_loss": -26.62060546875, "global_step": 415948, "epoch": 5011} {"train_loss": -26.869281768798828, "global_step": 415949, "epoch": 5011} {"train_loss": -26.481653213500977, "global_step": 415950, "epoch": 5011} {"train_loss": -26.664228439331055, "global_step": 415951, "epoch": 5011} {"train_loss": -27.043659210205078, "global_step": 415952, "epoch": 5011} {"train_loss": -27.073110580444336, "global_step": 415953, "epoch": 5011} {"train_loss": -26.7880916595459, "global_step": 415954, "epoch": 5011} {"train_loss": -26.752197265625, "global_step": 415955, "epoch": 5011} {"train_loss": -27.11444664001465, "global_step": 415956, "epoch": 5011} {"train_loss": -26.673913955688477, "global_step": 415957, "epoch": 5011} {"train_loss": -27.2730712890625, "global_step": 415958, "epoch": 5011} {"train_loss": -26.775266647338867, "global_step": 415959, "epoch": 5011} {"train_loss": -26.76645851135254, "global_step": 415960, "epoch": 5011} {"train_loss": -26.5902099609375, "global_step": 415961, "epoch": 5011} {"train_loss": -26.61165428161621, "global_step": 415962, "epoch": 5011} {"train_loss": -26.97319984436035, "global_step": 415963, "epoch": 5011} {"train_loss": -26.9652042388916, "global_step": 415964, "epoch": 5011} {"train_loss": -26.50467300415039, "global_step": 415965, "epoch": 5011} {"train_loss": -26.786575317382812, "global_step": 415966, "epoch": 5011} {"train_loss": -27.042020797729492, "global_step": 415967, "epoch": 5011} {"train_loss": -26.6625919342041, "global_step": 415968, "epoch": 5011} {"train_loss": -26.636280059814453, "global_step": 415969, "epoch": 5011} {"train_loss": -26.888891220092773, "global_step": 415970, "epoch": 5011} {"train_loss": -26.6595516204834, "global_step": 415971, "epoch": 5011} {"train_loss": -26.89682388305664, "global_step": 415972, "epoch": 5011} {"train_loss": -27.13640785217285, "global_step": 415973, "epoch": 5011} {"train_loss": -26.8493595123291, "global_step": 415974, "epoch": 5011} {"train_loss": -26.69841957092285, "global_step": 415975, "epoch": 5011} {"train_loss": -27.238813400268555, "global_step": 415976, "epoch": 5011} {"train_loss": -26.312835693359375, "global_step": 415977, "epoch": 5011} {"train_loss": -25.958158493041992, "global_step": 415978, "epoch": 5011} {"train_loss": -26.645963668823242, "global_step": 415979, "epoch": 5011} {"train_loss": -26.93037986755371, "global_step": 415980, "epoch": 5011} {"train_loss": -26.42134666442871, "global_step": 415981, "epoch": 5011} {"train_loss": -26.88691520690918, "global_step": 415982, "epoch": 5011} {"train_loss": -27.087568283081055, "global_step": 415983, "epoch": 5011} {"train_loss": -26.894201278686523, "global_step": 415984, "epoch": 5011} {"train_loss": -26.6680908203125, "global_step": 415985, "epoch": 5011} {"train_loss": -26.979581832885742, "global_step": 415986, "epoch": 5011} {"train_loss": -27.277158737182617, "global_step": 415987, "epoch": 5011} {"train_loss": -27.096826553344727, "global_step": 415988, "epoch": 5011} {"train_loss": -27.20488929748535, "global_step": 415989, "epoch": 5011} {"train_loss": -26.732091903686523, "global_step": 415990, "epoch": 5011} {"train_loss": -26.952728271484375, "global_step": 415991, "epoch": 5011} {"train_loss": -27.095355987548828, "global_step": 415992, "epoch": 5011} {"train_loss": -26.80326271057129, "global_step": 415993, "epoch": 5011} {"train_loss": -26.902616500854492, "global_step": 415994, "epoch": 5011} {"train_loss": -26.63074079766331, "global_step": 415995, "epoch": 5011, "val_loss": 6531375.5} {"train_loss": -26.480382919311523, "global_step": 415996, "epoch": 5012} {"train_loss": -25.628833770751953, "global_step": 415997, "epoch": 5012} {"train_loss": -25.722034454345703, "global_step": 415998, "epoch": 5012} {"train_loss": -26.298004150390625, "global_step": 415999, "epoch": 5012} {"train_loss": -26.466476440429688, "global_step": 416000, "epoch": 5012} {"train_loss": -25.544675827026367, "global_step": 416001, "epoch": 5012} {"train_loss": -26.08151626586914, "global_step": 416002, "epoch": 5012} {"train_loss": -26.257726669311523, "global_step": 416003, "epoch": 5012} {"train_loss": -25.692691802978516, "global_step": 416004, "epoch": 5012} {"train_loss": -26.540008544921875, "global_step": 416005, "epoch": 5012} {"train_loss": -26.392505645751953, "global_step": 416006, "epoch": 5012} {"train_loss": -26.28547477722168, "global_step": 416007, "epoch": 5012} {"train_loss": -26.398202896118164, "global_step": 416008, "epoch": 5012} {"train_loss": -26.270313262939453, "global_step": 416009, "epoch": 5012} {"train_loss": -26.4847412109375, "global_step": 416010, "epoch": 5012} {"train_loss": -26.188709259033203, "global_step": 416011, "epoch": 5012} {"train_loss": -26.471792221069336, "global_step": 416012, "epoch": 5012} {"train_loss": -25.996784210205078, "global_step": 416013, "epoch": 5012} {"train_loss": -26.427331924438477, "global_step": 416014, "epoch": 5012} {"train_loss": -26.45222282409668, "global_step": 416015, "epoch": 5012} {"train_loss": -26.4394474029541, "global_step": 416016, "epoch": 5012} {"train_loss": -26.708173751831055, "global_step": 416017, "epoch": 5012} {"train_loss": -26.620624542236328, "global_step": 416018, "epoch": 5012} {"train_loss": -26.63962173461914, "global_step": 416019, "epoch": 5012} {"train_loss": -26.391864776611328, "global_step": 416020, "epoch": 5012} {"train_loss": -26.64304542541504, "global_step": 416021, "epoch": 5012} {"train_loss": -26.610137939453125, "global_step": 416022, "epoch": 5012} {"train_loss": -26.4119873046875, "global_step": 416023, "epoch": 5012} {"train_loss": -26.469745635986328, "global_step": 416024, "epoch": 5012} {"train_loss": -26.543426513671875, "global_step": 416025, "epoch": 5012} {"train_loss": -26.648834228515625, "global_step": 416026, "epoch": 5012} {"train_loss": -26.90509605407715, "global_step": 416027, "epoch": 5012} {"train_loss": -26.83139991760254, "global_step": 416028, "epoch": 5012} {"train_loss": -26.560033798217773, "global_step": 416029, "epoch": 5012} {"train_loss": -26.4778995513916, "global_step": 416030, "epoch": 5012} {"train_loss": -26.686920166015625, "global_step": 416031, "epoch": 5012} {"train_loss": -26.781177520751953, "global_step": 416032, "epoch": 5012} {"train_loss": -26.94815444946289, "global_step": 416033, "epoch": 5012} {"train_loss": -26.76447105407715, "global_step": 416034, "epoch": 5012} {"train_loss": -26.785602569580078, "global_step": 416035, "epoch": 5012} {"train_loss": -26.799911499023438, "global_step": 416036, "epoch": 5012} {"train_loss": -26.7860107421875, "global_step": 416037, "epoch": 5012} {"train_loss": -26.790607452392578, "global_step": 416038, "epoch": 5012} {"train_loss": -26.786182403564453, "global_step": 416039, "epoch": 5012} {"train_loss": -26.944061279296875, "global_step": 416040, "epoch": 5012} {"train_loss": -26.894962310791016, "global_step": 416041, "epoch": 5012} {"train_loss": -27.30194664001465, "global_step": 416042, "epoch": 5012} {"train_loss": -26.90656852722168, "global_step": 416043, "epoch": 5012} {"train_loss": -26.907690048217773, "global_step": 416044, "epoch": 5012} {"train_loss": -26.5401668548584, "global_step": 416045, "epoch": 5012} {"train_loss": -27.038665771484375, "global_step": 416046, "epoch": 5012} {"train_loss": -26.6672306060791, "global_step": 416047, "epoch": 5012} {"train_loss": -27.131549835205078, "global_step": 416048, "epoch": 5012} {"train_loss": -26.85409927368164, "global_step": 416049, "epoch": 5012} {"train_loss": -26.930240631103516, "global_step": 416050, "epoch": 5012} {"train_loss": -26.44720458984375, "global_step": 416051, "epoch": 5012} {"train_loss": -27.028594970703125, "global_step": 416052, "epoch": 5012} {"train_loss": -27.109619140625, "global_step": 416053, "epoch": 5012} {"train_loss": -26.611318588256836, "global_step": 416054, "epoch": 5012} {"train_loss": -27.068769454956055, "global_step": 416055, "epoch": 5012} {"train_loss": -26.51853370666504, "global_step": 416056, "epoch": 5012} {"train_loss": -27.085071563720703, "global_step": 416057, "epoch": 5012} {"train_loss": -26.52033042907715, "global_step": 416058, "epoch": 5012} {"train_loss": -26.949106216430664, "global_step": 416059, "epoch": 5012} {"train_loss": -27.313892364501953, "global_step": 416060, "epoch": 5012} {"train_loss": -26.455591201782227, "global_step": 416061, "epoch": 5012} {"train_loss": -26.845190048217773, "global_step": 416062, "epoch": 5012} {"train_loss": -26.793359756469727, "global_step": 416063, "epoch": 5012} {"train_loss": -26.852949142456055, "global_step": 416064, "epoch": 5012} {"train_loss": -26.61234474182129, "global_step": 416065, "epoch": 5012} {"train_loss": -26.408411026000977, "global_step": 416066, "epoch": 5012} {"train_loss": -26.372900009155273, "global_step": 416067, "epoch": 5012} {"train_loss": -26.73784828186035, "global_step": 416068, "epoch": 5012} {"train_loss": -26.420974731445312, "global_step": 416069, "epoch": 5012} {"train_loss": -26.45660400390625, "global_step": 416070, "epoch": 5012} {"train_loss": -26.573705673217773, "global_step": 416071, "epoch": 5012} {"train_loss": -26.84773063659668, "global_step": 416072, "epoch": 5012} {"train_loss": -26.54286003112793, "global_step": 416073, "epoch": 5012} {"train_loss": -26.569671630859375, "global_step": 416074, "epoch": 5012} {"train_loss": -26.652624130249023, "global_step": 416075, "epoch": 5012} {"train_loss": -26.50452995300293, "global_step": 416076, "epoch": 5012} {"train_loss": -26.459903717041016, "global_step": 416077, "epoch": 5012} {"train_loss": -26.613913915243494, "global_step": 416078, "epoch": 5012, "val_loss": 6425245.5} {"train_loss": -25.760482788085938, "global_step": 416079, "epoch": 5013} {"train_loss": -26.374746322631836, "global_step": 416080, "epoch": 5013} {"train_loss": -26.260498046875, "global_step": 416081, "epoch": 5013} {"train_loss": -25.6195011138916, "global_step": 416082, "epoch": 5013} {"train_loss": -26.2969970703125, "global_step": 416083, "epoch": 5013} {"train_loss": -26.131916046142578, "global_step": 416084, "epoch": 5013} {"train_loss": -26.576557159423828, "global_step": 416085, "epoch": 5013} {"train_loss": -25.819517135620117, "global_step": 416086, "epoch": 5013} {"train_loss": -26.234210968017578, "global_step": 416087, "epoch": 5013} {"train_loss": -26.149503707885742, "global_step": 416088, "epoch": 5013} {"train_loss": -26.750181198120117, "global_step": 416089, "epoch": 5013} {"train_loss": -26.673200607299805, "global_step": 416090, "epoch": 5013} {"train_loss": -26.22828483581543, "global_step": 416091, "epoch": 5013} {"train_loss": -26.7601318359375, "global_step": 416092, "epoch": 5013} {"train_loss": -26.770544052124023, "global_step": 416093, "epoch": 5013} {"train_loss": -26.65327262878418, "global_step": 416094, "epoch": 5013} {"train_loss": -26.628742218017578, "global_step": 416095, "epoch": 5013} {"train_loss": -26.691755294799805, "global_step": 416096, "epoch": 5013} {"train_loss": -26.44291114807129, "global_step": 416097, "epoch": 5013} {"train_loss": -27.196165084838867, "global_step": 416098, "epoch": 5013} {"train_loss": -26.831140518188477, "global_step": 416099, "epoch": 5013} {"train_loss": -26.901336669921875, "global_step": 416100, "epoch": 5013} {"train_loss": -26.889142990112305, "global_step": 416101, "epoch": 5013} {"train_loss": -26.778364181518555, "global_step": 416102, "epoch": 5013} {"train_loss": -26.893829345703125, "global_step": 416103, "epoch": 5013} {"train_loss": -26.654226303100586, "global_step": 416104, "epoch": 5013} {"train_loss": -26.692962646484375, "global_step": 416105, "epoch": 5013} {"train_loss": -26.482213973999023, "global_step": 416106, "epoch": 5013} {"train_loss": -26.4050350189209, "global_step": 416107, "epoch": 5013} {"train_loss": -27.059232711791992, "global_step": 416108, "epoch": 5013} {"train_loss": -26.734710693359375, "global_step": 416109, "epoch": 5013} {"train_loss": -27.072187423706055, "global_step": 416110, "epoch": 5013} {"train_loss": -26.714282989501953, "global_step": 416111, "epoch": 5013} {"train_loss": -26.4666805267334, "global_step": 416112, "epoch": 5013} {"train_loss": -26.87397575378418, "global_step": 416113, "epoch": 5013} {"train_loss": -26.377685546875, "global_step": 416114, "epoch": 5013} {"train_loss": -26.80085563659668, "global_step": 416115, "epoch": 5013} {"train_loss": -26.856372833251953, "global_step": 416116, "epoch": 5013} {"train_loss": -27.217456817626953, "global_step": 416117, "epoch": 5013} {"train_loss": -26.6057186126709, "global_step": 416118, "epoch": 5013} {"train_loss": -26.94923973083496, "global_step": 416119, "epoch": 5013} {"train_loss": -26.682783126831055, "global_step": 416120, "epoch": 5013} {"train_loss": -26.750600814819336, "global_step": 416121, "epoch": 5013} {"train_loss": -27.003711700439453, "global_step": 416122, "epoch": 5013} {"train_loss": -26.9450740814209, "global_step": 416123, "epoch": 5013} {"train_loss": -26.74747085571289, "global_step": 416124, "epoch": 5013} {"train_loss": -26.69544792175293, "global_step": 416125, "epoch": 5013} {"train_loss": -26.588911056518555, "global_step": 416126, "epoch": 5013} {"train_loss": -27.117542266845703, "global_step": 416127, "epoch": 5013} {"train_loss": -26.625198364257812, "global_step": 416128, "epoch": 5013} {"train_loss": -26.835693359375, "global_step": 416129, "epoch": 5013} {"train_loss": -27.205854415893555, "global_step": 416130, "epoch": 5013} {"train_loss": -27.05929946899414, "global_step": 416131, "epoch": 5013} {"train_loss": -26.841089248657227, "global_step": 416132, "epoch": 5013} {"train_loss": -26.736310958862305, "global_step": 416133, "epoch": 5013} {"train_loss": -26.696735382080078, "global_step": 416134, "epoch": 5013} {"train_loss": -27.024280548095703, "global_step": 416135, "epoch": 5013} {"train_loss": -26.502561569213867, "global_step": 416136, "epoch": 5013} {"train_loss": -26.465484619140625, "global_step": 416137, "epoch": 5013} {"train_loss": -26.572235107421875, "global_step": 416138, "epoch": 5013} {"train_loss": -26.2750301361084, "global_step": 416139, "epoch": 5013} {"train_loss": -26.616235733032227, "global_step": 416140, "epoch": 5013} {"train_loss": -26.006561279296875, "global_step": 416141, "epoch": 5013} {"train_loss": -26.540857315063477, "global_step": 416142, "epoch": 5013} {"train_loss": -26.41342544555664, "global_step": 416143, "epoch": 5013} {"train_loss": -25.839466094970703, "global_step": 416144, "epoch": 5013} {"train_loss": -26.629087448120117, "global_step": 416145, "epoch": 5013} {"train_loss": -26.29618263244629, "global_step": 416146, "epoch": 5013} {"train_loss": -26.29231071472168, "global_step": 416147, "epoch": 5013} {"train_loss": -26.30958366394043, "global_step": 416148, "epoch": 5013} {"train_loss": -26.809436798095703, "global_step": 416149, "epoch": 5013} {"train_loss": -26.62936782836914, "global_step": 416150, "epoch": 5013} {"train_loss": -26.613189697265625, "global_step": 416151, "epoch": 5013} {"train_loss": -26.133901596069336, "global_step": 416152, "epoch": 5013} {"train_loss": -26.680932998657227, "global_step": 416153, "epoch": 5013} {"train_loss": -26.584421157836914, "global_step": 416154, "epoch": 5013} {"train_loss": -26.610321044921875, "global_step": 416155, "epoch": 5013} {"train_loss": -26.23310661315918, "global_step": 416156, "epoch": 5013} {"train_loss": -26.40266227722168, "global_step": 416157, "epoch": 5013} {"train_loss": -26.355255126953125, "global_step": 416158, "epoch": 5013} {"train_loss": -26.296131134033203, "global_step": 416159, "epoch": 5013} {"train_loss": -26.89263343811035, "global_step": 416160, "epoch": 5013} {"train_loss": -26.608197660331268, "global_step": 416161, "epoch": 5013, "val_loss": 6582726.0} {"train_loss": -26.012561798095703, "global_step": 416162, "epoch": 5014} {"train_loss": -26.135278701782227, "global_step": 416163, "epoch": 5014} {"train_loss": -25.697641372680664, "global_step": 416164, "epoch": 5014} {"train_loss": -25.71510887145996, "global_step": 416165, "epoch": 5014} {"train_loss": -25.90570068359375, "global_step": 416166, "epoch": 5014} {"train_loss": -26.214414596557617, "global_step": 416167, "epoch": 5014} {"train_loss": -26.394134521484375, "global_step": 416168, "epoch": 5014} {"train_loss": -26.32858657836914, "global_step": 416169, "epoch": 5014} {"train_loss": -26.315221786499023, "global_step": 416170, "epoch": 5014} {"train_loss": -26.341352462768555, "global_step": 416171, "epoch": 5014} {"train_loss": -26.48785972595215, "global_step": 416172, "epoch": 5014} {"train_loss": -26.46112060546875, "global_step": 416173, "epoch": 5014} {"train_loss": -26.186094284057617, "global_step": 416174, "epoch": 5014} {"train_loss": -26.2600154876709, "global_step": 416175, "epoch": 5014} {"train_loss": -26.539648056030273, "global_step": 416176, "epoch": 5014} {"train_loss": -26.29673194885254, "global_step": 416177, "epoch": 5014} {"train_loss": -26.680999755859375, "global_step": 416178, "epoch": 5014} {"train_loss": -26.612079620361328, "global_step": 416179, "epoch": 5014} {"train_loss": -26.448211669921875, "global_step": 416180, "epoch": 5014} {"train_loss": -26.420032501220703, "global_step": 416181, "epoch": 5014} {"train_loss": -27.091062545776367, "global_step": 416182, "epoch": 5014} {"train_loss": -26.76348876953125, "global_step": 416183, "epoch": 5014} {"train_loss": -27.15815544128418, "global_step": 416184, "epoch": 5014} {"train_loss": -26.548187255859375, "global_step": 416185, "epoch": 5014} {"train_loss": -26.71856689453125, "global_step": 416186, "epoch": 5014} {"train_loss": -26.528762817382812, "global_step": 416187, "epoch": 5014} {"train_loss": -26.8316593170166, "global_step": 416188, "epoch": 5014} {"train_loss": -26.67445945739746, "global_step": 416189, "epoch": 5014} {"train_loss": -26.6639347076416, "global_step": 416190, "epoch": 5014} {"train_loss": -26.802122116088867, "global_step": 416191, "epoch": 5014} {"train_loss": -26.899709701538086, "global_step": 416192, "epoch": 5014} {"train_loss": -26.770111083984375, "global_step": 416193, "epoch": 5014} {"train_loss": -26.800216674804688, "global_step": 416194, "epoch": 5014} {"train_loss": -26.625234603881836, "global_step": 416195, "epoch": 5014} {"train_loss": -26.95162010192871, "global_step": 416196, "epoch": 5014} {"train_loss": -26.81441307067871, "global_step": 416197, "epoch": 5014} {"train_loss": -26.93023109436035, "global_step": 416198, "epoch": 5014} {"train_loss": -27.149524688720703, "global_step": 416199, "epoch": 5014} {"train_loss": -26.873926162719727, "global_step": 416200, "epoch": 5014} {"train_loss": -26.86539077758789, "global_step": 416201, "epoch": 5014} {"train_loss": -26.67452049255371, "global_step": 416202, "epoch": 5014} {"train_loss": -26.886831283569336, "global_step": 416203, "epoch": 5014} {"train_loss": -27.10874366760254, "global_step": 416204, "epoch": 5014} {"train_loss": -27.0689640045166, "global_step": 416205, "epoch": 5014} {"train_loss": -26.78862953186035, "global_step": 416206, "epoch": 5014} {"train_loss": -27.079877853393555, "global_step": 416207, "epoch": 5014} {"train_loss": -27.0246524810791, "global_step": 416208, "epoch": 5014} {"train_loss": -26.8392333984375, "global_step": 416209, "epoch": 5014} {"train_loss": -27.026090621948242, "global_step": 416210, "epoch": 5014} {"train_loss": -26.982614517211914, "global_step": 416211, "epoch": 5014} {"train_loss": -27.02802085876465, "global_step": 416212, "epoch": 5014} {"train_loss": -26.885223388671875, "global_step": 416213, "epoch": 5014} {"train_loss": -26.965961456298828, "global_step": 416214, "epoch": 5014} {"train_loss": -26.579843521118164, "global_step": 416215, "epoch": 5014} {"train_loss": -26.853952407836914, "global_step": 416216, "epoch": 5014} {"train_loss": -26.614917755126953, "global_step": 416217, "epoch": 5014} {"train_loss": -27.028045654296875, "global_step": 416218, "epoch": 5014} {"train_loss": -26.734771728515625, "global_step": 416219, "epoch": 5014} {"train_loss": -26.84427261352539, "global_step": 416220, "epoch": 5014} {"train_loss": -26.88275718688965, "global_step": 416221, "epoch": 5014} {"train_loss": -26.390668869018555, "global_step": 416222, "epoch": 5014} {"train_loss": -26.463226318359375, "global_step": 416223, "epoch": 5014} {"train_loss": -26.79315185546875, "global_step": 416224, "epoch": 5014} {"train_loss": -26.851953506469727, "global_step": 416225, "epoch": 5014} {"train_loss": -26.38248062133789, "global_step": 416226, "epoch": 5014} {"train_loss": -27.175662994384766, "global_step": 416227, "epoch": 5014} {"train_loss": -26.511032104492188, "global_step": 416228, "epoch": 5014} {"train_loss": -26.5642147064209, "global_step": 416229, "epoch": 5014} {"train_loss": -26.9758358001709, "global_step": 416230, "epoch": 5014} {"train_loss": -26.29850196838379, "global_step": 416231, "epoch": 5014} {"train_loss": -26.634632110595703, "global_step": 416232, "epoch": 5014} {"train_loss": -26.491653442382812, "global_step": 416233, "epoch": 5014} {"train_loss": -26.740720748901367, "global_step": 416234, "epoch": 5014} {"train_loss": -26.9945011138916, "global_step": 416235, "epoch": 5014} {"train_loss": -26.785953521728516, "global_step": 416236, "epoch": 5014} {"train_loss": -26.427122116088867, "global_step": 416237, "epoch": 5014} {"train_loss": -26.4231014251709, "global_step": 416238, "epoch": 5014} {"train_loss": -26.705053329467773, "global_step": 416239, "epoch": 5014} {"train_loss": -26.552209854125977, "global_step": 416240, "epoch": 5014} {"train_loss": -26.26025390625, "global_step": 416241, "epoch": 5014} {"train_loss": -26.4063663482666, "global_step": 416242, "epoch": 5014} {"train_loss": -26.650129318237305, "global_step": 416243, "epoch": 5014} {"train_loss": -26.650683621326124, "global_step": 416244, "epoch": 5014, "val_loss": 6525500.0} {"train_loss": -25.820520401000977, "global_step": 416245, "epoch": 5015} {"train_loss": -25.830671310424805, "global_step": 416246, "epoch": 5015} {"train_loss": -25.830411911010742, "global_step": 416247, "epoch": 5015} {"train_loss": -26.283859252929688, "global_step": 416248, "epoch": 5015} {"train_loss": -25.572900772094727, "global_step": 416249, "epoch": 5015} {"train_loss": -26.702268600463867, "global_step": 416250, "epoch": 5015} {"train_loss": -25.69170570373535, "global_step": 416251, "epoch": 5015} {"train_loss": -25.6292781829834, "global_step": 416252, "epoch": 5015} {"train_loss": -25.914875030517578, "global_step": 416253, "epoch": 5015} {"train_loss": -25.766103744506836, "global_step": 416254, "epoch": 5015} {"train_loss": -26.231863021850586, "global_step": 416255, "epoch": 5015} {"train_loss": -25.889541625976562, "global_step": 416256, "epoch": 5015} {"train_loss": -25.867572784423828, "global_step": 416257, "epoch": 5015} {"train_loss": -26.09864616394043, "global_step": 416258, "epoch": 5015} {"train_loss": -26.566482543945312, "global_step": 416259, "epoch": 5015} {"train_loss": -25.9168758392334, "global_step": 416260, "epoch": 5015} {"train_loss": -26.464841842651367, "global_step": 416261, "epoch": 5015} {"train_loss": -26.279184341430664, "global_step": 416262, "epoch": 5015} {"train_loss": -26.4754581451416, "global_step": 416263, "epoch": 5015} {"train_loss": -26.556690216064453, "global_step": 416264, "epoch": 5015} {"train_loss": -26.28468132019043, "global_step": 416265, "epoch": 5015} {"train_loss": -26.56709098815918, "global_step": 416266, "epoch": 5015} {"train_loss": -26.54231071472168, "global_step": 416267, "epoch": 5015} {"train_loss": -26.629749298095703, "global_step": 416268, "epoch": 5015} {"train_loss": -26.411657333374023, "global_step": 416269, "epoch": 5015} {"train_loss": -26.55072593688965, "global_step": 416270, "epoch": 5015} {"train_loss": -26.672544479370117, "global_step": 416271, "epoch": 5015} {"train_loss": -26.69927978515625, "global_step": 416272, "epoch": 5015} {"train_loss": -26.424081802368164, "global_step": 416273, "epoch": 5015} {"train_loss": -26.807559967041016, "global_step": 416274, "epoch": 5015} {"train_loss": -26.545352935791016, "global_step": 416275, "epoch": 5015} {"train_loss": -26.762765884399414, "global_step": 416276, "epoch": 5015} {"train_loss": -26.88783836364746, "global_step": 416277, "epoch": 5015} {"train_loss": -27.0910587310791, "global_step": 416278, "epoch": 5015} {"train_loss": -26.799060821533203, "global_step": 416279, "epoch": 5015} {"train_loss": -26.851903915405273, "global_step": 416280, "epoch": 5015} {"train_loss": -26.837860107421875, "global_step": 416281, "epoch": 5015} {"train_loss": -26.831390380859375, "global_step": 416282, "epoch": 5015} {"train_loss": -26.912628173828125, "global_step": 416283, "epoch": 5015} {"train_loss": -26.408435821533203, "global_step": 416284, "epoch": 5015} {"train_loss": -26.73728370666504, "global_step": 416285, "epoch": 5015} {"train_loss": -26.46565055847168, "global_step": 416286, "epoch": 5015} {"train_loss": -26.758991241455078, "global_step": 416287, "epoch": 5015} {"train_loss": -27.18765640258789, "global_step": 416288, "epoch": 5015} {"train_loss": -26.844343185424805, "global_step": 416289, "epoch": 5015} {"train_loss": -26.685266494750977, "global_step": 416290, "epoch": 5015} {"train_loss": -26.533727645874023, "global_step": 416291, "epoch": 5015} {"train_loss": -26.820032119750977, "global_step": 416292, "epoch": 5015} {"train_loss": -26.50921058654785, "global_step": 416293, "epoch": 5015} {"train_loss": -26.675073623657227, "global_step": 416294, "epoch": 5015} {"train_loss": -26.79099464416504, "global_step": 416295, "epoch": 5015} {"train_loss": -26.630346298217773, "global_step": 416296, "epoch": 5015} {"train_loss": -26.371301651000977, "global_step": 416297, "epoch": 5015} {"train_loss": -26.61285400390625, "global_step": 416298, "epoch": 5015} {"train_loss": -26.486021041870117, "global_step": 416299, "epoch": 5015} {"train_loss": -26.700424194335938, "global_step": 416300, "epoch": 5015} {"train_loss": -26.610971450805664, "global_step": 416301, "epoch": 5015} {"train_loss": -26.030426025390625, "global_step": 416302, "epoch": 5015} {"train_loss": -26.4599609375, "global_step": 416303, "epoch": 5015} {"train_loss": -26.489795684814453, "global_step": 416304, "epoch": 5015} {"train_loss": -26.822345733642578, "global_step": 416305, "epoch": 5015} {"train_loss": -26.538654327392578, "global_step": 416306, "epoch": 5015} {"train_loss": -26.505064010620117, "global_step": 416307, "epoch": 5015} {"train_loss": -26.48614501953125, "global_step": 416308, "epoch": 5015} {"train_loss": -26.43560218811035, "global_step": 416309, "epoch": 5015} {"train_loss": -26.522968292236328, "global_step": 416310, "epoch": 5015} {"train_loss": -26.513813018798828, "global_step": 416311, "epoch": 5015} {"train_loss": -26.85279655456543, "global_step": 416312, "epoch": 5015} {"train_loss": -26.325021743774414, "global_step": 416313, "epoch": 5015} {"train_loss": -26.677587509155273, "global_step": 416314, "epoch": 5015} {"train_loss": -27.01209831237793, "global_step": 416315, "epoch": 5015} {"train_loss": -27.048437118530273, "global_step": 416316, "epoch": 5015} {"train_loss": -26.3336124420166, "global_step": 416317, "epoch": 5015} {"train_loss": -26.976476669311523, "global_step": 416318, "epoch": 5015} {"train_loss": -26.89578628540039, "global_step": 416319, "epoch": 5015} {"train_loss": -26.886428833007812, "global_step": 416320, "epoch": 5015} {"train_loss": -26.554906845092773, "global_step": 416321, "epoch": 5015} {"train_loss": -26.9127254486084, "global_step": 416322, "epoch": 5015} {"train_loss": -26.815204620361328, "global_step": 416323, "epoch": 5015} {"train_loss": -26.889774322509766, "global_step": 416324, "epoch": 5015} {"train_loss": -26.879919052124023, "global_step": 416325, "epoch": 5015} {"train_loss": -26.540563583374023, "global_step": 416326, "epoch": 5015} {"train_loss": -26.531902680914087, "global_step": 416327, "epoch": 5015, "val_loss": 6466165.0} {"train_loss": -26.29054832458496, "global_step": 416328, "epoch": 5016} {"train_loss": -26.266279220581055, "global_step": 416329, "epoch": 5016} {"train_loss": -26.6915225982666, "global_step": 416330, "epoch": 5016} {"train_loss": -25.88577651977539, "global_step": 416331, "epoch": 5016} {"train_loss": -26.32318115234375, "global_step": 416332, "epoch": 5016} {"train_loss": -26.77766227722168, "global_step": 416333, "epoch": 5016} {"train_loss": -26.23451805114746, "global_step": 416334, "epoch": 5016} {"train_loss": -26.364810943603516, "global_step": 416335, "epoch": 5016} {"train_loss": -26.500690460205078, "global_step": 416336, "epoch": 5016} {"train_loss": -26.834491729736328, "global_step": 416337, "epoch": 5016} {"train_loss": -26.299163818359375, "global_step": 416338, "epoch": 5016} {"train_loss": -26.619827270507812, "global_step": 416339, "epoch": 5016} {"train_loss": -26.224109649658203, "global_step": 416340, "epoch": 5016} {"train_loss": -26.357166290283203, "global_step": 416341, "epoch": 5016} {"train_loss": -26.136014938354492, "global_step": 416342, "epoch": 5016} {"train_loss": -25.96027946472168, "global_step": 416343, "epoch": 5016} {"train_loss": -26.400938034057617, "global_step": 416344, "epoch": 5016} {"train_loss": -26.426313400268555, "global_step": 416345, "epoch": 5016} {"train_loss": -26.64353370666504, "global_step": 416346, "epoch": 5016} {"train_loss": -26.360769271850586, "global_step": 416347, "epoch": 5016} {"train_loss": -26.37237548828125, "global_step": 416348, "epoch": 5016} {"train_loss": -26.65608787536621, "global_step": 416349, "epoch": 5016} {"train_loss": -26.5628719329834, "global_step": 416350, "epoch": 5016} {"train_loss": -26.642822265625, "global_step": 416351, "epoch": 5016} {"train_loss": -26.93132972717285, "global_step": 416352, "epoch": 5016} {"train_loss": -26.486454010009766, "global_step": 416353, "epoch": 5016} {"train_loss": -26.805191040039062, "global_step": 416354, "epoch": 5016} {"train_loss": -26.660888671875, "global_step": 416355, "epoch": 5016} {"train_loss": -26.687210083007812, "global_step": 416356, "epoch": 5016} {"train_loss": -26.8198299407959, "global_step": 416357, "epoch": 5016} {"train_loss": -26.6280517578125, "global_step": 416358, "epoch": 5016} {"train_loss": -26.863840103149414, "global_step": 416359, "epoch": 5016} {"train_loss": -26.733966827392578, "global_step": 416360, "epoch": 5016} {"train_loss": -26.6544246673584, "global_step": 416361, "epoch": 5016} {"train_loss": -26.701032638549805, "global_step": 416362, "epoch": 5016} {"train_loss": -27.03568458557129, "global_step": 416363, "epoch": 5016} {"train_loss": -26.949010848999023, "global_step": 416364, "epoch": 5016} {"train_loss": -26.914846420288086, "global_step": 416365, "epoch": 5016} {"train_loss": -26.68877601623535, "global_step": 416366, "epoch": 5016} {"train_loss": -27.08466148376465, "global_step": 416367, "epoch": 5016} {"train_loss": -27.206151962280273, "global_step": 416368, "epoch": 5016} {"train_loss": -27.01211929321289, "global_step": 416369, "epoch": 5016} {"train_loss": -26.725250244140625, "global_step": 416370, "epoch": 5016} {"train_loss": -26.771997451782227, "global_step": 416371, "epoch": 5016} {"train_loss": -26.93244743347168, "global_step": 416372, "epoch": 5016} {"train_loss": -26.355274200439453, "global_step": 416373, "epoch": 5016} {"train_loss": -26.974084854125977, "global_step": 416374, "epoch": 5016} {"train_loss": -27.236013412475586, "global_step": 416375, "epoch": 5016} {"train_loss": -26.841169357299805, "global_step": 416376, "epoch": 5016} {"train_loss": -26.83125877380371, "global_step": 416377, "epoch": 5016} {"train_loss": -26.9881649017334, "global_step": 416378, "epoch": 5016} {"train_loss": -26.3170108795166, "global_step": 416379, "epoch": 5016} {"train_loss": -26.922819137573242, "global_step": 416380, "epoch": 5016} {"train_loss": -26.797277450561523, "global_step": 416381, "epoch": 5016} {"train_loss": -26.619348526000977, "global_step": 416382, "epoch": 5016} {"train_loss": -26.923908233642578, "global_step": 416383, "epoch": 5016} {"train_loss": -26.611881256103516, "global_step": 416384, "epoch": 5016} {"train_loss": -26.764663696289062, "global_step": 416385, "epoch": 5016} {"train_loss": -26.48664665222168, "global_step": 416386, "epoch": 5016} {"train_loss": -26.257307052612305, "global_step": 416387, "epoch": 5016} {"train_loss": -27.1219425201416, "global_step": 416388, "epoch": 5016} {"train_loss": -26.504852294921875, "global_step": 416389, "epoch": 5016} {"train_loss": -25.868865966796875, "global_step": 416390, "epoch": 5016} {"train_loss": -26.618452072143555, "global_step": 416391, "epoch": 5016} {"train_loss": -26.45989990234375, "global_step": 416392, "epoch": 5016} {"train_loss": -26.38848876953125, "global_step": 416393, "epoch": 5016} {"train_loss": -26.233596801757812, "global_step": 416394, "epoch": 5016} {"train_loss": -26.545013427734375, "global_step": 416395, "epoch": 5016} {"train_loss": -26.46656608581543, "global_step": 416396, "epoch": 5016} {"train_loss": -26.739166259765625, "global_step": 416397, "epoch": 5016} {"train_loss": -26.72730827331543, "global_step": 416398, "epoch": 5016} {"train_loss": -26.692594528198242, "global_step": 416399, "epoch": 5016} {"train_loss": -26.636457443237305, "global_step": 416400, "epoch": 5016} {"train_loss": -26.583837509155273, "global_step": 416401, "epoch": 5016} {"train_loss": -26.647674560546875, "global_step": 416402, "epoch": 5016} {"train_loss": -26.703582763671875, "global_step": 416403, "epoch": 5016} {"train_loss": -26.548507690429688, "global_step": 416404, "epoch": 5016} {"train_loss": -26.594938278198242, "global_step": 416405, "epoch": 5016} {"train_loss": -26.7512264251709, "global_step": 416406, "epoch": 5016} {"train_loss": -26.95465660095215, "global_step": 416407, "epoch": 5016} {"train_loss": -26.619586944580078, "global_step": 416408, "epoch": 5016} {"train_loss": -26.98624038696289, "global_step": 416409, "epoch": 5016} {"train_loss": -26.643201345420746, "global_step": 416410, "epoch": 5016, "val_loss": 6545505.5} {"train_loss": -26.519012451171875, "global_step": 416411, "epoch": 5017} {"train_loss": -26.03139305114746, "global_step": 416412, "epoch": 5017} {"train_loss": -25.506010055541992, "global_step": 416413, "epoch": 5017} {"train_loss": -24.903491973876953, "global_step": 416414, "epoch": 5017} {"train_loss": -25.375001907348633, "global_step": 416415, "epoch": 5017} {"train_loss": -26.307331085205078, "global_step": 416416, "epoch": 5017} {"train_loss": -25.7926025390625, "global_step": 416417, "epoch": 5017} {"train_loss": -26.26679039001465, "global_step": 416418, "epoch": 5017} {"train_loss": -26.487524032592773, "global_step": 416419, "epoch": 5017} {"train_loss": -26.312580108642578, "global_step": 416420, "epoch": 5017} {"train_loss": -26.38392448425293, "global_step": 416421, "epoch": 5017} {"train_loss": -26.5311279296875, "global_step": 416422, "epoch": 5017} {"train_loss": -26.42262077331543, "global_step": 416423, "epoch": 5017} {"train_loss": -26.3676700592041, "global_step": 416424, "epoch": 5017} {"train_loss": -26.3149471282959, "global_step": 416425, "epoch": 5017} {"train_loss": -26.514301300048828, "global_step": 416426, "epoch": 5017} {"train_loss": -26.63153648376465, "global_step": 416427, "epoch": 5017} {"train_loss": -26.605741500854492, "global_step": 416428, "epoch": 5017} {"train_loss": -26.6155948638916, "global_step": 416429, "epoch": 5017} {"train_loss": -26.55959129333496, "global_step": 416430, "epoch": 5017} {"train_loss": -26.426715850830078, "global_step": 416431, "epoch": 5017} {"train_loss": -26.635278701782227, "global_step": 416432, "epoch": 5017} {"train_loss": -26.664464950561523, "global_step": 416433, "epoch": 5017} {"train_loss": -26.25970458984375, "global_step": 416434, "epoch": 5017} {"train_loss": -26.560850143432617, "global_step": 416435, "epoch": 5017} {"train_loss": -26.732986450195312, "global_step": 416436, "epoch": 5017} {"train_loss": -26.794218063354492, "global_step": 416437, "epoch": 5017} {"train_loss": -26.906131744384766, "global_step": 416438, "epoch": 5017} {"train_loss": -26.969369888305664, "global_step": 416439, "epoch": 5017} {"train_loss": -26.593976974487305, "global_step": 416440, "epoch": 5017} {"train_loss": -26.685382843017578, "global_step": 416441, "epoch": 5017} {"train_loss": -26.593969345092773, "global_step": 416442, "epoch": 5017} {"train_loss": -26.935224533081055, "global_step": 416443, "epoch": 5017} {"train_loss": -26.689523696899414, "global_step": 416444, "epoch": 5017} {"train_loss": -26.667449951171875, "global_step": 416445, "epoch": 5017} {"train_loss": -27.205524444580078, "global_step": 416446, "epoch": 5017} {"train_loss": -27.14474868774414, "global_step": 416447, "epoch": 5017} {"train_loss": -26.499195098876953, "global_step": 416448, "epoch": 5017} {"train_loss": -26.7348575592041, "global_step": 416449, "epoch": 5017} {"train_loss": -26.87699317932129, "global_step": 416450, "epoch": 5017} {"train_loss": -26.998388290405273, "global_step": 416451, "epoch": 5017} {"train_loss": -26.857563018798828, "global_step": 416452, "epoch": 5017} {"train_loss": -26.899377822875977, "global_step": 416453, "epoch": 5017} {"train_loss": -26.726394653320312, "global_step": 416454, "epoch": 5017} {"train_loss": -26.96644401550293, "global_step": 416455, "epoch": 5017} {"train_loss": -26.457239151000977, "global_step": 416456, "epoch": 5017} {"train_loss": -26.21632194519043, "global_step": 416457, "epoch": 5017} {"train_loss": -26.3487606048584, "global_step": 416458, "epoch": 5017} {"train_loss": -26.36493492126465, "global_step": 416459, "epoch": 5017} {"train_loss": -26.879812240600586, "global_step": 416460, "epoch": 5017} {"train_loss": -26.86207389831543, "global_step": 416461, "epoch": 5017} {"train_loss": -26.4466552734375, "global_step": 416462, "epoch": 5017} {"train_loss": -26.8716983795166, "global_step": 416463, "epoch": 5017} {"train_loss": -26.43603515625, "global_step": 416464, "epoch": 5017} {"train_loss": -26.76416015625, "global_step": 416465, "epoch": 5017} {"train_loss": -26.99366569519043, "global_step": 416466, "epoch": 5017} {"train_loss": -26.82581901550293, "global_step": 416467, "epoch": 5017} {"train_loss": -27.000410079956055, "global_step": 416468, "epoch": 5017} {"train_loss": -26.92144775390625, "global_step": 416469, "epoch": 5017} {"train_loss": -26.89216423034668, "global_step": 416470, "epoch": 5017} {"train_loss": -26.842321395874023, "global_step": 416471, "epoch": 5017} {"train_loss": -26.84834098815918, "global_step": 416472, "epoch": 5017} {"train_loss": -26.8168888092041, "global_step": 416473, "epoch": 5017} {"train_loss": -26.65000343322754, "global_step": 416474, "epoch": 5017} {"train_loss": -26.657873153686523, "global_step": 416475, "epoch": 5017} {"train_loss": -26.788162231445312, "global_step": 416476, "epoch": 5017} {"train_loss": -26.351837158203125, "global_step": 416477, "epoch": 5017} {"train_loss": -26.955490112304688, "global_step": 416478, "epoch": 5017} {"train_loss": -26.965106964111328, "global_step": 416479, "epoch": 5017} {"train_loss": -26.74496841430664, "global_step": 416480, "epoch": 5017} {"train_loss": -26.862213134765625, "global_step": 416481, "epoch": 5017} {"train_loss": -26.464481353759766, "global_step": 416482, "epoch": 5017} {"train_loss": -26.684249877929688, "global_step": 416483, "epoch": 5017} {"train_loss": -26.35816764831543, "global_step": 416484, "epoch": 5017} {"train_loss": -26.74104118347168, "global_step": 416485, "epoch": 5017} {"train_loss": -26.72186279296875, "global_step": 416486, "epoch": 5017} {"train_loss": -26.824661254882812, "global_step": 416487, "epoch": 5017} {"train_loss": -26.31489372253418, "global_step": 416488, "epoch": 5017} {"train_loss": -26.80160903930664, "global_step": 416489, "epoch": 5017} {"train_loss": -26.684484481811523, "global_step": 416490, "epoch": 5017} {"train_loss": -26.87660026550293, "global_step": 416491, "epoch": 5017} {"train_loss": -26.7410888671875, "global_step": 416492, "epoch": 5017} {"train_loss": -26.608899311846997, "global_step": 416493, "epoch": 5017, "val_loss": 6550441.0} {"train_loss": -25.863906860351562, "global_step": 416494, "epoch": 5018} {"train_loss": -26.277057647705078, "global_step": 416495, "epoch": 5018} {"train_loss": -26.23615837097168, "global_step": 416496, "epoch": 5018} {"train_loss": -26.3862247467041, "global_step": 416497, "epoch": 5018} {"train_loss": -25.82246208190918, "global_step": 416498, "epoch": 5018} {"train_loss": -25.920307159423828, "global_step": 416499, "epoch": 5018} {"train_loss": -25.514570236206055, "global_step": 416500, "epoch": 5018} {"train_loss": -26.567197799682617, "global_step": 416501, "epoch": 5018} {"train_loss": -26.130722045898438, "global_step": 416502, "epoch": 5018} {"train_loss": -25.892871856689453, "global_step": 416503, "epoch": 5018} {"train_loss": -25.5471248626709, "global_step": 416504, "epoch": 5018} {"train_loss": -26.332477569580078, "global_step": 416505, "epoch": 5018} {"train_loss": -26.19208335876465, "global_step": 416506, "epoch": 5018} {"train_loss": -26.11244010925293, "global_step": 416507, "epoch": 5018} {"train_loss": -26.13657569885254, "global_step": 416508, "epoch": 5018} {"train_loss": -26.2941837310791, "global_step": 416509, "epoch": 5018} {"train_loss": -26.155797958374023, "global_step": 416510, "epoch": 5018} {"train_loss": -26.287200927734375, "global_step": 416511, "epoch": 5018} {"train_loss": -26.505023956298828, "global_step": 416512, "epoch": 5018} {"train_loss": -26.349592208862305, "global_step": 416513, "epoch": 5018} {"train_loss": -26.493289947509766, "global_step": 416514, "epoch": 5018} {"train_loss": -26.534687042236328, "global_step": 416515, "epoch": 5018} {"train_loss": -26.481292724609375, "global_step": 416516, "epoch": 5018} {"train_loss": -26.495996475219727, "global_step": 416517, "epoch": 5018} {"train_loss": -26.53315544128418, "global_step": 416518, "epoch": 5018} {"train_loss": -26.295093536376953, "global_step": 416519, "epoch": 5018} {"train_loss": -26.56572914123535, "global_step": 416520, "epoch": 5018} {"train_loss": -26.327167510986328, "global_step": 416521, "epoch": 5018} {"train_loss": -26.74967384338379, "global_step": 416522, "epoch": 5018} {"train_loss": -26.72694206237793, "global_step": 416523, "epoch": 5018} {"train_loss": -27.280838012695312, "global_step": 416524, "epoch": 5018} {"train_loss": -26.914569854736328, "global_step": 416525, "epoch": 5018} {"train_loss": -26.636098861694336, "global_step": 416526, "epoch": 5018} {"train_loss": -26.97859001159668, "global_step": 416527, "epoch": 5018} {"train_loss": -26.48249626159668, "global_step": 416528, "epoch": 5018} {"train_loss": -26.823083877563477, "global_step": 416529, "epoch": 5018} {"train_loss": -26.471357345581055, "global_step": 416530, "epoch": 5018} {"train_loss": -26.66377067565918, "global_step": 416531, "epoch": 5018} {"train_loss": -26.9393310546875, "global_step": 416532, "epoch": 5018} {"train_loss": -26.7983341217041, "global_step": 416533, "epoch": 5018} {"train_loss": -26.993417739868164, "global_step": 416534, "epoch": 5018} {"train_loss": -26.80289649963379, "global_step": 416535, "epoch": 5018} {"train_loss": -26.744794845581055, "global_step": 416536, "epoch": 5018} {"train_loss": -26.606403350830078, "global_step": 416537, "epoch": 5018} {"train_loss": -26.906225204467773, "global_step": 416538, "epoch": 5018} {"train_loss": -26.943954467773438, "global_step": 416539, "epoch": 5018} {"train_loss": -27.031591415405273, "global_step": 416540, "epoch": 5018} {"train_loss": -26.965564727783203, "global_step": 416541, "epoch": 5018} {"train_loss": -27.158878326416016, "global_step": 416542, "epoch": 5018} {"train_loss": -26.709814071655273, "global_step": 416543, "epoch": 5018} {"train_loss": -27.33270835876465, "global_step": 416544, "epoch": 5018} {"train_loss": -27.226877212524414, "global_step": 416545, "epoch": 5018} {"train_loss": -26.92347526550293, "global_step": 416546, "epoch": 5018} {"train_loss": -27.02298927307129, "global_step": 416547, "epoch": 5018} {"train_loss": -27.267414093017578, "global_step": 416548, "epoch": 5018} {"train_loss": -26.64212417602539, "global_step": 416549, "epoch": 5018} {"train_loss": -26.444766998291016, "global_step": 416550, "epoch": 5018} {"train_loss": -26.633045196533203, "global_step": 416551, "epoch": 5018} {"train_loss": -26.64679527282715, "global_step": 416552, "epoch": 5018} {"train_loss": -26.438949584960938, "global_step": 416553, "epoch": 5018} {"train_loss": -26.296796798706055, "global_step": 416554, "epoch": 5018} {"train_loss": -26.807037353515625, "global_step": 416555, "epoch": 5018} {"train_loss": -26.69045066833496, "global_step": 416556, "epoch": 5018} {"train_loss": -26.669910430908203, "global_step": 416557, "epoch": 5018} {"train_loss": -26.246322631835938, "global_step": 416558, "epoch": 5018} {"train_loss": -27.08185386657715, "global_step": 416559, "epoch": 5018} {"train_loss": -26.947534561157227, "global_step": 416560, "epoch": 5018} {"train_loss": -26.646163940429688, "global_step": 416561, "epoch": 5018} {"train_loss": -26.790760040283203, "global_step": 416562, "epoch": 5018} {"train_loss": -26.790212631225586, "global_step": 416563, "epoch": 5018} {"train_loss": -26.710037231445312, "global_step": 416564, "epoch": 5018} {"train_loss": -26.90118408203125, "global_step": 416565, "epoch": 5018} {"train_loss": -27.02919578552246, "global_step": 416566, "epoch": 5018} {"train_loss": -27.068246841430664, "global_step": 416567, "epoch": 5018} {"train_loss": -27.324451446533203, "global_step": 416568, "epoch": 5018} {"train_loss": -26.938024520874023, "global_step": 416569, "epoch": 5018} {"train_loss": -27.016342163085938, "global_step": 416570, "epoch": 5018} {"train_loss": -26.77631950378418, "global_step": 416571, "epoch": 5018} {"train_loss": -27.12418556213379, "global_step": 416572, "epoch": 5018} {"train_loss": -26.702024459838867, "global_step": 416573, "epoch": 5018} {"train_loss": -26.840787887573242, "global_step": 416574, "epoch": 5018} {"train_loss": -26.683929443359375, "global_step": 416575, "epoch": 5018} {"train_loss": -26.618393955460515, "global_step": 416576, "epoch": 5018, "val_loss": 6771734.5} {"train_loss": -24.502622604370117, "global_step": 416577, "epoch": 5019} {"train_loss": -22.624969482421875, "global_step": 416578, "epoch": 5019} {"train_loss": -23.907739639282227, "global_step": 416579, "epoch": 5019} {"train_loss": -24.08511734008789, "global_step": 416580, "epoch": 5019} {"train_loss": -23.7038631439209, "global_step": 416581, "epoch": 5019} {"train_loss": -25.33987045288086, "global_step": 416582, "epoch": 5019} {"train_loss": -24.962839126586914, "global_step": 416583, "epoch": 5019} {"train_loss": -24.741727828979492, "global_step": 416584, "epoch": 5019} {"train_loss": -25.487878799438477, "global_step": 416585, "epoch": 5019} {"train_loss": -25.561927795410156, "global_step": 416586, "epoch": 5019} {"train_loss": -25.281293869018555, "global_step": 416587, "epoch": 5019} {"train_loss": -25.20248031616211, "global_step": 416588, "epoch": 5019} {"train_loss": -25.41547203063965, "global_step": 416589, "epoch": 5019} {"train_loss": -25.18440818786621, "global_step": 416590, "epoch": 5019} {"train_loss": -25.744977951049805, "global_step": 416591, "epoch": 5019} {"train_loss": -25.866331100463867, "global_step": 416592, "epoch": 5019} {"train_loss": -25.35239028930664, "global_step": 416593, "epoch": 5019} {"train_loss": -25.629602432250977, "global_step": 416594, "epoch": 5019} {"train_loss": -25.769245147705078, "global_step": 416595, "epoch": 5019} {"train_loss": -25.943470001220703, "global_step": 416596, "epoch": 5019} {"train_loss": -25.9858341217041, "global_step": 416597, "epoch": 5019} {"train_loss": -25.874683380126953, "global_step": 416598, "epoch": 5019} {"train_loss": -25.7889461517334, "global_step": 416599, "epoch": 5019} {"train_loss": -25.724720001220703, "global_step": 416600, "epoch": 5019} {"train_loss": -25.728137969970703, "global_step": 416601, "epoch": 5019} {"train_loss": -26.259246826171875, "global_step": 416602, "epoch": 5019} {"train_loss": -26.090747833251953, "global_step": 416603, "epoch": 5019} {"train_loss": -26.239347457885742, "global_step": 416604, "epoch": 5019} {"train_loss": -26.034635543823242, "global_step": 416605, "epoch": 5019} {"train_loss": -25.9819278717041, "global_step": 416606, "epoch": 5019} {"train_loss": -26.0731143951416, "global_step": 416607, "epoch": 5019} {"train_loss": -26.369155883789062, "global_step": 416608, "epoch": 5019} {"train_loss": -26.230865478515625, "global_step": 416609, "epoch": 5019} {"train_loss": -25.9818058013916, "global_step": 416610, "epoch": 5019} {"train_loss": -26.58260154724121, "global_step": 416611, "epoch": 5019} {"train_loss": -26.224599838256836, "global_step": 416612, "epoch": 5019} {"train_loss": -26.450515747070312, "global_step": 416613, "epoch": 5019} {"train_loss": -26.46012306213379, "global_step": 416614, "epoch": 5019} {"train_loss": -26.501073837280273, "global_step": 416615, "epoch": 5019} {"train_loss": -26.055007934570312, "global_step": 416616, "epoch": 5019} {"train_loss": -26.33017921447754, "global_step": 416617, "epoch": 5019} {"train_loss": -26.67191505432129, "global_step": 416618, "epoch": 5019} {"train_loss": -26.45172119140625, "global_step": 416619, "epoch": 5019} {"train_loss": -26.247241973876953, "global_step": 416620, "epoch": 5019} {"train_loss": -26.89217185974121, "global_step": 416621, "epoch": 5019} {"train_loss": -26.20415687561035, "global_step": 416622, "epoch": 5019} {"train_loss": -26.71170997619629, "global_step": 416623, "epoch": 5019} {"train_loss": -26.90961265563965, "global_step": 416624, "epoch": 5019} {"train_loss": -26.439016342163086, "global_step": 416625, "epoch": 5019} {"train_loss": -26.79835319519043, "global_step": 416626, "epoch": 5019} {"train_loss": -26.706256866455078, "global_step": 416627, "epoch": 5019} {"train_loss": -26.519113540649414, "global_step": 416628, "epoch": 5019} {"train_loss": -26.92864418029785, "global_step": 416629, "epoch": 5019} {"train_loss": -26.990888595581055, "global_step": 416630, "epoch": 5019} {"train_loss": -26.416547775268555, "global_step": 416631, "epoch": 5019} {"train_loss": -26.620676040649414, "global_step": 416632, "epoch": 5019} {"train_loss": -26.790958404541016, "global_step": 416633, "epoch": 5019} {"train_loss": -27.032026290893555, "global_step": 416634, "epoch": 5019} {"train_loss": -27.30889320373535, "global_step": 416635, "epoch": 5019} {"train_loss": -26.842493057250977, "global_step": 416636, "epoch": 5019} {"train_loss": -26.661558151245117, "global_step": 416637, "epoch": 5019} {"train_loss": -26.516599655151367, "global_step": 416638, "epoch": 5019} {"train_loss": -26.508703231811523, "global_step": 416639, "epoch": 5019} {"train_loss": -26.82191276550293, "global_step": 416640, "epoch": 5019} {"train_loss": -27.0189208984375, "global_step": 416641, "epoch": 5019} {"train_loss": -26.83624267578125, "global_step": 416642, "epoch": 5019} {"train_loss": -26.9080810546875, "global_step": 416643, "epoch": 5019} {"train_loss": -26.690916061401367, "global_step": 416644, "epoch": 5019} {"train_loss": -26.692041397094727, "global_step": 416645, "epoch": 5019} {"train_loss": -26.9144344329834, "global_step": 416646, "epoch": 5019} {"train_loss": -27.1881160736084, "global_step": 416647, "epoch": 5019} {"train_loss": -26.810644149780273, "global_step": 416648, "epoch": 5019} {"train_loss": -26.638391494750977, "global_step": 416649, "epoch": 5019} {"train_loss": -26.741464614868164, "global_step": 416650, "epoch": 5019} {"train_loss": -26.916906356811523, "global_step": 416651, "epoch": 5019} {"train_loss": -27.136383056640625, "global_step": 416652, "epoch": 5019} {"train_loss": -27.0500431060791, "global_step": 416653, "epoch": 5019} {"train_loss": -26.694538116455078, "global_step": 416654, "epoch": 5019} {"train_loss": -26.659101486206055, "global_step": 416655, "epoch": 5019} {"train_loss": -26.496082305908203, "global_step": 416656, "epoch": 5019} {"train_loss": -26.600522994995117, "global_step": 416657, "epoch": 5019} {"train_loss": -26.783838272094727, "global_step": 416658, "epoch": 5019} {"train_loss": -26.18214184404856, "global_step": 416659, "epoch": 5019, "val_loss": 6588380.0} {"train_loss": -26.015613555908203, "global_step": 416660, "epoch": 5020} {"train_loss": -24.482772827148438, "global_step": 416661, "epoch": 5020} {"train_loss": -25.11505699157715, "global_step": 416662, "epoch": 5020} {"train_loss": -25.233083724975586, "global_step": 416663, "epoch": 5020} {"train_loss": -25.595922470092773, "global_step": 416664, "epoch": 5020} {"train_loss": -26.095468521118164, "global_step": 416665, "epoch": 5020} {"train_loss": -25.277328491210938, "global_step": 416666, "epoch": 5020} {"train_loss": -25.69439125061035, "global_step": 416667, "epoch": 5020} {"train_loss": -25.890195846557617, "global_step": 416668, "epoch": 5020} {"train_loss": -26.29770851135254, "global_step": 416669, "epoch": 5020} {"train_loss": -26.248334884643555, "global_step": 416670, "epoch": 5020} {"train_loss": -25.870059967041016, "global_step": 416671, "epoch": 5020} {"train_loss": -26.277515411376953, "global_step": 416672, "epoch": 5020} {"train_loss": -25.8621826171875, "global_step": 416673, "epoch": 5020} {"train_loss": -26.164709091186523, "global_step": 416674, "epoch": 5020} {"train_loss": -26.50307273864746, "global_step": 416675, "epoch": 5020} {"train_loss": -25.963565826416016, "global_step": 416676, "epoch": 5020} {"train_loss": -26.3802433013916, "global_step": 416677, "epoch": 5020} {"train_loss": -25.936735153198242, "global_step": 416678, "epoch": 5020} {"train_loss": -26.360971450805664, "global_step": 416679, "epoch": 5020} {"train_loss": -26.388547897338867, "global_step": 416680, "epoch": 5020} {"train_loss": -25.99823570251465, "global_step": 416681, "epoch": 5020} {"train_loss": -26.65016746520996, "global_step": 416682, "epoch": 5020} {"train_loss": -26.26068687438965, "global_step": 416683, "epoch": 5020} {"train_loss": -26.592884063720703, "global_step": 416684, "epoch": 5020} {"train_loss": -26.540388107299805, "global_step": 416685, "epoch": 5020} {"train_loss": -26.44025230407715, "global_step": 416686, "epoch": 5020} {"train_loss": -26.774473190307617, "global_step": 416687, "epoch": 5020} {"train_loss": -26.473974227905273, "global_step": 416688, "epoch": 5020} {"train_loss": -26.527301788330078, "global_step": 416689, "epoch": 5020} {"train_loss": -26.615924835205078, "global_step": 416690, "epoch": 5020} {"train_loss": -26.3721866607666, "global_step": 416691, "epoch": 5020} {"train_loss": -26.953887939453125, "global_step": 416692, "epoch": 5020} {"train_loss": -26.58246421813965, "global_step": 416693, "epoch": 5020} {"train_loss": -26.804288864135742, "global_step": 416694, "epoch": 5020} {"train_loss": -26.48695182800293, "global_step": 416695, "epoch": 5020} {"train_loss": -26.65570068359375, "global_step": 416696, "epoch": 5020} {"train_loss": -26.691043853759766, "global_step": 416697, "epoch": 5020} {"train_loss": -26.596227645874023, "global_step": 416698, "epoch": 5020} {"train_loss": -26.740619659423828, "global_step": 416699, "epoch": 5020} {"train_loss": -26.72098159790039, "global_step": 416700, "epoch": 5020} {"train_loss": -26.76885986328125, "global_step": 416701, "epoch": 5020} {"train_loss": -26.631916046142578, "global_step": 416702, "epoch": 5020} {"train_loss": -26.830198287963867, "global_step": 416703, "epoch": 5020} {"train_loss": -26.810632705688477, "global_step": 416704, "epoch": 5020} {"train_loss": -27.214162826538086, "global_step": 416705, "epoch": 5020} {"train_loss": -27.025894165039062, "global_step": 416706, "epoch": 5020} {"train_loss": -26.743579864501953, "global_step": 416707, "epoch": 5020} {"train_loss": -26.741851806640625, "global_step": 416708, "epoch": 5020} {"train_loss": -26.783252716064453, "global_step": 416709, "epoch": 5020} {"train_loss": -26.524200439453125, "global_step": 416710, "epoch": 5020} {"train_loss": -26.76728630065918, "global_step": 416711, "epoch": 5020} {"train_loss": -26.902374267578125, "global_step": 416712, "epoch": 5020} {"train_loss": -26.945026397705078, "global_step": 416713, "epoch": 5020} {"train_loss": -27.25269889831543, "global_step": 416714, "epoch": 5020} {"train_loss": -26.94561767578125, "global_step": 416715, "epoch": 5020} {"train_loss": -27.08564567565918, "global_step": 416716, "epoch": 5020} {"train_loss": -26.85137367248535, "global_step": 416717, "epoch": 5020} {"train_loss": -26.750471115112305, "global_step": 416718, "epoch": 5020} {"train_loss": -26.867618560791016, "global_step": 416719, "epoch": 5020} {"train_loss": -26.62250328063965, "global_step": 416720, "epoch": 5020} {"train_loss": -26.66206169128418, "global_step": 416721, "epoch": 5020} {"train_loss": -26.781024932861328, "global_step": 416722, "epoch": 5020} {"train_loss": -26.83600425720215, "global_step": 416723, "epoch": 5020} {"train_loss": -26.904926300048828, "global_step": 416724, "epoch": 5020} {"train_loss": -26.63455581665039, "global_step": 416725, "epoch": 5020} {"train_loss": -26.684955596923828, "global_step": 416726, "epoch": 5020} {"train_loss": -26.886682510375977, "global_step": 416727, "epoch": 5020} {"train_loss": -26.978418350219727, "global_step": 416728, "epoch": 5020} {"train_loss": -26.896835327148438, "global_step": 416729, "epoch": 5020} {"train_loss": -26.603988647460938, "global_step": 416730, "epoch": 5020} {"train_loss": -26.883752822875977, "global_step": 416731, "epoch": 5020} {"train_loss": -26.433053970336914, "global_step": 416732, "epoch": 5020} {"train_loss": -26.65777587890625, "global_step": 416733, "epoch": 5020} {"train_loss": -27.19000816345215, "global_step": 416734, "epoch": 5020} {"train_loss": -26.648359298706055, "global_step": 416735, "epoch": 5020} {"train_loss": -26.690372467041016, "global_step": 416736, "epoch": 5020} {"train_loss": -26.75058937072754, "global_step": 416737, "epoch": 5020} {"train_loss": -26.290815353393555, "global_step": 416738, "epoch": 5020} {"train_loss": -26.6788272857666, "global_step": 416739, "epoch": 5020} {"train_loss": -26.824085235595703, "global_step": 416740, "epoch": 5020} {"train_loss": -26.591938018798828, "global_step": 416741, "epoch": 5020} {"train_loss": -26.520349019981293, "global_step": 416742, "epoch": 5020, "val_loss": 6675717.0} {"train_loss": -26.438634872436523, "global_step": 416743, "epoch": 5021} {"train_loss": -26.35104751586914, "global_step": 416744, "epoch": 5021} {"train_loss": -26.596044540405273, "global_step": 416745, "epoch": 5021} {"train_loss": -26.057783126831055, "global_step": 416746, "epoch": 5021} {"train_loss": -25.97493553161621, "global_step": 416747, "epoch": 5021} {"train_loss": -26.163599014282227, "global_step": 416748, "epoch": 5021} {"train_loss": -26.024755477905273, "global_step": 416749, "epoch": 5021} {"train_loss": -26.185453414916992, "global_step": 416750, "epoch": 5021} {"train_loss": -26.5345458984375, "global_step": 416751, "epoch": 5021} {"train_loss": -26.30449867248535, "global_step": 416752, "epoch": 5021} {"train_loss": -26.392688751220703, "global_step": 416753, "epoch": 5021} {"train_loss": -26.332046508789062, "global_step": 416754, "epoch": 5021} {"train_loss": -26.450281143188477, "global_step": 416755, "epoch": 5021} {"train_loss": -26.246337890625, "global_step": 416756, "epoch": 5021} {"train_loss": -26.450592041015625, "global_step": 416757, "epoch": 5021} {"train_loss": -26.630340576171875, "global_step": 416758, "epoch": 5021} {"train_loss": -26.520727157592773, "global_step": 416759, "epoch": 5021} {"train_loss": -26.5598201751709, "global_step": 416760, "epoch": 5021} {"train_loss": -26.39827537536621, "global_step": 416761, "epoch": 5021} {"train_loss": -26.564533233642578, "global_step": 416762, "epoch": 5021} {"train_loss": -26.375593185424805, "global_step": 416763, "epoch": 5021} {"train_loss": -26.520742416381836, "global_step": 416764, "epoch": 5021} {"train_loss": -26.4422550201416, "global_step": 416765, "epoch": 5021} {"train_loss": -26.680377960205078, "global_step": 416766, "epoch": 5021} {"train_loss": -26.36332130432129, "global_step": 416767, "epoch": 5021} {"train_loss": -26.357208251953125, "global_step": 416768, "epoch": 5021} {"train_loss": -26.56137466430664, "global_step": 416769, "epoch": 5021} {"train_loss": -26.61345863342285, "global_step": 416770, "epoch": 5021} {"train_loss": -26.622482299804688, "global_step": 416771, "epoch": 5021} {"train_loss": -26.769819259643555, "global_step": 416772, "epoch": 5021} {"train_loss": -26.62371253967285, "global_step": 416773, "epoch": 5021} {"train_loss": -26.758255004882812, "global_step": 416774, "epoch": 5021} {"train_loss": -26.74024772644043, "global_step": 416775, "epoch": 5021} {"train_loss": -26.348865509033203, "global_step": 416776, "epoch": 5021} {"train_loss": -26.441938400268555, "global_step": 416777, "epoch": 5021} {"train_loss": -26.6175594329834, "global_step": 416778, "epoch": 5021} {"train_loss": -26.507287979125977, "global_step": 416779, "epoch": 5021} {"train_loss": -26.400653839111328, "global_step": 416780, "epoch": 5021} {"train_loss": -27.004383087158203, "global_step": 416781, "epoch": 5021} {"train_loss": -26.52618980407715, "global_step": 416782, "epoch": 5021} {"train_loss": -26.517568588256836, "global_step": 416783, "epoch": 5021} {"train_loss": -26.571874618530273, "global_step": 416784, "epoch": 5021} {"train_loss": -26.697385787963867, "global_step": 416785, "epoch": 5021} {"train_loss": -26.6039981842041, "global_step": 416786, "epoch": 5021} {"train_loss": -26.753278732299805, "global_step": 416787, "epoch": 5021} {"train_loss": -26.958505630493164, "global_step": 416788, "epoch": 5021} {"train_loss": -26.7354679107666, "global_step": 416789, "epoch": 5021} {"train_loss": -27.355194091796875, "global_step": 416790, "epoch": 5021} {"train_loss": -26.93973731994629, "global_step": 416791, "epoch": 5021} {"train_loss": -26.42999839782715, "global_step": 416792, "epoch": 5021} {"train_loss": -26.396820068359375, "global_step": 416793, "epoch": 5021} {"train_loss": -26.725250244140625, "global_step": 416794, "epoch": 5021} {"train_loss": -27.183740615844727, "global_step": 416795, "epoch": 5021} {"train_loss": -26.824844360351562, "global_step": 416796, "epoch": 5021} {"train_loss": -26.61261558532715, "global_step": 416797, "epoch": 5021} {"train_loss": -26.626989364624023, "global_step": 416798, "epoch": 5021} {"train_loss": -26.94486427307129, "global_step": 416799, "epoch": 5021} {"train_loss": -26.87153434753418, "global_step": 416800, "epoch": 5021} {"train_loss": -26.465530395507812, "global_step": 416801, "epoch": 5021} {"train_loss": -26.676044464111328, "global_step": 416802, "epoch": 5021} {"train_loss": -26.85938835144043, "global_step": 416803, "epoch": 5021} {"train_loss": -26.478168487548828, "global_step": 416804, "epoch": 5021} {"train_loss": -27.237958908081055, "global_step": 416805, "epoch": 5021} {"train_loss": -26.540678024291992, "global_step": 416806, "epoch": 5021} {"train_loss": -26.847614288330078, "global_step": 416807, "epoch": 5021} {"train_loss": -26.4420223236084, "global_step": 416808, "epoch": 5021} {"train_loss": -26.0414981842041, "global_step": 416809, "epoch": 5021} {"train_loss": -24.94831657409668, "global_step": 416810, "epoch": 5021} {"train_loss": -24.041894912719727, "global_step": 416811, "epoch": 5021} {"train_loss": -26.10660171508789, "global_step": 416812, "epoch": 5021} {"train_loss": -25.7098331451416, "global_step": 416813, "epoch": 5021} {"train_loss": -24.711660385131836, "global_step": 416814, "epoch": 5021} {"train_loss": -26.459583282470703, "global_step": 416815, "epoch": 5021} {"train_loss": -25.100309371948242, "global_step": 416816, "epoch": 5021} {"train_loss": -26.15349769592285, "global_step": 416817, "epoch": 5021} {"train_loss": -26.365650177001953, "global_step": 416818, "epoch": 5021} {"train_loss": -26.414356231689453, "global_step": 416819, "epoch": 5021} {"train_loss": -26.52640724182129, "global_step": 416820, "epoch": 5021} {"train_loss": -25.94498634338379, "global_step": 416821, "epoch": 5021} {"train_loss": -26.452253341674805, "global_step": 416822, "epoch": 5021} {"train_loss": -26.7879638671875, "global_step": 416823, "epoch": 5021} {"train_loss": -26.451887130737305, "global_step": 416824, "epoch": 5021} {"train_loss": -26.444107515266143, "global_step": 416825, "epoch": 5021, "val_loss": 6623207.5} {"train_loss": -26.083166122436523, "global_step": 416826, "epoch": 5022} {"train_loss": -26.520828247070312, "global_step": 416827, "epoch": 5022} {"train_loss": -26.136356353759766, "global_step": 416828, "epoch": 5022} {"train_loss": -25.929967880249023, "global_step": 416829, "epoch": 5022} {"train_loss": -25.909616470336914, "global_step": 416830, "epoch": 5022} {"train_loss": -25.96466064453125, "global_step": 416831, "epoch": 5022} {"train_loss": -26.361663818359375, "global_step": 416832, "epoch": 5022} {"train_loss": -26.54054832458496, "global_step": 416833, "epoch": 5022} {"train_loss": -26.168622970581055, "global_step": 416834, "epoch": 5022} {"train_loss": -26.344024658203125, "global_step": 416835, "epoch": 5022} {"train_loss": -26.3176326751709, "global_step": 416836, "epoch": 5022} {"train_loss": -25.883283615112305, "global_step": 416837, "epoch": 5022} {"train_loss": -26.214330673217773, "global_step": 416838, "epoch": 5022} {"train_loss": -26.728967666625977, "global_step": 416839, "epoch": 5022} {"train_loss": -26.346343994140625, "global_step": 416840, "epoch": 5022} {"train_loss": -26.375476837158203, "global_step": 416841, "epoch": 5022} {"train_loss": -26.755048751831055, "global_step": 416842, "epoch": 5022} {"train_loss": -26.564443588256836, "global_step": 416843, "epoch": 5022} {"train_loss": -26.405614852905273, "global_step": 416844, "epoch": 5022} {"train_loss": -26.63465690612793, "global_step": 416845, "epoch": 5022} {"train_loss": -26.436405181884766, "global_step": 416846, "epoch": 5022} {"train_loss": -26.5222225189209, "global_step": 416847, "epoch": 5022} {"train_loss": -26.723209381103516, "global_step": 416848, "epoch": 5022} {"train_loss": -26.480300903320312, "global_step": 416849, "epoch": 5022} {"train_loss": -26.48358154296875, "global_step": 416850, "epoch": 5022} {"train_loss": -26.368982315063477, "global_step": 416851, "epoch": 5022} {"train_loss": -26.59919548034668, "global_step": 416852, "epoch": 5022} {"train_loss": -26.621646881103516, "global_step": 416853, "epoch": 5022} {"train_loss": -26.859375, "global_step": 416854, "epoch": 5022} {"train_loss": -26.414844512939453, "global_step": 416855, "epoch": 5022} {"train_loss": -26.791372299194336, "global_step": 416856, "epoch": 5022} {"train_loss": -26.64234733581543, "global_step": 416857, "epoch": 5022} {"train_loss": -26.85141372680664, "global_step": 416858, "epoch": 5022} {"train_loss": -26.52984619140625, "global_step": 416859, "epoch": 5022} {"train_loss": -26.910959243774414, "global_step": 416860, "epoch": 5022} {"train_loss": -26.71860694885254, "global_step": 416861, "epoch": 5022} {"train_loss": -27.042407989501953, "global_step": 416862, "epoch": 5022} {"train_loss": -26.674896240234375, "global_step": 416863, "epoch": 5022} {"train_loss": -26.691099166870117, "global_step": 416864, "epoch": 5022} {"train_loss": -26.711170196533203, "global_step": 416865, "epoch": 5022} {"train_loss": -26.58344078063965, "global_step": 416866, "epoch": 5022} {"train_loss": -27.011266708374023, "global_step": 416867, "epoch": 5022} {"train_loss": -26.8043212890625, "global_step": 416868, "epoch": 5022} {"train_loss": -26.59720802307129, "global_step": 416869, "epoch": 5022} {"train_loss": -26.630971908569336, "global_step": 416870, "epoch": 5022} {"train_loss": -26.87932777404785, "global_step": 416871, "epoch": 5022} {"train_loss": -26.738101959228516, "global_step": 416872, "epoch": 5022} {"train_loss": -26.234445571899414, "global_step": 416873, "epoch": 5022} {"train_loss": -26.96833610534668, "global_step": 416874, "epoch": 5022} {"train_loss": -26.46784782409668, "global_step": 416875, "epoch": 5022} {"train_loss": -26.85072135925293, "global_step": 416876, "epoch": 5022} {"train_loss": -26.790388107299805, "global_step": 416877, "epoch": 5022} {"train_loss": -26.882715225219727, "global_step": 416878, "epoch": 5022} {"train_loss": -26.590856552124023, "global_step": 416879, "epoch": 5022} {"train_loss": -26.383167266845703, "global_step": 416880, "epoch": 5022} {"train_loss": -26.854990005493164, "global_step": 416881, "epoch": 5022} {"train_loss": -26.712202072143555, "global_step": 416882, "epoch": 5022} {"train_loss": -26.643320083618164, "global_step": 416883, "epoch": 5022} {"train_loss": -26.807050704956055, "global_step": 416884, "epoch": 5022} {"train_loss": -26.970550537109375, "global_step": 416885, "epoch": 5022} {"train_loss": -27.028167724609375, "global_step": 416886, "epoch": 5022} {"train_loss": -27.23726463317871, "global_step": 416887, "epoch": 5022} {"train_loss": -26.74946403503418, "global_step": 416888, "epoch": 5022} {"train_loss": -26.82881736755371, "global_step": 416889, "epoch": 5022} {"train_loss": -26.695117950439453, "global_step": 416890, "epoch": 5022} {"train_loss": -27.0747127532959, "global_step": 416891, "epoch": 5022} {"train_loss": -26.739994049072266, "global_step": 416892, "epoch": 5022} {"train_loss": -26.875995635986328, "global_step": 416893, "epoch": 5022} {"train_loss": -27.262033462524414, "global_step": 416894, "epoch": 5022} {"train_loss": -26.998022079467773, "global_step": 416895, "epoch": 5022} {"train_loss": -26.911529541015625, "global_step": 416896, "epoch": 5022} {"train_loss": -27.11049461364746, "global_step": 416897, "epoch": 5022} {"train_loss": -26.886444091796875, "global_step": 416898, "epoch": 5022} {"train_loss": -26.5457706451416, "global_step": 416899, "epoch": 5022} {"train_loss": -26.471759796142578, "global_step": 416900, "epoch": 5022} {"train_loss": -26.11604118347168, "global_step": 416901, "epoch": 5022} {"train_loss": -26.09779930114746, "global_step": 416902, "epoch": 5022} {"train_loss": -26.293548583984375, "global_step": 416903, "epoch": 5022} {"train_loss": -26.643224716186523, "global_step": 416904, "epoch": 5022} {"train_loss": -26.50836181640625, "global_step": 416905, "epoch": 5022} {"train_loss": -26.881549835205078, "global_step": 416906, "epoch": 5022} {"train_loss": -26.663610458374023, "global_step": 416907, "epoch": 5022} {"train_loss": -26.603889764073383, "global_step": 416908, "epoch": 5022, "val_loss": 6665517.0} {"train_loss": -25.452133178710938, "global_step": 416909, "epoch": 5023} {"train_loss": -25.07030487060547, "global_step": 416910, "epoch": 5023} {"train_loss": -25.346393585205078, "global_step": 416911, "epoch": 5023} {"train_loss": -25.959646224975586, "global_step": 416912, "epoch": 5023} {"train_loss": -25.45937156677246, "global_step": 416913, "epoch": 5023} {"train_loss": -26.309415817260742, "global_step": 416914, "epoch": 5023} {"train_loss": -25.942575454711914, "global_step": 416915, "epoch": 5023} {"train_loss": -25.990188598632812, "global_step": 416916, "epoch": 5023} {"train_loss": -25.90205192565918, "global_step": 416917, "epoch": 5023} {"train_loss": -25.8736572265625, "global_step": 416918, "epoch": 5023} {"train_loss": -25.92034912109375, "global_step": 416919, "epoch": 5023} {"train_loss": -26.4959716796875, "global_step": 416920, "epoch": 5023} {"train_loss": -26.10980796813965, "global_step": 416921, "epoch": 5023} {"train_loss": -26.489700317382812, "global_step": 416922, "epoch": 5023} {"train_loss": -26.40987205505371, "global_step": 416923, "epoch": 5023} {"train_loss": -26.478979110717773, "global_step": 416924, "epoch": 5023} {"train_loss": -26.5382137298584, "global_step": 416925, "epoch": 5023} {"train_loss": -26.285980224609375, "global_step": 416926, "epoch": 5023} {"train_loss": -26.69928550720215, "global_step": 416927, "epoch": 5023} {"train_loss": -26.291234970092773, "global_step": 416928, "epoch": 5023} {"train_loss": -26.394880294799805, "global_step": 416929, "epoch": 5023} {"train_loss": -26.66041374206543, "global_step": 416930, "epoch": 5023} {"train_loss": -26.41102409362793, "global_step": 416931, "epoch": 5023} {"train_loss": -26.670820236206055, "global_step": 416932, "epoch": 5023} {"train_loss": -26.578283309936523, "global_step": 416933, "epoch": 5023} {"train_loss": -26.528594970703125, "global_step": 416934, "epoch": 5023} {"train_loss": -26.6903076171875, "global_step": 416935, "epoch": 5023} {"train_loss": -26.80953025817871, "global_step": 416936, "epoch": 5023} {"train_loss": -26.711889266967773, "global_step": 416937, "epoch": 5023} {"train_loss": -26.770612716674805, "global_step": 416938, "epoch": 5023} {"train_loss": -26.90264320373535, "global_step": 416939, "epoch": 5023} {"train_loss": -26.77680778503418, "global_step": 416940, "epoch": 5023} {"train_loss": -26.710693359375, "global_step": 416941, "epoch": 5023} {"train_loss": -26.600341796875, "global_step": 416942, "epoch": 5023} {"train_loss": -26.992761611938477, "global_step": 416943, "epoch": 5023} {"train_loss": -26.834543228149414, "global_step": 416944, "epoch": 5023} {"train_loss": -27.083526611328125, "global_step": 416945, "epoch": 5023} {"train_loss": -27.014219284057617, "global_step": 416946, "epoch": 5023} {"train_loss": -26.695581436157227, "global_step": 416947, "epoch": 5023} {"train_loss": -26.60511589050293, "global_step": 416948, "epoch": 5023} {"train_loss": -26.983922958374023, "global_step": 416949, "epoch": 5023} {"train_loss": -26.852819442749023, "global_step": 416950, "epoch": 5023} {"train_loss": -26.606170654296875, "global_step": 416951, "epoch": 5023} {"train_loss": -26.947492599487305, "global_step": 416952, "epoch": 5023} {"train_loss": -26.598724365234375, "global_step": 416953, "epoch": 5023} {"train_loss": -26.783735275268555, "global_step": 416954, "epoch": 5023} {"train_loss": -27.192502975463867, "global_step": 416955, "epoch": 5023} {"train_loss": -27.224689483642578, "global_step": 416956, "epoch": 5023} {"train_loss": -26.61696434020996, "global_step": 416957, "epoch": 5023} {"train_loss": -27.131357192993164, "global_step": 416958, "epoch": 5023} {"train_loss": -27.33158302307129, "global_step": 416959, "epoch": 5023} {"train_loss": -27.055728912353516, "global_step": 416960, "epoch": 5023} {"train_loss": -27.023193359375, "global_step": 416961, "epoch": 5023} {"train_loss": -26.681161880493164, "global_step": 416962, "epoch": 5023} {"train_loss": -26.675390243530273, "global_step": 416963, "epoch": 5023} {"train_loss": -26.802072525024414, "global_step": 416964, "epoch": 5023} {"train_loss": -26.927515029907227, "global_step": 416965, "epoch": 5023} {"train_loss": -26.6003475189209, "global_step": 416966, "epoch": 5023} {"train_loss": -27.10004234313965, "global_step": 416967, "epoch": 5023} {"train_loss": -27.007108688354492, "global_step": 416968, "epoch": 5023} {"train_loss": -26.902637481689453, "global_step": 416969, "epoch": 5023} {"train_loss": -27.01338005065918, "global_step": 416970, "epoch": 5023} {"train_loss": -26.774412155151367, "global_step": 416971, "epoch": 5023} {"train_loss": -27.200870513916016, "global_step": 416972, "epoch": 5023} {"train_loss": -26.99928092956543, "global_step": 416973, "epoch": 5023} {"train_loss": -26.86310386657715, "global_step": 416974, "epoch": 5023} {"train_loss": -26.307758331298828, "global_step": 416975, "epoch": 5023} {"train_loss": -26.77338218688965, "global_step": 416976, "epoch": 5023} {"train_loss": -26.82000160217285, "global_step": 416977, "epoch": 5023} {"train_loss": -26.768753051757812, "global_step": 416978, "epoch": 5023} {"train_loss": -26.61781120300293, "global_step": 416979, "epoch": 5023} {"train_loss": -26.57346534729004, "global_step": 416980, "epoch": 5023} {"train_loss": -26.98345375061035, "global_step": 416981, "epoch": 5023} {"train_loss": -27.202503204345703, "global_step": 416982, "epoch": 5023} {"train_loss": -26.91681480407715, "global_step": 416983, "epoch": 5023} {"train_loss": -26.9412899017334, "global_step": 416984, "epoch": 5023} {"train_loss": -27.27924156188965, "global_step": 416985, "epoch": 5023} {"train_loss": -26.57826042175293, "global_step": 416986, "epoch": 5023} {"train_loss": -26.7205753326416, "global_step": 416987, "epoch": 5023} {"train_loss": -26.893112182617188, "global_step": 416988, "epoch": 5023} {"train_loss": -26.954654693603516, "global_step": 416989, "epoch": 5023} {"train_loss": -27.117597579956055, "global_step": 416990, "epoch": 5023} {"train_loss": -26.64123174368617, "global_step": 416991, "epoch": 5023, "val_loss": 6649782.0} {"train_loss": -26.62472915649414, "global_step": 416992, "epoch": 5024} {"train_loss": -26.913068771362305, "global_step": 416993, "epoch": 5024} {"train_loss": -26.480365753173828, "global_step": 416994, "epoch": 5024} {"train_loss": -26.358905792236328, "global_step": 416995, "epoch": 5024} {"train_loss": -26.955509185791016, "global_step": 416996, "epoch": 5024} {"train_loss": -26.60163688659668, "global_step": 416997, "epoch": 5024} {"train_loss": -26.754135131835938, "global_step": 416998, "epoch": 5024} {"train_loss": -26.623884201049805, "global_step": 416999, "epoch": 5024} {"train_loss": -26.815256118774414, "global_step": 417000, "epoch": 5024} {"train_loss": -26.456823348999023, "global_step": 417001, "epoch": 5024} {"train_loss": -26.857025146484375, "global_step": 417002, "epoch": 5024} {"train_loss": -27.0507755279541, "global_step": 417003, "epoch": 5024} {"train_loss": -26.543243408203125, "global_step": 417004, "epoch": 5024} {"train_loss": -26.7849063873291, "global_step": 417005, "epoch": 5024} {"train_loss": -26.45020866394043, "global_step": 417006, "epoch": 5024} {"train_loss": -26.7398624420166, "global_step": 417007, "epoch": 5024} {"train_loss": -26.610132217407227, "global_step": 417008, "epoch": 5024} {"train_loss": -26.506763458251953, "global_step": 417009, "epoch": 5024} {"train_loss": -26.980731964111328, "global_step": 417010, "epoch": 5024} {"train_loss": -26.804426193237305, "global_step": 417011, "epoch": 5024} {"train_loss": -26.061620712280273, "global_step": 417012, "epoch": 5024} {"train_loss": -26.26641273498535, "global_step": 417013, "epoch": 5024} {"train_loss": -26.136686325073242, "global_step": 417014, "epoch": 5024} {"train_loss": -26.95265769958496, "global_step": 417015, "epoch": 5024} {"train_loss": -26.4487247467041, "global_step": 417016, "epoch": 5024} {"train_loss": -27.031110763549805, "global_step": 417017, "epoch": 5024} {"train_loss": -26.32907485961914, "global_step": 417018, "epoch": 5024} {"train_loss": -27.179000854492188, "global_step": 417019, "epoch": 5024} {"train_loss": -26.58111000061035, "global_step": 417020, "epoch": 5024} {"train_loss": -26.507415771484375, "global_step": 417021, "epoch": 5024} {"train_loss": -27.027576446533203, "global_step": 417022, "epoch": 5024} {"train_loss": -26.723901748657227, "global_step": 417023, "epoch": 5024} {"train_loss": -26.925439834594727, "global_step": 417024, "epoch": 5024} {"train_loss": -27.226438522338867, "global_step": 417025, "epoch": 5024} {"train_loss": -26.74366569519043, "global_step": 417026, "epoch": 5024} {"train_loss": -26.555206298828125, "global_step": 417027, "epoch": 5024} {"train_loss": -26.945112228393555, "global_step": 417028, "epoch": 5024} {"train_loss": -26.601703643798828, "global_step": 417029, "epoch": 5024} {"train_loss": -26.595335006713867, "global_step": 417030, "epoch": 5024} {"train_loss": -26.732934951782227, "global_step": 417031, "epoch": 5024} {"train_loss": -26.640649795532227, "global_step": 417032, "epoch": 5024} {"train_loss": -26.800312042236328, "global_step": 417033, "epoch": 5024} {"train_loss": -26.995697021484375, "global_step": 417034, "epoch": 5024} {"train_loss": -26.664640426635742, "global_step": 417035, "epoch": 5024} {"train_loss": -26.65052604675293, "global_step": 417036, "epoch": 5024} {"train_loss": -26.733631134033203, "global_step": 417037, "epoch": 5024} {"train_loss": -26.960660934448242, "global_step": 417038, "epoch": 5024} {"train_loss": -27.27701759338379, "global_step": 417039, "epoch": 5024} {"train_loss": -26.8287353515625, "global_step": 417040, "epoch": 5024} {"train_loss": -27.032773971557617, "global_step": 417041, "epoch": 5024} {"train_loss": -27.02886962890625, "global_step": 417042, "epoch": 5024} {"train_loss": -26.879663467407227, "global_step": 417043, "epoch": 5024} {"train_loss": -27.364938735961914, "global_step": 417044, "epoch": 5024} {"train_loss": -27.18763542175293, "global_step": 417045, "epoch": 5024} {"train_loss": -27.18723487854004, "global_step": 417046, "epoch": 5024} {"train_loss": -26.747058868408203, "global_step": 417047, "epoch": 5024} {"train_loss": -26.753034591674805, "global_step": 417048, "epoch": 5024} {"train_loss": -26.78668785095215, "global_step": 417049, "epoch": 5024} {"train_loss": -27.063125610351562, "global_step": 417050, "epoch": 5024} {"train_loss": -27.102758407592773, "global_step": 417051, "epoch": 5024} {"train_loss": -26.883264541625977, "global_step": 417052, "epoch": 5024} {"train_loss": -26.876867294311523, "global_step": 417053, "epoch": 5024} {"train_loss": -26.5916690826416, "global_step": 417054, "epoch": 5024} {"train_loss": -26.75258445739746, "global_step": 417055, "epoch": 5024} {"train_loss": -27.09394645690918, "global_step": 417056, "epoch": 5024} {"train_loss": -26.784101486206055, "global_step": 417057, "epoch": 5024} {"train_loss": -27.295597076416016, "global_step": 417058, "epoch": 5024} {"train_loss": -26.838367462158203, "global_step": 417059, "epoch": 5024} {"train_loss": -27.01349449157715, "global_step": 417060, "epoch": 5024} {"train_loss": -26.84083366394043, "global_step": 417061, "epoch": 5024} {"train_loss": -26.957870483398438, "global_step": 417062, "epoch": 5024} {"train_loss": -26.881032943725586, "global_step": 417063, "epoch": 5024} {"train_loss": -27.035608291625977, "global_step": 417064, "epoch": 5024} {"train_loss": -27.1231632232666, "global_step": 417065, "epoch": 5024} {"train_loss": -26.70704460144043, "global_step": 417066, "epoch": 5024} {"train_loss": -26.47499656677246, "global_step": 417067, "epoch": 5024} {"train_loss": -26.6124324798584, "global_step": 417068, "epoch": 5024} {"train_loss": -26.608850479125977, "global_step": 417069, "epoch": 5024} {"train_loss": -26.595861434936523, "global_step": 417070, "epoch": 5024} {"train_loss": -26.178476333618164, "global_step": 417071, "epoch": 5024} {"train_loss": -26.322858810424805, "global_step": 417072, "epoch": 5024} {"train_loss": -26.486282348632812, "global_step": 417073, "epoch": 5024} {"train_loss": -26.75169970041298, "global_step": 417074, "epoch": 5024, "val_loss": 6746197.0} {"train_loss": -24.91236114501953, "global_step": 417075, "epoch": 5025} {"train_loss": -23.321884155273438, "global_step": 417076, "epoch": 5025} {"train_loss": -24.920141220092773, "global_step": 417077, "epoch": 5025} {"train_loss": -25.912281036376953, "global_step": 417078, "epoch": 5025} {"train_loss": -25.41010284423828, "global_step": 417079, "epoch": 5025} {"train_loss": -26.014190673828125, "global_step": 417080, "epoch": 5025} {"train_loss": -25.99956703186035, "global_step": 417081, "epoch": 5025} {"train_loss": -25.46198272705078, "global_step": 417082, "epoch": 5025} {"train_loss": -25.988677978515625, "global_step": 417083, "epoch": 5025} {"train_loss": -25.681720733642578, "global_step": 417084, "epoch": 5025} {"train_loss": -25.63642692565918, "global_step": 417085, "epoch": 5025} {"train_loss": -25.621755599975586, "global_step": 417086, "epoch": 5025} {"train_loss": -25.890625, "global_step": 417087, "epoch": 5025} {"train_loss": -25.984338760375977, "global_step": 417088, "epoch": 5025} {"train_loss": -26.081457138061523, "global_step": 417089, "epoch": 5025} {"train_loss": -25.90789794921875, "global_step": 417090, "epoch": 5025} {"train_loss": -25.972726821899414, "global_step": 417091, "epoch": 5025} {"train_loss": -26.260190963745117, "global_step": 417092, "epoch": 5025} {"train_loss": -26.2530517578125, "global_step": 417093, "epoch": 5025} {"train_loss": -26.333703994750977, "global_step": 417094, "epoch": 5025} {"train_loss": -26.591100692749023, "global_step": 417095, "epoch": 5025} {"train_loss": -26.191381454467773, "global_step": 417096, "epoch": 5025} {"train_loss": -26.440860748291016, "global_step": 417097, "epoch": 5025} {"train_loss": -26.352466583251953, "global_step": 417098, "epoch": 5025} {"train_loss": -26.153827667236328, "global_step": 417099, "epoch": 5025} {"train_loss": -26.64112663269043, "global_step": 417100, "epoch": 5025} {"train_loss": -26.794702529907227, "global_step": 417101, "epoch": 5025} {"train_loss": -26.435712814331055, "global_step": 417102, "epoch": 5025} {"train_loss": -26.6479434967041, "global_step": 417103, "epoch": 5025} {"train_loss": -26.32220458984375, "global_step": 417104, "epoch": 5025} {"train_loss": -26.489032745361328, "global_step": 417105, "epoch": 5025} {"train_loss": -26.58785057067871, "global_step": 417106, "epoch": 5025} {"train_loss": -26.525060653686523, "global_step": 417107, "epoch": 5025} {"train_loss": -26.469741821289062, "global_step": 417108, "epoch": 5025} {"train_loss": -26.650115966796875, "global_step": 417109, "epoch": 5025} {"train_loss": -26.70987892150879, "global_step": 417110, "epoch": 5025} {"train_loss": -26.99028968811035, "global_step": 417111, "epoch": 5025} {"train_loss": -26.583740234375, "global_step": 417112, "epoch": 5025} {"train_loss": -27.02898597717285, "global_step": 417113, "epoch": 5025} {"train_loss": -26.518146514892578, "global_step": 417114, "epoch": 5025} {"train_loss": -26.744186401367188, "global_step": 417115, "epoch": 5025} {"train_loss": -26.88416862487793, "global_step": 417116, "epoch": 5025} {"train_loss": -27.145551681518555, "global_step": 417117, "epoch": 5025} {"train_loss": -26.95236587524414, "global_step": 417118, "epoch": 5025} {"train_loss": -26.76922607421875, "global_step": 417119, "epoch": 5025} {"train_loss": -26.649133682250977, "global_step": 417120, "epoch": 5025} {"train_loss": -26.808368682861328, "global_step": 417121, "epoch": 5025} {"train_loss": -26.908910751342773, "global_step": 417122, "epoch": 5025} {"train_loss": -26.543384552001953, "global_step": 417123, "epoch": 5025} {"train_loss": -27.008392333984375, "global_step": 417124, "epoch": 5025} {"train_loss": -26.700281143188477, "global_step": 417125, "epoch": 5025} {"train_loss": -26.88494300842285, "global_step": 417126, "epoch": 5025} {"train_loss": -26.542938232421875, "global_step": 417127, "epoch": 5025} {"train_loss": -26.723989486694336, "global_step": 417128, "epoch": 5025} {"train_loss": -26.835620880126953, "global_step": 417129, "epoch": 5025} {"train_loss": -26.805639266967773, "global_step": 417130, "epoch": 5025} {"train_loss": -27.26417350769043, "global_step": 417131, "epoch": 5025} {"train_loss": -26.821613311767578, "global_step": 417132, "epoch": 5025} {"train_loss": -26.927637100219727, "global_step": 417133, "epoch": 5025} {"train_loss": -27.088171005249023, "global_step": 417134, "epoch": 5025} {"train_loss": -26.621068954467773, "global_step": 417135, "epoch": 5025} {"train_loss": -27.123132705688477, "global_step": 417136, "epoch": 5025} {"train_loss": -26.853076934814453, "global_step": 417137, "epoch": 5025} {"train_loss": -26.869794845581055, "global_step": 417138, "epoch": 5025} {"train_loss": -26.774316787719727, "global_step": 417139, "epoch": 5025} {"train_loss": -27.052520751953125, "global_step": 417140, "epoch": 5025} {"train_loss": -26.796497344970703, "global_step": 417141, "epoch": 5025} {"train_loss": -26.377899169921875, "global_step": 417142, "epoch": 5025} {"train_loss": -26.931928634643555, "global_step": 417143, "epoch": 5025} {"train_loss": -26.706430435180664, "global_step": 417144, "epoch": 5025} {"train_loss": -26.985116958618164, "global_step": 417145, "epoch": 5025} {"train_loss": -26.863245010375977, "global_step": 417146, "epoch": 5025} {"train_loss": -27.025293350219727, "global_step": 417147, "epoch": 5025} {"train_loss": -27.09064292907715, "global_step": 417148, "epoch": 5025} {"train_loss": -26.956830978393555, "global_step": 417149, "epoch": 5025} {"train_loss": -27.16473960876465, "global_step": 417150, "epoch": 5025} {"train_loss": -26.898895263671875, "global_step": 417151, "epoch": 5025} {"train_loss": -27.01582145690918, "global_step": 417152, "epoch": 5025} {"train_loss": -26.993804931640625, "global_step": 417153, "epoch": 5025} {"train_loss": -26.687835693359375, "global_step": 417154, "epoch": 5025} {"train_loss": -26.74395751953125, "global_step": 417155, "epoch": 5025} {"train_loss": -26.82013511657715, "global_step": 417156, "epoch": 5025} {"train_loss": -26.500590542712843, "global_step": 417157, "epoch": 5025, "val_loss": 6719348.0} {"train_loss": -26.45163345336914, "global_step": 417158, "epoch": 5026} {"train_loss": -25.30124282836914, "global_step": 417159, "epoch": 5026} {"train_loss": -25.2939453125, "global_step": 417160, "epoch": 5026} {"train_loss": -25.589736938476562, "global_step": 417161, "epoch": 5026} {"train_loss": -25.89117431640625, "global_step": 417162, "epoch": 5026} {"train_loss": -26.313013076782227, "global_step": 417163, "epoch": 5026} {"train_loss": -25.8439998626709, "global_step": 417164, "epoch": 5026} {"train_loss": -25.927221298217773, "global_step": 417165, "epoch": 5026} {"train_loss": -26.583740234375, "global_step": 417166, "epoch": 5026} {"train_loss": -25.9229679107666, "global_step": 417167, "epoch": 5026} {"train_loss": -26.166015625, "global_step": 417168, "epoch": 5026} {"train_loss": -26.26479148864746, "global_step": 417169, "epoch": 5026} {"train_loss": -25.770130157470703, "global_step": 417170, "epoch": 5026} {"train_loss": -25.9150333404541, "global_step": 417171, "epoch": 5026} {"train_loss": -26.696186065673828, "global_step": 417172, "epoch": 5026} {"train_loss": -26.07599449157715, "global_step": 417173, "epoch": 5026} {"train_loss": -26.717687606811523, "global_step": 417174, "epoch": 5026} {"train_loss": -26.534473419189453, "global_step": 417175, "epoch": 5026} {"train_loss": -26.450122833251953, "global_step": 417176, "epoch": 5026} {"train_loss": -26.847949981689453, "global_step": 417177, "epoch": 5026} {"train_loss": -26.681716918945312, "global_step": 417178, "epoch": 5026} {"train_loss": -26.89255714416504, "global_step": 417179, "epoch": 5026} {"train_loss": -26.838300704956055, "global_step": 417180, "epoch": 5026} {"train_loss": -26.350006103515625, "global_step": 417181, "epoch": 5026} {"train_loss": -26.548749923706055, "global_step": 417182, "epoch": 5026} {"train_loss": -26.794214248657227, "global_step": 417183, "epoch": 5026} {"train_loss": -26.556509017944336, "global_step": 417184, "epoch": 5026} {"train_loss": -26.80389976501465, "global_step": 417185, "epoch": 5026} {"train_loss": -26.427642822265625, "global_step": 417186, "epoch": 5026} {"train_loss": -26.7794132232666, "global_step": 417187, "epoch": 5026} {"train_loss": -26.9808349609375, "global_step": 417188, "epoch": 5026} {"train_loss": -26.822431564331055, "global_step": 417189, "epoch": 5026} {"train_loss": -26.8914794921875, "global_step": 417190, "epoch": 5026} {"train_loss": -26.762266159057617, "global_step": 417191, "epoch": 5026} {"train_loss": -26.92914390563965, "global_step": 417192, "epoch": 5026} {"train_loss": -27.013120651245117, "global_step": 417193, "epoch": 5026} {"train_loss": -26.895771026611328, "global_step": 417194, "epoch": 5026} {"train_loss": -26.849328994750977, "global_step": 417195, "epoch": 5026} {"train_loss": -26.87326431274414, "global_step": 417196, "epoch": 5026} {"train_loss": -26.874807357788086, "global_step": 417197, "epoch": 5026} {"train_loss": -27.094762802124023, "global_step": 417198, "epoch": 5026} {"train_loss": -26.734792709350586, "global_step": 417199, "epoch": 5026} {"train_loss": -27.154468536376953, "global_step": 417200, "epoch": 5026} {"train_loss": -26.63067626953125, "global_step": 417201, "epoch": 5026} {"train_loss": -27.294301986694336, "global_step": 417202, "epoch": 5026} {"train_loss": -27.252857208251953, "global_step": 417203, "epoch": 5026} {"train_loss": -26.861770629882812, "global_step": 417204, "epoch": 5026} {"train_loss": -26.982131958007812, "global_step": 417205, "epoch": 5026} {"train_loss": -26.96649169921875, "global_step": 417206, "epoch": 5026} {"train_loss": -26.688634872436523, "global_step": 417207, "epoch": 5026} {"train_loss": -27.105316162109375, "global_step": 417208, "epoch": 5026} {"train_loss": -27.053991317749023, "global_step": 417209, "epoch": 5026} {"train_loss": -27.29066276550293, "global_step": 417210, "epoch": 5026} {"train_loss": -26.92691993713379, "global_step": 417211, "epoch": 5026} {"train_loss": -26.705799102783203, "global_step": 417212, "epoch": 5026} {"train_loss": -27.157575607299805, "global_step": 417213, "epoch": 5026} {"train_loss": -26.76239013671875, "global_step": 417214, "epoch": 5026} {"train_loss": -26.55269432067871, "global_step": 417215, "epoch": 5026} {"train_loss": -26.514495849609375, "global_step": 417216, "epoch": 5026} {"train_loss": -25.8409423828125, "global_step": 417217, "epoch": 5026} {"train_loss": -26.226409912109375, "global_step": 417218, "epoch": 5026} {"train_loss": -26.426837921142578, "global_step": 417219, "epoch": 5026} {"train_loss": -26.051877975463867, "global_step": 417220, "epoch": 5026} {"train_loss": -26.574630737304688, "global_step": 417221, "epoch": 5026} {"train_loss": -26.813276290893555, "global_step": 417222, "epoch": 5026} {"train_loss": -26.546924591064453, "global_step": 417223, "epoch": 5026} {"train_loss": -26.730947494506836, "global_step": 417224, "epoch": 5026} {"train_loss": -26.037906646728516, "global_step": 417225, "epoch": 5026} {"train_loss": -26.894460678100586, "global_step": 417226, "epoch": 5026} {"train_loss": -26.378559112548828, "global_step": 417227, "epoch": 5026} {"train_loss": -26.340803146362305, "global_step": 417228, "epoch": 5026} {"train_loss": -26.425617218017578, "global_step": 417229, "epoch": 5026} {"train_loss": -26.88007926940918, "global_step": 417230, "epoch": 5026} {"train_loss": -26.440454483032227, "global_step": 417231, "epoch": 5026} {"train_loss": -26.73687744140625, "global_step": 417232, "epoch": 5026} {"train_loss": -26.759382247924805, "global_step": 417233, "epoch": 5026} {"train_loss": -26.214374542236328, "global_step": 417234, "epoch": 5026} {"train_loss": -26.21296501159668, "global_step": 417235, "epoch": 5026} {"train_loss": -26.239852905273438, "global_step": 417236, "epoch": 5026} {"train_loss": -26.652057647705078, "global_step": 417237, "epoch": 5026} {"train_loss": -26.668676376342773, "global_step": 417238, "epoch": 5026} {"train_loss": -26.499189376831055, "global_step": 417239, "epoch": 5026} {"train_loss": -26.584606768137, "global_step": 417240, "epoch": 5026, "val_loss": 6612982.0} {"train_loss": -26.41650390625, "global_step": 417241, "epoch": 5027} {"train_loss": -26.366870880126953, "global_step": 417242, "epoch": 5027} {"train_loss": -26.75665283203125, "global_step": 417243, "epoch": 5027} {"train_loss": -26.103071212768555, "global_step": 417244, "epoch": 5027} {"train_loss": -26.4905948638916, "global_step": 417245, "epoch": 5027} {"train_loss": -26.326068878173828, "global_step": 417246, "epoch": 5027} {"train_loss": -26.491933822631836, "global_step": 417247, "epoch": 5027} {"train_loss": -26.692060470581055, "global_step": 417248, "epoch": 5027} {"train_loss": -26.569482803344727, "global_step": 417249, "epoch": 5027} {"train_loss": -26.600482940673828, "global_step": 417250, "epoch": 5027} {"train_loss": -26.636816024780273, "global_step": 417251, "epoch": 5027} {"train_loss": -26.8325252532959, "global_step": 417252, "epoch": 5027} {"train_loss": -26.546466827392578, "global_step": 417253, "epoch": 5027} {"train_loss": -26.346105575561523, "global_step": 417254, "epoch": 5027} {"train_loss": -26.637853622436523, "global_step": 417255, "epoch": 5027} {"train_loss": -26.745512008666992, "global_step": 417256, "epoch": 5027} {"train_loss": -26.25648307800293, "global_step": 417257, "epoch": 5027} {"train_loss": -26.57295036315918, "global_step": 417258, "epoch": 5027} {"train_loss": -26.749820709228516, "global_step": 417259, "epoch": 5027} {"train_loss": -26.48060417175293, "global_step": 417260, "epoch": 5027} {"train_loss": -26.664337158203125, "global_step": 417261, "epoch": 5027} {"train_loss": -26.53373146057129, "global_step": 417262, "epoch": 5027} {"train_loss": -26.560514450073242, "global_step": 417263, "epoch": 5027} {"train_loss": -26.681577682495117, "global_step": 417264, "epoch": 5027} {"train_loss": -26.79841423034668, "global_step": 417265, "epoch": 5027} {"train_loss": -26.386722564697266, "global_step": 417266, "epoch": 5027} {"train_loss": -26.69716453552246, "global_step": 417267, "epoch": 5027} {"train_loss": -26.853925704956055, "global_step": 417268, "epoch": 5027} {"train_loss": -26.614831924438477, "global_step": 417269, "epoch": 5027} {"train_loss": -26.734268188476562, "global_step": 417270, "epoch": 5027} {"train_loss": -26.8110408782959, "global_step": 417271, "epoch": 5027} {"train_loss": -26.513181686401367, "global_step": 417272, "epoch": 5027} {"train_loss": -27.028076171875, "global_step": 417273, "epoch": 5027} {"train_loss": -26.85322380065918, "global_step": 417274, "epoch": 5027} {"train_loss": -26.78205680847168, "global_step": 417275, "epoch": 5027} {"train_loss": -26.813825607299805, "global_step": 417276, "epoch": 5027} {"train_loss": -26.732666015625, "global_step": 417277, "epoch": 5027} {"train_loss": -26.7059268951416, "global_step": 417278, "epoch": 5027} {"train_loss": -26.477310180664062, "global_step": 417279, "epoch": 5027} {"train_loss": -26.2636775970459, "global_step": 417280, "epoch": 5027} {"train_loss": -26.585935592651367, "global_step": 417281, "epoch": 5027} {"train_loss": -26.65508460998535, "global_step": 417282, "epoch": 5027} {"train_loss": -26.446990966796875, "global_step": 417283, "epoch": 5027} {"train_loss": -25.816879272460938, "global_step": 417284, "epoch": 5027} {"train_loss": -26.63445472717285, "global_step": 417285, "epoch": 5027} {"train_loss": -26.9855899810791, "global_step": 417286, "epoch": 5027} {"train_loss": -26.71148681640625, "global_step": 417287, "epoch": 5027} {"train_loss": -26.7541561126709, "global_step": 417288, "epoch": 5027} {"train_loss": -26.414142608642578, "global_step": 417289, "epoch": 5027} {"train_loss": -26.46306800842285, "global_step": 417290, "epoch": 5027} {"train_loss": -26.51771354675293, "global_step": 417291, "epoch": 5027} {"train_loss": -26.5544490814209, "global_step": 417292, "epoch": 5027} {"train_loss": -26.29510498046875, "global_step": 417293, "epoch": 5027} {"train_loss": -26.573684692382812, "global_step": 417294, "epoch": 5027} {"train_loss": -26.756580352783203, "global_step": 417295, "epoch": 5027} {"train_loss": -26.899463653564453, "global_step": 417296, "epoch": 5027} {"train_loss": -26.804306030273438, "global_step": 417297, "epoch": 5027} {"train_loss": -27.17896842956543, "global_step": 417298, "epoch": 5027} {"train_loss": -26.51908302307129, "global_step": 417299, "epoch": 5027} {"train_loss": -26.678518295288086, "global_step": 417300, "epoch": 5027} {"train_loss": -26.190778732299805, "global_step": 417301, "epoch": 5027} {"train_loss": -26.61781883239746, "global_step": 417302, "epoch": 5027} {"train_loss": -26.5792236328125, "global_step": 417303, "epoch": 5027} {"train_loss": -27.015317916870117, "global_step": 417304, "epoch": 5027} {"train_loss": -26.487985610961914, "global_step": 417305, "epoch": 5027} {"train_loss": -26.605154037475586, "global_step": 417306, "epoch": 5027} {"train_loss": -26.8577938079834, "global_step": 417307, "epoch": 5027} {"train_loss": -26.7887020111084, "global_step": 417308, "epoch": 5027} {"train_loss": -26.87088966369629, "global_step": 417309, "epoch": 5027} {"train_loss": -26.608118057250977, "global_step": 417310, "epoch": 5027} {"train_loss": -26.44722557067871, "global_step": 417311, "epoch": 5027} {"train_loss": -26.848600387573242, "global_step": 417312, "epoch": 5027} {"train_loss": -26.86475944519043, "global_step": 417313, "epoch": 5027} {"train_loss": -27.053394317626953, "global_step": 417314, "epoch": 5027} {"train_loss": -26.97304344177246, "global_step": 417315, "epoch": 5027} {"train_loss": -26.868650436401367, "global_step": 417316, "epoch": 5027} {"train_loss": -26.808902740478516, "global_step": 417317, "epoch": 5027} {"train_loss": -26.8745174407959, "global_step": 417318, "epoch": 5027} {"train_loss": -26.463489532470703, "global_step": 417319, "epoch": 5027} {"train_loss": -26.556793212890625, "global_step": 417320, "epoch": 5027} {"train_loss": -26.830778121948242, "global_step": 417321, "epoch": 5027} {"train_loss": -26.752429962158203, "global_step": 417322, "epoch": 5027} {"train_loss": -26.643622823508387, "global_step": 417323, "epoch": 5027, "val_loss": 6705126.0} {"train_loss": -26.460372924804688, "global_step": 417324, "epoch": 5028} {"train_loss": -26.44077491760254, "global_step": 417325, "epoch": 5028} {"train_loss": -26.718244552612305, "global_step": 417326, "epoch": 5028} {"train_loss": -26.37647819519043, "global_step": 417327, "epoch": 5028} {"train_loss": -26.30682945251465, "global_step": 417328, "epoch": 5028} {"train_loss": -26.48272705078125, "global_step": 417329, "epoch": 5028} {"train_loss": -26.4305419921875, "global_step": 417330, "epoch": 5028} {"train_loss": -26.48175621032715, "global_step": 417331, "epoch": 5028} {"train_loss": -25.9628963470459, "global_step": 417332, "epoch": 5028} {"train_loss": -26.212995529174805, "global_step": 417333, "epoch": 5028} {"train_loss": -26.36052894592285, "global_step": 417334, "epoch": 5028} {"train_loss": -26.50160026550293, "global_step": 417335, "epoch": 5028} {"train_loss": -26.620996475219727, "global_step": 417336, "epoch": 5028} {"train_loss": -26.4979305267334, "global_step": 417337, "epoch": 5028} {"train_loss": -26.652759552001953, "global_step": 417338, "epoch": 5028} {"train_loss": -26.872339248657227, "global_step": 417339, "epoch": 5028} {"train_loss": -26.50082778930664, "global_step": 417340, "epoch": 5028} {"train_loss": -26.442626953125, "global_step": 417341, "epoch": 5028} {"train_loss": -26.900476455688477, "global_step": 417342, "epoch": 5028} {"train_loss": -26.899494171142578, "global_step": 417343, "epoch": 5028} {"train_loss": -26.448974609375, "global_step": 417344, "epoch": 5028} {"train_loss": -26.51759147644043, "global_step": 417345, "epoch": 5028} {"train_loss": -26.654752731323242, "global_step": 417346, "epoch": 5028} {"train_loss": -26.8533935546875, "global_step": 417347, "epoch": 5028} {"train_loss": -26.737152099609375, "global_step": 417348, "epoch": 5028} {"train_loss": -26.9753475189209, "global_step": 417349, "epoch": 5028} {"train_loss": -27.032821655273438, "global_step": 417350, "epoch": 5028} {"train_loss": -26.631244659423828, "global_step": 417351, "epoch": 5028} {"train_loss": -27.056859970092773, "global_step": 417352, "epoch": 5028} {"train_loss": -26.60633659362793, "global_step": 417353, "epoch": 5028} {"train_loss": -27.079282760620117, "global_step": 417354, "epoch": 5028} {"train_loss": -26.718503952026367, "global_step": 417355, "epoch": 5028} {"train_loss": -26.79878807067871, "global_step": 417356, "epoch": 5028} {"train_loss": -27.063207626342773, "global_step": 417357, "epoch": 5028} {"train_loss": -27.133472442626953, "global_step": 417358, "epoch": 5028} {"train_loss": -27.292648315429688, "global_step": 417359, "epoch": 5028} {"train_loss": -26.9818172454834, "global_step": 417360, "epoch": 5028} {"train_loss": -26.95075798034668, "global_step": 417361, "epoch": 5028} {"train_loss": -27.227399826049805, "global_step": 417362, "epoch": 5028} {"train_loss": -26.95953369140625, "global_step": 417363, "epoch": 5028} {"train_loss": -26.78948402404785, "global_step": 417364, "epoch": 5028} {"train_loss": -26.743642807006836, "global_step": 417365, "epoch": 5028} {"train_loss": -26.630847930908203, "global_step": 417366, "epoch": 5028} {"train_loss": -26.715808868408203, "global_step": 417367, "epoch": 5028} {"train_loss": -26.990468978881836, "global_step": 417368, "epoch": 5028} {"train_loss": -26.7611141204834, "global_step": 417369, "epoch": 5028} {"train_loss": -27.242406845092773, "global_step": 417370, "epoch": 5028} {"train_loss": -27.3234920501709, "global_step": 417371, "epoch": 5028} {"train_loss": -26.612857818603516, "global_step": 417372, "epoch": 5028} {"train_loss": -26.19704246520996, "global_step": 417373, "epoch": 5028} {"train_loss": -26.668676376342773, "global_step": 417374, "epoch": 5028} {"train_loss": -26.63630485534668, "global_step": 417375, "epoch": 5028} {"train_loss": -26.54363441467285, "global_step": 417376, "epoch": 5028} {"train_loss": -26.7386474609375, "global_step": 417377, "epoch": 5028} {"train_loss": -26.551237106323242, "global_step": 417378, "epoch": 5028} {"train_loss": -26.717947006225586, "global_step": 417379, "epoch": 5028} {"train_loss": -26.544355392456055, "global_step": 417380, "epoch": 5028} {"train_loss": -26.937833786010742, "global_step": 417381, "epoch": 5028} {"train_loss": -26.960681915283203, "global_step": 417382, "epoch": 5028} {"train_loss": -26.731552124023438, "global_step": 417383, "epoch": 5028} {"train_loss": -26.402677536010742, "global_step": 417384, "epoch": 5028} {"train_loss": -26.883594512939453, "global_step": 417385, "epoch": 5028} {"train_loss": -26.91163444519043, "global_step": 417386, "epoch": 5028} {"train_loss": -26.60056495666504, "global_step": 417387, "epoch": 5028} {"train_loss": -27.018171310424805, "global_step": 417388, "epoch": 5028} {"train_loss": -26.491622924804688, "global_step": 417389, "epoch": 5028} {"train_loss": -27.076553344726562, "global_step": 417390, "epoch": 5028} {"train_loss": -26.70184898376465, "global_step": 417391, "epoch": 5028} {"train_loss": -27.0044002532959, "global_step": 417392, "epoch": 5028} {"train_loss": -26.611927032470703, "global_step": 417393, "epoch": 5028} {"train_loss": -27.068140029907227, "global_step": 417394, "epoch": 5028} {"train_loss": -26.94697380065918, "global_step": 417395, "epoch": 5028} {"train_loss": -26.943506240844727, "global_step": 417396, "epoch": 5028} {"train_loss": -26.708478927612305, "global_step": 417397, "epoch": 5028} {"train_loss": -27.09130859375, "global_step": 417398, "epoch": 5028} {"train_loss": -26.644392013549805, "global_step": 417399, "epoch": 5028} {"train_loss": -26.633747100830078, "global_step": 417400, "epoch": 5028} {"train_loss": -26.87578773498535, "global_step": 417401, "epoch": 5028} {"train_loss": -27.18646812438965, "global_step": 417402, "epoch": 5028} {"train_loss": -26.596893310546875, "global_step": 417403, "epoch": 5028} {"train_loss": -26.165189743041992, "global_step": 417404, "epoch": 5028} {"train_loss": -26.35035514831543, "global_step": 417405, "epoch": 5028} {"train_loss": -26.714803167136317, "global_step": 417406, "epoch": 5028, "val_loss": 6573688.5} {"train_loss": -26.26621437072754, "global_step": 417407, "epoch": 5029} {"train_loss": -26.515363693237305, "global_step": 417408, "epoch": 5029} {"train_loss": -26.531213760375977, "global_step": 417409, "epoch": 5029} {"train_loss": -26.596708297729492, "global_step": 417410, "epoch": 5029} {"train_loss": -26.754047393798828, "global_step": 417411, "epoch": 5029} {"train_loss": -26.2386417388916, "global_step": 417412, "epoch": 5029} {"train_loss": -26.149200439453125, "global_step": 417413, "epoch": 5029} {"train_loss": -26.558135986328125, "global_step": 417414, "epoch": 5029} {"train_loss": -26.49749755859375, "global_step": 417415, "epoch": 5029} {"train_loss": -26.2285213470459, "global_step": 417416, "epoch": 5029} {"train_loss": -26.60220718383789, "global_step": 417417, "epoch": 5029} {"train_loss": -26.517614364624023, "global_step": 417418, "epoch": 5029} {"train_loss": -26.717443466186523, "global_step": 417419, "epoch": 5029} {"train_loss": -26.70660972595215, "global_step": 417420, "epoch": 5029} {"train_loss": -26.373971939086914, "global_step": 417421, "epoch": 5029} {"train_loss": -26.66975975036621, "global_step": 417422, "epoch": 5029} {"train_loss": -26.607330322265625, "global_step": 417423, "epoch": 5029} {"train_loss": -26.45256996154785, "global_step": 417424, "epoch": 5029} {"train_loss": -26.551788330078125, "global_step": 417425, "epoch": 5029} {"train_loss": -26.780872344970703, "global_step": 417426, "epoch": 5029} {"train_loss": -26.500244140625, "global_step": 417427, "epoch": 5029} {"train_loss": -26.48044204711914, "global_step": 417428, "epoch": 5029} {"train_loss": -26.632104873657227, "global_step": 417429, "epoch": 5029} {"train_loss": -26.641632080078125, "global_step": 417430, "epoch": 5029} {"train_loss": -26.604894638061523, "global_step": 417431, "epoch": 5029} {"train_loss": -26.59114646911621, "global_step": 417432, "epoch": 5029} {"train_loss": -26.648944854736328, "global_step": 417433, "epoch": 5029} {"train_loss": -26.713211059570312, "global_step": 417434, "epoch": 5029} {"train_loss": -26.284072875976562, "global_step": 417435, "epoch": 5029} {"train_loss": -26.873807907104492, "global_step": 417436, "epoch": 5029} {"train_loss": -26.732269287109375, "global_step": 417437, "epoch": 5029} {"train_loss": -27.0493221282959, "global_step": 417438, "epoch": 5029} {"train_loss": -26.87548828125, "global_step": 417439, "epoch": 5029} {"train_loss": -26.9791259765625, "global_step": 417440, "epoch": 5029} {"train_loss": -26.754413604736328, "global_step": 417441, "epoch": 5029} {"train_loss": -26.81070899963379, "global_step": 417442, "epoch": 5029} {"train_loss": -26.79595947265625, "global_step": 417443, "epoch": 5029} {"train_loss": -26.691816329956055, "global_step": 417444, "epoch": 5029} {"train_loss": -26.88092041015625, "global_step": 417445, "epoch": 5029} {"train_loss": -27.007984161376953, "global_step": 417446, "epoch": 5029} {"train_loss": -27.012805938720703, "global_step": 417447, "epoch": 5029} {"train_loss": -27.122577667236328, "global_step": 417448, "epoch": 5029} {"train_loss": -26.84254264831543, "global_step": 417449, "epoch": 5029} {"train_loss": -26.897876739501953, "global_step": 417450, "epoch": 5029} {"train_loss": -27.2109317779541, "global_step": 417451, "epoch": 5029} {"train_loss": -26.502309799194336, "global_step": 417452, "epoch": 5029} {"train_loss": -27.1524715423584, "global_step": 417453, "epoch": 5029} {"train_loss": -26.756940841674805, "global_step": 417454, "epoch": 5029} {"train_loss": -27.001249313354492, "global_step": 417455, "epoch": 5029} {"train_loss": -26.840118408203125, "global_step": 417456, "epoch": 5029} {"train_loss": -26.287982940673828, "global_step": 417457, "epoch": 5029} {"train_loss": -26.652511596679688, "global_step": 417458, "epoch": 5029} {"train_loss": -26.465810775756836, "global_step": 417459, "epoch": 5029} {"train_loss": -26.41499137878418, "global_step": 417460, "epoch": 5029} {"train_loss": -27.033618927001953, "global_step": 417461, "epoch": 5029} {"train_loss": -26.872167587280273, "global_step": 417462, "epoch": 5029} {"train_loss": -26.65032958984375, "global_step": 417463, "epoch": 5029} {"train_loss": -26.60445213317871, "global_step": 417464, "epoch": 5029} {"train_loss": -26.4737606048584, "global_step": 417465, "epoch": 5029} {"train_loss": -26.77621841430664, "global_step": 417466, "epoch": 5029} {"train_loss": -26.90885353088379, "global_step": 417467, "epoch": 5029} {"train_loss": -26.82634925842285, "global_step": 417468, "epoch": 5029} {"train_loss": -26.66851806640625, "global_step": 417469, "epoch": 5029} {"train_loss": -26.69087028503418, "global_step": 417470, "epoch": 5029} {"train_loss": -26.303449630737305, "global_step": 417471, "epoch": 5029} {"train_loss": -26.6778507232666, "global_step": 417472, "epoch": 5029} {"train_loss": -26.58868980407715, "global_step": 417473, "epoch": 5029} {"train_loss": -27.06092643737793, "global_step": 417474, "epoch": 5029} {"train_loss": -26.696292877197266, "global_step": 417475, "epoch": 5029} {"train_loss": -26.554798126220703, "global_step": 417476, "epoch": 5029} {"train_loss": -26.420454025268555, "global_step": 417477, "epoch": 5029} {"train_loss": -27.040542602539062, "global_step": 417478, "epoch": 5029} {"train_loss": -27.00507164001465, "global_step": 417479, "epoch": 5029} {"train_loss": -26.848159790039062, "global_step": 417480, "epoch": 5029} {"train_loss": -26.82721519470215, "global_step": 417481, "epoch": 5029} {"train_loss": -26.632099151611328, "global_step": 417482, "epoch": 5029} {"train_loss": -26.91552734375, "global_step": 417483, "epoch": 5029} {"train_loss": -26.987913131713867, "global_step": 417484, "epoch": 5029} {"train_loss": -26.55414390563965, "global_step": 417485, "epoch": 5029} {"train_loss": -27.01752281188965, "global_step": 417486, "epoch": 5029} {"train_loss": -26.420215606689453, "global_step": 417487, "epoch": 5029} {"train_loss": -27.094282150268555, "global_step": 417488, "epoch": 5029} {"train_loss": -26.70446221225233, "global_step": 417489, "epoch": 5029, "val_loss": 6548318.0} {"train_loss": -25.959325790405273, "global_step": 417490, "epoch": 5030} {"train_loss": -26.292133331298828, "global_step": 417491, "epoch": 5030} {"train_loss": -26.181238174438477, "global_step": 417492, "epoch": 5030} {"train_loss": -25.71498680114746, "global_step": 417493, "epoch": 5030} {"train_loss": -26.353361129760742, "global_step": 417494, "epoch": 5030} {"train_loss": -26.312030792236328, "global_step": 417495, "epoch": 5030} {"train_loss": -26.679723739624023, "global_step": 417496, "epoch": 5030} {"train_loss": -26.288904190063477, "global_step": 417497, "epoch": 5030} {"train_loss": -26.327133178710938, "global_step": 417498, "epoch": 5030} {"train_loss": -26.346288681030273, "global_step": 417499, "epoch": 5030} {"train_loss": -26.592395782470703, "global_step": 417500, "epoch": 5030} {"train_loss": -26.070556640625, "global_step": 417501, "epoch": 5030} {"train_loss": -26.503509521484375, "global_step": 417502, "epoch": 5030} {"train_loss": -26.787389755249023, "global_step": 417503, "epoch": 5030} {"train_loss": -26.60556983947754, "global_step": 417504, "epoch": 5030} {"train_loss": -26.695615768432617, "global_step": 417505, "epoch": 5030} {"train_loss": -26.728561401367188, "global_step": 417506, "epoch": 5030} {"train_loss": -26.88999366760254, "global_step": 417507, "epoch": 5030} {"train_loss": -26.529531478881836, "global_step": 417508, "epoch": 5030} {"train_loss": -26.405136108398438, "global_step": 417509, "epoch": 5030} {"train_loss": -26.849166870117188, "global_step": 417510, "epoch": 5030} {"train_loss": -26.423791885375977, "global_step": 417511, "epoch": 5030} {"train_loss": -26.390058517456055, "global_step": 417512, "epoch": 5030} {"train_loss": -27.01218605041504, "global_step": 417513, "epoch": 5030} {"train_loss": -27.04852294921875, "global_step": 417514, "epoch": 5030} {"train_loss": -26.44913101196289, "global_step": 417515, "epoch": 5030} {"train_loss": -26.609174728393555, "global_step": 417516, "epoch": 5030} {"train_loss": -26.766721725463867, "global_step": 417517, "epoch": 5030} {"train_loss": -26.96040916442871, "global_step": 417518, "epoch": 5030} {"train_loss": -26.69512939453125, "global_step": 417519, "epoch": 5030} {"train_loss": -26.870471954345703, "global_step": 417520, "epoch": 5030} {"train_loss": -26.711322784423828, "global_step": 417521, "epoch": 5030} {"train_loss": -26.662494659423828, "global_step": 417522, "epoch": 5030} {"train_loss": -26.909927368164062, "global_step": 417523, "epoch": 5030} {"train_loss": -27.029401779174805, "global_step": 417524, "epoch": 5030} {"train_loss": -27.076435089111328, "global_step": 417525, "epoch": 5030} {"train_loss": -26.90301513671875, "global_step": 417526, "epoch": 5030} {"train_loss": -27.309101104736328, "global_step": 417527, "epoch": 5030} {"train_loss": -26.61249351501465, "global_step": 417528, "epoch": 5030} {"train_loss": -26.600717544555664, "global_step": 417529, "epoch": 5030} {"train_loss": -26.726476669311523, "global_step": 417530, "epoch": 5030} {"train_loss": -27.303503036499023, "global_step": 417531, "epoch": 5030} {"train_loss": -26.93450355529785, "global_step": 417532, "epoch": 5030} {"train_loss": -26.861047744750977, "global_step": 417533, "epoch": 5030} {"train_loss": -26.907806396484375, "global_step": 417534, "epoch": 5030} {"train_loss": -26.911712646484375, "global_step": 417535, "epoch": 5030} {"train_loss": -26.840845108032227, "global_step": 417536, "epoch": 5030} {"train_loss": -26.99493980407715, "global_step": 417537, "epoch": 5030} {"train_loss": -26.953662872314453, "global_step": 417538, "epoch": 5030} {"train_loss": -27.178571701049805, "global_step": 417539, "epoch": 5030} {"train_loss": -27.03606605529785, "global_step": 417540, "epoch": 5030} {"train_loss": -26.527135848999023, "global_step": 417541, "epoch": 5030} {"train_loss": -26.540847778320312, "global_step": 417542, "epoch": 5030} {"train_loss": -26.71294593811035, "global_step": 417543, "epoch": 5030} {"train_loss": -26.886823654174805, "global_step": 417544, "epoch": 5030} {"train_loss": -26.751195907592773, "global_step": 417545, "epoch": 5030} {"train_loss": -27.025232315063477, "global_step": 417546, "epoch": 5030} {"train_loss": -26.938276290893555, "global_step": 417547, "epoch": 5030} {"train_loss": -26.861968994140625, "global_step": 417548, "epoch": 5030} {"train_loss": -26.873071670532227, "global_step": 417549, "epoch": 5030} {"train_loss": -26.69318199157715, "global_step": 417550, "epoch": 5030} {"train_loss": -26.825977325439453, "global_step": 417551, "epoch": 5030} {"train_loss": -26.404687881469727, "global_step": 417552, "epoch": 5030} {"train_loss": -26.935657501220703, "global_step": 417553, "epoch": 5030} {"train_loss": -26.8747501373291, "global_step": 417554, "epoch": 5030} {"train_loss": -26.617074966430664, "global_step": 417555, "epoch": 5030} {"train_loss": -26.60325050354004, "global_step": 417556, "epoch": 5030} {"train_loss": -26.581573486328125, "global_step": 417557, "epoch": 5030} {"train_loss": -26.741260528564453, "global_step": 417558, "epoch": 5030} {"train_loss": -26.66982078552246, "global_step": 417559, "epoch": 5030} {"train_loss": -27.246328353881836, "global_step": 417560, "epoch": 5030} {"train_loss": -26.824283599853516, "global_step": 417561, "epoch": 5030} {"train_loss": -26.97304344177246, "global_step": 417562, "epoch": 5030} {"train_loss": -26.691150665283203, "global_step": 417563, "epoch": 5030} {"train_loss": -26.737668991088867, "global_step": 417564, "epoch": 5030} {"train_loss": -26.311941146850586, "global_step": 417565, "epoch": 5030} {"train_loss": -25.8713436126709, "global_step": 417566, "epoch": 5030} {"train_loss": -25.459522247314453, "global_step": 417567, "epoch": 5030} {"train_loss": -25.93404197692871, "global_step": 417568, "epoch": 5030} {"train_loss": -26.5460147857666, "global_step": 417569, "epoch": 5030} {"train_loss": -26.288177490234375, "global_step": 417570, "epoch": 5030} {"train_loss": -26.32826042175293, "global_step": 417571, "epoch": 5030} {"train_loss": -26.65866957515119, "global_step": 417572, "epoch": 5030, "val_loss": 6494894.0} {"train_loss": -26.395004272460938, "global_step": 417573, "epoch": 5031} {"train_loss": -25.72806167602539, "global_step": 417574, "epoch": 5031} {"train_loss": -26.111059188842773, "global_step": 417575, "epoch": 5031} {"train_loss": -25.946121215820312, "global_step": 417576, "epoch": 5031} {"train_loss": -25.91859245300293, "global_step": 417577, "epoch": 5031} {"train_loss": -26.03033447265625, "global_step": 417578, "epoch": 5031} {"train_loss": -26.150970458984375, "global_step": 417579, "epoch": 5031} {"train_loss": -26.43891716003418, "global_step": 417580, "epoch": 5031} {"train_loss": -25.93804359436035, "global_step": 417581, "epoch": 5031} {"train_loss": -26.7388858795166, "global_step": 417582, "epoch": 5031} {"train_loss": -26.33819580078125, "global_step": 417583, "epoch": 5031} {"train_loss": -26.19733238220215, "global_step": 417584, "epoch": 5031} {"train_loss": -26.351348876953125, "global_step": 417585, "epoch": 5031} {"train_loss": -26.549549102783203, "global_step": 417586, "epoch": 5031} {"train_loss": -26.690052032470703, "global_step": 417587, "epoch": 5031} {"train_loss": -26.233484268188477, "global_step": 417588, "epoch": 5031} {"train_loss": -26.693700790405273, "global_step": 417589, "epoch": 5031} {"train_loss": -26.465200424194336, "global_step": 417590, "epoch": 5031} {"train_loss": -26.510000228881836, "global_step": 417591, "epoch": 5031} {"train_loss": -26.58552360534668, "global_step": 417592, "epoch": 5031} {"train_loss": -26.840991973876953, "global_step": 417593, "epoch": 5031} {"train_loss": -26.571802139282227, "global_step": 417594, "epoch": 5031} {"train_loss": -26.437265396118164, "global_step": 417595, "epoch": 5031} {"train_loss": -26.495092391967773, "global_step": 417596, "epoch": 5031} {"train_loss": -26.869291305541992, "global_step": 417597, "epoch": 5031} {"train_loss": -26.817737579345703, "global_step": 417598, "epoch": 5031} {"train_loss": -26.258588790893555, "global_step": 417599, "epoch": 5031} {"train_loss": -26.804529190063477, "global_step": 417600, "epoch": 5031} {"train_loss": -26.76434898376465, "global_step": 417601, "epoch": 5031} {"train_loss": -26.81511878967285, "global_step": 417602, "epoch": 5031} {"train_loss": -26.693830490112305, "global_step": 417603, "epoch": 5031} {"train_loss": -26.8617000579834, "global_step": 417604, "epoch": 5031} {"train_loss": -26.748571395874023, "global_step": 417605, "epoch": 5031} {"train_loss": -27.062524795532227, "global_step": 417606, "epoch": 5031} {"train_loss": -26.650863647460938, "global_step": 417607, "epoch": 5031} {"train_loss": -26.9676570892334, "global_step": 417608, "epoch": 5031} {"train_loss": -26.894155502319336, "global_step": 417609, "epoch": 5031} {"train_loss": -27.08015251159668, "global_step": 417610, "epoch": 5031} {"train_loss": -26.6533203125, "global_step": 417611, "epoch": 5031} {"train_loss": -26.985071182250977, "global_step": 417612, "epoch": 5031} {"train_loss": -27.231000900268555, "global_step": 417613, "epoch": 5031} {"train_loss": -27.0224552154541, "global_step": 417614, "epoch": 5031} {"train_loss": -26.715097427368164, "global_step": 417615, "epoch": 5031} {"train_loss": -26.73335838317871, "global_step": 417616, "epoch": 5031} {"train_loss": -27.202972412109375, "global_step": 417617, "epoch": 5031} {"train_loss": -26.8226375579834, "global_step": 417618, "epoch": 5031} {"train_loss": -26.59394645690918, "global_step": 417619, "epoch": 5031} {"train_loss": -26.488122940063477, "global_step": 417620, "epoch": 5031} {"train_loss": -26.947912216186523, "global_step": 417621, "epoch": 5031} {"train_loss": -26.751508712768555, "global_step": 417622, "epoch": 5031} {"train_loss": -26.868432998657227, "global_step": 417623, "epoch": 5031} {"train_loss": -26.31414794921875, "global_step": 417624, "epoch": 5031} {"train_loss": -26.499372482299805, "global_step": 417625, "epoch": 5031} {"train_loss": -26.721099853515625, "global_step": 417626, "epoch": 5031} {"train_loss": -27.0161075592041, "global_step": 417627, "epoch": 5031} {"train_loss": -27.029376983642578, "global_step": 417628, "epoch": 5031} {"train_loss": -26.492752075195312, "global_step": 417629, "epoch": 5031} {"train_loss": -26.912948608398438, "global_step": 417630, "epoch": 5031} {"train_loss": -26.989017486572266, "global_step": 417631, "epoch": 5031} {"train_loss": -26.70599365234375, "global_step": 417632, "epoch": 5031} {"train_loss": -27.107105255126953, "global_step": 417633, "epoch": 5031} {"train_loss": -26.8924617767334, "global_step": 417634, "epoch": 5031} {"train_loss": -27.071386337280273, "global_step": 417635, "epoch": 5031} {"train_loss": -26.841861724853516, "global_step": 417636, "epoch": 5031} {"train_loss": -26.574045181274414, "global_step": 417637, "epoch": 5031} {"train_loss": -26.962778091430664, "global_step": 417638, "epoch": 5031} {"train_loss": -26.83711051940918, "global_step": 417639, "epoch": 5031} {"train_loss": -26.962141036987305, "global_step": 417640, "epoch": 5031} {"train_loss": -27.190698623657227, "global_step": 417641, "epoch": 5031} {"train_loss": -26.756763458251953, "global_step": 417642, "epoch": 5031} {"train_loss": -26.963895797729492, "global_step": 417643, "epoch": 5031} {"train_loss": -26.945199966430664, "global_step": 417644, "epoch": 5031} {"train_loss": -26.856842041015625, "global_step": 417645, "epoch": 5031} {"train_loss": -26.797637939453125, "global_step": 417646, "epoch": 5031} {"train_loss": -26.429468154907227, "global_step": 417647, "epoch": 5031} {"train_loss": -26.93037986755371, "global_step": 417648, "epoch": 5031} {"train_loss": -27.114789962768555, "global_step": 417649, "epoch": 5031} {"train_loss": -26.983057022094727, "global_step": 417650, "epoch": 5031} {"train_loss": -26.611083984375, "global_step": 417651, "epoch": 5031} {"train_loss": -26.57967185974121, "global_step": 417652, "epoch": 5031} {"train_loss": -26.849218368530273, "global_step": 417653, "epoch": 5031} {"train_loss": -26.91364097595215, "global_step": 417654, "epoch": 5031} {"train_loss": -26.703386996165815, "global_step": 417655, "epoch": 5031, "val_loss": 6562778.0} {"train_loss": -26.255346298217773, "global_step": 417656, "epoch": 5032} {"train_loss": -26.470075607299805, "global_step": 417657, "epoch": 5032} {"train_loss": -26.156442642211914, "global_step": 417658, "epoch": 5032} {"train_loss": -26.83774757385254, "global_step": 417659, "epoch": 5032} {"train_loss": -26.59626579284668, "global_step": 417660, "epoch": 5032} {"train_loss": -26.53266716003418, "global_step": 417661, "epoch": 5032} {"train_loss": -26.350021362304688, "global_step": 417662, "epoch": 5032} {"train_loss": -26.3763370513916, "global_step": 417663, "epoch": 5032} {"train_loss": -26.474363327026367, "global_step": 417664, "epoch": 5032} {"train_loss": -26.561908721923828, "global_step": 417665, "epoch": 5032} {"train_loss": -26.916913986206055, "global_step": 417666, "epoch": 5032} {"train_loss": -26.395963668823242, "global_step": 417667, "epoch": 5032} {"train_loss": -26.41925048828125, "global_step": 417668, "epoch": 5032} {"train_loss": -26.29060173034668, "global_step": 417669, "epoch": 5032} {"train_loss": -26.94302749633789, "global_step": 417670, "epoch": 5032} {"train_loss": -26.632429122924805, "global_step": 417671, "epoch": 5032} {"train_loss": -26.98198890686035, "global_step": 417672, "epoch": 5032} {"train_loss": -27.3321475982666, "global_step": 417673, "epoch": 5032} {"train_loss": -26.87579917907715, "global_step": 417674, "epoch": 5032} {"train_loss": -26.738935470581055, "global_step": 417675, "epoch": 5032} {"train_loss": -26.7958984375, "global_step": 417676, "epoch": 5032} {"train_loss": -26.878833770751953, "global_step": 417677, "epoch": 5032} {"train_loss": -26.79931640625, "global_step": 417678, "epoch": 5032} {"train_loss": -26.508691787719727, "global_step": 417679, "epoch": 5032} {"train_loss": -26.63826560974121, "global_step": 417680, "epoch": 5032} {"train_loss": -26.75494956970215, "global_step": 417681, "epoch": 5032} {"train_loss": -26.8853816986084, "global_step": 417682, "epoch": 5032} {"train_loss": -27.057479858398438, "global_step": 417683, "epoch": 5032} {"train_loss": -27.041889190673828, "global_step": 417684, "epoch": 5032} {"train_loss": -26.935712814331055, "global_step": 417685, "epoch": 5032} {"train_loss": -27.179792404174805, "global_step": 417686, "epoch": 5032} {"train_loss": -27.0696964263916, "global_step": 417687, "epoch": 5032} {"train_loss": -26.95313835144043, "global_step": 417688, "epoch": 5032} {"train_loss": -26.88795280456543, "global_step": 417689, "epoch": 5032} {"train_loss": -26.66925621032715, "global_step": 417690, "epoch": 5032} {"train_loss": -26.977781295776367, "global_step": 417691, "epoch": 5032} {"train_loss": -26.2556209564209, "global_step": 417692, "epoch": 5032} {"train_loss": -26.76922607421875, "global_step": 417693, "epoch": 5032} {"train_loss": -26.959997177124023, "global_step": 417694, "epoch": 5032} {"train_loss": -26.798908233642578, "global_step": 417695, "epoch": 5032} {"train_loss": -26.81842613220215, "global_step": 417696, "epoch": 5032} {"train_loss": -26.532623291015625, "global_step": 417697, "epoch": 5032} {"train_loss": -26.649442672729492, "global_step": 417698, "epoch": 5032} {"train_loss": -26.72076416015625, "global_step": 417699, "epoch": 5032} {"train_loss": -26.770965576171875, "global_step": 417700, "epoch": 5032} {"train_loss": -26.79376792907715, "global_step": 417701, "epoch": 5032} {"train_loss": -26.872480392456055, "global_step": 417702, "epoch": 5032} {"train_loss": -27.10707664489746, "global_step": 417703, "epoch": 5032} {"train_loss": -26.75043296813965, "global_step": 417704, "epoch": 5032} {"train_loss": -27.022602081298828, "global_step": 417705, "epoch": 5032} {"train_loss": -26.787885665893555, "global_step": 417706, "epoch": 5032} {"train_loss": -27.09694480895996, "global_step": 417707, "epoch": 5032} {"train_loss": -26.882770538330078, "global_step": 417708, "epoch": 5032} {"train_loss": -27.036970138549805, "global_step": 417709, "epoch": 5032} {"train_loss": -26.716318130493164, "global_step": 417710, "epoch": 5032} {"train_loss": -26.97865104675293, "global_step": 417711, "epoch": 5032} {"train_loss": -26.863447189331055, "global_step": 417712, "epoch": 5032} {"train_loss": -26.781269073486328, "global_step": 417713, "epoch": 5032} {"train_loss": -26.76486587524414, "global_step": 417714, "epoch": 5032} {"train_loss": -26.333539962768555, "global_step": 417715, "epoch": 5032} {"train_loss": -26.763486862182617, "global_step": 417716, "epoch": 5032} {"train_loss": -27.120014190673828, "global_step": 417717, "epoch": 5032} {"train_loss": -26.883344650268555, "global_step": 417718, "epoch": 5032} {"train_loss": -26.309106826782227, "global_step": 417719, "epoch": 5032} {"train_loss": -26.13813591003418, "global_step": 417720, "epoch": 5032} {"train_loss": -25.903532028198242, "global_step": 417721, "epoch": 5032} {"train_loss": -26.644113540649414, "global_step": 417722, "epoch": 5032} {"train_loss": -26.43877601623535, "global_step": 417723, "epoch": 5032} {"train_loss": -26.40614128112793, "global_step": 417724, "epoch": 5032} {"train_loss": -26.833112716674805, "global_step": 417725, "epoch": 5032} {"train_loss": -26.497716903686523, "global_step": 417726, "epoch": 5032} {"train_loss": -26.716535568237305, "global_step": 417727, "epoch": 5032} {"train_loss": -26.67461585998535, "global_step": 417728, "epoch": 5032} {"train_loss": -26.504150390625, "global_step": 417729, "epoch": 5032} {"train_loss": -26.756772994995117, "global_step": 417730, "epoch": 5032} {"train_loss": -26.6824951171875, "global_step": 417731, "epoch": 5032} {"train_loss": -26.762426376342773, "global_step": 417732, "epoch": 5032} {"train_loss": -26.67176628112793, "global_step": 417733, "epoch": 5032} {"train_loss": -26.38551902770996, "global_step": 417734, "epoch": 5032} {"train_loss": -26.516468048095703, "global_step": 417735, "epoch": 5032} {"train_loss": -26.736738204956055, "global_step": 417736, "epoch": 5032} {"train_loss": -26.733739852905273, "global_step": 417737, "epoch": 5032} {"train_loss": -26.704949252576714, "global_step": 417738, "epoch": 5032, "val_loss": 6676500.5} {"train_loss": -26.082067489624023, "global_step": 417739, "epoch": 5033} {"train_loss": -25.19817543029785, "global_step": 417740, "epoch": 5033} {"train_loss": -25.949054718017578, "global_step": 417741, "epoch": 5033} {"train_loss": -26.17689323425293, "global_step": 417742, "epoch": 5033} {"train_loss": -25.698795318603516, "global_step": 417743, "epoch": 5033} {"train_loss": -26.13389015197754, "global_step": 417744, "epoch": 5033} {"train_loss": -26.000791549682617, "global_step": 417745, "epoch": 5033} {"train_loss": -25.559049606323242, "global_step": 417746, "epoch": 5033} {"train_loss": -25.60955810546875, "global_step": 417747, "epoch": 5033} {"train_loss": -26.065542221069336, "global_step": 417748, "epoch": 5033} {"train_loss": -26.627826690673828, "global_step": 417749, "epoch": 5033} {"train_loss": -25.935596466064453, "global_step": 417750, "epoch": 5033} {"train_loss": -26.29949378967285, "global_step": 417751, "epoch": 5033} {"train_loss": -26.54277992248535, "global_step": 417752, "epoch": 5033} {"train_loss": -25.71295166015625, "global_step": 417753, "epoch": 5033} {"train_loss": -26.456958770751953, "global_step": 417754, "epoch": 5033} {"train_loss": -26.40167236328125, "global_step": 417755, "epoch": 5033} {"train_loss": -26.614770889282227, "global_step": 417756, "epoch": 5033} {"train_loss": -26.503406524658203, "global_step": 417757, "epoch": 5033} {"train_loss": -26.812744140625, "global_step": 417758, "epoch": 5033} {"train_loss": -25.7008113861084, "global_step": 417759, "epoch": 5033} {"train_loss": -26.452184677124023, "global_step": 417760, "epoch": 5033} {"train_loss": -26.286762237548828, "global_step": 417761, "epoch": 5033} {"train_loss": -26.018909454345703, "global_step": 417762, "epoch": 5033} {"train_loss": -26.651065826416016, "global_step": 417763, "epoch": 5033} {"train_loss": -26.24844741821289, "global_step": 417764, "epoch": 5033} {"train_loss": -26.68763542175293, "global_step": 417765, "epoch": 5033} {"train_loss": -26.357213973999023, "global_step": 417766, "epoch": 5033} {"train_loss": -26.694171905517578, "global_step": 417767, "epoch": 5033} {"train_loss": -26.58127784729004, "global_step": 417768, "epoch": 5033} {"train_loss": -26.583377838134766, "global_step": 417769, "epoch": 5033} {"train_loss": -26.81111717224121, "global_step": 417770, "epoch": 5033} {"train_loss": -26.38836097717285, "global_step": 417771, "epoch": 5033} {"train_loss": -26.509260177612305, "global_step": 417772, "epoch": 5033} {"train_loss": -26.959171295166016, "global_step": 417773, "epoch": 5033} {"train_loss": -26.7530460357666, "global_step": 417774, "epoch": 5033} {"train_loss": -26.8079776763916, "global_step": 417775, "epoch": 5033} {"train_loss": -26.637693405151367, "global_step": 417776, "epoch": 5033} {"train_loss": -26.80780601501465, "global_step": 417777, "epoch": 5033} {"train_loss": -26.388092041015625, "global_step": 417778, "epoch": 5033} {"train_loss": -26.804584503173828, "global_step": 417779, "epoch": 5033} {"train_loss": -26.93098258972168, "global_step": 417780, "epoch": 5033} {"train_loss": -26.71607780456543, "global_step": 417781, "epoch": 5033} {"train_loss": -27.047119140625, "global_step": 417782, "epoch": 5033} {"train_loss": -26.854019165039062, "global_step": 417783, "epoch": 5033} {"train_loss": -26.44512939453125, "global_step": 417784, "epoch": 5033} {"train_loss": -26.843164443969727, "global_step": 417785, "epoch": 5033} {"train_loss": -26.87558364868164, "global_step": 417786, "epoch": 5033} {"train_loss": -26.8460636138916, "global_step": 417787, "epoch": 5033} {"train_loss": -26.9613037109375, "global_step": 417788, "epoch": 5033} {"train_loss": -26.99561882019043, "global_step": 417789, "epoch": 5033} {"train_loss": -27.148584365844727, "global_step": 417790, "epoch": 5033} {"train_loss": -27.2078914642334, "global_step": 417791, "epoch": 5033} {"train_loss": -27.287479400634766, "global_step": 417792, "epoch": 5033} {"train_loss": -26.46331214904785, "global_step": 417793, "epoch": 5033} {"train_loss": -27.0802059173584, "global_step": 417794, "epoch": 5033} {"train_loss": -26.962732315063477, "global_step": 417795, "epoch": 5033} {"train_loss": -27.63753318786621, "global_step": 417796, "epoch": 5033} {"train_loss": -26.9229679107666, "global_step": 417797, "epoch": 5033} {"train_loss": -26.97906494140625, "global_step": 417798, "epoch": 5033} {"train_loss": -27.063446044921875, "global_step": 417799, "epoch": 5033} {"train_loss": -26.43086051940918, "global_step": 417800, "epoch": 5033} {"train_loss": -26.86030387878418, "global_step": 417801, "epoch": 5033} {"train_loss": -26.845733642578125, "global_step": 417802, "epoch": 5033} {"train_loss": -26.674238204956055, "global_step": 417803, "epoch": 5033} {"train_loss": -26.525827407836914, "global_step": 417804, "epoch": 5033} {"train_loss": -26.870023727416992, "global_step": 417805, "epoch": 5033} {"train_loss": -26.363037109375, "global_step": 417806, "epoch": 5033} {"train_loss": -26.525970458984375, "global_step": 417807, "epoch": 5033} {"train_loss": -26.519678115844727, "global_step": 417808, "epoch": 5033} {"train_loss": -26.95650291442871, "global_step": 417809, "epoch": 5033} {"train_loss": -26.7574405670166, "global_step": 417810, "epoch": 5033} {"train_loss": -26.926807403564453, "global_step": 417811, "epoch": 5033} {"train_loss": -26.548532485961914, "global_step": 417812, "epoch": 5033} {"train_loss": -27.243152618408203, "global_step": 417813, "epoch": 5033} {"train_loss": -26.3096923828125, "global_step": 417814, "epoch": 5033} {"train_loss": -27.006139755249023, "global_step": 417815, "epoch": 5033} {"train_loss": -26.691516876220703, "global_step": 417816, "epoch": 5033} {"train_loss": -27.048206329345703, "global_step": 417817, "epoch": 5033} {"train_loss": -27.0086669921875, "global_step": 417818, "epoch": 5033} {"train_loss": -26.85833740234375, "global_step": 417819, "epoch": 5033} {"train_loss": -27.245283126831055, "global_step": 417820, "epoch": 5033} {"train_loss": -26.623935906283826, "global_step": 417821, "epoch": 5033, "val_loss": 6638337.0} {"train_loss": -26.729019165039062, "global_step": 417822, "epoch": 5034} {"train_loss": -25.90574073791504, "global_step": 417823, "epoch": 5034} {"train_loss": -26.200210571289062, "global_step": 417824, "epoch": 5034} {"train_loss": -26.668004989624023, "global_step": 417825, "epoch": 5034} {"train_loss": -26.063735961914062, "global_step": 417826, "epoch": 5034} {"train_loss": -26.03009605407715, "global_step": 417827, "epoch": 5034} {"train_loss": -26.47953224182129, "global_step": 417828, "epoch": 5034} {"train_loss": -26.3876953125, "global_step": 417829, "epoch": 5034} {"train_loss": -25.999835968017578, "global_step": 417830, "epoch": 5034} {"train_loss": -25.896778106689453, "global_step": 417831, "epoch": 5034} {"train_loss": -26.366174697875977, "global_step": 417832, "epoch": 5034} {"train_loss": -26.90791130065918, "global_step": 417833, "epoch": 5034} {"train_loss": -26.684579849243164, "global_step": 417834, "epoch": 5034} {"train_loss": -26.39693260192871, "global_step": 417835, "epoch": 5034} {"train_loss": -26.589752197265625, "global_step": 417836, "epoch": 5034} {"train_loss": -26.59922218322754, "global_step": 417837, "epoch": 5034} {"train_loss": -26.960132598876953, "global_step": 417838, "epoch": 5034} {"train_loss": -26.809661865234375, "global_step": 417839, "epoch": 5034} {"train_loss": -26.69099235534668, "global_step": 417840, "epoch": 5034} {"train_loss": -27.05364418029785, "global_step": 417841, "epoch": 5034} {"train_loss": -26.30604362487793, "global_step": 417842, "epoch": 5034} {"train_loss": -26.868637084960938, "global_step": 417843, "epoch": 5034} {"train_loss": -26.978412628173828, "global_step": 417844, "epoch": 5034} {"train_loss": -26.511117935180664, "global_step": 417845, "epoch": 5034} {"train_loss": -26.826496124267578, "global_step": 417846, "epoch": 5034} {"train_loss": -26.544790267944336, "global_step": 417847, "epoch": 5034} {"train_loss": -26.882892608642578, "global_step": 417848, "epoch": 5034} {"train_loss": -26.719038009643555, "global_step": 417849, "epoch": 5034} {"train_loss": -26.64691162109375, "global_step": 417850, "epoch": 5034} {"train_loss": -26.514724731445312, "global_step": 417851, "epoch": 5034} {"train_loss": -26.309106826782227, "global_step": 417852, "epoch": 5034} {"train_loss": -26.5939998626709, "global_step": 417853, "epoch": 5034} {"train_loss": -26.595441818237305, "global_step": 417854, "epoch": 5034} {"train_loss": -26.748153686523438, "global_step": 417855, "epoch": 5034} {"train_loss": -26.8289852142334, "global_step": 417856, "epoch": 5034} {"train_loss": -26.465961456298828, "global_step": 417857, "epoch": 5034} {"train_loss": -26.778736114501953, "global_step": 417858, "epoch": 5034} {"train_loss": -26.646142959594727, "global_step": 417859, "epoch": 5034} {"train_loss": -27.497900009155273, "global_step": 417860, "epoch": 5034} {"train_loss": -26.861982345581055, "global_step": 417861, "epoch": 5034} {"train_loss": -26.58502197265625, "global_step": 417862, "epoch": 5034} {"train_loss": -26.341825485229492, "global_step": 417863, "epoch": 5034} {"train_loss": -26.635955810546875, "global_step": 417864, "epoch": 5034} {"train_loss": -27.104766845703125, "global_step": 417865, "epoch": 5034} {"train_loss": -27.191864013671875, "global_step": 417866, "epoch": 5034} {"train_loss": -26.66578483581543, "global_step": 417867, "epoch": 5034} {"train_loss": -26.652368545532227, "global_step": 417868, "epoch": 5034} {"train_loss": -27.410858154296875, "global_step": 417869, "epoch": 5034} {"train_loss": -27.07602882385254, "global_step": 417870, "epoch": 5034} {"train_loss": -26.75467872619629, "global_step": 417871, "epoch": 5034} {"train_loss": -27.028461456298828, "global_step": 417872, "epoch": 5034} {"train_loss": -26.953231811523438, "global_step": 417873, "epoch": 5034} {"train_loss": -26.85013771057129, "global_step": 417874, "epoch": 5034} {"train_loss": -26.861785888671875, "global_step": 417875, "epoch": 5034} {"train_loss": -27.101388931274414, "global_step": 417876, "epoch": 5034} {"train_loss": -26.99976921081543, "global_step": 417877, "epoch": 5034} {"train_loss": -26.51325035095215, "global_step": 417878, "epoch": 5034} {"train_loss": -26.452558517456055, "global_step": 417879, "epoch": 5034} {"train_loss": -26.78553581237793, "global_step": 417880, "epoch": 5034} {"train_loss": -26.647180557250977, "global_step": 417881, "epoch": 5034} {"train_loss": -26.14430809020996, "global_step": 417882, "epoch": 5034} {"train_loss": -26.25278663635254, "global_step": 417883, "epoch": 5034} {"train_loss": -26.514728546142578, "global_step": 417884, "epoch": 5034} {"train_loss": -26.488758087158203, "global_step": 417885, "epoch": 5034} {"train_loss": -26.444440841674805, "global_step": 417886, "epoch": 5034} {"train_loss": -26.048749923706055, "global_step": 417887, "epoch": 5034} {"train_loss": -26.74143409729004, "global_step": 417888, "epoch": 5034} {"train_loss": -26.69268226623535, "global_step": 417889, "epoch": 5034} {"train_loss": -26.57950210571289, "global_step": 417890, "epoch": 5034} {"train_loss": -26.608823776245117, "global_step": 417891, "epoch": 5034} {"train_loss": -26.77435302734375, "global_step": 417892, "epoch": 5034} {"train_loss": -26.736312866210938, "global_step": 417893, "epoch": 5034} {"train_loss": -26.957839965820312, "global_step": 417894, "epoch": 5034} {"train_loss": -27.098318099975586, "global_step": 417895, "epoch": 5034} {"train_loss": -26.75982093811035, "global_step": 417896, "epoch": 5034} {"train_loss": -26.460229873657227, "global_step": 417897, "epoch": 5034} {"train_loss": -26.674833297729492, "global_step": 417898, "epoch": 5034} {"train_loss": -26.454965591430664, "global_step": 417899, "epoch": 5034} {"train_loss": -26.8080997467041, "global_step": 417900, "epoch": 5034} {"train_loss": -26.835851669311523, "global_step": 417901, "epoch": 5034} {"train_loss": -26.5249080657959, "global_step": 417902, "epoch": 5034} {"train_loss": -26.984846115112305, "global_step": 417903, "epoch": 5034} {"train_loss": -26.66502954873694, "global_step": 417904, "epoch": 5034, "val_loss": 6516642.0} {"train_loss": -24.757627487182617, "global_step": 417905, "epoch": 5035} {"train_loss": -26.036529541015625, "global_step": 417906, "epoch": 5035} {"train_loss": -25.684799194335938, "global_step": 417907, "epoch": 5035} {"train_loss": -25.710020065307617, "global_step": 417908, "epoch": 5035} {"train_loss": -26.39386558532715, "global_step": 417909, "epoch": 5035} {"train_loss": -25.930561065673828, "global_step": 417910, "epoch": 5035} {"train_loss": -25.9603328704834, "global_step": 417911, "epoch": 5035} {"train_loss": -26.33265495300293, "global_step": 417912, "epoch": 5035} {"train_loss": -26.006982803344727, "global_step": 417913, "epoch": 5035} {"train_loss": -26.289794921875, "global_step": 417914, "epoch": 5035} {"train_loss": -26.068084716796875, "global_step": 417915, "epoch": 5035} {"train_loss": -26.210742950439453, "global_step": 417916, "epoch": 5035} {"train_loss": -26.614599227905273, "global_step": 417917, "epoch": 5035} {"train_loss": -25.780506134033203, "global_step": 417918, "epoch": 5035} {"train_loss": -26.15591812133789, "global_step": 417919, "epoch": 5035} {"train_loss": -26.230915069580078, "global_step": 417920, "epoch": 5035} {"train_loss": -26.73097038269043, "global_step": 417921, "epoch": 5035} {"train_loss": -26.4034423828125, "global_step": 417922, "epoch": 5035} {"train_loss": -26.161514282226562, "global_step": 417923, "epoch": 5035} {"train_loss": -26.31096839904785, "global_step": 417924, "epoch": 5035} {"train_loss": -26.22784996032715, "global_step": 417925, "epoch": 5035} {"train_loss": -26.43048095703125, "global_step": 417926, "epoch": 5035} {"train_loss": -26.39089012145996, "global_step": 417927, "epoch": 5035} {"train_loss": -26.65317153930664, "global_step": 417928, "epoch": 5035} {"train_loss": -26.42746353149414, "global_step": 417929, "epoch": 5035} {"train_loss": -26.647933959960938, "global_step": 417930, "epoch": 5035} {"train_loss": -26.5389347076416, "global_step": 417931, "epoch": 5035} {"train_loss": -26.81658363342285, "global_step": 417932, "epoch": 5035} {"train_loss": -26.699552536010742, "global_step": 417933, "epoch": 5035} {"train_loss": -26.62935447692871, "global_step": 417934, "epoch": 5035} {"train_loss": -26.689624786376953, "global_step": 417935, "epoch": 5035} {"train_loss": -26.810474395751953, "global_step": 417936, "epoch": 5035} {"train_loss": -26.76349449157715, "global_step": 417937, "epoch": 5035} {"train_loss": -26.796659469604492, "global_step": 417938, "epoch": 5035} {"train_loss": -26.35944175720215, "global_step": 417939, "epoch": 5035} {"train_loss": -27.086334228515625, "global_step": 417940, "epoch": 5035} {"train_loss": -26.50668716430664, "global_step": 417941, "epoch": 5035} {"train_loss": -26.6398983001709, "global_step": 417942, "epoch": 5035} {"train_loss": -26.607685089111328, "global_step": 417943, "epoch": 5035} {"train_loss": -26.77362060546875, "global_step": 417944, "epoch": 5035} {"train_loss": -26.792585372924805, "global_step": 417945, "epoch": 5035} {"train_loss": -27.059051513671875, "global_step": 417946, "epoch": 5035} {"train_loss": -26.955305099487305, "global_step": 417947, "epoch": 5035} {"train_loss": -27.073734283447266, "global_step": 417948, "epoch": 5035} {"train_loss": -26.80032730102539, "global_step": 417949, "epoch": 5035} {"train_loss": -26.860544204711914, "global_step": 417950, "epoch": 5035} {"train_loss": -26.864164352416992, "global_step": 417951, "epoch": 5035} {"train_loss": -26.79474449157715, "global_step": 417952, "epoch": 5035} {"train_loss": -26.626697540283203, "global_step": 417953, "epoch": 5035} {"train_loss": -26.873035430908203, "global_step": 417954, "epoch": 5035} {"train_loss": -27.332687377929688, "global_step": 417955, "epoch": 5035} {"train_loss": -26.789453506469727, "global_step": 417956, "epoch": 5035} {"train_loss": -27.002973556518555, "global_step": 417957, "epoch": 5035} {"train_loss": -26.982961654663086, "global_step": 417958, "epoch": 5035} {"train_loss": -26.601978302001953, "global_step": 417959, "epoch": 5035} {"train_loss": -26.938419342041016, "global_step": 417960, "epoch": 5035} {"train_loss": -26.856250762939453, "global_step": 417961, "epoch": 5035} {"train_loss": -26.929290771484375, "global_step": 417962, "epoch": 5035} {"train_loss": -26.90070915222168, "global_step": 417963, "epoch": 5035} {"train_loss": -26.732885360717773, "global_step": 417964, "epoch": 5035} {"train_loss": -26.895278930664062, "global_step": 417965, "epoch": 5035} {"train_loss": -26.68598747253418, "global_step": 417966, "epoch": 5035} {"train_loss": -27.004810333251953, "global_step": 417967, "epoch": 5035} {"train_loss": -26.87546157836914, "global_step": 417968, "epoch": 5035} {"train_loss": -26.569122314453125, "global_step": 417969, "epoch": 5035} {"train_loss": -26.862546920776367, "global_step": 417970, "epoch": 5035} {"train_loss": -26.533557891845703, "global_step": 417971, "epoch": 5035} {"train_loss": -26.098852157592773, "global_step": 417972, "epoch": 5035} {"train_loss": -25.43537712097168, "global_step": 417973, "epoch": 5035} {"train_loss": -25.81390953063965, "global_step": 417974, "epoch": 5035} {"train_loss": -26.210355758666992, "global_step": 417975, "epoch": 5035} {"train_loss": -26.425739288330078, "global_step": 417976, "epoch": 5035} {"train_loss": -26.232690811157227, "global_step": 417977, "epoch": 5035} {"train_loss": -26.57923698425293, "global_step": 417978, "epoch": 5035} {"train_loss": -25.942968368530273, "global_step": 417979, "epoch": 5035} {"train_loss": -25.78806495666504, "global_step": 417980, "epoch": 5035} {"train_loss": -26.7841796875, "global_step": 417981, "epoch": 5035} {"train_loss": -26.534616470336914, "global_step": 417982, "epoch": 5035} {"train_loss": -26.095426559448242, "global_step": 417983, "epoch": 5035} {"train_loss": -26.758203506469727, "global_step": 417984, "epoch": 5035} {"train_loss": -26.625873565673828, "global_step": 417985, "epoch": 5035} {"train_loss": -26.7531795501709, "global_step": 417986, "epoch": 5035} {"train_loss": -26.51627869203866, "global_step": 417987, "epoch": 5035, "val_loss": 6829381.0} {"train_loss": -26.714813232421875, "global_step": 417988, "epoch": 5036} {"train_loss": -26.403669357299805, "global_step": 417989, "epoch": 5036} {"train_loss": -26.285924911499023, "global_step": 417990, "epoch": 5036} {"train_loss": -26.566564559936523, "global_step": 417991, "epoch": 5036} {"train_loss": -26.402332305908203, "global_step": 417992, "epoch": 5036} {"train_loss": -26.72964859008789, "global_step": 417993, "epoch": 5036} {"train_loss": -26.32036781311035, "global_step": 417994, "epoch": 5036} {"train_loss": -26.663650512695312, "global_step": 417995, "epoch": 5036} {"train_loss": -26.596052169799805, "global_step": 417996, "epoch": 5036} {"train_loss": -26.18935203552246, "global_step": 417997, "epoch": 5036} {"train_loss": -26.47149658203125, "global_step": 417998, "epoch": 5036} {"train_loss": -26.715396881103516, "global_step": 417999, "epoch": 5036} {"train_loss": -27.000980377197266, "global_step": 418000, "epoch": 5036} {"train_loss": -26.5947208404541, "global_step": 418001, "epoch": 5036} {"train_loss": -26.51836585998535, "global_step": 418002, "epoch": 5036} {"train_loss": -26.585224151611328, "global_step": 418003, "epoch": 5036} {"train_loss": -26.679452896118164, "global_step": 418004, "epoch": 5036} {"train_loss": -26.31290626525879, "global_step": 418005, "epoch": 5036} {"train_loss": -26.430591583251953, "global_step": 418006, "epoch": 5036} {"train_loss": -26.9419002532959, "global_step": 418007, "epoch": 5036} {"train_loss": -26.822315216064453, "global_step": 418008, "epoch": 5036} {"train_loss": -26.617944717407227, "global_step": 418009, "epoch": 5036} {"train_loss": -27.043481826782227, "global_step": 418010, "epoch": 5036} {"train_loss": -26.796600341796875, "global_step": 418011, "epoch": 5036} {"train_loss": -26.412363052368164, "global_step": 418012, "epoch": 5036} {"train_loss": -26.992216110229492, "global_step": 418013, "epoch": 5036} {"train_loss": -26.44025230407715, "global_step": 418014, "epoch": 5036} {"train_loss": -27.04256248474121, "global_step": 418015, "epoch": 5036} {"train_loss": -26.91373634338379, "global_step": 418016, "epoch": 5036} {"train_loss": -26.596548080444336, "global_step": 418017, "epoch": 5036} {"train_loss": -26.97645378112793, "global_step": 418018, "epoch": 5036} {"train_loss": -26.58302879333496, "global_step": 418019, "epoch": 5036} {"train_loss": -26.492467880249023, "global_step": 418020, "epoch": 5036} {"train_loss": -27.022886276245117, "global_step": 418021, "epoch": 5036} {"train_loss": -26.826635360717773, "global_step": 418022, "epoch": 5036} {"train_loss": -27.048913955688477, "global_step": 418023, "epoch": 5036} {"train_loss": -26.859296798706055, "global_step": 418024, "epoch": 5036} {"train_loss": -26.98138427734375, "global_step": 418025, "epoch": 5036} {"train_loss": -26.87451171875, "global_step": 418026, "epoch": 5036} {"train_loss": -27.047876358032227, "global_step": 418027, "epoch": 5036} {"train_loss": -26.797510147094727, "global_step": 418028, "epoch": 5036} {"train_loss": -26.74846839904785, "global_step": 418029, "epoch": 5036} {"train_loss": -26.70414161682129, "global_step": 418030, "epoch": 5036} {"train_loss": -26.61063003540039, "global_step": 418031, "epoch": 5036} {"train_loss": -26.652021408081055, "global_step": 418032, "epoch": 5036} {"train_loss": -26.535099029541016, "global_step": 418033, "epoch": 5036} {"train_loss": -26.570920944213867, "global_step": 418034, "epoch": 5036} {"train_loss": -27.105024337768555, "global_step": 418035, "epoch": 5036} {"train_loss": -26.804101943969727, "global_step": 418036, "epoch": 5036} {"train_loss": -26.7087459564209, "global_step": 418037, "epoch": 5036} {"train_loss": -27.068395614624023, "global_step": 418038, "epoch": 5036} {"train_loss": -26.065473556518555, "global_step": 418039, "epoch": 5036} {"train_loss": -26.101581573486328, "global_step": 418040, "epoch": 5036} {"train_loss": -26.630069732666016, "global_step": 418041, "epoch": 5036} {"train_loss": -26.731428146362305, "global_step": 418042, "epoch": 5036} {"train_loss": -26.6029052734375, "global_step": 418043, "epoch": 5036} {"train_loss": -26.57623291015625, "global_step": 418044, "epoch": 5036} {"train_loss": -26.402088165283203, "global_step": 418045, "epoch": 5036} {"train_loss": -26.746601104736328, "global_step": 418046, "epoch": 5036} {"train_loss": -26.7657470703125, "global_step": 418047, "epoch": 5036} {"train_loss": -26.487173080444336, "global_step": 418048, "epoch": 5036} {"train_loss": -26.6119327545166, "global_step": 418049, "epoch": 5036} {"train_loss": -26.871545791625977, "global_step": 418050, "epoch": 5036} {"train_loss": -26.65939712524414, "global_step": 418051, "epoch": 5036} {"train_loss": -26.42414665222168, "global_step": 418052, "epoch": 5036} {"train_loss": -27.153867721557617, "global_step": 418053, "epoch": 5036} {"train_loss": -26.61178970336914, "global_step": 418054, "epoch": 5036} {"train_loss": -26.819229125976562, "global_step": 418055, "epoch": 5036} {"train_loss": -27.00587272644043, "global_step": 418056, "epoch": 5036} {"train_loss": -26.55118751525879, "global_step": 418057, "epoch": 5036} {"train_loss": -26.689788818359375, "global_step": 418058, "epoch": 5036} {"train_loss": -26.894256591796875, "global_step": 418059, "epoch": 5036} {"train_loss": -26.897226333618164, "global_step": 418060, "epoch": 5036} {"train_loss": -27.063501358032227, "global_step": 418061, "epoch": 5036} {"train_loss": -27.08563232421875, "global_step": 418062, "epoch": 5036} {"train_loss": -26.693317413330078, "global_step": 418063, "epoch": 5036} {"train_loss": -27.0522518157959, "global_step": 418064, "epoch": 5036} {"train_loss": -26.91900062561035, "global_step": 418065, "epoch": 5036} {"train_loss": -26.89206314086914, "global_step": 418066, "epoch": 5036} {"train_loss": -26.878631591796875, "global_step": 418067, "epoch": 5036} {"train_loss": -27.2401180267334, "global_step": 418068, "epoch": 5036} {"train_loss": -27.04802894592285, "global_step": 418069, "epoch": 5036} {"train_loss": -26.711834436439606, "global_step": 418070, "epoch": 5036, "val_loss": 6756141.0} {"train_loss": -26.4038143157959, "global_step": 418071, "epoch": 5037} {"train_loss": -25.6203670501709, "global_step": 418072, "epoch": 5037} {"train_loss": -23.527183532714844, "global_step": 418073, "epoch": 5037} {"train_loss": -22.82351303100586, "global_step": 418074, "epoch": 5037} {"train_loss": -25.98878288269043, "global_step": 418075, "epoch": 5037} {"train_loss": -25.06424331665039, "global_step": 418076, "epoch": 5037} {"train_loss": -25.046167373657227, "global_step": 418077, "epoch": 5037} {"train_loss": -25.18916130065918, "global_step": 418078, "epoch": 5037} {"train_loss": -25.795434951782227, "global_step": 418079, "epoch": 5037} {"train_loss": -25.13374137878418, "global_step": 418080, "epoch": 5037} {"train_loss": -26.13368034362793, "global_step": 418081, "epoch": 5037} {"train_loss": -26.029218673706055, "global_step": 418082, "epoch": 5037} {"train_loss": -25.451696395874023, "global_step": 418083, "epoch": 5037} {"train_loss": -25.945755004882812, "global_step": 418084, "epoch": 5037} {"train_loss": -26.097915649414062, "global_step": 418085, "epoch": 5037} {"train_loss": -26.04340934753418, "global_step": 418086, "epoch": 5037} {"train_loss": -25.879825592041016, "global_step": 418087, "epoch": 5037} {"train_loss": -26.252859115600586, "global_step": 418088, "epoch": 5037} {"train_loss": -26.03028678894043, "global_step": 418089, "epoch": 5037} {"train_loss": -26.315631866455078, "global_step": 418090, "epoch": 5037} {"train_loss": -25.91110610961914, "global_step": 418091, "epoch": 5037} {"train_loss": -26.71346092224121, "global_step": 418092, "epoch": 5037} {"train_loss": -26.375242233276367, "global_step": 418093, "epoch": 5037} {"train_loss": -25.870412826538086, "global_step": 418094, "epoch": 5037} {"train_loss": -26.447742462158203, "global_step": 418095, "epoch": 5037} {"train_loss": -26.094985961914062, "global_step": 418096, "epoch": 5037} {"train_loss": -25.881567001342773, "global_step": 418097, "epoch": 5037} {"train_loss": -26.52272605895996, "global_step": 418098, "epoch": 5037} {"train_loss": -26.574432373046875, "global_step": 418099, "epoch": 5037} {"train_loss": -26.386402130126953, "global_step": 418100, "epoch": 5037} {"train_loss": -26.723920822143555, "global_step": 418101, "epoch": 5037} {"train_loss": -26.182031631469727, "global_step": 418102, "epoch": 5037} {"train_loss": -26.502172470092773, "global_step": 418103, "epoch": 5037} {"train_loss": -26.649438858032227, "global_step": 418104, "epoch": 5037} {"train_loss": -26.431873321533203, "global_step": 418105, "epoch": 5037} {"train_loss": -26.80012321472168, "global_step": 418106, "epoch": 5037} {"train_loss": -26.2486515045166, "global_step": 418107, "epoch": 5037} {"train_loss": -26.544336318969727, "global_step": 418108, "epoch": 5037} {"train_loss": -26.226795196533203, "global_step": 418109, "epoch": 5037} {"train_loss": -26.572473526000977, "global_step": 418110, "epoch": 5037} {"train_loss": -26.456567764282227, "global_step": 418111, "epoch": 5037} {"train_loss": -26.154077529907227, "global_step": 418112, "epoch": 5037} {"train_loss": -26.404001235961914, "global_step": 418113, "epoch": 5037} {"train_loss": -26.8256893157959, "global_step": 418114, "epoch": 5037} {"train_loss": -26.637094497680664, "global_step": 418115, "epoch": 5037} {"train_loss": -26.1883544921875, "global_step": 418116, "epoch": 5037} {"train_loss": -26.292285919189453, "global_step": 418117, "epoch": 5037} {"train_loss": -26.661020278930664, "global_step": 418118, "epoch": 5037} {"train_loss": -26.52058219909668, "global_step": 418119, "epoch": 5037} {"train_loss": -26.80194664001465, "global_step": 418120, "epoch": 5037} {"train_loss": -26.72151756286621, "global_step": 418121, "epoch": 5037} {"train_loss": -26.64142417907715, "global_step": 418122, "epoch": 5037} {"train_loss": -26.655261993408203, "global_step": 418123, "epoch": 5037} {"train_loss": -26.566980361938477, "global_step": 418124, "epoch": 5037} {"train_loss": -26.884580612182617, "global_step": 418125, "epoch": 5037} {"train_loss": -27.123489379882812, "global_step": 418126, "epoch": 5037} {"train_loss": -26.876087188720703, "global_step": 418127, "epoch": 5037} {"train_loss": -26.873126983642578, "global_step": 418128, "epoch": 5037} {"train_loss": -26.81769371032715, "global_step": 418129, "epoch": 5037} {"train_loss": -26.911212921142578, "global_step": 418130, "epoch": 5037} {"train_loss": -27.07757568359375, "global_step": 418131, "epoch": 5037} {"train_loss": -26.853912353515625, "global_step": 418132, "epoch": 5037} {"train_loss": -26.984846115112305, "global_step": 418133, "epoch": 5037} {"train_loss": -27.019346237182617, "global_step": 418134, "epoch": 5037} {"train_loss": -26.672658920288086, "global_step": 418135, "epoch": 5037} {"train_loss": -26.90851402282715, "global_step": 418136, "epoch": 5037} {"train_loss": -26.601831436157227, "global_step": 418137, "epoch": 5037} {"train_loss": -26.803485870361328, "global_step": 418138, "epoch": 5037} {"train_loss": -26.501081466674805, "global_step": 418139, "epoch": 5037} {"train_loss": -26.842519760131836, "global_step": 418140, "epoch": 5037} {"train_loss": -27.138158798217773, "global_step": 418141, "epoch": 5037} {"train_loss": -27.030248641967773, "global_step": 418142, "epoch": 5037} {"train_loss": -26.742094039916992, "global_step": 418143, "epoch": 5037} {"train_loss": -26.74665641784668, "global_step": 418144, "epoch": 5037} {"train_loss": -26.875574111938477, "global_step": 418145, "epoch": 5037} {"train_loss": -27.208303451538086, "global_step": 418146, "epoch": 5037} {"train_loss": -26.81903648376465, "global_step": 418147, "epoch": 5037} {"train_loss": -26.535831451416016, "global_step": 418148, "epoch": 5037} {"train_loss": -25.960554122924805, "global_step": 418149, "epoch": 5037} {"train_loss": -26.706501007080078, "global_step": 418150, "epoch": 5037} {"train_loss": -26.25922203063965, "global_step": 418151, "epoch": 5037} {"train_loss": -26.651596069335938, "global_step": 418152, "epoch": 5037} {"train_loss": -26.3661719632436, "global_step": 418153, "epoch": 5037, "val_loss": 6887290.0} {"train_loss": -25.876611709594727, "global_step": 418154, "epoch": 5038} {"train_loss": -26.447895050048828, "global_step": 418155, "epoch": 5038} {"train_loss": -26.345687866210938, "global_step": 418156, "epoch": 5038} {"train_loss": -26.48213005065918, "global_step": 418157, "epoch": 5038} {"train_loss": -26.528366088867188, "global_step": 418158, "epoch": 5038} {"train_loss": -26.522815704345703, "global_step": 418159, "epoch": 5038} {"train_loss": -26.7178955078125, "global_step": 418160, "epoch": 5038} {"train_loss": -26.60869789123535, "global_step": 418161, "epoch": 5038} {"train_loss": -26.284912109375, "global_step": 418162, "epoch": 5038} {"train_loss": -26.361865997314453, "global_step": 418163, "epoch": 5038} {"train_loss": -26.870046615600586, "global_step": 418164, "epoch": 5038} {"train_loss": -26.38941764831543, "global_step": 418165, "epoch": 5038} {"train_loss": -26.799671173095703, "global_step": 418166, "epoch": 5038} {"train_loss": -26.591983795166016, "global_step": 418167, "epoch": 5038} {"train_loss": -26.84250259399414, "global_step": 418168, "epoch": 5038} {"train_loss": -26.76456642150879, "global_step": 418169, "epoch": 5038} {"train_loss": -26.90720558166504, "global_step": 418170, "epoch": 5038} {"train_loss": -26.59332847595215, "global_step": 418171, "epoch": 5038} {"train_loss": -26.996021270751953, "global_step": 418172, "epoch": 5038} {"train_loss": -26.879003524780273, "global_step": 418173, "epoch": 5038} {"train_loss": -26.61187171936035, "global_step": 418174, "epoch": 5038} {"train_loss": -26.800565719604492, "global_step": 418175, "epoch": 5038} {"train_loss": -27.273834228515625, "global_step": 418176, "epoch": 5038} {"train_loss": -26.492944717407227, "global_step": 418177, "epoch": 5038} {"train_loss": -26.94154167175293, "global_step": 418178, "epoch": 5038} {"train_loss": -26.771682739257812, "global_step": 418179, "epoch": 5038} {"train_loss": -26.833465576171875, "global_step": 418180, "epoch": 5038} {"train_loss": -27.261890411376953, "global_step": 418181, "epoch": 5038} {"train_loss": -27.050704956054688, "global_step": 418182, "epoch": 5038} {"train_loss": -26.469858169555664, "global_step": 418183, "epoch": 5038} {"train_loss": -27.196273803710938, "global_step": 418184, "epoch": 5038} {"train_loss": -26.993558883666992, "global_step": 418185, "epoch": 5038} {"train_loss": -26.996749877929688, "global_step": 418186, "epoch": 5038} {"train_loss": -26.885486602783203, "global_step": 418187, "epoch": 5038} {"train_loss": -26.73323631286621, "global_step": 418188, "epoch": 5038} {"train_loss": -26.510852813720703, "global_step": 418189, "epoch": 5038} {"train_loss": -26.42384147644043, "global_step": 418190, "epoch": 5038} {"train_loss": -26.639514923095703, "global_step": 418191, "epoch": 5038} {"train_loss": -26.94608497619629, "global_step": 418192, "epoch": 5038} {"train_loss": -27.0272159576416, "global_step": 418193, "epoch": 5038} {"train_loss": -27.09490966796875, "global_step": 418194, "epoch": 5038} {"train_loss": -26.830053329467773, "global_step": 418195, "epoch": 5038} {"train_loss": -26.818344116210938, "global_step": 418196, "epoch": 5038} {"train_loss": -26.843801498413086, "global_step": 418197, "epoch": 5038} {"train_loss": -26.964963912963867, "global_step": 418198, "epoch": 5038} {"train_loss": -26.689224243164062, "global_step": 418199, "epoch": 5038} {"train_loss": -26.826190948486328, "global_step": 418200, "epoch": 5038} {"train_loss": -27.18061637878418, "global_step": 418201, "epoch": 5038} {"train_loss": -26.875019073486328, "global_step": 418202, "epoch": 5038} {"train_loss": -26.7636661529541, "global_step": 418203, "epoch": 5038} {"train_loss": -27.232370376586914, "global_step": 418204, "epoch": 5038} {"train_loss": -26.60761070251465, "global_step": 418205, "epoch": 5038} {"train_loss": -26.683515548706055, "global_step": 418206, "epoch": 5038} {"train_loss": -26.823217391967773, "global_step": 418207, "epoch": 5038} {"train_loss": -26.545257568359375, "global_step": 418208, "epoch": 5038} {"train_loss": -26.985523223876953, "global_step": 418209, "epoch": 5038} {"train_loss": -26.612884521484375, "global_step": 418210, "epoch": 5038} {"train_loss": -26.326263427734375, "global_step": 418211, "epoch": 5038} {"train_loss": -26.6666316986084, "global_step": 418212, "epoch": 5038} {"train_loss": -26.388580322265625, "global_step": 418213, "epoch": 5038} {"train_loss": -26.492277145385742, "global_step": 418214, "epoch": 5038} {"train_loss": -26.8305606842041, "global_step": 418215, "epoch": 5038} {"train_loss": -26.353479385375977, "global_step": 418216, "epoch": 5038} {"train_loss": -26.586139678955078, "global_step": 418217, "epoch": 5038} {"train_loss": -26.859189987182617, "global_step": 418218, "epoch": 5038} {"train_loss": -26.411468505859375, "global_step": 418219, "epoch": 5038} {"train_loss": -26.487823486328125, "global_step": 418220, "epoch": 5038} {"train_loss": -27.0261287689209, "global_step": 418221, "epoch": 5038} {"train_loss": -26.061750411987305, "global_step": 418222, "epoch": 5038} {"train_loss": -26.845401763916016, "global_step": 418223, "epoch": 5038} {"train_loss": -26.23175048828125, "global_step": 418224, "epoch": 5038} {"train_loss": -26.553922653198242, "global_step": 418225, "epoch": 5038} {"train_loss": -26.71283531188965, "global_step": 418226, "epoch": 5038} {"train_loss": -26.427087783813477, "global_step": 418227, "epoch": 5038} {"train_loss": -26.54878044128418, "global_step": 418228, "epoch": 5038} {"train_loss": -26.46539878845215, "global_step": 418229, "epoch": 5038} {"train_loss": -26.409093856811523, "global_step": 418230, "epoch": 5038} {"train_loss": -26.628400802612305, "global_step": 418231, "epoch": 5038} {"train_loss": -26.80103874206543, "global_step": 418232, "epoch": 5038} {"train_loss": -26.44428825378418, "global_step": 418233, "epoch": 5038} {"train_loss": -26.87082862854004, "global_step": 418234, "epoch": 5038} {"train_loss": -26.984088897705078, "global_step": 418235, "epoch": 5038} {"train_loss": -26.713160181620037, "global_step": 418236, "epoch": 5038, "val_loss": 6871104.0} {"train_loss": -26.78260612487793, "global_step": 418237, "epoch": 5039} {"train_loss": -26.905323028564453, "global_step": 418238, "epoch": 5039} {"train_loss": -26.34734535217285, "global_step": 418239, "epoch": 5039} {"train_loss": -26.920978546142578, "global_step": 418240, "epoch": 5039} {"train_loss": -26.86872673034668, "global_step": 418241, "epoch": 5039} {"train_loss": -26.55315589904785, "global_step": 418242, "epoch": 5039} {"train_loss": -26.71766471862793, "global_step": 418243, "epoch": 5039} {"train_loss": -26.52558708190918, "global_step": 418244, "epoch": 5039} {"train_loss": -27.09071922302246, "global_step": 418245, "epoch": 5039} {"train_loss": -27.24013328552246, "global_step": 418246, "epoch": 5039} {"train_loss": -27.0887451171875, "global_step": 418247, "epoch": 5039} {"train_loss": -26.64593505859375, "global_step": 418248, "epoch": 5039} {"train_loss": -27.13144302368164, "global_step": 418249, "epoch": 5039} {"train_loss": -26.593647003173828, "global_step": 418250, "epoch": 5039} {"train_loss": -26.759546279907227, "global_step": 418251, "epoch": 5039} {"train_loss": -26.528186798095703, "global_step": 418252, "epoch": 5039} {"train_loss": -26.784931182861328, "global_step": 418253, "epoch": 5039} {"train_loss": -27.129901885986328, "global_step": 418254, "epoch": 5039} {"train_loss": -26.631139755249023, "global_step": 418255, "epoch": 5039} {"train_loss": -26.744115829467773, "global_step": 418256, "epoch": 5039} {"train_loss": -26.836196899414062, "global_step": 418257, "epoch": 5039} {"train_loss": -26.59798240661621, "global_step": 418258, "epoch": 5039} {"train_loss": -26.669095993041992, "global_step": 418259, "epoch": 5039} {"train_loss": -27.057653427124023, "global_step": 418260, "epoch": 5039} {"train_loss": -27.127307891845703, "global_step": 418261, "epoch": 5039} {"train_loss": -26.94783592224121, "global_step": 418262, "epoch": 5039} {"train_loss": -27.020849227905273, "global_step": 418263, "epoch": 5039} {"train_loss": -26.66672706604004, "global_step": 418264, "epoch": 5039} {"train_loss": -26.940555572509766, "global_step": 418265, "epoch": 5039} {"train_loss": -27.212299346923828, "global_step": 418266, "epoch": 5039} {"train_loss": -26.810400009155273, "global_step": 418267, "epoch": 5039} {"train_loss": -27.05777359008789, "global_step": 418268, "epoch": 5039} {"train_loss": -26.8463134765625, "global_step": 418269, "epoch": 5039} {"train_loss": -27.15372085571289, "global_step": 418270, "epoch": 5039} {"train_loss": -26.787351608276367, "global_step": 418271, "epoch": 5039} {"train_loss": -26.89607048034668, "global_step": 418272, "epoch": 5039} {"train_loss": -27.0311222076416, "global_step": 418273, "epoch": 5039} {"train_loss": -26.90191078186035, "global_step": 418274, "epoch": 5039} {"train_loss": -26.885608673095703, "global_step": 418275, "epoch": 5039} {"train_loss": -27.22371482849121, "global_step": 418276, "epoch": 5039} {"train_loss": -26.860483169555664, "global_step": 418277, "epoch": 5039} {"train_loss": -26.93898582458496, "global_step": 418278, "epoch": 5039} {"train_loss": -27.09278678894043, "global_step": 418279, "epoch": 5039} {"train_loss": -26.808969497680664, "global_step": 418280, "epoch": 5039} {"train_loss": -26.952234268188477, "global_step": 418281, "epoch": 5039} {"train_loss": -26.706104278564453, "global_step": 418282, "epoch": 5039} {"train_loss": -26.92010498046875, "global_step": 418283, "epoch": 5039} {"train_loss": -26.679983139038086, "global_step": 418284, "epoch": 5039} {"train_loss": -26.71237564086914, "global_step": 418285, "epoch": 5039} {"train_loss": -26.840742111206055, "global_step": 418286, "epoch": 5039} {"train_loss": -26.75213050842285, "global_step": 418287, "epoch": 5039} {"train_loss": -27.014190673828125, "global_step": 418288, "epoch": 5039} {"train_loss": -26.647205352783203, "global_step": 418289, "epoch": 5039} {"train_loss": -26.932199478149414, "global_step": 418290, "epoch": 5039} {"train_loss": -26.326202392578125, "global_step": 418291, "epoch": 5039} {"train_loss": -25.961811065673828, "global_step": 418292, "epoch": 5039} {"train_loss": -26.522302627563477, "global_step": 418293, "epoch": 5039} {"train_loss": -26.605504989624023, "global_step": 418294, "epoch": 5039} {"train_loss": -26.713855743408203, "global_step": 418295, "epoch": 5039} {"train_loss": -26.424518585205078, "global_step": 418296, "epoch": 5039} {"train_loss": -26.375356674194336, "global_step": 418297, "epoch": 5039} {"train_loss": -26.66669273376465, "global_step": 418298, "epoch": 5039} {"train_loss": -26.828317642211914, "global_step": 418299, "epoch": 5039} {"train_loss": -26.049131393432617, "global_step": 418300, "epoch": 5039} {"train_loss": -26.874433517456055, "global_step": 418301, "epoch": 5039} {"train_loss": -27.03271484375, "global_step": 418302, "epoch": 5039} {"train_loss": -26.614103317260742, "global_step": 418303, "epoch": 5039} {"train_loss": -27.043485641479492, "global_step": 418304, "epoch": 5039} {"train_loss": -26.691190719604492, "global_step": 418305, "epoch": 5039} {"train_loss": -26.773183822631836, "global_step": 418306, "epoch": 5039} {"train_loss": -26.544269561767578, "global_step": 418307, "epoch": 5039} {"train_loss": -26.81373405456543, "global_step": 418308, "epoch": 5039} {"train_loss": -26.64832878112793, "global_step": 418309, "epoch": 5039} {"train_loss": -26.443891525268555, "global_step": 418310, "epoch": 5039} {"train_loss": -26.60833168029785, "global_step": 418311, "epoch": 5039} {"train_loss": -26.00701332092285, "global_step": 418312, "epoch": 5039} {"train_loss": -26.593734741210938, "global_step": 418313, "epoch": 5039} {"train_loss": -26.781530380249023, "global_step": 418314, "epoch": 5039} {"train_loss": -26.67597007751465, "global_step": 418315, "epoch": 5039} {"train_loss": -26.614709854125977, "global_step": 418316, "epoch": 5039} {"train_loss": -26.698169708251953, "global_step": 418317, "epoch": 5039} {"train_loss": -26.95562744140625, "global_step": 418318, "epoch": 5039} {"train_loss": -26.770430461469903, "global_step": 418319, "epoch": 5039, "val_loss": 6919476.0} {"train_loss": -26.538930892944336, "global_step": 418320, "epoch": 5040} {"train_loss": -26.33328628540039, "global_step": 418321, "epoch": 5040} {"train_loss": -25.896045684814453, "global_step": 418322, "epoch": 5040} {"train_loss": -26.484643936157227, "global_step": 418323, "epoch": 5040} {"train_loss": -26.511672973632812, "global_step": 418324, "epoch": 5040} {"train_loss": -26.398340225219727, "global_step": 418325, "epoch": 5040} {"train_loss": -26.59822654724121, "global_step": 418326, "epoch": 5040} {"train_loss": -26.812301635742188, "global_step": 418327, "epoch": 5040} {"train_loss": -26.081012725830078, "global_step": 418328, "epoch": 5040} {"train_loss": -26.5997314453125, "global_step": 418329, "epoch": 5040} {"train_loss": -26.79524040222168, "global_step": 418330, "epoch": 5040} {"train_loss": -26.53443717956543, "global_step": 418331, "epoch": 5040} {"train_loss": -26.4981689453125, "global_step": 418332, "epoch": 5040} {"train_loss": -26.313257217407227, "global_step": 418333, "epoch": 5040} {"train_loss": -26.83668327331543, "global_step": 418334, "epoch": 5040} {"train_loss": -26.261474609375, "global_step": 418335, "epoch": 5040} {"train_loss": -26.8124942779541, "global_step": 418336, "epoch": 5040} {"train_loss": -26.37030601501465, "global_step": 418337, "epoch": 5040} {"train_loss": -26.403884887695312, "global_step": 418338, "epoch": 5040} {"train_loss": -26.513702392578125, "global_step": 418339, "epoch": 5040} {"train_loss": -26.160993576049805, "global_step": 418340, "epoch": 5040} {"train_loss": -26.7257137298584, "global_step": 418341, "epoch": 5040} {"train_loss": -26.439697265625, "global_step": 418342, "epoch": 5040} {"train_loss": -26.720178604125977, "global_step": 418343, "epoch": 5040} {"train_loss": -26.94422721862793, "global_step": 418344, "epoch": 5040} {"train_loss": -26.956228256225586, "global_step": 418345, "epoch": 5040} {"train_loss": -26.7608642578125, "global_step": 418346, "epoch": 5040} {"train_loss": -26.53596305847168, "global_step": 418347, "epoch": 5040} {"train_loss": -26.84971046447754, "global_step": 418348, "epoch": 5040} {"train_loss": -27.00852394104004, "global_step": 418349, "epoch": 5040} {"train_loss": -26.513065338134766, "global_step": 418350, "epoch": 5040} {"train_loss": -26.46759033203125, "global_step": 418351, "epoch": 5040} {"train_loss": -26.87436294555664, "global_step": 418352, "epoch": 5040} {"train_loss": -26.72871971130371, "global_step": 418353, "epoch": 5040} {"train_loss": -27.112808227539062, "global_step": 418354, "epoch": 5040} {"train_loss": -26.777755737304688, "global_step": 418355, "epoch": 5040} {"train_loss": -26.72149085998535, "global_step": 418356, "epoch": 5040} {"train_loss": -26.889850616455078, "global_step": 418357, "epoch": 5040} {"train_loss": -27.0102596282959, "global_step": 418358, "epoch": 5040} {"train_loss": -26.7779598236084, "global_step": 418359, "epoch": 5040} {"train_loss": -26.919275283813477, "global_step": 418360, "epoch": 5040} {"train_loss": -26.74580955505371, "global_step": 418361, "epoch": 5040} {"train_loss": -26.440967559814453, "global_step": 418362, "epoch": 5040} {"train_loss": -26.534574508666992, "global_step": 418363, "epoch": 5040} {"train_loss": -26.36146354675293, "global_step": 418364, "epoch": 5040} {"train_loss": -27.102313995361328, "global_step": 418365, "epoch": 5040} {"train_loss": -26.97052001953125, "global_step": 418366, "epoch": 5040} {"train_loss": -27.195768356323242, "global_step": 418367, "epoch": 5040} {"train_loss": -26.915006637573242, "global_step": 418368, "epoch": 5040} {"train_loss": -26.843006134033203, "global_step": 418369, "epoch": 5040} {"train_loss": -26.53810691833496, "global_step": 418370, "epoch": 5040} {"train_loss": -26.9149112701416, "global_step": 418371, "epoch": 5040} {"train_loss": -26.731298446655273, "global_step": 418372, "epoch": 5040} {"train_loss": -26.77509117126465, "global_step": 418373, "epoch": 5040} {"train_loss": -26.635009765625, "global_step": 418374, "epoch": 5040} {"train_loss": -26.56793212890625, "global_step": 418375, "epoch": 5040} {"train_loss": -27.147443771362305, "global_step": 418376, "epoch": 5040} {"train_loss": -27.198484420776367, "global_step": 418377, "epoch": 5040} {"train_loss": -26.80141258239746, "global_step": 418378, "epoch": 5040} {"train_loss": -26.894887924194336, "global_step": 418379, "epoch": 5040} {"train_loss": -27.343280792236328, "global_step": 418380, "epoch": 5040} {"train_loss": -27.083341598510742, "global_step": 418381, "epoch": 5040} {"train_loss": -26.98456382751465, "global_step": 418382, "epoch": 5040} {"train_loss": -27.06585121154785, "global_step": 418383, "epoch": 5040} {"train_loss": -27.361860275268555, "global_step": 418384, "epoch": 5040} {"train_loss": -26.886096954345703, "global_step": 418385, "epoch": 5040} {"train_loss": -26.91106605529785, "global_step": 418386, "epoch": 5040} {"train_loss": -26.801589965820312, "global_step": 418387, "epoch": 5040} {"train_loss": -26.979907989501953, "global_step": 418388, "epoch": 5040} {"train_loss": -26.847354888916016, "global_step": 418389, "epoch": 5040} {"train_loss": -27.112348556518555, "global_step": 418390, "epoch": 5040} {"train_loss": -26.921859741210938, "global_step": 418391, "epoch": 5040} {"train_loss": -26.773889541625977, "global_step": 418392, "epoch": 5040} {"train_loss": -26.616491317749023, "global_step": 418393, "epoch": 5040} {"train_loss": -26.295324325561523, "global_step": 418394, "epoch": 5040} {"train_loss": -26.492483139038086, "global_step": 418395, "epoch": 5040} {"train_loss": -26.72332191467285, "global_step": 418396, "epoch": 5040} {"train_loss": -26.70026206970215, "global_step": 418397, "epoch": 5040} {"train_loss": -26.841644287109375, "global_step": 418398, "epoch": 5040} {"train_loss": -27.02263832092285, "global_step": 418399, "epoch": 5040} {"train_loss": -26.6735782623291, "global_step": 418400, "epoch": 5040} {"train_loss": -26.7943172454834, "global_step": 418401, "epoch": 5040} {"train_loss": -26.72042757057282, "global_step": 418402, "epoch": 5040, "val_loss": 6926833.0} {"train_loss": -26.7039794921875, "global_step": 418403, "epoch": 5041} {"train_loss": -26.17874526977539, "global_step": 418404, "epoch": 5041} {"train_loss": -26.00813102722168, "global_step": 418405, "epoch": 5041} {"train_loss": -26.301420211791992, "global_step": 418406, "epoch": 5041} {"train_loss": -26.659231185913086, "global_step": 418407, "epoch": 5041} {"train_loss": -26.188215255737305, "global_step": 418408, "epoch": 5041} {"train_loss": -26.191247940063477, "global_step": 418409, "epoch": 5041} {"train_loss": -26.070087432861328, "global_step": 418410, "epoch": 5041} {"train_loss": -25.909276962280273, "global_step": 418411, "epoch": 5041} {"train_loss": -26.331159591674805, "global_step": 418412, "epoch": 5041} {"train_loss": -26.491064071655273, "global_step": 418413, "epoch": 5041} {"train_loss": -26.54908561706543, "global_step": 418414, "epoch": 5041} {"train_loss": -26.250730514526367, "global_step": 418415, "epoch": 5041} {"train_loss": -26.552152633666992, "global_step": 418416, "epoch": 5041} {"train_loss": -26.85780143737793, "global_step": 418417, "epoch": 5041} {"train_loss": -26.40598487854004, "global_step": 418418, "epoch": 5041} {"train_loss": -26.260717391967773, "global_step": 418419, "epoch": 5041} {"train_loss": -26.158971786499023, "global_step": 418420, "epoch": 5041} {"train_loss": -26.453405380249023, "global_step": 418421, "epoch": 5041} {"train_loss": -26.529632568359375, "global_step": 418422, "epoch": 5041} {"train_loss": -26.756818771362305, "global_step": 418423, "epoch": 5041} {"train_loss": -26.41261100769043, "global_step": 418424, "epoch": 5041} {"train_loss": -26.913867950439453, "global_step": 418425, "epoch": 5041} {"train_loss": -26.690143585205078, "global_step": 418426, "epoch": 5041} {"train_loss": -26.833820343017578, "global_step": 418427, "epoch": 5041} {"train_loss": -26.319982528686523, "global_step": 418428, "epoch": 5041} {"train_loss": -26.5579776763916, "global_step": 418429, "epoch": 5041} {"train_loss": -26.7365779876709, "global_step": 418430, "epoch": 5041} {"train_loss": -26.520538330078125, "global_step": 418431, "epoch": 5041} {"train_loss": -26.894485473632812, "global_step": 418432, "epoch": 5041} {"train_loss": -26.993701934814453, "global_step": 418433, "epoch": 5041} {"train_loss": -26.655027389526367, "global_step": 418434, "epoch": 5041} {"train_loss": -26.781265258789062, "global_step": 418435, "epoch": 5041} {"train_loss": -26.648038864135742, "global_step": 418436, "epoch": 5041} {"train_loss": -26.693042755126953, "global_step": 418437, "epoch": 5041} {"train_loss": -26.65827751159668, "global_step": 418438, "epoch": 5041} {"train_loss": -26.665632247924805, "global_step": 418439, "epoch": 5041} {"train_loss": -26.698017120361328, "global_step": 418440, "epoch": 5041} {"train_loss": -26.664764404296875, "global_step": 418441, "epoch": 5041} {"train_loss": -26.687463760375977, "global_step": 418442, "epoch": 5041} {"train_loss": -26.78875732421875, "global_step": 418443, "epoch": 5041} {"train_loss": -26.703149795532227, "global_step": 418444, "epoch": 5041} {"train_loss": -26.884906768798828, "global_step": 418445, "epoch": 5041} {"train_loss": -26.969762802124023, "global_step": 418446, "epoch": 5041} {"train_loss": -26.745656967163086, "global_step": 418447, "epoch": 5041} {"train_loss": -26.479795455932617, "global_step": 418448, "epoch": 5041} {"train_loss": -26.596548080444336, "global_step": 418449, "epoch": 5041} {"train_loss": -26.74761962890625, "global_step": 418450, "epoch": 5041} {"train_loss": -27.100299835205078, "global_step": 418451, "epoch": 5041} {"train_loss": -26.6683349609375, "global_step": 418452, "epoch": 5041} {"train_loss": -26.42359733581543, "global_step": 418453, "epoch": 5041} {"train_loss": -26.747283935546875, "global_step": 418454, "epoch": 5041} {"train_loss": -26.921161651611328, "global_step": 418455, "epoch": 5041} {"train_loss": -26.426513671875, "global_step": 418456, "epoch": 5041} {"train_loss": -27.0545654296875, "global_step": 418457, "epoch": 5041} {"train_loss": -26.7203311920166, "global_step": 418458, "epoch": 5041} {"train_loss": -26.368249893188477, "global_step": 418459, "epoch": 5041} {"train_loss": -26.865575790405273, "global_step": 418460, "epoch": 5041} {"train_loss": -26.64715003967285, "global_step": 418461, "epoch": 5041} {"train_loss": -26.605987548828125, "global_step": 418462, "epoch": 5041} {"train_loss": -26.993316650390625, "global_step": 418463, "epoch": 5041} {"train_loss": -26.718542098999023, "global_step": 418464, "epoch": 5041} {"train_loss": -26.979373931884766, "global_step": 418465, "epoch": 5041} {"train_loss": -26.632923126220703, "global_step": 418466, "epoch": 5041} {"train_loss": -26.975513458251953, "global_step": 418467, "epoch": 5041} {"train_loss": -26.75193214416504, "global_step": 418468, "epoch": 5041} {"train_loss": -26.71390724182129, "global_step": 418469, "epoch": 5041} {"train_loss": -26.788217544555664, "global_step": 418470, "epoch": 5041} {"train_loss": -26.904953002929688, "global_step": 418471, "epoch": 5041} {"train_loss": -26.72464370727539, "global_step": 418472, "epoch": 5041} {"train_loss": -26.520605087280273, "global_step": 418473, "epoch": 5041} {"train_loss": -26.81833839416504, "global_step": 418474, "epoch": 5041} {"train_loss": -26.499738693237305, "global_step": 418475, "epoch": 5041} {"train_loss": -26.341093063354492, "global_step": 418476, "epoch": 5041} {"train_loss": -26.758710861206055, "global_step": 418477, "epoch": 5041} {"train_loss": -26.91342544555664, "global_step": 418478, "epoch": 5041} {"train_loss": -26.3721981048584, "global_step": 418479, "epoch": 5041} {"train_loss": -26.667322158813477, "global_step": 418480, "epoch": 5041} {"train_loss": -26.76119041442871, "global_step": 418481, "epoch": 5041} {"train_loss": -26.910648345947266, "global_step": 418482, "epoch": 5041} {"train_loss": -26.72760581970215, "global_step": 418483, "epoch": 5041} {"train_loss": -26.829639434814453, "global_step": 418484, "epoch": 5041} {"train_loss": -26.61201619527426, "global_step": 418485, "epoch": 5041, "val_loss": 6978193.0} {"train_loss": -26.222766876220703, "global_step": 418486, "epoch": 5042} {"train_loss": -25.99700355529785, "global_step": 418487, "epoch": 5042} {"train_loss": -26.41645622253418, "global_step": 418488, "epoch": 5042} {"train_loss": -26.609655380249023, "global_step": 418489, "epoch": 5042} {"train_loss": -26.170734405517578, "global_step": 418490, "epoch": 5042} {"train_loss": -26.814847946166992, "global_step": 418491, "epoch": 5042} {"train_loss": -26.619848251342773, "global_step": 418492, "epoch": 5042} {"train_loss": -26.37613868713379, "global_step": 418493, "epoch": 5042} {"train_loss": -26.45575523376465, "global_step": 418494, "epoch": 5042} {"train_loss": -26.471609115600586, "global_step": 418495, "epoch": 5042} {"train_loss": -26.578235626220703, "global_step": 418496, "epoch": 5042} {"train_loss": -26.45734214782715, "global_step": 418497, "epoch": 5042} {"train_loss": -26.59894371032715, "global_step": 418498, "epoch": 5042} {"train_loss": -26.290124893188477, "global_step": 418499, "epoch": 5042} {"train_loss": -26.77411460876465, "global_step": 418500, "epoch": 5042} {"train_loss": -26.629337310791016, "global_step": 418501, "epoch": 5042} {"train_loss": -26.882999420166016, "global_step": 418502, "epoch": 5042} {"train_loss": -26.553335189819336, "global_step": 418503, "epoch": 5042} {"train_loss": -26.824691772460938, "global_step": 418504, "epoch": 5042} {"train_loss": -26.72430419921875, "global_step": 418505, "epoch": 5042} {"train_loss": -26.541950225830078, "global_step": 418506, "epoch": 5042} {"train_loss": -26.870004653930664, "global_step": 418507, "epoch": 5042} {"train_loss": -26.896188735961914, "global_step": 418508, "epoch": 5042} {"train_loss": -26.710363388061523, "global_step": 418509, "epoch": 5042} {"train_loss": -26.81966209411621, "global_step": 418510, "epoch": 5042} {"train_loss": -27.012741088867188, "global_step": 418511, "epoch": 5042} {"train_loss": -26.955625534057617, "global_step": 418512, "epoch": 5042} {"train_loss": -27.043603897094727, "global_step": 418513, "epoch": 5042} {"train_loss": -26.798425674438477, "global_step": 418514, "epoch": 5042} {"train_loss": -26.89910888671875, "global_step": 418515, "epoch": 5042} {"train_loss": -26.672866821289062, "global_step": 418516, "epoch": 5042} {"train_loss": -26.76136589050293, "global_step": 418517, "epoch": 5042} {"train_loss": -26.888004302978516, "global_step": 418518, "epoch": 5042} {"train_loss": -26.90630531311035, "global_step": 418519, "epoch": 5042} {"train_loss": -26.74835205078125, "global_step": 418520, "epoch": 5042} {"train_loss": -26.788000106811523, "global_step": 418521, "epoch": 5042} {"train_loss": -26.89034080505371, "global_step": 418522, "epoch": 5042} {"train_loss": -26.928068161010742, "global_step": 418523, "epoch": 5042} {"train_loss": -26.51242446899414, "global_step": 418524, "epoch": 5042} {"train_loss": -26.668500900268555, "global_step": 418525, "epoch": 5042} {"train_loss": -27.097339630126953, "global_step": 418526, "epoch": 5042} {"train_loss": -26.98377799987793, "global_step": 418527, "epoch": 5042} {"train_loss": -26.760961532592773, "global_step": 418528, "epoch": 5042} {"train_loss": -26.955463409423828, "global_step": 418529, "epoch": 5042} {"train_loss": -26.732440948486328, "global_step": 418530, "epoch": 5042} {"train_loss": -26.60235023498535, "global_step": 418531, "epoch": 5042} {"train_loss": -26.7128963470459, "global_step": 418532, "epoch": 5042} {"train_loss": -26.812747955322266, "global_step": 418533, "epoch": 5042} {"train_loss": -26.478351593017578, "global_step": 418534, "epoch": 5042} {"train_loss": -27.027652740478516, "global_step": 418535, "epoch": 5042} {"train_loss": -26.683197021484375, "global_step": 418536, "epoch": 5042} {"train_loss": -26.703882217407227, "global_step": 418537, "epoch": 5042} {"train_loss": -27.10407829284668, "global_step": 418538, "epoch": 5042} {"train_loss": -26.880659103393555, "global_step": 418539, "epoch": 5042} {"train_loss": -26.89094352722168, "global_step": 418540, "epoch": 5042} {"train_loss": -26.846662521362305, "global_step": 418541, "epoch": 5042} {"train_loss": -26.557870864868164, "global_step": 418542, "epoch": 5042} {"train_loss": -26.507795333862305, "global_step": 418543, "epoch": 5042} {"train_loss": -26.805683135986328, "global_step": 418544, "epoch": 5042} {"train_loss": -26.654447555541992, "global_step": 418545, "epoch": 5042} {"train_loss": -26.9088191986084, "global_step": 418546, "epoch": 5042} {"train_loss": -26.715051651000977, "global_step": 418547, "epoch": 5042} {"train_loss": -26.690778732299805, "global_step": 418548, "epoch": 5042} {"train_loss": -26.938343048095703, "global_step": 418549, "epoch": 5042} {"train_loss": -26.367847442626953, "global_step": 418550, "epoch": 5042} {"train_loss": -26.840307235717773, "global_step": 418551, "epoch": 5042} {"train_loss": -26.561477661132812, "global_step": 418552, "epoch": 5042} {"train_loss": -26.755691528320312, "global_step": 418553, "epoch": 5042} {"train_loss": -27.0899658203125, "global_step": 418554, "epoch": 5042} {"train_loss": -26.613513946533203, "global_step": 418555, "epoch": 5042} {"train_loss": -26.468900680541992, "global_step": 418556, "epoch": 5042} {"train_loss": -26.898061752319336, "global_step": 418557, "epoch": 5042} {"train_loss": -26.590757369995117, "global_step": 418558, "epoch": 5042} {"train_loss": -26.93177604675293, "global_step": 418559, "epoch": 5042} {"train_loss": -26.680490493774414, "global_step": 418560, "epoch": 5042} {"train_loss": -26.61823844909668, "global_step": 418561, "epoch": 5042} {"train_loss": -27.037839889526367, "global_step": 418562, "epoch": 5042} {"train_loss": -26.722558975219727, "global_step": 418563, "epoch": 5042} {"train_loss": -26.851734161376953, "global_step": 418564, "epoch": 5042} {"train_loss": -26.5870304107666, "global_step": 418565, "epoch": 5042} {"train_loss": -26.4179630279541, "global_step": 418566, "epoch": 5042} {"train_loss": -26.573333740234375, "global_step": 418567, "epoch": 5042} {"train_loss": -26.697580406464727, "global_step": 418568, "epoch": 5042, "val_loss": 7034021.0} {"train_loss": -26.099288940429688, "global_step": 418569, "epoch": 5043} {"train_loss": -26.174680709838867, "global_step": 418570, "epoch": 5043} {"train_loss": -26.045568466186523, "global_step": 418571, "epoch": 5043} {"train_loss": -26.141637802124023, "global_step": 418572, "epoch": 5043} {"train_loss": -26.269306182861328, "global_step": 418573, "epoch": 5043} {"train_loss": -26.260507583618164, "global_step": 418574, "epoch": 5043} {"train_loss": -26.2608642578125, "global_step": 418575, "epoch": 5043} {"train_loss": -26.655637741088867, "global_step": 418576, "epoch": 5043} {"train_loss": -26.550201416015625, "global_step": 418577, "epoch": 5043} {"train_loss": -26.227508544921875, "global_step": 418578, "epoch": 5043} {"train_loss": -26.5876522064209, "global_step": 418579, "epoch": 5043} {"train_loss": -26.514387130737305, "global_step": 418580, "epoch": 5043} {"train_loss": -26.75970458984375, "global_step": 418581, "epoch": 5043} {"train_loss": -26.9085693359375, "global_step": 418582, "epoch": 5043} {"train_loss": -26.606952667236328, "global_step": 418583, "epoch": 5043} {"train_loss": -26.90419578552246, "global_step": 418584, "epoch": 5043} {"train_loss": -26.59712791442871, "global_step": 418585, "epoch": 5043} {"train_loss": -26.85392189025879, "global_step": 418586, "epoch": 5043} {"train_loss": -27.064411163330078, "global_step": 418587, "epoch": 5043} {"train_loss": -26.916296005249023, "global_step": 418588, "epoch": 5043} {"train_loss": -27.0166072845459, "global_step": 418589, "epoch": 5043} {"train_loss": -26.680017471313477, "global_step": 418590, "epoch": 5043} {"train_loss": -27.235858917236328, "global_step": 418591, "epoch": 5043} {"train_loss": -26.781356811523438, "global_step": 418592, "epoch": 5043} {"train_loss": -26.947900772094727, "global_step": 418593, "epoch": 5043} {"train_loss": -26.648420333862305, "global_step": 418594, "epoch": 5043} {"train_loss": -27.08378028869629, "global_step": 418595, "epoch": 5043} {"train_loss": -26.746896743774414, "global_step": 418596, "epoch": 5043} {"train_loss": -26.97224998474121, "global_step": 418597, "epoch": 5043} {"train_loss": -26.87244987487793, "global_step": 418598, "epoch": 5043} {"train_loss": -27.174224853515625, "global_step": 418599, "epoch": 5043} {"train_loss": -26.990076065063477, "global_step": 418600, "epoch": 5043} {"train_loss": -26.976612091064453, "global_step": 418601, "epoch": 5043} {"train_loss": -26.867456436157227, "global_step": 418602, "epoch": 5043} {"train_loss": -26.93124771118164, "global_step": 418603, "epoch": 5043} {"train_loss": -26.78358268737793, "global_step": 418604, "epoch": 5043} {"train_loss": -26.918930053710938, "global_step": 418605, "epoch": 5043} {"train_loss": -26.69400978088379, "global_step": 418606, "epoch": 5043} {"train_loss": -26.641117095947266, "global_step": 418607, "epoch": 5043} {"train_loss": -26.77594566345215, "global_step": 418608, "epoch": 5043} {"train_loss": -26.29817008972168, "global_step": 418609, "epoch": 5043} {"train_loss": -26.321741104125977, "global_step": 418610, "epoch": 5043} {"train_loss": -26.666318893432617, "global_step": 418611, "epoch": 5043} {"train_loss": -27.003156661987305, "global_step": 418612, "epoch": 5043} {"train_loss": -26.81818962097168, "global_step": 418613, "epoch": 5043} {"train_loss": -26.759912490844727, "global_step": 418614, "epoch": 5043} {"train_loss": -26.58101463317871, "global_step": 418615, "epoch": 5043} {"train_loss": -26.603208541870117, "global_step": 418616, "epoch": 5043} {"train_loss": -26.98980140686035, "global_step": 418617, "epoch": 5043} {"train_loss": -26.900863647460938, "global_step": 418618, "epoch": 5043} {"train_loss": -26.85137367248535, "global_step": 418619, "epoch": 5043} {"train_loss": -26.678741455078125, "global_step": 418620, "epoch": 5043} {"train_loss": -27.133121490478516, "global_step": 418621, "epoch": 5043} {"train_loss": -27.09307289123535, "global_step": 418622, "epoch": 5043} {"train_loss": -27.017560958862305, "global_step": 418623, "epoch": 5043} {"train_loss": -26.878244400024414, "global_step": 418624, "epoch": 5043} {"train_loss": -26.809431076049805, "global_step": 418625, "epoch": 5043} {"train_loss": -27.173202514648438, "global_step": 418626, "epoch": 5043} {"train_loss": -26.87421989440918, "global_step": 418627, "epoch": 5043} {"train_loss": -27.035429000854492, "global_step": 418628, "epoch": 5043} {"train_loss": -26.38214111328125, "global_step": 418629, "epoch": 5043} {"train_loss": -26.69049644470215, "global_step": 418630, "epoch": 5043} {"train_loss": -26.888769149780273, "global_step": 418631, "epoch": 5043} {"train_loss": -26.535690307617188, "global_step": 418632, "epoch": 5043} {"train_loss": -26.69300651550293, "global_step": 418633, "epoch": 5043} {"train_loss": -26.77189064025879, "global_step": 418634, "epoch": 5043} {"train_loss": -27.004013061523438, "global_step": 418635, "epoch": 5043} {"train_loss": -26.90228271484375, "global_step": 418636, "epoch": 5043} {"train_loss": -26.99252700805664, "global_step": 418637, "epoch": 5043} {"train_loss": -26.76788330078125, "global_step": 418638, "epoch": 5043} {"train_loss": -27.0635929107666, "global_step": 418639, "epoch": 5043} {"train_loss": -26.977529525756836, "global_step": 418640, "epoch": 5043} {"train_loss": -26.870819091796875, "global_step": 418641, "epoch": 5043} {"train_loss": -26.667266845703125, "global_step": 418642, "epoch": 5043} {"train_loss": -26.93350601196289, "global_step": 418643, "epoch": 5043} {"train_loss": -27.188465118408203, "global_step": 418644, "epoch": 5043} {"train_loss": -26.951139450073242, "global_step": 418645, "epoch": 5043} {"train_loss": -26.773120880126953, "global_step": 418646, "epoch": 5043} {"train_loss": -26.68377113342285, "global_step": 418647, "epoch": 5043} {"train_loss": -26.603076934814453, "global_step": 418648, "epoch": 5043} {"train_loss": -26.5399227142334, "global_step": 418649, "epoch": 5043} {"train_loss": -26.817174911499023, "global_step": 418650, "epoch": 5043} {"train_loss": -26.764406663825714, "global_step": 418651, "epoch": 5043, "val_loss": 7011185.0} {"train_loss": -26.3804931640625, "global_step": 418652, "epoch": 5044} {"train_loss": -25.902990341186523, "global_step": 418653, "epoch": 5044} {"train_loss": -25.722497940063477, "global_step": 418654, "epoch": 5044} {"train_loss": -25.939172744750977, "global_step": 418655, "epoch": 5044} {"train_loss": -26.22089195251465, "global_step": 418656, "epoch": 5044} {"train_loss": -25.539182662963867, "global_step": 418657, "epoch": 5044} {"train_loss": -26.49609375, "global_step": 418658, "epoch": 5044} {"train_loss": -25.928747177124023, "global_step": 418659, "epoch": 5044} {"train_loss": -26.599821090698242, "global_step": 418660, "epoch": 5044} {"train_loss": -26.00341796875, "global_step": 418661, "epoch": 5044} {"train_loss": -26.4841365814209, "global_step": 418662, "epoch": 5044} {"train_loss": -26.457468032836914, "global_step": 418663, "epoch": 5044} {"train_loss": -25.972736358642578, "global_step": 418664, "epoch": 5044} {"train_loss": -26.188369750976562, "global_step": 418665, "epoch": 5044} {"train_loss": -25.984832763671875, "global_step": 418666, "epoch": 5044} {"train_loss": -26.64404296875, "global_step": 418667, "epoch": 5044} {"train_loss": -26.2142391204834, "global_step": 418668, "epoch": 5044} {"train_loss": -26.55865478515625, "global_step": 418669, "epoch": 5044} {"train_loss": -26.3591251373291, "global_step": 418670, "epoch": 5044} {"train_loss": -26.330585479736328, "global_step": 418671, "epoch": 5044} {"train_loss": -26.508514404296875, "global_step": 418672, "epoch": 5044} {"train_loss": -26.138036727905273, "global_step": 418673, "epoch": 5044} {"train_loss": -26.592084884643555, "global_step": 418674, "epoch": 5044} {"train_loss": -26.248762130737305, "global_step": 418675, "epoch": 5044} {"train_loss": -26.842426300048828, "global_step": 418676, "epoch": 5044} {"train_loss": -26.431604385375977, "global_step": 418677, "epoch": 5044} {"train_loss": -26.524229049682617, "global_step": 418678, "epoch": 5044} {"train_loss": -26.34663200378418, "global_step": 418679, "epoch": 5044} {"train_loss": -26.435861587524414, "global_step": 418680, "epoch": 5044} {"train_loss": -26.43280601501465, "global_step": 418681, "epoch": 5044} {"train_loss": -26.321924209594727, "global_step": 418682, "epoch": 5044} {"train_loss": -26.60845947265625, "global_step": 418683, "epoch": 5044} {"train_loss": -26.3695011138916, "global_step": 418684, "epoch": 5044} {"train_loss": -27.10865592956543, "global_step": 418685, "epoch": 5044} {"train_loss": -26.28956413269043, "global_step": 418686, "epoch": 5044} {"train_loss": -26.5479793548584, "global_step": 418687, "epoch": 5044} {"train_loss": -26.88824462890625, "global_step": 418688, "epoch": 5044} {"train_loss": -26.749820709228516, "global_step": 418689, "epoch": 5044} {"train_loss": -26.768085479736328, "global_step": 418690, "epoch": 5044} {"train_loss": -26.96953773498535, "global_step": 418691, "epoch": 5044} {"train_loss": -27.07834815979004, "global_step": 418692, "epoch": 5044} {"train_loss": -26.48151206970215, "global_step": 418693, "epoch": 5044} {"train_loss": -26.546707153320312, "global_step": 418694, "epoch": 5044} {"train_loss": -26.50800132751465, "global_step": 418695, "epoch": 5044} {"train_loss": -26.447988510131836, "global_step": 418696, "epoch": 5044} {"train_loss": -27.043554306030273, "global_step": 418697, "epoch": 5044} {"train_loss": -26.286767959594727, "global_step": 418698, "epoch": 5044} {"train_loss": -26.279508590698242, "global_step": 418699, "epoch": 5044} {"train_loss": -26.975793838500977, "global_step": 418700, "epoch": 5044} {"train_loss": -27.00421714782715, "global_step": 418701, "epoch": 5044} {"train_loss": -26.79352378845215, "global_step": 418702, "epoch": 5044} {"train_loss": -26.795339584350586, "global_step": 418703, "epoch": 5044} {"train_loss": -27.151081085205078, "global_step": 418704, "epoch": 5044} {"train_loss": -26.690887451171875, "global_step": 418705, "epoch": 5044} {"train_loss": -26.49091148376465, "global_step": 418706, "epoch": 5044} {"train_loss": -26.458829879760742, "global_step": 418707, "epoch": 5044} {"train_loss": -26.468900680541992, "global_step": 418708, "epoch": 5044} {"train_loss": -26.660730361938477, "global_step": 418709, "epoch": 5044} {"train_loss": -26.391569137573242, "global_step": 418710, "epoch": 5044} {"train_loss": -26.4633731842041, "global_step": 418711, "epoch": 5044} {"train_loss": -27.148670196533203, "global_step": 418712, "epoch": 5044} {"train_loss": -26.681903839111328, "global_step": 418713, "epoch": 5044} {"train_loss": -26.74810791015625, "global_step": 418714, "epoch": 5044} {"train_loss": -26.523406982421875, "global_step": 418715, "epoch": 5044} {"train_loss": -27.225561141967773, "global_step": 418716, "epoch": 5044} {"train_loss": -26.870773315429688, "global_step": 418717, "epoch": 5044} {"train_loss": -26.921178817749023, "global_step": 418718, "epoch": 5044} {"train_loss": -26.80474853515625, "global_step": 418719, "epoch": 5044} {"train_loss": -26.791553497314453, "global_step": 418720, "epoch": 5044} {"train_loss": -26.924081802368164, "global_step": 418721, "epoch": 5044} {"train_loss": -27.044309616088867, "global_step": 418722, "epoch": 5044} {"train_loss": -27.291126251220703, "global_step": 418723, "epoch": 5044} {"train_loss": -27.1608829498291, "global_step": 418724, "epoch": 5044} {"train_loss": -27.132230758666992, "global_step": 418725, "epoch": 5044} {"train_loss": -26.732877731323242, "global_step": 418726, "epoch": 5044} {"train_loss": -27.132843017578125, "global_step": 418727, "epoch": 5044} {"train_loss": -26.849140167236328, "global_step": 418728, "epoch": 5044} {"train_loss": -27.35310173034668, "global_step": 418729, "epoch": 5044} {"train_loss": -26.570409774780273, "global_step": 418730, "epoch": 5044} {"train_loss": -27.281179428100586, "global_step": 418731, "epoch": 5044} {"train_loss": -26.913862228393555, "global_step": 418732, "epoch": 5044} {"train_loss": -26.871551513671875, "global_step": 418733, "epoch": 5044} {"train_loss": -26.60684466074748, "global_step": 418734, "epoch": 5044, "val_loss": 7105110.0} {"train_loss": -26.648712158203125, "global_step": 418735, "epoch": 5045} {"train_loss": -26.813634872436523, "global_step": 418736, "epoch": 5045} {"train_loss": -26.427587509155273, "global_step": 418737, "epoch": 5045} {"train_loss": -26.522180557250977, "global_step": 418738, "epoch": 5045} {"train_loss": -26.73541831970215, "global_step": 418739, "epoch": 5045} {"train_loss": -26.61310386657715, "global_step": 418740, "epoch": 5045} {"train_loss": -26.79523277282715, "global_step": 418741, "epoch": 5045} {"train_loss": -26.433032989501953, "global_step": 418742, "epoch": 5045} {"train_loss": -26.97861099243164, "global_step": 418743, "epoch": 5045} {"train_loss": -26.846485137939453, "global_step": 418744, "epoch": 5045} {"train_loss": -26.6534366607666, "global_step": 418745, "epoch": 5045} {"train_loss": -25.7473201751709, "global_step": 418746, "epoch": 5045} {"train_loss": -26.088306427001953, "global_step": 418747, "epoch": 5045} {"train_loss": -26.403722763061523, "global_step": 418748, "epoch": 5045} {"train_loss": -26.51318359375, "global_step": 418749, "epoch": 5045} {"train_loss": -26.4332275390625, "global_step": 418750, "epoch": 5045} {"train_loss": -26.6176700592041, "global_step": 418751, "epoch": 5045} {"train_loss": -26.46721839904785, "global_step": 418752, "epoch": 5045} {"train_loss": -26.615909576416016, "global_step": 418753, "epoch": 5045} {"train_loss": -26.906818389892578, "global_step": 418754, "epoch": 5045} {"train_loss": -26.756927490234375, "global_step": 418755, "epoch": 5045} {"train_loss": -26.3902530670166, "global_step": 418756, "epoch": 5045} {"train_loss": -26.48121452331543, "global_step": 418757, "epoch": 5045} {"train_loss": -27.118030548095703, "global_step": 418758, "epoch": 5045} {"train_loss": -26.542285919189453, "global_step": 418759, "epoch": 5045} {"train_loss": -26.753625869750977, "global_step": 418760, "epoch": 5045} {"train_loss": -26.86138916015625, "global_step": 418761, "epoch": 5045} {"train_loss": -26.67359733581543, "global_step": 418762, "epoch": 5045} {"train_loss": -26.8863525390625, "global_step": 418763, "epoch": 5045} {"train_loss": -26.746191024780273, "global_step": 418764, "epoch": 5045} {"train_loss": -26.972705841064453, "global_step": 418765, "epoch": 5045} {"train_loss": -26.97810173034668, "global_step": 418766, "epoch": 5045} {"train_loss": -26.381582260131836, "global_step": 418767, "epoch": 5045} {"train_loss": -26.697784423828125, "global_step": 418768, "epoch": 5045} {"train_loss": -26.84956932067871, "global_step": 418769, "epoch": 5045} {"train_loss": -26.594806671142578, "global_step": 418770, "epoch": 5045} {"train_loss": -26.7926025390625, "global_step": 418771, "epoch": 5045} {"train_loss": -26.9982967376709, "global_step": 418772, "epoch": 5045} {"train_loss": -27.097335815429688, "global_step": 418773, "epoch": 5045} {"train_loss": -26.35847282409668, "global_step": 418774, "epoch": 5045} {"train_loss": -26.7714786529541, "global_step": 418775, "epoch": 5045} {"train_loss": -26.761337280273438, "global_step": 418776, "epoch": 5045} {"train_loss": -26.9625301361084, "global_step": 418777, "epoch": 5045} {"train_loss": -27.096277236938477, "global_step": 418778, "epoch": 5045} {"train_loss": -26.643415451049805, "global_step": 418779, "epoch": 5045} {"train_loss": -26.900541305541992, "global_step": 418780, "epoch": 5045} {"train_loss": -26.58180046081543, "global_step": 418781, "epoch": 5045} {"train_loss": -26.91294288635254, "global_step": 418782, "epoch": 5045} {"train_loss": -26.520404815673828, "global_step": 418783, "epoch": 5045} {"train_loss": -26.97344398498535, "global_step": 418784, "epoch": 5045} {"train_loss": -27.03316307067871, "global_step": 418785, "epoch": 5045} {"train_loss": -26.9779109954834, "global_step": 418786, "epoch": 5045} {"train_loss": -26.7475643157959, "global_step": 418787, "epoch": 5045} {"train_loss": -26.81693458557129, "global_step": 418788, "epoch": 5045} {"train_loss": -26.796289443969727, "global_step": 418789, "epoch": 5045} {"train_loss": -26.771697998046875, "global_step": 418790, "epoch": 5045} {"train_loss": -26.595304489135742, "global_step": 418791, "epoch": 5045} {"train_loss": -26.658166885375977, "global_step": 418792, "epoch": 5045} {"train_loss": -26.969024658203125, "global_step": 418793, "epoch": 5045} {"train_loss": -26.905521392822266, "global_step": 418794, "epoch": 5045} {"train_loss": -27.064382553100586, "global_step": 418795, "epoch": 5045} {"train_loss": -26.71272087097168, "global_step": 418796, "epoch": 5045} {"train_loss": -26.547529220581055, "global_step": 418797, "epoch": 5045} {"train_loss": -26.8987979888916, "global_step": 418798, "epoch": 5045} {"train_loss": -26.605609893798828, "global_step": 418799, "epoch": 5045} {"train_loss": -26.87166404724121, "global_step": 418800, "epoch": 5045} {"train_loss": -26.814477920532227, "global_step": 418801, "epoch": 5045} {"train_loss": -26.794219970703125, "global_step": 418802, "epoch": 5045} {"train_loss": -26.62826919555664, "global_step": 418803, "epoch": 5045} {"train_loss": -26.777942657470703, "global_step": 418804, "epoch": 5045} {"train_loss": -26.789819717407227, "global_step": 418805, "epoch": 5045} {"train_loss": -26.740644454956055, "global_step": 418806, "epoch": 5045} {"train_loss": -26.52235221862793, "global_step": 418807, "epoch": 5045} {"train_loss": -26.841943740844727, "global_step": 418808, "epoch": 5045} {"train_loss": -26.61383056640625, "global_step": 418809, "epoch": 5045} {"train_loss": -26.89478874206543, "global_step": 418810, "epoch": 5045} {"train_loss": -26.108240127563477, "global_step": 418811, "epoch": 5045} {"train_loss": -26.769184112548828, "global_step": 418812, "epoch": 5045} {"train_loss": -26.360544204711914, "global_step": 418813, "epoch": 5045} {"train_loss": -27.380538940429688, "global_step": 418814, "epoch": 5045} {"train_loss": -26.884510040283203, "global_step": 418815, "epoch": 5045} {"train_loss": -27.008325576782227, "global_step": 418816, "epoch": 5045} {"train_loss": -26.70750114716679, "global_step": 418817, "epoch": 5045, "val_loss": 6994140.0} {"train_loss": -26.157705307006836, "global_step": 418818, "epoch": 5046} {"train_loss": -25.412391662597656, "global_step": 418819, "epoch": 5046} {"train_loss": -26.092050552368164, "global_step": 418820, "epoch": 5046} {"train_loss": -26.19166374206543, "global_step": 418821, "epoch": 5046} {"train_loss": -26.128204345703125, "global_step": 418822, "epoch": 5046} {"train_loss": -25.917455673217773, "global_step": 418823, "epoch": 5046} {"train_loss": -26.426679611206055, "global_step": 418824, "epoch": 5046} {"train_loss": -26.234094619750977, "global_step": 418825, "epoch": 5046} {"train_loss": -25.925893783569336, "global_step": 418826, "epoch": 5046} {"train_loss": -26.148025512695312, "global_step": 418827, "epoch": 5046} {"train_loss": -26.468704223632812, "global_step": 418828, "epoch": 5046} {"train_loss": -26.486906051635742, "global_step": 418829, "epoch": 5046} {"train_loss": -26.510589599609375, "global_step": 418830, "epoch": 5046} {"train_loss": -26.58307456970215, "global_step": 418831, "epoch": 5046} {"train_loss": -26.673099517822266, "global_step": 418832, "epoch": 5046} {"train_loss": -26.566858291625977, "global_step": 418833, "epoch": 5046} {"train_loss": -26.5504207611084, "global_step": 418834, "epoch": 5046} {"train_loss": -26.641000747680664, "global_step": 418835, "epoch": 5046} {"train_loss": -26.345996856689453, "global_step": 418836, "epoch": 5046} {"train_loss": -26.633514404296875, "global_step": 418837, "epoch": 5046} {"train_loss": -26.793212890625, "global_step": 418838, "epoch": 5046} {"train_loss": -26.835622787475586, "global_step": 418839, "epoch": 5046} {"train_loss": -26.568220138549805, "global_step": 418840, "epoch": 5046} {"train_loss": -26.753183364868164, "global_step": 418841, "epoch": 5046} {"train_loss": -26.881113052368164, "global_step": 418842, "epoch": 5046} {"train_loss": -26.607263565063477, "global_step": 418843, "epoch": 5046} {"train_loss": -26.896451950073242, "global_step": 418844, "epoch": 5046} {"train_loss": -26.66542625427246, "global_step": 418845, "epoch": 5046} {"train_loss": -26.57320213317871, "global_step": 418846, "epoch": 5046} {"train_loss": -26.735971450805664, "global_step": 418847, "epoch": 5046} {"train_loss": -26.70770835876465, "global_step": 418848, "epoch": 5046} {"train_loss": -26.212482452392578, "global_step": 418849, "epoch": 5046} {"train_loss": -26.605789184570312, "global_step": 418850, "epoch": 5046} {"train_loss": -27.322879791259766, "global_step": 418851, "epoch": 5046} {"train_loss": -27.10761833190918, "global_step": 418852, "epoch": 5046} {"train_loss": -26.842041015625, "global_step": 418853, "epoch": 5046} {"train_loss": -26.907215118408203, "global_step": 418854, "epoch": 5046} {"train_loss": -27.005481719970703, "global_step": 418855, "epoch": 5046} {"train_loss": -27.119298934936523, "global_step": 418856, "epoch": 5046} {"train_loss": -26.695587158203125, "global_step": 418857, "epoch": 5046} {"train_loss": -27.154687881469727, "global_step": 418858, "epoch": 5046} {"train_loss": -27.045270919799805, "global_step": 418859, "epoch": 5046} {"train_loss": -26.77066421508789, "global_step": 418860, "epoch": 5046} {"train_loss": -27.0079402923584, "global_step": 418861, "epoch": 5046} {"train_loss": -27.034955978393555, "global_step": 418862, "epoch": 5046} {"train_loss": -26.99212646484375, "global_step": 418863, "epoch": 5046} {"train_loss": -27.018095016479492, "global_step": 418864, "epoch": 5046} {"train_loss": -26.794055938720703, "global_step": 418865, "epoch": 5046} {"train_loss": -26.984540939331055, "global_step": 418866, "epoch": 5046} {"train_loss": -26.86321449279785, "global_step": 418867, "epoch": 5046} {"train_loss": -27.390426635742188, "global_step": 418868, "epoch": 5046} {"train_loss": -26.825607299804688, "global_step": 418869, "epoch": 5046} {"train_loss": -27.182416915893555, "global_step": 418870, "epoch": 5046} {"train_loss": -26.842533111572266, "global_step": 418871, "epoch": 5046} {"train_loss": -26.608596801757812, "global_step": 418872, "epoch": 5046} {"train_loss": -27.02899169921875, "global_step": 418873, "epoch": 5046} {"train_loss": -26.94696044921875, "global_step": 418874, "epoch": 5046} {"train_loss": -26.73431396484375, "global_step": 418875, "epoch": 5046} {"train_loss": -26.762296676635742, "global_step": 418876, "epoch": 5046} {"train_loss": -27.02858543395996, "global_step": 418877, "epoch": 5046} {"train_loss": -26.695215225219727, "global_step": 418878, "epoch": 5046} {"train_loss": -26.581968307495117, "global_step": 418879, "epoch": 5046} {"train_loss": -25.98308753967285, "global_step": 418880, "epoch": 5046} {"train_loss": -26.025442123413086, "global_step": 418881, "epoch": 5046} {"train_loss": -26.204227447509766, "global_step": 418882, "epoch": 5046} {"train_loss": -26.34221839904785, "global_step": 418883, "epoch": 5046} {"train_loss": -26.434833526611328, "global_step": 418884, "epoch": 5046} {"train_loss": -26.7052001953125, "global_step": 418885, "epoch": 5046} {"train_loss": -26.881540298461914, "global_step": 418886, "epoch": 5046} {"train_loss": -26.9604549407959, "global_step": 418887, "epoch": 5046} {"train_loss": -26.343353271484375, "global_step": 418888, "epoch": 5046} {"train_loss": -27.1110782623291, "global_step": 418889, "epoch": 5046} {"train_loss": -26.939931869506836, "global_step": 418890, "epoch": 5046} {"train_loss": -27.019113540649414, "global_step": 418891, "epoch": 5046} {"train_loss": -26.87851333618164, "global_step": 418892, "epoch": 5046} {"train_loss": -26.825458526611328, "global_step": 418893, "epoch": 5046} {"train_loss": -26.596349716186523, "global_step": 418894, "epoch": 5046} {"train_loss": -26.70294761657715, "global_step": 418895, "epoch": 5046} {"train_loss": -26.802473068237305, "global_step": 418896, "epoch": 5046} {"train_loss": -26.531238555908203, "global_step": 418897, "epoch": 5046} {"train_loss": -27.035200119018555, "global_step": 418898, "epoch": 5046} {"train_loss": -26.935937881469727, "global_step": 418899, "epoch": 5046} {"train_loss": -26.671034387795324, "global_step": 418900, "epoch": 5046, "val_loss": 7103870.0} {"train_loss": -26.35396385192871, "global_step": 418901, "epoch": 5047} {"train_loss": -26.752399444580078, "global_step": 418902, "epoch": 5047} {"train_loss": -26.368927001953125, "global_step": 418903, "epoch": 5047} {"train_loss": -26.66546630859375, "global_step": 418904, "epoch": 5047} {"train_loss": -26.275634765625, "global_step": 418905, "epoch": 5047} {"train_loss": -26.296680450439453, "global_step": 418906, "epoch": 5047} {"train_loss": -26.442779541015625, "global_step": 418907, "epoch": 5047} {"train_loss": -26.65424156188965, "global_step": 418908, "epoch": 5047} {"train_loss": -26.6730899810791, "global_step": 418909, "epoch": 5047} {"train_loss": -26.63031578063965, "global_step": 418910, "epoch": 5047} {"train_loss": -26.955291748046875, "global_step": 418911, "epoch": 5047} {"train_loss": -26.739185333251953, "global_step": 418912, "epoch": 5047} {"train_loss": -27.02320671081543, "global_step": 418913, "epoch": 5047} {"train_loss": -26.80647087097168, "global_step": 418914, "epoch": 5047} {"train_loss": -26.137903213500977, "global_step": 418915, "epoch": 5047} {"train_loss": -26.515884399414062, "global_step": 418916, "epoch": 5047} {"train_loss": -26.86172866821289, "global_step": 418917, "epoch": 5047} {"train_loss": -26.54574966430664, "global_step": 418918, "epoch": 5047} {"train_loss": -26.713520050048828, "global_step": 418919, "epoch": 5047} {"train_loss": -26.47360610961914, "global_step": 418920, "epoch": 5047} {"train_loss": -26.566104888916016, "global_step": 418921, "epoch": 5047} {"train_loss": -26.774274826049805, "global_step": 418922, "epoch": 5047} {"train_loss": -26.472471237182617, "global_step": 418923, "epoch": 5047} {"train_loss": -26.785932540893555, "global_step": 418924, "epoch": 5047} {"train_loss": -26.851001739501953, "global_step": 418925, "epoch": 5047} {"train_loss": -26.62825584411621, "global_step": 418926, "epoch": 5047} {"train_loss": -26.881628036499023, "global_step": 418927, "epoch": 5047} {"train_loss": -26.90351676940918, "global_step": 418928, "epoch": 5047} {"train_loss": -26.551589965820312, "global_step": 418929, "epoch": 5047} {"train_loss": -26.733081817626953, "global_step": 418930, "epoch": 5047} {"train_loss": -27.185745239257812, "global_step": 418931, "epoch": 5047} {"train_loss": -26.862592697143555, "global_step": 418932, "epoch": 5047} {"train_loss": -26.671682357788086, "global_step": 418933, "epoch": 5047} {"train_loss": -26.865787506103516, "global_step": 418934, "epoch": 5047} {"train_loss": -27.177539825439453, "global_step": 418935, "epoch": 5047} {"train_loss": -26.664478302001953, "global_step": 418936, "epoch": 5047} {"train_loss": -27.124073028564453, "global_step": 418937, "epoch": 5047} {"train_loss": -26.7940616607666, "global_step": 418938, "epoch": 5047} {"train_loss": -26.789854049682617, "global_step": 418939, "epoch": 5047} {"train_loss": -26.677759170532227, "global_step": 418940, "epoch": 5047} {"train_loss": -27.222768783569336, "global_step": 418941, "epoch": 5047} {"train_loss": -27.074066162109375, "global_step": 418942, "epoch": 5047} {"train_loss": -27.122507095336914, "global_step": 418943, "epoch": 5047} {"train_loss": -26.565534591674805, "global_step": 418944, "epoch": 5047} {"train_loss": -26.4033260345459, "global_step": 418945, "epoch": 5047} {"train_loss": -26.750446319580078, "global_step": 418946, "epoch": 5047} {"train_loss": -26.817138671875, "global_step": 418947, "epoch": 5047} {"train_loss": -26.810657501220703, "global_step": 418948, "epoch": 5047} {"train_loss": -26.729782104492188, "global_step": 418949, "epoch": 5047} {"train_loss": -26.8789005279541, "global_step": 418950, "epoch": 5047} {"train_loss": -26.945526123046875, "global_step": 418951, "epoch": 5047} {"train_loss": -26.911649703979492, "global_step": 418952, "epoch": 5047} {"train_loss": -26.669530868530273, "global_step": 418953, "epoch": 5047} {"train_loss": -26.800458908081055, "global_step": 418954, "epoch": 5047} {"train_loss": -26.656042098999023, "global_step": 418955, "epoch": 5047} {"train_loss": -26.70142936706543, "global_step": 418956, "epoch": 5047} {"train_loss": -26.518070220947266, "global_step": 418957, "epoch": 5047} {"train_loss": -26.4075927734375, "global_step": 418958, "epoch": 5047} {"train_loss": -26.325958251953125, "global_step": 418959, "epoch": 5047} {"train_loss": -26.854650497436523, "global_step": 418960, "epoch": 5047} {"train_loss": -26.999176025390625, "global_step": 418961, "epoch": 5047} {"train_loss": -26.466299057006836, "global_step": 418962, "epoch": 5047} {"train_loss": -26.6800594329834, "global_step": 418963, "epoch": 5047} {"train_loss": -26.721633911132812, "global_step": 418964, "epoch": 5047} {"train_loss": -26.476245880126953, "global_step": 418965, "epoch": 5047} {"train_loss": -26.132862091064453, "global_step": 418966, "epoch": 5047} {"train_loss": -26.530715942382812, "global_step": 418967, "epoch": 5047} {"train_loss": -25.993741989135742, "global_step": 418968, "epoch": 5047} {"train_loss": -26.6767578125, "global_step": 418969, "epoch": 5047} {"train_loss": -25.8700008392334, "global_step": 418970, "epoch": 5047} {"train_loss": -26.13726806640625, "global_step": 418971, "epoch": 5047} {"train_loss": -26.642852783203125, "global_step": 418972, "epoch": 5047} {"train_loss": -26.56854820251465, "global_step": 418973, "epoch": 5047} {"train_loss": -26.3453426361084, "global_step": 418974, "epoch": 5047} {"train_loss": -26.345783233642578, "global_step": 418975, "epoch": 5047} {"train_loss": -26.695520401000977, "global_step": 418976, "epoch": 5047} {"train_loss": -26.39283561706543, "global_step": 418977, "epoch": 5047} {"train_loss": -26.793378829956055, "global_step": 418978, "epoch": 5047} {"train_loss": -26.613718032836914, "global_step": 418979, "epoch": 5047} {"train_loss": -26.112842559814453, "global_step": 418980, "epoch": 5047} {"train_loss": -26.45476722717285, "global_step": 418981, "epoch": 5047} {"train_loss": -26.81839942932129, "global_step": 418982, "epoch": 5047} {"train_loss": -26.64322492300746, "global_step": 418983, "epoch": 5047, "val_loss": 7007497.0} {"train_loss": -26.23748207092285, "global_step": 418984, "epoch": 5048} {"train_loss": -25.81794548034668, "global_step": 418985, "epoch": 5048} {"train_loss": -26.327747344970703, "global_step": 418986, "epoch": 5048} {"train_loss": -25.999134063720703, "global_step": 418987, "epoch": 5048} {"train_loss": -26.279943466186523, "global_step": 418988, "epoch": 5048} {"train_loss": -26.94415283203125, "global_step": 418989, "epoch": 5048} {"train_loss": -26.527734756469727, "global_step": 418990, "epoch": 5048} {"train_loss": -26.28955078125, "global_step": 418991, "epoch": 5048} {"train_loss": -26.600006103515625, "global_step": 418992, "epoch": 5048} {"train_loss": -26.656070709228516, "global_step": 418993, "epoch": 5048} {"train_loss": -26.451868057250977, "global_step": 418994, "epoch": 5048} {"train_loss": -26.55698585510254, "global_step": 418995, "epoch": 5048} {"train_loss": -26.14630699157715, "global_step": 418996, "epoch": 5048} {"train_loss": -26.895727157592773, "global_step": 418997, "epoch": 5048} {"train_loss": -26.81491470336914, "global_step": 418998, "epoch": 5048} {"train_loss": -26.616077423095703, "global_step": 418999, "epoch": 5048} {"train_loss": -26.851673126220703, "global_step": 419000, "epoch": 5048} {"train_loss": -26.87042808532715, "global_step": 419001, "epoch": 5048} {"train_loss": -26.980396270751953, "global_step": 419002, "epoch": 5048} {"train_loss": -26.996810913085938, "global_step": 419003, "epoch": 5048} {"train_loss": -26.473785400390625, "global_step": 419004, "epoch": 5048} {"train_loss": -26.850366592407227, "global_step": 419005, "epoch": 5048} {"train_loss": -26.77181053161621, "global_step": 419006, "epoch": 5048} {"train_loss": -27.299646377563477, "global_step": 419007, "epoch": 5048} {"train_loss": -26.92365837097168, "global_step": 419008, "epoch": 5048} {"train_loss": -26.865619659423828, "global_step": 419009, "epoch": 5048} {"train_loss": -26.82305908203125, "global_step": 419010, "epoch": 5048} {"train_loss": -26.606613159179688, "global_step": 419011, "epoch": 5048} {"train_loss": -26.7332763671875, "global_step": 419012, "epoch": 5048} {"train_loss": -26.834522247314453, "global_step": 419013, "epoch": 5048} {"train_loss": -26.941877365112305, "global_step": 419014, "epoch": 5048} {"train_loss": -26.76401138305664, "global_step": 419015, "epoch": 5048} {"train_loss": -26.711034774780273, "global_step": 419016, "epoch": 5048} {"train_loss": -27.05670738220215, "global_step": 419017, "epoch": 5048} {"train_loss": -27.152494430541992, "global_step": 419018, "epoch": 5048} {"train_loss": -27.092451095581055, "global_step": 419019, "epoch": 5048} {"train_loss": -26.8160343170166, "global_step": 419020, "epoch": 5048} {"train_loss": -27.26316261291504, "global_step": 419021, "epoch": 5048} {"train_loss": -26.818967819213867, "global_step": 419022, "epoch": 5048} {"train_loss": -26.783315658569336, "global_step": 419023, "epoch": 5048} {"train_loss": -26.755298614501953, "global_step": 419024, "epoch": 5048} {"train_loss": -26.786514282226562, "global_step": 419025, "epoch": 5048} {"train_loss": -27.028247833251953, "global_step": 419026, "epoch": 5048} {"train_loss": -27.06574821472168, "global_step": 419027, "epoch": 5048} {"train_loss": -26.809112548828125, "global_step": 419028, "epoch": 5048} {"train_loss": -27.116437911987305, "global_step": 419029, "epoch": 5048} {"train_loss": -26.998193740844727, "global_step": 419030, "epoch": 5048} {"train_loss": -26.857208251953125, "global_step": 419031, "epoch": 5048} {"train_loss": -26.688817977905273, "global_step": 419032, "epoch": 5048} {"train_loss": -27.13433265686035, "global_step": 419033, "epoch": 5048} {"train_loss": -27.037445068359375, "global_step": 419034, "epoch": 5048} {"train_loss": -26.75320816040039, "global_step": 419035, "epoch": 5048} {"train_loss": -26.800098419189453, "global_step": 419036, "epoch": 5048} {"train_loss": -26.93451499938965, "global_step": 419037, "epoch": 5048} {"train_loss": -26.863134384155273, "global_step": 419038, "epoch": 5048} {"train_loss": -26.807403564453125, "global_step": 419039, "epoch": 5048} {"train_loss": -26.853612899780273, "global_step": 419040, "epoch": 5048} {"train_loss": -26.9785213470459, "global_step": 419041, "epoch": 5048} {"train_loss": -26.706317901611328, "global_step": 419042, "epoch": 5048} {"train_loss": -26.940820693969727, "global_step": 419043, "epoch": 5048} {"train_loss": -27.064863204956055, "global_step": 419044, "epoch": 5048} {"train_loss": -26.919721603393555, "global_step": 419045, "epoch": 5048} {"train_loss": -26.837051391601562, "global_step": 419046, "epoch": 5048} {"train_loss": -27.00685691833496, "global_step": 419047, "epoch": 5048} {"train_loss": -27.0494441986084, "global_step": 419048, "epoch": 5048} {"train_loss": -26.782495498657227, "global_step": 419049, "epoch": 5048} {"train_loss": -27.133874893188477, "global_step": 419050, "epoch": 5048} {"train_loss": -26.854475021362305, "global_step": 419051, "epoch": 5048} {"train_loss": -27.0791072845459, "global_step": 419052, "epoch": 5048} {"train_loss": -26.76946449279785, "global_step": 419053, "epoch": 5048} {"train_loss": -26.691360473632812, "global_step": 419054, "epoch": 5048} {"train_loss": -27.2369327545166, "global_step": 419055, "epoch": 5048} {"train_loss": -26.99472999572754, "global_step": 419056, "epoch": 5048} {"train_loss": -27.1840763092041, "global_step": 419057, "epoch": 5048} {"train_loss": -26.7785587310791, "global_step": 419058, "epoch": 5048} {"train_loss": -26.861799240112305, "global_step": 419059, "epoch": 5048} {"train_loss": -26.298070907592773, "global_step": 419060, "epoch": 5048} {"train_loss": -26.5887508392334, "global_step": 419061, "epoch": 5048} {"train_loss": -26.558765411376953, "global_step": 419062, "epoch": 5048} {"train_loss": -26.6770076751709, "global_step": 419063, "epoch": 5048} {"train_loss": -27.046512603759766, "global_step": 419064, "epoch": 5048} {"train_loss": -26.82757568359375, "global_step": 419065, "epoch": 5048} {"train_loss": -26.79702983994082, "global_step": 419066, "epoch": 5048, "val_loss": 7118860.0} {"train_loss": -25.855331420898438, "global_step": 419067, "epoch": 5049} {"train_loss": -25.7523136138916, "global_step": 419068, "epoch": 5049} {"train_loss": -25.821380615234375, "global_step": 419069, "epoch": 5049} {"train_loss": -25.859460830688477, "global_step": 419070, "epoch": 5049} {"train_loss": -26.71965980529785, "global_step": 419071, "epoch": 5049} {"train_loss": -26.017532348632812, "global_step": 419072, "epoch": 5049} {"train_loss": -26.748382568359375, "global_step": 419073, "epoch": 5049} {"train_loss": -25.8248348236084, "global_step": 419074, "epoch": 5049} {"train_loss": -26.226999282836914, "global_step": 419075, "epoch": 5049} {"train_loss": -26.0069580078125, "global_step": 419076, "epoch": 5049} {"train_loss": -26.579111099243164, "global_step": 419077, "epoch": 5049} {"train_loss": -26.342578887939453, "global_step": 419078, "epoch": 5049} {"train_loss": -25.7043399810791, "global_step": 419079, "epoch": 5049} {"train_loss": -26.218292236328125, "global_step": 419080, "epoch": 5049} {"train_loss": -26.105512619018555, "global_step": 419081, "epoch": 5049} {"train_loss": -26.150583267211914, "global_step": 419082, "epoch": 5049} {"train_loss": -26.291349411010742, "global_step": 419083, "epoch": 5049} {"train_loss": -26.604040145874023, "global_step": 419084, "epoch": 5049} {"train_loss": -26.777820587158203, "global_step": 419085, "epoch": 5049} {"train_loss": -26.391286849975586, "global_step": 419086, "epoch": 5049} {"train_loss": -26.24458122253418, "global_step": 419087, "epoch": 5049} {"train_loss": -26.605030059814453, "global_step": 419088, "epoch": 5049} {"train_loss": -26.57978630065918, "global_step": 419089, "epoch": 5049} {"train_loss": -26.548267364501953, "global_step": 419090, "epoch": 5049} {"train_loss": -26.198150634765625, "global_step": 419091, "epoch": 5049} {"train_loss": -26.60810661315918, "global_step": 419092, "epoch": 5049} {"train_loss": -26.79755210876465, "global_step": 419093, "epoch": 5049} {"train_loss": -26.423559188842773, "global_step": 419094, "epoch": 5049} {"train_loss": -26.597076416015625, "global_step": 419095, "epoch": 5049} {"train_loss": -26.241559982299805, "global_step": 419096, "epoch": 5049} {"train_loss": -26.93265151977539, "global_step": 419097, "epoch": 5049} {"train_loss": -26.576818466186523, "global_step": 419098, "epoch": 5049} {"train_loss": -26.896223068237305, "global_step": 419099, "epoch": 5049} {"train_loss": -26.842233657836914, "global_step": 419100, "epoch": 5049} {"train_loss": -26.651227951049805, "global_step": 419101, "epoch": 5049} {"train_loss": -26.92879295349121, "global_step": 419102, "epoch": 5049} {"train_loss": -26.56378173828125, "global_step": 419103, "epoch": 5049} {"train_loss": -26.601272583007812, "global_step": 419104, "epoch": 5049} {"train_loss": -26.672712326049805, "global_step": 419105, "epoch": 5049} {"train_loss": -27.156574249267578, "global_step": 419106, "epoch": 5049} {"train_loss": -26.84663963317871, "global_step": 419107, "epoch": 5049} {"train_loss": -26.73079490661621, "global_step": 419108, "epoch": 5049} {"train_loss": -26.947071075439453, "global_step": 419109, "epoch": 5049} {"train_loss": -26.707380294799805, "global_step": 419110, "epoch": 5049} {"train_loss": -26.84800148010254, "global_step": 419111, "epoch": 5049} {"train_loss": -26.568317413330078, "global_step": 419112, "epoch": 5049} {"train_loss": -27.343597412109375, "global_step": 419113, "epoch": 5049} {"train_loss": -26.487537384033203, "global_step": 419114, "epoch": 5049} {"train_loss": -27.13055992126465, "global_step": 419115, "epoch": 5049} {"train_loss": -26.745397567749023, "global_step": 419116, "epoch": 5049} {"train_loss": -26.214094161987305, "global_step": 419117, "epoch": 5049} {"train_loss": -26.50153160095215, "global_step": 419118, "epoch": 5049} {"train_loss": -26.341222763061523, "global_step": 419119, "epoch": 5049} {"train_loss": -26.954044342041016, "global_step": 419120, "epoch": 5049} {"train_loss": -27.022785186767578, "global_step": 419121, "epoch": 5049} {"train_loss": -26.424442291259766, "global_step": 419122, "epoch": 5049} {"train_loss": -26.844274520874023, "global_step": 419123, "epoch": 5049} {"train_loss": -27.005523681640625, "global_step": 419124, "epoch": 5049} {"train_loss": -26.472192764282227, "global_step": 419125, "epoch": 5049} {"train_loss": -26.409698486328125, "global_step": 419126, "epoch": 5049} {"train_loss": -26.958953857421875, "global_step": 419127, "epoch": 5049} {"train_loss": -26.86411476135254, "global_step": 419128, "epoch": 5049} {"train_loss": -26.948057174682617, "global_step": 419129, "epoch": 5049} {"train_loss": -26.6757755279541, "global_step": 419130, "epoch": 5049} {"train_loss": -26.99598503112793, "global_step": 419131, "epoch": 5049} {"train_loss": -26.61992835998535, "global_step": 419132, "epoch": 5049} {"train_loss": -26.874237060546875, "global_step": 419133, "epoch": 5049} {"train_loss": -26.807775497436523, "global_step": 419134, "epoch": 5049} {"train_loss": -26.804168701171875, "global_step": 419135, "epoch": 5049} {"train_loss": -27.05864906311035, "global_step": 419136, "epoch": 5049} {"train_loss": -26.59340476989746, "global_step": 419137, "epoch": 5049} {"train_loss": -26.42621421813965, "global_step": 419138, "epoch": 5049} {"train_loss": -26.357208251953125, "global_step": 419139, "epoch": 5049} {"train_loss": -26.45269203186035, "global_step": 419140, "epoch": 5049} {"train_loss": -26.564441680908203, "global_step": 419141, "epoch": 5049} {"train_loss": -26.87190055847168, "global_step": 419142, "epoch": 5049} {"train_loss": -26.47633171081543, "global_step": 419143, "epoch": 5049} {"train_loss": -27.190149307250977, "global_step": 419144, "epoch": 5049} {"train_loss": -26.8409423828125, "global_step": 419145, "epoch": 5049} {"train_loss": -26.439136505126953, "global_step": 419146, "epoch": 5049} {"train_loss": -26.592243194580078, "global_step": 419147, "epoch": 5049} {"train_loss": -26.97956657409668, "global_step": 419148, "epoch": 5049} {"train_loss": -26.5819109031953, "global_step": 419149, "epoch": 5049, "val_loss": 7056913.0} {"train_loss": -26.39571189880371, "global_step": 419150, "epoch": 5050} {"train_loss": -26.250234603881836, "global_step": 419151, "epoch": 5050} {"train_loss": -26.674875259399414, "global_step": 419152, "epoch": 5050} {"train_loss": -25.913299560546875, "global_step": 419153, "epoch": 5050} {"train_loss": -26.071874618530273, "global_step": 419154, "epoch": 5050} {"train_loss": -25.720489501953125, "global_step": 419155, "epoch": 5050} {"train_loss": -25.65006446838379, "global_step": 419156, "epoch": 5050} {"train_loss": -26.1401424407959, "global_step": 419157, "epoch": 5050} {"train_loss": -26.034809112548828, "global_step": 419158, "epoch": 5050} {"train_loss": -26.44050407409668, "global_step": 419159, "epoch": 5050} {"train_loss": -25.98980712890625, "global_step": 419160, "epoch": 5050} {"train_loss": -26.389684677124023, "global_step": 419161, "epoch": 5050} {"train_loss": -26.35480308532715, "global_step": 419162, "epoch": 5050} {"train_loss": -25.86846923828125, "global_step": 419163, "epoch": 5050} {"train_loss": -26.451841354370117, "global_step": 419164, "epoch": 5050} {"train_loss": -26.42243003845215, "global_step": 419165, "epoch": 5050} {"train_loss": -26.494619369506836, "global_step": 419166, "epoch": 5050} {"train_loss": -26.255929946899414, "global_step": 419167, "epoch": 5050} {"train_loss": -26.65691566467285, "global_step": 419168, "epoch": 5050} {"train_loss": -26.703781127929688, "global_step": 419169, "epoch": 5050} {"train_loss": -26.4792537689209, "global_step": 419170, "epoch": 5050} {"train_loss": -26.515012741088867, "global_step": 419171, "epoch": 5050} {"train_loss": -26.381824493408203, "global_step": 419172, "epoch": 5050} {"train_loss": -26.38593864440918, "global_step": 419173, "epoch": 5050} {"train_loss": -26.477293014526367, "global_step": 419174, "epoch": 5050} {"train_loss": -26.471372604370117, "global_step": 419175, "epoch": 5050} {"train_loss": -26.69002342224121, "global_step": 419176, "epoch": 5050} {"train_loss": -26.5795955657959, "global_step": 419177, "epoch": 5050} {"train_loss": -26.57038688659668, "global_step": 419178, "epoch": 5050} {"train_loss": -26.70697593688965, "global_step": 419179, "epoch": 5050} {"train_loss": -27.05335807800293, "global_step": 419180, "epoch": 5050} {"train_loss": -26.3324031829834, "global_step": 419181, "epoch": 5050} {"train_loss": -26.808156967163086, "global_step": 419182, "epoch": 5050} {"train_loss": -26.599002838134766, "global_step": 419183, "epoch": 5050} {"train_loss": -26.983373641967773, "global_step": 419184, "epoch": 5050} {"train_loss": -26.85308837890625, "global_step": 419185, "epoch": 5050} {"train_loss": -26.8590030670166, "global_step": 419186, "epoch": 5050} {"train_loss": -26.840024948120117, "global_step": 419187, "epoch": 5050} {"train_loss": -26.53346824645996, "global_step": 419188, "epoch": 5050} {"train_loss": -26.50201988220215, "global_step": 419189, "epoch": 5050} {"train_loss": -26.808135986328125, "global_step": 419190, "epoch": 5050} {"train_loss": -26.852619171142578, "global_step": 419191, "epoch": 5050} {"train_loss": -27.2972412109375, "global_step": 419192, "epoch": 5050} {"train_loss": -26.59613037109375, "global_step": 419193, "epoch": 5050} {"train_loss": -26.87565040588379, "global_step": 419194, "epoch": 5050} {"train_loss": -27.165149688720703, "global_step": 419195, "epoch": 5050} {"train_loss": -26.612707138061523, "global_step": 419196, "epoch": 5050} {"train_loss": -26.740942001342773, "global_step": 419197, "epoch": 5050} {"train_loss": -26.71314811706543, "global_step": 419198, "epoch": 5050} {"train_loss": -27.077533721923828, "global_step": 419199, "epoch": 5050} {"train_loss": -26.811315536499023, "global_step": 419200, "epoch": 5050} {"train_loss": -26.714948654174805, "global_step": 419201, "epoch": 5050} {"train_loss": -26.803293228149414, "global_step": 419202, "epoch": 5050} {"train_loss": -26.938596725463867, "global_step": 419203, "epoch": 5050} {"train_loss": -27.15522575378418, "global_step": 419204, "epoch": 5050} {"train_loss": -26.848188400268555, "global_step": 419205, "epoch": 5050} {"train_loss": -26.661046981811523, "global_step": 419206, "epoch": 5050} {"train_loss": -26.818408966064453, "global_step": 419207, "epoch": 5050} {"train_loss": -26.663654327392578, "global_step": 419208, "epoch": 5050} {"train_loss": -26.55561637878418, "global_step": 419209, "epoch": 5050} {"train_loss": -26.22787857055664, "global_step": 419210, "epoch": 5050} {"train_loss": -26.2891845703125, "global_step": 419211, "epoch": 5050} {"train_loss": -26.716028213500977, "global_step": 419212, "epoch": 5050} {"train_loss": -27.403940200805664, "global_step": 419213, "epoch": 5050} {"train_loss": -27.243330001831055, "global_step": 419214, "epoch": 5050} {"train_loss": -27.00044059753418, "global_step": 419215, "epoch": 5050} {"train_loss": -26.687952041625977, "global_step": 419216, "epoch": 5050} {"train_loss": -26.892541885375977, "global_step": 419217, "epoch": 5050} {"train_loss": -26.523334503173828, "global_step": 419218, "epoch": 5050} {"train_loss": -27.07093620300293, "global_step": 419219, "epoch": 5050} {"train_loss": -27.106969833374023, "global_step": 419220, "epoch": 5050} {"train_loss": -26.968664169311523, "global_step": 419221, "epoch": 5050} {"train_loss": -26.9966983795166, "global_step": 419222, "epoch": 5050} {"train_loss": -27.0081729888916, "global_step": 419223, "epoch": 5050} {"train_loss": -27.229190826416016, "global_step": 419224, "epoch": 5050} {"train_loss": -27.053937911987305, "global_step": 419225, "epoch": 5050} {"train_loss": -26.964139938354492, "global_step": 419226, "epoch": 5050} {"train_loss": -27.28781509399414, "global_step": 419227, "epoch": 5050} {"train_loss": -27.120563507080078, "global_step": 419228, "epoch": 5050} {"train_loss": -26.74591636657715, "global_step": 419229, "epoch": 5050} {"train_loss": -26.86029624938965, "global_step": 419230, "epoch": 5050} {"train_loss": -26.82392692565918, "global_step": 419231, "epoch": 5050} {"train_loss": -26.662690495870198, "global_step": 419232, "epoch": 5050, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8181818181818182, "val_loss": 7069286.0} {"train_loss": -26.674047470092773, "global_step": 419233, "epoch": 5051} {"train_loss": -26.189367294311523, "global_step": 419234, "epoch": 5051} {"train_loss": -26.410459518432617, "global_step": 419235, "epoch": 5051} {"train_loss": -26.85540199279785, "global_step": 419236, "epoch": 5051} {"train_loss": -26.15058708190918, "global_step": 419237, "epoch": 5051} {"train_loss": -25.549148559570312, "global_step": 419238, "epoch": 5051} {"train_loss": -25.04450798034668, "global_step": 419239, "epoch": 5051} {"train_loss": -24.473432540893555, "global_step": 419240, "epoch": 5051} {"train_loss": -25.401824951171875, "global_step": 419241, "epoch": 5051} {"train_loss": -26.17279624938965, "global_step": 419242, "epoch": 5051} {"train_loss": -26.115142822265625, "global_step": 419243, "epoch": 5051} {"train_loss": -26.15706443786621, "global_step": 419244, "epoch": 5051} {"train_loss": -26.26873207092285, "global_step": 419245, "epoch": 5051} {"train_loss": -26.475631713867188, "global_step": 419246, "epoch": 5051} {"train_loss": -26.691547393798828, "global_step": 419247, "epoch": 5051} {"train_loss": -26.415884017944336, "global_step": 419248, "epoch": 5051} {"train_loss": -26.297245025634766, "global_step": 419249, "epoch": 5051} {"train_loss": -26.2390079498291, "global_step": 419250, "epoch": 5051} {"train_loss": -26.66937255859375, "global_step": 419251, "epoch": 5051} {"train_loss": -26.745603561401367, "global_step": 419252, "epoch": 5051} {"train_loss": -26.271589279174805, "global_step": 419253, "epoch": 5051} {"train_loss": -26.64716911315918, "global_step": 419254, "epoch": 5051} {"train_loss": -26.33835792541504, "global_step": 419255, "epoch": 5051} {"train_loss": -26.592069625854492, "global_step": 419256, "epoch": 5051} {"train_loss": -26.62232780456543, "global_step": 419257, "epoch": 5051} {"train_loss": -26.63592529296875, "global_step": 419258, "epoch": 5051} {"train_loss": -26.4315128326416, "global_step": 419259, "epoch": 5051} {"train_loss": -26.592300415039062, "global_step": 419260, "epoch": 5051} {"train_loss": -26.574838638305664, "global_step": 419261, "epoch": 5051} {"train_loss": -26.382415771484375, "global_step": 419262, "epoch": 5051} {"train_loss": -26.972333908081055, "global_step": 419263, "epoch": 5051} {"train_loss": -26.76228141784668, "global_step": 419264, "epoch": 5051} {"train_loss": -26.65546226501465, "global_step": 419265, "epoch": 5051} {"train_loss": -26.63278579711914, "global_step": 419266, "epoch": 5051} {"train_loss": -26.55670738220215, "global_step": 419267, "epoch": 5051} {"train_loss": -26.738306045532227, "global_step": 419268, "epoch": 5051} {"train_loss": -26.724929809570312, "global_step": 419269, "epoch": 5051} {"train_loss": -26.700963973999023, "global_step": 419270, "epoch": 5051} {"train_loss": -26.789325714111328, "global_step": 419271, "epoch": 5051} {"train_loss": -26.738937377929688, "global_step": 419272, "epoch": 5051} {"train_loss": -26.86203384399414, "global_step": 419273, "epoch": 5051} {"train_loss": -26.524648666381836, "global_step": 419274, "epoch": 5051} {"train_loss": -26.894428253173828, "global_step": 419275, "epoch": 5051} {"train_loss": -26.8656005859375, "global_step": 419276, "epoch": 5051} {"train_loss": -26.398534774780273, "global_step": 419277, "epoch": 5051} {"train_loss": -26.798450469970703, "global_step": 419278, "epoch": 5051} {"train_loss": -27.108667373657227, "global_step": 419279, "epoch": 5051} {"train_loss": -27.112638473510742, "global_step": 419280, "epoch": 5051} {"train_loss": -27.073749542236328, "global_step": 419281, "epoch": 5051} {"train_loss": -26.850116729736328, "global_step": 419282, "epoch": 5051} {"train_loss": -26.970998764038086, "global_step": 419283, "epoch": 5051} {"train_loss": -26.839080810546875, "global_step": 419284, "epoch": 5051} {"train_loss": -26.887632369995117, "global_step": 419285, "epoch": 5051} {"train_loss": -27.056915283203125, "global_step": 419286, "epoch": 5051} {"train_loss": -27.005603790283203, "global_step": 419287, "epoch": 5051} {"train_loss": -26.62310791015625, "global_step": 419288, "epoch": 5051} {"train_loss": -26.85426139831543, "global_step": 419289, "epoch": 5051} {"train_loss": -27.0690975189209, "global_step": 419290, "epoch": 5051} {"train_loss": -26.77535057067871, "global_step": 419291, "epoch": 5051} {"train_loss": -27.248178482055664, "global_step": 419292, "epoch": 5051} {"train_loss": -26.878620147705078, "global_step": 419293, "epoch": 5051} {"train_loss": -26.767669677734375, "global_step": 419294, "epoch": 5051} {"train_loss": -27.105924606323242, "global_step": 419295, "epoch": 5051} {"train_loss": -27.119787216186523, "global_step": 419296, "epoch": 5051} {"train_loss": -26.957712173461914, "global_step": 419297, "epoch": 5051} {"train_loss": -27.024133682250977, "global_step": 419298, "epoch": 5051} {"train_loss": -26.6795597076416, "global_step": 419299, "epoch": 5051} {"train_loss": -26.872053146362305, "global_step": 419300, "epoch": 5051} {"train_loss": -27.082677841186523, "global_step": 419301, "epoch": 5051} {"train_loss": -27.04736328125, "global_step": 419302, "epoch": 5051} {"train_loss": -26.844837188720703, "global_step": 419303, "epoch": 5051} {"train_loss": -26.588232040405273, "global_step": 419304, "epoch": 5051} {"train_loss": -26.865793228149414, "global_step": 419305, "epoch": 5051} {"train_loss": -26.818603515625, "global_step": 419306, "epoch": 5051} {"train_loss": -26.747289657592773, "global_step": 419307, "epoch": 5051} {"train_loss": -27.006418228149414, "global_step": 419308, "epoch": 5051} {"train_loss": -26.864471435546875, "global_step": 419309, "epoch": 5051} {"train_loss": -26.7148380279541, "global_step": 419310, "epoch": 5051} {"train_loss": -26.559375762939453, "global_step": 419311, "epoch": 5051} {"train_loss": -26.1251163482666, "global_step": 419312, "epoch": 5051} {"train_loss": -25.986875534057617, "global_step": 419313, "epoch": 5051} {"train_loss": -25.882287979125977, "global_step": 419314, "epoch": 5051} {"train_loss": -26.61053930994976, "global_step": 419315, "epoch": 5051, "val_loss": 7117342.0} {"train_loss": -24.810306549072266, "global_step": 419316, "epoch": 5052} {"train_loss": -25.52853012084961, "global_step": 419317, "epoch": 5052} {"train_loss": -26.4383602142334, "global_step": 419318, "epoch": 5052} {"train_loss": -25.7276611328125, "global_step": 419319, "epoch": 5052} {"train_loss": -25.961515426635742, "global_step": 419320, "epoch": 5052} {"train_loss": -26.003889083862305, "global_step": 419321, "epoch": 5052} {"train_loss": -25.854312896728516, "global_step": 419322, "epoch": 5052} {"train_loss": -26.341766357421875, "global_step": 419323, "epoch": 5052} {"train_loss": -26.200605392456055, "global_step": 419324, "epoch": 5052} {"train_loss": -26.379968643188477, "global_step": 419325, "epoch": 5052} {"train_loss": -26.310001373291016, "global_step": 419326, "epoch": 5052} {"train_loss": -26.350605010986328, "global_step": 419327, "epoch": 5052} {"train_loss": -26.452838897705078, "global_step": 419328, "epoch": 5052} {"train_loss": -26.6376895904541, "global_step": 419329, "epoch": 5052} {"train_loss": -26.03946876525879, "global_step": 419330, "epoch": 5052} {"train_loss": -26.256086349487305, "global_step": 419331, "epoch": 5052} {"train_loss": -26.661115646362305, "global_step": 419332, "epoch": 5052} {"train_loss": -26.408721923828125, "global_step": 419333, "epoch": 5052} {"train_loss": -26.510974884033203, "global_step": 419334, "epoch": 5052} {"train_loss": -26.567041397094727, "global_step": 419335, "epoch": 5052} {"train_loss": -26.802841186523438, "global_step": 419336, "epoch": 5052} {"train_loss": -26.571949005126953, "global_step": 419337, "epoch": 5052} {"train_loss": -26.50373649597168, "global_step": 419338, "epoch": 5052} {"train_loss": -26.286035537719727, "global_step": 419339, "epoch": 5052} {"train_loss": -26.598417282104492, "global_step": 419340, "epoch": 5052} {"train_loss": -26.62923240661621, "global_step": 419341, "epoch": 5052} {"train_loss": -26.622777938842773, "global_step": 419342, "epoch": 5052} {"train_loss": -27.045703887939453, "global_step": 419343, "epoch": 5052} {"train_loss": -26.907657623291016, "global_step": 419344, "epoch": 5052} {"train_loss": -26.670623779296875, "global_step": 419345, "epoch": 5052} {"train_loss": -26.848554611206055, "global_step": 419346, "epoch": 5052} {"train_loss": -26.60931968688965, "global_step": 419347, "epoch": 5052} {"train_loss": -26.44841957092285, "global_step": 419348, "epoch": 5052} {"train_loss": -26.494604110717773, "global_step": 419349, "epoch": 5052} {"train_loss": -26.79524803161621, "global_step": 419350, "epoch": 5052} {"train_loss": -26.475818634033203, "global_step": 419351, "epoch": 5052} {"train_loss": -26.952880859375, "global_step": 419352, "epoch": 5052} {"train_loss": -26.828847885131836, "global_step": 419353, "epoch": 5052} {"train_loss": -26.297903060913086, "global_step": 419354, "epoch": 5052} {"train_loss": -26.951095581054688, "global_step": 419355, "epoch": 5052} {"train_loss": -26.722471237182617, "global_step": 419356, "epoch": 5052} {"train_loss": -27.280675888061523, "global_step": 419357, "epoch": 5052} {"train_loss": -26.75264549255371, "global_step": 419358, "epoch": 5052} {"train_loss": -26.447351455688477, "global_step": 419359, "epoch": 5052} {"train_loss": -26.65509605407715, "global_step": 419360, "epoch": 5052} {"train_loss": -26.926122665405273, "global_step": 419361, "epoch": 5052} {"train_loss": -27.02882194519043, "global_step": 419362, "epoch": 5052} {"train_loss": -27.022489547729492, "global_step": 419363, "epoch": 5052} {"train_loss": -26.916828155517578, "global_step": 419364, "epoch": 5052} {"train_loss": -26.57615089416504, "global_step": 419365, "epoch": 5052} {"train_loss": -26.814538955688477, "global_step": 419366, "epoch": 5052} {"train_loss": -26.4499454498291, "global_step": 419367, "epoch": 5052} {"train_loss": -26.67243766784668, "global_step": 419368, "epoch": 5052} {"train_loss": -26.61982536315918, "global_step": 419369, "epoch": 5052} {"train_loss": -26.824499130249023, "global_step": 419370, "epoch": 5052} {"train_loss": -27.149993896484375, "global_step": 419371, "epoch": 5052} {"train_loss": -26.836444854736328, "global_step": 419372, "epoch": 5052} {"train_loss": -26.982458114624023, "global_step": 419373, "epoch": 5052} {"train_loss": -26.625410079956055, "global_step": 419374, "epoch": 5052} {"train_loss": -26.500951766967773, "global_step": 419375, "epoch": 5052} {"train_loss": -26.8447208404541, "global_step": 419376, "epoch": 5052} {"train_loss": -26.811044692993164, "global_step": 419377, "epoch": 5052} {"train_loss": -26.7686767578125, "global_step": 419378, "epoch": 5052} {"train_loss": -26.557348251342773, "global_step": 419379, "epoch": 5052} {"train_loss": -26.5667781829834, "global_step": 419380, "epoch": 5052} {"train_loss": -26.18575096130371, "global_step": 419381, "epoch": 5052} {"train_loss": -26.360944747924805, "global_step": 419382, "epoch": 5052} {"train_loss": -26.444791793823242, "global_step": 419383, "epoch": 5052} {"train_loss": -27.102176666259766, "global_step": 419384, "epoch": 5052} {"train_loss": -26.59296989440918, "global_step": 419385, "epoch": 5052} {"train_loss": -26.599029541015625, "global_step": 419386, "epoch": 5052} {"train_loss": -26.669010162353516, "global_step": 419387, "epoch": 5052} {"train_loss": -26.81406593322754, "global_step": 419388, "epoch": 5052} {"train_loss": -26.71058464050293, "global_step": 419389, "epoch": 5052} {"train_loss": -26.4674015045166, "global_step": 419390, "epoch": 5052} {"train_loss": -26.9810733795166, "global_step": 419391, "epoch": 5052} {"train_loss": -26.857603073120117, "global_step": 419392, "epoch": 5052} {"train_loss": -26.584415435791016, "global_step": 419393, "epoch": 5052} {"train_loss": -26.664464950561523, "global_step": 419394, "epoch": 5052} {"train_loss": -26.55215835571289, "global_step": 419395, "epoch": 5052} {"train_loss": -26.51080322265625, "global_step": 419396, "epoch": 5052} {"train_loss": -26.813690185546875, "global_step": 419397, "epoch": 5052} {"train_loss": -26.55678337740611, "global_step": 419398, "epoch": 5052, "val_loss": 6985349.0} {"train_loss": -25.028928756713867, "global_step": 419399, "epoch": 5053} {"train_loss": -24.716978073120117, "global_step": 419400, "epoch": 5053} {"train_loss": -24.29715347290039, "global_step": 419401, "epoch": 5053} {"train_loss": -25.797082901000977, "global_step": 419402, "epoch": 5053} {"train_loss": -25.95305824279785, "global_step": 419403, "epoch": 5053} {"train_loss": -25.1259765625, "global_step": 419404, "epoch": 5053} {"train_loss": -26.51814842224121, "global_step": 419405, "epoch": 5053} {"train_loss": -25.47127914428711, "global_step": 419406, "epoch": 5053} {"train_loss": -26.140827178955078, "global_step": 419407, "epoch": 5053} {"train_loss": -25.794538497924805, "global_step": 419408, "epoch": 5053} {"train_loss": -26.06548500061035, "global_step": 419409, "epoch": 5053} {"train_loss": -25.935571670532227, "global_step": 419410, "epoch": 5053} {"train_loss": -26.01251792907715, "global_step": 419411, "epoch": 5053} {"train_loss": -26.309473037719727, "global_step": 419412, "epoch": 5053} {"train_loss": -26.122329711914062, "global_step": 419413, "epoch": 5053} {"train_loss": -26.5172061920166, "global_step": 419414, "epoch": 5053} {"train_loss": -26.116138458251953, "global_step": 419415, "epoch": 5053} {"train_loss": -26.833999633789062, "global_step": 419416, "epoch": 5053} {"train_loss": -26.405786514282227, "global_step": 419417, "epoch": 5053} {"train_loss": -26.200210571289062, "global_step": 419418, "epoch": 5053} {"train_loss": -26.447851181030273, "global_step": 419419, "epoch": 5053} {"train_loss": -26.065649032592773, "global_step": 419420, "epoch": 5053} {"train_loss": -26.60938835144043, "global_step": 419421, "epoch": 5053} {"train_loss": -26.246931076049805, "global_step": 419422, "epoch": 5053} {"train_loss": -26.448896408081055, "global_step": 419423, "epoch": 5053} {"train_loss": -26.916309356689453, "global_step": 419424, "epoch": 5053} {"train_loss": -26.76321792602539, "global_step": 419425, "epoch": 5053} {"train_loss": -27.11311912536621, "global_step": 419426, "epoch": 5053} {"train_loss": -26.427961349487305, "global_step": 419427, "epoch": 5053} {"train_loss": -26.657636642456055, "global_step": 419428, "epoch": 5053} {"train_loss": -26.699542999267578, "global_step": 419429, "epoch": 5053} {"train_loss": -27.163837432861328, "global_step": 419430, "epoch": 5053} {"train_loss": -26.755720138549805, "global_step": 419431, "epoch": 5053} {"train_loss": -26.612878799438477, "global_step": 419432, "epoch": 5053} {"train_loss": -26.726760864257812, "global_step": 419433, "epoch": 5053} {"train_loss": -26.824451446533203, "global_step": 419434, "epoch": 5053} {"train_loss": -26.926544189453125, "global_step": 419435, "epoch": 5053} {"train_loss": -26.9146785736084, "global_step": 419436, "epoch": 5053} {"train_loss": -26.70473289489746, "global_step": 419437, "epoch": 5053} {"train_loss": -27.18092918395996, "global_step": 419438, "epoch": 5053} {"train_loss": -26.383243560791016, "global_step": 419439, "epoch": 5053} {"train_loss": -26.688751220703125, "global_step": 419440, "epoch": 5053} {"train_loss": -26.804697036743164, "global_step": 419441, "epoch": 5053} {"train_loss": -26.7725887298584, "global_step": 419442, "epoch": 5053} {"train_loss": -27.237884521484375, "global_step": 419443, "epoch": 5053} {"train_loss": -26.61495018005371, "global_step": 419444, "epoch": 5053} {"train_loss": -26.859546661376953, "global_step": 419445, "epoch": 5053} {"train_loss": -26.499134063720703, "global_step": 419446, "epoch": 5053} {"train_loss": -26.916532516479492, "global_step": 419447, "epoch": 5053} {"train_loss": -26.792816162109375, "global_step": 419448, "epoch": 5053} {"train_loss": -26.6092472076416, "global_step": 419449, "epoch": 5053} {"train_loss": -26.933149337768555, "global_step": 419450, "epoch": 5053} {"train_loss": -26.83245849609375, "global_step": 419451, "epoch": 5053} {"train_loss": -26.622344970703125, "global_step": 419452, "epoch": 5053} {"train_loss": -27.095727920532227, "global_step": 419453, "epoch": 5053} {"train_loss": -27.126708984375, "global_step": 419454, "epoch": 5053} {"train_loss": -26.520254135131836, "global_step": 419455, "epoch": 5053} {"train_loss": -27.115345001220703, "global_step": 419456, "epoch": 5053} {"train_loss": -26.869705200195312, "global_step": 419457, "epoch": 5053} {"train_loss": -26.969348907470703, "global_step": 419458, "epoch": 5053} {"train_loss": -26.836074829101562, "global_step": 419459, "epoch": 5053} {"train_loss": -27.05256462097168, "global_step": 419460, "epoch": 5053} {"train_loss": -26.80865478515625, "global_step": 419461, "epoch": 5053} {"train_loss": -26.846296310424805, "global_step": 419462, "epoch": 5053} {"train_loss": -27.176013946533203, "global_step": 419463, "epoch": 5053} {"train_loss": -26.934289932250977, "global_step": 419464, "epoch": 5053} {"train_loss": -27.18625259399414, "global_step": 419465, "epoch": 5053} {"train_loss": -27.13336753845215, "global_step": 419466, "epoch": 5053} {"train_loss": -27.04530143737793, "global_step": 419467, "epoch": 5053} {"train_loss": -26.9594669342041, "global_step": 419468, "epoch": 5053} {"train_loss": -27.029844284057617, "global_step": 419469, "epoch": 5053} {"train_loss": -26.855756759643555, "global_step": 419470, "epoch": 5053} {"train_loss": -26.76227378845215, "global_step": 419471, "epoch": 5053} {"train_loss": -26.74298667907715, "global_step": 419472, "epoch": 5053} {"train_loss": -26.992780685424805, "global_step": 419473, "epoch": 5053} {"train_loss": -26.918533325195312, "global_step": 419474, "epoch": 5053} {"train_loss": -27.074665069580078, "global_step": 419475, "epoch": 5053} {"train_loss": -26.758249282836914, "global_step": 419476, "epoch": 5053} {"train_loss": -26.57073974609375, "global_step": 419477, "epoch": 5053} {"train_loss": -26.41208267211914, "global_step": 419478, "epoch": 5053} {"train_loss": -26.428625106811523, "global_step": 419479, "epoch": 5053} {"train_loss": -26.786396026611328, "global_step": 419480, "epoch": 5053} {"train_loss": -26.595888482518944, "global_step": 419481, "epoch": 5053, "val_loss": 6923935.0} {"train_loss": -22.848846435546875, "global_step": 419482, "epoch": 5054} {"train_loss": -24.49945640563965, "global_step": 419483, "epoch": 5054} {"train_loss": -25.429290771484375, "global_step": 419484, "epoch": 5054} {"train_loss": -25.234745025634766, "global_step": 419485, "epoch": 5054} {"train_loss": -25.1479549407959, "global_step": 419486, "epoch": 5054} {"train_loss": -25.36871337890625, "global_step": 419487, "epoch": 5054} {"train_loss": -25.967880249023438, "global_step": 419488, "epoch": 5054} {"train_loss": -25.6187801361084, "global_step": 419489, "epoch": 5054} {"train_loss": -25.91560173034668, "global_step": 419490, "epoch": 5054} {"train_loss": -25.662988662719727, "global_step": 419491, "epoch": 5054} {"train_loss": -25.607519149780273, "global_step": 419492, "epoch": 5054} {"train_loss": -26.20136833190918, "global_step": 419493, "epoch": 5054} {"train_loss": -26.034048080444336, "global_step": 419494, "epoch": 5054} {"train_loss": -25.9443359375, "global_step": 419495, "epoch": 5054} {"train_loss": -26.012725830078125, "global_step": 419496, "epoch": 5054} {"train_loss": -25.7371768951416, "global_step": 419497, "epoch": 5054} {"train_loss": -25.9168643951416, "global_step": 419498, "epoch": 5054} {"train_loss": -26.049972534179688, "global_step": 419499, "epoch": 5054} {"train_loss": -26.026594161987305, "global_step": 419500, "epoch": 5054} {"train_loss": -25.516082763671875, "global_step": 419501, "epoch": 5054} {"train_loss": -25.8174991607666, "global_step": 419502, "epoch": 5054} {"train_loss": -26.30413246154785, "global_step": 419503, "epoch": 5054} {"train_loss": -26.214685440063477, "global_step": 419504, "epoch": 5054} {"train_loss": -25.96137809753418, "global_step": 419505, "epoch": 5054} {"train_loss": -26.382598876953125, "global_step": 419506, "epoch": 5054} {"train_loss": -26.236820220947266, "global_step": 419507, "epoch": 5054} {"train_loss": -26.2219295501709, "global_step": 419508, "epoch": 5054} {"train_loss": -26.503971099853516, "global_step": 419509, "epoch": 5054} {"train_loss": -26.619403839111328, "global_step": 419510, "epoch": 5054} {"train_loss": -26.63324546813965, "global_step": 419511, "epoch": 5054} {"train_loss": -26.35682487487793, "global_step": 419512, "epoch": 5054} {"train_loss": -26.136260986328125, "global_step": 419513, "epoch": 5054} {"train_loss": -26.722564697265625, "global_step": 419514, "epoch": 5054} {"train_loss": -26.424697875976562, "global_step": 419515, "epoch": 5054} {"train_loss": -26.39808464050293, "global_step": 419516, "epoch": 5054} {"train_loss": -26.434463500976562, "global_step": 419517, "epoch": 5054} {"train_loss": -26.98712158203125, "global_step": 419518, "epoch": 5054} {"train_loss": -26.5865478515625, "global_step": 419519, "epoch": 5054} {"train_loss": -26.518102645874023, "global_step": 419520, "epoch": 5054} {"train_loss": -26.65874671936035, "global_step": 419521, "epoch": 5054} {"train_loss": -26.660629272460938, "global_step": 419522, "epoch": 5054} {"train_loss": -26.562788009643555, "global_step": 419523, "epoch": 5054} {"train_loss": -26.858539581298828, "global_step": 419524, "epoch": 5054} {"train_loss": -26.96150779724121, "global_step": 419525, "epoch": 5054} {"train_loss": -26.352405548095703, "global_step": 419526, "epoch": 5054} {"train_loss": -26.541248321533203, "global_step": 419527, "epoch": 5054} {"train_loss": -26.814441680908203, "global_step": 419528, "epoch": 5054} {"train_loss": -26.918989181518555, "global_step": 419529, "epoch": 5054} {"train_loss": -27.148502349853516, "global_step": 419530, "epoch": 5054} {"train_loss": -27.052045822143555, "global_step": 419531, "epoch": 5054} {"train_loss": -26.58443260192871, "global_step": 419532, "epoch": 5054} {"train_loss": -26.9090576171875, "global_step": 419533, "epoch": 5054} {"train_loss": -26.791534423828125, "global_step": 419534, "epoch": 5054} {"train_loss": -26.737457275390625, "global_step": 419535, "epoch": 5054} {"train_loss": -26.8231143951416, "global_step": 419536, "epoch": 5054} {"train_loss": -26.737817764282227, "global_step": 419537, "epoch": 5054} {"train_loss": -26.982471466064453, "global_step": 419538, "epoch": 5054} {"train_loss": -27.13739013671875, "global_step": 419539, "epoch": 5054} {"train_loss": -27.014545440673828, "global_step": 419540, "epoch": 5054} {"train_loss": -26.971769332885742, "global_step": 419541, "epoch": 5054} {"train_loss": -26.952497482299805, "global_step": 419542, "epoch": 5054} {"train_loss": -26.770883560180664, "global_step": 419543, "epoch": 5054} {"train_loss": -26.953649520874023, "global_step": 419544, "epoch": 5054} {"train_loss": -26.99039649963379, "global_step": 419545, "epoch": 5054} {"train_loss": -27.214059829711914, "global_step": 419546, "epoch": 5054} {"train_loss": -26.998218536376953, "global_step": 419547, "epoch": 5054} {"train_loss": -27.2710018157959, "global_step": 419548, "epoch": 5054} {"train_loss": -26.7556209564209, "global_step": 419549, "epoch": 5054} {"train_loss": -26.97004508972168, "global_step": 419550, "epoch": 5054} {"train_loss": -27.12091636657715, "global_step": 419551, "epoch": 5054} {"train_loss": -27.160837173461914, "global_step": 419552, "epoch": 5054} {"train_loss": -27.0364990234375, "global_step": 419553, "epoch": 5054} {"train_loss": -27.00886344909668, "global_step": 419554, "epoch": 5054} {"train_loss": -26.65640640258789, "global_step": 419555, "epoch": 5054} {"train_loss": -26.8896541595459, "global_step": 419556, "epoch": 5054} {"train_loss": -26.929330825805664, "global_step": 419557, "epoch": 5054} {"train_loss": -27.22647476196289, "global_step": 419558, "epoch": 5054} {"train_loss": -27.1899471282959, "global_step": 419559, "epoch": 5054} {"train_loss": -26.994094848632812, "global_step": 419560, "epoch": 5054} {"train_loss": -26.710920333862305, "global_step": 419561, "epoch": 5054} {"train_loss": -26.501413345336914, "global_step": 419562, "epoch": 5054} {"train_loss": -25.840045928955078, "global_step": 419563, "epoch": 5054} {"train_loss": -26.432117186396955, "global_step": 419564, "epoch": 5054, "val_loss": 6951533.0} {"train_loss": -21.150474548339844, "global_step": 419565, "epoch": 5055} {"train_loss": -23.71875762939453, "global_step": 419566, "epoch": 5055} {"train_loss": -25.236297607421875, "global_step": 419567, "epoch": 5055} {"train_loss": -23.855609893798828, "global_step": 419568, "epoch": 5055} {"train_loss": -25.04787254333496, "global_step": 419569, "epoch": 5055} {"train_loss": -25.053482055664062, "global_step": 419570, "epoch": 5055} {"train_loss": -25.219369888305664, "global_step": 419571, "epoch": 5055} {"train_loss": -25.490575790405273, "global_step": 419572, "epoch": 5055} {"train_loss": -25.74557876586914, "global_step": 419573, "epoch": 5055} {"train_loss": -25.56345558166504, "global_step": 419574, "epoch": 5055} {"train_loss": -25.002033233642578, "global_step": 419575, "epoch": 5055} {"train_loss": -25.69996452331543, "global_step": 419576, "epoch": 5055} {"train_loss": -25.68768882751465, "global_step": 419577, "epoch": 5055} {"train_loss": -25.581480026245117, "global_step": 419578, "epoch": 5055} {"train_loss": -25.982318878173828, "global_step": 419579, "epoch": 5055} {"train_loss": -25.839248657226562, "global_step": 419580, "epoch": 5055} {"train_loss": -25.685041427612305, "global_step": 419581, "epoch": 5055} {"train_loss": -25.942594528198242, "global_step": 419582, "epoch": 5055} {"train_loss": -25.95070457458496, "global_step": 419583, "epoch": 5055} {"train_loss": -26.041406631469727, "global_step": 419584, "epoch": 5055} {"train_loss": -26.336816787719727, "global_step": 419585, "epoch": 5055} {"train_loss": -25.9699764251709, "global_step": 419586, "epoch": 5055} {"train_loss": -25.878707885742188, "global_step": 419587, "epoch": 5055} {"train_loss": -25.927597045898438, "global_step": 419588, "epoch": 5055} {"train_loss": -25.82978630065918, "global_step": 419589, "epoch": 5055} {"train_loss": -26.06074333190918, "global_step": 419590, "epoch": 5055} {"train_loss": -26.193098068237305, "global_step": 419591, "epoch": 5055} {"train_loss": -26.08035659790039, "global_step": 419592, "epoch": 5055} {"train_loss": -26.04819107055664, "global_step": 419593, "epoch": 5055} {"train_loss": -26.250288009643555, "global_step": 419594, "epoch": 5055} {"train_loss": -26.741098403930664, "global_step": 419595, "epoch": 5055} {"train_loss": -26.15011978149414, "global_step": 419596, "epoch": 5055} {"train_loss": -26.29766845703125, "global_step": 419597, "epoch": 5055} {"train_loss": -26.029382705688477, "global_step": 419598, "epoch": 5055} {"train_loss": -26.277151107788086, "global_step": 419599, "epoch": 5055} {"train_loss": -26.518308639526367, "global_step": 419600, "epoch": 5055} {"train_loss": -26.554584503173828, "global_step": 419601, "epoch": 5055} {"train_loss": -26.136627197265625, "global_step": 419602, "epoch": 5055} {"train_loss": -26.725147247314453, "global_step": 419603, "epoch": 5055} {"train_loss": -26.7867488861084, "global_step": 419604, "epoch": 5055} {"train_loss": -26.32221031188965, "global_step": 419605, "epoch": 5055} {"train_loss": -26.78899574279785, "global_step": 419606, "epoch": 5055} {"train_loss": -26.472885131835938, "global_step": 419607, "epoch": 5055} {"train_loss": -26.754053115844727, "global_step": 419608, "epoch": 5055} {"train_loss": -26.466873168945312, "global_step": 419609, "epoch": 5055} {"train_loss": -26.7913875579834, "global_step": 419610, "epoch": 5055} {"train_loss": -26.971593856811523, "global_step": 419611, "epoch": 5055} {"train_loss": -26.638635635375977, "global_step": 419612, "epoch": 5055} {"train_loss": -26.66529655456543, "global_step": 419613, "epoch": 5055} {"train_loss": -26.73438835144043, "global_step": 419614, "epoch": 5055} {"train_loss": -26.4748477935791, "global_step": 419615, "epoch": 5055} {"train_loss": -26.739307403564453, "global_step": 419616, "epoch": 5055} {"train_loss": -26.90768814086914, "global_step": 419617, "epoch": 5055} {"train_loss": -26.77937126159668, "global_step": 419618, "epoch": 5055} {"train_loss": -26.547338485717773, "global_step": 419619, "epoch": 5055} {"train_loss": -26.8439884185791, "global_step": 419620, "epoch": 5055} {"train_loss": -26.7834529876709, "global_step": 419621, "epoch": 5055} {"train_loss": -26.468896865844727, "global_step": 419622, "epoch": 5055} {"train_loss": -26.975677490234375, "global_step": 419623, "epoch": 5055} {"train_loss": -26.636022567749023, "global_step": 419624, "epoch": 5055} {"train_loss": -26.27936363220215, "global_step": 419625, "epoch": 5055} {"train_loss": -26.574682235717773, "global_step": 419626, "epoch": 5055} {"train_loss": -26.609222412109375, "global_step": 419627, "epoch": 5055} {"train_loss": -26.660276412963867, "global_step": 419628, "epoch": 5055} {"train_loss": -26.263141632080078, "global_step": 419629, "epoch": 5055} {"train_loss": -26.496667861938477, "global_step": 419630, "epoch": 5055} {"train_loss": -26.175495147705078, "global_step": 419631, "epoch": 5055} {"train_loss": -26.931745529174805, "global_step": 419632, "epoch": 5055} {"train_loss": -26.712371826171875, "global_step": 419633, "epoch": 5055} {"train_loss": -26.627653121948242, "global_step": 419634, "epoch": 5055} {"train_loss": -26.807538986206055, "global_step": 419635, "epoch": 5055} {"train_loss": -26.725006103515625, "global_step": 419636, "epoch": 5055} {"train_loss": -26.504459381103516, "global_step": 419637, "epoch": 5055} {"train_loss": -26.708728790283203, "global_step": 419638, "epoch": 5055} {"train_loss": -26.59807777404785, "global_step": 419639, "epoch": 5055} {"train_loss": -26.674955368041992, "global_step": 419640, "epoch": 5055} {"train_loss": -26.75984001159668, "global_step": 419641, "epoch": 5055} {"train_loss": -26.938369750976562, "global_step": 419642, "epoch": 5055} {"train_loss": -26.590803146362305, "global_step": 419643, "epoch": 5055} {"train_loss": -27.066009521484375, "global_step": 419644, "epoch": 5055} {"train_loss": -26.642297744750977, "global_step": 419645, "epoch": 5055} {"train_loss": -26.601133346557617, "global_step": 419646, "epoch": 5055} {"train_loss": -26.194058636584913, "global_step": 419647, "epoch": 5055, "val_loss": 6898531.5} {"train_loss": -26.572546005249023, "global_step": 419648, "epoch": 5056} {"train_loss": -26.328847885131836, "global_step": 419649, "epoch": 5056} {"train_loss": -26.48333168029785, "global_step": 419650, "epoch": 5056} {"train_loss": -26.462324142456055, "global_step": 419651, "epoch": 5056} {"train_loss": -26.3524227142334, "global_step": 419652, "epoch": 5056} {"train_loss": -25.882516860961914, "global_step": 419653, "epoch": 5056} {"train_loss": -26.525495529174805, "global_step": 419654, "epoch": 5056} {"train_loss": -26.48940086364746, "global_step": 419655, "epoch": 5056} {"train_loss": -26.57075309753418, "global_step": 419656, "epoch": 5056} {"train_loss": -26.621789932250977, "global_step": 419657, "epoch": 5056} {"train_loss": -26.793737411499023, "global_step": 419658, "epoch": 5056} {"train_loss": -26.8582706451416, "global_step": 419659, "epoch": 5056} {"train_loss": -26.355792999267578, "global_step": 419660, "epoch": 5056} {"train_loss": -26.809885025024414, "global_step": 419661, "epoch": 5056} {"train_loss": -26.4775333404541, "global_step": 419662, "epoch": 5056} {"train_loss": -26.856159210205078, "global_step": 419663, "epoch": 5056} {"train_loss": -26.481338500976562, "global_step": 419664, "epoch": 5056} {"train_loss": -26.502798080444336, "global_step": 419665, "epoch": 5056} {"train_loss": -26.8223819732666, "global_step": 419666, "epoch": 5056} {"train_loss": -26.57112693786621, "global_step": 419667, "epoch": 5056} {"train_loss": -26.56598472595215, "global_step": 419668, "epoch": 5056} {"train_loss": -26.521032333374023, "global_step": 419669, "epoch": 5056} {"train_loss": -26.74701499938965, "global_step": 419670, "epoch": 5056} {"train_loss": -27.002843856811523, "global_step": 419671, "epoch": 5056} {"train_loss": -26.781415939331055, "global_step": 419672, "epoch": 5056} {"train_loss": -26.905797958374023, "global_step": 419673, "epoch": 5056} {"train_loss": -26.968530654907227, "global_step": 419674, "epoch": 5056} {"train_loss": -26.913461685180664, "global_step": 419675, "epoch": 5056} {"train_loss": -26.805448532104492, "global_step": 419676, "epoch": 5056} {"train_loss": -26.96809959411621, "global_step": 419677, "epoch": 5056} {"train_loss": -26.951175689697266, "global_step": 419678, "epoch": 5056} {"train_loss": -26.98016357421875, "global_step": 419679, "epoch": 5056} {"train_loss": -26.844409942626953, "global_step": 419680, "epoch": 5056} {"train_loss": -26.648208618164062, "global_step": 419681, "epoch": 5056} {"train_loss": -27.124603271484375, "global_step": 419682, "epoch": 5056} {"train_loss": -26.49684715270996, "global_step": 419683, "epoch": 5056} {"train_loss": -27.335987091064453, "global_step": 419684, "epoch": 5056} {"train_loss": -26.729816436767578, "global_step": 419685, "epoch": 5056} {"train_loss": -26.91424560546875, "global_step": 419686, "epoch": 5056} {"train_loss": -27.115447998046875, "global_step": 419687, "epoch": 5056} {"train_loss": -26.699254989624023, "global_step": 419688, "epoch": 5056} {"train_loss": -26.92947769165039, "global_step": 419689, "epoch": 5056} {"train_loss": -26.87603187561035, "global_step": 419690, "epoch": 5056} {"train_loss": -27.4056453704834, "global_step": 419691, "epoch": 5056} {"train_loss": -26.996875762939453, "global_step": 419692, "epoch": 5056} {"train_loss": -26.961694717407227, "global_step": 419693, "epoch": 5056} {"train_loss": -27.21493911743164, "global_step": 419694, "epoch": 5056} {"train_loss": -26.88325309753418, "global_step": 419695, "epoch": 5056} {"train_loss": -27.06085777282715, "global_step": 419696, "epoch": 5056} {"train_loss": -26.98565673828125, "global_step": 419697, "epoch": 5056} {"train_loss": -27.07451820373535, "global_step": 419698, "epoch": 5056} {"train_loss": -27.285221099853516, "global_step": 419699, "epoch": 5056} {"train_loss": -26.729108810424805, "global_step": 419700, "epoch": 5056} {"train_loss": -26.766071319580078, "global_step": 419701, "epoch": 5056} {"train_loss": -27.268766403198242, "global_step": 419702, "epoch": 5056} {"train_loss": -27.14996910095215, "global_step": 419703, "epoch": 5056} {"train_loss": -27.12843132019043, "global_step": 419704, "epoch": 5056} {"train_loss": -26.9589900970459, "global_step": 419705, "epoch": 5056} {"train_loss": -26.76584815979004, "global_step": 419706, "epoch": 5056} {"train_loss": -26.943185806274414, "global_step": 419707, "epoch": 5056} {"train_loss": -27.262048721313477, "global_step": 419708, "epoch": 5056} {"train_loss": -26.45511245727539, "global_step": 419709, "epoch": 5056} {"train_loss": -26.937326431274414, "global_step": 419710, "epoch": 5056} {"train_loss": -26.71760368347168, "global_step": 419711, "epoch": 5056} {"train_loss": -26.680007934570312, "global_step": 419712, "epoch": 5056} {"train_loss": -27.132558822631836, "global_step": 419713, "epoch": 5056} {"train_loss": -26.987897872924805, "global_step": 419714, "epoch": 5056} {"train_loss": -27.350696563720703, "global_step": 419715, "epoch": 5056} {"train_loss": -27.01214599609375, "global_step": 419716, "epoch": 5056} {"train_loss": -26.900922775268555, "global_step": 419717, "epoch": 5056} {"train_loss": -26.98593521118164, "global_step": 419718, "epoch": 5056} {"train_loss": -26.540969848632812, "global_step": 419719, "epoch": 5056} {"train_loss": -26.879987716674805, "global_step": 419720, "epoch": 5056} {"train_loss": -27.1044864654541, "global_step": 419721, "epoch": 5056} {"train_loss": -26.88724136352539, "global_step": 419722, "epoch": 5056} {"train_loss": -26.546558380126953, "global_step": 419723, "epoch": 5056} {"train_loss": -26.895282745361328, "global_step": 419724, "epoch": 5056} {"train_loss": -27.15851402282715, "global_step": 419725, "epoch": 5056} {"train_loss": -26.88838005065918, "global_step": 419726, "epoch": 5056} {"train_loss": -26.564294815063477, "global_step": 419727, "epoch": 5056} {"train_loss": -27.195016860961914, "global_step": 419728, "epoch": 5056} {"train_loss": -26.751911163330078, "global_step": 419729, "epoch": 5056} {"train_loss": -26.830602990575585, "global_step": 419730, "epoch": 5056, "val_loss": 7008133.0} {"train_loss": -25.44817543029785, "global_step": 419731, "epoch": 5057} {"train_loss": -21.5120792388916, "global_step": 419732, "epoch": 5057} {"train_loss": -17.090717315673828, "global_step": 419733, "epoch": 5057} {"train_loss": -24.429990768432617, "global_step": 419734, "epoch": 5057} {"train_loss": -20.145139694213867, "global_step": 419735, "epoch": 5057} {"train_loss": -23.655887603759766, "global_step": 419736, "epoch": 5057} {"train_loss": -21.83046531677246, "global_step": 419737, "epoch": 5057} {"train_loss": -23.939071655273438, "global_step": 419738, "epoch": 5057} {"train_loss": -23.70454216003418, "global_step": 419739, "epoch": 5057} {"train_loss": -23.599950790405273, "global_step": 419740, "epoch": 5057} {"train_loss": -24.321796417236328, "global_step": 419741, "epoch": 5057} {"train_loss": -25.04519271850586, "global_step": 419742, "epoch": 5057} {"train_loss": -24.639469146728516, "global_step": 419743, "epoch": 5057} {"train_loss": -24.435775756835938, "global_step": 419744, "epoch": 5057} {"train_loss": -25.01604652404785, "global_step": 419745, "epoch": 5057} {"train_loss": -25.3096866607666, "global_step": 419746, "epoch": 5057} {"train_loss": -25.1320858001709, "global_step": 419747, "epoch": 5057} {"train_loss": -24.94313621520996, "global_step": 419748, "epoch": 5057} {"train_loss": -25.155719757080078, "global_step": 419749, "epoch": 5057} {"train_loss": -25.23969268798828, "global_step": 419750, "epoch": 5057} {"train_loss": -25.524423599243164, "global_step": 419751, "epoch": 5057} {"train_loss": -24.968915939331055, "global_step": 419752, "epoch": 5057} {"train_loss": -25.192556381225586, "global_step": 419753, "epoch": 5057} {"train_loss": -25.26368522644043, "global_step": 419754, "epoch": 5057} {"train_loss": -25.445194244384766, "global_step": 419755, "epoch": 5057} {"train_loss": -25.447465896606445, "global_step": 419756, "epoch": 5057} {"train_loss": -25.29612159729004, "global_step": 419757, "epoch": 5057} {"train_loss": -25.665029525756836, "global_step": 419758, "epoch": 5057} {"train_loss": -25.4470272064209, "global_step": 419759, "epoch": 5057} {"train_loss": -25.525901794433594, "global_step": 419760, "epoch": 5057} {"train_loss": -25.496793746948242, "global_step": 419761, "epoch": 5057} {"train_loss": -25.554893493652344, "global_step": 419762, "epoch": 5057} {"train_loss": -25.49366569519043, "global_step": 419763, "epoch": 5057} {"train_loss": -25.88972282409668, "global_step": 419764, "epoch": 5057} {"train_loss": -25.77552604675293, "global_step": 419765, "epoch": 5057} {"train_loss": -26.1021785736084, "global_step": 419766, "epoch": 5057} {"train_loss": -25.955053329467773, "global_step": 419767, "epoch": 5057} {"train_loss": -26.0577449798584, "global_step": 419768, "epoch": 5057} {"train_loss": -25.749637603759766, "global_step": 419769, "epoch": 5057} {"train_loss": -25.924253463745117, "global_step": 419770, "epoch": 5057} {"train_loss": -26.338058471679688, "global_step": 419771, "epoch": 5057} {"train_loss": -26.280536651611328, "global_step": 419772, "epoch": 5057} {"train_loss": -26.550445556640625, "global_step": 419773, "epoch": 5057} {"train_loss": -26.2412052154541, "global_step": 419774, "epoch": 5057} {"train_loss": -26.338590621948242, "global_step": 419775, "epoch": 5057} {"train_loss": -26.319990158081055, "global_step": 419776, "epoch": 5057} {"train_loss": -26.499755859375, "global_step": 419777, "epoch": 5057} {"train_loss": -26.481443405151367, "global_step": 419778, "epoch": 5057} {"train_loss": -26.30929946899414, "global_step": 419779, "epoch": 5057} {"train_loss": -26.448144912719727, "global_step": 419780, "epoch": 5057} {"train_loss": -26.387027740478516, "global_step": 419781, "epoch": 5057} {"train_loss": -26.86752700805664, "global_step": 419782, "epoch": 5057} {"train_loss": -26.51177978515625, "global_step": 419783, "epoch": 5057} {"train_loss": -26.6420955657959, "global_step": 419784, "epoch": 5057} {"train_loss": -26.718542098999023, "global_step": 419785, "epoch": 5057} {"train_loss": -26.065725326538086, "global_step": 419786, "epoch": 5057} {"train_loss": -26.564268112182617, "global_step": 419787, "epoch": 5057} {"train_loss": -26.361286163330078, "global_step": 419788, "epoch": 5057} {"train_loss": -26.595657348632812, "global_step": 419789, "epoch": 5057} {"train_loss": -26.32388687133789, "global_step": 419790, "epoch": 5057} {"train_loss": -26.547504425048828, "global_step": 419791, "epoch": 5057} {"train_loss": -26.607757568359375, "global_step": 419792, "epoch": 5057} {"train_loss": -26.647729873657227, "global_step": 419793, "epoch": 5057} {"train_loss": -26.707578659057617, "global_step": 419794, "epoch": 5057} {"train_loss": -26.69575309753418, "global_step": 419795, "epoch": 5057} {"train_loss": -26.907825469970703, "global_step": 419796, "epoch": 5057} {"train_loss": -26.656356811523438, "global_step": 419797, "epoch": 5057} {"train_loss": -26.770200729370117, "global_step": 419798, "epoch": 5057} {"train_loss": -26.896106719970703, "global_step": 419799, "epoch": 5057} {"train_loss": -26.61994743347168, "global_step": 419800, "epoch": 5057} {"train_loss": -26.843463897705078, "global_step": 419801, "epoch": 5057} {"train_loss": -27.10548210144043, "global_step": 419802, "epoch": 5057} {"train_loss": -26.735044479370117, "global_step": 419803, "epoch": 5057} {"train_loss": -26.52127456665039, "global_step": 419804, "epoch": 5057} {"train_loss": -27.0076961517334, "global_step": 419805, "epoch": 5057} {"train_loss": -27.063751220703125, "global_step": 419806, "epoch": 5057} {"train_loss": -26.98084831237793, "global_step": 419807, "epoch": 5057} {"train_loss": -26.833221435546875, "global_step": 419808, "epoch": 5057} {"train_loss": -26.880481719970703, "global_step": 419809, "epoch": 5057} {"train_loss": -26.19329833984375, "global_step": 419810, "epoch": 5057} {"train_loss": -26.780872344970703, "global_step": 419811, "epoch": 5057} {"train_loss": -26.935720443725586, "global_step": 419812, "epoch": 5057} {"train_loss": -25.666822065790015, "global_step": 419813, "epoch": 5057, "val_loss": 6913270.5} {"train_loss": -25.924901962280273, "global_step": 419814, "epoch": 5058} {"train_loss": -25.903430938720703, "global_step": 419815, "epoch": 5058} {"train_loss": -26.099109649658203, "global_step": 419816, "epoch": 5058} {"train_loss": -26.471464157104492, "global_step": 419817, "epoch": 5058} {"train_loss": -26.222497940063477, "global_step": 419818, "epoch": 5058} {"train_loss": -25.905902862548828, "global_step": 419819, "epoch": 5058} {"train_loss": -26.37153434753418, "global_step": 419820, "epoch": 5058} {"train_loss": -26.29654312133789, "global_step": 419821, "epoch": 5058} {"train_loss": -26.02138328552246, "global_step": 419822, "epoch": 5058} {"train_loss": -26.407861709594727, "global_step": 419823, "epoch": 5058} {"train_loss": -26.618322372436523, "global_step": 419824, "epoch": 5058} {"train_loss": -26.414794921875, "global_step": 419825, "epoch": 5058} {"train_loss": -26.846689224243164, "global_step": 419826, "epoch": 5058} {"train_loss": -26.707395553588867, "global_step": 419827, "epoch": 5058} {"train_loss": -27.017602920532227, "global_step": 419828, "epoch": 5058} {"train_loss": -26.798242568969727, "global_step": 419829, "epoch": 5058} {"train_loss": -26.937955856323242, "global_step": 419830, "epoch": 5058} {"train_loss": -26.23974609375, "global_step": 419831, "epoch": 5058} {"train_loss": -26.585651397705078, "global_step": 419832, "epoch": 5058} {"train_loss": -26.789691925048828, "global_step": 419833, "epoch": 5058} {"train_loss": -26.844867706298828, "global_step": 419834, "epoch": 5058} {"train_loss": -26.491622924804688, "global_step": 419835, "epoch": 5058} {"train_loss": -26.698827743530273, "global_step": 419836, "epoch": 5058} {"train_loss": -26.921594619750977, "global_step": 419837, "epoch": 5058} {"train_loss": -27.027423858642578, "global_step": 419838, "epoch": 5058} {"train_loss": -26.99273681640625, "global_step": 419839, "epoch": 5058} {"train_loss": -26.673999786376953, "global_step": 419840, "epoch": 5058} {"train_loss": -26.6712646484375, "global_step": 419841, "epoch": 5058} {"train_loss": -26.79151725769043, "global_step": 419842, "epoch": 5058} {"train_loss": -26.679737091064453, "global_step": 419843, "epoch": 5058} {"train_loss": -26.980093002319336, "global_step": 419844, "epoch": 5058} {"train_loss": -26.90484619140625, "global_step": 419845, "epoch": 5058} {"train_loss": -26.597976684570312, "global_step": 419846, "epoch": 5058} {"train_loss": -27.059467315673828, "global_step": 419847, "epoch": 5058} {"train_loss": -26.979528427124023, "global_step": 419848, "epoch": 5058} {"train_loss": -27.005218505859375, "global_step": 419849, "epoch": 5058} {"train_loss": -27.00581932067871, "global_step": 419850, "epoch": 5058} {"train_loss": -26.808673858642578, "global_step": 419851, "epoch": 5058} {"train_loss": -27.148548126220703, "global_step": 419852, "epoch": 5058} {"train_loss": -27.08066177368164, "global_step": 419853, "epoch": 5058} {"train_loss": -26.810388565063477, "global_step": 419854, "epoch": 5058} {"train_loss": -26.827869415283203, "global_step": 419855, "epoch": 5058} {"train_loss": -26.823822021484375, "global_step": 419856, "epoch": 5058} {"train_loss": -26.728185653686523, "global_step": 419857, "epoch": 5058} {"train_loss": -26.83591651916504, "global_step": 419858, "epoch": 5058} {"train_loss": -26.894559860229492, "global_step": 419859, "epoch": 5058} {"train_loss": -27.164520263671875, "global_step": 419860, "epoch": 5058} {"train_loss": -26.616140365600586, "global_step": 419861, "epoch": 5058} {"train_loss": -27.297412872314453, "global_step": 419862, "epoch": 5058} {"train_loss": -26.858789443969727, "global_step": 419863, "epoch": 5058} {"train_loss": -26.998443603515625, "global_step": 419864, "epoch": 5058} {"train_loss": -26.841094970703125, "global_step": 419865, "epoch": 5058} {"train_loss": -26.93877601623535, "global_step": 419866, "epoch": 5058} {"train_loss": -26.75311279296875, "global_step": 419867, "epoch": 5058} {"train_loss": -26.7003231048584, "global_step": 419868, "epoch": 5058} {"train_loss": -26.73297691345215, "global_step": 419869, "epoch": 5058} {"train_loss": -26.933439254760742, "global_step": 419870, "epoch": 5058} {"train_loss": -26.46435546875, "global_step": 419871, "epoch": 5058} {"train_loss": -26.902578353881836, "global_step": 419872, "epoch": 5058} {"train_loss": -26.64495277404785, "global_step": 419873, "epoch": 5058} {"train_loss": -26.9436092376709, "global_step": 419874, "epoch": 5058} {"train_loss": -26.97174072265625, "global_step": 419875, "epoch": 5058} {"train_loss": -26.94093132019043, "global_step": 419876, "epoch": 5058} {"train_loss": -26.867538452148438, "global_step": 419877, "epoch": 5058} {"train_loss": -27.01263999938965, "global_step": 419878, "epoch": 5058} {"train_loss": -26.78694725036621, "global_step": 419879, "epoch": 5058} {"train_loss": -26.753662109375, "global_step": 419880, "epoch": 5058} {"train_loss": -27.02326011657715, "global_step": 419881, "epoch": 5058} {"train_loss": -26.957181930541992, "global_step": 419882, "epoch": 5058} {"train_loss": -26.823068618774414, "global_step": 419883, "epoch": 5058} {"train_loss": -27.071578979492188, "global_step": 419884, "epoch": 5058} {"train_loss": -26.53425407409668, "global_step": 419885, "epoch": 5058} {"train_loss": -26.642444610595703, "global_step": 419886, "epoch": 5058} {"train_loss": -26.700733184814453, "global_step": 419887, "epoch": 5058} {"train_loss": -26.86590003967285, "global_step": 419888, "epoch": 5058} {"train_loss": -27.006961822509766, "global_step": 419889, "epoch": 5058} {"train_loss": -26.899707794189453, "global_step": 419890, "epoch": 5058} {"train_loss": -26.9825382232666, "global_step": 419891, "epoch": 5058} {"train_loss": -27.00465965270996, "global_step": 419892, "epoch": 5058} {"train_loss": -26.71695899963379, "global_step": 419893, "epoch": 5058} {"train_loss": -27.10793113708496, "global_step": 419894, "epoch": 5058} {"train_loss": -27.163257598876953, "global_step": 419895, "epoch": 5058} {"train_loss": -26.76632035496723, "global_step": 419896, "epoch": 5058, "val_loss": 6911066.5} {"train_loss": -25.242040634155273, "global_step": 419897, "epoch": 5059} {"train_loss": -21.812973022460938, "global_step": 419898, "epoch": 5059} {"train_loss": -25.6488037109375, "global_step": 419899, "epoch": 5059} {"train_loss": -23.961217880249023, "global_step": 419900, "epoch": 5059} {"train_loss": -25.873931884765625, "global_step": 419901, "epoch": 5059} {"train_loss": -24.619482040405273, "global_step": 419902, "epoch": 5059} {"train_loss": -26.29041862487793, "global_step": 419903, "epoch": 5059} {"train_loss": -25.391077041625977, "global_step": 419904, "epoch": 5059} {"train_loss": -25.532453536987305, "global_step": 419905, "epoch": 5059} {"train_loss": -25.8355712890625, "global_step": 419906, "epoch": 5059} {"train_loss": -26.170215606689453, "global_step": 419907, "epoch": 5059} {"train_loss": -25.747968673706055, "global_step": 419908, "epoch": 5059} {"train_loss": -26.01665687561035, "global_step": 419909, "epoch": 5059} {"train_loss": -26.19304847717285, "global_step": 419910, "epoch": 5059} {"train_loss": -26.055404663085938, "global_step": 419911, "epoch": 5059} {"train_loss": -26.188648223876953, "global_step": 419912, "epoch": 5059} {"train_loss": -25.834699630737305, "global_step": 419913, "epoch": 5059} {"train_loss": -26.265216827392578, "global_step": 419914, "epoch": 5059} {"train_loss": -26.349706649780273, "global_step": 419915, "epoch": 5059} {"train_loss": -26.4837589263916, "global_step": 419916, "epoch": 5059} {"train_loss": -26.105676651000977, "global_step": 419917, "epoch": 5059} {"train_loss": -26.596776962280273, "global_step": 419918, "epoch": 5059} {"train_loss": -26.1523380279541, "global_step": 419919, "epoch": 5059} {"train_loss": -26.596158981323242, "global_step": 419920, "epoch": 5059} {"train_loss": -26.46473503112793, "global_step": 419921, "epoch": 5059} {"train_loss": -26.237817764282227, "global_step": 419922, "epoch": 5059} {"train_loss": -26.211530685424805, "global_step": 419923, "epoch": 5059} {"train_loss": -26.4226016998291, "global_step": 419924, "epoch": 5059} {"train_loss": -26.58258628845215, "global_step": 419925, "epoch": 5059} {"train_loss": -26.688261032104492, "global_step": 419926, "epoch": 5059} {"train_loss": -26.533185958862305, "global_step": 419927, "epoch": 5059} {"train_loss": -26.4894962310791, "global_step": 419928, "epoch": 5059} {"train_loss": -26.520767211914062, "global_step": 419929, "epoch": 5059} {"train_loss": -26.493179321289062, "global_step": 419930, "epoch": 5059} {"train_loss": -26.46455192565918, "global_step": 419931, "epoch": 5059} {"train_loss": -26.9555721282959, "global_step": 419932, "epoch": 5059} {"train_loss": -26.708730697631836, "global_step": 419933, "epoch": 5059} {"train_loss": -26.493162155151367, "global_step": 419934, "epoch": 5059} {"train_loss": -26.991071701049805, "global_step": 419935, "epoch": 5059} {"train_loss": -26.73223876953125, "global_step": 419936, "epoch": 5059} {"train_loss": -26.342859268188477, "global_step": 419937, "epoch": 5059} {"train_loss": -26.730573654174805, "global_step": 419938, "epoch": 5059} {"train_loss": -26.586994171142578, "global_step": 419939, "epoch": 5059} {"train_loss": -26.612171173095703, "global_step": 419940, "epoch": 5059} {"train_loss": -26.670820236206055, "global_step": 419941, "epoch": 5059} {"train_loss": -26.477130889892578, "global_step": 419942, "epoch": 5059} {"train_loss": -26.7989559173584, "global_step": 419943, "epoch": 5059} {"train_loss": -27.211328506469727, "global_step": 419944, "epoch": 5059} {"train_loss": -26.784337997436523, "global_step": 419945, "epoch": 5059} {"train_loss": -27.007068634033203, "global_step": 419946, "epoch": 5059} {"train_loss": -26.796606063842773, "global_step": 419947, "epoch": 5059} {"train_loss": -26.848718643188477, "global_step": 419948, "epoch": 5059} {"train_loss": -26.779403686523438, "global_step": 419949, "epoch": 5059} {"train_loss": -26.960630416870117, "global_step": 419950, "epoch": 5059} {"train_loss": -26.518238067626953, "global_step": 419951, "epoch": 5059} {"train_loss": -26.896615982055664, "global_step": 419952, "epoch": 5059} {"train_loss": -26.980817794799805, "global_step": 419953, "epoch": 5059} {"train_loss": -26.66511344909668, "global_step": 419954, "epoch": 5059} {"train_loss": -26.673261642456055, "global_step": 419955, "epoch": 5059} {"train_loss": -26.780664443969727, "global_step": 419956, "epoch": 5059} {"train_loss": -26.827320098876953, "global_step": 419957, "epoch": 5059} {"train_loss": -26.84681510925293, "global_step": 419958, "epoch": 5059} {"train_loss": -27.06732177734375, "global_step": 419959, "epoch": 5059} {"train_loss": -27.106046676635742, "global_step": 419960, "epoch": 5059} {"train_loss": -26.844873428344727, "global_step": 419961, "epoch": 5059} {"train_loss": -26.61285400390625, "global_step": 419962, "epoch": 5059} {"train_loss": -26.589853286743164, "global_step": 419963, "epoch": 5059} {"train_loss": -26.69817543029785, "global_step": 419964, "epoch": 5059} {"train_loss": -26.80841064453125, "global_step": 419965, "epoch": 5059} {"train_loss": -26.761274337768555, "global_step": 419966, "epoch": 5059} {"train_loss": -26.868864059448242, "global_step": 419967, "epoch": 5059} {"train_loss": -26.223331451416016, "global_step": 419968, "epoch": 5059} {"train_loss": -26.322484970092773, "global_step": 419969, "epoch": 5059} {"train_loss": -26.6785888671875, "global_step": 419970, "epoch": 5059} {"train_loss": -26.2576904296875, "global_step": 419971, "epoch": 5059} {"train_loss": -26.462421417236328, "global_step": 419972, "epoch": 5059} {"train_loss": -26.216955184936523, "global_step": 419973, "epoch": 5059} {"train_loss": -26.991113662719727, "global_step": 419974, "epoch": 5059} {"train_loss": -26.542224884033203, "global_step": 419975, "epoch": 5059} {"train_loss": -26.928119659423828, "global_step": 419976, "epoch": 5059} {"train_loss": -26.737462997436523, "global_step": 419977, "epoch": 5059} {"train_loss": -26.88654899597168, "global_step": 419978, "epoch": 5059} {"train_loss": -26.410161374563195, "global_step": 419979, "epoch": 5059, "val_loss": 6918825.0} {"train_loss": -25.471845626831055, "global_step": 419980, "epoch": 5060} {"train_loss": -25.813261032104492, "global_step": 419981, "epoch": 5060} {"train_loss": -26.27186393737793, "global_step": 419982, "epoch": 5060} {"train_loss": -25.981298446655273, "global_step": 419983, "epoch": 5060} {"train_loss": -26.280996322631836, "global_step": 419984, "epoch": 5060} {"train_loss": -25.893774032592773, "global_step": 419985, "epoch": 5060} {"train_loss": -26.186193466186523, "global_step": 419986, "epoch": 5060} {"train_loss": -26.286874771118164, "global_step": 419987, "epoch": 5060} {"train_loss": -26.195056915283203, "global_step": 419988, "epoch": 5060} {"train_loss": -26.76630973815918, "global_step": 419989, "epoch": 5060} {"train_loss": -26.31727409362793, "global_step": 419990, "epoch": 5060} {"train_loss": -26.783222198486328, "global_step": 419991, "epoch": 5060} {"train_loss": -26.718963623046875, "global_step": 419992, "epoch": 5060} {"train_loss": -26.3590145111084, "global_step": 419993, "epoch": 5060} {"train_loss": -26.34950065612793, "global_step": 419994, "epoch": 5060} {"train_loss": -26.805938720703125, "global_step": 419995, "epoch": 5060} {"train_loss": -26.480453491210938, "global_step": 419996, "epoch": 5060} {"train_loss": -26.233875274658203, "global_step": 419997, "epoch": 5060} {"train_loss": -26.53968620300293, "global_step": 419998, "epoch": 5060} {"train_loss": -26.5759220123291, "global_step": 419999, "epoch": 5060} {"train_loss": -26.90973472595215, "global_step": 420000, "epoch": 5060} {"train_loss": -26.651996612548828, "global_step": 420001, "epoch": 5060} {"train_loss": -27.19211196899414, "global_step": 420002, "epoch": 5060} {"train_loss": -26.796161651611328, "global_step": 420003, "epoch": 5060} {"train_loss": -26.46552085876465, "global_step": 420004, "epoch": 5060} {"train_loss": -27.013778686523438, "global_step": 420005, "epoch": 5060} {"train_loss": -26.676599502563477, "global_step": 420006, "epoch": 5060} {"train_loss": -26.540632247924805, "global_step": 420007, "epoch": 5060} {"train_loss": -27.321714401245117, "global_step": 420008, "epoch": 5060} {"train_loss": -26.610559463500977, "global_step": 420009, "epoch": 5060} {"train_loss": -26.941144943237305, "global_step": 420010, "epoch": 5060} {"train_loss": -26.816486358642578, "global_step": 420011, "epoch": 5060} {"train_loss": -27.111083984375, "global_step": 420012, "epoch": 5060} {"train_loss": -27.246856689453125, "global_step": 420013, "epoch": 5060} {"train_loss": -26.761703491210938, "global_step": 420014, "epoch": 5060} {"train_loss": -26.79254150390625, "global_step": 420015, "epoch": 5060} {"train_loss": -26.997095108032227, "global_step": 420016, "epoch": 5060} {"train_loss": -27.242237091064453, "global_step": 420017, "epoch": 5060} {"train_loss": -26.818464279174805, "global_step": 420018, "epoch": 5060} {"train_loss": -27.19122886657715, "global_step": 420019, "epoch": 5060} {"train_loss": -26.843860626220703, "global_step": 420020, "epoch": 5060} {"train_loss": -26.6959171295166, "global_step": 420021, "epoch": 5060} {"train_loss": -26.988101959228516, "global_step": 420022, "epoch": 5060} {"train_loss": -26.829938888549805, "global_step": 420023, "epoch": 5060} {"train_loss": -26.868993759155273, "global_step": 420024, "epoch": 5060} {"train_loss": -26.978363037109375, "global_step": 420025, "epoch": 5060} {"train_loss": -26.7772216796875, "global_step": 420026, "epoch": 5060} {"train_loss": -26.914011001586914, "global_step": 420027, "epoch": 5060} {"train_loss": -27.289602279663086, "global_step": 420028, "epoch": 5060} {"train_loss": -26.816162109375, "global_step": 420029, "epoch": 5060} {"train_loss": -27.037601470947266, "global_step": 420030, "epoch": 5060} {"train_loss": -27.04912757873535, "global_step": 420031, "epoch": 5060} {"train_loss": -26.883819580078125, "global_step": 420032, "epoch": 5060} {"train_loss": -27.145553588867188, "global_step": 420033, "epoch": 5060} {"train_loss": -27.109094619750977, "global_step": 420034, "epoch": 5060} {"train_loss": -27.039020538330078, "global_step": 420035, "epoch": 5060} {"train_loss": -26.65557289123535, "global_step": 420036, "epoch": 5060} {"train_loss": -27.185163497924805, "global_step": 420037, "epoch": 5060} {"train_loss": -26.93484878540039, "global_step": 420038, "epoch": 5060} {"train_loss": -26.84107780456543, "global_step": 420039, "epoch": 5060} {"train_loss": -26.608739852905273, "global_step": 420040, "epoch": 5060} {"train_loss": -27.1453914642334, "global_step": 420041, "epoch": 5060} {"train_loss": -26.931745529174805, "global_step": 420042, "epoch": 5060} {"train_loss": -26.39105796813965, "global_step": 420043, "epoch": 5060} {"train_loss": -26.221216201782227, "global_step": 420044, "epoch": 5060} {"train_loss": -26.5921630859375, "global_step": 420045, "epoch": 5060} {"train_loss": -26.676889419555664, "global_step": 420046, "epoch": 5060} {"train_loss": -27.1439208984375, "global_step": 420047, "epoch": 5060} {"train_loss": -26.458539962768555, "global_step": 420048, "epoch": 5060} {"train_loss": -26.77473258972168, "global_step": 420049, "epoch": 5060} {"train_loss": -26.69662857055664, "global_step": 420050, "epoch": 5060} {"train_loss": -26.579431533813477, "global_step": 420051, "epoch": 5060} {"train_loss": -26.613386154174805, "global_step": 420052, "epoch": 5060} {"train_loss": -26.591602325439453, "global_step": 420053, "epoch": 5060} {"train_loss": -26.6002197265625, "global_step": 420054, "epoch": 5060} {"train_loss": -26.732345581054688, "global_step": 420055, "epoch": 5060} {"train_loss": -26.643020629882812, "global_step": 420056, "epoch": 5060} {"train_loss": -26.52974510192871, "global_step": 420057, "epoch": 5060} {"train_loss": -27.39607048034668, "global_step": 420058, "epoch": 5060} {"train_loss": -26.62981605529785, "global_step": 420059, "epoch": 5060} {"train_loss": -26.727781295776367, "global_step": 420060, "epoch": 5060} {"train_loss": -26.570480346679688, "global_step": 420061, "epoch": 5060} {"train_loss": -26.70759867472821, "global_step": 420062, "epoch": 5060, "val_loss": 6956281.0} {"train_loss": -26.4036865234375, "global_step": 420063, "epoch": 5061} {"train_loss": -26.32317543029785, "global_step": 420064, "epoch": 5061} {"train_loss": -26.50483512878418, "global_step": 420065, "epoch": 5061} {"train_loss": -26.35187339782715, "global_step": 420066, "epoch": 5061} {"train_loss": -26.544178009033203, "global_step": 420067, "epoch": 5061} {"train_loss": -26.460657119750977, "global_step": 420068, "epoch": 5061} {"train_loss": -26.66908836364746, "global_step": 420069, "epoch": 5061} {"train_loss": -26.552392959594727, "global_step": 420070, "epoch": 5061} {"train_loss": -26.85231590270996, "global_step": 420071, "epoch": 5061} {"train_loss": -26.70294189453125, "global_step": 420072, "epoch": 5061} {"train_loss": -26.67041015625, "global_step": 420073, "epoch": 5061} {"train_loss": -26.945083618164062, "global_step": 420074, "epoch": 5061} {"train_loss": -26.57258415222168, "global_step": 420075, "epoch": 5061} {"train_loss": -26.554895401000977, "global_step": 420076, "epoch": 5061} {"train_loss": -26.42117691040039, "global_step": 420077, "epoch": 5061} {"train_loss": -26.800867080688477, "global_step": 420078, "epoch": 5061} {"train_loss": -27.05159568786621, "global_step": 420079, "epoch": 5061} {"train_loss": -26.6668643951416, "global_step": 420080, "epoch": 5061} {"train_loss": -26.718006134033203, "global_step": 420081, "epoch": 5061} {"train_loss": -26.42426109313965, "global_step": 420082, "epoch": 5061} {"train_loss": -26.58949089050293, "global_step": 420083, "epoch": 5061} {"train_loss": -26.520788192749023, "global_step": 420084, "epoch": 5061} {"train_loss": -27.0180721282959, "global_step": 420085, "epoch": 5061} {"train_loss": -26.9466495513916, "global_step": 420086, "epoch": 5061} {"train_loss": -26.918127059936523, "global_step": 420087, "epoch": 5061} {"train_loss": -27.03388023376465, "global_step": 420088, "epoch": 5061} {"train_loss": -26.577234268188477, "global_step": 420089, "epoch": 5061} {"train_loss": -26.9243221282959, "global_step": 420090, "epoch": 5061} {"train_loss": -26.6616268157959, "global_step": 420091, "epoch": 5061} {"train_loss": -26.9747371673584, "global_step": 420092, "epoch": 5061} {"train_loss": -26.8525447845459, "global_step": 420093, "epoch": 5061} {"train_loss": -26.80609703063965, "global_step": 420094, "epoch": 5061} {"train_loss": -26.999799728393555, "global_step": 420095, "epoch": 5061} {"train_loss": -26.8089599609375, "global_step": 420096, "epoch": 5061} {"train_loss": -26.96845054626465, "global_step": 420097, "epoch": 5061} {"train_loss": -26.751184463500977, "global_step": 420098, "epoch": 5061} {"train_loss": -27.274316787719727, "global_step": 420099, "epoch": 5061} {"train_loss": -27.0205078125, "global_step": 420100, "epoch": 5061} {"train_loss": -26.9942569732666, "global_step": 420101, "epoch": 5061} {"train_loss": -26.879993438720703, "global_step": 420102, "epoch": 5061} {"train_loss": -27.3230037689209, "global_step": 420103, "epoch": 5061} {"train_loss": -27.16927146911621, "global_step": 420104, "epoch": 5061} {"train_loss": -27.180585861206055, "global_step": 420105, "epoch": 5061} {"train_loss": -27.082422256469727, "global_step": 420106, "epoch": 5061} {"train_loss": -26.930883407592773, "global_step": 420107, "epoch": 5061} {"train_loss": -26.54990577697754, "global_step": 420108, "epoch": 5061} {"train_loss": -26.408689498901367, "global_step": 420109, "epoch": 5061} {"train_loss": -26.859045028686523, "global_step": 420110, "epoch": 5061} {"train_loss": -27.150609970092773, "global_step": 420111, "epoch": 5061} {"train_loss": -26.843305587768555, "global_step": 420112, "epoch": 5061} {"train_loss": -26.992090225219727, "global_step": 420113, "epoch": 5061} {"train_loss": -26.870267868041992, "global_step": 420114, "epoch": 5061} {"train_loss": -26.78193473815918, "global_step": 420115, "epoch": 5061} {"train_loss": -27.112930297851562, "global_step": 420116, "epoch": 5061} {"train_loss": -26.551340103149414, "global_step": 420117, "epoch": 5061} {"train_loss": -27.06589698791504, "global_step": 420118, "epoch": 5061} {"train_loss": -26.607221603393555, "global_step": 420119, "epoch": 5061} {"train_loss": -26.691617965698242, "global_step": 420120, "epoch": 5061} {"train_loss": -26.81757164001465, "global_step": 420121, "epoch": 5061} {"train_loss": -26.606351852416992, "global_step": 420122, "epoch": 5061} {"train_loss": -26.611730575561523, "global_step": 420123, "epoch": 5061} {"train_loss": -26.4870662689209, "global_step": 420124, "epoch": 5061} {"train_loss": -26.310888290405273, "global_step": 420125, "epoch": 5061} {"train_loss": -26.0461483001709, "global_step": 420126, "epoch": 5061} {"train_loss": -26.261600494384766, "global_step": 420127, "epoch": 5061} {"train_loss": -26.972402572631836, "global_step": 420128, "epoch": 5061} {"train_loss": -26.841108322143555, "global_step": 420129, "epoch": 5061} {"train_loss": -26.162595748901367, "global_step": 420130, "epoch": 5061} {"train_loss": -26.912229537963867, "global_step": 420131, "epoch": 5061} {"train_loss": -26.84690284729004, "global_step": 420132, "epoch": 5061} {"train_loss": -26.818572998046875, "global_step": 420133, "epoch": 5061} {"train_loss": -26.619550704956055, "global_step": 420134, "epoch": 5061} {"train_loss": -26.792505264282227, "global_step": 420135, "epoch": 5061} {"train_loss": -26.776838302612305, "global_step": 420136, "epoch": 5061} {"train_loss": -26.978443145751953, "global_step": 420137, "epoch": 5061} {"train_loss": -27.113195419311523, "global_step": 420138, "epoch": 5061} {"train_loss": -26.644916534423828, "global_step": 420139, "epoch": 5061} {"train_loss": -26.887975692749023, "global_step": 420140, "epoch": 5061} {"train_loss": -26.789657592773438, "global_step": 420141, "epoch": 5061} {"train_loss": -26.71880531311035, "global_step": 420142, "epoch": 5061} {"train_loss": -26.509540557861328, "global_step": 420143, "epoch": 5061} {"train_loss": -26.91891860961914, "global_step": 420144, "epoch": 5061} {"train_loss": -26.748216491147698, "global_step": 420145, "epoch": 5061, "val_loss": 7001266.5} {"train_loss": -26.389692306518555, "global_step": 420146, "epoch": 5062} {"train_loss": -26.266637802124023, "global_step": 420147, "epoch": 5062} {"train_loss": -26.188913345336914, "global_step": 420148, "epoch": 5062} {"train_loss": -26.48213005065918, "global_step": 420149, "epoch": 5062} {"train_loss": -26.546009063720703, "global_step": 420150, "epoch": 5062} {"train_loss": -26.34486198425293, "global_step": 420151, "epoch": 5062} {"train_loss": -26.461475372314453, "global_step": 420152, "epoch": 5062} {"train_loss": -26.499597549438477, "global_step": 420153, "epoch": 5062} {"train_loss": -26.144287109375, "global_step": 420154, "epoch": 5062} {"train_loss": -26.40536880493164, "global_step": 420155, "epoch": 5062} {"train_loss": -26.191726684570312, "global_step": 420156, "epoch": 5062} {"train_loss": -26.352994918823242, "global_step": 420157, "epoch": 5062} {"train_loss": -26.54052734375, "global_step": 420158, "epoch": 5062} {"train_loss": -26.310199737548828, "global_step": 420159, "epoch": 5062} {"train_loss": -27.135547637939453, "global_step": 420160, "epoch": 5062} {"train_loss": -26.12782096862793, "global_step": 420161, "epoch": 5062} {"train_loss": -26.85565757751465, "global_step": 420162, "epoch": 5062} {"train_loss": -26.420536041259766, "global_step": 420163, "epoch": 5062} {"train_loss": -26.354049682617188, "global_step": 420164, "epoch": 5062} {"train_loss": -26.794469833374023, "global_step": 420165, "epoch": 5062} {"train_loss": -26.678617477416992, "global_step": 420166, "epoch": 5062} {"train_loss": -26.522558212280273, "global_step": 420167, "epoch": 5062} {"train_loss": -26.718704223632812, "global_step": 420168, "epoch": 5062} {"train_loss": -27.246856689453125, "global_step": 420169, "epoch": 5062} {"train_loss": -27.117572784423828, "global_step": 420170, "epoch": 5062} {"train_loss": -26.841297149658203, "global_step": 420171, "epoch": 5062} {"train_loss": -26.556318283081055, "global_step": 420172, "epoch": 5062} {"train_loss": -26.86688232421875, "global_step": 420173, "epoch": 5062} {"train_loss": -26.654571533203125, "global_step": 420174, "epoch": 5062} {"train_loss": -26.589685440063477, "global_step": 420175, "epoch": 5062} {"train_loss": -26.490737915039062, "global_step": 420176, "epoch": 5062} {"train_loss": -26.9746150970459, "global_step": 420177, "epoch": 5062} {"train_loss": -26.30972671508789, "global_step": 420178, "epoch": 5062} {"train_loss": -26.60150146484375, "global_step": 420179, "epoch": 5062} {"train_loss": -26.7974796295166, "global_step": 420180, "epoch": 5062} {"train_loss": -27.0379638671875, "global_step": 420181, "epoch": 5062} {"train_loss": -27.11774253845215, "global_step": 420182, "epoch": 5062} {"train_loss": -27.03803062438965, "global_step": 420183, "epoch": 5062} {"train_loss": -26.936002731323242, "global_step": 420184, "epoch": 5062} {"train_loss": -26.846149444580078, "global_step": 420185, "epoch": 5062} {"train_loss": -27.0150146484375, "global_step": 420186, "epoch": 5062} {"train_loss": -26.70113182067871, "global_step": 420187, "epoch": 5062} {"train_loss": -27.001291275024414, "global_step": 420188, "epoch": 5062} {"train_loss": -26.98615074157715, "global_step": 420189, "epoch": 5062} {"train_loss": -26.70706558227539, "global_step": 420190, "epoch": 5062} {"train_loss": -27.07587242126465, "global_step": 420191, "epoch": 5062} {"train_loss": -26.8093204498291, "global_step": 420192, "epoch": 5062} {"train_loss": -26.57291030883789, "global_step": 420193, "epoch": 5062} {"train_loss": -27.02031898498535, "global_step": 420194, "epoch": 5062} {"train_loss": -27.347314834594727, "global_step": 420195, "epoch": 5062} {"train_loss": -26.82097816467285, "global_step": 420196, "epoch": 5062} {"train_loss": -26.90947914123535, "global_step": 420197, "epoch": 5062} {"train_loss": -26.955963134765625, "global_step": 420198, "epoch": 5062} {"train_loss": -26.817956924438477, "global_step": 420199, "epoch": 5062} {"train_loss": -26.775766372680664, "global_step": 420200, "epoch": 5062} {"train_loss": -27.208057403564453, "global_step": 420201, "epoch": 5062} {"train_loss": -27.276700973510742, "global_step": 420202, "epoch": 5062} {"train_loss": -26.807666778564453, "global_step": 420203, "epoch": 5062} {"train_loss": -26.686017990112305, "global_step": 420204, "epoch": 5062} {"train_loss": -27.063064575195312, "global_step": 420205, "epoch": 5062} {"train_loss": -27.29249382019043, "global_step": 420206, "epoch": 5062} {"train_loss": -27.035358428955078, "global_step": 420207, "epoch": 5062} {"train_loss": -27.09832763671875, "global_step": 420208, "epoch": 5062} {"train_loss": -26.920597076416016, "global_step": 420209, "epoch": 5062} {"train_loss": -26.703256607055664, "global_step": 420210, "epoch": 5062} {"train_loss": -26.899219512939453, "global_step": 420211, "epoch": 5062} {"train_loss": -27.1474552154541, "global_step": 420212, "epoch": 5062} {"train_loss": -27.21579360961914, "global_step": 420213, "epoch": 5062} {"train_loss": -26.71478271484375, "global_step": 420214, "epoch": 5062} {"train_loss": -26.97637939453125, "global_step": 420215, "epoch": 5062} {"train_loss": -26.815399169921875, "global_step": 420216, "epoch": 5062} {"train_loss": -26.876693725585938, "global_step": 420217, "epoch": 5062} {"train_loss": -27.26071548461914, "global_step": 420218, "epoch": 5062} {"train_loss": -27.30832290649414, "global_step": 420219, "epoch": 5062} {"train_loss": -26.9627628326416, "global_step": 420220, "epoch": 5062} {"train_loss": -26.729909896850586, "global_step": 420221, "epoch": 5062} {"train_loss": -27.219633102416992, "global_step": 420222, "epoch": 5062} {"train_loss": -26.85284996032715, "global_step": 420223, "epoch": 5062} {"train_loss": -26.06842041015625, "global_step": 420224, "epoch": 5062} {"train_loss": -27.037363052368164, "global_step": 420225, "epoch": 5062} {"train_loss": -26.904523849487305, "global_step": 420226, "epoch": 5062} {"train_loss": -26.829334259033203, "global_step": 420227, "epoch": 5062} {"train_loss": -26.783159830484045, "global_step": 420228, "epoch": 5062, "val_loss": 6944952.0} {"train_loss": -25.50963020324707, "global_step": 420229, "epoch": 5063} {"train_loss": -25.317550659179688, "global_step": 420230, "epoch": 5063} {"train_loss": -25.799551010131836, "global_step": 420231, "epoch": 5063} {"train_loss": -26.6564884185791, "global_step": 420232, "epoch": 5063} {"train_loss": -25.790985107421875, "global_step": 420233, "epoch": 5063} {"train_loss": -26.343713760375977, "global_step": 420234, "epoch": 5063} {"train_loss": -26.083032608032227, "global_step": 420235, "epoch": 5063} {"train_loss": -26.166793823242188, "global_step": 420236, "epoch": 5063} {"train_loss": -26.324798583984375, "global_step": 420237, "epoch": 5063} {"train_loss": -26.51435661315918, "global_step": 420238, "epoch": 5063} {"train_loss": -26.612634658813477, "global_step": 420239, "epoch": 5063} {"train_loss": -26.693634033203125, "global_step": 420240, "epoch": 5063} {"train_loss": -26.348861694335938, "global_step": 420241, "epoch": 5063} {"train_loss": -26.46795654296875, "global_step": 420242, "epoch": 5063} {"train_loss": -26.170576095581055, "global_step": 420243, "epoch": 5063} {"train_loss": -26.987939834594727, "global_step": 420244, "epoch": 5063} {"train_loss": -26.266845703125, "global_step": 420245, "epoch": 5063} {"train_loss": -26.556116104125977, "global_step": 420246, "epoch": 5063} {"train_loss": -26.289691925048828, "global_step": 420247, "epoch": 5063} {"train_loss": -26.45734214782715, "global_step": 420248, "epoch": 5063} {"train_loss": -26.6566104888916, "global_step": 420249, "epoch": 5063} {"train_loss": -26.638940811157227, "global_step": 420250, "epoch": 5063} {"train_loss": -26.421850204467773, "global_step": 420251, "epoch": 5063} {"train_loss": -26.382843017578125, "global_step": 420252, "epoch": 5063} {"train_loss": -26.08331871032715, "global_step": 420253, "epoch": 5063} {"train_loss": -26.727188110351562, "global_step": 420254, "epoch": 5063} {"train_loss": -26.923175811767578, "global_step": 420255, "epoch": 5063} {"train_loss": -26.704696655273438, "global_step": 420256, "epoch": 5063} {"train_loss": -26.49908447265625, "global_step": 420257, "epoch": 5063} {"train_loss": -26.916982650756836, "global_step": 420258, "epoch": 5063} {"train_loss": -26.787006378173828, "global_step": 420259, "epoch": 5063} {"train_loss": -27.220813751220703, "global_step": 420260, "epoch": 5063} {"train_loss": -26.48251724243164, "global_step": 420261, "epoch": 5063} {"train_loss": -26.686349868774414, "global_step": 420262, "epoch": 5063} {"train_loss": -26.88323974609375, "global_step": 420263, "epoch": 5063} {"train_loss": -27.078433990478516, "global_step": 420264, "epoch": 5063} {"train_loss": -26.444854736328125, "global_step": 420265, "epoch": 5063} {"train_loss": -26.881072998046875, "global_step": 420266, "epoch": 5063} {"train_loss": -26.346704483032227, "global_step": 420267, "epoch": 5063} {"train_loss": -27.110952377319336, "global_step": 420268, "epoch": 5063} {"train_loss": -26.624744415283203, "global_step": 420269, "epoch": 5063} {"train_loss": -26.90765953063965, "global_step": 420270, "epoch": 5063} {"train_loss": -26.837146759033203, "global_step": 420271, "epoch": 5063} {"train_loss": -26.967519760131836, "global_step": 420272, "epoch": 5063} {"train_loss": -26.82669448852539, "global_step": 420273, "epoch": 5063} {"train_loss": -27.002073287963867, "global_step": 420274, "epoch": 5063} {"train_loss": -27.160221099853516, "global_step": 420275, "epoch": 5063} {"train_loss": -26.74237632751465, "global_step": 420276, "epoch": 5063} {"train_loss": -27.105100631713867, "global_step": 420277, "epoch": 5063} {"train_loss": -26.69169044494629, "global_step": 420278, "epoch": 5063} {"train_loss": -26.90079116821289, "global_step": 420279, "epoch": 5063} {"train_loss": -26.7391357421875, "global_step": 420280, "epoch": 5063} {"train_loss": -26.414594650268555, "global_step": 420281, "epoch": 5063} {"train_loss": -26.2022705078125, "global_step": 420282, "epoch": 5063} {"train_loss": -26.618825912475586, "global_step": 420283, "epoch": 5063} {"train_loss": -26.753707885742188, "global_step": 420284, "epoch": 5063} {"train_loss": -26.821393966674805, "global_step": 420285, "epoch": 5063} {"train_loss": -26.94233512878418, "global_step": 420286, "epoch": 5063} {"train_loss": -26.783111572265625, "global_step": 420287, "epoch": 5063} {"train_loss": -27.004119873046875, "global_step": 420288, "epoch": 5063} {"train_loss": -26.647113800048828, "global_step": 420289, "epoch": 5063} {"train_loss": -26.872007369995117, "global_step": 420290, "epoch": 5063} {"train_loss": -26.75591468811035, "global_step": 420291, "epoch": 5063} {"train_loss": -26.942651748657227, "global_step": 420292, "epoch": 5063} {"train_loss": -26.899694442749023, "global_step": 420293, "epoch": 5063} {"train_loss": -26.570775985717773, "global_step": 420294, "epoch": 5063} {"train_loss": -26.637680053710938, "global_step": 420295, "epoch": 5063} {"train_loss": -26.986438751220703, "global_step": 420296, "epoch": 5063} {"train_loss": -27.17683219909668, "global_step": 420297, "epoch": 5063} {"train_loss": -26.768585205078125, "global_step": 420298, "epoch": 5063} {"train_loss": -26.672143936157227, "global_step": 420299, "epoch": 5063} {"train_loss": -27.091552734375, "global_step": 420300, "epoch": 5063} {"train_loss": -27.080541610717773, "global_step": 420301, "epoch": 5063} {"train_loss": -27.17608070373535, "global_step": 420302, "epoch": 5063} {"train_loss": -26.832605361938477, "global_step": 420303, "epoch": 5063} {"train_loss": -26.765766143798828, "global_step": 420304, "epoch": 5063} {"train_loss": -27.046649932861328, "global_step": 420305, "epoch": 5063} {"train_loss": -27.15439224243164, "global_step": 420306, "epoch": 5063} {"train_loss": -26.957141876220703, "global_step": 420307, "epoch": 5063} {"train_loss": -27.00543785095215, "global_step": 420308, "epoch": 5063} {"train_loss": -27.179615020751953, "global_step": 420309, "epoch": 5063} {"train_loss": -27.027429580688477, "global_step": 420310, "epoch": 5063} {"train_loss": -26.66124651805464, "global_step": 420311, "epoch": 5063, "val_loss": 7022368.0} {"train_loss": -26.240812301635742, "global_step": 420312, "epoch": 5064} {"train_loss": -25.89578628540039, "global_step": 420313, "epoch": 5064} {"train_loss": -25.365392684936523, "global_step": 420314, "epoch": 5064} {"train_loss": -25.966440200805664, "global_step": 420315, "epoch": 5064} {"train_loss": -26.377761840820312, "global_step": 420316, "epoch": 5064} {"train_loss": -25.620031356811523, "global_step": 420317, "epoch": 5064} {"train_loss": -25.81926918029785, "global_step": 420318, "epoch": 5064} {"train_loss": -25.913679122924805, "global_step": 420319, "epoch": 5064} {"train_loss": -26.271743774414062, "global_step": 420320, "epoch": 5064} {"train_loss": -26.34743309020996, "global_step": 420321, "epoch": 5064} {"train_loss": -26.10712242126465, "global_step": 420322, "epoch": 5064} {"train_loss": -26.20231056213379, "global_step": 420323, "epoch": 5064} {"train_loss": -26.19415283203125, "global_step": 420324, "epoch": 5064} {"train_loss": -26.072668075561523, "global_step": 420325, "epoch": 5064} {"train_loss": -26.646814346313477, "global_step": 420326, "epoch": 5064} {"train_loss": -26.28132438659668, "global_step": 420327, "epoch": 5064} {"train_loss": -26.509572982788086, "global_step": 420328, "epoch": 5064} {"train_loss": -26.3731746673584, "global_step": 420329, "epoch": 5064} {"train_loss": -26.22749137878418, "global_step": 420330, "epoch": 5064} {"train_loss": -26.709848403930664, "global_step": 420331, "epoch": 5064} {"train_loss": -26.561338424682617, "global_step": 420332, "epoch": 5064} {"train_loss": -26.686811447143555, "global_step": 420333, "epoch": 5064} {"train_loss": -26.73064613342285, "global_step": 420334, "epoch": 5064} {"train_loss": -26.767364501953125, "global_step": 420335, "epoch": 5064} {"train_loss": -26.757160186767578, "global_step": 420336, "epoch": 5064} {"train_loss": -26.304834365844727, "global_step": 420337, "epoch": 5064} {"train_loss": -26.494598388671875, "global_step": 420338, "epoch": 5064} {"train_loss": -26.46759605407715, "global_step": 420339, "epoch": 5064} {"train_loss": -26.36443519592285, "global_step": 420340, "epoch": 5064} {"train_loss": -26.10088539123535, "global_step": 420341, "epoch": 5064} {"train_loss": -26.723230361938477, "global_step": 420342, "epoch": 5064} {"train_loss": -26.28053092956543, "global_step": 420343, "epoch": 5064} {"train_loss": -26.728153228759766, "global_step": 420344, "epoch": 5064} {"train_loss": -26.506208419799805, "global_step": 420345, "epoch": 5064} {"train_loss": -26.749277114868164, "global_step": 420346, "epoch": 5064} {"train_loss": -26.75628662109375, "global_step": 420347, "epoch": 5064} {"train_loss": -26.717636108398438, "global_step": 420348, "epoch": 5064} {"train_loss": -27.09246826171875, "global_step": 420349, "epoch": 5064} {"train_loss": -26.581724166870117, "global_step": 420350, "epoch": 5064} {"train_loss": -26.801191329956055, "global_step": 420351, "epoch": 5064} {"train_loss": -27.011545181274414, "global_step": 420352, "epoch": 5064} {"train_loss": -26.8922176361084, "global_step": 420353, "epoch": 5064} {"train_loss": -27.329954147338867, "global_step": 420354, "epoch": 5064} {"train_loss": -26.838058471679688, "global_step": 420355, "epoch": 5064} {"train_loss": -26.993722915649414, "global_step": 420356, "epoch": 5064} {"train_loss": -26.59531593322754, "global_step": 420357, "epoch": 5064} {"train_loss": -27.22706413269043, "global_step": 420358, "epoch": 5064} {"train_loss": -27.087310791015625, "global_step": 420359, "epoch": 5064} {"train_loss": -26.890838623046875, "global_step": 420360, "epoch": 5064} {"train_loss": -26.95760154724121, "global_step": 420361, "epoch": 5064} {"train_loss": -27.011585235595703, "global_step": 420362, "epoch": 5064} {"train_loss": -26.96112060546875, "global_step": 420363, "epoch": 5064} {"train_loss": -27.40351676940918, "global_step": 420364, "epoch": 5064} {"train_loss": -26.54145622253418, "global_step": 420365, "epoch": 5064} {"train_loss": -27.057727813720703, "global_step": 420366, "epoch": 5064} {"train_loss": -26.72039794921875, "global_step": 420367, "epoch": 5064} {"train_loss": -27.118207931518555, "global_step": 420368, "epoch": 5064} {"train_loss": -26.80763053894043, "global_step": 420369, "epoch": 5064} {"train_loss": -26.903173446655273, "global_step": 420370, "epoch": 5064} {"train_loss": -27.02827262878418, "global_step": 420371, "epoch": 5064} {"train_loss": -26.707229614257812, "global_step": 420372, "epoch": 5064} {"train_loss": -26.921152114868164, "global_step": 420373, "epoch": 5064} {"train_loss": -27.02911949157715, "global_step": 420374, "epoch": 5064} {"train_loss": -26.713632583618164, "global_step": 420375, "epoch": 5064} {"train_loss": -27.043609619140625, "global_step": 420376, "epoch": 5064} {"train_loss": -26.995258331298828, "global_step": 420377, "epoch": 5064} {"train_loss": -27.02874755859375, "global_step": 420378, "epoch": 5064} {"train_loss": -27.247106552124023, "global_step": 420379, "epoch": 5064} {"train_loss": -26.86887550354004, "global_step": 420380, "epoch": 5064} {"train_loss": -26.663278579711914, "global_step": 420381, "epoch": 5064} {"train_loss": -26.852874755859375, "global_step": 420382, "epoch": 5064} {"train_loss": -27.261762619018555, "global_step": 420383, "epoch": 5064} {"train_loss": -27.090015411376953, "global_step": 420384, "epoch": 5064} {"train_loss": -26.777673721313477, "global_step": 420385, "epoch": 5064} {"train_loss": -26.93170166015625, "global_step": 420386, "epoch": 5064} {"train_loss": -26.728261947631836, "global_step": 420387, "epoch": 5064} {"train_loss": -26.704376220703125, "global_step": 420388, "epoch": 5064} {"train_loss": -27.0582218170166, "global_step": 420389, "epoch": 5064} {"train_loss": -26.54730224609375, "global_step": 420390, "epoch": 5064} {"train_loss": -26.855131149291992, "global_step": 420391, "epoch": 5064} {"train_loss": -26.52153968811035, "global_step": 420392, "epoch": 5064} {"train_loss": -26.803119659423828, "global_step": 420393, "epoch": 5064} {"train_loss": -26.65072657114052, "global_step": 420394, "epoch": 5064, "val_loss": 6980545.5} {"train_loss": -25.567306518554688, "global_step": 420395, "epoch": 5065} {"train_loss": -26.009490966796875, "global_step": 420396, "epoch": 5065} {"train_loss": -25.514413833618164, "global_step": 420397, "epoch": 5065} {"train_loss": -26.2701473236084, "global_step": 420398, "epoch": 5065} {"train_loss": -25.65342140197754, "global_step": 420399, "epoch": 5065} {"train_loss": -26.017980575561523, "global_step": 420400, "epoch": 5065} {"train_loss": -25.662128448486328, "global_step": 420401, "epoch": 5065} {"train_loss": -25.597211837768555, "global_step": 420402, "epoch": 5065} {"train_loss": -25.692340850830078, "global_step": 420403, "epoch": 5065} {"train_loss": -25.668426513671875, "global_step": 420404, "epoch": 5065} {"train_loss": -26.343774795532227, "global_step": 420405, "epoch": 5065} {"train_loss": -25.9447078704834, "global_step": 420406, "epoch": 5065} {"train_loss": -25.653106689453125, "global_step": 420407, "epoch": 5065} {"train_loss": -25.6696720123291, "global_step": 420408, "epoch": 5065} {"train_loss": -26.23054313659668, "global_step": 420409, "epoch": 5065} {"train_loss": -26.173681259155273, "global_step": 420410, "epoch": 5065} {"train_loss": -26.04911231994629, "global_step": 420411, "epoch": 5065} {"train_loss": -26.5133056640625, "global_step": 420412, "epoch": 5065} {"train_loss": -26.378345489501953, "global_step": 420413, "epoch": 5065} {"train_loss": -25.82037925720215, "global_step": 420414, "epoch": 5065} {"train_loss": -26.6544246673584, "global_step": 420415, "epoch": 5065} {"train_loss": -26.900320053100586, "global_step": 420416, "epoch": 5065} {"train_loss": -26.616491317749023, "global_step": 420417, "epoch": 5065} {"train_loss": -26.2452392578125, "global_step": 420418, "epoch": 5065} {"train_loss": -26.576141357421875, "global_step": 420419, "epoch": 5065} {"train_loss": -26.119657516479492, "global_step": 420420, "epoch": 5065} {"train_loss": -26.3892822265625, "global_step": 420421, "epoch": 5065} {"train_loss": -26.7669677734375, "global_step": 420422, "epoch": 5065} {"train_loss": -26.50726890563965, "global_step": 420423, "epoch": 5065} {"train_loss": -26.878705978393555, "global_step": 420424, "epoch": 5065} {"train_loss": -26.94679832458496, "global_step": 420425, "epoch": 5065} {"train_loss": -26.62969398498535, "global_step": 420426, "epoch": 5065} {"train_loss": -26.7323055267334, "global_step": 420427, "epoch": 5065} {"train_loss": -26.704547882080078, "global_step": 420428, "epoch": 5065} {"train_loss": -26.8338565826416, "global_step": 420429, "epoch": 5065} {"train_loss": -26.48914909362793, "global_step": 420430, "epoch": 5065} {"train_loss": -26.504291534423828, "global_step": 420431, "epoch": 5065} {"train_loss": -26.82257080078125, "global_step": 420432, "epoch": 5065} {"train_loss": -26.559690475463867, "global_step": 420433, "epoch": 5065} {"train_loss": -26.9002742767334, "global_step": 420434, "epoch": 5065} {"train_loss": -26.91339683532715, "global_step": 420435, "epoch": 5065} {"train_loss": -27.19598388671875, "global_step": 420436, "epoch": 5065} {"train_loss": -26.48699378967285, "global_step": 420437, "epoch": 5065} {"train_loss": -26.87074089050293, "global_step": 420438, "epoch": 5065} {"train_loss": -26.84077262878418, "global_step": 420439, "epoch": 5065} {"train_loss": -26.769733428955078, "global_step": 420440, "epoch": 5065} {"train_loss": -26.9405460357666, "global_step": 420441, "epoch": 5065} {"train_loss": -26.647064208984375, "global_step": 420442, "epoch": 5065} {"train_loss": -27.175434112548828, "global_step": 420443, "epoch": 5065} {"train_loss": -26.625905990600586, "global_step": 420444, "epoch": 5065} {"train_loss": -26.852914810180664, "global_step": 420445, "epoch": 5065} {"train_loss": -26.9083309173584, "global_step": 420446, "epoch": 5065} {"train_loss": -27.076322555541992, "global_step": 420447, "epoch": 5065} {"train_loss": -27.287073135375977, "global_step": 420448, "epoch": 5065} {"train_loss": -27.03461265563965, "global_step": 420449, "epoch": 5065} {"train_loss": -26.65260124206543, "global_step": 420450, "epoch": 5065} {"train_loss": -26.715158462524414, "global_step": 420451, "epoch": 5065} {"train_loss": -26.943174362182617, "global_step": 420452, "epoch": 5065} {"train_loss": -27.02861976623535, "global_step": 420453, "epoch": 5065} {"train_loss": -27.077106475830078, "global_step": 420454, "epoch": 5065} {"train_loss": -26.879735946655273, "global_step": 420455, "epoch": 5065} {"train_loss": -26.722431182861328, "global_step": 420456, "epoch": 5065} {"train_loss": -27.178491592407227, "global_step": 420457, "epoch": 5065} {"train_loss": -26.922109603881836, "global_step": 420458, "epoch": 5065} {"train_loss": -26.996606826782227, "global_step": 420459, "epoch": 5065} {"train_loss": -26.88172721862793, "global_step": 420460, "epoch": 5065} {"train_loss": -26.996875762939453, "global_step": 420461, "epoch": 5065} {"train_loss": -26.785980224609375, "global_step": 420462, "epoch": 5065} {"train_loss": -26.978103637695312, "global_step": 420463, "epoch": 5065} {"train_loss": -26.915624618530273, "global_step": 420464, "epoch": 5065} {"train_loss": -26.841373443603516, "global_step": 420465, "epoch": 5065} {"train_loss": -26.820270538330078, "global_step": 420466, "epoch": 5065} {"train_loss": -26.925806045532227, "global_step": 420467, "epoch": 5065} {"train_loss": -26.871795654296875, "global_step": 420468, "epoch": 5065} {"train_loss": -27.051259994506836, "global_step": 420469, "epoch": 5065} {"train_loss": -26.830402374267578, "global_step": 420470, "epoch": 5065} {"train_loss": -26.968353271484375, "global_step": 420471, "epoch": 5065} {"train_loss": -26.659414291381836, "global_step": 420472, "epoch": 5065} {"train_loss": -26.727933883666992, "global_step": 420473, "epoch": 5065} {"train_loss": -26.794519424438477, "global_step": 420474, "epoch": 5065} {"train_loss": -27.105792999267578, "global_step": 420475, "epoch": 5065} {"train_loss": -26.7178955078125, "global_step": 420476, "epoch": 5065} {"train_loss": -26.610674478921545, "global_step": 420477, "epoch": 5065, "val_loss": 7026967.0} {"train_loss": -25.751867294311523, "global_step": 420478, "epoch": 5066} {"train_loss": -25.04032325744629, "global_step": 420479, "epoch": 5066} {"train_loss": -25.451904296875, "global_step": 420480, "epoch": 5066} {"train_loss": -25.283658981323242, "global_step": 420481, "epoch": 5066} {"train_loss": -25.978185653686523, "global_step": 420482, "epoch": 5066} {"train_loss": -25.893461227416992, "global_step": 420483, "epoch": 5066} {"train_loss": -26.34547996520996, "global_step": 420484, "epoch": 5066} {"train_loss": -25.960926055908203, "global_step": 420485, "epoch": 5066} {"train_loss": -26.180561065673828, "global_step": 420486, "epoch": 5066} {"train_loss": -26.089948654174805, "global_step": 420487, "epoch": 5066} {"train_loss": -25.976348876953125, "global_step": 420488, "epoch": 5066} {"train_loss": -25.841073989868164, "global_step": 420489, "epoch": 5066} {"train_loss": -26.53766441345215, "global_step": 420490, "epoch": 5066} {"train_loss": -26.239660263061523, "global_step": 420491, "epoch": 5066} {"train_loss": -26.317630767822266, "global_step": 420492, "epoch": 5066} {"train_loss": -25.965063095092773, "global_step": 420493, "epoch": 5066} {"train_loss": -26.490436553955078, "global_step": 420494, "epoch": 5066} {"train_loss": -26.325180053710938, "global_step": 420495, "epoch": 5066} {"train_loss": -26.586944580078125, "global_step": 420496, "epoch": 5066} {"train_loss": -26.73418617248535, "global_step": 420497, "epoch": 5066} {"train_loss": -26.617050170898438, "global_step": 420498, "epoch": 5066} {"train_loss": -26.19073486328125, "global_step": 420499, "epoch": 5066} {"train_loss": -26.743722915649414, "global_step": 420500, "epoch": 5066} {"train_loss": -26.708837509155273, "global_step": 420501, "epoch": 5066} {"train_loss": -26.4740047454834, "global_step": 420502, "epoch": 5066} {"train_loss": -26.84200096130371, "global_step": 420503, "epoch": 5066} {"train_loss": -26.45734977722168, "global_step": 420504, "epoch": 5066} {"train_loss": -26.682836532592773, "global_step": 420505, "epoch": 5066} {"train_loss": -26.6826171875, "global_step": 420506, "epoch": 5066} {"train_loss": -26.887521743774414, "global_step": 420507, "epoch": 5066} {"train_loss": -26.683874130249023, "global_step": 420508, "epoch": 5066} {"train_loss": -27.04102897644043, "global_step": 420509, "epoch": 5066} {"train_loss": -26.494855880737305, "global_step": 420510, "epoch": 5066} {"train_loss": -26.83088493347168, "global_step": 420511, "epoch": 5066} {"train_loss": -26.68638038635254, "global_step": 420512, "epoch": 5066} {"train_loss": -26.245588302612305, "global_step": 420513, "epoch": 5066} {"train_loss": -26.929624557495117, "global_step": 420514, "epoch": 5066} {"train_loss": -26.82850456237793, "global_step": 420515, "epoch": 5066} {"train_loss": -26.87806510925293, "global_step": 420516, "epoch": 5066} {"train_loss": -26.5749454498291, "global_step": 420517, "epoch": 5066} {"train_loss": -26.888477325439453, "global_step": 420518, "epoch": 5066} {"train_loss": -26.634033203125, "global_step": 420519, "epoch": 5066} {"train_loss": -26.64985466003418, "global_step": 420520, "epoch": 5066} {"train_loss": -26.91437339782715, "global_step": 420521, "epoch": 5066} {"train_loss": -26.889850616455078, "global_step": 420522, "epoch": 5066} {"train_loss": -26.756561279296875, "global_step": 420523, "epoch": 5066} {"train_loss": -27.147668838500977, "global_step": 420524, "epoch": 5066} {"train_loss": -26.703832626342773, "global_step": 420525, "epoch": 5066} {"train_loss": -26.998258590698242, "global_step": 420526, "epoch": 5066} {"train_loss": -26.891172409057617, "global_step": 420527, "epoch": 5066} {"train_loss": -27.070301055908203, "global_step": 420528, "epoch": 5066} {"train_loss": -26.778722763061523, "global_step": 420529, "epoch": 5066} {"train_loss": -27.030176162719727, "global_step": 420530, "epoch": 5066} {"train_loss": -27.066564559936523, "global_step": 420531, "epoch": 5066} {"train_loss": -27.0528621673584, "global_step": 420532, "epoch": 5066} {"train_loss": -26.633283615112305, "global_step": 420533, "epoch": 5066} {"train_loss": -26.50300407409668, "global_step": 420534, "epoch": 5066} {"train_loss": -26.94154930114746, "global_step": 420535, "epoch": 5066} {"train_loss": -27.13399314880371, "global_step": 420536, "epoch": 5066} {"train_loss": -27.374099731445312, "global_step": 420537, "epoch": 5066} {"train_loss": -27.09438133239746, "global_step": 420538, "epoch": 5066} {"train_loss": -27.25543785095215, "global_step": 420539, "epoch": 5066} {"train_loss": -26.865758895874023, "global_step": 420540, "epoch": 5066} {"train_loss": -27.11054039001465, "global_step": 420541, "epoch": 5066} {"train_loss": -27.03925132751465, "global_step": 420542, "epoch": 5066} {"train_loss": -26.956562042236328, "global_step": 420543, "epoch": 5066} {"train_loss": -27.11264991760254, "global_step": 420544, "epoch": 5066} {"train_loss": -27.1429500579834, "global_step": 420545, "epoch": 5066} {"train_loss": -26.847211837768555, "global_step": 420546, "epoch": 5066} {"train_loss": -27.253711700439453, "global_step": 420547, "epoch": 5066} {"train_loss": -26.996397018432617, "global_step": 420548, "epoch": 5066} {"train_loss": -27.0903377532959, "global_step": 420549, "epoch": 5066} {"train_loss": -26.654516220092773, "global_step": 420550, "epoch": 5066} {"train_loss": -26.906085968017578, "global_step": 420551, "epoch": 5066} {"train_loss": -26.836658477783203, "global_step": 420552, "epoch": 5066} {"train_loss": -26.44129753112793, "global_step": 420553, "epoch": 5066} {"train_loss": -26.63518714904785, "global_step": 420554, "epoch": 5066} {"train_loss": -26.529470443725586, "global_step": 420555, "epoch": 5066} {"train_loss": -26.82417869567871, "global_step": 420556, "epoch": 5066} {"train_loss": -26.529218673706055, "global_step": 420557, "epoch": 5066} {"train_loss": -26.52324867248535, "global_step": 420558, "epoch": 5066} {"train_loss": -26.85096549987793, "global_step": 420559, "epoch": 5066} {"train_loss": -26.64753746124635, "global_step": 420560, "epoch": 5066, "val_loss": 7019349.0} {"train_loss": -22.854175567626953, "global_step": 420561, "epoch": 5067} {"train_loss": -24.672607421875, "global_step": 420562, "epoch": 5067} {"train_loss": -23.987003326416016, "global_step": 420563, "epoch": 5067} {"train_loss": -25.8436222076416, "global_step": 420564, "epoch": 5067} {"train_loss": -24.403303146362305, "global_step": 420565, "epoch": 5067} {"train_loss": -25.350818634033203, "global_step": 420566, "epoch": 5067} {"train_loss": -25.925048828125, "global_step": 420567, "epoch": 5067} {"train_loss": -25.120630264282227, "global_step": 420568, "epoch": 5067} {"train_loss": -25.625553131103516, "global_step": 420569, "epoch": 5067} {"train_loss": -25.66779899597168, "global_step": 420570, "epoch": 5067} {"train_loss": -25.77294921875, "global_step": 420571, "epoch": 5067} {"train_loss": -25.946264266967773, "global_step": 420572, "epoch": 5067} {"train_loss": -26.03973388671875, "global_step": 420573, "epoch": 5067} {"train_loss": -25.96000099182129, "global_step": 420574, "epoch": 5067} {"train_loss": -25.914960861206055, "global_step": 420575, "epoch": 5067} {"train_loss": -26.3341007232666, "global_step": 420576, "epoch": 5067} {"train_loss": -25.971973419189453, "global_step": 420577, "epoch": 5067} {"train_loss": -26.08254051208496, "global_step": 420578, "epoch": 5067} {"train_loss": -26.078125, "global_step": 420579, "epoch": 5067} {"train_loss": -25.73090934753418, "global_step": 420580, "epoch": 5067} {"train_loss": -26.2191162109375, "global_step": 420581, "epoch": 5067} {"train_loss": -26.321063995361328, "global_step": 420582, "epoch": 5067} {"train_loss": -26.127410888671875, "global_step": 420583, "epoch": 5067} {"train_loss": -25.999652862548828, "global_step": 420584, "epoch": 5067} {"train_loss": -26.362287521362305, "global_step": 420585, "epoch": 5067} {"train_loss": -26.250131607055664, "global_step": 420586, "epoch": 5067} {"train_loss": -26.336156845092773, "global_step": 420587, "epoch": 5067} {"train_loss": -26.62156105041504, "global_step": 420588, "epoch": 5067} {"train_loss": -26.6073055267334, "global_step": 420589, "epoch": 5067} {"train_loss": -26.41733741760254, "global_step": 420590, "epoch": 5067} {"train_loss": -26.523527145385742, "global_step": 420591, "epoch": 5067} {"train_loss": -26.706268310546875, "global_step": 420592, "epoch": 5067} {"train_loss": -26.97193717956543, "global_step": 420593, "epoch": 5067} {"train_loss": -26.2629337310791, "global_step": 420594, "epoch": 5067} {"train_loss": -26.76236343383789, "global_step": 420595, "epoch": 5067} {"train_loss": -26.693220138549805, "global_step": 420596, "epoch": 5067} {"train_loss": -26.263065338134766, "global_step": 420597, "epoch": 5067} {"train_loss": -26.41261100769043, "global_step": 420598, "epoch": 5067} {"train_loss": -26.560422897338867, "global_step": 420599, "epoch": 5067} {"train_loss": -26.731409072875977, "global_step": 420600, "epoch": 5067} {"train_loss": -26.967309951782227, "global_step": 420601, "epoch": 5067} {"train_loss": -27.2484188079834, "global_step": 420602, "epoch": 5067} {"train_loss": -26.856714248657227, "global_step": 420603, "epoch": 5067} {"train_loss": -26.593341827392578, "global_step": 420604, "epoch": 5067} {"train_loss": -27.231794357299805, "global_step": 420605, "epoch": 5067} {"train_loss": -26.810041427612305, "global_step": 420606, "epoch": 5067} {"train_loss": -27.12330436706543, "global_step": 420607, "epoch": 5067} {"train_loss": -26.68440818786621, "global_step": 420608, "epoch": 5067} {"train_loss": -26.815597534179688, "global_step": 420609, "epoch": 5067} {"train_loss": -26.696603775024414, "global_step": 420610, "epoch": 5067} {"train_loss": -26.75934410095215, "global_step": 420611, "epoch": 5067} {"train_loss": -26.745758056640625, "global_step": 420612, "epoch": 5067} {"train_loss": -26.691303253173828, "global_step": 420613, "epoch": 5067} {"train_loss": -26.650222778320312, "global_step": 420614, "epoch": 5067} {"train_loss": -26.958332061767578, "global_step": 420615, "epoch": 5067} {"train_loss": -26.706029891967773, "global_step": 420616, "epoch": 5067} {"train_loss": -27.102258682250977, "global_step": 420617, "epoch": 5067} {"train_loss": -26.941207885742188, "global_step": 420618, "epoch": 5067} {"train_loss": -26.91950798034668, "global_step": 420619, "epoch": 5067} {"train_loss": -27.171350479125977, "global_step": 420620, "epoch": 5067} {"train_loss": -27.2269287109375, "global_step": 420621, "epoch": 5067} {"train_loss": -26.976720809936523, "global_step": 420622, "epoch": 5067} {"train_loss": -26.751373291015625, "global_step": 420623, "epoch": 5067} {"train_loss": -27.0104923248291, "global_step": 420624, "epoch": 5067} {"train_loss": -26.614484786987305, "global_step": 420625, "epoch": 5067} {"train_loss": -26.896472930908203, "global_step": 420626, "epoch": 5067} {"train_loss": -26.940052032470703, "global_step": 420627, "epoch": 5067} {"train_loss": -27.12122917175293, "global_step": 420628, "epoch": 5067} {"train_loss": -26.995807647705078, "global_step": 420629, "epoch": 5067} {"train_loss": -27.031936645507812, "global_step": 420630, "epoch": 5067} {"train_loss": -26.518817901611328, "global_step": 420631, "epoch": 5067} {"train_loss": -26.848480224609375, "global_step": 420632, "epoch": 5067} {"train_loss": -26.964405059814453, "global_step": 420633, "epoch": 5067} {"train_loss": -27.027267456054688, "global_step": 420634, "epoch": 5067} {"train_loss": -26.879703521728516, "global_step": 420635, "epoch": 5067} {"train_loss": -26.50531005859375, "global_step": 420636, "epoch": 5067} {"train_loss": -26.09716796875, "global_step": 420637, "epoch": 5067} {"train_loss": -26.05110740661621, "global_step": 420638, "epoch": 5067} {"train_loss": -26.763275146484375, "global_step": 420639, "epoch": 5067} {"train_loss": -26.631515502929688, "global_step": 420640, "epoch": 5067} {"train_loss": -26.995336532592773, "global_step": 420641, "epoch": 5067} {"train_loss": -26.45440101623535, "global_step": 420642, "epoch": 5067} {"train_loss": -26.413330606667394, "global_step": 420643, "epoch": 5067, "val_loss": 6986658.0} {"train_loss": -25.108692169189453, "global_step": 420644, "epoch": 5068} {"train_loss": -24.26250648498535, "global_step": 420645, "epoch": 5068} {"train_loss": -25.044885635375977, "global_step": 420646, "epoch": 5068} {"train_loss": -25.277801513671875, "global_step": 420647, "epoch": 5068} {"train_loss": -25.264022827148438, "global_step": 420648, "epoch": 5068} {"train_loss": -25.238922119140625, "global_step": 420649, "epoch": 5068} {"train_loss": -25.697956085205078, "global_step": 420650, "epoch": 5068} {"train_loss": -25.6966495513916, "global_step": 420651, "epoch": 5068} {"train_loss": -25.453989028930664, "global_step": 420652, "epoch": 5068} {"train_loss": -25.746570587158203, "global_step": 420653, "epoch": 5068} {"train_loss": -25.862638473510742, "global_step": 420654, "epoch": 5068} {"train_loss": -25.837270736694336, "global_step": 420655, "epoch": 5068} {"train_loss": -25.99480628967285, "global_step": 420656, "epoch": 5068} {"train_loss": -26.199628829956055, "global_step": 420657, "epoch": 5068} {"train_loss": -26.165082931518555, "global_step": 420658, "epoch": 5068} {"train_loss": -25.96792984008789, "global_step": 420659, "epoch": 5068} {"train_loss": -26.3013973236084, "global_step": 420660, "epoch": 5068} {"train_loss": -26.0109806060791, "global_step": 420661, "epoch": 5068} {"train_loss": -25.77875328063965, "global_step": 420662, "epoch": 5068} {"train_loss": -25.692035675048828, "global_step": 420663, "epoch": 5068} {"train_loss": -26.240659713745117, "global_step": 420664, "epoch": 5068} {"train_loss": -26.602136611938477, "global_step": 420665, "epoch": 5068} {"train_loss": -26.285980224609375, "global_step": 420666, "epoch": 5068} {"train_loss": -26.238698959350586, "global_step": 420667, "epoch": 5068} {"train_loss": -26.43844985961914, "global_step": 420668, "epoch": 5068} {"train_loss": -26.63995933532715, "global_step": 420669, "epoch": 5068} {"train_loss": -26.732797622680664, "global_step": 420670, "epoch": 5068} {"train_loss": -26.375757217407227, "global_step": 420671, "epoch": 5068} {"train_loss": -26.369525909423828, "global_step": 420672, "epoch": 5068} {"train_loss": -26.381330490112305, "global_step": 420673, "epoch": 5068} {"train_loss": -26.6991024017334, "global_step": 420674, "epoch": 5068} {"train_loss": -26.645278930664062, "global_step": 420675, "epoch": 5068} {"train_loss": -26.800235748291016, "global_step": 420676, "epoch": 5068} {"train_loss": -26.614246368408203, "global_step": 420677, "epoch": 5068} {"train_loss": -26.73636245727539, "global_step": 420678, "epoch": 5068} {"train_loss": -26.926441192626953, "global_step": 420679, "epoch": 5068} {"train_loss": -26.770002365112305, "global_step": 420680, "epoch": 5068} {"train_loss": -27.27863883972168, "global_step": 420681, "epoch": 5068} {"train_loss": -26.313703536987305, "global_step": 420682, "epoch": 5068} {"train_loss": -26.785633087158203, "global_step": 420683, "epoch": 5068} {"train_loss": -26.9896240234375, "global_step": 420684, "epoch": 5068} {"train_loss": -26.463947296142578, "global_step": 420685, "epoch": 5068} {"train_loss": -26.98772621154785, "global_step": 420686, "epoch": 5068} {"train_loss": -26.640857696533203, "global_step": 420687, "epoch": 5068} {"train_loss": -27.109710693359375, "global_step": 420688, "epoch": 5068} {"train_loss": -26.854873657226562, "global_step": 420689, "epoch": 5068} {"train_loss": -26.7358341217041, "global_step": 420690, "epoch": 5068} {"train_loss": -26.872638702392578, "global_step": 420691, "epoch": 5068} {"train_loss": -26.918264389038086, "global_step": 420692, "epoch": 5068} {"train_loss": -26.835498809814453, "global_step": 420693, "epoch": 5068} {"train_loss": -26.94219970703125, "global_step": 420694, "epoch": 5068} {"train_loss": -26.794836044311523, "global_step": 420695, "epoch": 5068} {"train_loss": -26.814193725585938, "global_step": 420696, "epoch": 5068} {"train_loss": -26.9071044921875, "global_step": 420697, "epoch": 5068} {"train_loss": -26.7725830078125, "global_step": 420698, "epoch": 5068} {"train_loss": -26.825958251953125, "global_step": 420699, "epoch": 5068} {"train_loss": -26.712507247924805, "global_step": 420700, "epoch": 5068} {"train_loss": -27.186981201171875, "global_step": 420701, "epoch": 5068} {"train_loss": -26.97562026977539, "global_step": 420702, "epoch": 5068} {"train_loss": -26.722700119018555, "global_step": 420703, "epoch": 5068} {"train_loss": -27.055435180664062, "global_step": 420704, "epoch": 5068} {"train_loss": -27.188751220703125, "global_step": 420705, "epoch": 5068} {"train_loss": -26.411666870117188, "global_step": 420706, "epoch": 5068} {"train_loss": -26.647329330444336, "global_step": 420707, "epoch": 5068} {"train_loss": -26.891332626342773, "global_step": 420708, "epoch": 5068} {"train_loss": -27.288440704345703, "global_step": 420709, "epoch": 5068} {"train_loss": -26.452728271484375, "global_step": 420710, "epoch": 5068} {"train_loss": -26.965723037719727, "global_step": 420711, "epoch": 5068} {"train_loss": -26.88924217224121, "global_step": 420712, "epoch": 5068} {"train_loss": -26.617475509643555, "global_step": 420713, "epoch": 5068} {"train_loss": -26.891021728515625, "global_step": 420714, "epoch": 5068} {"train_loss": -26.864288330078125, "global_step": 420715, "epoch": 5068} {"train_loss": -26.85877799987793, "global_step": 420716, "epoch": 5068} {"train_loss": -26.829130172729492, "global_step": 420717, "epoch": 5068} {"train_loss": -26.90449333190918, "global_step": 420718, "epoch": 5068} {"train_loss": -26.755842208862305, "global_step": 420719, "epoch": 5068} {"train_loss": -26.861501693725586, "global_step": 420720, "epoch": 5068} {"train_loss": -26.91855239868164, "global_step": 420721, "epoch": 5068} {"train_loss": -26.651351928710938, "global_step": 420722, "epoch": 5068} {"train_loss": -26.870655059814453, "global_step": 420723, "epoch": 5068} {"train_loss": -26.7802677154541, "global_step": 420724, "epoch": 5068} {"train_loss": -26.271207809448242, "global_step": 420725, "epoch": 5068} {"train_loss": -26.50183319183717, "global_step": 420726, "epoch": 5068, "val_loss": 7075732.0} {"train_loss": -26.377050399780273, "global_step": 420727, "epoch": 5069} {"train_loss": -25.767221450805664, "global_step": 420728, "epoch": 5069} {"train_loss": -26.148340225219727, "global_step": 420729, "epoch": 5069} {"train_loss": -26.476293563842773, "global_step": 420730, "epoch": 5069} {"train_loss": -26.031085968017578, "global_step": 420731, "epoch": 5069} {"train_loss": -26.03265380859375, "global_step": 420732, "epoch": 5069} {"train_loss": -25.862897872924805, "global_step": 420733, "epoch": 5069} {"train_loss": -26.759199142456055, "global_step": 420734, "epoch": 5069} {"train_loss": -25.989904403686523, "global_step": 420735, "epoch": 5069} {"train_loss": -26.413532257080078, "global_step": 420736, "epoch": 5069} {"train_loss": -26.652463912963867, "global_step": 420737, "epoch": 5069} {"train_loss": -26.361928939819336, "global_step": 420738, "epoch": 5069} {"train_loss": -26.737720489501953, "global_step": 420739, "epoch": 5069} {"train_loss": -26.517044067382812, "global_step": 420740, "epoch": 5069} {"train_loss": -26.513687133789062, "global_step": 420741, "epoch": 5069} {"train_loss": -26.253860473632812, "global_step": 420742, "epoch": 5069} {"train_loss": -26.71026039123535, "global_step": 420743, "epoch": 5069} {"train_loss": -26.5063533782959, "global_step": 420744, "epoch": 5069} {"train_loss": -26.983488082885742, "global_step": 420745, "epoch": 5069} {"train_loss": -26.52802848815918, "global_step": 420746, "epoch": 5069} {"train_loss": -26.59282875061035, "global_step": 420747, "epoch": 5069} {"train_loss": -26.352371215820312, "global_step": 420748, "epoch": 5069} {"train_loss": -26.80694007873535, "global_step": 420749, "epoch": 5069} {"train_loss": -27.2869815826416, "global_step": 420750, "epoch": 5069} {"train_loss": -27.090070724487305, "global_step": 420751, "epoch": 5069} {"train_loss": -26.980377197265625, "global_step": 420752, "epoch": 5069} {"train_loss": -27.0227108001709, "global_step": 420753, "epoch": 5069} {"train_loss": -26.88398551940918, "global_step": 420754, "epoch": 5069} {"train_loss": -27.273212432861328, "global_step": 420755, "epoch": 5069} {"train_loss": -27.1622257232666, "global_step": 420756, "epoch": 5069} {"train_loss": -26.74554443359375, "global_step": 420757, "epoch": 5069} {"train_loss": -26.942768096923828, "global_step": 420758, "epoch": 5069} {"train_loss": -26.598119735717773, "global_step": 420759, "epoch": 5069} {"train_loss": -26.678876876831055, "global_step": 420760, "epoch": 5069} {"train_loss": -27.184345245361328, "global_step": 420761, "epoch": 5069} {"train_loss": -26.837005615234375, "global_step": 420762, "epoch": 5069} {"train_loss": -27.140256881713867, "global_step": 420763, "epoch": 5069} {"train_loss": -26.5690975189209, "global_step": 420764, "epoch": 5069} {"train_loss": -27.339811325073242, "global_step": 420765, "epoch": 5069} {"train_loss": -26.952558517456055, "global_step": 420766, "epoch": 5069} {"train_loss": -26.73381996154785, "global_step": 420767, "epoch": 5069} {"train_loss": -26.914569854736328, "global_step": 420768, "epoch": 5069} {"train_loss": -26.748401641845703, "global_step": 420769, "epoch": 5069} {"train_loss": -26.805356979370117, "global_step": 420770, "epoch": 5069} {"train_loss": -26.779865264892578, "global_step": 420771, "epoch": 5069} {"train_loss": -26.76888084411621, "global_step": 420772, "epoch": 5069} {"train_loss": -27.430280685424805, "global_step": 420773, "epoch": 5069} {"train_loss": -26.897275924682617, "global_step": 420774, "epoch": 5069} {"train_loss": -27.196063995361328, "global_step": 420775, "epoch": 5069} {"train_loss": -26.946044921875, "global_step": 420776, "epoch": 5069} {"train_loss": -26.999380111694336, "global_step": 420777, "epoch": 5069} {"train_loss": -27.241605758666992, "global_step": 420778, "epoch": 5069} {"train_loss": -27.047622680664062, "global_step": 420779, "epoch": 5069} {"train_loss": -26.659259796142578, "global_step": 420780, "epoch": 5069} {"train_loss": -26.907846450805664, "global_step": 420781, "epoch": 5069} {"train_loss": -26.718656539916992, "global_step": 420782, "epoch": 5069} {"train_loss": -27.41108512878418, "global_step": 420783, "epoch": 5069} {"train_loss": -27.13811683654785, "global_step": 420784, "epoch": 5069} {"train_loss": -26.963254928588867, "global_step": 420785, "epoch": 5069} {"train_loss": -26.81880760192871, "global_step": 420786, "epoch": 5069} {"train_loss": -26.87516212463379, "global_step": 420787, "epoch": 5069} {"train_loss": -26.847681045532227, "global_step": 420788, "epoch": 5069} {"train_loss": -26.204242706298828, "global_step": 420789, "epoch": 5069} {"train_loss": -26.058164596557617, "global_step": 420790, "epoch": 5069} {"train_loss": -25.973480224609375, "global_step": 420791, "epoch": 5069} {"train_loss": -25.308603286743164, "global_step": 420792, "epoch": 5069} {"train_loss": -24.38608169555664, "global_step": 420793, "epoch": 5069} {"train_loss": -25.319265365600586, "global_step": 420794, "epoch": 5069} {"train_loss": -26.627216339111328, "global_step": 420795, "epoch": 5069} {"train_loss": -26.2592716217041, "global_step": 420796, "epoch": 5069} {"train_loss": -25.692785263061523, "global_step": 420797, "epoch": 5069} {"train_loss": -26.138473510742188, "global_step": 420798, "epoch": 5069} {"train_loss": -26.487104415893555, "global_step": 420799, "epoch": 5069} {"train_loss": -25.844589233398438, "global_step": 420800, "epoch": 5069} {"train_loss": -26.816654205322266, "global_step": 420801, "epoch": 5069} {"train_loss": -26.092031478881836, "global_step": 420802, "epoch": 5069} {"train_loss": -26.8416748046875, "global_step": 420803, "epoch": 5069} {"train_loss": -26.500049591064453, "global_step": 420804, "epoch": 5069} {"train_loss": -26.17000389099121, "global_step": 420805, "epoch": 5069} {"train_loss": -26.241901397705078, "global_step": 420806, "epoch": 5069} {"train_loss": -26.401987075805664, "global_step": 420807, "epoch": 5069} {"train_loss": -26.57159996032715, "global_step": 420808, "epoch": 5069} {"train_loss": -26.596135426716632, "global_step": 420809, "epoch": 5069, "val_loss": 7133829.5} {"train_loss": -26.095487594604492, "global_step": 420810, "epoch": 5070} {"train_loss": -26.54583168029785, "global_step": 420811, "epoch": 5070} {"train_loss": -26.396203994750977, "global_step": 420812, "epoch": 5070} {"train_loss": -26.627838134765625, "global_step": 420813, "epoch": 5070} {"train_loss": -26.674291610717773, "global_step": 420814, "epoch": 5070} {"train_loss": -26.3488826751709, "global_step": 420815, "epoch": 5070} {"train_loss": -26.456445693969727, "global_step": 420816, "epoch": 5070} {"train_loss": -26.745996475219727, "global_step": 420817, "epoch": 5070} {"train_loss": -26.57706642150879, "global_step": 420818, "epoch": 5070} {"train_loss": -26.635107040405273, "global_step": 420819, "epoch": 5070} {"train_loss": -27.022876739501953, "global_step": 420820, "epoch": 5070} {"train_loss": -26.626203536987305, "global_step": 420821, "epoch": 5070} {"train_loss": -26.800024032592773, "global_step": 420822, "epoch": 5070} {"train_loss": -26.616809844970703, "global_step": 420823, "epoch": 5070} {"train_loss": -26.845849990844727, "global_step": 420824, "epoch": 5070} {"train_loss": -26.933408737182617, "global_step": 420825, "epoch": 5070} {"train_loss": -26.918603897094727, "global_step": 420826, "epoch": 5070} {"train_loss": -27.014902114868164, "global_step": 420827, "epoch": 5070} {"train_loss": -27.216825485229492, "global_step": 420828, "epoch": 5070} {"train_loss": -26.52033042907715, "global_step": 420829, "epoch": 5070} {"train_loss": -26.754255294799805, "global_step": 420830, "epoch": 5070} {"train_loss": -26.90509605407715, "global_step": 420831, "epoch": 5070} {"train_loss": -27.074298858642578, "global_step": 420832, "epoch": 5070} {"train_loss": -27.00800132751465, "global_step": 420833, "epoch": 5070} {"train_loss": -26.70734977722168, "global_step": 420834, "epoch": 5070} {"train_loss": -26.60833740234375, "global_step": 420835, "epoch": 5070} {"train_loss": -26.748966217041016, "global_step": 420836, "epoch": 5070} {"train_loss": -26.908018112182617, "global_step": 420837, "epoch": 5070} {"train_loss": -26.783849716186523, "global_step": 420838, "epoch": 5070} {"train_loss": -26.992929458618164, "global_step": 420839, "epoch": 5070} {"train_loss": -27.204336166381836, "global_step": 420840, "epoch": 5070} {"train_loss": -27.029409408569336, "global_step": 420841, "epoch": 5070} {"train_loss": -26.949111938476562, "global_step": 420842, "epoch": 5070} {"train_loss": -27.011127471923828, "global_step": 420843, "epoch": 5070} {"train_loss": -26.8316650390625, "global_step": 420844, "epoch": 5070} {"train_loss": -26.930036544799805, "global_step": 420845, "epoch": 5070} {"train_loss": -27.09732437133789, "global_step": 420846, "epoch": 5070} {"train_loss": -26.675674438476562, "global_step": 420847, "epoch": 5070} {"train_loss": -27.1291561126709, "global_step": 420848, "epoch": 5070} {"train_loss": -26.845632553100586, "global_step": 420849, "epoch": 5070} {"train_loss": -26.93902587890625, "global_step": 420850, "epoch": 5070} {"train_loss": -26.73126220703125, "global_step": 420851, "epoch": 5070} {"train_loss": -27.032367706298828, "global_step": 420852, "epoch": 5070} {"train_loss": -27.2523250579834, "global_step": 420853, "epoch": 5070} {"train_loss": -26.862268447875977, "global_step": 420854, "epoch": 5070} {"train_loss": -27.08829689025879, "global_step": 420855, "epoch": 5070} {"train_loss": -26.99920654296875, "global_step": 420856, "epoch": 5070} {"train_loss": -26.876623153686523, "global_step": 420857, "epoch": 5070} {"train_loss": -26.95682144165039, "global_step": 420858, "epoch": 5070} {"train_loss": -27.241689682006836, "global_step": 420859, "epoch": 5070} {"train_loss": -27.035058975219727, "global_step": 420860, "epoch": 5070} {"train_loss": -26.941869735717773, "global_step": 420861, "epoch": 5070} {"train_loss": -26.803815841674805, "global_step": 420862, "epoch": 5070} {"train_loss": -27.491125106811523, "global_step": 420863, "epoch": 5070} {"train_loss": -26.890548706054688, "global_step": 420864, "epoch": 5070} {"train_loss": -27.186872482299805, "global_step": 420865, "epoch": 5070} {"train_loss": -26.865564346313477, "global_step": 420866, "epoch": 5070} {"train_loss": -26.69112205505371, "global_step": 420867, "epoch": 5070} {"train_loss": -27.03350830078125, "global_step": 420868, "epoch": 5070} {"train_loss": -26.935123443603516, "global_step": 420869, "epoch": 5070} {"train_loss": -27.13665771484375, "global_step": 420870, "epoch": 5070} {"train_loss": -26.9693660736084, "global_step": 420871, "epoch": 5070} {"train_loss": -26.733097076416016, "global_step": 420872, "epoch": 5070} {"train_loss": -26.551380157470703, "global_step": 420873, "epoch": 5070} {"train_loss": -26.919218063354492, "global_step": 420874, "epoch": 5070} {"train_loss": -26.83680534362793, "global_step": 420875, "epoch": 5070} {"train_loss": -26.77569580078125, "global_step": 420876, "epoch": 5070} {"train_loss": -26.84769058227539, "global_step": 420877, "epoch": 5070} {"train_loss": -26.83452796936035, "global_step": 420878, "epoch": 5070} {"train_loss": -26.991483688354492, "global_step": 420879, "epoch": 5070} {"train_loss": -26.835418701171875, "global_step": 420880, "epoch": 5070} {"train_loss": -27.09598731994629, "global_step": 420881, "epoch": 5070} {"train_loss": -26.594440460205078, "global_step": 420882, "epoch": 5070} {"train_loss": -26.9249267578125, "global_step": 420883, "epoch": 5070} {"train_loss": -26.762710571289062, "global_step": 420884, "epoch": 5070} {"train_loss": -27.24225425720215, "global_step": 420885, "epoch": 5070} {"train_loss": -26.839746475219727, "global_step": 420886, "epoch": 5070} {"train_loss": -26.366744995117188, "global_step": 420887, "epoch": 5070} {"train_loss": -26.102405548095703, "global_step": 420888, "epoch": 5070} {"train_loss": -26.223852157592773, "global_step": 420889, "epoch": 5070} {"train_loss": -26.793554306030273, "global_step": 420890, "epoch": 5070} {"train_loss": -26.80169677734375, "global_step": 420891, "epoch": 5070} {"train_loss": -26.853257696312593, "global_step": 420892, "epoch": 5070, "val_loss": 7064441.0} {"train_loss": -26.060781478881836, "global_step": 420893, "epoch": 5071} {"train_loss": -24.399690628051758, "global_step": 420894, "epoch": 5071} {"train_loss": -26.033679962158203, "global_step": 420895, "epoch": 5071} {"train_loss": -25.469532012939453, "global_step": 420896, "epoch": 5071} {"train_loss": -25.10646629333496, "global_step": 420897, "epoch": 5071} {"train_loss": -26.170164108276367, "global_step": 420898, "epoch": 5071} {"train_loss": -25.38810920715332, "global_step": 420899, "epoch": 5071} {"train_loss": -26.191028594970703, "global_step": 420900, "epoch": 5071} {"train_loss": -25.673559188842773, "global_step": 420901, "epoch": 5071} {"train_loss": -26.1972713470459, "global_step": 420902, "epoch": 5071} {"train_loss": -26.093557357788086, "global_step": 420903, "epoch": 5071} {"train_loss": -26.35135841369629, "global_step": 420904, "epoch": 5071} {"train_loss": -26.29054069519043, "global_step": 420905, "epoch": 5071} {"train_loss": -25.778295516967773, "global_step": 420906, "epoch": 5071} {"train_loss": -26.343854904174805, "global_step": 420907, "epoch": 5071} {"train_loss": -26.383197784423828, "global_step": 420908, "epoch": 5071} {"train_loss": -25.927108764648438, "global_step": 420909, "epoch": 5071} {"train_loss": -26.5906982421875, "global_step": 420910, "epoch": 5071} {"train_loss": -26.053373336791992, "global_step": 420911, "epoch": 5071} {"train_loss": -26.511865615844727, "global_step": 420912, "epoch": 5071} {"train_loss": -26.210601806640625, "global_step": 420913, "epoch": 5071} {"train_loss": -26.436447143554688, "global_step": 420914, "epoch": 5071} {"train_loss": -26.43817710876465, "global_step": 420915, "epoch": 5071} {"train_loss": -26.538671493530273, "global_step": 420916, "epoch": 5071} {"train_loss": -26.463897705078125, "global_step": 420917, "epoch": 5071} {"train_loss": -26.282880783081055, "global_step": 420918, "epoch": 5071} {"train_loss": -26.613235473632812, "global_step": 420919, "epoch": 5071} {"train_loss": -26.247690200805664, "global_step": 420920, "epoch": 5071} {"train_loss": -26.110620498657227, "global_step": 420921, "epoch": 5071} {"train_loss": -26.466394424438477, "global_step": 420922, "epoch": 5071} {"train_loss": -26.4947509765625, "global_step": 420923, "epoch": 5071} {"train_loss": -26.756383895874023, "global_step": 420924, "epoch": 5071} {"train_loss": -26.37156105041504, "global_step": 420925, "epoch": 5071} {"train_loss": -26.506610870361328, "global_step": 420926, "epoch": 5071} {"train_loss": -26.336755752563477, "global_step": 420927, "epoch": 5071} {"train_loss": -26.603200912475586, "global_step": 420928, "epoch": 5071} {"train_loss": -26.799280166625977, "global_step": 420929, "epoch": 5071} {"train_loss": -26.994787216186523, "global_step": 420930, "epoch": 5071} {"train_loss": -26.77931022644043, "global_step": 420931, "epoch": 5071} {"train_loss": -26.952001571655273, "global_step": 420932, "epoch": 5071} {"train_loss": -26.69599723815918, "global_step": 420933, "epoch": 5071} {"train_loss": -26.799591064453125, "global_step": 420934, "epoch": 5071} {"train_loss": -27.073694229125977, "global_step": 420935, "epoch": 5071} {"train_loss": -26.857641220092773, "global_step": 420936, "epoch": 5071} {"train_loss": -26.931594848632812, "global_step": 420937, "epoch": 5071} {"train_loss": -26.571557998657227, "global_step": 420938, "epoch": 5071} {"train_loss": -26.685321807861328, "global_step": 420939, "epoch": 5071} {"train_loss": -26.6169376373291, "global_step": 420940, "epoch": 5071} {"train_loss": -26.67011833190918, "global_step": 420941, "epoch": 5071} {"train_loss": -27.137487411499023, "global_step": 420942, "epoch": 5071} {"train_loss": -26.90559196472168, "global_step": 420943, "epoch": 5071} {"train_loss": -27.2706241607666, "global_step": 420944, "epoch": 5071} {"train_loss": -27.02288818359375, "global_step": 420945, "epoch": 5071} {"train_loss": -27.09173011779785, "global_step": 420946, "epoch": 5071} {"train_loss": -26.828332901000977, "global_step": 420947, "epoch": 5071} {"train_loss": -26.805566787719727, "global_step": 420948, "epoch": 5071} {"train_loss": -27.231842041015625, "global_step": 420949, "epoch": 5071} {"train_loss": -27.136884689331055, "global_step": 420950, "epoch": 5071} {"train_loss": -27.112226486206055, "global_step": 420951, "epoch": 5071} {"train_loss": -27.356592178344727, "global_step": 420952, "epoch": 5071} {"train_loss": -26.983198165893555, "global_step": 420953, "epoch": 5071} {"train_loss": -26.976776123046875, "global_step": 420954, "epoch": 5071} {"train_loss": -26.835235595703125, "global_step": 420955, "epoch": 5071} {"train_loss": -26.946638107299805, "global_step": 420956, "epoch": 5071} {"train_loss": -26.976795196533203, "global_step": 420957, "epoch": 5071} {"train_loss": -27.211423873901367, "global_step": 420958, "epoch": 5071} {"train_loss": -26.723508834838867, "global_step": 420959, "epoch": 5071} {"train_loss": -26.745813369750977, "global_step": 420960, "epoch": 5071} {"train_loss": -26.946298599243164, "global_step": 420961, "epoch": 5071} {"train_loss": -26.76881217956543, "global_step": 420962, "epoch": 5071} {"train_loss": -26.938825607299805, "global_step": 420963, "epoch": 5071} {"train_loss": -26.776575088500977, "global_step": 420964, "epoch": 5071} {"train_loss": -26.283292770385742, "global_step": 420965, "epoch": 5071} {"train_loss": -26.651044845581055, "global_step": 420966, "epoch": 5071} {"train_loss": -26.7625732421875, "global_step": 420967, "epoch": 5071} {"train_loss": -26.91061782836914, "global_step": 420968, "epoch": 5071} {"train_loss": -26.320831298828125, "global_step": 420969, "epoch": 5071} {"train_loss": -26.200239181518555, "global_step": 420970, "epoch": 5071} {"train_loss": -26.099889755249023, "global_step": 420971, "epoch": 5071} {"train_loss": -26.598630905151367, "global_step": 420972, "epoch": 5071} {"train_loss": -26.488849639892578, "global_step": 420973, "epoch": 5071} {"train_loss": -26.908660888671875, "global_step": 420974, "epoch": 5071} {"train_loss": -26.5428845049387, "global_step": 420975, "epoch": 5071, "val_loss": 6990608.0} {"train_loss": -25.922414779663086, "global_step": 420976, "epoch": 5072} {"train_loss": -25.77601432800293, "global_step": 420977, "epoch": 5072} {"train_loss": -26.301685333251953, "global_step": 420978, "epoch": 5072} {"train_loss": -26.3228759765625, "global_step": 420979, "epoch": 5072} {"train_loss": -26.147663116455078, "global_step": 420980, "epoch": 5072} {"train_loss": -26.198373794555664, "global_step": 420981, "epoch": 5072} {"train_loss": -26.39397621154785, "global_step": 420982, "epoch": 5072} {"train_loss": -26.529373168945312, "global_step": 420983, "epoch": 5072} {"train_loss": -26.31613540649414, "global_step": 420984, "epoch": 5072} {"train_loss": -26.403879165649414, "global_step": 420985, "epoch": 5072} {"train_loss": -26.21270179748535, "global_step": 420986, "epoch": 5072} {"train_loss": -26.62050437927246, "global_step": 420987, "epoch": 5072} {"train_loss": -26.63775634765625, "global_step": 420988, "epoch": 5072} {"train_loss": -26.564496994018555, "global_step": 420989, "epoch": 5072} {"train_loss": -26.714752197265625, "global_step": 420990, "epoch": 5072} {"train_loss": -26.68271827697754, "global_step": 420991, "epoch": 5072} {"train_loss": -26.39422035217285, "global_step": 420992, "epoch": 5072} {"train_loss": -26.766525268554688, "global_step": 420993, "epoch": 5072} {"train_loss": -26.470539093017578, "global_step": 420994, "epoch": 5072} {"train_loss": -26.944849014282227, "global_step": 420995, "epoch": 5072} {"train_loss": -26.899219512939453, "global_step": 420996, "epoch": 5072} {"train_loss": -26.86285400390625, "global_step": 420997, "epoch": 5072} {"train_loss": -27.061725616455078, "global_step": 420998, "epoch": 5072} {"train_loss": -26.698089599609375, "global_step": 420999, "epoch": 5072} {"train_loss": -27.022464752197266, "global_step": 421000, "epoch": 5072} {"train_loss": -26.844146728515625, "global_step": 421001, "epoch": 5072} {"train_loss": -26.875669479370117, "global_step": 421002, "epoch": 5072} {"train_loss": -26.89680290222168, "global_step": 421003, "epoch": 5072} {"train_loss": -26.458417892456055, "global_step": 421004, "epoch": 5072} {"train_loss": -26.994672775268555, "global_step": 421005, "epoch": 5072} {"train_loss": -26.868513107299805, "global_step": 421006, "epoch": 5072} {"train_loss": -26.626951217651367, "global_step": 421007, "epoch": 5072} {"train_loss": -27.198286056518555, "global_step": 421008, "epoch": 5072} {"train_loss": -26.925138473510742, "global_step": 421009, "epoch": 5072} {"train_loss": -26.90461540222168, "global_step": 421010, "epoch": 5072} {"train_loss": -26.633316040039062, "global_step": 421011, "epoch": 5072} {"train_loss": -27.23259925842285, "global_step": 421012, "epoch": 5072} {"train_loss": -26.86060905456543, "global_step": 421013, "epoch": 5072} {"train_loss": -26.745397567749023, "global_step": 421014, "epoch": 5072} {"train_loss": -26.861433029174805, "global_step": 421015, "epoch": 5072} {"train_loss": -26.849706649780273, "global_step": 421016, "epoch": 5072} {"train_loss": -26.7053279876709, "global_step": 421017, "epoch": 5072} {"train_loss": -27.018461227416992, "global_step": 421018, "epoch": 5072} {"train_loss": -26.970312118530273, "global_step": 421019, "epoch": 5072} {"train_loss": -27.256994247436523, "global_step": 421020, "epoch": 5072} {"train_loss": -27.175739288330078, "global_step": 421021, "epoch": 5072} {"train_loss": -26.7962589263916, "global_step": 421022, "epoch": 5072} {"train_loss": -26.9354190826416, "global_step": 421023, "epoch": 5072} {"train_loss": -26.633127212524414, "global_step": 421024, "epoch": 5072} {"train_loss": -26.8985595703125, "global_step": 421025, "epoch": 5072} {"train_loss": -26.973840713500977, "global_step": 421026, "epoch": 5072} {"train_loss": -26.91840171813965, "global_step": 421027, "epoch": 5072} {"train_loss": -26.62749671936035, "global_step": 421028, "epoch": 5072} {"train_loss": -26.837636947631836, "global_step": 421029, "epoch": 5072} {"train_loss": -26.707380294799805, "global_step": 421030, "epoch": 5072} {"train_loss": -27.32488441467285, "global_step": 421031, "epoch": 5072} {"train_loss": -27.090925216674805, "global_step": 421032, "epoch": 5072} {"train_loss": -26.81040382385254, "global_step": 421033, "epoch": 5072} {"train_loss": -26.884729385375977, "global_step": 421034, "epoch": 5072} {"train_loss": -26.994470596313477, "global_step": 421035, "epoch": 5072} {"train_loss": -27.192005157470703, "global_step": 421036, "epoch": 5072} {"train_loss": -27.166168212890625, "global_step": 421037, "epoch": 5072} {"train_loss": -26.8060302734375, "global_step": 421038, "epoch": 5072} {"train_loss": -27.055286407470703, "global_step": 421039, "epoch": 5072} {"train_loss": -26.437475204467773, "global_step": 421040, "epoch": 5072} {"train_loss": -27.0697078704834, "global_step": 421041, "epoch": 5072} {"train_loss": -26.79133415222168, "global_step": 421042, "epoch": 5072} {"train_loss": -26.797382354736328, "global_step": 421043, "epoch": 5072} {"train_loss": -26.8598575592041, "global_step": 421044, "epoch": 5072} {"train_loss": -26.85797691345215, "global_step": 421045, "epoch": 5072} {"train_loss": -26.98075294494629, "global_step": 421046, "epoch": 5072} {"train_loss": -26.68450355529785, "global_step": 421047, "epoch": 5072} {"train_loss": -26.94280433654785, "global_step": 421048, "epoch": 5072} {"train_loss": -26.83786964416504, "global_step": 421049, "epoch": 5072} {"train_loss": -27.071613311767578, "global_step": 421050, "epoch": 5072} {"train_loss": -27.355945587158203, "global_step": 421051, "epoch": 5072} {"train_loss": -26.629623413085938, "global_step": 421052, "epoch": 5072} {"train_loss": -27.008655548095703, "global_step": 421053, "epoch": 5072} {"train_loss": -26.740264892578125, "global_step": 421054, "epoch": 5072} {"train_loss": -26.899551391601562, "global_step": 421055, "epoch": 5072} {"train_loss": -26.823827743530273, "global_step": 421056, "epoch": 5072} {"train_loss": -26.792600631713867, "global_step": 421057, "epoch": 5072} {"train_loss": -26.78326634326613, "global_step": 421058, "epoch": 5072, "val_loss": 7049925.0} {"train_loss": -26.326007843017578, "global_step": 421059, "epoch": 5073} {"train_loss": -25.5877628326416, "global_step": 421060, "epoch": 5073} {"train_loss": -25.91812515258789, "global_step": 421061, "epoch": 5073} {"train_loss": -26.60845375061035, "global_step": 421062, "epoch": 5073} {"train_loss": -26.373138427734375, "global_step": 421063, "epoch": 5073} {"train_loss": -26.663043975830078, "global_step": 421064, "epoch": 5073} {"train_loss": -26.770648956298828, "global_step": 421065, "epoch": 5073} {"train_loss": -26.420263290405273, "global_step": 421066, "epoch": 5073} {"train_loss": -26.94281005859375, "global_step": 421067, "epoch": 5073} {"train_loss": -26.82014274597168, "global_step": 421068, "epoch": 5073} {"train_loss": -26.701990127563477, "global_step": 421069, "epoch": 5073} {"train_loss": -26.655248641967773, "global_step": 421070, "epoch": 5073} {"train_loss": -26.86652946472168, "global_step": 421071, "epoch": 5073} {"train_loss": -26.690399169921875, "global_step": 421072, "epoch": 5073} {"train_loss": -27.001068115234375, "global_step": 421073, "epoch": 5073} {"train_loss": -27.00983238220215, "global_step": 421074, "epoch": 5073} {"train_loss": -26.87212562561035, "global_step": 421075, "epoch": 5073} {"train_loss": -26.782943725585938, "global_step": 421076, "epoch": 5073} {"train_loss": -26.886632919311523, "global_step": 421077, "epoch": 5073} {"train_loss": -26.723493576049805, "global_step": 421078, "epoch": 5073} {"train_loss": -26.6405029296875, "global_step": 421079, "epoch": 5073} {"train_loss": -26.643712997436523, "global_step": 421080, "epoch": 5073} {"train_loss": -27.296728134155273, "global_step": 421081, "epoch": 5073} {"train_loss": -26.9368896484375, "global_step": 421082, "epoch": 5073} {"train_loss": -26.485624313354492, "global_step": 421083, "epoch": 5073} {"train_loss": -26.872522354125977, "global_step": 421084, "epoch": 5073} {"train_loss": -26.67328453063965, "global_step": 421085, "epoch": 5073} {"train_loss": -26.96042251586914, "global_step": 421086, "epoch": 5073} {"train_loss": -26.877012252807617, "global_step": 421087, "epoch": 5073} {"train_loss": -26.66609001159668, "global_step": 421088, "epoch": 5073} {"train_loss": -26.5831241607666, "global_step": 421089, "epoch": 5073} {"train_loss": -26.88809585571289, "global_step": 421090, "epoch": 5073} {"train_loss": -26.873245239257812, "global_step": 421091, "epoch": 5073} {"train_loss": -27.107147216796875, "global_step": 421092, "epoch": 5073} {"train_loss": -26.601642608642578, "global_step": 421093, "epoch": 5073} {"train_loss": -26.993131637573242, "global_step": 421094, "epoch": 5073} {"train_loss": -27.01722526550293, "global_step": 421095, "epoch": 5073} {"train_loss": -26.767908096313477, "global_step": 421096, "epoch": 5073} {"train_loss": -27.18043327331543, "global_step": 421097, "epoch": 5073} {"train_loss": -27.16961097717285, "global_step": 421098, "epoch": 5073} {"train_loss": -27.060073852539062, "global_step": 421099, "epoch": 5073} {"train_loss": -27.029022216796875, "global_step": 421100, "epoch": 5073} {"train_loss": -26.842878341674805, "global_step": 421101, "epoch": 5073} {"train_loss": -27.090513229370117, "global_step": 421102, "epoch": 5073} {"train_loss": -26.591083526611328, "global_step": 421103, "epoch": 5073} {"train_loss": -26.752119064331055, "global_step": 421104, "epoch": 5073} {"train_loss": -26.747802734375, "global_step": 421105, "epoch": 5073} {"train_loss": -27.02617835998535, "global_step": 421106, "epoch": 5073} {"train_loss": -26.568044662475586, "global_step": 421107, "epoch": 5073} {"train_loss": -27.130517959594727, "global_step": 421108, "epoch": 5073} {"train_loss": -26.925769805908203, "global_step": 421109, "epoch": 5073} {"train_loss": -26.921018600463867, "global_step": 421110, "epoch": 5073} {"train_loss": -26.635984420776367, "global_step": 421111, "epoch": 5073} {"train_loss": -27.079727172851562, "global_step": 421112, "epoch": 5073} {"train_loss": -27.2627010345459, "global_step": 421113, "epoch": 5073} {"train_loss": -26.750534057617188, "global_step": 421114, "epoch": 5073} {"train_loss": -26.851959228515625, "global_step": 421115, "epoch": 5073} {"train_loss": -26.973346710205078, "global_step": 421116, "epoch": 5073} {"train_loss": -27.005292892456055, "global_step": 421117, "epoch": 5073} {"train_loss": -27.132299423217773, "global_step": 421118, "epoch": 5073} {"train_loss": -27.194690704345703, "global_step": 421119, "epoch": 5073} {"train_loss": -26.542495727539062, "global_step": 421120, "epoch": 5073} {"train_loss": -26.65815544128418, "global_step": 421121, "epoch": 5073} {"train_loss": -26.703170776367188, "global_step": 421122, "epoch": 5073} {"train_loss": -26.833288192749023, "global_step": 421123, "epoch": 5073} {"train_loss": -26.69061279296875, "global_step": 421124, "epoch": 5073} {"train_loss": -26.57281494140625, "global_step": 421125, "epoch": 5073} {"train_loss": -26.68402099609375, "global_step": 421126, "epoch": 5073} {"train_loss": -26.637393951416016, "global_step": 421127, "epoch": 5073} {"train_loss": -27.1166934967041, "global_step": 421128, "epoch": 5073} {"train_loss": -26.805334091186523, "global_step": 421129, "epoch": 5073} {"train_loss": -26.929962158203125, "global_step": 421130, "epoch": 5073} {"train_loss": -27.09187889099121, "global_step": 421131, "epoch": 5073} {"train_loss": -26.919164657592773, "global_step": 421132, "epoch": 5073} {"train_loss": -26.705615997314453, "global_step": 421133, "epoch": 5073} {"train_loss": -26.607715606689453, "global_step": 421134, "epoch": 5073} {"train_loss": -26.3341064453125, "global_step": 421135, "epoch": 5073} {"train_loss": -26.761341094970703, "global_step": 421136, "epoch": 5073} {"train_loss": -26.69954490661621, "global_step": 421137, "epoch": 5073} {"train_loss": -26.849567413330078, "global_step": 421138, "epoch": 5073} {"train_loss": -26.561918258666992, "global_step": 421139, "epoch": 5073} {"train_loss": -26.884323120117188, "global_step": 421140, "epoch": 5073} {"train_loss": -26.79620935830725, "global_step": 421141, "epoch": 5073, "val_loss": 7108099.0} {"train_loss": -26.36136817932129, "global_step": 421142, "epoch": 5074} {"train_loss": -26.22352409362793, "global_step": 421143, "epoch": 5074} {"train_loss": -26.236677169799805, "global_step": 421144, "epoch": 5074} {"train_loss": -26.36322021484375, "global_step": 421145, "epoch": 5074} {"train_loss": -26.261083602905273, "global_step": 421146, "epoch": 5074} {"train_loss": -26.1749210357666, "global_step": 421147, "epoch": 5074} {"train_loss": -26.351043701171875, "global_step": 421148, "epoch": 5074} {"train_loss": -26.345190048217773, "global_step": 421149, "epoch": 5074} {"train_loss": -26.10967445373535, "global_step": 421150, "epoch": 5074} {"train_loss": -26.955169677734375, "global_step": 421151, "epoch": 5074} {"train_loss": -26.017248153686523, "global_step": 421152, "epoch": 5074} {"train_loss": -26.428287506103516, "global_step": 421153, "epoch": 5074} {"train_loss": -26.723474502563477, "global_step": 421154, "epoch": 5074} {"train_loss": -26.594268798828125, "global_step": 421155, "epoch": 5074} {"train_loss": -26.6403751373291, "global_step": 421156, "epoch": 5074} {"train_loss": -26.704925537109375, "global_step": 421157, "epoch": 5074} {"train_loss": -27.125720977783203, "global_step": 421158, "epoch": 5074} {"train_loss": -26.580671310424805, "global_step": 421159, "epoch": 5074} {"train_loss": -26.35511589050293, "global_step": 421160, "epoch": 5074} {"train_loss": -26.932432174682617, "global_step": 421161, "epoch": 5074} {"train_loss": -26.655603408813477, "global_step": 421162, "epoch": 5074} {"train_loss": -26.61598777770996, "global_step": 421163, "epoch": 5074} {"train_loss": -26.79856300354004, "global_step": 421164, "epoch": 5074} {"train_loss": -26.36903190612793, "global_step": 421165, "epoch": 5074} {"train_loss": -27.01922035217285, "global_step": 421166, "epoch": 5074} {"train_loss": -26.844709396362305, "global_step": 421167, "epoch": 5074} {"train_loss": -26.820419311523438, "global_step": 421168, "epoch": 5074} {"train_loss": -26.496906280517578, "global_step": 421169, "epoch": 5074} {"train_loss": -26.632455825805664, "global_step": 421170, "epoch": 5074} {"train_loss": -27.197895050048828, "global_step": 421171, "epoch": 5074} {"train_loss": -26.980300903320312, "global_step": 421172, "epoch": 5074} {"train_loss": -26.785781860351562, "global_step": 421173, "epoch": 5074} {"train_loss": -26.789793014526367, "global_step": 421174, "epoch": 5074} {"train_loss": -27.141254425048828, "global_step": 421175, "epoch": 5074} {"train_loss": -27.189939498901367, "global_step": 421176, "epoch": 5074} {"train_loss": -26.967138290405273, "global_step": 421177, "epoch": 5074} {"train_loss": -26.9017333984375, "global_step": 421178, "epoch": 5074} {"train_loss": -26.787031173706055, "global_step": 421179, "epoch": 5074} {"train_loss": -27.115488052368164, "global_step": 421180, "epoch": 5074} {"train_loss": -26.86478042602539, "global_step": 421181, "epoch": 5074} {"train_loss": -26.888568878173828, "global_step": 421182, "epoch": 5074} {"train_loss": -26.81633949279785, "global_step": 421183, "epoch": 5074} {"train_loss": -26.460485458374023, "global_step": 421184, "epoch": 5074} {"train_loss": -26.13911247253418, "global_step": 421185, "epoch": 5074} {"train_loss": -27.0787296295166, "global_step": 421186, "epoch": 5074} {"train_loss": -26.572553634643555, "global_step": 421187, "epoch": 5074} {"train_loss": -26.430103302001953, "global_step": 421188, "epoch": 5074} {"train_loss": -27.01653480529785, "global_step": 421189, "epoch": 5074} {"train_loss": -26.88953971862793, "global_step": 421190, "epoch": 5074} {"train_loss": -26.40382194519043, "global_step": 421191, "epoch": 5074} {"train_loss": -26.557523727416992, "global_step": 421192, "epoch": 5074} {"train_loss": -26.88606071472168, "global_step": 421193, "epoch": 5074} {"train_loss": -26.831562042236328, "global_step": 421194, "epoch": 5074} {"train_loss": -27.124067306518555, "global_step": 421195, "epoch": 5074} {"train_loss": -26.74082374572754, "global_step": 421196, "epoch": 5074} {"train_loss": -26.879837036132812, "global_step": 421197, "epoch": 5074} {"train_loss": -26.698095321655273, "global_step": 421198, "epoch": 5074} {"train_loss": -26.967573165893555, "global_step": 421199, "epoch": 5074} {"train_loss": -26.98883628845215, "global_step": 421200, "epoch": 5074} {"train_loss": -26.689130783081055, "global_step": 421201, "epoch": 5074} {"train_loss": -27.2541446685791, "global_step": 421202, "epoch": 5074} {"train_loss": -26.725818634033203, "global_step": 421203, "epoch": 5074} {"train_loss": -26.77781105041504, "global_step": 421204, "epoch": 5074} {"train_loss": -26.841455459594727, "global_step": 421205, "epoch": 5074} {"train_loss": -26.741168975830078, "global_step": 421206, "epoch": 5074} {"train_loss": -26.95572853088379, "global_step": 421207, "epoch": 5074} {"train_loss": -26.62904930114746, "global_step": 421208, "epoch": 5074} {"train_loss": -26.666624069213867, "global_step": 421209, "epoch": 5074} {"train_loss": -26.59795570373535, "global_step": 421210, "epoch": 5074} {"train_loss": -27.140472412109375, "global_step": 421211, "epoch": 5074} {"train_loss": -26.771472930908203, "global_step": 421212, "epoch": 5074} {"train_loss": -26.98876953125, "global_step": 421213, "epoch": 5074} {"train_loss": -26.7778263092041, "global_step": 421214, "epoch": 5074} {"train_loss": -27.22702980041504, "global_step": 421215, "epoch": 5074} {"train_loss": -27.042373657226562, "global_step": 421216, "epoch": 5074} {"train_loss": -27.213764190673828, "global_step": 421217, "epoch": 5074} {"train_loss": -26.9209041595459, "global_step": 421218, "epoch": 5074} {"train_loss": -26.922765731811523, "global_step": 421219, "epoch": 5074} {"train_loss": -26.84332275390625, "global_step": 421220, "epoch": 5074} {"train_loss": -26.82398796081543, "global_step": 421221, "epoch": 5074} {"train_loss": -26.954620361328125, "global_step": 421222, "epoch": 5074} {"train_loss": -27.012914657592773, "global_step": 421223, "epoch": 5074} {"train_loss": -26.75187184437212, "global_step": 421224, "epoch": 5074, "val_loss": 7015995.0} {"train_loss": -25.887922286987305, "global_step": 421225, "epoch": 5075} {"train_loss": -25.393644332885742, "global_step": 421226, "epoch": 5075} {"train_loss": -26.174840927124023, "global_step": 421227, "epoch": 5075} {"train_loss": -26.560998916625977, "global_step": 421228, "epoch": 5075} {"train_loss": -26.06733512878418, "global_step": 421229, "epoch": 5075} {"train_loss": -26.20114517211914, "global_step": 421230, "epoch": 5075} {"train_loss": -26.115680694580078, "global_step": 421231, "epoch": 5075} {"train_loss": -26.47641944885254, "global_step": 421232, "epoch": 5075} {"train_loss": -26.360273361206055, "global_step": 421233, "epoch": 5075} {"train_loss": -26.124298095703125, "global_step": 421234, "epoch": 5075} {"train_loss": -26.68863868713379, "global_step": 421235, "epoch": 5075} {"train_loss": -25.993677139282227, "global_step": 421236, "epoch": 5075} {"train_loss": -26.4991512298584, "global_step": 421237, "epoch": 5075} {"train_loss": -26.210290908813477, "global_step": 421238, "epoch": 5075} {"train_loss": -26.424863815307617, "global_step": 421239, "epoch": 5075} {"train_loss": -26.448165893554688, "global_step": 421240, "epoch": 5075} {"train_loss": -26.385839462280273, "global_step": 421241, "epoch": 5075} {"train_loss": -26.79652214050293, "global_step": 421242, "epoch": 5075} {"train_loss": -26.4771671295166, "global_step": 421243, "epoch": 5075} {"train_loss": -26.588977813720703, "global_step": 421244, "epoch": 5075} {"train_loss": -26.645584106445312, "global_step": 421245, "epoch": 5075} {"train_loss": -26.836668014526367, "global_step": 421246, "epoch": 5075} {"train_loss": -26.6541748046875, "global_step": 421247, "epoch": 5075} {"train_loss": -26.554555892944336, "global_step": 421248, "epoch": 5075} {"train_loss": -26.545093536376953, "global_step": 421249, "epoch": 5075} {"train_loss": -26.898725509643555, "global_step": 421250, "epoch": 5075} {"train_loss": -26.47779655456543, "global_step": 421251, "epoch": 5075} {"train_loss": -26.50111198425293, "global_step": 421252, "epoch": 5075} {"train_loss": -27.10092544555664, "global_step": 421253, "epoch": 5075} {"train_loss": -26.681821823120117, "global_step": 421254, "epoch": 5075} {"train_loss": -26.782651901245117, "global_step": 421255, "epoch": 5075} {"train_loss": -26.780569076538086, "global_step": 421256, "epoch": 5075} {"train_loss": -26.862232208251953, "global_step": 421257, "epoch": 5075} {"train_loss": -26.523834228515625, "global_step": 421258, "epoch": 5075} {"train_loss": -26.436792373657227, "global_step": 421259, "epoch": 5075} {"train_loss": -27.22186279296875, "global_step": 421260, "epoch": 5075} {"train_loss": -26.85516357421875, "global_step": 421261, "epoch": 5075} {"train_loss": -26.836807250976562, "global_step": 421262, "epoch": 5075} {"train_loss": -26.927520751953125, "global_step": 421263, "epoch": 5075} {"train_loss": -26.975433349609375, "global_step": 421264, "epoch": 5075} {"train_loss": -26.68009376525879, "global_step": 421265, "epoch": 5075} {"train_loss": -26.403852462768555, "global_step": 421266, "epoch": 5075} {"train_loss": -26.644052505493164, "global_step": 421267, "epoch": 5075} {"train_loss": -27.001012802124023, "global_step": 421268, "epoch": 5075} {"train_loss": -26.9491024017334, "global_step": 421269, "epoch": 5075} {"train_loss": -27.194822311401367, "global_step": 421270, "epoch": 5075} {"train_loss": -26.830078125, "global_step": 421271, "epoch": 5075} {"train_loss": -27.103290557861328, "global_step": 421272, "epoch": 5075} {"train_loss": -26.942657470703125, "global_step": 421273, "epoch": 5075} {"train_loss": -26.849210739135742, "global_step": 421274, "epoch": 5075} {"train_loss": -26.688892364501953, "global_step": 421275, "epoch": 5075} {"train_loss": -26.587987899780273, "global_step": 421276, "epoch": 5075} {"train_loss": -26.957075119018555, "global_step": 421277, "epoch": 5075} {"train_loss": -27.07545280456543, "global_step": 421278, "epoch": 5075} {"train_loss": -26.89275550842285, "global_step": 421279, "epoch": 5075} {"train_loss": -26.914411544799805, "global_step": 421280, "epoch": 5075} {"train_loss": -26.92656898498535, "global_step": 421281, "epoch": 5075} {"train_loss": -26.992706298828125, "global_step": 421282, "epoch": 5075} {"train_loss": -26.668745040893555, "global_step": 421283, "epoch": 5075} {"train_loss": -26.986316680908203, "global_step": 421284, "epoch": 5075} {"train_loss": -26.637725830078125, "global_step": 421285, "epoch": 5075} {"train_loss": -26.78846549987793, "global_step": 421286, "epoch": 5075} {"train_loss": -26.920080184936523, "global_step": 421287, "epoch": 5075} {"train_loss": -26.383209228515625, "global_step": 421288, "epoch": 5075} {"train_loss": -26.569440841674805, "global_step": 421289, "epoch": 5075} {"train_loss": -26.82281494140625, "global_step": 421290, "epoch": 5075} {"train_loss": -26.902490615844727, "global_step": 421291, "epoch": 5075} {"train_loss": -26.73579216003418, "global_step": 421292, "epoch": 5075} {"train_loss": -26.822294235229492, "global_step": 421293, "epoch": 5075} {"train_loss": -26.49853515625, "global_step": 421294, "epoch": 5075} {"train_loss": -27.205341339111328, "global_step": 421295, "epoch": 5075} {"train_loss": -26.786096572875977, "global_step": 421296, "epoch": 5075} {"train_loss": -26.989248275756836, "global_step": 421297, "epoch": 5075} {"train_loss": -26.770172119140625, "global_step": 421298, "epoch": 5075} {"train_loss": -27.153120040893555, "global_step": 421299, "epoch": 5075} {"train_loss": -26.543842315673828, "global_step": 421300, "epoch": 5075} {"train_loss": -26.98567008972168, "global_step": 421301, "epoch": 5075} {"train_loss": -26.74566078186035, "global_step": 421302, "epoch": 5075} {"train_loss": -26.828052520751953, "global_step": 421303, "epoch": 5075} {"train_loss": -26.945959091186523, "global_step": 421304, "epoch": 5075} {"train_loss": -26.917394638061523, "global_step": 421305, "epoch": 5075} {"train_loss": -26.55299186706543, "global_step": 421306, "epoch": 5075} {"train_loss": -26.665162672479468, "global_step": 421307, "epoch": 5075, "val_loss": 7074547.0} {"train_loss": -25.587339401245117, "global_step": 421308, "epoch": 5076} {"train_loss": -25.10173988342285, "global_step": 421309, "epoch": 5076} {"train_loss": -26.096389770507812, "global_step": 421310, "epoch": 5076} {"train_loss": -25.605627059936523, "global_step": 421311, "epoch": 5076} {"train_loss": -26.0200252532959, "global_step": 421312, "epoch": 5076} {"train_loss": -25.295164108276367, "global_step": 421313, "epoch": 5076} {"train_loss": -26.079004287719727, "global_step": 421314, "epoch": 5076} {"train_loss": -25.922733306884766, "global_step": 421315, "epoch": 5076} {"train_loss": -26.568115234375, "global_step": 421316, "epoch": 5076} {"train_loss": -26.15228271484375, "global_step": 421317, "epoch": 5076} {"train_loss": -26.050403594970703, "global_step": 421318, "epoch": 5076} {"train_loss": -26.0659122467041, "global_step": 421319, "epoch": 5076} {"train_loss": -26.546056747436523, "global_step": 421320, "epoch": 5076} {"train_loss": -26.246810913085938, "global_step": 421321, "epoch": 5076} {"train_loss": -26.418066024780273, "global_step": 421322, "epoch": 5076} {"train_loss": -26.548856735229492, "global_step": 421323, "epoch": 5076} {"train_loss": -26.135984420776367, "global_step": 421324, "epoch": 5076} {"train_loss": -26.289417266845703, "global_step": 421325, "epoch": 5076} {"train_loss": -26.54123878479004, "global_step": 421326, "epoch": 5076} {"train_loss": -26.580434799194336, "global_step": 421327, "epoch": 5076} {"train_loss": -26.402450561523438, "global_step": 421328, "epoch": 5076} {"train_loss": -26.868383407592773, "global_step": 421329, "epoch": 5076} {"train_loss": -26.398513793945312, "global_step": 421330, "epoch": 5076} {"train_loss": -26.470935821533203, "global_step": 421331, "epoch": 5076} {"train_loss": -26.596546173095703, "global_step": 421332, "epoch": 5076} {"train_loss": -26.32099723815918, "global_step": 421333, "epoch": 5076} {"train_loss": -26.40394401550293, "global_step": 421334, "epoch": 5076} {"train_loss": -26.6066837310791, "global_step": 421335, "epoch": 5076} {"train_loss": -26.80558204650879, "global_step": 421336, "epoch": 5076} {"train_loss": -26.463546752929688, "global_step": 421337, "epoch": 5076} {"train_loss": -26.984725952148438, "global_step": 421338, "epoch": 5076} {"train_loss": -26.5306339263916, "global_step": 421339, "epoch": 5076} {"train_loss": -27.063446044921875, "global_step": 421340, "epoch": 5076} {"train_loss": -26.754194259643555, "global_step": 421341, "epoch": 5076} {"train_loss": -26.753833770751953, "global_step": 421342, "epoch": 5076} {"train_loss": -27.021772384643555, "global_step": 421343, "epoch": 5076} {"train_loss": -27.226770401000977, "global_step": 421344, "epoch": 5076} {"train_loss": -27.106550216674805, "global_step": 421345, "epoch": 5076} {"train_loss": -26.7808780670166, "global_step": 421346, "epoch": 5076} {"train_loss": -27.032140731811523, "global_step": 421347, "epoch": 5076} {"train_loss": -26.60523796081543, "global_step": 421348, "epoch": 5076} {"train_loss": -27.137502670288086, "global_step": 421349, "epoch": 5076} {"train_loss": -27.047460556030273, "global_step": 421350, "epoch": 5076} {"train_loss": -27.000110626220703, "global_step": 421351, "epoch": 5076} {"train_loss": -27.00876808166504, "global_step": 421352, "epoch": 5076} {"train_loss": -26.701465606689453, "global_step": 421353, "epoch": 5076} {"train_loss": -26.86191749572754, "global_step": 421354, "epoch": 5076} {"train_loss": -26.98147964477539, "global_step": 421355, "epoch": 5076} {"train_loss": -27.042346954345703, "global_step": 421356, "epoch": 5076} {"train_loss": -26.585290908813477, "global_step": 421357, "epoch": 5076} {"train_loss": -27.08064842224121, "global_step": 421358, "epoch": 5076} {"train_loss": -26.619653701782227, "global_step": 421359, "epoch": 5076} {"train_loss": -26.913101196289062, "global_step": 421360, "epoch": 5076} {"train_loss": -27.0161075592041, "global_step": 421361, "epoch": 5076} {"train_loss": -26.511510848999023, "global_step": 421362, "epoch": 5076} {"train_loss": -26.529987335205078, "global_step": 421363, "epoch": 5076} {"train_loss": -26.471784591674805, "global_step": 421364, "epoch": 5076} {"train_loss": -26.3107967376709, "global_step": 421365, "epoch": 5076} {"train_loss": -26.7557315826416, "global_step": 421366, "epoch": 5076} {"train_loss": -26.984704971313477, "global_step": 421367, "epoch": 5076} {"train_loss": -26.787097930908203, "global_step": 421368, "epoch": 5076} {"train_loss": -27.049972534179688, "global_step": 421369, "epoch": 5076} {"train_loss": -26.513660430908203, "global_step": 421370, "epoch": 5076} {"train_loss": -26.461441040039062, "global_step": 421371, "epoch": 5076} {"train_loss": -26.798864364624023, "global_step": 421372, "epoch": 5076} {"train_loss": -26.856420516967773, "global_step": 421373, "epoch": 5076} {"train_loss": -26.813745498657227, "global_step": 421374, "epoch": 5076} {"train_loss": -26.6016902923584, "global_step": 421375, "epoch": 5076} {"train_loss": -26.246612548828125, "global_step": 421376, "epoch": 5076} {"train_loss": -26.26991081237793, "global_step": 421377, "epoch": 5076} {"train_loss": -26.314716339111328, "global_step": 421378, "epoch": 5076} {"train_loss": -26.75469398498535, "global_step": 421379, "epoch": 5076} {"train_loss": -27.028364181518555, "global_step": 421380, "epoch": 5076} {"train_loss": -27.145124435424805, "global_step": 421381, "epoch": 5076} {"train_loss": -26.856454849243164, "global_step": 421382, "epoch": 5076} {"train_loss": -27.01654624938965, "global_step": 421383, "epoch": 5076} {"train_loss": -26.829172134399414, "global_step": 421384, "epoch": 5076} {"train_loss": -26.83294105529785, "global_step": 421385, "epoch": 5076} {"train_loss": -26.81024742126465, "global_step": 421386, "epoch": 5076} {"train_loss": -26.340845108032227, "global_step": 421387, "epoch": 5076} {"train_loss": -26.578641891479492, "global_step": 421388, "epoch": 5076} {"train_loss": -26.827802658081055, "global_step": 421389, "epoch": 5076} {"train_loss": -26.61482420312353, "global_step": 421390, "epoch": 5076, "val_loss": 7068236.0} {"train_loss": -23.720378875732422, "global_step": 421391, "epoch": 5077} {"train_loss": -25.561742782592773, "global_step": 421392, "epoch": 5077} {"train_loss": -25.671789169311523, "global_step": 421393, "epoch": 5077} {"train_loss": -25.131851196289062, "global_step": 421394, "epoch": 5077} {"train_loss": -25.544370651245117, "global_step": 421395, "epoch": 5077} {"train_loss": -25.20402717590332, "global_step": 421396, "epoch": 5077} {"train_loss": -25.572513580322266, "global_step": 421397, "epoch": 5077} {"train_loss": -25.918731689453125, "global_step": 421398, "epoch": 5077} {"train_loss": -25.909759521484375, "global_step": 421399, "epoch": 5077} {"train_loss": -25.909021377563477, "global_step": 421400, "epoch": 5077} {"train_loss": -25.51959228515625, "global_step": 421401, "epoch": 5077} {"train_loss": -25.99628257751465, "global_step": 421402, "epoch": 5077} {"train_loss": -25.669803619384766, "global_step": 421403, "epoch": 5077} {"train_loss": -26.00676918029785, "global_step": 421404, "epoch": 5077} {"train_loss": -25.928058624267578, "global_step": 421405, "epoch": 5077} {"train_loss": -25.9431095123291, "global_step": 421406, "epoch": 5077} {"train_loss": -26.009939193725586, "global_step": 421407, "epoch": 5077} {"train_loss": -25.945816040039062, "global_step": 421408, "epoch": 5077} {"train_loss": -26.12961196899414, "global_step": 421409, "epoch": 5077} {"train_loss": -26.255298614501953, "global_step": 421410, "epoch": 5077} {"train_loss": -26.12652587890625, "global_step": 421411, "epoch": 5077} {"train_loss": -26.046192169189453, "global_step": 421412, "epoch": 5077} {"train_loss": -26.755878448486328, "global_step": 421413, "epoch": 5077} {"train_loss": -26.46038818359375, "global_step": 421414, "epoch": 5077} {"train_loss": -26.026233673095703, "global_step": 421415, "epoch": 5077} {"train_loss": -26.538177490234375, "global_step": 421416, "epoch": 5077} {"train_loss": -26.287267684936523, "global_step": 421417, "epoch": 5077} {"train_loss": -26.705810546875, "global_step": 421418, "epoch": 5077} {"train_loss": -26.66617774963379, "global_step": 421419, "epoch": 5077} {"train_loss": -26.35430335998535, "global_step": 421420, "epoch": 5077} {"train_loss": -26.571537017822266, "global_step": 421421, "epoch": 5077} {"train_loss": -26.629907608032227, "global_step": 421422, "epoch": 5077} {"train_loss": -26.580896377563477, "global_step": 421423, "epoch": 5077} {"train_loss": -26.7230167388916, "global_step": 421424, "epoch": 5077} {"train_loss": -26.621572494506836, "global_step": 421425, "epoch": 5077} {"train_loss": -26.615280151367188, "global_step": 421426, "epoch": 5077} {"train_loss": -26.873998641967773, "global_step": 421427, "epoch": 5077} {"train_loss": -26.970197677612305, "global_step": 421428, "epoch": 5077} {"train_loss": -26.88760757446289, "global_step": 421429, "epoch": 5077} {"train_loss": -27.10837745666504, "global_step": 421430, "epoch": 5077} {"train_loss": -27.04656982421875, "global_step": 421431, "epoch": 5077} {"train_loss": -26.50587272644043, "global_step": 421432, "epoch": 5077} {"train_loss": -26.74822998046875, "global_step": 421433, "epoch": 5077} {"train_loss": -26.316059112548828, "global_step": 421434, "epoch": 5077} {"train_loss": -26.772192001342773, "global_step": 421435, "epoch": 5077} {"train_loss": -26.69879722595215, "global_step": 421436, "epoch": 5077} {"train_loss": -26.84604263305664, "global_step": 421437, "epoch": 5077} {"train_loss": -26.577579498291016, "global_step": 421438, "epoch": 5077} {"train_loss": -26.810230255126953, "global_step": 421439, "epoch": 5077} {"train_loss": -27.275192260742188, "global_step": 421440, "epoch": 5077} {"train_loss": -27.05954933166504, "global_step": 421441, "epoch": 5077} {"train_loss": -26.527862548828125, "global_step": 421442, "epoch": 5077} {"train_loss": -26.696924209594727, "global_step": 421443, "epoch": 5077} {"train_loss": -26.814071655273438, "global_step": 421444, "epoch": 5077} {"train_loss": -26.592573165893555, "global_step": 421445, "epoch": 5077} {"train_loss": -27.1114559173584, "global_step": 421446, "epoch": 5077} {"train_loss": -26.70612144470215, "global_step": 421447, "epoch": 5077} {"train_loss": -27.14459800720215, "global_step": 421448, "epoch": 5077} {"train_loss": -26.926794052124023, "global_step": 421449, "epoch": 5077} {"train_loss": -26.748754501342773, "global_step": 421450, "epoch": 5077} {"train_loss": -27.30523109436035, "global_step": 421451, "epoch": 5077} {"train_loss": -27.138324737548828, "global_step": 421452, "epoch": 5077} {"train_loss": -26.850378036499023, "global_step": 421453, "epoch": 5077} {"train_loss": -27.20985221862793, "global_step": 421454, "epoch": 5077} {"train_loss": -27.11825942993164, "global_step": 421455, "epoch": 5077} {"train_loss": -26.91334342956543, "global_step": 421456, "epoch": 5077} {"train_loss": -26.55793571472168, "global_step": 421457, "epoch": 5077} {"train_loss": -26.820194244384766, "global_step": 421458, "epoch": 5077} {"train_loss": -27.09266471862793, "global_step": 421459, "epoch": 5077} {"train_loss": -27.347341537475586, "global_step": 421460, "epoch": 5077} {"train_loss": -27.161951065063477, "global_step": 421461, "epoch": 5077} {"train_loss": -26.72664451599121, "global_step": 421462, "epoch": 5077} {"train_loss": -26.716947555541992, "global_step": 421463, "epoch": 5077} {"train_loss": -26.499540328979492, "global_step": 421464, "epoch": 5077} {"train_loss": -27.148950576782227, "global_step": 421465, "epoch": 5077} {"train_loss": -26.96030044555664, "global_step": 421466, "epoch": 5077} {"train_loss": -27.038312911987305, "global_step": 421467, "epoch": 5077} {"train_loss": -26.64334487915039, "global_step": 421468, "epoch": 5077} {"train_loss": -27.170917510986328, "global_step": 421469, "epoch": 5077} {"train_loss": -26.70074462890625, "global_step": 421470, "epoch": 5077} {"train_loss": -27.034570693969727, "global_step": 421471, "epoch": 5077} {"train_loss": -27.209033966064453, "global_step": 421472, "epoch": 5077} {"train_loss": -26.526510537388813, "global_step": 421473, "epoch": 5077, "val_loss": 6924366.0} {"train_loss": -26.184467315673828, "global_step": 421474, "epoch": 5078} {"train_loss": -26.092695236206055, "global_step": 421475, "epoch": 5078} {"train_loss": -26.384119033813477, "global_step": 421476, "epoch": 5078} {"train_loss": -25.61863136291504, "global_step": 421477, "epoch": 5078} {"train_loss": -26.158674240112305, "global_step": 421478, "epoch": 5078} {"train_loss": -26.233041763305664, "global_step": 421479, "epoch": 5078} {"train_loss": -26.6833553314209, "global_step": 421480, "epoch": 5078} {"train_loss": -26.608474731445312, "global_step": 421481, "epoch": 5078} {"train_loss": -26.1358642578125, "global_step": 421482, "epoch": 5078} {"train_loss": -26.325214385986328, "global_step": 421483, "epoch": 5078} {"train_loss": -26.44239616394043, "global_step": 421484, "epoch": 5078} {"train_loss": -26.538373947143555, "global_step": 421485, "epoch": 5078} {"train_loss": -26.538843154907227, "global_step": 421486, "epoch": 5078} {"train_loss": -26.30006217956543, "global_step": 421487, "epoch": 5078} {"train_loss": -26.67999839782715, "global_step": 421488, "epoch": 5078} {"train_loss": -26.51099967956543, "global_step": 421489, "epoch": 5078} {"train_loss": -26.661596298217773, "global_step": 421490, "epoch": 5078} {"train_loss": -26.5883846282959, "global_step": 421491, "epoch": 5078} {"train_loss": -26.57159423828125, "global_step": 421492, "epoch": 5078} {"train_loss": -26.899860382080078, "global_step": 421493, "epoch": 5078} {"train_loss": -26.664413452148438, "global_step": 421494, "epoch": 5078} {"train_loss": -26.804920196533203, "global_step": 421495, "epoch": 5078} {"train_loss": -26.81073570251465, "global_step": 421496, "epoch": 5078} {"train_loss": -26.695276260375977, "global_step": 421497, "epoch": 5078} {"train_loss": -26.618738174438477, "global_step": 421498, "epoch": 5078} {"train_loss": -26.807754516601562, "global_step": 421499, "epoch": 5078} {"train_loss": -26.85663414001465, "global_step": 421500, "epoch": 5078} {"train_loss": -26.793012619018555, "global_step": 421501, "epoch": 5078} {"train_loss": -26.859338760375977, "global_step": 421502, "epoch": 5078} {"train_loss": -26.885297775268555, "global_step": 421503, "epoch": 5078} {"train_loss": -26.650903701782227, "global_step": 421504, "epoch": 5078} {"train_loss": -26.396100997924805, "global_step": 421505, "epoch": 5078} {"train_loss": -26.93842124938965, "global_step": 421506, "epoch": 5078} {"train_loss": -26.63860511779785, "global_step": 421507, "epoch": 5078} {"train_loss": -27.165212631225586, "global_step": 421508, "epoch": 5078} {"train_loss": -26.781522750854492, "global_step": 421509, "epoch": 5078} {"train_loss": -26.688861846923828, "global_step": 421510, "epoch": 5078} {"train_loss": -26.646259307861328, "global_step": 421511, "epoch": 5078} {"train_loss": -26.773548126220703, "global_step": 421512, "epoch": 5078} {"train_loss": -26.9266414642334, "global_step": 421513, "epoch": 5078} {"train_loss": -26.763507843017578, "global_step": 421514, "epoch": 5078} {"train_loss": -26.712417602539062, "global_step": 421515, "epoch": 5078} {"train_loss": -26.7568359375, "global_step": 421516, "epoch": 5078} {"train_loss": -26.915332794189453, "global_step": 421517, "epoch": 5078} {"train_loss": -27.070770263671875, "global_step": 421518, "epoch": 5078} {"train_loss": -26.83428382873535, "global_step": 421519, "epoch": 5078} {"train_loss": -27.156803131103516, "global_step": 421520, "epoch": 5078} {"train_loss": -27.25787353515625, "global_step": 421521, "epoch": 5078} {"train_loss": -26.8299560546875, "global_step": 421522, "epoch": 5078} {"train_loss": -26.804548263549805, "global_step": 421523, "epoch": 5078} {"train_loss": -27.062952041625977, "global_step": 421524, "epoch": 5078} {"train_loss": -26.57411003112793, "global_step": 421525, "epoch": 5078} {"train_loss": -27.15036964416504, "global_step": 421526, "epoch": 5078} {"train_loss": -26.870290756225586, "global_step": 421527, "epoch": 5078} {"train_loss": -26.87436866760254, "global_step": 421528, "epoch": 5078} {"train_loss": -26.5692195892334, "global_step": 421529, "epoch": 5078} {"train_loss": -26.11421012878418, "global_step": 421530, "epoch": 5078} {"train_loss": -26.08928871154785, "global_step": 421531, "epoch": 5078} {"train_loss": -26.379257202148438, "global_step": 421532, "epoch": 5078} {"train_loss": -26.6904354095459, "global_step": 421533, "epoch": 5078} {"train_loss": -26.78559684753418, "global_step": 421534, "epoch": 5078} {"train_loss": -26.522687911987305, "global_step": 421535, "epoch": 5078} {"train_loss": -26.698205947875977, "global_step": 421536, "epoch": 5078} {"train_loss": -26.89411735534668, "global_step": 421537, "epoch": 5078} {"train_loss": -26.419809341430664, "global_step": 421538, "epoch": 5078} {"train_loss": -26.716535568237305, "global_step": 421539, "epoch": 5078} {"train_loss": -26.674375534057617, "global_step": 421540, "epoch": 5078} {"train_loss": -26.2012882232666, "global_step": 421541, "epoch": 5078} {"train_loss": -26.702972412109375, "global_step": 421542, "epoch": 5078} {"train_loss": -26.56412696838379, "global_step": 421543, "epoch": 5078} {"train_loss": -26.984237670898438, "global_step": 421544, "epoch": 5078} {"train_loss": -26.59356117248535, "global_step": 421545, "epoch": 5078} {"train_loss": -27.052204132080078, "global_step": 421546, "epoch": 5078} {"train_loss": -27.108783721923828, "global_step": 421547, "epoch": 5078} {"train_loss": -27.048566818237305, "global_step": 421548, "epoch": 5078} {"train_loss": -26.76934814453125, "global_step": 421549, "epoch": 5078} {"train_loss": -27.058679580688477, "global_step": 421550, "epoch": 5078} {"train_loss": -26.994287490844727, "global_step": 421551, "epoch": 5078} {"train_loss": -26.8966064453125, "global_step": 421552, "epoch": 5078} {"train_loss": -27.042938232421875, "global_step": 421553, "epoch": 5078} {"train_loss": -26.653669357299805, "global_step": 421554, "epoch": 5078} {"train_loss": -27.000335693359375, "global_step": 421555, "epoch": 5078} {"train_loss": -26.686165338539215, "global_step": 421556, "epoch": 5078, "val_loss": 6952305.5} {"train_loss": -25.93316650390625, "global_step": 421557, "epoch": 5079} {"train_loss": -25.95586585998535, "global_step": 421558, "epoch": 5079} {"train_loss": -26.567398071289062, "global_step": 421559, "epoch": 5079} {"train_loss": -26.014209747314453, "global_step": 421560, "epoch": 5079} {"train_loss": -26.418161392211914, "global_step": 421561, "epoch": 5079} {"train_loss": -26.513269424438477, "global_step": 421562, "epoch": 5079} {"train_loss": -26.438474655151367, "global_step": 421563, "epoch": 5079} {"train_loss": -26.275928497314453, "global_step": 421564, "epoch": 5079} {"train_loss": -26.487598419189453, "global_step": 421565, "epoch": 5079} {"train_loss": -26.478336334228516, "global_step": 421566, "epoch": 5079} {"train_loss": -26.355243682861328, "global_step": 421567, "epoch": 5079} {"train_loss": -26.599674224853516, "global_step": 421568, "epoch": 5079} {"train_loss": -26.49479103088379, "global_step": 421569, "epoch": 5079} {"train_loss": -26.763540267944336, "global_step": 421570, "epoch": 5079} {"train_loss": -26.873395919799805, "global_step": 421571, "epoch": 5079} {"train_loss": -26.57411003112793, "global_step": 421572, "epoch": 5079} {"train_loss": -26.699005126953125, "global_step": 421573, "epoch": 5079} {"train_loss": -26.811767578125, "global_step": 421574, "epoch": 5079} {"train_loss": -26.53163719177246, "global_step": 421575, "epoch": 5079} {"train_loss": -26.403812408447266, "global_step": 421576, "epoch": 5079} {"train_loss": -26.24365234375, "global_step": 421577, "epoch": 5079} {"train_loss": -26.503381729125977, "global_step": 421578, "epoch": 5079} {"train_loss": -26.29717445373535, "global_step": 421579, "epoch": 5079} {"train_loss": -26.88677406311035, "global_step": 421580, "epoch": 5079} {"train_loss": -26.91727638244629, "global_step": 421581, "epoch": 5079} {"train_loss": -26.44814109802246, "global_step": 421582, "epoch": 5079} {"train_loss": -26.659198760986328, "global_step": 421583, "epoch": 5079} {"train_loss": -26.933395385742188, "global_step": 421584, "epoch": 5079} {"train_loss": -26.610553741455078, "global_step": 421585, "epoch": 5079} {"train_loss": -26.83953857421875, "global_step": 421586, "epoch": 5079} {"train_loss": -26.76385498046875, "global_step": 421587, "epoch": 5079} {"train_loss": -26.696258544921875, "global_step": 421588, "epoch": 5079} {"train_loss": -27.27046012878418, "global_step": 421589, "epoch": 5079} {"train_loss": -26.760122299194336, "global_step": 421590, "epoch": 5079} {"train_loss": -26.587202072143555, "global_step": 421591, "epoch": 5079} {"train_loss": -27.0239200592041, "global_step": 421592, "epoch": 5079} {"train_loss": -26.897809982299805, "global_step": 421593, "epoch": 5079} {"train_loss": -26.90334129333496, "global_step": 421594, "epoch": 5079} {"train_loss": -26.68690299987793, "global_step": 421595, "epoch": 5079} {"train_loss": -26.739133834838867, "global_step": 421596, "epoch": 5079} {"train_loss": -26.882532119750977, "global_step": 421597, "epoch": 5079} {"train_loss": -27.08448600769043, "global_step": 421598, "epoch": 5079} {"train_loss": -27.1616268157959, "global_step": 421599, "epoch": 5079} {"train_loss": -26.950586318969727, "global_step": 421600, "epoch": 5079} {"train_loss": -26.711393356323242, "global_step": 421601, "epoch": 5079} {"train_loss": -26.912641525268555, "global_step": 421602, "epoch": 5079} {"train_loss": -26.738937377929688, "global_step": 421603, "epoch": 5079} {"train_loss": -27.305103302001953, "global_step": 421604, "epoch": 5079} {"train_loss": -27.007980346679688, "global_step": 421605, "epoch": 5079} {"train_loss": -26.685638427734375, "global_step": 421606, "epoch": 5079} {"train_loss": -26.83989906311035, "global_step": 421607, "epoch": 5079} {"train_loss": -26.963977813720703, "global_step": 421608, "epoch": 5079} {"train_loss": -26.74289894104004, "global_step": 421609, "epoch": 5079} {"train_loss": -26.630163192749023, "global_step": 421610, "epoch": 5079} {"train_loss": -26.741186141967773, "global_step": 421611, "epoch": 5079} {"train_loss": -26.30659294128418, "global_step": 421612, "epoch": 5079} {"train_loss": -26.500051498413086, "global_step": 421613, "epoch": 5079} {"train_loss": -26.79279136657715, "global_step": 421614, "epoch": 5079} {"train_loss": -26.439306259155273, "global_step": 421615, "epoch": 5079} {"train_loss": -26.832080841064453, "global_step": 421616, "epoch": 5079} {"train_loss": -26.911090850830078, "global_step": 421617, "epoch": 5079} {"train_loss": -26.351348876953125, "global_step": 421618, "epoch": 5079} {"train_loss": -27.0841007232666, "global_step": 421619, "epoch": 5079} {"train_loss": -26.6142635345459, "global_step": 421620, "epoch": 5079} {"train_loss": -26.50469970703125, "global_step": 421621, "epoch": 5079} {"train_loss": -26.0172176361084, "global_step": 421622, "epoch": 5079} {"train_loss": -26.1763973236084, "global_step": 421623, "epoch": 5079} {"train_loss": -26.613019943237305, "global_step": 421624, "epoch": 5079} {"train_loss": -26.408567428588867, "global_step": 421625, "epoch": 5079} {"train_loss": -25.823083877563477, "global_step": 421626, "epoch": 5079} {"train_loss": -25.89068603515625, "global_step": 421627, "epoch": 5079} {"train_loss": -25.92110252380371, "global_step": 421628, "epoch": 5079} {"train_loss": -26.602313995361328, "global_step": 421629, "epoch": 5079} {"train_loss": -25.954639434814453, "global_step": 421630, "epoch": 5079} {"train_loss": -25.893768310546875, "global_step": 421631, "epoch": 5079} {"train_loss": -26.689640045166016, "global_step": 421632, "epoch": 5079} {"train_loss": -26.187992095947266, "global_step": 421633, "epoch": 5079} {"train_loss": -26.298023223876953, "global_step": 421634, "epoch": 5079} {"train_loss": -26.644977569580078, "global_step": 421635, "epoch": 5079} {"train_loss": -26.874500274658203, "global_step": 421636, "epoch": 5079} {"train_loss": -26.97747230529785, "global_step": 421637, "epoch": 5079} {"train_loss": -26.394617080688477, "global_step": 421638, "epoch": 5079} {"train_loss": -26.59701083079878, "global_step": 421639, "epoch": 5079, "val_loss": 7080613.0} {"train_loss": -26.47452163696289, "global_step": 421640, "epoch": 5080} {"train_loss": -26.24090003967285, "global_step": 421641, "epoch": 5080} {"train_loss": -26.19561195373535, "global_step": 421642, "epoch": 5080} {"train_loss": -25.807086944580078, "global_step": 421643, "epoch": 5080} {"train_loss": -26.143238067626953, "global_step": 421644, "epoch": 5080} {"train_loss": -26.131818771362305, "global_step": 421645, "epoch": 5080} {"train_loss": -26.829492568969727, "global_step": 421646, "epoch": 5080} {"train_loss": -26.513681411743164, "global_step": 421647, "epoch": 5080} {"train_loss": -26.709264755249023, "global_step": 421648, "epoch": 5080} {"train_loss": -26.351346969604492, "global_step": 421649, "epoch": 5080} {"train_loss": -26.499231338500977, "global_step": 421650, "epoch": 5080} {"train_loss": -26.614782333374023, "global_step": 421651, "epoch": 5080} {"train_loss": -26.458221435546875, "global_step": 421652, "epoch": 5080} {"train_loss": -26.228967666625977, "global_step": 421653, "epoch": 5080} {"train_loss": -26.585845947265625, "global_step": 421654, "epoch": 5080} {"train_loss": -26.578723907470703, "global_step": 421655, "epoch": 5080} {"train_loss": -26.635025024414062, "global_step": 421656, "epoch": 5080} {"train_loss": -26.60181999206543, "global_step": 421657, "epoch": 5080} {"train_loss": -26.551685333251953, "global_step": 421658, "epoch": 5080} {"train_loss": -26.59113883972168, "global_step": 421659, "epoch": 5080} {"train_loss": -26.7193603515625, "global_step": 421660, "epoch": 5080} {"train_loss": -26.342065811157227, "global_step": 421661, "epoch": 5080} {"train_loss": -26.38985252380371, "global_step": 421662, "epoch": 5080} {"train_loss": -26.701786041259766, "global_step": 421663, "epoch": 5080} {"train_loss": -26.958892822265625, "global_step": 421664, "epoch": 5080} {"train_loss": -26.712417602539062, "global_step": 421665, "epoch": 5080} {"train_loss": -26.484594345092773, "global_step": 421666, "epoch": 5080} {"train_loss": -26.897451400756836, "global_step": 421667, "epoch": 5080} {"train_loss": -26.625991821289062, "global_step": 421668, "epoch": 5080} {"train_loss": -26.79522132873535, "global_step": 421669, "epoch": 5080} {"train_loss": -26.662412643432617, "global_step": 421670, "epoch": 5080} {"train_loss": -26.96771812438965, "global_step": 421671, "epoch": 5080} {"train_loss": -26.694616317749023, "global_step": 421672, "epoch": 5080} {"train_loss": -26.8466739654541, "global_step": 421673, "epoch": 5080} {"train_loss": -26.94709587097168, "global_step": 421674, "epoch": 5080} {"train_loss": -27.1446533203125, "global_step": 421675, "epoch": 5080} {"train_loss": -26.802947998046875, "global_step": 421676, "epoch": 5080} {"train_loss": -27.004587173461914, "global_step": 421677, "epoch": 5080} {"train_loss": -26.8986759185791, "global_step": 421678, "epoch": 5080} {"train_loss": -26.860401153564453, "global_step": 421679, "epoch": 5080} {"train_loss": -26.765640258789062, "global_step": 421680, "epoch": 5080} {"train_loss": -26.825498580932617, "global_step": 421681, "epoch": 5080} {"train_loss": -26.7783260345459, "global_step": 421682, "epoch": 5080} {"train_loss": -26.673538208007812, "global_step": 421683, "epoch": 5080} {"train_loss": -27.246719360351562, "global_step": 421684, "epoch": 5080} {"train_loss": -27.15513038635254, "global_step": 421685, "epoch": 5080} {"train_loss": -26.920276641845703, "global_step": 421686, "epoch": 5080} {"train_loss": -26.988393783569336, "global_step": 421687, "epoch": 5080} {"train_loss": -27.2103214263916, "global_step": 421688, "epoch": 5080} {"train_loss": -26.907352447509766, "global_step": 421689, "epoch": 5080} {"train_loss": -27.120624542236328, "global_step": 421690, "epoch": 5080} {"train_loss": -27.239431381225586, "global_step": 421691, "epoch": 5080} {"train_loss": -27.01352882385254, "global_step": 421692, "epoch": 5080} {"train_loss": -26.653900146484375, "global_step": 421693, "epoch": 5080} {"train_loss": -26.85970115661621, "global_step": 421694, "epoch": 5080} {"train_loss": -26.84199333190918, "global_step": 421695, "epoch": 5080} {"train_loss": -26.8511962890625, "global_step": 421696, "epoch": 5080} {"train_loss": -27.218183517456055, "global_step": 421697, "epoch": 5080} {"train_loss": -26.45918083190918, "global_step": 421698, "epoch": 5080} {"train_loss": -26.448474884033203, "global_step": 421699, "epoch": 5080} {"train_loss": -26.73600196838379, "global_step": 421700, "epoch": 5080} {"train_loss": -26.625436782836914, "global_step": 421701, "epoch": 5080} {"train_loss": -26.7047119140625, "global_step": 421702, "epoch": 5080} {"train_loss": -26.744184494018555, "global_step": 421703, "epoch": 5080} {"train_loss": -26.9483642578125, "global_step": 421704, "epoch": 5080} {"train_loss": -26.860076904296875, "global_step": 421705, "epoch": 5080} {"train_loss": -26.383737564086914, "global_step": 421706, "epoch": 5080} {"train_loss": -26.824085235595703, "global_step": 421707, "epoch": 5080} {"train_loss": -26.97416114807129, "global_step": 421708, "epoch": 5080} {"train_loss": -26.68928337097168, "global_step": 421709, "epoch": 5080} {"train_loss": -26.991445541381836, "global_step": 421710, "epoch": 5080} {"train_loss": -26.789474487304688, "global_step": 421711, "epoch": 5080} {"train_loss": -26.704450607299805, "global_step": 421712, "epoch": 5080} {"train_loss": -26.498010635375977, "global_step": 421713, "epoch": 5080} {"train_loss": -26.785120010375977, "global_step": 421714, "epoch": 5080} {"train_loss": -26.875396728515625, "global_step": 421715, "epoch": 5080} {"train_loss": -26.944244384765625, "global_step": 421716, "epoch": 5080} {"train_loss": -26.921003341674805, "global_step": 421717, "epoch": 5080} {"train_loss": -27.114959716796875, "global_step": 421718, "epoch": 5080} {"train_loss": -26.717681884765625, "global_step": 421719, "epoch": 5080} {"train_loss": -26.91016960144043, "global_step": 421720, "epoch": 5080} {"train_loss": -26.928863525390625, "global_step": 421721, "epoch": 5080} {"train_loss": -26.72997486160462, "global_step": 421722, "epoch": 5080, "val_loss": 7029712.0} {"train_loss": -25.902374267578125, "global_step": 421723, "epoch": 5081} {"train_loss": -26.167089462280273, "global_step": 421724, "epoch": 5081} {"train_loss": -26.28232192993164, "global_step": 421725, "epoch": 5081} {"train_loss": -26.24617576599121, "global_step": 421726, "epoch": 5081} {"train_loss": -25.5538387298584, "global_step": 421727, "epoch": 5081} {"train_loss": -25.715534210205078, "global_step": 421728, "epoch": 5081} {"train_loss": -26.288501739501953, "global_step": 421729, "epoch": 5081} {"train_loss": -25.705780029296875, "global_step": 421730, "epoch": 5081} {"train_loss": -26.031763076782227, "global_step": 421731, "epoch": 5081} {"train_loss": -26.038984298706055, "global_step": 421732, "epoch": 5081} {"train_loss": -25.872955322265625, "global_step": 421733, "epoch": 5081} {"train_loss": -26.263614654541016, "global_step": 421734, "epoch": 5081} {"train_loss": -26.104345321655273, "global_step": 421735, "epoch": 5081} {"train_loss": -25.98822021484375, "global_step": 421736, "epoch": 5081} {"train_loss": -26.40191078186035, "global_step": 421737, "epoch": 5081} {"train_loss": -26.24176025390625, "global_step": 421738, "epoch": 5081} {"train_loss": -26.364843368530273, "global_step": 421739, "epoch": 5081} {"train_loss": -26.337366104125977, "global_step": 421740, "epoch": 5081} {"train_loss": -26.267358779907227, "global_step": 421741, "epoch": 5081} {"train_loss": -26.646656036376953, "global_step": 421742, "epoch": 5081} {"train_loss": -26.637939453125, "global_step": 421743, "epoch": 5081} {"train_loss": -26.813364028930664, "global_step": 421744, "epoch": 5081} {"train_loss": -26.779565811157227, "global_step": 421745, "epoch": 5081} {"train_loss": -26.561994552612305, "global_step": 421746, "epoch": 5081} {"train_loss": -26.510053634643555, "global_step": 421747, "epoch": 5081} {"train_loss": -26.628820419311523, "global_step": 421748, "epoch": 5081} {"train_loss": -26.5491943359375, "global_step": 421749, "epoch": 5081} {"train_loss": -26.882368087768555, "global_step": 421750, "epoch": 5081} {"train_loss": -26.532379150390625, "global_step": 421751, "epoch": 5081} {"train_loss": -26.820837020874023, "global_step": 421752, "epoch": 5081} {"train_loss": -26.990644454956055, "global_step": 421753, "epoch": 5081} {"train_loss": -27.021345138549805, "global_step": 421754, "epoch": 5081} {"train_loss": -26.856525421142578, "global_step": 421755, "epoch": 5081} {"train_loss": -26.96013832092285, "global_step": 421756, "epoch": 5081} {"train_loss": -26.809219360351562, "global_step": 421757, "epoch": 5081} {"train_loss": -27.0041561126709, "global_step": 421758, "epoch": 5081} {"train_loss": -26.995285034179688, "global_step": 421759, "epoch": 5081} {"train_loss": -26.536605834960938, "global_step": 421760, "epoch": 5081} {"train_loss": -26.90028953552246, "global_step": 421761, "epoch": 5081} {"train_loss": -26.6796875, "global_step": 421762, "epoch": 5081} {"train_loss": -26.714582443237305, "global_step": 421763, "epoch": 5081} {"train_loss": -27.093774795532227, "global_step": 421764, "epoch": 5081} {"train_loss": -26.58075523376465, "global_step": 421765, "epoch": 5081} {"train_loss": -26.83418083190918, "global_step": 421766, "epoch": 5081} {"train_loss": -26.792617797851562, "global_step": 421767, "epoch": 5081} {"train_loss": -26.87786293029785, "global_step": 421768, "epoch": 5081} {"train_loss": -26.873395919799805, "global_step": 421769, "epoch": 5081} {"train_loss": -26.61773681640625, "global_step": 421770, "epoch": 5081} {"train_loss": -27.095691680908203, "global_step": 421771, "epoch": 5081} {"train_loss": -26.6439151763916, "global_step": 421772, "epoch": 5081} {"train_loss": -27.101211547851562, "global_step": 421773, "epoch": 5081} {"train_loss": -26.563894271850586, "global_step": 421774, "epoch": 5081} {"train_loss": -26.83721923828125, "global_step": 421775, "epoch": 5081} {"train_loss": -26.968610763549805, "global_step": 421776, "epoch": 5081} {"train_loss": -26.789306640625, "global_step": 421777, "epoch": 5081} {"train_loss": -26.982624053955078, "global_step": 421778, "epoch": 5081} {"train_loss": -26.92524528503418, "global_step": 421779, "epoch": 5081} {"train_loss": -26.59299659729004, "global_step": 421780, "epoch": 5081} {"train_loss": -26.900705337524414, "global_step": 421781, "epoch": 5081} {"train_loss": -27.017749786376953, "global_step": 421782, "epoch": 5081} {"train_loss": -26.845703125, "global_step": 421783, "epoch": 5081} {"train_loss": -26.882848739624023, "global_step": 421784, "epoch": 5081} {"train_loss": -26.96573829650879, "global_step": 421785, "epoch": 5081} {"train_loss": -26.967435836791992, "global_step": 421786, "epoch": 5081} {"train_loss": -26.958236694335938, "global_step": 421787, "epoch": 5081} {"train_loss": -26.772674560546875, "global_step": 421788, "epoch": 5081} {"train_loss": -26.690204620361328, "global_step": 421789, "epoch": 5081} {"train_loss": -26.4495849609375, "global_step": 421790, "epoch": 5081} {"train_loss": -26.995859146118164, "global_step": 421791, "epoch": 5081} {"train_loss": -26.92275047302246, "global_step": 421792, "epoch": 5081} {"train_loss": -26.488203048706055, "global_step": 421793, "epoch": 5081} {"train_loss": -26.561710357666016, "global_step": 421794, "epoch": 5081} {"train_loss": -26.879352569580078, "global_step": 421795, "epoch": 5081} {"train_loss": -26.702428817749023, "global_step": 421796, "epoch": 5081} {"train_loss": -26.46792984008789, "global_step": 421797, "epoch": 5081} {"train_loss": -26.77939224243164, "global_step": 421798, "epoch": 5081} {"train_loss": -26.581403732299805, "global_step": 421799, "epoch": 5081} {"train_loss": -26.885101318359375, "global_step": 421800, "epoch": 5081} {"train_loss": -26.718891143798828, "global_step": 421801, "epoch": 5081} {"train_loss": -26.688556671142578, "global_step": 421802, "epoch": 5081} {"train_loss": -26.907806396484375, "global_step": 421803, "epoch": 5081} {"train_loss": -26.52982521057129, "global_step": 421804, "epoch": 5081} {"train_loss": -26.62739445789751, "global_step": 421805, "epoch": 5081, "val_loss": 6986377.5} {"train_loss": -26.331207275390625, "global_step": 421806, "epoch": 5082} {"train_loss": -25.4198055267334, "global_step": 421807, "epoch": 5082} {"train_loss": -25.843170166015625, "global_step": 421808, "epoch": 5082} {"train_loss": -26.640836715698242, "global_step": 421809, "epoch": 5082} {"train_loss": -25.685312271118164, "global_step": 421810, "epoch": 5082} {"train_loss": -26.1514835357666, "global_step": 421811, "epoch": 5082} {"train_loss": -26.513721466064453, "global_step": 421812, "epoch": 5082} {"train_loss": -26.104894638061523, "global_step": 421813, "epoch": 5082} {"train_loss": -26.184356689453125, "global_step": 421814, "epoch": 5082} {"train_loss": -25.963056564331055, "global_step": 421815, "epoch": 5082} {"train_loss": -26.595190048217773, "global_step": 421816, "epoch": 5082} {"train_loss": -26.530073165893555, "global_step": 421817, "epoch": 5082} {"train_loss": -26.583677291870117, "global_step": 421818, "epoch": 5082} {"train_loss": -26.207263946533203, "global_step": 421819, "epoch": 5082} {"train_loss": -26.212543487548828, "global_step": 421820, "epoch": 5082} {"train_loss": -26.278385162353516, "global_step": 421821, "epoch": 5082} {"train_loss": -26.646780014038086, "global_step": 421822, "epoch": 5082} {"train_loss": -26.59061622619629, "global_step": 421823, "epoch": 5082} {"train_loss": -26.634479522705078, "global_step": 421824, "epoch": 5082} {"train_loss": -26.503347396850586, "global_step": 421825, "epoch": 5082} {"train_loss": -26.86846923828125, "global_step": 421826, "epoch": 5082} {"train_loss": -26.468555450439453, "global_step": 421827, "epoch": 5082} {"train_loss": -26.606189727783203, "global_step": 421828, "epoch": 5082} {"train_loss": -26.96575927734375, "global_step": 421829, "epoch": 5082} {"train_loss": -26.722793579101562, "global_step": 421830, "epoch": 5082} {"train_loss": -27.04023551940918, "global_step": 421831, "epoch": 5082} {"train_loss": -26.6189022064209, "global_step": 421832, "epoch": 5082} {"train_loss": -26.534875869750977, "global_step": 421833, "epoch": 5082} {"train_loss": -26.589086532592773, "global_step": 421834, "epoch": 5082} {"train_loss": -26.72808837890625, "global_step": 421835, "epoch": 5082} {"train_loss": -26.80817222595215, "global_step": 421836, "epoch": 5082} {"train_loss": -26.83405876159668, "global_step": 421837, "epoch": 5082} {"train_loss": -26.92913246154785, "global_step": 421838, "epoch": 5082} {"train_loss": -26.420896530151367, "global_step": 421839, "epoch": 5082} {"train_loss": -26.546863555908203, "global_step": 421840, "epoch": 5082} {"train_loss": -26.6530818939209, "global_step": 421841, "epoch": 5082} {"train_loss": -26.638517379760742, "global_step": 421842, "epoch": 5082} {"train_loss": -26.806095123291016, "global_step": 421843, "epoch": 5082} {"train_loss": -26.695947647094727, "global_step": 421844, "epoch": 5082} {"train_loss": -27.01541519165039, "global_step": 421845, "epoch": 5082} {"train_loss": -26.878747940063477, "global_step": 421846, "epoch": 5082} {"train_loss": -26.909360885620117, "global_step": 421847, "epoch": 5082} {"train_loss": -26.65862464904785, "global_step": 421848, "epoch": 5082} {"train_loss": -26.86813735961914, "global_step": 421849, "epoch": 5082} {"train_loss": -27.00105094909668, "global_step": 421850, "epoch": 5082} {"train_loss": -26.83209228515625, "global_step": 421851, "epoch": 5082} {"train_loss": -26.77219581604004, "global_step": 421852, "epoch": 5082} {"train_loss": -27.2813777923584, "global_step": 421853, "epoch": 5082} {"train_loss": -26.707061767578125, "global_step": 421854, "epoch": 5082} {"train_loss": -26.859088897705078, "global_step": 421855, "epoch": 5082} {"train_loss": -27.249235153198242, "global_step": 421856, "epoch": 5082} {"train_loss": -26.928009033203125, "global_step": 421857, "epoch": 5082} {"train_loss": -27.169158935546875, "global_step": 421858, "epoch": 5082} {"train_loss": -26.779394149780273, "global_step": 421859, "epoch": 5082} {"train_loss": -26.774444580078125, "global_step": 421860, "epoch": 5082} {"train_loss": -26.478857040405273, "global_step": 421861, "epoch": 5082} {"train_loss": -26.77374267578125, "global_step": 421862, "epoch": 5082} {"train_loss": -26.79570960998535, "global_step": 421863, "epoch": 5082} {"train_loss": -26.544076919555664, "global_step": 421864, "epoch": 5082} {"train_loss": -27.472620010375977, "global_step": 421865, "epoch": 5082} {"train_loss": -27.022226333618164, "global_step": 421866, "epoch": 5082} {"train_loss": -26.946502685546875, "global_step": 421867, "epoch": 5082} {"train_loss": -26.599027633666992, "global_step": 421868, "epoch": 5082} {"train_loss": -26.409948348999023, "global_step": 421869, "epoch": 5082} {"train_loss": -26.640344619750977, "global_step": 421870, "epoch": 5082} {"train_loss": -27.338659286499023, "global_step": 421871, "epoch": 5082} {"train_loss": -26.456220626831055, "global_step": 421872, "epoch": 5082} {"train_loss": -26.574756622314453, "global_step": 421873, "epoch": 5082} {"train_loss": -26.671422958374023, "global_step": 421874, "epoch": 5082} {"train_loss": -27.068817138671875, "global_step": 421875, "epoch": 5082} {"train_loss": -26.22138023376465, "global_step": 421876, "epoch": 5082} {"train_loss": -27.29864501953125, "global_step": 421877, "epoch": 5082} {"train_loss": -26.8660831451416, "global_step": 421878, "epoch": 5082} {"train_loss": -26.765899658203125, "global_step": 421879, "epoch": 5082} {"train_loss": -27.092681884765625, "global_step": 421880, "epoch": 5082} {"train_loss": -26.88014793395996, "global_step": 421881, "epoch": 5082} {"train_loss": -27.110950469970703, "global_step": 421882, "epoch": 5082} {"train_loss": -26.962158203125, "global_step": 421883, "epoch": 5082} {"train_loss": -26.963064193725586, "global_step": 421884, "epoch": 5082} {"train_loss": -27.2021541595459, "global_step": 421885, "epoch": 5082} {"train_loss": -27.0135498046875, "global_step": 421886, "epoch": 5082} {"train_loss": -27.249372482299805, "global_step": 421887, "epoch": 5082} {"train_loss": -26.702681001410426, "global_step": 421888, "epoch": 5082, "val_loss": 7026431.5} {"train_loss": -25.690673828125, "global_step": 421889, "epoch": 5083} {"train_loss": -25.607446670532227, "global_step": 421890, "epoch": 5083} {"train_loss": -26.393293380737305, "global_step": 421891, "epoch": 5083} {"train_loss": -25.956769943237305, "global_step": 421892, "epoch": 5083} {"train_loss": -26.27296257019043, "global_step": 421893, "epoch": 5083} {"train_loss": -26.24407958984375, "global_step": 421894, "epoch": 5083} {"train_loss": -26.636524200439453, "global_step": 421895, "epoch": 5083} {"train_loss": -26.575204849243164, "global_step": 421896, "epoch": 5083} {"train_loss": -26.01800537109375, "global_step": 421897, "epoch": 5083} {"train_loss": -26.2193660736084, "global_step": 421898, "epoch": 5083} {"train_loss": -26.37644386291504, "global_step": 421899, "epoch": 5083} {"train_loss": -26.04876136779785, "global_step": 421900, "epoch": 5083} {"train_loss": -26.559329986572266, "global_step": 421901, "epoch": 5083} {"train_loss": -26.711767196655273, "global_step": 421902, "epoch": 5083} {"train_loss": -26.428424835205078, "global_step": 421903, "epoch": 5083} {"train_loss": -26.6153621673584, "global_step": 421904, "epoch": 5083} {"train_loss": -26.70892906188965, "global_step": 421905, "epoch": 5083} {"train_loss": -26.6765079498291, "global_step": 421906, "epoch": 5083} {"train_loss": -26.608448028564453, "global_step": 421907, "epoch": 5083} {"train_loss": -26.6457576751709, "global_step": 421908, "epoch": 5083} {"train_loss": -26.950515747070312, "global_step": 421909, "epoch": 5083} {"train_loss": -26.7371768951416, "global_step": 421910, "epoch": 5083} {"train_loss": -27.301977157592773, "global_step": 421911, "epoch": 5083} {"train_loss": -27.13229751586914, "global_step": 421912, "epoch": 5083} {"train_loss": -27.306486129760742, "global_step": 421913, "epoch": 5083} {"train_loss": -26.763031005859375, "global_step": 421914, "epoch": 5083} {"train_loss": -27.11128044128418, "global_step": 421915, "epoch": 5083} {"train_loss": -27.058826446533203, "global_step": 421916, "epoch": 5083} {"train_loss": -26.962827682495117, "global_step": 421917, "epoch": 5083} {"train_loss": -26.76919937133789, "global_step": 421918, "epoch": 5083} {"train_loss": -26.864959716796875, "global_step": 421919, "epoch": 5083} {"train_loss": -27.0670223236084, "global_step": 421920, "epoch": 5083} {"train_loss": -26.9803409576416, "global_step": 421921, "epoch": 5083} {"train_loss": -27.061786651611328, "global_step": 421922, "epoch": 5083} {"train_loss": -27.2164249420166, "global_step": 421923, "epoch": 5083} {"train_loss": -27.0156307220459, "global_step": 421924, "epoch": 5083} {"train_loss": -26.6527042388916, "global_step": 421925, "epoch": 5083} {"train_loss": -26.785980224609375, "global_step": 421926, "epoch": 5083} {"train_loss": -26.74114990234375, "global_step": 421927, "epoch": 5083} {"train_loss": -26.71139907836914, "global_step": 421928, "epoch": 5083} {"train_loss": -26.599225997924805, "global_step": 421929, "epoch": 5083} {"train_loss": -26.2979679107666, "global_step": 421930, "epoch": 5083} {"train_loss": -26.505970001220703, "global_step": 421931, "epoch": 5083} {"train_loss": -26.534778594970703, "global_step": 421932, "epoch": 5083} {"train_loss": -27.045541763305664, "global_step": 421933, "epoch": 5083} {"train_loss": -26.454334259033203, "global_step": 421934, "epoch": 5083} {"train_loss": -26.957666397094727, "global_step": 421935, "epoch": 5083} {"train_loss": -27.000730514526367, "global_step": 421936, "epoch": 5083} {"train_loss": -26.8013858795166, "global_step": 421937, "epoch": 5083} {"train_loss": -26.78900146484375, "global_step": 421938, "epoch": 5083} {"train_loss": -26.61701011657715, "global_step": 421939, "epoch": 5083} {"train_loss": -26.63593864440918, "global_step": 421940, "epoch": 5083} {"train_loss": -26.468555450439453, "global_step": 421941, "epoch": 5083} {"train_loss": -26.861047744750977, "global_step": 421942, "epoch": 5083} {"train_loss": -26.612350463867188, "global_step": 421943, "epoch": 5083} {"train_loss": -26.488788604736328, "global_step": 421944, "epoch": 5083} {"train_loss": -26.825366973876953, "global_step": 421945, "epoch": 5083} {"train_loss": -26.82819175720215, "global_step": 421946, "epoch": 5083} {"train_loss": -27.019079208374023, "global_step": 421947, "epoch": 5083} {"train_loss": -27.31806755065918, "global_step": 421948, "epoch": 5083} {"train_loss": -26.86736488342285, "global_step": 421949, "epoch": 5083} {"train_loss": -27.062482833862305, "global_step": 421950, "epoch": 5083} {"train_loss": -26.924482345581055, "global_step": 421951, "epoch": 5083} {"train_loss": -26.853742599487305, "global_step": 421952, "epoch": 5083} {"train_loss": -26.753009796142578, "global_step": 421953, "epoch": 5083} {"train_loss": -27.062612533569336, "global_step": 421954, "epoch": 5083} {"train_loss": -26.55105972290039, "global_step": 421955, "epoch": 5083} {"train_loss": -27.064441680908203, "global_step": 421956, "epoch": 5083} {"train_loss": -26.778244018554688, "global_step": 421957, "epoch": 5083} {"train_loss": -26.709436416625977, "global_step": 421958, "epoch": 5083} {"train_loss": -26.646930694580078, "global_step": 421959, "epoch": 5083} {"train_loss": -26.797773361206055, "global_step": 421960, "epoch": 5083} {"train_loss": -27.10560417175293, "global_step": 421961, "epoch": 5083} {"train_loss": -26.737060546875, "global_step": 421962, "epoch": 5083} {"train_loss": -26.902515411376953, "global_step": 421963, "epoch": 5083} {"train_loss": -26.762439727783203, "global_step": 421964, "epoch": 5083} {"train_loss": -26.808324813842773, "global_step": 421965, "epoch": 5083} {"train_loss": -27.08778953552246, "global_step": 421966, "epoch": 5083} {"train_loss": -27.345911026000977, "global_step": 421967, "epoch": 5083} {"train_loss": -26.604734420776367, "global_step": 421968, "epoch": 5083} {"train_loss": -26.861902236938477, "global_step": 421969, "epoch": 5083} {"train_loss": -27.0328311920166, "global_step": 421970, "epoch": 5083} {"train_loss": -26.739402908876716, "global_step": 421971, "epoch": 5083, "val_loss": 7152536.0} {"train_loss": -26.71821403503418, "global_step": 421972, "epoch": 5084} {"train_loss": -26.066640853881836, "global_step": 421973, "epoch": 5084} {"train_loss": -26.041345596313477, "global_step": 421974, "epoch": 5084} {"train_loss": -26.758325576782227, "global_step": 421975, "epoch": 5084} {"train_loss": -26.16145133972168, "global_step": 421976, "epoch": 5084} {"train_loss": -26.49883460998535, "global_step": 421977, "epoch": 5084} {"train_loss": -26.011280059814453, "global_step": 421978, "epoch": 5084} {"train_loss": -26.3204288482666, "global_step": 421979, "epoch": 5084} {"train_loss": -26.775775909423828, "global_step": 421980, "epoch": 5084} {"train_loss": -26.345632553100586, "global_step": 421981, "epoch": 5084} {"train_loss": -26.444412231445312, "global_step": 421982, "epoch": 5084} {"train_loss": -26.24838638305664, "global_step": 421983, "epoch": 5084} {"train_loss": -26.64984130859375, "global_step": 421984, "epoch": 5084} {"train_loss": -26.754270553588867, "global_step": 421985, "epoch": 5084} {"train_loss": -26.528491973876953, "global_step": 421986, "epoch": 5084} {"train_loss": -26.545185089111328, "global_step": 421987, "epoch": 5084} {"train_loss": -26.31549644470215, "global_step": 421988, "epoch": 5084} {"train_loss": -26.505762100219727, "global_step": 421989, "epoch": 5084} {"train_loss": -26.717361450195312, "global_step": 421990, "epoch": 5084} {"train_loss": -26.805578231811523, "global_step": 421991, "epoch": 5084} {"train_loss": -26.54722023010254, "global_step": 421992, "epoch": 5084} {"train_loss": -26.916452407836914, "global_step": 421993, "epoch": 5084} {"train_loss": -26.5921573638916, "global_step": 421994, "epoch": 5084} {"train_loss": -26.734024047851562, "global_step": 421995, "epoch": 5084} {"train_loss": -26.91715431213379, "global_step": 421996, "epoch": 5084} {"train_loss": -26.639001846313477, "global_step": 421997, "epoch": 5084} {"train_loss": -26.642257690429688, "global_step": 421998, "epoch": 5084} {"train_loss": -26.6223087310791, "global_step": 421999, "epoch": 5084} {"train_loss": -26.76009178161621, "global_step": 422000, "epoch": 5084} {"train_loss": -26.968236923217773, "global_step": 422001, "epoch": 5084} {"train_loss": -26.749597549438477, "global_step": 422002, "epoch": 5084} {"train_loss": -26.396310806274414, "global_step": 422003, "epoch": 5084} {"train_loss": -26.53986930847168, "global_step": 422004, "epoch": 5084} {"train_loss": -26.5106143951416, "global_step": 422005, "epoch": 5084} {"train_loss": -26.600677490234375, "global_step": 422006, "epoch": 5084} {"train_loss": -26.316415786743164, "global_step": 422007, "epoch": 5084} {"train_loss": -26.75795555114746, "global_step": 422008, "epoch": 5084} {"train_loss": -26.843814849853516, "global_step": 422009, "epoch": 5084} {"train_loss": -26.814929962158203, "global_step": 422010, "epoch": 5084} {"train_loss": -26.664325714111328, "global_step": 422011, "epoch": 5084} {"train_loss": -26.745059967041016, "global_step": 422012, "epoch": 5084} {"train_loss": -26.815357208251953, "global_step": 422013, "epoch": 5084} {"train_loss": -26.539228439331055, "global_step": 422014, "epoch": 5084} {"train_loss": -27.20940589904785, "global_step": 422015, "epoch": 5084} {"train_loss": -27.01358985900879, "global_step": 422016, "epoch": 5084} {"train_loss": -26.890613555908203, "global_step": 422017, "epoch": 5084} {"train_loss": -26.729116439819336, "global_step": 422018, "epoch": 5084} {"train_loss": -26.7170352935791, "global_step": 422019, "epoch": 5084} {"train_loss": -26.631513595581055, "global_step": 422020, "epoch": 5084} {"train_loss": -27.0944766998291, "global_step": 422021, "epoch": 5084} {"train_loss": -26.494314193725586, "global_step": 422022, "epoch": 5084} {"train_loss": -26.47490882873535, "global_step": 422023, "epoch": 5084} {"train_loss": -26.16725730895996, "global_step": 422024, "epoch": 5084} {"train_loss": -26.109277725219727, "global_step": 422025, "epoch": 5084} {"train_loss": -26.946979522705078, "global_step": 422026, "epoch": 5084} {"train_loss": -26.648746490478516, "global_step": 422027, "epoch": 5084} {"train_loss": -26.62700843811035, "global_step": 422028, "epoch": 5084} {"train_loss": -26.977567672729492, "global_step": 422029, "epoch": 5084} {"train_loss": -26.725357055664062, "global_step": 422030, "epoch": 5084} {"train_loss": -26.619436264038086, "global_step": 422031, "epoch": 5084} {"train_loss": -26.563024520874023, "global_step": 422032, "epoch": 5084} {"train_loss": -27.300268173217773, "global_step": 422033, "epoch": 5084} {"train_loss": -27.216245651245117, "global_step": 422034, "epoch": 5084} {"train_loss": -26.89422035217285, "global_step": 422035, "epoch": 5084} {"train_loss": -27.229455947875977, "global_step": 422036, "epoch": 5084} {"train_loss": -26.86683464050293, "global_step": 422037, "epoch": 5084} {"train_loss": -26.661508560180664, "global_step": 422038, "epoch": 5084} {"train_loss": -27.263952255249023, "global_step": 422039, "epoch": 5084} {"train_loss": -26.78362464904785, "global_step": 422040, "epoch": 5084} {"train_loss": -27.001386642456055, "global_step": 422041, "epoch": 5084} {"train_loss": -26.6162166595459, "global_step": 422042, "epoch": 5084} {"train_loss": -26.96990394592285, "global_step": 422043, "epoch": 5084} {"train_loss": -27.185148239135742, "global_step": 422044, "epoch": 5084} {"train_loss": -26.77727699279785, "global_step": 422045, "epoch": 5084} {"train_loss": -26.6612491607666, "global_step": 422046, "epoch": 5084} {"train_loss": -27.198057174682617, "global_step": 422047, "epoch": 5084} {"train_loss": -26.69915771484375, "global_step": 422048, "epoch": 5084} {"train_loss": -26.83742332458496, "global_step": 422049, "epoch": 5084} {"train_loss": -26.83575439453125, "global_step": 422050, "epoch": 5084} {"train_loss": -26.576269149780273, "global_step": 422051, "epoch": 5084} {"train_loss": -27.110788345336914, "global_step": 422052, "epoch": 5084} {"train_loss": -26.865921020507812, "global_step": 422053, "epoch": 5084} {"train_loss": -26.692361693784417, "global_step": 422054, "epoch": 5084, "val_loss": 7157515.0} {"train_loss": -26.304086685180664, "global_step": 422055, "epoch": 5085} {"train_loss": -26.202417373657227, "global_step": 422056, "epoch": 5085} {"train_loss": -26.45513916015625, "global_step": 422057, "epoch": 5085} {"train_loss": -26.33025550842285, "global_step": 422058, "epoch": 5085} {"train_loss": -26.332839965820312, "global_step": 422059, "epoch": 5085} {"train_loss": -26.3922061920166, "global_step": 422060, "epoch": 5085} {"train_loss": -25.71735954284668, "global_step": 422061, "epoch": 5085} {"train_loss": -26.284915924072266, "global_step": 422062, "epoch": 5085} {"train_loss": -25.8265380859375, "global_step": 422063, "epoch": 5085} {"train_loss": -26.895212173461914, "global_step": 422064, "epoch": 5085} {"train_loss": -26.32623863220215, "global_step": 422065, "epoch": 5085} {"train_loss": -26.395288467407227, "global_step": 422066, "epoch": 5085} {"train_loss": -26.325851440429688, "global_step": 422067, "epoch": 5085} {"train_loss": -26.443866729736328, "global_step": 422068, "epoch": 5085} {"train_loss": -26.039215087890625, "global_step": 422069, "epoch": 5085} {"train_loss": -26.508075714111328, "global_step": 422070, "epoch": 5085} {"train_loss": -26.620365142822266, "global_step": 422071, "epoch": 5085} {"train_loss": -26.2078857421875, "global_step": 422072, "epoch": 5085} {"train_loss": -26.71194839477539, "global_step": 422073, "epoch": 5085} {"train_loss": -26.60272216796875, "global_step": 422074, "epoch": 5085} {"train_loss": -26.439865112304688, "global_step": 422075, "epoch": 5085} {"train_loss": -26.693710327148438, "global_step": 422076, "epoch": 5085} {"train_loss": -26.78724479675293, "global_step": 422077, "epoch": 5085} {"train_loss": -27.012052536010742, "global_step": 422078, "epoch": 5085} {"train_loss": -26.669198989868164, "global_step": 422079, "epoch": 5085} {"train_loss": -26.9456729888916, "global_step": 422080, "epoch": 5085} {"train_loss": -27.071630477905273, "global_step": 422081, "epoch": 5085} {"train_loss": -26.963132858276367, "global_step": 422082, "epoch": 5085} {"train_loss": -26.543493270874023, "global_step": 422083, "epoch": 5085} {"train_loss": -26.91951560974121, "global_step": 422084, "epoch": 5085} {"train_loss": -26.75909996032715, "global_step": 422085, "epoch": 5085} {"train_loss": -26.85009765625, "global_step": 422086, "epoch": 5085} {"train_loss": -26.924015045166016, "global_step": 422087, "epoch": 5085} {"train_loss": -26.82728385925293, "global_step": 422088, "epoch": 5085} {"train_loss": -26.436660766601562, "global_step": 422089, "epoch": 5085} {"train_loss": -27.018957138061523, "global_step": 422090, "epoch": 5085} {"train_loss": -26.560611724853516, "global_step": 422091, "epoch": 5085} {"train_loss": -26.798480987548828, "global_step": 422092, "epoch": 5085} {"train_loss": -26.6683349609375, "global_step": 422093, "epoch": 5085} {"train_loss": -26.755224227905273, "global_step": 422094, "epoch": 5085} {"train_loss": -27.11886978149414, "global_step": 422095, "epoch": 5085} {"train_loss": -26.801061630249023, "global_step": 422096, "epoch": 5085} {"train_loss": -26.875783920288086, "global_step": 422097, "epoch": 5085} {"train_loss": -26.891254425048828, "global_step": 422098, "epoch": 5085} {"train_loss": -27.164182662963867, "global_step": 422099, "epoch": 5085} {"train_loss": -26.709333419799805, "global_step": 422100, "epoch": 5085} {"train_loss": -26.804914474487305, "global_step": 422101, "epoch": 5085} {"train_loss": -26.87029457092285, "global_step": 422102, "epoch": 5085} {"train_loss": -26.66090202331543, "global_step": 422103, "epoch": 5085} {"train_loss": -26.612384796142578, "global_step": 422104, "epoch": 5085} {"train_loss": -26.5664119720459, "global_step": 422105, "epoch": 5085} {"train_loss": -26.70001220703125, "global_step": 422106, "epoch": 5085} {"train_loss": -26.723508834838867, "global_step": 422107, "epoch": 5085} {"train_loss": -27.31910514831543, "global_step": 422108, "epoch": 5085} {"train_loss": -27.181623458862305, "global_step": 422109, "epoch": 5085} {"train_loss": -26.744604110717773, "global_step": 422110, "epoch": 5085} {"train_loss": -27.183704376220703, "global_step": 422111, "epoch": 5085} {"train_loss": -26.877044677734375, "global_step": 422112, "epoch": 5085} {"train_loss": -26.94353675842285, "global_step": 422113, "epoch": 5085} {"train_loss": -26.830530166625977, "global_step": 422114, "epoch": 5085} {"train_loss": -27.141193389892578, "global_step": 422115, "epoch": 5085} {"train_loss": -27.060094833374023, "global_step": 422116, "epoch": 5085} {"train_loss": -26.990966796875, "global_step": 422117, "epoch": 5085} {"train_loss": -26.871992111206055, "global_step": 422118, "epoch": 5085} {"train_loss": -26.95310401916504, "global_step": 422119, "epoch": 5085} {"train_loss": -26.8206787109375, "global_step": 422120, "epoch": 5085} {"train_loss": -26.947601318359375, "global_step": 422121, "epoch": 5085} {"train_loss": -27.094396591186523, "global_step": 422122, "epoch": 5085} {"train_loss": -26.9089412689209, "global_step": 422123, "epoch": 5085} {"train_loss": -27.152379989624023, "global_step": 422124, "epoch": 5085} {"train_loss": -27.1618595123291, "global_step": 422125, "epoch": 5085} {"train_loss": -27.204465866088867, "global_step": 422126, "epoch": 5085} {"train_loss": -26.632221221923828, "global_step": 422127, "epoch": 5085} {"train_loss": -26.743009567260742, "global_step": 422128, "epoch": 5085} {"train_loss": -26.779523849487305, "global_step": 422129, "epoch": 5085} {"train_loss": -26.84259033203125, "global_step": 422130, "epoch": 5085} {"train_loss": -25.99457359313965, "global_step": 422131, "epoch": 5085} {"train_loss": -24.836896896362305, "global_step": 422132, "epoch": 5085} {"train_loss": -24.47670555114746, "global_step": 422133, "epoch": 5085} {"train_loss": -25.221906661987305, "global_step": 422134, "epoch": 5085} {"train_loss": -26.41330909729004, "global_step": 422135, "epoch": 5085} {"train_loss": -26.014881134033203, "global_step": 422136, "epoch": 5085} {"train_loss": -26.61754350777132, "global_step": 422137, "epoch": 5085, "val_loss": 7160144.0} {"train_loss": -24.64409637451172, "global_step": 422138, "epoch": 5086} {"train_loss": -26.20831871032715, "global_step": 422139, "epoch": 5086} {"train_loss": -25.536828994750977, "global_step": 422140, "epoch": 5086} {"train_loss": -26.390796661376953, "global_step": 422141, "epoch": 5086} {"train_loss": -25.371917724609375, "global_step": 422142, "epoch": 5086} {"train_loss": -25.774194717407227, "global_step": 422143, "epoch": 5086} {"train_loss": -25.5111026763916, "global_step": 422144, "epoch": 5086} {"train_loss": -26.209430694580078, "global_step": 422145, "epoch": 5086} {"train_loss": -25.854084014892578, "global_step": 422146, "epoch": 5086} {"train_loss": -26.38511085510254, "global_step": 422147, "epoch": 5086} {"train_loss": -25.569747924804688, "global_step": 422148, "epoch": 5086} {"train_loss": -26.22279167175293, "global_step": 422149, "epoch": 5086} {"train_loss": -26.052560806274414, "global_step": 422150, "epoch": 5086} {"train_loss": -25.80661392211914, "global_step": 422151, "epoch": 5086} {"train_loss": -26.04345703125, "global_step": 422152, "epoch": 5086} {"train_loss": -26.093835830688477, "global_step": 422153, "epoch": 5086} {"train_loss": -25.9024715423584, "global_step": 422154, "epoch": 5086} {"train_loss": -26.271839141845703, "global_step": 422155, "epoch": 5086} {"train_loss": -26.496978759765625, "global_step": 422156, "epoch": 5086} {"train_loss": -26.564985275268555, "global_step": 422157, "epoch": 5086} {"train_loss": -26.394254684448242, "global_step": 422158, "epoch": 5086} {"train_loss": -26.3122501373291, "global_step": 422159, "epoch": 5086} {"train_loss": -26.493955612182617, "global_step": 422160, "epoch": 5086} {"train_loss": -26.359716415405273, "global_step": 422161, "epoch": 5086} {"train_loss": -26.238752365112305, "global_step": 422162, "epoch": 5086} {"train_loss": -26.652109146118164, "global_step": 422163, "epoch": 5086} {"train_loss": -26.362274169921875, "global_step": 422164, "epoch": 5086} {"train_loss": -26.633804321289062, "global_step": 422165, "epoch": 5086} {"train_loss": -26.53450584411621, "global_step": 422166, "epoch": 5086} {"train_loss": -26.772937774658203, "global_step": 422167, "epoch": 5086} {"train_loss": -26.667272567749023, "global_step": 422168, "epoch": 5086} {"train_loss": -26.780481338500977, "global_step": 422169, "epoch": 5086} {"train_loss": -26.34583854675293, "global_step": 422170, "epoch": 5086} {"train_loss": -26.815710067749023, "global_step": 422171, "epoch": 5086} {"train_loss": -26.77943992614746, "global_step": 422172, "epoch": 5086} {"train_loss": -26.705251693725586, "global_step": 422173, "epoch": 5086} {"train_loss": -26.531103134155273, "global_step": 422174, "epoch": 5086} {"train_loss": -26.833606719970703, "global_step": 422175, "epoch": 5086} {"train_loss": -26.868255615234375, "global_step": 422176, "epoch": 5086} {"train_loss": -26.84132194519043, "global_step": 422177, "epoch": 5086} {"train_loss": -27.06269645690918, "global_step": 422178, "epoch": 5086} {"train_loss": -27.2772274017334, "global_step": 422179, "epoch": 5086} {"train_loss": -26.787450790405273, "global_step": 422180, "epoch": 5086} {"train_loss": -26.927444458007812, "global_step": 422181, "epoch": 5086} {"train_loss": -26.6971378326416, "global_step": 422182, "epoch": 5086} {"train_loss": -27.18507194519043, "global_step": 422183, "epoch": 5086} {"train_loss": -26.763315200805664, "global_step": 422184, "epoch": 5086} {"train_loss": -26.56563377380371, "global_step": 422185, "epoch": 5086} {"train_loss": -26.724414825439453, "global_step": 422186, "epoch": 5086} {"train_loss": -27.004430770874023, "global_step": 422187, "epoch": 5086} {"train_loss": -27.12679100036621, "global_step": 422188, "epoch": 5086} {"train_loss": -27.16096305847168, "global_step": 422189, "epoch": 5086} {"train_loss": -26.957489013671875, "global_step": 422190, "epoch": 5086} {"train_loss": -26.690603256225586, "global_step": 422191, "epoch": 5086} {"train_loss": -27.245380401611328, "global_step": 422192, "epoch": 5086} {"train_loss": -26.805368423461914, "global_step": 422193, "epoch": 5086} {"train_loss": -26.641845703125, "global_step": 422194, "epoch": 5086} {"train_loss": -26.730716705322266, "global_step": 422195, "epoch": 5086} {"train_loss": -26.864667892456055, "global_step": 422196, "epoch": 5086} {"train_loss": -26.522186279296875, "global_step": 422197, "epoch": 5086} {"train_loss": -26.85868263244629, "global_step": 422198, "epoch": 5086} {"train_loss": -27.00343894958496, "global_step": 422199, "epoch": 5086} {"train_loss": -27.318450927734375, "global_step": 422200, "epoch": 5086} {"train_loss": -26.77188491821289, "global_step": 422201, "epoch": 5086} {"train_loss": -26.584726333618164, "global_step": 422202, "epoch": 5086} {"train_loss": -26.74102783203125, "global_step": 422203, "epoch": 5086} {"train_loss": -26.945096969604492, "global_step": 422204, "epoch": 5086} {"train_loss": -27.044172286987305, "global_step": 422205, "epoch": 5086} {"train_loss": -26.755640029907227, "global_step": 422206, "epoch": 5086} {"train_loss": -26.2647762298584, "global_step": 422207, "epoch": 5086} {"train_loss": -26.618762969970703, "global_step": 422208, "epoch": 5086} {"train_loss": -26.753759384155273, "global_step": 422209, "epoch": 5086} {"train_loss": -26.67763328552246, "global_step": 422210, "epoch": 5086} {"train_loss": -26.977630615234375, "global_step": 422211, "epoch": 5086} {"train_loss": -27.035511016845703, "global_step": 422212, "epoch": 5086} {"train_loss": -26.796436309814453, "global_step": 422213, "epoch": 5086} {"train_loss": -26.798093795776367, "global_step": 422214, "epoch": 5086} {"train_loss": -26.49946403503418, "global_step": 422215, "epoch": 5086} {"train_loss": -26.628955841064453, "global_step": 422216, "epoch": 5086} {"train_loss": -26.756006240844727, "global_step": 422217, "epoch": 5086} {"train_loss": -26.66982078552246, "global_step": 422218, "epoch": 5086} {"train_loss": -27.091766357421875, "global_step": 422219, "epoch": 5086} {"train_loss": -26.540472513221832, "global_step": 422220, "epoch": 5086, "val_loss": 7059464.0} {"train_loss": -26.725561141967773, "global_step": 422221, "epoch": 5087} {"train_loss": -26.086395263671875, "global_step": 422222, "epoch": 5087} {"train_loss": -26.519697189331055, "global_step": 422223, "epoch": 5087} {"train_loss": -26.76410484313965, "global_step": 422224, "epoch": 5087} {"train_loss": -26.324705123901367, "global_step": 422225, "epoch": 5087} {"train_loss": -26.3167781829834, "global_step": 422226, "epoch": 5087} {"train_loss": -26.485767364501953, "global_step": 422227, "epoch": 5087} {"train_loss": -26.311237335205078, "global_step": 422228, "epoch": 5087} {"train_loss": -26.487014770507812, "global_step": 422229, "epoch": 5087} {"train_loss": -26.311670303344727, "global_step": 422230, "epoch": 5087} {"train_loss": -26.828229904174805, "global_step": 422231, "epoch": 5087} {"train_loss": -26.47348976135254, "global_step": 422232, "epoch": 5087} {"train_loss": -26.527250289916992, "global_step": 422233, "epoch": 5087} {"train_loss": -26.74134635925293, "global_step": 422234, "epoch": 5087} {"train_loss": -26.6762638092041, "global_step": 422235, "epoch": 5087} {"train_loss": -26.441741943359375, "global_step": 422236, "epoch": 5087} {"train_loss": -26.82828712463379, "global_step": 422237, "epoch": 5087} {"train_loss": -26.800048828125, "global_step": 422238, "epoch": 5087} {"train_loss": -26.612211227416992, "global_step": 422239, "epoch": 5087} {"train_loss": -26.717548370361328, "global_step": 422240, "epoch": 5087} {"train_loss": -26.59234046936035, "global_step": 422241, "epoch": 5087} {"train_loss": -26.619766235351562, "global_step": 422242, "epoch": 5087} {"train_loss": -26.89520835876465, "global_step": 422243, "epoch": 5087} {"train_loss": -26.94550895690918, "global_step": 422244, "epoch": 5087} {"train_loss": -26.850278854370117, "global_step": 422245, "epoch": 5087} {"train_loss": -26.651769638061523, "global_step": 422246, "epoch": 5087} {"train_loss": -26.7023983001709, "global_step": 422247, "epoch": 5087} {"train_loss": -26.91162109375, "global_step": 422248, "epoch": 5087} {"train_loss": -26.5993595123291, "global_step": 422249, "epoch": 5087} {"train_loss": -26.263864517211914, "global_step": 422250, "epoch": 5087} {"train_loss": -26.799728393554688, "global_step": 422251, "epoch": 5087} {"train_loss": -26.888418197631836, "global_step": 422252, "epoch": 5087} {"train_loss": -26.858570098876953, "global_step": 422253, "epoch": 5087} {"train_loss": -26.55743408203125, "global_step": 422254, "epoch": 5087} {"train_loss": -26.8209228515625, "global_step": 422255, "epoch": 5087} {"train_loss": -26.661239624023438, "global_step": 422256, "epoch": 5087} {"train_loss": -26.743453979492188, "global_step": 422257, "epoch": 5087} {"train_loss": -26.76262855529785, "global_step": 422258, "epoch": 5087} {"train_loss": -26.918548583984375, "global_step": 422259, "epoch": 5087} {"train_loss": -26.392139434814453, "global_step": 422260, "epoch": 5087} {"train_loss": -26.7310733795166, "global_step": 422261, "epoch": 5087} {"train_loss": -26.359540939331055, "global_step": 422262, "epoch": 5087} {"train_loss": -27.042367935180664, "global_step": 422263, "epoch": 5087} {"train_loss": -26.6306209564209, "global_step": 422264, "epoch": 5087} {"train_loss": -26.55780029296875, "global_step": 422265, "epoch": 5087} {"train_loss": -27.038375854492188, "global_step": 422266, "epoch": 5087} {"train_loss": -26.462522506713867, "global_step": 422267, "epoch": 5087} {"train_loss": -26.93348503112793, "global_step": 422268, "epoch": 5087} {"train_loss": -26.632165908813477, "global_step": 422269, "epoch": 5087} {"train_loss": -26.769739151000977, "global_step": 422270, "epoch": 5087} {"train_loss": -26.61345863342285, "global_step": 422271, "epoch": 5087} {"train_loss": -27.15695571899414, "global_step": 422272, "epoch": 5087} {"train_loss": -26.914831161499023, "global_step": 422273, "epoch": 5087} {"train_loss": -26.967151641845703, "global_step": 422274, "epoch": 5087} {"train_loss": -26.99016761779785, "global_step": 422275, "epoch": 5087} {"train_loss": -27.056737899780273, "global_step": 422276, "epoch": 5087} {"train_loss": -26.93454933166504, "global_step": 422277, "epoch": 5087} {"train_loss": -27.047086715698242, "global_step": 422278, "epoch": 5087} {"train_loss": -27.08490562438965, "global_step": 422279, "epoch": 5087} {"train_loss": -27.11476707458496, "global_step": 422280, "epoch": 5087} {"train_loss": -27.154340744018555, "global_step": 422281, "epoch": 5087} {"train_loss": -26.922412872314453, "global_step": 422282, "epoch": 5087} {"train_loss": -27.052865982055664, "global_step": 422283, "epoch": 5087} {"train_loss": -27.214252471923828, "global_step": 422284, "epoch": 5087} {"train_loss": -26.99823570251465, "global_step": 422285, "epoch": 5087} {"train_loss": -26.797622680664062, "global_step": 422286, "epoch": 5087} {"train_loss": -27.173009872436523, "global_step": 422287, "epoch": 5087} {"train_loss": -27.006305694580078, "global_step": 422288, "epoch": 5087} {"train_loss": -26.396696090698242, "global_step": 422289, "epoch": 5087} {"train_loss": -26.76338005065918, "global_step": 422290, "epoch": 5087} {"train_loss": -26.324533462524414, "global_step": 422291, "epoch": 5087} {"train_loss": -25.464017868041992, "global_step": 422292, "epoch": 5087} {"train_loss": -26.110767364501953, "global_step": 422293, "epoch": 5087} {"train_loss": -26.59967613220215, "global_step": 422294, "epoch": 5087} {"train_loss": -26.576101303100586, "global_step": 422295, "epoch": 5087} {"train_loss": -26.451181411743164, "global_step": 422296, "epoch": 5087} {"train_loss": -26.659637451171875, "global_step": 422297, "epoch": 5087} {"train_loss": -25.86603355407715, "global_step": 422298, "epoch": 5087} {"train_loss": -26.708120346069336, "global_step": 422299, "epoch": 5087} {"train_loss": -26.57474708557129, "global_step": 422300, "epoch": 5087} {"train_loss": -26.403003692626953, "global_step": 422301, "epoch": 5087} {"train_loss": -26.52362060546875, "global_step": 422302, "epoch": 5087} {"train_loss": -26.68093531964773, "global_step": 422303, "epoch": 5087, "val_loss": 7206906.0} {"train_loss": -24.85038185119629, "global_step": 422304, "epoch": 5088} {"train_loss": -25.1651554107666, "global_step": 422305, "epoch": 5088} {"train_loss": -25.87497329711914, "global_step": 422306, "epoch": 5088} {"train_loss": -25.42954444885254, "global_step": 422307, "epoch": 5088} {"train_loss": -25.88296890258789, "global_step": 422308, "epoch": 5088} {"train_loss": -25.388933181762695, "global_step": 422309, "epoch": 5088} {"train_loss": -26.05156898498535, "global_step": 422310, "epoch": 5088} {"train_loss": -25.647672653198242, "global_step": 422311, "epoch": 5088} {"train_loss": -26.01881217956543, "global_step": 422312, "epoch": 5088} {"train_loss": -25.60028648376465, "global_step": 422313, "epoch": 5088} {"train_loss": -25.91758155822754, "global_step": 422314, "epoch": 5088} {"train_loss": -26.55657958984375, "global_step": 422315, "epoch": 5088} {"train_loss": -25.778905868530273, "global_step": 422316, "epoch": 5088} {"train_loss": -26.71160888671875, "global_step": 422317, "epoch": 5088} {"train_loss": -25.967809677124023, "global_step": 422318, "epoch": 5088} {"train_loss": -26.155179977416992, "global_step": 422319, "epoch": 5088} {"train_loss": -26.164289474487305, "global_step": 422320, "epoch": 5088} {"train_loss": -26.24790382385254, "global_step": 422321, "epoch": 5088} {"train_loss": -26.691131591796875, "global_step": 422322, "epoch": 5088} {"train_loss": -26.304162979125977, "global_step": 422323, "epoch": 5088} {"train_loss": -26.3365421295166, "global_step": 422324, "epoch": 5088} {"train_loss": -26.591806411743164, "global_step": 422325, "epoch": 5088} {"train_loss": -26.437335968017578, "global_step": 422326, "epoch": 5088} {"train_loss": -26.313770294189453, "global_step": 422327, "epoch": 5088} {"train_loss": -26.62006950378418, "global_step": 422328, "epoch": 5088} {"train_loss": -26.55409049987793, "global_step": 422329, "epoch": 5088} {"train_loss": -26.613378524780273, "global_step": 422330, "epoch": 5088} {"train_loss": -26.982004165649414, "global_step": 422331, "epoch": 5088} {"train_loss": -26.60365867614746, "global_step": 422332, "epoch": 5088} {"train_loss": -26.474145889282227, "global_step": 422333, "epoch": 5088} {"train_loss": -26.6734561920166, "global_step": 422334, "epoch": 5088} {"train_loss": -26.84027099609375, "global_step": 422335, "epoch": 5088} {"train_loss": -26.92109489440918, "global_step": 422336, "epoch": 5088} {"train_loss": -26.671499252319336, "global_step": 422337, "epoch": 5088} {"train_loss": -27.128604888916016, "global_step": 422338, "epoch": 5088} {"train_loss": -27.043821334838867, "global_step": 422339, "epoch": 5088} {"train_loss": -26.57826042175293, "global_step": 422340, "epoch": 5088} {"train_loss": -26.84368324279785, "global_step": 422341, "epoch": 5088} {"train_loss": -26.484195709228516, "global_step": 422342, "epoch": 5088} {"train_loss": -26.884464263916016, "global_step": 422343, "epoch": 5088} {"train_loss": -26.72797966003418, "global_step": 422344, "epoch": 5088} {"train_loss": -27.290374755859375, "global_step": 422345, "epoch": 5088} {"train_loss": -27.1134090423584, "global_step": 422346, "epoch": 5088} {"train_loss": -26.833887100219727, "global_step": 422347, "epoch": 5088} {"train_loss": -27.271717071533203, "global_step": 422348, "epoch": 5088} {"train_loss": -26.88179588317871, "global_step": 422349, "epoch": 5088} {"train_loss": -26.6671085357666, "global_step": 422350, "epoch": 5088} {"train_loss": -27.04410743713379, "global_step": 422351, "epoch": 5088} {"train_loss": -27.335172653198242, "global_step": 422352, "epoch": 5088} {"train_loss": -26.77805519104004, "global_step": 422353, "epoch": 5088} {"train_loss": -26.900732040405273, "global_step": 422354, "epoch": 5088} {"train_loss": -26.958789825439453, "global_step": 422355, "epoch": 5088} {"train_loss": -26.9672908782959, "global_step": 422356, "epoch": 5088} {"train_loss": -26.6738224029541, "global_step": 422357, "epoch": 5088} {"train_loss": -26.648563385009766, "global_step": 422358, "epoch": 5088} {"train_loss": -26.97187614440918, "global_step": 422359, "epoch": 5088} {"train_loss": -26.720312118530273, "global_step": 422360, "epoch": 5088} {"train_loss": -26.7658748626709, "global_step": 422361, "epoch": 5088} {"train_loss": -27.299497604370117, "global_step": 422362, "epoch": 5088} {"train_loss": -26.764057159423828, "global_step": 422363, "epoch": 5088} {"train_loss": -26.95692253112793, "global_step": 422364, "epoch": 5088} {"train_loss": -26.679655075073242, "global_step": 422365, "epoch": 5088} {"train_loss": -27.004362106323242, "global_step": 422366, "epoch": 5088} {"train_loss": -26.72627067565918, "global_step": 422367, "epoch": 5088} {"train_loss": -26.892215728759766, "global_step": 422368, "epoch": 5088} {"train_loss": -26.486480712890625, "global_step": 422369, "epoch": 5088} {"train_loss": -26.698455810546875, "global_step": 422370, "epoch": 5088} {"train_loss": -26.856292724609375, "global_step": 422371, "epoch": 5088} {"train_loss": -26.735395431518555, "global_step": 422372, "epoch": 5088} {"train_loss": -26.937580108642578, "global_step": 422373, "epoch": 5088} {"train_loss": -26.650522232055664, "global_step": 422374, "epoch": 5088} {"train_loss": -26.67226219177246, "global_step": 422375, "epoch": 5088} {"train_loss": -26.54363441467285, "global_step": 422376, "epoch": 5088} {"train_loss": -26.828556060791016, "global_step": 422377, "epoch": 5088} {"train_loss": -26.379596710205078, "global_step": 422378, "epoch": 5088} {"train_loss": -26.907089233398438, "global_step": 422379, "epoch": 5088} {"train_loss": -26.382434844970703, "global_step": 422380, "epoch": 5088} {"train_loss": -26.91824722290039, "global_step": 422381, "epoch": 5088} {"train_loss": -26.9186954498291, "global_step": 422382, "epoch": 5088} {"train_loss": -26.398284912109375, "global_step": 422383, "epoch": 5088} {"train_loss": -26.48947525024414, "global_step": 422384, "epoch": 5088} {"train_loss": -26.518247604370117, "global_step": 422385, "epoch": 5088} {"train_loss": -26.564749108739647, "global_step": 422386, "epoch": 5088, "val_loss": 6989075.0} {"train_loss": -26.377790451049805, "global_step": 422387, "epoch": 5089} {"train_loss": -27.0225772857666, "global_step": 422388, "epoch": 5089} {"train_loss": -26.704553604125977, "global_step": 422389, "epoch": 5089} {"train_loss": -26.139892578125, "global_step": 422390, "epoch": 5089} {"train_loss": -26.748504638671875, "global_step": 422391, "epoch": 5089} {"train_loss": -26.49714469909668, "global_step": 422392, "epoch": 5089} {"train_loss": -26.532636642456055, "global_step": 422393, "epoch": 5089} {"train_loss": -26.613632202148438, "global_step": 422394, "epoch": 5089} {"train_loss": -26.625818252563477, "global_step": 422395, "epoch": 5089} {"train_loss": -26.418109893798828, "global_step": 422396, "epoch": 5089} {"train_loss": -26.80377197265625, "global_step": 422397, "epoch": 5089} {"train_loss": -26.732147216796875, "global_step": 422398, "epoch": 5089} {"train_loss": -26.992406845092773, "global_step": 422399, "epoch": 5089} {"train_loss": -26.798810958862305, "global_step": 422400, "epoch": 5089} {"train_loss": -26.684885025024414, "global_step": 422401, "epoch": 5089} {"train_loss": -26.58741569519043, "global_step": 422402, "epoch": 5089} {"train_loss": -26.9240779876709, "global_step": 422403, "epoch": 5089} {"train_loss": -26.94573974609375, "global_step": 422404, "epoch": 5089} {"train_loss": -26.614303588867188, "global_step": 422405, "epoch": 5089} {"train_loss": -26.966474533081055, "global_step": 422406, "epoch": 5089} {"train_loss": -26.687458038330078, "global_step": 422407, "epoch": 5089} {"train_loss": -27.381793975830078, "global_step": 422408, "epoch": 5089} {"train_loss": -26.95342445373535, "global_step": 422409, "epoch": 5089} {"train_loss": -26.70057487487793, "global_step": 422410, "epoch": 5089} {"train_loss": -27.17774772644043, "global_step": 422411, "epoch": 5089} {"train_loss": -26.592145919799805, "global_step": 422412, "epoch": 5089} {"train_loss": -26.64739990234375, "global_step": 422413, "epoch": 5089} {"train_loss": -26.53411865234375, "global_step": 422414, "epoch": 5089} {"train_loss": -26.950214385986328, "global_step": 422415, "epoch": 5089} {"train_loss": -26.904132843017578, "global_step": 422416, "epoch": 5089} {"train_loss": -26.76765251159668, "global_step": 422417, "epoch": 5089} {"train_loss": -27.105649948120117, "global_step": 422418, "epoch": 5089} {"train_loss": -26.920438766479492, "global_step": 422419, "epoch": 5089} {"train_loss": -26.930362701416016, "global_step": 422420, "epoch": 5089} {"train_loss": -26.59518814086914, "global_step": 422421, "epoch": 5089} {"train_loss": -26.924640655517578, "global_step": 422422, "epoch": 5089} {"train_loss": -26.74332618713379, "global_step": 422423, "epoch": 5089} {"train_loss": -27.110626220703125, "global_step": 422424, "epoch": 5089} {"train_loss": -27.0450496673584, "global_step": 422425, "epoch": 5089} {"train_loss": -27.05731773376465, "global_step": 422426, "epoch": 5089} {"train_loss": -27.082977294921875, "global_step": 422427, "epoch": 5089} {"train_loss": -26.68976402282715, "global_step": 422428, "epoch": 5089} {"train_loss": -27.172330856323242, "global_step": 422429, "epoch": 5089} {"train_loss": -27.379749298095703, "global_step": 422430, "epoch": 5089} {"train_loss": -27.250333786010742, "global_step": 422431, "epoch": 5089} {"train_loss": -27.163070678710938, "global_step": 422432, "epoch": 5089} {"train_loss": -26.813507080078125, "global_step": 422433, "epoch": 5089} {"train_loss": -26.939319610595703, "global_step": 422434, "epoch": 5089} {"train_loss": -26.715269088745117, "global_step": 422435, "epoch": 5089} {"train_loss": -26.989501953125, "global_step": 422436, "epoch": 5089} {"train_loss": -26.692407608032227, "global_step": 422437, "epoch": 5089} {"train_loss": -26.36786460876465, "global_step": 422438, "epoch": 5089} {"train_loss": -26.933401107788086, "global_step": 422439, "epoch": 5089} {"train_loss": -26.794921875, "global_step": 422440, "epoch": 5089} {"train_loss": -26.597089767456055, "global_step": 422441, "epoch": 5089} {"train_loss": -26.59348487854004, "global_step": 422442, "epoch": 5089} {"train_loss": -26.89326286315918, "global_step": 422443, "epoch": 5089} {"train_loss": -27.156787872314453, "global_step": 422444, "epoch": 5089} {"train_loss": -27.282148361206055, "global_step": 422445, "epoch": 5089} {"train_loss": -26.787397384643555, "global_step": 422446, "epoch": 5089} {"train_loss": -26.983373641967773, "global_step": 422447, "epoch": 5089} {"train_loss": -26.741153717041016, "global_step": 422448, "epoch": 5089} {"train_loss": -26.416797637939453, "global_step": 422449, "epoch": 5089} {"train_loss": -26.700397491455078, "global_step": 422450, "epoch": 5089} {"train_loss": -26.635156631469727, "global_step": 422451, "epoch": 5089} {"train_loss": -27.017065048217773, "global_step": 422452, "epoch": 5089} {"train_loss": -26.83868980407715, "global_step": 422453, "epoch": 5089} {"train_loss": -26.821395874023438, "global_step": 422454, "epoch": 5089} {"train_loss": -27.078638076782227, "global_step": 422455, "epoch": 5089} {"train_loss": -26.82708740234375, "global_step": 422456, "epoch": 5089} {"train_loss": -26.679357528686523, "global_step": 422457, "epoch": 5089} {"train_loss": -27.146942138671875, "global_step": 422458, "epoch": 5089} {"train_loss": -26.80340576171875, "global_step": 422459, "epoch": 5089} {"train_loss": -27.167402267456055, "global_step": 422460, "epoch": 5089} {"train_loss": -27.039892196655273, "global_step": 422461, "epoch": 5089} {"train_loss": -27.077550888061523, "global_step": 422462, "epoch": 5089} {"train_loss": -27.200796127319336, "global_step": 422463, "epoch": 5089} {"train_loss": -26.72963523864746, "global_step": 422464, "epoch": 5089} {"train_loss": -26.5153751373291, "global_step": 422465, "epoch": 5089} {"train_loss": -26.76334571838379, "global_step": 422466, "epoch": 5089} {"train_loss": -26.29911231994629, "global_step": 422467, "epoch": 5089} {"train_loss": -26.449934005737305, "global_step": 422468, "epoch": 5089} {"train_loss": -26.830023478312665, "global_step": 422469, "epoch": 5089, "val_loss": 7213742.0} {"train_loss": -26.65851402282715, "global_step": 422470, "epoch": 5090} {"train_loss": -25.889806747436523, "global_step": 422471, "epoch": 5090} {"train_loss": -26.17988395690918, "global_step": 422472, "epoch": 5090} {"train_loss": -26.127323150634766, "global_step": 422473, "epoch": 5090} {"train_loss": -25.873550415039062, "global_step": 422474, "epoch": 5090} {"train_loss": -25.97919273376465, "global_step": 422475, "epoch": 5090} {"train_loss": -26.118701934814453, "global_step": 422476, "epoch": 5090} {"train_loss": -26.097171783447266, "global_step": 422477, "epoch": 5090} {"train_loss": -26.385257720947266, "global_step": 422478, "epoch": 5090} {"train_loss": -26.432891845703125, "global_step": 422479, "epoch": 5090} {"train_loss": -25.977651596069336, "global_step": 422480, "epoch": 5090} {"train_loss": -26.111753463745117, "global_step": 422481, "epoch": 5090} {"train_loss": -26.20538902282715, "global_step": 422482, "epoch": 5090} {"train_loss": -26.467275619506836, "global_step": 422483, "epoch": 5090} {"train_loss": -26.110666275024414, "global_step": 422484, "epoch": 5090} {"train_loss": -26.36945152282715, "global_step": 422485, "epoch": 5090} {"train_loss": -26.1368408203125, "global_step": 422486, "epoch": 5090} {"train_loss": -26.253843307495117, "global_step": 422487, "epoch": 5090} {"train_loss": -26.053373336791992, "global_step": 422488, "epoch": 5090} {"train_loss": -26.4838809967041, "global_step": 422489, "epoch": 5090} {"train_loss": -26.037979125976562, "global_step": 422490, "epoch": 5090} {"train_loss": -26.578754425048828, "global_step": 422491, "epoch": 5090} {"train_loss": -26.82573890686035, "global_step": 422492, "epoch": 5090} {"train_loss": -26.667539596557617, "global_step": 422493, "epoch": 5090} {"train_loss": -26.470144271850586, "global_step": 422494, "epoch": 5090} {"train_loss": -26.578125, "global_step": 422495, "epoch": 5090} {"train_loss": -26.45322036743164, "global_step": 422496, "epoch": 5090} {"train_loss": -26.807462692260742, "global_step": 422497, "epoch": 5090} {"train_loss": -26.623388290405273, "global_step": 422498, "epoch": 5090} {"train_loss": -26.651472091674805, "global_step": 422499, "epoch": 5090} {"train_loss": -26.47234535217285, "global_step": 422500, "epoch": 5090} {"train_loss": -26.78736686706543, "global_step": 422501, "epoch": 5090} {"train_loss": -26.596546173095703, "global_step": 422502, "epoch": 5090} {"train_loss": -26.66119384765625, "global_step": 422503, "epoch": 5090} {"train_loss": -26.1118106842041, "global_step": 422504, "epoch": 5090} {"train_loss": -27.1397647857666, "global_step": 422505, "epoch": 5090} {"train_loss": -26.834442138671875, "global_step": 422506, "epoch": 5090} {"train_loss": -26.557209014892578, "global_step": 422507, "epoch": 5090} {"train_loss": -26.92828941345215, "global_step": 422508, "epoch": 5090} {"train_loss": -26.648040771484375, "global_step": 422509, "epoch": 5090} {"train_loss": -26.708322525024414, "global_step": 422510, "epoch": 5090} {"train_loss": -26.836530685424805, "global_step": 422511, "epoch": 5090} {"train_loss": -27.227563858032227, "global_step": 422512, "epoch": 5090} {"train_loss": -26.97724723815918, "global_step": 422513, "epoch": 5090} {"train_loss": -26.987417221069336, "global_step": 422514, "epoch": 5090} {"train_loss": -26.800495147705078, "global_step": 422515, "epoch": 5090} {"train_loss": -27.12335777282715, "global_step": 422516, "epoch": 5090} {"train_loss": -26.34303092956543, "global_step": 422517, "epoch": 5090} {"train_loss": -26.639636993408203, "global_step": 422518, "epoch": 5090} {"train_loss": -26.495580673217773, "global_step": 422519, "epoch": 5090} {"train_loss": -26.476593017578125, "global_step": 422520, "epoch": 5090} {"train_loss": -27.1070613861084, "global_step": 422521, "epoch": 5090} {"train_loss": -27.205480575561523, "global_step": 422522, "epoch": 5090} {"train_loss": -26.7551326751709, "global_step": 422523, "epoch": 5090} {"train_loss": -26.599994659423828, "global_step": 422524, "epoch": 5090} {"train_loss": -26.54775047302246, "global_step": 422525, "epoch": 5090} {"train_loss": -26.81260108947754, "global_step": 422526, "epoch": 5090} {"train_loss": -26.712194442749023, "global_step": 422527, "epoch": 5090} {"train_loss": -26.59097671508789, "global_step": 422528, "epoch": 5090} {"train_loss": -26.78899574279785, "global_step": 422529, "epoch": 5090} {"train_loss": -26.765676498413086, "global_step": 422530, "epoch": 5090} {"train_loss": -26.592695236206055, "global_step": 422531, "epoch": 5090} {"train_loss": -26.761260986328125, "global_step": 422532, "epoch": 5090} {"train_loss": -26.76287841796875, "global_step": 422533, "epoch": 5090} {"train_loss": -26.85190773010254, "global_step": 422534, "epoch": 5090} {"train_loss": -26.463623046875, "global_step": 422535, "epoch": 5090} {"train_loss": -26.565139770507812, "global_step": 422536, "epoch": 5090} {"train_loss": -26.577356338500977, "global_step": 422537, "epoch": 5090} {"train_loss": -26.8048095703125, "global_step": 422538, "epoch": 5090} {"train_loss": -26.55499267578125, "global_step": 422539, "epoch": 5090} {"train_loss": -26.303241729736328, "global_step": 422540, "epoch": 5090} {"train_loss": -26.59864616394043, "global_step": 422541, "epoch": 5090} {"train_loss": -27.056867599487305, "global_step": 422542, "epoch": 5090} {"train_loss": -26.544721603393555, "global_step": 422543, "epoch": 5090} {"train_loss": -26.539752960205078, "global_step": 422544, "epoch": 5090} {"train_loss": -26.524097442626953, "global_step": 422545, "epoch": 5090} {"train_loss": -26.644195556640625, "global_step": 422546, "epoch": 5090} {"train_loss": -26.50189781188965, "global_step": 422547, "epoch": 5090} {"train_loss": -26.685632705688477, "global_step": 422548, "epoch": 5090} {"train_loss": -26.513782501220703, "global_step": 422549, "epoch": 5090} {"train_loss": -26.933584213256836, "global_step": 422550, "epoch": 5090} {"train_loss": -26.686002731323242, "global_step": 422551, "epoch": 5090} {"train_loss": -26.555708069399177, "global_step": 422552, "epoch": 5090, "val_loss": 7107212.0} {"train_loss": -26.029081344604492, "global_step": 422553, "epoch": 5091} {"train_loss": -26.31499671936035, "global_step": 422554, "epoch": 5091} {"train_loss": -26.523466110229492, "global_step": 422555, "epoch": 5091} {"train_loss": -26.406335830688477, "global_step": 422556, "epoch": 5091} {"train_loss": -26.39695167541504, "global_step": 422557, "epoch": 5091} {"train_loss": -26.361560821533203, "global_step": 422558, "epoch": 5091} {"train_loss": -26.52326011657715, "global_step": 422559, "epoch": 5091} {"train_loss": -26.699405670166016, "global_step": 422560, "epoch": 5091} {"train_loss": -26.399932861328125, "global_step": 422561, "epoch": 5091} {"train_loss": -26.81937026977539, "global_step": 422562, "epoch": 5091} {"train_loss": -26.221759796142578, "global_step": 422563, "epoch": 5091} {"train_loss": -26.6934757232666, "global_step": 422564, "epoch": 5091} {"train_loss": -26.252660751342773, "global_step": 422565, "epoch": 5091} {"train_loss": -26.51356315612793, "global_step": 422566, "epoch": 5091} {"train_loss": -26.571231842041016, "global_step": 422567, "epoch": 5091} {"train_loss": -26.5823917388916, "global_step": 422568, "epoch": 5091} {"train_loss": -26.53119468688965, "global_step": 422569, "epoch": 5091} {"train_loss": -26.39155387878418, "global_step": 422570, "epoch": 5091} {"train_loss": -26.73150062561035, "global_step": 422571, "epoch": 5091} {"train_loss": -26.47149658203125, "global_step": 422572, "epoch": 5091} {"train_loss": -26.939233779907227, "global_step": 422573, "epoch": 5091} {"train_loss": -26.579273223876953, "global_step": 422574, "epoch": 5091} {"train_loss": -26.759130477905273, "global_step": 422575, "epoch": 5091} {"train_loss": -26.582355499267578, "global_step": 422576, "epoch": 5091} {"train_loss": -26.6986026763916, "global_step": 422577, "epoch": 5091} {"train_loss": -27.07284927368164, "global_step": 422578, "epoch": 5091} {"train_loss": -26.981287002563477, "global_step": 422579, "epoch": 5091} {"train_loss": -26.70722007751465, "global_step": 422580, "epoch": 5091} {"train_loss": -27.089401245117188, "global_step": 422581, "epoch": 5091} {"train_loss": -27.078033447265625, "global_step": 422582, "epoch": 5091} {"train_loss": -26.760211944580078, "global_step": 422583, "epoch": 5091} {"train_loss": -26.8946590423584, "global_step": 422584, "epoch": 5091} {"train_loss": -26.500547409057617, "global_step": 422585, "epoch": 5091} {"train_loss": -26.47295570373535, "global_step": 422586, "epoch": 5091} {"train_loss": -26.764617919921875, "global_step": 422587, "epoch": 5091} {"train_loss": -26.708282470703125, "global_step": 422588, "epoch": 5091} {"train_loss": -26.938032150268555, "global_step": 422589, "epoch": 5091} {"train_loss": -27.016626358032227, "global_step": 422590, "epoch": 5091} {"train_loss": -27.058197021484375, "global_step": 422591, "epoch": 5091} {"train_loss": -26.90644645690918, "global_step": 422592, "epoch": 5091} {"train_loss": -27.187259674072266, "global_step": 422593, "epoch": 5091} {"train_loss": -27.154809951782227, "global_step": 422594, "epoch": 5091} {"train_loss": -27.147184371948242, "global_step": 422595, "epoch": 5091} {"train_loss": -27.050382614135742, "global_step": 422596, "epoch": 5091} {"train_loss": -27.24560546875, "global_step": 422597, "epoch": 5091} {"train_loss": -27.120153427124023, "global_step": 422598, "epoch": 5091} {"train_loss": -27.19795799255371, "global_step": 422599, "epoch": 5091} {"train_loss": -26.9679012298584, "global_step": 422600, "epoch": 5091} {"train_loss": -27.218353271484375, "global_step": 422601, "epoch": 5091} {"train_loss": -27.04950523376465, "global_step": 422602, "epoch": 5091} {"train_loss": -26.937055587768555, "global_step": 422603, "epoch": 5091} {"train_loss": -26.81873893737793, "global_step": 422604, "epoch": 5091} {"train_loss": -26.471527099609375, "global_step": 422605, "epoch": 5091} {"train_loss": -26.465412139892578, "global_step": 422606, "epoch": 5091} {"train_loss": -27.198694229125977, "global_step": 422607, "epoch": 5091} {"train_loss": -26.9738712310791, "global_step": 422608, "epoch": 5091} {"train_loss": -26.9754695892334, "global_step": 422609, "epoch": 5091} {"train_loss": -26.724782943725586, "global_step": 422610, "epoch": 5091} {"train_loss": -26.790679931640625, "global_step": 422611, "epoch": 5091} {"train_loss": -26.205219268798828, "global_step": 422612, "epoch": 5091} {"train_loss": -26.187955856323242, "global_step": 422613, "epoch": 5091} {"train_loss": -26.423139572143555, "global_step": 422614, "epoch": 5091} {"train_loss": -26.93096923828125, "global_step": 422615, "epoch": 5091} {"train_loss": -26.478830337524414, "global_step": 422616, "epoch": 5091} {"train_loss": -26.645553588867188, "global_step": 422617, "epoch": 5091} {"train_loss": -26.683807373046875, "global_step": 422618, "epoch": 5091} {"train_loss": -26.569976806640625, "global_step": 422619, "epoch": 5091} {"train_loss": -27.126346588134766, "global_step": 422620, "epoch": 5091} {"train_loss": -26.670459747314453, "global_step": 422621, "epoch": 5091} {"train_loss": -26.424375534057617, "global_step": 422622, "epoch": 5091} {"train_loss": -26.599380493164062, "global_step": 422623, "epoch": 5091} {"train_loss": -26.965805053710938, "global_step": 422624, "epoch": 5091} {"train_loss": -27.025114059448242, "global_step": 422625, "epoch": 5091} {"train_loss": -26.756193161010742, "global_step": 422626, "epoch": 5091} {"train_loss": -26.944990158081055, "global_step": 422627, "epoch": 5091} {"train_loss": -26.844989776611328, "global_step": 422628, "epoch": 5091} {"train_loss": -26.66179847717285, "global_step": 422629, "epoch": 5091} {"train_loss": -27.03908348083496, "global_step": 422630, "epoch": 5091} {"train_loss": -26.591474533081055, "global_step": 422631, "epoch": 5091} {"train_loss": -27.05653953552246, "global_step": 422632, "epoch": 5091} {"train_loss": -26.941694259643555, "global_step": 422633, "epoch": 5091} {"train_loss": -26.8795108795166, "global_step": 422634, "epoch": 5091} {"train_loss": -26.742526801235705, "global_step": 422635, "epoch": 5091, "val_loss": 7145097.0} {"train_loss": -25.808670043945312, "global_step": 422636, "epoch": 5092} {"train_loss": -26.223255157470703, "global_step": 422637, "epoch": 5092} {"train_loss": -26.352697372436523, "global_step": 422638, "epoch": 5092} {"train_loss": -25.859073638916016, "global_step": 422639, "epoch": 5092} {"train_loss": -26.362695693969727, "global_step": 422640, "epoch": 5092} {"train_loss": -26.508459091186523, "global_step": 422641, "epoch": 5092} {"train_loss": -25.981855392456055, "global_step": 422642, "epoch": 5092} {"train_loss": -26.33169937133789, "global_step": 422643, "epoch": 5092} {"train_loss": -26.3748779296875, "global_step": 422644, "epoch": 5092} {"train_loss": -26.74580192565918, "global_step": 422645, "epoch": 5092} {"train_loss": -26.5079288482666, "global_step": 422646, "epoch": 5092} {"train_loss": -26.415319442749023, "global_step": 422647, "epoch": 5092} {"train_loss": -26.77948570251465, "global_step": 422648, "epoch": 5092} {"train_loss": -26.42274284362793, "global_step": 422649, "epoch": 5092} {"train_loss": -26.297895431518555, "global_step": 422650, "epoch": 5092} {"train_loss": -27.103452682495117, "global_step": 422651, "epoch": 5092} {"train_loss": -26.402524948120117, "global_step": 422652, "epoch": 5092} {"train_loss": -27.195343017578125, "global_step": 422653, "epoch": 5092} {"train_loss": -26.560760498046875, "global_step": 422654, "epoch": 5092} {"train_loss": -26.705291748046875, "global_step": 422655, "epoch": 5092} {"train_loss": -27.31049919128418, "global_step": 422656, "epoch": 5092} {"train_loss": -26.73781394958496, "global_step": 422657, "epoch": 5092} {"train_loss": -26.81251335144043, "global_step": 422658, "epoch": 5092} {"train_loss": -26.91765785217285, "global_step": 422659, "epoch": 5092} {"train_loss": -26.479211807250977, "global_step": 422660, "epoch": 5092} {"train_loss": -26.71099853515625, "global_step": 422661, "epoch": 5092} {"train_loss": -26.913745880126953, "global_step": 422662, "epoch": 5092} {"train_loss": -26.600980758666992, "global_step": 422663, "epoch": 5092} {"train_loss": -27.061847686767578, "global_step": 422664, "epoch": 5092} {"train_loss": -27.067113876342773, "global_step": 422665, "epoch": 5092} {"train_loss": -27.061254501342773, "global_step": 422666, "epoch": 5092} {"train_loss": -26.82929039001465, "global_step": 422667, "epoch": 5092} {"train_loss": -26.93405532836914, "global_step": 422668, "epoch": 5092} {"train_loss": -26.74599266052246, "global_step": 422669, "epoch": 5092} {"train_loss": -27.260839462280273, "global_step": 422670, "epoch": 5092} {"train_loss": -26.692956924438477, "global_step": 422671, "epoch": 5092} {"train_loss": -27.126056671142578, "global_step": 422672, "epoch": 5092} {"train_loss": -26.61136245727539, "global_step": 422673, "epoch": 5092} {"train_loss": -26.892850875854492, "global_step": 422674, "epoch": 5092} {"train_loss": -26.92066764831543, "global_step": 422675, "epoch": 5092} {"train_loss": -27.16522789001465, "global_step": 422676, "epoch": 5092} {"train_loss": -26.894697189331055, "global_step": 422677, "epoch": 5092} {"train_loss": -26.902502059936523, "global_step": 422678, "epoch": 5092} {"train_loss": -27.075952529907227, "global_step": 422679, "epoch": 5092} {"train_loss": -27.029006958007812, "global_step": 422680, "epoch": 5092} {"train_loss": -26.900440216064453, "global_step": 422681, "epoch": 5092} {"train_loss": -26.990478515625, "global_step": 422682, "epoch": 5092} {"train_loss": -26.973373413085938, "global_step": 422683, "epoch": 5092} {"train_loss": -26.757404327392578, "global_step": 422684, "epoch": 5092} {"train_loss": -26.81780433654785, "global_step": 422685, "epoch": 5092} {"train_loss": -27.1461124420166, "global_step": 422686, "epoch": 5092} {"train_loss": -26.660261154174805, "global_step": 422687, "epoch": 5092} {"train_loss": -27.039220809936523, "global_step": 422688, "epoch": 5092} {"train_loss": -26.871252059936523, "global_step": 422689, "epoch": 5092} {"train_loss": -26.96298599243164, "global_step": 422690, "epoch": 5092} {"train_loss": -27.078413009643555, "global_step": 422691, "epoch": 5092} {"train_loss": -27.371335983276367, "global_step": 422692, "epoch": 5092} {"train_loss": -27.154321670532227, "global_step": 422693, "epoch": 5092} {"train_loss": -27.1455135345459, "global_step": 422694, "epoch": 5092} {"train_loss": -27.07516860961914, "global_step": 422695, "epoch": 5092} {"train_loss": -26.904769897460938, "global_step": 422696, "epoch": 5092} {"train_loss": -26.852447509765625, "global_step": 422697, "epoch": 5092} {"train_loss": -26.85428237915039, "global_step": 422698, "epoch": 5092} {"train_loss": -26.266193389892578, "global_step": 422699, "epoch": 5092} {"train_loss": -25.954023361206055, "global_step": 422700, "epoch": 5092} {"train_loss": -25.923925399780273, "global_step": 422701, "epoch": 5092} {"train_loss": -26.525964736938477, "global_step": 422702, "epoch": 5092} {"train_loss": -26.2627010345459, "global_step": 422703, "epoch": 5092} {"train_loss": -26.196874618530273, "global_step": 422704, "epoch": 5092} {"train_loss": -26.594329833984375, "global_step": 422705, "epoch": 5092} {"train_loss": -26.635908126831055, "global_step": 422706, "epoch": 5092} {"train_loss": -26.299245834350586, "global_step": 422707, "epoch": 5092} {"train_loss": -26.003782272338867, "global_step": 422708, "epoch": 5092} {"train_loss": -26.95258140563965, "global_step": 422709, "epoch": 5092} {"train_loss": -27.023147583007812, "global_step": 422710, "epoch": 5092} {"train_loss": -26.663284301757812, "global_step": 422711, "epoch": 5092} {"train_loss": -26.55419921875, "global_step": 422712, "epoch": 5092} {"train_loss": -26.6214599609375, "global_step": 422713, "epoch": 5092} {"train_loss": -26.752227783203125, "global_step": 422714, "epoch": 5092} {"train_loss": -26.61159324645996, "global_step": 422715, "epoch": 5092} {"train_loss": -27.123620986938477, "global_step": 422716, "epoch": 5092} {"train_loss": -26.734827041625977, "global_step": 422717, "epoch": 5092} {"train_loss": -26.744938976793403, "global_step": 422718, "epoch": 5092, "val_loss": 7067200.0} {"train_loss": -26.5174503326416, "global_step": 422719, "epoch": 5093} {"train_loss": -26.48512077331543, "global_step": 422720, "epoch": 5093} {"train_loss": -26.436655044555664, "global_step": 422721, "epoch": 5093} {"train_loss": -25.851892471313477, "global_step": 422722, "epoch": 5093} {"train_loss": -26.992231369018555, "global_step": 422723, "epoch": 5093} {"train_loss": -26.452869415283203, "global_step": 422724, "epoch": 5093} {"train_loss": -26.575626373291016, "global_step": 422725, "epoch": 5093} {"train_loss": -26.718976974487305, "global_step": 422726, "epoch": 5093} {"train_loss": -26.770191192626953, "global_step": 422727, "epoch": 5093} {"train_loss": -26.419050216674805, "global_step": 422728, "epoch": 5093} {"train_loss": -26.4571533203125, "global_step": 422729, "epoch": 5093} {"train_loss": -26.635969161987305, "global_step": 422730, "epoch": 5093} {"train_loss": -26.63507652282715, "global_step": 422731, "epoch": 5093} {"train_loss": -26.624847412109375, "global_step": 422732, "epoch": 5093} {"train_loss": -27.199827194213867, "global_step": 422733, "epoch": 5093} {"train_loss": -26.427932739257812, "global_step": 422734, "epoch": 5093} {"train_loss": -26.7268123626709, "global_step": 422735, "epoch": 5093} {"train_loss": -26.785825729370117, "global_step": 422736, "epoch": 5093} {"train_loss": -26.9077091217041, "global_step": 422737, "epoch": 5093} {"train_loss": -26.550384521484375, "global_step": 422738, "epoch": 5093} {"train_loss": -26.4497127532959, "global_step": 422739, "epoch": 5093} {"train_loss": -26.589426040649414, "global_step": 422740, "epoch": 5093} {"train_loss": -27.013824462890625, "global_step": 422741, "epoch": 5093} {"train_loss": -27.004474639892578, "global_step": 422742, "epoch": 5093} {"train_loss": -26.85773277282715, "global_step": 422743, "epoch": 5093} {"train_loss": -26.71736717224121, "global_step": 422744, "epoch": 5093} {"train_loss": -27.038257598876953, "global_step": 422745, "epoch": 5093} {"train_loss": -26.759870529174805, "global_step": 422746, "epoch": 5093} {"train_loss": -27.45685386657715, "global_step": 422747, "epoch": 5093} {"train_loss": -27.117292404174805, "global_step": 422748, "epoch": 5093} {"train_loss": -26.677621841430664, "global_step": 422749, "epoch": 5093} {"train_loss": -26.97466468811035, "global_step": 422750, "epoch": 5093} {"train_loss": -26.818052291870117, "global_step": 422751, "epoch": 5093} {"train_loss": -26.55137062072754, "global_step": 422752, "epoch": 5093} {"train_loss": -27.0106143951416, "global_step": 422753, "epoch": 5093} {"train_loss": -26.8244686126709, "global_step": 422754, "epoch": 5093} {"train_loss": -27.100589752197266, "global_step": 422755, "epoch": 5093} {"train_loss": -26.653644561767578, "global_step": 422756, "epoch": 5093} {"train_loss": -26.854801177978516, "global_step": 422757, "epoch": 5093} {"train_loss": -26.73481559753418, "global_step": 422758, "epoch": 5093} {"train_loss": -26.389554977416992, "global_step": 422759, "epoch": 5093} {"train_loss": -26.669784545898438, "global_step": 422760, "epoch": 5093} {"train_loss": -26.5651912689209, "global_step": 422761, "epoch": 5093} {"train_loss": -26.72879409790039, "global_step": 422762, "epoch": 5093} {"train_loss": -26.805150985717773, "global_step": 422763, "epoch": 5093} {"train_loss": -26.8067684173584, "global_step": 422764, "epoch": 5093} {"train_loss": -26.89460563659668, "global_step": 422765, "epoch": 5093} {"train_loss": -26.770069122314453, "global_step": 422766, "epoch": 5093} {"train_loss": -26.869266510009766, "global_step": 422767, "epoch": 5093} {"train_loss": -26.84555435180664, "global_step": 422768, "epoch": 5093} {"train_loss": -26.700719833374023, "global_step": 422769, "epoch": 5093} {"train_loss": -26.86968421936035, "global_step": 422770, "epoch": 5093} {"train_loss": -26.957599639892578, "global_step": 422771, "epoch": 5093} {"train_loss": -26.55415153503418, "global_step": 422772, "epoch": 5093} {"train_loss": -27.21205711364746, "global_step": 422773, "epoch": 5093} {"train_loss": -26.77374267578125, "global_step": 422774, "epoch": 5093} {"train_loss": -26.830997467041016, "global_step": 422775, "epoch": 5093} {"train_loss": -26.894906997680664, "global_step": 422776, "epoch": 5093} {"train_loss": -26.591552734375, "global_step": 422777, "epoch": 5093} {"train_loss": -26.945951461791992, "global_step": 422778, "epoch": 5093} {"train_loss": -26.577991485595703, "global_step": 422779, "epoch": 5093} {"train_loss": -26.776159286499023, "global_step": 422780, "epoch": 5093} {"train_loss": -27.040878295898438, "global_step": 422781, "epoch": 5093} {"train_loss": -26.920446395874023, "global_step": 422782, "epoch": 5093} {"train_loss": -26.960546493530273, "global_step": 422783, "epoch": 5093} {"train_loss": -26.70570945739746, "global_step": 422784, "epoch": 5093} {"train_loss": -27.011377334594727, "global_step": 422785, "epoch": 5093} {"train_loss": -26.828907012939453, "global_step": 422786, "epoch": 5093} {"train_loss": -26.68195915222168, "global_step": 422787, "epoch": 5093} {"train_loss": -26.326919555664062, "global_step": 422788, "epoch": 5093} {"train_loss": -26.7408390045166, "global_step": 422789, "epoch": 5093} {"train_loss": -27.18635368347168, "global_step": 422790, "epoch": 5093} {"train_loss": -27.003271102905273, "global_step": 422791, "epoch": 5093} {"train_loss": -26.769514083862305, "global_step": 422792, "epoch": 5093} {"train_loss": -26.96152114868164, "global_step": 422793, "epoch": 5093} {"train_loss": -27.194934844970703, "global_step": 422794, "epoch": 5093} {"train_loss": -26.92695426940918, "global_step": 422795, "epoch": 5093} {"train_loss": -26.783117294311523, "global_step": 422796, "epoch": 5093} {"train_loss": -26.834814071655273, "global_step": 422797, "epoch": 5093} {"train_loss": -26.949689865112305, "global_step": 422798, "epoch": 5093} {"train_loss": -26.802143096923828, "global_step": 422799, "epoch": 5093} {"train_loss": -26.79180335998535, "global_step": 422800, "epoch": 5093} {"train_loss": -26.760162744177393, "global_step": 422801, "epoch": 5093, "val_loss": 6983957.0} {"train_loss": -25.203052520751953, "global_step": 422802, "epoch": 5094} {"train_loss": -25.043630599975586, "global_step": 422803, "epoch": 5094} {"train_loss": -26.291303634643555, "global_step": 422804, "epoch": 5094} {"train_loss": -25.97389030456543, "global_step": 422805, "epoch": 5094} {"train_loss": -26.057065963745117, "global_step": 422806, "epoch": 5094} {"train_loss": -26.0202693939209, "global_step": 422807, "epoch": 5094} {"train_loss": -26.172565460205078, "global_step": 422808, "epoch": 5094} {"train_loss": -25.566923141479492, "global_step": 422809, "epoch": 5094} {"train_loss": -26.12837028503418, "global_step": 422810, "epoch": 5094} {"train_loss": -26.39580726623535, "global_step": 422811, "epoch": 5094} {"train_loss": -26.0004825592041, "global_step": 422812, "epoch": 5094} {"train_loss": -26.628698348999023, "global_step": 422813, "epoch": 5094} {"train_loss": -26.437177658081055, "global_step": 422814, "epoch": 5094} {"train_loss": -26.344619750976562, "global_step": 422815, "epoch": 5094} {"train_loss": -26.3226318359375, "global_step": 422816, "epoch": 5094} {"train_loss": -26.376876831054688, "global_step": 422817, "epoch": 5094} {"train_loss": -26.190021514892578, "global_step": 422818, "epoch": 5094} {"train_loss": -26.6406307220459, "global_step": 422819, "epoch": 5094} {"train_loss": -26.76960563659668, "global_step": 422820, "epoch": 5094} {"train_loss": -26.660171508789062, "global_step": 422821, "epoch": 5094} {"train_loss": -26.410629272460938, "global_step": 422822, "epoch": 5094} {"train_loss": -26.638671875, "global_step": 422823, "epoch": 5094} {"train_loss": -26.2275447845459, "global_step": 422824, "epoch": 5094} {"train_loss": -26.77393913269043, "global_step": 422825, "epoch": 5094} {"train_loss": -26.15619468688965, "global_step": 422826, "epoch": 5094} {"train_loss": -26.383047103881836, "global_step": 422827, "epoch": 5094} {"train_loss": -26.788061141967773, "global_step": 422828, "epoch": 5094} {"train_loss": -26.294538497924805, "global_step": 422829, "epoch": 5094} {"train_loss": -26.5341739654541, "global_step": 422830, "epoch": 5094} {"train_loss": -26.587186813354492, "global_step": 422831, "epoch": 5094} {"train_loss": -27.019302368164062, "global_step": 422832, "epoch": 5094} {"train_loss": -26.51437759399414, "global_step": 422833, "epoch": 5094} {"train_loss": -26.746368408203125, "global_step": 422834, "epoch": 5094} {"train_loss": -26.20997428894043, "global_step": 422835, "epoch": 5094} {"train_loss": -26.46357536315918, "global_step": 422836, "epoch": 5094} {"train_loss": -26.87885856628418, "global_step": 422837, "epoch": 5094} {"train_loss": -26.871057510375977, "global_step": 422838, "epoch": 5094} {"train_loss": -27.117816925048828, "global_step": 422839, "epoch": 5094} {"train_loss": -26.726911544799805, "global_step": 422840, "epoch": 5094} {"train_loss": -26.463842391967773, "global_step": 422841, "epoch": 5094} {"train_loss": -26.867294311523438, "global_step": 422842, "epoch": 5094} {"train_loss": -26.49477195739746, "global_step": 422843, "epoch": 5094} {"train_loss": -26.623327255249023, "global_step": 422844, "epoch": 5094} {"train_loss": -26.954870223999023, "global_step": 422845, "epoch": 5094} {"train_loss": -26.720783233642578, "global_step": 422846, "epoch": 5094} {"train_loss": -26.74037742614746, "global_step": 422847, "epoch": 5094} {"train_loss": -26.972457885742188, "global_step": 422848, "epoch": 5094} {"train_loss": -26.861902236938477, "global_step": 422849, "epoch": 5094} {"train_loss": -26.6878604888916, "global_step": 422850, "epoch": 5094} {"train_loss": -27.046476364135742, "global_step": 422851, "epoch": 5094} {"train_loss": -26.999719619750977, "global_step": 422852, "epoch": 5094} {"train_loss": -26.829975128173828, "global_step": 422853, "epoch": 5094} {"train_loss": -26.841323852539062, "global_step": 422854, "epoch": 5094} {"train_loss": -26.875741958618164, "global_step": 422855, "epoch": 5094} {"train_loss": -27.070459365844727, "global_step": 422856, "epoch": 5094} {"train_loss": -27.1766414642334, "global_step": 422857, "epoch": 5094} {"train_loss": -27.114099502563477, "global_step": 422858, "epoch": 5094} {"train_loss": -26.8684024810791, "global_step": 422859, "epoch": 5094} {"train_loss": -27.034137725830078, "global_step": 422860, "epoch": 5094} {"train_loss": -26.90785026550293, "global_step": 422861, "epoch": 5094} {"train_loss": -27.144651412963867, "global_step": 422862, "epoch": 5094} {"train_loss": -27.266733169555664, "global_step": 422863, "epoch": 5094} {"train_loss": -27.207860946655273, "global_step": 422864, "epoch": 5094} {"train_loss": -26.95815086364746, "global_step": 422865, "epoch": 5094} {"train_loss": -26.449176788330078, "global_step": 422866, "epoch": 5094} {"train_loss": -26.929418563842773, "global_step": 422867, "epoch": 5094} {"train_loss": -26.797286987304688, "global_step": 422868, "epoch": 5094} {"train_loss": -26.421356201171875, "global_step": 422869, "epoch": 5094} {"train_loss": -26.4218807220459, "global_step": 422870, "epoch": 5094} {"train_loss": -26.643646240234375, "global_step": 422871, "epoch": 5094} {"train_loss": -27.0799503326416, "global_step": 422872, "epoch": 5094} {"train_loss": -26.490747451782227, "global_step": 422873, "epoch": 5094} {"train_loss": -26.919965744018555, "global_step": 422874, "epoch": 5094} {"train_loss": -26.47255516052246, "global_step": 422875, "epoch": 5094} {"train_loss": -27.074392318725586, "global_step": 422876, "epoch": 5094} {"train_loss": -27.15365982055664, "global_step": 422877, "epoch": 5094} {"train_loss": -26.874372482299805, "global_step": 422878, "epoch": 5094} {"train_loss": -26.32423210144043, "global_step": 422879, "epoch": 5094} {"train_loss": -27.173643112182617, "global_step": 422880, "epoch": 5094} {"train_loss": -26.19300651550293, "global_step": 422881, "epoch": 5094} {"train_loss": -26.498327255249023, "global_step": 422882, "epoch": 5094} {"train_loss": -26.77643394470215, "global_step": 422883, "epoch": 5094} {"train_loss": -26.61283980220197, "global_step": 422884, "epoch": 5094, "val_loss": 7107581.0} {"train_loss": -24.56711769104004, "global_step": 422885, "epoch": 5095} {"train_loss": -23.7007999420166, "global_step": 422886, "epoch": 5095} {"train_loss": -25.03516960144043, "global_step": 422887, "epoch": 5095} {"train_loss": -25.667829513549805, "global_step": 422888, "epoch": 5095} {"train_loss": -25.686304092407227, "global_step": 422889, "epoch": 5095} {"train_loss": -25.78201675415039, "global_step": 422890, "epoch": 5095} {"train_loss": -25.311826705932617, "global_step": 422891, "epoch": 5095} {"train_loss": -26.212549209594727, "global_step": 422892, "epoch": 5095} {"train_loss": -26.218658447265625, "global_step": 422893, "epoch": 5095} {"train_loss": -25.825489044189453, "global_step": 422894, "epoch": 5095} {"train_loss": -26.086217880249023, "global_step": 422895, "epoch": 5095} {"train_loss": -26.39060401916504, "global_step": 422896, "epoch": 5095} {"train_loss": -25.937219619750977, "global_step": 422897, "epoch": 5095} {"train_loss": -26.261640548706055, "global_step": 422898, "epoch": 5095} {"train_loss": -26.092365264892578, "global_step": 422899, "epoch": 5095} {"train_loss": -26.045373916625977, "global_step": 422900, "epoch": 5095} {"train_loss": -25.972187042236328, "global_step": 422901, "epoch": 5095} {"train_loss": -26.120935440063477, "global_step": 422902, "epoch": 5095} {"train_loss": -26.118881225585938, "global_step": 422903, "epoch": 5095} {"train_loss": -26.303604125976562, "global_step": 422904, "epoch": 5095} {"train_loss": -26.221466064453125, "global_step": 422905, "epoch": 5095} {"train_loss": -26.148746490478516, "global_step": 422906, "epoch": 5095} {"train_loss": -26.3638916015625, "global_step": 422907, "epoch": 5095} {"train_loss": -26.5766658782959, "global_step": 422908, "epoch": 5095} {"train_loss": -26.272445678710938, "global_step": 422909, "epoch": 5095} {"train_loss": -27.0133113861084, "global_step": 422910, "epoch": 5095} {"train_loss": -26.733417510986328, "global_step": 422911, "epoch": 5095} {"train_loss": -26.30818748474121, "global_step": 422912, "epoch": 5095} {"train_loss": -26.53098487854004, "global_step": 422913, "epoch": 5095} {"train_loss": -26.692590713500977, "global_step": 422914, "epoch": 5095} {"train_loss": -26.203678131103516, "global_step": 422915, "epoch": 5095} {"train_loss": -26.815433502197266, "global_step": 422916, "epoch": 5095} {"train_loss": -26.683490753173828, "global_step": 422917, "epoch": 5095} {"train_loss": -26.807575225830078, "global_step": 422918, "epoch": 5095} {"train_loss": -26.61227798461914, "global_step": 422919, "epoch": 5095} {"train_loss": -26.894201278686523, "global_step": 422920, "epoch": 5095} {"train_loss": -26.64845085144043, "global_step": 422921, "epoch": 5095} {"train_loss": -26.467884063720703, "global_step": 422922, "epoch": 5095} {"train_loss": -26.792932510375977, "global_step": 422923, "epoch": 5095} {"train_loss": -26.788644790649414, "global_step": 422924, "epoch": 5095} {"train_loss": -26.936025619506836, "global_step": 422925, "epoch": 5095} {"train_loss": -27.083724975585938, "global_step": 422926, "epoch": 5095} {"train_loss": -26.85370445251465, "global_step": 422927, "epoch": 5095} {"train_loss": -26.489770889282227, "global_step": 422928, "epoch": 5095} {"train_loss": -26.7305908203125, "global_step": 422929, "epoch": 5095} {"train_loss": -27.01521110534668, "global_step": 422930, "epoch": 5095} {"train_loss": -26.95407485961914, "global_step": 422931, "epoch": 5095} {"train_loss": -26.8425350189209, "global_step": 422932, "epoch": 5095} {"train_loss": -26.860681533813477, "global_step": 422933, "epoch": 5095} {"train_loss": -27.028472900390625, "global_step": 422934, "epoch": 5095} {"train_loss": -26.911008834838867, "global_step": 422935, "epoch": 5095} {"train_loss": -27.297698974609375, "global_step": 422936, "epoch": 5095} {"train_loss": -26.810453414916992, "global_step": 422937, "epoch": 5095} {"train_loss": -27.137243270874023, "global_step": 422938, "epoch": 5095} {"train_loss": -26.986169815063477, "global_step": 422939, "epoch": 5095} {"train_loss": -27.0067081451416, "global_step": 422940, "epoch": 5095} {"train_loss": -27.22410011291504, "global_step": 422941, "epoch": 5095} {"train_loss": -26.807092666625977, "global_step": 422942, "epoch": 5095} {"train_loss": -26.78299331665039, "global_step": 422943, "epoch": 5095} {"train_loss": -27.027271270751953, "global_step": 422944, "epoch": 5095} {"train_loss": -26.629663467407227, "global_step": 422945, "epoch": 5095} {"train_loss": -26.855026245117188, "global_step": 422946, "epoch": 5095} {"train_loss": -27.080398559570312, "global_step": 422947, "epoch": 5095} {"train_loss": -26.754724502563477, "global_step": 422948, "epoch": 5095} {"train_loss": -26.350446701049805, "global_step": 422949, "epoch": 5095} {"train_loss": -26.500564575195312, "global_step": 422950, "epoch": 5095} {"train_loss": -26.33619499206543, "global_step": 422951, "epoch": 5095} {"train_loss": -26.732868194580078, "global_step": 422952, "epoch": 5095} {"train_loss": -26.358556747436523, "global_step": 422953, "epoch": 5095} {"train_loss": -25.98528480529785, "global_step": 422954, "epoch": 5095} {"train_loss": -27.010513305664062, "global_step": 422955, "epoch": 5095} {"train_loss": -26.555395126342773, "global_step": 422956, "epoch": 5095} {"train_loss": -27.094593048095703, "global_step": 422957, "epoch": 5095} {"train_loss": -26.796457290649414, "global_step": 422958, "epoch": 5095} {"train_loss": -26.797260284423828, "global_step": 422959, "epoch": 5095} {"train_loss": -26.429718017578125, "global_step": 422960, "epoch": 5095} {"train_loss": -26.676061630249023, "global_step": 422961, "epoch": 5095} {"train_loss": -26.810089111328125, "global_step": 422962, "epoch": 5095} {"train_loss": -26.6744384765625, "global_step": 422963, "epoch": 5095} {"train_loss": -27.0760440826416, "global_step": 422964, "epoch": 5095} {"train_loss": -26.945322036743164, "global_step": 422965, "epoch": 5095} {"train_loss": -26.569122314453125, "global_step": 422966, "epoch": 5095} {"train_loss": -26.513897930283143, "global_step": 422967, "epoch": 5095, "val_loss": 7002056.0} {"train_loss": -26.149616241455078, "global_step": 422968, "epoch": 5096} {"train_loss": -26.198638916015625, "global_step": 422969, "epoch": 5096} {"train_loss": -25.98040771484375, "global_step": 422970, "epoch": 5096} {"train_loss": -26.323394775390625, "global_step": 422971, "epoch": 5096} {"train_loss": -26.493427276611328, "global_step": 422972, "epoch": 5096} {"train_loss": -26.23855972290039, "global_step": 422973, "epoch": 5096} {"train_loss": -26.56086540222168, "global_step": 422974, "epoch": 5096} {"train_loss": -26.17030143737793, "global_step": 422975, "epoch": 5096} {"train_loss": -26.48770523071289, "global_step": 422976, "epoch": 5096} {"train_loss": -26.002378463745117, "global_step": 422977, "epoch": 5096} {"train_loss": -26.790302276611328, "global_step": 422978, "epoch": 5096} {"train_loss": -26.18219566345215, "global_step": 422979, "epoch": 5096} {"train_loss": -26.414602279663086, "global_step": 422980, "epoch": 5096} {"train_loss": -26.55649185180664, "global_step": 422981, "epoch": 5096} {"train_loss": -26.607746124267578, "global_step": 422982, "epoch": 5096} {"train_loss": -26.429492950439453, "global_step": 422983, "epoch": 5096} {"train_loss": -26.468891143798828, "global_step": 422984, "epoch": 5096} {"train_loss": -26.40728759765625, "global_step": 422985, "epoch": 5096} {"train_loss": -26.44683265686035, "global_step": 422986, "epoch": 5096} {"train_loss": -27.024084091186523, "global_step": 422987, "epoch": 5096} {"train_loss": -26.636999130249023, "global_step": 422988, "epoch": 5096} {"train_loss": -26.487674713134766, "global_step": 422989, "epoch": 5096} {"train_loss": -26.71709632873535, "global_step": 422990, "epoch": 5096} {"train_loss": -26.651966094970703, "global_step": 422991, "epoch": 5096} {"train_loss": -27.01873779296875, "global_step": 422992, "epoch": 5096} {"train_loss": -26.7108097076416, "global_step": 422993, "epoch": 5096} {"train_loss": -27.05067253112793, "global_step": 422994, "epoch": 5096} {"train_loss": -26.721240997314453, "global_step": 422995, "epoch": 5096} {"train_loss": -26.739770889282227, "global_step": 422996, "epoch": 5096} {"train_loss": -26.714197158813477, "global_step": 422997, "epoch": 5096} {"train_loss": -26.883777618408203, "global_step": 422998, "epoch": 5096} {"train_loss": -27.158740997314453, "global_step": 422999, "epoch": 5096} {"train_loss": -27.043256759643555, "global_step": 423000, "epoch": 5096} {"train_loss": -26.89302635192871, "global_step": 423001, "epoch": 5096} {"train_loss": -26.87224769592285, "global_step": 423002, "epoch": 5096} {"train_loss": -27.10150146484375, "global_step": 423003, "epoch": 5096} {"train_loss": -27.288522720336914, "global_step": 423004, "epoch": 5096} {"train_loss": -26.71770668029785, "global_step": 423005, "epoch": 5096} {"train_loss": -26.75868034362793, "global_step": 423006, "epoch": 5096} {"train_loss": -26.701208114624023, "global_step": 423007, "epoch": 5096} {"train_loss": -27.2298526763916, "global_step": 423008, "epoch": 5096} {"train_loss": -26.880096435546875, "global_step": 423009, "epoch": 5096} {"train_loss": -26.865802764892578, "global_step": 423010, "epoch": 5096} {"train_loss": -27.188501358032227, "global_step": 423011, "epoch": 5096} {"train_loss": -27.0290470123291, "global_step": 423012, "epoch": 5096} {"train_loss": -26.870615005493164, "global_step": 423013, "epoch": 5096} {"train_loss": -26.911352157592773, "global_step": 423014, "epoch": 5096} {"train_loss": -27.10341453552246, "global_step": 423015, "epoch": 5096} {"train_loss": -26.667539596557617, "global_step": 423016, "epoch": 5096} {"train_loss": -26.54412841796875, "global_step": 423017, "epoch": 5096} {"train_loss": -26.277835845947266, "global_step": 423018, "epoch": 5096} {"train_loss": -26.201278686523438, "global_step": 423019, "epoch": 5096} {"train_loss": -25.767744064331055, "global_step": 423020, "epoch": 5096} {"train_loss": -26.427515029907227, "global_step": 423021, "epoch": 5096} {"train_loss": -26.87322998046875, "global_step": 423022, "epoch": 5096} {"train_loss": -26.731521606445312, "global_step": 423023, "epoch": 5096} {"train_loss": -26.232641220092773, "global_step": 423024, "epoch": 5096} {"train_loss": -26.8320369720459, "global_step": 423025, "epoch": 5096} {"train_loss": -27.010766983032227, "global_step": 423026, "epoch": 5096} {"train_loss": -26.34891700744629, "global_step": 423027, "epoch": 5096} {"train_loss": -26.370227813720703, "global_step": 423028, "epoch": 5096} {"train_loss": -26.787015914916992, "global_step": 423029, "epoch": 5096} {"train_loss": -26.744617462158203, "global_step": 423030, "epoch": 5096} {"train_loss": -26.44669532775879, "global_step": 423031, "epoch": 5096} {"train_loss": -26.65268325805664, "global_step": 423032, "epoch": 5096} {"train_loss": -26.770648956298828, "global_step": 423033, "epoch": 5096} {"train_loss": -27.13397789001465, "global_step": 423034, "epoch": 5096} {"train_loss": -26.652219772338867, "global_step": 423035, "epoch": 5096} {"train_loss": -26.541858673095703, "global_step": 423036, "epoch": 5096} {"train_loss": -26.711706161499023, "global_step": 423037, "epoch": 5096} {"train_loss": -26.716840744018555, "global_step": 423038, "epoch": 5096} {"train_loss": -26.69623374938965, "global_step": 423039, "epoch": 5096} {"train_loss": -26.68454933166504, "global_step": 423040, "epoch": 5096} {"train_loss": -27.34394645690918, "global_step": 423041, "epoch": 5096} {"train_loss": -26.826278686523438, "global_step": 423042, "epoch": 5096} {"train_loss": -26.768417358398438, "global_step": 423043, "epoch": 5096} {"train_loss": -26.43625259399414, "global_step": 423044, "epoch": 5096} {"train_loss": -26.91275978088379, "global_step": 423045, "epoch": 5096} {"train_loss": -26.65633201599121, "global_step": 423046, "epoch": 5096} {"train_loss": -26.743921279907227, "global_step": 423047, "epoch": 5096} {"train_loss": -27.092756271362305, "global_step": 423048, "epoch": 5096} {"train_loss": -26.656164169311523, "global_step": 423049, "epoch": 5096} {"train_loss": -26.68901466461549, "global_step": 423050, "epoch": 5096, "val_loss": 7143645.0} {"train_loss": -26.316848754882812, "global_step": 423051, "epoch": 5097} {"train_loss": -26.46721839904785, "global_step": 423052, "epoch": 5097} {"train_loss": -26.4881534576416, "global_step": 423053, "epoch": 5097} {"train_loss": -26.280969619750977, "global_step": 423054, "epoch": 5097} {"train_loss": -26.352832794189453, "global_step": 423055, "epoch": 5097} {"train_loss": -26.700727462768555, "global_step": 423056, "epoch": 5097} {"train_loss": -26.438053131103516, "global_step": 423057, "epoch": 5097} {"train_loss": -26.615812301635742, "global_step": 423058, "epoch": 5097} {"train_loss": -26.951553344726562, "global_step": 423059, "epoch": 5097} {"train_loss": -26.391193389892578, "global_step": 423060, "epoch": 5097} {"train_loss": -26.695104598999023, "global_step": 423061, "epoch": 5097} {"train_loss": -26.752965927124023, "global_step": 423062, "epoch": 5097} {"train_loss": -26.509124755859375, "global_step": 423063, "epoch": 5097} {"train_loss": -26.825061798095703, "global_step": 423064, "epoch": 5097} {"train_loss": -26.489892959594727, "global_step": 423065, "epoch": 5097} {"train_loss": -26.266284942626953, "global_step": 423066, "epoch": 5097} {"train_loss": -26.62139892578125, "global_step": 423067, "epoch": 5097} {"train_loss": -26.55816650390625, "global_step": 423068, "epoch": 5097} {"train_loss": -26.785181045532227, "global_step": 423069, "epoch": 5097} {"train_loss": -26.650405883789062, "global_step": 423070, "epoch": 5097} {"train_loss": -26.992950439453125, "global_step": 423071, "epoch": 5097} {"train_loss": -26.445173263549805, "global_step": 423072, "epoch": 5097} {"train_loss": -27.137054443359375, "global_step": 423073, "epoch": 5097} {"train_loss": -26.442853927612305, "global_step": 423074, "epoch": 5097} {"train_loss": -26.811193466186523, "global_step": 423075, "epoch": 5097} {"train_loss": -26.40974235534668, "global_step": 423076, "epoch": 5097} {"train_loss": -26.93329429626465, "global_step": 423077, "epoch": 5097} {"train_loss": -27.100021362304688, "global_step": 423078, "epoch": 5097} {"train_loss": -27.07501792907715, "global_step": 423079, "epoch": 5097} {"train_loss": -26.919391632080078, "global_step": 423080, "epoch": 5097} {"train_loss": -26.671300888061523, "global_step": 423081, "epoch": 5097} {"train_loss": -26.717649459838867, "global_step": 423082, "epoch": 5097} {"train_loss": -27.129297256469727, "global_step": 423083, "epoch": 5097} {"train_loss": -26.826318740844727, "global_step": 423084, "epoch": 5097} {"train_loss": -26.32535743713379, "global_step": 423085, "epoch": 5097} {"train_loss": -26.747838973999023, "global_step": 423086, "epoch": 5097} {"train_loss": -27.166614532470703, "global_step": 423087, "epoch": 5097} {"train_loss": -26.72170066833496, "global_step": 423088, "epoch": 5097} {"train_loss": -26.534513473510742, "global_step": 423089, "epoch": 5097} {"train_loss": -26.980512619018555, "global_step": 423090, "epoch": 5097} {"train_loss": -26.86309814453125, "global_step": 423091, "epoch": 5097} {"train_loss": -26.702911376953125, "global_step": 423092, "epoch": 5097} {"train_loss": -26.923593521118164, "global_step": 423093, "epoch": 5097} {"train_loss": -26.90248680114746, "global_step": 423094, "epoch": 5097} {"train_loss": -26.699609756469727, "global_step": 423095, "epoch": 5097} {"train_loss": -26.968505859375, "global_step": 423096, "epoch": 5097} {"train_loss": -27.0294246673584, "global_step": 423097, "epoch": 5097} {"train_loss": -27.07807731628418, "global_step": 423098, "epoch": 5097} {"train_loss": -26.86567497253418, "global_step": 423099, "epoch": 5097} {"train_loss": -26.7833194732666, "global_step": 423100, "epoch": 5097} {"train_loss": -26.46550941467285, "global_step": 423101, "epoch": 5097} {"train_loss": -26.685449600219727, "global_step": 423102, "epoch": 5097} {"train_loss": -27.003767013549805, "global_step": 423103, "epoch": 5097} {"train_loss": -26.884296417236328, "global_step": 423104, "epoch": 5097} {"train_loss": -26.92283058166504, "global_step": 423105, "epoch": 5097} {"train_loss": -27.20081901550293, "global_step": 423106, "epoch": 5097} {"train_loss": -27.283557891845703, "global_step": 423107, "epoch": 5097} {"train_loss": -26.75006103515625, "global_step": 423108, "epoch": 5097} {"train_loss": -27.023298263549805, "global_step": 423109, "epoch": 5097} {"train_loss": -27.220808029174805, "global_step": 423110, "epoch": 5097} {"train_loss": -27.14778709411621, "global_step": 423111, "epoch": 5097} {"train_loss": -26.677576065063477, "global_step": 423112, "epoch": 5097} {"train_loss": -26.7719669342041, "global_step": 423113, "epoch": 5097} {"train_loss": -27.01154136657715, "global_step": 423114, "epoch": 5097} {"train_loss": -26.668622970581055, "global_step": 423115, "epoch": 5097} {"train_loss": -26.79754066467285, "global_step": 423116, "epoch": 5097} {"train_loss": -26.90862464904785, "global_step": 423117, "epoch": 5097} {"train_loss": -26.958959579467773, "global_step": 423118, "epoch": 5097} {"train_loss": -26.89374351501465, "global_step": 423119, "epoch": 5097} {"train_loss": -26.796356201171875, "global_step": 423120, "epoch": 5097} {"train_loss": -26.654438018798828, "global_step": 423121, "epoch": 5097} {"train_loss": -26.612852096557617, "global_step": 423122, "epoch": 5097} {"train_loss": -26.948339462280273, "global_step": 423123, "epoch": 5097} {"train_loss": -26.634092330932617, "global_step": 423124, "epoch": 5097} {"train_loss": -25.971515655517578, "global_step": 423125, "epoch": 5097} {"train_loss": -26.1355037689209, "global_step": 423126, "epoch": 5097} {"train_loss": -25.98709487915039, "global_step": 423127, "epoch": 5097} {"train_loss": -26.609683990478516, "global_step": 423128, "epoch": 5097} {"train_loss": -26.714685440063477, "global_step": 423129, "epoch": 5097} {"train_loss": -26.470874786376953, "global_step": 423130, "epoch": 5097} {"train_loss": -26.10321044921875, "global_step": 423131, "epoch": 5097} {"train_loss": -26.598907470703125, "global_step": 423132, "epoch": 5097} {"train_loss": -26.712512119706854, "global_step": 423133, "epoch": 5097, "val_loss": 7160859.0} {"train_loss": -26.144384384155273, "global_step": 423134, "epoch": 5098} {"train_loss": -26.24606704711914, "global_step": 423135, "epoch": 5098} {"train_loss": -25.60003662109375, "global_step": 423136, "epoch": 5098} {"train_loss": -25.971723556518555, "global_step": 423137, "epoch": 5098} {"train_loss": -25.916391372680664, "global_step": 423138, "epoch": 5098} {"train_loss": -26.06500816345215, "global_step": 423139, "epoch": 5098} {"train_loss": -26.04957389831543, "global_step": 423140, "epoch": 5098} {"train_loss": -26.32623291015625, "global_step": 423141, "epoch": 5098} {"train_loss": -26.17401695251465, "global_step": 423142, "epoch": 5098} {"train_loss": -24.684228897094727, "global_step": 423143, "epoch": 5098} {"train_loss": -26.2994441986084, "global_step": 423144, "epoch": 5098} {"train_loss": -26.204944610595703, "global_step": 423145, "epoch": 5098} {"train_loss": -26.288288116455078, "global_step": 423146, "epoch": 5098} {"train_loss": -26.4190731048584, "global_step": 423147, "epoch": 5098} {"train_loss": -26.306396484375, "global_step": 423148, "epoch": 5098} {"train_loss": -26.2437744140625, "global_step": 423149, "epoch": 5098} {"train_loss": -26.58713150024414, "global_step": 423150, "epoch": 5098} {"train_loss": -26.165607452392578, "global_step": 423151, "epoch": 5098} {"train_loss": -26.75090980529785, "global_step": 423152, "epoch": 5098} {"train_loss": -26.311803817749023, "global_step": 423153, "epoch": 5098} {"train_loss": -26.27705192565918, "global_step": 423154, "epoch": 5098} {"train_loss": -26.231618881225586, "global_step": 423155, "epoch": 5098} {"train_loss": -26.620649337768555, "global_step": 423156, "epoch": 5098} {"train_loss": -26.387243270874023, "global_step": 423157, "epoch": 5098} {"train_loss": -26.726362228393555, "global_step": 423158, "epoch": 5098} {"train_loss": -26.594213485717773, "global_step": 423159, "epoch": 5098} {"train_loss": -26.888097763061523, "global_step": 423160, "epoch": 5098} {"train_loss": -26.711156845092773, "global_step": 423161, "epoch": 5098} {"train_loss": -26.610092163085938, "global_step": 423162, "epoch": 5098} {"train_loss": -26.71845817565918, "global_step": 423163, "epoch": 5098} {"train_loss": -26.565977096557617, "global_step": 423164, "epoch": 5098} {"train_loss": -26.617084503173828, "global_step": 423165, "epoch": 5098} {"train_loss": -27.0120906829834, "global_step": 423166, "epoch": 5098} {"train_loss": -26.87697410583496, "global_step": 423167, "epoch": 5098} {"train_loss": -26.568586349487305, "global_step": 423168, "epoch": 5098} {"train_loss": -26.87017822265625, "global_step": 423169, "epoch": 5098} {"train_loss": -26.65712547302246, "global_step": 423170, "epoch": 5098} {"train_loss": -26.955907821655273, "global_step": 423171, "epoch": 5098} {"train_loss": -27.113998413085938, "global_step": 423172, "epoch": 5098} {"train_loss": -26.999622344970703, "global_step": 423173, "epoch": 5098} {"train_loss": -27.028745651245117, "global_step": 423174, "epoch": 5098} {"train_loss": -26.797143936157227, "global_step": 423175, "epoch": 5098} {"train_loss": -26.70319938659668, "global_step": 423176, "epoch": 5098} {"train_loss": -26.914779663085938, "global_step": 423177, "epoch": 5098} {"train_loss": -26.81287956237793, "global_step": 423178, "epoch": 5098} {"train_loss": -27.18617057800293, "global_step": 423179, "epoch": 5098} {"train_loss": -27.284732818603516, "global_step": 423180, "epoch": 5098} {"train_loss": -26.94952392578125, "global_step": 423181, "epoch": 5098} {"train_loss": -27.191251754760742, "global_step": 423182, "epoch": 5098} {"train_loss": -26.982763290405273, "global_step": 423183, "epoch": 5098} {"train_loss": -26.84242820739746, "global_step": 423184, "epoch": 5098} {"train_loss": -26.704944610595703, "global_step": 423185, "epoch": 5098} {"train_loss": -26.796152114868164, "global_step": 423186, "epoch": 5098} {"train_loss": -26.967578887939453, "global_step": 423187, "epoch": 5098} {"train_loss": -27.042688369750977, "global_step": 423188, "epoch": 5098} {"train_loss": -26.906042098999023, "global_step": 423189, "epoch": 5098} {"train_loss": -26.841100692749023, "global_step": 423190, "epoch": 5098} {"train_loss": -27.34974479675293, "global_step": 423191, "epoch": 5098} {"train_loss": -26.894067764282227, "global_step": 423192, "epoch": 5098} {"train_loss": -26.833038330078125, "global_step": 423193, "epoch": 5098} {"train_loss": -26.84003257751465, "global_step": 423194, "epoch": 5098} {"train_loss": -27.183948516845703, "global_step": 423195, "epoch": 5098} {"train_loss": -27.13616943359375, "global_step": 423196, "epoch": 5098} {"train_loss": -27.223438262939453, "global_step": 423197, "epoch": 5098} {"train_loss": -26.818164825439453, "global_step": 423198, "epoch": 5098} {"train_loss": -26.91933250427246, "global_step": 423199, "epoch": 5098} {"train_loss": -26.864843368530273, "global_step": 423200, "epoch": 5098} {"train_loss": -27.07086753845215, "global_step": 423201, "epoch": 5098} {"train_loss": -26.241363525390625, "global_step": 423202, "epoch": 5098} {"train_loss": -26.092426300048828, "global_step": 423203, "epoch": 5098} {"train_loss": -26.22861099243164, "global_step": 423204, "epoch": 5098} {"train_loss": -26.131244659423828, "global_step": 423205, "epoch": 5098} {"train_loss": -26.2664737701416, "global_step": 423206, "epoch": 5098} {"train_loss": -26.57735252380371, "global_step": 423207, "epoch": 5098} {"train_loss": -26.458784103393555, "global_step": 423208, "epoch": 5098} {"train_loss": -26.362903594970703, "global_step": 423209, "epoch": 5098} {"train_loss": -26.12468910217285, "global_step": 423210, "epoch": 5098} {"train_loss": -26.71473503112793, "global_step": 423211, "epoch": 5098} {"train_loss": -26.383365631103516, "global_step": 423212, "epoch": 5098} {"train_loss": -26.511621475219727, "global_step": 423213, "epoch": 5098} {"train_loss": -26.45176124572754, "global_step": 423214, "epoch": 5098} {"train_loss": -26.625951766967773, "global_step": 423215, "epoch": 5098} {"train_loss": -26.626025027539356, "global_step": 423216, "epoch": 5098, "val_loss": 6944783.0} {"train_loss": -26.26358985900879, "global_step": 423217, "epoch": 5099} {"train_loss": -26.2249755859375, "global_step": 423218, "epoch": 5099} {"train_loss": -26.382293701171875, "global_step": 423219, "epoch": 5099} {"train_loss": -26.30182456970215, "global_step": 423220, "epoch": 5099} {"train_loss": -26.21876335144043, "global_step": 423221, "epoch": 5099} {"train_loss": -26.724761962890625, "global_step": 423222, "epoch": 5099} {"train_loss": -26.728437423706055, "global_step": 423223, "epoch": 5099} {"train_loss": -26.3231258392334, "global_step": 423224, "epoch": 5099} {"train_loss": -26.516489028930664, "global_step": 423225, "epoch": 5099} {"train_loss": -26.54253578186035, "global_step": 423226, "epoch": 5099} {"train_loss": -26.557382583618164, "global_step": 423227, "epoch": 5099} {"train_loss": -26.58805274963379, "global_step": 423228, "epoch": 5099} {"train_loss": -26.446929931640625, "global_step": 423229, "epoch": 5099} {"train_loss": -26.617029190063477, "global_step": 423230, "epoch": 5099} {"train_loss": -26.82285499572754, "global_step": 423231, "epoch": 5099} {"train_loss": -26.598560333251953, "global_step": 423232, "epoch": 5099} {"train_loss": -26.680328369140625, "global_step": 423233, "epoch": 5099} {"train_loss": -26.78204917907715, "global_step": 423234, "epoch": 5099} {"train_loss": -27.030231475830078, "global_step": 423235, "epoch": 5099} {"train_loss": -26.65479850769043, "global_step": 423236, "epoch": 5099} {"train_loss": -26.491361618041992, "global_step": 423237, "epoch": 5099} {"train_loss": -26.793554306030273, "global_step": 423238, "epoch": 5099} {"train_loss": -27.282608032226562, "global_step": 423239, "epoch": 5099} {"train_loss": -26.837554931640625, "global_step": 423240, "epoch": 5099} {"train_loss": -26.901697158813477, "global_step": 423241, "epoch": 5099} {"train_loss": -26.551834106445312, "global_step": 423242, "epoch": 5099} {"train_loss": -26.73801040649414, "global_step": 423243, "epoch": 5099} {"train_loss": -26.709115982055664, "global_step": 423244, "epoch": 5099} {"train_loss": -26.688385009765625, "global_step": 423245, "epoch": 5099} {"train_loss": -26.721704483032227, "global_step": 423246, "epoch": 5099} {"train_loss": -26.904272079467773, "global_step": 423247, "epoch": 5099} {"train_loss": -26.77762794494629, "global_step": 423248, "epoch": 5099} {"train_loss": -26.9233455657959, "global_step": 423249, "epoch": 5099} {"train_loss": -26.84222412109375, "global_step": 423250, "epoch": 5099} {"train_loss": -26.949979782104492, "global_step": 423251, "epoch": 5099} {"train_loss": -26.9199161529541, "global_step": 423252, "epoch": 5099} {"train_loss": -27.033552169799805, "global_step": 423253, "epoch": 5099} {"train_loss": -26.793212890625, "global_step": 423254, "epoch": 5099} {"train_loss": -27.190235137939453, "global_step": 423255, "epoch": 5099} {"train_loss": -26.986591339111328, "global_step": 423256, "epoch": 5099} {"train_loss": -26.734344482421875, "global_step": 423257, "epoch": 5099} {"train_loss": -27.06130027770996, "global_step": 423258, "epoch": 5099} {"train_loss": -27.3944091796875, "global_step": 423259, "epoch": 5099} {"train_loss": -26.907445907592773, "global_step": 423260, "epoch": 5099} {"train_loss": -27.11508560180664, "global_step": 423261, "epoch": 5099} {"train_loss": -27.218305587768555, "global_step": 423262, "epoch": 5099} {"train_loss": -26.906164169311523, "global_step": 423263, "epoch": 5099} {"train_loss": -27.00697898864746, "global_step": 423264, "epoch": 5099} {"train_loss": -26.9634952545166, "global_step": 423265, "epoch": 5099} {"train_loss": -26.983118057250977, "global_step": 423266, "epoch": 5099} {"train_loss": -27.25703239440918, "global_step": 423267, "epoch": 5099} {"train_loss": -26.88385581970215, "global_step": 423268, "epoch": 5099} {"train_loss": -26.864404678344727, "global_step": 423269, "epoch": 5099} {"train_loss": -26.91428565979004, "global_step": 423270, "epoch": 5099} {"train_loss": -26.74139404296875, "global_step": 423271, "epoch": 5099} {"train_loss": -27.13164710998535, "global_step": 423272, "epoch": 5099} {"train_loss": -26.718658447265625, "global_step": 423273, "epoch": 5099} {"train_loss": -26.903539657592773, "global_step": 423274, "epoch": 5099} {"train_loss": -27.055967330932617, "global_step": 423275, "epoch": 5099} {"train_loss": -26.421875, "global_step": 423276, "epoch": 5099} {"train_loss": -26.8928165435791, "global_step": 423277, "epoch": 5099} {"train_loss": -25.79715919494629, "global_step": 423278, "epoch": 5099} {"train_loss": -25.256681442260742, "global_step": 423279, "epoch": 5099} {"train_loss": -24.007797241210938, "global_step": 423280, "epoch": 5099} {"train_loss": -25.9201602935791, "global_step": 423281, "epoch": 5099} {"train_loss": -26.407108306884766, "global_step": 423282, "epoch": 5099} {"train_loss": -26.261152267456055, "global_step": 423283, "epoch": 5099} {"train_loss": -26.651611328125, "global_step": 423284, "epoch": 5099} {"train_loss": -26.24713134765625, "global_step": 423285, "epoch": 5099} {"train_loss": -26.994409561157227, "global_step": 423286, "epoch": 5099} {"train_loss": -26.604476928710938, "global_step": 423287, "epoch": 5099} {"train_loss": -26.73848533630371, "global_step": 423288, "epoch": 5099} {"train_loss": -26.50018882751465, "global_step": 423289, "epoch": 5099} {"train_loss": -26.752979278564453, "global_step": 423290, "epoch": 5099} {"train_loss": -26.556798934936523, "global_step": 423291, "epoch": 5099} {"train_loss": -26.60660171508789, "global_step": 423292, "epoch": 5099} {"train_loss": -26.561094284057617, "global_step": 423293, "epoch": 5099} {"train_loss": -26.580530166625977, "global_step": 423294, "epoch": 5099} {"train_loss": -27.074542999267578, "global_step": 423295, "epoch": 5099} {"train_loss": -26.841064453125, "global_step": 423296, "epoch": 5099} {"train_loss": -26.72633171081543, "global_step": 423297, "epoch": 5099} {"train_loss": -26.474990844726562, "global_step": 423298, "epoch": 5099} {"train_loss": -26.66274544129889, "global_step": 423299, "epoch": 5099, "val_loss": 7021416.0} {"train_loss": -26.318710327148438, "global_step": 423300, "epoch": 5100} {"train_loss": -26.28464698791504, "global_step": 423301, "epoch": 5100} {"train_loss": -26.550323486328125, "global_step": 423302, "epoch": 5100} {"train_loss": -26.38981056213379, "global_step": 423303, "epoch": 5100} {"train_loss": -26.458972930908203, "global_step": 423304, "epoch": 5100} {"train_loss": -26.181018829345703, "global_step": 423305, "epoch": 5100} {"train_loss": -26.208829879760742, "global_step": 423306, "epoch": 5100} {"train_loss": -27.07734489440918, "global_step": 423307, "epoch": 5100} {"train_loss": -26.522022247314453, "global_step": 423308, "epoch": 5100} {"train_loss": -26.37458610534668, "global_step": 423309, "epoch": 5100} {"train_loss": -26.365320205688477, "global_step": 423310, "epoch": 5100} {"train_loss": -26.711462020874023, "global_step": 423311, "epoch": 5100} {"train_loss": -26.614728927612305, "global_step": 423312, "epoch": 5100} {"train_loss": -26.204755783081055, "global_step": 423313, "epoch": 5100} {"train_loss": -26.46917152404785, "global_step": 423314, "epoch": 5100} {"train_loss": -26.948902130126953, "global_step": 423315, "epoch": 5100} {"train_loss": -26.608346939086914, "global_step": 423316, "epoch": 5100} {"train_loss": -26.805866241455078, "global_step": 423317, "epoch": 5100} {"train_loss": -26.73651695251465, "global_step": 423318, "epoch": 5100} {"train_loss": -26.860736846923828, "global_step": 423319, "epoch": 5100} {"train_loss": -26.755590438842773, "global_step": 423320, "epoch": 5100} {"train_loss": -27.02808952331543, "global_step": 423321, "epoch": 5100} {"train_loss": -26.77985954284668, "global_step": 423322, "epoch": 5100} {"train_loss": -27.20462989807129, "global_step": 423323, "epoch": 5100} {"train_loss": -27.01788330078125, "global_step": 423324, "epoch": 5100} {"train_loss": -26.933639526367188, "global_step": 423325, "epoch": 5100} {"train_loss": -26.789365768432617, "global_step": 423326, "epoch": 5100} {"train_loss": -26.89495849609375, "global_step": 423327, "epoch": 5100} {"train_loss": -27.105600357055664, "global_step": 423328, "epoch": 5100} {"train_loss": -26.501617431640625, "global_step": 423329, "epoch": 5100} {"train_loss": -26.6402645111084, "global_step": 423330, "epoch": 5100} {"train_loss": -27.116180419921875, "global_step": 423331, "epoch": 5100} {"train_loss": -27.0761775970459, "global_step": 423332, "epoch": 5100} {"train_loss": -26.788070678710938, "global_step": 423333, "epoch": 5100} {"train_loss": -26.83009147644043, "global_step": 423334, "epoch": 5100} {"train_loss": -27.086444854736328, "global_step": 423335, "epoch": 5100} {"train_loss": -26.830551147460938, "global_step": 423336, "epoch": 5100} {"train_loss": -26.568649291992188, "global_step": 423337, "epoch": 5100} {"train_loss": -26.545080184936523, "global_step": 423338, "epoch": 5100} {"train_loss": -27.38270378112793, "global_step": 423339, "epoch": 5100} {"train_loss": -26.822851181030273, "global_step": 423340, "epoch": 5100} {"train_loss": -26.773880004882812, "global_step": 423341, "epoch": 5100} {"train_loss": -26.987491607666016, "global_step": 423342, "epoch": 5100} {"train_loss": -26.604633331298828, "global_step": 423343, "epoch": 5100} {"train_loss": -26.89652442932129, "global_step": 423344, "epoch": 5100} {"train_loss": -26.947290420532227, "global_step": 423345, "epoch": 5100} {"train_loss": -26.65717887878418, "global_step": 423346, "epoch": 5100} {"train_loss": -26.827558517456055, "global_step": 423347, "epoch": 5100} {"train_loss": -26.24677085876465, "global_step": 423348, "epoch": 5100} {"train_loss": -26.75274658203125, "global_step": 423349, "epoch": 5100} {"train_loss": -26.743743896484375, "global_step": 423350, "epoch": 5100} {"train_loss": -26.839252471923828, "global_step": 423351, "epoch": 5100} {"train_loss": -26.542821884155273, "global_step": 423352, "epoch": 5100} {"train_loss": -26.42803955078125, "global_step": 423353, "epoch": 5100} {"train_loss": -26.462356567382812, "global_step": 423354, "epoch": 5100} {"train_loss": -26.693622589111328, "global_step": 423355, "epoch": 5100} {"train_loss": -26.96845054626465, "global_step": 423356, "epoch": 5100} {"train_loss": -27.088720321655273, "global_step": 423357, "epoch": 5100} {"train_loss": -26.817371368408203, "global_step": 423358, "epoch": 5100} {"train_loss": -26.7479190826416, "global_step": 423359, "epoch": 5100} {"train_loss": -27.207136154174805, "global_step": 423360, "epoch": 5100} {"train_loss": -27.149450302124023, "global_step": 423361, "epoch": 5100} {"train_loss": -26.755788803100586, "global_step": 423362, "epoch": 5100} {"train_loss": -26.920408248901367, "global_step": 423363, "epoch": 5100} {"train_loss": -27.54889488220215, "global_step": 423364, "epoch": 5100} {"train_loss": -26.900663375854492, "global_step": 423365, "epoch": 5100} {"train_loss": -27.13459587097168, "global_step": 423366, "epoch": 5100} {"train_loss": -27.214481353759766, "global_step": 423367, "epoch": 5100} {"train_loss": -27.22340202331543, "global_step": 423368, "epoch": 5100} {"train_loss": -26.92911720275879, "global_step": 423369, "epoch": 5100} {"train_loss": -27.083948135375977, "global_step": 423370, "epoch": 5100} {"train_loss": -27.166645050048828, "global_step": 423371, "epoch": 5100} {"train_loss": -27.125843048095703, "global_step": 423372, "epoch": 5100} {"train_loss": -27.008899688720703, "global_step": 423373, "epoch": 5100} {"train_loss": -26.774343490600586, "global_step": 423374, "epoch": 5100} {"train_loss": -26.62152099609375, "global_step": 423375, "epoch": 5100} {"train_loss": -27.144275665283203, "global_step": 423376, "epoch": 5100} {"train_loss": -26.933536529541016, "global_step": 423377, "epoch": 5100} {"train_loss": -26.638629913330078, "global_step": 423378, "epoch": 5100} {"train_loss": -26.986474990844727, "global_step": 423379, "epoch": 5100} {"train_loss": -26.838537216186523, "global_step": 423380, "epoch": 5100} {"train_loss": -26.71455192565918, "global_step": 423381, "epoch": 5100} {"train_loss": -26.784234196306713, "global_step": 423382, "epoch": 5100, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9545454545454546, "val_loss": 6918234.0} {"train_loss": -25.75152587890625, "global_step": 423383, "epoch": 5101} {"train_loss": -26.1165828704834, "global_step": 423384, "epoch": 5101} {"train_loss": -26.181121826171875, "global_step": 423385, "epoch": 5101} {"train_loss": -25.706552505493164, "global_step": 423386, "epoch": 5101} {"train_loss": -25.398792266845703, "global_step": 423387, "epoch": 5101} {"train_loss": -26.255355834960938, "global_step": 423388, "epoch": 5101} {"train_loss": -26.091064453125, "global_step": 423389, "epoch": 5101} {"train_loss": -26.352869033813477, "global_step": 423390, "epoch": 5101} {"train_loss": -26.289081573486328, "global_step": 423391, "epoch": 5101} {"train_loss": -26.293750762939453, "global_step": 423392, "epoch": 5101} {"train_loss": -26.096820831298828, "global_step": 423393, "epoch": 5101} {"train_loss": -25.97247886657715, "global_step": 423394, "epoch": 5101} {"train_loss": -26.48661231994629, "global_step": 423395, "epoch": 5101} {"train_loss": -26.314273834228516, "global_step": 423396, "epoch": 5101} {"train_loss": -25.995019912719727, "global_step": 423397, "epoch": 5101} {"train_loss": -26.371601104736328, "global_step": 423398, "epoch": 5101} {"train_loss": -26.496564865112305, "global_step": 423399, "epoch": 5101} {"train_loss": -26.44353675842285, "global_step": 423400, "epoch": 5101} {"train_loss": -26.527069091796875, "global_step": 423401, "epoch": 5101} {"train_loss": -27.08307456970215, "global_step": 423402, "epoch": 5101} {"train_loss": -26.448657989501953, "global_step": 423403, "epoch": 5101} {"train_loss": -26.4725284576416, "global_step": 423404, "epoch": 5101} {"train_loss": -26.413095474243164, "global_step": 423405, "epoch": 5101} {"train_loss": -26.24781608581543, "global_step": 423406, "epoch": 5101} {"train_loss": -26.481369018554688, "global_step": 423407, "epoch": 5101} {"train_loss": -26.6264705657959, "global_step": 423408, "epoch": 5101} {"train_loss": -26.600372314453125, "global_step": 423409, "epoch": 5101} {"train_loss": -26.8433780670166, "global_step": 423410, "epoch": 5101} {"train_loss": -26.851425170898438, "global_step": 423411, "epoch": 5101} {"train_loss": -26.751373291015625, "global_step": 423412, "epoch": 5101} {"train_loss": -26.71048927307129, "global_step": 423413, "epoch": 5101} {"train_loss": -26.927204132080078, "global_step": 423414, "epoch": 5101} {"train_loss": -26.84012794494629, "global_step": 423415, "epoch": 5101} {"train_loss": -26.617679595947266, "global_step": 423416, "epoch": 5101} {"train_loss": -27.11317253112793, "global_step": 423417, "epoch": 5101} {"train_loss": -26.84967613220215, "global_step": 423418, "epoch": 5101} {"train_loss": -26.782855987548828, "global_step": 423419, "epoch": 5101} {"train_loss": -27.052799224853516, "global_step": 423420, "epoch": 5101} {"train_loss": -26.77374267578125, "global_step": 423421, "epoch": 5101} {"train_loss": -26.891199111938477, "global_step": 423422, "epoch": 5101} {"train_loss": -27.004962921142578, "global_step": 423423, "epoch": 5101} {"train_loss": -26.769800186157227, "global_step": 423424, "epoch": 5101} {"train_loss": -26.581470489501953, "global_step": 423425, "epoch": 5101} {"train_loss": -26.5887451171875, "global_step": 423426, "epoch": 5101} {"train_loss": -26.820173263549805, "global_step": 423427, "epoch": 5101} {"train_loss": -26.782011032104492, "global_step": 423428, "epoch": 5101} {"train_loss": -26.650442123413086, "global_step": 423429, "epoch": 5101} {"train_loss": -26.445556640625, "global_step": 423430, "epoch": 5101} {"train_loss": -26.956619262695312, "global_step": 423431, "epoch": 5101} {"train_loss": -27.06731605529785, "global_step": 423432, "epoch": 5101} {"train_loss": -27.366811752319336, "global_step": 423433, "epoch": 5101} {"train_loss": -26.833637237548828, "global_step": 423434, "epoch": 5101} {"train_loss": -26.782556533813477, "global_step": 423435, "epoch": 5101} {"train_loss": -26.828577041625977, "global_step": 423436, "epoch": 5101} {"train_loss": -27.366804122924805, "global_step": 423437, "epoch": 5101} {"train_loss": -26.71510124206543, "global_step": 423438, "epoch": 5101} {"train_loss": -27.226449966430664, "global_step": 423439, "epoch": 5101} {"train_loss": -26.877765655517578, "global_step": 423440, "epoch": 5101} {"train_loss": -26.79597282409668, "global_step": 423441, "epoch": 5101} {"train_loss": -27.05293083190918, "global_step": 423442, "epoch": 5101} {"train_loss": -27.10445213317871, "global_step": 423443, "epoch": 5101} {"train_loss": -26.68548583984375, "global_step": 423444, "epoch": 5101} {"train_loss": -26.75497817993164, "global_step": 423445, "epoch": 5101} {"train_loss": -27.088708877563477, "global_step": 423446, "epoch": 5101} {"train_loss": -26.862106323242188, "global_step": 423447, "epoch": 5101} {"train_loss": -26.913803100585938, "global_step": 423448, "epoch": 5101} {"train_loss": -26.422164916992188, "global_step": 423449, "epoch": 5101} {"train_loss": -27.245960235595703, "global_step": 423450, "epoch": 5101} {"train_loss": -27.109228134155273, "global_step": 423451, "epoch": 5101} {"train_loss": -26.86634635925293, "global_step": 423452, "epoch": 5101} {"train_loss": -26.732868194580078, "global_step": 423453, "epoch": 5101} {"train_loss": -26.511859893798828, "global_step": 423454, "epoch": 5101} {"train_loss": -26.885639190673828, "global_step": 423455, "epoch": 5101} {"train_loss": -27.300891876220703, "global_step": 423456, "epoch": 5101} {"train_loss": -26.82172203063965, "global_step": 423457, "epoch": 5101} {"train_loss": -26.343994140625, "global_step": 423458, "epoch": 5101} {"train_loss": -26.779682159423828, "global_step": 423459, "epoch": 5101} {"train_loss": -26.57377052307129, "global_step": 423460, "epoch": 5101} {"train_loss": -26.813919067382812, "global_step": 423461, "epoch": 5101} {"train_loss": -26.717016220092773, "global_step": 423462, "epoch": 5101} {"train_loss": -26.858152389526367, "global_step": 423463, "epoch": 5101} {"train_loss": -26.642333984375, "global_step": 423464, "epoch": 5101} {"train_loss": -26.655318639364587, "global_step": 423465, "epoch": 5101, "val_loss": 6920369.0} {"train_loss": -26.017688751220703, "global_step": 423466, "epoch": 5102} {"train_loss": -25.49500846862793, "global_step": 423467, "epoch": 5102} {"train_loss": -26.262327194213867, "global_step": 423468, "epoch": 5102} {"train_loss": -26.49091911315918, "global_step": 423469, "epoch": 5102} {"train_loss": -25.934524536132812, "global_step": 423470, "epoch": 5102} {"train_loss": -26.0156307220459, "global_step": 423471, "epoch": 5102} {"train_loss": -26.72544288635254, "global_step": 423472, "epoch": 5102} {"train_loss": -26.15363883972168, "global_step": 423473, "epoch": 5102} {"train_loss": -26.219568252563477, "global_step": 423474, "epoch": 5102} {"train_loss": -26.707717895507812, "global_step": 423475, "epoch": 5102} {"train_loss": -26.212682723999023, "global_step": 423476, "epoch": 5102} {"train_loss": -26.184675216674805, "global_step": 423477, "epoch": 5102} {"train_loss": -26.392736434936523, "global_step": 423478, "epoch": 5102} {"train_loss": -26.475427627563477, "global_step": 423479, "epoch": 5102} {"train_loss": -26.371601104736328, "global_step": 423480, "epoch": 5102} {"train_loss": -26.37070083618164, "global_step": 423481, "epoch": 5102} {"train_loss": -26.2952880859375, "global_step": 423482, "epoch": 5102} {"train_loss": -26.04456901550293, "global_step": 423483, "epoch": 5102} {"train_loss": -26.054157257080078, "global_step": 423484, "epoch": 5102} {"train_loss": -27.00086784362793, "global_step": 423485, "epoch": 5102} {"train_loss": -26.47515869140625, "global_step": 423486, "epoch": 5102} {"train_loss": -26.7061767578125, "global_step": 423487, "epoch": 5102} {"train_loss": -26.790205001831055, "global_step": 423488, "epoch": 5102} {"train_loss": -26.769006729125977, "global_step": 423489, "epoch": 5102} {"train_loss": -26.596067428588867, "global_step": 423490, "epoch": 5102} {"train_loss": -27.012683868408203, "global_step": 423491, "epoch": 5102} {"train_loss": -26.70440673828125, "global_step": 423492, "epoch": 5102} {"train_loss": -26.597553253173828, "global_step": 423493, "epoch": 5102} {"train_loss": -26.79839515686035, "global_step": 423494, "epoch": 5102} {"train_loss": -26.566617965698242, "global_step": 423495, "epoch": 5102} {"train_loss": -26.88734245300293, "global_step": 423496, "epoch": 5102} {"train_loss": -26.68414878845215, "global_step": 423497, "epoch": 5102} {"train_loss": -26.478368759155273, "global_step": 423498, "epoch": 5102} {"train_loss": -26.74884033203125, "global_step": 423499, "epoch": 5102} {"train_loss": -26.73238182067871, "global_step": 423500, "epoch": 5102} {"train_loss": -27.006591796875, "global_step": 423501, "epoch": 5102} {"train_loss": -27.051599502563477, "global_step": 423502, "epoch": 5102} {"train_loss": -27.10599136352539, "global_step": 423503, "epoch": 5102} {"train_loss": -26.73188591003418, "global_step": 423504, "epoch": 5102} {"train_loss": -26.849409103393555, "global_step": 423505, "epoch": 5102} {"train_loss": -26.777875900268555, "global_step": 423506, "epoch": 5102} {"train_loss": -27.164905548095703, "global_step": 423507, "epoch": 5102} {"train_loss": -26.753864288330078, "global_step": 423508, "epoch": 5102} {"train_loss": -26.6735897064209, "global_step": 423509, "epoch": 5102} {"train_loss": -27.0325870513916, "global_step": 423510, "epoch": 5102} {"train_loss": -26.966894149780273, "global_step": 423511, "epoch": 5102} {"train_loss": -27.013824462890625, "global_step": 423512, "epoch": 5102} {"train_loss": -26.725452423095703, "global_step": 423513, "epoch": 5102} {"train_loss": -27.188669204711914, "global_step": 423514, "epoch": 5102} {"train_loss": -27.482542037963867, "global_step": 423515, "epoch": 5102} {"train_loss": -26.894195556640625, "global_step": 423516, "epoch": 5102} {"train_loss": -27.084131240844727, "global_step": 423517, "epoch": 5102} {"train_loss": -26.783466339111328, "global_step": 423518, "epoch": 5102} {"train_loss": -26.81722068786621, "global_step": 423519, "epoch": 5102} {"train_loss": -26.918188095092773, "global_step": 423520, "epoch": 5102} {"train_loss": -26.95045280456543, "global_step": 423521, "epoch": 5102} {"train_loss": -26.819965362548828, "global_step": 423522, "epoch": 5102} {"train_loss": -26.840137481689453, "global_step": 423523, "epoch": 5102} {"train_loss": -26.59669303894043, "global_step": 423524, "epoch": 5102} {"train_loss": -27.105731964111328, "global_step": 423525, "epoch": 5102} {"train_loss": -26.6390438079834, "global_step": 423526, "epoch": 5102} {"train_loss": -26.407312393188477, "global_step": 423527, "epoch": 5102} {"train_loss": -25.727954864501953, "global_step": 423528, "epoch": 5102} {"train_loss": -25.358314514160156, "global_step": 423529, "epoch": 5102} {"train_loss": -25.783313751220703, "global_step": 423530, "epoch": 5102} {"train_loss": -26.8316707611084, "global_step": 423531, "epoch": 5102} {"train_loss": -26.336139678955078, "global_step": 423532, "epoch": 5102} {"train_loss": -26.406070709228516, "global_step": 423533, "epoch": 5102} {"train_loss": -26.602689743041992, "global_step": 423534, "epoch": 5102} {"train_loss": -26.427244186401367, "global_step": 423535, "epoch": 5102} {"train_loss": -26.584808349609375, "global_step": 423536, "epoch": 5102} {"train_loss": -26.123838424682617, "global_step": 423537, "epoch": 5102} {"train_loss": -26.3073787689209, "global_step": 423538, "epoch": 5102} {"train_loss": -26.316818237304688, "global_step": 423539, "epoch": 5102} {"train_loss": -26.341815948486328, "global_step": 423540, "epoch": 5102} {"train_loss": -25.972570419311523, "global_step": 423541, "epoch": 5102} {"train_loss": -26.70387077331543, "global_step": 423542, "epoch": 5102} {"train_loss": -26.42363929748535, "global_step": 423543, "epoch": 5102} {"train_loss": -26.408864974975586, "global_step": 423544, "epoch": 5102} {"train_loss": -26.797550201416016, "global_step": 423545, "epoch": 5102} {"train_loss": -26.213415145874023, "global_step": 423546, "epoch": 5102} {"train_loss": -26.5819034576416, "global_step": 423547, "epoch": 5102} {"train_loss": -26.573394338768647, "global_step": 423548, "epoch": 5102, "val_loss": 6941351.0} {"train_loss": -25.743261337280273, "global_step": 423549, "epoch": 5103} {"train_loss": -26.210779190063477, "global_step": 423550, "epoch": 5103} {"train_loss": -25.801483154296875, "global_step": 423551, "epoch": 5103} {"train_loss": -26.485315322875977, "global_step": 423552, "epoch": 5103} {"train_loss": -26.099340438842773, "global_step": 423553, "epoch": 5103} {"train_loss": -25.906591415405273, "global_step": 423554, "epoch": 5103} {"train_loss": -26.291818618774414, "global_step": 423555, "epoch": 5103} {"train_loss": -26.060880661010742, "global_step": 423556, "epoch": 5103} {"train_loss": -26.469934463500977, "global_step": 423557, "epoch": 5103} {"train_loss": -26.273096084594727, "global_step": 423558, "epoch": 5103} {"train_loss": -26.674253463745117, "global_step": 423559, "epoch": 5103} {"train_loss": -26.429956436157227, "global_step": 423560, "epoch": 5103} {"train_loss": -26.57869529724121, "global_step": 423561, "epoch": 5103} {"train_loss": -26.47564125061035, "global_step": 423562, "epoch": 5103} {"train_loss": -26.47330665588379, "global_step": 423563, "epoch": 5103} {"train_loss": -26.65899658203125, "global_step": 423564, "epoch": 5103} {"train_loss": -26.64369773864746, "global_step": 423565, "epoch": 5103} {"train_loss": -26.659780502319336, "global_step": 423566, "epoch": 5103} {"train_loss": -26.779865264892578, "global_step": 423567, "epoch": 5103} {"train_loss": -26.5496768951416, "global_step": 423568, "epoch": 5103} {"train_loss": -26.552703857421875, "global_step": 423569, "epoch": 5103} {"train_loss": -27.061859130859375, "global_step": 423570, "epoch": 5103} {"train_loss": -27.2880859375, "global_step": 423571, "epoch": 5103} {"train_loss": -26.52960777282715, "global_step": 423572, "epoch": 5103} {"train_loss": -26.861663818359375, "global_step": 423573, "epoch": 5103} {"train_loss": -26.705036163330078, "global_step": 423574, "epoch": 5103} {"train_loss": -26.770740509033203, "global_step": 423575, "epoch": 5103} {"train_loss": -26.896894454956055, "global_step": 423576, "epoch": 5103} {"train_loss": -26.8271427154541, "global_step": 423577, "epoch": 5103} {"train_loss": -26.851972579956055, "global_step": 423578, "epoch": 5103} {"train_loss": -26.99713134765625, "global_step": 423579, "epoch": 5103} {"train_loss": -27.19940757751465, "global_step": 423580, "epoch": 5103} {"train_loss": -27.10212516784668, "global_step": 423581, "epoch": 5103} {"train_loss": -26.667850494384766, "global_step": 423582, "epoch": 5103} {"train_loss": -27.014251708984375, "global_step": 423583, "epoch": 5103} {"train_loss": -26.914960861206055, "global_step": 423584, "epoch": 5103} {"train_loss": -26.926599502563477, "global_step": 423585, "epoch": 5103} {"train_loss": -26.783096313476562, "global_step": 423586, "epoch": 5103} {"train_loss": -26.93548011779785, "global_step": 423587, "epoch": 5103} {"train_loss": -26.663419723510742, "global_step": 423588, "epoch": 5103} {"train_loss": -26.870197296142578, "global_step": 423589, "epoch": 5103} {"train_loss": -26.362348556518555, "global_step": 423590, "epoch": 5103} {"train_loss": -26.99359703063965, "global_step": 423591, "epoch": 5103} {"train_loss": -27.00690269470215, "global_step": 423592, "epoch": 5103} {"train_loss": -26.7889461517334, "global_step": 423593, "epoch": 5103} {"train_loss": -27.061681747436523, "global_step": 423594, "epoch": 5103} {"train_loss": -26.621662139892578, "global_step": 423595, "epoch": 5103} {"train_loss": -26.75351905822754, "global_step": 423596, "epoch": 5103} {"train_loss": -27.151809692382812, "global_step": 423597, "epoch": 5103} {"train_loss": -26.6740665435791, "global_step": 423598, "epoch": 5103} {"train_loss": -26.982898712158203, "global_step": 423599, "epoch": 5103} {"train_loss": -26.998449325561523, "global_step": 423600, "epoch": 5103} {"train_loss": -26.598840713500977, "global_step": 423601, "epoch": 5103} {"train_loss": -26.979162216186523, "global_step": 423602, "epoch": 5103} {"train_loss": -26.395416259765625, "global_step": 423603, "epoch": 5103} {"train_loss": -27.07093620300293, "global_step": 423604, "epoch": 5103} {"train_loss": -26.643585205078125, "global_step": 423605, "epoch": 5103} {"train_loss": -26.765478134155273, "global_step": 423606, "epoch": 5103} {"train_loss": -26.689878463745117, "global_step": 423607, "epoch": 5103} {"train_loss": -26.644800186157227, "global_step": 423608, "epoch": 5103} {"train_loss": -26.410497665405273, "global_step": 423609, "epoch": 5103} {"train_loss": -27.06422233581543, "global_step": 423610, "epoch": 5103} {"train_loss": -26.89838981628418, "global_step": 423611, "epoch": 5103} {"train_loss": -26.82541847229004, "global_step": 423612, "epoch": 5103} {"train_loss": -27.133747100830078, "global_step": 423613, "epoch": 5103} {"train_loss": -27.169179916381836, "global_step": 423614, "epoch": 5103} {"train_loss": -26.965681076049805, "global_step": 423615, "epoch": 5103} {"train_loss": -26.825794219970703, "global_step": 423616, "epoch": 5103} {"train_loss": -27.055362701416016, "global_step": 423617, "epoch": 5103} {"train_loss": -26.606842041015625, "global_step": 423618, "epoch": 5103} {"train_loss": -26.984216690063477, "global_step": 423619, "epoch": 5103} {"train_loss": -27.21552848815918, "global_step": 423620, "epoch": 5103} {"train_loss": -26.856246948242188, "global_step": 423621, "epoch": 5103} {"train_loss": -27.02264404296875, "global_step": 423622, "epoch": 5103} {"train_loss": -27.216388702392578, "global_step": 423623, "epoch": 5103} {"train_loss": -26.929107666015625, "global_step": 423624, "epoch": 5103} {"train_loss": -26.696935653686523, "global_step": 423625, "epoch": 5103} {"train_loss": -27.35102653503418, "global_step": 423626, "epoch": 5103} {"train_loss": -27.06005859375, "global_step": 423627, "epoch": 5103} {"train_loss": -27.000961303710938, "global_step": 423628, "epoch": 5103} {"train_loss": -26.71087074279785, "global_step": 423629, "epoch": 5103} {"train_loss": -27.20468521118164, "global_step": 423630, "epoch": 5103} {"train_loss": -26.742964089634906, "global_step": 423631, "epoch": 5103, "val_loss": 6914509.5} {"train_loss": -26.298755645751953, "global_step": 423632, "epoch": 5104} {"train_loss": -26.230499267578125, "global_step": 423633, "epoch": 5104} {"train_loss": -26.717084884643555, "global_step": 423634, "epoch": 5104} {"train_loss": -25.97041893005371, "global_step": 423635, "epoch": 5104} {"train_loss": -26.0159912109375, "global_step": 423636, "epoch": 5104} {"train_loss": -26.18829345703125, "global_step": 423637, "epoch": 5104} {"train_loss": -26.20233726501465, "global_step": 423638, "epoch": 5104} {"train_loss": -26.40118980407715, "global_step": 423639, "epoch": 5104} {"train_loss": -26.733325958251953, "global_step": 423640, "epoch": 5104} {"train_loss": -26.563562393188477, "global_step": 423641, "epoch": 5104} {"train_loss": -26.35574722290039, "global_step": 423642, "epoch": 5104} {"train_loss": -26.47316551208496, "global_step": 423643, "epoch": 5104} {"train_loss": -26.7648983001709, "global_step": 423644, "epoch": 5104} {"train_loss": -26.42376136779785, "global_step": 423645, "epoch": 5104} {"train_loss": -26.47242546081543, "global_step": 423646, "epoch": 5104} {"train_loss": -26.557544708251953, "global_step": 423647, "epoch": 5104} {"train_loss": -26.478296279907227, "global_step": 423648, "epoch": 5104} {"train_loss": -26.511377334594727, "global_step": 423649, "epoch": 5104} {"train_loss": -26.879074096679688, "global_step": 423650, "epoch": 5104} {"train_loss": -26.888916015625, "global_step": 423651, "epoch": 5104} {"train_loss": -26.87916374206543, "global_step": 423652, "epoch": 5104} {"train_loss": -26.511920928955078, "global_step": 423653, "epoch": 5104} {"train_loss": -26.70603370666504, "global_step": 423654, "epoch": 5104} {"train_loss": -26.9656982421875, "global_step": 423655, "epoch": 5104} {"train_loss": -26.76067543029785, "global_step": 423656, "epoch": 5104} {"train_loss": -26.572702407836914, "global_step": 423657, "epoch": 5104} {"train_loss": -26.49091148376465, "global_step": 423658, "epoch": 5104} {"train_loss": -26.406814575195312, "global_step": 423659, "epoch": 5104} {"train_loss": -26.77927589416504, "global_step": 423660, "epoch": 5104} {"train_loss": -26.942052841186523, "global_step": 423661, "epoch": 5104} {"train_loss": -26.548669815063477, "global_step": 423662, "epoch": 5104} {"train_loss": -26.533145904541016, "global_step": 423663, "epoch": 5104} {"train_loss": -26.8416690826416, "global_step": 423664, "epoch": 5104} {"train_loss": -26.937341690063477, "global_step": 423665, "epoch": 5104} {"train_loss": -26.9096736907959, "global_step": 423666, "epoch": 5104} {"train_loss": -27.094135284423828, "global_step": 423667, "epoch": 5104} {"train_loss": -26.94911003112793, "global_step": 423668, "epoch": 5104} {"train_loss": -26.902368545532227, "global_step": 423669, "epoch": 5104} {"train_loss": -26.920080184936523, "global_step": 423670, "epoch": 5104} {"train_loss": -26.980484008789062, "global_step": 423671, "epoch": 5104} {"train_loss": -27.34055519104004, "global_step": 423672, "epoch": 5104} {"train_loss": -26.655725479125977, "global_step": 423673, "epoch": 5104} {"train_loss": -26.87339210510254, "global_step": 423674, "epoch": 5104} {"train_loss": -26.6909236907959, "global_step": 423675, "epoch": 5104} {"train_loss": -26.76340675354004, "global_step": 423676, "epoch": 5104} {"train_loss": -26.98187255859375, "global_step": 423677, "epoch": 5104} {"train_loss": -27.55535316467285, "global_step": 423678, "epoch": 5104} {"train_loss": -26.8206787109375, "global_step": 423679, "epoch": 5104} {"train_loss": -27.17219352722168, "global_step": 423680, "epoch": 5104} {"train_loss": -26.881072998046875, "global_step": 423681, "epoch": 5104} {"train_loss": -26.986547470092773, "global_step": 423682, "epoch": 5104} {"train_loss": -27.188919067382812, "global_step": 423683, "epoch": 5104} {"train_loss": -26.9261474609375, "global_step": 423684, "epoch": 5104} {"train_loss": -26.793188095092773, "global_step": 423685, "epoch": 5104} {"train_loss": -26.948556900024414, "global_step": 423686, "epoch": 5104} {"train_loss": -27.06585121154785, "global_step": 423687, "epoch": 5104} {"train_loss": -26.7120304107666, "global_step": 423688, "epoch": 5104} {"train_loss": -26.321008682250977, "global_step": 423689, "epoch": 5104} {"train_loss": -26.110218048095703, "global_step": 423690, "epoch": 5104} {"train_loss": -25.67608642578125, "global_step": 423691, "epoch": 5104} {"train_loss": -25.641321182250977, "global_step": 423692, "epoch": 5104} {"train_loss": -25.845733642578125, "global_step": 423693, "epoch": 5104} {"train_loss": -26.375152587890625, "global_step": 423694, "epoch": 5104} {"train_loss": -26.060815811157227, "global_step": 423695, "epoch": 5104} {"train_loss": -25.788604736328125, "global_step": 423696, "epoch": 5104} {"train_loss": -26.238723754882812, "global_step": 423697, "epoch": 5104} {"train_loss": -25.92105484008789, "global_step": 423698, "epoch": 5104} {"train_loss": -26.09396743774414, "global_step": 423699, "epoch": 5104} {"train_loss": -26.32486343383789, "global_step": 423700, "epoch": 5104} {"train_loss": -26.5454158782959, "global_step": 423701, "epoch": 5104} {"train_loss": -26.10809326171875, "global_step": 423702, "epoch": 5104} {"train_loss": -26.601892471313477, "global_step": 423703, "epoch": 5104} {"train_loss": -26.56625747680664, "global_step": 423704, "epoch": 5104} {"train_loss": -25.793081283569336, "global_step": 423705, "epoch": 5104} {"train_loss": -26.920230865478516, "global_step": 423706, "epoch": 5104} {"train_loss": -26.047332763671875, "global_step": 423707, "epoch": 5104} {"train_loss": -26.400588989257812, "global_step": 423708, "epoch": 5104} {"train_loss": -26.5108642578125, "global_step": 423709, "epoch": 5104} {"train_loss": -26.68914794921875, "global_step": 423710, "epoch": 5104} {"train_loss": -26.01043701171875, "global_step": 423711, "epoch": 5104} {"train_loss": -26.8674259185791, "global_step": 423712, "epoch": 5104} {"train_loss": -26.748779296875, "global_step": 423713, "epoch": 5104} {"train_loss": -26.57512046630124, "global_step": 423714, "epoch": 5104, "val_loss": 6944670.0} {"train_loss": -25.412174224853516, "global_step": 423715, "epoch": 5105} {"train_loss": -26.260984420776367, "global_step": 423716, "epoch": 5105} {"train_loss": -25.368228912353516, "global_step": 423717, "epoch": 5105} {"train_loss": -25.83932876586914, "global_step": 423718, "epoch": 5105} {"train_loss": -26.16948890686035, "global_step": 423719, "epoch": 5105} {"train_loss": -26.3775691986084, "global_step": 423720, "epoch": 5105} {"train_loss": -25.6259822845459, "global_step": 423721, "epoch": 5105} {"train_loss": -26.15407371520996, "global_step": 423722, "epoch": 5105} {"train_loss": -25.883197784423828, "global_step": 423723, "epoch": 5105} {"train_loss": -26.289566040039062, "global_step": 423724, "epoch": 5105} {"train_loss": -26.09006690979004, "global_step": 423725, "epoch": 5105} {"train_loss": -26.41202163696289, "global_step": 423726, "epoch": 5105} {"train_loss": -26.3223876953125, "global_step": 423727, "epoch": 5105} {"train_loss": -25.91658592224121, "global_step": 423728, "epoch": 5105} {"train_loss": -26.42901611328125, "global_step": 423729, "epoch": 5105} {"train_loss": -26.281766891479492, "global_step": 423730, "epoch": 5105} {"train_loss": -26.45771598815918, "global_step": 423731, "epoch": 5105} {"train_loss": -26.36789321899414, "global_step": 423732, "epoch": 5105} {"train_loss": -26.447513580322266, "global_step": 423733, "epoch": 5105} {"train_loss": -26.539215087890625, "global_step": 423734, "epoch": 5105} {"train_loss": -26.56922721862793, "global_step": 423735, "epoch": 5105} {"train_loss": -26.204086303710938, "global_step": 423736, "epoch": 5105} {"train_loss": -27.005849838256836, "global_step": 423737, "epoch": 5105} {"train_loss": -26.808460235595703, "global_step": 423738, "epoch": 5105} {"train_loss": -26.276636123657227, "global_step": 423739, "epoch": 5105} {"train_loss": -26.724821090698242, "global_step": 423740, "epoch": 5105} {"train_loss": -26.614715576171875, "global_step": 423741, "epoch": 5105} {"train_loss": -26.461462020874023, "global_step": 423742, "epoch": 5105} {"train_loss": -26.757400512695312, "global_step": 423743, "epoch": 5105} {"train_loss": -27.071134567260742, "global_step": 423744, "epoch": 5105} {"train_loss": -26.8583927154541, "global_step": 423745, "epoch": 5105} {"train_loss": -27.01837158203125, "global_step": 423746, "epoch": 5105} {"train_loss": -26.941640853881836, "global_step": 423747, "epoch": 5105} {"train_loss": -26.486780166625977, "global_step": 423748, "epoch": 5105} {"train_loss": -26.96257972717285, "global_step": 423749, "epoch": 5105} {"train_loss": -26.6103515625, "global_step": 423750, "epoch": 5105} {"train_loss": -27.092618942260742, "global_step": 423751, "epoch": 5105} {"train_loss": -27.04737663269043, "global_step": 423752, "epoch": 5105} {"train_loss": -27.085153579711914, "global_step": 423753, "epoch": 5105} {"train_loss": -27.20607566833496, "global_step": 423754, "epoch": 5105} {"train_loss": -27.122161865234375, "global_step": 423755, "epoch": 5105} {"train_loss": -27.399810791015625, "global_step": 423756, "epoch": 5105} {"train_loss": -26.9620304107666, "global_step": 423757, "epoch": 5105} {"train_loss": -26.6954345703125, "global_step": 423758, "epoch": 5105} {"train_loss": -27.18729591369629, "global_step": 423759, "epoch": 5105} {"train_loss": -26.839111328125, "global_step": 423760, "epoch": 5105} {"train_loss": -27.046009063720703, "global_step": 423761, "epoch": 5105} {"train_loss": -26.644784927368164, "global_step": 423762, "epoch": 5105} {"train_loss": -27.32757568359375, "global_step": 423763, "epoch": 5105} {"train_loss": -26.7818546295166, "global_step": 423764, "epoch": 5105} {"train_loss": -27.074508666992188, "global_step": 423765, "epoch": 5105} {"train_loss": -26.916059494018555, "global_step": 423766, "epoch": 5105} {"train_loss": -26.9718017578125, "global_step": 423767, "epoch": 5105} {"train_loss": -26.568567276000977, "global_step": 423768, "epoch": 5105} {"train_loss": -26.780820846557617, "global_step": 423769, "epoch": 5105} {"train_loss": -26.65606117248535, "global_step": 423770, "epoch": 5105} {"train_loss": -26.737211227416992, "global_step": 423771, "epoch": 5105} {"train_loss": -26.897851943969727, "global_step": 423772, "epoch": 5105} {"train_loss": -26.654199600219727, "global_step": 423773, "epoch": 5105} {"train_loss": -26.979101181030273, "global_step": 423774, "epoch": 5105} {"train_loss": -26.856647491455078, "global_step": 423775, "epoch": 5105} {"train_loss": -26.551828384399414, "global_step": 423776, "epoch": 5105} {"train_loss": -26.068601608276367, "global_step": 423777, "epoch": 5105} {"train_loss": -25.872756958007812, "global_step": 423778, "epoch": 5105} {"train_loss": -25.39503288269043, "global_step": 423779, "epoch": 5105} {"train_loss": -25.14969825744629, "global_step": 423780, "epoch": 5105} {"train_loss": -25.974958419799805, "global_step": 423781, "epoch": 5105} {"train_loss": -26.54889488220215, "global_step": 423782, "epoch": 5105} {"train_loss": -25.868833541870117, "global_step": 423783, "epoch": 5105} {"train_loss": -26.316471099853516, "global_step": 423784, "epoch": 5105} {"train_loss": -26.55905532836914, "global_step": 423785, "epoch": 5105} {"train_loss": -25.706775665283203, "global_step": 423786, "epoch": 5105} {"train_loss": -26.214643478393555, "global_step": 423787, "epoch": 5105} {"train_loss": -26.180898666381836, "global_step": 423788, "epoch": 5105} {"train_loss": -26.45672035217285, "global_step": 423789, "epoch": 5105} {"train_loss": -26.354211807250977, "global_step": 423790, "epoch": 5105} {"train_loss": -26.578344345092773, "global_step": 423791, "epoch": 5105} {"train_loss": -26.421661376953125, "global_step": 423792, "epoch": 5105} {"train_loss": -26.81882667541504, "global_step": 423793, "epoch": 5105} {"train_loss": -26.268646240234375, "global_step": 423794, "epoch": 5105} {"train_loss": -26.282245635986328, "global_step": 423795, "epoch": 5105} {"train_loss": -26.91354751586914, "global_step": 423796, "epoch": 5105} {"train_loss": -26.505570859794158, "global_step": 423797, "epoch": 5105, "val_loss": 6913969.0} {"train_loss": -25.654478073120117, "global_step": 423798, "epoch": 5106} {"train_loss": -26.157596588134766, "global_step": 423799, "epoch": 5106} {"train_loss": -25.872419357299805, "global_step": 423800, "epoch": 5106} {"train_loss": -26.16126823425293, "global_step": 423801, "epoch": 5106} {"train_loss": -26.068933486938477, "global_step": 423802, "epoch": 5106} {"train_loss": -26.205305099487305, "global_step": 423803, "epoch": 5106} {"train_loss": -25.9923038482666, "global_step": 423804, "epoch": 5106} {"train_loss": -26.40060806274414, "global_step": 423805, "epoch": 5106} {"train_loss": -26.37708854675293, "global_step": 423806, "epoch": 5106} {"train_loss": -26.4449405670166, "global_step": 423807, "epoch": 5106} {"train_loss": -26.020099639892578, "global_step": 423808, "epoch": 5106} {"train_loss": -26.348905563354492, "global_step": 423809, "epoch": 5106} {"train_loss": -26.52361488342285, "global_step": 423810, "epoch": 5106} {"train_loss": -26.37967872619629, "global_step": 423811, "epoch": 5106} {"train_loss": -26.776357650756836, "global_step": 423812, "epoch": 5106} {"train_loss": -26.7291316986084, "global_step": 423813, "epoch": 5106} {"train_loss": -26.562768936157227, "global_step": 423814, "epoch": 5106} {"train_loss": -26.425500869750977, "global_step": 423815, "epoch": 5106} {"train_loss": -26.541706085205078, "global_step": 423816, "epoch": 5106} {"train_loss": -26.77764892578125, "global_step": 423817, "epoch": 5106} {"train_loss": -26.4185791015625, "global_step": 423818, "epoch": 5106} {"train_loss": -26.584455490112305, "global_step": 423819, "epoch": 5106} {"train_loss": -26.210681915283203, "global_step": 423820, "epoch": 5106} {"train_loss": -26.93463706970215, "global_step": 423821, "epoch": 5106} {"train_loss": -26.597349166870117, "global_step": 423822, "epoch": 5106} {"train_loss": -26.695209503173828, "global_step": 423823, "epoch": 5106} {"train_loss": -27.106786727905273, "global_step": 423824, "epoch": 5106} {"train_loss": -26.793292999267578, "global_step": 423825, "epoch": 5106} {"train_loss": -26.602752685546875, "global_step": 423826, "epoch": 5106} {"train_loss": -26.878881454467773, "global_step": 423827, "epoch": 5106} {"train_loss": -26.7021484375, "global_step": 423828, "epoch": 5106} {"train_loss": -26.869291305541992, "global_step": 423829, "epoch": 5106} {"train_loss": -26.711572647094727, "global_step": 423830, "epoch": 5106} {"train_loss": -26.79880714416504, "global_step": 423831, "epoch": 5106} {"train_loss": -26.673450469970703, "global_step": 423832, "epoch": 5106} {"train_loss": -26.65546226501465, "global_step": 423833, "epoch": 5106} {"train_loss": -26.870880126953125, "global_step": 423834, "epoch": 5106} {"train_loss": -26.980411529541016, "global_step": 423835, "epoch": 5106} {"train_loss": -26.7622127532959, "global_step": 423836, "epoch": 5106} {"train_loss": -27.641040802001953, "global_step": 423837, "epoch": 5106} {"train_loss": -26.969486236572266, "global_step": 423838, "epoch": 5106} {"train_loss": -26.79616355895996, "global_step": 423839, "epoch": 5106} {"train_loss": -27.088577270507812, "global_step": 423840, "epoch": 5106} {"train_loss": -26.846582412719727, "global_step": 423841, "epoch": 5106} {"train_loss": -26.70623779296875, "global_step": 423842, "epoch": 5106} {"train_loss": -26.705917358398438, "global_step": 423843, "epoch": 5106} {"train_loss": -26.913516998291016, "global_step": 423844, "epoch": 5106} {"train_loss": -26.65338134765625, "global_step": 423845, "epoch": 5106} {"train_loss": -27.126577377319336, "global_step": 423846, "epoch": 5106} {"train_loss": -26.9601993560791, "global_step": 423847, "epoch": 5106} {"train_loss": -26.996057510375977, "global_step": 423848, "epoch": 5106} {"train_loss": -26.73495864868164, "global_step": 423849, "epoch": 5106} {"train_loss": -26.650287628173828, "global_step": 423850, "epoch": 5106} {"train_loss": -26.383808135986328, "global_step": 423851, "epoch": 5106} {"train_loss": -26.056690216064453, "global_step": 423852, "epoch": 5106} {"train_loss": -24.51068115234375, "global_step": 423853, "epoch": 5106} {"train_loss": -25.42166519165039, "global_step": 423854, "epoch": 5106} {"train_loss": -26.605224609375, "global_step": 423855, "epoch": 5106} {"train_loss": -26.1575927734375, "global_step": 423856, "epoch": 5106} {"train_loss": -26.143136978149414, "global_step": 423857, "epoch": 5106} {"train_loss": -26.38752555847168, "global_step": 423858, "epoch": 5106} {"train_loss": -26.6920108795166, "global_step": 423859, "epoch": 5106} {"train_loss": -26.210540771484375, "global_step": 423860, "epoch": 5106} {"train_loss": -26.636062622070312, "global_step": 423861, "epoch": 5106} {"train_loss": -26.50191307067871, "global_step": 423862, "epoch": 5106} {"train_loss": -26.5239200592041, "global_step": 423863, "epoch": 5106} {"train_loss": -26.148069381713867, "global_step": 423864, "epoch": 5106} {"train_loss": -26.440710067749023, "global_step": 423865, "epoch": 5106} {"train_loss": -26.2495174407959, "global_step": 423866, "epoch": 5106} {"train_loss": -26.171619415283203, "global_step": 423867, "epoch": 5106} {"train_loss": -26.331497192382812, "global_step": 423868, "epoch": 5106} {"train_loss": -25.95804214477539, "global_step": 423869, "epoch": 5106} {"train_loss": -26.456018447875977, "global_step": 423870, "epoch": 5106} {"train_loss": -26.28220558166504, "global_step": 423871, "epoch": 5106} {"train_loss": -26.1964111328125, "global_step": 423872, "epoch": 5106} {"train_loss": -26.498077392578125, "global_step": 423873, "epoch": 5106} {"train_loss": -26.5194091796875, "global_step": 423874, "epoch": 5106} {"train_loss": -26.169469833374023, "global_step": 423875, "epoch": 5106} {"train_loss": -26.556867599487305, "global_step": 423876, "epoch": 5106} {"train_loss": -26.196802139282227, "global_step": 423877, "epoch": 5106} {"train_loss": -26.494617462158203, "global_step": 423878, "epoch": 5106} {"train_loss": -26.445343017578125, "global_step": 423879, "epoch": 5106} {"train_loss": -26.50608269565077, "global_step": 423880, "epoch": 5106, "val_loss": 6911189.0} {"train_loss": -26.08832359313965, "global_step": 423881, "epoch": 5107} {"train_loss": -25.807647705078125, "global_step": 423882, "epoch": 5107} {"train_loss": -26.748559951782227, "global_step": 423883, "epoch": 5107} {"train_loss": -26.34527015686035, "global_step": 423884, "epoch": 5107} {"train_loss": -26.708677291870117, "global_step": 423885, "epoch": 5107} {"train_loss": -26.363128662109375, "global_step": 423886, "epoch": 5107} {"train_loss": -26.54652976989746, "global_step": 423887, "epoch": 5107} {"train_loss": -26.463428497314453, "global_step": 423888, "epoch": 5107} {"train_loss": -26.419269561767578, "global_step": 423889, "epoch": 5107} {"train_loss": -26.6105899810791, "global_step": 423890, "epoch": 5107} {"train_loss": -26.633962631225586, "global_step": 423891, "epoch": 5107} {"train_loss": -26.51908302307129, "global_step": 423892, "epoch": 5107} {"train_loss": -26.65437889099121, "global_step": 423893, "epoch": 5107} {"train_loss": -26.753040313720703, "global_step": 423894, "epoch": 5107} {"train_loss": -26.71306800842285, "global_step": 423895, "epoch": 5107} {"train_loss": -26.52862548828125, "global_step": 423896, "epoch": 5107} {"train_loss": -26.7895565032959, "global_step": 423897, "epoch": 5107} {"train_loss": -26.88832664489746, "global_step": 423898, "epoch": 5107} {"train_loss": -26.813724517822266, "global_step": 423899, "epoch": 5107} {"train_loss": -26.876148223876953, "global_step": 423900, "epoch": 5107} {"train_loss": -26.514551162719727, "global_step": 423901, "epoch": 5107} {"train_loss": -27.044876098632812, "global_step": 423902, "epoch": 5107} {"train_loss": -26.5933895111084, "global_step": 423903, "epoch": 5107} {"train_loss": -26.9356689453125, "global_step": 423904, "epoch": 5107} {"train_loss": -26.894575119018555, "global_step": 423905, "epoch": 5107} {"train_loss": -26.86995506286621, "global_step": 423906, "epoch": 5107} {"train_loss": -26.978137969970703, "global_step": 423907, "epoch": 5107} {"train_loss": -27.468725204467773, "global_step": 423908, "epoch": 5107} {"train_loss": -27.04778480529785, "global_step": 423909, "epoch": 5107} {"train_loss": -27.179346084594727, "global_step": 423910, "epoch": 5107} {"train_loss": -26.85499382019043, "global_step": 423911, "epoch": 5107} {"train_loss": -27.012104034423828, "global_step": 423912, "epoch": 5107} {"train_loss": -27.074365615844727, "global_step": 423913, "epoch": 5107} {"train_loss": -27.185653686523438, "global_step": 423914, "epoch": 5107} {"train_loss": -26.931608200073242, "global_step": 423915, "epoch": 5107} {"train_loss": -26.551410675048828, "global_step": 423916, "epoch": 5107} {"train_loss": -26.971649169921875, "global_step": 423917, "epoch": 5107} {"train_loss": -27.1458740234375, "global_step": 423918, "epoch": 5107} {"train_loss": -26.882694244384766, "global_step": 423919, "epoch": 5107} {"train_loss": -26.84177589416504, "global_step": 423920, "epoch": 5107} {"train_loss": -26.90559959411621, "global_step": 423921, "epoch": 5107} {"train_loss": -26.971393585205078, "global_step": 423922, "epoch": 5107} {"train_loss": -27.070178985595703, "global_step": 423923, "epoch": 5107} {"train_loss": -26.90152359008789, "global_step": 423924, "epoch": 5107} {"train_loss": -26.875513076782227, "global_step": 423925, "epoch": 5107} {"train_loss": -26.8994140625, "global_step": 423926, "epoch": 5107} {"train_loss": -27.014667510986328, "global_step": 423927, "epoch": 5107} {"train_loss": -27.007978439331055, "global_step": 423928, "epoch": 5107} {"train_loss": -27.318439483642578, "global_step": 423929, "epoch": 5107} {"train_loss": -26.863183975219727, "global_step": 423930, "epoch": 5107} {"train_loss": -26.573713302612305, "global_step": 423931, "epoch": 5107} {"train_loss": -26.91523551940918, "global_step": 423932, "epoch": 5107} {"train_loss": -26.908660888671875, "global_step": 423933, "epoch": 5107} {"train_loss": -27.350269317626953, "global_step": 423934, "epoch": 5107} {"train_loss": -27.148609161376953, "global_step": 423935, "epoch": 5107} {"train_loss": -27.29938316345215, "global_step": 423936, "epoch": 5107} {"train_loss": -27.210485458374023, "global_step": 423937, "epoch": 5107} {"train_loss": -27.158966064453125, "global_step": 423938, "epoch": 5107} {"train_loss": -26.85529899597168, "global_step": 423939, "epoch": 5107} {"train_loss": -26.748926162719727, "global_step": 423940, "epoch": 5107} {"train_loss": -26.86577796936035, "global_step": 423941, "epoch": 5107} {"train_loss": -27.114181518554688, "global_step": 423942, "epoch": 5107} {"train_loss": -27.116724014282227, "global_step": 423943, "epoch": 5107} {"train_loss": -26.958026885986328, "global_step": 423944, "epoch": 5107} {"train_loss": -26.803918838500977, "global_step": 423945, "epoch": 5107} {"train_loss": -26.946399688720703, "global_step": 423946, "epoch": 5107} {"train_loss": -26.910688400268555, "global_step": 423947, "epoch": 5107} {"train_loss": -26.91059684753418, "global_step": 423948, "epoch": 5107} {"train_loss": -27.087961196899414, "global_step": 423949, "epoch": 5107} {"train_loss": -26.963708877563477, "global_step": 423950, "epoch": 5107} {"train_loss": -26.902179718017578, "global_step": 423951, "epoch": 5107} {"train_loss": -26.6329402923584, "global_step": 423952, "epoch": 5107} {"train_loss": -26.650787353515625, "global_step": 423953, "epoch": 5107} {"train_loss": -26.81162452697754, "global_step": 423954, "epoch": 5107} {"train_loss": -26.550373077392578, "global_step": 423955, "epoch": 5107} {"train_loss": -26.96963882446289, "global_step": 423956, "epoch": 5107} {"train_loss": -26.191944122314453, "global_step": 423957, "epoch": 5107} {"train_loss": -26.93946647644043, "global_step": 423958, "epoch": 5107} {"train_loss": -26.266443252563477, "global_step": 423959, "epoch": 5107} {"train_loss": -25.993728637695312, "global_step": 423960, "epoch": 5107} {"train_loss": -26.363941192626953, "global_step": 423961, "epoch": 5107} {"train_loss": -26.82868003845215, "global_step": 423962, "epoch": 5107} {"train_loss": -26.8163380450513, "global_step": 423963, "epoch": 5107, "val_loss": 6772427.5} {"train_loss": -25.51408576965332, "global_step": 423964, "epoch": 5108} {"train_loss": -25.423507690429688, "global_step": 423965, "epoch": 5108} {"train_loss": -25.384580612182617, "global_step": 423966, "epoch": 5108} {"train_loss": -25.5311336517334, "global_step": 423967, "epoch": 5108} {"train_loss": -25.679553985595703, "global_step": 423968, "epoch": 5108} {"train_loss": -25.228227615356445, "global_step": 423969, "epoch": 5108} {"train_loss": -25.39003562927246, "global_step": 423970, "epoch": 5108} {"train_loss": -25.7730712890625, "global_step": 423971, "epoch": 5108} {"train_loss": -26.37566566467285, "global_step": 423972, "epoch": 5108} {"train_loss": -26.27301025390625, "global_step": 423973, "epoch": 5108} {"train_loss": -25.719928741455078, "global_step": 423974, "epoch": 5108} {"train_loss": -26.177814483642578, "global_step": 423975, "epoch": 5108} {"train_loss": -25.89044761657715, "global_step": 423976, "epoch": 5108} {"train_loss": -26.256757736206055, "global_step": 423977, "epoch": 5108} {"train_loss": -26.14313316345215, "global_step": 423978, "epoch": 5108} {"train_loss": -26.388044357299805, "global_step": 423979, "epoch": 5108} {"train_loss": -26.201337814331055, "global_step": 423980, "epoch": 5108} {"train_loss": -26.3668155670166, "global_step": 423981, "epoch": 5108} {"train_loss": -25.986637115478516, "global_step": 423982, "epoch": 5108} {"train_loss": -26.18330955505371, "global_step": 423983, "epoch": 5108} {"train_loss": -26.434040069580078, "global_step": 423984, "epoch": 5108} {"train_loss": -26.287641525268555, "global_step": 423985, "epoch": 5108} {"train_loss": -26.549015045166016, "global_step": 423986, "epoch": 5108} {"train_loss": -26.58635902404785, "global_step": 423987, "epoch": 5108} {"train_loss": -26.503463745117188, "global_step": 423988, "epoch": 5108} {"train_loss": -26.506210327148438, "global_step": 423989, "epoch": 5108} {"train_loss": -26.557586669921875, "global_step": 423990, "epoch": 5108} {"train_loss": -26.506820678710938, "global_step": 423991, "epoch": 5108} {"train_loss": -26.419082641601562, "global_step": 423992, "epoch": 5108} {"train_loss": -26.64447021484375, "global_step": 423993, "epoch": 5108} {"train_loss": -26.59560203552246, "global_step": 423994, "epoch": 5108} {"train_loss": -26.76993751525879, "global_step": 423995, "epoch": 5108} {"train_loss": -26.674530029296875, "global_step": 423996, "epoch": 5108} {"train_loss": -26.905963897705078, "global_step": 423997, "epoch": 5108} {"train_loss": -26.832571029663086, "global_step": 423998, "epoch": 5108} {"train_loss": -26.883520126342773, "global_step": 423999, "epoch": 5108} {"train_loss": -26.753131866455078, "global_step": 424000, "epoch": 5108} {"train_loss": -26.796483993530273, "global_step": 424001, "epoch": 5108} {"train_loss": -27.00861167907715, "global_step": 424002, "epoch": 5108} {"train_loss": -26.317733764648438, "global_step": 424003, "epoch": 5108} {"train_loss": -26.6544189453125, "global_step": 424004, "epoch": 5108} {"train_loss": -26.975574493408203, "global_step": 424005, "epoch": 5108} {"train_loss": -26.800628662109375, "global_step": 424006, "epoch": 5108} {"train_loss": -26.920562744140625, "global_step": 424007, "epoch": 5108} {"train_loss": -26.342132568359375, "global_step": 424008, "epoch": 5108} {"train_loss": -26.913040161132812, "global_step": 424009, "epoch": 5108} {"train_loss": -27.07826805114746, "global_step": 424010, "epoch": 5108} {"train_loss": -26.79021644592285, "global_step": 424011, "epoch": 5108} {"train_loss": -27.006000518798828, "global_step": 424012, "epoch": 5108} {"train_loss": -26.7900333404541, "global_step": 424013, "epoch": 5108} {"train_loss": -27.03261375427246, "global_step": 424014, "epoch": 5108} {"train_loss": -26.959674835205078, "global_step": 424015, "epoch": 5108} {"train_loss": -27.11941909790039, "global_step": 424016, "epoch": 5108} {"train_loss": -26.886098861694336, "global_step": 424017, "epoch": 5108} {"train_loss": -26.81403160095215, "global_step": 424018, "epoch": 5108} {"train_loss": -26.8376407623291, "global_step": 424019, "epoch": 5108} {"train_loss": -27.1652774810791, "global_step": 424020, "epoch": 5108} {"train_loss": -26.835071563720703, "global_step": 424021, "epoch": 5108} {"train_loss": -26.886159896850586, "global_step": 424022, "epoch": 5108} {"train_loss": -27.13913917541504, "global_step": 424023, "epoch": 5108} {"train_loss": -27.25751304626465, "global_step": 424024, "epoch": 5108} {"train_loss": -27.176694869995117, "global_step": 424025, "epoch": 5108} {"train_loss": -27.002954483032227, "global_step": 424026, "epoch": 5108} {"train_loss": -27.469655990600586, "global_step": 424027, "epoch": 5108} {"train_loss": -26.838241577148438, "global_step": 424028, "epoch": 5108} {"train_loss": -26.613698959350586, "global_step": 424029, "epoch": 5108} {"train_loss": -27.273229598999023, "global_step": 424030, "epoch": 5108} {"train_loss": -26.491540908813477, "global_step": 424031, "epoch": 5108} {"train_loss": -26.960742950439453, "global_step": 424032, "epoch": 5108} {"train_loss": -27.087417602539062, "global_step": 424033, "epoch": 5108} {"train_loss": -27.06052589416504, "global_step": 424034, "epoch": 5108} {"train_loss": -27.14944839477539, "global_step": 424035, "epoch": 5108} {"train_loss": -26.926517486572266, "global_step": 424036, "epoch": 5108} {"train_loss": -26.843460083007812, "global_step": 424037, "epoch": 5108} {"train_loss": -26.87091636657715, "global_step": 424038, "epoch": 5108} {"train_loss": -26.682687759399414, "global_step": 424039, "epoch": 5108} {"train_loss": -26.993534088134766, "global_step": 424040, "epoch": 5108} {"train_loss": -26.5673885345459, "global_step": 424041, "epoch": 5108} {"train_loss": -26.186819076538086, "global_step": 424042, "epoch": 5108} {"train_loss": -26.820249557495117, "global_step": 424043, "epoch": 5108} {"train_loss": -26.615726470947266, "global_step": 424044, "epoch": 5108} {"train_loss": -26.583959579467773, "global_step": 424045, "epoch": 5108} {"train_loss": -26.604937633836126, "global_step": 424046, "epoch": 5108, "val_loss": 6880935.5} {"train_loss": -26.486724853515625, "global_step": 424047, "epoch": 5109} {"train_loss": -26.74753761291504, "global_step": 424048, "epoch": 5109} {"train_loss": -26.648468017578125, "global_step": 424049, "epoch": 5109} {"train_loss": -26.3687744140625, "global_step": 424050, "epoch": 5109} {"train_loss": -26.582571029663086, "global_step": 424051, "epoch": 5109} {"train_loss": -26.233572006225586, "global_step": 424052, "epoch": 5109} {"train_loss": -26.343957901000977, "global_step": 424053, "epoch": 5109} {"train_loss": -26.898252487182617, "global_step": 424054, "epoch": 5109} {"train_loss": -26.63154411315918, "global_step": 424055, "epoch": 5109} {"train_loss": -26.79897117614746, "global_step": 424056, "epoch": 5109} {"train_loss": -26.899991989135742, "global_step": 424057, "epoch": 5109} {"train_loss": -26.414899826049805, "global_step": 424058, "epoch": 5109} {"train_loss": -26.88933753967285, "global_step": 424059, "epoch": 5109} {"train_loss": -27.0428409576416, "global_step": 424060, "epoch": 5109} {"train_loss": -26.636743545532227, "global_step": 424061, "epoch": 5109} {"train_loss": -27.014999389648438, "global_step": 424062, "epoch": 5109} {"train_loss": -26.918506622314453, "global_step": 424063, "epoch": 5109} {"train_loss": -26.520160675048828, "global_step": 424064, "epoch": 5109} {"train_loss": -27.13392448425293, "global_step": 424065, "epoch": 5109} {"train_loss": -27.0871524810791, "global_step": 424066, "epoch": 5109} {"train_loss": -26.77446937561035, "global_step": 424067, "epoch": 5109} {"train_loss": -26.972936630249023, "global_step": 424068, "epoch": 5109} {"train_loss": -27.0937442779541, "global_step": 424069, "epoch": 5109} {"train_loss": -26.467382431030273, "global_step": 424070, "epoch": 5109} {"train_loss": -26.76824951171875, "global_step": 424071, "epoch": 5109} {"train_loss": -26.868213653564453, "global_step": 424072, "epoch": 5109} {"train_loss": -26.927778244018555, "global_step": 424073, "epoch": 5109} {"train_loss": -27.173080444335938, "global_step": 424074, "epoch": 5109} {"train_loss": -26.87171745300293, "global_step": 424075, "epoch": 5109} {"train_loss": -26.6510009765625, "global_step": 424076, "epoch": 5109} {"train_loss": -26.88812828063965, "global_step": 424077, "epoch": 5109} {"train_loss": -27.1307373046875, "global_step": 424078, "epoch": 5109} {"train_loss": -26.982770919799805, "global_step": 424079, "epoch": 5109} {"train_loss": -26.945953369140625, "global_step": 424080, "epoch": 5109} {"train_loss": -26.94437026977539, "global_step": 424081, "epoch": 5109} {"train_loss": -27.014209747314453, "global_step": 424082, "epoch": 5109} {"train_loss": -26.685546875, "global_step": 424083, "epoch": 5109} {"train_loss": -26.649738311767578, "global_step": 424084, "epoch": 5109} {"train_loss": -26.751495361328125, "global_step": 424085, "epoch": 5109} {"train_loss": -27.416616439819336, "global_step": 424086, "epoch": 5109} {"train_loss": -26.935659408569336, "global_step": 424087, "epoch": 5109} {"train_loss": -26.978580474853516, "global_step": 424088, "epoch": 5109} {"train_loss": -26.712421417236328, "global_step": 424089, "epoch": 5109} {"train_loss": -26.94753074645996, "global_step": 424090, "epoch": 5109} {"train_loss": -27.057147979736328, "global_step": 424091, "epoch": 5109} {"train_loss": -27.0114688873291, "global_step": 424092, "epoch": 5109} {"train_loss": -26.976415634155273, "global_step": 424093, "epoch": 5109} {"train_loss": -27.05853843688965, "global_step": 424094, "epoch": 5109} {"train_loss": -26.8948917388916, "global_step": 424095, "epoch": 5109} {"train_loss": -26.941802978515625, "global_step": 424096, "epoch": 5109} {"train_loss": -26.878751754760742, "global_step": 424097, "epoch": 5109} {"train_loss": -26.622364044189453, "global_step": 424098, "epoch": 5109} {"train_loss": -26.631811141967773, "global_step": 424099, "epoch": 5109} {"train_loss": -26.54561424255371, "global_step": 424100, "epoch": 5109} {"train_loss": -26.65070152282715, "global_step": 424101, "epoch": 5109} {"train_loss": -26.202503204345703, "global_step": 424102, "epoch": 5109} {"train_loss": -26.65046501159668, "global_step": 424103, "epoch": 5109} {"train_loss": -26.77522087097168, "global_step": 424104, "epoch": 5109} {"train_loss": -26.650623321533203, "global_step": 424105, "epoch": 5109} {"train_loss": -26.650558471679688, "global_step": 424106, "epoch": 5109} {"train_loss": -27.102964401245117, "global_step": 424107, "epoch": 5109} {"train_loss": -26.739166259765625, "global_step": 424108, "epoch": 5109} {"train_loss": -27.03097915649414, "global_step": 424109, "epoch": 5109} {"train_loss": -26.473743438720703, "global_step": 424110, "epoch": 5109} {"train_loss": -26.72718620300293, "global_step": 424111, "epoch": 5109} {"train_loss": -26.75605583190918, "global_step": 424112, "epoch": 5109} {"train_loss": -26.84773826599121, "global_step": 424113, "epoch": 5109} {"train_loss": -27.09238052368164, "global_step": 424114, "epoch": 5109} {"train_loss": -26.912214279174805, "global_step": 424115, "epoch": 5109} {"train_loss": -26.841772079467773, "global_step": 424116, "epoch": 5109} {"train_loss": -26.951465606689453, "global_step": 424117, "epoch": 5109} {"train_loss": -26.917133331298828, "global_step": 424118, "epoch": 5109} {"train_loss": -27.070465087890625, "global_step": 424119, "epoch": 5109} {"train_loss": -27.14093589782715, "global_step": 424120, "epoch": 5109} {"train_loss": -27.2005672454834, "global_step": 424121, "epoch": 5109} {"train_loss": -26.4235897064209, "global_step": 424122, "epoch": 5109} {"train_loss": -27.326074600219727, "global_step": 424123, "epoch": 5109} {"train_loss": -26.886571884155273, "global_step": 424124, "epoch": 5109} {"train_loss": -26.53748893737793, "global_step": 424125, "epoch": 5109} {"train_loss": -26.69019889831543, "global_step": 424126, "epoch": 5109} {"train_loss": -26.281558990478516, "global_step": 424127, "epoch": 5109} {"train_loss": -26.241697311401367, "global_step": 424128, "epoch": 5109} {"train_loss": -26.793031186942596, "global_step": 424129, "epoch": 5109, "val_loss": 6923933.5} {"train_loss": -25.604572296142578, "global_step": 424130, "epoch": 5110} {"train_loss": -24.527450561523438, "global_step": 424131, "epoch": 5110} {"train_loss": -24.575490951538086, "global_step": 424132, "epoch": 5110} {"train_loss": -25.51742172241211, "global_step": 424133, "epoch": 5110} {"train_loss": -25.6916561126709, "global_step": 424134, "epoch": 5110} {"train_loss": -24.84517478942871, "global_step": 424135, "epoch": 5110} {"train_loss": -26.416959762573242, "global_step": 424136, "epoch": 5110} {"train_loss": -25.455259323120117, "global_step": 424137, "epoch": 5110} {"train_loss": -25.758359909057617, "global_step": 424138, "epoch": 5110} {"train_loss": -26.038862228393555, "global_step": 424139, "epoch": 5110} {"train_loss": -26.065942764282227, "global_step": 424140, "epoch": 5110} {"train_loss": -25.90907859802246, "global_step": 424141, "epoch": 5110} {"train_loss": -26.033267974853516, "global_step": 424142, "epoch": 5110} {"train_loss": -25.563989639282227, "global_step": 424143, "epoch": 5110} {"train_loss": -25.534374237060547, "global_step": 424144, "epoch": 5110} {"train_loss": -26.109582901000977, "global_step": 424145, "epoch": 5110} {"train_loss": -26.042882919311523, "global_step": 424146, "epoch": 5110} {"train_loss": -25.918363571166992, "global_step": 424147, "epoch": 5110} {"train_loss": -26.29182243347168, "global_step": 424148, "epoch": 5110} {"train_loss": -26.40656852722168, "global_step": 424149, "epoch": 5110} {"train_loss": -26.37959098815918, "global_step": 424150, "epoch": 5110} {"train_loss": -26.284439086914062, "global_step": 424151, "epoch": 5110} {"train_loss": -26.168701171875, "global_step": 424152, "epoch": 5110} {"train_loss": -26.221649169921875, "global_step": 424153, "epoch": 5110} {"train_loss": -26.42267417907715, "global_step": 424154, "epoch": 5110} {"train_loss": -26.386804580688477, "global_step": 424155, "epoch": 5110} {"train_loss": -26.494184494018555, "global_step": 424156, "epoch": 5110} {"train_loss": -26.483564376831055, "global_step": 424157, "epoch": 5110} {"train_loss": -26.374408721923828, "global_step": 424158, "epoch": 5110} {"train_loss": -26.517751693725586, "global_step": 424159, "epoch": 5110} {"train_loss": -26.6986026763916, "global_step": 424160, "epoch": 5110} {"train_loss": -26.124509811401367, "global_step": 424161, "epoch": 5110} {"train_loss": -26.446990966796875, "global_step": 424162, "epoch": 5110} {"train_loss": -27.01094627380371, "global_step": 424163, "epoch": 5110} {"train_loss": -26.42584800720215, "global_step": 424164, "epoch": 5110} {"train_loss": -26.964059829711914, "global_step": 424165, "epoch": 5110} {"train_loss": -27.1113338470459, "global_step": 424166, "epoch": 5110} {"train_loss": -26.885095596313477, "global_step": 424167, "epoch": 5110} {"train_loss": -26.325159072875977, "global_step": 424168, "epoch": 5110} {"train_loss": -26.550186157226562, "global_step": 424169, "epoch": 5110} {"train_loss": -26.796518325805664, "global_step": 424170, "epoch": 5110} {"train_loss": -26.937103271484375, "global_step": 424171, "epoch": 5110} {"train_loss": -26.886615753173828, "global_step": 424172, "epoch": 5110} {"train_loss": -26.84930992126465, "global_step": 424173, "epoch": 5110} {"train_loss": -26.503711700439453, "global_step": 424174, "epoch": 5110} {"train_loss": -26.90321922302246, "global_step": 424175, "epoch": 5110} {"train_loss": -26.863447189331055, "global_step": 424176, "epoch": 5110} {"train_loss": -26.7462215423584, "global_step": 424177, "epoch": 5110} {"train_loss": -26.744342803955078, "global_step": 424178, "epoch": 5110} {"train_loss": -26.844724655151367, "global_step": 424179, "epoch": 5110} {"train_loss": -26.835418701171875, "global_step": 424180, "epoch": 5110} {"train_loss": -26.633014678955078, "global_step": 424181, "epoch": 5110} {"train_loss": -27.006824493408203, "global_step": 424182, "epoch": 5110} {"train_loss": -26.920541763305664, "global_step": 424183, "epoch": 5110} {"train_loss": -27.123687744140625, "global_step": 424184, "epoch": 5110} {"train_loss": -27.0134334564209, "global_step": 424185, "epoch": 5110} {"train_loss": -27.03118324279785, "global_step": 424186, "epoch": 5110} {"train_loss": -26.963043212890625, "global_step": 424187, "epoch": 5110} {"train_loss": -26.661453247070312, "global_step": 424188, "epoch": 5110} {"train_loss": -26.800729751586914, "global_step": 424189, "epoch": 5110} {"train_loss": -27.205968856811523, "global_step": 424190, "epoch": 5110} {"train_loss": -26.805532455444336, "global_step": 424191, "epoch": 5110} {"train_loss": -27.213550567626953, "global_step": 424192, "epoch": 5110} {"train_loss": -26.80206298828125, "global_step": 424193, "epoch": 5110} {"train_loss": -26.687284469604492, "global_step": 424194, "epoch": 5110} {"train_loss": -26.736282348632812, "global_step": 424195, "epoch": 5110} {"train_loss": -26.93924903869629, "global_step": 424196, "epoch": 5110} {"train_loss": -26.418842315673828, "global_step": 424197, "epoch": 5110} {"train_loss": -26.899133682250977, "global_step": 424198, "epoch": 5110} {"train_loss": -27.306684494018555, "global_step": 424199, "epoch": 5110} {"train_loss": -27.159589767456055, "global_step": 424200, "epoch": 5110} {"train_loss": -26.923187255859375, "global_step": 424201, "epoch": 5110} {"train_loss": -26.90065574645996, "global_step": 424202, "epoch": 5110} {"train_loss": -26.47677993774414, "global_step": 424203, "epoch": 5110} {"train_loss": -27.28681755065918, "global_step": 424204, "epoch": 5110} {"train_loss": -27.206436157226562, "global_step": 424205, "epoch": 5110} {"train_loss": -26.746850967407227, "global_step": 424206, "epoch": 5110} {"train_loss": -26.860584259033203, "global_step": 424207, "epoch": 5110} {"train_loss": -27.280969619750977, "global_step": 424208, "epoch": 5110} {"train_loss": -27.174091339111328, "global_step": 424209, "epoch": 5110} {"train_loss": -26.79202651977539, "global_step": 424210, "epoch": 5110} {"train_loss": -26.736398696899414, "global_step": 424211, "epoch": 5110} {"train_loss": -26.525194466832172, "global_step": 424212, "epoch": 5110, "val_loss": 6971201.0} {"train_loss": -26.294178009033203, "global_step": 424213, "epoch": 5111} {"train_loss": -25.738269805908203, "global_step": 424214, "epoch": 5111} {"train_loss": -26.565702438354492, "global_step": 424215, "epoch": 5111} {"train_loss": -26.208105087280273, "global_step": 424216, "epoch": 5111} {"train_loss": -26.650808334350586, "global_step": 424217, "epoch": 5111} {"train_loss": -26.05666160583496, "global_step": 424218, "epoch": 5111} {"train_loss": -26.600412368774414, "global_step": 424219, "epoch": 5111} {"train_loss": -26.6077823638916, "global_step": 424220, "epoch": 5111} {"train_loss": -26.286020278930664, "global_step": 424221, "epoch": 5111} {"train_loss": -26.39093589782715, "global_step": 424222, "epoch": 5111} {"train_loss": -26.61659812927246, "global_step": 424223, "epoch": 5111} {"train_loss": -26.24118423461914, "global_step": 424224, "epoch": 5111} {"train_loss": -26.612995147705078, "global_step": 424225, "epoch": 5111} {"train_loss": -26.478485107421875, "global_step": 424226, "epoch": 5111} {"train_loss": -26.628437042236328, "global_step": 424227, "epoch": 5111} {"train_loss": -26.53077507019043, "global_step": 424228, "epoch": 5111} {"train_loss": -26.730117797851562, "global_step": 424229, "epoch": 5111} {"train_loss": -26.843280792236328, "global_step": 424230, "epoch": 5111} {"train_loss": -26.822864532470703, "global_step": 424231, "epoch": 5111} {"train_loss": -26.513080596923828, "global_step": 424232, "epoch": 5111} {"train_loss": -26.893177032470703, "global_step": 424233, "epoch": 5111} {"train_loss": -26.895435333251953, "global_step": 424234, "epoch": 5111} {"train_loss": -26.722061157226562, "global_step": 424235, "epoch": 5111} {"train_loss": -26.700164794921875, "global_step": 424236, "epoch": 5111} {"train_loss": -27.03757667541504, "global_step": 424237, "epoch": 5111} {"train_loss": -26.969762802124023, "global_step": 424238, "epoch": 5111} {"train_loss": -26.95881462097168, "global_step": 424239, "epoch": 5111} {"train_loss": -27.167194366455078, "global_step": 424240, "epoch": 5111} {"train_loss": -26.92664909362793, "global_step": 424241, "epoch": 5111} {"train_loss": -26.590534210205078, "global_step": 424242, "epoch": 5111} {"train_loss": -26.972265243530273, "global_step": 424243, "epoch": 5111} {"train_loss": -26.88458251953125, "global_step": 424244, "epoch": 5111} {"train_loss": -26.892667770385742, "global_step": 424245, "epoch": 5111} {"train_loss": -26.912403106689453, "global_step": 424246, "epoch": 5111} {"train_loss": -26.836231231689453, "global_step": 424247, "epoch": 5111} {"train_loss": -26.73115348815918, "global_step": 424248, "epoch": 5111} {"train_loss": -26.962125778198242, "global_step": 424249, "epoch": 5111} {"train_loss": -26.618276596069336, "global_step": 424250, "epoch": 5111} {"train_loss": -26.731765747070312, "global_step": 424251, "epoch": 5111} {"train_loss": -26.889636993408203, "global_step": 424252, "epoch": 5111} {"train_loss": -27.22210693359375, "global_step": 424253, "epoch": 5111} {"train_loss": -26.989303588867188, "global_step": 424254, "epoch": 5111} {"train_loss": -27.01399803161621, "global_step": 424255, "epoch": 5111} {"train_loss": -26.608015060424805, "global_step": 424256, "epoch": 5111} {"train_loss": -26.805500030517578, "global_step": 424257, "epoch": 5111} {"train_loss": -26.99460220336914, "global_step": 424258, "epoch": 5111} {"train_loss": -26.832300186157227, "global_step": 424259, "epoch": 5111} {"train_loss": -26.81861686706543, "global_step": 424260, "epoch": 5111} {"train_loss": -26.8395938873291, "global_step": 424261, "epoch": 5111} {"train_loss": -26.92864990234375, "global_step": 424262, "epoch": 5111} {"train_loss": -27.13494300842285, "global_step": 424263, "epoch": 5111} {"train_loss": -27.210529327392578, "global_step": 424264, "epoch": 5111} {"train_loss": -26.925159454345703, "global_step": 424265, "epoch": 5111} {"train_loss": -26.919910430908203, "global_step": 424266, "epoch": 5111} {"train_loss": -27.18494987487793, "global_step": 424267, "epoch": 5111} {"train_loss": -27.204181671142578, "global_step": 424268, "epoch": 5111} {"train_loss": -27.289045333862305, "global_step": 424269, "epoch": 5111} {"train_loss": -27.01839256286621, "global_step": 424270, "epoch": 5111} {"train_loss": -27.153966903686523, "global_step": 424271, "epoch": 5111} {"train_loss": -27.195295333862305, "global_step": 424272, "epoch": 5111} {"train_loss": -27.134078979492188, "global_step": 424273, "epoch": 5111} {"train_loss": -26.834888458251953, "global_step": 424274, "epoch": 5111} {"train_loss": -26.839197158813477, "global_step": 424275, "epoch": 5111} {"train_loss": -26.9237003326416, "global_step": 424276, "epoch": 5111} {"train_loss": -26.81902503967285, "global_step": 424277, "epoch": 5111} {"train_loss": -26.88221549987793, "global_step": 424278, "epoch": 5111} {"train_loss": -26.851232528686523, "global_step": 424279, "epoch": 5111} {"train_loss": -26.631183624267578, "global_step": 424280, "epoch": 5111} {"train_loss": -26.454803466796875, "global_step": 424281, "epoch": 5111} {"train_loss": -26.447296142578125, "global_step": 424282, "epoch": 5111} {"train_loss": -26.753753662109375, "global_step": 424283, "epoch": 5111} {"train_loss": -26.801013946533203, "global_step": 424284, "epoch": 5111} {"train_loss": -27.12542724609375, "global_step": 424285, "epoch": 5111} {"train_loss": -26.1546688079834, "global_step": 424286, "epoch": 5111} {"train_loss": -26.640396118164062, "global_step": 424287, "epoch": 5111} {"train_loss": -26.67754554748535, "global_step": 424288, "epoch": 5111} {"train_loss": -26.651288986206055, "global_step": 424289, "epoch": 5111} {"train_loss": -26.906347274780273, "global_step": 424290, "epoch": 5111} {"train_loss": -26.248981475830078, "global_step": 424291, "epoch": 5111} {"train_loss": -26.53460693359375, "global_step": 424292, "epoch": 5111} {"train_loss": -26.68340492248535, "global_step": 424293, "epoch": 5111} {"train_loss": -26.32807731628418, "global_step": 424294, "epoch": 5111} {"train_loss": -26.748465595475164, "global_step": 424295, "epoch": 5111, "val_loss": 6882591.0} {"train_loss": -24.600156784057617, "global_step": 424296, "epoch": 5112} {"train_loss": -24.412588119506836, "global_step": 424297, "epoch": 5112} {"train_loss": -25.265064239501953, "global_step": 424298, "epoch": 5112} {"train_loss": -25.6746826171875, "global_step": 424299, "epoch": 5112} {"train_loss": -25.774799346923828, "global_step": 424300, "epoch": 5112} {"train_loss": -25.714080810546875, "global_step": 424301, "epoch": 5112} {"train_loss": -25.85687255859375, "global_step": 424302, "epoch": 5112} {"train_loss": -25.825185775756836, "global_step": 424303, "epoch": 5112} {"train_loss": -25.493070602416992, "global_step": 424304, "epoch": 5112} {"train_loss": -26.12006950378418, "global_step": 424305, "epoch": 5112} {"train_loss": -25.280715942382812, "global_step": 424306, "epoch": 5112} {"train_loss": -26.200592041015625, "global_step": 424307, "epoch": 5112} {"train_loss": -25.93317985534668, "global_step": 424308, "epoch": 5112} {"train_loss": -26.274404525756836, "global_step": 424309, "epoch": 5112} {"train_loss": -26.293502807617188, "global_step": 424310, "epoch": 5112} {"train_loss": -25.921201705932617, "global_step": 424311, "epoch": 5112} {"train_loss": -26.126922607421875, "global_step": 424312, "epoch": 5112} {"train_loss": -26.374191284179688, "global_step": 424313, "epoch": 5112} {"train_loss": -26.446277618408203, "global_step": 424314, "epoch": 5112} {"train_loss": -26.649032592773438, "global_step": 424315, "epoch": 5112} {"train_loss": -26.453739166259766, "global_step": 424316, "epoch": 5112} {"train_loss": -26.55189323425293, "global_step": 424317, "epoch": 5112} {"train_loss": -26.419713973999023, "global_step": 424318, "epoch": 5112} {"train_loss": -26.547210693359375, "global_step": 424319, "epoch": 5112} {"train_loss": -26.8999080657959, "global_step": 424320, "epoch": 5112} {"train_loss": -26.5859317779541, "global_step": 424321, "epoch": 5112} {"train_loss": -26.846771240234375, "global_step": 424322, "epoch": 5112} {"train_loss": -26.68012046813965, "global_step": 424323, "epoch": 5112} {"train_loss": -26.58684730529785, "global_step": 424324, "epoch": 5112} {"train_loss": -26.212804794311523, "global_step": 424325, "epoch": 5112} {"train_loss": -26.7705020904541, "global_step": 424326, "epoch": 5112} {"train_loss": -26.9350643157959, "global_step": 424327, "epoch": 5112} {"train_loss": -26.56692886352539, "global_step": 424328, "epoch": 5112} {"train_loss": -26.428668975830078, "global_step": 424329, "epoch": 5112} {"train_loss": -27.1102352142334, "global_step": 424330, "epoch": 5112} {"train_loss": -26.60318374633789, "global_step": 424331, "epoch": 5112} {"train_loss": -26.596426010131836, "global_step": 424332, "epoch": 5112} {"train_loss": -27.003433227539062, "global_step": 424333, "epoch": 5112} {"train_loss": -26.822729110717773, "global_step": 424334, "epoch": 5112} {"train_loss": -27.395803451538086, "global_step": 424335, "epoch": 5112} {"train_loss": -27.03763771057129, "global_step": 424336, "epoch": 5112} {"train_loss": -26.85323143005371, "global_step": 424337, "epoch": 5112} {"train_loss": -26.643253326416016, "global_step": 424338, "epoch": 5112} {"train_loss": -26.832372665405273, "global_step": 424339, "epoch": 5112} {"train_loss": -26.91974449157715, "global_step": 424340, "epoch": 5112} {"train_loss": -26.814462661743164, "global_step": 424341, "epoch": 5112} {"train_loss": -26.561307907104492, "global_step": 424342, "epoch": 5112} {"train_loss": -26.759397506713867, "global_step": 424343, "epoch": 5112} {"train_loss": -26.864805221557617, "global_step": 424344, "epoch": 5112} {"train_loss": -26.988311767578125, "global_step": 424345, "epoch": 5112} {"train_loss": -27.04817008972168, "global_step": 424346, "epoch": 5112} {"train_loss": -26.963266372680664, "global_step": 424347, "epoch": 5112} {"train_loss": -27.071460723876953, "global_step": 424348, "epoch": 5112} {"train_loss": -26.76401138305664, "global_step": 424349, "epoch": 5112} {"train_loss": -27.097070693969727, "global_step": 424350, "epoch": 5112} {"train_loss": -26.937963485717773, "global_step": 424351, "epoch": 5112} {"train_loss": -26.78407859802246, "global_step": 424352, "epoch": 5112} {"train_loss": -26.990478515625, "global_step": 424353, "epoch": 5112} {"train_loss": -27.04743766784668, "global_step": 424354, "epoch": 5112} {"train_loss": -26.857574462890625, "global_step": 424355, "epoch": 5112} {"train_loss": -26.79983901977539, "global_step": 424356, "epoch": 5112} {"train_loss": -26.66847801208496, "global_step": 424357, "epoch": 5112} {"train_loss": -26.722293853759766, "global_step": 424358, "epoch": 5112} {"train_loss": -26.9246883392334, "global_step": 424359, "epoch": 5112} {"train_loss": -26.73866081237793, "global_step": 424360, "epoch": 5112} {"train_loss": -26.27646827697754, "global_step": 424361, "epoch": 5112} {"train_loss": -26.39778709411621, "global_step": 424362, "epoch": 5112} {"train_loss": -26.67880630493164, "global_step": 424363, "epoch": 5112} {"train_loss": -27.145166397094727, "global_step": 424364, "epoch": 5112} {"train_loss": -26.6700439453125, "global_step": 424365, "epoch": 5112} {"train_loss": -26.864606857299805, "global_step": 424366, "epoch": 5112} {"train_loss": -27.133466720581055, "global_step": 424367, "epoch": 5112} {"train_loss": -26.581220626831055, "global_step": 424368, "epoch": 5112} {"train_loss": -26.609033584594727, "global_step": 424369, "epoch": 5112} {"train_loss": -26.4537296295166, "global_step": 424370, "epoch": 5112} {"train_loss": -26.871740341186523, "global_step": 424371, "epoch": 5112} {"train_loss": -26.742704391479492, "global_step": 424372, "epoch": 5112} {"train_loss": -27.21889305114746, "global_step": 424373, "epoch": 5112} {"train_loss": -26.965940475463867, "global_step": 424374, "epoch": 5112} {"train_loss": -26.892318725585938, "global_step": 424375, "epoch": 5112} {"train_loss": -27.131818771362305, "global_step": 424376, "epoch": 5112} {"train_loss": -27.09095573425293, "global_step": 424377, "epoch": 5112} {"train_loss": -26.562738510499518, "global_step": 424378, "epoch": 5112, "val_loss": 6816823.0} {"train_loss": -25.710432052612305, "global_step": 424379, "epoch": 5113} {"train_loss": -25.83985710144043, "global_step": 424380, "epoch": 5113} {"train_loss": -26.33936882019043, "global_step": 424381, "epoch": 5113} {"train_loss": -26.372812271118164, "global_step": 424382, "epoch": 5113} {"train_loss": -25.49857521057129, "global_step": 424383, "epoch": 5113} {"train_loss": -26.6076602935791, "global_step": 424384, "epoch": 5113} {"train_loss": -26.520919799804688, "global_step": 424385, "epoch": 5113} {"train_loss": -26.634521484375, "global_step": 424386, "epoch": 5113} {"train_loss": -26.723424911499023, "global_step": 424387, "epoch": 5113} {"train_loss": -26.56591796875, "global_step": 424388, "epoch": 5113} {"train_loss": -26.7067813873291, "global_step": 424389, "epoch": 5113} {"train_loss": -26.4820499420166, "global_step": 424390, "epoch": 5113} {"train_loss": -26.639310836791992, "global_step": 424391, "epoch": 5113} {"train_loss": -26.870885848999023, "global_step": 424392, "epoch": 5113} {"train_loss": -26.753772735595703, "global_step": 424393, "epoch": 5113} {"train_loss": -26.592548370361328, "global_step": 424394, "epoch": 5113} {"train_loss": -26.722990036010742, "global_step": 424395, "epoch": 5113} {"train_loss": -26.73213005065918, "global_step": 424396, "epoch": 5113} {"train_loss": -26.65191650390625, "global_step": 424397, "epoch": 5113} {"train_loss": -27.076984405517578, "global_step": 424398, "epoch": 5113} {"train_loss": -27.056921005249023, "global_step": 424399, "epoch": 5113} {"train_loss": -26.892114639282227, "global_step": 424400, "epoch": 5113} {"train_loss": -26.832931518554688, "global_step": 424401, "epoch": 5113} {"train_loss": -26.920461654663086, "global_step": 424402, "epoch": 5113} {"train_loss": -27.010242462158203, "global_step": 424403, "epoch": 5113} {"train_loss": -26.854516983032227, "global_step": 424404, "epoch": 5113} {"train_loss": -26.8201961517334, "global_step": 424405, "epoch": 5113} {"train_loss": -26.816619873046875, "global_step": 424406, "epoch": 5113} {"train_loss": -26.96864128112793, "global_step": 424407, "epoch": 5113} {"train_loss": -26.947467803955078, "global_step": 424408, "epoch": 5113} {"train_loss": -26.72391700744629, "global_step": 424409, "epoch": 5113} {"train_loss": -26.755783081054688, "global_step": 424410, "epoch": 5113} {"train_loss": -27.037817001342773, "global_step": 424411, "epoch": 5113} {"train_loss": -26.568927764892578, "global_step": 424412, "epoch": 5113} {"train_loss": -26.974720001220703, "global_step": 424413, "epoch": 5113} {"train_loss": -26.8895206451416, "global_step": 424414, "epoch": 5113} {"train_loss": -26.148603439331055, "global_step": 424415, "epoch": 5113} {"train_loss": -26.78529930114746, "global_step": 424416, "epoch": 5113} {"train_loss": -26.892271041870117, "global_step": 424417, "epoch": 5113} {"train_loss": -26.50567626953125, "global_step": 424418, "epoch": 5113} {"train_loss": -26.35650062561035, "global_step": 424419, "epoch": 5113} {"train_loss": -26.743009567260742, "global_step": 424420, "epoch": 5113} {"train_loss": -26.92970085144043, "global_step": 424421, "epoch": 5113} {"train_loss": -26.760080337524414, "global_step": 424422, "epoch": 5113} {"train_loss": -26.612030029296875, "global_step": 424423, "epoch": 5113} {"train_loss": -26.878870010375977, "global_step": 424424, "epoch": 5113} {"train_loss": -26.88800048828125, "global_step": 424425, "epoch": 5113} {"train_loss": -26.95952796936035, "global_step": 424426, "epoch": 5113} {"train_loss": -26.850940704345703, "global_step": 424427, "epoch": 5113} {"train_loss": -27.01893424987793, "global_step": 424428, "epoch": 5113} {"train_loss": -27.195459365844727, "global_step": 424429, "epoch": 5113} {"train_loss": -26.859363555908203, "global_step": 424430, "epoch": 5113} {"train_loss": -26.793716430664062, "global_step": 424431, "epoch": 5113} {"train_loss": -27.148910522460938, "global_step": 424432, "epoch": 5113} {"train_loss": -27.072265625, "global_step": 424433, "epoch": 5113} {"train_loss": -26.90286636352539, "global_step": 424434, "epoch": 5113} {"train_loss": -26.995269775390625, "global_step": 424435, "epoch": 5113} {"train_loss": -27.168975830078125, "global_step": 424436, "epoch": 5113} {"train_loss": -27.071557998657227, "global_step": 424437, "epoch": 5113} {"train_loss": -27.442975997924805, "global_step": 424438, "epoch": 5113} {"train_loss": -27.1854305267334, "global_step": 424439, "epoch": 5113} {"train_loss": -27.042896270751953, "global_step": 424440, "epoch": 5113} {"train_loss": -26.777326583862305, "global_step": 424441, "epoch": 5113} {"train_loss": -26.80671501159668, "global_step": 424442, "epoch": 5113} {"train_loss": -27.0030460357666, "global_step": 424443, "epoch": 5113} {"train_loss": -27.00544548034668, "global_step": 424444, "epoch": 5113} {"train_loss": -27.265384674072266, "global_step": 424445, "epoch": 5113} {"train_loss": -26.721105575561523, "global_step": 424446, "epoch": 5113} {"train_loss": -26.36958122253418, "global_step": 424447, "epoch": 5113} {"train_loss": -25.960718154907227, "global_step": 424448, "epoch": 5113} {"train_loss": -26.059553146362305, "global_step": 424449, "epoch": 5113} {"train_loss": -26.692459106445312, "global_step": 424450, "epoch": 5113} {"train_loss": -26.754072189331055, "global_step": 424451, "epoch": 5113} {"train_loss": -26.665985107421875, "global_step": 424452, "epoch": 5113} {"train_loss": -27.216571807861328, "global_step": 424453, "epoch": 5113} {"train_loss": -26.582021713256836, "global_step": 424454, "epoch": 5113} {"train_loss": -26.842239379882812, "global_step": 424455, "epoch": 5113} {"train_loss": -26.686756134033203, "global_step": 424456, "epoch": 5113} {"train_loss": -27.14510154724121, "global_step": 424457, "epoch": 5113} {"train_loss": -26.88958168029785, "global_step": 424458, "epoch": 5113} {"train_loss": -26.69097328186035, "global_step": 424459, "epoch": 5113} {"train_loss": -26.731908798217773, "global_step": 424460, "epoch": 5113} {"train_loss": -26.769296094595667, "global_step": 424461, "epoch": 5113, "val_loss": 7023377.0} {"train_loss": -24.951662063598633, "global_step": 424462, "epoch": 5114} {"train_loss": -25.106884002685547, "global_step": 424463, "epoch": 5114} {"train_loss": -25.53862762451172, "global_step": 424464, "epoch": 5114} {"train_loss": -25.396045684814453, "global_step": 424465, "epoch": 5114} {"train_loss": -25.9412841796875, "global_step": 424466, "epoch": 5114} {"train_loss": -25.366191864013672, "global_step": 424467, "epoch": 5114} {"train_loss": -26.288440704345703, "global_step": 424468, "epoch": 5114} {"train_loss": -25.14118766784668, "global_step": 424469, "epoch": 5114} {"train_loss": -25.93475341796875, "global_step": 424470, "epoch": 5114} {"train_loss": -26.10393714904785, "global_step": 424471, "epoch": 5114} {"train_loss": -26.396398544311523, "global_step": 424472, "epoch": 5114} {"train_loss": -25.928430557250977, "global_step": 424473, "epoch": 5114} {"train_loss": -25.859790802001953, "global_step": 424474, "epoch": 5114} {"train_loss": -25.754728317260742, "global_step": 424475, "epoch": 5114} {"train_loss": -26.43450355529785, "global_step": 424476, "epoch": 5114} {"train_loss": -26.609954833984375, "global_step": 424477, "epoch": 5114} {"train_loss": -26.426422119140625, "global_step": 424478, "epoch": 5114} {"train_loss": -26.45819664001465, "global_step": 424479, "epoch": 5114} {"train_loss": -26.472009658813477, "global_step": 424480, "epoch": 5114} {"train_loss": -26.0356388092041, "global_step": 424481, "epoch": 5114} {"train_loss": -26.236303329467773, "global_step": 424482, "epoch": 5114} {"train_loss": -26.339984893798828, "global_step": 424483, "epoch": 5114} {"train_loss": -26.320287704467773, "global_step": 424484, "epoch": 5114} {"train_loss": -26.35645866394043, "global_step": 424485, "epoch": 5114} {"train_loss": -26.824787139892578, "global_step": 424486, "epoch": 5114} {"train_loss": -26.399179458618164, "global_step": 424487, "epoch": 5114} {"train_loss": -26.889713287353516, "global_step": 424488, "epoch": 5114} {"train_loss": -26.50587272644043, "global_step": 424489, "epoch": 5114} {"train_loss": -26.107929229736328, "global_step": 424490, "epoch": 5114} {"train_loss": -26.330921173095703, "global_step": 424491, "epoch": 5114} {"train_loss": -26.31940269470215, "global_step": 424492, "epoch": 5114} {"train_loss": -26.724979400634766, "global_step": 424493, "epoch": 5114} {"train_loss": -26.68938636779785, "global_step": 424494, "epoch": 5114} {"train_loss": -26.671255111694336, "global_step": 424495, "epoch": 5114} {"train_loss": -27.0771427154541, "global_step": 424496, "epoch": 5114} {"train_loss": -26.93123435974121, "global_step": 424497, "epoch": 5114} {"train_loss": -26.694580078125, "global_step": 424498, "epoch": 5114} {"train_loss": -26.516021728515625, "global_step": 424499, "epoch": 5114} {"train_loss": -27.038803100585938, "global_step": 424500, "epoch": 5114} {"train_loss": -27.05337905883789, "global_step": 424501, "epoch": 5114} {"train_loss": -26.77583885192871, "global_step": 424502, "epoch": 5114} {"train_loss": -27.096942901611328, "global_step": 424503, "epoch": 5114} {"train_loss": -26.841650009155273, "global_step": 424504, "epoch": 5114} {"train_loss": -26.853870391845703, "global_step": 424505, "epoch": 5114} {"train_loss": -26.796695709228516, "global_step": 424506, "epoch": 5114} {"train_loss": -26.893545150756836, "global_step": 424507, "epoch": 5114} {"train_loss": -27.050573348999023, "global_step": 424508, "epoch": 5114} {"train_loss": -26.75821876525879, "global_step": 424509, "epoch": 5114} {"train_loss": -27.31252098083496, "global_step": 424510, "epoch": 5114} {"train_loss": -26.876264572143555, "global_step": 424511, "epoch": 5114} {"train_loss": -27.196481704711914, "global_step": 424512, "epoch": 5114} {"train_loss": -26.69405174255371, "global_step": 424513, "epoch": 5114} {"train_loss": -27.02374839782715, "global_step": 424514, "epoch": 5114} {"train_loss": -26.967741012573242, "global_step": 424515, "epoch": 5114} {"train_loss": -26.953556060791016, "global_step": 424516, "epoch": 5114} {"train_loss": -26.839994430541992, "global_step": 424517, "epoch": 5114} {"train_loss": -26.9985408782959, "global_step": 424518, "epoch": 5114} {"train_loss": -27.152448654174805, "global_step": 424519, "epoch": 5114} {"train_loss": -26.904321670532227, "global_step": 424520, "epoch": 5114} {"train_loss": -26.840316772460938, "global_step": 424521, "epoch": 5114} {"train_loss": -27.14825439453125, "global_step": 424522, "epoch": 5114} {"train_loss": -27.213098526000977, "global_step": 424523, "epoch": 5114} {"train_loss": -26.91107177734375, "global_step": 424524, "epoch": 5114} {"train_loss": -27.115081787109375, "global_step": 424525, "epoch": 5114} {"train_loss": -27.26055335998535, "global_step": 424526, "epoch": 5114} {"train_loss": -27.07056999206543, "global_step": 424527, "epoch": 5114} {"train_loss": -27.19562339782715, "global_step": 424528, "epoch": 5114} {"train_loss": -27.201679229736328, "global_step": 424529, "epoch": 5114} {"train_loss": -27.0394344329834, "global_step": 424530, "epoch": 5114} {"train_loss": -27.4986572265625, "global_step": 424531, "epoch": 5114} {"train_loss": -26.949743270874023, "global_step": 424532, "epoch": 5114} {"train_loss": -27.122573852539062, "global_step": 424533, "epoch": 5114} {"train_loss": -26.713092803955078, "global_step": 424534, "epoch": 5114} {"train_loss": -27.09541130065918, "global_step": 424535, "epoch": 5114} {"train_loss": -27.005735397338867, "global_step": 424536, "epoch": 5114} {"train_loss": -26.2982120513916, "global_step": 424537, "epoch": 5114} {"train_loss": -26.278533935546875, "global_step": 424538, "epoch": 5114} {"train_loss": -25.93011474609375, "global_step": 424539, "epoch": 5114} {"train_loss": -26.567060470581055, "global_step": 424540, "epoch": 5114} {"train_loss": -26.407434463500977, "global_step": 424541, "epoch": 5114} {"train_loss": -26.55829429626465, "global_step": 424542, "epoch": 5114} {"train_loss": -25.985502243041992, "global_step": 424543, "epoch": 5114} {"train_loss": -26.60843499884548, "global_step": 424544, "epoch": 5114, "val_loss": 6970362.0} {"train_loss": -25.669925689697266, "global_step": 424545, "epoch": 5115} {"train_loss": -25.187570571899414, "global_step": 424546, "epoch": 5115} {"train_loss": -26.240802764892578, "global_step": 424547, "epoch": 5115} {"train_loss": -25.76764488220215, "global_step": 424548, "epoch": 5115} {"train_loss": -25.300613403320312, "global_step": 424549, "epoch": 5115} {"train_loss": -26.600812911987305, "global_step": 424550, "epoch": 5115} {"train_loss": -25.653919219970703, "global_step": 424551, "epoch": 5115} {"train_loss": -26.3515625, "global_step": 424552, "epoch": 5115} {"train_loss": -26.22223472595215, "global_step": 424553, "epoch": 5115} {"train_loss": -26.020431518554688, "global_step": 424554, "epoch": 5115} {"train_loss": -26.193708419799805, "global_step": 424555, "epoch": 5115} {"train_loss": -26.49787712097168, "global_step": 424556, "epoch": 5115} {"train_loss": -25.87760353088379, "global_step": 424557, "epoch": 5115} {"train_loss": -26.577375411987305, "global_step": 424558, "epoch": 5115} {"train_loss": -26.018604278564453, "global_step": 424559, "epoch": 5115} {"train_loss": -26.694196701049805, "global_step": 424560, "epoch": 5115} {"train_loss": -26.745954513549805, "global_step": 424561, "epoch": 5115} {"train_loss": -26.161396026611328, "global_step": 424562, "epoch": 5115} {"train_loss": -26.67803955078125, "global_step": 424563, "epoch": 5115} {"train_loss": -26.395401000976562, "global_step": 424564, "epoch": 5115} {"train_loss": -26.15602684020996, "global_step": 424565, "epoch": 5115} {"train_loss": -26.406152725219727, "global_step": 424566, "epoch": 5115} {"train_loss": -26.5353946685791, "global_step": 424567, "epoch": 5115} {"train_loss": -26.768131256103516, "global_step": 424568, "epoch": 5115} {"train_loss": -26.734405517578125, "global_step": 424569, "epoch": 5115} {"train_loss": -26.824853897094727, "global_step": 424570, "epoch": 5115} {"train_loss": -26.88033103942871, "global_step": 424571, "epoch": 5115} {"train_loss": -26.68851089477539, "global_step": 424572, "epoch": 5115} {"train_loss": -26.69148063659668, "global_step": 424573, "epoch": 5115} {"train_loss": -26.726734161376953, "global_step": 424574, "epoch": 5115} {"train_loss": -26.912195205688477, "global_step": 424575, "epoch": 5115} {"train_loss": -26.813617706298828, "global_step": 424576, "epoch": 5115} {"train_loss": -26.60597038269043, "global_step": 424577, "epoch": 5115} {"train_loss": -26.6707820892334, "global_step": 424578, "epoch": 5115} {"train_loss": -26.821746826171875, "global_step": 424579, "epoch": 5115} {"train_loss": -26.852588653564453, "global_step": 424580, "epoch": 5115} {"train_loss": -26.632761001586914, "global_step": 424581, "epoch": 5115} {"train_loss": -26.896947860717773, "global_step": 424582, "epoch": 5115} {"train_loss": -27.086652755737305, "global_step": 424583, "epoch": 5115} {"train_loss": -26.543745040893555, "global_step": 424584, "epoch": 5115} {"train_loss": -26.755517959594727, "global_step": 424585, "epoch": 5115} {"train_loss": -27.33966064453125, "global_step": 424586, "epoch": 5115} {"train_loss": -26.93610191345215, "global_step": 424587, "epoch": 5115} {"train_loss": -26.988784790039062, "global_step": 424588, "epoch": 5115} {"train_loss": -27.500192642211914, "global_step": 424589, "epoch": 5115} {"train_loss": -26.786855697631836, "global_step": 424590, "epoch": 5115} {"train_loss": -26.745275497436523, "global_step": 424591, "epoch": 5115} {"train_loss": -26.902097702026367, "global_step": 424592, "epoch": 5115} {"train_loss": -26.875898361206055, "global_step": 424593, "epoch": 5115} {"train_loss": -27.12717628479004, "global_step": 424594, "epoch": 5115} {"train_loss": -26.8320255279541, "global_step": 424595, "epoch": 5115} {"train_loss": -26.8718318939209, "global_step": 424596, "epoch": 5115} {"train_loss": -27.3072509765625, "global_step": 424597, "epoch": 5115} {"train_loss": -26.947019577026367, "global_step": 424598, "epoch": 5115} {"train_loss": -26.961400985717773, "global_step": 424599, "epoch": 5115} {"train_loss": -26.748212814331055, "global_step": 424600, "epoch": 5115} {"train_loss": -26.770212173461914, "global_step": 424601, "epoch": 5115} {"train_loss": -26.737659454345703, "global_step": 424602, "epoch": 5115} {"train_loss": -26.766584396362305, "global_step": 424603, "epoch": 5115} {"train_loss": -26.434118270874023, "global_step": 424604, "epoch": 5115} {"train_loss": -26.7120304107666, "global_step": 424605, "epoch": 5115} {"train_loss": -26.934650421142578, "global_step": 424606, "epoch": 5115} {"train_loss": -27.343494415283203, "global_step": 424607, "epoch": 5115} {"train_loss": -26.979955673217773, "global_step": 424608, "epoch": 5115} {"train_loss": -27.006521224975586, "global_step": 424609, "epoch": 5115} {"train_loss": -26.982746124267578, "global_step": 424610, "epoch": 5115} {"train_loss": -27.284032821655273, "global_step": 424611, "epoch": 5115} {"train_loss": -26.54595947265625, "global_step": 424612, "epoch": 5115} {"train_loss": -26.723892211914062, "global_step": 424613, "epoch": 5115} {"train_loss": -26.66425895690918, "global_step": 424614, "epoch": 5115} {"train_loss": -26.76173210144043, "global_step": 424615, "epoch": 5115} {"train_loss": -26.494070053100586, "global_step": 424616, "epoch": 5115} {"train_loss": -26.972883224487305, "global_step": 424617, "epoch": 5115} {"train_loss": -26.94471549987793, "global_step": 424618, "epoch": 5115} {"train_loss": -27.51766014099121, "global_step": 424619, "epoch": 5115} {"train_loss": -26.9208984375, "global_step": 424620, "epoch": 5115} {"train_loss": -26.944869995117188, "global_step": 424621, "epoch": 5115} {"train_loss": -26.8974666595459, "global_step": 424622, "epoch": 5115} {"train_loss": -26.894433975219727, "global_step": 424623, "epoch": 5115} {"train_loss": -26.582563400268555, "global_step": 424624, "epoch": 5115} {"train_loss": -27.147357940673828, "global_step": 424625, "epoch": 5115} {"train_loss": -26.84119987487793, "global_step": 424626, "epoch": 5115} {"train_loss": -26.692036502332574, "global_step": 424627, "epoch": 5115, "val_loss": 6959973.0} {"train_loss": -26.601987838745117, "global_step": 424628, "epoch": 5116} {"train_loss": -26.02012062072754, "global_step": 424629, "epoch": 5116} {"train_loss": -25.960676193237305, "global_step": 424630, "epoch": 5116} {"train_loss": -25.729415893554688, "global_step": 424631, "epoch": 5116} {"train_loss": -26.56204605102539, "global_step": 424632, "epoch": 5116} {"train_loss": -26.42425537109375, "global_step": 424633, "epoch": 5116} {"train_loss": -25.81281089782715, "global_step": 424634, "epoch": 5116} {"train_loss": -26.426532745361328, "global_step": 424635, "epoch": 5116} {"train_loss": -26.545745849609375, "global_step": 424636, "epoch": 5116} {"train_loss": -26.509246826171875, "global_step": 424637, "epoch": 5116} {"train_loss": -26.44936180114746, "global_step": 424638, "epoch": 5116} {"train_loss": -26.5767822265625, "global_step": 424639, "epoch": 5116} {"train_loss": -25.719358444213867, "global_step": 424640, "epoch": 5116} {"train_loss": -26.46038246154785, "global_step": 424641, "epoch": 5116} {"train_loss": -26.351215362548828, "global_step": 424642, "epoch": 5116} {"train_loss": -26.014892578125, "global_step": 424643, "epoch": 5116} {"train_loss": -26.714435577392578, "global_step": 424644, "epoch": 5116} {"train_loss": -26.56086540222168, "global_step": 424645, "epoch": 5116} {"train_loss": -26.67751121520996, "global_step": 424646, "epoch": 5116} {"train_loss": -26.587865829467773, "global_step": 424647, "epoch": 5116} {"train_loss": -26.67367935180664, "global_step": 424648, "epoch": 5116} {"train_loss": -26.669677734375, "global_step": 424649, "epoch": 5116} {"train_loss": -26.879444122314453, "global_step": 424650, "epoch": 5116} {"train_loss": -26.76800537109375, "global_step": 424651, "epoch": 5116} {"train_loss": -27.0057315826416, "global_step": 424652, "epoch": 5116} {"train_loss": -26.744495391845703, "global_step": 424653, "epoch": 5116} {"train_loss": -26.449148178100586, "global_step": 424654, "epoch": 5116} {"train_loss": -26.9113712310791, "global_step": 424655, "epoch": 5116} {"train_loss": -26.50811767578125, "global_step": 424656, "epoch": 5116} {"train_loss": -26.674081802368164, "global_step": 424657, "epoch": 5116} {"train_loss": -26.505035400390625, "global_step": 424658, "epoch": 5116} {"train_loss": -26.801380157470703, "global_step": 424659, "epoch": 5116} {"train_loss": -27.119476318359375, "global_step": 424660, "epoch": 5116} {"train_loss": -27.010190963745117, "global_step": 424661, "epoch": 5116} {"train_loss": -26.706878662109375, "global_step": 424662, "epoch": 5116} {"train_loss": -26.734189987182617, "global_step": 424663, "epoch": 5116} {"train_loss": -26.852758407592773, "global_step": 424664, "epoch": 5116} {"train_loss": -26.841455459594727, "global_step": 424665, "epoch": 5116} {"train_loss": -27.0687313079834, "global_step": 424666, "epoch": 5116} {"train_loss": -26.9316349029541, "global_step": 424667, "epoch": 5116} {"train_loss": -26.967893600463867, "global_step": 424668, "epoch": 5116} {"train_loss": -26.88763999938965, "global_step": 424669, "epoch": 5116} {"train_loss": -26.963897705078125, "global_step": 424670, "epoch": 5116} {"train_loss": -26.719823837280273, "global_step": 424671, "epoch": 5116} {"train_loss": -27.208282470703125, "global_step": 424672, "epoch": 5116} {"train_loss": -27.192914962768555, "global_step": 424673, "epoch": 5116} {"train_loss": -26.828168869018555, "global_step": 424674, "epoch": 5116} {"train_loss": -27.050867080688477, "global_step": 424675, "epoch": 5116} {"train_loss": -26.783863067626953, "global_step": 424676, "epoch": 5116} {"train_loss": -27.02752113342285, "global_step": 424677, "epoch": 5116} {"train_loss": -27.197668075561523, "global_step": 424678, "epoch": 5116} {"train_loss": -26.965185165405273, "global_step": 424679, "epoch": 5116} {"train_loss": -27.037622451782227, "global_step": 424680, "epoch": 5116} {"train_loss": -27.232147216796875, "global_step": 424681, "epoch": 5116} {"train_loss": -27.032201766967773, "global_step": 424682, "epoch": 5116} {"train_loss": -26.86551856994629, "global_step": 424683, "epoch": 5116} {"train_loss": -26.73573112487793, "global_step": 424684, "epoch": 5116} {"train_loss": -26.713720321655273, "global_step": 424685, "epoch": 5116} {"train_loss": -27.074682235717773, "global_step": 424686, "epoch": 5116} {"train_loss": -27.157550811767578, "global_step": 424687, "epoch": 5116} {"train_loss": -26.97218894958496, "global_step": 424688, "epoch": 5116} {"train_loss": -26.88286781311035, "global_step": 424689, "epoch": 5116} {"train_loss": -27.031904220581055, "global_step": 424690, "epoch": 5116} {"train_loss": -26.777179718017578, "global_step": 424691, "epoch": 5116} {"train_loss": -27.429792404174805, "global_step": 424692, "epoch": 5116} {"train_loss": -26.507150650024414, "global_step": 424693, "epoch": 5116} {"train_loss": -26.888715744018555, "global_step": 424694, "epoch": 5116} {"train_loss": -27.09992027282715, "global_step": 424695, "epoch": 5116} {"train_loss": -27.031103134155273, "global_step": 424696, "epoch": 5116} {"train_loss": -26.708349227905273, "global_step": 424697, "epoch": 5116} {"train_loss": -26.834455490112305, "global_step": 424698, "epoch": 5116} {"train_loss": -26.857009887695312, "global_step": 424699, "epoch": 5116} {"train_loss": -27.46583366394043, "global_step": 424700, "epoch": 5116} {"train_loss": -27.072763442993164, "global_step": 424701, "epoch": 5116} {"train_loss": -27.074487686157227, "global_step": 424702, "epoch": 5116} {"train_loss": -26.9118709564209, "global_step": 424703, "epoch": 5116} {"train_loss": -27.018524169921875, "global_step": 424704, "epoch": 5116} {"train_loss": -27.105701446533203, "global_step": 424705, "epoch": 5116} {"train_loss": -26.962560653686523, "global_step": 424706, "epoch": 5116} {"train_loss": -26.95185661315918, "global_step": 424707, "epoch": 5116} {"train_loss": -27.13059425354004, "global_step": 424708, "epoch": 5116} {"train_loss": -27.08066749572754, "global_step": 424709, "epoch": 5116} {"train_loss": -26.784844846610564, "global_step": 424710, "epoch": 5116, "val_loss": 6969459.0} {"train_loss": -26.150531768798828, "global_step": 424711, "epoch": 5117} {"train_loss": -25.62790870666504, "global_step": 424712, "epoch": 5117} {"train_loss": -25.310829162597656, "global_step": 424713, "epoch": 5117} {"train_loss": -25.99176597595215, "global_step": 424714, "epoch": 5117} {"train_loss": -26.513004302978516, "global_step": 424715, "epoch": 5117} {"train_loss": -26.707456588745117, "global_step": 424716, "epoch": 5117} {"train_loss": -26.6331787109375, "global_step": 424717, "epoch": 5117} {"train_loss": -26.538883209228516, "global_step": 424718, "epoch": 5117} {"train_loss": -26.729389190673828, "global_step": 424719, "epoch": 5117} {"train_loss": -26.878498077392578, "global_step": 424720, "epoch": 5117} {"train_loss": -26.471790313720703, "global_step": 424721, "epoch": 5117} {"train_loss": -26.5726318359375, "global_step": 424722, "epoch": 5117} {"train_loss": -26.890766143798828, "global_step": 424723, "epoch": 5117} {"train_loss": -26.493940353393555, "global_step": 424724, "epoch": 5117} {"train_loss": -26.602039337158203, "global_step": 424725, "epoch": 5117} {"train_loss": -26.59882164001465, "global_step": 424726, "epoch": 5117} {"train_loss": -26.5972843170166, "global_step": 424727, "epoch": 5117} {"train_loss": -26.840055465698242, "global_step": 424728, "epoch": 5117} {"train_loss": -26.866785049438477, "global_step": 424729, "epoch": 5117} {"train_loss": -26.659528732299805, "global_step": 424730, "epoch": 5117} {"train_loss": -26.843473434448242, "global_step": 424731, "epoch": 5117} {"train_loss": -26.9757022857666, "global_step": 424732, "epoch": 5117} {"train_loss": -26.461044311523438, "global_step": 424733, "epoch": 5117} {"train_loss": -26.565906524658203, "global_step": 424734, "epoch": 5117} {"train_loss": -26.75355339050293, "global_step": 424735, "epoch": 5117} {"train_loss": -26.657806396484375, "global_step": 424736, "epoch": 5117} {"train_loss": -26.9183292388916, "global_step": 424737, "epoch": 5117} {"train_loss": -26.572681427001953, "global_step": 424738, "epoch": 5117} {"train_loss": -26.788501739501953, "global_step": 424739, "epoch": 5117} {"train_loss": -26.79790687561035, "global_step": 424740, "epoch": 5117} {"train_loss": -27.081663131713867, "global_step": 424741, "epoch": 5117} {"train_loss": -26.6522159576416, "global_step": 424742, "epoch": 5117} {"train_loss": -26.640869140625, "global_step": 424743, "epoch": 5117} {"train_loss": -26.7587890625, "global_step": 424744, "epoch": 5117} {"train_loss": -27.009693145751953, "global_step": 424745, "epoch": 5117} {"train_loss": -26.87679100036621, "global_step": 424746, "epoch": 5117} {"train_loss": -26.6226863861084, "global_step": 424747, "epoch": 5117} {"train_loss": -26.77191162109375, "global_step": 424748, "epoch": 5117} {"train_loss": -27.268848419189453, "global_step": 424749, "epoch": 5117} {"train_loss": -26.84814453125, "global_step": 424750, "epoch": 5117} {"train_loss": -27.051877975463867, "global_step": 424751, "epoch": 5117} {"train_loss": -26.992420196533203, "global_step": 424752, "epoch": 5117} {"train_loss": -27.115976333618164, "global_step": 424753, "epoch": 5117} {"train_loss": -26.961240768432617, "global_step": 424754, "epoch": 5117} {"train_loss": -27.313329696655273, "global_step": 424755, "epoch": 5117} {"train_loss": -26.988245010375977, "global_step": 424756, "epoch": 5117} {"train_loss": -27.2733097076416, "global_step": 424757, "epoch": 5117} {"train_loss": -26.799163818359375, "global_step": 424758, "epoch": 5117} {"train_loss": -26.585229873657227, "global_step": 424759, "epoch": 5117} {"train_loss": -27.040075302124023, "global_step": 424760, "epoch": 5117} {"train_loss": -26.89436149597168, "global_step": 424761, "epoch": 5117} {"train_loss": -26.8640193939209, "global_step": 424762, "epoch": 5117} {"train_loss": -26.690820693969727, "global_step": 424763, "epoch": 5117} {"train_loss": -27.132001876831055, "global_step": 424764, "epoch": 5117} {"train_loss": -26.53533363342285, "global_step": 424765, "epoch": 5117} {"train_loss": -26.898914337158203, "global_step": 424766, "epoch": 5117} {"train_loss": -27.218021392822266, "global_step": 424767, "epoch": 5117} {"train_loss": -26.160293579101562, "global_step": 424768, "epoch": 5117} {"train_loss": -26.911304473876953, "global_step": 424769, "epoch": 5117} {"train_loss": -27.046558380126953, "global_step": 424770, "epoch": 5117} {"train_loss": -26.665189743041992, "global_step": 424771, "epoch": 5117} {"train_loss": -26.710535049438477, "global_step": 424772, "epoch": 5117} {"train_loss": -27.01997184753418, "global_step": 424773, "epoch": 5117} {"train_loss": -26.393903732299805, "global_step": 424774, "epoch": 5117} {"train_loss": -27.1087646484375, "global_step": 424775, "epoch": 5117} {"train_loss": -26.740537643432617, "global_step": 424776, "epoch": 5117} {"train_loss": -26.615583419799805, "global_step": 424777, "epoch": 5117} {"train_loss": -26.80254554748535, "global_step": 424778, "epoch": 5117} {"train_loss": -27.186100006103516, "global_step": 424779, "epoch": 5117} {"train_loss": -26.631189346313477, "global_step": 424780, "epoch": 5117} {"train_loss": -26.8773250579834, "global_step": 424781, "epoch": 5117} {"train_loss": -26.99647331237793, "global_step": 424782, "epoch": 5117} {"train_loss": -26.754331588745117, "global_step": 424783, "epoch": 5117} {"train_loss": -26.95452880859375, "global_step": 424784, "epoch": 5117} {"train_loss": -27.080310821533203, "global_step": 424785, "epoch": 5117} {"train_loss": -27.046222686767578, "global_step": 424786, "epoch": 5117} {"train_loss": -27.204648971557617, "global_step": 424787, "epoch": 5117} {"train_loss": -26.915287017822266, "global_step": 424788, "epoch": 5117} {"train_loss": -26.907657623291016, "global_step": 424789, "epoch": 5117} {"train_loss": -26.81344985961914, "global_step": 424790, "epoch": 5117} {"train_loss": -26.9277400970459, "global_step": 424791, "epoch": 5117} {"train_loss": -26.602216720581055, "global_step": 424792, "epoch": 5117} {"train_loss": -26.773495455822314, "global_step": 424793, "epoch": 5117, "val_loss": 6898241.0} {"train_loss": -26.05646324157715, "global_step": 424794, "epoch": 5118} {"train_loss": -25.546173095703125, "global_step": 424795, "epoch": 5118} {"train_loss": -26.104419708251953, "global_step": 424796, "epoch": 5118} {"train_loss": -26.699872970581055, "global_step": 424797, "epoch": 5118} {"train_loss": -25.969772338867188, "global_step": 424798, "epoch": 5118} {"train_loss": -26.658538818359375, "global_step": 424799, "epoch": 5118} {"train_loss": -26.566633224487305, "global_step": 424800, "epoch": 5118} {"train_loss": -26.17340087890625, "global_step": 424801, "epoch": 5118} {"train_loss": -26.491626739501953, "global_step": 424802, "epoch": 5118} {"train_loss": -26.350988388061523, "global_step": 424803, "epoch": 5118} {"train_loss": -26.46761131286621, "global_step": 424804, "epoch": 5118} {"train_loss": -26.251956939697266, "global_step": 424805, "epoch": 5118} {"train_loss": -26.502222061157227, "global_step": 424806, "epoch": 5118} {"train_loss": -26.35664176940918, "global_step": 424807, "epoch": 5118} {"train_loss": -26.854581832885742, "global_step": 424808, "epoch": 5118} {"train_loss": -26.773181915283203, "global_step": 424809, "epoch": 5118} {"train_loss": -26.898696899414062, "global_step": 424810, "epoch": 5118} {"train_loss": -26.651519775390625, "global_step": 424811, "epoch": 5118} {"train_loss": -26.74616813659668, "global_step": 424812, "epoch": 5118} {"train_loss": -26.591867446899414, "global_step": 424813, "epoch": 5118} {"train_loss": -26.500385284423828, "global_step": 424814, "epoch": 5118} {"train_loss": -26.913604736328125, "global_step": 424815, "epoch": 5118} {"train_loss": -26.68927574157715, "global_step": 424816, "epoch": 5118} {"train_loss": -26.724462509155273, "global_step": 424817, "epoch": 5118} {"train_loss": -26.84716796875, "global_step": 424818, "epoch": 5118} {"train_loss": -26.311532974243164, "global_step": 424819, "epoch": 5118} {"train_loss": -26.871809005737305, "global_step": 424820, "epoch": 5118} {"train_loss": -26.716144561767578, "global_step": 424821, "epoch": 5118} {"train_loss": -26.54886245727539, "global_step": 424822, "epoch": 5118} {"train_loss": -26.906009674072266, "global_step": 424823, "epoch": 5118} {"train_loss": -26.996435165405273, "global_step": 424824, "epoch": 5118} {"train_loss": -26.885221481323242, "global_step": 424825, "epoch": 5118} {"train_loss": -26.85795021057129, "global_step": 424826, "epoch": 5118} {"train_loss": -26.944177627563477, "global_step": 424827, "epoch": 5118} {"train_loss": -26.697265625, "global_step": 424828, "epoch": 5118} {"train_loss": -27.114831924438477, "global_step": 424829, "epoch": 5118} {"train_loss": -26.681446075439453, "global_step": 424830, "epoch": 5118} {"train_loss": -27.1722354888916, "global_step": 424831, "epoch": 5118} {"train_loss": -26.94807243347168, "global_step": 424832, "epoch": 5118} {"train_loss": -27.1649112701416, "global_step": 424833, "epoch": 5118} {"train_loss": -27.045087814331055, "global_step": 424834, "epoch": 5118} {"train_loss": -27.2810001373291, "global_step": 424835, "epoch": 5118} {"train_loss": -27.079938888549805, "global_step": 424836, "epoch": 5118} {"train_loss": -27.163105010986328, "global_step": 424837, "epoch": 5118} {"train_loss": -26.91582679748535, "global_step": 424838, "epoch": 5118} {"train_loss": -27.084890365600586, "global_step": 424839, "epoch": 5118} {"train_loss": -27.272979736328125, "global_step": 424840, "epoch": 5118} {"train_loss": -26.395206451416016, "global_step": 424841, "epoch": 5118} {"train_loss": -26.3638916015625, "global_step": 424842, "epoch": 5118} {"train_loss": -26.189416885375977, "global_step": 424843, "epoch": 5118} {"train_loss": -26.197101593017578, "global_step": 424844, "epoch": 5118} {"train_loss": -26.5726375579834, "global_step": 424845, "epoch": 5118} {"train_loss": -27.13031578063965, "global_step": 424846, "epoch": 5118} {"train_loss": -26.259632110595703, "global_step": 424847, "epoch": 5118} {"train_loss": -26.571048736572266, "global_step": 424848, "epoch": 5118} {"train_loss": -26.67400550842285, "global_step": 424849, "epoch": 5118} {"train_loss": -26.162952423095703, "global_step": 424850, "epoch": 5118} {"train_loss": -26.02237319946289, "global_step": 424851, "epoch": 5118} {"train_loss": -26.93256187438965, "global_step": 424852, "epoch": 5118} {"train_loss": -26.405370712280273, "global_step": 424853, "epoch": 5118} {"train_loss": -26.348615646362305, "global_step": 424854, "epoch": 5118} {"train_loss": -26.857120513916016, "global_step": 424855, "epoch": 5118} {"train_loss": -26.372827529907227, "global_step": 424856, "epoch": 5118} {"train_loss": -26.126663208007812, "global_step": 424857, "epoch": 5118} {"train_loss": -26.898910522460938, "global_step": 424858, "epoch": 5118} {"train_loss": -26.393692016601562, "global_step": 424859, "epoch": 5118} {"train_loss": -26.825698852539062, "global_step": 424860, "epoch": 5118} {"train_loss": -26.790185928344727, "global_step": 424861, "epoch": 5118} {"train_loss": -26.529956817626953, "global_step": 424862, "epoch": 5118} {"train_loss": -26.782148361206055, "global_step": 424863, "epoch": 5118} {"train_loss": -26.7318115234375, "global_step": 424864, "epoch": 5118} {"train_loss": -26.645782470703125, "global_step": 424865, "epoch": 5118} {"train_loss": -26.54011344909668, "global_step": 424866, "epoch": 5118} {"train_loss": -26.734699249267578, "global_step": 424867, "epoch": 5118} {"train_loss": -26.640356063842773, "global_step": 424868, "epoch": 5118} {"train_loss": -26.64059829711914, "global_step": 424869, "epoch": 5118} {"train_loss": -26.700769424438477, "global_step": 424870, "epoch": 5118} {"train_loss": -26.50681495666504, "global_step": 424871, "epoch": 5118} {"train_loss": -26.52178382873535, "global_step": 424872, "epoch": 5118} {"train_loss": -26.86273765563965, "global_step": 424873, "epoch": 5118} {"train_loss": -26.556875228881836, "global_step": 424874, "epoch": 5118} {"train_loss": -26.76588249206543, "global_step": 424875, "epoch": 5118} {"train_loss": -26.63492046494082, "global_step": 424876, "epoch": 5118, "val_loss": 6864827.0} {"train_loss": -25.659448623657227, "global_step": 424877, "epoch": 5119} {"train_loss": -25.678909301757812, "global_step": 424878, "epoch": 5119} {"train_loss": -25.919055938720703, "global_step": 424879, "epoch": 5119} {"train_loss": -26.56709098815918, "global_step": 424880, "epoch": 5119} {"train_loss": -26.0061092376709, "global_step": 424881, "epoch": 5119} {"train_loss": -26.711645126342773, "global_step": 424882, "epoch": 5119} {"train_loss": -26.455036163330078, "global_step": 424883, "epoch": 5119} {"train_loss": -26.303220748901367, "global_step": 424884, "epoch": 5119} {"train_loss": -26.57306480407715, "global_step": 424885, "epoch": 5119} {"train_loss": -26.24625587463379, "global_step": 424886, "epoch": 5119} {"train_loss": -26.484399795532227, "global_step": 424887, "epoch": 5119} {"train_loss": -26.475635528564453, "global_step": 424888, "epoch": 5119} {"train_loss": -26.6099910736084, "global_step": 424889, "epoch": 5119} {"train_loss": -26.662220001220703, "global_step": 424890, "epoch": 5119} {"train_loss": -26.719833374023438, "global_step": 424891, "epoch": 5119} {"train_loss": -26.036300659179688, "global_step": 424892, "epoch": 5119} {"train_loss": -26.581632614135742, "global_step": 424893, "epoch": 5119} {"train_loss": -26.550134658813477, "global_step": 424894, "epoch": 5119} {"train_loss": -26.5219669342041, "global_step": 424895, "epoch": 5119} {"train_loss": -26.477033615112305, "global_step": 424896, "epoch": 5119} {"train_loss": -26.609174728393555, "global_step": 424897, "epoch": 5119} {"train_loss": -26.56290626525879, "global_step": 424898, "epoch": 5119} {"train_loss": -26.82459831237793, "global_step": 424899, "epoch": 5119} {"train_loss": -26.440479278564453, "global_step": 424900, "epoch": 5119} {"train_loss": -26.461505889892578, "global_step": 424901, "epoch": 5119} {"train_loss": -26.540435791015625, "global_step": 424902, "epoch": 5119} {"train_loss": -26.56961441040039, "global_step": 424903, "epoch": 5119} {"train_loss": -26.965652465820312, "global_step": 424904, "epoch": 5119} {"train_loss": -26.742603302001953, "global_step": 424905, "epoch": 5119} {"train_loss": -26.911020278930664, "global_step": 424906, "epoch": 5119} {"train_loss": -26.764789581298828, "global_step": 424907, "epoch": 5119} {"train_loss": -26.69061279296875, "global_step": 424908, "epoch": 5119} {"train_loss": -26.6844425201416, "global_step": 424909, "epoch": 5119} {"train_loss": -26.762121200561523, "global_step": 424910, "epoch": 5119} {"train_loss": -26.738889694213867, "global_step": 424911, "epoch": 5119} {"train_loss": -26.490331649780273, "global_step": 424912, "epoch": 5119} {"train_loss": -26.859333038330078, "global_step": 424913, "epoch": 5119} {"train_loss": -27.087934494018555, "global_step": 424914, "epoch": 5119} {"train_loss": -26.98837661743164, "global_step": 424915, "epoch": 5119} {"train_loss": -26.7551326751709, "global_step": 424916, "epoch": 5119} {"train_loss": -26.900684356689453, "global_step": 424917, "epoch": 5119} {"train_loss": -26.698944091796875, "global_step": 424918, "epoch": 5119} {"train_loss": -26.740116119384766, "global_step": 424919, "epoch": 5119} {"train_loss": -27.089460372924805, "global_step": 424920, "epoch": 5119} {"train_loss": -26.635669708251953, "global_step": 424921, "epoch": 5119} {"train_loss": -26.454870223999023, "global_step": 424922, "epoch": 5119} {"train_loss": -27.248706817626953, "global_step": 424923, "epoch": 5119} {"train_loss": -26.631805419921875, "global_step": 424924, "epoch": 5119} {"train_loss": -26.81538200378418, "global_step": 424925, "epoch": 5119} {"train_loss": -27.07158851623535, "global_step": 424926, "epoch": 5119} {"train_loss": -26.7558536529541, "global_step": 424927, "epoch": 5119} {"train_loss": -26.358325958251953, "global_step": 424928, "epoch": 5119} {"train_loss": -26.9157772064209, "global_step": 424929, "epoch": 5119} {"train_loss": -26.78816032409668, "global_step": 424930, "epoch": 5119} {"train_loss": -27.170948028564453, "global_step": 424931, "epoch": 5119} {"train_loss": -26.782705307006836, "global_step": 424932, "epoch": 5119} {"train_loss": -26.886606216430664, "global_step": 424933, "epoch": 5119} {"train_loss": -26.6875, "global_step": 424934, "epoch": 5119} {"train_loss": -26.792205810546875, "global_step": 424935, "epoch": 5119} {"train_loss": -26.949865341186523, "global_step": 424936, "epoch": 5119} {"train_loss": -27.0731258392334, "global_step": 424937, "epoch": 5119} {"train_loss": -26.768091201782227, "global_step": 424938, "epoch": 5119} {"train_loss": -26.857812881469727, "global_step": 424939, "epoch": 5119} {"train_loss": -27.252965927124023, "global_step": 424940, "epoch": 5119} {"train_loss": -26.4698543548584, "global_step": 424941, "epoch": 5119} {"train_loss": -26.7271728515625, "global_step": 424942, "epoch": 5119} {"train_loss": -26.439468383789062, "global_step": 424943, "epoch": 5119} {"train_loss": -26.772083282470703, "global_step": 424944, "epoch": 5119} {"train_loss": -26.496490478515625, "global_step": 424945, "epoch": 5119} {"train_loss": -26.742706298828125, "global_step": 424946, "epoch": 5119} {"train_loss": -26.44841957092285, "global_step": 424947, "epoch": 5119} {"train_loss": -26.859699249267578, "global_step": 424948, "epoch": 5119} {"train_loss": -27.321043014526367, "global_step": 424949, "epoch": 5119} {"train_loss": -27.1866455078125, "global_step": 424950, "epoch": 5119} {"train_loss": -26.6801700592041, "global_step": 424951, "epoch": 5119} {"train_loss": -27.094465255737305, "global_step": 424952, "epoch": 5119} {"train_loss": -26.793920516967773, "global_step": 424953, "epoch": 5119} {"train_loss": -26.464263916015625, "global_step": 424954, "epoch": 5119} {"train_loss": -26.9415225982666, "global_step": 424955, "epoch": 5119} {"train_loss": -26.747446060180664, "global_step": 424956, "epoch": 5119} {"train_loss": -26.132455825805664, "global_step": 424957, "epoch": 5119} {"train_loss": -26.083999633789062, "global_step": 424958, "epoch": 5119} {"train_loss": -26.63999120873141, "global_step": 424959, "epoch": 5119, "val_loss": 6937295.0} {"train_loss": -26.20306396484375, "global_step": 424960, "epoch": 5120} {"train_loss": -25.479421615600586, "global_step": 424961, "epoch": 5120} {"train_loss": -26.097217559814453, "global_step": 424962, "epoch": 5120} {"train_loss": -25.95991325378418, "global_step": 424963, "epoch": 5120} {"train_loss": -26.242284774780273, "global_step": 424964, "epoch": 5120} {"train_loss": -26.1072998046875, "global_step": 424965, "epoch": 5120} {"train_loss": -25.824018478393555, "global_step": 424966, "epoch": 5120} {"train_loss": -26.146162033081055, "global_step": 424967, "epoch": 5120} {"train_loss": -25.892684936523438, "global_step": 424968, "epoch": 5120} {"train_loss": -26.24224853515625, "global_step": 424969, "epoch": 5120} {"train_loss": -26.504064559936523, "global_step": 424970, "epoch": 5120} {"train_loss": -26.452451705932617, "global_step": 424971, "epoch": 5120} {"train_loss": -26.62871742248535, "global_step": 424972, "epoch": 5120} {"train_loss": -26.3441219329834, "global_step": 424973, "epoch": 5120} {"train_loss": -26.556537628173828, "global_step": 424974, "epoch": 5120} {"train_loss": -26.351551055908203, "global_step": 424975, "epoch": 5120} {"train_loss": -26.277362823486328, "global_step": 424976, "epoch": 5120} {"train_loss": -26.67923927307129, "global_step": 424977, "epoch": 5120} {"train_loss": -26.689273834228516, "global_step": 424978, "epoch": 5120} {"train_loss": -26.387800216674805, "global_step": 424979, "epoch": 5120} {"train_loss": -26.584985733032227, "global_step": 424980, "epoch": 5120} {"train_loss": -26.64792823791504, "global_step": 424981, "epoch": 5120} {"train_loss": -26.632421493530273, "global_step": 424982, "epoch": 5120} {"train_loss": -26.55057144165039, "global_step": 424983, "epoch": 5120} {"train_loss": -26.692663192749023, "global_step": 424984, "epoch": 5120} {"train_loss": -26.556385040283203, "global_step": 424985, "epoch": 5120} {"train_loss": -26.687469482421875, "global_step": 424986, "epoch": 5120} {"train_loss": -26.447168350219727, "global_step": 424987, "epoch": 5120} {"train_loss": -26.581302642822266, "global_step": 424988, "epoch": 5120} {"train_loss": -26.677587509155273, "global_step": 424989, "epoch": 5120} {"train_loss": -26.750110626220703, "global_step": 424990, "epoch": 5120} {"train_loss": -26.763452529907227, "global_step": 424991, "epoch": 5120} {"train_loss": -26.935571670532227, "global_step": 424992, "epoch": 5120} {"train_loss": -26.607929229736328, "global_step": 424993, "epoch": 5120} {"train_loss": -26.76368522644043, "global_step": 424994, "epoch": 5120} {"train_loss": -26.892353057861328, "global_step": 424995, "epoch": 5120} {"train_loss": -26.817001342773438, "global_step": 424996, "epoch": 5120} {"train_loss": -27.23195457458496, "global_step": 424997, "epoch": 5120} {"train_loss": -26.783655166625977, "global_step": 424998, "epoch": 5120} {"train_loss": -26.915388107299805, "global_step": 424999, "epoch": 5120} {"train_loss": -26.850873947143555, "global_step": 425000, "epoch": 5120} {"train_loss": -26.997629165649414, "global_step": 425001, "epoch": 5120} {"train_loss": -26.8306941986084, "global_step": 425002, "epoch": 5120} {"train_loss": -26.916330337524414, "global_step": 425003, "epoch": 5120} {"train_loss": -26.73495864868164, "global_step": 425004, "epoch": 5120} {"train_loss": -26.841449737548828, "global_step": 425005, "epoch": 5120} {"train_loss": -26.97687339782715, "global_step": 425006, "epoch": 5120} {"train_loss": -27.040435791015625, "global_step": 425007, "epoch": 5120} {"train_loss": -26.992605209350586, "global_step": 425008, "epoch": 5120} {"train_loss": -27.21868896484375, "global_step": 425009, "epoch": 5120} {"train_loss": -26.94879722595215, "global_step": 425010, "epoch": 5120} {"train_loss": -26.674560546875, "global_step": 425011, "epoch": 5120} {"train_loss": -26.8898868560791, "global_step": 425012, "epoch": 5120} {"train_loss": -27.0853214263916, "global_step": 425013, "epoch": 5120} {"train_loss": -27.068115234375, "global_step": 425014, "epoch": 5120} {"train_loss": -27.162500381469727, "global_step": 425015, "epoch": 5120} {"train_loss": -27.068525314331055, "global_step": 425016, "epoch": 5120} {"train_loss": -26.682861328125, "global_step": 425017, "epoch": 5120} {"train_loss": -26.81843376159668, "global_step": 425018, "epoch": 5120} {"train_loss": -26.479318618774414, "global_step": 425019, "epoch": 5120} {"train_loss": -26.464221954345703, "global_step": 425020, "epoch": 5120} {"train_loss": -26.67116355895996, "global_step": 425021, "epoch": 5120} {"train_loss": -26.60572624206543, "global_step": 425022, "epoch": 5120} {"train_loss": -27.04868507385254, "global_step": 425023, "epoch": 5120} {"train_loss": -26.604589462280273, "global_step": 425024, "epoch": 5120} {"train_loss": -26.603376388549805, "global_step": 425025, "epoch": 5120} {"train_loss": -26.89082908630371, "global_step": 425026, "epoch": 5120} {"train_loss": -26.71979331970215, "global_step": 425027, "epoch": 5120} {"train_loss": -26.758405685424805, "global_step": 425028, "epoch": 5120} {"train_loss": -26.876272201538086, "global_step": 425029, "epoch": 5120} {"train_loss": -26.8948974609375, "global_step": 425030, "epoch": 5120} {"train_loss": -27.04718017578125, "global_step": 425031, "epoch": 5120} {"train_loss": -26.830957412719727, "global_step": 425032, "epoch": 5120} {"train_loss": -26.49481773376465, "global_step": 425033, "epoch": 5120} {"train_loss": -26.70224380493164, "global_step": 425034, "epoch": 5120} {"train_loss": -26.937376022338867, "global_step": 425035, "epoch": 5120} {"train_loss": -27.279678344726562, "global_step": 425036, "epoch": 5120} {"train_loss": -26.59528160095215, "global_step": 425037, "epoch": 5120} {"train_loss": -26.645862579345703, "global_step": 425038, "epoch": 5120} {"train_loss": -26.750341415405273, "global_step": 425039, "epoch": 5120} {"train_loss": -26.7867374420166, "global_step": 425040, "epoch": 5120} {"train_loss": -26.83687400817871, "global_step": 425041, "epoch": 5120} {"train_loss": -26.6731770986534, "global_step": 425042, "epoch": 5120, "val_loss": 6878005.5} {"train_loss": -25.49052619934082, "global_step": 425043, "epoch": 5121} {"train_loss": -26.180280685424805, "global_step": 425044, "epoch": 5121} {"train_loss": -25.839773178100586, "global_step": 425045, "epoch": 5121} {"train_loss": -26.493444442749023, "global_step": 425046, "epoch": 5121} {"train_loss": -26.463703155517578, "global_step": 425047, "epoch": 5121} {"train_loss": -26.16071891784668, "global_step": 425048, "epoch": 5121} {"train_loss": -26.448530197143555, "global_step": 425049, "epoch": 5121} {"train_loss": -26.218107223510742, "global_step": 425050, "epoch": 5121} {"train_loss": -26.168127059936523, "global_step": 425051, "epoch": 5121} {"train_loss": -26.48225212097168, "global_step": 425052, "epoch": 5121} {"train_loss": -26.541446685791016, "global_step": 425053, "epoch": 5121} {"train_loss": -26.042539596557617, "global_step": 425054, "epoch": 5121} {"train_loss": -26.39163589477539, "global_step": 425055, "epoch": 5121} {"train_loss": -26.564533233642578, "global_step": 425056, "epoch": 5121} {"train_loss": -26.411413192749023, "global_step": 425057, "epoch": 5121} {"train_loss": -26.637495040893555, "global_step": 425058, "epoch": 5121} {"train_loss": -26.28753662109375, "global_step": 425059, "epoch": 5121} {"train_loss": -26.525165557861328, "global_step": 425060, "epoch": 5121} {"train_loss": -26.78154945373535, "global_step": 425061, "epoch": 5121} {"train_loss": -26.27777099609375, "global_step": 425062, "epoch": 5121} {"train_loss": -26.675495147705078, "global_step": 425063, "epoch": 5121} {"train_loss": -26.953216552734375, "global_step": 425064, "epoch": 5121} {"train_loss": -26.65461540222168, "global_step": 425065, "epoch": 5121} {"train_loss": -26.762115478515625, "global_step": 425066, "epoch": 5121} {"train_loss": -26.32209587097168, "global_step": 425067, "epoch": 5121} {"train_loss": -26.80244255065918, "global_step": 425068, "epoch": 5121} {"train_loss": -26.891754150390625, "global_step": 425069, "epoch": 5121} {"train_loss": -26.8580379486084, "global_step": 425070, "epoch": 5121} {"train_loss": -26.60697364807129, "global_step": 425071, "epoch": 5121} {"train_loss": -26.976720809936523, "global_step": 425072, "epoch": 5121} {"train_loss": -26.365583419799805, "global_step": 425073, "epoch": 5121} {"train_loss": -26.87879753112793, "global_step": 425074, "epoch": 5121} {"train_loss": -26.754804611206055, "global_step": 425075, "epoch": 5121} {"train_loss": -27.14600944519043, "global_step": 425076, "epoch": 5121} {"train_loss": -26.557910919189453, "global_step": 425077, "epoch": 5121} {"train_loss": -26.927265167236328, "global_step": 425078, "epoch": 5121} {"train_loss": -26.891454696655273, "global_step": 425079, "epoch": 5121} {"train_loss": -26.84412956237793, "global_step": 425080, "epoch": 5121} {"train_loss": -27.03474235534668, "global_step": 425081, "epoch": 5121} {"train_loss": -27.00201416015625, "global_step": 425082, "epoch": 5121} {"train_loss": -26.702945709228516, "global_step": 425083, "epoch": 5121} {"train_loss": -27.21573829650879, "global_step": 425084, "epoch": 5121} {"train_loss": -26.7916202545166, "global_step": 425085, "epoch": 5121} {"train_loss": -26.931833267211914, "global_step": 425086, "epoch": 5121} {"train_loss": -26.716962814331055, "global_step": 425087, "epoch": 5121} {"train_loss": -26.7340145111084, "global_step": 425088, "epoch": 5121} {"train_loss": -26.459766387939453, "global_step": 425089, "epoch": 5121} {"train_loss": -26.847951889038086, "global_step": 425090, "epoch": 5121} {"train_loss": -27.04305076599121, "global_step": 425091, "epoch": 5121} {"train_loss": -26.761798858642578, "global_step": 425092, "epoch": 5121} {"train_loss": -26.996946334838867, "global_step": 425093, "epoch": 5121} {"train_loss": -26.968128204345703, "global_step": 425094, "epoch": 5121} {"train_loss": -26.917016983032227, "global_step": 425095, "epoch": 5121} {"train_loss": -26.84160804748535, "global_step": 425096, "epoch": 5121} {"train_loss": -27.21720314025879, "global_step": 425097, "epoch": 5121} {"train_loss": -27.22954750061035, "global_step": 425098, "epoch": 5121} {"train_loss": -26.932300567626953, "global_step": 425099, "epoch": 5121} {"train_loss": -27.056262969970703, "global_step": 425100, "epoch": 5121} {"train_loss": -26.999670028686523, "global_step": 425101, "epoch": 5121} {"train_loss": -26.9990177154541, "global_step": 425102, "epoch": 5121} {"train_loss": -26.9727783203125, "global_step": 425103, "epoch": 5121} {"train_loss": -27.070199966430664, "global_step": 425104, "epoch": 5121} {"train_loss": -26.83144187927246, "global_step": 425105, "epoch": 5121} {"train_loss": -26.94197654724121, "global_step": 425106, "epoch": 5121} {"train_loss": -26.545278549194336, "global_step": 425107, "epoch": 5121} {"train_loss": -26.51580810546875, "global_step": 425108, "epoch": 5121} {"train_loss": -26.80153465270996, "global_step": 425109, "epoch": 5121} {"train_loss": -26.73175048828125, "global_step": 425110, "epoch": 5121} {"train_loss": -27.31062889099121, "global_step": 425111, "epoch": 5121} {"train_loss": -26.839218139648438, "global_step": 425112, "epoch": 5121} {"train_loss": -26.86939811706543, "global_step": 425113, "epoch": 5121} {"train_loss": -26.782434463500977, "global_step": 425114, "epoch": 5121} {"train_loss": -26.998273849487305, "global_step": 425115, "epoch": 5121} {"train_loss": -26.830127716064453, "global_step": 425116, "epoch": 5121} {"train_loss": -26.9886417388916, "global_step": 425117, "epoch": 5121} {"train_loss": -26.851652145385742, "global_step": 425118, "epoch": 5121} {"train_loss": -27.04224967956543, "global_step": 425119, "epoch": 5121} {"train_loss": -26.75577735900879, "global_step": 425120, "epoch": 5121} {"train_loss": -26.902997970581055, "global_step": 425121, "epoch": 5121} {"train_loss": -27.12558937072754, "global_step": 425122, "epoch": 5121} {"train_loss": -27.303424835205078, "global_step": 425123, "epoch": 5121} {"train_loss": -26.85733413696289, "global_step": 425124, "epoch": 5121} {"train_loss": -26.75293030796281, "global_step": 425125, "epoch": 5121, "val_loss": 6864227.0} {"train_loss": -26.518695831298828, "global_step": 425126, "epoch": 5122} {"train_loss": -26.46443748474121, "global_step": 425127, "epoch": 5122} {"train_loss": -26.456480026245117, "global_step": 425128, "epoch": 5122} {"train_loss": -26.408613204956055, "global_step": 425129, "epoch": 5122} {"train_loss": -26.542795181274414, "global_step": 425130, "epoch": 5122} {"train_loss": -26.580310821533203, "global_step": 425131, "epoch": 5122} {"train_loss": -26.248884201049805, "global_step": 425132, "epoch": 5122} {"train_loss": -26.701370239257812, "global_step": 425133, "epoch": 5122} {"train_loss": -26.544103622436523, "global_step": 425134, "epoch": 5122} {"train_loss": -26.620264053344727, "global_step": 425135, "epoch": 5122} {"train_loss": -26.025156021118164, "global_step": 425136, "epoch": 5122} {"train_loss": -26.24995231628418, "global_step": 425137, "epoch": 5122} {"train_loss": -26.81119728088379, "global_step": 425138, "epoch": 5122} {"train_loss": -26.353906631469727, "global_step": 425139, "epoch": 5122} {"train_loss": -26.678430557250977, "global_step": 425140, "epoch": 5122} {"train_loss": -25.878772735595703, "global_step": 425141, "epoch": 5122} {"train_loss": -26.5772647857666, "global_step": 425142, "epoch": 5122} {"train_loss": -26.28757667541504, "global_step": 425143, "epoch": 5122} {"train_loss": -26.591718673706055, "global_step": 425144, "epoch": 5122} {"train_loss": -26.608325958251953, "global_step": 425145, "epoch": 5122} {"train_loss": -26.960554122924805, "global_step": 425146, "epoch": 5122} {"train_loss": -26.58744239807129, "global_step": 425147, "epoch": 5122} {"train_loss": -26.78458595275879, "global_step": 425148, "epoch": 5122} {"train_loss": -26.460636138916016, "global_step": 425149, "epoch": 5122} {"train_loss": -27.093427658081055, "global_step": 425150, "epoch": 5122} {"train_loss": -26.83660888671875, "global_step": 425151, "epoch": 5122} {"train_loss": -26.910085678100586, "global_step": 425152, "epoch": 5122} {"train_loss": -26.771860122680664, "global_step": 425153, "epoch": 5122} {"train_loss": -27.10125732421875, "global_step": 425154, "epoch": 5122} {"train_loss": -26.756433486938477, "global_step": 425155, "epoch": 5122} {"train_loss": -27.127012252807617, "global_step": 425156, "epoch": 5122} {"train_loss": -26.565282821655273, "global_step": 425157, "epoch": 5122} {"train_loss": -26.91025161743164, "global_step": 425158, "epoch": 5122} {"train_loss": -26.681344985961914, "global_step": 425159, "epoch": 5122} {"train_loss": -26.83448600769043, "global_step": 425160, "epoch": 5122} {"train_loss": -26.530139923095703, "global_step": 425161, "epoch": 5122} {"train_loss": -26.965070724487305, "global_step": 425162, "epoch": 5122} {"train_loss": -27.148197174072266, "global_step": 425163, "epoch": 5122} {"train_loss": -26.614892959594727, "global_step": 425164, "epoch": 5122} {"train_loss": -26.9757137298584, "global_step": 425165, "epoch": 5122} {"train_loss": -27.107685089111328, "global_step": 425166, "epoch": 5122} {"train_loss": -26.794530868530273, "global_step": 425167, "epoch": 5122} {"train_loss": -27.127241134643555, "global_step": 425168, "epoch": 5122} {"train_loss": -26.500268936157227, "global_step": 425169, "epoch": 5122} {"train_loss": -26.809619903564453, "global_step": 425170, "epoch": 5122} {"train_loss": -27.07480812072754, "global_step": 425171, "epoch": 5122} {"train_loss": -26.503263473510742, "global_step": 425172, "epoch": 5122} {"train_loss": -27.00204849243164, "global_step": 425173, "epoch": 5122} {"train_loss": -26.7888240814209, "global_step": 425174, "epoch": 5122} {"train_loss": -26.971515655517578, "global_step": 425175, "epoch": 5122} {"train_loss": -26.991552352905273, "global_step": 425176, "epoch": 5122} {"train_loss": -26.857419967651367, "global_step": 425177, "epoch": 5122} {"train_loss": -26.78619384765625, "global_step": 425178, "epoch": 5122} {"train_loss": -26.76079750061035, "global_step": 425179, "epoch": 5122} {"train_loss": -26.9819278717041, "global_step": 425180, "epoch": 5122} {"train_loss": -27.061248779296875, "global_step": 425181, "epoch": 5122} {"train_loss": -26.895200729370117, "global_step": 425182, "epoch": 5122} {"train_loss": -27.345996856689453, "global_step": 425183, "epoch": 5122} {"train_loss": -27.016992568969727, "global_step": 425184, "epoch": 5122} {"train_loss": -27.008886337280273, "global_step": 425185, "epoch": 5122} {"train_loss": -26.973581314086914, "global_step": 425186, "epoch": 5122} {"train_loss": -26.703510284423828, "global_step": 425187, "epoch": 5122} {"train_loss": -26.980077743530273, "global_step": 425188, "epoch": 5122} {"train_loss": -27.150665283203125, "global_step": 425189, "epoch": 5122} {"train_loss": -27.056293487548828, "global_step": 425190, "epoch": 5122} {"train_loss": -27.162328720092773, "global_step": 425191, "epoch": 5122} {"train_loss": -26.960988998413086, "global_step": 425192, "epoch": 5122} {"train_loss": -27.059995651245117, "global_step": 425193, "epoch": 5122} {"train_loss": -27.1701602935791, "global_step": 425194, "epoch": 5122} {"train_loss": -26.702014923095703, "global_step": 425195, "epoch": 5122} {"train_loss": -27.17268180847168, "global_step": 425196, "epoch": 5122} {"train_loss": -26.62656021118164, "global_step": 425197, "epoch": 5122} {"train_loss": -27.13705825805664, "global_step": 425198, "epoch": 5122} {"train_loss": -26.885679244995117, "global_step": 425199, "epoch": 5122} {"train_loss": -26.554025650024414, "global_step": 425200, "epoch": 5122} {"train_loss": -26.909582138061523, "global_step": 425201, "epoch": 5122} {"train_loss": -26.395349502563477, "global_step": 425202, "epoch": 5122} {"train_loss": -26.610822677612305, "global_step": 425203, "epoch": 5122} {"train_loss": -26.809858322143555, "global_step": 425204, "epoch": 5122} {"train_loss": -26.578638076782227, "global_step": 425205, "epoch": 5122} {"train_loss": -26.33942222595215, "global_step": 425206, "epoch": 5122} {"train_loss": -26.424589157104492, "global_step": 425207, "epoch": 5122} {"train_loss": -26.747277156416192, "global_step": 425208, "epoch": 5122, "val_loss": 6988710.0} {"train_loss": -25.692428588867188, "global_step": 425209, "epoch": 5123} {"train_loss": -25.44846534729004, "global_step": 425210, "epoch": 5123} {"train_loss": -26.021240234375, "global_step": 425211, "epoch": 5123} {"train_loss": -25.997577667236328, "global_step": 425212, "epoch": 5123} {"train_loss": -26.010549545288086, "global_step": 425213, "epoch": 5123} {"train_loss": -25.9733829498291, "global_step": 425214, "epoch": 5123} {"train_loss": -25.927087783813477, "global_step": 425215, "epoch": 5123} {"train_loss": -26.280353546142578, "global_step": 425216, "epoch": 5123} {"train_loss": -26.101837158203125, "global_step": 425217, "epoch": 5123} {"train_loss": -26.049365997314453, "global_step": 425218, "epoch": 5123} {"train_loss": -26.360631942749023, "global_step": 425219, "epoch": 5123} {"train_loss": -25.91334342956543, "global_step": 425220, "epoch": 5123} {"train_loss": -26.56495475769043, "global_step": 425221, "epoch": 5123} {"train_loss": -26.28175926208496, "global_step": 425222, "epoch": 5123} {"train_loss": -26.639745712280273, "global_step": 425223, "epoch": 5123} {"train_loss": -26.0845947265625, "global_step": 425224, "epoch": 5123} {"train_loss": -26.424474716186523, "global_step": 425225, "epoch": 5123} {"train_loss": -26.41249656677246, "global_step": 425226, "epoch": 5123} {"train_loss": -27.00984764099121, "global_step": 425227, "epoch": 5123} {"train_loss": -26.532663345336914, "global_step": 425228, "epoch": 5123} {"train_loss": -26.38532829284668, "global_step": 425229, "epoch": 5123} {"train_loss": -26.61347007751465, "global_step": 425230, "epoch": 5123} {"train_loss": -26.706640243530273, "global_step": 425231, "epoch": 5123} {"train_loss": -26.94080924987793, "global_step": 425232, "epoch": 5123} {"train_loss": -26.8359375, "global_step": 425233, "epoch": 5123} {"train_loss": -26.4859619140625, "global_step": 425234, "epoch": 5123} {"train_loss": -26.673507690429688, "global_step": 425235, "epoch": 5123} {"train_loss": -26.629180908203125, "global_step": 425236, "epoch": 5123} {"train_loss": -26.675973892211914, "global_step": 425237, "epoch": 5123} {"train_loss": -26.582386016845703, "global_step": 425238, "epoch": 5123} {"train_loss": -26.7393798828125, "global_step": 425239, "epoch": 5123} {"train_loss": -26.9360408782959, "global_step": 425240, "epoch": 5123} {"train_loss": -26.737051010131836, "global_step": 425241, "epoch": 5123} {"train_loss": -26.77602195739746, "global_step": 425242, "epoch": 5123} {"train_loss": -27.226099014282227, "global_step": 425243, "epoch": 5123} {"train_loss": -26.956348419189453, "global_step": 425244, "epoch": 5123} {"train_loss": -27.08955192565918, "global_step": 425245, "epoch": 5123} {"train_loss": -27.306777954101562, "global_step": 425246, "epoch": 5123} {"train_loss": -26.826263427734375, "global_step": 425247, "epoch": 5123} {"train_loss": -26.757848739624023, "global_step": 425248, "epoch": 5123} {"train_loss": -27.23586082458496, "global_step": 425249, "epoch": 5123} {"train_loss": -26.56207847595215, "global_step": 425250, "epoch": 5123} {"train_loss": -26.945600509643555, "global_step": 425251, "epoch": 5123} {"train_loss": -27.092432022094727, "global_step": 425252, "epoch": 5123} {"train_loss": -27.188922882080078, "global_step": 425253, "epoch": 5123} {"train_loss": -27.00066566467285, "global_step": 425254, "epoch": 5123} {"train_loss": -27.094297409057617, "global_step": 425255, "epoch": 5123} {"train_loss": -27.01934242248535, "global_step": 425256, "epoch": 5123} {"train_loss": -27.127222061157227, "global_step": 425257, "epoch": 5123} {"train_loss": -26.99733543395996, "global_step": 425258, "epoch": 5123} {"train_loss": -26.8373966217041, "global_step": 425259, "epoch": 5123} {"train_loss": -26.880136489868164, "global_step": 425260, "epoch": 5123} {"train_loss": -27.20659828186035, "global_step": 425261, "epoch": 5123} {"train_loss": -26.81621742248535, "global_step": 425262, "epoch": 5123} {"train_loss": -26.67145347595215, "global_step": 425263, "epoch": 5123} {"train_loss": -27.3819580078125, "global_step": 425264, "epoch": 5123} {"train_loss": -26.537565231323242, "global_step": 425265, "epoch": 5123} {"train_loss": -26.080602645874023, "global_step": 425266, "epoch": 5123} {"train_loss": -25.96677589416504, "global_step": 425267, "epoch": 5123} {"train_loss": -26.4233341217041, "global_step": 425268, "epoch": 5123} {"train_loss": -26.88947105407715, "global_step": 425269, "epoch": 5123} {"train_loss": -26.293806076049805, "global_step": 425270, "epoch": 5123} {"train_loss": -26.899118423461914, "global_step": 425271, "epoch": 5123} {"train_loss": -26.67119789123535, "global_step": 425272, "epoch": 5123} {"train_loss": -26.513586044311523, "global_step": 425273, "epoch": 5123} {"train_loss": -26.701465606689453, "global_step": 425274, "epoch": 5123} {"train_loss": -26.905593872070312, "global_step": 425275, "epoch": 5123} {"train_loss": -26.607431411743164, "global_step": 425276, "epoch": 5123} {"train_loss": -26.78546714782715, "global_step": 425277, "epoch": 5123} {"train_loss": -26.79375648498535, "global_step": 425278, "epoch": 5123} {"train_loss": -26.767892837524414, "global_step": 425279, "epoch": 5123} {"train_loss": -26.715377807617188, "global_step": 425280, "epoch": 5123} {"train_loss": -26.60593032836914, "global_step": 425281, "epoch": 5123} {"train_loss": -26.777164459228516, "global_step": 425282, "epoch": 5123} {"train_loss": -26.97951316833496, "global_step": 425283, "epoch": 5123} {"train_loss": -26.844989776611328, "global_step": 425284, "epoch": 5123} {"train_loss": -26.892078399658203, "global_step": 425285, "epoch": 5123} {"train_loss": -26.84473991394043, "global_step": 425286, "epoch": 5123} {"train_loss": -27.159692764282227, "global_step": 425287, "epoch": 5123} {"train_loss": -26.664947509765625, "global_step": 425288, "epoch": 5123} {"train_loss": -27.00754165649414, "global_step": 425289, "epoch": 5123} {"train_loss": -26.987640380859375, "global_step": 425290, "epoch": 5123} {"train_loss": -26.64023603875953, "global_step": 425291, "epoch": 5123, "val_loss": 6933193.0} {"train_loss": -26.488752365112305, "global_step": 425292, "epoch": 5124} {"train_loss": -26.0587215423584, "global_step": 425293, "epoch": 5124} {"train_loss": -26.644147872924805, "global_step": 425294, "epoch": 5124} {"train_loss": -26.270709991455078, "global_step": 425295, "epoch": 5124} {"train_loss": -25.986846923828125, "global_step": 425296, "epoch": 5124} {"train_loss": -26.172948837280273, "global_step": 425297, "epoch": 5124} {"train_loss": -26.370635986328125, "global_step": 425298, "epoch": 5124} {"train_loss": -26.941272735595703, "global_step": 425299, "epoch": 5124} {"train_loss": -26.607452392578125, "global_step": 425300, "epoch": 5124} {"train_loss": -26.538284301757812, "global_step": 425301, "epoch": 5124} {"train_loss": -26.810087203979492, "global_step": 425302, "epoch": 5124} {"train_loss": -26.676923751831055, "global_step": 425303, "epoch": 5124} {"train_loss": -26.559417724609375, "global_step": 425304, "epoch": 5124} {"train_loss": -26.29804801940918, "global_step": 425305, "epoch": 5124} {"train_loss": -26.07562255859375, "global_step": 425306, "epoch": 5124} {"train_loss": -26.420780181884766, "global_step": 425307, "epoch": 5124} {"train_loss": -26.979633331298828, "global_step": 425308, "epoch": 5124} {"train_loss": -26.593769073486328, "global_step": 425309, "epoch": 5124} {"train_loss": -26.3408260345459, "global_step": 425310, "epoch": 5124} {"train_loss": -26.86807632446289, "global_step": 425311, "epoch": 5124} {"train_loss": -26.964263916015625, "global_step": 425312, "epoch": 5124} {"train_loss": -27.27687644958496, "global_step": 425313, "epoch": 5124} {"train_loss": -27.020559310913086, "global_step": 425314, "epoch": 5124} {"train_loss": -26.62078857421875, "global_step": 425315, "epoch": 5124} {"train_loss": -26.885303497314453, "global_step": 425316, "epoch": 5124} {"train_loss": -26.775100708007812, "global_step": 425317, "epoch": 5124} {"train_loss": -26.752283096313477, "global_step": 425318, "epoch": 5124} {"train_loss": -27.08045768737793, "global_step": 425319, "epoch": 5124} {"train_loss": -26.871362686157227, "global_step": 425320, "epoch": 5124} {"train_loss": -26.567548751831055, "global_step": 425321, "epoch": 5124} {"train_loss": -26.75634765625, "global_step": 425322, "epoch": 5124} {"train_loss": -26.81343650817871, "global_step": 425323, "epoch": 5124} {"train_loss": -26.916913986206055, "global_step": 425324, "epoch": 5124} {"train_loss": -26.958179473876953, "global_step": 425325, "epoch": 5124} {"train_loss": -26.699451446533203, "global_step": 425326, "epoch": 5124} {"train_loss": -26.668237686157227, "global_step": 425327, "epoch": 5124} {"train_loss": -26.852222442626953, "global_step": 425328, "epoch": 5124} {"train_loss": -27.091251373291016, "global_step": 425329, "epoch": 5124} {"train_loss": -25.964834213256836, "global_step": 425330, "epoch": 5124} {"train_loss": -26.64068031311035, "global_step": 425331, "epoch": 5124} {"train_loss": -26.6507625579834, "global_step": 425332, "epoch": 5124} {"train_loss": -26.582014083862305, "global_step": 425333, "epoch": 5124} {"train_loss": -26.793384552001953, "global_step": 425334, "epoch": 5124} {"train_loss": -26.794763565063477, "global_step": 425335, "epoch": 5124} {"train_loss": -26.813159942626953, "global_step": 425336, "epoch": 5124} {"train_loss": -26.911848068237305, "global_step": 425337, "epoch": 5124} {"train_loss": -26.95270347595215, "global_step": 425338, "epoch": 5124} {"train_loss": -26.81070899963379, "global_step": 425339, "epoch": 5124} {"train_loss": -27.005945205688477, "global_step": 425340, "epoch": 5124} {"train_loss": -27.10321044921875, "global_step": 425341, "epoch": 5124} {"train_loss": -27.008115768432617, "global_step": 425342, "epoch": 5124} {"train_loss": -26.630115509033203, "global_step": 425343, "epoch": 5124} {"train_loss": -27.2230281829834, "global_step": 425344, "epoch": 5124} {"train_loss": -26.972248077392578, "global_step": 425345, "epoch": 5124} {"train_loss": -27.057138442993164, "global_step": 425346, "epoch": 5124} {"train_loss": -26.98199462890625, "global_step": 425347, "epoch": 5124} {"train_loss": -26.719959259033203, "global_step": 425348, "epoch": 5124} {"train_loss": -26.534046173095703, "global_step": 425349, "epoch": 5124} {"train_loss": -26.6776123046875, "global_step": 425350, "epoch": 5124} {"train_loss": -26.79163932800293, "global_step": 425351, "epoch": 5124} {"train_loss": -27.06646156311035, "global_step": 425352, "epoch": 5124} {"train_loss": -27.059558868408203, "global_step": 425353, "epoch": 5124} {"train_loss": -26.943653106689453, "global_step": 425354, "epoch": 5124} {"train_loss": -26.70627212524414, "global_step": 425355, "epoch": 5124} {"train_loss": -27.178625106811523, "global_step": 425356, "epoch": 5124} {"train_loss": -26.948705673217773, "global_step": 425357, "epoch": 5124} {"train_loss": -27.243738174438477, "global_step": 425358, "epoch": 5124} {"train_loss": -26.577157974243164, "global_step": 425359, "epoch": 5124} {"train_loss": -26.905536651611328, "global_step": 425360, "epoch": 5124} {"train_loss": -26.965116500854492, "global_step": 425361, "epoch": 5124} {"train_loss": -26.625940322875977, "global_step": 425362, "epoch": 5124} {"train_loss": -27.2565975189209, "global_step": 425363, "epoch": 5124} {"train_loss": -27.09224510192871, "global_step": 425364, "epoch": 5124} {"train_loss": -26.92681312561035, "global_step": 425365, "epoch": 5124} {"train_loss": -27.2265567779541, "global_step": 425366, "epoch": 5124} {"train_loss": -27.018177032470703, "global_step": 425367, "epoch": 5124} {"train_loss": -27.18731689453125, "global_step": 425368, "epoch": 5124} {"train_loss": -27.638336181640625, "global_step": 425369, "epoch": 5124} {"train_loss": -26.848119735717773, "global_step": 425370, "epoch": 5124} {"train_loss": -27.073638916015625, "global_step": 425371, "epoch": 5124} {"train_loss": -26.993627548217773, "global_step": 425372, "epoch": 5124} {"train_loss": -26.641454696655273, "global_step": 425373, "epoch": 5124} {"train_loss": -26.783771101250707, "global_step": 425374, "epoch": 5124, "val_loss": 6963577.0} {"train_loss": -25.664655685424805, "global_step": 425375, "epoch": 5125} {"train_loss": -22.669391632080078, "global_step": 425376, "epoch": 5125} {"train_loss": -22.566566467285156, "global_step": 425377, "epoch": 5125} {"train_loss": -22.84018325805664, "global_step": 425378, "epoch": 5125} {"train_loss": -24.71063232421875, "global_step": 425379, "epoch": 5125} {"train_loss": -25.703140258789062, "global_step": 425380, "epoch": 5125} {"train_loss": -24.610836029052734, "global_step": 425381, "epoch": 5125} {"train_loss": -26.32501792907715, "global_step": 425382, "epoch": 5125} {"train_loss": -25.281232833862305, "global_step": 425383, "epoch": 5125} {"train_loss": -25.592182159423828, "global_step": 425384, "epoch": 5125} {"train_loss": -26.108076095581055, "global_step": 425385, "epoch": 5125} {"train_loss": -25.545236587524414, "global_step": 425386, "epoch": 5125} {"train_loss": -25.91485595703125, "global_step": 425387, "epoch": 5125} {"train_loss": -25.364362716674805, "global_step": 425388, "epoch": 5125} {"train_loss": -26.1097354888916, "global_step": 425389, "epoch": 5125} {"train_loss": -26.112689971923828, "global_step": 425390, "epoch": 5125} {"train_loss": -25.568086624145508, "global_step": 425391, "epoch": 5125} {"train_loss": -26.2652530670166, "global_step": 425392, "epoch": 5125} {"train_loss": -25.901798248291016, "global_step": 425393, "epoch": 5125} {"train_loss": -25.942432403564453, "global_step": 425394, "epoch": 5125} {"train_loss": -26.12326431274414, "global_step": 425395, "epoch": 5125} {"train_loss": -25.987049102783203, "global_step": 425396, "epoch": 5125} {"train_loss": -25.909894943237305, "global_step": 425397, "epoch": 5125} {"train_loss": -26.205612182617188, "global_step": 425398, "epoch": 5125} {"train_loss": -25.990903854370117, "global_step": 425399, "epoch": 5125} {"train_loss": -26.21087646484375, "global_step": 425400, "epoch": 5125} {"train_loss": -26.151763916015625, "global_step": 425401, "epoch": 5125} {"train_loss": -26.0559024810791, "global_step": 425402, "epoch": 5125} {"train_loss": -26.126066207885742, "global_step": 425403, "epoch": 5125} {"train_loss": -26.859119415283203, "global_step": 425404, "epoch": 5125} {"train_loss": -25.709686279296875, "global_step": 425405, "epoch": 5125} {"train_loss": -26.134851455688477, "global_step": 425406, "epoch": 5125} {"train_loss": -26.635038375854492, "global_step": 425407, "epoch": 5125} {"train_loss": -26.322174072265625, "global_step": 425408, "epoch": 5125} {"train_loss": -26.428058624267578, "global_step": 425409, "epoch": 5125} {"train_loss": -26.58124351501465, "global_step": 425410, "epoch": 5125} {"train_loss": -26.61246109008789, "global_step": 425411, "epoch": 5125} {"train_loss": -26.466283798217773, "global_step": 425412, "epoch": 5125} {"train_loss": -26.725784301757812, "global_step": 425413, "epoch": 5125} {"train_loss": -26.49085807800293, "global_step": 425414, "epoch": 5125} {"train_loss": -26.59881591796875, "global_step": 425415, "epoch": 5125} {"train_loss": -26.85542869567871, "global_step": 425416, "epoch": 5125} {"train_loss": -26.86435890197754, "global_step": 425417, "epoch": 5125} {"train_loss": -27.049386978149414, "global_step": 425418, "epoch": 5125} {"train_loss": -26.72336196899414, "global_step": 425419, "epoch": 5125} {"train_loss": -26.516128540039062, "global_step": 425420, "epoch": 5125} {"train_loss": -26.38726806640625, "global_step": 425421, "epoch": 5125} {"train_loss": -27.057783126831055, "global_step": 425422, "epoch": 5125} {"train_loss": -27.029571533203125, "global_step": 425423, "epoch": 5125} {"train_loss": -26.8364315032959, "global_step": 425424, "epoch": 5125} {"train_loss": -26.643665313720703, "global_step": 425425, "epoch": 5125} {"train_loss": -26.988910675048828, "global_step": 425426, "epoch": 5125} {"train_loss": -26.800464630126953, "global_step": 425427, "epoch": 5125} {"train_loss": -27.326019287109375, "global_step": 425428, "epoch": 5125} {"train_loss": -26.8817081451416, "global_step": 425429, "epoch": 5125} {"train_loss": -26.59000587463379, "global_step": 425430, "epoch": 5125} {"train_loss": -26.836706161499023, "global_step": 425431, "epoch": 5125} {"train_loss": -26.95539665222168, "global_step": 425432, "epoch": 5125} {"train_loss": -27.14458656311035, "global_step": 425433, "epoch": 5125} {"train_loss": -27.237884521484375, "global_step": 425434, "epoch": 5125} {"train_loss": -27.269577026367188, "global_step": 425435, "epoch": 5125} {"train_loss": -27.185688018798828, "global_step": 425436, "epoch": 5125} {"train_loss": -26.944677352905273, "global_step": 425437, "epoch": 5125} {"train_loss": -26.988744735717773, "global_step": 425438, "epoch": 5125} {"train_loss": -26.680164337158203, "global_step": 425439, "epoch": 5125} {"train_loss": -27.124469757080078, "global_step": 425440, "epoch": 5125} {"train_loss": -26.7307071685791, "global_step": 425441, "epoch": 5125} {"train_loss": -27.083032608032227, "global_step": 425442, "epoch": 5125} {"train_loss": -26.893056869506836, "global_step": 425443, "epoch": 5125} {"train_loss": -27.083984375, "global_step": 425444, "epoch": 5125} {"train_loss": -26.988828659057617, "global_step": 425445, "epoch": 5125} {"train_loss": -27.251379013061523, "global_step": 425446, "epoch": 5125} {"train_loss": -27.0600528717041, "global_step": 425447, "epoch": 5125} {"train_loss": -27.321369171142578, "global_step": 425448, "epoch": 5125} {"train_loss": -27.317838668823242, "global_step": 425449, "epoch": 5125} {"train_loss": -26.9779109954834, "global_step": 425450, "epoch": 5125} {"train_loss": -26.761322021484375, "global_step": 425451, "epoch": 5125} {"train_loss": -27.143945693969727, "global_step": 425452, "epoch": 5125} {"train_loss": -27.391799926757812, "global_step": 425453, "epoch": 5125} {"train_loss": -27.08436393737793, "global_step": 425454, "epoch": 5125} {"train_loss": -27.003259658813477, "global_step": 425455, "epoch": 5125} {"train_loss": -27.099273681640625, "global_step": 425456, "epoch": 5125} {"train_loss": -26.384558206581207, "global_step": 425457, "epoch": 5125, "val_loss": 6891224.0} {"train_loss": -26.556915283203125, "global_step": 425458, "epoch": 5126} {"train_loss": -25.533233642578125, "global_step": 425459, "epoch": 5126} {"train_loss": -25.41878318786621, "global_step": 425460, "epoch": 5126} {"train_loss": -26.3712158203125, "global_step": 425461, "epoch": 5126} {"train_loss": -25.612028121948242, "global_step": 425462, "epoch": 5126} {"train_loss": -26.168447494506836, "global_step": 425463, "epoch": 5126} {"train_loss": -25.88123893737793, "global_step": 425464, "epoch": 5126} {"train_loss": -26.376983642578125, "global_step": 425465, "epoch": 5126} {"train_loss": -26.353530883789062, "global_step": 425466, "epoch": 5126} {"train_loss": -26.191009521484375, "global_step": 425467, "epoch": 5126} {"train_loss": -26.636747360229492, "global_step": 425468, "epoch": 5126} {"train_loss": -26.627609252929688, "global_step": 425469, "epoch": 5126} {"train_loss": -26.58810806274414, "global_step": 425470, "epoch": 5126} {"train_loss": -26.155710220336914, "global_step": 425471, "epoch": 5126} {"train_loss": -26.939285278320312, "global_step": 425472, "epoch": 5126} {"train_loss": -26.570865631103516, "global_step": 425473, "epoch": 5126} {"train_loss": -26.417678833007812, "global_step": 425474, "epoch": 5126} {"train_loss": -26.760272979736328, "global_step": 425475, "epoch": 5126} {"train_loss": -26.48903465270996, "global_step": 425476, "epoch": 5126} {"train_loss": -26.4563045501709, "global_step": 425477, "epoch": 5126} {"train_loss": -26.558385848999023, "global_step": 425478, "epoch": 5126} {"train_loss": -26.757287979125977, "global_step": 425479, "epoch": 5126} {"train_loss": -26.8167724609375, "global_step": 425480, "epoch": 5126} {"train_loss": -26.315631866455078, "global_step": 425481, "epoch": 5126} {"train_loss": -26.823083877563477, "global_step": 425482, "epoch": 5126} {"train_loss": -26.668561935424805, "global_step": 425483, "epoch": 5126} {"train_loss": -26.8909854888916, "global_step": 425484, "epoch": 5126} {"train_loss": -26.827131271362305, "global_step": 425485, "epoch": 5126} {"train_loss": -26.751789093017578, "global_step": 425486, "epoch": 5126} {"train_loss": -26.724821090698242, "global_step": 425487, "epoch": 5126} {"train_loss": -26.95400047302246, "global_step": 425488, "epoch": 5126} {"train_loss": -26.763574600219727, "global_step": 425489, "epoch": 5126} {"train_loss": -26.614526748657227, "global_step": 425490, "epoch": 5126} {"train_loss": -26.81147575378418, "global_step": 425491, "epoch": 5126} {"train_loss": -26.706607818603516, "global_step": 425492, "epoch": 5126} {"train_loss": -26.804800033569336, "global_step": 425493, "epoch": 5126} {"train_loss": -26.762983322143555, "global_step": 425494, "epoch": 5126} {"train_loss": -26.581512451171875, "global_step": 425495, "epoch": 5126} {"train_loss": -26.58819580078125, "global_step": 425496, "epoch": 5126} {"train_loss": -27.149656295776367, "global_step": 425497, "epoch": 5126} {"train_loss": -27.152944564819336, "global_step": 425498, "epoch": 5126} {"train_loss": -26.64951515197754, "global_step": 425499, "epoch": 5126} {"train_loss": -26.562963485717773, "global_step": 425500, "epoch": 5126} {"train_loss": -26.970701217651367, "global_step": 425501, "epoch": 5126} {"train_loss": -26.788747787475586, "global_step": 425502, "epoch": 5126} {"train_loss": -26.657001495361328, "global_step": 425503, "epoch": 5126} {"train_loss": -26.918304443359375, "global_step": 425504, "epoch": 5126} {"train_loss": -26.42103385925293, "global_step": 425505, "epoch": 5126} {"train_loss": -27.028125762939453, "global_step": 425506, "epoch": 5126} {"train_loss": -26.6444034576416, "global_step": 425507, "epoch": 5126} {"train_loss": -26.717670440673828, "global_step": 425508, "epoch": 5126} {"train_loss": -26.891178131103516, "global_step": 425509, "epoch": 5126} {"train_loss": -26.7099666595459, "global_step": 425510, "epoch": 5126} {"train_loss": -26.82600212097168, "global_step": 425511, "epoch": 5126} {"train_loss": -26.901575088500977, "global_step": 425512, "epoch": 5126} {"train_loss": -26.969945907592773, "global_step": 425513, "epoch": 5126} {"train_loss": -26.6251277923584, "global_step": 425514, "epoch": 5126} {"train_loss": -26.7933292388916, "global_step": 425515, "epoch": 5126} {"train_loss": -26.52335548400879, "global_step": 425516, "epoch": 5126} {"train_loss": -27.16803550720215, "global_step": 425517, "epoch": 5126} {"train_loss": -27.145965576171875, "global_step": 425518, "epoch": 5126} {"train_loss": -26.853357315063477, "global_step": 425519, "epoch": 5126} {"train_loss": -27.129791259765625, "global_step": 425520, "epoch": 5126} {"train_loss": -26.711231231689453, "global_step": 425521, "epoch": 5126} {"train_loss": -26.86016273498535, "global_step": 425522, "epoch": 5126} {"train_loss": -27.1205997467041, "global_step": 425523, "epoch": 5126} {"train_loss": -27.4820499420166, "global_step": 425524, "epoch": 5126} {"train_loss": -27.240339279174805, "global_step": 425525, "epoch": 5126} {"train_loss": -27.18808937072754, "global_step": 425526, "epoch": 5126} {"train_loss": -26.959136962890625, "global_step": 425527, "epoch": 5126} {"train_loss": -27.14823341369629, "global_step": 425528, "epoch": 5126} {"train_loss": -26.795745849609375, "global_step": 425529, "epoch": 5126} {"train_loss": -27.25058364868164, "global_step": 425530, "epoch": 5126} {"train_loss": -27.254547119140625, "global_step": 425531, "epoch": 5126} {"train_loss": -26.898345947265625, "global_step": 425532, "epoch": 5126} {"train_loss": -27.239683151245117, "global_step": 425533, "epoch": 5126} {"train_loss": -26.936620712280273, "global_step": 425534, "epoch": 5126} {"train_loss": -27.184070587158203, "global_step": 425535, "epoch": 5126} {"train_loss": -27.022724151611328, "global_step": 425536, "epoch": 5126} {"train_loss": -27.0712890625, "global_step": 425537, "epoch": 5126} {"train_loss": -26.62594985961914, "global_step": 425538, "epoch": 5126} {"train_loss": -26.329925537109375, "global_step": 425539, "epoch": 5126} {"train_loss": -26.738594583718175, "global_step": 425540, "epoch": 5126, "val_loss": 6846342.0} {"train_loss": -25.57293701171875, "global_step": 425541, "epoch": 5127} {"train_loss": -24.78240394592285, "global_step": 425542, "epoch": 5127} {"train_loss": -25.915729522705078, "global_step": 425543, "epoch": 5127} {"train_loss": -25.765439987182617, "global_step": 425544, "epoch": 5127} {"train_loss": -25.45461654663086, "global_step": 425545, "epoch": 5127} {"train_loss": -25.341176986694336, "global_step": 425546, "epoch": 5127} {"train_loss": -25.808801651000977, "global_step": 425547, "epoch": 5127} {"train_loss": -26.36907958984375, "global_step": 425548, "epoch": 5127} {"train_loss": -26.22810173034668, "global_step": 425549, "epoch": 5127} {"train_loss": -25.76273536682129, "global_step": 425550, "epoch": 5127} {"train_loss": -26.142276763916016, "global_step": 425551, "epoch": 5127} {"train_loss": -26.253793716430664, "global_step": 425552, "epoch": 5127} {"train_loss": -26.1708927154541, "global_step": 425553, "epoch": 5127} {"train_loss": -26.17437171936035, "global_step": 425554, "epoch": 5127} {"train_loss": -26.2928524017334, "global_step": 425555, "epoch": 5127} {"train_loss": -26.533491134643555, "global_step": 425556, "epoch": 5127} {"train_loss": -26.3554630279541, "global_step": 425557, "epoch": 5127} {"train_loss": -26.387588500976562, "global_step": 425558, "epoch": 5127} {"train_loss": -26.577157974243164, "global_step": 425559, "epoch": 5127} {"train_loss": -26.736682891845703, "global_step": 425560, "epoch": 5127} {"train_loss": -26.198659896850586, "global_step": 425561, "epoch": 5127} {"train_loss": -26.619104385375977, "global_step": 425562, "epoch": 5127} {"train_loss": -26.413854598999023, "global_step": 425563, "epoch": 5127} {"train_loss": -26.720510482788086, "global_step": 425564, "epoch": 5127} {"train_loss": -26.7189884185791, "global_step": 425565, "epoch": 5127} {"train_loss": -26.738540649414062, "global_step": 425566, "epoch": 5127} {"train_loss": -26.5870304107666, "global_step": 425567, "epoch": 5127} {"train_loss": -26.6966609954834, "global_step": 425568, "epoch": 5127} {"train_loss": -26.449630737304688, "global_step": 425569, "epoch": 5127} {"train_loss": -26.416044235229492, "global_step": 425570, "epoch": 5127} {"train_loss": -26.59075355529785, "global_step": 425571, "epoch": 5127} {"train_loss": -26.640579223632812, "global_step": 425572, "epoch": 5127} {"train_loss": -26.55643081665039, "global_step": 425573, "epoch": 5127} {"train_loss": -26.79920768737793, "global_step": 425574, "epoch": 5127} {"train_loss": -26.600149154663086, "global_step": 425575, "epoch": 5127} {"train_loss": -26.460159301757812, "global_step": 425576, "epoch": 5127} {"train_loss": -26.84468650817871, "global_step": 425577, "epoch": 5127} {"train_loss": -26.8807373046875, "global_step": 425578, "epoch": 5127} {"train_loss": -26.842931747436523, "global_step": 425579, "epoch": 5127} {"train_loss": -26.730640411376953, "global_step": 425580, "epoch": 5127} {"train_loss": -26.4899845123291, "global_step": 425581, "epoch": 5127} {"train_loss": -26.842432022094727, "global_step": 425582, "epoch": 5127} {"train_loss": -26.797956466674805, "global_step": 425583, "epoch": 5127} {"train_loss": -26.95184898376465, "global_step": 425584, "epoch": 5127} {"train_loss": -26.775592803955078, "global_step": 425585, "epoch": 5127} {"train_loss": -26.794525146484375, "global_step": 425586, "epoch": 5127} {"train_loss": -26.637393951416016, "global_step": 425587, "epoch": 5127} {"train_loss": -26.53089714050293, "global_step": 425588, "epoch": 5127} {"train_loss": -26.77057456970215, "global_step": 425589, "epoch": 5127} {"train_loss": -27.110431671142578, "global_step": 425590, "epoch": 5127} {"train_loss": -27.32264518737793, "global_step": 425591, "epoch": 5127} {"train_loss": -26.839033126831055, "global_step": 425592, "epoch": 5127} {"train_loss": -27.174413681030273, "global_step": 425593, "epoch": 5127} {"train_loss": -26.981616973876953, "global_step": 425594, "epoch": 5127} {"train_loss": -27.388141632080078, "global_step": 425595, "epoch": 5127} {"train_loss": -26.818754196166992, "global_step": 425596, "epoch": 5127} {"train_loss": -26.775619506835938, "global_step": 425597, "epoch": 5127} {"train_loss": -27.009052276611328, "global_step": 425598, "epoch": 5127} {"train_loss": -26.65909194946289, "global_step": 425599, "epoch": 5127} {"train_loss": -27.131311416625977, "global_step": 425600, "epoch": 5127} {"train_loss": -26.828954696655273, "global_step": 425601, "epoch": 5127} {"train_loss": -26.75848388671875, "global_step": 425602, "epoch": 5127} {"train_loss": -26.68794059753418, "global_step": 425603, "epoch": 5127} {"train_loss": -26.778003692626953, "global_step": 425604, "epoch": 5127} {"train_loss": -27.476703643798828, "global_step": 425605, "epoch": 5127} {"train_loss": -27.01218032836914, "global_step": 425606, "epoch": 5127} {"train_loss": -27.157840728759766, "global_step": 425607, "epoch": 5127} {"train_loss": -26.754898071289062, "global_step": 425608, "epoch": 5127} {"train_loss": -27.166595458984375, "global_step": 425609, "epoch": 5127} {"train_loss": -26.706960678100586, "global_step": 425610, "epoch": 5127} {"train_loss": -26.93356704711914, "global_step": 425611, "epoch": 5127} {"train_loss": -26.883161544799805, "global_step": 425612, "epoch": 5127} {"train_loss": -26.808984756469727, "global_step": 425613, "epoch": 5127} {"train_loss": -26.840240478515625, "global_step": 425614, "epoch": 5127} {"train_loss": -26.4083194732666, "global_step": 425615, "epoch": 5127} {"train_loss": -26.460927963256836, "global_step": 425616, "epoch": 5127} {"train_loss": -27.07268714904785, "global_step": 425617, "epoch": 5127} {"train_loss": -26.760074615478516, "global_step": 425618, "epoch": 5127} {"train_loss": -27.17085075378418, "global_step": 425619, "epoch": 5127} {"train_loss": -26.859357833862305, "global_step": 425620, "epoch": 5127} {"train_loss": -26.7872257232666, "global_step": 425621, "epoch": 5127} {"train_loss": -26.4814510345459, "global_step": 425622, "epoch": 5127} {"train_loss": -26.60933060243905, "global_step": 425623, "epoch": 5127, "val_loss": 6825894.5} {"train_loss": -25.949506759643555, "global_step": 425624, "epoch": 5128} {"train_loss": -26.061145782470703, "global_step": 425625, "epoch": 5128} {"train_loss": -26.47946548461914, "global_step": 425626, "epoch": 5128} {"train_loss": -26.138507843017578, "global_step": 425627, "epoch": 5128} {"train_loss": -25.864255905151367, "global_step": 425628, "epoch": 5128} {"train_loss": -26.381275177001953, "global_step": 425629, "epoch": 5128} {"train_loss": -25.914615631103516, "global_step": 425630, "epoch": 5128} {"train_loss": -26.405424118041992, "global_step": 425631, "epoch": 5128} {"train_loss": -26.60079002380371, "global_step": 425632, "epoch": 5128} {"train_loss": -26.5363826751709, "global_step": 425633, "epoch": 5128} {"train_loss": -25.985870361328125, "global_step": 425634, "epoch": 5128} {"train_loss": -26.4133243560791, "global_step": 425635, "epoch": 5128} {"train_loss": -26.529102325439453, "global_step": 425636, "epoch": 5128} {"train_loss": -26.498071670532227, "global_step": 425637, "epoch": 5128} {"train_loss": -26.474491119384766, "global_step": 425638, "epoch": 5128} {"train_loss": -26.126562118530273, "global_step": 425639, "epoch": 5128} {"train_loss": -26.647130966186523, "global_step": 425640, "epoch": 5128} {"train_loss": -26.66460609436035, "global_step": 425641, "epoch": 5128} {"train_loss": -26.844594955444336, "global_step": 425642, "epoch": 5128} {"train_loss": -26.54376792907715, "global_step": 425643, "epoch": 5128} {"train_loss": -26.235443115234375, "global_step": 425644, "epoch": 5128} {"train_loss": -26.40620231628418, "global_step": 425645, "epoch": 5128} {"train_loss": -26.77505874633789, "global_step": 425646, "epoch": 5128} {"train_loss": -26.48054313659668, "global_step": 425647, "epoch": 5128} {"train_loss": -26.73304557800293, "global_step": 425648, "epoch": 5128} {"train_loss": -26.16282081604004, "global_step": 425649, "epoch": 5128} {"train_loss": -26.88828468322754, "global_step": 425650, "epoch": 5128} {"train_loss": -26.75969886779785, "global_step": 425651, "epoch": 5128} {"train_loss": -26.406126022338867, "global_step": 425652, "epoch": 5128} {"train_loss": -27.098865509033203, "global_step": 425653, "epoch": 5128} {"train_loss": -26.69065284729004, "global_step": 425654, "epoch": 5128} {"train_loss": -26.8856201171875, "global_step": 425655, "epoch": 5128} {"train_loss": -27.1510066986084, "global_step": 425656, "epoch": 5128} {"train_loss": -27.00124168395996, "global_step": 425657, "epoch": 5128} {"train_loss": -26.774169921875, "global_step": 425658, "epoch": 5128} {"train_loss": -26.77412223815918, "global_step": 425659, "epoch": 5128} {"train_loss": -26.457965850830078, "global_step": 425660, "epoch": 5128} {"train_loss": -26.75758171081543, "global_step": 425661, "epoch": 5128} {"train_loss": -26.839263916015625, "global_step": 425662, "epoch": 5128} {"train_loss": -26.81572914123535, "global_step": 425663, "epoch": 5128} {"train_loss": -26.857166290283203, "global_step": 425664, "epoch": 5128} {"train_loss": -26.878528594970703, "global_step": 425665, "epoch": 5128} {"train_loss": -26.591604232788086, "global_step": 425666, "epoch": 5128} {"train_loss": -26.791406631469727, "global_step": 425667, "epoch": 5128} {"train_loss": -27.00144386291504, "global_step": 425668, "epoch": 5128} {"train_loss": -27.10332679748535, "global_step": 425669, "epoch": 5128} {"train_loss": -27.025304794311523, "global_step": 425670, "epoch": 5128} {"train_loss": -26.865386962890625, "global_step": 425671, "epoch": 5128} {"train_loss": -26.5172061920166, "global_step": 425672, "epoch": 5128} {"train_loss": -27.069049835205078, "global_step": 425673, "epoch": 5128} {"train_loss": -27.234601974487305, "global_step": 425674, "epoch": 5128} {"train_loss": -27.351110458374023, "global_step": 425675, "epoch": 5128} {"train_loss": -27.225341796875, "global_step": 425676, "epoch": 5128} {"train_loss": -27.048608779907227, "global_step": 425677, "epoch": 5128} {"train_loss": -27.17949867248535, "global_step": 425678, "epoch": 5128} {"train_loss": -26.9713134765625, "global_step": 425679, "epoch": 5128} {"train_loss": -27.124704360961914, "global_step": 425680, "epoch": 5128} {"train_loss": -26.901611328125, "global_step": 425681, "epoch": 5128} {"train_loss": -27.024948120117188, "global_step": 425682, "epoch": 5128} {"train_loss": -27.004159927368164, "global_step": 425683, "epoch": 5128} {"train_loss": -26.79108238220215, "global_step": 425684, "epoch": 5128} {"train_loss": -27.02044105529785, "global_step": 425685, "epoch": 5128} {"train_loss": -26.933820724487305, "global_step": 425686, "epoch": 5128} {"train_loss": -27.114704132080078, "global_step": 425687, "epoch": 5128} {"train_loss": -26.84400749206543, "global_step": 425688, "epoch": 5128} {"train_loss": -27.014667510986328, "global_step": 425689, "epoch": 5128} {"train_loss": -26.718780517578125, "global_step": 425690, "epoch": 5128} {"train_loss": -26.798749923706055, "global_step": 425691, "epoch": 5128} {"train_loss": -26.95820426940918, "global_step": 425692, "epoch": 5128} {"train_loss": -26.915082931518555, "global_step": 425693, "epoch": 5128} {"train_loss": -26.785017013549805, "global_step": 425694, "epoch": 5128} {"train_loss": -26.830402374267578, "global_step": 425695, "epoch": 5128} {"train_loss": -26.732152938842773, "global_step": 425696, "epoch": 5128} {"train_loss": -26.814184188842773, "global_step": 425697, "epoch": 5128} {"train_loss": -26.864398956298828, "global_step": 425698, "epoch": 5128} {"train_loss": -26.90260887145996, "global_step": 425699, "epoch": 5128} {"train_loss": -27.045507431030273, "global_step": 425700, "epoch": 5128} {"train_loss": -26.910871505737305, "global_step": 425701, "epoch": 5128} {"train_loss": -27.2957820892334, "global_step": 425702, "epoch": 5128} {"train_loss": -27.088117599487305, "global_step": 425703, "epoch": 5128} {"train_loss": -26.810245513916016, "global_step": 425704, "epoch": 5128} {"train_loss": -26.87192153930664, "global_step": 425705, "epoch": 5128} {"train_loss": -26.74450699679823, "global_step": 425706, "epoch": 5128, "val_loss": 6912941.0} {"train_loss": -26.386159896850586, "global_step": 425707, "epoch": 5129} {"train_loss": -26.456573486328125, "global_step": 425708, "epoch": 5129} {"train_loss": -26.721603393554688, "global_step": 425709, "epoch": 5129} {"train_loss": -26.736387252807617, "global_step": 425710, "epoch": 5129} {"train_loss": -26.5684757232666, "global_step": 425711, "epoch": 5129} {"train_loss": -26.530231475830078, "global_step": 425712, "epoch": 5129} {"train_loss": -26.553180694580078, "global_step": 425713, "epoch": 5129} {"train_loss": -26.952123641967773, "global_step": 425714, "epoch": 5129} {"train_loss": -26.48002052307129, "global_step": 425715, "epoch": 5129} {"train_loss": -26.744665145874023, "global_step": 425716, "epoch": 5129} {"train_loss": -26.623050689697266, "global_step": 425717, "epoch": 5129} {"train_loss": -26.54155921936035, "global_step": 425718, "epoch": 5129} {"train_loss": -26.76651954650879, "global_step": 425719, "epoch": 5129} {"train_loss": -26.740497589111328, "global_step": 425720, "epoch": 5129} {"train_loss": -26.732425689697266, "global_step": 425721, "epoch": 5129} {"train_loss": -26.9988956451416, "global_step": 425722, "epoch": 5129} {"train_loss": -27.10413932800293, "global_step": 425723, "epoch": 5129} {"train_loss": -26.813058853149414, "global_step": 425724, "epoch": 5129} {"train_loss": -26.564361572265625, "global_step": 425725, "epoch": 5129} {"train_loss": -26.828760147094727, "global_step": 425726, "epoch": 5129} {"train_loss": -27.09224510192871, "global_step": 425727, "epoch": 5129} {"train_loss": -26.689533233642578, "global_step": 425728, "epoch": 5129} {"train_loss": -26.604963302612305, "global_step": 425729, "epoch": 5129} {"train_loss": -26.88649559020996, "global_step": 425730, "epoch": 5129} {"train_loss": -26.894683837890625, "global_step": 425731, "epoch": 5129} {"train_loss": -27.002643585205078, "global_step": 425732, "epoch": 5129} {"train_loss": -26.6922607421875, "global_step": 425733, "epoch": 5129} {"train_loss": -26.728490829467773, "global_step": 425734, "epoch": 5129} {"train_loss": -26.85456657409668, "global_step": 425735, "epoch": 5129} {"train_loss": -27.072492599487305, "global_step": 425736, "epoch": 5129} {"train_loss": -27.195966720581055, "global_step": 425737, "epoch": 5129} {"train_loss": -27.312108993530273, "global_step": 425738, "epoch": 5129} {"train_loss": -26.879486083984375, "global_step": 425739, "epoch": 5129} {"train_loss": -26.66999626159668, "global_step": 425740, "epoch": 5129} {"train_loss": -26.896894454956055, "global_step": 425741, "epoch": 5129} {"train_loss": -26.899621963500977, "global_step": 425742, "epoch": 5129} {"train_loss": -26.8824462890625, "global_step": 425743, "epoch": 5129} {"train_loss": -26.8580379486084, "global_step": 425744, "epoch": 5129} {"train_loss": -26.770740509033203, "global_step": 425745, "epoch": 5129} {"train_loss": -27.059961318969727, "global_step": 425746, "epoch": 5129} {"train_loss": -26.727447509765625, "global_step": 425747, "epoch": 5129} {"train_loss": -26.7175350189209, "global_step": 425748, "epoch": 5129} {"train_loss": -26.97757339477539, "global_step": 425749, "epoch": 5129} {"train_loss": -26.934019088745117, "global_step": 425750, "epoch": 5129} {"train_loss": -26.9412784576416, "global_step": 425751, "epoch": 5129} {"train_loss": -27.214887619018555, "global_step": 425752, "epoch": 5129} {"train_loss": -27.2730712890625, "global_step": 425753, "epoch": 5129} {"train_loss": -26.590818405151367, "global_step": 425754, "epoch": 5129} {"train_loss": -27.634796142578125, "global_step": 425755, "epoch": 5129} {"train_loss": -26.956674575805664, "global_step": 425756, "epoch": 5129} {"train_loss": -26.7500057220459, "global_step": 425757, "epoch": 5129} {"train_loss": -26.935216903686523, "global_step": 425758, "epoch": 5129} {"train_loss": -26.40268898010254, "global_step": 425759, "epoch": 5129} {"train_loss": -26.90509033203125, "global_step": 425760, "epoch": 5129} {"train_loss": -26.905933380126953, "global_step": 425761, "epoch": 5129} {"train_loss": -27.1156005859375, "global_step": 425762, "epoch": 5129} {"train_loss": -26.301008224487305, "global_step": 425763, "epoch": 5129} {"train_loss": -26.36474609375, "global_step": 425764, "epoch": 5129} {"train_loss": -25.899433135986328, "global_step": 425765, "epoch": 5129} {"train_loss": -25.785070419311523, "global_step": 425766, "epoch": 5129} {"train_loss": -26.46707534790039, "global_step": 425767, "epoch": 5129} {"train_loss": -26.920795440673828, "global_step": 425768, "epoch": 5129} {"train_loss": -26.1523494720459, "global_step": 425769, "epoch": 5129} {"train_loss": -26.47906494140625, "global_step": 425770, "epoch": 5129} {"train_loss": -26.17803955078125, "global_step": 425771, "epoch": 5129} {"train_loss": -26.0384578704834, "global_step": 425772, "epoch": 5129} {"train_loss": -26.272653579711914, "global_step": 425773, "epoch": 5129} {"train_loss": -26.301557540893555, "global_step": 425774, "epoch": 5129} {"train_loss": -25.60121726989746, "global_step": 425775, "epoch": 5129} {"train_loss": -26.66790199279785, "global_step": 425776, "epoch": 5129} {"train_loss": -26.0159912109375, "global_step": 425777, "epoch": 5129} {"train_loss": -26.049713134765625, "global_step": 425778, "epoch": 5129} {"train_loss": -25.915729522705078, "global_step": 425779, "epoch": 5129} {"train_loss": -26.021930694580078, "global_step": 425780, "epoch": 5129} {"train_loss": -26.057193756103516, "global_step": 425781, "epoch": 5129} {"train_loss": -26.504425048828125, "global_step": 425782, "epoch": 5129} {"train_loss": -25.984495162963867, "global_step": 425783, "epoch": 5129} {"train_loss": -26.3621883392334, "global_step": 425784, "epoch": 5129} {"train_loss": -26.666595458984375, "global_step": 425785, "epoch": 5129} {"train_loss": -26.70035743713379, "global_step": 425786, "epoch": 5129} {"train_loss": -26.532825469970703, "global_step": 425787, "epoch": 5129} {"train_loss": -26.560083389282227, "global_step": 425788, "epoch": 5129} {"train_loss": -26.65740406082337, "global_step": 425789, "epoch": 5129, "val_loss": 6821137.0} {"train_loss": -26.02138328552246, "global_step": 425790, "epoch": 5130} {"train_loss": -26.07660484313965, "global_step": 425791, "epoch": 5130} {"train_loss": -26.139562606811523, "global_step": 425792, "epoch": 5130} {"train_loss": -26.027423858642578, "global_step": 425793, "epoch": 5130} {"train_loss": -26.03254508972168, "global_step": 425794, "epoch": 5130} {"train_loss": -26.28472328186035, "global_step": 425795, "epoch": 5130} {"train_loss": -26.454954147338867, "global_step": 425796, "epoch": 5130} {"train_loss": -26.142444610595703, "global_step": 425797, "epoch": 5130} {"train_loss": -26.1261043548584, "global_step": 425798, "epoch": 5130} {"train_loss": -26.398038864135742, "global_step": 425799, "epoch": 5130} {"train_loss": -26.29754638671875, "global_step": 425800, "epoch": 5130} {"train_loss": -25.98235511779785, "global_step": 425801, "epoch": 5130} {"train_loss": -26.15970802307129, "global_step": 425802, "epoch": 5130} {"train_loss": -26.61407470703125, "global_step": 425803, "epoch": 5130} {"train_loss": -26.678680419921875, "global_step": 425804, "epoch": 5130} {"train_loss": -26.252079010009766, "global_step": 425805, "epoch": 5130} {"train_loss": -26.420618057250977, "global_step": 425806, "epoch": 5130} {"train_loss": -26.290586471557617, "global_step": 425807, "epoch": 5130} {"train_loss": -26.812971115112305, "global_step": 425808, "epoch": 5130} {"train_loss": -26.75504493713379, "global_step": 425809, "epoch": 5130} {"train_loss": -26.215778350830078, "global_step": 425810, "epoch": 5130} {"train_loss": -26.494653701782227, "global_step": 425811, "epoch": 5130} {"train_loss": -26.61667251586914, "global_step": 425812, "epoch": 5130} {"train_loss": -26.883777618408203, "global_step": 425813, "epoch": 5130} {"train_loss": -26.462732315063477, "global_step": 425814, "epoch": 5130} {"train_loss": -26.54359245300293, "global_step": 425815, "epoch": 5130} {"train_loss": -26.712982177734375, "global_step": 425816, "epoch": 5130} {"train_loss": -26.853271484375, "global_step": 425817, "epoch": 5130} {"train_loss": -26.583770751953125, "global_step": 425818, "epoch": 5130} {"train_loss": -26.99970054626465, "global_step": 425819, "epoch": 5130} {"train_loss": -26.285558700561523, "global_step": 425820, "epoch": 5130} {"train_loss": -26.625492095947266, "global_step": 425821, "epoch": 5130} {"train_loss": -26.957345962524414, "global_step": 425822, "epoch": 5130} {"train_loss": -27.208206176757812, "global_step": 425823, "epoch": 5130} {"train_loss": -26.862531661987305, "global_step": 425824, "epoch": 5130} {"train_loss": -26.79646110534668, "global_step": 425825, "epoch": 5130} {"train_loss": -27.23423194885254, "global_step": 425826, "epoch": 5130} {"train_loss": -26.97640037536621, "global_step": 425827, "epoch": 5130} {"train_loss": -27.153425216674805, "global_step": 425828, "epoch": 5130} {"train_loss": -26.72370719909668, "global_step": 425829, "epoch": 5130} {"train_loss": -27.153003692626953, "global_step": 425830, "epoch": 5130} {"train_loss": -26.76554298400879, "global_step": 425831, "epoch": 5130} {"train_loss": -27.242029190063477, "global_step": 425832, "epoch": 5130} {"train_loss": -26.93536376953125, "global_step": 425833, "epoch": 5130} {"train_loss": -27.03876304626465, "global_step": 425834, "epoch": 5130} {"train_loss": -27.09528923034668, "global_step": 425835, "epoch": 5130} {"train_loss": -26.9146785736084, "global_step": 425836, "epoch": 5130} {"train_loss": -26.9541072845459, "global_step": 425837, "epoch": 5130} {"train_loss": -27.10964012145996, "global_step": 425838, "epoch": 5130} {"train_loss": -27.150955200195312, "global_step": 425839, "epoch": 5130} {"train_loss": -26.805042266845703, "global_step": 425840, "epoch": 5130} {"train_loss": -26.88922119140625, "global_step": 425841, "epoch": 5130} {"train_loss": -26.628355026245117, "global_step": 425842, "epoch": 5130} {"train_loss": -27.11572265625, "global_step": 425843, "epoch": 5130} {"train_loss": -26.67945671081543, "global_step": 425844, "epoch": 5130} {"train_loss": -26.779767990112305, "global_step": 425845, "epoch": 5130} {"train_loss": -26.055078506469727, "global_step": 425846, "epoch": 5130} {"train_loss": -26.19044303894043, "global_step": 425847, "epoch": 5130} {"train_loss": -26.970808029174805, "global_step": 425848, "epoch": 5130} {"train_loss": -26.471405029296875, "global_step": 425849, "epoch": 5130} {"train_loss": -27.08172607421875, "global_step": 425850, "epoch": 5130} {"train_loss": -26.982807159423828, "global_step": 425851, "epoch": 5130} {"train_loss": -27.332944869995117, "global_step": 425852, "epoch": 5130} {"train_loss": -26.983905792236328, "global_step": 425853, "epoch": 5130} {"train_loss": -26.879343032836914, "global_step": 425854, "epoch": 5130} {"train_loss": -26.5965518951416, "global_step": 425855, "epoch": 5130} {"train_loss": -27.028568267822266, "global_step": 425856, "epoch": 5130} {"train_loss": -27.0401611328125, "global_step": 425857, "epoch": 5130} {"train_loss": -26.944446563720703, "global_step": 425858, "epoch": 5130} {"train_loss": -26.779584884643555, "global_step": 425859, "epoch": 5130} {"train_loss": -26.577619552612305, "global_step": 425860, "epoch": 5130} {"train_loss": -26.884069442749023, "global_step": 425861, "epoch": 5130} {"train_loss": -26.7916259765625, "global_step": 425862, "epoch": 5130} {"train_loss": -26.6621150970459, "global_step": 425863, "epoch": 5130} {"train_loss": -26.876224517822266, "global_step": 425864, "epoch": 5130} {"train_loss": -27.04685401916504, "global_step": 425865, "epoch": 5130} {"train_loss": -27.022724151611328, "global_step": 425866, "epoch": 5130} {"train_loss": -27.199283599853516, "global_step": 425867, "epoch": 5130} {"train_loss": -26.74921226501465, "global_step": 425868, "epoch": 5130} {"train_loss": -27.32789421081543, "global_step": 425869, "epoch": 5130} {"train_loss": -26.947118759155273, "global_step": 425870, "epoch": 5130} {"train_loss": -27.32389259338379, "global_step": 425871, "epoch": 5130} {"train_loss": -26.748167267764906, "global_step": 425872, "epoch": 5130, "val_loss": 6897500.0} {"train_loss": -26.248517990112305, "global_step": 425873, "epoch": 5131} {"train_loss": -26.27369499206543, "global_step": 425874, "epoch": 5131} {"train_loss": -26.47242546081543, "global_step": 425875, "epoch": 5131} {"train_loss": -26.376728057861328, "global_step": 425876, "epoch": 5131} {"train_loss": -26.5905818939209, "global_step": 425877, "epoch": 5131} {"train_loss": -26.486896514892578, "global_step": 425878, "epoch": 5131} {"train_loss": -26.54683494567871, "global_step": 425879, "epoch": 5131} {"train_loss": -26.68171501159668, "global_step": 425880, "epoch": 5131} {"train_loss": -26.75003433227539, "global_step": 425881, "epoch": 5131} {"train_loss": -26.690017700195312, "global_step": 425882, "epoch": 5131} {"train_loss": -26.47755241394043, "global_step": 425883, "epoch": 5131} {"train_loss": -26.6396484375, "global_step": 425884, "epoch": 5131} {"train_loss": -26.95220947265625, "global_step": 425885, "epoch": 5131} {"train_loss": -26.55495262145996, "global_step": 425886, "epoch": 5131} {"train_loss": -26.5115966796875, "global_step": 425887, "epoch": 5131} {"train_loss": -26.723438262939453, "global_step": 425888, "epoch": 5131} {"train_loss": -26.765348434448242, "global_step": 425889, "epoch": 5131} {"train_loss": -26.832294464111328, "global_step": 425890, "epoch": 5131} {"train_loss": -26.937580108642578, "global_step": 425891, "epoch": 5131} {"train_loss": -26.902698516845703, "global_step": 425892, "epoch": 5131} {"train_loss": -26.799978256225586, "global_step": 425893, "epoch": 5131} {"train_loss": -26.713275909423828, "global_step": 425894, "epoch": 5131} {"train_loss": -26.512176513671875, "global_step": 425895, "epoch": 5131} {"train_loss": -26.90756607055664, "global_step": 425896, "epoch": 5131} {"train_loss": -26.952728271484375, "global_step": 425897, "epoch": 5131} {"train_loss": -26.743576049804688, "global_step": 425898, "epoch": 5131} {"train_loss": -26.9764461517334, "global_step": 425899, "epoch": 5131} {"train_loss": -26.62213706970215, "global_step": 425900, "epoch": 5131} {"train_loss": -26.559986114501953, "global_step": 425901, "epoch": 5131} {"train_loss": -26.726943969726562, "global_step": 425902, "epoch": 5131} {"train_loss": -26.682697296142578, "global_step": 425903, "epoch": 5131} {"train_loss": -26.664472579956055, "global_step": 425904, "epoch": 5131} {"train_loss": -27.172937393188477, "global_step": 425905, "epoch": 5131} {"train_loss": -26.998075485229492, "global_step": 425906, "epoch": 5131} {"train_loss": -26.93063735961914, "global_step": 425907, "epoch": 5131} {"train_loss": -26.680206298828125, "global_step": 425908, "epoch": 5131} {"train_loss": -26.907896041870117, "global_step": 425909, "epoch": 5131} {"train_loss": -26.936262130737305, "global_step": 425910, "epoch": 5131} {"train_loss": -26.932636260986328, "global_step": 425911, "epoch": 5131} {"train_loss": -26.582752227783203, "global_step": 425912, "epoch": 5131} {"train_loss": -26.678424835205078, "global_step": 425913, "epoch": 5131} {"train_loss": -26.859155654907227, "global_step": 425914, "epoch": 5131} {"train_loss": -27.048965454101562, "global_step": 425915, "epoch": 5131} {"train_loss": -26.990671157836914, "global_step": 425916, "epoch": 5131} {"train_loss": -27.05262565612793, "global_step": 425917, "epoch": 5131} {"train_loss": -27.343088150024414, "global_step": 425918, "epoch": 5131} {"train_loss": -26.718881607055664, "global_step": 425919, "epoch": 5131} {"train_loss": -27.11394691467285, "global_step": 425920, "epoch": 5131} {"train_loss": -27.046628952026367, "global_step": 425921, "epoch": 5131} {"train_loss": -26.822219848632812, "global_step": 425922, "epoch": 5131} {"train_loss": -26.90744400024414, "global_step": 425923, "epoch": 5131} {"train_loss": -26.950714111328125, "global_step": 425924, "epoch": 5131} {"train_loss": -27.225736618041992, "global_step": 425925, "epoch": 5131} {"train_loss": -26.878442764282227, "global_step": 425926, "epoch": 5131} {"train_loss": -26.512420654296875, "global_step": 425927, "epoch": 5131} {"train_loss": -27.081518173217773, "global_step": 425928, "epoch": 5131} {"train_loss": -27.099756240844727, "global_step": 425929, "epoch": 5131} {"train_loss": -27.0134334564209, "global_step": 425930, "epoch": 5131} {"train_loss": -26.706846237182617, "global_step": 425931, "epoch": 5131} {"train_loss": -26.790851593017578, "global_step": 425932, "epoch": 5131} {"train_loss": -26.560827255249023, "global_step": 425933, "epoch": 5131} {"train_loss": -26.6216983795166, "global_step": 425934, "epoch": 5131} {"train_loss": -26.53486442565918, "global_step": 425935, "epoch": 5131} {"train_loss": -26.6210994720459, "global_step": 425936, "epoch": 5131} {"train_loss": -26.651447296142578, "global_step": 425937, "epoch": 5131} {"train_loss": -26.795780181884766, "global_step": 425938, "epoch": 5131} {"train_loss": -26.80535316467285, "global_step": 425939, "epoch": 5131} {"train_loss": -26.858823776245117, "global_step": 425940, "epoch": 5131} {"train_loss": -26.576221466064453, "global_step": 425941, "epoch": 5131} {"train_loss": -26.324462890625, "global_step": 425942, "epoch": 5131} {"train_loss": -27.520864486694336, "global_step": 425943, "epoch": 5131} {"train_loss": -26.850860595703125, "global_step": 425944, "epoch": 5131} {"train_loss": -26.486536026000977, "global_step": 425945, "epoch": 5131} {"train_loss": -26.56390380859375, "global_step": 425946, "epoch": 5131} {"train_loss": -26.49104881286621, "global_step": 425947, "epoch": 5131} {"train_loss": -26.882266998291016, "global_step": 425948, "epoch": 5131} {"train_loss": -26.933441162109375, "global_step": 425949, "epoch": 5131} {"train_loss": -26.553991317749023, "global_step": 425950, "epoch": 5131} {"train_loss": -27.17702293395996, "global_step": 425951, "epoch": 5131} {"train_loss": -26.729904174804688, "global_step": 425952, "epoch": 5131} {"train_loss": -26.86478042602539, "global_step": 425953, "epoch": 5131} {"train_loss": -26.617206573486328, "global_step": 425954, "epoch": 5131} {"train_loss": -26.77380644556988, "global_step": 425955, "epoch": 5131, "val_loss": 6906351.5} {"train_loss": -26.34613037109375, "global_step": 425956, "epoch": 5132} {"train_loss": -25.595672607421875, "global_step": 425957, "epoch": 5132} {"train_loss": -25.458742141723633, "global_step": 425958, "epoch": 5132} {"train_loss": -25.71114158630371, "global_step": 425959, "epoch": 5132} {"train_loss": -26.31827163696289, "global_step": 425960, "epoch": 5132} {"train_loss": -25.61665153503418, "global_step": 425961, "epoch": 5132} {"train_loss": -26.41883659362793, "global_step": 425962, "epoch": 5132} {"train_loss": -26.337066650390625, "global_step": 425963, "epoch": 5132} {"train_loss": -26.226104736328125, "global_step": 425964, "epoch": 5132} {"train_loss": -25.938278198242188, "global_step": 425965, "epoch": 5132} {"train_loss": -26.1572208404541, "global_step": 425966, "epoch": 5132} {"train_loss": -26.578725814819336, "global_step": 425967, "epoch": 5132} {"train_loss": -26.702457427978516, "global_step": 425968, "epoch": 5132} {"train_loss": -26.269926071166992, "global_step": 425969, "epoch": 5132} {"train_loss": -26.744007110595703, "global_step": 425970, "epoch": 5132} {"train_loss": -26.263235092163086, "global_step": 425971, "epoch": 5132} {"train_loss": -26.634992599487305, "global_step": 425972, "epoch": 5132} {"train_loss": -27.0550479888916, "global_step": 425973, "epoch": 5132} {"train_loss": -26.32770347595215, "global_step": 425974, "epoch": 5132} {"train_loss": -26.797809600830078, "global_step": 425975, "epoch": 5132} {"train_loss": -26.35284423828125, "global_step": 425976, "epoch": 5132} {"train_loss": -26.570159912109375, "global_step": 425977, "epoch": 5132} {"train_loss": -26.798171997070312, "global_step": 425978, "epoch": 5132} {"train_loss": -26.6160831451416, "global_step": 425979, "epoch": 5132} {"train_loss": -26.824888229370117, "global_step": 425980, "epoch": 5132} {"train_loss": -26.977746963500977, "global_step": 425981, "epoch": 5132} {"train_loss": -26.63933753967285, "global_step": 425982, "epoch": 5132} {"train_loss": -26.493947982788086, "global_step": 425983, "epoch": 5132} {"train_loss": -26.617919921875, "global_step": 425984, "epoch": 5132} {"train_loss": -26.83643913269043, "global_step": 425985, "epoch": 5132} {"train_loss": -26.789642333984375, "global_step": 425986, "epoch": 5132} {"train_loss": -27.037744522094727, "global_step": 425987, "epoch": 5132} {"train_loss": -26.946182250976562, "global_step": 425988, "epoch": 5132} {"train_loss": -26.989179611206055, "global_step": 425989, "epoch": 5132} {"train_loss": -26.453617095947266, "global_step": 425990, "epoch": 5132} {"train_loss": -27.093372344970703, "global_step": 425991, "epoch": 5132} {"train_loss": -26.55360221862793, "global_step": 425992, "epoch": 5132} {"train_loss": -27.12738037109375, "global_step": 425993, "epoch": 5132} {"train_loss": -27.00617790222168, "global_step": 425994, "epoch": 5132} {"train_loss": -26.861148834228516, "global_step": 425995, "epoch": 5132} {"train_loss": -27.2230167388916, "global_step": 425996, "epoch": 5132} {"train_loss": -26.97114372253418, "global_step": 425997, "epoch": 5132} {"train_loss": -27.253448486328125, "global_step": 425998, "epoch": 5132} {"train_loss": -26.774682998657227, "global_step": 425999, "epoch": 5132} {"train_loss": -27.265106201171875, "global_step": 426000, "epoch": 5132} {"train_loss": -27.357751846313477, "global_step": 426001, "epoch": 5132} {"train_loss": -26.985553741455078, "global_step": 426002, "epoch": 5132} {"train_loss": -27.2752628326416, "global_step": 426003, "epoch": 5132} {"train_loss": -27.295888900756836, "global_step": 426004, "epoch": 5132} {"train_loss": -26.874921798706055, "global_step": 426005, "epoch": 5132} {"train_loss": -26.823095321655273, "global_step": 426006, "epoch": 5132} {"train_loss": -26.738706588745117, "global_step": 426007, "epoch": 5132} {"train_loss": -26.445419311523438, "global_step": 426008, "epoch": 5132} {"train_loss": -26.7191219329834, "global_step": 426009, "epoch": 5132} {"train_loss": -26.860864639282227, "global_step": 426010, "epoch": 5132} {"train_loss": -26.73282814025879, "global_step": 426011, "epoch": 5132} {"train_loss": -25.658369064331055, "global_step": 426012, "epoch": 5132} {"train_loss": -25.179845809936523, "global_step": 426013, "epoch": 5132} {"train_loss": -25.709814071655273, "global_step": 426014, "epoch": 5132} {"train_loss": -27.10491371154785, "global_step": 426015, "epoch": 5132} {"train_loss": -26.819616317749023, "global_step": 426016, "epoch": 5132} {"train_loss": -25.851526260375977, "global_step": 426017, "epoch": 5132} {"train_loss": -25.94049072265625, "global_step": 426018, "epoch": 5132} {"train_loss": -26.475988388061523, "global_step": 426019, "epoch": 5132} {"train_loss": -26.821130752563477, "global_step": 426020, "epoch": 5132} {"train_loss": -26.245746612548828, "global_step": 426021, "epoch": 5132} {"train_loss": -26.744455337524414, "global_step": 426022, "epoch": 5132} {"train_loss": -26.687957763671875, "global_step": 426023, "epoch": 5132} {"train_loss": -26.350799560546875, "global_step": 426024, "epoch": 5132} {"train_loss": -26.606586456298828, "global_step": 426025, "epoch": 5132} {"train_loss": -26.700952529907227, "global_step": 426026, "epoch": 5132} {"train_loss": -26.5638370513916, "global_step": 426027, "epoch": 5132} {"train_loss": -26.510709762573242, "global_step": 426028, "epoch": 5132} {"train_loss": -26.477893829345703, "global_step": 426029, "epoch": 5132} {"train_loss": -27.054346084594727, "global_step": 426030, "epoch": 5132} {"train_loss": -26.522714614868164, "global_step": 426031, "epoch": 5132} {"train_loss": -26.869794845581055, "global_step": 426032, "epoch": 5132} {"train_loss": -26.288183212280273, "global_step": 426033, "epoch": 5132} {"train_loss": -26.636056900024414, "global_step": 426034, "epoch": 5132} {"train_loss": -26.657453536987305, "global_step": 426035, "epoch": 5132} {"train_loss": -26.39523696899414, "global_step": 426036, "epoch": 5132} {"train_loss": -26.544050216674805, "global_step": 426037, "epoch": 5132} {"train_loss": -26.588746358113116, "global_step": 426038, "epoch": 5132, "val_loss": 6872647.0} {"train_loss": -26.37598991394043, "global_step": 426039, "epoch": 5133} {"train_loss": -26.42278480529785, "global_step": 426040, "epoch": 5133} {"train_loss": -26.545974731445312, "global_step": 426041, "epoch": 5133} {"train_loss": -25.990081787109375, "global_step": 426042, "epoch": 5133} {"train_loss": -26.309253692626953, "global_step": 426043, "epoch": 5133} {"train_loss": -26.274723052978516, "global_step": 426044, "epoch": 5133} {"train_loss": -26.622106552124023, "global_step": 426045, "epoch": 5133} {"train_loss": -26.656370162963867, "global_step": 426046, "epoch": 5133} {"train_loss": -26.270483016967773, "global_step": 426047, "epoch": 5133} {"train_loss": -26.572553634643555, "global_step": 426048, "epoch": 5133} {"train_loss": -26.694690704345703, "global_step": 426049, "epoch": 5133} {"train_loss": -26.59137535095215, "global_step": 426050, "epoch": 5133} {"train_loss": -26.72714614868164, "global_step": 426051, "epoch": 5133} {"train_loss": -26.77827262878418, "global_step": 426052, "epoch": 5133} {"train_loss": -26.39979362487793, "global_step": 426053, "epoch": 5133} {"train_loss": -26.66074562072754, "global_step": 426054, "epoch": 5133} {"train_loss": -27.131296157836914, "global_step": 426055, "epoch": 5133} {"train_loss": -26.644927978515625, "global_step": 426056, "epoch": 5133} {"train_loss": -26.822843551635742, "global_step": 426057, "epoch": 5133} {"train_loss": -26.577611923217773, "global_step": 426058, "epoch": 5133} {"train_loss": -26.777917861938477, "global_step": 426059, "epoch": 5133} {"train_loss": -27.051116943359375, "global_step": 426060, "epoch": 5133} {"train_loss": -26.6397762298584, "global_step": 426061, "epoch": 5133} {"train_loss": -26.965850830078125, "global_step": 426062, "epoch": 5133} {"train_loss": -26.773000717163086, "global_step": 426063, "epoch": 5133} {"train_loss": -26.770172119140625, "global_step": 426064, "epoch": 5133} {"train_loss": -26.996118545532227, "global_step": 426065, "epoch": 5133} {"train_loss": -26.62088966369629, "global_step": 426066, "epoch": 5133} {"train_loss": -26.656461715698242, "global_step": 426067, "epoch": 5133} {"train_loss": -27.088102340698242, "global_step": 426068, "epoch": 5133} {"train_loss": -26.77536964416504, "global_step": 426069, "epoch": 5133} {"train_loss": -27.056745529174805, "global_step": 426070, "epoch": 5133} {"train_loss": -26.80088233947754, "global_step": 426071, "epoch": 5133} {"train_loss": -27.12660789489746, "global_step": 426072, "epoch": 5133} {"train_loss": -26.743677139282227, "global_step": 426073, "epoch": 5133} {"train_loss": -27.032852172851562, "global_step": 426074, "epoch": 5133} {"train_loss": -27.297178268432617, "global_step": 426075, "epoch": 5133} {"train_loss": -26.8631534576416, "global_step": 426076, "epoch": 5133} {"train_loss": -27.075693130493164, "global_step": 426077, "epoch": 5133} {"train_loss": -27.1120548248291, "global_step": 426078, "epoch": 5133} {"train_loss": -26.825149536132812, "global_step": 426079, "epoch": 5133} {"train_loss": -27.1754150390625, "global_step": 426080, "epoch": 5133} {"train_loss": -26.54548454284668, "global_step": 426081, "epoch": 5133} {"train_loss": -27.041894912719727, "global_step": 426082, "epoch": 5133} {"train_loss": -26.6495418548584, "global_step": 426083, "epoch": 5133} {"train_loss": -27.043386459350586, "global_step": 426084, "epoch": 5133} {"train_loss": -26.847579956054688, "global_step": 426085, "epoch": 5133} {"train_loss": -26.78785514831543, "global_step": 426086, "epoch": 5133} {"train_loss": -26.500293731689453, "global_step": 426087, "epoch": 5133} {"train_loss": -26.878849029541016, "global_step": 426088, "epoch": 5133} {"train_loss": -26.935712814331055, "global_step": 426089, "epoch": 5133} {"train_loss": -26.75628662109375, "global_step": 426090, "epoch": 5133} {"train_loss": -26.662094116210938, "global_step": 426091, "epoch": 5133} {"train_loss": -26.896076202392578, "global_step": 426092, "epoch": 5133} {"train_loss": -27.06787109375, "global_step": 426093, "epoch": 5133} {"train_loss": -26.692184448242188, "global_step": 426094, "epoch": 5133} {"train_loss": -27.056467056274414, "global_step": 426095, "epoch": 5133} {"train_loss": -26.80013084411621, "global_step": 426096, "epoch": 5133} {"train_loss": -26.950109481811523, "global_step": 426097, "epoch": 5133} {"train_loss": -27.19074821472168, "global_step": 426098, "epoch": 5133} {"train_loss": -26.54193687438965, "global_step": 426099, "epoch": 5133} {"train_loss": -26.808252334594727, "global_step": 426100, "epoch": 5133} {"train_loss": -27.51019287109375, "global_step": 426101, "epoch": 5133} {"train_loss": -27.056921005249023, "global_step": 426102, "epoch": 5133} {"train_loss": -27.203882217407227, "global_step": 426103, "epoch": 5133} {"train_loss": -26.7937068939209, "global_step": 426104, "epoch": 5133} {"train_loss": -27.1629695892334, "global_step": 426105, "epoch": 5133} {"train_loss": -27.185476303100586, "global_step": 426106, "epoch": 5133} {"train_loss": -26.80232048034668, "global_step": 426107, "epoch": 5133} {"train_loss": -27.040786743164062, "global_step": 426108, "epoch": 5133} {"train_loss": -27.149667739868164, "global_step": 426109, "epoch": 5133} {"train_loss": -26.802026748657227, "global_step": 426110, "epoch": 5133} {"train_loss": -27.419240951538086, "global_step": 426111, "epoch": 5133} {"train_loss": -26.850727081298828, "global_step": 426112, "epoch": 5133} {"train_loss": -27.0822811126709, "global_step": 426113, "epoch": 5133} {"train_loss": -27.018171310424805, "global_step": 426114, "epoch": 5133} {"train_loss": -26.71634292602539, "global_step": 426115, "epoch": 5133} {"train_loss": -27.130746841430664, "global_step": 426116, "epoch": 5133} {"train_loss": -26.9991397857666, "global_step": 426117, "epoch": 5133} {"train_loss": -26.891565322875977, "global_step": 426118, "epoch": 5133} {"train_loss": -27.0040225982666, "global_step": 426119, "epoch": 5133} {"train_loss": -27.011707305908203, "global_step": 426120, "epoch": 5133} {"train_loss": -26.861959549317877, "global_step": 426121, "epoch": 5133, "val_loss": 6940692.5} {"train_loss": -26.723224639892578, "global_step": 426122, "epoch": 5134} {"train_loss": -26.342893600463867, "global_step": 426123, "epoch": 5134} {"train_loss": -26.61273765563965, "global_step": 426124, "epoch": 5134} {"train_loss": -26.290863037109375, "global_step": 426125, "epoch": 5134} {"train_loss": -26.68829345703125, "global_step": 426126, "epoch": 5134} {"train_loss": -26.23076820373535, "global_step": 426127, "epoch": 5134} {"train_loss": -26.140478134155273, "global_step": 426128, "epoch": 5134} {"train_loss": -25.626102447509766, "global_step": 426129, "epoch": 5134} {"train_loss": -26.03717041015625, "global_step": 426130, "epoch": 5134} {"train_loss": -26.943822860717773, "global_step": 426131, "epoch": 5134} {"train_loss": -26.59107780456543, "global_step": 426132, "epoch": 5134} {"train_loss": -26.547880172729492, "global_step": 426133, "epoch": 5134} {"train_loss": -26.282520294189453, "global_step": 426134, "epoch": 5134} {"train_loss": -26.512664794921875, "global_step": 426135, "epoch": 5134} {"train_loss": -26.14838218688965, "global_step": 426136, "epoch": 5134} {"train_loss": -26.976638793945312, "global_step": 426137, "epoch": 5134} {"train_loss": -26.726001739501953, "global_step": 426138, "epoch": 5134} {"train_loss": -27.06194496154785, "global_step": 426139, "epoch": 5134} {"train_loss": -26.572528839111328, "global_step": 426140, "epoch": 5134} {"train_loss": -26.58243179321289, "global_step": 426141, "epoch": 5134} {"train_loss": -26.870386123657227, "global_step": 426142, "epoch": 5134} {"train_loss": -26.351333618164062, "global_step": 426143, "epoch": 5134} {"train_loss": -27.1336727142334, "global_step": 426144, "epoch": 5134} {"train_loss": -26.725305557250977, "global_step": 426145, "epoch": 5134} {"train_loss": -26.838834762573242, "global_step": 426146, "epoch": 5134} {"train_loss": -26.8520450592041, "global_step": 426147, "epoch": 5134} {"train_loss": -26.700225830078125, "global_step": 426148, "epoch": 5134} {"train_loss": -26.67229652404785, "global_step": 426149, "epoch": 5134} {"train_loss": -26.52779197692871, "global_step": 426150, "epoch": 5134} {"train_loss": -26.903167724609375, "global_step": 426151, "epoch": 5134} {"train_loss": -26.56349754333496, "global_step": 426152, "epoch": 5134} {"train_loss": -26.981582641601562, "global_step": 426153, "epoch": 5134} {"train_loss": -26.517078399658203, "global_step": 426154, "epoch": 5134} {"train_loss": -27.117124557495117, "global_step": 426155, "epoch": 5134} {"train_loss": -26.691608428955078, "global_step": 426156, "epoch": 5134} {"train_loss": -26.96857261657715, "global_step": 426157, "epoch": 5134} {"train_loss": -26.730884552001953, "global_step": 426158, "epoch": 5134} {"train_loss": -26.757434844970703, "global_step": 426159, "epoch": 5134} {"train_loss": -27.07240104675293, "global_step": 426160, "epoch": 5134} {"train_loss": -26.720468521118164, "global_step": 426161, "epoch": 5134} {"train_loss": -27.014728546142578, "global_step": 426162, "epoch": 5134} {"train_loss": -26.8218994140625, "global_step": 426163, "epoch": 5134} {"train_loss": -26.82026481628418, "global_step": 426164, "epoch": 5134} {"train_loss": -26.656103134155273, "global_step": 426165, "epoch": 5134} {"train_loss": -27.095203399658203, "global_step": 426166, "epoch": 5134} {"train_loss": -27.15118408203125, "global_step": 426167, "epoch": 5134} {"train_loss": -27.00005531311035, "global_step": 426168, "epoch": 5134} {"train_loss": -27.0225830078125, "global_step": 426169, "epoch": 5134} {"train_loss": -26.831457138061523, "global_step": 426170, "epoch": 5134} {"train_loss": -26.85400390625, "global_step": 426171, "epoch": 5134} {"train_loss": -26.90363883972168, "global_step": 426172, "epoch": 5134} {"train_loss": -26.964277267456055, "global_step": 426173, "epoch": 5134} {"train_loss": -27.019474029541016, "global_step": 426174, "epoch": 5134} {"train_loss": -27.199472427368164, "global_step": 426175, "epoch": 5134} {"train_loss": -27.268924713134766, "global_step": 426176, "epoch": 5134} {"train_loss": -26.2713680267334, "global_step": 426177, "epoch": 5134} {"train_loss": -26.126996994018555, "global_step": 426178, "epoch": 5134} {"train_loss": -26.398218154907227, "global_step": 426179, "epoch": 5134} {"train_loss": -26.51849937438965, "global_step": 426180, "epoch": 5134} {"train_loss": -26.83888053894043, "global_step": 426181, "epoch": 5134} {"train_loss": -26.07155418395996, "global_step": 426182, "epoch": 5134} {"train_loss": -26.37430763244629, "global_step": 426183, "epoch": 5134} {"train_loss": -26.66096305847168, "global_step": 426184, "epoch": 5134} {"train_loss": -26.62674903869629, "global_step": 426185, "epoch": 5134} {"train_loss": -26.556303024291992, "global_step": 426186, "epoch": 5134} {"train_loss": -26.324304580688477, "global_step": 426187, "epoch": 5134} {"train_loss": -25.746183395385742, "global_step": 426188, "epoch": 5134} {"train_loss": -25.612258911132812, "global_step": 426189, "epoch": 5134} {"train_loss": -26.65204429626465, "global_step": 426190, "epoch": 5134} {"train_loss": -26.512760162353516, "global_step": 426191, "epoch": 5134} {"train_loss": -26.68861198425293, "global_step": 426192, "epoch": 5134} {"train_loss": -26.685565948486328, "global_step": 426193, "epoch": 5134} {"train_loss": -26.800046920776367, "global_step": 426194, "epoch": 5134} {"train_loss": -26.610370635986328, "global_step": 426195, "epoch": 5134} {"train_loss": -26.566434860229492, "global_step": 426196, "epoch": 5134} {"train_loss": -26.879535675048828, "global_step": 426197, "epoch": 5134} {"train_loss": -27.001943588256836, "global_step": 426198, "epoch": 5134} {"train_loss": -26.703083038330078, "global_step": 426199, "epoch": 5134} {"train_loss": -26.3407039642334, "global_step": 426200, "epoch": 5134} {"train_loss": -26.75029945373535, "global_step": 426201, "epoch": 5134} {"train_loss": -27.0358943939209, "global_step": 426202, "epoch": 5134} {"train_loss": -27.51967430114746, "global_step": 426203, "epoch": 5134} {"train_loss": -26.687592563858953, "global_step": 426204, "epoch": 5134, "val_loss": 6852239.0} {"train_loss": -26.278614044189453, "global_step": 426205, "epoch": 5135} {"train_loss": -25.905200958251953, "global_step": 426206, "epoch": 5135} {"train_loss": -26.002685546875, "global_step": 426207, "epoch": 5135} {"train_loss": -26.274023056030273, "global_step": 426208, "epoch": 5135} {"train_loss": -26.39816665649414, "global_step": 426209, "epoch": 5135} {"train_loss": -26.328100204467773, "global_step": 426210, "epoch": 5135} {"train_loss": -26.2689208984375, "global_step": 426211, "epoch": 5135} {"train_loss": -26.63020133972168, "global_step": 426212, "epoch": 5135} {"train_loss": -26.627172470092773, "global_step": 426213, "epoch": 5135} {"train_loss": -26.172637939453125, "global_step": 426214, "epoch": 5135} {"train_loss": -26.690580368041992, "global_step": 426215, "epoch": 5135} {"train_loss": -26.192340850830078, "global_step": 426216, "epoch": 5135} {"train_loss": -26.407739639282227, "global_step": 426217, "epoch": 5135} {"train_loss": -26.179975509643555, "global_step": 426218, "epoch": 5135} {"train_loss": -26.782140731811523, "global_step": 426219, "epoch": 5135} {"train_loss": -26.609586715698242, "global_step": 426220, "epoch": 5135} {"train_loss": -26.6693172454834, "global_step": 426221, "epoch": 5135} {"train_loss": -26.255590438842773, "global_step": 426222, "epoch": 5135} {"train_loss": -26.598852157592773, "global_step": 426223, "epoch": 5135} {"train_loss": -26.736480712890625, "global_step": 426224, "epoch": 5135} {"train_loss": -26.653705596923828, "global_step": 426225, "epoch": 5135} {"train_loss": -26.6043758392334, "global_step": 426226, "epoch": 5135} {"train_loss": -26.70989990234375, "global_step": 426227, "epoch": 5135} {"train_loss": -26.792377471923828, "global_step": 426228, "epoch": 5135} {"train_loss": -26.797433853149414, "global_step": 426229, "epoch": 5135} {"train_loss": -26.765995025634766, "global_step": 426230, "epoch": 5135} {"train_loss": -26.76708984375, "global_step": 426231, "epoch": 5135} {"train_loss": -26.758563995361328, "global_step": 426232, "epoch": 5135} {"train_loss": -26.956317901611328, "global_step": 426233, "epoch": 5135} {"train_loss": -26.701990127563477, "global_step": 426234, "epoch": 5135} {"train_loss": -27.046737670898438, "global_step": 426235, "epoch": 5135} {"train_loss": -26.940610885620117, "global_step": 426236, "epoch": 5135} {"train_loss": -27.0133056640625, "global_step": 426237, "epoch": 5135} {"train_loss": -26.665124893188477, "global_step": 426238, "epoch": 5135} {"train_loss": -26.734594345092773, "global_step": 426239, "epoch": 5135} {"train_loss": -26.569141387939453, "global_step": 426240, "epoch": 5135} {"train_loss": -27.0014591217041, "global_step": 426241, "epoch": 5135} {"train_loss": -26.79424476623535, "global_step": 426242, "epoch": 5135} {"train_loss": -26.760099411010742, "global_step": 426243, "epoch": 5135} {"train_loss": -26.637409210205078, "global_step": 426244, "epoch": 5135} {"train_loss": -26.765522003173828, "global_step": 426245, "epoch": 5135} {"train_loss": -26.91165542602539, "global_step": 426246, "epoch": 5135} {"train_loss": -26.649839401245117, "global_step": 426247, "epoch": 5135} {"train_loss": -27.020862579345703, "global_step": 426248, "epoch": 5135} {"train_loss": -27.152616500854492, "global_step": 426249, "epoch": 5135} {"train_loss": -26.804044723510742, "global_step": 426250, "epoch": 5135} {"train_loss": -26.4677677154541, "global_step": 426251, "epoch": 5135} {"train_loss": -26.820783615112305, "global_step": 426252, "epoch": 5135} {"train_loss": -26.6239070892334, "global_step": 426253, "epoch": 5135} {"train_loss": -26.62232780456543, "global_step": 426254, "epoch": 5135} {"train_loss": -26.87537956237793, "global_step": 426255, "epoch": 5135} {"train_loss": -27.386266708374023, "global_step": 426256, "epoch": 5135} {"train_loss": -26.5889835357666, "global_step": 426257, "epoch": 5135} {"train_loss": -26.684711456298828, "global_step": 426258, "epoch": 5135} {"train_loss": -26.727359771728516, "global_step": 426259, "epoch": 5135} {"train_loss": -26.739490509033203, "global_step": 426260, "epoch": 5135} {"train_loss": -26.6042537689209, "global_step": 426261, "epoch": 5135} {"train_loss": -26.610309600830078, "global_step": 426262, "epoch": 5135} {"train_loss": -27.120559692382812, "global_step": 426263, "epoch": 5135} {"train_loss": -26.82020378112793, "global_step": 426264, "epoch": 5135} {"train_loss": -27.038923263549805, "global_step": 426265, "epoch": 5135} {"train_loss": -26.912185668945312, "global_step": 426266, "epoch": 5135} {"train_loss": -26.59522819519043, "global_step": 426267, "epoch": 5135} {"train_loss": -26.946979522705078, "global_step": 426268, "epoch": 5135} {"train_loss": -26.766469955444336, "global_step": 426269, "epoch": 5135} {"train_loss": -26.880542755126953, "global_step": 426270, "epoch": 5135} {"train_loss": -26.69219398498535, "global_step": 426271, "epoch": 5135} {"train_loss": -26.7431697845459, "global_step": 426272, "epoch": 5135} {"train_loss": -26.931995391845703, "global_step": 426273, "epoch": 5135} {"train_loss": -26.944116592407227, "global_step": 426274, "epoch": 5135} {"train_loss": -26.73824119567871, "global_step": 426275, "epoch": 5135} {"train_loss": -27.040363311767578, "global_step": 426276, "epoch": 5135} {"train_loss": -26.585107803344727, "global_step": 426277, "epoch": 5135} {"train_loss": -26.9915828704834, "global_step": 426278, "epoch": 5135} {"train_loss": -26.715259552001953, "global_step": 426279, "epoch": 5135} {"train_loss": -26.716344833374023, "global_step": 426280, "epoch": 5135} {"train_loss": -27.163267135620117, "global_step": 426281, "epoch": 5135} {"train_loss": -26.817529678344727, "global_step": 426282, "epoch": 5135} {"train_loss": -26.73160743713379, "global_step": 426283, "epoch": 5135} {"train_loss": -26.929540634155273, "global_step": 426284, "epoch": 5135} {"train_loss": -27.015872955322266, "global_step": 426285, "epoch": 5135} {"train_loss": -26.503564834594727, "global_step": 426286, "epoch": 5135} {"train_loss": -26.69472862151732, "global_step": 426287, "epoch": 5135, "val_loss": 7020643.0} {"train_loss": -24.43411636352539, "global_step": 426288, "epoch": 5136} {"train_loss": -24.859922409057617, "global_step": 426289, "epoch": 5136} {"train_loss": -25.373659133911133, "global_step": 426290, "epoch": 5136} {"train_loss": -25.54175567626953, "global_step": 426291, "epoch": 5136} {"train_loss": -25.828540802001953, "global_step": 426292, "epoch": 5136} {"train_loss": -25.666534423828125, "global_step": 426293, "epoch": 5136} {"train_loss": -25.508554458618164, "global_step": 426294, "epoch": 5136} {"train_loss": -26.251968383789062, "global_step": 426295, "epoch": 5136} {"train_loss": -25.56024742126465, "global_step": 426296, "epoch": 5136} {"train_loss": -25.75457191467285, "global_step": 426297, "epoch": 5136} {"train_loss": -25.777868270874023, "global_step": 426298, "epoch": 5136} {"train_loss": -26.293079376220703, "global_step": 426299, "epoch": 5136} {"train_loss": -26.09417152404785, "global_step": 426300, "epoch": 5136} {"train_loss": -25.991010665893555, "global_step": 426301, "epoch": 5136} {"train_loss": -26.19073486328125, "global_step": 426302, "epoch": 5136} {"train_loss": -26.16571617126465, "global_step": 426303, "epoch": 5136} {"train_loss": -26.384077072143555, "global_step": 426304, "epoch": 5136} {"train_loss": -26.296415328979492, "global_step": 426305, "epoch": 5136} {"train_loss": -26.4725341796875, "global_step": 426306, "epoch": 5136} {"train_loss": -26.093475341796875, "global_step": 426307, "epoch": 5136} {"train_loss": -26.278034210205078, "global_step": 426308, "epoch": 5136} {"train_loss": -26.50380516052246, "global_step": 426309, "epoch": 5136} {"train_loss": -26.5120792388916, "global_step": 426310, "epoch": 5136} {"train_loss": -26.62531852722168, "global_step": 426311, "epoch": 5136} {"train_loss": -26.58160400390625, "global_step": 426312, "epoch": 5136} {"train_loss": -26.39596939086914, "global_step": 426313, "epoch": 5136} {"train_loss": -26.657276153564453, "global_step": 426314, "epoch": 5136} {"train_loss": -26.773574829101562, "global_step": 426315, "epoch": 5136} {"train_loss": -26.389236450195312, "global_step": 426316, "epoch": 5136} {"train_loss": -26.969425201416016, "global_step": 426317, "epoch": 5136} {"train_loss": -26.309518814086914, "global_step": 426318, "epoch": 5136} {"train_loss": -26.795202255249023, "global_step": 426319, "epoch": 5136} {"train_loss": -26.59258460998535, "global_step": 426320, "epoch": 5136} {"train_loss": -26.392362594604492, "global_step": 426321, "epoch": 5136} {"train_loss": -26.5047550201416, "global_step": 426322, "epoch": 5136} {"train_loss": -26.84214210510254, "global_step": 426323, "epoch": 5136} {"train_loss": -27.051435470581055, "global_step": 426324, "epoch": 5136} {"train_loss": -26.884241104125977, "global_step": 426325, "epoch": 5136} {"train_loss": -26.836938858032227, "global_step": 426326, "epoch": 5136} {"train_loss": -26.617298126220703, "global_step": 426327, "epoch": 5136} {"train_loss": -27.363525390625, "global_step": 426328, "epoch": 5136} {"train_loss": -26.89740562438965, "global_step": 426329, "epoch": 5136} {"train_loss": -27.011810302734375, "global_step": 426330, "epoch": 5136} {"train_loss": -26.92170524597168, "global_step": 426331, "epoch": 5136} {"train_loss": -26.541715621948242, "global_step": 426332, "epoch": 5136} {"train_loss": -27.009204864501953, "global_step": 426333, "epoch": 5136} {"train_loss": -26.877988815307617, "global_step": 426334, "epoch": 5136} {"train_loss": -26.6274471282959, "global_step": 426335, "epoch": 5136} {"train_loss": -26.971899032592773, "global_step": 426336, "epoch": 5136} {"train_loss": -26.30682373046875, "global_step": 426337, "epoch": 5136} {"train_loss": -27.176061630249023, "global_step": 426338, "epoch": 5136} {"train_loss": -26.979650497436523, "global_step": 426339, "epoch": 5136} {"train_loss": -26.637723922729492, "global_step": 426340, "epoch": 5136} {"train_loss": -26.83587646484375, "global_step": 426341, "epoch": 5136} {"train_loss": -26.935993194580078, "global_step": 426342, "epoch": 5136} {"train_loss": -26.846145629882812, "global_step": 426343, "epoch": 5136} {"train_loss": -27.048297882080078, "global_step": 426344, "epoch": 5136} {"train_loss": -27.155126571655273, "global_step": 426345, "epoch": 5136} {"train_loss": -27.01080894470215, "global_step": 426346, "epoch": 5136} {"train_loss": -27.112939834594727, "global_step": 426347, "epoch": 5136} {"train_loss": -27.470632553100586, "global_step": 426348, "epoch": 5136} {"train_loss": -26.927387237548828, "global_step": 426349, "epoch": 5136} {"train_loss": -26.949865341186523, "global_step": 426350, "epoch": 5136} {"train_loss": -27.142532348632812, "global_step": 426351, "epoch": 5136} {"train_loss": -27.040145874023438, "global_step": 426352, "epoch": 5136} {"train_loss": -26.74684715270996, "global_step": 426353, "epoch": 5136} {"train_loss": -26.940759658813477, "global_step": 426354, "epoch": 5136} {"train_loss": -26.93012809753418, "global_step": 426355, "epoch": 5136} {"train_loss": -26.728757858276367, "global_step": 426356, "epoch": 5136} {"train_loss": -26.628402709960938, "global_step": 426357, "epoch": 5136} {"train_loss": -27.56396484375, "global_step": 426358, "epoch": 5136} {"train_loss": -26.743146896362305, "global_step": 426359, "epoch": 5136} {"train_loss": -26.297155380249023, "global_step": 426360, "epoch": 5136} {"train_loss": -25.59280776977539, "global_step": 426361, "epoch": 5136} {"train_loss": -25.423322677612305, "global_step": 426362, "epoch": 5136} {"train_loss": -26.5081844329834, "global_step": 426363, "epoch": 5136} {"train_loss": -26.707111358642578, "global_step": 426364, "epoch": 5136} {"train_loss": -26.514678955078125, "global_step": 426365, "epoch": 5136} {"train_loss": -26.12744140625, "global_step": 426366, "epoch": 5136} {"train_loss": -26.712942123413086, "global_step": 426367, "epoch": 5136} {"train_loss": -27.010669708251953, "global_step": 426368, "epoch": 5136} {"train_loss": -25.900531768798828, "global_step": 426369, "epoch": 5136} {"train_loss": -26.506769318178474, "global_step": 426370, "epoch": 5136, "val_loss": 6915878.0} {"train_loss": -25.88553810119629, "global_step": 426371, "epoch": 5137} {"train_loss": -26.175146102905273, "global_step": 426372, "epoch": 5137} {"train_loss": -26.143360137939453, "global_step": 426373, "epoch": 5137} {"train_loss": -26.255353927612305, "global_step": 426374, "epoch": 5137} {"train_loss": -25.86798667907715, "global_step": 426375, "epoch": 5137} {"train_loss": -25.993616104125977, "global_step": 426376, "epoch": 5137} {"train_loss": -26.1970272064209, "global_step": 426377, "epoch": 5137} {"train_loss": -26.540372848510742, "global_step": 426378, "epoch": 5137} {"train_loss": -26.19559097290039, "global_step": 426379, "epoch": 5137} {"train_loss": -26.153249740600586, "global_step": 426380, "epoch": 5137} {"train_loss": -26.621103286743164, "global_step": 426381, "epoch": 5137} {"train_loss": -26.17864990234375, "global_step": 426382, "epoch": 5137} {"train_loss": -25.83200454711914, "global_step": 426383, "epoch": 5137} {"train_loss": -26.636249542236328, "global_step": 426384, "epoch": 5137} {"train_loss": -26.43302345275879, "global_step": 426385, "epoch": 5137} {"train_loss": -26.394906997680664, "global_step": 426386, "epoch": 5137} {"train_loss": -26.50579833984375, "global_step": 426387, "epoch": 5137} {"train_loss": -26.52536392211914, "global_step": 426388, "epoch": 5137} {"train_loss": -26.628156661987305, "global_step": 426389, "epoch": 5137} {"train_loss": -26.546850204467773, "global_step": 426390, "epoch": 5137} {"train_loss": -26.74055290222168, "global_step": 426391, "epoch": 5137} {"train_loss": -26.47114372253418, "global_step": 426392, "epoch": 5137} {"train_loss": -26.65887451171875, "global_step": 426393, "epoch": 5137} {"train_loss": -26.506153106689453, "global_step": 426394, "epoch": 5137} {"train_loss": -26.82172203063965, "global_step": 426395, "epoch": 5137} {"train_loss": -26.86886978149414, "global_step": 426396, "epoch": 5137} {"train_loss": -26.773944854736328, "global_step": 426397, "epoch": 5137} {"train_loss": -26.86492919921875, "global_step": 426398, "epoch": 5137} {"train_loss": -27.094858169555664, "global_step": 426399, "epoch": 5137} {"train_loss": -26.601398468017578, "global_step": 426400, "epoch": 5137} {"train_loss": -26.95635986328125, "global_step": 426401, "epoch": 5137} {"train_loss": -26.9455509185791, "global_step": 426402, "epoch": 5137} {"train_loss": -26.7656307220459, "global_step": 426403, "epoch": 5137} {"train_loss": -26.867923736572266, "global_step": 426404, "epoch": 5137} {"train_loss": -27.005956649780273, "global_step": 426405, "epoch": 5137} {"train_loss": -27.074874877929688, "global_step": 426406, "epoch": 5137} {"train_loss": -26.934402465820312, "global_step": 426407, "epoch": 5137} {"train_loss": -26.841022491455078, "global_step": 426408, "epoch": 5137} {"train_loss": -27.084211349487305, "global_step": 426409, "epoch": 5137} {"train_loss": -26.98543357849121, "global_step": 426410, "epoch": 5137} {"train_loss": -26.98749351501465, "global_step": 426411, "epoch": 5137} {"train_loss": -26.84375, "global_step": 426412, "epoch": 5137} {"train_loss": -26.84943199157715, "global_step": 426413, "epoch": 5137} {"train_loss": -26.871240615844727, "global_step": 426414, "epoch": 5137} {"train_loss": -27.084716796875, "global_step": 426415, "epoch": 5137} {"train_loss": -26.988433837890625, "global_step": 426416, "epoch": 5137} {"train_loss": -26.88907814025879, "global_step": 426417, "epoch": 5137} {"train_loss": -26.98016357421875, "global_step": 426418, "epoch": 5137} {"train_loss": -27.094404220581055, "global_step": 426419, "epoch": 5137} {"train_loss": -26.90216636657715, "global_step": 426420, "epoch": 5137} {"train_loss": -26.59906005859375, "global_step": 426421, "epoch": 5137} {"train_loss": -27.11162757873535, "global_step": 426422, "epoch": 5137} {"train_loss": -27.265594482421875, "global_step": 426423, "epoch": 5137} {"train_loss": -27.017169952392578, "global_step": 426424, "epoch": 5137} {"train_loss": -27.001623153686523, "global_step": 426425, "epoch": 5137} {"train_loss": -26.6804256439209, "global_step": 426426, "epoch": 5137} {"train_loss": -26.670007705688477, "global_step": 426427, "epoch": 5137} {"train_loss": -27.041086196899414, "global_step": 426428, "epoch": 5137} {"train_loss": -27.2596378326416, "global_step": 426429, "epoch": 5137} {"train_loss": -26.787769317626953, "global_step": 426430, "epoch": 5137} {"train_loss": -26.92828941345215, "global_step": 426431, "epoch": 5137} {"train_loss": -26.82763671875, "global_step": 426432, "epoch": 5137} {"train_loss": -27.069793701171875, "global_step": 426433, "epoch": 5137} {"train_loss": -26.90805435180664, "global_step": 426434, "epoch": 5137} {"train_loss": -27.229816436767578, "global_step": 426435, "epoch": 5137} {"train_loss": -27.242053985595703, "global_step": 426436, "epoch": 5137} {"train_loss": -26.690290451049805, "global_step": 426437, "epoch": 5137} {"train_loss": -26.444482803344727, "global_step": 426438, "epoch": 5137} {"train_loss": -26.51799964904785, "global_step": 426439, "epoch": 5137} {"train_loss": -26.394058227539062, "global_step": 426440, "epoch": 5137} {"train_loss": -26.548831939697266, "global_step": 426441, "epoch": 5137} {"train_loss": -26.926013946533203, "global_step": 426442, "epoch": 5137} {"train_loss": -26.60602378845215, "global_step": 426443, "epoch": 5137} {"train_loss": -26.703968048095703, "global_step": 426444, "epoch": 5137} {"train_loss": -26.442325592041016, "global_step": 426445, "epoch": 5137} {"train_loss": -26.69390296936035, "global_step": 426446, "epoch": 5137} {"train_loss": -26.816455841064453, "global_step": 426447, "epoch": 5137} {"train_loss": -27.061420440673828, "global_step": 426448, "epoch": 5137} {"train_loss": -26.505395889282227, "global_step": 426449, "epoch": 5137} {"train_loss": -26.875442504882812, "global_step": 426450, "epoch": 5137} {"train_loss": -26.8845272064209, "global_step": 426451, "epoch": 5137} {"train_loss": -26.564802169799805, "global_step": 426452, "epoch": 5137} {"train_loss": -26.709911277495234, "global_step": 426453, "epoch": 5137, "val_loss": 7004753.0} {"train_loss": -26.515695571899414, "global_step": 426454, "epoch": 5138} {"train_loss": -26.8013858795166, "global_step": 426455, "epoch": 5138} {"train_loss": -26.604108810424805, "global_step": 426456, "epoch": 5138} {"train_loss": -26.26987075805664, "global_step": 426457, "epoch": 5138} {"train_loss": -26.338184356689453, "global_step": 426458, "epoch": 5138} {"train_loss": -26.323026657104492, "global_step": 426459, "epoch": 5138} {"train_loss": -26.0240535736084, "global_step": 426460, "epoch": 5138} {"train_loss": -26.00849723815918, "global_step": 426461, "epoch": 5138} {"train_loss": -26.212066650390625, "global_step": 426462, "epoch": 5138} {"train_loss": -26.42518424987793, "global_step": 426463, "epoch": 5138} {"train_loss": -26.576358795166016, "global_step": 426464, "epoch": 5138} {"train_loss": -26.4122314453125, "global_step": 426465, "epoch": 5138} {"train_loss": -26.647113800048828, "global_step": 426466, "epoch": 5138} {"train_loss": -26.350332260131836, "global_step": 426467, "epoch": 5138} {"train_loss": -26.574193954467773, "global_step": 426468, "epoch": 5138} {"train_loss": -26.61005210876465, "global_step": 426469, "epoch": 5138} {"train_loss": -26.72283935546875, "global_step": 426470, "epoch": 5138} {"train_loss": -26.6624755859375, "global_step": 426471, "epoch": 5138} {"train_loss": -26.5733585357666, "global_step": 426472, "epoch": 5138} {"train_loss": -26.225996017456055, "global_step": 426473, "epoch": 5138} {"train_loss": -26.60334587097168, "global_step": 426474, "epoch": 5138} {"train_loss": -26.790307998657227, "global_step": 426475, "epoch": 5138} {"train_loss": -26.6146297454834, "global_step": 426476, "epoch": 5138} {"train_loss": -26.89056396484375, "global_step": 426477, "epoch": 5138} {"train_loss": -26.473615646362305, "global_step": 426478, "epoch": 5138} {"train_loss": -26.887603759765625, "global_step": 426479, "epoch": 5138} {"train_loss": -26.4694881439209, "global_step": 426480, "epoch": 5138} {"train_loss": -26.592517852783203, "global_step": 426481, "epoch": 5138} {"train_loss": -26.883609771728516, "global_step": 426482, "epoch": 5138} {"train_loss": -26.772933959960938, "global_step": 426483, "epoch": 5138} {"train_loss": -26.839324951171875, "global_step": 426484, "epoch": 5138} {"train_loss": -26.6075439453125, "global_step": 426485, "epoch": 5138} {"train_loss": -27.079532623291016, "global_step": 426486, "epoch": 5138} {"train_loss": -26.803205490112305, "global_step": 426487, "epoch": 5138} {"train_loss": -27.169143676757812, "global_step": 426488, "epoch": 5138} {"train_loss": -27.127948760986328, "global_step": 426489, "epoch": 5138} {"train_loss": -26.808429718017578, "global_step": 426490, "epoch": 5138} {"train_loss": -26.869277954101562, "global_step": 426491, "epoch": 5138} {"train_loss": -26.79071617126465, "global_step": 426492, "epoch": 5138} {"train_loss": -26.902257919311523, "global_step": 426493, "epoch": 5138} {"train_loss": -26.8620662689209, "global_step": 426494, "epoch": 5138} {"train_loss": -27.168115615844727, "global_step": 426495, "epoch": 5138} {"train_loss": -26.792322158813477, "global_step": 426496, "epoch": 5138} {"train_loss": -27.108068466186523, "global_step": 426497, "epoch": 5138} {"train_loss": -26.984338760375977, "global_step": 426498, "epoch": 5138} {"train_loss": -27.074655532836914, "global_step": 426499, "epoch": 5138} {"train_loss": -27.145009994506836, "global_step": 426500, "epoch": 5138} {"train_loss": -26.845844268798828, "global_step": 426501, "epoch": 5138} {"train_loss": -26.768274307250977, "global_step": 426502, "epoch": 5138} {"train_loss": -27.103912353515625, "global_step": 426503, "epoch": 5138} {"train_loss": -27.03436851501465, "global_step": 426504, "epoch": 5138} {"train_loss": -26.301456451416016, "global_step": 426505, "epoch": 5138} {"train_loss": -27.106122970581055, "global_step": 426506, "epoch": 5138} {"train_loss": -26.900861740112305, "global_step": 426507, "epoch": 5138} {"train_loss": -26.775604248046875, "global_step": 426508, "epoch": 5138} {"train_loss": -27.187463760375977, "global_step": 426509, "epoch": 5138} {"train_loss": -27.257062911987305, "global_step": 426510, "epoch": 5138} {"train_loss": -26.94110679626465, "global_step": 426511, "epoch": 5138} {"train_loss": -26.91106605529785, "global_step": 426512, "epoch": 5138} {"train_loss": -27.129520416259766, "global_step": 426513, "epoch": 5138} {"train_loss": -26.696374893188477, "global_step": 426514, "epoch": 5138} {"train_loss": -27.17176628112793, "global_step": 426515, "epoch": 5138} {"train_loss": -26.42742919921875, "global_step": 426516, "epoch": 5138} {"train_loss": -26.41753578186035, "global_step": 426517, "epoch": 5138} {"train_loss": -26.959684371948242, "global_step": 426518, "epoch": 5138} {"train_loss": -26.768722534179688, "global_step": 426519, "epoch": 5138} {"train_loss": -26.8548583984375, "global_step": 426520, "epoch": 5138} {"train_loss": -26.311574935913086, "global_step": 426521, "epoch": 5138} {"train_loss": -27.03497314453125, "global_step": 426522, "epoch": 5138} {"train_loss": -26.818323135375977, "global_step": 426523, "epoch": 5138} {"train_loss": -26.952436447143555, "global_step": 426524, "epoch": 5138} {"train_loss": -27.074438095092773, "global_step": 426525, "epoch": 5138} {"train_loss": -27.010602951049805, "global_step": 426526, "epoch": 5138} {"train_loss": -26.57988929748535, "global_step": 426527, "epoch": 5138} {"train_loss": -26.773086547851562, "global_step": 426528, "epoch": 5138} {"train_loss": -26.81062126159668, "global_step": 426529, "epoch": 5138} {"train_loss": -26.983850479125977, "global_step": 426530, "epoch": 5138} {"train_loss": -26.673343658447266, "global_step": 426531, "epoch": 5138} {"train_loss": -26.88423728942871, "global_step": 426532, "epoch": 5138} {"train_loss": -26.916975021362305, "global_step": 426533, "epoch": 5138} {"train_loss": -26.7712345123291, "global_step": 426534, "epoch": 5138} {"train_loss": -26.586078643798828, "global_step": 426535, "epoch": 5138} {"train_loss": -26.75919247822589, "global_step": 426536, "epoch": 5138, "val_loss": 6941517.0} {"train_loss": -26.133819580078125, "global_step": 426537, "epoch": 5139} {"train_loss": -26.35440444946289, "global_step": 426538, "epoch": 5139} {"train_loss": -26.22627067565918, "global_step": 426539, "epoch": 5139} {"train_loss": -26.145465850830078, "global_step": 426540, "epoch": 5139} {"train_loss": -26.63850975036621, "global_step": 426541, "epoch": 5139} {"train_loss": -26.097578048706055, "global_step": 426542, "epoch": 5139} {"train_loss": -26.77552604675293, "global_step": 426543, "epoch": 5139} {"train_loss": -26.508573532104492, "global_step": 426544, "epoch": 5139} {"train_loss": -26.639047622680664, "global_step": 426545, "epoch": 5139} {"train_loss": -26.348724365234375, "global_step": 426546, "epoch": 5139} {"train_loss": -26.670896530151367, "global_step": 426547, "epoch": 5139} {"train_loss": -26.85190773010254, "global_step": 426548, "epoch": 5139} {"train_loss": -26.530927658081055, "global_step": 426549, "epoch": 5139} {"train_loss": -26.35042381286621, "global_step": 426550, "epoch": 5139} {"train_loss": -26.450061798095703, "global_step": 426551, "epoch": 5139} {"train_loss": -26.644418716430664, "global_step": 426552, "epoch": 5139} {"train_loss": -26.984954833984375, "global_step": 426553, "epoch": 5139} {"train_loss": -26.6164608001709, "global_step": 426554, "epoch": 5139} {"train_loss": -26.858495712280273, "global_step": 426555, "epoch": 5139} {"train_loss": -26.949798583984375, "global_step": 426556, "epoch": 5139} {"train_loss": -26.791772842407227, "global_step": 426557, "epoch": 5139} {"train_loss": -26.963529586791992, "global_step": 426558, "epoch": 5139} {"train_loss": -26.635589599609375, "global_step": 426559, "epoch": 5139} {"train_loss": -26.9841365814209, "global_step": 426560, "epoch": 5139} {"train_loss": -26.912649154663086, "global_step": 426561, "epoch": 5139} {"train_loss": -26.48126792907715, "global_step": 426562, "epoch": 5139} {"train_loss": -26.9508056640625, "global_step": 426563, "epoch": 5139} {"train_loss": -26.954065322875977, "global_step": 426564, "epoch": 5139} {"train_loss": -26.875524520874023, "global_step": 426565, "epoch": 5139} {"train_loss": -26.789865493774414, "global_step": 426566, "epoch": 5139} {"train_loss": -26.800262451171875, "global_step": 426567, "epoch": 5139} {"train_loss": -26.662195205688477, "global_step": 426568, "epoch": 5139} {"train_loss": -26.72633171081543, "global_step": 426569, "epoch": 5139} {"train_loss": -27.093748092651367, "global_step": 426570, "epoch": 5139} {"train_loss": -26.562381744384766, "global_step": 426571, "epoch": 5139} {"train_loss": -26.99110221862793, "global_step": 426572, "epoch": 5139} {"train_loss": -26.98834800720215, "global_step": 426573, "epoch": 5139} {"train_loss": -26.84722328186035, "global_step": 426574, "epoch": 5139} {"train_loss": -26.825977325439453, "global_step": 426575, "epoch": 5139} {"train_loss": -26.84528160095215, "global_step": 426576, "epoch": 5139} {"train_loss": -26.967041015625, "global_step": 426577, "epoch": 5139} {"train_loss": -26.8284969329834, "global_step": 426578, "epoch": 5139} {"train_loss": -27.06680679321289, "global_step": 426579, "epoch": 5139} {"train_loss": -27.158777236938477, "global_step": 426580, "epoch": 5139} {"train_loss": -26.90688133239746, "global_step": 426581, "epoch": 5139} {"train_loss": -27.08302879333496, "global_step": 426582, "epoch": 5139} {"train_loss": -27.300710678100586, "global_step": 426583, "epoch": 5139} {"train_loss": -27.016077041625977, "global_step": 426584, "epoch": 5139} {"train_loss": -26.80890464782715, "global_step": 426585, "epoch": 5139} {"train_loss": -27.14642906188965, "global_step": 426586, "epoch": 5139} {"train_loss": -27.121335983276367, "global_step": 426587, "epoch": 5139} {"train_loss": -26.6473331451416, "global_step": 426588, "epoch": 5139} {"train_loss": -27.17717933654785, "global_step": 426589, "epoch": 5139} {"train_loss": -27.39031982421875, "global_step": 426590, "epoch": 5139} {"train_loss": -26.504383087158203, "global_step": 426591, "epoch": 5139} {"train_loss": -26.89003562927246, "global_step": 426592, "epoch": 5139} {"train_loss": -26.878564834594727, "global_step": 426593, "epoch": 5139} {"train_loss": -26.669342041015625, "global_step": 426594, "epoch": 5139} {"train_loss": -26.85438346862793, "global_step": 426595, "epoch": 5139} {"train_loss": -27.18118667602539, "global_step": 426596, "epoch": 5139} {"train_loss": -26.944580078125, "global_step": 426597, "epoch": 5139} {"train_loss": -26.71354103088379, "global_step": 426598, "epoch": 5139} {"train_loss": -27.380695343017578, "global_step": 426599, "epoch": 5139} {"train_loss": -26.882251739501953, "global_step": 426600, "epoch": 5139} {"train_loss": -27.132715225219727, "global_step": 426601, "epoch": 5139} {"train_loss": -27.16566276550293, "global_step": 426602, "epoch": 5139} {"train_loss": -26.81818199157715, "global_step": 426603, "epoch": 5139} {"train_loss": -26.7911434173584, "global_step": 426604, "epoch": 5139} {"train_loss": -27.000165939331055, "global_step": 426605, "epoch": 5139} {"train_loss": -27.07891845703125, "global_step": 426606, "epoch": 5139} {"train_loss": -26.868383407592773, "global_step": 426607, "epoch": 5139} {"train_loss": -26.805973052978516, "global_step": 426608, "epoch": 5139} {"train_loss": -26.648971557617188, "global_step": 426609, "epoch": 5139} {"train_loss": -26.987829208374023, "global_step": 426610, "epoch": 5139} {"train_loss": -27.31646728515625, "global_step": 426611, "epoch": 5139} {"train_loss": -26.729873657226562, "global_step": 426612, "epoch": 5139} {"train_loss": -27.11578941345215, "global_step": 426613, "epoch": 5139} {"train_loss": -27.177289962768555, "global_step": 426614, "epoch": 5139} {"train_loss": -26.40540885925293, "global_step": 426615, "epoch": 5139} {"train_loss": -26.94428825378418, "global_step": 426616, "epoch": 5139} {"train_loss": -26.91632652282715, "global_step": 426617, "epoch": 5139} {"train_loss": -26.669116973876953, "global_step": 426618, "epoch": 5139} {"train_loss": -26.797823687633837, "global_step": 426619, "epoch": 5139, "val_loss": 6931210.0} {"train_loss": -26.586339950561523, "global_step": 426620, "epoch": 5140} {"train_loss": -26.070348739624023, "global_step": 426621, "epoch": 5140} {"train_loss": -26.260671615600586, "global_step": 426622, "epoch": 5140} {"train_loss": -26.309926986694336, "global_step": 426623, "epoch": 5140} {"train_loss": -26.508203506469727, "global_step": 426624, "epoch": 5140} {"train_loss": -26.617353439331055, "global_step": 426625, "epoch": 5140} {"train_loss": -26.248477935791016, "global_step": 426626, "epoch": 5140} {"train_loss": -26.316476821899414, "global_step": 426627, "epoch": 5140} {"train_loss": -26.78680992126465, "global_step": 426628, "epoch": 5140} {"train_loss": -26.58314323425293, "global_step": 426629, "epoch": 5140} {"train_loss": -26.52686882019043, "global_step": 426630, "epoch": 5140} {"train_loss": -26.694181442260742, "global_step": 426631, "epoch": 5140} {"train_loss": -26.460071563720703, "global_step": 426632, "epoch": 5140} {"train_loss": -26.234594345092773, "global_step": 426633, "epoch": 5140} {"train_loss": -26.691394805908203, "global_step": 426634, "epoch": 5140} {"train_loss": -26.412656784057617, "global_step": 426635, "epoch": 5140} {"train_loss": -26.433149337768555, "global_step": 426636, "epoch": 5140} {"train_loss": -26.453094482421875, "global_step": 426637, "epoch": 5140} {"train_loss": -26.799835205078125, "global_step": 426638, "epoch": 5140} {"train_loss": -26.421903610229492, "global_step": 426639, "epoch": 5140} {"train_loss": -26.711889266967773, "global_step": 426640, "epoch": 5140} {"train_loss": -26.587141036987305, "global_step": 426641, "epoch": 5140} {"train_loss": -26.47440528869629, "global_step": 426642, "epoch": 5140} {"train_loss": -26.64788818359375, "global_step": 426643, "epoch": 5140} {"train_loss": -27.146472930908203, "global_step": 426644, "epoch": 5140} {"train_loss": -26.460378646850586, "global_step": 426645, "epoch": 5140} {"train_loss": -26.63471031188965, "global_step": 426646, "epoch": 5140} {"train_loss": -26.79721450805664, "global_step": 426647, "epoch": 5140} {"train_loss": -26.907278060913086, "global_step": 426648, "epoch": 5140} {"train_loss": -26.6491641998291, "global_step": 426649, "epoch": 5140} {"train_loss": -26.352798461914062, "global_step": 426650, "epoch": 5140} {"train_loss": -26.50739860534668, "global_step": 426651, "epoch": 5140} {"train_loss": -26.8538875579834, "global_step": 426652, "epoch": 5140} {"train_loss": -26.88251304626465, "global_step": 426653, "epoch": 5140} {"train_loss": -26.8546142578125, "global_step": 426654, "epoch": 5140} {"train_loss": -26.61642837524414, "global_step": 426655, "epoch": 5140} {"train_loss": -26.80765151977539, "global_step": 426656, "epoch": 5140} {"train_loss": -26.770246505737305, "global_step": 426657, "epoch": 5140} {"train_loss": -27.137237548828125, "global_step": 426658, "epoch": 5140} {"train_loss": -27.117694854736328, "global_step": 426659, "epoch": 5140} {"train_loss": -26.739469528198242, "global_step": 426660, "epoch": 5140} {"train_loss": -27.065261840820312, "global_step": 426661, "epoch": 5140} {"train_loss": -26.307687759399414, "global_step": 426662, "epoch": 5140} {"train_loss": -26.906330108642578, "global_step": 426663, "epoch": 5140} {"train_loss": -26.74769401550293, "global_step": 426664, "epoch": 5140} {"train_loss": -27.12110710144043, "global_step": 426665, "epoch": 5140} {"train_loss": -26.664514541625977, "global_step": 426666, "epoch": 5140} {"train_loss": -26.881519317626953, "global_step": 426667, "epoch": 5140} {"train_loss": -26.445280075073242, "global_step": 426668, "epoch": 5140} {"train_loss": -26.895221710205078, "global_step": 426669, "epoch": 5140} {"train_loss": -26.5456485748291, "global_step": 426670, "epoch": 5140} {"train_loss": -26.98101806640625, "global_step": 426671, "epoch": 5140} {"train_loss": -26.78791618347168, "global_step": 426672, "epoch": 5140} {"train_loss": -26.93252944946289, "global_step": 426673, "epoch": 5140} {"train_loss": -26.95233726501465, "global_step": 426674, "epoch": 5140} {"train_loss": -27.093969345092773, "global_step": 426675, "epoch": 5140} {"train_loss": -26.9634952545166, "global_step": 426676, "epoch": 5140} {"train_loss": -26.711734771728516, "global_step": 426677, "epoch": 5140} {"train_loss": -26.62665367126465, "global_step": 426678, "epoch": 5140} {"train_loss": -26.812366485595703, "global_step": 426679, "epoch": 5140} {"train_loss": -27.223968505859375, "global_step": 426680, "epoch": 5140} {"train_loss": -27.347198486328125, "global_step": 426681, "epoch": 5140} {"train_loss": -26.83536148071289, "global_step": 426682, "epoch": 5140} {"train_loss": -26.82191276550293, "global_step": 426683, "epoch": 5140} {"train_loss": -27.12213134765625, "global_step": 426684, "epoch": 5140} {"train_loss": -27.071020126342773, "global_step": 426685, "epoch": 5140} {"train_loss": -26.6575984954834, "global_step": 426686, "epoch": 5140} {"train_loss": -27.14112663269043, "global_step": 426687, "epoch": 5140} {"train_loss": -27.301044464111328, "global_step": 426688, "epoch": 5140} {"train_loss": -27.15467643737793, "global_step": 426689, "epoch": 5140} {"train_loss": -27.198577880859375, "global_step": 426690, "epoch": 5140} {"train_loss": -26.89154052734375, "global_step": 426691, "epoch": 5140} {"train_loss": -27.236042022705078, "global_step": 426692, "epoch": 5140} {"train_loss": -27.014318466186523, "global_step": 426693, "epoch": 5140} {"train_loss": -26.48404884338379, "global_step": 426694, "epoch": 5140} {"train_loss": -27.0124454498291, "global_step": 426695, "epoch": 5140} {"train_loss": -26.945606231689453, "global_step": 426696, "epoch": 5140} {"train_loss": -27.03903579711914, "global_step": 426697, "epoch": 5140} {"train_loss": -27.125568389892578, "global_step": 426698, "epoch": 5140} {"train_loss": -26.74061393737793, "global_step": 426699, "epoch": 5140} {"train_loss": -27.077787399291992, "global_step": 426700, "epoch": 5140} {"train_loss": -26.9099063873291, "global_step": 426701, "epoch": 5140} {"train_loss": -26.776204787104962, "global_step": 426702, "epoch": 5140, "val_loss": 6909182.0} {"train_loss": -26.385345458984375, "global_step": 426703, "epoch": 5141} {"train_loss": -25.838916778564453, "global_step": 426704, "epoch": 5141} {"train_loss": -26.091672897338867, "global_step": 426705, "epoch": 5141} {"train_loss": -25.750778198242188, "global_step": 426706, "epoch": 5141} {"train_loss": -25.068571090698242, "global_step": 426707, "epoch": 5141} {"train_loss": -25.96120262145996, "global_step": 426708, "epoch": 5141} {"train_loss": -26.308218002319336, "global_step": 426709, "epoch": 5141} {"train_loss": -25.566770553588867, "global_step": 426710, "epoch": 5141} {"train_loss": -25.990650177001953, "global_step": 426711, "epoch": 5141} {"train_loss": -26.196653366088867, "global_step": 426712, "epoch": 5141} {"train_loss": -26.24631118774414, "global_step": 426713, "epoch": 5141} {"train_loss": -26.19807243347168, "global_step": 426714, "epoch": 5141} {"train_loss": -26.056371688842773, "global_step": 426715, "epoch": 5141} {"train_loss": -26.254623413085938, "global_step": 426716, "epoch": 5141} {"train_loss": -26.578466415405273, "global_step": 426717, "epoch": 5141} {"train_loss": -26.620101928710938, "global_step": 426718, "epoch": 5141} {"train_loss": -26.609134674072266, "global_step": 426719, "epoch": 5141} {"train_loss": -26.01283073425293, "global_step": 426720, "epoch": 5141} {"train_loss": -26.541040420532227, "global_step": 426721, "epoch": 5141} {"train_loss": -26.7799129486084, "global_step": 426722, "epoch": 5141} {"train_loss": -26.749805450439453, "global_step": 426723, "epoch": 5141} {"train_loss": -26.57242202758789, "global_step": 426724, "epoch": 5141} {"train_loss": -26.5084285736084, "global_step": 426725, "epoch": 5141} {"train_loss": -26.43133544921875, "global_step": 426726, "epoch": 5141} {"train_loss": -26.386632919311523, "global_step": 426727, "epoch": 5141} {"train_loss": -26.4184513092041, "global_step": 426728, "epoch": 5141} {"train_loss": -26.49627113342285, "global_step": 426729, "epoch": 5141} {"train_loss": -26.83392333984375, "global_step": 426730, "epoch": 5141} {"train_loss": -27.143857955932617, "global_step": 426731, "epoch": 5141} {"train_loss": -26.805749893188477, "global_step": 426732, "epoch": 5141} {"train_loss": -26.97898292541504, "global_step": 426733, "epoch": 5141} {"train_loss": -26.933767318725586, "global_step": 426734, "epoch": 5141} {"train_loss": -26.72248649597168, "global_step": 426735, "epoch": 5141} {"train_loss": -27.377439498901367, "global_step": 426736, "epoch": 5141} {"train_loss": -26.49103355407715, "global_step": 426737, "epoch": 5141} {"train_loss": -26.784799575805664, "global_step": 426738, "epoch": 5141} {"train_loss": -26.61799430847168, "global_step": 426739, "epoch": 5141} {"train_loss": -26.6521053314209, "global_step": 426740, "epoch": 5141} {"train_loss": -26.858518600463867, "global_step": 426741, "epoch": 5141} {"train_loss": -26.749536514282227, "global_step": 426742, "epoch": 5141} {"train_loss": -26.727075576782227, "global_step": 426743, "epoch": 5141} {"train_loss": -26.884733200073242, "global_step": 426744, "epoch": 5141} {"train_loss": -27.05521011352539, "global_step": 426745, "epoch": 5141} {"train_loss": -27.0410099029541, "global_step": 426746, "epoch": 5141} {"train_loss": -27.201831817626953, "global_step": 426747, "epoch": 5141} {"train_loss": -26.909412384033203, "global_step": 426748, "epoch": 5141} {"train_loss": -26.753034591674805, "global_step": 426749, "epoch": 5141} {"train_loss": -27.042871475219727, "global_step": 426750, "epoch": 5141} {"train_loss": -27.19199562072754, "global_step": 426751, "epoch": 5141} {"train_loss": -27.325439453125, "global_step": 426752, "epoch": 5141} {"train_loss": -27.219043731689453, "global_step": 426753, "epoch": 5141} {"train_loss": -26.799091339111328, "global_step": 426754, "epoch": 5141} {"train_loss": -26.81133460998535, "global_step": 426755, "epoch": 5141} {"train_loss": -26.840057373046875, "global_step": 426756, "epoch": 5141} {"train_loss": -27.176191329956055, "global_step": 426757, "epoch": 5141} {"train_loss": -26.760059356689453, "global_step": 426758, "epoch": 5141} {"train_loss": -27.06513786315918, "global_step": 426759, "epoch": 5141} {"train_loss": -26.974109649658203, "global_step": 426760, "epoch": 5141} {"train_loss": -26.83635902404785, "global_step": 426761, "epoch": 5141} {"train_loss": -26.9029598236084, "global_step": 426762, "epoch": 5141} {"train_loss": -26.581693649291992, "global_step": 426763, "epoch": 5141} {"train_loss": -26.672168731689453, "global_step": 426764, "epoch": 5141} {"train_loss": -26.49658203125, "global_step": 426765, "epoch": 5141} {"train_loss": -26.732572555541992, "global_step": 426766, "epoch": 5141} {"train_loss": -27.154409408569336, "global_step": 426767, "epoch": 5141} {"train_loss": -26.89210319519043, "global_step": 426768, "epoch": 5141} {"train_loss": -26.70377540588379, "global_step": 426769, "epoch": 5141} {"train_loss": -26.373666763305664, "global_step": 426770, "epoch": 5141} {"train_loss": -26.78525733947754, "global_step": 426771, "epoch": 5141} {"train_loss": -26.842864990234375, "global_step": 426772, "epoch": 5141} {"train_loss": -26.22639274597168, "global_step": 426773, "epoch": 5141} {"train_loss": -25.507638931274414, "global_step": 426774, "epoch": 5141} {"train_loss": -26.017988204956055, "global_step": 426775, "epoch": 5141} {"train_loss": -26.823163986206055, "global_step": 426776, "epoch": 5141} {"train_loss": -26.5030517578125, "global_step": 426777, "epoch": 5141} {"train_loss": -26.553760528564453, "global_step": 426778, "epoch": 5141} {"train_loss": -26.55218505859375, "global_step": 426779, "epoch": 5141} {"train_loss": -26.388690948486328, "global_step": 426780, "epoch": 5141} {"train_loss": -26.279794692993164, "global_step": 426781, "epoch": 5141} {"train_loss": -26.219202041625977, "global_step": 426782, "epoch": 5141} {"train_loss": -26.752424240112305, "global_step": 426783, "epoch": 5141} {"train_loss": -26.971826553344727, "global_step": 426784, "epoch": 5141} {"train_loss": -26.60066972295922, "global_step": 426785, "epoch": 5141, "val_loss": 6860432.5} {"train_loss": -25.7257022857666, "global_step": 426786, "epoch": 5142} {"train_loss": -26.327503204345703, "global_step": 426787, "epoch": 5142} {"train_loss": -25.903425216674805, "global_step": 426788, "epoch": 5142} {"train_loss": -25.86777687072754, "global_step": 426789, "epoch": 5142} {"train_loss": -26.536245346069336, "global_step": 426790, "epoch": 5142} {"train_loss": -26.29233741760254, "global_step": 426791, "epoch": 5142} {"train_loss": -26.54184913635254, "global_step": 426792, "epoch": 5142} {"train_loss": -26.600482940673828, "global_step": 426793, "epoch": 5142} {"train_loss": -26.593420028686523, "global_step": 426794, "epoch": 5142} {"train_loss": -26.615188598632812, "global_step": 426795, "epoch": 5142} {"train_loss": -26.512252807617188, "global_step": 426796, "epoch": 5142} {"train_loss": -26.609960556030273, "global_step": 426797, "epoch": 5142} {"train_loss": -26.2908935546875, "global_step": 426798, "epoch": 5142} {"train_loss": -26.871606826782227, "global_step": 426799, "epoch": 5142} {"train_loss": -26.923002243041992, "global_step": 426800, "epoch": 5142} {"train_loss": -26.6224308013916, "global_step": 426801, "epoch": 5142} {"train_loss": -26.628503799438477, "global_step": 426802, "epoch": 5142} {"train_loss": -26.770416259765625, "global_step": 426803, "epoch": 5142} {"train_loss": -26.794347763061523, "global_step": 426804, "epoch": 5142} {"train_loss": -26.803287506103516, "global_step": 426805, "epoch": 5142} {"train_loss": -27.27027702331543, "global_step": 426806, "epoch": 5142} {"train_loss": -26.941213607788086, "global_step": 426807, "epoch": 5142} {"train_loss": -26.750768661499023, "global_step": 426808, "epoch": 5142} {"train_loss": -26.78448486328125, "global_step": 426809, "epoch": 5142} {"train_loss": -26.89655876159668, "global_step": 426810, "epoch": 5142} {"train_loss": -27.148344039916992, "global_step": 426811, "epoch": 5142} {"train_loss": -26.859235763549805, "global_step": 426812, "epoch": 5142} {"train_loss": -27.024511337280273, "global_step": 426813, "epoch": 5142} {"train_loss": -27.076704025268555, "global_step": 426814, "epoch": 5142} {"train_loss": -26.556745529174805, "global_step": 426815, "epoch": 5142} {"train_loss": -27.060302734375, "global_step": 426816, "epoch": 5142} {"train_loss": -26.732791900634766, "global_step": 426817, "epoch": 5142} {"train_loss": -27.198715209960938, "global_step": 426818, "epoch": 5142} {"train_loss": -26.880908966064453, "global_step": 426819, "epoch": 5142} {"train_loss": -27.099334716796875, "global_step": 426820, "epoch": 5142} {"train_loss": -26.97373390197754, "global_step": 426821, "epoch": 5142} {"train_loss": -27.07305335998535, "global_step": 426822, "epoch": 5142} {"train_loss": -26.965322494506836, "global_step": 426823, "epoch": 5142} {"train_loss": -27.22199058532715, "global_step": 426824, "epoch": 5142} {"train_loss": -26.99249839782715, "global_step": 426825, "epoch": 5142} {"train_loss": -26.745283126831055, "global_step": 426826, "epoch": 5142} {"train_loss": -27.174219131469727, "global_step": 426827, "epoch": 5142} {"train_loss": -26.7407283782959, "global_step": 426828, "epoch": 5142} {"train_loss": -26.5723876953125, "global_step": 426829, "epoch": 5142} {"train_loss": -27.071523666381836, "global_step": 426830, "epoch": 5142} {"train_loss": -26.98862075805664, "global_step": 426831, "epoch": 5142} {"train_loss": -27.121816635131836, "global_step": 426832, "epoch": 5142} {"train_loss": -27.202299118041992, "global_step": 426833, "epoch": 5142} {"train_loss": -26.63527488708496, "global_step": 426834, "epoch": 5142} {"train_loss": -26.55655860900879, "global_step": 426835, "epoch": 5142} {"train_loss": -26.204572677612305, "global_step": 426836, "epoch": 5142} {"train_loss": -25.40061378479004, "global_step": 426837, "epoch": 5142} {"train_loss": -26.297332763671875, "global_step": 426838, "epoch": 5142} {"train_loss": -26.631072998046875, "global_step": 426839, "epoch": 5142} {"train_loss": -25.977758407592773, "global_step": 426840, "epoch": 5142} {"train_loss": -26.34037208557129, "global_step": 426841, "epoch": 5142} {"train_loss": -26.7126407623291, "global_step": 426842, "epoch": 5142} {"train_loss": -26.504226684570312, "global_step": 426843, "epoch": 5142} {"train_loss": -26.537155151367188, "global_step": 426844, "epoch": 5142} {"train_loss": -26.483642578125, "global_step": 426845, "epoch": 5142} {"train_loss": -26.422826766967773, "global_step": 426846, "epoch": 5142} {"train_loss": -26.519611358642578, "global_step": 426847, "epoch": 5142} {"train_loss": -26.79833984375, "global_step": 426848, "epoch": 5142} {"train_loss": -26.250085830688477, "global_step": 426849, "epoch": 5142} {"train_loss": -26.962451934814453, "global_step": 426850, "epoch": 5142} {"train_loss": -26.71615982055664, "global_step": 426851, "epoch": 5142} {"train_loss": -26.42881202697754, "global_step": 426852, "epoch": 5142} {"train_loss": -26.727039337158203, "global_step": 426853, "epoch": 5142} {"train_loss": -26.38921546936035, "global_step": 426854, "epoch": 5142} {"train_loss": -26.700239181518555, "global_step": 426855, "epoch": 5142} {"train_loss": -26.704755783081055, "global_step": 426856, "epoch": 5142} {"train_loss": -26.598133087158203, "global_step": 426857, "epoch": 5142} {"train_loss": -26.625600814819336, "global_step": 426858, "epoch": 5142} {"train_loss": -27.373083114624023, "global_step": 426859, "epoch": 5142} {"train_loss": -26.58979606628418, "global_step": 426860, "epoch": 5142} {"train_loss": -26.498565673828125, "global_step": 426861, "epoch": 5142} {"train_loss": -26.518091201782227, "global_step": 426862, "epoch": 5142} {"train_loss": -26.628503799438477, "global_step": 426863, "epoch": 5142} {"train_loss": -26.4755802154541, "global_step": 426864, "epoch": 5142} {"train_loss": -26.868900299072266, "global_step": 426865, "epoch": 5142} {"train_loss": -26.772705078125, "global_step": 426866, "epoch": 5142} {"train_loss": -26.745635986328125, "global_step": 426867, "epoch": 5142} {"train_loss": -26.663831802735846, "global_step": 426868, "epoch": 5142, "val_loss": 6923849.0} {"train_loss": -26.288049697875977, "global_step": 426869, "epoch": 5143} {"train_loss": -26.694509506225586, "global_step": 426870, "epoch": 5143} {"train_loss": -26.459970474243164, "global_step": 426871, "epoch": 5143} {"train_loss": -26.613927841186523, "global_step": 426872, "epoch": 5143} {"train_loss": -26.716278076171875, "global_step": 426873, "epoch": 5143} {"train_loss": -26.576444625854492, "global_step": 426874, "epoch": 5143} {"train_loss": -26.95637321472168, "global_step": 426875, "epoch": 5143} {"train_loss": -26.466693878173828, "global_step": 426876, "epoch": 5143} {"train_loss": -26.565195083618164, "global_step": 426877, "epoch": 5143} {"train_loss": -26.587072372436523, "global_step": 426878, "epoch": 5143} {"train_loss": -26.501312255859375, "global_step": 426879, "epoch": 5143} {"train_loss": -26.82972526550293, "global_step": 426880, "epoch": 5143} {"train_loss": -26.7633056640625, "global_step": 426881, "epoch": 5143} {"train_loss": -26.666418075561523, "global_step": 426882, "epoch": 5143} {"train_loss": -26.66847038269043, "global_step": 426883, "epoch": 5143} {"train_loss": -26.872634887695312, "global_step": 426884, "epoch": 5143} {"train_loss": -26.531604766845703, "global_step": 426885, "epoch": 5143} {"train_loss": -26.76912498474121, "global_step": 426886, "epoch": 5143} {"train_loss": -26.80971336364746, "global_step": 426887, "epoch": 5143} {"train_loss": -26.479736328125, "global_step": 426888, "epoch": 5143} {"train_loss": -26.717283248901367, "global_step": 426889, "epoch": 5143} {"train_loss": -26.811655044555664, "global_step": 426890, "epoch": 5143} {"train_loss": -27.2860164642334, "global_step": 426891, "epoch": 5143} {"train_loss": -26.836523056030273, "global_step": 426892, "epoch": 5143} {"train_loss": -26.81438636779785, "global_step": 426893, "epoch": 5143} {"train_loss": -26.75678825378418, "global_step": 426894, "epoch": 5143} {"train_loss": -26.85297966003418, "global_step": 426895, "epoch": 5143} {"train_loss": -26.885400772094727, "global_step": 426896, "epoch": 5143} {"train_loss": -26.573423385620117, "global_step": 426897, "epoch": 5143} {"train_loss": -27.15536880493164, "global_step": 426898, "epoch": 5143} {"train_loss": -27.01222038269043, "global_step": 426899, "epoch": 5143} {"train_loss": -26.76173210144043, "global_step": 426900, "epoch": 5143} {"train_loss": -26.595727920532227, "global_step": 426901, "epoch": 5143} {"train_loss": -26.52504539489746, "global_step": 426902, "epoch": 5143} {"train_loss": -26.850513458251953, "global_step": 426903, "epoch": 5143} {"train_loss": -26.398761749267578, "global_step": 426904, "epoch": 5143} {"train_loss": -26.389623641967773, "global_step": 426905, "epoch": 5143} {"train_loss": -26.283422470092773, "global_step": 426906, "epoch": 5143} {"train_loss": -26.972904205322266, "global_step": 426907, "epoch": 5143} {"train_loss": -27.026655197143555, "global_step": 426908, "epoch": 5143} {"train_loss": -26.640226364135742, "global_step": 426909, "epoch": 5143} {"train_loss": -26.609785079956055, "global_step": 426910, "epoch": 5143} {"train_loss": -26.97197914123535, "global_step": 426911, "epoch": 5143} {"train_loss": -27.044607162475586, "global_step": 426912, "epoch": 5143} {"train_loss": -26.84962272644043, "global_step": 426913, "epoch": 5143} {"train_loss": -26.669641494750977, "global_step": 426914, "epoch": 5143} {"train_loss": -26.866363525390625, "global_step": 426915, "epoch": 5143} {"train_loss": -26.584402084350586, "global_step": 426916, "epoch": 5143} {"train_loss": -26.97916603088379, "global_step": 426917, "epoch": 5143} {"train_loss": -26.8737735748291, "global_step": 426918, "epoch": 5143} {"train_loss": -26.686574935913086, "global_step": 426919, "epoch": 5143} {"train_loss": -26.966888427734375, "global_step": 426920, "epoch": 5143} {"train_loss": -26.987085342407227, "global_step": 426921, "epoch": 5143} {"train_loss": -27.00910758972168, "global_step": 426922, "epoch": 5143} {"train_loss": -26.821630477905273, "global_step": 426923, "epoch": 5143} {"train_loss": -26.557315826416016, "global_step": 426924, "epoch": 5143} {"train_loss": -26.680017471313477, "global_step": 426925, "epoch": 5143} {"train_loss": -27.264204025268555, "global_step": 426926, "epoch": 5143} {"train_loss": -27.152063369750977, "global_step": 426927, "epoch": 5143} {"train_loss": -27.142419815063477, "global_step": 426928, "epoch": 5143} {"train_loss": -26.74238395690918, "global_step": 426929, "epoch": 5143} {"train_loss": -27.359268188476562, "global_step": 426930, "epoch": 5143} {"train_loss": -27.071088790893555, "global_step": 426931, "epoch": 5143} {"train_loss": -26.549421310424805, "global_step": 426932, "epoch": 5143} {"train_loss": -27.016357421875, "global_step": 426933, "epoch": 5143} {"train_loss": -27.14568519592285, "global_step": 426934, "epoch": 5143} {"train_loss": -27.130441665649414, "global_step": 426935, "epoch": 5143} {"train_loss": -26.741641998291016, "global_step": 426936, "epoch": 5143} {"train_loss": -26.57318115234375, "global_step": 426937, "epoch": 5143} {"train_loss": -26.510400772094727, "global_step": 426938, "epoch": 5143} {"train_loss": -26.44740104675293, "global_step": 426939, "epoch": 5143} {"train_loss": -26.81072998046875, "global_step": 426940, "epoch": 5143} {"train_loss": -27.140106201171875, "global_step": 426941, "epoch": 5143} {"train_loss": -26.7914981842041, "global_step": 426942, "epoch": 5143} {"train_loss": -26.885526657104492, "global_step": 426943, "epoch": 5143} {"train_loss": -26.641752243041992, "global_step": 426944, "epoch": 5143} {"train_loss": -26.854450225830078, "global_step": 426945, "epoch": 5143} {"train_loss": -26.583953857421875, "global_step": 426946, "epoch": 5143} {"train_loss": -27.029815673828125, "global_step": 426947, "epoch": 5143} {"train_loss": -27.262235641479492, "global_step": 426948, "epoch": 5143} {"train_loss": -27.1174373626709, "global_step": 426949, "epoch": 5143} {"train_loss": -27.016027450561523, "global_step": 426950, "epoch": 5143} {"train_loss": -26.791268957666603, "global_step": 426951, "epoch": 5143, "val_loss": 6947805.0} {"train_loss": -26.809350967407227, "global_step": 426952, "epoch": 5144} {"train_loss": -25.645648956298828, "global_step": 426953, "epoch": 5144} {"train_loss": -24.606964111328125, "global_step": 426954, "epoch": 5144} {"train_loss": -25.929595947265625, "global_step": 426955, "epoch": 5144} {"train_loss": -26.861270904541016, "global_step": 426956, "epoch": 5144} {"train_loss": -25.74472427368164, "global_step": 426957, "epoch": 5144} {"train_loss": -26.092966079711914, "global_step": 426958, "epoch": 5144} {"train_loss": -26.599485397338867, "global_step": 426959, "epoch": 5144} {"train_loss": -26.574234008789062, "global_step": 426960, "epoch": 5144} {"train_loss": -26.144062042236328, "global_step": 426961, "epoch": 5144} {"train_loss": -26.705204010009766, "global_step": 426962, "epoch": 5144} {"train_loss": -26.0113582611084, "global_step": 426963, "epoch": 5144} {"train_loss": -26.782947540283203, "global_step": 426964, "epoch": 5144} {"train_loss": -26.481689453125, "global_step": 426965, "epoch": 5144} {"train_loss": -26.849512100219727, "global_step": 426966, "epoch": 5144} {"train_loss": -26.4873046875, "global_step": 426967, "epoch": 5144} {"train_loss": -26.786579132080078, "global_step": 426968, "epoch": 5144} {"train_loss": -26.541961669921875, "global_step": 426969, "epoch": 5144} {"train_loss": -26.618616104125977, "global_step": 426970, "epoch": 5144} {"train_loss": -26.65541648864746, "global_step": 426971, "epoch": 5144} {"train_loss": -26.42085075378418, "global_step": 426972, "epoch": 5144} {"train_loss": -26.658777236938477, "global_step": 426973, "epoch": 5144} {"train_loss": -26.697790145874023, "global_step": 426974, "epoch": 5144} {"train_loss": -26.59767723083496, "global_step": 426975, "epoch": 5144} {"train_loss": -26.8663387298584, "global_step": 426976, "epoch": 5144} {"train_loss": -26.432483673095703, "global_step": 426977, "epoch": 5144} {"train_loss": -26.792999267578125, "global_step": 426978, "epoch": 5144} {"train_loss": -27.083967208862305, "global_step": 426979, "epoch": 5144} {"train_loss": -26.78632926940918, "global_step": 426980, "epoch": 5144} {"train_loss": -26.688013076782227, "global_step": 426981, "epoch": 5144} {"train_loss": -27.095245361328125, "global_step": 426982, "epoch": 5144} {"train_loss": -26.77650260925293, "global_step": 426983, "epoch": 5144} {"train_loss": -26.93558120727539, "global_step": 426984, "epoch": 5144} {"train_loss": -26.952392578125, "global_step": 426985, "epoch": 5144} {"train_loss": -27.1156063079834, "global_step": 426986, "epoch": 5144} {"train_loss": -26.607471466064453, "global_step": 426987, "epoch": 5144} {"train_loss": -27.030200958251953, "global_step": 426988, "epoch": 5144} {"train_loss": -27.02157974243164, "global_step": 426989, "epoch": 5144} {"train_loss": -27.086673736572266, "global_step": 426990, "epoch": 5144} {"train_loss": -26.887786865234375, "global_step": 426991, "epoch": 5144} {"train_loss": -27.21140480041504, "global_step": 426992, "epoch": 5144} {"train_loss": -27.03364372253418, "global_step": 426993, "epoch": 5144} {"train_loss": -26.775476455688477, "global_step": 426994, "epoch": 5144} {"train_loss": -26.989164352416992, "global_step": 426995, "epoch": 5144} {"train_loss": -26.941009521484375, "global_step": 426996, "epoch": 5144} {"train_loss": -26.968088150024414, "global_step": 426997, "epoch": 5144} {"train_loss": -26.734622955322266, "global_step": 426998, "epoch": 5144} {"train_loss": -26.6900577545166, "global_step": 426999, "epoch": 5144} {"train_loss": -26.925384521484375, "global_step": 427000, "epoch": 5144} {"train_loss": -27.061798095703125, "global_step": 427001, "epoch": 5144} {"train_loss": -26.969263076782227, "global_step": 427002, "epoch": 5144} {"train_loss": -27.17652702331543, "global_step": 427003, "epoch": 5144} {"train_loss": -27.065387725830078, "global_step": 427004, "epoch": 5144} {"train_loss": -27.125980377197266, "global_step": 427005, "epoch": 5144} {"train_loss": -26.945337295532227, "global_step": 427006, "epoch": 5144} {"train_loss": -27.043195724487305, "global_step": 427007, "epoch": 5144} {"train_loss": -27.057870864868164, "global_step": 427008, "epoch": 5144} {"train_loss": -27.204214096069336, "global_step": 427009, "epoch": 5144} {"train_loss": -26.983448028564453, "global_step": 427010, "epoch": 5144} {"train_loss": -27.0059871673584, "global_step": 427011, "epoch": 5144} {"train_loss": -26.812061309814453, "global_step": 427012, "epoch": 5144} {"train_loss": -27.337574005126953, "global_step": 427013, "epoch": 5144} {"train_loss": -27.098419189453125, "global_step": 427014, "epoch": 5144} {"train_loss": -27.3398380279541, "global_step": 427015, "epoch": 5144} {"train_loss": -26.994754791259766, "global_step": 427016, "epoch": 5144} {"train_loss": -26.98032569885254, "global_step": 427017, "epoch": 5144} {"train_loss": -26.73324966430664, "global_step": 427018, "epoch": 5144} {"train_loss": -26.675399780273438, "global_step": 427019, "epoch": 5144} {"train_loss": -27.240148544311523, "global_step": 427020, "epoch": 5144} {"train_loss": -26.97242546081543, "global_step": 427021, "epoch": 5144} {"train_loss": -27.109546661376953, "global_step": 427022, "epoch": 5144} {"train_loss": -27.340681076049805, "global_step": 427023, "epoch": 5144} {"train_loss": -27.005807876586914, "global_step": 427024, "epoch": 5144} {"train_loss": -27.10565185546875, "global_step": 427025, "epoch": 5144} {"train_loss": -26.850866317749023, "global_step": 427026, "epoch": 5144} {"train_loss": -26.281967163085938, "global_step": 427027, "epoch": 5144} {"train_loss": -26.913549423217773, "global_step": 427028, "epoch": 5144} {"train_loss": -26.923370361328125, "global_step": 427029, "epoch": 5144} {"train_loss": -26.672311782836914, "global_step": 427030, "epoch": 5144} {"train_loss": -26.371444702148438, "global_step": 427031, "epoch": 5144} {"train_loss": -26.118066787719727, "global_step": 427032, "epoch": 5144} {"train_loss": -26.481613159179688, "global_step": 427033, "epoch": 5144} {"train_loss": -26.773669507130084, "global_step": 427034, "epoch": 5144, "val_loss": 6847833.5} {"train_loss": -24.889354705810547, "global_step": 427035, "epoch": 5145} {"train_loss": -24.84464454650879, "global_step": 427036, "epoch": 5145} {"train_loss": -26.07655143737793, "global_step": 427037, "epoch": 5145} {"train_loss": -25.530797958374023, "global_step": 427038, "epoch": 5145} {"train_loss": -26.226520538330078, "global_step": 427039, "epoch": 5145} {"train_loss": -25.675037384033203, "global_step": 427040, "epoch": 5145} {"train_loss": -26.48311424255371, "global_step": 427041, "epoch": 5145} {"train_loss": -25.929916381835938, "global_step": 427042, "epoch": 5145} {"train_loss": -26.317398071289062, "global_step": 427043, "epoch": 5145} {"train_loss": -26.486066818237305, "global_step": 427044, "epoch": 5145} {"train_loss": -26.22821044921875, "global_step": 427045, "epoch": 5145} {"train_loss": -26.14995765686035, "global_step": 427046, "epoch": 5145} {"train_loss": -26.04078483581543, "global_step": 427047, "epoch": 5145} {"train_loss": -26.256366729736328, "global_step": 427048, "epoch": 5145} {"train_loss": -26.905149459838867, "global_step": 427049, "epoch": 5145} {"train_loss": -26.1678466796875, "global_step": 427050, "epoch": 5145} {"train_loss": -26.387372970581055, "global_step": 427051, "epoch": 5145} {"train_loss": -26.17525291442871, "global_step": 427052, "epoch": 5145} {"train_loss": -26.56989860534668, "global_step": 427053, "epoch": 5145} {"train_loss": -25.996606826782227, "global_step": 427054, "epoch": 5145} {"train_loss": -26.278308868408203, "global_step": 427055, "epoch": 5145} {"train_loss": -26.591466903686523, "global_step": 427056, "epoch": 5145} {"train_loss": -26.3881778717041, "global_step": 427057, "epoch": 5145} {"train_loss": -26.489990234375, "global_step": 427058, "epoch": 5145} {"train_loss": -26.415206909179688, "global_step": 427059, "epoch": 5145} {"train_loss": -26.57330894470215, "global_step": 427060, "epoch": 5145} {"train_loss": -26.58273696899414, "global_step": 427061, "epoch": 5145} {"train_loss": -26.8757381439209, "global_step": 427062, "epoch": 5145} {"train_loss": -26.669599533081055, "global_step": 427063, "epoch": 5145} {"train_loss": -26.57999610900879, "global_step": 427064, "epoch": 5145} {"train_loss": -26.155746459960938, "global_step": 427065, "epoch": 5145} {"train_loss": -26.334314346313477, "global_step": 427066, "epoch": 5145} {"train_loss": -26.814401626586914, "global_step": 427067, "epoch": 5145} {"train_loss": -26.80564308166504, "global_step": 427068, "epoch": 5145} {"train_loss": -26.901294708251953, "global_step": 427069, "epoch": 5145} {"train_loss": -26.625885009765625, "global_step": 427070, "epoch": 5145} {"train_loss": -27.219772338867188, "global_step": 427071, "epoch": 5145} {"train_loss": -26.849985122680664, "global_step": 427072, "epoch": 5145} {"train_loss": -26.888294219970703, "global_step": 427073, "epoch": 5145} {"train_loss": -26.908512115478516, "global_step": 427074, "epoch": 5145} {"train_loss": -26.80470085144043, "global_step": 427075, "epoch": 5145} {"train_loss": -26.507505416870117, "global_step": 427076, "epoch": 5145} {"train_loss": -26.80367088317871, "global_step": 427077, "epoch": 5145} {"train_loss": -26.917715072631836, "global_step": 427078, "epoch": 5145} {"train_loss": -27.135578155517578, "global_step": 427079, "epoch": 5145} {"train_loss": -27.049182891845703, "global_step": 427080, "epoch": 5145} {"train_loss": -27.028430938720703, "global_step": 427081, "epoch": 5145} {"train_loss": -27.03365135192871, "global_step": 427082, "epoch": 5145} {"train_loss": -26.71681022644043, "global_step": 427083, "epoch": 5145} {"train_loss": -26.889911651611328, "global_step": 427084, "epoch": 5145} {"train_loss": -27.16082763671875, "global_step": 427085, "epoch": 5145} {"train_loss": -27.17168617248535, "global_step": 427086, "epoch": 5145} {"train_loss": -27.05620765686035, "global_step": 427087, "epoch": 5145} {"train_loss": -26.658655166625977, "global_step": 427088, "epoch": 5145} {"train_loss": -26.9267578125, "global_step": 427089, "epoch": 5145} {"train_loss": -26.885940551757812, "global_step": 427090, "epoch": 5145} {"train_loss": -26.77019691467285, "global_step": 427091, "epoch": 5145} {"train_loss": -27.028242111206055, "global_step": 427092, "epoch": 5145} {"train_loss": -26.73883628845215, "global_step": 427093, "epoch": 5145} {"train_loss": -26.898611068725586, "global_step": 427094, "epoch": 5145} {"train_loss": -27.073423385620117, "global_step": 427095, "epoch": 5145} {"train_loss": -27.126758575439453, "global_step": 427096, "epoch": 5145} {"train_loss": -26.897663116455078, "global_step": 427097, "epoch": 5145} {"train_loss": -26.7429141998291, "global_step": 427098, "epoch": 5145} {"train_loss": -26.81165885925293, "global_step": 427099, "epoch": 5145} {"train_loss": -26.840009689331055, "global_step": 427100, "epoch": 5145} {"train_loss": -27.48428726196289, "global_step": 427101, "epoch": 5145} {"train_loss": -27.05750846862793, "global_step": 427102, "epoch": 5145} {"train_loss": -26.924768447875977, "global_step": 427103, "epoch": 5145} {"train_loss": -26.856603622436523, "global_step": 427104, "epoch": 5145} {"train_loss": -26.84431266784668, "global_step": 427105, "epoch": 5145} {"train_loss": -26.893842697143555, "global_step": 427106, "epoch": 5145} {"train_loss": -27.1016788482666, "global_step": 427107, "epoch": 5145} {"train_loss": -27.025732040405273, "global_step": 427108, "epoch": 5145} {"train_loss": -27.06556510925293, "global_step": 427109, "epoch": 5145} {"train_loss": -26.819732666015625, "global_step": 427110, "epoch": 5145} {"train_loss": -26.882043838500977, "global_step": 427111, "epoch": 5145} {"train_loss": -27.2039852142334, "global_step": 427112, "epoch": 5145} {"train_loss": -27.038511276245117, "global_step": 427113, "epoch": 5145} {"train_loss": -26.848554611206055, "global_step": 427114, "epoch": 5145} {"train_loss": -26.539636611938477, "global_step": 427115, "epoch": 5145} {"train_loss": -26.77838134765625, "global_step": 427116, "epoch": 5145} {"train_loss": -26.64682089564312, "global_step": 427117, "epoch": 5145, "val_loss": 6980569.0} {"train_loss": -26.194995880126953, "global_step": 427118, "epoch": 5146} {"train_loss": -26.247955322265625, "global_step": 427119, "epoch": 5146} {"train_loss": -26.534765243530273, "global_step": 427120, "epoch": 5146} {"train_loss": -25.496749877929688, "global_step": 427121, "epoch": 5146} {"train_loss": -26.031482696533203, "global_step": 427122, "epoch": 5146} {"train_loss": -26.147876739501953, "global_step": 427123, "epoch": 5146} {"train_loss": -26.0201416015625, "global_step": 427124, "epoch": 5146} {"train_loss": -25.843963623046875, "global_step": 427125, "epoch": 5146} {"train_loss": -26.387420654296875, "global_step": 427126, "epoch": 5146} {"train_loss": -26.134057998657227, "global_step": 427127, "epoch": 5146} {"train_loss": -26.03034019470215, "global_step": 427128, "epoch": 5146} {"train_loss": -26.78037452697754, "global_step": 427129, "epoch": 5146} {"train_loss": -26.56117057800293, "global_step": 427130, "epoch": 5146} {"train_loss": -26.172956466674805, "global_step": 427131, "epoch": 5146} {"train_loss": -26.746906280517578, "global_step": 427132, "epoch": 5146} {"train_loss": -26.503103256225586, "global_step": 427133, "epoch": 5146} {"train_loss": -26.5303955078125, "global_step": 427134, "epoch": 5146} {"train_loss": -26.4287109375, "global_step": 427135, "epoch": 5146} {"train_loss": -26.456146240234375, "global_step": 427136, "epoch": 5146} {"train_loss": -26.261245727539062, "global_step": 427137, "epoch": 5146} {"train_loss": -26.261274337768555, "global_step": 427138, "epoch": 5146} {"train_loss": -26.50361442565918, "global_step": 427139, "epoch": 5146} {"train_loss": -26.72686195373535, "global_step": 427140, "epoch": 5146} {"train_loss": -26.462427139282227, "global_step": 427141, "epoch": 5146} {"train_loss": -26.544164657592773, "global_step": 427142, "epoch": 5146} {"train_loss": -26.501562118530273, "global_step": 427143, "epoch": 5146} {"train_loss": -26.84286880493164, "global_step": 427144, "epoch": 5146} {"train_loss": -26.88441276550293, "global_step": 427145, "epoch": 5146} {"train_loss": -26.369556427001953, "global_step": 427146, "epoch": 5146} {"train_loss": -26.77497673034668, "global_step": 427147, "epoch": 5146} {"train_loss": -26.608489990234375, "global_step": 427148, "epoch": 5146} {"train_loss": -26.938629150390625, "global_step": 427149, "epoch": 5146} {"train_loss": -26.59429359436035, "global_step": 427150, "epoch": 5146} {"train_loss": -26.84246253967285, "global_step": 427151, "epoch": 5146} {"train_loss": -26.67071533203125, "global_step": 427152, "epoch": 5146} {"train_loss": -26.97257423400879, "global_step": 427153, "epoch": 5146} {"train_loss": -26.903554916381836, "global_step": 427154, "epoch": 5146} {"train_loss": -26.8287410736084, "global_step": 427155, "epoch": 5146} {"train_loss": -26.609954833984375, "global_step": 427156, "epoch": 5146} {"train_loss": -26.957422256469727, "global_step": 427157, "epoch": 5146} {"train_loss": -26.8907413482666, "global_step": 427158, "epoch": 5146} {"train_loss": -26.71512794494629, "global_step": 427159, "epoch": 5146} {"train_loss": -26.51515007019043, "global_step": 427160, "epoch": 5146} {"train_loss": -27.15616798400879, "global_step": 427161, "epoch": 5146} {"train_loss": -26.784021377563477, "global_step": 427162, "epoch": 5146} {"train_loss": -26.57135581970215, "global_step": 427163, "epoch": 5146} {"train_loss": -26.908817291259766, "global_step": 427164, "epoch": 5146} {"train_loss": -26.771657943725586, "global_step": 427165, "epoch": 5146} {"train_loss": -27.026098251342773, "global_step": 427166, "epoch": 5146} {"train_loss": -26.8089656829834, "global_step": 427167, "epoch": 5146} {"train_loss": -27.31083106994629, "global_step": 427168, "epoch": 5146} {"train_loss": -26.9117374420166, "global_step": 427169, "epoch": 5146} {"train_loss": -26.88376235961914, "global_step": 427170, "epoch": 5146} {"train_loss": -27.03631019592285, "global_step": 427171, "epoch": 5146} {"train_loss": -27.01332664489746, "global_step": 427172, "epoch": 5146} {"train_loss": -26.826007843017578, "global_step": 427173, "epoch": 5146} {"train_loss": -27.27522087097168, "global_step": 427174, "epoch": 5146} {"train_loss": -26.771163940429688, "global_step": 427175, "epoch": 5146} {"train_loss": -26.692646026611328, "global_step": 427176, "epoch": 5146} {"train_loss": -26.57282066345215, "global_step": 427177, "epoch": 5146} {"train_loss": -26.776386260986328, "global_step": 427178, "epoch": 5146} {"train_loss": -26.928678512573242, "global_step": 427179, "epoch": 5146} {"train_loss": -26.861684799194336, "global_step": 427180, "epoch": 5146} {"train_loss": -26.58526611328125, "global_step": 427181, "epoch": 5146} {"train_loss": -26.9947566986084, "global_step": 427182, "epoch": 5146} {"train_loss": -26.863248825073242, "global_step": 427183, "epoch": 5146} {"train_loss": -27.413349151611328, "global_step": 427184, "epoch": 5146} {"train_loss": -26.843555450439453, "global_step": 427185, "epoch": 5146} {"train_loss": -26.870471954345703, "global_step": 427186, "epoch": 5146} {"train_loss": -27.05620765686035, "global_step": 427187, "epoch": 5146} {"train_loss": -26.7883243560791, "global_step": 427188, "epoch": 5146} {"train_loss": -26.975467681884766, "global_step": 427189, "epoch": 5146} {"train_loss": -26.992589950561523, "global_step": 427190, "epoch": 5146} {"train_loss": -26.958240509033203, "global_step": 427191, "epoch": 5146} {"train_loss": -26.886138916015625, "global_step": 427192, "epoch": 5146} {"train_loss": -27.13008689880371, "global_step": 427193, "epoch": 5146} {"train_loss": -26.841461181640625, "global_step": 427194, "epoch": 5146} {"train_loss": -27.161352157592773, "global_step": 427195, "epoch": 5146} {"train_loss": -26.919286727905273, "global_step": 427196, "epoch": 5146} {"train_loss": -27.113758087158203, "global_step": 427197, "epoch": 5146} {"train_loss": -26.957895278930664, "global_step": 427198, "epoch": 5146} {"train_loss": -27.100595474243164, "global_step": 427199, "epoch": 5146} {"train_loss": -26.688619659607667, "global_step": 427200, "epoch": 5146, "val_loss": 6915612.0} {"train_loss": -25.922882080078125, "global_step": 427201, "epoch": 5147} {"train_loss": -25.32076644897461, "global_step": 427202, "epoch": 5147} {"train_loss": -25.82818031311035, "global_step": 427203, "epoch": 5147} {"train_loss": -25.62579917907715, "global_step": 427204, "epoch": 5147} {"train_loss": -25.87359619140625, "global_step": 427205, "epoch": 5147} {"train_loss": -26.300445556640625, "global_step": 427206, "epoch": 5147} {"train_loss": -26.063465118408203, "global_step": 427207, "epoch": 5147} {"train_loss": -26.6115665435791, "global_step": 427208, "epoch": 5147} {"train_loss": -26.3232479095459, "global_step": 427209, "epoch": 5147} {"train_loss": -26.117467880249023, "global_step": 427210, "epoch": 5147} {"train_loss": -26.508764266967773, "global_step": 427211, "epoch": 5147} {"train_loss": -26.355443954467773, "global_step": 427212, "epoch": 5147} {"train_loss": -26.604969024658203, "global_step": 427213, "epoch": 5147} {"train_loss": -26.657196044921875, "global_step": 427214, "epoch": 5147} {"train_loss": -26.598587036132812, "global_step": 427215, "epoch": 5147} {"train_loss": -26.96571159362793, "global_step": 427216, "epoch": 5147} {"train_loss": -26.61384391784668, "global_step": 427217, "epoch": 5147} {"train_loss": -26.623151779174805, "global_step": 427218, "epoch": 5147} {"train_loss": -27.08074378967285, "global_step": 427219, "epoch": 5147} {"train_loss": -26.403076171875, "global_step": 427220, "epoch": 5147} {"train_loss": -26.765356063842773, "global_step": 427221, "epoch": 5147} {"train_loss": -26.355939865112305, "global_step": 427222, "epoch": 5147} {"train_loss": -26.860021591186523, "global_step": 427223, "epoch": 5147} {"train_loss": -27.069738388061523, "global_step": 427224, "epoch": 5147} {"train_loss": -26.49043846130371, "global_step": 427225, "epoch": 5147} {"train_loss": -26.847883224487305, "global_step": 427226, "epoch": 5147} {"train_loss": -26.872648239135742, "global_step": 427227, "epoch": 5147} {"train_loss": -26.68888282775879, "global_step": 427228, "epoch": 5147} {"train_loss": -27.028051376342773, "global_step": 427229, "epoch": 5147} {"train_loss": -26.71248435974121, "global_step": 427230, "epoch": 5147} {"train_loss": -26.873462677001953, "global_step": 427231, "epoch": 5147} {"train_loss": -26.895532608032227, "global_step": 427232, "epoch": 5147} {"train_loss": -26.862730026245117, "global_step": 427233, "epoch": 5147} {"train_loss": -26.98084831237793, "global_step": 427234, "epoch": 5147} {"train_loss": -26.650104522705078, "global_step": 427235, "epoch": 5147} {"train_loss": -26.82647705078125, "global_step": 427236, "epoch": 5147} {"train_loss": -27.02326774597168, "global_step": 427237, "epoch": 5147} {"train_loss": -26.789081573486328, "global_step": 427238, "epoch": 5147} {"train_loss": -26.789783477783203, "global_step": 427239, "epoch": 5147} {"train_loss": -26.911718368530273, "global_step": 427240, "epoch": 5147} {"train_loss": -26.665802001953125, "global_step": 427241, "epoch": 5147} {"train_loss": -26.788867950439453, "global_step": 427242, "epoch": 5147} {"train_loss": -27.12110710144043, "global_step": 427243, "epoch": 5147} {"train_loss": -26.759552001953125, "global_step": 427244, "epoch": 5147} {"train_loss": -26.719058990478516, "global_step": 427245, "epoch": 5147} {"train_loss": -27.107202529907227, "global_step": 427246, "epoch": 5147} {"train_loss": -26.816370010375977, "global_step": 427247, "epoch": 5147} {"train_loss": -26.773330688476562, "global_step": 427248, "epoch": 5147} {"train_loss": -26.709699630737305, "global_step": 427249, "epoch": 5147} {"train_loss": -26.783233642578125, "global_step": 427250, "epoch": 5147} {"train_loss": -26.952009201049805, "global_step": 427251, "epoch": 5147} {"train_loss": -26.705860137939453, "global_step": 427252, "epoch": 5147} {"train_loss": -26.990020751953125, "global_step": 427253, "epoch": 5147} {"train_loss": -26.7613582611084, "global_step": 427254, "epoch": 5147} {"train_loss": -26.91377067565918, "global_step": 427255, "epoch": 5147} {"train_loss": -26.892658233642578, "global_step": 427256, "epoch": 5147} {"train_loss": -26.749954223632812, "global_step": 427257, "epoch": 5147} {"train_loss": -26.478612899780273, "global_step": 427258, "epoch": 5147} {"train_loss": -26.88221549987793, "global_step": 427259, "epoch": 5147} {"train_loss": -27.002492904663086, "global_step": 427260, "epoch": 5147} {"train_loss": -26.510498046875, "global_step": 427261, "epoch": 5147} {"train_loss": -26.447925567626953, "global_step": 427262, "epoch": 5147} {"train_loss": -26.737991333007812, "global_step": 427263, "epoch": 5147} {"train_loss": -26.919408798217773, "global_step": 427264, "epoch": 5147} {"train_loss": -26.51361656188965, "global_step": 427265, "epoch": 5147} {"train_loss": -26.968786239624023, "global_step": 427266, "epoch": 5147} {"train_loss": -26.783227920532227, "global_step": 427267, "epoch": 5147} {"train_loss": -26.623071670532227, "global_step": 427268, "epoch": 5147} {"train_loss": -26.551176071166992, "global_step": 427269, "epoch": 5147} {"train_loss": -26.870397567749023, "global_step": 427270, "epoch": 5147} {"train_loss": -26.51932144165039, "global_step": 427271, "epoch": 5147} {"train_loss": -26.551847457885742, "global_step": 427272, "epoch": 5147} {"train_loss": -26.79554557800293, "global_step": 427273, "epoch": 5147} {"train_loss": -26.801013946533203, "global_step": 427274, "epoch": 5147} {"train_loss": -26.870193481445312, "global_step": 427275, "epoch": 5147} {"train_loss": -26.996793746948242, "global_step": 427276, "epoch": 5147} {"train_loss": -26.994016647338867, "global_step": 427277, "epoch": 5147} {"train_loss": -26.59694480895996, "global_step": 427278, "epoch": 5147} {"train_loss": -26.69719886779785, "global_step": 427279, "epoch": 5147} {"train_loss": -27.304431915283203, "global_step": 427280, "epoch": 5147} {"train_loss": -26.616382598876953, "global_step": 427281, "epoch": 5147} {"train_loss": -26.453954696655273, "global_step": 427282, "epoch": 5147} {"train_loss": -26.679686144173864, "global_step": 427283, "epoch": 5147, "val_loss": 6898450.0} {"train_loss": -26.02364158630371, "global_step": 427284, "epoch": 5148} {"train_loss": -26.349157333374023, "global_step": 427285, "epoch": 5148} {"train_loss": -26.277456283569336, "global_step": 427286, "epoch": 5148} {"train_loss": -26.445423126220703, "global_step": 427287, "epoch": 5148} {"train_loss": -25.7574462890625, "global_step": 427288, "epoch": 5148} {"train_loss": -26.600238800048828, "global_step": 427289, "epoch": 5148} {"train_loss": -26.173236846923828, "global_step": 427290, "epoch": 5148} {"train_loss": -26.3736515045166, "global_step": 427291, "epoch": 5148} {"train_loss": -26.12262535095215, "global_step": 427292, "epoch": 5148} {"train_loss": -26.54363441467285, "global_step": 427293, "epoch": 5148} {"train_loss": -26.762714385986328, "global_step": 427294, "epoch": 5148} {"train_loss": -26.72900390625, "global_step": 427295, "epoch": 5148} {"train_loss": -26.790075302124023, "global_step": 427296, "epoch": 5148} {"train_loss": -26.531538009643555, "global_step": 427297, "epoch": 5148} {"train_loss": -26.828763961791992, "global_step": 427298, "epoch": 5148} {"train_loss": -26.953018188476562, "global_step": 427299, "epoch": 5148} {"train_loss": -26.767126083374023, "global_step": 427300, "epoch": 5148} {"train_loss": -26.66582679748535, "global_step": 427301, "epoch": 5148} {"train_loss": -26.681135177612305, "global_step": 427302, "epoch": 5148} {"train_loss": -26.855798721313477, "global_step": 427303, "epoch": 5148} {"train_loss": -26.818552017211914, "global_step": 427304, "epoch": 5148} {"train_loss": -26.471698760986328, "global_step": 427305, "epoch": 5148} {"train_loss": -26.716724395751953, "global_step": 427306, "epoch": 5148} {"train_loss": -26.565216064453125, "global_step": 427307, "epoch": 5148} {"train_loss": -26.9279842376709, "global_step": 427308, "epoch": 5148} {"train_loss": -26.256977081298828, "global_step": 427309, "epoch": 5148} {"train_loss": -26.552295684814453, "global_step": 427310, "epoch": 5148} {"train_loss": -26.789051055908203, "global_step": 427311, "epoch": 5148} {"train_loss": -26.737659454345703, "global_step": 427312, "epoch": 5148} {"train_loss": -26.80561637878418, "global_step": 427313, "epoch": 5148} {"train_loss": -26.92793083190918, "global_step": 427314, "epoch": 5148} {"train_loss": -26.99074363708496, "global_step": 427315, "epoch": 5148} {"train_loss": -26.796741485595703, "global_step": 427316, "epoch": 5148} {"train_loss": -26.61631202697754, "global_step": 427317, "epoch": 5148} {"train_loss": -27.01426124572754, "global_step": 427318, "epoch": 5148} {"train_loss": -27.043476104736328, "global_step": 427319, "epoch": 5148} {"train_loss": -26.849151611328125, "global_step": 427320, "epoch": 5148} {"train_loss": -26.805627822875977, "global_step": 427321, "epoch": 5148} {"train_loss": -26.61355972290039, "global_step": 427322, "epoch": 5148} {"train_loss": -27.0535888671875, "global_step": 427323, "epoch": 5148} {"train_loss": -26.861846923828125, "global_step": 427324, "epoch": 5148} {"train_loss": -27.02179527282715, "global_step": 427325, "epoch": 5148} {"train_loss": -26.887205123901367, "global_step": 427326, "epoch": 5148} {"train_loss": -27.014429092407227, "global_step": 427327, "epoch": 5148} {"train_loss": -27.319849014282227, "global_step": 427328, "epoch": 5148} {"train_loss": -27.02655029296875, "global_step": 427329, "epoch": 5148} {"train_loss": -26.843616485595703, "global_step": 427330, "epoch": 5148} {"train_loss": -26.83884620666504, "global_step": 427331, "epoch": 5148} {"train_loss": -26.899999618530273, "global_step": 427332, "epoch": 5148} {"train_loss": -26.7077693939209, "global_step": 427333, "epoch": 5148} {"train_loss": -26.763263702392578, "global_step": 427334, "epoch": 5148} {"train_loss": -26.445966720581055, "global_step": 427335, "epoch": 5148} {"train_loss": -27.106252670288086, "global_step": 427336, "epoch": 5148} {"train_loss": -26.584009170532227, "global_step": 427337, "epoch": 5148} {"train_loss": -26.699039459228516, "global_step": 427338, "epoch": 5148} {"train_loss": -27.05698013305664, "global_step": 427339, "epoch": 5148} {"train_loss": -26.90326499938965, "global_step": 427340, "epoch": 5148} {"train_loss": -27.155548095703125, "global_step": 427341, "epoch": 5148} {"train_loss": -26.482580184936523, "global_step": 427342, "epoch": 5148} {"train_loss": -26.99298095703125, "global_step": 427343, "epoch": 5148} {"train_loss": -27.1960391998291, "global_step": 427344, "epoch": 5148} {"train_loss": -26.71845054626465, "global_step": 427345, "epoch": 5148} {"train_loss": -26.770709991455078, "global_step": 427346, "epoch": 5148} {"train_loss": -26.95734214782715, "global_step": 427347, "epoch": 5148} {"train_loss": -26.76014518737793, "global_step": 427348, "epoch": 5148} {"train_loss": -26.6715087890625, "global_step": 427349, "epoch": 5148} {"train_loss": -27.181812286376953, "global_step": 427350, "epoch": 5148} {"train_loss": -26.717697143554688, "global_step": 427351, "epoch": 5148} {"train_loss": -26.589197158813477, "global_step": 427352, "epoch": 5148} {"train_loss": -26.81646156311035, "global_step": 427353, "epoch": 5148} {"train_loss": -26.813444137573242, "global_step": 427354, "epoch": 5148} {"train_loss": -26.803342819213867, "global_step": 427355, "epoch": 5148} {"train_loss": -26.425628662109375, "global_step": 427356, "epoch": 5148} {"train_loss": -26.75506591796875, "global_step": 427357, "epoch": 5148} {"train_loss": -26.918432235717773, "global_step": 427358, "epoch": 5148} {"train_loss": -26.404693603515625, "global_step": 427359, "epoch": 5148} {"train_loss": -26.8226261138916, "global_step": 427360, "epoch": 5148} {"train_loss": -26.96722412109375, "global_step": 427361, "epoch": 5148} {"train_loss": -26.80341148376465, "global_step": 427362, "epoch": 5148} {"train_loss": -26.425724029541016, "global_step": 427363, "epoch": 5148} {"train_loss": -26.663227081298828, "global_step": 427364, "epoch": 5148} {"train_loss": -27.118871688842773, "global_step": 427365, "epoch": 5148} {"train_loss": -26.75588021795434, "global_step": 427366, "epoch": 5148, "val_loss": 6786848.0} {"train_loss": -25.61138916015625, "global_step": 427367, "epoch": 5149} {"train_loss": -25.079145431518555, "global_step": 427368, "epoch": 5149} {"train_loss": -25.145034790039062, "global_step": 427369, "epoch": 5149} {"train_loss": -26.295568466186523, "global_step": 427370, "epoch": 5149} {"train_loss": -25.875110626220703, "global_step": 427371, "epoch": 5149} {"train_loss": -26.128141403198242, "global_step": 427372, "epoch": 5149} {"train_loss": -25.914981842041016, "global_step": 427373, "epoch": 5149} {"train_loss": -26.266284942626953, "global_step": 427374, "epoch": 5149} {"train_loss": -26.626331329345703, "global_step": 427375, "epoch": 5149} {"train_loss": -26.08066177368164, "global_step": 427376, "epoch": 5149} {"train_loss": -26.437707901000977, "global_step": 427377, "epoch": 5149} {"train_loss": -26.214147567749023, "global_step": 427378, "epoch": 5149} {"train_loss": -26.385541915893555, "global_step": 427379, "epoch": 5149} {"train_loss": -26.47796630859375, "global_step": 427380, "epoch": 5149} {"train_loss": -26.19217300415039, "global_step": 427381, "epoch": 5149} {"train_loss": -26.383895874023438, "global_step": 427382, "epoch": 5149} {"train_loss": -26.55592155456543, "global_step": 427383, "epoch": 5149} {"train_loss": -26.43802833557129, "global_step": 427384, "epoch": 5149} {"train_loss": -26.519424438476562, "global_step": 427385, "epoch": 5149} {"train_loss": -26.498510360717773, "global_step": 427386, "epoch": 5149} {"train_loss": -26.512786865234375, "global_step": 427387, "epoch": 5149} {"train_loss": -26.380582809448242, "global_step": 427388, "epoch": 5149} {"train_loss": -26.220731735229492, "global_step": 427389, "epoch": 5149} {"train_loss": -26.63345718383789, "global_step": 427390, "epoch": 5149} {"train_loss": -26.8319091796875, "global_step": 427391, "epoch": 5149} {"train_loss": -27.00996208190918, "global_step": 427392, "epoch": 5149} {"train_loss": -27.111082077026367, "global_step": 427393, "epoch": 5149} {"train_loss": -26.965314865112305, "global_step": 427394, "epoch": 5149} {"train_loss": -26.798160552978516, "global_step": 427395, "epoch": 5149} {"train_loss": -26.704833984375, "global_step": 427396, "epoch": 5149} {"train_loss": -26.8348445892334, "global_step": 427397, "epoch": 5149} {"train_loss": -26.70413589477539, "global_step": 427398, "epoch": 5149} {"train_loss": -26.6781063079834, "global_step": 427399, "epoch": 5149} {"train_loss": -26.663782119750977, "global_step": 427400, "epoch": 5149} {"train_loss": -26.894866943359375, "global_step": 427401, "epoch": 5149} {"train_loss": -27.114301681518555, "global_step": 427402, "epoch": 5149} {"train_loss": -26.891281127929688, "global_step": 427403, "epoch": 5149} {"train_loss": -26.95757484436035, "global_step": 427404, "epoch": 5149} {"train_loss": -26.818073272705078, "global_step": 427405, "epoch": 5149} {"train_loss": -26.69439697265625, "global_step": 427406, "epoch": 5149} {"train_loss": -26.79767417907715, "global_step": 427407, "epoch": 5149} {"train_loss": -26.836151123046875, "global_step": 427408, "epoch": 5149} {"train_loss": -26.437591552734375, "global_step": 427409, "epoch": 5149} {"train_loss": -27.10248374938965, "global_step": 427410, "epoch": 5149} {"train_loss": -26.933103561401367, "global_step": 427411, "epoch": 5149} {"train_loss": -26.90232276916504, "global_step": 427412, "epoch": 5149} {"train_loss": -26.954803466796875, "global_step": 427413, "epoch": 5149} {"train_loss": -26.680383682250977, "global_step": 427414, "epoch": 5149} {"train_loss": -26.877355575561523, "global_step": 427415, "epoch": 5149} {"train_loss": -26.87167739868164, "global_step": 427416, "epoch": 5149} {"train_loss": -26.99005699157715, "global_step": 427417, "epoch": 5149} {"train_loss": -26.820575714111328, "global_step": 427418, "epoch": 5149} {"train_loss": -27.102508544921875, "global_step": 427419, "epoch": 5149} {"train_loss": -26.93256187438965, "global_step": 427420, "epoch": 5149} {"train_loss": -27.157791137695312, "global_step": 427421, "epoch": 5149} {"train_loss": -27.2191162109375, "global_step": 427422, "epoch": 5149} {"train_loss": -27.15765380859375, "global_step": 427423, "epoch": 5149} {"train_loss": -26.50374412536621, "global_step": 427424, "epoch": 5149} {"train_loss": -27.2752685546875, "global_step": 427425, "epoch": 5149} {"train_loss": -26.97681999206543, "global_step": 427426, "epoch": 5149} {"train_loss": -26.80908203125, "global_step": 427427, "epoch": 5149} {"train_loss": -26.980085372924805, "global_step": 427428, "epoch": 5149} {"train_loss": -26.88514518737793, "global_step": 427429, "epoch": 5149} {"train_loss": -26.899555206298828, "global_step": 427430, "epoch": 5149} {"train_loss": -26.63102149963379, "global_step": 427431, "epoch": 5149} {"train_loss": -26.19532585144043, "global_step": 427432, "epoch": 5149} {"train_loss": -25.718612670898438, "global_step": 427433, "epoch": 5149} {"train_loss": -26.121112823486328, "global_step": 427434, "epoch": 5149} {"train_loss": -26.05918312072754, "global_step": 427435, "epoch": 5149} {"train_loss": -26.0596981048584, "global_step": 427436, "epoch": 5149} {"train_loss": -26.813642501831055, "global_step": 427437, "epoch": 5149} {"train_loss": -26.609586715698242, "global_step": 427438, "epoch": 5149} {"train_loss": -26.49045753479004, "global_step": 427439, "epoch": 5149} {"train_loss": -26.79294204711914, "global_step": 427440, "epoch": 5149} {"train_loss": -26.224897384643555, "global_step": 427441, "epoch": 5149} {"train_loss": -26.658035278320312, "global_step": 427442, "epoch": 5149} {"train_loss": -26.497167587280273, "global_step": 427443, "epoch": 5149} {"train_loss": -26.696069717407227, "global_step": 427444, "epoch": 5149} {"train_loss": -26.716140747070312, "global_step": 427445, "epoch": 5149} {"train_loss": -27.009220123291016, "global_step": 427446, "epoch": 5149} {"train_loss": -26.870136260986328, "global_step": 427447, "epoch": 5149} {"train_loss": -26.43125343322754, "global_step": 427448, "epoch": 5149} {"train_loss": -26.597308331225292, "global_step": 427449, "epoch": 5149, "val_loss": 6876603.0} {"train_loss": -26.201953887939453, "global_step": 427450, "epoch": 5150} {"train_loss": -26.4727840423584, "global_step": 427451, "epoch": 5150} {"train_loss": -26.598134994506836, "global_step": 427452, "epoch": 5150} {"train_loss": -25.896957397460938, "global_step": 427453, "epoch": 5150} {"train_loss": -26.410724639892578, "global_step": 427454, "epoch": 5150} {"train_loss": -26.333484649658203, "global_step": 427455, "epoch": 5150} {"train_loss": -26.485071182250977, "global_step": 427456, "epoch": 5150} {"train_loss": -26.474700927734375, "global_step": 427457, "epoch": 5150} {"train_loss": -26.6561279296875, "global_step": 427458, "epoch": 5150} {"train_loss": -26.407257080078125, "global_step": 427459, "epoch": 5150} {"train_loss": -26.770401000976562, "global_step": 427460, "epoch": 5150} {"train_loss": -25.943471908569336, "global_step": 427461, "epoch": 5150} {"train_loss": -26.499725341796875, "global_step": 427462, "epoch": 5150} {"train_loss": -26.001134872436523, "global_step": 427463, "epoch": 5150} {"train_loss": -26.5726318359375, "global_step": 427464, "epoch": 5150} {"train_loss": -26.70269203186035, "global_step": 427465, "epoch": 5150} {"train_loss": -26.8210506439209, "global_step": 427466, "epoch": 5150} {"train_loss": -26.89508628845215, "global_step": 427467, "epoch": 5150} {"train_loss": -26.589635848999023, "global_step": 427468, "epoch": 5150} {"train_loss": -26.75722312927246, "global_step": 427469, "epoch": 5150} {"train_loss": -26.856494903564453, "global_step": 427470, "epoch": 5150} {"train_loss": -26.8028621673584, "global_step": 427471, "epoch": 5150} {"train_loss": -26.518308639526367, "global_step": 427472, "epoch": 5150} {"train_loss": -26.355972290039062, "global_step": 427473, "epoch": 5150} {"train_loss": -26.674224853515625, "global_step": 427474, "epoch": 5150} {"train_loss": -26.727426528930664, "global_step": 427475, "epoch": 5150} {"train_loss": -26.962751388549805, "global_step": 427476, "epoch": 5150} {"train_loss": -26.93364906311035, "global_step": 427477, "epoch": 5150} {"train_loss": -26.77174186706543, "global_step": 427478, "epoch": 5150} {"train_loss": -26.910327911376953, "global_step": 427479, "epoch": 5150} {"train_loss": -26.760883331298828, "global_step": 427480, "epoch": 5150} {"train_loss": -26.917383193969727, "global_step": 427481, "epoch": 5150} {"train_loss": -26.995441436767578, "global_step": 427482, "epoch": 5150} {"train_loss": -26.630512237548828, "global_step": 427483, "epoch": 5150} {"train_loss": -26.965423583984375, "global_step": 427484, "epoch": 5150} {"train_loss": -27.0350399017334, "global_step": 427485, "epoch": 5150} {"train_loss": -26.85987663269043, "global_step": 427486, "epoch": 5150} {"train_loss": -26.805633544921875, "global_step": 427487, "epoch": 5150} {"train_loss": -26.829544067382812, "global_step": 427488, "epoch": 5150} {"train_loss": -27.005643844604492, "global_step": 427489, "epoch": 5150} {"train_loss": -26.8710880279541, "global_step": 427490, "epoch": 5150} {"train_loss": -26.7849063873291, "global_step": 427491, "epoch": 5150} {"train_loss": -26.967700958251953, "global_step": 427492, "epoch": 5150} {"train_loss": -26.802448272705078, "global_step": 427493, "epoch": 5150} {"train_loss": -27.04994773864746, "global_step": 427494, "epoch": 5150} {"train_loss": -26.805408477783203, "global_step": 427495, "epoch": 5150} {"train_loss": -26.87843132019043, "global_step": 427496, "epoch": 5150} {"train_loss": -26.802814483642578, "global_step": 427497, "epoch": 5150} {"train_loss": -26.864561080932617, "global_step": 427498, "epoch": 5150} {"train_loss": -26.85306167602539, "global_step": 427499, "epoch": 5150} {"train_loss": -27.071441650390625, "global_step": 427500, "epoch": 5150} {"train_loss": -26.72541618347168, "global_step": 427501, "epoch": 5150} {"train_loss": -26.700210571289062, "global_step": 427502, "epoch": 5150} {"train_loss": -27.198001861572266, "global_step": 427503, "epoch": 5150} {"train_loss": -27.00848960876465, "global_step": 427504, "epoch": 5150} {"train_loss": -26.923925399780273, "global_step": 427505, "epoch": 5150} {"train_loss": -27.03208351135254, "global_step": 427506, "epoch": 5150} {"train_loss": -27.139856338500977, "global_step": 427507, "epoch": 5150} {"train_loss": -26.81341552734375, "global_step": 427508, "epoch": 5150} {"train_loss": -26.94069480895996, "global_step": 427509, "epoch": 5150} {"train_loss": -27.154541015625, "global_step": 427510, "epoch": 5150} {"train_loss": -26.71038246154785, "global_step": 427511, "epoch": 5150} {"train_loss": -27.211042404174805, "global_step": 427512, "epoch": 5150} {"train_loss": -26.854955673217773, "global_step": 427513, "epoch": 5150} {"train_loss": -27.324575424194336, "global_step": 427514, "epoch": 5150} {"train_loss": -27.083921432495117, "global_step": 427515, "epoch": 5150} {"train_loss": -26.921056747436523, "global_step": 427516, "epoch": 5150} {"train_loss": -27.299219131469727, "global_step": 427517, "epoch": 5150} {"train_loss": -26.920364379882812, "global_step": 427518, "epoch": 5150} {"train_loss": -27.19930076599121, "global_step": 427519, "epoch": 5150} {"train_loss": -26.92283058166504, "global_step": 427520, "epoch": 5150} {"train_loss": -26.103269577026367, "global_step": 427521, "epoch": 5150} {"train_loss": -24.332910537719727, "global_step": 427522, "epoch": 5150} {"train_loss": -21.69416618347168, "global_step": 427523, "epoch": 5150} {"train_loss": -25.537673950195312, "global_step": 427524, "epoch": 5150} {"train_loss": -25.544448852539062, "global_step": 427525, "epoch": 5150} {"train_loss": -25.951343536376953, "global_step": 427526, "epoch": 5150} {"train_loss": -25.589008331298828, "global_step": 427527, "epoch": 5150} {"train_loss": -26.092649459838867, "global_step": 427528, "epoch": 5150} {"train_loss": -25.399173736572266, "global_step": 427529, "epoch": 5150} {"train_loss": -25.910818099975586, "global_step": 427530, "epoch": 5150} {"train_loss": -26.489233016967773, "global_step": 427531, "epoch": 5150} {"train_loss": -26.568282460591877, "global_step": 427532, "epoch": 5150, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9545454545454546, "val_loss": 6809064.0} {"train_loss": -25.27342987060547, "global_step": 427533, "epoch": 5151} {"train_loss": -25.401657104492188, "global_step": 427534, "epoch": 5151} {"train_loss": -25.677154541015625, "global_step": 427535, "epoch": 5151} {"train_loss": -25.688989639282227, "global_step": 427536, "epoch": 5151} {"train_loss": -25.437917709350586, "global_step": 427537, "epoch": 5151} {"train_loss": -25.96004295349121, "global_step": 427538, "epoch": 5151} {"train_loss": -25.503398895263672, "global_step": 427539, "epoch": 5151} {"train_loss": -25.599807739257812, "global_step": 427540, "epoch": 5151} {"train_loss": -25.823644638061523, "global_step": 427541, "epoch": 5151} {"train_loss": -25.994705200195312, "global_step": 427542, "epoch": 5151} {"train_loss": -25.39885139465332, "global_step": 427543, "epoch": 5151} {"train_loss": -25.989667892456055, "global_step": 427544, "epoch": 5151} {"train_loss": -26.0385684967041, "global_step": 427545, "epoch": 5151} {"train_loss": -26.173864364624023, "global_step": 427546, "epoch": 5151} {"train_loss": -25.79508399963379, "global_step": 427547, "epoch": 5151} {"train_loss": -26.090463638305664, "global_step": 427548, "epoch": 5151} {"train_loss": -26.240625381469727, "global_step": 427549, "epoch": 5151} {"train_loss": -26.13350486755371, "global_step": 427550, "epoch": 5151} {"train_loss": -26.196882247924805, "global_step": 427551, "epoch": 5151} {"train_loss": -26.087051391601562, "global_step": 427552, "epoch": 5151} {"train_loss": -26.276229858398438, "global_step": 427553, "epoch": 5151} {"train_loss": -26.324426651000977, "global_step": 427554, "epoch": 5151} {"train_loss": -26.781347274780273, "global_step": 427555, "epoch": 5151} {"train_loss": -26.30478858947754, "global_step": 427556, "epoch": 5151} {"train_loss": -26.633169174194336, "global_step": 427557, "epoch": 5151} {"train_loss": -26.3626708984375, "global_step": 427558, "epoch": 5151} {"train_loss": -26.524658203125, "global_step": 427559, "epoch": 5151} {"train_loss": -26.622739791870117, "global_step": 427560, "epoch": 5151} {"train_loss": -26.366168975830078, "global_step": 427561, "epoch": 5151} {"train_loss": -26.224374771118164, "global_step": 427562, "epoch": 5151} {"train_loss": -26.6951904296875, "global_step": 427563, "epoch": 5151} {"train_loss": -26.640033721923828, "global_step": 427564, "epoch": 5151} {"train_loss": -26.619298934936523, "global_step": 427565, "epoch": 5151} {"train_loss": -26.86248207092285, "global_step": 427566, "epoch": 5151} {"train_loss": -27.126895904541016, "global_step": 427567, "epoch": 5151} {"train_loss": -26.884002685546875, "global_step": 427568, "epoch": 5151} {"train_loss": -26.847326278686523, "global_step": 427569, "epoch": 5151} {"train_loss": -26.718542098999023, "global_step": 427570, "epoch": 5151} {"train_loss": -26.703948974609375, "global_step": 427571, "epoch": 5151} {"train_loss": -26.925857543945312, "global_step": 427572, "epoch": 5151} {"train_loss": -26.762189865112305, "global_step": 427573, "epoch": 5151} {"train_loss": -26.74603271484375, "global_step": 427574, "epoch": 5151} {"train_loss": -26.99555015563965, "global_step": 427575, "epoch": 5151} {"train_loss": -27.182035446166992, "global_step": 427576, "epoch": 5151} {"train_loss": -26.71964454650879, "global_step": 427577, "epoch": 5151} {"train_loss": -26.816640853881836, "global_step": 427578, "epoch": 5151} {"train_loss": -27.0, "global_step": 427579, "epoch": 5151} {"train_loss": -26.906538009643555, "global_step": 427580, "epoch": 5151} {"train_loss": -26.563512802124023, "global_step": 427581, "epoch": 5151} {"train_loss": -26.912933349609375, "global_step": 427582, "epoch": 5151} {"train_loss": -27.078454971313477, "global_step": 427583, "epoch": 5151} {"train_loss": -26.786972045898438, "global_step": 427584, "epoch": 5151} {"train_loss": -27.018936157226562, "global_step": 427585, "epoch": 5151} {"train_loss": -26.761022567749023, "global_step": 427586, "epoch": 5151} {"train_loss": -26.75611686706543, "global_step": 427587, "epoch": 5151} {"train_loss": -26.696945190429688, "global_step": 427588, "epoch": 5151} {"train_loss": -27.084125518798828, "global_step": 427589, "epoch": 5151} {"train_loss": -27.063032150268555, "global_step": 427590, "epoch": 5151} {"train_loss": -27.09207534790039, "global_step": 427591, "epoch": 5151} {"train_loss": -27.124292373657227, "global_step": 427592, "epoch": 5151} {"train_loss": -27.07710075378418, "global_step": 427593, "epoch": 5151} {"train_loss": -26.724531173706055, "global_step": 427594, "epoch": 5151} {"train_loss": -26.96392822265625, "global_step": 427595, "epoch": 5151} {"train_loss": -27.132415771484375, "global_step": 427596, "epoch": 5151} {"train_loss": -27.21709632873535, "global_step": 427597, "epoch": 5151} {"train_loss": -26.574445724487305, "global_step": 427598, "epoch": 5151} {"train_loss": -27.083850860595703, "global_step": 427599, "epoch": 5151} {"train_loss": -27.1121826171875, "global_step": 427600, "epoch": 5151} {"train_loss": -26.981122970581055, "global_step": 427601, "epoch": 5151} {"train_loss": -26.87592124938965, "global_step": 427602, "epoch": 5151} {"train_loss": -26.923791885375977, "global_step": 427603, "epoch": 5151} {"train_loss": -27.083051681518555, "global_step": 427604, "epoch": 5151} {"train_loss": -26.556644439697266, "global_step": 427605, "epoch": 5151} {"train_loss": -26.7608585357666, "global_step": 427606, "epoch": 5151} {"train_loss": -26.462543487548828, "global_step": 427607, "epoch": 5151} {"train_loss": -26.397052764892578, "global_step": 427608, "epoch": 5151} {"train_loss": -26.597339630126953, "global_step": 427609, "epoch": 5151} {"train_loss": -27.300586700439453, "global_step": 427610, "epoch": 5151} {"train_loss": -26.647510528564453, "global_step": 427611, "epoch": 5151} {"train_loss": -26.849313735961914, "global_step": 427612, "epoch": 5151} {"train_loss": -27.060651779174805, "global_step": 427613, "epoch": 5151} {"train_loss": -26.79038429260254, "global_step": 427614, "epoch": 5151} {"train_loss": -26.576951452048426, "global_step": 427615, "epoch": 5151, "val_loss": 6803855.0} {"train_loss": -26.402088165283203, "global_step": 427616, "epoch": 5152} {"train_loss": -26.815832138061523, "global_step": 427617, "epoch": 5152} {"train_loss": -26.487201690673828, "global_step": 427618, "epoch": 5152} {"train_loss": -26.803054809570312, "global_step": 427619, "epoch": 5152} {"train_loss": -26.3638973236084, "global_step": 427620, "epoch": 5152} {"train_loss": -26.483678817749023, "global_step": 427621, "epoch": 5152} {"train_loss": -26.511808395385742, "global_step": 427622, "epoch": 5152} {"train_loss": -26.606184005737305, "global_step": 427623, "epoch": 5152} {"train_loss": -26.313556671142578, "global_step": 427624, "epoch": 5152} {"train_loss": -26.443464279174805, "global_step": 427625, "epoch": 5152} {"train_loss": -26.9007625579834, "global_step": 427626, "epoch": 5152} {"train_loss": -26.345870971679688, "global_step": 427627, "epoch": 5152} {"train_loss": -26.859222412109375, "global_step": 427628, "epoch": 5152} {"train_loss": -26.621307373046875, "global_step": 427629, "epoch": 5152} {"train_loss": -26.656620025634766, "global_step": 427630, "epoch": 5152} {"train_loss": -26.589984893798828, "global_step": 427631, "epoch": 5152} {"train_loss": -26.978347778320312, "global_step": 427632, "epoch": 5152} {"train_loss": -26.457544326782227, "global_step": 427633, "epoch": 5152} {"train_loss": -27.060470581054688, "global_step": 427634, "epoch": 5152} {"train_loss": -26.70863151550293, "global_step": 427635, "epoch": 5152} {"train_loss": -26.681257247924805, "global_step": 427636, "epoch": 5152} {"train_loss": -27.218725204467773, "global_step": 427637, "epoch": 5152} {"train_loss": -26.863691329956055, "global_step": 427638, "epoch": 5152} {"train_loss": -26.674421310424805, "global_step": 427639, "epoch": 5152} {"train_loss": -26.76556968688965, "global_step": 427640, "epoch": 5152} {"train_loss": -27.211505889892578, "global_step": 427641, "epoch": 5152} {"train_loss": -26.457361221313477, "global_step": 427642, "epoch": 5152} {"train_loss": -26.6583251953125, "global_step": 427643, "epoch": 5152} {"train_loss": -26.943334579467773, "global_step": 427644, "epoch": 5152} {"train_loss": -26.61844253540039, "global_step": 427645, "epoch": 5152} {"train_loss": -26.917621612548828, "global_step": 427646, "epoch": 5152} {"train_loss": -27.028778076171875, "global_step": 427647, "epoch": 5152} {"train_loss": -26.855010986328125, "global_step": 427648, "epoch": 5152} {"train_loss": -26.583173751831055, "global_step": 427649, "epoch": 5152} {"train_loss": -26.40277099609375, "global_step": 427650, "epoch": 5152} {"train_loss": -26.580411911010742, "global_step": 427651, "epoch": 5152} {"train_loss": -26.70237159729004, "global_step": 427652, "epoch": 5152} {"train_loss": -26.98048973083496, "global_step": 427653, "epoch": 5152} {"train_loss": -26.728240966796875, "global_step": 427654, "epoch": 5152} {"train_loss": -26.6533203125, "global_step": 427655, "epoch": 5152} {"train_loss": -26.741657257080078, "global_step": 427656, "epoch": 5152} {"train_loss": -26.88741111755371, "global_step": 427657, "epoch": 5152} {"train_loss": -26.734655380249023, "global_step": 427658, "epoch": 5152} {"train_loss": -27.185434341430664, "global_step": 427659, "epoch": 5152} {"train_loss": -26.782806396484375, "global_step": 427660, "epoch": 5152} {"train_loss": -27.0245361328125, "global_step": 427661, "epoch": 5152} {"train_loss": -26.86012840270996, "global_step": 427662, "epoch": 5152} {"train_loss": -26.6199951171875, "global_step": 427663, "epoch": 5152} {"train_loss": -27.022146224975586, "global_step": 427664, "epoch": 5152} {"train_loss": -26.692138671875, "global_step": 427665, "epoch": 5152} {"train_loss": -27.028167724609375, "global_step": 427666, "epoch": 5152} {"train_loss": -26.87751579284668, "global_step": 427667, "epoch": 5152} {"train_loss": -26.75276756286621, "global_step": 427668, "epoch": 5152} {"train_loss": -26.8297119140625, "global_step": 427669, "epoch": 5152} {"train_loss": -26.873199462890625, "global_step": 427670, "epoch": 5152} {"train_loss": -26.759984970092773, "global_step": 427671, "epoch": 5152} {"train_loss": -26.7694034576416, "global_step": 427672, "epoch": 5152} {"train_loss": -27.0006160736084, "global_step": 427673, "epoch": 5152} {"train_loss": -26.77197265625, "global_step": 427674, "epoch": 5152} {"train_loss": -26.683456420898438, "global_step": 427675, "epoch": 5152} {"train_loss": -27.042633056640625, "global_step": 427676, "epoch": 5152} {"train_loss": -27.321701049804688, "global_step": 427677, "epoch": 5152} {"train_loss": -26.438125610351562, "global_step": 427678, "epoch": 5152} {"train_loss": -26.588321685791016, "global_step": 427679, "epoch": 5152} {"train_loss": -26.87232780456543, "global_step": 427680, "epoch": 5152} {"train_loss": -27.04011344909668, "global_step": 427681, "epoch": 5152} {"train_loss": -27.098495483398438, "global_step": 427682, "epoch": 5152} {"train_loss": -26.410791397094727, "global_step": 427683, "epoch": 5152} {"train_loss": -26.92498779296875, "global_step": 427684, "epoch": 5152} {"train_loss": -27.048797607421875, "global_step": 427685, "epoch": 5152} {"train_loss": -26.945642471313477, "global_step": 427686, "epoch": 5152} {"train_loss": -27.167041778564453, "global_step": 427687, "epoch": 5152} {"train_loss": -27.002227783203125, "global_step": 427688, "epoch": 5152} {"train_loss": -27.254852294921875, "global_step": 427689, "epoch": 5152} {"train_loss": -26.70147132873535, "global_step": 427690, "epoch": 5152} {"train_loss": -26.698230743408203, "global_step": 427691, "epoch": 5152} {"train_loss": -27.19414710998535, "global_step": 427692, "epoch": 5152} {"train_loss": -26.9023380279541, "global_step": 427693, "epoch": 5152} {"train_loss": -26.97016716003418, "global_step": 427694, "epoch": 5152} {"train_loss": -26.826114654541016, "global_step": 427695, "epoch": 5152} {"train_loss": -27.049509048461914, "global_step": 427696, "epoch": 5152} {"train_loss": -27.05853843688965, "global_step": 427697, "epoch": 5152} {"train_loss": -26.800966883280193, "global_step": 427698, "epoch": 5152, "val_loss": 6870382.0} {"train_loss": -27.017309188842773, "global_step": 427699, "epoch": 5153} {"train_loss": -26.816421508789062, "global_step": 427700, "epoch": 5153} {"train_loss": -27.110986709594727, "global_step": 427701, "epoch": 5153} {"train_loss": -26.504831314086914, "global_step": 427702, "epoch": 5153} {"train_loss": -27.21527671813965, "global_step": 427703, "epoch": 5153} {"train_loss": -26.589710235595703, "global_step": 427704, "epoch": 5153} {"train_loss": -26.857868194580078, "global_step": 427705, "epoch": 5153} {"train_loss": -26.550922393798828, "global_step": 427706, "epoch": 5153} {"train_loss": -26.807861328125, "global_step": 427707, "epoch": 5153} {"train_loss": -26.779541015625, "global_step": 427708, "epoch": 5153} {"train_loss": -27.073978424072266, "global_step": 427709, "epoch": 5153} {"train_loss": -26.615192413330078, "global_step": 427710, "epoch": 5153} {"train_loss": -27.26801872253418, "global_step": 427711, "epoch": 5153} {"train_loss": -27.13423728942871, "global_step": 427712, "epoch": 5153} {"train_loss": -27.21417236328125, "global_step": 427713, "epoch": 5153} {"train_loss": -26.901107788085938, "global_step": 427714, "epoch": 5153} {"train_loss": -27.137739181518555, "global_step": 427715, "epoch": 5153} {"train_loss": -26.89866065979004, "global_step": 427716, "epoch": 5153} {"train_loss": -26.74982261657715, "global_step": 427717, "epoch": 5153} {"train_loss": -26.98939323425293, "global_step": 427718, "epoch": 5153} {"train_loss": -27.497638702392578, "global_step": 427719, "epoch": 5153} {"train_loss": -27.001535415649414, "global_step": 427720, "epoch": 5153} {"train_loss": -27.05706787109375, "global_step": 427721, "epoch": 5153} {"train_loss": -26.898202896118164, "global_step": 427722, "epoch": 5153} {"train_loss": -26.837934494018555, "global_step": 427723, "epoch": 5153} {"train_loss": -26.557493209838867, "global_step": 427724, "epoch": 5153} {"train_loss": -26.79201316833496, "global_step": 427725, "epoch": 5153} {"train_loss": -26.671560287475586, "global_step": 427726, "epoch": 5153} {"train_loss": -26.637121200561523, "global_step": 427727, "epoch": 5153} {"train_loss": -26.587194442749023, "global_step": 427728, "epoch": 5153} {"train_loss": -26.590351104736328, "global_step": 427729, "epoch": 5153} {"train_loss": -26.745319366455078, "global_step": 427730, "epoch": 5153} {"train_loss": -26.258960723876953, "global_step": 427731, "epoch": 5153} {"train_loss": -26.656991958618164, "global_step": 427732, "epoch": 5153} {"train_loss": -27.055408477783203, "global_step": 427733, "epoch": 5153} {"train_loss": -26.733234405517578, "global_step": 427734, "epoch": 5153} {"train_loss": -27.152606964111328, "global_step": 427735, "epoch": 5153} {"train_loss": -26.5180606842041, "global_step": 427736, "epoch": 5153} {"train_loss": -26.595117568969727, "global_step": 427737, "epoch": 5153} {"train_loss": -26.8031063079834, "global_step": 427738, "epoch": 5153} {"train_loss": -27.078083038330078, "global_step": 427739, "epoch": 5153} {"train_loss": -27.11396598815918, "global_step": 427740, "epoch": 5153} {"train_loss": -26.669925689697266, "global_step": 427741, "epoch": 5153} {"train_loss": -27.006595611572266, "global_step": 427742, "epoch": 5153} {"train_loss": -27.12151527404785, "global_step": 427743, "epoch": 5153} {"train_loss": -26.877639770507812, "global_step": 427744, "epoch": 5153} {"train_loss": -27.119787216186523, "global_step": 427745, "epoch": 5153} {"train_loss": -26.85980796813965, "global_step": 427746, "epoch": 5153} {"train_loss": -26.716867446899414, "global_step": 427747, "epoch": 5153} {"train_loss": -27.42361831665039, "global_step": 427748, "epoch": 5153} {"train_loss": -26.94477653503418, "global_step": 427749, "epoch": 5153} {"train_loss": -26.792449951171875, "global_step": 427750, "epoch": 5153} {"train_loss": -27.014123916625977, "global_step": 427751, "epoch": 5153} {"train_loss": -26.872314453125, "global_step": 427752, "epoch": 5153} {"train_loss": -26.923294067382812, "global_step": 427753, "epoch": 5153} {"train_loss": -26.945524215698242, "global_step": 427754, "epoch": 5153} {"train_loss": -26.722259521484375, "global_step": 427755, "epoch": 5153} {"train_loss": -26.47454261779785, "global_step": 427756, "epoch": 5153} {"train_loss": -26.580881118774414, "global_step": 427757, "epoch": 5153} {"train_loss": -26.506195068359375, "global_step": 427758, "epoch": 5153} {"train_loss": -27.548070907592773, "global_step": 427759, "epoch": 5153} {"train_loss": -27.081817626953125, "global_step": 427760, "epoch": 5153} {"train_loss": -26.65329360961914, "global_step": 427761, "epoch": 5153} {"train_loss": -26.877424240112305, "global_step": 427762, "epoch": 5153} {"train_loss": -26.93324089050293, "global_step": 427763, "epoch": 5153} {"train_loss": -26.93253517150879, "global_step": 427764, "epoch": 5153} {"train_loss": -26.92636489868164, "global_step": 427765, "epoch": 5153} {"train_loss": -26.81061363220215, "global_step": 427766, "epoch": 5153} {"train_loss": -26.781784057617188, "global_step": 427767, "epoch": 5153} {"train_loss": -26.944568634033203, "global_step": 427768, "epoch": 5153} {"train_loss": -27.226287841796875, "global_step": 427769, "epoch": 5153} {"train_loss": -26.930444717407227, "global_step": 427770, "epoch": 5153} {"train_loss": -26.99140739440918, "global_step": 427771, "epoch": 5153} {"train_loss": -26.794483184814453, "global_step": 427772, "epoch": 5153} {"train_loss": -26.77312660217285, "global_step": 427773, "epoch": 5153} {"train_loss": -26.775110244750977, "global_step": 427774, "epoch": 5153} {"train_loss": -27.058521270751953, "global_step": 427775, "epoch": 5153} {"train_loss": -26.899520874023438, "global_step": 427776, "epoch": 5153} {"train_loss": -26.847864151000977, "global_step": 427777, "epoch": 5153} {"train_loss": -26.768951416015625, "global_step": 427778, "epoch": 5153} {"train_loss": -26.848535537719727, "global_step": 427779, "epoch": 5153} {"train_loss": -27.037738800048828, "global_step": 427780, "epoch": 5153} {"train_loss": -26.883355313036816, "global_step": 427781, "epoch": 5153, "val_loss": 6951301.0} {"train_loss": -24.9409236907959, "global_step": 427782, "epoch": 5154} {"train_loss": -25.483444213867188, "global_step": 427783, "epoch": 5154} {"train_loss": -24.161624908447266, "global_step": 427784, "epoch": 5154} {"train_loss": -24.827112197875977, "global_step": 427785, "epoch": 5154} {"train_loss": -25.775373458862305, "global_step": 427786, "epoch": 5154} {"train_loss": -25.6588134765625, "global_step": 427787, "epoch": 5154} {"train_loss": -25.68477439880371, "global_step": 427788, "epoch": 5154} {"train_loss": -25.499197006225586, "global_step": 427789, "epoch": 5154} {"train_loss": -25.642744064331055, "global_step": 427790, "epoch": 5154} {"train_loss": -26.2676944732666, "global_step": 427791, "epoch": 5154} {"train_loss": -25.765127182006836, "global_step": 427792, "epoch": 5154} {"train_loss": -26.002161026000977, "global_step": 427793, "epoch": 5154} {"train_loss": -25.434532165527344, "global_step": 427794, "epoch": 5154} {"train_loss": -25.707937240600586, "global_step": 427795, "epoch": 5154} {"train_loss": -25.979887008666992, "global_step": 427796, "epoch": 5154} {"train_loss": -26.110218048095703, "global_step": 427797, "epoch": 5154} {"train_loss": -26.000410079956055, "global_step": 427798, "epoch": 5154} {"train_loss": -26.068044662475586, "global_step": 427799, "epoch": 5154} {"train_loss": -26.258193969726562, "global_step": 427800, "epoch": 5154} {"train_loss": -26.20879554748535, "global_step": 427801, "epoch": 5154} {"train_loss": -26.135761260986328, "global_step": 427802, "epoch": 5154} {"train_loss": -26.614755630493164, "global_step": 427803, "epoch": 5154} {"train_loss": -26.46832847595215, "global_step": 427804, "epoch": 5154} {"train_loss": -26.566028594970703, "global_step": 427805, "epoch": 5154} {"train_loss": -26.31245231628418, "global_step": 427806, "epoch": 5154} {"train_loss": -26.229572296142578, "global_step": 427807, "epoch": 5154} {"train_loss": -26.048328399658203, "global_step": 427808, "epoch": 5154} {"train_loss": -26.2740478515625, "global_step": 427809, "epoch": 5154} {"train_loss": -26.53096580505371, "global_step": 427810, "epoch": 5154} {"train_loss": -26.6119384765625, "global_step": 427811, "epoch": 5154} {"train_loss": -26.566669464111328, "global_step": 427812, "epoch": 5154} {"train_loss": -26.745349884033203, "global_step": 427813, "epoch": 5154} {"train_loss": -26.72806739807129, "global_step": 427814, "epoch": 5154} {"train_loss": -26.960205078125, "global_step": 427815, "epoch": 5154} {"train_loss": -26.70599937438965, "global_step": 427816, "epoch": 5154} {"train_loss": -26.711103439331055, "global_step": 427817, "epoch": 5154} {"train_loss": -26.63176918029785, "global_step": 427818, "epoch": 5154} {"train_loss": -26.609968185424805, "global_step": 427819, "epoch": 5154} {"train_loss": -26.517410278320312, "global_step": 427820, "epoch": 5154} {"train_loss": -26.80340003967285, "global_step": 427821, "epoch": 5154} {"train_loss": -26.84058952331543, "global_step": 427822, "epoch": 5154} {"train_loss": -26.843671798706055, "global_step": 427823, "epoch": 5154} {"train_loss": -26.803546905517578, "global_step": 427824, "epoch": 5154} {"train_loss": -26.6204891204834, "global_step": 427825, "epoch": 5154} {"train_loss": -27.251352310180664, "global_step": 427826, "epoch": 5154} {"train_loss": -26.498218536376953, "global_step": 427827, "epoch": 5154} {"train_loss": -26.709320068359375, "global_step": 427828, "epoch": 5154} {"train_loss": -26.674829483032227, "global_step": 427829, "epoch": 5154} {"train_loss": -26.62076187133789, "global_step": 427830, "epoch": 5154} {"train_loss": -27.30274772644043, "global_step": 427831, "epoch": 5154} {"train_loss": -26.470380783081055, "global_step": 427832, "epoch": 5154} {"train_loss": -26.90757179260254, "global_step": 427833, "epoch": 5154} {"train_loss": -26.61440086364746, "global_step": 427834, "epoch": 5154} {"train_loss": -26.6206111907959, "global_step": 427835, "epoch": 5154} {"train_loss": -26.7319278717041, "global_step": 427836, "epoch": 5154} {"train_loss": -26.77738380432129, "global_step": 427837, "epoch": 5154} {"train_loss": -26.673141479492188, "global_step": 427838, "epoch": 5154} {"train_loss": -26.81705093383789, "global_step": 427839, "epoch": 5154} {"train_loss": -26.858896255493164, "global_step": 427840, "epoch": 5154} {"train_loss": -27.013486862182617, "global_step": 427841, "epoch": 5154} {"train_loss": -26.9324893951416, "global_step": 427842, "epoch": 5154} {"train_loss": -26.7120418548584, "global_step": 427843, "epoch": 5154} {"train_loss": -26.75913429260254, "global_step": 427844, "epoch": 5154} {"train_loss": -26.7725830078125, "global_step": 427845, "epoch": 5154} {"train_loss": -27.0084285736084, "global_step": 427846, "epoch": 5154} {"train_loss": -27.25452995300293, "global_step": 427847, "epoch": 5154} {"train_loss": -27.00823974609375, "global_step": 427848, "epoch": 5154} {"train_loss": -27.2701473236084, "global_step": 427849, "epoch": 5154} {"train_loss": -27.0800838470459, "global_step": 427850, "epoch": 5154} {"train_loss": -27.197484970092773, "global_step": 427851, "epoch": 5154} {"train_loss": -27.016965866088867, "global_step": 427852, "epoch": 5154} {"train_loss": -27.088302612304688, "global_step": 427853, "epoch": 5154} {"train_loss": -27.079132080078125, "global_step": 427854, "epoch": 5154} {"train_loss": -27.334186553955078, "global_step": 427855, "epoch": 5154} {"train_loss": -27.017505645751953, "global_step": 427856, "epoch": 5154} {"train_loss": -26.85723304748535, "global_step": 427857, "epoch": 5154} {"train_loss": -26.95928955078125, "global_step": 427858, "epoch": 5154} {"train_loss": -27.030170440673828, "global_step": 427859, "epoch": 5154} {"train_loss": -26.91645622253418, "global_step": 427860, "epoch": 5154} {"train_loss": -27.247116088867188, "global_step": 427861, "epoch": 5154} {"train_loss": -26.8751163482666, "global_step": 427862, "epoch": 5154} {"train_loss": -27.096485137939453, "global_step": 427863, "epoch": 5154} {"train_loss": -26.521695010633355, "global_step": 427864, "epoch": 5154, "val_loss": 6997302.0} {"train_loss": -26.26961326599121, "global_step": 427865, "epoch": 5155} {"train_loss": -26.168317794799805, "global_step": 427866, "epoch": 5155} {"train_loss": -25.40238380432129, "global_step": 427867, "epoch": 5155} {"train_loss": -25.82876968383789, "global_step": 427868, "epoch": 5155} {"train_loss": -26.432147979736328, "global_step": 427869, "epoch": 5155} {"train_loss": -26.009174346923828, "global_step": 427870, "epoch": 5155} {"train_loss": -25.89102554321289, "global_step": 427871, "epoch": 5155} {"train_loss": -26.242414474487305, "global_step": 427872, "epoch": 5155} {"train_loss": -26.90460205078125, "global_step": 427873, "epoch": 5155} {"train_loss": -26.62283706665039, "global_step": 427874, "epoch": 5155} {"train_loss": -26.08206558227539, "global_step": 427875, "epoch": 5155} {"train_loss": -26.72332763671875, "global_step": 427876, "epoch": 5155} {"train_loss": -26.605701446533203, "global_step": 427877, "epoch": 5155} {"train_loss": -26.525959014892578, "global_step": 427878, "epoch": 5155} {"train_loss": -26.778167724609375, "global_step": 427879, "epoch": 5155} {"train_loss": -26.591262817382812, "global_step": 427880, "epoch": 5155} {"train_loss": -26.688962936401367, "global_step": 427881, "epoch": 5155} {"train_loss": -26.76934242248535, "global_step": 427882, "epoch": 5155} {"train_loss": -26.33642578125, "global_step": 427883, "epoch": 5155} {"train_loss": -26.62261962890625, "global_step": 427884, "epoch": 5155} {"train_loss": -26.583831787109375, "global_step": 427885, "epoch": 5155} {"train_loss": -26.627588272094727, "global_step": 427886, "epoch": 5155} {"train_loss": -26.508691787719727, "global_step": 427887, "epoch": 5155} {"train_loss": -26.7213134765625, "global_step": 427888, "epoch": 5155} {"train_loss": -26.780139923095703, "global_step": 427889, "epoch": 5155} {"train_loss": -26.594053268432617, "global_step": 427890, "epoch": 5155} {"train_loss": -26.731155395507812, "global_step": 427891, "epoch": 5155} {"train_loss": -26.944366455078125, "global_step": 427892, "epoch": 5155} {"train_loss": -26.838544845581055, "global_step": 427893, "epoch": 5155} {"train_loss": -27.094684600830078, "global_step": 427894, "epoch": 5155} {"train_loss": -27.269886016845703, "global_step": 427895, "epoch": 5155} {"train_loss": -27.121320724487305, "global_step": 427896, "epoch": 5155} {"train_loss": -26.96064567565918, "global_step": 427897, "epoch": 5155} {"train_loss": -26.759130477905273, "global_step": 427898, "epoch": 5155} {"train_loss": -26.723052978515625, "global_step": 427899, "epoch": 5155} {"train_loss": -27.254602432250977, "global_step": 427900, "epoch": 5155} {"train_loss": -26.917865753173828, "global_step": 427901, "epoch": 5155} {"train_loss": -26.582660675048828, "global_step": 427902, "epoch": 5155} {"train_loss": -27.104949951171875, "global_step": 427903, "epoch": 5155} {"train_loss": -26.91200828552246, "global_step": 427904, "epoch": 5155} {"train_loss": -26.943470001220703, "global_step": 427905, "epoch": 5155} {"train_loss": -27.108139038085938, "global_step": 427906, "epoch": 5155} {"train_loss": -26.671735763549805, "global_step": 427907, "epoch": 5155} {"train_loss": -26.669382095336914, "global_step": 427908, "epoch": 5155} {"train_loss": -26.892847061157227, "global_step": 427909, "epoch": 5155} {"train_loss": -26.364612579345703, "global_step": 427910, "epoch": 5155} {"train_loss": -26.86567497253418, "global_step": 427911, "epoch": 5155} {"train_loss": -27.18597412109375, "global_step": 427912, "epoch": 5155} {"train_loss": -26.847700119018555, "global_step": 427913, "epoch": 5155} {"train_loss": -26.77031898498535, "global_step": 427914, "epoch": 5155} {"train_loss": -26.784765243530273, "global_step": 427915, "epoch": 5155} {"train_loss": -26.74880027770996, "global_step": 427916, "epoch": 5155} {"train_loss": -27.4018611907959, "global_step": 427917, "epoch": 5155} {"train_loss": -26.911951065063477, "global_step": 427918, "epoch": 5155} {"train_loss": -26.615148544311523, "global_step": 427919, "epoch": 5155} {"train_loss": -26.917402267456055, "global_step": 427920, "epoch": 5155} {"train_loss": -27.084503173828125, "global_step": 427921, "epoch": 5155} {"train_loss": -27.116901397705078, "global_step": 427922, "epoch": 5155} {"train_loss": -26.99424171447754, "global_step": 427923, "epoch": 5155} {"train_loss": -26.639053344726562, "global_step": 427924, "epoch": 5155} {"train_loss": -26.847761154174805, "global_step": 427925, "epoch": 5155} {"train_loss": -26.858922958374023, "global_step": 427926, "epoch": 5155} {"train_loss": -26.706878662109375, "global_step": 427927, "epoch": 5155} {"train_loss": -26.94801139831543, "global_step": 427928, "epoch": 5155} {"train_loss": -26.491971969604492, "global_step": 427929, "epoch": 5155} {"train_loss": -26.777881622314453, "global_step": 427930, "epoch": 5155} {"train_loss": -27.115686416625977, "global_step": 427931, "epoch": 5155} {"train_loss": -27.103193283081055, "global_step": 427932, "epoch": 5155} {"train_loss": -26.62198829650879, "global_step": 427933, "epoch": 5155} {"train_loss": -26.718021392822266, "global_step": 427934, "epoch": 5155} {"train_loss": -26.831329345703125, "global_step": 427935, "epoch": 5155} {"train_loss": -26.93191909790039, "global_step": 427936, "epoch": 5155} {"train_loss": -26.68422508239746, "global_step": 427937, "epoch": 5155} {"train_loss": -26.613733291625977, "global_step": 427938, "epoch": 5155} {"train_loss": -27.230640411376953, "global_step": 427939, "epoch": 5155} {"train_loss": -27.460378646850586, "global_step": 427940, "epoch": 5155} {"train_loss": -27.006702423095703, "global_step": 427941, "epoch": 5155} {"train_loss": -26.918970108032227, "global_step": 427942, "epoch": 5155} {"train_loss": -26.8172607421875, "global_step": 427943, "epoch": 5155} {"train_loss": -26.858234405517578, "global_step": 427944, "epoch": 5155} {"train_loss": -26.900808334350586, "global_step": 427945, "epoch": 5155} {"train_loss": -26.7923526763916, "global_step": 427946, "epoch": 5155} {"train_loss": -26.73189399903079, "global_step": 427947, "epoch": 5155, "val_loss": 6906507.0} {"train_loss": -26.996816635131836, "global_step": 427948, "epoch": 5156} {"train_loss": -26.56201171875, "global_step": 427949, "epoch": 5156} {"train_loss": -26.652820587158203, "global_step": 427950, "epoch": 5156} {"train_loss": -26.335264205932617, "global_step": 427951, "epoch": 5156} {"train_loss": -26.465612411499023, "global_step": 427952, "epoch": 5156} {"train_loss": -26.733997344970703, "global_step": 427953, "epoch": 5156} {"train_loss": -26.617902755737305, "global_step": 427954, "epoch": 5156} {"train_loss": -26.71323013305664, "global_step": 427955, "epoch": 5156} {"train_loss": -26.634140014648438, "global_step": 427956, "epoch": 5156} {"train_loss": -26.280065536499023, "global_step": 427957, "epoch": 5156} {"train_loss": -26.47067642211914, "global_step": 427958, "epoch": 5156} {"train_loss": -26.227270126342773, "global_step": 427959, "epoch": 5156} {"train_loss": -26.30743408203125, "global_step": 427960, "epoch": 5156} {"train_loss": -25.989730834960938, "global_step": 427961, "epoch": 5156} {"train_loss": -26.46675682067871, "global_step": 427962, "epoch": 5156} {"train_loss": -26.14861488342285, "global_step": 427963, "epoch": 5156} {"train_loss": -26.295974731445312, "global_step": 427964, "epoch": 5156} {"train_loss": -26.782379150390625, "global_step": 427965, "epoch": 5156} {"train_loss": -26.577518463134766, "global_step": 427966, "epoch": 5156} {"train_loss": -26.66571044921875, "global_step": 427967, "epoch": 5156} {"train_loss": -26.60011100769043, "global_step": 427968, "epoch": 5156} {"train_loss": -26.454965591430664, "global_step": 427969, "epoch": 5156} {"train_loss": -26.641218185424805, "global_step": 427970, "epoch": 5156} {"train_loss": -26.4327449798584, "global_step": 427971, "epoch": 5156} {"train_loss": -26.6761531829834, "global_step": 427972, "epoch": 5156} {"train_loss": -26.86746597290039, "global_step": 427973, "epoch": 5156} {"train_loss": -26.503881454467773, "global_step": 427974, "epoch": 5156} {"train_loss": -26.837417602539062, "global_step": 427975, "epoch": 5156} {"train_loss": -26.58802604675293, "global_step": 427976, "epoch": 5156} {"train_loss": -27.04932975769043, "global_step": 427977, "epoch": 5156} {"train_loss": -26.667129516601562, "global_step": 427978, "epoch": 5156} {"train_loss": -26.814971923828125, "global_step": 427979, "epoch": 5156} {"train_loss": -27.01828956604004, "global_step": 427980, "epoch": 5156} {"train_loss": -26.70945167541504, "global_step": 427981, "epoch": 5156} {"train_loss": -26.9300594329834, "global_step": 427982, "epoch": 5156} {"train_loss": -26.639404296875, "global_step": 427983, "epoch": 5156} {"train_loss": -26.850223541259766, "global_step": 427984, "epoch": 5156} {"train_loss": -27.00373649597168, "global_step": 427985, "epoch": 5156} {"train_loss": -26.971792221069336, "global_step": 427986, "epoch": 5156} {"train_loss": -26.96253776550293, "global_step": 427987, "epoch": 5156} {"train_loss": -26.728940963745117, "global_step": 427988, "epoch": 5156} {"train_loss": -26.81267738342285, "global_step": 427989, "epoch": 5156} {"train_loss": -26.493255615234375, "global_step": 427990, "epoch": 5156} {"train_loss": -26.894384384155273, "global_step": 427991, "epoch": 5156} {"train_loss": -26.804534912109375, "global_step": 427992, "epoch": 5156} {"train_loss": -26.973846435546875, "global_step": 427993, "epoch": 5156} {"train_loss": -27.155668258666992, "global_step": 427994, "epoch": 5156} {"train_loss": -26.825536727905273, "global_step": 427995, "epoch": 5156} {"train_loss": -26.687408447265625, "global_step": 427996, "epoch": 5156} {"train_loss": -27.069976806640625, "global_step": 427997, "epoch": 5156} {"train_loss": -26.715656280517578, "global_step": 427998, "epoch": 5156} {"train_loss": -26.692975997924805, "global_step": 427999, "epoch": 5156} {"train_loss": -26.696395874023438, "global_step": 428000, "epoch": 5156} {"train_loss": -26.644392013549805, "global_step": 428001, "epoch": 5156} {"train_loss": -27.033405303955078, "global_step": 428002, "epoch": 5156} {"train_loss": -26.835086822509766, "global_step": 428003, "epoch": 5156} {"train_loss": -26.53016471862793, "global_step": 428004, "epoch": 5156} {"train_loss": -26.692163467407227, "global_step": 428005, "epoch": 5156} {"train_loss": -26.775257110595703, "global_step": 428006, "epoch": 5156} {"train_loss": -26.995817184448242, "global_step": 428007, "epoch": 5156} {"train_loss": -26.802154541015625, "global_step": 428008, "epoch": 5156} {"train_loss": -26.984731674194336, "global_step": 428009, "epoch": 5156} {"train_loss": -26.57139015197754, "global_step": 428010, "epoch": 5156} {"train_loss": -26.545978546142578, "global_step": 428011, "epoch": 5156} {"train_loss": -26.83330726623535, "global_step": 428012, "epoch": 5156} {"train_loss": -26.974119186401367, "global_step": 428013, "epoch": 5156} {"train_loss": -26.684274673461914, "global_step": 428014, "epoch": 5156} {"train_loss": -26.896574020385742, "global_step": 428015, "epoch": 5156} {"train_loss": -26.9175968170166, "global_step": 428016, "epoch": 5156} {"train_loss": -26.582202911376953, "global_step": 428017, "epoch": 5156} {"train_loss": -26.844079971313477, "global_step": 428018, "epoch": 5156} {"train_loss": -27.12335777282715, "global_step": 428019, "epoch": 5156} {"train_loss": -26.790653228759766, "global_step": 428020, "epoch": 5156} {"train_loss": -26.833892822265625, "global_step": 428021, "epoch": 5156} {"train_loss": -26.995649337768555, "global_step": 428022, "epoch": 5156} {"train_loss": -27.12262535095215, "global_step": 428023, "epoch": 5156} {"train_loss": -27.17597770690918, "global_step": 428024, "epoch": 5156} {"train_loss": -27.204315185546875, "global_step": 428025, "epoch": 5156} {"train_loss": -27.075153350830078, "global_step": 428026, "epoch": 5156} {"train_loss": -27.17873191833496, "global_step": 428027, "epoch": 5156} {"train_loss": -26.977346420288086, "global_step": 428028, "epoch": 5156} {"train_loss": -27.103845596313477, "global_step": 428029, "epoch": 5156} {"train_loss": -26.771438276911358, "global_step": 428030, "epoch": 5156, "val_loss": 7043538.0} {"train_loss": -26.297163009643555, "global_step": 428031, "epoch": 5157} {"train_loss": -26.507001876831055, "global_step": 428032, "epoch": 5157} {"train_loss": -26.47837257385254, "global_step": 428033, "epoch": 5157} {"train_loss": -26.432096481323242, "global_step": 428034, "epoch": 5157} {"train_loss": -26.447235107421875, "global_step": 428035, "epoch": 5157} {"train_loss": -26.55584716796875, "global_step": 428036, "epoch": 5157} {"train_loss": -26.30224609375, "global_step": 428037, "epoch": 5157} {"train_loss": -26.895238876342773, "global_step": 428038, "epoch": 5157} {"train_loss": -26.522369384765625, "global_step": 428039, "epoch": 5157} {"train_loss": -26.501127243041992, "global_step": 428040, "epoch": 5157} {"train_loss": -26.225971221923828, "global_step": 428041, "epoch": 5157} {"train_loss": -26.688589096069336, "global_step": 428042, "epoch": 5157} {"train_loss": -26.329267501831055, "global_step": 428043, "epoch": 5157} {"train_loss": -25.844989776611328, "global_step": 428044, "epoch": 5157} {"train_loss": -25.941680908203125, "global_step": 428045, "epoch": 5157} {"train_loss": -26.688343048095703, "global_step": 428046, "epoch": 5157} {"train_loss": -26.276578903198242, "global_step": 428047, "epoch": 5157} {"train_loss": -26.492761611938477, "global_step": 428048, "epoch": 5157} {"train_loss": -26.293420791625977, "global_step": 428049, "epoch": 5157} {"train_loss": -26.848779678344727, "global_step": 428050, "epoch": 5157} {"train_loss": -26.39558219909668, "global_step": 428051, "epoch": 5157} {"train_loss": -26.3221435546875, "global_step": 428052, "epoch": 5157} {"train_loss": -26.547346115112305, "global_step": 428053, "epoch": 5157} {"train_loss": -26.648473739624023, "global_step": 428054, "epoch": 5157} {"train_loss": -26.337690353393555, "global_step": 428055, "epoch": 5157} {"train_loss": -26.3294734954834, "global_step": 428056, "epoch": 5157} {"train_loss": -27.048263549804688, "global_step": 428057, "epoch": 5157} {"train_loss": -26.134510040283203, "global_step": 428058, "epoch": 5157} {"train_loss": -26.08637046813965, "global_step": 428059, "epoch": 5157} {"train_loss": -26.984899520874023, "global_step": 428060, "epoch": 5157} {"train_loss": -26.43512535095215, "global_step": 428061, "epoch": 5157} {"train_loss": -26.779773712158203, "global_step": 428062, "epoch": 5157} {"train_loss": -26.370519638061523, "global_step": 428063, "epoch": 5157} {"train_loss": -26.507394790649414, "global_step": 428064, "epoch": 5157} {"train_loss": -26.68979263305664, "global_step": 428065, "epoch": 5157} {"train_loss": -26.366153717041016, "global_step": 428066, "epoch": 5157} {"train_loss": -26.98213005065918, "global_step": 428067, "epoch": 5157} {"train_loss": -26.480026245117188, "global_step": 428068, "epoch": 5157} {"train_loss": -26.9377384185791, "global_step": 428069, "epoch": 5157} {"train_loss": -26.80322265625, "global_step": 428070, "epoch": 5157} {"train_loss": -26.88387107849121, "global_step": 428071, "epoch": 5157} {"train_loss": -26.50946044921875, "global_step": 428072, "epoch": 5157} {"train_loss": -26.55035972595215, "global_step": 428073, "epoch": 5157} {"train_loss": -26.754413604736328, "global_step": 428074, "epoch": 5157} {"train_loss": -26.881494522094727, "global_step": 428075, "epoch": 5157} {"train_loss": -26.529937744140625, "global_step": 428076, "epoch": 5157} {"train_loss": -26.8178653717041, "global_step": 428077, "epoch": 5157} {"train_loss": -26.673450469970703, "global_step": 428078, "epoch": 5157} {"train_loss": -26.61026382446289, "global_step": 428079, "epoch": 5157} {"train_loss": -26.989633560180664, "global_step": 428080, "epoch": 5157} {"train_loss": -26.706018447875977, "global_step": 428081, "epoch": 5157} {"train_loss": -26.799793243408203, "global_step": 428082, "epoch": 5157} {"train_loss": -26.63104248046875, "global_step": 428083, "epoch": 5157} {"train_loss": -27.143783569335938, "global_step": 428084, "epoch": 5157} {"train_loss": -26.93263053894043, "global_step": 428085, "epoch": 5157} {"train_loss": -26.8869686126709, "global_step": 428086, "epoch": 5157} {"train_loss": -27.0498046875, "global_step": 428087, "epoch": 5157} {"train_loss": -27.224889755249023, "global_step": 428088, "epoch": 5157} {"train_loss": -27.010421752929688, "global_step": 428089, "epoch": 5157} {"train_loss": -27.38718032836914, "global_step": 428090, "epoch": 5157} {"train_loss": -26.729719161987305, "global_step": 428091, "epoch": 5157} {"train_loss": -26.940937042236328, "global_step": 428092, "epoch": 5157} {"train_loss": -26.689441680908203, "global_step": 428093, "epoch": 5157} {"train_loss": -26.93316078186035, "global_step": 428094, "epoch": 5157} {"train_loss": -26.54276466369629, "global_step": 428095, "epoch": 5157} {"train_loss": -27.24342918395996, "global_step": 428096, "epoch": 5157} {"train_loss": -27.15939712524414, "global_step": 428097, "epoch": 5157} {"train_loss": -26.93084144592285, "global_step": 428098, "epoch": 5157} {"train_loss": -26.861255645751953, "global_step": 428099, "epoch": 5157} {"train_loss": -27.051950454711914, "global_step": 428100, "epoch": 5157} {"train_loss": -27.18781089782715, "global_step": 428101, "epoch": 5157} {"train_loss": -27.043689727783203, "global_step": 428102, "epoch": 5157} {"train_loss": -26.92534828186035, "global_step": 428103, "epoch": 5157} {"train_loss": -26.892908096313477, "global_step": 428104, "epoch": 5157} {"train_loss": -26.846206665039062, "global_step": 428105, "epoch": 5157} {"train_loss": -25.919635772705078, "global_step": 428106, "epoch": 5157} {"train_loss": -25.387544631958008, "global_step": 428107, "epoch": 5157} {"train_loss": -25.363561630249023, "global_step": 428108, "epoch": 5157} {"train_loss": -26.964879989624023, "global_step": 428109, "epoch": 5157} {"train_loss": -26.258581161499023, "global_step": 428110, "epoch": 5157} {"train_loss": -26.506689071655273, "global_step": 428111, "epoch": 5157} {"train_loss": -26.669891357421875, "global_step": 428112, "epoch": 5157} {"train_loss": -26.632418758897895, "global_step": 428113, "epoch": 5157, "val_loss": 6937856.0} {"train_loss": -25.369983673095703, "global_step": 428114, "epoch": 5158} {"train_loss": -26.248754501342773, "global_step": 428115, "epoch": 5158} {"train_loss": -26.27650260925293, "global_step": 428116, "epoch": 5158} {"train_loss": -25.874374389648438, "global_step": 428117, "epoch": 5158} {"train_loss": -26.460824966430664, "global_step": 428118, "epoch": 5158} {"train_loss": -25.80787467956543, "global_step": 428119, "epoch": 5158} {"train_loss": -25.989276885986328, "global_step": 428120, "epoch": 5158} {"train_loss": -26.438840866088867, "global_step": 428121, "epoch": 5158} {"train_loss": -25.744596481323242, "global_step": 428122, "epoch": 5158} {"train_loss": -26.041528701782227, "global_step": 428123, "epoch": 5158} {"train_loss": -26.373945236206055, "global_step": 428124, "epoch": 5158} {"train_loss": -26.32204246520996, "global_step": 428125, "epoch": 5158} {"train_loss": -25.93389320373535, "global_step": 428126, "epoch": 5158} {"train_loss": -26.15606689453125, "global_step": 428127, "epoch": 5158} {"train_loss": -26.559701919555664, "global_step": 428128, "epoch": 5158} {"train_loss": -26.30670166015625, "global_step": 428129, "epoch": 5158} {"train_loss": -26.19036865234375, "global_step": 428130, "epoch": 5158} {"train_loss": -26.488183975219727, "global_step": 428131, "epoch": 5158} {"train_loss": -26.550113677978516, "global_step": 428132, "epoch": 5158} {"train_loss": -26.480499267578125, "global_step": 428133, "epoch": 5158} {"train_loss": -26.698429107666016, "global_step": 428134, "epoch": 5158} {"train_loss": -26.21221351623535, "global_step": 428135, "epoch": 5158} {"train_loss": -26.71558952331543, "global_step": 428136, "epoch": 5158} {"train_loss": -26.58741569519043, "global_step": 428137, "epoch": 5158} {"train_loss": -26.192188262939453, "global_step": 428138, "epoch": 5158} {"train_loss": -26.48208999633789, "global_step": 428139, "epoch": 5158} {"train_loss": -26.5791072845459, "global_step": 428140, "epoch": 5158} {"train_loss": -26.6250057220459, "global_step": 428141, "epoch": 5158} {"train_loss": -26.747034072875977, "global_step": 428142, "epoch": 5158} {"train_loss": -26.720111846923828, "global_step": 428143, "epoch": 5158} {"train_loss": -26.869842529296875, "global_step": 428144, "epoch": 5158} {"train_loss": -26.86890983581543, "global_step": 428145, "epoch": 5158} {"train_loss": -26.8054141998291, "global_step": 428146, "epoch": 5158} {"train_loss": -26.869049072265625, "global_step": 428147, "epoch": 5158} {"train_loss": -26.686487197875977, "global_step": 428148, "epoch": 5158} {"train_loss": -26.648900985717773, "global_step": 428149, "epoch": 5158} {"train_loss": -26.635986328125, "global_step": 428150, "epoch": 5158} {"train_loss": -26.943967819213867, "global_step": 428151, "epoch": 5158} {"train_loss": -26.648529052734375, "global_step": 428152, "epoch": 5158} {"train_loss": -26.79638671875, "global_step": 428153, "epoch": 5158} {"train_loss": -26.618412017822266, "global_step": 428154, "epoch": 5158} {"train_loss": -26.947912216186523, "global_step": 428155, "epoch": 5158} {"train_loss": -26.65302085876465, "global_step": 428156, "epoch": 5158} {"train_loss": -26.74148941040039, "global_step": 428157, "epoch": 5158} {"train_loss": -26.91761589050293, "global_step": 428158, "epoch": 5158} {"train_loss": -27.016345977783203, "global_step": 428159, "epoch": 5158} {"train_loss": -26.975439071655273, "global_step": 428160, "epoch": 5158} {"train_loss": -26.777576446533203, "global_step": 428161, "epoch": 5158} {"train_loss": -26.973068237304688, "global_step": 428162, "epoch": 5158} {"train_loss": -26.836063385009766, "global_step": 428163, "epoch": 5158} {"train_loss": -26.875751495361328, "global_step": 428164, "epoch": 5158} {"train_loss": -26.742359161376953, "global_step": 428165, "epoch": 5158} {"train_loss": -27.115076065063477, "global_step": 428166, "epoch": 5158} {"train_loss": -27.049570083618164, "global_step": 428167, "epoch": 5158} {"train_loss": -27.06357192993164, "global_step": 428168, "epoch": 5158} {"train_loss": -27.08205223083496, "global_step": 428169, "epoch": 5158} {"train_loss": -26.98206901550293, "global_step": 428170, "epoch": 5158} {"train_loss": -27.24824333190918, "global_step": 428171, "epoch": 5158} {"train_loss": -27.029987335205078, "global_step": 428172, "epoch": 5158} {"train_loss": -27.056516647338867, "global_step": 428173, "epoch": 5158} {"train_loss": -27.134313583374023, "global_step": 428174, "epoch": 5158} {"train_loss": -26.89404296875, "global_step": 428175, "epoch": 5158} {"train_loss": -27.242523193359375, "global_step": 428176, "epoch": 5158} {"train_loss": -27.140302658081055, "global_step": 428177, "epoch": 5158} {"train_loss": -27.166427612304688, "global_step": 428178, "epoch": 5158} {"train_loss": -27.14105224609375, "global_step": 428179, "epoch": 5158} {"train_loss": -26.600784301757812, "global_step": 428180, "epoch": 5158} {"train_loss": -26.25775718688965, "global_step": 428181, "epoch": 5158} {"train_loss": -25.8956298828125, "global_step": 428182, "epoch": 5158} {"train_loss": -26.064899444580078, "global_step": 428183, "epoch": 5158} {"train_loss": -26.8424129486084, "global_step": 428184, "epoch": 5158} {"train_loss": -27.005218505859375, "global_step": 428185, "epoch": 5158} {"train_loss": -26.593000411987305, "global_step": 428186, "epoch": 5158} {"train_loss": -26.55006217956543, "global_step": 428187, "epoch": 5158} {"train_loss": -26.741113662719727, "global_step": 428188, "epoch": 5158} {"train_loss": -26.634693145751953, "global_step": 428189, "epoch": 5158} {"train_loss": -26.6378231048584, "global_step": 428190, "epoch": 5158} {"train_loss": -26.653982162475586, "global_step": 428191, "epoch": 5158} {"train_loss": -26.846158981323242, "global_step": 428192, "epoch": 5158} {"train_loss": -26.608840942382812, "global_step": 428193, "epoch": 5158} {"train_loss": -26.6519718170166, "global_step": 428194, "epoch": 5158} {"train_loss": -26.96408462524414, "global_step": 428195, "epoch": 5158} {"train_loss": -26.62554014734475, "global_step": 428196, "epoch": 5158, "val_loss": 6986008.5} {"train_loss": -25.97723960876465, "global_step": 428197, "epoch": 5159} {"train_loss": -26.28066062927246, "global_step": 428198, "epoch": 5159} {"train_loss": -26.4763240814209, "global_step": 428199, "epoch": 5159} {"train_loss": -26.113794326782227, "global_step": 428200, "epoch": 5159} {"train_loss": -26.575973510742188, "global_step": 428201, "epoch": 5159} {"train_loss": -26.315601348876953, "global_step": 428202, "epoch": 5159} {"train_loss": -26.768041610717773, "global_step": 428203, "epoch": 5159} {"train_loss": -26.289770126342773, "global_step": 428204, "epoch": 5159} {"train_loss": -26.4801025390625, "global_step": 428205, "epoch": 5159} {"train_loss": -26.719482421875, "global_step": 428206, "epoch": 5159} {"train_loss": -26.33894157409668, "global_step": 428207, "epoch": 5159} {"train_loss": -26.815576553344727, "global_step": 428208, "epoch": 5159} {"train_loss": -26.532094955444336, "global_step": 428209, "epoch": 5159} {"train_loss": -26.1994571685791, "global_step": 428210, "epoch": 5159} {"train_loss": -26.7447509765625, "global_step": 428211, "epoch": 5159} {"train_loss": -26.761993408203125, "global_step": 428212, "epoch": 5159} {"train_loss": -26.91839027404785, "global_step": 428213, "epoch": 5159} {"train_loss": -26.25526237487793, "global_step": 428214, "epoch": 5159} {"train_loss": -26.714014053344727, "global_step": 428215, "epoch": 5159} {"train_loss": -27.165151596069336, "global_step": 428216, "epoch": 5159} {"train_loss": -27.163436889648438, "global_step": 428217, "epoch": 5159} {"train_loss": -26.5465087890625, "global_step": 428218, "epoch": 5159} {"train_loss": -26.739805221557617, "global_step": 428219, "epoch": 5159} {"train_loss": -26.60854148864746, "global_step": 428220, "epoch": 5159} {"train_loss": -26.908594131469727, "global_step": 428221, "epoch": 5159} {"train_loss": -27.121509552001953, "global_step": 428222, "epoch": 5159} {"train_loss": -26.810895919799805, "global_step": 428223, "epoch": 5159} {"train_loss": -26.727567672729492, "global_step": 428224, "epoch": 5159} {"train_loss": -26.97381019592285, "global_step": 428225, "epoch": 5159} {"train_loss": -26.763507843017578, "global_step": 428226, "epoch": 5159} {"train_loss": -27.082050323486328, "global_step": 428227, "epoch": 5159} {"train_loss": -27.13897132873535, "global_step": 428228, "epoch": 5159} {"train_loss": -27.233243942260742, "global_step": 428229, "epoch": 5159} {"train_loss": -26.610883712768555, "global_step": 428230, "epoch": 5159} {"train_loss": -26.754240036010742, "global_step": 428231, "epoch": 5159} {"train_loss": -26.897001266479492, "global_step": 428232, "epoch": 5159} {"train_loss": -27.2222957611084, "global_step": 428233, "epoch": 5159} {"train_loss": -26.93356704711914, "global_step": 428234, "epoch": 5159} {"train_loss": -27.11812400817871, "global_step": 428235, "epoch": 5159} {"train_loss": -26.904687881469727, "global_step": 428236, "epoch": 5159} {"train_loss": -26.800825119018555, "global_step": 428237, "epoch": 5159} {"train_loss": -27.38666343688965, "global_step": 428238, "epoch": 5159} {"train_loss": -27.02754783630371, "global_step": 428239, "epoch": 5159} {"train_loss": -27.07200050354004, "global_step": 428240, "epoch": 5159} {"train_loss": -27.09421157836914, "global_step": 428241, "epoch": 5159} {"train_loss": -26.96002769470215, "global_step": 428242, "epoch": 5159} {"train_loss": -27.067102432250977, "global_step": 428243, "epoch": 5159} {"train_loss": -26.9890079498291, "global_step": 428244, "epoch": 5159} {"train_loss": -27.12702751159668, "global_step": 428245, "epoch": 5159} {"train_loss": -27.32301139831543, "global_step": 428246, "epoch": 5159} {"train_loss": -26.872236251831055, "global_step": 428247, "epoch": 5159} {"train_loss": -26.63924217224121, "global_step": 428248, "epoch": 5159} {"train_loss": -26.688648223876953, "global_step": 428249, "epoch": 5159} {"train_loss": -26.61504554748535, "global_step": 428250, "epoch": 5159} {"train_loss": -26.490564346313477, "global_step": 428251, "epoch": 5159} {"train_loss": -26.4340763092041, "global_step": 428252, "epoch": 5159} {"train_loss": -27.170862197875977, "global_step": 428253, "epoch": 5159} {"train_loss": -27.276514053344727, "global_step": 428254, "epoch": 5159} {"train_loss": -27.056684494018555, "global_step": 428255, "epoch": 5159} {"train_loss": -26.69416618347168, "global_step": 428256, "epoch": 5159} {"train_loss": -26.642868041992188, "global_step": 428257, "epoch": 5159} {"train_loss": -26.478864669799805, "global_step": 428258, "epoch": 5159} {"train_loss": -26.814289093017578, "global_step": 428259, "epoch": 5159} {"train_loss": -27.147916793823242, "global_step": 428260, "epoch": 5159} {"train_loss": -26.749191284179688, "global_step": 428261, "epoch": 5159} {"train_loss": -26.788593292236328, "global_step": 428262, "epoch": 5159} {"train_loss": -26.398908615112305, "global_step": 428263, "epoch": 5159} {"train_loss": -26.61663818359375, "global_step": 428264, "epoch": 5159} {"train_loss": -27.275562286376953, "global_step": 428265, "epoch": 5159} {"train_loss": -26.88041114807129, "global_step": 428266, "epoch": 5159} {"train_loss": -26.975061416625977, "global_step": 428267, "epoch": 5159} {"train_loss": -26.96490478515625, "global_step": 428268, "epoch": 5159} {"train_loss": -26.819814682006836, "global_step": 428269, "epoch": 5159} {"train_loss": -27.023557662963867, "global_step": 428270, "epoch": 5159} {"train_loss": -27.06632423400879, "global_step": 428271, "epoch": 5159} {"train_loss": -27.06211280822754, "global_step": 428272, "epoch": 5159} {"train_loss": -26.933502197265625, "global_step": 428273, "epoch": 5159} {"train_loss": -27.015247344970703, "global_step": 428274, "epoch": 5159} {"train_loss": -26.62482261657715, "global_step": 428275, "epoch": 5159} {"train_loss": -26.679418563842773, "global_step": 428276, "epoch": 5159} {"train_loss": -26.851028442382812, "global_step": 428277, "epoch": 5159} {"train_loss": -26.849842071533203, "global_step": 428278, "epoch": 5159} {"train_loss": -26.814078641225056, "global_step": 428279, "epoch": 5159, "val_loss": 6921614.0} {"train_loss": -27.1743221282959, "global_step": 428280, "epoch": 5160} {"train_loss": -26.200376510620117, "global_step": 428281, "epoch": 5160} {"train_loss": -26.495532989501953, "global_step": 428282, "epoch": 5160} {"train_loss": -26.481359481811523, "global_step": 428283, "epoch": 5160} {"train_loss": -26.53985595703125, "global_step": 428284, "epoch": 5160} {"train_loss": -27.03480339050293, "global_step": 428285, "epoch": 5160} {"train_loss": -26.595752716064453, "global_step": 428286, "epoch": 5160} {"train_loss": -26.40753173828125, "global_step": 428287, "epoch": 5160} {"train_loss": -26.82038688659668, "global_step": 428288, "epoch": 5160} {"train_loss": -26.668710708618164, "global_step": 428289, "epoch": 5160} {"train_loss": -27.080413818359375, "global_step": 428290, "epoch": 5160} {"train_loss": -26.72174072265625, "global_step": 428291, "epoch": 5160} {"train_loss": -26.767423629760742, "global_step": 428292, "epoch": 5160} {"train_loss": -26.681806564331055, "global_step": 428293, "epoch": 5160} {"train_loss": -26.499608993530273, "global_step": 428294, "epoch": 5160} {"train_loss": -26.83147621154785, "global_step": 428295, "epoch": 5160} {"train_loss": -26.742385864257812, "global_step": 428296, "epoch": 5160} {"train_loss": -27.04947280883789, "global_step": 428297, "epoch": 5160} {"train_loss": -27.038293838500977, "global_step": 428298, "epoch": 5160} {"train_loss": -26.77095603942871, "global_step": 428299, "epoch": 5160} {"train_loss": -26.661331176757812, "global_step": 428300, "epoch": 5160} {"train_loss": -26.834381103515625, "global_step": 428301, "epoch": 5160} {"train_loss": -26.713048934936523, "global_step": 428302, "epoch": 5160} {"train_loss": -26.616718292236328, "global_step": 428303, "epoch": 5160} {"train_loss": -26.443357467651367, "global_step": 428304, "epoch": 5160} {"train_loss": -27.022489547729492, "global_step": 428305, "epoch": 5160} {"train_loss": -26.6794490814209, "global_step": 428306, "epoch": 5160} {"train_loss": -26.99704933166504, "global_step": 428307, "epoch": 5160} {"train_loss": -26.865467071533203, "global_step": 428308, "epoch": 5160} {"train_loss": -27.093536376953125, "global_step": 428309, "epoch": 5160} {"train_loss": -26.994556427001953, "global_step": 428310, "epoch": 5160} {"train_loss": -26.438772201538086, "global_step": 428311, "epoch": 5160} {"train_loss": -26.966693878173828, "global_step": 428312, "epoch": 5160} {"train_loss": -27.32159423828125, "global_step": 428313, "epoch": 5160} {"train_loss": -26.64837646484375, "global_step": 428314, "epoch": 5160} {"train_loss": -26.5521240234375, "global_step": 428315, "epoch": 5160} {"train_loss": -27.040746688842773, "global_step": 428316, "epoch": 5160} {"train_loss": -26.809497833251953, "global_step": 428317, "epoch": 5160} {"train_loss": -26.9432373046875, "global_step": 428318, "epoch": 5160} {"train_loss": -26.71009635925293, "global_step": 428319, "epoch": 5160} {"train_loss": -26.827850341796875, "global_step": 428320, "epoch": 5160} {"train_loss": -27.008813858032227, "global_step": 428321, "epoch": 5160} {"train_loss": -26.906530380249023, "global_step": 428322, "epoch": 5160} {"train_loss": -27.10642433166504, "global_step": 428323, "epoch": 5160} {"train_loss": -27.03187370300293, "global_step": 428324, "epoch": 5160} {"train_loss": -27.2459659576416, "global_step": 428325, "epoch": 5160} {"train_loss": -26.669483184814453, "global_step": 428326, "epoch": 5160} {"train_loss": -27.557111740112305, "global_step": 428327, "epoch": 5160} {"train_loss": -27.247039794921875, "global_step": 428328, "epoch": 5160} {"train_loss": -26.726825714111328, "global_step": 428329, "epoch": 5160} {"train_loss": -27.009138107299805, "global_step": 428330, "epoch": 5160} {"train_loss": -27.075979232788086, "global_step": 428331, "epoch": 5160} {"train_loss": -27.18531608581543, "global_step": 428332, "epoch": 5160} {"train_loss": -27.037988662719727, "global_step": 428333, "epoch": 5160} {"train_loss": -26.77497673034668, "global_step": 428334, "epoch": 5160} {"train_loss": -26.843576431274414, "global_step": 428335, "epoch": 5160} {"train_loss": -26.825403213500977, "global_step": 428336, "epoch": 5160} {"train_loss": -26.37548828125, "global_step": 428337, "epoch": 5160} {"train_loss": -26.304128646850586, "global_step": 428338, "epoch": 5160} {"train_loss": -25.707977294921875, "global_step": 428339, "epoch": 5160} {"train_loss": -26.424203872680664, "global_step": 428340, "epoch": 5160} {"train_loss": -26.594696044921875, "global_step": 428341, "epoch": 5160} {"train_loss": -26.750410079956055, "global_step": 428342, "epoch": 5160} {"train_loss": -26.613876342773438, "global_step": 428343, "epoch": 5160} {"train_loss": -26.794889450073242, "global_step": 428344, "epoch": 5160} {"train_loss": -26.619489669799805, "global_step": 428345, "epoch": 5160} {"train_loss": -27.037372589111328, "global_step": 428346, "epoch": 5160} {"train_loss": -26.726058959960938, "global_step": 428347, "epoch": 5160} {"train_loss": -26.64878273010254, "global_step": 428348, "epoch": 5160} {"train_loss": -26.719526290893555, "global_step": 428349, "epoch": 5160} {"train_loss": -27.050485610961914, "global_step": 428350, "epoch": 5160} {"train_loss": -26.93804359436035, "global_step": 428351, "epoch": 5160} {"train_loss": -26.804767608642578, "global_step": 428352, "epoch": 5160} {"train_loss": -26.768295288085938, "global_step": 428353, "epoch": 5160} {"train_loss": -27.3310604095459, "global_step": 428354, "epoch": 5160} {"train_loss": -26.746479034423828, "global_step": 428355, "epoch": 5160} {"train_loss": -26.900671005249023, "global_step": 428356, "epoch": 5160} {"train_loss": -26.714202880859375, "global_step": 428357, "epoch": 5160} {"train_loss": -26.799341201782227, "global_step": 428358, "epoch": 5160} {"train_loss": -27.1295108795166, "global_step": 428359, "epoch": 5160} {"train_loss": -26.73809814453125, "global_step": 428360, "epoch": 5160} {"train_loss": -27.076284408569336, "global_step": 428361, "epoch": 5160} {"train_loss": -26.79943709775626, "global_step": 428362, "epoch": 5160, "val_loss": 6932058.5} {"train_loss": -26.7698974609375, "global_step": 428363, "epoch": 5161} {"train_loss": -26.882587432861328, "global_step": 428364, "epoch": 5161} {"train_loss": -26.65791893005371, "global_step": 428365, "epoch": 5161} {"train_loss": -26.830585479736328, "global_step": 428366, "epoch": 5161} {"train_loss": -26.516138076782227, "global_step": 428367, "epoch": 5161} {"train_loss": -26.80732536315918, "global_step": 428368, "epoch": 5161} {"train_loss": -26.946975708007812, "global_step": 428369, "epoch": 5161} {"train_loss": -26.76624870300293, "global_step": 428370, "epoch": 5161} {"train_loss": -26.649673461914062, "global_step": 428371, "epoch": 5161} {"train_loss": -26.93587303161621, "global_step": 428372, "epoch": 5161} {"train_loss": -26.847646713256836, "global_step": 428373, "epoch": 5161} {"train_loss": -26.606054306030273, "global_step": 428374, "epoch": 5161} {"train_loss": -26.99578857421875, "global_step": 428375, "epoch": 5161} {"train_loss": -26.841480255126953, "global_step": 428376, "epoch": 5161} {"train_loss": -26.554046630859375, "global_step": 428377, "epoch": 5161} {"train_loss": -27.135339736938477, "global_step": 428378, "epoch": 5161} {"train_loss": -26.766448974609375, "global_step": 428379, "epoch": 5161} {"train_loss": -26.54314613342285, "global_step": 428380, "epoch": 5161} {"train_loss": -27.125553131103516, "global_step": 428381, "epoch": 5161} {"train_loss": -26.298633575439453, "global_step": 428382, "epoch": 5161} {"train_loss": -26.641366958618164, "global_step": 428383, "epoch": 5161} {"train_loss": -26.813282012939453, "global_step": 428384, "epoch": 5161} {"train_loss": -26.958786010742188, "global_step": 428385, "epoch": 5161} {"train_loss": -26.800085067749023, "global_step": 428386, "epoch": 5161} {"train_loss": -26.620508193969727, "global_step": 428387, "epoch": 5161} {"train_loss": -26.518835067749023, "global_step": 428388, "epoch": 5161} {"train_loss": -26.80414390563965, "global_step": 428389, "epoch": 5161} {"train_loss": -26.70014762878418, "global_step": 428390, "epoch": 5161} {"train_loss": -26.72258949279785, "global_step": 428391, "epoch": 5161} {"train_loss": -26.691617965698242, "global_step": 428392, "epoch": 5161} {"train_loss": -26.37409782409668, "global_step": 428393, "epoch": 5161} {"train_loss": -26.858245849609375, "global_step": 428394, "epoch": 5161} {"train_loss": -26.83765983581543, "global_step": 428395, "epoch": 5161} {"train_loss": -26.50927734375, "global_step": 428396, "epoch": 5161} {"train_loss": -27.09369468688965, "global_step": 428397, "epoch": 5161} {"train_loss": -27.0485897064209, "global_step": 428398, "epoch": 5161} {"train_loss": -26.743717193603516, "global_step": 428399, "epoch": 5161} {"train_loss": -26.847339630126953, "global_step": 428400, "epoch": 5161} {"train_loss": -26.493356704711914, "global_step": 428401, "epoch": 5161} {"train_loss": -26.84553337097168, "global_step": 428402, "epoch": 5161} {"train_loss": -26.5162410736084, "global_step": 428403, "epoch": 5161} {"train_loss": -26.4042911529541, "global_step": 428404, "epoch": 5161} {"train_loss": -26.838781356811523, "global_step": 428405, "epoch": 5161} {"train_loss": -27.147993087768555, "global_step": 428406, "epoch": 5161} {"train_loss": -26.733198165893555, "global_step": 428407, "epoch": 5161} {"train_loss": -26.411680221557617, "global_step": 428408, "epoch": 5161} {"train_loss": -26.075397491455078, "global_step": 428409, "epoch": 5161} {"train_loss": -26.06633949279785, "global_step": 428410, "epoch": 5161} {"train_loss": -26.913909912109375, "global_step": 428411, "epoch": 5161} {"train_loss": -26.58436393737793, "global_step": 428412, "epoch": 5161} {"train_loss": -26.124536514282227, "global_step": 428413, "epoch": 5161} {"train_loss": -26.4499568939209, "global_step": 428414, "epoch": 5161} {"train_loss": -26.3614444732666, "global_step": 428415, "epoch": 5161} {"train_loss": -26.267187118530273, "global_step": 428416, "epoch": 5161} {"train_loss": -26.639184951782227, "global_step": 428417, "epoch": 5161} {"train_loss": -26.50929069519043, "global_step": 428418, "epoch": 5161} {"train_loss": -26.440479278564453, "global_step": 428419, "epoch": 5161} {"train_loss": -26.5045108795166, "global_step": 428420, "epoch": 5161} {"train_loss": -26.837417602539062, "global_step": 428421, "epoch": 5161} {"train_loss": -26.638254165649414, "global_step": 428422, "epoch": 5161} {"train_loss": -26.729772567749023, "global_step": 428423, "epoch": 5161} {"train_loss": -26.599750518798828, "global_step": 428424, "epoch": 5161} {"train_loss": -26.808048248291016, "global_step": 428425, "epoch": 5161} {"train_loss": -26.48370361328125, "global_step": 428426, "epoch": 5161} {"train_loss": -26.87537956237793, "global_step": 428427, "epoch": 5161} {"train_loss": -26.758838653564453, "global_step": 428428, "epoch": 5161} {"train_loss": -26.534317016601562, "global_step": 428429, "epoch": 5161} {"train_loss": -26.80672264099121, "global_step": 428430, "epoch": 5161} {"train_loss": -26.82965087890625, "global_step": 428431, "epoch": 5161} {"train_loss": -26.9644718170166, "global_step": 428432, "epoch": 5161} {"train_loss": -26.705289840698242, "global_step": 428433, "epoch": 5161} {"train_loss": -26.536733627319336, "global_step": 428434, "epoch": 5161} {"train_loss": -26.667984008789062, "global_step": 428435, "epoch": 5161} {"train_loss": -26.895593643188477, "global_step": 428436, "epoch": 5161} {"train_loss": -27.114654541015625, "global_step": 428437, "epoch": 5161} {"train_loss": -26.705738067626953, "global_step": 428438, "epoch": 5161} {"train_loss": -27.146276473999023, "global_step": 428439, "epoch": 5161} {"train_loss": -26.79888916015625, "global_step": 428440, "epoch": 5161} {"train_loss": -26.776752471923828, "global_step": 428441, "epoch": 5161} {"train_loss": -26.74371337890625, "global_step": 428442, "epoch": 5161} {"train_loss": -27.135894775390625, "global_step": 428443, "epoch": 5161} {"train_loss": -26.843368530273438, "global_step": 428444, "epoch": 5161} {"train_loss": -26.71361180960414, "global_step": 428445, "epoch": 5161, "val_loss": 6856217.5} {"train_loss": -25.529245376586914, "global_step": 428446, "epoch": 5162} {"train_loss": -25.89226722717285, "global_step": 428447, "epoch": 5162} {"train_loss": -25.58279800415039, "global_step": 428448, "epoch": 5162} {"train_loss": -26.24586296081543, "global_step": 428449, "epoch": 5162} {"train_loss": -26.15398597717285, "global_step": 428450, "epoch": 5162} {"train_loss": -26.34644889831543, "global_step": 428451, "epoch": 5162} {"train_loss": -26.070117950439453, "global_step": 428452, "epoch": 5162} {"train_loss": -26.537616729736328, "global_step": 428453, "epoch": 5162} {"train_loss": -26.181787490844727, "global_step": 428454, "epoch": 5162} {"train_loss": -26.0754451751709, "global_step": 428455, "epoch": 5162} {"train_loss": -26.439794540405273, "global_step": 428456, "epoch": 5162} {"train_loss": -26.14948844909668, "global_step": 428457, "epoch": 5162} {"train_loss": -26.65690040588379, "global_step": 428458, "epoch": 5162} {"train_loss": -26.496931076049805, "global_step": 428459, "epoch": 5162} {"train_loss": -26.50587272644043, "global_step": 428460, "epoch": 5162} {"train_loss": -25.868310928344727, "global_step": 428461, "epoch": 5162} {"train_loss": -26.58023452758789, "global_step": 428462, "epoch": 5162} {"train_loss": -26.080732345581055, "global_step": 428463, "epoch": 5162} {"train_loss": -26.185718536376953, "global_step": 428464, "epoch": 5162} {"train_loss": -26.76287269592285, "global_step": 428465, "epoch": 5162} {"train_loss": -26.07330322265625, "global_step": 428466, "epoch": 5162} {"train_loss": -26.516576766967773, "global_step": 428467, "epoch": 5162} {"train_loss": -26.56426429748535, "global_step": 428468, "epoch": 5162} {"train_loss": -26.65296745300293, "global_step": 428469, "epoch": 5162} {"train_loss": -26.736303329467773, "global_step": 428470, "epoch": 5162} {"train_loss": -26.924474716186523, "global_step": 428471, "epoch": 5162} {"train_loss": -26.119800567626953, "global_step": 428472, "epoch": 5162} {"train_loss": -26.60332679748535, "global_step": 428473, "epoch": 5162} {"train_loss": -26.538883209228516, "global_step": 428474, "epoch": 5162} {"train_loss": -26.675537109375, "global_step": 428475, "epoch": 5162} {"train_loss": -26.268869400024414, "global_step": 428476, "epoch": 5162} {"train_loss": -26.598678588867188, "global_step": 428477, "epoch": 5162} {"train_loss": -26.233230590820312, "global_step": 428478, "epoch": 5162} {"train_loss": -26.820646286010742, "global_step": 428479, "epoch": 5162} {"train_loss": -26.689483642578125, "global_step": 428480, "epoch": 5162} {"train_loss": -26.69428825378418, "global_step": 428481, "epoch": 5162} {"train_loss": -26.66668128967285, "global_step": 428482, "epoch": 5162} {"train_loss": -27.18184471130371, "global_step": 428483, "epoch": 5162} {"train_loss": -26.499921798706055, "global_step": 428484, "epoch": 5162} {"train_loss": -26.66352653503418, "global_step": 428485, "epoch": 5162} {"train_loss": -26.482969284057617, "global_step": 428486, "epoch": 5162} {"train_loss": -26.64405632019043, "global_step": 428487, "epoch": 5162} {"train_loss": -26.78632164001465, "global_step": 428488, "epoch": 5162} {"train_loss": -26.79941749572754, "global_step": 428489, "epoch": 5162} {"train_loss": -26.781137466430664, "global_step": 428490, "epoch": 5162} {"train_loss": -26.859060287475586, "global_step": 428491, "epoch": 5162} {"train_loss": -27.03936195373535, "global_step": 428492, "epoch": 5162} {"train_loss": -26.682357788085938, "global_step": 428493, "epoch": 5162} {"train_loss": -26.92095947265625, "global_step": 428494, "epoch": 5162} {"train_loss": -27.179723739624023, "global_step": 428495, "epoch": 5162} {"train_loss": -26.576745986938477, "global_step": 428496, "epoch": 5162} {"train_loss": -26.95066261291504, "global_step": 428497, "epoch": 5162} {"train_loss": -27.131860733032227, "global_step": 428498, "epoch": 5162} {"train_loss": -26.9954776763916, "global_step": 428499, "epoch": 5162} {"train_loss": -26.73343276977539, "global_step": 428500, "epoch": 5162} {"train_loss": -26.52338981628418, "global_step": 428501, "epoch": 5162} {"train_loss": -27.17099952697754, "global_step": 428502, "epoch": 5162} {"train_loss": -27.169513702392578, "global_step": 428503, "epoch": 5162} {"train_loss": -26.99749183654785, "global_step": 428504, "epoch": 5162} {"train_loss": -26.62763786315918, "global_step": 428505, "epoch": 5162} {"train_loss": -26.94921875, "global_step": 428506, "epoch": 5162} {"train_loss": -26.45920753479004, "global_step": 428507, "epoch": 5162} {"train_loss": -26.80303382873535, "global_step": 428508, "epoch": 5162} {"train_loss": -26.89912223815918, "global_step": 428509, "epoch": 5162} {"train_loss": -27.12738037109375, "global_step": 428510, "epoch": 5162} {"train_loss": -26.88557243347168, "global_step": 428511, "epoch": 5162} {"train_loss": -27.290327072143555, "global_step": 428512, "epoch": 5162} {"train_loss": -26.490848541259766, "global_step": 428513, "epoch": 5162} {"train_loss": -26.884428024291992, "global_step": 428514, "epoch": 5162} {"train_loss": -26.85772132873535, "global_step": 428515, "epoch": 5162} {"train_loss": -26.297607421875, "global_step": 428516, "epoch": 5162} {"train_loss": -26.16669273376465, "global_step": 428517, "epoch": 5162} {"train_loss": -25.820709228515625, "global_step": 428518, "epoch": 5162} {"train_loss": -26.40073013305664, "global_step": 428519, "epoch": 5162} {"train_loss": -26.075611114501953, "global_step": 428520, "epoch": 5162} {"train_loss": -26.25971031188965, "global_step": 428521, "epoch": 5162} {"train_loss": -26.777708053588867, "global_step": 428522, "epoch": 5162} {"train_loss": -25.979389190673828, "global_step": 428523, "epoch": 5162} {"train_loss": -26.401777267456055, "global_step": 428524, "epoch": 5162} {"train_loss": -26.705524444580078, "global_step": 428525, "epoch": 5162} {"train_loss": -26.443790435791016, "global_step": 428526, "epoch": 5162} {"train_loss": -26.513906478881836, "global_step": 428527, "epoch": 5162} {"train_loss": -26.546972412660896, "global_step": 428528, "epoch": 5162, "val_loss": 6998140.0} {"train_loss": -26.142263412475586, "global_step": 428529, "epoch": 5163} {"train_loss": -26.277450561523438, "global_step": 428530, "epoch": 5163} {"train_loss": -26.591297149658203, "global_step": 428531, "epoch": 5163} {"train_loss": -26.555341720581055, "global_step": 428532, "epoch": 5163} {"train_loss": -26.522619247436523, "global_step": 428533, "epoch": 5163} {"train_loss": -26.29083251953125, "global_step": 428534, "epoch": 5163} {"train_loss": -26.631317138671875, "global_step": 428535, "epoch": 5163} {"train_loss": -26.889081954956055, "global_step": 428536, "epoch": 5163} {"train_loss": -26.77857780456543, "global_step": 428537, "epoch": 5163} {"train_loss": -26.47638511657715, "global_step": 428538, "epoch": 5163} {"train_loss": -27.01007080078125, "global_step": 428539, "epoch": 5163} {"train_loss": -26.930509567260742, "global_step": 428540, "epoch": 5163} {"train_loss": -26.40433692932129, "global_step": 428541, "epoch": 5163} {"train_loss": -26.748144149780273, "global_step": 428542, "epoch": 5163} {"train_loss": -26.512052536010742, "global_step": 428543, "epoch": 5163} {"train_loss": -26.757741928100586, "global_step": 428544, "epoch": 5163} {"train_loss": -26.347766876220703, "global_step": 428545, "epoch": 5163} {"train_loss": -27.037931442260742, "global_step": 428546, "epoch": 5163} {"train_loss": -26.78077507019043, "global_step": 428547, "epoch": 5163} {"train_loss": -26.895246505737305, "global_step": 428548, "epoch": 5163} {"train_loss": -26.719812393188477, "global_step": 428549, "epoch": 5163} {"train_loss": -27.17462158203125, "global_step": 428550, "epoch": 5163} {"train_loss": -27.0753231048584, "global_step": 428551, "epoch": 5163} {"train_loss": -26.97346305847168, "global_step": 428552, "epoch": 5163} {"train_loss": -26.87676429748535, "global_step": 428553, "epoch": 5163} {"train_loss": -26.89517593383789, "global_step": 428554, "epoch": 5163} {"train_loss": -26.74248695373535, "global_step": 428555, "epoch": 5163} {"train_loss": -26.946725845336914, "global_step": 428556, "epoch": 5163} {"train_loss": -27.0546875, "global_step": 428557, "epoch": 5163} {"train_loss": -26.925500869750977, "global_step": 428558, "epoch": 5163} {"train_loss": -27.113082885742188, "global_step": 428559, "epoch": 5163} {"train_loss": -27.274951934814453, "global_step": 428560, "epoch": 5163} {"train_loss": -27.26190757751465, "global_step": 428561, "epoch": 5163} {"train_loss": -27.20064353942871, "global_step": 428562, "epoch": 5163} {"train_loss": -26.68671989440918, "global_step": 428563, "epoch": 5163} {"train_loss": -26.940637588500977, "global_step": 428564, "epoch": 5163} {"train_loss": -27.305200576782227, "global_step": 428565, "epoch": 5163} {"train_loss": -26.74225425720215, "global_step": 428566, "epoch": 5163} {"train_loss": -26.715219497680664, "global_step": 428567, "epoch": 5163} {"train_loss": -26.492694854736328, "global_step": 428568, "epoch": 5163} {"train_loss": -26.31941032409668, "global_step": 428569, "epoch": 5163} {"train_loss": -26.881208419799805, "global_step": 428570, "epoch": 5163} {"train_loss": -26.506591796875, "global_step": 428571, "epoch": 5163} {"train_loss": -27.135862350463867, "global_step": 428572, "epoch": 5163} {"train_loss": -26.402929306030273, "global_step": 428573, "epoch": 5163} {"train_loss": -26.13828468322754, "global_step": 428574, "epoch": 5163} {"train_loss": -26.72433853149414, "global_step": 428575, "epoch": 5163} {"train_loss": -27.3199462890625, "global_step": 428576, "epoch": 5163} {"train_loss": -26.588088989257812, "global_step": 428577, "epoch": 5163} {"train_loss": -26.463836669921875, "global_step": 428578, "epoch": 5163} {"train_loss": -26.470895767211914, "global_step": 428579, "epoch": 5163} {"train_loss": -26.434284210205078, "global_step": 428580, "epoch": 5163} {"train_loss": -27.04624366760254, "global_step": 428581, "epoch": 5163} {"train_loss": -26.945653915405273, "global_step": 428582, "epoch": 5163} {"train_loss": -26.7669734954834, "global_step": 428583, "epoch": 5163} {"train_loss": -27.222803115844727, "global_step": 428584, "epoch": 5163} {"train_loss": -27.097888946533203, "global_step": 428585, "epoch": 5163} {"train_loss": -27.113576889038086, "global_step": 428586, "epoch": 5163} {"train_loss": -27.046316146850586, "global_step": 428587, "epoch": 5163} {"train_loss": -26.97992515563965, "global_step": 428588, "epoch": 5163} {"train_loss": -26.830097198486328, "global_step": 428589, "epoch": 5163} {"train_loss": -27.194183349609375, "global_step": 428590, "epoch": 5163} {"train_loss": -26.9515380859375, "global_step": 428591, "epoch": 5163} {"train_loss": -26.69925308227539, "global_step": 428592, "epoch": 5163} {"train_loss": -27.03167724609375, "global_step": 428593, "epoch": 5163} {"train_loss": -26.889474868774414, "global_step": 428594, "epoch": 5163} {"train_loss": -27.19038200378418, "global_step": 428595, "epoch": 5163} {"train_loss": -27.14277458190918, "global_step": 428596, "epoch": 5163} {"train_loss": -27.456134796142578, "global_step": 428597, "epoch": 5163} {"train_loss": -26.780593872070312, "global_step": 428598, "epoch": 5163} {"train_loss": -26.921655654907227, "global_step": 428599, "epoch": 5163} {"train_loss": -26.796432495117188, "global_step": 428600, "epoch": 5163} {"train_loss": -26.99012565612793, "global_step": 428601, "epoch": 5163} {"train_loss": -27.04414176940918, "global_step": 428602, "epoch": 5163} {"train_loss": -27.25701332092285, "global_step": 428603, "epoch": 5163} {"train_loss": -26.882360458374023, "global_step": 428604, "epoch": 5163} {"train_loss": -27.067138671875, "global_step": 428605, "epoch": 5163} {"train_loss": -26.986297607421875, "global_step": 428606, "epoch": 5163} {"train_loss": -27.190567016601562, "global_step": 428607, "epoch": 5163} {"train_loss": -26.971435546875, "global_step": 428608, "epoch": 5163} {"train_loss": -26.784231185913086, "global_step": 428609, "epoch": 5163} {"train_loss": -26.8359432220459, "global_step": 428610, "epoch": 5163} {"train_loss": -26.846723671419074, "global_step": 428611, "epoch": 5163, "val_loss": 6904587.0} {"train_loss": -24.97658348083496, "global_step": 428612, "epoch": 5164} {"train_loss": -25.215070724487305, "global_step": 428613, "epoch": 5164} {"train_loss": -25.450197219848633, "global_step": 428614, "epoch": 5164} {"train_loss": -25.543188095092773, "global_step": 428615, "epoch": 5164} {"train_loss": -25.37202262878418, "global_step": 428616, "epoch": 5164} {"train_loss": -25.26942253112793, "global_step": 428617, "epoch": 5164} {"train_loss": -25.849531173706055, "global_step": 428618, "epoch": 5164} {"train_loss": -25.6090145111084, "global_step": 428619, "epoch": 5164} {"train_loss": -26.237323760986328, "global_step": 428620, "epoch": 5164} {"train_loss": -26.057575225830078, "global_step": 428621, "epoch": 5164} {"train_loss": -25.90907096862793, "global_step": 428622, "epoch": 5164} {"train_loss": -25.9936580657959, "global_step": 428623, "epoch": 5164} {"train_loss": -25.870092391967773, "global_step": 428624, "epoch": 5164} {"train_loss": -26.240522384643555, "global_step": 428625, "epoch": 5164} {"train_loss": -26.405139923095703, "global_step": 428626, "epoch": 5164} {"train_loss": -26.32635498046875, "global_step": 428627, "epoch": 5164} {"train_loss": -26.068716049194336, "global_step": 428628, "epoch": 5164} {"train_loss": -25.9500789642334, "global_step": 428629, "epoch": 5164} {"train_loss": -26.141759872436523, "global_step": 428630, "epoch": 5164} {"train_loss": -26.44256591796875, "global_step": 428631, "epoch": 5164} {"train_loss": -26.481870651245117, "global_step": 428632, "epoch": 5164} {"train_loss": -26.558155059814453, "global_step": 428633, "epoch": 5164} {"train_loss": -26.34500503540039, "global_step": 428634, "epoch": 5164} {"train_loss": -26.388397216796875, "global_step": 428635, "epoch": 5164} {"train_loss": -26.7737979888916, "global_step": 428636, "epoch": 5164} {"train_loss": -26.427570343017578, "global_step": 428637, "epoch": 5164} {"train_loss": -26.45453453063965, "global_step": 428638, "epoch": 5164} {"train_loss": -26.8199405670166, "global_step": 428639, "epoch": 5164} {"train_loss": -26.707523345947266, "global_step": 428640, "epoch": 5164} {"train_loss": -27.178424835205078, "global_step": 428641, "epoch": 5164} {"train_loss": -26.568078994750977, "global_step": 428642, "epoch": 5164} {"train_loss": -26.689977645874023, "global_step": 428643, "epoch": 5164} {"train_loss": -26.422443389892578, "global_step": 428644, "epoch": 5164} {"train_loss": -26.864013671875, "global_step": 428645, "epoch": 5164} {"train_loss": -26.893096923828125, "global_step": 428646, "epoch": 5164} {"train_loss": -26.188291549682617, "global_step": 428647, "epoch": 5164} {"train_loss": -26.62848472595215, "global_step": 428648, "epoch": 5164} {"train_loss": -27.124189376831055, "global_step": 428649, "epoch": 5164} {"train_loss": -26.926706314086914, "global_step": 428650, "epoch": 5164} {"train_loss": -27.01995849609375, "global_step": 428651, "epoch": 5164} {"train_loss": -26.922483444213867, "global_step": 428652, "epoch": 5164} {"train_loss": -27.137237548828125, "global_step": 428653, "epoch": 5164} {"train_loss": -26.507843017578125, "global_step": 428654, "epoch": 5164} {"train_loss": -26.805944442749023, "global_step": 428655, "epoch": 5164} {"train_loss": -26.982858657836914, "global_step": 428656, "epoch": 5164} {"train_loss": -27.0025577545166, "global_step": 428657, "epoch": 5164} {"train_loss": -27.081787109375, "global_step": 428658, "epoch": 5164} {"train_loss": -27.18538475036621, "global_step": 428659, "epoch": 5164} {"train_loss": -26.80353355407715, "global_step": 428660, "epoch": 5164} {"train_loss": -26.988691329956055, "global_step": 428661, "epoch": 5164} {"train_loss": -26.768468856811523, "global_step": 428662, "epoch": 5164} {"train_loss": -26.84364128112793, "global_step": 428663, "epoch": 5164} {"train_loss": -27.031818389892578, "global_step": 428664, "epoch": 5164} {"train_loss": -26.864105224609375, "global_step": 428665, "epoch": 5164} {"train_loss": -27.02754783630371, "global_step": 428666, "epoch": 5164} {"train_loss": -27.132978439331055, "global_step": 428667, "epoch": 5164} {"train_loss": -27.035932540893555, "global_step": 428668, "epoch": 5164} {"train_loss": -26.9337158203125, "global_step": 428669, "epoch": 5164} {"train_loss": -26.939184188842773, "global_step": 428670, "epoch": 5164} {"train_loss": -26.698766708374023, "global_step": 428671, "epoch": 5164} {"train_loss": -26.703062057495117, "global_step": 428672, "epoch": 5164} {"train_loss": -26.977569580078125, "global_step": 428673, "epoch": 5164} {"train_loss": -26.9219913482666, "global_step": 428674, "epoch": 5164} {"train_loss": -27.1754093170166, "global_step": 428675, "epoch": 5164} {"train_loss": -26.522451400756836, "global_step": 428676, "epoch": 5164} {"train_loss": -27.031930923461914, "global_step": 428677, "epoch": 5164} {"train_loss": -27.145172119140625, "global_step": 428678, "epoch": 5164} {"train_loss": -26.630590438842773, "global_step": 428679, "epoch": 5164} {"train_loss": -26.9190616607666, "global_step": 428680, "epoch": 5164} {"train_loss": -27.082883834838867, "global_step": 428681, "epoch": 5164} {"train_loss": -26.711944580078125, "global_step": 428682, "epoch": 5164} {"train_loss": -26.69989013671875, "global_step": 428683, "epoch": 5164} {"train_loss": -26.599157333374023, "global_step": 428684, "epoch": 5164} {"train_loss": -26.152515411376953, "global_step": 428685, "epoch": 5164} {"train_loss": -26.51981544494629, "global_step": 428686, "epoch": 5164} {"train_loss": -26.24673843383789, "global_step": 428687, "epoch": 5164} {"train_loss": -26.270999908447266, "global_step": 428688, "epoch": 5164} {"train_loss": -27.169570922851562, "global_step": 428689, "epoch": 5164} {"train_loss": -26.463415145874023, "global_step": 428690, "epoch": 5164} {"train_loss": -26.809467315673828, "global_step": 428691, "epoch": 5164} {"train_loss": -27.019922256469727, "global_step": 428692, "epoch": 5164} {"train_loss": -26.827341079711914, "global_step": 428693, "epoch": 5164} {"train_loss": -26.569801192685784, "global_step": 428694, "epoch": 5164, "val_loss": 6930115.5} {"train_loss": -24.931598663330078, "global_step": 428695, "epoch": 5165} {"train_loss": -25.875822067260742, "global_step": 428696, "epoch": 5165} {"train_loss": -25.913482666015625, "global_step": 428697, "epoch": 5165} {"train_loss": -25.020593643188477, "global_step": 428698, "epoch": 5165} {"train_loss": -25.625568389892578, "global_step": 428699, "epoch": 5165} {"train_loss": -25.584611892700195, "global_step": 428700, "epoch": 5165} {"train_loss": -25.590246200561523, "global_step": 428701, "epoch": 5165} {"train_loss": -26.46616554260254, "global_step": 428702, "epoch": 5165} {"train_loss": -26.0677433013916, "global_step": 428703, "epoch": 5165} {"train_loss": -25.967920303344727, "global_step": 428704, "epoch": 5165} {"train_loss": -26.31766128540039, "global_step": 428705, "epoch": 5165} {"train_loss": -26.39666175842285, "global_step": 428706, "epoch": 5165} {"train_loss": -26.34541130065918, "global_step": 428707, "epoch": 5165} {"train_loss": -26.027231216430664, "global_step": 428708, "epoch": 5165} {"train_loss": -26.23933219909668, "global_step": 428709, "epoch": 5165} {"train_loss": -26.3187255859375, "global_step": 428710, "epoch": 5165} {"train_loss": -26.336835861206055, "global_step": 428711, "epoch": 5165} {"train_loss": -26.527795791625977, "global_step": 428712, "epoch": 5165} {"train_loss": -26.45937156677246, "global_step": 428713, "epoch": 5165} {"train_loss": -26.302478790283203, "global_step": 428714, "epoch": 5165} {"train_loss": -26.434314727783203, "global_step": 428715, "epoch": 5165} {"train_loss": -26.38116455078125, "global_step": 428716, "epoch": 5165} {"train_loss": -26.194782257080078, "global_step": 428717, "epoch": 5165} {"train_loss": -26.392988204956055, "global_step": 428718, "epoch": 5165} {"train_loss": -26.696792602539062, "global_step": 428719, "epoch": 5165} {"train_loss": -26.858673095703125, "global_step": 428720, "epoch": 5165} {"train_loss": -26.634984970092773, "global_step": 428721, "epoch": 5165} {"train_loss": -26.56396484375, "global_step": 428722, "epoch": 5165} {"train_loss": -26.636011123657227, "global_step": 428723, "epoch": 5165} {"train_loss": -26.579288482666016, "global_step": 428724, "epoch": 5165} {"train_loss": -26.5885066986084, "global_step": 428725, "epoch": 5165} {"train_loss": -26.80091667175293, "global_step": 428726, "epoch": 5165} {"train_loss": -26.686532974243164, "global_step": 428727, "epoch": 5165} {"train_loss": -26.935413360595703, "global_step": 428728, "epoch": 5165} {"train_loss": -26.92909812927246, "global_step": 428729, "epoch": 5165} {"train_loss": -26.856830596923828, "global_step": 428730, "epoch": 5165} {"train_loss": -26.86594581604004, "global_step": 428731, "epoch": 5165} {"train_loss": -26.92597770690918, "global_step": 428732, "epoch": 5165} {"train_loss": -27.001056671142578, "global_step": 428733, "epoch": 5165} {"train_loss": -26.838098526000977, "global_step": 428734, "epoch": 5165} {"train_loss": -27.073963165283203, "global_step": 428735, "epoch": 5165} {"train_loss": -26.975788116455078, "global_step": 428736, "epoch": 5165} {"train_loss": -26.807697296142578, "global_step": 428737, "epoch": 5165} {"train_loss": -26.671802520751953, "global_step": 428738, "epoch": 5165} {"train_loss": -26.966394424438477, "global_step": 428739, "epoch": 5165} {"train_loss": -26.791385650634766, "global_step": 428740, "epoch": 5165} {"train_loss": -26.63884925842285, "global_step": 428741, "epoch": 5165} {"train_loss": -27.150434494018555, "global_step": 428742, "epoch": 5165} {"train_loss": -26.959943771362305, "global_step": 428743, "epoch": 5165} {"train_loss": -26.784406661987305, "global_step": 428744, "epoch": 5165} {"train_loss": -26.7147159576416, "global_step": 428745, "epoch": 5165} {"train_loss": -26.75054931640625, "global_step": 428746, "epoch": 5165} {"train_loss": -26.860761642456055, "global_step": 428747, "epoch": 5165} {"train_loss": -26.469247817993164, "global_step": 428748, "epoch": 5165} {"train_loss": -26.779699325561523, "global_step": 428749, "epoch": 5165} {"train_loss": -27.002023696899414, "global_step": 428750, "epoch": 5165} {"train_loss": -26.866180419921875, "global_step": 428751, "epoch": 5165} {"train_loss": -26.938169479370117, "global_step": 428752, "epoch": 5165} {"train_loss": -26.924509048461914, "global_step": 428753, "epoch": 5165} {"train_loss": -26.82695960998535, "global_step": 428754, "epoch": 5165} {"train_loss": -26.8444766998291, "global_step": 428755, "epoch": 5165} {"train_loss": -27.230331420898438, "global_step": 428756, "epoch": 5165} {"train_loss": -26.887189865112305, "global_step": 428757, "epoch": 5165} {"train_loss": -26.99806785583496, "global_step": 428758, "epoch": 5165} {"train_loss": -26.668716430664062, "global_step": 428759, "epoch": 5165} {"train_loss": -26.784427642822266, "global_step": 428760, "epoch": 5165} {"train_loss": -26.985279083251953, "global_step": 428761, "epoch": 5165} {"train_loss": -27.183807373046875, "global_step": 428762, "epoch": 5165} {"train_loss": -26.935129165649414, "global_step": 428763, "epoch": 5165} {"train_loss": -27.198699951171875, "global_step": 428764, "epoch": 5165} {"train_loss": -26.897785186767578, "global_step": 428765, "epoch": 5165} {"train_loss": -27.080841064453125, "global_step": 428766, "epoch": 5165} {"train_loss": -26.884504318237305, "global_step": 428767, "epoch": 5165} {"train_loss": -26.982807159423828, "global_step": 428768, "epoch": 5165} {"train_loss": -26.806812286376953, "global_step": 428769, "epoch": 5165} {"train_loss": -27.12513542175293, "global_step": 428770, "epoch": 5165} {"train_loss": -26.797155380249023, "global_step": 428771, "epoch": 5165} {"train_loss": -26.98255729675293, "global_step": 428772, "epoch": 5165} {"train_loss": -27.302753448486328, "global_step": 428773, "epoch": 5165} {"train_loss": -27.070301055908203, "global_step": 428774, "epoch": 5165} {"train_loss": -26.75147819519043, "global_step": 428775, "epoch": 5165} {"train_loss": -26.725244522094727, "global_step": 428776, "epoch": 5165} {"train_loss": -26.627449012664428, "global_step": 428777, "epoch": 5165, "val_loss": 7016506.0} {"train_loss": -25.209945678710938, "global_step": 428778, "epoch": 5166} {"train_loss": -24.63863754272461, "global_step": 428779, "epoch": 5166} {"train_loss": -24.816680908203125, "global_step": 428780, "epoch": 5166} {"train_loss": -25.018360137939453, "global_step": 428781, "epoch": 5166} {"train_loss": -24.996572494506836, "global_step": 428782, "epoch": 5166} {"train_loss": -24.778989791870117, "global_step": 428783, "epoch": 5166} {"train_loss": -24.734920501708984, "global_step": 428784, "epoch": 5166} {"train_loss": -25.35348892211914, "global_step": 428785, "epoch": 5166} {"train_loss": -25.272911071777344, "global_step": 428786, "epoch": 5166} {"train_loss": -25.33339500427246, "global_step": 428787, "epoch": 5166} {"train_loss": -26.21396827697754, "global_step": 428788, "epoch": 5166} {"train_loss": -25.974884033203125, "global_step": 428789, "epoch": 5166} {"train_loss": -26.18096351623535, "global_step": 428790, "epoch": 5166} {"train_loss": -26.155683517456055, "global_step": 428791, "epoch": 5166} {"train_loss": -25.976959228515625, "global_step": 428792, "epoch": 5166} {"train_loss": -26.10980796813965, "global_step": 428793, "epoch": 5166} {"train_loss": -26.443967819213867, "global_step": 428794, "epoch": 5166} {"train_loss": -26.31646156311035, "global_step": 428795, "epoch": 5166} {"train_loss": -26.2683048248291, "global_step": 428796, "epoch": 5166} {"train_loss": -26.411975860595703, "global_step": 428797, "epoch": 5166} {"train_loss": -26.503599166870117, "global_step": 428798, "epoch": 5166} {"train_loss": -26.3360652923584, "global_step": 428799, "epoch": 5166} {"train_loss": -26.24763298034668, "global_step": 428800, "epoch": 5166} {"train_loss": -26.79389762878418, "global_step": 428801, "epoch": 5166} {"train_loss": -26.575529098510742, "global_step": 428802, "epoch": 5166} {"train_loss": -26.806991577148438, "global_step": 428803, "epoch": 5166} {"train_loss": -26.532459259033203, "global_step": 428804, "epoch": 5166} {"train_loss": -26.688901901245117, "global_step": 428805, "epoch": 5166} {"train_loss": -26.845869064331055, "global_step": 428806, "epoch": 5166} {"train_loss": -26.739429473876953, "global_step": 428807, "epoch": 5166} {"train_loss": -26.708942413330078, "global_step": 428808, "epoch": 5166} {"train_loss": -26.579345703125, "global_step": 428809, "epoch": 5166} {"train_loss": -26.421918869018555, "global_step": 428810, "epoch": 5166} {"train_loss": -26.73854637145996, "global_step": 428811, "epoch": 5166} {"train_loss": -26.737524032592773, "global_step": 428812, "epoch": 5166} {"train_loss": -26.93073844909668, "global_step": 428813, "epoch": 5166} {"train_loss": -26.36269187927246, "global_step": 428814, "epoch": 5166} {"train_loss": -26.6648006439209, "global_step": 428815, "epoch": 5166} {"train_loss": -26.699369430541992, "global_step": 428816, "epoch": 5166} {"train_loss": -26.67909812927246, "global_step": 428817, "epoch": 5166} {"train_loss": -26.467151641845703, "global_step": 428818, "epoch": 5166} {"train_loss": -26.812681198120117, "global_step": 428819, "epoch": 5166} {"train_loss": -26.759449005126953, "global_step": 428820, "epoch": 5166} {"train_loss": -26.81073570251465, "global_step": 428821, "epoch": 5166} {"train_loss": -26.634862899780273, "global_step": 428822, "epoch": 5166} {"train_loss": -27.066370010375977, "global_step": 428823, "epoch": 5166} {"train_loss": -26.715717315673828, "global_step": 428824, "epoch": 5166} {"train_loss": -26.58843994140625, "global_step": 428825, "epoch": 5166} {"train_loss": -27.178613662719727, "global_step": 428826, "epoch": 5166} {"train_loss": -27.26204490661621, "global_step": 428827, "epoch": 5166} {"train_loss": -27.0079288482666, "global_step": 428828, "epoch": 5166} {"train_loss": -27.125940322875977, "global_step": 428829, "epoch": 5166} {"train_loss": -26.855371475219727, "global_step": 428830, "epoch": 5166} {"train_loss": -27.28853416442871, "global_step": 428831, "epoch": 5166} {"train_loss": -26.965530395507812, "global_step": 428832, "epoch": 5166} {"train_loss": -26.50498390197754, "global_step": 428833, "epoch": 5166} {"train_loss": -26.92300796508789, "global_step": 428834, "epoch": 5166} {"train_loss": -26.931554794311523, "global_step": 428835, "epoch": 5166} {"train_loss": -27.07253074645996, "global_step": 428836, "epoch": 5166} {"train_loss": -26.842395782470703, "global_step": 428837, "epoch": 5166} {"train_loss": -26.744489669799805, "global_step": 428838, "epoch": 5166} {"train_loss": -26.718780517578125, "global_step": 428839, "epoch": 5166} {"train_loss": -26.604440689086914, "global_step": 428840, "epoch": 5166} {"train_loss": -26.915945053100586, "global_step": 428841, "epoch": 5166} {"train_loss": -27.01171875, "global_step": 428842, "epoch": 5166} {"train_loss": -27.01222801208496, "global_step": 428843, "epoch": 5166} {"train_loss": -26.93180274963379, "global_step": 428844, "epoch": 5166} {"train_loss": -26.858600616455078, "global_step": 428845, "epoch": 5166} {"train_loss": -27.25591468811035, "global_step": 428846, "epoch": 5166} {"train_loss": -26.9631290435791, "global_step": 428847, "epoch": 5166} {"train_loss": -26.84027671813965, "global_step": 428848, "epoch": 5166} {"train_loss": -26.561054229736328, "global_step": 428849, "epoch": 5166} {"train_loss": -26.97907066345215, "global_step": 428850, "epoch": 5166} {"train_loss": -26.335906982421875, "global_step": 428851, "epoch": 5166} {"train_loss": -26.702367782592773, "global_step": 428852, "epoch": 5166} {"train_loss": -27.082046508789062, "global_step": 428853, "epoch": 5166} {"train_loss": -26.96758460998535, "global_step": 428854, "epoch": 5166} {"train_loss": -26.610315322875977, "global_step": 428855, "epoch": 5166} {"train_loss": -26.835744857788086, "global_step": 428856, "epoch": 5166} {"train_loss": -26.91971206665039, "global_step": 428857, "epoch": 5166} {"train_loss": -26.9793643951416, "global_step": 428858, "epoch": 5166} {"train_loss": -26.879255294799805, "global_step": 428859, "epoch": 5166} {"train_loss": -26.50927750461073, "global_step": 428860, "epoch": 5166, "val_loss": 6500383.0} {"train_loss": -26.07563591003418, "global_step": 428861, "epoch": 5167} {"train_loss": -25.50677490234375, "global_step": 428862, "epoch": 5167} {"train_loss": -26.068445205688477, "global_step": 428863, "epoch": 5167} {"train_loss": -26.6054744720459, "global_step": 428864, "epoch": 5167} {"train_loss": -26.525863647460938, "global_step": 428865, "epoch": 5167} {"train_loss": -26.36225700378418, "global_step": 428866, "epoch": 5167} {"train_loss": -26.35675621032715, "global_step": 428867, "epoch": 5167} {"train_loss": -26.4609432220459, "global_step": 428868, "epoch": 5167} {"train_loss": -26.798383712768555, "global_step": 428869, "epoch": 5167} {"train_loss": -26.438940048217773, "global_step": 428870, "epoch": 5167} {"train_loss": -26.25634765625, "global_step": 428871, "epoch": 5167} {"train_loss": -26.006454467773438, "global_step": 428872, "epoch": 5167} {"train_loss": -26.2628231048584, "global_step": 428873, "epoch": 5167} {"train_loss": -26.419513702392578, "global_step": 428874, "epoch": 5167} {"train_loss": -26.54242515563965, "global_step": 428875, "epoch": 5167} {"train_loss": -26.306354522705078, "global_step": 428876, "epoch": 5167} {"train_loss": -26.715063095092773, "global_step": 428877, "epoch": 5167} {"train_loss": -26.96548843383789, "global_step": 428878, "epoch": 5167} {"train_loss": -26.32321548461914, "global_step": 428879, "epoch": 5167} {"train_loss": -26.496475219726562, "global_step": 428880, "epoch": 5167} {"train_loss": -26.480701446533203, "global_step": 428881, "epoch": 5167} {"train_loss": -26.513288497924805, "global_step": 428882, "epoch": 5167} {"train_loss": -26.807092666625977, "global_step": 428883, "epoch": 5167} {"train_loss": -26.586883544921875, "global_step": 428884, "epoch": 5167} {"train_loss": -26.736148834228516, "global_step": 428885, "epoch": 5167} {"train_loss": -26.93050193786621, "global_step": 428886, "epoch": 5167} {"train_loss": -26.441320419311523, "global_step": 428887, "epoch": 5167} {"train_loss": -27.017459869384766, "global_step": 428888, "epoch": 5167} {"train_loss": -26.9324951171875, "global_step": 428889, "epoch": 5167} {"train_loss": -26.87604331970215, "global_step": 428890, "epoch": 5167} {"train_loss": -27.0096378326416, "global_step": 428891, "epoch": 5167} {"train_loss": -27.023767471313477, "global_step": 428892, "epoch": 5167} {"train_loss": -26.8431453704834, "global_step": 428893, "epoch": 5167} {"train_loss": -26.69917106628418, "global_step": 428894, "epoch": 5167} {"train_loss": -27.010650634765625, "global_step": 428895, "epoch": 5167} {"train_loss": -26.906110763549805, "global_step": 428896, "epoch": 5167} {"train_loss": -27.33331298828125, "global_step": 428897, "epoch": 5167} {"train_loss": -27.353534698486328, "global_step": 428898, "epoch": 5167} {"train_loss": -27.082019805908203, "global_step": 428899, "epoch": 5167} {"train_loss": -27.126819610595703, "global_step": 428900, "epoch": 5167} {"train_loss": -27.23178482055664, "global_step": 428901, "epoch": 5167} {"train_loss": -27.206586837768555, "global_step": 428902, "epoch": 5167} {"train_loss": -26.965641021728516, "global_step": 428903, "epoch": 5167} {"train_loss": -26.787097930908203, "global_step": 428904, "epoch": 5167} {"train_loss": -26.852075576782227, "global_step": 428905, "epoch": 5167} {"train_loss": -27.086729049682617, "global_step": 428906, "epoch": 5167} {"train_loss": -26.9244384765625, "global_step": 428907, "epoch": 5167} {"train_loss": -26.45660972595215, "global_step": 428908, "epoch": 5167} {"train_loss": -27.21307373046875, "global_step": 428909, "epoch": 5167} {"train_loss": -26.667957305908203, "global_step": 428910, "epoch": 5167} {"train_loss": -26.774097442626953, "global_step": 428911, "epoch": 5167} {"train_loss": -26.558765411376953, "global_step": 428912, "epoch": 5167} {"train_loss": -26.6037540435791, "global_step": 428913, "epoch": 5167} {"train_loss": -27.063425064086914, "global_step": 428914, "epoch": 5167} {"train_loss": -26.795459747314453, "global_step": 428915, "epoch": 5167} {"train_loss": -26.93147087097168, "global_step": 428916, "epoch": 5167} {"train_loss": -26.821273803710938, "global_step": 428917, "epoch": 5167} {"train_loss": -26.656702041625977, "global_step": 428918, "epoch": 5167} {"train_loss": -27.200647354125977, "global_step": 428919, "epoch": 5167} {"train_loss": -26.808197021484375, "global_step": 428920, "epoch": 5167} {"train_loss": -26.722213745117188, "global_step": 428921, "epoch": 5167} {"train_loss": -26.83970069885254, "global_step": 428922, "epoch": 5167} {"train_loss": -27.0903377532959, "global_step": 428923, "epoch": 5167} {"train_loss": -26.720258712768555, "global_step": 428924, "epoch": 5167} {"train_loss": -26.427515029907227, "global_step": 428925, "epoch": 5167} {"train_loss": -26.77608299255371, "global_step": 428926, "epoch": 5167} {"train_loss": -26.809751510620117, "global_step": 428927, "epoch": 5167} {"train_loss": -26.777185440063477, "global_step": 428928, "epoch": 5167} {"train_loss": -26.685501098632812, "global_step": 428929, "epoch": 5167} {"train_loss": -26.99957275390625, "global_step": 428930, "epoch": 5167} {"train_loss": -27.053241729736328, "global_step": 428931, "epoch": 5167} {"train_loss": -26.678327560424805, "global_step": 428932, "epoch": 5167} {"train_loss": -26.589025497436523, "global_step": 428933, "epoch": 5167} {"train_loss": -26.625158309936523, "global_step": 428934, "epoch": 5167} {"train_loss": -26.92286491394043, "global_step": 428935, "epoch": 5167} {"train_loss": -27.007307052612305, "global_step": 428936, "epoch": 5167} {"train_loss": -26.98965835571289, "global_step": 428937, "epoch": 5167} {"train_loss": -26.76171875, "global_step": 428938, "epoch": 5167} {"train_loss": -26.58668327331543, "global_step": 428939, "epoch": 5167} {"train_loss": -27.238525390625, "global_step": 428940, "epoch": 5167} {"train_loss": -26.57083511352539, "global_step": 428941, "epoch": 5167} {"train_loss": -27.109365463256836, "global_step": 428942, "epoch": 5167} {"train_loss": -26.73170342502824, "global_step": 428943, "epoch": 5167, "val_loss": 6568560.0} {"train_loss": -25.86614990234375, "global_step": 428944, "epoch": 5168} {"train_loss": -25.861658096313477, "global_step": 428945, "epoch": 5168} {"train_loss": -26.15915870666504, "global_step": 428946, "epoch": 5168} {"train_loss": -25.872791290283203, "global_step": 428947, "epoch": 5168} {"train_loss": -26.4083194732666, "global_step": 428948, "epoch": 5168} {"train_loss": -25.519611358642578, "global_step": 428949, "epoch": 5168} {"train_loss": -26.567813873291016, "global_step": 428950, "epoch": 5168} {"train_loss": -25.750934600830078, "global_step": 428951, "epoch": 5168} {"train_loss": -26.576618194580078, "global_step": 428952, "epoch": 5168} {"train_loss": -26.593229293823242, "global_step": 428953, "epoch": 5168} {"train_loss": -26.481348037719727, "global_step": 428954, "epoch": 5168} {"train_loss": -26.249067306518555, "global_step": 428955, "epoch": 5168} {"train_loss": -26.3138484954834, "global_step": 428956, "epoch": 5168} {"train_loss": -26.496383666992188, "global_step": 428957, "epoch": 5168} {"train_loss": -26.29701042175293, "global_step": 428958, "epoch": 5168} {"train_loss": -26.700849533081055, "global_step": 428959, "epoch": 5168} {"train_loss": -26.684579849243164, "global_step": 428960, "epoch": 5168} {"train_loss": -26.76214599609375, "global_step": 428961, "epoch": 5168} {"train_loss": -26.790191650390625, "global_step": 428962, "epoch": 5168} {"train_loss": -26.606061935424805, "global_step": 428963, "epoch": 5168} {"train_loss": -26.9525089263916, "global_step": 428964, "epoch": 5168} {"train_loss": -26.49993896484375, "global_step": 428965, "epoch": 5168} {"train_loss": -26.977741241455078, "global_step": 428966, "epoch": 5168} {"train_loss": -26.776586532592773, "global_step": 428967, "epoch": 5168} {"train_loss": -26.67460060119629, "global_step": 428968, "epoch": 5168} {"train_loss": -26.762170791625977, "global_step": 428969, "epoch": 5168} {"train_loss": -26.989044189453125, "global_step": 428970, "epoch": 5168} {"train_loss": -27.235990524291992, "global_step": 428971, "epoch": 5168} {"train_loss": -26.541534423828125, "global_step": 428972, "epoch": 5168} {"train_loss": -27.04395866394043, "global_step": 428973, "epoch": 5168} {"train_loss": -26.809064865112305, "global_step": 428974, "epoch": 5168} {"train_loss": -27.010974884033203, "global_step": 428975, "epoch": 5168} {"train_loss": -26.783477783203125, "global_step": 428976, "epoch": 5168} {"train_loss": -26.929243087768555, "global_step": 428977, "epoch": 5168} {"train_loss": -26.80450439453125, "global_step": 428978, "epoch": 5168} {"train_loss": -26.893131256103516, "global_step": 428979, "epoch": 5168} {"train_loss": -27.31770896911621, "global_step": 428980, "epoch": 5168} {"train_loss": -26.6679630279541, "global_step": 428981, "epoch": 5168} {"train_loss": -27.197248458862305, "global_step": 428982, "epoch": 5168} {"train_loss": -27.05445671081543, "global_step": 428983, "epoch": 5168} {"train_loss": -27.033788681030273, "global_step": 428984, "epoch": 5168} {"train_loss": -27.071353912353516, "global_step": 428985, "epoch": 5168} {"train_loss": -27.035425186157227, "global_step": 428986, "epoch": 5168} {"train_loss": -27.137470245361328, "global_step": 428987, "epoch": 5168} {"train_loss": -27.32044792175293, "global_step": 428988, "epoch": 5168} {"train_loss": -27.237873077392578, "global_step": 428989, "epoch": 5168} {"train_loss": -27.066946029663086, "global_step": 428990, "epoch": 5168} {"train_loss": -27.511402130126953, "global_step": 428991, "epoch": 5168} {"train_loss": -26.91790771484375, "global_step": 428992, "epoch": 5168} {"train_loss": -27.02724266052246, "global_step": 428993, "epoch": 5168} {"train_loss": -27.14847183227539, "global_step": 428994, "epoch": 5168} {"train_loss": -27.43385124206543, "global_step": 428995, "epoch": 5168} {"train_loss": -27.37396240234375, "global_step": 428996, "epoch": 5168} {"train_loss": -26.914514541625977, "global_step": 428997, "epoch": 5168} {"train_loss": -26.270788192749023, "global_step": 428998, "epoch": 5168} {"train_loss": -26.290847778320312, "global_step": 428999, "epoch": 5168} {"train_loss": -26.82173728942871, "global_step": 429000, "epoch": 5168} {"train_loss": -26.473920822143555, "global_step": 429001, "epoch": 5168} {"train_loss": -26.884662628173828, "global_step": 429002, "epoch": 5168} {"train_loss": -26.615814208984375, "global_step": 429003, "epoch": 5168} {"train_loss": -27.00672721862793, "global_step": 429004, "epoch": 5168} {"train_loss": -26.37556266784668, "global_step": 429005, "epoch": 5168} {"train_loss": -26.560272216796875, "global_step": 429006, "epoch": 5168} {"train_loss": -26.21473503112793, "global_step": 429007, "epoch": 5168} {"train_loss": -26.260339736938477, "global_step": 429008, "epoch": 5168} {"train_loss": -26.971250534057617, "global_step": 429009, "epoch": 5168} {"train_loss": -26.24934959411621, "global_step": 429010, "epoch": 5168} {"train_loss": -26.623916625976562, "global_step": 429011, "epoch": 5168} {"train_loss": -26.76177406311035, "global_step": 429012, "epoch": 5168} {"train_loss": -26.622976303100586, "global_step": 429013, "epoch": 5168} {"train_loss": -26.50615882873535, "global_step": 429014, "epoch": 5168} {"train_loss": -26.66585350036621, "global_step": 429015, "epoch": 5168} {"train_loss": -26.343830108642578, "global_step": 429016, "epoch": 5168} {"train_loss": -26.40252113342285, "global_step": 429017, "epoch": 5168} {"train_loss": -26.30281639099121, "global_step": 429018, "epoch": 5168} {"train_loss": -26.641021728515625, "global_step": 429019, "epoch": 5168} {"train_loss": -26.815832138061523, "global_step": 429020, "epoch": 5168} {"train_loss": -26.922317504882812, "global_step": 429021, "epoch": 5168} {"train_loss": -26.463464736938477, "global_step": 429022, "epoch": 5168} {"train_loss": -27.056934356689453, "global_step": 429023, "epoch": 5168} {"train_loss": -26.325101852416992, "global_step": 429024, "epoch": 5168} {"train_loss": -27.034366607666016, "global_step": 429025, "epoch": 5168} {"train_loss": -26.67573901256883, "global_step": 429026, "epoch": 5168, "val_loss": 6532018.0} {"train_loss": -25.978967666625977, "global_step": 429027, "epoch": 5169} {"train_loss": -25.65545082092285, "global_step": 429028, "epoch": 5169} {"train_loss": -25.99505615234375, "global_step": 429029, "epoch": 5169} {"train_loss": -25.82831382751465, "global_step": 429030, "epoch": 5169} {"train_loss": -25.742298126220703, "global_step": 429031, "epoch": 5169} {"train_loss": -25.714527130126953, "global_step": 429032, "epoch": 5169} {"train_loss": -25.54932975769043, "global_step": 429033, "epoch": 5169} {"train_loss": -25.77032470703125, "global_step": 429034, "epoch": 5169} {"train_loss": -25.860355377197266, "global_step": 429035, "epoch": 5169} {"train_loss": -26.08357810974121, "global_step": 429036, "epoch": 5169} {"train_loss": -25.872283935546875, "global_step": 429037, "epoch": 5169} {"train_loss": -26.74342918395996, "global_step": 429038, "epoch": 5169} {"train_loss": -25.992029190063477, "global_step": 429039, "epoch": 5169} {"train_loss": -26.454238891601562, "global_step": 429040, "epoch": 5169} {"train_loss": -25.934003829956055, "global_step": 429041, "epoch": 5169} {"train_loss": -26.59553337097168, "global_step": 429042, "epoch": 5169} {"train_loss": -25.73872184753418, "global_step": 429043, "epoch": 5169} {"train_loss": -26.386945724487305, "global_step": 429044, "epoch": 5169} {"train_loss": -26.006702423095703, "global_step": 429045, "epoch": 5169} {"train_loss": -26.360151290893555, "global_step": 429046, "epoch": 5169} {"train_loss": -25.90301513671875, "global_step": 429047, "epoch": 5169} {"train_loss": -26.11956214904785, "global_step": 429048, "epoch": 5169} {"train_loss": -26.394672393798828, "global_step": 429049, "epoch": 5169} {"train_loss": -26.20277976989746, "global_step": 429050, "epoch": 5169} {"train_loss": -26.619428634643555, "global_step": 429051, "epoch": 5169} {"train_loss": -26.092147827148438, "global_step": 429052, "epoch": 5169} {"train_loss": -26.651880264282227, "global_step": 429053, "epoch": 5169} {"train_loss": -26.451990127563477, "global_step": 429054, "epoch": 5169} {"train_loss": -26.683273315429688, "global_step": 429055, "epoch": 5169} {"train_loss": -26.655027389526367, "global_step": 429056, "epoch": 5169} {"train_loss": -26.60276222229004, "global_step": 429057, "epoch": 5169} {"train_loss": -26.886465072631836, "global_step": 429058, "epoch": 5169} {"train_loss": -26.56050682067871, "global_step": 429059, "epoch": 5169} {"train_loss": -26.74471092224121, "global_step": 429060, "epoch": 5169} {"train_loss": -26.806324005126953, "global_step": 429061, "epoch": 5169} {"train_loss": -26.6817684173584, "global_step": 429062, "epoch": 5169} {"train_loss": -26.768768310546875, "global_step": 429063, "epoch": 5169} {"train_loss": -26.823516845703125, "global_step": 429064, "epoch": 5169} {"train_loss": -26.739551544189453, "global_step": 429065, "epoch": 5169} {"train_loss": -26.783405303955078, "global_step": 429066, "epoch": 5169} {"train_loss": -26.68897819519043, "global_step": 429067, "epoch": 5169} {"train_loss": -26.490619659423828, "global_step": 429068, "epoch": 5169} {"train_loss": -26.812225341796875, "global_step": 429069, "epoch": 5169} {"train_loss": -26.268997192382812, "global_step": 429070, "epoch": 5169} {"train_loss": -26.548187255859375, "global_step": 429071, "epoch": 5169} {"train_loss": -26.782983779907227, "global_step": 429072, "epoch": 5169} {"train_loss": -26.515045166015625, "global_step": 429073, "epoch": 5169} {"train_loss": -26.885608673095703, "global_step": 429074, "epoch": 5169} {"train_loss": -26.709339141845703, "global_step": 429075, "epoch": 5169} {"train_loss": -26.8211727142334, "global_step": 429076, "epoch": 5169} {"train_loss": -26.80791664123535, "global_step": 429077, "epoch": 5169} {"train_loss": -27.472875595092773, "global_step": 429078, "epoch": 5169} {"train_loss": -26.852819442749023, "global_step": 429079, "epoch": 5169} {"train_loss": -26.933691024780273, "global_step": 429080, "epoch": 5169} {"train_loss": -26.797388076782227, "global_step": 429081, "epoch": 5169} {"train_loss": -26.7478084564209, "global_step": 429082, "epoch": 5169} {"train_loss": -26.732166290283203, "global_step": 429083, "epoch": 5169} {"train_loss": -26.7134952545166, "global_step": 429084, "epoch": 5169} {"train_loss": -27.282072067260742, "global_step": 429085, "epoch": 5169} {"train_loss": -26.905603408813477, "global_step": 429086, "epoch": 5169} {"train_loss": -26.865320205688477, "global_step": 429087, "epoch": 5169} {"train_loss": -26.802764892578125, "global_step": 429088, "epoch": 5169} {"train_loss": -26.840164184570312, "global_step": 429089, "epoch": 5169} {"train_loss": -26.956851959228516, "global_step": 429090, "epoch": 5169} {"train_loss": -27.16061782836914, "global_step": 429091, "epoch": 5169} {"train_loss": -26.98583984375, "global_step": 429092, "epoch": 5169} {"train_loss": -26.878950119018555, "global_step": 429093, "epoch": 5169} {"train_loss": -27.11859703063965, "global_step": 429094, "epoch": 5169} {"train_loss": -26.60141944885254, "global_step": 429095, "epoch": 5169} {"train_loss": -26.787961959838867, "global_step": 429096, "epoch": 5169} {"train_loss": -26.994842529296875, "global_step": 429097, "epoch": 5169} {"train_loss": -26.82254981994629, "global_step": 429098, "epoch": 5169} {"train_loss": -26.610000610351562, "global_step": 429099, "epoch": 5169} {"train_loss": -26.942480087280273, "global_step": 429100, "epoch": 5169} {"train_loss": -26.992334365844727, "global_step": 429101, "epoch": 5169} {"train_loss": -26.50623893737793, "global_step": 429102, "epoch": 5169} {"train_loss": -27.19403648376465, "global_step": 429103, "epoch": 5169} {"train_loss": -26.545469284057617, "global_step": 429104, "epoch": 5169} {"train_loss": -26.5577392578125, "global_step": 429105, "epoch": 5169} {"train_loss": -26.919397354125977, "global_step": 429106, "epoch": 5169} {"train_loss": -26.963760375976562, "global_step": 429107, "epoch": 5169} {"train_loss": -26.852020263671875, "global_step": 429108, "epoch": 5169} {"train_loss": -26.561982327196972, "global_step": 429109, "epoch": 5169, "val_loss": 6530459.0} {"train_loss": -25.779529571533203, "global_step": 429110, "epoch": 5170} {"train_loss": -25.3422794342041, "global_step": 429111, "epoch": 5170} {"train_loss": -26.121313095092773, "global_step": 429112, "epoch": 5170} {"train_loss": -25.709314346313477, "global_step": 429113, "epoch": 5170} {"train_loss": -26.462926864624023, "global_step": 429114, "epoch": 5170} {"train_loss": -25.635196685791016, "global_step": 429115, "epoch": 5170} {"train_loss": -26.76547622680664, "global_step": 429116, "epoch": 5170} {"train_loss": -26.195688247680664, "global_step": 429117, "epoch": 5170} {"train_loss": -27.01395606994629, "global_step": 429118, "epoch": 5170} {"train_loss": -26.109933853149414, "global_step": 429119, "epoch": 5170} {"train_loss": -26.517200469970703, "global_step": 429120, "epoch": 5170} {"train_loss": -26.92850112915039, "global_step": 429121, "epoch": 5170} {"train_loss": -26.226337432861328, "global_step": 429122, "epoch": 5170} {"train_loss": -26.549463272094727, "global_step": 429123, "epoch": 5170} {"train_loss": -26.598119735717773, "global_step": 429124, "epoch": 5170} {"train_loss": -26.22641372680664, "global_step": 429125, "epoch": 5170} {"train_loss": -26.839094161987305, "global_step": 429126, "epoch": 5170} {"train_loss": -27.03299331665039, "global_step": 429127, "epoch": 5170} {"train_loss": -26.6666259765625, "global_step": 429128, "epoch": 5170} {"train_loss": -26.564794540405273, "global_step": 429129, "epoch": 5170} {"train_loss": -26.966053009033203, "global_step": 429130, "epoch": 5170} {"train_loss": -26.816253662109375, "global_step": 429131, "epoch": 5170} {"train_loss": -26.994964599609375, "global_step": 429132, "epoch": 5170} {"train_loss": -26.471349716186523, "global_step": 429133, "epoch": 5170} {"train_loss": -26.612356185913086, "global_step": 429134, "epoch": 5170} {"train_loss": -26.894489288330078, "global_step": 429135, "epoch": 5170} {"train_loss": -26.7110538482666, "global_step": 429136, "epoch": 5170} {"train_loss": -26.91676139831543, "global_step": 429137, "epoch": 5170} {"train_loss": -26.854145050048828, "global_step": 429138, "epoch": 5170} {"train_loss": -26.783248901367188, "global_step": 429139, "epoch": 5170} {"train_loss": -26.82844352722168, "global_step": 429140, "epoch": 5170} {"train_loss": -26.59095573425293, "global_step": 429141, "epoch": 5170} {"train_loss": -26.865768432617188, "global_step": 429142, "epoch": 5170} {"train_loss": -26.9232120513916, "global_step": 429143, "epoch": 5170} {"train_loss": -26.864639282226562, "global_step": 429144, "epoch": 5170} {"train_loss": -26.89163589477539, "global_step": 429145, "epoch": 5170} {"train_loss": -26.997638702392578, "global_step": 429146, "epoch": 5170} {"train_loss": -27.246084213256836, "global_step": 429147, "epoch": 5170} {"train_loss": -26.80914306640625, "global_step": 429148, "epoch": 5170} {"train_loss": -26.801481246948242, "global_step": 429149, "epoch": 5170} {"train_loss": -27.345075607299805, "global_step": 429150, "epoch": 5170} {"train_loss": -26.614614486694336, "global_step": 429151, "epoch": 5170} {"train_loss": -26.748144149780273, "global_step": 429152, "epoch": 5170} {"train_loss": -26.606842041015625, "global_step": 429153, "epoch": 5170} {"train_loss": -26.54083824157715, "global_step": 429154, "epoch": 5170} {"train_loss": -26.843103408813477, "global_step": 429155, "epoch": 5170} {"train_loss": -26.89747428894043, "global_step": 429156, "epoch": 5170} {"train_loss": -26.750659942626953, "global_step": 429157, "epoch": 5170} {"train_loss": -26.933752059936523, "global_step": 429158, "epoch": 5170} {"train_loss": -27.12603187561035, "global_step": 429159, "epoch": 5170} {"train_loss": -26.870615005493164, "global_step": 429160, "epoch": 5170} {"train_loss": -27.019296646118164, "global_step": 429161, "epoch": 5170} {"train_loss": -27.082300186157227, "global_step": 429162, "epoch": 5170} {"train_loss": -26.709497451782227, "global_step": 429163, "epoch": 5170} {"train_loss": -26.673368453979492, "global_step": 429164, "epoch": 5170} {"train_loss": -26.83015251159668, "global_step": 429165, "epoch": 5170} {"train_loss": -26.626028060913086, "global_step": 429166, "epoch": 5170} {"train_loss": -26.84700584411621, "global_step": 429167, "epoch": 5170} {"train_loss": -26.878326416015625, "global_step": 429168, "epoch": 5170} {"train_loss": -26.674001693725586, "global_step": 429169, "epoch": 5170} {"train_loss": -26.82124137878418, "global_step": 429170, "epoch": 5170} {"train_loss": -27.081897735595703, "global_step": 429171, "epoch": 5170} {"train_loss": -27.188720703125, "global_step": 429172, "epoch": 5170} {"train_loss": -26.817707061767578, "global_step": 429173, "epoch": 5170} {"train_loss": -26.480634689331055, "global_step": 429174, "epoch": 5170} {"train_loss": -26.74029541015625, "global_step": 429175, "epoch": 5170} {"train_loss": -26.173751831054688, "global_step": 429176, "epoch": 5170} {"train_loss": -26.68117332458496, "global_step": 429177, "epoch": 5170} {"train_loss": -26.66427993774414, "global_step": 429178, "epoch": 5170} {"train_loss": -26.629291534423828, "global_step": 429179, "epoch": 5170} {"train_loss": -26.565771102905273, "global_step": 429180, "epoch": 5170} {"train_loss": -26.210309982299805, "global_step": 429181, "epoch": 5170} {"train_loss": -26.87738609313965, "global_step": 429182, "epoch": 5170} {"train_loss": -26.59226417541504, "global_step": 429183, "epoch": 5170} {"train_loss": -26.42481803894043, "global_step": 429184, "epoch": 5170} {"train_loss": -26.909692764282227, "global_step": 429185, "epoch": 5170} {"train_loss": -26.268491744995117, "global_step": 429186, "epoch": 5170} {"train_loss": -26.617206573486328, "global_step": 429187, "epoch": 5170} {"train_loss": -26.416309356689453, "global_step": 429188, "epoch": 5170} {"train_loss": -26.695524215698242, "global_step": 429189, "epoch": 5170} {"train_loss": -26.852741241455078, "global_step": 429190, "epoch": 5170} {"train_loss": -26.241361618041992, "global_step": 429191, "epoch": 5170} {"train_loss": -26.672772074320232, "global_step": 429192, "epoch": 5170, "val_loss": 6706432.5} {"train_loss": -26.627973556518555, "global_step": 429193, "epoch": 5171} {"train_loss": -26.316192626953125, "global_step": 429194, "epoch": 5171} {"train_loss": -26.470233917236328, "global_step": 429195, "epoch": 5171} {"train_loss": -26.64759635925293, "global_step": 429196, "epoch": 5171} {"train_loss": -26.321691513061523, "global_step": 429197, "epoch": 5171} {"train_loss": -26.8541259765625, "global_step": 429198, "epoch": 5171} {"train_loss": -26.49702262878418, "global_step": 429199, "epoch": 5171} {"train_loss": -26.341276168823242, "global_step": 429200, "epoch": 5171} {"train_loss": -26.768701553344727, "global_step": 429201, "epoch": 5171} {"train_loss": -26.850875854492188, "global_step": 429202, "epoch": 5171} {"train_loss": -26.487714767456055, "global_step": 429203, "epoch": 5171} {"train_loss": -27.03358268737793, "global_step": 429204, "epoch": 5171} {"train_loss": -26.869836807250977, "global_step": 429205, "epoch": 5171} {"train_loss": -26.6691951751709, "global_step": 429206, "epoch": 5171} {"train_loss": -27.069311141967773, "global_step": 429207, "epoch": 5171} {"train_loss": -26.89349937438965, "global_step": 429208, "epoch": 5171} {"train_loss": -26.662708282470703, "global_step": 429209, "epoch": 5171} {"train_loss": -27.030080795288086, "global_step": 429210, "epoch": 5171} {"train_loss": -26.766691207885742, "global_step": 429211, "epoch": 5171} {"train_loss": -26.96604347229004, "global_step": 429212, "epoch": 5171} {"train_loss": -26.80866050720215, "global_step": 429213, "epoch": 5171} {"train_loss": -26.9688777923584, "global_step": 429214, "epoch": 5171} {"train_loss": -26.673675537109375, "global_step": 429215, "epoch": 5171} {"train_loss": -27.213623046875, "global_step": 429216, "epoch": 5171} {"train_loss": -26.869977951049805, "global_step": 429217, "epoch": 5171} {"train_loss": -27.00129508972168, "global_step": 429218, "epoch": 5171} {"train_loss": -26.88274574279785, "global_step": 429219, "epoch": 5171} {"train_loss": -27.13572120666504, "global_step": 429220, "epoch": 5171} {"train_loss": -27.065479278564453, "global_step": 429221, "epoch": 5171} {"train_loss": -27.008502960205078, "global_step": 429222, "epoch": 5171} {"train_loss": -26.99140739440918, "global_step": 429223, "epoch": 5171} {"train_loss": -26.96195411682129, "global_step": 429224, "epoch": 5171} {"train_loss": -27.16309928894043, "global_step": 429225, "epoch": 5171} {"train_loss": -27.036270141601562, "global_step": 429226, "epoch": 5171} {"train_loss": -27.281564712524414, "global_step": 429227, "epoch": 5171} {"train_loss": -27.222501754760742, "global_step": 429228, "epoch": 5171} {"train_loss": -27.130796432495117, "global_step": 429229, "epoch": 5171} {"train_loss": -27.04903221130371, "global_step": 429230, "epoch": 5171} {"train_loss": -27.255460739135742, "global_step": 429231, "epoch": 5171} {"train_loss": -26.73565673828125, "global_step": 429232, "epoch": 5171} {"train_loss": -27.16725730895996, "global_step": 429233, "epoch": 5171} {"train_loss": -26.972257614135742, "global_step": 429234, "epoch": 5171} {"train_loss": -27.096837997436523, "global_step": 429235, "epoch": 5171} {"train_loss": -26.902048110961914, "global_step": 429236, "epoch": 5171} {"train_loss": -26.9666748046875, "global_step": 429237, "epoch": 5171} {"train_loss": -27.571563720703125, "global_step": 429238, "epoch": 5171} {"train_loss": -26.644601821899414, "global_step": 429239, "epoch": 5171} {"train_loss": -27.082082748413086, "global_step": 429240, "epoch": 5171} {"train_loss": -27.039350509643555, "global_step": 429241, "epoch": 5171} {"train_loss": -26.67244529724121, "global_step": 429242, "epoch": 5171} {"train_loss": -26.636960983276367, "global_step": 429243, "epoch": 5171} {"train_loss": -26.95273780822754, "global_step": 429244, "epoch": 5171} {"train_loss": -26.390363693237305, "global_step": 429245, "epoch": 5171} {"train_loss": -25.524831771850586, "global_step": 429246, "epoch": 5171} {"train_loss": -24.627017974853516, "global_step": 429247, "epoch": 5171} {"train_loss": -25.474044799804688, "global_step": 429248, "epoch": 5171} {"train_loss": -26.419782638549805, "global_step": 429249, "epoch": 5171} {"train_loss": -26.17840003967285, "global_step": 429250, "epoch": 5171} {"train_loss": -26.391386032104492, "global_step": 429251, "epoch": 5171} {"train_loss": -26.431299209594727, "global_step": 429252, "epoch": 5171} {"train_loss": -26.876819610595703, "global_step": 429253, "epoch": 5171} {"train_loss": -26.527088165283203, "global_step": 429254, "epoch": 5171} {"train_loss": -26.72498893737793, "global_step": 429255, "epoch": 5171} {"train_loss": -26.443775177001953, "global_step": 429256, "epoch": 5171} {"train_loss": -26.732934951782227, "global_step": 429257, "epoch": 5171} {"train_loss": -26.495914459228516, "global_step": 429258, "epoch": 5171} {"train_loss": -26.7335262298584, "global_step": 429259, "epoch": 5171} {"train_loss": -26.55126953125, "global_step": 429260, "epoch": 5171} {"train_loss": -26.700855255126953, "global_step": 429261, "epoch": 5171} {"train_loss": -26.870275497436523, "global_step": 429262, "epoch": 5171} {"train_loss": -27.061864852905273, "global_step": 429263, "epoch": 5171} {"train_loss": -26.597015380859375, "global_step": 429264, "epoch": 5171} {"train_loss": -27.020166397094727, "global_step": 429265, "epoch": 5171} {"train_loss": -26.6503963470459, "global_step": 429266, "epoch": 5171} {"train_loss": -26.696435928344727, "global_step": 429267, "epoch": 5171} {"train_loss": -26.433521270751953, "global_step": 429268, "epoch": 5171} {"train_loss": -27.07818603515625, "global_step": 429269, "epoch": 5171} {"train_loss": -26.47444725036621, "global_step": 429270, "epoch": 5171} {"train_loss": -26.964630126953125, "global_step": 429271, "epoch": 5171} {"train_loss": -26.710412979125977, "global_step": 429272, "epoch": 5171} {"train_loss": -27.041156768798828, "global_step": 429273, "epoch": 5171} {"train_loss": -26.538419723510742, "global_step": 429274, "epoch": 5171} {"train_loss": -26.735549559076148, "global_step": 429275, "epoch": 5171, "val_loss": 6578857.5} {"train_loss": -25.864826202392578, "global_step": 429276, "epoch": 5172} {"train_loss": -25.33321189880371, "global_step": 429277, "epoch": 5172} {"train_loss": -26.10318946838379, "global_step": 429278, "epoch": 5172} {"train_loss": -25.805561065673828, "global_step": 429279, "epoch": 5172} {"train_loss": -25.644617080688477, "global_step": 429280, "epoch": 5172} {"train_loss": -26.67022132873535, "global_step": 429281, "epoch": 5172} {"train_loss": -25.86456298828125, "global_step": 429282, "epoch": 5172} {"train_loss": -26.18674659729004, "global_step": 429283, "epoch": 5172} {"train_loss": -26.241140365600586, "global_step": 429284, "epoch": 5172} {"train_loss": -26.2838191986084, "global_step": 429285, "epoch": 5172} {"train_loss": -26.03273582458496, "global_step": 429286, "epoch": 5172} {"train_loss": -26.040252685546875, "global_step": 429287, "epoch": 5172} {"train_loss": -26.342792510986328, "global_step": 429288, "epoch": 5172} {"train_loss": -26.496484756469727, "global_step": 429289, "epoch": 5172} {"train_loss": -26.407373428344727, "global_step": 429290, "epoch": 5172} {"train_loss": -26.1157169342041, "global_step": 429291, "epoch": 5172} {"train_loss": -26.61614990234375, "global_step": 429292, "epoch": 5172} {"train_loss": -26.488468170166016, "global_step": 429293, "epoch": 5172} {"train_loss": -26.248188018798828, "global_step": 429294, "epoch": 5172} {"train_loss": -26.34379005432129, "global_step": 429295, "epoch": 5172} {"train_loss": -26.638193130493164, "global_step": 429296, "epoch": 5172} {"train_loss": -26.22330665588379, "global_step": 429297, "epoch": 5172} {"train_loss": -26.6805477142334, "global_step": 429298, "epoch": 5172} {"train_loss": -26.7836856842041, "global_step": 429299, "epoch": 5172} {"train_loss": -26.726926803588867, "global_step": 429300, "epoch": 5172} {"train_loss": -26.77634620666504, "global_step": 429301, "epoch": 5172} {"train_loss": -26.529449462890625, "global_step": 429302, "epoch": 5172} {"train_loss": -26.66436195373535, "global_step": 429303, "epoch": 5172} {"train_loss": -26.824914932250977, "global_step": 429304, "epoch": 5172} {"train_loss": -26.81879234313965, "global_step": 429305, "epoch": 5172} {"train_loss": -26.88205909729004, "global_step": 429306, "epoch": 5172} {"train_loss": -26.422910690307617, "global_step": 429307, "epoch": 5172} {"train_loss": -26.732343673706055, "global_step": 429308, "epoch": 5172} {"train_loss": -26.98528480529785, "global_step": 429309, "epoch": 5172} {"train_loss": -26.680267333984375, "global_step": 429310, "epoch": 5172} {"train_loss": -26.89013671875, "global_step": 429311, "epoch": 5172} {"train_loss": -26.780744552612305, "global_step": 429312, "epoch": 5172} {"train_loss": -26.88446044921875, "global_step": 429313, "epoch": 5172} {"train_loss": -27.053024291992188, "global_step": 429314, "epoch": 5172} {"train_loss": -26.921890258789062, "global_step": 429315, "epoch": 5172} {"train_loss": -26.71381950378418, "global_step": 429316, "epoch": 5172} {"train_loss": -26.849180221557617, "global_step": 429317, "epoch": 5172} {"train_loss": -26.89446449279785, "global_step": 429318, "epoch": 5172} {"train_loss": -26.683582305908203, "global_step": 429319, "epoch": 5172} {"train_loss": -26.842145919799805, "global_step": 429320, "epoch": 5172} {"train_loss": -26.673080444335938, "global_step": 429321, "epoch": 5172} {"train_loss": -27.01019859313965, "global_step": 429322, "epoch": 5172} {"train_loss": -26.759658813476562, "global_step": 429323, "epoch": 5172} {"train_loss": -26.954086303710938, "global_step": 429324, "epoch": 5172} {"train_loss": -26.538909912109375, "global_step": 429325, "epoch": 5172} {"train_loss": -26.731313705444336, "global_step": 429326, "epoch": 5172} {"train_loss": -26.67191505432129, "global_step": 429327, "epoch": 5172} {"train_loss": -26.925800323486328, "global_step": 429328, "epoch": 5172} {"train_loss": -27.259429931640625, "global_step": 429329, "epoch": 5172} {"train_loss": -27.48465919494629, "global_step": 429330, "epoch": 5172} {"train_loss": -27.0051212310791, "global_step": 429331, "epoch": 5172} {"train_loss": -27.0977783203125, "global_step": 429332, "epoch": 5172} {"train_loss": -26.95597267150879, "global_step": 429333, "epoch": 5172} {"train_loss": -27.1292781829834, "global_step": 429334, "epoch": 5172} {"train_loss": -26.947446823120117, "global_step": 429335, "epoch": 5172} {"train_loss": -26.905597686767578, "global_step": 429336, "epoch": 5172} {"train_loss": -26.675689697265625, "global_step": 429337, "epoch": 5172} {"train_loss": -26.851749420166016, "global_step": 429338, "epoch": 5172} {"train_loss": -26.995649337768555, "global_step": 429339, "epoch": 5172} {"train_loss": -26.932891845703125, "global_step": 429340, "epoch": 5172} {"train_loss": -26.772430419921875, "global_step": 429341, "epoch": 5172} {"train_loss": -26.613061904907227, "global_step": 429342, "epoch": 5172} {"train_loss": -26.822668075561523, "global_step": 429343, "epoch": 5172} {"train_loss": -26.625268936157227, "global_step": 429344, "epoch": 5172} {"train_loss": -26.783477783203125, "global_step": 429345, "epoch": 5172} {"train_loss": -27.117834091186523, "global_step": 429346, "epoch": 5172} {"train_loss": -26.843505859375, "global_step": 429347, "epoch": 5172} {"train_loss": -26.87688636779785, "global_step": 429348, "epoch": 5172} {"train_loss": -26.888599395751953, "global_step": 429349, "epoch": 5172} {"train_loss": -26.365636825561523, "global_step": 429350, "epoch": 5172} {"train_loss": -26.68219566345215, "global_step": 429351, "epoch": 5172} {"train_loss": -26.888425827026367, "global_step": 429352, "epoch": 5172} {"train_loss": -27.036436080932617, "global_step": 429353, "epoch": 5172} {"train_loss": -26.682424545288086, "global_step": 429354, "epoch": 5172} {"train_loss": -26.834442138671875, "global_step": 429355, "epoch": 5172} {"train_loss": -26.821002960205078, "global_step": 429356, "epoch": 5172} {"train_loss": -26.308700561523438, "global_step": 429357, "epoch": 5172} {"train_loss": -26.650022552674073, "global_step": 429358, "epoch": 5172, "val_loss": 6633321.0} {"train_loss": -25.867185592651367, "global_step": 429359, "epoch": 5173} {"train_loss": -25.58736801147461, "global_step": 429360, "epoch": 5173} {"train_loss": -26.12660026550293, "global_step": 429361, "epoch": 5173} {"train_loss": -26.23309326171875, "global_step": 429362, "epoch": 5173} {"train_loss": -26.133209228515625, "global_step": 429363, "epoch": 5173} {"train_loss": -26.390066146850586, "global_step": 429364, "epoch": 5173} {"train_loss": -26.422391891479492, "global_step": 429365, "epoch": 5173} {"train_loss": -26.281538009643555, "global_step": 429366, "epoch": 5173} {"train_loss": -25.825855255126953, "global_step": 429367, "epoch": 5173} {"train_loss": -26.44447135925293, "global_step": 429368, "epoch": 5173} {"train_loss": -26.534482955932617, "global_step": 429369, "epoch": 5173} {"train_loss": -26.54050064086914, "global_step": 429370, "epoch": 5173} {"train_loss": -26.279251098632812, "global_step": 429371, "epoch": 5173} {"train_loss": -26.289411544799805, "global_step": 429372, "epoch": 5173} {"train_loss": -26.520715713500977, "global_step": 429373, "epoch": 5173} {"train_loss": -26.482751846313477, "global_step": 429374, "epoch": 5173} {"train_loss": -26.844839096069336, "global_step": 429375, "epoch": 5173} {"train_loss": -26.39167594909668, "global_step": 429376, "epoch": 5173} {"train_loss": -26.74905776977539, "global_step": 429377, "epoch": 5173} {"train_loss": -26.47294044494629, "global_step": 429378, "epoch": 5173} {"train_loss": -26.435089111328125, "global_step": 429379, "epoch": 5173} {"train_loss": -26.58243179321289, "global_step": 429380, "epoch": 5173} {"train_loss": -26.41389274597168, "global_step": 429381, "epoch": 5173} {"train_loss": -26.61370277404785, "global_step": 429382, "epoch": 5173} {"train_loss": -26.508359909057617, "global_step": 429383, "epoch": 5173} {"train_loss": -26.651016235351562, "global_step": 429384, "epoch": 5173} {"train_loss": -26.70014762878418, "global_step": 429385, "epoch": 5173} {"train_loss": -26.470245361328125, "global_step": 429386, "epoch": 5173} {"train_loss": -26.44074821472168, "global_step": 429387, "epoch": 5173} {"train_loss": -26.870756149291992, "global_step": 429388, "epoch": 5173} {"train_loss": -26.192890167236328, "global_step": 429389, "epoch": 5173} {"train_loss": -26.815505981445312, "global_step": 429390, "epoch": 5173} {"train_loss": -27.075698852539062, "global_step": 429391, "epoch": 5173} {"train_loss": -26.9226016998291, "global_step": 429392, "epoch": 5173} {"train_loss": -26.683496475219727, "global_step": 429393, "epoch": 5173} {"train_loss": -26.946645736694336, "global_step": 429394, "epoch": 5173} {"train_loss": -27.16402244567871, "global_step": 429395, "epoch": 5173} {"train_loss": -27.13785743713379, "global_step": 429396, "epoch": 5173} {"train_loss": -27.273117065429688, "global_step": 429397, "epoch": 5173} {"train_loss": -27.275440216064453, "global_step": 429398, "epoch": 5173} {"train_loss": -26.89800453186035, "global_step": 429399, "epoch": 5173} {"train_loss": -26.98566246032715, "global_step": 429400, "epoch": 5173} {"train_loss": -27.174041748046875, "global_step": 429401, "epoch": 5173} {"train_loss": -26.95174217224121, "global_step": 429402, "epoch": 5173} {"train_loss": -26.837255477905273, "global_step": 429403, "epoch": 5173} {"train_loss": -27.315515518188477, "global_step": 429404, "epoch": 5173} {"train_loss": -27.170740127563477, "global_step": 429405, "epoch": 5173} {"train_loss": -27.166412353515625, "global_step": 429406, "epoch": 5173} {"train_loss": -27.379505157470703, "global_step": 429407, "epoch": 5173} {"train_loss": -27.226293563842773, "global_step": 429408, "epoch": 5173} {"train_loss": -27.254657745361328, "global_step": 429409, "epoch": 5173} {"train_loss": -27.358631134033203, "global_step": 429410, "epoch": 5173} {"train_loss": -27.334949493408203, "global_step": 429411, "epoch": 5173} {"train_loss": -27.2091007232666, "global_step": 429412, "epoch": 5173} {"train_loss": -26.904348373413086, "global_step": 429413, "epoch": 5173} {"train_loss": -26.399763107299805, "global_step": 429414, "epoch": 5173} {"train_loss": -27.098926544189453, "global_step": 429415, "epoch": 5173} {"train_loss": -26.881317138671875, "global_step": 429416, "epoch": 5173} {"train_loss": -26.35854148864746, "global_step": 429417, "epoch": 5173} {"train_loss": -26.740026473999023, "global_step": 429418, "epoch": 5173} {"train_loss": -26.455625534057617, "global_step": 429419, "epoch": 5173} {"train_loss": -26.690725326538086, "global_step": 429420, "epoch": 5173} {"train_loss": -26.192270278930664, "global_step": 429421, "epoch": 5173} {"train_loss": -27.057910919189453, "global_step": 429422, "epoch": 5173} {"train_loss": -26.651294708251953, "global_step": 429423, "epoch": 5173} {"train_loss": -26.30396842956543, "global_step": 429424, "epoch": 5173} {"train_loss": -26.218286514282227, "global_step": 429425, "epoch": 5173} {"train_loss": -26.834630966186523, "global_step": 429426, "epoch": 5173} {"train_loss": -26.494842529296875, "global_step": 429427, "epoch": 5173} {"train_loss": -26.121313095092773, "global_step": 429428, "epoch": 5173} {"train_loss": -26.478368759155273, "global_step": 429429, "epoch": 5173} {"train_loss": -26.80267906188965, "global_step": 429430, "epoch": 5173} {"train_loss": -26.507001876831055, "global_step": 429431, "epoch": 5173} {"train_loss": -26.828048706054688, "global_step": 429432, "epoch": 5173} {"train_loss": -26.92897605895996, "global_step": 429433, "epoch": 5173} {"train_loss": -26.8474178314209, "global_step": 429434, "epoch": 5173} {"train_loss": -26.84697914123535, "global_step": 429435, "epoch": 5173} {"train_loss": -26.615966796875, "global_step": 429436, "epoch": 5173} {"train_loss": -26.936065673828125, "global_step": 429437, "epoch": 5173} {"train_loss": -26.550989151000977, "global_step": 429438, "epoch": 5173} {"train_loss": -26.163867950439453, "global_step": 429439, "epoch": 5173} {"train_loss": -26.700794219970703, "global_step": 429440, "epoch": 5173} {"train_loss": -26.67620550868023, "global_step": 429441, "epoch": 5173, "val_loss": 6557701.0} {"train_loss": -25.997589111328125, "global_step": 429442, "epoch": 5174} {"train_loss": -26.195331573486328, "global_step": 429443, "epoch": 5174} {"train_loss": -26.16045570373535, "global_step": 429444, "epoch": 5174} {"train_loss": -26.61578941345215, "global_step": 429445, "epoch": 5174} {"train_loss": -26.438650131225586, "global_step": 429446, "epoch": 5174} {"train_loss": -25.790542602539062, "global_step": 429447, "epoch": 5174} {"train_loss": -26.398212432861328, "global_step": 429448, "epoch": 5174} {"train_loss": -26.20651626586914, "global_step": 429449, "epoch": 5174} {"train_loss": -26.360998153686523, "global_step": 429450, "epoch": 5174} {"train_loss": -26.185306549072266, "global_step": 429451, "epoch": 5174} {"train_loss": -26.67072105407715, "global_step": 429452, "epoch": 5174} {"train_loss": -26.470458984375, "global_step": 429453, "epoch": 5174} {"train_loss": -27.102766036987305, "global_step": 429454, "epoch": 5174} {"train_loss": -26.695287704467773, "global_step": 429455, "epoch": 5174} {"train_loss": -26.76094627380371, "global_step": 429456, "epoch": 5174} {"train_loss": -26.751798629760742, "global_step": 429457, "epoch": 5174} {"train_loss": -26.7521915435791, "global_step": 429458, "epoch": 5174} {"train_loss": -26.837818145751953, "global_step": 429459, "epoch": 5174} {"train_loss": -26.843402862548828, "global_step": 429460, "epoch": 5174} {"train_loss": -26.823719024658203, "global_step": 429461, "epoch": 5174} {"train_loss": -26.49203872680664, "global_step": 429462, "epoch": 5174} {"train_loss": -26.676721572875977, "global_step": 429463, "epoch": 5174} {"train_loss": -26.74713134765625, "global_step": 429464, "epoch": 5174} {"train_loss": -26.737451553344727, "global_step": 429465, "epoch": 5174} {"train_loss": -27.0616455078125, "global_step": 429466, "epoch": 5174} {"train_loss": -26.858739852905273, "global_step": 429467, "epoch": 5174} {"train_loss": -26.630277633666992, "global_step": 429468, "epoch": 5174} {"train_loss": -26.42719078063965, "global_step": 429469, "epoch": 5174} {"train_loss": -26.877405166625977, "global_step": 429470, "epoch": 5174} {"train_loss": -27.3803768157959, "global_step": 429471, "epoch": 5174} {"train_loss": -27.06926918029785, "global_step": 429472, "epoch": 5174} {"train_loss": -26.8203067779541, "global_step": 429473, "epoch": 5174} {"train_loss": -26.9851016998291, "global_step": 429474, "epoch": 5174} {"train_loss": -27.19208335876465, "global_step": 429475, "epoch": 5174} {"train_loss": -26.739606857299805, "global_step": 429476, "epoch": 5174} {"train_loss": -27.035154342651367, "global_step": 429477, "epoch": 5174} {"train_loss": -27.199193954467773, "global_step": 429478, "epoch": 5174} {"train_loss": -26.9034423828125, "global_step": 429479, "epoch": 5174} {"train_loss": -27.32789421081543, "global_step": 429480, "epoch": 5174} {"train_loss": -26.586090087890625, "global_step": 429481, "epoch": 5174} {"train_loss": -26.88641357421875, "global_step": 429482, "epoch": 5174} {"train_loss": -27.074390411376953, "global_step": 429483, "epoch": 5174} {"train_loss": -26.925827026367188, "global_step": 429484, "epoch": 5174} {"train_loss": -26.744787216186523, "global_step": 429485, "epoch": 5174} {"train_loss": -27.103124618530273, "global_step": 429486, "epoch": 5174} {"train_loss": -26.885595321655273, "global_step": 429487, "epoch": 5174} {"train_loss": -27.019824981689453, "global_step": 429488, "epoch": 5174} {"train_loss": -27.2498722076416, "global_step": 429489, "epoch": 5174} {"train_loss": -27.11298942565918, "global_step": 429490, "epoch": 5174} {"train_loss": -26.813764572143555, "global_step": 429491, "epoch": 5174} {"train_loss": -27.043973922729492, "global_step": 429492, "epoch": 5174} {"train_loss": -26.52699089050293, "global_step": 429493, "epoch": 5174} {"train_loss": -26.81987953186035, "global_step": 429494, "epoch": 5174} {"train_loss": -27.094940185546875, "global_step": 429495, "epoch": 5174} {"train_loss": -26.8289737701416, "global_step": 429496, "epoch": 5174} {"train_loss": -26.73370933532715, "global_step": 429497, "epoch": 5174} {"train_loss": -27.08082389831543, "global_step": 429498, "epoch": 5174} {"train_loss": -27.150833129882812, "global_step": 429499, "epoch": 5174} {"train_loss": -27.055877685546875, "global_step": 429500, "epoch": 5174} {"train_loss": -26.480268478393555, "global_step": 429501, "epoch": 5174} {"train_loss": -26.7287654876709, "global_step": 429502, "epoch": 5174} {"train_loss": -27.154260635375977, "global_step": 429503, "epoch": 5174} {"train_loss": -26.681442260742188, "global_step": 429504, "epoch": 5174} {"train_loss": -26.259597778320312, "global_step": 429505, "epoch": 5174} {"train_loss": -26.69552993774414, "global_step": 429506, "epoch": 5174} {"train_loss": -26.9454345703125, "global_step": 429507, "epoch": 5174} {"train_loss": -27.00569725036621, "global_step": 429508, "epoch": 5174} {"train_loss": -26.39497947692871, "global_step": 429509, "epoch": 5174} {"train_loss": -26.2247314453125, "global_step": 429510, "epoch": 5174} {"train_loss": -26.713241577148438, "global_step": 429511, "epoch": 5174} {"train_loss": -27.0319881439209, "global_step": 429512, "epoch": 5174} {"train_loss": -26.856048583984375, "global_step": 429513, "epoch": 5174} {"train_loss": -26.880781173706055, "global_step": 429514, "epoch": 5174} {"train_loss": -26.728626251220703, "global_step": 429515, "epoch": 5174} {"train_loss": -26.970367431640625, "global_step": 429516, "epoch": 5174} {"train_loss": -26.68259620666504, "global_step": 429517, "epoch": 5174} {"train_loss": -26.833059310913086, "global_step": 429518, "epoch": 5174} {"train_loss": -27.017370223999023, "global_step": 429519, "epoch": 5174} {"train_loss": -26.784393310546875, "global_step": 429520, "epoch": 5174} {"train_loss": -27.118900299072266, "global_step": 429521, "epoch": 5174} {"train_loss": -26.709548950195312, "global_step": 429522, "epoch": 5174} {"train_loss": -26.626638412475586, "global_step": 429523, "epoch": 5174} {"train_loss": -26.783770319927168, "global_step": 429524, "epoch": 5174, "val_loss": 6549552.5} {"train_loss": -25.434341430664062, "global_step": 429525, "epoch": 5175} {"train_loss": -25.714466094970703, "global_step": 429526, "epoch": 5175} {"train_loss": -26.402435302734375, "global_step": 429527, "epoch": 5175} {"train_loss": -25.91901969909668, "global_step": 429528, "epoch": 5175} {"train_loss": -25.46190643310547, "global_step": 429529, "epoch": 5175} {"train_loss": -26.32484245300293, "global_step": 429530, "epoch": 5175} {"train_loss": -25.775938034057617, "global_step": 429531, "epoch": 5175} {"train_loss": -26.4243106842041, "global_step": 429532, "epoch": 5175} {"train_loss": -25.93716812133789, "global_step": 429533, "epoch": 5175} {"train_loss": -26.0654354095459, "global_step": 429534, "epoch": 5175} {"train_loss": -26.4527645111084, "global_step": 429535, "epoch": 5175} {"train_loss": -25.89495849609375, "global_step": 429536, "epoch": 5175} {"train_loss": -25.950544357299805, "global_step": 429537, "epoch": 5175} {"train_loss": -26.257659912109375, "global_step": 429538, "epoch": 5175} {"train_loss": -26.33625602722168, "global_step": 429539, "epoch": 5175} {"train_loss": -26.643280029296875, "global_step": 429540, "epoch": 5175} {"train_loss": -26.376434326171875, "global_step": 429541, "epoch": 5175} {"train_loss": -26.299551010131836, "global_step": 429542, "epoch": 5175} {"train_loss": -26.349637985229492, "global_step": 429543, "epoch": 5175} {"train_loss": -26.57486343383789, "global_step": 429544, "epoch": 5175} {"train_loss": -26.61747169494629, "global_step": 429545, "epoch": 5175} {"train_loss": -26.717639923095703, "global_step": 429546, "epoch": 5175} {"train_loss": -26.594385147094727, "global_step": 429547, "epoch": 5175} {"train_loss": -26.502500534057617, "global_step": 429548, "epoch": 5175} {"train_loss": -26.687000274658203, "global_step": 429549, "epoch": 5175} {"train_loss": -26.950286865234375, "global_step": 429550, "epoch": 5175} {"train_loss": -26.74908447265625, "global_step": 429551, "epoch": 5175} {"train_loss": -26.903661727905273, "global_step": 429552, "epoch": 5175} {"train_loss": -26.898115158081055, "global_step": 429553, "epoch": 5175} {"train_loss": -26.866455078125, "global_step": 429554, "epoch": 5175} {"train_loss": -27.184614181518555, "global_step": 429555, "epoch": 5175} {"train_loss": -26.877918243408203, "global_step": 429556, "epoch": 5175} {"train_loss": -27.007614135742188, "global_step": 429557, "epoch": 5175} {"train_loss": -26.636615753173828, "global_step": 429558, "epoch": 5175} {"train_loss": -26.793333053588867, "global_step": 429559, "epoch": 5175} {"train_loss": -27.01812171936035, "global_step": 429560, "epoch": 5175} {"train_loss": -27.09002685546875, "global_step": 429561, "epoch": 5175} {"train_loss": -26.733469009399414, "global_step": 429562, "epoch": 5175} {"train_loss": -26.89802360534668, "global_step": 429563, "epoch": 5175} {"train_loss": -26.772144317626953, "global_step": 429564, "epoch": 5175} {"train_loss": -27.026350021362305, "global_step": 429565, "epoch": 5175} {"train_loss": -26.879133224487305, "global_step": 429566, "epoch": 5175} {"train_loss": -27.069482803344727, "global_step": 429567, "epoch": 5175} {"train_loss": -27.17868423461914, "global_step": 429568, "epoch": 5175} {"train_loss": -27.061511993408203, "global_step": 429569, "epoch": 5175} {"train_loss": -26.63405418395996, "global_step": 429570, "epoch": 5175} {"train_loss": -26.795063018798828, "global_step": 429571, "epoch": 5175} {"train_loss": -26.787076950073242, "global_step": 429572, "epoch": 5175} {"train_loss": -26.889251708984375, "global_step": 429573, "epoch": 5175} {"train_loss": -26.90113639831543, "global_step": 429574, "epoch": 5175} {"train_loss": -26.825712203979492, "global_step": 429575, "epoch": 5175} {"train_loss": -27.219587326049805, "global_step": 429576, "epoch": 5175} {"train_loss": -27.33544921875, "global_step": 429577, "epoch": 5175} {"train_loss": -26.888525009155273, "global_step": 429578, "epoch": 5175} {"train_loss": -26.93470573425293, "global_step": 429579, "epoch": 5175} {"train_loss": -27.01022720336914, "global_step": 429580, "epoch": 5175} {"train_loss": -27.067365646362305, "global_step": 429581, "epoch": 5175} {"train_loss": -27.29292106628418, "global_step": 429582, "epoch": 5175} {"train_loss": -26.716039657592773, "global_step": 429583, "epoch": 5175} {"train_loss": -26.911334991455078, "global_step": 429584, "epoch": 5175} {"train_loss": -26.87872886657715, "global_step": 429585, "epoch": 5175} {"train_loss": -26.47612953186035, "global_step": 429586, "epoch": 5175} {"train_loss": -27.368005752563477, "global_step": 429587, "epoch": 5175} {"train_loss": -26.93583106994629, "global_step": 429588, "epoch": 5175} {"train_loss": -26.987445831298828, "global_step": 429589, "epoch": 5175} {"train_loss": -27.00626564025879, "global_step": 429590, "epoch": 5175} {"train_loss": -26.710418701171875, "global_step": 429591, "epoch": 5175} {"train_loss": -26.51930046081543, "global_step": 429592, "epoch": 5175} {"train_loss": -26.95370864868164, "global_step": 429593, "epoch": 5175} {"train_loss": -26.74639320373535, "global_step": 429594, "epoch": 5175} {"train_loss": -27.186140060424805, "global_step": 429595, "epoch": 5175} {"train_loss": -26.884252548217773, "global_step": 429596, "epoch": 5175} {"train_loss": -26.906082153320312, "global_step": 429597, "epoch": 5175} {"train_loss": -26.926984786987305, "global_step": 429598, "epoch": 5175} {"train_loss": -27.442209243774414, "global_step": 429599, "epoch": 5175} {"train_loss": -27.123432159423828, "global_step": 429600, "epoch": 5175} {"train_loss": -26.981281280517578, "global_step": 429601, "epoch": 5175} {"train_loss": -26.88751220703125, "global_step": 429602, "epoch": 5175} {"train_loss": -26.85373306274414, "global_step": 429603, "epoch": 5175} {"train_loss": -27.10172462463379, "global_step": 429604, "epoch": 5175} {"train_loss": -26.871753692626953, "global_step": 429605, "epoch": 5175} {"train_loss": -26.839813232421875, "global_step": 429606, "epoch": 5175} {"train_loss": -26.71873320154397, "global_step": 429607, "epoch": 5175, "val_loss": 6595597.0} {"train_loss": -26.77297019958496, "global_step": 429608, "epoch": 5176} {"train_loss": -26.143970489501953, "global_step": 429609, "epoch": 5176} {"train_loss": -25.844343185424805, "global_step": 429610, "epoch": 5176} {"train_loss": -26.1480655670166, "global_step": 429611, "epoch": 5176} {"train_loss": -26.564544677734375, "global_step": 429612, "epoch": 5176} {"train_loss": -26.684865951538086, "global_step": 429613, "epoch": 5176} {"train_loss": -26.843168258666992, "global_step": 429614, "epoch": 5176} {"train_loss": -26.194000244140625, "global_step": 429615, "epoch": 5176} {"train_loss": -26.567655563354492, "global_step": 429616, "epoch": 5176} {"train_loss": -26.565174102783203, "global_step": 429617, "epoch": 5176} {"train_loss": -26.75898551940918, "global_step": 429618, "epoch": 5176} {"train_loss": -26.762598037719727, "global_step": 429619, "epoch": 5176} {"train_loss": -26.657669067382812, "global_step": 429620, "epoch": 5176} {"train_loss": -26.899911880493164, "global_step": 429621, "epoch": 5176} {"train_loss": -26.509435653686523, "global_step": 429622, "epoch": 5176} {"train_loss": -26.78668785095215, "global_step": 429623, "epoch": 5176} {"train_loss": -26.62957763671875, "global_step": 429624, "epoch": 5176} {"train_loss": -26.389127731323242, "global_step": 429625, "epoch": 5176} {"train_loss": -26.72023582458496, "global_step": 429626, "epoch": 5176} {"train_loss": -26.82588768005371, "global_step": 429627, "epoch": 5176} {"train_loss": -26.386432647705078, "global_step": 429628, "epoch": 5176} {"train_loss": -26.81638526916504, "global_step": 429629, "epoch": 5176} {"train_loss": -26.80535316467285, "global_step": 429630, "epoch": 5176} {"train_loss": -26.8278751373291, "global_step": 429631, "epoch": 5176} {"train_loss": -26.68561363220215, "global_step": 429632, "epoch": 5176} {"train_loss": -26.53226661682129, "global_step": 429633, "epoch": 5176} {"train_loss": -26.653217315673828, "global_step": 429634, "epoch": 5176} {"train_loss": -26.80157470703125, "global_step": 429635, "epoch": 5176} {"train_loss": -26.788415908813477, "global_step": 429636, "epoch": 5176} {"train_loss": -26.779010772705078, "global_step": 429637, "epoch": 5176} {"train_loss": -27.065221786499023, "global_step": 429638, "epoch": 5176} {"train_loss": -26.88429069519043, "global_step": 429639, "epoch": 5176} {"train_loss": -26.51691246032715, "global_step": 429640, "epoch": 5176} {"train_loss": -27.04766273498535, "global_step": 429641, "epoch": 5176} {"train_loss": -26.850248336791992, "global_step": 429642, "epoch": 5176} {"train_loss": -27.15122413635254, "global_step": 429643, "epoch": 5176} {"train_loss": -26.761219024658203, "global_step": 429644, "epoch": 5176} {"train_loss": -27.088306427001953, "global_step": 429645, "epoch": 5176} {"train_loss": -27.01384925842285, "global_step": 429646, "epoch": 5176} {"train_loss": -27.270709991455078, "global_step": 429647, "epoch": 5176} {"train_loss": -26.72157096862793, "global_step": 429648, "epoch": 5176} {"train_loss": -27.040380477905273, "global_step": 429649, "epoch": 5176} {"train_loss": -27.029956817626953, "global_step": 429650, "epoch": 5176} {"train_loss": -27.41961669921875, "global_step": 429651, "epoch": 5176} {"train_loss": -27.24769401550293, "global_step": 429652, "epoch": 5176} {"train_loss": -26.490163803100586, "global_step": 429653, "epoch": 5176} {"train_loss": -27.035236358642578, "global_step": 429654, "epoch": 5176} {"train_loss": -27.08306312561035, "global_step": 429655, "epoch": 5176} {"train_loss": -27.158666610717773, "global_step": 429656, "epoch": 5176} {"train_loss": -27.309194564819336, "global_step": 429657, "epoch": 5176} {"train_loss": -27.105756759643555, "global_step": 429658, "epoch": 5176} {"train_loss": -26.975128173828125, "global_step": 429659, "epoch": 5176} {"train_loss": -26.92915153503418, "global_step": 429660, "epoch": 5176} {"train_loss": -26.880645751953125, "global_step": 429661, "epoch": 5176} {"train_loss": -27.289663314819336, "global_step": 429662, "epoch": 5176} {"train_loss": -26.798309326171875, "global_step": 429663, "epoch": 5176} {"train_loss": -27.608976364135742, "global_step": 429664, "epoch": 5176} {"train_loss": -26.946630477905273, "global_step": 429665, "epoch": 5176} {"train_loss": -26.8048095703125, "global_step": 429666, "epoch": 5176} {"train_loss": -27.019514083862305, "global_step": 429667, "epoch": 5176} {"train_loss": -27.108795166015625, "global_step": 429668, "epoch": 5176} {"train_loss": -26.927448272705078, "global_step": 429669, "epoch": 5176} {"train_loss": -27.099889755249023, "global_step": 429670, "epoch": 5176} {"train_loss": -26.82636070251465, "global_step": 429671, "epoch": 5176} {"train_loss": -26.758813858032227, "global_step": 429672, "epoch": 5176} {"train_loss": -26.734289169311523, "global_step": 429673, "epoch": 5176} {"train_loss": -25.627182006835938, "global_step": 429674, "epoch": 5176} {"train_loss": -25.4473819732666, "global_step": 429675, "epoch": 5176} {"train_loss": -25.367177963256836, "global_step": 429676, "epoch": 5176} {"train_loss": -25.60723304748535, "global_step": 429677, "epoch": 5176} {"train_loss": -26.53264808654785, "global_step": 429678, "epoch": 5176} {"train_loss": -26.603057861328125, "global_step": 429679, "epoch": 5176} {"train_loss": -25.8724308013916, "global_step": 429680, "epoch": 5176} {"train_loss": -26.342802047729492, "global_step": 429681, "epoch": 5176} {"train_loss": -26.381155014038086, "global_step": 429682, "epoch": 5176} {"train_loss": -26.38001823425293, "global_step": 429683, "epoch": 5176} {"train_loss": -26.467248916625977, "global_step": 429684, "epoch": 5176} {"train_loss": -26.17764663696289, "global_step": 429685, "epoch": 5176} {"train_loss": -26.4781494140625, "global_step": 429686, "epoch": 5176} {"train_loss": -26.366235733032227, "global_step": 429687, "epoch": 5176} {"train_loss": -26.620193481445312, "global_step": 429688, "epoch": 5176} {"train_loss": -26.31800651550293, "global_step": 429689, "epoch": 5176} {"train_loss": -26.6731186372688, "global_step": 429690, "epoch": 5176, "val_loss": 6618143.0} {"train_loss": -24.5550537109375, "global_step": 429691, "epoch": 5177} {"train_loss": -25.55072593688965, "global_step": 429692, "epoch": 5177} {"train_loss": -25.759632110595703, "global_step": 429693, "epoch": 5177} {"train_loss": -25.118295669555664, "global_step": 429694, "epoch": 5177} {"train_loss": -26.355350494384766, "global_step": 429695, "epoch": 5177} {"train_loss": -25.81720542907715, "global_step": 429696, "epoch": 5177} {"train_loss": -26.027624130249023, "global_step": 429697, "epoch": 5177} {"train_loss": -26.198989868164062, "global_step": 429698, "epoch": 5177} {"train_loss": -26.6081485748291, "global_step": 429699, "epoch": 5177} {"train_loss": -26.275360107421875, "global_step": 429700, "epoch": 5177} {"train_loss": -26.371692657470703, "global_step": 429701, "epoch": 5177} {"train_loss": -26.128454208374023, "global_step": 429702, "epoch": 5177} {"train_loss": -26.253381729125977, "global_step": 429703, "epoch": 5177} {"train_loss": -26.12849235534668, "global_step": 429704, "epoch": 5177} {"train_loss": -26.339099884033203, "global_step": 429705, "epoch": 5177} {"train_loss": -26.305891036987305, "global_step": 429706, "epoch": 5177} {"train_loss": -26.38947105407715, "global_step": 429707, "epoch": 5177} {"train_loss": -26.341421127319336, "global_step": 429708, "epoch": 5177} {"train_loss": -26.396162033081055, "global_step": 429709, "epoch": 5177} {"train_loss": -26.856372833251953, "global_step": 429710, "epoch": 5177} {"train_loss": -26.52667808532715, "global_step": 429711, "epoch": 5177} {"train_loss": -26.826200485229492, "global_step": 429712, "epoch": 5177} {"train_loss": -26.607913970947266, "global_step": 429713, "epoch": 5177} {"train_loss": -26.365209579467773, "global_step": 429714, "epoch": 5177} {"train_loss": -26.601428985595703, "global_step": 429715, "epoch": 5177} {"train_loss": -26.647668838500977, "global_step": 429716, "epoch": 5177} {"train_loss": -26.6287841796875, "global_step": 429717, "epoch": 5177} {"train_loss": -26.66409683227539, "global_step": 429718, "epoch": 5177} {"train_loss": -26.7380313873291, "global_step": 429719, "epoch": 5177} {"train_loss": -26.5003604888916, "global_step": 429720, "epoch": 5177} {"train_loss": -26.54291343688965, "global_step": 429721, "epoch": 5177} {"train_loss": -26.692493438720703, "global_step": 429722, "epoch": 5177} {"train_loss": -26.651166915893555, "global_step": 429723, "epoch": 5177} {"train_loss": -26.941198348999023, "global_step": 429724, "epoch": 5177} {"train_loss": -26.418506622314453, "global_step": 429725, "epoch": 5177} {"train_loss": -26.832250595092773, "global_step": 429726, "epoch": 5177} {"train_loss": -26.4930477142334, "global_step": 429727, "epoch": 5177} {"train_loss": -27.011157989501953, "global_step": 429728, "epoch": 5177} {"train_loss": -26.944150924682617, "global_step": 429729, "epoch": 5177} {"train_loss": -26.9583797454834, "global_step": 429730, "epoch": 5177} {"train_loss": -26.976043701171875, "global_step": 429731, "epoch": 5177} {"train_loss": -26.789886474609375, "global_step": 429732, "epoch": 5177} {"train_loss": -26.811758041381836, "global_step": 429733, "epoch": 5177} {"train_loss": -27.01825523376465, "global_step": 429734, "epoch": 5177} {"train_loss": -27.383808135986328, "global_step": 429735, "epoch": 5177} {"train_loss": -27.244827270507812, "global_step": 429736, "epoch": 5177} {"train_loss": -26.727081298828125, "global_step": 429737, "epoch": 5177} {"train_loss": -26.93303871154785, "global_step": 429738, "epoch": 5177} {"train_loss": -26.87278175354004, "global_step": 429739, "epoch": 5177} {"train_loss": -26.78753089904785, "global_step": 429740, "epoch": 5177} {"train_loss": -26.877466201782227, "global_step": 429741, "epoch": 5177} {"train_loss": -27.562536239624023, "global_step": 429742, "epoch": 5177} {"train_loss": -27.062978744506836, "global_step": 429743, "epoch": 5177} {"train_loss": -27.016279220581055, "global_step": 429744, "epoch": 5177} {"train_loss": -27.077856063842773, "global_step": 429745, "epoch": 5177} {"train_loss": -26.960895538330078, "global_step": 429746, "epoch": 5177} {"train_loss": -27.02921485900879, "global_step": 429747, "epoch": 5177} {"train_loss": -27.178863525390625, "global_step": 429748, "epoch": 5177} {"train_loss": -26.778661727905273, "global_step": 429749, "epoch": 5177} {"train_loss": -27.087635040283203, "global_step": 429750, "epoch": 5177} {"train_loss": -26.99566650390625, "global_step": 429751, "epoch": 5177} {"train_loss": -26.320138931274414, "global_step": 429752, "epoch": 5177} {"train_loss": -27.128772735595703, "global_step": 429753, "epoch": 5177} {"train_loss": -26.7000675201416, "global_step": 429754, "epoch": 5177} {"train_loss": -26.765716552734375, "global_step": 429755, "epoch": 5177} {"train_loss": -26.87106704711914, "global_step": 429756, "epoch": 5177} {"train_loss": -27.089374542236328, "global_step": 429757, "epoch": 5177} {"train_loss": -27.141935348510742, "global_step": 429758, "epoch": 5177} {"train_loss": -26.819868087768555, "global_step": 429759, "epoch": 5177} {"train_loss": -26.747159957885742, "global_step": 429760, "epoch": 5177} {"train_loss": -26.489887237548828, "global_step": 429761, "epoch": 5177} {"train_loss": -26.6883544921875, "global_step": 429762, "epoch": 5177} {"train_loss": -26.471073150634766, "global_step": 429763, "epoch": 5177} {"train_loss": -26.291919708251953, "global_step": 429764, "epoch": 5177} {"train_loss": -26.9166316986084, "global_step": 429765, "epoch": 5177} {"train_loss": -26.964338302612305, "global_step": 429766, "epoch": 5177} {"train_loss": -26.763132095336914, "global_step": 429767, "epoch": 5177} {"train_loss": -26.930418014526367, "global_step": 429768, "epoch": 5177} {"train_loss": -26.700519561767578, "global_step": 429769, "epoch": 5177} {"train_loss": -27.08209228515625, "global_step": 429770, "epoch": 5177} {"train_loss": -26.660818099975586, "global_step": 429771, "epoch": 5177} {"train_loss": -27.19437026977539, "global_step": 429772, "epoch": 5177} {"train_loss": -26.659654226647802, "global_step": 429773, "epoch": 5177, "val_loss": 6633026.5} {"train_loss": -26.6170711517334, "global_step": 429774, "epoch": 5178} {"train_loss": -26.086416244506836, "global_step": 429775, "epoch": 5178} {"train_loss": -26.147796630859375, "global_step": 429776, "epoch": 5178} {"train_loss": -26.4284610748291, "global_step": 429777, "epoch": 5178} {"train_loss": -25.54694175720215, "global_step": 429778, "epoch": 5178} {"train_loss": -26.099445343017578, "global_step": 429779, "epoch": 5178} {"train_loss": -26.36391258239746, "global_step": 429780, "epoch": 5178} {"train_loss": -25.903186798095703, "global_step": 429781, "epoch": 5178} {"train_loss": -26.173023223876953, "global_step": 429782, "epoch": 5178} {"train_loss": -26.450611114501953, "global_step": 429783, "epoch": 5178} {"train_loss": -26.931507110595703, "global_step": 429784, "epoch": 5178} {"train_loss": -26.479339599609375, "global_step": 429785, "epoch": 5178} {"train_loss": -26.432775497436523, "global_step": 429786, "epoch": 5178} {"train_loss": -26.72071647644043, "global_step": 429787, "epoch": 5178} {"train_loss": -26.589216232299805, "global_step": 429788, "epoch": 5178} {"train_loss": -26.504901885986328, "global_step": 429789, "epoch": 5178} {"train_loss": -26.635461807250977, "global_step": 429790, "epoch": 5178} {"train_loss": -26.382543563842773, "global_step": 429791, "epoch": 5178} {"train_loss": -26.871723175048828, "global_step": 429792, "epoch": 5178} {"train_loss": -26.8856201171875, "global_step": 429793, "epoch": 5178} {"train_loss": -26.686019897460938, "global_step": 429794, "epoch": 5178} {"train_loss": -26.28476333618164, "global_step": 429795, "epoch": 5178} {"train_loss": -26.8928279876709, "global_step": 429796, "epoch": 5178} {"train_loss": -26.541501998901367, "global_step": 429797, "epoch": 5178} {"train_loss": -26.629541397094727, "global_step": 429798, "epoch": 5178} {"train_loss": -27.131473541259766, "global_step": 429799, "epoch": 5178} {"train_loss": -26.697010040283203, "global_step": 429800, "epoch": 5178} {"train_loss": -26.931394577026367, "global_step": 429801, "epoch": 5178} {"train_loss": -26.7930850982666, "global_step": 429802, "epoch": 5178} {"train_loss": -27.017980575561523, "global_step": 429803, "epoch": 5178} {"train_loss": -26.897876739501953, "global_step": 429804, "epoch": 5178} {"train_loss": -26.88606071472168, "global_step": 429805, "epoch": 5178} {"train_loss": -26.592559814453125, "global_step": 429806, "epoch": 5178} {"train_loss": -26.96875, "global_step": 429807, "epoch": 5178} {"train_loss": -27.08917236328125, "global_step": 429808, "epoch": 5178} {"train_loss": -26.739212036132812, "global_step": 429809, "epoch": 5178} {"train_loss": -26.827014923095703, "global_step": 429810, "epoch": 5178} {"train_loss": -26.96038818359375, "global_step": 429811, "epoch": 5178} {"train_loss": -26.998249053955078, "global_step": 429812, "epoch": 5178} {"train_loss": -26.73984718322754, "global_step": 429813, "epoch": 5178} {"train_loss": -26.825714111328125, "global_step": 429814, "epoch": 5178} {"train_loss": -26.69587516784668, "global_step": 429815, "epoch": 5178} {"train_loss": -26.795928955078125, "global_step": 429816, "epoch": 5178} {"train_loss": -27.171594619750977, "global_step": 429817, "epoch": 5178} {"train_loss": -27.08319664001465, "global_step": 429818, "epoch": 5178} {"train_loss": -26.904348373413086, "global_step": 429819, "epoch": 5178} {"train_loss": -27.111738204956055, "global_step": 429820, "epoch": 5178} {"train_loss": -27.160093307495117, "global_step": 429821, "epoch": 5178} {"train_loss": -26.777252197265625, "global_step": 429822, "epoch": 5178} {"train_loss": -26.363988876342773, "global_step": 429823, "epoch": 5178} {"train_loss": -26.59872817993164, "global_step": 429824, "epoch": 5178} {"train_loss": -27.01552391052246, "global_step": 429825, "epoch": 5178} {"train_loss": -26.699020385742188, "global_step": 429826, "epoch": 5178} {"train_loss": -26.9106388092041, "global_step": 429827, "epoch": 5178} {"train_loss": -27.277647018432617, "global_step": 429828, "epoch": 5178} {"train_loss": -26.606765747070312, "global_step": 429829, "epoch": 5178} {"train_loss": -26.930744171142578, "global_step": 429830, "epoch": 5178} {"train_loss": -26.71051025390625, "global_step": 429831, "epoch": 5178} {"train_loss": -27.223501205444336, "global_step": 429832, "epoch": 5178} {"train_loss": -26.88246726989746, "global_step": 429833, "epoch": 5178} {"train_loss": -26.77237319946289, "global_step": 429834, "epoch": 5178} {"train_loss": -27.05317497253418, "global_step": 429835, "epoch": 5178} {"train_loss": -26.650054931640625, "global_step": 429836, "epoch": 5178} {"train_loss": -27.131261825561523, "global_step": 429837, "epoch": 5178} {"train_loss": -27.217870712280273, "global_step": 429838, "epoch": 5178} {"train_loss": -26.92572021484375, "global_step": 429839, "epoch": 5178} {"train_loss": -26.8983211517334, "global_step": 429840, "epoch": 5178} {"train_loss": -27.04913902282715, "global_step": 429841, "epoch": 5178} {"train_loss": -27.04892921447754, "global_step": 429842, "epoch": 5178} {"train_loss": -26.82539176940918, "global_step": 429843, "epoch": 5178} {"train_loss": -26.86274528503418, "global_step": 429844, "epoch": 5178} {"train_loss": -27.084909439086914, "global_step": 429845, "epoch": 5178} {"train_loss": -27.043170928955078, "global_step": 429846, "epoch": 5178} {"train_loss": -27.007434844970703, "global_step": 429847, "epoch": 5178} {"train_loss": -26.510305404663086, "global_step": 429848, "epoch": 5178} {"train_loss": -27.437149047851562, "global_step": 429849, "epoch": 5178} {"train_loss": -27.167831420898438, "global_step": 429850, "epoch": 5178} {"train_loss": -27.028076171875, "global_step": 429851, "epoch": 5178} {"train_loss": -26.9215145111084, "global_step": 429852, "epoch": 5178} {"train_loss": -26.92988395690918, "global_step": 429853, "epoch": 5178} {"train_loss": -26.680011749267578, "global_step": 429854, "epoch": 5178} {"train_loss": -27.27688980102539, "global_step": 429855, "epoch": 5178} {"train_loss": -26.77315181134695, "global_step": 429856, "epoch": 5178, "val_loss": 6628116.0} {"train_loss": -26.2034912109375, "global_step": 429857, "epoch": 5179} {"train_loss": -26.330841064453125, "global_step": 429858, "epoch": 5179} {"train_loss": -26.48321533203125, "global_step": 429859, "epoch": 5179} {"train_loss": -26.830175399780273, "global_step": 429860, "epoch": 5179} {"train_loss": -26.071943283081055, "global_step": 429861, "epoch": 5179} {"train_loss": -26.284265518188477, "global_step": 429862, "epoch": 5179} {"train_loss": -26.563648223876953, "global_step": 429863, "epoch": 5179} {"train_loss": -25.795583724975586, "global_step": 429864, "epoch": 5179} {"train_loss": -26.14874839782715, "global_step": 429865, "epoch": 5179} {"train_loss": -26.49354362487793, "global_step": 429866, "epoch": 5179} {"train_loss": -26.01239013671875, "global_step": 429867, "epoch": 5179} {"train_loss": -26.4093017578125, "global_step": 429868, "epoch": 5179} {"train_loss": -26.527164459228516, "global_step": 429869, "epoch": 5179} {"train_loss": -26.207019805908203, "global_step": 429870, "epoch": 5179} {"train_loss": -27.109708786010742, "global_step": 429871, "epoch": 5179} {"train_loss": -26.871566772460938, "global_step": 429872, "epoch": 5179} {"train_loss": -27.001371383666992, "global_step": 429873, "epoch": 5179} {"train_loss": -26.563800811767578, "global_step": 429874, "epoch": 5179} {"train_loss": -26.93562889099121, "global_step": 429875, "epoch": 5179} {"train_loss": -26.801788330078125, "global_step": 429876, "epoch": 5179} {"train_loss": -26.862125396728516, "global_step": 429877, "epoch": 5179} {"train_loss": -26.934112548828125, "global_step": 429878, "epoch": 5179} {"train_loss": -27.016576766967773, "global_step": 429879, "epoch": 5179} {"train_loss": -26.755903244018555, "global_step": 429880, "epoch": 5179} {"train_loss": -26.8464412689209, "global_step": 429881, "epoch": 5179} {"train_loss": -26.69696044921875, "global_step": 429882, "epoch": 5179} {"train_loss": -26.973377227783203, "global_step": 429883, "epoch": 5179} {"train_loss": -26.54498291015625, "global_step": 429884, "epoch": 5179} {"train_loss": -27.0169620513916, "global_step": 429885, "epoch": 5179} {"train_loss": -26.68840980529785, "global_step": 429886, "epoch": 5179} {"train_loss": -27.04193687438965, "global_step": 429887, "epoch": 5179} {"train_loss": -26.866376876831055, "global_step": 429888, "epoch": 5179} {"train_loss": -26.859851837158203, "global_step": 429889, "epoch": 5179} {"train_loss": -26.6057186126709, "global_step": 429890, "epoch": 5179} {"train_loss": -27.17010498046875, "global_step": 429891, "epoch": 5179} {"train_loss": -27.02182388305664, "global_step": 429892, "epoch": 5179} {"train_loss": -26.910242080688477, "global_step": 429893, "epoch": 5179} {"train_loss": -26.9012451171875, "global_step": 429894, "epoch": 5179} {"train_loss": -26.915678024291992, "global_step": 429895, "epoch": 5179} {"train_loss": -27.22381591796875, "global_step": 429896, "epoch": 5179} {"train_loss": -27.020374298095703, "global_step": 429897, "epoch": 5179} {"train_loss": -26.794509887695312, "global_step": 429898, "epoch": 5179} {"train_loss": -27.082141876220703, "global_step": 429899, "epoch": 5179} {"train_loss": -27.10637855529785, "global_step": 429900, "epoch": 5179} {"train_loss": -26.98883628845215, "global_step": 429901, "epoch": 5179} {"train_loss": -27.1556396484375, "global_step": 429902, "epoch": 5179} {"train_loss": -26.950061798095703, "global_step": 429903, "epoch": 5179} {"train_loss": -26.881433486938477, "global_step": 429904, "epoch": 5179} {"train_loss": -27.493122100830078, "global_step": 429905, "epoch": 5179} {"train_loss": -26.98052978515625, "global_step": 429906, "epoch": 5179} {"train_loss": -26.74365234375, "global_step": 429907, "epoch": 5179} {"train_loss": -26.1922550201416, "global_step": 429908, "epoch": 5179} {"train_loss": -26.317068099975586, "global_step": 429909, "epoch": 5179} {"train_loss": -26.9539737701416, "global_step": 429910, "epoch": 5179} {"train_loss": -26.842071533203125, "global_step": 429911, "epoch": 5179} {"train_loss": -26.830402374267578, "global_step": 429912, "epoch": 5179} {"train_loss": -26.700109481811523, "global_step": 429913, "epoch": 5179} {"train_loss": -26.87801170349121, "global_step": 429914, "epoch": 5179} {"train_loss": -26.77166748046875, "global_step": 429915, "epoch": 5179} {"train_loss": -26.88178062438965, "global_step": 429916, "epoch": 5179} {"train_loss": -26.957935333251953, "global_step": 429917, "epoch": 5179} {"train_loss": -27.023590087890625, "global_step": 429918, "epoch": 5179} {"train_loss": -26.604063034057617, "global_step": 429919, "epoch": 5179} {"train_loss": -26.877700805664062, "global_step": 429920, "epoch": 5179} {"train_loss": -26.969945907592773, "global_step": 429921, "epoch": 5179} {"train_loss": -26.76155662536621, "global_step": 429922, "epoch": 5179} {"train_loss": -26.757221221923828, "global_step": 429923, "epoch": 5179} {"train_loss": -26.79599380493164, "global_step": 429924, "epoch": 5179} {"train_loss": -26.854877471923828, "global_step": 429925, "epoch": 5179} {"train_loss": -26.911230087280273, "global_step": 429926, "epoch": 5179} {"train_loss": -26.950571060180664, "global_step": 429927, "epoch": 5179} {"train_loss": -27.170822143554688, "global_step": 429928, "epoch": 5179} {"train_loss": -26.758207321166992, "global_step": 429929, "epoch": 5179} {"train_loss": -26.649744033813477, "global_step": 429930, "epoch": 5179} {"train_loss": -26.27109146118164, "global_step": 429931, "epoch": 5179} {"train_loss": -26.889789581298828, "global_step": 429932, "epoch": 5179} {"train_loss": -26.806015014648438, "global_step": 429933, "epoch": 5179} {"train_loss": -26.54994773864746, "global_step": 429934, "epoch": 5179} {"train_loss": -26.221389770507812, "global_step": 429935, "epoch": 5179} {"train_loss": -26.106515884399414, "global_step": 429936, "epoch": 5179} {"train_loss": -26.40681266784668, "global_step": 429937, "epoch": 5179} {"train_loss": -26.481420516967773, "global_step": 429938, "epoch": 5179} {"train_loss": -26.721007059855634, "global_step": 429939, "epoch": 5179, "val_loss": 6660588.0} {"train_loss": -26.30832862854004, "global_step": 429940, "epoch": 5180} {"train_loss": -26.5577449798584, "global_step": 429941, "epoch": 5180} {"train_loss": -26.7619571685791, "global_step": 429942, "epoch": 5180} {"train_loss": -26.358123779296875, "global_step": 429943, "epoch": 5180} {"train_loss": -26.145444869995117, "global_step": 429944, "epoch": 5180} {"train_loss": -26.228168487548828, "global_step": 429945, "epoch": 5180} {"train_loss": -26.590208053588867, "global_step": 429946, "epoch": 5180} {"train_loss": -26.439218521118164, "global_step": 429947, "epoch": 5180} {"train_loss": -26.833084106445312, "global_step": 429948, "epoch": 5180} {"train_loss": -26.15179443359375, "global_step": 429949, "epoch": 5180} {"train_loss": -26.87115478515625, "global_step": 429950, "epoch": 5180} {"train_loss": -26.391788482666016, "global_step": 429951, "epoch": 5180} {"train_loss": -26.793567657470703, "global_step": 429952, "epoch": 5180} {"train_loss": -26.526004791259766, "global_step": 429953, "epoch": 5180} {"train_loss": -26.828857421875, "global_step": 429954, "epoch": 5180} {"train_loss": -26.555164337158203, "global_step": 429955, "epoch": 5180} {"train_loss": -26.73468589782715, "global_step": 429956, "epoch": 5180} {"train_loss": -26.947866439819336, "global_step": 429957, "epoch": 5180} {"train_loss": -26.776905059814453, "global_step": 429958, "epoch": 5180} {"train_loss": -26.830768585205078, "global_step": 429959, "epoch": 5180} {"train_loss": -26.733051300048828, "global_step": 429960, "epoch": 5180} {"train_loss": -26.83597755432129, "global_step": 429961, "epoch": 5180} {"train_loss": -26.562421798706055, "global_step": 429962, "epoch": 5180} {"train_loss": -26.6861515045166, "global_step": 429963, "epoch": 5180} {"train_loss": -26.798254013061523, "global_step": 429964, "epoch": 5180} {"train_loss": -26.63494873046875, "global_step": 429965, "epoch": 5180} {"train_loss": -26.677282333374023, "global_step": 429966, "epoch": 5180} {"train_loss": -26.524066925048828, "global_step": 429967, "epoch": 5180} {"train_loss": -26.969573974609375, "global_step": 429968, "epoch": 5180} {"train_loss": -26.685455322265625, "global_step": 429969, "epoch": 5180} {"train_loss": -26.645572662353516, "global_step": 429970, "epoch": 5180} {"train_loss": -26.68402671813965, "global_step": 429971, "epoch": 5180} {"train_loss": -26.717798233032227, "global_step": 429972, "epoch": 5180} {"train_loss": -27.10841178894043, "global_step": 429973, "epoch": 5180} {"train_loss": -27.181182861328125, "global_step": 429974, "epoch": 5180} {"train_loss": -26.691791534423828, "global_step": 429975, "epoch": 5180} {"train_loss": -27.048124313354492, "global_step": 429976, "epoch": 5180} {"train_loss": -26.669097900390625, "global_step": 429977, "epoch": 5180} {"train_loss": -26.7278995513916, "global_step": 429978, "epoch": 5180} {"train_loss": -27.429346084594727, "global_step": 429979, "epoch": 5180} {"train_loss": -27.147205352783203, "global_step": 429980, "epoch": 5180} {"train_loss": -26.884601593017578, "global_step": 429981, "epoch": 5180} {"train_loss": -26.793622970581055, "global_step": 429982, "epoch": 5180} {"train_loss": -26.776611328125, "global_step": 429983, "epoch": 5180} {"train_loss": -26.90740966796875, "global_step": 429984, "epoch": 5180} {"train_loss": -27.05964469909668, "global_step": 429985, "epoch": 5180} {"train_loss": -26.627851486206055, "global_step": 429986, "epoch": 5180} {"train_loss": -26.850330352783203, "global_step": 429987, "epoch": 5180} {"train_loss": -27.194711685180664, "global_step": 429988, "epoch": 5180} {"train_loss": -26.9262752532959, "global_step": 429989, "epoch": 5180} {"train_loss": -27.23524284362793, "global_step": 429990, "epoch": 5180} {"train_loss": -27.3253116607666, "global_step": 429991, "epoch": 5180} {"train_loss": -27.3604793548584, "global_step": 429992, "epoch": 5180} {"train_loss": -26.756153106689453, "global_step": 429993, "epoch": 5180} {"train_loss": -27.0992488861084, "global_step": 429994, "epoch": 5180} {"train_loss": -27.219863891601562, "global_step": 429995, "epoch": 5180} {"train_loss": -26.9495792388916, "global_step": 429996, "epoch": 5180} {"train_loss": -27.260278701782227, "global_step": 429997, "epoch": 5180} {"train_loss": -26.852209091186523, "global_step": 429998, "epoch": 5180} {"train_loss": -27.384057998657227, "global_step": 429999, "epoch": 5180} {"train_loss": -27.127883911132812, "global_step": 430000, "epoch": 5180} {"train_loss": -26.512929916381836, "global_step": 430001, "epoch": 5180} {"train_loss": -26.248510360717773, "global_step": 430002, "epoch": 5180} {"train_loss": -25.756406784057617, "global_step": 430003, "epoch": 5180} {"train_loss": -26.507251739501953, "global_step": 430004, "epoch": 5180} {"train_loss": -26.74444007873535, "global_step": 430005, "epoch": 5180} {"train_loss": -26.38663673400879, "global_step": 430006, "epoch": 5180} {"train_loss": -26.2734317779541, "global_step": 430007, "epoch": 5180} {"train_loss": -26.77815055847168, "global_step": 430008, "epoch": 5180} {"train_loss": -26.461395263671875, "global_step": 430009, "epoch": 5180} {"train_loss": -25.9593505859375, "global_step": 430010, "epoch": 5180} {"train_loss": -26.572738647460938, "global_step": 430011, "epoch": 5180} {"train_loss": -26.154096603393555, "global_step": 430012, "epoch": 5180} {"train_loss": -26.441648483276367, "global_step": 430013, "epoch": 5180} {"train_loss": -27.40000343322754, "global_step": 430014, "epoch": 5180} {"train_loss": -26.547555923461914, "global_step": 430015, "epoch": 5180} {"train_loss": -26.36809730529785, "global_step": 430016, "epoch": 5180} {"train_loss": -26.94000244140625, "global_step": 430017, "epoch": 5180} {"train_loss": -26.953962326049805, "global_step": 430018, "epoch": 5180} {"train_loss": -26.56846046447754, "global_step": 430019, "epoch": 5180} {"train_loss": -26.563337326049805, "global_step": 430020, "epoch": 5180} {"train_loss": -26.483030319213867, "global_step": 430021, "epoch": 5180} {"train_loss": -26.728022954550134, "global_step": 430022, "epoch": 5180, "val_loss": 6702101.0} {"train_loss": -26.80655288696289, "global_step": 430023, "epoch": 5181} {"train_loss": -26.475194931030273, "global_step": 430024, "epoch": 5181} {"train_loss": -26.482593536376953, "global_step": 430025, "epoch": 5181} {"train_loss": -26.716718673706055, "global_step": 430026, "epoch": 5181} {"train_loss": -26.722238540649414, "global_step": 430027, "epoch": 5181} {"train_loss": -26.37068748474121, "global_step": 430028, "epoch": 5181} {"train_loss": -26.240346908569336, "global_step": 430029, "epoch": 5181} {"train_loss": -26.52548599243164, "global_step": 430030, "epoch": 5181} {"train_loss": -26.269174575805664, "global_step": 430031, "epoch": 5181} {"train_loss": -26.573217391967773, "global_step": 430032, "epoch": 5181} {"train_loss": -26.563379287719727, "global_step": 430033, "epoch": 5181} {"train_loss": -26.403669357299805, "global_step": 430034, "epoch": 5181} {"train_loss": -26.099348068237305, "global_step": 430035, "epoch": 5181} {"train_loss": -26.974828720092773, "global_step": 430036, "epoch": 5181} {"train_loss": -26.9853572845459, "global_step": 430037, "epoch": 5181} {"train_loss": -26.244373321533203, "global_step": 430038, "epoch": 5181} {"train_loss": -26.891523361206055, "global_step": 430039, "epoch": 5181} {"train_loss": -26.854108810424805, "global_step": 430040, "epoch": 5181} {"train_loss": -26.697830200195312, "global_step": 430041, "epoch": 5181} {"train_loss": -26.6795711517334, "global_step": 430042, "epoch": 5181} {"train_loss": -26.575178146362305, "global_step": 430043, "epoch": 5181} {"train_loss": -27.039432525634766, "global_step": 430044, "epoch": 5181} {"train_loss": -26.928258895874023, "global_step": 430045, "epoch": 5181} {"train_loss": -26.817922592163086, "global_step": 430046, "epoch": 5181} {"train_loss": -27.095809936523438, "global_step": 430047, "epoch": 5181} {"train_loss": -26.79703712463379, "global_step": 430048, "epoch": 5181} {"train_loss": -26.337411880493164, "global_step": 430049, "epoch": 5181} {"train_loss": -27.184900283813477, "global_step": 430050, "epoch": 5181} {"train_loss": -27.29520606994629, "global_step": 430051, "epoch": 5181} {"train_loss": -26.66326332092285, "global_step": 430052, "epoch": 5181} {"train_loss": -26.78779411315918, "global_step": 430053, "epoch": 5181} {"train_loss": -27.14645767211914, "global_step": 430054, "epoch": 5181} {"train_loss": -26.880691528320312, "global_step": 430055, "epoch": 5181} {"train_loss": -26.994586944580078, "global_step": 430056, "epoch": 5181} {"train_loss": -27.193984985351562, "global_step": 430057, "epoch": 5181} {"train_loss": -27.2864933013916, "global_step": 430058, "epoch": 5181} {"train_loss": -26.954877853393555, "global_step": 430059, "epoch": 5181} {"train_loss": -27.118310928344727, "global_step": 430060, "epoch": 5181} {"train_loss": -26.789709091186523, "global_step": 430061, "epoch": 5181} {"train_loss": -27.312856674194336, "global_step": 430062, "epoch": 5181} {"train_loss": -26.9525089263916, "global_step": 430063, "epoch": 5181} {"train_loss": -27.068546295166016, "global_step": 430064, "epoch": 5181} {"train_loss": -26.751251220703125, "global_step": 430065, "epoch": 5181} {"train_loss": -26.897626876831055, "global_step": 430066, "epoch": 5181} {"train_loss": -27.199127197265625, "global_step": 430067, "epoch": 5181} {"train_loss": -27.073461532592773, "global_step": 430068, "epoch": 5181} {"train_loss": -26.826562881469727, "global_step": 430069, "epoch": 5181} {"train_loss": -26.597949981689453, "global_step": 430070, "epoch": 5181} {"train_loss": -27.28179359436035, "global_step": 430071, "epoch": 5181} {"train_loss": -26.83363151550293, "global_step": 430072, "epoch": 5181} {"train_loss": -27.015859603881836, "global_step": 430073, "epoch": 5181} {"train_loss": -27.066572189331055, "global_step": 430074, "epoch": 5181} {"train_loss": -26.557905197143555, "global_step": 430075, "epoch": 5181} {"train_loss": -27.250452041625977, "global_step": 430076, "epoch": 5181} {"train_loss": -26.860578536987305, "global_step": 430077, "epoch": 5181} {"train_loss": -26.93975830078125, "global_step": 430078, "epoch": 5181} {"train_loss": -26.881244659423828, "global_step": 430079, "epoch": 5181} {"train_loss": -26.515090942382812, "global_step": 430080, "epoch": 5181} {"train_loss": -27.120670318603516, "global_step": 430081, "epoch": 5181} {"train_loss": -26.7705078125, "global_step": 430082, "epoch": 5181} {"train_loss": -26.989240646362305, "global_step": 430083, "epoch": 5181} {"train_loss": -26.66303825378418, "global_step": 430084, "epoch": 5181} {"train_loss": -26.606159210205078, "global_step": 430085, "epoch": 5181} {"train_loss": -26.937917709350586, "global_step": 430086, "epoch": 5181} {"train_loss": -26.823211669921875, "global_step": 430087, "epoch": 5181} {"train_loss": -26.966760635375977, "global_step": 430088, "epoch": 5181} {"train_loss": -26.842147827148438, "global_step": 430089, "epoch": 5181} {"train_loss": -26.441486358642578, "global_step": 430090, "epoch": 5181} {"train_loss": -26.1964168548584, "global_step": 430091, "epoch": 5181} {"train_loss": -25.182912826538086, "global_step": 430092, "epoch": 5181} {"train_loss": -25.088781356811523, "global_step": 430093, "epoch": 5181} {"train_loss": -26.419736862182617, "global_step": 430094, "epoch": 5181} {"train_loss": -25.58587646484375, "global_step": 430095, "epoch": 5181} {"train_loss": -25.89398193359375, "global_step": 430096, "epoch": 5181} {"train_loss": -25.882116317749023, "global_step": 430097, "epoch": 5181} {"train_loss": -25.422956466674805, "global_step": 430098, "epoch": 5181} {"train_loss": -25.817235946655273, "global_step": 430099, "epoch": 5181} {"train_loss": -26.051572799682617, "global_step": 430100, "epoch": 5181} {"train_loss": -26.003173828125, "global_step": 430101, "epoch": 5181} {"train_loss": -26.39240837097168, "global_step": 430102, "epoch": 5181} {"train_loss": -26.1812744140625, "global_step": 430103, "epoch": 5181} {"train_loss": -26.444446563720703, "global_step": 430104, "epoch": 5181} {"train_loss": -26.649392851864, "global_step": 430105, "epoch": 5181, "val_loss": 6685823.0} {"train_loss": -26.034229278564453, "global_step": 430106, "epoch": 5182} {"train_loss": -25.96234130859375, "global_step": 430107, "epoch": 5182} {"train_loss": -25.872058868408203, "global_step": 430108, "epoch": 5182} {"train_loss": -26.005512237548828, "global_step": 430109, "epoch": 5182} {"train_loss": -26.127775192260742, "global_step": 430110, "epoch": 5182} {"train_loss": -25.81464958190918, "global_step": 430111, "epoch": 5182} {"train_loss": -25.534940719604492, "global_step": 430112, "epoch": 5182} {"train_loss": -25.956867218017578, "global_step": 430113, "epoch": 5182} {"train_loss": -26.1312255859375, "global_step": 430114, "epoch": 5182} {"train_loss": -25.895841598510742, "global_step": 430115, "epoch": 5182} {"train_loss": -26.39911460876465, "global_step": 430116, "epoch": 5182} {"train_loss": -25.94062614440918, "global_step": 430117, "epoch": 5182} {"train_loss": -26.22342872619629, "global_step": 430118, "epoch": 5182} {"train_loss": -26.309606552124023, "global_step": 430119, "epoch": 5182} {"train_loss": -25.96820640563965, "global_step": 430120, "epoch": 5182} {"train_loss": -26.330747604370117, "global_step": 430121, "epoch": 5182} {"train_loss": -25.8807430267334, "global_step": 430122, "epoch": 5182} {"train_loss": -26.552648544311523, "global_step": 430123, "epoch": 5182} {"train_loss": -26.0710506439209, "global_step": 430124, "epoch": 5182} {"train_loss": -26.815275192260742, "global_step": 430125, "epoch": 5182} {"train_loss": -26.43219566345215, "global_step": 430126, "epoch": 5182} {"train_loss": -26.161569595336914, "global_step": 430127, "epoch": 5182} {"train_loss": -26.6177978515625, "global_step": 430128, "epoch": 5182} {"train_loss": -26.52461814880371, "global_step": 430129, "epoch": 5182} {"train_loss": -26.90924072265625, "global_step": 430130, "epoch": 5182} {"train_loss": -26.504608154296875, "global_step": 430131, "epoch": 5182} {"train_loss": -26.4720458984375, "global_step": 430132, "epoch": 5182} {"train_loss": -26.729568481445312, "global_step": 430133, "epoch": 5182} {"train_loss": -27.10015869140625, "global_step": 430134, "epoch": 5182} {"train_loss": -27.100910186767578, "global_step": 430135, "epoch": 5182} {"train_loss": -26.703327178955078, "global_step": 430136, "epoch": 5182} {"train_loss": -26.559844970703125, "global_step": 430137, "epoch": 5182} {"train_loss": -26.69287109375, "global_step": 430138, "epoch": 5182} {"train_loss": -27.20521354675293, "global_step": 430139, "epoch": 5182} {"train_loss": -26.892568588256836, "global_step": 430140, "epoch": 5182} {"train_loss": -26.618793487548828, "global_step": 430141, "epoch": 5182} {"train_loss": -27.042001724243164, "global_step": 430142, "epoch": 5182} {"train_loss": -27.250247955322266, "global_step": 430143, "epoch": 5182} {"train_loss": -26.85981559753418, "global_step": 430144, "epoch": 5182} {"train_loss": -27.129791259765625, "global_step": 430145, "epoch": 5182} {"train_loss": -27.396757125854492, "global_step": 430146, "epoch": 5182} {"train_loss": -27.337818145751953, "global_step": 430147, "epoch": 5182} {"train_loss": -27.032201766967773, "global_step": 430148, "epoch": 5182} {"train_loss": -27.066247940063477, "global_step": 430149, "epoch": 5182} {"train_loss": -26.881784439086914, "global_step": 430150, "epoch": 5182} {"train_loss": -26.763418197631836, "global_step": 430151, "epoch": 5182} {"train_loss": -27.193811416625977, "global_step": 430152, "epoch": 5182} {"train_loss": -26.6466121673584, "global_step": 430153, "epoch": 5182} {"train_loss": -27.004201889038086, "global_step": 430154, "epoch": 5182} {"train_loss": -26.80683708190918, "global_step": 430155, "epoch": 5182} {"train_loss": -27.467300415039062, "global_step": 430156, "epoch": 5182} {"train_loss": -26.923355102539062, "global_step": 430157, "epoch": 5182} {"train_loss": -27.199384689331055, "global_step": 430158, "epoch": 5182} {"train_loss": -27.0947208404541, "global_step": 430159, "epoch": 5182} {"train_loss": -27.194379806518555, "global_step": 430160, "epoch": 5182} {"train_loss": -27.096435546875, "global_step": 430161, "epoch": 5182} {"train_loss": -26.964773178100586, "global_step": 430162, "epoch": 5182} {"train_loss": -26.80435562133789, "global_step": 430163, "epoch": 5182} {"train_loss": -26.624677658081055, "global_step": 430164, "epoch": 5182} {"train_loss": -26.424890518188477, "global_step": 430165, "epoch": 5182} {"train_loss": -26.584537506103516, "global_step": 430166, "epoch": 5182} {"train_loss": -26.86725425720215, "global_step": 430167, "epoch": 5182} {"train_loss": -26.96454429626465, "global_step": 430168, "epoch": 5182} {"train_loss": -26.97674560546875, "global_step": 430169, "epoch": 5182} {"train_loss": -26.732715606689453, "global_step": 430170, "epoch": 5182} {"train_loss": -26.69986915588379, "global_step": 430171, "epoch": 5182} {"train_loss": -26.826398849487305, "global_step": 430172, "epoch": 5182} {"train_loss": -26.867212295532227, "global_step": 430173, "epoch": 5182} {"train_loss": -26.898359298706055, "global_step": 430174, "epoch": 5182} {"train_loss": -27.07210350036621, "global_step": 430175, "epoch": 5182} {"train_loss": -26.608312606811523, "global_step": 430176, "epoch": 5182} {"train_loss": -27.104049682617188, "global_step": 430177, "epoch": 5182} {"train_loss": -26.7800235748291, "global_step": 430178, "epoch": 5182} {"train_loss": -26.628955841064453, "global_step": 430179, "epoch": 5182} {"train_loss": -26.7937068939209, "global_step": 430180, "epoch": 5182} {"train_loss": -26.430505752563477, "global_step": 430181, "epoch": 5182} {"train_loss": -27.28852653503418, "global_step": 430182, "epoch": 5182} {"train_loss": -27.003498077392578, "global_step": 430183, "epoch": 5182} {"train_loss": -26.772546768188477, "global_step": 430184, "epoch": 5182} {"train_loss": -26.889917373657227, "global_step": 430185, "epoch": 5182} {"train_loss": -26.759061813354492, "global_step": 430186, "epoch": 5182} {"train_loss": -26.373193740844727, "global_step": 430187, "epoch": 5182} {"train_loss": -26.670208069215338, "global_step": 430188, "epoch": 5182, "val_loss": 6682217.5} {"train_loss": -26.562803268432617, "global_step": 430189, "epoch": 5183} {"train_loss": -26.245161056518555, "global_step": 430190, "epoch": 5183} {"train_loss": -26.9460506439209, "global_step": 430191, "epoch": 5183} {"train_loss": -26.735376358032227, "global_step": 430192, "epoch": 5183} {"train_loss": -27.025827407836914, "global_step": 430193, "epoch": 5183} {"train_loss": -26.515146255493164, "global_step": 430194, "epoch": 5183} {"train_loss": -26.571516036987305, "global_step": 430195, "epoch": 5183} {"train_loss": -26.6254825592041, "global_step": 430196, "epoch": 5183} {"train_loss": -26.6324520111084, "global_step": 430197, "epoch": 5183} {"train_loss": -26.375965118408203, "global_step": 430198, "epoch": 5183} {"train_loss": -26.421283721923828, "global_step": 430199, "epoch": 5183} {"train_loss": -26.5306396484375, "global_step": 430200, "epoch": 5183} {"train_loss": -26.970361709594727, "global_step": 430201, "epoch": 5183} {"train_loss": -26.330509185791016, "global_step": 430202, "epoch": 5183} {"train_loss": -26.740713119506836, "global_step": 430203, "epoch": 5183} {"train_loss": -26.88559913635254, "global_step": 430204, "epoch": 5183} {"train_loss": -26.58258056640625, "global_step": 430205, "epoch": 5183} {"train_loss": -26.787967681884766, "global_step": 430206, "epoch": 5183} {"train_loss": -26.985004425048828, "global_step": 430207, "epoch": 5183} {"train_loss": -26.627248764038086, "global_step": 430208, "epoch": 5183} {"train_loss": -27.03362464904785, "global_step": 430209, "epoch": 5183} {"train_loss": -26.59145164489746, "global_step": 430210, "epoch": 5183} {"train_loss": -27.110645294189453, "global_step": 430211, "epoch": 5183} {"train_loss": -27.210205078125, "global_step": 430212, "epoch": 5183} {"train_loss": -27.092273712158203, "global_step": 430213, "epoch": 5183} {"train_loss": -26.98518180847168, "global_step": 430214, "epoch": 5183} {"train_loss": -26.723743438720703, "global_step": 430215, "epoch": 5183} {"train_loss": -26.83717155456543, "global_step": 430216, "epoch": 5183} {"train_loss": -26.5513858795166, "global_step": 430217, "epoch": 5183} {"train_loss": -26.978910446166992, "global_step": 430218, "epoch": 5183} {"train_loss": -26.788476943969727, "global_step": 430219, "epoch": 5183} {"train_loss": -27.027536392211914, "global_step": 430220, "epoch": 5183} {"train_loss": -26.878936767578125, "global_step": 430221, "epoch": 5183} {"train_loss": -27.062427520751953, "global_step": 430222, "epoch": 5183} {"train_loss": -27.156158447265625, "global_step": 430223, "epoch": 5183} {"train_loss": -27.24460220336914, "global_step": 430224, "epoch": 5183} {"train_loss": -27.064477920532227, "global_step": 430225, "epoch": 5183} {"train_loss": -27.2723331451416, "global_step": 430226, "epoch": 5183} {"train_loss": -27.165136337280273, "global_step": 430227, "epoch": 5183} {"train_loss": -27.05484390258789, "global_step": 430228, "epoch": 5183} {"train_loss": -27.2011661529541, "global_step": 430229, "epoch": 5183} {"train_loss": -27.14715003967285, "global_step": 430230, "epoch": 5183} {"train_loss": -27.278268814086914, "global_step": 430231, "epoch": 5183} {"train_loss": -26.68342399597168, "global_step": 430232, "epoch": 5183} {"train_loss": -26.952478408813477, "global_step": 430233, "epoch": 5183} {"train_loss": -26.773096084594727, "global_step": 430234, "epoch": 5183} {"train_loss": -27.039281845092773, "global_step": 430235, "epoch": 5183} {"train_loss": -27.075119018554688, "global_step": 430236, "epoch": 5183} {"train_loss": -26.96650505065918, "global_step": 430237, "epoch": 5183} {"train_loss": -26.635974884033203, "global_step": 430238, "epoch": 5183} {"train_loss": -27.040685653686523, "global_step": 430239, "epoch": 5183} {"train_loss": -26.971881866455078, "global_step": 430240, "epoch": 5183} {"train_loss": -26.737165451049805, "global_step": 430241, "epoch": 5183} {"train_loss": -27.05337905883789, "global_step": 430242, "epoch": 5183} {"train_loss": -26.943359375, "global_step": 430243, "epoch": 5183} {"train_loss": -27.2523193359375, "global_step": 430244, "epoch": 5183} {"train_loss": -26.799955368041992, "global_step": 430245, "epoch": 5183} {"train_loss": -26.643903732299805, "global_step": 430246, "epoch": 5183} {"train_loss": -26.860868453979492, "global_step": 430247, "epoch": 5183} {"train_loss": -26.41144371032715, "global_step": 430248, "epoch": 5183} {"train_loss": -26.555072784423828, "global_step": 430249, "epoch": 5183} {"train_loss": -26.30292320251465, "global_step": 430250, "epoch": 5183} {"train_loss": -26.486108779907227, "global_step": 430251, "epoch": 5183} {"train_loss": -26.688207626342773, "global_step": 430252, "epoch": 5183} {"train_loss": -26.5051326751709, "global_step": 430253, "epoch": 5183} {"train_loss": -27.090600967407227, "global_step": 430254, "epoch": 5183} {"train_loss": -26.533477783203125, "global_step": 430255, "epoch": 5183} {"train_loss": -26.658191680908203, "global_step": 430256, "epoch": 5183} {"train_loss": -27.017053604125977, "global_step": 430257, "epoch": 5183} {"train_loss": -26.412860870361328, "global_step": 430258, "epoch": 5183} {"train_loss": -26.618457794189453, "global_step": 430259, "epoch": 5183} {"train_loss": -26.768651962280273, "global_step": 430260, "epoch": 5183} {"train_loss": -26.793094635009766, "global_step": 430261, "epoch": 5183} {"train_loss": -26.691442489624023, "global_step": 430262, "epoch": 5183} {"train_loss": -27.00628089904785, "global_step": 430263, "epoch": 5183} {"train_loss": -27.046125411987305, "global_step": 430264, "epoch": 5183} {"train_loss": -26.7137451171875, "global_step": 430265, "epoch": 5183} {"train_loss": -26.536457061767578, "global_step": 430266, "epoch": 5183} {"train_loss": -26.673437118530273, "global_step": 430267, "epoch": 5183} {"train_loss": -26.888355255126953, "global_step": 430268, "epoch": 5183} {"train_loss": -27.08095359802246, "global_step": 430269, "epoch": 5183} {"train_loss": -26.421884536743164, "global_step": 430270, "epoch": 5183} {"train_loss": -26.817675165383214, "global_step": 430271, "epoch": 5183, "val_loss": 6699032.0} {"train_loss": -25.9597110748291, "global_step": 430272, "epoch": 5184} {"train_loss": -26.064804077148438, "global_step": 430273, "epoch": 5184} {"train_loss": -26.12665367126465, "global_step": 430274, "epoch": 5184} {"train_loss": -25.940982818603516, "global_step": 430275, "epoch": 5184} {"train_loss": -26.58368492126465, "global_step": 430276, "epoch": 5184} {"train_loss": -26.178998947143555, "global_step": 430277, "epoch": 5184} {"train_loss": -26.50014305114746, "global_step": 430278, "epoch": 5184} {"train_loss": -25.977487564086914, "global_step": 430279, "epoch": 5184} {"train_loss": -26.174158096313477, "global_step": 430280, "epoch": 5184} {"train_loss": -26.458606719970703, "global_step": 430281, "epoch": 5184} {"train_loss": -26.77726173400879, "global_step": 430282, "epoch": 5184} {"train_loss": -26.5910587310791, "global_step": 430283, "epoch": 5184} {"train_loss": -26.503732681274414, "global_step": 430284, "epoch": 5184} {"train_loss": -26.37628173828125, "global_step": 430285, "epoch": 5184} {"train_loss": -26.467748641967773, "global_step": 430286, "epoch": 5184} {"train_loss": -26.7947998046875, "global_step": 430287, "epoch": 5184} {"train_loss": -26.44843864440918, "global_step": 430288, "epoch": 5184} {"train_loss": -26.936872482299805, "global_step": 430289, "epoch": 5184} {"train_loss": -26.5721492767334, "global_step": 430290, "epoch": 5184} {"train_loss": -26.899490356445312, "global_step": 430291, "epoch": 5184} {"train_loss": -26.916397094726562, "global_step": 430292, "epoch": 5184} {"train_loss": -27.109485626220703, "global_step": 430293, "epoch": 5184} {"train_loss": -26.624433517456055, "global_step": 430294, "epoch": 5184} {"train_loss": -26.5585880279541, "global_step": 430295, "epoch": 5184} {"train_loss": -26.9420166015625, "global_step": 430296, "epoch": 5184} {"train_loss": -26.761245727539062, "global_step": 430297, "epoch": 5184} {"train_loss": -26.899988174438477, "global_step": 430298, "epoch": 5184} {"train_loss": -26.84819984436035, "global_step": 430299, "epoch": 5184} {"train_loss": -26.8731746673584, "global_step": 430300, "epoch": 5184} {"train_loss": -26.709802627563477, "global_step": 430301, "epoch": 5184} {"train_loss": -26.549406051635742, "global_step": 430302, "epoch": 5184} {"train_loss": -26.893268585205078, "global_step": 430303, "epoch": 5184} {"train_loss": -27.043283462524414, "global_step": 430304, "epoch": 5184} {"train_loss": -27.24588394165039, "global_step": 430305, "epoch": 5184} {"train_loss": -26.76434326171875, "global_step": 430306, "epoch": 5184} {"train_loss": -26.789270401000977, "global_step": 430307, "epoch": 5184} {"train_loss": -27.151880264282227, "global_step": 430308, "epoch": 5184} {"train_loss": -27.055118560791016, "global_step": 430309, "epoch": 5184} {"train_loss": -27.039648056030273, "global_step": 430310, "epoch": 5184} {"train_loss": -26.9457950592041, "global_step": 430311, "epoch": 5184} {"train_loss": -27.336557388305664, "global_step": 430312, "epoch": 5184} {"train_loss": -27.06441307067871, "global_step": 430313, "epoch": 5184} {"train_loss": -26.944721221923828, "global_step": 430314, "epoch": 5184} {"train_loss": -26.779935836791992, "global_step": 430315, "epoch": 5184} {"train_loss": -27.05356216430664, "global_step": 430316, "epoch": 5184} {"train_loss": -27.22117042541504, "global_step": 430317, "epoch": 5184} {"train_loss": -26.519086837768555, "global_step": 430318, "epoch": 5184} {"train_loss": -26.926008224487305, "global_step": 430319, "epoch": 5184} {"train_loss": -27.32594108581543, "global_step": 430320, "epoch": 5184} {"train_loss": -27.16632652282715, "global_step": 430321, "epoch": 5184} {"train_loss": -26.785375595092773, "global_step": 430322, "epoch": 5184} {"train_loss": -26.83953285217285, "global_step": 430323, "epoch": 5184} {"train_loss": -27.22715187072754, "global_step": 430324, "epoch": 5184} {"train_loss": -27.087080001831055, "global_step": 430325, "epoch": 5184} {"train_loss": -26.82651710510254, "global_step": 430326, "epoch": 5184} {"train_loss": -27.36688804626465, "global_step": 430327, "epoch": 5184} {"train_loss": -26.960538864135742, "global_step": 430328, "epoch": 5184} {"train_loss": -26.753402709960938, "global_step": 430329, "epoch": 5184} {"train_loss": -26.820255279541016, "global_step": 430330, "epoch": 5184} {"train_loss": -26.832284927368164, "global_step": 430331, "epoch": 5184} {"train_loss": -26.469348907470703, "global_step": 430332, "epoch": 5184} {"train_loss": -26.561111450195312, "global_step": 430333, "epoch": 5184} {"train_loss": -26.722196578979492, "global_step": 430334, "epoch": 5184} {"train_loss": -27.06805419921875, "global_step": 430335, "epoch": 5184} {"train_loss": -26.647348403930664, "global_step": 430336, "epoch": 5184} {"train_loss": -27.046178817749023, "global_step": 430337, "epoch": 5184} {"train_loss": -27.34397315979004, "global_step": 430338, "epoch": 5184} {"train_loss": -27.0189208984375, "global_step": 430339, "epoch": 5184} {"train_loss": -26.961088180541992, "global_step": 430340, "epoch": 5184} {"train_loss": -26.850677490234375, "global_step": 430341, "epoch": 5184} {"train_loss": -26.974075317382812, "global_step": 430342, "epoch": 5184} {"train_loss": -26.629133224487305, "global_step": 430343, "epoch": 5184} {"train_loss": -27.050479888916016, "global_step": 430344, "epoch": 5184} {"train_loss": -26.88035011291504, "global_step": 430345, "epoch": 5184} {"train_loss": -26.872756958007812, "global_step": 430346, "epoch": 5184} {"train_loss": -27.102338790893555, "global_step": 430347, "epoch": 5184} {"train_loss": -27.022932052612305, "global_step": 430348, "epoch": 5184} {"train_loss": -26.828235626220703, "global_step": 430349, "epoch": 5184} {"train_loss": -26.199735641479492, "global_step": 430350, "epoch": 5184} {"train_loss": -26.06583595275879, "global_step": 430351, "epoch": 5184} {"train_loss": -26.43710708618164, "global_step": 430352, "epoch": 5184} {"train_loss": -27.28275489807129, "global_step": 430353, "epoch": 5184} {"train_loss": -26.775265475353564, "global_step": 430354, "epoch": 5184, "val_loss": 6634614.5} {"train_loss": -25.341768264770508, "global_step": 430355, "epoch": 5185} {"train_loss": -25.328174591064453, "global_step": 430356, "epoch": 5185} {"train_loss": -26.13226318359375, "global_step": 430357, "epoch": 5185} {"train_loss": -25.13564109802246, "global_step": 430358, "epoch": 5185} {"train_loss": -25.175155639648438, "global_step": 430359, "epoch": 5185} {"train_loss": -26.18999671936035, "global_step": 430360, "epoch": 5185} {"train_loss": -25.772302627563477, "global_step": 430361, "epoch": 5185} {"train_loss": -26.198816299438477, "global_step": 430362, "epoch": 5185} {"train_loss": -25.894947052001953, "global_step": 430363, "epoch": 5185} {"train_loss": -25.728240966796875, "global_step": 430364, "epoch": 5185} {"train_loss": -26.220205307006836, "global_step": 430365, "epoch": 5185} {"train_loss": -25.803110122680664, "global_step": 430366, "epoch": 5185} {"train_loss": -26.106739044189453, "global_step": 430367, "epoch": 5185} {"train_loss": -25.890676498413086, "global_step": 430368, "epoch": 5185} {"train_loss": -26.388341903686523, "global_step": 430369, "epoch": 5185} {"train_loss": -26.405841827392578, "global_step": 430370, "epoch": 5185} {"train_loss": -26.569623947143555, "global_step": 430371, "epoch": 5185} {"train_loss": -26.15765953063965, "global_step": 430372, "epoch": 5185} {"train_loss": -26.442243576049805, "global_step": 430373, "epoch": 5185} {"train_loss": -26.468921661376953, "global_step": 430374, "epoch": 5185} {"train_loss": -26.88446617126465, "global_step": 430375, "epoch": 5185} {"train_loss": -26.316686630249023, "global_step": 430376, "epoch": 5185} {"train_loss": -26.223556518554688, "global_step": 430377, "epoch": 5185} {"train_loss": -26.687274932861328, "global_step": 430378, "epoch": 5185} {"train_loss": -26.488300323486328, "global_step": 430379, "epoch": 5185} {"train_loss": -26.5784854888916, "global_step": 430380, "epoch": 5185} {"train_loss": -26.537336349487305, "global_step": 430381, "epoch": 5185} {"train_loss": -26.6726131439209, "global_step": 430382, "epoch": 5185} {"train_loss": -26.698522567749023, "global_step": 430383, "epoch": 5185} {"train_loss": -26.617053985595703, "global_step": 430384, "epoch": 5185} {"train_loss": -26.61956787109375, "global_step": 430385, "epoch": 5185} {"train_loss": -26.72877311706543, "global_step": 430386, "epoch": 5185} {"train_loss": -26.73042106628418, "global_step": 430387, "epoch": 5185} {"train_loss": -26.78377342224121, "global_step": 430388, "epoch": 5185} {"train_loss": -26.588916778564453, "global_step": 430389, "epoch": 5185} {"train_loss": -26.87396240234375, "global_step": 430390, "epoch": 5185} {"train_loss": -26.89542579650879, "global_step": 430391, "epoch": 5185} {"train_loss": -26.849090576171875, "global_step": 430392, "epoch": 5185} {"train_loss": -26.997806549072266, "global_step": 430393, "epoch": 5185} {"train_loss": -26.677602767944336, "global_step": 430394, "epoch": 5185} {"train_loss": -26.808950424194336, "global_step": 430395, "epoch": 5185} {"train_loss": -27.1087646484375, "global_step": 430396, "epoch": 5185} {"train_loss": -26.5470027923584, "global_step": 430397, "epoch": 5185} {"train_loss": -26.683317184448242, "global_step": 430398, "epoch": 5185} {"train_loss": -26.47230339050293, "global_step": 430399, "epoch": 5185} {"train_loss": -26.772491455078125, "global_step": 430400, "epoch": 5185} {"train_loss": -27.167011260986328, "global_step": 430401, "epoch": 5185} {"train_loss": -27.272851943969727, "global_step": 430402, "epoch": 5185} {"train_loss": -26.80120277404785, "global_step": 430403, "epoch": 5185} {"train_loss": -26.80759620666504, "global_step": 430404, "epoch": 5185} {"train_loss": -26.758926391601562, "global_step": 430405, "epoch": 5185} {"train_loss": -26.467529296875, "global_step": 430406, "epoch": 5185} {"train_loss": -27.051227569580078, "global_step": 430407, "epoch": 5185} {"train_loss": -26.551803588867188, "global_step": 430408, "epoch": 5185} {"train_loss": -26.686307907104492, "global_step": 430409, "epoch": 5185} {"train_loss": -26.564594268798828, "global_step": 430410, "epoch": 5185} {"train_loss": -26.639850616455078, "global_step": 430411, "epoch": 5185} {"train_loss": -26.657825469970703, "global_step": 430412, "epoch": 5185} {"train_loss": -26.7313289642334, "global_step": 430413, "epoch": 5185} {"train_loss": -27.134296417236328, "global_step": 430414, "epoch": 5185} {"train_loss": -26.6394100189209, "global_step": 430415, "epoch": 5185} {"train_loss": -27.00629997253418, "global_step": 430416, "epoch": 5185} {"train_loss": -26.953571319580078, "global_step": 430417, "epoch": 5185} {"train_loss": -26.843505859375, "global_step": 430418, "epoch": 5185} {"train_loss": -26.8480224609375, "global_step": 430419, "epoch": 5185} {"train_loss": -27.039234161376953, "global_step": 430420, "epoch": 5185} {"train_loss": -26.931365966796875, "global_step": 430421, "epoch": 5185} {"train_loss": -27.21107292175293, "global_step": 430422, "epoch": 5185} {"train_loss": -26.798444747924805, "global_step": 430423, "epoch": 5185} {"train_loss": -26.677032470703125, "global_step": 430424, "epoch": 5185} {"train_loss": -26.736408233642578, "global_step": 430425, "epoch": 5185} {"train_loss": -26.98090934753418, "global_step": 430426, "epoch": 5185} {"train_loss": -26.65851402282715, "global_step": 430427, "epoch": 5185} {"train_loss": -26.731348037719727, "global_step": 430428, "epoch": 5185} {"train_loss": -26.9086856842041, "global_step": 430429, "epoch": 5185} {"train_loss": -26.70572853088379, "global_step": 430430, "epoch": 5185} {"train_loss": -26.990392684936523, "global_step": 430431, "epoch": 5185} {"train_loss": -26.56453514099121, "global_step": 430432, "epoch": 5185} {"train_loss": -26.728342056274414, "global_step": 430433, "epoch": 5185} {"train_loss": -27.036596298217773, "global_step": 430434, "epoch": 5185} {"train_loss": -27.190149307250977, "global_step": 430435, "epoch": 5185} {"train_loss": -26.990636825561523, "global_step": 430436, "epoch": 5185} {"train_loss": -26.572644245193665, "global_step": 430437, "epoch": 5185, "val_loss": 6657536.0} {"train_loss": -27.369800567626953, "global_step": 430438, "epoch": 5186} {"train_loss": -26.80657386779785, "global_step": 430439, "epoch": 5186} {"train_loss": -26.63519287109375, "global_step": 430440, "epoch": 5186} {"train_loss": -26.76767921447754, "global_step": 430441, "epoch": 5186} {"train_loss": -26.569625854492188, "global_step": 430442, "epoch": 5186} {"train_loss": -26.731184005737305, "global_step": 430443, "epoch": 5186} {"train_loss": -26.602890014648438, "global_step": 430444, "epoch": 5186} {"train_loss": -26.919416427612305, "global_step": 430445, "epoch": 5186} {"train_loss": -26.755325317382812, "global_step": 430446, "epoch": 5186} {"train_loss": -26.741907119750977, "global_step": 430447, "epoch": 5186} {"train_loss": -26.923307418823242, "global_step": 430448, "epoch": 5186} {"train_loss": -26.913055419921875, "global_step": 430449, "epoch": 5186} {"train_loss": -26.42592430114746, "global_step": 430450, "epoch": 5186} {"train_loss": -26.38123893737793, "global_step": 430451, "epoch": 5186} {"train_loss": -26.77166175842285, "global_step": 430452, "epoch": 5186} {"train_loss": -26.986963272094727, "global_step": 430453, "epoch": 5186} {"train_loss": -26.866031646728516, "global_step": 430454, "epoch": 5186} {"train_loss": -26.552778244018555, "global_step": 430455, "epoch": 5186} {"train_loss": -26.692615509033203, "global_step": 430456, "epoch": 5186} {"train_loss": -26.8780517578125, "global_step": 430457, "epoch": 5186} {"train_loss": -26.816755294799805, "global_step": 430458, "epoch": 5186} {"train_loss": -26.619678497314453, "global_step": 430459, "epoch": 5186} {"train_loss": -26.90805435180664, "global_step": 430460, "epoch": 5186} {"train_loss": -26.642927169799805, "global_step": 430461, "epoch": 5186} {"train_loss": -27.032217025756836, "global_step": 430462, "epoch": 5186} {"train_loss": -26.80560302734375, "global_step": 430463, "epoch": 5186} {"train_loss": -27.002424240112305, "global_step": 430464, "epoch": 5186} {"train_loss": -26.876087188720703, "global_step": 430465, "epoch": 5186} {"train_loss": -26.834888458251953, "global_step": 430466, "epoch": 5186} {"train_loss": -27.136722564697266, "global_step": 430467, "epoch": 5186} {"train_loss": -26.647281646728516, "global_step": 430468, "epoch": 5186} {"train_loss": -26.893085479736328, "global_step": 430469, "epoch": 5186} {"train_loss": -27.065052032470703, "global_step": 430470, "epoch": 5186} {"train_loss": -26.83989906311035, "global_step": 430471, "epoch": 5186} {"train_loss": -26.705320358276367, "global_step": 430472, "epoch": 5186} {"train_loss": -26.50732421875, "global_step": 430473, "epoch": 5186} {"train_loss": -26.416351318359375, "global_step": 430474, "epoch": 5186} {"train_loss": -26.467971801757812, "global_step": 430475, "epoch": 5186} {"train_loss": -26.62442398071289, "global_step": 430476, "epoch": 5186} {"train_loss": -27.004201889038086, "global_step": 430477, "epoch": 5186} {"train_loss": -27.12652587890625, "global_step": 430478, "epoch": 5186} {"train_loss": -26.890283584594727, "global_step": 430479, "epoch": 5186} {"train_loss": -26.767805099487305, "global_step": 430480, "epoch": 5186} {"train_loss": -26.99847984313965, "global_step": 430481, "epoch": 5186} {"train_loss": -26.830617904663086, "global_step": 430482, "epoch": 5186} {"train_loss": -26.937259674072266, "global_step": 430483, "epoch": 5186} {"train_loss": -27.14689064025879, "global_step": 430484, "epoch": 5186} {"train_loss": -27.140716552734375, "global_step": 430485, "epoch": 5186} {"train_loss": -26.75271987915039, "global_step": 430486, "epoch": 5186} {"train_loss": -27.090911865234375, "global_step": 430487, "epoch": 5186} {"train_loss": -26.692657470703125, "global_step": 430488, "epoch": 5186} {"train_loss": -26.80745506286621, "global_step": 430489, "epoch": 5186} {"train_loss": -27.04351234436035, "global_step": 430490, "epoch": 5186} {"train_loss": -27.022846221923828, "global_step": 430491, "epoch": 5186} {"train_loss": -27.273880004882812, "global_step": 430492, "epoch": 5186} {"train_loss": -26.92618179321289, "global_step": 430493, "epoch": 5186} {"train_loss": -27.170080184936523, "global_step": 430494, "epoch": 5186} {"train_loss": -27.071699142456055, "global_step": 430495, "epoch": 5186} {"train_loss": -27.26641845703125, "global_step": 430496, "epoch": 5186} {"train_loss": -27.334264755249023, "global_step": 430497, "epoch": 5186} {"train_loss": -26.809782028198242, "global_step": 430498, "epoch": 5186} {"train_loss": -27.062646865844727, "global_step": 430499, "epoch": 5186} {"train_loss": -26.889392852783203, "global_step": 430500, "epoch": 5186} {"train_loss": -26.85934829711914, "global_step": 430501, "epoch": 5186} {"train_loss": -26.659910202026367, "global_step": 430502, "epoch": 5186} {"train_loss": -26.806196212768555, "global_step": 430503, "epoch": 5186} {"train_loss": -26.998046875, "global_step": 430504, "epoch": 5186} {"train_loss": -27.192310333251953, "global_step": 430505, "epoch": 5186} {"train_loss": -27.047286987304688, "global_step": 430506, "epoch": 5186} {"train_loss": -27.233240127563477, "global_step": 430507, "epoch": 5186} {"train_loss": -27.163816452026367, "global_step": 430508, "epoch": 5186} {"train_loss": -26.90162467956543, "global_step": 430509, "epoch": 5186} {"train_loss": -26.993762969970703, "global_step": 430510, "epoch": 5186} {"train_loss": -27.36555290222168, "global_step": 430511, "epoch": 5186} {"train_loss": -27.086292266845703, "global_step": 430512, "epoch": 5186} {"train_loss": -26.966577529907227, "global_step": 430513, "epoch": 5186} {"train_loss": -27.31766128540039, "global_step": 430514, "epoch": 5186} {"train_loss": -27.09541130065918, "global_step": 430515, "epoch": 5186} {"train_loss": -27.4467830657959, "global_step": 430516, "epoch": 5186} {"train_loss": -27.29473304748535, "global_step": 430517, "epoch": 5186} {"train_loss": -26.93415641784668, "global_step": 430518, "epoch": 5186} {"train_loss": -26.701704025268555, "global_step": 430519, "epoch": 5186} {"train_loss": -26.90843099571136, "global_step": 430520, "epoch": 5186, "val_loss": 6680326.0} {"train_loss": -25.927932739257812, "global_step": 430521, "epoch": 5187} {"train_loss": -25.28135871887207, "global_step": 430522, "epoch": 5187} {"train_loss": -23.7998046875, "global_step": 430523, "epoch": 5187} {"train_loss": -25.025747299194336, "global_step": 430524, "epoch": 5187} {"train_loss": -25.99861717224121, "global_step": 430525, "epoch": 5187} {"train_loss": -24.076051712036133, "global_step": 430526, "epoch": 5187} {"train_loss": -25.704334259033203, "global_step": 430527, "epoch": 5187} {"train_loss": -25.31916618347168, "global_step": 430528, "epoch": 5187} {"train_loss": -25.959491729736328, "global_step": 430529, "epoch": 5187} {"train_loss": -25.793710708618164, "global_step": 430530, "epoch": 5187} {"train_loss": -26.220062255859375, "global_step": 430531, "epoch": 5187} {"train_loss": -26.505125045776367, "global_step": 430532, "epoch": 5187} {"train_loss": -25.59535026550293, "global_step": 430533, "epoch": 5187} {"train_loss": -25.879703521728516, "global_step": 430534, "epoch": 5187} {"train_loss": -26.15018081665039, "global_step": 430535, "epoch": 5187} {"train_loss": -26.042280197143555, "global_step": 430536, "epoch": 5187} {"train_loss": -26.457691192626953, "global_step": 430537, "epoch": 5187} {"train_loss": -26.389490127563477, "global_step": 430538, "epoch": 5187} {"train_loss": -26.129199981689453, "global_step": 430539, "epoch": 5187} {"train_loss": -26.483373641967773, "global_step": 430540, "epoch": 5187} {"train_loss": -26.08684730529785, "global_step": 430541, "epoch": 5187} {"train_loss": -26.637033462524414, "global_step": 430542, "epoch": 5187} {"train_loss": -26.162946701049805, "global_step": 430543, "epoch": 5187} {"train_loss": -26.38258171081543, "global_step": 430544, "epoch": 5187} {"train_loss": -26.232135772705078, "global_step": 430545, "epoch": 5187} {"train_loss": -26.370853424072266, "global_step": 430546, "epoch": 5187} {"train_loss": -26.522001266479492, "global_step": 430547, "epoch": 5187} {"train_loss": -26.073713302612305, "global_step": 430548, "epoch": 5187} {"train_loss": -26.386938095092773, "global_step": 430549, "epoch": 5187} {"train_loss": -26.411273956298828, "global_step": 430550, "epoch": 5187} {"train_loss": -26.42254066467285, "global_step": 430551, "epoch": 5187} {"train_loss": -26.300765991210938, "global_step": 430552, "epoch": 5187} {"train_loss": -27.033737182617188, "global_step": 430553, "epoch": 5187} {"train_loss": -26.595413208007812, "global_step": 430554, "epoch": 5187} {"train_loss": -26.58125114440918, "global_step": 430555, "epoch": 5187} {"train_loss": -26.554397583007812, "global_step": 430556, "epoch": 5187} {"train_loss": -26.573877334594727, "global_step": 430557, "epoch": 5187} {"train_loss": -26.402578353881836, "global_step": 430558, "epoch": 5187} {"train_loss": -26.479877471923828, "global_step": 430559, "epoch": 5187} {"train_loss": -26.381153106689453, "global_step": 430560, "epoch": 5187} {"train_loss": -26.670804977416992, "global_step": 430561, "epoch": 5187} {"train_loss": -26.896677017211914, "global_step": 430562, "epoch": 5187} {"train_loss": -26.66920280456543, "global_step": 430563, "epoch": 5187} {"train_loss": -26.614439010620117, "global_step": 430564, "epoch": 5187} {"train_loss": -26.6177921295166, "global_step": 430565, "epoch": 5187} {"train_loss": -26.66388511657715, "global_step": 430566, "epoch": 5187} {"train_loss": -26.812711715698242, "global_step": 430567, "epoch": 5187} {"train_loss": -26.766977310180664, "global_step": 430568, "epoch": 5187} {"train_loss": -26.6804141998291, "global_step": 430569, "epoch": 5187} {"train_loss": -26.835729598999023, "global_step": 430570, "epoch": 5187} {"train_loss": -26.545883178710938, "global_step": 430571, "epoch": 5187} {"train_loss": -26.941974639892578, "global_step": 430572, "epoch": 5187} {"train_loss": -27.077198028564453, "global_step": 430573, "epoch": 5187} {"train_loss": -26.390216827392578, "global_step": 430574, "epoch": 5187} {"train_loss": -26.583425521850586, "global_step": 430575, "epoch": 5187} {"train_loss": -26.8552303314209, "global_step": 430576, "epoch": 5187} {"train_loss": -26.603256225585938, "global_step": 430577, "epoch": 5187} {"train_loss": -26.546689987182617, "global_step": 430578, "epoch": 5187} {"train_loss": -26.92915916442871, "global_step": 430579, "epoch": 5187} {"train_loss": -26.601181030273438, "global_step": 430580, "epoch": 5187} {"train_loss": -27.1792049407959, "global_step": 430581, "epoch": 5187} {"train_loss": -26.670515060424805, "global_step": 430582, "epoch": 5187} {"train_loss": -26.565006256103516, "global_step": 430583, "epoch": 5187} {"train_loss": -26.09120750427246, "global_step": 430584, "epoch": 5187} {"train_loss": -26.709753036499023, "global_step": 430585, "epoch": 5187} {"train_loss": -26.89578628540039, "global_step": 430586, "epoch": 5187} {"train_loss": -26.713178634643555, "global_step": 430587, "epoch": 5187} {"train_loss": -26.961069107055664, "global_step": 430588, "epoch": 5187} {"train_loss": -26.68311882019043, "global_step": 430589, "epoch": 5187} {"train_loss": -26.92624855041504, "global_step": 430590, "epoch": 5187} {"train_loss": -27.2783145904541, "global_step": 430591, "epoch": 5187} {"train_loss": -26.940698623657227, "global_step": 430592, "epoch": 5187} {"train_loss": -26.98068618774414, "global_step": 430593, "epoch": 5187} {"train_loss": -26.744892120361328, "global_step": 430594, "epoch": 5187} {"train_loss": -26.597036361694336, "global_step": 430595, "epoch": 5187} {"train_loss": -26.69556999206543, "global_step": 430596, "epoch": 5187} {"train_loss": -27.010629653930664, "global_step": 430597, "epoch": 5187} {"train_loss": -26.949176788330078, "global_step": 430598, "epoch": 5187} {"train_loss": -27.266454696655273, "global_step": 430599, "epoch": 5187} {"train_loss": -26.96388816833496, "global_step": 430600, "epoch": 5187} {"train_loss": -27.002975463867188, "global_step": 430601, "epoch": 5187} {"train_loss": -27.014892578125, "global_step": 430602, "epoch": 5187} {"train_loss": -26.449419458228423, "global_step": 430603, "epoch": 5187, "val_loss": 6600092.0} {"train_loss": -26.9724063873291, "global_step": 430604, "epoch": 5188} {"train_loss": -26.7043514251709, "global_step": 430605, "epoch": 5188} {"train_loss": -26.970306396484375, "global_step": 430606, "epoch": 5188} {"train_loss": -26.677133560180664, "global_step": 430607, "epoch": 5188} {"train_loss": -26.861066818237305, "global_step": 430608, "epoch": 5188} {"train_loss": -26.51326560974121, "global_step": 430609, "epoch": 5188} {"train_loss": -26.36319923400879, "global_step": 430610, "epoch": 5188} {"train_loss": -26.458038330078125, "global_step": 430611, "epoch": 5188} {"train_loss": -26.271209716796875, "global_step": 430612, "epoch": 5188} {"train_loss": -26.81977653503418, "global_step": 430613, "epoch": 5188} {"train_loss": -26.75929069519043, "global_step": 430614, "epoch": 5188} {"train_loss": -26.76765251159668, "global_step": 430615, "epoch": 5188} {"train_loss": -26.857410430908203, "global_step": 430616, "epoch": 5188} {"train_loss": -26.78340721130371, "global_step": 430617, "epoch": 5188} {"train_loss": -26.908124923706055, "global_step": 430618, "epoch": 5188} {"train_loss": -26.724227905273438, "global_step": 430619, "epoch": 5188} {"train_loss": -26.8923282623291, "global_step": 430620, "epoch": 5188} {"train_loss": -27.066831588745117, "global_step": 430621, "epoch": 5188} {"train_loss": -27.079919815063477, "global_step": 430622, "epoch": 5188} {"train_loss": -26.982574462890625, "global_step": 430623, "epoch": 5188} {"train_loss": -26.830245971679688, "global_step": 430624, "epoch": 5188} {"train_loss": -26.71222496032715, "global_step": 430625, "epoch": 5188} {"train_loss": -27.26614761352539, "global_step": 430626, "epoch": 5188} {"train_loss": -27.380422592163086, "global_step": 430627, "epoch": 5188} {"train_loss": -26.699609756469727, "global_step": 430628, "epoch": 5188} {"train_loss": -26.973669052124023, "global_step": 430629, "epoch": 5188} {"train_loss": -27.102405548095703, "global_step": 430630, "epoch": 5188} {"train_loss": -27.3240909576416, "global_step": 430631, "epoch": 5188} {"train_loss": -26.984542846679688, "global_step": 430632, "epoch": 5188} {"train_loss": -27.336637496948242, "global_step": 430633, "epoch": 5188} {"train_loss": -27.109607696533203, "global_step": 430634, "epoch": 5188} {"train_loss": -27.00286293029785, "global_step": 430635, "epoch": 5188} {"train_loss": -27.274866104125977, "global_step": 430636, "epoch": 5188} {"train_loss": -26.91770362854004, "global_step": 430637, "epoch": 5188} {"train_loss": -26.6556339263916, "global_step": 430638, "epoch": 5188} {"train_loss": -26.86099624633789, "global_step": 430639, "epoch": 5188} {"train_loss": -27.087446212768555, "global_step": 430640, "epoch": 5188} {"train_loss": -26.793806076049805, "global_step": 430641, "epoch": 5188} {"train_loss": -26.70063591003418, "global_step": 430642, "epoch": 5188} {"train_loss": -27.1013240814209, "global_step": 430643, "epoch": 5188} {"train_loss": -26.851633071899414, "global_step": 430644, "epoch": 5188} {"train_loss": -26.4742374420166, "global_step": 430645, "epoch": 5188} {"train_loss": -26.235645294189453, "global_step": 430646, "epoch": 5188} {"train_loss": -26.136999130249023, "global_step": 430647, "epoch": 5188} {"train_loss": -26.002887725830078, "global_step": 430648, "epoch": 5188} {"train_loss": -26.98640251159668, "global_step": 430649, "epoch": 5188} {"train_loss": -27.058923721313477, "global_step": 430650, "epoch": 5188} {"train_loss": -26.83880615234375, "global_step": 430651, "epoch": 5188} {"train_loss": -26.79526710510254, "global_step": 430652, "epoch": 5188} {"train_loss": -26.6964111328125, "global_step": 430653, "epoch": 5188} {"train_loss": -26.97477149963379, "global_step": 430654, "epoch": 5188} {"train_loss": -26.6938533782959, "global_step": 430655, "epoch": 5188} {"train_loss": -27.172138214111328, "global_step": 430656, "epoch": 5188} {"train_loss": -27.07391929626465, "global_step": 430657, "epoch": 5188} {"train_loss": -26.9859561920166, "global_step": 430658, "epoch": 5188} {"train_loss": -26.68609046936035, "global_step": 430659, "epoch": 5188} {"train_loss": -26.810455322265625, "global_step": 430660, "epoch": 5188} {"train_loss": -27.139938354492188, "global_step": 430661, "epoch": 5188} {"train_loss": -26.55219078063965, "global_step": 430662, "epoch": 5188} {"train_loss": -27.156564712524414, "global_step": 430663, "epoch": 5188} {"train_loss": -26.8468074798584, "global_step": 430664, "epoch": 5188} {"train_loss": -27.189151763916016, "global_step": 430665, "epoch": 5188} {"train_loss": -26.986072540283203, "global_step": 430666, "epoch": 5188} {"train_loss": -26.967416763305664, "global_step": 430667, "epoch": 5188} {"train_loss": -27.10554313659668, "global_step": 430668, "epoch": 5188} {"train_loss": -27.2905216217041, "global_step": 430669, "epoch": 5188} {"train_loss": -26.783594131469727, "global_step": 430670, "epoch": 5188} {"train_loss": -27.037281036376953, "global_step": 430671, "epoch": 5188} {"train_loss": -26.799970626831055, "global_step": 430672, "epoch": 5188} {"train_loss": -27.04884147644043, "global_step": 430673, "epoch": 5188} {"train_loss": -27.272785186767578, "global_step": 430674, "epoch": 5188} {"train_loss": -27.087915420532227, "global_step": 430675, "epoch": 5188} {"train_loss": -26.995914459228516, "global_step": 430676, "epoch": 5188} {"train_loss": -26.560400009155273, "global_step": 430677, "epoch": 5188} {"train_loss": -27.200437545776367, "global_step": 430678, "epoch": 5188} {"train_loss": -27.431537628173828, "global_step": 430679, "epoch": 5188} {"train_loss": -27.079687118530273, "global_step": 430680, "epoch": 5188} {"train_loss": -27.0739688873291, "global_step": 430681, "epoch": 5188} {"train_loss": -27.016218185424805, "global_step": 430682, "epoch": 5188} {"train_loss": -27.184247970581055, "global_step": 430683, "epoch": 5188} {"train_loss": -26.903348922729492, "global_step": 430684, "epoch": 5188} {"train_loss": -27.06245231628418, "global_step": 430685, "epoch": 5188} {"train_loss": -26.91637581515025, "global_step": 430686, "epoch": 5188, "val_loss": 6647571.0} {"train_loss": -26.492023468017578, "global_step": 430687, "epoch": 5189} {"train_loss": -25.272153854370117, "global_step": 430688, "epoch": 5189} {"train_loss": -25.032079696655273, "global_step": 430689, "epoch": 5189} {"train_loss": -25.358999252319336, "global_step": 430690, "epoch": 5189} {"train_loss": -25.199848175048828, "global_step": 430691, "epoch": 5189} {"train_loss": -25.63311767578125, "global_step": 430692, "epoch": 5189} {"train_loss": -25.546222686767578, "global_step": 430693, "epoch": 5189} {"train_loss": -26.29866600036621, "global_step": 430694, "epoch": 5189} {"train_loss": -25.592355728149414, "global_step": 430695, "epoch": 5189} {"train_loss": -25.752857208251953, "global_step": 430696, "epoch": 5189} {"train_loss": -26.1922550201416, "global_step": 430697, "epoch": 5189} {"train_loss": -26.033771514892578, "global_step": 430698, "epoch": 5189} {"train_loss": -26.22892189025879, "global_step": 430699, "epoch": 5189} {"train_loss": -26.347564697265625, "global_step": 430700, "epoch": 5189} {"train_loss": -26.511728286743164, "global_step": 430701, "epoch": 5189} {"train_loss": -26.51606559753418, "global_step": 430702, "epoch": 5189} {"train_loss": -26.34360694885254, "global_step": 430703, "epoch": 5189} {"train_loss": -25.962421417236328, "global_step": 430704, "epoch": 5189} {"train_loss": -26.53388023376465, "global_step": 430705, "epoch": 5189} {"train_loss": -26.344818115234375, "global_step": 430706, "epoch": 5189} {"train_loss": -26.444467544555664, "global_step": 430707, "epoch": 5189} {"train_loss": -26.961246490478516, "global_step": 430708, "epoch": 5189} {"train_loss": -26.615880966186523, "global_step": 430709, "epoch": 5189} {"train_loss": -26.646642684936523, "global_step": 430710, "epoch": 5189} {"train_loss": -26.950281143188477, "global_step": 430711, "epoch": 5189} {"train_loss": -26.41413688659668, "global_step": 430712, "epoch": 5189} {"train_loss": -26.722265243530273, "global_step": 430713, "epoch": 5189} {"train_loss": -27.01202392578125, "global_step": 430714, "epoch": 5189} {"train_loss": -26.69534683227539, "global_step": 430715, "epoch": 5189} {"train_loss": -26.729429244995117, "global_step": 430716, "epoch": 5189} {"train_loss": -26.828937530517578, "global_step": 430717, "epoch": 5189} {"train_loss": -27.063085556030273, "global_step": 430718, "epoch": 5189} {"train_loss": -27.025863647460938, "global_step": 430719, "epoch": 5189} {"train_loss": -27.102401733398438, "global_step": 430720, "epoch": 5189} {"train_loss": -27.012842178344727, "global_step": 430721, "epoch": 5189} {"train_loss": -26.913923263549805, "global_step": 430722, "epoch": 5189} {"train_loss": -26.56292152404785, "global_step": 430723, "epoch": 5189} {"train_loss": -26.739990234375, "global_step": 430724, "epoch": 5189} {"train_loss": -26.857498168945312, "global_step": 430725, "epoch": 5189} {"train_loss": -26.830432891845703, "global_step": 430726, "epoch": 5189} {"train_loss": -26.996244430541992, "global_step": 430727, "epoch": 5189} {"train_loss": -27.072336196899414, "global_step": 430728, "epoch": 5189} {"train_loss": -27.123641967773438, "global_step": 430729, "epoch": 5189} {"train_loss": -27.22800064086914, "global_step": 430730, "epoch": 5189} {"train_loss": -27.23197364807129, "global_step": 430731, "epoch": 5189} {"train_loss": -27.046201705932617, "global_step": 430732, "epoch": 5189} {"train_loss": -26.701658248901367, "global_step": 430733, "epoch": 5189} {"train_loss": -27.00982666015625, "global_step": 430734, "epoch": 5189} {"train_loss": -27.436450958251953, "global_step": 430735, "epoch": 5189} {"train_loss": -26.842554092407227, "global_step": 430736, "epoch": 5189} {"train_loss": -26.99915885925293, "global_step": 430737, "epoch": 5189} {"train_loss": -27.21697425842285, "global_step": 430738, "epoch": 5189} {"train_loss": -27.189849853515625, "global_step": 430739, "epoch": 5189} {"train_loss": -27.049596786499023, "global_step": 430740, "epoch": 5189} {"train_loss": -27.122297286987305, "global_step": 430741, "epoch": 5189} {"train_loss": -27.12503433227539, "global_step": 430742, "epoch": 5189} {"train_loss": -26.996179580688477, "global_step": 430743, "epoch": 5189} {"train_loss": -26.733123779296875, "global_step": 430744, "epoch": 5189} {"train_loss": -26.989587783813477, "global_step": 430745, "epoch": 5189} {"train_loss": -27.13468360900879, "global_step": 430746, "epoch": 5189} {"train_loss": -27.057281494140625, "global_step": 430747, "epoch": 5189} {"train_loss": -26.372116088867188, "global_step": 430748, "epoch": 5189} {"train_loss": -26.765050888061523, "global_step": 430749, "epoch": 5189} {"train_loss": -26.26458740234375, "global_step": 430750, "epoch": 5189} {"train_loss": -26.72954750061035, "global_step": 430751, "epoch": 5189} {"train_loss": -27.026554107666016, "global_step": 430752, "epoch": 5189} {"train_loss": -26.982425689697266, "global_step": 430753, "epoch": 5189} {"train_loss": -27.01444435119629, "global_step": 430754, "epoch": 5189} {"train_loss": -26.69831657409668, "global_step": 430755, "epoch": 5189} {"train_loss": -26.856143951416016, "global_step": 430756, "epoch": 5189} {"train_loss": -26.5494384765625, "global_step": 430757, "epoch": 5189} {"train_loss": -26.636920928955078, "global_step": 430758, "epoch": 5189} {"train_loss": -27.063922882080078, "global_step": 430759, "epoch": 5189} {"train_loss": -26.824756622314453, "global_step": 430760, "epoch": 5189} {"train_loss": -26.850622177124023, "global_step": 430761, "epoch": 5189} {"train_loss": -27.1522159576416, "global_step": 430762, "epoch": 5189} {"train_loss": -26.698196411132812, "global_step": 430763, "epoch": 5189} {"train_loss": -26.832311630249023, "global_step": 430764, "epoch": 5189} {"train_loss": -26.790586471557617, "global_step": 430765, "epoch": 5189} {"train_loss": -26.96302604675293, "global_step": 430766, "epoch": 5189} {"train_loss": -26.94368553161621, "global_step": 430767, "epoch": 5189} {"train_loss": -26.965625762939453, "global_step": 430768, "epoch": 5189} {"train_loss": -26.66727008589779, "global_step": 430769, "epoch": 5189, "val_loss": 6855048.0} {"train_loss": -25.962949752807617, "global_step": 430770, "epoch": 5190} {"train_loss": -26.528284072875977, "global_step": 430771, "epoch": 5190} {"train_loss": -26.123249053955078, "global_step": 430772, "epoch": 5190} {"train_loss": -26.44740104675293, "global_step": 430773, "epoch": 5190} {"train_loss": -26.12579345703125, "global_step": 430774, "epoch": 5190} {"train_loss": -26.597768783569336, "global_step": 430775, "epoch": 5190} {"train_loss": -26.358001708984375, "global_step": 430776, "epoch": 5190} {"train_loss": -26.430830001831055, "global_step": 430777, "epoch": 5190} {"train_loss": -26.01507568359375, "global_step": 430778, "epoch": 5190} {"train_loss": -26.940885543823242, "global_step": 430779, "epoch": 5190} {"train_loss": -26.81244468688965, "global_step": 430780, "epoch": 5190} {"train_loss": -25.945951461791992, "global_step": 430781, "epoch": 5190} {"train_loss": -26.410388946533203, "global_step": 430782, "epoch": 5190} {"train_loss": -26.534656524658203, "global_step": 430783, "epoch": 5190} {"train_loss": -26.549091339111328, "global_step": 430784, "epoch": 5190} {"train_loss": -26.735721588134766, "global_step": 430785, "epoch": 5190} {"train_loss": -26.729650497436523, "global_step": 430786, "epoch": 5190} {"train_loss": -26.398115158081055, "global_step": 430787, "epoch": 5190} {"train_loss": -26.672903060913086, "global_step": 430788, "epoch": 5190} {"train_loss": -26.902679443359375, "global_step": 430789, "epoch": 5190} {"train_loss": -26.570505142211914, "global_step": 430790, "epoch": 5190} {"train_loss": -26.51862144470215, "global_step": 430791, "epoch": 5190} {"train_loss": -26.834091186523438, "global_step": 430792, "epoch": 5190} {"train_loss": -26.864904403686523, "global_step": 430793, "epoch": 5190} {"train_loss": -26.654438018798828, "global_step": 430794, "epoch": 5190} {"train_loss": -26.7657413482666, "global_step": 430795, "epoch": 5190} {"train_loss": -27.163745880126953, "global_step": 430796, "epoch": 5190} {"train_loss": -26.732328414916992, "global_step": 430797, "epoch": 5190} {"train_loss": -26.839330673217773, "global_step": 430798, "epoch": 5190} {"train_loss": -26.825164794921875, "global_step": 430799, "epoch": 5190} {"train_loss": -26.72297477722168, "global_step": 430800, "epoch": 5190} {"train_loss": -26.637556076049805, "global_step": 430801, "epoch": 5190} {"train_loss": -27.19489860534668, "global_step": 430802, "epoch": 5190} {"train_loss": -26.8448486328125, "global_step": 430803, "epoch": 5190} {"train_loss": -26.90352439880371, "global_step": 430804, "epoch": 5190} {"train_loss": -26.88174819946289, "global_step": 430805, "epoch": 5190} {"train_loss": -26.750574111938477, "global_step": 430806, "epoch": 5190} {"train_loss": -27.124746322631836, "global_step": 430807, "epoch": 5190} {"train_loss": -26.557538986206055, "global_step": 430808, "epoch": 5190} {"train_loss": -26.87550163269043, "global_step": 430809, "epoch": 5190} {"train_loss": -27.162322998046875, "global_step": 430810, "epoch": 5190} {"train_loss": -26.977209091186523, "global_step": 430811, "epoch": 5190} {"train_loss": -26.99654197692871, "global_step": 430812, "epoch": 5190} {"train_loss": -27.05826187133789, "global_step": 430813, "epoch": 5190} {"train_loss": -27.1806583404541, "global_step": 430814, "epoch": 5190} {"train_loss": -27.0932674407959, "global_step": 430815, "epoch": 5190} {"train_loss": -27.0125732421875, "global_step": 430816, "epoch": 5190} {"train_loss": -26.969568252563477, "global_step": 430817, "epoch": 5190} {"train_loss": -26.832563400268555, "global_step": 430818, "epoch": 5190} {"train_loss": -27.005517959594727, "global_step": 430819, "epoch": 5190} {"train_loss": -26.878082275390625, "global_step": 430820, "epoch": 5190} {"train_loss": -27.005599975585938, "global_step": 430821, "epoch": 5190} {"train_loss": -27.068952560424805, "global_step": 430822, "epoch": 5190} {"train_loss": -27.02650260925293, "global_step": 430823, "epoch": 5190} {"train_loss": -27.27376365661621, "global_step": 430824, "epoch": 5190} {"train_loss": -26.906965255737305, "global_step": 430825, "epoch": 5190} {"train_loss": -26.576589584350586, "global_step": 430826, "epoch": 5190} {"train_loss": -26.906787872314453, "global_step": 430827, "epoch": 5190} {"train_loss": -26.7004337310791, "global_step": 430828, "epoch": 5190} {"train_loss": -26.985580444335938, "global_step": 430829, "epoch": 5190} {"train_loss": -26.74201774597168, "global_step": 430830, "epoch": 5190} {"train_loss": -27.0278377532959, "global_step": 430831, "epoch": 5190} {"train_loss": -27.05942153930664, "global_step": 430832, "epoch": 5190} {"train_loss": -26.77640724182129, "global_step": 430833, "epoch": 5190} {"train_loss": -26.93291664123535, "global_step": 430834, "epoch": 5190} {"train_loss": -26.751850128173828, "global_step": 430835, "epoch": 5190} {"train_loss": -26.42783546447754, "global_step": 430836, "epoch": 5190} {"train_loss": -26.8077335357666, "global_step": 430837, "epoch": 5190} {"train_loss": -26.84345054626465, "global_step": 430838, "epoch": 5190} {"train_loss": -26.689655303955078, "global_step": 430839, "epoch": 5190} {"train_loss": -27.4864444732666, "global_step": 430840, "epoch": 5190} {"train_loss": -27.230314254760742, "global_step": 430841, "epoch": 5190} {"train_loss": -26.625967025756836, "global_step": 430842, "epoch": 5190} {"train_loss": -26.932836532592773, "global_step": 430843, "epoch": 5190} {"train_loss": -27.061277389526367, "global_step": 430844, "epoch": 5190} {"train_loss": -27.063846588134766, "global_step": 430845, "epoch": 5190} {"train_loss": -27.233652114868164, "global_step": 430846, "epoch": 5190} {"train_loss": -26.689361572265625, "global_step": 430847, "epoch": 5190} {"train_loss": -26.731369018554688, "global_step": 430848, "epoch": 5190} {"train_loss": -26.8492488861084, "global_step": 430849, "epoch": 5190} {"train_loss": -26.467451095581055, "global_step": 430850, "epoch": 5190} {"train_loss": -26.972564697265625, "global_step": 430851, "epoch": 5190} {"train_loss": -26.807320307536298, "global_step": 430852, "epoch": 5190, "val_loss": 6724219.0} {"train_loss": -23.94623565673828, "global_step": 430853, "epoch": 5191} {"train_loss": -26.107166290283203, "global_step": 430854, "epoch": 5191} {"train_loss": -25.287372589111328, "global_step": 430855, "epoch": 5191} {"train_loss": -25.856115341186523, "global_step": 430856, "epoch": 5191} {"train_loss": -25.526132583618164, "global_step": 430857, "epoch": 5191} {"train_loss": -26.031293869018555, "global_step": 430858, "epoch": 5191} {"train_loss": -25.640180587768555, "global_step": 430859, "epoch": 5191} {"train_loss": -26.129247665405273, "global_step": 430860, "epoch": 5191} {"train_loss": -26.004993438720703, "global_step": 430861, "epoch": 5191} {"train_loss": -26.481298446655273, "global_step": 430862, "epoch": 5191} {"train_loss": -26.005399703979492, "global_step": 430863, "epoch": 5191} {"train_loss": -26.14703369140625, "global_step": 430864, "epoch": 5191} {"train_loss": -26.22174072265625, "global_step": 430865, "epoch": 5191} {"train_loss": -26.436365127563477, "global_step": 430866, "epoch": 5191} {"train_loss": -26.456180572509766, "global_step": 430867, "epoch": 5191} {"train_loss": -26.38848304748535, "global_step": 430868, "epoch": 5191} {"train_loss": -26.478025436401367, "global_step": 430869, "epoch": 5191} {"train_loss": -26.199243545532227, "global_step": 430870, "epoch": 5191} {"train_loss": -26.903181076049805, "global_step": 430871, "epoch": 5191} {"train_loss": -26.272397994995117, "global_step": 430872, "epoch": 5191} {"train_loss": -26.6214599609375, "global_step": 430873, "epoch": 5191} {"train_loss": -26.589590072631836, "global_step": 430874, "epoch": 5191} {"train_loss": -26.35023307800293, "global_step": 430875, "epoch": 5191} {"train_loss": -26.611364364624023, "global_step": 430876, "epoch": 5191} {"train_loss": -26.745004653930664, "global_step": 430877, "epoch": 5191} {"train_loss": -26.56276512145996, "global_step": 430878, "epoch": 5191} {"train_loss": -26.74544334411621, "global_step": 430879, "epoch": 5191} {"train_loss": -26.961408615112305, "global_step": 430880, "epoch": 5191} {"train_loss": -26.568572998046875, "global_step": 430881, "epoch": 5191} {"train_loss": -26.941808700561523, "global_step": 430882, "epoch": 5191} {"train_loss": -26.740863800048828, "global_step": 430883, "epoch": 5191} {"train_loss": -26.810956954956055, "global_step": 430884, "epoch": 5191} {"train_loss": -26.699743270874023, "global_step": 430885, "epoch": 5191} {"train_loss": -26.680877685546875, "global_step": 430886, "epoch": 5191} {"train_loss": -27.022785186767578, "global_step": 430887, "epoch": 5191} {"train_loss": -26.672149658203125, "global_step": 430888, "epoch": 5191} {"train_loss": -26.851367950439453, "global_step": 430889, "epoch": 5191} {"train_loss": -26.88861656188965, "global_step": 430890, "epoch": 5191} {"train_loss": -27.090620040893555, "global_step": 430891, "epoch": 5191} {"train_loss": -27.20125389099121, "global_step": 430892, "epoch": 5191} {"train_loss": -26.931812286376953, "global_step": 430893, "epoch": 5191} {"train_loss": -27.042749404907227, "global_step": 430894, "epoch": 5191} {"train_loss": -26.805774688720703, "global_step": 430895, "epoch": 5191} {"train_loss": -27.119892120361328, "global_step": 430896, "epoch": 5191} {"train_loss": -26.920751571655273, "global_step": 430897, "epoch": 5191} {"train_loss": -26.567182540893555, "global_step": 430898, "epoch": 5191} {"train_loss": -26.77020263671875, "global_step": 430899, "epoch": 5191} {"train_loss": -26.651891708374023, "global_step": 430900, "epoch": 5191} {"train_loss": -27.104822158813477, "global_step": 430901, "epoch": 5191} {"train_loss": -27.083026885986328, "global_step": 430902, "epoch": 5191} {"train_loss": -27.120267868041992, "global_step": 430903, "epoch": 5191} {"train_loss": -26.835500717163086, "global_step": 430904, "epoch": 5191} {"train_loss": -27.348724365234375, "global_step": 430905, "epoch": 5191} {"train_loss": -26.61366081237793, "global_step": 430906, "epoch": 5191} {"train_loss": -26.623991012573242, "global_step": 430907, "epoch": 5191} {"train_loss": -26.78375816345215, "global_step": 430908, "epoch": 5191} {"train_loss": -26.513092041015625, "global_step": 430909, "epoch": 5191} {"train_loss": -27.034637451171875, "global_step": 430910, "epoch": 5191} {"train_loss": -26.942245483398438, "global_step": 430911, "epoch": 5191} {"train_loss": -26.744094848632812, "global_step": 430912, "epoch": 5191} {"train_loss": -26.77248191833496, "global_step": 430913, "epoch": 5191} {"train_loss": -26.42860221862793, "global_step": 430914, "epoch": 5191} {"train_loss": -26.828222274780273, "global_step": 430915, "epoch": 5191} {"train_loss": -26.978384017944336, "global_step": 430916, "epoch": 5191} {"train_loss": -26.874664306640625, "global_step": 430917, "epoch": 5191} {"train_loss": -26.893543243408203, "global_step": 430918, "epoch": 5191} {"train_loss": -27.1455020904541, "global_step": 430919, "epoch": 5191} {"train_loss": -27.15785026550293, "global_step": 430920, "epoch": 5191} {"train_loss": -27.040735244750977, "global_step": 430921, "epoch": 5191} {"train_loss": -26.61746597290039, "global_step": 430922, "epoch": 5191} {"train_loss": -26.886030197143555, "global_step": 430923, "epoch": 5191} {"train_loss": -26.742002487182617, "global_step": 430924, "epoch": 5191} {"train_loss": -27.160552978515625, "global_step": 430925, "epoch": 5191} {"train_loss": -27.149795532226562, "global_step": 430926, "epoch": 5191} {"train_loss": -26.68451499938965, "global_step": 430927, "epoch": 5191} {"train_loss": -27.252939224243164, "global_step": 430928, "epoch": 5191} {"train_loss": -26.56208610534668, "global_step": 430929, "epoch": 5191} {"train_loss": -26.794004440307617, "global_step": 430930, "epoch": 5191} {"train_loss": -26.841949462890625, "global_step": 430931, "epoch": 5191} {"train_loss": -27.092975616455078, "global_step": 430932, "epoch": 5191} {"train_loss": -27.104108810424805, "global_step": 430933, "epoch": 5191} {"train_loss": -27.219579696655273, "global_step": 430934, "epoch": 5191} {"train_loss": -26.67158708227686, "global_step": 430935, "epoch": 5191, "val_loss": 6759566.0} {"train_loss": -26.230798721313477, "global_step": 430936, "epoch": 5192} {"train_loss": -25.488670349121094, "global_step": 430937, "epoch": 5192} {"train_loss": -24.989238739013672, "global_step": 430938, "epoch": 5192} {"train_loss": -24.6785888671875, "global_step": 430939, "epoch": 5192} {"train_loss": -25.53995704650879, "global_step": 430940, "epoch": 5192} {"train_loss": -25.7535457611084, "global_step": 430941, "epoch": 5192} {"train_loss": -25.21400260925293, "global_step": 430942, "epoch": 5192} {"train_loss": -25.96512794494629, "global_step": 430943, "epoch": 5192} {"train_loss": -26.4070987701416, "global_step": 430944, "epoch": 5192} {"train_loss": -26.106794357299805, "global_step": 430945, "epoch": 5192} {"train_loss": -26.389545440673828, "global_step": 430946, "epoch": 5192} {"train_loss": -26.49275779724121, "global_step": 430947, "epoch": 5192} {"train_loss": -26.172399520874023, "global_step": 430948, "epoch": 5192} {"train_loss": -26.502628326416016, "global_step": 430949, "epoch": 5192} {"train_loss": -26.746129989624023, "global_step": 430950, "epoch": 5192} {"train_loss": -26.045026779174805, "global_step": 430951, "epoch": 5192} {"train_loss": -26.831144332885742, "global_step": 430952, "epoch": 5192} {"train_loss": -26.709716796875, "global_step": 430953, "epoch": 5192} {"train_loss": -26.725269317626953, "global_step": 430954, "epoch": 5192} {"train_loss": -26.00360107421875, "global_step": 430955, "epoch": 5192} {"train_loss": -26.5200138092041, "global_step": 430956, "epoch": 5192} {"train_loss": -26.746240615844727, "global_step": 430957, "epoch": 5192} {"train_loss": -26.660791397094727, "global_step": 430958, "epoch": 5192} {"train_loss": -26.957754135131836, "global_step": 430959, "epoch": 5192} {"train_loss": -26.818038940429688, "global_step": 430960, "epoch": 5192} {"train_loss": -26.5089054107666, "global_step": 430961, "epoch": 5192} {"train_loss": -26.770872116088867, "global_step": 430962, "epoch": 5192} {"train_loss": -26.804462432861328, "global_step": 430963, "epoch": 5192} {"train_loss": -26.8309383392334, "global_step": 430964, "epoch": 5192} {"train_loss": -26.69826316833496, "global_step": 430965, "epoch": 5192} {"train_loss": -26.614912033081055, "global_step": 430966, "epoch": 5192} {"train_loss": -26.594207763671875, "global_step": 430967, "epoch": 5192} {"train_loss": -26.926132202148438, "global_step": 430968, "epoch": 5192} {"train_loss": -27.224140167236328, "global_step": 430969, "epoch": 5192} {"train_loss": -27.143085479736328, "global_step": 430970, "epoch": 5192} {"train_loss": -26.927438735961914, "global_step": 430971, "epoch": 5192} {"train_loss": -27.23749351501465, "global_step": 430972, "epoch": 5192} {"train_loss": -26.64582633972168, "global_step": 430973, "epoch": 5192} {"train_loss": -26.913257598876953, "global_step": 430974, "epoch": 5192} {"train_loss": -27.324298858642578, "global_step": 430975, "epoch": 5192} {"train_loss": -27.119709014892578, "global_step": 430976, "epoch": 5192} {"train_loss": -26.9360294342041, "global_step": 430977, "epoch": 5192} {"train_loss": -26.99664306640625, "global_step": 430978, "epoch": 5192} {"train_loss": -27.283605575561523, "global_step": 430979, "epoch": 5192} {"train_loss": -26.90034294128418, "global_step": 430980, "epoch": 5192} {"train_loss": -27.17255210876465, "global_step": 430981, "epoch": 5192} {"train_loss": -26.863916397094727, "global_step": 430982, "epoch": 5192} {"train_loss": -27.264856338500977, "global_step": 430983, "epoch": 5192} {"train_loss": -27.137720108032227, "global_step": 430984, "epoch": 5192} {"train_loss": -26.941492080688477, "global_step": 430985, "epoch": 5192} {"train_loss": -26.340463638305664, "global_step": 430986, "epoch": 5192} {"train_loss": -26.63117027282715, "global_step": 430987, "epoch": 5192} {"train_loss": -26.860492706298828, "global_step": 430988, "epoch": 5192} {"train_loss": -27.1455135345459, "global_step": 430989, "epoch": 5192} {"train_loss": -27.087583541870117, "global_step": 430990, "epoch": 5192} {"train_loss": -27.185749053955078, "global_step": 430991, "epoch": 5192} {"train_loss": -27.047693252563477, "global_step": 430992, "epoch": 5192} {"train_loss": -27.048126220703125, "global_step": 430993, "epoch": 5192} {"train_loss": -26.980789184570312, "global_step": 430994, "epoch": 5192} {"train_loss": -27.197275161743164, "global_step": 430995, "epoch": 5192} {"train_loss": -26.675317764282227, "global_step": 430996, "epoch": 5192} {"train_loss": -26.990463256835938, "global_step": 430997, "epoch": 5192} {"train_loss": -27.2735595703125, "global_step": 430998, "epoch": 5192} {"train_loss": -26.973066329956055, "global_step": 430999, "epoch": 5192} {"train_loss": -26.638105392456055, "global_step": 431000, "epoch": 5192} {"train_loss": -27.007116317749023, "global_step": 431001, "epoch": 5192} {"train_loss": -26.838499069213867, "global_step": 431002, "epoch": 5192} {"train_loss": -26.719837188720703, "global_step": 431003, "epoch": 5192} {"train_loss": -26.683561325073242, "global_step": 431004, "epoch": 5192} {"train_loss": -26.4510498046875, "global_step": 431005, "epoch": 5192} {"train_loss": -26.525043487548828, "global_step": 431006, "epoch": 5192} {"train_loss": -26.490381240844727, "global_step": 431007, "epoch": 5192} {"train_loss": -25.419843673706055, "global_step": 431008, "epoch": 5192} {"train_loss": -24.790231704711914, "global_step": 431009, "epoch": 5192} {"train_loss": -25.372039794921875, "global_step": 431010, "epoch": 5192} {"train_loss": -26.64545249938965, "global_step": 431011, "epoch": 5192} {"train_loss": -26.591114044189453, "global_step": 431012, "epoch": 5192} {"train_loss": -26.4193172454834, "global_step": 431013, "epoch": 5192} {"train_loss": -26.5797061920166, "global_step": 431014, "epoch": 5192} {"train_loss": -26.285079956054688, "global_step": 431015, "epoch": 5192} {"train_loss": -26.36353874206543, "global_step": 431016, "epoch": 5192} {"train_loss": -26.77351188659668, "global_step": 431017, "epoch": 5192} {"train_loss": -26.591703667698138, "global_step": 431018, "epoch": 5192, "val_loss": 6713124.0} {"train_loss": -26.201391220092773, "global_step": 431019, "epoch": 5193} {"train_loss": -26.238632202148438, "global_step": 431020, "epoch": 5193} {"train_loss": -26.275405883789062, "global_step": 431021, "epoch": 5193} {"train_loss": -26.233386993408203, "global_step": 431022, "epoch": 5193} {"train_loss": -25.797300338745117, "global_step": 431023, "epoch": 5193} {"train_loss": -26.5510196685791, "global_step": 431024, "epoch": 5193} {"train_loss": -26.269428253173828, "global_step": 431025, "epoch": 5193} {"train_loss": -26.5047607421875, "global_step": 431026, "epoch": 5193} {"train_loss": -26.347742080688477, "global_step": 431027, "epoch": 5193} {"train_loss": -26.381778717041016, "global_step": 431028, "epoch": 5193} {"train_loss": -26.68768882751465, "global_step": 431029, "epoch": 5193} {"train_loss": -26.55695915222168, "global_step": 431030, "epoch": 5193} {"train_loss": -26.55826759338379, "global_step": 431031, "epoch": 5193} {"train_loss": -26.805749893188477, "global_step": 431032, "epoch": 5193} {"train_loss": -26.625064849853516, "global_step": 431033, "epoch": 5193} {"train_loss": -26.504505157470703, "global_step": 431034, "epoch": 5193} {"train_loss": -26.9898624420166, "global_step": 431035, "epoch": 5193} {"train_loss": -26.6595458984375, "global_step": 431036, "epoch": 5193} {"train_loss": -26.707122802734375, "global_step": 431037, "epoch": 5193} {"train_loss": -26.475854873657227, "global_step": 431038, "epoch": 5193} {"train_loss": -26.515588760375977, "global_step": 431039, "epoch": 5193} {"train_loss": -26.766889572143555, "global_step": 431040, "epoch": 5193} {"train_loss": -27.01570701599121, "global_step": 431041, "epoch": 5193} {"train_loss": -26.803680419921875, "global_step": 431042, "epoch": 5193} {"train_loss": -26.80677604675293, "global_step": 431043, "epoch": 5193} {"train_loss": -26.890710830688477, "global_step": 431044, "epoch": 5193} {"train_loss": -26.8150691986084, "global_step": 431045, "epoch": 5193} {"train_loss": -27.056842803955078, "global_step": 431046, "epoch": 5193} {"train_loss": -26.6314697265625, "global_step": 431047, "epoch": 5193} {"train_loss": -26.65650749206543, "global_step": 431048, "epoch": 5193} {"train_loss": -26.96624183654785, "global_step": 431049, "epoch": 5193} {"train_loss": -26.883237838745117, "global_step": 431050, "epoch": 5193} {"train_loss": -27.06083106994629, "global_step": 431051, "epoch": 5193} {"train_loss": -26.67218589782715, "global_step": 431052, "epoch": 5193} {"train_loss": -26.771595001220703, "global_step": 431053, "epoch": 5193} {"train_loss": -26.960742950439453, "global_step": 431054, "epoch": 5193} {"train_loss": -26.930646896362305, "global_step": 431055, "epoch": 5193} {"train_loss": -27.377063751220703, "global_step": 431056, "epoch": 5193} {"train_loss": -26.815549850463867, "global_step": 431057, "epoch": 5193} {"train_loss": -26.682575225830078, "global_step": 431058, "epoch": 5193} {"train_loss": -26.821313858032227, "global_step": 431059, "epoch": 5193} {"train_loss": -27.3427791595459, "global_step": 431060, "epoch": 5193} {"train_loss": -26.70697593688965, "global_step": 431061, "epoch": 5193} {"train_loss": -26.761823654174805, "global_step": 431062, "epoch": 5193} {"train_loss": -26.811664581298828, "global_step": 431063, "epoch": 5193} {"train_loss": -27.329553604125977, "global_step": 431064, "epoch": 5193} {"train_loss": -26.963809967041016, "global_step": 431065, "epoch": 5193} {"train_loss": -26.930526733398438, "global_step": 431066, "epoch": 5193} {"train_loss": -26.725732803344727, "global_step": 431067, "epoch": 5193} {"train_loss": -26.792404174804688, "global_step": 431068, "epoch": 5193} {"train_loss": -26.755374908447266, "global_step": 431069, "epoch": 5193} {"train_loss": -26.920862197875977, "global_step": 431070, "epoch": 5193} {"train_loss": -27.3995418548584, "global_step": 431071, "epoch": 5193} {"train_loss": -27.110950469970703, "global_step": 431072, "epoch": 5193} {"train_loss": -27.287521362304688, "global_step": 431073, "epoch": 5193} {"train_loss": -26.810224533081055, "global_step": 431074, "epoch": 5193} {"train_loss": -26.98084831237793, "global_step": 431075, "epoch": 5193} {"train_loss": -26.946752548217773, "global_step": 431076, "epoch": 5193} {"train_loss": -27.35232925415039, "global_step": 431077, "epoch": 5193} {"train_loss": -27.056669235229492, "global_step": 431078, "epoch": 5193} {"train_loss": -26.823583602905273, "global_step": 431079, "epoch": 5193} {"train_loss": -26.734228134155273, "global_step": 431080, "epoch": 5193} {"train_loss": -27.21624183654785, "global_step": 431081, "epoch": 5193} {"train_loss": -27.2082576751709, "global_step": 431082, "epoch": 5193} {"train_loss": -27.079328536987305, "global_step": 431083, "epoch": 5193} {"train_loss": -27.2401065826416, "global_step": 431084, "epoch": 5193} {"train_loss": -26.99884033203125, "global_step": 431085, "epoch": 5193} {"train_loss": -26.802209854125977, "global_step": 431086, "epoch": 5193} {"train_loss": -27.373517990112305, "global_step": 431087, "epoch": 5193} {"train_loss": -26.93708610534668, "global_step": 431088, "epoch": 5193} {"train_loss": -26.864835739135742, "global_step": 431089, "epoch": 5193} {"train_loss": -26.572498321533203, "global_step": 431090, "epoch": 5193} {"train_loss": -26.388900756835938, "global_step": 431091, "epoch": 5193} {"train_loss": -27.022796630859375, "global_step": 431092, "epoch": 5193} {"train_loss": -26.699934005737305, "global_step": 431093, "epoch": 5193} {"train_loss": -26.708948135375977, "global_step": 431094, "epoch": 5193} {"train_loss": -26.92799186706543, "global_step": 431095, "epoch": 5193} {"train_loss": -26.326858520507812, "global_step": 431096, "epoch": 5193} {"train_loss": -26.413894653320312, "global_step": 431097, "epoch": 5193} {"train_loss": -26.894763946533203, "global_step": 431098, "epoch": 5193} {"train_loss": -26.471174240112305, "global_step": 431099, "epoch": 5193} {"train_loss": -26.72943687438965, "global_step": 431100, "epoch": 5193} {"train_loss": -26.787437324064324, "global_step": 431101, "epoch": 5193, "val_loss": 6644168.5} {"train_loss": -25.816877365112305, "global_step": 431102, "epoch": 5194} {"train_loss": -25.994592666625977, "global_step": 431103, "epoch": 5194} {"train_loss": -26.382965087890625, "global_step": 431104, "epoch": 5194} {"train_loss": -26.054428100585938, "global_step": 431105, "epoch": 5194} {"train_loss": -25.532148361206055, "global_step": 431106, "epoch": 5194} {"train_loss": -26.21436882019043, "global_step": 431107, "epoch": 5194} {"train_loss": -26.435651779174805, "global_step": 431108, "epoch": 5194} {"train_loss": -25.810749053955078, "global_step": 431109, "epoch": 5194} {"train_loss": -26.649261474609375, "global_step": 431110, "epoch": 5194} {"train_loss": -26.6279239654541, "global_step": 431111, "epoch": 5194} {"train_loss": -26.19293212890625, "global_step": 431112, "epoch": 5194} {"train_loss": -26.471637725830078, "global_step": 431113, "epoch": 5194} {"train_loss": -26.68519401550293, "global_step": 431114, "epoch": 5194} {"train_loss": -26.644882202148438, "global_step": 431115, "epoch": 5194} {"train_loss": -26.638599395751953, "global_step": 431116, "epoch": 5194} {"train_loss": -26.202157974243164, "global_step": 431117, "epoch": 5194} {"train_loss": -26.61859703063965, "global_step": 431118, "epoch": 5194} {"train_loss": -26.693634033203125, "global_step": 431119, "epoch": 5194} {"train_loss": -26.382593154907227, "global_step": 431120, "epoch": 5194} {"train_loss": -26.608739852905273, "global_step": 431121, "epoch": 5194} {"train_loss": -27.167835235595703, "global_step": 431122, "epoch": 5194} {"train_loss": -26.971668243408203, "global_step": 431123, "epoch": 5194} {"train_loss": -26.9490966796875, "global_step": 431124, "epoch": 5194} {"train_loss": -26.691205978393555, "global_step": 431125, "epoch": 5194} {"train_loss": -27.01934242248535, "global_step": 431126, "epoch": 5194} {"train_loss": -27.13862419128418, "global_step": 431127, "epoch": 5194} {"train_loss": -26.928125381469727, "global_step": 431128, "epoch": 5194} {"train_loss": -26.545642852783203, "global_step": 431129, "epoch": 5194} {"train_loss": -26.51169776916504, "global_step": 431130, "epoch": 5194} {"train_loss": -26.56113052368164, "global_step": 431131, "epoch": 5194} {"train_loss": -27.0322265625, "global_step": 431132, "epoch": 5194} {"train_loss": -27.026351928710938, "global_step": 431133, "epoch": 5194} {"train_loss": -26.702890396118164, "global_step": 431134, "epoch": 5194} {"train_loss": -26.824106216430664, "global_step": 431135, "epoch": 5194} {"train_loss": -26.932693481445312, "global_step": 431136, "epoch": 5194} {"train_loss": -26.882543563842773, "global_step": 431137, "epoch": 5194} {"train_loss": -27.270193099975586, "global_step": 431138, "epoch": 5194} {"train_loss": -26.952957153320312, "global_step": 431139, "epoch": 5194} {"train_loss": -27.121145248413086, "global_step": 431140, "epoch": 5194} {"train_loss": -26.944238662719727, "global_step": 431141, "epoch": 5194} {"train_loss": -27.23346519470215, "global_step": 431142, "epoch": 5194} {"train_loss": -27.310718536376953, "global_step": 431143, "epoch": 5194} {"train_loss": -26.89103126525879, "global_step": 431144, "epoch": 5194} {"train_loss": -27.018787384033203, "global_step": 431145, "epoch": 5194} {"train_loss": -27.2665958404541, "global_step": 431146, "epoch": 5194} {"train_loss": -26.639829635620117, "global_step": 431147, "epoch": 5194} {"train_loss": -27.168903350830078, "global_step": 431148, "epoch": 5194} {"train_loss": -27.208410263061523, "global_step": 431149, "epoch": 5194} {"train_loss": -26.5434513092041, "global_step": 431150, "epoch": 5194} {"train_loss": -26.98721694946289, "global_step": 431151, "epoch": 5194} {"train_loss": -27.093809127807617, "global_step": 431152, "epoch": 5194} {"train_loss": -27.005279541015625, "global_step": 431153, "epoch": 5194} {"train_loss": -27.21695899963379, "global_step": 431154, "epoch": 5194} {"train_loss": -27.023639678955078, "global_step": 431155, "epoch": 5194} {"train_loss": -27.309314727783203, "global_step": 431156, "epoch": 5194} {"train_loss": -26.6520938873291, "global_step": 431157, "epoch": 5194} {"train_loss": -26.888513565063477, "global_step": 431158, "epoch": 5194} {"train_loss": -27.049488067626953, "global_step": 431159, "epoch": 5194} {"train_loss": -26.76535987854004, "global_step": 431160, "epoch": 5194} {"train_loss": -26.4351749420166, "global_step": 431161, "epoch": 5194} {"train_loss": -26.665851593017578, "global_step": 431162, "epoch": 5194} {"train_loss": -26.912790298461914, "global_step": 431163, "epoch": 5194} {"train_loss": -26.842275619506836, "global_step": 431164, "epoch": 5194} {"train_loss": -26.516904830932617, "global_step": 431165, "epoch": 5194} {"train_loss": -26.60211753845215, "global_step": 431166, "epoch": 5194} {"train_loss": -26.975366592407227, "global_step": 431167, "epoch": 5194} {"train_loss": -26.445295333862305, "global_step": 431168, "epoch": 5194} {"train_loss": -27.267017364501953, "global_step": 431169, "epoch": 5194} {"train_loss": -26.678327560424805, "global_step": 431170, "epoch": 5194} {"train_loss": -27.076459884643555, "global_step": 431171, "epoch": 5194} {"train_loss": -26.816497802734375, "global_step": 431172, "epoch": 5194} {"train_loss": -26.707962036132812, "global_step": 431173, "epoch": 5194} {"train_loss": -27.032032012939453, "global_step": 431174, "epoch": 5194} {"train_loss": -26.851953506469727, "global_step": 431175, "epoch": 5194} {"train_loss": -26.569677352905273, "global_step": 431176, "epoch": 5194} {"train_loss": -26.775516510009766, "global_step": 431177, "epoch": 5194} {"train_loss": -26.8853702545166, "global_step": 431178, "epoch": 5194} {"train_loss": -27.005878448486328, "global_step": 431179, "epoch": 5194} {"train_loss": -26.452417373657227, "global_step": 431180, "epoch": 5194} {"train_loss": -25.690561294555664, "global_step": 431181, "epoch": 5194} {"train_loss": -26.058185577392578, "global_step": 431182, "epoch": 5194} {"train_loss": -26.108322143554688, "global_step": 431183, "epoch": 5194} {"train_loss": -26.71152052821883, "global_step": 431184, "epoch": 5194, "val_loss": 6755593.0} {"train_loss": -25.08332633972168, "global_step": 431185, "epoch": 5195} {"train_loss": -24.35133934020996, "global_step": 431186, "epoch": 5195} {"train_loss": -26.17180824279785, "global_step": 431187, "epoch": 5195} {"train_loss": -24.946800231933594, "global_step": 431188, "epoch": 5195} {"train_loss": -25.873098373413086, "global_step": 431189, "epoch": 5195} {"train_loss": -25.357696533203125, "global_step": 431190, "epoch": 5195} {"train_loss": -26.042325973510742, "global_step": 431191, "epoch": 5195} {"train_loss": -25.509801864624023, "global_step": 431192, "epoch": 5195} {"train_loss": -26.004302978515625, "global_step": 431193, "epoch": 5195} {"train_loss": -25.87310218811035, "global_step": 431194, "epoch": 5195} {"train_loss": -25.928272247314453, "global_step": 431195, "epoch": 5195} {"train_loss": -26.04733657836914, "global_step": 431196, "epoch": 5195} {"train_loss": -25.862287521362305, "global_step": 431197, "epoch": 5195} {"train_loss": -26.305805206298828, "global_step": 431198, "epoch": 5195} {"train_loss": -26.20199966430664, "global_step": 431199, "epoch": 5195} {"train_loss": -26.691373825073242, "global_step": 431200, "epoch": 5195} {"train_loss": -25.777572631835938, "global_step": 431201, "epoch": 5195} {"train_loss": -26.515241622924805, "global_step": 431202, "epoch": 5195} {"train_loss": -26.26173210144043, "global_step": 431203, "epoch": 5195} {"train_loss": -26.341108322143555, "global_step": 431204, "epoch": 5195} {"train_loss": -26.155649185180664, "global_step": 431205, "epoch": 5195} {"train_loss": -26.448566436767578, "global_step": 431206, "epoch": 5195} {"train_loss": -26.303497314453125, "global_step": 431207, "epoch": 5195} {"train_loss": -26.408369064331055, "global_step": 431208, "epoch": 5195} {"train_loss": -26.878812789916992, "global_step": 431209, "epoch": 5195} {"train_loss": -26.277347564697266, "global_step": 431210, "epoch": 5195} {"train_loss": -26.513757705688477, "global_step": 431211, "epoch": 5195} {"train_loss": -26.60164451599121, "global_step": 431212, "epoch": 5195} {"train_loss": -26.536569595336914, "global_step": 431213, "epoch": 5195} {"train_loss": -26.545520782470703, "global_step": 431214, "epoch": 5195} {"train_loss": -26.456806182861328, "global_step": 431215, "epoch": 5195} {"train_loss": -26.772993087768555, "global_step": 431216, "epoch": 5195} {"train_loss": -26.50174331665039, "global_step": 431217, "epoch": 5195} {"train_loss": -26.675540924072266, "global_step": 431218, "epoch": 5195} {"train_loss": -26.45403480529785, "global_step": 431219, "epoch": 5195} {"train_loss": -26.834716796875, "global_step": 431220, "epoch": 5195} {"train_loss": -26.64967155456543, "global_step": 431221, "epoch": 5195} {"train_loss": -26.77532386779785, "global_step": 431222, "epoch": 5195} {"train_loss": -26.852344512939453, "global_step": 431223, "epoch": 5195} {"train_loss": -26.605314254760742, "global_step": 431224, "epoch": 5195} {"train_loss": -26.68696403503418, "global_step": 431225, "epoch": 5195} {"train_loss": -27.00885581970215, "global_step": 431226, "epoch": 5195} {"train_loss": -26.68633460998535, "global_step": 431227, "epoch": 5195} {"train_loss": -26.68397331237793, "global_step": 431228, "epoch": 5195} {"train_loss": -26.798583984375, "global_step": 431229, "epoch": 5195} {"train_loss": -27.033191680908203, "global_step": 431230, "epoch": 5195} {"train_loss": -26.8680477142334, "global_step": 431231, "epoch": 5195} {"train_loss": -26.93305015563965, "global_step": 431232, "epoch": 5195} {"train_loss": -26.930622100830078, "global_step": 431233, "epoch": 5195} {"train_loss": -26.810882568359375, "global_step": 431234, "epoch": 5195} {"train_loss": -26.8095645904541, "global_step": 431235, "epoch": 5195} {"train_loss": -26.926300048828125, "global_step": 431236, "epoch": 5195} {"train_loss": -26.997695922851562, "global_step": 431237, "epoch": 5195} {"train_loss": -26.695112228393555, "global_step": 431238, "epoch": 5195} {"train_loss": -26.383676528930664, "global_step": 431239, "epoch": 5195} {"train_loss": -26.38990592956543, "global_step": 431240, "epoch": 5195} {"train_loss": -26.838354110717773, "global_step": 431241, "epoch": 5195} {"train_loss": -26.55482292175293, "global_step": 431242, "epoch": 5195} {"train_loss": -26.94917106628418, "global_step": 431243, "epoch": 5195} {"train_loss": -26.688995361328125, "global_step": 431244, "epoch": 5195} {"train_loss": -26.95879554748535, "global_step": 431245, "epoch": 5195} {"train_loss": -26.650440216064453, "global_step": 431246, "epoch": 5195} {"train_loss": -26.63111686706543, "global_step": 431247, "epoch": 5195} {"train_loss": -27.278974533081055, "global_step": 431248, "epoch": 5195} {"train_loss": -26.988330841064453, "global_step": 431249, "epoch": 5195} {"train_loss": -27.148340225219727, "global_step": 431250, "epoch": 5195} {"train_loss": -27.005233764648438, "global_step": 431251, "epoch": 5195} {"train_loss": -27.15680503845215, "global_step": 431252, "epoch": 5195} {"train_loss": -27.111358642578125, "global_step": 431253, "epoch": 5195} {"train_loss": -27.0841007232666, "global_step": 431254, "epoch": 5195} {"train_loss": -27.0434627532959, "global_step": 431255, "epoch": 5195} {"train_loss": -26.807119369506836, "global_step": 431256, "epoch": 5195} {"train_loss": -27.144094467163086, "global_step": 431257, "epoch": 5195} {"train_loss": -26.64301109313965, "global_step": 431258, "epoch": 5195} {"train_loss": -26.878076553344727, "global_step": 431259, "epoch": 5195} {"train_loss": -27.059192657470703, "global_step": 431260, "epoch": 5195} {"train_loss": -27.043380737304688, "global_step": 431261, "epoch": 5195} {"train_loss": -26.86042594909668, "global_step": 431262, "epoch": 5195} {"train_loss": -27.143152236938477, "global_step": 431263, "epoch": 5195} {"train_loss": -27.365528106689453, "global_step": 431264, "epoch": 5195} {"train_loss": -27.029016494750977, "global_step": 431265, "epoch": 5195} {"train_loss": -26.858448028564453, "global_step": 431266, "epoch": 5195} {"train_loss": -26.555404318384376, "global_step": 431267, "epoch": 5195, "val_loss": 6832632.0} {"train_loss": -24.783098220825195, "global_step": 431268, "epoch": 5196} {"train_loss": -24.68329429626465, "global_step": 431269, "epoch": 5196} {"train_loss": -25.105276107788086, "global_step": 431270, "epoch": 5196} {"train_loss": -25.515506744384766, "global_step": 431271, "epoch": 5196} {"train_loss": -25.416229248046875, "global_step": 431272, "epoch": 5196} {"train_loss": -24.532089233398438, "global_step": 431273, "epoch": 5196} {"train_loss": -25.9296875, "global_step": 431274, "epoch": 5196} {"train_loss": -25.678861618041992, "global_step": 431275, "epoch": 5196} {"train_loss": -25.77707290649414, "global_step": 431276, "epoch": 5196} {"train_loss": -25.9664249420166, "global_step": 431277, "epoch": 5196} {"train_loss": -25.49114990234375, "global_step": 431278, "epoch": 5196} {"train_loss": -25.72699546813965, "global_step": 431279, "epoch": 5196} {"train_loss": -26.28618812561035, "global_step": 431280, "epoch": 5196} {"train_loss": -25.94024085998535, "global_step": 431281, "epoch": 5196} {"train_loss": -26.292871475219727, "global_step": 431282, "epoch": 5196} {"train_loss": -26.1152400970459, "global_step": 431283, "epoch": 5196} {"train_loss": -26.34490394592285, "global_step": 431284, "epoch": 5196} {"train_loss": -26.312681198120117, "global_step": 431285, "epoch": 5196} {"train_loss": -25.907867431640625, "global_step": 431286, "epoch": 5196} {"train_loss": -26.362869262695312, "global_step": 431287, "epoch": 5196} {"train_loss": -26.396881103515625, "global_step": 431288, "epoch": 5196} {"train_loss": -26.298608779907227, "global_step": 431289, "epoch": 5196} {"train_loss": -26.320959091186523, "global_step": 431290, "epoch": 5196} {"train_loss": -26.494861602783203, "global_step": 431291, "epoch": 5196} {"train_loss": -25.9119930267334, "global_step": 431292, "epoch": 5196} {"train_loss": -26.405170440673828, "global_step": 431293, "epoch": 5196} {"train_loss": -26.400793075561523, "global_step": 431294, "epoch": 5196} {"train_loss": -26.780996322631836, "global_step": 431295, "epoch": 5196} {"train_loss": -26.4107723236084, "global_step": 431296, "epoch": 5196} {"train_loss": -26.586654663085938, "global_step": 431297, "epoch": 5196} {"train_loss": -26.486923217773438, "global_step": 431298, "epoch": 5196} {"train_loss": -26.74281120300293, "global_step": 431299, "epoch": 5196} {"train_loss": -26.967819213867188, "global_step": 431300, "epoch": 5196} {"train_loss": -26.74856948852539, "global_step": 431301, "epoch": 5196} {"train_loss": -26.53794288635254, "global_step": 431302, "epoch": 5196} {"train_loss": -26.538618087768555, "global_step": 431303, "epoch": 5196} {"train_loss": -26.667072296142578, "global_step": 431304, "epoch": 5196} {"train_loss": -26.4118595123291, "global_step": 431305, "epoch": 5196} {"train_loss": -26.5189151763916, "global_step": 431306, "epoch": 5196} {"train_loss": -26.643756866455078, "global_step": 431307, "epoch": 5196} {"train_loss": -26.817304611206055, "global_step": 431308, "epoch": 5196} {"train_loss": -26.76234245300293, "global_step": 431309, "epoch": 5196} {"train_loss": -26.757055282592773, "global_step": 431310, "epoch": 5196} {"train_loss": -27.029199600219727, "global_step": 431311, "epoch": 5196} {"train_loss": -26.964521408081055, "global_step": 431312, "epoch": 5196} {"train_loss": -26.898767471313477, "global_step": 431313, "epoch": 5196} {"train_loss": -27.064468383789062, "global_step": 431314, "epoch": 5196} {"train_loss": -27.07208824157715, "global_step": 431315, "epoch": 5196} {"train_loss": -26.927078247070312, "global_step": 431316, "epoch": 5196} {"train_loss": -27.048694610595703, "global_step": 431317, "epoch": 5196} {"train_loss": -27.041166305541992, "global_step": 431318, "epoch": 5196} {"train_loss": -26.748722076416016, "global_step": 431319, "epoch": 5196} {"train_loss": -27.344518661499023, "global_step": 431320, "epoch": 5196} {"train_loss": -26.863698959350586, "global_step": 431321, "epoch": 5196} {"train_loss": -26.704635620117188, "global_step": 431322, "epoch": 5196} {"train_loss": -27.290164947509766, "global_step": 431323, "epoch": 5196} {"train_loss": -27.042627334594727, "global_step": 431324, "epoch": 5196} {"train_loss": -26.63321876525879, "global_step": 431325, "epoch": 5196} {"train_loss": -27.13104248046875, "global_step": 431326, "epoch": 5196} {"train_loss": -26.95759391784668, "global_step": 431327, "epoch": 5196} {"train_loss": -26.972904205322266, "global_step": 431328, "epoch": 5196} {"train_loss": -26.872394561767578, "global_step": 431329, "epoch": 5196} {"train_loss": -26.770156860351562, "global_step": 431330, "epoch": 5196} {"train_loss": -27.2556095123291, "global_step": 431331, "epoch": 5196} {"train_loss": -26.689138412475586, "global_step": 431332, "epoch": 5196} {"train_loss": -26.715320587158203, "global_step": 431333, "epoch": 5196} {"train_loss": -26.9948673248291, "global_step": 431334, "epoch": 5196} {"train_loss": -26.67997169494629, "global_step": 431335, "epoch": 5196} {"train_loss": -26.56501579284668, "global_step": 431336, "epoch": 5196} {"train_loss": -26.87360954284668, "global_step": 431337, "epoch": 5196} {"train_loss": -26.89277458190918, "global_step": 431338, "epoch": 5196} {"train_loss": -26.885404586791992, "global_step": 431339, "epoch": 5196} {"train_loss": -27.164905548095703, "global_step": 431340, "epoch": 5196} {"train_loss": -26.972692489624023, "global_step": 431341, "epoch": 5196} {"train_loss": -27.058364868164062, "global_step": 431342, "epoch": 5196} {"train_loss": -27.17508888244629, "global_step": 431343, "epoch": 5196} {"train_loss": -27.189966201782227, "global_step": 431344, "epoch": 5196} {"train_loss": -27.147680282592773, "global_step": 431345, "epoch": 5196} {"train_loss": -27.19106101989746, "global_step": 431346, "epoch": 5196} {"train_loss": -27.040409088134766, "global_step": 431347, "epoch": 5196} {"train_loss": -27.082752227783203, "global_step": 431348, "epoch": 5196} {"train_loss": -27.052997589111328, "global_step": 431349, "epoch": 5196} {"train_loss": -26.54313689542104, "global_step": 431350, "epoch": 5196, "val_loss": 6813553.0} {"train_loss": -26.449182510375977, "global_step": 431351, "epoch": 5197} {"train_loss": -25.682065963745117, "global_step": 431352, "epoch": 5197} {"train_loss": -25.83049964904785, "global_step": 431353, "epoch": 5197} {"train_loss": -26.17268180847168, "global_step": 431354, "epoch": 5197} {"train_loss": -26.421131134033203, "global_step": 431355, "epoch": 5197} {"train_loss": -26.18473243713379, "global_step": 431356, "epoch": 5197} {"train_loss": -26.884611129760742, "global_step": 431357, "epoch": 5197} {"train_loss": -26.648151397705078, "global_step": 431358, "epoch": 5197} {"train_loss": -26.828479766845703, "global_step": 431359, "epoch": 5197} {"train_loss": -26.73077964782715, "global_step": 431360, "epoch": 5197} {"train_loss": -27.137853622436523, "global_step": 431361, "epoch": 5197} {"train_loss": -26.822690963745117, "global_step": 431362, "epoch": 5197} {"train_loss": -26.762958526611328, "global_step": 431363, "epoch": 5197} {"train_loss": -26.686542510986328, "global_step": 431364, "epoch": 5197} {"train_loss": -26.688873291015625, "global_step": 431365, "epoch": 5197} {"train_loss": -27.10453224182129, "global_step": 431366, "epoch": 5197} {"train_loss": -26.53717613220215, "global_step": 431367, "epoch": 5197} {"train_loss": -27.2469425201416, "global_step": 431368, "epoch": 5197} {"train_loss": -26.739831924438477, "global_step": 431369, "epoch": 5197} {"train_loss": -27.0198974609375, "global_step": 431370, "epoch": 5197} {"train_loss": -27.312179565429688, "global_step": 431371, "epoch": 5197} {"train_loss": -27.037155151367188, "global_step": 431372, "epoch": 5197} {"train_loss": -26.93233299255371, "global_step": 431373, "epoch": 5197} {"train_loss": -27.19862174987793, "global_step": 431374, "epoch": 5197} {"train_loss": -26.9438419342041, "global_step": 431375, "epoch": 5197} {"train_loss": -27.00519371032715, "global_step": 431376, "epoch": 5197} {"train_loss": -27.046405792236328, "global_step": 431377, "epoch": 5197} {"train_loss": -27.017309188842773, "global_step": 431378, "epoch": 5197} {"train_loss": -26.98634910583496, "global_step": 431379, "epoch": 5197} {"train_loss": -27.325658798217773, "global_step": 431380, "epoch": 5197} {"train_loss": -27.37992286682129, "global_step": 431381, "epoch": 5197} {"train_loss": -26.964685440063477, "global_step": 431382, "epoch": 5197} {"train_loss": -27.30909538269043, "global_step": 431383, "epoch": 5197} {"train_loss": -27.313085556030273, "global_step": 431384, "epoch": 5197} {"train_loss": -26.962682723999023, "global_step": 431385, "epoch": 5197} {"train_loss": -27.304777145385742, "global_step": 431386, "epoch": 5197} {"train_loss": -27.26312828063965, "global_step": 431387, "epoch": 5197} {"train_loss": -27.112028121948242, "global_step": 431388, "epoch": 5197} {"train_loss": -27.018756866455078, "global_step": 431389, "epoch": 5197} {"train_loss": -26.853958129882812, "global_step": 431390, "epoch": 5197} {"train_loss": -27.223413467407227, "global_step": 431391, "epoch": 5197} {"train_loss": -27.010040283203125, "global_step": 431392, "epoch": 5197} {"train_loss": -27.05718994140625, "global_step": 431393, "epoch": 5197} {"train_loss": -27.327472686767578, "global_step": 431394, "epoch": 5197} {"train_loss": -27.29939079284668, "global_step": 431395, "epoch": 5197} {"train_loss": -27.0587158203125, "global_step": 431396, "epoch": 5197} {"train_loss": -27.090070724487305, "global_step": 431397, "epoch": 5197} {"train_loss": -27.03657341003418, "global_step": 431398, "epoch": 5197} {"train_loss": -27.259796142578125, "global_step": 431399, "epoch": 5197} {"train_loss": -27.30049705505371, "global_step": 431400, "epoch": 5197} {"train_loss": -27.054235458374023, "global_step": 431401, "epoch": 5197} {"train_loss": -27.175729751586914, "global_step": 431402, "epoch": 5197} {"train_loss": -27.111249923706055, "global_step": 431403, "epoch": 5197} {"train_loss": -26.746490478515625, "global_step": 431404, "epoch": 5197} {"train_loss": -26.730016708374023, "global_step": 431405, "epoch": 5197} {"train_loss": -26.675039291381836, "global_step": 431406, "epoch": 5197} {"train_loss": -26.995874404907227, "global_step": 431407, "epoch": 5197} {"train_loss": -27.163564682006836, "global_step": 431408, "epoch": 5197} {"train_loss": -26.68060874938965, "global_step": 431409, "epoch": 5197} {"train_loss": -26.755029678344727, "global_step": 431410, "epoch": 5197} {"train_loss": -26.523839950561523, "global_step": 431411, "epoch": 5197} {"train_loss": -26.553028106689453, "global_step": 431412, "epoch": 5197} {"train_loss": -27.4398250579834, "global_step": 431413, "epoch": 5197} {"train_loss": -26.947790145874023, "global_step": 431414, "epoch": 5197} {"train_loss": -26.66943359375, "global_step": 431415, "epoch": 5197} {"train_loss": -26.390417098999023, "global_step": 431416, "epoch": 5197} {"train_loss": -26.55878257751465, "global_step": 431417, "epoch": 5197} {"train_loss": -26.21111488342285, "global_step": 431418, "epoch": 5197} {"train_loss": -25.704303741455078, "global_step": 431419, "epoch": 5197} {"train_loss": -26.604663848876953, "global_step": 431420, "epoch": 5197} {"train_loss": -26.49460220336914, "global_step": 431421, "epoch": 5197} {"train_loss": -26.235504150390625, "global_step": 431422, "epoch": 5197} {"train_loss": -25.854944229125977, "global_step": 431423, "epoch": 5197} {"train_loss": -26.554357528686523, "global_step": 431424, "epoch": 5197} {"train_loss": -25.89066505432129, "global_step": 431425, "epoch": 5197} {"train_loss": -26.096105575561523, "global_step": 431426, "epoch": 5197} {"train_loss": -26.4508056640625, "global_step": 431427, "epoch": 5197} {"train_loss": -26.20351219177246, "global_step": 431428, "epoch": 5197} {"train_loss": -26.412139892578125, "global_step": 431429, "epoch": 5197} {"train_loss": -26.300052642822266, "global_step": 431430, "epoch": 5197} {"train_loss": -26.55906105041504, "global_step": 431431, "epoch": 5197} {"train_loss": -26.4683837890625, "global_step": 431432, "epoch": 5197} {"train_loss": -26.762904040784722, "global_step": 431433, "epoch": 5197, "val_loss": 6731867.0} {"train_loss": -26.359968185424805, "global_step": 431434, "epoch": 5198} {"train_loss": -25.76717185974121, "global_step": 431435, "epoch": 5198} {"train_loss": -26.239307403564453, "global_step": 431436, "epoch": 5198} {"train_loss": -25.637739181518555, "global_step": 431437, "epoch": 5198} {"train_loss": -26.27328872680664, "global_step": 431438, "epoch": 5198} {"train_loss": -25.99225425720215, "global_step": 431439, "epoch": 5198} {"train_loss": -26.4271240234375, "global_step": 431440, "epoch": 5198} {"train_loss": -26.008853912353516, "global_step": 431441, "epoch": 5198} {"train_loss": -26.211469650268555, "global_step": 431442, "epoch": 5198} {"train_loss": -26.101041793823242, "global_step": 431443, "epoch": 5198} {"train_loss": -26.717391967773438, "global_step": 431444, "epoch": 5198} {"train_loss": -26.45277214050293, "global_step": 431445, "epoch": 5198} {"train_loss": -26.418079376220703, "global_step": 431446, "epoch": 5198} {"train_loss": -26.48602294921875, "global_step": 431447, "epoch": 5198} {"train_loss": -26.331256866455078, "global_step": 431448, "epoch": 5198} {"train_loss": -26.470632553100586, "global_step": 431449, "epoch": 5198} {"train_loss": -26.624258041381836, "global_step": 431450, "epoch": 5198} {"train_loss": -26.639856338500977, "global_step": 431451, "epoch": 5198} {"train_loss": -26.511449813842773, "global_step": 431452, "epoch": 5198} {"train_loss": -26.747455596923828, "global_step": 431453, "epoch": 5198} {"train_loss": -26.838586807250977, "global_step": 431454, "epoch": 5198} {"train_loss": -26.44551658630371, "global_step": 431455, "epoch": 5198} {"train_loss": -26.97751235961914, "global_step": 431456, "epoch": 5198} {"train_loss": -26.609689712524414, "global_step": 431457, "epoch": 5198} {"train_loss": -26.4292049407959, "global_step": 431458, "epoch": 5198} {"train_loss": -26.667743682861328, "global_step": 431459, "epoch": 5198} {"train_loss": -26.813383102416992, "global_step": 431460, "epoch": 5198} {"train_loss": -26.41143226623535, "global_step": 431461, "epoch": 5198} {"train_loss": -26.711502075195312, "global_step": 431462, "epoch": 5198} {"train_loss": -27.0931396484375, "global_step": 431463, "epoch": 5198} {"train_loss": -26.67799949645996, "global_step": 431464, "epoch": 5198} {"train_loss": -26.77741050720215, "global_step": 431465, "epoch": 5198} {"train_loss": -26.954984664916992, "global_step": 431466, "epoch": 5198} {"train_loss": -26.98487663269043, "global_step": 431467, "epoch": 5198} {"train_loss": -26.76862144470215, "global_step": 431468, "epoch": 5198} {"train_loss": -26.834272384643555, "global_step": 431469, "epoch": 5198} {"train_loss": -26.920507431030273, "global_step": 431470, "epoch": 5198} {"train_loss": -26.800092697143555, "global_step": 431471, "epoch": 5198} {"train_loss": -26.8693790435791, "global_step": 431472, "epoch": 5198} {"train_loss": -27.01141929626465, "global_step": 431473, "epoch": 5198} {"train_loss": -26.8889102935791, "global_step": 431474, "epoch": 5198} {"train_loss": -27.282867431640625, "global_step": 431475, "epoch": 5198} {"train_loss": -27.006549835205078, "global_step": 431476, "epoch": 5198} {"train_loss": -27.170578002929688, "global_step": 431477, "epoch": 5198} {"train_loss": -26.801761627197266, "global_step": 431478, "epoch": 5198} {"train_loss": -26.890783309936523, "global_step": 431479, "epoch": 5198} {"train_loss": -26.914098739624023, "global_step": 431480, "epoch": 5198} {"train_loss": -27.076740264892578, "global_step": 431481, "epoch": 5198} {"train_loss": -27.249805450439453, "global_step": 431482, "epoch": 5198} {"train_loss": -26.763578414916992, "global_step": 431483, "epoch": 5198} {"train_loss": -26.824975967407227, "global_step": 431484, "epoch": 5198} {"train_loss": -26.77765464782715, "global_step": 431485, "epoch": 5198} {"train_loss": -27.334989547729492, "global_step": 431486, "epoch": 5198} {"train_loss": -26.6717529296875, "global_step": 431487, "epoch": 5198} {"train_loss": -26.8599853515625, "global_step": 431488, "epoch": 5198} {"train_loss": -26.85565185546875, "global_step": 431489, "epoch": 5198} {"train_loss": -26.907358169555664, "global_step": 431490, "epoch": 5198} {"train_loss": -26.998462677001953, "global_step": 431491, "epoch": 5198} {"train_loss": -27.10141372680664, "global_step": 431492, "epoch": 5198} {"train_loss": -27.0723934173584, "global_step": 431493, "epoch": 5198} {"train_loss": -26.86866569519043, "global_step": 431494, "epoch": 5198} {"train_loss": -26.84408950805664, "global_step": 431495, "epoch": 5198} {"train_loss": -27.203983306884766, "global_step": 431496, "epoch": 5198} {"train_loss": -27.068378448486328, "global_step": 431497, "epoch": 5198} {"train_loss": -26.723474502563477, "global_step": 431498, "epoch": 5198} {"train_loss": -27.225433349609375, "global_step": 431499, "epoch": 5198} {"train_loss": -26.916967391967773, "global_step": 431500, "epoch": 5198} {"train_loss": -26.45284080505371, "global_step": 431501, "epoch": 5198} {"train_loss": -26.449676513671875, "global_step": 431502, "epoch": 5198} {"train_loss": -26.6461181640625, "global_step": 431503, "epoch": 5198} {"train_loss": -27.013959884643555, "global_step": 431504, "epoch": 5198} {"train_loss": -26.7379150390625, "global_step": 431505, "epoch": 5198} {"train_loss": -26.713220596313477, "global_step": 431506, "epoch": 5198} {"train_loss": -26.65962028503418, "global_step": 431507, "epoch": 5198} {"train_loss": -26.9388484954834, "global_step": 431508, "epoch": 5198} {"train_loss": -26.513916015625, "global_step": 431509, "epoch": 5198} {"train_loss": -26.870563507080078, "global_step": 431510, "epoch": 5198} {"train_loss": -27.110830307006836, "global_step": 431511, "epoch": 5198} {"train_loss": -26.9366455078125, "global_step": 431512, "epoch": 5198} {"train_loss": -26.81591796875, "global_step": 431513, "epoch": 5198} {"train_loss": -26.934423446655273, "global_step": 431514, "epoch": 5198} {"train_loss": -26.8369197845459, "global_step": 431515, "epoch": 5198} {"train_loss": -26.713789560708655, "global_step": 431516, "epoch": 5198, "val_loss": 6793244.0} {"train_loss": -26.284439086914062, "global_step": 431517, "epoch": 5199} {"train_loss": -25.887603759765625, "global_step": 431518, "epoch": 5199} {"train_loss": -25.320798873901367, "global_step": 431519, "epoch": 5199} {"train_loss": -25.83172607421875, "global_step": 431520, "epoch": 5199} {"train_loss": -25.256778717041016, "global_step": 431521, "epoch": 5199} {"train_loss": -26.371870040893555, "global_step": 431522, "epoch": 5199} {"train_loss": -25.29117774963379, "global_step": 431523, "epoch": 5199} {"train_loss": -25.777973175048828, "global_step": 431524, "epoch": 5199} {"train_loss": -25.99928092956543, "global_step": 431525, "epoch": 5199} {"train_loss": -26.648595809936523, "global_step": 431526, "epoch": 5199} {"train_loss": -26.2547607421875, "global_step": 431527, "epoch": 5199} {"train_loss": -26.2623291015625, "global_step": 431528, "epoch": 5199} {"train_loss": -26.11233901977539, "global_step": 431529, "epoch": 5199} {"train_loss": -26.72633934020996, "global_step": 431530, "epoch": 5199} {"train_loss": -26.400854110717773, "global_step": 431531, "epoch": 5199} {"train_loss": -26.61634635925293, "global_step": 431532, "epoch": 5199} {"train_loss": -26.040637969970703, "global_step": 431533, "epoch": 5199} {"train_loss": -26.9259033203125, "global_step": 431534, "epoch": 5199} {"train_loss": -26.418737411499023, "global_step": 431535, "epoch": 5199} {"train_loss": -26.611242294311523, "global_step": 431536, "epoch": 5199} {"train_loss": -26.56495475769043, "global_step": 431537, "epoch": 5199} {"train_loss": -26.75226402282715, "global_step": 431538, "epoch": 5199} {"train_loss": -26.080846786499023, "global_step": 431539, "epoch": 5199} {"train_loss": -26.793249130249023, "global_step": 431540, "epoch": 5199} {"train_loss": -26.058380126953125, "global_step": 431541, "epoch": 5199} {"train_loss": -26.622034072875977, "global_step": 431542, "epoch": 5199} {"train_loss": -26.689329147338867, "global_step": 431543, "epoch": 5199} {"train_loss": -26.72327995300293, "global_step": 431544, "epoch": 5199} {"train_loss": -26.866262435913086, "global_step": 431545, "epoch": 5199} {"train_loss": -26.66377830505371, "global_step": 431546, "epoch": 5199} {"train_loss": -26.53883171081543, "global_step": 431547, "epoch": 5199} {"train_loss": -26.899778366088867, "global_step": 431548, "epoch": 5199} {"train_loss": -26.705841064453125, "global_step": 431549, "epoch": 5199} {"train_loss": -26.84577751159668, "global_step": 431550, "epoch": 5199} {"train_loss": -26.468585968017578, "global_step": 431551, "epoch": 5199} {"train_loss": -26.92755126953125, "global_step": 431552, "epoch": 5199} {"train_loss": -26.9491024017334, "global_step": 431553, "epoch": 5199} {"train_loss": -26.75250244140625, "global_step": 431554, "epoch": 5199} {"train_loss": -27.034887313842773, "global_step": 431555, "epoch": 5199} {"train_loss": -27.003416061401367, "global_step": 431556, "epoch": 5199} {"train_loss": -26.927453994750977, "global_step": 431557, "epoch": 5199} {"train_loss": -26.635700225830078, "global_step": 431558, "epoch": 5199} {"train_loss": -27.089426040649414, "global_step": 431559, "epoch": 5199} {"train_loss": -27.042266845703125, "global_step": 431560, "epoch": 5199} {"train_loss": -27.223241806030273, "global_step": 431561, "epoch": 5199} {"train_loss": -26.529993057250977, "global_step": 431562, "epoch": 5199} {"train_loss": -26.4403076171875, "global_step": 431563, "epoch": 5199} {"train_loss": -26.908161163330078, "global_step": 431564, "epoch": 5199} {"train_loss": -26.987409591674805, "global_step": 431565, "epoch": 5199} {"train_loss": -27.14582633972168, "global_step": 431566, "epoch": 5199} {"train_loss": -27.18525505065918, "global_step": 431567, "epoch": 5199} {"train_loss": -26.840402603149414, "global_step": 431568, "epoch": 5199} {"train_loss": -26.9278564453125, "global_step": 431569, "epoch": 5199} {"train_loss": -27.10481071472168, "global_step": 431570, "epoch": 5199} {"train_loss": -26.924192428588867, "global_step": 431571, "epoch": 5199} {"train_loss": -27.16876220703125, "global_step": 431572, "epoch": 5199} {"train_loss": -26.817129135131836, "global_step": 431573, "epoch": 5199} {"train_loss": -26.876440048217773, "global_step": 431574, "epoch": 5199} {"train_loss": -27.10755729675293, "global_step": 431575, "epoch": 5199} {"train_loss": -26.78805923461914, "global_step": 431576, "epoch": 5199} {"train_loss": -27.186532974243164, "global_step": 431577, "epoch": 5199} {"train_loss": -26.973648071289062, "global_step": 431578, "epoch": 5199} {"train_loss": -27.112714767456055, "global_step": 431579, "epoch": 5199} {"train_loss": -27.05120849609375, "global_step": 431580, "epoch": 5199} {"train_loss": -27.183887481689453, "global_step": 431581, "epoch": 5199} {"train_loss": -27.095670700073242, "global_step": 431582, "epoch": 5199} {"train_loss": -27.109426498413086, "global_step": 431583, "epoch": 5199} {"train_loss": -26.879133224487305, "global_step": 431584, "epoch": 5199} {"train_loss": -26.590118408203125, "global_step": 431585, "epoch": 5199} {"train_loss": -26.730817794799805, "global_step": 431586, "epoch": 5199} {"train_loss": -27.266721725463867, "global_step": 431587, "epoch": 5199} {"train_loss": -27.196857452392578, "global_step": 431588, "epoch": 5199} {"train_loss": -26.383289337158203, "global_step": 431589, "epoch": 5199} {"train_loss": -26.54461669921875, "global_step": 431590, "epoch": 5199} {"train_loss": -26.46235466003418, "global_step": 431591, "epoch": 5199} {"train_loss": -26.595067977905273, "global_step": 431592, "epoch": 5199} {"train_loss": -27.014450073242188, "global_step": 431593, "epoch": 5199} {"train_loss": -27.13239860534668, "global_step": 431594, "epoch": 5199} {"train_loss": -27.15064811706543, "global_step": 431595, "epoch": 5199} {"train_loss": -27.021387100219727, "global_step": 431596, "epoch": 5199} {"train_loss": -26.707050323486328, "global_step": 431597, "epoch": 5199} {"train_loss": -26.540918350219727, "global_step": 431598, "epoch": 5199} {"train_loss": -26.6669560857566, "global_step": 431599, "epoch": 5199, "val_loss": 6920911.0} {"train_loss": -27.012617111206055, "global_step": 431600, "epoch": 5200} {"train_loss": -25.785297393798828, "global_step": 431601, "epoch": 5200} {"train_loss": -26.39153480529785, "global_step": 431602, "epoch": 5200} {"train_loss": -26.7156925201416, "global_step": 431603, "epoch": 5200} {"train_loss": -26.35157585144043, "global_step": 431604, "epoch": 5200} {"train_loss": -26.7830810546875, "global_step": 431605, "epoch": 5200} {"train_loss": -26.555410385131836, "global_step": 431606, "epoch": 5200} {"train_loss": -26.542316436767578, "global_step": 431607, "epoch": 5200} {"train_loss": -26.570398330688477, "global_step": 431608, "epoch": 5200} {"train_loss": -26.3708553314209, "global_step": 431609, "epoch": 5200} {"train_loss": -26.757959365844727, "global_step": 431610, "epoch": 5200} {"train_loss": -26.188940048217773, "global_step": 431611, "epoch": 5200} {"train_loss": -26.68121337890625, "global_step": 431612, "epoch": 5200} {"train_loss": -26.399688720703125, "global_step": 431613, "epoch": 5200} {"train_loss": -26.83389663696289, "global_step": 431614, "epoch": 5200} {"train_loss": -26.79164695739746, "global_step": 431615, "epoch": 5200} {"train_loss": -26.678518295288086, "global_step": 431616, "epoch": 5200} {"train_loss": -26.32911491394043, "global_step": 431617, "epoch": 5200} {"train_loss": -26.788227081298828, "global_step": 431618, "epoch": 5200} {"train_loss": -26.422164916992188, "global_step": 431619, "epoch": 5200} {"train_loss": -26.897306442260742, "global_step": 431620, "epoch": 5200} {"train_loss": -26.592260360717773, "global_step": 431621, "epoch": 5200} {"train_loss": -27.126373291015625, "global_step": 431622, "epoch": 5200} {"train_loss": -26.6107177734375, "global_step": 431623, "epoch": 5200} {"train_loss": -26.9451847076416, "global_step": 431624, "epoch": 5200} {"train_loss": -26.899438858032227, "global_step": 431625, "epoch": 5200} {"train_loss": -26.890426635742188, "global_step": 431626, "epoch": 5200} {"train_loss": -26.549890518188477, "global_step": 431627, "epoch": 5200} {"train_loss": -26.9410343170166, "global_step": 431628, "epoch": 5200} {"train_loss": -27.08447265625, "global_step": 431629, "epoch": 5200} {"train_loss": -26.382232666015625, "global_step": 431630, "epoch": 5200} {"train_loss": -26.769948959350586, "global_step": 431631, "epoch": 5200} {"train_loss": -26.683156967163086, "global_step": 431632, "epoch": 5200} {"train_loss": -26.990854263305664, "global_step": 431633, "epoch": 5200} {"train_loss": -27.17377281188965, "global_step": 431634, "epoch": 5200} {"train_loss": -27.130720138549805, "global_step": 431635, "epoch": 5200} {"train_loss": -27.288772583007812, "global_step": 431636, "epoch": 5200} {"train_loss": -27.0615177154541, "global_step": 431637, "epoch": 5200} {"train_loss": -27.344507217407227, "global_step": 431638, "epoch": 5200} {"train_loss": -27.036212921142578, "global_step": 431639, "epoch": 5200} {"train_loss": -26.944162368774414, "global_step": 431640, "epoch": 5200} {"train_loss": -27.153278350830078, "global_step": 431641, "epoch": 5200} {"train_loss": -26.9113712310791, "global_step": 431642, "epoch": 5200} {"train_loss": -27.34303092956543, "global_step": 431643, "epoch": 5200} {"train_loss": -26.867956161499023, "global_step": 431644, "epoch": 5200} {"train_loss": -26.928022384643555, "global_step": 431645, "epoch": 5200} {"train_loss": -26.5750732421875, "global_step": 431646, "epoch": 5200} {"train_loss": -27.238279342651367, "global_step": 431647, "epoch": 5200} {"train_loss": -27.064563751220703, "global_step": 431648, "epoch": 5200} {"train_loss": -26.96929931640625, "global_step": 431649, "epoch": 5200} {"train_loss": -26.548730850219727, "global_step": 431650, "epoch": 5200} {"train_loss": -27.116989135742188, "global_step": 431651, "epoch": 5200} {"train_loss": -26.82745933532715, "global_step": 431652, "epoch": 5200} {"train_loss": -26.97015380859375, "global_step": 431653, "epoch": 5200} {"train_loss": -27.20599365234375, "global_step": 431654, "epoch": 5200} {"train_loss": -27.058679580688477, "global_step": 431655, "epoch": 5200} {"train_loss": -26.47470474243164, "global_step": 431656, "epoch": 5200} {"train_loss": -26.918960571289062, "global_step": 431657, "epoch": 5200} {"train_loss": -26.804203033447266, "global_step": 431658, "epoch": 5200} {"train_loss": -26.387861251831055, "global_step": 431659, "epoch": 5200} {"train_loss": -26.570951461791992, "global_step": 431660, "epoch": 5200} {"train_loss": -26.54981803894043, "global_step": 431661, "epoch": 5200} {"train_loss": -27.034528732299805, "global_step": 431662, "epoch": 5200} {"train_loss": -26.780637741088867, "global_step": 431663, "epoch": 5200} {"train_loss": -26.706403732299805, "global_step": 431664, "epoch": 5200} {"train_loss": -26.495330810546875, "global_step": 431665, "epoch": 5200} {"train_loss": -26.77274513244629, "global_step": 431666, "epoch": 5200} {"train_loss": -27.036548614501953, "global_step": 431667, "epoch": 5200} {"train_loss": -26.82661247253418, "global_step": 431668, "epoch": 5200} {"train_loss": -26.56431007385254, "global_step": 431669, "epoch": 5200} {"train_loss": -26.389219284057617, "global_step": 431670, "epoch": 5200} {"train_loss": -26.69552993774414, "global_step": 431671, "epoch": 5200} {"train_loss": -26.84014320373535, "global_step": 431672, "epoch": 5200} {"train_loss": -26.978260040283203, "global_step": 431673, "epoch": 5200} {"train_loss": -26.74004554748535, "global_step": 431674, "epoch": 5200} {"train_loss": -26.85065269470215, "global_step": 431675, "epoch": 5200} {"train_loss": -27.430938720703125, "global_step": 431676, "epoch": 5200} {"train_loss": -26.800901412963867, "global_step": 431677, "epoch": 5200} {"train_loss": -26.932453155517578, "global_step": 431678, "epoch": 5200} {"train_loss": -26.916227340698242, "global_step": 431679, "epoch": 5200} {"train_loss": -26.769393920898438, "global_step": 431680, "epoch": 5200} {"train_loss": -27.1898193359375, "global_step": 431681, "epoch": 5200} {"train_loss": -26.8028209180717, "global_step": 431682, "epoch": 5200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6884995.0} {"train_loss": -26.01673698425293, "global_step": 431683, "epoch": 5201} {"train_loss": -26.58548927307129, "global_step": 431684, "epoch": 5201} {"train_loss": -26.2945499420166, "global_step": 431685, "epoch": 5201} {"train_loss": -26.586811065673828, "global_step": 431686, "epoch": 5201} {"train_loss": -26.48187828063965, "global_step": 431687, "epoch": 5201} {"train_loss": -26.22733497619629, "global_step": 431688, "epoch": 5201} {"train_loss": -26.383365631103516, "global_step": 431689, "epoch": 5201} {"train_loss": -26.6759033203125, "global_step": 431690, "epoch": 5201} {"train_loss": -26.38453483581543, "global_step": 431691, "epoch": 5201} {"train_loss": -26.907791137695312, "global_step": 431692, "epoch": 5201} {"train_loss": -26.582075119018555, "global_step": 431693, "epoch": 5201} {"train_loss": -26.213720321655273, "global_step": 431694, "epoch": 5201} {"train_loss": -26.293073654174805, "global_step": 431695, "epoch": 5201} {"train_loss": -26.545745849609375, "global_step": 431696, "epoch": 5201} {"train_loss": -26.37700843811035, "global_step": 431697, "epoch": 5201} {"train_loss": -26.461423873901367, "global_step": 431698, "epoch": 5201} {"train_loss": -26.76300621032715, "global_step": 431699, "epoch": 5201} {"train_loss": -26.328521728515625, "global_step": 431700, "epoch": 5201} {"train_loss": -26.834762573242188, "global_step": 431701, "epoch": 5201} {"train_loss": -26.935016632080078, "global_step": 431702, "epoch": 5201} {"train_loss": -26.771726608276367, "global_step": 431703, "epoch": 5201} {"train_loss": -26.75546646118164, "global_step": 431704, "epoch": 5201} {"train_loss": -26.968708038330078, "global_step": 431705, "epoch": 5201} {"train_loss": -26.826614379882812, "global_step": 431706, "epoch": 5201} {"train_loss": -26.424591064453125, "global_step": 431707, "epoch": 5201} {"train_loss": -26.81947135925293, "global_step": 431708, "epoch": 5201} {"train_loss": -26.8149356842041, "global_step": 431709, "epoch": 5201} {"train_loss": -26.956594467163086, "global_step": 431710, "epoch": 5201} {"train_loss": -26.950088500976562, "global_step": 431711, "epoch": 5201} {"train_loss": -27.140644073486328, "global_step": 431712, "epoch": 5201} {"train_loss": -26.996335983276367, "global_step": 431713, "epoch": 5201} {"train_loss": -26.738866806030273, "global_step": 431714, "epoch": 5201} {"train_loss": -26.83949851989746, "global_step": 431715, "epoch": 5201} {"train_loss": -27.084808349609375, "global_step": 431716, "epoch": 5201} {"train_loss": -26.558942794799805, "global_step": 431717, "epoch": 5201} {"train_loss": -27.071149826049805, "global_step": 431718, "epoch": 5201} {"train_loss": -26.942670822143555, "global_step": 431719, "epoch": 5201} {"train_loss": -27.38752555847168, "global_step": 431720, "epoch": 5201} {"train_loss": -27.215381622314453, "global_step": 431721, "epoch": 5201} {"train_loss": -26.98939323425293, "global_step": 431722, "epoch": 5201} {"train_loss": -27.34161949157715, "global_step": 431723, "epoch": 5201} {"train_loss": -26.98349952697754, "global_step": 431724, "epoch": 5201} {"train_loss": -26.894983291625977, "global_step": 431725, "epoch": 5201} {"train_loss": -27.357498168945312, "global_step": 431726, "epoch": 5201} {"train_loss": -26.92561149597168, "global_step": 431727, "epoch": 5201} {"train_loss": -26.72963523864746, "global_step": 431728, "epoch": 5201} {"train_loss": -27.122472763061523, "global_step": 431729, "epoch": 5201} {"train_loss": -26.86860466003418, "global_step": 431730, "epoch": 5201} {"train_loss": -26.645864486694336, "global_step": 431731, "epoch": 5201} {"train_loss": -26.915790557861328, "global_step": 431732, "epoch": 5201} {"train_loss": -26.784992218017578, "global_step": 431733, "epoch": 5201} {"train_loss": -27.44830894470215, "global_step": 431734, "epoch": 5201} {"train_loss": -26.39096450805664, "global_step": 431735, "epoch": 5201} {"train_loss": -26.980737686157227, "global_step": 431736, "epoch": 5201} {"train_loss": -26.972211837768555, "global_step": 431737, "epoch": 5201} {"train_loss": -26.784292221069336, "global_step": 431738, "epoch": 5201} {"train_loss": -26.801538467407227, "global_step": 431739, "epoch": 5201} {"train_loss": -27.07520866394043, "global_step": 431740, "epoch": 5201} {"train_loss": -27.170103073120117, "global_step": 431741, "epoch": 5201} {"train_loss": -26.75567054748535, "global_step": 431742, "epoch": 5201} {"train_loss": -26.934675216674805, "global_step": 431743, "epoch": 5201} {"train_loss": -26.566198348999023, "global_step": 431744, "epoch": 5201} {"train_loss": -26.617965698242188, "global_step": 431745, "epoch": 5201} {"train_loss": -26.16046142578125, "global_step": 431746, "epoch": 5201} {"train_loss": -26.566787719726562, "global_step": 431747, "epoch": 5201} {"train_loss": -26.964954376220703, "global_step": 431748, "epoch": 5201} {"train_loss": -26.6766300201416, "global_step": 431749, "epoch": 5201} {"train_loss": -27.273422241210938, "global_step": 431750, "epoch": 5201} {"train_loss": -27.2083797454834, "global_step": 431751, "epoch": 5201} {"train_loss": -26.591054916381836, "global_step": 431752, "epoch": 5201} {"train_loss": -27.053613662719727, "global_step": 431753, "epoch": 5201} {"train_loss": -27.047916412353516, "global_step": 431754, "epoch": 5201} {"train_loss": -26.805639266967773, "global_step": 431755, "epoch": 5201} {"train_loss": -27.151098251342773, "global_step": 431756, "epoch": 5201} {"train_loss": -27.174036026000977, "global_step": 431757, "epoch": 5201} {"train_loss": -26.959110260009766, "global_step": 431758, "epoch": 5201} {"train_loss": -26.93672752380371, "global_step": 431759, "epoch": 5201} {"train_loss": -27.132434844970703, "global_step": 431760, "epoch": 5201} {"train_loss": -26.731229782104492, "global_step": 431761, "epoch": 5201} {"train_loss": -26.578454971313477, "global_step": 431762, "epoch": 5201} {"train_loss": -26.53095054626465, "global_step": 431763, "epoch": 5201} {"train_loss": -26.486541748046875, "global_step": 431764, "epoch": 5201} {"train_loss": -26.768593064273695, "global_step": 431765, "epoch": 5201, "val_loss": 6872732.0} {"train_loss": -25.1253662109375, "global_step": 431766, "epoch": 5202} {"train_loss": -25.222103118896484, "global_step": 431767, "epoch": 5202} {"train_loss": -25.932849884033203, "global_step": 431768, "epoch": 5202} {"train_loss": -24.942806243896484, "global_step": 431769, "epoch": 5202} {"train_loss": -25.745153427124023, "global_step": 431770, "epoch": 5202} {"train_loss": -25.832813262939453, "global_step": 431771, "epoch": 5202} {"train_loss": -25.482168197631836, "global_step": 431772, "epoch": 5202} {"train_loss": -25.451181411743164, "global_step": 431773, "epoch": 5202} {"train_loss": -26.306074142456055, "global_step": 431774, "epoch": 5202} {"train_loss": -25.87135124206543, "global_step": 431775, "epoch": 5202} {"train_loss": -26.1741886138916, "global_step": 431776, "epoch": 5202} {"train_loss": -26.283960342407227, "global_step": 431777, "epoch": 5202} {"train_loss": -25.937246322631836, "global_step": 431778, "epoch": 5202} {"train_loss": -26.643970489501953, "global_step": 431779, "epoch": 5202} {"train_loss": -26.17998695373535, "global_step": 431780, "epoch": 5202} {"train_loss": -26.3261661529541, "global_step": 431781, "epoch": 5202} {"train_loss": -26.5361328125, "global_step": 431782, "epoch": 5202} {"train_loss": -26.180723190307617, "global_step": 431783, "epoch": 5202} {"train_loss": -26.521331787109375, "global_step": 431784, "epoch": 5202} {"train_loss": -26.57708168029785, "global_step": 431785, "epoch": 5202} {"train_loss": -26.319091796875, "global_step": 431786, "epoch": 5202} {"train_loss": -26.503416061401367, "global_step": 431787, "epoch": 5202} {"train_loss": -26.73748207092285, "global_step": 431788, "epoch": 5202} {"train_loss": -26.339120864868164, "global_step": 431789, "epoch": 5202} {"train_loss": -26.4217472076416, "global_step": 431790, "epoch": 5202} {"train_loss": -26.586706161499023, "global_step": 431791, "epoch": 5202} {"train_loss": -26.38203239440918, "global_step": 431792, "epoch": 5202} {"train_loss": -26.0881290435791, "global_step": 431793, "epoch": 5202} {"train_loss": -26.7128849029541, "global_step": 431794, "epoch": 5202} {"train_loss": -26.826650619506836, "global_step": 431795, "epoch": 5202} {"train_loss": -26.472980499267578, "global_step": 431796, "epoch": 5202} {"train_loss": -26.711668014526367, "global_step": 431797, "epoch": 5202} {"train_loss": -26.301618576049805, "global_step": 431798, "epoch": 5202} {"train_loss": -26.872333526611328, "global_step": 431799, "epoch": 5202} {"train_loss": -27.11279296875, "global_step": 431800, "epoch": 5202} {"train_loss": -26.540307998657227, "global_step": 431801, "epoch": 5202} {"train_loss": -26.582117080688477, "global_step": 431802, "epoch": 5202} {"train_loss": -26.920978546142578, "global_step": 431803, "epoch": 5202} {"train_loss": -26.83619499206543, "global_step": 431804, "epoch": 5202} {"train_loss": -26.599424362182617, "global_step": 431805, "epoch": 5202} {"train_loss": -26.894662857055664, "global_step": 431806, "epoch": 5202} {"train_loss": -27.015424728393555, "global_step": 431807, "epoch": 5202} {"train_loss": -27.254003524780273, "global_step": 431808, "epoch": 5202} {"train_loss": -26.873498916625977, "global_step": 431809, "epoch": 5202} {"train_loss": -27.214338302612305, "global_step": 431810, "epoch": 5202} {"train_loss": -27.0797119140625, "global_step": 431811, "epoch": 5202} {"train_loss": -27.142343521118164, "global_step": 431812, "epoch": 5202} {"train_loss": -27.14093017578125, "global_step": 431813, "epoch": 5202} {"train_loss": -27.3498477935791, "global_step": 431814, "epoch": 5202} {"train_loss": -27.457321166992188, "global_step": 431815, "epoch": 5202} {"train_loss": -27.395904541015625, "global_step": 431816, "epoch": 5202} {"train_loss": -26.954397201538086, "global_step": 431817, "epoch": 5202} {"train_loss": -26.9320068359375, "global_step": 431818, "epoch": 5202} {"train_loss": -26.986074447631836, "global_step": 431819, "epoch": 5202} {"train_loss": -26.912994384765625, "global_step": 431820, "epoch": 5202} {"train_loss": -26.971332550048828, "global_step": 431821, "epoch": 5202} {"train_loss": -27.020322799682617, "global_step": 431822, "epoch": 5202} {"train_loss": -26.820837020874023, "global_step": 431823, "epoch": 5202} {"train_loss": -27.00653076171875, "global_step": 431824, "epoch": 5202} {"train_loss": -27.210269927978516, "global_step": 431825, "epoch": 5202} {"train_loss": -26.813756942749023, "global_step": 431826, "epoch": 5202} {"train_loss": -27.451486587524414, "global_step": 431827, "epoch": 5202} {"train_loss": -27.104963302612305, "global_step": 431828, "epoch": 5202} {"train_loss": -27.04188346862793, "global_step": 431829, "epoch": 5202} {"train_loss": -27.274703979492188, "global_step": 431830, "epoch": 5202} {"train_loss": -27.065372467041016, "global_step": 431831, "epoch": 5202} {"train_loss": -27.13043212890625, "global_step": 431832, "epoch": 5202} {"train_loss": -27.365570068359375, "global_step": 431833, "epoch": 5202} {"train_loss": -27.519454956054688, "global_step": 431834, "epoch": 5202} {"train_loss": -27.3284969329834, "global_step": 431835, "epoch": 5202} {"train_loss": -26.930927276611328, "global_step": 431836, "epoch": 5202} {"train_loss": -26.853296279907227, "global_step": 431837, "epoch": 5202} {"train_loss": -26.91961097717285, "global_step": 431838, "epoch": 5202} {"train_loss": -27.00986099243164, "global_step": 431839, "epoch": 5202} {"train_loss": -26.832382202148438, "global_step": 431840, "epoch": 5202} {"train_loss": -27.37409019470215, "global_step": 431841, "epoch": 5202} {"train_loss": -26.619293212890625, "global_step": 431842, "epoch": 5202} {"train_loss": -26.48065185546875, "global_step": 431843, "epoch": 5202} {"train_loss": -25.693771362304688, "global_step": 431844, "epoch": 5202} {"train_loss": -25.93758201599121, "global_step": 431845, "epoch": 5202} {"train_loss": -26.509931564331055, "global_step": 431846, "epoch": 5202} {"train_loss": -26.83534812927246, "global_step": 431847, "epoch": 5202} {"train_loss": -26.681042383952313, "global_step": 431848, "epoch": 5202, "val_loss": 6866022.5} {"train_loss": -23.71718406677246, "global_step": 431849, "epoch": 5203} {"train_loss": -25.751178741455078, "global_step": 431850, "epoch": 5203} {"train_loss": -24.926950454711914, "global_step": 431851, "epoch": 5203} {"train_loss": -26.174545288085938, "global_step": 431852, "epoch": 5203} {"train_loss": -25.156801223754883, "global_step": 431853, "epoch": 5203} {"train_loss": -25.89533805847168, "global_step": 431854, "epoch": 5203} {"train_loss": -25.972431182861328, "global_step": 431855, "epoch": 5203} {"train_loss": -25.334985733032227, "global_step": 431856, "epoch": 5203} {"train_loss": -25.79388427734375, "global_step": 431857, "epoch": 5203} {"train_loss": -25.960372924804688, "global_step": 431858, "epoch": 5203} {"train_loss": -26.112873077392578, "global_step": 431859, "epoch": 5203} {"train_loss": -26.336984634399414, "global_step": 431860, "epoch": 5203} {"train_loss": -26.23431396484375, "global_step": 431861, "epoch": 5203} {"train_loss": -25.928075790405273, "global_step": 431862, "epoch": 5203} {"train_loss": -26.42854118347168, "global_step": 431863, "epoch": 5203} {"train_loss": -26.513690948486328, "global_step": 431864, "epoch": 5203} {"train_loss": -26.221759796142578, "global_step": 431865, "epoch": 5203} {"train_loss": -26.249561309814453, "global_step": 431866, "epoch": 5203} {"train_loss": -26.38373374938965, "global_step": 431867, "epoch": 5203} {"train_loss": -25.904632568359375, "global_step": 431868, "epoch": 5203} {"train_loss": -26.503705978393555, "global_step": 431869, "epoch": 5203} {"train_loss": -26.516921997070312, "global_step": 431870, "epoch": 5203} {"train_loss": -26.659543991088867, "global_step": 431871, "epoch": 5203} {"train_loss": -26.39198112487793, "global_step": 431872, "epoch": 5203} {"train_loss": -26.474767684936523, "global_step": 431873, "epoch": 5203} {"train_loss": -26.505090713500977, "global_step": 431874, "epoch": 5203} {"train_loss": -26.55708122253418, "global_step": 431875, "epoch": 5203} {"train_loss": -26.967466354370117, "global_step": 431876, "epoch": 5203} {"train_loss": -26.833393096923828, "global_step": 431877, "epoch": 5203} {"train_loss": -26.66011619567871, "global_step": 431878, "epoch": 5203} {"train_loss": -26.536441802978516, "global_step": 431879, "epoch": 5203} {"train_loss": -26.99129295349121, "global_step": 431880, "epoch": 5203} {"train_loss": -26.848718643188477, "global_step": 431881, "epoch": 5203} {"train_loss": -26.741621017456055, "global_step": 431882, "epoch": 5203} {"train_loss": -26.391193389892578, "global_step": 431883, "epoch": 5203} {"train_loss": -27.076147079467773, "global_step": 431884, "epoch": 5203} {"train_loss": -26.66294288635254, "global_step": 431885, "epoch": 5203} {"train_loss": -26.619688034057617, "global_step": 431886, "epoch": 5203} {"train_loss": -26.460641860961914, "global_step": 431887, "epoch": 5203} {"train_loss": -26.668949127197266, "global_step": 431888, "epoch": 5203} {"train_loss": -26.91574478149414, "global_step": 431889, "epoch": 5203} {"train_loss": -26.73554039001465, "global_step": 431890, "epoch": 5203} {"train_loss": -27.00736427307129, "global_step": 431891, "epoch": 5203} {"train_loss": -26.558069229125977, "global_step": 431892, "epoch": 5203} {"train_loss": -26.856739044189453, "global_step": 431893, "epoch": 5203} {"train_loss": -26.53216552734375, "global_step": 431894, "epoch": 5203} {"train_loss": -26.851184844970703, "global_step": 431895, "epoch": 5203} {"train_loss": -26.871265411376953, "global_step": 431896, "epoch": 5203} {"train_loss": -26.42426109313965, "global_step": 431897, "epoch": 5203} {"train_loss": -27.09100914001465, "global_step": 431898, "epoch": 5203} {"train_loss": -27.094568252563477, "global_step": 431899, "epoch": 5203} {"train_loss": -27.0516357421875, "global_step": 431900, "epoch": 5203} {"train_loss": -27.044696807861328, "global_step": 431901, "epoch": 5203} {"train_loss": -27.044153213500977, "global_step": 431902, "epoch": 5203} {"train_loss": -27.406219482421875, "global_step": 431903, "epoch": 5203} {"train_loss": -26.949329376220703, "global_step": 431904, "epoch": 5203} {"train_loss": -27.11263084411621, "global_step": 431905, "epoch": 5203} {"train_loss": -27.10328483581543, "global_step": 431906, "epoch": 5203} {"train_loss": -27.215620040893555, "global_step": 431907, "epoch": 5203} {"train_loss": -26.7961483001709, "global_step": 431908, "epoch": 5203} {"train_loss": -27.280994415283203, "global_step": 431909, "epoch": 5203} {"train_loss": -27.011320114135742, "global_step": 431910, "epoch": 5203} {"train_loss": -26.9544620513916, "global_step": 431911, "epoch": 5203} {"train_loss": -27.350629806518555, "global_step": 431912, "epoch": 5203} {"train_loss": -26.810016632080078, "global_step": 431913, "epoch": 5203} {"train_loss": -27.11554527282715, "global_step": 431914, "epoch": 5203} {"train_loss": -27.386520385742188, "global_step": 431915, "epoch": 5203} {"train_loss": -26.95066261291504, "global_step": 431916, "epoch": 5203} {"train_loss": -27.4008731842041, "global_step": 431917, "epoch": 5203} {"train_loss": -27.38203239440918, "global_step": 431918, "epoch": 5203} {"train_loss": -26.756011962890625, "global_step": 431919, "epoch": 5203} {"train_loss": -26.74961280822754, "global_step": 431920, "epoch": 5203} {"train_loss": -27.0881290435791, "global_step": 431921, "epoch": 5203} {"train_loss": -26.809925079345703, "global_step": 431922, "epoch": 5203} {"train_loss": -27.025653839111328, "global_step": 431923, "epoch": 5203} {"train_loss": -27.08868408203125, "global_step": 431924, "epoch": 5203} {"train_loss": -26.97413444519043, "global_step": 431925, "epoch": 5203} {"train_loss": -26.907978057861328, "global_step": 431926, "epoch": 5203} {"train_loss": -26.83143424987793, "global_step": 431927, "epoch": 5203} {"train_loss": -27.2330379486084, "global_step": 431928, "epoch": 5203} {"train_loss": -27.208454132080078, "global_step": 431929, "epoch": 5203} {"train_loss": -26.986835479736328, "global_step": 431930, "epoch": 5203} {"train_loss": -26.643289198358374, "global_step": 431931, "epoch": 5203, "val_loss": 6904257.0} {"train_loss": -26.3013858795166, "global_step": 431932, "epoch": 5204} {"train_loss": -26.516443252563477, "global_step": 431933, "epoch": 5204} {"train_loss": -26.706384658813477, "global_step": 431934, "epoch": 5204} {"train_loss": -27.036258697509766, "global_step": 431935, "epoch": 5204} {"train_loss": -26.658039093017578, "global_step": 431936, "epoch": 5204} {"train_loss": -26.866674423217773, "global_step": 431937, "epoch": 5204} {"train_loss": -26.664764404296875, "global_step": 431938, "epoch": 5204} {"train_loss": -25.94071388244629, "global_step": 431939, "epoch": 5204} {"train_loss": -25.81216812133789, "global_step": 431940, "epoch": 5204} {"train_loss": -26.062976837158203, "global_step": 431941, "epoch": 5204} {"train_loss": -26.51703453063965, "global_step": 431942, "epoch": 5204} {"train_loss": -27.00758171081543, "global_step": 431943, "epoch": 5204} {"train_loss": -26.284748077392578, "global_step": 431944, "epoch": 5204} {"train_loss": -26.1795597076416, "global_step": 431945, "epoch": 5204} {"train_loss": -26.625720977783203, "global_step": 431946, "epoch": 5204} {"train_loss": -26.230939865112305, "global_step": 431947, "epoch": 5204} {"train_loss": -26.306324005126953, "global_step": 431948, "epoch": 5204} {"train_loss": -26.867938995361328, "global_step": 431949, "epoch": 5204} {"train_loss": -26.779367446899414, "global_step": 431950, "epoch": 5204} {"train_loss": -26.12808609008789, "global_step": 431951, "epoch": 5204} {"train_loss": -26.867582321166992, "global_step": 431952, "epoch": 5204} {"train_loss": -26.544031143188477, "global_step": 431953, "epoch": 5204} {"train_loss": -26.99112319946289, "global_step": 431954, "epoch": 5204} {"train_loss": -26.82906150817871, "global_step": 431955, "epoch": 5204} {"train_loss": -26.99616813659668, "global_step": 431956, "epoch": 5204} {"train_loss": -26.77716064453125, "global_step": 431957, "epoch": 5204} {"train_loss": -26.2148494720459, "global_step": 431958, "epoch": 5204} {"train_loss": -26.926136016845703, "global_step": 431959, "epoch": 5204} {"train_loss": -26.77241325378418, "global_step": 431960, "epoch": 5204} {"train_loss": -26.85542106628418, "global_step": 431961, "epoch": 5204} {"train_loss": -26.769580841064453, "global_step": 431962, "epoch": 5204} {"train_loss": -26.74334716796875, "global_step": 431963, "epoch": 5204} {"train_loss": -26.471105575561523, "global_step": 431964, "epoch": 5204} {"train_loss": -26.625614166259766, "global_step": 431965, "epoch": 5204} {"train_loss": -26.7264347076416, "global_step": 431966, "epoch": 5204} {"train_loss": -26.668075561523438, "global_step": 431967, "epoch": 5204} {"train_loss": -26.588165283203125, "global_step": 431968, "epoch": 5204} {"train_loss": -26.729276657104492, "global_step": 431969, "epoch": 5204} {"train_loss": -26.892993927001953, "global_step": 431970, "epoch": 5204} {"train_loss": -27.019744873046875, "global_step": 431971, "epoch": 5204} {"train_loss": -26.764856338500977, "global_step": 431972, "epoch": 5204} {"train_loss": -26.4057674407959, "global_step": 431973, "epoch": 5204} {"train_loss": -26.78487205505371, "global_step": 431974, "epoch": 5204} {"train_loss": -26.848363876342773, "global_step": 431975, "epoch": 5204} {"train_loss": -27.045454025268555, "global_step": 431976, "epoch": 5204} {"train_loss": -26.864553451538086, "global_step": 431977, "epoch": 5204} {"train_loss": -27.001188278198242, "global_step": 431978, "epoch": 5204} {"train_loss": -26.790857315063477, "global_step": 431979, "epoch": 5204} {"train_loss": -26.726957321166992, "global_step": 431980, "epoch": 5204} {"train_loss": -27.008316040039062, "global_step": 431981, "epoch": 5204} {"train_loss": -26.73357582092285, "global_step": 431982, "epoch": 5204} {"train_loss": -26.83924674987793, "global_step": 431983, "epoch": 5204} {"train_loss": -26.795759201049805, "global_step": 431984, "epoch": 5204} {"train_loss": -26.721622467041016, "global_step": 431985, "epoch": 5204} {"train_loss": -26.961008071899414, "global_step": 431986, "epoch": 5204} {"train_loss": -26.8476505279541, "global_step": 431987, "epoch": 5204} {"train_loss": -26.67791748046875, "global_step": 431988, "epoch": 5204} {"train_loss": -26.989288330078125, "global_step": 431989, "epoch": 5204} {"train_loss": -26.63046646118164, "global_step": 431990, "epoch": 5204} {"train_loss": -26.495161056518555, "global_step": 431991, "epoch": 5204} {"train_loss": -26.76611328125, "global_step": 431992, "epoch": 5204} {"train_loss": -26.52557945251465, "global_step": 431993, "epoch": 5204} {"train_loss": -26.96539878845215, "global_step": 431994, "epoch": 5204} {"train_loss": -26.825437545776367, "global_step": 431995, "epoch": 5204} {"train_loss": -26.8564395904541, "global_step": 431996, "epoch": 5204} {"train_loss": -27.135791778564453, "global_step": 431997, "epoch": 5204} {"train_loss": -26.932910919189453, "global_step": 431998, "epoch": 5204} {"train_loss": -26.663043975830078, "global_step": 431999, "epoch": 5204} {"train_loss": -26.8029727935791, "global_step": 432000, "epoch": 5204} {"train_loss": -26.685989379882812, "global_step": 432001, "epoch": 5204} {"train_loss": -26.9792537689209, "global_step": 432002, "epoch": 5204} {"train_loss": -26.6061954498291, "global_step": 432003, "epoch": 5204} {"train_loss": -27.061767578125, "global_step": 432004, "epoch": 5204} {"train_loss": -26.915180206298828, "global_step": 432005, "epoch": 5204} {"train_loss": -26.752164840698242, "global_step": 432006, "epoch": 5204} {"train_loss": -26.91015625, "global_step": 432007, "epoch": 5204} {"train_loss": -27.017654418945312, "global_step": 432008, "epoch": 5204} {"train_loss": -27.153593063354492, "global_step": 432009, "epoch": 5204} {"train_loss": -26.735111236572266, "global_step": 432010, "epoch": 5204} {"train_loss": -26.92609214782715, "global_step": 432011, "epoch": 5204} {"train_loss": -27.07526206970215, "global_step": 432012, "epoch": 5204} {"train_loss": -26.983993530273438, "global_step": 432013, "epoch": 5204} {"train_loss": -26.731000739407826, "global_step": 432014, "epoch": 5204, "val_loss": 6814837.0} {"train_loss": -26.221511840820312, "global_step": 432015, "epoch": 5205} {"train_loss": -26.1424503326416, "global_step": 432016, "epoch": 5205} {"train_loss": -26.710073471069336, "global_step": 432017, "epoch": 5205} {"train_loss": -26.613967895507812, "global_step": 432018, "epoch": 5205} {"train_loss": -26.794530868530273, "global_step": 432019, "epoch": 5205} {"train_loss": -26.625329971313477, "global_step": 432020, "epoch": 5205} {"train_loss": -26.516021728515625, "global_step": 432021, "epoch": 5205} {"train_loss": -26.884366989135742, "global_step": 432022, "epoch": 5205} {"train_loss": -27.14442253112793, "global_step": 432023, "epoch": 5205} {"train_loss": -26.607757568359375, "global_step": 432024, "epoch": 5205} {"train_loss": -27.058019638061523, "global_step": 432025, "epoch": 5205} {"train_loss": -26.6287899017334, "global_step": 432026, "epoch": 5205} {"train_loss": -26.975482940673828, "global_step": 432027, "epoch": 5205} {"train_loss": -26.648284912109375, "global_step": 432028, "epoch": 5205} {"train_loss": -26.9764404296875, "global_step": 432029, "epoch": 5205} {"train_loss": -26.76997184753418, "global_step": 432030, "epoch": 5205} {"train_loss": -26.680871963500977, "global_step": 432031, "epoch": 5205} {"train_loss": -27.043792724609375, "global_step": 432032, "epoch": 5205} {"train_loss": -27.0101318359375, "global_step": 432033, "epoch": 5205} {"train_loss": -27.398990631103516, "global_step": 432034, "epoch": 5205} {"train_loss": -27.337156295776367, "global_step": 432035, "epoch": 5205} {"train_loss": -27.0372257232666, "global_step": 432036, "epoch": 5205} {"train_loss": -26.997333526611328, "global_step": 432037, "epoch": 5205} {"train_loss": -26.77251625061035, "global_step": 432038, "epoch": 5205} {"train_loss": -27.12183952331543, "global_step": 432039, "epoch": 5205} {"train_loss": -26.967695236206055, "global_step": 432040, "epoch": 5205} {"train_loss": -27.111974716186523, "global_step": 432041, "epoch": 5205} {"train_loss": -26.62833023071289, "global_step": 432042, "epoch": 5205} {"train_loss": -27.073434829711914, "global_step": 432043, "epoch": 5205} {"train_loss": -26.940967559814453, "global_step": 432044, "epoch": 5205} {"train_loss": -27.002338409423828, "global_step": 432045, "epoch": 5205} {"train_loss": -26.564741134643555, "global_step": 432046, "epoch": 5205} {"train_loss": -26.607351303100586, "global_step": 432047, "epoch": 5205} {"train_loss": -26.733190536499023, "global_step": 432048, "epoch": 5205} {"train_loss": -27.293441772460938, "global_step": 432049, "epoch": 5205} {"train_loss": -27.09095573425293, "global_step": 432050, "epoch": 5205} {"train_loss": -26.953733444213867, "global_step": 432051, "epoch": 5205} {"train_loss": -27.14090919494629, "global_step": 432052, "epoch": 5205} {"train_loss": -26.76246452331543, "global_step": 432053, "epoch": 5205} {"train_loss": -26.75679588317871, "global_step": 432054, "epoch": 5205} {"train_loss": -26.854196548461914, "global_step": 432055, "epoch": 5205} {"train_loss": -27.04408073425293, "global_step": 432056, "epoch": 5205} {"train_loss": -26.7044734954834, "global_step": 432057, "epoch": 5205} {"train_loss": -26.71217155456543, "global_step": 432058, "epoch": 5205} {"train_loss": -26.823760986328125, "global_step": 432059, "epoch": 5205} {"train_loss": -26.619831085205078, "global_step": 432060, "epoch": 5205} {"train_loss": -26.843463897705078, "global_step": 432061, "epoch": 5205} {"train_loss": -26.95570182800293, "global_step": 432062, "epoch": 5205} {"train_loss": -27.143890380859375, "global_step": 432063, "epoch": 5205} {"train_loss": -26.302343368530273, "global_step": 432064, "epoch": 5205} {"train_loss": -26.358755111694336, "global_step": 432065, "epoch": 5205} {"train_loss": -27.082763671875, "global_step": 432066, "epoch": 5205} {"train_loss": -26.886625289916992, "global_step": 432067, "epoch": 5205} {"train_loss": -27.237060546875, "global_step": 432068, "epoch": 5205} {"train_loss": -26.788455963134766, "global_step": 432069, "epoch": 5205} {"train_loss": -27.109149932861328, "global_step": 432070, "epoch": 5205} {"train_loss": -26.8681583404541, "global_step": 432071, "epoch": 5205} {"train_loss": -26.82453727722168, "global_step": 432072, "epoch": 5205} {"train_loss": -27.159332275390625, "global_step": 432073, "epoch": 5205} {"train_loss": -26.71295166015625, "global_step": 432074, "epoch": 5205} {"train_loss": -26.8814640045166, "global_step": 432075, "epoch": 5205} {"train_loss": -27.019189834594727, "global_step": 432076, "epoch": 5205} {"train_loss": -27.040393829345703, "global_step": 432077, "epoch": 5205} {"train_loss": -26.88837242126465, "global_step": 432078, "epoch": 5205} {"train_loss": -27.16888999938965, "global_step": 432079, "epoch": 5205} {"train_loss": -26.933969497680664, "global_step": 432080, "epoch": 5205} {"train_loss": -26.8511905670166, "global_step": 432081, "epoch": 5205} {"train_loss": -27.008331298828125, "global_step": 432082, "epoch": 5205} {"train_loss": -26.933629989624023, "global_step": 432083, "epoch": 5205} {"train_loss": -26.960681915283203, "global_step": 432084, "epoch": 5205} {"train_loss": -26.85711097717285, "global_step": 432085, "epoch": 5205} {"train_loss": -26.942296981811523, "global_step": 432086, "epoch": 5205} {"train_loss": -26.7769718170166, "global_step": 432087, "epoch": 5205} {"train_loss": -27.147253036499023, "global_step": 432088, "epoch": 5205} {"train_loss": -27.199359893798828, "global_step": 432089, "epoch": 5205} {"train_loss": -27.087438583374023, "global_step": 432090, "epoch": 5205} {"train_loss": -27.3006591796875, "global_step": 432091, "epoch": 5205} {"train_loss": -26.9315128326416, "global_step": 432092, "epoch": 5205} {"train_loss": -26.888288497924805, "global_step": 432093, "epoch": 5205} {"train_loss": -26.619327545166016, "global_step": 432094, "epoch": 5205} {"train_loss": -26.945444107055664, "global_step": 432095, "epoch": 5205} {"train_loss": -26.96016502380371, "global_step": 432096, "epoch": 5205} {"train_loss": -26.90301748068936, "global_step": 432097, "epoch": 5205, "val_loss": 6814953.0} {"train_loss": -26.897146224975586, "global_step": 432098, "epoch": 5206} {"train_loss": -27.0966796875, "global_step": 432099, "epoch": 5206} {"train_loss": -26.584442138671875, "global_step": 432100, "epoch": 5206} {"train_loss": -26.651391983032227, "global_step": 432101, "epoch": 5206} {"train_loss": -26.673913955688477, "global_step": 432102, "epoch": 5206} {"train_loss": -26.40256118774414, "global_step": 432103, "epoch": 5206} {"train_loss": -26.64118003845215, "global_step": 432104, "epoch": 5206} {"train_loss": -26.745010375976562, "global_step": 432105, "epoch": 5206} {"train_loss": -26.891742706298828, "global_step": 432106, "epoch": 5206} {"train_loss": -26.828556060791016, "global_step": 432107, "epoch": 5206} {"train_loss": -27.10055923461914, "global_step": 432108, "epoch": 5206} {"train_loss": -27.009769439697266, "global_step": 432109, "epoch": 5206} {"train_loss": -26.509748458862305, "global_step": 432110, "epoch": 5206} {"train_loss": -26.786108016967773, "global_step": 432111, "epoch": 5206} {"train_loss": -26.954984664916992, "global_step": 432112, "epoch": 5206} {"train_loss": -27.0098876953125, "global_step": 432113, "epoch": 5206} {"train_loss": -26.769262313842773, "global_step": 432114, "epoch": 5206} {"train_loss": -26.982025146484375, "global_step": 432115, "epoch": 5206} {"train_loss": -26.557498931884766, "global_step": 432116, "epoch": 5206} {"train_loss": -26.361722946166992, "global_step": 432117, "epoch": 5206} {"train_loss": -26.62131118774414, "global_step": 432118, "epoch": 5206} {"train_loss": -27.043628692626953, "global_step": 432119, "epoch": 5206} {"train_loss": -27.07526206970215, "global_step": 432120, "epoch": 5206} {"train_loss": -26.835378646850586, "global_step": 432121, "epoch": 5206} {"train_loss": -26.748029708862305, "global_step": 432122, "epoch": 5206} {"train_loss": -26.40578269958496, "global_step": 432123, "epoch": 5206} {"train_loss": -26.682357788085938, "global_step": 432124, "epoch": 5206} {"train_loss": -26.75980567932129, "global_step": 432125, "epoch": 5206} {"train_loss": -26.793167114257812, "global_step": 432126, "epoch": 5206} {"train_loss": -26.865985870361328, "global_step": 432127, "epoch": 5206} {"train_loss": -26.947925567626953, "global_step": 432128, "epoch": 5206} {"train_loss": -26.526914596557617, "global_step": 432129, "epoch": 5206} {"train_loss": -27.146825790405273, "global_step": 432130, "epoch": 5206} {"train_loss": -27.018817901611328, "global_step": 432131, "epoch": 5206} {"train_loss": -26.9533634185791, "global_step": 432132, "epoch": 5206} {"train_loss": -27.021820068359375, "global_step": 432133, "epoch": 5206} {"train_loss": -27.03125, "global_step": 432134, "epoch": 5206} {"train_loss": -26.626047134399414, "global_step": 432135, "epoch": 5206} {"train_loss": -26.778675079345703, "global_step": 432136, "epoch": 5206} {"train_loss": -26.723770141601562, "global_step": 432137, "epoch": 5206} {"train_loss": -26.695966720581055, "global_step": 432138, "epoch": 5206} {"train_loss": -26.844940185546875, "global_step": 432139, "epoch": 5206} {"train_loss": -26.853240966796875, "global_step": 432140, "epoch": 5206} {"train_loss": -27.043704986572266, "global_step": 432141, "epoch": 5206} {"train_loss": -27.28322410583496, "global_step": 432142, "epoch": 5206} {"train_loss": -26.8684024810791, "global_step": 432143, "epoch": 5206} {"train_loss": -27.207990646362305, "global_step": 432144, "epoch": 5206} {"train_loss": -27.050939559936523, "global_step": 432145, "epoch": 5206} {"train_loss": -27.123672485351562, "global_step": 432146, "epoch": 5206} {"train_loss": -26.975910186767578, "global_step": 432147, "epoch": 5206} {"train_loss": -27.086734771728516, "global_step": 432148, "epoch": 5206} {"train_loss": -27.29670524597168, "global_step": 432149, "epoch": 5206} {"train_loss": -26.764982223510742, "global_step": 432150, "epoch": 5206} {"train_loss": -27.20734214782715, "global_step": 432151, "epoch": 5206} {"train_loss": -26.887842178344727, "global_step": 432152, "epoch": 5206} {"train_loss": -26.9282169342041, "global_step": 432153, "epoch": 5206} {"train_loss": -27.02081298828125, "global_step": 432154, "epoch": 5206} {"train_loss": -27.000980377197266, "global_step": 432155, "epoch": 5206} {"train_loss": -27.000030517578125, "global_step": 432156, "epoch": 5206} {"train_loss": -27.275989532470703, "global_step": 432157, "epoch": 5206} {"train_loss": -27.086740493774414, "global_step": 432158, "epoch": 5206} {"train_loss": -27.3183650970459, "global_step": 432159, "epoch": 5206} {"train_loss": -26.630157470703125, "global_step": 432160, "epoch": 5206} {"train_loss": -27.48707389831543, "global_step": 432161, "epoch": 5206} {"train_loss": -26.622364044189453, "global_step": 432162, "epoch": 5206} {"train_loss": -27.08782386779785, "global_step": 432163, "epoch": 5206} {"train_loss": -27.134408950805664, "global_step": 432164, "epoch": 5206} {"train_loss": -26.846546173095703, "global_step": 432165, "epoch": 5206} {"train_loss": -26.91106605529785, "global_step": 432166, "epoch": 5206} {"train_loss": -26.992521286010742, "global_step": 432167, "epoch": 5206} {"train_loss": -26.837371826171875, "global_step": 432168, "epoch": 5206} {"train_loss": -27.144275665283203, "global_step": 432169, "epoch": 5206} {"train_loss": -27.067676544189453, "global_step": 432170, "epoch": 5206} {"train_loss": -26.8165340423584, "global_step": 432171, "epoch": 5206} {"train_loss": -27.009408950805664, "global_step": 432172, "epoch": 5206} {"train_loss": -27.12799072265625, "global_step": 432173, "epoch": 5206} {"train_loss": -26.7308292388916, "global_step": 432174, "epoch": 5206} {"train_loss": -26.764759063720703, "global_step": 432175, "epoch": 5206} {"train_loss": -26.985021591186523, "global_step": 432176, "epoch": 5206} {"train_loss": -27.060773849487305, "global_step": 432177, "epoch": 5206} {"train_loss": -26.757383346557617, "global_step": 432178, "epoch": 5206} {"train_loss": -26.557880401611328, "global_step": 432179, "epoch": 5206} {"train_loss": -26.89628373571189, "global_step": 432180, "epoch": 5206, "val_loss": 6855069.0} {"train_loss": -26.466238021850586, "global_step": 432181, "epoch": 5207} {"train_loss": -25.503936767578125, "global_step": 432182, "epoch": 5207} {"train_loss": -26.186609268188477, "global_step": 432183, "epoch": 5207} {"train_loss": -25.576868057250977, "global_step": 432184, "epoch": 5207} {"train_loss": -26.66938591003418, "global_step": 432185, "epoch": 5207} {"train_loss": -26.162124633789062, "global_step": 432186, "epoch": 5207} {"train_loss": -26.343671798706055, "global_step": 432187, "epoch": 5207} {"train_loss": -25.99458122253418, "global_step": 432188, "epoch": 5207} {"train_loss": -26.206567764282227, "global_step": 432189, "epoch": 5207} {"train_loss": -26.368045806884766, "global_step": 432190, "epoch": 5207} {"train_loss": -26.603351593017578, "global_step": 432191, "epoch": 5207} {"train_loss": -26.860260009765625, "global_step": 432192, "epoch": 5207} {"train_loss": -26.68744468688965, "global_step": 432193, "epoch": 5207} {"train_loss": -26.506086349487305, "global_step": 432194, "epoch": 5207} {"train_loss": -26.548635482788086, "global_step": 432195, "epoch": 5207} {"train_loss": -26.8909912109375, "global_step": 432196, "epoch": 5207} {"train_loss": -26.8498592376709, "global_step": 432197, "epoch": 5207} {"train_loss": -26.464567184448242, "global_step": 432198, "epoch": 5207} {"train_loss": -26.803823471069336, "global_step": 432199, "epoch": 5207} {"train_loss": -26.671554565429688, "global_step": 432200, "epoch": 5207} {"train_loss": -26.799945831298828, "global_step": 432201, "epoch": 5207} {"train_loss": -26.690412521362305, "global_step": 432202, "epoch": 5207} {"train_loss": -26.591886520385742, "global_step": 432203, "epoch": 5207} {"train_loss": -26.989816665649414, "global_step": 432204, "epoch": 5207} {"train_loss": -27.07248306274414, "global_step": 432205, "epoch": 5207} {"train_loss": -26.71282958984375, "global_step": 432206, "epoch": 5207} {"train_loss": -27.2137393951416, "global_step": 432207, "epoch": 5207} {"train_loss": -26.59869956970215, "global_step": 432208, "epoch": 5207} {"train_loss": -26.909072875976562, "global_step": 432209, "epoch": 5207} {"train_loss": -26.45392417907715, "global_step": 432210, "epoch": 5207} {"train_loss": -26.772464752197266, "global_step": 432211, "epoch": 5207} {"train_loss": -26.66094398498535, "global_step": 432212, "epoch": 5207} {"train_loss": -27.18120765686035, "global_step": 432213, "epoch": 5207} {"train_loss": -26.945819854736328, "global_step": 432214, "epoch": 5207} {"train_loss": -26.55775260925293, "global_step": 432215, "epoch": 5207} {"train_loss": -26.895526885986328, "global_step": 432216, "epoch": 5207} {"train_loss": -27.03325843811035, "global_step": 432217, "epoch": 5207} {"train_loss": -26.830963134765625, "global_step": 432218, "epoch": 5207} {"train_loss": -26.6586971282959, "global_step": 432219, "epoch": 5207} {"train_loss": -26.774585723876953, "global_step": 432220, "epoch": 5207} {"train_loss": -27.038732528686523, "global_step": 432221, "epoch": 5207} {"train_loss": -26.613525390625, "global_step": 432222, "epoch": 5207} {"train_loss": -26.4340763092041, "global_step": 432223, "epoch": 5207} {"train_loss": -26.736417770385742, "global_step": 432224, "epoch": 5207} {"train_loss": -27.051544189453125, "global_step": 432225, "epoch": 5207} {"train_loss": -26.642459869384766, "global_step": 432226, "epoch": 5207} {"train_loss": -27.023365020751953, "global_step": 432227, "epoch": 5207} {"train_loss": -27.150434494018555, "global_step": 432228, "epoch": 5207} {"train_loss": -26.84107780456543, "global_step": 432229, "epoch": 5207} {"train_loss": -26.75860595703125, "global_step": 432230, "epoch": 5207} {"train_loss": -26.50433349609375, "global_step": 432231, "epoch": 5207} {"train_loss": -26.672983169555664, "global_step": 432232, "epoch": 5207} {"train_loss": -26.88081169128418, "global_step": 432233, "epoch": 5207} {"train_loss": -27.05006217956543, "global_step": 432234, "epoch": 5207} {"train_loss": -26.737157821655273, "global_step": 432235, "epoch": 5207} {"train_loss": -26.848499298095703, "global_step": 432236, "epoch": 5207} {"train_loss": -27.162601470947266, "global_step": 432237, "epoch": 5207} {"train_loss": -27.266891479492188, "global_step": 432238, "epoch": 5207} {"train_loss": -26.24049949645996, "global_step": 432239, "epoch": 5207} {"train_loss": -26.4044246673584, "global_step": 432240, "epoch": 5207} {"train_loss": -26.484067916870117, "global_step": 432241, "epoch": 5207} {"train_loss": -26.920181274414062, "global_step": 432242, "epoch": 5207} {"train_loss": -26.503442764282227, "global_step": 432243, "epoch": 5207} {"train_loss": -26.694564819335938, "global_step": 432244, "epoch": 5207} {"train_loss": -26.66615104675293, "global_step": 432245, "epoch": 5207} {"train_loss": -26.834264755249023, "global_step": 432246, "epoch": 5207} {"train_loss": -27.079715728759766, "global_step": 432247, "epoch": 5207} {"train_loss": -26.9732666015625, "global_step": 432248, "epoch": 5207} {"train_loss": -26.810239791870117, "global_step": 432249, "epoch": 5207} {"train_loss": -26.993947982788086, "global_step": 432250, "epoch": 5207} {"train_loss": -26.997390747070312, "global_step": 432251, "epoch": 5207} {"train_loss": -26.997528076171875, "global_step": 432252, "epoch": 5207} {"train_loss": -27.037139892578125, "global_step": 432253, "epoch": 5207} {"train_loss": -26.81389808654785, "global_step": 432254, "epoch": 5207} {"train_loss": -27.23432731628418, "global_step": 432255, "epoch": 5207} {"train_loss": -27.406253814697266, "global_step": 432256, "epoch": 5207} {"train_loss": -26.82858657836914, "global_step": 432257, "epoch": 5207} {"train_loss": -26.826684951782227, "global_step": 432258, "epoch": 5207} {"train_loss": -26.96933937072754, "global_step": 432259, "epoch": 5207} {"train_loss": -26.99067497253418, "global_step": 432260, "epoch": 5207} {"train_loss": -27.186542510986328, "global_step": 432261, "epoch": 5207} {"train_loss": -27.00760841369629, "global_step": 432262, "epoch": 5207} {"train_loss": -26.746723152068725, "global_step": 432263, "epoch": 5207, "val_loss": 6833648.0} {"train_loss": -26.60984230041504, "global_step": 432264, "epoch": 5208} {"train_loss": -26.54361343383789, "global_step": 432265, "epoch": 5208} {"train_loss": -26.5930233001709, "global_step": 432266, "epoch": 5208} {"train_loss": -27.1739444732666, "global_step": 432267, "epoch": 5208} {"train_loss": -27.007944107055664, "global_step": 432268, "epoch": 5208} {"train_loss": -26.69189453125, "global_step": 432269, "epoch": 5208} {"train_loss": -27.057714462280273, "global_step": 432270, "epoch": 5208} {"train_loss": -27.226388931274414, "global_step": 432271, "epoch": 5208} {"train_loss": -26.441120147705078, "global_step": 432272, "epoch": 5208} {"train_loss": -26.665475845336914, "global_step": 432273, "epoch": 5208} {"train_loss": -26.598913192749023, "global_step": 432274, "epoch": 5208} {"train_loss": -26.9250545501709, "global_step": 432275, "epoch": 5208} {"train_loss": -26.882566452026367, "global_step": 432276, "epoch": 5208} {"train_loss": -26.867151260375977, "global_step": 432277, "epoch": 5208} {"train_loss": -26.919021606445312, "global_step": 432278, "epoch": 5208} {"train_loss": -26.838958740234375, "global_step": 432279, "epoch": 5208} {"train_loss": -26.979516983032227, "global_step": 432280, "epoch": 5208} {"train_loss": -26.638153076171875, "global_step": 432281, "epoch": 5208} {"train_loss": -27.034711837768555, "global_step": 432282, "epoch": 5208} {"train_loss": -27.032316207885742, "global_step": 432283, "epoch": 5208} {"train_loss": -26.676511764526367, "global_step": 432284, "epoch": 5208} {"train_loss": -27.05716323852539, "global_step": 432285, "epoch": 5208} {"train_loss": -26.77606773376465, "global_step": 432286, "epoch": 5208} {"train_loss": -26.83577537536621, "global_step": 432287, "epoch": 5208} {"train_loss": -26.953338623046875, "global_step": 432288, "epoch": 5208} {"train_loss": -27.06597900390625, "global_step": 432289, "epoch": 5208} {"train_loss": -27.053272247314453, "global_step": 432290, "epoch": 5208} {"train_loss": -27.166330337524414, "global_step": 432291, "epoch": 5208} {"train_loss": -27.0307559967041, "global_step": 432292, "epoch": 5208} {"train_loss": -26.980154037475586, "global_step": 432293, "epoch": 5208} {"train_loss": -26.85015869140625, "global_step": 432294, "epoch": 5208} {"train_loss": -27.23638343811035, "global_step": 432295, "epoch": 5208} {"train_loss": -26.90900230407715, "global_step": 432296, "epoch": 5208} {"train_loss": -26.95277214050293, "global_step": 432297, "epoch": 5208} {"train_loss": -27.063934326171875, "global_step": 432298, "epoch": 5208} {"train_loss": -26.94534683227539, "global_step": 432299, "epoch": 5208} {"train_loss": -27.04853630065918, "global_step": 432300, "epoch": 5208} {"train_loss": -27.29081153869629, "global_step": 432301, "epoch": 5208} {"train_loss": -27.287168502807617, "global_step": 432302, "epoch": 5208} {"train_loss": -27.06483268737793, "global_step": 432303, "epoch": 5208} {"train_loss": -27.20842933654785, "global_step": 432304, "epoch": 5208} {"train_loss": -27.10755729675293, "global_step": 432305, "epoch": 5208} {"train_loss": -26.89768409729004, "global_step": 432306, "epoch": 5208} {"train_loss": -27.49249267578125, "global_step": 432307, "epoch": 5208} {"train_loss": -27.058963775634766, "global_step": 432308, "epoch": 5208} {"train_loss": -27.223499298095703, "global_step": 432309, "epoch": 5208} {"train_loss": -27.322986602783203, "global_step": 432310, "epoch": 5208} {"train_loss": -27.040348052978516, "global_step": 432311, "epoch": 5208} {"train_loss": -26.876062393188477, "global_step": 432312, "epoch": 5208} {"train_loss": -27.277204513549805, "global_step": 432313, "epoch": 5208} {"train_loss": -26.385452270507812, "global_step": 432314, "epoch": 5208} {"train_loss": -25.95881462097168, "global_step": 432315, "epoch": 5208} {"train_loss": -25.59214210510254, "global_step": 432316, "epoch": 5208} {"train_loss": -25.977048873901367, "global_step": 432317, "epoch": 5208} {"train_loss": -25.140478134155273, "global_step": 432318, "epoch": 5208} {"train_loss": -26.0051212310791, "global_step": 432319, "epoch": 5208} {"train_loss": -27.128803253173828, "global_step": 432320, "epoch": 5208} {"train_loss": -25.994489669799805, "global_step": 432321, "epoch": 5208} {"train_loss": -26.5919189453125, "global_step": 432322, "epoch": 5208} {"train_loss": -26.95180320739746, "global_step": 432323, "epoch": 5208} {"train_loss": -26.132360458374023, "global_step": 432324, "epoch": 5208} {"train_loss": -26.657489776611328, "global_step": 432325, "epoch": 5208} {"train_loss": -26.4682559967041, "global_step": 432326, "epoch": 5208} {"train_loss": -26.652286529541016, "global_step": 432327, "epoch": 5208} {"train_loss": -26.207473754882812, "global_step": 432328, "epoch": 5208} {"train_loss": -27.034833908081055, "global_step": 432329, "epoch": 5208} {"train_loss": -26.2845401763916, "global_step": 432330, "epoch": 5208} {"train_loss": -26.285903930664062, "global_step": 432331, "epoch": 5208} {"train_loss": -26.165136337280273, "global_step": 432332, "epoch": 5208} {"train_loss": -26.46048355102539, "global_step": 432333, "epoch": 5208} {"train_loss": -26.31647300720215, "global_step": 432334, "epoch": 5208} {"train_loss": -26.0549259185791, "global_step": 432335, "epoch": 5208} {"train_loss": -26.474695205688477, "global_step": 432336, "epoch": 5208} {"train_loss": -26.468427658081055, "global_step": 432337, "epoch": 5208} {"train_loss": -26.709009170532227, "global_step": 432338, "epoch": 5208} {"train_loss": -26.87031364440918, "global_step": 432339, "epoch": 5208} {"train_loss": -27.001989364624023, "global_step": 432340, "epoch": 5208} {"train_loss": -26.708221435546875, "global_step": 432341, "epoch": 5208} {"train_loss": -26.73074722290039, "global_step": 432342, "epoch": 5208} {"train_loss": -26.833776473999023, "global_step": 432343, "epoch": 5208} {"train_loss": -26.696441650390625, "global_step": 432344, "epoch": 5208} {"train_loss": -26.95473289489746, "global_step": 432345, "epoch": 5208} {"train_loss": -26.747432318078467, "global_step": 432346, "epoch": 5208, "val_loss": 6872683.5} {"train_loss": -26.684940338134766, "global_step": 432347, "epoch": 5209} {"train_loss": -26.459226608276367, "global_step": 432348, "epoch": 5209} {"train_loss": -26.684289932250977, "global_step": 432349, "epoch": 5209} {"train_loss": -26.487354278564453, "global_step": 432350, "epoch": 5209} {"train_loss": -26.146392822265625, "global_step": 432351, "epoch": 5209} {"train_loss": -26.18842887878418, "global_step": 432352, "epoch": 5209} {"train_loss": -26.5604190826416, "global_step": 432353, "epoch": 5209} {"train_loss": -26.74240493774414, "global_step": 432354, "epoch": 5209} {"train_loss": -26.6802921295166, "global_step": 432355, "epoch": 5209} {"train_loss": -26.21950340270996, "global_step": 432356, "epoch": 5209} {"train_loss": -26.724645614624023, "global_step": 432357, "epoch": 5209} {"train_loss": -26.82906150817871, "global_step": 432358, "epoch": 5209} {"train_loss": -27.113529205322266, "global_step": 432359, "epoch": 5209} {"train_loss": -26.776966094970703, "global_step": 432360, "epoch": 5209} {"train_loss": -26.646284103393555, "global_step": 432361, "epoch": 5209} {"train_loss": -26.7042236328125, "global_step": 432362, "epoch": 5209} {"train_loss": -26.897308349609375, "global_step": 432363, "epoch": 5209} {"train_loss": -26.771961212158203, "global_step": 432364, "epoch": 5209} {"train_loss": -26.887466430664062, "global_step": 432365, "epoch": 5209} {"train_loss": -27.049230575561523, "global_step": 432366, "epoch": 5209} {"train_loss": -26.526752471923828, "global_step": 432367, "epoch": 5209} {"train_loss": -26.71417808532715, "global_step": 432368, "epoch": 5209} {"train_loss": -26.83408546447754, "global_step": 432369, "epoch": 5209} {"train_loss": -26.927793502807617, "global_step": 432370, "epoch": 5209} {"train_loss": -26.998823165893555, "global_step": 432371, "epoch": 5209} {"train_loss": -26.592859268188477, "global_step": 432372, "epoch": 5209} {"train_loss": -26.8558292388916, "global_step": 432373, "epoch": 5209} {"train_loss": -26.906538009643555, "global_step": 432374, "epoch": 5209} {"train_loss": -26.79331398010254, "global_step": 432375, "epoch": 5209} {"train_loss": -27.007307052612305, "global_step": 432376, "epoch": 5209} {"train_loss": -26.955286026000977, "global_step": 432377, "epoch": 5209} {"train_loss": -26.448383331298828, "global_step": 432378, "epoch": 5209} {"train_loss": -26.634185791015625, "global_step": 432379, "epoch": 5209} {"train_loss": -27.042285919189453, "global_step": 432380, "epoch": 5209} {"train_loss": -26.912494659423828, "global_step": 432381, "epoch": 5209} {"train_loss": -26.93507957458496, "global_step": 432382, "epoch": 5209} {"train_loss": -26.4748592376709, "global_step": 432383, "epoch": 5209} {"train_loss": -27.04766845703125, "global_step": 432384, "epoch": 5209} {"train_loss": -27.2093505859375, "global_step": 432385, "epoch": 5209} {"train_loss": -27.087736129760742, "global_step": 432386, "epoch": 5209} {"train_loss": -27.3504695892334, "global_step": 432387, "epoch": 5209} {"train_loss": -26.78839111328125, "global_step": 432388, "epoch": 5209} {"train_loss": -26.999759674072266, "global_step": 432389, "epoch": 5209} {"train_loss": -27.420923233032227, "global_step": 432390, "epoch": 5209} {"train_loss": -27.21246910095215, "global_step": 432391, "epoch": 5209} {"train_loss": -26.430145263671875, "global_step": 432392, "epoch": 5209} {"train_loss": -26.422372817993164, "global_step": 432393, "epoch": 5209} {"train_loss": -26.2951717376709, "global_step": 432394, "epoch": 5209} {"train_loss": -26.61860466003418, "global_step": 432395, "epoch": 5209} {"train_loss": -27.056066513061523, "global_step": 432396, "epoch": 5209} {"train_loss": -26.98101806640625, "global_step": 432397, "epoch": 5209} {"train_loss": -27.169605255126953, "global_step": 432398, "epoch": 5209} {"train_loss": -27.087194442749023, "global_step": 432399, "epoch": 5209} {"train_loss": -27.49155616760254, "global_step": 432400, "epoch": 5209} {"train_loss": -27.607166290283203, "global_step": 432401, "epoch": 5209} {"train_loss": -26.786285400390625, "global_step": 432402, "epoch": 5209} {"train_loss": -27.074832916259766, "global_step": 432403, "epoch": 5209} {"train_loss": -26.736526489257812, "global_step": 432404, "epoch": 5209} {"train_loss": -26.933950424194336, "global_step": 432405, "epoch": 5209} {"train_loss": -26.87672233581543, "global_step": 432406, "epoch": 5209} {"train_loss": -27.182117462158203, "global_step": 432407, "epoch": 5209} {"train_loss": -27.176227569580078, "global_step": 432408, "epoch": 5209} {"train_loss": -27.03761100769043, "global_step": 432409, "epoch": 5209} {"train_loss": -26.69681739807129, "global_step": 432410, "epoch": 5209} {"train_loss": -26.671560287475586, "global_step": 432411, "epoch": 5209} {"train_loss": -26.515539169311523, "global_step": 432412, "epoch": 5209} {"train_loss": -26.29815101623535, "global_step": 432413, "epoch": 5209} {"train_loss": -26.718585968017578, "global_step": 432414, "epoch": 5209} {"train_loss": -26.921106338500977, "global_step": 432415, "epoch": 5209} {"train_loss": -26.461261749267578, "global_step": 432416, "epoch": 5209} {"train_loss": -26.082365036010742, "global_step": 432417, "epoch": 5209} {"train_loss": -25.728551864624023, "global_step": 432418, "epoch": 5209} {"train_loss": -25.661436080932617, "global_step": 432419, "epoch": 5209} {"train_loss": -26.604537963867188, "global_step": 432420, "epoch": 5209} {"train_loss": -25.09175682067871, "global_step": 432421, "epoch": 5209} {"train_loss": -25.761999130249023, "global_step": 432422, "epoch": 5209} {"train_loss": -25.932647705078125, "global_step": 432423, "epoch": 5209} {"train_loss": -26.313465118408203, "global_step": 432424, "epoch": 5209} {"train_loss": -26.414941787719727, "global_step": 432425, "epoch": 5209} {"train_loss": -26.482446670532227, "global_step": 432426, "epoch": 5209} {"train_loss": -26.601551055908203, "global_step": 432427, "epoch": 5209} {"train_loss": -26.35332679748535, "global_step": 432428, "epoch": 5209} {"train_loss": -26.68955490388066, "global_step": 432429, "epoch": 5209, "val_loss": 6852615.0} {"train_loss": -26.261981964111328, "global_step": 432430, "epoch": 5210} {"train_loss": -26.102188110351562, "global_step": 432431, "epoch": 5210} {"train_loss": -26.19373893737793, "global_step": 432432, "epoch": 5210} {"train_loss": -26.456954956054688, "global_step": 432433, "epoch": 5210} {"train_loss": -26.22893714904785, "global_step": 432434, "epoch": 5210} {"train_loss": -26.1049861907959, "global_step": 432435, "epoch": 5210} {"train_loss": -26.769027709960938, "global_step": 432436, "epoch": 5210} {"train_loss": -26.20063591003418, "global_step": 432437, "epoch": 5210} {"train_loss": -26.575048446655273, "global_step": 432438, "epoch": 5210} {"train_loss": -26.153059005737305, "global_step": 432439, "epoch": 5210} {"train_loss": -26.419591903686523, "global_step": 432440, "epoch": 5210} {"train_loss": -26.505746841430664, "global_step": 432441, "epoch": 5210} {"train_loss": -26.3287296295166, "global_step": 432442, "epoch": 5210} {"train_loss": -26.345014572143555, "global_step": 432443, "epoch": 5210} {"train_loss": -26.43814468383789, "global_step": 432444, "epoch": 5210} {"train_loss": -26.588171005249023, "global_step": 432445, "epoch": 5210} {"train_loss": -26.402624130249023, "global_step": 432446, "epoch": 5210} {"train_loss": -26.619245529174805, "global_step": 432447, "epoch": 5210} {"train_loss": -26.71192741394043, "global_step": 432448, "epoch": 5210} {"train_loss": -26.665058135986328, "global_step": 432449, "epoch": 5210} {"train_loss": -26.632532119750977, "global_step": 432450, "epoch": 5210} {"train_loss": -26.841968536376953, "global_step": 432451, "epoch": 5210} {"train_loss": -26.924238204956055, "global_step": 432452, "epoch": 5210} {"train_loss": -26.39347267150879, "global_step": 432453, "epoch": 5210} {"train_loss": -26.470703125, "global_step": 432454, "epoch": 5210} {"train_loss": -26.400436401367188, "global_step": 432455, "epoch": 5210} {"train_loss": -26.66328239440918, "global_step": 432456, "epoch": 5210} {"train_loss": -26.594165802001953, "global_step": 432457, "epoch": 5210} {"train_loss": -26.618757247924805, "global_step": 432458, "epoch": 5210} {"train_loss": -27.034687042236328, "global_step": 432459, "epoch": 5210} {"train_loss": -26.98439598083496, "global_step": 432460, "epoch": 5210} {"train_loss": -27.189279556274414, "global_step": 432461, "epoch": 5210} {"train_loss": -27.12811851501465, "global_step": 432462, "epoch": 5210} {"train_loss": -27.314847946166992, "global_step": 432463, "epoch": 5210} {"train_loss": -27.140302658081055, "global_step": 432464, "epoch": 5210} {"train_loss": -26.850873947143555, "global_step": 432465, "epoch": 5210} {"train_loss": -26.91847038269043, "global_step": 432466, "epoch": 5210} {"train_loss": -26.775714874267578, "global_step": 432467, "epoch": 5210} {"train_loss": -27.086790084838867, "global_step": 432468, "epoch": 5210} {"train_loss": -27.188098907470703, "global_step": 432469, "epoch": 5210} {"train_loss": -27.220300674438477, "global_step": 432470, "epoch": 5210} {"train_loss": -26.9444580078125, "global_step": 432471, "epoch": 5210} {"train_loss": -27.10381507873535, "global_step": 432472, "epoch": 5210} {"train_loss": -26.94846534729004, "global_step": 432473, "epoch": 5210} {"train_loss": -26.89291763305664, "global_step": 432474, "epoch": 5210} {"train_loss": -27.0611515045166, "global_step": 432475, "epoch": 5210} {"train_loss": -26.847524642944336, "global_step": 432476, "epoch": 5210} {"train_loss": -27.188674926757812, "global_step": 432477, "epoch": 5210} {"train_loss": -27.1424560546875, "global_step": 432478, "epoch": 5210} {"train_loss": -27.400466918945312, "global_step": 432479, "epoch": 5210} {"train_loss": -27.001279830932617, "global_step": 432480, "epoch": 5210} {"train_loss": -26.99053955078125, "global_step": 432481, "epoch": 5210} {"train_loss": -27.213794708251953, "global_step": 432482, "epoch": 5210} {"train_loss": -26.88108253479004, "global_step": 432483, "epoch": 5210} {"train_loss": -26.952880859375, "global_step": 432484, "epoch": 5210} {"train_loss": -26.961095809936523, "global_step": 432485, "epoch": 5210} {"train_loss": -26.85970115661621, "global_step": 432486, "epoch": 5210} {"train_loss": -27.340131759643555, "global_step": 432487, "epoch": 5210} {"train_loss": -26.646961212158203, "global_step": 432488, "epoch": 5210} {"train_loss": -26.263137817382812, "global_step": 432489, "epoch": 5210} {"train_loss": -26.487146377563477, "global_step": 432490, "epoch": 5210} {"train_loss": -26.651153564453125, "global_step": 432491, "epoch": 5210} {"train_loss": -26.82086753845215, "global_step": 432492, "epoch": 5210} {"train_loss": -26.937482833862305, "global_step": 432493, "epoch": 5210} {"train_loss": -26.90981101989746, "global_step": 432494, "epoch": 5210} {"train_loss": -26.783649444580078, "global_step": 432495, "epoch": 5210} {"train_loss": -27.032541275024414, "global_step": 432496, "epoch": 5210} {"train_loss": -27.092920303344727, "global_step": 432497, "epoch": 5210} {"train_loss": -27.021697998046875, "global_step": 432498, "epoch": 5210} {"train_loss": -26.9281063079834, "global_step": 432499, "epoch": 5210} {"train_loss": -26.96225929260254, "global_step": 432500, "epoch": 5210} {"train_loss": -27.157806396484375, "global_step": 432501, "epoch": 5210} {"train_loss": -27.180707931518555, "global_step": 432502, "epoch": 5210} {"train_loss": -27.09650230407715, "global_step": 432503, "epoch": 5210} {"train_loss": -27.31743812561035, "global_step": 432504, "epoch": 5210} {"train_loss": -26.968896865844727, "global_step": 432505, "epoch": 5210} {"train_loss": -27.172351837158203, "global_step": 432506, "epoch": 5210} {"train_loss": -27.01755714416504, "global_step": 432507, "epoch": 5210} {"train_loss": -26.84406089782715, "global_step": 432508, "epoch": 5210} {"train_loss": -26.756296157836914, "global_step": 432509, "epoch": 5210} {"train_loss": -26.916187286376953, "global_step": 432510, "epoch": 5210} {"train_loss": -27.01495361328125, "global_step": 432511, "epoch": 5210} {"train_loss": -26.820216190384095, "global_step": 432512, "epoch": 5210, "val_loss": 6959975.0} {"train_loss": -26.293928146362305, "global_step": 432513, "epoch": 5211} {"train_loss": -26.306781768798828, "global_step": 432514, "epoch": 5211} {"train_loss": -26.23115348815918, "global_step": 432515, "epoch": 5211} {"train_loss": -26.56317710876465, "global_step": 432516, "epoch": 5211} {"train_loss": -26.434476852416992, "global_step": 432517, "epoch": 5211} {"train_loss": -26.051244735717773, "global_step": 432518, "epoch": 5211} {"train_loss": -25.981794357299805, "global_step": 432519, "epoch": 5211} {"train_loss": -26.54023551940918, "global_step": 432520, "epoch": 5211} {"train_loss": -26.368234634399414, "global_step": 432521, "epoch": 5211} {"train_loss": -26.549970626831055, "global_step": 432522, "epoch": 5211} {"train_loss": -26.8104248046875, "global_step": 432523, "epoch": 5211} {"train_loss": -26.875106811523438, "global_step": 432524, "epoch": 5211} {"train_loss": -26.573938369750977, "global_step": 432525, "epoch": 5211} {"train_loss": -26.54736328125, "global_step": 432526, "epoch": 5211} {"train_loss": -26.83204460144043, "global_step": 432527, "epoch": 5211} {"train_loss": -27.071786880493164, "global_step": 432528, "epoch": 5211} {"train_loss": -26.65363883972168, "global_step": 432529, "epoch": 5211} {"train_loss": -26.46516227722168, "global_step": 432530, "epoch": 5211} {"train_loss": -26.427392959594727, "global_step": 432531, "epoch": 5211} {"train_loss": -26.935728073120117, "global_step": 432532, "epoch": 5211} {"train_loss": -26.568418502807617, "global_step": 432533, "epoch": 5211} {"train_loss": -26.52937889099121, "global_step": 432534, "epoch": 5211} {"train_loss": -26.741119384765625, "global_step": 432535, "epoch": 5211} {"train_loss": -27.129148483276367, "global_step": 432536, "epoch": 5211} {"train_loss": -26.590330123901367, "global_step": 432537, "epoch": 5211} {"train_loss": -26.8050594329834, "global_step": 432538, "epoch": 5211} {"train_loss": -26.848098754882812, "global_step": 432539, "epoch": 5211} {"train_loss": -26.809457778930664, "global_step": 432540, "epoch": 5211} {"train_loss": -26.461729049682617, "global_step": 432541, "epoch": 5211} {"train_loss": -26.948129653930664, "global_step": 432542, "epoch": 5211} {"train_loss": -26.589767456054688, "global_step": 432543, "epoch": 5211} {"train_loss": -26.715620040893555, "global_step": 432544, "epoch": 5211} {"train_loss": -27.00335121154785, "global_step": 432545, "epoch": 5211} {"train_loss": -26.855762481689453, "global_step": 432546, "epoch": 5211} {"train_loss": -27.033674240112305, "global_step": 432547, "epoch": 5211} {"train_loss": -26.79190444946289, "global_step": 432548, "epoch": 5211} {"train_loss": -27.049528121948242, "global_step": 432549, "epoch": 5211} {"train_loss": -26.9764347076416, "global_step": 432550, "epoch": 5211} {"train_loss": -26.967248916625977, "global_step": 432551, "epoch": 5211} {"train_loss": -27.070404052734375, "global_step": 432552, "epoch": 5211} {"train_loss": -26.98598289489746, "global_step": 432553, "epoch": 5211} {"train_loss": -26.92555046081543, "global_step": 432554, "epoch": 5211} {"train_loss": -27.08493995666504, "global_step": 432555, "epoch": 5211} {"train_loss": -27.34649658203125, "global_step": 432556, "epoch": 5211} {"train_loss": -27.022308349609375, "global_step": 432557, "epoch": 5211} {"train_loss": -27.22052001953125, "global_step": 432558, "epoch": 5211} {"train_loss": -26.970260620117188, "global_step": 432559, "epoch": 5211} {"train_loss": -26.875158309936523, "global_step": 432560, "epoch": 5211} {"train_loss": -26.955402374267578, "global_step": 432561, "epoch": 5211} {"train_loss": -27.078617095947266, "global_step": 432562, "epoch": 5211} {"train_loss": -27.37733268737793, "global_step": 432563, "epoch": 5211} {"train_loss": -27.09760093688965, "global_step": 432564, "epoch": 5211} {"train_loss": -26.87605094909668, "global_step": 432565, "epoch": 5211} {"train_loss": -26.86685562133789, "global_step": 432566, "epoch": 5211} {"train_loss": -26.88899040222168, "global_step": 432567, "epoch": 5211} {"train_loss": -27.2099609375, "global_step": 432568, "epoch": 5211} {"train_loss": -27.340063095092773, "global_step": 432569, "epoch": 5211} {"train_loss": -26.801389694213867, "global_step": 432570, "epoch": 5211} {"train_loss": -26.836423873901367, "global_step": 432571, "epoch": 5211} {"train_loss": -27.1541748046875, "global_step": 432572, "epoch": 5211} {"train_loss": -27.027740478515625, "global_step": 432573, "epoch": 5211} {"train_loss": -26.688983917236328, "global_step": 432574, "epoch": 5211} {"train_loss": -26.470556259155273, "global_step": 432575, "epoch": 5211} {"train_loss": -26.7454891204834, "global_step": 432576, "epoch": 5211} {"train_loss": -26.574766159057617, "global_step": 432577, "epoch": 5211} {"train_loss": -26.87183952331543, "global_step": 432578, "epoch": 5211} {"train_loss": -27.0831356048584, "global_step": 432579, "epoch": 5211} {"train_loss": -26.313817977905273, "global_step": 432580, "epoch": 5211} {"train_loss": -26.7696475982666, "global_step": 432581, "epoch": 5211} {"train_loss": -26.879240036010742, "global_step": 432582, "epoch": 5211} {"train_loss": -26.342252731323242, "global_step": 432583, "epoch": 5211} {"train_loss": -26.720895767211914, "global_step": 432584, "epoch": 5211} {"train_loss": -26.412092208862305, "global_step": 432585, "epoch": 5211} {"train_loss": -26.06647300720215, "global_step": 432586, "epoch": 5211} {"train_loss": -27.001800537109375, "global_step": 432587, "epoch": 5211} {"train_loss": -26.689228057861328, "global_step": 432588, "epoch": 5211} {"train_loss": -26.226049423217773, "global_step": 432589, "epoch": 5211} {"train_loss": -26.688873291015625, "global_step": 432590, "epoch": 5211} {"train_loss": -26.833242416381836, "global_step": 432591, "epoch": 5211} {"train_loss": -26.64945411682129, "global_step": 432592, "epoch": 5211} {"train_loss": -26.576719284057617, "global_step": 432593, "epoch": 5211} {"train_loss": -26.71478271484375, "global_step": 432594, "epoch": 5211} {"train_loss": -26.765791100191784, "global_step": 432595, "epoch": 5211, "val_loss": 6856671.5} {"train_loss": -26.751501083374023, "global_step": 432596, "epoch": 5212} {"train_loss": -26.369373321533203, "global_step": 432597, "epoch": 5212} {"train_loss": -26.49019432067871, "global_step": 432598, "epoch": 5212} {"train_loss": -26.855627059936523, "global_step": 432599, "epoch": 5212} {"train_loss": -26.631900787353516, "global_step": 432600, "epoch": 5212} {"train_loss": -26.640151977539062, "global_step": 432601, "epoch": 5212} {"train_loss": -26.379968643188477, "global_step": 432602, "epoch": 5212} {"train_loss": -26.844379425048828, "global_step": 432603, "epoch": 5212} {"train_loss": -26.469228744506836, "global_step": 432604, "epoch": 5212} {"train_loss": -26.630767822265625, "global_step": 432605, "epoch": 5212} {"train_loss": -26.621219635009766, "global_step": 432606, "epoch": 5212} {"train_loss": -26.763166427612305, "global_step": 432607, "epoch": 5212} {"train_loss": -26.6142578125, "global_step": 432608, "epoch": 5212} {"train_loss": -26.58037757873535, "global_step": 432609, "epoch": 5212} {"train_loss": -26.867822647094727, "global_step": 432610, "epoch": 5212} {"train_loss": -26.876401901245117, "global_step": 432611, "epoch": 5212} {"train_loss": -26.8782958984375, "global_step": 432612, "epoch": 5212} {"train_loss": -26.62055015563965, "global_step": 432613, "epoch": 5212} {"train_loss": -27.122547149658203, "global_step": 432614, "epoch": 5212} {"train_loss": -27.071441650390625, "global_step": 432615, "epoch": 5212} {"train_loss": -26.815277099609375, "global_step": 432616, "epoch": 5212} {"train_loss": -26.880529403686523, "global_step": 432617, "epoch": 5212} {"train_loss": -26.98023796081543, "global_step": 432618, "epoch": 5212} {"train_loss": -26.754545211791992, "global_step": 432619, "epoch": 5212} {"train_loss": -26.743505477905273, "global_step": 432620, "epoch": 5212} {"train_loss": -26.64212417602539, "global_step": 432621, "epoch": 5212} {"train_loss": -26.91912841796875, "global_step": 432622, "epoch": 5212} {"train_loss": -26.8369083404541, "global_step": 432623, "epoch": 5212} {"train_loss": -27.14491081237793, "global_step": 432624, "epoch": 5212} {"train_loss": -26.829833984375, "global_step": 432625, "epoch": 5212} {"train_loss": -26.73201560974121, "global_step": 432626, "epoch": 5212} {"train_loss": -26.562101364135742, "global_step": 432627, "epoch": 5212} {"train_loss": -26.806610107421875, "global_step": 432628, "epoch": 5212} {"train_loss": -27.307941436767578, "global_step": 432629, "epoch": 5212} {"train_loss": -26.782384872436523, "global_step": 432630, "epoch": 5212} {"train_loss": -26.86151123046875, "global_step": 432631, "epoch": 5212} {"train_loss": -27.031478881835938, "global_step": 432632, "epoch": 5212} {"train_loss": -27.08684730529785, "global_step": 432633, "epoch": 5212} {"train_loss": -27.03822135925293, "global_step": 432634, "epoch": 5212} {"train_loss": -26.811487197875977, "global_step": 432635, "epoch": 5212} {"train_loss": -27.06690788269043, "global_step": 432636, "epoch": 5212} {"train_loss": -26.66715431213379, "global_step": 432637, "epoch": 5212} {"train_loss": -27.2646427154541, "global_step": 432638, "epoch": 5212} {"train_loss": -27.142078399658203, "global_step": 432639, "epoch": 5212} {"train_loss": -27.002029418945312, "global_step": 432640, "epoch": 5212} {"train_loss": -26.83169937133789, "global_step": 432641, "epoch": 5212} {"train_loss": -26.925458908081055, "global_step": 432642, "epoch": 5212} {"train_loss": -27.162464141845703, "global_step": 432643, "epoch": 5212} {"train_loss": -27.030338287353516, "global_step": 432644, "epoch": 5212} {"train_loss": -27.1075496673584, "global_step": 432645, "epoch": 5212} {"train_loss": -26.802282333374023, "global_step": 432646, "epoch": 5212} {"train_loss": -27.019184112548828, "global_step": 432647, "epoch": 5212} {"train_loss": -27.15732192993164, "global_step": 432648, "epoch": 5212} {"train_loss": -27.12336540222168, "global_step": 432649, "epoch": 5212} {"train_loss": -26.9314022064209, "global_step": 432650, "epoch": 5212} {"train_loss": -27.192230224609375, "global_step": 432651, "epoch": 5212} {"train_loss": -26.74017906188965, "global_step": 432652, "epoch": 5212} {"train_loss": -26.984817504882812, "global_step": 432653, "epoch": 5212} {"train_loss": -26.69013023376465, "global_step": 432654, "epoch": 5212} {"train_loss": -26.855005264282227, "global_step": 432655, "epoch": 5212} {"train_loss": -26.35418701171875, "global_step": 432656, "epoch": 5212} {"train_loss": -26.763153076171875, "global_step": 432657, "epoch": 5212} {"train_loss": -26.403675079345703, "global_step": 432658, "epoch": 5212} {"train_loss": -26.817630767822266, "global_step": 432659, "epoch": 5212} {"train_loss": -27.043930053710938, "global_step": 432660, "epoch": 5212} {"train_loss": -26.80681800842285, "global_step": 432661, "epoch": 5212} {"train_loss": -27.098114013671875, "global_step": 432662, "epoch": 5212} {"train_loss": -26.825063705444336, "global_step": 432663, "epoch": 5212} {"train_loss": -26.745651245117188, "global_step": 432664, "epoch": 5212} {"train_loss": -26.901657104492188, "global_step": 432665, "epoch": 5212} {"train_loss": -27.461374282836914, "global_step": 432666, "epoch": 5212} {"train_loss": -26.703622817993164, "global_step": 432667, "epoch": 5212} {"train_loss": -26.886310577392578, "global_step": 432668, "epoch": 5212} {"train_loss": -27.05122184753418, "global_step": 432669, "epoch": 5212} {"train_loss": -26.723981857299805, "global_step": 432670, "epoch": 5212} {"train_loss": -26.956897735595703, "global_step": 432671, "epoch": 5212} {"train_loss": -27.040088653564453, "global_step": 432672, "epoch": 5212} {"train_loss": -26.646656036376953, "global_step": 432673, "epoch": 5212} {"train_loss": -27.28376579284668, "global_step": 432674, "epoch": 5212} {"train_loss": -26.868337631225586, "global_step": 432675, "epoch": 5212} {"train_loss": -26.961322784423828, "global_step": 432676, "epoch": 5212} {"train_loss": -26.92193031311035, "global_step": 432677, "epoch": 5212} {"train_loss": -26.8499308896352, "global_step": 432678, "epoch": 5212, "val_loss": 6873810.0} {"train_loss": -23.6295223236084, "global_step": 432679, "epoch": 5213} {"train_loss": -22.902795791625977, "global_step": 432680, "epoch": 5213} {"train_loss": -26.5526180267334, "global_step": 432681, "epoch": 5213} {"train_loss": -24.189855575561523, "global_step": 432682, "epoch": 5213} {"train_loss": -26.27674674987793, "global_step": 432683, "epoch": 5213} {"train_loss": -24.25562858581543, "global_step": 432684, "epoch": 5213} {"train_loss": -25.683984756469727, "global_step": 432685, "epoch": 5213} {"train_loss": -25.543699264526367, "global_step": 432686, "epoch": 5213} {"train_loss": -25.504947662353516, "global_step": 432687, "epoch": 5213} {"train_loss": -26.352481842041016, "global_step": 432688, "epoch": 5213} {"train_loss": -26.038745880126953, "global_step": 432689, "epoch": 5213} {"train_loss": -25.784032821655273, "global_step": 432690, "epoch": 5213} {"train_loss": -26.297077178955078, "global_step": 432691, "epoch": 5213} {"train_loss": -26.340335845947266, "global_step": 432692, "epoch": 5213} {"train_loss": -26.412338256835938, "global_step": 432693, "epoch": 5213} {"train_loss": -26.181726455688477, "global_step": 432694, "epoch": 5213} {"train_loss": -25.941381454467773, "global_step": 432695, "epoch": 5213} {"train_loss": -26.036376953125, "global_step": 432696, "epoch": 5213} {"train_loss": -26.48919105529785, "global_step": 432697, "epoch": 5213} {"train_loss": -26.548917770385742, "global_step": 432698, "epoch": 5213} {"train_loss": -26.18690299987793, "global_step": 432699, "epoch": 5213} {"train_loss": -26.492578506469727, "global_step": 432700, "epoch": 5213} {"train_loss": -26.43509864807129, "global_step": 432701, "epoch": 5213} {"train_loss": -26.18532371520996, "global_step": 432702, "epoch": 5213} {"train_loss": -26.681909561157227, "global_step": 432703, "epoch": 5213} {"train_loss": -26.732772827148438, "global_step": 432704, "epoch": 5213} {"train_loss": -26.61504554748535, "global_step": 432705, "epoch": 5213} {"train_loss": -26.134740829467773, "global_step": 432706, "epoch": 5213} {"train_loss": -26.33199119567871, "global_step": 432707, "epoch": 5213} {"train_loss": -26.63980484008789, "global_step": 432708, "epoch": 5213} {"train_loss": -26.2114315032959, "global_step": 432709, "epoch": 5213} {"train_loss": -26.535802841186523, "global_step": 432710, "epoch": 5213} {"train_loss": -26.182849884033203, "global_step": 432711, "epoch": 5213} {"train_loss": -26.84364891052246, "global_step": 432712, "epoch": 5213} {"train_loss": -26.51389503479004, "global_step": 432713, "epoch": 5213} {"train_loss": -26.395511627197266, "global_step": 432714, "epoch": 5213} {"train_loss": -26.774261474609375, "global_step": 432715, "epoch": 5213} {"train_loss": -26.33570671081543, "global_step": 432716, "epoch": 5213} {"train_loss": -26.719762802124023, "global_step": 432717, "epoch": 5213} {"train_loss": -26.644824981689453, "global_step": 432718, "epoch": 5213} {"train_loss": -26.752735137939453, "global_step": 432719, "epoch": 5213} {"train_loss": -26.687192916870117, "global_step": 432720, "epoch": 5213} {"train_loss": -26.594959259033203, "global_step": 432721, "epoch": 5213} {"train_loss": -26.858320236206055, "global_step": 432722, "epoch": 5213} {"train_loss": -26.66849136352539, "global_step": 432723, "epoch": 5213} {"train_loss": -26.98308753967285, "global_step": 432724, "epoch": 5213} {"train_loss": -26.532873153686523, "global_step": 432725, "epoch": 5213} {"train_loss": -26.557600021362305, "global_step": 432726, "epoch": 5213} {"train_loss": -26.912900924682617, "global_step": 432727, "epoch": 5213} {"train_loss": -27.16183853149414, "global_step": 432728, "epoch": 5213} {"train_loss": -26.592084884643555, "global_step": 432729, "epoch": 5213} {"train_loss": -26.92657470703125, "global_step": 432730, "epoch": 5213} {"train_loss": -26.6103572845459, "global_step": 432731, "epoch": 5213} {"train_loss": -26.460241317749023, "global_step": 432732, "epoch": 5213} {"train_loss": -26.6524600982666, "global_step": 432733, "epoch": 5213} {"train_loss": -26.28619384765625, "global_step": 432734, "epoch": 5213} {"train_loss": -26.73260498046875, "global_step": 432735, "epoch": 5213} {"train_loss": -26.9182186126709, "global_step": 432736, "epoch": 5213} {"train_loss": -27.114789962768555, "global_step": 432737, "epoch": 5213} {"train_loss": -26.7589054107666, "global_step": 432738, "epoch": 5213} {"train_loss": -27.184133529663086, "global_step": 432739, "epoch": 5213} {"train_loss": -26.972274780273438, "global_step": 432740, "epoch": 5213} {"train_loss": -26.7722110748291, "global_step": 432741, "epoch": 5213} {"train_loss": -27.227558135986328, "global_step": 432742, "epoch": 5213} {"train_loss": -27.282644271850586, "global_step": 432743, "epoch": 5213} {"train_loss": -26.755125045776367, "global_step": 432744, "epoch": 5213} {"train_loss": -26.663135528564453, "global_step": 432745, "epoch": 5213} {"train_loss": -27.177841186523438, "global_step": 432746, "epoch": 5213} {"train_loss": -26.766223907470703, "global_step": 432747, "epoch": 5213} {"train_loss": -26.823205947875977, "global_step": 432748, "epoch": 5213} {"train_loss": -27.07111167907715, "global_step": 432749, "epoch": 5213} {"train_loss": -27.018884658813477, "global_step": 432750, "epoch": 5213} {"train_loss": -26.828754425048828, "global_step": 432751, "epoch": 5213} {"train_loss": -26.703519821166992, "global_step": 432752, "epoch": 5213} {"train_loss": -26.733158111572266, "global_step": 432753, "epoch": 5213} {"train_loss": -27.046247482299805, "global_step": 432754, "epoch": 5213} {"train_loss": -26.905426025390625, "global_step": 432755, "epoch": 5213} {"train_loss": -26.80396842956543, "global_step": 432756, "epoch": 5213} {"train_loss": -27.20100212097168, "global_step": 432757, "epoch": 5213} {"train_loss": -26.40753746032715, "global_step": 432758, "epoch": 5213} {"train_loss": -26.836782455444336, "global_step": 432759, "epoch": 5213} {"train_loss": -26.74603271484375, "global_step": 432760, "epoch": 5213} {"train_loss": -26.461663763207124, "global_step": 432761, "epoch": 5213, "val_loss": 6762984.0} {"train_loss": -26.63665199279785, "global_step": 432762, "epoch": 5214} {"train_loss": -26.46575927734375, "global_step": 432763, "epoch": 5214} {"train_loss": -26.207965850830078, "global_step": 432764, "epoch": 5214} {"train_loss": -26.594202041625977, "global_step": 432765, "epoch": 5214} {"train_loss": -26.77370262145996, "global_step": 432766, "epoch": 5214} {"train_loss": -26.94561767578125, "global_step": 432767, "epoch": 5214} {"train_loss": -26.404754638671875, "global_step": 432768, "epoch": 5214} {"train_loss": -26.599103927612305, "global_step": 432769, "epoch": 5214} {"train_loss": -26.533191680908203, "global_step": 432770, "epoch": 5214} {"train_loss": -26.632205963134766, "global_step": 432771, "epoch": 5214} {"train_loss": -26.65565299987793, "global_step": 432772, "epoch": 5214} {"train_loss": -26.770584106445312, "global_step": 432773, "epoch": 5214} {"train_loss": -26.51129722595215, "global_step": 432774, "epoch": 5214} {"train_loss": -26.5355167388916, "global_step": 432775, "epoch": 5214} {"train_loss": -26.7708740234375, "global_step": 432776, "epoch": 5214} {"train_loss": -27.030065536499023, "global_step": 432777, "epoch": 5214} {"train_loss": -26.840728759765625, "global_step": 432778, "epoch": 5214} {"train_loss": -26.67367935180664, "global_step": 432779, "epoch": 5214} {"train_loss": -27.32813835144043, "global_step": 432780, "epoch": 5214} {"train_loss": -26.7769775390625, "global_step": 432781, "epoch": 5214} {"train_loss": -26.51685905456543, "global_step": 432782, "epoch": 5214} {"train_loss": -26.899097442626953, "global_step": 432783, "epoch": 5214} {"train_loss": -26.92214012145996, "global_step": 432784, "epoch": 5214} {"train_loss": -26.70452308654785, "global_step": 432785, "epoch": 5214} {"train_loss": -26.8929443359375, "global_step": 432786, "epoch": 5214} {"train_loss": -27.01886558532715, "global_step": 432787, "epoch": 5214} {"train_loss": -27.033628463745117, "global_step": 432788, "epoch": 5214} {"train_loss": -27.194501876831055, "global_step": 432789, "epoch": 5214} {"train_loss": -26.906530380249023, "global_step": 432790, "epoch": 5214} {"train_loss": -26.885833740234375, "global_step": 432791, "epoch": 5214} {"train_loss": -26.980880737304688, "global_step": 432792, "epoch": 5214} {"train_loss": -27.228219985961914, "global_step": 432793, "epoch": 5214} {"train_loss": -26.677417755126953, "global_step": 432794, "epoch": 5214} {"train_loss": -26.85682487487793, "global_step": 432795, "epoch": 5214} {"train_loss": -27.109418869018555, "global_step": 432796, "epoch": 5214} {"train_loss": -27.213245391845703, "global_step": 432797, "epoch": 5214} {"train_loss": -26.91048240661621, "global_step": 432798, "epoch": 5214} {"train_loss": -26.67982292175293, "global_step": 432799, "epoch": 5214} {"train_loss": -27.033029556274414, "global_step": 432800, "epoch": 5214} {"train_loss": -27.009130477905273, "global_step": 432801, "epoch": 5214} {"train_loss": -27.08941078186035, "global_step": 432802, "epoch": 5214} {"train_loss": -26.88945960998535, "global_step": 432803, "epoch": 5214} {"train_loss": -27.121627807617188, "global_step": 432804, "epoch": 5214} {"train_loss": -27.086511611938477, "global_step": 432805, "epoch": 5214} {"train_loss": -26.91765785217285, "global_step": 432806, "epoch": 5214} {"train_loss": -26.975482940673828, "global_step": 432807, "epoch": 5214} {"train_loss": -27.124906539916992, "global_step": 432808, "epoch": 5214} {"train_loss": -26.92022705078125, "global_step": 432809, "epoch": 5214} {"train_loss": -27.34452247619629, "global_step": 432810, "epoch": 5214} {"train_loss": -26.993581771850586, "global_step": 432811, "epoch": 5214} {"train_loss": -26.85041618347168, "global_step": 432812, "epoch": 5214} {"train_loss": -27.280298233032227, "global_step": 432813, "epoch": 5214} {"train_loss": -27.0186824798584, "global_step": 432814, "epoch": 5214} {"train_loss": -26.918027877807617, "global_step": 432815, "epoch": 5214} {"train_loss": -27.17225456237793, "global_step": 432816, "epoch": 5214} {"train_loss": -26.679656982421875, "global_step": 432817, "epoch": 5214} {"train_loss": -26.99256706237793, "global_step": 432818, "epoch": 5214} {"train_loss": -27.206348419189453, "global_step": 432819, "epoch": 5214} {"train_loss": -27.173734664916992, "global_step": 432820, "epoch": 5214} {"train_loss": -26.9543399810791, "global_step": 432821, "epoch": 5214} {"train_loss": -27.0721378326416, "global_step": 432822, "epoch": 5214} {"train_loss": -27.10699462890625, "global_step": 432823, "epoch": 5214} {"train_loss": -27.131351470947266, "global_step": 432824, "epoch": 5214} {"train_loss": -26.809961318969727, "global_step": 432825, "epoch": 5214} {"train_loss": -26.648855209350586, "global_step": 432826, "epoch": 5214} {"train_loss": -27.04986572265625, "global_step": 432827, "epoch": 5214} {"train_loss": -27.07293701171875, "global_step": 432828, "epoch": 5214} {"train_loss": -26.513336181640625, "global_step": 432829, "epoch": 5214} {"train_loss": -26.88067626953125, "global_step": 432830, "epoch": 5214} {"train_loss": -27.263463973999023, "global_step": 432831, "epoch": 5214} {"train_loss": -26.911874771118164, "global_step": 432832, "epoch": 5214} {"train_loss": -27.173568725585938, "global_step": 432833, "epoch": 5214} {"train_loss": -26.915231704711914, "global_step": 432834, "epoch": 5214} {"train_loss": -26.9383602142334, "global_step": 432835, "epoch": 5214} {"train_loss": -26.91786003112793, "global_step": 432836, "epoch": 5214} {"train_loss": -27.049823760986328, "global_step": 432837, "epoch": 5214} {"train_loss": -26.850988388061523, "global_step": 432838, "epoch": 5214} {"train_loss": -26.9036922454834, "global_step": 432839, "epoch": 5214} {"train_loss": -27.109333038330078, "global_step": 432840, "epoch": 5214} {"train_loss": -27.0190486907959, "global_step": 432841, "epoch": 5214} {"train_loss": -26.806798934936523, "global_step": 432842, "epoch": 5214} {"train_loss": -26.45002555847168, "global_step": 432843, "epoch": 5214} {"train_loss": -26.89496141456696, "global_step": 432844, "epoch": 5214, "val_loss": 6707215.0} {"train_loss": -24.490243911743164, "global_step": 432845, "epoch": 5215} {"train_loss": -22.944387435913086, "global_step": 432846, "epoch": 5215} {"train_loss": -21.624197006225586, "global_step": 432847, "epoch": 5215} {"train_loss": -24.721553802490234, "global_step": 432848, "epoch": 5215} {"train_loss": -25.573823928833008, "global_step": 432849, "epoch": 5215} {"train_loss": -24.61725425720215, "global_step": 432850, "epoch": 5215} {"train_loss": -25.207176208496094, "global_step": 432851, "epoch": 5215} {"train_loss": -24.929386138916016, "global_step": 432852, "epoch": 5215} {"train_loss": -25.020601272583008, "global_step": 432853, "epoch": 5215} {"train_loss": -25.235322952270508, "global_step": 432854, "epoch": 5215} {"train_loss": -25.835798263549805, "global_step": 432855, "epoch": 5215} {"train_loss": -24.90106964111328, "global_step": 432856, "epoch": 5215} {"train_loss": -25.073993682861328, "global_step": 432857, "epoch": 5215} {"train_loss": -25.402069091796875, "global_step": 432858, "epoch": 5215} {"train_loss": -26.050811767578125, "global_step": 432859, "epoch": 5215} {"train_loss": -25.45769691467285, "global_step": 432860, "epoch": 5215} {"train_loss": -25.82049560546875, "global_step": 432861, "epoch": 5215} {"train_loss": -25.688257217407227, "global_step": 432862, "epoch": 5215} {"train_loss": -25.439950942993164, "global_step": 432863, "epoch": 5215} {"train_loss": -25.992935180664062, "global_step": 432864, "epoch": 5215} {"train_loss": -25.845361709594727, "global_step": 432865, "epoch": 5215} {"train_loss": -25.98677635192871, "global_step": 432866, "epoch": 5215} {"train_loss": -25.83428382873535, "global_step": 432867, "epoch": 5215} {"train_loss": -25.839460372924805, "global_step": 432868, "epoch": 5215} {"train_loss": -25.8995304107666, "global_step": 432869, "epoch": 5215} {"train_loss": -26.340961456298828, "global_step": 432870, "epoch": 5215} {"train_loss": -26.30938720703125, "global_step": 432871, "epoch": 5215} {"train_loss": -25.90114402770996, "global_step": 432872, "epoch": 5215} {"train_loss": -26.293792724609375, "global_step": 432873, "epoch": 5215} {"train_loss": -26.385114669799805, "global_step": 432874, "epoch": 5215} {"train_loss": -26.2972412109375, "global_step": 432875, "epoch": 5215} {"train_loss": -26.245573043823242, "global_step": 432876, "epoch": 5215} {"train_loss": -26.506885528564453, "global_step": 432877, "epoch": 5215} {"train_loss": -26.72284507751465, "global_step": 432878, "epoch": 5215} {"train_loss": -26.508691787719727, "global_step": 432879, "epoch": 5215} {"train_loss": -26.29962730407715, "global_step": 432880, "epoch": 5215} {"train_loss": -26.480701446533203, "global_step": 432881, "epoch": 5215} {"train_loss": -26.59979820251465, "global_step": 432882, "epoch": 5215} {"train_loss": -26.789167404174805, "global_step": 432883, "epoch": 5215} {"train_loss": -26.734912872314453, "global_step": 432884, "epoch": 5215} {"train_loss": -26.64960289001465, "global_step": 432885, "epoch": 5215} {"train_loss": -26.904088973999023, "global_step": 432886, "epoch": 5215} {"train_loss": -26.70526123046875, "global_step": 432887, "epoch": 5215} {"train_loss": -26.57135009765625, "global_step": 432888, "epoch": 5215} {"train_loss": -27.055484771728516, "global_step": 432889, "epoch": 5215} {"train_loss": -26.868738174438477, "global_step": 432890, "epoch": 5215} {"train_loss": -26.257776260375977, "global_step": 432891, "epoch": 5215} {"train_loss": -26.968143463134766, "global_step": 432892, "epoch": 5215} {"train_loss": -26.588315963745117, "global_step": 432893, "epoch": 5215} {"train_loss": -26.6739501953125, "global_step": 432894, "epoch": 5215} {"train_loss": -27.00995445251465, "global_step": 432895, "epoch": 5215} {"train_loss": -26.527633666992188, "global_step": 432896, "epoch": 5215} {"train_loss": -26.83782958984375, "global_step": 432897, "epoch": 5215} {"train_loss": -26.906686782836914, "global_step": 432898, "epoch": 5215} {"train_loss": -27.055036544799805, "global_step": 432899, "epoch": 5215} {"train_loss": -26.780994415283203, "global_step": 432900, "epoch": 5215} {"train_loss": -26.988433837890625, "global_step": 432901, "epoch": 5215} {"train_loss": -26.70831298828125, "global_step": 432902, "epoch": 5215} {"train_loss": -26.510486602783203, "global_step": 432903, "epoch": 5215} {"train_loss": -27.036218643188477, "global_step": 432904, "epoch": 5215} {"train_loss": -26.82222557067871, "global_step": 432905, "epoch": 5215} {"train_loss": -27.043241500854492, "global_step": 432906, "epoch": 5215} {"train_loss": -26.59974479675293, "global_step": 432907, "epoch": 5215} {"train_loss": -26.63899803161621, "global_step": 432908, "epoch": 5215} {"train_loss": -26.989240646362305, "global_step": 432909, "epoch": 5215} {"train_loss": -26.993810653686523, "global_step": 432910, "epoch": 5215} {"train_loss": -27.02955436706543, "global_step": 432911, "epoch": 5215} {"train_loss": -26.813098907470703, "global_step": 432912, "epoch": 5215} {"train_loss": -26.85043716430664, "global_step": 432913, "epoch": 5215} {"train_loss": -26.698877334594727, "global_step": 432914, "epoch": 5215} {"train_loss": -26.893756866455078, "global_step": 432915, "epoch": 5215} {"train_loss": -26.779447555541992, "global_step": 432916, "epoch": 5215} {"train_loss": -27.083847045898438, "global_step": 432917, "epoch": 5215} {"train_loss": -27.0684757232666, "global_step": 432918, "epoch": 5215} {"train_loss": -27.156982421875, "global_step": 432919, "epoch": 5215} {"train_loss": -26.84211540222168, "global_step": 432920, "epoch": 5215} {"train_loss": -27.035888671875, "global_step": 432921, "epoch": 5215} {"train_loss": -27.44287109375, "global_step": 432922, "epoch": 5215} {"train_loss": -27.105878829956055, "global_step": 432923, "epoch": 5215} {"train_loss": -27.073169708251953, "global_step": 432924, "epoch": 5215} {"train_loss": -27.02081871032715, "global_step": 432925, "epoch": 5215} {"train_loss": -27.1741943359375, "global_step": 432926, "epoch": 5215} {"train_loss": -26.276316217629308, "global_step": 432927, "epoch": 5215, "val_loss": 6804938.5} {"train_loss": -27.0340576171875, "global_step": 432928, "epoch": 5216} {"train_loss": -26.904495239257812, "global_step": 432929, "epoch": 5216} {"train_loss": -26.88692283630371, "global_step": 432930, "epoch": 5216} {"train_loss": -26.782123565673828, "global_step": 432931, "epoch": 5216} {"train_loss": -26.82880210876465, "global_step": 432932, "epoch": 5216} {"train_loss": -26.911115646362305, "global_step": 432933, "epoch": 5216} {"train_loss": -26.887012481689453, "global_step": 432934, "epoch": 5216} {"train_loss": -26.627338409423828, "global_step": 432935, "epoch": 5216} {"train_loss": -26.84689712524414, "global_step": 432936, "epoch": 5216} {"train_loss": -26.763364791870117, "global_step": 432937, "epoch": 5216} {"train_loss": -26.838281631469727, "global_step": 432938, "epoch": 5216} {"train_loss": -27.086496353149414, "global_step": 432939, "epoch": 5216} {"train_loss": -26.883316040039062, "global_step": 432940, "epoch": 5216} {"train_loss": -27.142684936523438, "global_step": 432941, "epoch": 5216} {"train_loss": -26.57183837890625, "global_step": 432942, "epoch": 5216} {"train_loss": -27.320348739624023, "global_step": 432943, "epoch": 5216} {"train_loss": -27.021533966064453, "global_step": 432944, "epoch": 5216} {"train_loss": -26.950281143188477, "global_step": 432945, "epoch": 5216} {"train_loss": -26.97458267211914, "global_step": 432946, "epoch": 5216} {"train_loss": -26.488662719726562, "global_step": 432947, "epoch": 5216} {"train_loss": -26.762680053710938, "global_step": 432948, "epoch": 5216} {"train_loss": -27.0988712310791, "global_step": 432949, "epoch": 5216} {"train_loss": -26.9160099029541, "global_step": 432950, "epoch": 5216} {"train_loss": -27.198286056518555, "global_step": 432951, "epoch": 5216} {"train_loss": -26.747211456298828, "global_step": 432952, "epoch": 5216} {"train_loss": -26.736608505249023, "global_step": 432953, "epoch": 5216} {"train_loss": -26.93206787109375, "global_step": 432954, "epoch": 5216} {"train_loss": -26.408390045166016, "global_step": 432955, "epoch": 5216} {"train_loss": -27.20966911315918, "global_step": 432956, "epoch": 5216} {"train_loss": -26.86652183532715, "global_step": 432957, "epoch": 5216} {"train_loss": -26.615644454956055, "global_step": 432958, "epoch": 5216} {"train_loss": -26.357818603515625, "global_step": 432959, "epoch": 5216} {"train_loss": -26.769445419311523, "global_step": 432960, "epoch": 5216} {"train_loss": -26.608123779296875, "global_step": 432961, "epoch": 5216} {"train_loss": -26.902326583862305, "global_step": 432962, "epoch": 5216} {"train_loss": -26.396169662475586, "global_step": 432963, "epoch": 5216} {"train_loss": -26.486536026000977, "global_step": 432964, "epoch": 5216} {"train_loss": -26.6375732421875, "global_step": 432965, "epoch": 5216} {"train_loss": -27.04242515563965, "global_step": 432966, "epoch": 5216} {"train_loss": -26.8725528717041, "global_step": 432967, "epoch": 5216} {"train_loss": -26.56232261657715, "global_step": 432968, "epoch": 5216} {"train_loss": -26.849523544311523, "global_step": 432969, "epoch": 5216} {"train_loss": -26.260107040405273, "global_step": 432970, "epoch": 5216} {"train_loss": -26.82618522644043, "global_step": 432971, "epoch": 5216} {"train_loss": -26.590768814086914, "global_step": 432972, "epoch": 5216} {"train_loss": -27.295026779174805, "global_step": 432973, "epoch": 5216} {"train_loss": -26.78106689453125, "global_step": 432974, "epoch": 5216} {"train_loss": -26.896137237548828, "global_step": 432975, "epoch": 5216} {"train_loss": -26.91975212097168, "global_step": 432976, "epoch": 5216} {"train_loss": -26.895801544189453, "global_step": 432977, "epoch": 5216} {"train_loss": -26.754602432250977, "global_step": 432978, "epoch": 5216} {"train_loss": -26.75737953186035, "global_step": 432979, "epoch": 5216} {"train_loss": -27.22607421875, "global_step": 432980, "epoch": 5216} {"train_loss": -26.8211669921875, "global_step": 432981, "epoch": 5216} {"train_loss": -27.02532386779785, "global_step": 432982, "epoch": 5216} {"train_loss": -27.069616317749023, "global_step": 432983, "epoch": 5216} {"train_loss": -27.077533721923828, "global_step": 432984, "epoch": 5216} {"train_loss": -27.184476852416992, "global_step": 432985, "epoch": 5216} {"train_loss": -27.067819595336914, "global_step": 432986, "epoch": 5216} {"train_loss": -26.958271026611328, "global_step": 432987, "epoch": 5216} {"train_loss": -27.151731491088867, "global_step": 432988, "epoch": 5216} {"train_loss": -27.339420318603516, "global_step": 432989, "epoch": 5216} {"train_loss": -27.327585220336914, "global_step": 432990, "epoch": 5216} {"train_loss": -27.088281631469727, "global_step": 432991, "epoch": 5216} {"train_loss": -27.199472427368164, "global_step": 432992, "epoch": 5216} {"train_loss": -27.222314834594727, "global_step": 432993, "epoch": 5216} {"train_loss": -27.092100143432617, "global_step": 432994, "epoch": 5216} {"train_loss": -27.406888961791992, "global_step": 432995, "epoch": 5216} {"train_loss": -27.04803466796875, "global_step": 432996, "epoch": 5216} {"train_loss": -27.30988883972168, "global_step": 432997, "epoch": 5216} {"train_loss": -26.789823532104492, "global_step": 432998, "epoch": 5216} {"train_loss": -27.108734130859375, "global_step": 432999, "epoch": 5216} {"train_loss": -27.311059951782227, "global_step": 433000, "epoch": 5216} {"train_loss": -26.919300079345703, "global_step": 433001, "epoch": 5216} {"train_loss": -27.01967430114746, "global_step": 433002, "epoch": 5216} {"train_loss": -27.120975494384766, "global_step": 433003, "epoch": 5216} {"train_loss": -27.158960342407227, "global_step": 433004, "epoch": 5216} {"train_loss": -27.20574378967285, "global_step": 433005, "epoch": 5216} {"train_loss": -26.958587646484375, "global_step": 433006, "epoch": 5216} {"train_loss": -27.089828491210938, "global_step": 433007, "epoch": 5216} {"train_loss": -27.0001163482666, "global_step": 433008, "epoch": 5216} {"train_loss": -27.082136154174805, "global_step": 433009, "epoch": 5216} {"train_loss": -26.93247615860169, "global_step": 433010, "epoch": 5216, "val_loss": 6921858.0} {"train_loss": -26.676244735717773, "global_step": 433011, "epoch": 5217} {"train_loss": -26.00006103515625, "global_step": 433012, "epoch": 5217} {"train_loss": -25.955961227416992, "global_step": 433013, "epoch": 5217} {"train_loss": -26.087940216064453, "global_step": 433014, "epoch": 5217} {"train_loss": -26.584070205688477, "global_step": 433015, "epoch": 5217} {"train_loss": -26.878530502319336, "global_step": 433016, "epoch": 5217} {"train_loss": -26.437408447265625, "global_step": 433017, "epoch": 5217} {"train_loss": -26.90839958190918, "global_step": 433018, "epoch": 5217} {"train_loss": -26.279340744018555, "global_step": 433019, "epoch": 5217} {"train_loss": -26.059772491455078, "global_step": 433020, "epoch": 5217} {"train_loss": -26.88006591796875, "global_step": 433021, "epoch": 5217} {"train_loss": -26.243871688842773, "global_step": 433022, "epoch": 5217} {"train_loss": -26.6180477142334, "global_step": 433023, "epoch": 5217} {"train_loss": -26.187057495117188, "global_step": 433024, "epoch": 5217} {"train_loss": -26.714033126831055, "global_step": 433025, "epoch": 5217} {"train_loss": -26.332843780517578, "global_step": 433026, "epoch": 5217} {"train_loss": -26.49326515197754, "global_step": 433027, "epoch": 5217} {"train_loss": -26.202350616455078, "global_step": 433028, "epoch": 5217} {"train_loss": -26.453418731689453, "global_step": 433029, "epoch": 5217} {"train_loss": -26.390151977539062, "global_step": 433030, "epoch": 5217} {"train_loss": -26.481891632080078, "global_step": 433031, "epoch": 5217} {"train_loss": -26.763946533203125, "global_step": 433032, "epoch": 5217} {"train_loss": -26.6463680267334, "global_step": 433033, "epoch": 5217} {"train_loss": -26.422260284423828, "global_step": 433034, "epoch": 5217} {"train_loss": -26.79317283630371, "global_step": 433035, "epoch": 5217} {"train_loss": -26.186542510986328, "global_step": 433036, "epoch": 5217} {"train_loss": -26.67188835144043, "global_step": 433037, "epoch": 5217} {"train_loss": -26.539770126342773, "global_step": 433038, "epoch": 5217} {"train_loss": -26.722015380859375, "global_step": 433039, "epoch": 5217} {"train_loss": -27.09449577331543, "global_step": 433040, "epoch": 5217} {"train_loss": -26.505990982055664, "global_step": 433041, "epoch": 5217} {"train_loss": -26.38925552368164, "global_step": 433042, "epoch": 5217} {"train_loss": -26.938613891601562, "global_step": 433043, "epoch": 5217} {"train_loss": -26.41224479675293, "global_step": 433044, "epoch": 5217} {"train_loss": -27.110441207885742, "global_step": 433045, "epoch": 5217} {"train_loss": -26.57488441467285, "global_step": 433046, "epoch": 5217} {"train_loss": -26.782062530517578, "global_step": 433047, "epoch": 5217} {"train_loss": -27.020360946655273, "global_step": 433048, "epoch": 5217} {"train_loss": -27.130130767822266, "global_step": 433049, "epoch": 5217} {"train_loss": -26.819013595581055, "global_step": 433050, "epoch": 5217} {"train_loss": -26.623212814331055, "global_step": 433051, "epoch": 5217} {"train_loss": -26.745412826538086, "global_step": 433052, "epoch": 5217} {"train_loss": -27.010324478149414, "global_step": 433053, "epoch": 5217} {"train_loss": -26.895750045776367, "global_step": 433054, "epoch": 5217} {"train_loss": -27.00824546813965, "global_step": 433055, "epoch": 5217} {"train_loss": -26.802194595336914, "global_step": 433056, "epoch": 5217} {"train_loss": -26.936023712158203, "global_step": 433057, "epoch": 5217} {"train_loss": -27.024877548217773, "global_step": 433058, "epoch": 5217} {"train_loss": -26.866418838500977, "global_step": 433059, "epoch": 5217} {"train_loss": -26.841938018798828, "global_step": 433060, "epoch": 5217} {"train_loss": -27.134565353393555, "global_step": 433061, "epoch": 5217} {"train_loss": -27.236936569213867, "global_step": 433062, "epoch": 5217} {"train_loss": -27.068883895874023, "global_step": 433063, "epoch": 5217} {"train_loss": -27.345748901367188, "global_step": 433064, "epoch": 5217} {"train_loss": -27.10980796813965, "global_step": 433065, "epoch": 5217} {"train_loss": -26.95338249206543, "global_step": 433066, "epoch": 5217} {"train_loss": -27.2714786529541, "global_step": 433067, "epoch": 5217} {"train_loss": -27.078882217407227, "global_step": 433068, "epoch": 5217} {"train_loss": -27.06392478942871, "global_step": 433069, "epoch": 5217} {"train_loss": -27.038293838500977, "global_step": 433070, "epoch": 5217} {"train_loss": -27.1630916595459, "global_step": 433071, "epoch": 5217} {"train_loss": -27.059518814086914, "global_step": 433072, "epoch": 5217} {"train_loss": -26.92926025390625, "global_step": 433073, "epoch": 5217} {"train_loss": -27.131494522094727, "global_step": 433074, "epoch": 5217} {"train_loss": -26.948041915893555, "global_step": 433075, "epoch": 5217} {"train_loss": -26.627410888671875, "global_step": 433076, "epoch": 5217} {"train_loss": -26.269128799438477, "global_step": 433077, "epoch": 5217} {"train_loss": -25.816761016845703, "global_step": 433078, "epoch": 5217} {"train_loss": -25.8415470123291, "global_step": 433079, "epoch": 5217} {"train_loss": -26.48972511291504, "global_step": 433080, "epoch": 5217} {"train_loss": -26.789636611938477, "global_step": 433081, "epoch": 5217} {"train_loss": -25.64020347595215, "global_step": 433082, "epoch": 5217} {"train_loss": -26.615995407104492, "global_step": 433083, "epoch": 5217} {"train_loss": -26.984619140625, "global_step": 433084, "epoch": 5217} {"train_loss": -25.741748809814453, "global_step": 433085, "epoch": 5217} {"train_loss": -26.795652389526367, "global_step": 433086, "epoch": 5217} {"train_loss": -26.58820915222168, "global_step": 433087, "epoch": 5217} {"train_loss": -26.109210968017578, "global_step": 433088, "epoch": 5217} {"train_loss": -26.846960067749023, "global_step": 433089, "epoch": 5217} {"train_loss": -26.271833419799805, "global_step": 433090, "epoch": 5217} {"train_loss": -26.559650421142578, "global_step": 433091, "epoch": 5217} {"train_loss": -26.08819580078125, "global_step": 433092, "epoch": 5217} {"train_loss": -26.645533021674098, "global_step": 433093, "epoch": 5217, "val_loss": 7071531.0} {"train_loss": -25.7493839263916, "global_step": 433094, "epoch": 5218} {"train_loss": -25.242097854614258, "global_step": 433095, "epoch": 5218} {"train_loss": -25.69134521484375, "global_step": 433096, "epoch": 5218} {"train_loss": -26.374486923217773, "global_step": 433097, "epoch": 5218} {"train_loss": -25.665979385375977, "global_step": 433098, "epoch": 5218} {"train_loss": -26.362470626831055, "global_step": 433099, "epoch": 5218} {"train_loss": -26.06815528869629, "global_step": 433100, "epoch": 5218} {"train_loss": -26.409631729125977, "global_step": 433101, "epoch": 5218} {"train_loss": -26.03206443786621, "global_step": 433102, "epoch": 5218} {"train_loss": -26.405149459838867, "global_step": 433103, "epoch": 5218} {"train_loss": -26.417261123657227, "global_step": 433104, "epoch": 5218} {"train_loss": -26.0368595123291, "global_step": 433105, "epoch": 5218} {"train_loss": -26.32854652404785, "global_step": 433106, "epoch": 5218} {"train_loss": -26.4032039642334, "global_step": 433107, "epoch": 5218} {"train_loss": -26.8308048248291, "global_step": 433108, "epoch": 5218} {"train_loss": -26.423978805541992, "global_step": 433109, "epoch": 5218} {"train_loss": -26.2274112701416, "global_step": 433110, "epoch": 5218} {"train_loss": -26.71075439453125, "global_step": 433111, "epoch": 5218} {"train_loss": -26.5526123046875, "global_step": 433112, "epoch": 5218} {"train_loss": -26.63661766052246, "global_step": 433113, "epoch": 5218} {"train_loss": -26.877979278564453, "global_step": 433114, "epoch": 5218} {"train_loss": -26.593976974487305, "global_step": 433115, "epoch": 5218} {"train_loss": -26.591022491455078, "global_step": 433116, "epoch": 5218} {"train_loss": -26.3475284576416, "global_step": 433117, "epoch": 5218} {"train_loss": -26.67667579650879, "global_step": 433118, "epoch": 5218} {"train_loss": -26.554784774780273, "global_step": 433119, "epoch": 5218} {"train_loss": -26.636127471923828, "global_step": 433120, "epoch": 5218} {"train_loss": -27.053457260131836, "global_step": 433121, "epoch": 5218} {"train_loss": -27.024890899658203, "global_step": 433122, "epoch": 5218} {"train_loss": -27.268335342407227, "global_step": 433123, "epoch": 5218} {"train_loss": -27.25506019592285, "global_step": 433124, "epoch": 5218} {"train_loss": -26.829822540283203, "global_step": 433125, "epoch": 5218} {"train_loss": -27.11459732055664, "global_step": 433126, "epoch": 5218} {"train_loss": -27.071170806884766, "global_step": 433127, "epoch": 5218} {"train_loss": -27.19314956665039, "global_step": 433128, "epoch": 5218} {"train_loss": -26.770231246948242, "global_step": 433129, "epoch": 5218} {"train_loss": -27.260229110717773, "global_step": 433130, "epoch": 5218} {"train_loss": -26.9301815032959, "global_step": 433131, "epoch": 5218} {"train_loss": -27.108755111694336, "global_step": 433132, "epoch": 5218} {"train_loss": -27.0703067779541, "global_step": 433133, "epoch": 5218} {"train_loss": -27.105121612548828, "global_step": 433134, "epoch": 5218} {"train_loss": -26.78792381286621, "global_step": 433135, "epoch": 5218} {"train_loss": -26.906320571899414, "global_step": 433136, "epoch": 5218} {"train_loss": -26.901569366455078, "global_step": 433137, "epoch": 5218} {"train_loss": -27.42681884765625, "global_step": 433138, "epoch": 5218} {"train_loss": -27.286649703979492, "global_step": 433139, "epoch": 5218} {"train_loss": -27.037683486938477, "global_step": 433140, "epoch": 5218} {"train_loss": -26.737201690673828, "global_step": 433141, "epoch": 5218} {"train_loss": -26.746484756469727, "global_step": 433142, "epoch": 5218} {"train_loss": -26.80128288269043, "global_step": 433143, "epoch": 5218} {"train_loss": -27.348255157470703, "global_step": 433144, "epoch": 5218} {"train_loss": -27.09513282775879, "global_step": 433145, "epoch": 5218} {"train_loss": -27.17963218688965, "global_step": 433146, "epoch": 5218} {"train_loss": -27.167871475219727, "global_step": 433147, "epoch": 5218} {"train_loss": -27.181665420532227, "global_step": 433148, "epoch": 5218} {"train_loss": -26.985692977905273, "global_step": 433149, "epoch": 5218} {"train_loss": -26.87032127380371, "global_step": 433150, "epoch": 5218} {"train_loss": -26.709213256835938, "global_step": 433151, "epoch": 5218} {"train_loss": -27.130435943603516, "global_step": 433152, "epoch": 5218} {"train_loss": -26.886341094970703, "global_step": 433153, "epoch": 5218} {"train_loss": -26.695226669311523, "global_step": 433154, "epoch": 5218} {"train_loss": -26.91167640686035, "global_step": 433155, "epoch": 5218} {"train_loss": -26.932758331298828, "global_step": 433156, "epoch": 5218} {"train_loss": -26.553546905517578, "global_step": 433157, "epoch": 5218} {"train_loss": -27.126880645751953, "global_step": 433158, "epoch": 5218} {"train_loss": -26.954553604125977, "global_step": 433159, "epoch": 5218} {"train_loss": -27.29143714904785, "global_step": 433160, "epoch": 5218} {"train_loss": -26.884794235229492, "global_step": 433161, "epoch": 5218} {"train_loss": -26.653156280517578, "global_step": 433162, "epoch": 5218} {"train_loss": -26.252288818359375, "global_step": 433163, "epoch": 5218} {"train_loss": -26.541242599487305, "global_step": 433164, "epoch": 5218} {"train_loss": -26.755395889282227, "global_step": 433165, "epoch": 5218} {"train_loss": -26.36942481994629, "global_step": 433166, "epoch": 5218} {"train_loss": -26.798574447631836, "global_step": 433167, "epoch": 5218} {"train_loss": -26.867645263671875, "global_step": 433168, "epoch": 5218} {"train_loss": -27.128149032592773, "global_step": 433169, "epoch": 5218} {"train_loss": -26.993932723999023, "global_step": 433170, "epoch": 5218} {"train_loss": -27.019567489624023, "global_step": 433171, "epoch": 5218} {"train_loss": -26.739465713500977, "global_step": 433172, "epoch": 5218} {"train_loss": -26.8310489654541, "global_step": 433173, "epoch": 5218} {"train_loss": -27.104562759399414, "global_step": 433174, "epoch": 5218} {"train_loss": -26.75018310546875, "global_step": 433175, "epoch": 5218} {"train_loss": -26.733780849410827, "global_step": 433176, "epoch": 5218, "val_loss": 6870914.0} {"train_loss": -25.517244338989258, "global_step": 433177, "epoch": 5219} {"train_loss": -26.054107666015625, "global_step": 433178, "epoch": 5219} {"train_loss": -26.00648307800293, "global_step": 433179, "epoch": 5219} {"train_loss": -26.443830490112305, "global_step": 433180, "epoch": 5219} {"train_loss": -26.296255111694336, "global_step": 433181, "epoch": 5219} {"train_loss": -26.249557495117188, "global_step": 433182, "epoch": 5219} {"train_loss": -26.877090454101562, "global_step": 433183, "epoch": 5219} {"train_loss": -26.151325225830078, "global_step": 433184, "epoch": 5219} {"train_loss": -26.787145614624023, "global_step": 433185, "epoch": 5219} {"train_loss": -26.417743682861328, "global_step": 433186, "epoch": 5219} {"train_loss": -26.540332794189453, "global_step": 433187, "epoch": 5219} {"train_loss": -26.664281845092773, "global_step": 433188, "epoch": 5219} {"train_loss": -26.761184692382812, "global_step": 433189, "epoch": 5219} {"train_loss": -26.676044464111328, "global_step": 433190, "epoch": 5219} {"train_loss": -26.642276763916016, "global_step": 433191, "epoch": 5219} {"train_loss": -26.474472045898438, "global_step": 433192, "epoch": 5219} {"train_loss": -27.366119384765625, "global_step": 433193, "epoch": 5219} {"train_loss": -26.479007720947266, "global_step": 433194, "epoch": 5219} {"train_loss": -26.7451114654541, "global_step": 433195, "epoch": 5219} {"train_loss": -26.945159912109375, "global_step": 433196, "epoch": 5219} {"train_loss": -27.1778621673584, "global_step": 433197, "epoch": 5219} {"train_loss": -26.990636825561523, "global_step": 433198, "epoch": 5219} {"train_loss": -26.475250244140625, "global_step": 433199, "epoch": 5219} {"train_loss": -26.653034210205078, "global_step": 433200, "epoch": 5219} {"train_loss": -26.642932891845703, "global_step": 433201, "epoch": 5219} {"train_loss": -26.855478286743164, "global_step": 433202, "epoch": 5219} {"train_loss": -26.865392684936523, "global_step": 433203, "epoch": 5219} {"train_loss": -27.00116539001465, "global_step": 433204, "epoch": 5219} {"train_loss": -26.701093673706055, "global_step": 433205, "epoch": 5219} {"train_loss": -26.839370727539062, "global_step": 433206, "epoch": 5219} {"train_loss": -26.645511627197266, "global_step": 433207, "epoch": 5219} {"train_loss": -26.4547119140625, "global_step": 433208, "epoch": 5219} {"train_loss": -26.924468994140625, "global_step": 433209, "epoch": 5219} {"train_loss": -26.6597843170166, "global_step": 433210, "epoch": 5219} {"train_loss": -27.181781768798828, "global_step": 433211, "epoch": 5219} {"train_loss": -27.1117000579834, "global_step": 433212, "epoch": 5219} {"train_loss": -27.191320419311523, "global_step": 433213, "epoch": 5219} {"train_loss": -26.817829132080078, "global_step": 433214, "epoch": 5219} {"train_loss": -26.933685302734375, "global_step": 433215, "epoch": 5219} {"train_loss": -26.93916130065918, "global_step": 433216, "epoch": 5219} {"train_loss": -26.896509170532227, "global_step": 433217, "epoch": 5219} {"train_loss": -26.930179595947266, "global_step": 433218, "epoch": 5219} {"train_loss": -27.43292236328125, "global_step": 433219, "epoch": 5219} {"train_loss": -26.771514892578125, "global_step": 433220, "epoch": 5219} {"train_loss": -26.761646270751953, "global_step": 433221, "epoch": 5219} {"train_loss": -26.835010528564453, "global_step": 433222, "epoch": 5219} {"train_loss": -26.67038917541504, "global_step": 433223, "epoch": 5219} {"train_loss": -27.0008544921875, "global_step": 433224, "epoch": 5219} {"train_loss": -26.91956901550293, "global_step": 433225, "epoch": 5219} {"train_loss": -27.046192169189453, "global_step": 433226, "epoch": 5219} {"train_loss": -27.050174713134766, "global_step": 433227, "epoch": 5219} {"train_loss": -27.362262725830078, "global_step": 433228, "epoch": 5219} {"train_loss": -26.909656524658203, "global_step": 433229, "epoch": 5219} {"train_loss": -27.13641929626465, "global_step": 433230, "epoch": 5219} {"train_loss": -27.185108184814453, "global_step": 433231, "epoch": 5219} {"train_loss": -27.454116821289062, "global_step": 433232, "epoch": 5219} {"train_loss": -27.23219871520996, "global_step": 433233, "epoch": 5219} {"train_loss": -26.857303619384766, "global_step": 433234, "epoch": 5219} {"train_loss": -27.01407241821289, "global_step": 433235, "epoch": 5219} {"train_loss": -26.531259536743164, "global_step": 433236, "epoch": 5219} {"train_loss": -27.057226181030273, "global_step": 433237, "epoch": 5219} {"train_loss": -26.63604164123535, "global_step": 433238, "epoch": 5219} {"train_loss": -26.523778915405273, "global_step": 433239, "epoch": 5219} {"train_loss": -26.75699234008789, "global_step": 433240, "epoch": 5219} {"train_loss": -26.5693359375, "global_step": 433241, "epoch": 5219} {"train_loss": -26.4263858795166, "global_step": 433242, "epoch": 5219} {"train_loss": -26.679920196533203, "global_step": 433243, "epoch": 5219} {"train_loss": -27.1199951171875, "global_step": 433244, "epoch": 5219} {"train_loss": -26.510950088500977, "global_step": 433245, "epoch": 5219} {"train_loss": -26.893707275390625, "global_step": 433246, "epoch": 5219} {"train_loss": -26.858875274658203, "global_step": 433247, "epoch": 5219} {"train_loss": -26.645496368408203, "global_step": 433248, "epoch": 5219} {"train_loss": -26.88856315612793, "global_step": 433249, "epoch": 5219} {"train_loss": -26.83876609802246, "global_step": 433250, "epoch": 5219} {"train_loss": -26.707763671875, "global_step": 433251, "epoch": 5219} {"train_loss": -26.627782821655273, "global_step": 433252, "epoch": 5219} {"train_loss": -27.2946720123291, "global_step": 433253, "epoch": 5219} {"train_loss": -26.99285316467285, "global_step": 433254, "epoch": 5219} {"train_loss": -26.796131134033203, "global_step": 433255, "epoch": 5219} {"train_loss": -26.956363677978516, "global_step": 433256, "epoch": 5219} {"train_loss": -27.00507164001465, "global_step": 433257, "epoch": 5219} {"train_loss": -27.139774322509766, "global_step": 433258, "epoch": 5219} {"train_loss": -26.79475614248988, "global_step": 433259, "epoch": 5219, "val_loss": 6796197.0} {"train_loss": -26.570587158203125, "global_step": 433260, "epoch": 5220} {"train_loss": -26.548852920532227, "global_step": 433261, "epoch": 5220} {"train_loss": -26.466337203979492, "global_step": 433262, "epoch": 5220} {"train_loss": -26.142797470092773, "global_step": 433263, "epoch": 5220} {"train_loss": -26.635522842407227, "global_step": 433264, "epoch": 5220} {"train_loss": -26.69843864440918, "global_step": 433265, "epoch": 5220} {"train_loss": -26.414365768432617, "global_step": 433266, "epoch": 5220} {"train_loss": -26.081350326538086, "global_step": 433267, "epoch": 5220} {"train_loss": -26.51370620727539, "global_step": 433268, "epoch": 5220} {"train_loss": -26.527088165283203, "global_step": 433269, "epoch": 5220} {"train_loss": -26.2887020111084, "global_step": 433270, "epoch": 5220} {"train_loss": -26.694599151611328, "global_step": 433271, "epoch": 5220} {"train_loss": -26.502283096313477, "global_step": 433272, "epoch": 5220} {"train_loss": -26.482757568359375, "global_step": 433273, "epoch": 5220} {"train_loss": -26.598281860351562, "global_step": 433274, "epoch": 5220} {"train_loss": -26.67069435119629, "global_step": 433275, "epoch": 5220} {"train_loss": -26.71546745300293, "global_step": 433276, "epoch": 5220} {"train_loss": -26.851032257080078, "global_step": 433277, "epoch": 5220} {"train_loss": -26.903274536132812, "global_step": 433278, "epoch": 5220} {"train_loss": -26.598392486572266, "global_step": 433279, "epoch": 5220} {"train_loss": -26.835498809814453, "global_step": 433280, "epoch": 5220} {"train_loss": -26.67205810546875, "global_step": 433281, "epoch": 5220} {"train_loss": -26.75312614440918, "global_step": 433282, "epoch": 5220} {"train_loss": -26.9514217376709, "global_step": 433283, "epoch": 5220} {"train_loss": -26.40287208557129, "global_step": 433284, "epoch": 5220} {"train_loss": -26.268848419189453, "global_step": 433285, "epoch": 5220} {"train_loss": -26.908056259155273, "global_step": 433286, "epoch": 5220} {"train_loss": -26.86402702331543, "global_step": 433287, "epoch": 5220} {"train_loss": -26.7012882232666, "global_step": 433288, "epoch": 5220} {"train_loss": -26.989831924438477, "global_step": 433289, "epoch": 5220} {"train_loss": -27.175537109375, "global_step": 433290, "epoch": 5220} {"train_loss": -27.047876358032227, "global_step": 433291, "epoch": 5220} {"train_loss": -27.0903263092041, "global_step": 433292, "epoch": 5220} {"train_loss": -27.051916122436523, "global_step": 433293, "epoch": 5220} {"train_loss": -27.3332462310791, "global_step": 433294, "epoch": 5220} {"train_loss": -26.9359073638916, "global_step": 433295, "epoch": 5220} {"train_loss": -27.341388702392578, "global_step": 433296, "epoch": 5220} {"train_loss": -27.267248153686523, "global_step": 433297, "epoch": 5220} {"train_loss": -26.97355079650879, "global_step": 433298, "epoch": 5220} {"train_loss": -27.200214385986328, "global_step": 433299, "epoch": 5220} {"train_loss": -27.4616641998291, "global_step": 433300, "epoch": 5220} {"train_loss": -27.00933265686035, "global_step": 433301, "epoch": 5220} {"train_loss": -26.666584014892578, "global_step": 433302, "epoch": 5220} {"train_loss": -27.084928512573242, "global_step": 433303, "epoch": 5220} {"train_loss": -26.562673568725586, "global_step": 433304, "epoch": 5220} {"train_loss": -27.00339698791504, "global_step": 433305, "epoch": 5220} {"train_loss": -26.970752716064453, "global_step": 433306, "epoch": 5220} {"train_loss": -26.655893325805664, "global_step": 433307, "epoch": 5220} {"train_loss": -26.840106964111328, "global_step": 433308, "epoch": 5220} {"train_loss": -26.723175048828125, "global_step": 433309, "epoch": 5220} {"train_loss": -26.785226821899414, "global_step": 433310, "epoch": 5220} {"train_loss": -26.9105281829834, "global_step": 433311, "epoch": 5220} {"train_loss": -26.547815322875977, "global_step": 433312, "epoch": 5220} {"train_loss": -26.490869522094727, "global_step": 433313, "epoch": 5220} {"train_loss": -26.77646827697754, "global_step": 433314, "epoch": 5220} {"train_loss": -26.507055282592773, "global_step": 433315, "epoch": 5220} {"train_loss": -26.43743896484375, "global_step": 433316, "epoch": 5220} {"train_loss": -26.505741119384766, "global_step": 433317, "epoch": 5220} {"train_loss": -26.699115753173828, "global_step": 433318, "epoch": 5220} {"train_loss": -26.79245376586914, "global_step": 433319, "epoch": 5220} {"train_loss": -26.707807540893555, "global_step": 433320, "epoch": 5220} {"train_loss": -27.1351261138916, "global_step": 433321, "epoch": 5220} {"train_loss": -26.72930908203125, "global_step": 433322, "epoch": 5220} {"train_loss": -26.93999671936035, "global_step": 433323, "epoch": 5220} {"train_loss": -27.094152450561523, "global_step": 433324, "epoch": 5220} {"train_loss": -27.053808212280273, "global_step": 433325, "epoch": 5220} {"train_loss": -27.21099853515625, "global_step": 433326, "epoch": 5220} {"train_loss": -26.782882690429688, "global_step": 433327, "epoch": 5220} {"train_loss": -26.631711959838867, "global_step": 433328, "epoch": 5220} {"train_loss": -25.86126136779785, "global_step": 433329, "epoch": 5220} {"train_loss": -25.755340576171875, "global_step": 433330, "epoch": 5220} {"train_loss": -25.86322593688965, "global_step": 433331, "epoch": 5220} {"train_loss": -26.650854110717773, "global_step": 433332, "epoch": 5220} {"train_loss": -26.859390258789062, "global_step": 433333, "epoch": 5220} {"train_loss": -26.728178024291992, "global_step": 433334, "epoch": 5220} {"train_loss": -26.292993545532227, "global_step": 433335, "epoch": 5220} {"train_loss": -26.8543701171875, "global_step": 433336, "epoch": 5220} {"train_loss": -26.229074478149414, "global_step": 433337, "epoch": 5220} {"train_loss": -26.69159507751465, "global_step": 433338, "epoch": 5220} {"train_loss": -26.454654693603516, "global_step": 433339, "epoch": 5220} {"train_loss": -26.2961368560791, "global_step": 433340, "epoch": 5220} {"train_loss": -26.921838760375977, "global_step": 433341, "epoch": 5220} {"train_loss": -26.727577439273695, "global_step": 433342, "epoch": 5220, "val_loss": 6796003.0} {"train_loss": -25.8123722076416, "global_step": 433343, "epoch": 5221} {"train_loss": -26.464590072631836, "global_step": 433344, "epoch": 5221} {"train_loss": -25.917682647705078, "global_step": 433345, "epoch": 5221} {"train_loss": -26.553668975830078, "global_step": 433346, "epoch": 5221} {"train_loss": -26.12821388244629, "global_step": 433347, "epoch": 5221} {"train_loss": -26.047677993774414, "global_step": 433348, "epoch": 5221} {"train_loss": -26.231128692626953, "global_step": 433349, "epoch": 5221} {"train_loss": -26.11052894592285, "global_step": 433350, "epoch": 5221} {"train_loss": -26.539148330688477, "global_step": 433351, "epoch": 5221} {"train_loss": -26.356311798095703, "global_step": 433352, "epoch": 5221} {"train_loss": -26.203662872314453, "global_step": 433353, "epoch": 5221} {"train_loss": -26.244184494018555, "global_step": 433354, "epoch": 5221} {"train_loss": -26.59109878540039, "global_step": 433355, "epoch": 5221} {"train_loss": -26.462671279907227, "global_step": 433356, "epoch": 5221} {"train_loss": -26.490304946899414, "global_step": 433357, "epoch": 5221} {"train_loss": -26.55531120300293, "global_step": 433358, "epoch": 5221} {"train_loss": -26.386566162109375, "global_step": 433359, "epoch": 5221} {"train_loss": -26.753620147705078, "global_step": 433360, "epoch": 5221} {"train_loss": -26.879886627197266, "global_step": 433361, "epoch": 5221} {"train_loss": -26.7938232421875, "global_step": 433362, "epoch": 5221} {"train_loss": -27.088285446166992, "global_step": 433363, "epoch": 5221} {"train_loss": -26.739398956298828, "global_step": 433364, "epoch": 5221} {"train_loss": -26.652475357055664, "global_step": 433365, "epoch": 5221} {"train_loss": -26.809194564819336, "global_step": 433366, "epoch": 5221} {"train_loss": -26.948184967041016, "global_step": 433367, "epoch": 5221} {"train_loss": -26.671552658081055, "global_step": 433368, "epoch": 5221} {"train_loss": -26.885709762573242, "global_step": 433369, "epoch": 5221} {"train_loss": -26.537382125854492, "global_step": 433370, "epoch": 5221} {"train_loss": -26.907440185546875, "global_step": 433371, "epoch": 5221} {"train_loss": -26.62404441833496, "global_step": 433372, "epoch": 5221} {"train_loss": -26.69671058654785, "global_step": 433373, "epoch": 5221} {"train_loss": -26.7990779876709, "global_step": 433374, "epoch": 5221} {"train_loss": -27.283283233642578, "global_step": 433375, "epoch": 5221} {"train_loss": -26.844940185546875, "global_step": 433376, "epoch": 5221} {"train_loss": -27.4274959564209, "global_step": 433377, "epoch": 5221} {"train_loss": -26.897382736206055, "global_step": 433378, "epoch": 5221} {"train_loss": -26.791568756103516, "global_step": 433379, "epoch": 5221} {"train_loss": -27.050336837768555, "global_step": 433380, "epoch": 5221} {"train_loss": -27.001651763916016, "global_step": 433381, "epoch": 5221} {"train_loss": -26.69452476501465, "global_step": 433382, "epoch": 5221} {"train_loss": -27.068578720092773, "global_step": 433383, "epoch": 5221} {"train_loss": -27.07880973815918, "global_step": 433384, "epoch": 5221} {"train_loss": -26.996490478515625, "global_step": 433385, "epoch": 5221} {"train_loss": -27.263294219970703, "global_step": 433386, "epoch": 5221} {"train_loss": -27.417333602905273, "global_step": 433387, "epoch": 5221} {"train_loss": -26.7193660736084, "global_step": 433388, "epoch": 5221} {"train_loss": -27.099262237548828, "global_step": 433389, "epoch": 5221} {"train_loss": -26.90838623046875, "global_step": 433390, "epoch": 5221} {"train_loss": -26.810606002807617, "global_step": 433391, "epoch": 5221} {"train_loss": -27.01611328125, "global_step": 433392, "epoch": 5221} {"train_loss": -26.81342124938965, "global_step": 433393, "epoch": 5221} {"train_loss": -26.9350528717041, "global_step": 433394, "epoch": 5221} {"train_loss": -27.376203536987305, "global_step": 433395, "epoch": 5221} {"train_loss": -26.687591552734375, "global_step": 433396, "epoch": 5221} {"train_loss": -27.08380126953125, "global_step": 433397, "epoch": 5221} {"train_loss": -26.728378295898438, "global_step": 433398, "epoch": 5221} {"train_loss": -27.0712833404541, "global_step": 433399, "epoch": 5221} {"train_loss": -27.094568252563477, "global_step": 433400, "epoch": 5221} {"train_loss": -26.675073623657227, "global_step": 433401, "epoch": 5221} {"train_loss": -26.643354415893555, "global_step": 433402, "epoch": 5221} {"train_loss": -26.64838981628418, "global_step": 433403, "epoch": 5221} {"train_loss": -26.786975860595703, "global_step": 433404, "epoch": 5221} {"train_loss": -26.87628746032715, "global_step": 433405, "epoch": 5221} {"train_loss": -26.9693603515625, "global_step": 433406, "epoch": 5221} {"train_loss": -26.860553741455078, "global_step": 433407, "epoch": 5221} {"train_loss": -26.785736083984375, "global_step": 433408, "epoch": 5221} {"train_loss": -26.96731948852539, "global_step": 433409, "epoch": 5221} {"train_loss": -26.75705337524414, "global_step": 433410, "epoch": 5221} {"train_loss": -26.9525203704834, "global_step": 433411, "epoch": 5221} {"train_loss": -27.02622413635254, "global_step": 433412, "epoch": 5221} {"train_loss": -26.975366592407227, "global_step": 433413, "epoch": 5221} {"train_loss": -27.002197265625, "global_step": 433414, "epoch": 5221} {"train_loss": -26.98042106628418, "global_step": 433415, "epoch": 5221} {"train_loss": -27.141956329345703, "global_step": 433416, "epoch": 5221} {"train_loss": -26.39569664001465, "global_step": 433417, "epoch": 5221} {"train_loss": -26.93668556213379, "global_step": 433418, "epoch": 5221} {"train_loss": -26.75629234313965, "global_step": 433419, "epoch": 5221} {"train_loss": -27.027151107788086, "global_step": 433420, "epoch": 5221} {"train_loss": -26.76081657409668, "global_step": 433421, "epoch": 5221} {"train_loss": -27.194904327392578, "global_step": 433422, "epoch": 5221} {"train_loss": -26.7430362701416, "global_step": 433423, "epoch": 5221} {"train_loss": -27.00811195373535, "global_step": 433424, "epoch": 5221} {"train_loss": -26.790986716029156, "global_step": 433425, "epoch": 5221, "val_loss": 6831208.0} {"train_loss": -26.506229400634766, "global_step": 433426, "epoch": 5222} {"train_loss": -26.79572868347168, "global_step": 433427, "epoch": 5222} {"train_loss": -26.278661727905273, "global_step": 433428, "epoch": 5222} {"train_loss": -26.6179141998291, "global_step": 433429, "epoch": 5222} {"train_loss": -26.338415145874023, "global_step": 433430, "epoch": 5222} {"train_loss": -26.81939125061035, "global_step": 433431, "epoch": 5222} {"train_loss": -26.426679611206055, "global_step": 433432, "epoch": 5222} {"train_loss": -26.76637077331543, "global_step": 433433, "epoch": 5222} {"train_loss": -26.67752456665039, "global_step": 433434, "epoch": 5222} {"train_loss": -26.788732528686523, "global_step": 433435, "epoch": 5222} {"train_loss": -26.4981632232666, "global_step": 433436, "epoch": 5222} {"train_loss": -26.865156173706055, "global_step": 433437, "epoch": 5222} {"train_loss": -26.3668155670166, "global_step": 433438, "epoch": 5222} {"train_loss": -26.549362182617188, "global_step": 433439, "epoch": 5222} {"train_loss": -26.873830795288086, "global_step": 433440, "epoch": 5222} {"train_loss": -27.007070541381836, "global_step": 433441, "epoch": 5222} {"train_loss": -26.817712783813477, "global_step": 433442, "epoch": 5222} {"train_loss": -26.573781967163086, "global_step": 433443, "epoch": 5222} {"train_loss": -26.93745231628418, "global_step": 433444, "epoch": 5222} {"train_loss": -26.845434188842773, "global_step": 433445, "epoch": 5222} {"train_loss": -26.628812789916992, "global_step": 433446, "epoch": 5222} {"train_loss": -26.72490882873535, "global_step": 433447, "epoch": 5222} {"train_loss": -27.02081298828125, "global_step": 433448, "epoch": 5222} {"train_loss": -26.752084732055664, "global_step": 433449, "epoch": 5222} {"train_loss": -26.77933692932129, "global_step": 433450, "epoch": 5222} {"train_loss": -27.055744171142578, "global_step": 433451, "epoch": 5222} {"train_loss": -27.07586669921875, "global_step": 433452, "epoch": 5222} {"train_loss": -27.153608322143555, "global_step": 433453, "epoch": 5222} {"train_loss": -27.056100845336914, "global_step": 433454, "epoch": 5222} {"train_loss": -27.13166618347168, "global_step": 433455, "epoch": 5222} {"train_loss": -27.248931884765625, "global_step": 433456, "epoch": 5222} {"train_loss": -26.95172691345215, "global_step": 433457, "epoch": 5222} {"train_loss": -26.810535430908203, "global_step": 433458, "epoch": 5222} {"train_loss": -27.183807373046875, "global_step": 433459, "epoch": 5222} {"train_loss": -27.034305572509766, "global_step": 433460, "epoch": 5222} {"train_loss": -26.934003829956055, "global_step": 433461, "epoch": 5222} {"train_loss": -26.688770294189453, "global_step": 433462, "epoch": 5222} {"train_loss": -26.813993453979492, "global_step": 433463, "epoch": 5222} {"train_loss": -26.519977569580078, "global_step": 433464, "epoch": 5222} {"train_loss": -26.785810470581055, "global_step": 433465, "epoch": 5222} {"train_loss": -26.870038986206055, "global_step": 433466, "epoch": 5222} {"train_loss": -26.827911376953125, "global_step": 433467, "epoch": 5222} {"train_loss": -26.765066146850586, "global_step": 433468, "epoch": 5222} {"train_loss": -26.96065330505371, "global_step": 433469, "epoch": 5222} {"train_loss": -26.761316299438477, "global_step": 433470, "epoch": 5222} {"train_loss": -26.7459659576416, "global_step": 433471, "epoch": 5222} {"train_loss": -27.15705680847168, "global_step": 433472, "epoch": 5222} {"train_loss": -27.132665634155273, "global_step": 433473, "epoch": 5222} {"train_loss": -26.929311752319336, "global_step": 433474, "epoch": 5222} {"train_loss": -26.89678955078125, "global_step": 433475, "epoch": 5222} {"train_loss": -26.983152389526367, "global_step": 433476, "epoch": 5222} {"train_loss": -26.975772857666016, "global_step": 433477, "epoch": 5222} {"train_loss": -26.844648361206055, "global_step": 433478, "epoch": 5222} {"train_loss": -27.256391525268555, "global_step": 433479, "epoch": 5222} {"train_loss": -27.13877296447754, "global_step": 433480, "epoch": 5222} {"train_loss": -27.007617950439453, "global_step": 433481, "epoch": 5222} {"train_loss": -26.921722412109375, "global_step": 433482, "epoch": 5222} {"train_loss": -26.74264907836914, "global_step": 433483, "epoch": 5222} {"train_loss": -27.2177791595459, "global_step": 433484, "epoch": 5222} {"train_loss": -26.863569259643555, "global_step": 433485, "epoch": 5222} {"train_loss": -27.19439125061035, "global_step": 433486, "epoch": 5222} {"train_loss": -26.741689682006836, "global_step": 433487, "epoch": 5222} {"train_loss": -27.40364646911621, "global_step": 433488, "epoch": 5222} {"train_loss": -26.65301513671875, "global_step": 433489, "epoch": 5222} {"train_loss": -27.31270408630371, "global_step": 433490, "epoch": 5222} {"train_loss": -26.705707550048828, "global_step": 433491, "epoch": 5222} {"train_loss": -26.922428131103516, "global_step": 433492, "epoch": 5222} {"train_loss": -26.851490020751953, "global_step": 433493, "epoch": 5222} {"train_loss": -27.26679801940918, "global_step": 433494, "epoch": 5222} {"train_loss": -26.941898345947266, "global_step": 433495, "epoch": 5222} {"train_loss": -27.061925888061523, "global_step": 433496, "epoch": 5222} {"train_loss": -27.03363037109375, "global_step": 433497, "epoch": 5222} {"train_loss": -26.44208335876465, "global_step": 433498, "epoch": 5222} {"train_loss": -26.99629783630371, "global_step": 433499, "epoch": 5222} {"train_loss": -27.07177734375, "global_step": 433500, "epoch": 5222} {"train_loss": -26.6867618560791, "global_step": 433501, "epoch": 5222} {"train_loss": -26.689428329467773, "global_step": 433502, "epoch": 5222} {"train_loss": -26.893491744995117, "global_step": 433503, "epoch": 5222} {"train_loss": -26.666669845581055, "global_step": 433504, "epoch": 5222} {"train_loss": -27.068775177001953, "global_step": 433505, "epoch": 5222} {"train_loss": -26.75019645690918, "global_step": 433506, "epoch": 5222} {"train_loss": -26.95810890197754, "global_step": 433507, "epoch": 5222} {"train_loss": -26.880521613431263, "global_step": 433508, "epoch": 5222, "val_loss": 6844553.0} {"train_loss": -26.886411666870117, "global_step": 433509, "epoch": 5223} {"train_loss": -26.423389434814453, "global_step": 433510, "epoch": 5223} {"train_loss": -25.954694747924805, "global_step": 433511, "epoch": 5223} {"train_loss": -25.9467830657959, "global_step": 433512, "epoch": 5223} {"train_loss": -26.13226318359375, "global_step": 433513, "epoch": 5223} {"train_loss": -26.4719295501709, "global_step": 433514, "epoch": 5223} {"train_loss": -25.9920654296875, "global_step": 433515, "epoch": 5223} {"train_loss": -26.127429962158203, "global_step": 433516, "epoch": 5223} {"train_loss": -25.92881202697754, "global_step": 433517, "epoch": 5223} {"train_loss": -26.381006240844727, "global_step": 433518, "epoch": 5223} {"train_loss": -26.837360382080078, "global_step": 433519, "epoch": 5223} {"train_loss": -26.458393096923828, "global_step": 433520, "epoch": 5223} {"train_loss": -26.260892868041992, "global_step": 433521, "epoch": 5223} {"train_loss": -26.20611572265625, "global_step": 433522, "epoch": 5223} {"train_loss": -26.55771827697754, "global_step": 433523, "epoch": 5223} {"train_loss": -26.941791534423828, "global_step": 433524, "epoch": 5223} {"train_loss": -26.76236343383789, "global_step": 433525, "epoch": 5223} {"train_loss": -26.4239501953125, "global_step": 433526, "epoch": 5223} {"train_loss": -26.65247917175293, "global_step": 433527, "epoch": 5223} {"train_loss": -26.567584991455078, "global_step": 433528, "epoch": 5223} {"train_loss": -26.3353271484375, "global_step": 433529, "epoch": 5223} {"train_loss": -26.204938888549805, "global_step": 433530, "epoch": 5223} {"train_loss": -26.895751953125, "global_step": 433531, "epoch": 5223} {"train_loss": -26.691492080688477, "global_step": 433532, "epoch": 5223} {"train_loss": -26.672574996948242, "global_step": 433533, "epoch": 5223} {"train_loss": -26.653858184814453, "global_step": 433534, "epoch": 5223} {"train_loss": -26.643543243408203, "global_step": 433535, "epoch": 5223} {"train_loss": -26.681751251220703, "global_step": 433536, "epoch": 5223} {"train_loss": -26.803632736206055, "global_step": 433537, "epoch": 5223} {"train_loss": -27.082998275756836, "global_step": 433538, "epoch": 5223} {"train_loss": -26.98587417602539, "global_step": 433539, "epoch": 5223} {"train_loss": -27.316625595092773, "global_step": 433540, "epoch": 5223} {"train_loss": -26.730173110961914, "global_step": 433541, "epoch": 5223} {"train_loss": -26.88978385925293, "global_step": 433542, "epoch": 5223} {"train_loss": -27.019651412963867, "global_step": 433543, "epoch": 5223} {"train_loss": -27.173368453979492, "global_step": 433544, "epoch": 5223} {"train_loss": -26.789199829101562, "global_step": 433545, "epoch": 5223} {"train_loss": -27.260290145874023, "global_step": 433546, "epoch": 5223} {"train_loss": -27.053619384765625, "global_step": 433547, "epoch": 5223} {"train_loss": -27.145261764526367, "global_step": 433548, "epoch": 5223} {"train_loss": -26.807828903198242, "global_step": 433549, "epoch": 5223} {"train_loss": -26.56378746032715, "global_step": 433550, "epoch": 5223} {"train_loss": -26.557907104492188, "global_step": 433551, "epoch": 5223} {"train_loss": -27.209177017211914, "global_step": 433552, "epoch": 5223} {"train_loss": -27.362079620361328, "global_step": 433553, "epoch": 5223} {"train_loss": -26.663684844970703, "global_step": 433554, "epoch": 5223} {"train_loss": -26.909250259399414, "global_step": 433555, "epoch": 5223} {"train_loss": -26.595788955688477, "global_step": 433556, "epoch": 5223} {"train_loss": -26.636865615844727, "global_step": 433557, "epoch": 5223} {"train_loss": -27.152524948120117, "global_step": 433558, "epoch": 5223} {"train_loss": -26.640247344970703, "global_step": 433559, "epoch": 5223} {"train_loss": -26.96063804626465, "global_step": 433560, "epoch": 5223} {"train_loss": -26.914661407470703, "global_step": 433561, "epoch": 5223} {"train_loss": -27.06626319885254, "global_step": 433562, "epoch": 5223} {"train_loss": -26.879322052001953, "global_step": 433563, "epoch": 5223} {"train_loss": -27.03635597229004, "global_step": 433564, "epoch": 5223} {"train_loss": -26.862340927124023, "global_step": 433565, "epoch": 5223} {"train_loss": -26.84296989440918, "global_step": 433566, "epoch": 5223} {"train_loss": -27.112136840820312, "global_step": 433567, "epoch": 5223} {"train_loss": -27.119338989257812, "global_step": 433568, "epoch": 5223} {"train_loss": -27.1077823638916, "global_step": 433569, "epoch": 5223} {"train_loss": -27.439599990844727, "global_step": 433570, "epoch": 5223} {"train_loss": -27.373077392578125, "global_step": 433571, "epoch": 5223} {"train_loss": -27.245656967163086, "global_step": 433572, "epoch": 5223} {"train_loss": -26.718067169189453, "global_step": 433573, "epoch": 5223} {"train_loss": -26.97706413269043, "global_step": 433574, "epoch": 5223} {"train_loss": -27.075698852539062, "global_step": 433575, "epoch": 5223} {"train_loss": -27.14863395690918, "global_step": 433576, "epoch": 5223} {"train_loss": -26.683069229125977, "global_step": 433577, "epoch": 5223} {"train_loss": -27.089664459228516, "global_step": 433578, "epoch": 5223} {"train_loss": -27.232685089111328, "global_step": 433579, "epoch": 5223} {"train_loss": -26.993854522705078, "global_step": 433580, "epoch": 5223} {"train_loss": -27.043838500976562, "global_step": 433581, "epoch": 5223} {"train_loss": -26.90122413635254, "global_step": 433582, "epoch": 5223} {"train_loss": -26.439313888549805, "global_step": 433583, "epoch": 5223} {"train_loss": -26.233816146850586, "global_step": 433584, "epoch": 5223} {"train_loss": -27.016921997070312, "global_step": 433585, "epoch": 5223} {"train_loss": -26.936969757080078, "global_step": 433586, "epoch": 5223} {"train_loss": -26.782840728759766, "global_step": 433587, "epoch": 5223} {"train_loss": -26.81658363342285, "global_step": 433588, "epoch": 5223} {"train_loss": -26.30795669555664, "global_step": 433589, "epoch": 5223} {"train_loss": -26.71786880493164, "global_step": 433590, "epoch": 5223} {"train_loss": -26.776259295911675, "global_step": 433591, "epoch": 5223, "val_loss": 6672066.0} {"train_loss": -26.600439071655273, "global_step": 433592, "epoch": 5224} {"train_loss": -26.353240966796875, "global_step": 433593, "epoch": 5224} {"train_loss": -26.469823837280273, "global_step": 433594, "epoch": 5224} {"train_loss": -26.661344528198242, "global_step": 433595, "epoch": 5224} {"train_loss": -26.896503448486328, "global_step": 433596, "epoch": 5224} {"train_loss": -26.02381706237793, "global_step": 433597, "epoch": 5224} {"train_loss": -26.176481246948242, "global_step": 433598, "epoch": 5224} {"train_loss": -26.131444931030273, "global_step": 433599, "epoch": 5224} {"train_loss": -26.698169708251953, "global_step": 433600, "epoch": 5224} {"train_loss": -26.676715850830078, "global_step": 433601, "epoch": 5224} {"train_loss": -27.183856964111328, "global_step": 433602, "epoch": 5224} {"train_loss": -26.425312042236328, "global_step": 433603, "epoch": 5224} {"train_loss": -26.72947120666504, "global_step": 433604, "epoch": 5224} {"train_loss": -26.35835838317871, "global_step": 433605, "epoch": 5224} {"train_loss": -26.7702693939209, "global_step": 433606, "epoch": 5224} {"train_loss": -26.704431533813477, "global_step": 433607, "epoch": 5224} {"train_loss": -26.628448486328125, "global_step": 433608, "epoch": 5224} {"train_loss": -26.8348331451416, "global_step": 433609, "epoch": 5224} {"train_loss": -26.3176326751709, "global_step": 433610, "epoch": 5224} {"train_loss": -26.734445571899414, "global_step": 433611, "epoch": 5224} {"train_loss": -26.811981201171875, "global_step": 433612, "epoch": 5224} {"train_loss": -26.84626579284668, "global_step": 433613, "epoch": 5224} {"train_loss": -26.589895248413086, "global_step": 433614, "epoch": 5224} {"train_loss": -26.732152938842773, "global_step": 433615, "epoch": 5224} {"train_loss": -26.906293869018555, "global_step": 433616, "epoch": 5224} {"train_loss": -26.972736358642578, "global_step": 433617, "epoch": 5224} {"train_loss": -26.89544105529785, "global_step": 433618, "epoch": 5224} {"train_loss": -26.828733444213867, "global_step": 433619, "epoch": 5224} {"train_loss": -27.012983322143555, "global_step": 433620, "epoch": 5224} {"train_loss": -26.52131462097168, "global_step": 433621, "epoch": 5224} {"train_loss": -26.61060905456543, "global_step": 433622, "epoch": 5224} {"train_loss": -26.78662109375, "global_step": 433623, "epoch": 5224} {"train_loss": -26.777069091796875, "global_step": 433624, "epoch": 5224} {"train_loss": -27.148523330688477, "global_step": 433625, "epoch": 5224} {"train_loss": -26.82965660095215, "global_step": 433626, "epoch": 5224} {"train_loss": -26.67303466796875, "global_step": 433627, "epoch": 5224} {"train_loss": -27.033411026000977, "global_step": 433628, "epoch": 5224} {"train_loss": -27.055023193359375, "global_step": 433629, "epoch": 5224} {"train_loss": -26.850082397460938, "global_step": 433630, "epoch": 5224} {"train_loss": -26.81597900390625, "global_step": 433631, "epoch": 5224} {"train_loss": -26.698410034179688, "global_step": 433632, "epoch": 5224} {"train_loss": -26.97161293029785, "global_step": 433633, "epoch": 5224} {"train_loss": -27.174585342407227, "global_step": 433634, "epoch": 5224} {"train_loss": -27.0200252532959, "global_step": 433635, "epoch": 5224} {"train_loss": -26.995838165283203, "global_step": 433636, "epoch": 5224} {"train_loss": -26.768163681030273, "global_step": 433637, "epoch": 5224} {"train_loss": -27.027755737304688, "global_step": 433638, "epoch": 5224} {"train_loss": -26.373371124267578, "global_step": 433639, "epoch": 5224} {"train_loss": -26.998687744140625, "global_step": 433640, "epoch": 5224} {"train_loss": -26.919754028320312, "global_step": 433641, "epoch": 5224} {"train_loss": -27.25196647644043, "global_step": 433642, "epoch": 5224} {"train_loss": -27.21050453186035, "global_step": 433643, "epoch": 5224} {"train_loss": -26.6806640625, "global_step": 433644, "epoch": 5224} {"train_loss": -26.847822189331055, "global_step": 433645, "epoch": 5224} {"train_loss": -26.97450065612793, "global_step": 433646, "epoch": 5224} {"train_loss": -27.084760665893555, "global_step": 433647, "epoch": 5224} {"train_loss": -26.8847713470459, "global_step": 433648, "epoch": 5224} {"train_loss": -27.171716690063477, "global_step": 433649, "epoch": 5224} {"train_loss": -26.757917404174805, "global_step": 433650, "epoch": 5224} {"train_loss": -26.694223403930664, "global_step": 433651, "epoch": 5224} {"train_loss": -26.82516860961914, "global_step": 433652, "epoch": 5224} {"train_loss": -27.1751651763916, "global_step": 433653, "epoch": 5224} {"train_loss": -26.922378540039062, "global_step": 433654, "epoch": 5224} {"train_loss": -26.978605270385742, "global_step": 433655, "epoch": 5224} {"train_loss": -26.725561141967773, "global_step": 433656, "epoch": 5224} {"train_loss": -26.836225509643555, "global_step": 433657, "epoch": 5224} {"train_loss": -27.005035400390625, "global_step": 433658, "epoch": 5224} {"train_loss": -26.663528442382812, "global_step": 433659, "epoch": 5224} {"train_loss": -26.584081649780273, "global_step": 433660, "epoch": 5224} {"train_loss": -27.21807861328125, "global_step": 433661, "epoch": 5224} {"train_loss": -27.03228759765625, "global_step": 433662, "epoch": 5224} {"train_loss": -27.04200553894043, "global_step": 433663, "epoch": 5224} {"train_loss": -26.45537757873535, "global_step": 433664, "epoch": 5224} {"train_loss": -26.718463897705078, "global_step": 433665, "epoch": 5224} {"train_loss": -26.71504020690918, "global_step": 433666, "epoch": 5224} {"train_loss": -26.596572875976562, "global_step": 433667, "epoch": 5224} {"train_loss": -26.9973201751709, "global_step": 433668, "epoch": 5224} {"train_loss": -26.612146377563477, "global_step": 433669, "epoch": 5224} {"train_loss": -26.94471549987793, "global_step": 433670, "epoch": 5224} {"train_loss": -26.768239974975586, "global_step": 433671, "epoch": 5224} {"train_loss": -26.84987449645996, "global_step": 433672, "epoch": 5224} {"train_loss": -26.997961044311523, "global_step": 433673, "epoch": 5224} {"train_loss": -26.801409480083418, "global_step": 433674, "epoch": 5224, "val_loss": 6829601.0} {"train_loss": -26.462717056274414, "global_step": 433675, "epoch": 5225} {"train_loss": -26.116535186767578, "global_step": 433676, "epoch": 5225} {"train_loss": -25.97035026550293, "global_step": 433677, "epoch": 5225} {"train_loss": -26.344358444213867, "global_step": 433678, "epoch": 5225} {"train_loss": -26.47418785095215, "global_step": 433679, "epoch": 5225} {"train_loss": -26.427648544311523, "global_step": 433680, "epoch": 5225} {"train_loss": -26.396326065063477, "global_step": 433681, "epoch": 5225} {"train_loss": -26.224491119384766, "global_step": 433682, "epoch": 5225} {"train_loss": -26.647085189819336, "global_step": 433683, "epoch": 5225} {"train_loss": -26.5524959564209, "global_step": 433684, "epoch": 5225} {"train_loss": -26.826313018798828, "global_step": 433685, "epoch": 5225} {"train_loss": -26.647663116455078, "global_step": 433686, "epoch": 5225} {"train_loss": -26.2034854888916, "global_step": 433687, "epoch": 5225} {"train_loss": -26.966339111328125, "global_step": 433688, "epoch": 5225} {"train_loss": -26.980243682861328, "global_step": 433689, "epoch": 5225} {"train_loss": -26.7080078125, "global_step": 433690, "epoch": 5225} {"train_loss": -27.15277671813965, "global_step": 433691, "epoch": 5225} {"train_loss": -26.804458618164062, "global_step": 433692, "epoch": 5225} {"train_loss": -27.052175521850586, "global_step": 433693, "epoch": 5225} {"train_loss": -27.0219669342041, "global_step": 433694, "epoch": 5225} {"train_loss": -26.779279708862305, "global_step": 433695, "epoch": 5225} {"train_loss": -26.745405197143555, "global_step": 433696, "epoch": 5225} {"train_loss": -26.835020065307617, "global_step": 433697, "epoch": 5225} {"train_loss": -26.671096801757812, "global_step": 433698, "epoch": 5225} {"train_loss": -26.77491569519043, "global_step": 433699, "epoch": 5225} {"train_loss": -27.461267471313477, "global_step": 433700, "epoch": 5225} {"train_loss": -26.8438663482666, "global_step": 433701, "epoch": 5225} {"train_loss": -26.807092666625977, "global_step": 433702, "epoch": 5225} {"train_loss": -26.9915714263916, "global_step": 433703, "epoch": 5225} {"train_loss": -26.97943115234375, "global_step": 433704, "epoch": 5225} {"train_loss": -26.927793502807617, "global_step": 433705, "epoch": 5225} {"train_loss": -26.720212936401367, "global_step": 433706, "epoch": 5225} {"train_loss": -26.975439071655273, "global_step": 433707, "epoch": 5225} {"train_loss": -26.350494384765625, "global_step": 433708, "epoch": 5225} {"train_loss": -26.7757625579834, "global_step": 433709, "epoch": 5225} {"train_loss": -27.07795524597168, "global_step": 433710, "epoch": 5225} {"train_loss": -27.045612335205078, "global_step": 433711, "epoch": 5225} {"train_loss": -26.82594871520996, "global_step": 433712, "epoch": 5225} {"train_loss": -26.939481735229492, "global_step": 433713, "epoch": 5225} {"train_loss": -26.678131103515625, "global_step": 433714, "epoch": 5225} {"train_loss": -26.615066528320312, "global_step": 433715, "epoch": 5225} {"train_loss": -27.13593101501465, "global_step": 433716, "epoch": 5225} {"train_loss": -26.721288681030273, "global_step": 433717, "epoch": 5225} {"train_loss": -26.98223304748535, "global_step": 433718, "epoch": 5225} {"train_loss": -26.767667770385742, "global_step": 433719, "epoch": 5225} {"train_loss": -27.36798667907715, "global_step": 433720, "epoch": 5225} {"train_loss": -26.522436141967773, "global_step": 433721, "epoch": 5225} {"train_loss": -26.80506706237793, "global_step": 433722, "epoch": 5225} {"train_loss": -27.069543838500977, "global_step": 433723, "epoch": 5225} {"train_loss": -27.158618927001953, "global_step": 433724, "epoch": 5225} {"train_loss": -27.004764556884766, "global_step": 433725, "epoch": 5225} {"train_loss": -26.90755271911621, "global_step": 433726, "epoch": 5225} {"train_loss": -27.052581787109375, "global_step": 433727, "epoch": 5225} {"train_loss": -27.045068740844727, "global_step": 433728, "epoch": 5225} {"train_loss": -27.129669189453125, "global_step": 433729, "epoch": 5225} {"train_loss": -26.857507705688477, "global_step": 433730, "epoch": 5225} {"train_loss": -26.57177734375, "global_step": 433731, "epoch": 5225} {"train_loss": -27.236799240112305, "global_step": 433732, "epoch": 5225} {"train_loss": -27.05963706970215, "global_step": 433733, "epoch": 5225} {"train_loss": -26.564529418945312, "global_step": 433734, "epoch": 5225} {"train_loss": -26.853759765625, "global_step": 433735, "epoch": 5225} {"train_loss": -27.286975860595703, "global_step": 433736, "epoch": 5225} {"train_loss": -27.353652954101562, "global_step": 433737, "epoch": 5225} {"train_loss": -26.88970947265625, "global_step": 433738, "epoch": 5225} {"train_loss": -27.09419059753418, "global_step": 433739, "epoch": 5225} {"train_loss": -26.959796905517578, "global_step": 433740, "epoch": 5225} {"train_loss": -26.816314697265625, "global_step": 433741, "epoch": 5225} {"train_loss": -26.8851261138916, "global_step": 433742, "epoch": 5225} {"train_loss": -26.83405113220215, "global_step": 433743, "epoch": 5225} {"train_loss": -26.83660316467285, "global_step": 433744, "epoch": 5225} {"train_loss": -26.83327293395996, "global_step": 433745, "epoch": 5225} {"train_loss": -26.5690860748291, "global_step": 433746, "epoch": 5225} {"train_loss": -27.094375610351562, "global_step": 433747, "epoch": 5225} {"train_loss": -26.952117919921875, "global_step": 433748, "epoch": 5225} {"train_loss": -26.880285263061523, "global_step": 433749, "epoch": 5225} {"train_loss": -26.83544921875, "global_step": 433750, "epoch": 5225} {"train_loss": -27.225210189819336, "global_step": 433751, "epoch": 5225} {"train_loss": -26.897541046142578, "global_step": 433752, "epoch": 5225} {"train_loss": -26.8558349609375, "global_step": 433753, "epoch": 5225} {"train_loss": -26.96465492248535, "global_step": 433754, "epoch": 5225} {"train_loss": -26.6817684173584, "global_step": 433755, "epoch": 5225} {"train_loss": -26.768848419189453, "global_step": 433756, "epoch": 5225} {"train_loss": -26.84349983858775, "global_step": 433757, "epoch": 5225, "val_loss": 6780795.0} {"train_loss": -26.242572784423828, "global_step": 433758, "epoch": 5226} {"train_loss": -25.353506088256836, "global_step": 433759, "epoch": 5226} {"train_loss": -25.269826889038086, "global_step": 433760, "epoch": 5226} {"train_loss": -24.6700382232666, "global_step": 433761, "epoch": 5226} {"train_loss": -25.803876876831055, "global_step": 433762, "epoch": 5226} {"train_loss": -25.90790367126465, "global_step": 433763, "epoch": 5226} {"train_loss": -25.928394317626953, "global_step": 433764, "epoch": 5226} {"train_loss": -26.56056022644043, "global_step": 433765, "epoch": 5226} {"train_loss": -26.095489501953125, "global_step": 433766, "epoch": 5226} {"train_loss": -25.81804847717285, "global_step": 433767, "epoch": 5226} {"train_loss": -26.5106143951416, "global_step": 433768, "epoch": 5226} {"train_loss": -25.723865509033203, "global_step": 433769, "epoch": 5226} {"train_loss": -26.437963485717773, "global_step": 433770, "epoch": 5226} {"train_loss": -25.969818115234375, "global_step": 433771, "epoch": 5226} {"train_loss": -26.635833740234375, "global_step": 433772, "epoch": 5226} {"train_loss": -26.331647872924805, "global_step": 433773, "epoch": 5226} {"train_loss": -26.538949966430664, "global_step": 433774, "epoch": 5226} {"train_loss": -26.559125900268555, "global_step": 433775, "epoch": 5226} {"train_loss": -26.573606491088867, "global_step": 433776, "epoch": 5226} {"train_loss": -26.638381958007812, "global_step": 433777, "epoch": 5226} {"train_loss": -26.521270751953125, "global_step": 433778, "epoch": 5226} {"train_loss": -26.2684383392334, "global_step": 433779, "epoch": 5226} {"train_loss": -26.760549545288086, "global_step": 433780, "epoch": 5226} {"train_loss": -26.69677734375, "global_step": 433781, "epoch": 5226} {"train_loss": -26.300962448120117, "global_step": 433782, "epoch": 5226} {"train_loss": -26.807519912719727, "global_step": 433783, "epoch": 5226} {"train_loss": -26.5466251373291, "global_step": 433784, "epoch": 5226} {"train_loss": -26.693323135375977, "global_step": 433785, "epoch": 5226} {"train_loss": -26.760862350463867, "global_step": 433786, "epoch": 5226} {"train_loss": -26.935327529907227, "global_step": 433787, "epoch": 5226} {"train_loss": -26.310504913330078, "global_step": 433788, "epoch": 5226} {"train_loss": -26.57000160217285, "global_step": 433789, "epoch": 5226} {"train_loss": -26.913040161132812, "global_step": 433790, "epoch": 5226} {"train_loss": -26.96400260925293, "global_step": 433791, "epoch": 5226} {"train_loss": -27.0727596282959, "global_step": 433792, "epoch": 5226} {"train_loss": -27.190153121948242, "global_step": 433793, "epoch": 5226} {"train_loss": -26.716522216796875, "global_step": 433794, "epoch": 5226} {"train_loss": -27.040374755859375, "global_step": 433795, "epoch": 5226} {"train_loss": -26.72271728515625, "global_step": 433796, "epoch": 5226} {"train_loss": -26.700164794921875, "global_step": 433797, "epoch": 5226} {"train_loss": -27.020170211791992, "global_step": 433798, "epoch": 5226} {"train_loss": -27.4920597076416, "global_step": 433799, "epoch": 5226} {"train_loss": -27.294397354125977, "global_step": 433800, "epoch": 5226} {"train_loss": -26.88520622253418, "global_step": 433801, "epoch": 5226} {"train_loss": -26.665517807006836, "global_step": 433802, "epoch": 5226} {"train_loss": -26.958511352539062, "global_step": 433803, "epoch": 5226} {"train_loss": -26.7415714263916, "global_step": 433804, "epoch": 5226} {"train_loss": -26.78896141052246, "global_step": 433805, "epoch": 5226} {"train_loss": -26.63156509399414, "global_step": 433806, "epoch": 5226} {"train_loss": -27.2731990814209, "global_step": 433807, "epoch": 5226} {"train_loss": -27.011676788330078, "global_step": 433808, "epoch": 5226} {"train_loss": -26.887231826782227, "global_step": 433809, "epoch": 5226} {"train_loss": -26.67828941345215, "global_step": 433810, "epoch": 5226} {"train_loss": -26.871713638305664, "global_step": 433811, "epoch": 5226} {"train_loss": -27.459287643432617, "global_step": 433812, "epoch": 5226} {"train_loss": -27.378448486328125, "global_step": 433813, "epoch": 5226} {"train_loss": -27.029972076416016, "global_step": 433814, "epoch": 5226} {"train_loss": -27.22503089904785, "global_step": 433815, "epoch": 5226} {"train_loss": -27.24228858947754, "global_step": 433816, "epoch": 5226} {"train_loss": -27.096052169799805, "global_step": 433817, "epoch": 5226} {"train_loss": -27.243085861206055, "global_step": 433818, "epoch": 5226} {"train_loss": -27.371490478515625, "global_step": 433819, "epoch": 5226} {"train_loss": -26.949682235717773, "global_step": 433820, "epoch": 5226} {"train_loss": -26.875823974609375, "global_step": 433821, "epoch": 5226} {"train_loss": -26.832483291625977, "global_step": 433822, "epoch": 5226} {"train_loss": -27.08001708984375, "global_step": 433823, "epoch": 5226} {"train_loss": -27.12729835510254, "global_step": 433824, "epoch": 5226} {"train_loss": -27.151174545288086, "global_step": 433825, "epoch": 5226} {"train_loss": -27.27516746520996, "global_step": 433826, "epoch": 5226} {"train_loss": -26.973896026611328, "global_step": 433827, "epoch": 5226} {"train_loss": -26.990243911743164, "global_step": 433828, "epoch": 5226} {"train_loss": -26.71803092956543, "global_step": 433829, "epoch": 5226} {"train_loss": -27.058149337768555, "global_step": 433830, "epoch": 5226} {"train_loss": -27.253433227539062, "global_step": 433831, "epoch": 5226} {"train_loss": -26.515857696533203, "global_step": 433832, "epoch": 5226} {"train_loss": -26.75571060180664, "global_step": 433833, "epoch": 5226} {"train_loss": -27.00336265563965, "global_step": 433834, "epoch": 5226} {"train_loss": -26.751678466796875, "global_step": 433835, "epoch": 5226} {"train_loss": -26.749364852905273, "global_step": 433836, "epoch": 5226} {"train_loss": -27.23469352722168, "global_step": 433837, "epoch": 5226} {"train_loss": -27.043121337890625, "global_step": 433838, "epoch": 5226} {"train_loss": -26.832157135009766, "global_step": 433839, "epoch": 5226} {"train_loss": -26.709376208753472, "global_step": 433840, "epoch": 5226, "val_loss": 6771372.0} {"train_loss": -26.441604614257812, "global_step": 433841, "epoch": 5227} {"train_loss": -26.72006607055664, "global_step": 433842, "epoch": 5227} {"train_loss": -25.607236862182617, "global_step": 433843, "epoch": 5227} {"train_loss": -26.376333236694336, "global_step": 433844, "epoch": 5227} {"train_loss": -25.79707145690918, "global_step": 433845, "epoch": 5227} {"train_loss": -26.308012008666992, "global_step": 433846, "epoch": 5227} {"train_loss": -26.680662155151367, "global_step": 433847, "epoch": 5227} {"train_loss": -25.880456924438477, "global_step": 433848, "epoch": 5227} {"train_loss": -26.337186813354492, "global_step": 433849, "epoch": 5227} {"train_loss": -25.91133689880371, "global_step": 433850, "epoch": 5227} {"train_loss": -25.721723556518555, "global_step": 433851, "epoch": 5227} {"train_loss": -26.070276260375977, "global_step": 433852, "epoch": 5227} {"train_loss": -26.118200302124023, "global_step": 433853, "epoch": 5227} {"train_loss": -26.2832088470459, "global_step": 433854, "epoch": 5227} {"train_loss": -26.542362213134766, "global_step": 433855, "epoch": 5227} {"train_loss": -26.336462020874023, "global_step": 433856, "epoch": 5227} {"train_loss": -26.2686710357666, "global_step": 433857, "epoch": 5227} {"train_loss": -26.344985961914062, "global_step": 433858, "epoch": 5227} {"train_loss": -26.08172607421875, "global_step": 433859, "epoch": 5227} {"train_loss": -26.48969078063965, "global_step": 433860, "epoch": 5227} {"train_loss": -26.476865768432617, "global_step": 433861, "epoch": 5227} {"train_loss": -26.469863891601562, "global_step": 433862, "epoch": 5227} {"train_loss": -26.796293258666992, "global_step": 433863, "epoch": 5227} {"train_loss": -26.528669357299805, "global_step": 433864, "epoch": 5227} {"train_loss": -26.47709083557129, "global_step": 433865, "epoch": 5227} {"train_loss": -26.93165397644043, "global_step": 433866, "epoch": 5227} {"train_loss": -27.031208038330078, "global_step": 433867, "epoch": 5227} {"train_loss": -26.875701904296875, "global_step": 433868, "epoch": 5227} {"train_loss": -26.67209815979004, "global_step": 433869, "epoch": 5227} {"train_loss": -26.8616943359375, "global_step": 433870, "epoch": 5227} {"train_loss": -26.60438346862793, "global_step": 433871, "epoch": 5227} {"train_loss": -26.78262710571289, "global_step": 433872, "epoch": 5227} {"train_loss": -27.148767471313477, "global_step": 433873, "epoch": 5227} {"train_loss": -26.398908615112305, "global_step": 433874, "epoch": 5227} {"train_loss": -26.700956344604492, "global_step": 433875, "epoch": 5227} {"train_loss": -26.829730987548828, "global_step": 433876, "epoch": 5227} {"train_loss": -26.611759185791016, "global_step": 433877, "epoch": 5227} {"train_loss": -26.788557052612305, "global_step": 433878, "epoch": 5227} {"train_loss": -27.039627075195312, "global_step": 433879, "epoch": 5227} {"train_loss": -27.26641273498535, "global_step": 433880, "epoch": 5227} {"train_loss": -26.81171226501465, "global_step": 433881, "epoch": 5227} {"train_loss": -27.192123413085938, "global_step": 433882, "epoch": 5227} {"train_loss": -26.952228546142578, "global_step": 433883, "epoch": 5227} {"train_loss": -26.748920440673828, "global_step": 433884, "epoch": 5227} {"train_loss": -27.171552658081055, "global_step": 433885, "epoch": 5227} {"train_loss": -26.872716903686523, "global_step": 433886, "epoch": 5227} {"train_loss": -27.10004234313965, "global_step": 433887, "epoch": 5227} {"train_loss": -26.85650062561035, "global_step": 433888, "epoch": 5227} {"train_loss": -27.190710067749023, "global_step": 433889, "epoch": 5227} {"train_loss": -27.12656593322754, "global_step": 433890, "epoch": 5227} {"train_loss": -27.0657958984375, "global_step": 433891, "epoch": 5227} {"train_loss": -27.41097068786621, "global_step": 433892, "epoch": 5227} {"train_loss": -27.141748428344727, "global_step": 433893, "epoch": 5227} {"train_loss": -26.62569236755371, "global_step": 433894, "epoch": 5227} {"train_loss": -26.716602325439453, "global_step": 433895, "epoch": 5227} {"train_loss": -27.02610206604004, "global_step": 433896, "epoch": 5227} {"train_loss": -26.9147891998291, "global_step": 433897, "epoch": 5227} {"train_loss": -26.772977828979492, "global_step": 433898, "epoch": 5227} {"train_loss": -27.159109115600586, "global_step": 433899, "epoch": 5227} {"train_loss": -26.74989128112793, "global_step": 433900, "epoch": 5227} {"train_loss": -26.93623161315918, "global_step": 433901, "epoch": 5227} {"train_loss": -26.74945640563965, "global_step": 433902, "epoch": 5227} {"train_loss": -27.15363883972168, "global_step": 433903, "epoch": 5227} {"train_loss": -26.605457305908203, "global_step": 433904, "epoch": 5227} {"train_loss": -26.92170524597168, "global_step": 433905, "epoch": 5227} {"train_loss": -27.10064125061035, "global_step": 433906, "epoch": 5227} {"train_loss": -26.770233154296875, "global_step": 433907, "epoch": 5227} {"train_loss": -27.10703468322754, "global_step": 433908, "epoch": 5227} {"train_loss": -26.9819393157959, "global_step": 433909, "epoch": 5227} {"train_loss": -26.867599487304688, "global_step": 433910, "epoch": 5227} {"train_loss": -26.214147567749023, "global_step": 433911, "epoch": 5227} {"train_loss": -25.528318405151367, "global_step": 433912, "epoch": 5227} {"train_loss": -25.0372257232666, "global_step": 433913, "epoch": 5227} {"train_loss": -25.875961303710938, "global_step": 433914, "epoch": 5227} {"train_loss": -26.22479248046875, "global_step": 433915, "epoch": 5227} {"train_loss": -26.61993408203125, "global_step": 433916, "epoch": 5227} {"train_loss": -26.425268173217773, "global_step": 433917, "epoch": 5227} {"train_loss": -26.17816734313965, "global_step": 433918, "epoch": 5227} {"train_loss": -26.781570434570312, "global_step": 433919, "epoch": 5227} {"train_loss": -26.43373680114746, "global_step": 433920, "epoch": 5227} {"train_loss": -26.765644073486328, "global_step": 433921, "epoch": 5227} {"train_loss": -26.51993179321289, "global_step": 433922, "epoch": 5227} {"train_loss": -26.633494572467114, "global_step": 433923, "epoch": 5227, "val_loss": 6743686.0} {"train_loss": -26.28509521484375, "global_step": 433924, "epoch": 5228} {"train_loss": -26.40741539001465, "global_step": 433925, "epoch": 5228} {"train_loss": -26.396839141845703, "global_step": 433926, "epoch": 5228} {"train_loss": -26.171512603759766, "global_step": 433927, "epoch": 5228} {"train_loss": -26.33054542541504, "global_step": 433928, "epoch": 5228} {"train_loss": -26.233245849609375, "global_step": 433929, "epoch": 5228} {"train_loss": -26.487096786499023, "global_step": 433930, "epoch": 5228} {"train_loss": -25.848920822143555, "global_step": 433931, "epoch": 5228} {"train_loss": -26.55848503112793, "global_step": 433932, "epoch": 5228} {"train_loss": -26.54971694946289, "global_step": 433933, "epoch": 5228} {"train_loss": -26.35113525390625, "global_step": 433934, "epoch": 5228} {"train_loss": -26.723852157592773, "global_step": 433935, "epoch": 5228} {"train_loss": -26.772592544555664, "global_step": 433936, "epoch": 5228} {"train_loss": -26.623687744140625, "global_step": 433937, "epoch": 5228} {"train_loss": -26.674978256225586, "global_step": 433938, "epoch": 5228} {"train_loss": -26.809192657470703, "global_step": 433939, "epoch": 5228} {"train_loss": -26.696533203125, "global_step": 433940, "epoch": 5228} {"train_loss": -26.510334014892578, "global_step": 433941, "epoch": 5228} {"train_loss": -26.869592666625977, "global_step": 433942, "epoch": 5228} {"train_loss": -26.863428115844727, "global_step": 433943, "epoch": 5228} {"train_loss": -27.06068992614746, "global_step": 433944, "epoch": 5228} {"train_loss": -26.602758407592773, "global_step": 433945, "epoch": 5228} {"train_loss": -27.032821655273438, "global_step": 433946, "epoch": 5228} {"train_loss": -27.06928062438965, "global_step": 433947, "epoch": 5228} {"train_loss": -27.13575553894043, "global_step": 433948, "epoch": 5228} {"train_loss": -26.965497970581055, "global_step": 433949, "epoch": 5228} {"train_loss": -26.8355770111084, "global_step": 433950, "epoch": 5228} {"train_loss": -26.61969566345215, "global_step": 433951, "epoch": 5228} {"train_loss": -27.12485122680664, "global_step": 433952, "epoch": 5228} {"train_loss": -26.57649040222168, "global_step": 433953, "epoch": 5228} {"train_loss": -27.25892448425293, "global_step": 433954, "epoch": 5228} {"train_loss": -27.39238929748535, "global_step": 433955, "epoch": 5228} {"train_loss": -27.000654220581055, "global_step": 433956, "epoch": 5228} {"train_loss": -26.978565216064453, "global_step": 433957, "epoch": 5228} {"train_loss": -26.858753204345703, "global_step": 433958, "epoch": 5228} {"train_loss": -27.138158798217773, "global_step": 433959, "epoch": 5228} {"train_loss": -26.761865615844727, "global_step": 433960, "epoch": 5228} {"train_loss": -27.080535888671875, "global_step": 433961, "epoch": 5228} {"train_loss": -26.97028923034668, "global_step": 433962, "epoch": 5228} {"train_loss": -26.85602378845215, "global_step": 433963, "epoch": 5228} {"train_loss": -27.345947265625, "global_step": 433964, "epoch": 5228} {"train_loss": -27.203123092651367, "global_step": 433965, "epoch": 5228} {"train_loss": -27.122650146484375, "global_step": 433966, "epoch": 5228} {"train_loss": -27.13917350769043, "global_step": 433967, "epoch": 5228} {"train_loss": -27.11385154724121, "global_step": 433968, "epoch": 5228} {"train_loss": -26.60114097595215, "global_step": 433969, "epoch": 5228} {"train_loss": -26.446374893188477, "global_step": 433970, "epoch": 5228} {"train_loss": -26.83038902282715, "global_step": 433971, "epoch": 5228} {"train_loss": -26.109628677368164, "global_step": 433972, "epoch": 5228} {"train_loss": -26.267139434814453, "global_step": 433973, "epoch": 5228} {"train_loss": -26.994001388549805, "global_step": 433974, "epoch": 5228} {"train_loss": -26.824359893798828, "global_step": 433975, "epoch": 5228} {"train_loss": -26.776508331298828, "global_step": 433976, "epoch": 5228} {"train_loss": -25.9368953704834, "global_step": 433977, "epoch": 5228} {"train_loss": -26.172016143798828, "global_step": 433978, "epoch": 5228} {"train_loss": -26.877765655517578, "global_step": 433979, "epoch": 5228} {"train_loss": -26.89615249633789, "global_step": 433980, "epoch": 5228} {"train_loss": -25.978479385375977, "global_step": 433981, "epoch": 5228} {"train_loss": -26.30938148498535, "global_step": 433982, "epoch": 5228} {"train_loss": -26.090978622436523, "global_step": 433983, "epoch": 5228} {"train_loss": -26.516599655151367, "global_step": 433984, "epoch": 5228} {"train_loss": -26.547088623046875, "global_step": 433985, "epoch": 5228} {"train_loss": -26.26140785217285, "global_step": 433986, "epoch": 5228} {"train_loss": -26.585657119750977, "global_step": 433987, "epoch": 5228} {"train_loss": -26.641571044921875, "global_step": 433988, "epoch": 5228} {"train_loss": -26.8250732421875, "global_step": 433989, "epoch": 5228} {"train_loss": -26.499841690063477, "global_step": 433990, "epoch": 5228} {"train_loss": -26.94354248046875, "global_step": 433991, "epoch": 5228} {"train_loss": -26.749042510986328, "global_step": 433992, "epoch": 5228} {"train_loss": -26.67397117614746, "global_step": 433993, "epoch": 5228} {"train_loss": -26.834142684936523, "global_step": 433994, "epoch": 5228} {"train_loss": -26.694555282592773, "global_step": 433995, "epoch": 5228} {"train_loss": -26.810169219970703, "global_step": 433996, "epoch": 5228} {"train_loss": -26.795230865478516, "global_step": 433997, "epoch": 5228} {"train_loss": -26.73272705078125, "global_step": 433998, "epoch": 5228} {"train_loss": -26.723499298095703, "global_step": 433999, "epoch": 5228} {"train_loss": -26.903959274291992, "global_step": 434000, "epoch": 5228} {"train_loss": -26.818572998046875, "global_step": 434001, "epoch": 5228} {"train_loss": -27.053308486938477, "global_step": 434002, "epoch": 5228} {"train_loss": -26.683557510375977, "global_step": 434003, "epoch": 5228} {"train_loss": -26.782712936401367, "global_step": 434004, "epoch": 5228} {"train_loss": -26.880722045898438, "global_step": 434005, "epoch": 5228} {"train_loss": -26.708011512296746, "global_step": 434006, "epoch": 5228, "val_loss": 6906816.0} {"train_loss": -26.177114486694336, "global_step": 434007, "epoch": 5229} {"train_loss": -26.728809356689453, "global_step": 434008, "epoch": 5229} {"train_loss": -26.147436141967773, "global_step": 434009, "epoch": 5229} {"train_loss": -25.899728775024414, "global_step": 434010, "epoch": 5229} {"train_loss": -26.09461784362793, "global_step": 434011, "epoch": 5229} {"train_loss": -26.72688102722168, "global_step": 434012, "epoch": 5229} {"train_loss": -26.61484718322754, "global_step": 434013, "epoch": 5229} {"train_loss": -26.434925079345703, "global_step": 434014, "epoch": 5229} {"train_loss": -26.79683494567871, "global_step": 434015, "epoch": 5229} {"train_loss": -26.43023681640625, "global_step": 434016, "epoch": 5229} {"train_loss": -26.97247886657715, "global_step": 434017, "epoch": 5229} {"train_loss": -26.58163833618164, "global_step": 434018, "epoch": 5229} {"train_loss": -26.302600860595703, "global_step": 434019, "epoch": 5229} {"train_loss": -26.394092559814453, "global_step": 434020, "epoch": 5229} {"train_loss": -26.5805606842041, "global_step": 434021, "epoch": 5229} {"train_loss": -26.726760864257812, "global_step": 434022, "epoch": 5229} {"train_loss": -26.96925163269043, "global_step": 434023, "epoch": 5229} {"train_loss": -26.646642684936523, "global_step": 434024, "epoch": 5229} {"train_loss": -26.540435791015625, "global_step": 434025, "epoch": 5229} {"train_loss": -26.619293212890625, "global_step": 434026, "epoch": 5229} {"train_loss": -26.75300407409668, "global_step": 434027, "epoch": 5229} {"train_loss": -26.71738052368164, "global_step": 434028, "epoch": 5229} {"train_loss": -26.825719833374023, "global_step": 434029, "epoch": 5229} {"train_loss": -26.958282470703125, "global_step": 434030, "epoch": 5229} {"train_loss": -27.124433517456055, "global_step": 434031, "epoch": 5229} {"train_loss": -26.594778060913086, "global_step": 434032, "epoch": 5229} {"train_loss": -27.042234420776367, "global_step": 434033, "epoch": 5229} {"train_loss": -27.17140007019043, "global_step": 434034, "epoch": 5229} {"train_loss": -27.182302474975586, "global_step": 434035, "epoch": 5229} {"train_loss": -26.978803634643555, "global_step": 434036, "epoch": 5229} {"train_loss": -26.673608779907227, "global_step": 434037, "epoch": 5229} {"train_loss": -26.77003288269043, "global_step": 434038, "epoch": 5229} {"train_loss": -27.313608169555664, "global_step": 434039, "epoch": 5229} {"train_loss": -27.22663688659668, "global_step": 434040, "epoch": 5229} {"train_loss": -27.112104415893555, "global_step": 434041, "epoch": 5229} {"train_loss": -27.032470703125, "global_step": 434042, "epoch": 5229} {"train_loss": -26.91273307800293, "global_step": 434043, "epoch": 5229} {"train_loss": -26.73193359375, "global_step": 434044, "epoch": 5229} {"train_loss": -27.000822067260742, "global_step": 434045, "epoch": 5229} {"train_loss": -26.805511474609375, "global_step": 434046, "epoch": 5229} {"train_loss": -26.884906768798828, "global_step": 434047, "epoch": 5229} {"train_loss": -26.962982177734375, "global_step": 434048, "epoch": 5229} {"train_loss": -26.683683395385742, "global_step": 434049, "epoch": 5229} {"train_loss": -26.742843627929688, "global_step": 434050, "epoch": 5229} {"train_loss": -26.540756225585938, "global_step": 434051, "epoch": 5229} {"train_loss": -26.873706817626953, "global_step": 434052, "epoch": 5229} {"train_loss": -27.152576446533203, "global_step": 434053, "epoch": 5229} {"train_loss": -27.003957748413086, "global_step": 434054, "epoch": 5229} {"train_loss": -27.026153564453125, "global_step": 434055, "epoch": 5229} {"train_loss": -26.5006103515625, "global_step": 434056, "epoch": 5229} {"train_loss": -26.738178253173828, "global_step": 434057, "epoch": 5229} {"train_loss": -27.470260620117188, "global_step": 434058, "epoch": 5229} {"train_loss": -27.260343551635742, "global_step": 434059, "epoch": 5229} {"train_loss": -26.71315574645996, "global_step": 434060, "epoch": 5229} {"train_loss": -27.099308013916016, "global_step": 434061, "epoch": 5229} {"train_loss": -27.115646362304688, "global_step": 434062, "epoch": 5229} {"train_loss": -26.82175064086914, "global_step": 434063, "epoch": 5229} {"train_loss": -26.8112735748291, "global_step": 434064, "epoch": 5229} {"train_loss": -27.10123062133789, "global_step": 434065, "epoch": 5229} {"train_loss": -26.797388076782227, "global_step": 434066, "epoch": 5229} {"train_loss": -26.295957565307617, "global_step": 434067, "epoch": 5229} {"train_loss": -26.836593627929688, "global_step": 434068, "epoch": 5229} {"train_loss": -26.497867584228516, "global_step": 434069, "epoch": 5229} {"train_loss": -26.991870880126953, "global_step": 434070, "epoch": 5229} {"train_loss": -26.688520431518555, "global_step": 434071, "epoch": 5229} {"train_loss": -26.964157104492188, "global_step": 434072, "epoch": 5229} {"train_loss": -26.921401977539062, "global_step": 434073, "epoch": 5229} {"train_loss": -27.217554092407227, "global_step": 434074, "epoch": 5229} {"train_loss": -27.097314834594727, "global_step": 434075, "epoch": 5229} {"train_loss": -27.035480499267578, "global_step": 434076, "epoch": 5229} {"train_loss": -26.933216094970703, "global_step": 434077, "epoch": 5229} {"train_loss": -27.088809967041016, "global_step": 434078, "epoch": 5229} {"train_loss": -26.71784019470215, "global_step": 434079, "epoch": 5229} {"train_loss": -26.386306762695312, "global_step": 434080, "epoch": 5229} {"train_loss": -26.8345890045166, "global_step": 434081, "epoch": 5229} {"train_loss": -27.067163467407227, "global_step": 434082, "epoch": 5229} {"train_loss": -27.00095558166504, "global_step": 434083, "epoch": 5229} {"train_loss": -27.021808624267578, "global_step": 434084, "epoch": 5229} {"train_loss": -26.995092391967773, "global_step": 434085, "epoch": 5229} {"train_loss": -26.64628028869629, "global_step": 434086, "epoch": 5229} {"train_loss": -26.797189712524414, "global_step": 434087, "epoch": 5229} {"train_loss": -27.35051918029785, "global_step": 434088, "epoch": 5229} {"train_loss": -26.808755897613892, "global_step": 434089, "epoch": 5229, "val_loss": 6642641.5} {"train_loss": -26.027624130249023, "global_step": 434090, "epoch": 5230} {"train_loss": -26.208337783813477, "global_step": 434091, "epoch": 5230} {"train_loss": -26.266687393188477, "global_step": 434092, "epoch": 5230} {"train_loss": -26.002548217773438, "global_step": 434093, "epoch": 5230} {"train_loss": -26.076324462890625, "global_step": 434094, "epoch": 5230} {"train_loss": -26.620580673217773, "global_step": 434095, "epoch": 5230} {"train_loss": -26.0407772064209, "global_step": 434096, "epoch": 5230} {"train_loss": -26.501617431640625, "global_step": 434097, "epoch": 5230} {"train_loss": -26.5434627532959, "global_step": 434098, "epoch": 5230} {"train_loss": -26.4071102142334, "global_step": 434099, "epoch": 5230} {"train_loss": -25.975473403930664, "global_step": 434100, "epoch": 5230} {"train_loss": -26.553955078125, "global_step": 434101, "epoch": 5230} {"train_loss": -26.269317626953125, "global_step": 434102, "epoch": 5230} {"train_loss": -26.567968368530273, "global_step": 434103, "epoch": 5230} {"train_loss": -25.955657958984375, "global_step": 434104, "epoch": 5230} {"train_loss": -26.45229148864746, "global_step": 434105, "epoch": 5230} {"train_loss": -26.377187728881836, "global_step": 434106, "epoch": 5230} {"train_loss": -26.60239601135254, "global_step": 434107, "epoch": 5230} {"train_loss": -26.50537109375, "global_step": 434108, "epoch": 5230} {"train_loss": -26.46156120300293, "global_step": 434109, "epoch": 5230} {"train_loss": -26.634443283081055, "global_step": 434110, "epoch": 5230} {"train_loss": -26.34956169128418, "global_step": 434111, "epoch": 5230} {"train_loss": -26.942975997924805, "global_step": 434112, "epoch": 5230} {"train_loss": -26.755762100219727, "global_step": 434113, "epoch": 5230} {"train_loss": -26.96982192993164, "global_step": 434114, "epoch": 5230} {"train_loss": -26.7240047454834, "global_step": 434115, "epoch": 5230} {"train_loss": -26.877126693725586, "global_step": 434116, "epoch": 5230} {"train_loss": -26.639368057250977, "global_step": 434117, "epoch": 5230} {"train_loss": -27.182477951049805, "global_step": 434118, "epoch": 5230} {"train_loss": -26.775989532470703, "global_step": 434119, "epoch": 5230} {"train_loss": -27.08575439453125, "global_step": 434120, "epoch": 5230} {"train_loss": -27.091236114501953, "global_step": 434121, "epoch": 5230} {"train_loss": -26.433807373046875, "global_step": 434122, "epoch": 5230} {"train_loss": -27.000518798828125, "global_step": 434123, "epoch": 5230} {"train_loss": -26.703144073486328, "global_step": 434124, "epoch": 5230} {"train_loss": -26.912872314453125, "global_step": 434125, "epoch": 5230} {"train_loss": -26.728504180908203, "global_step": 434126, "epoch": 5230} {"train_loss": -27.24834632873535, "global_step": 434127, "epoch": 5230} {"train_loss": -27.062585830688477, "global_step": 434128, "epoch": 5230} {"train_loss": -27.054767608642578, "global_step": 434129, "epoch": 5230} {"train_loss": -26.600317001342773, "global_step": 434130, "epoch": 5230} {"train_loss": -26.895401000976562, "global_step": 434131, "epoch": 5230} {"train_loss": -26.755029678344727, "global_step": 434132, "epoch": 5230} {"train_loss": -27.050689697265625, "global_step": 434133, "epoch": 5230} {"train_loss": -27.0007266998291, "global_step": 434134, "epoch": 5230} {"train_loss": -27.158308029174805, "global_step": 434135, "epoch": 5230} {"train_loss": -26.605478286743164, "global_step": 434136, "epoch": 5230} {"train_loss": -27.334665298461914, "global_step": 434137, "epoch": 5230} {"train_loss": -26.711645126342773, "global_step": 434138, "epoch": 5230} {"train_loss": -27.25001335144043, "global_step": 434139, "epoch": 5230} {"train_loss": -27.057714462280273, "global_step": 434140, "epoch": 5230} {"train_loss": -26.838647842407227, "global_step": 434141, "epoch": 5230} {"train_loss": -26.956501007080078, "global_step": 434142, "epoch": 5230} {"train_loss": -26.982572555541992, "global_step": 434143, "epoch": 5230} {"train_loss": -26.668720245361328, "global_step": 434144, "epoch": 5230} {"train_loss": -26.629119873046875, "global_step": 434145, "epoch": 5230} {"train_loss": -26.742145538330078, "global_step": 434146, "epoch": 5230} {"train_loss": -26.975574493408203, "global_step": 434147, "epoch": 5230} {"train_loss": -27.29987144470215, "global_step": 434148, "epoch": 5230} {"train_loss": -26.77703285217285, "global_step": 434149, "epoch": 5230} {"train_loss": -26.791357040405273, "global_step": 434150, "epoch": 5230} {"train_loss": -26.39788818359375, "global_step": 434151, "epoch": 5230} {"train_loss": -26.925634384155273, "global_step": 434152, "epoch": 5230} {"train_loss": -27.273771286010742, "global_step": 434153, "epoch": 5230} {"train_loss": -27.04951286315918, "global_step": 434154, "epoch": 5230} {"train_loss": -26.87590980529785, "global_step": 434155, "epoch": 5230} {"train_loss": -26.233325958251953, "global_step": 434156, "epoch": 5230} {"train_loss": -27.1680908203125, "global_step": 434157, "epoch": 5230} {"train_loss": -27.08920669555664, "global_step": 434158, "epoch": 5230} {"train_loss": -26.754220962524414, "global_step": 434159, "epoch": 5230} {"train_loss": -26.75111198425293, "global_step": 434160, "epoch": 5230} {"train_loss": -27.08721923828125, "global_step": 434161, "epoch": 5230} {"train_loss": -26.946399688720703, "global_step": 434162, "epoch": 5230} {"train_loss": -26.9903621673584, "global_step": 434163, "epoch": 5230} {"train_loss": -27.187274932861328, "global_step": 434164, "epoch": 5230} {"train_loss": -26.89676856994629, "global_step": 434165, "epoch": 5230} {"train_loss": -26.883039474487305, "global_step": 434166, "epoch": 5230} {"train_loss": -26.961816787719727, "global_step": 434167, "epoch": 5230} {"train_loss": -26.95966148376465, "global_step": 434168, "epoch": 5230} {"train_loss": -27.171716690063477, "global_step": 434169, "epoch": 5230} {"train_loss": -27.389524459838867, "global_step": 434170, "epoch": 5230} {"train_loss": -26.827741622924805, "global_step": 434171, "epoch": 5230} {"train_loss": -26.776584969945702, "global_step": 434172, "epoch": 5230, "val_loss": 6634810.5} {"train_loss": -26.234708786010742, "global_step": 434173, "epoch": 5231} {"train_loss": -26.0142765045166, "global_step": 434174, "epoch": 5231} {"train_loss": -26.408893585205078, "global_step": 434175, "epoch": 5231} {"train_loss": -26.5434627532959, "global_step": 434176, "epoch": 5231} {"train_loss": -25.586145401000977, "global_step": 434177, "epoch": 5231} {"train_loss": -25.496965408325195, "global_step": 434178, "epoch": 5231} {"train_loss": -26.109792709350586, "global_step": 434179, "epoch": 5231} {"train_loss": -26.631256103515625, "global_step": 434180, "epoch": 5231} {"train_loss": -25.892663955688477, "global_step": 434181, "epoch": 5231} {"train_loss": -26.822742462158203, "global_step": 434182, "epoch": 5231} {"train_loss": -26.411352157592773, "global_step": 434183, "epoch": 5231} {"train_loss": -26.55365562438965, "global_step": 434184, "epoch": 5231} {"train_loss": -25.977771759033203, "global_step": 434185, "epoch": 5231} {"train_loss": -26.405466079711914, "global_step": 434186, "epoch": 5231} {"train_loss": -26.141935348510742, "global_step": 434187, "epoch": 5231} {"train_loss": -26.690114974975586, "global_step": 434188, "epoch": 5231} {"train_loss": -26.42974281311035, "global_step": 434189, "epoch": 5231} {"train_loss": -26.585805892944336, "global_step": 434190, "epoch": 5231} {"train_loss": -26.620508193969727, "global_step": 434191, "epoch": 5231} {"train_loss": -26.946279525756836, "global_step": 434192, "epoch": 5231} {"train_loss": -26.516712188720703, "global_step": 434193, "epoch": 5231} {"train_loss": -26.660070419311523, "global_step": 434194, "epoch": 5231} {"train_loss": -26.70461082458496, "global_step": 434195, "epoch": 5231} {"train_loss": -26.5689640045166, "global_step": 434196, "epoch": 5231} {"train_loss": -26.983097076416016, "global_step": 434197, "epoch": 5231} {"train_loss": -26.974035263061523, "global_step": 434198, "epoch": 5231} {"train_loss": -26.178022384643555, "global_step": 434199, "epoch": 5231} {"train_loss": -26.456640243530273, "global_step": 434200, "epoch": 5231} {"train_loss": -26.61600112915039, "global_step": 434201, "epoch": 5231} {"train_loss": -26.57919692993164, "global_step": 434202, "epoch": 5231} {"train_loss": -26.86771583557129, "global_step": 434203, "epoch": 5231} {"train_loss": -26.995685577392578, "global_step": 434204, "epoch": 5231} {"train_loss": -26.40448570251465, "global_step": 434205, "epoch": 5231} {"train_loss": -26.811386108398438, "global_step": 434206, "epoch": 5231} {"train_loss": -26.94449806213379, "global_step": 434207, "epoch": 5231} {"train_loss": -26.866931915283203, "global_step": 434208, "epoch": 5231} {"train_loss": -27.364240646362305, "global_step": 434209, "epoch": 5231} {"train_loss": -26.83492088317871, "global_step": 434210, "epoch": 5231} {"train_loss": -26.849353790283203, "global_step": 434211, "epoch": 5231} {"train_loss": -26.876317977905273, "global_step": 434212, "epoch": 5231} {"train_loss": -26.900054931640625, "global_step": 434213, "epoch": 5231} {"train_loss": -26.761768341064453, "global_step": 434214, "epoch": 5231} {"train_loss": -26.795684814453125, "global_step": 434215, "epoch": 5231} {"train_loss": -26.966114044189453, "global_step": 434216, "epoch": 5231} {"train_loss": -27.08652114868164, "global_step": 434217, "epoch": 5231} {"train_loss": -26.958820343017578, "global_step": 434218, "epoch": 5231} {"train_loss": -26.741180419921875, "global_step": 434219, "epoch": 5231} {"train_loss": -27.099884033203125, "global_step": 434220, "epoch": 5231} {"train_loss": -26.952529907226562, "global_step": 434221, "epoch": 5231} {"train_loss": -27.05177116394043, "global_step": 434222, "epoch": 5231} {"train_loss": -26.789243698120117, "global_step": 434223, "epoch": 5231} {"train_loss": -26.8066349029541, "global_step": 434224, "epoch": 5231} {"train_loss": -26.862287521362305, "global_step": 434225, "epoch": 5231} {"train_loss": -27.274587631225586, "global_step": 434226, "epoch": 5231} {"train_loss": -27.049665451049805, "global_step": 434227, "epoch": 5231} {"train_loss": -26.791173934936523, "global_step": 434228, "epoch": 5231} {"train_loss": -26.9007625579834, "global_step": 434229, "epoch": 5231} {"train_loss": -26.815214157104492, "global_step": 434230, "epoch": 5231} {"train_loss": -27.318567276000977, "global_step": 434231, "epoch": 5231} {"train_loss": -27.427692413330078, "global_step": 434232, "epoch": 5231} {"train_loss": -27.346036911010742, "global_step": 434233, "epoch": 5231} {"train_loss": -26.496137619018555, "global_step": 434234, "epoch": 5231} {"train_loss": -26.974536895751953, "global_step": 434235, "epoch": 5231} {"train_loss": -26.847055435180664, "global_step": 434236, "epoch": 5231} {"train_loss": -26.645187377929688, "global_step": 434237, "epoch": 5231} {"train_loss": -26.867786407470703, "global_step": 434238, "epoch": 5231} {"train_loss": -26.743764877319336, "global_step": 434239, "epoch": 5231} {"train_loss": -26.626510620117188, "global_step": 434240, "epoch": 5231} {"train_loss": -27.024871826171875, "global_step": 434241, "epoch": 5231} {"train_loss": -27.097599029541016, "global_step": 434242, "epoch": 5231} {"train_loss": -26.636093139648438, "global_step": 434243, "epoch": 5231} {"train_loss": -27.1189022064209, "global_step": 434244, "epoch": 5231} {"train_loss": -27.108083724975586, "global_step": 434245, "epoch": 5231} {"train_loss": -26.879104614257812, "global_step": 434246, "epoch": 5231} {"train_loss": -26.60283851623535, "global_step": 434247, "epoch": 5231} {"train_loss": -27.068395614624023, "global_step": 434248, "epoch": 5231} {"train_loss": -26.817472457885742, "global_step": 434249, "epoch": 5231} {"train_loss": -27.04706382751465, "global_step": 434250, "epoch": 5231} {"train_loss": -27.279834747314453, "global_step": 434251, "epoch": 5231} {"train_loss": -27.22565269470215, "global_step": 434252, "epoch": 5231} {"train_loss": -26.776132583618164, "global_step": 434253, "epoch": 5231} {"train_loss": -26.799524307250977, "global_step": 434254, "epoch": 5231} {"train_loss": -26.749798579388354, "global_step": 434255, "epoch": 5231, "val_loss": 6759749.0} {"train_loss": -26.378881454467773, "global_step": 434256, "epoch": 5232} {"train_loss": -26.1734676361084, "global_step": 434257, "epoch": 5232} {"train_loss": -26.425703048706055, "global_step": 434258, "epoch": 5232} {"train_loss": -26.45423698425293, "global_step": 434259, "epoch": 5232} {"train_loss": -26.378976821899414, "global_step": 434260, "epoch": 5232} {"train_loss": -26.417587280273438, "global_step": 434261, "epoch": 5232} {"train_loss": -26.418289184570312, "global_step": 434262, "epoch": 5232} {"train_loss": -26.85751724243164, "global_step": 434263, "epoch": 5232} {"train_loss": -26.652185440063477, "global_step": 434264, "epoch": 5232} {"train_loss": -26.746679306030273, "global_step": 434265, "epoch": 5232} {"train_loss": -26.947803497314453, "global_step": 434266, "epoch": 5232} {"train_loss": -26.80999183654785, "global_step": 434267, "epoch": 5232} {"train_loss": -26.970447540283203, "global_step": 434268, "epoch": 5232} {"train_loss": -26.341093063354492, "global_step": 434269, "epoch": 5232} {"train_loss": -26.91205406188965, "global_step": 434270, "epoch": 5232} {"train_loss": -26.79378318786621, "global_step": 434271, "epoch": 5232} {"train_loss": -26.843280792236328, "global_step": 434272, "epoch": 5232} {"train_loss": -26.951160430908203, "global_step": 434273, "epoch": 5232} {"train_loss": -26.667226791381836, "global_step": 434274, "epoch": 5232} {"train_loss": -26.77202796936035, "global_step": 434275, "epoch": 5232} {"train_loss": -26.91558265686035, "global_step": 434276, "epoch": 5232} {"train_loss": -26.916717529296875, "global_step": 434277, "epoch": 5232} {"train_loss": -27.01869010925293, "global_step": 434278, "epoch": 5232} {"train_loss": -26.993457794189453, "global_step": 434279, "epoch": 5232} {"train_loss": -27.028539657592773, "global_step": 434280, "epoch": 5232} {"train_loss": -27.012914657592773, "global_step": 434281, "epoch": 5232} {"train_loss": -27.021142959594727, "global_step": 434282, "epoch": 5232} {"train_loss": -27.0830135345459, "global_step": 434283, "epoch": 5232} {"train_loss": -26.89912223815918, "global_step": 434284, "epoch": 5232} {"train_loss": -26.936307907104492, "global_step": 434285, "epoch": 5232} {"train_loss": -27.386945724487305, "global_step": 434286, "epoch": 5232} {"train_loss": -26.858978271484375, "global_step": 434287, "epoch": 5232} {"train_loss": -27.010705947875977, "global_step": 434288, "epoch": 5232} {"train_loss": -26.775861740112305, "global_step": 434289, "epoch": 5232} {"train_loss": -27.215967178344727, "global_step": 434290, "epoch": 5232} {"train_loss": -27.014135360717773, "global_step": 434291, "epoch": 5232} {"train_loss": -26.890777587890625, "global_step": 434292, "epoch": 5232} {"train_loss": -27.000986099243164, "global_step": 434293, "epoch": 5232} {"train_loss": -26.62820816040039, "global_step": 434294, "epoch": 5232} {"train_loss": -27.019987106323242, "global_step": 434295, "epoch": 5232} {"train_loss": -26.867624282836914, "global_step": 434296, "epoch": 5232} {"train_loss": -27.071090698242188, "global_step": 434297, "epoch": 5232} {"train_loss": -26.9548282623291, "global_step": 434298, "epoch": 5232} {"train_loss": -27.04530143737793, "global_step": 434299, "epoch": 5232} {"train_loss": -27.206756591796875, "global_step": 434300, "epoch": 5232} {"train_loss": -27.450794219970703, "global_step": 434301, "epoch": 5232} {"train_loss": -27.11935806274414, "global_step": 434302, "epoch": 5232} {"train_loss": -26.4726505279541, "global_step": 434303, "epoch": 5232} {"train_loss": -27.205236434936523, "global_step": 434304, "epoch": 5232} {"train_loss": -26.7213077545166, "global_step": 434305, "epoch": 5232} {"train_loss": -26.926136016845703, "global_step": 434306, "epoch": 5232} {"train_loss": -26.581939697265625, "global_step": 434307, "epoch": 5232} {"train_loss": -26.742761611938477, "global_step": 434308, "epoch": 5232} {"train_loss": -26.497650146484375, "global_step": 434309, "epoch": 5232} {"train_loss": -26.523298263549805, "global_step": 434310, "epoch": 5232} {"train_loss": -26.65410804748535, "global_step": 434311, "epoch": 5232} {"train_loss": -26.80466079711914, "global_step": 434312, "epoch": 5232} {"train_loss": -26.632659912109375, "global_step": 434313, "epoch": 5232} {"train_loss": -26.799795150756836, "global_step": 434314, "epoch": 5232} {"train_loss": -27.148252487182617, "global_step": 434315, "epoch": 5232} {"train_loss": -26.649789810180664, "global_step": 434316, "epoch": 5232} {"train_loss": -26.903644561767578, "global_step": 434317, "epoch": 5232} {"train_loss": -27.101049423217773, "global_step": 434318, "epoch": 5232} {"train_loss": -26.93937110900879, "global_step": 434319, "epoch": 5232} {"train_loss": -26.6678524017334, "global_step": 434320, "epoch": 5232} {"train_loss": -26.66387939453125, "global_step": 434321, "epoch": 5232} {"train_loss": -27.1933650970459, "global_step": 434322, "epoch": 5232} {"train_loss": -26.667896270751953, "global_step": 434323, "epoch": 5232} {"train_loss": -27.113788604736328, "global_step": 434324, "epoch": 5232} {"train_loss": -26.703887939453125, "global_step": 434325, "epoch": 5232} {"train_loss": -26.53169059753418, "global_step": 434326, "epoch": 5232} {"train_loss": -26.370878219604492, "global_step": 434327, "epoch": 5232} {"train_loss": -26.424884796142578, "global_step": 434328, "epoch": 5232} {"train_loss": -26.67133903503418, "global_step": 434329, "epoch": 5232} {"train_loss": -26.6792049407959, "global_step": 434330, "epoch": 5232} {"train_loss": -26.91729164123535, "global_step": 434331, "epoch": 5232} {"train_loss": -27.1428279876709, "global_step": 434332, "epoch": 5232} {"train_loss": -26.960346221923828, "global_step": 434333, "epoch": 5232} {"train_loss": -26.764739990234375, "global_step": 434334, "epoch": 5232} {"train_loss": -26.484384536743164, "global_step": 434335, "epoch": 5232} {"train_loss": -26.8192195892334, "global_step": 434336, "epoch": 5232} {"train_loss": -26.348974227905273, "global_step": 434337, "epoch": 5232} {"train_loss": -26.807225055005176, "global_step": 434338, "epoch": 5232, "val_loss": 6779769.0} {"train_loss": -25.91266441345215, "global_step": 434339, "epoch": 5233} {"train_loss": -26.44404411315918, "global_step": 434340, "epoch": 5233} {"train_loss": -26.70379638671875, "global_step": 434341, "epoch": 5233} {"train_loss": -26.9217529296875, "global_step": 434342, "epoch": 5233} {"train_loss": -26.83208656311035, "global_step": 434343, "epoch": 5233} {"train_loss": -27.0789852142334, "global_step": 434344, "epoch": 5233} {"train_loss": -26.795324325561523, "global_step": 434345, "epoch": 5233} {"train_loss": -26.939847946166992, "global_step": 434346, "epoch": 5233} {"train_loss": -26.58890151977539, "global_step": 434347, "epoch": 5233} {"train_loss": -27.07989501953125, "global_step": 434348, "epoch": 5233} {"train_loss": -26.996938705444336, "global_step": 434349, "epoch": 5233} {"train_loss": -26.452564239501953, "global_step": 434350, "epoch": 5233} {"train_loss": -26.46637535095215, "global_step": 434351, "epoch": 5233} {"train_loss": -26.548812866210938, "global_step": 434352, "epoch": 5233} {"train_loss": -26.767932891845703, "global_step": 434353, "epoch": 5233} {"train_loss": -26.904077529907227, "global_step": 434354, "epoch": 5233} {"train_loss": -26.614789962768555, "global_step": 434355, "epoch": 5233} {"train_loss": -27.0369873046875, "global_step": 434356, "epoch": 5233} {"train_loss": -26.693601608276367, "global_step": 434357, "epoch": 5233} {"train_loss": -27.137353897094727, "global_step": 434358, "epoch": 5233} {"train_loss": -26.684783935546875, "global_step": 434359, "epoch": 5233} {"train_loss": -26.83475685119629, "global_step": 434360, "epoch": 5233} {"train_loss": -27.0836238861084, "global_step": 434361, "epoch": 5233} {"train_loss": -26.90229606628418, "global_step": 434362, "epoch": 5233} {"train_loss": -26.466825485229492, "global_step": 434363, "epoch": 5233} {"train_loss": -26.71771812438965, "global_step": 434364, "epoch": 5233} {"train_loss": -26.959476470947266, "global_step": 434365, "epoch": 5233} {"train_loss": -27.00146484375, "global_step": 434366, "epoch": 5233} {"train_loss": -26.777912139892578, "global_step": 434367, "epoch": 5233} {"train_loss": -26.885501861572266, "global_step": 434368, "epoch": 5233} {"train_loss": -26.91996192932129, "global_step": 434369, "epoch": 5233} {"train_loss": -26.94817543029785, "global_step": 434370, "epoch": 5233} {"train_loss": -26.731958389282227, "global_step": 434371, "epoch": 5233} {"train_loss": -26.513690948486328, "global_step": 434372, "epoch": 5233} {"train_loss": -26.919391632080078, "global_step": 434373, "epoch": 5233} {"train_loss": -26.776092529296875, "global_step": 434374, "epoch": 5233} {"train_loss": -27.2523136138916, "global_step": 434375, "epoch": 5233} {"train_loss": -26.737628936767578, "global_step": 434376, "epoch": 5233} {"train_loss": -27.143524169921875, "global_step": 434377, "epoch": 5233} {"train_loss": -26.989398956298828, "global_step": 434378, "epoch": 5233} {"train_loss": -27.044769287109375, "global_step": 434379, "epoch": 5233} {"train_loss": -27.439146041870117, "global_step": 434380, "epoch": 5233} {"train_loss": -26.94879722595215, "global_step": 434381, "epoch": 5233} {"train_loss": -27.14141845703125, "global_step": 434382, "epoch": 5233} {"train_loss": -27.00848960876465, "global_step": 434383, "epoch": 5233} {"train_loss": -27.22586441040039, "global_step": 434384, "epoch": 5233} {"train_loss": -26.897546768188477, "global_step": 434385, "epoch": 5233} {"train_loss": -26.66228675842285, "global_step": 434386, "epoch": 5233} {"train_loss": -26.682950973510742, "global_step": 434387, "epoch": 5233} {"train_loss": -26.94073486328125, "global_step": 434388, "epoch": 5233} {"train_loss": -26.905797958374023, "global_step": 434389, "epoch": 5233} {"train_loss": -26.792572021484375, "global_step": 434390, "epoch": 5233} {"train_loss": -27.0162353515625, "global_step": 434391, "epoch": 5233} {"train_loss": -27.246353149414062, "global_step": 434392, "epoch": 5233} {"train_loss": -26.821914672851562, "global_step": 434393, "epoch": 5233} {"train_loss": -26.89912986755371, "global_step": 434394, "epoch": 5233} {"train_loss": -26.98723793029785, "global_step": 434395, "epoch": 5233} {"train_loss": -27.113561630249023, "global_step": 434396, "epoch": 5233} {"train_loss": -26.903242111206055, "global_step": 434397, "epoch": 5233} {"train_loss": -26.72756004333496, "global_step": 434398, "epoch": 5233} {"train_loss": -26.694238662719727, "global_step": 434399, "epoch": 5233} {"train_loss": -27.007787704467773, "global_step": 434400, "epoch": 5233} {"train_loss": -26.721994400024414, "global_step": 434401, "epoch": 5233} {"train_loss": -26.916614532470703, "global_step": 434402, "epoch": 5233} {"train_loss": -26.845502853393555, "global_step": 434403, "epoch": 5233} {"train_loss": -26.6007080078125, "global_step": 434404, "epoch": 5233} {"train_loss": -26.994125366210938, "global_step": 434405, "epoch": 5233} {"train_loss": -26.28548240661621, "global_step": 434406, "epoch": 5233} {"train_loss": -26.19586753845215, "global_step": 434407, "epoch": 5233} {"train_loss": -26.832427978515625, "global_step": 434408, "epoch": 5233} {"train_loss": -26.52760124206543, "global_step": 434409, "epoch": 5233} {"train_loss": -26.404499053955078, "global_step": 434410, "epoch": 5233} {"train_loss": -26.834197998046875, "global_step": 434411, "epoch": 5233} {"train_loss": -26.418731689453125, "global_step": 434412, "epoch": 5233} {"train_loss": -26.146841049194336, "global_step": 434413, "epoch": 5233} {"train_loss": -26.764087677001953, "global_step": 434414, "epoch": 5233} {"train_loss": -26.707599639892578, "global_step": 434415, "epoch": 5233} {"train_loss": -26.577741622924805, "global_step": 434416, "epoch": 5233} {"train_loss": -26.75957679748535, "global_step": 434417, "epoch": 5233} {"train_loss": -26.631078720092773, "global_step": 434418, "epoch": 5233} {"train_loss": -26.618579864501953, "global_step": 434419, "epoch": 5233} {"train_loss": -26.86846351623535, "global_step": 434420, "epoch": 5233} {"train_loss": -26.795592618275837, "global_step": 434421, "epoch": 5233, "val_loss": 6597132.5} {"train_loss": -26.394948959350586, "global_step": 434422, "epoch": 5234} {"train_loss": -25.424650192260742, "global_step": 434423, "epoch": 5234} {"train_loss": -25.917699813842773, "global_step": 434424, "epoch": 5234} {"train_loss": -25.9052791595459, "global_step": 434425, "epoch": 5234} {"train_loss": -24.363479614257812, "global_step": 434426, "epoch": 5234} {"train_loss": -25.364978790283203, "global_step": 434427, "epoch": 5234} {"train_loss": -25.641077041625977, "global_step": 434428, "epoch": 5234} {"train_loss": -25.5699405670166, "global_step": 434429, "epoch": 5234} {"train_loss": -26.475421905517578, "global_step": 434430, "epoch": 5234} {"train_loss": -26.22701072692871, "global_step": 434431, "epoch": 5234} {"train_loss": -25.99308204650879, "global_step": 434432, "epoch": 5234} {"train_loss": -26.19809341430664, "global_step": 434433, "epoch": 5234} {"train_loss": -26.026899337768555, "global_step": 434434, "epoch": 5234} {"train_loss": -26.240859985351562, "global_step": 434435, "epoch": 5234} {"train_loss": -26.110488891601562, "global_step": 434436, "epoch": 5234} {"train_loss": -26.847522735595703, "global_step": 434437, "epoch": 5234} {"train_loss": -26.54862403869629, "global_step": 434438, "epoch": 5234} {"train_loss": -26.44814109802246, "global_step": 434439, "epoch": 5234} {"train_loss": -26.566320419311523, "global_step": 434440, "epoch": 5234} {"train_loss": -26.260868072509766, "global_step": 434441, "epoch": 5234} {"train_loss": -26.822046279907227, "global_step": 434442, "epoch": 5234} {"train_loss": -26.147232055664062, "global_step": 434443, "epoch": 5234} {"train_loss": -26.94916343688965, "global_step": 434444, "epoch": 5234} {"train_loss": -26.620010375976562, "global_step": 434445, "epoch": 5234} {"train_loss": -26.71811866760254, "global_step": 434446, "epoch": 5234} {"train_loss": -26.75382423400879, "global_step": 434447, "epoch": 5234} {"train_loss": -26.675058364868164, "global_step": 434448, "epoch": 5234} {"train_loss": -26.349287033081055, "global_step": 434449, "epoch": 5234} {"train_loss": -26.339773178100586, "global_step": 434450, "epoch": 5234} {"train_loss": -26.996618270874023, "global_step": 434451, "epoch": 5234} {"train_loss": -27.059946060180664, "global_step": 434452, "epoch": 5234} {"train_loss": -26.679914474487305, "global_step": 434453, "epoch": 5234} {"train_loss": -26.650476455688477, "global_step": 434454, "epoch": 5234} {"train_loss": -26.948251724243164, "global_step": 434455, "epoch": 5234} {"train_loss": -26.549442291259766, "global_step": 434456, "epoch": 5234} {"train_loss": -26.956884384155273, "global_step": 434457, "epoch": 5234} {"train_loss": -26.845434188842773, "global_step": 434458, "epoch": 5234} {"train_loss": -26.761188507080078, "global_step": 434459, "epoch": 5234} {"train_loss": -26.723804473876953, "global_step": 434460, "epoch": 5234} {"train_loss": -27.09634780883789, "global_step": 434461, "epoch": 5234} {"train_loss": -26.73219108581543, "global_step": 434462, "epoch": 5234} {"train_loss": -26.68250846862793, "global_step": 434463, "epoch": 5234} {"train_loss": -26.887319564819336, "global_step": 434464, "epoch": 5234} {"train_loss": -27.2807674407959, "global_step": 434465, "epoch": 5234} {"train_loss": -27.0710391998291, "global_step": 434466, "epoch": 5234} {"train_loss": -26.49894142150879, "global_step": 434467, "epoch": 5234} {"train_loss": -26.758405685424805, "global_step": 434468, "epoch": 5234} {"train_loss": -26.78773307800293, "global_step": 434469, "epoch": 5234} {"train_loss": -26.427459716796875, "global_step": 434470, "epoch": 5234} {"train_loss": -26.720876693725586, "global_step": 434471, "epoch": 5234} {"train_loss": -26.806028366088867, "global_step": 434472, "epoch": 5234} {"train_loss": -26.632490158081055, "global_step": 434473, "epoch": 5234} {"train_loss": -26.878284454345703, "global_step": 434474, "epoch": 5234} {"train_loss": -26.80982780456543, "global_step": 434475, "epoch": 5234} {"train_loss": -26.593469619750977, "global_step": 434476, "epoch": 5234} {"train_loss": -26.6353702545166, "global_step": 434477, "epoch": 5234} {"train_loss": -26.501432418823242, "global_step": 434478, "epoch": 5234} {"train_loss": -26.49957275390625, "global_step": 434479, "epoch": 5234} {"train_loss": -27.094247817993164, "global_step": 434480, "epoch": 5234} {"train_loss": -26.34653091430664, "global_step": 434481, "epoch": 5234} {"train_loss": -26.74555778503418, "global_step": 434482, "epoch": 5234} {"train_loss": -26.555578231811523, "global_step": 434483, "epoch": 5234} {"train_loss": -26.442686080932617, "global_step": 434484, "epoch": 5234} {"train_loss": -27.430912017822266, "global_step": 434485, "epoch": 5234} {"train_loss": -26.796844482421875, "global_step": 434486, "epoch": 5234} {"train_loss": -26.316513061523438, "global_step": 434487, "epoch": 5234} {"train_loss": -27.006244659423828, "global_step": 434488, "epoch": 5234} {"train_loss": -26.33920669555664, "global_step": 434489, "epoch": 5234} {"train_loss": -26.300281524658203, "global_step": 434490, "epoch": 5234} {"train_loss": -26.172330856323242, "global_step": 434491, "epoch": 5234} {"train_loss": -26.44764518737793, "global_step": 434492, "epoch": 5234} {"train_loss": -26.38213539123535, "global_step": 434493, "epoch": 5234} {"train_loss": -26.840986251831055, "global_step": 434494, "epoch": 5234} {"train_loss": -26.611005783081055, "global_step": 434495, "epoch": 5234} {"train_loss": -26.830799102783203, "global_step": 434496, "epoch": 5234} {"train_loss": -26.787811279296875, "global_step": 434497, "epoch": 5234} {"train_loss": -26.823923110961914, "global_step": 434498, "epoch": 5234} {"train_loss": -26.53851890563965, "global_step": 434499, "epoch": 5234} {"train_loss": -26.692829132080078, "global_step": 434500, "epoch": 5234} {"train_loss": -26.963306427001953, "global_step": 434501, "epoch": 5234} {"train_loss": -26.6046199798584, "global_step": 434502, "epoch": 5234} {"train_loss": -26.90451431274414, "global_step": 434503, "epoch": 5234} {"train_loss": -26.5378876421825, "global_step": 434504, "epoch": 5234, "val_loss": 6681710.5} {"train_loss": -26.64191246032715, "global_step": 434505, "epoch": 5235} {"train_loss": -26.084516525268555, "global_step": 434506, "epoch": 5235} {"train_loss": -26.46587562561035, "global_step": 434507, "epoch": 5235} {"train_loss": -26.408111572265625, "global_step": 434508, "epoch": 5235} {"train_loss": -26.498748779296875, "global_step": 434509, "epoch": 5235} {"train_loss": -26.130414962768555, "global_step": 434510, "epoch": 5235} {"train_loss": -26.403921127319336, "global_step": 434511, "epoch": 5235} {"train_loss": -26.704792022705078, "global_step": 434512, "epoch": 5235} {"train_loss": -26.41532325744629, "global_step": 434513, "epoch": 5235} {"train_loss": -26.708852767944336, "global_step": 434514, "epoch": 5235} {"train_loss": -26.414182662963867, "global_step": 434515, "epoch": 5235} {"train_loss": -26.608240127563477, "global_step": 434516, "epoch": 5235} {"train_loss": -26.941755294799805, "global_step": 434517, "epoch": 5235} {"train_loss": -26.857818603515625, "global_step": 434518, "epoch": 5235} {"train_loss": -26.418933868408203, "global_step": 434519, "epoch": 5235} {"train_loss": -26.356800079345703, "global_step": 434520, "epoch": 5235} {"train_loss": -26.647958755493164, "global_step": 434521, "epoch": 5235} {"train_loss": -26.842697143554688, "global_step": 434522, "epoch": 5235} {"train_loss": -27.096744537353516, "global_step": 434523, "epoch": 5235} {"train_loss": -26.487506866455078, "global_step": 434524, "epoch": 5235} {"train_loss": -26.95635414123535, "global_step": 434525, "epoch": 5235} {"train_loss": -27.0695858001709, "global_step": 434526, "epoch": 5235} {"train_loss": -26.77772331237793, "global_step": 434527, "epoch": 5235} {"train_loss": -26.802352905273438, "global_step": 434528, "epoch": 5235} {"train_loss": -26.55864906311035, "global_step": 434529, "epoch": 5235} {"train_loss": -26.40839195251465, "global_step": 434530, "epoch": 5235} {"train_loss": -26.58880043029785, "global_step": 434531, "epoch": 5235} {"train_loss": -26.92360496520996, "global_step": 434532, "epoch": 5235} {"train_loss": -26.477079391479492, "global_step": 434533, "epoch": 5235} {"train_loss": -26.973011016845703, "global_step": 434534, "epoch": 5235} {"train_loss": -27.038949966430664, "global_step": 434535, "epoch": 5235} {"train_loss": -27.18389320373535, "global_step": 434536, "epoch": 5235} {"train_loss": -27.120391845703125, "global_step": 434537, "epoch": 5235} {"train_loss": -26.939908981323242, "global_step": 434538, "epoch": 5235} {"train_loss": -27.169815063476562, "global_step": 434539, "epoch": 5235} {"train_loss": -26.789203643798828, "global_step": 434540, "epoch": 5235} {"train_loss": -26.937952041625977, "global_step": 434541, "epoch": 5235} {"train_loss": -26.46760368347168, "global_step": 434542, "epoch": 5235} {"train_loss": -26.976423263549805, "global_step": 434543, "epoch": 5235} {"train_loss": -27.09235954284668, "global_step": 434544, "epoch": 5235} {"train_loss": -27.127614974975586, "global_step": 434545, "epoch": 5235} {"train_loss": -26.84004020690918, "global_step": 434546, "epoch": 5235} {"train_loss": -26.9597225189209, "global_step": 434547, "epoch": 5235} {"train_loss": -27.23334312438965, "global_step": 434548, "epoch": 5235} {"train_loss": -26.827672958374023, "global_step": 434549, "epoch": 5235} {"train_loss": -27.065067291259766, "global_step": 434550, "epoch": 5235} {"train_loss": -26.904327392578125, "global_step": 434551, "epoch": 5235} {"train_loss": -27.119871139526367, "global_step": 434552, "epoch": 5235} {"train_loss": -26.6260986328125, "global_step": 434553, "epoch": 5235} {"train_loss": -27.013174057006836, "global_step": 434554, "epoch": 5235} {"train_loss": -26.943439483642578, "global_step": 434555, "epoch": 5235} {"train_loss": -26.79108238220215, "global_step": 434556, "epoch": 5235} {"train_loss": -26.61211585998535, "global_step": 434557, "epoch": 5235} {"train_loss": -27.023365020751953, "global_step": 434558, "epoch": 5235} {"train_loss": -26.480676651000977, "global_step": 434559, "epoch": 5235} {"train_loss": -26.75689697265625, "global_step": 434560, "epoch": 5235} {"train_loss": -26.78949546813965, "global_step": 434561, "epoch": 5235} {"train_loss": -26.979766845703125, "global_step": 434562, "epoch": 5235} {"train_loss": -26.899621963500977, "global_step": 434563, "epoch": 5235} {"train_loss": -26.69186782836914, "global_step": 434564, "epoch": 5235} {"train_loss": -27.138477325439453, "global_step": 434565, "epoch": 5235} {"train_loss": -26.74672508239746, "global_step": 434566, "epoch": 5235} {"train_loss": -26.957059860229492, "global_step": 434567, "epoch": 5235} {"train_loss": -27.25612449645996, "global_step": 434568, "epoch": 5235} {"train_loss": -27.191877365112305, "global_step": 434569, "epoch": 5235} {"train_loss": -27.058263778686523, "global_step": 434570, "epoch": 5235} {"train_loss": -26.796436309814453, "global_step": 434571, "epoch": 5235} {"train_loss": -27.053070068359375, "global_step": 434572, "epoch": 5235} {"train_loss": -27.20806884765625, "global_step": 434573, "epoch": 5235} {"train_loss": -26.820154190063477, "global_step": 434574, "epoch": 5235} {"train_loss": -26.979812622070312, "global_step": 434575, "epoch": 5235} {"train_loss": -26.88397789001465, "global_step": 434576, "epoch": 5235} {"train_loss": -27.056503295898438, "global_step": 434577, "epoch": 5235} {"train_loss": -26.508716583251953, "global_step": 434578, "epoch": 5235} {"train_loss": -26.866926193237305, "global_step": 434579, "epoch": 5235} {"train_loss": -26.836898803710938, "global_step": 434580, "epoch": 5235} {"train_loss": -27.002532958984375, "global_step": 434581, "epoch": 5235} {"train_loss": -27.076751708984375, "global_step": 434582, "epoch": 5235} {"train_loss": -26.785985946655273, "global_step": 434583, "epoch": 5235} {"train_loss": -26.508275985717773, "global_step": 434584, "epoch": 5235} {"train_loss": -26.50177574157715, "global_step": 434585, "epoch": 5235} {"train_loss": -26.77500343322754, "global_step": 434586, "epoch": 5235} {"train_loss": -26.81465045515313, "global_step": 434587, "epoch": 5235, "val_loss": 6602803.5} {"train_loss": -26.327680587768555, "global_step": 434588, "epoch": 5236} {"train_loss": -26.62156105041504, "global_step": 434589, "epoch": 5236} {"train_loss": -26.091033935546875, "global_step": 434590, "epoch": 5236} {"train_loss": -26.47607421875, "global_step": 434591, "epoch": 5236} {"train_loss": -26.20249366760254, "global_step": 434592, "epoch": 5236} {"train_loss": -26.30259132385254, "global_step": 434593, "epoch": 5236} {"train_loss": -26.59535026550293, "global_step": 434594, "epoch": 5236} {"train_loss": -26.889760971069336, "global_step": 434595, "epoch": 5236} {"train_loss": -26.511754989624023, "global_step": 434596, "epoch": 5236} {"train_loss": -26.52764320373535, "global_step": 434597, "epoch": 5236} {"train_loss": -26.515533447265625, "global_step": 434598, "epoch": 5236} {"train_loss": -26.88043785095215, "global_step": 434599, "epoch": 5236} {"train_loss": -26.49918556213379, "global_step": 434600, "epoch": 5236} {"train_loss": -26.785226821899414, "global_step": 434601, "epoch": 5236} {"train_loss": -26.426748275756836, "global_step": 434602, "epoch": 5236} {"train_loss": -26.88762855529785, "global_step": 434603, "epoch": 5236} {"train_loss": -26.920963287353516, "global_step": 434604, "epoch": 5236} {"train_loss": -26.83424186706543, "global_step": 434605, "epoch": 5236} {"train_loss": -26.867572784423828, "global_step": 434606, "epoch": 5236} {"train_loss": -26.650354385375977, "global_step": 434607, "epoch": 5236} {"train_loss": -27.183216094970703, "global_step": 434608, "epoch": 5236} {"train_loss": -26.765457153320312, "global_step": 434609, "epoch": 5236} {"train_loss": -26.98788833618164, "global_step": 434610, "epoch": 5236} {"train_loss": -26.99287223815918, "global_step": 434611, "epoch": 5236} {"train_loss": -26.952960968017578, "global_step": 434612, "epoch": 5236} {"train_loss": -27.25275993347168, "global_step": 434613, "epoch": 5236} {"train_loss": -26.975637435913086, "global_step": 434614, "epoch": 5236} {"train_loss": -26.67241859436035, "global_step": 434615, "epoch": 5236} {"train_loss": -26.6882381439209, "global_step": 434616, "epoch": 5236} {"train_loss": -26.918020248413086, "global_step": 434617, "epoch": 5236} {"train_loss": -27.326095581054688, "global_step": 434618, "epoch": 5236} {"train_loss": -27.009052276611328, "global_step": 434619, "epoch": 5236} {"train_loss": -27.040552139282227, "global_step": 434620, "epoch": 5236} {"train_loss": -26.9940242767334, "global_step": 434621, "epoch": 5236} {"train_loss": -27.33682632446289, "global_step": 434622, "epoch": 5236} {"train_loss": -26.961469650268555, "global_step": 434623, "epoch": 5236} {"train_loss": -26.248291015625, "global_step": 434624, "epoch": 5236} {"train_loss": -27.120267868041992, "global_step": 434625, "epoch": 5236} {"train_loss": -27.181610107421875, "global_step": 434626, "epoch": 5236} {"train_loss": -26.61415672302246, "global_step": 434627, "epoch": 5236} {"train_loss": -26.811756134033203, "global_step": 434628, "epoch": 5236} {"train_loss": -27.104175567626953, "global_step": 434629, "epoch": 5236} {"train_loss": -26.892160415649414, "global_step": 434630, "epoch": 5236} {"train_loss": -26.641199111938477, "global_step": 434631, "epoch": 5236} {"train_loss": -26.66082191467285, "global_step": 434632, "epoch": 5236} {"train_loss": -26.745874404907227, "global_step": 434633, "epoch": 5236} {"train_loss": -26.745086669921875, "global_step": 434634, "epoch": 5236} {"train_loss": -26.80855369567871, "global_step": 434635, "epoch": 5236} {"train_loss": -26.64509391784668, "global_step": 434636, "epoch": 5236} {"train_loss": -27.019880294799805, "global_step": 434637, "epoch": 5236} {"train_loss": -26.69581413269043, "global_step": 434638, "epoch": 5236} {"train_loss": -27.115161895751953, "global_step": 434639, "epoch": 5236} {"train_loss": -27.222442626953125, "global_step": 434640, "epoch": 5236} {"train_loss": -26.802295684814453, "global_step": 434641, "epoch": 5236} {"train_loss": -27.20766258239746, "global_step": 434642, "epoch": 5236} {"train_loss": -27.122146606445312, "global_step": 434643, "epoch": 5236} {"train_loss": -27.08296012878418, "global_step": 434644, "epoch": 5236} {"train_loss": -27.42024803161621, "global_step": 434645, "epoch": 5236} {"train_loss": -26.998273849487305, "global_step": 434646, "epoch": 5236} {"train_loss": -26.857254028320312, "global_step": 434647, "epoch": 5236} {"train_loss": -27.00348472595215, "global_step": 434648, "epoch": 5236} {"train_loss": -27.332935333251953, "global_step": 434649, "epoch": 5236} {"train_loss": -27.191572189331055, "global_step": 434650, "epoch": 5236} {"train_loss": -27.1186466217041, "global_step": 434651, "epoch": 5236} {"train_loss": -27.10792350769043, "global_step": 434652, "epoch": 5236} {"train_loss": -27.017118453979492, "global_step": 434653, "epoch": 5236} {"train_loss": -27.195547103881836, "global_step": 434654, "epoch": 5236} {"train_loss": -26.777708053588867, "global_step": 434655, "epoch": 5236} {"train_loss": -26.89581871032715, "global_step": 434656, "epoch": 5236} {"train_loss": -27.003250122070312, "global_step": 434657, "epoch": 5236} {"train_loss": -26.631528854370117, "global_step": 434658, "epoch": 5236} {"train_loss": -26.890195846557617, "global_step": 434659, "epoch": 5236} {"train_loss": -26.156082153320312, "global_step": 434660, "epoch": 5236} {"train_loss": -26.564146041870117, "global_step": 434661, "epoch": 5236} {"train_loss": -26.8654842376709, "global_step": 434662, "epoch": 5236} {"train_loss": -26.569787979125977, "global_step": 434663, "epoch": 5236} {"train_loss": -26.88728141784668, "global_step": 434664, "epoch": 5236} {"train_loss": -26.158472061157227, "global_step": 434665, "epoch": 5236} {"train_loss": -26.478857040405273, "global_step": 434666, "epoch": 5236} {"train_loss": -26.471866607666016, "global_step": 434667, "epoch": 5236} {"train_loss": -26.25300407409668, "global_step": 434668, "epoch": 5236} {"train_loss": -26.497055053710938, "global_step": 434669, "epoch": 5236} {"train_loss": -26.82457590677652, "global_step": 434670, "epoch": 5236, "val_loss": 6600698.0} {"train_loss": -26.25946044921875, "global_step": 434671, "epoch": 5237} {"train_loss": -25.754138946533203, "global_step": 434672, "epoch": 5237} {"train_loss": -26.490869522094727, "global_step": 434673, "epoch": 5237} {"train_loss": -26.16314697265625, "global_step": 434674, "epoch": 5237} {"train_loss": -25.81804847717285, "global_step": 434675, "epoch": 5237} {"train_loss": -26.13226318359375, "global_step": 434676, "epoch": 5237} {"train_loss": -26.183612823486328, "global_step": 434677, "epoch": 5237} {"train_loss": -26.093555450439453, "global_step": 434678, "epoch": 5237} {"train_loss": -25.883886337280273, "global_step": 434679, "epoch": 5237} {"train_loss": -26.5083065032959, "global_step": 434680, "epoch": 5237} {"train_loss": -26.7232666015625, "global_step": 434681, "epoch": 5237} {"train_loss": -26.569250106811523, "global_step": 434682, "epoch": 5237} {"train_loss": -26.36248779296875, "global_step": 434683, "epoch": 5237} {"train_loss": -26.621301651000977, "global_step": 434684, "epoch": 5237} {"train_loss": -26.4776554107666, "global_step": 434685, "epoch": 5237} {"train_loss": -26.640213012695312, "global_step": 434686, "epoch": 5237} {"train_loss": -26.35017204284668, "global_step": 434687, "epoch": 5237} {"train_loss": -26.8427791595459, "global_step": 434688, "epoch": 5237} {"train_loss": -26.731536865234375, "global_step": 434689, "epoch": 5237} {"train_loss": -26.757211685180664, "global_step": 434690, "epoch": 5237} {"train_loss": -26.9588565826416, "global_step": 434691, "epoch": 5237} {"train_loss": -26.457504272460938, "global_step": 434692, "epoch": 5237} {"train_loss": -27.08465003967285, "global_step": 434693, "epoch": 5237} {"train_loss": -26.685928344726562, "global_step": 434694, "epoch": 5237} {"train_loss": -26.9315242767334, "global_step": 434695, "epoch": 5237} {"train_loss": -27.048254013061523, "global_step": 434696, "epoch": 5237} {"train_loss": -26.974807739257812, "global_step": 434697, "epoch": 5237} {"train_loss": -26.70318031311035, "global_step": 434698, "epoch": 5237} {"train_loss": -26.424560546875, "global_step": 434699, "epoch": 5237} {"train_loss": -26.574542999267578, "global_step": 434700, "epoch": 5237} {"train_loss": -26.866357803344727, "global_step": 434701, "epoch": 5237} {"train_loss": -26.871234893798828, "global_step": 434702, "epoch": 5237} {"train_loss": -27.212121963500977, "global_step": 434703, "epoch": 5237} {"train_loss": -27.211095809936523, "global_step": 434704, "epoch": 5237} {"train_loss": -27.36073112487793, "global_step": 434705, "epoch": 5237} {"train_loss": -26.99102210998535, "global_step": 434706, "epoch": 5237} {"train_loss": -26.855382919311523, "global_step": 434707, "epoch": 5237} {"train_loss": -27.148914337158203, "global_step": 434708, "epoch": 5237} {"train_loss": -27.05934715270996, "global_step": 434709, "epoch": 5237} {"train_loss": -27.10784339904785, "global_step": 434710, "epoch": 5237} {"train_loss": -27.3701171875, "global_step": 434711, "epoch": 5237} {"train_loss": -27.182470321655273, "global_step": 434712, "epoch": 5237} {"train_loss": -27.32036781311035, "global_step": 434713, "epoch": 5237} {"train_loss": -26.881927490234375, "global_step": 434714, "epoch": 5237} {"train_loss": -26.66082191467285, "global_step": 434715, "epoch": 5237} {"train_loss": -27.105377197265625, "global_step": 434716, "epoch": 5237} {"train_loss": -27.474390029907227, "global_step": 434717, "epoch": 5237} {"train_loss": -26.976776123046875, "global_step": 434718, "epoch": 5237} {"train_loss": -26.934064865112305, "global_step": 434719, "epoch": 5237} {"train_loss": -26.541662216186523, "global_step": 434720, "epoch": 5237} {"train_loss": -26.548572540283203, "global_step": 434721, "epoch": 5237} {"train_loss": -26.57802391052246, "global_step": 434722, "epoch": 5237} {"train_loss": -26.626773834228516, "global_step": 434723, "epoch": 5237} {"train_loss": -27.0024471282959, "global_step": 434724, "epoch": 5237} {"train_loss": -26.552749633789062, "global_step": 434725, "epoch": 5237} {"train_loss": -26.102075576782227, "global_step": 434726, "epoch": 5237} {"train_loss": -24.8883113861084, "global_step": 434727, "epoch": 5237} {"train_loss": -24.82001304626465, "global_step": 434728, "epoch": 5237} {"train_loss": -26.3494815826416, "global_step": 434729, "epoch": 5237} {"train_loss": -26.425048828125, "global_step": 434730, "epoch": 5237} {"train_loss": -25.6110782623291, "global_step": 434731, "epoch": 5237} {"train_loss": -26.69384765625, "global_step": 434732, "epoch": 5237} {"train_loss": -26.107282638549805, "global_step": 434733, "epoch": 5237} {"train_loss": -25.913049697875977, "global_step": 434734, "epoch": 5237} {"train_loss": -26.59372901916504, "global_step": 434735, "epoch": 5237} {"train_loss": -26.8098087310791, "global_step": 434736, "epoch": 5237} {"train_loss": -26.914554595947266, "global_step": 434737, "epoch": 5237} {"train_loss": -26.341135025024414, "global_step": 434738, "epoch": 5237} {"train_loss": -26.6671199798584, "global_step": 434739, "epoch": 5237} {"train_loss": -26.527013778686523, "global_step": 434740, "epoch": 5237} {"train_loss": -26.736745834350586, "global_step": 434741, "epoch": 5237} {"train_loss": -26.88701820373535, "global_step": 434742, "epoch": 5237} {"train_loss": -26.564786911010742, "global_step": 434743, "epoch": 5237} {"train_loss": -26.992944717407227, "global_step": 434744, "epoch": 5237} {"train_loss": -26.416181564331055, "global_step": 434745, "epoch": 5237} {"train_loss": -27.044214248657227, "global_step": 434746, "epoch": 5237} {"train_loss": -26.728139877319336, "global_step": 434747, "epoch": 5237} {"train_loss": -26.952219009399414, "global_step": 434748, "epoch": 5237} {"train_loss": -26.7241153717041, "global_step": 434749, "epoch": 5237} {"train_loss": -26.862462997436523, "global_step": 434750, "epoch": 5237} {"train_loss": -27.21339988708496, "global_step": 434751, "epoch": 5237} {"train_loss": -27.058216094970703, "global_step": 434752, "epoch": 5237} {"train_loss": -26.655361244477422, "global_step": 434753, "epoch": 5237, "val_loss": 6510490.0} {"train_loss": -27.045934677124023, "global_step": 434754, "epoch": 5238} {"train_loss": -26.945581436157227, "global_step": 434755, "epoch": 5238} {"train_loss": -26.7210750579834, "global_step": 434756, "epoch": 5238} {"train_loss": -26.905744552612305, "global_step": 434757, "epoch": 5238} {"train_loss": -26.995145797729492, "global_step": 434758, "epoch": 5238} {"train_loss": -26.582117080688477, "global_step": 434759, "epoch": 5238} {"train_loss": -26.638290405273438, "global_step": 434760, "epoch": 5238} {"train_loss": -26.9451961517334, "global_step": 434761, "epoch": 5238} {"train_loss": -26.757638931274414, "global_step": 434762, "epoch": 5238} {"train_loss": -26.94855308532715, "global_step": 434763, "epoch": 5238} {"train_loss": -26.807880401611328, "global_step": 434764, "epoch": 5238} {"train_loss": -26.975494384765625, "global_step": 434765, "epoch": 5238} {"train_loss": -27.090545654296875, "global_step": 434766, "epoch": 5238} {"train_loss": -26.98492431640625, "global_step": 434767, "epoch": 5238} {"train_loss": -26.928974151611328, "global_step": 434768, "epoch": 5238} {"train_loss": -27.023681640625, "global_step": 434769, "epoch": 5238} {"train_loss": -27.30088233947754, "global_step": 434770, "epoch": 5238} {"train_loss": -26.82122230529785, "global_step": 434771, "epoch": 5238} {"train_loss": -26.938220977783203, "global_step": 434772, "epoch": 5238} {"train_loss": -26.838550567626953, "global_step": 434773, "epoch": 5238} {"train_loss": -26.974103927612305, "global_step": 434774, "epoch": 5238} {"train_loss": -27.20880699157715, "global_step": 434775, "epoch": 5238} {"train_loss": -26.887876510620117, "global_step": 434776, "epoch": 5238} {"train_loss": -26.672361373901367, "global_step": 434777, "epoch": 5238} {"train_loss": -27.0974178314209, "global_step": 434778, "epoch": 5238} {"train_loss": -27.197492599487305, "global_step": 434779, "epoch": 5238} {"train_loss": -26.727792739868164, "global_step": 434780, "epoch": 5238} {"train_loss": -26.91568946838379, "global_step": 434781, "epoch": 5238} {"train_loss": -26.928800582885742, "global_step": 434782, "epoch": 5238} {"train_loss": -27.390155792236328, "global_step": 434783, "epoch": 5238} {"train_loss": -27.202991485595703, "global_step": 434784, "epoch": 5238} {"train_loss": -26.83022117614746, "global_step": 434785, "epoch": 5238} {"train_loss": -27.1824951171875, "global_step": 434786, "epoch": 5238} {"train_loss": -26.8579044342041, "global_step": 434787, "epoch": 5238} {"train_loss": -26.982288360595703, "global_step": 434788, "epoch": 5238} {"train_loss": -27.459707260131836, "global_step": 434789, "epoch": 5238} {"train_loss": -26.872379302978516, "global_step": 434790, "epoch": 5238} {"train_loss": -26.88455581665039, "global_step": 434791, "epoch": 5238} {"train_loss": -27.075885772705078, "global_step": 434792, "epoch": 5238} {"train_loss": -26.511648178100586, "global_step": 434793, "epoch": 5238} {"train_loss": -26.573694229125977, "global_step": 434794, "epoch": 5238} {"train_loss": -26.344451904296875, "global_step": 434795, "epoch": 5238} {"train_loss": -27.05679702758789, "global_step": 434796, "epoch": 5238} {"train_loss": -26.80543327331543, "global_step": 434797, "epoch": 5238} {"train_loss": -26.719358444213867, "global_step": 434798, "epoch": 5238} {"train_loss": -26.690155029296875, "global_step": 434799, "epoch": 5238} {"train_loss": -26.72903823852539, "global_step": 434800, "epoch": 5238} {"train_loss": -26.745298385620117, "global_step": 434801, "epoch": 5238} {"train_loss": -26.88374137878418, "global_step": 434802, "epoch": 5238} {"train_loss": -26.90351676940918, "global_step": 434803, "epoch": 5238} {"train_loss": -26.447744369506836, "global_step": 434804, "epoch": 5238} {"train_loss": -26.762405395507812, "global_step": 434805, "epoch": 5238} {"train_loss": -26.759382247924805, "global_step": 434806, "epoch": 5238} {"train_loss": -26.91579246520996, "global_step": 434807, "epoch": 5238} {"train_loss": -26.991046905517578, "global_step": 434808, "epoch": 5238} {"train_loss": -27.04334831237793, "global_step": 434809, "epoch": 5238} {"train_loss": -26.870075225830078, "global_step": 434810, "epoch": 5238} {"train_loss": -26.698225021362305, "global_step": 434811, "epoch": 5238} {"train_loss": -26.70243263244629, "global_step": 434812, "epoch": 5238} {"train_loss": -27.114639282226562, "global_step": 434813, "epoch": 5238} {"train_loss": -27.159765243530273, "global_step": 434814, "epoch": 5238} {"train_loss": -27.081695556640625, "global_step": 434815, "epoch": 5238} {"train_loss": -26.952789306640625, "global_step": 434816, "epoch": 5238} {"train_loss": -27.250757217407227, "global_step": 434817, "epoch": 5238} {"train_loss": -27.22993278503418, "global_step": 434818, "epoch": 5238} {"train_loss": -26.922285079956055, "global_step": 434819, "epoch": 5238} {"train_loss": -27.38064956665039, "global_step": 434820, "epoch": 5238} {"train_loss": -26.85640525817871, "global_step": 434821, "epoch": 5238} {"train_loss": -27.217853546142578, "global_step": 434822, "epoch": 5238} {"train_loss": -27.108240127563477, "global_step": 434823, "epoch": 5238} {"train_loss": -26.862430572509766, "global_step": 434824, "epoch": 5238} {"train_loss": -27.028400421142578, "global_step": 434825, "epoch": 5238} {"train_loss": -27.07826042175293, "global_step": 434826, "epoch": 5238} {"train_loss": -26.904956817626953, "global_step": 434827, "epoch": 5238} {"train_loss": -26.897329330444336, "global_step": 434828, "epoch": 5238} {"train_loss": -27.0931339263916, "global_step": 434829, "epoch": 5238} {"train_loss": -27.008411407470703, "global_step": 434830, "epoch": 5238} {"train_loss": -26.6683406829834, "global_step": 434831, "epoch": 5238} {"train_loss": -26.878650665283203, "global_step": 434832, "epoch": 5238} {"train_loss": -27.141021728515625, "global_step": 434833, "epoch": 5238} {"train_loss": -27.286996841430664, "global_step": 434834, "epoch": 5238} {"train_loss": -26.751087188720703, "global_step": 434835, "epoch": 5238} {"train_loss": -26.938559750476514, "global_step": 434836, "epoch": 5238, "val_loss": 6515784.0} {"train_loss": -26.429874420166016, "global_step": 434837, "epoch": 5239} {"train_loss": -26.252124786376953, "global_step": 434838, "epoch": 5239} {"train_loss": -26.3609619140625, "global_step": 434839, "epoch": 5239} {"train_loss": -26.570117950439453, "global_step": 434840, "epoch": 5239} {"train_loss": -26.86500358581543, "global_step": 434841, "epoch": 5239} {"train_loss": -26.58710289001465, "global_step": 434842, "epoch": 5239} {"train_loss": -25.960468292236328, "global_step": 434843, "epoch": 5239} {"train_loss": -26.404895782470703, "global_step": 434844, "epoch": 5239} {"train_loss": -26.523853302001953, "global_step": 434845, "epoch": 5239} {"train_loss": -26.801755905151367, "global_step": 434846, "epoch": 5239} {"train_loss": -26.74175453186035, "global_step": 434847, "epoch": 5239} {"train_loss": -26.7866268157959, "global_step": 434848, "epoch": 5239} {"train_loss": -26.488340377807617, "global_step": 434849, "epoch": 5239} {"train_loss": -26.573774337768555, "global_step": 434850, "epoch": 5239} {"train_loss": -26.6649112701416, "global_step": 434851, "epoch": 5239} {"train_loss": -26.573516845703125, "global_step": 434852, "epoch": 5239} {"train_loss": -26.597936630249023, "global_step": 434853, "epoch": 5239} {"train_loss": -26.27044677734375, "global_step": 434854, "epoch": 5239} {"train_loss": -26.941242218017578, "global_step": 434855, "epoch": 5239} {"train_loss": -26.8787841796875, "global_step": 434856, "epoch": 5239} {"train_loss": -26.620996475219727, "global_step": 434857, "epoch": 5239} {"train_loss": -26.625946044921875, "global_step": 434858, "epoch": 5239} {"train_loss": -27.124011993408203, "global_step": 434859, "epoch": 5239} {"train_loss": -27.020689010620117, "global_step": 434860, "epoch": 5239} {"train_loss": -26.898069381713867, "global_step": 434861, "epoch": 5239} {"train_loss": -26.75855827331543, "global_step": 434862, "epoch": 5239} {"train_loss": -26.884857177734375, "global_step": 434863, "epoch": 5239} {"train_loss": -26.8118953704834, "global_step": 434864, "epoch": 5239} {"train_loss": -26.765161514282227, "global_step": 434865, "epoch": 5239} {"train_loss": -26.890365600585938, "global_step": 434866, "epoch": 5239} {"train_loss": -26.7446231842041, "global_step": 434867, "epoch": 5239} {"train_loss": -26.67234230041504, "global_step": 434868, "epoch": 5239} {"train_loss": -27.029584884643555, "global_step": 434869, "epoch": 5239} {"train_loss": -27.044544219970703, "global_step": 434870, "epoch": 5239} {"train_loss": -26.807392120361328, "global_step": 434871, "epoch": 5239} {"train_loss": -26.762704849243164, "global_step": 434872, "epoch": 5239} {"train_loss": -27.008655548095703, "global_step": 434873, "epoch": 5239} {"train_loss": -27.0407772064209, "global_step": 434874, "epoch": 5239} {"train_loss": -27.035314559936523, "global_step": 434875, "epoch": 5239} {"train_loss": -26.805891036987305, "global_step": 434876, "epoch": 5239} {"train_loss": -27.108478546142578, "global_step": 434877, "epoch": 5239} {"train_loss": -27.026697158813477, "global_step": 434878, "epoch": 5239} {"train_loss": -26.877988815307617, "global_step": 434879, "epoch": 5239} {"train_loss": -27.01041030883789, "global_step": 434880, "epoch": 5239} {"train_loss": -26.3809814453125, "global_step": 434881, "epoch": 5239} {"train_loss": -26.450031280517578, "global_step": 434882, "epoch": 5239} {"train_loss": -27.00782585144043, "global_step": 434883, "epoch": 5239} {"train_loss": -26.944599151611328, "global_step": 434884, "epoch": 5239} {"train_loss": -26.9576416015625, "global_step": 434885, "epoch": 5239} {"train_loss": -26.734542846679688, "global_step": 434886, "epoch": 5239} {"train_loss": -26.771228790283203, "global_step": 434887, "epoch": 5239} {"train_loss": -26.6705379486084, "global_step": 434888, "epoch": 5239} {"train_loss": -26.78450584411621, "global_step": 434889, "epoch": 5239} {"train_loss": -27.00189781188965, "global_step": 434890, "epoch": 5239} {"train_loss": -26.822345733642578, "global_step": 434891, "epoch": 5239} {"train_loss": -26.865034103393555, "global_step": 434892, "epoch": 5239} {"train_loss": -26.900171279907227, "global_step": 434893, "epoch": 5239} {"train_loss": -27.018768310546875, "global_step": 434894, "epoch": 5239} {"train_loss": -27.216232299804688, "global_step": 434895, "epoch": 5239} {"train_loss": -27.054162979125977, "global_step": 434896, "epoch": 5239} {"train_loss": -27.175745010375977, "global_step": 434897, "epoch": 5239} {"train_loss": -27.147266387939453, "global_step": 434898, "epoch": 5239} {"train_loss": -27.018293380737305, "global_step": 434899, "epoch": 5239} {"train_loss": -27.07880973815918, "global_step": 434900, "epoch": 5239} {"train_loss": -26.444721221923828, "global_step": 434901, "epoch": 5239} {"train_loss": -26.014652252197266, "global_step": 434902, "epoch": 5239} {"train_loss": -26.1142635345459, "global_step": 434903, "epoch": 5239} {"train_loss": -26.814130783081055, "global_step": 434904, "epoch": 5239} {"train_loss": -26.7702693939209, "global_step": 434905, "epoch": 5239} {"train_loss": -26.577539443969727, "global_step": 434906, "epoch": 5239} {"train_loss": -26.97467613220215, "global_step": 434907, "epoch": 5239} {"train_loss": -27.012475967407227, "global_step": 434908, "epoch": 5239} {"train_loss": -26.69244384765625, "global_step": 434909, "epoch": 5239} {"train_loss": -27.191268920898438, "global_step": 434910, "epoch": 5239} {"train_loss": -26.88677406311035, "global_step": 434911, "epoch": 5239} {"train_loss": -26.852802276611328, "global_step": 434912, "epoch": 5239} {"train_loss": -27.271020889282227, "global_step": 434913, "epoch": 5239} {"train_loss": -26.95635986328125, "global_step": 434914, "epoch": 5239} {"train_loss": -26.965606689453125, "global_step": 434915, "epoch": 5239} {"train_loss": -26.42414665222168, "global_step": 434916, "epoch": 5239} {"train_loss": -26.674362182617188, "global_step": 434917, "epoch": 5239} {"train_loss": -26.599958419799805, "global_step": 434918, "epoch": 5239} {"train_loss": -26.78317113669522, "global_step": 434919, "epoch": 5239, "val_loss": 6658070.0} {"train_loss": -26.403522491455078, "global_step": 434920, "epoch": 5240} {"train_loss": -26.54659080505371, "global_step": 434921, "epoch": 5240} {"train_loss": -27.10400390625, "global_step": 434922, "epoch": 5240} {"train_loss": -26.595945358276367, "global_step": 434923, "epoch": 5240} {"train_loss": -26.399580001831055, "global_step": 434924, "epoch": 5240} {"train_loss": -26.780847549438477, "global_step": 434925, "epoch": 5240} {"train_loss": -26.575225830078125, "global_step": 434926, "epoch": 5240} {"train_loss": -26.775373458862305, "global_step": 434927, "epoch": 5240} {"train_loss": -26.87726402282715, "global_step": 434928, "epoch": 5240} {"train_loss": -27.013975143432617, "global_step": 434929, "epoch": 5240} {"train_loss": -26.74395751953125, "global_step": 434930, "epoch": 5240} {"train_loss": -27.0479679107666, "global_step": 434931, "epoch": 5240} {"train_loss": -26.99526023864746, "global_step": 434932, "epoch": 5240} {"train_loss": -27.023996353149414, "global_step": 434933, "epoch": 5240} {"train_loss": -27.005842208862305, "global_step": 434934, "epoch": 5240} {"train_loss": -27.146026611328125, "global_step": 434935, "epoch": 5240} {"train_loss": -26.88629150390625, "global_step": 434936, "epoch": 5240} {"train_loss": -26.937231063842773, "global_step": 434937, "epoch": 5240} {"train_loss": -26.74323844909668, "global_step": 434938, "epoch": 5240} {"train_loss": -27.00697135925293, "global_step": 434939, "epoch": 5240} {"train_loss": -26.891515731811523, "global_step": 434940, "epoch": 5240} {"train_loss": -26.706838607788086, "global_step": 434941, "epoch": 5240} {"train_loss": -27.357446670532227, "global_step": 434942, "epoch": 5240} {"train_loss": -27.05328369140625, "global_step": 434943, "epoch": 5240} {"train_loss": -26.87566566467285, "global_step": 434944, "epoch": 5240} {"train_loss": -27.234577178955078, "global_step": 434945, "epoch": 5240} {"train_loss": -27.3411922454834, "global_step": 434946, "epoch": 5240} {"train_loss": -27.275007247924805, "global_step": 434947, "epoch": 5240} {"train_loss": -27.10321044921875, "global_step": 434948, "epoch": 5240} {"train_loss": -27.1722469329834, "global_step": 434949, "epoch": 5240} {"train_loss": -27.117856979370117, "global_step": 434950, "epoch": 5240} {"train_loss": -27.075345993041992, "global_step": 434951, "epoch": 5240} {"train_loss": -26.856733322143555, "global_step": 434952, "epoch": 5240} {"train_loss": -26.941242218017578, "global_step": 434953, "epoch": 5240} {"train_loss": -27.086889266967773, "global_step": 434954, "epoch": 5240} {"train_loss": -27.40532875061035, "global_step": 434955, "epoch": 5240} {"train_loss": -26.68294334411621, "global_step": 434956, "epoch": 5240} {"train_loss": -27.029661178588867, "global_step": 434957, "epoch": 5240} {"train_loss": -26.96954345703125, "global_step": 434958, "epoch": 5240} {"train_loss": -26.634740829467773, "global_step": 434959, "epoch": 5240} {"train_loss": -26.75798988342285, "global_step": 434960, "epoch": 5240} {"train_loss": -26.591999053955078, "global_step": 434961, "epoch": 5240} {"train_loss": -27.0434513092041, "global_step": 434962, "epoch": 5240} {"train_loss": -26.780609130859375, "global_step": 434963, "epoch": 5240} {"train_loss": -27.12293815612793, "global_step": 434964, "epoch": 5240} {"train_loss": -26.811634063720703, "global_step": 434965, "epoch": 5240} {"train_loss": -27.20533561706543, "global_step": 434966, "epoch": 5240} {"train_loss": -26.963703155517578, "global_step": 434967, "epoch": 5240} {"train_loss": -27.145095825195312, "global_step": 434968, "epoch": 5240} {"train_loss": -27.1260986328125, "global_step": 434969, "epoch": 5240} {"train_loss": -27.0760555267334, "global_step": 434970, "epoch": 5240} {"train_loss": -26.9768123626709, "global_step": 434971, "epoch": 5240} {"train_loss": -26.912052154541016, "global_step": 434972, "epoch": 5240} {"train_loss": -27.452930450439453, "global_step": 434973, "epoch": 5240} {"train_loss": -27.20285987854004, "global_step": 434974, "epoch": 5240} {"train_loss": -26.913970947265625, "global_step": 434975, "epoch": 5240} {"train_loss": -26.9154109954834, "global_step": 434976, "epoch": 5240} {"train_loss": -26.903003692626953, "global_step": 434977, "epoch": 5240} {"train_loss": -26.990386962890625, "global_step": 434978, "epoch": 5240} {"train_loss": -26.9066162109375, "global_step": 434979, "epoch": 5240} {"train_loss": -27.089771270751953, "global_step": 434980, "epoch": 5240} {"train_loss": -26.600812911987305, "global_step": 434981, "epoch": 5240} {"train_loss": -26.514631271362305, "global_step": 434982, "epoch": 5240} {"train_loss": -26.1663761138916, "global_step": 434983, "epoch": 5240} {"train_loss": -26.68072509765625, "global_step": 434984, "epoch": 5240} {"train_loss": -26.929330825805664, "global_step": 434985, "epoch": 5240} {"train_loss": -26.667713165283203, "global_step": 434986, "epoch": 5240} {"train_loss": -26.822065353393555, "global_step": 434987, "epoch": 5240} {"train_loss": -26.543272018432617, "global_step": 434988, "epoch": 5240} {"train_loss": -26.864667892456055, "global_step": 434989, "epoch": 5240} {"train_loss": -26.956159591674805, "global_step": 434990, "epoch": 5240} {"train_loss": -27.114166259765625, "global_step": 434991, "epoch": 5240} {"train_loss": -26.739444732666016, "global_step": 434992, "epoch": 5240} {"train_loss": -27.050724029541016, "global_step": 434993, "epoch": 5240} {"train_loss": -27.501510620117188, "global_step": 434994, "epoch": 5240} {"train_loss": -26.696399688720703, "global_step": 434995, "epoch": 5240} {"train_loss": -26.942096710205078, "global_step": 434996, "epoch": 5240} {"train_loss": -27.054346084594727, "global_step": 434997, "epoch": 5240} {"train_loss": -26.997400283813477, "global_step": 434998, "epoch": 5240} {"train_loss": -26.777830123901367, "global_step": 434999, "epoch": 5240} {"train_loss": -26.855148315429688, "global_step": 435000, "epoch": 5240} {"train_loss": -27.01595115661621, "global_step": 435001, "epoch": 5240} {"train_loss": -26.91728171383042, "global_step": 435002, "epoch": 5240, "val_loss": 6653760.0} {"train_loss": -26.32912254333496, "global_step": 435003, "epoch": 5241} {"train_loss": -25.952320098876953, "global_step": 435004, "epoch": 5241} {"train_loss": -26.4882755279541, "global_step": 435005, "epoch": 5241} {"train_loss": -26.259567260742188, "global_step": 435006, "epoch": 5241} {"train_loss": -26.756330490112305, "global_step": 435007, "epoch": 5241} {"train_loss": -26.495269775390625, "global_step": 435008, "epoch": 5241} {"train_loss": -26.46038246154785, "global_step": 435009, "epoch": 5241} {"train_loss": -27.03754997253418, "global_step": 435010, "epoch": 5241} {"train_loss": -26.788986206054688, "global_step": 435011, "epoch": 5241} {"train_loss": -26.72919273376465, "global_step": 435012, "epoch": 5241} {"train_loss": -27.00623893737793, "global_step": 435013, "epoch": 5241} {"train_loss": -26.92768669128418, "global_step": 435014, "epoch": 5241} {"train_loss": -26.913618087768555, "global_step": 435015, "epoch": 5241} {"train_loss": -27.032440185546875, "global_step": 435016, "epoch": 5241} {"train_loss": -26.869115829467773, "global_step": 435017, "epoch": 5241} {"train_loss": -27.01704216003418, "global_step": 435018, "epoch": 5241} {"train_loss": -27.19013023376465, "global_step": 435019, "epoch": 5241} {"train_loss": -26.826587677001953, "global_step": 435020, "epoch": 5241} {"train_loss": -26.8892765045166, "global_step": 435021, "epoch": 5241} {"train_loss": -27.112295150756836, "global_step": 435022, "epoch": 5241} {"train_loss": -26.793487548828125, "global_step": 435023, "epoch": 5241} {"train_loss": -26.81617546081543, "global_step": 435024, "epoch": 5241} {"train_loss": -26.765851974487305, "global_step": 435025, "epoch": 5241} {"train_loss": -27.322721481323242, "global_step": 435026, "epoch": 5241} {"train_loss": -27.08692741394043, "global_step": 435027, "epoch": 5241} {"train_loss": -26.756006240844727, "global_step": 435028, "epoch": 5241} {"train_loss": -27.104541778564453, "global_step": 435029, "epoch": 5241} {"train_loss": -26.8294734954834, "global_step": 435030, "epoch": 5241} {"train_loss": -27.021787643432617, "global_step": 435031, "epoch": 5241} {"train_loss": -27.3934268951416, "global_step": 435032, "epoch": 5241} {"train_loss": -26.82073974609375, "global_step": 435033, "epoch": 5241} {"train_loss": -26.904865264892578, "global_step": 435034, "epoch": 5241} {"train_loss": -26.788679122924805, "global_step": 435035, "epoch": 5241} {"train_loss": -27.082319259643555, "global_step": 435036, "epoch": 5241} {"train_loss": -26.84731101989746, "global_step": 435037, "epoch": 5241} {"train_loss": -27.03265380859375, "global_step": 435038, "epoch": 5241} {"train_loss": -27.14790916442871, "global_step": 435039, "epoch": 5241} {"train_loss": -27.011816024780273, "global_step": 435040, "epoch": 5241} {"train_loss": -27.156341552734375, "global_step": 435041, "epoch": 5241} {"train_loss": -26.69585609436035, "global_step": 435042, "epoch": 5241} {"train_loss": -26.8353328704834, "global_step": 435043, "epoch": 5241} {"train_loss": -27.259204864501953, "global_step": 435044, "epoch": 5241} {"train_loss": -27.249618530273438, "global_step": 435045, "epoch": 5241} {"train_loss": -26.868289947509766, "global_step": 435046, "epoch": 5241} {"train_loss": -26.59486198425293, "global_step": 435047, "epoch": 5241} {"train_loss": -26.937585830688477, "global_step": 435048, "epoch": 5241} {"train_loss": -27.059906005859375, "global_step": 435049, "epoch": 5241} {"train_loss": -26.90625, "global_step": 435050, "epoch": 5241} {"train_loss": -26.728885650634766, "global_step": 435051, "epoch": 5241} {"train_loss": -27.20453453063965, "global_step": 435052, "epoch": 5241} {"train_loss": -26.589706420898438, "global_step": 435053, "epoch": 5241} {"train_loss": -26.869359970092773, "global_step": 435054, "epoch": 5241} {"train_loss": -26.67641258239746, "global_step": 435055, "epoch": 5241} {"train_loss": -27.103336334228516, "global_step": 435056, "epoch": 5241} {"train_loss": -26.98053550720215, "global_step": 435057, "epoch": 5241} {"train_loss": -26.87627601623535, "global_step": 435058, "epoch": 5241} {"train_loss": -26.92948341369629, "global_step": 435059, "epoch": 5241} {"train_loss": -26.644500732421875, "global_step": 435060, "epoch": 5241} {"train_loss": -26.46630859375, "global_step": 435061, "epoch": 5241} {"train_loss": -26.779157638549805, "global_step": 435062, "epoch": 5241} {"train_loss": -27.465106964111328, "global_step": 435063, "epoch": 5241} {"train_loss": -26.5414981842041, "global_step": 435064, "epoch": 5241} {"train_loss": -26.880584716796875, "global_step": 435065, "epoch": 5241} {"train_loss": -26.77920913696289, "global_step": 435066, "epoch": 5241} {"train_loss": -26.754255294799805, "global_step": 435067, "epoch": 5241} {"train_loss": -26.926910400390625, "global_step": 435068, "epoch": 5241} {"train_loss": -26.764158248901367, "global_step": 435069, "epoch": 5241} {"train_loss": -26.464941024780273, "global_step": 435070, "epoch": 5241} {"train_loss": -26.880796432495117, "global_step": 435071, "epoch": 5241} {"train_loss": -26.731801986694336, "global_step": 435072, "epoch": 5241} {"train_loss": -26.751562118530273, "global_step": 435073, "epoch": 5241} {"train_loss": -27.15486717224121, "global_step": 435074, "epoch": 5241} {"train_loss": -27.117694854736328, "global_step": 435075, "epoch": 5241} {"train_loss": -27.09174156188965, "global_step": 435076, "epoch": 5241} {"train_loss": -26.730573654174805, "global_step": 435077, "epoch": 5241} {"train_loss": -26.9149112701416, "global_step": 435078, "epoch": 5241} {"train_loss": -26.5319766998291, "global_step": 435079, "epoch": 5241} {"train_loss": -26.949329376220703, "global_step": 435080, "epoch": 5241} {"train_loss": -26.699798583984375, "global_step": 435081, "epoch": 5241} {"train_loss": -26.229934692382812, "global_step": 435082, "epoch": 5241} {"train_loss": -26.7263126373291, "global_step": 435083, "epoch": 5241} {"train_loss": -26.216733932495117, "global_step": 435084, "epoch": 5241} {"train_loss": -26.847249915800898, "global_step": 435085, "epoch": 5241, "val_loss": 6627912.0} {"train_loss": -26.55263328552246, "global_step": 435086, "epoch": 5242} {"train_loss": -25.52829933166504, "global_step": 435087, "epoch": 5242} {"train_loss": -25.896011352539062, "global_step": 435088, "epoch": 5242} {"train_loss": -26.095212936401367, "global_step": 435089, "epoch": 5242} {"train_loss": -26.97246742248535, "global_step": 435090, "epoch": 5242} {"train_loss": -26.0762996673584, "global_step": 435091, "epoch": 5242} {"train_loss": -26.935169219970703, "global_step": 435092, "epoch": 5242} {"train_loss": -26.39801025390625, "global_step": 435093, "epoch": 5242} {"train_loss": -26.66926383972168, "global_step": 435094, "epoch": 5242} {"train_loss": -26.91364097595215, "global_step": 435095, "epoch": 5242} {"train_loss": -26.6325626373291, "global_step": 435096, "epoch": 5242} {"train_loss": -26.929494857788086, "global_step": 435097, "epoch": 5242} {"train_loss": -26.672626495361328, "global_step": 435098, "epoch": 5242} {"train_loss": -26.64385414123535, "global_step": 435099, "epoch": 5242} {"train_loss": -26.7875919342041, "global_step": 435100, "epoch": 5242} {"train_loss": -26.708759307861328, "global_step": 435101, "epoch": 5242} {"train_loss": -26.77366065979004, "global_step": 435102, "epoch": 5242} {"train_loss": -26.417774200439453, "global_step": 435103, "epoch": 5242} {"train_loss": -26.69879150390625, "global_step": 435104, "epoch": 5242} {"train_loss": -27.075658798217773, "global_step": 435105, "epoch": 5242} {"train_loss": -26.86732292175293, "global_step": 435106, "epoch": 5242} {"train_loss": -26.5413818359375, "global_step": 435107, "epoch": 5242} {"train_loss": -27.01177406311035, "global_step": 435108, "epoch": 5242} {"train_loss": -26.84730339050293, "global_step": 435109, "epoch": 5242} {"train_loss": -26.747339248657227, "global_step": 435110, "epoch": 5242} {"train_loss": -26.80572509765625, "global_step": 435111, "epoch": 5242} {"train_loss": -26.857898712158203, "global_step": 435112, "epoch": 5242} {"train_loss": -26.786848068237305, "global_step": 435113, "epoch": 5242} {"train_loss": -27.0983943939209, "global_step": 435114, "epoch": 5242} {"train_loss": -26.801044464111328, "global_step": 435115, "epoch": 5242} {"train_loss": -27.081838607788086, "global_step": 435116, "epoch": 5242} {"train_loss": -26.92243003845215, "global_step": 435117, "epoch": 5242} {"train_loss": -26.697021484375, "global_step": 435118, "epoch": 5242} {"train_loss": -26.9074764251709, "global_step": 435119, "epoch": 5242} {"train_loss": -26.95746421813965, "global_step": 435120, "epoch": 5242} {"train_loss": -26.857751846313477, "global_step": 435121, "epoch": 5242} {"train_loss": -26.96516227722168, "global_step": 435122, "epoch": 5242} {"train_loss": -27.134445190429688, "global_step": 435123, "epoch": 5242} {"train_loss": -26.672657012939453, "global_step": 435124, "epoch": 5242} {"train_loss": -27.18531608581543, "global_step": 435125, "epoch": 5242} {"train_loss": -27.270849227905273, "global_step": 435126, "epoch": 5242} {"train_loss": -26.992467880249023, "global_step": 435127, "epoch": 5242} {"train_loss": -26.928424835205078, "global_step": 435128, "epoch": 5242} {"train_loss": -26.768970489501953, "global_step": 435129, "epoch": 5242} {"train_loss": -26.9953670501709, "global_step": 435130, "epoch": 5242} {"train_loss": -27.14853858947754, "global_step": 435131, "epoch": 5242} {"train_loss": -26.769922256469727, "global_step": 435132, "epoch": 5242} {"train_loss": -27.2769832611084, "global_step": 435133, "epoch": 5242} {"train_loss": -27.4326171875, "global_step": 435134, "epoch": 5242} {"train_loss": -26.803558349609375, "global_step": 435135, "epoch": 5242} {"train_loss": -26.433197021484375, "global_step": 435136, "epoch": 5242} {"train_loss": -26.48874282836914, "global_step": 435137, "epoch": 5242} {"train_loss": -26.746036529541016, "global_step": 435138, "epoch": 5242} {"train_loss": -27.334014892578125, "global_step": 435139, "epoch": 5242} {"train_loss": -26.774677276611328, "global_step": 435140, "epoch": 5242} {"train_loss": -26.67803382873535, "global_step": 435141, "epoch": 5242} {"train_loss": -26.820560455322266, "global_step": 435142, "epoch": 5242} {"train_loss": -26.961023330688477, "global_step": 435143, "epoch": 5242} {"train_loss": -26.828369140625, "global_step": 435144, "epoch": 5242} {"train_loss": -26.630273818969727, "global_step": 435145, "epoch": 5242} {"train_loss": -26.636890411376953, "global_step": 435146, "epoch": 5242} {"train_loss": -26.70729637145996, "global_step": 435147, "epoch": 5242} {"train_loss": -27.022052764892578, "global_step": 435148, "epoch": 5242} {"train_loss": -26.851810455322266, "global_step": 435149, "epoch": 5242} {"train_loss": -27.077091217041016, "global_step": 435150, "epoch": 5242} {"train_loss": -26.492938995361328, "global_step": 435151, "epoch": 5242} {"train_loss": -26.6065731048584, "global_step": 435152, "epoch": 5242} {"train_loss": -26.770465850830078, "global_step": 435153, "epoch": 5242} {"train_loss": -27.13776969909668, "global_step": 435154, "epoch": 5242} {"train_loss": -26.696826934814453, "global_step": 435155, "epoch": 5242} {"train_loss": -27.12959098815918, "global_step": 435156, "epoch": 5242} {"train_loss": -27.047876358032227, "global_step": 435157, "epoch": 5242} {"train_loss": -26.874069213867188, "global_step": 435158, "epoch": 5242} {"train_loss": -26.94098472595215, "global_step": 435159, "epoch": 5242} {"train_loss": -27.018421173095703, "global_step": 435160, "epoch": 5242} {"train_loss": -26.572162628173828, "global_step": 435161, "epoch": 5242} {"train_loss": -27.07207679748535, "global_step": 435162, "epoch": 5242} {"train_loss": -27.144269943237305, "global_step": 435163, "epoch": 5242} {"train_loss": -27.00750160217285, "global_step": 435164, "epoch": 5242} {"train_loss": -27.09394645690918, "global_step": 435165, "epoch": 5242} {"train_loss": -27.106525421142578, "global_step": 435166, "epoch": 5242} {"train_loss": -26.84990882873535, "global_step": 435167, "epoch": 5242} {"train_loss": -26.821095110422156, "global_step": 435168, "epoch": 5242, "val_loss": 6545855.0} {"train_loss": -26.171234130859375, "global_step": 435169, "epoch": 5243} {"train_loss": -25.884140014648438, "global_step": 435170, "epoch": 5243} {"train_loss": -26.63639259338379, "global_step": 435171, "epoch": 5243} {"train_loss": -26.99814224243164, "global_step": 435172, "epoch": 5243} {"train_loss": -26.23583984375, "global_step": 435173, "epoch": 5243} {"train_loss": -26.55365562438965, "global_step": 435174, "epoch": 5243} {"train_loss": -26.23445701599121, "global_step": 435175, "epoch": 5243} {"train_loss": -25.641712188720703, "global_step": 435176, "epoch": 5243} {"train_loss": -26.232778549194336, "global_step": 435177, "epoch": 5243} {"train_loss": -26.453123092651367, "global_step": 435178, "epoch": 5243} {"train_loss": -26.361127853393555, "global_step": 435179, "epoch": 5243} {"train_loss": -26.78055191040039, "global_step": 435180, "epoch": 5243} {"train_loss": -26.83930778503418, "global_step": 435181, "epoch": 5243} {"train_loss": -26.493213653564453, "global_step": 435182, "epoch": 5243} {"train_loss": -26.872879028320312, "global_step": 435183, "epoch": 5243} {"train_loss": -26.857868194580078, "global_step": 435184, "epoch": 5243} {"train_loss": -26.458295822143555, "global_step": 435185, "epoch": 5243} {"train_loss": -26.938385009765625, "global_step": 435186, "epoch": 5243} {"train_loss": -26.540790557861328, "global_step": 435187, "epoch": 5243} {"train_loss": -26.655988693237305, "global_step": 435188, "epoch": 5243} {"train_loss": -26.51222038269043, "global_step": 435189, "epoch": 5243} {"train_loss": -26.451171875, "global_step": 435190, "epoch": 5243} {"train_loss": -26.311044692993164, "global_step": 435191, "epoch": 5243} {"train_loss": -26.885766983032227, "global_step": 435192, "epoch": 5243} {"train_loss": -26.670780181884766, "global_step": 435193, "epoch": 5243} {"train_loss": -26.726638793945312, "global_step": 435194, "epoch": 5243} {"train_loss": -26.886611938476562, "global_step": 435195, "epoch": 5243} {"train_loss": -26.786712646484375, "global_step": 435196, "epoch": 5243} {"train_loss": -27.196624755859375, "global_step": 435197, "epoch": 5243} {"train_loss": -26.957748413085938, "global_step": 435198, "epoch": 5243} {"train_loss": -27.196401596069336, "global_step": 435199, "epoch": 5243} {"train_loss": -27.264799118041992, "global_step": 435200, "epoch": 5243} {"train_loss": -26.679126739501953, "global_step": 435201, "epoch": 5243} {"train_loss": -26.96673011779785, "global_step": 435202, "epoch": 5243} {"train_loss": -26.875507354736328, "global_step": 435203, "epoch": 5243} {"train_loss": -26.910242080688477, "global_step": 435204, "epoch": 5243} {"train_loss": -26.99591064453125, "global_step": 435205, "epoch": 5243} {"train_loss": -27.021575927734375, "global_step": 435206, "epoch": 5243} {"train_loss": -27.143396377563477, "global_step": 435207, "epoch": 5243} {"train_loss": -27.110036849975586, "global_step": 435208, "epoch": 5243} {"train_loss": -27.192615509033203, "global_step": 435209, "epoch": 5243} {"train_loss": -26.905933380126953, "global_step": 435210, "epoch": 5243} {"train_loss": -26.829071044921875, "global_step": 435211, "epoch": 5243} {"train_loss": -26.809772491455078, "global_step": 435212, "epoch": 5243} {"train_loss": -27.044950485229492, "global_step": 435213, "epoch": 5243} {"train_loss": -27.30792808532715, "global_step": 435214, "epoch": 5243} {"train_loss": -26.74409294128418, "global_step": 435215, "epoch": 5243} {"train_loss": -26.634418487548828, "global_step": 435216, "epoch": 5243} {"train_loss": -26.466516494750977, "global_step": 435217, "epoch": 5243} {"train_loss": -26.61246681213379, "global_step": 435218, "epoch": 5243} {"train_loss": -26.974584579467773, "global_step": 435219, "epoch": 5243} {"train_loss": -27.119293212890625, "global_step": 435220, "epoch": 5243} {"train_loss": -26.614450454711914, "global_step": 435221, "epoch": 5243} {"train_loss": -26.96783447265625, "global_step": 435222, "epoch": 5243} {"train_loss": -26.618925094604492, "global_step": 435223, "epoch": 5243} {"train_loss": -26.794055938720703, "global_step": 435224, "epoch": 5243} {"train_loss": -26.63638687133789, "global_step": 435225, "epoch": 5243} {"train_loss": -26.862661361694336, "global_step": 435226, "epoch": 5243} {"train_loss": -26.841588973999023, "global_step": 435227, "epoch": 5243} {"train_loss": -26.6428279876709, "global_step": 435228, "epoch": 5243} {"train_loss": -27.04961585998535, "global_step": 435229, "epoch": 5243} {"train_loss": -26.256460189819336, "global_step": 435230, "epoch": 5243} {"train_loss": -26.635330200195312, "global_step": 435231, "epoch": 5243} {"train_loss": -26.363210678100586, "global_step": 435232, "epoch": 5243} {"train_loss": -26.8418025970459, "global_step": 435233, "epoch": 5243} {"train_loss": -26.819461822509766, "global_step": 435234, "epoch": 5243} {"train_loss": -26.986730575561523, "global_step": 435235, "epoch": 5243} {"train_loss": -26.571069717407227, "global_step": 435236, "epoch": 5243} {"train_loss": -26.764623641967773, "global_step": 435237, "epoch": 5243} {"train_loss": -26.656951904296875, "global_step": 435238, "epoch": 5243} {"train_loss": -27.167774200439453, "global_step": 435239, "epoch": 5243} {"train_loss": -27.04398536682129, "global_step": 435240, "epoch": 5243} {"train_loss": -26.88692283630371, "global_step": 435241, "epoch": 5243} {"train_loss": -27.2021427154541, "global_step": 435242, "epoch": 5243} {"train_loss": -26.4890079498291, "global_step": 435243, "epoch": 5243} {"train_loss": -27.020832061767578, "global_step": 435244, "epoch": 5243} {"train_loss": -26.858722686767578, "global_step": 435245, "epoch": 5243} {"train_loss": -26.57065773010254, "global_step": 435246, "epoch": 5243} {"train_loss": -26.885669708251953, "global_step": 435247, "epoch": 5243} {"train_loss": -27.49493980407715, "global_step": 435248, "epoch": 5243} {"train_loss": -26.8260440826416, "global_step": 435249, "epoch": 5243} {"train_loss": -26.930923461914062, "global_step": 435250, "epoch": 5243} {"train_loss": -26.774208528449737, "global_step": 435251, "epoch": 5243, "val_loss": 6579084.0} {"train_loss": -26.710336685180664, "global_step": 435252, "epoch": 5244} {"train_loss": -26.339990615844727, "global_step": 435253, "epoch": 5244} {"train_loss": -26.585235595703125, "global_step": 435254, "epoch": 5244} {"train_loss": -26.902746200561523, "global_step": 435255, "epoch": 5244} {"train_loss": -26.882776260375977, "global_step": 435256, "epoch": 5244} {"train_loss": -26.828332901000977, "global_step": 435257, "epoch": 5244} {"train_loss": -26.98305320739746, "global_step": 435258, "epoch": 5244} {"train_loss": -26.68610954284668, "global_step": 435259, "epoch": 5244} {"train_loss": -26.550012588500977, "global_step": 435260, "epoch": 5244} {"train_loss": -26.696943283081055, "global_step": 435261, "epoch": 5244} {"train_loss": -26.859622955322266, "global_step": 435262, "epoch": 5244} {"train_loss": -27.104543685913086, "global_step": 435263, "epoch": 5244} {"train_loss": -26.75616455078125, "global_step": 435264, "epoch": 5244} {"train_loss": -26.402297973632812, "global_step": 435265, "epoch": 5244} {"train_loss": -26.06159782409668, "global_step": 435266, "epoch": 5244} {"train_loss": -26.416614532470703, "global_step": 435267, "epoch": 5244} {"train_loss": -26.67424964904785, "global_step": 435268, "epoch": 5244} {"train_loss": -26.8969783782959, "global_step": 435269, "epoch": 5244} {"train_loss": -26.876571655273438, "global_step": 435270, "epoch": 5244} {"train_loss": -26.695953369140625, "global_step": 435271, "epoch": 5244} {"train_loss": -26.709930419921875, "global_step": 435272, "epoch": 5244} {"train_loss": -26.90976905822754, "global_step": 435273, "epoch": 5244} {"train_loss": -26.85638427734375, "global_step": 435274, "epoch": 5244} {"train_loss": -26.828413009643555, "global_step": 435275, "epoch": 5244} {"train_loss": -26.999286651611328, "global_step": 435276, "epoch": 5244} {"train_loss": -26.76202392578125, "global_step": 435277, "epoch": 5244} {"train_loss": -26.862516403198242, "global_step": 435278, "epoch": 5244} {"train_loss": -26.641035079956055, "global_step": 435279, "epoch": 5244} {"train_loss": -27.108261108398438, "global_step": 435280, "epoch": 5244} {"train_loss": -26.714618682861328, "global_step": 435281, "epoch": 5244} {"train_loss": -26.826847076416016, "global_step": 435282, "epoch": 5244} {"train_loss": -27.018957138061523, "global_step": 435283, "epoch": 5244} {"train_loss": -27.154081344604492, "global_step": 435284, "epoch": 5244} {"train_loss": -27.344135284423828, "global_step": 435285, "epoch": 5244} {"train_loss": -27.241376876831055, "global_step": 435286, "epoch": 5244} {"train_loss": -27.143476486206055, "global_step": 435287, "epoch": 5244} {"train_loss": -27.03143310546875, "global_step": 435288, "epoch": 5244} {"train_loss": -26.98565101623535, "global_step": 435289, "epoch": 5244} {"train_loss": -26.943592071533203, "global_step": 435290, "epoch": 5244} {"train_loss": -27.003198623657227, "global_step": 435291, "epoch": 5244} {"train_loss": -26.98123550415039, "global_step": 435292, "epoch": 5244} {"train_loss": -27.319162368774414, "global_step": 435293, "epoch": 5244} {"train_loss": -26.9397029876709, "global_step": 435294, "epoch": 5244} {"train_loss": -27.45697021484375, "global_step": 435295, "epoch": 5244} {"train_loss": -27.22804069519043, "global_step": 435296, "epoch": 5244} {"train_loss": -27.303373336791992, "global_step": 435297, "epoch": 5244} {"train_loss": -27.05984878540039, "global_step": 435298, "epoch": 5244} {"train_loss": -27.002838134765625, "global_step": 435299, "epoch": 5244} {"train_loss": -26.510602951049805, "global_step": 435300, "epoch": 5244} {"train_loss": -26.954742431640625, "global_step": 435301, "epoch": 5244} {"train_loss": -27.226160049438477, "global_step": 435302, "epoch": 5244} {"train_loss": -26.851099014282227, "global_step": 435303, "epoch": 5244} {"train_loss": -26.788129806518555, "global_step": 435304, "epoch": 5244} {"train_loss": -26.719318389892578, "global_step": 435305, "epoch": 5244} {"train_loss": -27.12961196899414, "global_step": 435306, "epoch": 5244} {"train_loss": -27.013227462768555, "global_step": 435307, "epoch": 5244} {"train_loss": -26.742862701416016, "global_step": 435308, "epoch": 5244} {"train_loss": -27.041711807250977, "global_step": 435309, "epoch": 5244} {"train_loss": -26.980947494506836, "global_step": 435310, "epoch": 5244} {"train_loss": -26.834531784057617, "global_step": 435311, "epoch": 5244} {"train_loss": -26.39166259765625, "global_step": 435312, "epoch": 5244} {"train_loss": -26.588153839111328, "global_step": 435313, "epoch": 5244} {"train_loss": -26.10516357421875, "global_step": 435314, "epoch": 5244} {"train_loss": -25.83407974243164, "global_step": 435315, "epoch": 5244} {"train_loss": -26.810199737548828, "global_step": 435316, "epoch": 5244} {"train_loss": -26.503376007080078, "global_step": 435317, "epoch": 5244} {"train_loss": -26.4917049407959, "global_step": 435318, "epoch": 5244} {"train_loss": -26.726484298706055, "global_step": 435319, "epoch": 5244} {"train_loss": -26.646289825439453, "global_step": 435320, "epoch": 5244} {"train_loss": -26.72153663635254, "global_step": 435321, "epoch": 5244} {"train_loss": -26.63973045349121, "global_step": 435322, "epoch": 5244} {"train_loss": -26.85999870300293, "global_step": 435323, "epoch": 5244} {"train_loss": -26.94170570373535, "global_step": 435324, "epoch": 5244} {"train_loss": -26.81857681274414, "global_step": 435325, "epoch": 5244} {"train_loss": -26.68389320373535, "global_step": 435326, "epoch": 5244} {"train_loss": -26.64277458190918, "global_step": 435327, "epoch": 5244} {"train_loss": -26.80255699157715, "global_step": 435328, "epoch": 5244} {"train_loss": -26.98834800720215, "global_step": 435329, "epoch": 5244} {"train_loss": -26.7404842376709, "global_step": 435330, "epoch": 5244} {"train_loss": -27.087629318237305, "global_step": 435331, "epoch": 5244} {"train_loss": -26.46259880065918, "global_step": 435332, "epoch": 5244} {"train_loss": -27.327991485595703, "global_step": 435333, "epoch": 5244} {"train_loss": -26.832713046705866, "global_step": 435334, "epoch": 5244, "val_loss": 6658561.0} {"train_loss": -26.353057861328125, "global_step": 435335, "epoch": 5245} {"train_loss": -26.0181827545166, "global_step": 435336, "epoch": 5245} {"train_loss": -25.891067504882812, "global_step": 435337, "epoch": 5245} {"train_loss": -26.42757225036621, "global_step": 435338, "epoch": 5245} {"train_loss": -26.56135368347168, "global_step": 435339, "epoch": 5245} {"train_loss": -26.2346248626709, "global_step": 435340, "epoch": 5245} {"train_loss": -26.58612060546875, "global_step": 435341, "epoch": 5245} {"train_loss": -26.358600616455078, "global_step": 435342, "epoch": 5245} {"train_loss": -26.524642944335938, "global_step": 435343, "epoch": 5245} {"train_loss": -26.756147384643555, "global_step": 435344, "epoch": 5245} {"train_loss": -26.498559951782227, "global_step": 435345, "epoch": 5245} {"train_loss": -26.359445571899414, "global_step": 435346, "epoch": 5245} {"train_loss": -26.357873916625977, "global_step": 435347, "epoch": 5245} {"train_loss": -26.612751007080078, "global_step": 435348, "epoch": 5245} {"train_loss": -26.869184494018555, "global_step": 435349, "epoch": 5245} {"train_loss": -26.54597282409668, "global_step": 435350, "epoch": 5245} {"train_loss": -26.972137451171875, "global_step": 435351, "epoch": 5245} {"train_loss": -26.51519775390625, "global_step": 435352, "epoch": 5245} {"train_loss": -26.46932029724121, "global_step": 435353, "epoch": 5245} {"train_loss": -26.535720825195312, "global_step": 435354, "epoch": 5245} {"train_loss": -26.635822296142578, "global_step": 435355, "epoch": 5245} {"train_loss": -26.8602237701416, "global_step": 435356, "epoch": 5245} {"train_loss": -26.816308975219727, "global_step": 435357, "epoch": 5245} {"train_loss": -27.034626007080078, "global_step": 435358, "epoch": 5245} {"train_loss": -26.441162109375, "global_step": 435359, "epoch": 5245} {"train_loss": -27.23394775390625, "global_step": 435360, "epoch": 5245} {"train_loss": -26.0982723236084, "global_step": 435361, "epoch": 5245} {"train_loss": -26.664621353149414, "global_step": 435362, "epoch": 5245} {"train_loss": -26.612577438354492, "global_step": 435363, "epoch": 5245} {"train_loss": -26.842554092407227, "global_step": 435364, "epoch": 5245} {"train_loss": -26.93058204650879, "global_step": 435365, "epoch": 5245} {"train_loss": -27.13364601135254, "global_step": 435366, "epoch": 5245} {"train_loss": -26.632831573486328, "global_step": 435367, "epoch": 5245} {"train_loss": -27.151996612548828, "global_step": 435368, "epoch": 5245} {"train_loss": -26.71943473815918, "global_step": 435369, "epoch": 5245} {"train_loss": -26.718997955322266, "global_step": 435370, "epoch": 5245} {"train_loss": -26.9349365234375, "global_step": 435371, "epoch": 5245} {"train_loss": -26.630401611328125, "global_step": 435372, "epoch": 5245} {"train_loss": -26.850116729736328, "global_step": 435373, "epoch": 5245} {"train_loss": -27.27412223815918, "global_step": 435374, "epoch": 5245} {"train_loss": -26.643301010131836, "global_step": 435375, "epoch": 5245} {"train_loss": -27.042444229125977, "global_step": 435376, "epoch": 5245} {"train_loss": -27.00042724609375, "global_step": 435377, "epoch": 5245} {"train_loss": -26.850271224975586, "global_step": 435378, "epoch": 5245} {"train_loss": -26.977869033813477, "global_step": 435379, "epoch": 5245} {"train_loss": -26.940185546875, "global_step": 435380, "epoch": 5245} {"train_loss": -26.898502349853516, "global_step": 435381, "epoch": 5245} {"train_loss": -26.80950927734375, "global_step": 435382, "epoch": 5245} {"train_loss": -27.039112091064453, "global_step": 435383, "epoch": 5245} {"train_loss": -26.720565795898438, "global_step": 435384, "epoch": 5245} {"train_loss": -27.01380729675293, "global_step": 435385, "epoch": 5245} {"train_loss": -26.945478439331055, "global_step": 435386, "epoch": 5245} {"train_loss": -26.9927978515625, "global_step": 435387, "epoch": 5245} {"train_loss": -26.749143600463867, "global_step": 435388, "epoch": 5245} {"train_loss": -26.9097900390625, "global_step": 435389, "epoch": 5245} {"train_loss": -26.98870277404785, "global_step": 435390, "epoch": 5245} {"train_loss": -27.3548526763916, "global_step": 435391, "epoch": 5245} {"train_loss": -27.239532470703125, "global_step": 435392, "epoch": 5245} {"train_loss": -27.1553897857666, "global_step": 435393, "epoch": 5245} {"train_loss": -26.905303955078125, "global_step": 435394, "epoch": 5245} {"train_loss": -26.701282501220703, "global_step": 435395, "epoch": 5245} {"train_loss": -26.680286407470703, "global_step": 435396, "epoch": 5245} {"train_loss": -26.63787269592285, "global_step": 435397, "epoch": 5245} {"train_loss": -26.49338722229004, "global_step": 435398, "epoch": 5245} {"train_loss": -27.076940536499023, "global_step": 435399, "epoch": 5245} {"train_loss": -26.864660263061523, "global_step": 435400, "epoch": 5245} {"train_loss": -26.85542106628418, "global_step": 435401, "epoch": 5245} {"train_loss": -26.742435455322266, "global_step": 435402, "epoch": 5245} {"train_loss": -26.81915855407715, "global_step": 435403, "epoch": 5245} {"train_loss": -27.014942169189453, "global_step": 435404, "epoch": 5245} {"train_loss": -26.9033260345459, "global_step": 435405, "epoch": 5245} {"train_loss": -26.775922775268555, "global_step": 435406, "epoch": 5245} {"train_loss": -26.748136520385742, "global_step": 435407, "epoch": 5245} {"train_loss": -27.014698028564453, "global_step": 435408, "epoch": 5245} {"train_loss": -26.697126388549805, "global_step": 435409, "epoch": 5245} {"train_loss": -26.958255767822266, "global_step": 435410, "epoch": 5245} {"train_loss": -27.0333251953125, "global_step": 435411, "epoch": 5245} {"train_loss": -26.91529655456543, "global_step": 435412, "epoch": 5245} {"train_loss": -26.837848663330078, "global_step": 435413, "epoch": 5245} {"train_loss": -26.97467613220215, "global_step": 435414, "epoch": 5245} {"train_loss": -26.92972183227539, "global_step": 435415, "epoch": 5245} {"train_loss": -27.077917098999023, "global_step": 435416, "epoch": 5245} {"train_loss": -26.775726548160414, "global_step": 435417, "epoch": 5245, "val_loss": 6720742.0} {"train_loss": -26.4007625579834, "global_step": 435418, "epoch": 5246} {"train_loss": -26.75973892211914, "global_step": 435419, "epoch": 5246} {"train_loss": -26.324697494506836, "global_step": 435420, "epoch": 5246} {"train_loss": -27.017499923706055, "global_step": 435421, "epoch": 5246} {"train_loss": -27.018117904663086, "global_step": 435422, "epoch": 5246} {"train_loss": -26.619998931884766, "global_step": 435423, "epoch": 5246} {"train_loss": -26.722827911376953, "global_step": 435424, "epoch": 5246} {"train_loss": -26.8048038482666, "global_step": 435425, "epoch": 5246} {"train_loss": -27.004913330078125, "global_step": 435426, "epoch": 5246} {"train_loss": -27.313312530517578, "global_step": 435427, "epoch": 5246} {"train_loss": -27.019775390625, "global_step": 435428, "epoch": 5246} {"train_loss": -27.021753311157227, "global_step": 435429, "epoch": 5246} {"train_loss": -26.93219566345215, "global_step": 435430, "epoch": 5246} {"train_loss": -26.99126625061035, "global_step": 435431, "epoch": 5246} {"train_loss": -27.0175838470459, "global_step": 435432, "epoch": 5246} {"train_loss": -26.640905380249023, "global_step": 435433, "epoch": 5246} {"train_loss": -27.170093536376953, "global_step": 435434, "epoch": 5246} {"train_loss": -26.93406105041504, "global_step": 435435, "epoch": 5246} {"train_loss": -26.994571685791016, "global_step": 435436, "epoch": 5246} {"train_loss": -26.883365631103516, "global_step": 435437, "epoch": 5246} {"train_loss": -26.9636287689209, "global_step": 435438, "epoch": 5246} {"train_loss": -27.08688735961914, "global_step": 435439, "epoch": 5246} {"train_loss": -27.025848388671875, "global_step": 435440, "epoch": 5246} {"train_loss": -26.452253341674805, "global_step": 435441, "epoch": 5246} {"train_loss": -26.5476131439209, "global_step": 435442, "epoch": 5246} {"train_loss": -26.7862548828125, "global_step": 435443, "epoch": 5246} {"train_loss": -27.133535385131836, "global_step": 435444, "epoch": 5246} {"train_loss": -26.755441665649414, "global_step": 435445, "epoch": 5246} {"train_loss": -26.268604278564453, "global_step": 435446, "epoch": 5246} {"train_loss": -26.05816650390625, "global_step": 435447, "epoch": 5246} {"train_loss": -26.3283748626709, "global_step": 435448, "epoch": 5246} {"train_loss": -26.54804039001465, "global_step": 435449, "epoch": 5246} {"train_loss": -26.753284454345703, "global_step": 435450, "epoch": 5246} {"train_loss": -26.660837173461914, "global_step": 435451, "epoch": 5246} {"train_loss": -26.900476455688477, "global_step": 435452, "epoch": 5246} {"train_loss": -26.71784019470215, "global_step": 435453, "epoch": 5246} {"train_loss": -26.53421974182129, "global_step": 435454, "epoch": 5246} {"train_loss": -26.925230026245117, "global_step": 435455, "epoch": 5246} {"train_loss": -26.893163681030273, "global_step": 435456, "epoch": 5246} {"train_loss": -26.874664306640625, "global_step": 435457, "epoch": 5246} {"train_loss": -26.641387939453125, "global_step": 435458, "epoch": 5246} {"train_loss": -27.040990829467773, "global_step": 435459, "epoch": 5246} {"train_loss": -27.02374267578125, "global_step": 435460, "epoch": 5246} {"train_loss": -26.53059196472168, "global_step": 435461, "epoch": 5246} {"train_loss": -26.470685958862305, "global_step": 435462, "epoch": 5246} {"train_loss": -27.00355339050293, "global_step": 435463, "epoch": 5246} {"train_loss": -26.833173751831055, "global_step": 435464, "epoch": 5246} {"train_loss": -26.787683486938477, "global_step": 435465, "epoch": 5246} {"train_loss": -26.97833824157715, "global_step": 435466, "epoch": 5246} {"train_loss": -26.5738468170166, "global_step": 435467, "epoch": 5246} {"train_loss": -26.820493698120117, "global_step": 435468, "epoch": 5246} {"train_loss": -26.590429306030273, "global_step": 435469, "epoch": 5246} {"train_loss": -27.046161651611328, "global_step": 435470, "epoch": 5246} {"train_loss": -27.018264770507812, "global_step": 435471, "epoch": 5246} {"train_loss": -26.798358917236328, "global_step": 435472, "epoch": 5246} {"train_loss": -27.090118408203125, "global_step": 435473, "epoch": 5246} {"train_loss": -26.886255264282227, "global_step": 435474, "epoch": 5246} {"train_loss": -26.918746948242188, "global_step": 435475, "epoch": 5246} {"train_loss": -27.107873916625977, "global_step": 435476, "epoch": 5246} {"train_loss": -27.00852394104004, "global_step": 435477, "epoch": 5246} {"train_loss": -26.718536376953125, "global_step": 435478, "epoch": 5246} {"train_loss": -26.831586837768555, "global_step": 435479, "epoch": 5246} {"train_loss": -27.10016441345215, "global_step": 435480, "epoch": 5246} {"train_loss": -26.94980239868164, "global_step": 435481, "epoch": 5246} {"train_loss": -26.876117706298828, "global_step": 435482, "epoch": 5246} {"train_loss": -27.179412841796875, "global_step": 435483, "epoch": 5246} {"train_loss": -27.154356002807617, "global_step": 435484, "epoch": 5246} {"train_loss": -26.859088897705078, "global_step": 435485, "epoch": 5246} {"train_loss": -26.91743278503418, "global_step": 435486, "epoch": 5246} {"train_loss": -27.339370727539062, "global_step": 435487, "epoch": 5246} {"train_loss": -26.849994659423828, "global_step": 435488, "epoch": 5246} {"train_loss": -26.812620162963867, "global_step": 435489, "epoch": 5246} {"train_loss": -26.94272804260254, "global_step": 435490, "epoch": 5246} {"train_loss": -27.01630210876465, "global_step": 435491, "epoch": 5246} {"train_loss": -27.176733016967773, "global_step": 435492, "epoch": 5246} {"train_loss": -26.756290435791016, "global_step": 435493, "epoch": 5246} {"train_loss": -27.03407096862793, "global_step": 435494, "epoch": 5246} {"train_loss": -26.87847900390625, "global_step": 435495, "epoch": 5246} {"train_loss": -26.391660690307617, "global_step": 435496, "epoch": 5246} {"train_loss": -26.630054473876953, "global_step": 435497, "epoch": 5246} {"train_loss": -26.736587524414062, "global_step": 435498, "epoch": 5246} {"train_loss": -27.0496883392334, "global_step": 435499, "epoch": 5246} {"train_loss": -26.8522295894393, "global_step": 435500, "epoch": 5246, "val_loss": 6691865.0} {"train_loss": -24.57246208190918, "global_step": 435501, "epoch": 5247} {"train_loss": -23.469961166381836, "global_step": 435502, "epoch": 5247} {"train_loss": -24.802860260009766, "global_step": 435503, "epoch": 5247} {"train_loss": -25.355546951293945, "global_step": 435504, "epoch": 5247} {"train_loss": -24.874008178710938, "global_step": 435505, "epoch": 5247} {"train_loss": -25.69985008239746, "global_step": 435506, "epoch": 5247} {"train_loss": -25.516454696655273, "global_step": 435507, "epoch": 5247} {"train_loss": -25.825937271118164, "global_step": 435508, "epoch": 5247} {"train_loss": -25.243539810180664, "global_step": 435509, "epoch": 5247} {"train_loss": -26.051727294921875, "global_step": 435510, "epoch": 5247} {"train_loss": -25.77564811706543, "global_step": 435511, "epoch": 5247} {"train_loss": -26.0616397857666, "global_step": 435512, "epoch": 5247} {"train_loss": -25.896865844726562, "global_step": 435513, "epoch": 5247} {"train_loss": -25.922128677368164, "global_step": 435514, "epoch": 5247} {"train_loss": -25.781036376953125, "global_step": 435515, "epoch": 5247} {"train_loss": -26.076618194580078, "global_step": 435516, "epoch": 5247} {"train_loss": -26.129858016967773, "global_step": 435517, "epoch": 5247} {"train_loss": -25.995880126953125, "global_step": 435518, "epoch": 5247} {"train_loss": -25.85861587524414, "global_step": 435519, "epoch": 5247} {"train_loss": -26.079214096069336, "global_step": 435520, "epoch": 5247} {"train_loss": -25.92621421813965, "global_step": 435521, "epoch": 5247} {"train_loss": -26.355993270874023, "global_step": 435522, "epoch": 5247} {"train_loss": -26.192142486572266, "global_step": 435523, "epoch": 5247} {"train_loss": -26.322589874267578, "global_step": 435524, "epoch": 5247} {"train_loss": -26.208038330078125, "global_step": 435525, "epoch": 5247} {"train_loss": -26.146499633789062, "global_step": 435526, "epoch": 5247} {"train_loss": -26.329557418823242, "global_step": 435527, "epoch": 5247} {"train_loss": -26.16499137878418, "global_step": 435528, "epoch": 5247} {"train_loss": -26.26637077331543, "global_step": 435529, "epoch": 5247} {"train_loss": -26.246932983398438, "global_step": 435530, "epoch": 5247} {"train_loss": -26.438262939453125, "global_step": 435531, "epoch": 5247} {"train_loss": -26.45615005493164, "global_step": 435532, "epoch": 5247} {"train_loss": -26.62615966796875, "global_step": 435533, "epoch": 5247} {"train_loss": -26.392654418945312, "global_step": 435534, "epoch": 5247} {"train_loss": -26.659494400024414, "global_step": 435535, "epoch": 5247} {"train_loss": -26.941181182861328, "global_step": 435536, "epoch": 5247} {"train_loss": -26.869260787963867, "global_step": 435537, "epoch": 5247} {"train_loss": -26.586959838867188, "global_step": 435538, "epoch": 5247} {"train_loss": -26.511707305908203, "global_step": 435539, "epoch": 5247} {"train_loss": -26.603885650634766, "global_step": 435540, "epoch": 5247} {"train_loss": -26.5214900970459, "global_step": 435541, "epoch": 5247} {"train_loss": -26.646753311157227, "global_step": 435542, "epoch": 5247} {"train_loss": -26.894147872924805, "global_step": 435543, "epoch": 5247} {"train_loss": -26.55828285217285, "global_step": 435544, "epoch": 5247} {"train_loss": -26.915075302124023, "global_step": 435545, "epoch": 5247} {"train_loss": -26.64533042907715, "global_step": 435546, "epoch": 5247} {"train_loss": -27.039655685424805, "global_step": 435547, "epoch": 5247} {"train_loss": -27.111347198486328, "global_step": 435548, "epoch": 5247} {"train_loss": -26.936084747314453, "global_step": 435549, "epoch": 5247} {"train_loss": -26.63197135925293, "global_step": 435550, "epoch": 5247} {"train_loss": -26.921674728393555, "global_step": 435551, "epoch": 5247} {"train_loss": -26.64149284362793, "global_step": 435552, "epoch": 5247} {"train_loss": -26.9920654296875, "global_step": 435553, "epoch": 5247} {"train_loss": -26.994220733642578, "global_step": 435554, "epoch": 5247} {"train_loss": -27.223358154296875, "global_step": 435555, "epoch": 5247} {"train_loss": -26.9069881439209, "global_step": 435556, "epoch": 5247} {"train_loss": -26.899396896362305, "global_step": 435557, "epoch": 5247} {"train_loss": -26.787839889526367, "global_step": 435558, "epoch": 5247} {"train_loss": -27.578397750854492, "global_step": 435559, "epoch": 5247} {"train_loss": -27.154638290405273, "global_step": 435560, "epoch": 5247} {"train_loss": -27.309890747070312, "global_step": 435561, "epoch": 5247} {"train_loss": -27.159835815429688, "global_step": 435562, "epoch": 5247} {"train_loss": -26.9625301361084, "global_step": 435563, "epoch": 5247} {"train_loss": -27.10502052307129, "global_step": 435564, "epoch": 5247} {"train_loss": -27.228748321533203, "global_step": 435565, "epoch": 5247} {"train_loss": -27.174392700195312, "global_step": 435566, "epoch": 5247} {"train_loss": -27.283161163330078, "global_step": 435567, "epoch": 5247} {"train_loss": -26.918935775756836, "global_step": 435568, "epoch": 5247} {"train_loss": -26.856576919555664, "global_step": 435569, "epoch": 5247} {"train_loss": -27.137603759765625, "global_step": 435570, "epoch": 5247} {"train_loss": -27.321399688720703, "global_step": 435571, "epoch": 5247} {"train_loss": -27.1390438079834, "global_step": 435572, "epoch": 5247} {"train_loss": -27.224206924438477, "global_step": 435573, "epoch": 5247} {"train_loss": -26.77337074279785, "global_step": 435574, "epoch": 5247} {"train_loss": -26.438140869140625, "global_step": 435575, "epoch": 5247} {"train_loss": -26.128555297851562, "global_step": 435576, "epoch": 5247} {"train_loss": -25.41693687438965, "global_step": 435577, "epoch": 5247} {"train_loss": -25.708600997924805, "global_step": 435578, "epoch": 5247} {"train_loss": -27.042388916015625, "global_step": 435579, "epoch": 5247} {"train_loss": -26.850818634033203, "global_step": 435580, "epoch": 5247} {"train_loss": -26.38697624206543, "global_step": 435581, "epoch": 5247} {"train_loss": -26.780736923217773, "global_step": 435582, "epoch": 5247} {"train_loss": -26.446397023028638, "global_step": 435583, "epoch": 5247, "val_loss": 6759497.0} {"train_loss": -26.399627685546875, "global_step": 435584, "epoch": 5248} {"train_loss": -25.73090934753418, "global_step": 435585, "epoch": 5248} {"train_loss": -26.080062866210938, "global_step": 435586, "epoch": 5248} {"train_loss": -26.348554611206055, "global_step": 435587, "epoch": 5248} {"train_loss": -26.04498863220215, "global_step": 435588, "epoch": 5248} {"train_loss": -26.169830322265625, "global_step": 435589, "epoch": 5248} {"train_loss": -26.20355224609375, "global_step": 435590, "epoch": 5248} {"train_loss": -25.8409366607666, "global_step": 435591, "epoch": 5248} {"train_loss": -26.361661911010742, "global_step": 435592, "epoch": 5248} {"train_loss": -26.57246971130371, "global_step": 435593, "epoch": 5248} {"train_loss": -26.17643165588379, "global_step": 435594, "epoch": 5248} {"train_loss": -26.4508113861084, "global_step": 435595, "epoch": 5248} {"train_loss": -26.413074493408203, "global_step": 435596, "epoch": 5248} {"train_loss": -25.78006362915039, "global_step": 435597, "epoch": 5248} {"train_loss": -26.5257511138916, "global_step": 435598, "epoch": 5248} {"train_loss": -26.14943504333496, "global_step": 435599, "epoch": 5248} {"train_loss": -26.35249900817871, "global_step": 435600, "epoch": 5248} {"train_loss": -26.45476722717285, "global_step": 435601, "epoch": 5248} {"train_loss": -26.184940338134766, "global_step": 435602, "epoch": 5248} {"train_loss": -26.65876579284668, "global_step": 435603, "epoch": 5248} {"train_loss": -26.502735137939453, "global_step": 435604, "epoch": 5248} {"train_loss": -26.36151123046875, "global_step": 435605, "epoch": 5248} {"train_loss": -26.661985397338867, "global_step": 435606, "epoch": 5248} {"train_loss": -26.571088790893555, "global_step": 435607, "epoch": 5248} {"train_loss": -26.593915939331055, "global_step": 435608, "epoch": 5248} {"train_loss": -27.091094970703125, "global_step": 435609, "epoch": 5248} {"train_loss": -26.669462203979492, "global_step": 435610, "epoch": 5248} {"train_loss": -26.927820205688477, "global_step": 435611, "epoch": 5248} {"train_loss": -27.163297653198242, "global_step": 435612, "epoch": 5248} {"train_loss": -26.71307373046875, "global_step": 435613, "epoch": 5248} {"train_loss": -26.79768943786621, "global_step": 435614, "epoch": 5248} {"train_loss": -26.900684356689453, "global_step": 435615, "epoch": 5248} {"train_loss": -26.796295166015625, "global_step": 435616, "epoch": 5248} {"train_loss": -26.990863800048828, "global_step": 435617, "epoch": 5248} {"train_loss": -26.6447696685791, "global_step": 435618, "epoch": 5248} {"train_loss": -26.932382583618164, "global_step": 435619, "epoch": 5248} {"train_loss": -26.65631103515625, "global_step": 435620, "epoch": 5248} {"train_loss": -26.85947036743164, "global_step": 435621, "epoch": 5248} {"train_loss": -27.305906295776367, "global_step": 435622, "epoch": 5248} {"train_loss": -27.103986740112305, "global_step": 435623, "epoch": 5248} {"train_loss": -26.905242919921875, "global_step": 435624, "epoch": 5248} {"train_loss": -27.115341186523438, "global_step": 435625, "epoch": 5248} {"train_loss": -26.948596954345703, "global_step": 435626, "epoch": 5248} {"train_loss": -27.038318634033203, "global_step": 435627, "epoch": 5248} {"train_loss": -27.15321922302246, "global_step": 435628, "epoch": 5248} {"train_loss": -26.99540138244629, "global_step": 435629, "epoch": 5248} {"train_loss": -26.650806427001953, "global_step": 435630, "epoch": 5248} {"train_loss": -26.7586727142334, "global_step": 435631, "epoch": 5248} {"train_loss": -26.756427764892578, "global_step": 435632, "epoch": 5248} {"train_loss": -26.839405059814453, "global_step": 435633, "epoch": 5248} {"train_loss": -26.8267879486084, "global_step": 435634, "epoch": 5248} {"train_loss": -26.818052291870117, "global_step": 435635, "epoch": 5248} {"train_loss": -27.21185874938965, "global_step": 435636, "epoch": 5248} {"train_loss": -26.734960556030273, "global_step": 435637, "epoch": 5248} {"train_loss": -26.8645076751709, "global_step": 435638, "epoch": 5248} {"train_loss": -26.880767822265625, "global_step": 435639, "epoch": 5248} {"train_loss": -26.999109268188477, "global_step": 435640, "epoch": 5248} {"train_loss": -27.42511558532715, "global_step": 435641, "epoch": 5248} {"train_loss": -26.66912269592285, "global_step": 435642, "epoch": 5248} {"train_loss": -26.853967666625977, "global_step": 435643, "epoch": 5248} {"train_loss": -27.0365047454834, "global_step": 435644, "epoch": 5248} {"train_loss": -27.012006759643555, "global_step": 435645, "epoch": 5248} {"train_loss": -27.126569747924805, "global_step": 435646, "epoch": 5248} {"train_loss": -26.851612091064453, "global_step": 435647, "epoch": 5248} {"train_loss": -27.04277992248535, "global_step": 435648, "epoch": 5248} {"train_loss": -26.938953399658203, "global_step": 435649, "epoch": 5248} {"train_loss": -26.89286231994629, "global_step": 435650, "epoch": 5248} {"train_loss": -27.007526397705078, "global_step": 435651, "epoch": 5248} {"train_loss": -27.332815170288086, "global_step": 435652, "epoch": 5248} {"train_loss": -26.85169792175293, "global_step": 435653, "epoch": 5248} {"train_loss": -27.31537437438965, "global_step": 435654, "epoch": 5248} {"train_loss": -26.743072509765625, "global_step": 435655, "epoch": 5248} {"train_loss": -26.816883087158203, "global_step": 435656, "epoch": 5248} {"train_loss": -27.072668075561523, "global_step": 435657, "epoch": 5248} {"train_loss": -26.80873680114746, "global_step": 435658, "epoch": 5248} {"train_loss": -26.84998893737793, "global_step": 435659, "epoch": 5248} {"train_loss": -27.13836097717285, "global_step": 435660, "epoch": 5248} {"train_loss": -26.736677169799805, "global_step": 435661, "epoch": 5248} {"train_loss": -27.042150497436523, "global_step": 435662, "epoch": 5248} {"train_loss": -27.024911880493164, "global_step": 435663, "epoch": 5248} {"train_loss": -27.123769760131836, "global_step": 435664, "epoch": 5248} {"train_loss": -27.083328247070312, "global_step": 435665, "epoch": 5248} {"train_loss": -26.74024876054511, "global_step": 435666, "epoch": 5248, "val_loss": 6698843.0} {"train_loss": -25.79204750061035, "global_step": 435667, "epoch": 5249} {"train_loss": -23.766950607299805, "global_step": 435668, "epoch": 5249} {"train_loss": -23.999122619628906, "global_step": 435669, "epoch": 5249} {"train_loss": -26.632919311523438, "global_step": 435670, "epoch": 5249} {"train_loss": -25.243005752563477, "global_step": 435671, "epoch": 5249} {"train_loss": -25.697553634643555, "global_step": 435672, "epoch": 5249} {"train_loss": -26.111270904541016, "global_step": 435673, "epoch": 5249} {"train_loss": -26.351003646850586, "global_step": 435674, "epoch": 5249} {"train_loss": -25.94453239440918, "global_step": 435675, "epoch": 5249} {"train_loss": -26.01112937927246, "global_step": 435676, "epoch": 5249} {"train_loss": -26.598114013671875, "global_step": 435677, "epoch": 5249} {"train_loss": -25.972829818725586, "global_step": 435678, "epoch": 5249} {"train_loss": -26.183399200439453, "global_step": 435679, "epoch": 5249} {"train_loss": -25.84156608581543, "global_step": 435680, "epoch": 5249} {"train_loss": -25.86261558532715, "global_step": 435681, "epoch": 5249} {"train_loss": -26.6566104888916, "global_step": 435682, "epoch": 5249} {"train_loss": -25.978055953979492, "global_step": 435683, "epoch": 5249} {"train_loss": -26.88311195373535, "global_step": 435684, "epoch": 5249} {"train_loss": -26.54127311706543, "global_step": 435685, "epoch": 5249} {"train_loss": -26.21793556213379, "global_step": 435686, "epoch": 5249} {"train_loss": -26.3875675201416, "global_step": 435687, "epoch": 5249} {"train_loss": -26.363300323486328, "global_step": 435688, "epoch": 5249} {"train_loss": -26.68562889099121, "global_step": 435689, "epoch": 5249} {"train_loss": -26.402435302734375, "global_step": 435690, "epoch": 5249} {"train_loss": -26.70624351501465, "global_step": 435691, "epoch": 5249} {"train_loss": -26.945087432861328, "global_step": 435692, "epoch": 5249} {"train_loss": -26.61572265625, "global_step": 435693, "epoch": 5249} {"train_loss": -27.017187118530273, "global_step": 435694, "epoch": 5249} {"train_loss": -27.03786277770996, "global_step": 435695, "epoch": 5249} {"train_loss": -26.340421676635742, "global_step": 435696, "epoch": 5249} {"train_loss": -27.26138687133789, "global_step": 435697, "epoch": 5249} {"train_loss": -26.612531661987305, "global_step": 435698, "epoch": 5249} {"train_loss": -26.506338119506836, "global_step": 435699, "epoch": 5249} {"train_loss": -26.915021896362305, "global_step": 435700, "epoch": 5249} {"train_loss": -26.758508682250977, "global_step": 435701, "epoch": 5249} {"train_loss": -26.90824317932129, "global_step": 435702, "epoch": 5249} {"train_loss": -26.895971298217773, "global_step": 435703, "epoch": 5249} {"train_loss": -26.619415283203125, "global_step": 435704, "epoch": 5249} {"train_loss": -26.805402755737305, "global_step": 435705, "epoch": 5249} {"train_loss": -26.558490753173828, "global_step": 435706, "epoch": 5249} {"train_loss": -26.899078369140625, "global_step": 435707, "epoch": 5249} {"train_loss": -26.866132736206055, "global_step": 435708, "epoch": 5249} {"train_loss": -26.88995361328125, "global_step": 435709, "epoch": 5249} {"train_loss": -27.155200958251953, "global_step": 435710, "epoch": 5249} {"train_loss": -26.976184844970703, "global_step": 435711, "epoch": 5249} {"train_loss": -26.825607299804688, "global_step": 435712, "epoch": 5249} {"train_loss": -26.745798110961914, "global_step": 435713, "epoch": 5249} {"train_loss": -27.13495445251465, "global_step": 435714, "epoch": 5249} {"train_loss": -27.193883895874023, "global_step": 435715, "epoch": 5249} {"train_loss": -26.942230224609375, "global_step": 435716, "epoch": 5249} {"train_loss": -27.04890251159668, "global_step": 435717, "epoch": 5249} {"train_loss": -26.885156631469727, "global_step": 435718, "epoch": 5249} {"train_loss": -26.775583267211914, "global_step": 435719, "epoch": 5249} {"train_loss": -27.074939727783203, "global_step": 435720, "epoch": 5249} {"train_loss": -27.396108627319336, "global_step": 435721, "epoch": 5249} {"train_loss": -27.050397872924805, "global_step": 435722, "epoch": 5249} {"train_loss": -26.7056827545166, "global_step": 435723, "epoch": 5249} {"train_loss": -27.316694259643555, "global_step": 435724, "epoch": 5249} {"train_loss": -27.082050323486328, "global_step": 435725, "epoch": 5249} {"train_loss": -27.206195831298828, "global_step": 435726, "epoch": 5249} {"train_loss": -27.12603187561035, "global_step": 435727, "epoch": 5249} {"train_loss": -26.915735244750977, "global_step": 435728, "epoch": 5249} {"train_loss": -27.03211784362793, "global_step": 435729, "epoch": 5249} {"train_loss": -26.733266830444336, "global_step": 435730, "epoch": 5249} {"train_loss": -26.59088134765625, "global_step": 435731, "epoch": 5249} {"train_loss": -27.226978302001953, "global_step": 435732, "epoch": 5249} {"train_loss": -26.67400550842285, "global_step": 435733, "epoch": 5249} {"train_loss": -26.661710739135742, "global_step": 435734, "epoch": 5249} {"train_loss": -26.817001342773438, "global_step": 435735, "epoch": 5249} {"train_loss": -26.6124210357666, "global_step": 435736, "epoch": 5249} {"train_loss": -26.971969604492188, "global_step": 435737, "epoch": 5249} {"train_loss": -26.861501693725586, "global_step": 435738, "epoch": 5249} {"train_loss": -26.750106811523438, "global_step": 435739, "epoch": 5249} {"train_loss": -27.060321807861328, "global_step": 435740, "epoch": 5249} {"train_loss": -26.975910186767578, "global_step": 435741, "epoch": 5249} {"train_loss": -26.751728057861328, "global_step": 435742, "epoch": 5249} {"train_loss": -27.276105880737305, "global_step": 435743, "epoch": 5249} {"train_loss": -26.925785064697266, "global_step": 435744, "epoch": 5249} {"train_loss": -26.584745407104492, "global_step": 435745, "epoch": 5249} {"train_loss": -27.06043815612793, "global_step": 435746, "epoch": 5249} {"train_loss": -26.968984603881836, "global_step": 435747, "epoch": 5249} {"train_loss": -26.078393936157227, "global_step": 435748, "epoch": 5249} {"train_loss": -26.613397506346185, "global_step": 435749, "epoch": 5249, "val_loss": 6647285.0} {"train_loss": -25.97974967956543, "global_step": 435750, "epoch": 5250} {"train_loss": -26.57301139831543, "global_step": 435751, "epoch": 5250} {"train_loss": -25.405256271362305, "global_step": 435752, "epoch": 5250} {"train_loss": -26.22962760925293, "global_step": 435753, "epoch": 5250} {"train_loss": -25.8748722076416, "global_step": 435754, "epoch": 5250} {"train_loss": -25.575302124023438, "global_step": 435755, "epoch": 5250} {"train_loss": -26.109149932861328, "global_step": 435756, "epoch": 5250} {"train_loss": -26.35442543029785, "global_step": 435757, "epoch": 5250} {"train_loss": -25.67626953125, "global_step": 435758, "epoch": 5250} {"train_loss": -26.21487808227539, "global_step": 435759, "epoch": 5250} {"train_loss": -26.086347579956055, "global_step": 435760, "epoch": 5250} {"train_loss": -26.745014190673828, "global_step": 435761, "epoch": 5250} {"train_loss": -26.016271591186523, "global_step": 435762, "epoch": 5250} {"train_loss": -26.344823837280273, "global_step": 435763, "epoch": 5250} {"train_loss": -26.318073272705078, "global_step": 435764, "epoch": 5250} {"train_loss": -26.371442794799805, "global_step": 435765, "epoch": 5250} {"train_loss": -26.328474044799805, "global_step": 435766, "epoch": 5250} {"train_loss": -26.749774932861328, "global_step": 435767, "epoch": 5250} {"train_loss": -26.6070499420166, "global_step": 435768, "epoch": 5250} {"train_loss": -26.483484268188477, "global_step": 435769, "epoch": 5250} {"train_loss": -26.214704513549805, "global_step": 435770, "epoch": 5250} {"train_loss": -26.40472984313965, "global_step": 435771, "epoch": 5250} {"train_loss": -26.50836753845215, "global_step": 435772, "epoch": 5250} {"train_loss": -26.499164581298828, "global_step": 435773, "epoch": 5250} {"train_loss": -26.488773345947266, "global_step": 435774, "epoch": 5250} {"train_loss": -26.83420753479004, "global_step": 435775, "epoch": 5250} {"train_loss": -26.584964752197266, "global_step": 435776, "epoch": 5250} {"train_loss": -26.90089225769043, "global_step": 435777, "epoch": 5250} {"train_loss": -26.5096378326416, "global_step": 435778, "epoch": 5250} {"train_loss": -26.67937660217285, "global_step": 435779, "epoch": 5250} {"train_loss": -26.480762481689453, "global_step": 435780, "epoch": 5250} {"train_loss": -26.777923583984375, "global_step": 435781, "epoch": 5250} {"train_loss": -26.936847686767578, "global_step": 435782, "epoch": 5250} {"train_loss": -26.904447555541992, "global_step": 435783, "epoch": 5250} {"train_loss": -27.266971588134766, "global_step": 435784, "epoch": 5250} {"train_loss": -27.33990478515625, "global_step": 435785, "epoch": 5250} {"train_loss": -26.886188507080078, "global_step": 435786, "epoch": 5250} {"train_loss": -27.12204933166504, "global_step": 435787, "epoch": 5250} {"train_loss": -27.3232364654541, "global_step": 435788, "epoch": 5250} {"train_loss": -26.862686157226562, "global_step": 435789, "epoch": 5250} {"train_loss": -27.104084014892578, "global_step": 435790, "epoch": 5250} {"train_loss": -26.890766143798828, "global_step": 435791, "epoch": 5250} {"train_loss": -27.022628784179688, "global_step": 435792, "epoch": 5250} {"train_loss": -26.495162963867188, "global_step": 435793, "epoch": 5250} {"train_loss": -26.991485595703125, "global_step": 435794, "epoch": 5250} {"train_loss": -26.89405632019043, "global_step": 435795, "epoch": 5250} {"train_loss": -26.784626007080078, "global_step": 435796, "epoch": 5250} {"train_loss": -26.960739135742188, "global_step": 435797, "epoch": 5250} {"train_loss": -27.409353256225586, "global_step": 435798, "epoch": 5250} {"train_loss": -26.705493927001953, "global_step": 435799, "epoch": 5250} {"train_loss": -26.886184692382812, "global_step": 435800, "epoch": 5250} {"train_loss": -27.30440330505371, "global_step": 435801, "epoch": 5250} {"train_loss": -26.8880615234375, "global_step": 435802, "epoch": 5250} {"train_loss": -26.77724266052246, "global_step": 435803, "epoch": 5250} {"train_loss": -27.049829483032227, "global_step": 435804, "epoch": 5250} {"train_loss": -26.771360397338867, "global_step": 435805, "epoch": 5250} {"train_loss": -26.758981704711914, "global_step": 435806, "epoch": 5250} {"train_loss": -27.048513412475586, "global_step": 435807, "epoch": 5250} {"train_loss": -26.99237632751465, "global_step": 435808, "epoch": 5250} {"train_loss": -27.3792667388916, "global_step": 435809, "epoch": 5250} {"train_loss": -26.616857528686523, "global_step": 435810, "epoch": 5250} {"train_loss": -26.445178985595703, "global_step": 435811, "epoch": 5250} {"train_loss": -26.70342445373535, "global_step": 435812, "epoch": 5250} {"train_loss": -27.024763107299805, "global_step": 435813, "epoch": 5250} {"train_loss": -26.494680404663086, "global_step": 435814, "epoch": 5250} {"train_loss": -26.50702476501465, "global_step": 435815, "epoch": 5250} {"train_loss": -26.758630752563477, "global_step": 435816, "epoch": 5250} {"train_loss": -26.966047286987305, "global_step": 435817, "epoch": 5250} {"train_loss": -26.274267196655273, "global_step": 435818, "epoch": 5250} {"train_loss": -26.537824630737305, "global_step": 435819, "epoch": 5250} {"train_loss": -26.424091339111328, "global_step": 435820, "epoch": 5250} {"train_loss": -27.1960391998291, "global_step": 435821, "epoch": 5250} {"train_loss": -26.180395126342773, "global_step": 435822, "epoch": 5250} {"train_loss": -26.684680938720703, "global_step": 435823, "epoch": 5250} {"train_loss": -26.13134765625, "global_step": 435824, "epoch": 5250} {"train_loss": -26.589035034179688, "global_step": 435825, "epoch": 5250} {"train_loss": -26.056970596313477, "global_step": 435826, "epoch": 5250} {"train_loss": -26.81412124633789, "global_step": 435827, "epoch": 5250} {"train_loss": -26.30322265625, "global_step": 435828, "epoch": 5250} {"train_loss": -26.515668869018555, "global_step": 435829, "epoch": 5250} {"train_loss": -26.812103271484375, "global_step": 435830, "epoch": 5250} {"train_loss": -26.46719741821289, "global_step": 435831, "epoch": 5250} {"train_loss": -26.62185951600592, "global_step": 435832, "epoch": 5250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6676992.0} {"train_loss": -26.521331787109375, "global_step": 435833, "epoch": 5251} {"train_loss": -26.66269874572754, "global_step": 435834, "epoch": 5251} {"train_loss": -26.399988174438477, "global_step": 435835, "epoch": 5251} {"train_loss": -26.458234786987305, "global_step": 435836, "epoch": 5251} {"train_loss": -26.717884063720703, "global_step": 435837, "epoch": 5251} {"train_loss": -26.11395263671875, "global_step": 435838, "epoch": 5251} {"train_loss": -26.400964736938477, "global_step": 435839, "epoch": 5251} {"train_loss": -26.558734893798828, "global_step": 435840, "epoch": 5251} {"train_loss": -26.699399948120117, "global_step": 435841, "epoch": 5251} {"train_loss": -26.905004501342773, "global_step": 435842, "epoch": 5251} {"train_loss": -26.615671157836914, "global_step": 435843, "epoch": 5251} {"train_loss": -26.843469619750977, "global_step": 435844, "epoch": 5251} {"train_loss": -26.56838035583496, "global_step": 435845, "epoch": 5251} {"train_loss": -26.184911727905273, "global_step": 435846, "epoch": 5251} {"train_loss": -26.633975982666016, "global_step": 435847, "epoch": 5251} {"train_loss": -26.988296508789062, "global_step": 435848, "epoch": 5251} {"train_loss": -27.043542861938477, "global_step": 435849, "epoch": 5251} {"train_loss": -26.83684730529785, "global_step": 435850, "epoch": 5251} {"train_loss": -26.98636245727539, "global_step": 435851, "epoch": 5251} {"train_loss": -27.39682960510254, "global_step": 435852, "epoch": 5251} {"train_loss": -26.874027252197266, "global_step": 435853, "epoch": 5251} {"train_loss": -26.595849990844727, "global_step": 435854, "epoch": 5251} {"train_loss": -26.5550537109375, "global_step": 435855, "epoch": 5251} {"train_loss": -26.80414390563965, "global_step": 435856, "epoch": 5251} {"train_loss": -26.889001846313477, "global_step": 435857, "epoch": 5251} {"train_loss": -27.275598526000977, "global_step": 435858, "epoch": 5251} {"train_loss": -27.40106201171875, "global_step": 435859, "epoch": 5251} {"train_loss": -27.026708602905273, "global_step": 435860, "epoch": 5251} {"train_loss": -27.296411514282227, "global_step": 435861, "epoch": 5251} {"train_loss": -26.955097198486328, "global_step": 435862, "epoch": 5251} {"train_loss": -27.1147403717041, "global_step": 435863, "epoch": 5251} {"train_loss": -27.218252182006836, "global_step": 435864, "epoch": 5251} {"train_loss": -27.153717041015625, "global_step": 435865, "epoch": 5251} {"train_loss": -27.279977798461914, "global_step": 435866, "epoch": 5251} {"train_loss": -27.35226821899414, "global_step": 435867, "epoch": 5251} {"train_loss": -26.972400665283203, "global_step": 435868, "epoch": 5251} {"train_loss": -26.90638542175293, "global_step": 435869, "epoch": 5251} {"train_loss": -27.260120391845703, "global_step": 435870, "epoch": 5251} {"train_loss": -26.941547393798828, "global_step": 435871, "epoch": 5251} {"train_loss": -26.893192291259766, "global_step": 435872, "epoch": 5251} {"train_loss": -26.5031795501709, "global_step": 435873, "epoch": 5251} {"train_loss": -26.418176651000977, "global_step": 435874, "epoch": 5251} {"train_loss": -27.05413818359375, "global_step": 435875, "epoch": 5251} {"train_loss": -26.637603759765625, "global_step": 435876, "epoch": 5251} {"train_loss": -26.980117797851562, "global_step": 435877, "epoch": 5251} {"train_loss": -27.312063217163086, "global_step": 435878, "epoch": 5251} {"train_loss": -27.00831413269043, "global_step": 435879, "epoch": 5251} {"train_loss": -27.244964599609375, "global_step": 435880, "epoch": 5251} {"train_loss": -27.136838912963867, "global_step": 435881, "epoch": 5251} {"train_loss": -27.117950439453125, "global_step": 435882, "epoch": 5251} {"train_loss": -27.109670639038086, "global_step": 435883, "epoch": 5251} {"train_loss": -26.981658935546875, "global_step": 435884, "epoch": 5251} {"train_loss": -27.053531646728516, "global_step": 435885, "epoch": 5251} {"train_loss": -27.12860679626465, "global_step": 435886, "epoch": 5251} {"train_loss": -27.05934715270996, "global_step": 435887, "epoch": 5251} {"train_loss": -26.952207565307617, "global_step": 435888, "epoch": 5251} {"train_loss": -27.071441650390625, "global_step": 435889, "epoch": 5251} {"train_loss": -27.05828857421875, "global_step": 435890, "epoch": 5251} {"train_loss": -27.03951072692871, "global_step": 435891, "epoch": 5251} {"train_loss": -26.98383903503418, "global_step": 435892, "epoch": 5251} {"train_loss": -26.88325309753418, "global_step": 435893, "epoch": 5251} {"train_loss": -27.16473388671875, "global_step": 435894, "epoch": 5251} {"train_loss": -27.138565063476562, "global_step": 435895, "epoch": 5251} {"train_loss": -26.508569717407227, "global_step": 435896, "epoch": 5251} {"train_loss": -25.734329223632812, "global_step": 435897, "epoch": 5251} {"train_loss": -25.948089599609375, "global_step": 435898, "epoch": 5251} {"train_loss": -26.77848243713379, "global_step": 435899, "epoch": 5251} {"train_loss": -26.78952407836914, "global_step": 435900, "epoch": 5251} {"train_loss": -26.63656997680664, "global_step": 435901, "epoch": 5251} {"train_loss": -26.442550659179688, "global_step": 435902, "epoch": 5251} {"train_loss": -27.03407096862793, "global_step": 435903, "epoch": 5251} {"train_loss": -26.386905670166016, "global_step": 435904, "epoch": 5251} {"train_loss": -26.620962142944336, "global_step": 435905, "epoch": 5251} {"train_loss": -26.729476928710938, "global_step": 435906, "epoch": 5251} {"train_loss": -26.494028091430664, "global_step": 435907, "epoch": 5251} {"train_loss": -26.778045654296875, "global_step": 435908, "epoch": 5251} {"train_loss": -26.5837345123291, "global_step": 435909, "epoch": 5251} {"train_loss": -26.462934494018555, "global_step": 435910, "epoch": 5251} {"train_loss": -26.8497257232666, "global_step": 435911, "epoch": 5251} {"train_loss": -26.245624542236328, "global_step": 435912, "epoch": 5251} {"train_loss": -26.862558364868164, "global_step": 435913, "epoch": 5251} {"train_loss": -26.71284294128418, "global_step": 435914, "epoch": 5251} {"train_loss": -26.820273272962456, "global_step": 435915, "epoch": 5251, "val_loss": 6689189.5} {"train_loss": -26.135986328125, "global_step": 435916, "epoch": 5252} {"train_loss": -26.07037353515625, "global_step": 435917, "epoch": 5252} {"train_loss": -26.20887565612793, "global_step": 435918, "epoch": 5252} {"train_loss": -26.274694442749023, "global_step": 435919, "epoch": 5252} {"train_loss": -26.68202781677246, "global_step": 435920, "epoch": 5252} {"train_loss": -26.6140079498291, "global_step": 435921, "epoch": 5252} {"train_loss": -26.8514461517334, "global_step": 435922, "epoch": 5252} {"train_loss": -26.127567291259766, "global_step": 435923, "epoch": 5252} {"train_loss": -26.5497989654541, "global_step": 435924, "epoch": 5252} {"train_loss": -26.807565689086914, "global_step": 435925, "epoch": 5252} {"train_loss": -26.56846046447754, "global_step": 435926, "epoch": 5252} {"train_loss": -26.360315322875977, "global_step": 435927, "epoch": 5252} {"train_loss": -26.501129150390625, "global_step": 435928, "epoch": 5252} {"train_loss": -26.703296661376953, "global_step": 435929, "epoch": 5252} {"train_loss": -26.716232299804688, "global_step": 435930, "epoch": 5252} {"train_loss": -26.5388126373291, "global_step": 435931, "epoch": 5252} {"train_loss": -26.6124267578125, "global_step": 435932, "epoch": 5252} {"train_loss": -26.654836654663086, "global_step": 435933, "epoch": 5252} {"train_loss": -26.64922523498535, "global_step": 435934, "epoch": 5252} {"train_loss": -27.1618595123291, "global_step": 435935, "epoch": 5252} {"train_loss": -26.653162002563477, "global_step": 435936, "epoch": 5252} {"train_loss": -26.728864669799805, "global_step": 435937, "epoch": 5252} {"train_loss": -26.63604736328125, "global_step": 435938, "epoch": 5252} {"train_loss": -26.745731353759766, "global_step": 435939, "epoch": 5252} {"train_loss": -26.59952163696289, "global_step": 435940, "epoch": 5252} {"train_loss": -26.757272720336914, "global_step": 435941, "epoch": 5252} {"train_loss": -26.982580184936523, "global_step": 435942, "epoch": 5252} {"train_loss": -27.086868286132812, "global_step": 435943, "epoch": 5252} {"train_loss": -26.907974243164062, "global_step": 435944, "epoch": 5252} {"train_loss": -27.0944766998291, "global_step": 435945, "epoch": 5252} {"train_loss": -27.19984245300293, "global_step": 435946, "epoch": 5252} {"train_loss": -26.9110164642334, "global_step": 435947, "epoch": 5252} {"train_loss": -27.128406524658203, "global_step": 435948, "epoch": 5252} {"train_loss": -27.136884689331055, "global_step": 435949, "epoch": 5252} {"train_loss": -27.236230850219727, "global_step": 435950, "epoch": 5252} {"train_loss": -27.156295776367188, "global_step": 435951, "epoch": 5252} {"train_loss": -27.29764175415039, "global_step": 435952, "epoch": 5252} {"train_loss": -27.227869033813477, "global_step": 435953, "epoch": 5252} {"train_loss": -26.685590744018555, "global_step": 435954, "epoch": 5252} {"train_loss": -27.1042423248291, "global_step": 435955, "epoch": 5252} {"train_loss": -27.2408390045166, "global_step": 435956, "epoch": 5252} {"train_loss": -27.072839736938477, "global_step": 435957, "epoch": 5252} {"train_loss": -27.0685977935791, "global_step": 435958, "epoch": 5252} {"train_loss": -26.917572021484375, "global_step": 435959, "epoch": 5252} {"train_loss": -26.57735252380371, "global_step": 435960, "epoch": 5252} {"train_loss": -27.24818992614746, "global_step": 435961, "epoch": 5252} {"train_loss": -26.85861587524414, "global_step": 435962, "epoch": 5252} {"train_loss": -26.492650985717773, "global_step": 435963, "epoch": 5252} {"train_loss": -25.4837589263916, "global_step": 435964, "epoch": 5252} {"train_loss": -25.149002075195312, "global_step": 435965, "epoch": 5252} {"train_loss": -25.468278884887695, "global_step": 435966, "epoch": 5252} {"train_loss": -26.60125732421875, "global_step": 435967, "epoch": 5252} {"train_loss": -27.213537216186523, "global_step": 435968, "epoch": 5252} {"train_loss": -26.143728256225586, "global_step": 435969, "epoch": 5252} {"train_loss": -26.694843292236328, "global_step": 435970, "epoch": 5252} {"train_loss": -27.036117553710938, "global_step": 435971, "epoch": 5252} {"train_loss": -26.682477951049805, "global_step": 435972, "epoch": 5252} {"train_loss": -26.497812271118164, "global_step": 435973, "epoch": 5252} {"train_loss": -26.69536781311035, "global_step": 435974, "epoch": 5252} {"train_loss": -26.80780029296875, "global_step": 435975, "epoch": 5252} {"train_loss": -26.59405517578125, "global_step": 435976, "epoch": 5252} {"train_loss": -26.686126708984375, "global_step": 435977, "epoch": 5252} {"train_loss": -26.644001007080078, "global_step": 435978, "epoch": 5252} {"train_loss": -26.720417022705078, "global_step": 435979, "epoch": 5252} {"train_loss": -26.4852294921875, "global_step": 435980, "epoch": 5252} {"train_loss": -26.388916015625, "global_step": 435981, "epoch": 5252} {"train_loss": -26.73825454711914, "global_step": 435982, "epoch": 5252} {"train_loss": -26.77591323852539, "global_step": 435983, "epoch": 5252} {"train_loss": -26.90167808532715, "global_step": 435984, "epoch": 5252} {"train_loss": -26.77632713317871, "global_step": 435985, "epoch": 5252} {"train_loss": -26.513818740844727, "global_step": 435986, "epoch": 5252} {"train_loss": -26.644174575805664, "global_step": 435987, "epoch": 5252} {"train_loss": -26.7707576751709, "global_step": 435988, "epoch": 5252} {"train_loss": -26.913272857666016, "global_step": 435989, "epoch": 5252} {"train_loss": -26.58582878112793, "global_step": 435990, "epoch": 5252} {"train_loss": -26.819311141967773, "global_step": 435991, "epoch": 5252} {"train_loss": -26.6938419342041, "global_step": 435992, "epoch": 5252} {"train_loss": -27.247623443603516, "global_step": 435993, "epoch": 5252} {"train_loss": -26.695234298706055, "global_step": 435994, "epoch": 5252} {"train_loss": -26.45926856994629, "global_step": 435995, "epoch": 5252} {"train_loss": -26.654523849487305, "global_step": 435996, "epoch": 5252} {"train_loss": -27.08417320251465, "global_step": 435997, "epoch": 5252} {"train_loss": -26.712290775345032, "global_step": 435998, "epoch": 5252, "val_loss": 6684398.0} {"train_loss": -26.20526695251465, "global_step": 435999, "epoch": 5253} {"train_loss": -26.248489379882812, "global_step": 436000, "epoch": 5253} {"train_loss": -26.75848388671875, "global_step": 436001, "epoch": 5253} {"train_loss": -26.319128036499023, "global_step": 436002, "epoch": 5253} {"train_loss": -26.4018611907959, "global_step": 436003, "epoch": 5253} {"train_loss": -26.63190269470215, "global_step": 436004, "epoch": 5253} {"train_loss": -26.866769790649414, "global_step": 436005, "epoch": 5253} {"train_loss": -26.45643424987793, "global_step": 436006, "epoch": 5253} {"train_loss": -26.829498291015625, "global_step": 436007, "epoch": 5253} {"train_loss": -26.645343780517578, "global_step": 436008, "epoch": 5253} {"train_loss": -26.530872344970703, "global_step": 436009, "epoch": 5253} {"train_loss": -26.532392501831055, "global_step": 436010, "epoch": 5253} {"train_loss": -26.883771896362305, "global_step": 436011, "epoch": 5253} {"train_loss": -27.179367065429688, "global_step": 436012, "epoch": 5253} {"train_loss": -26.71346092224121, "global_step": 436013, "epoch": 5253} {"train_loss": -26.342931747436523, "global_step": 436014, "epoch": 5253} {"train_loss": -26.76145362854004, "global_step": 436015, "epoch": 5253} {"train_loss": -27.199872970581055, "global_step": 436016, "epoch": 5253} {"train_loss": -26.994827270507812, "global_step": 436017, "epoch": 5253} {"train_loss": -27.053003311157227, "global_step": 436018, "epoch": 5253} {"train_loss": -26.544025421142578, "global_step": 436019, "epoch": 5253} {"train_loss": -27.182392120361328, "global_step": 436020, "epoch": 5253} {"train_loss": -26.875690460205078, "global_step": 436021, "epoch": 5253} {"train_loss": -26.854169845581055, "global_step": 436022, "epoch": 5253} {"train_loss": -26.707733154296875, "global_step": 436023, "epoch": 5253} {"train_loss": -26.798322677612305, "global_step": 436024, "epoch": 5253} {"train_loss": -26.18848991394043, "global_step": 436025, "epoch": 5253} {"train_loss": -26.90478515625, "global_step": 436026, "epoch": 5253} {"train_loss": -27.082691192626953, "global_step": 436027, "epoch": 5253} {"train_loss": -26.782245635986328, "global_step": 436028, "epoch": 5253} {"train_loss": -26.762876510620117, "global_step": 436029, "epoch": 5253} {"train_loss": -27.171552658081055, "global_step": 436030, "epoch": 5253} {"train_loss": -26.91452407836914, "global_step": 436031, "epoch": 5253} {"train_loss": -26.781726837158203, "global_step": 436032, "epoch": 5253} {"train_loss": -26.34186363220215, "global_step": 436033, "epoch": 5253} {"train_loss": -26.24771499633789, "global_step": 436034, "epoch": 5253} {"train_loss": -26.722700119018555, "global_step": 436035, "epoch": 5253} {"train_loss": -26.858911514282227, "global_step": 436036, "epoch": 5253} {"train_loss": -27.027027130126953, "global_step": 436037, "epoch": 5253} {"train_loss": -26.65997886657715, "global_step": 436038, "epoch": 5253} {"train_loss": -26.76460075378418, "global_step": 436039, "epoch": 5253} {"train_loss": -27.293684005737305, "global_step": 436040, "epoch": 5253} {"train_loss": -26.69580078125, "global_step": 436041, "epoch": 5253} {"train_loss": -27.1030216217041, "global_step": 436042, "epoch": 5253} {"train_loss": -27.124372482299805, "global_step": 436043, "epoch": 5253} {"train_loss": -26.897785186767578, "global_step": 436044, "epoch": 5253} {"train_loss": -26.66178321838379, "global_step": 436045, "epoch": 5253} {"train_loss": -26.999425888061523, "global_step": 436046, "epoch": 5253} {"train_loss": -26.930246353149414, "global_step": 436047, "epoch": 5253} {"train_loss": -27.040250778198242, "global_step": 436048, "epoch": 5253} {"train_loss": -27.112934112548828, "global_step": 436049, "epoch": 5253} {"train_loss": -26.913028717041016, "global_step": 436050, "epoch": 5253} {"train_loss": -27.383258819580078, "global_step": 436051, "epoch": 5253} {"train_loss": -27.100820541381836, "global_step": 436052, "epoch": 5253} {"train_loss": -27.183109283447266, "global_step": 436053, "epoch": 5253} {"train_loss": -26.571386337280273, "global_step": 436054, "epoch": 5253} {"train_loss": -27.262937545776367, "global_step": 436055, "epoch": 5253} {"train_loss": -26.7014102935791, "global_step": 436056, "epoch": 5253} {"train_loss": -26.762659072875977, "global_step": 436057, "epoch": 5253} {"train_loss": -26.62766456604004, "global_step": 436058, "epoch": 5253} {"train_loss": -26.860675811767578, "global_step": 436059, "epoch": 5253} {"train_loss": -27.043771743774414, "global_step": 436060, "epoch": 5253} {"train_loss": -26.7665958404541, "global_step": 436061, "epoch": 5253} {"train_loss": -26.650922775268555, "global_step": 436062, "epoch": 5253} {"train_loss": -26.865869522094727, "global_step": 436063, "epoch": 5253} {"train_loss": -26.587543487548828, "global_step": 436064, "epoch": 5253} {"train_loss": -26.748991012573242, "global_step": 436065, "epoch": 5253} {"train_loss": -27.04010581970215, "global_step": 436066, "epoch": 5253} {"train_loss": -26.910205841064453, "global_step": 436067, "epoch": 5253} {"train_loss": -27.351165771484375, "global_step": 436068, "epoch": 5253} {"train_loss": -26.378250122070312, "global_step": 436069, "epoch": 5253} {"train_loss": -27.208770751953125, "global_step": 436070, "epoch": 5253} {"train_loss": -26.6299991607666, "global_step": 436071, "epoch": 5253} {"train_loss": -26.83253288269043, "global_step": 436072, "epoch": 5253} {"train_loss": -26.841083526611328, "global_step": 436073, "epoch": 5253} {"train_loss": -26.374698638916016, "global_step": 436074, "epoch": 5253} {"train_loss": -27.023401260375977, "global_step": 436075, "epoch": 5253} {"train_loss": -26.633691787719727, "global_step": 436076, "epoch": 5253} {"train_loss": -26.64499282836914, "global_step": 436077, "epoch": 5253} {"train_loss": -27.06900978088379, "global_step": 436078, "epoch": 5253} {"train_loss": -27.075098037719727, "global_step": 436079, "epoch": 5253} {"train_loss": -26.952192306518555, "global_step": 436080, "epoch": 5253} {"train_loss": -26.836265334163805, "global_step": 436081, "epoch": 5253, "val_loss": 6736678.5} {"train_loss": -26.040618896484375, "global_step": 436082, "epoch": 5254} {"train_loss": -26.43665885925293, "global_step": 436083, "epoch": 5254} {"train_loss": -26.13408851623535, "global_step": 436084, "epoch": 5254} {"train_loss": -26.4842472076416, "global_step": 436085, "epoch": 5254} {"train_loss": -26.4996280670166, "global_step": 436086, "epoch": 5254} {"train_loss": -26.307233810424805, "global_step": 436087, "epoch": 5254} {"train_loss": -26.758197784423828, "global_step": 436088, "epoch": 5254} {"train_loss": -26.146894454956055, "global_step": 436089, "epoch": 5254} {"train_loss": -26.75030517578125, "global_step": 436090, "epoch": 5254} {"train_loss": -26.330615997314453, "global_step": 436091, "epoch": 5254} {"train_loss": -26.3968448638916, "global_step": 436092, "epoch": 5254} {"train_loss": -26.544971466064453, "global_step": 436093, "epoch": 5254} {"train_loss": -26.629968643188477, "global_step": 436094, "epoch": 5254} {"train_loss": -26.5883731842041, "global_step": 436095, "epoch": 5254} {"train_loss": -26.63138771057129, "global_step": 436096, "epoch": 5254} {"train_loss": -26.49763298034668, "global_step": 436097, "epoch": 5254} {"train_loss": -26.20977783203125, "global_step": 436098, "epoch": 5254} {"train_loss": -26.71150016784668, "global_step": 436099, "epoch": 5254} {"train_loss": -26.546300888061523, "global_step": 436100, "epoch": 5254} {"train_loss": -26.767454147338867, "global_step": 436101, "epoch": 5254} {"train_loss": -27.06251335144043, "global_step": 436102, "epoch": 5254} {"train_loss": -26.921125411987305, "global_step": 436103, "epoch": 5254} {"train_loss": -26.929113388061523, "global_step": 436104, "epoch": 5254} {"train_loss": -27.268280029296875, "global_step": 436105, "epoch": 5254} {"train_loss": -27.110742568969727, "global_step": 436106, "epoch": 5254} {"train_loss": -26.78828239440918, "global_step": 436107, "epoch": 5254} {"train_loss": -26.901044845581055, "global_step": 436108, "epoch": 5254} {"train_loss": -27.380695343017578, "global_step": 436109, "epoch": 5254} {"train_loss": -26.99532127380371, "global_step": 436110, "epoch": 5254} {"train_loss": -27.20077896118164, "global_step": 436111, "epoch": 5254} {"train_loss": -27.218103408813477, "global_step": 436112, "epoch": 5254} {"train_loss": -26.87263298034668, "global_step": 436113, "epoch": 5254} {"train_loss": -26.896595001220703, "global_step": 436114, "epoch": 5254} {"train_loss": -26.80517578125, "global_step": 436115, "epoch": 5254} {"train_loss": -26.333402633666992, "global_step": 436116, "epoch": 5254} {"train_loss": -26.537561416625977, "global_step": 436117, "epoch": 5254} {"train_loss": -26.5428409576416, "global_step": 436118, "epoch": 5254} {"train_loss": -27.060504913330078, "global_step": 436119, "epoch": 5254} {"train_loss": -26.963117599487305, "global_step": 436120, "epoch": 5254} {"train_loss": -26.79981803894043, "global_step": 436121, "epoch": 5254} {"train_loss": -26.8828067779541, "global_step": 436122, "epoch": 5254} {"train_loss": -27.195758819580078, "global_step": 436123, "epoch": 5254} {"train_loss": -27.01362419128418, "global_step": 436124, "epoch": 5254} {"train_loss": -26.843374252319336, "global_step": 436125, "epoch": 5254} {"train_loss": -26.835296630859375, "global_step": 436126, "epoch": 5254} {"train_loss": -26.833271026611328, "global_step": 436127, "epoch": 5254} {"train_loss": -26.46901512145996, "global_step": 436128, "epoch": 5254} {"train_loss": -26.798608779907227, "global_step": 436129, "epoch": 5254} {"train_loss": -26.703414916992188, "global_step": 436130, "epoch": 5254} {"train_loss": -26.243118286132812, "global_step": 436131, "epoch": 5254} {"train_loss": -26.703882217407227, "global_step": 436132, "epoch": 5254} {"train_loss": -27.273645401000977, "global_step": 436133, "epoch": 5254} {"train_loss": -26.55356788635254, "global_step": 436134, "epoch": 5254} {"train_loss": -27.06104850769043, "global_step": 436135, "epoch": 5254} {"train_loss": -26.74924087524414, "global_step": 436136, "epoch": 5254} {"train_loss": -27.41120719909668, "global_step": 436137, "epoch": 5254} {"train_loss": -26.941762924194336, "global_step": 436138, "epoch": 5254} {"train_loss": -26.555973052978516, "global_step": 436139, "epoch": 5254} {"train_loss": -26.749181747436523, "global_step": 436140, "epoch": 5254} {"train_loss": -27.03236198425293, "global_step": 436141, "epoch": 5254} {"train_loss": -27.00214195251465, "global_step": 436142, "epoch": 5254} {"train_loss": -26.88039207458496, "global_step": 436143, "epoch": 5254} {"train_loss": -27.145246505737305, "global_step": 436144, "epoch": 5254} {"train_loss": -26.755725860595703, "global_step": 436145, "epoch": 5254} {"train_loss": -26.94087791442871, "global_step": 436146, "epoch": 5254} {"train_loss": -26.5635986328125, "global_step": 436147, "epoch": 5254} {"train_loss": -26.8704776763916, "global_step": 436148, "epoch": 5254} {"train_loss": -27.07281494140625, "global_step": 436149, "epoch": 5254} {"train_loss": -27.164976119995117, "global_step": 436150, "epoch": 5254} {"train_loss": -26.740081787109375, "global_step": 436151, "epoch": 5254} {"train_loss": -26.892621994018555, "global_step": 436152, "epoch": 5254} {"train_loss": -26.776763916015625, "global_step": 436153, "epoch": 5254} {"train_loss": -27.05392837524414, "global_step": 436154, "epoch": 5254} {"train_loss": -26.899606704711914, "global_step": 436155, "epoch": 5254} {"train_loss": -26.65241813659668, "global_step": 436156, "epoch": 5254} {"train_loss": -27.164447784423828, "global_step": 436157, "epoch": 5254} {"train_loss": -27.09870719909668, "global_step": 436158, "epoch": 5254} {"train_loss": -27.012563705444336, "global_step": 436159, "epoch": 5254} {"train_loss": -26.91303825378418, "global_step": 436160, "epoch": 5254} {"train_loss": -26.997961044311523, "global_step": 436161, "epoch": 5254} {"train_loss": -27.110549926757812, "global_step": 436162, "epoch": 5254} {"train_loss": -26.935022354125977, "global_step": 436163, "epoch": 5254} {"train_loss": -26.795790890613233, "global_step": 436164, "epoch": 5254, "val_loss": 6611796.0} {"train_loss": -26.385244369506836, "global_step": 436165, "epoch": 5255} {"train_loss": -26.550174713134766, "global_step": 436166, "epoch": 5255} {"train_loss": -26.764089584350586, "global_step": 436167, "epoch": 5255} {"train_loss": -26.580188751220703, "global_step": 436168, "epoch": 5255} {"train_loss": -26.808338165283203, "global_step": 436169, "epoch": 5255} {"train_loss": -26.560443878173828, "global_step": 436170, "epoch": 5255} {"train_loss": -26.72308349609375, "global_step": 436171, "epoch": 5255} {"train_loss": -26.86832618713379, "global_step": 436172, "epoch": 5255} {"train_loss": -26.626178741455078, "global_step": 436173, "epoch": 5255} {"train_loss": -26.818227767944336, "global_step": 436174, "epoch": 5255} {"train_loss": -26.97054100036621, "global_step": 436175, "epoch": 5255} {"train_loss": -26.50599479675293, "global_step": 436176, "epoch": 5255} {"train_loss": -26.516681671142578, "global_step": 436177, "epoch": 5255} {"train_loss": -26.710554122924805, "global_step": 436178, "epoch": 5255} {"train_loss": -27.115036010742188, "global_step": 436179, "epoch": 5255} {"train_loss": -26.755538940429688, "global_step": 436180, "epoch": 5255} {"train_loss": -26.940826416015625, "global_step": 436181, "epoch": 5255} {"train_loss": -26.85284423828125, "global_step": 436182, "epoch": 5255} {"train_loss": -26.635644912719727, "global_step": 436183, "epoch": 5255} {"train_loss": -27.232702255249023, "global_step": 436184, "epoch": 5255} {"train_loss": -26.700927734375, "global_step": 436185, "epoch": 5255} {"train_loss": -27.227893829345703, "global_step": 436186, "epoch": 5255} {"train_loss": -27.117589950561523, "global_step": 436187, "epoch": 5255} {"train_loss": -27.131305694580078, "global_step": 436188, "epoch": 5255} {"train_loss": -26.70466423034668, "global_step": 436189, "epoch": 5255} {"train_loss": -27.0455379486084, "global_step": 436190, "epoch": 5255} {"train_loss": -26.621906280517578, "global_step": 436191, "epoch": 5255} {"train_loss": -26.802682876586914, "global_step": 436192, "epoch": 5255} {"train_loss": -26.99639320373535, "global_step": 436193, "epoch": 5255} {"train_loss": -27.136892318725586, "global_step": 436194, "epoch": 5255} {"train_loss": -26.91670036315918, "global_step": 436195, "epoch": 5255} {"train_loss": -26.209949493408203, "global_step": 436196, "epoch": 5255} {"train_loss": -26.956933975219727, "global_step": 436197, "epoch": 5255} {"train_loss": -27.00813102722168, "global_step": 436198, "epoch": 5255} {"train_loss": -26.17091178894043, "global_step": 436199, "epoch": 5255} {"train_loss": -26.534696578979492, "global_step": 436200, "epoch": 5255} {"train_loss": -26.459341049194336, "global_step": 436201, "epoch": 5255} {"train_loss": -26.507160186767578, "global_step": 436202, "epoch": 5255} {"train_loss": -26.59522819519043, "global_step": 436203, "epoch": 5255} {"train_loss": -26.9052791595459, "global_step": 436204, "epoch": 5255} {"train_loss": -26.889984130859375, "global_step": 436205, "epoch": 5255} {"train_loss": -26.570947647094727, "global_step": 436206, "epoch": 5255} {"train_loss": -26.401111602783203, "global_step": 436207, "epoch": 5255} {"train_loss": -26.7439022064209, "global_step": 436208, "epoch": 5255} {"train_loss": -26.963647842407227, "global_step": 436209, "epoch": 5255} {"train_loss": -26.930749893188477, "global_step": 436210, "epoch": 5255} {"train_loss": -27.018491744995117, "global_step": 436211, "epoch": 5255} {"train_loss": -26.79864501953125, "global_step": 436212, "epoch": 5255} {"train_loss": -26.77435302734375, "global_step": 436213, "epoch": 5255} {"train_loss": -27.280990600585938, "global_step": 436214, "epoch": 5255} {"train_loss": -26.90138053894043, "global_step": 436215, "epoch": 5255} {"train_loss": -26.942279815673828, "global_step": 436216, "epoch": 5255} {"train_loss": -27.0137996673584, "global_step": 436217, "epoch": 5255} {"train_loss": -26.778867721557617, "global_step": 436218, "epoch": 5255} {"train_loss": -26.858076095581055, "global_step": 436219, "epoch": 5255} {"train_loss": -26.805761337280273, "global_step": 436220, "epoch": 5255} {"train_loss": -26.528186798095703, "global_step": 436221, "epoch": 5255} {"train_loss": -26.65549659729004, "global_step": 436222, "epoch": 5255} {"train_loss": -27.1475887298584, "global_step": 436223, "epoch": 5255} {"train_loss": -27.088891983032227, "global_step": 436224, "epoch": 5255} {"train_loss": -26.877729415893555, "global_step": 436225, "epoch": 5255} {"train_loss": -26.96702003479004, "global_step": 436226, "epoch": 5255} {"train_loss": -26.832019805908203, "global_step": 436227, "epoch": 5255} {"train_loss": -26.983243942260742, "global_step": 436228, "epoch": 5255} {"train_loss": -27.26629066467285, "global_step": 436229, "epoch": 5255} {"train_loss": -26.998733520507812, "global_step": 436230, "epoch": 5255} {"train_loss": -27.027725219726562, "global_step": 436231, "epoch": 5255} {"train_loss": -26.936542510986328, "global_step": 436232, "epoch": 5255} {"train_loss": -26.770843505859375, "global_step": 436233, "epoch": 5255} {"train_loss": -26.798303604125977, "global_step": 436234, "epoch": 5255} {"train_loss": -27.17228126525879, "global_step": 436235, "epoch": 5255} {"train_loss": -27.174856185913086, "global_step": 436236, "epoch": 5255} {"train_loss": -26.856298446655273, "global_step": 436237, "epoch": 5255} {"train_loss": -27.076736450195312, "global_step": 436238, "epoch": 5255} {"train_loss": -27.13699722290039, "global_step": 436239, "epoch": 5255} {"train_loss": -27.297840118408203, "global_step": 436240, "epoch": 5255} {"train_loss": -27.0567626953125, "global_step": 436241, "epoch": 5255} {"train_loss": -26.830310821533203, "global_step": 436242, "epoch": 5255} {"train_loss": -27.28657341003418, "global_step": 436243, "epoch": 5255} {"train_loss": -27.013757705688477, "global_step": 436244, "epoch": 5255} {"train_loss": -27.30466079711914, "global_step": 436245, "epoch": 5255} {"train_loss": -27.334430694580078, "global_step": 436246, "epoch": 5255} {"train_loss": -26.86420525700213, "global_step": 436247, "epoch": 5255, "val_loss": 6566878.0} {"train_loss": -26.50616455078125, "global_step": 436248, "epoch": 5256} {"train_loss": -26.443958282470703, "global_step": 436249, "epoch": 5256} {"train_loss": -26.007343292236328, "global_step": 436250, "epoch": 5256} {"train_loss": -26.183826446533203, "global_step": 436251, "epoch": 5256} {"train_loss": -26.62025260925293, "global_step": 436252, "epoch": 5256} {"train_loss": -26.073272705078125, "global_step": 436253, "epoch": 5256} {"train_loss": -25.519954681396484, "global_step": 436254, "epoch": 5256} {"train_loss": -25.59891128540039, "global_step": 436255, "epoch": 5256} {"train_loss": -26.35231590270996, "global_step": 436256, "epoch": 5256} {"train_loss": -25.755939483642578, "global_step": 436257, "epoch": 5256} {"train_loss": -26.44000816345215, "global_step": 436258, "epoch": 5256} {"train_loss": -26.23713493347168, "global_step": 436259, "epoch": 5256} {"train_loss": -26.57330894470215, "global_step": 436260, "epoch": 5256} {"train_loss": -26.15030288696289, "global_step": 436261, "epoch": 5256} {"train_loss": -26.661773681640625, "global_step": 436262, "epoch": 5256} {"train_loss": -26.214651107788086, "global_step": 436263, "epoch": 5256} {"train_loss": -26.626056671142578, "global_step": 436264, "epoch": 5256} {"train_loss": -26.901926040649414, "global_step": 436265, "epoch": 5256} {"train_loss": -26.46356773376465, "global_step": 436266, "epoch": 5256} {"train_loss": -26.465808868408203, "global_step": 436267, "epoch": 5256} {"train_loss": -26.953231811523438, "global_step": 436268, "epoch": 5256} {"train_loss": -26.770313262939453, "global_step": 436269, "epoch": 5256} {"train_loss": -26.779407501220703, "global_step": 436270, "epoch": 5256} {"train_loss": -26.50068473815918, "global_step": 436271, "epoch": 5256} {"train_loss": -26.796039581298828, "global_step": 436272, "epoch": 5256} {"train_loss": -26.759092330932617, "global_step": 436273, "epoch": 5256} {"train_loss": -26.6721248626709, "global_step": 436274, "epoch": 5256} {"train_loss": -26.51957130432129, "global_step": 436275, "epoch": 5256} {"train_loss": -26.85296630859375, "global_step": 436276, "epoch": 5256} {"train_loss": -27.137527465820312, "global_step": 436277, "epoch": 5256} {"train_loss": -27.0067195892334, "global_step": 436278, "epoch": 5256} {"train_loss": -26.919782638549805, "global_step": 436279, "epoch": 5256} {"train_loss": -26.70879554748535, "global_step": 436280, "epoch": 5256} {"train_loss": -26.95098304748535, "global_step": 436281, "epoch": 5256} {"train_loss": -26.901123046875, "global_step": 436282, "epoch": 5256} {"train_loss": -26.981616973876953, "global_step": 436283, "epoch": 5256} {"train_loss": -26.84088706970215, "global_step": 436284, "epoch": 5256} {"train_loss": -26.78973960876465, "global_step": 436285, "epoch": 5256} {"train_loss": -26.993911743164062, "global_step": 436286, "epoch": 5256} {"train_loss": -26.8962345123291, "global_step": 436287, "epoch": 5256} {"train_loss": -27.124784469604492, "global_step": 436288, "epoch": 5256} {"train_loss": -27.033660888671875, "global_step": 436289, "epoch": 5256} {"train_loss": -27.253753662109375, "global_step": 436290, "epoch": 5256} {"train_loss": -27.004196166992188, "global_step": 436291, "epoch": 5256} {"train_loss": -27.42286491394043, "global_step": 436292, "epoch": 5256} {"train_loss": -26.87628173828125, "global_step": 436293, "epoch": 5256} {"train_loss": -27.253326416015625, "global_step": 436294, "epoch": 5256} {"train_loss": -26.9835147857666, "global_step": 436295, "epoch": 5256} {"train_loss": -26.798566818237305, "global_step": 436296, "epoch": 5256} {"train_loss": -26.88625144958496, "global_step": 436297, "epoch": 5256} {"train_loss": -26.8782901763916, "global_step": 436298, "epoch": 5256} {"train_loss": -27.18812370300293, "global_step": 436299, "epoch": 5256} {"train_loss": -27.523767471313477, "global_step": 436300, "epoch": 5256} {"train_loss": -27.289295196533203, "global_step": 436301, "epoch": 5256} {"train_loss": -27.104034423828125, "global_step": 436302, "epoch": 5256} {"train_loss": -27.202804565429688, "global_step": 436303, "epoch": 5256} {"train_loss": -27.262174606323242, "global_step": 436304, "epoch": 5256} {"train_loss": -26.92494773864746, "global_step": 436305, "epoch": 5256} {"train_loss": -26.86474609375, "global_step": 436306, "epoch": 5256} {"train_loss": -27.391681671142578, "global_step": 436307, "epoch": 5256} {"train_loss": -27.44666862487793, "global_step": 436308, "epoch": 5256} {"train_loss": -27.123462677001953, "global_step": 436309, "epoch": 5256} {"train_loss": -26.788578033447266, "global_step": 436310, "epoch": 5256} {"train_loss": -26.94659996032715, "global_step": 436311, "epoch": 5256} {"train_loss": -27.162158966064453, "global_step": 436312, "epoch": 5256} {"train_loss": -26.566869735717773, "global_step": 436313, "epoch": 5256} {"train_loss": -26.983442306518555, "global_step": 436314, "epoch": 5256} {"train_loss": -26.759857177734375, "global_step": 436315, "epoch": 5256} {"train_loss": -25.67494773864746, "global_step": 436316, "epoch": 5256} {"train_loss": -25.898544311523438, "global_step": 436317, "epoch": 5256} {"train_loss": -25.613378524780273, "global_step": 436318, "epoch": 5256} {"train_loss": -26.13484001159668, "global_step": 436319, "epoch": 5256} {"train_loss": -26.922000885009766, "global_step": 436320, "epoch": 5256} {"train_loss": -26.595169067382812, "global_step": 436321, "epoch": 5256} {"train_loss": -26.1455020904541, "global_step": 436322, "epoch": 5256} {"train_loss": -26.912866592407227, "global_step": 436323, "epoch": 5256} {"train_loss": -26.568761825561523, "global_step": 436324, "epoch": 5256} {"train_loss": -26.366077423095703, "global_step": 436325, "epoch": 5256} {"train_loss": -27.03217124938965, "global_step": 436326, "epoch": 5256} {"train_loss": -26.762365341186523, "global_step": 436327, "epoch": 5256} {"train_loss": -26.616668701171875, "global_step": 436328, "epoch": 5256} {"train_loss": -26.546613693237305, "global_step": 436329, "epoch": 5256} {"train_loss": -26.71856218360993, "global_step": 436330, "epoch": 5256, "val_loss": 6634023.5} {"train_loss": -26.415185928344727, "global_step": 436331, "epoch": 5257} {"train_loss": -26.00919532775879, "global_step": 436332, "epoch": 5257} {"train_loss": -26.564428329467773, "global_step": 436333, "epoch": 5257} {"train_loss": -25.857513427734375, "global_step": 436334, "epoch": 5257} {"train_loss": -26.21295738220215, "global_step": 436335, "epoch": 5257} {"train_loss": -26.06392478942871, "global_step": 436336, "epoch": 5257} {"train_loss": -26.07525634765625, "global_step": 436337, "epoch": 5257} {"train_loss": -26.235029220581055, "global_step": 436338, "epoch": 5257} {"train_loss": -26.435449600219727, "global_step": 436339, "epoch": 5257} {"train_loss": -26.35622215270996, "global_step": 436340, "epoch": 5257} {"train_loss": -26.364599227905273, "global_step": 436341, "epoch": 5257} {"train_loss": -26.35943603515625, "global_step": 436342, "epoch": 5257} {"train_loss": -26.10066032409668, "global_step": 436343, "epoch": 5257} {"train_loss": -26.492755889892578, "global_step": 436344, "epoch": 5257} {"train_loss": -26.530765533447266, "global_step": 436345, "epoch": 5257} {"train_loss": -26.34392738342285, "global_step": 436346, "epoch": 5257} {"train_loss": -26.620893478393555, "global_step": 436347, "epoch": 5257} {"train_loss": -26.50721549987793, "global_step": 436348, "epoch": 5257} {"train_loss": -26.71552848815918, "global_step": 436349, "epoch": 5257} {"train_loss": -26.48126792907715, "global_step": 436350, "epoch": 5257} {"train_loss": -26.826635360717773, "global_step": 436351, "epoch": 5257} {"train_loss": -26.651281356811523, "global_step": 436352, "epoch": 5257} {"train_loss": -26.625263214111328, "global_step": 436353, "epoch": 5257} {"train_loss": -27.09766960144043, "global_step": 436354, "epoch": 5257} {"train_loss": -26.749267578125, "global_step": 436355, "epoch": 5257} {"train_loss": -27.08839988708496, "global_step": 436356, "epoch": 5257} {"train_loss": -26.840595245361328, "global_step": 436357, "epoch": 5257} {"train_loss": -27.010217666625977, "global_step": 436358, "epoch": 5257} {"train_loss": -26.93450927734375, "global_step": 436359, "epoch": 5257} {"train_loss": -26.600610733032227, "global_step": 436360, "epoch": 5257} {"train_loss": -26.870325088500977, "global_step": 436361, "epoch": 5257} {"train_loss": -26.99579429626465, "global_step": 436362, "epoch": 5257} {"train_loss": -27.119184494018555, "global_step": 436363, "epoch": 5257} {"train_loss": -26.663593292236328, "global_step": 436364, "epoch": 5257} {"train_loss": -27.100727081298828, "global_step": 436365, "epoch": 5257} {"train_loss": -26.897729873657227, "global_step": 436366, "epoch": 5257} {"train_loss": -26.94550132751465, "global_step": 436367, "epoch": 5257} {"train_loss": -27.075647354125977, "global_step": 436368, "epoch": 5257} {"train_loss": -27.107547760009766, "global_step": 436369, "epoch": 5257} {"train_loss": -26.933826446533203, "global_step": 436370, "epoch": 5257} {"train_loss": -26.896528244018555, "global_step": 436371, "epoch": 5257} {"train_loss": -26.887287139892578, "global_step": 436372, "epoch": 5257} {"train_loss": -26.9252872467041, "global_step": 436373, "epoch": 5257} {"train_loss": -26.642105102539062, "global_step": 436374, "epoch": 5257} {"train_loss": -26.802331924438477, "global_step": 436375, "epoch": 5257} {"train_loss": -27.287586212158203, "global_step": 436376, "epoch": 5257} {"train_loss": -27.1549015045166, "global_step": 436377, "epoch": 5257} {"train_loss": -26.70064353942871, "global_step": 436378, "epoch": 5257} {"train_loss": -26.660490036010742, "global_step": 436379, "epoch": 5257} {"train_loss": -26.91676902770996, "global_step": 436380, "epoch": 5257} {"train_loss": -26.972192764282227, "global_step": 436381, "epoch": 5257} {"train_loss": -27.217992782592773, "global_step": 436382, "epoch": 5257} {"train_loss": -27.015832901000977, "global_step": 436383, "epoch": 5257} {"train_loss": -26.8453426361084, "global_step": 436384, "epoch": 5257} {"train_loss": -26.888898849487305, "global_step": 436385, "epoch": 5257} {"train_loss": -27.135894775390625, "global_step": 436386, "epoch": 5257} {"train_loss": -27.37409019470215, "global_step": 436387, "epoch": 5257} {"train_loss": -27.02007484436035, "global_step": 436388, "epoch": 5257} {"train_loss": -27.225830078125, "global_step": 436389, "epoch": 5257} {"train_loss": -27.037206649780273, "global_step": 436390, "epoch": 5257} {"train_loss": -26.80584144592285, "global_step": 436391, "epoch": 5257} {"train_loss": -26.83857536315918, "global_step": 436392, "epoch": 5257} {"train_loss": -26.883832931518555, "global_step": 436393, "epoch": 5257} {"train_loss": -27.295867919921875, "global_step": 436394, "epoch": 5257} {"train_loss": -27.213491439819336, "global_step": 436395, "epoch": 5257} {"train_loss": -27.073657989501953, "global_step": 436396, "epoch": 5257} {"train_loss": -26.874881744384766, "global_step": 436397, "epoch": 5257} {"train_loss": -26.575292587280273, "global_step": 436398, "epoch": 5257} {"train_loss": -27.062576293945312, "global_step": 436399, "epoch": 5257} {"train_loss": -26.86098289489746, "global_step": 436400, "epoch": 5257} {"train_loss": -27.10297203063965, "global_step": 436401, "epoch": 5257} {"train_loss": -27.033246994018555, "global_step": 436402, "epoch": 5257} {"train_loss": -27.04947280883789, "global_step": 436403, "epoch": 5257} {"train_loss": -27.04900550842285, "global_step": 436404, "epoch": 5257} {"train_loss": -26.700490951538086, "global_step": 436405, "epoch": 5257} {"train_loss": -26.946542739868164, "global_step": 436406, "epoch": 5257} {"train_loss": -26.508291244506836, "global_step": 436407, "epoch": 5257} {"train_loss": -26.46052360534668, "global_step": 436408, "epoch": 5257} {"train_loss": -26.41327476501465, "global_step": 436409, "epoch": 5257} {"train_loss": -26.631689071655273, "global_step": 436410, "epoch": 5257} {"train_loss": -26.907428741455078, "global_step": 436411, "epoch": 5257} {"train_loss": -26.823537826538086, "global_step": 436412, "epoch": 5257} {"train_loss": -26.7715566014669, "global_step": 436413, "epoch": 5257, "val_loss": 6667934.0} {"train_loss": -26.647302627563477, "global_step": 436414, "epoch": 5258} {"train_loss": -26.374624252319336, "global_step": 436415, "epoch": 5258} {"train_loss": -26.308746337890625, "global_step": 436416, "epoch": 5258} {"train_loss": -25.95570945739746, "global_step": 436417, "epoch": 5258} {"train_loss": -26.764371871948242, "global_step": 436418, "epoch": 5258} {"train_loss": -26.684833526611328, "global_step": 436419, "epoch": 5258} {"train_loss": -26.76087760925293, "global_step": 436420, "epoch": 5258} {"train_loss": -26.691669464111328, "global_step": 436421, "epoch": 5258} {"train_loss": -26.520055770874023, "global_step": 436422, "epoch": 5258} {"train_loss": -26.609756469726562, "global_step": 436423, "epoch": 5258} {"train_loss": -26.717731475830078, "global_step": 436424, "epoch": 5258} {"train_loss": -26.816892623901367, "global_step": 436425, "epoch": 5258} {"train_loss": -26.928110122680664, "global_step": 436426, "epoch": 5258} {"train_loss": -26.735776901245117, "global_step": 436427, "epoch": 5258} {"train_loss": -26.697839736938477, "global_step": 436428, "epoch": 5258} {"train_loss": -26.60444450378418, "global_step": 436429, "epoch": 5258} {"train_loss": -26.47589111328125, "global_step": 436430, "epoch": 5258} {"train_loss": -26.81158447265625, "global_step": 436431, "epoch": 5258} {"train_loss": -26.886133193969727, "global_step": 436432, "epoch": 5258} {"train_loss": -26.947614669799805, "global_step": 436433, "epoch": 5258} {"train_loss": -27.19333839416504, "global_step": 436434, "epoch": 5258} {"train_loss": -27.04233169555664, "global_step": 436435, "epoch": 5258} {"train_loss": -26.79682731628418, "global_step": 436436, "epoch": 5258} {"train_loss": -27.0057315826416, "global_step": 436437, "epoch": 5258} {"train_loss": -26.86447525024414, "global_step": 436438, "epoch": 5258} {"train_loss": -26.706933975219727, "global_step": 436439, "epoch": 5258} {"train_loss": -27.144376754760742, "global_step": 436440, "epoch": 5258} {"train_loss": -26.498876571655273, "global_step": 436441, "epoch": 5258} {"train_loss": -26.419055938720703, "global_step": 436442, "epoch": 5258} {"train_loss": -26.961090087890625, "global_step": 436443, "epoch": 5258} {"train_loss": -26.795745849609375, "global_step": 436444, "epoch": 5258} {"train_loss": -25.889312744140625, "global_step": 436445, "epoch": 5258} {"train_loss": -26.462026596069336, "global_step": 436446, "epoch": 5258} {"train_loss": -27.110593795776367, "global_step": 436447, "epoch": 5258} {"train_loss": -26.93767738342285, "global_step": 436448, "epoch": 5258} {"train_loss": -27.073230743408203, "global_step": 436449, "epoch": 5258} {"train_loss": -26.956897735595703, "global_step": 436450, "epoch": 5258} {"train_loss": -26.9442081451416, "global_step": 436451, "epoch": 5258} {"train_loss": -26.430313110351562, "global_step": 436452, "epoch": 5258} {"train_loss": -27.15518569946289, "global_step": 436453, "epoch": 5258} {"train_loss": -26.87415885925293, "global_step": 436454, "epoch": 5258} {"train_loss": -27.010007858276367, "global_step": 436455, "epoch": 5258} {"train_loss": -26.828903198242188, "global_step": 436456, "epoch": 5258} {"train_loss": -26.884552001953125, "global_step": 436457, "epoch": 5258} {"train_loss": -26.768171310424805, "global_step": 436458, "epoch": 5258} {"train_loss": -26.547216415405273, "global_step": 436459, "epoch": 5258} {"train_loss": -26.82527732849121, "global_step": 436460, "epoch": 5258} {"train_loss": -27.066150665283203, "global_step": 436461, "epoch": 5258} {"train_loss": -26.919540405273438, "global_step": 436462, "epoch": 5258} {"train_loss": -26.86878776550293, "global_step": 436463, "epoch": 5258} {"train_loss": -26.866703033447266, "global_step": 436464, "epoch": 5258} {"train_loss": -26.725040435791016, "global_step": 436465, "epoch": 5258} {"train_loss": -26.722183227539062, "global_step": 436466, "epoch": 5258} {"train_loss": -26.920093536376953, "global_step": 436467, "epoch": 5258} {"train_loss": -26.79668617248535, "global_step": 436468, "epoch": 5258} {"train_loss": -27.121173858642578, "global_step": 436469, "epoch": 5258} {"train_loss": -26.838605880737305, "global_step": 436470, "epoch": 5258} {"train_loss": -27.137414932250977, "global_step": 436471, "epoch": 5258} {"train_loss": -27.113988876342773, "global_step": 436472, "epoch": 5258} {"train_loss": -26.995361328125, "global_step": 436473, "epoch": 5258} {"train_loss": -26.747220993041992, "global_step": 436474, "epoch": 5258} {"train_loss": -26.961408615112305, "global_step": 436475, "epoch": 5258} {"train_loss": -26.832677841186523, "global_step": 436476, "epoch": 5258} {"train_loss": -26.974960327148438, "global_step": 436477, "epoch": 5258} {"train_loss": -26.698810577392578, "global_step": 436478, "epoch": 5258} {"train_loss": -27.127180099487305, "global_step": 436479, "epoch": 5258} {"train_loss": -27.133670806884766, "global_step": 436480, "epoch": 5258} {"train_loss": -27.001129150390625, "global_step": 436481, "epoch": 5258} {"train_loss": -26.345142364501953, "global_step": 436482, "epoch": 5258} {"train_loss": -27.00385856628418, "global_step": 436483, "epoch": 5258} {"train_loss": -26.717426300048828, "global_step": 436484, "epoch": 5258} {"train_loss": -26.460721969604492, "global_step": 436485, "epoch": 5258} {"train_loss": -26.547290802001953, "global_step": 436486, "epoch": 5258} {"train_loss": -26.13022232055664, "global_step": 436487, "epoch": 5258} {"train_loss": -26.324695587158203, "global_step": 436488, "epoch": 5258} {"train_loss": -26.318119049072266, "global_step": 436489, "epoch": 5258} {"train_loss": -26.473325729370117, "global_step": 436490, "epoch": 5258} {"train_loss": -26.956003189086914, "global_step": 436491, "epoch": 5258} {"train_loss": -26.804834365844727, "global_step": 436492, "epoch": 5258} {"train_loss": -26.558629989624023, "global_step": 436493, "epoch": 5258} {"train_loss": -26.6148738861084, "global_step": 436494, "epoch": 5258} {"train_loss": -26.67795753479004, "global_step": 436495, "epoch": 5258} {"train_loss": -26.7570296597768, "global_step": 436496, "epoch": 5258, "val_loss": 6536410.0} {"train_loss": -26.054487228393555, "global_step": 436497, "epoch": 5259} {"train_loss": -26.30645751953125, "global_step": 436498, "epoch": 5259} {"train_loss": -26.084217071533203, "global_step": 436499, "epoch": 5259} {"train_loss": -25.297945022583008, "global_step": 436500, "epoch": 5259} {"train_loss": -26.188735961914062, "global_step": 436501, "epoch": 5259} {"train_loss": -25.802505493164062, "global_step": 436502, "epoch": 5259} {"train_loss": -25.83424186706543, "global_step": 436503, "epoch": 5259} {"train_loss": -26.35928726196289, "global_step": 436504, "epoch": 5259} {"train_loss": -26.418170928955078, "global_step": 436505, "epoch": 5259} {"train_loss": -26.053953170776367, "global_step": 436506, "epoch": 5259} {"train_loss": -26.30866050720215, "global_step": 436507, "epoch": 5259} {"train_loss": -26.071796417236328, "global_step": 436508, "epoch": 5259} {"train_loss": -26.4373722076416, "global_step": 436509, "epoch": 5259} {"train_loss": -26.553510665893555, "global_step": 436510, "epoch": 5259} {"train_loss": -26.553119659423828, "global_step": 436511, "epoch": 5259} {"train_loss": -26.434011459350586, "global_step": 436512, "epoch": 5259} {"train_loss": -26.46904945373535, "global_step": 436513, "epoch": 5259} {"train_loss": -26.706266403198242, "global_step": 436514, "epoch": 5259} {"train_loss": -26.647397994995117, "global_step": 436515, "epoch": 5259} {"train_loss": -26.583881378173828, "global_step": 436516, "epoch": 5259} {"train_loss": -26.898883819580078, "global_step": 436517, "epoch": 5259} {"train_loss": -26.79596519470215, "global_step": 436518, "epoch": 5259} {"train_loss": -26.53436279296875, "global_step": 436519, "epoch": 5259} {"train_loss": -26.523584365844727, "global_step": 436520, "epoch": 5259} {"train_loss": -27.097436904907227, "global_step": 436521, "epoch": 5259} {"train_loss": -27.096174240112305, "global_step": 436522, "epoch": 5259} {"train_loss": -26.64531898498535, "global_step": 436523, "epoch": 5259} {"train_loss": -27.36948013305664, "global_step": 436524, "epoch": 5259} {"train_loss": -26.75494384765625, "global_step": 436525, "epoch": 5259} {"train_loss": -27.25526237487793, "global_step": 436526, "epoch": 5259} {"train_loss": -27.012088775634766, "global_step": 436527, "epoch": 5259} {"train_loss": -26.659637451171875, "global_step": 436528, "epoch": 5259} {"train_loss": -26.640043258666992, "global_step": 436529, "epoch": 5259} {"train_loss": -26.879383087158203, "global_step": 436530, "epoch": 5259} {"train_loss": -27.241504669189453, "global_step": 436531, "epoch": 5259} {"train_loss": -27.04349708557129, "global_step": 436532, "epoch": 5259} {"train_loss": -26.832494735717773, "global_step": 436533, "epoch": 5259} {"train_loss": -26.833181381225586, "global_step": 436534, "epoch": 5259} {"train_loss": -27.116424560546875, "global_step": 436535, "epoch": 5259} {"train_loss": -27.221343994140625, "global_step": 436536, "epoch": 5259} {"train_loss": -26.820632934570312, "global_step": 436537, "epoch": 5259} {"train_loss": -27.031620025634766, "global_step": 436538, "epoch": 5259} {"train_loss": -27.309640884399414, "global_step": 436539, "epoch": 5259} {"train_loss": -26.89458656311035, "global_step": 436540, "epoch": 5259} {"train_loss": -27.04041862487793, "global_step": 436541, "epoch": 5259} {"train_loss": -26.764148712158203, "global_step": 436542, "epoch": 5259} {"train_loss": -27.338348388671875, "global_step": 436543, "epoch": 5259} {"train_loss": -27.044235229492188, "global_step": 436544, "epoch": 5259} {"train_loss": -27.257923126220703, "global_step": 436545, "epoch": 5259} {"train_loss": -26.7840576171875, "global_step": 436546, "epoch": 5259} {"train_loss": -27.008636474609375, "global_step": 436547, "epoch": 5259} {"train_loss": -26.985065460205078, "global_step": 436548, "epoch": 5259} {"train_loss": -26.95892333984375, "global_step": 436549, "epoch": 5259} {"train_loss": -27.720325469970703, "global_step": 436550, "epoch": 5259} {"train_loss": -26.976743698120117, "global_step": 436551, "epoch": 5259} {"train_loss": -27.220645904541016, "global_step": 436552, "epoch": 5259} {"train_loss": -27.312036514282227, "global_step": 436553, "epoch": 5259} {"train_loss": -26.966028213500977, "global_step": 436554, "epoch": 5259} {"train_loss": -26.72675895690918, "global_step": 436555, "epoch": 5259} {"train_loss": -27.21357536315918, "global_step": 436556, "epoch": 5259} {"train_loss": -26.794036865234375, "global_step": 436557, "epoch": 5259} {"train_loss": -26.686853408813477, "global_step": 436558, "epoch": 5259} {"train_loss": -26.978235244750977, "global_step": 436559, "epoch": 5259} {"train_loss": -26.544422149658203, "global_step": 436560, "epoch": 5259} {"train_loss": -27.04347038269043, "global_step": 436561, "epoch": 5259} {"train_loss": -26.920984268188477, "global_step": 436562, "epoch": 5259} {"train_loss": -26.845691680908203, "global_step": 436563, "epoch": 5259} {"train_loss": -26.623037338256836, "global_step": 436564, "epoch": 5259} {"train_loss": -26.765628814697266, "global_step": 436565, "epoch": 5259} {"train_loss": -26.929773330688477, "global_step": 436566, "epoch": 5259} {"train_loss": -26.732223510742188, "global_step": 436567, "epoch": 5259} {"train_loss": -26.87702751159668, "global_step": 436568, "epoch": 5259} {"train_loss": -27.11467933654785, "global_step": 436569, "epoch": 5259} {"train_loss": -26.535551071166992, "global_step": 436570, "epoch": 5259} {"train_loss": -26.84119987487793, "global_step": 436571, "epoch": 5259} {"train_loss": -26.624353408813477, "global_step": 436572, "epoch": 5259} {"train_loss": -26.72895622253418, "global_step": 436573, "epoch": 5259} {"train_loss": -26.716535568237305, "global_step": 436574, "epoch": 5259} {"train_loss": -27.050556182861328, "global_step": 436575, "epoch": 5259} {"train_loss": -26.645294189453125, "global_step": 436576, "epoch": 5259} {"train_loss": -26.6044864654541, "global_step": 436577, "epoch": 5259} {"train_loss": -27.103635787963867, "global_step": 436578, "epoch": 5259} {"train_loss": -26.756764032754553, "global_step": 436579, "epoch": 5259, "val_loss": 6700448.0} {"train_loss": -26.631025314331055, "global_step": 436580, "epoch": 5260} {"train_loss": -25.830615997314453, "global_step": 436581, "epoch": 5260} {"train_loss": -26.606964111328125, "global_step": 436582, "epoch": 5260} {"train_loss": -26.415327072143555, "global_step": 436583, "epoch": 5260} {"train_loss": -26.77072525024414, "global_step": 436584, "epoch": 5260} {"train_loss": -26.80024528503418, "global_step": 436585, "epoch": 5260} {"train_loss": -26.694595336914062, "global_step": 436586, "epoch": 5260} {"train_loss": -26.568288803100586, "global_step": 436587, "epoch": 5260} {"train_loss": -26.723142623901367, "global_step": 436588, "epoch": 5260} {"train_loss": -26.737995147705078, "global_step": 436589, "epoch": 5260} {"train_loss": -26.44879150390625, "global_step": 436590, "epoch": 5260} {"train_loss": -26.53264808654785, "global_step": 436591, "epoch": 5260} {"train_loss": -26.671329498291016, "global_step": 436592, "epoch": 5260} {"train_loss": -26.700342178344727, "global_step": 436593, "epoch": 5260} {"train_loss": -26.881988525390625, "global_step": 436594, "epoch": 5260} {"train_loss": -26.608728408813477, "global_step": 436595, "epoch": 5260} {"train_loss": -26.64198112487793, "global_step": 436596, "epoch": 5260} {"train_loss": -26.562713623046875, "global_step": 436597, "epoch": 5260} {"train_loss": -26.943012237548828, "global_step": 436598, "epoch": 5260} {"train_loss": -26.740331649780273, "global_step": 436599, "epoch": 5260} {"train_loss": -26.85856056213379, "global_step": 436600, "epoch": 5260} {"train_loss": -27.079654693603516, "global_step": 436601, "epoch": 5260} {"train_loss": -26.9731388092041, "global_step": 436602, "epoch": 5260} {"train_loss": -26.35500144958496, "global_step": 436603, "epoch": 5260} {"train_loss": -27.109460830688477, "global_step": 436604, "epoch": 5260} {"train_loss": -26.907012939453125, "global_step": 436605, "epoch": 5260} {"train_loss": -26.8029727935791, "global_step": 436606, "epoch": 5260} {"train_loss": -26.627676010131836, "global_step": 436607, "epoch": 5260} {"train_loss": -27.13031578063965, "global_step": 436608, "epoch": 5260} {"train_loss": -26.978229522705078, "global_step": 436609, "epoch": 5260} {"train_loss": -27.02450942993164, "global_step": 436610, "epoch": 5260} {"train_loss": -27.098241806030273, "global_step": 436611, "epoch": 5260} {"train_loss": -27.082029342651367, "global_step": 436612, "epoch": 5260} {"train_loss": -26.8312931060791, "global_step": 436613, "epoch": 5260} {"train_loss": -27.28560447692871, "global_step": 436614, "epoch": 5260} {"train_loss": -26.794340133666992, "global_step": 436615, "epoch": 5260} {"train_loss": -26.852619171142578, "global_step": 436616, "epoch": 5260} {"train_loss": -26.6099910736084, "global_step": 436617, "epoch": 5260} {"train_loss": -26.827911376953125, "global_step": 436618, "epoch": 5260} {"train_loss": -27.154077529907227, "global_step": 436619, "epoch": 5260} {"train_loss": -26.722089767456055, "global_step": 436620, "epoch": 5260} {"train_loss": -26.804853439331055, "global_step": 436621, "epoch": 5260} {"train_loss": -26.905981063842773, "global_step": 436622, "epoch": 5260} {"train_loss": -27.35035514831543, "global_step": 436623, "epoch": 5260} {"train_loss": -26.956579208374023, "global_step": 436624, "epoch": 5260} {"train_loss": -26.836206436157227, "global_step": 436625, "epoch": 5260} {"train_loss": -26.72416114807129, "global_step": 436626, "epoch": 5260} {"train_loss": -26.800891876220703, "global_step": 436627, "epoch": 5260} {"train_loss": -27.225387573242188, "global_step": 436628, "epoch": 5260} {"train_loss": -26.60120964050293, "global_step": 436629, "epoch": 5260} {"train_loss": -26.972787857055664, "global_step": 436630, "epoch": 5260} {"train_loss": -27.019739151000977, "global_step": 436631, "epoch": 5260} {"train_loss": -26.712705612182617, "global_step": 436632, "epoch": 5260} {"train_loss": -26.568683624267578, "global_step": 436633, "epoch": 5260} {"train_loss": -26.380176544189453, "global_step": 436634, "epoch": 5260} {"train_loss": -26.976715087890625, "global_step": 436635, "epoch": 5260} {"train_loss": -26.848417282104492, "global_step": 436636, "epoch": 5260} {"train_loss": -27.03167724609375, "global_step": 436637, "epoch": 5260} {"train_loss": -26.77345848083496, "global_step": 436638, "epoch": 5260} {"train_loss": -27.021596908569336, "global_step": 436639, "epoch": 5260} {"train_loss": -26.7554874420166, "global_step": 436640, "epoch": 5260} {"train_loss": -27.242664337158203, "global_step": 436641, "epoch": 5260} {"train_loss": -26.889108657836914, "global_step": 436642, "epoch": 5260} {"train_loss": -26.6059627532959, "global_step": 436643, "epoch": 5260} {"train_loss": -26.884912490844727, "global_step": 436644, "epoch": 5260} {"train_loss": -26.962812423706055, "global_step": 436645, "epoch": 5260} {"train_loss": -26.812393188476562, "global_step": 436646, "epoch": 5260} {"train_loss": -27.0137882232666, "global_step": 436647, "epoch": 5260} {"train_loss": -26.972309112548828, "global_step": 436648, "epoch": 5260} {"train_loss": -26.959808349609375, "global_step": 436649, "epoch": 5260} {"train_loss": -26.86689567565918, "global_step": 436650, "epoch": 5260} {"train_loss": -26.71234703063965, "global_step": 436651, "epoch": 5260} {"train_loss": -27.159515380859375, "global_step": 436652, "epoch": 5260} {"train_loss": -26.808216094970703, "global_step": 436653, "epoch": 5260} {"train_loss": -26.95623779296875, "global_step": 436654, "epoch": 5260} {"train_loss": -27.507038116455078, "global_step": 436655, "epoch": 5260} {"train_loss": -27.074132919311523, "global_step": 436656, "epoch": 5260} {"train_loss": -26.97112464904785, "global_step": 436657, "epoch": 5260} {"train_loss": -27.19087791442871, "global_step": 436658, "epoch": 5260} {"train_loss": -26.788131713867188, "global_step": 436659, "epoch": 5260} {"train_loss": -27.359655380249023, "global_step": 436660, "epoch": 5260} {"train_loss": -27.220518112182617, "global_step": 436661, "epoch": 5260} {"train_loss": -26.851817234452948, "global_step": 436662, "epoch": 5260, "val_loss": 6609130.5} {"train_loss": -27.031347274780273, "global_step": 436663, "epoch": 5261} {"train_loss": -26.93500328063965, "global_step": 436664, "epoch": 5261} {"train_loss": -26.46955680847168, "global_step": 436665, "epoch": 5261} {"train_loss": -26.557641983032227, "global_step": 436666, "epoch": 5261} {"train_loss": -26.826704025268555, "global_step": 436667, "epoch": 5261} {"train_loss": -26.535009384155273, "global_step": 436668, "epoch": 5261} {"train_loss": -25.971755981445312, "global_step": 436669, "epoch": 5261} {"train_loss": -26.185102462768555, "global_step": 436670, "epoch": 5261} {"train_loss": -26.399747848510742, "global_step": 436671, "epoch": 5261} {"train_loss": -27.019834518432617, "global_step": 436672, "epoch": 5261} {"train_loss": -26.85666275024414, "global_step": 436673, "epoch": 5261} {"train_loss": -26.84808349609375, "global_step": 436674, "epoch": 5261} {"train_loss": -26.70102882385254, "global_step": 436675, "epoch": 5261} {"train_loss": -26.611820220947266, "global_step": 436676, "epoch": 5261} {"train_loss": -27.19449806213379, "global_step": 436677, "epoch": 5261} {"train_loss": -26.95903968811035, "global_step": 436678, "epoch": 5261} {"train_loss": -27.02619743347168, "global_step": 436679, "epoch": 5261} {"train_loss": -26.446638107299805, "global_step": 436680, "epoch": 5261} {"train_loss": -26.93951416015625, "global_step": 436681, "epoch": 5261} {"train_loss": -26.77594566345215, "global_step": 436682, "epoch": 5261} {"train_loss": -26.718555450439453, "global_step": 436683, "epoch": 5261} {"train_loss": -26.7364559173584, "global_step": 436684, "epoch": 5261} {"train_loss": -26.76429557800293, "global_step": 436685, "epoch": 5261} {"train_loss": -27.133209228515625, "global_step": 436686, "epoch": 5261} {"train_loss": -26.79169273376465, "global_step": 436687, "epoch": 5261} {"train_loss": -26.8230037689209, "global_step": 436688, "epoch": 5261} {"train_loss": -26.921293258666992, "global_step": 436689, "epoch": 5261} {"train_loss": -26.904102325439453, "global_step": 436690, "epoch": 5261} {"train_loss": -27.47870445251465, "global_step": 436691, "epoch": 5261} {"train_loss": -26.80206871032715, "global_step": 436692, "epoch": 5261} {"train_loss": -27.254907608032227, "global_step": 436693, "epoch": 5261} {"train_loss": -26.655588150024414, "global_step": 436694, "epoch": 5261} {"train_loss": -27.462278366088867, "global_step": 436695, "epoch": 5261} {"train_loss": -27.199121475219727, "global_step": 436696, "epoch": 5261} {"train_loss": -27.130157470703125, "global_step": 436697, "epoch": 5261} {"train_loss": -26.998571395874023, "global_step": 436698, "epoch": 5261} {"train_loss": -26.787841796875, "global_step": 436699, "epoch": 5261} {"train_loss": -27.29987907409668, "global_step": 436700, "epoch": 5261} {"train_loss": -27.145917892456055, "global_step": 436701, "epoch": 5261} {"train_loss": -27.011205673217773, "global_step": 436702, "epoch": 5261} {"train_loss": -27.077329635620117, "global_step": 436703, "epoch": 5261} {"train_loss": -27.15631103515625, "global_step": 436704, "epoch": 5261} {"train_loss": -27.105417251586914, "global_step": 436705, "epoch": 5261} {"train_loss": -27.089252471923828, "global_step": 436706, "epoch": 5261} {"train_loss": -26.616653442382812, "global_step": 436707, "epoch": 5261} {"train_loss": -27.02231788635254, "global_step": 436708, "epoch": 5261} {"train_loss": -27.012104034423828, "global_step": 436709, "epoch": 5261} {"train_loss": -27.07423210144043, "global_step": 436710, "epoch": 5261} {"train_loss": -26.9677791595459, "global_step": 436711, "epoch": 5261} {"train_loss": -27.154199600219727, "global_step": 436712, "epoch": 5261} {"train_loss": -27.152151107788086, "global_step": 436713, "epoch": 5261} {"train_loss": -26.879621505737305, "global_step": 436714, "epoch": 5261} {"train_loss": -27.054609298706055, "global_step": 436715, "epoch": 5261} {"train_loss": -26.54139518737793, "global_step": 436716, "epoch": 5261} {"train_loss": -26.0157413482666, "global_step": 436717, "epoch": 5261} {"train_loss": -25.399438858032227, "global_step": 436718, "epoch": 5261} {"train_loss": -25.084442138671875, "global_step": 436719, "epoch": 5261} {"train_loss": -26.529993057250977, "global_step": 436720, "epoch": 5261} {"train_loss": -26.45648193359375, "global_step": 436721, "epoch": 5261} {"train_loss": -27.21698570251465, "global_step": 436722, "epoch": 5261} {"train_loss": -26.405908584594727, "global_step": 436723, "epoch": 5261} {"train_loss": -26.408315658569336, "global_step": 436724, "epoch": 5261} {"train_loss": -26.808576583862305, "global_step": 436725, "epoch": 5261} {"train_loss": -26.46770668029785, "global_step": 436726, "epoch": 5261} {"train_loss": -26.47702407836914, "global_step": 436727, "epoch": 5261} {"train_loss": -26.996753692626953, "global_step": 436728, "epoch": 5261} {"train_loss": -26.81951332092285, "global_step": 436729, "epoch": 5261} {"train_loss": -26.416913986206055, "global_step": 436730, "epoch": 5261} {"train_loss": -26.790388107299805, "global_step": 436731, "epoch": 5261} {"train_loss": -26.73695945739746, "global_step": 436732, "epoch": 5261} {"train_loss": -26.723386764526367, "global_step": 436733, "epoch": 5261} {"train_loss": -26.9664306640625, "global_step": 436734, "epoch": 5261} {"train_loss": -26.602008819580078, "global_step": 436735, "epoch": 5261} {"train_loss": -26.873884201049805, "global_step": 436736, "epoch": 5261} {"train_loss": -26.881317138671875, "global_step": 436737, "epoch": 5261} {"train_loss": -26.77620506286621, "global_step": 436738, "epoch": 5261} {"train_loss": -27.14325523376465, "global_step": 436739, "epoch": 5261} {"train_loss": -26.662677764892578, "global_step": 436740, "epoch": 5261} {"train_loss": -27.182600021362305, "global_step": 436741, "epoch": 5261} {"train_loss": -26.817319869995117, "global_step": 436742, "epoch": 5261} {"train_loss": -26.80073356628418, "global_step": 436743, "epoch": 5261} {"train_loss": -27.05742835998535, "global_step": 436744, "epoch": 5261} {"train_loss": -26.813971416059747, "global_step": 436745, "epoch": 5261, "val_loss": 6614826.5} {"train_loss": -26.293310165405273, "global_step": 436746, "epoch": 5262} {"train_loss": -26.423086166381836, "global_step": 436747, "epoch": 5262} {"train_loss": -26.619903564453125, "global_step": 436748, "epoch": 5262} {"train_loss": -26.576364517211914, "global_step": 436749, "epoch": 5262} {"train_loss": -26.363855361938477, "global_step": 436750, "epoch": 5262} {"train_loss": -26.55341148376465, "global_step": 436751, "epoch": 5262} {"train_loss": -26.642841339111328, "global_step": 436752, "epoch": 5262} {"train_loss": -27.05775260925293, "global_step": 436753, "epoch": 5262} {"train_loss": -26.752180099487305, "global_step": 436754, "epoch": 5262} {"train_loss": -26.872119903564453, "global_step": 436755, "epoch": 5262} {"train_loss": -26.944875717163086, "global_step": 436756, "epoch": 5262} {"train_loss": -26.948938369750977, "global_step": 436757, "epoch": 5262} {"train_loss": -26.738388061523438, "global_step": 436758, "epoch": 5262} {"train_loss": -26.946075439453125, "global_step": 436759, "epoch": 5262} {"train_loss": -26.956335067749023, "global_step": 436760, "epoch": 5262} {"train_loss": -27.086820602416992, "global_step": 436761, "epoch": 5262} {"train_loss": -26.671142578125, "global_step": 436762, "epoch": 5262} {"train_loss": -26.782690048217773, "global_step": 436763, "epoch": 5262} {"train_loss": -27.271106719970703, "global_step": 436764, "epoch": 5262} {"train_loss": -26.766523361206055, "global_step": 436765, "epoch": 5262} {"train_loss": -27.11174964904785, "global_step": 436766, "epoch": 5262} {"train_loss": -26.99053382873535, "global_step": 436767, "epoch": 5262} {"train_loss": -27.129852294921875, "global_step": 436768, "epoch": 5262} {"train_loss": -27.135889053344727, "global_step": 436769, "epoch": 5262} {"train_loss": -27.027002334594727, "global_step": 436770, "epoch": 5262} {"train_loss": -27.287771224975586, "global_step": 436771, "epoch": 5262} {"train_loss": -27.251447677612305, "global_step": 436772, "epoch": 5262} {"train_loss": -27.17225456237793, "global_step": 436773, "epoch": 5262} {"train_loss": -27.245346069335938, "global_step": 436774, "epoch": 5262} {"train_loss": -26.795202255249023, "global_step": 436775, "epoch": 5262} {"train_loss": -27.15620231628418, "global_step": 436776, "epoch": 5262} {"train_loss": -26.82427978515625, "global_step": 436777, "epoch": 5262} {"train_loss": -27.1458797454834, "global_step": 436778, "epoch": 5262} {"train_loss": -26.828710556030273, "global_step": 436779, "epoch": 5262} {"train_loss": -26.87980079650879, "global_step": 436780, "epoch": 5262} {"train_loss": -26.8090877532959, "global_step": 436781, "epoch": 5262} {"train_loss": -26.979736328125, "global_step": 436782, "epoch": 5262} {"train_loss": -27.276060104370117, "global_step": 436783, "epoch": 5262} {"train_loss": -26.519519805908203, "global_step": 436784, "epoch": 5262} {"train_loss": -26.595172882080078, "global_step": 436785, "epoch": 5262} {"train_loss": -26.837697982788086, "global_step": 436786, "epoch": 5262} {"train_loss": -27.27777099609375, "global_step": 436787, "epoch": 5262} {"train_loss": -26.9995059967041, "global_step": 436788, "epoch": 5262} {"train_loss": -26.858428955078125, "global_step": 436789, "epoch": 5262} {"train_loss": -26.604360580444336, "global_step": 436790, "epoch": 5262} {"train_loss": -26.817270278930664, "global_step": 436791, "epoch": 5262} {"train_loss": -26.90254020690918, "global_step": 436792, "epoch": 5262} {"train_loss": -26.85735511779785, "global_step": 436793, "epoch": 5262} {"train_loss": -26.676055908203125, "global_step": 436794, "epoch": 5262} {"train_loss": -26.6719970703125, "global_step": 436795, "epoch": 5262} {"train_loss": -26.8649845123291, "global_step": 436796, "epoch": 5262} {"train_loss": -26.966054916381836, "global_step": 436797, "epoch": 5262} {"train_loss": -27.221521377563477, "global_step": 436798, "epoch": 5262} {"train_loss": -26.862762451171875, "global_step": 436799, "epoch": 5262} {"train_loss": -27.09760856628418, "global_step": 436800, "epoch": 5262} {"train_loss": -27.04481315612793, "global_step": 436801, "epoch": 5262} {"train_loss": -26.988698959350586, "global_step": 436802, "epoch": 5262} {"train_loss": -27.003625869750977, "global_step": 436803, "epoch": 5262} {"train_loss": -26.853118896484375, "global_step": 436804, "epoch": 5262} {"train_loss": -26.67426872253418, "global_step": 436805, "epoch": 5262} {"train_loss": -26.924701690673828, "global_step": 436806, "epoch": 5262} {"train_loss": -26.77960205078125, "global_step": 436807, "epoch": 5262} {"train_loss": -27.024560928344727, "global_step": 436808, "epoch": 5262} {"train_loss": -26.81805419921875, "global_step": 436809, "epoch": 5262} {"train_loss": -26.9417781829834, "global_step": 436810, "epoch": 5262} {"train_loss": -26.948389053344727, "global_step": 436811, "epoch": 5262} {"train_loss": -27.045602798461914, "global_step": 436812, "epoch": 5262} {"train_loss": -26.747882843017578, "global_step": 436813, "epoch": 5262} {"train_loss": -27.012741088867188, "global_step": 436814, "epoch": 5262} {"train_loss": -26.914823532104492, "global_step": 436815, "epoch": 5262} {"train_loss": -27.087003707885742, "global_step": 436816, "epoch": 5262} {"train_loss": -26.78367042541504, "global_step": 436817, "epoch": 5262} {"train_loss": -27.40478515625, "global_step": 436818, "epoch": 5262} {"train_loss": -26.6668758392334, "global_step": 436819, "epoch": 5262} {"train_loss": -27.331592559814453, "global_step": 436820, "epoch": 5262} {"train_loss": -26.796802520751953, "global_step": 436821, "epoch": 5262} {"train_loss": -26.92377281188965, "global_step": 436822, "epoch": 5262} {"train_loss": -27.224231719970703, "global_step": 436823, "epoch": 5262} {"train_loss": -27.219806671142578, "global_step": 436824, "epoch": 5262} {"train_loss": -27.094465255737305, "global_step": 436825, "epoch": 5262} {"train_loss": -26.8999080657959, "global_step": 436826, "epoch": 5262} {"train_loss": -26.969816207885742, "global_step": 436827, "epoch": 5262} {"train_loss": -26.911213978227362, "global_step": 436828, "epoch": 5262, "val_loss": 6643356.0} {"train_loss": -26.166873931884766, "global_step": 436829, "epoch": 5263} {"train_loss": -26.778772354125977, "global_step": 436830, "epoch": 5263} {"train_loss": -26.743688583374023, "global_step": 436831, "epoch": 5263} {"train_loss": -26.648157119750977, "global_step": 436832, "epoch": 5263} {"train_loss": -26.37432289123535, "global_step": 436833, "epoch": 5263} {"train_loss": -26.48423194885254, "global_step": 436834, "epoch": 5263} {"train_loss": -26.7294979095459, "global_step": 436835, "epoch": 5263} {"train_loss": -26.875761032104492, "global_step": 436836, "epoch": 5263} {"train_loss": -26.408645629882812, "global_step": 436837, "epoch": 5263} {"train_loss": -26.51936149597168, "global_step": 436838, "epoch": 5263} {"train_loss": -26.7585506439209, "global_step": 436839, "epoch": 5263} {"train_loss": -26.69394302368164, "global_step": 436840, "epoch": 5263} {"train_loss": -26.716388702392578, "global_step": 436841, "epoch": 5263} {"train_loss": -26.913162231445312, "global_step": 436842, "epoch": 5263} {"train_loss": -26.634765625, "global_step": 436843, "epoch": 5263} {"train_loss": -27.032764434814453, "global_step": 436844, "epoch": 5263} {"train_loss": -26.892454147338867, "global_step": 436845, "epoch": 5263} {"train_loss": -26.61978530883789, "global_step": 436846, "epoch": 5263} {"train_loss": -27.0430908203125, "global_step": 436847, "epoch": 5263} {"train_loss": -26.93361473083496, "global_step": 436848, "epoch": 5263} {"train_loss": -27.017520904541016, "global_step": 436849, "epoch": 5263} {"train_loss": -26.759611129760742, "global_step": 436850, "epoch": 5263} {"train_loss": -26.4232177734375, "global_step": 436851, "epoch": 5263} {"train_loss": -26.798572540283203, "global_step": 436852, "epoch": 5263} {"train_loss": -26.864776611328125, "global_step": 436853, "epoch": 5263} {"train_loss": -26.75420570373535, "global_step": 436854, "epoch": 5263} {"train_loss": -27.008825302124023, "global_step": 436855, "epoch": 5263} {"train_loss": -27.14908218383789, "global_step": 436856, "epoch": 5263} {"train_loss": -26.831396102905273, "global_step": 436857, "epoch": 5263} {"train_loss": -27.059101104736328, "global_step": 436858, "epoch": 5263} {"train_loss": -26.861282348632812, "global_step": 436859, "epoch": 5263} {"train_loss": -27.1876277923584, "global_step": 436860, "epoch": 5263} {"train_loss": -27.078022003173828, "global_step": 436861, "epoch": 5263} {"train_loss": -26.717443466186523, "global_step": 436862, "epoch": 5263} {"train_loss": -27.067174911499023, "global_step": 436863, "epoch": 5263} {"train_loss": -27.056415557861328, "global_step": 436864, "epoch": 5263} {"train_loss": -27.30535888671875, "global_step": 436865, "epoch": 5263} {"train_loss": -26.907434463500977, "global_step": 436866, "epoch": 5263} {"train_loss": -27.02898597717285, "global_step": 436867, "epoch": 5263} {"train_loss": -27.234272003173828, "global_step": 436868, "epoch": 5263} {"train_loss": -26.7445011138916, "global_step": 436869, "epoch": 5263} {"train_loss": -26.893346786499023, "global_step": 436870, "epoch": 5263} {"train_loss": -26.61822509765625, "global_step": 436871, "epoch": 5263} {"train_loss": -27.06928825378418, "global_step": 436872, "epoch": 5263} {"train_loss": -27.31471061706543, "global_step": 436873, "epoch": 5263} {"train_loss": -26.69537353515625, "global_step": 436874, "epoch": 5263} {"train_loss": -26.832199096679688, "global_step": 436875, "epoch": 5263} {"train_loss": -26.77815055847168, "global_step": 436876, "epoch": 5263} {"train_loss": -27.1716365814209, "global_step": 436877, "epoch": 5263} {"train_loss": -27.1064453125, "global_step": 436878, "epoch": 5263} {"train_loss": -26.726810455322266, "global_step": 436879, "epoch": 5263} {"train_loss": -26.607141494750977, "global_step": 436880, "epoch": 5263} {"train_loss": -26.964313507080078, "global_step": 436881, "epoch": 5263} {"train_loss": -27.134403228759766, "global_step": 436882, "epoch": 5263} {"train_loss": -26.722610473632812, "global_step": 436883, "epoch": 5263} {"train_loss": -27.14312744140625, "global_step": 436884, "epoch": 5263} {"train_loss": -26.960845947265625, "global_step": 436885, "epoch": 5263} {"train_loss": -26.93678092956543, "global_step": 436886, "epoch": 5263} {"train_loss": -26.583362579345703, "global_step": 436887, "epoch": 5263} {"train_loss": -26.7802791595459, "global_step": 436888, "epoch": 5263} {"train_loss": -27.133935928344727, "global_step": 436889, "epoch": 5263} {"train_loss": -27.316883087158203, "global_step": 436890, "epoch": 5263} {"train_loss": -26.685123443603516, "global_step": 436891, "epoch": 5263} {"train_loss": -26.63863182067871, "global_step": 436892, "epoch": 5263} {"train_loss": -26.792097091674805, "global_step": 436893, "epoch": 5263} {"train_loss": -26.638696670532227, "global_step": 436894, "epoch": 5263} {"train_loss": -27.127607345581055, "global_step": 436895, "epoch": 5263} {"train_loss": -27.14393424987793, "global_step": 436896, "epoch": 5263} {"train_loss": -27.08405876159668, "global_step": 436897, "epoch": 5263} {"train_loss": -27.2076473236084, "global_step": 436898, "epoch": 5263} {"train_loss": -26.87006187438965, "global_step": 436899, "epoch": 5263} {"train_loss": -26.583328247070312, "global_step": 436900, "epoch": 5263} {"train_loss": -26.899688720703125, "global_step": 436901, "epoch": 5263} {"train_loss": -27.11689567565918, "global_step": 436902, "epoch": 5263} {"train_loss": -27.4957218170166, "global_step": 436903, "epoch": 5263} {"train_loss": -26.999135971069336, "global_step": 436904, "epoch": 5263} {"train_loss": -26.881616592407227, "global_step": 436905, "epoch": 5263} {"train_loss": -26.88962745666504, "global_step": 436906, "epoch": 5263} {"train_loss": -26.978229522705078, "global_step": 436907, "epoch": 5263} {"train_loss": -26.891386032104492, "global_step": 436908, "epoch": 5263} {"train_loss": -26.920398712158203, "global_step": 436909, "epoch": 5263} {"train_loss": -26.879552841186523, "global_step": 436910, "epoch": 5263} {"train_loss": -26.875229847000305, "global_step": 436911, "epoch": 5263, "val_loss": 6546189.0} {"train_loss": -26.456098556518555, "global_step": 436912, "epoch": 5264} {"train_loss": -26.765823364257812, "global_step": 436913, "epoch": 5264} {"train_loss": -26.952362060546875, "global_step": 436914, "epoch": 5264} {"train_loss": -26.868188858032227, "global_step": 436915, "epoch": 5264} {"train_loss": -26.29323387145996, "global_step": 436916, "epoch": 5264} {"train_loss": -26.743061065673828, "global_step": 436917, "epoch": 5264} {"train_loss": -26.775548934936523, "global_step": 436918, "epoch": 5264} {"train_loss": -26.584630966186523, "global_step": 436919, "epoch": 5264} {"train_loss": -26.476123809814453, "global_step": 436920, "epoch": 5264} {"train_loss": -27.003631591796875, "global_step": 436921, "epoch": 5264} {"train_loss": -26.450927734375, "global_step": 436922, "epoch": 5264} {"train_loss": -26.898237228393555, "global_step": 436923, "epoch": 5264} {"train_loss": -26.418256759643555, "global_step": 436924, "epoch": 5264} {"train_loss": -26.4263916015625, "global_step": 436925, "epoch": 5264} {"train_loss": -26.431528091430664, "global_step": 436926, "epoch": 5264} {"train_loss": -26.855228424072266, "global_step": 436927, "epoch": 5264} {"train_loss": -26.4376163482666, "global_step": 436928, "epoch": 5264} {"train_loss": -27.31255531311035, "global_step": 436929, "epoch": 5264} {"train_loss": -26.93075942993164, "global_step": 436930, "epoch": 5264} {"train_loss": -26.484899520874023, "global_step": 436931, "epoch": 5264} {"train_loss": -27.063566207885742, "global_step": 436932, "epoch": 5264} {"train_loss": -26.433486938476562, "global_step": 436933, "epoch": 5264} {"train_loss": -26.70655632019043, "global_step": 436934, "epoch": 5264} {"train_loss": -26.849058151245117, "global_step": 436935, "epoch": 5264} {"train_loss": -26.7426815032959, "global_step": 436936, "epoch": 5264} {"train_loss": -26.849130630493164, "global_step": 436937, "epoch": 5264} {"train_loss": -26.981006622314453, "global_step": 436938, "epoch": 5264} {"train_loss": -26.853809356689453, "global_step": 436939, "epoch": 5264} {"train_loss": -26.92305564880371, "global_step": 436940, "epoch": 5264} {"train_loss": -27.122406005859375, "global_step": 436941, "epoch": 5264} {"train_loss": -26.915714263916016, "global_step": 436942, "epoch": 5264} {"train_loss": -26.707538604736328, "global_step": 436943, "epoch": 5264} {"train_loss": -26.973007202148438, "global_step": 436944, "epoch": 5264} {"train_loss": -26.583845138549805, "global_step": 436945, "epoch": 5264} {"train_loss": -27.218006134033203, "global_step": 436946, "epoch": 5264} {"train_loss": -26.702274322509766, "global_step": 436947, "epoch": 5264} {"train_loss": -27.010950088500977, "global_step": 436948, "epoch": 5264} {"train_loss": -27.005231857299805, "global_step": 436949, "epoch": 5264} {"train_loss": -26.930822372436523, "global_step": 436950, "epoch": 5264} {"train_loss": -26.675973892211914, "global_step": 436951, "epoch": 5264} {"train_loss": -27.100309371948242, "global_step": 436952, "epoch": 5264} {"train_loss": -26.8646297454834, "global_step": 436953, "epoch": 5264} {"train_loss": -27.22063636779785, "global_step": 436954, "epoch": 5264} {"train_loss": -27.062585830688477, "global_step": 436955, "epoch": 5264} {"train_loss": -26.84339714050293, "global_step": 436956, "epoch": 5264} {"train_loss": -27.176528930664062, "global_step": 436957, "epoch": 5264} {"train_loss": -27.280271530151367, "global_step": 436958, "epoch": 5264} {"train_loss": -26.57161521911621, "global_step": 436959, "epoch": 5264} {"train_loss": -26.814489364624023, "global_step": 436960, "epoch": 5264} {"train_loss": -27.218708038330078, "global_step": 436961, "epoch": 5264} {"train_loss": -26.772491455078125, "global_step": 436962, "epoch": 5264} {"train_loss": -26.86429786682129, "global_step": 436963, "epoch": 5264} {"train_loss": -27.138824462890625, "global_step": 436964, "epoch": 5264} {"train_loss": -26.48101234436035, "global_step": 436965, "epoch": 5264} {"train_loss": -27.279693603515625, "global_step": 436966, "epoch": 5264} {"train_loss": -26.832807540893555, "global_step": 436967, "epoch": 5264} {"train_loss": -26.542783737182617, "global_step": 436968, "epoch": 5264} {"train_loss": -27.160175323486328, "global_step": 436969, "epoch": 5264} {"train_loss": -26.5308837890625, "global_step": 436970, "epoch": 5264} {"train_loss": -26.24747657775879, "global_step": 436971, "epoch": 5264} {"train_loss": -27.033227920532227, "global_step": 436972, "epoch": 5264} {"train_loss": -26.78387451171875, "global_step": 436973, "epoch": 5264} {"train_loss": -27.0946044921875, "global_step": 436974, "epoch": 5264} {"train_loss": -26.777978897094727, "global_step": 436975, "epoch": 5264} {"train_loss": -26.710248947143555, "global_step": 436976, "epoch": 5264} {"train_loss": -26.864049911499023, "global_step": 436977, "epoch": 5264} {"train_loss": -26.925506591796875, "global_step": 436978, "epoch": 5264} {"train_loss": -27.047534942626953, "global_step": 436979, "epoch": 5264} {"train_loss": -27.13435935974121, "global_step": 436980, "epoch": 5264} {"train_loss": -27.07777976989746, "global_step": 436981, "epoch": 5264} {"train_loss": -26.842788696289062, "global_step": 436982, "epoch": 5264} {"train_loss": -27.101728439331055, "global_step": 436983, "epoch": 5264} {"train_loss": -27.02666664123535, "global_step": 436984, "epoch": 5264} {"train_loss": -26.986204147338867, "global_step": 436985, "epoch": 5264} {"train_loss": -27.160810470581055, "global_step": 436986, "epoch": 5264} {"train_loss": -26.833784103393555, "global_step": 436987, "epoch": 5264} {"train_loss": -27.04023551940918, "global_step": 436988, "epoch": 5264} {"train_loss": -26.63934326171875, "global_step": 436989, "epoch": 5264} {"train_loss": -26.88529396057129, "global_step": 436990, "epoch": 5264} {"train_loss": -27.33234977722168, "global_step": 436991, "epoch": 5264} {"train_loss": -26.803211212158203, "global_step": 436992, "epoch": 5264} {"train_loss": -27.3153133392334, "global_step": 436993, "epoch": 5264} {"train_loss": -26.868384510637767, "global_step": 436994, "epoch": 5264, "val_loss": 6642987.5} {"train_loss": -26.7150936126709, "global_step": 436995, "epoch": 5265} {"train_loss": -26.484756469726562, "global_step": 436996, "epoch": 5265} {"train_loss": -26.630084991455078, "global_step": 436997, "epoch": 5265} {"train_loss": -26.234649658203125, "global_step": 436998, "epoch": 5265} {"train_loss": -26.11747169494629, "global_step": 436999, "epoch": 5265} {"train_loss": -26.169788360595703, "global_step": 437000, "epoch": 5265} {"train_loss": -26.6007022857666, "global_step": 437001, "epoch": 5265} {"train_loss": -26.56568717956543, "global_step": 437002, "epoch": 5265} {"train_loss": -26.694372177124023, "global_step": 437003, "epoch": 5265} {"train_loss": -26.61237907409668, "global_step": 437004, "epoch": 5265} {"train_loss": -26.65504264831543, "global_step": 437005, "epoch": 5265} {"train_loss": -26.499418258666992, "global_step": 437006, "epoch": 5265} {"train_loss": -26.401111602783203, "global_step": 437007, "epoch": 5265} {"train_loss": -26.666385650634766, "global_step": 437008, "epoch": 5265} {"train_loss": -26.192829132080078, "global_step": 437009, "epoch": 5265} {"train_loss": -26.382617950439453, "global_step": 437010, "epoch": 5265} {"train_loss": -26.246627807617188, "global_step": 437011, "epoch": 5265} {"train_loss": -26.6202449798584, "global_step": 437012, "epoch": 5265} {"train_loss": -26.386306762695312, "global_step": 437013, "epoch": 5265} {"train_loss": -26.785734176635742, "global_step": 437014, "epoch": 5265} {"train_loss": -26.569183349609375, "global_step": 437015, "epoch": 5265} {"train_loss": -26.540699005126953, "global_step": 437016, "epoch": 5265} {"train_loss": -26.11394691467285, "global_step": 437017, "epoch": 5265} {"train_loss": -26.492401123046875, "global_step": 437018, "epoch": 5265} {"train_loss": -26.847692489624023, "global_step": 437019, "epoch": 5265} {"train_loss": -26.519561767578125, "global_step": 437020, "epoch": 5265} {"train_loss": -26.69965171813965, "global_step": 437021, "epoch": 5265} {"train_loss": -26.716501235961914, "global_step": 437022, "epoch": 5265} {"train_loss": -26.6002197265625, "global_step": 437023, "epoch": 5265} {"train_loss": -26.169921875, "global_step": 437024, "epoch": 5265} {"train_loss": -26.85377311706543, "global_step": 437025, "epoch": 5265} {"train_loss": -26.500885009765625, "global_step": 437026, "epoch": 5265} {"train_loss": -26.717742919921875, "global_step": 437027, "epoch": 5265} {"train_loss": -26.714445114135742, "global_step": 437028, "epoch": 5265} {"train_loss": -26.98526954650879, "global_step": 437029, "epoch": 5265} {"train_loss": -26.8880615234375, "global_step": 437030, "epoch": 5265} {"train_loss": -27.089746475219727, "global_step": 437031, "epoch": 5265} {"train_loss": -26.87491226196289, "global_step": 437032, "epoch": 5265} {"train_loss": -26.7592716217041, "global_step": 437033, "epoch": 5265} {"train_loss": -26.662139892578125, "global_step": 437034, "epoch": 5265} {"train_loss": -26.758045196533203, "global_step": 437035, "epoch": 5265} {"train_loss": -26.852670669555664, "global_step": 437036, "epoch": 5265} {"train_loss": -27.212961196899414, "global_step": 437037, "epoch": 5265} {"train_loss": -27.076330184936523, "global_step": 437038, "epoch": 5265} {"train_loss": -26.948633193969727, "global_step": 437039, "epoch": 5265} {"train_loss": -26.958810806274414, "global_step": 437040, "epoch": 5265} {"train_loss": -27.30824089050293, "global_step": 437041, "epoch": 5265} {"train_loss": -26.9915828704834, "global_step": 437042, "epoch": 5265} {"train_loss": -26.931264877319336, "global_step": 437043, "epoch": 5265} {"train_loss": -27.245838165283203, "global_step": 437044, "epoch": 5265} {"train_loss": -27.130847930908203, "global_step": 437045, "epoch": 5265} {"train_loss": -27.401777267456055, "global_step": 437046, "epoch": 5265} {"train_loss": -27.054401397705078, "global_step": 437047, "epoch": 5265} {"train_loss": -27.136463165283203, "global_step": 437048, "epoch": 5265} {"train_loss": -26.76643180847168, "global_step": 437049, "epoch": 5265} {"train_loss": -27.106124877929688, "global_step": 437050, "epoch": 5265} {"train_loss": -27.021528244018555, "global_step": 437051, "epoch": 5265} {"train_loss": -26.99567222595215, "global_step": 437052, "epoch": 5265} {"train_loss": -26.766332626342773, "global_step": 437053, "epoch": 5265} {"train_loss": -26.982666015625, "global_step": 437054, "epoch": 5265} {"train_loss": -27.2366886138916, "global_step": 437055, "epoch": 5265} {"train_loss": -27.179105758666992, "global_step": 437056, "epoch": 5265} {"train_loss": -27.28639793395996, "global_step": 437057, "epoch": 5265} {"train_loss": -27.389562606811523, "global_step": 437058, "epoch": 5265} {"train_loss": -27.04070472717285, "global_step": 437059, "epoch": 5265} {"train_loss": -27.2591495513916, "global_step": 437060, "epoch": 5265} {"train_loss": -27.054044723510742, "global_step": 437061, "epoch": 5265} {"train_loss": -26.764495849609375, "global_step": 437062, "epoch": 5265} {"train_loss": -27.239049911499023, "global_step": 437063, "epoch": 5265} {"train_loss": -27.471237182617188, "global_step": 437064, "epoch": 5265} {"train_loss": -26.911176681518555, "global_step": 437065, "epoch": 5265} {"train_loss": -26.52734375, "global_step": 437066, "epoch": 5265} {"train_loss": -26.535364151000977, "global_step": 437067, "epoch": 5265} {"train_loss": -26.458417892456055, "global_step": 437068, "epoch": 5265} {"train_loss": -26.99186134338379, "global_step": 437069, "epoch": 5265} {"train_loss": -26.78187370300293, "global_step": 437070, "epoch": 5265} {"train_loss": -26.43601417541504, "global_step": 437071, "epoch": 5265} {"train_loss": -26.34174156188965, "global_step": 437072, "epoch": 5265} {"train_loss": -26.746337890625, "global_step": 437073, "epoch": 5265} {"train_loss": -26.963287353515625, "global_step": 437074, "epoch": 5265} {"train_loss": -26.594175338745117, "global_step": 437075, "epoch": 5265} {"train_loss": -26.539203643798828, "global_step": 437076, "epoch": 5265} {"train_loss": -26.762000692896095, "global_step": 437077, "epoch": 5265, "val_loss": 6708283.0} {"train_loss": -26.26495933532715, "global_step": 437078, "epoch": 5266} {"train_loss": -26.167654037475586, "global_step": 437079, "epoch": 5266} {"train_loss": -26.372577667236328, "global_step": 437080, "epoch": 5266} {"train_loss": -26.571630477905273, "global_step": 437081, "epoch": 5266} {"train_loss": -26.587064743041992, "global_step": 437082, "epoch": 5266} {"train_loss": -26.56110191345215, "global_step": 437083, "epoch": 5266} {"train_loss": -26.307178497314453, "global_step": 437084, "epoch": 5266} {"train_loss": -26.625293731689453, "global_step": 437085, "epoch": 5266} {"train_loss": -26.547109603881836, "global_step": 437086, "epoch": 5266} {"train_loss": -26.73090171813965, "global_step": 437087, "epoch": 5266} {"train_loss": -26.42592430114746, "global_step": 437088, "epoch": 5266} {"train_loss": -26.371341705322266, "global_step": 437089, "epoch": 5266} {"train_loss": -26.710525512695312, "global_step": 437090, "epoch": 5266} {"train_loss": -26.577238082885742, "global_step": 437091, "epoch": 5266} {"train_loss": -26.55059814453125, "global_step": 437092, "epoch": 5266} {"train_loss": -27.081281661987305, "global_step": 437093, "epoch": 5266} {"train_loss": -26.627105712890625, "global_step": 437094, "epoch": 5266} {"train_loss": -26.10828971862793, "global_step": 437095, "epoch": 5266} {"train_loss": -26.879425048828125, "global_step": 437096, "epoch": 5266} {"train_loss": -26.39007568359375, "global_step": 437097, "epoch": 5266} {"train_loss": -26.992414474487305, "global_step": 437098, "epoch": 5266} {"train_loss": -26.59574317932129, "global_step": 437099, "epoch": 5266} {"train_loss": -26.90226173400879, "global_step": 437100, "epoch": 5266} {"train_loss": -26.524280548095703, "global_step": 437101, "epoch": 5266} {"train_loss": -26.574737548828125, "global_step": 437102, "epoch": 5266} {"train_loss": -27.0312442779541, "global_step": 437103, "epoch": 5266} {"train_loss": -27.17919921875, "global_step": 437104, "epoch": 5266} {"train_loss": -26.569904327392578, "global_step": 437105, "epoch": 5266} {"train_loss": -27.05038833618164, "global_step": 437106, "epoch": 5266} {"train_loss": -26.76934242248535, "global_step": 437107, "epoch": 5266} {"train_loss": -27.343530654907227, "global_step": 437108, "epoch": 5266} {"train_loss": -27.197803497314453, "global_step": 437109, "epoch": 5266} {"train_loss": -26.936126708984375, "global_step": 437110, "epoch": 5266} {"train_loss": -26.996906280517578, "global_step": 437111, "epoch": 5266} {"train_loss": -27.034326553344727, "global_step": 437112, "epoch": 5266} {"train_loss": -26.823606491088867, "global_step": 437113, "epoch": 5266} {"train_loss": -27.121673583984375, "global_step": 437114, "epoch": 5266} {"train_loss": -27.2979679107666, "global_step": 437115, "epoch": 5266} {"train_loss": -27.076831817626953, "global_step": 437116, "epoch": 5266} {"train_loss": -26.871809005737305, "global_step": 437117, "epoch": 5266} {"train_loss": -27.0881290435791, "global_step": 437118, "epoch": 5266} {"train_loss": -27.154865264892578, "global_step": 437119, "epoch": 5266} {"train_loss": -27.222166061401367, "global_step": 437120, "epoch": 5266} {"train_loss": -26.606170654296875, "global_step": 437121, "epoch": 5266} {"train_loss": -26.96671485900879, "global_step": 437122, "epoch": 5266} {"train_loss": -27.189184188842773, "global_step": 437123, "epoch": 5266} {"train_loss": -27.320301055908203, "global_step": 437124, "epoch": 5266} {"train_loss": -27.116779327392578, "global_step": 437125, "epoch": 5266} {"train_loss": -26.831466674804688, "global_step": 437126, "epoch": 5266} {"train_loss": -26.911834716796875, "global_step": 437127, "epoch": 5266} {"train_loss": -26.778350830078125, "global_step": 437128, "epoch": 5266} {"train_loss": -27.160858154296875, "global_step": 437129, "epoch": 5266} {"train_loss": -27.39548110961914, "global_step": 437130, "epoch": 5266} {"train_loss": -26.849241256713867, "global_step": 437131, "epoch": 5266} {"train_loss": -27.497106552124023, "global_step": 437132, "epoch": 5266} {"train_loss": -27.113941192626953, "global_step": 437133, "epoch": 5266} {"train_loss": -26.891653060913086, "global_step": 437134, "epoch": 5266} {"train_loss": -27.24024772644043, "global_step": 437135, "epoch": 5266} {"train_loss": -26.932043075561523, "global_step": 437136, "epoch": 5266} {"train_loss": -27.21673011779785, "global_step": 437137, "epoch": 5266} {"train_loss": -26.949249267578125, "global_step": 437138, "epoch": 5266} {"train_loss": -27.47711753845215, "global_step": 437139, "epoch": 5266} {"train_loss": -26.85248374938965, "global_step": 437140, "epoch": 5266} {"train_loss": -27.1543025970459, "global_step": 437141, "epoch": 5266} {"train_loss": -26.746850967407227, "global_step": 437142, "epoch": 5266} {"train_loss": -27.071014404296875, "global_step": 437143, "epoch": 5266} {"train_loss": -26.988935470581055, "global_step": 437144, "epoch": 5266} {"train_loss": -26.825971603393555, "global_step": 437145, "epoch": 5266} {"train_loss": -26.43311882019043, "global_step": 437146, "epoch": 5266} {"train_loss": -26.47169303894043, "global_step": 437147, "epoch": 5266} {"train_loss": -27.46856689453125, "global_step": 437148, "epoch": 5266} {"train_loss": -26.545385360717773, "global_step": 437149, "epoch": 5266} {"train_loss": -26.35930824279785, "global_step": 437150, "epoch": 5266} {"train_loss": -25.955841064453125, "global_step": 437151, "epoch": 5266} {"train_loss": -27.063709259033203, "global_step": 437152, "epoch": 5266} {"train_loss": -26.624353408813477, "global_step": 437153, "epoch": 5266} {"train_loss": -26.493927001953125, "global_step": 437154, "epoch": 5266} {"train_loss": -26.569171905517578, "global_step": 437155, "epoch": 5266} {"train_loss": -26.73899269104004, "global_step": 437156, "epoch": 5266} {"train_loss": -26.456212997436523, "global_step": 437157, "epoch": 5266} {"train_loss": -26.596454620361328, "global_step": 437158, "epoch": 5266} {"train_loss": -26.68425941467285, "global_step": 437159, "epoch": 5266} {"train_loss": -26.802355111363422, "global_step": 437160, "epoch": 5266, "val_loss": 6591032.5} {"train_loss": -24.109525680541992, "global_step": 437161, "epoch": 5267} {"train_loss": -25.088581085205078, "global_step": 437162, "epoch": 5267} {"train_loss": -25.9892578125, "global_step": 437163, "epoch": 5267} {"train_loss": -24.83064079284668, "global_step": 437164, "epoch": 5267} {"train_loss": -25.921247482299805, "global_step": 437165, "epoch": 5267} {"train_loss": -25.070953369140625, "global_step": 437166, "epoch": 5267} {"train_loss": -26.02162742614746, "global_step": 437167, "epoch": 5267} {"train_loss": -26.355310440063477, "global_step": 437168, "epoch": 5267} {"train_loss": -25.79535484313965, "global_step": 437169, "epoch": 5267} {"train_loss": -26.36910057067871, "global_step": 437170, "epoch": 5267} {"train_loss": -26.18316650390625, "global_step": 437171, "epoch": 5267} {"train_loss": -26.309850692749023, "global_step": 437172, "epoch": 5267} {"train_loss": -26.46367835998535, "global_step": 437173, "epoch": 5267} {"train_loss": -26.168750762939453, "global_step": 437174, "epoch": 5267} {"train_loss": -26.218048095703125, "global_step": 437175, "epoch": 5267} {"train_loss": -26.38326072692871, "global_step": 437176, "epoch": 5267} {"train_loss": -26.321441650390625, "global_step": 437177, "epoch": 5267} {"train_loss": -26.248498916625977, "global_step": 437178, "epoch": 5267} {"train_loss": -26.194849014282227, "global_step": 437179, "epoch": 5267} {"train_loss": -26.4267520904541, "global_step": 437180, "epoch": 5267} {"train_loss": -26.364500045776367, "global_step": 437181, "epoch": 5267} {"train_loss": -26.600988388061523, "global_step": 437182, "epoch": 5267} {"train_loss": -26.568225860595703, "global_step": 437183, "epoch": 5267} {"train_loss": -26.655029296875, "global_step": 437184, "epoch": 5267} {"train_loss": -26.68446159362793, "global_step": 437185, "epoch": 5267} {"train_loss": -26.77142906188965, "global_step": 437186, "epoch": 5267} {"train_loss": -26.93121910095215, "global_step": 437187, "epoch": 5267} {"train_loss": -26.837024688720703, "global_step": 437188, "epoch": 5267} {"train_loss": -26.763702392578125, "global_step": 437189, "epoch": 5267} {"train_loss": -26.758237838745117, "global_step": 437190, "epoch": 5267} {"train_loss": -26.7023868560791, "global_step": 437191, "epoch": 5267} {"train_loss": -26.486913681030273, "global_step": 437192, "epoch": 5267} {"train_loss": -26.243432998657227, "global_step": 437193, "epoch": 5267} {"train_loss": -26.519550323486328, "global_step": 437194, "epoch": 5267} {"train_loss": -26.512176513671875, "global_step": 437195, "epoch": 5267} {"train_loss": -26.818700790405273, "global_step": 437196, "epoch": 5267} {"train_loss": -26.519245147705078, "global_step": 437197, "epoch": 5267} {"train_loss": -26.891448974609375, "global_step": 437198, "epoch": 5267} {"train_loss": -26.526601791381836, "global_step": 437199, "epoch": 5267} {"train_loss": -27.231201171875, "global_step": 437200, "epoch": 5267} {"train_loss": -26.795446395874023, "global_step": 437201, "epoch": 5267} {"train_loss": -26.951841354370117, "global_step": 437202, "epoch": 5267} {"train_loss": -26.923786163330078, "global_step": 437203, "epoch": 5267} {"train_loss": -27.025115966796875, "global_step": 437204, "epoch": 5267} {"train_loss": -26.994770050048828, "global_step": 437205, "epoch": 5267} {"train_loss": -27.03957176208496, "global_step": 437206, "epoch": 5267} {"train_loss": -26.923070907592773, "global_step": 437207, "epoch": 5267} {"train_loss": -27.047449111938477, "global_step": 437208, "epoch": 5267} {"train_loss": -27.02497673034668, "global_step": 437209, "epoch": 5267} {"train_loss": -27.139204025268555, "global_step": 437210, "epoch": 5267} {"train_loss": -27.07822608947754, "global_step": 437211, "epoch": 5267} {"train_loss": -26.895444869995117, "global_step": 437212, "epoch": 5267} {"train_loss": -27.042646408081055, "global_step": 437213, "epoch": 5267} {"train_loss": -26.57770347595215, "global_step": 437214, "epoch": 5267} {"train_loss": -26.89056968688965, "global_step": 437215, "epoch": 5267} {"train_loss": -26.7221736907959, "global_step": 437216, "epoch": 5267} {"train_loss": -27.149404525756836, "global_step": 437217, "epoch": 5267} {"train_loss": -26.94898796081543, "global_step": 437218, "epoch": 5267} {"train_loss": -26.96484375, "global_step": 437219, "epoch": 5267} {"train_loss": -26.976245880126953, "global_step": 437220, "epoch": 5267} {"train_loss": -26.90150260925293, "global_step": 437221, "epoch": 5267} {"train_loss": -26.971017837524414, "global_step": 437222, "epoch": 5267} {"train_loss": -26.782917022705078, "global_step": 437223, "epoch": 5267} {"train_loss": -27.11773681640625, "global_step": 437224, "epoch": 5267} {"train_loss": -26.891401290893555, "global_step": 437225, "epoch": 5267} {"train_loss": -27.037443161010742, "global_step": 437226, "epoch": 5267} {"train_loss": -26.884252548217773, "global_step": 437227, "epoch": 5267} {"train_loss": -27.117406845092773, "global_step": 437228, "epoch": 5267} {"train_loss": -26.82847023010254, "global_step": 437229, "epoch": 5267} {"train_loss": -27.38343620300293, "global_step": 437230, "epoch": 5267} {"train_loss": -27.168888092041016, "global_step": 437231, "epoch": 5267} {"train_loss": -26.75726318359375, "global_step": 437232, "epoch": 5267} {"train_loss": -26.640207290649414, "global_step": 437233, "epoch": 5267} {"train_loss": -26.81818199157715, "global_step": 437234, "epoch": 5267} {"train_loss": -27.116546630859375, "global_step": 437235, "epoch": 5267} {"train_loss": -26.852100372314453, "global_step": 437236, "epoch": 5267} {"train_loss": -27.083892822265625, "global_step": 437237, "epoch": 5267} {"train_loss": -27.138803482055664, "global_step": 437238, "epoch": 5267} {"train_loss": -27.276691436767578, "global_step": 437239, "epoch": 5267} {"train_loss": -26.585803985595703, "global_step": 437240, "epoch": 5267} {"train_loss": -27.170751571655273, "global_step": 437241, "epoch": 5267} {"train_loss": -27.094879150390625, "global_step": 437242, "epoch": 5267} {"train_loss": -26.642019662512354, "global_step": 437243, "epoch": 5267, "val_loss": 6768258.0} {"train_loss": -27.071130752563477, "global_step": 437244, "epoch": 5268} {"train_loss": -26.393171310424805, "global_step": 437245, "epoch": 5268} {"train_loss": -26.036279678344727, "global_step": 437246, "epoch": 5268} {"train_loss": -26.3449764251709, "global_step": 437247, "epoch": 5268} {"train_loss": -26.52790641784668, "global_step": 437248, "epoch": 5268} {"train_loss": -26.287561416625977, "global_step": 437249, "epoch": 5268} {"train_loss": -26.553754806518555, "global_step": 437250, "epoch": 5268} {"train_loss": -26.97464370727539, "global_step": 437251, "epoch": 5268} {"train_loss": -26.001514434814453, "global_step": 437252, "epoch": 5268} {"train_loss": -26.42144775390625, "global_step": 437253, "epoch": 5268} {"train_loss": -26.64947509765625, "global_step": 437254, "epoch": 5268} {"train_loss": -26.703840255737305, "global_step": 437255, "epoch": 5268} {"train_loss": -26.422210693359375, "global_step": 437256, "epoch": 5268} {"train_loss": -26.622053146362305, "global_step": 437257, "epoch": 5268} {"train_loss": -26.548303604125977, "global_step": 437258, "epoch": 5268} {"train_loss": -26.82466697692871, "global_step": 437259, "epoch": 5268} {"train_loss": -26.470701217651367, "global_step": 437260, "epoch": 5268} {"train_loss": -26.756399154663086, "global_step": 437261, "epoch": 5268} {"train_loss": -26.89324378967285, "global_step": 437262, "epoch": 5268} {"train_loss": -26.775976181030273, "global_step": 437263, "epoch": 5268} {"train_loss": -26.806848526000977, "global_step": 437264, "epoch": 5268} {"train_loss": -26.724531173706055, "global_step": 437265, "epoch": 5268} {"train_loss": -26.556018829345703, "global_step": 437266, "epoch": 5268} {"train_loss": -26.63246726989746, "global_step": 437267, "epoch": 5268} {"train_loss": -26.987964630126953, "global_step": 437268, "epoch": 5268} {"train_loss": -26.960397720336914, "global_step": 437269, "epoch": 5268} {"train_loss": -26.795862197875977, "global_step": 437270, "epoch": 5268} {"train_loss": -27.061689376831055, "global_step": 437271, "epoch": 5268} {"train_loss": -27.4360408782959, "global_step": 437272, "epoch": 5268} {"train_loss": -26.734296798706055, "global_step": 437273, "epoch": 5268} {"train_loss": -26.93768882751465, "global_step": 437274, "epoch": 5268} {"train_loss": -27.124958038330078, "global_step": 437275, "epoch": 5268} {"train_loss": -27.077682495117188, "global_step": 437276, "epoch": 5268} {"train_loss": -26.770599365234375, "global_step": 437277, "epoch": 5268} {"train_loss": -27.035236358642578, "global_step": 437278, "epoch": 5268} {"train_loss": -27.0816593170166, "global_step": 437279, "epoch": 5268} {"train_loss": -27.014856338500977, "global_step": 437280, "epoch": 5268} {"train_loss": -27.5728816986084, "global_step": 437281, "epoch": 5268} {"train_loss": -26.776357650756836, "global_step": 437282, "epoch": 5268} {"train_loss": -27.185230255126953, "global_step": 437283, "epoch": 5268} {"train_loss": -27.323246002197266, "global_step": 437284, "epoch": 5268} {"train_loss": -27.03557777404785, "global_step": 437285, "epoch": 5268} {"train_loss": -27.33955955505371, "global_step": 437286, "epoch": 5268} {"train_loss": -26.73200798034668, "global_step": 437287, "epoch": 5268} {"train_loss": -26.064977645874023, "global_step": 437288, "epoch": 5268} {"train_loss": -26.576934814453125, "global_step": 437289, "epoch": 5268} {"train_loss": -26.573328018188477, "global_step": 437290, "epoch": 5268} {"train_loss": -26.770477294921875, "global_step": 437291, "epoch": 5268} {"train_loss": -26.713043212890625, "global_step": 437292, "epoch": 5268} {"train_loss": -26.1267032623291, "global_step": 437293, "epoch": 5268} {"train_loss": -26.214786529541016, "global_step": 437294, "epoch": 5268} {"train_loss": -25.94341468811035, "global_step": 437295, "epoch": 5268} {"train_loss": -26.594196319580078, "global_step": 437296, "epoch": 5268} {"train_loss": -26.35638427734375, "global_step": 437297, "epoch": 5268} {"train_loss": -26.97285270690918, "global_step": 437298, "epoch": 5268} {"train_loss": -26.710723876953125, "global_step": 437299, "epoch": 5268} {"train_loss": -26.814599990844727, "global_step": 437300, "epoch": 5268} {"train_loss": -26.78839683532715, "global_step": 437301, "epoch": 5268} {"train_loss": -26.855758666992188, "global_step": 437302, "epoch": 5268} {"train_loss": -27.1202449798584, "global_step": 437303, "epoch": 5268} {"train_loss": -27.18269157409668, "global_step": 437304, "epoch": 5268} {"train_loss": -27.028051376342773, "global_step": 437305, "epoch": 5268} {"train_loss": -27.061010360717773, "global_step": 437306, "epoch": 5268} {"train_loss": -26.5987491607666, "global_step": 437307, "epoch": 5268} {"train_loss": -26.925540924072266, "global_step": 437308, "epoch": 5268} {"train_loss": -26.455642700195312, "global_step": 437309, "epoch": 5268} {"train_loss": -27.170883178710938, "global_step": 437310, "epoch": 5268} {"train_loss": -26.773426055908203, "global_step": 437311, "epoch": 5268} {"train_loss": -27.078296661376953, "global_step": 437312, "epoch": 5268} {"train_loss": -27.012052536010742, "global_step": 437313, "epoch": 5268} {"train_loss": -27.075336456298828, "global_step": 437314, "epoch": 5268} {"train_loss": -26.784423828125, "global_step": 437315, "epoch": 5268} {"train_loss": -27.36819839477539, "global_step": 437316, "epoch": 5268} {"train_loss": -26.776798248291016, "global_step": 437317, "epoch": 5268} {"train_loss": -26.939664840698242, "global_step": 437318, "epoch": 5268} {"train_loss": -26.952713012695312, "global_step": 437319, "epoch": 5268} {"train_loss": -27.384414672851562, "global_step": 437320, "epoch": 5268} {"train_loss": -27.14832878112793, "global_step": 437321, "epoch": 5268} {"train_loss": -26.47906494140625, "global_step": 437322, "epoch": 5268} {"train_loss": -27.180570602416992, "global_step": 437323, "epoch": 5268} {"train_loss": -26.9829044342041, "global_step": 437324, "epoch": 5268} {"train_loss": -27.346515655517578, "global_step": 437325, "epoch": 5268} {"train_loss": -26.803088728203832, "global_step": 437326, "epoch": 5268, "val_loss": 6634454.0} {"train_loss": -26.669300079345703, "global_step": 437327, "epoch": 5269} {"train_loss": -26.723163604736328, "global_step": 437328, "epoch": 5269} {"train_loss": -26.79620361328125, "global_step": 437329, "epoch": 5269} {"train_loss": -26.843891143798828, "global_step": 437330, "epoch": 5269} {"train_loss": -26.695087432861328, "global_step": 437331, "epoch": 5269} {"train_loss": -26.70222282409668, "global_step": 437332, "epoch": 5269} {"train_loss": -26.943017959594727, "global_step": 437333, "epoch": 5269} {"train_loss": -26.743749618530273, "global_step": 437334, "epoch": 5269} {"train_loss": -26.643152236938477, "global_step": 437335, "epoch": 5269} {"train_loss": -26.955976486206055, "global_step": 437336, "epoch": 5269} {"train_loss": -26.68645668029785, "global_step": 437337, "epoch": 5269} {"train_loss": -26.698522567749023, "global_step": 437338, "epoch": 5269} {"train_loss": -26.66680335998535, "global_step": 437339, "epoch": 5269} {"train_loss": -26.589466094970703, "global_step": 437340, "epoch": 5269} {"train_loss": -26.49831199645996, "global_step": 437341, "epoch": 5269} {"train_loss": -27.208845138549805, "global_step": 437342, "epoch": 5269} {"train_loss": -26.924341201782227, "global_step": 437343, "epoch": 5269} {"train_loss": -26.928434371948242, "global_step": 437344, "epoch": 5269} {"train_loss": -26.996442794799805, "global_step": 437345, "epoch": 5269} {"train_loss": -26.68161392211914, "global_step": 437346, "epoch": 5269} {"train_loss": -27.15205192565918, "global_step": 437347, "epoch": 5269} {"train_loss": -26.747024536132812, "global_step": 437348, "epoch": 5269} {"train_loss": -26.536483764648438, "global_step": 437349, "epoch": 5269} {"train_loss": -26.76702880859375, "global_step": 437350, "epoch": 5269} {"train_loss": -26.56622314453125, "global_step": 437351, "epoch": 5269} {"train_loss": -26.654678344726562, "global_step": 437352, "epoch": 5269} {"train_loss": -26.81785011291504, "global_step": 437353, "epoch": 5269} {"train_loss": -27.107135772705078, "global_step": 437354, "epoch": 5269} {"train_loss": -26.9057559967041, "global_step": 437355, "epoch": 5269} {"train_loss": -26.83228874206543, "global_step": 437356, "epoch": 5269} {"train_loss": -26.817670822143555, "global_step": 437357, "epoch": 5269} {"train_loss": -27.08249282836914, "global_step": 437358, "epoch": 5269} {"train_loss": -27.0507869720459, "global_step": 437359, "epoch": 5269} {"train_loss": -26.948171615600586, "global_step": 437360, "epoch": 5269} {"train_loss": -27.109024047851562, "global_step": 437361, "epoch": 5269} {"train_loss": -26.88568687438965, "global_step": 437362, "epoch": 5269} {"train_loss": -27.048669815063477, "global_step": 437363, "epoch": 5269} {"train_loss": -26.819503784179688, "global_step": 437364, "epoch": 5269} {"train_loss": -26.92560386657715, "global_step": 437365, "epoch": 5269} {"train_loss": -27.003705978393555, "global_step": 437366, "epoch": 5269} {"train_loss": -27.360498428344727, "global_step": 437367, "epoch": 5269} {"train_loss": -26.9639835357666, "global_step": 437368, "epoch": 5269} {"train_loss": -27.153100967407227, "global_step": 437369, "epoch": 5269} {"train_loss": -27.151647567749023, "global_step": 437370, "epoch": 5269} {"train_loss": -27.0634822845459, "global_step": 437371, "epoch": 5269} {"train_loss": -27.1739559173584, "global_step": 437372, "epoch": 5269} {"train_loss": -27.015628814697266, "global_step": 437373, "epoch": 5269} {"train_loss": -27.339529037475586, "global_step": 437374, "epoch": 5269} {"train_loss": -26.935033798217773, "global_step": 437375, "epoch": 5269} {"train_loss": -27.42811393737793, "global_step": 437376, "epoch": 5269} {"train_loss": -26.935529708862305, "global_step": 437377, "epoch": 5269} {"train_loss": -27.18355369567871, "global_step": 437378, "epoch": 5269} {"train_loss": -27.000009536743164, "global_step": 437379, "epoch": 5269} {"train_loss": -27.373676300048828, "global_step": 437380, "epoch": 5269} {"train_loss": -26.8612003326416, "global_step": 437381, "epoch": 5269} {"train_loss": -26.910261154174805, "global_step": 437382, "epoch": 5269} {"train_loss": -27.234939575195312, "global_step": 437383, "epoch": 5269} {"train_loss": -26.797565460205078, "global_step": 437384, "epoch": 5269} {"train_loss": -26.754423141479492, "global_step": 437385, "epoch": 5269} {"train_loss": -27.118452072143555, "global_step": 437386, "epoch": 5269} {"train_loss": -26.922504425048828, "global_step": 437387, "epoch": 5269} {"train_loss": -26.48862075805664, "global_step": 437388, "epoch": 5269} {"train_loss": -26.748199462890625, "global_step": 437389, "epoch": 5269} {"train_loss": -27.053442001342773, "global_step": 437390, "epoch": 5269} {"train_loss": -26.71646499633789, "global_step": 437391, "epoch": 5269} {"train_loss": -27.230321884155273, "global_step": 437392, "epoch": 5269} {"train_loss": -26.4427433013916, "global_step": 437393, "epoch": 5269} {"train_loss": -26.41420555114746, "global_step": 437394, "epoch": 5269} {"train_loss": -27.156259536743164, "global_step": 437395, "epoch": 5269} {"train_loss": -26.26593589782715, "global_step": 437396, "epoch": 5269} {"train_loss": -26.74134635925293, "global_step": 437397, "epoch": 5269} {"train_loss": -26.79829216003418, "global_step": 437398, "epoch": 5269} {"train_loss": -26.421966552734375, "global_step": 437399, "epoch": 5269} {"train_loss": -26.745819091796875, "global_step": 437400, "epoch": 5269} {"train_loss": -26.55325698852539, "global_step": 437401, "epoch": 5269} {"train_loss": -26.551151275634766, "global_step": 437402, "epoch": 5269} {"train_loss": -26.479248046875, "global_step": 437403, "epoch": 5269} {"train_loss": -26.94595718383789, "global_step": 437404, "epoch": 5269} {"train_loss": -26.73695945739746, "global_step": 437405, "epoch": 5269} {"train_loss": -26.989660263061523, "global_step": 437406, "epoch": 5269} {"train_loss": -26.19913101196289, "global_step": 437407, "epoch": 5269} {"train_loss": -26.7791690826416, "global_step": 437408, "epoch": 5269} {"train_loss": -26.83887895331325, "global_step": 437409, "epoch": 5269, "val_loss": 6660791.0} {"train_loss": -25.333099365234375, "global_step": 437410, "epoch": 5270} {"train_loss": -26.132776260375977, "global_step": 437411, "epoch": 5270} {"train_loss": -26.230854034423828, "global_step": 437412, "epoch": 5270} {"train_loss": -25.979740142822266, "global_step": 437413, "epoch": 5270} {"train_loss": -26.286834716796875, "global_step": 437414, "epoch": 5270} {"train_loss": -26.254369735717773, "global_step": 437415, "epoch": 5270} {"train_loss": -26.5147647857666, "global_step": 437416, "epoch": 5270} {"train_loss": -26.81580924987793, "global_step": 437417, "epoch": 5270} {"train_loss": -26.453571319580078, "global_step": 437418, "epoch": 5270} {"train_loss": -26.016408920288086, "global_step": 437419, "epoch": 5270} {"train_loss": -26.702590942382812, "global_step": 437420, "epoch": 5270} {"train_loss": -26.24204444885254, "global_step": 437421, "epoch": 5270} {"train_loss": -26.26658058166504, "global_step": 437422, "epoch": 5270} {"train_loss": -26.51423454284668, "global_step": 437423, "epoch": 5270} {"train_loss": -26.666641235351562, "global_step": 437424, "epoch": 5270} {"train_loss": -26.50397300720215, "global_step": 437425, "epoch": 5270} {"train_loss": -26.347137451171875, "global_step": 437426, "epoch": 5270} {"train_loss": -26.663015365600586, "global_step": 437427, "epoch": 5270} {"train_loss": -26.494455337524414, "global_step": 437428, "epoch": 5270} {"train_loss": -26.82928466796875, "global_step": 437429, "epoch": 5270} {"train_loss": -26.4445858001709, "global_step": 437430, "epoch": 5270} {"train_loss": -26.866474151611328, "global_step": 437431, "epoch": 5270} {"train_loss": -26.556196212768555, "global_step": 437432, "epoch": 5270} {"train_loss": -26.637800216674805, "global_step": 437433, "epoch": 5270} {"train_loss": -26.647871017456055, "global_step": 437434, "epoch": 5270} {"train_loss": -26.70342445373535, "global_step": 437435, "epoch": 5270} {"train_loss": -26.829553604125977, "global_step": 437436, "epoch": 5270} {"train_loss": -26.74955177307129, "global_step": 437437, "epoch": 5270} {"train_loss": -27.125497817993164, "global_step": 437438, "epoch": 5270} {"train_loss": -27.055082321166992, "global_step": 437439, "epoch": 5270} {"train_loss": -26.841415405273438, "global_step": 437440, "epoch": 5270} {"train_loss": -26.763105392456055, "global_step": 437441, "epoch": 5270} {"train_loss": -26.721572875976562, "global_step": 437442, "epoch": 5270} {"train_loss": -27.000690460205078, "global_step": 437443, "epoch": 5270} {"train_loss": -27.19671058654785, "global_step": 437444, "epoch": 5270} {"train_loss": -26.72334861755371, "global_step": 437445, "epoch": 5270} {"train_loss": -26.882217407226562, "global_step": 437446, "epoch": 5270} {"train_loss": -27.399580001831055, "global_step": 437447, "epoch": 5270} {"train_loss": -27.15170669555664, "global_step": 437448, "epoch": 5270} {"train_loss": -26.854251861572266, "global_step": 437449, "epoch": 5270} {"train_loss": -26.94793128967285, "global_step": 437450, "epoch": 5270} {"train_loss": -27.05055809020996, "global_step": 437451, "epoch": 5270} {"train_loss": -27.29180335998535, "global_step": 437452, "epoch": 5270} {"train_loss": -27.081302642822266, "global_step": 437453, "epoch": 5270} {"train_loss": -26.6591854095459, "global_step": 437454, "epoch": 5270} {"train_loss": -27.27703857421875, "global_step": 437455, "epoch": 5270} {"train_loss": -27.06880760192871, "global_step": 437456, "epoch": 5270} {"train_loss": -26.874059677124023, "global_step": 437457, "epoch": 5270} {"train_loss": -26.887710571289062, "global_step": 437458, "epoch": 5270} {"train_loss": -27.137052536010742, "global_step": 437459, "epoch": 5270} {"train_loss": -26.920185089111328, "global_step": 437460, "epoch": 5270} {"train_loss": -26.95271110534668, "global_step": 437461, "epoch": 5270} {"train_loss": -27.3200740814209, "global_step": 437462, "epoch": 5270} {"train_loss": -27.010578155517578, "global_step": 437463, "epoch": 5270} {"train_loss": -27.133752822875977, "global_step": 437464, "epoch": 5270} {"train_loss": -27.237613677978516, "global_step": 437465, "epoch": 5270} {"train_loss": -26.902790069580078, "global_step": 437466, "epoch": 5270} {"train_loss": -27.014814376831055, "global_step": 437467, "epoch": 5270} {"train_loss": -27.217748641967773, "global_step": 437468, "epoch": 5270} {"train_loss": -26.944482803344727, "global_step": 437469, "epoch": 5270} {"train_loss": -27.12885093688965, "global_step": 437470, "epoch": 5270} {"train_loss": -27.290002822875977, "global_step": 437471, "epoch": 5270} {"train_loss": -26.937824249267578, "global_step": 437472, "epoch": 5270} {"train_loss": -27.025562286376953, "global_step": 437473, "epoch": 5270} {"train_loss": -27.221933364868164, "global_step": 437474, "epoch": 5270} {"train_loss": -27.29425048828125, "global_step": 437475, "epoch": 5270} {"train_loss": -27.007644653320312, "global_step": 437476, "epoch": 5270} {"train_loss": -27.055328369140625, "global_step": 437477, "epoch": 5270} {"train_loss": -26.639179229736328, "global_step": 437478, "epoch": 5270} {"train_loss": -27.06632423400879, "global_step": 437479, "epoch": 5270} {"train_loss": -26.85861587524414, "global_step": 437480, "epoch": 5270} {"train_loss": -26.762741088867188, "global_step": 437481, "epoch": 5270} {"train_loss": -25.824201583862305, "global_step": 437482, "epoch": 5270} {"train_loss": -24.372940063476562, "global_step": 437483, "epoch": 5270} {"train_loss": -25.924896240234375, "global_step": 437484, "epoch": 5270} {"train_loss": -26.62588882446289, "global_step": 437485, "epoch": 5270} {"train_loss": -26.350666046142578, "global_step": 437486, "epoch": 5270} {"train_loss": -26.86099624633789, "global_step": 437487, "epoch": 5270} {"train_loss": -25.869476318359375, "global_step": 437488, "epoch": 5270} {"train_loss": -26.443023681640625, "global_step": 437489, "epoch": 5270} {"train_loss": -26.54749870300293, "global_step": 437490, "epoch": 5270} {"train_loss": -26.697647094726562, "global_step": 437491, "epoch": 5270} {"train_loss": -26.719912747302686, "global_step": 437492, "epoch": 5270, "val_loss": 6627454.0} {"train_loss": -24.06207847595215, "global_step": 437493, "epoch": 5271} {"train_loss": -26.147180557250977, "global_step": 437494, "epoch": 5271} {"train_loss": -24.976383209228516, "global_step": 437495, "epoch": 5271} {"train_loss": -26.001916885375977, "global_step": 437496, "epoch": 5271} {"train_loss": -25.369112014770508, "global_step": 437497, "epoch": 5271} {"train_loss": -25.81190299987793, "global_step": 437498, "epoch": 5271} {"train_loss": -25.389480590820312, "global_step": 437499, "epoch": 5271} {"train_loss": -25.408241271972656, "global_step": 437500, "epoch": 5271} {"train_loss": -26.123870849609375, "global_step": 437501, "epoch": 5271} {"train_loss": -25.84262466430664, "global_step": 437502, "epoch": 5271} {"train_loss": -26.308195114135742, "global_step": 437503, "epoch": 5271} {"train_loss": -26.00026512145996, "global_step": 437504, "epoch": 5271} {"train_loss": -26.07196044921875, "global_step": 437505, "epoch": 5271} {"train_loss": -26.102035522460938, "global_step": 437506, "epoch": 5271} {"train_loss": -26.164880752563477, "global_step": 437507, "epoch": 5271} {"train_loss": -26.184030532836914, "global_step": 437508, "epoch": 5271} {"train_loss": -26.386274337768555, "global_step": 437509, "epoch": 5271} {"train_loss": -25.943403244018555, "global_step": 437510, "epoch": 5271} {"train_loss": -26.071691513061523, "global_step": 437511, "epoch": 5271} {"train_loss": -26.855426788330078, "global_step": 437512, "epoch": 5271} {"train_loss": -26.645349502563477, "global_step": 437513, "epoch": 5271} {"train_loss": -26.20148277282715, "global_step": 437514, "epoch": 5271} {"train_loss": -26.43751335144043, "global_step": 437515, "epoch": 5271} {"train_loss": -26.52008056640625, "global_step": 437516, "epoch": 5271} {"train_loss": -26.287839889526367, "global_step": 437517, "epoch": 5271} {"train_loss": -26.73988151550293, "global_step": 437518, "epoch": 5271} {"train_loss": -26.424896240234375, "global_step": 437519, "epoch": 5271} {"train_loss": -26.71221923828125, "global_step": 437520, "epoch": 5271} {"train_loss": -26.43025779724121, "global_step": 437521, "epoch": 5271} {"train_loss": -26.718656539916992, "global_step": 437522, "epoch": 5271} {"train_loss": -26.64301109313965, "global_step": 437523, "epoch": 5271} {"train_loss": -26.405820846557617, "global_step": 437524, "epoch": 5271} {"train_loss": -26.442739486694336, "global_step": 437525, "epoch": 5271} {"train_loss": -27.0749568939209, "global_step": 437526, "epoch": 5271} {"train_loss": -26.609601974487305, "global_step": 437527, "epoch": 5271} {"train_loss": -26.70106315612793, "global_step": 437528, "epoch": 5271} {"train_loss": -26.708276748657227, "global_step": 437529, "epoch": 5271} {"train_loss": -27.225244522094727, "global_step": 437530, "epoch": 5271} {"train_loss": -26.855213165283203, "global_step": 437531, "epoch": 5271} {"train_loss": -26.67011070251465, "global_step": 437532, "epoch": 5271} {"train_loss": -26.8846492767334, "global_step": 437533, "epoch": 5271} {"train_loss": -26.80091667175293, "global_step": 437534, "epoch": 5271} {"train_loss": -26.787023544311523, "global_step": 437535, "epoch": 5271} {"train_loss": -26.734954833984375, "global_step": 437536, "epoch": 5271} {"train_loss": -26.928735733032227, "global_step": 437537, "epoch": 5271} {"train_loss": -26.808761596679688, "global_step": 437538, "epoch": 5271} {"train_loss": -27.238126754760742, "global_step": 437539, "epoch": 5271} {"train_loss": -27.012069702148438, "global_step": 437540, "epoch": 5271} {"train_loss": -26.987783432006836, "global_step": 437541, "epoch": 5271} {"train_loss": -27.020721435546875, "global_step": 437542, "epoch": 5271} {"train_loss": -27.0112361907959, "global_step": 437543, "epoch": 5271} {"train_loss": -26.984027862548828, "global_step": 437544, "epoch": 5271} {"train_loss": -27.114059448242188, "global_step": 437545, "epoch": 5271} {"train_loss": -27.32358741760254, "global_step": 437546, "epoch": 5271} {"train_loss": -27.035282135009766, "global_step": 437547, "epoch": 5271} {"train_loss": -27.19314956665039, "global_step": 437548, "epoch": 5271} {"train_loss": -27.34723472595215, "global_step": 437549, "epoch": 5271} {"train_loss": -27.3884220123291, "global_step": 437550, "epoch": 5271} {"train_loss": -26.97088050842285, "global_step": 437551, "epoch": 5271} {"train_loss": -26.99354362487793, "global_step": 437552, "epoch": 5271} {"train_loss": -27.069091796875, "global_step": 437553, "epoch": 5271} {"train_loss": -26.99842643737793, "global_step": 437554, "epoch": 5271} {"train_loss": -26.676950454711914, "global_step": 437555, "epoch": 5271} {"train_loss": -26.867767333984375, "global_step": 437556, "epoch": 5271} {"train_loss": -26.636926651000977, "global_step": 437557, "epoch": 5271} {"train_loss": -27.079853057861328, "global_step": 437558, "epoch": 5271} {"train_loss": -26.78826904296875, "global_step": 437559, "epoch": 5271} {"train_loss": -26.787134170532227, "global_step": 437560, "epoch": 5271} {"train_loss": -27.03826332092285, "global_step": 437561, "epoch": 5271} {"train_loss": -26.801483154296875, "global_step": 437562, "epoch": 5271} {"train_loss": -26.468799591064453, "global_step": 437563, "epoch": 5271} {"train_loss": -26.709821701049805, "global_step": 437564, "epoch": 5271} {"train_loss": -26.82010269165039, "global_step": 437565, "epoch": 5271} {"train_loss": -26.983123779296875, "global_step": 437566, "epoch": 5271} {"train_loss": -26.738122940063477, "global_step": 437567, "epoch": 5271} {"train_loss": -26.820556640625, "global_step": 437568, "epoch": 5271} {"train_loss": -27.2591495513916, "global_step": 437569, "epoch": 5271} {"train_loss": -26.84586524963379, "global_step": 437570, "epoch": 5271} {"train_loss": -26.765905380249023, "global_step": 437571, "epoch": 5271} {"train_loss": -27.07758903503418, "global_step": 437572, "epoch": 5271} {"train_loss": -27.211328506469727, "global_step": 437573, "epoch": 5271} {"train_loss": -26.94573974609375, "global_step": 437574, "epoch": 5271} {"train_loss": -26.611886633447853, "global_step": 437575, "epoch": 5271, "val_loss": 6676441.0} {"train_loss": -25.45073699951172, "global_step": 437576, "epoch": 5272} {"train_loss": -25.7616024017334, "global_step": 437577, "epoch": 5272} {"train_loss": -26.311975479125977, "global_step": 437578, "epoch": 5272} {"train_loss": -26.57421875, "global_step": 437579, "epoch": 5272} {"train_loss": -25.85267448425293, "global_step": 437580, "epoch": 5272} {"train_loss": -26.566303253173828, "global_step": 437581, "epoch": 5272} {"train_loss": -26.356821060180664, "global_step": 437582, "epoch": 5272} {"train_loss": -26.14930534362793, "global_step": 437583, "epoch": 5272} {"train_loss": -26.47879981994629, "global_step": 437584, "epoch": 5272} {"train_loss": -26.199615478515625, "global_step": 437585, "epoch": 5272} {"train_loss": -26.752796173095703, "global_step": 437586, "epoch": 5272} {"train_loss": -26.356420516967773, "global_step": 437587, "epoch": 5272} {"train_loss": -26.753376007080078, "global_step": 437588, "epoch": 5272} {"train_loss": -26.21921730041504, "global_step": 437589, "epoch": 5272} {"train_loss": -26.413969039916992, "global_step": 437590, "epoch": 5272} {"train_loss": -26.51136589050293, "global_step": 437591, "epoch": 5272} {"train_loss": -26.491779327392578, "global_step": 437592, "epoch": 5272} {"train_loss": -26.374256134033203, "global_step": 437593, "epoch": 5272} {"train_loss": -26.81414222717285, "global_step": 437594, "epoch": 5272} {"train_loss": -26.416059494018555, "global_step": 437595, "epoch": 5272} {"train_loss": -26.919052124023438, "global_step": 437596, "epoch": 5272} {"train_loss": -26.535593032836914, "global_step": 437597, "epoch": 5272} {"train_loss": -26.837427139282227, "global_step": 437598, "epoch": 5272} {"train_loss": -26.997583389282227, "global_step": 437599, "epoch": 5272} {"train_loss": -27.0462646484375, "global_step": 437600, "epoch": 5272} {"train_loss": -26.77743911743164, "global_step": 437601, "epoch": 5272} {"train_loss": -26.997777938842773, "global_step": 437602, "epoch": 5272} {"train_loss": -26.439359664916992, "global_step": 437603, "epoch": 5272} {"train_loss": -26.769184112548828, "global_step": 437604, "epoch": 5272} {"train_loss": -26.681177139282227, "global_step": 437605, "epoch": 5272} {"train_loss": -26.89344596862793, "global_step": 437606, "epoch": 5272} {"train_loss": -26.856399536132812, "global_step": 437607, "epoch": 5272} {"train_loss": -26.788105010986328, "global_step": 437608, "epoch": 5272} {"train_loss": -26.6601619720459, "global_step": 437609, "epoch": 5272} {"train_loss": -27.032079696655273, "global_step": 437610, "epoch": 5272} {"train_loss": -26.772214889526367, "global_step": 437611, "epoch": 5272} {"train_loss": -26.925031661987305, "global_step": 437612, "epoch": 5272} {"train_loss": -27.279821395874023, "global_step": 437613, "epoch": 5272} {"train_loss": -26.8924560546875, "global_step": 437614, "epoch": 5272} {"train_loss": -27.261474609375, "global_step": 437615, "epoch": 5272} {"train_loss": -27.397140502929688, "global_step": 437616, "epoch": 5272} {"train_loss": -26.816232681274414, "global_step": 437617, "epoch": 5272} {"train_loss": -27.116296768188477, "global_step": 437618, "epoch": 5272} {"train_loss": -27.09226417541504, "global_step": 437619, "epoch": 5272} {"train_loss": -27.273008346557617, "global_step": 437620, "epoch": 5272} {"train_loss": -27.05951499938965, "global_step": 437621, "epoch": 5272} {"train_loss": -27.385351181030273, "global_step": 437622, "epoch": 5272} {"train_loss": -27.06307029724121, "global_step": 437623, "epoch": 5272} {"train_loss": -26.732587814331055, "global_step": 437624, "epoch": 5272} {"train_loss": -27.03400993347168, "global_step": 437625, "epoch": 5272} {"train_loss": -27.034809112548828, "global_step": 437626, "epoch": 5272} {"train_loss": -27.220447540283203, "global_step": 437627, "epoch": 5272} {"train_loss": -26.41282081604004, "global_step": 437628, "epoch": 5272} {"train_loss": -26.80853843688965, "global_step": 437629, "epoch": 5272} {"train_loss": -26.90645408630371, "global_step": 437630, "epoch": 5272} {"train_loss": -27.070104598999023, "global_step": 437631, "epoch": 5272} {"train_loss": -26.8456974029541, "global_step": 437632, "epoch": 5272} {"train_loss": -27.139678955078125, "global_step": 437633, "epoch": 5272} {"train_loss": -27.122421264648438, "global_step": 437634, "epoch": 5272} {"train_loss": -27.193653106689453, "global_step": 437635, "epoch": 5272} {"train_loss": -27.309234619140625, "global_step": 437636, "epoch": 5272} {"train_loss": -27.07229995727539, "global_step": 437637, "epoch": 5272} {"train_loss": -27.035037994384766, "global_step": 437638, "epoch": 5272} {"train_loss": -27.00862693786621, "global_step": 437639, "epoch": 5272} {"train_loss": -27.332080841064453, "global_step": 437640, "epoch": 5272} {"train_loss": -27.049741744995117, "global_step": 437641, "epoch": 5272} {"train_loss": -27.034330368041992, "global_step": 437642, "epoch": 5272} {"train_loss": -27.166980743408203, "global_step": 437643, "epoch": 5272} {"train_loss": -27.30360221862793, "global_step": 437644, "epoch": 5272} {"train_loss": -27.20172119140625, "global_step": 437645, "epoch": 5272} {"train_loss": -26.903783798217773, "global_step": 437646, "epoch": 5272} {"train_loss": -27.152908325195312, "global_step": 437647, "epoch": 5272} {"train_loss": -27.14606285095215, "global_step": 437648, "epoch": 5272} {"train_loss": -27.02113151550293, "global_step": 437649, "epoch": 5272} {"train_loss": -27.174503326416016, "global_step": 437650, "epoch": 5272} {"train_loss": -27.04269790649414, "global_step": 437651, "epoch": 5272} {"train_loss": -27.167478561401367, "global_step": 437652, "epoch": 5272} {"train_loss": -27.06534767150879, "global_step": 437653, "epoch": 5272} {"train_loss": -26.85273551940918, "global_step": 437654, "epoch": 5272} {"train_loss": -27.01597023010254, "global_step": 437655, "epoch": 5272} {"train_loss": -26.717023849487305, "global_step": 437656, "epoch": 5272} {"train_loss": -27.253314971923828, "global_step": 437657, "epoch": 5272} {"train_loss": -26.84675366045481, "global_step": 437658, "epoch": 5272, "val_loss": 6564114.5} {"train_loss": -26.6878719329834, "global_step": 437659, "epoch": 5273} {"train_loss": -27.03362464904785, "global_step": 437660, "epoch": 5273} {"train_loss": -26.988555908203125, "global_step": 437661, "epoch": 5273} {"train_loss": -26.750940322875977, "global_step": 437662, "epoch": 5273} {"train_loss": -26.77473258972168, "global_step": 437663, "epoch": 5273} {"train_loss": -27.02570152282715, "global_step": 437664, "epoch": 5273} {"train_loss": -26.723346710205078, "global_step": 437665, "epoch": 5273} {"train_loss": -26.900989532470703, "global_step": 437666, "epoch": 5273} {"train_loss": -26.03154945373535, "global_step": 437667, "epoch": 5273} {"train_loss": -27.065229415893555, "global_step": 437668, "epoch": 5273} {"train_loss": -26.58485221862793, "global_step": 437669, "epoch": 5273} {"train_loss": -26.57269859313965, "global_step": 437670, "epoch": 5273} {"train_loss": -27.139575958251953, "global_step": 437671, "epoch": 5273} {"train_loss": -26.254724502563477, "global_step": 437672, "epoch": 5273} {"train_loss": -26.752466201782227, "global_step": 437673, "epoch": 5273} {"train_loss": -26.71982765197754, "global_step": 437674, "epoch": 5273} {"train_loss": -26.598230361938477, "global_step": 437675, "epoch": 5273} {"train_loss": -26.47791862487793, "global_step": 437676, "epoch": 5273} {"train_loss": -26.869251251220703, "global_step": 437677, "epoch": 5273} {"train_loss": -26.6813907623291, "global_step": 437678, "epoch": 5273} {"train_loss": -26.837066650390625, "global_step": 437679, "epoch": 5273} {"train_loss": -26.77609634399414, "global_step": 437680, "epoch": 5273} {"train_loss": -26.651885986328125, "global_step": 437681, "epoch": 5273} {"train_loss": -26.248456954956055, "global_step": 437682, "epoch": 5273} {"train_loss": -26.494892120361328, "global_step": 437683, "epoch": 5273} {"train_loss": -26.62393569946289, "global_step": 437684, "epoch": 5273} {"train_loss": -27.02921485900879, "global_step": 437685, "epoch": 5273} {"train_loss": -26.738492965698242, "global_step": 437686, "epoch": 5273} {"train_loss": -26.76740074157715, "global_step": 437687, "epoch": 5273} {"train_loss": -27.06201171875, "global_step": 437688, "epoch": 5273} {"train_loss": -27.20918846130371, "global_step": 437689, "epoch": 5273} {"train_loss": -27.071380615234375, "global_step": 437690, "epoch": 5273} {"train_loss": -27.008935928344727, "global_step": 437691, "epoch": 5273} {"train_loss": -27.476348876953125, "global_step": 437692, "epoch": 5273} {"train_loss": -26.657873153686523, "global_step": 437693, "epoch": 5273} {"train_loss": -27.2600040435791, "global_step": 437694, "epoch": 5273} {"train_loss": -27.092313766479492, "global_step": 437695, "epoch": 5273} {"train_loss": -27.0575008392334, "global_step": 437696, "epoch": 5273} {"train_loss": -26.60288429260254, "global_step": 437697, "epoch": 5273} {"train_loss": -27.00623893737793, "global_step": 437698, "epoch": 5273} {"train_loss": -27.08967399597168, "global_step": 437699, "epoch": 5273} {"train_loss": -27.283735275268555, "global_step": 437700, "epoch": 5273} {"train_loss": -27.46735954284668, "global_step": 437701, "epoch": 5273} {"train_loss": -26.704809188842773, "global_step": 437702, "epoch": 5273} {"train_loss": -26.786352157592773, "global_step": 437703, "epoch": 5273} {"train_loss": -27.225845336914062, "global_step": 437704, "epoch": 5273} {"train_loss": -27.012296676635742, "global_step": 437705, "epoch": 5273} {"train_loss": -27.36575698852539, "global_step": 437706, "epoch": 5273} {"train_loss": -27.29762077331543, "global_step": 437707, "epoch": 5273} {"train_loss": -26.733373641967773, "global_step": 437708, "epoch": 5273} {"train_loss": -26.640424728393555, "global_step": 437709, "epoch": 5273} {"train_loss": -26.884687423706055, "global_step": 437710, "epoch": 5273} {"train_loss": -27.003576278686523, "global_step": 437711, "epoch": 5273} {"train_loss": -27.148563385009766, "global_step": 437712, "epoch": 5273} {"train_loss": -26.740772247314453, "global_step": 437713, "epoch": 5273} {"train_loss": -26.541845321655273, "global_step": 437714, "epoch": 5273} {"train_loss": -26.879796981811523, "global_step": 437715, "epoch": 5273} {"train_loss": -27.27971839904785, "global_step": 437716, "epoch": 5273} {"train_loss": -26.90586280822754, "global_step": 437717, "epoch": 5273} {"train_loss": -27.18259620666504, "global_step": 437718, "epoch": 5273} {"train_loss": -27.008203506469727, "global_step": 437719, "epoch": 5273} {"train_loss": -26.950550079345703, "global_step": 437720, "epoch": 5273} {"train_loss": -27.109344482421875, "global_step": 437721, "epoch": 5273} {"train_loss": -26.67331886291504, "global_step": 437722, "epoch": 5273} {"train_loss": -26.679929733276367, "global_step": 437723, "epoch": 5273} {"train_loss": -27.024763107299805, "global_step": 437724, "epoch": 5273} {"train_loss": -27.071033477783203, "global_step": 437725, "epoch": 5273} {"train_loss": -26.766254425048828, "global_step": 437726, "epoch": 5273} {"train_loss": -27.03827476501465, "global_step": 437727, "epoch": 5273} {"train_loss": -27.378997802734375, "global_step": 437728, "epoch": 5273} {"train_loss": -27.100183486938477, "global_step": 437729, "epoch": 5273} {"train_loss": -27.301488876342773, "global_step": 437730, "epoch": 5273} {"train_loss": -27.0323486328125, "global_step": 437731, "epoch": 5273} {"train_loss": -26.8696231842041, "global_step": 437732, "epoch": 5273} {"train_loss": -27.043554306030273, "global_step": 437733, "epoch": 5273} {"train_loss": -27.050750732421875, "global_step": 437734, "epoch": 5273} {"train_loss": -26.886768341064453, "global_step": 437735, "epoch": 5273} {"train_loss": -27.119192123413086, "global_step": 437736, "epoch": 5273} {"train_loss": -26.745519638061523, "global_step": 437737, "epoch": 5273} {"train_loss": -26.51515007019043, "global_step": 437738, "epoch": 5273} {"train_loss": -26.52790641784668, "global_step": 437739, "epoch": 5273} {"train_loss": -26.851226806640625, "global_step": 437740, "epoch": 5273} {"train_loss": -26.90205277592303, "global_step": 437741, "epoch": 5273, "val_loss": 6611091.0} {"train_loss": -26.29669761657715, "global_step": 437742, "epoch": 5274} {"train_loss": -25.798145294189453, "global_step": 437743, "epoch": 5274} {"train_loss": -25.33970069885254, "global_step": 437744, "epoch": 5274} {"train_loss": -26.7368106842041, "global_step": 437745, "epoch": 5274} {"train_loss": -26.437702178955078, "global_step": 437746, "epoch": 5274} {"train_loss": -26.328649520874023, "global_step": 437747, "epoch": 5274} {"train_loss": -26.484394073486328, "global_step": 437748, "epoch": 5274} {"train_loss": -26.094091415405273, "global_step": 437749, "epoch": 5274} {"train_loss": -26.419544219970703, "global_step": 437750, "epoch": 5274} {"train_loss": -26.53997802734375, "global_step": 437751, "epoch": 5274} {"train_loss": -26.383056640625, "global_step": 437752, "epoch": 5274} {"train_loss": -26.245559692382812, "global_step": 437753, "epoch": 5274} {"train_loss": -26.628812789916992, "global_step": 437754, "epoch": 5274} {"train_loss": -26.460010528564453, "global_step": 437755, "epoch": 5274} {"train_loss": -26.933950424194336, "global_step": 437756, "epoch": 5274} {"train_loss": -26.901269912719727, "global_step": 437757, "epoch": 5274} {"train_loss": -26.758955001831055, "global_step": 437758, "epoch": 5274} {"train_loss": -26.948617935180664, "global_step": 437759, "epoch": 5274} {"train_loss": -26.886932373046875, "global_step": 437760, "epoch": 5274} {"train_loss": -26.824234008789062, "global_step": 437761, "epoch": 5274} {"train_loss": -26.706195831298828, "global_step": 437762, "epoch": 5274} {"train_loss": -27.025548934936523, "global_step": 437763, "epoch": 5274} {"train_loss": -26.727771759033203, "global_step": 437764, "epoch": 5274} {"train_loss": -27.12786293029785, "global_step": 437765, "epoch": 5274} {"train_loss": -27.010223388671875, "global_step": 437766, "epoch": 5274} {"train_loss": -26.78595542907715, "global_step": 437767, "epoch": 5274} {"train_loss": -27.067487716674805, "global_step": 437768, "epoch": 5274} {"train_loss": -27.002347946166992, "global_step": 437769, "epoch": 5274} {"train_loss": -27.066293716430664, "global_step": 437770, "epoch": 5274} {"train_loss": -26.84395408630371, "global_step": 437771, "epoch": 5274} {"train_loss": -26.96738624572754, "global_step": 437772, "epoch": 5274} {"train_loss": -27.121240615844727, "global_step": 437773, "epoch": 5274} {"train_loss": -26.62100601196289, "global_step": 437774, "epoch": 5274} {"train_loss": -27.240087509155273, "global_step": 437775, "epoch": 5274} {"train_loss": -27.037841796875, "global_step": 437776, "epoch": 5274} {"train_loss": -27.01559829711914, "global_step": 437777, "epoch": 5274} {"train_loss": -27.01569175720215, "global_step": 437778, "epoch": 5274} {"train_loss": -27.277441024780273, "global_step": 437779, "epoch": 5274} {"train_loss": -26.949121475219727, "global_step": 437780, "epoch": 5274} {"train_loss": -26.779067993164062, "global_step": 437781, "epoch": 5274} {"train_loss": -26.915851593017578, "global_step": 437782, "epoch": 5274} {"train_loss": -27.224515914916992, "global_step": 437783, "epoch": 5274} {"train_loss": -26.776382446289062, "global_step": 437784, "epoch": 5274} {"train_loss": -26.990530014038086, "global_step": 437785, "epoch": 5274} {"train_loss": -26.770986557006836, "global_step": 437786, "epoch": 5274} {"train_loss": -26.918304443359375, "global_step": 437787, "epoch": 5274} {"train_loss": -26.737241744995117, "global_step": 437788, "epoch": 5274} {"train_loss": -26.849212646484375, "global_step": 437789, "epoch": 5274} {"train_loss": -26.696332931518555, "global_step": 437790, "epoch": 5274} {"train_loss": -27.077951431274414, "global_step": 437791, "epoch": 5274} {"train_loss": -26.945764541625977, "global_step": 437792, "epoch": 5274} {"train_loss": -27.113134384155273, "global_step": 437793, "epoch": 5274} {"train_loss": -27.001678466796875, "global_step": 437794, "epoch": 5274} {"train_loss": -26.586816787719727, "global_step": 437795, "epoch": 5274} {"train_loss": -26.377893447875977, "global_step": 437796, "epoch": 5274} {"train_loss": -26.39837646484375, "global_step": 437797, "epoch": 5274} {"train_loss": -26.801172256469727, "global_step": 437798, "epoch": 5274} {"train_loss": -26.4365234375, "global_step": 437799, "epoch": 5274} {"train_loss": -26.85329246520996, "global_step": 437800, "epoch": 5274} {"train_loss": -26.488250732421875, "global_step": 437801, "epoch": 5274} {"train_loss": -26.840591430664062, "global_step": 437802, "epoch": 5274} {"train_loss": -27.220630645751953, "global_step": 437803, "epoch": 5274} {"train_loss": -26.55799674987793, "global_step": 437804, "epoch": 5274} {"train_loss": -26.640567779541016, "global_step": 437805, "epoch": 5274} {"train_loss": -27.021841049194336, "global_step": 437806, "epoch": 5274} {"train_loss": -26.667707443237305, "global_step": 437807, "epoch": 5274} {"train_loss": -26.874469757080078, "global_step": 437808, "epoch": 5274} {"train_loss": -26.8776912689209, "global_step": 437809, "epoch": 5274} {"train_loss": -26.925540924072266, "global_step": 437810, "epoch": 5274} {"train_loss": -26.233509063720703, "global_step": 437811, "epoch": 5274} {"train_loss": -26.748682022094727, "global_step": 437812, "epoch": 5274} {"train_loss": -26.642541885375977, "global_step": 437813, "epoch": 5274} {"train_loss": -27.06084632873535, "global_step": 437814, "epoch": 5274} {"train_loss": -26.26740837097168, "global_step": 437815, "epoch": 5274} {"train_loss": -27.058673858642578, "global_step": 437816, "epoch": 5274} {"train_loss": -26.728534698486328, "global_step": 437817, "epoch": 5274} {"train_loss": -27.1442813873291, "global_step": 437818, "epoch": 5274} {"train_loss": -27.070667266845703, "global_step": 437819, "epoch": 5274} {"train_loss": -26.799213409423828, "global_step": 437820, "epoch": 5274} {"train_loss": -26.875934600830078, "global_step": 437821, "epoch": 5274} {"train_loss": -26.993865966796875, "global_step": 437822, "epoch": 5274} {"train_loss": -26.824716567993164, "global_step": 437823, "epoch": 5274} {"train_loss": -26.752204734158802, "global_step": 437824, "epoch": 5274, "val_loss": 6626441.5} {"train_loss": -26.190881729125977, "global_step": 437825, "epoch": 5275} {"train_loss": -26.24410057067871, "global_step": 437826, "epoch": 5275} {"train_loss": -26.708471298217773, "global_step": 437827, "epoch": 5275} {"train_loss": -26.486886978149414, "global_step": 437828, "epoch": 5275} {"train_loss": -26.56153678894043, "global_step": 437829, "epoch": 5275} {"train_loss": -26.337085723876953, "global_step": 437830, "epoch": 5275} {"train_loss": -26.910165786743164, "global_step": 437831, "epoch": 5275} {"train_loss": -26.546899795532227, "global_step": 437832, "epoch": 5275} {"train_loss": -26.95370864868164, "global_step": 437833, "epoch": 5275} {"train_loss": -26.909561157226562, "global_step": 437834, "epoch": 5275} {"train_loss": -26.63818359375, "global_step": 437835, "epoch": 5275} {"train_loss": -26.346872329711914, "global_step": 437836, "epoch": 5275} {"train_loss": -26.773374557495117, "global_step": 437837, "epoch": 5275} {"train_loss": -26.862390518188477, "global_step": 437838, "epoch": 5275} {"train_loss": -26.419097900390625, "global_step": 437839, "epoch": 5275} {"train_loss": -26.980213165283203, "global_step": 437840, "epoch": 5275} {"train_loss": -26.78547477722168, "global_step": 437841, "epoch": 5275} {"train_loss": -26.9913387298584, "global_step": 437842, "epoch": 5275} {"train_loss": -26.897245407104492, "global_step": 437843, "epoch": 5275} {"train_loss": -27.07942008972168, "global_step": 437844, "epoch": 5275} {"train_loss": -26.94416618347168, "global_step": 437845, "epoch": 5275} {"train_loss": -26.809528350830078, "global_step": 437846, "epoch": 5275} {"train_loss": -26.474578857421875, "global_step": 437847, "epoch": 5275} {"train_loss": -26.965295791625977, "global_step": 437848, "epoch": 5275} {"train_loss": -26.8790225982666, "global_step": 437849, "epoch": 5275} {"train_loss": -27.0911808013916, "global_step": 437850, "epoch": 5275} {"train_loss": -26.80913734436035, "global_step": 437851, "epoch": 5275} {"train_loss": -27.45052146911621, "global_step": 437852, "epoch": 5275} {"train_loss": -27.096364974975586, "global_step": 437853, "epoch": 5275} {"train_loss": -27.186429977416992, "global_step": 437854, "epoch": 5275} {"train_loss": -27.20711326599121, "global_step": 437855, "epoch": 5275} {"train_loss": -27.203771591186523, "global_step": 437856, "epoch": 5275} {"train_loss": -27.27278709411621, "global_step": 437857, "epoch": 5275} {"train_loss": -26.854429244995117, "global_step": 437858, "epoch": 5275} {"train_loss": -26.96895408630371, "global_step": 437859, "epoch": 5275} {"train_loss": -27.274322509765625, "global_step": 437860, "epoch": 5275} {"train_loss": -27.37664794921875, "global_step": 437861, "epoch": 5275} {"train_loss": -27.244169235229492, "global_step": 437862, "epoch": 5275} {"train_loss": -26.919097900390625, "global_step": 437863, "epoch": 5275} {"train_loss": -27.3986759185791, "global_step": 437864, "epoch": 5275} {"train_loss": -26.974136352539062, "global_step": 437865, "epoch": 5275} {"train_loss": -27.169544219970703, "global_step": 437866, "epoch": 5275} {"train_loss": -26.90192985534668, "global_step": 437867, "epoch": 5275} {"train_loss": -27.021289825439453, "global_step": 437868, "epoch": 5275} {"train_loss": -26.5725154876709, "global_step": 437869, "epoch": 5275} {"train_loss": -26.245481491088867, "global_step": 437870, "epoch": 5275} {"train_loss": -26.419736862182617, "global_step": 437871, "epoch": 5275} {"train_loss": -26.364850997924805, "global_step": 437872, "epoch": 5275} {"train_loss": -26.87312126159668, "global_step": 437873, "epoch": 5275} {"train_loss": -26.944055557250977, "global_step": 437874, "epoch": 5275} {"train_loss": -26.573047637939453, "global_step": 437875, "epoch": 5275} {"train_loss": -26.6770076751709, "global_step": 437876, "epoch": 5275} {"train_loss": -26.768888473510742, "global_step": 437877, "epoch": 5275} {"train_loss": -26.61980628967285, "global_step": 437878, "epoch": 5275} {"train_loss": -26.918277740478516, "global_step": 437879, "epoch": 5275} {"train_loss": -27.22247886657715, "global_step": 437880, "epoch": 5275} {"train_loss": -26.631322860717773, "global_step": 437881, "epoch": 5275} {"train_loss": -26.88623046875, "global_step": 437882, "epoch": 5275} {"train_loss": -26.96942710876465, "global_step": 437883, "epoch": 5275} {"train_loss": -27.06939125061035, "global_step": 437884, "epoch": 5275} {"train_loss": -26.961639404296875, "global_step": 437885, "epoch": 5275} {"train_loss": -26.915847778320312, "global_step": 437886, "epoch": 5275} {"train_loss": -26.703994750976562, "global_step": 437887, "epoch": 5275} {"train_loss": -27.101139068603516, "global_step": 437888, "epoch": 5275} {"train_loss": -26.825284957885742, "global_step": 437889, "epoch": 5275} {"train_loss": -27.078155517578125, "global_step": 437890, "epoch": 5275} {"train_loss": -27.213703155517578, "global_step": 437891, "epoch": 5275} {"train_loss": -26.9152774810791, "global_step": 437892, "epoch": 5275} {"train_loss": -27.195804595947266, "global_step": 437893, "epoch": 5275} {"train_loss": -26.728504180908203, "global_step": 437894, "epoch": 5275} {"train_loss": -27.209457397460938, "global_step": 437895, "epoch": 5275} {"train_loss": -26.79302406311035, "global_step": 437896, "epoch": 5275} {"train_loss": -26.9747314453125, "global_step": 437897, "epoch": 5275} {"train_loss": -27.026193618774414, "global_step": 437898, "epoch": 5275} {"train_loss": -26.823699951171875, "global_step": 437899, "epoch": 5275} {"train_loss": -27.06195068359375, "global_step": 437900, "epoch": 5275} {"train_loss": -27.164703369140625, "global_step": 437901, "epoch": 5275} {"train_loss": -27.101764678955078, "global_step": 437902, "epoch": 5275} {"train_loss": -26.712324142456055, "global_step": 437903, "epoch": 5275} {"train_loss": -27.12139892578125, "global_step": 437904, "epoch": 5275} {"train_loss": -26.684736251831055, "global_step": 437905, "epoch": 5275} {"train_loss": -27.251300811767578, "global_step": 437906, "epoch": 5275} {"train_loss": -26.890213771038745, "global_step": 437907, "epoch": 5275, "val_loss": 6652260.5} {"train_loss": -25.6510009765625, "global_step": 437908, "epoch": 5276} {"train_loss": -25.954153060913086, "global_step": 437909, "epoch": 5276} {"train_loss": -26.028034210205078, "global_step": 437910, "epoch": 5276} {"train_loss": -26.696664810180664, "global_step": 437911, "epoch": 5276} {"train_loss": -25.98419761657715, "global_step": 437912, "epoch": 5276} {"train_loss": -25.54408836364746, "global_step": 437913, "epoch": 5276} {"train_loss": -26.05417251586914, "global_step": 437914, "epoch": 5276} {"train_loss": -25.690631866455078, "global_step": 437915, "epoch": 5276} {"train_loss": -26.35663414001465, "global_step": 437916, "epoch": 5276} {"train_loss": -26.56148338317871, "global_step": 437917, "epoch": 5276} {"train_loss": -25.78122901916504, "global_step": 437918, "epoch": 5276} {"train_loss": -25.824634552001953, "global_step": 437919, "epoch": 5276} {"train_loss": -26.3765869140625, "global_step": 437920, "epoch": 5276} {"train_loss": -26.58388328552246, "global_step": 437921, "epoch": 5276} {"train_loss": -26.14485740661621, "global_step": 437922, "epoch": 5276} {"train_loss": -26.09384536743164, "global_step": 437923, "epoch": 5276} {"train_loss": -26.2419490814209, "global_step": 437924, "epoch": 5276} {"train_loss": -25.991851806640625, "global_step": 437925, "epoch": 5276} {"train_loss": -25.776636123657227, "global_step": 437926, "epoch": 5276} {"train_loss": -26.3348445892334, "global_step": 437927, "epoch": 5276} {"train_loss": -26.24390983581543, "global_step": 437928, "epoch": 5276} {"train_loss": -26.53303337097168, "global_step": 437929, "epoch": 5276} {"train_loss": -26.338022232055664, "global_step": 437930, "epoch": 5276} {"train_loss": -26.585174560546875, "global_step": 437931, "epoch": 5276} {"train_loss": -26.71820640563965, "global_step": 437932, "epoch": 5276} {"train_loss": -26.69947624206543, "global_step": 437933, "epoch": 5276} {"train_loss": -26.67445182800293, "global_step": 437934, "epoch": 5276} {"train_loss": -26.703311920166016, "global_step": 437935, "epoch": 5276} {"train_loss": -26.781513214111328, "global_step": 437936, "epoch": 5276} {"train_loss": -26.779987335205078, "global_step": 437937, "epoch": 5276} {"train_loss": -26.855091094970703, "global_step": 437938, "epoch": 5276} {"train_loss": -26.544998168945312, "global_step": 437939, "epoch": 5276} {"train_loss": -26.33770751953125, "global_step": 437940, "epoch": 5276} {"train_loss": -26.982330322265625, "global_step": 437941, "epoch": 5276} {"train_loss": -26.9136905670166, "global_step": 437942, "epoch": 5276} {"train_loss": -26.820205688476562, "global_step": 437943, "epoch": 5276} {"train_loss": -26.731184005737305, "global_step": 437944, "epoch": 5276} {"train_loss": -27.38138198852539, "global_step": 437945, "epoch": 5276} {"train_loss": -26.830434799194336, "global_step": 437946, "epoch": 5276} {"train_loss": -27.125, "global_step": 437947, "epoch": 5276} {"train_loss": -26.58131217956543, "global_step": 437948, "epoch": 5276} {"train_loss": -26.93250846862793, "global_step": 437949, "epoch": 5276} {"train_loss": -27.13517189025879, "global_step": 437950, "epoch": 5276} {"train_loss": -27.13706398010254, "global_step": 437951, "epoch": 5276} {"train_loss": -26.827960968017578, "global_step": 437952, "epoch": 5276} {"train_loss": -26.946929931640625, "global_step": 437953, "epoch": 5276} {"train_loss": -26.830245971679688, "global_step": 437954, "epoch": 5276} {"train_loss": -26.741796493530273, "global_step": 437955, "epoch": 5276} {"train_loss": -27.227863311767578, "global_step": 437956, "epoch": 5276} {"train_loss": -26.73621940612793, "global_step": 437957, "epoch": 5276} {"train_loss": -26.670942306518555, "global_step": 437958, "epoch": 5276} {"train_loss": -27.12153434753418, "global_step": 437959, "epoch": 5276} {"train_loss": -27.477773666381836, "global_step": 437960, "epoch": 5276} {"train_loss": -27.190494537353516, "global_step": 437961, "epoch": 5276} {"train_loss": -27.098241806030273, "global_step": 437962, "epoch": 5276} {"train_loss": -26.96770668029785, "global_step": 437963, "epoch": 5276} {"train_loss": -26.988733291625977, "global_step": 437964, "epoch": 5276} {"train_loss": -26.931461334228516, "global_step": 437965, "epoch": 5276} {"train_loss": -26.8253116607666, "global_step": 437966, "epoch": 5276} {"train_loss": -27.019840240478516, "global_step": 437967, "epoch": 5276} {"train_loss": -26.956989288330078, "global_step": 437968, "epoch": 5276} {"train_loss": -26.92620849609375, "global_step": 437969, "epoch": 5276} {"train_loss": -27.274091720581055, "global_step": 437970, "epoch": 5276} {"train_loss": -27.090612411499023, "global_step": 437971, "epoch": 5276} {"train_loss": -27.126483917236328, "global_step": 437972, "epoch": 5276} {"train_loss": -27.291418075561523, "global_step": 437973, "epoch": 5276} {"train_loss": -26.985187530517578, "global_step": 437974, "epoch": 5276} {"train_loss": -27.242979049682617, "global_step": 437975, "epoch": 5276} {"train_loss": -27.147611618041992, "global_step": 437976, "epoch": 5276} {"train_loss": -27.066125869750977, "global_step": 437977, "epoch": 5276} {"train_loss": -27.11517906188965, "global_step": 437978, "epoch": 5276} {"train_loss": -27.246429443359375, "global_step": 437979, "epoch": 5276} {"train_loss": -27.005552291870117, "global_step": 437980, "epoch": 5276} {"train_loss": -27.4473934173584, "global_step": 437981, "epoch": 5276} {"train_loss": -27.295286178588867, "global_step": 437982, "epoch": 5276} {"train_loss": -27.33696937561035, "global_step": 437983, "epoch": 5276} {"train_loss": -27.12445640563965, "global_step": 437984, "epoch": 5276} {"train_loss": -27.302783966064453, "global_step": 437985, "epoch": 5276} {"train_loss": -27.257816314697266, "global_step": 437986, "epoch": 5276} {"train_loss": -27.037418365478516, "global_step": 437987, "epoch": 5276} {"train_loss": -27.024667739868164, "global_step": 437988, "epoch": 5276} {"train_loss": -26.721725463867188, "global_step": 437989, "epoch": 5276} {"train_loss": -26.748565375086773, "global_step": 437990, "epoch": 5276, "val_loss": 6677355.0} {"train_loss": -26.107954025268555, "global_step": 437991, "epoch": 5277} {"train_loss": -24.987600326538086, "global_step": 437992, "epoch": 5277} {"train_loss": -24.176197052001953, "global_step": 437993, "epoch": 5277} {"train_loss": -25.524106979370117, "global_step": 437994, "epoch": 5277} {"train_loss": -25.79905128479004, "global_step": 437995, "epoch": 5277} {"train_loss": -25.788618087768555, "global_step": 437996, "epoch": 5277} {"train_loss": -25.6545467376709, "global_step": 437997, "epoch": 5277} {"train_loss": -26.3209228515625, "global_step": 437998, "epoch": 5277} {"train_loss": -25.36871910095215, "global_step": 437999, "epoch": 5277} {"train_loss": -26.206533432006836, "global_step": 438000, "epoch": 5277} {"train_loss": -26.044544219970703, "global_step": 438001, "epoch": 5277} {"train_loss": -26.146875381469727, "global_step": 438002, "epoch": 5277} {"train_loss": -26.052383422851562, "global_step": 438003, "epoch": 5277} {"train_loss": -26.076251983642578, "global_step": 438004, "epoch": 5277} {"train_loss": -26.381423950195312, "global_step": 438005, "epoch": 5277} {"train_loss": -26.375524520874023, "global_step": 438006, "epoch": 5277} {"train_loss": -26.095523834228516, "global_step": 438007, "epoch": 5277} {"train_loss": -26.517322540283203, "global_step": 438008, "epoch": 5277} {"train_loss": -26.541418075561523, "global_step": 438009, "epoch": 5277} {"train_loss": -26.193647384643555, "global_step": 438010, "epoch": 5277} {"train_loss": -26.52777671813965, "global_step": 438011, "epoch": 5277} {"train_loss": -26.526264190673828, "global_step": 438012, "epoch": 5277} {"train_loss": -26.66131019592285, "global_step": 438013, "epoch": 5277} {"train_loss": -27.032928466796875, "global_step": 438014, "epoch": 5277} {"train_loss": -26.539794921875, "global_step": 438015, "epoch": 5277} {"train_loss": -26.55348777770996, "global_step": 438016, "epoch": 5277} {"train_loss": -26.920761108398438, "global_step": 438017, "epoch": 5277} {"train_loss": -26.961395263671875, "global_step": 438018, "epoch": 5277} {"train_loss": -26.69099235534668, "global_step": 438019, "epoch": 5277} {"train_loss": -26.676584243774414, "global_step": 438020, "epoch": 5277} {"train_loss": -26.916242599487305, "global_step": 438021, "epoch": 5277} {"train_loss": -26.75858497619629, "global_step": 438022, "epoch": 5277} {"train_loss": -26.657529830932617, "global_step": 438023, "epoch": 5277} {"train_loss": -26.444473266601562, "global_step": 438024, "epoch": 5277} {"train_loss": -26.802947998046875, "global_step": 438025, "epoch": 5277} {"train_loss": -26.997583389282227, "global_step": 438026, "epoch": 5277} {"train_loss": -26.848508834838867, "global_step": 438027, "epoch": 5277} {"train_loss": -26.897186279296875, "global_step": 438028, "epoch": 5277} {"train_loss": -27.191328048706055, "global_step": 438029, "epoch": 5277} {"train_loss": -26.989505767822266, "global_step": 438030, "epoch": 5277} {"train_loss": -27.041357040405273, "global_step": 438031, "epoch": 5277} {"train_loss": -26.93292808532715, "global_step": 438032, "epoch": 5277} {"train_loss": -26.696374893188477, "global_step": 438033, "epoch": 5277} {"train_loss": -27.202646255493164, "global_step": 438034, "epoch": 5277} {"train_loss": -27.162689208984375, "global_step": 438035, "epoch": 5277} {"train_loss": -26.687393188476562, "global_step": 438036, "epoch": 5277} {"train_loss": -27.234359741210938, "global_step": 438037, "epoch": 5277} {"train_loss": -27.24658203125, "global_step": 438038, "epoch": 5277} {"train_loss": -27.226367950439453, "global_step": 438039, "epoch": 5277} {"train_loss": -26.765439987182617, "global_step": 438040, "epoch": 5277} {"train_loss": -26.819440841674805, "global_step": 438041, "epoch": 5277} {"train_loss": -26.9908390045166, "global_step": 438042, "epoch": 5277} {"train_loss": -27.021442413330078, "global_step": 438043, "epoch": 5277} {"train_loss": -27.072534561157227, "global_step": 438044, "epoch": 5277} {"train_loss": -27.1358642578125, "global_step": 438045, "epoch": 5277} {"train_loss": -26.80574607849121, "global_step": 438046, "epoch": 5277} {"train_loss": -26.856430053710938, "global_step": 438047, "epoch": 5277} {"train_loss": -26.953998565673828, "global_step": 438048, "epoch": 5277} {"train_loss": -27.2372989654541, "global_step": 438049, "epoch": 5277} {"train_loss": -27.0933780670166, "global_step": 438050, "epoch": 5277} {"train_loss": -27.151153564453125, "global_step": 438051, "epoch": 5277} {"train_loss": -26.94841957092285, "global_step": 438052, "epoch": 5277} {"train_loss": -27.326202392578125, "global_step": 438053, "epoch": 5277} {"train_loss": -27.013586044311523, "global_step": 438054, "epoch": 5277} {"train_loss": -27.02971839904785, "global_step": 438055, "epoch": 5277} {"train_loss": -26.993423461914062, "global_step": 438056, "epoch": 5277} {"train_loss": -27.46234130859375, "global_step": 438057, "epoch": 5277} {"train_loss": -27.368438720703125, "global_step": 438058, "epoch": 5277} {"train_loss": -27.243179321289062, "global_step": 438059, "epoch": 5277} {"train_loss": -27.117517471313477, "global_step": 438060, "epoch": 5277} {"train_loss": -27.038923263549805, "global_step": 438061, "epoch": 5277} {"train_loss": -26.996856689453125, "global_step": 438062, "epoch": 5277} {"train_loss": -27.440906524658203, "global_step": 438063, "epoch": 5277} {"train_loss": -27.022146224975586, "global_step": 438064, "epoch": 5277} {"train_loss": -26.928613662719727, "global_step": 438065, "epoch": 5277} {"train_loss": -27.02436637878418, "global_step": 438066, "epoch": 5277} {"train_loss": -27.115528106689453, "global_step": 438067, "epoch": 5277} {"train_loss": -26.9967098236084, "global_step": 438068, "epoch": 5277} {"train_loss": -27.309316635131836, "global_step": 438069, "epoch": 5277} {"train_loss": -27.025009155273438, "global_step": 438070, "epoch": 5277} {"train_loss": -27.255573272705078, "global_step": 438071, "epoch": 5277} {"train_loss": -26.537067413330078, "global_step": 438072, "epoch": 5277} {"train_loss": -26.693200996123164, "global_step": 438073, "epoch": 5277, "val_loss": 6663896.5} {"train_loss": -25.545394897460938, "global_step": 438074, "epoch": 5278} {"train_loss": -25.692291259765625, "global_step": 438075, "epoch": 5278} {"train_loss": -25.45289421081543, "global_step": 438076, "epoch": 5278} {"train_loss": -25.439167022705078, "global_step": 438077, "epoch": 5278} {"train_loss": -26.212621688842773, "global_step": 438078, "epoch": 5278} {"train_loss": -25.415258407592773, "global_step": 438079, "epoch": 5278} {"train_loss": -26.032150268554688, "global_step": 438080, "epoch": 5278} {"train_loss": -26.3079891204834, "global_step": 438081, "epoch": 5278} {"train_loss": -26.15768814086914, "global_step": 438082, "epoch": 5278} {"train_loss": -25.77962303161621, "global_step": 438083, "epoch": 5278} {"train_loss": -26.537771224975586, "global_step": 438084, "epoch": 5278} {"train_loss": -26.0861873626709, "global_step": 438085, "epoch": 5278} {"train_loss": -26.36419677734375, "global_step": 438086, "epoch": 5278} {"train_loss": -26.16459083557129, "global_step": 438087, "epoch": 5278} {"train_loss": -26.67279052734375, "global_step": 438088, "epoch": 5278} {"train_loss": -26.35462760925293, "global_step": 438089, "epoch": 5278} {"train_loss": -26.471027374267578, "global_step": 438090, "epoch": 5278} {"train_loss": -26.663166046142578, "global_step": 438091, "epoch": 5278} {"train_loss": -26.4683837890625, "global_step": 438092, "epoch": 5278} {"train_loss": -26.361312866210938, "global_step": 438093, "epoch": 5278} {"train_loss": -26.34173011779785, "global_step": 438094, "epoch": 5278} {"train_loss": -26.5386905670166, "global_step": 438095, "epoch": 5278} {"train_loss": -26.372669219970703, "global_step": 438096, "epoch": 5278} {"train_loss": -26.652469635009766, "global_step": 438097, "epoch": 5278} {"train_loss": -26.5950984954834, "global_step": 438098, "epoch": 5278} {"train_loss": -26.780126571655273, "global_step": 438099, "epoch": 5278} {"train_loss": -26.350976943969727, "global_step": 438100, "epoch": 5278} {"train_loss": -26.787322998046875, "global_step": 438101, "epoch": 5278} {"train_loss": -26.64893913269043, "global_step": 438102, "epoch": 5278} {"train_loss": -26.654264450073242, "global_step": 438103, "epoch": 5278} {"train_loss": -26.952747344970703, "global_step": 438104, "epoch": 5278} {"train_loss": -26.883026123046875, "global_step": 438105, "epoch": 5278} {"train_loss": -26.691364288330078, "global_step": 438106, "epoch": 5278} {"train_loss": -26.439472198486328, "global_step": 438107, "epoch": 5278} {"train_loss": -26.781721115112305, "global_step": 438108, "epoch": 5278} {"train_loss": -26.7011775970459, "global_step": 438109, "epoch": 5278} {"train_loss": -26.755706787109375, "global_step": 438110, "epoch": 5278} {"train_loss": -27.25715446472168, "global_step": 438111, "epoch": 5278} {"train_loss": -26.912458419799805, "global_step": 438112, "epoch": 5278} {"train_loss": -26.7186336517334, "global_step": 438113, "epoch": 5278} {"train_loss": -26.968769073486328, "global_step": 438114, "epoch": 5278} {"train_loss": -26.98834228515625, "global_step": 438115, "epoch": 5278} {"train_loss": -26.611417770385742, "global_step": 438116, "epoch": 5278} {"train_loss": -26.98579978942871, "global_step": 438117, "epoch": 5278} {"train_loss": -26.757246017456055, "global_step": 438118, "epoch": 5278} {"train_loss": -26.770883560180664, "global_step": 438119, "epoch": 5278} {"train_loss": -26.788959503173828, "global_step": 438120, "epoch": 5278} {"train_loss": -27.065515518188477, "global_step": 438121, "epoch": 5278} {"train_loss": -27.1207218170166, "global_step": 438122, "epoch": 5278} {"train_loss": -27.19877052307129, "global_step": 438123, "epoch": 5278} {"train_loss": -27.567068099975586, "global_step": 438124, "epoch": 5278} {"train_loss": -26.982091903686523, "global_step": 438125, "epoch": 5278} {"train_loss": -26.922534942626953, "global_step": 438126, "epoch": 5278} {"train_loss": -26.81940269470215, "global_step": 438127, "epoch": 5278} {"train_loss": -26.824262619018555, "global_step": 438128, "epoch": 5278} {"train_loss": -26.77907371520996, "global_step": 438129, "epoch": 5278} {"train_loss": -26.947484970092773, "global_step": 438130, "epoch": 5278} {"train_loss": -27.44765281677246, "global_step": 438131, "epoch": 5278} {"train_loss": -26.8399658203125, "global_step": 438132, "epoch": 5278} {"train_loss": -26.9510498046875, "global_step": 438133, "epoch": 5278} {"train_loss": -27.094324111938477, "global_step": 438134, "epoch": 5278} {"train_loss": -26.99321937561035, "global_step": 438135, "epoch": 5278} {"train_loss": -26.871234893798828, "global_step": 438136, "epoch": 5278} {"train_loss": -26.662160873413086, "global_step": 438137, "epoch": 5278} {"train_loss": -26.527494430541992, "global_step": 438138, "epoch": 5278} {"train_loss": -26.7542667388916, "global_step": 438139, "epoch": 5278} {"train_loss": -26.354406356811523, "global_step": 438140, "epoch": 5278} {"train_loss": -26.891117095947266, "global_step": 438141, "epoch": 5278} {"train_loss": -26.90186882019043, "global_step": 438142, "epoch": 5278} {"train_loss": -26.428466796875, "global_step": 438143, "epoch": 5278} {"train_loss": -26.4571475982666, "global_step": 438144, "epoch": 5278} {"train_loss": -26.561498641967773, "global_step": 438145, "epoch": 5278} {"train_loss": -26.964950561523438, "global_step": 438146, "epoch": 5278} {"train_loss": -26.83674430847168, "global_step": 438147, "epoch": 5278} {"train_loss": -26.53376579284668, "global_step": 438148, "epoch": 5278} {"train_loss": -27.232177734375, "global_step": 438149, "epoch": 5278} {"train_loss": -27.030969619750977, "global_step": 438150, "epoch": 5278} {"train_loss": -26.798486709594727, "global_step": 438151, "epoch": 5278} {"train_loss": -26.98528480529785, "global_step": 438152, "epoch": 5278} {"train_loss": -27.004215240478516, "global_step": 438153, "epoch": 5278} {"train_loss": -26.997705459594727, "global_step": 438154, "epoch": 5278} {"train_loss": -27.02353858947754, "global_step": 438155, "epoch": 5278} {"train_loss": -26.656770867037487, "global_step": 438156, "epoch": 5278, "val_loss": 6560659.0} {"train_loss": -26.47829246520996, "global_step": 438157, "epoch": 5279} {"train_loss": -26.03277015686035, "global_step": 438158, "epoch": 5279} {"train_loss": -25.39191246032715, "global_step": 438159, "epoch": 5279} {"train_loss": -26.149824142456055, "global_step": 438160, "epoch": 5279} {"train_loss": -25.318090438842773, "global_step": 438161, "epoch": 5279} {"train_loss": -26.244836807250977, "global_step": 438162, "epoch": 5279} {"train_loss": -25.892715454101562, "global_step": 438163, "epoch": 5279} {"train_loss": -26.233936309814453, "global_step": 438164, "epoch": 5279} {"train_loss": -26.131607055664062, "global_step": 438165, "epoch": 5279} {"train_loss": -25.907424926757812, "global_step": 438166, "epoch": 5279} {"train_loss": -25.96917152404785, "global_step": 438167, "epoch": 5279} {"train_loss": -26.254236221313477, "global_step": 438168, "epoch": 5279} {"train_loss": -25.789697647094727, "global_step": 438169, "epoch": 5279} {"train_loss": -26.14088249206543, "global_step": 438170, "epoch": 5279} {"train_loss": -26.18255043029785, "global_step": 438171, "epoch": 5279} {"train_loss": -26.239990234375, "global_step": 438172, "epoch": 5279} {"train_loss": -26.233861923217773, "global_step": 438173, "epoch": 5279} {"train_loss": -26.34027671813965, "global_step": 438174, "epoch": 5279} {"train_loss": -26.382659912109375, "global_step": 438175, "epoch": 5279} {"train_loss": -26.11396598815918, "global_step": 438176, "epoch": 5279} {"train_loss": -26.195363998413086, "global_step": 438177, "epoch": 5279} {"train_loss": -26.485395431518555, "global_step": 438178, "epoch": 5279} {"train_loss": -26.271635055541992, "global_step": 438179, "epoch": 5279} {"train_loss": -26.84492301940918, "global_step": 438180, "epoch": 5279} {"train_loss": -26.5095272064209, "global_step": 438181, "epoch": 5279} {"train_loss": -26.235273361206055, "global_step": 438182, "epoch": 5279} {"train_loss": -27.091327667236328, "global_step": 438183, "epoch": 5279} {"train_loss": -26.542861938476562, "global_step": 438184, "epoch": 5279} {"train_loss": -26.5487060546875, "global_step": 438185, "epoch": 5279} {"train_loss": -26.67780876159668, "global_step": 438186, "epoch": 5279} {"train_loss": -26.484643936157227, "global_step": 438187, "epoch": 5279} {"train_loss": -26.8673095703125, "global_step": 438188, "epoch": 5279} {"train_loss": -26.981830596923828, "global_step": 438189, "epoch": 5279} {"train_loss": -26.970260620117188, "global_step": 438190, "epoch": 5279} {"train_loss": -26.378095626831055, "global_step": 438191, "epoch": 5279} {"train_loss": -26.4013729095459, "global_step": 438192, "epoch": 5279} {"train_loss": -26.891315460205078, "global_step": 438193, "epoch": 5279} {"train_loss": -26.800281524658203, "global_step": 438194, "epoch": 5279} {"train_loss": -26.922494888305664, "global_step": 438195, "epoch": 5279} {"train_loss": -26.955957412719727, "global_step": 438196, "epoch": 5279} {"train_loss": -26.638477325439453, "global_step": 438197, "epoch": 5279} {"train_loss": -27.251867294311523, "global_step": 438198, "epoch": 5279} {"train_loss": -27.211257934570312, "global_step": 438199, "epoch": 5279} {"train_loss": -27.139389038085938, "global_step": 438200, "epoch": 5279} {"train_loss": -26.7600154876709, "global_step": 438201, "epoch": 5279} {"train_loss": -26.85816764831543, "global_step": 438202, "epoch": 5279} {"train_loss": -26.9954891204834, "global_step": 438203, "epoch": 5279} {"train_loss": -27.199613571166992, "global_step": 438204, "epoch": 5279} {"train_loss": -27.28595542907715, "global_step": 438205, "epoch": 5279} {"train_loss": -27.084562301635742, "global_step": 438206, "epoch": 5279} {"train_loss": -27.096500396728516, "global_step": 438207, "epoch": 5279} {"train_loss": -27.454126358032227, "global_step": 438208, "epoch": 5279} {"train_loss": -27.181854248046875, "global_step": 438209, "epoch": 5279} {"train_loss": -27.03388786315918, "global_step": 438210, "epoch": 5279} {"train_loss": -26.864887237548828, "global_step": 438211, "epoch": 5279} {"train_loss": -26.80539894104004, "global_step": 438212, "epoch": 5279} {"train_loss": -26.5855770111084, "global_step": 438213, "epoch": 5279} {"train_loss": -26.76240348815918, "global_step": 438214, "epoch": 5279} {"train_loss": -27.422199249267578, "global_step": 438215, "epoch": 5279} {"train_loss": -27.006704330444336, "global_step": 438216, "epoch": 5279} {"train_loss": -27.187833786010742, "global_step": 438217, "epoch": 5279} {"train_loss": -27.297306060791016, "global_step": 438218, "epoch": 5279} {"train_loss": -26.973281860351562, "global_step": 438219, "epoch": 5279} {"train_loss": -27.53887367248535, "global_step": 438220, "epoch": 5279} {"train_loss": -27.208393096923828, "global_step": 438221, "epoch": 5279} {"train_loss": -27.18402671813965, "global_step": 438222, "epoch": 5279} {"train_loss": -27.16131591796875, "global_step": 438223, "epoch": 5279} {"train_loss": -27.023115158081055, "global_step": 438224, "epoch": 5279} {"train_loss": -26.857267379760742, "global_step": 438225, "epoch": 5279} {"train_loss": -26.977163314819336, "global_step": 438226, "epoch": 5279} {"train_loss": -27.23440933227539, "global_step": 438227, "epoch": 5279} {"train_loss": -27.088733673095703, "global_step": 438228, "epoch": 5279} {"train_loss": -27.26605796813965, "global_step": 438229, "epoch": 5279} {"train_loss": -27.21773338317871, "global_step": 438230, "epoch": 5279} {"train_loss": -26.908849716186523, "global_step": 438231, "epoch": 5279} {"train_loss": -26.989288330078125, "global_step": 438232, "epoch": 5279} {"train_loss": -27.1167049407959, "global_step": 438233, "epoch": 5279} {"train_loss": -26.895782470703125, "global_step": 438234, "epoch": 5279} {"train_loss": -26.944049835205078, "global_step": 438235, "epoch": 5279} {"train_loss": -26.790607452392578, "global_step": 438236, "epoch": 5279} {"train_loss": -26.729841232299805, "global_step": 438237, "epoch": 5279} {"train_loss": -26.23710060119629, "global_step": 438238, "epoch": 5279} {"train_loss": -26.705234596528204, "global_step": 438239, "epoch": 5279, "val_loss": 6602571.0} {"train_loss": -23.63421058654785, "global_step": 438240, "epoch": 5280} {"train_loss": -24.02882194519043, "global_step": 438241, "epoch": 5280} {"train_loss": -24.566328048706055, "global_step": 438242, "epoch": 5280} {"train_loss": -25.516977310180664, "global_step": 438243, "epoch": 5280} {"train_loss": -24.479053497314453, "global_step": 438244, "epoch": 5280} {"train_loss": -25.768014907836914, "global_step": 438245, "epoch": 5280} {"train_loss": -24.594934463500977, "global_step": 438246, "epoch": 5280} {"train_loss": -25.3223819732666, "global_step": 438247, "epoch": 5280} {"train_loss": -25.484054565429688, "global_step": 438248, "epoch": 5280} {"train_loss": -25.535497665405273, "global_step": 438249, "epoch": 5280} {"train_loss": -25.5618896484375, "global_step": 438250, "epoch": 5280} {"train_loss": -26.055347442626953, "global_step": 438251, "epoch": 5280} {"train_loss": -25.761701583862305, "global_step": 438252, "epoch": 5280} {"train_loss": -25.903778076171875, "global_step": 438253, "epoch": 5280} {"train_loss": -25.767194747924805, "global_step": 438254, "epoch": 5280} {"train_loss": -25.8745174407959, "global_step": 438255, "epoch": 5280} {"train_loss": -25.93409538269043, "global_step": 438256, "epoch": 5280} {"train_loss": -26.232269287109375, "global_step": 438257, "epoch": 5280} {"train_loss": -26.04230308532715, "global_step": 438258, "epoch": 5280} {"train_loss": -26.10247230529785, "global_step": 438259, "epoch": 5280} {"train_loss": -26.17169189453125, "global_step": 438260, "epoch": 5280} {"train_loss": -26.316455841064453, "global_step": 438261, "epoch": 5280} {"train_loss": -26.59299659729004, "global_step": 438262, "epoch": 5280} {"train_loss": -26.228418350219727, "global_step": 438263, "epoch": 5280} {"train_loss": -26.445911407470703, "global_step": 438264, "epoch": 5280} {"train_loss": -26.50263786315918, "global_step": 438265, "epoch": 5280} {"train_loss": -26.5832576751709, "global_step": 438266, "epoch": 5280} {"train_loss": -26.46930503845215, "global_step": 438267, "epoch": 5280} {"train_loss": -26.36313247680664, "global_step": 438268, "epoch": 5280} {"train_loss": -26.285785675048828, "global_step": 438269, "epoch": 5280} {"train_loss": -26.649616241455078, "global_step": 438270, "epoch": 5280} {"train_loss": -26.810260772705078, "global_step": 438271, "epoch": 5280} {"train_loss": -26.529043197631836, "global_step": 438272, "epoch": 5280} {"train_loss": -26.795684814453125, "global_step": 438273, "epoch": 5280} {"train_loss": -26.500492095947266, "global_step": 438274, "epoch": 5280} {"train_loss": -26.531904220581055, "global_step": 438275, "epoch": 5280} {"train_loss": -26.867162704467773, "global_step": 438276, "epoch": 5280} {"train_loss": -26.9967098236084, "global_step": 438277, "epoch": 5280} {"train_loss": -26.726612091064453, "global_step": 438278, "epoch": 5280} {"train_loss": -26.53041648864746, "global_step": 438279, "epoch": 5280} {"train_loss": -26.984512329101562, "global_step": 438280, "epoch": 5280} {"train_loss": -26.760330200195312, "global_step": 438281, "epoch": 5280} {"train_loss": -26.781579971313477, "global_step": 438282, "epoch": 5280} {"train_loss": -26.9113712310791, "global_step": 438283, "epoch": 5280} {"train_loss": -26.771997451782227, "global_step": 438284, "epoch": 5280} {"train_loss": -26.9694881439209, "global_step": 438285, "epoch": 5280} {"train_loss": -26.98140525817871, "global_step": 438286, "epoch": 5280} {"train_loss": -26.9660587310791, "global_step": 438287, "epoch": 5280} {"train_loss": -27.304031372070312, "global_step": 438288, "epoch": 5280} {"train_loss": -27.183088302612305, "global_step": 438289, "epoch": 5280} {"train_loss": -27.041833877563477, "global_step": 438290, "epoch": 5280} {"train_loss": -26.897846221923828, "global_step": 438291, "epoch": 5280} {"train_loss": -26.9722957611084, "global_step": 438292, "epoch": 5280} {"train_loss": -27.437088012695312, "global_step": 438293, "epoch": 5280} {"train_loss": -26.7353458404541, "global_step": 438294, "epoch": 5280} {"train_loss": -26.957563400268555, "global_step": 438295, "epoch": 5280} {"train_loss": -26.756921768188477, "global_step": 438296, "epoch": 5280} {"train_loss": -27.153982162475586, "global_step": 438297, "epoch": 5280} {"train_loss": -26.86748695373535, "global_step": 438298, "epoch": 5280} {"train_loss": -27.00140953063965, "global_step": 438299, "epoch": 5280} {"train_loss": -26.565448760986328, "global_step": 438300, "epoch": 5280} {"train_loss": -26.660497665405273, "global_step": 438301, "epoch": 5280} {"train_loss": -26.7236385345459, "global_step": 438302, "epoch": 5280} {"train_loss": -26.910627365112305, "global_step": 438303, "epoch": 5280} {"train_loss": -27.024993896484375, "global_step": 438304, "epoch": 5280} {"train_loss": -26.953832626342773, "global_step": 438305, "epoch": 5280} {"train_loss": -26.820953369140625, "global_step": 438306, "epoch": 5280} {"train_loss": -27.17108154296875, "global_step": 438307, "epoch": 5280} {"train_loss": -26.76899528503418, "global_step": 438308, "epoch": 5280} {"train_loss": -26.899433135986328, "global_step": 438309, "epoch": 5280} {"train_loss": -26.878870010375977, "global_step": 438310, "epoch": 5280} {"train_loss": -27.26507568359375, "global_step": 438311, "epoch": 5280} {"train_loss": -27.065656661987305, "global_step": 438312, "epoch": 5280} {"train_loss": -27.214832305908203, "global_step": 438313, "epoch": 5280} {"train_loss": -26.80170249938965, "global_step": 438314, "epoch": 5280} {"train_loss": -27.019790649414062, "global_step": 438315, "epoch": 5280} {"train_loss": -27.204328536987305, "global_step": 438316, "epoch": 5280} {"train_loss": -26.938501358032227, "global_step": 438317, "epoch": 5280} {"train_loss": -26.920568466186523, "global_step": 438318, "epoch": 5280} {"train_loss": -26.853185653686523, "global_step": 438319, "epoch": 5280} {"train_loss": -27.070316314697266, "global_step": 438320, "epoch": 5280} {"train_loss": -27.11590576171875, "global_step": 438321, "epoch": 5280} {"train_loss": -26.49075979209808, "global_step": 438322, "epoch": 5280, "val_loss": 6538753.0} {"train_loss": -26.411962509155273, "global_step": 438323, "epoch": 5281} {"train_loss": -26.03274917602539, "global_step": 438324, "epoch": 5281} {"train_loss": -26.029850006103516, "global_step": 438325, "epoch": 5281} {"train_loss": -26.43722915649414, "global_step": 438326, "epoch": 5281} {"train_loss": -26.47877311706543, "global_step": 438327, "epoch": 5281} {"train_loss": -26.752460479736328, "global_step": 438328, "epoch": 5281} {"train_loss": -26.525848388671875, "global_step": 438329, "epoch": 5281} {"train_loss": -26.51948356628418, "global_step": 438330, "epoch": 5281} {"train_loss": -26.45175552368164, "global_step": 438331, "epoch": 5281} {"train_loss": -26.47210693359375, "global_step": 438332, "epoch": 5281} {"train_loss": -26.957441329956055, "global_step": 438333, "epoch": 5281} {"train_loss": -26.97267723083496, "global_step": 438334, "epoch": 5281} {"train_loss": -26.953022003173828, "global_step": 438335, "epoch": 5281} {"train_loss": -26.83827018737793, "global_step": 438336, "epoch": 5281} {"train_loss": -26.976587295532227, "global_step": 438337, "epoch": 5281} {"train_loss": -26.62396812438965, "global_step": 438338, "epoch": 5281} {"train_loss": -26.97783851623535, "global_step": 438339, "epoch": 5281} {"train_loss": -26.891977310180664, "global_step": 438340, "epoch": 5281} {"train_loss": -26.764516830444336, "global_step": 438341, "epoch": 5281} {"train_loss": -26.531753540039062, "global_step": 438342, "epoch": 5281} {"train_loss": -26.864105224609375, "global_step": 438343, "epoch": 5281} {"train_loss": -26.774423599243164, "global_step": 438344, "epoch": 5281} {"train_loss": -26.69447135925293, "global_step": 438345, "epoch": 5281} {"train_loss": -26.77750587463379, "global_step": 438346, "epoch": 5281} {"train_loss": -26.78016471862793, "global_step": 438347, "epoch": 5281} {"train_loss": -27.22242546081543, "global_step": 438348, "epoch": 5281} {"train_loss": -26.65338134765625, "global_step": 438349, "epoch": 5281} {"train_loss": -27.0623722076416, "global_step": 438350, "epoch": 5281} {"train_loss": -26.54798698425293, "global_step": 438351, "epoch": 5281} {"train_loss": -26.699050903320312, "global_step": 438352, "epoch": 5281} {"train_loss": -27.104660034179688, "global_step": 438353, "epoch": 5281} {"train_loss": -26.90850830078125, "global_step": 438354, "epoch": 5281} {"train_loss": -26.85919761657715, "global_step": 438355, "epoch": 5281} {"train_loss": -26.936872482299805, "global_step": 438356, "epoch": 5281} {"train_loss": -27.093841552734375, "global_step": 438357, "epoch": 5281} {"train_loss": -26.946393966674805, "global_step": 438358, "epoch": 5281} {"train_loss": -27.17752456665039, "global_step": 438359, "epoch": 5281} {"train_loss": -27.055307388305664, "global_step": 438360, "epoch": 5281} {"train_loss": -27.120412826538086, "global_step": 438361, "epoch": 5281} {"train_loss": -26.99091148376465, "global_step": 438362, "epoch": 5281} {"train_loss": -27.210433959960938, "global_step": 438363, "epoch": 5281} {"train_loss": -27.054777145385742, "global_step": 438364, "epoch": 5281} {"train_loss": -27.102781295776367, "global_step": 438365, "epoch": 5281} {"train_loss": -26.98402976989746, "global_step": 438366, "epoch": 5281} {"train_loss": -27.38623046875, "global_step": 438367, "epoch": 5281} {"train_loss": -27.22653579711914, "global_step": 438368, "epoch": 5281} {"train_loss": -26.7758846282959, "global_step": 438369, "epoch": 5281} {"train_loss": -26.735675811767578, "global_step": 438370, "epoch": 5281} {"train_loss": -25.963438034057617, "global_step": 438371, "epoch": 5281} {"train_loss": -26.524810791015625, "global_step": 438372, "epoch": 5281} {"train_loss": -27.2612247467041, "global_step": 438373, "epoch": 5281} {"train_loss": -26.71693992614746, "global_step": 438374, "epoch": 5281} {"train_loss": -26.68951416015625, "global_step": 438375, "epoch": 5281} {"train_loss": -27.139358520507812, "global_step": 438376, "epoch": 5281} {"train_loss": -26.510351181030273, "global_step": 438377, "epoch": 5281} {"train_loss": -26.685766220092773, "global_step": 438378, "epoch": 5281} {"train_loss": -26.580230712890625, "global_step": 438379, "epoch": 5281} {"train_loss": -26.871015548706055, "global_step": 438380, "epoch": 5281} {"train_loss": -26.49796485900879, "global_step": 438381, "epoch": 5281} {"train_loss": -26.253437042236328, "global_step": 438382, "epoch": 5281} {"train_loss": -26.9885311126709, "global_step": 438383, "epoch": 5281} {"train_loss": -26.826833724975586, "global_step": 438384, "epoch": 5281} {"train_loss": -26.42626953125, "global_step": 438385, "epoch": 5281} {"train_loss": -26.538105010986328, "global_step": 438386, "epoch": 5281} {"train_loss": -26.914997100830078, "global_step": 438387, "epoch": 5281} {"train_loss": -26.951324462890625, "global_step": 438388, "epoch": 5281} {"train_loss": -27.235366821289062, "global_step": 438389, "epoch": 5281} {"train_loss": -26.548925399780273, "global_step": 438390, "epoch": 5281} {"train_loss": -27.151697158813477, "global_step": 438391, "epoch": 5281} {"train_loss": -26.924671173095703, "global_step": 438392, "epoch": 5281} {"train_loss": -27.021900177001953, "global_step": 438393, "epoch": 5281} {"train_loss": -26.674402236938477, "global_step": 438394, "epoch": 5281} {"train_loss": -27.009296417236328, "global_step": 438395, "epoch": 5281} {"train_loss": -27.050458908081055, "global_step": 438396, "epoch": 5281} {"train_loss": -27.186664581298828, "global_step": 438397, "epoch": 5281} {"train_loss": -26.81491470336914, "global_step": 438398, "epoch": 5281} {"train_loss": -26.840356826782227, "global_step": 438399, "epoch": 5281} {"train_loss": -26.472192764282227, "global_step": 438400, "epoch": 5281} {"train_loss": -26.831884384155273, "global_step": 438401, "epoch": 5281} {"train_loss": -27.34966468811035, "global_step": 438402, "epoch": 5281} {"train_loss": -26.9941349029541, "global_step": 438403, "epoch": 5281} {"train_loss": -26.834320068359375, "global_step": 438404, "epoch": 5281} {"train_loss": -26.800909938582453, "global_step": 438405, "epoch": 5281, "val_loss": 6662630.0} {"train_loss": -26.430038452148438, "global_step": 438406, "epoch": 5282} {"train_loss": -26.51715660095215, "global_step": 438407, "epoch": 5282} {"train_loss": -26.37063980102539, "global_step": 438408, "epoch": 5282} {"train_loss": -26.20210838317871, "global_step": 438409, "epoch": 5282} {"train_loss": -26.89706802368164, "global_step": 438410, "epoch": 5282} {"train_loss": -26.406320571899414, "global_step": 438411, "epoch": 5282} {"train_loss": -26.452655792236328, "global_step": 438412, "epoch": 5282} {"train_loss": -26.61008071899414, "global_step": 438413, "epoch": 5282} {"train_loss": -26.690542221069336, "global_step": 438414, "epoch": 5282} {"train_loss": -26.87981605529785, "global_step": 438415, "epoch": 5282} {"train_loss": -27.047470092773438, "global_step": 438416, "epoch": 5282} {"train_loss": -26.84665298461914, "global_step": 438417, "epoch": 5282} {"train_loss": -26.7653865814209, "global_step": 438418, "epoch": 5282} {"train_loss": -26.744037628173828, "global_step": 438419, "epoch": 5282} {"train_loss": -27.116525650024414, "global_step": 438420, "epoch": 5282} {"train_loss": -27.066625595092773, "global_step": 438421, "epoch": 5282} {"train_loss": -26.7978515625, "global_step": 438422, "epoch": 5282} {"train_loss": -26.695913314819336, "global_step": 438423, "epoch": 5282} {"train_loss": -27.073566436767578, "global_step": 438424, "epoch": 5282} {"train_loss": -26.96417808532715, "global_step": 438425, "epoch": 5282} {"train_loss": -26.712284088134766, "global_step": 438426, "epoch": 5282} {"train_loss": -27.148929595947266, "global_step": 438427, "epoch": 5282} {"train_loss": -26.989404678344727, "global_step": 438428, "epoch": 5282} {"train_loss": -26.789342880249023, "global_step": 438429, "epoch": 5282} {"train_loss": -26.888330459594727, "global_step": 438430, "epoch": 5282} {"train_loss": -26.89676856994629, "global_step": 438431, "epoch": 5282} {"train_loss": -26.641660690307617, "global_step": 438432, "epoch": 5282} {"train_loss": -27.255399703979492, "global_step": 438433, "epoch": 5282} {"train_loss": -27.138874053955078, "global_step": 438434, "epoch": 5282} {"train_loss": -27.270963668823242, "global_step": 438435, "epoch": 5282} {"train_loss": -27.08258056640625, "global_step": 438436, "epoch": 5282} {"train_loss": -27.24115562438965, "global_step": 438437, "epoch": 5282} {"train_loss": -27.328826904296875, "global_step": 438438, "epoch": 5282} {"train_loss": -27.04269790649414, "global_step": 438439, "epoch": 5282} {"train_loss": -27.037586212158203, "global_step": 438440, "epoch": 5282} {"train_loss": -26.964954376220703, "global_step": 438441, "epoch": 5282} {"train_loss": -27.051008224487305, "global_step": 438442, "epoch": 5282} {"train_loss": -27.463459014892578, "global_step": 438443, "epoch": 5282} {"train_loss": -27.280914306640625, "global_step": 438444, "epoch": 5282} {"train_loss": -27.149580001831055, "global_step": 438445, "epoch": 5282} {"train_loss": -26.96784782409668, "global_step": 438446, "epoch": 5282} {"train_loss": -26.6545467376709, "global_step": 438447, "epoch": 5282} {"train_loss": -26.950769424438477, "global_step": 438448, "epoch": 5282} {"train_loss": -27.444684982299805, "global_step": 438449, "epoch": 5282} {"train_loss": -26.803070068359375, "global_step": 438450, "epoch": 5282} {"train_loss": -26.941761016845703, "global_step": 438451, "epoch": 5282} {"train_loss": -26.569318771362305, "global_step": 438452, "epoch": 5282} {"train_loss": -26.771108627319336, "global_step": 438453, "epoch": 5282} {"train_loss": -26.9998722076416, "global_step": 438454, "epoch": 5282} {"train_loss": -26.92532730102539, "global_step": 438455, "epoch": 5282} {"train_loss": -26.63901710510254, "global_step": 438456, "epoch": 5282} {"train_loss": -26.839445114135742, "global_step": 438457, "epoch": 5282} {"train_loss": -26.657886505126953, "global_step": 438458, "epoch": 5282} {"train_loss": -26.305423736572266, "global_step": 438459, "epoch": 5282} {"train_loss": -26.7340145111084, "global_step": 438460, "epoch": 5282} {"train_loss": -26.715728759765625, "global_step": 438461, "epoch": 5282} {"train_loss": -26.53549575805664, "global_step": 438462, "epoch": 5282} {"train_loss": -26.802051544189453, "global_step": 438463, "epoch": 5282} {"train_loss": -26.545764923095703, "global_step": 438464, "epoch": 5282} {"train_loss": -26.793319702148438, "global_step": 438465, "epoch": 5282} {"train_loss": -26.880115509033203, "global_step": 438466, "epoch": 5282} {"train_loss": -26.711008071899414, "global_step": 438467, "epoch": 5282} {"train_loss": -27.12298011779785, "global_step": 438468, "epoch": 5282} {"train_loss": -26.7093505859375, "global_step": 438469, "epoch": 5282} {"train_loss": -27.099390029907227, "global_step": 438470, "epoch": 5282} {"train_loss": -27.103723526000977, "global_step": 438471, "epoch": 5282} {"train_loss": -26.720869064331055, "global_step": 438472, "epoch": 5282} {"train_loss": -26.685871124267578, "global_step": 438473, "epoch": 5282} {"train_loss": -26.999744415283203, "global_step": 438474, "epoch": 5282} {"train_loss": -26.573654174804688, "global_step": 438475, "epoch": 5282} {"train_loss": -26.78885269165039, "global_step": 438476, "epoch": 5282} {"train_loss": -26.892484664916992, "global_step": 438477, "epoch": 5282} {"train_loss": -26.9040470123291, "global_step": 438478, "epoch": 5282} {"train_loss": -27.112945556640625, "global_step": 438479, "epoch": 5282} {"train_loss": -26.54227066040039, "global_step": 438480, "epoch": 5282} {"train_loss": -26.7973690032959, "global_step": 438481, "epoch": 5282} {"train_loss": -26.815820693969727, "global_step": 438482, "epoch": 5282} {"train_loss": -26.83051109313965, "global_step": 438483, "epoch": 5282} {"train_loss": -26.9566650390625, "global_step": 438484, "epoch": 5282} {"train_loss": -26.76788330078125, "global_step": 438485, "epoch": 5282} {"train_loss": -27.05322265625, "global_step": 438486, "epoch": 5282} {"train_loss": -27.121191024780273, "global_step": 438487, "epoch": 5282} {"train_loss": -26.892927468541156, "global_step": 438488, "epoch": 5282, "val_loss": 6597602.0} {"train_loss": -24.7393856048584, "global_step": 438489, "epoch": 5283} {"train_loss": -26.78534507751465, "global_step": 438490, "epoch": 5283} {"train_loss": -25.564956665039062, "global_step": 438491, "epoch": 5283} {"train_loss": -26.118743896484375, "global_step": 438492, "epoch": 5283} {"train_loss": -25.639850616455078, "global_step": 438493, "epoch": 5283} {"train_loss": -24.871551513671875, "global_step": 438494, "epoch": 5283} {"train_loss": -25.286603927612305, "global_step": 438495, "epoch": 5283} {"train_loss": -25.885549545288086, "global_step": 438496, "epoch": 5283} {"train_loss": -26.37679100036621, "global_step": 438497, "epoch": 5283} {"train_loss": -25.817914962768555, "global_step": 438498, "epoch": 5283} {"train_loss": -26.147443771362305, "global_step": 438499, "epoch": 5283} {"train_loss": -26.141645431518555, "global_step": 438500, "epoch": 5283} {"train_loss": -26.376697540283203, "global_step": 438501, "epoch": 5283} {"train_loss": -26.029510498046875, "global_step": 438502, "epoch": 5283} {"train_loss": -26.770544052124023, "global_step": 438503, "epoch": 5283} {"train_loss": -26.32379150390625, "global_step": 438504, "epoch": 5283} {"train_loss": -26.518651962280273, "global_step": 438505, "epoch": 5283} {"train_loss": -26.406171798706055, "global_step": 438506, "epoch": 5283} {"train_loss": -26.142866134643555, "global_step": 438507, "epoch": 5283} {"train_loss": -26.327295303344727, "global_step": 438508, "epoch": 5283} {"train_loss": -26.49371337890625, "global_step": 438509, "epoch": 5283} {"train_loss": -26.452356338500977, "global_step": 438510, "epoch": 5283} {"train_loss": -26.657489776611328, "global_step": 438511, "epoch": 5283} {"train_loss": -26.581378936767578, "global_step": 438512, "epoch": 5283} {"train_loss": -26.76446533203125, "global_step": 438513, "epoch": 5283} {"train_loss": -26.595478057861328, "global_step": 438514, "epoch": 5283} {"train_loss": -26.7654972076416, "global_step": 438515, "epoch": 5283} {"train_loss": -26.79444694519043, "global_step": 438516, "epoch": 5283} {"train_loss": -26.73939323425293, "global_step": 438517, "epoch": 5283} {"train_loss": -26.43710708618164, "global_step": 438518, "epoch": 5283} {"train_loss": -27.174848556518555, "global_step": 438519, "epoch": 5283} {"train_loss": -26.519092559814453, "global_step": 438520, "epoch": 5283} {"train_loss": -26.64039421081543, "global_step": 438521, "epoch": 5283} {"train_loss": -26.930606842041016, "global_step": 438522, "epoch": 5283} {"train_loss": -26.859521865844727, "global_step": 438523, "epoch": 5283} {"train_loss": -27.06854248046875, "global_step": 438524, "epoch": 5283} {"train_loss": -27.0892276763916, "global_step": 438525, "epoch": 5283} {"train_loss": -27.084325790405273, "global_step": 438526, "epoch": 5283} {"train_loss": -27.005603790283203, "global_step": 438527, "epoch": 5283} {"train_loss": -26.9650936126709, "global_step": 438528, "epoch": 5283} {"train_loss": -27.1593017578125, "global_step": 438529, "epoch": 5283} {"train_loss": -26.9526424407959, "global_step": 438530, "epoch": 5283} {"train_loss": -27.307830810546875, "global_step": 438531, "epoch": 5283} {"train_loss": -26.97779655456543, "global_step": 438532, "epoch": 5283} {"train_loss": -27.158096313476562, "global_step": 438533, "epoch": 5283} {"train_loss": -27.26216697692871, "global_step": 438534, "epoch": 5283} {"train_loss": -27.218921661376953, "global_step": 438535, "epoch": 5283} {"train_loss": -27.33949089050293, "global_step": 438536, "epoch": 5283} {"train_loss": -27.107030868530273, "global_step": 438537, "epoch": 5283} {"train_loss": -27.071043014526367, "global_step": 438538, "epoch": 5283} {"train_loss": -27.306005477905273, "global_step": 438539, "epoch": 5283} {"train_loss": -27.44281578063965, "global_step": 438540, "epoch": 5283} {"train_loss": -26.838781356811523, "global_step": 438541, "epoch": 5283} {"train_loss": -27.08173942565918, "global_step": 438542, "epoch": 5283} {"train_loss": -27.491458892822266, "global_step": 438543, "epoch": 5283} {"train_loss": -26.7499942779541, "global_step": 438544, "epoch": 5283} {"train_loss": -27.1134033203125, "global_step": 438545, "epoch": 5283} {"train_loss": -27.247602462768555, "global_step": 438546, "epoch": 5283} {"train_loss": -27.751874923706055, "global_step": 438547, "epoch": 5283} {"train_loss": -26.80852699279785, "global_step": 438548, "epoch": 5283} {"train_loss": -27.00838279724121, "global_step": 438549, "epoch": 5283} {"train_loss": -26.875110626220703, "global_step": 438550, "epoch": 5283} {"train_loss": -27.2689266204834, "global_step": 438551, "epoch": 5283} {"train_loss": -26.45477294921875, "global_step": 438552, "epoch": 5283} {"train_loss": -26.425399780273438, "global_step": 438553, "epoch": 5283} {"train_loss": -25.67401695251465, "global_step": 438554, "epoch": 5283} {"train_loss": -25.44232749938965, "global_step": 438555, "epoch": 5283} {"train_loss": -26.199201583862305, "global_step": 438556, "epoch": 5283} {"train_loss": -26.500059127807617, "global_step": 438557, "epoch": 5283} {"train_loss": -26.16505241394043, "global_step": 438558, "epoch": 5283} {"train_loss": -26.255781173706055, "global_step": 438559, "epoch": 5283} {"train_loss": -26.589319229125977, "global_step": 438560, "epoch": 5283} {"train_loss": -26.371231079101562, "global_step": 438561, "epoch": 5283} {"train_loss": -26.707157135009766, "global_step": 438562, "epoch": 5283} {"train_loss": -26.83893394470215, "global_step": 438563, "epoch": 5283} {"train_loss": -26.17572593688965, "global_step": 438564, "epoch": 5283} {"train_loss": -27.059858322143555, "global_step": 438565, "epoch": 5283} {"train_loss": -26.839187622070312, "global_step": 438566, "epoch": 5283} {"train_loss": -26.420185089111328, "global_step": 438567, "epoch": 5283} {"train_loss": -26.73763084411621, "global_step": 438568, "epoch": 5283} {"train_loss": -26.703601837158203, "global_step": 438569, "epoch": 5283} {"train_loss": -26.709659576416016, "global_step": 438570, "epoch": 5283} {"train_loss": -26.613066592848444, "global_step": 438571, "epoch": 5283, "val_loss": 6621710.5} {"train_loss": -24.960025787353516, "global_step": 438572, "epoch": 5284} {"train_loss": -25.83723258972168, "global_step": 438573, "epoch": 5284} {"train_loss": -26.41033935546875, "global_step": 438574, "epoch": 5284} {"train_loss": -25.553558349609375, "global_step": 438575, "epoch": 5284} {"train_loss": -26.296545028686523, "global_step": 438576, "epoch": 5284} {"train_loss": -25.805662155151367, "global_step": 438577, "epoch": 5284} {"train_loss": -26.015348434448242, "global_step": 438578, "epoch": 5284} {"train_loss": -26.269983291625977, "global_step": 438579, "epoch": 5284} {"train_loss": -25.837182998657227, "global_step": 438580, "epoch": 5284} {"train_loss": -26.15089225769043, "global_step": 438581, "epoch": 5284} {"train_loss": -26.149805068969727, "global_step": 438582, "epoch": 5284} {"train_loss": -25.96843910217285, "global_step": 438583, "epoch": 5284} {"train_loss": -26.6323184967041, "global_step": 438584, "epoch": 5284} {"train_loss": -26.331457138061523, "global_step": 438585, "epoch": 5284} {"train_loss": -26.3656005859375, "global_step": 438586, "epoch": 5284} {"train_loss": -26.596593856811523, "global_step": 438587, "epoch": 5284} {"train_loss": -26.357797622680664, "global_step": 438588, "epoch": 5284} {"train_loss": -26.531097412109375, "global_step": 438589, "epoch": 5284} {"train_loss": -26.654773712158203, "global_step": 438590, "epoch": 5284} {"train_loss": -26.596073150634766, "global_step": 438591, "epoch": 5284} {"train_loss": -26.81691551208496, "global_step": 438592, "epoch": 5284} {"train_loss": -26.58668327331543, "global_step": 438593, "epoch": 5284} {"train_loss": -27.045278549194336, "global_step": 438594, "epoch": 5284} {"train_loss": -26.543630599975586, "global_step": 438595, "epoch": 5284} {"train_loss": -27.345218658447266, "global_step": 438596, "epoch": 5284} {"train_loss": -26.73678970336914, "global_step": 438597, "epoch": 5284} {"train_loss": -26.859766006469727, "global_step": 438598, "epoch": 5284} {"train_loss": -26.972639083862305, "global_step": 438599, "epoch": 5284} {"train_loss": -26.70672035217285, "global_step": 438600, "epoch": 5284} {"train_loss": -26.676166534423828, "global_step": 438601, "epoch": 5284} {"train_loss": -26.85465431213379, "global_step": 438602, "epoch": 5284} {"train_loss": -27.16062355041504, "global_step": 438603, "epoch": 5284} {"train_loss": -27.02640151977539, "global_step": 438604, "epoch": 5284} {"train_loss": -27.369815826416016, "global_step": 438605, "epoch": 5284} {"train_loss": -26.79245376586914, "global_step": 438606, "epoch": 5284} {"train_loss": -27.203840255737305, "global_step": 438607, "epoch": 5284} {"train_loss": -26.85126304626465, "global_step": 438608, "epoch": 5284} {"train_loss": -26.855224609375, "global_step": 438609, "epoch": 5284} {"train_loss": -27.252368927001953, "global_step": 438610, "epoch": 5284} {"train_loss": -26.984289169311523, "global_step": 438611, "epoch": 5284} {"train_loss": -27.30213737487793, "global_step": 438612, "epoch": 5284} {"train_loss": -27.3784122467041, "global_step": 438613, "epoch": 5284} {"train_loss": -27.093908309936523, "global_step": 438614, "epoch": 5284} {"train_loss": -26.72638511657715, "global_step": 438615, "epoch": 5284} {"train_loss": -27.160486221313477, "global_step": 438616, "epoch": 5284} {"train_loss": -27.0283203125, "global_step": 438617, "epoch": 5284} {"train_loss": -26.87567710876465, "global_step": 438618, "epoch": 5284} {"train_loss": -26.917036056518555, "global_step": 438619, "epoch": 5284} {"train_loss": -26.811237335205078, "global_step": 438620, "epoch": 5284} {"train_loss": -26.976484298706055, "global_step": 438621, "epoch": 5284} {"train_loss": -26.682941436767578, "global_step": 438622, "epoch": 5284} {"train_loss": -27.1242618560791, "global_step": 438623, "epoch": 5284} {"train_loss": -26.8934268951416, "global_step": 438624, "epoch": 5284} {"train_loss": -26.74480628967285, "global_step": 438625, "epoch": 5284} {"train_loss": -26.889249801635742, "global_step": 438626, "epoch": 5284} {"train_loss": -27.17169189453125, "global_step": 438627, "epoch": 5284} {"train_loss": -26.769819259643555, "global_step": 438628, "epoch": 5284} {"train_loss": -26.77802085876465, "global_step": 438629, "epoch": 5284} {"train_loss": -27.113204956054688, "global_step": 438630, "epoch": 5284} {"train_loss": -27.02021598815918, "global_step": 438631, "epoch": 5284} {"train_loss": -27.059619903564453, "global_step": 438632, "epoch": 5284} {"train_loss": -27.165124893188477, "global_step": 438633, "epoch": 5284} {"train_loss": -27.13361930847168, "global_step": 438634, "epoch": 5284} {"train_loss": -26.978336334228516, "global_step": 438635, "epoch": 5284} {"train_loss": -27.389179229736328, "global_step": 438636, "epoch": 5284} {"train_loss": -27.0948543548584, "global_step": 438637, "epoch": 5284} {"train_loss": -27.173513412475586, "global_step": 438638, "epoch": 5284} {"train_loss": -27.310306549072266, "global_step": 438639, "epoch": 5284} {"train_loss": -27.037809371948242, "global_step": 438640, "epoch": 5284} {"train_loss": -27.381134033203125, "global_step": 438641, "epoch": 5284} {"train_loss": -27.072769165039062, "global_step": 438642, "epoch": 5284} {"train_loss": -26.849637985229492, "global_step": 438643, "epoch": 5284} {"train_loss": -27.030445098876953, "global_step": 438644, "epoch": 5284} {"train_loss": -26.99566078186035, "global_step": 438645, "epoch": 5284} {"train_loss": -27.226171493530273, "global_step": 438646, "epoch": 5284} {"train_loss": -27.012531280517578, "global_step": 438647, "epoch": 5284} {"train_loss": -26.81439208984375, "global_step": 438648, "epoch": 5284} {"train_loss": -26.847442626953125, "global_step": 438649, "epoch": 5284} {"train_loss": -27.22614097595215, "global_step": 438650, "epoch": 5284} {"train_loss": -27.1948184967041, "global_step": 438651, "epoch": 5284} {"train_loss": -27.336530685424805, "global_step": 438652, "epoch": 5284} {"train_loss": -26.499704360961914, "global_step": 438653, "epoch": 5284} {"train_loss": -26.79275257616158, "global_step": 438654, "epoch": 5284, "val_loss": 6585054.5} {"train_loss": -26.534698486328125, "global_step": 438655, "epoch": 5285} {"train_loss": -26.506086349487305, "global_step": 438656, "epoch": 5285} {"train_loss": -25.81159019470215, "global_step": 438657, "epoch": 5285} {"train_loss": -26.58978843688965, "global_step": 438658, "epoch": 5285} {"train_loss": -26.2906551361084, "global_step": 438659, "epoch": 5285} {"train_loss": -25.731592178344727, "global_step": 438660, "epoch": 5285} {"train_loss": -26.808923721313477, "global_step": 438661, "epoch": 5285} {"train_loss": -26.19795799255371, "global_step": 438662, "epoch": 5285} {"train_loss": -26.06463623046875, "global_step": 438663, "epoch": 5285} {"train_loss": -26.489547729492188, "global_step": 438664, "epoch": 5285} {"train_loss": -26.362207412719727, "global_step": 438665, "epoch": 5285} {"train_loss": -26.5673885345459, "global_step": 438666, "epoch": 5285} {"train_loss": -26.588565826416016, "global_step": 438667, "epoch": 5285} {"train_loss": -27.052793502807617, "global_step": 438668, "epoch": 5285} {"train_loss": -26.56268882751465, "global_step": 438669, "epoch": 5285} {"train_loss": -27.175947189331055, "global_step": 438670, "epoch": 5285} {"train_loss": -26.675586700439453, "global_step": 438671, "epoch": 5285} {"train_loss": -26.7661190032959, "global_step": 438672, "epoch": 5285} {"train_loss": -26.8483943939209, "global_step": 438673, "epoch": 5285} {"train_loss": -26.832971572875977, "global_step": 438674, "epoch": 5285} {"train_loss": -26.532888412475586, "global_step": 438675, "epoch": 5285} {"train_loss": -26.619129180908203, "global_step": 438676, "epoch": 5285} {"train_loss": -26.957233428955078, "global_step": 438677, "epoch": 5285} {"train_loss": -26.921051025390625, "global_step": 438678, "epoch": 5285} {"train_loss": -26.879352569580078, "global_step": 438679, "epoch": 5285} {"train_loss": -27.07675552368164, "global_step": 438680, "epoch": 5285} {"train_loss": -26.947193145751953, "global_step": 438681, "epoch": 5285} {"train_loss": -27.01910400390625, "global_step": 438682, "epoch": 5285} {"train_loss": -26.638227462768555, "global_step": 438683, "epoch": 5285} {"train_loss": -26.962207794189453, "global_step": 438684, "epoch": 5285} {"train_loss": -26.707782745361328, "global_step": 438685, "epoch": 5285} {"train_loss": -27.089563369750977, "global_step": 438686, "epoch": 5285} {"train_loss": -26.556039810180664, "global_step": 438687, "epoch": 5285} {"train_loss": -26.361326217651367, "global_step": 438688, "epoch": 5285} {"train_loss": -26.629425048828125, "global_step": 438689, "epoch": 5285} {"train_loss": -26.847192764282227, "global_step": 438690, "epoch": 5285} {"train_loss": -26.646472930908203, "global_step": 438691, "epoch": 5285} {"train_loss": -26.850479125976562, "global_step": 438692, "epoch": 5285} {"train_loss": -26.750213623046875, "global_step": 438693, "epoch": 5285} {"train_loss": -27.07256507873535, "global_step": 438694, "epoch": 5285} {"train_loss": -27.016738891601562, "global_step": 438695, "epoch": 5285} {"train_loss": -26.901691436767578, "global_step": 438696, "epoch": 5285} {"train_loss": -26.9338321685791, "global_step": 438697, "epoch": 5285} {"train_loss": -26.963953018188477, "global_step": 438698, "epoch": 5285} {"train_loss": -26.9753360748291, "global_step": 438699, "epoch": 5285} {"train_loss": -27.1332950592041, "global_step": 438700, "epoch": 5285} {"train_loss": -27.0915470123291, "global_step": 438701, "epoch": 5285} {"train_loss": -26.976898193359375, "global_step": 438702, "epoch": 5285} {"train_loss": -26.567243576049805, "global_step": 438703, "epoch": 5285} {"train_loss": -27.03230094909668, "global_step": 438704, "epoch": 5285} {"train_loss": -26.798892974853516, "global_step": 438705, "epoch": 5285} {"train_loss": -26.990034103393555, "global_step": 438706, "epoch": 5285} {"train_loss": -26.917699813842773, "global_step": 438707, "epoch": 5285} {"train_loss": -27.02841567993164, "global_step": 438708, "epoch": 5285} {"train_loss": -27.048755645751953, "global_step": 438709, "epoch": 5285} {"train_loss": -26.95655632019043, "global_step": 438710, "epoch": 5285} {"train_loss": -26.96625328063965, "global_step": 438711, "epoch": 5285} {"train_loss": -26.987390518188477, "global_step": 438712, "epoch": 5285} {"train_loss": -26.98675537109375, "global_step": 438713, "epoch": 5285} {"train_loss": -27.11896324157715, "global_step": 438714, "epoch": 5285} {"train_loss": -26.849716186523438, "global_step": 438715, "epoch": 5285} {"train_loss": -26.954870223999023, "global_step": 438716, "epoch": 5285} {"train_loss": -26.8057861328125, "global_step": 438717, "epoch": 5285} {"train_loss": -27.08231544494629, "global_step": 438718, "epoch": 5285} {"train_loss": -27.50302505493164, "global_step": 438719, "epoch": 5285} {"train_loss": -26.870351791381836, "global_step": 438720, "epoch": 5285} {"train_loss": -27.128173828125, "global_step": 438721, "epoch": 5285} {"train_loss": -27.1451358795166, "global_step": 438722, "epoch": 5285} {"train_loss": -27.089086532592773, "global_step": 438723, "epoch": 5285} {"train_loss": -26.82198143005371, "global_step": 438724, "epoch": 5285} {"train_loss": -27.275802612304688, "global_step": 438725, "epoch": 5285} {"train_loss": -26.810287475585938, "global_step": 438726, "epoch": 5285} {"train_loss": -27.367822647094727, "global_step": 438727, "epoch": 5285} {"train_loss": -26.832639694213867, "global_step": 438728, "epoch": 5285} {"train_loss": -26.844512939453125, "global_step": 438729, "epoch": 5285} {"train_loss": -26.45765495300293, "global_step": 438730, "epoch": 5285} {"train_loss": -27.09149742126465, "global_step": 438731, "epoch": 5285} {"train_loss": -26.92152214050293, "global_step": 438732, "epoch": 5285} {"train_loss": -26.91864013671875, "global_step": 438733, "epoch": 5285} {"train_loss": -27.19025230407715, "global_step": 438734, "epoch": 5285} {"train_loss": -27.077795028686523, "global_step": 438735, "epoch": 5285} {"train_loss": -27.34815788269043, "global_step": 438736, "epoch": 5285} {"train_loss": -26.84391458350492, "global_step": 438737, "epoch": 5285, "val_loss": 6583271.0} {"train_loss": -26.002700805664062, "global_step": 438738, "epoch": 5286} {"train_loss": -25.63112449645996, "global_step": 438739, "epoch": 5286} {"train_loss": -25.22875213623047, "global_step": 438740, "epoch": 5286} {"train_loss": -26.2529296875, "global_step": 438741, "epoch": 5286} {"train_loss": -26.316511154174805, "global_step": 438742, "epoch": 5286} {"train_loss": -26.297576904296875, "global_step": 438743, "epoch": 5286} {"train_loss": -26.1795711517334, "global_step": 438744, "epoch": 5286} {"train_loss": -26.463748931884766, "global_step": 438745, "epoch": 5286} {"train_loss": -26.094099044799805, "global_step": 438746, "epoch": 5286} {"train_loss": -26.457944869995117, "global_step": 438747, "epoch": 5286} {"train_loss": -26.222944259643555, "global_step": 438748, "epoch": 5286} {"train_loss": -26.59844970703125, "global_step": 438749, "epoch": 5286} {"train_loss": -26.4323787689209, "global_step": 438750, "epoch": 5286} {"train_loss": -26.826379776000977, "global_step": 438751, "epoch": 5286} {"train_loss": -26.7539119720459, "global_step": 438752, "epoch": 5286} {"train_loss": -26.699186325073242, "global_step": 438753, "epoch": 5286} {"train_loss": -26.65275001525879, "global_step": 438754, "epoch": 5286} {"train_loss": -26.708709716796875, "global_step": 438755, "epoch": 5286} {"train_loss": -26.61687660217285, "global_step": 438756, "epoch": 5286} {"train_loss": -26.71864128112793, "global_step": 438757, "epoch": 5286} {"train_loss": -26.795001983642578, "global_step": 438758, "epoch": 5286} {"train_loss": -26.98380470275879, "global_step": 438759, "epoch": 5286} {"train_loss": -27.207273483276367, "global_step": 438760, "epoch": 5286} {"train_loss": -27.02542495727539, "global_step": 438761, "epoch": 5286} {"train_loss": -27.349149703979492, "global_step": 438762, "epoch": 5286} {"train_loss": -26.99995231628418, "global_step": 438763, "epoch": 5286} {"train_loss": -26.93805503845215, "global_step": 438764, "epoch": 5286} {"train_loss": -26.92184829711914, "global_step": 438765, "epoch": 5286} {"train_loss": -27.30849266052246, "global_step": 438766, "epoch": 5286} {"train_loss": -27.18830680847168, "global_step": 438767, "epoch": 5286} {"train_loss": -27.299158096313477, "global_step": 438768, "epoch": 5286} {"train_loss": -26.7993221282959, "global_step": 438769, "epoch": 5286} {"train_loss": -26.838544845581055, "global_step": 438770, "epoch": 5286} {"train_loss": -27.146320343017578, "global_step": 438771, "epoch": 5286} {"train_loss": -26.96454429626465, "global_step": 438772, "epoch": 5286} {"train_loss": -26.95353126525879, "global_step": 438773, "epoch": 5286} {"train_loss": -27.30030632019043, "global_step": 438774, "epoch": 5286} {"train_loss": -27.094165802001953, "global_step": 438775, "epoch": 5286} {"train_loss": -27.370285034179688, "global_step": 438776, "epoch": 5286} {"train_loss": -27.369232177734375, "global_step": 438777, "epoch": 5286} {"train_loss": -26.718381881713867, "global_step": 438778, "epoch": 5286} {"train_loss": -27.164011001586914, "global_step": 438779, "epoch": 5286} {"train_loss": -27.238317489624023, "global_step": 438780, "epoch": 5286} {"train_loss": -26.811670303344727, "global_step": 438781, "epoch": 5286} {"train_loss": -27.433820724487305, "global_step": 438782, "epoch": 5286} {"train_loss": -27.36687660217285, "global_step": 438783, "epoch": 5286} {"train_loss": -27.29120445251465, "global_step": 438784, "epoch": 5286} {"train_loss": -27.058135986328125, "global_step": 438785, "epoch": 5286} {"train_loss": -27.020416259765625, "global_step": 438786, "epoch": 5286} {"train_loss": -27.098987579345703, "global_step": 438787, "epoch": 5286} {"train_loss": -26.560577392578125, "global_step": 438788, "epoch": 5286} {"train_loss": -26.838516235351562, "global_step": 438789, "epoch": 5286} {"train_loss": -26.806615829467773, "global_step": 438790, "epoch": 5286} {"train_loss": -27.063634872436523, "global_step": 438791, "epoch": 5286} {"train_loss": -27.535816192626953, "global_step": 438792, "epoch": 5286} {"train_loss": -26.8757381439209, "global_step": 438793, "epoch": 5286} {"train_loss": -27.23554801940918, "global_step": 438794, "epoch": 5286} {"train_loss": -26.842947006225586, "global_step": 438795, "epoch": 5286} {"train_loss": -27.10761070251465, "global_step": 438796, "epoch": 5286} {"train_loss": -27.174131393432617, "global_step": 438797, "epoch": 5286} {"train_loss": -26.81818199157715, "global_step": 438798, "epoch": 5286} {"train_loss": -26.930023193359375, "global_step": 438799, "epoch": 5286} {"train_loss": -27.038654327392578, "global_step": 438800, "epoch": 5286} {"train_loss": -26.93097496032715, "global_step": 438801, "epoch": 5286} {"train_loss": -26.62929344177246, "global_step": 438802, "epoch": 5286} {"train_loss": -26.591062545776367, "global_step": 438803, "epoch": 5286} {"train_loss": -26.531055450439453, "global_step": 438804, "epoch": 5286} {"train_loss": -26.2340087890625, "global_step": 438805, "epoch": 5286} {"train_loss": -26.60782814025879, "global_step": 438806, "epoch": 5286} {"train_loss": -26.886884689331055, "global_step": 438807, "epoch": 5286} {"train_loss": -26.8328800201416, "global_step": 438808, "epoch": 5286} {"train_loss": -26.70734214782715, "global_step": 438809, "epoch": 5286} {"train_loss": -26.659963607788086, "global_step": 438810, "epoch": 5286} {"train_loss": -26.798730850219727, "global_step": 438811, "epoch": 5286} {"train_loss": -26.505247116088867, "global_step": 438812, "epoch": 5286} {"train_loss": -26.828266143798828, "global_step": 438813, "epoch": 5286} {"train_loss": -26.603647232055664, "global_step": 438814, "epoch": 5286} {"train_loss": -26.832324981689453, "global_step": 438815, "epoch": 5286} {"train_loss": -26.503637313842773, "global_step": 438816, "epoch": 5286} {"train_loss": -26.37744140625, "global_step": 438817, "epoch": 5286} {"train_loss": -26.462888717651367, "global_step": 438818, "epoch": 5286} {"train_loss": -26.895919799804688, "global_step": 438819, "epoch": 5286} {"train_loss": -26.785544659717974, "global_step": 438820, "epoch": 5286, "val_loss": 6679196.0} {"train_loss": -25.569664001464844, "global_step": 438821, "epoch": 5287} {"train_loss": -24.712066650390625, "global_step": 438822, "epoch": 5287} {"train_loss": -26.071487426757812, "global_step": 438823, "epoch": 5287} {"train_loss": -26.329145431518555, "global_step": 438824, "epoch": 5287} {"train_loss": -26.033777236938477, "global_step": 438825, "epoch": 5287} {"train_loss": -26.423980712890625, "global_step": 438826, "epoch": 5287} {"train_loss": -26.116806030273438, "global_step": 438827, "epoch": 5287} {"train_loss": -25.975330352783203, "global_step": 438828, "epoch": 5287} {"train_loss": -26.414846420288086, "global_step": 438829, "epoch": 5287} {"train_loss": -26.508703231811523, "global_step": 438830, "epoch": 5287} {"train_loss": -26.539459228515625, "global_step": 438831, "epoch": 5287} {"train_loss": -26.635425567626953, "global_step": 438832, "epoch": 5287} {"train_loss": -26.7362003326416, "global_step": 438833, "epoch": 5287} {"train_loss": -26.5068359375, "global_step": 438834, "epoch": 5287} {"train_loss": -26.531240463256836, "global_step": 438835, "epoch": 5287} {"train_loss": -26.63409423828125, "global_step": 438836, "epoch": 5287} {"train_loss": -26.270618438720703, "global_step": 438837, "epoch": 5287} {"train_loss": -26.442224502563477, "global_step": 438838, "epoch": 5287} {"train_loss": -26.56497573852539, "global_step": 438839, "epoch": 5287} {"train_loss": -26.652997970581055, "global_step": 438840, "epoch": 5287} {"train_loss": -26.68763542175293, "global_step": 438841, "epoch": 5287} {"train_loss": -27.0750675201416, "global_step": 438842, "epoch": 5287} {"train_loss": -26.810699462890625, "global_step": 438843, "epoch": 5287} {"train_loss": -26.910017013549805, "global_step": 438844, "epoch": 5287} {"train_loss": -26.8612117767334, "global_step": 438845, "epoch": 5287} {"train_loss": -26.601179122924805, "global_step": 438846, "epoch": 5287} {"train_loss": -26.985553741455078, "global_step": 438847, "epoch": 5287} {"train_loss": -26.97535514831543, "global_step": 438848, "epoch": 5287} {"train_loss": -26.671964645385742, "global_step": 438849, "epoch": 5287} {"train_loss": -27.29140281677246, "global_step": 438850, "epoch": 5287} {"train_loss": -26.87774658203125, "global_step": 438851, "epoch": 5287} {"train_loss": -27.00103759765625, "global_step": 438852, "epoch": 5287} {"train_loss": -27.093297958374023, "global_step": 438853, "epoch": 5287} {"train_loss": -26.9100284576416, "global_step": 438854, "epoch": 5287} {"train_loss": -27.18149185180664, "global_step": 438855, "epoch": 5287} {"train_loss": -26.95960807800293, "global_step": 438856, "epoch": 5287} {"train_loss": -26.453689575195312, "global_step": 438857, "epoch": 5287} {"train_loss": -27.56113052368164, "global_step": 438858, "epoch": 5287} {"train_loss": -27.0677547454834, "global_step": 438859, "epoch": 5287} {"train_loss": -26.80194091796875, "global_step": 438860, "epoch": 5287} {"train_loss": -27.015546798706055, "global_step": 438861, "epoch": 5287} {"train_loss": -26.683340072631836, "global_step": 438862, "epoch": 5287} {"train_loss": -26.560443878173828, "global_step": 438863, "epoch": 5287} {"train_loss": -26.727155685424805, "global_step": 438864, "epoch": 5287} {"train_loss": -27.082242965698242, "global_step": 438865, "epoch": 5287} {"train_loss": -26.8664608001709, "global_step": 438866, "epoch": 5287} {"train_loss": -26.5877628326416, "global_step": 438867, "epoch": 5287} {"train_loss": -26.96839714050293, "global_step": 438868, "epoch": 5287} {"train_loss": -26.627105712890625, "global_step": 438869, "epoch": 5287} {"train_loss": -26.902612686157227, "global_step": 438870, "epoch": 5287} {"train_loss": -26.83436393737793, "global_step": 438871, "epoch": 5287} {"train_loss": -26.53010368347168, "global_step": 438872, "epoch": 5287} {"train_loss": -27.043176651000977, "global_step": 438873, "epoch": 5287} {"train_loss": -26.928821563720703, "global_step": 438874, "epoch": 5287} {"train_loss": -26.948511123657227, "global_step": 438875, "epoch": 5287} {"train_loss": -26.48883056640625, "global_step": 438876, "epoch": 5287} {"train_loss": -27.009658813476562, "global_step": 438877, "epoch": 5287} {"train_loss": -26.975934982299805, "global_step": 438878, "epoch": 5287} {"train_loss": -26.788915634155273, "global_step": 438879, "epoch": 5287} {"train_loss": -26.45094108581543, "global_step": 438880, "epoch": 5287} {"train_loss": -26.66608238220215, "global_step": 438881, "epoch": 5287} {"train_loss": -27.099288940429688, "global_step": 438882, "epoch": 5287} {"train_loss": -26.886520385742188, "global_step": 438883, "epoch": 5287} {"train_loss": -26.94854736328125, "global_step": 438884, "epoch": 5287} {"train_loss": -26.91339683532715, "global_step": 438885, "epoch": 5287} {"train_loss": -27.0915470123291, "global_step": 438886, "epoch": 5287} {"train_loss": -26.972936630249023, "global_step": 438887, "epoch": 5287} {"train_loss": -26.92120933532715, "global_step": 438888, "epoch": 5287} {"train_loss": -27.059772491455078, "global_step": 438889, "epoch": 5287} {"train_loss": -26.90302085876465, "global_step": 438890, "epoch": 5287} {"train_loss": -27.00296401977539, "global_step": 438891, "epoch": 5287} {"train_loss": -27.051029205322266, "global_step": 438892, "epoch": 5287} {"train_loss": -27.31443214416504, "global_step": 438893, "epoch": 5287} {"train_loss": -27.24432373046875, "global_step": 438894, "epoch": 5287} {"train_loss": -27.22556495666504, "global_step": 438895, "epoch": 5287} {"train_loss": -27.1215877532959, "global_step": 438896, "epoch": 5287} {"train_loss": -27.353357315063477, "global_step": 438897, "epoch": 5287} {"train_loss": -27.047422409057617, "global_step": 438898, "epoch": 5287} {"train_loss": -26.950475692749023, "global_step": 438899, "epoch": 5287} {"train_loss": -27.120573043823242, "global_step": 438900, "epoch": 5287} {"train_loss": -26.983556747436523, "global_step": 438901, "epoch": 5287} {"train_loss": -26.921606063842773, "global_step": 438902, "epoch": 5287} {"train_loss": -26.772297594920698, "global_step": 438903, "epoch": 5287, "val_loss": 6553685.0} {"train_loss": -25.52364158630371, "global_step": 438904, "epoch": 5288} {"train_loss": -24.778732299804688, "global_step": 438905, "epoch": 5288} {"train_loss": -25.1389217376709, "global_step": 438906, "epoch": 5288} {"train_loss": -25.611469268798828, "global_step": 438907, "epoch": 5288} {"train_loss": -26.2694149017334, "global_step": 438908, "epoch": 5288} {"train_loss": -25.14706802368164, "global_step": 438909, "epoch": 5288} {"train_loss": -26.09797477722168, "global_step": 438910, "epoch": 5288} {"train_loss": -25.695743560791016, "global_step": 438911, "epoch": 5288} {"train_loss": -26.4156551361084, "global_step": 438912, "epoch": 5288} {"train_loss": -25.98093032836914, "global_step": 438913, "epoch": 5288} {"train_loss": -26.046674728393555, "global_step": 438914, "epoch": 5288} {"train_loss": -25.83540153503418, "global_step": 438915, "epoch": 5288} {"train_loss": -26.104679107666016, "global_step": 438916, "epoch": 5288} {"train_loss": -26.131305694580078, "global_step": 438917, "epoch": 5288} {"train_loss": -26.29638671875, "global_step": 438918, "epoch": 5288} {"train_loss": -26.064916610717773, "global_step": 438919, "epoch": 5288} {"train_loss": -26.55156898498535, "global_step": 438920, "epoch": 5288} {"train_loss": -26.5911808013916, "global_step": 438921, "epoch": 5288} {"train_loss": -26.5186710357666, "global_step": 438922, "epoch": 5288} {"train_loss": -26.537769317626953, "global_step": 438923, "epoch": 5288} {"train_loss": -26.335357666015625, "global_step": 438924, "epoch": 5288} {"train_loss": -26.584247589111328, "global_step": 438925, "epoch": 5288} {"train_loss": -26.49664878845215, "global_step": 438926, "epoch": 5288} {"train_loss": -26.43113136291504, "global_step": 438927, "epoch": 5288} {"train_loss": -26.50741958618164, "global_step": 438928, "epoch": 5288} {"train_loss": -26.70670509338379, "global_step": 438929, "epoch": 5288} {"train_loss": -26.94805908203125, "global_step": 438930, "epoch": 5288} {"train_loss": -26.732223510742188, "global_step": 438931, "epoch": 5288} {"train_loss": -26.940231323242188, "global_step": 438932, "epoch": 5288} {"train_loss": -26.776330947875977, "global_step": 438933, "epoch": 5288} {"train_loss": -26.9929256439209, "global_step": 438934, "epoch": 5288} {"train_loss": -26.7041015625, "global_step": 438935, "epoch": 5288} {"train_loss": -26.65753746032715, "global_step": 438936, "epoch": 5288} {"train_loss": -26.70265007019043, "global_step": 438937, "epoch": 5288} {"train_loss": -27.039579391479492, "global_step": 438938, "epoch": 5288} {"train_loss": -26.778356552124023, "global_step": 438939, "epoch": 5288} {"train_loss": -26.662841796875, "global_step": 438940, "epoch": 5288} {"train_loss": -26.786924362182617, "global_step": 438941, "epoch": 5288} {"train_loss": -26.9639892578125, "global_step": 438942, "epoch": 5288} {"train_loss": -26.805830001831055, "global_step": 438943, "epoch": 5288} {"train_loss": -27.157453536987305, "global_step": 438944, "epoch": 5288} {"train_loss": -27.19717788696289, "global_step": 438945, "epoch": 5288} {"train_loss": -26.96921730041504, "global_step": 438946, "epoch": 5288} {"train_loss": -27.336261749267578, "global_step": 438947, "epoch": 5288} {"train_loss": -27.324064254760742, "global_step": 438948, "epoch": 5288} {"train_loss": -27.597532272338867, "global_step": 438949, "epoch": 5288} {"train_loss": -27.00739097595215, "global_step": 438950, "epoch": 5288} {"train_loss": -26.83643913269043, "global_step": 438951, "epoch": 5288} {"train_loss": -26.807891845703125, "global_step": 438952, "epoch": 5288} {"train_loss": -26.814777374267578, "global_step": 438953, "epoch": 5288} {"train_loss": -26.967639923095703, "global_step": 438954, "epoch": 5288} {"train_loss": -26.908096313476562, "global_step": 438955, "epoch": 5288} {"train_loss": -26.632150650024414, "global_step": 438956, "epoch": 5288} {"train_loss": -26.32940673828125, "global_step": 438957, "epoch": 5288} {"train_loss": -26.96158218383789, "global_step": 438958, "epoch": 5288} {"train_loss": -27.3061466217041, "global_step": 438959, "epoch": 5288} {"train_loss": -26.770584106445312, "global_step": 438960, "epoch": 5288} {"train_loss": -26.92371940612793, "global_step": 438961, "epoch": 5288} {"train_loss": -27.06483268737793, "global_step": 438962, "epoch": 5288} {"train_loss": -27.343610763549805, "global_step": 438963, "epoch": 5288} {"train_loss": -27.27850914001465, "global_step": 438964, "epoch": 5288} {"train_loss": -27.18572425842285, "global_step": 438965, "epoch": 5288} {"train_loss": -27.071842193603516, "global_step": 438966, "epoch": 5288} {"train_loss": -26.845563888549805, "global_step": 438967, "epoch": 5288} {"train_loss": -26.89804458618164, "global_step": 438968, "epoch": 5288} {"train_loss": -26.999143600463867, "global_step": 438969, "epoch": 5288} {"train_loss": -27.4412841796875, "global_step": 438970, "epoch": 5288} {"train_loss": -26.781787872314453, "global_step": 438971, "epoch": 5288} {"train_loss": -27.428958892822266, "global_step": 438972, "epoch": 5288} {"train_loss": -27.186376571655273, "global_step": 438973, "epoch": 5288} {"train_loss": -27.21477699279785, "global_step": 438974, "epoch": 5288} {"train_loss": -27.1737060546875, "global_step": 438975, "epoch": 5288} {"train_loss": -27.26813316345215, "global_step": 438976, "epoch": 5288} {"train_loss": -26.66106605529785, "global_step": 438977, "epoch": 5288} {"train_loss": -27.09971046447754, "global_step": 438978, "epoch": 5288} {"train_loss": -26.658288955688477, "global_step": 438979, "epoch": 5288} {"train_loss": -26.7481632232666, "global_step": 438980, "epoch": 5288} {"train_loss": -26.820831298828125, "global_step": 438981, "epoch": 5288} {"train_loss": -27.20746421813965, "global_step": 438982, "epoch": 5288} {"train_loss": -27.21253776550293, "global_step": 438983, "epoch": 5288} {"train_loss": -27.441144943237305, "global_step": 438984, "epoch": 5288} {"train_loss": -27.12094497680664, "global_step": 438985, "epoch": 5288} {"train_loss": -26.709974082119494, "global_step": 438986, "epoch": 5288, "val_loss": 6566587.0} {"train_loss": -25.570987701416016, "global_step": 438987, "epoch": 5289} {"train_loss": -26.447193145751953, "global_step": 438988, "epoch": 5289} {"train_loss": -26.334014892578125, "global_step": 438989, "epoch": 5289} {"train_loss": -26.54900550842285, "global_step": 438990, "epoch": 5289} {"train_loss": -26.26862144470215, "global_step": 438991, "epoch": 5289} {"train_loss": -26.2609806060791, "global_step": 438992, "epoch": 5289} {"train_loss": -26.238056182861328, "global_step": 438993, "epoch": 5289} {"train_loss": -26.59653091430664, "global_step": 438994, "epoch": 5289} {"train_loss": -26.538618087768555, "global_step": 438995, "epoch": 5289} {"train_loss": -26.887470245361328, "global_step": 438996, "epoch": 5289} {"train_loss": -26.672765731811523, "global_step": 438997, "epoch": 5289} {"train_loss": -27.074478149414062, "global_step": 438998, "epoch": 5289} {"train_loss": -26.821630477905273, "global_step": 438999, "epoch": 5289} {"train_loss": -26.656347274780273, "global_step": 439000, "epoch": 5289} {"train_loss": -27.04496192932129, "global_step": 439001, "epoch": 5289} {"train_loss": -26.646392822265625, "global_step": 439002, "epoch": 5289} {"train_loss": -26.68289566040039, "global_step": 439003, "epoch": 5289} {"train_loss": -26.716690063476562, "global_step": 439004, "epoch": 5289} {"train_loss": -26.683881759643555, "global_step": 439005, "epoch": 5289} {"train_loss": -26.91855239868164, "global_step": 439006, "epoch": 5289} {"train_loss": -26.954023361206055, "global_step": 439007, "epoch": 5289} {"train_loss": -26.516742706298828, "global_step": 439008, "epoch": 5289} {"train_loss": -27.096343994140625, "global_step": 439009, "epoch": 5289} {"train_loss": -27.110614776611328, "global_step": 439010, "epoch": 5289} {"train_loss": -26.994726181030273, "global_step": 439011, "epoch": 5289} {"train_loss": -26.88311195373535, "global_step": 439012, "epoch": 5289} {"train_loss": -26.906904220581055, "global_step": 439013, "epoch": 5289} {"train_loss": -26.889404296875, "global_step": 439014, "epoch": 5289} {"train_loss": -26.98569679260254, "global_step": 439015, "epoch": 5289} {"train_loss": -27.074792861938477, "global_step": 439016, "epoch": 5289} {"train_loss": -26.840076446533203, "global_step": 439017, "epoch": 5289} {"train_loss": -26.595930099487305, "global_step": 439018, "epoch": 5289} {"train_loss": -27.027545928955078, "global_step": 439019, "epoch": 5289} {"train_loss": -26.657617568969727, "global_step": 439020, "epoch": 5289} {"train_loss": -26.80901527404785, "global_step": 439021, "epoch": 5289} {"train_loss": -27.10541343688965, "global_step": 439022, "epoch": 5289} {"train_loss": -27.104093551635742, "global_step": 439023, "epoch": 5289} {"train_loss": -26.91788101196289, "global_step": 439024, "epoch": 5289} {"train_loss": -26.85218620300293, "global_step": 439025, "epoch": 5289} {"train_loss": -26.896108627319336, "global_step": 439026, "epoch": 5289} {"train_loss": -27.03921890258789, "global_step": 439027, "epoch": 5289} {"train_loss": -26.970157623291016, "global_step": 439028, "epoch": 5289} {"train_loss": -26.678754806518555, "global_step": 439029, "epoch": 5289} {"train_loss": -26.499710083007812, "global_step": 439030, "epoch": 5289} {"train_loss": -26.994016647338867, "global_step": 439031, "epoch": 5289} {"train_loss": -27.342559814453125, "global_step": 439032, "epoch": 5289} {"train_loss": -27.0533390045166, "global_step": 439033, "epoch": 5289} {"train_loss": -27.39838981628418, "global_step": 439034, "epoch": 5289} {"train_loss": -27.46002197265625, "global_step": 439035, "epoch": 5289} {"train_loss": -27.118741989135742, "global_step": 439036, "epoch": 5289} {"train_loss": -26.845020294189453, "global_step": 439037, "epoch": 5289} {"train_loss": -26.741315841674805, "global_step": 439038, "epoch": 5289} {"train_loss": -26.937040328979492, "global_step": 439039, "epoch": 5289} {"train_loss": -27.444005966186523, "global_step": 439040, "epoch": 5289} {"train_loss": -27.23317527770996, "global_step": 439041, "epoch": 5289} {"train_loss": -26.973346710205078, "global_step": 439042, "epoch": 5289} {"train_loss": -27.140527725219727, "global_step": 439043, "epoch": 5289} {"train_loss": -26.345584869384766, "global_step": 439044, "epoch": 5289} {"train_loss": -26.60357666015625, "global_step": 439045, "epoch": 5289} {"train_loss": -26.871017456054688, "global_step": 439046, "epoch": 5289} {"train_loss": -26.8131103515625, "global_step": 439047, "epoch": 5289} {"train_loss": -26.734357833862305, "global_step": 439048, "epoch": 5289} {"train_loss": -26.721296310424805, "global_step": 439049, "epoch": 5289} {"train_loss": -27.339574813842773, "global_step": 439050, "epoch": 5289} {"train_loss": -26.959028244018555, "global_step": 439051, "epoch": 5289} {"train_loss": -26.609785079956055, "global_step": 439052, "epoch": 5289} {"train_loss": -26.990869522094727, "global_step": 439053, "epoch": 5289} {"train_loss": -26.83880043029785, "global_step": 439054, "epoch": 5289} {"train_loss": -27.227994918823242, "global_step": 439055, "epoch": 5289} {"train_loss": -26.801794052124023, "global_step": 439056, "epoch": 5289} {"train_loss": -26.850040435791016, "global_step": 439057, "epoch": 5289} {"train_loss": -27.2816104888916, "global_step": 439058, "epoch": 5289} {"train_loss": -27.230926513671875, "global_step": 439059, "epoch": 5289} {"train_loss": -27.00593376159668, "global_step": 439060, "epoch": 5289} {"train_loss": -27.329254150390625, "global_step": 439061, "epoch": 5289} {"train_loss": -27.488561630249023, "global_step": 439062, "epoch": 5289} {"train_loss": -27.003570556640625, "global_step": 439063, "epoch": 5289} {"train_loss": -27.29059410095215, "global_step": 439064, "epoch": 5289} {"train_loss": -26.863697052001953, "global_step": 439065, "epoch": 5289} {"train_loss": -26.621862411499023, "global_step": 439066, "epoch": 5289} {"train_loss": -26.71795082092285, "global_step": 439067, "epoch": 5289} {"train_loss": -26.535634994506836, "global_step": 439068, "epoch": 5289} {"train_loss": -26.869940631360894, "global_step": 439069, "epoch": 5289, "val_loss": 6592233.0} {"train_loss": -26.574771881103516, "global_step": 439070, "epoch": 5290} {"train_loss": -25.158811569213867, "global_step": 439071, "epoch": 5290} {"train_loss": -25.25320816040039, "global_step": 439072, "epoch": 5290} {"train_loss": -26.424591064453125, "global_step": 439073, "epoch": 5290} {"train_loss": -25.6547794342041, "global_step": 439074, "epoch": 5290} {"train_loss": -25.947851181030273, "global_step": 439075, "epoch": 5290} {"train_loss": -25.623464584350586, "global_step": 439076, "epoch": 5290} {"train_loss": -26.146467208862305, "global_step": 439077, "epoch": 5290} {"train_loss": -25.196670532226562, "global_step": 439078, "epoch": 5290} {"train_loss": -26.118310928344727, "global_step": 439079, "epoch": 5290} {"train_loss": -25.47161293029785, "global_step": 439080, "epoch": 5290} {"train_loss": -26.156024932861328, "global_step": 439081, "epoch": 5290} {"train_loss": -25.934316635131836, "global_step": 439082, "epoch": 5290} {"train_loss": -25.806909561157227, "global_step": 439083, "epoch": 5290} {"train_loss": -26.461206436157227, "global_step": 439084, "epoch": 5290} {"train_loss": -25.593252182006836, "global_step": 439085, "epoch": 5290} {"train_loss": -26.199689865112305, "global_step": 439086, "epoch": 5290} {"train_loss": -26.294214248657227, "global_step": 439087, "epoch": 5290} {"train_loss": -26.27277946472168, "global_step": 439088, "epoch": 5290} {"train_loss": -26.0904483795166, "global_step": 439089, "epoch": 5290} {"train_loss": -26.413122177124023, "global_step": 439090, "epoch": 5290} {"train_loss": -26.382715225219727, "global_step": 439091, "epoch": 5290} {"train_loss": -25.864429473876953, "global_step": 439092, "epoch": 5290} {"train_loss": -26.47653579711914, "global_step": 439093, "epoch": 5290} {"train_loss": -26.529088973999023, "global_step": 439094, "epoch": 5290} {"train_loss": -26.1355037689209, "global_step": 439095, "epoch": 5290} {"train_loss": -26.238208770751953, "global_step": 439096, "epoch": 5290} {"train_loss": -26.062259674072266, "global_step": 439097, "epoch": 5290} {"train_loss": -26.658252716064453, "global_step": 439098, "epoch": 5290} {"train_loss": -26.620136260986328, "global_step": 439099, "epoch": 5290} {"train_loss": -26.517486572265625, "global_step": 439100, "epoch": 5290} {"train_loss": -26.643564224243164, "global_step": 439101, "epoch": 5290} {"train_loss": -26.605138778686523, "global_step": 439102, "epoch": 5290} {"train_loss": -26.74712562561035, "global_step": 439103, "epoch": 5290} {"train_loss": -27.047510147094727, "global_step": 439104, "epoch": 5290} {"train_loss": -26.571643829345703, "global_step": 439105, "epoch": 5290} {"train_loss": -26.5974178314209, "global_step": 439106, "epoch": 5290} {"train_loss": -26.634662628173828, "global_step": 439107, "epoch": 5290} {"train_loss": -26.68100929260254, "global_step": 439108, "epoch": 5290} {"train_loss": -26.848413467407227, "global_step": 439109, "epoch": 5290} {"train_loss": -27.16678810119629, "global_step": 439110, "epoch": 5290} {"train_loss": -27.070520401000977, "global_step": 439111, "epoch": 5290} {"train_loss": -27.272436141967773, "global_step": 439112, "epoch": 5290} {"train_loss": -26.967615127563477, "global_step": 439113, "epoch": 5290} {"train_loss": -27.072193145751953, "global_step": 439114, "epoch": 5290} {"train_loss": -26.759496688842773, "global_step": 439115, "epoch": 5290} {"train_loss": -26.829145431518555, "global_step": 439116, "epoch": 5290} {"train_loss": -27.051721572875977, "global_step": 439117, "epoch": 5290} {"train_loss": -27.253005981445312, "global_step": 439118, "epoch": 5290} {"train_loss": -27.014612197875977, "global_step": 439119, "epoch": 5290} {"train_loss": -26.884765625, "global_step": 439120, "epoch": 5290} {"train_loss": -26.981470108032227, "global_step": 439121, "epoch": 5290} {"train_loss": -26.97161865234375, "global_step": 439122, "epoch": 5290} {"train_loss": -27.212726593017578, "global_step": 439123, "epoch": 5290} {"train_loss": -27.158084869384766, "global_step": 439124, "epoch": 5290} {"train_loss": -27.206573486328125, "global_step": 439125, "epoch": 5290} {"train_loss": -27.45493507385254, "global_step": 439126, "epoch": 5290} {"train_loss": -27.045318603515625, "global_step": 439127, "epoch": 5290} {"train_loss": -27.4045352935791, "global_step": 439128, "epoch": 5290} {"train_loss": -27.10268211364746, "global_step": 439129, "epoch": 5290} {"train_loss": -27.22871208190918, "global_step": 439130, "epoch": 5290} {"train_loss": -27.131574630737305, "global_step": 439131, "epoch": 5290} {"train_loss": -27.0961971282959, "global_step": 439132, "epoch": 5290} {"train_loss": -26.561559677124023, "global_step": 439133, "epoch": 5290} {"train_loss": -27.278470993041992, "global_step": 439134, "epoch": 5290} {"train_loss": -27.28998374938965, "global_step": 439135, "epoch": 5290} {"train_loss": -26.807586669921875, "global_step": 439136, "epoch": 5290} {"train_loss": -26.82449722290039, "global_step": 439137, "epoch": 5290} {"train_loss": -27.404376983642578, "global_step": 439138, "epoch": 5290} {"train_loss": -27.079986572265625, "global_step": 439139, "epoch": 5290} {"train_loss": -27.21758460998535, "global_step": 439140, "epoch": 5290} {"train_loss": -26.826684951782227, "global_step": 439141, "epoch": 5290} {"train_loss": -26.88102149963379, "global_step": 439142, "epoch": 5290} {"train_loss": -26.46384620666504, "global_step": 439143, "epoch": 5290} {"train_loss": -26.43643569946289, "global_step": 439144, "epoch": 5290} {"train_loss": -27.047277450561523, "global_step": 439145, "epoch": 5290} {"train_loss": -26.926746368408203, "global_step": 439146, "epoch": 5290} {"train_loss": -26.7100772857666, "global_step": 439147, "epoch": 5290} {"train_loss": -26.932449340820312, "global_step": 439148, "epoch": 5290} {"train_loss": -27.172327041625977, "global_step": 439149, "epoch": 5290} {"train_loss": -27.082326889038086, "global_step": 439150, "epoch": 5290} {"train_loss": -26.757410049438477, "global_step": 439151, "epoch": 5290} {"train_loss": -26.619323592588128, "global_step": 439152, "epoch": 5290, "val_loss": 6632759.0} {"train_loss": -26.132543563842773, "global_step": 439153, "epoch": 5291} {"train_loss": -25.29018211364746, "global_step": 439154, "epoch": 5291} {"train_loss": -26.084836959838867, "global_step": 439155, "epoch": 5291} {"train_loss": -25.69532585144043, "global_step": 439156, "epoch": 5291} {"train_loss": -25.876983642578125, "global_step": 439157, "epoch": 5291} {"train_loss": -25.945302963256836, "global_step": 439158, "epoch": 5291} {"train_loss": -26.009057998657227, "global_step": 439159, "epoch": 5291} {"train_loss": -26.295373916625977, "global_step": 439160, "epoch": 5291} {"train_loss": -26.46846580505371, "global_step": 439161, "epoch": 5291} {"train_loss": -26.09930419921875, "global_step": 439162, "epoch": 5291} {"train_loss": -26.263792037963867, "global_step": 439163, "epoch": 5291} {"train_loss": -26.448293685913086, "global_step": 439164, "epoch": 5291} {"train_loss": -26.15055274963379, "global_step": 439165, "epoch": 5291} {"train_loss": -26.30574607849121, "global_step": 439166, "epoch": 5291} {"train_loss": -26.318500518798828, "global_step": 439167, "epoch": 5291} {"train_loss": -26.69974708557129, "global_step": 439168, "epoch": 5291} {"train_loss": -26.12325096130371, "global_step": 439169, "epoch": 5291} {"train_loss": -26.484161376953125, "global_step": 439170, "epoch": 5291} {"train_loss": -26.784320831298828, "global_step": 439171, "epoch": 5291} {"train_loss": -26.995071411132812, "global_step": 439172, "epoch": 5291} {"train_loss": -26.7169189453125, "global_step": 439173, "epoch": 5291} {"train_loss": -26.82036781311035, "global_step": 439174, "epoch": 5291} {"train_loss": -26.735736846923828, "global_step": 439175, "epoch": 5291} {"train_loss": -26.6767578125, "global_step": 439176, "epoch": 5291} {"train_loss": -26.77937889099121, "global_step": 439177, "epoch": 5291} {"train_loss": -26.633520126342773, "global_step": 439178, "epoch": 5291} {"train_loss": -26.506681442260742, "global_step": 439179, "epoch": 5291} {"train_loss": -26.37192153930664, "global_step": 439180, "epoch": 5291} {"train_loss": -26.817962646484375, "global_step": 439181, "epoch": 5291} {"train_loss": -26.890939712524414, "global_step": 439182, "epoch": 5291} {"train_loss": -27.05039405822754, "global_step": 439183, "epoch": 5291} {"train_loss": -26.768911361694336, "global_step": 439184, "epoch": 5291} {"train_loss": -27.048425674438477, "global_step": 439185, "epoch": 5291} {"train_loss": -26.81658935546875, "global_step": 439186, "epoch": 5291} {"train_loss": -27.077655792236328, "global_step": 439187, "epoch": 5291} {"train_loss": -26.61213493347168, "global_step": 439188, "epoch": 5291} {"train_loss": -27.00592613220215, "global_step": 439189, "epoch": 5291} {"train_loss": -27.265869140625, "global_step": 439190, "epoch": 5291} {"train_loss": -26.69856071472168, "global_step": 439191, "epoch": 5291} {"train_loss": -26.969379425048828, "global_step": 439192, "epoch": 5291} {"train_loss": -26.691404342651367, "global_step": 439193, "epoch": 5291} {"train_loss": -27.007490158081055, "global_step": 439194, "epoch": 5291} {"train_loss": -26.876218795776367, "global_step": 439195, "epoch": 5291} {"train_loss": -26.9688777923584, "global_step": 439196, "epoch": 5291} {"train_loss": -27.145938873291016, "global_step": 439197, "epoch": 5291} {"train_loss": -26.7560977935791, "global_step": 439198, "epoch": 5291} {"train_loss": -27.117395401000977, "global_step": 439199, "epoch": 5291} {"train_loss": -26.972248077392578, "global_step": 439200, "epoch": 5291} {"train_loss": -27.29098892211914, "global_step": 439201, "epoch": 5291} {"train_loss": -27.187183380126953, "global_step": 439202, "epoch": 5291} {"train_loss": -26.560937881469727, "global_step": 439203, "epoch": 5291} {"train_loss": -26.736066818237305, "global_step": 439204, "epoch": 5291} {"train_loss": -27.310565948486328, "global_step": 439205, "epoch": 5291} {"train_loss": -26.611194610595703, "global_step": 439206, "epoch": 5291} {"train_loss": -27.17203712463379, "global_step": 439207, "epoch": 5291} {"train_loss": -27.114765167236328, "global_step": 439208, "epoch": 5291} {"train_loss": -27.14741325378418, "global_step": 439209, "epoch": 5291} {"train_loss": -27.17145347595215, "global_step": 439210, "epoch": 5291} {"train_loss": -27.390466690063477, "global_step": 439211, "epoch": 5291} {"train_loss": -27.016925811767578, "global_step": 439212, "epoch": 5291} {"train_loss": -26.978967666625977, "global_step": 439213, "epoch": 5291} {"train_loss": -26.98639488220215, "global_step": 439214, "epoch": 5291} {"train_loss": -26.914335250854492, "global_step": 439215, "epoch": 5291} {"train_loss": -26.90241050720215, "global_step": 439216, "epoch": 5291} {"train_loss": -26.331029891967773, "global_step": 439217, "epoch": 5291} {"train_loss": -27.174116134643555, "global_step": 439218, "epoch": 5291} {"train_loss": -27.086902618408203, "global_step": 439219, "epoch": 5291} {"train_loss": -26.978759765625, "global_step": 439220, "epoch": 5291} {"train_loss": -26.893482208251953, "global_step": 439221, "epoch": 5291} {"train_loss": -26.770788192749023, "global_step": 439222, "epoch": 5291} {"train_loss": -26.563751220703125, "global_step": 439223, "epoch": 5291} {"train_loss": -26.748458862304688, "global_step": 439224, "epoch": 5291} {"train_loss": -26.923276901245117, "global_step": 439225, "epoch": 5291} {"train_loss": -26.85529899597168, "global_step": 439226, "epoch": 5291} {"train_loss": -27.345746994018555, "global_step": 439227, "epoch": 5291} {"train_loss": -26.866682052612305, "global_step": 439228, "epoch": 5291} {"train_loss": -26.631521224975586, "global_step": 439229, "epoch": 5291} {"train_loss": -26.890005111694336, "global_step": 439230, "epoch": 5291} {"train_loss": -27.060815811157227, "global_step": 439231, "epoch": 5291} {"train_loss": -27.138050079345703, "global_step": 439232, "epoch": 5291} {"train_loss": -27.0828800201416, "global_step": 439233, "epoch": 5291} {"train_loss": -27.1629695892334, "global_step": 439234, "epoch": 5291} {"train_loss": -26.752472911972596, "global_step": 439235, "epoch": 5291, "val_loss": 6646121.0} {"train_loss": -26.902944564819336, "global_step": 439236, "epoch": 5292} {"train_loss": -26.80122184753418, "global_step": 439237, "epoch": 5292} {"train_loss": -26.937213897705078, "global_step": 439238, "epoch": 5292} {"train_loss": -26.584762573242188, "global_step": 439239, "epoch": 5292} {"train_loss": -26.77547264099121, "global_step": 439240, "epoch": 5292} {"train_loss": -26.764820098876953, "global_step": 439241, "epoch": 5292} {"train_loss": -27.123899459838867, "global_step": 439242, "epoch": 5292} {"train_loss": -27.055700302124023, "global_step": 439243, "epoch": 5292} {"train_loss": -26.564069747924805, "global_step": 439244, "epoch": 5292} {"train_loss": -26.6850643157959, "global_step": 439245, "epoch": 5292} {"train_loss": -26.657751083374023, "global_step": 439246, "epoch": 5292} {"train_loss": -26.96588706970215, "global_step": 439247, "epoch": 5292} {"train_loss": -26.63233757019043, "global_step": 439248, "epoch": 5292} {"train_loss": -26.543472290039062, "global_step": 439249, "epoch": 5292} {"train_loss": -26.61028480529785, "global_step": 439250, "epoch": 5292} {"train_loss": -27.1267147064209, "global_step": 439251, "epoch": 5292} {"train_loss": -26.413894653320312, "global_step": 439252, "epoch": 5292} {"train_loss": -27.116514205932617, "global_step": 439253, "epoch": 5292} {"train_loss": -27.10993003845215, "global_step": 439254, "epoch": 5292} {"train_loss": -26.809133529663086, "global_step": 439255, "epoch": 5292} {"train_loss": -26.546161651611328, "global_step": 439256, "epoch": 5292} {"train_loss": -27.128416061401367, "global_step": 439257, "epoch": 5292} {"train_loss": -26.741559982299805, "global_step": 439258, "epoch": 5292} {"train_loss": -26.970203399658203, "global_step": 439259, "epoch": 5292} {"train_loss": -26.942901611328125, "global_step": 439260, "epoch": 5292} {"train_loss": -26.769636154174805, "global_step": 439261, "epoch": 5292} {"train_loss": -27.0262451171875, "global_step": 439262, "epoch": 5292} {"train_loss": -26.764501571655273, "global_step": 439263, "epoch": 5292} {"train_loss": -27.005823135375977, "global_step": 439264, "epoch": 5292} {"train_loss": -26.83050537109375, "global_step": 439265, "epoch": 5292} {"train_loss": -26.89100456237793, "global_step": 439266, "epoch": 5292} {"train_loss": -26.914091110229492, "global_step": 439267, "epoch": 5292} {"train_loss": -26.588489532470703, "global_step": 439268, "epoch": 5292} {"train_loss": -26.848438262939453, "global_step": 439269, "epoch": 5292} {"train_loss": -26.784109115600586, "global_step": 439270, "epoch": 5292} {"train_loss": -27.01604652404785, "global_step": 439271, "epoch": 5292} {"train_loss": -26.574420928955078, "global_step": 439272, "epoch": 5292} {"train_loss": -26.78876304626465, "global_step": 439273, "epoch": 5292} {"train_loss": -26.71783447265625, "global_step": 439274, "epoch": 5292} {"train_loss": -27.13909912109375, "global_step": 439275, "epoch": 5292} {"train_loss": -26.692829132080078, "global_step": 439276, "epoch": 5292} {"train_loss": -26.80476188659668, "global_step": 439277, "epoch": 5292} {"train_loss": -27.062091827392578, "global_step": 439278, "epoch": 5292} {"train_loss": -27.0180721282959, "global_step": 439279, "epoch": 5292} {"train_loss": -26.478673934936523, "global_step": 439280, "epoch": 5292} {"train_loss": -26.91663932800293, "global_step": 439281, "epoch": 5292} {"train_loss": -27.201276779174805, "global_step": 439282, "epoch": 5292} {"train_loss": -27.155576705932617, "global_step": 439283, "epoch": 5292} {"train_loss": -27.427845001220703, "global_step": 439284, "epoch": 5292} {"train_loss": -27.134780883789062, "global_step": 439285, "epoch": 5292} {"train_loss": -27.020841598510742, "global_step": 439286, "epoch": 5292} {"train_loss": -27.212223052978516, "global_step": 439287, "epoch": 5292} {"train_loss": -26.779556274414062, "global_step": 439288, "epoch": 5292} {"train_loss": -27.159910202026367, "global_step": 439289, "epoch": 5292} {"train_loss": -27.157602310180664, "global_step": 439290, "epoch": 5292} {"train_loss": -27.23787498474121, "global_step": 439291, "epoch": 5292} {"train_loss": -27.146936416625977, "global_step": 439292, "epoch": 5292} {"train_loss": -27.347736358642578, "global_step": 439293, "epoch": 5292} {"train_loss": -26.6900634765625, "global_step": 439294, "epoch": 5292} {"train_loss": -27.14013671875, "global_step": 439295, "epoch": 5292} {"train_loss": -27.07838249206543, "global_step": 439296, "epoch": 5292} {"train_loss": -26.963531494140625, "global_step": 439297, "epoch": 5292} {"train_loss": -27.09480094909668, "global_step": 439298, "epoch": 5292} {"train_loss": -26.982837677001953, "global_step": 439299, "epoch": 5292} {"train_loss": -27.361255645751953, "global_step": 439300, "epoch": 5292} {"train_loss": -27.031147003173828, "global_step": 439301, "epoch": 5292} {"train_loss": -27.566360473632812, "global_step": 439302, "epoch": 5292} {"train_loss": -27.09861183166504, "global_step": 439303, "epoch": 5292} {"train_loss": -27.027563095092773, "global_step": 439304, "epoch": 5292} {"train_loss": -27.3903751373291, "global_step": 439305, "epoch": 5292} {"train_loss": -26.959386825561523, "global_step": 439306, "epoch": 5292} {"train_loss": -26.937667846679688, "global_step": 439307, "epoch": 5292} {"train_loss": -27.1356258392334, "global_step": 439308, "epoch": 5292} {"train_loss": -27.41530418395996, "global_step": 439309, "epoch": 5292} {"train_loss": -26.96343421936035, "global_step": 439310, "epoch": 5292} {"train_loss": -27.477643966674805, "global_step": 439311, "epoch": 5292} {"train_loss": -26.5081844329834, "global_step": 439312, "epoch": 5292} {"train_loss": -25.76275062561035, "global_step": 439313, "epoch": 5292} {"train_loss": -24.114078521728516, "global_step": 439314, "epoch": 5292} {"train_loss": -22.97967529296875, "global_step": 439315, "epoch": 5292} {"train_loss": -25.314258575439453, "global_step": 439316, "epoch": 5292} {"train_loss": -25.56207847595215, "global_step": 439317, "epoch": 5292} {"train_loss": -26.809742617319866, "global_step": 439318, "epoch": 5292, "val_loss": 6836036.0} {"train_loss": -24.27631950378418, "global_step": 439319, "epoch": 5293} {"train_loss": -24.432920455932617, "global_step": 439320, "epoch": 5293} {"train_loss": -24.138086318969727, "global_step": 439321, "epoch": 5293} {"train_loss": -25.618854522705078, "global_step": 439322, "epoch": 5293} {"train_loss": -24.716001510620117, "global_step": 439323, "epoch": 5293} {"train_loss": -25.409347534179688, "global_step": 439324, "epoch": 5293} {"train_loss": -25.32048988342285, "global_step": 439325, "epoch": 5293} {"train_loss": -25.438955307006836, "global_step": 439326, "epoch": 5293} {"train_loss": -25.67664909362793, "global_step": 439327, "epoch": 5293} {"train_loss": -25.682912826538086, "global_step": 439328, "epoch": 5293} {"train_loss": -25.405588150024414, "global_step": 439329, "epoch": 5293} {"train_loss": -25.514034271240234, "global_step": 439330, "epoch": 5293} {"train_loss": -25.64847755432129, "global_step": 439331, "epoch": 5293} {"train_loss": -25.389907836914062, "global_step": 439332, "epoch": 5293} {"train_loss": -25.99319839477539, "global_step": 439333, "epoch": 5293} {"train_loss": -25.83625602722168, "global_step": 439334, "epoch": 5293} {"train_loss": -25.911090850830078, "global_step": 439335, "epoch": 5293} {"train_loss": -25.983205795288086, "global_step": 439336, "epoch": 5293} {"train_loss": -25.641239166259766, "global_step": 439337, "epoch": 5293} {"train_loss": -25.822057723999023, "global_step": 439338, "epoch": 5293} {"train_loss": -26.260034561157227, "global_step": 439339, "epoch": 5293} {"train_loss": -26.2181453704834, "global_step": 439340, "epoch": 5293} {"train_loss": -26.04743766784668, "global_step": 439341, "epoch": 5293} {"train_loss": -25.917760848999023, "global_step": 439342, "epoch": 5293} {"train_loss": -26.17572021484375, "global_step": 439343, "epoch": 5293} {"train_loss": -26.024215698242188, "global_step": 439344, "epoch": 5293} {"train_loss": -26.372228622436523, "global_step": 439345, "epoch": 5293} {"train_loss": -26.421995162963867, "global_step": 439346, "epoch": 5293} {"train_loss": -26.142364501953125, "global_step": 439347, "epoch": 5293} {"train_loss": -26.504438400268555, "global_step": 439348, "epoch": 5293} {"train_loss": -26.633289337158203, "global_step": 439349, "epoch": 5293} {"train_loss": -26.558237075805664, "global_step": 439350, "epoch": 5293} {"train_loss": -26.8981876373291, "global_step": 439351, "epoch": 5293} {"train_loss": -26.613513946533203, "global_step": 439352, "epoch": 5293} {"train_loss": -26.87015724182129, "global_step": 439353, "epoch": 5293} {"train_loss": -26.779001235961914, "global_step": 439354, "epoch": 5293} {"train_loss": -26.555023193359375, "global_step": 439355, "epoch": 5293} {"train_loss": -26.527652740478516, "global_step": 439356, "epoch": 5293} {"train_loss": -26.486948013305664, "global_step": 439357, "epoch": 5293} {"train_loss": -27.08119010925293, "global_step": 439358, "epoch": 5293} {"train_loss": -27.086252212524414, "global_step": 439359, "epoch": 5293} {"train_loss": -26.395139694213867, "global_step": 439360, "epoch": 5293} {"train_loss": -26.912128448486328, "global_step": 439361, "epoch": 5293} {"train_loss": -27.091394424438477, "global_step": 439362, "epoch": 5293} {"train_loss": -26.994110107421875, "global_step": 439363, "epoch": 5293} {"train_loss": -27.1904296875, "global_step": 439364, "epoch": 5293} {"train_loss": -27.0979061126709, "global_step": 439365, "epoch": 5293} {"train_loss": -26.730010986328125, "global_step": 439366, "epoch": 5293} {"train_loss": -26.54522132873535, "global_step": 439367, "epoch": 5293} {"train_loss": -27.180856704711914, "global_step": 439368, "epoch": 5293} {"train_loss": -27.25623893737793, "global_step": 439369, "epoch": 5293} {"train_loss": -27.077795028686523, "global_step": 439370, "epoch": 5293} {"train_loss": -26.870328903198242, "global_step": 439371, "epoch": 5293} {"train_loss": -26.901493072509766, "global_step": 439372, "epoch": 5293} {"train_loss": -26.7453556060791, "global_step": 439373, "epoch": 5293} {"train_loss": -27.1207218170166, "global_step": 439374, "epoch": 5293} {"train_loss": -27.152603149414062, "global_step": 439375, "epoch": 5293} {"train_loss": -26.975818634033203, "global_step": 439376, "epoch": 5293} {"train_loss": -27.301366806030273, "global_step": 439377, "epoch": 5293} {"train_loss": -26.917861938476562, "global_step": 439378, "epoch": 5293} {"train_loss": -27.08219337463379, "global_step": 439379, "epoch": 5293} {"train_loss": -27.025232315063477, "global_step": 439380, "epoch": 5293} {"train_loss": -26.674909591674805, "global_step": 439381, "epoch": 5293} {"train_loss": -27.1480770111084, "global_step": 439382, "epoch": 5293} {"train_loss": -27.17852210998535, "global_step": 439383, "epoch": 5293} {"train_loss": -27.09730339050293, "global_step": 439384, "epoch": 5293} {"train_loss": -27.361684799194336, "global_step": 439385, "epoch": 5293} {"train_loss": -27.397079467773438, "global_step": 439386, "epoch": 5293} {"train_loss": -27.18105125427246, "global_step": 439387, "epoch": 5293} {"train_loss": -26.902908325195312, "global_step": 439388, "epoch": 5293} {"train_loss": -27.11549186706543, "global_step": 439389, "epoch": 5293} {"train_loss": -27.179828643798828, "global_step": 439390, "epoch": 5293} {"train_loss": -26.95662498474121, "global_step": 439391, "epoch": 5293} {"train_loss": -27.284332275390625, "global_step": 439392, "epoch": 5293} {"train_loss": -27.584394454956055, "global_step": 439393, "epoch": 5293} {"train_loss": -26.78024673461914, "global_step": 439394, "epoch": 5293} {"train_loss": -27.22010612487793, "global_step": 439395, "epoch": 5293} {"train_loss": -27.41265296936035, "global_step": 439396, "epoch": 5293} {"train_loss": -27.517202377319336, "global_step": 439397, "epoch": 5293} {"train_loss": -27.534147262573242, "global_step": 439398, "epoch": 5293} {"train_loss": -27.185199737548828, "global_step": 439399, "epoch": 5293} {"train_loss": -26.817419052124023, "global_step": 439400, "epoch": 5293} {"train_loss": -26.535630099744683, "global_step": 439401, "epoch": 5293, "val_loss": 6540210.0} {"train_loss": -26.110366821289062, "global_step": 439402, "epoch": 5294} {"train_loss": -25.360191345214844, "global_step": 439403, "epoch": 5294} {"train_loss": -25.8984432220459, "global_step": 439404, "epoch": 5294} {"train_loss": -26.42799949645996, "global_step": 439405, "epoch": 5294} {"train_loss": -25.869979858398438, "global_step": 439406, "epoch": 5294} {"train_loss": -25.760122299194336, "global_step": 439407, "epoch": 5294} {"train_loss": -26.765766143798828, "global_step": 439408, "epoch": 5294} {"train_loss": -26.326887130737305, "global_step": 439409, "epoch": 5294} {"train_loss": -26.2925968170166, "global_step": 439410, "epoch": 5294} {"train_loss": -26.527921676635742, "global_step": 439411, "epoch": 5294} {"train_loss": -26.336395263671875, "global_step": 439412, "epoch": 5294} {"train_loss": -26.49013328552246, "global_step": 439413, "epoch": 5294} {"train_loss": -26.7658634185791, "global_step": 439414, "epoch": 5294} {"train_loss": -26.63291358947754, "global_step": 439415, "epoch": 5294} {"train_loss": -26.489526748657227, "global_step": 439416, "epoch": 5294} {"train_loss": -26.97666358947754, "global_step": 439417, "epoch": 5294} {"train_loss": -26.797012329101562, "global_step": 439418, "epoch": 5294} {"train_loss": -26.604333877563477, "global_step": 439419, "epoch": 5294} {"train_loss": -26.52449607849121, "global_step": 439420, "epoch": 5294} {"train_loss": -26.849103927612305, "global_step": 439421, "epoch": 5294} {"train_loss": -26.783313751220703, "global_step": 439422, "epoch": 5294} {"train_loss": -26.62554359436035, "global_step": 439423, "epoch": 5294} {"train_loss": -26.807470321655273, "global_step": 439424, "epoch": 5294} {"train_loss": -26.428632736206055, "global_step": 439425, "epoch": 5294} {"train_loss": -26.53363037109375, "global_step": 439426, "epoch": 5294} {"train_loss": -26.887908935546875, "global_step": 439427, "epoch": 5294} {"train_loss": -26.715545654296875, "global_step": 439428, "epoch": 5294} {"train_loss": -26.327245712280273, "global_step": 439429, "epoch": 5294} {"train_loss": -27.271957397460938, "global_step": 439430, "epoch": 5294} {"train_loss": -26.769168853759766, "global_step": 439431, "epoch": 5294} {"train_loss": -26.440088272094727, "global_step": 439432, "epoch": 5294} {"train_loss": -27.277997970581055, "global_step": 439433, "epoch": 5294} {"train_loss": -26.35194206237793, "global_step": 439434, "epoch": 5294} {"train_loss": -27.077289581298828, "global_step": 439435, "epoch": 5294} {"train_loss": -26.87109375, "global_step": 439436, "epoch": 5294} {"train_loss": -27.15449333190918, "global_step": 439437, "epoch": 5294} {"train_loss": -26.690887451171875, "global_step": 439438, "epoch": 5294} {"train_loss": -26.935108184814453, "global_step": 439439, "epoch": 5294} {"train_loss": -27.136625289916992, "global_step": 439440, "epoch": 5294} {"train_loss": -27.0633487701416, "global_step": 439441, "epoch": 5294} {"train_loss": -27.053186416625977, "global_step": 439442, "epoch": 5294} {"train_loss": -27.3514347076416, "global_step": 439443, "epoch": 5294} {"train_loss": -27.31243896484375, "global_step": 439444, "epoch": 5294} {"train_loss": -26.971776962280273, "global_step": 439445, "epoch": 5294} {"train_loss": -27.47071647644043, "global_step": 439446, "epoch": 5294} {"train_loss": -27.2232608795166, "global_step": 439447, "epoch": 5294} {"train_loss": -26.8084659576416, "global_step": 439448, "epoch": 5294} {"train_loss": -26.947647094726562, "global_step": 439449, "epoch": 5294} {"train_loss": -27.29959487915039, "global_step": 439450, "epoch": 5294} {"train_loss": -26.761783599853516, "global_step": 439451, "epoch": 5294} {"train_loss": -27.396936416625977, "global_step": 439452, "epoch": 5294} {"train_loss": -27.05618667602539, "global_step": 439453, "epoch": 5294} {"train_loss": -26.702802658081055, "global_step": 439454, "epoch": 5294} {"train_loss": -26.964679718017578, "global_step": 439455, "epoch": 5294} {"train_loss": -26.759733200073242, "global_step": 439456, "epoch": 5294} {"train_loss": -26.881885528564453, "global_step": 439457, "epoch": 5294} {"train_loss": -27.041528701782227, "global_step": 439458, "epoch": 5294} {"train_loss": -27.3082332611084, "global_step": 439459, "epoch": 5294} {"train_loss": -27.0721435546875, "global_step": 439460, "epoch": 5294} {"train_loss": -27.0159912109375, "global_step": 439461, "epoch": 5294} {"train_loss": -27.274377822875977, "global_step": 439462, "epoch": 5294} {"train_loss": -27.151639938354492, "global_step": 439463, "epoch": 5294} {"train_loss": -27.332275390625, "global_step": 439464, "epoch": 5294} {"train_loss": -26.856229782104492, "global_step": 439465, "epoch": 5294} {"train_loss": -27.44459342956543, "global_step": 439466, "epoch": 5294} {"train_loss": -26.858123779296875, "global_step": 439467, "epoch": 5294} {"train_loss": -27.06659507751465, "global_step": 439468, "epoch": 5294} {"train_loss": -26.908649444580078, "global_step": 439469, "epoch": 5294} {"train_loss": -27.203073501586914, "global_step": 439470, "epoch": 5294} {"train_loss": -27.075727462768555, "global_step": 439471, "epoch": 5294} {"train_loss": -27.258047103881836, "global_step": 439472, "epoch": 5294} {"train_loss": -27.222803115844727, "global_step": 439473, "epoch": 5294} {"train_loss": -26.994033813476562, "global_step": 439474, "epoch": 5294} {"train_loss": -26.2851619720459, "global_step": 439475, "epoch": 5294} {"train_loss": -26.45667839050293, "global_step": 439476, "epoch": 5294} {"train_loss": -26.947118759155273, "global_step": 439477, "epoch": 5294} {"train_loss": -26.538232803344727, "global_step": 439478, "epoch": 5294} {"train_loss": -26.475605010986328, "global_step": 439479, "epoch": 5294} {"train_loss": -26.63580894470215, "global_step": 439480, "epoch": 5294} {"train_loss": -26.61138343811035, "global_step": 439481, "epoch": 5294} {"train_loss": -26.89473533630371, "global_step": 439482, "epoch": 5294} {"train_loss": -26.83734130859375, "global_step": 439483, "epoch": 5294} {"train_loss": -26.814977806734753, "global_step": 439484, "epoch": 5294, "val_loss": 6660480.0} {"train_loss": -26.095855712890625, "global_step": 439485, "epoch": 5295} {"train_loss": -26.324237823486328, "global_step": 439486, "epoch": 5295} {"train_loss": -26.546056747436523, "global_step": 439487, "epoch": 5295} {"train_loss": -26.348657608032227, "global_step": 439488, "epoch": 5295} {"train_loss": -26.384037017822266, "global_step": 439489, "epoch": 5295} {"train_loss": -26.29707145690918, "global_step": 439490, "epoch": 5295} {"train_loss": -26.63517189025879, "global_step": 439491, "epoch": 5295} {"train_loss": -26.355438232421875, "global_step": 439492, "epoch": 5295} {"train_loss": -26.67047119140625, "global_step": 439493, "epoch": 5295} {"train_loss": -26.5112247467041, "global_step": 439494, "epoch": 5295} {"train_loss": -26.745405197143555, "global_step": 439495, "epoch": 5295} {"train_loss": -27.005842208862305, "global_step": 439496, "epoch": 5295} {"train_loss": -26.8779354095459, "global_step": 439497, "epoch": 5295} {"train_loss": -26.680374145507812, "global_step": 439498, "epoch": 5295} {"train_loss": -26.614994049072266, "global_step": 439499, "epoch": 5295} {"train_loss": -26.77861976623535, "global_step": 439500, "epoch": 5295} {"train_loss": -26.679357528686523, "global_step": 439501, "epoch": 5295} {"train_loss": -27.218154907226562, "global_step": 439502, "epoch": 5295} {"train_loss": -26.734241485595703, "global_step": 439503, "epoch": 5295} {"train_loss": -27.07680320739746, "global_step": 439504, "epoch": 5295} {"train_loss": -26.76507568359375, "global_step": 439505, "epoch": 5295} {"train_loss": -26.529651641845703, "global_step": 439506, "epoch": 5295} {"train_loss": -26.558317184448242, "global_step": 439507, "epoch": 5295} {"train_loss": -26.989683151245117, "global_step": 439508, "epoch": 5295} {"train_loss": -26.9528751373291, "global_step": 439509, "epoch": 5295} {"train_loss": -27.042510986328125, "global_step": 439510, "epoch": 5295} {"train_loss": -26.47771644592285, "global_step": 439511, "epoch": 5295} {"train_loss": -26.94040298461914, "global_step": 439512, "epoch": 5295} {"train_loss": -26.9101505279541, "global_step": 439513, "epoch": 5295} {"train_loss": -27.05523681640625, "global_step": 439514, "epoch": 5295} {"train_loss": -27.06015968322754, "global_step": 439515, "epoch": 5295} {"train_loss": -26.902667999267578, "global_step": 439516, "epoch": 5295} {"train_loss": -27.256940841674805, "global_step": 439517, "epoch": 5295} {"train_loss": -27.035608291625977, "global_step": 439518, "epoch": 5295} {"train_loss": -26.723861694335938, "global_step": 439519, "epoch": 5295} {"train_loss": -27.113378524780273, "global_step": 439520, "epoch": 5295} {"train_loss": -27.131147384643555, "global_step": 439521, "epoch": 5295} {"train_loss": -26.888080596923828, "global_step": 439522, "epoch": 5295} {"train_loss": -26.809452056884766, "global_step": 439523, "epoch": 5295} {"train_loss": -27.155059814453125, "global_step": 439524, "epoch": 5295} {"train_loss": -27.15777587890625, "global_step": 439525, "epoch": 5295} {"train_loss": -27.16791343688965, "global_step": 439526, "epoch": 5295} {"train_loss": -27.2632999420166, "global_step": 439527, "epoch": 5295} {"train_loss": -26.98377799987793, "global_step": 439528, "epoch": 5295} {"train_loss": -26.864774703979492, "global_step": 439529, "epoch": 5295} {"train_loss": -26.97174072265625, "global_step": 439530, "epoch": 5295} {"train_loss": -27.31245231628418, "global_step": 439531, "epoch": 5295} {"train_loss": -27.280502319335938, "global_step": 439532, "epoch": 5295} {"train_loss": -26.901121139526367, "global_step": 439533, "epoch": 5295} {"train_loss": -26.95293617248535, "global_step": 439534, "epoch": 5295} {"train_loss": -27.053674697875977, "global_step": 439535, "epoch": 5295} {"train_loss": -27.268468856811523, "global_step": 439536, "epoch": 5295} {"train_loss": -26.969837188720703, "global_step": 439537, "epoch": 5295} {"train_loss": -26.903223037719727, "global_step": 439538, "epoch": 5295} {"train_loss": -26.643665313720703, "global_step": 439539, "epoch": 5295} {"train_loss": -26.594284057617188, "global_step": 439540, "epoch": 5295} {"train_loss": -26.36669921875, "global_step": 439541, "epoch": 5295} {"train_loss": -27.355182647705078, "global_step": 439542, "epoch": 5295} {"train_loss": -26.4201717376709, "global_step": 439543, "epoch": 5295} {"train_loss": -26.138519287109375, "global_step": 439544, "epoch": 5295} {"train_loss": -26.92194938659668, "global_step": 439545, "epoch": 5295} {"train_loss": -26.796783447265625, "global_step": 439546, "epoch": 5295} {"train_loss": -26.11695671081543, "global_step": 439547, "epoch": 5295} {"train_loss": -26.9127197265625, "global_step": 439548, "epoch": 5295} {"train_loss": -26.470895767211914, "global_step": 439549, "epoch": 5295} {"train_loss": -26.947601318359375, "global_step": 439550, "epoch": 5295} {"train_loss": -26.750593185424805, "global_step": 439551, "epoch": 5295} {"train_loss": -26.895116806030273, "global_step": 439552, "epoch": 5295} {"train_loss": -26.263843536376953, "global_step": 439553, "epoch": 5295} {"train_loss": -27.104589462280273, "global_step": 439554, "epoch": 5295} {"train_loss": -26.6004581451416, "global_step": 439555, "epoch": 5295} {"train_loss": -27.084558486938477, "global_step": 439556, "epoch": 5295} {"train_loss": -26.785816192626953, "global_step": 439557, "epoch": 5295} {"train_loss": -26.813720703125, "global_step": 439558, "epoch": 5295} {"train_loss": -26.7591609954834, "global_step": 439559, "epoch": 5295} {"train_loss": -26.931859970092773, "global_step": 439560, "epoch": 5295} {"train_loss": -26.641260147094727, "global_step": 439561, "epoch": 5295} {"train_loss": -26.793298721313477, "global_step": 439562, "epoch": 5295} {"train_loss": -27.050092697143555, "global_step": 439563, "epoch": 5295} {"train_loss": -27.16474723815918, "global_step": 439564, "epoch": 5295} {"train_loss": -26.48298454284668, "global_step": 439565, "epoch": 5295} {"train_loss": -27.049457550048828, "global_step": 439566, "epoch": 5295} {"train_loss": -26.812429267239857, "global_step": 439567, "epoch": 5295, "val_loss": 6571069.0} {"train_loss": -26.7255859375, "global_step": 439568, "epoch": 5296} {"train_loss": -26.850234985351562, "global_step": 439569, "epoch": 5296} {"train_loss": -26.68523597717285, "global_step": 439570, "epoch": 5296} {"train_loss": -26.601551055908203, "global_step": 439571, "epoch": 5296} {"train_loss": -26.97393226623535, "global_step": 439572, "epoch": 5296} {"train_loss": -26.559066772460938, "global_step": 439573, "epoch": 5296} {"train_loss": -26.647668838500977, "global_step": 439574, "epoch": 5296} {"train_loss": -26.571577072143555, "global_step": 439575, "epoch": 5296} {"train_loss": -26.776819229125977, "global_step": 439576, "epoch": 5296} {"train_loss": -26.97702980041504, "global_step": 439577, "epoch": 5296} {"train_loss": -26.802799224853516, "global_step": 439578, "epoch": 5296} {"train_loss": -26.487009048461914, "global_step": 439579, "epoch": 5296} {"train_loss": -26.61379051208496, "global_step": 439580, "epoch": 5296} {"train_loss": -27.0195369720459, "global_step": 439581, "epoch": 5296} {"train_loss": -26.967126846313477, "global_step": 439582, "epoch": 5296} {"train_loss": -26.97382926940918, "global_step": 439583, "epoch": 5296} {"train_loss": -26.91194725036621, "global_step": 439584, "epoch": 5296} {"train_loss": -26.609149932861328, "global_step": 439585, "epoch": 5296} {"train_loss": -26.35773277282715, "global_step": 439586, "epoch": 5296} {"train_loss": -27.041406631469727, "global_step": 439587, "epoch": 5296} {"train_loss": -26.806249618530273, "global_step": 439588, "epoch": 5296} {"train_loss": -26.703052520751953, "global_step": 439589, "epoch": 5296} {"train_loss": -26.68609046936035, "global_step": 439590, "epoch": 5296} {"train_loss": -26.820825576782227, "global_step": 439591, "epoch": 5296} {"train_loss": -26.7640323638916, "global_step": 439592, "epoch": 5296} {"train_loss": -27.26554298400879, "global_step": 439593, "epoch": 5296} {"train_loss": -26.864267349243164, "global_step": 439594, "epoch": 5296} {"train_loss": -27.191761016845703, "global_step": 439595, "epoch": 5296} {"train_loss": -26.863189697265625, "global_step": 439596, "epoch": 5296} {"train_loss": -27.035058975219727, "global_step": 439597, "epoch": 5296} {"train_loss": -26.912168502807617, "global_step": 439598, "epoch": 5296} {"train_loss": -27.189655303955078, "global_step": 439599, "epoch": 5296} {"train_loss": -27.086044311523438, "global_step": 439600, "epoch": 5296} {"train_loss": -26.907133102416992, "global_step": 439601, "epoch": 5296} {"train_loss": -26.926305770874023, "global_step": 439602, "epoch": 5296} {"train_loss": -25.99604606628418, "global_step": 439603, "epoch": 5296} {"train_loss": -25.270938873291016, "global_step": 439604, "epoch": 5296} {"train_loss": -25.990949630737305, "global_step": 439605, "epoch": 5296} {"train_loss": -26.55689811706543, "global_step": 439606, "epoch": 5296} {"train_loss": -26.204870223999023, "global_step": 439607, "epoch": 5296} {"train_loss": -26.241363525390625, "global_step": 439608, "epoch": 5296} {"train_loss": -26.681730270385742, "global_step": 439609, "epoch": 5296} {"train_loss": -26.343862533569336, "global_step": 439610, "epoch": 5296} {"train_loss": -26.01322364807129, "global_step": 439611, "epoch": 5296} {"train_loss": -26.487518310546875, "global_step": 439612, "epoch": 5296} {"train_loss": -26.460723876953125, "global_step": 439613, "epoch": 5296} {"train_loss": -26.5360164642334, "global_step": 439614, "epoch": 5296} {"train_loss": -26.749393463134766, "global_step": 439615, "epoch": 5296} {"train_loss": -26.75306510925293, "global_step": 439616, "epoch": 5296} {"train_loss": -26.7747802734375, "global_step": 439617, "epoch": 5296} {"train_loss": -27.097442626953125, "global_step": 439618, "epoch": 5296} {"train_loss": -26.503820419311523, "global_step": 439619, "epoch": 5296} {"train_loss": -26.587188720703125, "global_step": 439620, "epoch": 5296} {"train_loss": -26.67575454711914, "global_step": 439621, "epoch": 5296} {"train_loss": -26.634235382080078, "global_step": 439622, "epoch": 5296} {"train_loss": -26.755359649658203, "global_step": 439623, "epoch": 5296} {"train_loss": -27.094165802001953, "global_step": 439624, "epoch": 5296} {"train_loss": -26.917449951171875, "global_step": 439625, "epoch": 5296} {"train_loss": -26.94227409362793, "global_step": 439626, "epoch": 5296} {"train_loss": -26.9454345703125, "global_step": 439627, "epoch": 5296} {"train_loss": -26.517332077026367, "global_step": 439628, "epoch": 5296} {"train_loss": -27.22574806213379, "global_step": 439629, "epoch": 5296} {"train_loss": -26.698028564453125, "global_step": 439630, "epoch": 5296} {"train_loss": -26.745203018188477, "global_step": 439631, "epoch": 5296} {"train_loss": -26.993432998657227, "global_step": 439632, "epoch": 5296} {"train_loss": -27.186569213867188, "global_step": 439633, "epoch": 5296} {"train_loss": -27.32088279724121, "global_step": 439634, "epoch": 5296} {"train_loss": -27.097253799438477, "global_step": 439635, "epoch": 5296} {"train_loss": -27.23309326171875, "global_step": 439636, "epoch": 5296} {"train_loss": -26.701568603515625, "global_step": 439637, "epoch": 5296} {"train_loss": -27.042007446289062, "global_step": 439638, "epoch": 5296} {"train_loss": -26.96942710876465, "global_step": 439639, "epoch": 5296} {"train_loss": -27.009418487548828, "global_step": 439640, "epoch": 5296} {"train_loss": -26.674814224243164, "global_step": 439641, "epoch": 5296} {"train_loss": -27.14277458190918, "global_step": 439642, "epoch": 5296} {"train_loss": -26.76252555847168, "global_step": 439643, "epoch": 5296} {"train_loss": -27.228778839111328, "global_step": 439644, "epoch": 5296} {"train_loss": -27.022619247436523, "global_step": 439645, "epoch": 5296} {"train_loss": -26.87177085876465, "global_step": 439646, "epoch": 5296} {"train_loss": -27.03076171875, "global_step": 439647, "epoch": 5296} {"train_loss": -27.611572265625, "global_step": 439648, "epoch": 5296} {"train_loss": -27.06537437438965, "global_step": 439649, "epoch": 5296} {"train_loss": -26.79426441422428, "global_step": 439650, "epoch": 5296, "val_loss": 6555874.0} {"train_loss": -26.77671241760254, "global_step": 439651, "epoch": 5297} {"train_loss": -25.86297607421875, "global_step": 439652, "epoch": 5297} {"train_loss": -26.415271759033203, "global_step": 439653, "epoch": 5297} {"train_loss": -26.589435577392578, "global_step": 439654, "epoch": 5297} {"train_loss": -26.23716163635254, "global_step": 439655, "epoch": 5297} {"train_loss": -26.24612808227539, "global_step": 439656, "epoch": 5297} {"train_loss": -26.580785751342773, "global_step": 439657, "epoch": 5297} {"train_loss": -26.501056671142578, "global_step": 439658, "epoch": 5297} {"train_loss": -26.890954971313477, "global_step": 439659, "epoch": 5297} {"train_loss": -26.91619873046875, "global_step": 439660, "epoch": 5297} {"train_loss": -26.663909912109375, "global_step": 439661, "epoch": 5297} {"train_loss": -26.985504150390625, "global_step": 439662, "epoch": 5297} {"train_loss": -27.076566696166992, "global_step": 439663, "epoch": 5297} {"train_loss": -26.36646842956543, "global_step": 439664, "epoch": 5297} {"train_loss": -27.138427734375, "global_step": 439665, "epoch": 5297} {"train_loss": -26.447168350219727, "global_step": 439666, "epoch": 5297} {"train_loss": -26.7703857421875, "global_step": 439667, "epoch": 5297} {"train_loss": -26.47723960876465, "global_step": 439668, "epoch": 5297} {"train_loss": -26.845829010009766, "global_step": 439669, "epoch": 5297} {"train_loss": -26.67337989807129, "global_step": 439670, "epoch": 5297} {"train_loss": -26.460302352905273, "global_step": 439671, "epoch": 5297} {"train_loss": -26.98898696899414, "global_step": 439672, "epoch": 5297} {"train_loss": -26.899946212768555, "global_step": 439673, "epoch": 5297} {"train_loss": -26.815082550048828, "global_step": 439674, "epoch": 5297} {"train_loss": -26.74578857421875, "global_step": 439675, "epoch": 5297} {"train_loss": -26.641361236572266, "global_step": 439676, "epoch": 5297} {"train_loss": -27.0416259765625, "global_step": 439677, "epoch": 5297} {"train_loss": -27.0714111328125, "global_step": 439678, "epoch": 5297} {"train_loss": -26.79684829711914, "global_step": 439679, "epoch": 5297} {"train_loss": -27.029769897460938, "global_step": 439680, "epoch": 5297} {"train_loss": -27.056751251220703, "global_step": 439681, "epoch": 5297} {"train_loss": -26.951818466186523, "global_step": 439682, "epoch": 5297} {"train_loss": -26.814401626586914, "global_step": 439683, "epoch": 5297} {"train_loss": -27.358280181884766, "global_step": 439684, "epoch": 5297} {"train_loss": -27.120880126953125, "global_step": 439685, "epoch": 5297} {"train_loss": -27.093219757080078, "global_step": 439686, "epoch": 5297} {"train_loss": -26.971546173095703, "global_step": 439687, "epoch": 5297} {"train_loss": -26.94648551940918, "global_step": 439688, "epoch": 5297} {"train_loss": -26.923828125, "global_step": 439689, "epoch": 5297} {"train_loss": -26.62822914123535, "global_step": 439690, "epoch": 5297} {"train_loss": -26.894193649291992, "global_step": 439691, "epoch": 5297} {"train_loss": -26.847599029541016, "global_step": 439692, "epoch": 5297} {"train_loss": -27.08426856994629, "global_step": 439693, "epoch": 5297} {"train_loss": -26.646575927734375, "global_step": 439694, "epoch": 5297} {"train_loss": -26.49586296081543, "global_step": 439695, "epoch": 5297} {"train_loss": -27.12818717956543, "global_step": 439696, "epoch": 5297} {"train_loss": -26.88081169128418, "global_step": 439697, "epoch": 5297} {"train_loss": -26.804157257080078, "global_step": 439698, "epoch": 5297} {"train_loss": -26.59827995300293, "global_step": 439699, "epoch": 5297} {"train_loss": -26.907926559448242, "global_step": 439700, "epoch": 5297} {"train_loss": -27.07114601135254, "global_step": 439701, "epoch": 5297} {"train_loss": -26.842390060424805, "global_step": 439702, "epoch": 5297} {"train_loss": -27.043676376342773, "global_step": 439703, "epoch": 5297} {"train_loss": -26.85178565979004, "global_step": 439704, "epoch": 5297} {"train_loss": -27.05878257751465, "global_step": 439705, "epoch": 5297} {"train_loss": -26.65121841430664, "global_step": 439706, "epoch": 5297} {"train_loss": -26.595556259155273, "global_step": 439707, "epoch": 5297} {"train_loss": -27.14674186706543, "global_step": 439708, "epoch": 5297} {"train_loss": -26.97353172302246, "global_step": 439709, "epoch": 5297} {"train_loss": -26.641464233398438, "global_step": 439710, "epoch": 5297} {"train_loss": -27.118865966796875, "global_step": 439711, "epoch": 5297} {"train_loss": -26.90349769592285, "global_step": 439712, "epoch": 5297} {"train_loss": -26.980260848999023, "global_step": 439713, "epoch": 5297} {"train_loss": -26.865680694580078, "global_step": 439714, "epoch": 5297} {"train_loss": -27.007471084594727, "global_step": 439715, "epoch": 5297} {"train_loss": -27.1434268951416, "global_step": 439716, "epoch": 5297} {"train_loss": -26.7982177734375, "global_step": 439717, "epoch": 5297} {"train_loss": -26.89910888671875, "global_step": 439718, "epoch": 5297} {"train_loss": -26.66632080078125, "global_step": 439719, "epoch": 5297} {"train_loss": -26.995187759399414, "global_step": 439720, "epoch": 5297} {"train_loss": -26.723285675048828, "global_step": 439721, "epoch": 5297} {"train_loss": -26.899311065673828, "global_step": 439722, "epoch": 5297} {"train_loss": -26.9677734375, "global_step": 439723, "epoch": 5297} {"train_loss": -27.116180419921875, "global_step": 439724, "epoch": 5297} {"train_loss": -27.006010055541992, "global_step": 439725, "epoch": 5297} {"train_loss": -27.147537231445312, "global_step": 439726, "epoch": 5297} {"train_loss": -26.761747360229492, "global_step": 439727, "epoch": 5297} {"train_loss": -27.151533126831055, "global_step": 439728, "epoch": 5297} {"train_loss": -26.99953269958496, "global_step": 439729, "epoch": 5297} {"train_loss": -26.95147705078125, "global_step": 439730, "epoch": 5297} {"train_loss": -26.871353149414062, "global_step": 439731, "epoch": 5297} {"train_loss": -27.066532135009766, "global_step": 439732, "epoch": 5297} {"train_loss": -26.832940664636084, "global_step": 439733, "epoch": 5297, "val_loss": 6593951.0} {"train_loss": -26.913427352905273, "global_step": 439734, "epoch": 5298} {"train_loss": -26.803403854370117, "global_step": 439735, "epoch": 5298} {"train_loss": -26.627450942993164, "global_step": 439736, "epoch": 5298} {"train_loss": -27.152372360229492, "global_step": 439737, "epoch": 5298} {"train_loss": -26.971662521362305, "global_step": 439738, "epoch": 5298} {"train_loss": -27.0666561126709, "global_step": 439739, "epoch": 5298} {"train_loss": -26.739599227905273, "global_step": 439740, "epoch": 5298} {"train_loss": -26.98433494567871, "global_step": 439741, "epoch": 5298} {"train_loss": -26.918310165405273, "global_step": 439742, "epoch": 5298} {"train_loss": -26.849536895751953, "global_step": 439743, "epoch": 5298} {"train_loss": -26.7369441986084, "global_step": 439744, "epoch": 5298} {"train_loss": -26.450525283813477, "global_step": 439745, "epoch": 5298} {"train_loss": -26.720197677612305, "global_step": 439746, "epoch": 5298} {"train_loss": -26.686859130859375, "global_step": 439747, "epoch": 5298} {"train_loss": -26.88199806213379, "global_step": 439748, "epoch": 5298} {"train_loss": -26.631895065307617, "global_step": 439749, "epoch": 5298} {"train_loss": -26.56591796875, "global_step": 439750, "epoch": 5298} {"train_loss": -27.083118438720703, "global_step": 439751, "epoch": 5298} {"train_loss": -26.714984893798828, "global_step": 439752, "epoch": 5298} {"train_loss": -26.702478408813477, "global_step": 439753, "epoch": 5298} {"train_loss": -26.584461212158203, "global_step": 439754, "epoch": 5298} {"train_loss": -26.7374267578125, "global_step": 439755, "epoch": 5298} {"train_loss": -26.995487213134766, "global_step": 439756, "epoch": 5298} {"train_loss": -26.69776725769043, "global_step": 439757, "epoch": 5298} {"train_loss": -27.038837432861328, "global_step": 439758, "epoch": 5298} {"train_loss": -26.770185470581055, "global_step": 439759, "epoch": 5298} {"train_loss": -26.789554595947266, "global_step": 439760, "epoch": 5298} {"train_loss": -26.765213012695312, "global_step": 439761, "epoch": 5298} {"train_loss": -26.94361686706543, "global_step": 439762, "epoch": 5298} {"train_loss": -26.836715698242188, "global_step": 439763, "epoch": 5298} {"train_loss": -26.779584884643555, "global_step": 439764, "epoch": 5298} {"train_loss": -26.832212448120117, "global_step": 439765, "epoch": 5298} {"train_loss": -26.757543563842773, "global_step": 439766, "epoch": 5298} {"train_loss": -26.772138595581055, "global_step": 439767, "epoch": 5298} {"train_loss": -27.00947380065918, "global_step": 439768, "epoch": 5298} {"train_loss": -26.76423454284668, "global_step": 439769, "epoch": 5298} {"train_loss": -26.865798950195312, "global_step": 439770, "epoch": 5298} {"train_loss": -26.794666290283203, "global_step": 439771, "epoch": 5298} {"train_loss": -26.752058029174805, "global_step": 439772, "epoch": 5298} {"train_loss": -26.592975616455078, "global_step": 439773, "epoch": 5298} {"train_loss": -26.986974716186523, "global_step": 439774, "epoch": 5298} {"train_loss": -27.288671493530273, "global_step": 439775, "epoch": 5298} {"train_loss": -26.968494415283203, "global_step": 439776, "epoch": 5298} {"train_loss": -26.960920333862305, "global_step": 439777, "epoch": 5298} {"train_loss": -27.225116729736328, "global_step": 439778, "epoch": 5298} {"train_loss": -27.319171905517578, "global_step": 439779, "epoch": 5298} {"train_loss": -27.19976234436035, "global_step": 439780, "epoch": 5298} {"train_loss": -26.94715690612793, "global_step": 439781, "epoch": 5298} {"train_loss": -27.0416202545166, "global_step": 439782, "epoch": 5298} {"train_loss": -27.21797752380371, "global_step": 439783, "epoch": 5298} {"train_loss": -27.00555992126465, "global_step": 439784, "epoch": 5298} {"train_loss": -27.3846435546875, "global_step": 439785, "epoch": 5298} {"train_loss": -27.162372589111328, "global_step": 439786, "epoch": 5298} {"train_loss": -27.0520076751709, "global_step": 439787, "epoch": 5298} {"train_loss": -26.840829849243164, "global_step": 439788, "epoch": 5298} {"train_loss": -26.870946884155273, "global_step": 439789, "epoch": 5298} {"train_loss": -26.869001388549805, "global_step": 439790, "epoch": 5298} {"train_loss": -27.06624412536621, "global_step": 439791, "epoch": 5298} {"train_loss": -27.27227210998535, "global_step": 439792, "epoch": 5298} {"train_loss": -26.82675552368164, "global_step": 439793, "epoch": 5298} {"train_loss": -27.198575973510742, "global_step": 439794, "epoch": 5298} {"train_loss": -26.977609634399414, "global_step": 439795, "epoch": 5298} {"train_loss": -26.976057052612305, "global_step": 439796, "epoch": 5298} {"train_loss": -26.372472763061523, "global_step": 439797, "epoch": 5298} {"train_loss": -25.795934677124023, "global_step": 439798, "epoch": 5298} {"train_loss": -26.242273330688477, "global_step": 439799, "epoch": 5298} {"train_loss": -27.034839630126953, "global_step": 439800, "epoch": 5298} {"train_loss": -27.09214210510254, "global_step": 439801, "epoch": 5298} {"train_loss": -26.72786521911621, "global_step": 439802, "epoch": 5298} {"train_loss": -26.602909088134766, "global_step": 439803, "epoch": 5298} {"train_loss": -26.482471466064453, "global_step": 439804, "epoch": 5298} {"train_loss": -26.612207412719727, "global_step": 439805, "epoch": 5298} {"train_loss": -26.959680557250977, "global_step": 439806, "epoch": 5298} {"train_loss": -26.6791934967041, "global_step": 439807, "epoch": 5298} {"train_loss": -27.016342163085938, "global_step": 439808, "epoch": 5298} {"train_loss": -27.12166404724121, "global_step": 439809, "epoch": 5298} {"train_loss": -26.744176864624023, "global_step": 439810, "epoch": 5298} {"train_loss": -26.59256935119629, "global_step": 439811, "epoch": 5298} {"train_loss": -26.691486358642578, "global_step": 439812, "epoch": 5298} {"train_loss": -26.586872100830078, "global_step": 439813, "epoch": 5298} {"train_loss": -26.966333389282227, "global_step": 439814, "epoch": 5298} {"train_loss": -26.39267349243164, "global_step": 439815, "epoch": 5298} {"train_loss": -26.866715052041663, "global_step": 439816, "epoch": 5298, "val_loss": 6653049.0} {"train_loss": -26.75685691833496, "global_step": 439817, "epoch": 5299} {"train_loss": -26.48634147644043, "global_step": 439818, "epoch": 5299} {"train_loss": -26.45284080505371, "global_step": 439819, "epoch": 5299} {"train_loss": -26.211538314819336, "global_step": 439820, "epoch": 5299} {"train_loss": -26.363758087158203, "global_step": 439821, "epoch": 5299} {"train_loss": -26.801950454711914, "global_step": 439822, "epoch": 5299} {"train_loss": -26.81831169128418, "global_step": 439823, "epoch": 5299} {"train_loss": -26.87666893005371, "global_step": 439824, "epoch": 5299} {"train_loss": -26.54829216003418, "global_step": 439825, "epoch": 5299} {"train_loss": -27.05451774597168, "global_step": 439826, "epoch": 5299} {"train_loss": -26.952289581298828, "global_step": 439827, "epoch": 5299} {"train_loss": -26.459081649780273, "global_step": 439828, "epoch": 5299} {"train_loss": -27.055631637573242, "global_step": 439829, "epoch": 5299} {"train_loss": -26.648080825805664, "global_step": 439830, "epoch": 5299} {"train_loss": -27.201904296875, "global_step": 439831, "epoch": 5299} {"train_loss": -27.00149917602539, "global_step": 439832, "epoch": 5299} {"train_loss": -26.35516357421875, "global_step": 439833, "epoch": 5299} {"train_loss": -26.7313175201416, "global_step": 439834, "epoch": 5299} {"train_loss": -26.89337158203125, "global_step": 439835, "epoch": 5299} {"train_loss": -27.066877365112305, "global_step": 439836, "epoch": 5299} {"train_loss": -26.978967666625977, "global_step": 439837, "epoch": 5299} {"train_loss": -26.700708389282227, "global_step": 439838, "epoch": 5299} {"train_loss": -27.0386962890625, "global_step": 439839, "epoch": 5299} {"train_loss": -27.2142276763916, "global_step": 439840, "epoch": 5299} {"train_loss": -27.470869064331055, "global_step": 439841, "epoch": 5299} {"train_loss": -26.992294311523438, "global_step": 439842, "epoch": 5299} {"train_loss": -27.172473907470703, "global_step": 439843, "epoch": 5299} {"train_loss": -27.037918090820312, "global_step": 439844, "epoch": 5299} {"train_loss": -27.09787940979004, "global_step": 439845, "epoch": 5299} {"train_loss": -27.127429962158203, "global_step": 439846, "epoch": 5299} {"train_loss": -26.928125381469727, "global_step": 439847, "epoch": 5299} {"train_loss": -27.171125411987305, "global_step": 439848, "epoch": 5299} {"train_loss": -26.88117790222168, "global_step": 439849, "epoch": 5299} {"train_loss": -27.08365821838379, "global_step": 439850, "epoch": 5299} {"train_loss": -27.0336971282959, "global_step": 439851, "epoch": 5299} {"train_loss": -26.994516372680664, "global_step": 439852, "epoch": 5299} {"train_loss": -27.095996856689453, "global_step": 439853, "epoch": 5299} {"train_loss": -27.206268310546875, "global_step": 439854, "epoch": 5299} {"train_loss": -26.74494743347168, "global_step": 439855, "epoch": 5299} {"train_loss": -26.882659912109375, "global_step": 439856, "epoch": 5299} {"train_loss": -27.13852310180664, "global_step": 439857, "epoch": 5299} {"train_loss": -27.024372100830078, "global_step": 439858, "epoch": 5299} {"train_loss": -27.247724533081055, "global_step": 439859, "epoch": 5299} {"train_loss": -27.188995361328125, "global_step": 439860, "epoch": 5299} {"train_loss": -26.732267379760742, "global_step": 439861, "epoch": 5299} {"train_loss": -26.66465187072754, "global_step": 439862, "epoch": 5299} {"train_loss": -26.639270782470703, "global_step": 439863, "epoch": 5299} {"train_loss": -26.871021270751953, "global_step": 439864, "epoch": 5299} {"train_loss": -26.89430046081543, "global_step": 439865, "epoch": 5299} {"train_loss": -26.794574737548828, "global_step": 439866, "epoch": 5299} {"train_loss": -26.922605514526367, "global_step": 439867, "epoch": 5299} {"train_loss": -26.458251953125, "global_step": 439868, "epoch": 5299} {"train_loss": -26.6375789642334, "global_step": 439869, "epoch": 5299} {"train_loss": -27.063138961791992, "global_step": 439870, "epoch": 5299} {"train_loss": -27.05695152282715, "global_step": 439871, "epoch": 5299} {"train_loss": -26.685749053955078, "global_step": 439872, "epoch": 5299} {"train_loss": -26.59193992614746, "global_step": 439873, "epoch": 5299} {"train_loss": -26.565778732299805, "global_step": 439874, "epoch": 5299} {"train_loss": -26.53232192993164, "global_step": 439875, "epoch": 5299} {"train_loss": -26.714847564697266, "global_step": 439876, "epoch": 5299} {"train_loss": -26.613489151000977, "global_step": 439877, "epoch": 5299} {"train_loss": -26.86292839050293, "global_step": 439878, "epoch": 5299} {"train_loss": -26.69562339782715, "global_step": 439879, "epoch": 5299} {"train_loss": -26.96087646484375, "global_step": 439880, "epoch": 5299} {"train_loss": -27.035444259643555, "global_step": 439881, "epoch": 5299} {"train_loss": -26.93317985534668, "global_step": 439882, "epoch": 5299} {"train_loss": -26.544782638549805, "global_step": 439883, "epoch": 5299} {"train_loss": -27.15799903869629, "global_step": 439884, "epoch": 5299} {"train_loss": -26.963109970092773, "global_step": 439885, "epoch": 5299} {"train_loss": -27.187360763549805, "global_step": 439886, "epoch": 5299} {"train_loss": -27.068323135375977, "global_step": 439887, "epoch": 5299} {"train_loss": -26.889554977416992, "global_step": 439888, "epoch": 5299} {"train_loss": -26.827198028564453, "global_step": 439889, "epoch": 5299} {"train_loss": -27.28692626953125, "global_step": 439890, "epoch": 5299} {"train_loss": -26.99073600769043, "global_step": 439891, "epoch": 5299} {"train_loss": -26.92597770690918, "global_step": 439892, "epoch": 5299} {"train_loss": -26.586688995361328, "global_step": 439893, "epoch": 5299} {"train_loss": -27.02959632873535, "global_step": 439894, "epoch": 5299} {"train_loss": -27.03779411315918, "global_step": 439895, "epoch": 5299} {"train_loss": -27.108081817626953, "global_step": 439896, "epoch": 5299} {"train_loss": -27.16668128967285, "global_step": 439897, "epoch": 5299} {"train_loss": -26.991491317749023, "global_step": 439898, "epoch": 5299} {"train_loss": -26.882972648344843, "global_step": 439899, "epoch": 5299, "val_loss": 6527821.5} {"train_loss": -27.01779556274414, "global_step": 439900, "epoch": 5300} {"train_loss": -26.849624633789062, "global_step": 439901, "epoch": 5300} {"train_loss": -26.627668380737305, "global_step": 439902, "epoch": 5300} {"train_loss": -26.7139835357666, "global_step": 439903, "epoch": 5300} {"train_loss": -26.5920352935791, "global_step": 439904, "epoch": 5300} {"train_loss": -26.755538940429688, "global_step": 439905, "epoch": 5300} {"train_loss": -27.108673095703125, "global_step": 439906, "epoch": 5300} {"train_loss": -26.781095504760742, "global_step": 439907, "epoch": 5300} {"train_loss": -26.742528915405273, "global_step": 439908, "epoch": 5300} {"train_loss": -27.056598663330078, "global_step": 439909, "epoch": 5300} {"train_loss": -26.6879940032959, "global_step": 439910, "epoch": 5300} {"train_loss": -26.67610740661621, "global_step": 439911, "epoch": 5300} {"train_loss": -26.68109703063965, "global_step": 439912, "epoch": 5300} {"train_loss": -26.91745948791504, "global_step": 439913, "epoch": 5300} {"train_loss": -26.96363639831543, "global_step": 439914, "epoch": 5300} {"train_loss": -26.946455001831055, "global_step": 439915, "epoch": 5300} {"train_loss": -27.06727409362793, "global_step": 439916, "epoch": 5300} {"train_loss": -26.970945358276367, "global_step": 439917, "epoch": 5300} {"train_loss": -27.018157958984375, "global_step": 439918, "epoch": 5300} {"train_loss": -27.135766983032227, "global_step": 439919, "epoch": 5300} {"train_loss": -27.04656410217285, "global_step": 439920, "epoch": 5300} {"train_loss": -26.936405181884766, "global_step": 439921, "epoch": 5300} {"train_loss": -26.58296012878418, "global_step": 439922, "epoch": 5300} {"train_loss": -26.878482818603516, "global_step": 439923, "epoch": 5300} {"train_loss": -26.7430362701416, "global_step": 439924, "epoch": 5300} {"train_loss": -26.720829010009766, "global_step": 439925, "epoch": 5300} {"train_loss": -26.762252807617188, "global_step": 439926, "epoch": 5300} {"train_loss": -27.16082763671875, "global_step": 439927, "epoch": 5300} {"train_loss": -27.244537353515625, "global_step": 439928, "epoch": 5300} {"train_loss": -27.113061904907227, "global_step": 439929, "epoch": 5300} {"train_loss": -27.235397338867188, "global_step": 439930, "epoch": 5300} {"train_loss": -27.0865421295166, "global_step": 439931, "epoch": 5300} {"train_loss": -27.029260635375977, "global_step": 439932, "epoch": 5300} {"train_loss": -26.58072280883789, "global_step": 439933, "epoch": 5300} {"train_loss": -26.653284072875977, "global_step": 439934, "epoch": 5300} {"train_loss": -27.12269401550293, "global_step": 439935, "epoch": 5300} {"train_loss": -27.241958618164062, "global_step": 439936, "epoch": 5300} {"train_loss": -26.922468185424805, "global_step": 439937, "epoch": 5300} {"train_loss": -26.721195220947266, "global_step": 439938, "epoch": 5300} {"train_loss": -26.71381950378418, "global_step": 439939, "epoch": 5300} {"train_loss": -26.487028121948242, "global_step": 439940, "epoch": 5300} {"train_loss": -26.733640670776367, "global_step": 439941, "epoch": 5300} {"train_loss": -26.998056411743164, "global_step": 439942, "epoch": 5300} {"train_loss": -27.104135513305664, "global_step": 439943, "epoch": 5300} {"train_loss": -27.17982292175293, "global_step": 439944, "epoch": 5300} {"train_loss": -26.954328536987305, "global_step": 439945, "epoch": 5300} {"train_loss": -26.62068748474121, "global_step": 439946, "epoch": 5300} {"train_loss": -26.6694278717041, "global_step": 439947, "epoch": 5300} {"train_loss": -26.60101318359375, "global_step": 439948, "epoch": 5300} {"train_loss": -26.880552291870117, "global_step": 439949, "epoch": 5300} {"train_loss": -27.03263282775879, "global_step": 439950, "epoch": 5300} {"train_loss": -26.637969970703125, "global_step": 439951, "epoch": 5300} {"train_loss": -26.707387924194336, "global_step": 439952, "epoch": 5300} {"train_loss": -27.1846981048584, "global_step": 439953, "epoch": 5300} {"train_loss": -26.6258544921875, "global_step": 439954, "epoch": 5300} {"train_loss": -26.344568252563477, "global_step": 439955, "epoch": 5300} {"train_loss": -26.487234115600586, "global_step": 439956, "epoch": 5300} {"train_loss": -26.817218780517578, "global_step": 439957, "epoch": 5300} {"train_loss": -26.555845260620117, "global_step": 439958, "epoch": 5300} {"train_loss": -26.681293487548828, "global_step": 439959, "epoch": 5300} {"train_loss": -26.832019805908203, "global_step": 439960, "epoch": 5300} {"train_loss": -26.768686294555664, "global_step": 439961, "epoch": 5300} {"train_loss": -26.951932907104492, "global_step": 439962, "epoch": 5300} {"train_loss": -27.322980880737305, "global_step": 439963, "epoch": 5300} {"train_loss": -27.519987106323242, "global_step": 439964, "epoch": 5300} {"train_loss": -26.895605087280273, "global_step": 439965, "epoch": 5300} {"train_loss": -27.131460189819336, "global_step": 439966, "epoch": 5300} {"train_loss": -26.653364181518555, "global_step": 439967, "epoch": 5300} {"train_loss": -27.122793197631836, "global_step": 439968, "epoch": 5300} {"train_loss": -27.306598663330078, "global_step": 439969, "epoch": 5300} {"train_loss": -26.680822372436523, "global_step": 439970, "epoch": 5300} {"train_loss": -27.355772018432617, "global_step": 439971, "epoch": 5300} {"train_loss": -27.220428466796875, "global_step": 439972, "epoch": 5300} {"train_loss": -26.967716217041016, "global_step": 439973, "epoch": 5300} {"train_loss": -26.89011001586914, "global_step": 439974, "epoch": 5300} {"train_loss": -27.23300552368164, "global_step": 439975, "epoch": 5300} {"train_loss": -27.030384063720703, "global_step": 439976, "epoch": 5300} {"train_loss": -27.030332565307617, "global_step": 439977, "epoch": 5300} {"train_loss": -27.21036720275879, "global_step": 439978, "epoch": 5300} {"train_loss": -27.138696670532227, "global_step": 439979, "epoch": 5300} {"train_loss": -27.365955352783203, "global_step": 439980, "epoch": 5300} {"train_loss": -27.476755142211914, "global_step": 439981, "epoch": 5300} {"train_loss": -26.92512477736875, "global_step": 439982, "epoch": 5300, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9090909090909091, "val_loss": 6639391.5} {"train_loss": -26.573028564453125, "global_step": 439983, "epoch": 5301} {"train_loss": -26.799535751342773, "global_step": 439984, "epoch": 5301} {"train_loss": -26.586267471313477, "global_step": 439985, "epoch": 5301} {"train_loss": -26.318044662475586, "global_step": 439986, "epoch": 5301} {"train_loss": -26.6751708984375, "global_step": 439987, "epoch": 5301} {"train_loss": -26.568527221679688, "global_step": 439988, "epoch": 5301} {"train_loss": -26.744155883789062, "global_step": 439989, "epoch": 5301} {"train_loss": -26.97258949279785, "global_step": 439990, "epoch": 5301} {"train_loss": -26.850662231445312, "global_step": 439991, "epoch": 5301} {"train_loss": -26.803924560546875, "global_step": 439992, "epoch": 5301} {"train_loss": -26.74382972717285, "global_step": 439993, "epoch": 5301} {"train_loss": -26.827560424804688, "global_step": 439994, "epoch": 5301} {"train_loss": -26.650686264038086, "global_step": 439995, "epoch": 5301} {"train_loss": -27.131759643554688, "global_step": 439996, "epoch": 5301} {"train_loss": -26.72706413269043, "global_step": 439997, "epoch": 5301} {"train_loss": -26.708051681518555, "global_step": 439998, "epoch": 5301} {"train_loss": -27.275365829467773, "global_step": 439999, "epoch": 5301} {"train_loss": -26.97991371154785, "global_step": 440000, "epoch": 5301} {"train_loss": -26.753576278686523, "global_step": 440001, "epoch": 5301} {"train_loss": -26.95290184020996, "global_step": 440002, "epoch": 5301} {"train_loss": -26.554723739624023, "global_step": 440003, "epoch": 5301} {"train_loss": -27.0677433013916, "global_step": 440004, "epoch": 5301} {"train_loss": -26.96760368347168, "global_step": 440005, "epoch": 5301} {"train_loss": -27.078693389892578, "global_step": 440006, "epoch": 5301} {"train_loss": -26.98221206665039, "global_step": 440007, "epoch": 5301} {"train_loss": -26.834884643554688, "global_step": 440008, "epoch": 5301} {"train_loss": -26.7507381439209, "global_step": 440009, "epoch": 5301} {"train_loss": -26.70344352722168, "global_step": 440010, "epoch": 5301} {"train_loss": -27.005176544189453, "global_step": 440011, "epoch": 5301} {"train_loss": -27.234094619750977, "global_step": 440012, "epoch": 5301} {"train_loss": -26.848773956298828, "global_step": 440013, "epoch": 5301} {"train_loss": -26.60186195373535, "global_step": 440014, "epoch": 5301} {"train_loss": -27.319990158081055, "global_step": 440015, "epoch": 5301} {"train_loss": -27.070249557495117, "global_step": 440016, "epoch": 5301} {"train_loss": -26.80689811706543, "global_step": 440017, "epoch": 5301} {"train_loss": -26.627567291259766, "global_step": 440018, "epoch": 5301} {"train_loss": -27.11566734313965, "global_step": 440019, "epoch": 5301} {"train_loss": -27.108081817626953, "global_step": 440020, "epoch": 5301} {"train_loss": -27.1102352142334, "global_step": 440021, "epoch": 5301} {"train_loss": -26.81097412109375, "global_step": 440022, "epoch": 5301} {"train_loss": -26.891645431518555, "global_step": 440023, "epoch": 5301} {"train_loss": -26.976215362548828, "global_step": 440024, "epoch": 5301} {"train_loss": -26.52847671508789, "global_step": 440025, "epoch": 5301} {"train_loss": -26.632429122924805, "global_step": 440026, "epoch": 5301} {"train_loss": -26.74032974243164, "global_step": 440027, "epoch": 5301} {"train_loss": -27.079269409179688, "global_step": 440028, "epoch": 5301} {"train_loss": -27.283044815063477, "global_step": 440029, "epoch": 5301} {"train_loss": -26.966999053955078, "global_step": 440030, "epoch": 5301} {"train_loss": -26.85321617126465, "global_step": 440031, "epoch": 5301} {"train_loss": -27.502233505249023, "global_step": 440032, "epoch": 5301} {"train_loss": -27.217864990234375, "global_step": 440033, "epoch": 5301} {"train_loss": -26.817657470703125, "global_step": 440034, "epoch": 5301} {"train_loss": -26.970544815063477, "global_step": 440035, "epoch": 5301} {"train_loss": -27.186542510986328, "global_step": 440036, "epoch": 5301} {"train_loss": -27.072019577026367, "global_step": 440037, "epoch": 5301} {"train_loss": -26.862781524658203, "global_step": 440038, "epoch": 5301} {"train_loss": -26.78494644165039, "global_step": 440039, "epoch": 5301} {"train_loss": -26.554800033569336, "global_step": 440040, "epoch": 5301} {"train_loss": -26.085805892944336, "global_step": 440041, "epoch": 5301} {"train_loss": -26.909515380859375, "global_step": 440042, "epoch": 5301} {"train_loss": -27.284452438354492, "global_step": 440043, "epoch": 5301} {"train_loss": -26.974470138549805, "global_step": 440044, "epoch": 5301} {"train_loss": -26.731525421142578, "global_step": 440045, "epoch": 5301} {"train_loss": -26.631183624267578, "global_step": 440046, "epoch": 5301} {"train_loss": -26.533315658569336, "global_step": 440047, "epoch": 5301} {"train_loss": -26.778411865234375, "global_step": 440048, "epoch": 5301} {"train_loss": -26.98557472229004, "global_step": 440049, "epoch": 5301} {"train_loss": -26.553552627563477, "global_step": 440050, "epoch": 5301} {"train_loss": -26.965253829956055, "global_step": 440051, "epoch": 5301} {"train_loss": -26.961557388305664, "global_step": 440052, "epoch": 5301} {"train_loss": -26.699848175048828, "global_step": 440053, "epoch": 5301} {"train_loss": -26.986127853393555, "global_step": 440054, "epoch": 5301} {"train_loss": -26.773681640625, "global_step": 440055, "epoch": 5301} {"train_loss": -26.78205680847168, "global_step": 440056, "epoch": 5301} {"train_loss": -27.068527221679688, "global_step": 440057, "epoch": 5301} {"train_loss": -26.985157012939453, "global_step": 440058, "epoch": 5301} {"train_loss": -27.33076286315918, "global_step": 440059, "epoch": 5301} {"train_loss": -27.11541748046875, "global_step": 440060, "epoch": 5301} {"train_loss": -26.6903076171875, "global_step": 440061, "epoch": 5301} {"train_loss": -27.164941787719727, "global_step": 440062, "epoch": 5301} {"train_loss": -27.099828720092773, "global_step": 440063, "epoch": 5301} {"train_loss": -26.87906837463379, "global_step": 440064, "epoch": 5301} {"train_loss": -26.888772435935145, "global_step": 440065, "epoch": 5301, "val_loss": 6665250.0} {"train_loss": -26.198118209838867, "global_step": 440066, "epoch": 5302} {"train_loss": -26.218936920166016, "global_step": 440067, "epoch": 5302} {"train_loss": -26.095746994018555, "global_step": 440068, "epoch": 5302} {"train_loss": -26.092248916625977, "global_step": 440069, "epoch": 5302} {"train_loss": -26.485462188720703, "global_step": 440070, "epoch": 5302} {"train_loss": -25.87470817565918, "global_step": 440071, "epoch": 5302} {"train_loss": -26.27583122253418, "global_step": 440072, "epoch": 5302} {"train_loss": -26.16639518737793, "global_step": 440073, "epoch": 5302} {"train_loss": -26.391138076782227, "global_step": 440074, "epoch": 5302} {"train_loss": -26.318899154663086, "global_step": 440075, "epoch": 5302} {"train_loss": -26.78346061706543, "global_step": 440076, "epoch": 5302} {"train_loss": -26.562585830688477, "global_step": 440077, "epoch": 5302} {"train_loss": -26.739643096923828, "global_step": 440078, "epoch": 5302} {"train_loss": -26.483922958374023, "global_step": 440079, "epoch": 5302} {"train_loss": -26.381772994995117, "global_step": 440080, "epoch": 5302} {"train_loss": -26.7882080078125, "global_step": 440081, "epoch": 5302} {"train_loss": -26.674957275390625, "global_step": 440082, "epoch": 5302} {"train_loss": -26.428924560546875, "global_step": 440083, "epoch": 5302} {"train_loss": -26.893407821655273, "global_step": 440084, "epoch": 5302} {"train_loss": -26.45270347595215, "global_step": 440085, "epoch": 5302} {"train_loss": -26.818578720092773, "global_step": 440086, "epoch": 5302} {"train_loss": -26.661396026611328, "global_step": 440087, "epoch": 5302} {"train_loss": -26.81939125061035, "global_step": 440088, "epoch": 5302} {"train_loss": -26.689435958862305, "global_step": 440089, "epoch": 5302} {"train_loss": -26.67359733581543, "global_step": 440090, "epoch": 5302} {"train_loss": -26.850873947143555, "global_step": 440091, "epoch": 5302} {"train_loss": -26.7976016998291, "global_step": 440092, "epoch": 5302} {"train_loss": -27.0594539642334, "global_step": 440093, "epoch": 5302} {"train_loss": -26.910099029541016, "global_step": 440094, "epoch": 5302} {"train_loss": -27.240131378173828, "global_step": 440095, "epoch": 5302} {"train_loss": -26.47669792175293, "global_step": 440096, "epoch": 5302} {"train_loss": -26.788644790649414, "global_step": 440097, "epoch": 5302} {"train_loss": -26.72419548034668, "global_step": 440098, "epoch": 5302} {"train_loss": -27.064289093017578, "global_step": 440099, "epoch": 5302} {"train_loss": -27.138090133666992, "global_step": 440100, "epoch": 5302} {"train_loss": -26.84674644470215, "global_step": 440101, "epoch": 5302} {"train_loss": -26.880842208862305, "global_step": 440102, "epoch": 5302} {"train_loss": -27.133121490478516, "global_step": 440103, "epoch": 5302} {"train_loss": -26.5380916595459, "global_step": 440104, "epoch": 5302} {"train_loss": -27.180463790893555, "global_step": 440105, "epoch": 5302} {"train_loss": -27.22273063659668, "global_step": 440106, "epoch": 5302} {"train_loss": -27.004749298095703, "global_step": 440107, "epoch": 5302} {"train_loss": -27.25908851623535, "global_step": 440108, "epoch": 5302} {"train_loss": -26.93194580078125, "global_step": 440109, "epoch": 5302} {"train_loss": -26.70195960998535, "global_step": 440110, "epoch": 5302} {"train_loss": -27.401479721069336, "global_step": 440111, "epoch": 5302} {"train_loss": -27.271154403686523, "global_step": 440112, "epoch": 5302} {"train_loss": -27.2273006439209, "global_step": 440113, "epoch": 5302} {"train_loss": -26.8000545501709, "global_step": 440114, "epoch": 5302} {"train_loss": -27.105947494506836, "global_step": 440115, "epoch": 5302} {"train_loss": -27.025074005126953, "global_step": 440116, "epoch": 5302} {"train_loss": -27.0441837310791, "global_step": 440117, "epoch": 5302} {"train_loss": -26.916004180908203, "global_step": 440118, "epoch": 5302} {"train_loss": -26.9122314453125, "global_step": 440119, "epoch": 5302} {"train_loss": -27.252124786376953, "global_step": 440120, "epoch": 5302} {"train_loss": -27.4591121673584, "global_step": 440121, "epoch": 5302} {"train_loss": -27.283761978149414, "global_step": 440122, "epoch": 5302} {"train_loss": -26.887067794799805, "global_step": 440123, "epoch": 5302} {"train_loss": -27.060089111328125, "global_step": 440124, "epoch": 5302} {"train_loss": -27.387176513671875, "global_step": 440125, "epoch": 5302} {"train_loss": -26.723281860351562, "global_step": 440126, "epoch": 5302} {"train_loss": -26.718658447265625, "global_step": 440127, "epoch": 5302} {"train_loss": -25.790464401245117, "global_step": 440128, "epoch": 5302} {"train_loss": -25.258268356323242, "global_step": 440129, "epoch": 5302} {"train_loss": -26.1339111328125, "global_step": 440130, "epoch": 5302} {"train_loss": -26.7217960357666, "global_step": 440131, "epoch": 5302} {"train_loss": -26.181842803955078, "global_step": 440132, "epoch": 5302} {"train_loss": -26.105234146118164, "global_step": 440133, "epoch": 5302} {"train_loss": -26.16301918029785, "global_step": 440134, "epoch": 5302} {"train_loss": -27.071821212768555, "global_step": 440135, "epoch": 5302} {"train_loss": -26.232574462890625, "global_step": 440136, "epoch": 5302} {"train_loss": -26.393625259399414, "global_step": 440137, "epoch": 5302} {"train_loss": -26.830286026000977, "global_step": 440138, "epoch": 5302} {"train_loss": -26.28875732421875, "global_step": 440139, "epoch": 5302} {"train_loss": -26.62615966796875, "global_step": 440140, "epoch": 5302} {"train_loss": -26.590341567993164, "global_step": 440141, "epoch": 5302} {"train_loss": -26.655736923217773, "global_step": 440142, "epoch": 5302} {"train_loss": -26.846698760986328, "global_step": 440143, "epoch": 5302} {"train_loss": -26.68671989440918, "global_step": 440144, "epoch": 5302} {"train_loss": -26.50445556640625, "global_step": 440145, "epoch": 5302} {"train_loss": -26.68535804748535, "global_step": 440146, "epoch": 5302} {"train_loss": -26.242910385131836, "global_step": 440147, "epoch": 5302} {"train_loss": -26.699456892817853, "global_step": 440148, "epoch": 5302, "val_loss": 6580163.0} {"train_loss": -25.65704917907715, "global_step": 440149, "epoch": 5303} {"train_loss": -26.39203453063965, "global_step": 440150, "epoch": 5303} {"train_loss": -25.954212188720703, "global_step": 440151, "epoch": 5303} {"train_loss": -26.276113510131836, "global_step": 440152, "epoch": 5303} {"train_loss": -26.116561889648438, "global_step": 440153, "epoch": 5303} {"train_loss": -26.350812911987305, "global_step": 440154, "epoch": 5303} {"train_loss": -26.191986083984375, "global_step": 440155, "epoch": 5303} {"train_loss": -26.783721923828125, "global_step": 440156, "epoch": 5303} {"train_loss": -26.438623428344727, "global_step": 440157, "epoch": 5303} {"train_loss": -26.702472686767578, "global_step": 440158, "epoch": 5303} {"train_loss": -26.68387222290039, "global_step": 440159, "epoch": 5303} {"train_loss": -26.37896156311035, "global_step": 440160, "epoch": 5303} {"train_loss": -26.667272567749023, "global_step": 440161, "epoch": 5303} {"train_loss": -26.362075805664062, "global_step": 440162, "epoch": 5303} {"train_loss": -26.7347412109375, "global_step": 440163, "epoch": 5303} {"train_loss": -26.25922966003418, "global_step": 440164, "epoch": 5303} {"train_loss": -26.661237716674805, "global_step": 440165, "epoch": 5303} {"train_loss": -26.537450790405273, "global_step": 440166, "epoch": 5303} {"train_loss": -26.911298751831055, "global_step": 440167, "epoch": 5303} {"train_loss": -26.682138442993164, "global_step": 440168, "epoch": 5303} {"train_loss": -26.731658935546875, "global_step": 440169, "epoch": 5303} {"train_loss": -26.779870986938477, "global_step": 440170, "epoch": 5303} {"train_loss": -26.727197647094727, "global_step": 440171, "epoch": 5303} {"train_loss": -26.74252700805664, "global_step": 440172, "epoch": 5303} {"train_loss": -27.297779083251953, "global_step": 440173, "epoch": 5303} {"train_loss": -27.027978897094727, "global_step": 440174, "epoch": 5303} {"train_loss": -27.02347183227539, "global_step": 440175, "epoch": 5303} {"train_loss": -26.92230224609375, "global_step": 440176, "epoch": 5303} {"train_loss": -26.780099868774414, "global_step": 440177, "epoch": 5303} {"train_loss": -26.849567413330078, "global_step": 440178, "epoch": 5303} {"train_loss": -27.09842872619629, "global_step": 440179, "epoch": 5303} {"train_loss": -26.8164119720459, "global_step": 440180, "epoch": 5303} {"train_loss": -26.849456787109375, "global_step": 440181, "epoch": 5303} {"train_loss": -26.9469051361084, "global_step": 440182, "epoch": 5303} {"train_loss": -27.296491622924805, "global_step": 440183, "epoch": 5303} {"train_loss": -27.2666015625, "global_step": 440184, "epoch": 5303} {"train_loss": -26.803043365478516, "global_step": 440185, "epoch": 5303} {"train_loss": -27.108789443969727, "global_step": 440186, "epoch": 5303} {"train_loss": -27.108625411987305, "global_step": 440187, "epoch": 5303} {"train_loss": -27.076004028320312, "global_step": 440188, "epoch": 5303} {"train_loss": -27.162031173706055, "global_step": 440189, "epoch": 5303} {"train_loss": -26.9471378326416, "global_step": 440190, "epoch": 5303} {"train_loss": -27.169702529907227, "global_step": 440191, "epoch": 5303} {"train_loss": -27.495574951171875, "global_step": 440192, "epoch": 5303} {"train_loss": -26.980260848999023, "global_step": 440193, "epoch": 5303} {"train_loss": -27.021215438842773, "global_step": 440194, "epoch": 5303} {"train_loss": -27.503448486328125, "global_step": 440195, "epoch": 5303} {"train_loss": -26.805164337158203, "global_step": 440196, "epoch": 5303} {"train_loss": -27.043933868408203, "global_step": 440197, "epoch": 5303} {"train_loss": -27.1981201171875, "global_step": 440198, "epoch": 5303} {"train_loss": -27.310266494750977, "global_step": 440199, "epoch": 5303} {"train_loss": -26.864124298095703, "global_step": 440200, "epoch": 5303} {"train_loss": -26.760297775268555, "global_step": 440201, "epoch": 5303} {"train_loss": -26.04766845703125, "global_step": 440202, "epoch": 5303} {"train_loss": -26.05986976623535, "global_step": 440203, "epoch": 5303} {"train_loss": -25.692895889282227, "global_step": 440204, "epoch": 5303} {"train_loss": -25.03875732421875, "global_step": 440205, "epoch": 5303} {"train_loss": -26.486433029174805, "global_step": 440206, "epoch": 5303} {"train_loss": -26.523168563842773, "global_step": 440207, "epoch": 5303} {"train_loss": -26.465869903564453, "global_step": 440208, "epoch": 5303} {"train_loss": -26.3162899017334, "global_step": 440209, "epoch": 5303} {"train_loss": -26.997129440307617, "global_step": 440210, "epoch": 5303} {"train_loss": -26.691450119018555, "global_step": 440211, "epoch": 5303} {"train_loss": -26.67391014099121, "global_step": 440212, "epoch": 5303} {"train_loss": -26.818342208862305, "global_step": 440213, "epoch": 5303} {"train_loss": -26.543975830078125, "global_step": 440214, "epoch": 5303} {"train_loss": -26.7774658203125, "global_step": 440215, "epoch": 5303} {"train_loss": -26.750951766967773, "global_step": 440216, "epoch": 5303} {"train_loss": -26.325153350830078, "global_step": 440217, "epoch": 5303} {"train_loss": -27.028900146484375, "global_step": 440218, "epoch": 5303} {"train_loss": -26.9005184173584, "global_step": 440219, "epoch": 5303} {"train_loss": -26.66578483581543, "global_step": 440220, "epoch": 5303} {"train_loss": -26.711566925048828, "global_step": 440221, "epoch": 5303} {"train_loss": -26.791645050048828, "global_step": 440222, "epoch": 5303} {"train_loss": -27.08975601196289, "global_step": 440223, "epoch": 5303} {"train_loss": -26.78424644470215, "global_step": 440224, "epoch": 5303} {"train_loss": -26.947072982788086, "global_step": 440225, "epoch": 5303} {"train_loss": -27.026559829711914, "global_step": 440226, "epoch": 5303} {"train_loss": -27.322790145874023, "global_step": 440227, "epoch": 5303} {"train_loss": -26.93580436706543, "global_step": 440228, "epoch": 5303} {"train_loss": -27.451099395751953, "global_step": 440229, "epoch": 5303} {"train_loss": -26.797887802124023, "global_step": 440230, "epoch": 5303} {"train_loss": -26.74084238259189, "global_step": 440231, "epoch": 5303, "val_loss": 6602104.0} {"train_loss": -26.048999786376953, "global_step": 440232, "epoch": 5304} {"train_loss": -26.01238441467285, "global_step": 440233, "epoch": 5304} {"train_loss": -26.34746742248535, "global_step": 440234, "epoch": 5304} {"train_loss": -26.469831466674805, "global_step": 440235, "epoch": 5304} {"train_loss": -26.2525634765625, "global_step": 440236, "epoch": 5304} {"train_loss": -26.78841209411621, "global_step": 440237, "epoch": 5304} {"train_loss": -26.410755157470703, "global_step": 440238, "epoch": 5304} {"train_loss": -26.206029891967773, "global_step": 440239, "epoch": 5304} {"train_loss": -26.951181411743164, "global_step": 440240, "epoch": 5304} {"train_loss": -26.56605339050293, "global_step": 440241, "epoch": 5304} {"train_loss": -25.94868278503418, "global_step": 440242, "epoch": 5304} {"train_loss": -26.330738067626953, "global_step": 440243, "epoch": 5304} {"train_loss": -26.349584579467773, "global_step": 440244, "epoch": 5304} {"train_loss": -26.653854370117188, "global_step": 440245, "epoch": 5304} {"train_loss": -26.70529556274414, "global_step": 440246, "epoch": 5304} {"train_loss": -26.875295639038086, "global_step": 440247, "epoch": 5304} {"train_loss": -26.395292282104492, "global_step": 440248, "epoch": 5304} {"train_loss": -26.69406509399414, "global_step": 440249, "epoch": 5304} {"train_loss": -26.53131675720215, "global_step": 440250, "epoch": 5304} {"train_loss": -26.548627853393555, "global_step": 440251, "epoch": 5304} {"train_loss": -26.773046493530273, "global_step": 440252, "epoch": 5304} {"train_loss": -26.464569091796875, "global_step": 440253, "epoch": 5304} {"train_loss": -26.559284210205078, "global_step": 440254, "epoch": 5304} {"train_loss": -26.795398712158203, "global_step": 440255, "epoch": 5304} {"train_loss": -26.96116065979004, "global_step": 440256, "epoch": 5304} {"train_loss": -26.63526725769043, "global_step": 440257, "epoch": 5304} {"train_loss": -26.793493270874023, "global_step": 440258, "epoch": 5304} {"train_loss": -26.856210708618164, "global_step": 440259, "epoch": 5304} {"train_loss": -26.79071044921875, "global_step": 440260, "epoch": 5304} {"train_loss": -27.1109619140625, "global_step": 440261, "epoch": 5304} {"train_loss": -26.87958335876465, "global_step": 440262, "epoch": 5304} {"train_loss": -26.848371505737305, "global_step": 440263, "epoch": 5304} {"train_loss": -26.82808494567871, "global_step": 440264, "epoch": 5304} {"train_loss": -27.303564071655273, "global_step": 440265, "epoch": 5304} {"train_loss": -26.942960739135742, "global_step": 440266, "epoch": 5304} {"train_loss": -27.497785568237305, "global_step": 440267, "epoch": 5304} {"train_loss": -26.93855857849121, "global_step": 440268, "epoch": 5304} {"train_loss": -27.05024528503418, "global_step": 440269, "epoch": 5304} {"train_loss": -27.229597091674805, "global_step": 440270, "epoch": 5304} {"train_loss": -27.03714370727539, "global_step": 440271, "epoch": 5304} {"train_loss": -27.3425235748291, "global_step": 440272, "epoch": 5304} {"train_loss": -26.897855758666992, "global_step": 440273, "epoch": 5304} {"train_loss": -27.36041831970215, "global_step": 440274, "epoch": 5304} {"train_loss": -27.12054443359375, "global_step": 440275, "epoch": 5304} {"train_loss": -27.15382957458496, "global_step": 440276, "epoch": 5304} {"train_loss": -27.193944931030273, "global_step": 440277, "epoch": 5304} {"train_loss": -27.313947677612305, "global_step": 440278, "epoch": 5304} {"train_loss": -26.908203125, "global_step": 440279, "epoch": 5304} {"train_loss": -26.956762313842773, "global_step": 440280, "epoch": 5304} {"train_loss": -27.075376510620117, "global_step": 440281, "epoch": 5304} {"train_loss": -27.034687042236328, "global_step": 440282, "epoch": 5304} {"train_loss": -27.1751766204834, "global_step": 440283, "epoch": 5304} {"train_loss": -27.196792602539062, "global_step": 440284, "epoch": 5304} {"train_loss": -27.103796005249023, "global_step": 440285, "epoch": 5304} {"train_loss": -27.503437042236328, "global_step": 440286, "epoch": 5304} {"train_loss": -26.79707908630371, "global_step": 440287, "epoch": 5304} {"train_loss": -26.766101837158203, "global_step": 440288, "epoch": 5304} {"train_loss": -26.818140029907227, "global_step": 440289, "epoch": 5304} {"train_loss": -26.75861930847168, "global_step": 440290, "epoch": 5304} {"train_loss": -26.993188858032227, "global_step": 440291, "epoch": 5304} {"train_loss": -26.889795303344727, "global_step": 440292, "epoch": 5304} {"train_loss": -27.07979393005371, "global_step": 440293, "epoch": 5304} {"train_loss": -26.734210968017578, "global_step": 440294, "epoch": 5304} {"train_loss": -26.934106826782227, "global_step": 440295, "epoch": 5304} {"train_loss": -27.1513671875, "global_step": 440296, "epoch": 5304} {"train_loss": -26.354333877563477, "global_step": 440297, "epoch": 5304} {"train_loss": -26.301498413085938, "global_step": 440298, "epoch": 5304} {"train_loss": -26.466522216796875, "global_step": 440299, "epoch": 5304} {"train_loss": -26.506444931030273, "global_step": 440300, "epoch": 5304} {"train_loss": -26.502410888671875, "global_step": 440301, "epoch": 5304} {"train_loss": -26.604114532470703, "global_step": 440302, "epoch": 5304} {"train_loss": -26.74981117248535, "global_step": 440303, "epoch": 5304} {"train_loss": -26.821807861328125, "global_step": 440304, "epoch": 5304} {"train_loss": -26.789031982421875, "global_step": 440305, "epoch": 5304} {"train_loss": -27.125837326049805, "global_step": 440306, "epoch": 5304} {"train_loss": -26.957660675048828, "global_step": 440307, "epoch": 5304} {"train_loss": -26.902002334594727, "global_step": 440308, "epoch": 5304} {"train_loss": -27.092451095581055, "global_step": 440309, "epoch": 5304} {"train_loss": -27.15506935119629, "global_step": 440310, "epoch": 5304} {"train_loss": -27.15049171447754, "global_step": 440311, "epoch": 5304} {"train_loss": -26.848896026611328, "global_step": 440312, "epoch": 5304} {"train_loss": -27.158832550048828, "global_step": 440313, "epoch": 5304} {"train_loss": -26.792016753231188, "global_step": 440314, "epoch": 5304, "val_loss": 6551301.0} {"train_loss": -26.2034854888916, "global_step": 440315, "epoch": 5305} {"train_loss": -26.212589263916016, "global_step": 440316, "epoch": 5305} {"train_loss": -26.118619918823242, "global_step": 440317, "epoch": 5305} {"train_loss": -26.446277618408203, "global_step": 440318, "epoch": 5305} {"train_loss": -25.85394287109375, "global_step": 440319, "epoch": 5305} {"train_loss": -27.05787467956543, "global_step": 440320, "epoch": 5305} {"train_loss": -26.5805606842041, "global_step": 440321, "epoch": 5305} {"train_loss": -26.353275299072266, "global_step": 440322, "epoch": 5305} {"train_loss": -27.066299438476562, "global_step": 440323, "epoch": 5305} {"train_loss": -26.354267120361328, "global_step": 440324, "epoch": 5305} {"train_loss": -26.812414169311523, "global_step": 440325, "epoch": 5305} {"train_loss": -26.7056941986084, "global_step": 440326, "epoch": 5305} {"train_loss": -26.756628036499023, "global_step": 440327, "epoch": 5305} {"train_loss": -26.520910263061523, "global_step": 440328, "epoch": 5305} {"train_loss": -26.75129508972168, "global_step": 440329, "epoch": 5305} {"train_loss": -26.609827041625977, "global_step": 440330, "epoch": 5305} {"train_loss": -26.90553092956543, "global_step": 440331, "epoch": 5305} {"train_loss": -26.878894805908203, "global_step": 440332, "epoch": 5305} {"train_loss": -27.137344360351562, "global_step": 440333, "epoch": 5305} {"train_loss": -26.726415634155273, "global_step": 440334, "epoch": 5305} {"train_loss": -26.73640251159668, "global_step": 440335, "epoch": 5305} {"train_loss": -26.8232479095459, "global_step": 440336, "epoch": 5305} {"train_loss": -27.243452072143555, "global_step": 440337, "epoch": 5305} {"train_loss": -26.86496353149414, "global_step": 440338, "epoch": 5305} {"train_loss": -27.249902725219727, "global_step": 440339, "epoch": 5305} {"train_loss": -26.84844970703125, "global_step": 440340, "epoch": 5305} {"train_loss": -27.33680534362793, "global_step": 440341, "epoch": 5305} {"train_loss": -27.25374412536621, "global_step": 440342, "epoch": 5305} {"train_loss": -27.0776424407959, "global_step": 440343, "epoch": 5305} {"train_loss": -26.814664840698242, "global_step": 440344, "epoch": 5305} {"train_loss": -27.37470817565918, "global_step": 440345, "epoch": 5305} {"train_loss": -26.836505889892578, "global_step": 440346, "epoch": 5305} {"train_loss": -27.319238662719727, "global_step": 440347, "epoch": 5305} {"train_loss": -27.347244262695312, "global_step": 440348, "epoch": 5305} {"train_loss": -27.170486450195312, "global_step": 440349, "epoch": 5305} {"train_loss": -26.937244415283203, "global_step": 440350, "epoch": 5305} {"train_loss": -27.03045082092285, "global_step": 440351, "epoch": 5305} {"train_loss": -27.19318199157715, "global_step": 440352, "epoch": 5305} {"train_loss": -27.017858505249023, "global_step": 440353, "epoch": 5305} {"train_loss": -26.504072189331055, "global_step": 440354, "epoch": 5305} {"train_loss": -27.32306480407715, "global_step": 440355, "epoch": 5305} {"train_loss": -27.077844619750977, "global_step": 440356, "epoch": 5305} {"train_loss": -26.70383644104004, "global_step": 440357, "epoch": 5305} {"train_loss": -27.214941024780273, "global_step": 440358, "epoch": 5305} {"train_loss": -26.929615020751953, "global_step": 440359, "epoch": 5305} {"train_loss": -26.909101486206055, "global_step": 440360, "epoch": 5305} {"train_loss": -27.034921646118164, "global_step": 440361, "epoch": 5305} {"train_loss": -26.94428062438965, "global_step": 440362, "epoch": 5305} {"train_loss": -26.670917510986328, "global_step": 440363, "epoch": 5305} {"train_loss": -26.61020851135254, "global_step": 440364, "epoch": 5305} {"train_loss": -26.905933380126953, "global_step": 440365, "epoch": 5305} {"train_loss": -26.7281494140625, "global_step": 440366, "epoch": 5305} {"train_loss": -26.949552536010742, "global_step": 440367, "epoch": 5305} {"train_loss": -26.875980377197266, "global_step": 440368, "epoch": 5305} {"train_loss": -26.904052734375, "global_step": 440369, "epoch": 5305} {"train_loss": -26.641096115112305, "global_step": 440370, "epoch": 5305} {"train_loss": -26.92400550842285, "global_step": 440371, "epoch": 5305} {"train_loss": -26.818500518798828, "global_step": 440372, "epoch": 5305} {"train_loss": -26.75617027282715, "global_step": 440373, "epoch": 5305} {"train_loss": -26.500879287719727, "global_step": 440374, "epoch": 5305} {"train_loss": -26.892736434936523, "global_step": 440375, "epoch": 5305} {"train_loss": -26.553247451782227, "global_step": 440376, "epoch": 5305} {"train_loss": -27.23689842224121, "global_step": 440377, "epoch": 5305} {"train_loss": -27.07929039001465, "global_step": 440378, "epoch": 5305} {"train_loss": -26.40342140197754, "global_step": 440379, "epoch": 5305} {"train_loss": -26.815631866455078, "global_step": 440380, "epoch": 5305} {"train_loss": -26.805423736572266, "global_step": 440381, "epoch": 5305} {"train_loss": -26.660724639892578, "global_step": 440382, "epoch": 5305} {"train_loss": -26.840682983398438, "global_step": 440383, "epoch": 5305} {"train_loss": -27.079437255859375, "global_step": 440384, "epoch": 5305} {"train_loss": -26.603992462158203, "global_step": 440385, "epoch": 5305} {"train_loss": -27.25299072265625, "global_step": 440386, "epoch": 5305} {"train_loss": -26.899311065673828, "global_step": 440387, "epoch": 5305} {"train_loss": -26.709909439086914, "global_step": 440388, "epoch": 5305} {"train_loss": -26.513425827026367, "global_step": 440389, "epoch": 5305} {"train_loss": -27.028059005737305, "global_step": 440390, "epoch": 5305} {"train_loss": -26.808032989501953, "global_step": 440391, "epoch": 5305} {"train_loss": -26.61240577697754, "global_step": 440392, "epoch": 5305} {"train_loss": -26.925811767578125, "global_step": 440393, "epoch": 5305} {"train_loss": -26.7713565826416, "global_step": 440394, "epoch": 5305} {"train_loss": -26.87457847595215, "global_step": 440395, "epoch": 5305} {"train_loss": -26.783864974975586, "global_step": 440396, "epoch": 5305} {"train_loss": -26.844461762761494, "global_step": 440397, "epoch": 5305, "val_loss": 6627153.5} {"train_loss": -26.478357315063477, "global_step": 440398, "epoch": 5306} {"train_loss": -26.777109146118164, "global_step": 440399, "epoch": 5306} {"train_loss": -26.55975914001465, "global_step": 440400, "epoch": 5306} {"train_loss": -26.692174911499023, "global_step": 440401, "epoch": 5306} {"train_loss": -26.63593864440918, "global_step": 440402, "epoch": 5306} {"train_loss": -26.7091121673584, "global_step": 440403, "epoch": 5306} {"train_loss": -26.851659774780273, "global_step": 440404, "epoch": 5306} {"train_loss": -27.009763717651367, "global_step": 440405, "epoch": 5306} {"train_loss": -26.61270523071289, "global_step": 440406, "epoch": 5306} {"train_loss": -26.78986167907715, "global_step": 440407, "epoch": 5306} {"train_loss": -26.705835342407227, "global_step": 440408, "epoch": 5306} {"train_loss": -26.780492782592773, "global_step": 440409, "epoch": 5306} {"train_loss": -26.97021484375, "global_step": 440410, "epoch": 5306} {"train_loss": -27.308149337768555, "global_step": 440411, "epoch": 5306} {"train_loss": -26.70611572265625, "global_step": 440412, "epoch": 5306} {"train_loss": -26.41293716430664, "global_step": 440413, "epoch": 5306} {"train_loss": -26.61299705505371, "global_step": 440414, "epoch": 5306} {"train_loss": -26.6787052154541, "global_step": 440415, "epoch": 5306} {"train_loss": -27.430374145507812, "global_step": 440416, "epoch": 5306} {"train_loss": -26.47246742248535, "global_step": 440417, "epoch": 5306} {"train_loss": -26.64179801940918, "global_step": 440418, "epoch": 5306} {"train_loss": -26.785303115844727, "global_step": 440419, "epoch": 5306} {"train_loss": -26.97080421447754, "global_step": 440420, "epoch": 5306} {"train_loss": -27.077680587768555, "global_step": 440421, "epoch": 5306} {"train_loss": -26.696868896484375, "global_step": 440422, "epoch": 5306} {"train_loss": -27.026227951049805, "global_step": 440423, "epoch": 5306} {"train_loss": -26.91303062438965, "global_step": 440424, "epoch": 5306} {"train_loss": -26.7702693939209, "global_step": 440425, "epoch": 5306} {"train_loss": -26.969837188720703, "global_step": 440426, "epoch": 5306} {"train_loss": -26.810413360595703, "global_step": 440427, "epoch": 5306} {"train_loss": -27.067230224609375, "global_step": 440428, "epoch": 5306} {"train_loss": -27.193927764892578, "global_step": 440429, "epoch": 5306} {"train_loss": -27.090478897094727, "global_step": 440430, "epoch": 5306} {"train_loss": -26.924108505249023, "global_step": 440431, "epoch": 5306} {"train_loss": -26.837284088134766, "global_step": 440432, "epoch": 5306} {"train_loss": -26.705631256103516, "global_step": 440433, "epoch": 5306} {"train_loss": -26.82733154296875, "global_step": 440434, "epoch": 5306} {"train_loss": -27.180744171142578, "global_step": 440435, "epoch": 5306} {"train_loss": -27.10467529296875, "global_step": 440436, "epoch": 5306} {"train_loss": -27.121793746948242, "global_step": 440437, "epoch": 5306} {"train_loss": -27.253080368041992, "global_step": 440438, "epoch": 5306} {"train_loss": -27.138158798217773, "global_step": 440439, "epoch": 5306} {"train_loss": -26.78754234313965, "global_step": 440440, "epoch": 5306} {"train_loss": -26.740514755249023, "global_step": 440441, "epoch": 5306} {"train_loss": -27.088733673095703, "global_step": 440442, "epoch": 5306} {"train_loss": -27.237409591674805, "global_step": 440443, "epoch": 5306} {"train_loss": -27.175642013549805, "global_step": 440444, "epoch": 5306} {"train_loss": -27.277484893798828, "global_step": 440445, "epoch": 5306} {"train_loss": -27.39298439025879, "global_step": 440446, "epoch": 5306} {"train_loss": -26.8796443939209, "global_step": 440447, "epoch": 5306} {"train_loss": -27.3704833984375, "global_step": 440448, "epoch": 5306} {"train_loss": -27.051162719726562, "global_step": 440449, "epoch": 5306} {"train_loss": -26.98162269592285, "global_step": 440450, "epoch": 5306} {"train_loss": -27.158613204956055, "global_step": 440451, "epoch": 5306} {"train_loss": -27.133764266967773, "global_step": 440452, "epoch": 5306} {"train_loss": -26.769067764282227, "global_step": 440453, "epoch": 5306} {"train_loss": -27.365453720092773, "global_step": 440454, "epoch": 5306} {"train_loss": -27.050735473632812, "global_step": 440455, "epoch": 5306} {"train_loss": -27.18207359313965, "global_step": 440456, "epoch": 5306} {"train_loss": -27.18792724609375, "global_step": 440457, "epoch": 5306} {"train_loss": -27.160959243774414, "global_step": 440458, "epoch": 5306} {"train_loss": -26.992441177368164, "global_step": 440459, "epoch": 5306} {"train_loss": -27.121679306030273, "global_step": 440460, "epoch": 5306} {"train_loss": -26.872156143188477, "global_step": 440461, "epoch": 5306} {"train_loss": -26.791486740112305, "global_step": 440462, "epoch": 5306} {"train_loss": -26.654052734375, "global_step": 440463, "epoch": 5306} {"train_loss": -26.69447898864746, "global_step": 440464, "epoch": 5306} {"train_loss": -26.954858779907227, "global_step": 440465, "epoch": 5306} {"train_loss": -27.11273193359375, "global_step": 440466, "epoch": 5306} {"train_loss": -27.16568374633789, "global_step": 440467, "epoch": 5306} {"train_loss": -26.808216094970703, "global_step": 440468, "epoch": 5306} {"train_loss": -27.07447624206543, "global_step": 440469, "epoch": 5306} {"train_loss": -27.071643829345703, "global_step": 440470, "epoch": 5306} {"train_loss": -26.691503524780273, "global_step": 440471, "epoch": 5306} {"train_loss": -26.617511749267578, "global_step": 440472, "epoch": 5306} {"train_loss": -26.98292350769043, "global_step": 440473, "epoch": 5306} {"train_loss": -26.900405883789062, "global_step": 440474, "epoch": 5306} {"train_loss": -26.981781005859375, "global_step": 440475, "epoch": 5306} {"train_loss": -26.778308868408203, "global_step": 440476, "epoch": 5306} {"train_loss": -26.807239532470703, "global_step": 440477, "epoch": 5306} {"train_loss": -25.71084976196289, "global_step": 440478, "epoch": 5306} {"train_loss": -25.67888832092285, "global_step": 440479, "epoch": 5306} {"train_loss": -26.88101056110428, "global_step": 440480, "epoch": 5306, "val_loss": 6513697.0} {"train_loss": -25.600982666015625, "global_step": 440481, "epoch": 5307} {"train_loss": -24.484718322753906, "global_step": 440482, "epoch": 5307} {"train_loss": -25.163291931152344, "global_step": 440483, "epoch": 5307} {"train_loss": -25.352575302124023, "global_step": 440484, "epoch": 5307} {"train_loss": -25.432165145874023, "global_step": 440485, "epoch": 5307} {"train_loss": -25.303380966186523, "global_step": 440486, "epoch": 5307} {"train_loss": -25.451269149780273, "global_step": 440487, "epoch": 5307} {"train_loss": -25.38836669921875, "global_step": 440488, "epoch": 5307} {"train_loss": -25.476444244384766, "global_step": 440489, "epoch": 5307} {"train_loss": -25.730878829956055, "global_step": 440490, "epoch": 5307} {"train_loss": -26.07513427734375, "global_step": 440491, "epoch": 5307} {"train_loss": -26.134546279907227, "global_step": 440492, "epoch": 5307} {"train_loss": -25.14810562133789, "global_step": 440493, "epoch": 5307} {"train_loss": -26.1621036529541, "global_step": 440494, "epoch": 5307} {"train_loss": -25.63040542602539, "global_step": 440495, "epoch": 5307} {"train_loss": -26.16303825378418, "global_step": 440496, "epoch": 5307} {"train_loss": -26.215118408203125, "global_step": 440497, "epoch": 5307} {"train_loss": -26.256093978881836, "global_step": 440498, "epoch": 5307} {"train_loss": -26.5380916595459, "global_step": 440499, "epoch": 5307} {"train_loss": -26.445470809936523, "global_step": 440500, "epoch": 5307} {"train_loss": -26.00776481628418, "global_step": 440501, "epoch": 5307} {"train_loss": -26.67791748046875, "global_step": 440502, "epoch": 5307} {"train_loss": -25.97776222229004, "global_step": 440503, "epoch": 5307} {"train_loss": -26.349267959594727, "global_step": 440504, "epoch": 5307} {"train_loss": -26.344696044921875, "global_step": 440505, "epoch": 5307} {"train_loss": -26.1993408203125, "global_step": 440506, "epoch": 5307} {"train_loss": -26.67957878112793, "global_step": 440507, "epoch": 5307} {"train_loss": -26.71150016784668, "global_step": 440508, "epoch": 5307} {"train_loss": -26.655445098876953, "global_step": 440509, "epoch": 5307} {"train_loss": -26.3979549407959, "global_step": 440510, "epoch": 5307} {"train_loss": -26.38051414489746, "global_step": 440511, "epoch": 5307} {"train_loss": -26.76338768005371, "global_step": 440512, "epoch": 5307} {"train_loss": -26.588850021362305, "global_step": 440513, "epoch": 5307} {"train_loss": -26.806039810180664, "global_step": 440514, "epoch": 5307} {"train_loss": -26.7817440032959, "global_step": 440515, "epoch": 5307} {"train_loss": -26.8088321685791, "global_step": 440516, "epoch": 5307} {"train_loss": -26.546585083007812, "global_step": 440517, "epoch": 5307} {"train_loss": -26.77752685546875, "global_step": 440518, "epoch": 5307} {"train_loss": -27.158645629882812, "global_step": 440519, "epoch": 5307} {"train_loss": -26.615589141845703, "global_step": 440520, "epoch": 5307} {"train_loss": -27.165632247924805, "global_step": 440521, "epoch": 5307} {"train_loss": -27.154523849487305, "global_step": 440522, "epoch": 5307} {"train_loss": -26.958181381225586, "global_step": 440523, "epoch": 5307} {"train_loss": -27.011920928955078, "global_step": 440524, "epoch": 5307} {"train_loss": -27.182458877563477, "global_step": 440525, "epoch": 5307} {"train_loss": -27.0537109375, "global_step": 440526, "epoch": 5307} {"train_loss": -27.007551193237305, "global_step": 440527, "epoch": 5307} {"train_loss": -26.974409103393555, "global_step": 440528, "epoch": 5307} {"train_loss": -26.91987419128418, "global_step": 440529, "epoch": 5307} {"train_loss": -27.4488468170166, "global_step": 440530, "epoch": 5307} {"train_loss": -27.21941566467285, "global_step": 440531, "epoch": 5307} {"train_loss": -27.232257843017578, "global_step": 440532, "epoch": 5307} {"train_loss": -27.077234268188477, "global_step": 440533, "epoch": 5307} {"train_loss": -27.28057861328125, "global_step": 440534, "epoch": 5307} {"train_loss": -27.469406127929688, "global_step": 440535, "epoch": 5307} {"train_loss": -27.40424919128418, "global_step": 440536, "epoch": 5307} {"train_loss": -27.139652252197266, "global_step": 440537, "epoch": 5307} {"train_loss": -27.254003524780273, "global_step": 440538, "epoch": 5307} {"train_loss": -27.407697677612305, "global_step": 440539, "epoch": 5307} {"train_loss": -27.016265869140625, "global_step": 440540, "epoch": 5307} {"train_loss": -27.050718307495117, "global_step": 440541, "epoch": 5307} {"train_loss": -26.65606689453125, "global_step": 440542, "epoch": 5307} {"train_loss": -26.739887237548828, "global_step": 440543, "epoch": 5307} {"train_loss": -27.006275177001953, "global_step": 440544, "epoch": 5307} {"train_loss": -27.368301391601562, "global_step": 440545, "epoch": 5307} {"train_loss": -27.27747917175293, "global_step": 440546, "epoch": 5307} {"train_loss": -27.546812057495117, "global_step": 440547, "epoch": 5307} {"train_loss": -27.192716598510742, "global_step": 440548, "epoch": 5307} {"train_loss": -27.253223419189453, "global_step": 440549, "epoch": 5307} {"train_loss": -27.295263290405273, "global_step": 440550, "epoch": 5307} {"train_loss": -26.9735107421875, "global_step": 440551, "epoch": 5307} {"train_loss": -26.6207218170166, "global_step": 440552, "epoch": 5307} {"train_loss": -26.918607711791992, "global_step": 440553, "epoch": 5307} {"train_loss": -26.98431396484375, "global_step": 440554, "epoch": 5307} {"train_loss": -27.106891632080078, "global_step": 440555, "epoch": 5307} {"train_loss": -26.945281982421875, "global_step": 440556, "epoch": 5307} {"train_loss": -27.161062240600586, "global_step": 440557, "epoch": 5307} {"train_loss": -26.94300651550293, "global_step": 440558, "epoch": 5307} {"train_loss": -26.920196533203125, "global_step": 440559, "epoch": 5307} {"train_loss": -27.198835372924805, "global_step": 440560, "epoch": 5307} {"train_loss": -26.541257858276367, "global_step": 440561, "epoch": 5307} {"train_loss": -27.084461212158203, "global_step": 440562, "epoch": 5307} {"train_loss": -26.64300640519843, "global_step": 440563, "epoch": 5307, "val_loss": 6615725.0} {"train_loss": -26.672271728515625, "global_step": 440564, "epoch": 5308} {"train_loss": -26.811986923217773, "global_step": 440565, "epoch": 5308} {"train_loss": -26.253406524658203, "global_step": 440566, "epoch": 5308} {"train_loss": -26.513248443603516, "global_step": 440567, "epoch": 5308} {"train_loss": -26.506683349609375, "global_step": 440568, "epoch": 5308} {"train_loss": -26.57317543029785, "global_step": 440569, "epoch": 5308} {"train_loss": -26.8458251953125, "global_step": 440570, "epoch": 5308} {"train_loss": -26.527990341186523, "global_step": 440571, "epoch": 5308} {"train_loss": -26.73872184753418, "global_step": 440572, "epoch": 5308} {"train_loss": -26.964481353759766, "global_step": 440573, "epoch": 5308} {"train_loss": -27.103321075439453, "global_step": 440574, "epoch": 5308} {"train_loss": -27.095947265625, "global_step": 440575, "epoch": 5308} {"train_loss": -27.14375114440918, "global_step": 440576, "epoch": 5308} {"train_loss": -26.870512008666992, "global_step": 440577, "epoch": 5308} {"train_loss": -27.07242774963379, "global_step": 440578, "epoch": 5308} {"train_loss": -26.790143966674805, "global_step": 440579, "epoch": 5308} {"train_loss": -26.933837890625, "global_step": 440580, "epoch": 5308} {"train_loss": -27.132001876831055, "global_step": 440581, "epoch": 5308} {"train_loss": -26.85210609436035, "global_step": 440582, "epoch": 5308} {"train_loss": -27.053918838500977, "global_step": 440583, "epoch": 5308} {"train_loss": -26.897632598876953, "global_step": 440584, "epoch": 5308} {"train_loss": -27.0397891998291, "global_step": 440585, "epoch": 5308} {"train_loss": -26.61105728149414, "global_step": 440586, "epoch": 5308} {"train_loss": -26.991857528686523, "global_step": 440587, "epoch": 5308} {"train_loss": -27.159809112548828, "global_step": 440588, "epoch": 5308} {"train_loss": -27.363727569580078, "global_step": 440589, "epoch": 5308} {"train_loss": -26.940351486206055, "global_step": 440590, "epoch": 5308} {"train_loss": -27.0510311126709, "global_step": 440591, "epoch": 5308} {"train_loss": -26.986413955688477, "global_step": 440592, "epoch": 5308} {"train_loss": -27.20545768737793, "global_step": 440593, "epoch": 5308} {"train_loss": -27.039520263671875, "global_step": 440594, "epoch": 5308} {"train_loss": -26.84834861755371, "global_step": 440595, "epoch": 5308} {"train_loss": -26.983179092407227, "global_step": 440596, "epoch": 5308} {"train_loss": -27.098752975463867, "global_step": 440597, "epoch": 5308} {"train_loss": -26.9420223236084, "global_step": 440598, "epoch": 5308} {"train_loss": -27.146535873413086, "global_step": 440599, "epoch": 5308} {"train_loss": -26.80218505859375, "global_step": 440600, "epoch": 5308} {"train_loss": -27.134235382080078, "global_step": 440601, "epoch": 5308} {"train_loss": -27.385501861572266, "global_step": 440602, "epoch": 5308} {"train_loss": -26.887720108032227, "global_step": 440603, "epoch": 5308} {"train_loss": -27.344385147094727, "global_step": 440604, "epoch": 5308} {"train_loss": -27.363412857055664, "global_step": 440605, "epoch": 5308} {"train_loss": -27.0836124420166, "global_step": 440606, "epoch": 5308} {"train_loss": -27.52564811706543, "global_step": 440607, "epoch": 5308} {"train_loss": -27.408843994140625, "global_step": 440608, "epoch": 5308} {"train_loss": -27.190082550048828, "global_step": 440609, "epoch": 5308} {"train_loss": -26.955493927001953, "global_step": 440610, "epoch": 5308} {"train_loss": -26.450708389282227, "global_step": 440611, "epoch": 5308} {"train_loss": -26.273523330688477, "global_step": 440612, "epoch": 5308} {"train_loss": -26.11903190612793, "global_step": 440613, "epoch": 5308} {"train_loss": -25.291433334350586, "global_step": 440614, "epoch": 5308} {"train_loss": -24.753883361816406, "global_step": 440615, "epoch": 5308} {"train_loss": -25.6466121673584, "global_step": 440616, "epoch": 5308} {"train_loss": -25.288602828979492, "global_step": 440617, "epoch": 5308} {"train_loss": -25.564550399780273, "global_step": 440618, "epoch": 5308} {"train_loss": -26.000661849975586, "global_step": 440619, "epoch": 5308} {"train_loss": -26.138885498046875, "global_step": 440620, "epoch": 5308} {"train_loss": -26.07642936706543, "global_step": 440621, "epoch": 5308} {"train_loss": -26.237157821655273, "global_step": 440622, "epoch": 5308} {"train_loss": -25.988142013549805, "global_step": 440623, "epoch": 5308} {"train_loss": -26.2611083984375, "global_step": 440624, "epoch": 5308} {"train_loss": -26.286563873291016, "global_step": 440625, "epoch": 5308} {"train_loss": -26.672473907470703, "global_step": 440626, "epoch": 5308} {"train_loss": -26.691486358642578, "global_step": 440627, "epoch": 5308} {"train_loss": -26.1031436920166, "global_step": 440628, "epoch": 5308} {"train_loss": -26.85223388671875, "global_step": 440629, "epoch": 5308} {"train_loss": -26.49249839782715, "global_step": 440630, "epoch": 5308} {"train_loss": -26.767240524291992, "global_step": 440631, "epoch": 5308} {"train_loss": -26.701278686523438, "global_step": 440632, "epoch": 5308} {"train_loss": -26.530725479125977, "global_step": 440633, "epoch": 5308} {"train_loss": -26.795957565307617, "global_step": 440634, "epoch": 5308} {"train_loss": -26.74842643737793, "global_step": 440635, "epoch": 5308} {"train_loss": -26.659698486328125, "global_step": 440636, "epoch": 5308} {"train_loss": -26.407629013061523, "global_step": 440637, "epoch": 5308} {"train_loss": -27.075773239135742, "global_step": 440638, "epoch": 5308} {"train_loss": -26.945371627807617, "global_step": 440639, "epoch": 5308} {"train_loss": -26.677831649780273, "global_step": 440640, "epoch": 5308} {"train_loss": -26.67215919494629, "global_step": 440641, "epoch": 5308} {"train_loss": -26.8531494140625, "global_step": 440642, "epoch": 5308} {"train_loss": -26.80318260192871, "global_step": 440643, "epoch": 5308} {"train_loss": -27.022125244140625, "global_step": 440644, "epoch": 5308} {"train_loss": -26.862838745117188, "global_step": 440645, "epoch": 5308} {"train_loss": -26.73851203918457, "global_step": 440646, "epoch": 5308, "val_loss": 6664393.0} {"train_loss": -26.396665573120117, "global_step": 440647, "epoch": 5309} {"train_loss": -26.196435928344727, "global_step": 440648, "epoch": 5309} {"train_loss": -26.39959716796875, "global_step": 440649, "epoch": 5309} {"train_loss": -25.992834091186523, "global_step": 440650, "epoch": 5309} {"train_loss": -26.573394775390625, "global_step": 440651, "epoch": 5309} {"train_loss": -26.1392822265625, "global_step": 440652, "epoch": 5309} {"train_loss": -25.619674682617188, "global_step": 440653, "epoch": 5309} {"train_loss": -26.52349281311035, "global_step": 440654, "epoch": 5309} {"train_loss": -26.277387619018555, "global_step": 440655, "epoch": 5309} {"train_loss": -25.879932403564453, "global_step": 440656, "epoch": 5309} {"train_loss": -26.526647567749023, "global_step": 440657, "epoch": 5309} {"train_loss": -26.7359619140625, "global_step": 440658, "epoch": 5309} {"train_loss": -26.37400245666504, "global_step": 440659, "epoch": 5309} {"train_loss": -26.731067657470703, "global_step": 440660, "epoch": 5309} {"train_loss": -26.37946128845215, "global_step": 440661, "epoch": 5309} {"train_loss": -26.650470733642578, "global_step": 440662, "epoch": 5309} {"train_loss": -26.663816452026367, "global_step": 440663, "epoch": 5309} {"train_loss": -26.665592193603516, "global_step": 440664, "epoch": 5309} {"train_loss": -26.84765625, "global_step": 440665, "epoch": 5309} {"train_loss": -26.7696590423584, "global_step": 440666, "epoch": 5309} {"train_loss": -26.900419235229492, "global_step": 440667, "epoch": 5309} {"train_loss": -26.848678588867188, "global_step": 440668, "epoch": 5309} {"train_loss": -26.969770431518555, "global_step": 440669, "epoch": 5309} {"train_loss": -26.839757919311523, "global_step": 440670, "epoch": 5309} {"train_loss": -26.537677764892578, "global_step": 440671, "epoch": 5309} {"train_loss": -27.065900802612305, "global_step": 440672, "epoch": 5309} {"train_loss": -26.515533447265625, "global_step": 440673, "epoch": 5309} {"train_loss": -26.76590347290039, "global_step": 440674, "epoch": 5309} {"train_loss": -26.986257553100586, "global_step": 440675, "epoch": 5309} {"train_loss": -26.93922233581543, "global_step": 440676, "epoch": 5309} {"train_loss": -26.7996883392334, "global_step": 440677, "epoch": 5309} {"train_loss": -26.866180419921875, "global_step": 440678, "epoch": 5309} {"train_loss": -26.730941772460938, "global_step": 440679, "epoch": 5309} {"train_loss": -27.131011962890625, "global_step": 440680, "epoch": 5309} {"train_loss": -27.012983322143555, "global_step": 440681, "epoch": 5309} {"train_loss": -26.977188110351562, "global_step": 440682, "epoch": 5309} {"train_loss": -27.22088623046875, "global_step": 440683, "epoch": 5309} {"train_loss": -26.931537628173828, "global_step": 440684, "epoch": 5309} {"train_loss": -26.804357528686523, "global_step": 440685, "epoch": 5309} {"train_loss": -27.220327377319336, "global_step": 440686, "epoch": 5309} {"train_loss": -26.94611930847168, "global_step": 440687, "epoch": 5309} {"train_loss": -27.0001220703125, "global_step": 440688, "epoch": 5309} {"train_loss": -27.149343490600586, "global_step": 440689, "epoch": 5309} {"train_loss": -27.244693756103516, "global_step": 440690, "epoch": 5309} {"train_loss": -27.348468780517578, "global_step": 440691, "epoch": 5309} {"train_loss": -26.836750030517578, "global_step": 440692, "epoch": 5309} {"train_loss": -27.361547470092773, "global_step": 440693, "epoch": 5309} {"train_loss": -26.902423858642578, "global_step": 440694, "epoch": 5309} {"train_loss": -26.95174217224121, "global_step": 440695, "epoch": 5309} {"train_loss": -27.251752853393555, "global_step": 440696, "epoch": 5309} {"train_loss": -27.182973861694336, "global_step": 440697, "epoch": 5309} {"train_loss": -27.1381893157959, "global_step": 440698, "epoch": 5309} {"train_loss": -27.028064727783203, "global_step": 440699, "epoch": 5309} {"train_loss": -26.834447860717773, "global_step": 440700, "epoch": 5309} {"train_loss": -27.05665397644043, "global_step": 440701, "epoch": 5309} {"train_loss": -26.937971115112305, "global_step": 440702, "epoch": 5309} {"train_loss": -26.908472061157227, "global_step": 440703, "epoch": 5309} {"train_loss": -26.385709762573242, "global_step": 440704, "epoch": 5309} {"train_loss": -26.202497482299805, "global_step": 440705, "epoch": 5309} {"train_loss": -26.749780654907227, "global_step": 440706, "epoch": 5309} {"train_loss": -27.091999053955078, "global_step": 440707, "epoch": 5309} {"train_loss": -26.911151885986328, "global_step": 440708, "epoch": 5309} {"train_loss": -27.13037109375, "global_step": 440709, "epoch": 5309} {"train_loss": -26.73235511779785, "global_step": 440710, "epoch": 5309} {"train_loss": -26.739185333251953, "global_step": 440711, "epoch": 5309} {"train_loss": -26.615131378173828, "global_step": 440712, "epoch": 5309} {"train_loss": -26.994873046875, "global_step": 440713, "epoch": 5309} {"train_loss": -26.65504264831543, "global_step": 440714, "epoch": 5309} {"train_loss": -27.0942325592041, "global_step": 440715, "epoch": 5309} {"train_loss": -26.764129638671875, "global_step": 440716, "epoch": 5309} {"train_loss": -27.00678825378418, "global_step": 440717, "epoch": 5309} {"train_loss": -27.00190544128418, "global_step": 440718, "epoch": 5309} {"train_loss": -26.960941314697266, "global_step": 440719, "epoch": 5309} {"train_loss": -27.238269805908203, "global_step": 440720, "epoch": 5309} {"train_loss": -26.71636390686035, "global_step": 440721, "epoch": 5309} {"train_loss": -27.046361923217773, "global_step": 440722, "epoch": 5309} {"train_loss": -26.850061416625977, "global_step": 440723, "epoch": 5309} {"train_loss": -27.146595001220703, "global_step": 440724, "epoch": 5309} {"train_loss": -27.073989868164062, "global_step": 440725, "epoch": 5309} {"train_loss": -26.836523056030273, "global_step": 440726, "epoch": 5309} {"train_loss": -27.218494415283203, "global_step": 440727, "epoch": 5309} {"train_loss": -26.79914665222168, "global_step": 440728, "epoch": 5309} {"train_loss": -26.805105508091938, "global_step": 440729, "epoch": 5309, "val_loss": 6652191.5} {"train_loss": -26.642608642578125, "global_step": 440730, "epoch": 5310} {"train_loss": -27.174341201782227, "global_step": 440731, "epoch": 5310} {"train_loss": -26.914968490600586, "global_step": 440732, "epoch": 5310} {"train_loss": -26.75271987915039, "global_step": 440733, "epoch": 5310} {"train_loss": -26.59547233581543, "global_step": 440734, "epoch": 5310} {"train_loss": -26.626916885375977, "global_step": 440735, "epoch": 5310} {"train_loss": -26.817041397094727, "global_step": 440736, "epoch": 5310} {"train_loss": -26.693395614624023, "global_step": 440737, "epoch": 5310} {"train_loss": -26.74675941467285, "global_step": 440738, "epoch": 5310} {"train_loss": -27.244277954101562, "global_step": 440739, "epoch": 5310} {"train_loss": -26.74714469909668, "global_step": 440740, "epoch": 5310} {"train_loss": -26.897903442382812, "global_step": 440741, "epoch": 5310} {"train_loss": -26.9395809173584, "global_step": 440742, "epoch": 5310} {"train_loss": -26.875818252563477, "global_step": 440743, "epoch": 5310} {"train_loss": -27.039077758789062, "global_step": 440744, "epoch": 5310} {"train_loss": -27.027313232421875, "global_step": 440745, "epoch": 5310} {"train_loss": -26.616180419921875, "global_step": 440746, "epoch": 5310} {"train_loss": -27.245773315429688, "global_step": 440747, "epoch": 5310} {"train_loss": -27.167621612548828, "global_step": 440748, "epoch": 5310} {"train_loss": -26.961557388305664, "global_step": 440749, "epoch": 5310} {"train_loss": -27.088098526000977, "global_step": 440750, "epoch": 5310} {"train_loss": -26.912784576416016, "global_step": 440751, "epoch": 5310} {"train_loss": -27.301252365112305, "global_step": 440752, "epoch": 5310} {"train_loss": -27.210859298706055, "global_step": 440753, "epoch": 5310} {"train_loss": -26.743820190429688, "global_step": 440754, "epoch": 5310} {"train_loss": -26.88091468811035, "global_step": 440755, "epoch": 5310} {"train_loss": -27.101394653320312, "global_step": 440756, "epoch": 5310} {"train_loss": -27.10438346862793, "global_step": 440757, "epoch": 5310} {"train_loss": -27.342548370361328, "global_step": 440758, "epoch": 5310} {"train_loss": -27.269245147705078, "global_step": 440759, "epoch": 5310} {"train_loss": -27.211929321289062, "global_step": 440760, "epoch": 5310} {"train_loss": -27.05087661743164, "global_step": 440761, "epoch": 5310} {"train_loss": -26.89105796813965, "global_step": 440762, "epoch": 5310} {"train_loss": -27.109609603881836, "global_step": 440763, "epoch": 5310} {"train_loss": -26.734607696533203, "global_step": 440764, "epoch": 5310} {"train_loss": -26.884389877319336, "global_step": 440765, "epoch": 5310} {"train_loss": -27.077335357666016, "global_step": 440766, "epoch": 5310} {"train_loss": -27.3414249420166, "global_step": 440767, "epoch": 5310} {"train_loss": -27.02046012878418, "global_step": 440768, "epoch": 5310} {"train_loss": -27.243093490600586, "global_step": 440769, "epoch": 5310} {"train_loss": -26.9256649017334, "global_step": 440770, "epoch": 5310} {"train_loss": -26.95871353149414, "global_step": 440771, "epoch": 5310} {"train_loss": -27.19091796875, "global_step": 440772, "epoch": 5310} {"train_loss": -27.10540199279785, "global_step": 440773, "epoch": 5310} {"train_loss": -27.091012954711914, "global_step": 440774, "epoch": 5310} {"train_loss": -27.0738468170166, "global_step": 440775, "epoch": 5310} {"train_loss": -26.769872665405273, "global_step": 440776, "epoch": 5310} {"train_loss": -26.49397087097168, "global_step": 440777, "epoch": 5310} {"train_loss": -26.866031646728516, "global_step": 440778, "epoch": 5310} {"train_loss": -27.085676193237305, "global_step": 440779, "epoch": 5310} {"train_loss": -26.943334579467773, "global_step": 440780, "epoch": 5310} {"train_loss": -26.84052085876465, "global_step": 440781, "epoch": 5310} {"train_loss": -27.366275787353516, "global_step": 440782, "epoch": 5310} {"train_loss": -26.780033111572266, "global_step": 440783, "epoch": 5310} {"train_loss": -27.076557159423828, "global_step": 440784, "epoch": 5310} {"train_loss": -27.27615737915039, "global_step": 440785, "epoch": 5310} {"train_loss": -26.99471092224121, "global_step": 440786, "epoch": 5310} {"train_loss": -26.940778732299805, "global_step": 440787, "epoch": 5310} {"train_loss": -27.406463623046875, "global_step": 440788, "epoch": 5310} {"train_loss": -27.238937377929688, "global_step": 440789, "epoch": 5310} {"train_loss": -27.225568771362305, "global_step": 440790, "epoch": 5310} {"train_loss": -26.87174415588379, "global_step": 440791, "epoch": 5310} {"train_loss": -27.04206657409668, "global_step": 440792, "epoch": 5310} {"train_loss": -26.833499908447266, "global_step": 440793, "epoch": 5310} {"train_loss": -27.108469009399414, "global_step": 440794, "epoch": 5310} {"train_loss": -26.554523468017578, "global_step": 440795, "epoch": 5310} {"train_loss": -27.047082901000977, "global_step": 440796, "epoch": 5310} {"train_loss": -26.929443359375, "global_step": 440797, "epoch": 5310} {"train_loss": -26.944562911987305, "global_step": 440798, "epoch": 5310} {"train_loss": -27.0659236907959, "global_step": 440799, "epoch": 5310} {"train_loss": -27.155750274658203, "global_step": 440800, "epoch": 5310} {"train_loss": -27.127105712890625, "global_step": 440801, "epoch": 5310} {"train_loss": -26.551197052001953, "global_step": 440802, "epoch": 5310} {"train_loss": -26.86760902404785, "global_step": 440803, "epoch": 5310} {"train_loss": -26.911670684814453, "global_step": 440804, "epoch": 5310} {"train_loss": -27.15058708190918, "global_step": 440805, "epoch": 5310} {"train_loss": -26.95916175842285, "global_step": 440806, "epoch": 5310} {"train_loss": -27.22201919555664, "global_step": 440807, "epoch": 5310} {"train_loss": -27.00469398498535, "global_step": 440808, "epoch": 5310} {"train_loss": -27.119277954101562, "global_step": 440809, "epoch": 5310} {"train_loss": -27.119089126586914, "global_step": 440810, "epoch": 5310} {"train_loss": -27.209003448486328, "global_step": 440811, "epoch": 5310} {"train_loss": -26.993198532656013, "global_step": 440812, "epoch": 5310, "val_loss": 6718426.0} {"train_loss": -26.533796310424805, "global_step": 440813, "epoch": 5311} {"train_loss": -25.2936954498291, "global_step": 440814, "epoch": 5311} {"train_loss": -25.744617462158203, "global_step": 440815, "epoch": 5311} {"train_loss": -26.515073776245117, "global_step": 440816, "epoch": 5311} {"train_loss": -26.478668212890625, "global_step": 440817, "epoch": 5311} {"train_loss": -26.518390655517578, "global_step": 440818, "epoch": 5311} {"train_loss": -26.89179801940918, "global_step": 440819, "epoch": 5311} {"train_loss": -26.47822380065918, "global_step": 440820, "epoch": 5311} {"train_loss": -26.91499900817871, "global_step": 440821, "epoch": 5311} {"train_loss": -26.3571834564209, "global_step": 440822, "epoch": 5311} {"train_loss": -26.432998657226562, "global_step": 440823, "epoch": 5311} {"train_loss": -26.398853302001953, "global_step": 440824, "epoch": 5311} {"train_loss": -26.699966430664062, "global_step": 440825, "epoch": 5311} {"train_loss": -26.69928550720215, "global_step": 440826, "epoch": 5311} {"train_loss": -26.672155380249023, "global_step": 440827, "epoch": 5311} {"train_loss": -26.40204429626465, "global_step": 440828, "epoch": 5311} {"train_loss": -26.84077262878418, "global_step": 440829, "epoch": 5311} {"train_loss": -26.792282104492188, "global_step": 440830, "epoch": 5311} {"train_loss": -26.964658737182617, "global_step": 440831, "epoch": 5311} {"train_loss": -26.81702995300293, "global_step": 440832, "epoch": 5311} {"train_loss": -27.05743408203125, "global_step": 440833, "epoch": 5311} {"train_loss": -26.682458877563477, "global_step": 440834, "epoch": 5311} {"train_loss": -26.804447174072266, "global_step": 440835, "epoch": 5311} {"train_loss": -26.70147132873535, "global_step": 440836, "epoch": 5311} {"train_loss": -27.113285064697266, "global_step": 440837, "epoch": 5311} {"train_loss": -26.91069984436035, "global_step": 440838, "epoch": 5311} {"train_loss": -26.699914932250977, "global_step": 440839, "epoch": 5311} {"train_loss": -26.773160934448242, "global_step": 440840, "epoch": 5311} {"train_loss": -27.131689071655273, "global_step": 440841, "epoch": 5311} {"train_loss": -27.285388946533203, "global_step": 440842, "epoch": 5311} {"train_loss": -27.0241641998291, "global_step": 440843, "epoch": 5311} {"train_loss": -26.796558380126953, "global_step": 440844, "epoch": 5311} {"train_loss": -26.953948974609375, "global_step": 440845, "epoch": 5311} {"train_loss": -26.984039306640625, "global_step": 440846, "epoch": 5311} {"train_loss": -27.02960777282715, "global_step": 440847, "epoch": 5311} {"train_loss": -26.885839462280273, "global_step": 440848, "epoch": 5311} {"train_loss": -26.836307525634766, "global_step": 440849, "epoch": 5311} {"train_loss": -27.379440307617188, "global_step": 440850, "epoch": 5311} {"train_loss": -27.11004638671875, "global_step": 440851, "epoch": 5311} {"train_loss": -27.153289794921875, "global_step": 440852, "epoch": 5311} {"train_loss": -26.90728759765625, "global_step": 440853, "epoch": 5311} {"train_loss": -26.66071891784668, "global_step": 440854, "epoch": 5311} {"train_loss": -26.928760528564453, "global_step": 440855, "epoch": 5311} {"train_loss": -26.941648483276367, "global_step": 440856, "epoch": 5311} {"train_loss": -26.755945205688477, "global_step": 440857, "epoch": 5311} {"train_loss": -26.93560791015625, "global_step": 440858, "epoch": 5311} {"train_loss": -26.649707794189453, "global_step": 440859, "epoch": 5311} {"train_loss": -27.0552978515625, "global_step": 440860, "epoch": 5311} {"train_loss": -27.369800567626953, "global_step": 440861, "epoch": 5311} {"train_loss": -27.079954147338867, "global_step": 440862, "epoch": 5311} {"train_loss": -26.21400260925293, "global_step": 440863, "epoch": 5311} {"train_loss": -26.19028091430664, "global_step": 440864, "epoch": 5311} {"train_loss": -25.908933639526367, "global_step": 440865, "epoch": 5311} {"train_loss": -25.35743522644043, "global_step": 440866, "epoch": 5311} {"train_loss": -26.7904109954834, "global_step": 440867, "epoch": 5311} {"train_loss": -26.455915451049805, "global_step": 440868, "epoch": 5311} {"train_loss": -26.57056999206543, "global_step": 440869, "epoch": 5311} {"train_loss": -26.55158042907715, "global_step": 440870, "epoch": 5311} {"train_loss": -26.970117568969727, "global_step": 440871, "epoch": 5311} {"train_loss": -26.507938385009766, "global_step": 440872, "epoch": 5311} {"train_loss": -26.652448654174805, "global_step": 440873, "epoch": 5311} {"train_loss": -26.670608520507812, "global_step": 440874, "epoch": 5311} {"train_loss": -26.82464599609375, "global_step": 440875, "epoch": 5311} {"train_loss": -26.889249801635742, "global_step": 440876, "epoch": 5311} {"train_loss": -26.72865867614746, "global_step": 440877, "epoch": 5311} {"train_loss": -26.822265625, "global_step": 440878, "epoch": 5311} {"train_loss": -26.6923885345459, "global_step": 440879, "epoch": 5311} {"train_loss": -26.91375732421875, "global_step": 440880, "epoch": 5311} {"train_loss": -26.794391632080078, "global_step": 440881, "epoch": 5311} {"train_loss": -26.886091232299805, "global_step": 440882, "epoch": 5311} {"train_loss": -26.67896842956543, "global_step": 440883, "epoch": 5311} {"train_loss": -26.838977813720703, "global_step": 440884, "epoch": 5311} {"train_loss": -26.8786563873291, "global_step": 440885, "epoch": 5311} {"train_loss": -26.80820655822754, "global_step": 440886, "epoch": 5311} {"train_loss": -26.93610191345215, "global_step": 440887, "epoch": 5311} {"train_loss": -27.064550399780273, "global_step": 440888, "epoch": 5311} {"train_loss": -26.595062255859375, "global_step": 440889, "epoch": 5311} {"train_loss": -27.174762725830078, "global_step": 440890, "epoch": 5311} {"train_loss": -26.741308212280273, "global_step": 440891, "epoch": 5311} {"train_loss": -27.23676109313965, "global_step": 440892, "epoch": 5311} {"train_loss": -27.2838134765625, "global_step": 440893, "epoch": 5311} {"train_loss": -27.104232788085938, "global_step": 440894, "epoch": 5311} {"train_loss": -26.736704010561287, "global_step": 440895, "epoch": 5311, "val_loss": 6633627.0} {"train_loss": -26.04009437561035, "global_step": 440896, "epoch": 5312} {"train_loss": -26.568944931030273, "global_step": 440897, "epoch": 5312} {"train_loss": -26.1893367767334, "global_step": 440898, "epoch": 5312} {"train_loss": -26.80243492126465, "global_step": 440899, "epoch": 5312} {"train_loss": -26.748401641845703, "global_step": 440900, "epoch": 5312} {"train_loss": -26.48560905456543, "global_step": 440901, "epoch": 5312} {"train_loss": -27.109846115112305, "global_step": 440902, "epoch": 5312} {"train_loss": -26.49262046813965, "global_step": 440903, "epoch": 5312} {"train_loss": -26.37593650817871, "global_step": 440904, "epoch": 5312} {"train_loss": -26.4818172454834, "global_step": 440905, "epoch": 5312} {"train_loss": -26.90181541442871, "global_step": 440906, "epoch": 5312} {"train_loss": -26.57132911682129, "global_step": 440907, "epoch": 5312} {"train_loss": -26.870319366455078, "global_step": 440908, "epoch": 5312} {"train_loss": -26.586755752563477, "global_step": 440909, "epoch": 5312} {"train_loss": -26.80963706970215, "global_step": 440910, "epoch": 5312} {"train_loss": -26.362241744995117, "global_step": 440911, "epoch": 5312} {"train_loss": -26.85732078552246, "global_step": 440912, "epoch": 5312} {"train_loss": -26.984899520874023, "global_step": 440913, "epoch": 5312} {"train_loss": -26.948205947875977, "global_step": 440914, "epoch": 5312} {"train_loss": -26.708600997924805, "global_step": 440915, "epoch": 5312} {"train_loss": -26.689130783081055, "global_step": 440916, "epoch": 5312} {"train_loss": -26.64667320251465, "global_step": 440917, "epoch": 5312} {"train_loss": -26.961841583251953, "global_step": 440918, "epoch": 5312} {"train_loss": -26.419340133666992, "global_step": 440919, "epoch": 5312} {"train_loss": -26.585412979125977, "global_step": 440920, "epoch": 5312} {"train_loss": -27.106231689453125, "global_step": 440921, "epoch": 5312} {"train_loss": -27.024932861328125, "global_step": 440922, "epoch": 5312} {"train_loss": -27.0449275970459, "global_step": 440923, "epoch": 5312} {"train_loss": -26.794300079345703, "global_step": 440924, "epoch": 5312} {"train_loss": -26.912748336791992, "global_step": 440925, "epoch": 5312} {"train_loss": -27.18461036682129, "global_step": 440926, "epoch": 5312} {"train_loss": -26.904027938842773, "global_step": 440927, "epoch": 5312} {"train_loss": -26.8660945892334, "global_step": 440928, "epoch": 5312} {"train_loss": -26.945755004882812, "global_step": 440929, "epoch": 5312} {"train_loss": -27.254751205444336, "global_step": 440930, "epoch": 5312} {"train_loss": -26.8284969329834, "global_step": 440931, "epoch": 5312} {"train_loss": -27.341510772705078, "global_step": 440932, "epoch": 5312} {"train_loss": -27.184946060180664, "global_step": 440933, "epoch": 5312} {"train_loss": -27.129806518554688, "global_step": 440934, "epoch": 5312} {"train_loss": -26.80006980895996, "global_step": 440935, "epoch": 5312} {"train_loss": -27.16634178161621, "global_step": 440936, "epoch": 5312} {"train_loss": -27.06477165222168, "global_step": 440937, "epoch": 5312} {"train_loss": -26.8929500579834, "global_step": 440938, "epoch": 5312} {"train_loss": -26.840803146362305, "global_step": 440939, "epoch": 5312} {"train_loss": -27.3237361907959, "global_step": 440940, "epoch": 5312} {"train_loss": -27.034753799438477, "global_step": 440941, "epoch": 5312} {"train_loss": -26.87449073791504, "global_step": 440942, "epoch": 5312} {"train_loss": -27.36297035217285, "global_step": 440943, "epoch": 5312} {"train_loss": -27.232614517211914, "global_step": 440944, "epoch": 5312} {"train_loss": -27.38958168029785, "global_step": 440945, "epoch": 5312} {"train_loss": -27.060718536376953, "global_step": 440946, "epoch": 5312} {"train_loss": -27.181528091430664, "global_step": 440947, "epoch": 5312} {"train_loss": -25.909875869750977, "global_step": 440948, "epoch": 5312} {"train_loss": -24.744552612304688, "global_step": 440949, "epoch": 5312} {"train_loss": -25.583805084228516, "global_step": 440950, "epoch": 5312} {"train_loss": -26.301227569580078, "global_step": 440951, "epoch": 5312} {"train_loss": -26.555322647094727, "global_step": 440952, "epoch": 5312} {"train_loss": -26.49920082092285, "global_step": 440953, "epoch": 5312} {"train_loss": -25.94573974609375, "global_step": 440954, "epoch": 5312} {"train_loss": -26.85630226135254, "global_step": 440955, "epoch": 5312} {"train_loss": -26.05390739440918, "global_step": 440956, "epoch": 5312} {"train_loss": -26.4305419921875, "global_step": 440957, "epoch": 5312} {"train_loss": -26.173635482788086, "global_step": 440958, "epoch": 5312} {"train_loss": -26.640241622924805, "global_step": 440959, "epoch": 5312} {"train_loss": -26.85137367248535, "global_step": 440960, "epoch": 5312} {"train_loss": -26.391799926757812, "global_step": 440961, "epoch": 5312} {"train_loss": -26.544458389282227, "global_step": 440962, "epoch": 5312} {"train_loss": -26.84827995300293, "global_step": 440963, "epoch": 5312} {"train_loss": -26.79608154296875, "global_step": 440964, "epoch": 5312} {"train_loss": -26.46087646484375, "global_step": 440965, "epoch": 5312} {"train_loss": -26.749347686767578, "global_step": 440966, "epoch": 5312} {"train_loss": -26.858291625976562, "global_step": 440967, "epoch": 5312} {"train_loss": -26.436742782592773, "global_step": 440968, "epoch": 5312} {"train_loss": -26.884784698486328, "global_step": 440969, "epoch": 5312} {"train_loss": -26.733518600463867, "global_step": 440970, "epoch": 5312} {"train_loss": -26.40630531311035, "global_step": 440971, "epoch": 5312} {"train_loss": -26.735864639282227, "global_step": 440972, "epoch": 5312} {"train_loss": -27.07636070251465, "global_step": 440973, "epoch": 5312} {"train_loss": -26.67502784729004, "global_step": 440974, "epoch": 5312} {"train_loss": -26.545501708984375, "global_step": 440975, "epoch": 5312} {"train_loss": -26.302021026611328, "global_step": 440976, "epoch": 5312} {"train_loss": -26.824054718017578, "global_step": 440977, "epoch": 5312} {"train_loss": -26.7319691209908, "global_step": 440978, "epoch": 5312, "val_loss": 6697649.5} {"train_loss": -26.720605850219727, "global_step": 440979, "epoch": 5313} {"train_loss": -26.55106544494629, "global_step": 440980, "epoch": 5313} {"train_loss": -27.007843017578125, "global_step": 440981, "epoch": 5313} {"train_loss": -26.684125900268555, "global_step": 440982, "epoch": 5313} {"train_loss": -26.6093692779541, "global_step": 440983, "epoch": 5313} {"train_loss": -26.907440185546875, "global_step": 440984, "epoch": 5313} {"train_loss": -27.010229110717773, "global_step": 440985, "epoch": 5313} {"train_loss": -26.935901641845703, "global_step": 440986, "epoch": 5313} {"train_loss": -27.230833053588867, "global_step": 440987, "epoch": 5313} {"train_loss": -26.818220138549805, "global_step": 440988, "epoch": 5313} {"train_loss": -26.956029891967773, "global_step": 440989, "epoch": 5313} {"train_loss": -26.9246768951416, "global_step": 440990, "epoch": 5313} {"train_loss": -27.361175537109375, "global_step": 440991, "epoch": 5313} {"train_loss": -26.733413696289062, "global_step": 440992, "epoch": 5313} {"train_loss": -27.423526763916016, "global_step": 440993, "epoch": 5313} {"train_loss": -27.025680541992188, "global_step": 440994, "epoch": 5313} {"train_loss": -27.009626388549805, "global_step": 440995, "epoch": 5313} {"train_loss": -27.290990829467773, "global_step": 440996, "epoch": 5313} {"train_loss": -27.13960838317871, "global_step": 440997, "epoch": 5313} {"train_loss": -27.382070541381836, "global_step": 440998, "epoch": 5313} {"train_loss": -27.086294174194336, "global_step": 440999, "epoch": 5313} {"train_loss": -26.998519897460938, "global_step": 441000, "epoch": 5313} {"train_loss": -26.926923751831055, "global_step": 441001, "epoch": 5313} {"train_loss": -26.83304786682129, "global_step": 441002, "epoch": 5313} {"train_loss": -27.370010375976562, "global_step": 441003, "epoch": 5313} {"train_loss": -26.60956382751465, "global_step": 441004, "epoch": 5313} {"train_loss": -27.0710506439209, "global_step": 441005, "epoch": 5313} {"train_loss": -27.374982833862305, "global_step": 441006, "epoch": 5313} {"train_loss": -26.82208824157715, "global_step": 441007, "epoch": 5313} {"train_loss": -26.72991943359375, "global_step": 441008, "epoch": 5313} {"train_loss": -27.092731475830078, "global_step": 441009, "epoch": 5313} {"train_loss": -26.928180694580078, "global_step": 441010, "epoch": 5313} {"train_loss": -27.064533233642578, "global_step": 441011, "epoch": 5313} {"train_loss": -26.847888946533203, "global_step": 441012, "epoch": 5313} {"train_loss": -27.360349655151367, "global_step": 441013, "epoch": 5313} {"train_loss": -27.299381256103516, "global_step": 441014, "epoch": 5313} {"train_loss": -26.79082679748535, "global_step": 441015, "epoch": 5313} {"train_loss": -26.412540435791016, "global_step": 441016, "epoch": 5313} {"train_loss": -27.48447608947754, "global_step": 441017, "epoch": 5313} {"train_loss": -27.12763023376465, "global_step": 441018, "epoch": 5313} {"train_loss": -26.89741325378418, "global_step": 441019, "epoch": 5313} {"train_loss": -26.7926082611084, "global_step": 441020, "epoch": 5313} {"train_loss": -26.807052612304688, "global_step": 441021, "epoch": 5313} {"train_loss": -26.907794952392578, "global_step": 441022, "epoch": 5313} {"train_loss": -27.00294303894043, "global_step": 441023, "epoch": 5313} {"train_loss": -26.89430046081543, "global_step": 441024, "epoch": 5313} {"train_loss": -26.987396240234375, "global_step": 441025, "epoch": 5313} {"train_loss": -26.93586540222168, "global_step": 441026, "epoch": 5313} {"train_loss": -26.827253341674805, "global_step": 441027, "epoch": 5313} {"train_loss": -27.130615234375, "global_step": 441028, "epoch": 5313} {"train_loss": -27.1569881439209, "global_step": 441029, "epoch": 5313} {"train_loss": -26.841978073120117, "global_step": 441030, "epoch": 5313} {"train_loss": -26.69358253479004, "global_step": 441031, "epoch": 5313} {"train_loss": -26.729480743408203, "global_step": 441032, "epoch": 5313} {"train_loss": -27.152332305908203, "global_step": 441033, "epoch": 5313} {"train_loss": -26.726980209350586, "global_step": 441034, "epoch": 5313} {"train_loss": -26.611875534057617, "global_step": 441035, "epoch": 5313} {"train_loss": -27.017642974853516, "global_step": 441036, "epoch": 5313} {"train_loss": -26.6332950592041, "global_step": 441037, "epoch": 5313} {"train_loss": -26.934345245361328, "global_step": 441038, "epoch": 5313} {"train_loss": -26.87522315979004, "global_step": 441039, "epoch": 5313} {"train_loss": -26.921796798706055, "global_step": 441040, "epoch": 5313} {"train_loss": -26.948867797851562, "global_step": 441041, "epoch": 5313} {"train_loss": -27.135705947875977, "global_step": 441042, "epoch": 5313} {"train_loss": -26.69171714782715, "global_step": 441043, "epoch": 5313} {"train_loss": -26.838504791259766, "global_step": 441044, "epoch": 5313} {"train_loss": -26.552005767822266, "global_step": 441045, "epoch": 5313} {"train_loss": -26.758529663085938, "global_step": 441046, "epoch": 5313} {"train_loss": -26.8291072845459, "global_step": 441047, "epoch": 5313} {"train_loss": -26.53839111328125, "global_step": 441048, "epoch": 5313} {"train_loss": -27.172311782836914, "global_step": 441049, "epoch": 5313} {"train_loss": -27.051538467407227, "global_step": 441050, "epoch": 5313} {"train_loss": -26.79670524597168, "global_step": 441051, "epoch": 5313} {"train_loss": -26.79157829284668, "global_step": 441052, "epoch": 5313} {"train_loss": -26.73647117614746, "global_step": 441053, "epoch": 5313} {"train_loss": -26.679401397705078, "global_step": 441054, "epoch": 5313} {"train_loss": -27.08697509765625, "global_step": 441055, "epoch": 5313} {"train_loss": -27.443708419799805, "global_step": 441056, "epoch": 5313} {"train_loss": -27.171005249023438, "global_step": 441057, "epoch": 5313} {"train_loss": -27.378997802734375, "global_step": 441058, "epoch": 5313} {"train_loss": -26.91056251525879, "global_step": 441059, "epoch": 5313} {"train_loss": -26.755859375, "global_step": 441060, "epoch": 5313} {"train_loss": -26.949299708906427, "global_step": 441061, "epoch": 5313, "val_loss": 6672599.0} {"train_loss": -27.04538917541504, "global_step": 441062, "epoch": 5314} {"train_loss": -27.15913200378418, "global_step": 441063, "epoch": 5314} {"train_loss": -26.493152618408203, "global_step": 441064, "epoch": 5314} {"train_loss": -27.002904891967773, "global_step": 441065, "epoch": 5314} {"train_loss": -26.8225154876709, "global_step": 441066, "epoch": 5314} {"train_loss": -26.8048095703125, "global_step": 441067, "epoch": 5314} {"train_loss": -26.29090690612793, "global_step": 441068, "epoch": 5314} {"train_loss": -26.860584259033203, "global_step": 441069, "epoch": 5314} {"train_loss": -27.09028434753418, "global_step": 441070, "epoch": 5314} {"train_loss": -26.687808990478516, "global_step": 441071, "epoch": 5314} {"train_loss": -26.342374801635742, "global_step": 441072, "epoch": 5314} {"train_loss": -26.419340133666992, "global_step": 441073, "epoch": 5314} {"train_loss": -26.376367568969727, "global_step": 441074, "epoch": 5314} {"train_loss": -26.878564834594727, "global_step": 441075, "epoch": 5314} {"train_loss": -26.734174728393555, "global_step": 441076, "epoch": 5314} {"train_loss": -26.651586532592773, "global_step": 441077, "epoch": 5314} {"train_loss": -26.547086715698242, "global_step": 441078, "epoch": 5314} {"train_loss": -27.00410270690918, "global_step": 441079, "epoch": 5314} {"train_loss": -26.739303588867188, "global_step": 441080, "epoch": 5314} {"train_loss": -27.137907028198242, "global_step": 441081, "epoch": 5314} {"train_loss": -26.580121994018555, "global_step": 441082, "epoch": 5314} {"train_loss": -27.126678466796875, "global_step": 441083, "epoch": 5314} {"train_loss": -26.835254669189453, "global_step": 441084, "epoch": 5314} {"train_loss": -26.619617462158203, "global_step": 441085, "epoch": 5314} {"train_loss": -27.114948272705078, "global_step": 441086, "epoch": 5314} {"train_loss": -26.843326568603516, "global_step": 441087, "epoch": 5314} {"train_loss": -26.62821388244629, "global_step": 441088, "epoch": 5314} {"train_loss": -26.971027374267578, "global_step": 441089, "epoch": 5314} {"train_loss": -26.85004234313965, "global_step": 441090, "epoch": 5314} {"train_loss": -27.159183502197266, "global_step": 441091, "epoch": 5314} {"train_loss": -27.280431747436523, "global_step": 441092, "epoch": 5314} {"train_loss": -26.560155868530273, "global_step": 441093, "epoch": 5314} {"train_loss": -27.003271102905273, "global_step": 441094, "epoch": 5314} {"train_loss": -26.854019165039062, "global_step": 441095, "epoch": 5314} {"train_loss": -26.78971290588379, "global_step": 441096, "epoch": 5314} {"train_loss": -26.899160385131836, "global_step": 441097, "epoch": 5314} {"train_loss": -27.0543212890625, "global_step": 441098, "epoch": 5314} {"train_loss": -26.751317977905273, "global_step": 441099, "epoch": 5314} {"train_loss": -26.998249053955078, "global_step": 441100, "epoch": 5314} {"train_loss": -27.398334503173828, "global_step": 441101, "epoch": 5314} {"train_loss": -26.892898559570312, "global_step": 441102, "epoch": 5314} {"train_loss": -27.260961532592773, "global_step": 441103, "epoch": 5314} {"train_loss": -27.32000732421875, "global_step": 441104, "epoch": 5314} {"train_loss": -26.746963500976562, "global_step": 441105, "epoch": 5314} {"train_loss": -27.15409278869629, "global_step": 441106, "epoch": 5314} {"train_loss": -27.05830192565918, "global_step": 441107, "epoch": 5314} {"train_loss": -26.972944259643555, "global_step": 441108, "epoch": 5314} {"train_loss": -27.036640167236328, "global_step": 441109, "epoch": 5314} {"train_loss": -27.3043212890625, "global_step": 441110, "epoch": 5314} {"train_loss": -26.825170516967773, "global_step": 441111, "epoch": 5314} {"train_loss": -26.935504913330078, "global_step": 441112, "epoch": 5314} {"train_loss": -27.001392364501953, "global_step": 441113, "epoch": 5314} {"train_loss": -26.873849868774414, "global_step": 441114, "epoch": 5314} {"train_loss": -26.8769588470459, "global_step": 441115, "epoch": 5314} {"train_loss": -27.10597038269043, "global_step": 441116, "epoch": 5314} {"train_loss": -26.78057861328125, "global_step": 441117, "epoch": 5314} {"train_loss": -26.1619930267334, "global_step": 441118, "epoch": 5314} {"train_loss": -26.75960350036621, "global_step": 441119, "epoch": 5314} {"train_loss": -27.113351821899414, "global_step": 441120, "epoch": 5314} {"train_loss": -27.083715438842773, "global_step": 441121, "epoch": 5314} {"train_loss": -26.875751495361328, "global_step": 441122, "epoch": 5314} {"train_loss": -26.84601402282715, "global_step": 441123, "epoch": 5314} {"train_loss": -27.436185836791992, "global_step": 441124, "epoch": 5314} {"train_loss": -26.924686431884766, "global_step": 441125, "epoch": 5314} {"train_loss": -26.913320541381836, "global_step": 441126, "epoch": 5314} {"train_loss": -27.442480087280273, "global_step": 441127, "epoch": 5314} {"train_loss": -26.71136474609375, "global_step": 441128, "epoch": 5314} {"train_loss": -27.225446701049805, "global_step": 441129, "epoch": 5314} {"train_loss": -26.77284812927246, "global_step": 441130, "epoch": 5314} {"train_loss": -27.419462203979492, "global_step": 441131, "epoch": 5314} {"train_loss": -26.957056045532227, "global_step": 441132, "epoch": 5314} {"train_loss": -27.04401969909668, "global_step": 441133, "epoch": 5314} {"train_loss": -27.00714683532715, "global_step": 441134, "epoch": 5314} {"train_loss": -26.915510177612305, "global_step": 441135, "epoch": 5314} {"train_loss": -26.813817977905273, "global_step": 441136, "epoch": 5314} {"train_loss": -27.231266021728516, "global_step": 441137, "epoch": 5314} {"train_loss": -26.95008659362793, "global_step": 441138, "epoch": 5314} {"train_loss": -26.93855094909668, "global_step": 441139, "epoch": 5314} {"train_loss": -26.9016056060791, "global_step": 441140, "epoch": 5314} {"train_loss": -26.82232666015625, "global_step": 441141, "epoch": 5314} {"train_loss": -26.807043075561523, "global_step": 441142, "epoch": 5314} {"train_loss": -26.75872230529785, "global_step": 441143, "epoch": 5314} {"train_loss": -26.91135298487652, "global_step": 441144, "epoch": 5314, "val_loss": 6699764.0} {"train_loss": -26.68304443359375, "global_step": 441145, "epoch": 5315} {"train_loss": -26.366743087768555, "global_step": 441146, "epoch": 5315} {"train_loss": -26.30043601989746, "global_step": 441147, "epoch": 5315} {"train_loss": -26.99781608581543, "global_step": 441148, "epoch": 5315} {"train_loss": -26.690998077392578, "global_step": 441149, "epoch": 5315} {"train_loss": -26.792816162109375, "global_step": 441150, "epoch": 5315} {"train_loss": -26.987024307250977, "global_step": 441151, "epoch": 5315} {"train_loss": -26.516620635986328, "global_step": 441152, "epoch": 5315} {"train_loss": -26.819656372070312, "global_step": 441153, "epoch": 5315} {"train_loss": -26.687284469604492, "global_step": 441154, "epoch": 5315} {"train_loss": -26.86370849609375, "global_step": 441155, "epoch": 5315} {"train_loss": -26.84832763671875, "global_step": 441156, "epoch": 5315} {"train_loss": -26.727619171142578, "global_step": 441157, "epoch": 5315} {"train_loss": -26.628631591796875, "global_step": 441158, "epoch": 5315} {"train_loss": -27.06748390197754, "global_step": 441159, "epoch": 5315} {"train_loss": -26.834569931030273, "global_step": 441160, "epoch": 5315} {"train_loss": -26.971088409423828, "global_step": 441161, "epoch": 5315} {"train_loss": -26.64765739440918, "global_step": 441162, "epoch": 5315} {"train_loss": -26.809860229492188, "global_step": 441163, "epoch": 5315} {"train_loss": -26.76531410217285, "global_step": 441164, "epoch": 5315} {"train_loss": -26.798730850219727, "global_step": 441165, "epoch": 5315} {"train_loss": -26.7314453125, "global_step": 441166, "epoch": 5315} {"train_loss": -26.635862350463867, "global_step": 441167, "epoch": 5315} {"train_loss": -27.0119571685791, "global_step": 441168, "epoch": 5315} {"train_loss": -26.945138931274414, "global_step": 441169, "epoch": 5315} {"train_loss": -27.069416046142578, "global_step": 441170, "epoch": 5315} {"train_loss": -26.73859977722168, "global_step": 441171, "epoch": 5315} {"train_loss": -27.054523468017578, "global_step": 441172, "epoch": 5315} {"train_loss": -26.36818504333496, "global_step": 441173, "epoch": 5315} {"train_loss": -26.69246482849121, "global_step": 441174, "epoch": 5315} {"train_loss": -26.431970596313477, "global_step": 441175, "epoch": 5315} {"train_loss": -26.969446182250977, "global_step": 441176, "epoch": 5315} {"train_loss": -27.09242057800293, "global_step": 441177, "epoch": 5315} {"train_loss": -27.191913604736328, "global_step": 441178, "epoch": 5315} {"train_loss": -26.93428611755371, "global_step": 441179, "epoch": 5315} {"train_loss": -27.24212646484375, "global_step": 441180, "epoch": 5315} {"train_loss": -27.14613914489746, "global_step": 441181, "epoch": 5315} {"train_loss": -27.0565242767334, "global_step": 441182, "epoch": 5315} {"train_loss": -26.892963409423828, "global_step": 441183, "epoch": 5315} {"train_loss": -26.953033447265625, "global_step": 441184, "epoch": 5315} {"train_loss": -26.336332321166992, "global_step": 441185, "epoch": 5315} {"train_loss": -27.200607299804688, "global_step": 441186, "epoch": 5315} {"train_loss": -27.4136962890625, "global_step": 441187, "epoch": 5315} {"train_loss": -27.105619430541992, "global_step": 441188, "epoch": 5315} {"train_loss": -27.019338607788086, "global_step": 441189, "epoch": 5315} {"train_loss": -27.358566284179688, "global_step": 441190, "epoch": 5315} {"train_loss": -26.869094848632812, "global_step": 441191, "epoch": 5315} {"train_loss": -27.05721092224121, "global_step": 441192, "epoch": 5315} {"train_loss": -26.7506160736084, "global_step": 441193, "epoch": 5315} {"train_loss": -27.188507080078125, "global_step": 441194, "epoch": 5315} {"train_loss": -26.94195556640625, "global_step": 441195, "epoch": 5315} {"train_loss": -27.26227378845215, "global_step": 441196, "epoch": 5315} {"train_loss": -26.71185874938965, "global_step": 441197, "epoch": 5315} {"train_loss": -26.88818359375, "global_step": 441198, "epoch": 5315} {"train_loss": -27.130773544311523, "global_step": 441199, "epoch": 5315} {"train_loss": -27.179412841796875, "global_step": 441200, "epoch": 5315} {"train_loss": -26.5895938873291, "global_step": 441201, "epoch": 5315} {"train_loss": -27.29400062561035, "global_step": 441202, "epoch": 5315} {"train_loss": -26.6506404876709, "global_step": 441203, "epoch": 5315} {"train_loss": -26.835540771484375, "global_step": 441204, "epoch": 5315} {"train_loss": -26.98750877380371, "global_step": 441205, "epoch": 5315} {"train_loss": -27.067596435546875, "global_step": 441206, "epoch": 5315} {"train_loss": -26.81427574157715, "global_step": 441207, "epoch": 5315} {"train_loss": -26.7392635345459, "global_step": 441208, "epoch": 5315} {"train_loss": -26.590681076049805, "global_step": 441209, "epoch": 5315} {"train_loss": -26.6573429107666, "global_step": 441210, "epoch": 5315} {"train_loss": -26.59393882751465, "global_step": 441211, "epoch": 5315} {"train_loss": -26.650054931640625, "global_step": 441212, "epoch": 5315} {"train_loss": -26.654218673706055, "global_step": 441213, "epoch": 5315} {"train_loss": -27.08643913269043, "global_step": 441214, "epoch": 5315} {"train_loss": -27.113454818725586, "global_step": 441215, "epoch": 5315} {"train_loss": -27.266427993774414, "global_step": 441216, "epoch": 5315} {"train_loss": -27.251867294311523, "global_step": 441217, "epoch": 5315} {"train_loss": -27.244312286376953, "global_step": 441218, "epoch": 5315} {"train_loss": -27.152973175048828, "global_step": 441219, "epoch": 5315} {"train_loss": -27.1114501953125, "global_step": 441220, "epoch": 5315} {"train_loss": -26.78754997253418, "global_step": 441221, "epoch": 5315} {"train_loss": -26.685089111328125, "global_step": 441222, "epoch": 5315} {"train_loss": -27.35392189025879, "global_step": 441223, "epoch": 5315} {"train_loss": -27.331119537353516, "global_step": 441224, "epoch": 5315} {"train_loss": -27.10251235961914, "global_step": 441225, "epoch": 5315} {"train_loss": -26.91672134399414, "global_step": 441226, "epoch": 5315} {"train_loss": -26.902659565569408, "global_step": 441227, "epoch": 5315, "val_loss": 6666202.0} {"train_loss": -25.654516220092773, "global_step": 441228, "epoch": 5316} {"train_loss": -25.66936683654785, "global_step": 441229, "epoch": 5316} {"train_loss": -26.301422119140625, "global_step": 441230, "epoch": 5316} {"train_loss": -26.586584091186523, "global_step": 441231, "epoch": 5316} {"train_loss": -25.884002685546875, "global_step": 441232, "epoch": 5316} {"train_loss": -26.411596298217773, "global_step": 441233, "epoch": 5316} {"train_loss": -26.399066925048828, "global_step": 441234, "epoch": 5316} {"train_loss": -26.480182647705078, "global_step": 441235, "epoch": 5316} {"train_loss": -26.649255752563477, "global_step": 441236, "epoch": 5316} {"train_loss": -26.40143394470215, "global_step": 441237, "epoch": 5316} {"train_loss": -26.6654052734375, "global_step": 441238, "epoch": 5316} {"train_loss": -26.480955123901367, "global_step": 441239, "epoch": 5316} {"train_loss": -26.77292251586914, "global_step": 441240, "epoch": 5316} {"train_loss": -26.62497329711914, "global_step": 441241, "epoch": 5316} {"train_loss": -27.1054744720459, "global_step": 441242, "epoch": 5316} {"train_loss": -26.630008697509766, "global_step": 441243, "epoch": 5316} {"train_loss": -26.791187286376953, "global_step": 441244, "epoch": 5316} {"train_loss": -26.647634506225586, "global_step": 441245, "epoch": 5316} {"train_loss": -26.847213745117188, "global_step": 441246, "epoch": 5316} {"train_loss": -26.747655868530273, "global_step": 441247, "epoch": 5316} {"train_loss": -26.7100830078125, "global_step": 441248, "epoch": 5316} {"train_loss": -26.826507568359375, "global_step": 441249, "epoch": 5316} {"train_loss": -26.928491592407227, "global_step": 441250, "epoch": 5316} {"train_loss": -26.864139556884766, "global_step": 441251, "epoch": 5316} {"train_loss": -27.003000259399414, "global_step": 441252, "epoch": 5316} {"train_loss": -27.45765495300293, "global_step": 441253, "epoch": 5316} {"train_loss": -26.795827865600586, "global_step": 441254, "epoch": 5316} {"train_loss": -26.902774810791016, "global_step": 441255, "epoch": 5316} {"train_loss": -27.0145263671875, "global_step": 441256, "epoch": 5316} {"train_loss": -27.24177360534668, "global_step": 441257, "epoch": 5316} {"train_loss": -27.080190658569336, "global_step": 441258, "epoch": 5316} {"train_loss": -26.89082145690918, "global_step": 441259, "epoch": 5316} {"train_loss": -27.10971450805664, "global_step": 441260, "epoch": 5316} {"train_loss": -26.73893165588379, "global_step": 441261, "epoch": 5316} {"train_loss": -27.28626823425293, "global_step": 441262, "epoch": 5316} {"train_loss": -27.143585205078125, "global_step": 441263, "epoch": 5316} {"train_loss": -27.035125732421875, "global_step": 441264, "epoch": 5316} {"train_loss": -27.10039710998535, "global_step": 441265, "epoch": 5316} {"train_loss": -27.00685691833496, "global_step": 441266, "epoch": 5316} {"train_loss": -27.269323348999023, "global_step": 441267, "epoch": 5316} {"train_loss": -27.223234176635742, "global_step": 441268, "epoch": 5316} {"train_loss": -27.1342830657959, "global_step": 441269, "epoch": 5316} {"train_loss": -27.2548770904541, "global_step": 441270, "epoch": 5316} {"train_loss": -27.104162216186523, "global_step": 441271, "epoch": 5316} {"train_loss": -27.069326400756836, "global_step": 441272, "epoch": 5316} {"train_loss": -27.3873291015625, "global_step": 441273, "epoch": 5316} {"train_loss": -26.81243896484375, "global_step": 441274, "epoch": 5316} {"train_loss": -27.049560546875, "global_step": 441275, "epoch": 5316} {"train_loss": -27.0634708404541, "global_step": 441276, "epoch": 5316} {"train_loss": -26.98390007019043, "global_step": 441277, "epoch": 5316} {"train_loss": -26.963531494140625, "global_step": 441278, "epoch": 5316} {"train_loss": -26.988616943359375, "global_step": 441279, "epoch": 5316} {"train_loss": -27.26025390625, "global_step": 441280, "epoch": 5316} {"train_loss": -27.42462730407715, "global_step": 441281, "epoch": 5316} {"train_loss": -26.929529190063477, "global_step": 441282, "epoch": 5316} {"train_loss": -26.7711181640625, "global_step": 441283, "epoch": 5316} {"train_loss": -26.455224990844727, "global_step": 441284, "epoch": 5316} {"train_loss": -26.747800827026367, "global_step": 441285, "epoch": 5316} {"train_loss": -26.611785888671875, "global_step": 441286, "epoch": 5316} {"train_loss": -26.660974502563477, "global_step": 441287, "epoch": 5316} {"train_loss": -26.947370529174805, "global_step": 441288, "epoch": 5316} {"train_loss": -27.222614288330078, "global_step": 441289, "epoch": 5316} {"train_loss": -26.74663734436035, "global_step": 441290, "epoch": 5316} {"train_loss": -26.3787841796875, "global_step": 441291, "epoch": 5316} {"train_loss": -25.856006622314453, "global_step": 441292, "epoch": 5316} {"train_loss": -25.918161392211914, "global_step": 441293, "epoch": 5316} {"train_loss": -26.421024322509766, "global_step": 441294, "epoch": 5316} {"train_loss": -26.759937286376953, "global_step": 441295, "epoch": 5316} {"train_loss": -26.91724967956543, "global_step": 441296, "epoch": 5316} {"train_loss": -26.72092056274414, "global_step": 441297, "epoch": 5316} {"train_loss": -27.128934860229492, "global_step": 441298, "epoch": 5316} {"train_loss": -26.491641998291016, "global_step": 441299, "epoch": 5316} {"train_loss": -26.71523094177246, "global_step": 441300, "epoch": 5316} {"train_loss": -26.583541870117188, "global_step": 441301, "epoch": 5316} {"train_loss": -26.873245239257812, "global_step": 441302, "epoch": 5316} {"train_loss": -26.495553970336914, "global_step": 441303, "epoch": 5316} {"train_loss": -27.007883071899414, "global_step": 441304, "epoch": 5316} {"train_loss": -26.767505645751953, "global_step": 441305, "epoch": 5316} {"train_loss": -26.759992599487305, "global_step": 441306, "epoch": 5316} {"train_loss": -27.3369140625, "global_step": 441307, "epoch": 5316} {"train_loss": -27.00373649597168, "global_step": 441308, "epoch": 5316} {"train_loss": -26.18584632873535, "global_step": 441309, "epoch": 5316} {"train_loss": -26.783305018781178, "global_step": 441310, "epoch": 5316, "val_loss": 6661584.0} {"train_loss": -26.5965576171875, "global_step": 441311, "epoch": 5317} {"train_loss": -26.664819717407227, "global_step": 441312, "epoch": 5317} {"train_loss": -26.31732177734375, "global_step": 441313, "epoch": 5317} {"train_loss": -26.60573387145996, "global_step": 441314, "epoch": 5317} {"train_loss": -26.811248779296875, "global_step": 441315, "epoch": 5317} {"train_loss": -26.62226676940918, "global_step": 441316, "epoch": 5317} {"train_loss": -26.541284561157227, "global_step": 441317, "epoch": 5317} {"train_loss": -26.536352157592773, "global_step": 441318, "epoch": 5317} {"train_loss": -26.502429962158203, "global_step": 441319, "epoch": 5317} {"train_loss": -26.9716854095459, "global_step": 441320, "epoch": 5317} {"train_loss": -26.4838809967041, "global_step": 441321, "epoch": 5317} {"train_loss": -27.069080352783203, "global_step": 441322, "epoch": 5317} {"train_loss": -27.10603904724121, "global_step": 441323, "epoch": 5317} {"train_loss": -27.11126708984375, "global_step": 441324, "epoch": 5317} {"train_loss": -26.884601593017578, "global_step": 441325, "epoch": 5317} {"train_loss": -27.368656158447266, "global_step": 441326, "epoch": 5317} {"train_loss": -26.961034774780273, "global_step": 441327, "epoch": 5317} {"train_loss": -27.231647491455078, "global_step": 441328, "epoch": 5317} {"train_loss": -26.706588745117188, "global_step": 441329, "epoch": 5317} {"train_loss": -27.33198356628418, "global_step": 441330, "epoch": 5317} {"train_loss": -27.280912399291992, "global_step": 441331, "epoch": 5317} {"train_loss": -26.846845626831055, "global_step": 441332, "epoch": 5317} {"train_loss": -27.00620460510254, "global_step": 441333, "epoch": 5317} {"train_loss": -27.00728416442871, "global_step": 441334, "epoch": 5317} {"train_loss": -27.266437530517578, "global_step": 441335, "epoch": 5317} {"train_loss": -27.285070419311523, "global_step": 441336, "epoch": 5317} {"train_loss": -27.04620933532715, "global_step": 441337, "epoch": 5317} {"train_loss": -26.56351661682129, "global_step": 441338, "epoch": 5317} {"train_loss": -26.98221206665039, "global_step": 441339, "epoch": 5317} {"train_loss": -27.04585075378418, "global_step": 441340, "epoch": 5317} {"train_loss": -27.31715202331543, "global_step": 441341, "epoch": 5317} {"train_loss": -26.95110511779785, "global_step": 441342, "epoch": 5317} {"train_loss": -27.47466468811035, "global_step": 441343, "epoch": 5317} {"train_loss": -27.141651153564453, "global_step": 441344, "epoch": 5317} {"train_loss": -27.046222686767578, "global_step": 441345, "epoch": 5317} {"train_loss": -26.766645431518555, "global_step": 441346, "epoch": 5317} {"train_loss": -26.853071212768555, "global_step": 441347, "epoch": 5317} {"train_loss": -27.049671173095703, "global_step": 441348, "epoch": 5317} {"train_loss": -27.03595542907715, "global_step": 441349, "epoch": 5317} {"train_loss": -26.61625099182129, "global_step": 441350, "epoch": 5317} {"train_loss": -26.629684448242188, "global_step": 441351, "epoch": 5317} {"train_loss": -27.521947860717773, "global_step": 441352, "epoch": 5317} {"train_loss": -27.277210235595703, "global_step": 441353, "epoch": 5317} {"train_loss": -26.57550621032715, "global_step": 441354, "epoch": 5317} {"train_loss": -26.44683837890625, "global_step": 441355, "epoch": 5317} {"train_loss": -26.7423152923584, "global_step": 441356, "epoch": 5317} {"train_loss": -26.97771644592285, "global_step": 441357, "epoch": 5317} {"train_loss": -27.188568115234375, "global_step": 441358, "epoch": 5317} {"train_loss": -26.743473052978516, "global_step": 441359, "epoch": 5317} {"train_loss": -26.7575740814209, "global_step": 441360, "epoch": 5317} {"train_loss": -27.098072052001953, "global_step": 441361, "epoch": 5317} {"train_loss": -26.719751358032227, "global_step": 441362, "epoch": 5317} {"train_loss": -27.01215934753418, "global_step": 441363, "epoch": 5317} {"train_loss": -26.65009880065918, "global_step": 441364, "epoch": 5317} {"train_loss": -27.008132934570312, "global_step": 441365, "epoch": 5317} {"train_loss": -26.8079833984375, "global_step": 441366, "epoch": 5317} {"train_loss": -26.83978843688965, "global_step": 441367, "epoch": 5317} {"train_loss": -26.295377731323242, "global_step": 441368, "epoch": 5317} {"train_loss": -26.43707847595215, "global_step": 441369, "epoch": 5317} {"train_loss": -26.660736083984375, "global_step": 441370, "epoch": 5317} {"train_loss": -26.898054122924805, "global_step": 441371, "epoch": 5317} {"train_loss": -26.768232345581055, "global_step": 441372, "epoch": 5317} {"train_loss": -26.82522964477539, "global_step": 441373, "epoch": 5317} {"train_loss": -26.764896392822266, "global_step": 441374, "epoch": 5317} {"train_loss": -26.850860595703125, "global_step": 441375, "epoch": 5317} {"train_loss": -26.396865844726562, "global_step": 441376, "epoch": 5317} {"train_loss": -26.61423110961914, "global_step": 441377, "epoch": 5317} {"train_loss": -26.584686279296875, "global_step": 441378, "epoch": 5317} {"train_loss": -26.6165828704834, "global_step": 441379, "epoch": 5317} {"train_loss": -27.194143295288086, "global_step": 441380, "epoch": 5317} {"train_loss": -26.79294776916504, "global_step": 441381, "epoch": 5317} {"train_loss": -27.182172775268555, "global_step": 441382, "epoch": 5317} {"train_loss": -26.92315101623535, "global_step": 441383, "epoch": 5317} {"train_loss": -26.744647979736328, "global_step": 441384, "epoch": 5317} {"train_loss": -26.741424560546875, "global_step": 441385, "epoch": 5317} {"train_loss": -26.7426700592041, "global_step": 441386, "epoch": 5317} {"train_loss": -26.93704605102539, "global_step": 441387, "epoch": 5317} {"train_loss": -27.0783634185791, "global_step": 441388, "epoch": 5317} {"train_loss": -26.760547637939453, "global_step": 441389, "epoch": 5317} {"train_loss": -27.072790145874023, "global_step": 441390, "epoch": 5317} {"train_loss": -27.08074951171875, "global_step": 441391, "epoch": 5317} {"train_loss": -27.004663467407227, "global_step": 441392, "epoch": 5317} {"train_loss": -26.881924571761164, "global_step": 441393, "epoch": 5317, "val_loss": 6564658.0} {"train_loss": -26.902572631835938, "global_step": 441394, "epoch": 5318} {"train_loss": -26.50312614440918, "global_step": 441395, "epoch": 5318} {"train_loss": -26.998767852783203, "global_step": 441396, "epoch": 5318} {"train_loss": -26.520925521850586, "global_step": 441397, "epoch": 5318} {"train_loss": -26.9090633392334, "global_step": 441398, "epoch": 5318} {"train_loss": -26.82942008972168, "global_step": 441399, "epoch": 5318} {"train_loss": -26.442602157592773, "global_step": 441400, "epoch": 5318} {"train_loss": -26.895299911499023, "global_step": 441401, "epoch": 5318} {"train_loss": -26.878950119018555, "global_step": 441402, "epoch": 5318} {"train_loss": -26.688465118408203, "global_step": 441403, "epoch": 5318} {"train_loss": -27.040851593017578, "global_step": 441404, "epoch": 5318} {"train_loss": -26.655057907104492, "global_step": 441405, "epoch": 5318} {"train_loss": -26.831527709960938, "global_step": 441406, "epoch": 5318} {"train_loss": -26.788114547729492, "global_step": 441407, "epoch": 5318} {"train_loss": -26.8244686126709, "global_step": 441408, "epoch": 5318} {"train_loss": -26.714553833007812, "global_step": 441409, "epoch": 5318} {"train_loss": -26.858442306518555, "global_step": 441410, "epoch": 5318} {"train_loss": -27.09539794921875, "global_step": 441411, "epoch": 5318} {"train_loss": -26.742420196533203, "global_step": 441412, "epoch": 5318} {"train_loss": -26.569921493530273, "global_step": 441413, "epoch": 5318} {"train_loss": -26.803192138671875, "global_step": 441414, "epoch": 5318} {"train_loss": -26.791351318359375, "global_step": 441415, "epoch": 5318} {"train_loss": -26.665563583374023, "global_step": 441416, "epoch": 5318} {"train_loss": -26.687646865844727, "global_step": 441417, "epoch": 5318} {"train_loss": -26.825031280517578, "global_step": 441418, "epoch": 5318} {"train_loss": -26.850805282592773, "global_step": 441419, "epoch": 5318} {"train_loss": -26.895578384399414, "global_step": 441420, "epoch": 5318} {"train_loss": -26.86161231994629, "global_step": 441421, "epoch": 5318} {"train_loss": -26.911611557006836, "global_step": 441422, "epoch": 5318} {"train_loss": -26.6219425201416, "global_step": 441423, "epoch": 5318} {"train_loss": -26.871488571166992, "global_step": 441424, "epoch": 5318} {"train_loss": -27.07142448425293, "global_step": 441425, "epoch": 5318} {"train_loss": -26.64188575744629, "global_step": 441426, "epoch": 5318} {"train_loss": -27.127410888671875, "global_step": 441427, "epoch": 5318} {"train_loss": -26.824371337890625, "global_step": 441428, "epoch": 5318} {"train_loss": -27.032867431640625, "global_step": 441429, "epoch": 5318} {"train_loss": -26.6500244140625, "global_step": 441430, "epoch": 5318} {"train_loss": -27.31623649597168, "global_step": 441431, "epoch": 5318} {"train_loss": -27.061925888061523, "global_step": 441432, "epoch": 5318} {"train_loss": -27.271469116210938, "global_step": 441433, "epoch": 5318} {"train_loss": -27.04033851623535, "global_step": 441434, "epoch": 5318} {"train_loss": -27.14472007751465, "global_step": 441435, "epoch": 5318} {"train_loss": -27.18635368347168, "global_step": 441436, "epoch": 5318} {"train_loss": -26.868316650390625, "global_step": 441437, "epoch": 5318} {"train_loss": -26.75616455078125, "global_step": 441438, "epoch": 5318} {"train_loss": -27.0188045501709, "global_step": 441439, "epoch": 5318} {"train_loss": -27.068662643432617, "global_step": 441440, "epoch": 5318} {"train_loss": -26.80055046081543, "global_step": 441441, "epoch": 5318} {"train_loss": -26.908557891845703, "global_step": 441442, "epoch": 5318} {"train_loss": -27.195913314819336, "global_step": 441443, "epoch": 5318} {"train_loss": -27.24201774597168, "global_step": 441444, "epoch": 5318} {"train_loss": -27.237960815429688, "global_step": 441445, "epoch": 5318} {"train_loss": -27.26545524597168, "global_step": 441446, "epoch": 5318} {"train_loss": -27.009933471679688, "global_step": 441447, "epoch": 5318} {"train_loss": -27.356281280517578, "global_step": 441448, "epoch": 5318} {"train_loss": -27.4176082611084, "global_step": 441449, "epoch": 5318} {"train_loss": -27.109832763671875, "global_step": 441450, "epoch": 5318} {"train_loss": -27.03675651550293, "global_step": 441451, "epoch": 5318} {"train_loss": -26.995328903198242, "global_step": 441452, "epoch": 5318} {"train_loss": -27.2136173248291, "global_step": 441453, "epoch": 5318} {"train_loss": -27.019880294799805, "global_step": 441454, "epoch": 5318} {"train_loss": -26.91596031188965, "global_step": 441455, "epoch": 5318} {"train_loss": -27.283716201782227, "global_step": 441456, "epoch": 5318} {"train_loss": -26.759815216064453, "global_step": 441457, "epoch": 5318} {"train_loss": -27.229129791259766, "global_step": 441458, "epoch": 5318} {"train_loss": -27.463598251342773, "global_step": 441459, "epoch": 5318} {"train_loss": -27.201017379760742, "global_step": 441460, "epoch": 5318} {"train_loss": -27.097564697265625, "global_step": 441461, "epoch": 5318} {"train_loss": -26.880695343017578, "global_step": 441462, "epoch": 5318} {"train_loss": -27.07413673400879, "global_step": 441463, "epoch": 5318} {"train_loss": -27.224090576171875, "global_step": 441464, "epoch": 5318} {"train_loss": -27.258380889892578, "global_step": 441465, "epoch": 5318} {"train_loss": -27.067047119140625, "global_step": 441466, "epoch": 5318} {"train_loss": -27.15326499938965, "global_step": 441467, "epoch": 5318} {"train_loss": -26.769805908203125, "global_step": 441468, "epoch": 5318} {"train_loss": -26.655858993530273, "global_step": 441469, "epoch": 5318} {"train_loss": -26.24810791015625, "global_step": 441470, "epoch": 5318} {"train_loss": -25.722387313842773, "global_step": 441471, "epoch": 5318} {"train_loss": -25.695148468017578, "global_step": 441472, "epoch": 5318} {"train_loss": -26.38469886779785, "global_step": 441473, "epoch": 5318} {"train_loss": -26.899118423461914, "global_step": 441474, "epoch": 5318} {"train_loss": -26.54481315612793, "global_step": 441475, "epoch": 5318} {"train_loss": -26.883608323981964, "global_step": 441476, "epoch": 5318, "val_loss": 6703000.5} {"train_loss": -26.446645736694336, "global_step": 441477, "epoch": 5319} {"train_loss": -26.12325096130371, "global_step": 441478, "epoch": 5319} {"train_loss": -25.9595890045166, "global_step": 441479, "epoch": 5319} {"train_loss": -26.501087188720703, "global_step": 441480, "epoch": 5319} {"train_loss": -26.213354110717773, "global_step": 441481, "epoch": 5319} {"train_loss": -26.39592933654785, "global_step": 441482, "epoch": 5319} {"train_loss": -26.25497817993164, "global_step": 441483, "epoch": 5319} {"train_loss": -26.43678092956543, "global_step": 441484, "epoch": 5319} {"train_loss": -26.309492111206055, "global_step": 441485, "epoch": 5319} {"train_loss": -26.64157485961914, "global_step": 441486, "epoch": 5319} {"train_loss": -26.52656364440918, "global_step": 441487, "epoch": 5319} {"train_loss": -26.612518310546875, "global_step": 441488, "epoch": 5319} {"train_loss": -26.425846099853516, "global_step": 441489, "epoch": 5319} {"train_loss": -27.013696670532227, "global_step": 441490, "epoch": 5319} {"train_loss": -26.352624893188477, "global_step": 441491, "epoch": 5319} {"train_loss": -26.98963737487793, "global_step": 441492, "epoch": 5319} {"train_loss": -26.475116729736328, "global_step": 441493, "epoch": 5319} {"train_loss": -26.820905685424805, "global_step": 441494, "epoch": 5319} {"train_loss": -26.567174911499023, "global_step": 441495, "epoch": 5319} {"train_loss": -26.848724365234375, "global_step": 441496, "epoch": 5319} {"train_loss": -26.824804306030273, "global_step": 441497, "epoch": 5319} {"train_loss": -27.138904571533203, "global_step": 441498, "epoch": 5319} {"train_loss": -26.9198055267334, "global_step": 441499, "epoch": 5319} {"train_loss": -26.930532455444336, "global_step": 441500, "epoch": 5319} {"train_loss": -27.090002059936523, "global_step": 441501, "epoch": 5319} {"train_loss": -26.856216430664062, "global_step": 441502, "epoch": 5319} {"train_loss": -26.91485595703125, "global_step": 441503, "epoch": 5319} {"train_loss": -27.1881046295166, "global_step": 441504, "epoch": 5319} {"train_loss": -26.813241958618164, "global_step": 441505, "epoch": 5319} {"train_loss": -27.108158111572266, "global_step": 441506, "epoch": 5319} {"train_loss": -26.65056800842285, "global_step": 441507, "epoch": 5319} {"train_loss": -26.654315948486328, "global_step": 441508, "epoch": 5319} {"train_loss": -26.849470138549805, "global_step": 441509, "epoch": 5319} {"train_loss": -27.29859733581543, "global_step": 441510, "epoch": 5319} {"train_loss": -26.869766235351562, "global_step": 441511, "epoch": 5319} {"train_loss": -27.317840576171875, "global_step": 441512, "epoch": 5319} {"train_loss": -26.890705108642578, "global_step": 441513, "epoch": 5319} {"train_loss": -27.011762619018555, "global_step": 441514, "epoch": 5319} {"train_loss": -27.34412956237793, "global_step": 441515, "epoch": 5319} {"train_loss": -26.845930099487305, "global_step": 441516, "epoch": 5319} {"train_loss": -26.810277938842773, "global_step": 441517, "epoch": 5319} {"train_loss": -27.09002685546875, "global_step": 441518, "epoch": 5319} {"train_loss": -27.350122451782227, "global_step": 441519, "epoch": 5319} {"train_loss": -27.348224639892578, "global_step": 441520, "epoch": 5319} {"train_loss": -27.107690811157227, "global_step": 441521, "epoch": 5319} {"train_loss": -26.97344398498535, "global_step": 441522, "epoch": 5319} {"train_loss": -27.079763412475586, "global_step": 441523, "epoch": 5319} {"train_loss": -27.305572509765625, "global_step": 441524, "epoch": 5319} {"train_loss": -27.00129508972168, "global_step": 441525, "epoch": 5319} {"train_loss": -27.1541805267334, "global_step": 441526, "epoch": 5319} {"train_loss": -26.89728355407715, "global_step": 441527, "epoch": 5319} {"train_loss": -26.782316207885742, "global_step": 441528, "epoch": 5319} {"train_loss": -26.91326332092285, "global_step": 441529, "epoch": 5319} {"train_loss": -27.27154541015625, "global_step": 441530, "epoch": 5319} {"train_loss": -26.91035270690918, "global_step": 441531, "epoch": 5319} {"train_loss": -27.111841201782227, "global_step": 441532, "epoch": 5319} {"train_loss": -27.24580192565918, "global_step": 441533, "epoch": 5319} {"train_loss": -26.993133544921875, "global_step": 441534, "epoch": 5319} {"train_loss": -27.15362548828125, "global_step": 441535, "epoch": 5319} {"train_loss": -27.32373046875, "global_step": 441536, "epoch": 5319} {"train_loss": -27.118799209594727, "global_step": 441537, "epoch": 5319} {"train_loss": -26.975189208984375, "global_step": 441538, "epoch": 5319} {"train_loss": -26.995832443237305, "global_step": 441539, "epoch": 5319} {"train_loss": -27.317413330078125, "global_step": 441540, "epoch": 5319} {"train_loss": -27.14141273498535, "global_step": 441541, "epoch": 5319} {"train_loss": -26.968366622924805, "global_step": 441542, "epoch": 5319} {"train_loss": -27.466123580932617, "global_step": 441543, "epoch": 5319} {"train_loss": -26.953582763671875, "global_step": 441544, "epoch": 5319} {"train_loss": -26.6214656829834, "global_step": 441545, "epoch": 5319} {"train_loss": -27.251440048217773, "global_step": 441546, "epoch": 5319} {"train_loss": -26.962757110595703, "global_step": 441547, "epoch": 5319} {"train_loss": -26.789295196533203, "global_step": 441548, "epoch": 5319} {"train_loss": -26.856245040893555, "global_step": 441549, "epoch": 5319} {"train_loss": -27.26947593688965, "global_step": 441550, "epoch": 5319} {"train_loss": -26.995885848999023, "global_step": 441551, "epoch": 5319} {"train_loss": -26.85358238220215, "global_step": 441552, "epoch": 5319} {"train_loss": -27.0405216217041, "global_step": 441553, "epoch": 5319} {"train_loss": -27.061880111694336, "global_step": 441554, "epoch": 5319} {"train_loss": -27.3011417388916, "global_step": 441555, "epoch": 5319} {"train_loss": -27.029865264892578, "global_step": 441556, "epoch": 5319} {"train_loss": -26.950607299804688, "global_step": 441557, "epoch": 5319} {"train_loss": -27.084386825561523, "global_step": 441558, "epoch": 5319} {"train_loss": -26.914682503206183, "global_step": 441559, "epoch": 5319, "val_loss": 6689414.5} {"train_loss": -25.745697021484375, "global_step": 441560, "epoch": 5320} {"train_loss": -26.172483444213867, "global_step": 441561, "epoch": 5320} {"train_loss": -26.16375732421875, "global_step": 441562, "epoch": 5320} {"train_loss": -25.046911239624023, "global_step": 441563, "epoch": 5320} {"train_loss": -25.507232666015625, "global_step": 441564, "epoch": 5320} {"train_loss": -26.2878360748291, "global_step": 441565, "epoch": 5320} {"train_loss": -25.716642379760742, "global_step": 441566, "epoch": 5320} {"train_loss": -26.059019088745117, "global_step": 441567, "epoch": 5320} {"train_loss": -26.06104850769043, "global_step": 441568, "epoch": 5320} {"train_loss": -26.467731475830078, "global_step": 441569, "epoch": 5320} {"train_loss": -26.039960861206055, "global_step": 441570, "epoch": 5320} {"train_loss": -26.457563400268555, "global_step": 441571, "epoch": 5320} {"train_loss": -25.875131607055664, "global_step": 441572, "epoch": 5320} {"train_loss": -26.28678321838379, "global_step": 441573, "epoch": 5320} {"train_loss": -26.37158203125, "global_step": 441574, "epoch": 5320} {"train_loss": -26.150516510009766, "global_step": 441575, "epoch": 5320} {"train_loss": -26.146331787109375, "global_step": 441576, "epoch": 5320} {"train_loss": -26.58866310119629, "global_step": 441577, "epoch": 5320} {"train_loss": -26.232162475585938, "global_step": 441578, "epoch": 5320} {"train_loss": -26.77643394470215, "global_step": 441579, "epoch": 5320} {"train_loss": -26.333322525024414, "global_step": 441580, "epoch": 5320} {"train_loss": -26.347135543823242, "global_step": 441581, "epoch": 5320} {"train_loss": -26.61542320251465, "global_step": 441582, "epoch": 5320} {"train_loss": -26.60456657409668, "global_step": 441583, "epoch": 5320} {"train_loss": -27.09942054748535, "global_step": 441584, "epoch": 5320} {"train_loss": -26.705678939819336, "global_step": 441585, "epoch": 5320} {"train_loss": -26.416156768798828, "global_step": 441586, "epoch": 5320} {"train_loss": -26.67925453186035, "global_step": 441587, "epoch": 5320} {"train_loss": -27.06943130493164, "global_step": 441588, "epoch": 5320} {"train_loss": -26.67579460144043, "global_step": 441589, "epoch": 5320} {"train_loss": -26.39816665649414, "global_step": 441590, "epoch": 5320} {"train_loss": -26.61219596862793, "global_step": 441591, "epoch": 5320} {"train_loss": -27.218307495117188, "global_step": 441592, "epoch": 5320} {"train_loss": -26.739852905273438, "global_step": 441593, "epoch": 5320} {"train_loss": -26.709705352783203, "global_step": 441594, "epoch": 5320} {"train_loss": -26.619653701782227, "global_step": 441595, "epoch": 5320} {"train_loss": -26.89499855041504, "global_step": 441596, "epoch": 5320} {"train_loss": -26.536212921142578, "global_step": 441597, "epoch": 5320} {"train_loss": -26.804407119750977, "global_step": 441598, "epoch": 5320} {"train_loss": -26.882160186767578, "global_step": 441599, "epoch": 5320} {"train_loss": -26.900968551635742, "global_step": 441600, "epoch": 5320} {"train_loss": -26.926237106323242, "global_step": 441601, "epoch": 5320} {"train_loss": -26.7935848236084, "global_step": 441602, "epoch": 5320} {"train_loss": -27.032812118530273, "global_step": 441603, "epoch": 5320} {"train_loss": -26.737375259399414, "global_step": 441604, "epoch": 5320} {"train_loss": -27.2460880279541, "global_step": 441605, "epoch": 5320} {"train_loss": -26.572797775268555, "global_step": 441606, "epoch": 5320} {"train_loss": -27.177570343017578, "global_step": 441607, "epoch": 5320} {"train_loss": -26.97540855407715, "global_step": 441608, "epoch": 5320} {"train_loss": -27.25750160217285, "global_step": 441609, "epoch": 5320} {"train_loss": -26.99355125427246, "global_step": 441610, "epoch": 5320} {"train_loss": -27.17954444885254, "global_step": 441611, "epoch": 5320} {"train_loss": -26.853485107421875, "global_step": 441612, "epoch": 5320} {"train_loss": -27.010257720947266, "global_step": 441613, "epoch": 5320} {"train_loss": -26.762556076049805, "global_step": 441614, "epoch": 5320} {"train_loss": -27.000934600830078, "global_step": 441615, "epoch": 5320} {"train_loss": -27.1768798828125, "global_step": 441616, "epoch": 5320} {"train_loss": -26.856962203979492, "global_step": 441617, "epoch": 5320} {"train_loss": -27.27324867248535, "global_step": 441618, "epoch": 5320} {"train_loss": -26.816137313842773, "global_step": 441619, "epoch": 5320} {"train_loss": -27.052082061767578, "global_step": 441620, "epoch": 5320} {"train_loss": -27.26801872253418, "global_step": 441621, "epoch": 5320} {"train_loss": -27.3293399810791, "global_step": 441622, "epoch": 5320} {"train_loss": -26.8809871673584, "global_step": 441623, "epoch": 5320} {"train_loss": -26.912738800048828, "global_step": 441624, "epoch": 5320} {"train_loss": -27.14963722229004, "global_step": 441625, "epoch": 5320} {"train_loss": -27.30781364440918, "global_step": 441626, "epoch": 5320} {"train_loss": -27.240386962890625, "global_step": 441627, "epoch": 5320} {"train_loss": -26.936767578125, "global_step": 441628, "epoch": 5320} {"train_loss": -26.792173385620117, "global_step": 441629, "epoch": 5320} {"train_loss": -26.7662353515625, "global_step": 441630, "epoch": 5320} {"train_loss": -27.01276206970215, "global_step": 441631, "epoch": 5320} {"train_loss": -27.131763458251953, "global_step": 441632, "epoch": 5320} {"train_loss": -26.891178131103516, "global_step": 441633, "epoch": 5320} {"train_loss": -27.088363647460938, "global_step": 441634, "epoch": 5320} {"train_loss": -26.98859977722168, "global_step": 441635, "epoch": 5320} {"train_loss": -27.078527450561523, "global_step": 441636, "epoch": 5320} {"train_loss": -26.93003273010254, "global_step": 441637, "epoch": 5320} {"train_loss": -27.312620162963867, "global_step": 441638, "epoch": 5320} {"train_loss": -26.7019100189209, "global_step": 441639, "epoch": 5320} {"train_loss": -26.971364974975586, "global_step": 441640, "epoch": 5320} {"train_loss": -27.03159523010254, "global_step": 441641, "epoch": 5320} {"train_loss": -26.707613956497376, "global_step": 441642, "epoch": 5320, "val_loss": 6678957.0} {"train_loss": -26.831796646118164, "global_step": 441643, "epoch": 5321} {"train_loss": -25.74542808532715, "global_step": 441644, "epoch": 5321} {"train_loss": -26.720144271850586, "global_step": 441645, "epoch": 5321} {"train_loss": -26.354284286499023, "global_step": 441646, "epoch": 5321} {"train_loss": -26.67557716369629, "global_step": 441647, "epoch": 5321} {"train_loss": -25.947912216186523, "global_step": 441648, "epoch": 5321} {"train_loss": -26.282312393188477, "global_step": 441649, "epoch": 5321} {"train_loss": -26.316247940063477, "global_step": 441650, "epoch": 5321} {"train_loss": -26.3255558013916, "global_step": 441651, "epoch": 5321} {"train_loss": -26.329883575439453, "global_step": 441652, "epoch": 5321} {"train_loss": -26.323413848876953, "global_step": 441653, "epoch": 5321} {"train_loss": -26.73211669921875, "global_step": 441654, "epoch": 5321} {"train_loss": -26.55106544494629, "global_step": 441655, "epoch": 5321} {"train_loss": -26.4851131439209, "global_step": 441656, "epoch": 5321} {"train_loss": -27.028522491455078, "global_step": 441657, "epoch": 5321} {"train_loss": -27.035863876342773, "global_step": 441658, "epoch": 5321} {"train_loss": -26.54376792907715, "global_step": 441659, "epoch": 5321} {"train_loss": -26.9403076171875, "global_step": 441660, "epoch": 5321} {"train_loss": -26.665332794189453, "global_step": 441661, "epoch": 5321} {"train_loss": -26.822528839111328, "global_step": 441662, "epoch": 5321} {"train_loss": -26.550134658813477, "global_step": 441663, "epoch": 5321} {"train_loss": -26.816455841064453, "global_step": 441664, "epoch": 5321} {"train_loss": -26.78009033203125, "global_step": 441665, "epoch": 5321} {"train_loss": -27.042343139648438, "global_step": 441666, "epoch": 5321} {"train_loss": -26.72782325744629, "global_step": 441667, "epoch": 5321} {"train_loss": -26.7636661529541, "global_step": 441668, "epoch": 5321} {"train_loss": -26.917194366455078, "global_step": 441669, "epoch": 5321} {"train_loss": -26.84140396118164, "global_step": 441670, "epoch": 5321} {"train_loss": -26.936279296875, "global_step": 441671, "epoch": 5321} {"train_loss": -27.2823429107666, "global_step": 441672, "epoch": 5321} {"train_loss": -27.1951847076416, "global_step": 441673, "epoch": 5321} {"train_loss": -26.823139190673828, "global_step": 441674, "epoch": 5321} {"train_loss": -27.05000877380371, "global_step": 441675, "epoch": 5321} {"train_loss": -27.04559326171875, "global_step": 441676, "epoch": 5321} {"train_loss": -26.756559371948242, "global_step": 441677, "epoch": 5321} {"train_loss": -26.84132957458496, "global_step": 441678, "epoch": 5321} {"train_loss": -26.979108810424805, "global_step": 441679, "epoch": 5321} {"train_loss": -27.033105850219727, "global_step": 441680, "epoch": 5321} {"train_loss": -27.119464874267578, "global_step": 441681, "epoch": 5321} {"train_loss": -26.83575439453125, "global_step": 441682, "epoch": 5321} {"train_loss": -26.687774658203125, "global_step": 441683, "epoch": 5321} {"train_loss": -27.026020050048828, "global_step": 441684, "epoch": 5321} {"train_loss": -27.3774471282959, "global_step": 441685, "epoch": 5321} {"train_loss": -27.235107421875, "global_step": 441686, "epoch": 5321} {"train_loss": -26.623563766479492, "global_step": 441687, "epoch": 5321} {"train_loss": -27.20856285095215, "global_step": 441688, "epoch": 5321} {"train_loss": -27.08658218383789, "global_step": 441689, "epoch": 5321} {"train_loss": -27.398237228393555, "global_step": 441690, "epoch": 5321} {"train_loss": -26.910797119140625, "global_step": 441691, "epoch": 5321} {"train_loss": -27.175016403198242, "global_step": 441692, "epoch": 5321} {"train_loss": -26.961820602416992, "global_step": 441693, "epoch": 5321} {"train_loss": -27.07818031311035, "global_step": 441694, "epoch": 5321} {"train_loss": -26.82845115661621, "global_step": 441695, "epoch": 5321} {"train_loss": -27.097976684570312, "global_step": 441696, "epoch": 5321} {"train_loss": -27.179046630859375, "global_step": 441697, "epoch": 5321} {"train_loss": -27.194015502929688, "global_step": 441698, "epoch": 5321} {"train_loss": -27.117528915405273, "global_step": 441699, "epoch": 5321} {"train_loss": -26.461278915405273, "global_step": 441700, "epoch": 5321} {"train_loss": -26.86663818359375, "global_step": 441701, "epoch": 5321} {"train_loss": -27.286664962768555, "global_step": 441702, "epoch": 5321} {"train_loss": -26.820972442626953, "global_step": 441703, "epoch": 5321} {"train_loss": -26.980148315429688, "global_step": 441704, "epoch": 5321} {"train_loss": -26.883625030517578, "global_step": 441705, "epoch": 5321} {"train_loss": -27.239028930664062, "global_step": 441706, "epoch": 5321} {"train_loss": -27.331296920776367, "global_step": 441707, "epoch": 5321} {"train_loss": -27.228052139282227, "global_step": 441708, "epoch": 5321} {"train_loss": -26.974390029907227, "global_step": 441709, "epoch": 5321} {"train_loss": -27.25494384765625, "global_step": 441710, "epoch": 5321} {"train_loss": -27.00349235534668, "global_step": 441711, "epoch": 5321} {"train_loss": -27.325366973876953, "global_step": 441712, "epoch": 5321} {"train_loss": -26.990304946899414, "global_step": 441713, "epoch": 5321} {"train_loss": -27.001150131225586, "global_step": 441714, "epoch": 5321} {"train_loss": -27.050220489501953, "global_step": 441715, "epoch": 5321} {"train_loss": -26.956212997436523, "global_step": 441716, "epoch": 5321} {"train_loss": -26.79697608947754, "global_step": 441717, "epoch": 5321} {"train_loss": -27.262357711791992, "global_step": 441718, "epoch": 5321} {"train_loss": -27.1378116607666, "global_step": 441719, "epoch": 5321} {"train_loss": -26.90191650390625, "global_step": 441720, "epoch": 5321} {"train_loss": -27.177289962768555, "global_step": 441721, "epoch": 5321} {"train_loss": -26.801162719726562, "global_step": 441722, "epoch": 5321} {"train_loss": -27.078571319580078, "global_step": 441723, "epoch": 5321} {"train_loss": -27.252103805541992, "global_step": 441724, "epoch": 5321} {"train_loss": -26.89441246584237, "global_step": 441725, "epoch": 5321, "val_loss": 6707070.0} {"train_loss": -26.77353858947754, "global_step": 441726, "epoch": 5322} {"train_loss": -26.692602157592773, "global_step": 441727, "epoch": 5322} {"train_loss": -26.29062843322754, "global_step": 441728, "epoch": 5322} {"train_loss": -26.57895278930664, "global_step": 441729, "epoch": 5322} {"train_loss": -26.69025230407715, "global_step": 441730, "epoch": 5322} {"train_loss": -26.64186668395996, "global_step": 441731, "epoch": 5322} {"train_loss": -26.849700927734375, "global_step": 441732, "epoch": 5322} {"train_loss": -26.350589752197266, "global_step": 441733, "epoch": 5322} {"train_loss": -27.020599365234375, "global_step": 441734, "epoch": 5322} {"train_loss": -26.4783935546875, "global_step": 441735, "epoch": 5322} {"train_loss": -26.41007423400879, "global_step": 441736, "epoch": 5322} {"train_loss": -26.7935733795166, "global_step": 441737, "epoch": 5322} {"train_loss": -26.370508193969727, "global_step": 441738, "epoch": 5322} {"train_loss": -26.721710205078125, "global_step": 441739, "epoch": 5322} {"train_loss": -26.86372184753418, "global_step": 441740, "epoch": 5322} {"train_loss": -26.18768310546875, "global_step": 441741, "epoch": 5322} {"train_loss": -26.295822143554688, "global_step": 441742, "epoch": 5322} {"train_loss": -26.37689208984375, "global_step": 441743, "epoch": 5322} {"train_loss": -26.841108322143555, "global_step": 441744, "epoch": 5322} {"train_loss": -26.975492477416992, "global_step": 441745, "epoch": 5322} {"train_loss": -26.63640785217285, "global_step": 441746, "epoch": 5322} {"train_loss": -26.84868812561035, "global_step": 441747, "epoch": 5322} {"train_loss": -26.737272262573242, "global_step": 441748, "epoch": 5322} {"train_loss": -26.860593795776367, "global_step": 441749, "epoch": 5322} {"train_loss": -26.503332138061523, "global_step": 441750, "epoch": 5322} {"train_loss": -26.676416397094727, "global_step": 441751, "epoch": 5322} {"train_loss": -26.935287475585938, "global_step": 441752, "epoch": 5322} {"train_loss": -26.560806274414062, "global_step": 441753, "epoch": 5322} {"train_loss": -27.28944206237793, "global_step": 441754, "epoch": 5322} {"train_loss": -26.9625244140625, "global_step": 441755, "epoch": 5322} {"train_loss": -26.661487579345703, "global_step": 441756, "epoch": 5322} {"train_loss": -26.99163246154785, "global_step": 441757, "epoch": 5322} {"train_loss": -26.95102310180664, "global_step": 441758, "epoch": 5322} {"train_loss": -27.107297897338867, "global_step": 441759, "epoch": 5322} {"train_loss": -26.81308364868164, "global_step": 441760, "epoch": 5322} {"train_loss": -27.079553604125977, "global_step": 441761, "epoch": 5322} {"train_loss": -26.9644832611084, "global_step": 441762, "epoch": 5322} {"train_loss": -27.00945472717285, "global_step": 441763, "epoch": 5322} {"train_loss": -27.001224517822266, "global_step": 441764, "epoch": 5322} {"train_loss": -26.903827667236328, "global_step": 441765, "epoch": 5322} {"train_loss": -27.377607345581055, "global_step": 441766, "epoch": 5322} {"train_loss": -27.047388076782227, "global_step": 441767, "epoch": 5322} {"train_loss": -27.0999813079834, "global_step": 441768, "epoch": 5322} {"train_loss": -27.320388793945312, "global_step": 441769, "epoch": 5322} {"train_loss": -27.10984230041504, "global_step": 441770, "epoch": 5322} {"train_loss": -27.239856719970703, "global_step": 441771, "epoch": 5322} {"train_loss": -26.541357040405273, "global_step": 441772, "epoch": 5322} {"train_loss": -26.714120864868164, "global_step": 441773, "epoch": 5322} {"train_loss": -26.143585205078125, "global_step": 441774, "epoch": 5322} {"train_loss": -26.512094497680664, "global_step": 441775, "epoch": 5322} {"train_loss": -26.992446899414062, "global_step": 441776, "epoch": 5322} {"train_loss": -27.048078536987305, "global_step": 441777, "epoch": 5322} {"train_loss": -26.762128829956055, "global_step": 441778, "epoch": 5322} {"train_loss": -26.957433700561523, "global_step": 441779, "epoch": 5322} {"train_loss": -27.175128936767578, "global_step": 441780, "epoch": 5322} {"train_loss": -27.117109298706055, "global_step": 441781, "epoch": 5322} {"train_loss": -27.030670166015625, "global_step": 441782, "epoch": 5322} {"train_loss": -26.725366592407227, "global_step": 441783, "epoch": 5322} {"train_loss": -27.048322677612305, "global_step": 441784, "epoch": 5322} {"train_loss": -27.076480865478516, "global_step": 441785, "epoch": 5322} {"train_loss": -26.813772201538086, "global_step": 441786, "epoch": 5322} {"train_loss": -26.594635009765625, "global_step": 441787, "epoch": 5322} {"train_loss": -26.728193283081055, "global_step": 441788, "epoch": 5322} {"train_loss": -27.007068634033203, "global_step": 441789, "epoch": 5322} {"train_loss": -27.27842140197754, "global_step": 441790, "epoch": 5322} {"train_loss": -27.22285270690918, "global_step": 441791, "epoch": 5322} {"train_loss": -27.171634674072266, "global_step": 441792, "epoch": 5322} {"train_loss": -26.837976455688477, "global_step": 441793, "epoch": 5322} {"train_loss": -27.27161979675293, "global_step": 441794, "epoch": 5322} {"train_loss": -27.0183048248291, "global_step": 441795, "epoch": 5322} {"train_loss": -26.77315330505371, "global_step": 441796, "epoch": 5322} {"train_loss": -27.067279815673828, "global_step": 441797, "epoch": 5322} {"train_loss": -27.353656768798828, "global_step": 441798, "epoch": 5322} {"train_loss": -27.13654136657715, "global_step": 441799, "epoch": 5322} {"train_loss": -27.30537223815918, "global_step": 441800, "epoch": 5322} {"train_loss": -27.066923141479492, "global_step": 441801, "epoch": 5322} {"train_loss": -27.020322799682617, "global_step": 441802, "epoch": 5322} {"train_loss": -26.965316772460938, "global_step": 441803, "epoch": 5322} {"train_loss": -27.114517211914062, "global_step": 441804, "epoch": 5322} {"train_loss": -27.05902099609375, "global_step": 441805, "epoch": 5322} {"train_loss": -27.00359535217285, "global_step": 441806, "epoch": 5322} {"train_loss": -26.934988021850586, "global_step": 441807, "epoch": 5322} {"train_loss": -26.881669285785723, "global_step": 441808, "epoch": 5322, "val_loss": 6785438.0} {"train_loss": -25.33271026611328, "global_step": 441809, "epoch": 5323} {"train_loss": -24.721595764160156, "global_step": 441810, "epoch": 5323} {"train_loss": -24.42620277404785, "global_step": 441811, "epoch": 5323} {"train_loss": -24.62540054321289, "global_step": 441812, "epoch": 5323} {"train_loss": -25.9385929107666, "global_step": 441813, "epoch": 5323} {"train_loss": -25.846994400024414, "global_step": 441814, "epoch": 5323} {"train_loss": -25.548494338989258, "global_step": 441815, "epoch": 5323} {"train_loss": -26.183263778686523, "global_step": 441816, "epoch": 5323} {"train_loss": -25.502843856811523, "global_step": 441817, "epoch": 5323} {"train_loss": -26.083759307861328, "global_step": 441818, "epoch": 5323} {"train_loss": -26.025304794311523, "global_step": 441819, "epoch": 5323} {"train_loss": -25.43333625793457, "global_step": 441820, "epoch": 5323} {"train_loss": -25.857044219970703, "global_step": 441821, "epoch": 5323} {"train_loss": -25.770734786987305, "global_step": 441822, "epoch": 5323} {"train_loss": -26.111154556274414, "global_step": 441823, "epoch": 5323} {"train_loss": -26.214712142944336, "global_step": 441824, "epoch": 5323} {"train_loss": -26.277999877929688, "global_step": 441825, "epoch": 5323} {"train_loss": -25.665719985961914, "global_step": 441826, "epoch": 5323} {"train_loss": -26.065631866455078, "global_step": 441827, "epoch": 5323} {"train_loss": -25.833093643188477, "global_step": 441828, "epoch": 5323} {"train_loss": -26.37188720703125, "global_step": 441829, "epoch": 5323} {"train_loss": -26.040761947631836, "global_step": 441830, "epoch": 5323} {"train_loss": -26.484100341796875, "global_step": 441831, "epoch": 5323} {"train_loss": -26.56231689453125, "global_step": 441832, "epoch": 5323} {"train_loss": -26.31318473815918, "global_step": 441833, "epoch": 5323} {"train_loss": -26.42937660217285, "global_step": 441834, "epoch": 5323} {"train_loss": -26.32025146484375, "global_step": 441835, "epoch": 5323} {"train_loss": -26.31348991394043, "global_step": 441836, "epoch": 5323} {"train_loss": -26.349546432495117, "global_step": 441837, "epoch": 5323} {"train_loss": -26.380905151367188, "global_step": 441838, "epoch": 5323} {"train_loss": -26.97525405883789, "global_step": 441839, "epoch": 5323} {"train_loss": -26.7186222076416, "global_step": 441840, "epoch": 5323} {"train_loss": -26.901533126831055, "global_step": 441841, "epoch": 5323} {"train_loss": -26.443164825439453, "global_step": 441842, "epoch": 5323} {"train_loss": -27.110742568969727, "global_step": 441843, "epoch": 5323} {"train_loss": -26.776519775390625, "global_step": 441844, "epoch": 5323} {"train_loss": -26.770099639892578, "global_step": 441845, "epoch": 5323} {"train_loss": -26.83137321472168, "global_step": 441846, "epoch": 5323} {"train_loss": -27.032886505126953, "global_step": 441847, "epoch": 5323} {"train_loss": -26.774641036987305, "global_step": 441848, "epoch": 5323} {"train_loss": -26.96187400817871, "global_step": 441849, "epoch": 5323} {"train_loss": -26.850629806518555, "global_step": 441850, "epoch": 5323} {"train_loss": -26.991010665893555, "global_step": 441851, "epoch": 5323} {"train_loss": -26.988418579101562, "global_step": 441852, "epoch": 5323} {"train_loss": -27.219425201416016, "global_step": 441853, "epoch": 5323} {"train_loss": -27.209930419921875, "global_step": 441854, "epoch": 5323} {"train_loss": -26.8686466217041, "global_step": 441855, "epoch": 5323} {"train_loss": -27.065189361572266, "global_step": 441856, "epoch": 5323} {"train_loss": -26.908126831054688, "global_step": 441857, "epoch": 5323} {"train_loss": -26.91322135925293, "global_step": 441858, "epoch": 5323} {"train_loss": -26.842641830444336, "global_step": 441859, "epoch": 5323} {"train_loss": -26.929779052734375, "global_step": 441860, "epoch": 5323} {"train_loss": -26.667673110961914, "global_step": 441861, "epoch": 5323} {"train_loss": -27.065290451049805, "global_step": 441862, "epoch": 5323} {"train_loss": -27.360082626342773, "global_step": 441863, "epoch": 5323} {"train_loss": -26.9865779876709, "global_step": 441864, "epoch": 5323} {"train_loss": -26.560993194580078, "global_step": 441865, "epoch": 5323} {"train_loss": -26.396930694580078, "global_step": 441866, "epoch": 5323} {"train_loss": -27.121667861938477, "global_step": 441867, "epoch": 5323} {"train_loss": -26.92182731628418, "global_step": 441868, "epoch": 5323} {"train_loss": -27.033430099487305, "global_step": 441869, "epoch": 5323} {"train_loss": -27.17622184753418, "global_step": 441870, "epoch": 5323} {"train_loss": -26.8975887298584, "global_step": 441871, "epoch": 5323} {"train_loss": -27.3310604095459, "global_step": 441872, "epoch": 5323} {"train_loss": -26.814741134643555, "global_step": 441873, "epoch": 5323} {"train_loss": -27.170995712280273, "global_step": 441874, "epoch": 5323} {"train_loss": -27.16102409362793, "global_step": 441875, "epoch": 5323} {"train_loss": -26.83990478515625, "global_step": 441876, "epoch": 5323} {"train_loss": -27.4514217376709, "global_step": 441877, "epoch": 5323} {"train_loss": -27.04170799255371, "global_step": 441878, "epoch": 5323} {"train_loss": -27.18849754333496, "global_step": 441879, "epoch": 5323} {"train_loss": -27.126718521118164, "global_step": 441880, "epoch": 5323} {"train_loss": -26.882312774658203, "global_step": 441881, "epoch": 5323} {"train_loss": -26.972822189331055, "global_step": 441882, "epoch": 5323} {"train_loss": -27.33722496032715, "global_step": 441883, "epoch": 5323} {"train_loss": -26.90545082092285, "global_step": 441884, "epoch": 5323} {"train_loss": -26.671781539916992, "global_step": 441885, "epoch": 5323} {"train_loss": -27.286001205444336, "global_step": 441886, "epoch": 5323} {"train_loss": -26.890283584594727, "global_step": 441887, "epoch": 5323} {"train_loss": -27.477371215820312, "global_step": 441888, "epoch": 5323} {"train_loss": -27.1358585357666, "global_step": 441889, "epoch": 5323} {"train_loss": -27.523035049438477, "global_step": 441890, "epoch": 5323} {"train_loss": -26.590813165687653, "global_step": 441891, "epoch": 5323, "val_loss": 6653361.0} {"train_loss": -24.130722045898438, "global_step": 441892, "epoch": 5324} {"train_loss": -22.643407821655273, "global_step": 441893, "epoch": 5324} {"train_loss": -24.76360321044922, "global_step": 441894, "epoch": 5324} {"train_loss": -26.000574111938477, "global_step": 441895, "epoch": 5324} {"train_loss": -25.02130126953125, "global_step": 441896, "epoch": 5324} {"train_loss": -26.705244064331055, "global_step": 441897, "epoch": 5324} {"train_loss": -25.09751319885254, "global_step": 441898, "epoch": 5324} {"train_loss": -26.28098487854004, "global_step": 441899, "epoch": 5324} {"train_loss": -25.21602439880371, "global_step": 441900, "epoch": 5324} {"train_loss": -26.017841339111328, "global_step": 441901, "epoch": 5324} {"train_loss": -25.922330856323242, "global_step": 441902, "epoch": 5324} {"train_loss": -25.79742431640625, "global_step": 441903, "epoch": 5324} {"train_loss": -26.14777183532715, "global_step": 441904, "epoch": 5324} {"train_loss": -26.121307373046875, "global_step": 441905, "epoch": 5324} {"train_loss": -25.861648559570312, "global_step": 441906, "epoch": 5324} {"train_loss": -25.92805290222168, "global_step": 441907, "epoch": 5324} {"train_loss": -26.064716339111328, "global_step": 441908, "epoch": 5324} {"train_loss": -26.088687896728516, "global_step": 441909, "epoch": 5324} {"train_loss": -26.01139259338379, "global_step": 441910, "epoch": 5324} {"train_loss": -26.454023361206055, "global_step": 441911, "epoch": 5324} {"train_loss": -26.19361686706543, "global_step": 441912, "epoch": 5324} {"train_loss": -26.183835983276367, "global_step": 441913, "epoch": 5324} {"train_loss": -26.6929988861084, "global_step": 441914, "epoch": 5324} {"train_loss": -26.6927547454834, "global_step": 441915, "epoch": 5324} {"train_loss": -26.835763931274414, "global_step": 441916, "epoch": 5324} {"train_loss": -26.096338272094727, "global_step": 441917, "epoch": 5324} {"train_loss": -26.571313858032227, "global_step": 441918, "epoch": 5324} {"train_loss": -26.332782745361328, "global_step": 441919, "epoch": 5324} {"train_loss": -26.6230525970459, "global_step": 441920, "epoch": 5324} {"train_loss": -26.413227081298828, "global_step": 441921, "epoch": 5324} {"train_loss": -26.783065795898438, "global_step": 441922, "epoch": 5324} {"train_loss": -26.62332534790039, "global_step": 441923, "epoch": 5324} {"train_loss": -26.85972023010254, "global_step": 441924, "epoch": 5324} {"train_loss": -26.662805557250977, "global_step": 441925, "epoch": 5324} {"train_loss": -26.753162384033203, "global_step": 441926, "epoch": 5324} {"train_loss": -26.909940719604492, "global_step": 441927, "epoch": 5324} {"train_loss": -26.850629806518555, "global_step": 441928, "epoch": 5324} {"train_loss": -26.883039474487305, "global_step": 441929, "epoch": 5324} {"train_loss": -26.864416122436523, "global_step": 441930, "epoch": 5324} {"train_loss": -26.813785552978516, "global_step": 441931, "epoch": 5324} {"train_loss": -27.198270797729492, "global_step": 441932, "epoch": 5324} {"train_loss": -27.0238037109375, "global_step": 441933, "epoch": 5324} {"train_loss": -26.3465518951416, "global_step": 441934, "epoch": 5324} {"train_loss": -27.17133903503418, "global_step": 441935, "epoch": 5324} {"train_loss": -27.31076431274414, "global_step": 441936, "epoch": 5324} {"train_loss": -26.985132217407227, "global_step": 441937, "epoch": 5324} {"train_loss": -26.943113327026367, "global_step": 441938, "epoch": 5324} {"train_loss": -27.023569107055664, "global_step": 441939, "epoch": 5324} {"train_loss": -27.115564346313477, "global_step": 441940, "epoch": 5324} {"train_loss": -26.6531925201416, "global_step": 441941, "epoch": 5324} {"train_loss": -27.162006378173828, "global_step": 441942, "epoch": 5324} {"train_loss": -27.30559730529785, "global_step": 441943, "epoch": 5324} {"train_loss": -27.00180435180664, "global_step": 441944, "epoch": 5324} {"train_loss": -26.627134323120117, "global_step": 441945, "epoch": 5324} {"train_loss": -27.047353744506836, "global_step": 441946, "epoch": 5324} {"train_loss": -27.053396224975586, "global_step": 441947, "epoch": 5324} {"train_loss": -26.934667587280273, "global_step": 441948, "epoch": 5324} {"train_loss": -26.956562042236328, "global_step": 441949, "epoch": 5324} {"train_loss": -27.14104652404785, "global_step": 441950, "epoch": 5324} {"train_loss": -27.027082443237305, "global_step": 441951, "epoch": 5324} {"train_loss": -27.441267013549805, "global_step": 441952, "epoch": 5324} {"train_loss": -26.93854331970215, "global_step": 441953, "epoch": 5324} {"train_loss": -27.171056747436523, "global_step": 441954, "epoch": 5324} {"train_loss": -26.87737464904785, "global_step": 441955, "epoch": 5324} {"train_loss": -27.31793785095215, "global_step": 441956, "epoch": 5324} {"train_loss": -27.087493896484375, "global_step": 441957, "epoch": 5324} {"train_loss": -26.949039459228516, "global_step": 441958, "epoch": 5324} {"train_loss": -26.822620391845703, "global_step": 441959, "epoch": 5324} {"train_loss": -27.461877822875977, "global_step": 441960, "epoch": 5324} {"train_loss": -27.093902587890625, "global_step": 441961, "epoch": 5324} {"train_loss": -27.329614639282227, "global_step": 441962, "epoch": 5324} {"train_loss": -27.296335220336914, "global_step": 441963, "epoch": 5324} {"train_loss": -26.56801414489746, "global_step": 441964, "epoch": 5324} {"train_loss": -26.7226505279541, "global_step": 441965, "epoch": 5324} {"train_loss": -27.001455307006836, "global_step": 441966, "epoch": 5324} {"train_loss": -26.89215087890625, "global_step": 441967, "epoch": 5324} {"train_loss": -27.3435001373291, "global_step": 441968, "epoch": 5324} {"train_loss": -26.9949893951416, "global_step": 441969, "epoch": 5324} {"train_loss": -27.15436363220215, "global_step": 441970, "epoch": 5324} {"train_loss": -27.193363189697266, "global_step": 441971, "epoch": 5324} {"train_loss": -27.144989013671875, "global_step": 441972, "epoch": 5324} {"train_loss": -26.550830841064453, "global_step": 441973, "epoch": 5324} {"train_loss": -26.6044543622488, "global_step": 441974, "epoch": 5324, "val_loss": 6719658.5} {"train_loss": -26.7159366607666, "global_step": 441975, "epoch": 5325} {"train_loss": -25.9791202545166, "global_step": 441976, "epoch": 5325} {"train_loss": -26.386396408081055, "global_step": 441977, "epoch": 5325} {"train_loss": -26.466711044311523, "global_step": 441978, "epoch": 5325} {"train_loss": -27.091983795166016, "global_step": 441979, "epoch": 5325} {"train_loss": -26.61679458618164, "global_step": 441980, "epoch": 5325} {"train_loss": -26.89985466003418, "global_step": 441981, "epoch": 5325} {"train_loss": -26.748754501342773, "global_step": 441982, "epoch": 5325} {"train_loss": -26.80254554748535, "global_step": 441983, "epoch": 5325} {"train_loss": -26.8597412109375, "global_step": 441984, "epoch": 5325} {"train_loss": -26.99891471862793, "global_step": 441985, "epoch": 5325} {"train_loss": -27.00599479675293, "global_step": 441986, "epoch": 5325} {"train_loss": -27.023426055908203, "global_step": 441987, "epoch": 5325} {"train_loss": -27.013029098510742, "global_step": 441988, "epoch": 5325} {"train_loss": -26.891143798828125, "global_step": 441989, "epoch": 5325} {"train_loss": -27.176156997680664, "global_step": 441990, "epoch": 5325} {"train_loss": -27.23164176940918, "global_step": 441991, "epoch": 5325} {"train_loss": -27.01553726196289, "global_step": 441992, "epoch": 5325} {"train_loss": -26.632648468017578, "global_step": 441993, "epoch": 5325} {"train_loss": -26.89898681640625, "global_step": 441994, "epoch": 5325} {"train_loss": -26.952743530273438, "global_step": 441995, "epoch": 5325} {"train_loss": -26.78944206237793, "global_step": 441996, "epoch": 5325} {"train_loss": -27.216257095336914, "global_step": 441997, "epoch": 5325} {"train_loss": -27.329328536987305, "global_step": 441998, "epoch": 5325} {"train_loss": -27.147192001342773, "global_step": 441999, "epoch": 5325} {"train_loss": -26.99763298034668, "global_step": 442000, "epoch": 5325} {"train_loss": -27.391754150390625, "global_step": 442001, "epoch": 5325} {"train_loss": -26.800382614135742, "global_step": 442002, "epoch": 5325} {"train_loss": -27.15178871154785, "global_step": 442003, "epoch": 5325} {"train_loss": -26.692747116088867, "global_step": 442004, "epoch": 5325} {"train_loss": -27.3044490814209, "global_step": 442005, "epoch": 5325} {"train_loss": -26.7611141204834, "global_step": 442006, "epoch": 5325} {"train_loss": -27.175222396850586, "global_step": 442007, "epoch": 5325} {"train_loss": -27.345563888549805, "global_step": 442008, "epoch": 5325} {"train_loss": -26.920642852783203, "global_step": 442009, "epoch": 5325} {"train_loss": -27.021442413330078, "global_step": 442010, "epoch": 5325} {"train_loss": -27.475683212280273, "global_step": 442011, "epoch": 5325} {"train_loss": -27.296960830688477, "global_step": 442012, "epoch": 5325} {"train_loss": -26.755163192749023, "global_step": 442013, "epoch": 5325} {"train_loss": -27.019718170166016, "global_step": 442014, "epoch": 5325} {"train_loss": -26.882104873657227, "global_step": 442015, "epoch": 5325} {"train_loss": -26.963031768798828, "global_step": 442016, "epoch": 5325} {"train_loss": -27.04290199279785, "global_step": 442017, "epoch": 5325} {"train_loss": -27.50441551208496, "global_step": 442018, "epoch": 5325} {"train_loss": -26.9910945892334, "global_step": 442019, "epoch": 5325} {"train_loss": -27.152557373046875, "global_step": 442020, "epoch": 5325} {"train_loss": -26.90997886657715, "global_step": 442021, "epoch": 5325} {"train_loss": -27.135770797729492, "global_step": 442022, "epoch": 5325} {"train_loss": -26.877277374267578, "global_step": 442023, "epoch": 5325} {"train_loss": -27.049407958984375, "global_step": 442024, "epoch": 5325} {"train_loss": -26.69056510925293, "global_step": 442025, "epoch": 5325} {"train_loss": -26.896207809448242, "global_step": 442026, "epoch": 5325} {"train_loss": -26.97161865234375, "global_step": 442027, "epoch": 5325} {"train_loss": -27.068445205688477, "global_step": 442028, "epoch": 5325} {"train_loss": -26.800750732421875, "global_step": 442029, "epoch": 5325} {"train_loss": -26.837961196899414, "global_step": 442030, "epoch": 5325} {"train_loss": -27.32392692565918, "global_step": 442031, "epoch": 5325} {"train_loss": -27.368555068969727, "global_step": 442032, "epoch": 5325} {"train_loss": -27.086400985717773, "global_step": 442033, "epoch": 5325} {"train_loss": -27.166234970092773, "global_step": 442034, "epoch": 5325} {"train_loss": -26.862823486328125, "global_step": 442035, "epoch": 5325} {"train_loss": -27.626432418823242, "global_step": 442036, "epoch": 5325} {"train_loss": -27.368005752563477, "global_step": 442037, "epoch": 5325} {"train_loss": -27.025012969970703, "global_step": 442038, "epoch": 5325} {"train_loss": -27.019866943359375, "global_step": 442039, "epoch": 5325} {"train_loss": -26.70654296875, "global_step": 442040, "epoch": 5325} {"train_loss": -26.765295028686523, "global_step": 442041, "epoch": 5325} {"train_loss": -27.43011474609375, "global_step": 442042, "epoch": 5325} {"train_loss": -26.95654296875, "global_step": 442043, "epoch": 5325} {"train_loss": -27.074481964111328, "global_step": 442044, "epoch": 5325} {"train_loss": -27.08772087097168, "global_step": 442045, "epoch": 5325} {"train_loss": -27.191770553588867, "global_step": 442046, "epoch": 5325} {"train_loss": -26.9516658782959, "global_step": 442047, "epoch": 5325} {"train_loss": -26.712438583374023, "global_step": 442048, "epoch": 5325} {"train_loss": -26.850454330444336, "global_step": 442049, "epoch": 5325} {"train_loss": -26.989530563354492, "global_step": 442050, "epoch": 5325} {"train_loss": -27.095869064331055, "global_step": 442051, "epoch": 5325} {"train_loss": -26.67048454284668, "global_step": 442052, "epoch": 5325} {"train_loss": -26.854307174682617, "global_step": 442053, "epoch": 5325} {"train_loss": -27.360254287719727, "global_step": 442054, "epoch": 5325} {"train_loss": -26.893512725830078, "global_step": 442055, "epoch": 5325} {"train_loss": -26.69428825378418, "global_step": 442056, "epoch": 5325} {"train_loss": -26.963944239788745, "global_step": 442057, "epoch": 5325, "val_loss": 6767572.5} {"train_loss": -18.790889739990234, "global_step": 442058, "epoch": 5326} {"train_loss": -23.689334869384766, "global_step": 442059, "epoch": 5326} {"train_loss": -23.617883682250977, "global_step": 442060, "epoch": 5326} {"train_loss": -23.744352340698242, "global_step": 442061, "epoch": 5326} {"train_loss": -23.798715591430664, "global_step": 442062, "epoch": 5326} {"train_loss": -24.734426498413086, "global_step": 442063, "epoch": 5326} {"train_loss": -23.50956916809082, "global_step": 442064, "epoch": 5326} {"train_loss": -24.93644142150879, "global_step": 442065, "epoch": 5326} {"train_loss": -24.973318099975586, "global_step": 442066, "epoch": 5326} {"train_loss": -24.826955795288086, "global_step": 442067, "epoch": 5326} {"train_loss": -25.429656982421875, "global_step": 442068, "epoch": 5326} {"train_loss": -25.582212448120117, "global_step": 442069, "epoch": 5326} {"train_loss": -25.2739315032959, "global_step": 442070, "epoch": 5326} {"train_loss": -25.846643447875977, "global_step": 442071, "epoch": 5326} {"train_loss": -25.628498077392578, "global_step": 442072, "epoch": 5326} {"train_loss": -25.53011131286621, "global_step": 442073, "epoch": 5326} {"train_loss": -25.948078155517578, "global_step": 442074, "epoch": 5326} {"train_loss": -25.691425323486328, "global_step": 442075, "epoch": 5326} {"train_loss": -25.612262725830078, "global_step": 442076, "epoch": 5326} {"train_loss": -25.762327194213867, "global_step": 442077, "epoch": 5326} {"train_loss": -26.151037216186523, "global_step": 442078, "epoch": 5326} {"train_loss": -25.975046157836914, "global_step": 442079, "epoch": 5326} {"train_loss": -25.972646713256836, "global_step": 442080, "epoch": 5326} {"train_loss": -25.731287002563477, "global_step": 442081, "epoch": 5326} {"train_loss": -26.4305419921875, "global_step": 442082, "epoch": 5326} {"train_loss": -26.069650650024414, "global_step": 442083, "epoch": 5326} {"train_loss": -26.233678817749023, "global_step": 442084, "epoch": 5326} {"train_loss": -26.224048614501953, "global_step": 442085, "epoch": 5326} {"train_loss": -26.432525634765625, "global_step": 442086, "epoch": 5326} {"train_loss": -26.258508682250977, "global_step": 442087, "epoch": 5326} {"train_loss": -26.259408950805664, "global_step": 442088, "epoch": 5326} {"train_loss": -26.26734733581543, "global_step": 442089, "epoch": 5326} {"train_loss": -26.374570846557617, "global_step": 442090, "epoch": 5326} {"train_loss": -26.267913818359375, "global_step": 442091, "epoch": 5326} {"train_loss": -26.631641387939453, "global_step": 442092, "epoch": 5326} {"train_loss": -26.53605079650879, "global_step": 442093, "epoch": 5326} {"train_loss": -26.113998413085938, "global_step": 442094, "epoch": 5326} {"train_loss": -25.742965698242188, "global_step": 442095, "epoch": 5326} {"train_loss": -26.642017364501953, "global_step": 442096, "epoch": 5326} {"train_loss": -26.74088478088379, "global_step": 442097, "epoch": 5326} {"train_loss": -26.35883903503418, "global_step": 442098, "epoch": 5326} {"train_loss": -26.771839141845703, "global_step": 442099, "epoch": 5326} {"train_loss": -26.966527938842773, "global_step": 442100, "epoch": 5326} {"train_loss": -26.691648483276367, "global_step": 442101, "epoch": 5326} {"train_loss": -26.886463165283203, "global_step": 442102, "epoch": 5326} {"train_loss": -26.45649528503418, "global_step": 442103, "epoch": 5326} {"train_loss": -26.928512573242188, "global_step": 442104, "epoch": 5326} {"train_loss": -26.74932289123535, "global_step": 442105, "epoch": 5326} {"train_loss": -27.089466094970703, "global_step": 442106, "epoch": 5326} {"train_loss": -26.601648330688477, "global_step": 442107, "epoch": 5326} {"train_loss": -26.720685958862305, "global_step": 442108, "epoch": 5326} {"train_loss": -26.76441764831543, "global_step": 442109, "epoch": 5326} {"train_loss": -26.837011337280273, "global_step": 442110, "epoch": 5326} {"train_loss": -26.748022079467773, "global_step": 442111, "epoch": 5326} {"train_loss": -26.784347534179688, "global_step": 442112, "epoch": 5326} {"train_loss": -27.07142448425293, "global_step": 442113, "epoch": 5326} {"train_loss": -27.1722469329834, "global_step": 442114, "epoch": 5326} {"train_loss": -26.96856117248535, "global_step": 442115, "epoch": 5326} {"train_loss": -26.989471435546875, "global_step": 442116, "epoch": 5326} {"train_loss": -26.764373779296875, "global_step": 442117, "epoch": 5326} {"train_loss": -27.177576065063477, "global_step": 442118, "epoch": 5326} {"train_loss": -27.076862335205078, "global_step": 442119, "epoch": 5326} {"train_loss": -26.84442138671875, "global_step": 442120, "epoch": 5326} {"train_loss": -27.003387451171875, "global_step": 442121, "epoch": 5326} {"train_loss": -26.97432518005371, "global_step": 442122, "epoch": 5326} {"train_loss": -26.77734375, "global_step": 442123, "epoch": 5326} {"train_loss": -26.906665802001953, "global_step": 442124, "epoch": 5326} {"train_loss": -27.387418746948242, "global_step": 442125, "epoch": 5326} {"train_loss": -27.051172256469727, "global_step": 442126, "epoch": 5326} {"train_loss": -26.99789810180664, "global_step": 442127, "epoch": 5326} {"train_loss": -27.185998916625977, "global_step": 442128, "epoch": 5326} {"train_loss": -26.950464248657227, "global_step": 442129, "epoch": 5326} {"train_loss": -27.13643455505371, "global_step": 442130, "epoch": 5326} {"train_loss": -27.092288970947266, "global_step": 442131, "epoch": 5326} {"train_loss": -26.936386108398438, "global_step": 442132, "epoch": 5326} {"train_loss": -26.808435440063477, "global_step": 442133, "epoch": 5326} {"train_loss": -27.307275772094727, "global_step": 442134, "epoch": 5326} {"train_loss": -26.792743682861328, "global_step": 442135, "epoch": 5326} {"train_loss": -27.187042236328125, "global_step": 442136, "epoch": 5326} {"train_loss": -27.124744415283203, "global_step": 442137, "epoch": 5326} {"train_loss": -26.850324630737305, "global_step": 442138, "epoch": 5326} {"train_loss": -26.99281120300293, "global_step": 442139, "epoch": 5326} {"train_loss": -26.23813677408609, "global_step": 442140, "epoch": 5326, "val_loss": 6624041.0} {"train_loss": -27.13686180114746, "global_step": 442141, "epoch": 5327} {"train_loss": -26.909765243530273, "global_step": 442142, "epoch": 5327} {"train_loss": -27.049047470092773, "global_step": 442143, "epoch": 5327} {"train_loss": -27.2528076171875, "global_step": 442144, "epoch": 5327} {"train_loss": -26.647062301635742, "global_step": 442145, "epoch": 5327} {"train_loss": -26.746540069580078, "global_step": 442146, "epoch": 5327} {"train_loss": -26.58955192565918, "global_step": 442147, "epoch": 5327} {"train_loss": -26.792749404907227, "global_step": 442148, "epoch": 5327} {"train_loss": -26.562341690063477, "global_step": 442149, "epoch": 5327} {"train_loss": -26.57179069519043, "global_step": 442150, "epoch": 5327} {"train_loss": -26.705718994140625, "global_step": 442151, "epoch": 5327} {"train_loss": -26.922454833984375, "global_step": 442152, "epoch": 5327} {"train_loss": -26.888916015625, "global_step": 442153, "epoch": 5327} {"train_loss": -26.28839683532715, "global_step": 442154, "epoch": 5327} {"train_loss": -26.72808837890625, "global_step": 442155, "epoch": 5327} {"train_loss": -26.700672149658203, "global_step": 442156, "epoch": 5327} {"train_loss": -26.680496215820312, "global_step": 442157, "epoch": 5327} {"train_loss": -27.04339599609375, "global_step": 442158, "epoch": 5327} {"train_loss": -27.597135543823242, "global_step": 442159, "epoch": 5327} {"train_loss": -26.46051025390625, "global_step": 442160, "epoch": 5327} {"train_loss": -27.264951705932617, "global_step": 442161, "epoch": 5327} {"train_loss": -26.84498405456543, "global_step": 442162, "epoch": 5327} {"train_loss": -26.950414657592773, "global_step": 442163, "epoch": 5327} {"train_loss": -26.77473258972168, "global_step": 442164, "epoch": 5327} {"train_loss": -26.962366104125977, "global_step": 442165, "epoch": 5327} {"train_loss": -26.61701011657715, "global_step": 442166, "epoch": 5327} {"train_loss": -26.875873565673828, "global_step": 442167, "epoch": 5327} {"train_loss": -27.182477951049805, "global_step": 442168, "epoch": 5327} {"train_loss": -26.68086814880371, "global_step": 442169, "epoch": 5327} {"train_loss": -26.971006393432617, "global_step": 442170, "epoch": 5327} {"train_loss": -27.37684440612793, "global_step": 442171, "epoch": 5327} {"train_loss": -26.685998916625977, "global_step": 442172, "epoch": 5327} {"train_loss": -27.23137855529785, "global_step": 442173, "epoch": 5327} {"train_loss": -27.438695907592773, "global_step": 442174, "epoch": 5327} {"train_loss": -27.141101837158203, "global_step": 442175, "epoch": 5327} {"train_loss": -27.414609909057617, "global_step": 442176, "epoch": 5327} {"train_loss": -27.329620361328125, "global_step": 442177, "epoch": 5327} {"train_loss": -27.15140724182129, "global_step": 442178, "epoch": 5327} {"train_loss": -27.08314323425293, "global_step": 442179, "epoch": 5327} {"train_loss": -26.885028839111328, "global_step": 442180, "epoch": 5327} {"train_loss": -27.090087890625, "global_step": 442181, "epoch": 5327} {"train_loss": -27.07720947265625, "global_step": 442182, "epoch": 5327} {"train_loss": -27.058149337768555, "global_step": 442183, "epoch": 5327} {"train_loss": -26.972333908081055, "global_step": 442184, "epoch": 5327} {"train_loss": -27.08222770690918, "global_step": 442185, "epoch": 5327} {"train_loss": -27.503726959228516, "global_step": 442186, "epoch": 5327} {"train_loss": -27.088123321533203, "global_step": 442187, "epoch": 5327} {"train_loss": -27.308673858642578, "global_step": 442188, "epoch": 5327} {"train_loss": -27.204090118408203, "global_step": 442189, "epoch": 5327} {"train_loss": -26.873926162719727, "global_step": 442190, "epoch": 5327} {"train_loss": -27.041828155517578, "global_step": 442191, "epoch": 5327} {"train_loss": -27.249235153198242, "global_step": 442192, "epoch": 5327} {"train_loss": -26.891870498657227, "global_step": 442193, "epoch": 5327} {"train_loss": -26.9716796875, "global_step": 442194, "epoch": 5327} {"train_loss": -27.30438804626465, "global_step": 442195, "epoch": 5327} {"train_loss": -27.03623390197754, "global_step": 442196, "epoch": 5327} {"train_loss": -26.81247901916504, "global_step": 442197, "epoch": 5327} {"train_loss": -27.193130493164062, "global_step": 442198, "epoch": 5327} {"train_loss": -26.955963134765625, "global_step": 442199, "epoch": 5327} {"train_loss": -27.189407348632812, "global_step": 442200, "epoch": 5327} {"train_loss": -26.93868064880371, "global_step": 442201, "epoch": 5327} {"train_loss": -26.972156524658203, "global_step": 442202, "epoch": 5327} {"train_loss": -27.0452938079834, "global_step": 442203, "epoch": 5327} {"train_loss": -26.60102653503418, "global_step": 442204, "epoch": 5327} {"train_loss": -27.018756866455078, "global_step": 442205, "epoch": 5327} {"train_loss": -26.77113914489746, "global_step": 442206, "epoch": 5327} {"train_loss": -26.578144073486328, "global_step": 442207, "epoch": 5327} {"train_loss": -26.806745529174805, "global_step": 442208, "epoch": 5327} {"train_loss": -26.5267276763916, "global_step": 442209, "epoch": 5327} {"train_loss": -26.966938018798828, "global_step": 442210, "epoch": 5327} {"train_loss": -26.671552658081055, "global_step": 442211, "epoch": 5327} {"train_loss": -26.78901481628418, "global_step": 442212, "epoch": 5327} {"train_loss": -27.267139434814453, "global_step": 442213, "epoch": 5327} {"train_loss": -26.883136749267578, "global_step": 442214, "epoch": 5327} {"train_loss": -27.164459228515625, "global_step": 442215, "epoch": 5327} {"train_loss": -26.830907821655273, "global_step": 442216, "epoch": 5327} {"train_loss": -26.621973037719727, "global_step": 442217, "epoch": 5327} {"train_loss": -26.2911319732666, "global_step": 442218, "epoch": 5327} {"train_loss": -26.8570556640625, "global_step": 442219, "epoch": 5327} {"train_loss": -26.91022300720215, "global_step": 442220, "epoch": 5327} {"train_loss": -27.091588973999023, "global_step": 442221, "epoch": 5327} {"train_loss": -27.130151748657227, "global_step": 442222, "epoch": 5327} {"train_loss": -26.972452094755976, "global_step": 442223, "epoch": 5327, "val_loss": 6631294.0} {"train_loss": -26.248071670532227, "global_step": 442224, "epoch": 5328} {"train_loss": -26.149490356445312, "global_step": 442225, "epoch": 5328} {"train_loss": -26.220998764038086, "global_step": 442226, "epoch": 5328} {"train_loss": -26.737354278564453, "global_step": 442227, "epoch": 5328} {"train_loss": -26.99550437927246, "global_step": 442228, "epoch": 5328} {"train_loss": -26.622974395751953, "global_step": 442229, "epoch": 5328} {"train_loss": -26.711872100830078, "global_step": 442230, "epoch": 5328} {"train_loss": -26.76607322692871, "global_step": 442231, "epoch": 5328} {"train_loss": -26.848907470703125, "global_step": 442232, "epoch": 5328} {"train_loss": -26.5989990234375, "global_step": 442233, "epoch": 5328} {"train_loss": -26.5060977935791, "global_step": 442234, "epoch": 5328} {"train_loss": -26.757726669311523, "global_step": 442235, "epoch": 5328} {"train_loss": -26.924428939819336, "global_step": 442236, "epoch": 5328} {"train_loss": -26.406957626342773, "global_step": 442237, "epoch": 5328} {"train_loss": -26.25648307800293, "global_step": 442238, "epoch": 5328} {"train_loss": -26.905994415283203, "global_step": 442239, "epoch": 5328} {"train_loss": -26.343976974487305, "global_step": 442240, "epoch": 5328} {"train_loss": -26.289203643798828, "global_step": 442241, "epoch": 5328} {"train_loss": -26.62933349609375, "global_step": 442242, "epoch": 5328} {"train_loss": -26.86077308654785, "global_step": 442243, "epoch": 5328} {"train_loss": -26.155790328979492, "global_step": 442244, "epoch": 5328} {"train_loss": -26.629779815673828, "global_step": 442245, "epoch": 5328} {"train_loss": -26.69095230102539, "global_step": 442246, "epoch": 5328} {"train_loss": -26.76900291442871, "global_step": 442247, "epoch": 5328} {"train_loss": -26.679555892944336, "global_step": 442248, "epoch": 5328} {"train_loss": -26.79390525817871, "global_step": 442249, "epoch": 5328} {"train_loss": -26.5288028717041, "global_step": 442250, "epoch": 5328} {"train_loss": -27.2550106048584, "global_step": 442251, "epoch": 5328} {"train_loss": -26.90093421936035, "global_step": 442252, "epoch": 5328} {"train_loss": -26.8560848236084, "global_step": 442253, "epoch": 5328} {"train_loss": -26.621320724487305, "global_step": 442254, "epoch": 5328} {"train_loss": -26.7344913482666, "global_step": 442255, "epoch": 5328} {"train_loss": -26.784265518188477, "global_step": 442256, "epoch": 5328} {"train_loss": -27.016244888305664, "global_step": 442257, "epoch": 5328} {"train_loss": -26.738006591796875, "global_step": 442258, "epoch": 5328} {"train_loss": -27.167072296142578, "global_step": 442259, "epoch": 5328} {"train_loss": -26.58400535583496, "global_step": 442260, "epoch": 5328} {"train_loss": -26.773279190063477, "global_step": 442261, "epoch": 5328} {"train_loss": -26.889362335205078, "global_step": 442262, "epoch": 5328} {"train_loss": -27.218677520751953, "global_step": 442263, "epoch": 5328} {"train_loss": -27.0664119720459, "global_step": 442264, "epoch": 5328} {"train_loss": -27.0650691986084, "global_step": 442265, "epoch": 5328} {"train_loss": -27.235015869140625, "global_step": 442266, "epoch": 5328} {"train_loss": -26.753116607666016, "global_step": 442267, "epoch": 5328} {"train_loss": -26.936609268188477, "global_step": 442268, "epoch": 5328} {"train_loss": -27.03812599182129, "global_step": 442269, "epoch": 5328} {"train_loss": -27.244338989257812, "global_step": 442270, "epoch": 5328} {"train_loss": -27.243741989135742, "global_step": 442271, "epoch": 5328} {"train_loss": -27.106693267822266, "global_step": 442272, "epoch": 5328} {"train_loss": -26.889667510986328, "global_step": 442273, "epoch": 5328} {"train_loss": -27.163227081298828, "global_step": 442274, "epoch": 5328} {"train_loss": -26.682113647460938, "global_step": 442275, "epoch": 5328} {"train_loss": -26.84857749938965, "global_step": 442276, "epoch": 5328} {"train_loss": -27.44512367248535, "global_step": 442277, "epoch": 5328} {"train_loss": -27.194517135620117, "global_step": 442278, "epoch": 5328} {"train_loss": -27.248550415039062, "global_step": 442279, "epoch": 5328} {"train_loss": -27.577136993408203, "global_step": 442280, "epoch": 5328} {"train_loss": -27.318267822265625, "global_step": 442281, "epoch": 5328} {"train_loss": -27.140094757080078, "global_step": 442282, "epoch": 5328} {"train_loss": -27.476917266845703, "global_step": 442283, "epoch": 5328} {"train_loss": -26.957616806030273, "global_step": 442284, "epoch": 5328} {"train_loss": -27.133474349975586, "global_step": 442285, "epoch": 5328} {"train_loss": -27.04050636291504, "global_step": 442286, "epoch": 5328} {"train_loss": -27.399707794189453, "global_step": 442287, "epoch": 5328} {"train_loss": -27.285093307495117, "global_step": 442288, "epoch": 5328} {"train_loss": -26.91574478149414, "global_step": 442289, "epoch": 5328} {"train_loss": -27.294179916381836, "global_step": 442290, "epoch": 5328} {"train_loss": -27.115711212158203, "global_step": 442291, "epoch": 5328} {"train_loss": -26.94496726989746, "global_step": 442292, "epoch": 5328} {"train_loss": -26.71259117126465, "global_step": 442293, "epoch": 5328} {"train_loss": -26.000198364257812, "global_step": 442294, "epoch": 5328} {"train_loss": -25.66324234008789, "global_step": 442295, "epoch": 5328} {"train_loss": -25.59878921508789, "global_step": 442296, "epoch": 5328} {"train_loss": -26.57855796813965, "global_step": 442297, "epoch": 5328} {"train_loss": -26.464813232421875, "global_step": 442298, "epoch": 5328} {"train_loss": -26.70875358581543, "global_step": 442299, "epoch": 5328} {"train_loss": -26.633710861206055, "global_step": 442300, "epoch": 5328} {"train_loss": -26.781354904174805, "global_step": 442301, "epoch": 5328} {"train_loss": -26.533187866210938, "global_step": 442302, "epoch": 5328} {"train_loss": -26.740453720092773, "global_step": 442303, "epoch": 5328} {"train_loss": -26.6735782623291, "global_step": 442304, "epoch": 5328} {"train_loss": -26.824665069580078, "global_step": 442305, "epoch": 5328} {"train_loss": -26.81532285299646, "global_step": 442306, "epoch": 5328, "val_loss": 6743668.5} {"train_loss": -26.137922286987305, "global_step": 442307, "epoch": 5329} {"train_loss": -26.25083351135254, "global_step": 442308, "epoch": 5329} {"train_loss": -26.12888526916504, "global_step": 442309, "epoch": 5329} {"train_loss": -26.35658073425293, "global_step": 442310, "epoch": 5329} {"train_loss": -26.090280532836914, "global_step": 442311, "epoch": 5329} {"train_loss": -26.637714385986328, "global_step": 442312, "epoch": 5329} {"train_loss": -26.87725257873535, "global_step": 442313, "epoch": 5329} {"train_loss": -26.361886978149414, "global_step": 442314, "epoch": 5329} {"train_loss": -26.261795043945312, "global_step": 442315, "epoch": 5329} {"train_loss": -27.037267684936523, "global_step": 442316, "epoch": 5329} {"train_loss": -26.436063766479492, "global_step": 442317, "epoch": 5329} {"train_loss": -26.59089469909668, "global_step": 442318, "epoch": 5329} {"train_loss": -26.797149658203125, "global_step": 442319, "epoch": 5329} {"train_loss": -26.662275314331055, "global_step": 442320, "epoch": 5329} {"train_loss": -26.839492797851562, "global_step": 442321, "epoch": 5329} {"train_loss": -26.5244140625, "global_step": 442322, "epoch": 5329} {"train_loss": -26.5647029876709, "global_step": 442323, "epoch": 5329} {"train_loss": -26.41318702697754, "global_step": 442324, "epoch": 5329} {"train_loss": -26.4249210357666, "global_step": 442325, "epoch": 5329} {"train_loss": -26.83717155456543, "global_step": 442326, "epoch": 5329} {"train_loss": -26.835004806518555, "global_step": 442327, "epoch": 5329} {"train_loss": -26.675750732421875, "global_step": 442328, "epoch": 5329} {"train_loss": -26.600086212158203, "global_step": 442329, "epoch": 5329} {"train_loss": -26.89753532409668, "global_step": 442330, "epoch": 5329} {"train_loss": -26.451953887939453, "global_step": 442331, "epoch": 5329} {"train_loss": -26.36439323425293, "global_step": 442332, "epoch": 5329} {"train_loss": -26.9228572845459, "global_step": 442333, "epoch": 5329} {"train_loss": -26.534276962280273, "global_step": 442334, "epoch": 5329} {"train_loss": -26.80110740661621, "global_step": 442335, "epoch": 5329} {"train_loss": -26.76077651977539, "global_step": 442336, "epoch": 5329} {"train_loss": -26.862201690673828, "global_step": 442337, "epoch": 5329} {"train_loss": -27.240020751953125, "global_step": 442338, "epoch": 5329} {"train_loss": -27.04408073425293, "global_step": 442339, "epoch": 5329} {"train_loss": -27.038949966430664, "global_step": 442340, "epoch": 5329} {"train_loss": -27.074132919311523, "global_step": 442341, "epoch": 5329} {"train_loss": -27.073667526245117, "global_step": 442342, "epoch": 5329} {"train_loss": -27.198862075805664, "global_step": 442343, "epoch": 5329} {"train_loss": -26.758380889892578, "global_step": 442344, "epoch": 5329} {"train_loss": -27.105316162109375, "global_step": 442345, "epoch": 5329} {"train_loss": -27.02541160583496, "global_step": 442346, "epoch": 5329} {"train_loss": -26.952716827392578, "global_step": 442347, "epoch": 5329} {"train_loss": -26.859893798828125, "global_step": 442348, "epoch": 5329} {"train_loss": -27.304685592651367, "global_step": 442349, "epoch": 5329} {"train_loss": -27.015003204345703, "global_step": 442350, "epoch": 5329} {"train_loss": -26.976911544799805, "global_step": 442351, "epoch": 5329} {"train_loss": -27.179529190063477, "global_step": 442352, "epoch": 5329} {"train_loss": -26.884204864501953, "global_step": 442353, "epoch": 5329} {"train_loss": -26.793399810791016, "global_step": 442354, "epoch": 5329} {"train_loss": -27.3002986907959, "global_step": 442355, "epoch": 5329} {"train_loss": -26.918750762939453, "global_step": 442356, "epoch": 5329} {"train_loss": -27.509225845336914, "global_step": 442357, "epoch": 5329} {"train_loss": -26.93442726135254, "global_step": 442358, "epoch": 5329} {"train_loss": -26.806787490844727, "global_step": 442359, "epoch": 5329} {"train_loss": -26.978315353393555, "global_step": 442360, "epoch": 5329} {"train_loss": -27.210107803344727, "global_step": 442361, "epoch": 5329} {"train_loss": -26.668502807617188, "global_step": 442362, "epoch": 5329} {"train_loss": -26.652185440063477, "global_step": 442363, "epoch": 5329} {"train_loss": -26.86829948425293, "global_step": 442364, "epoch": 5329} {"train_loss": -26.555994033813477, "global_step": 442365, "epoch": 5329} {"train_loss": -27.195453643798828, "global_step": 442366, "epoch": 5329} {"train_loss": -26.694936752319336, "global_step": 442367, "epoch": 5329} {"train_loss": -26.989013671875, "global_step": 442368, "epoch": 5329} {"train_loss": -26.553354263305664, "global_step": 442369, "epoch": 5329} {"train_loss": -26.841171264648438, "global_step": 442370, "epoch": 5329} {"train_loss": -27.074735641479492, "global_step": 442371, "epoch": 5329} {"train_loss": -27.107757568359375, "global_step": 442372, "epoch": 5329} {"train_loss": -26.979536056518555, "global_step": 442373, "epoch": 5329} {"train_loss": -27.067703247070312, "global_step": 442374, "epoch": 5329} {"train_loss": -26.60239601135254, "global_step": 442375, "epoch": 5329} {"train_loss": -27.120819091796875, "global_step": 442376, "epoch": 5329} {"train_loss": -27.48099708557129, "global_step": 442377, "epoch": 5329} {"train_loss": -26.855712890625, "global_step": 442378, "epoch": 5329} {"train_loss": -27.161731719970703, "global_step": 442379, "epoch": 5329} {"train_loss": -26.8598575592041, "global_step": 442380, "epoch": 5329} {"train_loss": -26.77766227722168, "global_step": 442381, "epoch": 5329} {"train_loss": -26.995080947875977, "global_step": 442382, "epoch": 5329} {"train_loss": -27.13910484313965, "global_step": 442383, "epoch": 5329} {"train_loss": -27.457075119018555, "global_step": 442384, "epoch": 5329} {"train_loss": -26.948699951171875, "global_step": 442385, "epoch": 5329} {"train_loss": -27.181686401367188, "global_step": 442386, "epoch": 5329} {"train_loss": -27.160369873046875, "global_step": 442387, "epoch": 5329} {"train_loss": -27.079172134399414, "global_step": 442388, "epoch": 5329} {"train_loss": -26.84847670865346, "global_step": 442389, "epoch": 5329, "val_loss": 6751453.0} {"train_loss": -26.70429801940918, "global_step": 442390, "epoch": 5330} {"train_loss": -26.466053009033203, "global_step": 442391, "epoch": 5330} {"train_loss": -26.7491397857666, "global_step": 442392, "epoch": 5330} {"train_loss": -26.683380126953125, "global_step": 442393, "epoch": 5330} {"train_loss": -26.97808265686035, "global_step": 442394, "epoch": 5330} {"train_loss": -26.8173828125, "global_step": 442395, "epoch": 5330} {"train_loss": -26.97608757019043, "global_step": 442396, "epoch": 5330} {"train_loss": -26.738691329956055, "global_step": 442397, "epoch": 5330} {"train_loss": -26.710205078125, "global_step": 442398, "epoch": 5330} {"train_loss": -26.4743709564209, "global_step": 442399, "epoch": 5330} {"train_loss": -26.891111373901367, "global_step": 442400, "epoch": 5330} {"train_loss": -26.91035270690918, "global_step": 442401, "epoch": 5330} {"train_loss": -27.123132705688477, "global_step": 442402, "epoch": 5330} {"train_loss": -26.9622745513916, "global_step": 442403, "epoch": 5330} {"train_loss": -27.107196807861328, "global_step": 442404, "epoch": 5330} {"train_loss": -26.783239364624023, "global_step": 442405, "epoch": 5330} {"train_loss": -27.229963302612305, "global_step": 442406, "epoch": 5330} {"train_loss": -26.775409698486328, "global_step": 442407, "epoch": 5330} {"train_loss": -26.976648330688477, "global_step": 442408, "epoch": 5330} {"train_loss": -26.941741943359375, "global_step": 442409, "epoch": 5330} {"train_loss": -26.936368942260742, "global_step": 442410, "epoch": 5330} {"train_loss": -27.43250846862793, "global_step": 442411, "epoch": 5330} {"train_loss": -26.99104118347168, "global_step": 442412, "epoch": 5330} {"train_loss": -26.961103439331055, "global_step": 442413, "epoch": 5330} {"train_loss": -26.789112091064453, "global_step": 442414, "epoch": 5330} {"train_loss": -27.009082794189453, "global_step": 442415, "epoch": 5330} {"train_loss": -27.360061645507812, "global_step": 442416, "epoch": 5330} {"train_loss": -27.166494369506836, "global_step": 442417, "epoch": 5330} {"train_loss": -26.889209747314453, "global_step": 442418, "epoch": 5330} {"train_loss": -27.012989044189453, "global_step": 442419, "epoch": 5330} {"train_loss": -27.13189697265625, "global_step": 442420, "epoch": 5330} {"train_loss": -26.74043083190918, "global_step": 442421, "epoch": 5330} {"train_loss": -26.920429229736328, "global_step": 442422, "epoch": 5330} {"train_loss": -26.882156372070312, "global_step": 442423, "epoch": 5330} {"train_loss": -27.338363647460938, "global_step": 442424, "epoch": 5330} {"train_loss": -27.112171173095703, "global_step": 442425, "epoch": 5330} {"train_loss": -27.142292022705078, "global_step": 442426, "epoch": 5330} {"train_loss": -26.480283737182617, "global_step": 442427, "epoch": 5330} {"train_loss": -26.997608184814453, "global_step": 442428, "epoch": 5330} {"train_loss": -26.29400634765625, "global_step": 442429, "epoch": 5330} {"train_loss": -26.534894943237305, "global_step": 442430, "epoch": 5330} {"train_loss": -26.866199493408203, "global_step": 442431, "epoch": 5330} {"train_loss": -27.020788192749023, "global_step": 442432, "epoch": 5330} {"train_loss": -27.114347457885742, "global_step": 442433, "epoch": 5330} {"train_loss": -27.293872833251953, "global_step": 442434, "epoch": 5330} {"train_loss": -26.94302749633789, "global_step": 442435, "epoch": 5330} {"train_loss": -26.88250160217285, "global_step": 442436, "epoch": 5330} {"train_loss": -26.90821647644043, "global_step": 442437, "epoch": 5330} {"train_loss": -26.978870391845703, "global_step": 442438, "epoch": 5330} {"train_loss": -26.808698654174805, "global_step": 442439, "epoch": 5330} {"train_loss": -26.488788604736328, "global_step": 442440, "epoch": 5330} {"train_loss": -26.927417755126953, "global_step": 442441, "epoch": 5330} {"train_loss": -27.009618759155273, "global_step": 442442, "epoch": 5330} {"train_loss": -26.824462890625, "global_step": 442443, "epoch": 5330} {"train_loss": -27.084867477416992, "global_step": 442444, "epoch": 5330} {"train_loss": -27.23093032836914, "global_step": 442445, "epoch": 5330} {"train_loss": -26.574079513549805, "global_step": 442446, "epoch": 5330} {"train_loss": -26.88385581970215, "global_step": 442447, "epoch": 5330} {"train_loss": -27.152185440063477, "global_step": 442448, "epoch": 5330} {"train_loss": -27.20978355407715, "global_step": 442449, "epoch": 5330} {"train_loss": -26.816823959350586, "global_step": 442450, "epoch": 5330} {"train_loss": -27.194456100463867, "global_step": 442451, "epoch": 5330} {"train_loss": -27.14949607849121, "global_step": 442452, "epoch": 5330} {"train_loss": -27.019025802612305, "global_step": 442453, "epoch": 5330} {"train_loss": -26.947301864624023, "global_step": 442454, "epoch": 5330} {"train_loss": -27.270343780517578, "global_step": 442455, "epoch": 5330} {"train_loss": -27.136646270751953, "global_step": 442456, "epoch": 5330} {"train_loss": -26.974863052368164, "global_step": 442457, "epoch": 5330} {"train_loss": -27.025131225585938, "global_step": 442458, "epoch": 5330} {"train_loss": -27.350433349609375, "global_step": 442459, "epoch": 5330} {"train_loss": -27.33802604675293, "global_step": 442460, "epoch": 5330} {"train_loss": -27.395313262939453, "global_step": 442461, "epoch": 5330} {"train_loss": -27.25545310974121, "global_step": 442462, "epoch": 5330} {"train_loss": -26.918180465698242, "global_step": 442463, "epoch": 5330} {"train_loss": -27.3187255859375, "global_step": 442464, "epoch": 5330} {"train_loss": -27.46695899963379, "global_step": 442465, "epoch": 5330} {"train_loss": -27.07289695739746, "global_step": 442466, "epoch": 5330} {"train_loss": -26.954919815063477, "global_step": 442467, "epoch": 5330} {"train_loss": -27.052148818969727, "global_step": 442468, "epoch": 5330} {"train_loss": -27.21734046936035, "global_step": 442469, "epoch": 5330} {"train_loss": -26.7503719329834, "global_step": 442470, "epoch": 5330} {"train_loss": -27.200164794921875, "global_step": 442471, "epoch": 5330} {"train_loss": -26.975074814026613, "global_step": 442472, "epoch": 5330, "val_loss": 6734202.0} {"train_loss": -26.62751579284668, "global_step": 442473, "epoch": 5331} {"train_loss": -25.91803550720215, "global_step": 442474, "epoch": 5331} {"train_loss": -26.703699111938477, "global_step": 442475, "epoch": 5331} {"train_loss": -26.236448287963867, "global_step": 442476, "epoch": 5331} {"train_loss": -25.811609268188477, "global_step": 442477, "epoch": 5331} {"train_loss": -26.396604537963867, "global_step": 442478, "epoch": 5331} {"train_loss": -26.626129150390625, "global_step": 442479, "epoch": 5331} {"train_loss": -25.675973892211914, "global_step": 442480, "epoch": 5331} {"train_loss": -26.44479751586914, "global_step": 442481, "epoch": 5331} {"train_loss": -26.670166015625, "global_step": 442482, "epoch": 5331} {"train_loss": -26.883350372314453, "global_step": 442483, "epoch": 5331} {"train_loss": -27.010343551635742, "global_step": 442484, "epoch": 5331} {"train_loss": -26.566537857055664, "global_step": 442485, "epoch": 5331} {"train_loss": -26.698118209838867, "global_step": 442486, "epoch": 5331} {"train_loss": -26.9267635345459, "global_step": 442487, "epoch": 5331} {"train_loss": -26.658344268798828, "global_step": 442488, "epoch": 5331} {"train_loss": -26.814355850219727, "global_step": 442489, "epoch": 5331} {"train_loss": -26.50556755065918, "global_step": 442490, "epoch": 5331} {"train_loss": -27.0640869140625, "global_step": 442491, "epoch": 5331} {"train_loss": -26.853078842163086, "global_step": 442492, "epoch": 5331} {"train_loss": -26.832977294921875, "global_step": 442493, "epoch": 5331} {"train_loss": -26.512067794799805, "global_step": 442494, "epoch": 5331} {"train_loss": -26.8720703125, "global_step": 442495, "epoch": 5331} {"train_loss": -26.947986602783203, "global_step": 442496, "epoch": 5331} {"train_loss": -27.2280216217041, "global_step": 442497, "epoch": 5331} {"train_loss": -27.009191513061523, "global_step": 442498, "epoch": 5331} {"train_loss": -27.040136337280273, "global_step": 442499, "epoch": 5331} {"train_loss": -26.725431442260742, "global_step": 442500, "epoch": 5331} {"train_loss": -26.612628936767578, "global_step": 442501, "epoch": 5331} {"train_loss": -26.6644229888916, "global_step": 442502, "epoch": 5331} {"train_loss": -27.2170352935791, "global_step": 442503, "epoch": 5331} {"train_loss": -27.162338256835938, "global_step": 442504, "epoch": 5331} {"train_loss": -26.645252227783203, "global_step": 442505, "epoch": 5331} {"train_loss": -26.673986434936523, "global_step": 442506, "epoch": 5331} {"train_loss": -27.01637840270996, "global_step": 442507, "epoch": 5331} {"train_loss": -27.34272575378418, "global_step": 442508, "epoch": 5331} {"train_loss": -26.962799072265625, "global_step": 442509, "epoch": 5331} {"train_loss": -26.948627471923828, "global_step": 442510, "epoch": 5331} {"train_loss": -27.163471221923828, "global_step": 442511, "epoch": 5331} {"train_loss": -26.974393844604492, "global_step": 442512, "epoch": 5331} {"train_loss": -27.45179557800293, "global_step": 442513, "epoch": 5331} {"train_loss": -27.1276798248291, "global_step": 442514, "epoch": 5331} {"train_loss": -27.145063400268555, "global_step": 442515, "epoch": 5331} {"train_loss": -27.199462890625, "global_step": 442516, "epoch": 5331} {"train_loss": -27.08740234375, "global_step": 442517, "epoch": 5331} {"train_loss": -26.791706085205078, "global_step": 442518, "epoch": 5331} {"train_loss": -27.007705688476562, "global_step": 442519, "epoch": 5331} {"train_loss": -27.033323287963867, "global_step": 442520, "epoch": 5331} {"train_loss": -27.449918746948242, "global_step": 442521, "epoch": 5331} {"train_loss": -27.337646484375, "global_step": 442522, "epoch": 5331} {"train_loss": -27.244415283203125, "global_step": 442523, "epoch": 5331} {"train_loss": -27.33051109313965, "global_step": 442524, "epoch": 5331} {"train_loss": -27.22761344909668, "global_step": 442525, "epoch": 5331} {"train_loss": -27.323810577392578, "global_step": 442526, "epoch": 5331} {"train_loss": -26.963537216186523, "global_step": 442527, "epoch": 5331} {"train_loss": -26.837799072265625, "global_step": 442528, "epoch": 5331} {"train_loss": -26.882659912109375, "global_step": 442529, "epoch": 5331} {"train_loss": -27.098865509033203, "global_step": 442530, "epoch": 5331} {"train_loss": -27.004261016845703, "global_step": 442531, "epoch": 5331} {"train_loss": -27.653791427612305, "global_step": 442532, "epoch": 5331} {"train_loss": -26.98882484436035, "global_step": 442533, "epoch": 5331} {"train_loss": -26.810089111328125, "global_step": 442534, "epoch": 5331} {"train_loss": -26.896421432495117, "global_step": 442535, "epoch": 5331} {"train_loss": -27.075712203979492, "global_step": 442536, "epoch": 5331} {"train_loss": -26.785785675048828, "global_step": 442537, "epoch": 5331} {"train_loss": -26.92255210876465, "global_step": 442538, "epoch": 5331} {"train_loss": -26.541278839111328, "global_step": 442539, "epoch": 5331} {"train_loss": -26.733779907226562, "global_step": 442540, "epoch": 5331} {"train_loss": -26.132932662963867, "global_step": 442541, "epoch": 5331} {"train_loss": -26.6026668548584, "global_step": 442542, "epoch": 5331} {"train_loss": -27.07183837890625, "global_step": 442543, "epoch": 5331} {"train_loss": -26.926599502563477, "global_step": 442544, "epoch": 5331} {"train_loss": -26.433401107788086, "global_step": 442545, "epoch": 5331} {"train_loss": -26.9890193939209, "global_step": 442546, "epoch": 5331} {"train_loss": -26.843902587890625, "global_step": 442547, "epoch": 5331} {"train_loss": -26.41619300842285, "global_step": 442548, "epoch": 5331} {"train_loss": -26.588647842407227, "global_step": 442549, "epoch": 5331} {"train_loss": -26.725234985351562, "global_step": 442550, "epoch": 5331} {"train_loss": -27.029443740844727, "global_step": 442551, "epoch": 5331} {"train_loss": -26.985458374023438, "global_step": 442552, "epoch": 5331} {"train_loss": -26.842817306518555, "global_step": 442553, "epoch": 5331} {"train_loss": -27.231435775756836, "global_step": 442554, "epoch": 5331} {"train_loss": -26.844345184693854, "global_step": 442555, "epoch": 5331, "val_loss": 6626142.0} {"train_loss": -26.54764747619629, "global_step": 442556, "epoch": 5332} {"train_loss": -26.62276268005371, "global_step": 442557, "epoch": 5332} {"train_loss": -26.61429786682129, "global_step": 442558, "epoch": 5332} {"train_loss": -26.354394912719727, "global_step": 442559, "epoch": 5332} {"train_loss": -26.88358497619629, "global_step": 442560, "epoch": 5332} {"train_loss": -26.21240234375, "global_step": 442561, "epoch": 5332} {"train_loss": -26.49483299255371, "global_step": 442562, "epoch": 5332} {"train_loss": -26.718433380126953, "global_step": 442563, "epoch": 5332} {"train_loss": -27.05805015563965, "global_step": 442564, "epoch": 5332} {"train_loss": -26.46187400817871, "global_step": 442565, "epoch": 5332} {"train_loss": -26.876916885375977, "global_step": 442566, "epoch": 5332} {"train_loss": -26.830585479736328, "global_step": 442567, "epoch": 5332} {"train_loss": -26.74997329711914, "global_step": 442568, "epoch": 5332} {"train_loss": -26.727127075195312, "global_step": 442569, "epoch": 5332} {"train_loss": -26.67352294921875, "global_step": 442570, "epoch": 5332} {"train_loss": -26.819259643554688, "global_step": 442571, "epoch": 5332} {"train_loss": -26.900739669799805, "global_step": 442572, "epoch": 5332} {"train_loss": -27.06080436706543, "global_step": 442573, "epoch": 5332} {"train_loss": -27.365619659423828, "global_step": 442574, "epoch": 5332} {"train_loss": -26.99728775024414, "global_step": 442575, "epoch": 5332} {"train_loss": -27.016218185424805, "global_step": 442576, "epoch": 5332} {"train_loss": -26.8272762298584, "global_step": 442577, "epoch": 5332} {"train_loss": -26.78839683532715, "global_step": 442578, "epoch": 5332} {"train_loss": -26.728485107421875, "global_step": 442579, "epoch": 5332} {"train_loss": -26.486743927001953, "global_step": 442580, "epoch": 5332} {"train_loss": -26.896289825439453, "global_step": 442581, "epoch": 5332} {"train_loss": -26.621139526367188, "global_step": 442582, "epoch": 5332} {"train_loss": -26.65907096862793, "global_step": 442583, "epoch": 5332} {"train_loss": -26.82343864440918, "global_step": 442584, "epoch": 5332} {"train_loss": -26.8034725189209, "global_step": 442585, "epoch": 5332} {"train_loss": -26.573637008666992, "global_step": 442586, "epoch": 5332} {"train_loss": -26.307422637939453, "global_step": 442587, "epoch": 5332} {"train_loss": -26.946685791015625, "global_step": 442588, "epoch": 5332} {"train_loss": -26.742612838745117, "global_step": 442589, "epoch": 5332} {"train_loss": -26.969837188720703, "global_step": 442590, "epoch": 5332} {"train_loss": -27.124998092651367, "global_step": 442591, "epoch": 5332} {"train_loss": -26.661731719970703, "global_step": 442592, "epoch": 5332} {"train_loss": -26.55860710144043, "global_step": 442593, "epoch": 5332} {"train_loss": -26.711191177368164, "global_step": 442594, "epoch": 5332} {"train_loss": -26.7259464263916, "global_step": 442595, "epoch": 5332} {"train_loss": -26.806304931640625, "global_step": 442596, "epoch": 5332} {"train_loss": -27.00086784362793, "global_step": 442597, "epoch": 5332} {"train_loss": -27.229101181030273, "global_step": 442598, "epoch": 5332} {"train_loss": -27.444355010986328, "global_step": 442599, "epoch": 5332} {"train_loss": -26.635608673095703, "global_step": 442600, "epoch": 5332} {"train_loss": -26.717670440673828, "global_step": 442601, "epoch": 5332} {"train_loss": -27.150793075561523, "global_step": 442602, "epoch": 5332} {"train_loss": -26.721832275390625, "global_step": 442603, "epoch": 5332} {"train_loss": -26.952566146850586, "global_step": 442604, "epoch": 5332} {"train_loss": -26.910459518432617, "global_step": 442605, "epoch": 5332} {"train_loss": -26.65656089782715, "global_step": 442606, "epoch": 5332} {"train_loss": -26.998493194580078, "global_step": 442607, "epoch": 5332} {"train_loss": -26.85066032409668, "global_step": 442608, "epoch": 5332} {"train_loss": -27.2761287689209, "global_step": 442609, "epoch": 5332} {"train_loss": -27.1892147064209, "global_step": 442610, "epoch": 5332} {"train_loss": -27.250823974609375, "global_step": 442611, "epoch": 5332} {"train_loss": -26.966083526611328, "global_step": 442612, "epoch": 5332} {"train_loss": -27.188562393188477, "global_step": 442613, "epoch": 5332} {"train_loss": -27.278501510620117, "global_step": 442614, "epoch": 5332} {"train_loss": -26.975248336791992, "global_step": 442615, "epoch": 5332} {"train_loss": -27.484384536743164, "global_step": 442616, "epoch": 5332} {"train_loss": -26.932159423828125, "global_step": 442617, "epoch": 5332} {"train_loss": -26.799219131469727, "global_step": 442618, "epoch": 5332} {"train_loss": -27.320093154907227, "global_step": 442619, "epoch": 5332} {"train_loss": -26.953596115112305, "global_step": 442620, "epoch": 5332} {"train_loss": -27.0320987701416, "global_step": 442621, "epoch": 5332} {"train_loss": -27.108539581298828, "global_step": 442622, "epoch": 5332} {"train_loss": -27.245468139648438, "global_step": 442623, "epoch": 5332} {"train_loss": -26.923181533813477, "global_step": 442624, "epoch": 5332} {"train_loss": -27.10101318359375, "global_step": 442625, "epoch": 5332} {"train_loss": -27.132110595703125, "global_step": 442626, "epoch": 5332} {"train_loss": -27.28814125061035, "global_step": 442627, "epoch": 5332} {"train_loss": -27.021469116210938, "global_step": 442628, "epoch": 5332} {"train_loss": -26.7314395904541, "global_step": 442629, "epoch": 5332} {"train_loss": -27.133996963500977, "global_step": 442630, "epoch": 5332} {"train_loss": -26.748193740844727, "global_step": 442631, "epoch": 5332} {"train_loss": -27.091022491455078, "global_step": 442632, "epoch": 5332} {"train_loss": -27.125585556030273, "global_step": 442633, "epoch": 5332} {"train_loss": -27.353534698486328, "global_step": 442634, "epoch": 5332} {"train_loss": -27.12225341796875, "global_step": 442635, "epoch": 5332} {"train_loss": -27.239124298095703, "global_step": 442636, "epoch": 5332} {"train_loss": -26.79143714904785, "global_step": 442637, "epoch": 5332} {"train_loss": -26.90651797099286, "global_step": 442638, "epoch": 5332, "val_loss": 6681248.0} {"train_loss": -26.31061363220215, "global_step": 442639, "epoch": 5333} {"train_loss": -24.68312644958496, "global_step": 442640, "epoch": 5333} {"train_loss": -24.39320945739746, "global_step": 442641, "epoch": 5333} {"train_loss": -24.456802368164062, "global_step": 442642, "epoch": 5333} {"train_loss": -26.209003448486328, "global_step": 442643, "epoch": 5333} {"train_loss": -25.84836196899414, "global_step": 442644, "epoch": 5333} {"train_loss": -25.606637954711914, "global_step": 442645, "epoch": 5333} {"train_loss": -25.700239181518555, "global_step": 442646, "epoch": 5333} {"train_loss": -25.66337013244629, "global_step": 442647, "epoch": 5333} {"train_loss": -25.66001319885254, "global_step": 442648, "epoch": 5333} {"train_loss": -26.354333877563477, "global_step": 442649, "epoch": 5333} {"train_loss": -25.964807510375977, "global_step": 442650, "epoch": 5333} {"train_loss": -26.200702667236328, "global_step": 442651, "epoch": 5333} {"train_loss": -26.321197509765625, "global_step": 442652, "epoch": 5333} {"train_loss": -26.268163681030273, "global_step": 442653, "epoch": 5333} {"train_loss": -26.5574951171875, "global_step": 442654, "epoch": 5333} {"train_loss": -26.562253952026367, "global_step": 442655, "epoch": 5333} {"train_loss": -26.41692543029785, "global_step": 442656, "epoch": 5333} {"train_loss": -26.222925186157227, "global_step": 442657, "epoch": 5333} {"train_loss": -26.815073013305664, "global_step": 442658, "epoch": 5333} {"train_loss": -26.31770896911621, "global_step": 442659, "epoch": 5333} {"train_loss": -26.892322540283203, "global_step": 442660, "epoch": 5333} {"train_loss": -26.461063385009766, "global_step": 442661, "epoch": 5333} {"train_loss": -26.474767684936523, "global_step": 442662, "epoch": 5333} {"train_loss": -27.00819206237793, "global_step": 442663, "epoch": 5333} {"train_loss": -26.620807647705078, "global_step": 442664, "epoch": 5333} {"train_loss": -26.724445343017578, "global_step": 442665, "epoch": 5333} {"train_loss": -26.50031089782715, "global_step": 442666, "epoch": 5333} {"train_loss": -26.447675704956055, "global_step": 442667, "epoch": 5333} {"train_loss": -26.573150634765625, "global_step": 442668, "epoch": 5333} {"train_loss": -26.67227554321289, "global_step": 442669, "epoch": 5333} {"train_loss": -26.637405395507812, "global_step": 442670, "epoch": 5333} {"train_loss": -26.523969650268555, "global_step": 442671, "epoch": 5333} {"train_loss": -26.857763290405273, "global_step": 442672, "epoch": 5333} {"train_loss": -27.23833656311035, "global_step": 442673, "epoch": 5333} {"train_loss": -26.613351821899414, "global_step": 442674, "epoch": 5333} {"train_loss": -27.073266983032227, "global_step": 442675, "epoch": 5333} {"train_loss": -26.779882431030273, "global_step": 442676, "epoch": 5333} {"train_loss": -26.953678131103516, "global_step": 442677, "epoch": 5333} {"train_loss": -26.972639083862305, "global_step": 442678, "epoch": 5333} {"train_loss": -27.083669662475586, "global_step": 442679, "epoch": 5333} {"train_loss": -26.8771915435791, "global_step": 442680, "epoch": 5333} {"train_loss": -26.994983673095703, "global_step": 442681, "epoch": 5333} {"train_loss": -26.983108520507812, "global_step": 442682, "epoch": 5333} {"train_loss": -26.98371696472168, "global_step": 442683, "epoch": 5333} {"train_loss": -27.1536808013916, "global_step": 442684, "epoch": 5333} {"train_loss": -27.027984619140625, "global_step": 442685, "epoch": 5333} {"train_loss": -26.20426368713379, "global_step": 442686, "epoch": 5333} {"train_loss": -26.792804718017578, "global_step": 442687, "epoch": 5333} {"train_loss": -27.181543350219727, "global_step": 442688, "epoch": 5333} {"train_loss": -27.043060302734375, "global_step": 442689, "epoch": 5333} {"train_loss": -26.94549560546875, "global_step": 442690, "epoch": 5333} {"train_loss": -27.479578018188477, "global_step": 442691, "epoch": 5333} {"train_loss": -27.17862892150879, "global_step": 442692, "epoch": 5333} {"train_loss": -26.923730850219727, "global_step": 442693, "epoch": 5333} {"train_loss": -26.976560592651367, "global_step": 442694, "epoch": 5333} {"train_loss": -27.269001007080078, "global_step": 442695, "epoch": 5333} {"train_loss": -27.043807983398438, "global_step": 442696, "epoch": 5333} {"train_loss": -27.086145401000977, "global_step": 442697, "epoch": 5333} {"train_loss": -27.42708396911621, "global_step": 442698, "epoch": 5333} {"train_loss": -27.24599266052246, "global_step": 442699, "epoch": 5333} {"train_loss": -27.29656982421875, "global_step": 442700, "epoch": 5333} {"train_loss": -27.260486602783203, "global_step": 442701, "epoch": 5333} {"train_loss": -26.995508193969727, "global_step": 442702, "epoch": 5333} {"train_loss": -26.47035789489746, "global_step": 442703, "epoch": 5333} {"train_loss": -27.302549362182617, "global_step": 442704, "epoch": 5333} {"train_loss": -27.371545791625977, "global_step": 442705, "epoch": 5333} {"train_loss": -27.094970703125, "global_step": 442706, "epoch": 5333} {"train_loss": -26.998992919921875, "global_step": 442707, "epoch": 5333} {"train_loss": -27.10791015625, "global_step": 442708, "epoch": 5333} {"train_loss": -26.856220245361328, "global_step": 442709, "epoch": 5333} {"train_loss": -27.261621475219727, "global_step": 442710, "epoch": 5333} {"train_loss": -27.15817642211914, "global_step": 442711, "epoch": 5333} {"train_loss": -27.597131729125977, "global_step": 442712, "epoch": 5333} {"train_loss": -26.790719985961914, "global_step": 442713, "epoch": 5333} {"train_loss": -27.05915641784668, "global_step": 442714, "epoch": 5333} {"train_loss": -26.87129020690918, "global_step": 442715, "epoch": 5333} {"train_loss": -27.488256454467773, "global_step": 442716, "epoch": 5333} {"train_loss": -26.940229415893555, "global_step": 442717, "epoch": 5333} {"train_loss": -26.8045711517334, "global_step": 442718, "epoch": 5333} {"train_loss": -26.987531661987305, "global_step": 442719, "epoch": 5333} {"train_loss": -27.1650333404541, "global_step": 442720, "epoch": 5333} {"train_loss": -26.714688473437207, "global_step": 442721, "epoch": 5333, "val_loss": 6691012.0} {"train_loss": -26.383771896362305, "global_step": 442722, "epoch": 5334} {"train_loss": -26.542997360229492, "global_step": 442723, "epoch": 5334} {"train_loss": -26.873437881469727, "global_step": 442724, "epoch": 5334} {"train_loss": -26.511001586914062, "global_step": 442725, "epoch": 5334} {"train_loss": -26.63935661315918, "global_step": 442726, "epoch": 5334} {"train_loss": -26.763504028320312, "global_step": 442727, "epoch": 5334} {"train_loss": -26.83735466003418, "global_step": 442728, "epoch": 5334} {"train_loss": -26.891555786132812, "global_step": 442729, "epoch": 5334} {"train_loss": -26.604970932006836, "global_step": 442730, "epoch": 5334} {"train_loss": -26.436920166015625, "global_step": 442731, "epoch": 5334} {"train_loss": -26.038421630859375, "global_step": 442732, "epoch": 5334} {"train_loss": -26.850494384765625, "global_step": 442733, "epoch": 5334} {"train_loss": -26.602323532104492, "global_step": 442734, "epoch": 5334} {"train_loss": -26.894287109375, "global_step": 442735, "epoch": 5334} {"train_loss": -26.953699111938477, "global_step": 442736, "epoch": 5334} {"train_loss": -26.692035675048828, "global_step": 442737, "epoch": 5334} {"train_loss": -26.95330810546875, "global_step": 442738, "epoch": 5334} {"train_loss": -26.741113662719727, "global_step": 442739, "epoch": 5334} {"train_loss": -27.074460983276367, "global_step": 442740, "epoch": 5334} {"train_loss": -26.80755043029785, "global_step": 442741, "epoch": 5334} {"train_loss": -26.759765625, "global_step": 442742, "epoch": 5334} {"train_loss": -26.6558837890625, "global_step": 442743, "epoch": 5334} {"train_loss": -27.2393798828125, "global_step": 442744, "epoch": 5334} {"train_loss": -27.17255210876465, "global_step": 442745, "epoch": 5334} {"train_loss": -27.033483505249023, "global_step": 442746, "epoch": 5334} {"train_loss": -26.707748413085938, "global_step": 442747, "epoch": 5334} {"train_loss": -26.923419952392578, "global_step": 442748, "epoch": 5334} {"train_loss": -26.889480590820312, "global_step": 442749, "epoch": 5334} {"train_loss": -26.92388916015625, "global_step": 442750, "epoch": 5334} {"train_loss": -26.422269821166992, "global_step": 442751, "epoch": 5334} {"train_loss": -26.808019638061523, "global_step": 442752, "epoch": 5334} {"train_loss": -27.381555557250977, "global_step": 442753, "epoch": 5334} {"train_loss": -26.866788864135742, "global_step": 442754, "epoch": 5334} {"train_loss": -26.816272735595703, "global_step": 442755, "epoch": 5334} {"train_loss": -27.148944854736328, "global_step": 442756, "epoch": 5334} {"train_loss": -27.2273006439209, "global_step": 442757, "epoch": 5334} {"train_loss": -26.42974853515625, "global_step": 442758, "epoch": 5334} {"train_loss": -26.803451538085938, "global_step": 442759, "epoch": 5334} {"train_loss": -26.755910873413086, "global_step": 442760, "epoch": 5334} {"train_loss": -26.893756866455078, "global_step": 442761, "epoch": 5334} {"train_loss": -27.065099716186523, "global_step": 442762, "epoch": 5334} {"train_loss": -27.080429077148438, "global_step": 442763, "epoch": 5334} {"train_loss": -27.307172775268555, "global_step": 442764, "epoch": 5334} {"train_loss": -27.185535430908203, "global_step": 442765, "epoch": 5334} {"train_loss": -26.986791610717773, "global_step": 442766, "epoch": 5334} {"train_loss": -26.948089599609375, "global_step": 442767, "epoch": 5334} {"train_loss": -26.97541618347168, "global_step": 442768, "epoch": 5334} {"train_loss": -27.432065963745117, "global_step": 442769, "epoch": 5334} {"train_loss": -27.2336483001709, "global_step": 442770, "epoch": 5334} {"train_loss": -27.415491104125977, "global_step": 442771, "epoch": 5334} {"train_loss": -27.099212646484375, "global_step": 442772, "epoch": 5334} {"train_loss": -27.04334831237793, "global_step": 442773, "epoch": 5334} {"train_loss": -27.441904067993164, "global_step": 442774, "epoch": 5334} {"train_loss": -27.045318603515625, "global_step": 442775, "epoch": 5334} {"train_loss": -27.19183349609375, "global_step": 442776, "epoch": 5334} {"train_loss": -26.959213256835938, "global_step": 442777, "epoch": 5334} {"train_loss": -27.206912994384766, "global_step": 442778, "epoch": 5334} {"train_loss": -27.14234733581543, "global_step": 442779, "epoch": 5334} {"train_loss": -26.930572509765625, "global_step": 442780, "epoch": 5334} {"train_loss": -27.152225494384766, "global_step": 442781, "epoch": 5334} {"train_loss": -27.096435546875, "global_step": 442782, "epoch": 5334} {"train_loss": -27.3031005859375, "global_step": 442783, "epoch": 5334} {"train_loss": -26.974435806274414, "global_step": 442784, "epoch": 5334} {"train_loss": -26.990137100219727, "global_step": 442785, "epoch": 5334} {"train_loss": -26.789325714111328, "global_step": 442786, "epoch": 5334} {"train_loss": -26.690649032592773, "global_step": 442787, "epoch": 5334} {"train_loss": -27.036169052124023, "global_step": 442788, "epoch": 5334} {"train_loss": -26.843740463256836, "global_step": 442789, "epoch": 5334} {"train_loss": -26.645414352416992, "global_step": 442790, "epoch": 5334} {"train_loss": -26.39776611328125, "global_step": 442791, "epoch": 5334} {"train_loss": -26.79554557800293, "global_step": 442792, "epoch": 5334} {"train_loss": -26.696563720703125, "global_step": 442793, "epoch": 5334} {"train_loss": -26.954931259155273, "global_step": 442794, "epoch": 5334} {"train_loss": -26.96143913269043, "global_step": 442795, "epoch": 5334} {"train_loss": -27.160253524780273, "global_step": 442796, "epoch": 5334} {"train_loss": -26.912097930908203, "global_step": 442797, "epoch": 5334} {"train_loss": -27.1810302734375, "global_step": 442798, "epoch": 5334} {"train_loss": -26.95432472229004, "global_step": 442799, "epoch": 5334} {"train_loss": -26.87127685546875, "global_step": 442800, "epoch": 5334} {"train_loss": -27.010908126831055, "global_step": 442801, "epoch": 5334} {"train_loss": -27.20585060119629, "global_step": 442802, "epoch": 5334} {"train_loss": -26.989044189453125, "global_step": 442803, "epoch": 5334} {"train_loss": -26.920269265232317, "global_step": 442804, "epoch": 5334, "val_loss": 6723265.0} {"train_loss": -26.305957794189453, "global_step": 442805, "epoch": 5335} {"train_loss": -25.5133113861084, "global_step": 442806, "epoch": 5335} {"train_loss": -25.707965850830078, "global_step": 442807, "epoch": 5335} {"train_loss": -25.863433837890625, "global_step": 442808, "epoch": 5335} {"train_loss": -25.957319259643555, "global_step": 442809, "epoch": 5335} {"train_loss": -26.28767204284668, "global_step": 442810, "epoch": 5335} {"train_loss": -26.34979248046875, "global_step": 442811, "epoch": 5335} {"train_loss": -26.275339126586914, "global_step": 442812, "epoch": 5335} {"train_loss": -26.978174209594727, "global_step": 442813, "epoch": 5335} {"train_loss": -26.519947052001953, "global_step": 442814, "epoch": 5335} {"train_loss": -26.512338638305664, "global_step": 442815, "epoch": 5335} {"train_loss": -26.460241317749023, "global_step": 442816, "epoch": 5335} {"train_loss": -26.77150535583496, "global_step": 442817, "epoch": 5335} {"train_loss": -26.41523551940918, "global_step": 442818, "epoch": 5335} {"train_loss": -26.86429786682129, "global_step": 442819, "epoch": 5335} {"train_loss": -26.891326904296875, "global_step": 442820, "epoch": 5335} {"train_loss": -26.818893432617188, "global_step": 442821, "epoch": 5335} {"train_loss": -26.82892417907715, "global_step": 442822, "epoch": 5335} {"train_loss": -26.650043487548828, "global_step": 442823, "epoch": 5335} {"train_loss": -26.874420166015625, "global_step": 442824, "epoch": 5335} {"train_loss": -26.606048583984375, "global_step": 442825, "epoch": 5335} {"train_loss": -26.593917846679688, "global_step": 442826, "epoch": 5335} {"train_loss": -26.642248153686523, "global_step": 442827, "epoch": 5335} {"train_loss": -26.627893447875977, "global_step": 442828, "epoch": 5335} {"train_loss": -27.123523712158203, "global_step": 442829, "epoch": 5335} {"train_loss": -26.86177635192871, "global_step": 442830, "epoch": 5335} {"train_loss": -26.837976455688477, "global_step": 442831, "epoch": 5335} {"train_loss": -27.21503257751465, "global_step": 442832, "epoch": 5335} {"train_loss": -26.97504997253418, "global_step": 442833, "epoch": 5335} {"train_loss": -26.882949829101562, "global_step": 442834, "epoch": 5335} {"train_loss": -26.810556411743164, "global_step": 442835, "epoch": 5335} {"train_loss": -27.0839786529541, "global_step": 442836, "epoch": 5335} {"train_loss": -27.0141658782959, "global_step": 442837, "epoch": 5335} {"train_loss": -26.8704833984375, "global_step": 442838, "epoch": 5335} {"train_loss": -26.465057373046875, "global_step": 442839, "epoch": 5335} {"train_loss": -26.943344116210938, "global_step": 442840, "epoch": 5335} {"train_loss": -26.650882720947266, "global_step": 442841, "epoch": 5335} {"train_loss": -27.098007202148438, "global_step": 442842, "epoch": 5335} {"train_loss": -27.117429733276367, "global_step": 442843, "epoch": 5335} {"train_loss": -27.21540641784668, "global_step": 442844, "epoch": 5335} {"train_loss": -27.01386833190918, "global_step": 442845, "epoch": 5335} {"train_loss": -27.352697372436523, "global_step": 442846, "epoch": 5335} {"train_loss": -27.609567642211914, "global_step": 442847, "epoch": 5335} {"train_loss": -26.8205623626709, "global_step": 442848, "epoch": 5335} {"train_loss": -27.05329704284668, "global_step": 442849, "epoch": 5335} {"train_loss": -26.878957748413086, "global_step": 442850, "epoch": 5335} {"train_loss": -26.941455841064453, "global_step": 442851, "epoch": 5335} {"train_loss": -27.15268898010254, "global_step": 442852, "epoch": 5335} {"train_loss": -27.31768226623535, "global_step": 442853, "epoch": 5335} {"train_loss": -27.16290283203125, "global_step": 442854, "epoch": 5335} {"train_loss": -27.060171127319336, "global_step": 442855, "epoch": 5335} {"train_loss": -26.81867790222168, "global_step": 442856, "epoch": 5335} {"train_loss": -27.18275260925293, "global_step": 442857, "epoch": 5335} {"train_loss": -27.30731201171875, "global_step": 442858, "epoch": 5335} {"train_loss": -27.46232032775879, "global_step": 442859, "epoch": 5335} {"train_loss": -27.153425216674805, "global_step": 442860, "epoch": 5335} {"train_loss": -27.226415634155273, "global_step": 442861, "epoch": 5335} {"train_loss": -27.245019912719727, "global_step": 442862, "epoch": 5335} {"train_loss": -27.28435707092285, "global_step": 442863, "epoch": 5335} {"train_loss": -27.139814376831055, "global_step": 442864, "epoch": 5335} {"train_loss": -26.987218856811523, "global_step": 442865, "epoch": 5335} {"train_loss": -27.260419845581055, "global_step": 442866, "epoch": 5335} {"train_loss": -27.00442886352539, "global_step": 442867, "epoch": 5335} {"train_loss": -26.732919692993164, "global_step": 442868, "epoch": 5335} {"train_loss": -26.93368911743164, "global_step": 442869, "epoch": 5335} {"train_loss": -27.195026397705078, "global_step": 442870, "epoch": 5335} {"train_loss": -27.41717529296875, "global_step": 442871, "epoch": 5335} {"train_loss": -27.2086181640625, "global_step": 442872, "epoch": 5335} {"train_loss": -27.20157241821289, "global_step": 442873, "epoch": 5335} {"train_loss": -26.709766387939453, "global_step": 442874, "epoch": 5335} {"train_loss": -26.895233154296875, "global_step": 442875, "epoch": 5335} {"train_loss": -27.24410057067871, "global_step": 442876, "epoch": 5335} {"train_loss": -27.280471801757812, "global_step": 442877, "epoch": 5335} {"train_loss": -27.062833786010742, "global_step": 442878, "epoch": 5335} {"train_loss": -27.03639030456543, "global_step": 442879, "epoch": 5335} {"train_loss": -26.7576904296875, "global_step": 442880, "epoch": 5335} {"train_loss": -26.92157554626465, "global_step": 442881, "epoch": 5335} {"train_loss": -26.853185653686523, "global_step": 442882, "epoch": 5335} {"train_loss": -26.605253219604492, "global_step": 442883, "epoch": 5335} {"train_loss": -26.698766708374023, "global_step": 442884, "epoch": 5335} {"train_loss": -27.360952377319336, "global_step": 442885, "epoch": 5335} {"train_loss": -26.9814510345459, "global_step": 442886, "epoch": 5335} {"train_loss": -26.88849341151226, "global_step": 442887, "epoch": 5335, "val_loss": 6663182.0} {"train_loss": -26.62111473083496, "global_step": 442888, "epoch": 5336} {"train_loss": -27.007064819335938, "global_step": 442889, "epoch": 5336} {"train_loss": -25.984359741210938, "global_step": 442890, "epoch": 5336} {"train_loss": -26.3277587890625, "global_step": 442891, "epoch": 5336} {"train_loss": -26.48013687133789, "global_step": 442892, "epoch": 5336} {"train_loss": -27.09128761291504, "global_step": 442893, "epoch": 5336} {"train_loss": -26.672231674194336, "global_step": 442894, "epoch": 5336} {"train_loss": -26.226526260375977, "global_step": 442895, "epoch": 5336} {"train_loss": -26.516260147094727, "global_step": 442896, "epoch": 5336} {"train_loss": -27.11810302734375, "global_step": 442897, "epoch": 5336} {"train_loss": -26.30536460876465, "global_step": 442898, "epoch": 5336} {"train_loss": -26.554540634155273, "global_step": 442899, "epoch": 5336} {"train_loss": -26.8587589263916, "global_step": 442900, "epoch": 5336} {"train_loss": -26.83497428894043, "global_step": 442901, "epoch": 5336} {"train_loss": -26.62042808532715, "global_step": 442902, "epoch": 5336} {"train_loss": -26.837574005126953, "global_step": 442903, "epoch": 5336} {"train_loss": -26.68408203125, "global_step": 442904, "epoch": 5336} {"train_loss": -26.64497184753418, "global_step": 442905, "epoch": 5336} {"train_loss": -26.460834503173828, "global_step": 442906, "epoch": 5336} {"train_loss": -26.992101669311523, "global_step": 442907, "epoch": 5336} {"train_loss": -26.3528995513916, "global_step": 442908, "epoch": 5336} {"train_loss": -27.044818878173828, "global_step": 442909, "epoch": 5336} {"train_loss": -26.6445255279541, "global_step": 442910, "epoch": 5336} {"train_loss": -26.958471298217773, "global_step": 442911, "epoch": 5336} {"train_loss": -27.20582389831543, "global_step": 442912, "epoch": 5336} {"train_loss": -26.882770538330078, "global_step": 442913, "epoch": 5336} {"train_loss": -27.042203903198242, "global_step": 442914, "epoch": 5336} {"train_loss": -27.047216415405273, "global_step": 442915, "epoch": 5336} {"train_loss": -27.024438858032227, "global_step": 442916, "epoch": 5336} {"train_loss": -26.840835571289062, "global_step": 442917, "epoch": 5336} {"train_loss": -27.241168975830078, "global_step": 442918, "epoch": 5336} {"train_loss": -26.745227813720703, "global_step": 442919, "epoch": 5336} {"train_loss": -26.9958438873291, "global_step": 442920, "epoch": 5336} {"train_loss": -27.07526969909668, "global_step": 442921, "epoch": 5336} {"train_loss": -27.008886337280273, "global_step": 442922, "epoch": 5336} {"train_loss": -26.868505477905273, "global_step": 442923, "epoch": 5336} {"train_loss": -26.879547119140625, "global_step": 442924, "epoch": 5336} {"train_loss": -27.09946060180664, "global_step": 442925, "epoch": 5336} {"train_loss": -26.971240997314453, "global_step": 442926, "epoch": 5336} {"train_loss": -26.84893798828125, "global_step": 442927, "epoch": 5336} {"train_loss": -27.184906005859375, "global_step": 442928, "epoch": 5336} {"train_loss": -26.8162899017334, "global_step": 442929, "epoch": 5336} {"train_loss": -26.986083984375, "global_step": 442930, "epoch": 5336} {"train_loss": -26.988677978515625, "global_step": 442931, "epoch": 5336} {"train_loss": -26.84511375427246, "global_step": 442932, "epoch": 5336} {"train_loss": -27.004514694213867, "global_step": 442933, "epoch": 5336} {"train_loss": -27.072629928588867, "global_step": 442934, "epoch": 5336} {"train_loss": -26.981082916259766, "global_step": 442935, "epoch": 5336} {"train_loss": -26.940099716186523, "global_step": 442936, "epoch": 5336} {"train_loss": -27.160959243774414, "global_step": 442937, "epoch": 5336} {"train_loss": -26.902973175048828, "global_step": 442938, "epoch": 5336} {"train_loss": -27.05072593688965, "global_step": 442939, "epoch": 5336} {"train_loss": -27.3485107421875, "global_step": 442940, "epoch": 5336} {"train_loss": -26.8903865814209, "global_step": 442941, "epoch": 5336} {"train_loss": -26.838102340698242, "global_step": 442942, "epoch": 5336} {"train_loss": -26.87603187561035, "global_step": 442943, "epoch": 5336} {"train_loss": -26.5980167388916, "global_step": 442944, "epoch": 5336} {"train_loss": -26.470855712890625, "global_step": 442945, "epoch": 5336} {"train_loss": -26.984039306640625, "global_step": 442946, "epoch": 5336} {"train_loss": -26.744714736938477, "global_step": 442947, "epoch": 5336} {"train_loss": -26.893346786499023, "global_step": 442948, "epoch": 5336} {"train_loss": -26.91731071472168, "global_step": 442949, "epoch": 5336} {"train_loss": -27.07330894470215, "global_step": 442950, "epoch": 5336} {"train_loss": -26.82380485534668, "global_step": 442951, "epoch": 5336} {"train_loss": -26.685388565063477, "global_step": 442952, "epoch": 5336} {"train_loss": -26.67732048034668, "global_step": 442953, "epoch": 5336} {"train_loss": -26.52908706665039, "global_step": 442954, "epoch": 5336} {"train_loss": -27.020267486572266, "global_step": 442955, "epoch": 5336} {"train_loss": -26.782678604125977, "global_step": 442956, "epoch": 5336} {"train_loss": -26.495468139648438, "global_step": 442957, "epoch": 5336} {"train_loss": -27.377349853515625, "global_step": 442958, "epoch": 5336} {"train_loss": -26.817249298095703, "global_step": 442959, "epoch": 5336} {"train_loss": -26.90675926208496, "global_step": 442960, "epoch": 5336} {"train_loss": -26.92923355102539, "global_step": 442961, "epoch": 5336} {"train_loss": -26.773427963256836, "global_step": 442962, "epoch": 5336} {"train_loss": -26.7543888092041, "global_step": 442963, "epoch": 5336} {"train_loss": -26.907760620117188, "global_step": 442964, "epoch": 5336} {"train_loss": -26.872268676757812, "global_step": 442965, "epoch": 5336} {"train_loss": -26.948810577392578, "global_step": 442966, "epoch": 5336} {"train_loss": -27.07401466369629, "global_step": 442967, "epoch": 5336} {"train_loss": -27.11060905456543, "global_step": 442968, "epoch": 5336} {"train_loss": -26.628921508789062, "global_step": 442969, "epoch": 5336} {"train_loss": -26.8353208289089, "global_step": 442970, "epoch": 5336, "val_loss": 6606274.0} {"train_loss": -27.04495620727539, "global_step": 442971, "epoch": 5337} {"train_loss": -25.6229190826416, "global_step": 442972, "epoch": 5337} {"train_loss": -26.159177780151367, "global_step": 442973, "epoch": 5337} {"train_loss": -26.4893798828125, "global_step": 442974, "epoch": 5337} {"train_loss": -26.537118911743164, "global_step": 442975, "epoch": 5337} {"train_loss": -25.871877670288086, "global_step": 442976, "epoch": 5337} {"train_loss": -26.870380401611328, "global_step": 442977, "epoch": 5337} {"train_loss": -26.7860164642334, "global_step": 442978, "epoch": 5337} {"train_loss": -26.881122589111328, "global_step": 442979, "epoch": 5337} {"train_loss": -26.37104606628418, "global_step": 442980, "epoch": 5337} {"train_loss": -26.9620361328125, "global_step": 442981, "epoch": 5337} {"train_loss": -26.786468505859375, "global_step": 442982, "epoch": 5337} {"train_loss": -26.616077423095703, "global_step": 442983, "epoch": 5337} {"train_loss": -26.817800521850586, "global_step": 442984, "epoch": 5337} {"train_loss": -26.442541122436523, "global_step": 442985, "epoch": 5337} {"train_loss": -26.710172653198242, "global_step": 442986, "epoch": 5337} {"train_loss": -26.632322311401367, "global_step": 442987, "epoch": 5337} {"train_loss": -26.861495971679688, "global_step": 442988, "epoch": 5337} {"train_loss": -26.897979736328125, "global_step": 442989, "epoch": 5337} {"train_loss": -26.847091674804688, "global_step": 442990, "epoch": 5337} {"train_loss": -26.966968536376953, "global_step": 442991, "epoch": 5337} {"train_loss": -26.943387985229492, "global_step": 442992, "epoch": 5337} {"train_loss": -27.2166748046875, "global_step": 442993, "epoch": 5337} {"train_loss": -27.0773983001709, "global_step": 442994, "epoch": 5337} {"train_loss": -26.825281143188477, "global_step": 442995, "epoch": 5337} {"train_loss": -26.769580841064453, "global_step": 442996, "epoch": 5337} {"train_loss": -26.66437339782715, "global_step": 442997, "epoch": 5337} {"train_loss": -26.830286026000977, "global_step": 442998, "epoch": 5337} {"train_loss": -27.088348388671875, "global_step": 442999, "epoch": 5337} {"train_loss": -27.004810333251953, "global_step": 443000, "epoch": 5337} {"train_loss": -26.855167388916016, "global_step": 443001, "epoch": 5337} {"train_loss": -27.38933753967285, "global_step": 443002, "epoch": 5337} {"train_loss": -27.115034103393555, "global_step": 443003, "epoch": 5337} {"train_loss": -26.65691566467285, "global_step": 443004, "epoch": 5337} {"train_loss": -26.990671157836914, "global_step": 443005, "epoch": 5337} {"train_loss": -27.147003173828125, "global_step": 443006, "epoch": 5337} {"train_loss": -26.709630966186523, "global_step": 443007, "epoch": 5337} {"train_loss": -26.828372955322266, "global_step": 443008, "epoch": 5337} {"train_loss": -26.979694366455078, "global_step": 443009, "epoch": 5337} {"train_loss": -26.97186851501465, "global_step": 443010, "epoch": 5337} {"train_loss": -26.788833618164062, "global_step": 443011, "epoch": 5337} {"train_loss": -26.972644805908203, "global_step": 443012, "epoch": 5337} {"train_loss": -26.981210708618164, "global_step": 443013, "epoch": 5337} {"train_loss": -26.819625854492188, "global_step": 443014, "epoch": 5337} {"train_loss": -26.742517471313477, "global_step": 443015, "epoch": 5337} {"train_loss": -27.570117950439453, "global_step": 443016, "epoch": 5337} {"train_loss": -26.626962661743164, "global_step": 443017, "epoch": 5337} {"train_loss": -26.763391494750977, "global_step": 443018, "epoch": 5337} {"train_loss": -26.801166534423828, "global_step": 443019, "epoch": 5337} {"train_loss": -27.272809982299805, "global_step": 443020, "epoch": 5337} {"train_loss": -27.109888076782227, "global_step": 443021, "epoch": 5337} {"train_loss": -26.564300537109375, "global_step": 443022, "epoch": 5337} {"train_loss": -27.04070472717285, "global_step": 443023, "epoch": 5337} {"train_loss": -27.019718170166016, "global_step": 443024, "epoch": 5337} {"train_loss": -26.7261905670166, "global_step": 443025, "epoch": 5337} {"train_loss": -27.179059982299805, "global_step": 443026, "epoch": 5337} {"train_loss": -26.827062606811523, "global_step": 443027, "epoch": 5337} {"train_loss": -27.3147029876709, "global_step": 443028, "epoch": 5337} {"train_loss": -27.0195369720459, "global_step": 443029, "epoch": 5337} {"train_loss": -26.869184494018555, "global_step": 443030, "epoch": 5337} {"train_loss": -26.946069717407227, "global_step": 443031, "epoch": 5337} {"train_loss": -27.02817726135254, "global_step": 443032, "epoch": 5337} {"train_loss": -26.9541015625, "global_step": 443033, "epoch": 5337} {"train_loss": -27.019556045532227, "global_step": 443034, "epoch": 5337} {"train_loss": -27.0653076171875, "global_step": 443035, "epoch": 5337} {"train_loss": -26.85536766052246, "global_step": 443036, "epoch": 5337} {"train_loss": -26.722278594970703, "global_step": 443037, "epoch": 5337} {"train_loss": -27.05824851989746, "global_step": 443038, "epoch": 5337} {"train_loss": -26.9658145904541, "global_step": 443039, "epoch": 5337} {"train_loss": -26.638952255249023, "global_step": 443040, "epoch": 5337} {"train_loss": -27.431838989257812, "global_step": 443041, "epoch": 5337} {"train_loss": -27.31293296813965, "global_step": 443042, "epoch": 5337} {"train_loss": -27.029752731323242, "global_step": 443043, "epoch": 5337} {"train_loss": -27.167016983032227, "global_step": 443044, "epoch": 5337} {"train_loss": -26.95271873474121, "global_step": 443045, "epoch": 5337} {"train_loss": -26.885961532592773, "global_step": 443046, "epoch": 5337} {"train_loss": -26.954442977905273, "global_step": 443047, "epoch": 5337} {"train_loss": -27.212493896484375, "global_step": 443048, "epoch": 5337} {"train_loss": -27.194082260131836, "global_step": 443049, "epoch": 5337} {"train_loss": -26.80437660217285, "global_step": 443050, "epoch": 5337} {"train_loss": -26.959501266479492, "global_step": 443051, "epoch": 5337} {"train_loss": -27.043569564819336, "global_step": 443052, "epoch": 5337} {"train_loss": -26.87371419424034, "global_step": 443053, "epoch": 5337, "val_loss": 6704940.0} {"train_loss": -26.630767822265625, "global_step": 443054, "epoch": 5338} {"train_loss": -25.71476173400879, "global_step": 443055, "epoch": 5338} {"train_loss": -25.81452751159668, "global_step": 443056, "epoch": 5338} {"train_loss": -25.220447540283203, "global_step": 443057, "epoch": 5338} {"train_loss": -25.489774703979492, "global_step": 443058, "epoch": 5338} {"train_loss": -26.499120712280273, "global_step": 443059, "epoch": 5338} {"train_loss": -26.162267684936523, "global_step": 443060, "epoch": 5338} {"train_loss": -25.201993942260742, "global_step": 443061, "epoch": 5338} {"train_loss": -26.42913246154785, "global_step": 443062, "epoch": 5338} {"train_loss": -26.055927276611328, "global_step": 443063, "epoch": 5338} {"train_loss": -26.167760848999023, "global_step": 443064, "epoch": 5338} {"train_loss": -26.017282485961914, "global_step": 443065, "epoch": 5338} {"train_loss": -26.065460205078125, "global_step": 443066, "epoch": 5338} {"train_loss": -26.622846603393555, "global_step": 443067, "epoch": 5338} {"train_loss": -26.24664878845215, "global_step": 443068, "epoch": 5338} {"train_loss": -26.51008415222168, "global_step": 443069, "epoch": 5338} {"train_loss": -26.277912139892578, "global_step": 443070, "epoch": 5338} {"train_loss": -26.621240615844727, "global_step": 443071, "epoch": 5338} {"train_loss": -26.412322998046875, "global_step": 443072, "epoch": 5338} {"train_loss": -26.357330322265625, "global_step": 443073, "epoch": 5338} {"train_loss": -26.42938804626465, "global_step": 443074, "epoch": 5338} {"train_loss": -26.59149742126465, "global_step": 443075, "epoch": 5338} {"train_loss": -26.59226417541504, "global_step": 443076, "epoch": 5338} {"train_loss": -26.666715621948242, "global_step": 443077, "epoch": 5338} {"train_loss": -26.446792602539062, "global_step": 443078, "epoch": 5338} {"train_loss": -26.921232223510742, "global_step": 443079, "epoch": 5338} {"train_loss": -26.684864044189453, "global_step": 443080, "epoch": 5338} {"train_loss": -27.0006160736084, "global_step": 443081, "epoch": 5338} {"train_loss": -26.65279197692871, "global_step": 443082, "epoch": 5338} {"train_loss": -26.840280532836914, "global_step": 443083, "epoch": 5338} {"train_loss": -26.901214599609375, "global_step": 443084, "epoch": 5338} {"train_loss": -26.86878776550293, "global_step": 443085, "epoch": 5338} {"train_loss": -27.1829833984375, "global_step": 443086, "epoch": 5338} {"train_loss": -26.840076446533203, "global_step": 443087, "epoch": 5338} {"train_loss": -26.67268180847168, "global_step": 443088, "epoch": 5338} {"train_loss": -27.103439331054688, "global_step": 443089, "epoch": 5338} {"train_loss": -26.723819732666016, "global_step": 443090, "epoch": 5338} {"train_loss": -26.928159713745117, "global_step": 443091, "epoch": 5338} {"train_loss": -27.1016845703125, "global_step": 443092, "epoch": 5338} {"train_loss": -26.97334098815918, "global_step": 443093, "epoch": 5338} {"train_loss": -27.17707633972168, "global_step": 443094, "epoch": 5338} {"train_loss": -26.78936767578125, "global_step": 443095, "epoch": 5338} {"train_loss": -27.230993270874023, "global_step": 443096, "epoch": 5338} {"train_loss": -27.020252227783203, "global_step": 443097, "epoch": 5338} {"train_loss": -27.02679443359375, "global_step": 443098, "epoch": 5338} {"train_loss": -27.01148796081543, "global_step": 443099, "epoch": 5338} {"train_loss": -27.276391983032227, "global_step": 443100, "epoch": 5338} {"train_loss": -27.064741134643555, "global_step": 443101, "epoch": 5338} {"train_loss": -27.0228214263916, "global_step": 443102, "epoch": 5338} {"train_loss": -27.1329288482666, "global_step": 443103, "epoch": 5338} {"train_loss": -27.096939086914062, "global_step": 443104, "epoch": 5338} {"train_loss": -27.096506118774414, "global_step": 443105, "epoch": 5338} {"train_loss": -27.121397018432617, "global_step": 443106, "epoch": 5338} {"train_loss": -27.0594425201416, "global_step": 443107, "epoch": 5338} {"train_loss": -26.853668212890625, "global_step": 443108, "epoch": 5338} {"train_loss": -27.541412353515625, "global_step": 443109, "epoch": 5338} {"train_loss": -27.139423370361328, "global_step": 443110, "epoch": 5338} {"train_loss": -27.079971313476562, "global_step": 443111, "epoch": 5338} {"train_loss": -26.581024169921875, "global_step": 443112, "epoch": 5338} {"train_loss": -27.32283592224121, "global_step": 443113, "epoch": 5338} {"train_loss": -27.11103630065918, "global_step": 443114, "epoch": 5338} {"train_loss": -27.32563591003418, "global_step": 443115, "epoch": 5338} {"train_loss": -27.14339256286621, "global_step": 443116, "epoch": 5338} {"train_loss": -26.936857223510742, "global_step": 443117, "epoch": 5338} {"train_loss": -27.0994930267334, "global_step": 443118, "epoch": 5338} {"train_loss": -26.58249855041504, "global_step": 443119, "epoch": 5338} {"train_loss": -27.204486846923828, "global_step": 443120, "epoch": 5338} {"train_loss": -26.865808486938477, "global_step": 443121, "epoch": 5338} {"train_loss": -27.2733154296875, "global_step": 443122, "epoch": 5338} {"train_loss": -26.824909210205078, "global_step": 443123, "epoch": 5338} {"train_loss": -27.293659210205078, "global_step": 443124, "epoch": 5338} {"train_loss": -26.713821411132812, "global_step": 443125, "epoch": 5338} {"train_loss": -27.03865623474121, "global_step": 443126, "epoch": 5338} {"train_loss": -26.960296630859375, "global_step": 443127, "epoch": 5338} {"train_loss": -27.107532501220703, "global_step": 443128, "epoch": 5338} {"train_loss": -27.436054229736328, "global_step": 443129, "epoch": 5338} {"train_loss": -27.176416397094727, "global_step": 443130, "epoch": 5338} {"train_loss": -26.997268676757812, "global_step": 443131, "epoch": 5338} {"train_loss": -26.613000869750977, "global_step": 443132, "epoch": 5338} {"train_loss": -27.04277992248535, "global_step": 443133, "epoch": 5338} {"train_loss": -27.301990509033203, "global_step": 443134, "epoch": 5338} {"train_loss": -27.069721221923828, "global_step": 443135, "epoch": 5338} {"train_loss": -26.78035154687353, "global_step": 443136, "epoch": 5338, "val_loss": 6612089.0} {"train_loss": -26.325841903686523, "global_step": 443137, "epoch": 5339} {"train_loss": -25.76619529724121, "global_step": 443138, "epoch": 5339} {"train_loss": -24.970460891723633, "global_step": 443139, "epoch": 5339} {"train_loss": -24.856412887573242, "global_step": 443140, "epoch": 5339} {"train_loss": -26.280780792236328, "global_step": 443141, "epoch": 5339} {"train_loss": -25.733840942382812, "global_step": 443142, "epoch": 5339} {"train_loss": -25.37355613708496, "global_step": 443143, "epoch": 5339} {"train_loss": -25.941638946533203, "global_step": 443144, "epoch": 5339} {"train_loss": -25.9810791015625, "global_step": 443145, "epoch": 5339} {"train_loss": -26.117116928100586, "global_step": 443146, "epoch": 5339} {"train_loss": -26.292774200439453, "global_step": 443147, "epoch": 5339} {"train_loss": -25.9150333404541, "global_step": 443148, "epoch": 5339} {"train_loss": -26.361072540283203, "global_step": 443149, "epoch": 5339} {"train_loss": -26.242944717407227, "global_step": 443150, "epoch": 5339} {"train_loss": -26.40142822265625, "global_step": 443151, "epoch": 5339} {"train_loss": -26.51810073852539, "global_step": 443152, "epoch": 5339} {"train_loss": -26.002655029296875, "global_step": 443153, "epoch": 5339} {"train_loss": -26.33357810974121, "global_step": 443154, "epoch": 5339} {"train_loss": -26.149627685546875, "global_step": 443155, "epoch": 5339} {"train_loss": -26.343555450439453, "global_step": 443156, "epoch": 5339} {"train_loss": -26.420629501342773, "global_step": 443157, "epoch": 5339} {"train_loss": -26.213266372680664, "global_step": 443158, "epoch": 5339} {"train_loss": -26.05739402770996, "global_step": 443159, "epoch": 5339} {"train_loss": -26.39643669128418, "global_step": 443160, "epoch": 5339} {"train_loss": -26.408737182617188, "global_step": 443161, "epoch": 5339} {"train_loss": -26.380212783813477, "global_step": 443162, "epoch": 5339} {"train_loss": -26.39229393005371, "global_step": 443163, "epoch": 5339} {"train_loss": -26.92302894592285, "global_step": 443164, "epoch": 5339} {"train_loss": -26.5594539642334, "global_step": 443165, "epoch": 5339} {"train_loss": -26.78074073791504, "global_step": 443166, "epoch": 5339} {"train_loss": -26.8061466217041, "global_step": 443167, "epoch": 5339} {"train_loss": -27.050373077392578, "global_step": 443168, "epoch": 5339} {"train_loss": -26.58733558654785, "global_step": 443169, "epoch": 5339} {"train_loss": -26.6995849609375, "global_step": 443170, "epoch": 5339} {"train_loss": -26.7535457611084, "global_step": 443171, "epoch": 5339} {"train_loss": -27.027912139892578, "global_step": 443172, "epoch": 5339} {"train_loss": -26.654111862182617, "global_step": 443173, "epoch": 5339} {"train_loss": -26.86328125, "global_step": 443174, "epoch": 5339} {"train_loss": -26.806060791015625, "global_step": 443175, "epoch": 5339} {"train_loss": -26.8727970123291, "global_step": 443176, "epoch": 5339} {"train_loss": -26.83961296081543, "global_step": 443177, "epoch": 5339} {"train_loss": -26.97809410095215, "global_step": 443178, "epoch": 5339} {"train_loss": -27.167882919311523, "global_step": 443179, "epoch": 5339} {"train_loss": -26.988494873046875, "global_step": 443180, "epoch": 5339} {"train_loss": -27.054712295532227, "global_step": 443181, "epoch": 5339} {"train_loss": -27.011932373046875, "global_step": 443182, "epoch": 5339} {"train_loss": -27.012807846069336, "global_step": 443183, "epoch": 5339} {"train_loss": -27.4672794342041, "global_step": 443184, "epoch": 5339} {"train_loss": -26.957813262939453, "global_step": 443185, "epoch": 5339} {"train_loss": -27.025421142578125, "global_step": 443186, "epoch": 5339} {"train_loss": -26.962182998657227, "global_step": 443187, "epoch": 5339} {"train_loss": -27.281646728515625, "global_step": 443188, "epoch": 5339} {"train_loss": -27.121158599853516, "global_step": 443189, "epoch": 5339} {"train_loss": -27.21992301940918, "global_step": 443190, "epoch": 5339} {"train_loss": -27.389225006103516, "global_step": 443191, "epoch": 5339} {"train_loss": -27.146625518798828, "global_step": 443192, "epoch": 5339} {"train_loss": -27.367053985595703, "global_step": 443193, "epoch": 5339} {"train_loss": -27.085586547851562, "global_step": 443194, "epoch": 5339} {"train_loss": -27.05306053161621, "global_step": 443195, "epoch": 5339} {"train_loss": -27.062360763549805, "global_step": 443196, "epoch": 5339} {"train_loss": -27.416593551635742, "global_step": 443197, "epoch": 5339} {"train_loss": -27.295337677001953, "global_step": 443198, "epoch": 5339} {"train_loss": -27.112340927124023, "global_step": 443199, "epoch": 5339} {"train_loss": -27.08711814880371, "global_step": 443200, "epoch": 5339} {"train_loss": -26.991962432861328, "global_step": 443201, "epoch": 5339} {"train_loss": -26.9593448638916, "global_step": 443202, "epoch": 5339} {"train_loss": -26.90836524963379, "global_step": 443203, "epoch": 5339} {"train_loss": -26.82073402404785, "global_step": 443204, "epoch": 5339} {"train_loss": -27.443159103393555, "global_step": 443205, "epoch": 5339} {"train_loss": -27.0656681060791, "global_step": 443206, "epoch": 5339} {"train_loss": -27.27027702331543, "global_step": 443207, "epoch": 5339} {"train_loss": -27.282995223999023, "global_step": 443208, "epoch": 5339} {"train_loss": -27.460037231445312, "global_step": 443209, "epoch": 5339} {"train_loss": -27.334089279174805, "global_step": 443210, "epoch": 5339} {"train_loss": -27.264379501342773, "global_step": 443211, "epoch": 5339} {"train_loss": -26.956226348876953, "global_step": 443212, "epoch": 5339} {"train_loss": -27.136606216430664, "global_step": 443213, "epoch": 5339} {"train_loss": -27.36319351196289, "global_step": 443214, "epoch": 5339} {"train_loss": -27.305448532104492, "global_step": 443215, "epoch": 5339} {"train_loss": -26.672317504882812, "global_step": 443216, "epoch": 5339} {"train_loss": -26.50348472595215, "global_step": 443217, "epoch": 5339} {"train_loss": -26.511566162109375, "global_step": 443218, "epoch": 5339} {"train_loss": -26.718854720333972, "global_step": 443219, "epoch": 5339, "val_loss": 6618286.0} {"train_loss": -24.008249282836914, "global_step": 443220, "epoch": 5340} {"train_loss": -21.84662437438965, "global_step": 443221, "epoch": 5340} {"train_loss": -24.522216796875, "global_step": 443222, "epoch": 5340} {"train_loss": -23.82933235168457, "global_step": 443223, "epoch": 5340} {"train_loss": -24.52747344970703, "global_step": 443224, "epoch": 5340} {"train_loss": -24.82098388671875, "global_step": 443225, "epoch": 5340} {"train_loss": -24.94818115234375, "global_step": 443226, "epoch": 5340} {"train_loss": -24.79299545288086, "global_step": 443227, "epoch": 5340} {"train_loss": -25.519758224487305, "global_step": 443228, "epoch": 5340} {"train_loss": -24.900959014892578, "global_step": 443229, "epoch": 5340} {"train_loss": -25.139585494995117, "global_step": 443230, "epoch": 5340} {"train_loss": -25.83039665222168, "global_step": 443231, "epoch": 5340} {"train_loss": -25.355501174926758, "global_step": 443232, "epoch": 5340} {"train_loss": -24.927051544189453, "global_step": 443233, "epoch": 5340} {"train_loss": -25.43292236328125, "global_step": 443234, "epoch": 5340} {"train_loss": -25.696399688720703, "global_step": 443235, "epoch": 5340} {"train_loss": -25.867883682250977, "global_step": 443236, "epoch": 5340} {"train_loss": -25.239965438842773, "global_step": 443237, "epoch": 5340} {"train_loss": -25.469181060791016, "global_step": 443238, "epoch": 5340} {"train_loss": -25.852371215820312, "global_step": 443239, "epoch": 5340} {"train_loss": -26.026947021484375, "global_step": 443240, "epoch": 5340} {"train_loss": -25.88958168029785, "global_step": 443241, "epoch": 5340} {"train_loss": -25.64143180847168, "global_step": 443242, "epoch": 5340} {"train_loss": -25.774982452392578, "global_step": 443243, "epoch": 5340} {"train_loss": -26.042104721069336, "global_step": 443244, "epoch": 5340} {"train_loss": -26.240726470947266, "global_step": 443245, "epoch": 5340} {"train_loss": -26.16778564453125, "global_step": 443246, "epoch": 5340} {"train_loss": -26.186279296875, "global_step": 443247, "epoch": 5340} {"train_loss": -25.920989990234375, "global_step": 443248, "epoch": 5340} {"train_loss": -26.20427894592285, "global_step": 443249, "epoch": 5340} {"train_loss": -26.342193603515625, "global_step": 443250, "epoch": 5340} {"train_loss": -26.379531860351562, "global_step": 443251, "epoch": 5340} {"train_loss": -26.53325843811035, "global_step": 443252, "epoch": 5340} {"train_loss": -26.280303955078125, "global_step": 443253, "epoch": 5340} {"train_loss": -26.250524520874023, "global_step": 443254, "epoch": 5340} {"train_loss": -26.552417755126953, "global_step": 443255, "epoch": 5340} {"train_loss": -26.633319854736328, "global_step": 443256, "epoch": 5340} {"train_loss": -26.198007583618164, "global_step": 443257, "epoch": 5340} {"train_loss": -26.423263549804688, "global_step": 443258, "epoch": 5340} {"train_loss": -26.248010635375977, "global_step": 443259, "epoch": 5340} {"train_loss": -26.493865966796875, "global_step": 443260, "epoch": 5340} {"train_loss": -26.71624755859375, "global_step": 443261, "epoch": 5340} {"train_loss": -26.644311904907227, "global_step": 443262, "epoch": 5340} {"train_loss": -26.651784896850586, "global_step": 443263, "epoch": 5340} {"train_loss": -26.81791114807129, "global_step": 443264, "epoch": 5340} {"train_loss": -26.635034561157227, "global_step": 443265, "epoch": 5340} {"train_loss": -26.682174682617188, "global_step": 443266, "epoch": 5340} {"train_loss": -27.025699615478516, "global_step": 443267, "epoch": 5340} {"train_loss": -26.83607292175293, "global_step": 443268, "epoch": 5340} {"train_loss": -27.426679611206055, "global_step": 443269, "epoch": 5340} {"train_loss": -26.3692626953125, "global_step": 443270, "epoch": 5340} {"train_loss": -27.026824951171875, "global_step": 443271, "epoch": 5340} {"train_loss": -26.895751953125, "global_step": 443272, "epoch": 5340} {"train_loss": -26.613489151000977, "global_step": 443273, "epoch": 5340} {"train_loss": -26.504587173461914, "global_step": 443274, "epoch": 5340} {"train_loss": -26.995527267456055, "global_step": 443275, "epoch": 5340} {"train_loss": -26.891992568969727, "global_step": 443276, "epoch": 5340} {"train_loss": -26.834882736206055, "global_step": 443277, "epoch": 5340} {"train_loss": -26.887426376342773, "global_step": 443278, "epoch": 5340} {"train_loss": -27.11421775817871, "global_step": 443279, "epoch": 5340} {"train_loss": -27.129545211791992, "global_step": 443280, "epoch": 5340} {"train_loss": -27.384296417236328, "global_step": 443281, "epoch": 5340} {"train_loss": -27.19807243347168, "global_step": 443282, "epoch": 5340} {"train_loss": -27.358678817749023, "global_step": 443283, "epoch": 5340} {"train_loss": -27.135120391845703, "global_step": 443284, "epoch": 5340} {"train_loss": -26.874820709228516, "global_step": 443285, "epoch": 5340} {"train_loss": -27.1079158782959, "global_step": 443286, "epoch": 5340} {"train_loss": -27.11813735961914, "global_step": 443287, "epoch": 5340} {"train_loss": -27.2790470123291, "global_step": 443288, "epoch": 5340} {"train_loss": -27.102869033813477, "global_step": 443289, "epoch": 5340} {"train_loss": -27.180200576782227, "global_step": 443290, "epoch": 5340} {"train_loss": -27.645116806030273, "global_step": 443291, "epoch": 5340} {"train_loss": -26.6915225982666, "global_step": 443292, "epoch": 5340} {"train_loss": -26.812231063842773, "global_step": 443293, "epoch": 5340} {"train_loss": -27.03076171875, "global_step": 443294, "epoch": 5340} {"train_loss": -27.029279708862305, "global_step": 443295, "epoch": 5340} {"train_loss": -27.01375389099121, "global_step": 443296, "epoch": 5340} {"train_loss": -27.09235954284668, "global_step": 443297, "epoch": 5340} {"train_loss": -26.967756271362305, "global_step": 443298, "epoch": 5340} {"train_loss": -26.942625045776367, "global_step": 443299, "epoch": 5340} {"train_loss": -26.99567222595215, "global_step": 443300, "epoch": 5340} {"train_loss": -26.690704345703125, "global_step": 443301, "epoch": 5340} {"train_loss": -26.28772344933935, "global_step": 443302, "epoch": 5340, "val_loss": 6600742.0} {"train_loss": -26.970977783203125, "global_step": 443303, "epoch": 5341} {"train_loss": -26.66187858581543, "global_step": 443304, "epoch": 5341} {"train_loss": -26.672460556030273, "global_step": 443305, "epoch": 5341} {"train_loss": -26.303848266601562, "global_step": 443306, "epoch": 5341} {"train_loss": -26.795486450195312, "global_step": 443307, "epoch": 5341} {"train_loss": -27.079126358032227, "global_step": 443308, "epoch": 5341} {"train_loss": -27.278446197509766, "global_step": 443309, "epoch": 5341} {"train_loss": -26.82379722595215, "global_step": 443310, "epoch": 5341} {"train_loss": -27.28803825378418, "global_step": 443311, "epoch": 5341} {"train_loss": -26.88960838317871, "global_step": 443312, "epoch": 5341} {"train_loss": -27.009857177734375, "global_step": 443313, "epoch": 5341} {"train_loss": -27.1621150970459, "global_step": 443314, "epoch": 5341} {"train_loss": -27.4730281829834, "global_step": 443315, "epoch": 5341} {"train_loss": -26.75269889831543, "global_step": 443316, "epoch": 5341} {"train_loss": -27.05820083618164, "global_step": 443317, "epoch": 5341} {"train_loss": -27.199188232421875, "global_step": 443318, "epoch": 5341} {"train_loss": -26.818246841430664, "global_step": 443319, "epoch": 5341} {"train_loss": -26.6922607421875, "global_step": 443320, "epoch": 5341} {"train_loss": -27.31463050842285, "global_step": 443321, "epoch": 5341} {"train_loss": -27.188425064086914, "global_step": 443322, "epoch": 5341} {"train_loss": -26.889755249023438, "global_step": 443323, "epoch": 5341} {"train_loss": -27.06656837463379, "global_step": 443324, "epoch": 5341} {"train_loss": -27.46381187438965, "global_step": 443325, "epoch": 5341} {"train_loss": -27.274398803710938, "global_step": 443326, "epoch": 5341} {"train_loss": -27.116601943969727, "global_step": 443327, "epoch": 5341} {"train_loss": -26.816436767578125, "global_step": 443328, "epoch": 5341} {"train_loss": -27.006635665893555, "global_step": 443329, "epoch": 5341} {"train_loss": -27.116872787475586, "global_step": 443330, "epoch": 5341} {"train_loss": -27.10512351989746, "global_step": 443331, "epoch": 5341} {"train_loss": -27.33719825744629, "global_step": 443332, "epoch": 5341} {"train_loss": -27.1425724029541, "global_step": 443333, "epoch": 5341} {"train_loss": -27.220600128173828, "global_step": 443334, "epoch": 5341} {"train_loss": -27.00062370300293, "global_step": 443335, "epoch": 5341} {"train_loss": -27.305652618408203, "global_step": 443336, "epoch": 5341} {"train_loss": -27.198888778686523, "global_step": 443337, "epoch": 5341} {"train_loss": -26.9694766998291, "global_step": 443338, "epoch": 5341} {"train_loss": -27.03183937072754, "global_step": 443339, "epoch": 5341} {"train_loss": -27.02923011779785, "global_step": 443340, "epoch": 5341} {"train_loss": -26.8553466796875, "global_step": 443341, "epoch": 5341} {"train_loss": -27.0010929107666, "global_step": 443342, "epoch": 5341} {"train_loss": -27.195531845092773, "global_step": 443343, "epoch": 5341} {"train_loss": -26.54981803894043, "global_step": 443344, "epoch": 5341} {"train_loss": -27.01177406311035, "global_step": 443345, "epoch": 5341} {"train_loss": -26.8204345703125, "global_step": 443346, "epoch": 5341} {"train_loss": -26.828510284423828, "global_step": 443347, "epoch": 5341} {"train_loss": -27.016096115112305, "global_step": 443348, "epoch": 5341} {"train_loss": -26.83746337890625, "global_step": 443349, "epoch": 5341} {"train_loss": -26.389368057250977, "global_step": 443350, "epoch": 5341} {"train_loss": -26.77728271484375, "global_step": 443351, "epoch": 5341} {"train_loss": -26.540191650390625, "global_step": 443352, "epoch": 5341} {"train_loss": -26.571683883666992, "global_step": 443353, "epoch": 5341} {"train_loss": -26.950469970703125, "global_step": 443354, "epoch": 5341} {"train_loss": -26.52170181274414, "global_step": 443355, "epoch": 5341} {"train_loss": -26.807165145874023, "global_step": 443356, "epoch": 5341} {"train_loss": -26.972375869750977, "global_step": 443357, "epoch": 5341} {"train_loss": -26.977569580078125, "global_step": 443358, "epoch": 5341} {"train_loss": -26.92184829711914, "global_step": 443359, "epoch": 5341} {"train_loss": -27.19380760192871, "global_step": 443360, "epoch": 5341} {"train_loss": -27.329727172851562, "global_step": 443361, "epoch": 5341} {"train_loss": -27.021459579467773, "global_step": 443362, "epoch": 5341} {"train_loss": -26.6298770904541, "global_step": 443363, "epoch": 5341} {"train_loss": -27.2388973236084, "global_step": 443364, "epoch": 5341} {"train_loss": -26.74561882019043, "global_step": 443365, "epoch": 5341} {"train_loss": -26.914457321166992, "global_step": 443366, "epoch": 5341} {"train_loss": -26.967151641845703, "global_step": 443367, "epoch": 5341} {"train_loss": -26.984716415405273, "global_step": 443368, "epoch": 5341} {"train_loss": -26.710922241210938, "global_step": 443369, "epoch": 5341} {"train_loss": -26.760095596313477, "global_step": 443370, "epoch": 5341} {"train_loss": -27.127105712890625, "global_step": 443371, "epoch": 5341} {"train_loss": -27.138263702392578, "global_step": 443372, "epoch": 5341} {"train_loss": -26.92725944519043, "global_step": 443373, "epoch": 5341} {"train_loss": -27.134984970092773, "global_step": 443374, "epoch": 5341} {"train_loss": -27.230209350585938, "global_step": 443375, "epoch": 5341} {"train_loss": -26.976545333862305, "global_step": 443376, "epoch": 5341} {"train_loss": -26.93293571472168, "global_step": 443377, "epoch": 5341} {"train_loss": -26.71075439453125, "global_step": 443378, "epoch": 5341} {"train_loss": -26.815515518188477, "global_step": 443379, "epoch": 5341} {"train_loss": -26.759429931640625, "global_step": 443380, "epoch": 5341} {"train_loss": -27.18670654296875, "global_step": 443381, "epoch": 5341} {"train_loss": -26.5003604888916, "global_step": 443382, "epoch": 5341} {"train_loss": -26.951242446899414, "global_step": 443383, "epoch": 5341} {"train_loss": -27.03218650817871, "global_step": 443384, "epoch": 5341} {"train_loss": -26.957190042518707, "global_step": 443385, "epoch": 5341, "val_loss": 6578266.5} {"train_loss": -25.914426803588867, "global_step": 443386, "epoch": 5342} {"train_loss": -24.84061050415039, "global_step": 443387, "epoch": 5342} {"train_loss": -25.698017120361328, "global_step": 443388, "epoch": 5342} {"train_loss": -26.246353149414062, "global_step": 443389, "epoch": 5342} {"train_loss": -25.95400047302246, "global_step": 443390, "epoch": 5342} {"train_loss": -25.165884017944336, "global_step": 443391, "epoch": 5342} {"train_loss": -26.565418243408203, "global_step": 443392, "epoch": 5342} {"train_loss": -25.905658721923828, "global_step": 443393, "epoch": 5342} {"train_loss": -26.459035873413086, "global_step": 443394, "epoch": 5342} {"train_loss": -26.19516372680664, "global_step": 443395, "epoch": 5342} {"train_loss": -26.500457763671875, "global_step": 443396, "epoch": 5342} {"train_loss": -25.93560218811035, "global_step": 443397, "epoch": 5342} {"train_loss": -26.486459732055664, "global_step": 443398, "epoch": 5342} {"train_loss": -26.188663482666016, "global_step": 443399, "epoch": 5342} {"train_loss": -26.54388999938965, "global_step": 443400, "epoch": 5342} {"train_loss": -26.713520050048828, "global_step": 443401, "epoch": 5342} {"train_loss": -26.0119686126709, "global_step": 443402, "epoch": 5342} {"train_loss": -26.333911895751953, "global_step": 443403, "epoch": 5342} {"train_loss": -26.763986587524414, "global_step": 443404, "epoch": 5342} {"train_loss": -26.58509635925293, "global_step": 443405, "epoch": 5342} {"train_loss": -26.65325355529785, "global_step": 443406, "epoch": 5342} {"train_loss": -27.0272159576416, "global_step": 443407, "epoch": 5342} {"train_loss": -26.9041748046875, "global_step": 443408, "epoch": 5342} {"train_loss": -26.85658073425293, "global_step": 443409, "epoch": 5342} {"train_loss": -26.691425323486328, "global_step": 443410, "epoch": 5342} {"train_loss": -26.91034507751465, "global_step": 443411, "epoch": 5342} {"train_loss": -26.647586822509766, "global_step": 443412, "epoch": 5342} {"train_loss": -26.9527645111084, "global_step": 443413, "epoch": 5342} {"train_loss": -27.01104736328125, "global_step": 443414, "epoch": 5342} {"train_loss": -26.82439613342285, "global_step": 443415, "epoch": 5342} {"train_loss": -26.617645263671875, "global_step": 443416, "epoch": 5342} {"train_loss": -26.88645362854004, "global_step": 443417, "epoch": 5342} {"train_loss": -27.121734619140625, "global_step": 443418, "epoch": 5342} {"train_loss": -27.007232666015625, "global_step": 443419, "epoch": 5342} {"train_loss": -27.144392013549805, "global_step": 443420, "epoch": 5342} {"train_loss": -27.098846435546875, "global_step": 443421, "epoch": 5342} {"train_loss": -26.989248275756836, "global_step": 443422, "epoch": 5342} {"train_loss": -26.82529640197754, "global_step": 443423, "epoch": 5342} {"train_loss": -26.541288375854492, "global_step": 443424, "epoch": 5342} {"train_loss": -27.197463989257812, "global_step": 443425, "epoch": 5342} {"train_loss": -27.030548095703125, "global_step": 443426, "epoch": 5342} {"train_loss": -26.949193954467773, "global_step": 443427, "epoch": 5342} {"train_loss": -27.10672378540039, "global_step": 443428, "epoch": 5342} {"train_loss": -27.19862937927246, "global_step": 443429, "epoch": 5342} {"train_loss": -27.087278366088867, "global_step": 443430, "epoch": 5342} {"train_loss": -26.953611373901367, "global_step": 443431, "epoch": 5342} {"train_loss": -26.714990615844727, "global_step": 443432, "epoch": 5342} {"train_loss": -27.397357940673828, "global_step": 443433, "epoch": 5342} {"train_loss": -26.71937370300293, "global_step": 443434, "epoch": 5342} {"train_loss": -26.933551788330078, "global_step": 443435, "epoch": 5342} {"train_loss": -26.851552963256836, "global_step": 443436, "epoch": 5342} {"train_loss": -26.965356826782227, "global_step": 443437, "epoch": 5342} {"train_loss": -27.14150047302246, "global_step": 443438, "epoch": 5342} {"train_loss": -27.511463165283203, "global_step": 443439, "epoch": 5342} {"train_loss": -27.0644474029541, "global_step": 443440, "epoch": 5342} {"train_loss": -27.156946182250977, "global_step": 443441, "epoch": 5342} {"train_loss": -27.31867790222168, "global_step": 443442, "epoch": 5342} {"train_loss": -26.887723922729492, "global_step": 443443, "epoch": 5342} {"train_loss": -26.40897560119629, "global_step": 443444, "epoch": 5342} {"train_loss": -26.60943031311035, "global_step": 443445, "epoch": 5342} {"train_loss": -27.141462326049805, "global_step": 443446, "epoch": 5342} {"train_loss": -26.726179122924805, "global_step": 443447, "epoch": 5342} {"train_loss": -26.324934005737305, "global_step": 443448, "epoch": 5342} {"train_loss": -26.434717178344727, "global_step": 443449, "epoch": 5342} {"train_loss": -26.9462833404541, "global_step": 443450, "epoch": 5342} {"train_loss": -26.675739288330078, "global_step": 443451, "epoch": 5342} {"train_loss": -26.796161651611328, "global_step": 443452, "epoch": 5342} {"train_loss": -26.9366512298584, "global_step": 443453, "epoch": 5342} {"train_loss": -27.00147819519043, "global_step": 443454, "epoch": 5342} {"train_loss": -26.846628189086914, "global_step": 443455, "epoch": 5342} {"train_loss": -26.920927047729492, "global_step": 443456, "epoch": 5342} {"train_loss": -26.816186904907227, "global_step": 443457, "epoch": 5342} {"train_loss": -26.9931583404541, "global_step": 443458, "epoch": 5342} {"train_loss": -27.048236846923828, "global_step": 443459, "epoch": 5342} {"train_loss": -26.9240665435791, "global_step": 443460, "epoch": 5342} {"train_loss": -26.879186630249023, "global_step": 443461, "epoch": 5342} {"train_loss": -26.55523109436035, "global_step": 443462, "epoch": 5342} {"train_loss": -27.126235961914062, "global_step": 443463, "epoch": 5342} {"train_loss": -27.025537490844727, "global_step": 443464, "epoch": 5342} {"train_loss": -27.34711265563965, "global_step": 443465, "epoch": 5342} {"train_loss": -26.931720733642578, "global_step": 443466, "epoch": 5342} {"train_loss": -26.9252986907959, "global_step": 443467, "epoch": 5342} {"train_loss": -26.722914132727198, "global_step": 443468, "epoch": 5342, "val_loss": 6537511.0} {"train_loss": -26.18389320373535, "global_step": 443469, "epoch": 5343} {"train_loss": -26.287084579467773, "global_step": 443470, "epoch": 5343} {"train_loss": -26.47873306274414, "global_step": 443471, "epoch": 5343} {"train_loss": -26.467960357666016, "global_step": 443472, "epoch": 5343} {"train_loss": -26.047149658203125, "global_step": 443473, "epoch": 5343} {"train_loss": -26.366134643554688, "global_step": 443474, "epoch": 5343} {"train_loss": -26.715534210205078, "global_step": 443475, "epoch": 5343} {"train_loss": -26.161636352539062, "global_step": 443476, "epoch": 5343} {"train_loss": -26.478759765625, "global_step": 443477, "epoch": 5343} {"train_loss": -26.606679916381836, "global_step": 443478, "epoch": 5343} {"train_loss": -26.611066818237305, "global_step": 443479, "epoch": 5343} {"train_loss": -26.903364181518555, "global_step": 443480, "epoch": 5343} {"train_loss": -26.70318603515625, "global_step": 443481, "epoch": 5343} {"train_loss": -26.868139266967773, "global_step": 443482, "epoch": 5343} {"train_loss": -26.62758445739746, "global_step": 443483, "epoch": 5343} {"train_loss": -26.842117309570312, "global_step": 443484, "epoch": 5343} {"train_loss": -26.72711181640625, "global_step": 443485, "epoch": 5343} {"train_loss": -26.712818145751953, "global_step": 443486, "epoch": 5343} {"train_loss": -26.798736572265625, "global_step": 443487, "epoch": 5343} {"train_loss": -27.12446403503418, "global_step": 443488, "epoch": 5343} {"train_loss": -26.723913192749023, "global_step": 443489, "epoch": 5343} {"train_loss": -27.013751983642578, "global_step": 443490, "epoch": 5343} {"train_loss": -26.98740005493164, "global_step": 443491, "epoch": 5343} {"train_loss": -26.824909210205078, "global_step": 443492, "epoch": 5343} {"train_loss": -27.517866134643555, "global_step": 443493, "epoch": 5343} {"train_loss": -26.764663696289062, "global_step": 443494, "epoch": 5343} {"train_loss": -26.85396385192871, "global_step": 443495, "epoch": 5343} {"train_loss": -27.00298500061035, "global_step": 443496, "epoch": 5343} {"train_loss": -26.714263916015625, "global_step": 443497, "epoch": 5343} {"train_loss": -26.996179580688477, "global_step": 443498, "epoch": 5343} {"train_loss": -27.00261878967285, "global_step": 443499, "epoch": 5343} {"train_loss": -27.062580108642578, "global_step": 443500, "epoch": 5343} {"train_loss": -27.211780548095703, "global_step": 443501, "epoch": 5343} {"train_loss": -26.73237419128418, "global_step": 443502, "epoch": 5343} {"train_loss": -26.957534790039062, "global_step": 443503, "epoch": 5343} {"train_loss": -27.073877334594727, "global_step": 443504, "epoch": 5343} {"train_loss": -26.7289981842041, "global_step": 443505, "epoch": 5343} {"train_loss": -27.078113555908203, "global_step": 443506, "epoch": 5343} {"train_loss": -26.940399169921875, "global_step": 443507, "epoch": 5343} {"train_loss": -27.072208404541016, "global_step": 443508, "epoch": 5343} {"train_loss": -26.964872360229492, "global_step": 443509, "epoch": 5343} {"train_loss": -26.900604248046875, "global_step": 443510, "epoch": 5343} {"train_loss": -26.95073890686035, "global_step": 443511, "epoch": 5343} {"train_loss": -26.877826690673828, "global_step": 443512, "epoch": 5343} {"train_loss": -26.9090518951416, "global_step": 443513, "epoch": 5343} {"train_loss": -27.064899444580078, "global_step": 443514, "epoch": 5343} {"train_loss": -27.152359008789062, "global_step": 443515, "epoch": 5343} {"train_loss": -27.137409210205078, "global_step": 443516, "epoch": 5343} {"train_loss": -27.11566162109375, "global_step": 443517, "epoch": 5343} {"train_loss": -26.8763427734375, "global_step": 443518, "epoch": 5343} {"train_loss": -26.783538818359375, "global_step": 443519, "epoch": 5343} {"train_loss": -26.824369430541992, "global_step": 443520, "epoch": 5343} {"train_loss": -26.987049102783203, "global_step": 443521, "epoch": 5343} {"train_loss": -26.512908935546875, "global_step": 443522, "epoch": 5343} {"train_loss": -26.69169044494629, "global_step": 443523, "epoch": 5343} {"train_loss": -27.208179473876953, "global_step": 443524, "epoch": 5343} {"train_loss": -27.461633682250977, "global_step": 443525, "epoch": 5343} {"train_loss": -26.994592666625977, "global_step": 443526, "epoch": 5343} {"train_loss": -27.3792724609375, "global_step": 443527, "epoch": 5343} {"train_loss": -27.02923011779785, "global_step": 443528, "epoch": 5343} {"train_loss": -27.06977653503418, "global_step": 443529, "epoch": 5343} {"train_loss": -27.26715660095215, "global_step": 443530, "epoch": 5343} {"train_loss": -27.053735733032227, "global_step": 443531, "epoch": 5343} {"train_loss": -27.017791748046875, "global_step": 443532, "epoch": 5343} {"train_loss": -27.1309814453125, "global_step": 443533, "epoch": 5343} {"train_loss": -27.140119552612305, "global_step": 443534, "epoch": 5343} {"train_loss": -27.0942325592041, "global_step": 443535, "epoch": 5343} {"train_loss": -26.978137969970703, "global_step": 443536, "epoch": 5343} {"train_loss": -26.988279342651367, "global_step": 443537, "epoch": 5343} {"train_loss": -26.775598526000977, "global_step": 443538, "epoch": 5343} {"train_loss": -27.032373428344727, "global_step": 443539, "epoch": 5343} {"train_loss": -27.206878662109375, "global_step": 443540, "epoch": 5343} {"train_loss": -27.020414352416992, "global_step": 443541, "epoch": 5343} {"train_loss": -26.579132080078125, "global_step": 443542, "epoch": 5343} {"train_loss": -26.51849937438965, "global_step": 443543, "epoch": 5343} {"train_loss": -26.9948787689209, "global_step": 443544, "epoch": 5343} {"train_loss": -27.074792861938477, "global_step": 443545, "epoch": 5343} {"train_loss": -27.4293270111084, "global_step": 443546, "epoch": 5343} {"train_loss": -27.43255615234375, "global_step": 443547, "epoch": 5343} {"train_loss": -26.6494197845459, "global_step": 443548, "epoch": 5343} {"train_loss": -26.389493942260742, "global_step": 443549, "epoch": 5343} {"train_loss": -26.714941024780273, "global_step": 443550, "epoch": 5343} {"train_loss": -26.88411579361881, "global_step": 443551, "epoch": 5343, "val_loss": 6642385.0} {"train_loss": -25.38378143310547, "global_step": 443552, "epoch": 5344} {"train_loss": -23.977535247802734, "global_step": 443553, "epoch": 5344} {"train_loss": -23.98781394958496, "global_step": 443554, "epoch": 5344} {"train_loss": -25.6649169921875, "global_step": 443555, "epoch": 5344} {"train_loss": -24.598173141479492, "global_step": 443556, "epoch": 5344} {"train_loss": -25.778244018554688, "global_step": 443557, "epoch": 5344} {"train_loss": -25.450956344604492, "global_step": 443558, "epoch": 5344} {"train_loss": -25.562761306762695, "global_step": 443559, "epoch": 5344} {"train_loss": -25.94294548034668, "global_step": 443560, "epoch": 5344} {"train_loss": -25.748193740844727, "global_step": 443561, "epoch": 5344} {"train_loss": -25.500324249267578, "global_step": 443562, "epoch": 5344} {"train_loss": -26.078359603881836, "global_step": 443563, "epoch": 5344} {"train_loss": -26.170612335205078, "global_step": 443564, "epoch": 5344} {"train_loss": -26.085296630859375, "global_step": 443565, "epoch": 5344} {"train_loss": -25.71430015563965, "global_step": 443566, "epoch": 5344} {"train_loss": -26.10688591003418, "global_step": 443567, "epoch": 5344} {"train_loss": -26.4395809173584, "global_step": 443568, "epoch": 5344} {"train_loss": -25.851917266845703, "global_step": 443569, "epoch": 5344} {"train_loss": -26.039304733276367, "global_step": 443570, "epoch": 5344} {"train_loss": -26.404102325439453, "global_step": 443571, "epoch": 5344} {"train_loss": -26.513751983642578, "global_step": 443572, "epoch": 5344} {"train_loss": -26.003141403198242, "global_step": 443573, "epoch": 5344} {"train_loss": -26.240955352783203, "global_step": 443574, "epoch": 5344} {"train_loss": -26.46441078186035, "global_step": 443575, "epoch": 5344} {"train_loss": -26.59490394592285, "global_step": 443576, "epoch": 5344} {"train_loss": -26.48160743713379, "global_step": 443577, "epoch": 5344} {"train_loss": -26.550729751586914, "global_step": 443578, "epoch": 5344} {"train_loss": -26.571334838867188, "global_step": 443579, "epoch": 5344} {"train_loss": -26.577960968017578, "global_step": 443580, "epoch": 5344} {"train_loss": -26.6993408203125, "global_step": 443581, "epoch": 5344} {"train_loss": -26.573150634765625, "global_step": 443582, "epoch": 5344} {"train_loss": -26.647476196289062, "global_step": 443583, "epoch": 5344} {"train_loss": -26.917724609375, "global_step": 443584, "epoch": 5344} {"train_loss": -26.6517276763916, "global_step": 443585, "epoch": 5344} {"train_loss": -26.60379409790039, "global_step": 443586, "epoch": 5344} {"train_loss": -26.672733306884766, "global_step": 443587, "epoch": 5344} {"train_loss": -27.103565216064453, "global_step": 443588, "epoch": 5344} {"train_loss": -26.920148849487305, "global_step": 443589, "epoch": 5344} {"train_loss": -26.8179931640625, "global_step": 443590, "epoch": 5344} {"train_loss": -26.893177032470703, "global_step": 443591, "epoch": 5344} {"train_loss": -27.096363067626953, "global_step": 443592, "epoch": 5344} {"train_loss": -26.800052642822266, "global_step": 443593, "epoch": 5344} {"train_loss": -26.691028594970703, "global_step": 443594, "epoch": 5344} {"train_loss": -27.1484317779541, "global_step": 443595, "epoch": 5344} {"train_loss": -27.45159912109375, "global_step": 443596, "epoch": 5344} {"train_loss": -27.033267974853516, "global_step": 443597, "epoch": 5344} {"train_loss": -26.69809341430664, "global_step": 443598, "epoch": 5344} {"train_loss": -26.861541748046875, "global_step": 443599, "epoch": 5344} {"train_loss": -27.09259605407715, "global_step": 443600, "epoch": 5344} {"train_loss": -27.165876388549805, "global_step": 443601, "epoch": 5344} {"train_loss": -27.122556686401367, "global_step": 443602, "epoch": 5344} {"train_loss": -26.857147216796875, "global_step": 443603, "epoch": 5344} {"train_loss": -27.222375869750977, "global_step": 443604, "epoch": 5344} {"train_loss": -27.168231964111328, "global_step": 443605, "epoch": 5344} {"train_loss": -26.8081111907959, "global_step": 443606, "epoch": 5344} {"train_loss": -27.16143226623535, "global_step": 443607, "epoch": 5344} {"train_loss": -27.325180053710938, "global_step": 443608, "epoch": 5344} {"train_loss": -27.23475456237793, "global_step": 443609, "epoch": 5344} {"train_loss": -27.095294952392578, "global_step": 443610, "epoch": 5344} {"train_loss": -26.789264678955078, "global_step": 443611, "epoch": 5344} {"train_loss": -27.082645416259766, "global_step": 443612, "epoch": 5344} {"train_loss": -26.9361572265625, "global_step": 443613, "epoch": 5344} {"train_loss": -27.18672752380371, "global_step": 443614, "epoch": 5344} {"train_loss": -27.065128326416016, "global_step": 443615, "epoch": 5344} {"train_loss": -26.78363037109375, "global_step": 443616, "epoch": 5344} {"train_loss": -27.023523330688477, "global_step": 443617, "epoch": 5344} {"train_loss": -27.012998580932617, "global_step": 443618, "epoch": 5344} {"train_loss": -26.853857040405273, "global_step": 443619, "epoch": 5344} {"train_loss": -26.9119815826416, "global_step": 443620, "epoch": 5344} {"train_loss": -27.3248348236084, "global_step": 443621, "epoch": 5344} {"train_loss": -26.823776245117188, "global_step": 443622, "epoch": 5344} {"train_loss": -27.0206241607666, "global_step": 443623, "epoch": 5344} {"train_loss": -27.17353630065918, "global_step": 443624, "epoch": 5344} {"train_loss": -27.529027938842773, "global_step": 443625, "epoch": 5344} {"train_loss": -27.31340980529785, "global_step": 443626, "epoch": 5344} {"train_loss": -27.355310440063477, "global_step": 443627, "epoch": 5344} {"train_loss": -27.45606803894043, "global_step": 443628, "epoch": 5344} {"train_loss": -27.1822566986084, "global_step": 443629, "epoch": 5344} {"train_loss": -27.088476181030273, "global_step": 443630, "epoch": 5344} {"train_loss": -27.187137603759766, "global_step": 443631, "epoch": 5344} {"train_loss": -26.988744735717773, "global_step": 443632, "epoch": 5344} {"train_loss": -27.349531173706055, "global_step": 443633, "epoch": 5344} {"train_loss": -26.614397393651757, "global_step": 443634, "epoch": 5344, "val_loss": 6624039.0} {"train_loss": -25.776769638061523, "global_step": 443635, "epoch": 5345} {"train_loss": -25.949783325195312, "global_step": 443636, "epoch": 5345} {"train_loss": -25.455265045166016, "global_step": 443637, "epoch": 5345} {"train_loss": -25.369112014770508, "global_step": 443638, "epoch": 5345} {"train_loss": -26.825361251831055, "global_step": 443639, "epoch": 5345} {"train_loss": -25.493131637573242, "global_step": 443640, "epoch": 5345} {"train_loss": -26.65557861328125, "global_step": 443641, "epoch": 5345} {"train_loss": -26.23993492126465, "global_step": 443642, "epoch": 5345} {"train_loss": -26.35853385925293, "global_step": 443643, "epoch": 5345} {"train_loss": -26.5589542388916, "global_step": 443644, "epoch": 5345} {"train_loss": -26.979572296142578, "global_step": 443645, "epoch": 5345} {"train_loss": -26.87044334411621, "global_step": 443646, "epoch": 5345} {"train_loss": -26.3123836517334, "global_step": 443647, "epoch": 5345} {"train_loss": -26.684431076049805, "global_step": 443648, "epoch": 5345} {"train_loss": -26.616621017456055, "global_step": 443649, "epoch": 5345} {"train_loss": -26.24140739440918, "global_step": 443650, "epoch": 5345} {"train_loss": -26.88335609436035, "global_step": 443651, "epoch": 5345} {"train_loss": -26.316913604736328, "global_step": 443652, "epoch": 5345} {"train_loss": -26.63071632385254, "global_step": 443653, "epoch": 5345} {"train_loss": -26.791269302368164, "global_step": 443654, "epoch": 5345} {"train_loss": -26.570907592773438, "global_step": 443655, "epoch": 5345} {"train_loss": -26.496549606323242, "global_step": 443656, "epoch": 5345} {"train_loss": -26.50896644592285, "global_step": 443657, "epoch": 5345} {"train_loss": -26.811132431030273, "global_step": 443658, "epoch": 5345} {"train_loss": -26.820560455322266, "global_step": 443659, "epoch": 5345} {"train_loss": -26.55427360534668, "global_step": 443660, "epoch": 5345} {"train_loss": -26.332202911376953, "global_step": 443661, "epoch": 5345} {"train_loss": -26.788055419921875, "global_step": 443662, "epoch": 5345} {"train_loss": -26.95051383972168, "global_step": 443663, "epoch": 5345} {"train_loss": -26.723844528198242, "global_step": 443664, "epoch": 5345} {"train_loss": -26.53688621520996, "global_step": 443665, "epoch": 5345} {"train_loss": -26.745227813720703, "global_step": 443666, "epoch": 5345} {"train_loss": -27.117910385131836, "global_step": 443667, "epoch": 5345} {"train_loss": -26.95965003967285, "global_step": 443668, "epoch": 5345} {"train_loss": -26.70476722717285, "global_step": 443669, "epoch": 5345} {"train_loss": -27.1687068939209, "global_step": 443670, "epoch": 5345} {"train_loss": -26.690927505493164, "global_step": 443671, "epoch": 5345} {"train_loss": -27.088735580444336, "global_step": 443672, "epoch": 5345} {"train_loss": -27.0891056060791, "global_step": 443673, "epoch": 5345} {"train_loss": -27.145349502563477, "global_step": 443674, "epoch": 5345} {"train_loss": -27.15921974182129, "global_step": 443675, "epoch": 5345} {"train_loss": -27.069971084594727, "global_step": 443676, "epoch": 5345} {"train_loss": -27.095731735229492, "global_step": 443677, "epoch": 5345} {"train_loss": -27.14702796936035, "global_step": 443678, "epoch": 5345} {"train_loss": -27.059560775756836, "global_step": 443679, "epoch": 5345} {"train_loss": -26.87188720703125, "global_step": 443680, "epoch": 5345} {"train_loss": -27.279129028320312, "global_step": 443681, "epoch": 5345} {"train_loss": -26.98834800720215, "global_step": 443682, "epoch": 5345} {"train_loss": -27.353641510009766, "global_step": 443683, "epoch": 5345} {"train_loss": -26.747644424438477, "global_step": 443684, "epoch": 5345} {"train_loss": -27.044971466064453, "global_step": 443685, "epoch": 5345} {"train_loss": -27.291982650756836, "global_step": 443686, "epoch": 5345} {"train_loss": -27.36163902282715, "global_step": 443687, "epoch": 5345} {"train_loss": -27.100080490112305, "global_step": 443688, "epoch": 5345} {"train_loss": -27.020727157592773, "global_step": 443689, "epoch": 5345} {"train_loss": -27.065078735351562, "global_step": 443690, "epoch": 5345} {"train_loss": -26.906713485717773, "global_step": 443691, "epoch": 5345} {"train_loss": -26.882343292236328, "global_step": 443692, "epoch": 5345} {"train_loss": -26.79440689086914, "global_step": 443693, "epoch": 5345} {"train_loss": -27.31361198425293, "global_step": 443694, "epoch": 5345} {"train_loss": -27.344953536987305, "global_step": 443695, "epoch": 5345} {"train_loss": -26.973325729370117, "global_step": 443696, "epoch": 5345} {"train_loss": -27.43230628967285, "global_step": 443697, "epoch": 5345} {"train_loss": -27.165939331054688, "global_step": 443698, "epoch": 5345} {"train_loss": -27.1242618560791, "global_step": 443699, "epoch": 5345} {"train_loss": -27.40625, "global_step": 443700, "epoch": 5345} {"train_loss": -26.60679054260254, "global_step": 443701, "epoch": 5345} {"train_loss": -26.78656005859375, "global_step": 443702, "epoch": 5345} {"train_loss": -27.0489444732666, "global_step": 443703, "epoch": 5345} {"train_loss": -27.12506675720215, "global_step": 443704, "epoch": 5345} {"train_loss": -26.84151268005371, "global_step": 443705, "epoch": 5345} {"train_loss": -27.029987335205078, "global_step": 443706, "epoch": 5345} {"train_loss": -26.67824363708496, "global_step": 443707, "epoch": 5345} {"train_loss": -26.745487213134766, "global_step": 443708, "epoch": 5345} {"train_loss": -26.380924224853516, "global_step": 443709, "epoch": 5345} {"train_loss": -26.584583282470703, "global_step": 443710, "epoch": 5345} {"train_loss": -26.894702911376953, "global_step": 443711, "epoch": 5345} {"train_loss": -26.9409122467041, "global_step": 443712, "epoch": 5345} {"train_loss": -26.883771896362305, "global_step": 443713, "epoch": 5345} {"train_loss": -26.868900299072266, "global_step": 443714, "epoch": 5345} {"train_loss": -26.7431697845459, "global_step": 443715, "epoch": 5345} {"train_loss": -26.615198135375977, "global_step": 443716, "epoch": 5345} {"train_loss": -26.780962335058007, "global_step": 443717, "epoch": 5345, "val_loss": 6657081.5} {"train_loss": -26.167577743530273, "global_step": 443718, "epoch": 5346} {"train_loss": -25.766019821166992, "global_step": 443719, "epoch": 5346} {"train_loss": -26.445138931274414, "global_step": 443720, "epoch": 5346} {"train_loss": -26.429529190063477, "global_step": 443721, "epoch": 5346} {"train_loss": -26.81361198425293, "global_step": 443722, "epoch": 5346} {"train_loss": -26.607282638549805, "global_step": 443723, "epoch": 5346} {"train_loss": -26.445545196533203, "global_step": 443724, "epoch": 5346} {"train_loss": -26.99517250061035, "global_step": 443725, "epoch": 5346} {"train_loss": -26.80164909362793, "global_step": 443726, "epoch": 5346} {"train_loss": -26.65673828125, "global_step": 443727, "epoch": 5346} {"train_loss": -26.394001007080078, "global_step": 443728, "epoch": 5346} {"train_loss": -26.450000762939453, "global_step": 443729, "epoch": 5346} {"train_loss": -26.811399459838867, "global_step": 443730, "epoch": 5346} {"train_loss": -26.573591232299805, "global_step": 443731, "epoch": 5346} {"train_loss": -26.7824649810791, "global_step": 443732, "epoch": 5346} {"train_loss": -27.063724517822266, "global_step": 443733, "epoch": 5346} {"train_loss": -26.635663986206055, "global_step": 443734, "epoch": 5346} {"train_loss": -26.849903106689453, "global_step": 443735, "epoch": 5346} {"train_loss": -26.871185302734375, "global_step": 443736, "epoch": 5346} {"train_loss": -26.543237686157227, "global_step": 443737, "epoch": 5346} {"train_loss": -26.779516220092773, "global_step": 443738, "epoch": 5346} {"train_loss": -27.046911239624023, "global_step": 443739, "epoch": 5346} {"train_loss": -26.853363037109375, "global_step": 443740, "epoch": 5346} {"train_loss": -26.942626953125, "global_step": 443741, "epoch": 5346} {"train_loss": -26.469467163085938, "global_step": 443742, "epoch": 5346} {"train_loss": -26.81292724609375, "global_step": 443743, "epoch": 5346} {"train_loss": -26.570249557495117, "global_step": 443744, "epoch": 5346} {"train_loss": -26.862167358398438, "global_step": 443745, "epoch": 5346} {"train_loss": -26.56744956970215, "global_step": 443746, "epoch": 5346} {"train_loss": -26.71485710144043, "global_step": 443747, "epoch": 5346} {"train_loss": -26.734527587890625, "global_step": 443748, "epoch": 5346} {"train_loss": -27.202787399291992, "global_step": 443749, "epoch": 5346} {"train_loss": -26.54591941833496, "global_step": 443750, "epoch": 5346} {"train_loss": -27.10409927368164, "global_step": 443751, "epoch": 5346} {"train_loss": -26.997928619384766, "global_step": 443752, "epoch": 5346} {"train_loss": -26.633771896362305, "global_step": 443753, "epoch": 5346} {"train_loss": -26.886798858642578, "global_step": 443754, "epoch": 5346} {"train_loss": -26.83475685119629, "global_step": 443755, "epoch": 5346} {"train_loss": -26.8779354095459, "global_step": 443756, "epoch": 5346} {"train_loss": -26.68629264831543, "global_step": 443757, "epoch": 5346} {"train_loss": -26.597064971923828, "global_step": 443758, "epoch": 5346} {"train_loss": -26.63912010192871, "global_step": 443759, "epoch": 5346} {"train_loss": -26.87831687927246, "global_step": 443760, "epoch": 5346} {"train_loss": -27.259855270385742, "global_step": 443761, "epoch": 5346} {"train_loss": -26.930246353149414, "global_step": 443762, "epoch": 5346} {"train_loss": -27.07486915588379, "global_step": 443763, "epoch": 5346} {"train_loss": -27.09918212890625, "global_step": 443764, "epoch": 5346} {"train_loss": -26.544736862182617, "global_step": 443765, "epoch": 5346} {"train_loss": -27.216318130493164, "global_step": 443766, "epoch": 5346} {"train_loss": -26.969833374023438, "global_step": 443767, "epoch": 5346} {"train_loss": -26.89841079711914, "global_step": 443768, "epoch": 5346} {"train_loss": -27.245874404907227, "global_step": 443769, "epoch": 5346} {"train_loss": -27.0113582611084, "global_step": 443770, "epoch": 5346} {"train_loss": -27.35627555847168, "global_step": 443771, "epoch": 5346} {"train_loss": -26.64312171936035, "global_step": 443772, "epoch": 5346} {"train_loss": -27.105350494384766, "global_step": 443773, "epoch": 5346} {"train_loss": -27.106489181518555, "global_step": 443774, "epoch": 5346} {"train_loss": -27.051023483276367, "global_step": 443775, "epoch": 5346} {"train_loss": -27.27692985534668, "global_step": 443776, "epoch": 5346} {"train_loss": -27.285314559936523, "global_step": 443777, "epoch": 5346} {"train_loss": -27.29379653930664, "global_step": 443778, "epoch": 5346} {"train_loss": -26.476709365844727, "global_step": 443779, "epoch": 5346} {"train_loss": -26.741178512573242, "global_step": 443780, "epoch": 5346} {"train_loss": -27.080398559570312, "global_step": 443781, "epoch": 5346} {"train_loss": -26.659238815307617, "global_step": 443782, "epoch": 5346} {"train_loss": -27.079334259033203, "global_step": 443783, "epoch": 5346} {"train_loss": -26.940704345703125, "global_step": 443784, "epoch": 5346} {"train_loss": -27.263525009155273, "global_step": 443785, "epoch": 5346} {"train_loss": -27.028608322143555, "global_step": 443786, "epoch": 5346} {"train_loss": -27.185684204101562, "global_step": 443787, "epoch": 5346} {"train_loss": -27.264673233032227, "global_step": 443788, "epoch": 5346} {"train_loss": -27.157896041870117, "global_step": 443789, "epoch": 5346} {"train_loss": -26.806501388549805, "global_step": 443790, "epoch": 5346} {"train_loss": -26.925058364868164, "global_step": 443791, "epoch": 5346} {"train_loss": -27.20890235900879, "global_step": 443792, "epoch": 5346} {"train_loss": -27.06040382385254, "global_step": 443793, "epoch": 5346} {"train_loss": -27.59809684753418, "global_step": 443794, "epoch": 5346} {"train_loss": -27.058027267456055, "global_step": 443795, "epoch": 5346} {"train_loss": -26.97797966003418, "global_step": 443796, "epoch": 5346} {"train_loss": -27.49496841430664, "global_step": 443797, "epoch": 5346} {"train_loss": -27.084781646728516, "global_step": 443798, "epoch": 5346} {"train_loss": -26.919178009033203, "global_step": 443799, "epoch": 5346} {"train_loss": -26.898708320525756, "global_step": 443800, "epoch": 5346, "val_loss": 6571361.5} {"train_loss": -26.514623641967773, "global_step": 443801, "epoch": 5347} {"train_loss": -25.433366775512695, "global_step": 443802, "epoch": 5347} {"train_loss": -25.183759689331055, "global_step": 443803, "epoch": 5347} {"train_loss": -24.83057975769043, "global_step": 443804, "epoch": 5347} {"train_loss": -24.757526397705078, "global_step": 443805, "epoch": 5347} {"train_loss": -24.659461975097656, "global_step": 443806, "epoch": 5347} {"train_loss": -26.139036178588867, "global_step": 443807, "epoch": 5347} {"train_loss": -25.47005271911621, "global_step": 443808, "epoch": 5347} {"train_loss": -26.247455596923828, "global_step": 443809, "epoch": 5347} {"train_loss": -25.839269638061523, "global_step": 443810, "epoch": 5347} {"train_loss": -26.250289916992188, "global_step": 443811, "epoch": 5347} {"train_loss": -26.202184677124023, "global_step": 443812, "epoch": 5347} {"train_loss": -26.205856323242188, "global_step": 443813, "epoch": 5347} {"train_loss": -26.391992568969727, "global_step": 443814, "epoch": 5347} {"train_loss": -26.521072387695312, "global_step": 443815, "epoch": 5347} {"train_loss": -26.20722770690918, "global_step": 443816, "epoch": 5347} {"train_loss": -26.67902946472168, "global_step": 443817, "epoch": 5347} {"train_loss": -26.701709747314453, "global_step": 443818, "epoch": 5347} {"train_loss": -26.802419662475586, "global_step": 443819, "epoch": 5347} {"train_loss": -26.628198623657227, "global_step": 443820, "epoch": 5347} {"train_loss": -26.330280303955078, "global_step": 443821, "epoch": 5347} {"train_loss": -26.7484188079834, "global_step": 443822, "epoch": 5347} {"train_loss": -26.2428035736084, "global_step": 443823, "epoch": 5347} {"train_loss": -26.74912452697754, "global_step": 443824, "epoch": 5347} {"train_loss": -27.2080078125, "global_step": 443825, "epoch": 5347} {"train_loss": -26.769485473632812, "global_step": 443826, "epoch": 5347} {"train_loss": -26.645782470703125, "global_step": 443827, "epoch": 5347} {"train_loss": -27.064069747924805, "global_step": 443828, "epoch": 5347} {"train_loss": -26.613636016845703, "global_step": 443829, "epoch": 5347} {"train_loss": -26.91261100769043, "global_step": 443830, "epoch": 5347} {"train_loss": -26.753034591674805, "global_step": 443831, "epoch": 5347} {"train_loss": -26.551929473876953, "global_step": 443832, "epoch": 5347} {"train_loss": -26.751001358032227, "global_step": 443833, "epoch": 5347} {"train_loss": -26.90597915649414, "global_step": 443834, "epoch": 5347} {"train_loss": -27.011463165283203, "global_step": 443835, "epoch": 5347} {"train_loss": -26.861921310424805, "global_step": 443836, "epoch": 5347} {"train_loss": -27.3076114654541, "global_step": 443837, "epoch": 5347} {"train_loss": -27.059125900268555, "global_step": 443838, "epoch": 5347} {"train_loss": -27.322498321533203, "global_step": 443839, "epoch": 5347} {"train_loss": -26.909503936767578, "global_step": 443840, "epoch": 5347} {"train_loss": -27.40900993347168, "global_step": 443841, "epoch": 5347} {"train_loss": -27.060800552368164, "global_step": 443842, "epoch": 5347} {"train_loss": -27.076398849487305, "global_step": 443843, "epoch": 5347} {"train_loss": -26.84396743774414, "global_step": 443844, "epoch": 5347} {"train_loss": -26.781757354736328, "global_step": 443845, "epoch": 5347} {"train_loss": -27.14287757873535, "global_step": 443846, "epoch": 5347} {"train_loss": -26.745542526245117, "global_step": 443847, "epoch": 5347} {"train_loss": -26.986099243164062, "global_step": 443848, "epoch": 5347} {"train_loss": -26.897052764892578, "global_step": 443849, "epoch": 5347} {"train_loss": -26.987079620361328, "global_step": 443850, "epoch": 5347} {"train_loss": -27.389020919799805, "global_step": 443851, "epoch": 5347} {"train_loss": -27.2186222076416, "global_step": 443852, "epoch": 5347} {"train_loss": -27.66974449157715, "global_step": 443853, "epoch": 5347} {"train_loss": -27.27509117126465, "global_step": 443854, "epoch": 5347} {"train_loss": -27.12550163269043, "global_step": 443855, "epoch": 5347} {"train_loss": -27.202611923217773, "global_step": 443856, "epoch": 5347} {"train_loss": -26.924442291259766, "global_step": 443857, "epoch": 5347} {"train_loss": -27.137582778930664, "global_step": 443858, "epoch": 5347} {"train_loss": -27.311120986938477, "global_step": 443859, "epoch": 5347} {"train_loss": -26.78129005432129, "global_step": 443860, "epoch": 5347} {"train_loss": -27.002965927124023, "global_step": 443861, "epoch": 5347} {"train_loss": -27.13812828063965, "global_step": 443862, "epoch": 5347} {"train_loss": -27.201217651367188, "global_step": 443863, "epoch": 5347} {"train_loss": -27.13453483581543, "global_step": 443864, "epoch": 5347} {"train_loss": -26.9320068359375, "global_step": 443865, "epoch": 5347} {"train_loss": -27.240095138549805, "global_step": 443866, "epoch": 5347} {"train_loss": -27.193500518798828, "global_step": 443867, "epoch": 5347} {"train_loss": -27.412555694580078, "global_step": 443868, "epoch": 5347} {"train_loss": -27.102313995361328, "global_step": 443869, "epoch": 5347} {"train_loss": -27.117277145385742, "global_step": 443870, "epoch": 5347} {"train_loss": -27.530872344970703, "global_step": 443871, "epoch": 5347} {"train_loss": -27.200803756713867, "global_step": 443872, "epoch": 5347} {"train_loss": -26.838552474975586, "global_step": 443873, "epoch": 5347} {"train_loss": -27.181737899780273, "global_step": 443874, "epoch": 5347} {"train_loss": -26.4976749420166, "global_step": 443875, "epoch": 5347} {"train_loss": -27.11334228515625, "global_step": 443876, "epoch": 5347} {"train_loss": -27.02422523498535, "global_step": 443877, "epoch": 5347} {"train_loss": -27.15985679626465, "global_step": 443878, "epoch": 5347} {"train_loss": -27.220264434814453, "global_step": 443879, "epoch": 5347} {"train_loss": -26.907453536987305, "global_step": 443880, "epoch": 5347} {"train_loss": -27.242773056030273, "global_step": 443881, "epoch": 5347} {"train_loss": -27.13006591796875, "global_step": 443882, "epoch": 5347} {"train_loss": -26.771458016820702, "global_step": 443883, "epoch": 5347, "val_loss": 6592811.5} {"train_loss": -26.32587242126465, "global_step": 443884, "epoch": 5348} {"train_loss": -25.415735244750977, "global_step": 443885, "epoch": 5348} {"train_loss": -26.536100387573242, "global_step": 443886, "epoch": 5348} {"train_loss": -26.982105255126953, "global_step": 443887, "epoch": 5348} {"train_loss": -26.608001708984375, "global_step": 443888, "epoch": 5348} {"train_loss": -26.560815811157227, "global_step": 443889, "epoch": 5348} {"train_loss": -26.741596221923828, "global_step": 443890, "epoch": 5348} {"train_loss": -26.9741153717041, "global_step": 443891, "epoch": 5348} {"train_loss": -26.213220596313477, "global_step": 443892, "epoch": 5348} {"train_loss": -26.566761016845703, "global_step": 443893, "epoch": 5348} {"train_loss": -26.246997833251953, "global_step": 443894, "epoch": 5348} {"train_loss": -26.89069175720215, "global_step": 443895, "epoch": 5348} {"train_loss": -26.216150283813477, "global_step": 443896, "epoch": 5348} {"train_loss": -26.72539710998535, "global_step": 443897, "epoch": 5348} {"train_loss": -26.431427001953125, "global_step": 443898, "epoch": 5348} {"train_loss": -27.0423641204834, "global_step": 443899, "epoch": 5348} {"train_loss": -26.640522003173828, "global_step": 443900, "epoch": 5348} {"train_loss": -26.727567672729492, "global_step": 443901, "epoch": 5348} {"train_loss": -27.02750587463379, "global_step": 443902, "epoch": 5348} {"train_loss": -26.73121452331543, "global_step": 443903, "epoch": 5348} {"train_loss": -26.63749122619629, "global_step": 443904, "epoch": 5348} {"train_loss": -26.75028419494629, "global_step": 443905, "epoch": 5348} {"train_loss": -26.539587020874023, "global_step": 443906, "epoch": 5348} {"train_loss": -26.75288200378418, "global_step": 443907, "epoch": 5348} {"train_loss": -27.1540584564209, "global_step": 443908, "epoch": 5348} {"train_loss": -26.97781753540039, "global_step": 443909, "epoch": 5348} {"train_loss": -27.019351959228516, "global_step": 443910, "epoch": 5348} {"train_loss": -27.0284423828125, "global_step": 443911, "epoch": 5348} {"train_loss": -27.005102157592773, "global_step": 443912, "epoch": 5348} {"train_loss": -27.04483413696289, "global_step": 443913, "epoch": 5348} {"train_loss": -26.79963493347168, "global_step": 443914, "epoch": 5348} {"train_loss": -27.051603317260742, "global_step": 443915, "epoch": 5348} {"train_loss": -26.83306884765625, "global_step": 443916, "epoch": 5348} {"train_loss": -27.04851722717285, "global_step": 443917, "epoch": 5348} {"train_loss": -27.251800537109375, "global_step": 443918, "epoch": 5348} {"train_loss": -26.815378189086914, "global_step": 443919, "epoch": 5348} {"train_loss": -27.348066329956055, "global_step": 443920, "epoch": 5348} {"train_loss": -27.126638412475586, "global_step": 443921, "epoch": 5348} {"train_loss": -27.368167877197266, "global_step": 443922, "epoch": 5348} {"train_loss": -27.167219161987305, "global_step": 443923, "epoch": 5348} {"train_loss": -26.858673095703125, "global_step": 443924, "epoch": 5348} {"train_loss": -26.917600631713867, "global_step": 443925, "epoch": 5348} {"train_loss": -27.127283096313477, "global_step": 443926, "epoch": 5348} {"train_loss": -27.361806869506836, "global_step": 443927, "epoch": 5348} {"train_loss": -27.310184478759766, "global_step": 443928, "epoch": 5348} {"train_loss": -27.469268798828125, "global_step": 443929, "epoch": 5348} {"train_loss": -27.1457462310791, "global_step": 443930, "epoch": 5348} {"train_loss": -27.100744247436523, "global_step": 443931, "epoch": 5348} {"train_loss": -27.07940101623535, "global_step": 443932, "epoch": 5348} {"train_loss": -27.146081924438477, "global_step": 443933, "epoch": 5348} {"train_loss": -27.3373966217041, "global_step": 443934, "epoch": 5348} {"train_loss": -27.082305908203125, "global_step": 443935, "epoch": 5348} {"train_loss": -27.235929489135742, "global_step": 443936, "epoch": 5348} {"train_loss": -27.047391891479492, "global_step": 443937, "epoch": 5348} {"train_loss": -26.7985897064209, "global_step": 443938, "epoch": 5348} {"train_loss": -27.087432861328125, "global_step": 443939, "epoch": 5348} {"train_loss": -26.968887329101562, "global_step": 443940, "epoch": 5348} {"train_loss": -27.199243545532227, "global_step": 443941, "epoch": 5348} {"train_loss": -27.54827880859375, "global_step": 443942, "epoch": 5348} {"train_loss": -27.27760124206543, "global_step": 443943, "epoch": 5348} {"train_loss": -26.8474063873291, "global_step": 443944, "epoch": 5348} {"train_loss": -26.736478805541992, "global_step": 443945, "epoch": 5348} {"train_loss": -26.458417892456055, "global_step": 443946, "epoch": 5348} {"train_loss": -26.751209259033203, "global_step": 443947, "epoch": 5348} {"train_loss": -27.036874771118164, "global_step": 443948, "epoch": 5348} {"train_loss": -26.769458770751953, "global_step": 443949, "epoch": 5348} {"train_loss": -27.038217544555664, "global_step": 443950, "epoch": 5348} {"train_loss": -26.62091064453125, "global_step": 443951, "epoch": 5348} {"train_loss": -26.818403244018555, "global_step": 443952, "epoch": 5348} {"train_loss": -26.968036651611328, "global_step": 443953, "epoch": 5348} {"train_loss": -26.445545196533203, "global_step": 443954, "epoch": 5348} {"train_loss": -26.946918487548828, "global_step": 443955, "epoch": 5348} {"train_loss": -26.668426513671875, "global_step": 443956, "epoch": 5348} {"train_loss": -26.542255401611328, "global_step": 443957, "epoch": 5348} {"train_loss": -26.65801429748535, "global_step": 443958, "epoch": 5348} {"train_loss": -26.859968185424805, "global_step": 443959, "epoch": 5348} {"train_loss": -26.1221923828125, "global_step": 443960, "epoch": 5348} {"train_loss": -27.235260009765625, "global_step": 443961, "epoch": 5348} {"train_loss": -27.173093795776367, "global_step": 443962, "epoch": 5348} {"train_loss": -26.57275390625, "global_step": 443963, "epoch": 5348} {"train_loss": -26.661304473876953, "global_step": 443964, "epoch": 5348} {"train_loss": -27.048887252807617, "global_step": 443965, "epoch": 5348} {"train_loss": -26.87084317494588, "global_step": 443966, "epoch": 5348, "val_loss": 6522532.0} {"train_loss": -26.549243927001953, "global_step": 443967, "epoch": 5349} {"train_loss": -26.156360626220703, "global_step": 443968, "epoch": 5349} {"train_loss": -26.488479614257812, "global_step": 443969, "epoch": 5349} {"train_loss": -26.53683853149414, "global_step": 443970, "epoch": 5349} {"train_loss": -26.170087814331055, "global_step": 443971, "epoch": 5349} {"train_loss": -25.949848175048828, "global_step": 443972, "epoch": 5349} {"train_loss": -26.683958053588867, "global_step": 443973, "epoch": 5349} {"train_loss": -26.697473526000977, "global_step": 443974, "epoch": 5349} {"train_loss": -26.402099609375, "global_step": 443975, "epoch": 5349} {"train_loss": -26.83603858947754, "global_step": 443976, "epoch": 5349} {"train_loss": -26.905241012573242, "global_step": 443977, "epoch": 5349} {"train_loss": -26.500507354736328, "global_step": 443978, "epoch": 5349} {"train_loss": -26.620046615600586, "global_step": 443979, "epoch": 5349} {"train_loss": -26.529382705688477, "global_step": 443980, "epoch": 5349} {"train_loss": -27.005786895751953, "global_step": 443981, "epoch": 5349} {"train_loss": -26.590560913085938, "global_step": 443982, "epoch": 5349} {"train_loss": -26.861724853515625, "global_step": 443983, "epoch": 5349} {"train_loss": -26.70658302307129, "global_step": 443984, "epoch": 5349} {"train_loss": -26.7377872467041, "global_step": 443985, "epoch": 5349} {"train_loss": -26.77216911315918, "global_step": 443986, "epoch": 5349} {"train_loss": -26.402631759643555, "global_step": 443987, "epoch": 5349} {"train_loss": -26.857257843017578, "global_step": 443988, "epoch": 5349} {"train_loss": -26.54638671875, "global_step": 443989, "epoch": 5349} {"train_loss": -26.911212921142578, "global_step": 443990, "epoch": 5349} {"train_loss": -27.016895294189453, "global_step": 443991, "epoch": 5349} {"train_loss": -26.922534942626953, "global_step": 443992, "epoch": 5349} {"train_loss": -27.079763412475586, "global_step": 443993, "epoch": 5349} {"train_loss": -26.878637313842773, "global_step": 443994, "epoch": 5349} {"train_loss": -26.859411239624023, "global_step": 443995, "epoch": 5349} {"train_loss": -27.02860450744629, "global_step": 443996, "epoch": 5349} {"train_loss": -26.880884170532227, "global_step": 443997, "epoch": 5349} {"train_loss": -27.261337280273438, "global_step": 443998, "epoch": 5349} {"train_loss": -26.824783325195312, "global_step": 443999, "epoch": 5349} {"train_loss": -26.704303741455078, "global_step": 444000, "epoch": 5349} {"train_loss": -27.541540145874023, "global_step": 444001, "epoch": 5349} {"train_loss": -27.25959587097168, "global_step": 444002, "epoch": 5349} {"train_loss": -27.468393325805664, "global_step": 444003, "epoch": 5349} {"train_loss": -27.052978515625, "global_step": 444004, "epoch": 5349} {"train_loss": -27.064319610595703, "global_step": 444005, "epoch": 5349} {"train_loss": -27.080780029296875, "global_step": 444006, "epoch": 5349} {"train_loss": -27.262006759643555, "global_step": 444007, "epoch": 5349} {"train_loss": -26.982019424438477, "global_step": 444008, "epoch": 5349} {"train_loss": -27.21063232421875, "global_step": 444009, "epoch": 5349} {"train_loss": -27.14023780822754, "global_step": 444010, "epoch": 5349} {"train_loss": -27.107328414916992, "global_step": 444011, "epoch": 5349} {"train_loss": -27.213300704956055, "global_step": 444012, "epoch": 5349} {"train_loss": -27.512226104736328, "global_step": 444013, "epoch": 5349} {"train_loss": -27.047977447509766, "global_step": 444014, "epoch": 5349} {"train_loss": -26.860595703125, "global_step": 444015, "epoch": 5349} {"train_loss": -27.008020401000977, "global_step": 444016, "epoch": 5349} {"train_loss": -27.15278434753418, "global_step": 444017, "epoch": 5349} {"train_loss": -27.41390037536621, "global_step": 444018, "epoch": 5349} {"train_loss": -26.936826705932617, "global_step": 444019, "epoch": 5349} {"train_loss": -26.904333114624023, "global_step": 444020, "epoch": 5349} {"train_loss": -27.050525665283203, "global_step": 444021, "epoch": 5349} {"train_loss": -27.1462345123291, "global_step": 444022, "epoch": 5349} {"train_loss": -26.930627822875977, "global_step": 444023, "epoch": 5349} {"train_loss": -27.600011825561523, "global_step": 444024, "epoch": 5349} {"train_loss": -27.10637855529785, "global_step": 444025, "epoch": 5349} {"train_loss": -26.83601188659668, "global_step": 444026, "epoch": 5349} {"train_loss": -27.002283096313477, "global_step": 444027, "epoch": 5349} {"train_loss": -27.15997314453125, "global_step": 444028, "epoch": 5349} {"train_loss": -27.48382568359375, "global_step": 444029, "epoch": 5349} {"train_loss": -27.299407958984375, "global_step": 444030, "epoch": 5349} {"train_loss": -26.749303817749023, "global_step": 444031, "epoch": 5349} {"train_loss": -26.877593994140625, "global_step": 444032, "epoch": 5349} {"train_loss": -27.0639591217041, "global_step": 444033, "epoch": 5349} {"train_loss": -27.128942489624023, "global_step": 444034, "epoch": 5349} {"train_loss": -27.078327178955078, "global_step": 444035, "epoch": 5349} {"train_loss": -27.36771011352539, "global_step": 444036, "epoch": 5349} {"train_loss": -27.533544540405273, "global_step": 444037, "epoch": 5349} {"train_loss": -27.31268310546875, "global_step": 444038, "epoch": 5349} {"train_loss": -26.80367088317871, "global_step": 444039, "epoch": 5349} {"train_loss": -26.729101181030273, "global_step": 444040, "epoch": 5349} {"train_loss": -27.205371856689453, "global_step": 444041, "epoch": 5349} {"train_loss": -26.719985961914062, "global_step": 444042, "epoch": 5349} {"train_loss": -26.837238311767578, "global_step": 444043, "epoch": 5349} {"train_loss": -27.07988929748535, "global_step": 444044, "epoch": 5349} {"train_loss": -26.94459342956543, "global_step": 444045, "epoch": 5349} {"train_loss": -27.086889266967773, "global_step": 444046, "epoch": 5349} {"train_loss": -26.83098793029785, "global_step": 444047, "epoch": 5349} {"train_loss": -26.9647216796875, "global_step": 444048, "epoch": 5349} {"train_loss": -26.94650695984622, "global_step": 444049, "epoch": 5349, "val_loss": 6599770.5} {"train_loss": -26.907468795776367, "global_step": 444050, "epoch": 5350} {"train_loss": -26.81280517578125, "global_step": 444051, "epoch": 5350} {"train_loss": -26.696949005126953, "global_step": 444052, "epoch": 5350} {"train_loss": -26.851022720336914, "global_step": 444053, "epoch": 5350} {"train_loss": -26.218698501586914, "global_step": 444054, "epoch": 5350} {"train_loss": -26.013391494750977, "global_step": 444055, "epoch": 5350} {"train_loss": -26.314197540283203, "global_step": 444056, "epoch": 5350} {"train_loss": -26.871850967407227, "global_step": 444057, "epoch": 5350} {"train_loss": -27.20013427734375, "global_step": 444058, "epoch": 5350} {"train_loss": -26.896406173706055, "global_step": 444059, "epoch": 5350} {"train_loss": -27.089868545532227, "global_step": 444060, "epoch": 5350} {"train_loss": -27.02652931213379, "global_step": 444061, "epoch": 5350} {"train_loss": -26.83851432800293, "global_step": 444062, "epoch": 5350} {"train_loss": -27.071069717407227, "global_step": 444063, "epoch": 5350} {"train_loss": -26.998144149780273, "global_step": 444064, "epoch": 5350} {"train_loss": -27.05592155456543, "global_step": 444065, "epoch": 5350} {"train_loss": -27.1832332611084, "global_step": 444066, "epoch": 5350} {"train_loss": -26.812103271484375, "global_step": 444067, "epoch": 5350} {"train_loss": -26.838293075561523, "global_step": 444068, "epoch": 5350} {"train_loss": -26.941089630126953, "global_step": 444069, "epoch": 5350} {"train_loss": -26.944461822509766, "global_step": 444070, "epoch": 5350} {"train_loss": -26.854928970336914, "global_step": 444071, "epoch": 5350} {"train_loss": -26.670026779174805, "global_step": 444072, "epoch": 5350} {"train_loss": -26.908802032470703, "global_step": 444073, "epoch": 5350} {"train_loss": -27.31092643737793, "global_step": 444074, "epoch": 5350} {"train_loss": -27.06499671936035, "global_step": 444075, "epoch": 5350} {"train_loss": -26.809133529663086, "global_step": 444076, "epoch": 5350} {"train_loss": -27.1246395111084, "global_step": 444077, "epoch": 5350} {"train_loss": -27.073638916015625, "global_step": 444078, "epoch": 5350} {"train_loss": -26.990461349487305, "global_step": 444079, "epoch": 5350} {"train_loss": -26.73589515686035, "global_step": 444080, "epoch": 5350} {"train_loss": -27.268651962280273, "global_step": 444081, "epoch": 5350} {"train_loss": -26.9746150970459, "global_step": 444082, "epoch": 5350} {"train_loss": -27.15115737915039, "global_step": 444083, "epoch": 5350} {"train_loss": -27.07794189453125, "global_step": 444084, "epoch": 5350} {"train_loss": -27.289657592773438, "global_step": 444085, "epoch": 5350} {"train_loss": -26.73927116394043, "global_step": 444086, "epoch": 5350} {"train_loss": -26.995691299438477, "global_step": 444087, "epoch": 5350} {"train_loss": -26.910388946533203, "global_step": 444088, "epoch": 5350} {"train_loss": -27.29561424255371, "global_step": 444089, "epoch": 5350} {"train_loss": -27.1634464263916, "global_step": 444090, "epoch": 5350} {"train_loss": -27.376739501953125, "global_step": 444091, "epoch": 5350} {"train_loss": -27.019147872924805, "global_step": 444092, "epoch": 5350} {"train_loss": -27.046899795532227, "global_step": 444093, "epoch": 5350} {"train_loss": -26.92494773864746, "global_step": 444094, "epoch": 5350} {"train_loss": -27.064029693603516, "global_step": 444095, "epoch": 5350} {"train_loss": -27.008153915405273, "global_step": 444096, "epoch": 5350} {"train_loss": -26.937915802001953, "global_step": 444097, "epoch": 5350} {"train_loss": -27.036901473999023, "global_step": 444098, "epoch": 5350} {"train_loss": -27.146894454956055, "global_step": 444099, "epoch": 5350} {"train_loss": -27.1502742767334, "global_step": 444100, "epoch": 5350} {"train_loss": -26.817890167236328, "global_step": 444101, "epoch": 5350} {"train_loss": -26.81060218811035, "global_step": 444102, "epoch": 5350} {"train_loss": -26.731550216674805, "global_step": 444103, "epoch": 5350} {"train_loss": -26.740467071533203, "global_step": 444104, "epoch": 5350} {"train_loss": -26.978179931640625, "global_step": 444105, "epoch": 5350} {"train_loss": -26.862165451049805, "global_step": 444106, "epoch": 5350} {"train_loss": -27.1358699798584, "global_step": 444107, "epoch": 5350} {"train_loss": -26.539264678955078, "global_step": 444108, "epoch": 5350} {"train_loss": -26.87379264831543, "global_step": 444109, "epoch": 5350} {"train_loss": -26.959192276000977, "global_step": 444110, "epoch": 5350} {"train_loss": -26.9267635345459, "global_step": 444111, "epoch": 5350} {"train_loss": -27.015796661376953, "global_step": 444112, "epoch": 5350} {"train_loss": -26.923330307006836, "global_step": 444113, "epoch": 5350} {"train_loss": -27.02972984313965, "global_step": 444114, "epoch": 5350} {"train_loss": -27.05840492248535, "global_step": 444115, "epoch": 5350} {"train_loss": -26.684789657592773, "global_step": 444116, "epoch": 5350} {"train_loss": -26.946048736572266, "global_step": 444117, "epoch": 5350} {"train_loss": -27.289709091186523, "global_step": 444118, "epoch": 5350} {"train_loss": -26.860992431640625, "global_step": 444119, "epoch": 5350} {"train_loss": -26.653783798217773, "global_step": 444120, "epoch": 5350} {"train_loss": -27.277379989624023, "global_step": 444121, "epoch": 5350} {"train_loss": -26.49118423461914, "global_step": 444122, "epoch": 5350} {"train_loss": -26.900014877319336, "global_step": 444123, "epoch": 5350} {"train_loss": -26.635984420776367, "global_step": 444124, "epoch": 5350} {"train_loss": -26.671323776245117, "global_step": 444125, "epoch": 5350} {"train_loss": -26.81147575378418, "global_step": 444126, "epoch": 5350} {"train_loss": -27.1606502532959, "global_step": 444127, "epoch": 5350} {"train_loss": -26.753219604492188, "global_step": 444128, "epoch": 5350} {"train_loss": -27.129663467407227, "global_step": 444129, "epoch": 5350} {"train_loss": -27.17287254333496, "global_step": 444130, "epoch": 5350} {"train_loss": -26.69136619567871, "global_step": 444131, "epoch": 5350} {"train_loss": -26.93979773463973, "global_step": 444132, "epoch": 5350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6692311.0} {"train_loss": -26.97271156311035, "global_step": 444133, "epoch": 5351} {"train_loss": -26.368579864501953, "global_step": 444134, "epoch": 5351} {"train_loss": -26.604522705078125, "global_step": 444135, "epoch": 5351} {"train_loss": -26.89716148376465, "global_step": 444136, "epoch": 5351} {"train_loss": -26.187793731689453, "global_step": 444137, "epoch": 5351} {"train_loss": -26.466489791870117, "global_step": 444138, "epoch": 5351} {"train_loss": -26.691059112548828, "global_step": 444139, "epoch": 5351} {"train_loss": -26.586355209350586, "global_step": 444140, "epoch": 5351} {"train_loss": -26.56510353088379, "global_step": 444141, "epoch": 5351} {"train_loss": -26.625024795532227, "global_step": 444142, "epoch": 5351} {"train_loss": -26.531518936157227, "global_step": 444143, "epoch": 5351} {"train_loss": -26.462900161743164, "global_step": 444144, "epoch": 5351} {"train_loss": -26.705219268798828, "global_step": 444145, "epoch": 5351} {"train_loss": -26.37871742248535, "global_step": 444146, "epoch": 5351} {"train_loss": -27.053861618041992, "global_step": 444147, "epoch": 5351} {"train_loss": -26.260648727416992, "global_step": 444148, "epoch": 5351} {"train_loss": -26.90980339050293, "global_step": 444149, "epoch": 5351} {"train_loss": -26.822412490844727, "global_step": 444150, "epoch": 5351} {"train_loss": -26.764196395874023, "global_step": 444151, "epoch": 5351} {"train_loss": -26.978778839111328, "global_step": 444152, "epoch": 5351} {"train_loss": -27.06463623046875, "global_step": 444153, "epoch": 5351} {"train_loss": -26.857818603515625, "global_step": 444154, "epoch": 5351} {"train_loss": -27.06195068359375, "global_step": 444155, "epoch": 5351} {"train_loss": -27.205230712890625, "global_step": 444156, "epoch": 5351} {"train_loss": -26.984643936157227, "global_step": 444157, "epoch": 5351} {"train_loss": -26.737537384033203, "global_step": 444158, "epoch": 5351} {"train_loss": -26.502561569213867, "global_step": 444159, "epoch": 5351} {"train_loss": -27.166040420532227, "global_step": 444160, "epoch": 5351} {"train_loss": -27.135089874267578, "global_step": 444161, "epoch": 5351} {"train_loss": -26.947925567626953, "global_step": 444162, "epoch": 5351} {"train_loss": -26.95330238342285, "global_step": 444163, "epoch": 5351} {"train_loss": -27.420774459838867, "global_step": 444164, "epoch": 5351} {"train_loss": -26.796558380126953, "global_step": 444165, "epoch": 5351} {"train_loss": -27.12196922302246, "global_step": 444166, "epoch": 5351} {"train_loss": -27.1088809967041, "global_step": 444167, "epoch": 5351} {"train_loss": -26.646438598632812, "global_step": 444168, "epoch": 5351} {"train_loss": -26.76405906677246, "global_step": 444169, "epoch": 5351} {"train_loss": -26.976673126220703, "global_step": 444170, "epoch": 5351} {"train_loss": -27.358295440673828, "global_step": 444171, "epoch": 5351} {"train_loss": -27.03358268737793, "global_step": 444172, "epoch": 5351} {"train_loss": -27.330366134643555, "global_step": 444173, "epoch": 5351} {"train_loss": -26.9460391998291, "global_step": 444174, "epoch": 5351} {"train_loss": -27.1321964263916, "global_step": 444175, "epoch": 5351} {"train_loss": -27.213699340820312, "global_step": 444176, "epoch": 5351} {"train_loss": -26.970998764038086, "global_step": 444177, "epoch": 5351} {"train_loss": -27.2148380279541, "global_step": 444178, "epoch": 5351} {"train_loss": -26.967863082885742, "global_step": 444179, "epoch": 5351} {"train_loss": -26.789926528930664, "global_step": 444180, "epoch": 5351} {"train_loss": -27.162832260131836, "global_step": 444181, "epoch": 5351} {"train_loss": -27.195714950561523, "global_step": 444182, "epoch": 5351} {"train_loss": -27.097900390625, "global_step": 444183, "epoch": 5351} {"train_loss": -27.31298828125, "global_step": 444184, "epoch": 5351} {"train_loss": -26.848215103149414, "global_step": 444185, "epoch": 5351} {"train_loss": -26.55792808532715, "global_step": 444186, "epoch": 5351} {"train_loss": -27.12421226501465, "global_step": 444187, "epoch": 5351} {"train_loss": -27.169010162353516, "global_step": 444188, "epoch": 5351} {"train_loss": -26.692829132080078, "global_step": 444189, "epoch": 5351} {"train_loss": -26.87531852722168, "global_step": 444190, "epoch": 5351} {"train_loss": -27.024694442749023, "global_step": 444191, "epoch": 5351} {"train_loss": -27.0274715423584, "global_step": 444192, "epoch": 5351} {"train_loss": -27.04084587097168, "global_step": 444193, "epoch": 5351} {"train_loss": -27.013925552368164, "global_step": 444194, "epoch": 5351} {"train_loss": -27.05683708190918, "global_step": 444195, "epoch": 5351} {"train_loss": -26.81353187561035, "global_step": 444196, "epoch": 5351} {"train_loss": -26.644317626953125, "global_step": 444197, "epoch": 5351} {"train_loss": -27.131250381469727, "global_step": 444198, "epoch": 5351} {"train_loss": -27.0200138092041, "global_step": 444199, "epoch": 5351} {"train_loss": -27.497129440307617, "global_step": 444200, "epoch": 5351} {"train_loss": -27.183629989624023, "global_step": 444201, "epoch": 5351} {"train_loss": -27.0792236328125, "global_step": 444202, "epoch": 5351} {"train_loss": -26.708539962768555, "global_step": 444203, "epoch": 5351} {"train_loss": -27.284717559814453, "global_step": 444204, "epoch": 5351} {"train_loss": -27.05019187927246, "global_step": 444205, "epoch": 5351} {"train_loss": -26.69093132019043, "global_step": 444206, "epoch": 5351} {"train_loss": -27.230426788330078, "global_step": 444207, "epoch": 5351} {"train_loss": -26.8671817779541, "global_step": 444208, "epoch": 5351} {"train_loss": -27.160993576049805, "global_step": 444209, "epoch": 5351} {"train_loss": -27.343374252319336, "global_step": 444210, "epoch": 5351} {"train_loss": -26.98182487487793, "global_step": 444211, "epoch": 5351} {"train_loss": -26.856962203979492, "global_step": 444212, "epoch": 5351} {"train_loss": -27.48410987854004, "global_step": 444213, "epoch": 5351} {"train_loss": -26.880319595336914, "global_step": 444214, "epoch": 5351} {"train_loss": -26.926514338298016, "global_step": 444215, "epoch": 5351, "val_loss": 6488930.0} {"train_loss": -26.0401611328125, "global_step": 444216, "epoch": 5352} {"train_loss": -25.74518394470215, "global_step": 444217, "epoch": 5352} {"train_loss": -26.287139892578125, "global_step": 444218, "epoch": 5352} {"train_loss": -26.2948055267334, "global_step": 444219, "epoch": 5352} {"train_loss": -25.911880493164062, "global_step": 444220, "epoch": 5352} {"train_loss": -25.974506378173828, "global_step": 444221, "epoch": 5352} {"train_loss": -25.853052139282227, "global_step": 444222, "epoch": 5352} {"train_loss": -26.219934463500977, "global_step": 444223, "epoch": 5352} {"train_loss": -25.867889404296875, "global_step": 444224, "epoch": 5352} {"train_loss": -26.333850860595703, "global_step": 444225, "epoch": 5352} {"train_loss": -26.20639991760254, "global_step": 444226, "epoch": 5352} {"train_loss": -26.694875717163086, "global_step": 444227, "epoch": 5352} {"train_loss": -26.437814712524414, "global_step": 444228, "epoch": 5352} {"train_loss": -26.429798126220703, "global_step": 444229, "epoch": 5352} {"train_loss": -26.05572509765625, "global_step": 444230, "epoch": 5352} {"train_loss": -25.888935089111328, "global_step": 444231, "epoch": 5352} {"train_loss": -26.25421714782715, "global_step": 444232, "epoch": 5352} {"train_loss": -26.320707321166992, "global_step": 444233, "epoch": 5352} {"train_loss": -26.430627822875977, "global_step": 444234, "epoch": 5352} {"train_loss": -26.499792098999023, "global_step": 444235, "epoch": 5352} {"train_loss": -26.269439697265625, "global_step": 444236, "epoch": 5352} {"train_loss": -26.602392196655273, "global_step": 444237, "epoch": 5352} {"train_loss": -26.251728057861328, "global_step": 444238, "epoch": 5352} {"train_loss": -26.629623413085938, "global_step": 444239, "epoch": 5352} {"train_loss": -26.175291061401367, "global_step": 444240, "epoch": 5352} {"train_loss": -26.32454490661621, "global_step": 444241, "epoch": 5352} {"train_loss": -27.151931762695312, "global_step": 444242, "epoch": 5352} {"train_loss": -26.669696807861328, "global_step": 444243, "epoch": 5352} {"train_loss": -26.563861846923828, "global_step": 444244, "epoch": 5352} {"train_loss": -26.63213539123535, "global_step": 444245, "epoch": 5352} {"train_loss": -26.38282585144043, "global_step": 444246, "epoch": 5352} {"train_loss": -26.60260581970215, "global_step": 444247, "epoch": 5352} {"train_loss": -27.05506706237793, "global_step": 444248, "epoch": 5352} {"train_loss": -26.7115478515625, "global_step": 444249, "epoch": 5352} {"train_loss": -26.510330200195312, "global_step": 444250, "epoch": 5352} {"train_loss": -26.800434112548828, "global_step": 444251, "epoch": 5352} {"train_loss": -26.722745895385742, "global_step": 444252, "epoch": 5352} {"train_loss": -26.957929611206055, "global_step": 444253, "epoch": 5352} {"train_loss": -26.655780792236328, "global_step": 444254, "epoch": 5352} {"train_loss": -26.705249786376953, "global_step": 444255, "epoch": 5352} {"train_loss": -27.1452693939209, "global_step": 444256, "epoch": 5352} {"train_loss": -26.979536056518555, "global_step": 444257, "epoch": 5352} {"train_loss": -26.762372970581055, "global_step": 444258, "epoch": 5352} {"train_loss": -27.18585205078125, "global_step": 444259, "epoch": 5352} {"train_loss": -27.02583122253418, "global_step": 444260, "epoch": 5352} {"train_loss": -27.297637939453125, "global_step": 444261, "epoch": 5352} {"train_loss": -26.817310333251953, "global_step": 444262, "epoch": 5352} {"train_loss": -27.145166397094727, "global_step": 444263, "epoch": 5352} {"train_loss": -26.896194458007812, "global_step": 444264, "epoch": 5352} {"train_loss": -27.541473388671875, "global_step": 444265, "epoch": 5352} {"train_loss": -26.96656608581543, "global_step": 444266, "epoch": 5352} {"train_loss": -26.659015655517578, "global_step": 444267, "epoch": 5352} {"train_loss": -26.973844528198242, "global_step": 444268, "epoch": 5352} {"train_loss": -27.171003341674805, "global_step": 444269, "epoch": 5352} {"train_loss": -27.00165367126465, "global_step": 444270, "epoch": 5352} {"train_loss": -26.8133487701416, "global_step": 444271, "epoch": 5352} {"train_loss": -27.165149688720703, "global_step": 444272, "epoch": 5352} {"train_loss": -27.48388671875, "global_step": 444273, "epoch": 5352} {"train_loss": -26.927520751953125, "global_step": 444274, "epoch": 5352} {"train_loss": -26.872220993041992, "global_step": 444275, "epoch": 5352} {"train_loss": -26.827444076538086, "global_step": 444276, "epoch": 5352} {"train_loss": -27.111902236938477, "global_step": 444277, "epoch": 5352} {"train_loss": -27.139307022094727, "global_step": 444278, "epoch": 5352} {"train_loss": -27.1418514251709, "global_step": 444279, "epoch": 5352} {"train_loss": -26.812732696533203, "global_step": 444280, "epoch": 5352} {"train_loss": -27.11334800720215, "global_step": 444281, "epoch": 5352} {"train_loss": -26.812976837158203, "global_step": 444282, "epoch": 5352} {"train_loss": -27.14942741394043, "global_step": 444283, "epoch": 5352} {"train_loss": -27.02839469909668, "global_step": 444284, "epoch": 5352} {"train_loss": -26.847578048706055, "global_step": 444285, "epoch": 5352} {"train_loss": -27.053701400756836, "global_step": 444286, "epoch": 5352} {"train_loss": -27.339963912963867, "global_step": 444287, "epoch": 5352} {"train_loss": -27.055845260620117, "global_step": 444288, "epoch": 5352} {"train_loss": -27.39800453186035, "global_step": 444289, "epoch": 5352} {"train_loss": -27.172754287719727, "global_step": 444290, "epoch": 5352} {"train_loss": -27.259611129760742, "global_step": 444291, "epoch": 5352} {"train_loss": -26.692066192626953, "global_step": 444292, "epoch": 5352} {"train_loss": -27.247068405151367, "global_step": 444293, "epoch": 5352} {"train_loss": -27.171314239501953, "global_step": 444294, "epoch": 5352} {"train_loss": -26.92011070251465, "global_step": 444295, "epoch": 5352} {"train_loss": -26.835729598999023, "global_step": 444296, "epoch": 5352} {"train_loss": -27.091278076171875, "global_step": 444297, "epoch": 5352} {"train_loss": -26.737773941223878, "global_step": 444298, "epoch": 5352, "val_loss": 6679579.0} {"train_loss": -26.698633193969727, "global_step": 444299, "epoch": 5353} {"train_loss": -26.64301109313965, "global_step": 444300, "epoch": 5353} {"train_loss": -26.64935874938965, "global_step": 444301, "epoch": 5353} {"train_loss": -27.077695846557617, "global_step": 444302, "epoch": 5353} {"train_loss": -26.58184814453125, "global_step": 444303, "epoch": 5353} {"train_loss": -27.166278839111328, "global_step": 444304, "epoch": 5353} {"train_loss": -26.580820083618164, "global_step": 444305, "epoch": 5353} {"train_loss": -26.86524772644043, "global_step": 444306, "epoch": 5353} {"train_loss": -27.04302978515625, "global_step": 444307, "epoch": 5353} {"train_loss": -26.735015869140625, "global_step": 444308, "epoch": 5353} {"train_loss": -26.935754776000977, "global_step": 444309, "epoch": 5353} {"train_loss": -26.9509334564209, "global_step": 444310, "epoch": 5353} {"train_loss": -27.098651885986328, "global_step": 444311, "epoch": 5353} {"train_loss": -27.138782501220703, "global_step": 444312, "epoch": 5353} {"train_loss": -27.125675201416016, "global_step": 444313, "epoch": 5353} {"train_loss": -26.740131378173828, "global_step": 444314, "epoch": 5353} {"train_loss": -27.191999435424805, "global_step": 444315, "epoch": 5353} {"train_loss": -27.283573150634766, "global_step": 444316, "epoch": 5353} {"train_loss": -27.039569854736328, "global_step": 444317, "epoch": 5353} {"train_loss": -27.207229614257812, "global_step": 444318, "epoch": 5353} {"train_loss": -27.027389526367188, "global_step": 444319, "epoch": 5353} {"train_loss": -27.191436767578125, "global_step": 444320, "epoch": 5353} {"train_loss": -27.27321434020996, "global_step": 444321, "epoch": 5353} {"train_loss": -27.098569869995117, "global_step": 444322, "epoch": 5353} {"train_loss": -26.91010856628418, "global_step": 444323, "epoch": 5353} {"train_loss": -26.9887752532959, "global_step": 444324, "epoch": 5353} {"train_loss": -27.07720947265625, "global_step": 444325, "epoch": 5353} {"train_loss": -26.939722061157227, "global_step": 444326, "epoch": 5353} {"train_loss": -27.312414169311523, "global_step": 444327, "epoch": 5353} {"train_loss": -27.141265869140625, "global_step": 444328, "epoch": 5353} {"train_loss": -27.229217529296875, "global_step": 444329, "epoch": 5353} {"train_loss": -27.15606689453125, "global_step": 444330, "epoch": 5353} {"train_loss": -27.311111450195312, "global_step": 444331, "epoch": 5353} {"train_loss": -26.671283721923828, "global_step": 444332, "epoch": 5353} {"train_loss": -27.073659896850586, "global_step": 444333, "epoch": 5353} {"train_loss": -26.944732666015625, "global_step": 444334, "epoch": 5353} {"train_loss": -27.085906982421875, "global_step": 444335, "epoch": 5353} {"train_loss": -27.229171752929688, "global_step": 444336, "epoch": 5353} {"train_loss": -27.241201400756836, "global_step": 444337, "epoch": 5353} {"train_loss": -26.6871280670166, "global_step": 444338, "epoch": 5353} {"train_loss": -27.39963722229004, "global_step": 444339, "epoch": 5353} {"train_loss": -26.507734298706055, "global_step": 444340, "epoch": 5353} {"train_loss": -26.692861557006836, "global_step": 444341, "epoch": 5353} {"train_loss": -26.718143463134766, "global_step": 444342, "epoch": 5353} {"train_loss": -26.345869064331055, "global_step": 444343, "epoch": 5353} {"train_loss": -26.977750778198242, "global_step": 444344, "epoch": 5353} {"train_loss": -26.591644287109375, "global_step": 444345, "epoch": 5353} {"train_loss": -26.788421630859375, "global_step": 444346, "epoch": 5353} {"train_loss": -26.691816329956055, "global_step": 444347, "epoch": 5353} {"train_loss": -26.66837501525879, "global_step": 444348, "epoch": 5353} {"train_loss": -26.430866241455078, "global_step": 444349, "epoch": 5353} {"train_loss": -26.17563819885254, "global_step": 444350, "epoch": 5353} {"train_loss": -26.322599411010742, "global_step": 444351, "epoch": 5353} {"train_loss": -26.565580368041992, "global_step": 444352, "epoch": 5353} {"train_loss": -26.431211471557617, "global_step": 444353, "epoch": 5353} {"train_loss": -26.49366569519043, "global_step": 444354, "epoch": 5353} {"train_loss": -26.692541122436523, "global_step": 444355, "epoch": 5353} {"train_loss": -27.167699813842773, "global_step": 444356, "epoch": 5353} {"train_loss": -26.711084365844727, "global_step": 444357, "epoch": 5353} {"train_loss": -26.825403213500977, "global_step": 444358, "epoch": 5353} {"train_loss": -27.112628936767578, "global_step": 444359, "epoch": 5353} {"train_loss": -27.01068115234375, "global_step": 444360, "epoch": 5353} {"train_loss": -27.0602970123291, "global_step": 444361, "epoch": 5353} {"train_loss": -27.026508331298828, "global_step": 444362, "epoch": 5353} {"train_loss": -26.898374557495117, "global_step": 444363, "epoch": 5353} {"train_loss": -27.016193389892578, "global_step": 444364, "epoch": 5353} {"train_loss": -26.798049926757812, "global_step": 444365, "epoch": 5353} {"train_loss": -27.08430290222168, "global_step": 444366, "epoch": 5353} {"train_loss": -26.73370933532715, "global_step": 444367, "epoch": 5353} {"train_loss": -26.960052490234375, "global_step": 444368, "epoch": 5353} {"train_loss": -27.317386627197266, "global_step": 444369, "epoch": 5353} {"train_loss": -26.85120964050293, "global_step": 444370, "epoch": 5353} {"train_loss": -26.93779945373535, "global_step": 444371, "epoch": 5353} {"train_loss": -27.34187889099121, "global_step": 444372, "epoch": 5353} {"train_loss": -27.257095336914062, "global_step": 444373, "epoch": 5353} {"train_loss": -27.16065788269043, "global_step": 444374, "epoch": 5353} {"train_loss": -27.10175895690918, "global_step": 444375, "epoch": 5353} {"train_loss": -27.04646873474121, "global_step": 444376, "epoch": 5353} {"train_loss": -26.984289169311523, "global_step": 444377, "epoch": 5353} {"train_loss": -27.52009391784668, "global_step": 444378, "epoch": 5353} {"train_loss": -26.665700912475586, "global_step": 444379, "epoch": 5353} {"train_loss": -27.010480880737305, "global_step": 444380, "epoch": 5353} {"train_loss": -26.92708642798734, "global_step": 444381, "epoch": 5353, "val_loss": 6560034.0} {"train_loss": -26.54501724243164, "global_step": 444382, "epoch": 5354} {"train_loss": -25.493846893310547, "global_step": 444383, "epoch": 5354} {"train_loss": -24.93119239807129, "global_step": 444384, "epoch": 5354} {"train_loss": -26.08969497680664, "global_step": 444385, "epoch": 5354} {"train_loss": -25.949689865112305, "global_step": 444386, "epoch": 5354} {"train_loss": -24.62950325012207, "global_step": 444387, "epoch": 5354} {"train_loss": -26.518035888671875, "global_step": 444388, "epoch": 5354} {"train_loss": -26.43796157836914, "global_step": 444389, "epoch": 5354} {"train_loss": -26.778064727783203, "global_step": 444390, "epoch": 5354} {"train_loss": -26.526636123657227, "global_step": 444391, "epoch": 5354} {"train_loss": -26.33721351623535, "global_step": 444392, "epoch": 5354} {"train_loss": -26.717939376831055, "global_step": 444393, "epoch": 5354} {"train_loss": -25.87686538696289, "global_step": 444394, "epoch": 5354} {"train_loss": -26.4852352142334, "global_step": 444395, "epoch": 5354} {"train_loss": -26.56226921081543, "global_step": 444396, "epoch": 5354} {"train_loss": -26.8200740814209, "global_step": 444397, "epoch": 5354} {"train_loss": -26.878463745117188, "global_step": 444398, "epoch": 5354} {"train_loss": -26.7006893157959, "global_step": 444399, "epoch": 5354} {"train_loss": -27.002161026000977, "global_step": 444400, "epoch": 5354} {"train_loss": -26.758825302124023, "global_step": 444401, "epoch": 5354} {"train_loss": -26.74362564086914, "global_step": 444402, "epoch": 5354} {"train_loss": -26.59840202331543, "global_step": 444403, "epoch": 5354} {"train_loss": -26.71254539489746, "global_step": 444404, "epoch": 5354} {"train_loss": -26.942508697509766, "global_step": 444405, "epoch": 5354} {"train_loss": -26.854541778564453, "global_step": 444406, "epoch": 5354} {"train_loss": -26.933490753173828, "global_step": 444407, "epoch": 5354} {"train_loss": -26.727466583251953, "global_step": 444408, "epoch": 5354} {"train_loss": -27.21731948852539, "global_step": 444409, "epoch": 5354} {"train_loss": -26.536550521850586, "global_step": 444410, "epoch": 5354} {"train_loss": -26.810501098632812, "global_step": 444411, "epoch": 5354} {"train_loss": -26.750059127807617, "global_step": 444412, "epoch": 5354} {"train_loss": -27.293935775756836, "global_step": 444413, "epoch": 5354} {"train_loss": -26.78995704650879, "global_step": 444414, "epoch": 5354} {"train_loss": -26.968387603759766, "global_step": 444415, "epoch": 5354} {"train_loss": -27.085800170898438, "global_step": 444416, "epoch": 5354} {"train_loss": -27.125226974487305, "global_step": 444417, "epoch": 5354} {"train_loss": -26.332977294921875, "global_step": 444418, "epoch": 5354} {"train_loss": -26.56074333190918, "global_step": 444419, "epoch": 5354} {"train_loss": -27.06898307800293, "global_step": 444420, "epoch": 5354} {"train_loss": -26.919204711914062, "global_step": 444421, "epoch": 5354} {"train_loss": -26.24839210510254, "global_step": 444422, "epoch": 5354} {"train_loss": -26.788761138916016, "global_step": 444423, "epoch": 5354} {"train_loss": -26.8564395904541, "global_step": 444424, "epoch": 5354} {"train_loss": -26.727880477905273, "global_step": 444425, "epoch": 5354} {"train_loss": -26.71807861328125, "global_step": 444426, "epoch": 5354} {"train_loss": -27.1632022857666, "global_step": 444427, "epoch": 5354} {"train_loss": -26.993661880493164, "global_step": 444428, "epoch": 5354} {"train_loss": -27.02082633972168, "global_step": 444429, "epoch": 5354} {"train_loss": -26.875171661376953, "global_step": 444430, "epoch": 5354} {"train_loss": -26.696582794189453, "global_step": 444431, "epoch": 5354} {"train_loss": -27.143936157226562, "global_step": 444432, "epoch": 5354} {"train_loss": -26.947509765625, "global_step": 444433, "epoch": 5354} {"train_loss": -27.007413864135742, "global_step": 444434, "epoch": 5354} {"train_loss": -26.784101486206055, "global_step": 444435, "epoch": 5354} {"train_loss": -27.28759765625, "global_step": 444436, "epoch": 5354} {"train_loss": -27.171817779541016, "global_step": 444437, "epoch": 5354} {"train_loss": -27.1014404296875, "global_step": 444438, "epoch": 5354} {"train_loss": -26.6291561126709, "global_step": 444439, "epoch": 5354} {"train_loss": -27.271482467651367, "global_step": 444440, "epoch": 5354} {"train_loss": -26.966205596923828, "global_step": 444441, "epoch": 5354} {"train_loss": -26.985538482666016, "global_step": 444442, "epoch": 5354} {"train_loss": -26.923791885375977, "global_step": 444443, "epoch": 5354} {"train_loss": -26.89240074157715, "global_step": 444444, "epoch": 5354} {"train_loss": -27.34388542175293, "global_step": 444445, "epoch": 5354} {"train_loss": -26.69307518005371, "global_step": 444446, "epoch": 5354} {"train_loss": -26.747045516967773, "global_step": 444447, "epoch": 5354} {"train_loss": -27.324188232421875, "global_step": 444448, "epoch": 5354} {"train_loss": -26.89715576171875, "global_step": 444449, "epoch": 5354} {"train_loss": -26.60603141784668, "global_step": 444450, "epoch": 5354} {"train_loss": -26.86553382873535, "global_step": 444451, "epoch": 5354} {"train_loss": -26.78508949279785, "global_step": 444452, "epoch": 5354} {"train_loss": -26.595365524291992, "global_step": 444453, "epoch": 5354} {"train_loss": -26.9390811920166, "global_step": 444454, "epoch": 5354} {"train_loss": -26.762847900390625, "global_step": 444455, "epoch": 5354} {"train_loss": -26.83538818359375, "global_step": 444456, "epoch": 5354} {"train_loss": -26.68246841430664, "global_step": 444457, "epoch": 5354} {"train_loss": -27.069990158081055, "global_step": 444458, "epoch": 5354} {"train_loss": -27.177770614624023, "global_step": 444459, "epoch": 5354} {"train_loss": -26.8657169342041, "global_step": 444460, "epoch": 5354} {"train_loss": -27.060293197631836, "global_step": 444461, "epoch": 5354} {"train_loss": -27.004587173461914, "global_step": 444462, "epoch": 5354} {"train_loss": -27.337066650390625, "global_step": 444463, "epoch": 5354} {"train_loss": -26.761044513748352, "global_step": 444464, "epoch": 5354, "val_loss": 6622759.5} {"train_loss": -26.574432373046875, "global_step": 444465, "epoch": 5355} {"train_loss": -26.824609756469727, "global_step": 444466, "epoch": 5355} {"train_loss": -26.882261276245117, "global_step": 444467, "epoch": 5355} {"train_loss": -26.37471580505371, "global_step": 444468, "epoch": 5355} {"train_loss": -26.1673526763916, "global_step": 444469, "epoch": 5355} {"train_loss": -26.561429977416992, "global_step": 444470, "epoch": 5355} {"train_loss": -26.64054298400879, "global_step": 444471, "epoch": 5355} {"train_loss": -26.042165756225586, "global_step": 444472, "epoch": 5355} {"train_loss": -26.719213485717773, "global_step": 444473, "epoch": 5355} {"train_loss": -27.14809226989746, "global_step": 444474, "epoch": 5355} {"train_loss": -27.01458740234375, "global_step": 444475, "epoch": 5355} {"train_loss": -27.114856719970703, "global_step": 444476, "epoch": 5355} {"train_loss": -26.9277286529541, "global_step": 444477, "epoch": 5355} {"train_loss": -26.460336685180664, "global_step": 444478, "epoch": 5355} {"train_loss": -26.839481353759766, "global_step": 444479, "epoch": 5355} {"train_loss": -26.944177627563477, "global_step": 444480, "epoch": 5355} {"train_loss": -26.77605628967285, "global_step": 444481, "epoch": 5355} {"train_loss": -26.74954605102539, "global_step": 444482, "epoch": 5355} {"train_loss": -27.010162353515625, "global_step": 444483, "epoch": 5355} {"train_loss": -27.308454513549805, "global_step": 444484, "epoch": 5355} {"train_loss": -27.07391929626465, "global_step": 444485, "epoch": 5355} {"train_loss": -27.117462158203125, "global_step": 444486, "epoch": 5355} {"train_loss": -27.150440216064453, "global_step": 444487, "epoch": 5355} {"train_loss": -26.649335861206055, "global_step": 444488, "epoch": 5355} {"train_loss": -27.00726890563965, "global_step": 444489, "epoch": 5355} {"train_loss": -27.068044662475586, "global_step": 444490, "epoch": 5355} {"train_loss": -26.81777000427246, "global_step": 444491, "epoch": 5355} {"train_loss": -26.949995040893555, "global_step": 444492, "epoch": 5355} {"train_loss": -27.209766387939453, "global_step": 444493, "epoch": 5355} {"train_loss": -26.98017692565918, "global_step": 444494, "epoch": 5355} {"train_loss": -27.031530380249023, "global_step": 444495, "epoch": 5355} {"train_loss": -26.756439208984375, "global_step": 444496, "epoch": 5355} {"train_loss": -27.045063018798828, "global_step": 444497, "epoch": 5355} {"train_loss": -26.83225440979004, "global_step": 444498, "epoch": 5355} {"train_loss": -26.970218658447266, "global_step": 444499, "epoch": 5355} {"train_loss": -27.140188217163086, "global_step": 444500, "epoch": 5355} {"train_loss": -27.088430404663086, "global_step": 444501, "epoch": 5355} {"train_loss": -26.723188400268555, "global_step": 444502, "epoch": 5355} {"train_loss": -26.9867000579834, "global_step": 444503, "epoch": 5355} {"train_loss": -26.718412399291992, "global_step": 444504, "epoch": 5355} {"train_loss": -26.7239990234375, "global_step": 444505, "epoch": 5355} {"train_loss": -27.1737003326416, "global_step": 444506, "epoch": 5355} {"train_loss": -26.664966583251953, "global_step": 444507, "epoch": 5355} {"train_loss": -26.72511100769043, "global_step": 444508, "epoch": 5355} {"train_loss": -26.86590576171875, "global_step": 444509, "epoch": 5355} {"train_loss": -26.984235763549805, "global_step": 444510, "epoch": 5355} {"train_loss": -26.982803344726562, "global_step": 444511, "epoch": 5355} {"train_loss": -26.791065216064453, "global_step": 444512, "epoch": 5355} {"train_loss": -27.000600814819336, "global_step": 444513, "epoch": 5355} {"train_loss": -27.43897819519043, "global_step": 444514, "epoch": 5355} {"train_loss": -26.61066246032715, "global_step": 444515, "epoch": 5355} {"train_loss": -26.695234298706055, "global_step": 444516, "epoch": 5355} {"train_loss": -26.963056564331055, "global_step": 444517, "epoch": 5355} {"train_loss": -26.90357780456543, "global_step": 444518, "epoch": 5355} {"train_loss": -27.08294105529785, "global_step": 444519, "epoch": 5355} {"train_loss": -27.135961532592773, "global_step": 444520, "epoch": 5355} {"train_loss": -26.95136070251465, "global_step": 444521, "epoch": 5355} {"train_loss": -26.886154174804688, "global_step": 444522, "epoch": 5355} {"train_loss": -27.44063377380371, "global_step": 444523, "epoch": 5355} {"train_loss": -26.9177188873291, "global_step": 444524, "epoch": 5355} {"train_loss": -26.84381103515625, "global_step": 444525, "epoch": 5355} {"train_loss": -26.938451766967773, "global_step": 444526, "epoch": 5355} {"train_loss": -26.8123836517334, "global_step": 444527, "epoch": 5355} {"train_loss": -27.145374298095703, "global_step": 444528, "epoch": 5355} {"train_loss": -26.988000869750977, "global_step": 444529, "epoch": 5355} {"train_loss": -26.94671630859375, "global_step": 444530, "epoch": 5355} {"train_loss": -26.690032958984375, "global_step": 444531, "epoch": 5355} {"train_loss": -26.779956817626953, "global_step": 444532, "epoch": 5355} {"train_loss": -26.958343505859375, "global_step": 444533, "epoch": 5355} {"train_loss": -27.193445205688477, "global_step": 444534, "epoch": 5355} {"train_loss": -26.785892486572266, "global_step": 444535, "epoch": 5355} {"train_loss": -27.21400260925293, "global_step": 444536, "epoch": 5355} {"train_loss": -27.176319122314453, "global_step": 444537, "epoch": 5355} {"train_loss": -27.221603393554688, "global_step": 444538, "epoch": 5355} {"train_loss": -27.10154151916504, "global_step": 444539, "epoch": 5355} {"train_loss": -27.02267837524414, "global_step": 444540, "epoch": 5355} {"train_loss": -26.921112060546875, "global_step": 444541, "epoch": 5355} {"train_loss": -27.275983810424805, "global_step": 444542, "epoch": 5355} {"train_loss": -26.84078025817871, "global_step": 444543, "epoch": 5355} {"train_loss": -27.20952796936035, "global_step": 444544, "epoch": 5355} {"train_loss": -26.916244506835938, "global_step": 444545, "epoch": 5355} {"train_loss": -27.236082077026367, "global_step": 444546, "epoch": 5355} {"train_loss": -26.937889673623694, "global_step": 444547, "epoch": 5355, "val_loss": 6624139.0} {"train_loss": -26.839832305908203, "global_step": 444548, "epoch": 5356} {"train_loss": -26.10007667541504, "global_step": 444549, "epoch": 5356} {"train_loss": -26.574970245361328, "global_step": 444550, "epoch": 5356} {"train_loss": -26.219120025634766, "global_step": 444551, "epoch": 5356} {"train_loss": -25.82950782775879, "global_step": 444552, "epoch": 5356} {"train_loss": -26.033857345581055, "global_step": 444553, "epoch": 5356} {"train_loss": -26.493972778320312, "global_step": 444554, "epoch": 5356} {"train_loss": -26.511932373046875, "global_step": 444555, "epoch": 5356} {"train_loss": -26.01143455505371, "global_step": 444556, "epoch": 5356} {"train_loss": -26.2827205657959, "global_step": 444557, "epoch": 5356} {"train_loss": -26.064855575561523, "global_step": 444558, "epoch": 5356} {"train_loss": -26.34309959411621, "global_step": 444559, "epoch": 5356} {"train_loss": -26.284204483032227, "global_step": 444560, "epoch": 5356} {"train_loss": -26.686521530151367, "global_step": 444561, "epoch": 5356} {"train_loss": -25.972579956054688, "global_step": 444562, "epoch": 5356} {"train_loss": -26.43010902404785, "global_step": 444563, "epoch": 5356} {"train_loss": -26.10918617248535, "global_step": 444564, "epoch": 5356} {"train_loss": -26.057382583618164, "global_step": 444565, "epoch": 5356} {"train_loss": -26.109973907470703, "global_step": 444566, "epoch": 5356} {"train_loss": -25.93342399597168, "global_step": 444567, "epoch": 5356} {"train_loss": -26.5477237701416, "global_step": 444568, "epoch": 5356} {"train_loss": -26.246145248413086, "global_step": 444569, "epoch": 5356} {"train_loss": -26.31980323791504, "global_step": 444570, "epoch": 5356} {"train_loss": -26.381128311157227, "global_step": 444571, "epoch": 5356} {"train_loss": -26.3983154296875, "global_step": 444572, "epoch": 5356} {"train_loss": -26.59274673461914, "global_step": 444573, "epoch": 5356} {"train_loss": -26.8818359375, "global_step": 444574, "epoch": 5356} {"train_loss": -26.875940322875977, "global_step": 444575, "epoch": 5356} {"train_loss": -26.530853271484375, "global_step": 444576, "epoch": 5356} {"train_loss": -26.5728759765625, "global_step": 444577, "epoch": 5356} {"train_loss": -26.59815788269043, "global_step": 444578, "epoch": 5356} {"train_loss": -26.700214385986328, "global_step": 444579, "epoch": 5356} {"train_loss": -27.2382869720459, "global_step": 444580, "epoch": 5356} {"train_loss": -26.64693260192871, "global_step": 444581, "epoch": 5356} {"train_loss": -27.019195556640625, "global_step": 444582, "epoch": 5356} {"train_loss": -26.64942741394043, "global_step": 444583, "epoch": 5356} {"train_loss": -26.814111709594727, "global_step": 444584, "epoch": 5356} {"train_loss": -26.76983070373535, "global_step": 444585, "epoch": 5356} {"train_loss": -26.814382553100586, "global_step": 444586, "epoch": 5356} {"train_loss": -27.18574333190918, "global_step": 444587, "epoch": 5356} {"train_loss": -26.961713790893555, "global_step": 444588, "epoch": 5356} {"train_loss": -26.820697784423828, "global_step": 444589, "epoch": 5356} {"train_loss": -27.258014678955078, "global_step": 444590, "epoch": 5356} {"train_loss": -26.991718292236328, "global_step": 444591, "epoch": 5356} {"train_loss": -27.044538497924805, "global_step": 444592, "epoch": 5356} {"train_loss": -27.028671264648438, "global_step": 444593, "epoch": 5356} {"train_loss": -27.201505661010742, "global_step": 444594, "epoch": 5356} {"train_loss": -27.455835342407227, "global_step": 444595, "epoch": 5356} {"train_loss": -27.12841796875, "global_step": 444596, "epoch": 5356} {"train_loss": -27.531503677368164, "global_step": 444597, "epoch": 5356} {"train_loss": -27.182947158813477, "global_step": 444598, "epoch": 5356} {"train_loss": -27.3814697265625, "global_step": 444599, "epoch": 5356} {"train_loss": -26.64619255065918, "global_step": 444600, "epoch": 5356} {"train_loss": -26.99567222595215, "global_step": 444601, "epoch": 5356} {"train_loss": -27.234455108642578, "global_step": 444602, "epoch": 5356} {"train_loss": -27.397241592407227, "global_step": 444603, "epoch": 5356} {"train_loss": -27.280996322631836, "global_step": 444604, "epoch": 5356} {"train_loss": -26.863204956054688, "global_step": 444605, "epoch": 5356} {"train_loss": -27.09173583984375, "global_step": 444606, "epoch": 5356} {"train_loss": -27.098936080932617, "global_step": 444607, "epoch": 5356} {"train_loss": -27.115453720092773, "global_step": 444608, "epoch": 5356} {"train_loss": -26.9937744140625, "global_step": 444609, "epoch": 5356} {"train_loss": -27.24798583984375, "global_step": 444610, "epoch": 5356} {"train_loss": -27.114484786987305, "global_step": 444611, "epoch": 5356} {"train_loss": -26.981220245361328, "global_step": 444612, "epoch": 5356} {"train_loss": -27.4965763092041, "global_step": 444613, "epoch": 5356} {"train_loss": -26.56329345703125, "global_step": 444614, "epoch": 5356} {"train_loss": -26.240720748901367, "global_step": 444615, "epoch": 5356} {"train_loss": -26.01974868774414, "global_step": 444616, "epoch": 5356} {"train_loss": -26.219518661499023, "global_step": 444617, "epoch": 5356} {"train_loss": -26.384485244750977, "global_step": 444618, "epoch": 5356} {"train_loss": -26.9654598236084, "global_step": 444619, "epoch": 5356} {"train_loss": -27.045461654663086, "global_step": 444620, "epoch": 5356} {"train_loss": -26.746267318725586, "global_step": 444621, "epoch": 5356} {"train_loss": -27.074548721313477, "global_step": 444622, "epoch": 5356} {"train_loss": -27.3017635345459, "global_step": 444623, "epoch": 5356} {"train_loss": -26.625171661376953, "global_step": 444624, "epoch": 5356} {"train_loss": -27.063034057617188, "global_step": 444625, "epoch": 5356} {"train_loss": -26.980798721313477, "global_step": 444626, "epoch": 5356} {"train_loss": -26.819196701049805, "global_step": 444627, "epoch": 5356} {"train_loss": -26.7558650970459, "global_step": 444628, "epoch": 5356} {"train_loss": -27.053613662719727, "global_step": 444629, "epoch": 5356} {"train_loss": -26.73678954250841, "global_step": 444630, "epoch": 5356, "val_loss": 6723300.0} {"train_loss": -25.282777786254883, "global_step": 444631, "epoch": 5357} {"train_loss": -26.15614128112793, "global_step": 444632, "epoch": 5357} {"train_loss": -25.81770896911621, "global_step": 444633, "epoch": 5357} {"train_loss": -26.552091598510742, "global_step": 444634, "epoch": 5357} {"train_loss": -26.388410568237305, "global_step": 444635, "epoch": 5357} {"train_loss": -26.222675323486328, "global_step": 444636, "epoch": 5357} {"train_loss": -26.865467071533203, "global_step": 444637, "epoch": 5357} {"train_loss": -26.419574737548828, "global_step": 444638, "epoch": 5357} {"train_loss": -26.507984161376953, "global_step": 444639, "epoch": 5357} {"train_loss": -26.27652931213379, "global_step": 444640, "epoch": 5357} {"train_loss": -26.5911808013916, "global_step": 444641, "epoch": 5357} {"train_loss": -26.5069580078125, "global_step": 444642, "epoch": 5357} {"train_loss": -26.690122604370117, "global_step": 444643, "epoch": 5357} {"train_loss": -26.9202938079834, "global_step": 444644, "epoch": 5357} {"train_loss": -26.4924373626709, "global_step": 444645, "epoch": 5357} {"train_loss": -26.82195472717285, "global_step": 444646, "epoch": 5357} {"train_loss": -26.400012969970703, "global_step": 444647, "epoch": 5357} {"train_loss": -26.536823272705078, "global_step": 444648, "epoch": 5357} {"train_loss": -26.943729400634766, "global_step": 444649, "epoch": 5357} {"train_loss": -26.90069007873535, "global_step": 444650, "epoch": 5357} {"train_loss": -26.779102325439453, "global_step": 444651, "epoch": 5357} {"train_loss": -26.932153701782227, "global_step": 444652, "epoch": 5357} {"train_loss": -27.01340675354004, "global_step": 444653, "epoch": 5357} {"train_loss": -27.035009384155273, "global_step": 444654, "epoch": 5357} {"train_loss": -26.70284080505371, "global_step": 444655, "epoch": 5357} {"train_loss": -27.163480758666992, "global_step": 444656, "epoch": 5357} {"train_loss": -27.064533233642578, "global_step": 444657, "epoch": 5357} {"train_loss": -26.896427154541016, "global_step": 444658, "epoch": 5357} {"train_loss": -27.228132247924805, "global_step": 444659, "epoch": 5357} {"train_loss": -27.045583724975586, "global_step": 444660, "epoch": 5357} {"train_loss": -26.81951904296875, "global_step": 444661, "epoch": 5357} {"train_loss": -26.713062286376953, "global_step": 444662, "epoch": 5357} {"train_loss": -26.814197540283203, "global_step": 444663, "epoch": 5357} {"train_loss": -26.692697525024414, "global_step": 444664, "epoch": 5357} {"train_loss": -27.08406639099121, "global_step": 444665, "epoch": 5357} {"train_loss": -27.185230255126953, "global_step": 444666, "epoch": 5357} {"train_loss": -26.935754776000977, "global_step": 444667, "epoch": 5357} {"train_loss": -27.01946449279785, "global_step": 444668, "epoch": 5357} {"train_loss": -27.030414581298828, "global_step": 444669, "epoch": 5357} {"train_loss": -27.4002685546875, "global_step": 444670, "epoch": 5357} {"train_loss": -27.02113914489746, "global_step": 444671, "epoch": 5357} {"train_loss": -27.378604888916016, "global_step": 444672, "epoch": 5357} {"train_loss": -26.847156524658203, "global_step": 444673, "epoch": 5357} {"train_loss": -27.23495864868164, "global_step": 444674, "epoch": 5357} {"train_loss": -27.329282760620117, "global_step": 444675, "epoch": 5357} {"train_loss": -26.79570960998535, "global_step": 444676, "epoch": 5357} {"train_loss": -27.136138916015625, "global_step": 444677, "epoch": 5357} {"train_loss": -27.114606857299805, "global_step": 444678, "epoch": 5357} {"train_loss": -26.871313095092773, "global_step": 444679, "epoch": 5357} {"train_loss": -27.4180908203125, "global_step": 444680, "epoch": 5357} {"train_loss": -26.931543350219727, "global_step": 444681, "epoch": 5357} {"train_loss": -26.810667037963867, "global_step": 444682, "epoch": 5357} {"train_loss": -27.26471519470215, "global_step": 444683, "epoch": 5357} {"train_loss": -26.7780818939209, "global_step": 444684, "epoch": 5357} {"train_loss": -27.207422256469727, "global_step": 444685, "epoch": 5357} {"train_loss": -27.016828536987305, "global_step": 444686, "epoch": 5357} {"train_loss": -27.0488338470459, "global_step": 444687, "epoch": 5357} {"train_loss": -26.60489845275879, "global_step": 444688, "epoch": 5357} {"train_loss": -26.872907638549805, "global_step": 444689, "epoch": 5357} {"train_loss": -27.2991886138916, "global_step": 444690, "epoch": 5357} {"train_loss": -27.136356353759766, "global_step": 444691, "epoch": 5357} {"train_loss": -27.042951583862305, "global_step": 444692, "epoch": 5357} {"train_loss": -27.005939483642578, "global_step": 444693, "epoch": 5357} {"train_loss": -27.339933395385742, "global_step": 444694, "epoch": 5357} {"train_loss": -26.822620391845703, "global_step": 444695, "epoch": 5357} {"train_loss": -27.226654052734375, "global_step": 444696, "epoch": 5357} {"train_loss": -26.972578048706055, "global_step": 444697, "epoch": 5357} {"train_loss": -26.966415405273438, "global_step": 444698, "epoch": 5357} {"train_loss": -27.2545223236084, "global_step": 444699, "epoch": 5357} {"train_loss": -27.254505157470703, "global_step": 444700, "epoch": 5357} {"train_loss": -27.179677963256836, "global_step": 444701, "epoch": 5357} {"train_loss": -27.344274520874023, "global_step": 444702, "epoch": 5357} {"train_loss": -27.188907623291016, "global_step": 444703, "epoch": 5357} {"train_loss": -27.111896514892578, "global_step": 444704, "epoch": 5357} {"train_loss": -27.19050407409668, "global_step": 444705, "epoch": 5357} {"train_loss": -27.110563278198242, "global_step": 444706, "epoch": 5357} {"train_loss": -26.97564697265625, "global_step": 444707, "epoch": 5357} {"train_loss": -26.75983238220215, "global_step": 444708, "epoch": 5357} {"train_loss": -27.137298583984375, "global_step": 444709, "epoch": 5357} {"train_loss": -27.16037368774414, "global_step": 444710, "epoch": 5357} {"train_loss": -27.2106990814209, "global_step": 444711, "epoch": 5357} {"train_loss": -27.363880157470703, "global_step": 444712, "epoch": 5357} {"train_loss": -26.88710306925946, "global_step": 444713, "epoch": 5357, "val_loss": 6643362.0} {"train_loss": -26.70537757873535, "global_step": 444714, "epoch": 5358} {"train_loss": -26.2991943359375, "global_step": 444715, "epoch": 5358} {"train_loss": -26.38825035095215, "global_step": 444716, "epoch": 5358} {"train_loss": -25.601993560791016, "global_step": 444717, "epoch": 5358} {"train_loss": -25.811370849609375, "global_step": 444718, "epoch": 5358} {"train_loss": -26.587554931640625, "global_step": 444719, "epoch": 5358} {"train_loss": -26.280414581298828, "global_step": 444720, "epoch": 5358} {"train_loss": -25.657758712768555, "global_step": 444721, "epoch": 5358} {"train_loss": -26.065948486328125, "global_step": 444722, "epoch": 5358} {"train_loss": -26.525724411010742, "global_step": 444723, "epoch": 5358} {"train_loss": -26.13595962524414, "global_step": 444724, "epoch": 5358} {"train_loss": -26.482542037963867, "global_step": 444725, "epoch": 5358} {"train_loss": -26.475452423095703, "global_step": 444726, "epoch": 5358} {"train_loss": -26.64369010925293, "global_step": 444727, "epoch": 5358} {"train_loss": -26.365385055541992, "global_step": 444728, "epoch": 5358} {"train_loss": -26.511804580688477, "global_step": 444729, "epoch": 5358} {"train_loss": -26.359909057617188, "global_step": 444730, "epoch": 5358} {"train_loss": -26.535314559936523, "global_step": 444731, "epoch": 5358} {"train_loss": -26.75299072265625, "global_step": 444732, "epoch": 5358} {"train_loss": -26.836774826049805, "global_step": 444733, "epoch": 5358} {"train_loss": -26.7275390625, "global_step": 444734, "epoch": 5358} {"train_loss": -26.99885368347168, "global_step": 444735, "epoch": 5358} {"train_loss": -26.58368492126465, "global_step": 444736, "epoch": 5358} {"train_loss": -26.651885986328125, "global_step": 444737, "epoch": 5358} {"train_loss": -26.62135124206543, "global_step": 444738, "epoch": 5358} {"train_loss": -26.900720596313477, "global_step": 444739, "epoch": 5358} {"train_loss": -26.87543296813965, "global_step": 444740, "epoch": 5358} {"train_loss": -26.602542877197266, "global_step": 444741, "epoch": 5358} {"train_loss": -26.50653076171875, "global_step": 444742, "epoch": 5358} {"train_loss": -26.81534194946289, "global_step": 444743, "epoch": 5358} {"train_loss": -27.079496383666992, "global_step": 444744, "epoch": 5358} {"train_loss": -26.743423461914062, "global_step": 444745, "epoch": 5358} {"train_loss": -27.052576065063477, "global_step": 444746, "epoch": 5358} {"train_loss": -27.130563735961914, "global_step": 444747, "epoch": 5358} {"train_loss": -26.78143310546875, "global_step": 444748, "epoch": 5358} {"train_loss": -26.484878540039062, "global_step": 444749, "epoch": 5358} {"train_loss": -26.96482276916504, "global_step": 444750, "epoch": 5358} {"train_loss": -26.964771270751953, "global_step": 444751, "epoch": 5358} {"train_loss": -27.372589111328125, "global_step": 444752, "epoch": 5358} {"train_loss": -26.9617862701416, "global_step": 444753, "epoch": 5358} {"train_loss": -27.334491729736328, "global_step": 444754, "epoch": 5358} {"train_loss": -26.94329261779785, "global_step": 444755, "epoch": 5358} {"train_loss": -27.069440841674805, "global_step": 444756, "epoch": 5358} {"train_loss": -27.25527000427246, "global_step": 444757, "epoch": 5358} {"train_loss": -27.0866641998291, "global_step": 444758, "epoch": 5358} {"train_loss": -26.520248413085938, "global_step": 444759, "epoch": 5358} {"train_loss": -26.947290420532227, "global_step": 444760, "epoch": 5358} {"train_loss": -26.727237701416016, "global_step": 444761, "epoch": 5358} {"train_loss": -26.8082332611084, "global_step": 444762, "epoch": 5358} {"train_loss": -27.076078414916992, "global_step": 444763, "epoch": 5358} {"train_loss": -27.236730575561523, "global_step": 444764, "epoch": 5358} {"train_loss": -27.231399536132812, "global_step": 444765, "epoch": 5358} {"train_loss": -26.917821884155273, "global_step": 444766, "epoch": 5358} {"train_loss": -26.85296058654785, "global_step": 444767, "epoch": 5358} {"train_loss": -26.89702796936035, "global_step": 444768, "epoch": 5358} {"train_loss": -26.746763229370117, "global_step": 444769, "epoch": 5358} {"train_loss": -26.67701530456543, "global_step": 444770, "epoch": 5358} {"train_loss": -26.747852325439453, "global_step": 444771, "epoch": 5358} {"train_loss": -27.039716720581055, "global_step": 444772, "epoch": 5358} {"train_loss": -26.948789596557617, "global_step": 444773, "epoch": 5358} {"train_loss": -27.07662010192871, "global_step": 444774, "epoch": 5358} {"train_loss": -27.383193969726562, "global_step": 444775, "epoch": 5358} {"train_loss": -27.286405563354492, "global_step": 444776, "epoch": 5358} {"train_loss": -27.297107696533203, "global_step": 444777, "epoch": 5358} {"train_loss": -26.84712791442871, "global_step": 444778, "epoch": 5358} {"train_loss": -27.257848739624023, "global_step": 444779, "epoch": 5358} {"train_loss": -27.432025909423828, "global_step": 444780, "epoch": 5358} {"train_loss": -27.1282958984375, "global_step": 444781, "epoch": 5358} {"train_loss": -27.034753799438477, "global_step": 444782, "epoch": 5358} {"train_loss": -27.175748825073242, "global_step": 444783, "epoch": 5358} {"train_loss": -27.224218368530273, "global_step": 444784, "epoch": 5358} {"train_loss": -27.3294620513916, "global_step": 444785, "epoch": 5358} {"train_loss": -27.473846435546875, "global_step": 444786, "epoch": 5358} {"train_loss": -27.12067985534668, "global_step": 444787, "epoch": 5358} {"train_loss": -27.051538467407227, "global_step": 444788, "epoch": 5358} {"train_loss": -27.00765037536621, "global_step": 444789, "epoch": 5358} {"train_loss": -27.113662719726562, "global_step": 444790, "epoch": 5358} {"train_loss": -27.001855850219727, "global_step": 444791, "epoch": 5358} {"train_loss": -26.8789005279541, "global_step": 444792, "epoch": 5358} {"train_loss": -27.291982650756836, "global_step": 444793, "epoch": 5358} {"train_loss": -27.106847763061523, "global_step": 444794, "epoch": 5358} {"train_loss": -27.137561798095703, "global_step": 444795, "epoch": 5358} {"train_loss": -26.837670016001507, "global_step": 444796, "epoch": 5358, "val_loss": 6553483.0} {"train_loss": -27.12942886352539, "global_step": 444797, "epoch": 5359} {"train_loss": -26.664575576782227, "global_step": 444798, "epoch": 5359} {"train_loss": -26.600208282470703, "global_step": 444799, "epoch": 5359} {"train_loss": -26.426776885986328, "global_step": 444800, "epoch": 5359} {"train_loss": -26.40631675720215, "global_step": 444801, "epoch": 5359} {"train_loss": -25.951196670532227, "global_step": 444802, "epoch": 5359} {"train_loss": -26.535110473632812, "global_step": 444803, "epoch": 5359} {"train_loss": -26.654743194580078, "global_step": 444804, "epoch": 5359} {"train_loss": -26.476215362548828, "global_step": 444805, "epoch": 5359} {"train_loss": -26.683984756469727, "global_step": 444806, "epoch": 5359} {"train_loss": -26.252944946289062, "global_step": 444807, "epoch": 5359} {"train_loss": -27.222875595092773, "global_step": 444808, "epoch": 5359} {"train_loss": -26.64988136291504, "global_step": 444809, "epoch": 5359} {"train_loss": -26.842756271362305, "global_step": 444810, "epoch": 5359} {"train_loss": -26.88895034790039, "global_step": 444811, "epoch": 5359} {"train_loss": -26.627634048461914, "global_step": 444812, "epoch": 5359} {"train_loss": -27.03609275817871, "global_step": 444813, "epoch": 5359} {"train_loss": -26.787397384643555, "global_step": 444814, "epoch": 5359} {"train_loss": -26.897418975830078, "global_step": 444815, "epoch": 5359} {"train_loss": -26.438947677612305, "global_step": 444816, "epoch": 5359} {"train_loss": -26.918256759643555, "global_step": 444817, "epoch": 5359} {"train_loss": -26.96832847595215, "global_step": 444818, "epoch": 5359} {"train_loss": -27.02166175842285, "global_step": 444819, "epoch": 5359} {"train_loss": -27.191030502319336, "global_step": 444820, "epoch": 5359} {"train_loss": -27.29276466369629, "global_step": 444821, "epoch": 5359} {"train_loss": -26.713937759399414, "global_step": 444822, "epoch": 5359} {"train_loss": -27.017614364624023, "global_step": 444823, "epoch": 5359} {"train_loss": -27.185338973999023, "global_step": 444824, "epoch": 5359} {"train_loss": -27.040613174438477, "global_step": 444825, "epoch": 5359} {"train_loss": -26.999725341796875, "global_step": 444826, "epoch": 5359} {"train_loss": -26.715381622314453, "global_step": 444827, "epoch": 5359} {"train_loss": -27.36195182800293, "global_step": 444828, "epoch": 5359} {"train_loss": -27.1949520111084, "global_step": 444829, "epoch": 5359} {"train_loss": -26.933536529541016, "global_step": 444830, "epoch": 5359} {"train_loss": -27.26047134399414, "global_step": 444831, "epoch": 5359} {"train_loss": -27.18853187561035, "global_step": 444832, "epoch": 5359} {"train_loss": -26.60025978088379, "global_step": 444833, "epoch": 5359} {"train_loss": -27.165430068969727, "global_step": 444834, "epoch": 5359} {"train_loss": -27.183935165405273, "global_step": 444835, "epoch": 5359} {"train_loss": -27.161243438720703, "global_step": 444836, "epoch": 5359} {"train_loss": -27.079736709594727, "global_step": 444837, "epoch": 5359} {"train_loss": -27.115262985229492, "global_step": 444838, "epoch": 5359} {"train_loss": -26.99916648864746, "global_step": 444839, "epoch": 5359} {"train_loss": -27.188995361328125, "global_step": 444840, "epoch": 5359} {"train_loss": -27.35011100769043, "global_step": 444841, "epoch": 5359} {"train_loss": -27.0535831451416, "global_step": 444842, "epoch": 5359} {"train_loss": -26.82061767578125, "global_step": 444843, "epoch": 5359} {"train_loss": -27.19768714904785, "global_step": 444844, "epoch": 5359} {"train_loss": -26.840656280517578, "global_step": 444845, "epoch": 5359} {"train_loss": -27.146427154541016, "global_step": 444846, "epoch": 5359} {"train_loss": -27.24169921875, "global_step": 444847, "epoch": 5359} {"train_loss": -26.94748878479004, "global_step": 444848, "epoch": 5359} {"train_loss": -27.342533111572266, "global_step": 444849, "epoch": 5359} {"train_loss": -27.033979415893555, "global_step": 444850, "epoch": 5359} {"train_loss": -26.918411254882812, "global_step": 444851, "epoch": 5359} {"train_loss": -27.166519165039062, "global_step": 444852, "epoch": 5359} {"train_loss": -26.538354873657227, "global_step": 444853, "epoch": 5359} {"train_loss": -27.203702926635742, "global_step": 444854, "epoch": 5359} {"train_loss": -27.373517990112305, "global_step": 444855, "epoch": 5359} {"train_loss": -27.17217445373535, "global_step": 444856, "epoch": 5359} {"train_loss": -26.831771850585938, "global_step": 444857, "epoch": 5359} {"train_loss": -27.08106803894043, "global_step": 444858, "epoch": 5359} {"train_loss": -27.104455947875977, "global_step": 444859, "epoch": 5359} {"train_loss": -26.834735870361328, "global_step": 444860, "epoch": 5359} {"train_loss": -26.805540084838867, "global_step": 444861, "epoch": 5359} {"train_loss": -26.84678077697754, "global_step": 444862, "epoch": 5359} {"train_loss": -26.809864044189453, "global_step": 444863, "epoch": 5359} {"train_loss": -27.112890243530273, "global_step": 444864, "epoch": 5359} {"train_loss": -26.461124420166016, "global_step": 444865, "epoch": 5359} {"train_loss": -27.16059684753418, "global_step": 444866, "epoch": 5359} {"train_loss": -26.751346588134766, "global_step": 444867, "epoch": 5359} {"train_loss": -27.105497360229492, "global_step": 444868, "epoch": 5359} {"train_loss": -26.96943473815918, "global_step": 444869, "epoch": 5359} {"train_loss": -26.493484497070312, "global_step": 444870, "epoch": 5359} {"train_loss": -26.844823837280273, "global_step": 444871, "epoch": 5359} {"train_loss": -27.017621994018555, "global_step": 444872, "epoch": 5359} {"train_loss": -26.84014892578125, "global_step": 444873, "epoch": 5359} {"train_loss": -26.514432907104492, "global_step": 444874, "epoch": 5359} {"train_loss": -27.1099853515625, "global_step": 444875, "epoch": 5359} {"train_loss": -26.87102699279785, "global_step": 444876, "epoch": 5359} {"train_loss": -27.22466468811035, "global_step": 444877, "epoch": 5359} {"train_loss": -26.818466186523438, "global_step": 444878, "epoch": 5359} {"train_loss": -26.924393596419367, "global_step": 444879, "epoch": 5359, "val_loss": 6602340.5} {"train_loss": -25.735227584838867, "global_step": 444880, "epoch": 5360} {"train_loss": -26.673246383666992, "global_step": 444881, "epoch": 5360} {"train_loss": -25.796253204345703, "global_step": 444882, "epoch": 5360} {"train_loss": -25.622303009033203, "global_step": 444883, "epoch": 5360} {"train_loss": -25.843481063842773, "global_step": 444884, "epoch": 5360} {"train_loss": -26.475250244140625, "global_step": 444885, "epoch": 5360} {"train_loss": -26.053176879882812, "global_step": 444886, "epoch": 5360} {"train_loss": -26.163503646850586, "global_step": 444887, "epoch": 5360} {"train_loss": -26.21622657775879, "global_step": 444888, "epoch": 5360} {"train_loss": -26.421030044555664, "global_step": 444889, "epoch": 5360} {"train_loss": -26.50858497619629, "global_step": 444890, "epoch": 5360} {"train_loss": -26.184926986694336, "global_step": 444891, "epoch": 5360} {"train_loss": -26.472578048706055, "global_step": 444892, "epoch": 5360} {"train_loss": -26.467823028564453, "global_step": 444893, "epoch": 5360} {"train_loss": -26.710657119750977, "global_step": 444894, "epoch": 5360} {"train_loss": -26.299331665039062, "global_step": 444895, "epoch": 5360} {"train_loss": -26.846540451049805, "global_step": 444896, "epoch": 5360} {"train_loss": -26.462202072143555, "global_step": 444897, "epoch": 5360} {"train_loss": -26.50653076171875, "global_step": 444898, "epoch": 5360} {"train_loss": -26.74744987487793, "global_step": 444899, "epoch": 5360} {"train_loss": -26.613306045532227, "global_step": 444900, "epoch": 5360} {"train_loss": -26.871490478515625, "global_step": 444901, "epoch": 5360} {"train_loss": -27.021183013916016, "global_step": 444902, "epoch": 5360} {"train_loss": -26.86927604675293, "global_step": 444903, "epoch": 5360} {"train_loss": -26.70549964904785, "global_step": 444904, "epoch": 5360} {"train_loss": -26.906530380249023, "global_step": 444905, "epoch": 5360} {"train_loss": -26.600311279296875, "global_step": 444906, "epoch": 5360} {"train_loss": -26.898849487304688, "global_step": 444907, "epoch": 5360} {"train_loss": -26.67371940612793, "global_step": 444908, "epoch": 5360} {"train_loss": -26.70814323425293, "global_step": 444909, "epoch": 5360} {"train_loss": -26.92750358581543, "global_step": 444910, "epoch": 5360} {"train_loss": -26.90791130065918, "global_step": 444911, "epoch": 5360} {"train_loss": -26.975421905517578, "global_step": 444912, "epoch": 5360} {"train_loss": -26.689329147338867, "global_step": 444913, "epoch": 5360} {"train_loss": -27.02967643737793, "global_step": 444914, "epoch": 5360} {"train_loss": -27.063398361206055, "global_step": 444915, "epoch": 5360} {"train_loss": -26.970233917236328, "global_step": 444916, "epoch": 5360} {"train_loss": -26.955142974853516, "global_step": 444917, "epoch": 5360} {"train_loss": -26.835620880126953, "global_step": 444918, "epoch": 5360} {"train_loss": -27.09185218811035, "global_step": 444919, "epoch": 5360} {"train_loss": -26.975366592407227, "global_step": 444920, "epoch": 5360} {"train_loss": -27.104522705078125, "global_step": 444921, "epoch": 5360} {"train_loss": -26.933704376220703, "global_step": 444922, "epoch": 5360} {"train_loss": -27.005237579345703, "global_step": 444923, "epoch": 5360} {"train_loss": -26.86957359313965, "global_step": 444924, "epoch": 5360} {"train_loss": -27.109516143798828, "global_step": 444925, "epoch": 5360} {"train_loss": -26.976276397705078, "global_step": 444926, "epoch": 5360} {"train_loss": -27.52199363708496, "global_step": 444927, "epoch": 5360} {"train_loss": -26.608057022094727, "global_step": 444928, "epoch": 5360} {"train_loss": -27.05126953125, "global_step": 444929, "epoch": 5360} {"train_loss": -27.138599395751953, "global_step": 444930, "epoch": 5360} {"train_loss": -27.169504165649414, "global_step": 444931, "epoch": 5360} {"train_loss": -27.116779327392578, "global_step": 444932, "epoch": 5360} {"train_loss": -26.911039352416992, "global_step": 444933, "epoch": 5360} {"train_loss": -27.215255737304688, "global_step": 444934, "epoch": 5360} {"train_loss": -27.150775909423828, "global_step": 444935, "epoch": 5360} {"train_loss": -26.6837215423584, "global_step": 444936, "epoch": 5360} {"train_loss": -26.69091796875, "global_step": 444937, "epoch": 5360} {"train_loss": -27.195642471313477, "global_step": 444938, "epoch": 5360} {"train_loss": -26.714435577392578, "global_step": 444939, "epoch": 5360} {"train_loss": -27.213306427001953, "global_step": 444940, "epoch": 5360} {"train_loss": -27.44866371154785, "global_step": 444941, "epoch": 5360} {"train_loss": -26.678791046142578, "global_step": 444942, "epoch": 5360} {"train_loss": -27.115066528320312, "global_step": 444943, "epoch": 5360} {"train_loss": -26.932662963867188, "global_step": 444944, "epoch": 5360} {"train_loss": -26.891407012939453, "global_step": 444945, "epoch": 5360} {"train_loss": -27.16010093688965, "global_step": 444946, "epoch": 5360} {"train_loss": -27.14495277404785, "global_step": 444947, "epoch": 5360} {"train_loss": -26.859365463256836, "global_step": 444948, "epoch": 5360} {"train_loss": -26.959674835205078, "global_step": 444949, "epoch": 5360} {"train_loss": -27.35626220703125, "global_step": 444950, "epoch": 5360} {"train_loss": -26.543378829956055, "global_step": 444951, "epoch": 5360} {"train_loss": -26.65386390686035, "global_step": 444952, "epoch": 5360} {"train_loss": -27.020923614501953, "global_step": 444953, "epoch": 5360} {"train_loss": -27.28565788269043, "global_step": 444954, "epoch": 5360} {"train_loss": -27.013675689697266, "global_step": 444955, "epoch": 5360} {"train_loss": -27.266752243041992, "global_step": 444956, "epoch": 5360} {"train_loss": -27.10660743713379, "global_step": 444957, "epoch": 5360} {"train_loss": -26.532323837280273, "global_step": 444958, "epoch": 5360} {"train_loss": -26.927356719970703, "global_step": 444959, "epoch": 5360} {"train_loss": -26.75345230102539, "global_step": 444960, "epoch": 5360} {"train_loss": -27.202070236206055, "global_step": 444961, "epoch": 5360} {"train_loss": -26.807080004588666, "global_step": 444962, "epoch": 5360, "val_loss": 6576820.0} {"train_loss": -26.503454208374023, "global_step": 444963, "epoch": 5361} {"train_loss": -26.623126983642578, "global_step": 444964, "epoch": 5361} {"train_loss": -26.292621612548828, "global_step": 444965, "epoch": 5361} {"train_loss": -26.535629272460938, "global_step": 444966, "epoch": 5361} {"train_loss": -26.63764762878418, "global_step": 444967, "epoch": 5361} {"train_loss": -25.930219650268555, "global_step": 444968, "epoch": 5361} {"train_loss": -27.111440658569336, "global_step": 444969, "epoch": 5361} {"train_loss": -26.371362686157227, "global_step": 444970, "epoch": 5361} {"train_loss": -26.550918579101562, "global_step": 444971, "epoch": 5361} {"train_loss": -26.26263999938965, "global_step": 444972, "epoch": 5361} {"train_loss": -27.03510856628418, "global_step": 444973, "epoch": 5361} {"train_loss": -26.676233291625977, "global_step": 444974, "epoch": 5361} {"train_loss": -26.651941299438477, "global_step": 444975, "epoch": 5361} {"train_loss": -27.178842544555664, "global_step": 444976, "epoch": 5361} {"train_loss": -26.9986572265625, "global_step": 444977, "epoch": 5361} {"train_loss": -26.945541381835938, "global_step": 444978, "epoch": 5361} {"train_loss": -26.953393936157227, "global_step": 444979, "epoch": 5361} {"train_loss": -26.8179874420166, "global_step": 444980, "epoch": 5361} {"train_loss": -26.950061798095703, "global_step": 444981, "epoch": 5361} {"train_loss": -27.256982803344727, "global_step": 444982, "epoch": 5361} {"train_loss": -27.0642147064209, "global_step": 444983, "epoch": 5361} {"train_loss": -26.84710121154785, "global_step": 444984, "epoch": 5361} {"train_loss": -27.151569366455078, "global_step": 444985, "epoch": 5361} {"train_loss": -26.678714752197266, "global_step": 444986, "epoch": 5361} {"train_loss": -27.150222778320312, "global_step": 444987, "epoch": 5361} {"train_loss": -26.91643714904785, "global_step": 444988, "epoch": 5361} {"train_loss": -26.772932052612305, "global_step": 444989, "epoch": 5361} {"train_loss": -26.803266525268555, "global_step": 444990, "epoch": 5361} {"train_loss": -27.12091064453125, "global_step": 444991, "epoch": 5361} {"train_loss": -27.4758358001709, "global_step": 444992, "epoch": 5361} {"train_loss": -27.04982566833496, "global_step": 444993, "epoch": 5361} {"train_loss": -26.896100997924805, "global_step": 444994, "epoch": 5361} {"train_loss": -26.917728424072266, "global_step": 444995, "epoch": 5361} {"train_loss": -27.151891708374023, "global_step": 444996, "epoch": 5361} {"train_loss": -26.6986026763916, "global_step": 444997, "epoch": 5361} {"train_loss": -27.332456588745117, "global_step": 444998, "epoch": 5361} {"train_loss": -26.856922149658203, "global_step": 444999, "epoch": 5361} {"train_loss": -27.053335189819336, "global_step": 445000, "epoch": 5361} {"train_loss": -27.316059112548828, "global_step": 445001, "epoch": 5361} {"train_loss": -26.93743896484375, "global_step": 445002, "epoch": 5361} {"train_loss": -27.12325096130371, "global_step": 445003, "epoch": 5361} {"train_loss": -26.81379508972168, "global_step": 445004, "epoch": 5361} {"train_loss": -27.12079429626465, "global_step": 445005, "epoch": 5361} {"train_loss": -27.071462631225586, "global_step": 445006, "epoch": 5361} {"train_loss": -27.092588424682617, "global_step": 445007, "epoch": 5361} {"train_loss": -26.945892333984375, "global_step": 445008, "epoch": 5361} {"train_loss": -26.721471786499023, "global_step": 445009, "epoch": 5361} {"train_loss": -26.55575942993164, "global_step": 445010, "epoch": 5361} {"train_loss": -27.28289794921875, "global_step": 445011, "epoch": 5361} {"train_loss": -27.043527603149414, "global_step": 445012, "epoch": 5361} {"train_loss": -27.24880027770996, "global_step": 445013, "epoch": 5361} {"train_loss": -26.801050186157227, "global_step": 445014, "epoch": 5361} {"train_loss": -27.135099411010742, "global_step": 445015, "epoch": 5361} {"train_loss": -27.17410659790039, "global_step": 445016, "epoch": 5361} {"train_loss": -27.07047462463379, "global_step": 445017, "epoch": 5361} {"train_loss": -27.179677963256836, "global_step": 445018, "epoch": 5361} {"train_loss": -27.136383056640625, "global_step": 445019, "epoch": 5361} {"train_loss": -26.68776512145996, "global_step": 445020, "epoch": 5361} {"train_loss": -26.7492733001709, "global_step": 445021, "epoch": 5361} {"train_loss": -27.1292724609375, "global_step": 445022, "epoch": 5361} {"train_loss": -27.122350692749023, "global_step": 445023, "epoch": 5361} {"train_loss": -27.07611656188965, "global_step": 445024, "epoch": 5361} {"train_loss": -27.11573600769043, "global_step": 445025, "epoch": 5361} {"train_loss": -27.285491943359375, "global_step": 445026, "epoch": 5361} {"train_loss": -27.222415924072266, "global_step": 445027, "epoch": 5361} {"train_loss": -27.1466064453125, "global_step": 445028, "epoch": 5361} {"train_loss": -27.31551170349121, "global_step": 445029, "epoch": 5361} {"train_loss": -27.094867706298828, "global_step": 445030, "epoch": 5361} {"train_loss": -27.055816650390625, "global_step": 445031, "epoch": 5361} {"train_loss": -27.0225772857666, "global_step": 445032, "epoch": 5361} {"train_loss": -26.827301025390625, "global_step": 445033, "epoch": 5361} {"train_loss": -26.90870475769043, "global_step": 445034, "epoch": 5361} {"train_loss": -26.92633628845215, "global_step": 445035, "epoch": 5361} {"train_loss": -27.16766929626465, "global_step": 445036, "epoch": 5361} {"train_loss": -27.064611434936523, "global_step": 445037, "epoch": 5361} {"train_loss": -26.844482421875, "global_step": 445038, "epoch": 5361} {"train_loss": -26.517414093017578, "global_step": 445039, "epoch": 5361} {"train_loss": -26.895450592041016, "global_step": 445040, "epoch": 5361} {"train_loss": -26.89882469177246, "global_step": 445041, "epoch": 5361} {"train_loss": -27.135038375854492, "global_step": 445042, "epoch": 5361} {"train_loss": -27.116575241088867, "global_step": 445043, "epoch": 5361} {"train_loss": -26.947540283203125, "global_step": 445044, "epoch": 5361} {"train_loss": -26.93176641808935, "global_step": 445045, "epoch": 5361, "val_loss": 6537818.0} {"train_loss": -25.813562393188477, "global_step": 445046, "epoch": 5362} {"train_loss": -26.779706954956055, "global_step": 445047, "epoch": 5362} {"train_loss": -26.524011611938477, "global_step": 445048, "epoch": 5362} {"train_loss": -26.237348556518555, "global_step": 445049, "epoch": 5362} {"train_loss": -26.591745376586914, "global_step": 445050, "epoch": 5362} {"train_loss": -26.722421646118164, "global_step": 445051, "epoch": 5362} {"train_loss": -26.770841598510742, "global_step": 445052, "epoch": 5362} {"train_loss": -26.464460372924805, "global_step": 445053, "epoch": 5362} {"train_loss": -27.205997467041016, "global_step": 445054, "epoch": 5362} {"train_loss": -26.715423583984375, "global_step": 445055, "epoch": 5362} {"train_loss": -26.74956703186035, "global_step": 445056, "epoch": 5362} {"train_loss": -26.875228881835938, "global_step": 445057, "epoch": 5362} {"train_loss": -26.837207794189453, "global_step": 445058, "epoch": 5362} {"train_loss": -26.584613800048828, "global_step": 445059, "epoch": 5362} {"train_loss": -26.585607528686523, "global_step": 445060, "epoch": 5362} {"train_loss": -26.419769287109375, "global_step": 445061, "epoch": 5362} {"train_loss": -26.714298248291016, "global_step": 445062, "epoch": 5362} {"train_loss": -26.689176559448242, "global_step": 445063, "epoch": 5362} {"train_loss": -26.81354331970215, "global_step": 445064, "epoch": 5362} {"train_loss": -26.7531681060791, "global_step": 445065, "epoch": 5362} {"train_loss": -27.037841796875, "global_step": 445066, "epoch": 5362} {"train_loss": -26.820240020751953, "global_step": 445067, "epoch": 5362} {"train_loss": -27.190906524658203, "global_step": 445068, "epoch": 5362} {"train_loss": -27.208343505859375, "global_step": 445069, "epoch": 5362} {"train_loss": -26.739431381225586, "global_step": 445070, "epoch": 5362} {"train_loss": -26.808795928955078, "global_step": 445071, "epoch": 5362} {"train_loss": -27.03486442565918, "global_step": 445072, "epoch": 5362} {"train_loss": -27.20566749572754, "global_step": 445073, "epoch": 5362} {"train_loss": -26.95206642150879, "global_step": 445074, "epoch": 5362} {"train_loss": -26.915197372436523, "global_step": 445075, "epoch": 5362} {"train_loss": -27.076766967773438, "global_step": 445076, "epoch": 5362} {"train_loss": -26.937397003173828, "global_step": 445077, "epoch": 5362} {"train_loss": -27.255834579467773, "global_step": 445078, "epoch": 5362} {"train_loss": -26.82577896118164, "global_step": 445079, "epoch": 5362} {"train_loss": -27.23028564453125, "global_step": 445080, "epoch": 5362} {"train_loss": -26.94171142578125, "global_step": 445081, "epoch": 5362} {"train_loss": -26.70924186706543, "global_step": 445082, "epoch": 5362} {"train_loss": -27.264036178588867, "global_step": 445083, "epoch": 5362} {"train_loss": -27.041675567626953, "global_step": 445084, "epoch": 5362} {"train_loss": -27.10031509399414, "global_step": 445085, "epoch": 5362} {"train_loss": -27.07126808166504, "global_step": 445086, "epoch": 5362} {"train_loss": -26.963098526000977, "global_step": 445087, "epoch": 5362} {"train_loss": -26.862720489501953, "global_step": 445088, "epoch": 5362} {"train_loss": -27.16493034362793, "global_step": 445089, "epoch": 5362} {"train_loss": -26.697790145874023, "global_step": 445090, "epoch": 5362} {"train_loss": -26.792999267578125, "global_step": 445091, "epoch": 5362} {"train_loss": -26.54131507873535, "global_step": 445092, "epoch": 5362} {"train_loss": -27.07756996154785, "global_step": 445093, "epoch": 5362} {"train_loss": -26.984100341796875, "global_step": 445094, "epoch": 5362} {"train_loss": -27.079084396362305, "global_step": 445095, "epoch": 5362} {"train_loss": -27.469223022460938, "global_step": 445096, "epoch": 5362} {"train_loss": -27.124719619750977, "global_step": 445097, "epoch": 5362} {"train_loss": -27.220352172851562, "global_step": 445098, "epoch": 5362} {"train_loss": -27.073251724243164, "global_step": 445099, "epoch": 5362} {"train_loss": -27.032150268554688, "global_step": 445100, "epoch": 5362} {"train_loss": -27.118743896484375, "global_step": 445101, "epoch": 5362} {"train_loss": -26.844526290893555, "global_step": 445102, "epoch": 5362} {"train_loss": -26.998779296875, "global_step": 445103, "epoch": 5362} {"train_loss": -26.986684799194336, "global_step": 445104, "epoch": 5362} {"train_loss": -27.138641357421875, "global_step": 445105, "epoch": 5362} {"train_loss": -27.085493087768555, "global_step": 445106, "epoch": 5362} {"train_loss": -26.576370239257812, "global_step": 445107, "epoch": 5362} {"train_loss": -26.7309513092041, "global_step": 445108, "epoch": 5362} {"train_loss": -26.577489852905273, "global_step": 445109, "epoch": 5362} {"train_loss": -26.90586280822754, "global_step": 445110, "epoch": 5362} {"train_loss": -27.3656005859375, "global_step": 445111, "epoch": 5362} {"train_loss": -26.69732666015625, "global_step": 445112, "epoch": 5362} {"train_loss": -26.857309341430664, "global_step": 445113, "epoch": 5362} {"train_loss": -26.931909561157227, "global_step": 445114, "epoch": 5362} {"train_loss": -26.302734375, "global_step": 445115, "epoch": 5362} {"train_loss": -26.450820922851562, "global_step": 445116, "epoch": 5362} {"train_loss": -25.87806510925293, "global_step": 445117, "epoch": 5362} {"train_loss": -26.38762855529785, "global_step": 445118, "epoch": 5362} {"train_loss": -26.111331939697266, "global_step": 445119, "epoch": 5362} {"train_loss": -26.900531768798828, "global_step": 445120, "epoch": 5362} {"train_loss": -26.48086929321289, "global_step": 445121, "epoch": 5362} {"train_loss": -26.6629638671875, "global_step": 445122, "epoch": 5362} {"train_loss": -26.411787033081055, "global_step": 445123, "epoch": 5362} {"train_loss": -26.599746704101562, "global_step": 445124, "epoch": 5362} {"train_loss": -26.81104850769043, "global_step": 445125, "epoch": 5362} {"train_loss": -26.885034561157227, "global_step": 445126, "epoch": 5362} {"train_loss": -26.831085205078125, "global_step": 445127, "epoch": 5362} {"train_loss": -26.803243200462983, "global_step": 445128, "epoch": 5362, "val_loss": 6529961.5} {"train_loss": -25.236053466796875, "global_step": 445129, "epoch": 5363} {"train_loss": -25.421152114868164, "global_step": 445130, "epoch": 5363} {"train_loss": -26.42083740234375, "global_step": 445131, "epoch": 5363} {"train_loss": -25.77130699157715, "global_step": 445132, "epoch": 5363} {"train_loss": -26.30352210998535, "global_step": 445133, "epoch": 5363} {"train_loss": -25.757638931274414, "global_step": 445134, "epoch": 5363} {"train_loss": -26.5052433013916, "global_step": 445135, "epoch": 5363} {"train_loss": -26.40903091430664, "global_step": 445136, "epoch": 5363} {"train_loss": -26.249359130859375, "global_step": 445137, "epoch": 5363} {"train_loss": -26.396886825561523, "global_step": 445138, "epoch": 5363} {"train_loss": -26.205341339111328, "global_step": 445139, "epoch": 5363} {"train_loss": -26.71546745300293, "global_step": 445140, "epoch": 5363} {"train_loss": -26.61333656311035, "global_step": 445141, "epoch": 5363} {"train_loss": -26.634714126586914, "global_step": 445142, "epoch": 5363} {"train_loss": -26.520421981811523, "global_step": 445143, "epoch": 5363} {"train_loss": -26.576358795166016, "global_step": 445144, "epoch": 5363} {"train_loss": -26.432302474975586, "global_step": 445145, "epoch": 5363} {"train_loss": -26.78004264831543, "global_step": 445146, "epoch": 5363} {"train_loss": -26.64042091369629, "global_step": 445147, "epoch": 5363} {"train_loss": -26.71453857421875, "global_step": 445148, "epoch": 5363} {"train_loss": -26.867752075195312, "global_step": 445149, "epoch": 5363} {"train_loss": -26.76612663269043, "global_step": 445150, "epoch": 5363} {"train_loss": -26.75180435180664, "global_step": 445151, "epoch": 5363} {"train_loss": -26.72369384765625, "global_step": 445152, "epoch": 5363} {"train_loss": -26.73295021057129, "global_step": 445153, "epoch": 5363} {"train_loss": -26.919111251831055, "global_step": 445154, "epoch": 5363} {"train_loss": -27.093442916870117, "global_step": 445155, "epoch": 5363} {"train_loss": -27.118000030517578, "global_step": 445156, "epoch": 5363} {"train_loss": -26.991392135620117, "global_step": 445157, "epoch": 5363} {"train_loss": -26.979089736938477, "global_step": 445158, "epoch": 5363} {"train_loss": -27.0743408203125, "global_step": 445159, "epoch": 5363} {"train_loss": -27.17054557800293, "global_step": 445160, "epoch": 5363} {"train_loss": -27.062274932861328, "global_step": 445161, "epoch": 5363} {"train_loss": -27.106399536132812, "global_step": 445162, "epoch": 5363} {"train_loss": -27.016647338867188, "global_step": 445163, "epoch": 5363} {"train_loss": -27.0700740814209, "global_step": 445164, "epoch": 5363} {"train_loss": -26.707571029663086, "global_step": 445165, "epoch": 5363} {"train_loss": -27.19026756286621, "global_step": 445166, "epoch": 5363} {"train_loss": -27.057294845581055, "global_step": 445167, "epoch": 5363} {"train_loss": -27.00727653503418, "global_step": 445168, "epoch": 5363} {"train_loss": -26.951868057250977, "global_step": 445169, "epoch": 5363} {"train_loss": -27.063953399658203, "global_step": 445170, "epoch": 5363} {"train_loss": -26.543088912963867, "global_step": 445171, "epoch": 5363} {"train_loss": -27.31867790222168, "global_step": 445172, "epoch": 5363} {"train_loss": -27.2635440826416, "global_step": 445173, "epoch": 5363} {"train_loss": -26.93048095703125, "global_step": 445174, "epoch": 5363} {"train_loss": -27.192157745361328, "global_step": 445175, "epoch": 5363} {"train_loss": -27.187763214111328, "global_step": 445176, "epoch": 5363} {"train_loss": -27.21417236328125, "global_step": 445177, "epoch": 5363} {"train_loss": -27.373544692993164, "global_step": 445178, "epoch": 5363} {"train_loss": -27.233442306518555, "global_step": 445179, "epoch": 5363} {"train_loss": -27.2368221282959, "global_step": 445180, "epoch": 5363} {"train_loss": -26.877222061157227, "global_step": 445181, "epoch": 5363} {"train_loss": -26.676345825195312, "global_step": 445182, "epoch": 5363} {"train_loss": -27.10308265686035, "global_step": 445183, "epoch": 5363} {"train_loss": -27.038660049438477, "global_step": 445184, "epoch": 5363} {"train_loss": -26.440168380737305, "global_step": 445185, "epoch": 5363} {"train_loss": -27.2729434967041, "global_step": 445186, "epoch": 5363} {"train_loss": -27.255905151367188, "global_step": 445187, "epoch": 5363} {"train_loss": -27.60129737854004, "global_step": 445188, "epoch": 5363} {"train_loss": -26.713275909423828, "global_step": 445189, "epoch": 5363} {"train_loss": -26.67667579650879, "global_step": 445190, "epoch": 5363} {"train_loss": -26.538137435913086, "global_step": 445191, "epoch": 5363} {"train_loss": -26.738967895507812, "global_step": 445192, "epoch": 5363} {"train_loss": -26.908344268798828, "global_step": 445193, "epoch": 5363} {"train_loss": -26.230676651000977, "global_step": 445194, "epoch": 5363} {"train_loss": -26.15308952331543, "global_step": 445195, "epoch": 5363} {"train_loss": -27.044189453125, "global_step": 445196, "epoch": 5363} {"train_loss": -26.891027450561523, "global_step": 445197, "epoch": 5363} {"train_loss": -26.91280174255371, "global_step": 445198, "epoch": 5363} {"train_loss": -26.898401260375977, "global_step": 445199, "epoch": 5363} {"train_loss": -26.716388702392578, "global_step": 445200, "epoch": 5363} {"train_loss": -26.91888999938965, "global_step": 445201, "epoch": 5363} {"train_loss": -27.269519805908203, "global_step": 445202, "epoch": 5363} {"train_loss": -26.778717041015625, "global_step": 445203, "epoch": 5363} {"train_loss": -27.05129051208496, "global_step": 445204, "epoch": 5363} {"train_loss": -26.518041610717773, "global_step": 445205, "epoch": 5363} {"train_loss": -26.898710250854492, "global_step": 445206, "epoch": 5363} {"train_loss": -27.295166015625, "global_step": 445207, "epoch": 5363} {"train_loss": -27.2060604095459, "global_step": 445208, "epoch": 5363} {"train_loss": -26.799169540405273, "global_step": 445209, "epoch": 5363} {"train_loss": -26.8453369140625, "global_step": 445210, "epoch": 5363} {"train_loss": -26.811604924948817, "global_step": 445211, "epoch": 5363, "val_loss": 6577418.5} {"train_loss": -26.687047958374023, "global_step": 445212, "epoch": 5364} {"train_loss": -26.409683227539062, "global_step": 445213, "epoch": 5364} {"train_loss": -25.679691314697266, "global_step": 445214, "epoch": 5364} {"train_loss": -25.33742904663086, "global_step": 445215, "epoch": 5364} {"train_loss": -25.154239654541016, "global_step": 445216, "epoch": 5364} {"train_loss": -26.46595573425293, "global_step": 445217, "epoch": 5364} {"train_loss": -26.324588775634766, "global_step": 445218, "epoch": 5364} {"train_loss": -26.2659854888916, "global_step": 445219, "epoch": 5364} {"train_loss": -26.125762939453125, "global_step": 445220, "epoch": 5364} {"train_loss": -26.8331298828125, "global_step": 445221, "epoch": 5364} {"train_loss": -26.636159896850586, "global_step": 445222, "epoch": 5364} {"train_loss": -26.8450870513916, "global_step": 445223, "epoch": 5364} {"train_loss": -26.42234230041504, "global_step": 445224, "epoch": 5364} {"train_loss": -26.746374130249023, "global_step": 445225, "epoch": 5364} {"train_loss": -27.064416885375977, "global_step": 445226, "epoch": 5364} {"train_loss": -27.026391983032227, "global_step": 445227, "epoch": 5364} {"train_loss": -26.994373321533203, "global_step": 445228, "epoch": 5364} {"train_loss": -26.72247314453125, "global_step": 445229, "epoch": 5364} {"train_loss": -26.465560913085938, "global_step": 445230, "epoch": 5364} {"train_loss": -26.761890411376953, "global_step": 445231, "epoch": 5364} {"train_loss": -26.878564834594727, "global_step": 445232, "epoch": 5364} {"train_loss": -27.016178131103516, "global_step": 445233, "epoch": 5364} {"train_loss": -26.8864803314209, "global_step": 445234, "epoch": 5364} {"train_loss": -26.504135131835938, "global_step": 445235, "epoch": 5364} {"train_loss": -27.192340850830078, "global_step": 445236, "epoch": 5364} {"train_loss": -26.93564224243164, "global_step": 445237, "epoch": 5364} {"train_loss": -26.940719604492188, "global_step": 445238, "epoch": 5364} {"train_loss": -26.718915939331055, "global_step": 445239, "epoch": 5364} {"train_loss": -26.897653579711914, "global_step": 445240, "epoch": 5364} {"train_loss": -27.038803100585938, "global_step": 445241, "epoch": 5364} {"train_loss": -26.897125244140625, "global_step": 445242, "epoch": 5364} {"train_loss": -26.966947555541992, "global_step": 445243, "epoch": 5364} {"train_loss": -27.145090103149414, "global_step": 445244, "epoch": 5364} {"train_loss": -26.960363388061523, "global_step": 445245, "epoch": 5364} {"train_loss": -26.866262435913086, "global_step": 445246, "epoch": 5364} {"train_loss": -27.04852867126465, "global_step": 445247, "epoch": 5364} {"train_loss": -26.79334831237793, "global_step": 445248, "epoch": 5364} {"train_loss": -26.954187393188477, "global_step": 445249, "epoch": 5364} {"train_loss": -26.711715698242188, "global_step": 445250, "epoch": 5364} {"train_loss": -27.28773307800293, "global_step": 445251, "epoch": 5364} {"train_loss": -26.838415145874023, "global_step": 445252, "epoch": 5364} {"train_loss": -26.882080078125, "global_step": 445253, "epoch": 5364} {"train_loss": -26.59148597717285, "global_step": 445254, "epoch": 5364} {"train_loss": -26.6641788482666, "global_step": 445255, "epoch": 5364} {"train_loss": -26.73560905456543, "global_step": 445256, "epoch": 5364} {"train_loss": -27.014394760131836, "global_step": 445257, "epoch": 5364} {"train_loss": -27.313159942626953, "global_step": 445258, "epoch": 5364} {"train_loss": -26.790180206298828, "global_step": 445259, "epoch": 5364} {"train_loss": -26.320463180541992, "global_step": 445260, "epoch": 5364} {"train_loss": -26.60066032409668, "global_step": 445261, "epoch": 5364} {"train_loss": -26.46612548828125, "global_step": 445262, "epoch": 5364} {"train_loss": -26.95488929748535, "global_step": 445263, "epoch": 5364} {"train_loss": -26.827939987182617, "global_step": 445264, "epoch": 5364} {"train_loss": -26.45222282409668, "global_step": 445265, "epoch": 5364} {"train_loss": -26.78348159790039, "global_step": 445266, "epoch": 5364} {"train_loss": -27.25819206237793, "global_step": 445267, "epoch": 5364} {"train_loss": -27.09637451171875, "global_step": 445268, "epoch": 5364} {"train_loss": -26.706079483032227, "global_step": 445269, "epoch": 5364} {"train_loss": -26.614309310913086, "global_step": 445270, "epoch": 5364} {"train_loss": -26.90459632873535, "global_step": 445271, "epoch": 5364} {"train_loss": -26.96932029724121, "global_step": 445272, "epoch": 5364} {"train_loss": -26.897567749023438, "global_step": 445273, "epoch": 5364} {"train_loss": -26.8785400390625, "global_step": 445274, "epoch": 5364} {"train_loss": -27.028100967407227, "global_step": 445275, "epoch": 5364} {"train_loss": -26.918603897094727, "global_step": 445276, "epoch": 5364} {"train_loss": -26.89072608947754, "global_step": 445277, "epoch": 5364} {"train_loss": -26.608896255493164, "global_step": 445278, "epoch": 5364} {"train_loss": -26.7039737701416, "global_step": 445279, "epoch": 5364} {"train_loss": -26.73213768005371, "global_step": 445280, "epoch": 5364} {"train_loss": -26.707700729370117, "global_step": 445281, "epoch": 5364} {"train_loss": -26.93377113342285, "global_step": 445282, "epoch": 5364} {"train_loss": -26.95606803894043, "global_step": 445283, "epoch": 5364} {"train_loss": -26.834522247314453, "global_step": 445284, "epoch": 5364} {"train_loss": -26.920501708984375, "global_step": 445285, "epoch": 5364} {"train_loss": -27.06452751159668, "global_step": 445286, "epoch": 5364} {"train_loss": -27.08465003967285, "global_step": 445287, "epoch": 5364} {"train_loss": -27.275293350219727, "global_step": 445288, "epoch": 5364} {"train_loss": -26.897314071655273, "global_step": 445289, "epoch": 5364} {"train_loss": -26.8518009185791, "global_step": 445290, "epoch": 5364} {"train_loss": -26.9993896484375, "global_step": 445291, "epoch": 5364} {"train_loss": -27.356748580932617, "global_step": 445292, "epoch": 5364} {"train_loss": -27.379541397094727, "global_step": 445293, "epoch": 5364} {"train_loss": -26.792165526424547, "global_step": 445294, "epoch": 5364, "val_loss": 6626570.5} {"train_loss": -25.84299087524414, "global_step": 445295, "epoch": 5365} {"train_loss": -25.41840171813965, "global_step": 445296, "epoch": 5365} {"train_loss": -25.412160873413086, "global_step": 445297, "epoch": 5365} {"train_loss": -26.25568199157715, "global_step": 445298, "epoch": 5365} {"train_loss": -26.405689239501953, "global_step": 445299, "epoch": 5365} {"train_loss": -26.030187606811523, "global_step": 445300, "epoch": 5365} {"train_loss": -26.113813400268555, "global_step": 445301, "epoch": 5365} {"train_loss": -26.674829483032227, "global_step": 445302, "epoch": 5365} {"train_loss": -26.459030151367188, "global_step": 445303, "epoch": 5365} {"train_loss": -27.03022575378418, "global_step": 445304, "epoch": 5365} {"train_loss": -26.703657150268555, "global_step": 445305, "epoch": 5365} {"train_loss": -26.617517471313477, "global_step": 445306, "epoch": 5365} {"train_loss": -26.862030029296875, "global_step": 445307, "epoch": 5365} {"train_loss": -26.467086791992188, "global_step": 445308, "epoch": 5365} {"train_loss": -26.847604751586914, "global_step": 445309, "epoch": 5365} {"train_loss": -26.68171501159668, "global_step": 445310, "epoch": 5365} {"train_loss": -26.605915069580078, "global_step": 445311, "epoch": 5365} {"train_loss": -26.7526798248291, "global_step": 445312, "epoch": 5365} {"train_loss": -26.34647560119629, "global_step": 445313, "epoch": 5365} {"train_loss": -26.862964630126953, "global_step": 445314, "epoch": 5365} {"train_loss": -26.71152114868164, "global_step": 445315, "epoch": 5365} {"train_loss": -26.451263427734375, "global_step": 445316, "epoch": 5365} {"train_loss": -27.05246353149414, "global_step": 445317, "epoch": 5365} {"train_loss": -26.60491943359375, "global_step": 445318, "epoch": 5365} {"train_loss": -27.15411376953125, "global_step": 445319, "epoch": 5365} {"train_loss": -26.9332275390625, "global_step": 445320, "epoch": 5365} {"train_loss": -26.74384880065918, "global_step": 445321, "epoch": 5365} {"train_loss": -26.92633628845215, "global_step": 445322, "epoch": 5365} {"train_loss": -27.0644588470459, "global_step": 445323, "epoch": 5365} {"train_loss": -26.747800827026367, "global_step": 445324, "epoch": 5365} {"train_loss": -27.360553741455078, "global_step": 445325, "epoch": 5365} {"train_loss": -27.28034019470215, "global_step": 445326, "epoch": 5365} {"train_loss": -26.9096736907959, "global_step": 445327, "epoch": 5365} {"train_loss": -26.82013511657715, "global_step": 445328, "epoch": 5365} {"train_loss": -27.19757652282715, "global_step": 445329, "epoch": 5365} {"train_loss": -26.952478408813477, "global_step": 445330, "epoch": 5365} {"train_loss": -27.289697647094727, "global_step": 445331, "epoch": 5365} {"train_loss": -26.641712188720703, "global_step": 445332, "epoch": 5365} {"train_loss": -26.722949981689453, "global_step": 445333, "epoch": 5365} {"train_loss": -27.07329750061035, "global_step": 445334, "epoch": 5365} {"train_loss": -26.833505630493164, "global_step": 445335, "epoch": 5365} {"train_loss": -27.115324020385742, "global_step": 445336, "epoch": 5365} {"train_loss": -26.6453857421875, "global_step": 445337, "epoch": 5365} {"train_loss": -26.967321395874023, "global_step": 445338, "epoch": 5365} {"train_loss": -26.92447853088379, "global_step": 445339, "epoch": 5365} {"train_loss": -26.932214736938477, "global_step": 445340, "epoch": 5365} {"train_loss": -27.025653839111328, "global_step": 445341, "epoch": 5365} {"train_loss": -26.85141372680664, "global_step": 445342, "epoch": 5365} {"train_loss": -27.16829490661621, "global_step": 445343, "epoch": 5365} {"train_loss": -27.048681259155273, "global_step": 445344, "epoch": 5365} {"train_loss": -26.948530197143555, "global_step": 445345, "epoch": 5365} {"train_loss": -26.836750030517578, "global_step": 445346, "epoch": 5365} {"train_loss": -26.554309844970703, "global_step": 445347, "epoch": 5365} {"train_loss": -27.175989151000977, "global_step": 445348, "epoch": 5365} {"train_loss": -26.947113037109375, "global_step": 445349, "epoch": 5365} {"train_loss": -27.229141235351562, "global_step": 445350, "epoch": 5365} {"train_loss": -26.9134464263916, "global_step": 445351, "epoch": 5365} {"train_loss": -26.73831558227539, "global_step": 445352, "epoch": 5365} {"train_loss": -27.299962997436523, "global_step": 445353, "epoch": 5365} {"train_loss": -27.45062255859375, "global_step": 445354, "epoch": 5365} {"train_loss": -27.333105087280273, "global_step": 445355, "epoch": 5365} {"train_loss": -26.727941513061523, "global_step": 445356, "epoch": 5365} {"train_loss": -26.924060821533203, "global_step": 445357, "epoch": 5365} {"train_loss": -26.856735229492188, "global_step": 445358, "epoch": 5365} {"train_loss": -27.277006149291992, "global_step": 445359, "epoch": 5365} {"train_loss": -27.402204513549805, "global_step": 445360, "epoch": 5365} {"train_loss": -27.109806060791016, "global_step": 445361, "epoch": 5365} {"train_loss": -26.510074615478516, "global_step": 445362, "epoch": 5365} {"train_loss": -26.78775978088379, "global_step": 445363, "epoch": 5365} {"train_loss": -25.901416778564453, "global_step": 445364, "epoch": 5365} {"train_loss": -24.72608184814453, "global_step": 445365, "epoch": 5365} {"train_loss": -23.117216110229492, "global_step": 445366, "epoch": 5365} {"train_loss": -25.721220016479492, "global_step": 445367, "epoch": 5365} {"train_loss": -25.084218978881836, "global_step": 445368, "epoch": 5365} {"train_loss": -26.35727310180664, "global_step": 445369, "epoch": 5365} {"train_loss": -25.526166915893555, "global_step": 445370, "epoch": 5365} {"train_loss": -25.901288986206055, "global_step": 445371, "epoch": 5365} {"train_loss": -25.695261001586914, "global_step": 445372, "epoch": 5365} {"train_loss": -26.258319854736328, "global_step": 445373, "epoch": 5365} {"train_loss": -25.970930099487305, "global_step": 445374, "epoch": 5365} {"train_loss": -25.974960327148438, "global_step": 445375, "epoch": 5365} {"train_loss": -26.26987075805664, "global_step": 445376, "epoch": 5365} {"train_loss": -26.61624515487487, "global_step": 445377, "epoch": 5365, "val_loss": 6730102.0} {"train_loss": -25.75514030456543, "global_step": 445378, "epoch": 5366} {"train_loss": -25.799163818359375, "global_step": 445379, "epoch": 5366} {"train_loss": -26.182117462158203, "global_step": 445380, "epoch": 5366} {"train_loss": -26.09144401550293, "global_step": 445381, "epoch": 5366} {"train_loss": -26.089834213256836, "global_step": 445382, "epoch": 5366} {"train_loss": -25.87043571472168, "global_step": 445383, "epoch": 5366} {"train_loss": -26.360050201416016, "global_step": 445384, "epoch": 5366} {"train_loss": -26.22315788269043, "global_step": 445385, "epoch": 5366} {"train_loss": -26.1433162689209, "global_step": 445386, "epoch": 5366} {"train_loss": -26.25726318359375, "global_step": 445387, "epoch": 5366} {"train_loss": -26.72028160095215, "global_step": 445388, "epoch": 5366} {"train_loss": -26.691198348999023, "global_step": 445389, "epoch": 5366} {"train_loss": -26.518726348876953, "global_step": 445390, "epoch": 5366} {"train_loss": -26.549591064453125, "global_step": 445391, "epoch": 5366} {"train_loss": -26.487707138061523, "global_step": 445392, "epoch": 5366} {"train_loss": -26.433197021484375, "global_step": 445393, "epoch": 5366} {"train_loss": -26.494216918945312, "global_step": 445394, "epoch": 5366} {"train_loss": -26.252471923828125, "global_step": 445395, "epoch": 5366} {"train_loss": -26.65720558166504, "global_step": 445396, "epoch": 5366} {"train_loss": -26.769775390625, "global_step": 445397, "epoch": 5366} {"train_loss": -26.372543334960938, "global_step": 445398, "epoch": 5366} {"train_loss": -26.377700805664062, "global_step": 445399, "epoch": 5366} {"train_loss": -26.88427734375, "global_step": 445400, "epoch": 5366} {"train_loss": -26.775604248046875, "global_step": 445401, "epoch": 5366} {"train_loss": -27.265233993530273, "global_step": 445402, "epoch": 5366} {"train_loss": -26.487293243408203, "global_step": 445403, "epoch": 5366} {"train_loss": -26.67474937438965, "global_step": 445404, "epoch": 5366} {"train_loss": -26.975482940673828, "global_step": 445405, "epoch": 5366} {"train_loss": -26.94947624206543, "global_step": 445406, "epoch": 5366} {"train_loss": -26.6954345703125, "global_step": 445407, "epoch": 5366} {"train_loss": -26.60919189453125, "global_step": 445408, "epoch": 5366} {"train_loss": -27.018970489501953, "global_step": 445409, "epoch": 5366} {"train_loss": -27.201581954956055, "global_step": 445410, "epoch": 5366} {"train_loss": -27.13484001159668, "global_step": 445411, "epoch": 5366} {"train_loss": -27.19135093688965, "global_step": 445412, "epoch": 5366} {"train_loss": -27.209522247314453, "global_step": 445413, "epoch": 5366} {"train_loss": -26.993051528930664, "global_step": 445414, "epoch": 5366} {"train_loss": -27.20281410217285, "global_step": 445415, "epoch": 5366} {"train_loss": -27.005399703979492, "global_step": 445416, "epoch": 5366} {"train_loss": -26.925994873046875, "global_step": 445417, "epoch": 5366} {"train_loss": -26.991256713867188, "global_step": 445418, "epoch": 5366} {"train_loss": -27.036401748657227, "global_step": 445419, "epoch": 5366} {"train_loss": -27.125925064086914, "global_step": 445420, "epoch": 5366} {"train_loss": -26.954395294189453, "global_step": 445421, "epoch": 5366} {"train_loss": -26.988086700439453, "global_step": 445422, "epoch": 5366} {"train_loss": -26.98404884338379, "global_step": 445423, "epoch": 5366} {"train_loss": -26.971704483032227, "global_step": 445424, "epoch": 5366} {"train_loss": -27.00384521484375, "global_step": 445425, "epoch": 5366} {"train_loss": -26.798538208007812, "global_step": 445426, "epoch": 5366} {"train_loss": -27.35785484313965, "global_step": 445427, "epoch": 5366} {"train_loss": -27.06195640563965, "global_step": 445428, "epoch": 5366} {"train_loss": -26.773645401000977, "global_step": 445429, "epoch": 5366} {"train_loss": -26.882553100585938, "global_step": 445430, "epoch": 5366} {"train_loss": -27.225004196166992, "global_step": 445431, "epoch": 5366} {"train_loss": -26.85052490234375, "global_step": 445432, "epoch": 5366} {"train_loss": -26.92047691345215, "global_step": 445433, "epoch": 5366} {"train_loss": -26.392333984375, "global_step": 445434, "epoch": 5366} {"train_loss": -26.304046630859375, "global_step": 445435, "epoch": 5366} {"train_loss": -27.027698516845703, "global_step": 445436, "epoch": 5366} {"train_loss": -27.20831298828125, "global_step": 445437, "epoch": 5366} {"train_loss": -26.796432495117188, "global_step": 445438, "epoch": 5366} {"train_loss": -26.848546981811523, "global_step": 445439, "epoch": 5366} {"train_loss": -26.46769142150879, "global_step": 445440, "epoch": 5366} {"train_loss": -26.450458526611328, "global_step": 445441, "epoch": 5366} {"train_loss": -26.536346435546875, "global_step": 445442, "epoch": 5366} {"train_loss": -26.375829696655273, "global_step": 445443, "epoch": 5366} {"train_loss": -26.888568878173828, "global_step": 445444, "epoch": 5366} {"train_loss": -26.422122955322266, "global_step": 445445, "epoch": 5366} {"train_loss": -26.42567253112793, "global_step": 445446, "epoch": 5366} {"train_loss": -27.05483055114746, "global_step": 445447, "epoch": 5366} {"train_loss": -26.695453643798828, "global_step": 445448, "epoch": 5366} {"train_loss": -26.73233413696289, "global_step": 445449, "epoch": 5366} {"train_loss": -26.855497360229492, "global_step": 445450, "epoch": 5366} {"train_loss": -27.070804595947266, "global_step": 445451, "epoch": 5366} {"train_loss": -26.843719482421875, "global_step": 445452, "epoch": 5366} {"train_loss": -26.75519371032715, "global_step": 445453, "epoch": 5366} {"train_loss": -26.897418975830078, "global_step": 445454, "epoch": 5366} {"train_loss": -26.84626579284668, "global_step": 445455, "epoch": 5366} {"train_loss": -26.5754451751709, "global_step": 445456, "epoch": 5366} {"train_loss": -26.86333656311035, "global_step": 445457, "epoch": 5366} {"train_loss": -27.086706161499023, "global_step": 445458, "epoch": 5366} {"train_loss": -26.77420997619629, "global_step": 445459, "epoch": 5366} {"train_loss": -26.724340852484644, "global_step": 445460, "epoch": 5366, "val_loss": 6569482.5} {"train_loss": -26.350271224975586, "global_step": 445461, "epoch": 5367} {"train_loss": -26.57020378112793, "global_step": 445462, "epoch": 5367} {"train_loss": -26.070844650268555, "global_step": 445463, "epoch": 5367} {"train_loss": -25.43550682067871, "global_step": 445464, "epoch": 5367} {"train_loss": -26.177236557006836, "global_step": 445465, "epoch": 5367} {"train_loss": -25.211318969726562, "global_step": 445466, "epoch": 5367} {"train_loss": -25.506122589111328, "global_step": 445467, "epoch": 5367} {"train_loss": -25.795032501220703, "global_step": 445468, "epoch": 5367} {"train_loss": -26.26413345336914, "global_step": 445469, "epoch": 5367} {"train_loss": -25.840213775634766, "global_step": 445470, "epoch": 5367} {"train_loss": -25.674047470092773, "global_step": 445471, "epoch": 5367} {"train_loss": -26.32684326171875, "global_step": 445472, "epoch": 5367} {"train_loss": -25.985462188720703, "global_step": 445473, "epoch": 5367} {"train_loss": -26.497739791870117, "global_step": 445474, "epoch": 5367} {"train_loss": -26.103307723999023, "global_step": 445475, "epoch": 5367} {"train_loss": -26.240888595581055, "global_step": 445476, "epoch": 5367} {"train_loss": -26.511625289916992, "global_step": 445477, "epoch": 5367} {"train_loss": -26.440759658813477, "global_step": 445478, "epoch": 5367} {"train_loss": -26.86756706237793, "global_step": 445479, "epoch": 5367} {"train_loss": -26.1616268157959, "global_step": 445480, "epoch": 5367} {"train_loss": -26.850971221923828, "global_step": 445481, "epoch": 5367} {"train_loss": -26.651294708251953, "global_step": 445482, "epoch": 5367} {"train_loss": -26.563146591186523, "global_step": 445483, "epoch": 5367} {"train_loss": -26.92414665222168, "global_step": 445484, "epoch": 5367} {"train_loss": -26.318710327148438, "global_step": 445485, "epoch": 5367} {"train_loss": -26.71721839904785, "global_step": 445486, "epoch": 5367} {"train_loss": -26.711633682250977, "global_step": 445487, "epoch": 5367} {"train_loss": -26.589019775390625, "global_step": 445488, "epoch": 5367} {"train_loss": -26.800491333007812, "global_step": 445489, "epoch": 5367} {"train_loss": -26.937925338745117, "global_step": 445490, "epoch": 5367} {"train_loss": -26.918302536010742, "global_step": 445491, "epoch": 5367} {"train_loss": -26.719593048095703, "global_step": 445492, "epoch": 5367} {"train_loss": -27.039661407470703, "global_step": 445493, "epoch": 5367} {"train_loss": -26.688806533813477, "global_step": 445494, "epoch": 5367} {"train_loss": -27.30022621154785, "global_step": 445495, "epoch": 5367} {"train_loss": -27.340051651000977, "global_step": 445496, "epoch": 5367} {"train_loss": -27.029462814331055, "global_step": 445497, "epoch": 5367} {"train_loss": -26.825336456298828, "global_step": 445498, "epoch": 5367} {"train_loss": -26.752721786499023, "global_step": 445499, "epoch": 5367} {"train_loss": -26.67896842956543, "global_step": 445500, "epoch": 5367} {"train_loss": -27.005826950073242, "global_step": 445501, "epoch": 5367} {"train_loss": -26.95143699645996, "global_step": 445502, "epoch": 5367} {"train_loss": -27.163116455078125, "global_step": 445503, "epoch": 5367} {"train_loss": -27.315393447875977, "global_step": 445504, "epoch": 5367} {"train_loss": -27.027082443237305, "global_step": 445505, "epoch": 5367} {"train_loss": -26.982196807861328, "global_step": 445506, "epoch": 5367} {"train_loss": -27.0263671875, "global_step": 445507, "epoch": 5367} {"train_loss": -27.300765991210938, "global_step": 445508, "epoch": 5367} {"train_loss": -26.953359603881836, "global_step": 445509, "epoch": 5367} {"train_loss": -27.319110870361328, "global_step": 445510, "epoch": 5367} {"train_loss": -26.917890548706055, "global_step": 445511, "epoch": 5367} {"train_loss": -27.4310245513916, "global_step": 445512, "epoch": 5367} {"train_loss": -27.093515396118164, "global_step": 445513, "epoch": 5367} {"train_loss": -27.048364639282227, "global_step": 445514, "epoch": 5367} {"train_loss": -27.42091941833496, "global_step": 445515, "epoch": 5367} {"train_loss": -27.18794059753418, "global_step": 445516, "epoch": 5367} {"train_loss": -27.08913230895996, "global_step": 445517, "epoch": 5367} {"train_loss": -26.95527458190918, "global_step": 445518, "epoch": 5367} {"train_loss": -27.34002113342285, "global_step": 445519, "epoch": 5367} {"train_loss": -26.776212692260742, "global_step": 445520, "epoch": 5367} {"train_loss": -27.166372299194336, "global_step": 445521, "epoch": 5367} {"train_loss": -26.869932174682617, "global_step": 445522, "epoch": 5367} {"train_loss": -27.04094886779785, "global_step": 445523, "epoch": 5367} {"train_loss": -26.695173263549805, "global_step": 445524, "epoch": 5367} {"train_loss": -26.9464111328125, "global_step": 445525, "epoch": 5367} {"train_loss": -27.14292335510254, "global_step": 445526, "epoch": 5367} {"train_loss": -26.7565860748291, "global_step": 445527, "epoch": 5367} {"train_loss": -26.93695068359375, "global_step": 445528, "epoch": 5367} {"train_loss": -27.10719871520996, "global_step": 445529, "epoch": 5367} {"train_loss": -26.84185791015625, "global_step": 445530, "epoch": 5367} {"train_loss": -26.964340209960938, "global_step": 445531, "epoch": 5367} {"train_loss": -26.525211334228516, "global_step": 445532, "epoch": 5367} {"train_loss": -26.635650634765625, "global_step": 445533, "epoch": 5367} {"train_loss": -27.14045524597168, "global_step": 445534, "epoch": 5367} {"train_loss": -26.073392868041992, "global_step": 445535, "epoch": 5367} {"train_loss": -26.26619529724121, "global_step": 445536, "epoch": 5367} {"train_loss": -27.024709701538086, "global_step": 445537, "epoch": 5367} {"train_loss": -26.214038848876953, "global_step": 445538, "epoch": 5367} {"train_loss": -26.79168128967285, "global_step": 445539, "epoch": 5367} {"train_loss": -26.609228134155273, "global_step": 445540, "epoch": 5367} {"train_loss": -26.388654708862305, "global_step": 445541, "epoch": 5367} {"train_loss": -26.650867462158203, "global_step": 445542, "epoch": 5367} {"train_loss": -26.697159433939373, "global_step": 445543, "epoch": 5367, "val_loss": 6556843.0} {"train_loss": -26.522871017456055, "global_step": 445544, "epoch": 5368} {"train_loss": -26.53260612487793, "global_step": 445545, "epoch": 5368} {"train_loss": -26.58721923828125, "global_step": 445546, "epoch": 5368} {"train_loss": -25.933080673217773, "global_step": 445547, "epoch": 5368} {"train_loss": -26.189105987548828, "global_step": 445548, "epoch": 5368} {"train_loss": -26.486499786376953, "global_step": 445549, "epoch": 5368} {"train_loss": -26.39227867126465, "global_step": 445550, "epoch": 5368} {"train_loss": -26.487897872924805, "global_step": 445551, "epoch": 5368} {"train_loss": -26.901275634765625, "global_step": 445552, "epoch": 5368} {"train_loss": -26.28922462463379, "global_step": 445553, "epoch": 5368} {"train_loss": -26.815786361694336, "global_step": 445554, "epoch": 5368} {"train_loss": -26.363622665405273, "global_step": 445555, "epoch": 5368} {"train_loss": -26.761554718017578, "global_step": 445556, "epoch": 5368} {"train_loss": -26.84739112854004, "global_step": 445557, "epoch": 5368} {"train_loss": -26.738439559936523, "global_step": 445558, "epoch": 5368} {"train_loss": -26.919897079467773, "global_step": 445559, "epoch": 5368} {"train_loss": -26.546661376953125, "global_step": 445560, "epoch": 5368} {"train_loss": -26.931020736694336, "global_step": 445561, "epoch": 5368} {"train_loss": -27.216405868530273, "global_step": 445562, "epoch": 5368} {"train_loss": -26.80182456970215, "global_step": 445563, "epoch": 5368} {"train_loss": -26.59579849243164, "global_step": 445564, "epoch": 5368} {"train_loss": -26.82439613342285, "global_step": 445565, "epoch": 5368} {"train_loss": -26.667556762695312, "global_step": 445566, "epoch": 5368} {"train_loss": -26.75434684753418, "global_step": 445567, "epoch": 5368} {"train_loss": -26.680646896362305, "global_step": 445568, "epoch": 5368} {"train_loss": -26.84638023376465, "global_step": 445569, "epoch": 5368} {"train_loss": -27.132429122924805, "global_step": 445570, "epoch": 5368} {"train_loss": -27.032379150390625, "global_step": 445571, "epoch": 5368} {"train_loss": -27.15651512145996, "global_step": 445572, "epoch": 5368} {"train_loss": -27.07155418395996, "global_step": 445573, "epoch": 5368} {"train_loss": -27.10633659362793, "global_step": 445574, "epoch": 5368} {"train_loss": -26.98701286315918, "global_step": 445575, "epoch": 5368} {"train_loss": -27.037092208862305, "global_step": 445576, "epoch": 5368} {"train_loss": -27.133432388305664, "global_step": 445577, "epoch": 5368} {"train_loss": -27.19044303894043, "global_step": 445578, "epoch": 5368} {"train_loss": -27.126447677612305, "global_step": 445579, "epoch": 5368} {"train_loss": -27.185962677001953, "global_step": 445580, "epoch": 5368} {"train_loss": -27.2250919342041, "global_step": 445581, "epoch": 5368} {"train_loss": -26.952411651611328, "global_step": 445582, "epoch": 5368} {"train_loss": -26.863208770751953, "global_step": 445583, "epoch": 5368} {"train_loss": -26.781103134155273, "global_step": 445584, "epoch": 5368} {"train_loss": -27.360822677612305, "global_step": 445585, "epoch": 5368} {"train_loss": -26.944305419921875, "global_step": 445586, "epoch": 5368} {"train_loss": -27.2237606048584, "global_step": 445587, "epoch": 5368} {"train_loss": -27.00435447692871, "global_step": 445588, "epoch": 5368} {"train_loss": -27.1612606048584, "global_step": 445589, "epoch": 5368} {"train_loss": -27.307754516601562, "global_step": 445590, "epoch": 5368} {"train_loss": -27.02064323425293, "global_step": 445591, "epoch": 5368} {"train_loss": -27.22108268737793, "global_step": 445592, "epoch": 5368} {"train_loss": -27.001569747924805, "global_step": 445593, "epoch": 5368} {"train_loss": -26.98748779296875, "global_step": 445594, "epoch": 5368} {"train_loss": -27.183563232421875, "global_step": 445595, "epoch": 5368} {"train_loss": -27.150793075561523, "global_step": 445596, "epoch": 5368} {"train_loss": -27.27566909790039, "global_step": 445597, "epoch": 5368} {"train_loss": -27.06123161315918, "global_step": 445598, "epoch": 5368} {"train_loss": -27.282373428344727, "global_step": 445599, "epoch": 5368} {"train_loss": -26.74725914001465, "global_step": 445600, "epoch": 5368} {"train_loss": -27.12109375, "global_step": 445601, "epoch": 5368} {"train_loss": -27.23663902282715, "global_step": 445602, "epoch": 5368} {"train_loss": -27.066242218017578, "global_step": 445603, "epoch": 5368} {"train_loss": -26.979877471923828, "global_step": 445604, "epoch": 5368} {"train_loss": -27.35834312438965, "global_step": 445605, "epoch": 5368} {"train_loss": -26.900537490844727, "global_step": 445606, "epoch": 5368} {"train_loss": -27.2876033782959, "global_step": 445607, "epoch": 5368} {"train_loss": -27.226892471313477, "global_step": 445608, "epoch": 5368} {"train_loss": -27.015399932861328, "global_step": 445609, "epoch": 5368} {"train_loss": -27.2889347076416, "global_step": 445610, "epoch": 5368} {"train_loss": -26.82546043395996, "global_step": 445611, "epoch": 5368} {"train_loss": -26.795629501342773, "global_step": 445612, "epoch": 5368} {"train_loss": -27.243738174438477, "global_step": 445613, "epoch": 5368} {"train_loss": -26.83070945739746, "global_step": 445614, "epoch": 5368} {"train_loss": -26.476764678955078, "global_step": 445615, "epoch": 5368} {"train_loss": -25.580093383789062, "global_step": 445616, "epoch": 5368} {"train_loss": -26.505292892456055, "global_step": 445617, "epoch": 5368} {"train_loss": -27.128097534179688, "global_step": 445618, "epoch": 5368} {"train_loss": -26.104450225830078, "global_step": 445619, "epoch": 5368} {"train_loss": -26.705007553100586, "global_step": 445620, "epoch": 5368} {"train_loss": -26.956674575805664, "global_step": 445621, "epoch": 5368} {"train_loss": -26.24883460998535, "global_step": 445622, "epoch": 5368} {"train_loss": -27.013158798217773, "global_step": 445623, "epoch": 5368} {"train_loss": -26.741565704345703, "global_step": 445624, "epoch": 5368} {"train_loss": -26.60272216796875, "global_step": 445625, "epoch": 5368} {"train_loss": -26.86725747441671, "global_step": 445626, "epoch": 5368, "val_loss": 6575535.0} {"train_loss": -26.139074325561523, "global_step": 445627, "epoch": 5369} {"train_loss": -26.568445205688477, "global_step": 445628, "epoch": 5369} {"train_loss": -26.46257972717285, "global_step": 445629, "epoch": 5369} {"train_loss": -25.809040069580078, "global_step": 445630, "epoch": 5369} {"train_loss": -26.466461181640625, "global_step": 445631, "epoch": 5369} {"train_loss": -26.36042594909668, "global_step": 445632, "epoch": 5369} {"train_loss": -26.095884323120117, "global_step": 445633, "epoch": 5369} {"train_loss": -26.705352783203125, "global_step": 445634, "epoch": 5369} {"train_loss": -26.229846954345703, "global_step": 445635, "epoch": 5369} {"train_loss": -26.667871475219727, "global_step": 445636, "epoch": 5369} {"train_loss": -26.38929557800293, "global_step": 445637, "epoch": 5369} {"train_loss": -26.71528434753418, "global_step": 445638, "epoch": 5369} {"train_loss": -26.3601131439209, "global_step": 445639, "epoch": 5369} {"train_loss": -26.70694351196289, "global_step": 445640, "epoch": 5369} {"train_loss": -26.851245880126953, "global_step": 445641, "epoch": 5369} {"train_loss": -26.6965389251709, "global_step": 445642, "epoch": 5369} {"train_loss": -26.9739933013916, "global_step": 445643, "epoch": 5369} {"train_loss": -26.600248336791992, "global_step": 445644, "epoch": 5369} {"train_loss": -26.907318115234375, "global_step": 445645, "epoch": 5369} {"train_loss": -26.717817306518555, "global_step": 445646, "epoch": 5369} {"train_loss": -26.956308364868164, "global_step": 445647, "epoch": 5369} {"train_loss": -26.839635848999023, "global_step": 445648, "epoch": 5369} {"train_loss": -26.690353393554688, "global_step": 445649, "epoch": 5369} {"train_loss": -26.863264083862305, "global_step": 445650, "epoch": 5369} {"train_loss": -27.193897247314453, "global_step": 445651, "epoch": 5369} {"train_loss": -26.80571937561035, "global_step": 445652, "epoch": 5369} {"train_loss": -26.967945098876953, "global_step": 445653, "epoch": 5369} {"train_loss": -27.41755485534668, "global_step": 445654, "epoch": 5369} {"train_loss": -26.920446395874023, "global_step": 445655, "epoch": 5369} {"train_loss": -26.880966186523438, "global_step": 445656, "epoch": 5369} {"train_loss": -26.987852096557617, "global_step": 445657, "epoch": 5369} {"train_loss": -26.98638916015625, "global_step": 445658, "epoch": 5369} {"train_loss": -27.25618553161621, "global_step": 445659, "epoch": 5369} {"train_loss": -26.775070190429688, "global_step": 445660, "epoch": 5369} {"train_loss": -26.997039794921875, "global_step": 445661, "epoch": 5369} {"train_loss": -27.207082748413086, "global_step": 445662, "epoch": 5369} {"train_loss": -26.683996200561523, "global_step": 445663, "epoch": 5369} {"train_loss": -27.055139541625977, "global_step": 445664, "epoch": 5369} {"train_loss": -26.656070709228516, "global_step": 445665, "epoch": 5369} {"train_loss": -27.0836181640625, "global_step": 445666, "epoch": 5369} {"train_loss": -26.916799545288086, "global_step": 445667, "epoch": 5369} {"train_loss": -27.282495498657227, "global_step": 445668, "epoch": 5369} {"train_loss": -27.075641632080078, "global_step": 445669, "epoch": 5369} {"train_loss": -27.062788009643555, "global_step": 445670, "epoch": 5369} {"train_loss": -26.96109390258789, "global_step": 445671, "epoch": 5369} {"train_loss": -27.001220703125, "global_step": 445672, "epoch": 5369} {"train_loss": -27.197723388671875, "global_step": 445673, "epoch": 5369} {"train_loss": -27.07991600036621, "global_step": 445674, "epoch": 5369} {"train_loss": -27.03363037109375, "global_step": 445675, "epoch": 5369} {"train_loss": -27.343469619750977, "global_step": 445676, "epoch": 5369} {"train_loss": -27.146005630493164, "global_step": 445677, "epoch": 5369} {"train_loss": -27.18368911743164, "global_step": 445678, "epoch": 5369} {"train_loss": -27.188892364501953, "global_step": 445679, "epoch": 5369} {"train_loss": -27.344038009643555, "global_step": 445680, "epoch": 5369} {"train_loss": -27.434219360351562, "global_step": 445681, "epoch": 5369} {"train_loss": -27.398046493530273, "global_step": 445682, "epoch": 5369} {"train_loss": -27.138629913330078, "global_step": 445683, "epoch": 5369} {"train_loss": -27.0073184967041, "global_step": 445684, "epoch": 5369} {"train_loss": -26.65744972229004, "global_step": 445685, "epoch": 5369} {"train_loss": -27.42579460144043, "global_step": 445686, "epoch": 5369} {"train_loss": -27.175588607788086, "global_step": 445687, "epoch": 5369} {"train_loss": -27.04043960571289, "global_step": 445688, "epoch": 5369} {"train_loss": -27.025671005249023, "global_step": 445689, "epoch": 5369} {"train_loss": -27.24065589904785, "global_step": 445690, "epoch": 5369} {"train_loss": -27.112491607666016, "global_step": 445691, "epoch": 5369} {"train_loss": -26.85626220703125, "global_step": 445692, "epoch": 5369} {"train_loss": -27.115570068359375, "global_step": 445693, "epoch": 5369} {"train_loss": -27.208053588867188, "global_step": 445694, "epoch": 5369} {"train_loss": -26.79842185974121, "global_step": 445695, "epoch": 5369} {"train_loss": -26.52967643737793, "global_step": 445696, "epoch": 5369} {"train_loss": -26.679950714111328, "global_step": 445697, "epoch": 5369} {"train_loss": -26.642276763916016, "global_step": 445698, "epoch": 5369} {"train_loss": -27.129962921142578, "global_step": 445699, "epoch": 5369} {"train_loss": -26.818490982055664, "global_step": 445700, "epoch": 5369} {"train_loss": -26.995594024658203, "global_step": 445701, "epoch": 5369} {"train_loss": -26.856576919555664, "global_step": 445702, "epoch": 5369} {"train_loss": -26.523828506469727, "global_step": 445703, "epoch": 5369} {"train_loss": -26.770618438720703, "global_step": 445704, "epoch": 5369} {"train_loss": -27.364749908447266, "global_step": 445705, "epoch": 5369} {"train_loss": -27.01895523071289, "global_step": 445706, "epoch": 5369} {"train_loss": -26.58112907409668, "global_step": 445707, "epoch": 5369} {"train_loss": -26.695409774780273, "global_step": 445708, "epoch": 5369} {"train_loss": -26.895253491688923, "global_step": 445709, "epoch": 5369, "val_loss": 6497172.0} {"train_loss": -26.020971298217773, "global_step": 445710, "epoch": 5370} {"train_loss": -26.0157470703125, "global_step": 445711, "epoch": 5370} {"train_loss": -26.5184268951416, "global_step": 445712, "epoch": 5370} {"train_loss": -25.9639892578125, "global_step": 445713, "epoch": 5370} {"train_loss": -26.1109676361084, "global_step": 445714, "epoch": 5370} {"train_loss": -26.61663246154785, "global_step": 445715, "epoch": 5370} {"train_loss": -26.4261531829834, "global_step": 445716, "epoch": 5370} {"train_loss": -26.73550796508789, "global_step": 445717, "epoch": 5370} {"train_loss": -26.572721481323242, "global_step": 445718, "epoch": 5370} {"train_loss": -26.35141372680664, "global_step": 445719, "epoch": 5370} {"train_loss": -27.005807876586914, "global_step": 445720, "epoch": 5370} {"train_loss": -26.559833526611328, "global_step": 445721, "epoch": 5370} {"train_loss": -26.722570419311523, "global_step": 445722, "epoch": 5370} {"train_loss": -26.748620986938477, "global_step": 445723, "epoch": 5370} {"train_loss": -26.776952743530273, "global_step": 445724, "epoch": 5370} {"train_loss": -26.896570205688477, "global_step": 445725, "epoch": 5370} {"train_loss": -27.01007080078125, "global_step": 445726, "epoch": 5370} {"train_loss": -26.923166275024414, "global_step": 445727, "epoch": 5370} {"train_loss": -26.5848388671875, "global_step": 445728, "epoch": 5370} {"train_loss": -26.759469985961914, "global_step": 445729, "epoch": 5370} {"train_loss": -26.69687271118164, "global_step": 445730, "epoch": 5370} {"train_loss": -27.002782821655273, "global_step": 445731, "epoch": 5370} {"train_loss": -26.690519332885742, "global_step": 445732, "epoch": 5370} {"train_loss": -26.674530029296875, "global_step": 445733, "epoch": 5370} {"train_loss": -26.522205352783203, "global_step": 445734, "epoch": 5370} {"train_loss": -26.811664581298828, "global_step": 445735, "epoch": 5370} {"train_loss": -26.9294376373291, "global_step": 445736, "epoch": 5370} {"train_loss": -26.617462158203125, "global_step": 445737, "epoch": 5370} {"train_loss": -26.62941551208496, "global_step": 445738, "epoch": 5370} {"train_loss": -26.991840362548828, "global_step": 445739, "epoch": 5370} {"train_loss": -26.926671981811523, "global_step": 445740, "epoch": 5370} {"train_loss": -26.76215171813965, "global_step": 445741, "epoch": 5370} {"train_loss": -26.670690536499023, "global_step": 445742, "epoch": 5370} {"train_loss": -26.989404678344727, "global_step": 445743, "epoch": 5370} {"train_loss": -26.867938995361328, "global_step": 445744, "epoch": 5370} {"train_loss": -26.91876792907715, "global_step": 445745, "epoch": 5370} {"train_loss": -27.008432388305664, "global_step": 445746, "epoch": 5370} {"train_loss": -26.775659561157227, "global_step": 445747, "epoch": 5370} {"train_loss": -26.873615264892578, "global_step": 445748, "epoch": 5370} {"train_loss": -27.054792404174805, "global_step": 445749, "epoch": 5370} {"train_loss": -27.271728515625, "global_step": 445750, "epoch": 5370} {"train_loss": -26.982086181640625, "global_step": 445751, "epoch": 5370} {"train_loss": -27.047277450561523, "global_step": 445752, "epoch": 5370} {"train_loss": -27.12692642211914, "global_step": 445753, "epoch": 5370} {"train_loss": -27.059423446655273, "global_step": 445754, "epoch": 5370} {"train_loss": -27.173675537109375, "global_step": 445755, "epoch": 5370} {"train_loss": -27.120105743408203, "global_step": 445756, "epoch": 5370} {"train_loss": -27.198965072631836, "global_step": 445757, "epoch": 5370} {"train_loss": -27.09393310546875, "global_step": 445758, "epoch": 5370} {"train_loss": -27.029132843017578, "global_step": 445759, "epoch": 5370} {"train_loss": -27.046064376831055, "global_step": 445760, "epoch": 5370} {"train_loss": -26.92013931274414, "global_step": 445761, "epoch": 5370} {"train_loss": -27.398773193359375, "global_step": 445762, "epoch": 5370} {"train_loss": -27.313581466674805, "global_step": 445763, "epoch": 5370} {"train_loss": -27.06548500061035, "global_step": 445764, "epoch": 5370} {"train_loss": -26.9942569732666, "global_step": 445765, "epoch": 5370} {"train_loss": -26.906646728515625, "global_step": 445766, "epoch": 5370} {"train_loss": -27.24448585510254, "global_step": 445767, "epoch": 5370} {"train_loss": -27.015338897705078, "global_step": 445768, "epoch": 5370} {"train_loss": -27.770273208618164, "global_step": 445769, "epoch": 5370} {"train_loss": -27.25681495666504, "global_step": 445770, "epoch": 5370} {"train_loss": -27.37495994567871, "global_step": 445771, "epoch": 5370} {"train_loss": -27.32215690612793, "global_step": 445772, "epoch": 5370} {"train_loss": -27.145959854125977, "global_step": 445773, "epoch": 5370} {"train_loss": -27.621368408203125, "global_step": 445774, "epoch": 5370} {"train_loss": -26.852319717407227, "global_step": 445775, "epoch": 5370} {"train_loss": -27.0589599609375, "global_step": 445776, "epoch": 5370} {"train_loss": -26.79957389831543, "global_step": 445777, "epoch": 5370} {"train_loss": -27.12110710144043, "global_step": 445778, "epoch": 5370} {"train_loss": -27.086851119995117, "global_step": 445779, "epoch": 5370} {"train_loss": -27.1512451171875, "global_step": 445780, "epoch": 5370} {"train_loss": -27.2674560546875, "global_step": 445781, "epoch": 5370} {"train_loss": -26.978229522705078, "global_step": 445782, "epoch": 5370} {"train_loss": -26.706409454345703, "global_step": 445783, "epoch": 5370} {"train_loss": -26.669055938720703, "global_step": 445784, "epoch": 5370} {"train_loss": -27.179458618164062, "global_step": 445785, "epoch": 5370} {"train_loss": -26.63222312927246, "global_step": 445786, "epoch": 5370} {"train_loss": -26.73823356628418, "global_step": 445787, "epoch": 5370} {"train_loss": -26.784231185913086, "global_step": 445788, "epoch": 5370} {"train_loss": -26.600061416625977, "global_step": 445789, "epoch": 5370} {"train_loss": -26.680700302124023, "global_step": 445790, "epoch": 5370} {"train_loss": -26.70209312438965, "global_step": 445791, "epoch": 5370} {"train_loss": -26.878119319318287, "global_step": 445792, "epoch": 5370, "val_loss": 6580336.0} {"train_loss": -24.76662254333496, "global_step": 445793, "epoch": 5371} {"train_loss": -23.66499900817871, "global_step": 445794, "epoch": 5371} {"train_loss": -25.485811233520508, "global_step": 445795, "epoch": 5371} {"train_loss": -25.64420509338379, "global_step": 445796, "epoch": 5371} {"train_loss": -25.636703491210938, "global_step": 445797, "epoch": 5371} {"train_loss": -25.75390625, "global_step": 445798, "epoch": 5371} {"train_loss": -26.376394271850586, "global_step": 445799, "epoch": 5371} {"train_loss": -25.98993492126465, "global_step": 445800, "epoch": 5371} {"train_loss": -26.004444122314453, "global_step": 445801, "epoch": 5371} {"train_loss": -26.5072021484375, "global_step": 445802, "epoch": 5371} {"train_loss": -26.08229637145996, "global_step": 445803, "epoch": 5371} {"train_loss": -26.28596305847168, "global_step": 445804, "epoch": 5371} {"train_loss": -26.331558227539062, "global_step": 445805, "epoch": 5371} {"train_loss": -26.530447006225586, "global_step": 445806, "epoch": 5371} {"train_loss": -26.476011276245117, "global_step": 445807, "epoch": 5371} {"train_loss": -26.644702911376953, "global_step": 445808, "epoch": 5371} {"train_loss": -26.20652198791504, "global_step": 445809, "epoch": 5371} {"train_loss": -26.73673439025879, "global_step": 445810, "epoch": 5371} {"train_loss": -26.615522384643555, "global_step": 445811, "epoch": 5371} {"train_loss": -26.331052780151367, "global_step": 445812, "epoch": 5371} {"train_loss": -26.417394638061523, "global_step": 445813, "epoch": 5371} {"train_loss": -26.667028427124023, "global_step": 445814, "epoch": 5371} {"train_loss": -26.674545288085938, "global_step": 445815, "epoch": 5371} {"train_loss": -26.60200309753418, "global_step": 445816, "epoch": 5371} {"train_loss": -26.395994186401367, "global_step": 445817, "epoch": 5371} {"train_loss": -26.7729434967041, "global_step": 445818, "epoch": 5371} {"train_loss": -26.41778564453125, "global_step": 445819, "epoch": 5371} {"train_loss": -26.636144638061523, "global_step": 445820, "epoch": 5371} {"train_loss": -27.097702026367188, "global_step": 445821, "epoch": 5371} {"train_loss": -27.14703941345215, "global_step": 445822, "epoch": 5371} {"train_loss": -26.909992218017578, "global_step": 445823, "epoch": 5371} {"train_loss": -27.005889892578125, "global_step": 445824, "epoch": 5371} {"train_loss": -27.23876953125, "global_step": 445825, "epoch": 5371} {"train_loss": -26.745588302612305, "global_step": 445826, "epoch": 5371} {"train_loss": -26.844953536987305, "global_step": 445827, "epoch": 5371} {"train_loss": -27.10333824157715, "global_step": 445828, "epoch": 5371} {"train_loss": -27.28401756286621, "global_step": 445829, "epoch": 5371} {"train_loss": -27.06633949279785, "global_step": 445830, "epoch": 5371} {"train_loss": -27.26787757873535, "global_step": 445831, "epoch": 5371} {"train_loss": -27.196317672729492, "global_step": 445832, "epoch": 5371} {"train_loss": -27.595304489135742, "global_step": 445833, "epoch": 5371} {"train_loss": -27.250288009643555, "global_step": 445834, "epoch": 5371} {"train_loss": -27.2152156829834, "global_step": 445835, "epoch": 5371} {"train_loss": -26.87969398498535, "global_step": 445836, "epoch": 5371} {"train_loss": -27.126739501953125, "global_step": 445837, "epoch": 5371} {"train_loss": -26.9011173248291, "global_step": 445838, "epoch": 5371} {"train_loss": -27.15011978149414, "global_step": 445839, "epoch": 5371} {"train_loss": -27.161563873291016, "global_step": 445840, "epoch": 5371} {"train_loss": -27.214834213256836, "global_step": 445841, "epoch": 5371} {"train_loss": -27.12202262878418, "global_step": 445842, "epoch": 5371} {"train_loss": -27.201162338256836, "global_step": 445843, "epoch": 5371} {"train_loss": -27.266040802001953, "global_step": 445844, "epoch": 5371} {"train_loss": -27.236129760742188, "global_step": 445845, "epoch": 5371} {"train_loss": -27.199247360229492, "global_step": 445846, "epoch": 5371} {"train_loss": -26.9488582611084, "global_step": 445847, "epoch": 5371} {"train_loss": -27.173583984375, "global_step": 445848, "epoch": 5371} {"train_loss": -27.209125518798828, "global_step": 445849, "epoch": 5371} {"train_loss": -27.265226364135742, "global_step": 445850, "epoch": 5371} {"train_loss": -26.75667381286621, "global_step": 445851, "epoch": 5371} {"train_loss": -27.406354904174805, "global_step": 445852, "epoch": 5371} {"train_loss": -27.168508529663086, "global_step": 445853, "epoch": 5371} {"train_loss": -27.15867042541504, "global_step": 445854, "epoch": 5371} {"train_loss": -27.071338653564453, "global_step": 445855, "epoch": 5371} {"train_loss": -27.54505729675293, "global_step": 445856, "epoch": 5371} {"train_loss": -26.948368072509766, "global_step": 445857, "epoch": 5371} {"train_loss": -27.443723678588867, "global_step": 445858, "epoch": 5371} {"train_loss": -27.041940689086914, "global_step": 445859, "epoch": 5371} {"train_loss": -27.38702964782715, "global_step": 445860, "epoch": 5371} {"train_loss": -27.303455352783203, "global_step": 445861, "epoch": 5371} {"train_loss": -27.176544189453125, "global_step": 445862, "epoch": 5371} {"train_loss": -27.314777374267578, "global_step": 445863, "epoch": 5371} {"train_loss": -26.780445098876953, "global_step": 445864, "epoch": 5371} {"train_loss": -27.062763214111328, "global_step": 445865, "epoch": 5371} {"train_loss": -26.97786521911621, "global_step": 445866, "epoch": 5371} {"train_loss": -27.021148681640625, "global_step": 445867, "epoch": 5371} {"train_loss": -26.69329833984375, "global_step": 445868, "epoch": 5371} {"train_loss": -26.615583419799805, "global_step": 445869, "epoch": 5371} {"train_loss": -26.54034423828125, "global_step": 445870, "epoch": 5371} {"train_loss": -26.571863174438477, "global_step": 445871, "epoch": 5371} {"train_loss": -26.86287498474121, "global_step": 445872, "epoch": 5371} {"train_loss": -27.0755558013916, "global_step": 445873, "epoch": 5371} {"train_loss": -26.388437271118164, "global_step": 445874, "epoch": 5371} {"train_loss": -26.751670423760473, "global_step": 445875, "epoch": 5371, "val_loss": 6602553.0} {"train_loss": -26.52668571472168, "global_step": 445876, "epoch": 5372} {"train_loss": -26.180810928344727, "global_step": 445877, "epoch": 5372} {"train_loss": -26.36556053161621, "global_step": 445878, "epoch": 5372} {"train_loss": -26.0052490234375, "global_step": 445879, "epoch": 5372} {"train_loss": -26.870283126831055, "global_step": 445880, "epoch": 5372} {"train_loss": -26.051977157592773, "global_step": 445881, "epoch": 5372} {"train_loss": -26.51373863220215, "global_step": 445882, "epoch": 5372} {"train_loss": -26.234317779541016, "global_step": 445883, "epoch": 5372} {"train_loss": -26.845748901367188, "global_step": 445884, "epoch": 5372} {"train_loss": -26.31416893005371, "global_step": 445885, "epoch": 5372} {"train_loss": -26.787952423095703, "global_step": 445886, "epoch": 5372} {"train_loss": -26.320209503173828, "global_step": 445887, "epoch": 5372} {"train_loss": -26.404285430908203, "global_step": 445888, "epoch": 5372} {"train_loss": -26.63154411315918, "global_step": 445889, "epoch": 5372} {"train_loss": -26.844633102416992, "global_step": 445890, "epoch": 5372} {"train_loss": -26.61252784729004, "global_step": 445891, "epoch": 5372} {"train_loss": -26.766149520874023, "global_step": 445892, "epoch": 5372} {"train_loss": -26.601133346557617, "global_step": 445893, "epoch": 5372} {"train_loss": -26.263916015625, "global_step": 445894, "epoch": 5372} {"train_loss": -26.68768310546875, "global_step": 445895, "epoch": 5372} {"train_loss": -26.75518798828125, "global_step": 445896, "epoch": 5372} {"train_loss": -26.6474666595459, "global_step": 445897, "epoch": 5372} {"train_loss": -26.973562240600586, "global_step": 445898, "epoch": 5372} {"train_loss": -26.60430335998535, "global_step": 445899, "epoch": 5372} {"train_loss": -27.313833236694336, "global_step": 445900, "epoch": 5372} {"train_loss": -27.0626220703125, "global_step": 445901, "epoch": 5372} {"train_loss": -26.7825984954834, "global_step": 445902, "epoch": 5372} {"train_loss": -26.8831729888916, "global_step": 445903, "epoch": 5372} {"train_loss": -26.847339630126953, "global_step": 445904, "epoch": 5372} {"train_loss": -26.832324981689453, "global_step": 445905, "epoch": 5372} {"train_loss": -27.345396041870117, "global_step": 445906, "epoch": 5372} {"train_loss": -26.964094161987305, "global_step": 445907, "epoch": 5372} {"train_loss": -27.129499435424805, "global_step": 445908, "epoch": 5372} {"train_loss": -27.142974853515625, "global_step": 445909, "epoch": 5372} {"train_loss": -27.006879806518555, "global_step": 445910, "epoch": 5372} {"train_loss": -27.345935821533203, "global_step": 445911, "epoch": 5372} {"train_loss": -27.14143180847168, "global_step": 445912, "epoch": 5372} {"train_loss": -27.228246688842773, "global_step": 445913, "epoch": 5372} {"train_loss": -27.0594482421875, "global_step": 445914, "epoch": 5372} {"train_loss": -27.06829261779785, "global_step": 445915, "epoch": 5372} {"train_loss": -27.539337158203125, "global_step": 445916, "epoch": 5372} {"train_loss": -27.28472328186035, "global_step": 445917, "epoch": 5372} {"train_loss": -26.974393844604492, "global_step": 445918, "epoch": 5372} {"train_loss": -27.176870346069336, "global_step": 445919, "epoch": 5372} {"train_loss": -27.490894317626953, "global_step": 445920, "epoch": 5372} {"train_loss": -27.174795150756836, "global_step": 445921, "epoch": 5372} {"train_loss": -27.143783569335938, "global_step": 445922, "epoch": 5372} {"train_loss": -27.20497703552246, "global_step": 445923, "epoch": 5372} {"train_loss": -27.09052848815918, "global_step": 445924, "epoch": 5372} {"train_loss": -27.152753829956055, "global_step": 445925, "epoch": 5372} {"train_loss": -27.749500274658203, "global_step": 445926, "epoch": 5372} {"train_loss": -27.092945098876953, "global_step": 445927, "epoch": 5372} {"train_loss": -27.39344596862793, "global_step": 445928, "epoch": 5372} {"train_loss": -26.9925537109375, "global_step": 445929, "epoch": 5372} {"train_loss": -26.880859375, "global_step": 445930, "epoch": 5372} {"train_loss": -27.50970458984375, "global_step": 445931, "epoch": 5372} {"train_loss": -27.335031509399414, "global_step": 445932, "epoch": 5372} {"train_loss": -27.3558292388916, "global_step": 445933, "epoch": 5372} {"train_loss": -27.0643253326416, "global_step": 445934, "epoch": 5372} {"train_loss": -26.99542236328125, "global_step": 445935, "epoch": 5372} {"train_loss": -26.682363510131836, "global_step": 445936, "epoch": 5372} {"train_loss": -27.076786041259766, "global_step": 445937, "epoch": 5372} {"train_loss": -27.292139053344727, "global_step": 445938, "epoch": 5372} {"train_loss": -27.129364013671875, "global_step": 445939, "epoch": 5372} {"train_loss": -26.72114372253418, "global_step": 445940, "epoch": 5372} {"train_loss": -26.805145263671875, "global_step": 445941, "epoch": 5372} {"train_loss": -27.244190216064453, "global_step": 445942, "epoch": 5372} {"train_loss": -27.129276275634766, "global_step": 445943, "epoch": 5372} {"train_loss": -27.0170841217041, "global_step": 445944, "epoch": 5372} {"train_loss": -27.25367546081543, "global_step": 445945, "epoch": 5372} {"train_loss": -26.86970329284668, "global_step": 445946, "epoch": 5372} {"train_loss": -27.092533111572266, "global_step": 445947, "epoch": 5372} {"train_loss": -27.15998649597168, "global_step": 445948, "epoch": 5372} {"train_loss": -27.344160079956055, "global_step": 445949, "epoch": 5372} {"train_loss": -26.875244140625, "global_step": 445950, "epoch": 5372} {"train_loss": -26.93525505065918, "global_step": 445951, "epoch": 5372} {"train_loss": -26.895355224609375, "global_step": 445952, "epoch": 5372} {"train_loss": -27.016845703125, "global_step": 445953, "epoch": 5372} {"train_loss": -27.214706420898438, "global_step": 445954, "epoch": 5372} {"train_loss": -27.183008193969727, "global_step": 445955, "epoch": 5372} {"train_loss": -26.781097412109375, "global_step": 445956, "epoch": 5372} {"train_loss": -26.506881713867188, "global_step": 445957, "epoch": 5372} {"train_loss": -26.954153106873292, "global_step": 445958, "epoch": 5372, "val_loss": 6546397.0} {"train_loss": -25.843042373657227, "global_step": 445959, "epoch": 5373} {"train_loss": -26.4782657623291, "global_step": 445960, "epoch": 5373} {"train_loss": -26.145536422729492, "global_step": 445961, "epoch": 5373} {"train_loss": -26.3862247467041, "global_step": 445962, "epoch": 5373} {"train_loss": -25.761138916015625, "global_step": 445963, "epoch": 5373} {"train_loss": -26.774829864501953, "global_step": 445964, "epoch": 5373} {"train_loss": -26.555418014526367, "global_step": 445965, "epoch": 5373} {"train_loss": -26.378995895385742, "global_step": 445966, "epoch": 5373} {"train_loss": -26.899137496948242, "global_step": 445967, "epoch": 5373} {"train_loss": -26.25278091430664, "global_step": 445968, "epoch": 5373} {"train_loss": -26.967334747314453, "global_step": 445969, "epoch": 5373} {"train_loss": -26.566654205322266, "global_step": 445970, "epoch": 5373} {"train_loss": -26.94642448425293, "global_step": 445971, "epoch": 5373} {"train_loss": -26.394311904907227, "global_step": 445972, "epoch": 5373} {"train_loss": -26.437103271484375, "global_step": 445973, "epoch": 5373} {"train_loss": -26.7747745513916, "global_step": 445974, "epoch": 5373} {"train_loss": -27.034879684448242, "global_step": 445975, "epoch": 5373} {"train_loss": -26.880216598510742, "global_step": 445976, "epoch": 5373} {"train_loss": -26.815942764282227, "global_step": 445977, "epoch": 5373} {"train_loss": -26.586477279663086, "global_step": 445978, "epoch": 5373} {"train_loss": -26.96274185180664, "global_step": 445979, "epoch": 5373} {"train_loss": -26.515155792236328, "global_step": 445980, "epoch": 5373} {"train_loss": -26.95989418029785, "global_step": 445981, "epoch": 5373} {"train_loss": -26.98866844177246, "global_step": 445982, "epoch": 5373} {"train_loss": -26.92682456970215, "global_step": 445983, "epoch": 5373} {"train_loss": -27.024438858032227, "global_step": 445984, "epoch": 5373} {"train_loss": -26.876850128173828, "global_step": 445985, "epoch": 5373} {"train_loss": -26.8474178314209, "global_step": 445986, "epoch": 5373} {"train_loss": -26.808307647705078, "global_step": 445987, "epoch": 5373} {"train_loss": -26.883197784423828, "global_step": 445988, "epoch": 5373} {"train_loss": -27.080841064453125, "global_step": 445989, "epoch": 5373} {"train_loss": -26.941024780273438, "global_step": 445990, "epoch": 5373} {"train_loss": -27.292722702026367, "global_step": 445991, "epoch": 5373} {"train_loss": -27.337970733642578, "global_step": 445992, "epoch": 5373} {"train_loss": -27.008508682250977, "global_step": 445993, "epoch": 5373} {"train_loss": -26.869068145751953, "global_step": 445994, "epoch": 5373} {"train_loss": -27.045745849609375, "global_step": 445995, "epoch": 5373} {"train_loss": -27.156143188476562, "global_step": 445996, "epoch": 5373} {"train_loss": -27.59124755859375, "global_step": 445997, "epoch": 5373} {"train_loss": -27.443130493164062, "global_step": 445998, "epoch": 5373} {"train_loss": -27.169940948486328, "global_step": 445999, "epoch": 5373} {"train_loss": -27.096338272094727, "global_step": 446000, "epoch": 5373} {"train_loss": -27.210956573486328, "global_step": 446001, "epoch": 5373} {"train_loss": -27.22147560119629, "global_step": 446002, "epoch": 5373} {"train_loss": -27.09136962890625, "global_step": 446003, "epoch": 5373} {"train_loss": -27.848485946655273, "global_step": 446004, "epoch": 5373} {"train_loss": -27.135046005249023, "global_step": 446005, "epoch": 5373} {"train_loss": -27.23789405822754, "global_step": 446006, "epoch": 5373} {"train_loss": -27.01653480529785, "global_step": 446007, "epoch": 5373} {"train_loss": -27.18220329284668, "global_step": 446008, "epoch": 5373} {"train_loss": -27.288192749023438, "global_step": 446009, "epoch": 5373} {"train_loss": -27.222387313842773, "global_step": 446010, "epoch": 5373} {"train_loss": -27.156579971313477, "global_step": 446011, "epoch": 5373} {"train_loss": -27.022296905517578, "global_step": 446012, "epoch": 5373} {"train_loss": -27.30315589904785, "global_step": 446013, "epoch": 5373} {"train_loss": -27.235593795776367, "global_step": 446014, "epoch": 5373} {"train_loss": -27.248111724853516, "global_step": 446015, "epoch": 5373} {"train_loss": -26.866540908813477, "global_step": 446016, "epoch": 5373} {"train_loss": -26.58585548400879, "global_step": 446017, "epoch": 5373} {"train_loss": -26.485855102539062, "global_step": 446018, "epoch": 5373} {"train_loss": -25.947433471679688, "global_step": 446019, "epoch": 5373} {"train_loss": -26.06878089904785, "global_step": 446020, "epoch": 5373} {"train_loss": -27.12147331237793, "global_step": 446021, "epoch": 5373} {"train_loss": -26.532712936401367, "global_step": 446022, "epoch": 5373} {"train_loss": -26.134382247924805, "global_step": 446023, "epoch": 5373} {"train_loss": -26.638580322265625, "global_step": 446024, "epoch": 5373} {"train_loss": -26.283096313476562, "global_step": 446025, "epoch": 5373} {"train_loss": -27.163984298706055, "global_step": 446026, "epoch": 5373} {"train_loss": -26.70810890197754, "global_step": 446027, "epoch": 5373} {"train_loss": -26.862625122070312, "global_step": 446028, "epoch": 5373} {"train_loss": -26.356098175048828, "global_step": 446029, "epoch": 5373} {"train_loss": -26.79135513305664, "global_step": 446030, "epoch": 5373} {"train_loss": -26.573322296142578, "global_step": 446031, "epoch": 5373} {"train_loss": -26.786596298217773, "global_step": 446032, "epoch": 5373} {"train_loss": -26.80060386657715, "global_step": 446033, "epoch": 5373} {"train_loss": -27.340991973876953, "global_step": 446034, "epoch": 5373} {"train_loss": -26.41815185546875, "global_step": 446035, "epoch": 5373} {"train_loss": -26.204381942749023, "global_step": 446036, "epoch": 5373} {"train_loss": -26.92399024963379, "global_step": 446037, "epoch": 5373} {"train_loss": -26.951086044311523, "global_step": 446038, "epoch": 5373} {"train_loss": -26.389667510986328, "global_step": 446039, "epoch": 5373} {"train_loss": -26.67280387878418, "global_step": 446040, "epoch": 5373} {"train_loss": -26.811993357646895, "global_step": 446041, "epoch": 5373, "val_loss": 6544376.0} {"train_loss": -24.196598052978516, "global_step": 446042, "epoch": 5374} {"train_loss": -25.773513793945312, "global_step": 446043, "epoch": 5374} {"train_loss": -25.437803268432617, "global_step": 446044, "epoch": 5374} {"train_loss": -24.867197036743164, "global_step": 446045, "epoch": 5374} {"train_loss": -26.241439819335938, "global_step": 446046, "epoch": 5374} {"train_loss": -26.770782470703125, "global_step": 446047, "epoch": 5374} {"train_loss": -25.851102828979492, "global_step": 446048, "epoch": 5374} {"train_loss": -26.124984741210938, "global_step": 446049, "epoch": 5374} {"train_loss": -26.379663467407227, "global_step": 446050, "epoch": 5374} {"train_loss": -26.557519912719727, "global_step": 446051, "epoch": 5374} {"train_loss": -26.041589736938477, "global_step": 446052, "epoch": 5374} {"train_loss": -26.597579956054688, "global_step": 446053, "epoch": 5374} {"train_loss": -26.064062118530273, "global_step": 446054, "epoch": 5374} {"train_loss": -26.22944450378418, "global_step": 446055, "epoch": 5374} {"train_loss": -26.6640682220459, "global_step": 446056, "epoch": 5374} {"train_loss": -26.139551162719727, "global_step": 446057, "epoch": 5374} {"train_loss": -26.811725616455078, "global_step": 446058, "epoch": 5374} {"train_loss": -26.386737823486328, "global_step": 446059, "epoch": 5374} {"train_loss": -26.57850456237793, "global_step": 446060, "epoch": 5374} {"train_loss": -26.230199813842773, "global_step": 446061, "epoch": 5374} {"train_loss": -26.4747257232666, "global_step": 446062, "epoch": 5374} {"train_loss": -26.510223388671875, "global_step": 446063, "epoch": 5374} {"train_loss": -26.372705459594727, "global_step": 446064, "epoch": 5374} {"train_loss": -26.390243530273438, "global_step": 446065, "epoch": 5374} {"train_loss": -27.043872833251953, "global_step": 446066, "epoch": 5374} {"train_loss": -26.47159767150879, "global_step": 446067, "epoch": 5374} {"train_loss": -26.883453369140625, "global_step": 446068, "epoch": 5374} {"train_loss": -27.043588638305664, "global_step": 446069, "epoch": 5374} {"train_loss": -27.052587509155273, "global_step": 446070, "epoch": 5374} {"train_loss": -27.125009536743164, "global_step": 446071, "epoch": 5374} {"train_loss": -26.58497428894043, "global_step": 446072, "epoch": 5374} {"train_loss": -27.05209732055664, "global_step": 446073, "epoch": 5374} {"train_loss": -26.709766387939453, "global_step": 446074, "epoch": 5374} {"train_loss": -27.1362361907959, "global_step": 446075, "epoch": 5374} {"train_loss": -27.33790397644043, "global_step": 446076, "epoch": 5374} {"train_loss": -27.123815536499023, "global_step": 446077, "epoch": 5374} {"train_loss": -26.839569091796875, "global_step": 446078, "epoch": 5374} {"train_loss": -26.768762588500977, "global_step": 446079, "epoch": 5374} {"train_loss": -26.588470458984375, "global_step": 446080, "epoch": 5374} {"train_loss": -26.97931480407715, "global_step": 446081, "epoch": 5374} {"train_loss": -26.83660316467285, "global_step": 446082, "epoch": 5374} {"train_loss": -26.814533233642578, "global_step": 446083, "epoch": 5374} {"train_loss": -27.342771530151367, "global_step": 446084, "epoch": 5374} {"train_loss": -26.7489070892334, "global_step": 446085, "epoch": 5374} {"train_loss": -27.164478302001953, "global_step": 446086, "epoch": 5374} {"train_loss": -26.635889053344727, "global_step": 446087, "epoch": 5374} {"train_loss": -26.904966354370117, "global_step": 446088, "epoch": 5374} {"train_loss": -26.91463279724121, "global_step": 446089, "epoch": 5374} {"train_loss": -27.015323638916016, "global_step": 446090, "epoch": 5374} {"train_loss": -27.246723175048828, "global_step": 446091, "epoch": 5374} {"train_loss": -26.862966537475586, "global_step": 446092, "epoch": 5374} {"train_loss": -26.9770565032959, "global_step": 446093, "epoch": 5374} {"train_loss": -26.99549674987793, "global_step": 446094, "epoch": 5374} {"train_loss": -27.044458389282227, "global_step": 446095, "epoch": 5374} {"train_loss": -26.829015731811523, "global_step": 446096, "epoch": 5374} {"train_loss": -26.875640869140625, "global_step": 446097, "epoch": 5374} {"train_loss": -26.807844161987305, "global_step": 446098, "epoch": 5374} {"train_loss": -27.204206466674805, "global_step": 446099, "epoch": 5374} {"train_loss": -26.953237533569336, "global_step": 446100, "epoch": 5374} {"train_loss": -26.540372848510742, "global_step": 446101, "epoch": 5374} {"train_loss": -27.3935489654541, "global_step": 446102, "epoch": 5374} {"train_loss": -27.288726806640625, "global_step": 446103, "epoch": 5374} {"train_loss": -27.084516525268555, "global_step": 446104, "epoch": 5374} {"train_loss": -27.050296783447266, "global_step": 446105, "epoch": 5374} {"train_loss": -26.670093536376953, "global_step": 446106, "epoch": 5374} {"train_loss": -26.481836318969727, "global_step": 446107, "epoch": 5374} {"train_loss": -26.254907608032227, "global_step": 446108, "epoch": 5374} {"train_loss": -26.905813217163086, "global_step": 446109, "epoch": 5374} {"train_loss": -26.715112686157227, "global_step": 446110, "epoch": 5374} {"train_loss": -27.291513442993164, "global_step": 446111, "epoch": 5374} {"train_loss": -27.03928565979004, "global_step": 446112, "epoch": 5374} {"train_loss": -26.761432647705078, "global_step": 446113, "epoch": 5374} {"train_loss": -27.41650390625, "global_step": 446114, "epoch": 5374} {"train_loss": -27.16254997253418, "global_step": 446115, "epoch": 5374} {"train_loss": -27.28879165649414, "global_step": 446116, "epoch": 5374} {"train_loss": -27.144819259643555, "global_step": 446117, "epoch": 5374} {"train_loss": -27.301654815673828, "global_step": 446118, "epoch": 5374} {"train_loss": -26.971654891967773, "global_step": 446119, "epoch": 5374} {"train_loss": -27.210956573486328, "global_step": 446120, "epoch": 5374} {"train_loss": -26.8259334564209, "global_step": 446121, "epoch": 5374} {"train_loss": -26.681982040405273, "global_step": 446122, "epoch": 5374} {"train_loss": -26.29050064086914, "global_step": 446123, "epoch": 5374} {"train_loss": -26.715185326266003, "global_step": 446124, "epoch": 5374, "val_loss": 6641281.0} {"train_loss": -26.566761016845703, "global_step": 446125, "epoch": 5375} {"train_loss": -26.16114616394043, "global_step": 446126, "epoch": 5375} {"train_loss": -26.154022216796875, "global_step": 446127, "epoch": 5375} {"train_loss": -25.516977310180664, "global_step": 446128, "epoch": 5375} {"train_loss": -25.394773483276367, "global_step": 446129, "epoch": 5375} {"train_loss": -26.346771240234375, "global_step": 446130, "epoch": 5375} {"train_loss": -26.20723533630371, "global_step": 446131, "epoch": 5375} {"train_loss": -26.655927658081055, "global_step": 446132, "epoch": 5375} {"train_loss": -25.709943771362305, "global_step": 446133, "epoch": 5375} {"train_loss": -26.6119441986084, "global_step": 446134, "epoch": 5375} {"train_loss": -26.6058406829834, "global_step": 446135, "epoch": 5375} {"train_loss": -26.40369987487793, "global_step": 446136, "epoch": 5375} {"train_loss": -25.929956436157227, "global_step": 446137, "epoch": 5375} {"train_loss": -26.7497501373291, "global_step": 446138, "epoch": 5375} {"train_loss": -26.517126083374023, "global_step": 446139, "epoch": 5375} {"train_loss": -26.569290161132812, "global_step": 446140, "epoch": 5375} {"train_loss": -26.483442306518555, "global_step": 446141, "epoch": 5375} {"train_loss": -26.52534294128418, "global_step": 446142, "epoch": 5375} {"train_loss": -26.563861846923828, "global_step": 446143, "epoch": 5375} {"train_loss": -26.823383331298828, "global_step": 446144, "epoch": 5375} {"train_loss": -26.75587272644043, "global_step": 446145, "epoch": 5375} {"train_loss": -27.11030387878418, "global_step": 446146, "epoch": 5375} {"train_loss": -26.497838973999023, "global_step": 446147, "epoch": 5375} {"train_loss": -26.768171310424805, "global_step": 446148, "epoch": 5375} {"train_loss": -27.113327026367188, "global_step": 446149, "epoch": 5375} {"train_loss": -26.588531494140625, "global_step": 446150, "epoch": 5375} {"train_loss": -26.396596908569336, "global_step": 446151, "epoch": 5375} {"train_loss": -26.868682861328125, "global_step": 446152, "epoch": 5375} {"train_loss": -27.135366439819336, "global_step": 446153, "epoch": 5375} {"train_loss": -27.046411514282227, "global_step": 446154, "epoch": 5375} {"train_loss": -26.936237335205078, "global_step": 446155, "epoch": 5375} {"train_loss": -26.92193603515625, "global_step": 446156, "epoch": 5375} {"train_loss": -26.92538833618164, "global_step": 446157, "epoch": 5375} {"train_loss": -26.9728946685791, "global_step": 446158, "epoch": 5375} {"train_loss": -26.918598175048828, "global_step": 446159, "epoch": 5375} {"train_loss": -27.058368682861328, "global_step": 446160, "epoch": 5375} {"train_loss": -26.605920791625977, "global_step": 446161, "epoch": 5375} {"train_loss": -26.720306396484375, "global_step": 446162, "epoch": 5375} {"train_loss": -26.4780330657959, "global_step": 446163, "epoch": 5375} {"train_loss": -27.161508560180664, "global_step": 446164, "epoch": 5375} {"train_loss": -26.8673038482666, "global_step": 446165, "epoch": 5375} {"train_loss": -27.023895263671875, "global_step": 446166, "epoch": 5375} {"train_loss": -27.028879165649414, "global_step": 446167, "epoch": 5375} {"train_loss": -26.696252822875977, "global_step": 446168, "epoch": 5375} {"train_loss": -26.763355255126953, "global_step": 446169, "epoch": 5375} {"train_loss": -26.760669708251953, "global_step": 446170, "epoch": 5375} {"train_loss": -26.860382080078125, "global_step": 446171, "epoch": 5375} {"train_loss": -26.570520401000977, "global_step": 446172, "epoch": 5375} {"train_loss": -26.975982666015625, "global_step": 446173, "epoch": 5375} {"train_loss": -26.810754776000977, "global_step": 446174, "epoch": 5375} {"train_loss": -26.83935546875, "global_step": 446175, "epoch": 5375} {"train_loss": -26.79816246032715, "global_step": 446176, "epoch": 5375} {"train_loss": -26.366561889648438, "global_step": 446177, "epoch": 5375} {"train_loss": -26.489892959594727, "global_step": 446178, "epoch": 5375} {"train_loss": -26.97043800354004, "global_step": 446179, "epoch": 5375} {"train_loss": -26.3328800201416, "global_step": 446180, "epoch": 5375} {"train_loss": -26.91053581237793, "global_step": 446181, "epoch": 5375} {"train_loss": -26.73666763305664, "global_step": 446182, "epoch": 5375} {"train_loss": -26.868906021118164, "global_step": 446183, "epoch": 5375} {"train_loss": -27.152816772460938, "global_step": 446184, "epoch": 5375} {"train_loss": -26.86810874938965, "global_step": 446185, "epoch": 5375} {"train_loss": -26.917041778564453, "global_step": 446186, "epoch": 5375} {"train_loss": -26.8011417388916, "global_step": 446187, "epoch": 5375} {"train_loss": -26.971872329711914, "global_step": 446188, "epoch": 5375} {"train_loss": -27.150592803955078, "global_step": 446189, "epoch": 5375} {"train_loss": -27.0755558013916, "global_step": 446190, "epoch": 5375} {"train_loss": -27.03545570373535, "global_step": 446191, "epoch": 5375} {"train_loss": -26.981489181518555, "global_step": 446192, "epoch": 5375} {"train_loss": -27.00745964050293, "global_step": 446193, "epoch": 5375} {"train_loss": -27.02219009399414, "global_step": 446194, "epoch": 5375} {"train_loss": -26.897159576416016, "global_step": 446195, "epoch": 5375} {"train_loss": -27.273956298828125, "global_step": 446196, "epoch": 5375} {"train_loss": -26.80506706237793, "global_step": 446197, "epoch": 5375} {"train_loss": -27.117050170898438, "global_step": 446198, "epoch": 5375} {"train_loss": -26.746475219726562, "global_step": 446199, "epoch": 5375} {"train_loss": -27.354162216186523, "global_step": 446200, "epoch": 5375} {"train_loss": -27.149023056030273, "global_step": 446201, "epoch": 5375} {"train_loss": -27.770721435546875, "global_step": 446202, "epoch": 5375} {"train_loss": -27.01322364807129, "global_step": 446203, "epoch": 5375} {"train_loss": -26.69024658203125, "global_step": 446204, "epoch": 5375} {"train_loss": -27.111724853515625, "global_step": 446205, "epoch": 5375} {"train_loss": -26.698240280151367, "global_step": 446206, "epoch": 5375} {"train_loss": -26.72444626222174, "global_step": 446207, "epoch": 5375, "val_loss": 6512033.0} {"train_loss": -25.816699981689453, "global_step": 446208, "epoch": 5376} {"train_loss": -25.572105407714844, "global_step": 446209, "epoch": 5376} {"train_loss": -25.768640518188477, "global_step": 446210, "epoch": 5376} {"train_loss": -26.0199031829834, "global_step": 446211, "epoch": 5376} {"train_loss": -26.031417846679688, "global_step": 446212, "epoch": 5376} {"train_loss": -26.007816314697266, "global_step": 446213, "epoch": 5376} {"train_loss": -26.26752281188965, "global_step": 446214, "epoch": 5376} {"train_loss": -26.39357566833496, "global_step": 446215, "epoch": 5376} {"train_loss": -26.13543701171875, "global_step": 446216, "epoch": 5376} {"train_loss": -25.81418228149414, "global_step": 446217, "epoch": 5376} {"train_loss": -26.38427734375, "global_step": 446218, "epoch": 5376} {"train_loss": -26.33338737487793, "global_step": 446219, "epoch": 5376} {"train_loss": -26.92081642150879, "global_step": 446220, "epoch": 5376} {"train_loss": -26.61787223815918, "global_step": 446221, "epoch": 5376} {"train_loss": -26.634342193603516, "global_step": 446222, "epoch": 5376} {"train_loss": -26.610803604125977, "global_step": 446223, "epoch": 5376} {"train_loss": -26.791711807250977, "global_step": 446224, "epoch": 5376} {"train_loss": -26.61342430114746, "global_step": 446225, "epoch": 5376} {"train_loss": -26.97983169555664, "global_step": 446226, "epoch": 5376} {"train_loss": -26.4527530670166, "global_step": 446227, "epoch": 5376} {"train_loss": -27.030309677124023, "global_step": 446228, "epoch": 5376} {"train_loss": -26.804279327392578, "global_step": 446229, "epoch": 5376} {"train_loss": -26.411788940429688, "global_step": 446230, "epoch": 5376} {"train_loss": -26.75763511657715, "global_step": 446231, "epoch": 5376} {"train_loss": -26.752826690673828, "global_step": 446232, "epoch": 5376} {"train_loss": -26.4721736907959, "global_step": 446233, "epoch": 5376} {"train_loss": -26.866073608398438, "global_step": 446234, "epoch": 5376} {"train_loss": -26.81131935119629, "global_step": 446235, "epoch": 5376} {"train_loss": -27.105688095092773, "global_step": 446236, "epoch": 5376} {"train_loss": -27.19061279296875, "global_step": 446237, "epoch": 5376} {"train_loss": -27.126379013061523, "global_step": 446238, "epoch": 5376} {"train_loss": -27.264554977416992, "global_step": 446239, "epoch": 5376} {"train_loss": -26.862258911132812, "global_step": 446240, "epoch": 5376} {"train_loss": -27.0285701751709, "global_step": 446241, "epoch": 5376} {"train_loss": -27.002500534057617, "global_step": 446242, "epoch": 5376} {"train_loss": -26.828943252563477, "global_step": 446243, "epoch": 5376} {"train_loss": -27.24538230895996, "global_step": 446244, "epoch": 5376} {"train_loss": -27.213048934936523, "global_step": 446245, "epoch": 5376} {"train_loss": -27.01618003845215, "global_step": 446246, "epoch": 5376} {"train_loss": -27.233396530151367, "global_step": 446247, "epoch": 5376} {"train_loss": -26.98221206665039, "global_step": 446248, "epoch": 5376} {"train_loss": -26.832015991210938, "global_step": 446249, "epoch": 5376} {"train_loss": -27.139875411987305, "global_step": 446250, "epoch": 5376} {"train_loss": -26.8912410736084, "global_step": 446251, "epoch": 5376} {"train_loss": -26.75306510925293, "global_step": 446252, "epoch": 5376} {"train_loss": -27.22412109375, "global_step": 446253, "epoch": 5376} {"train_loss": -26.964710235595703, "global_step": 446254, "epoch": 5376} {"train_loss": -27.178241729736328, "global_step": 446255, "epoch": 5376} {"train_loss": -26.968887329101562, "global_step": 446256, "epoch": 5376} {"train_loss": -26.814733505249023, "global_step": 446257, "epoch": 5376} {"train_loss": -26.95932388305664, "global_step": 446258, "epoch": 5376} {"train_loss": -27.378976821899414, "global_step": 446259, "epoch": 5376} {"train_loss": -27.249984741210938, "global_step": 446260, "epoch": 5376} {"train_loss": -27.155065536499023, "global_step": 446261, "epoch": 5376} {"train_loss": -27.17817497253418, "global_step": 446262, "epoch": 5376} {"train_loss": -27.00885009765625, "global_step": 446263, "epoch": 5376} {"train_loss": -27.300256729125977, "global_step": 446264, "epoch": 5376} {"train_loss": -26.755212783813477, "global_step": 446265, "epoch": 5376} {"train_loss": -27.027328491210938, "global_step": 446266, "epoch": 5376} {"train_loss": -26.837696075439453, "global_step": 446267, "epoch": 5376} {"train_loss": -27.160999298095703, "global_step": 446268, "epoch": 5376} {"train_loss": -27.20328140258789, "global_step": 446269, "epoch": 5376} {"train_loss": -27.107919692993164, "global_step": 446270, "epoch": 5376} {"train_loss": -26.904279708862305, "global_step": 446271, "epoch": 5376} {"train_loss": -27.243967056274414, "global_step": 446272, "epoch": 5376} {"train_loss": -27.1612606048584, "global_step": 446273, "epoch": 5376} {"train_loss": -27.23394775390625, "global_step": 446274, "epoch": 5376} {"train_loss": -26.852075576782227, "global_step": 446275, "epoch": 5376} {"train_loss": -26.629261016845703, "global_step": 446276, "epoch": 5376} {"train_loss": -26.255842208862305, "global_step": 446277, "epoch": 5376} {"train_loss": -26.25080680847168, "global_step": 446278, "epoch": 5376} {"train_loss": -26.5640869140625, "global_step": 446279, "epoch": 5376} {"train_loss": -27.16383171081543, "global_step": 446280, "epoch": 5376} {"train_loss": -26.56268310546875, "global_step": 446281, "epoch": 5376} {"train_loss": -26.98480224609375, "global_step": 446282, "epoch": 5376} {"train_loss": -27.180017471313477, "global_step": 446283, "epoch": 5376} {"train_loss": -26.965757369995117, "global_step": 446284, "epoch": 5376} {"train_loss": -27.021045684814453, "global_step": 446285, "epoch": 5376} {"train_loss": -26.96380615234375, "global_step": 446286, "epoch": 5376} {"train_loss": -26.948266983032227, "global_step": 446287, "epoch": 5376} {"train_loss": -26.947223663330078, "global_step": 446288, "epoch": 5376} {"train_loss": -27.1147518157959, "global_step": 446289, "epoch": 5376} {"train_loss": -26.809404350188842, "global_step": 446290, "epoch": 5376, "val_loss": 6536257.5} {"train_loss": -26.559228897094727, "global_step": 446291, "epoch": 5377} {"train_loss": -25.560354232788086, "global_step": 446292, "epoch": 5377} {"train_loss": -25.796314239501953, "global_step": 446293, "epoch": 5377} {"train_loss": -26.256973266601562, "global_step": 446294, "epoch": 5377} {"train_loss": -26.6173095703125, "global_step": 446295, "epoch": 5377} {"train_loss": -25.78428077697754, "global_step": 446296, "epoch": 5377} {"train_loss": -26.81884765625, "global_step": 446297, "epoch": 5377} {"train_loss": -26.233396530151367, "global_step": 446298, "epoch": 5377} {"train_loss": -26.412866592407227, "global_step": 446299, "epoch": 5377} {"train_loss": -26.574369430541992, "global_step": 446300, "epoch": 5377} {"train_loss": -26.741729736328125, "global_step": 446301, "epoch": 5377} {"train_loss": -26.68503761291504, "global_step": 446302, "epoch": 5377} {"train_loss": -26.38101577758789, "global_step": 446303, "epoch": 5377} {"train_loss": -26.725332260131836, "global_step": 446304, "epoch": 5377} {"train_loss": -26.634347915649414, "global_step": 446305, "epoch": 5377} {"train_loss": -26.510400772094727, "global_step": 446306, "epoch": 5377} {"train_loss": -26.673480987548828, "global_step": 446307, "epoch": 5377} {"train_loss": -26.691213607788086, "global_step": 446308, "epoch": 5377} {"train_loss": -26.91900634765625, "global_step": 446309, "epoch": 5377} {"train_loss": -26.527917861938477, "global_step": 446310, "epoch": 5377} {"train_loss": -27.057846069335938, "global_step": 446311, "epoch": 5377} {"train_loss": -26.567365646362305, "global_step": 446312, "epoch": 5377} {"train_loss": -26.640222549438477, "global_step": 446313, "epoch": 5377} {"train_loss": -26.915790557861328, "global_step": 446314, "epoch": 5377} {"train_loss": -26.639911651611328, "global_step": 446315, "epoch": 5377} {"train_loss": -26.909881591796875, "global_step": 446316, "epoch": 5377} {"train_loss": -26.893558502197266, "global_step": 446317, "epoch": 5377} {"train_loss": -27.08086585998535, "global_step": 446318, "epoch": 5377} {"train_loss": -26.71967887878418, "global_step": 446319, "epoch": 5377} {"train_loss": -27.165815353393555, "global_step": 446320, "epoch": 5377} {"train_loss": -27.10992431640625, "global_step": 446321, "epoch": 5377} {"train_loss": -27.005895614624023, "global_step": 446322, "epoch": 5377} {"train_loss": -26.83332633972168, "global_step": 446323, "epoch": 5377} {"train_loss": -27.47018814086914, "global_step": 446324, "epoch": 5377} {"train_loss": -26.89210319519043, "global_step": 446325, "epoch": 5377} {"train_loss": -27.059589385986328, "global_step": 446326, "epoch": 5377} {"train_loss": -27.280149459838867, "global_step": 446327, "epoch": 5377} {"train_loss": -27.153852462768555, "global_step": 446328, "epoch": 5377} {"train_loss": -27.169036865234375, "global_step": 446329, "epoch": 5377} {"train_loss": -26.96601676940918, "global_step": 446330, "epoch": 5377} {"train_loss": -26.985809326171875, "global_step": 446331, "epoch": 5377} {"train_loss": -27.327014923095703, "global_step": 446332, "epoch": 5377} {"train_loss": -27.370771408081055, "global_step": 446333, "epoch": 5377} {"train_loss": -27.37884521484375, "global_step": 446334, "epoch": 5377} {"train_loss": -26.990259170532227, "global_step": 446335, "epoch": 5377} {"train_loss": -27.195398330688477, "global_step": 446336, "epoch": 5377} {"train_loss": -26.87445068359375, "global_step": 446337, "epoch": 5377} {"train_loss": -27.016813278198242, "global_step": 446338, "epoch": 5377} {"train_loss": -27.183002471923828, "global_step": 446339, "epoch": 5377} {"train_loss": -26.7850399017334, "global_step": 446340, "epoch": 5377} {"train_loss": -26.674680709838867, "global_step": 446341, "epoch": 5377} {"train_loss": -27.11751365661621, "global_step": 446342, "epoch": 5377} {"train_loss": -26.716800689697266, "global_step": 446343, "epoch": 5377} {"train_loss": -27.201948165893555, "global_step": 446344, "epoch": 5377} {"train_loss": -27.188013076782227, "global_step": 446345, "epoch": 5377} {"train_loss": -26.768207550048828, "global_step": 446346, "epoch": 5377} {"train_loss": -27.45680046081543, "global_step": 446347, "epoch": 5377} {"train_loss": -26.889041900634766, "global_step": 446348, "epoch": 5377} {"train_loss": -26.97059440612793, "global_step": 446349, "epoch": 5377} {"train_loss": -26.978775024414062, "global_step": 446350, "epoch": 5377} {"train_loss": -27.370420455932617, "global_step": 446351, "epoch": 5377} {"train_loss": -27.18758201599121, "global_step": 446352, "epoch": 5377} {"train_loss": -27.039709091186523, "global_step": 446353, "epoch": 5377} {"train_loss": -27.034635543823242, "global_step": 446354, "epoch": 5377} {"train_loss": -26.843475341796875, "global_step": 446355, "epoch": 5377} {"train_loss": -26.73486328125, "global_step": 446356, "epoch": 5377} {"train_loss": -26.978504180908203, "global_step": 446357, "epoch": 5377} {"train_loss": -27.21097755432129, "global_step": 446358, "epoch": 5377} {"train_loss": -27.12493896484375, "global_step": 446359, "epoch": 5377} {"train_loss": -27.245792388916016, "global_step": 446360, "epoch": 5377} {"train_loss": -27.41326332092285, "global_step": 446361, "epoch": 5377} {"train_loss": -27.03335952758789, "global_step": 446362, "epoch": 5377} {"train_loss": -26.993799209594727, "global_step": 446363, "epoch": 5377} {"train_loss": -27.055524826049805, "global_step": 446364, "epoch": 5377} {"train_loss": -27.4471435546875, "global_step": 446365, "epoch": 5377} {"train_loss": -27.326541900634766, "global_step": 446366, "epoch": 5377} {"train_loss": -27.203954696655273, "global_step": 446367, "epoch": 5377} {"train_loss": -27.03169059753418, "global_step": 446368, "epoch": 5377} {"train_loss": -26.91584587097168, "global_step": 446369, "epoch": 5377} {"train_loss": -27.1144962310791, "global_step": 446370, "epoch": 5377} {"train_loss": -27.278451919555664, "global_step": 446371, "epoch": 5377} {"train_loss": -26.98518943786621, "global_step": 446372, "epoch": 5377} {"train_loss": -26.9069990364902, "global_step": 446373, "epoch": 5377, "val_loss": 6552767.0} {"train_loss": -27.65964126586914, "global_step": 446374, "epoch": 5378} {"train_loss": -27.077640533447266, "global_step": 446375, "epoch": 5378} {"train_loss": -27.066974639892578, "global_step": 446376, "epoch": 5378} {"train_loss": -26.986572265625, "global_step": 446377, "epoch": 5378} {"train_loss": -26.8255615234375, "global_step": 446378, "epoch": 5378} {"train_loss": -26.927404403686523, "global_step": 446379, "epoch": 5378} {"train_loss": -27.0380802154541, "global_step": 446380, "epoch": 5378} {"train_loss": -27.034616470336914, "global_step": 446381, "epoch": 5378} {"train_loss": -26.71567153930664, "global_step": 446382, "epoch": 5378} {"train_loss": -26.612640380859375, "global_step": 446383, "epoch": 5378} {"train_loss": -27.14027214050293, "global_step": 446384, "epoch": 5378} {"train_loss": -27.087507247924805, "global_step": 446385, "epoch": 5378} {"train_loss": -26.948989868164062, "global_step": 446386, "epoch": 5378} {"train_loss": -26.560476303100586, "global_step": 446387, "epoch": 5378} {"train_loss": -27.28522300720215, "global_step": 446388, "epoch": 5378} {"train_loss": -27.193740844726562, "global_step": 446389, "epoch": 5378} {"train_loss": -26.931188583374023, "global_step": 446390, "epoch": 5378} {"train_loss": -26.828022003173828, "global_step": 446391, "epoch": 5378} {"train_loss": -27.039295196533203, "global_step": 446392, "epoch": 5378} {"train_loss": -27.06463623046875, "global_step": 446393, "epoch": 5378} {"train_loss": -26.982629776000977, "global_step": 446394, "epoch": 5378} {"train_loss": -26.987030029296875, "global_step": 446395, "epoch": 5378} {"train_loss": -26.843427658081055, "global_step": 446396, "epoch": 5378} {"train_loss": -26.872060775756836, "global_step": 446397, "epoch": 5378} {"train_loss": -27.182666778564453, "global_step": 446398, "epoch": 5378} {"train_loss": -26.955297470092773, "global_step": 446399, "epoch": 5378} {"train_loss": -26.915943145751953, "global_step": 446400, "epoch": 5378} {"train_loss": -26.990497589111328, "global_step": 446401, "epoch": 5378} {"train_loss": -26.870344161987305, "global_step": 446402, "epoch": 5378} {"train_loss": -27.082904815673828, "global_step": 446403, "epoch": 5378} {"train_loss": -26.942930221557617, "global_step": 446404, "epoch": 5378} {"train_loss": -27.41575050354004, "global_step": 446405, "epoch": 5378} {"train_loss": -27.107831954956055, "global_step": 446406, "epoch": 5378} {"train_loss": -27.20757484436035, "global_step": 446407, "epoch": 5378} {"train_loss": -26.661029815673828, "global_step": 446408, "epoch": 5378} {"train_loss": -27.127777099609375, "global_step": 446409, "epoch": 5378} {"train_loss": -26.961069107055664, "global_step": 446410, "epoch": 5378} {"train_loss": -27.12766456604004, "global_step": 446411, "epoch": 5378} {"train_loss": -27.493078231811523, "global_step": 446412, "epoch": 5378} {"train_loss": -27.185626983642578, "global_step": 446413, "epoch": 5378} {"train_loss": -26.9119930267334, "global_step": 446414, "epoch": 5378} {"train_loss": -26.963659286499023, "global_step": 446415, "epoch": 5378} {"train_loss": -27.061681747436523, "global_step": 446416, "epoch": 5378} {"train_loss": -26.535781860351562, "global_step": 446417, "epoch": 5378} {"train_loss": -26.997838973999023, "global_step": 446418, "epoch": 5378} {"train_loss": -26.918014526367188, "global_step": 446419, "epoch": 5378} {"train_loss": -27.227354049682617, "global_step": 446420, "epoch": 5378} {"train_loss": -26.988855361938477, "global_step": 446421, "epoch": 5378} {"train_loss": -27.168975830078125, "global_step": 446422, "epoch": 5378} {"train_loss": -27.027318954467773, "global_step": 446423, "epoch": 5378} {"train_loss": -26.816791534423828, "global_step": 446424, "epoch": 5378} {"train_loss": -27.362958908081055, "global_step": 446425, "epoch": 5378} {"train_loss": -26.836090087890625, "global_step": 446426, "epoch": 5378} {"train_loss": -27.180973052978516, "global_step": 446427, "epoch": 5378} {"train_loss": -26.72193717956543, "global_step": 446428, "epoch": 5378} {"train_loss": -26.886411666870117, "global_step": 446429, "epoch": 5378} {"train_loss": -27.37166404724121, "global_step": 446430, "epoch": 5378} {"train_loss": -26.975616455078125, "global_step": 446431, "epoch": 5378} {"train_loss": -26.993377685546875, "global_step": 446432, "epoch": 5378} {"train_loss": -27.29854393005371, "global_step": 446433, "epoch": 5378} {"train_loss": -27.024662017822266, "global_step": 446434, "epoch": 5378} {"train_loss": -26.8339900970459, "global_step": 446435, "epoch": 5378} {"train_loss": -27.28207778930664, "global_step": 446436, "epoch": 5378} {"train_loss": -27.040124893188477, "global_step": 446437, "epoch": 5378} {"train_loss": -27.2685546875, "global_step": 446438, "epoch": 5378} {"train_loss": -27.315505981445312, "global_step": 446439, "epoch": 5378} {"train_loss": -27.295835494995117, "global_step": 446440, "epoch": 5378} {"train_loss": -27.28008460998535, "global_step": 446441, "epoch": 5378} {"train_loss": -26.934070587158203, "global_step": 446442, "epoch": 5378} {"train_loss": -27.17091941833496, "global_step": 446443, "epoch": 5378} {"train_loss": -27.162927627563477, "global_step": 446444, "epoch": 5378} {"train_loss": -26.8407039642334, "global_step": 446445, "epoch": 5378} {"train_loss": -26.532480239868164, "global_step": 446446, "epoch": 5378} {"train_loss": -26.261764526367188, "global_step": 446447, "epoch": 5378} {"train_loss": -26.88824462890625, "global_step": 446448, "epoch": 5378} {"train_loss": -26.81245994567871, "global_step": 446449, "epoch": 5378} {"train_loss": -27.27225112915039, "global_step": 446450, "epoch": 5378} {"train_loss": -27.039487838745117, "global_step": 446451, "epoch": 5378} {"train_loss": -26.693450927734375, "global_step": 446452, "epoch": 5378} {"train_loss": -27.215219497680664, "global_step": 446453, "epoch": 5378} {"train_loss": -26.743061065673828, "global_step": 446454, "epoch": 5378} {"train_loss": -27.154449462890625, "global_step": 446455, "epoch": 5378} {"train_loss": -27.013638967491058, "global_step": 446456, "epoch": 5378, "val_loss": 6620188.0} {"train_loss": -25.569726943969727, "global_step": 446457, "epoch": 5379} {"train_loss": -25.526065826416016, "global_step": 446458, "epoch": 5379} {"train_loss": -26.018396377563477, "global_step": 446459, "epoch": 5379} {"train_loss": -25.915821075439453, "global_step": 446460, "epoch": 5379} {"train_loss": -26.656476974487305, "global_step": 446461, "epoch": 5379} {"train_loss": -26.35129737854004, "global_step": 446462, "epoch": 5379} {"train_loss": -25.992938995361328, "global_step": 446463, "epoch": 5379} {"train_loss": -26.424026489257812, "global_step": 446464, "epoch": 5379} {"train_loss": -26.45120620727539, "global_step": 446465, "epoch": 5379} {"train_loss": -26.0217227935791, "global_step": 446466, "epoch": 5379} {"train_loss": -26.67718505859375, "global_step": 446467, "epoch": 5379} {"train_loss": -26.57733154296875, "global_step": 446468, "epoch": 5379} {"train_loss": -26.362552642822266, "global_step": 446469, "epoch": 5379} {"train_loss": -26.30034828186035, "global_step": 446470, "epoch": 5379} {"train_loss": -26.457874298095703, "global_step": 446471, "epoch": 5379} {"train_loss": -26.527379989624023, "global_step": 446472, "epoch": 5379} {"train_loss": -26.433095932006836, "global_step": 446473, "epoch": 5379} {"train_loss": -26.502424240112305, "global_step": 446474, "epoch": 5379} {"train_loss": -26.54729652404785, "global_step": 446475, "epoch": 5379} {"train_loss": -26.744525909423828, "global_step": 446476, "epoch": 5379} {"train_loss": -26.769672393798828, "global_step": 446477, "epoch": 5379} {"train_loss": -26.75996208190918, "global_step": 446478, "epoch": 5379} {"train_loss": -26.880456924438477, "global_step": 446479, "epoch": 5379} {"train_loss": -26.661462783813477, "global_step": 446480, "epoch": 5379} {"train_loss": -26.867279052734375, "global_step": 446481, "epoch": 5379} {"train_loss": -26.580718994140625, "global_step": 446482, "epoch": 5379} {"train_loss": -27.127225875854492, "global_step": 446483, "epoch": 5379} {"train_loss": -26.86128044128418, "global_step": 446484, "epoch": 5379} {"train_loss": -26.655658721923828, "global_step": 446485, "epoch": 5379} {"train_loss": -26.862762451171875, "global_step": 446486, "epoch": 5379} {"train_loss": -26.847570419311523, "global_step": 446487, "epoch": 5379} {"train_loss": -26.48415184020996, "global_step": 446488, "epoch": 5379} {"train_loss": -27.119604110717773, "global_step": 446489, "epoch": 5379} {"train_loss": -26.85087013244629, "global_step": 446490, "epoch": 5379} {"train_loss": -26.90740394592285, "global_step": 446491, "epoch": 5379} {"train_loss": -26.79329490661621, "global_step": 446492, "epoch": 5379} {"train_loss": -26.749006271362305, "global_step": 446493, "epoch": 5379} {"train_loss": -26.878210067749023, "global_step": 446494, "epoch": 5379} {"train_loss": -27.190832138061523, "global_step": 446495, "epoch": 5379} {"train_loss": -27.08973503112793, "global_step": 446496, "epoch": 5379} {"train_loss": -26.83131980895996, "global_step": 446497, "epoch": 5379} {"train_loss": -26.73660659790039, "global_step": 446498, "epoch": 5379} {"train_loss": -27.10329246520996, "global_step": 446499, "epoch": 5379} {"train_loss": -27.445764541625977, "global_step": 446500, "epoch": 5379} {"train_loss": -27.003732681274414, "global_step": 446501, "epoch": 5379} {"train_loss": -27.323938369750977, "global_step": 446502, "epoch": 5379} {"train_loss": -27.870676040649414, "global_step": 446503, "epoch": 5379} {"train_loss": -27.2685546875, "global_step": 446504, "epoch": 5379} {"train_loss": -27.465620040893555, "global_step": 446505, "epoch": 5379} {"train_loss": -26.784198760986328, "global_step": 446506, "epoch": 5379} {"train_loss": -27.205078125, "global_step": 446507, "epoch": 5379} {"train_loss": -27.21565818786621, "global_step": 446508, "epoch": 5379} {"train_loss": -26.974145889282227, "global_step": 446509, "epoch": 5379} {"train_loss": -26.962202072143555, "global_step": 446510, "epoch": 5379} {"train_loss": -27.309925079345703, "global_step": 446511, "epoch": 5379} {"train_loss": -26.865766525268555, "global_step": 446512, "epoch": 5379} {"train_loss": -26.97931480407715, "global_step": 446513, "epoch": 5379} {"train_loss": -27.202106475830078, "global_step": 446514, "epoch": 5379} {"train_loss": -27.24770164489746, "global_step": 446515, "epoch": 5379} {"train_loss": -27.598608016967773, "global_step": 446516, "epoch": 5379} {"train_loss": -27.05071449279785, "global_step": 446517, "epoch": 5379} {"train_loss": -27.163015365600586, "global_step": 446518, "epoch": 5379} {"train_loss": -26.810791015625, "global_step": 446519, "epoch": 5379} {"train_loss": -26.97222328186035, "global_step": 446520, "epoch": 5379} {"train_loss": -26.69563865661621, "global_step": 446521, "epoch": 5379} {"train_loss": -26.4765567779541, "global_step": 446522, "epoch": 5379} {"train_loss": -26.967960357666016, "global_step": 446523, "epoch": 5379} {"train_loss": -26.91398048400879, "global_step": 446524, "epoch": 5379} {"train_loss": -27.104297637939453, "global_step": 446525, "epoch": 5379} {"train_loss": -26.890363693237305, "global_step": 446526, "epoch": 5379} {"train_loss": -26.451608657836914, "global_step": 446527, "epoch": 5379} {"train_loss": -27.194448471069336, "global_step": 446528, "epoch": 5379} {"train_loss": -26.583831787109375, "global_step": 446529, "epoch": 5379} {"train_loss": -26.024127960205078, "global_step": 446530, "epoch": 5379} {"train_loss": -24.419157028198242, "global_step": 446531, "epoch": 5379} {"train_loss": -23.356714248657227, "global_step": 446532, "epoch": 5379} {"train_loss": -25.00860023498535, "global_step": 446533, "epoch": 5379} {"train_loss": -25.9647274017334, "global_step": 446534, "epoch": 5379} {"train_loss": -25.678634643554688, "global_step": 446535, "epoch": 5379} {"train_loss": -25.762922286987305, "global_step": 446536, "epoch": 5379} {"train_loss": -26.19794273376465, "global_step": 446537, "epoch": 5379} {"train_loss": -26.16535758972168, "global_step": 446538, "epoch": 5379} {"train_loss": -26.626392663243305, "global_step": 446539, "epoch": 5379, "val_loss": 6662479.0} {"train_loss": -25.860071182250977, "global_step": 446540, "epoch": 5380} {"train_loss": -25.681568145751953, "global_step": 446541, "epoch": 5380} {"train_loss": -25.60379981994629, "global_step": 446542, "epoch": 5380} {"train_loss": -25.248092651367188, "global_step": 446543, "epoch": 5380} {"train_loss": -25.784839630126953, "global_step": 446544, "epoch": 5380} {"train_loss": -25.5645694732666, "global_step": 446545, "epoch": 5380} {"train_loss": -25.590574264526367, "global_step": 446546, "epoch": 5380} {"train_loss": -25.9023380279541, "global_step": 446547, "epoch": 5380} {"train_loss": -25.703296661376953, "global_step": 446548, "epoch": 5380} {"train_loss": -26.183002471923828, "global_step": 446549, "epoch": 5380} {"train_loss": -25.881488800048828, "global_step": 446550, "epoch": 5380} {"train_loss": -25.99985694885254, "global_step": 446551, "epoch": 5380} {"train_loss": -26.188461303710938, "global_step": 446552, "epoch": 5380} {"train_loss": -26.372655868530273, "global_step": 446553, "epoch": 5380} {"train_loss": -26.134613037109375, "global_step": 446554, "epoch": 5380} {"train_loss": -26.266590118408203, "global_step": 446555, "epoch": 5380} {"train_loss": -26.054540634155273, "global_step": 446556, "epoch": 5380} {"train_loss": -26.562437057495117, "global_step": 446557, "epoch": 5380} {"train_loss": -26.365026473999023, "global_step": 446558, "epoch": 5380} {"train_loss": -26.69388198852539, "global_step": 446559, "epoch": 5380} {"train_loss": -26.505151748657227, "global_step": 446560, "epoch": 5380} {"train_loss": -26.340106964111328, "global_step": 446561, "epoch": 5380} {"train_loss": -26.726118087768555, "global_step": 446562, "epoch": 5380} {"train_loss": -26.70954704284668, "global_step": 446563, "epoch": 5380} {"train_loss": -26.393178939819336, "global_step": 446564, "epoch": 5380} {"train_loss": -26.638242721557617, "global_step": 446565, "epoch": 5380} {"train_loss": -26.699417114257812, "global_step": 446566, "epoch": 5380} {"train_loss": -26.628387451171875, "global_step": 446567, "epoch": 5380} {"train_loss": -26.354887008666992, "global_step": 446568, "epoch": 5380} {"train_loss": -26.434314727783203, "global_step": 446569, "epoch": 5380} {"train_loss": -26.729284286499023, "global_step": 446570, "epoch": 5380} {"train_loss": -26.61334228515625, "global_step": 446571, "epoch": 5380} {"train_loss": -26.664724349975586, "global_step": 446572, "epoch": 5380} {"train_loss": -26.713735580444336, "global_step": 446573, "epoch": 5380} {"train_loss": -27.23774528503418, "global_step": 446574, "epoch": 5380} {"train_loss": -26.668188095092773, "global_step": 446575, "epoch": 5380} {"train_loss": -26.968481063842773, "global_step": 446576, "epoch": 5380} {"train_loss": -26.692960739135742, "global_step": 446577, "epoch": 5380} {"train_loss": -26.996347427368164, "global_step": 446578, "epoch": 5380} {"train_loss": -27.136871337890625, "global_step": 446579, "epoch": 5380} {"train_loss": -26.706533432006836, "global_step": 446580, "epoch": 5380} {"train_loss": -26.79884147644043, "global_step": 446581, "epoch": 5380} {"train_loss": -26.891813278198242, "global_step": 446582, "epoch": 5380} {"train_loss": -27.182538986206055, "global_step": 446583, "epoch": 5380} {"train_loss": -27.239511489868164, "global_step": 446584, "epoch": 5380} {"train_loss": -26.86446189880371, "global_step": 446585, "epoch": 5380} {"train_loss": -26.9860897064209, "global_step": 446586, "epoch": 5380} {"train_loss": -27.39866065979004, "global_step": 446587, "epoch": 5380} {"train_loss": -27.0524959564209, "global_step": 446588, "epoch": 5380} {"train_loss": -27.275226593017578, "global_step": 446589, "epoch": 5380} {"train_loss": -27.132055282592773, "global_step": 446590, "epoch": 5380} {"train_loss": -27.107641220092773, "global_step": 446591, "epoch": 5380} {"train_loss": -26.883228302001953, "global_step": 446592, "epoch": 5380} {"train_loss": -27.02894401550293, "global_step": 446593, "epoch": 5380} {"train_loss": -26.59429359436035, "global_step": 446594, "epoch": 5380} {"train_loss": -26.715045928955078, "global_step": 446595, "epoch": 5380} {"train_loss": -27.129186630249023, "global_step": 446596, "epoch": 5380} {"train_loss": -27.347684860229492, "global_step": 446597, "epoch": 5380} {"train_loss": -27.264081954956055, "global_step": 446598, "epoch": 5380} {"train_loss": -27.0340576171875, "global_step": 446599, "epoch": 5380} {"train_loss": -27.116565704345703, "global_step": 446600, "epoch": 5380} {"train_loss": -27.40522575378418, "global_step": 446601, "epoch": 5380} {"train_loss": -27.4623966217041, "global_step": 446602, "epoch": 5380} {"train_loss": -26.867605209350586, "global_step": 446603, "epoch": 5380} {"train_loss": -27.479467391967773, "global_step": 446604, "epoch": 5380} {"train_loss": -26.98359489440918, "global_step": 446605, "epoch": 5380} {"train_loss": -26.993000030517578, "global_step": 446606, "epoch": 5380} {"train_loss": -27.389148712158203, "global_step": 446607, "epoch": 5380} {"train_loss": -27.09675407409668, "global_step": 446608, "epoch": 5380} {"train_loss": -27.408803939819336, "global_step": 446609, "epoch": 5380} {"train_loss": -27.349103927612305, "global_step": 446610, "epoch": 5380} {"train_loss": -27.225500106811523, "global_step": 446611, "epoch": 5380} {"train_loss": -27.253997802734375, "global_step": 446612, "epoch": 5380} {"train_loss": -27.10214614868164, "global_step": 446613, "epoch": 5380} {"train_loss": -26.53339958190918, "global_step": 446614, "epoch": 5380} {"train_loss": -26.414518356323242, "global_step": 446615, "epoch": 5380} {"train_loss": -27.055883407592773, "global_step": 446616, "epoch": 5380} {"train_loss": -26.8642578125, "global_step": 446617, "epoch": 5380} {"train_loss": -27.17414665222168, "global_step": 446618, "epoch": 5380} {"train_loss": -26.85634422302246, "global_step": 446619, "epoch": 5380} {"train_loss": -26.725622177124023, "global_step": 446620, "epoch": 5380} {"train_loss": -26.719640731811523, "global_step": 446621, "epoch": 5380} {"train_loss": -26.70862749398473, "global_step": 446622, "epoch": 5380, "val_loss": 6603945.0} {"train_loss": -26.32350730895996, "global_step": 446623, "epoch": 5381} {"train_loss": -26.171056747436523, "global_step": 446624, "epoch": 5381} {"train_loss": -26.850360870361328, "global_step": 446625, "epoch": 5381} {"train_loss": -26.455738067626953, "global_step": 446626, "epoch": 5381} {"train_loss": -26.911157608032227, "global_step": 446627, "epoch": 5381} {"train_loss": -26.95625877380371, "global_step": 446628, "epoch": 5381} {"train_loss": -26.814987182617188, "global_step": 446629, "epoch": 5381} {"train_loss": -26.403669357299805, "global_step": 446630, "epoch": 5381} {"train_loss": -26.8825740814209, "global_step": 446631, "epoch": 5381} {"train_loss": -27.10149574279785, "global_step": 446632, "epoch": 5381} {"train_loss": -26.63796043395996, "global_step": 446633, "epoch": 5381} {"train_loss": -26.952295303344727, "global_step": 446634, "epoch": 5381} {"train_loss": -26.88996696472168, "global_step": 446635, "epoch": 5381} {"train_loss": -26.623220443725586, "global_step": 446636, "epoch": 5381} {"train_loss": -27.09064292907715, "global_step": 446637, "epoch": 5381} {"train_loss": -26.96125602722168, "global_step": 446638, "epoch": 5381} {"train_loss": -26.841032028198242, "global_step": 446639, "epoch": 5381} {"train_loss": -27.018014907836914, "global_step": 446640, "epoch": 5381} {"train_loss": -27.19403076171875, "global_step": 446641, "epoch": 5381} {"train_loss": -26.75068473815918, "global_step": 446642, "epoch": 5381} {"train_loss": -26.5661563873291, "global_step": 446643, "epoch": 5381} {"train_loss": -26.792926788330078, "global_step": 446644, "epoch": 5381} {"train_loss": -27.0541934967041, "global_step": 446645, "epoch": 5381} {"train_loss": -26.7376766204834, "global_step": 446646, "epoch": 5381} {"train_loss": -26.96142578125, "global_step": 446647, "epoch": 5381} {"train_loss": -27.022504806518555, "global_step": 446648, "epoch": 5381} {"train_loss": -27.047256469726562, "global_step": 446649, "epoch": 5381} {"train_loss": -26.65882682800293, "global_step": 446650, "epoch": 5381} {"train_loss": -26.535337448120117, "global_step": 446651, "epoch": 5381} {"train_loss": -26.81475257873535, "global_step": 446652, "epoch": 5381} {"train_loss": -27.040985107421875, "global_step": 446653, "epoch": 5381} {"train_loss": -27.038681030273438, "global_step": 446654, "epoch": 5381} {"train_loss": -27.105182647705078, "global_step": 446655, "epoch": 5381} {"train_loss": -26.625707626342773, "global_step": 446656, "epoch": 5381} {"train_loss": -27.1645450592041, "global_step": 446657, "epoch": 5381} {"train_loss": -27.074920654296875, "global_step": 446658, "epoch": 5381} {"train_loss": -26.841760635375977, "global_step": 446659, "epoch": 5381} {"train_loss": -26.799039840698242, "global_step": 446660, "epoch": 5381} {"train_loss": -26.814987182617188, "global_step": 446661, "epoch": 5381} {"train_loss": -26.74399757385254, "global_step": 446662, "epoch": 5381} {"train_loss": -27.14739418029785, "global_step": 446663, "epoch": 5381} {"train_loss": -26.601606369018555, "global_step": 446664, "epoch": 5381} {"train_loss": -26.654829025268555, "global_step": 446665, "epoch": 5381} {"train_loss": -26.473989486694336, "global_step": 446666, "epoch": 5381} {"train_loss": -27.13848876953125, "global_step": 446667, "epoch": 5381} {"train_loss": -27.250492095947266, "global_step": 446668, "epoch": 5381} {"train_loss": -26.9974365234375, "global_step": 446669, "epoch": 5381} {"train_loss": -27.045307159423828, "global_step": 446670, "epoch": 5381} {"train_loss": -27.26568603515625, "global_step": 446671, "epoch": 5381} {"train_loss": -27.29994773864746, "global_step": 446672, "epoch": 5381} {"train_loss": -26.781686782836914, "global_step": 446673, "epoch": 5381} {"train_loss": -26.914169311523438, "global_step": 446674, "epoch": 5381} {"train_loss": -26.821399688720703, "global_step": 446675, "epoch": 5381} {"train_loss": -26.8056697845459, "global_step": 446676, "epoch": 5381} {"train_loss": -27.451147079467773, "global_step": 446677, "epoch": 5381} {"train_loss": -26.956314086914062, "global_step": 446678, "epoch": 5381} {"train_loss": -27.347248077392578, "global_step": 446679, "epoch": 5381} {"train_loss": -26.9764461517334, "global_step": 446680, "epoch": 5381} {"train_loss": -27.154958724975586, "global_step": 446681, "epoch": 5381} {"train_loss": -27.061124801635742, "global_step": 446682, "epoch": 5381} {"train_loss": -27.138391494750977, "global_step": 446683, "epoch": 5381} {"train_loss": -27.486846923828125, "global_step": 446684, "epoch": 5381} {"train_loss": -27.136444091796875, "global_step": 446685, "epoch": 5381} {"train_loss": -27.218311309814453, "global_step": 446686, "epoch": 5381} {"train_loss": -27.130634307861328, "global_step": 446687, "epoch": 5381} {"train_loss": -26.675649642944336, "global_step": 446688, "epoch": 5381} {"train_loss": -26.75031089782715, "global_step": 446689, "epoch": 5381} {"train_loss": -26.554441452026367, "global_step": 446690, "epoch": 5381} {"train_loss": -26.647863388061523, "global_step": 446691, "epoch": 5381} {"train_loss": -26.711095809936523, "global_step": 446692, "epoch": 5381} {"train_loss": -27.413976669311523, "global_step": 446693, "epoch": 5381} {"train_loss": -27.223081588745117, "global_step": 446694, "epoch": 5381} {"train_loss": -27.062408447265625, "global_step": 446695, "epoch": 5381} {"train_loss": -27.120559692382812, "global_step": 446696, "epoch": 5381} {"train_loss": -26.680883407592773, "global_step": 446697, "epoch": 5381} {"train_loss": -26.98736572265625, "global_step": 446698, "epoch": 5381} {"train_loss": -27.025012969970703, "global_step": 446699, "epoch": 5381} {"train_loss": -27.072866439819336, "global_step": 446700, "epoch": 5381} {"train_loss": -27.377685546875, "global_step": 446701, "epoch": 5381} {"train_loss": -27.249425888061523, "global_step": 446702, "epoch": 5381} {"train_loss": -26.842252731323242, "global_step": 446703, "epoch": 5381} {"train_loss": -27.763452529907227, "global_step": 446704, "epoch": 5381} {"train_loss": -26.947089022900684, "global_step": 446705, "epoch": 5381, "val_loss": 6535074.0} {"train_loss": -25.595272064208984, "global_step": 446706, "epoch": 5382} {"train_loss": -26.322906494140625, "global_step": 446707, "epoch": 5382} {"train_loss": -26.2641544342041, "global_step": 446708, "epoch": 5382} {"train_loss": -26.328216552734375, "global_step": 446709, "epoch": 5382} {"train_loss": -26.22092628479004, "global_step": 446710, "epoch": 5382} {"train_loss": -26.10562515258789, "global_step": 446711, "epoch": 5382} {"train_loss": -26.194580078125, "global_step": 446712, "epoch": 5382} {"train_loss": -26.38563346862793, "global_step": 446713, "epoch": 5382} {"train_loss": -26.475996017456055, "global_step": 446714, "epoch": 5382} {"train_loss": -26.26161766052246, "global_step": 446715, "epoch": 5382} {"train_loss": -26.4567813873291, "global_step": 446716, "epoch": 5382} {"train_loss": -26.663848876953125, "global_step": 446717, "epoch": 5382} {"train_loss": -26.708251953125, "global_step": 446718, "epoch": 5382} {"train_loss": -26.598546981811523, "global_step": 446719, "epoch": 5382} {"train_loss": -26.618371963500977, "global_step": 446720, "epoch": 5382} {"train_loss": -26.8741512298584, "global_step": 446721, "epoch": 5382} {"train_loss": -26.985815048217773, "global_step": 446722, "epoch": 5382} {"train_loss": -26.240140914916992, "global_step": 446723, "epoch": 5382} {"train_loss": -26.76711082458496, "global_step": 446724, "epoch": 5382} {"train_loss": -26.701904296875, "global_step": 446725, "epoch": 5382} {"train_loss": -26.659454345703125, "global_step": 446726, "epoch": 5382} {"train_loss": -26.90069580078125, "global_step": 446727, "epoch": 5382} {"train_loss": -26.7426815032959, "global_step": 446728, "epoch": 5382} {"train_loss": -26.672651290893555, "global_step": 446729, "epoch": 5382} {"train_loss": -26.969776153564453, "global_step": 446730, "epoch": 5382} {"train_loss": -26.767719268798828, "global_step": 446731, "epoch": 5382} {"train_loss": -26.97495460510254, "global_step": 446732, "epoch": 5382} {"train_loss": -27.08734703063965, "global_step": 446733, "epoch": 5382} {"train_loss": -26.970712661743164, "global_step": 446734, "epoch": 5382} {"train_loss": -27.07557487487793, "global_step": 446735, "epoch": 5382} {"train_loss": -26.963560104370117, "global_step": 446736, "epoch": 5382} {"train_loss": -27.454015731811523, "global_step": 446737, "epoch": 5382} {"train_loss": -26.956253051757812, "global_step": 446738, "epoch": 5382} {"train_loss": -27.274673461914062, "global_step": 446739, "epoch": 5382} {"train_loss": -26.98994255065918, "global_step": 446740, "epoch": 5382} {"train_loss": -26.886011123657227, "global_step": 446741, "epoch": 5382} {"train_loss": -26.780866622924805, "global_step": 446742, "epoch": 5382} {"train_loss": -26.943439483642578, "global_step": 446743, "epoch": 5382} {"train_loss": -27.08558464050293, "global_step": 446744, "epoch": 5382} {"train_loss": -26.848468780517578, "global_step": 446745, "epoch": 5382} {"train_loss": -26.95669937133789, "global_step": 446746, "epoch": 5382} {"train_loss": -27.072052001953125, "global_step": 446747, "epoch": 5382} {"train_loss": -27.105453491210938, "global_step": 446748, "epoch": 5382} {"train_loss": -27.237091064453125, "global_step": 446749, "epoch": 5382} {"train_loss": -27.20760154724121, "global_step": 446750, "epoch": 5382} {"train_loss": -27.257354736328125, "global_step": 446751, "epoch": 5382} {"train_loss": -26.761640548706055, "global_step": 446752, "epoch": 5382} {"train_loss": -27.138824462890625, "global_step": 446753, "epoch": 5382} {"train_loss": -27.38666343688965, "global_step": 446754, "epoch": 5382} {"train_loss": -27.07895278930664, "global_step": 446755, "epoch": 5382} {"train_loss": -27.072607040405273, "global_step": 446756, "epoch": 5382} {"train_loss": -27.283462524414062, "global_step": 446757, "epoch": 5382} {"train_loss": -27.18121337890625, "global_step": 446758, "epoch": 5382} {"train_loss": -26.92632484436035, "global_step": 446759, "epoch": 5382} {"train_loss": -27.534366607666016, "global_step": 446760, "epoch": 5382} {"train_loss": -27.009811401367188, "global_step": 446761, "epoch": 5382} {"train_loss": -27.20892333984375, "global_step": 446762, "epoch": 5382} {"train_loss": -27.306798934936523, "global_step": 446763, "epoch": 5382} {"train_loss": -27.227985382080078, "global_step": 446764, "epoch": 5382} {"train_loss": -27.320850372314453, "global_step": 446765, "epoch": 5382} {"train_loss": -27.136871337890625, "global_step": 446766, "epoch": 5382} {"train_loss": -27.237152099609375, "global_step": 446767, "epoch": 5382} {"train_loss": -27.259138107299805, "global_step": 446768, "epoch": 5382} {"train_loss": -27.323246002197266, "global_step": 446769, "epoch": 5382} {"train_loss": -27.28835105895996, "global_step": 446770, "epoch": 5382} {"train_loss": -27.279342651367188, "global_step": 446771, "epoch": 5382} {"train_loss": -27.309600830078125, "global_step": 446772, "epoch": 5382} {"train_loss": -27.390798568725586, "global_step": 446773, "epoch": 5382} {"train_loss": -27.156513214111328, "global_step": 446774, "epoch": 5382} {"train_loss": -27.455419540405273, "global_step": 446775, "epoch": 5382} {"train_loss": -27.569934844970703, "global_step": 446776, "epoch": 5382} {"train_loss": -26.665952682495117, "global_step": 446777, "epoch": 5382} {"train_loss": -26.601877212524414, "global_step": 446778, "epoch": 5382} {"train_loss": -25.3619441986084, "global_step": 446779, "epoch": 5382} {"train_loss": -23.9138240814209, "global_step": 446780, "epoch": 5382} {"train_loss": -23.77774429321289, "global_step": 446781, "epoch": 5382} {"train_loss": -25.8061466217041, "global_step": 446782, "epoch": 5382} {"train_loss": -25.904129028320312, "global_step": 446783, "epoch": 5382} {"train_loss": -25.58270835876465, "global_step": 446784, "epoch": 5382} {"train_loss": -25.953210830688477, "global_step": 446785, "epoch": 5382} {"train_loss": -26.08184242248535, "global_step": 446786, "epoch": 5382} {"train_loss": -25.756134033203125, "global_step": 446787, "epoch": 5382} {"train_loss": -26.7473534273814, "global_step": 446788, "epoch": 5382, "val_loss": 6498231.0} {"train_loss": -25.63726806640625, "global_step": 446789, "epoch": 5383} {"train_loss": -26.216354370117188, "global_step": 446790, "epoch": 5383} {"train_loss": -25.74165153503418, "global_step": 446791, "epoch": 5383} {"train_loss": -25.970184326171875, "global_step": 446792, "epoch": 5383} {"train_loss": -25.538232803344727, "global_step": 446793, "epoch": 5383} {"train_loss": -26.041467666625977, "global_step": 446794, "epoch": 5383} {"train_loss": -26.29660415649414, "global_step": 446795, "epoch": 5383} {"train_loss": -26.460407257080078, "global_step": 446796, "epoch": 5383} {"train_loss": -26.18037223815918, "global_step": 446797, "epoch": 5383} {"train_loss": -26.58475112915039, "global_step": 446798, "epoch": 5383} {"train_loss": -26.079730987548828, "global_step": 446799, "epoch": 5383} {"train_loss": -26.300277709960938, "global_step": 446800, "epoch": 5383} {"train_loss": -26.51287269592285, "global_step": 446801, "epoch": 5383} {"train_loss": -26.161487579345703, "global_step": 446802, "epoch": 5383} {"train_loss": -26.406646728515625, "global_step": 446803, "epoch": 5383} {"train_loss": -26.238004684448242, "global_step": 446804, "epoch": 5383} {"train_loss": -26.131244659423828, "global_step": 446805, "epoch": 5383} {"train_loss": -26.593610763549805, "global_step": 446806, "epoch": 5383} {"train_loss": -26.498096466064453, "global_step": 446807, "epoch": 5383} {"train_loss": -26.55925941467285, "global_step": 446808, "epoch": 5383} {"train_loss": -26.407163619995117, "global_step": 446809, "epoch": 5383} {"train_loss": -26.49903678894043, "global_step": 446810, "epoch": 5383} {"train_loss": -26.460220336914062, "global_step": 446811, "epoch": 5383} {"train_loss": -26.935407638549805, "global_step": 446812, "epoch": 5383} {"train_loss": -26.536474227905273, "global_step": 446813, "epoch": 5383} {"train_loss": -26.637222290039062, "global_step": 446814, "epoch": 5383} {"train_loss": -26.547086715698242, "global_step": 446815, "epoch": 5383} {"train_loss": -26.778715133666992, "global_step": 446816, "epoch": 5383} {"train_loss": -27.154388427734375, "global_step": 446817, "epoch": 5383} {"train_loss": -26.669538497924805, "global_step": 446818, "epoch": 5383} {"train_loss": -26.633031845092773, "global_step": 446819, "epoch": 5383} {"train_loss": -26.80240821838379, "global_step": 446820, "epoch": 5383} {"train_loss": -26.983060836791992, "global_step": 446821, "epoch": 5383} {"train_loss": -26.679121017456055, "global_step": 446822, "epoch": 5383} {"train_loss": -26.94510269165039, "global_step": 446823, "epoch": 5383} {"train_loss": -26.529117584228516, "global_step": 446824, "epoch": 5383} {"train_loss": -27.0500431060791, "global_step": 446825, "epoch": 5383} {"train_loss": -27.088998794555664, "global_step": 446826, "epoch": 5383} {"train_loss": -27.147113800048828, "global_step": 446827, "epoch": 5383} {"train_loss": -27.044713973999023, "global_step": 446828, "epoch": 5383} {"train_loss": -27.16168785095215, "global_step": 446829, "epoch": 5383} {"train_loss": -26.904218673706055, "global_step": 446830, "epoch": 5383} {"train_loss": -27.345783233642578, "global_step": 446831, "epoch": 5383} {"train_loss": -27.61700439453125, "global_step": 446832, "epoch": 5383} {"train_loss": -26.9493350982666, "global_step": 446833, "epoch": 5383} {"train_loss": -26.742984771728516, "global_step": 446834, "epoch": 5383} {"train_loss": -27.27815818786621, "global_step": 446835, "epoch": 5383} {"train_loss": -27.520538330078125, "global_step": 446836, "epoch": 5383} {"train_loss": -27.07207679748535, "global_step": 446837, "epoch": 5383} {"train_loss": -27.4311466217041, "global_step": 446838, "epoch": 5383} {"train_loss": -27.422285079956055, "global_step": 446839, "epoch": 5383} {"train_loss": -27.22258949279785, "global_step": 446840, "epoch": 5383} {"train_loss": -27.135791778564453, "global_step": 446841, "epoch": 5383} {"train_loss": -26.9116153717041, "global_step": 446842, "epoch": 5383} {"train_loss": -27.007831573486328, "global_step": 446843, "epoch": 5383} {"train_loss": -26.99184226989746, "global_step": 446844, "epoch": 5383} {"train_loss": -27.157506942749023, "global_step": 446845, "epoch": 5383} {"train_loss": -27.060510635375977, "global_step": 446846, "epoch": 5383} {"train_loss": -27.264371871948242, "global_step": 446847, "epoch": 5383} {"train_loss": -27.293018341064453, "global_step": 446848, "epoch": 5383} {"train_loss": -27.37282371520996, "global_step": 446849, "epoch": 5383} {"train_loss": -27.391321182250977, "global_step": 446850, "epoch": 5383} {"train_loss": -27.0570011138916, "global_step": 446851, "epoch": 5383} {"train_loss": -27.545700073242188, "global_step": 446852, "epoch": 5383} {"train_loss": -27.699316024780273, "global_step": 446853, "epoch": 5383} {"train_loss": -27.24024772644043, "global_step": 446854, "epoch": 5383} {"train_loss": -27.09755516052246, "global_step": 446855, "epoch": 5383} {"train_loss": -27.21284294128418, "global_step": 446856, "epoch": 5383} {"train_loss": -26.975645065307617, "global_step": 446857, "epoch": 5383} {"train_loss": -26.757593154907227, "global_step": 446858, "epoch": 5383} {"train_loss": -26.85574722290039, "global_step": 446859, "epoch": 5383} {"train_loss": -27.267744064331055, "global_step": 446860, "epoch": 5383} {"train_loss": -27.073575973510742, "global_step": 446861, "epoch": 5383} {"train_loss": -27.021228790283203, "global_step": 446862, "epoch": 5383} {"train_loss": -27.430463790893555, "global_step": 446863, "epoch": 5383} {"train_loss": -26.910078048706055, "global_step": 446864, "epoch": 5383} {"train_loss": -27.494770050048828, "global_step": 446865, "epoch": 5383} {"train_loss": -27.25986099243164, "global_step": 446866, "epoch": 5383} {"train_loss": -27.3361873626709, "global_step": 446867, "epoch": 5383} {"train_loss": -26.860013961791992, "global_step": 446868, "epoch": 5383} {"train_loss": -27.2200870513916, "global_step": 446869, "epoch": 5383} {"train_loss": -26.896533966064453, "global_step": 446870, "epoch": 5383} {"train_loss": -26.84876961305917, "global_step": 446871, "epoch": 5383, "val_loss": 6584163.0} {"train_loss": -25.607898712158203, "global_step": 446872, "epoch": 5384} {"train_loss": -25.54169273376465, "global_step": 446873, "epoch": 5384} {"train_loss": -25.46332359313965, "global_step": 446874, "epoch": 5384} {"train_loss": -25.9348087310791, "global_step": 446875, "epoch": 5384} {"train_loss": -25.582605361938477, "global_step": 446876, "epoch": 5384} {"train_loss": -25.532819747924805, "global_step": 446877, "epoch": 5384} {"train_loss": -26.152124404907227, "global_step": 446878, "epoch": 5384} {"train_loss": -25.913196563720703, "global_step": 446879, "epoch": 5384} {"train_loss": -26.185773849487305, "global_step": 446880, "epoch": 5384} {"train_loss": -25.70916175842285, "global_step": 446881, "epoch": 5384} {"train_loss": -26.18975830078125, "global_step": 446882, "epoch": 5384} {"train_loss": -26.437335968017578, "global_step": 446883, "epoch": 5384} {"train_loss": -26.574691772460938, "global_step": 446884, "epoch": 5384} {"train_loss": -26.564655303955078, "global_step": 446885, "epoch": 5384} {"train_loss": -26.43495750427246, "global_step": 446886, "epoch": 5384} {"train_loss": -26.048837661743164, "global_step": 446887, "epoch": 5384} {"train_loss": -26.51495933532715, "global_step": 446888, "epoch": 5384} {"train_loss": -26.266357421875, "global_step": 446889, "epoch": 5384} {"train_loss": -26.634033203125, "global_step": 446890, "epoch": 5384} {"train_loss": -26.61500358581543, "global_step": 446891, "epoch": 5384} {"train_loss": -26.2630615234375, "global_step": 446892, "epoch": 5384} {"train_loss": -26.9603271484375, "global_step": 446893, "epoch": 5384} {"train_loss": -26.615238189697266, "global_step": 446894, "epoch": 5384} {"train_loss": -26.670190811157227, "global_step": 446895, "epoch": 5384} {"train_loss": -27.068052291870117, "global_step": 446896, "epoch": 5384} {"train_loss": -26.56106948852539, "global_step": 446897, "epoch": 5384} {"train_loss": -26.91951560974121, "global_step": 446898, "epoch": 5384} {"train_loss": -26.810943603515625, "global_step": 446899, "epoch": 5384} {"train_loss": -26.81157875061035, "global_step": 446900, "epoch": 5384} {"train_loss": -26.975378036499023, "global_step": 446901, "epoch": 5384} {"train_loss": -26.672626495361328, "global_step": 446902, "epoch": 5384} {"train_loss": -26.529417037963867, "global_step": 446903, "epoch": 5384} {"train_loss": -26.712753295898438, "global_step": 446904, "epoch": 5384} {"train_loss": -26.797021865844727, "global_step": 446905, "epoch": 5384} {"train_loss": -26.848220825195312, "global_step": 446906, "epoch": 5384} {"train_loss": -26.890493392944336, "global_step": 446907, "epoch": 5384} {"train_loss": -27.0760555267334, "global_step": 446908, "epoch": 5384} {"train_loss": -26.989660263061523, "global_step": 446909, "epoch": 5384} {"train_loss": -26.546926498413086, "global_step": 446910, "epoch": 5384} {"train_loss": -27.005887985229492, "global_step": 446911, "epoch": 5384} {"train_loss": -27.134946823120117, "global_step": 446912, "epoch": 5384} {"train_loss": -27.245248794555664, "global_step": 446913, "epoch": 5384} {"train_loss": -27.15009117126465, "global_step": 446914, "epoch": 5384} {"train_loss": -27.040552139282227, "global_step": 446915, "epoch": 5384} {"train_loss": -26.924076080322266, "global_step": 446916, "epoch": 5384} {"train_loss": -27.2545108795166, "global_step": 446917, "epoch": 5384} {"train_loss": -27.46243667602539, "global_step": 446918, "epoch": 5384} {"train_loss": -26.96616554260254, "global_step": 446919, "epoch": 5384} {"train_loss": -27.085067749023438, "global_step": 446920, "epoch": 5384} {"train_loss": -26.77622413635254, "global_step": 446921, "epoch": 5384} {"train_loss": -27.31135368347168, "global_step": 446922, "epoch": 5384} {"train_loss": -26.875045776367188, "global_step": 446923, "epoch": 5384} {"train_loss": -26.907730102539062, "global_step": 446924, "epoch": 5384} {"train_loss": -27.132110595703125, "global_step": 446925, "epoch": 5384} {"train_loss": -26.973773956298828, "global_step": 446926, "epoch": 5384} {"train_loss": -26.74176597595215, "global_step": 446927, "epoch": 5384} {"train_loss": -27.229040145874023, "global_step": 446928, "epoch": 5384} {"train_loss": -27.216739654541016, "global_step": 446929, "epoch": 5384} {"train_loss": -26.878864288330078, "global_step": 446930, "epoch": 5384} {"train_loss": -27.36346435546875, "global_step": 446931, "epoch": 5384} {"train_loss": -26.956151962280273, "global_step": 446932, "epoch": 5384} {"train_loss": -27.313922882080078, "global_step": 446933, "epoch": 5384} {"train_loss": -26.880786895751953, "global_step": 446934, "epoch": 5384} {"train_loss": -26.75714683532715, "global_step": 446935, "epoch": 5384} {"train_loss": -27.265348434448242, "global_step": 446936, "epoch": 5384} {"train_loss": -27.170080184936523, "global_step": 446937, "epoch": 5384} {"train_loss": -27.259540557861328, "global_step": 446938, "epoch": 5384} {"train_loss": -26.746368408203125, "global_step": 446939, "epoch": 5384} {"train_loss": -27.03828239440918, "global_step": 446940, "epoch": 5384} {"train_loss": -27.454071044921875, "global_step": 446941, "epoch": 5384} {"train_loss": -27.152435302734375, "global_step": 446942, "epoch": 5384} {"train_loss": -27.153982162475586, "global_step": 446943, "epoch": 5384} {"train_loss": -27.057331085205078, "global_step": 446944, "epoch": 5384} {"train_loss": -27.162382125854492, "global_step": 446945, "epoch": 5384} {"train_loss": -27.125940322875977, "global_step": 446946, "epoch": 5384} {"train_loss": -27.254215240478516, "global_step": 446947, "epoch": 5384} {"train_loss": -27.229223251342773, "global_step": 446948, "epoch": 5384} {"train_loss": -27.323348999023438, "global_step": 446949, "epoch": 5384} {"train_loss": -26.742856979370117, "global_step": 446950, "epoch": 5384} {"train_loss": -26.99114990234375, "global_step": 446951, "epoch": 5384} {"train_loss": -26.800464630126953, "global_step": 446952, "epoch": 5384} {"train_loss": -27.127349853515625, "global_step": 446953, "epoch": 5384} {"train_loss": -26.779522080019294, "global_step": 446954, "epoch": 5384, "val_loss": 6477026.0} {"train_loss": -26.015249252319336, "global_step": 446955, "epoch": 5385} {"train_loss": -25.795806884765625, "global_step": 446956, "epoch": 5385} {"train_loss": -26.170480728149414, "global_step": 446957, "epoch": 5385} {"train_loss": -26.461721420288086, "global_step": 446958, "epoch": 5385} {"train_loss": -26.454572677612305, "global_step": 446959, "epoch": 5385} {"train_loss": -26.39093017578125, "global_step": 446960, "epoch": 5385} {"train_loss": -26.566791534423828, "global_step": 446961, "epoch": 5385} {"train_loss": -26.00208854675293, "global_step": 446962, "epoch": 5385} {"train_loss": -26.50371742248535, "global_step": 446963, "epoch": 5385} {"train_loss": -26.75348472595215, "global_step": 446964, "epoch": 5385} {"train_loss": -26.18182945251465, "global_step": 446965, "epoch": 5385} {"train_loss": -26.831466674804688, "global_step": 446966, "epoch": 5385} {"train_loss": -26.71088981628418, "global_step": 446967, "epoch": 5385} {"train_loss": -26.444488525390625, "global_step": 446968, "epoch": 5385} {"train_loss": -26.3715763092041, "global_step": 446969, "epoch": 5385} {"train_loss": -26.27485466003418, "global_step": 446970, "epoch": 5385} {"train_loss": -26.494470596313477, "global_step": 446971, "epoch": 5385} {"train_loss": -26.531885147094727, "global_step": 446972, "epoch": 5385} {"train_loss": -26.926122665405273, "global_step": 446973, "epoch": 5385} {"train_loss": -26.621809005737305, "global_step": 446974, "epoch": 5385} {"train_loss": -26.992298126220703, "global_step": 446975, "epoch": 5385} {"train_loss": -26.401514053344727, "global_step": 446976, "epoch": 5385} {"train_loss": -26.32879638671875, "global_step": 446977, "epoch": 5385} {"train_loss": -26.6838321685791, "global_step": 446978, "epoch": 5385} {"train_loss": -26.569721221923828, "global_step": 446979, "epoch": 5385} {"train_loss": -26.614822387695312, "global_step": 446980, "epoch": 5385} {"train_loss": -26.520294189453125, "global_step": 446981, "epoch": 5385} {"train_loss": -27.01914405822754, "global_step": 446982, "epoch": 5385} {"train_loss": -26.64242935180664, "global_step": 446983, "epoch": 5385} {"train_loss": -26.447961807250977, "global_step": 446984, "epoch": 5385} {"train_loss": -26.71442985534668, "global_step": 446985, "epoch": 5385} {"train_loss": -27.004194259643555, "global_step": 446986, "epoch": 5385} {"train_loss": -27.033411026000977, "global_step": 446987, "epoch": 5385} {"train_loss": -26.97835350036621, "global_step": 446988, "epoch": 5385} {"train_loss": -27.31088638305664, "global_step": 446989, "epoch": 5385} {"train_loss": -27.3747501373291, "global_step": 446990, "epoch": 5385} {"train_loss": -27.059919357299805, "global_step": 446991, "epoch": 5385} {"train_loss": -27.180835723876953, "global_step": 446992, "epoch": 5385} {"train_loss": -26.991010665893555, "global_step": 446993, "epoch": 5385} {"train_loss": -27.057971954345703, "global_step": 446994, "epoch": 5385} {"train_loss": -26.85328483581543, "global_step": 446995, "epoch": 5385} {"train_loss": -27.100147247314453, "global_step": 446996, "epoch": 5385} {"train_loss": -27.364959716796875, "global_step": 446997, "epoch": 5385} {"train_loss": -27.08161735534668, "global_step": 446998, "epoch": 5385} {"train_loss": -27.189071655273438, "global_step": 446999, "epoch": 5385} {"train_loss": -27.233728408813477, "global_step": 447000, "epoch": 5385} {"train_loss": -26.98858642578125, "global_step": 447001, "epoch": 5385} {"train_loss": -27.432600021362305, "global_step": 447002, "epoch": 5385} {"train_loss": -27.41706657409668, "global_step": 447003, "epoch": 5385} {"train_loss": -27.193832397460938, "global_step": 447004, "epoch": 5385} {"train_loss": -26.921798706054688, "global_step": 447005, "epoch": 5385} {"train_loss": -27.2840576171875, "global_step": 447006, "epoch": 5385} {"train_loss": -27.25699234008789, "global_step": 447007, "epoch": 5385} {"train_loss": -27.241418838500977, "global_step": 447008, "epoch": 5385} {"train_loss": -27.44772720336914, "global_step": 447009, "epoch": 5385} {"train_loss": -27.173980712890625, "global_step": 447010, "epoch": 5385} {"train_loss": -26.947622299194336, "global_step": 447011, "epoch": 5385} {"train_loss": -27.132556915283203, "global_step": 447012, "epoch": 5385} {"train_loss": -27.241865158081055, "global_step": 447013, "epoch": 5385} {"train_loss": -27.01248550415039, "global_step": 447014, "epoch": 5385} {"train_loss": -27.108457565307617, "global_step": 447015, "epoch": 5385} {"train_loss": -27.327062606811523, "global_step": 447016, "epoch": 5385} {"train_loss": -27.072956085205078, "global_step": 447017, "epoch": 5385} {"train_loss": -26.8062801361084, "global_step": 447018, "epoch": 5385} {"train_loss": -27.1789608001709, "global_step": 447019, "epoch": 5385} {"train_loss": -26.891096115112305, "global_step": 447020, "epoch": 5385} {"train_loss": -26.66162109375, "global_step": 447021, "epoch": 5385} {"train_loss": -27.12223243713379, "global_step": 447022, "epoch": 5385} {"train_loss": -27.27432632446289, "global_step": 447023, "epoch": 5385} {"train_loss": -26.83746337890625, "global_step": 447024, "epoch": 5385} {"train_loss": -26.714086532592773, "global_step": 447025, "epoch": 5385} {"train_loss": -26.904010772705078, "global_step": 447026, "epoch": 5385} {"train_loss": -26.7371826171875, "global_step": 447027, "epoch": 5385} {"train_loss": -27.055591583251953, "global_step": 447028, "epoch": 5385} {"train_loss": -27.030118942260742, "global_step": 447029, "epoch": 5385} {"train_loss": -26.926197052001953, "global_step": 447030, "epoch": 5385} {"train_loss": -27.045454025268555, "global_step": 447031, "epoch": 5385} {"train_loss": -26.835601806640625, "global_step": 447032, "epoch": 5385} {"train_loss": -26.751813888549805, "global_step": 447033, "epoch": 5385} {"train_loss": -27.30185890197754, "global_step": 447034, "epoch": 5385} {"train_loss": -27.27802848815918, "global_step": 447035, "epoch": 5385} {"train_loss": -26.8150634765625, "global_step": 447036, "epoch": 5385} {"train_loss": -26.849737213318605, "global_step": 447037, "epoch": 5385, "val_loss": 6621511.0} {"train_loss": -24.80628776550293, "global_step": 447038, "epoch": 5386} {"train_loss": -25.407445907592773, "global_step": 447039, "epoch": 5386} {"train_loss": -26.457794189453125, "global_step": 447040, "epoch": 5386} {"train_loss": -24.660673141479492, "global_step": 447041, "epoch": 5386} {"train_loss": -25.461753845214844, "global_step": 447042, "epoch": 5386} {"train_loss": -25.662277221679688, "global_step": 447043, "epoch": 5386} {"train_loss": -25.797338485717773, "global_step": 447044, "epoch": 5386} {"train_loss": -25.749555587768555, "global_step": 447045, "epoch": 5386} {"train_loss": -25.596786499023438, "global_step": 447046, "epoch": 5386} {"train_loss": -26.028791427612305, "global_step": 447047, "epoch": 5386} {"train_loss": -26.0452938079834, "global_step": 447048, "epoch": 5386} {"train_loss": -25.893468856811523, "global_step": 447049, "epoch": 5386} {"train_loss": -26.489133834838867, "global_step": 447050, "epoch": 5386} {"train_loss": -25.907690048217773, "global_step": 447051, "epoch": 5386} {"train_loss": -26.34906578063965, "global_step": 447052, "epoch": 5386} {"train_loss": -26.2439022064209, "global_step": 447053, "epoch": 5386} {"train_loss": -26.22052001953125, "global_step": 447054, "epoch": 5386} {"train_loss": -26.425662994384766, "global_step": 447055, "epoch": 5386} {"train_loss": -26.130075454711914, "global_step": 447056, "epoch": 5386} {"train_loss": -26.55811882019043, "global_step": 447057, "epoch": 5386} {"train_loss": -26.506549835205078, "global_step": 447058, "epoch": 5386} {"train_loss": -26.27088737487793, "global_step": 447059, "epoch": 5386} {"train_loss": -26.38100242614746, "global_step": 447060, "epoch": 5386} {"train_loss": -26.30756950378418, "global_step": 447061, "epoch": 5386} {"train_loss": -26.3206729888916, "global_step": 447062, "epoch": 5386} {"train_loss": -26.7425537109375, "global_step": 447063, "epoch": 5386} {"train_loss": -26.409942626953125, "global_step": 447064, "epoch": 5386} {"train_loss": -26.743656158447266, "global_step": 447065, "epoch": 5386} {"train_loss": -26.426593780517578, "global_step": 447066, "epoch": 5386} {"train_loss": -26.68853187561035, "global_step": 447067, "epoch": 5386} {"train_loss": -27.018110275268555, "global_step": 447068, "epoch": 5386} {"train_loss": -26.599287033081055, "global_step": 447069, "epoch": 5386} {"train_loss": -26.82012367248535, "global_step": 447070, "epoch": 5386} {"train_loss": -26.8482666015625, "global_step": 447071, "epoch": 5386} {"train_loss": -27.075546264648438, "global_step": 447072, "epoch": 5386} {"train_loss": -26.963632583618164, "global_step": 447073, "epoch": 5386} {"train_loss": -26.857450485229492, "global_step": 447074, "epoch": 5386} {"train_loss": -27.002431869506836, "global_step": 447075, "epoch": 5386} {"train_loss": -26.920291900634766, "global_step": 447076, "epoch": 5386} {"train_loss": -26.782501220703125, "global_step": 447077, "epoch": 5386} {"train_loss": -27.21820068359375, "global_step": 447078, "epoch": 5386} {"train_loss": -26.726734161376953, "global_step": 447079, "epoch": 5386} {"train_loss": -26.975568771362305, "global_step": 447080, "epoch": 5386} {"train_loss": -26.892480850219727, "global_step": 447081, "epoch": 5386} {"train_loss": -26.779348373413086, "global_step": 447082, "epoch": 5386} {"train_loss": -26.864917755126953, "global_step": 447083, "epoch": 5386} {"train_loss": -26.978036880493164, "global_step": 447084, "epoch": 5386} {"train_loss": -27.008838653564453, "global_step": 447085, "epoch": 5386} {"train_loss": -27.260541915893555, "global_step": 447086, "epoch": 5386} {"train_loss": -27.20050048828125, "global_step": 447087, "epoch": 5386} {"train_loss": -27.33045768737793, "global_step": 447088, "epoch": 5386} {"train_loss": -27.319990158081055, "global_step": 447089, "epoch": 5386} {"train_loss": -27.08868408203125, "global_step": 447090, "epoch": 5386} {"train_loss": -26.798139572143555, "global_step": 447091, "epoch": 5386} {"train_loss": -27.03718376159668, "global_step": 447092, "epoch": 5386} {"train_loss": -27.12822914123535, "global_step": 447093, "epoch": 5386} {"train_loss": -26.86343765258789, "global_step": 447094, "epoch": 5386} {"train_loss": -26.9844913482666, "global_step": 447095, "epoch": 5386} {"train_loss": -27.37173843383789, "global_step": 447096, "epoch": 5386} {"train_loss": -27.143112182617188, "global_step": 447097, "epoch": 5386} {"train_loss": -27.4191951751709, "global_step": 447098, "epoch": 5386} {"train_loss": -27.10699462890625, "global_step": 447099, "epoch": 5386} {"train_loss": -27.105335235595703, "global_step": 447100, "epoch": 5386} {"train_loss": -27.283308029174805, "global_step": 447101, "epoch": 5386} {"train_loss": -27.138879776000977, "global_step": 447102, "epoch": 5386} {"train_loss": -26.953857421875, "global_step": 447103, "epoch": 5386} {"train_loss": -27.196664810180664, "global_step": 447104, "epoch": 5386} {"train_loss": -27.297117233276367, "global_step": 447105, "epoch": 5386} {"train_loss": -26.925357818603516, "global_step": 447106, "epoch": 5386} {"train_loss": -26.935565948486328, "global_step": 447107, "epoch": 5386} {"train_loss": -27.378671646118164, "global_step": 447108, "epoch": 5386} {"train_loss": -27.10125732421875, "global_step": 447109, "epoch": 5386} {"train_loss": -26.830921173095703, "global_step": 447110, "epoch": 5386} {"train_loss": -27.138599395751953, "global_step": 447111, "epoch": 5386} {"train_loss": -27.117773056030273, "global_step": 447112, "epoch": 5386} {"train_loss": -27.684049606323242, "global_step": 447113, "epoch": 5386} {"train_loss": -27.148786544799805, "global_step": 447114, "epoch": 5386} {"train_loss": -27.22673988342285, "global_step": 447115, "epoch": 5386} {"train_loss": -27.160810470581055, "global_step": 447116, "epoch": 5386} {"train_loss": -27.13884925842285, "global_step": 447117, "epoch": 5386} {"train_loss": -26.979949951171875, "global_step": 447118, "epoch": 5386} {"train_loss": -27.378009796142578, "global_step": 447119, "epoch": 5386} {"train_loss": -26.72908573840038, "global_step": 447120, "epoch": 5386, "val_loss": 6616297.0} {"train_loss": -26.0609073638916, "global_step": 447121, "epoch": 5387} {"train_loss": -25.595172882080078, "global_step": 447122, "epoch": 5387} {"train_loss": -26.404712677001953, "global_step": 447123, "epoch": 5387} {"train_loss": -26.7655086517334, "global_step": 447124, "epoch": 5387} {"train_loss": -25.761198043823242, "global_step": 447125, "epoch": 5387} {"train_loss": -26.651254653930664, "global_step": 447126, "epoch": 5387} {"train_loss": -26.414411544799805, "global_step": 447127, "epoch": 5387} {"train_loss": -26.39666748046875, "global_step": 447128, "epoch": 5387} {"train_loss": -26.56109619140625, "global_step": 447129, "epoch": 5387} {"train_loss": -26.625965118408203, "global_step": 447130, "epoch": 5387} {"train_loss": -26.744718551635742, "global_step": 447131, "epoch": 5387} {"train_loss": -26.828262329101562, "global_step": 447132, "epoch": 5387} {"train_loss": -26.44841957092285, "global_step": 447133, "epoch": 5387} {"train_loss": -26.5462589263916, "global_step": 447134, "epoch": 5387} {"train_loss": -26.66546630859375, "global_step": 447135, "epoch": 5387} {"train_loss": -26.739973068237305, "global_step": 447136, "epoch": 5387} {"train_loss": -26.82159423828125, "global_step": 447137, "epoch": 5387} {"train_loss": -26.465229034423828, "global_step": 447138, "epoch": 5387} {"train_loss": -26.701175689697266, "global_step": 447139, "epoch": 5387} {"train_loss": -26.746723175048828, "global_step": 447140, "epoch": 5387} {"train_loss": -26.81658363342285, "global_step": 447141, "epoch": 5387} {"train_loss": -26.80494499206543, "global_step": 447142, "epoch": 5387} {"train_loss": -26.7777156829834, "global_step": 447143, "epoch": 5387} {"train_loss": -26.537933349609375, "global_step": 447144, "epoch": 5387} {"train_loss": -26.824493408203125, "global_step": 447145, "epoch": 5387} {"train_loss": -27.05084800720215, "global_step": 447146, "epoch": 5387} {"train_loss": -26.917205810546875, "global_step": 447147, "epoch": 5387} {"train_loss": -26.680906295776367, "global_step": 447148, "epoch": 5387} {"train_loss": -27.067289352416992, "global_step": 447149, "epoch": 5387} {"train_loss": -27.066980361938477, "global_step": 447150, "epoch": 5387} {"train_loss": -26.737157821655273, "global_step": 447151, "epoch": 5387} {"train_loss": -27.216089248657227, "global_step": 447152, "epoch": 5387} {"train_loss": -27.026865005493164, "global_step": 447153, "epoch": 5387} {"train_loss": -27.169660568237305, "global_step": 447154, "epoch": 5387} {"train_loss": -27.488727569580078, "global_step": 447155, "epoch": 5387} {"train_loss": -26.918472290039062, "global_step": 447156, "epoch": 5387} {"train_loss": -27.215600967407227, "global_step": 447157, "epoch": 5387} {"train_loss": -27.38545036315918, "global_step": 447158, "epoch": 5387} {"train_loss": -27.509626388549805, "global_step": 447159, "epoch": 5387} {"train_loss": -27.11821937561035, "global_step": 447160, "epoch": 5387} {"train_loss": -27.03171157836914, "global_step": 447161, "epoch": 5387} {"train_loss": -27.378498077392578, "global_step": 447162, "epoch": 5387} {"train_loss": -27.5314998626709, "global_step": 447163, "epoch": 5387} {"train_loss": -27.37529945373535, "global_step": 447164, "epoch": 5387} {"train_loss": -27.117095947265625, "global_step": 447165, "epoch": 5387} {"train_loss": -27.357275009155273, "global_step": 447166, "epoch": 5387} {"train_loss": -27.367877960205078, "global_step": 447167, "epoch": 5387} {"train_loss": -26.883268356323242, "global_step": 447168, "epoch": 5387} {"train_loss": -27.116018295288086, "global_step": 447169, "epoch": 5387} {"train_loss": -27.117429733276367, "global_step": 447170, "epoch": 5387} {"train_loss": -27.349552154541016, "global_step": 447171, "epoch": 5387} {"train_loss": -27.32843589782715, "global_step": 447172, "epoch": 5387} {"train_loss": -27.1937255859375, "global_step": 447173, "epoch": 5387} {"train_loss": -27.20551872253418, "global_step": 447174, "epoch": 5387} {"train_loss": -26.885404586791992, "global_step": 447175, "epoch": 5387} {"train_loss": -27.12066078186035, "global_step": 447176, "epoch": 5387} {"train_loss": -26.894916534423828, "global_step": 447177, "epoch": 5387} {"train_loss": -26.98395347595215, "global_step": 447178, "epoch": 5387} {"train_loss": -26.693532943725586, "global_step": 447179, "epoch": 5387} {"train_loss": -27.120330810546875, "global_step": 447180, "epoch": 5387} {"train_loss": -27.165616989135742, "global_step": 447181, "epoch": 5387} {"train_loss": -26.7628231048584, "global_step": 447182, "epoch": 5387} {"train_loss": -27.155517578125, "global_step": 447183, "epoch": 5387} {"train_loss": -26.99342155456543, "global_step": 447184, "epoch": 5387} {"train_loss": -27.35877799987793, "global_step": 447185, "epoch": 5387} {"train_loss": -26.968854904174805, "global_step": 447186, "epoch": 5387} {"train_loss": -26.446807861328125, "global_step": 447187, "epoch": 5387} {"train_loss": -26.741031646728516, "global_step": 447188, "epoch": 5387} {"train_loss": -26.8041934967041, "global_step": 447189, "epoch": 5387} {"train_loss": -26.686893463134766, "global_step": 447190, "epoch": 5387} {"train_loss": -26.998859405517578, "global_step": 447191, "epoch": 5387} {"train_loss": -27.040027618408203, "global_step": 447192, "epoch": 5387} {"train_loss": -26.642074584960938, "global_step": 447193, "epoch": 5387} {"train_loss": -26.78718376159668, "global_step": 447194, "epoch": 5387} {"train_loss": -26.831832885742188, "global_step": 447195, "epoch": 5387} {"train_loss": -27.221662521362305, "global_step": 447196, "epoch": 5387} {"train_loss": -26.537580490112305, "global_step": 447197, "epoch": 5387} {"train_loss": -26.86646842956543, "global_step": 447198, "epoch": 5387} {"train_loss": -26.452634811401367, "global_step": 447199, "epoch": 5387} {"train_loss": -27.153949737548828, "global_step": 447200, "epoch": 5387} {"train_loss": -26.544742584228516, "global_step": 447201, "epoch": 5387} {"train_loss": -27.17952537536621, "global_step": 447202, "epoch": 5387} {"train_loss": -26.87804741457284, "global_step": 447203, "epoch": 5387, "val_loss": 6651362.5} {"train_loss": -26.76773452758789, "global_step": 447204, "epoch": 5388} {"train_loss": -26.99592399597168, "global_step": 447205, "epoch": 5388} {"train_loss": -26.859222412109375, "global_step": 447206, "epoch": 5388} {"train_loss": -26.849288940429688, "global_step": 447207, "epoch": 5388} {"train_loss": -26.934555053710938, "global_step": 447208, "epoch": 5388} {"train_loss": -26.564050674438477, "global_step": 447209, "epoch": 5388} {"train_loss": -26.496545791625977, "global_step": 447210, "epoch": 5388} {"train_loss": -26.917844772338867, "global_step": 447211, "epoch": 5388} {"train_loss": -26.801111221313477, "global_step": 447212, "epoch": 5388} {"train_loss": -26.655014038085938, "global_step": 447213, "epoch": 5388} {"train_loss": -26.978515625, "global_step": 447214, "epoch": 5388} {"train_loss": -26.9431209564209, "global_step": 447215, "epoch": 5388} {"train_loss": -26.972980499267578, "global_step": 447216, "epoch": 5388} {"train_loss": -26.886951446533203, "global_step": 447217, "epoch": 5388} {"train_loss": -27.176101684570312, "global_step": 447218, "epoch": 5388} {"train_loss": -27.218103408813477, "global_step": 447219, "epoch": 5388} {"train_loss": -27.23744010925293, "global_step": 447220, "epoch": 5388} {"train_loss": -26.96236228942871, "global_step": 447221, "epoch": 5388} {"train_loss": -27.03359031677246, "global_step": 447222, "epoch": 5388} {"train_loss": -27.089441299438477, "global_step": 447223, "epoch": 5388} {"train_loss": -26.927051544189453, "global_step": 447224, "epoch": 5388} {"train_loss": -27.097803115844727, "global_step": 447225, "epoch": 5388} {"train_loss": -27.3057804107666, "global_step": 447226, "epoch": 5388} {"train_loss": -27.406850814819336, "global_step": 447227, "epoch": 5388} {"train_loss": -26.8115177154541, "global_step": 447228, "epoch": 5388} {"train_loss": -27.1132755279541, "global_step": 447229, "epoch": 5388} {"train_loss": -26.996509552001953, "global_step": 447230, "epoch": 5388} {"train_loss": -27.348058700561523, "global_step": 447231, "epoch": 5388} {"train_loss": -27.21754264831543, "global_step": 447232, "epoch": 5388} {"train_loss": -27.095748901367188, "global_step": 447233, "epoch": 5388} {"train_loss": -27.35500144958496, "global_step": 447234, "epoch": 5388} {"train_loss": -27.473297119140625, "global_step": 447235, "epoch": 5388} {"train_loss": -26.708677291870117, "global_step": 447236, "epoch": 5388} {"train_loss": -27.523914337158203, "global_step": 447237, "epoch": 5388} {"train_loss": -27.21320915222168, "global_step": 447238, "epoch": 5388} {"train_loss": -26.9611759185791, "global_step": 447239, "epoch": 5388} {"train_loss": -27.018707275390625, "global_step": 447240, "epoch": 5388} {"train_loss": -26.948694229125977, "global_step": 447241, "epoch": 5388} {"train_loss": -27.01276206970215, "global_step": 447242, "epoch": 5388} {"train_loss": -27.210494995117188, "global_step": 447243, "epoch": 5388} {"train_loss": -27.454687118530273, "global_step": 447244, "epoch": 5388} {"train_loss": -27.136194229125977, "global_step": 447245, "epoch": 5388} {"train_loss": -26.981037139892578, "global_step": 447246, "epoch": 5388} {"train_loss": -27.242902755737305, "global_step": 447247, "epoch": 5388} {"train_loss": -27.36103630065918, "global_step": 447248, "epoch": 5388} {"train_loss": -27.059173583984375, "global_step": 447249, "epoch": 5388} {"train_loss": -27.167572021484375, "global_step": 447250, "epoch": 5388} {"train_loss": -27.240076065063477, "global_step": 447251, "epoch": 5388} {"train_loss": -26.894947052001953, "global_step": 447252, "epoch": 5388} {"train_loss": -26.8730525970459, "global_step": 447253, "epoch": 5388} {"train_loss": -26.842329025268555, "global_step": 447254, "epoch": 5388} {"train_loss": -27.147510528564453, "global_step": 447255, "epoch": 5388} {"train_loss": -26.815969467163086, "global_step": 447256, "epoch": 5388} {"train_loss": -26.69415855407715, "global_step": 447257, "epoch": 5388} {"train_loss": -27.350799560546875, "global_step": 447258, "epoch": 5388} {"train_loss": -27.27887535095215, "global_step": 447259, "epoch": 5388} {"train_loss": -26.758716583251953, "global_step": 447260, "epoch": 5388} {"train_loss": -26.787994384765625, "global_step": 447261, "epoch": 5388} {"train_loss": -26.280187606811523, "global_step": 447262, "epoch": 5388} {"train_loss": -27.097187042236328, "global_step": 447263, "epoch": 5388} {"train_loss": -26.866613388061523, "global_step": 447264, "epoch": 5388} {"train_loss": -27.05255126953125, "global_step": 447265, "epoch": 5388} {"train_loss": -26.2473087310791, "global_step": 447266, "epoch": 5388} {"train_loss": -26.88958740234375, "global_step": 447267, "epoch": 5388} {"train_loss": -27.13187026977539, "global_step": 447268, "epoch": 5388} {"train_loss": -26.734350204467773, "global_step": 447269, "epoch": 5388} {"train_loss": -27.149585723876953, "global_step": 447270, "epoch": 5388} {"train_loss": -26.856536865234375, "global_step": 447271, "epoch": 5388} {"train_loss": -27.088712692260742, "global_step": 447272, "epoch": 5388} {"train_loss": -26.828290939331055, "global_step": 447273, "epoch": 5388} {"train_loss": -27.350189208984375, "global_step": 447274, "epoch": 5388} {"train_loss": -26.99471092224121, "global_step": 447275, "epoch": 5388} {"train_loss": -27.02754020690918, "global_step": 447276, "epoch": 5388} {"train_loss": -27.24192237854004, "global_step": 447277, "epoch": 5388} {"train_loss": -26.96815299987793, "global_step": 447278, "epoch": 5388} {"train_loss": -27.098066329956055, "global_step": 447279, "epoch": 5388} {"train_loss": -26.932697296142578, "global_step": 447280, "epoch": 5388} {"train_loss": -27.130380630493164, "global_step": 447281, "epoch": 5388} {"train_loss": -27.14886474609375, "global_step": 447282, "epoch": 5388} {"train_loss": -27.15205955505371, "global_step": 447283, "epoch": 5388} {"train_loss": -27.28476905822754, "global_step": 447284, "epoch": 5388} {"train_loss": -27.16310691833496, "global_step": 447285, "epoch": 5388} {"train_loss": -27.037299144698913, "global_step": 447286, "epoch": 5388, "val_loss": 6605960.5} {"train_loss": -26.80973243713379, "global_step": 447287, "epoch": 5389} {"train_loss": -26.890256881713867, "global_step": 447288, "epoch": 5389} {"train_loss": -26.6451358795166, "global_step": 447289, "epoch": 5389} {"train_loss": -26.64577293395996, "global_step": 447290, "epoch": 5389} {"train_loss": -26.624313354492188, "global_step": 447291, "epoch": 5389} {"train_loss": -26.652664184570312, "global_step": 447292, "epoch": 5389} {"train_loss": -26.347503662109375, "global_step": 447293, "epoch": 5389} {"train_loss": -26.576623916625977, "global_step": 447294, "epoch": 5389} {"train_loss": -26.620031356811523, "global_step": 447295, "epoch": 5389} {"train_loss": -27.092639923095703, "global_step": 447296, "epoch": 5389} {"train_loss": -26.900562286376953, "global_step": 447297, "epoch": 5389} {"train_loss": -26.839160919189453, "global_step": 447298, "epoch": 5389} {"train_loss": -26.815311431884766, "global_step": 447299, "epoch": 5389} {"train_loss": -26.7779541015625, "global_step": 447300, "epoch": 5389} {"train_loss": -26.64287757873535, "global_step": 447301, "epoch": 5389} {"train_loss": -26.637908935546875, "global_step": 447302, "epoch": 5389} {"train_loss": -27.02008056640625, "global_step": 447303, "epoch": 5389} {"train_loss": -27.121789932250977, "global_step": 447304, "epoch": 5389} {"train_loss": -27.481342315673828, "global_step": 447305, "epoch": 5389} {"train_loss": -26.9285831451416, "global_step": 447306, "epoch": 5389} {"train_loss": -27.211164474487305, "global_step": 447307, "epoch": 5389} {"train_loss": -27.349720001220703, "global_step": 447308, "epoch": 5389} {"train_loss": -27.09144401550293, "global_step": 447309, "epoch": 5389} {"train_loss": -27.05006217956543, "global_step": 447310, "epoch": 5389} {"train_loss": -26.943286895751953, "global_step": 447311, "epoch": 5389} {"train_loss": -26.943775177001953, "global_step": 447312, "epoch": 5389} {"train_loss": -26.81570816040039, "global_step": 447313, "epoch": 5389} {"train_loss": -27.433584213256836, "global_step": 447314, "epoch": 5389} {"train_loss": -27.330183029174805, "global_step": 447315, "epoch": 5389} {"train_loss": -27.003650665283203, "global_step": 447316, "epoch": 5389} {"train_loss": -26.871719360351562, "global_step": 447317, "epoch": 5389} {"train_loss": -27.173486709594727, "global_step": 447318, "epoch": 5389} {"train_loss": -27.20709228515625, "global_step": 447319, "epoch": 5389} {"train_loss": -27.128711700439453, "global_step": 447320, "epoch": 5389} {"train_loss": -26.69700050354004, "global_step": 447321, "epoch": 5389} {"train_loss": -26.8504638671875, "global_step": 447322, "epoch": 5389} {"train_loss": -27.43035888671875, "global_step": 447323, "epoch": 5389} {"train_loss": -26.66729736328125, "global_step": 447324, "epoch": 5389} {"train_loss": -26.346790313720703, "global_step": 447325, "epoch": 5389} {"train_loss": -26.80023765563965, "global_step": 447326, "epoch": 5389} {"train_loss": -26.418607711791992, "global_step": 447327, "epoch": 5389} {"train_loss": -26.86130714416504, "global_step": 447328, "epoch": 5389} {"train_loss": -26.982105255126953, "global_step": 447329, "epoch": 5389} {"train_loss": -26.95038414001465, "global_step": 447330, "epoch": 5389} {"train_loss": -26.62586784362793, "global_step": 447331, "epoch": 5389} {"train_loss": -26.241605758666992, "global_step": 447332, "epoch": 5389} {"train_loss": -27.164915084838867, "global_step": 447333, "epoch": 5389} {"train_loss": -26.67999839782715, "global_step": 447334, "epoch": 5389} {"train_loss": -26.954370498657227, "global_step": 447335, "epoch": 5389} {"train_loss": -26.64560890197754, "global_step": 447336, "epoch": 5389} {"train_loss": -26.61671257019043, "global_step": 447337, "epoch": 5389} {"train_loss": -26.9807186126709, "global_step": 447338, "epoch": 5389} {"train_loss": -26.550134658813477, "global_step": 447339, "epoch": 5389} {"train_loss": -26.722997665405273, "global_step": 447340, "epoch": 5389} {"train_loss": -26.6782169342041, "global_step": 447341, "epoch": 5389} {"train_loss": -27.094762802124023, "global_step": 447342, "epoch": 5389} {"train_loss": -27.03352165222168, "global_step": 447343, "epoch": 5389} {"train_loss": -27.122446060180664, "global_step": 447344, "epoch": 5389} {"train_loss": -26.625410079956055, "global_step": 447345, "epoch": 5389} {"train_loss": -27.0880069732666, "global_step": 447346, "epoch": 5389} {"train_loss": -26.702184677124023, "global_step": 447347, "epoch": 5389} {"train_loss": -26.944860458374023, "global_step": 447348, "epoch": 5389} {"train_loss": -26.80905532836914, "global_step": 447349, "epoch": 5389} {"train_loss": -26.81781578063965, "global_step": 447350, "epoch": 5389} {"train_loss": -27.44439125061035, "global_step": 447351, "epoch": 5389} {"train_loss": -27.168720245361328, "global_step": 447352, "epoch": 5389} {"train_loss": -26.845121383666992, "global_step": 447353, "epoch": 5389} {"train_loss": -26.689788818359375, "global_step": 447354, "epoch": 5389} {"train_loss": -27.18069839477539, "global_step": 447355, "epoch": 5389} {"train_loss": -27.1647891998291, "global_step": 447356, "epoch": 5389} {"train_loss": -26.826337814331055, "global_step": 447357, "epoch": 5389} {"train_loss": -27.042377471923828, "global_step": 447358, "epoch": 5389} {"train_loss": -26.64835548400879, "global_step": 447359, "epoch": 5389} {"train_loss": -26.940603256225586, "global_step": 447360, "epoch": 5389} {"train_loss": -26.788599014282227, "global_step": 447361, "epoch": 5389} {"train_loss": -27.062183380126953, "global_step": 447362, "epoch": 5389} {"train_loss": -27.005054473876953, "global_step": 447363, "epoch": 5389} {"train_loss": -26.603790283203125, "global_step": 447364, "epoch": 5389} {"train_loss": -26.846479415893555, "global_step": 447365, "epoch": 5389} {"train_loss": -26.853717803955078, "global_step": 447366, "epoch": 5389} {"train_loss": -26.5218505859375, "global_step": 447367, "epoch": 5389} {"train_loss": -27.169111251831055, "global_step": 447368, "epoch": 5389} {"train_loss": -26.869127135678948, "global_step": 447369, "epoch": 5389, "val_loss": 6635347.0} {"train_loss": -26.824987411499023, "global_step": 447370, "epoch": 5390} {"train_loss": -26.708820343017578, "global_step": 447371, "epoch": 5390} {"train_loss": -26.595458984375, "global_step": 447372, "epoch": 5390} {"train_loss": -26.896997451782227, "global_step": 447373, "epoch": 5390} {"train_loss": -26.925464630126953, "global_step": 447374, "epoch": 5390} {"train_loss": -26.45892906188965, "global_step": 447375, "epoch": 5390} {"train_loss": -26.694324493408203, "global_step": 447376, "epoch": 5390} {"train_loss": -26.594375610351562, "global_step": 447377, "epoch": 5390} {"train_loss": -26.673282623291016, "global_step": 447378, "epoch": 5390} {"train_loss": -26.942209243774414, "global_step": 447379, "epoch": 5390} {"train_loss": -26.838300704956055, "global_step": 447380, "epoch": 5390} {"train_loss": -26.80488395690918, "global_step": 447381, "epoch": 5390} {"train_loss": -26.71839714050293, "global_step": 447382, "epoch": 5390} {"train_loss": -27.05901527404785, "global_step": 447383, "epoch": 5390} {"train_loss": -26.839420318603516, "global_step": 447384, "epoch": 5390} {"train_loss": -26.862119674682617, "global_step": 447385, "epoch": 5390} {"train_loss": -26.7421817779541, "global_step": 447386, "epoch": 5390} {"train_loss": -26.989547729492188, "global_step": 447387, "epoch": 5390} {"train_loss": -27.120590209960938, "global_step": 447388, "epoch": 5390} {"train_loss": -26.95332908630371, "global_step": 447389, "epoch": 5390} {"train_loss": -26.666879653930664, "global_step": 447390, "epoch": 5390} {"train_loss": -27.464645385742188, "global_step": 447391, "epoch": 5390} {"train_loss": -27.14105224609375, "global_step": 447392, "epoch": 5390} {"train_loss": -27.241193771362305, "global_step": 447393, "epoch": 5390} {"train_loss": -27.10052490234375, "global_step": 447394, "epoch": 5390} {"train_loss": -26.719629287719727, "global_step": 447395, "epoch": 5390} {"train_loss": -26.61175537109375, "global_step": 447396, "epoch": 5390} {"train_loss": -26.844623565673828, "global_step": 447397, "epoch": 5390} {"train_loss": -27.028076171875, "global_step": 447398, "epoch": 5390} {"train_loss": -26.936691284179688, "global_step": 447399, "epoch": 5390} {"train_loss": -27.01728630065918, "global_step": 447400, "epoch": 5390} {"train_loss": -26.862930297851562, "global_step": 447401, "epoch": 5390} {"train_loss": -27.382659912109375, "global_step": 447402, "epoch": 5390} {"train_loss": -26.62106704711914, "global_step": 447403, "epoch": 5390} {"train_loss": -26.591527938842773, "global_step": 447404, "epoch": 5390} {"train_loss": -27.1201114654541, "global_step": 447405, "epoch": 5390} {"train_loss": -26.842512130737305, "global_step": 447406, "epoch": 5390} {"train_loss": -26.7982234954834, "global_step": 447407, "epoch": 5390} {"train_loss": -27.377805709838867, "global_step": 447408, "epoch": 5390} {"train_loss": -27.324310302734375, "global_step": 447409, "epoch": 5390} {"train_loss": -26.948837280273438, "global_step": 447410, "epoch": 5390} {"train_loss": -27.375661849975586, "global_step": 447411, "epoch": 5390} {"train_loss": -27.42707633972168, "global_step": 447412, "epoch": 5390} {"train_loss": -26.72208595275879, "global_step": 447413, "epoch": 5390} {"train_loss": -26.918548583984375, "global_step": 447414, "epoch": 5390} {"train_loss": -27.074127197265625, "global_step": 447415, "epoch": 5390} {"train_loss": -26.8402156829834, "global_step": 447416, "epoch": 5390} {"train_loss": -26.9931640625, "global_step": 447417, "epoch": 5390} {"train_loss": -26.5884952545166, "global_step": 447418, "epoch": 5390} {"train_loss": -27.106765747070312, "global_step": 447419, "epoch": 5390} {"train_loss": -27.3023624420166, "global_step": 447420, "epoch": 5390} {"train_loss": -27.20448112487793, "global_step": 447421, "epoch": 5390} {"train_loss": -27.227869033813477, "global_step": 447422, "epoch": 5390} {"train_loss": -26.93021011352539, "global_step": 447423, "epoch": 5390} {"train_loss": -26.817768096923828, "global_step": 447424, "epoch": 5390} {"train_loss": -27.033117294311523, "global_step": 447425, "epoch": 5390} {"train_loss": -27.260650634765625, "global_step": 447426, "epoch": 5390} {"train_loss": -26.777063369750977, "global_step": 447427, "epoch": 5390} {"train_loss": -26.5922794342041, "global_step": 447428, "epoch": 5390} {"train_loss": -27.093311309814453, "global_step": 447429, "epoch": 5390} {"train_loss": -27.1580810546875, "global_step": 447430, "epoch": 5390} {"train_loss": -26.767316818237305, "global_step": 447431, "epoch": 5390} {"train_loss": -26.879636764526367, "global_step": 447432, "epoch": 5390} {"train_loss": -26.925901412963867, "global_step": 447433, "epoch": 5390} {"train_loss": -27.35825538635254, "global_step": 447434, "epoch": 5390} {"train_loss": -27.418750762939453, "global_step": 447435, "epoch": 5390} {"train_loss": -26.7919979095459, "global_step": 447436, "epoch": 5390} {"train_loss": -26.86374282836914, "global_step": 447437, "epoch": 5390} {"train_loss": -27.487890243530273, "global_step": 447438, "epoch": 5390} {"train_loss": -26.790836334228516, "global_step": 447439, "epoch": 5390} {"train_loss": -26.713321685791016, "global_step": 447440, "epoch": 5390} {"train_loss": -26.5894832611084, "global_step": 447441, "epoch": 5390} {"train_loss": -27.44256591796875, "global_step": 447442, "epoch": 5390} {"train_loss": -27.154279708862305, "global_step": 447443, "epoch": 5390} {"train_loss": -26.705442428588867, "global_step": 447444, "epoch": 5390} {"train_loss": -27.2606201171875, "global_step": 447445, "epoch": 5390} {"train_loss": -26.755369186401367, "global_step": 447446, "epoch": 5390} {"train_loss": -27.042587280273438, "global_step": 447447, "epoch": 5390} {"train_loss": -26.781879425048828, "global_step": 447448, "epoch": 5390} {"train_loss": -26.975296020507812, "global_step": 447449, "epoch": 5390} {"train_loss": -26.6574764251709, "global_step": 447450, "epoch": 5390} {"train_loss": -26.88067054748535, "global_step": 447451, "epoch": 5390} {"train_loss": -26.952388074024615, "global_step": 447452, "epoch": 5390, "val_loss": 6601709.5} {"train_loss": -25.74065589904785, "global_step": 447453, "epoch": 5391} {"train_loss": -26.443161010742188, "global_step": 447454, "epoch": 5391} {"train_loss": -26.10540199279785, "global_step": 447455, "epoch": 5391} {"train_loss": -26.826507568359375, "global_step": 447456, "epoch": 5391} {"train_loss": -26.1198673248291, "global_step": 447457, "epoch": 5391} {"train_loss": -26.42609977722168, "global_step": 447458, "epoch": 5391} {"train_loss": -26.32059097290039, "global_step": 447459, "epoch": 5391} {"train_loss": -26.5631160736084, "global_step": 447460, "epoch": 5391} {"train_loss": -26.502241134643555, "global_step": 447461, "epoch": 5391} {"train_loss": -26.79282569885254, "global_step": 447462, "epoch": 5391} {"train_loss": -26.966720581054688, "global_step": 447463, "epoch": 5391} {"train_loss": -26.967620849609375, "global_step": 447464, "epoch": 5391} {"train_loss": -26.718244552612305, "global_step": 447465, "epoch": 5391} {"train_loss": -26.713510513305664, "global_step": 447466, "epoch": 5391} {"train_loss": -26.702096939086914, "global_step": 447467, "epoch": 5391} {"train_loss": -26.851215362548828, "global_step": 447468, "epoch": 5391} {"train_loss": -27.09311866760254, "global_step": 447469, "epoch": 5391} {"train_loss": -26.404285430908203, "global_step": 447470, "epoch": 5391} {"train_loss": -26.219940185546875, "global_step": 447471, "epoch": 5391} {"train_loss": -26.711761474609375, "global_step": 447472, "epoch": 5391} {"train_loss": -26.704626083374023, "global_step": 447473, "epoch": 5391} {"train_loss": -26.51506996154785, "global_step": 447474, "epoch": 5391} {"train_loss": -26.830930709838867, "global_step": 447475, "epoch": 5391} {"train_loss": -26.99159049987793, "global_step": 447476, "epoch": 5391} {"train_loss": -26.725528717041016, "global_step": 447477, "epoch": 5391} {"train_loss": -27.073083877563477, "global_step": 447478, "epoch": 5391} {"train_loss": -26.623266220092773, "global_step": 447479, "epoch": 5391} {"train_loss": -26.701263427734375, "global_step": 447480, "epoch": 5391} {"train_loss": -26.94215965270996, "global_step": 447481, "epoch": 5391} {"train_loss": -26.69746208190918, "global_step": 447482, "epoch": 5391} {"train_loss": -26.789661407470703, "global_step": 447483, "epoch": 5391} {"train_loss": -26.709949493408203, "global_step": 447484, "epoch": 5391} {"train_loss": -27.129880905151367, "global_step": 447485, "epoch": 5391} {"train_loss": -27.184967041015625, "global_step": 447486, "epoch": 5391} {"train_loss": -26.821990966796875, "global_step": 447487, "epoch": 5391} {"train_loss": -26.818124771118164, "global_step": 447488, "epoch": 5391} {"train_loss": -27.062803268432617, "global_step": 447489, "epoch": 5391} {"train_loss": -26.799306869506836, "global_step": 447490, "epoch": 5391} {"train_loss": -27.237903594970703, "global_step": 447491, "epoch": 5391} {"train_loss": -26.761449813842773, "global_step": 447492, "epoch": 5391} {"train_loss": -27.34263038635254, "global_step": 447493, "epoch": 5391} {"train_loss": -26.760425567626953, "global_step": 447494, "epoch": 5391} {"train_loss": -26.730289459228516, "global_step": 447495, "epoch": 5391} {"train_loss": -27.2412052154541, "global_step": 447496, "epoch": 5391} {"train_loss": -27.210474014282227, "global_step": 447497, "epoch": 5391} {"train_loss": -27.229394912719727, "global_step": 447498, "epoch": 5391} {"train_loss": -27.149274826049805, "global_step": 447499, "epoch": 5391} {"train_loss": -27.421228408813477, "global_step": 447500, "epoch": 5391} {"train_loss": -27.400259017944336, "global_step": 447501, "epoch": 5391} {"train_loss": -27.36773681640625, "global_step": 447502, "epoch": 5391} {"train_loss": -27.412250518798828, "global_step": 447503, "epoch": 5391} {"train_loss": -27.184783935546875, "global_step": 447504, "epoch": 5391} {"train_loss": -27.035959243774414, "global_step": 447505, "epoch": 5391} {"train_loss": -27.12457275390625, "global_step": 447506, "epoch": 5391} {"train_loss": -27.568952560424805, "global_step": 447507, "epoch": 5391} {"train_loss": -27.43464469909668, "global_step": 447508, "epoch": 5391} {"train_loss": -27.3749942779541, "global_step": 447509, "epoch": 5391} {"train_loss": -27.396814346313477, "global_step": 447510, "epoch": 5391} {"train_loss": -27.578527450561523, "global_step": 447511, "epoch": 5391} {"train_loss": -26.969974517822266, "global_step": 447512, "epoch": 5391} {"train_loss": -27.087207794189453, "global_step": 447513, "epoch": 5391} {"train_loss": -27.132877349853516, "global_step": 447514, "epoch": 5391} {"train_loss": -26.96527099609375, "global_step": 447515, "epoch": 5391} {"train_loss": -26.76014518737793, "global_step": 447516, "epoch": 5391} {"train_loss": -27.171506881713867, "global_step": 447517, "epoch": 5391} {"train_loss": -26.912866592407227, "global_step": 447518, "epoch": 5391} {"train_loss": -26.69540786743164, "global_step": 447519, "epoch": 5391} {"train_loss": -26.421716690063477, "global_step": 447520, "epoch": 5391} {"train_loss": -26.441675186157227, "global_step": 447521, "epoch": 5391} {"train_loss": -26.170917510986328, "global_step": 447522, "epoch": 5391} {"train_loss": -26.263525009155273, "global_step": 447523, "epoch": 5391} {"train_loss": -26.32752799987793, "global_step": 447524, "epoch": 5391} {"train_loss": -26.54962158203125, "global_step": 447525, "epoch": 5391} {"train_loss": -26.353498458862305, "global_step": 447526, "epoch": 5391} {"train_loss": -26.88702392578125, "global_step": 447527, "epoch": 5391} {"train_loss": -26.995630264282227, "global_step": 447528, "epoch": 5391} {"train_loss": -26.72775650024414, "global_step": 447529, "epoch": 5391} {"train_loss": -26.628870010375977, "global_step": 447530, "epoch": 5391} {"train_loss": -26.5142765045166, "global_step": 447531, "epoch": 5391} {"train_loss": -26.862844467163086, "global_step": 447532, "epoch": 5391} {"train_loss": -26.840078353881836, "global_step": 447533, "epoch": 5391} {"train_loss": -26.818708419799805, "global_step": 447534, "epoch": 5391} {"train_loss": -26.857565684490893, "global_step": 447535, "epoch": 5391, "val_loss": 6548127.0} {"train_loss": -25.988569259643555, "global_step": 447536, "epoch": 5392} {"train_loss": -25.895706176757812, "global_step": 447537, "epoch": 5392} {"train_loss": -25.704608917236328, "global_step": 447538, "epoch": 5392} {"train_loss": -26.134750366210938, "global_step": 447539, "epoch": 5392} {"train_loss": -26.36859130859375, "global_step": 447540, "epoch": 5392} {"train_loss": -26.32415199279785, "global_step": 447541, "epoch": 5392} {"train_loss": -25.87061882019043, "global_step": 447542, "epoch": 5392} {"train_loss": -26.513669967651367, "global_step": 447543, "epoch": 5392} {"train_loss": -26.08608055114746, "global_step": 447544, "epoch": 5392} {"train_loss": -26.84700584411621, "global_step": 447545, "epoch": 5392} {"train_loss": -26.5705623626709, "global_step": 447546, "epoch": 5392} {"train_loss": -26.547840118408203, "global_step": 447547, "epoch": 5392} {"train_loss": -26.421695709228516, "global_step": 447548, "epoch": 5392} {"train_loss": -26.7081298828125, "global_step": 447549, "epoch": 5392} {"train_loss": -26.2177791595459, "global_step": 447550, "epoch": 5392} {"train_loss": -26.788782119750977, "global_step": 447551, "epoch": 5392} {"train_loss": -26.388120651245117, "global_step": 447552, "epoch": 5392} {"train_loss": -26.844791412353516, "global_step": 447553, "epoch": 5392} {"train_loss": -26.711139678955078, "global_step": 447554, "epoch": 5392} {"train_loss": -26.761762619018555, "global_step": 447555, "epoch": 5392} {"train_loss": -26.54132080078125, "global_step": 447556, "epoch": 5392} {"train_loss": -26.8975887298584, "global_step": 447557, "epoch": 5392} {"train_loss": -26.5064754486084, "global_step": 447558, "epoch": 5392} {"train_loss": -26.69677734375, "global_step": 447559, "epoch": 5392} {"train_loss": -26.742589950561523, "global_step": 447560, "epoch": 5392} {"train_loss": -27.03484535217285, "global_step": 447561, "epoch": 5392} {"train_loss": -26.5611572265625, "global_step": 447562, "epoch": 5392} {"train_loss": -27.05877113342285, "global_step": 447563, "epoch": 5392} {"train_loss": -26.967008590698242, "global_step": 447564, "epoch": 5392} {"train_loss": -27.08392906188965, "global_step": 447565, "epoch": 5392} {"train_loss": -26.9024600982666, "global_step": 447566, "epoch": 5392} {"train_loss": -26.99850845336914, "global_step": 447567, "epoch": 5392} {"train_loss": -27.219533920288086, "global_step": 447568, "epoch": 5392} {"train_loss": -27.208539962768555, "global_step": 447569, "epoch": 5392} {"train_loss": -27.019269943237305, "global_step": 447570, "epoch": 5392} {"train_loss": -27.128376007080078, "global_step": 447571, "epoch": 5392} {"train_loss": -27.013105392456055, "global_step": 447572, "epoch": 5392} {"train_loss": -26.911224365234375, "global_step": 447573, "epoch": 5392} {"train_loss": -27.02945327758789, "global_step": 447574, "epoch": 5392} {"train_loss": -27.206140518188477, "global_step": 447575, "epoch": 5392} {"train_loss": -27.183557510375977, "global_step": 447576, "epoch": 5392} {"train_loss": -27.124103546142578, "global_step": 447577, "epoch": 5392} {"train_loss": -27.209104537963867, "global_step": 447578, "epoch": 5392} {"train_loss": -27.358728408813477, "global_step": 447579, "epoch": 5392} {"train_loss": -26.9998836517334, "global_step": 447580, "epoch": 5392} {"train_loss": -26.991851806640625, "global_step": 447581, "epoch": 5392} {"train_loss": -27.134429931640625, "global_step": 447582, "epoch": 5392} {"train_loss": -27.51460838317871, "global_step": 447583, "epoch": 5392} {"train_loss": -27.28606605529785, "global_step": 447584, "epoch": 5392} {"train_loss": -27.19789695739746, "global_step": 447585, "epoch": 5392} {"train_loss": -27.195627212524414, "global_step": 447586, "epoch": 5392} {"train_loss": -27.3044490814209, "global_step": 447587, "epoch": 5392} {"train_loss": -27.351810455322266, "global_step": 447588, "epoch": 5392} {"train_loss": -26.913076400756836, "global_step": 447589, "epoch": 5392} {"train_loss": -27.460119247436523, "global_step": 447590, "epoch": 5392} {"train_loss": -27.282617568969727, "global_step": 447591, "epoch": 5392} {"train_loss": -27.1602725982666, "global_step": 447592, "epoch": 5392} {"train_loss": -27.23902702331543, "global_step": 447593, "epoch": 5392} {"train_loss": -27.293603897094727, "global_step": 447594, "epoch": 5392} {"train_loss": -26.84799575805664, "global_step": 447595, "epoch": 5392} {"train_loss": -26.860980987548828, "global_step": 447596, "epoch": 5392} {"train_loss": -26.65228271484375, "global_step": 447597, "epoch": 5392} {"train_loss": -26.720746994018555, "global_step": 447598, "epoch": 5392} {"train_loss": -26.568525314331055, "global_step": 447599, "epoch": 5392} {"train_loss": -26.978626251220703, "global_step": 447600, "epoch": 5392} {"train_loss": -26.622907638549805, "global_step": 447601, "epoch": 5392} {"train_loss": -26.790851593017578, "global_step": 447602, "epoch": 5392} {"train_loss": -26.903156280517578, "global_step": 447603, "epoch": 5392} {"train_loss": -27.483871459960938, "global_step": 447604, "epoch": 5392} {"train_loss": -27.203567504882812, "global_step": 447605, "epoch": 5392} {"train_loss": -26.68109130859375, "global_step": 447606, "epoch": 5392} {"train_loss": -26.85465431213379, "global_step": 447607, "epoch": 5392} {"train_loss": -27.354766845703125, "global_step": 447608, "epoch": 5392} {"train_loss": -26.916641235351562, "global_step": 447609, "epoch": 5392} {"train_loss": -27.42390251159668, "global_step": 447610, "epoch": 5392} {"train_loss": -27.296222686767578, "global_step": 447611, "epoch": 5392} {"train_loss": -27.19403648376465, "global_step": 447612, "epoch": 5392} {"train_loss": -26.995412826538086, "global_step": 447613, "epoch": 5392} {"train_loss": -27.395069122314453, "global_step": 447614, "epoch": 5392} {"train_loss": -26.94243812561035, "global_step": 447615, "epoch": 5392} {"train_loss": -27.049468994140625, "global_step": 447616, "epoch": 5392} {"train_loss": -27.1286563873291, "global_step": 447617, "epoch": 5392} {"train_loss": -26.867780386683453, "global_step": 447618, "epoch": 5392, "val_loss": 6682949.0} {"train_loss": -24.47003173828125, "global_step": 447619, "epoch": 5393} {"train_loss": -24.374160766601562, "global_step": 447620, "epoch": 5393} {"train_loss": -26.3648624420166, "global_step": 447621, "epoch": 5393} {"train_loss": -25.910125732421875, "global_step": 447622, "epoch": 5393} {"train_loss": -24.932849884033203, "global_step": 447623, "epoch": 5393} {"train_loss": -26.18988609313965, "global_step": 447624, "epoch": 5393} {"train_loss": -26.073486328125, "global_step": 447625, "epoch": 5393} {"train_loss": -25.936269760131836, "global_step": 447626, "epoch": 5393} {"train_loss": -25.591703414916992, "global_step": 447627, "epoch": 5393} {"train_loss": -26.0274658203125, "global_step": 447628, "epoch": 5393} {"train_loss": -26.42091941833496, "global_step": 447629, "epoch": 5393} {"train_loss": -26.401498794555664, "global_step": 447630, "epoch": 5393} {"train_loss": -26.43885612487793, "global_step": 447631, "epoch": 5393} {"train_loss": -26.222925186157227, "global_step": 447632, "epoch": 5393} {"train_loss": -26.224308013916016, "global_step": 447633, "epoch": 5393} {"train_loss": -26.51362419128418, "global_step": 447634, "epoch": 5393} {"train_loss": -26.771997451782227, "global_step": 447635, "epoch": 5393} {"train_loss": -26.284626007080078, "global_step": 447636, "epoch": 5393} {"train_loss": -26.82526969909668, "global_step": 447637, "epoch": 5393} {"train_loss": -26.558652877807617, "global_step": 447638, "epoch": 5393} {"train_loss": -26.593347549438477, "global_step": 447639, "epoch": 5393} {"train_loss": -26.810810089111328, "global_step": 447640, "epoch": 5393} {"train_loss": -26.77503776550293, "global_step": 447641, "epoch": 5393} {"train_loss": -26.44131851196289, "global_step": 447642, "epoch": 5393} {"train_loss": -26.59634780883789, "global_step": 447643, "epoch": 5393} {"train_loss": -26.791168212890625, "global_step": 447644, "epoch": 5393} {"train_loss": -26.501977920532227, "global_step": 447645, "epoch": 5393} {"train_loss": -26.915790557861328, "global_step": 447646, "epoch": 5393} {"train_loss": -26.79388999938965, "global_step": 447647, "epoch": 5393} {"train_loss": -26.54511833190918, "global_step": 447648, "epoch": 5393} {"train_loss": -26.7257137298584, "global_step": 447649, "epoch": 5393} {"train_loss": -27.2547550201416, "global_step": 447650, "epoch": 5393} {"train_loss": -26.5905818939209, "global_step": 447651, "epoch": 5393} {"train_loss": -26.60856056213379, "global_step": 447652, "epoch": 5393} {"train_loss": -26.761737823486328, "global_step": 447653, "epoch": 5393} {"train_loss": -26.630035400390625, "global_step": 447654, "epoch": 5393} {"train_loss": -26.295454025268555, "global_step": 447655, "epoch": 5393} {"train_loss": -26.817575454711914, "global_step": 447656, "epoch": 5393} {"train_loss": -26.970291137695312, "global_step": 447657, "epoch": 5393} {"train_loss": -26.919891357421875, "global_step": 447658, "epoch": 5393} {"train_loss": -27.006946563720703, "global_step": 447659, "epoch": 5393} {"train_loss": -26.748746871948242, "global_step": 447660, "epoch": 5393} {"train_loss": -27.019947052001953, "global_step": 447661, "epoch": 5393} {"train_loss": -26.804367065429688, "global_step": 447662, "epoch": 5393} {"train_loss": -26.70796012878418, "global_step": 447663, "epoch": 5393} {"train_loss": -27.16023063659668, "global_step": 447664, "epoch": 5393} {"train_loss": -26.894428253173828, "global_step": 447665, "epoch": 5393} {"train_loss": -26.7707576751709, "global_step": 447666, "epoch": 5393} {"train_loss": -27.213415145874023, "global_step": 447667, "epoch": 5393} {"train_loss": -26.91383934020996, "global_step": 447668, "epoch": 5393} {"train_loss": -27.1348934173584, "global_step": 447669, "epoch": 5393} {"train_loss": -26.395238876342773, "global_step": 447670, "epoch": 5393} {"train_loss": -26.892301559448242, "global_step": 447671, "epoch": 5393} {"train_loss": -26.798328399658203, "global_step": 447672, "epoch": 5393} {"train_loss": -26.830976486206055, "global_step": 447673, "epoch": 5393} {"train_loss": -26.84112548828125, "global_step": 447674, "epoch": 5393} {"train_loss": -26.88702392578125, "global_step": 447675, "epoch": 5393} {"train_loss": -27.116064071655273, "global_step": 447676, "epoch": 5393} {"train_loss": -26.952871322631836, "global_step": 447677, "epoch": 5393} {"train_loss": -26.770465850830078, "global_step": 447678, "epoch": 5393} {"train_loss": -26.909820556640625, "global_step": 447679, "epoch": 5393} {"train_loss": -27.166845321655273, "global_step": 447680, "epoch": 5393} {"train_loss": -26.9172420501709, "global_step": 447681, "epoch": 5393} {"train_loss": -26.5797061920166, "global_step": 447682, "epoch": 5393} {"train_loss": -26.577945709228516, "global_step": 447683, "epoch": 5393} {"train_loss": -27.31641960144043, "global_step": 447684, "epoch": 5393} {"train_loss": -26.638629913330078, "global_step": 447685, "epoch": 5393} {"train_loss": -27.153730392456055, "global_step": 447686, "epoch": 5393} {"train_loss": -26.93006706237793, "global_step": 447687, "epoch": 5393} {"train_loss": -27.107168197631836, "global_step": 447688, "epoch": 5393} {"train_loss": -26.66727066040039, "global_step": 447689, "epoch": 5393} {"train_loss": -27.05097770690918, "global_step": 447690, "epoch": 5393} {"train_loss": -27.2132625579834, "global_step": 447691, "epoch": 5393} {"train_loss": -26.866552352905273, "global_step": 447692, "epoch": 5393} {"train_loss": -27.00347900390625, "global_step": 447693, "epoch": 5393} {"train_loss": -26.881305694580078, "global_step": 447694, "epoch": 5393} {"train_loss": -26.71298599243164, "global_step": 447695, "epoch": 5393} {"train_loss": -27.100305557250977, "global_step": 447696, "epoch": 5393} {"train_loss": -26.630401611328125, "global_step": 447697, "epoch": 5393} {"train_loss": -26.99550437927246, "global_step": 447698, "epoch": 5393} {"train_loss": -26.702733993530273, "global_step": 447699, "epoch": 5393} {"train_loss": -27.176084518432617, "global_step": 447700, "epoch": 5393} {"train_loss": -26.646218380296087, "global_step": 447701, "epoch": 5393, "val_loss": 6531394.0} {"train_loss": -25.514942169189453, "global_step": 447702, "epoch": 5394} {"train_loss": -25.998687744140625, "global_step": 447703, "epoch": 5394} {"train_loss": -26.064321517944336, "global_step": 447704, "epoch": 5394} {"train_loss": -26.00994300842285, "global_step": 447705, "epoch": 5394} {"train_loss": -26.42864990234375, "global_step": 447706, "epoch": 5394} {"train_loss": -26.382648468017578, "global_step": 447707, "epoch": 5394} {"train_loss": -26.188169479370117, "global_step": 447708, "epoch": 5394} {"train_loss": -26.773548126220703, "global_step": 447709, "epoch": 5394} {"train_loss": -26.439453125, "global_step": 447710, "epoch": 5394} {"train_loss": -26.660058975219727, "global_step": 447711, "epoch": 5394} {"train_loss": -26.306751251220703, "global_step": 447712, "epoch": 5394} {"train_loss": -26.570728302001953, "global_step": 447713, "epoch": 5394} {"train_loss": -26.491058349609375, "global_step": 447714, "epoch": 5394} {"train_loss": -26.61530113220215, "global_step": 447715, "epoch": 5394} {"train_loss": -26.781604766845703, "global_step": 447716, "epoch": 5394} {"train_loss": -26.450780868530273, "global_step": 447717, "epoch": 5394} {"train_loss": -26.47736930847168, "global_step": 447718, "epoch": 5394} {"train_loss": -26.64954948425293, "global_step": 447719, "epoch": 5394} {"train_loss": -26.339696884155273, "global_step": 447720, "epoch": 5394} {"train_loss": -27.049238204956055, "global_step": 447721, "epoch": 5394} {"train_loss": -26.66791343688965, "global_step": 447722, "epoch": 5394} {"train_loss": -26.497831344604492, "global_step": 447723, "epoch": 5394} {"train_loss": -26.598773956298828, "global_step": 447724, "epoch": 5394} {"train_loss": -26.441822052001953, "global_step": 447725, "epoch": 5394} {"train_loss": -26.9937686920166, "global_step": 447726, "epoch": 5394} {"train_loss": -26.851062774658203, "global_step": 447727, "epoch": 5394} {"train_loss": -26.546735763549805, "global_step": 447728, "epoch": 5394} {"train_loss": -27.010175704956055, "global_step": 447729, "epoch": 5394} {"train_loss": -26.684768676757812, "global_step": 447730, "epoch": 5394} {"train_loss": -26.6632022857666, "global_step": 447731, "epoch": 5394} {"train_loss": -26.854700088500977, "global_step": 447732, "epoch": 5394} {"train_loss": -26.954421997070312, "global_step": 447733, "epoch": 5394} {"train_loss": -26.799345016479492, "global_step": 447734, "epoch": 5394} {"train_loss": -26.775827407836914, "global_step": 447735, "epoch": 5394} {"train_loss": -26.85590171813965, "global_step": 447736, "epoch": 5394} {"train_loss": -26.882770538330078, "global_step": 447737, "epoch": 5394} {"train_loss": -26.914289474487305, "global_step": 447738, "epoch": 5394} {"train_loss": -27.162389755249023, "global_step": 447739, "epoch": 5394} {"train_loss": -27.09821128845215, "global_step": 447740, "epoch": 5394} {"train_loss": -27.016345977783203, "global_step": 447741, "epoch": 5394} {"train_loss": -27.322010040283203, "global_step": 447742, "epoch": 5394} {"train_loss": -27.158899307250977, "global_step": 447743, "epoch": 5394} {"train_loss": -27.27762222290039, "global_step": 447744, "epoch": 5394} {"train_loss": -26.958759307861328, "global_step": 447745, "epoch": 5394} {"train_loss": -27.30409049987793, "global_step": 447746, "epoch": 5394} {"train_loss": -26.848474502563477, "global_step": 447747, "epoch": 5394} {"train_loss": -27.270299911499023, "global_step": 447748, "epoch": 5394} {"train_loss": -27.22796058654785, "global_step": 447749, "epoch": 5394} {"train_loss": -26.97548484802246, "global_step": 447750, "epoch": 5394} {"train_loss": -27.16782569885254, "global_step": 447751, "epoch": 5394} {"train_loss": -27.294086456298828, "global_step": 447752, "epoch": 5394} {"train_loss": -27.5234375, "global_step": 447753, "epoch": 5394} {"train_loss": -27.25052833557129, "global_step": 447754, "epoch": 5394} {"train_loss": -27.126386642456055, "global_step": 447755, "epoch": 5394} {"train_loss": -27.487018585205078, "global_step": 447756, "epoch": 5394} {"train_loss": -27.181921005249023, "global_step": 447757, "epoch": 5394} {"train_loss": -27.304004669189453, "global_step": 447758, "epoch": 5394} {"train_loss": -26.42896842956543, "global_step": 447759, "epoch": 5394} {"train_loss": -26.923505783081055, "global_step": 447760, "epoch": 5394} {"train_loss": -26.775360107421875, "global_step": 447761, "epoch": 5394} {"train_loss": -27.44307518005371, "global_step": 447762, "epoch": 5394} {"train_loss": -27.211164474487305, "global_step": 447763, "epoch": 5394} {"train_loss": -27.01947021484375, "global_step": 447764, "epoch": 5394} {"train_loss": -27.297199249267578, "global_step": 447765, "epoch": 5394} {"train_loss": -27.18316650390625, "global_step": 447766, "epoch": 5394} {"train_loss": -27.260791778564453, "global_step": 447767, "epoch": 5394} {"train_loss": -27.436420440673828, "global_step": 447768, "epoch": 5394} {"train_loss": -27.130029678344727, "global_step": 447769, "epoch": 5394} {"train_loss": -27.289947509765625, "global_step": 447770, "epoch": 5394} {"train_loss": -26.717559814453125, "global_step": 447771, "epoch": 5394} {"train_loss": -26.436145782470703, "global_step": 447772, "epoch": 5394} {"train_loss": -26.851232528686523, "global_step": 447773, "epoch": 5394} {"train_loss": -27.00147819519043, "global_step": 447774, "epoch": 5394} {"train_loss": -26.302759170532227, "global_step": 447775, "epoch": 5394} {"train_loss": -26.650304794311523, "global_step": 447776, "epoch": 5394} {"train_loss": -26.938236236572266, "global_step": 447777, "epoch": 5394} {"train_loss": -26.974994659423828, "global_step": 447778, "epoch": 5394} {"train_loss": -26.881778717041016, "global_step": 447779, "epoch": 5394} {"train_loss": -26.768173217773438, "global_step": 447780, "epoch": 5394} {"train_loss": -26.639257431030273, "global_step": 447781, "epoch": 5394} {"train_loss": -26.296667098999023, "global_step": 447782, "epoch": 5394} {"train_loss": -26.848011016845703, "global_step": 447783, "epoch": 5394} {"train_loss": -26.838478318179945, "global_step": 447784, "epoch": 5394, "val_loss": 6566938.0} {"train_loss": -25.453039169311523, "global_step": 447785, "epoch": 5395} {"train_loss": -25.43764877319336, "global_step": 447786, "epoch": 5395} {"train_loss": -26.103271484375, "global_step": 447787, "epoch": 5395} {"train_loss": -26.285348892211914, "global_step": 447788, "epoch": 5395} {"train_loss": -25.656360626220703, "global_step": 447789, "epoch": 5395} {"train_loss": -25.6599178314209, "global_step": 447790, "epoch": 5395} {"train_loss": -26.42726707458496, "global_step": 447791, "epoch": 5395} {"train_loss": -26.036300659179688, "global_step": 447792, "epoch": 5395} {"train_loss": -26.815963745117188, "global_step": 447793, "epoch": 5395} {"train_loss": -26.52381706237793, "global_step": 447794, "epoch": 5395} {"train_loss": -26.572538375854492, "global_step": 447795, "epoch": 5395} {"train_loss": -26.54585075378418, "global_step": 447796, "epoch": 5395} {"train_loss": -26.554990768432617, "global_step": 447797, "epoch": 5395} {"train_loss": -26.645898818969727, "global_step": 447798, "epoch": 5395} {"train_loss": -26.545881271362305, "global_step": 447799, "epoch": 5395} {"train_loss": -26.780811309814453, "global_step": 447800, "epoch": 5395} {"train_loss": -26.17917823791504, "global_step": 447801, "epoch": 5395} {"train_loss": -26.383859634399414, "global_step": 447802, "epoch": 5395} {"train_loss": -26.61768913269043, "global_step": 447803, "epoch": 5395} {"train_loss": -26.70966911315918, "global_step": 447804, "epoch": 5395} {"train_loss": -26.65826988220215, "global_step": 447805, "epoch": 5395} {"train_loss": -26.612262725830078, "global_step": 447806, "epoch": 5395} {"train_loss": -26.968259811401367, "global_step": 447807, "epoch": 5395} {"train_loss": -26.85174560546875, "global_step": 447808, "epoch": 5395} {"train_loss": -26.74751091003418, "global_step": 447809, "epoch": 5395} {"train_loss": -26.78455924987793, "global_step": 447810, "epoch": 5395} {"train_loss": -26.877294540405273, "global_step": 447811, "epoch": 5395} {"train_loss": -26.508092880249023, "global_step": 447812, "epoch": 5395} {"train_loss": -27.005338668823242, "global_step": 447813, "epoch": 5395} {"train_loss": -26.70892906188965, "global_step": 447814, "epoch": 5395} {"train_loss": -27.192523956298828, "global_step": 447815, "epoch": 5395} {"train_loss": -26.708913803100586, "global_step": 447816, "epoch": 5395} {"train_loss": -27.084644317626953, "global_step": 447817, "epoch": 5395} {"train_loss": -27.15936279296875, "global_step": 447818, "epoch": 5395} {"train_loss": -26.723718643188477, "global_step": 447819, "epoch": 5395} {"train_loss": -27.293237686157227, "global_step": 447820, "epoch": 5395} {"train_loss": -26.902936935424805, "global_step": 447821, "epoch": 5395} {"train_loss": -27.21622657775879, "global_step": 447822, "epoch": 5395} {"train_loss": -26.907882690429688, "global_step": 447823, "epoch": 5395} {"train_loss": -27.268545150756836, "global_step": 447824, "epoch": 5395} {"train_loss": -27.44622802734375, "global_step": 447825, "epoch": 5395} {"train_loss": -27.243091583251953, "global_step": 447826, "epoch": 5395} {"train_loss": -27.26808738708496, "global_step": 447827, "epoch": 5395} {"train_loss": -26.699609756469727, "global_step": 447828, "epoch": 5395} {"train_loss": -27.38822364807129, "global_step": 447829, "epoch": 5395} {"train_loss": -27.2896785736084, "global_step": 447830, "epoch": 5395} {"train_loss": -27.31056022644043, "global_step": 447831, "epoch": 5395} {"train_loss": -27.079498291015625, "global_step": 447832, "epoch": 5395} {"train_loss": -27.466291427612305, "global_step": 447833, "epoch": 5395} {"train_loss": -26.97637939453125, "global_step": 447834, "epoch": 5395} {"train_loss": -27.4634952545166, "global_step": 447835, "epoch": 5395} {"train_loss": -26.995859146118164, "global_step": 447836, "epoch": 5395} {"train_loss": -27.336462020874023, "global_step": 447837, "epoch": 5395} {"train_loss": -27.269155502319336, "global_step": 447838, "epoch": 5395} {"train_loss": -27.14853858947754, "global_step": 447839, "epoch": 5395} {"train_loss": -27.20343589782715, "global_step": 447840, "epoch": 5395} {"train_loss": -27.222640991210938, "global_step": 447841, "epoch": 5395} {"train_loss": -27.269739151000977, "global_step": 447842, "epoch": 5395} {"train_loss": -27.55389404296875, "global_step": 447843, "epoch": 5395} {"train_loss": -27.014331817626953, "global_step": 447844, "epoch": 5395} {"train_loss": -26.92597007751465, "global_step": 447845, "epoch": 5395} {"train_loss": -26.93104362487793, "global_step": 447846, "epoch": 5395} {"train_loss": -26.21489906311035, "global_step": 447847, "epoch": 5395} {"train_loss": -25.943790435791016, "global_step": 447848, "epoch": 5395} {"train_loss": -25.68186378479004, "global_step": 447849, "epoch": 5395} {"train_loss": -26.28668785095215, "global_step": 447850, "epoch": 5395} {"train_loss": -26.191831588745117, "global_step": 447851, "epoch": 5395} {"train_loss": -26.64985466003418, "global_step": 447852, "epoch": 5395} {"train_loss": -26.22818374633789, "global_step": 447853, "epoch": 5395} {"train_loss": -26.747390747070312, "global_step": 447854, "epoch": 5395} {"train_loss": -26.5947265625, "global_step": 447855, "epoch": 5395} {"train_loss": -26.571191787719727, "global_step": 447856, "epoch": 5395} {"train_loss": -27.07490348815918, "global_step": 447857, "epoch": 5395} {"train_loss": -26.5125732421875, "global_step": 447858, "epoch": 5395} {"train_loss": -26.735248565673828, "global_step": 447859, "epoch": 5395} {"train_loss": -26.7755184173584, "global_step": 447860, "epoch": 5395} {"train_loss": -26.771814346313477, "global_step": 447861, "epoch": 5395} {"train_loss": -26.971927642822266, "global_step": 447862, "epoch": 5395} {"train_loss": -26.50054359436035, "global_step": 447863, "epoch": 5395} {"train_loss": -26.679779052734375, "global_step": 447864, "epoch": 5395} {"train_loss": -26.718780517578125, "global_step": 447865, "epoch": 5395} {"train_loss": -26.782276153564453, "global_step": 447866, "epoch": 5395} {"train_loss": -26.722170588481855, "global_step": 447867, "epoch": 5395, "val_loss": 6720359.5} {"train_loss": -26.110889434814453, "global_step": 447868, "epoch": 5396} {"train_loss": -26.3011474609375, "global_step": 447869, "epoch": 5396} {"train_loss": -26.564533233642578, "global_step": 447870, "epoch": 5396} {"train_loss": -26.166248321533203, "global_step": 447871, "epoch": 5396} {"train_loss": -26.51738929748535, "global_step": 447872, "epoch": 5396} {"train_loss": -26.21954917907715, "global_step": 447873, "epoch": 5396} {"train_loss": -26.51202964782715, "global_step": 447874, "epoch": 5396} {"train_loss": -26.464111328125, "global_step": 447875, "epoch": 5396} {"train_loss": -26.503021240234375, "global_step": 447876, "epoch": 5396} {"train_loss": -26.393232345581055, "global_step": 447877, "epoch": 5396} {"train_loss": -27.08698081970215, "global_step": 447878, "epoch": 5396} {"train_loss": -26.6292724609375, "global_step": 447879, "epoch": 5396} {"train_loss": -26.837635040283203, "global_step": 447880, "epoch": 5396} {"train_loss": -26.844715118408203, "global_step": 447881, "epoch": 5396} {"train_loss": -26.755359649658203, "global_step": 447882, "epoch": 5396} {"train_loss": -27.016080856323242, "global_step": 447883, "epoch": 5396} {"train_loss": -26.941492080688477, "global_step": 447884, "epoch": 5396} {"train_loss": -26.87729263305664, "global_step": 447885, "epoch": 5396} {"train_loss": -27.360788345336914, "global_step": 447886, "epoch": 5396} {"train_loss": -26.640226364135742, "global_step": 447887, "epoch": 5396} {"train_loss": -27.147619247436523, "global_step": 447888, "epoch": 5396} {"train_loss": -26.96431541442871, "global_step": 447889, "epoch": 5396} {"train_loss": -26.75164222717285, "global_step": 447890, "epoch": 5396} {"train_loss": -27.24928092956543, "global_step": 447891, "epoch": 5396} {"train_loss": -27.19451904296875, "global_step": 447892, "epoch": 5396} {"train_loss": -27.24896812438965, "global_step": 447893, "epoch": 5396} {"train_loss": -27.05975914001465, "global_step": 447894, "epoch": 5396} {"train_loss": -27.116987228393555, "global_step": 447895, "epoch": 5396} {"train_loss": -27.132659912109375, "global_step": 447896, "epoch": 5396} {"train_loss": -27.350133895874023, "global_step": 447897, "epoch": 5396} {"train_loss": -26.763303756713867, "global_step": 447898, "epoch": 5396} {"train_loss": -26.963972091674805, "global_step": 447899, "epoch": 5396} {"train_loss": -27.006261825561523, "global_step": 447900, "epoch": 5396} {"train_loss": -27.24603843688965, "global_step": 447901, "epoch": 5396} {"train_loss": -27.198959350585938, "global_step": 447902, "epoch": 5396} {"train_loss": -27.01822280883789, "global_step": 447903, "epoch": 5396} {"train_loss": -27.15339469909668, "global_step": 447904, "epoch": 5396} {"train_loss": -27.257490158081055, "global_step": 447905, "epoch": 5396} {"train_loss": -26.949670791625977, "global_step": 447906, "epoch": 5396} {"train_loss": -26.78907585144043, "global_step": 447907, "epoch": 5396} {"train_loss": -27.007226943969727, "global_step": 447908, "epoch": 5396} {"train_loss": -27.059736251831055, "global_step": 447909, "epoch": 5396} {"train_loss": -27.022634506225586, "global_step": 447910, "epoch": 5396} {"train_loss": -26.900583267211914, "global_step": 447911, "epoch": 5396} {"train_loss": -26.90162467956543, "global_step": 447912, "epoch": 5396} {"train_loss": -26.893659591674805, "global_step": 447913, "epoch": 5396} {"train_loss": -26.9548282623291, "global_step": 447914, "epoch": 5396} {"train_loss": -27.250141143798828, "global_step": 447915, "epoch": 5396} {"train_loss": -27.119787216186523, "global_step": 447916, "epoch": 5396} {"train_loss": -26.7988338470459, "global_step": 447917, "epoch": 5396} {"train_loss": -27.032550811767578, "global_step": 447918, "epoch": 5396} {"train_loss": -27.06121253967285, "global_step": 447919, "epoch": 5396} {"train_loss": -26.931310653686523, "global_step": 447920, "epoch": 5396} {"train_loss": -27.13471031188965, "global_step": 447921, "epoch": 5396} {"train_loss": -26.894956588745117, "global_step": 447922, "epoch": 5396} {"train_loss": -26.707752227783203, "global_step": 447923, "epoch": 5396} {"train_loss": -26.696985244750977, "global_step": 447924, "epoch": 5396} {"train_loss": -26.896148681640625, "global_step": 447925, "epoch": 5396} {"train_loss": -26.718341827392578, "global_step": 447926, "epoch": 5396} {"train_loss": -26.788022994995117, "global_step": 447927, "epoch": 5396} {"train_loss": -26.426502227783203, "global_step": 447928, "epoch": 5396} {"train_loss": -26.42333984375, "global_step": 447929, "epoch": 5396} {"train_loss": -26.644750595092773, "global_step": 447930, "epoch": 5396} {"train_loss": -26.456037521362305, "global_step": 447931, "epoch": 5396} {"train_loss": -26.168228149414062, "global_step": 447932, "epoch": 5396} {"train_loss": -26.66745948791504, "global_step": 447933, "epoch": 5396} {"train_loss": -26.451343536376953, "global_step": 447934, "epoch": 5396} {"train_loss": -26.555225372314453, "global_step": 447935, "epoch": 5396} {"train_loss": -26.9285831451416, "global_step": 447936, "epoch": 5396} {"train_loss": -26.73672866821289, "global_step": 447937, "epoch": 5396} {"train_loss": -26.760879516601562, "global_step": 447938, "epoch": 5396} {"train_loss": -26.771240234375, "global_step": 447939, "epoch": 5396} {"train_loss": -26.798166275024414, "global_step": 447940, "epoch": 5396} {"train_loss": -26.771270751953125, "global_step": 447941, "epoch": 5396} {"train_loss": -26.99969482421875, "global_step": 447942, "epoch": 5396} {"train_loss": -26.896305084228516, "global_step": 447943, "epoch": 5396} {"train_loss": -27.07102394104004, "global_step": 447944, "epoch": 5396} {"train_loss": -26.557775497436523, "global_step": 447945, "epoch": 5396} {"train_loss": -26.886890411376953, "global_step": 447946, "epoch": 5396} {"train_loss": -27.589923858642578, "global_step": 447947, "epoch": 5396} {"train_loss": -26.858245849609375, "global_step": 447948, "epoch": 5396} {"train_loss": -27.058164596557617, "global_step": 447949, "epoch": 5396} {"train_loss": -26.836659006325597, "global_step": 447950, "epoch": 5396, "val_loss": 6516985.0} {"train_loss": -26.99308204650879, "global_step": 447951, "epoch": 5397} {"train_loss": -27.173858642578125, "global_step": 447952, "epoch": 5397} {"train_loss": -26.9084529876709, "global_step": 447953, "epoch": 5397} {"train_loss": -27.065465927124023, "global_step": 447954, "epoch": 5397} {"train_loss": -26.41757583618164, "global_step": 447955, "epoch": 5397} {"train_loss": -26.805631637573242, "global_step": 447956, "epoch": 5397} {"train_loss": -27.192636489868164, "global_step": 447957, "epoch": 5397} {"train_loss": -26.960477828979492, "global_step": 447958, "epoch": 5397} {"train_loss": -26.8026123046875, "global_step": 447959, "epoch": 5397} {"train_loss": -26.797460556030273, "global_step": 447960, "epoch": 5397} {"train_loss": -27.298673629760742, "global_step": 447961, "epoch": 5397} {"train_loss": -26.6689395904541, "global_step": 447962, "epoch": 5397} {"train_loss": -26.9751033782959, "global_step": 447963, "epoch": 5397} {"train_loss": -27.185699462890625, "global_step": 447964, "epoch": 5397} {"train_loss": -26.925373077392578, "global_step": 447965, "epoch": 5397} {"train_loss": -27.345563888549805, "global_step": 447966, "epoch": 5397} {"train_loss": -26.826187133789062, "global_step": 447967, "epoch": 5397} {"train_loss": -27.1456356048584, "global_step": 447968, "epoch": 5397} {"train_loss": -26.994415283203125, "global_step": 447969, "epoch": 5397} {"train_loss": -26.746768951416016, "global_step": 447970, "epoch": 5397} {"train_loss": -26.961023330688477, "global_step": 447971, "epoch": 5397} {"train_loss": -27.203567504882812, "global_step": 447972, "epoch": 5397} {"train_loss": -26.8629207611084, "global_step": 447973, "epoch": 5397} {"train_loss": -27.0474796295166, "global_step": 447974, "epoch": 5397} {"train_loss": -26.676450729370117, "global_step": 447975, "epoch": 5397} {"train_loss": -27.037677764892578, "global_step": 447976, "epoch": 5397} {"train_loss": -26.81695556640625, "global_step": 447977, "epoch": 5397} {"train_loss": -27.089324951171875, "global_step": 447978, "epoch": 5397} {"train_loss": -27.3335018157959, "global_step": 447979, "epoch": 5397} {"train_loss": -27.1962947845459, "global_step": 447980, "epoch": 5397} {"train_loss": -27.228443145751953, "global_step": 447981, "epoch": 5397} {"train_loss": -26.92254638671875, "global_step": 447982, "epoch": 5397} {"train_loss": -26.906991958618164, "global_step": 447983, "epoch": 5397} {"train_loss": -27.365522384643555, "global_step": 447984, "epoch": 5397} {"train_loss": -26.792448043823242, "global_step": 447985, "epoch": 5397} {"train_loss": -27.147842407226562, "global_step": 447986, "epoch": 5397} {"train_loss": -27.0902099609375, "global_step": 447987, "epoch": 5397} {"train_loss": -27.41046714782715, "global_step": 447988, "epoch": 5397} {"train_loss": -27.284738540649414, "global_step": 447989, "epoch": 5397} {"train_loss": -26.770294189453125, "global_step": 447990, "epoch": 5397} {"train_loss": -26.945968627929688, "global_step": 447991, "epoch": 5397} {"train_loss": -27.143701553344727, "global_step": 447992, "epoch": 5397} {"train_loss": -27.082056045532227, "global_step": 447993, "epoch": 5397} {"train_loss": -27.077131271362305, "global_step": 447994, "epoch": 5397} {"train_loss": -27.222448348999023, "global_step": 447995, "epoch": 5397} {"train_loss": -26.796812057495117, "global_step": 447996, "epoch": 5397} {"train_loss": -26.898893356323242, "global_step": 447997, "epoch": 5397} {"train_loss": -26.878828048706055, "global_step": 447998, "epoch": 5397} {"train_loss": -27.233539581298828, "global_step": 447999, "epoch": 5397} {"train_loss": -27.2017879486084, "global_step": 448000, "epoch": 5397} {"train_loss": -27.16839599609375, "global_step": 448001, "epoch": 5397} {"train_loss": -27.008569717407227, "global_step": 448002, "epoch": 5397} {"train_loss": -27.021406173706055, "global_step": 448003, "epoch": 5397} {"train_loss": -27.02294921875, "global_step": 448004, "epoch": 5397} {"train_loss": -27.563861846923828, "global_step": 448005, "epoch": 5397} {"train_loss": -26.87708854675293, "global_step": 448006, "epoch": 5397} {"train_loss": -26.85230827331543, "global_step": 448007, "epoch": 5397} {"train_loss": -26.40852928161621, "global_step": 448008, "epoch": 5397} {"train_loss": -26.55999183654785, "global_step": 448009, "epoch": 5397} {"train_loss": -26.97102165222168, "global_step": 448010, "epoch": 5397} {"train_loss": -26.283166885375977, "global_step": 448011, "epoch": 5397} {"train_loss": -26.721277236938477, "global_step": 448012, "epoch": 5397} {"train_loss": -26.801843643188477, "global_step": 448013, "epoch": 5397} {"train_loss": -26.708459854125977, "global_step": 448014, "epoch": 5397} {"train_loss": -27.074039459228516, "global_step": 448015, "epoch": 5397} {"train_loss": -26.860666275024414, "global_step": 448016, "epoch": 5397} {"train_loss": -26.59433937072754, "global_step": 448017, "epoch": 5397} {"train_loss": -26.507415771484375, "global_step": 448018, "epoch": 5397} {"train_loss": -27.062414169311523, "global_step": 448019, "epoch": 5397} {"train_loss": -27.031208038330078, "global_step": 448020, "epoch": 5397} {"train_loss": -27.161701202392578, "global_step": 448021, "epoch": 5397} {"train_loss": -26.659433364868164, "global_step": 448022, "epoch": 5397} {"train_loss": -26.901987075805664, "global_step": 448023, "epoch": 5397} {"train_loss": -27.092187881469727, "global_step": 448024, "epoch": 5397} {"train_loss": -26.73885154724121, "global_step": 448025, "epoch": 5397} {"train_loss": -27.274362564086914, "global_step": 448026, "epoch": 5397} {"train_loss": -27.05267906188965, "global_step": 448027, "epoch": 5397} {"train_loss": -26.820837020874023, "global_step": 448028, "epoch": 5397} {"train_loss": -26.83379554748535, "global_step": 448029, "epoch": 5397} {"train_loss": -27.07427406311035, "global_step": 448030, "epoch": 5397} {"train_loss": -27.041706085205078, "global_step": 448031, "epoch": 5397} {"train_loss": -26.81465721130371, "global_step": 448032, "epoch": 5397} {"train_loss": -26.96559588880424, "global_step": 448033, "epoch": 5397, "val_loss": 6605093.0} {"train_loss": -26.4512939453125, "global_step": 448034, "epoch": 5398} {"train_loss": -26.40323257446289, "global_step": 448035, "epoch": 5398} {"train_loss": -26.411941528320312, "global_step": 448036, "epoch": 5398} {"train_loss": -26.802001953125, "global_step": 448037, "epoch": 5398} {"train_loss": -26.024518966674805, "global_step": 448038, "epoch": 5398} {"train_loss": -26.731847763061523, "global_step": 448039, "epoch": 5398} {"train_loss": -26.63117027282715, "global_step": 448040, "epoch": 5398} {"train_loss": -26.559823989868164, "global_step": 448041, "epoch": 5398} {"train_loss": -26.870512008666992, "global_step": 448042, "epoch": 5398} {"train_loss": -26.94032096862793, "global_step": 448043, "epoch": 5398} {"train_loss": -26.777597427368164, "global_step": 448044, "epoch": 5398} {"train_loss": -27.366113662719727, "global_step": 448045, "epoch": 5398} {"train_loss": -26.582382202148438, "global_step": 448046, "epoch": 5398} {"train_loss": -27.094715118408203, "global_step": 448047, "epoch": 5398} {"train_loss": -27.043012619018555, "global_step": 448048, "epoch": 5398} {"train_loss": -27.180316925048828, "global_step": 448049, "epoch": 5398} {"train_loss": -26.98200035095215, "global_step": 448050, "epoch": 5398} {"train_loss": -26.98829460144043, "global_step": 448051, "epoch": 5398} {"train_loss": -27.307363510131836, "global_step": 448052, "epoch": 5398} {"train_loss": -27.073583602905273, "global_step": 448053, "epoch": 5398} {"train_loss": -27.1651554107666, "global_step": 448054, "epoch": 5398} {"train_loss": -26.873931884765625, "global_step": 448055, "epoch": 5398} {"train_loss": -27.095823287963867, "global_step": 448056, "epoch": 5398} {"train_loss": -26.874225616455078, "global_step": 448057, "epoch": 5398} {"train_loss": -27.30866813659668, "global_step": 448058, "epoch": 5398} {"train_loss": -26.865026473999023, "global_step": 448059, "epoch": 5398} {"train_loss": -27.142866134643555, "global_step": 448060, "epoch": 5398} {"train_loss": -27.16388511657715, "global_step": 448061, "epoch": 5398} {"train_loss": -27.126773834228516, "global_step": 448062, "epoch": 5398} {"train_loss": -27.016738891601562, "global_step": 448063, "epoch": 5398} {"train_loss": -27.444250106811523, "global_step": 448064, "epoch": 5398} {"train_loss": -26.88686180114746, "global_step": 448065, "epoch": 5398} {"train_loss": -26.914953231811523, "global_step": 448066, "epoch": 5398} {"train_loss": -26.930700302124023, "global_step": 448067, "epoch": 5398} {"train_loss": -27.291608810424805, "global_step": 448068, "epoch": 5398} {"train_loss": -27.2209415435791, "global_step": 448069, "epoch": 5398} {"train_loss": -27.031661987304688, "global_step": 448070, "epoch": 5398} {"train_loss": -26.945371627807617, "global_step": 448071, "epoch": 5398} {"train_loss": -27.01503562927246, "global_step": 448072, "epoch": 5398} {"train_loss": -26.882604598999023, "global_step": 448073, "epoch": 5398} {"train_loss": -27.1190242767334, "global_step": 448074, "epoch": 5398} {"train_loss": -27.311737060546875, "global_step": 448075, "epoch": 5398} {"train_loss": -27.079879760742188, "global_step": 448076, "epoch": 5398} {"train_loss": -26.997827529907227, "global_step": 448077, "epoch": 5398} {"train_loss": -27.019977569580078, "global_step": 448078, "epoch": 5398} {"train_loss": -26.9623966217041, "global_step": 448079, "epoch": 5398} {"train_loss": -27.353168487548828, "global_step": 448080, "epoch": 5398} {"train_loss": -27.027372360229492, "global_step": 448081, "epoch": 5398} {"train_loss": -26.889097213745117, "global_step": 448082, "epoch": 5398} {"train_loss": -27.064619064331055, "global_step": 448083, "epoch": 5398} {"train_loss": -27.0539493560791, "global_step": 448084, "epoch": 5398} {"train_loss": -26.82441520690918, "global_step": 448085, "epoch": 5398} {"train_loss": -27.486310958862305, "global_step": 448086, "epoch": 5398} {"train_loss": -26.773059844970703, "global_step": 448087, "epoch": 5398} {"train_loss": -26.624616622924805, "global_step": 448088, "epoch": 5398} {"train_loss": -26.7773494720459, "global_step": 448089, "epoch": 5398} {"train_loss": -26.709735870361328, "global_step": 448090, "epoch": 5398} {"train_loss": -26.432104110717773, "global_step": 448091, "epoch": 5398} {"train_loss": -26.386579513549805, "global_step": 448092, "epoch": 5398} {"train_loss": -26.370203018188477, "global_step": 448093, "epoch": 5398} {"train_loss": -27.223310470581055, "global_step": 448094, "epoch": 5398} {"train_loss": -26.750019073486328, "global_step": 448095, "epoch": 5398} {"train_loss": -27.202987670898438, "global_step": 448096, "epoch": 5398} {"train_loss": -27.06027603149414, "global_step": 448097, "epoch": 5398} {"train_loss": -26.78785514831543, "global_step": 448098, "epoch": 5398} {"train_loss": -26.85100746154785, "global_step": 448099, "epoch": 5398} {"train_loss": -26.764028549194336, "global_step": 448100, "epoch": 5398} {"train_loss": -26.897634506225586, "global_step": 448101, "epoch": 5398} {"train_loss": -27.16547203063965, "global_step": 448102, "epoch": 5398} {"train_loss": -27.137372970581055, "global_step": 448103, "epoch": 5398} {"train_loss": -26.827062606811523, "global_step": 448104, "epoch": 5398} {"train_loss": -26.857507705688477, "global_step": 448105, "epoch": 5398} {"train_loss": -27.195714950561523, "global_step": 448106, "epoch": 5398} {"train_loss": -27.131811141967773, "global_step": 448107, "epoch": 5398} {"train_loss": -26.70204734802246, "global_step": 448108, "epoch": 5398} {"train_loss": -26.752899169921875, "global_step": 448109, "epoch": 5398} {"train_loss": -26.97250747680664, "global_step": 448110, "epoch": 5398} {"train_loss": -26.99049949645996, "global_step": 448111, "epoch": 5398} {"train_loss": -27.147602081298828, "global_step": 448112, "epoch": 5398} {"train_loss": -26.81292152404785, "global_step": 448113, "epoch": 5398} {"train_loss": -27.151620864868164, "global_step": 448114, "epoch": 5398} {"train_loss": -26.827062606811523, "global_step": 448115, "epoch": 5398} {"train_loss": -26.943348528390906, "global_step": 448116, "epoch": 5398, "val_loss": 6621415.0} {"train_loss": -27.109655380249023, "global_step": 448117, "epoch": 5399} {"train_loss": -26.461462020874023, "global_step": 448118, "epoch": 5399} {"train_loss": -26.710437774658203, "global_step": 448119, "epoch": 5399} {"train_loss": -26.89470863342285, "global_step": 448120, "epoch": 5399} {"train_loss": -26.273534774780273, "global_step": 448121, "epoch": 5399} {"train_loss": -26.607959747314453, "global_step": 448122, "epoch": 5399} {"train_loss": -26.26888084411621, "global_step": 448123, "epoch": 5399} {"train_loss": -26.662412643432617, "global_step": 448124, "epoch": 5399} {"train_loss": -26.778039932250977, "global_step": 448125, "epoch": 5399} {"train_loss": -26.659032821655273, "global_step": 448126, "epoch": 5399} {"train_loss": -26.639814376831055, "global_step": 448127, "epoch": 5399} {"train_loss": -27.15869140625, "global_step": 448128, "epoch": 5399} {"train_loss": -26.661087036132812, "global_step": 448129, "epoch": 5399} {"train_loss": -26.550159454345703, "global_step": 448130, "epoch": 5399} {"train_loss": -26.774311065673828, "global_step": 448131, "epoch": 5399} {"train_loss": -26.97273063659668, "global_step": 448132, "epoch": 5399} {"train_loss": -27.001739501953125, "global_step": 448133, "epoch": 5399} {"train_loss": -27.086339950561523, "global_step": 448134, "epoch": 5399} {"train_loss": -26.89603614807129, "global_step": 448135, "epoch": 5399} {"train_loss": -26.77496910095215, "global_step": 448136, "epoch": 5399} {"train_loss": -27.21502685546875, "global_step": 448137, "epoch": 5399} {"train_loss": -27.025470733642578, "global_step": 448138, "epoch": 5399} {"train_loss": -27.122678756713867, "global_step": 448139, "epoch": 5399} {"train_loss": -26.954364776611328, "global_step": 448140, "epoch": 5399} {"train_loss": -26.604358673095703, "global_step": 448141, "epoch": 5399} {"train_loss": -27.101444244384766, "global_step": 448142, "epoch": 5399} {"train_loss": -26.911375045776367, "global_step": 448143, "epoch": 5399} {"train_loss": -27.120492935180664, "global_step": 448144, "epoch": 5399} {"train_loss": -27.2398738861084, "global_step": 448145, "epoch": 5399} {"train_loss": -27.204883575439453, "global_step": 448146, "epoch": 5399} {"train_loss": -27.165058135986328, "global_step": 448147, "epoch": 5399} {"train_loss": -27.228784561157227, "global_step": 448148, "epoch": 5399} {"train_loss": -26.950342178344727, "global_step": 448149, "epoch": 5399} {"train_loss": -27.203510284423828, "global_step": 448150, "epoch": 5399} {"train_loss": -27.27898597717285, "global_step": 448151, "epoch": 5399} {"train_loss": -27.156396865844727, "global_step": 448152, "epoch": 5399} {"train_loss": -27.356098175048828, "global_step": 448153, "epoch": 5399} {"train_loss": -26.9144287109375, "global_step": 448154, "epoch": 5399} {"train_loss": -26.88142204284668, "global_step": 448155, "epoch": 5399} {"train_loss": -26.91512107849121, "global_step": 448156, "epoch": 5399} {"train_loss": -27.216337203979492, "global_step": 448157, "epoch": 5399} {"train_loss": -27.307249069213867, "global_step": 448158, "epoch": 5399} {"train_loss": -26.78904151916504, "global_step": 448159, "epoch": 5399} {"train_loss": -26.869739532470703, "global_step": 448160, "epoch": 5399} {"train_loss": -27.18202781677246, "global_step": 448161, "epoch": 5399} {"train_loss": -27.21234130859375, "global_step": 448162, "epoch": 5399} {"train_loss": -27.042516708374023, "global_step": 448163, "epoch": 5399} {"train_loss": -27.091352462768555, "global_step": 448164, "epoch": 5399} {"train_loss": -26.72810173034668, "global_step": 448165, "epoch": 5399} {"train_loss": -26.944028854370117, "global_step": 448166, "epoch": 5399} {"train_loss": -27.226980209350586, "global_step": 448167, "epoch": 5399} {"train_loss": -26.968719482421875, "global_step": 448168, "epoch": 5399} {"train_loss": -26.97039222717285, "global_step": 448169, "epoch": 5399} {"train_loss": -26.478912353515625, "global_step": 448170, "epoch": 5399} {"train_loss": -26.09560203552246, "global_step": 448171, "epoch": 5399} {"train_loss": -26.605661392211914, "global_step": 448172, "epoch": 5399} {"train_loss": -26.864957809448242, "global_step": 448173, "epoch": 5399} {"train_loss": -26.764413833618164, "global_step": 448174, "epoch": 5399} {"train_loss": -26.585098266601562, "global_step": 448175, "epoch": 5399} {"train_loss": -26.865570068359375, "global_step": 448176, "epoch": 5399} {"train_loss": -26.894750595092773, "global_step": 448177, "epoch": 5399} {"train_loss": -27.115802764892578, "global_step": 448178, "epoch": 5399} {"train_loss": -26.76283073425293, "global_step": 448179, "epoch": 5399} {"train_loss": -26.766706466674805, "global_step": 448180, "epoch": 5399} {"train_loss": -26.548389434814453, "global_step": 448181, "epoch": 5399} {"train_loss": -26.634923934936523, "global_step": 448182, "epoch": 5399} {"train_loss": -26.935256958007812, "global_step": 448183, "epoch": 5399} {"train_loss": -26.38882827758789, "global_step": 448184, "epoch": 5399} {"train_loss": -26.80344581604004, "global_step": 448185, "epoch": 5399} {"train_loss": -26.935819625854492, "global_step": 448186, "epoch": 5399} {"train_loss": -26.92658042907715, "global_step": 448187, "epoch": 5399} {"train_loss": -26.784421920776367, "global_step": 448188, "epoch": 5399} {"train_loss": -26.64198875427246, "global_step": 448189, "epoch": 5399} {"train_loss": -26.996252059936523, "global_step": 448190, "epoch": 5399} {"train_loss": -26.612659454345703, "global_step": 448191, "epoch": 5399} {"train_loss": -26.57146644592285, "global_step": 448192, "epoch": 5399} {"train_loss": -27.135974884033203, "global_step": 448193, "epoch": 5399} {"train_loss": -26.79196548461914, "global_step": 448194, "epoch": 5399} {"train_loss": -26.963516235351562, "global_step": 448195, "epoch": 5399} {"train_loss": -26.765233993530273, "global_step": 448196, "epoch": 5399} {"train_loss": -26.8845157623291, "global_step": 448197, "epoch": 5399} {"train_loss": -26.84269142150879, "global_step": 448198, "epoch": 5399} {"train_loss": -26.8967336861484, "global_step": 448199, "epoch": 5399, "val_loss": 6554134.5} {"train_loss": -24.638341903686523, "global_step": 448200, "epoch": 5400} {"train_loss": -25.730361938476562, "global_step": 448201, "epoch": 5400} {"train_loss": -25.5730037689209, "global_step": 448202, "epoch": 5400} {"train_loss": -25.40606117248535, "global_step": 448203, "epoch": 5400} {"train_loss": -25.788883209228516, "global_step": 448204, "epoch": 5400} {"train_loss": -25.8410587310791, "global_step": 448205, "epoch": 5400} {"train_loss": -25.827070236206055, "global_step": 448206, "epoch": 5400} {"train_loss": -25.905872344970703, "global_step": 448207, "epoch": 5400} {"train_loss": -26.14983558654785, "global_step": 448208, "epoch": 5400} {"train_loss": -26.147024154663086, "global_step": 448209, "epoch": 5400} {"train_loss": -26.31475257873535, "global_step": 448210, "epoch": 5400} {"train_loss": -26.2688045501709, "global_step": 448211, "epoch": 5400} {"train_loss": -26.560672760009766, "global_step": 448212, "epoch": 5400} {"train_loss": -26.369979858398438, "global_step": 448213, "epoch": 5400} {"train_loss": -26.73274040222168, "global_step": 448214, "epoch": 5400} {"train_loss": -26.307544708251953, "global_step": 448215, "epoch": 5400} {"train_loss": -26.862640380859375, "global_step": 448216, "epoch": 5400} {"train_loss": -26.206836700439453, "global_step": 448217, "epoch": 5400} {"train_loss": -26.393787384033203, "global_step": 448218, "epoch": 5400} {"train_loss": -26.20037841796875, "global_step": 448219, "epoch": 5400} {"train_loss": -26.42217445373535, "global_step": 448220, "epoch": 5400} {"train_loss": -26.532947540283203, "global_step": 448221, "epoch": 5400} {"train_loss": -26.513137817382812, "global_step": 448222, "epoch": 5400} {"train_loss": -26.644956588745117, "global_step": 448223, "epoch": 5400} {"train_loss": -26.549671173095703, "global_step": 448224, "epoch": 5400} {"train_loss": -26.43794059753418, "global_step": 448225, "epoch": 5400} {"train_loss": -26.765979766845703, "global_step": 448226, "epoch": 5400} {"train_loss": -26.8819522857666, "global_step": 448227, "epoch": 5400} {"train_loss": -26.458662033081055, "global_step": 448228, "epoch": 5400} {"train_loss": -26.86958885192871, "global_step": 448229, "epoch": 5400} {"train_loss": -26.68170166015625, "global_step": 448230, "epoch": 5400} {"train_loss": -26.666183471679688, "global_step": 448231, "epoch": 5400} {"train_loss": -26.7786808013916, "global_step": 448232, "epoch": 5400} {"train_loss": -26.7705078125, "global_step": 448233, "epoch": 5400} {"train_loss": -27.0574893951416, "global_step": 448234, "epoch": 5400} {"train_loss": -26.6417179107666, "global_step": 448235, "epoch": 5400} {"train_loss": -27.173364639282227, "global_step": 448236, "epoch": 5400} {"train_loss": -26.80640983581543, "global_step": 448237, "epoch": 5400} {"train_loss": -27.059640884399414, "global_step": 448238, "epoch": 5400} {"train_loss": -26.953388214111328, "global_step": 448239, "epoch": 5400} {"train_loss": -26.4406795501709, "global_step": 448240, "epoch": 5400} {"train_loss": -26.689594268798828, "global_step": 448241, "epoch": 5400} {"train_loss": -27.064985275268555, "global_step": 448242, "epoch": 5400} {"train_loss": -26.83077049255371, "global_step": 448243, "epoch": 5400} {"train_loss": -26.694395065307617, "global_step": 448244, "epoch": 5400} {"train_loss": -26.643951416015625, "global_step": 448245, "epoch": 5400} {"train_loss": -26.64936637878418, "global_step": 448246, "epoch": 5400} {"train_loss": -26.845014572143555, "global_step": 448247, "epoch": 5400} {"train_loss": -27.1901912689209, "global_step": 448248, "epoch": 5400} {"train_loss": -26.908361434936523, "global_step": 448249, "epoch": 5400} {"train_loss": -27.126340866088867, "global_step": 448250, "epoch": 5400} {"train_loss": -27.079145431518555, "global_step": 448251, "epoch": 5400} {"train_loss": -27.202245712280273, "global_step": 448252, "epoch": 5400} {"train_loss": -27.15394401550293, "global_step": 448253, "epoch": 5400} {"train_loss": -26.943639755249023, "global_step": 448254, "epoch": 5400} {"train_loss": -27.191787719726562, "global_step": 448255, "epoch": 5400} {"train_loss": -26.91365623474121, "global_step": 448256, "epoch": 5400} {"train_loss": -26.881427764892578, "global_step": 448257, "epoch": 5400} {"train_loss": -26.93963623046875, "global_step": 448258, "epoch": 5400} {"train_loss": -27.127790451049805, "global_step": 448259, "epoch": 5400} {"train_loss": -26.924352645874023, "global_step": 448260, "epoch": 5400} {"train_loss": -26.806005477905273, "global_step": 448261, "epoch": 5400} {"train_loss": -27.042490005493164, "global_step": 448262, "epoch": 5400} {"train_loss": -27.17551612854004, "global_step": 448263, "epoch": 5400} {"train_loss": -27.0461368560791, "global_step": 448264, "epoch": 5400} {"train_loss": -27.225311279296875, "global_step": 448265, "epoch": 5400} {"train_loss": -27.22767448425293, "global_step": 448266, "epoch": 5400} {"train_loss": -26.812103271484375, "global_step": 448267, "epoch": 5400} {"train_loss": -27.171804428100586, "global_step": 448268, "epoch": 5400} {"train_loss": -26.932035446166992, "global_step": 448269, "epoch": 5400} {"train_loss": -27.08526039123535, "global_step": 448270, "epoch": 5400} {"train_loss": -27.0305118560791, "global_step": 448271, "epoch": 5400} {"train_loss": -27.12643814086914, "global_step": 448272, "epoch": 5400} {"train_loss": -26.9245548248291, "global_step": 448273, "epoch": 5400} {"train_loss": -26.781967163085938, "global_step": 448274, "epoch": 5400} {"train_loss": -26.864912033081055, "global_step": 448275, "epoch": 5400} {"train_loss": -26.796619415283203, "global_step": 448276, "epoch": 5400} {"train_loss": -27.239221572875977, "global_step": 448277, "epoch": 5400} {"train_loss": -26.85450553894043, "global_step": 448278, "epoch": 5400} {"train_loss": -26.415180206298828, "global_step": 448279, "epoch": 5400} {"train_loss": -26.786237716674805, "global_step": 448280, "epoch": 5400} {"train_loss": -27.046844482421875, "global_step": 448281, "epoch": 5400} {"train_loss": -26.663045377616424, "global_step": 448282, "epoch": 5400, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6643642.0} {"train_loss": -26.24397850036621, "global_step": 448283, "epoch": 5401} {"train_loss": -26.394742965698242, "global_step": 448284, "epoch": 5401} {"train_loss": -26.54965591430664, "global_step": 448285, "epoch": 5401} {"train_loss": -26.60719871520996, "global_step": 448286, "epoch": 5401} {"train_loss": -26.324548721313477, "global_step": 448287, "epoch": 5401} {"train_loss": -25.53839683532715, "global_step": 448288, "epoch": 5401} {"train_loss": -26.44559097290039, "global_step": 448289, "epoch": 5401} {"train_loss": -25.5654239654541, "global_step": 448290, "epoch": 5401} {"train_loss": -26.154621124267578, "global_step": 448291, "epoch": 5401} {"train_loss": -26.3348388671875, "global_step": 448292, "epoch": 5401} {"train_loss": -25.907758712768555, "global_step": 448293, "epoch": 5401} {"train_loss": -26.216211318969727, "global_step": 448294, "epoch": 5401} {"train_loss": -26.232776641845703, "global_step": 448295, "epoch": 5401} {"train_loss": -25.87123680114746, "global_step": 448296, "epoch": 5401} {"train_loss": -26.360645294189453, "global_step": 448297, "epoch": 5401} {"train_loss": -26.363636016845703, "global_step": 448298, "epoch": 5401} {"train_loss": -26.19524574279785, "global_step": 448299, "epoch": 5401} {"train_loss": -26.19471549987793, "global_step": 448300, "epoch": 5401} {"train_loss": -26.289358139038086, "global_step": 448301, "epoch": 5401} {"train_loss": -26.635007858276367, "global_step": 448302, "epoch": 5401} {"train_loss": -26.585906982421875, "global_step": 448303, "epoch": 5401} {"train_loss": -26.5920352935791, "global_step": 448304, "epoch": 5401} {"train_loss": -26.94650650024414, "global_step": 448305, "epoch": 5401} {"train_loss": -26.382694244384766, "global_step": 448306, "epoch": 5401} {"train_loss": -26.753387451171875, "global_step": 448307, "epoch": 5401} {"train_loss": -26.425918579101562, "global_step": 448308, "epoch": 5401} {"train_loss": -26.49518394470215, "global_step": 448309, "epoch": 5401} {"train_loss": -26.569995880126953, "global_step": 448310, "epoch": 5401} {"train_loss": -26.512664794921875, "global_step": 448311, "epoch": 5401} {"train_loss": -26.565778732299805, "global_step": 448312, "epoch": 5401} {"train_loss": -26.7549991607666, "global_step": 448313, "epoch": 5401} {"train_loss": -26.654178619384766, "global_step": 448314, "epoch": 5401} {"train_loss": -26.993213653564453, "global_step": 448315, "epoch": 5401} {"train_loss": -26.429285049438477, "global_step": 448316, "epoch": 5401} {"train_loss": -26.856800079345703, "global_step": 448317, "epoch": 5401} {"train_loss": -26.829694747924805, "global_step": 448318, "epoch": 5401} {"train_loss": -26.97623062133789, "global_step": 448319, "epoch": 5401} {"train_loss": -26.964630126953125, "global_step": 448320, "epoch": 5401} {"train_loss": -26.74837303161621, "global_step": 448321, "epoch": 5401} {"train_loss": -26.891576766967773, "global_step": 448322, "epoch": 5401} {"train_loss": -26.94927406311035, "global_step": 448323, "epoch": 5401} {"train_loss": -26.790800094604492, "global_step": 448324, "epoch": 5401} {"train_loss": -26.857046127319336, "global_step": 448325, "epoch": 5401} {"train_loss": -27.286718368530273, "global_step": 448326, "epoch": 5401} {"train_loss": -27.00323486328125, "global_step": 448327, "epoch": 5401} {"train_loss": -27.188613891601562, "global_step": 448328, "epoch": 5401} {"train_loss": -27.23052978515625, "global_step": 448329, "epoch": 5401} {"train_loss": -27.31378173828125, "global_step": 448330, "epoch": 5401} {"train_loss": -27.094282150268555, "global_step": 448331, "epoch": 5401} {"train_loss": -27.066116333007812, "global_step": 448332, "epoch": 5401} {"train_loss": -27.203842163085938, "global_step": 448333, "epoch": 5401} {"train_loss": -26.86408042907715, "global_step": 448334, "epoch": 5401} {"train_loss": -27.296558380126953, "global_step": 448335, "epoch": 5401} {"train_loss": -26.726825714111328, "global_step": 448336, "epoch": 5401} {"train_loss": -27.299575805664062, "global_step": 448337, "epoch": 5401} {"train_loss": -27.179758071899414, "global_step": 448338, "epoch": 5401} {"train_loss": -27.218997955322266, "global_step": 448339, "epoch": 5401} {"train_loss": -27.243093490600586, "global_step": 448340, "epoch": 5401} {"train_loss": -27.261749267578125, "global_step": 448341, "epoch": 5401} {"train_loss": -27.187559127807617, "global_step": 448342, "epoch": 5401} {"train_loss": -26.814193725585938, "global_step": 448343, "epoch": 5401} {"train_loss": -27.38492774963379, "global_step": 448344, "epoch": 5401} {"train_loss": -27.03362464904785, "global_step": 448345, "epoch": 5401} {"train_loss": -27.18296241760254, "global_step": 448346, "epoch": 5401} {"train_loss": -26.805877685546875, "global_step": 448347, "epoch": 5401} {"train_loss": -27.26576805114746, "global_step": 448348, "epoch": 5401} {"train_loss": -27.009057998657227, "global_step": 448349, "epoch": 5401} {"train_loss": -27.295867919921875, "global_step": 448350, "epoch": 5401} {"train_loss": -27.151464462280273, "global_step": 448351, "epoch": 5401} {"train_loss": -26.927953720092773, "global_step": 448352, "epoch": 5401} {"train_loss": -27.03122329711914, "global_step": 448353, "epoch": 5401} {"train_loss": -27.388477325439453, "global_step": 448354, "epoch": 5401} {"train_loss": -26.892242431640625, "global_step": 448355, "epoch": 5401} {"train_loss": -26.598295211791992, "global_step": 448356, "epoch": 5401} {"train_loss": -27.45513343811035, "global_step": 448357, "epoch": 5401} {"train_loss": -26.90728759765625, "global_step": 448358, "epoch": 5401} {"train_loss": -26.473011016845703, "global_step": 448359, "epoch": 5401} {"train_loss": -27.182697296142578, "global_step": 448360, "epoch": 5401} {"train_loss": -26.442548751831055, "global_step": 448361, "epoch": 5401} {"train_loss": -27.096837997436523, "global_step": 448362, "epoch": 5401} {"train_loss": -26.969236373901367, "global_step": 448363, "epoch": 5401} {"train_loss": -27.067581176757812, "global_step": 448364, "epoch": 5401} {"train_loss": -26.764037028852716, "global_step": 448365, "epoch": 5401, "val_loss": 6597563.5} {"train_loss": -27.107269287109375, "global_step": 448366, "epoch": 5402} {"train_loss": -26.383026123046875, "global_step": 448367, "epoch": 5402} {"train_loss": -26.81562614440918, "global_step": 448368, "epoch": 5402} {"train_loss": -26.804920196533203, "global_step": 448369, "epoch": 5402} {"train_loss": -27.021015167236328, "global_step": 448370, "epoch": 5402} {"train_loss": -27.0913028717041, "global_step": 448371, "epoch": 5402} {"train_loss": -26.821836471557617, "global_step": 448372, "epoch": 5402} {"train_loss": -26.711536407470703, "global_step": 448373, "epoch": 5402} {"train_loss": -26.66111183166504, "global_step": 448374, "epoch": 5402} {"train_loss": -26.549835205078125, "global_step": 448375, "epoch": 5402} {"train_loss": -26.71966552734375, "global_step": 448376, "epoch": 5402} {"train_loss": -26.59022331237793, "global_step": 448377, "epoch": 5402} {"train_loss": -26.529163360595703, "global_step": 448378, "epoch": 5402} {"train_loss": -26.571455001831055, "global_step": 448379, "epoch": 5402} {"train_loss": -26.769271850585938, "global_step": 448380, "epoch": 5402} {"train_loss": -26.825727462768555, "global_step": 448381, "epoch": 5402} {"train_loss": -27.040164947509766, "global_step": 448382, "epoch": 5402} {"train_loss": -26.9019775390625, "global_step": 448383, "epoch": 5402} {"train_loss": -26.6832275390625, "global_step": 448384, "epoch": 5402} {"train_loss": -26.867340087890625, "global_step": 448385, "epoch": 5402} {"train_loss": -26.714590072631836, "global_step": 448386, "epoch": 5402} {"train_loss": -27.1143856048584, "global_step": 448387, "epoch": 5402} {"train_loss": -27.061511993408203, "global_step": 448388, "epoch": 5402} {"train_loss": -27.058425903320312, "global_step": 448389, "epoch": 5402} {"train_loss": -26.978031158447266, "global_step": 448390, "epoch": 5402} {"train_loss": -26.7645320892334, "global_step": 448391, "epoch": 5402} {"train_loss": -26.86850929260254, "global_step": 448392, "epoch": 5402} {"train_loss": -27.374608993530273, "global_step": 448393, "epoch": 5402} {"train_loss": -26.9816951751709, "global_step": 448394, "epoch": 5402} {"train_loss": -26.8277587890625, "global_step": 448395, "epoch": 5402} {"train_loss": -26.709808349609375, "global_step": 448396, "epoch": 5402} {"train_loss": -27.28363037109375, "global_step": 448397, "epoch": 5402} {"train_loss": -27.156774520874023, "global_step": 448398, "epoch": 5402} {"train_loss": -26.635934829711914, "global_step": 448399, "epoch": 5402} {"train_loss": -26.85382652282715, "global_step": 448400, "epoch": 5402} {"train_loss": -26.944812774658203, "global_step": 448401, "epoch": 5402} {"train_loss": -26.8984317779541, "global_step": 448402, "epoch": 5402} {"train_loss": -27.143335342407227, "global_step": 448403, "epoch": 5402} {"train_loss": -26.85697364807129, "global_step": 448404, "epoch": 5402} {"train_loss": -27.198530197143555, "global_step": 448405, "epoch": 5402} {"train_loss": -27.42742919921875, "global_step": 448406, "epoch": 5402} {"train_loss": -27.0509090423584, "global_step": 448407, "epoch": 5402} {"train_loss": -27.572559356689453, "global_step": 448408, "epoch": 5402} {"train_loss": -27.254749298095703, "global_step": 448409, "epoch": 5402} {"train_loss": -27.225326538085938, "global_step": 448410, "epoch": 5402} {"train_loss": -27.398237228393555, "global_step": 448411, "epoch": 5402} {"train_loss": -27.072998046875, "global_step": 448412, "epoch": 5402} {"train_loss": -27.190204620361328, "global_step": 448413, "epoch": 5402} {"train_loss": -27.04188346862793, "global_step": 448414, "epoch": 5402} {"train_loss": -26.86408805847168, "global_step": 448415, "epoch": 5402} {"train_loss": -26.93552589416504, "global_step": 448416, "epoch": 5402} {"train_loss": -26.846851348876953, "global_step": 448417, "epoch": 5402} {"train_loss": -26.796756744384766, "global_step": 448418, "epoch": 5402} {"train_loss": -27.222152709960938, "global_step": 448419, "epoch": 5402} {"train_loss": -27.191181182861328, "global_step": 448420, "epoch": 5402} {"train_loss": -26.713659286499023, "global_step": 448421, "epoch": 5402} {"train_loss": -27.126007080078125, "global_step": 448422, "epoch": 5402} {"train_loss": -27.013824462890625, "global_step": 448423, "epoch": 5402} {"train_loss": -26.810083389282227, "global_step": 448424, "epoch": 5402} {"train_loss": -26.668487548828125, "global_step": 448425, "epoch": 5402} {"train_loss": -26.576940536499023, "global_step": 448426, "epoch": 5402} {"train_loss": -26.025772094726562, "global_step": 448427, "epoch": 5402} {"train_loss": -26.665149688720703, "global_step": 448428, "epoch": 5402} {"train_loss": -26.93729591369629, "global_step": 448429, "epoch": 5402} {"train_loss": -27.326032638549805, "global_step": 448430, "epoch": 5402} {"train_loss": -27.019378662109375, "global_step": 448431, "epoch": 5402} {"train_loss": -27.2242431640625, "global_step": 448432, "epoch": 5402} {"train_loss": -26.85906982421875, "global_step": 448433, "epoch": 5402} {"train_loss": -26.680557250976562, "global_step": 448434, "epoch": 5402} {"train_loss": -26.866491317749023, "global_step": 448435, "epoch": 5402} {"train_loss": -27.015670776367188, "global_step": 448436, "epoch": 5402} {"train_loss": -27.081256866455078, "global_step": 448437, "epoch": 5402} {"train_loss": -27.032703399658203, "global_step": 448438, "epoch": 5402} {"train_loss": -27.267257690429688, "global_step": 448439, "epoch": 5402} {"train_loss": -27.010883331298828, "global_step": 448440, "epoch": 5402} {"train_loss": -27.1898193359375, "global_step": 448441, "epoch": 5402} {"train_loss": -27.483190536499023, "global_step": 448442, "epoch": 5402} {"train_loss": -27.5069580078125, "global_step": 448443, "epoch": 5402} {"train_loss": -27.013395309448242, "global_step": 448444, "epoch": 5402} {"train_loss": -27.00737953186035, "global_step": 448445, "epoch": 5402} {"train_loss": -26.94515037536621, "global_step": 448446, "epoch": 5402} {"train_loss": -26.996612548828125, "global_step": 448447, "epoch": 5402} {"train_loss": -26.95543371912945, "global_step": 448448, "epoch": 5402, "val_loss": 6632980.5} {"train_loss": -25.06073760986328, "global_step": 448449, "epoch": 5403} {"train_loss": -24.255369186401367, "global_step": 448450, "epoch": 5403} {"train_loss": -26.6726016998291, "global_step": 448451, "epoch": 5403} {"train_loss": -24.704275131225586, "global_step": 448452, "epoch": 5403} {"train_loss": -26.278522491455078, "global_step": 448453, "epoch": 5403} {"train_loss": -26.009180068969727, "global_step": 448454, "epoch": 5403} {"train_loss": -26.81038475036621, "global_step": 448455, "epoch": 5403} {"train_loss": -25.82073402404785, "global_step": 448456, "epoch": 5403} {"train_loss": -26.58424186706543, "global_step": 448457, "epoch": 5403} {"train_loss": -26.20228385925293, "global_step": 448458, "epoch": 5403} {"train_loss": -26.453283309936523, "global_step": 448459, "epoch": 5403} {"train_loss": -26.376935958862305, "global_step": 448460, "epoch": 5403} {"train_loss": -26.37029457092285, "global_step": 448461, "epoch": 5403} {"train_loss": -26.596044540405273, "global_step": 448462, "epoch": 5403} {"train_loss": -26.471044540405273, "global_step": 448463, "epoch": 5403} {"train_loss": -26.1170597076416, "global_step": 448464, "epoch": 5403} {"train_loss": -26.661853790283203, "global_step": 448465, "epoch": 5403} {"train_loss": -26.730396270751953, "global_step": 448466, "epoch": 5403} {"train_loss": -26.51222038269043, "global_step": 448467, "epoch": 5403} {"train_loss": -26.856128692626953, "global_step": 448468, "epoch": 5403} {"train_loss": -26.88749122619629, "global_step": 448469, "epoch": 5403} {"train_loss": -26.47027587890625, "global_step": 448470, "epoch": 5403} {"train_loss": -27.078693389892578, "global_step": 448471, "epoch": 5403} {"train_loss": -27.027332305908203, "global_step": 448472, "epoch": 5403} {"train_loss": -26.731470108032227, "global_step": 448473, "epoch": 5403} {"train_loss": -26.628875732421875, "global_step": 448474, "epoch": 5403} {"train_loss": -26.46659278869629, "global_step": 448475, "epoch": 5403} {"train_loss": -26.614105224609375, "global_step": 448476, "epoch": 5403} {"train_loss": -26.704742431640625, "global_step": 448477, "epoch": 5403} {"train_loss": -26.605789184570312, "global_step": 448478, "epoch": 5403} {"train_loss": -26.828031539916992, "global_step": 448479, "epoch": 5403} {"train_loss": -26.6090030670166, "global_step": 448480, "epoch": 5403} {"train_loss": -27.032758712768555, "global_step": 448481, "epoch": 5403} {"train_loss": -26.866546630859375, "global_step": 448482, "epoch": 5403} {"train_loss": -26.215682983398438, "global_step": 448483, "epoch": 5403} {"train_loss": -26.942035675048828, "global_step": 448484, "epoch": 5403} {"train_loss": -27.04568862915039, "global_step": 448485, "epoch": 5403} {"train_loss": -26.555774688720703, "global_step": 448486, "epoch": 5403} {"train_loss": -26.7220401763916, "global_step": 448487, "epoch": 5403} {"train_loss": -26.74188804626465, "global_step": 448488, "epoch": 5403} {"train_loss": -27.1951847076416, "global_step": 448489, "epoch": 5403} {"train_loss": -26.75996971130371, "global_step": 448490, "epoch": 5403} {"train_loss": -27.274198532104492, "global_step": 448491, "epoch": 5403} {"train_loss": -27.194555282592773, "global_step": 448492, "epoch": 5403} {"train_loss": -26.795896530151367, "global_step": 448493, "epoch": 5403} {"train_loss": -27.035449981689453, "global_step": 448494, "epoch": 5403} {"train_loss": -27.23798942565918, "global_step": 448495, "epoch": 5403} {"train_loss": -27.119760513305664, "global_step": 448496, "epoch": 5403} {"train_loss": -27.395999908447266, "global_step": 448497, "epoch": 5403} {"train_loss": -27.03662109375, "global_step": 448498, "epoch": 5403} {"train_loss": -26.956037521362305, "global_step": 448499, "epoch": 5403} {"train_loss": -27.114294052124023, "global_step": 448500, "epoch": 5403} {"train_loss": -27.115131378173828, "global_step": 448501, "epoch": 5403} {"train_loss": -27.356000900268555, "global_step": 448502, "epoch": 5403} {"train_loss": -27.186315536499023, "global_step": 448503, "epoch": 5403} {"train_loss": -27.20757484436035, "global_step": 448504, "epoch": 5403} {"train_loss": -27.104650497436523, "global_step": 448505, "epoch": 5403} {"train_loss": -26.929401397705078, "global_step": 448506, "epoch": 5403} {"train_loss": -27.113525390625, "global_step": 448507, "epoch": 5403} {"train_loss": -27.083810806274414, "global_step": 448508, "epoch": 5403} {"train_loss": -27.419599533081055, "global_step": 448509, "epoch": 5403} {"train_loss": -27.553760528564453, "global_step": 448510, "epoch": 5403} {"train_loss": -27.2729549407959, "global_step": 448511, "epoch": 5403} {"train_loss": -27.038610458374023, "global_step": 448512, "epoch": 5403} {"train_loss": -26.634536743164062, "global_step": 448513, "epoch": 5403} {"train_loss": -26.82642936706543, "global_step": 448514, "epoch": 5403} {"train_loss": -27.037063598632812, "global_step": 448515, "epoch": 5403} {"train_loss": -27.426471710205078, "global_step": 448516, "epoch": 5403} {"train_loss": -26.987905502319336, "global_step": 448517, "epoch": 5403} {"train_loss": -26.917768478393555, "global_step": 448518, "epoch": 5403} {"train_loss": -26.75931167602539, "global_step": 448519, "epoch": 5403} {"train_loss": -26.839746475219727, "global_step": 448520, "epoch": 5403} {"train_loss": -27.104888916015625, "global_step": 448521, "epoch": 5403} {"train_loss": -27.111082077026367, "global_step": 448522, "epoch": 5403} {"train_loss": -26.855701446533203, "global_step": 448523, "epoch": 5403} {"train_loss": -26.696760177612305, "global_step": 448524, "epoch": 5403} {"train_loss": -26.938690185546875, "global_step": 448525, "epoch": 5403} {"train_loss": -27.14459228515625, "global_step": 448526, "epoch": 5403} {"train_loss": -27.057693481445312, "global_step": 448527, "epoch": 5403} {"train_loss": -26.799640655517578, "global_step": 448528, "epoch": 5403} {"train_loss": -26.821271896362305, "global_step": 448529, "epoch": 5403} {"train_loss": -27.069278717041016, "global_step": 448530, "epoch": 5403} {"train_loss": -26.768714996705572, "global_step": 448531, "epoch": 5403, "val_loss": 6716094.0} {"train_loss": -26.76068687438965, "global_step": 448532, "epoch": 5404} {"train_loss": -26.125818252563477, "global_step": 448533, "epoch": 5404} {"train_loss": -26.426786422729492, "global_step": 448534, "epoch": 5404} {"train_loss": -27.008697509765625, "global_step": 448535, "epoch": 5404} {"train_loss": -26.53352928161621, "global_step": 448536, "epoch": 5404} {"train_loss": -26.514387130737305, "global_step": 448537, "epoch": 5404} {"train_loss": -26.699331283569336, "global_step": 448538, "epoch": 5404} {"train_loss": -26.480276107788086, "global_step": 448539, "epoch": 5404} {"train_loss": -26.901092529296875, "global_step": 448540, "epoch": 5404} {"train_loss": -26.90570068359375, "global_step": 448541, "epoch": 5404} {"train_loss": -26.66691017150879, "global_step": 448542, "epoch": 5404} {"train_loss": -26.917545318603516, "global_step": 448543, "epoch": 5404} {"train_loss": -26.917600631713867, "global_step": 448544, "epoch": 5404} {"train_loss": -26.995838165283203, "global_step": 448545, "epoch": 5404} {"train_loss": -26.95473289489746, "global_step": 448546, "epoch": 5404} {"train_loss": -26.945959091186523, "global_step": 448547, "epoch": 5404} {"train_loss": -26.677234649658203, "global_step": 448548, "epoch": 5404} {"train_loss": -27.095367431640625, "global_step": 448549, "epoch": 5404} {"train_loss": -27.130664825439453, "global_step": 448550, "epoch": 5404} {"train_loss": -26.99094009399414, "global_step": 448551, "epoch": 5404} {"train_loss": -26.630218505859375, "global_step": 448552, "epoch": 5404} {"train_loss": -27.10264015197754, "global_step": 448553, "epoch": 5404} {"train_loss": -27.22257423400879, "global_step": 448554, "epoch": 5404} {"train_loss": -26.75494384765625, "global_step": 448555, "epoch": 5404} {"train_loss": -26.958942413330078, "global_step": 448556, "epoch": 5404} {"train_loss": -27.146472930908203, "global_step": 448557, "epoch": 5404} {"train_loss": -27.284305572509766, "global_step": 448558, "epoch": 5404} {"train_loss": -27.039966583251953, "global_step": 448559, "epoch": 5404} {"train_loss": -27.373523712158203, "global_step": 448560, "epoch": 5404} {"train_loss": -27.623016357421875, "global_step": 448561, "epoch": 5404} {"train_loss": -27.100717544555664, "global_step": 448562, "epoch": 5404} {"train_loss": -26.805479049682617, "global_step": 448563, "epoch": 5404} {"train_loss": -27.087438583374023, "global_step": 448564, "epoch": 5404} {"train_loss": -27.1617374420166, "global_step": 448565, "epoch": 5404} {"train_loss": -26.981704711914062, "global_step": 448566, "epoch": 5404} {"train_loss": -27.472116470336914, "global_step": 448567, "epoch": 5404} {"train_loss": -27.008955001831055, "global_step": 448568, "epoch": 5404} {"train_loss": -26.843809127807617, "global_step": 448569, "epoch": 5404} {"train_loss": -26.839466094970703, "global_step": 448570, "epoch": 5404} {"train_loss": -26.94319725036621, "global_step": 448571, "epoch": 5404} {"train_loss": -27.36775779724121, "global_step": 448572, "epoch": 5404} {"train_loss": -27.35853385925293, "global_step": 448573, "epoch": 5404} {"train_loss": -27.139801025390625, "global_step": 448574, "epoch": 5404} {"train_loss": -27.45564079284668, "global_step": 448575, "epoch": 5404} {"train_loss": -27.390430450439453, "global_step": 448576, "epoch": 5404} {"train_loss": -26.99481773376465, "global_step": 448577, "epoch": 5404} {"train_loss": -27.169696807861328, "global_step": 448578, "epoch": 5404} {"train_loss": -27.490293502807617, "global_step": 448579, "epoch": 5404} {"train_loss": -27.108001708984375, "global_step": 448580, "epoch": 5404} {"train_loss": -27.25775146484375, "global_step": 448581, "epoch": 5404} {"train_loss": -26.623517990112305, "global_step": 448582, "epoch": 5404} {"train_loss": -26.0399227142334, "global_step": 448583, "epoch": 5404} {"train_loss": -25.193740844726562, "global_step": 448584, "epoch": 5404} {"train_loss": -25.553007125854492, "global_step": 448585, "epoch": 5404} {"train_loss": -26.038373947143555, "global_step": 448586, "epoch": 5404} {"train_loss": -26.246564865112305, "global_step": 448587, "epoch": 5404} {"train_loss": -27.242029190063477, "global_step": 448588, "epoch": 5404} {"train_loss": -25.95796012878418, "global_step": 448589, "epoch": 5404} {"train_loss": -26.160940170288086, "global_step": 448590, "epoch": 5404} {"train_loss": -26.62782096862793, "global_step": 448591, "epoch": 5404} {"train_loss": -26.264389038085938, "global_step": 448592, "epoch": 5404} {"train_loss": -26.704145431518555, "global_step": 448593, "epoch": 5404} {"train_loss": -26.499170303344727, "global_step": 448594, "epoch": 5404} {"train_loss": -26.6314640045166, "global_step": 448595, "epoch": 5404} {"train_loss": -26.764144897460938, "global_step": 448596, "epoch": 5404} {"train_loss": -26.56595230102539, "global_step": 448597, "epoch": 5404} {"train_loss": -26.754968643188477, "global_step": 448598, "epoch": 5404} {"train_loss": -26.75440788269043, "global_step": 448599, "epoch": 5404} {"train_loss": -26.710554122924805, "global_step": 448600, "epoch": 5404} {"train_loss": -26.65717887878418, "global_step": 448601, "epoch": 5404} {"train_loss": -26.690460205078125, "global_step": 448602, "epoch": 5404} {"train_loss": -26.632169723510742, "global_step": 448603, "epoch": 5404} {"train_loss": -26.59332275390625, "global_step": 448604, "epoch": 5404} {"train_loss": -26.46076774597168, "global_step": 448605, "epoch": 5404} {"train_loss": -26.744873046875, "global_step": 448606, "epoch": 5404} {"train_loss": -26.776880264282227, "global_step": 448607, "epoch": 5404} {"train_loss": -26.81488037109375, "global_step": 448608, "epoch": 5404} {"train_loss": -26.885791778564453, "global_step": 448609, "epoch": 5404} {"train_loss": -26.860477447509766, "global_step": 448610, "epoch": 5404} {"train_loss": -26.900903701782227, "global_step": 448611, "epoch": 5404} {"train_loss": -26.53089714050293, "global_step": 448612, "epoch": 5404} {"train_loss": -27.02009391784668, "global_step": 448613, "epoch": 5404} {"train_loss": -26.80731872190912, "global_step": 448614, "epoch": 5404, "val_loss": 6590514.0} {"train_loss": -26.54961585998535, "global_step": 448615, "epoch": 5405} {"train_loss": -26.536779403686523, "global_step": 448616, "epoch": 5405} {"train_loss": -26.40852165222168, "global_step": 448617, "epoch": 5405} {"train_loss": -27.006772994995117, "global_step": 448618, "epoch": 5405} {"train_loss": -26.933130264282227, "global_step": 448619, "epoch": 5405} {"train_loss": -26.734649658203125, "global_step": 448620, "epoch": 5405} {"train_loss": -26.433368682861328, "global_step": 448621, "epoch": 5405} {"train_loss": -26.5284423828125, "global_step": 448622, "epoch": 5405} {"train_loss": -26.5530948638916, "global_step": 448623, "epoch": 5405} {"train_loss": -26.765615463256836, "global_step": 448624, "epoch": 5405} {"train_loss": -27.046283721923828, "global_step": 448625, "epoch": 5405} {"train_loss": -26.861377716064453, "global_step": 448626, "epoch": 5405} {"train_loss": -27.031452178955078, "global_step": 448627, "epoch": 5405} {"train_loss": -27.151599884033203, "global_step": 448628, "epoch": 5405} {"train_loss": -26.763025283813477, "global_step": 448629, "epoch": 5405} {"train_loss": -26.604639053344727, "global_step": 448630, "epoch": 5405} {"train_loss": -27.178064346313477, "global_step": 448631, "epoch": 5405} {"train_loss": -27.200056076049805, "global_step": 448632, "epoch": 5405} {"train_loss": -27.090551376342773, "global_step": 448633, "epoch": 5405} {"train_loss": -27.22722816467285, "global_step": 448634, "epoch": 5405} {"train_loss": -27.1943302154541, "global_step": 448635, "epoch": 5405} {"train_loss": -26.70865821838379, "global_step": 448636, "epoch": 5405} {"train_loss": -27.176115036010742, "global_step": 448637, "epoch": 5405} {"train_loss": -27.36805534362793, "global_step": 448638, "epoch": 5405} {"train_loss": -27.03619956970215, "global_step": 448639, "epoch": 5405} {"train_loss": -27.076416015625, "global_step": 448640, "epoch": 5405} {"train_loss": -27.385040283203125, "global_step": 448641, "epoch": 5405} {"train_loss": -27.645429611206055, "global_step": 448642, "epoch": 5405} {"train_loss": -27.056318283081055, "global_step": 448643, "epoch": 5405} {"train_loss": -27.066991806030273, "global_step": 448644, "epoch": 5405} {"train_loss": -27.235464096069336, "global_step": 448645, "epoch": 5405} {"train_loss": -27.013141632080078, "global_step": 448646, "epoch": 5405} {"train_loss": -27.519956588745117, "global_step": 448647, "epoch": 5405} {"train_loss": -27.234167098999023, "global_step": 448648, "epoch": 5405} {"train_loss": -27.22430992126465, "global_step": 448649, "epoch": 5405} {"train_loss": -27.369556427001953, "global_step": 448650, "epoch": 5405} {"train_loss": -27.079694747924805, "global_step": 448651, "epoch": 5405} {"train_loss": -26.97516441345215, "global_step": 448652, "epoch": 5405} {"train_loss": -26.412839889526367, "global_step": 448653, "epoch": 5405} {"train_loss": -26.604642868041992, "global_step": 448654, "epoch": 5405} {"train_loss": -26.583648681640625, "global_step": 448655, "epoch": 5405} {"train_loss": -26.655675888061523, "global_step": 448656, "epoch": 5405} {"train_loss": -27.598007202148438, "global_step": 448657, "epoch": 5405} {"train_loss": -27.24713706970215, "global_step": 448658, "epoch": 5405} {"train_loss": -26.939014434814453, "global_step": 448659, "epoch": 5405} {"train_loss": -26.586639404296875, "global_step": 448660, "epoch": 5405} {"train_loss": -27.294519424438477, "global_step": 448661, "epoch": 5405} {"train_loss": -27.370656967163086, "global_step": 448662, "epoch": 5405} {"train_loss": -27.131179809570312, "global_step": 448663, "epoch": 5405} {"train_loss": -26.75908851623535, "global_step": 448664, "epoch": 5405} {"train_loss": -26.778919219970703, "global_step": 448665, "epoch": 5405} {"train_loss": -26.906335830688477, "global_step": 448666, "epoch": 5405} {"train_loss": -26.755313873291016, "global_step": 448667, "epoch": 5405} {"train_loss": -26.582904815673828, "global_step": 448668, "epoch": 5405} {"train_loss": -25.882131576538086, "global_step": 448669, "epoch": 5405} {"train_loss": -26.912397384643555, "global_step": 448670, "epoch": 5405} {"train_loss": -26.785898208618164, "global_step": 448671, "epoch": 5405} {"train_loss": -27.027490615844727, "global_step": 448672, "epoch": 5405} {"train_loss": -26.80767822265625, "global_step": 448673, "epoch": 5405} {"train_loss": -26.700300216674805, "global_step": 448674, "epoch": 5405} {"train_loss": -26.953231811523438, "global_step": 448675, "epoch": 5405} {"train_loss": -26.627227783203125, "global_step": 448676, "epoch": 5405} {"train_loss": -27.411718368530273, "global_step": 448677, "epoch": 5405} {"train_loss": -27.015295028686523, "global_step": 448678, "epoch": 5405} {"train_loss": -27.285297393798828, "global_step": 448679, "epoch": 5405} {"train_loss": -26.69173240661621, "global_step": 448680, "epoch": 5405} {"train_loss": -27.008163452148438, "global_step": 448681, "epoch": 5405} {"train_loss": -27.070606231689453, "global_step": 448682, "epoch": 5405} {"train_loss": -27.167896270751953, "global_step": 448683, "epoch": 5405} {"train_loss": -27.117273330688477, "global_step": 448684, "epoch": 5405} {"train_loss": -27.05244255065918, "global_step": 448685, "epoch": 5405} {"train_loss": -27.487171173095703, "global_step": 448686, "epoch": 5405} {"train_loss": -27.05755043029785, "global_step": 448687, "epoch": 5405} {"train_loss": -27.271326065063477, "global_step": 448688, "epoch": 5405} {"train_loss": -27.296783447265625, "global_step": 448689, "epoch": 5405} {"train_loss": -27.191205978393555, "global_step": 448690, "epoch": 5405} {"train_loss": -27.03606605529785, "global_step": 448691, "epoch": 5405} {"train_loss": -27.02250099182129, "global_step": 448692, "epoch": 5405} {"train_loss": -27.11341667175293, "global_step": 448693, "epoch": 5405} {"train_loss": -27.221786499023438, "global_step": 448694, "epoch": 5405} {"train_loss": -26.807416915893555, "global_step": 448695, "epoch": 5405} {"train_loss": -26.439544677734375, "global_step": 448696, "epoch": 5405} {"train_loss": -26.970019283064875, "global_step": 448697, "epoch": 5405, "val_loss": 6747779.5} {"train_loss": -19.29937171936035, "global_step": 448698, "epoch": 5406} {"train_loss": -23.54717445373535, "global_step": 448699, "epoch": 5406} {"train_loss": -21.752717971801758, "global_step": 448700, "epoch": 5406} {"train_loss": -23.97000503540039, "global_step": 448701, "epoch": 5406} {"train_loss": -23.371070861816406, "global_step": 448702, "epoch": 5406} {"train_loss": -23.64674186706543, "global_step": 448703, "epoch": 5406} {"train_loss": -24.274972915649414, "global_step": 448704, "epoch": 5406} {"train_loss": -24.546743392944336, "global_step": 448705, "epoch": 5406} {"train_loss": -24.400476455688477, "global_step": 448706, "epoch": 5406} {"train_loss": -24.895816802978516, "global_step": 448707, "epoch": 5406} {"train_loss": -24.419536590576172, "global_step": 448708, "epoch": 5406} {"train_loss": -24.49298667907715, "global_step": 448709, "epoch": 5406} {"train_loss": -24.96400260925293, "global_step": 448710, "epoch": 5406} {"train_loss": -25.17581558227539, "global_step": 448711, "epoch": 5406} {"train_loss": -24.83327293395996, "global_step": 448712, "epoch": 5406} {"train_loss": -25.21832847595215, "global_step": 448713, "epoch": 5406} {"train_loss": -25.6405086517334, "global_step": 448714, "epoch": 5406} {"train_loss": -24.793344497680664, "global_step": 448715, "epoch": 5406} {"train_loss": -25.290693283081055, "global_step": 448716, "epoch": 5406} {"train_loss": -24.98922348022461, "global_step": 448717, "epoch": 5406} {"train_loss": -25.348783493041992, "global_step": 448718, "epoch": 5406} {"train_loss": -25.586877822875977, "global_step": 448719, "epoch": 5406} {"train_loss": -25.582563400268555, "global_step": 448720, "epoch": 5406} {"train_loss": -25.304182052612305, "global_step": 448721, "epoch": 5406} {"train_loss": -25.683820724487305, "global_step": 448722, "epoch": 5406} {"train_loss": -25.643659591674805, "global_step": 448723, "epoch": 5406} {"train_loss": -25.9057559967041, "global_step": 448724, "epoch": 5406} {"train_loss": -25.847421646118164, "global_step": 448725, "epoch": 5406} {"train_loss": -25.833057403564453, "global_step": 448726, "epoch": 5406} {"train_loss": -25.978845596313477, "global_step": 448727, "epoch": 5406} {"train_loss": -26.067102432250977, "global_step": 448728, "epoch": 5406} {"train_loss": -26.197473526000977, "global_step": 448729, "epoch": 5406} {"train_loss": -26.061126708984375, "global_step": 448730, "epoch": 5406} {"train_loss": -25.986499786376953, "global_step": 448731, "epoch": 5406} {"train_loss": -26.661718368530273, "global_step": 448732, "epoch": 5406} {"train_loss": -25.93560791015625, "global_step": 448733, "epoch": 5406} {"train_loss": -26.158533096313477, "global_step": 448734, "epoch": 5406} {"train_loss": -26.413137435913086, "global_step": 448735, "epoch": 5406} {"train_loss": -26.243139266967773, "global_step": 448736, "epoch": 5406} {"train_loss": -26.065353393554688, "global_step": 448737, "epoch": 5406} {"train_loss": -26.424421310424805, "global_step": 448738, "epoch": 5406} {"train_loss": -26.441421508789062, "global_step": 448739, "epoch": 5406} {"train_loss": -26.567346572875977, "global_step": 448740, "epoch": 5406} {"train_loss": -26.40865135192871, "global_step": 448741, "epoch": 5406} {"train_loss": -26.810102462768555, "global_step": 448742, "epoch": 5406} {"train_loss": -26.347082138061523, "global_step": 448743, "epoch": 5406} {"train_loss": -26.533899307250977, "global_step": 448744, "epoch": 5406} {"train_loss": -26.826501846313477, "global_step": 448745, "epoch": 5406} {"train_loss": -26.721576690673828, "global_step": 448746, "epoch": 5406} {"train_loss": -26.47579002380371, "global_step": 448747, "epoch": 5406} {"train_loss": -26.5140438079834, "global_step": 448748, "epoch": 5406} {"train_loss": -26.685590744018555, "global_step": 448749, "epoch": 5406} {"train_loss": -26.63177490234375, "global_step": 448750, "epoch": 5406} {"train_loss": -27.072824478149414, "global_step": 448751, "epoch": 5406} {"train_loss": -26.591455459594727, "global_step": 448752, "epoch": 5406} {"train_loss": -26.60931968688965, "global_step": 448753, "epoch": 5406} {"train_loss": -27.17032814025879, "global_step": 448754, "epoch": 5406} {"train_loss": -26.912078857421875, "global_step": 448755, "epoch": 5406} {"train_loss": -26.72298240661621, "global_step": 448756, "epoch": 5406} {"train_loss": -27.03946876525879, "global_step": 448757, "epoch": 5406} {"train_loss": -26.66932487487793, "global_step": 448758, "epoch": 5406} {"train_loss": -27.135879516601562, "global_step": 448759, "epoch": 5406} {"train_loss": -26.82059097290039, "global_step": 448760, "epoch": 5406} {"train_loss": -26.724777221679688, "global_step": 448761, "epoch": 5406} {"train_loss": -27.14064598083496, "global_step": 448762, "epoch": 5406} {"train_loss": -27.17706871032715, "global_step": 448763, "epoch": 5406} {"train_loss": -27.118988037109375, "global_step": 448764, "epoch": 5406} {"train_loss": -26.99329948425293, "global_step": 448765, "epoch": 5406} {"train_loss": -26.864171981811523, "global_step": 448766, "epoch": 5406} {"train_loss": -27.122079849243164, "global_step": 448767, "epoch": 5406} {"train_loss": -27.104873657226562, "global_step": 448768, "epoch": 5406} {"train_loss": -26.895889282226562, "global_step": 448769, "epoch": 5406} {"train_loss": -26.786869049072266, "global_step": 448770, "epoch": 5406} {"train_loss": -27.075397491455078, "global_step": 448771, "epoch": 5406} {"train_loss": -26.70945167541504, "global_step": 448772, "epoch": 5406} {"train_loss": -27.342248916625977, "global_step": 448773, "epoch": 5406} {"train_loss": -27.085187911987305, "global_step": 448774, "epoch": 5406} {"train_loss": -27.013458251953125, "global_step": 448775, "epoch": 5406} {"train_loss": -26.663227081298828, "global_step": 448776, "epoch": 5406} {"train_loss": -26.972553253173828, "global_step": 448777, "epoch": 5406} {"train_loss": -26.948022842407227, "global_step": 448778, "epoch": 5406} {"train_loss": -27.005756378173828, "global_step": 448779, "epoch": 5406} {"train_loss": -25.968618829566314, "global_step": 448780, "epoch": 5406, "val_loss": 6555768.0} {"train_loss": -26.32977867126465, "global_step": 448781, "epoch": 5407} {"train_loss": -25.525901794433594, "global_step": 448782, "epoch": 5407} {"train_loss": -25.888996124267578, "global_step": 448783, "epoch": 5407} {"train_loss": -26.291025161743164, "global_step": 448784, "epoch": 5407} {"train_loss": -26.42567253112793, "global_step": 448785, "epoch": 5407} {"train_loss": -26.70869255065918, "global_step": 448786, "epoch": 5407} {"train_loss": -26.53093910217285, "global_step": 448787, "epoch": 5407} {"train_loss": -26.569482803344727, "global_step": 448788, "epoch": 5407} {"train_loss": -26.81731605529785, "global_step": 448789, "epoch": 5407} {"train_loss": -26.494199752807617, "global_step": 448790, "epoch": 5407} {"train_loss": -26.7606201171875, "global_step": 448791, "epoch": 5407} {"train_loss": -26.607105255126953, "global_step": 448792, "epoch": 5407} {"train_loss": -26.543827056884766, "global_step": 448793, "epoch": 5407} {"train_loss": -26.557825088500977, "global_step": 448794, "epoch": 5407} {"train_loss": -26.83367347717285, "global_step": 448795, "epoch": 5407} {"train_loss": -27.122364044189453, "global_step": 448796, "epoch": 5407} {"train_loss": -26.4512882232666, "global_step": 448797, "epoch": 5407} {"train_loss": -26.75306510925293, "global_step": 448798, "epoch": 5407} {"train_loss": -26.71734046936035, "global_step": 448799, "epoch": 5407} {"train_loss": -26.84284019470215, "global_step": 448800, "epoch": 5407} {"train_loss": -27.05258560180664, "global_step": 448801, "epoch": 5407} {"train_loss": -26.783308029174805, "global_step": 448802, "epoch": 5407} {"train_loss": -26.94504165649414, "global_step": 448803, "epoch": 5407} {"train_loss": -27.06989097595215, "global_step": 448804, "epoch": 5407} {"train_loss": -27.09218406677246, "global_step": 448805, "epoch": 5407} {"train_loss": -26.62965965270996, "global_step": 448806, "epoch": 5407} {"train_loss": -26.81424331665039, "global_step": 448807, "epoch": 5407} {"train_loss": -26.965246200561523, "global_step": 448808, "epoch": 5407} {"train_loss": -27.085561752319336, "global_step": 448809, "epoch": 5407} {"train_loss": -27.089513778686523, "global_step": 448810, "epoch": 5407} {"train_loss": -27.30035972595215, "global_step": 448811, "epoch": 5407} {"train_loss": -27.199316024780273, "global_step": 448812, "epoch": 5407} {"train_loss": -26.963171005249023, "global_step": 448813, "epoch": 5407} {"train_loss": -26.675107955932617, "global_step": 448814, "epoch": 5407} {"train_loss": -27.275360107421875, "global_step": 448815, "epoch": 5407} {"train_loss": -27.277236938476562, "global_step": 448816, "epoch": 5407} {"train_loss": -27.034833908081055, "global_step": 448817, "epoch": 5407} {"train_loss": -27.00156021118164, "global_step": 448818, "epoch": 5407} {"train_loss": -27.190893173217773, "global_step": 448819, "epoch": 5407} {"train_loss": -26.92787742614746, "global_step": 448820, "epoch": 5407} {"train_loss": -27.014129638671875, "global_step": 448821, "epoch": 5407} {"train_loss": -27.309534072875977, "global_step": 448822, "epoch": 5407} {"train_loss": -27.36201286315918, "global_step": 448823, "epoch": 5407} {"train_loss": -27.434778213500977, "global_step": 448824, "epoch": 5407} {"train_loss": -27.11920738220215, "global_step": 448825, "epoch": 5407} {"train_loss": -26.913909912109375, "global_step": 448826, "epoch": 5407} {"train_loss": -27.382965087890625, "global_step": 448827, "epoch": 5407} {"train_loss": -27.08552360534668, "global_step": 448828, "epoch": 5407} {"train_loss": -27.34724998474121, "global_step": 448829, "epoch": 5407} {"train_loss": -26.813461303710938, "global_step": 448830, "epoch": 5407} {"train_loss": -27.042097091674805, "global_step": 448831, "epoch": 5407} {"train_loss": -26.72776222229004, "global_step": 448832, "epoch": 5407} {"train_loss": -27.201251983642578, "global_step": 448833, "epoch": 5407} {"train_loss": -27.030750274658203, "global_step": 448834, "epoch": 5407} {"train_loss": -26.91472816467285, "global_step": 448835, "epoch": 5407} {"train_loss": -27.393991470336914, "global_step": 448836, "epoch": 5407} {"train_loss": -26.732391357421875, "global_step": 448837, "epoch": 5407} {"train_loss": -27.219518661499023, "global_step": 448838, "epoch": 5407} {"train_loss": -27.043569564819336, "global_step": 448839, "epoch": 5407} {"train_loss": -27.154443740844727, "global_step": 448840, "epoch": 5407} {"train_loss": -27.27735710144043, "global_step": 448841, "epoch": 5407} {"train_loss": -27.302091598510742, "global_step": 448842, "epoch": 5407} {"train_loss": -27.01820182800293, "global_step": 448843, "epoch": 5407} {"train_loss": -27.1008358001709, "global_step": 448844, "epoch": 5407} {"train_loss": -27.111988067626953, "global_step": 448845, "epoch": 5407} {"train_loss": -26.74721336364746, "global_step": 448846, "epoch": 5407} {"train_loss": -26.817768096923828, "global_step": 448847, "epoch": 5407} {"train_loss": -27.171875, "global_step": 448848, "epoch": 5407} {"train_loss": -26.803903579711914, "global_step": 448849, "epoch": 5407} {"train_loss": -26.722461700439453, "global_step": 448850, "epoch": 5407} {"train_loss": -27.27302360534668, "global_step": 448851, "epoch": 5407} {"train_loss": -27.091283798217773, "global_step": 448852, "epoch": 5407} {"train_loss": -26.859750747680664, "global_step": 448853, "epoch": 5407} {"train_loss": -27.129199981689453, "global_step": 448854, "epoch": 5407} {"train_loss": -27.233198165893555, "global_step": 448855, "epoch": 5407} {"train_loss": -27.186315536499023, "global_step": 448856, "epoch": 5407} {"train_loss": -27.365802764892578, "global_step": 448857, "epoch": 5407} {"train_loss": -26.926654815673828, "global_step": 448858, "epoch": 5407} {"train_loss": -26.981855392456055, "global_step": 448859, "epoch": 5407} {"train_loss": -26.788837432861328, "global_step": 448860, "epoch": 5407} {"train_loss": -27.387807846069336, "global_step": 448861, "epoch": 5407} {"train_loss": -27.222379684448242, "global_step": 448862, "epoch": 5407} {"train_loss": -26.938993522919805, "global_step": 448863, "epoch": 5407, "val_loss": 6493669.0} {"train_loss": -26.449811935424805, "global_step": 448864, "epoch": 5408} {"train_loss": -26.731794357299805, "global_step": 448865, "epoch": 5408} {"train_loss": -26.763717651367188, "global_step": 448866, "epoch": 5408} {"train_loss": -26.7556095123291, "global_step": 448867, "epoch": 5408} {"train_loss": -26.414403915405273, "global_step": 448868, "epoch": 5408} {"train_loss": -26.322378158569336, "global_step": 448869, "epoch": 5408} {"train_loss": -26.734586715698242, "global_step": 448870, "epoch": 5408} {"train_loss": -26.75547218322754, "global_step": 448871, "epoch": 5408} {"train_loss": -26.271554946899414, "global_step": 448872, "epoch": 5408} {"train_loss": -27.123151779174805, "global_step": 448873, "epoch": 5408} {"train_loss": -26.68140983581543, "global_step": 448874, "epoch": 5408} {"train_loss": -26.314884185791016, "global_step": 448875, "epoch": 5408} {"train_loss": -26.560810089111328, "global_step": 448876, "epoch": 5408} {"train_loss": -27.064529418945312, "global_step": 448877, "epoch": 5408} {"train_loss": -26.611557006835938, "global_step": 448878, "epoch": 5408} {"train_loss": -27.075977325439453, "global_step": 448879, "epoch": 5408} {"train_loss": -27.141530990600586, "global_step": 448880, "epoch": 5408} {"train_loss": -26.938068389892578, "global_step": 448881, "epoch": 5408} {"train_loss": -26.92864990234375, "global_step": 448882, "epoch": 5408} {"train_loss": -27.029367446899414, "global_step": 448883, "epoch": 5408} {"train_loss": -26.96954917907715, "global_step": 448884, "epoch": 5408} {"train_loss": -26.810026168823242, "global_step": 448885, "epoch": 5408} {"train_loss": -26.746280670166016, "global_step": 448886, "epoch": 5408} {"train_loss": -27.02640724182129, "global_step": 448887, "epoch": 5408} {"train_loss": -26.983503341674805, "global_step": 448888, "epoch": 5408} {"train_loss": -27.15144157409668, "global_step": 448889, "epoch": 5408} {"train_loss": -27.14886474609375, "global_step": 448890, "epoch": 5408} {"train_loss": -27.307241439819336, "global_step": 448891, "epoch": 5408} {"train_loss": -26.835773468017578, "global_step": 448892, "epoch": 5408} {"train_loss": -26.999799728393555, "global_step": 448893, "epoch": 5408} {"train_loss": -27.1503849029541, "global_step": 448894, "epoch": 5408} {"train_loss": -27.224512100219727, "global_step": 448895, "epoch": 5408} {"train_loss": -27.519983291625977, "global_step": 448896, "epoch": 5408} {"train_loss": -27.13984489440918, "global_step": 448897, "epoch": 5408} {"train_loss": -27.3847599029541, "global_step": 448898, "epoch": 5408} {"train_loss": -27.133056640625, "global_step": 448899, "epoch": 5408} {"train_loss": -27.319564819335938, "global_step": 448900, "epoch": 5408} {"train_loss": -27.18836784362793, "global_step": 448901, "epoch": 5408} {"train_loss": -27.035531997680664, "global_step": 448902, "epoch": 5408} {"train_loss": -26.802724838256836, "global_step": 448903, "epoch": 5408} {"train_loss": -27.22489356994629, "global_step": 448904, "epoch": 5408} {"train_loss": -27.022369384765625, "global_step": 448905, "epoch": 5408} {"train_loss": -26.9099178314209, "global_step": 448906, "epoch": 5408} {"train_loss": -27.145090103149414, "global_step": 448907, "epoch": 5408} {"train_loss": -27.26885986328125, "global_step": 448908, "epoch": 5408} {"train_loss": -27.276966094970703, "global_step": 448909, "epoch": 5408} {"train_loss": -27.233488082885742, "global_step": 448910, "epoch": 5408} {"train_loss": -27.294591903686523, "global_step": 448911, "epoch": 5408} {"train_loss": -27.22074317932129, "global_step": 448912, "epoch": 5408} {"train_loss": -27.140262603759766, "global_step": 448913, "epoch": 5408} {"train_loss": -27.238922119140625, "global_step": 448914, "epoch": 5408} {"train_loss": -27.059186935424805, "global_step": 448915, "epoch": 5408} {"train_loss": -26.77362632751465, "global_step": 448916, "epoch": 5408} {"train_loss": -26.920257568359375, "global_step": 448917, "epoch": 5408} {"train_loss": -26.696237564086914, "global_step": 448918, "epoch": 5408} {"train_loss": -27.069448471069336, "global_step": 448919, "epoch": 5408} {"train_loss": -26.9515323638916, "global_step": 448920, "epoch": 5408} {"train_loss": -26.968473434448242, "global_step": 448921, "epoch": 5408} {"train_loss": -26.930622100830078, "global_step": 448922, "epoch": 5408} {"train_loss": -27.05245018005371, "global_step": 448923, "epoch": 5408} {"train_loss": -26.813562393188477, "global_step": 448924, "epoch": 5408} {"train_loss": -27.422473907470703, "global_step": 448925, "epoch": 5408} {"train_loss": -26.8483943939209, "global_step": 448926, "epoch": 5408} {"train_loss": -27.2154598236084, "global_step": 448927, "epoch": 5408} {"train_loss": -26.657413482666016, "global_step": 448928, "epoch": 5408} {"train_loss": -26.98539161682129, "global_step": 448929, "epoch": 5408} {"train_loss": -26.97959327697754, "global_step": 448930, "epoch": 5408} {"train_loss": -27.05792236328125, "global_step": 448931, "epoch": 5408} {"train_loss": -27.24116325378418, "global_step": 448932, "epoch": 5408} {"train_loss": -26.46683692932129, "global_step": 448933, "epoch": 5408} {"train_loss": -27.486087799072266, "global_step": 448934, "epoch": 5408} {"train_loss": -26.8834228515625, "global_step": 448935, "epoch": 5408} {"train_loss": -27.218463897705078, "global_step": 448936, "epoch": 5408} {"train_loss": -26.7209415435791, "global_step": 448937, "epoch": 5408} {"train_loss": -27.03236198425293, "global_step": 448938, "epoch": 5408} {"train_loss": -27.229772567749023, "global_step": 448939, "epoch": 5408} {"train_loss": -26.745868682861328, "global_step": 448940, "epoch": 5408} {"train_loss": -26.439985275268555, "global_step": 448941, "epoch": 5408} {"train_loss": -26.22454833984375, "global_step": 448942, "epoch": 5408} {"train_loss": -25.884103775024414, "global_step": 448943, "epoch": 5408} {"train_loss": -25.315431594848633, "global_step": 448944, "epoch": 5408} {"train_loss": -26.318115234375, "global_step": 448945, "epoch": 5408} {"train_loss": -26.9108445500753, "global_step": 448946, "epoch": 5408, "val_loss": 6536624.0} {"train_loss": -23.250877380371094, "global_step": 448947, "epoch": 5409} {"train_loss": -25.621417999267578, "global_step": 448948, "epoch": 5409} {"train_loss": -24.12259292602539, "global_step": 448949, "epoch": 5409} {"train_loss": -25.47488784790039, "global_step": 448950, "epoch": 5409} {"train_loss": -23.676767349243164, "global_step": 448951, "epoch": 5409} {"train_loss": -25.353012084960938, "global_step": 448952, "epoch": 5409} {"train_loss": -25.034381866455078, "global_step": 448953, "epoch": 5409} {"train_loss": -25.261014938354492, "global_step": 448954, "epoch": 5409} {"train_loss": -25.12165641784668, "global_step": 448955, "epoch": 5409} {"train_loss": -26.175405502319336, "global_step": 448956, "epoch": 5409} {"train_loss": -25.203937530517578, "global_step": 448957, "epoch": 5409} {"train_loss": -25.291353225708008, "global_step": 448958, "epoch": 5409} {"train_loss": -25.73445701599121, "global_step": 448959, "epoch": 5409} {"train_loss": -25.930326461791992, "global_step": 448960, "epoch": 5409} {"train_loss": -26.19797134399414, "global_step": 448961, "epoch": 5409} {"train_loss": -25.98026466369629, "global_step": 448962, "epoch": 5409} {"train_loss": -26.00483512878418, "global_step": 448963, "epoch": 5409} {"train_loss": -25.75955581665039, "global_step": 448964, "epoch": 5409} {"train_loss": -25.846689224243164, "global_step": 448965, "epoch": 5409} {"train_loss": -26.130826950073242, "global_step": 448966, "epoch": 5409} {"train_loss": -26.15389060974121, "global_step": 448967, "epoch": 5409} {"train_loss": -26.173486709594727, "global_step": 448968, "epoch": 5409} {"train_loss": -26.173303604125977, "global_step": 448969, "epoch": 5409} {"train_loss": -26.11256980895996, "global_step": 448970, "epoch": 5409} {"train_loss": -26.462751388549805, "global_step": 448971, "epoch": 5409} {"train_loss": -26.579710006713867, "global_step": 448972, "epoch": 5409} {"train_loss": -26.239105224609375, "global_step": 448973, "epoch": 5409} {"train_loss": -26.418842315673828, "global_step": 448974, "epoch": 5409} {"train_loss": -26.60296058654785, "global_step": 448975, "epoch": 5409} {"train_loss": -26.505996704101562, "global_step": 448976, "epoch": 5409} {"train_loss": -26.428251266479492, "global_step": 448977, "epoch": 5409} {"train_loss": -26.530858993530273, "global_step": 448978, "epoch": 5409} {"train_loss": -26.662582397460938, "global_step": 448979, "epoch": 5409} {"train_loss": -26.763248443603516, "global_step": 448980, "epoch": 5409} {"train_loss": -26.40089225769043, "global_step": 448981, "epoch": 5409} {"train_loss": -26.6373348236084, "global_step": 448982, "epoch": 5409} {"train_loss": -26.210983276367188, "global_step": 448983, "epoch": 5409} {"train_loss": -26.810626983642578, "global_step": 448984, "epoch": 5409} {"train_loss": -26.753223419189453, "global_step": 448985, "epoch": 5409} {"train_loss": -26.790597915649414, "global_step": 448986, "epoch": 5409} {"train_loss": -26.648181915283203, "global_step": 448987, "epoch": 5409} {"train_loss": -26.9194278717041, "global_step": 448988, "epoch": 5409} {"train_loss": -27.099369049072266, "global_step": 448989, "epoch": 5409} {"train_loss": -26.848285675048828, "global_step": 448990, "epoch": 5409} {"train_loss": -26.736820220947266, "global_step": 448991, "epoch": 5409} {"train_loss": -27.191436767578125, "global_step": 448992, "epoch": 5409} {"train_loss": -27.2061824798584, "global_step": 448993, "epoch": 5409} {"train_loss": -26.934980392456055, "global_step": 448994, "epoch": 5409} {"train_loss": -26.590961456298828, "global_step": 448995, "epoch": 5409} {"train_loss": -26.838272094726562, "global_step": 448996, "epoch": 5409} {"train_loss": -26.810333251953125, "global_step": 448997, "epoch": 5409} {"train_loss": -27.1648006439209, "global_step": 448998, "epoch": 5409} {"train_loss": -26.9238224029541, "global_step": 448999, "epoch": 5409} {"train_loss": -26.844684600830078, "global_step": 449000, "epoch": 5409} {"train_loss": -26.989337921142578, "global_step": 449001, "epoch": 5409} {"train_loss": -27.097843170166016, "global_step": 449002, "epoch": 5409} {"train_loss": -26.703826904296875, "global_step": 449003, "epoch": 5409} {"train_loss": -26.72147560119629, "global_step": 449004, "epoch": 5409} {"train_loss": -26.261398315429688, "global_step": 449005, "epoch": 5409} {"train_loss": -26.907703399658203, "global_step": 449006, "epoch": 5409} {"train_loss": -26.948989868164062, "global_step": 449007, "epoch": 5409} {"train_loss": -27.05921745300293, "global_step": 449008, "epoch": 5409} {"train_loss": -27.147016525268555, "global_step": 449009, "epoch": 5409} {"train_loss": -26.802631378173828, "global_step": 449010, "epoch": 5409} {"train_loss": -27.11708641052246, "global_step": 449011, "epoch": 5409} {"train_loss": -27.093713760375977, "global_step": 449012, "epoch": 5409} {"train_loss": -27.592588424682617, "global_step": 449013, "epoch": 5409} {"train_loss": -26.884033203125, "global_step": 449014, "epoch": 5409} {"train_loss": -27.12372398376465, "global_step": 449015, "epoch": 5409} {"train_loss": -26.98060417175293, "global_step": 449016, "epoch": 5409} {"train_loss": -27.165937423706055, "global_step": 449017, "epoch": 5409} {"train_loss": -27.437255859375, "global_step": 449018, "epoch": 5409} {"train_loss": -27.029367446899414, "global_step": 449019, "epoch": 5409} {"train_loss": -27.14605140686035, "global_step": 449020, "epoch": 5409} {"train_loss": -26.835092544555664, "global_step": 449021, "epoch": 5409} {"train_loss": -27.410669326782227, "global_step": 449022, "epoch": 5409} {"train_loss": -26.866601943969727, "global_step": 449023, "epoch": 5409} {"train_loss": -26.886133193969727, "global_step": 449024, "epoch": 5409} {"train_loss": -26.62546157836914, "global_step": 449025, "epoch": 5409} {"train_loss": -26.58363914489746, "global_step": 449026, "epoch": 5409} {"train_loss": -26.99920654296875, "global_step": 449027, "epoch": 5409} {"train_loss": -27.225910186767578, "global_step": 449028, "epoch": 5409} {"train_loss": -26.44783288886748, "global_step": 449029, "epoch": 5409, "val_loss": 6477536.0} {"train_loss": -24.635543823242188, "global_step": 449030, "epoch": 5410} {"train_loss": -24.968509674072266, "global_step": 449031, "epoch": 5410} {"train_loss": -26.55791664123535, "global_step": 449032, "epoch": 5410} {"train_loss": -25.232547760009766, "global_step": 449033, "epoch": 5410} {"train_loss": -26.649106979370117, "global_step": 449034, "epoch": 5410} {"train_loss": -25.859394073486328, "global_step": 449035, "epoch": 5410} {"train_loss": -26.332788467407227, "global_step": 449036, "epoch": 5410} {"train_loss": -26.34706687927246, "global_step": 449037, "epoch": 5410} {"train_loss": -26.458148956298828, "global_step": 449038, "epoch": 5410} {"train_loss": -26.73434829711914, "global_step": 449039, "epoch": 5410} {"train_loss": -26.349994659423828, "global_step": 449040, "epoch": 5410} {"train_loss": -26.544330596923828, "global_step": 449041, "epoch": 5410} {"train_loss": -26.720727920532227, "global_step": 449042, "epoch": 5410} {"train_loss": -26.66805076599121, "global_step": 449043, "epoch": 5410} {"train_loss": -26.471403121948242, "global_step": 449044, "epoch": 5410} {"train_loss": -26.586063385009766, "global_step": 449045, "epoch": 5410} {"train_loss": -26.22627067565918, "global_step": 449046, "epoch": 5410} {"train_loss": -26.793493270874023, "global_step": 449047, "epoch": 5410} {"train_loss": -26.793048858642578, "global_step": 449048, "epoch": 5410} {"train_loss": -26.73688316345215, "global_step": 449049, "epoch": 5410} {"train_loss": -26.80341148376465, "global_step": 449050, "epoch": 5410} {"train_loss": -26.849517822265625, "global_step": 449051, "epoch": 5410} {"train_loss": -26.84486961364746, "global_step": 449052, "epoch": 5410} {"train_loss": -27.021697998046875, "global_step": 449053, "epoch": 5410} {"train_loss": -26.584564208984375, "global_step": 449054, "epoch": 5410} {"train_loss": -27.15749168395996, "global_step": 449055, "epoch": 5410} {"train_loss": -26.7989501953125, "global_step": 449056, "epoch": 5410} {"train_loss": -26.7398624420166, "global_step": 449057, "epoch": 5410} {"train_loss": -27.225662231445312, "global_step": 449058, "epoch": 5410} {"train_loss": -27.266773223876953, "global_step": 449059, "epoch": 5410} {"train_loss": -27.17914390563965, "global_step": 449060, "epoch": 5410} {"train_loss": -27.187292098999023, "global_step": 449061, "epoch": 5410} {"train_loss": -26.666059494018555, "global_step": 449062, "epoch": 5410} {"train_loss": -27.256452560424805, "global_step": 449063, "epoch": 5410} {"train_loss": -26.746442794799805, "global_step": 449064, "epoch": 5410} {"train_loss": -26.99921989440918, "global_step": 449065, "epoch": 5410} {"train_loss": -27.28290367126465, "global_step": 449066, "epoch": 5410} {"train_loss": -27.364898681640625, "global_step": 449067, "epoch": 5410} {"train_loss": -26.848224639892578, "global_step": 449068, "epoch": 5410} {"train_loss": -27.029508590698242, "global_step": 449069, "epoch": 5410} {"train_loss": -26.935434341430664, "global_step": 449070, "epoch": 5410} {"train_loss": -27.211606979370117, "global_step": 449071, "epoch": 5410} {"train_loss": -26.8770694732666, "global_step": 449072, "epoch": 5410} {"train_loss": -27.088056564331055, "global_step": 449073, "epoch": 5410} {"train_loss": -27.115680694580078, "global_step": 449074, "epoch": 5410} {"train_loss": -26.673803329467773, "global_step": 449075, "epoch": 5410} {"train_loss": -27.1605224609375, "global_step": 449076, "epoch": 5410} {"train_loss": -27.301227569580078, "global_step": 449077, "epoch": 5410} {"train_loss": -27.178632736206055, "global_step": 449078, "epoch": 5410} {"train_loss": -26.979482650756836, "global_step": 449079, "epoch": 5410} {"train_loss": -26.73479652404785, "global_step": 449080, "epoch": 5410} {"train_loss": -27.131162643432617, "global_step": 449081, "epoch": 5410} {"train_loss": -27.284198760986328, "global_step": 449082, "epoch": 5410} {"train_loss": -27.174087524414062, "global_step": 449083, "epoch": 5410} {"train_loss": -26.940643310546875, "global_step": 449084, "epoch": 5410} {"train_loss": -27.079090118408203, "global_step": 449085, "epoch": 5410} {"train_loss": -27.506855010986328, "global_step": 449086, "epoch": 5410} {"train_loss": -27.295034408569336, "global_step": 449087, "epoch": 5410} {"train_loss": -26.8453369140625, "global_step": 449088, "epoch": 5410} {"train_loss": -26.925058364868164, "global_step": 449089, "epoch": 5410} {"train_loss": -27.1613712310791, "global_step": 449090, "epoch": 5410} {"train_loss": -27.053552627563477, "global_step": 449091, "epoch": 5410} {"train_loss": -27.19781494140625, "global_step": 449092, "epoch": 5410} {"train_loss": -27.1418514251709, "global_step": 449093, "epoch": 5410} {"train_loss": -27.165990829467773, "global_step": 449094, "epoch": 5410} {"train_loss": -27.32891273498535, "global_step": 449095, "epoch": 5410} {"train_loss": -26.9202938079834, "global_step": 449096, "epoch": 5410} {"train_loss": -27.22660255432129, "global_step": 449097, "epoch": 5410} {"train_loss": -26.4769287109375, "global_step": 449098, "epoch": 5410} {"train_loss": -26.26950454711914, "global_step": 449099, "epoch": 5410} {"train_loss": -26.966474533081055, "global_step": 449100, "epoch": 5410} {"train_loss": -27.343204498291016, "global_step": 449101, "epoch": 5410} {"train_loss": -27.099252700805664, "global_step": 449102, "epoch": 5410} {"train_loss": -27.314823150634766, "global_step": 449103, "epoch": 5410} {"train_loss": -27.231922149658203, "global_step": 449104, "epoch": 5410} {"train_loss": -27.386865615844727, "global_step": 449105, "epoch": 5410} {"train_loss": -27.181299209594727, "global_step": 449106, "epoch": 5410} {"train_loss": -27.049468994140625, "global_step": 449107, "epoch": 5410} {"train_loss": -27.29010581970215, "global_step": 449108, "epoch": 5410} {"train_loss": -27.169477462768555, "global_step": 449109, "epoch": 5410} {"train_loss": -27.160436630249023, "global_step": 449110, "epoch": 5410} {"train_loss": -27.139175415039062, "global_step": 449111, "epoch": 5410} {"train_loss": -26.877861620431922, "global_step": 449112, "epoch": 5410, "val_loss": 6532957.0} {"train_loss": -26.945343017578125, "global_step": 449113, "epoch": 5411} {"train_loss": -26.631834030151367, "global_step": 449114, "epoch": 5411} {"train_loss": -26.90626335144043, "global_step": 449115, "epoch": 5411} {"train_loss": -26.35068702697754, "global_step": 449116, "epoch": 5411} {"train_loss": -26.917499542236328, "global_step": 449117, "epoch": 5411} {"train_loss": -26.89759635925293, "global_step": 449118, "epoch": 5411} {"train_loss": -27.0960693359375, "global_step": 449119, "epoch": 5411} {"train_loss": -26.819934844970703, "global_step": 449120, "epoch": 5411} {"train_loss": -26.831073760986328, "global_step": 449121, "epoch": 5411} {"train_loss": -26.752729415893555, "global_step": 449122, "epoch": 5411} {"train_loss": -26.919347763061523, "global_step": 449123, "epoch": 5411} {"train_loss": -26.87249183654785, "global_step": 449124, "epoch": 5411} {"train_loss": -26.992422103881836, "global_step": 449125, "epoch": 5411} {"train_loss": -26.768064498901367, "global_step": 449126, "epoch": 5411} {"train_loss": -26.766372680664062, "global_step": 449127, "epoch": 5411} {"train_loss": -26.838886260986328, "global_step": 449128, "epoch": 5411} {"train_loss": -27.032888412475586, "global_step": 449129, "epoch": 5411} {"train_loss": -26.984466552734375, "global_step": 449130, "epoch": 5411} {"train_loss": -27.393543243408203, "global_step": 449131, "epoch": 5411} {"train_loss": -26.6500186920166, "global_step": 449132, "epoch": 5411} {"train_loss": -27.15411376953125, "global_step": 449133, "epoch": 5411} {"train_loss": -26.91237449645996, "global_step": 449134, "epoch": 5411} {"train_loss": -27.004230499267578, "global_step": 449135, "epoch": 5411} {"train_loss": -27.054706573486328, "global_step": 449136, "epoch": 5411} {"train_loss": -27.25396156311035, "global_step": 449137, "epoch": 5411} {"train_loss": -27.396503448486328, "global_step": 449138, "epoch": 5411} {"train_loss": -27.05779457092285, "global_step": 449139, "epoch": 5411} {"train_loss": -27.15818214416504, "global_step": 449140, "epoch": 5411} {"train_loss": -26.961347579956055, "global_step": 449141, "epoch": 5411} {"train_loss": -27.359699249267578, "global_step": 449142, "epoch": 5411} {"train_loss": -26.857467651367188, "global_step": 449143, "epoch": 5411} {"train_loss": -27.198617935180664, "global_step": 449144, "epoch": 5411} {"train_loss": -26.981082916259766, "global_step": 449145, "epoch": 5411} {"train_loss": -27.375497817993164, "global_step": 449146, "epoch": 5411} {"train_loss": -27.254201889038086, "global_step": 449147, "epoch": 5411} {"train_loss": -26.73428726196289, "global_step": 449148, "epoch": 5411} {"train_loss": -26.680419921875, "global_step": 449149, "epoch": 5411} {"train_loss": -27.1106014251709, "global_step": 449150, "epoch": 5411} {"train_loss": -27.106842041015625, "global_step": 449151, "epoch": 5411} {"train_loss": -27.270278930664062, "global_step": 449152, "epoch": 5411} {"train_loss": -26.94098472595215, "global_step": 449153, "epoch": 5411} {"train_loss": -27.234375, "global_step": 449154, "epoch": 5411} {"train_loss": -27.520307540893555, "global_step": 449155, "epoch": 5411} {"train_loss": -27.33070182800293, "global_step": 449156, "epoch": 5411} {"train_loss": -27.46661376953125, "global_step": 449157, "epoch": 5411} {"train_loss": -27.09412956237793, "global_step": 449158, "epoch": 5411} {"train_loss": -26.913787841796875, "global_step": 449159, "epoch": 5411} {"train_loss": -27.19010353088379, "global_step": 449160, "epoch": 5411} {"train_loss": -27.209091186523438, "global_step": 449161, "epoch": 5411} {"train_loss": -27.303003311157227, "global_step": 449162, "epoch": 5411} {"train_loss": -27.386951446533203, "global_step": 449163, "epoch": 5411} {"train_loss": -27.199987411499023, "global_step": 449164, "epoch": 5411} {"train_loss": -27.1489200592041, "global_step": 449165, "epoch": 5411} {"train_loss": -26.998493194580078, "global_step": 449166, "epoch": 5411} {"train_loss": -26.909055709838867, "global_step": 449167, "epoch": 5411} {"train_loss": -27.35735511779785, "global_step": 449168, "epoch": 5411} {"train_loss": -27.051977157592773, "global_step": 449169, "epoch": 5411} {"train_loss": -27.334875106811523, "global_step": 449170, "epoch": 5411} {"train_loss": -27.005369186401367, "global_step": 449171, "epoch": 5411} {"train_loss": -27.14942741394043, "global_step": 449172, "epoch": 5411} {"train_loss": -27.286855697631836, "global_step": 449173, "epoch": 5411} {"train_loss": -26.982746124267578, "global_step": 449174, "epoch": 5411} {"train_loss": -27.093358993530273, "global_step": 449175, "epoch": 5411} {"train_loss": -26.973779678344727, "global_step": 449176, "epoch": 5411} {"train_loss": -27.086240768432617, "global_step": 449177, "epoch": 5411} {"train_loss": -27.235273361206055, "global_step": 449178, "epoch": 5411} {"train_loss": -26.688810348510742, "global_step": 449179, "epoch": 5411} {"train_loss": -26.1886043548584, "global_step": 449180, "epoch": 5411} {"train_loss": -26.490095138549805, "global_step": 449181, "epoch": 5411} {"train_loss": -26.903223037719727, "global_step": 449182, "epoch": 5411} {"train_loss": -26.42887306213379, "global_step": 449183, "epoch": 5411} {"train_loss": -26.387479782104492, "global_step": 449184, "epoch": 5411} {"train_loss": -26.55489158630371, "global_step": 449185, "epoch": 5411} {"train_loss": -25.8994197845459, "global_step": 449186, "epoch": 5411} {"train_loss": -26.162256240844727, "global_step": 449187, "epoch": 5411} {"train_loss": -27.239072799682617, "global_step": 449188, "epoch": 5411} {"train_loss": -26.264190673828125, "global_step": 449189, "epoch": 5411} {"train_loss": -26.13614273071289, "global_step": 449190, "epoch": 5411} {"train_loss": -27.0817928314209, "global_step": 449191, "epoch": 5411} {"train_loss": -26.682464599609375, "global_step": 449192, "epoch": 5411} {"train_loss": -27.147424697875977, "global_step": 449193, "epoch": 5411} {"train_loss": -26.64263916015625, "global_step": 449194, "epoch": 5411} {"train_loss": -26.9628252925643, "global_step": 449195, "epoch": 5411, "val_loss": 6625956.0} {"train_loss": -25.356433868408203, "global_step": 449196, "epoch": 5412} {"train_loss": -26.029722213745117, "global_step": 449197, "epoch": 5412} {"train_loss": -25.748926162719727, "global_step": 449198, "epoch": 5412} {"train_loss": -25.903467178344727, "global_step": 449199, "epoch": 5412} {"train_loss": -25.96735191345215, "global_step": 449200, "epoch": 5412} {"train_loss": -26.277664184570312, "global_step": 449201, "epoch": 5412} {"train_loss": -26.155603408813477, "global_step": 449202, "epoch": 5412} {"train_loss": -25.63101577758789, "global_step": 449203, "epoch": 5412} {"train_loss": -26.569326400756836, "global_step": 449204, "epoch": 5412} {"train_loss": -25.997665405273438, "global_step": 449205, "epoch": 5412} {"train_loss": -25.999128341674805, "global_step": 449206, "epoch": 5412} {"train_loss": -26.187774658203125, "global_step": 449207, "epoch": 5412} {"train_loss": -26.223251342773438, "global_step": 449208, "epoch": 5412} {"train_loss": -26.278223037719727, "global_step": 449209, "epoch": 5412} {"train_loss": -26.301761627197266, "global_step": 449210, "epoch": 5412} {"train_loss": -26.186838150024414, "global_step": 449211, "epoch": 5412} {"train_loss": -26.360502243041992, "global_step": 449212, "epoch": 5412} {"train_loss": -26.764123916625977, "global_step": 449213, "epoch": 5412} {"train_loss": -26.89133644104004, "global_step": 449214, "epoch": 5412} {"train_loss": -26.42405128479004, "global_step": 449215, "epoch": 5412} {"train_loss": -26.509424209594727, "global_step": 449216, "epoch": 5412} {"train_loss": -26.7412109375, "global_step": 449217, "epoch": 5412} {"train_loss": -26.59712028503418, "global_step": 449218, "epoch": 5412} {"train_loss": -26.710790634155273, "global_step": 449219, "epoch": 5412} {"train_loss": -27.008609771728516, "global_step": 449220, "epoch": 5412} {"train_loss": -26.79658317565918, "global_step": 449221, "epoch": 5412} {"train_loss": -26.717092514038086, "global_step": 449222, "epoch": 5412} {"train_loss": -26.474069595336914, "global_step": 449223, "epoch": 5412} {"train_loss": -26.85580825805664, "global_step": 449224, "epoch": 5412} {"train_loss": -27.195789337158203, "global_step": 449225, "epoch": 5412} {"train_loss": -26.71645164489746, "global_step": 449226, "epoch": 5412} {"train_loss": -27.0062255859375, "global_step": 449227, "epoch": 5412} {"train_loss": -26.8892822265625, "global_step": 449228, "epoch": 5412} {"train_loss": -27.02264976501465, "global_step": 449229, "epoch": 5412} {"train_loss": -27.21240234375, "global_step": 449230, "epoch": 5412} {"train_loss": -26.822830200195312, "global_step": 449231, "epoch": 5412} {"train_loss": -27.01262855529785, "global_step": 449232, "epoch": 5412} {"train_loss": -26.969141006469727, "global_step": 449233, "epoch": 5412} {"train_loss": -26.972492218017578, "global_step": 449234, "epoch": 5412} {"train_loss": -26.5178279876709, "global_step": 449235, "epoch": 5412} {"train_loss": -27.01547622680664, "global_step": 449236, "epoch": 5412} {"train_loss": -26.9150390625, "global_step": 449237, "epoch": 5412} {"train_loss": -26.788410186767578, "global_step": 449238, "epoch": 5412} {"train_loss": -27.480016708374023, "global_step": 449239, "epoch": 5412} {"train_loss": -26.837682723999023, "global_step": 449240, "epoch": 5412} {"train_loss": -27.109394073486328, "global_step": 449241, "epoch": 5412} {"train_loss": -26.65773582458496, "global_step": 449242, "epoch": 5412} {"train_loss": -26.920902252197266, "global_step": 449243, "epoch": 5412} {"train_loss": -26.676013946533203, "global_step": 449244, "epoch": 5412} {"train_loss": -27.145069122314453, "global_step": 449245, "epoch": 5412} {"train_loss": -27.06190299987793, "global_step": 449246, "epoch": 5412} {"train_loss": -27.002111434936523, "global_step": 449247, "epoch": 5412} {"train_loss": -26.953588485717773, "global_step": 449248, "epoch": 5412} {"train_loss": -27.469282150268555, "global_step": 449249, "epoch": 5412} {"train_loss": -27.01078224182129, "global_step": 449250, "epoch": 5412} {"train_loss": -26.863393783569336, "global_step": 449251, "epoch": 5412} {"train_loss": -26.955554962158203, "global_step": 449252, "epoch": 5412} {"train_loss": -27.462055206298828, "global_step": 449253, "epoch": 5412} {"train_loss": -26.9984130859375, "global_step": 449254, "epoch": 5412} {"train_loss": -27.25927734375, "global_step": 449255, "epoch": 5412} {"train_loss": -27.241443634033203, "global_step": 449256, "epoch": 5412} {"train_loss": -27.254785537719727, "global_step": 449257, "epoch": 5412} {"train_loss": -27.05344581604004, "global_step": 449258, "epoch": 5412} {"train_loss": -27.185012817382812, "global_step": 449259, "epoch": 5412} {"train_loss": -27.17299461364746, "global_step": 449260, "epoch": 5412} {"train_loss": -27.057392120361328, "global_step": 449261, "epoch": 5412} {"train_loss": -26.82212257385254, "global_step": 449262, "epoch": 5412} {"train_loss": -26.52520751953125, "global_step": 449263, "epoch": 5412} {"train_loss": -26.8214054107666, "global_step": 449264, "epoch": 5412} {"train_loss": -27.104780197143555, "global_step": 449265, "epoch": 5412} {"train_loss": -26.545257568359375, "global_step": 449266, "epoch": 5412} {"train_loss": -26.886316299438477, "global_step": 449267, "epoch": 5412} {"train_loss": -27.083723068237305, "global_step": 449268, "epoch": 5412} {"train_loss": -26.67337989807129, "global_step": 449269, "epoch": 5412} {"train_loss": -26.677478790283203, "global_step": 449270, "epoch": 5412} {"train_loss": -26.89814567565918, "global_step": 449271, "epoch": 5412} {"train_loss": -26.95969009399414, "global_step": 449272, "epoch": 5412} {"train_loss": -26.942052841186523, "global_step": 449273, "epoch": 5412} {"train_loss": -26.823652267456055, "global_step": 449274, "epoch": 5412} {"train_loss": -27.200902938842773, "global_step": 449275, "epoch": 5412} {"train_loss": -27.174413681030273, "global_step": 449276, "epoch": 5412} {"train_loss": -26.704580307006836, "global_step": 449277, "epoch": 5412} {"train_loss": -26.75308133320636, "global_step": 449278, "epoch": 5412, "val_loss": 6570811.0} {"train_loss": -26.602949142456055, "global_step": 449279, "epoch": 5413} {"train_loss": -26.71976661682129, "global_step": 449280, "epoch": 5413} {"train_loss": -26.763275146484375, "global_step": 449281, "epoch": 5413} {"train_loss": -27.015674591064453, "global_step": 449282, "epoch": 5413} {"train_loss": -26.796222686767578, "global_step": 449283, "epoch": 5413} {"train_loss": -26.77400779724121, "global_step": 449284, "epoch": 5413} {"train_loss": -26.54352378845215, "global_step": 449285, "epoch": 5413} {"train_loss": -26.56165885925293, "global_step": 449286, "epoch": 5413} {"train_loss": -26.649328231811523, "global_step": 449287, "epoch": 5413} {"train_loss": -26.95269203186035, "global_step": 449288, "epoch": 5413} {"train_loss": -26.58168601989746, "global_step": 449289, "epoch": 5413} {"train_loss": -26.613306045532227, "global_step": 449290, "epoch": 5413} {"train_loss": -26.874921798706055, "global_step": 449291, "epoch": 5413} {"train_loss": -27.099761962890625, "global_step": 449292, "epoch": 5413} {"train_loss": -26.61370277404785, "global_step": 449293, "epoch": 5413} {"train_loss": -27.113447189331055, "global_step": 449294, "epoch": 5413} {"train_loss": -27.044479370117188, "global_step": 449295, "epoch": 5413} {"train_loss": -27.26303482055664, "global_step": 449296, "epoch": 5413} {"train_loss": -27.04005241394043, "global_step": 449297, "epoch": 5413} {"train_loss": -27.115148544311523, "global_step": 449298, "epoch": 5413} {"train_loss": -26.876264572143555, "global_step": 449299, "epoch": 5413} {"train_loss": -26.929367065429688, "global_step": 449300, "epoch": 5413} {"train_loss": -26.936105728149414, "global_step": 449301, "epoch": 5413} {"train_loss": -27.147552490234375, "global_step": 449302, "epoch": 5413} {"train_loss": -27.211944580078125, "global_step": 449303, "epoch": 5413} {"train_loss": -26.722076416015625, "global_step": 449304, "epoch": 5413} {"train_loss": -27.32215690612793, "global_step": 449305, "epoch": 5413} {"train_loss": -27.274658203125, "global_step": 449306, "epoch": 5413} {"train_loss": -27.1778507232666, "global_step": 449307, "epoch": 5413} {"train_loss": -27.346363067626953, "global_step": 449308, "epoch": 5413} {"train_loss": -27.1439151763916, "global_step": 449309, "epoch": 5413} {"train_loss": -27.679061889648438, "global_step": 449310, "epoch": 5413} {"train_loss": -27.12054443359375, "global_step": 449311, "epoch": 5413} {"train_loss": -27.327728271484375, "global_step": 449312, "epoch": 5413} {"train_loss": -27.31764030456543, "global_step": 449313, "epoch": 5413} {"train_loss": -27.16037368774414, "global_step": 449314, "epoch": 5413} {"train_loss": -27.145429611206055, "global_step": 449315, "epoch": 5413} {"train_loss": -27.318862915039062, "global_step": 449316, "epoch": 5413} {"train_loss": -27.095441818237305, "global_step": 449317, "epoch": 5413} {"train_loss": -27.186643600463867, "global_step": 449318, "epoch": 5413} {"train_loss": -26.881513595581055, "global_step": 449319, "epoch": 5413} {"train_loss": -27.282079696655273, "global_step": 449320, "epoch": 5413} {"train_loss": -27.55364418029785, "global_step": 449321, "epoch": 5413} {"train_loss": -27.152942657470703, "global_step": 449322, "epoch": 5413} {"train_loss": -27.3539981842041, "global_step": 449323, "epoch": 5413} {"train_loss": -26.86102294921875, "global_step": 449324, "epoch": 5413} {"train_loss": -27.14386558532715, "global_step": 449325, "epoch": 5413} {"train_loss": -26.656103134155273, "global_step": 449326, "epoch": 5413} {"train_loss": -26.717493057250977, "global_step": 449327, "epoch": 5413} {"train_loss": -26.977319717407227, "global_step": 449328, "epoch": 5413} {"train_loss": -27.135770797729492, "global_step": 449329, "epoch": 5413} {"train_loss": -27.04400634765625, "global_step": 449330, "epoch": 5413} {"train_loss": -26.829315185546875, "global_step": 449331, "epoch": 5413} {"train_loss": -26.6425724029541, "global_step": 449332, "epoch": 5413} {"train_loss": -26.470666885375977, "global_step": 449333, "epoch": 5413} {"train_loss": -26.851049423217773, "global_step": 449334, "epoch": 5413} {"train_loss": -27.166418075561523, "global_step": 449335, "epoch": 5413} {"train_loss": -27.181884765625, "global_step": 449336, "epoch": 5413} {"train_loss": -26.713041305541992, "global_step": 449337, "epoch": 5413} {"train_loss": -26.79300308227539, "global_step": 449338, "epoch": 5413} {"train_loss": -27.010828018188477, "global_step": 449339, "epoch": 5413} {"train_loss": -26.975919723510742, "global_step": 449340, "epoch": 5413} {"train_loss": -27.233657836914062, "global_step": 449341, "epoch": 5413} {"train_loss": -27.212133407592773, "global_step": 449342, "epoch": 5413} {"train_loss": -26.558069229125977, "global_step": 449343, "epoch": 5413} {"train_loss": -27.107929229736328, "global_step": 449344, "epoch": 5413} {"train_loss": -26.794172286987305, "global_step": 449345, "epoch": 5413} {"train_loss": -27.139495849609375, "global_step": 449346, "epoch": 5413} {"train_loss": -26.862497329711914, "global_step": 449347, "epoch": 5413} {"train_loss": -27.282262802124023, "global_step": 449348, "epoch": 5413} {"train_loss": -27.327810287475586, "global_step": 449349, "epoch": 5413} {"train_loss": -27.451068878173828, "global_step": 449350, "epoch": 5413} {"train_loss": -26.83747673034668, "global_step": 449351, "epoch": 5413} {"train_loss": -27.16755485534668, "global_step": 449352, "epoch": 5413} {"train_loss": -27.463388442993164, "global_step": 449353, "epoch": 5413} {"train_loss": -27.268335342407227, "global_step": 449354, "epoch": 5413} {"train_loss": -27.29486656188965, "global_step": 449355, "epoch": 5413} {"train_loss": -27.704145431518555, "global_step": 449356, "epoch": 5413} {"train_loss": -26.81991958618164, "global_step": 449357, "epoch": 5413} {"train_loss": -27.031829833984375, "global_step": 449358, "epoch": 5413} {"train_loss": -27.207843780517578, "global_step": 449359, "epoch": 5413} {"train_loss": -27.194965362548828, "global_step": 449360, "epoch": 5413} {"train_loss": -27.032295594732446, "global_step": 449361, "epoch": 5413, "val_loss": 6601180.0} {"train_loss": -27.214475631713867, "global_step": 449362, "epoch": 5414} {"train_loss": -26.894697189331055, "global_step": 449363, "epoch": 5414} {"train_loss": -26.674015045166016, "global_step": 449364, "epoch": 5414} {"train_loss": -26.517444610595703, "global_step": 449365, "epoch": 5414} {"train_loss": -26.541479110717773, "global_step": 449366, "epoch": 5414} {"train_loss": -26.6297664642334, "global_step": 449367, "epoch": 5414} {"train_loss": -26.854089736938477, "global_step": 449368, "epoch": 5414} {"train_loss": -26.563764572143555, "global_step": 449369, "epoch": 5414} {"train_loss": -26.88043785095215, "global_step": 449370, "epoch": 5414} {"train_loss": -26.624929428100586, "global_step": 449371, "epoch": 5414} {"train_loss": -26.72528648376465, "global_step": 449372, "epoch": 5414} {"train_loss": -26.712329864501953, "global_step": 449373, "epoch": 5414} {"train_loss": -26.93875503540039, "global_step": 449374, "epoch": 5414} {"train_loss": -26.737289428710938, "global_step": 449375, "epoch": 5414} {"train_loss": -26.905303955078125, "global_step": 449376, "epoch": 5414} {"train_loss": -26.57000160217285, "global_step": 449377, "epoch": 5414} {"train_loss": -26.941617965698242, "global_step": 449378, "epoch": 5414} {"train_loss": -27.02095603942871, "global_step": 449379, "epoch": 5414} {"train_loss": -26.64105796813965, "global_step": 449380, "epoch": 5414} {"train_loss": -26.733057022094727, "global_step": 449381, "epoch": 5414} {"train_loss": -26.859073638916016, "global_step": 449382, "epoch": 5414} {"train_loss": -27.297199249267578, "global_step": 449383, "epoch": 5414} {"train_loss": -26.92707633972168, "global_step": 449384, "epoch": 5414} {"train_loss": -27.203832626342773, "global_step": 449385, "epoch": 5414} {"train_loss": -27.162281036376953, "global_step": 449386, "epoch": 5414} {"train_loss": -26.9129638671875, "global_step": 449387, "epoch": 5414} {"train_loss": -26.974105834960938, "global_step": 449388, "epoch": 5414} {"train_loss": -26.604949951171875, "global_step": 449389, "epoch": 5414} {"train_loss": -26.953580856323242, "global_step": 449390, "epoch": 5414} {"train_loss": -26.795618057250977, "global_step": 449391, "epoch": 5414} {"train_loss": -26.833972930908203, "global_step": 449392, "epoch": 5414} {"train_loss": -26.843114852905273, "global_step": 449393, "epoch": 5414} {"train_loss": -27.027057647705078, "global_step": 449394, "epoch": 5414} {"train_loss": -26.816797256469727, "global_step": 449395, "epoch": 5414} {"train_loss": -26.99251365661621, "global_step": 449396, "epoch": 5414} {"train_loss": -26.94191551208496, "global_step": 449397, "epoch": 5414} {"train_loss": -27.160810470581055, "global_step": 449398, "epoch": 5414} {"train_loss": -26.91169548034668, "global_step": 449399, "epoch": 5414} {"train_loss": -27.211267471313477, "global_step": 449400, "epoch": 5414} {"train_loss": -27.32395362854004, "global_step": 449401, "epoch": 5414} {"train_loss": -26.940662384033203, "global_step": 449402, "epoch": 5414} {"train_loss": -27.371173858642578, "global_step": 449403, "epoch": 5414} {"train_loss": -27.009292602539062, "global_step": 449404, "epoch": 5414} {"train_loss": -27.103656768798828, "global_step": 449405, "epoch": 5414} {"train_loss": -27.229598999023438, "global_step": 449406, "epoch": 5414} {"train_loss": -27.117263793945312, "global_step": 449407, "epoch": 5414} {"train_loss": -27.01698112487793, "global_step": 449408, "epoch": 5414} {"train_loss": -27.219099044799805, "global_step": 449409, "epoch": 5414} {"train_loss": -27.075284957885742, "global_step": 449410, "epoch": 5414} {"train_loss": -27.067529678344727, "global_step": 449411, "epoch": 5414} {"train_loss": -27.022741317749023, "global_step": 449412, "epoch": 5414} {"train_loss": -26.962263107299805, "global_step": 449413, "epoch": 5414} {"train_loss": -26.85053825378418, "global_step": 449414, "epoch": 5414} {"train_loss": -27.4871883392334, "global_step": 449415, "epoch": 5414} {"train_loss": -26.802448272705078, "global_step": 449416, "epoch": 5414} {"train_loss": -26.929306030273438, "global_step": 449417, "epoch": 5414} {"train_loss": -26.97806167602539, "global_step": 449418, "epoch": 5414} {"train_loss": -27.105260848999023, "global_step": 449419, "epoch": 5414} {"train_loss": -27.08258056640625, "global_step": 449420, "epoch": 5414} {"train_loss": -26.625823974609375, "global_step": 449421, "epoch": 5414} {"train_loss": -27.237659454345703, "global_step": 449422, "epoch": 5414} {"train_loss": -27.840194702148438, "global_step": 449423, "epoch": 5414} {"train_loss": -27.51704216003418, "global_step": 449424, "epoch": 5414} {"train_loss": -26.5654239654541, "global_step": 449425, "epoch": 5414} {"train_loss": -26.59683609008789, "global_step": 449426, "epoch": 5414} {"train_loss": -26.90707778930664, "global_step": 449427, "epoch": 5414} {"train_loss": -26.95734214782715, "global_step": 449428, "epoch": 5414} {"train_loss": -26.985599517822266, "global_step": 449429, "epoch": 5414} {"train_loss": -27.056955337524414, "global_step": 449430, "epoch": 5414} {"train_loss": -27.019973754882812, "global_step": 449431, "epoch": 5414} {"train_loss": -27.434528350830078, "global_step": 449432, "epoch": 5414} {"train_loss": -26.955230712890625, "global_step": 449433, "epoch": 5414} {"train_loss": -26.978605270385742, "global_step": 449434, "epoch": 5414} {"train_loss": -27.04192543029785, "global_step": 449435, "epoch": 5414} {"train_loss": -26.714599609375, "global_step": 449436, "epoch": 5414} {"train_loss": -27.213794708251953, "global_step": 449437, "epoch": 5414} {"train_loss": -27.335859298706055, "global_step": 449438, "epoch": 5414} {"train_loss": -27.32960319519043, "global_step": 449439, "epoch": 5414} {"train_loss": -27.342193603515625, "global_step": 449440, "epoch": 5414} {"train_loss": -26.953699111938477, "global_step": 449441, "epoch": 5414} {"train_loss": -27.419885635375977, "global_step": 449442, "epoch": 5414} {"train_loss": -27.144927978515625, "global_step": 449443, "epoch": 5414} {"train_loss": -26.989920397838915, "global_step": 449444, "epoch": 5414, "val_loss": 6561721.5} {"train_loss": -26.426218032836914, "global_step": 449445, "epoch": 5415} {"train_loss": -26.576740264892578, "global_step": 449446, "epoch": 5415} {"train_loss": -26.13319206237793, "global_step": 449447, "epoch": 5415} {"train_loss": -26.03409767150879, "global_step": 449448, "epoch": 5415} {"train_loss": -25.92325210571289, "global_step": 449449, "epoch": 5415} {"train_loss": -26.713308334350586, "global_step": 449450, "epoch": 5415} {"train_loss": -27.118091583251953, "global_step": 449451, "epoch": 5415} {"train_loss": -26.3978271484375, "global_step": 449452, "epoch": 5415} {"train_loss": -26.404998779296875, "global_step": 449453, "epoch": 5415} {"train_loss": -27.051023483276367, "global_step": 449454, "epoch": 5415} {"train_loss": -26.206998825073242, "global_step": 449455, "epoch": 5415} {"train_loss": -26.39371681213379, "global_step": 449456, "epoch": 5415} {"train_loss": -26.626981735229492, "global_step": 449457, "epoch": 5415} {"train_loss": -26.761030197143555, "global_step": 449458, "epoch": 5415} {"train_loss": -26.842954635620117, "global_step": 449459, "epoch": 5415} {"train_loss": -26.101322174072266, "global_step": 449460, "epoch": 5415} {"train_loss": -26.475610733032227, "global_step": 449461, "epoch": 5415} {"train_loss": -26.630258560180664, "global_step": 449462, "epoch": 5415} {"train_loss": -26.562591552734375, "global_step": 449463, "epoch": 5415} {"train_loss": -26.937641143798828, "global_step": 449464, "epoch": 5415} {"train_loss": -26.649961471557617, "global_step": 449465, "epoch": 5415} {"train_loss": -27.25737953186035, "global_step": 449466, "epoch": 5415} {"train_loss": -26.526031494140625, "global_step": 449467, "epoch": 5415} {"train_loss": -26.556806564331055, "global_step": 449468, "epoch": 5415} {"train_loss": -26.651111602783203, "global_step": 449469, "epoch": 5415} {"train_loss": -26.810596466064453, "global_step": 449470, "epoch": 5415} {"train_loss": -26.545425415039062, "global_step": 449471, "epoch": 5415} {"train_loss": -26.8554744720459, "global_step": 449472, "epoch": 5415} {"train_loss": -26.914005279541016, "global_step": 449473, "epoch": 5415} {"train_loss": -27.049345016479492, "global_step": 449474, "epoch": 5415} {"train_loss": -26.96487808227539, "global_step": 449475, "epoch": 5415} {"train_loss": -26.728696823120117, "global_step": 449476, "epoch": 5415} {"train_loss": -26.89411735534668, "global_step": 449477, "epoch": 5415} {"train_loss": -27.230566024780273, "global_step": 449478, "epoch": 5415} {"train_loss": -27.240604400634766, "global_step": 449479, "epoch": 5415} {"train_loss": -27.010406494140625, "global_step": 449480, "epoch": 5415} {"train_loss": -26.629764556884766, "global_step": 449481, "epoch": 5415} {"train_loss": -26.730314254760742, "global_step": 449482, "epoch": 5415} {"train_loss": -26.9808406829834, "global_step": 449483, "epoch": 5415} {"train_loss": -27.31532096862793, "global_step": 449484, "epoch": 5415} {"train_loss": -27.606740951538086, "global_step": 449485, "epoch": 5415} {"train_loss": -27.236053466796875, "global_step": 449486, "epoch": 5415} {"train_loss": -27.40913200378418, "global_step": 449487, "epoch": 5415} {"train_loss": -27.235492706298828, "global_step": 449488, "epoch": 5415} {"train_loss": -27.263214111328125, "global_step": 449489, "epoch": 5415} {"train_loss": -27.124164581298828, "global_step": 449490, "epoch": 5415} {"train_loss": -27.262643814086914, "global_step": 449491, "epoch": 5415} {"train_loss": -26.940521240234375, "global_step": 449492, "epoch": 5415} {"train_loss": -27.530689239501953, "global_step": 449493, "epoch": 5415} {"train_loss": -27.20784568786621, "global_step": 449494, "epoch": 5415} {"train_loss": -27.26421546936035, "global_step": 449495, "epoch": 5415} {"train_loss": -27.312530517578125, "global_step": 449496, "epoch": 5415} {"train_loss": -27.045984268188477, "global_step": 449497, "epoch": 5415} {"train_loss": -26.99908447265625, "global_step": 449498, "epoch": 5415} {"train_loss": -26.92366600036621, "global_step": 449499, "epoch": 5415} {"train_loss": -27.114383697509766, "global_step": 449500, "epoch": 5415} {"train_loss": -27.037931442260742, "global_step": 449501, "epoch": 5415} {"train_loss": -27.0679931640625, "global_step": 449502, "epoch": 5415} {"train_loss": -27.26983070373535, "global_step": 449503, "epoch": 5415} {"train_loss": -27.432758331298828, "global_step": 449504, "epoch": 5415} {"train_loss": -27.187408447265625, "global_step": 449505, "epoch": 5415} {"train_loss": -27.223316192626953, "global_step": 449506, "epoch": 5415} {"train_loss": -27.221715927124023, "global_step": 449507, "epoch": 5415} {"train_loss": -27.255849838256836, "global_step": 449508, "epoch": 5415} {"train_loss": -27.253284454345703, "global_step": 449509, "epoch": 5415} {"train_loss": -27.504724502563477, "global_step": 449510, "epoch": 5415} {"train_loss": -27.138355255126953, "global_step": 449511, "epoch": 5415} {"train_loss": -27.284597396850586, "global_step": 449512, "epoch": 5415} {"train_loss": -27.055212020874023, "global_step": 449513, "epoch": 5415} {"train_loss": -26.894758224487305, "global_step": 449514, "epoch": 5415} {"train_loss": -26.2231388092041, "global_step": 449515, "epoch": 5415} {"train_loss": -25.422649383544922, "global_step": 449516, "epoch": 5415} {"train_loss": -25.471752166748047, "global_step": 449517, "epoch": 5415} {"train_loss": -26.829771041870117, "global_step": 449518, "epoch": 5415} {"train_loss": -26.849069595336914, "global_step": 449519, "epoch": 5415} {"train_loss": -26.614118576049805, "global_step": 449520, "epoch": 5415} {"train_loss": -27.009521484375, "global_step": 449521, "epoch": 5415} {"train_loss": -26.797590255737305, "global_step": 449522, "epoch": 5415} {"train_loss": -26.804418563842773, "global_step": 449523, "epoch": 5415} {"train_loss": -26.727462768554688, "global_step": 449524, "epoch": 5415} {"train_loss": -26.662322998046875, "global_step": 449525, "epoch": 5415} {"train_loss": -26.795429229736328, "global_step": 449526, "epoch": 5415} {"train_loss": -26.845572552049017, "global_step": 449527, "epoch": 5415, "val_loss": 6484950.0} {"train_loss": -26.334278106689453, "global_step": 449528, "epoch": 5416} {"train_loss": -25.482646942138672, "global_step": 449529, "epoch": 5416} {"train_loss": -25.672637939453125, "global_step": 449530, "epoch": 5416} {"train_loss": -25.91204261779785, "global_step": 449531, "epoch": 5416} {"train_loss": -26.51922607421875, "global_step": 449532, "epoch": 5416} {"train_loss": -25.63477897644043, "global_step": 449533, "epoch": 5416} {"train_loss": -26.102548599243164, "global_step": 449534, "epoch": 5416} {"train_loss": -26.01252555847168, "global_step": 449535, "epoch": 5416} {"train_loss": -26.25421142578125, "global_step": 449536, "epoch": 5416} {"train_loss": -26.457321166992188, "global_step": 449537, "epoch": 5416} {"train_loss": -26.47763442993164, "global_step": 449538, "epoch": 5416} {"train_loss": -26.628366470336914, "global_step": 449539, "epoch": 5416} {"train_loss": -26.34320068359375, "global_step": 449540, "epoch": 5416} {"train_loss": -26.31390953063965, "global_step": 449541, "epoch": 5416} {"train_loss": -26.647872924804688, "global_step": 449542, "epoch": 5416} {"train_loss": -26.583154678344727, "global_step": 449543, "epoch": 5416} {"train_loss": -26.1436767578125, "global_step": 449544, "epoch": 5416} {"train_loss": -26.194501876831055, "global_step": 449545, "epoch": 5416} {"train_loss": -26.12210464477539, "global_step": 449546, "epoch": 5416} {"train_loss": -26.77716636657715, "global_step": 449547, "epoch": 5416} {"train_loss": -26.411468505859375, "global_step": 449548, "epoch": 5416} {"train_loss": -26.64906120300293, "global_step": 449549, "epoch": 5416} {"train_loss": -26.551727294921875, "global_step": 449550, "epoch": 5416} {"train_loss": -26.596546173095703, "global_step": 449551, "epoch": 5416} {"train_loss": -27.017730712890625, "global_step": 449552, "epoch": 5416} {"train_loss": -27.025115966796875, "global_step": 449553, "epoch": 5416} {"train_loss": -26.694650650024414, "global_step": 449554, "epoch": 5416} {"train_loss": -26.835590362548828, "global_step": 449555, "epoch": 5416} {"train_loss": -27.19879722595215, "global_step": 449556, "epoch": 5416} {"train_loss": -27.118986129760742, "global_step": 449557, "epoch": 5416} {"train_loss": -27.191205978393555, "global_step": 449558, "epoch": 5416} {"train_loss": -26.861404418945312, "global_step": 449559, "epoch": 5416} {"train_loss": -26.894620895385742, "global_step": 449560, "epoch": 5416} {"train_loss": -26.932392120361328, "global_step": 449561, "epoch": 5416} {"train_loss": -27.01922035217285, "global_step": 449562, "epoch": 5416} {"train_loss": -27.532764434814453, "global_step": 449563, "epoch": 5416} {"train_loss": -26.955123901367188, "global_step": 449564, "epoch": 5416} {"train_loss": -27.011377334594727, "global_step": 449565, "epoch": 5416} {"train_loss": -26.987689971923828, "global_step": 449566, "epoch": 5416} {"train_loss": -27.129480361938477, "global_step": 449567, "epoch": 5416} {"train_loss": -27.38604736328125, "global_step": 449568, "epoch": 5416} {"train_loss": -27.2065486907959, "global_step": 449569, "epoch": 5416} {"train_loss": -26.933820724487305, "global_step": 449570, "epoch": 5416} {"train_loss": -27.187454223632812, "global_step": 449571, "epoch": 5416} {"train_loss": -26.87721061706543, "global_step": 449572, "epoch": 5416} {"train_loss": -27.282201766967773, "global_step": 449573, "epoch": 5416} {"train_loss": -27.270246505737305, "global_step": 449574, "epoch": 5416} {"train_loss": -27.1846866607666, "global_step": 449575, "epoch": 5416} {"train_loss": -27.13686180114746, "global_step": 449576, "epoch": 5416} {"train_loss": -27.459125518798828, "global_step": 449577, "epoch": 5416} {"train_loss": -27.29718589782715, "global_step": 449578, "epoch": 5416} {"train_loss": -27.267730712890625, "global_step": 449579, "epoch": 5416} {"train_loss": -27.443206787109375, "global_step": 449580, "epoch": 5416} {"train_loss": -27.140979766845703, "global_step": 449581, "epoch": 5416} {"train_loss": -27.1834716796875, "global_step": 449582, "epoch": 5416} {"train_loss": -27.137723922729492, "global_step": 449583, "epoch": 5416} {"train_loss": -27.32636833190918, "global_step": 449584, "epoch": 5416} {"train_loss": -26.574188232421875, "global_step": 449585, "epoch": 5416} {"train_loss": -26.877222061157227, "global_step": 449586, "epoch": 5416} {"train_loss": -26.7077579498291, "global_step": 449587, "epoch": 5416} {"train_loss": -27.20747184753418, "global_step": 449588, "epoch": 5416} {"train_loss": -27.325469970703125, "global_step": 449589, "epoch": 5416} {"train_loss": -26.945526123046875, "global_step": 449590, "epoch": 5416} {"train_loss": -26.81589698791504, "global_step": 449591, "epoch": 5416} {"train_loss": -27.107458114624023, "global_step": 449592, "epoch": 5416} {"train_loss": -26.980239868164062, "global_step": 449593, "epoch": 5416} {"train_loss": -26.55897331237793, "global_step": 449594, "epoch": 5416} {"train_loss": -26.775482177734375, "global_step": 449595, "epoch": 5416} {"train_loss": -26.742773056030273, "global_step": 449596, "epoch": 5416} {"train_loss": -26.8624210357666, "global_step": 449597, "epoch": 5416} {"train_loss": -26.69154930114746, "global_step": 449598, "epoch": 5416} {"train_loss": -27.04475212097168, "global_step": 449599, "epoch": 5416} {"train_loss": -26.823810577392578, "global_step": 449600, "epoch": 5416} {"train_loss": -27.04022216796875, "global_step": 449601, "epoch": 5416} {"train_loss": -26.982013702392578, "global_step": 449602, "epoch": 5416} {"train_loss": -27.16781997680664, "global_step": 449603, "epoch": 5416} {"train_loss": -27.1427059173584, "global_step": 449604, "epoch": 5416} {"train_loss": -26.707242965698242, "global_step": 449605, "epoch": 5416} {"train_loss": -26.5112361907959, "global_step": 449606, "epoch": 5416} {"train_loss": -26.698230743408203, "global_step": 449607, "epoch": 5416} {"train_loss": -26.8709716796875, "global_step": 449608, "epoch": 5416} {"train_loss": -26.736921310424805, "global_step": 449609, "epoch": 5416} {"train_loss": -26.803661668157, "global_step": 449610, "epoch": 5416, "val_loss": 6432841.5} {"train_loss": -26.82240104675293, "global_step": 449611, "epoch": 5417} {"train_loss": -27.072729110717773, "global_step": 449612, "epoch": 5417} {"train_loss": -26.844512939453125, "global_step": 449613, "epoch": 5417} {"train_loss": -26.283838272094727, "global_step": 449614, "epoch": 5417} {"train_loss": -26.78847312927246, "global_step": 449615, "epoch": 5417} {"train_loss": -27.071264266967773, "global_step": 449616, "epoch": 5417} {"train_loss": -27.174509048461914, "global_step": 449617, "epoch": 5417} {"train_loss": -26.87548828125, "global_step": 449618, "epoch": 5417} {"train_loss": -26.96824073791504, "global_step": 449619, "epoch": 5417} {"train_loss": -26.502838134765625, "global_step": 449620, "epoch": 5417} {"train_loss": -26.7661190032959, "global_step": 449621, "epoch": 5417} {"train_loss": -26.542007446289062, "global_step": 449622, "epoch": 5417} {"train_loss": -27.125104904174805, "global_step": 449623, "epoch": 5417} {"train_loss": -27.084537506103516, "global_step": 449624, "epoch": 5417} {"train_loss": -26.96900749206543, "global_step": 449625, "epoch": 5417} {"train_loss": -26.926687240600586, "global_step": 449626, "epoch": 5417} {"train_loss": -27.06390380859375, "global_step": 449627, "epoch": 5417} {"train_loss": -27.1077880859375, "global_step": 449628, "epoch": 5417} {"train_loss": -26.925989151000977, "global_step": 449629, "epoch": 5417} {"train_loss": -27.096601486206055, "global_step": 449630, "epoch": 5417} {"train_loss": -26.77130126953125, "global_step": 449631, "epoch": 5417} {"train_loss": -26.767765045166016, "global_step": 449632, "epoch": 5417} {"train_loss": -26.85365104675293, "global_step": 449633, "epoch": 5417} {"train_loss": -26.866077423095703, "global_step": 449634, "epoch": 5417} {"train_loss": -27.171594619750977, "global_step": 449635, "epoch": 5417} {"train_loss": -27.004919052124023, "global_step": 449636, "epoch": 5417} {"train_loss": -26.873865127563477, "global_step": 449637, "epoch": 5417} {"train_loss": -26.899274826049805, "global_step": 449638, "epoch": 5417} {"train_loss": -26.70758056640625, "global_step": 449639, "epoch": 5417} {"train_loss": -26.864404678344727, "global_step": 449640, "epoch": 5417} {"train_loss": -27.128864288330078, "global_step": 449641, "epoch": 5417} {"train_loss": -27.15742301940918, "global_step": 449642, "epoch": 5417} {"train_loss": -26.933637619018555, "global_step": 449643, "epoch": 5417} {"train_loss": -27.238306045532227, "global_step": 449644, "epoch": 5417} {"train_loss": -27.07832908630371, "global_step": 449645, "epoch": 5417} {"train_loss": -27.000980377197266, "global_step": 449646, "epoch": 5417} {"train_loss": -26.857473373413086, "global_step": 449647, "epoch": 5417} {"train_loss": -26.80179214477539, "global_step": 449648, "epoch": 5417} {"train_loss": -27.067564010620117, "global_step": 449649, "epoch": 5417} {"train_loss": -26.8646240234375, "global_step": 449650, "epoch": 5417} {"train_loss": -27.22381591796875, "global_step": 449651, "epoch": 5417} {"train_loss": -26.833585739135742, "global_step": 449652, "epoch": 5417} {"train_loss": -26.753253936767578, "global_step": 449653, "epoch": 5417} {"train_loss": -26.505285263061523, "global_step": 449654, "epoch": 5417} {"train_loss": -26.83749771118164, "global_step": 449655, "epoch": 5417} {"train_loss": -26.843765258789062, "global_step": 449656, "epoch": 5417} {"train_loss": -26.666767120361328, "global_step": 449657, "epoch": 5417} {"train_loss": -27.186004638671875, "global_step": 449658, "epoch": 5417} {"train_loss": -27.282873153686523, "global_step": 449659, "epoch": 5417} {"train_loss": -27.184701919555664, "global_step": 449660, "epoch": 5417} {"train_loss": -27.49234962463379, "global_step": 449661, "epoch": 5417} {"train_loss": -26.88751792907715, "global_step": 449662, "epoch": 5417} {"train_loss": -26.85248374938965, "global_step": 449663, "epoch": 5417} {"train_loss": -27.114383697509766, "global_step": 449664, "epoch": 5417} {"train_loss": -27.082019805908203, "global_step": 449665, "epoch": 5417} {"train_loss": -26.793664932250977, "global_step": 449666, "epoch": 5417} {"train_loss": -27.059186935424805, "global_step": 449667, "epoch": 5417} {"train_loss": -27.280561447143555, "global_step": 449668, "epoch": 5417} {"train_loss": -26.99698829650879, "global_step": 449669, "epoch": 5417} {"train_loss": -27.18511962890625, "global_step": 449670, "epoch": 5417} {"train_loss": -27.026050567626953, "global_step": 449671, "epoch": 5417} {"train_loss": -27.18963623046875, "global_step": 449672, "epoch": 5417} {"train_loss": -27.030622482299805, "global_step": 449673, "epoch": 5417} {"train_loss": -27.073843002319336, "global_step": 449674, "epoch": 5417} {"train_loss": -27.186904907226562, "global_step": 449675, "epoch": 5417} {"train_loss": -26.9920711517334, "global_step": 449676, "epoch": 5417} {"train_loss": -26.624448776245117, "global_step": 449677, "epoch": 5417} {"train_loss": -27.109582901000977, "global_step": 449678, "epoch": 5417} {"train_loss": -27.28506851196289, "global_step": 449679, "epoch": 5417} {"train_loss": -26.52445411682129, "global_step": 449680, "epoch": 5417} {"train_loss": -26.757165908813477, "global_step": 449681, "epoch": 5417} {"train_loss": -26.715469360351562, "global_step": 449682, "epoch": 5417} {"train_loss": -27.218610763549805, "global_step": 449683, "epoch": 5417} {"train_loss": -26.840112686157227, "global_step": 449684, "epoch": 5417} {"train_loss": -27.04559898376465, "global_step": 449685, "epoch": 5417} {"train_loss": -27.22907066345215, "global_step": 449686, "epoch": 5417} {"train_loss": -26.8978214263916, "global_step": 449687, "epoch": 5417} {"train_loss": -27.270374298095703, "global_step": 449688, "epoch": 5417} {"train_loss": -27.140689849853516, "global_step": 449689, "epoch": 5417} {"train_loss": -27.434499740600586, "global_step": 449690, "epoch": 5417} {"train_loss": -27.09686851501465, "global_step": 449691, "epoch": 5417} {"train_loss": -26.807920455932617, "global_step": 449692, "epoch": 5417} {"train_loss": -26.971701334757977, "global_step": 449693, "epoch": 5417, "val_loss": 6528861.0} {"train_loss": -26.8046932220459, "global_step": 449694, "epoch": 5418} {"train_loss": -26.457977294921875, "global_step": 449695, "epoch": 5418} {"train_loss": -26.763269424438477, "global_step": 449696, "epoch": 5418} {"train_loss": -26.50994300842285, "global_step": 449697, "epoch": 5418} {"train_loss": -27.011991500854492, "global_step": 449698, "epoch": 5418} {"train_loss": -26.858198165893555, "global_step": 449699, "epoch": 5418} {"train_loss": -26.979734420776367, "global_step": 449700, "epoch": 5418} {"train_loss": -26.6551456451416, "global_step": 449701, "epoch": 5418} {"train_loss": -26.49871826171875, "global_step": 449702, "epoch": 5418} {"train_loss": -26.827640533447266, "global_step": 449703, "epoch": 5418} {"train_loss": -26.827795028686523, "global_step": 449704, "epoch": 5418} {"train_loss": -26.859394073486328, "global_step": 449705, "epoch": 5418} {"train_loss": -26.34554100036621, "global_step": 449706, "epoch": 5418} {"train_loss": -26.90510368347168, "global_step": 449707, "epoch": 5418} {"train_loss": -26.8106632232666, "global_step": 449708, "epoch": 5418} {"train_loss": -27.0483455657959, "global_step": 449709, "epoch": 5418} {"train_loss": -26.858280181884766, "global_step": 449710, "epoch": 5418} {"train_loss": -26.91105079650879, "global_step": 449711, "epoch": 5418} {"train_loss": -26.845691680908203, "global_step": 449712, "epoch": 5418} {"train_loss": -26.44681167602539, "global_step": 449713, "epoch": 5418} {"train_loss": -26.792999267578125, "global_step": 449714, "epoch": 5418} {"train_loss": -26.872888565063477, "global_step": 449715, "epoch": 5418} {"train_loss": -26.145368576049805, "global_step": 449716, "epoch": 5418} {"train_loss": -26.618133544921875, "global_step": 449717, "epoch": 5418} {"train_loss": -27.1363468170166, "global_step": 449718, "epoch": 5418} {"train_loss": -26.970685958862305, "global_step": 449719, "epoch": 5418} {"train_loss": -26.6854305267334, "global_step": 449720, "epoch": 5418} {"train_loss": -27.075519561767578, "global_step": 449721, "epoch": 5418} {"train_loss": -26.5664119720459, "global_step": 449722, "epoch": 5418} {"train_loss": -26.909473419189453, "global_step": 449723, "epoch": 5418} {"train_loss": -26.89985466003418, "global_step": 449724, "epoch": 5418} {"train_loss": -27.122217178344727, "global_step": 449725, "epoch": 5418} {"train_loss": -27.14948844909668, "global_step": 449726, "epoch": 5418} {"train_loss": -26.876514434814453, "global_step": 449727, "epoch": 5418} {"train_loss": -27.369199752807617, "global_step": 449728, "epoch": 5418} {"train_loss": -26.90580177307129, "global_step": 449729, "epoch": 5418} {"train_loss": -27.143095016479492, "global_step": 449730, "epoch": 5418} {"train_loss": -26.808759689331055, "global_step": 449731, "epoch": 5418} {"train_loss": -27.139936447143555, "global_step": 449732, "epoch": 5418} {"train_loss": -26.766387939453125, "global_step": 449733, "epoch": 5418} {"train_loss": -26.657699584960938, "global_step": 449734, "epoch": 5418} {"train_loss": -27.036212921142578, "global_step": 449735, "epoch": 5418} {"train_loss": -27.30362892150879, "global_step": 449736, "epoch": 5418} {"train_loss": -27.01551628112793, "global_step": 449737, "epoch": 5418} {"train_loss": -26.809375762939453, "global_step": 449738, "epoch": 5418} {"train_loss": -27.080183029174805, "global_step": 449739, "epoch": 5418} {"train_loss": -26.7120304107666, "global_step": 449740, "epoch": 5418} {"train_loss": -27.08989906311035, "global_step": 449741, "epoch": 5418} {"train_loss": -27.315261840820312, "global_step": 449742, "epoch": 5418} {"train_loss": -27.231992721557617, "global_step": 449743, "epoch": 5418} {"train_loss": -27.06166648864746, "global_step": 449744, "epoch": 5418} {"train_loss": -26.794189453125, "global_step": 449745, "epoch": 5418} {"train_loss": -26.726409912109375, "global_step": 449746, "epoch": 5418} {"train_loss": -27.289630889892578, "global_step": 449747, "epoch": 5418} {"train_loss": -27.500104904174805, "global_step": 449748, "epoch": 5418} {"train_loss": -27.15252685546875, "global_step": 449749, "epoch": 5418} {"train_loss": -27.210363388061523, "global_step": 449750, "epoch": 5418} {"train_loss": -26.886032104492188, "global_step": 449751, "epoch": 5418} {"train_loss": -27.24091148376465, "global_step": 449752, "epoch": 5418} {"train_loss": -27.509475708007812, "global_step": 449753, "epoch": 5418} {"train_loss": -27.11962890625, "global_step": 449754, "epoch": 5418} {"train_loss": -27.073888778686523, "global_step": 449755, "epoch": 5418} {"train_loss": -27.058963775634766, "global_step": 449756, "epoch": 5418} {"train_loss": -27.30076026916504, "global_step": 449757, "epoch": 5418} {"train_loss": -27.421295166015625, "global_step": 449758, "epoch": 5418} {"train_loss": -26.811986923217773, "global_step": 449759, "epoch": 5418} {"train_loss": -26.8048152923584, "global_step": 449760, "epoch": 5418} {"train_loss": -26.96128273010254, "global_step": 449761, "epoch": 5418} {"train_loss": -26.960844039916992, "global_step": 449762, "epoch": 5418} {"train_loss": -26.903919219970703, "global_step": 449763, "epoch": 5418} {"train_loss": -27.236774444580078, "global_step": 449764, "epoch": 5418} {"train_loss": -26.721744537353516, "global_step": 449765, "epoch": 5418} {"train_loss": -26.925495147705078, "global_step": 449766, "epoch": 5418} {"train_loss": -26.750959396362305, "global_step": 449767, "epoch": 5418} {"train_loss": -26.786710739135742, "global_step": 449768, "epoch": 5418} {"train_loss": -27.335372924804688, "global_step": 449769, "epoch": 5418} {"train_loss": -27.118188858032227, "global_step": 449770, "epoch": 5418} {"train_loss": -26.30579948425293, "global_step": 449771, "epoch": 5418} {"train_loss": -26.690298080444336, "global_step": 449772, "epoch": 5418} {"train_loss": -27.006799697875977, "global_step": 449773, "epoch": 5418} {"train_loss": -27.1536865234375, "global_step": 449774, "epoch": 5418} {"train_loss": -26.724323272705078, "global_step": 449775, "epoch": 5418} {"train_loss": -26.934018767023662, "global_step": 449776, "epoch": 5418, "val_loss": 6567908.0} {"train_loss": -26.771692276000977, "global_step": 449777, "epoch": 5419} {"train_loss": -26.161291122436523, "global_step": 449778, "epoch": 5419} {"train_loss": -26.613691329956055, "global_step": 449779, "epoch": 5419} {"train_loss": -26.674137115478516, "global_step": 449780, "epoch": 5419} {"train_loss": -27.27058219909668, "global_step": 449781, "epoch": 5419} {"train_loss": -26.660253524780273, "global_step": 449782, "epoch": 5419} {"train_loss": -26.69063377380371, "global_step": 449783, "epoch": 5419} {"train_loss": -26.493017196655273, "global_step": 449784, "epoch": 5419} {"train_loss": -26.61297607421875, "global_step": 449785, "epoch": 5419} {"train_loss": -26.950063705444336, "global_step": 449786, "epoch": 5419} {"train_loss": -27.142553329467773, "global_step": 449787, "epoch": 5419} {"train_loss": -26.88129234313965, "global_step": 449788, "epoch": 5419} {"train_loss": -26.378042221069336, "global_step": 449789, "epoch": 5419} {"train_loss": -26.888355255126953, "global_step": 449790, "epoch": 5419} {"train_loss": -26.736026763916016, "global_step": 449791, "epoch": 5419} {"train_loss": -26.615262985229492, "global_step": 449792, "epoch": 5419} {"train_loss": -26.846054077148438, "global_step": 449793, "epoch": 5419} {"train_loss": -26.974889755249023, "global_step": 449794, "epoch": 5419} {"train_loss": -27.030118942260742, "global_step": 449795, "epoch": 5419} {"train_loss": -26.92450523376465, "global_step": 449796, "epoch": 5419} {"train_loss": -27.037261962890625, "global_step": 449797, "epoch": 5419} {"train_loss": -26.62050437927246, "global_step": 449798, "epoch": 5419} {"train_loss": -27.136474609375, "global_step": 449799, "epoch": 5419} {"train_loss": -26.8017520904541, "global_step": 449800, "epoch": 5419} {"train_loss": -26.71536636352539, "global_step": 449801, "epoch": 5419} {"train_loss": -27.182119369506836, "global_step": 449802, "epoch": 5419} {"train_loss": -27.30075454711914, "global_step": 449803, "epoch": 5419} {"train_loss": -26.890207290649414, "global_step": 449804, "epoch": 5419} {"train_loss": -27.24513053894043, "global_step": 449805, "epoch": 5419} {"train_loss": -26.7748966217041, "global_step": 449806, "epoch": 5419} {"train_loss": -27.02557945251465, "global_step": 449807, "epoch": 5419} {"train_loss": -27.002676010131836, "global_step": 449808, "epoch": 5419} {"train_loss": -26.90635108947754, "global_step": 449809, "epoch": 5419} {"train_loss": -26.976327896118164, "global_step": 449810, "epoch": 5419} {"train_loss": -27.360265731811523, "global_step": 449811, "epoch": 5419} {"train_loss": -27.183124542236328, "global_step": 449812, "epoch": 5419} {"train_loss": -27.18204116821289, "global_step": 449813, "epoch": 5419} {"train_loss": -27.27589225769043, "global_step": 449814, "epoch": 5419} {"train_loss": -26.69580078125, "global_step": 449815, "epoch": 5419} {"train_loss": -26.9901180267334, "global_step": 449816, "epoch": 5419} {"train_loss": -27.1954345703125, "global_step": 449817, "epoch": 5419} {"train_loss": -27.019683837890625, "global_step": 449818, "epoch": 5419} {"train_loss": -27.325597763061523, "global_step": 449819, "epoch": 5419} {"train_loss": -27.30792236328125, "global_step": 449820, "epoch": 5419} {"train_loss": -27.025104522705078, "global_step": 449821, "epoch": 5419} {"train_loss": -26.947614669799805, "global_step": 449822, "epoch": 5419} {"train_loss": -26.727014541625977, "global_step": 449823, "epoch": 5419} {"train_loss": -27.1909122467041, "global_step": 449824, "epoch": 5419} {"train_loss": -26.657012939453125, "global_step": 449825, "epoch": 5419} {"train_loss": -27.23638343811035, "global_step": 449826, "epoch": 5419} {"train_loss": -26.7003173828125, "global_step": 449827, "epoch": 5419} {"train_loss": -26.47492790222168, "global_step": 449828, "epoch": 5419} {"train_loss": -27.214323043823242, "global_step": 449829, "epoch": 5419} {"train_loss": -27.099353790283203, "global_step": 449830, "epoch": 5419} {"train_loss": -26.479154586791992, "global_step": 449831, "epoch": 5419} {"train_loss": -27.197574615478516, "global_step": 449832, "epoch": 5419} {"train_loss": -26.991846084594727, "global_step": 449833, "epoch": 5419} {"train_loss": -26.89688491821289, "global_step": 449834, "epoch": 5419} {"train_loss": -26.578882217407227, "global_step": 449835, "epoch": 5419} {"train_loss": -27.41016960144043, "global_step": 449836, "epoch": 5419} {"train_loss": -26.992523193359375, "global_step": 449837, "epoch": 5419} {"train_loss": -26.956953048706055, "global_step": 449838, "epoch": 5419} {"train_loss": -26.992368698120117, "global_step": 449839, "epoch": 5419} {"train_loss": -26.960071563720703, "global_step": 449840, "epoch": 5419} {"train_loss": -26.81689453125, "global_step": 449841, "epoch": 5419} {"train_loss": -27.1485652923584, "global_step": 449842, "epoch": 5419} {"train_loss": -27.286508560180664, "global_step": 449843, "epoch": 5419} {"train_loss": -26.7884521484375, "global_step": 449844, "epoch": 5419} {"train_loss": -27.061145782470703, "global_step": 449845, "epoch": 5419} {"train_loss": -27.33017349243164, "global_step": 449846, "epoch": 5419} {"train_loss": -26.72474479675293, "global_step": 449847, "epoch": 5419} {"train_loss": -26.834213256835938, "global_step": 449848, "epoch": 5419} {"train_loss": -27.2055721282959, "global_step": 449849, "epoch": 5419} {"train_loss": -26.82662010192871, "global_step": 449850, "epoch": 5419} {"train_loss": -26.9405517578125, "global_step": 449851, "epoch": 5419} {"train_loss": -26.72306251525879, "global_step": 449852, "epoch": 5419} {"train_loss": -26.886438369750977, "global_step": 449853, "epoch": 5419} {"train_loss": -27.052387237548828, "global_step": 449854, "epoch": 5419} {"train_loss": -27.04465675354004, "global_step": 449855, "epoch": 5419} {"train_loss": -27.1342716217041, "global_step": 449856, "epoch": 5419} {"train_loss": -27.04571533203125, "global_step": 449857, "epoch": 5419} {"train_loss": -27.234180450439453, "global_step": 449858, "epoch": 5419} {"train_loss": -26.953287630196076, "global_step": 449859, "epoch": 5419, "val_loss": 6524196.0} {"train_loss": -26.698347091674805, "global_step": 449860, "epoch": 5420} {"train_loss": -26.949899673461914, "global_step": 449861, "epoch": 5420} {"train_loss": -26.479475021362305, "global_step": 449862, "epoch": 5420} {"train_loss": -26.23257827758789, "global_step": 449863, "epoch": 5420} {"train_loss": -26.43265724182129, "global_step": 449864, "epoch": 5420} {"train_loss": -26.4530029296875, "global_step": 449865, "epoch": 5420} {"train_loss": -26.252050399780273, "global_step": 449866, "epoch": 5420} {"train_loss": -25.6645565032959, "global_step": 449867, "epoch": 5420} {"train_loss": -26.596715927124023, "global_step": 449868, "epoch": 5420} {"train_loss": -26.68816566467285, "global_step": 449869, "epoch": 5420} {"train_loss": -26.39975929260254, "global_step": 449870, "epoch": 5420} {"train_loss": -26.755945205688477, "global_step": 449871, "epoch": 5420} {"train_loss": -26.95441246032715, "global_step": 449872, "epoch": 5420} {"train_loss": -26.50274085998535, "global_step": 449873, "epoch": 5420} {"train_loss": -26.893285751342773, "global_step": 449874, "epoch": 5420} {"train_loss": -26.42226219177246, "global_step": 449875, "epoch": 5420} {"train_loss": -26.884368896484375, "global_step": 449876, "epoch": 5420} {"train_loss": -26.7619686126709, "global_step": 449877, "epoch": 5420} {"train_loss": -27.1975040435791, "global_step": 449878, "epoch": 5420} {"train_loss": -27.05579948425293, "global_step": 449879, "epoch": 5420} {"train_loss": -26.792816162109375, "global_step": 449880, "epoch": 5420} {"train_loss": -26.990589141845703, "global_step": 449881, "epoch": 5420} {"train_loss": -26.93828773498535, "global_step": 449882, "epoch": 5420} {"train_loss": -26.8573055267334, "global_step": 449883, "epoch": 5420} {"train_loss": -26.819013595581055, "global_step": 449884, "epoch": 5420} {"train_loss": -26.8478946685791, "global_step": 449885, "epoch": 5420} {"train_loss": -27.0817928314209, "global_step": 449886, "epoch": 5420} {"train_loss": -27.13385009765625, "global_step": 449887, "epoch": 5420} {"train_loss": -27.063222885131836, "global_step": 449888, "epoch": 5420} {"train_loss": -26.9688720703125, "global_step": 449889, "epoch": 5420} {"train_loss": -26.93989372253418, "global_step": 449890, "epoch": 5420} {"train_loss": -27.100614547729492, "global_step": 449891, "epoch": 5420} {"train_loss": -27.1027774810791, "global_step": 449892, "epoch": 5420} {"train_loss": -26.994619369506836, "global_step": 449893, "epoch": 5420} {"train_loss": -26.816333770751953, "global_step": 449894, "epoch": 5420} {"train_loss": -26.447660446166992, "global_step": 449895, "epoch": 5420} {"train_loss": -27.1098575592041, "global_step": 449896, "epoch": 5420} {"train_loss": -26.905597686767578, "global_step": 449897, "epoch": 5420} {"train_loss": -26.877227783203125, "global_step": 449898, "epoch": 5420} {"train_loss": -26.906147003173828, "global_step": 449899, "epoch": 5420} {"train_loss": -26.568984985351562, "global_step": 449900, "epoch": 5420} {"train_loss": -27.193029403686523, "global_step": 449901, "epoch": 5420} {"train_loss": -26.864288330078125, "global_step": 449902, "epoch": 5420} {"train_loss": -26.656530380249023, "global_step": 449903, "epoch": 5420} {"train_loss": -26.635944366455078, "global_step": 449904, "epoch": 5420} {"train_loss": -27.109058380126953, "global_step": 449905, "epoch": 5420} {"train_loss": -27.119983673095703, "global_step": 449906, "epoch": 5420} {"train_loss": -26.360803604125977, "global_step": 449907, "epoch": 5420} {"train_loss": -27.141691207885742, "global_step": 449908, "epoch": 5420} {"train_loss": -27.043781280517578, "global_step": 449909, "epoch": 5420} {"train_loss": -26.868844985961914, "global_step": 449910, "epoch": 5420} {"train_loss": -26.993635177612305, "global_step": 449911, "epoch": 5420} {"train_loss": -27.36213493347168, "global_step": 449912, "epoch": 5420} {"train_loss": -26.828638076782227, "global_step": 449913, "epoch": 5420} {"train_loss": -27.108810424804688, "global_step": 449914, "epoch": 5420} {"train_loss": -27.270450592041016, "global_step": 449915, "epoch": 5420} {"train_loss": -27.411584854125977, "global_step": 449916, "epoch": 5420} {"train_loss": -26.986114501953125, "global_step": 449917, "epoch": 5420} {"train_loss": -27.129392623901367, "global_step": 449918, "epoch": 5420} {"train_loss": -27.33062171936035, "global_step": 449919, "epoch": 5420} {"train_loss": -27.086851119995117, "global_step": 449920, "epoch": 5420} {"train_loss": -27.317922592163086, "global_step": 449921, "epoch": 5420} {"train_loss": -27.039722442626953, "global_step": 449922, "epoch": 5420} {"train_loss": -27.117828369140625, "global_step": 449923, "epoch": 5420} {"train_loss": -26.8765869140625, "global_step": 449924, "epoch": 5420} {"train_loss": -27.037246704101562, "global_step": 449925, "epoch": 5420} {"train_loss": -27.207157135009766, "global_step": 449926, "epoch": 5420} {"train_loss": -27.07161521911621, "global_step": 449927, "epoch": 5420} {"train_loss": -27.062597274780273, "global_step": 449928, "epoch": 5420} {"train_loss": -26.757665634155273, "global_step": 449929, "epoch": 5420} {"train_loss": -26.652923583984375, "global_step": 449930, "epoch": 5420} {"train_loss": -26.8236083984375, "global_step": 449931, "epoch": 5420} {"train_loss": -26.73418617248535, "global_step": 449932, "epoch": 5420} {"train_loss": -26.573301315307617, "global_step": 449933, "epoch": 5420} {"train_loss": -26.7016544342041, "global_step": 449934, "epoch": 5420} {"train_loss": -26.481399536132812, "global_step": 449935, "epoch": 5420} {"train_loss": -26.54178810119629, "global_step": 449936, "epoch": 5420} {"train_loss": -26.69305992126465, "global_step": 449937, "epoch": 5420} {"train_loss": -26.644031524658203, "global_step": 449938, "epoch": 5420} {"train_loss": -26.86456298828125, "global_step": 449939, "epoch": 5420} {"train_loss": -26.888864517211914, "global_step": 449940, "epoch": 5420} {"train_loss": -27.073638916015625, "global_step": 449941, "epoch": 5420} {"train_loss": -26.86322897026338, "global_step": 449942, "epoch": 5420, "val_loss": 6594151.0} {"train_loss": -26.291967391967773, "global_step": 449943, "epoch": 5421} {"train_loss": -26.78460693359375, "global_step": 449944, "epoch": 5421} {"train_loss": -26.821735382080078, "global_step": 449945, "epoch": 5421} {"train_loss": -26.510089874267578, "global_step": 449946, "epoch": 5421} {"train_loss": -26.885534286499023, "global_step": 449947, "epoch": 5421} {"train_loss": -26.809507369995117, "global_step": 449948, "epoch": 5421} {"train_loss": -26.89133071899414, "global_step": 449949, "epoch": 5421} {"train_loss": -26.79412269592285, "global_step": 449950, "epoch": 5421} {"train_loss": -26.84138298034668, "global_step": 449951, "epoch": 5421} {"train_loss": -26.96437644958496, "global_step": 449952, "epoch": 5421} {"train_loss": -26.823827743530273, "global_step": 449953, "epoch": 5421} {"train_loss": -26.654935836791992, "global_step": 449954, "epoch": 5421} {"train_loss": -26.57801628112793, "global_step": 449955, "epoch": 5421} {"train_loss": -26.72749137878418, "global_step": 449956, "epoch": 5421} {"train_loss": -26.682531356811523, "global_step": 449957, "epoch": 5421} {"train_loss": -26.555683135986328, "global_step": 449958, "epoch": 5421} {"train_loss": -26.422626495361328, "global_step": 449959, "epoch": 5421} {"train_loss": -26.733783721923828, "global_step": 449960, "epoch": 5421} {"train_loss": -26.642255783081055, "global_step": 449961, "epoch": 5421} {"train_loss": -26.840295791625977, "global_step": 449962, "epoch": 5421} {"train_loss": -27.22389793395996, "global_step": 449963, "epoch": 5421} {"train_loss": -26.970998764038086, "global_step": 449964, "epoch": 5421} {"train_loss": -26.72234535217285, "global_step": 449965, "epoch": 5421} {"train_loss": -26.947790145874023, "global_step": 449966, "epoch": 5421} {"train_loss": -26.943429946899414, "global_step": 449967, "epoch": 5421} {"train_loss": -27.205535888671875, "global_step": 449968, "epoch": 5421} {"train_loss": -26.936817169189453, "global_step": 449969, "epoch": 5421} {"train_loss": -26.83552360534668, "global_step": 449970, "epoch": 5421} {"train_loss": -26.823110580444336, "global_step": 449971, "epoch": 5421} {"train_loss": -27.032306671142578, "global_step": 449972, "epoch": 5421} {"train_loss": -26.99184226989746, "global_step": 449973, "epoch": 5421} {"train_loss": -27.065250396728516, "global_step": 449974, "epoch": 5421} {"train_loss": -26.905227661132812, "global_step": 449975, "epoch": 5421} {"train_loss": -27.01026725769043, "global_step": 449976, "epoch": 5421} {"train_loss": -27.04610252380371, "global_step": 449977, "epoch": 5421} {"train_loss": -26.962820053100586, "global_step": 449978, "epoch": 5421} {"train_loss": -27.175207138061523, "global_step": 449979, "epoch": 5421} {"train_loss": -27.08609390258789, "global_step": 449980, "epoch": 5421} {"train_loss": -27.409168243408203, "global_step": 449981, "epoch": 5421} {"train_loss": -27.148635864257812, "global_step": 449982, "epoch": 5421} {"train_loss": -26.9713191986084, "global_step": 449983, "epoch": 5421} {"train_loss": -26.9177303314209, "global_step": 449984, "epoch": 5421} {"train_loss": -27.204120635986328, "global_step": 449985, "epoch": 5421} {"train_loss": -27.208555221557617, "global_step": 449986, "epoch": 5421} {"train_loss": -26.987079620361328, "global_step": 449987, "epoch": 5421} {"train_loss": -26.977270126342773, "global_step": 449988, "epoch": 5421} {"train_loss": -26.890625, "global_step": 449989, "epoch": 5421} {"train_loss": -26.751724243164062, "global_step": 449990, "epoch": 5421} {"train_loss": -26.8339900970459, "global_step": 449991, "epoch": 5421} {"train_loss": -26.919055938720703, "global_step": 449992, "epoch": 5421} {"train_loss": -27.084686279296875, "global_step": 449993, "epoch": 5421} {"train_loss": -27.513402938842773, "global_step": 449994, "epoch": 5421} {"train_loss": -26.697629928588867, "global_step": 449995, "epoch": 5421} {"train_loss": -26.734243392944336, "global_step": 449996, "epoch": 5421} {"train_loss": -26.537097930908203, "global_step": 449997, "epoch": 5421} {"train_loss": -27.254697799682617, "global_step": 449998, "epoch": 5421} {"train_loss": -26.846349716186523, "global_step": 449999, "epoch": 5421} {"train_loss": -26.903106689453125, "global_step": 450000, "epoch": 5421} {"train_loss": -27.16730308532715, "global_step": 450001, "epoch": 5421} {"train_loss": -26.99598503112793, "global_step": 450002, "epoch": 5421} {"train_loss": -26.50514030456543, "global_step": 450003, "epoch": 5421} {"train_loss": -26.61573600769043, "global_step": 450004, "epoch": 5421} {"train_loss": -27.17698097229004, "global_step": 450005, "epoch": 5421} {"train_loss": -27.027454376220703, "global_step": 450006, "epoch": 5421} {"train_loss": -27.19732666015625, "global_step": 450007, "epoch": 5421} {"train_loss": -27.13688087463379, "global_step": 450008, "epoch": 5421} {"train_loss": -26.943735122680664, "global_step": 450009, "epoch": 5421} {"train_loss": -26.838871002197266, "global_step": 450010, "epoch": 5421} {"train_loss": -26.8895206451416, "global_step": 450011, "epoch": 5421} {"train_loss": -27.0948543548584, "global_step": 450012, "epoch": 5421} {"train_loss": -27.239288330078125, "global_step": 450013, "epoch": 5421} {"train_loss": -27.176671981811523, "global_step": 450014, "epoch": 5421} {"train_loss": -27.17323112487793, "global_step": 450015, "epoch": 5421} {"train_loss": -27.415851593017578, "global_step": 450016, "epoch": 5421} {"train_loss": -27.348560333251953, "global_step": 450017, "epoch": 5421} {"train_loss": -27.203876495361328, "global_step": 450018, "epoch": 5421} {"train_loss": -26.705612182617188, "global_step": 450019, "epoch": 5421} {"train_loss": -27.025684356689453, "global_step": 450020, "epoch": 5421} {"train_loss": -27.125701904296875, "global_step": 450021, "epoch": 5421} {"train_loss": -27.095102310180664, "global_step": 450022, "epoch": 5421} {"train_loss": -27.276647567749023, "global_step": 450023, "epoch": 5421} {"train_loss": -27.20560646057129, "global_step": 450024, "epoch": 5421} {"train_loss": -26.968302623335138, "global_step": 450025, "epoch": 5421, "val_loss": 6541710.0} {"train_loss": -25.7683162689209, "global_step": 450026, "epoch": 5422} {"train_loss": -26.364843368530273, "global_step": 450027, "epoch": 5422} {"train_loss": -26.667240142822266, "global_step": 450028, "epoch": 5422} {"train_loss": -25.688617706298828, "global_step": 450029, "epoch": 5422} {"train_loss": -25.71839714050293, "global_step": 450030, "epoch": 5422} {"train_loss": -26.5355167388916, "global_step": 450031, "epoch": 5422} {"train_loss": -25.899219512939453, "global_step": 450032, "epoch": 5422} {"train_loss": -25.87018394470215, "global_step": 450033, "epoch": 5422} {"train_loss": -26.58989906311035, "global_step": 450034, "epoch": 5422} {"train_loss": -26.18417739868164, "global_step": 450035, "epoch": 5422} {"train_loss": -26.8824405670166, "global_step": 450036, "epoch": 5422} {"train_loss": -26.37288475036621, "global_step": 450037, "epoch": 5422} {"train_loss": -26.63959312438965, "global_step": 450038, "epoch": 5422} {"train_loss": -26.70246696472168, "global_step": 450039, "epoch": 5422} {"train_loss": -26.189050674438477, "global_step": 450040, "epoch": 5422} {"train_loss": -26.78693199157715, "global_step": 450041, "epoch": 5422} {"train_loss": -26.7408447265625, "global_step": 450042, "epoch": 5422} {"train_loss": -26.63410758972168, "global_step": 450043, "epoch": 5422} {"train_loss": -26.983123779296875, "global_step": 450044, "epoch": 5422} {"train_loss": -26.816131591796875, "global_step": 450045, "epoch": 5422} {"train_loss": -27.04387855529785, "global_step": 450046, "epoch": 5422} {"train_loss": -26.721515655517578, "global_step": 450047, "epoch": 5422} {"train_loss": -27.13264274597168, "global_step": 450048, "epoch": 5422} {"train_loss": -26.63232421875, "global_step": 450049, "epoch": 5422} {"train_loss": -27.053022384643555, "global_step": 450050, "epoch": 5422} {"train_loss": -26.767292022705078, "global_step": 450051, "epoch": 5422} {"train_loss": -26.953046798706055, "global_step": 450052, "epoch": 5422} {"train_loss": -26.872156143188477, "global_step": 450053, "epoch": 5422} {"train_loss": -26.818349838256836, "global_step": 450054, "epoch": 5422} {"train_loss": -26.968488693237305, "global_step": 450055, "epoch": 5422} {"train_loss": -26.893909454345703, "global_step": 450056, "epoch": 5422} {"train_loss": -26.762042999267578, "global_step": 450057, "epoch": 5422} {"train_loss": -26.89344596862793, "global_step": 450058, "epoch": 5422} {"train_loss": -27.07757568359375, "global_step": 450059, "epoch": 5422} {"train_loss": -27.037031173706055, "global_step": 450060, "epoch": 5422} {"train_loss": -26.79860496520996, "global_step": 450061, "epoch": 5422} {"train_loss": -27.066650390625, "global_step": 450062, "epoch": 5422} {"train_loss": -27.35700798034668, "global_step": 450063, "epoch": 5422} {"train_loss": -27.001983642578125, "global_step": 450064, "epoch": 5422} {"train_loss": -27.007307052612305, "global_step": 450065, "epoch": 5422} {"train_loss": -26.87580680847168, "global_step": 450066, "epoch": 5422} {"train_loss": -27.237873077392578, "global_step": 450067, "epoch": 5422} {"train_loss": -27.22346305847168, "global_step": 450068, "epoch": 5422} {"train_loss": -27.23895835876465, "global_step": 450069, "epoch": 5422} {"train_loss": -27.31790542602539, "global_step": 450070, "epoch": 5422} {"train_loss": -27.152484893798828, "global_step": 450071, "epoch": 5422} {"train_loss": -27.542057037353516, "global_step": 450072, "epoch": 5422} {"train_loss": -27.331281661987305, "global_step": 450073, "epoch": 5422} {"train_loss": -26.730579376220703, "global_step": 450074, "epoch": 5422} {"train_loss": -27.5864200592041, "global_step": 450075, "epoch": 5422} {"train_loss": -27.04534339904785, "global_step": 450076, "epoch": 5422} {"train_loss": -27.0391845703125, "global_step": 450077, "epoch": 5422} {"train_loss": -27.230024337768555, "global_step": 450078, "epoch": 5422} {"train_loss": -27.324628829956055, "global_step": 450079, "epoch": 5422} {"train_loss": -27.271909713745117, "global_step": 450080, "epoch": 5422} {"train_loss": -27.227436065673828, "global_step": 450081, "epoch": 5422} {"train_loss": -27.059940338134766, "global_step": 450082, "epoch": 5422} {"train_loss": -27.342304229736328, "global_step": 450083, "epoch": 5422} {"train_loss": -27.01978874206543, "global_step": 450084, "epoch": 5422} {"train_loss": -27.041303634643555, "global_step": 450085, "epoch": 5422} {"train_loss": -27.141921997070312, "global_step": 450086, "epoch": 5422} {"train_loss": -27.270648956298828, "global_step": 450087, "epoch": 5422} {"train_loss": -26.99696159362793, "global_step": 450088, "epoch": 5422} {"train_loss": -27.241300582885742, "global_step": 450089, "epoch": 5422} {"train_loss": -27.34982681274414, "global_step": 450090, "epoch": 5422} {"train_loss": -26.932153701782227, "global_step": 450091, "epoch": 5422} {"train_loss": -27.0220890045166, "global_step": 450092, "epoch": 5422} {"train_loss": -27.1345272064209, "global_step": 450093, "epoch": 5422} {"train_loss": -27.108789443969727, "global_step": 450094, "epoch": 5422} {"train_loss": -26.89092445373535, "global_step": 450095, "epoch": 5422} {"train_loss": -27.24480628967285, "global_step": 450096, "epoch": 5422} {"train_loss": -27.139448165893555, "global_step": 450097, "epoch": 5422} {"train_loss": -27.149829864501953, "global_step": 450098, "epoch": 5422} {"train_loss": -26.98145866394043, "global_step": 450099, "epoch": 5422} {"train_loss": -26.798267364501953, "global_step": 450100, "epoch": 5422} {"train_loss": -26.376001358032227, "global_step": 450101, "epoch": 5422} {"train_loss": -25.29169273376465, "global_step": 450102, "epoch": 5422} {"train_loss": -23.714082717895508, "global_step": 450103, "epoch": 5422} {"train_loss": -24.20819664001465, "global_step": 450104, "epoch": 5422} {"train_loss": -26.20692253112793, "global_step": 450105, "epoch": 5422} {"train_loss": -26.068811416625977, "global_step": 450106, "epoch": 5422} {"train_loss": -26.263696670532227, "global_step": 450107, "epoch": 5422} {"train_loss": -26.75571632385254, "global_step": 450108, "epoch": 5422, "val_loss": 6587352.0} {"train_loss": -25.234663009643555, "global_step": 450109, "epoch": 5423} {"train_loss": -25.232982635498047, "global_step": 450110, "epoch": 5423} {"train_loss": -25.497238159179688, "global_step": 450111, "epoch": 5423} {"train_loss": -25.343961715698242, "global_step": 450112, "epoch": 5423} {"train_loss": -25.622766494750977, "global_step": 450113, "epoch": 5423} {"train_loss": -25.804899215698242, "global_step": 450114, "epoch": 5423} {"train_loss": -25.550256729125977, "global_step": 450115, "epoch": 5423} {"train_loss": -25.879989624023438, "global_step": 450116, "epoch": 5423} {"train_loss": -26.240549087524414, "global_step": 450117, "epoch": 5423} {"train_loss": -25.83125114440918, "global_step": 450118, "epoch": 5423} {"train_loss": -25.421262741088867, "global_step": 450119, "epoch": 5423} {"train_loss": -26.353729248046875, "global_step": 450120, "epoch": 5423} {"train_loss": -25.845626831054688, "global_step": 450121, "epoch": 5423} {"train_loss": -25.919235229492188, "global_step": 450122, "epoch": 5423} {"train_loss": -26.262908935546875, "global_step": 450123, "epoch": 5423} {"train_loss": -26.1928653717041, "global_step": 450124, "epoch": 5423} {"train_loss": -26.071882247924805, "global_step": 450125, "epoch": 5423} {"train_loss": -25.744171142578125, "global_step": 450126, "epoch": 5423} {"train_loss": -26.377172470092773, "global_step": 450127, "epoch": 5423} {"train_loss": -26.184818267822266, "global_step": 450128, "epoch": 5423} {"train_loss": -26.69817543029785, "global_step": 450129, "epoch": 5423} {"train_loss": -26.229461669921875, "global_step": 450130, "epoch": 5423} {"train_loss": -26.565088272094727, "global_step": 450131, "epoch": 5423} {"train_loss": -26.22360610961914, "global_step": 450132, "epoch": 5423} {"train_loss": -26.89529800415039, "global_step": 450133, "epoch": 5423} {"train_loss": -26.37469482421875, "global_step": 450134, "epoch": 5423} {"train_loss": -26.482458114624023, "global_step": 450135, "epoch": 5423} {"train_loss": -26.465911865234375, "global_step": 450136, "epoch": 5423} {"train_loss": -26.584033966064453, "global_step": 450137, "epoch": 5423} {"train_loss": -26.835254669189453, "global_step": 450138, "epoch": 5423} {"train_loss": -26.859296798706055, "global_step": 450139, "epoch": 5423} {"train_loss": -27.101123809814453, "global_step": 450140, "epoch": 5423} {"train_loss": -26.689590454101562, "global_step": 450141, "epoch": 5423} {"train_loss": -26.752370834350586, "global_step": 450142, "epoch": 5423} {"train_loss": -26.9886417388916, "global_step": 450143, "epoch": 5423} {"train_loss": -26.9979305267334, "global_step": 450144, "epoch": 5423} {"train_loss": -26.858800888061523, "global_step": 450145, "epoch": 5423} {"train_loss": -26.688684463500977, "global_step": 450146, "epoch": 5423} {"train_loss": -26.95966148376465, "global_step": 450147, "epoch": 5423} {"train_loss": -26.31451988220215, "global_step": 450148, "epoch": 5423} {"train_loss": -27.019315719604492, "global_step": 450149, "epoch": 5423} {"train_loss": -26.9947509765625, "global_step": 450150, "epoch": 5423} {"train_loss": -26.479440689086914, "global_step": 450151, "epoch": 5423} {"train_loss": -27.121545791625977, "global_step": 450152, "epoch": 5423} {"train_loss": -26.568227767944336, "global_step": 450153, "epoch": 5423} {"train_loss": -27.070356369018555, "global_step": 450154, "epoch": 5423} {"train_loss": -27.24480628967285, "global_step": 450155, "epoch": 5423} {"train_loss": -26.906652450561523, "global_step": 450156, "epoch": 5423} {"train_loss": -27.367725372314453, "global_step": 450157, "epoch": 5423} {"train_loss": -26.78610610961914, "global_step": 450158, "epoch": 5423} {"train_loss": -27.072065353393555, "global_step": 450159, "epoch": 5423} {"train_loss": -27.109729766845703, "global_step": 450160, "epoch": 5423} {"train_loss": -26.917072296142578, "global_step": 450161, "epoch": 5423} {"train_loss": -27.07447624206543, "global_step": 450162, "epoch": 5423} {"train_loss": -27.076648712158203, "global_step": 450163, "epoch": 5423} {"train_loss": -26.915103912353516, "global_step": 450164, "epoch": 5423} {"train_loss": -27.178354263305664, "global_step": 450165, "epoch": 5423} {"train_loss": -27.49260902404785, "global_step": 450166, "epoch": 5423} {"train_loss": -27.40382957458496, "global_step": 450167, "epoch": 5423} {"train_loss": -26.970319747924805, "global_step": 450168, "epoch": 5423} {"train_loss": -27.106922149658203, "global_step": 450169, "epoch": 5423} {"train_loss": -27.406131744384766, "global_step": 450170, "epoch": 5423} {"train_loss": -27.296716690063477, "global_step": 450171, "epoch": 5423} {"train_loss": -26.806293487548828, "global_step": 450172, "epoch": 5423} {"train_loss": -27.53920555114746, "global_step": 450173, "epoch": 5423} {"train_loss": -27.52378273010254, "global_step": 450174, "epoch": 5423} {"train_loss": -27.7699031829834, "global_step": 450175, "epoch": 5423} {"train_loss": -27.112192153930664, "global_step": 450176, "epoch": 5423} {"train_loss": -26.951440811157227, "global_step": 450177, "epoch": 5423} {"train_loss": -26.820409774780273, "global_step": 450178, "epoch": 5423} {"train_loss": -27.14583396911621, "global_step": 450179, "epoch": 5423} {"train_loss": -26.763446807861328, "global_step": 450180, "epoch": 5423} {"train_loss": -27.074615478515625, "global_step": 450181, "epoch": 5423} {"train_loss": -27.36728286743164, "global_step": 450182, "epoch": 5423} {"train_loss": -26.69733238220215, "global_step": 450183, "epoch": 5423} {"train_loss": -27.079938888549805, "global_step": 450184, "epoch": 5423} {"train_loss": -27.09564781188965, "global_step": 450185, "epoch": 5423} {"train_loss": -26.950637817382812, "global_step": 450186, "epoch": 5423} {"train_loss": -26.55510902404785, "global_step": 450187, "epoch": 5423} {"train_loss": -26.615610122680664, "global_step": 450188, "epoch": 5423} {"train_loss": -26.596973419189453, "global_step": 450189, "epoch": 5423} {"train_loss": -27.1384220123291, "global_step": 450190, "epoch": 5423} {"train_loss": -26.66981901605445, "global_step": 450191, "epoch": 5423, "val_loss": 6643141.0} {"train_loss": -24.855796813964844, "global_step": 450192, "epoch": 5424} {"train_loss": -25.35009765625, "global_step": 450193, "epoch": 5424} {"train_loss": -25.918262481689453, "global_step": 450194, "epoch": 5424} {"train_loss": -25.483421325683594, "global_step": 450195, "epoch": 5424} {"train_loss": -25.867151260375977, "global_step": 450196, "epoch": 5424} {"train_loss": -25.37530517578125, "global_step": 450197, "epoch": 5424} {"train_loss": -25.7282657623291, "global_step": 450198, "epoch": 5424} {"train_loss": -25.882308959960938, "global_step": 450199, "epoch": 5424} {"train_loss": -25.898649215698242, "global_step": 450200, "epoch": 5424} {"train_loss": -26.513883590698242, "global_step": 450201, "epoch": 5424} {"train_loss": -26.264633178710938, "global_step": 450202, "epoch": 5424} {"train_loss": -26.492572784423828, "global_step": 450203, "epoch": 5424} {"train_loss": -26.52923011779785, "global_step": 450204, "epoch": 5424} {"train_loss": -26.33387565612793, "global_step": 450205, "epoch": 5424} {"train_loss": -26.41071891784668, "global_step": 450206, "epoch": 5424} {"train_loss": -26.366453170776367, "global_step": 450207, "epoch": 5424} {"train_loss": -26.243778228759766, "global_step": 450208, "epoch": 5424} {"train_loss": -26.882476806640625, "global_step": 450209, "epoch": 5424} {"train_loss": -26.524682998657227, "global_step": 450210, "epoch": 5424} {"train_loss": -26.308883666992188, "global_step": 450211, "epoch": 5424} {"train_loss": -26.51789665222168, "global_step": 450212, "epoch": 5424} {"train_loss": -26.415313720703125, "global_step": 450213, "epoch": 5424} {"train_loss": -26.574262619018555, "global_step": 450214, "epoch": 5424} {"train_loss": -26.543384552001953, "global_step": 450215, "epoch": 5424} {"train_loss": -26.717199325561523, "global_step": 450216, "epoch": 5424} {"train_loss": -26.53826904296875, "global_step": 450217, "epoch": 5424} {"train_loss": -26.956769943237305, "global_step": 450218, "epoch": 5424} {"train_loss": -26.442840576171875, "global_step": 450219, "epoch": 5424} {"train_loss": -26.696115493774414, "global_step": 450220, "epoch": 5424} {"train_loss": -26.698171615600586, "global_step": 450221, "epoch": 5424} {"train_loss": -26.639881134033203, "global_step": 450222, "epoch": 5424} {"train_loss": -27.059049606323242, "global_step": 450223, "epoch": 5424} {"train_loss": -27.25116539001465, "global_step": 450224, "epoch": 5424} {"train_loss": -26.8593692779541, "global_step": 450225, "epoch": 5424} {"train_loss": -27.364776611328125, "global_step": 450226, "epoch": 5424} {"train_loss": -26.997968673706055, "global_step": 450227, "epoch": 5424} {"train_loss": -27.027851104736328, "global_step": 450228, "epoch": 5424} {"train_loss": -26.82032585144043, "global_step": 450229, "epoch": 5424} {"train_loss": -26.739532470703125, "global_step": 450230, "epoch": 5424} {"train_loss": -27.274768829345703, "global_step": 450231, "epoch": 5424} {"train_loss": -27.011335372924805, "global_step": 450232, "epoch": 5424} {"train_loss": -26.912220001220703, "global_step": 450233, "epoch": 5424} {"train_loss": -26.888385772705078, "global_step": 450234, "epoch": 5424} {"train_loss": -27.189172744750977, "global_step": 450235, "epoch": 5424} {"train_loss": -26.926593780517578, "global_step": 450236, "epoch": 5424} {"train_loss": -27.047332763671875, "global_step": 450237, "epoch": 5424} {"train_loss": -27.155414581298828, "global_step": 450238, "epoch": 5424} {"train_loss": -27.172515869140625, "global_step": 450239, "epoch": 5424} {"train_loss": -27.096181869506836, "global_step": 450240, "epoch": 5424} {"train_loss": -27.5703125, "global_step": 450241, "epoch": 5424} {"train_loss": -27.043548583984375, "global_step": 450242, "epoch": 5424} {"train_loss": -26.86576271057129, "global_step": 450243, "epoch": 5424} {"train_loss": -26.9822998046875, "global_step": 450244, "epoch": 5424} {"train_loss": -27.292978286743164, "global_step": 450245, "epoch": 5424} {"train_loss": -27.160175323486328, "global_step": 450246, "epoch": 5424} {"train_loss": -26.983108520507812, "global_step": 450247, "epoch": 5424} {"train_loss": -27.13313102722168, "global_step": 450248, "epoch": 5424} {"train_loss": -27.09795570373535, "global_step": 450249, "epoch": 5424} {"train_loss": -27.197858810424805, "global_step": 450250, "epoch": 5424} {"train_loss": -27.22381019592285, "global_step": 450251, "epoch": 5424} {"train_loss": -27.162946701049805, "global_step": 450252, "epoch": 5424} {"train_loss": -26.8958740234375, "global_step": 450253, "epoch": 5424} {"train_loss": -26.64383316040039, "global_step": 450254, "epoch": 5424} {"train_loss": -26.874820709228516, "global_step": 450255, "epoch": 5424} {"train_loss": -27.35272216796875, "global_step": 450256, "epoch": 5424} {"train_loss": -27.246337890625, "global_step": 450257, "epoch": 5424} {"train_loss": -26.741010665893555, "global_step": 450258, "epoch": 5424} {"train_loss": -26.8579044342041, "global_step": 450259, "epoch": 5424} {"train_loss": -26.612030029296875, "global_step": 450260, "epoch": 5424} {"train_loss": -26.900959014892578, "global_step": 450261, "epoch": 5424} {"train_loss": -26.734161376953125, "global_step": 450262, "epoch": 5424} {"train_loss": -27.36553955078125, "global_step": 450263, "epoch": 5424} {"train_loss": -27.0506534576416, "global_step": 450264, "epoch": 5424} {"train_loss": -26.54304313659668, "global_step": 450265, "epoch": 5424} {"train_loss": -26.838104248046875, "global_step": 450266, "epoch": 5424} {"train_loss": -26.873733520507812, "global_step": 450267, "epoch": 5424} {"train_loss": -27.179122924804688, "global_step": 450268, "epoch": 5424} {"train_loss": -27.14786148071289, "global_step": 450269, "epoch": 5424} {"train_loss": -27.091474533081055, "global_step": 450270, "epoch": 5424} {"train_loss": -26.70649528503418, "global_step": 450271, "epoch": 5424} {"train_loss": -26.650293350219727, "global_step": 450272, "epoch": 5424} {"train_loss": -27.10282325744629, "global_step": 450273, "epoch": 5424} {"train_loss": -26.72368284018643, "global_step": 450274, "epoch": 5424, "val_loss": 6516711.5} {"train_loss": -26.617340087890625, "global_step": 450275, "epoch": 5425} {"train_loss": -25.723066329956055, "global_step": 450276, "epoch": 5425} {"train_loss": -25.835119247436523, "global_step": 450277, "epoch": 5425} {"train_loss": -26.447126388549805, "global_step": 450278, "epoch": 5425} {"train_loss": -26.414342880249023, "global_step": 450279, "epoch": 5425} {"train_loss": -26.414579391479492, "global_step": 450280, "epoch": 5425} {"train_loss": -26.67194938659668, "global_step": 450281, "epoch": 5425} {"train_loss": -26.480512619018555, "global_step": 450282, "epoch": 5425} {"train_loss": -26.765222549438477, "global_step": 450283, "epoch": 5425} {"train_loss": -26.521244049072266, "global_step": 450284, "epoch": 5425} {"train_loss": -26.636022567749023, "global_step": 450285, "epoch": 5425} {"train_loss": -26.556127548217773, "global_step": 450286, "epoch": 5425} {"train_loss": -26.95383644104004, "global_step": 450287, "epoch": 5425} {"train_loss": -26.220325469970703, "global_step": 450288, "epoch": 5425} {"train_loss": -26.5643310546875, "global_step": 450289, "epoch": 5425} {"train_loss": -26.65199851989746, "global_step": 450290, "epoch": 5425} {"train_loss": -26.402185440063477, "global_step": 450291, "epoch": 5425} {"train_loss": -26.98404312133789, "global_step": 450292, "epoch": 5425} {"train_loss": -26.770328521728516, "global_step": 450293, "epoch": 5425} {"train_loss": -26.854272842407227, "global_step": 450294, "epoch": 5425} {"train_loss": -26.8005428314209, "global_step": 450295, "epoch": 5425} {"train_loss": -26.664709091186523, "global_step": 450296, "epoch": 5425} {"train_loss": -26.530675888061523, "global_step": 450297, "epoch": 5425} {"train_loss": -27.044179916381836, "global_step": 450298, "epoch": 5425} {"train_loss": -27.038223266601562, "global_step": 450299, "epoch": 5425} {"train_loss": -27.083959579467773, "global_step": 450300, "epoch": 5425} {"train_loss": -27.235260009765625, "global_step": 450301, "epoch": 5425} {"train_loss": -27.007131576538086, "global_step": 450302, "epoch": 5425} {"train_loss": -26.402013778686523, "global_step": 450303, "epoch": 5425} {"train_loss": -26.822067260742188, "global_step": 450304, "epoch": 5425} {"train_loss": -26.92194175720215, "global_step": 450305, "epoch": 5425} {"train_loss": -27.22163200378418, "global_step": 450306, "epoch": 5425} {"train_loss": -26.664966583251953, "global_step": 450307, "epoch": 5425} {"train_loss": -27.146326065063477, "global_step": 450308, "epoch": 5425} {"train_loss": -27.410888671875, "global_step": 450309, "epoch": 5425} {"train_loss": -27.49587059020996, "global_step": 450310, "epoch": 5425} {"train_loss": -27.297870635986328, "global_step": 450311, "epoch": 5425} {"train_loss": -27.2524356842041, "global_step": 450312, "epoch": 5425} {"train_loss": -27.04852867126465, "global_step": 450313, "epoch": 5425} {"train_loss": -26.914173126220703, "global_step": 450314, "epoch": 5425} {"train_loss": -27.14166259765625, "global_step": 450315, "epoch": 5425} {"train_loss": -27.081159591674805, "global_step": 450316, "epoch": 5425} {"train_loss": -27.450056076049805, "global_step": 450317, "epoch": 5425} {"train_loss": -27.030155181884766, "global_step": 450318, "epoch": 5425} {"train_loss": -27.355127334594727, "global_step": 450319, "epoch": 5425} {"train_loss": -27.161712646484375, "global_step": 450320, "epoch": 5425} {"train_loss": -27.1982479095459, "global_step": 450321, "epoch": 5425} {"train_loss": -27.2819766998291, "global_step": 450322, "epoch": 5425} {"train_loss": -27.45145606994629, "global_step": 450323, "epoch": 5425} {"train_loss": -27.262451171875, "global_step": 450324, "epoch": 5425} {"train_loss": -27.337194442749023, "global_step": 450325, "epoch": 5425} {"train_loss": -26.941816329956055, "global_step": 450326, "epoch": 5425} {"train_loss": -26.96539306640625, "global_step": 450327, "epoch": 5425} {"train_loss": -26.82376480102539, "global_step": 450328, "epoch": 5425} {"train_loss": -26.64222526550293, "global_step": 450329, "epoch": 5425} {"train_loss": -27.050628662109375, "global_step": 450330, "epoch": 5425} {"train_loss": -27.505878448486328, "global_step": 450331, "epoch": 5425} {"train_loss": -27.211872100830078, "global_step": 450332, "epoch": 5425} {"train_loss": -27.2980899810791, "global_step": 450333, "epoch": 5425} {"train_loss": -27.31095314025879, "global_step": 450334, "epoch": 5425} {"train_loss": -27.051712036132812, "global_step": 450335, "epoch": 5425} {"train_loss": -27.054473876953125, "global_step": 450336, "epoch": 5425} {"train_loss": -27.092945098876953, "global_step": 450337, "epoch": 5425} {"train_loss": -27.043304443359375, "global_step": 450338, "epoch": 5425} {"train_loss": -27.13883399963379, "global_step": 450339, "epoch": 5425} {"train_loss": -27.33699607849121, "global_step": 450340, "epoch": 5425} {"train_loss": -27.210607528686523, "global_step": 450341, "epoch": 5425} {"train_loss": -27.40997314453125, "global_step": 450342, "epoch": 5425} {"train_loss": -27.526792526245117, "global_step": 450343, "epoch": 5425} {"train_loss": -26.883481979370117, "global_step": 450344, "epoch": 5425} {"train_loss": -26.906696319580078, "global_step": 450345, "epoch": 5425} {"train_loss": -27.074804306030273, "global_step": 450346, "epoch": 5425} {"train_loss": -26.128965377807617, "global_step": 450347, "epoch": 5425} {"train_loss": -25.571561813354492, "global_step": 450348, "epoch": 5425} {"train_loss": -25.648040771484375, "global_step": 450349, "epoch": 5425} {"train_loss": -26.2627010345459, "global_step": 450350, "epoch": 5425} {"train_loss": -26.392866134643555, "global_step": 450351, "epoch": 5425} {"train_loss": -26.416671752929688, "global_step": 450352, "epoch": 5425} {"train_loss": -26.472990036010742, "global_step": 450353, "epoch": 5425} {"train_loss": -26.133380889892578, "global_step": 450354, "epoch": 5425} {"train_loss": -26.996118545532227, "global_step": 450355, "epoch": 5425} {"train_loss": -26.661298751831055, "global_step": 450356, "epoch": 5425} {"train_loss": -26.866583697767144, "global_step": 450357, "epoch": 5425, "val_loss": 6593717.0} {"train_loss": -25.931371688842773, "global_step": 450358, "epoch": 5426} {"train_loss": -26.61227798461914, "global_step": 450359, "epoch": 5426} {"train_loss": -26.140274047851562, "global_step": 450360, "epoch": 5426} {"train_loss": -26.60650634765625, "global_step": 450361, "epoch": 5426} {"train_loss": -26.267667770385742, "global_step": 450362, "epoch": 5426} {"train_loss": -26.368398666381836, "global_step": 450363, "epoch": 5426} {"train_loss": -26.338428497314453, "global_step": 450364, "epoch": 5426} {"train_loss": -26.416025161743164, "global_step": 450365, "epoch": 5426} {"train_loss": -26.47626304626465, "global_step": 450366, "epoch": 5426} {"train_loss": -26.82331657409668, "global_step": 450367, "epoch": 5426} {"train_loss": -26.39584732055664, "global_step": 450368, "epoch": 5426} {"train_loss": -26.527481079101562, "global_step": 450369, "epoch": 5426} {"train_loss": -26.452106475830078, "global_step": 450370, "epoch": 5426} {"train_loss": -26.613210678100586, "global_step": 450371, "epoch": 5426} {"train_loss": -26.5612735748291, "global_step": 450372, "epoch": 5426} {"train_loss": -26.774946212768555, "global_step": 450373, "epoch": 5426} {"train_loss": -26.85682487487793, "global_step": 450374, "epoch": 5426} {"train_loss": -26.860639572143555, "global_step": 450375, "epoch": 5426} {"train_loss": -26.89004898071289, "global_step": 450376, "epoch": 5426} {"train_loss": -26.789203643798828, "global_step": 450377, "epoch": 5426} {"train_loss": -26.723663330078125, "global_step": 450378, "epoch": 5426} {"train_loss": -26.63368034362793, "global_step": 450379, "epoch": 5426} {"train_loss": -27.087018966674805, "global_step": 450380, "epoch": 5426} {"train_loss": -26.69058609008789, "global_step": 450381, "epoch": 5426} {"train_loss": -26.776203155517578, "global_step": 450382, "epoch": 5426} {"train_loss": -27.007558822631836, "global_step": 450383, "epoch": 5426} {"train_loss": -26.835540771484375, "global_step": 450384, "epoch": 5426} {"train_loss": -27.058862686157227, "global_step": 450385, "epoch": 5426} {"train_loss": -27.099760055541992, "global_step": 450386, "epoch": 5426} {"train_loss": -27.048664093017578, "global_step": 450387, "epoch": 5426} {"train_loss": -27.14691162109375, "global_step": 450388, "epoch": 5426} {"train_loss": -26.99655532836914, "global_step": 450389, "epoch": 5426} {"train_loss": -27.00764274597168, "global_step": 450390, "epoch": 5426} {"train_loss": -26.73077392578125, "global_step": 450391, "epoch": 5426} {"train_loss": -26.8901424407959, "global_step": 450392, "epoch": 5426} {"train_loss": -27.152929306030273, "global_step": 450393, "epoch": 5426} {"train_loss": -27.40459632873535, "global_step": 450394, "epoch": 5426} {"train_loss": -26.940122604370117, "global_step": 450395, "epoch": 5426} {"train_loss": -27.246429443359375, "global_step": 450396, "epoch": 5426} {"train_loss": -27.255523681640625, "global_step": 450397, "epoch": 5426} {"train_loss": -26.867414474487305, "global_step": 450398, "epoch": 5426} {"train_loss": -26.932214736938477, "global_step": 450399, "epoch": 5426} {"train_loss": -27.154462814331055, "global_step": 450400, "epoch": 5426} {"train_loss": -27.267797470092773, "global_step": 450401, "epoch": 5426} {"train_loss": -27.6434326171875, "global_step": 450402, "epoch": 5426} {"train_loss": -27.463293075561523, "global_step": 450403, "epoch": 5426} {"train_loss": -27.4652099609375, "global_step": 450404, "epoch": 5426} {"train_loss": -26.885162353515625, "global_step": 450405, "epoch": 5426} {"train_loss": -27.011091232299805, "global_step": 450406, "epoch": 5426} {"train_loss": -27.051746368408203, "global_step": 450407, "epoch": 5426} {"train_loss": -27.04275894165039, "global_step": 450408, "epoch": 5426} {"train_loss": -27.095006942749023, "global_step": 450409, "epoch": 5426} {"train_loss": -27.0542049407959, "global_step": 450410, "epoch": 5426} {"train_loss": -27.41583824157715, "global_step": 450411, "epoch": 5426} {"train_loss": -26.982757568359375, "global_step": 450412, "epoch": 5426} {"train_loss": -27.228668212890625, "global_step": 450413, "epoch": 5426} {"train_loss": -27.477466583251953, "global_step": 450414, "epoch": 5426} {"train_loss": -27.262510299682617, "global_step": 450415, "epoch": 5426} {"train_loss": -27.47768211364746, "global_step": 450416, "epoch": 5426} {"train_loss": -27.643774032592773, "global_step": 450417, "epoch": 5426} {"train_loss": -27.370742797851562, "global_step": 450418, "epoch": 5426} {"train_loss": -27.334674835205078, "global_step": 450419, "epoch": 5426} {"train_loss": -27.229156494140625, "global_step": 450420, "epoch": 5426} {"train_loss": -26.850635528564453, "global_step": 450421, "epoch": 5426} {"train_loss": -27.22552490234375, "global_step": 450422, "epoch": 5426} {"train_loss": -26.90234375, "global_step": 450423, "epoch": 5426} {"train_loss": -27.086074829101562, "global_step": 450424, "epoch": 5426} {"train_loss": -26.864831924438477, "global_step": 450425, "epoch": 5426} {"train_loss": -26.806049346923828, "global_step": 450426, "epoch": 5426} {"train_loss": -27.081602096557617, "global_step": 450427, "epoch": 5426} {"train_loss": -26.90378189086914, "global_step": 450428, "epoch": 5426} {"train_loss": -26.862409591674805, "global_step": 450429, "epoch": 5426} {"train_loss": -27.228918075561523, "global_step": 450430, "epoch": 5426} {"train_loss": -27.294635772705078, "global_step": 450431, "epoch": 5426} {"train_loss": -27.06263542175293, "global_step": 450432, "epoch": 5426} {"train_loss": -26.730093002319336, "global_step": 450433, "epoch": 5426} {"train_loss": -27.190494537353516, "global_step": 450434, "epoch": 5426} {"train_loss": -26.737289428710938, "global_step": 450435, "epoch": 5426} {"train_loss": -27.040699005126953, "global_step": 450436, "epoch": 5426} {"train_loss": -26.879514694213867, "global_step": 450437, "epoch": 5426} {"train_loss": -27.289459228515625, "global_step": 450438, "epoch": 5426} {"train_loss": -26.836490631103516, "global_step": 450439, "epoch": 5426} {"train_loss": -26.941999826086573, "global_step": 450440, "epoch": 5426, "val_loss": 6459599.0} {"train_loss": -26.4375057220459, "global_step": 450441, "epoch": 5427} {"train_loss": -26.72104835510254, "global_step": 450442, "epoch": 5427} {"train_loss": -26.67559814453125, "global_step": 450443, "epoch": 5427} {"train_loss": -26.97376823425293, "global_step": 450444, "epoch": 5427} {"train_loss": -26.614709854125977, "global_step": 450445, "epoch": 5427} {"train_loss": -26.4202823638916, "global_step": 450446, "epoch": 5427} {"train_loss": -26.81549644470215, "global_step": 450447, "epoch": 5427} {"train_loss": -26.691394805908203, "global_step": 450448, "epoch": 5427} {"train_loss": -26.63405418395996, "global_step": 450449, "epoch": 5427} {"train_loss": -26.803945541381836, "global_step": 450450, "epoch": 5427} {"train_loss": -26.54267692565918, "global_step": 450451, "epoch": 5427} {"train_loss": -26.289365768432617, "global_step": 450452, "epoch": 5427} {"train_loss": -26.857833862304688, "global_step": 450453, "epoch": 5427} {"train_loss": -26.66839599609375, "global_step": 450454, "epoch": 5427} {"train_loss": -26.602005004882812, "global_step": 450455, "epoch": 5427} {"train_loss": -26.89153480529785, "global_step": 450456, "epoch": 5427} {"train_loss": -26.426843643188477, "global_step": 450457, "epoch": 5427} {"train_loss": -27.109189987182617, "global_step": 450458, "epoch": 5427} {"train_loss": -27.082014083862305, "global_step": 450459, "epoch": 5427} {"train_loss": -26.8265323638916, "global_step": 450460, "epoch": 5427} {"train_loss": -26.732229232788086, "global_step": 450461, "epoch": 5427} {"train_loss": -27.004108428955078, "global_step": 450462, "epoch": 5427} {"train_loss": -27.11338233947754, "global_step": 450463, "epoch": 5427} {"train_loss": -27.118030548095703, "global_step": 450464, "epoch": 5427} {"train_loss": -26.78230094909668, "global_step": 450465, "epoch": 5427} {"train_loss": -26.73748207092285, "global_step": 450466, "epoch": 5427} {"train_loss": -27.24908447265625, "global_step": 450467, "epoch": 5427} {"train_loss": -27.180078506469727, "global_step": 450468, "epoch": 5427} {"train_loss": -26.572677612304688, "global_step": 450469, "epoch": 5427} {"train_loss": -27.0689640045166, "global_step": 450470, "epoch": 5427} {"train_loss": -26.953155517578125, "global_step": 450471, "epoch": 5427} {"train_loss": -26.925668716430664, "global_step": 450472, "epoch": 5427} {"train_loss": -27.333179473876953, "global_step": 450473, "epoch": 5427} {"train_loss": -26.8028621673584, "global_step": 450474, "epoch": 5427} {"train_loss": -27.267892837524414, "global_step": 450475, "epoch": 5427} {"train_loss": -27.154632568359375, "global_step": 450476, "epoch": 5427} {"train_loss": -26.75482177734375, "global_step": 450477, "epoch": 5427} {"train_loss": -27.038740158081055, "global_step": 450478, "epoch": 5427} {"train_loss": -27.215246200561523, "global_step": 450479, "epoch": 5427} {"train_loss": -27.06696891784668, "global_step": 450480, "epoch": 5427} {"train_loss": -26.970401763916016, "global_step": 450481, "epoch": 5427} {"train_loss": -27.068456649780273, "global_step": 450482, "epoch": 5427} {"train_loss": -27.394453048706055, "global_step": 450483, "epoch": 5427} {"train_loss": -27.133264541625977, "global_step": 450484, "epoch": 5427} {"train_loss": -27.17258644104004, "global_step": 450485, "epoch": 5427} {"train_loss": -27.16497802734375, "global_step": 450486, "epoch": 5427} {"train_loss": -27.0610294342041, "global_step": 450487, "epoch": 5427} {"train_loss": -27.047468185424805, "global_step": 450488, "epoch": 5427} {"train_loss": -26.975555419921875, "global_step": 450489, "epoch": 5427} {"train_loss": -27.456567764282227, "global_step": 450490, "epoch": 5427} {"train_loss": -26.888412475585938, "global_step": 450491, "epoch": 5427} {"train_loss": -26.98944664001465, "global_step": 450492, "epoch": 5427} {"train_loss": -27.104406356811523, "global_step": 450493, "epoch": 5427} {"train_loss": -27.23731803894043, "global_step": 450494, "epoch": 5427} {"train_loss": -27.063161849975586, "global_step": 450495, "epoch": 5427} {"train_loss": -27.15264320373535, "global_step": 450496, "epoch": 5427} {"train_loss": -27.08846092224121, "global_step": 450497, "epoch": 5427} {"train_loss": -26.959461212158203, "global_step": 450498, "epoch": 5427} {"train_loss": -27.0765323638916, "global_step": 450499, "epoch": 5427} {"train_loss": -27.07924461364746, "global_step": 450500, "epoch": 5427} {"train_loss": -26.908933639526367, "global_step": 450501, "epoch": 5427} {"train_loss": -27.300445556640625, "global_step": 450502, "epoch": 5427} {"train_loss": -27.320180892944336, "global_step": 450503, "epoch": 5427} {"train_loss": -27.0084285736084, "global_step": 450504, "epoch": 5427} {"train_loss": -27.373138427734375, "global_step": 450505, "epoch": 5427} {"train_loss": -27.277408599853516, "global_step": 450506, "epoch": 5427} {"train_loss": -27.303836822509766, "global_step": 450507, "epoch": 5427} {"train_loss": -26.75690269470215, "global_step": 450508, "epoch": 5427} {"train_loss": -26.936777114868164, "global_step": 450509, "epoch": 5427} {"train_loss": -26.015552520751953, "global_step": 450510, "epoch": 5427} {"train_loss": -25.8429012298584, "global_step": 450511, "epoch": 5427} {"train_loss": -25.725915908813477, "global_step": 450512, "epoch": 5427} {"train_loss": -25.93328285217285, "global_step": 450513, "epoch": 5427} {"train_loss": -26.3216495513916, "global_step": 450514, "epoch": 5427} {"train_loss": -26.40472984313965, "global_step": 450515, "epoch": 5427} {"train_loss": -26.436237335205078, "global_step": 450516, "epoch": 5427} {"train_loss": -25.88990592956543, "global_step": 450517, "epoch": 5427} {"train_loss": -26.540029525756836, "global_step": 450518, "epoch": 5427} {"train_loss": -26.580413818359375, "global_step": 450519, "epoch": 5427} {"train_loss": -26.66415786743164, "global_step": 450520, "epoch": 5427} {"train_loss": -26.30405044555664, "global_step": 450521, "epoch": 5427} {"train_loss": -26.56672477722168, "global_step": 450522, "epoch": 5427} {"train_loss": -26.854738993817065, "global_step": 450523, "epoch": 5427, "val_loss": 6560113.0} {"train_loss": -26.500486373901367, "global_step": 450524, "epoch": 5428} {"train_loss": -26.006622314453125, "global_step": 450525, "epoch": 5428} {"train_loss": -25.624897003173828, "global_step": 450526, "epoch": 5428} {"train_loss": -26.058195114135742, "global_step": 450527, "epoch": 5428} {"train_loss": -25.590312957763672, "global_step": 450528, "epoch": 5428} {"train_loss": -26.070234298706055, "global_step": 450529, "epoch": 5428} {"train_loss": -26.495380401611328, "global_step": 450530, "epoch": 5428} {"train_loss": -26.39813232421875, "global_step": 450531, "epoch": 5428} {"train_loss": -26.304418563842773, "global_step": 450532, "epoch": 5428} {"train_loss": -26.146833419799805, "global_step": 450533, "epoch": 5428} {"train_loss": -26.323820114135742, "global_step": 450534, "epoch": 5428} {"train_loss": -26.62460708618164, "global_step": 450535, "epoch": 5428} {"train_loss": -26.568756103515625, "global_step": 450536, "epoch": 5428} {"train_loss": -26.594411849975586, "global_step": 450537, "epoch": 5428} {"train_loss": -26.22968864440918, "global_step": 450538, "epoch": 5428} {"train_loss": -26.22356605529785, "global_step": 450539, "epoch": 5428} {"train_loss": -26.500085830688477, "global_step": 450540, "epoch": 5428} {"train_loss": -26.632055282592773, "global_step": 450541, "epoch": 5428} {"train_loss": -26.490814208984375, "global_step": 450542, "epoch": 5428} {"train_loss": -26.643598556518555, "global_step": 450543, "epoch": 5428} {"train_loss": -26.854421615600586, "global_step": 450544, "epoch": 5428} {"train_loss": -26.566709518432617, "global_step": 450545, "epoch": 5428} {"train_loss": -27.055044174194336, "global_step": 450546, "epoch": 5428} {"train_loss": -26.878585815429688, "global_step": 450547, "epoch": 5428} {"train_loss": -26.89181900024414, "global_step": 450548, "epoch": 5428} {"train_loss": -26.747766494750977, "global_step": 450549, "epoch": 5428} {"train_loss": -27.345911026000977, "global_step": 450550, "epoch": 5428} {"train_loss": -26.590728759765625, "global_step": 450551, "epoch": 5428} {"train_loss": -26.96466064453125, "global_step": 450552, "epoch": 5428} {"train_loss": -26.7596378326416, "global_step": 450553, "epoch": 5428} {"train_loss": -26.824630737304688, "global_step": 450554, "epoch": 5428} {"train_loss": -27.513275146484375, "global_step": 450555, "epoch": 5428} {"train_loss": -26.8432674407959, "global_step": 450556, "epoch": 5428} {"train_loss": -26.949634552001953, "global_step": 450557, "epoch": 5428} {"train_loss": -27.057071685791016, "global_step": 450558, "epoch": 5428} {"train_loss": -27.2160701751709, "global_step": 450559, "epoch": 5428} {"train_loss": -27.521512985229492, "global_step": 450560, "epoch": 5428} {"train_loss": -27.055906295776367, "global_step": 450561, "epoch": 5428} {"train_loss": -26.905654907226562, "global_step": 450562, "epoch": 5428} {"train_loss": -27.182758331298828, "global_step": 450563, "epoch": 5428} {"train_loss": -27.172460556030273, "global_step": 450564, "epoch": 5428} {"train_loss": -27.05802345275879, "global_step": 450565, "epoch": 5428} {"train_loss": -27.118749618530273, "global_step": 450566, "epoch": 5428} {"train_loss": -27.103498458862305, "global_step": 450567, "epoch": 5428} {"train_loss": -26.630889892578125, "global_step": 450568, "epoch": 5428} {"train_loss": -27.07032585144043, "global_step": 450569, "epoch": 5428} {"train_loss": -26.74069595336914, "global_step": 450570, "epoch": 5428} {"train_loss": -27.12116050720215, "global_step": 450571, "epoch": 5428} {"train_loss": -27.102066040039062, "global_step": 450572, "epoch": 5428} {"train_loss": -27.171833038330078, "global_step": 450573, "epoch": 5428} {"train_loss": -27.17262077331543, "global_step": 450574, "epoch": 5428} {"train_loss": -27.028961181640625, "global_step": 450575, "epoch": 5428} {"train_loss": -26.936132431030273, "global_step": 450576, "epoch": 5428} {"train_loss": -26.73114013671875, "global_step": 450577, "epoch": 5428} {"train_loss": -27.12504005432129, "global_step": 450578, "epoch": 5428} {"train_loss": -26.631702423095703, "global_step": 450579, "epoch": 5428} {"train_loss": -27.162765502929688, "global_step": 450580, "epoch": 5428} {"train_loss": -26.81488037109375, "global_step": 450581, "epoch": 5428} {"train_loss": -27.121780395507812, "global_step": 450582, "epoch": 5428} {"train_loss": -27.113174438476562, "global_step": 450583, "epoch": 5428} {"train_loss": -27.26783561706543, "global_step": 450584, "epoch": 5428} {"train_loss": -27.34930992126465, "global_step": 450585, "epoch": 5428} {"train_loss": -26.584705352783203, "global_step": 450586, "epoch": 5428} {"train_loss": -26.776464462280273, "global_step": 450587, "epoch": 5428} {"train_loss": -26.81068229675293, "global_step": 450588, "epoch": 5428} {"train_loss": -27.251068115234375, "global_step": 450589, "epoch": 5428} {"train_loss": -27.252166748046875, "global_step": 450590, "epoch": 5428} {"train_loss": -27.008344650268555, "global_step": 450591, "epoch": 5428} {"train_loss": -27.342756271362305, "global_step": 450592, "epoch": 5428} {"train_loss": -27.356225967407227, "global_step": 450593, "epoch": 5428} {"train_loss": -27.50507164001465, "global_step": 450594, "epoch": 5428} {"train_loss": -26.879653930664062, "global_step": 450595, "epoch": 5428} {"train_loss": -27.738683700561523, "global_step": 450596, "epoch": 5428} {"train_loss": -27.286291122436523, "global_step": 450597, "epoch": 5428} {"train_loss": -26.975427627563477, "global_step": 450598, "epoch": 5428} {"train_loss": -27.377838134765625, "global_step": 450599, "epoch": 5428} {"train_loss": -26.91505241394043, "global_step": 450600, "epoch": 5428} {"train_loss": -27.287118911743164, "global_step": 450601, "epoch": 5428} {"train_loss": -27.085102081298828, "global_step": 450602, "epoch": 5428} {"train_loss": -26.7481689453125, "global_step": 450603, "epoch": 5428} {"train_loss": -26.847501754760742, "global_step": 450604, "epoch": 5428} {"train_loss": -27.534626007080078, "global_step": 450605, "epoch": 5428} {"train_loss": -26.860668067472528, "global_step": 450606, "epoch": 5428, "val_loss": 6560822.0} {"train_loss": -26.687097549438477, "global_step": 450607, "epoch": 5429} {"train_loss": -26.179065704345703, "global_step": 450608, "epoch": 5429} {"train_loss": -26.013608932495117, "global_step": 450609, "epoch": 5429} {"train_loss": -26.591873168945312, "global_step": 450610, "epoch": 5429} {"train_loss": -26.63470458984375, "global_step": 450611, "epoch": 5429} {"train_loss": -26.375959396362305, "global_step": 450612, "epoch": 5429} {"train_loss": -26.569067001342773, "global_step": 450613, "epoch": 5429} {"train_loss": -26.596633911132812, "global_step": 450614, "epoch": 5429} {"train_loss": -26.718505859375, "global_step": 450615, "epoch": 5429} {"train_loss": -26.753843307495117, "global_step": 450616, "epoch": 5429} {"train_loss": -26.5084228515625, "global_step": 450617, "epoch": 5429} {"train_loss": -25.987506866455078, "global_step": 450618, "epoch": 5429} {"train_loss": -27.20778465270996, "global_step": 450619, "epoch": 5429} {"train_loss": -26.870031356811523, "global_step": 450620, "epoch": 5429} {"train_loss": -27.13020896911621, "global_step": 450621, "epoch": 5429} {"train_loss": -26.569320678710938, "global_step": 450622, "epoch": 5429} {"train_loss": -26.854406356811523, "global_step": 450623, "epoch": 5429} {"train_loss": -26.900959014892578, "global_step": 450624, "epoch": 5429} {"train_loss": -26.712743759155273, "global_step": 450625, "epoch": 5429} {"train_loss": -27.180639266967773, "global_step": 450626, "epoch": 5429} {"train_loss": -26.92667007446289, "global_step": 450627, "epoch": 5429} {"train_loss": -26.8123836517334, "global_step": 450628, "epoch": 5429} {"train_loss": -26.98870277404785, "global_step": 450629, "epoch": 5429} {"train_loss": -26.990066528320312, "global_step": 450630, "epoch": 5429} {"train_loss": -26.793813705444336, "global_step": 450631, "epoch": 5429} {"train_loss": -27.080068588256836, "global_step": 450632, "epoch": 5429} {"train_loss": -27.311735153198242, "global_step": 450633, "epoch": 5429} {"train_loss": -27.145339965820312, "global_step": 450634, "epoch": 5429} {"train_loss": -27.128149032592773, "global_step": 450635, "epoch": 5429} {"train_loss": -27.030248641967773, "global_step": 450636, "epoch": 5429} {"train_loss": -27.30059242248535, "global_step": 450637, "epoch": 5429} {"train_loss": -26.811267852783203, "global_step": 450638, "epoch": 5429} {"train_loss": -27.1263370513916, "global_step": 450639, "epoch": 5429} {"train_loss": -27.16449546813965, "global_step": 450640, "epoch": 5429} {"train_loss": -27.151412963867188, "global_step": 450641, "epoch": 5429} {"train_loss": -26.99550437927246, "global_step": 450642, "epoch": 5429} {"train_loss": -26.98063087463379, "global_step": 450643, "epoch": 5429} {"train_loss": -27.269681930541992, "global_step": 450644, "epoch": 5429} {"train_loss": -27.112049102783203, "global_step": 450645, "epoch": 5429} {"train_loss": -27.25125503540039, "global_step": 450646, "epoch": 5429} {"train_loss": -27.201251983642578, "global_step": 450647, "epoch": 5429} {"train_loss": -26.757795333862305, "global_step": 450648, "epoch": 5429} {"train_loss": -26.211135864257812, "global_step": 450649, "epoch": 5429} {"train_loss": -26.33091163635254, "global_step": 450650, "epoch": 5429} {"train_loss": -26.874866485595703, "global_step": 450651, "epoch": 5429} {"train_loss": -26.991479873657227, "global_step": 450652, "epoch": 5429} {"train_loss": -26.56092643737793, "global_step": 450653, "epoch": 5429} {"train_loss": -26.74078941345215, "global_step": 450654, "epoch": 5429} {"train_loss": -26.777570724487305, "global_step": 450655, "epoch": 5429} {"train_loss": -26.9479923248291, "global_step": 450656, "epoch": 5429} {"train_loss": -27.014917373657227, "global_step": 450657, "epoch": 5429} {"train_loss": -27.078794479370117, "global_step": 450658, "epoch": 5429} {"train_loss": -26.761188507080078, "global_step": 450659, "epoch": 5429} {"train_loss": -26.958921432495117, "global_step": 450660, "epoch": 5429} {"train_loss": -27.421222686767578, "global_step": 450661, "epoch": 5429} {"train_loss": -27.34671974182129, "global_step": 450662, "epoch": 5429} {"train_loss": -26.699308395385742, "global_step": 450663, "epoch": 5429} {"train_loss": -26.786334991455078, "global_step": 450664, "epoch": 5429} {"train_loss": -27.166278839111328, "global_step": 450665, "epoch": 5429} {"train_loss": -26.986042022705078, "global_step": 450666, "epoch": 5429} {"train_loss": -27.283390045166016, "global_step": 450667, "epoch": 5429} {"train_loss": -27.153284072875977, "global_step": 450668, "epoch": 5429} {"train_loss": -27.238616943359375, "global_step": 450669, "epoch": 5429} {"train_loss": -27.264509201049805, "global_step": 450670, "epoch": 5429} {"train_loss": -27.468862533569336, "global_step": 450671, "epoch": 5429} {"train_loss": -27.14198875427246, "global_step": 450672, "epoch": 5429} {"train_loss": -27.34388542175293, "global_step": 450673, "epoch": 5429} {"train_loss": -27.125314712524414, "global_step": 450674, "epoch": 5429} {"train_loss": -27.566511154174805, "global_step": 450675, "epoch": 5429} {"train_loss": -26.65082359313965, "global_step": 450676, "epoch": 5429} {"train_loss": -26.79498863220215, "global_step": 450677, "epoch": 5429} {"train_loss": -26.727344512939453, "global_step": 450678, "epoch": 5429} {"train_loss": -26.509033203125, "global_step": 450679, "epoch": 5429} {"train_loss": -26.21522331237793, "global_step": 450680, "epoch": 5429} {"train_loss": -25.620813369750977, "global_step": 450681, "epoch": 5429} {"train_loss": -26.468000411987305, "global_step": 450682, "epoch": 5429} {"train_loss": -26.542041778564453, "global_step": 450683, "epoch": 5429} {"train_loss": -26.926427841186523, "global_step": 450684, "epoch": 5429} {"train_loss": -25.789600372314453, "global_step": 450685, "epoch": 5429} {"train_loss": -26.366010665893555, "global_step": 450686, "epoch": 5429} {"train_loss": -26.544641494750977, "global_step": 450687, "epoch": 5429} {"train_loss": -26.254608154296875, "global_step": 450688, "epoch": 5429} {"train_loss": -26.823243060743952, "global_step": 450689, "epoch": 5429, "val_loss": 6531426.0} {"train_loss": -26.311044692993164, "global_step": 450690, "epoch": 5430} {"train_loss": -25.497400283813477, "global_step": 450691, "epoch": 5430} {"train_loss": -26.276601791381836, "global_step": 450692, "epoch": 5430} {"train_loss": -26.489490509033203, "global_step": 450693, "epoch": 5430} {"train_loss": -26.28269386291504, "global_step": 450694, "epoch": 5430} {"train_loss": -26.681684494018555, "global_step": 450695, "epoch": 5430} {"train_loss": -26.096912384033203, "global_step": 450696, "epoch": 5430} {"train_loss": -26.4730224609375, "global_step": 450697, "epoch": 5430} {"train_loss": -26.417264938354492, "global_step": 450698, "epoch": 5430} {"train_loss": -26.3512020111084, "global_step": 450699, "epoch": 5430} {"train_loss": -26.70855140686035, "global_step": 450700, "epoch": 5430} {"train_loss": -26.63248062133789, "global_step": 450701, "epoch": 5430} {"train_loss": -26.91737174987793, "global_step": 450702, "epoch": 5430} {"train_loss": -26.747522354125977, "global_step": 450703, "epoch": 5430} {"train_loss": -26.63787841796875, "global_step": 450704, "epoch": 5430} {"train_loss": -26.461042404174805, "global_step": 450705, "epoch": 5430} {"train_loss": -26.799518585205078, "global_step": 450706, "epoch": 5430} {"train_loss": -26.54819679260254, "global_step": 450707, "epoch": 5430} {"train_loss": -26.53885269165039, "global_step": 450708, "epoch": 5430} {"train_loss": -26.38435173034668, "global_step": 450709, "epoch": 5430} {"train_loss": -26.964319229125977, "global_step": 450710, "epoch": 5430} {"train_loss": -26.57264518737793, "global_step": 450711, "epoch": 5430} {"train_loss": -26.71477699279785, "global_step": 450712, "epoch": 5430} {"train_loss": -26.8397274017334, "global_step": 450713, "epoch": 5430} {"train_loss": -26.698827743530273, "global_step": 450714, "epoch": 5430} {"train_loss": -26.480026245117188, "global_step": 450715, "epoch": 5430} {"train_loss": -26.929418563842773, "global_step": 450716, "epoch": 5430} {"train_loss": -26.920001983642578, "global_step": 450717, "epoch": 5430} {"train_loss": -26.84577751159668, "global_step": 450718, "epoch": 5430} {"train_loss": -27.017181396484375, "global_step": 450719, "epoch": 5430} {"train_loss": -26.7454833984375, "global_step": 450720, "epoch": 5430} {"train_loss": -27.157428741455078, "global_step": 450721, "epoch": 5430} {"train_loss": -26.809326171875, "global_step": 450722, "epoch": 5430} {"train_loss": -27.11297035217285, "global_step": 450723, "epoch": 5430} {"train_loss": -26.8703556060791, "global_step": 450724, "epoch": 5430} {"train_loss": -27.075393676757812, "global_step": 450725, "epoch": 5430} {"train_loss": -26.563955307006836, "global_step": 450726, "epoch": 5430} {"train_loss": -26.836139678955078, "global_step": 450727, "epoch": 5430} {"train_loss": -27.122711181640625, "global_step": 450728, "epoch": 5430} {"train_loss": -26.937469482421875, "global_step": 450729, "epoch": 5430} {"train_loss": -27.222280502319336, "global_step": 450730, "epoch": 5430} {"train_loss": -27.090728759765625, "global_step": 450731, "epoch": 5430} {"train_loss": -27.037841796875, "global_step": 450732, "epoch": 5430} {"train_loss": -27.182571411132812, "global_step": 450733, "epoch": 5430} {"train_loss": -27.333906173706055, "global_step": 450734, "epoch": 5430} {"train_loss": -27.475727081298828, "global_step": 450735, "epoch": 5430} {"train_loss": -27.309717178344727, "global_step": 450736, "epoch": 5430} {"train_loss": -27.379072189331055, "global_step": 450737, "epoch": 5430} {"train_loss": -27.397363662719727, "global_step": 450738, "epoch": 5430} {"train_loss": -27.353809356689453, "global_step": 450739, "epoch": 5430} {"train_loss": -27.365270614624023, "global_step": 450740, "epoch": 5430} {"train_loss": -27.239643096923828, "global_step": 450741, "epoch": 5430} {"train_loss": -26.953882217407227, "global_step": 450742, "epoch": 5430} {"train_loss": -26.653594970703125, "global_step": 450743, "epoch": 5430} {"train_loss": -26.710269927978516, "global_step": 450744, "epoch": 5430} {"train_loss": -27.4200439453125, "global_step": 450745, "epoch": 5430} {"train_loss": -27.176410675048828, "global_step": 450746, "epoch": 5430} {"train_loss": -27.04524803161621, "global_step": 450747, "epoch": 5430} {"train_loss": -26.74604606628418, "global_step": 450748, "epoch": 5430} {"train_loss": -26.55059242248535, "global_step": 450749, "epoch": 5430} {"train_loss": -26.862070083618164, "global_step": 450750, "epoch": 5430} {"train_loss": -26.873340606689453, "global_step": 450751, "epoch": 5430} {"train_loss": -27.018827438354492, "global_step": 450752, "epoch": 5430} {"train_loss": -26.53076171875, "global_step": 450753, "epoch": 5430} {"train_loss": -26.7393856048584, "global_step": 450754, "epoch": 5430} {"train_loss": -26.93634033203125, "global_step": 450755, "epoch": 5430} {"train_loss": -26.832361221313477, "global_step": 450756, "epoch": 5430} {"train_loss": -26.906295776367188, "global_step": 450757, "epoch": 5430} {"train_loss": -26.989110946655273, "global_step": 450758, "epoch": 5430} {"train_loss": -27.156370162963867, "global_step": 450759, "epoch": 5430} {"train_loss": -27.2320499420166, "global_step": 450760, "epoch": 5430} {"train_loss": -27.2128849029541, "global_step": 450761, "epoch": 5430} {"train_loss": -27.20441246032715, "global_step": 450762, "epoch": 5430} {"train_loss": -26.937387466430664, "global_step": 450763, "epoch": 5430} {"train_loss": -26.931320190429688, "global_step": 450764, "epoch": 5430} {"train_loss": -27.41228675842285, "global_step": 450765, "epoch": 5430} {"train_loss": -27.202274322509766, "global_step": 450766, "epoch": 5430} {"train_loss": -27.06267738342285, "global_step": 450767, "epoch": 5430} {"train_loss": -27.36090660095215, "global_step": 450768, "epoch": 5430} {"train_loss": -26.89150047302246, "global_step": 450769, "epoch": 5430} {"train_loss": -27.098081588745117, "global_step": 450770, "epoch": 5430} {"train_loss": -26.865055084228516, "global_step": 450771, "epoch": 5430} {"train_loss": -26.87318475562406, "global_step": 450772, "epoch": 5430, "val_loss": 6537870.5} {"train_loss": -26.795331954956055, "global_step": 450773, "epoch": 5431} {"train_loss": -26.922239303588867, "global_step": 450774, "epoch": 5431} {"train_loss": -27.017087936401367, "global_step": 450775, "epoch": 5431} {"train_loss": -26.31597900390625, "global_step": 450776, "epoch": 5431} {"train_loss": -26.727283477783203, "global_step": 450777, "epoch": 5431} {"train_loss": -26.41963005065918, "global_step": 450778, "epoch": 5431} {"train_loss": -26.885522842407227, "global_step": 450779, "epoch": 5431} {"train_loss": -26.576324462890625, "global_step": 450780, "epoch": 5431} {"train_loss": -26.940540313720703, "global_step": 450781, "epoch": 5431} {"train_loss": -26.61359977722168, "global_step": 450782, "epoch": 5431} {"train_loss": -26.984588623046875, "global_step": 450783, "epoch": 5431} {"train_loss": -27.172189712524414, "global_step": 450784, "epoch": 5431} {"train_loss": -26.881338119506836, "global_step": 450785, "epoch": 5431} {"train_loss": -26.59958267211914, "global_step": 450786, "epoch": 5431} {"train_loss": -26.978235244750977, "global_step": 450787, "epoch": 5431} {"train_loss": -27.4774169921875, "global_step": 450788, "epoch": 5431} {"train_loss": -27.43512535095215, "global_step": 450789, "epoch": 5431} {"train_loss": -27.06036949157715, "global_step": 450790, "epoch": 5431} {"train_loss": -27.23860740661621, "global_step": 450791, "epoch": 5431} {"train_loss": -27.269123077392578, "global_step": 450792, "epoch": 5431} {"train_loss": -27.281482696533203, "global_step": 450793, "epoch": 5431} {"train_loss": -27.393081665039062, "global_step": 450794, "epoch": 5431} {"train_loss": -27.360349655151367, "global_step": 450795, "epoch": 5431} {"train_loss": -27.386762619018555, "global_step": 450796, "epoch": 5431} {"train_loss": -27.137731552124023, "global_step": 450797, "epoch": 5431} {"train_loss": -26.992944717407227, "global_step": 450798, "epoch": 5431} {"train_loss": -27.294403076171875, "global_step": 450799, "epoch": 5431} {"train_loss": -27.22994041442871, "global_step": 450800, "epoch": 5431} {"train_loss": -27.485504150390625, "global_step": 450801, "epoch": 5431} {"train_loss": -27.359357833862305, "global_step": 450802, "epoch": 5431} {"train_loss": -27.534378051757812, "global_step": 450803, "epoch": 5431} {"train_loss": -27.15620231628418, "global_step": 450804, "epoch": 5431} {"train_loss": -27.31146812438965, "global_step": 450805, "epoch": 5431} {"train_loss": -27.07207679748535, "global_step": 450806, "epoch": 5431} {"train_loss": -27.181262969970703, "global_step": 450807, "epoch": 5431} {"train_loss": -27.158309936523438, "global_step": 450808, "epoch": 5431} {"train_loss": -26.913864135742188, "global_step": 450809, "epoch": 5431} {"train_loss": -27.298480987548828, "global_step": 450810, "epoch": 5431} {"train_loss": -27.057851791381836, "global_step": 450811, "epoch": 5431} {"train_loss": -27.299652099609375, "global_step": 450812, "epoch": 5431} {"train_loss": -27.58904457092285, "global_step": 450813, "epoch": 5431} {"train_loss": -27.44086265563965, "global_step": 450814, "epoch": 5431} {"train_loss": -27.18320083618164, "global_step": 450815, "epoch": 5431} {"train_loss": -26.79790687561035, "global_step": 450816, "epoch": 5431} {"train_loss": -26.86456871032715, "global_step": 450817, "epoch": 5431} {"train_loss": -27.36332130432129, "global_step": 450818, "epoch": 5431} {"train_loss": -27.055932998657227, "global_step": 450819, "epoch": 5431} {"train_loss": -27.20611572265625, "global_step": 450820, "epoch": 5431} {"train_loss": -27.226383209228516, "global_step": 450821, "epoch": 5431} {"train_loss": -27.305572509765625, "global_step": 450822, "epoch": 5431} {"train_loss": -27.062002182006836, "global_step": 450823, "epoch": 5431} {"train_loss": -27.117929458618164, "global_step": 450824, "epoch": 5431} {"train_loss": -27.295989990234375, "global_step": 450825, "epoch": 5431} {"train_loss": -27.693302154541016, "global_step": 450826, "epoch": 5431} {"train_loss": -27.227643966674805, "global_step": 450827, "epoch": 5431} {"train_loss": -27.474332809448242, "global_step": 450828, "epoch": 5431} {"train_loss": -26.9316349029541, "global_step": 450829, "epoch": 5431} {"train_loss": -26.9350643157959, "global_step": 450830, "epoch": 5431} {"train_loss": -26.114099502563477, "global_step": 450831, "epoch": 5431} {"train_loss": -25.61920166015625, "global_step": 450832, "epoch": 5431} {"train_loss": -25.815244674682617, "global_step": 450833, "epoch": 5431} {"train_loss": -26.55816650390625, "global_step": 450834, "epoch": 5431} {"train_loss": -26.577722549438477, "global_step": 450835, "epoch": 5431} {"train_loss": -26.510663986206055, "global_step": 450836, "epoch": 5431} {"train_loss": -26.922473907470703, "global_step": 450837, "epoch": 5431} {"train_loss": -26.683303833007812, "global_step": 450838, "epoch": 5431} {"train_loss": -26.38532066345215, "global_step": 450839, "epoch": 5431} {"train_loss": -26.68596839904785, "global_step": 450840, "epoch": 5431} {"train_loss": -25.96107292175293, "global_step": 450841, "epoch": 5431} {"train_loss": -26.8663387298584, "global_step": 450842, "epoch": 5431} {"train_loss": -26.3217830657959, "global_step": 450843, "epoch": 5431} {"train_loss": -26.649810791015625, "global_step": 450844, "epoch": 5431} {"train_loss": -26.9516544342041, "global_step": 450845, "epoch": 5431} {"train_loss": -26.761926651000977, "global_step": 450846, "epoch": 5431} {"train_loss": -26.744892120361328, "global_step": 450847, "epoch": 5431} {"train_loss": -27.032926559448242, "global_step": 450848, "epoch": 5431} {"train_loss": -26.797964096069336, "global_step": 450849, "epoch": 5431} {"train_loss": -26.67901611328125, "global_step": 450850, "epoch": 5431} {"train_loss": -26.8377742767334, "global_step": 450851, "epoch": 5431} {"train_loss": -26.3131046295166, "global_step": 450852, "epoch": 5431} {"train_loss": -26.97189712524414, "global_step": 450853, "epoch": 5431} {"train_loss": -26.892108917236328, "global_step": 450854, "epoch": 5431} {"train_loss": -26.93805069521249, "global_step": 450855, "epoch": 5431, "val_loss": 6553841.0} {"train_loss": -26.298847198486328, "global_step": 450856, "epoch": 5432} {"train_loss": -26.722192764282227, "global_step": 450857, "epoch": 5432} {"train_loss": -26.53065299987793, "global_step": 450858, "epoch": 5432} {"train_loss": -25.807641983032227, "global_step": 450859, "epoch": 5432} {"train_loss": -26.170642852783203, "global_step": 450860, "epoch": 5432} {"train_loss": -26.242719650268555, "global_step": 450861, "epoch": 5432} {"train_loss": -26.184741973876953, "global_step": 450862, "epoch": 5432} {"train_loss": -26.591445922851562, "global_step": 450863, "epoch": 5432} {"train_loss": -25.36543846130371, "global_step": 450864, "epoch": 5432} {"train_loss": -26.275949478149414, "global_step": 450865, "epoch": 5432} {"train_loss": -26.149005889892578, "global_step": 450866, "epoch": 5432} {"train_loss": -26.28424072265625, "global_step": 450867, "epoch": 5432} {"train_loss": -26.4113712310791, "global_step": 450868, "epoch": 5432} {"train_loss": -26.051990509033203, "global_step": 450869, "epoch": 5432} {"train_loss": -26.304428100585938, "global_step": 450870, "epoch": 5432} {"train_loss": -26.4486083984375, "global_step": 450871, "epoch": 5432} {"train_loss": -26.26801109313965, "global_step": 450872, "epoch": 5432} {"train_loss": -26.446081161499023, "global_step": 450873, "epoch": 5432} {"train_loss": -26.895029067993164, "global_step": 450874, "epoch": 5432} {"train_loss": -26.783233642578125, "global_step": 450875, "epoch": 5432} {"train_loss": -26.871326446533203, "global_step": 450876, "epoch": 5432} {"train_loss": -26.588333129882812, "global_step": 450877, "epoch": 5432} {"train_loss": -26.74200439453125, "global_step": 450878, "epoch": 5432} {"train_loss": -26.666595458984375, "global_step": 450879, "epoch": 5432} {"train_loss": -26.718244552612305, "global_step": 450880, "epoch": 5432} {"train_loss": -26.60638999938965, "global_step": 450881, "epoch": 5432} {"train_loss": -26.95149040222168, "global_step": 450882, "epoch": 5432} {"train_loss": -26.514617919921875, "global_step": 450883, "epoch": 5432} {"train_loss": -26.703510284423828, "global_step": 450884, "epoch": 5432} {"train_loss": -26.984058380126953, "global_step": 450885, "epoch": 5432} {"train_loss": -26.913501739501953, "global_step": 450886, "epoch": 5432} {"train_loss": -26.73749351501465, "global_step": 450887, "epoch": 5432} {"train_loss": -26.596906661987305, "global_step": 450888, "epoch": 5432} {"train_loss": -27.05671501159668, "global_step": 450889, "epoch": 5432} {"train_loss": -26.71290397644043, "global_step": 450890, "epoch": 5432} {"train_loss": -26.821197509765625, "global_step": 450891, "epoch": 5432} {"train_loss": -27.19502067565918, "global_step": 450892, "epoch": 5432} {"train_loss": -27.345178604125977, "global_step": 450893, "epoch": 5432} {"train_loss": -27.410581588745117, "global_step": 450894, "epoch": 5432} {"train_loss": -27.276121139526367, "global_step": 450895, "epoch": 5432} {"train_loss": -27.21295166015625, "global_step": 450896, "epoch": 5432} {"train_loss": -26.824827194213867, "global_step": 450897, "epoch": 5432} {"train_loss": -27.164663314819336, "global_step": 450898, "epoch": 5432} {"train_loss": -27.164636611938477, "global_step": 450899, "epoch": 5432} {"train_loss": -27.146961212158203, "global_step": 450900, "epoch": 5432} {"train_loss": -27.188796997070312, "global_step": 450901, "epoch": 5432} {"train_loss": -27.21148681640625, "global_step": 450902, "epoch": 5432} {"train_loss": -27.103269577026367, "global_step": 450903, "epoch": 5432} {"train_loss": -27.323461532592773, "global_step": 450904, "epoch": 5432} {"train_loss": -27.125015258789062, "global_step": 450905, "epoch": 5432} {"train_loss": -27.207799911499023, "global_step": 450906, "epoch": 5432} {"train_loss": -27.193328857421875, "global_step": 450907, "epoch": 5432} {"train_loss": -27.15943717956543, "global_step": 450908, "epoch": 5432} {"train_loss": -27.231748580932617, "global_step": 450909, "epoch": 5432} {"train_loss": -27.287109375, "global_step": 450910, "epoch": 5432} {"train_loss": -27.03846549987793, "global_step": 450911, "epoch": 5432} {"train_loss": -26.98883056640625, "global_step": 450912, "epoch": 5432} {"train_loss": -27.4150447845459, "global_step": 450913, "epoch": 5432} {"train_loss": -27.0645809173584, "global_step": 450914, "epoch": 5432} {"train_loss": -26.968297958374023, "global_step": 450915, "epoch": 5432} {"train_loss": -26.96369743347168, "global_step": 450916, "epoch": 5432} {"train_loss": -27.376096725463867, "global_step": 450917, "epoch": 5432} {"train_loss": -27.367223739624023, "global_step": 450918, "epoch": 5432} {"train_loss": -27.227514266967773, "global_step": 450919, "epoch": 5432} {"train_loss": -27.1253662109375, "global_step": 450920, "epoch": 5432} {"train_loss": -27.31829833984375, "global_step": 450921, "epoch": 5432} {"train_loss": -27.231094360351562, "global_step": 450922, "epoch": 5432} {"train_loss": -27.18619155883789, "global_step": 450923, "epoch": 5432} {"train_loss": -26.916894912719727, "global_step": 450924, "epoch": 5432} {"train_loss": -26.955801010131836, "global_step": 450925, "epoch": 5432} {"train_loss": -26.787036895751953, "global_step": 450926, "epoch": 5432} {"train_loss": -27.353368759155273, "global_step": 450927, "epoch": 5432} {"train_loss": -26.786483764648438, "global_step": 450928, "epoch": 5432} {"train_loss": -26.83765983581543, "global_step": 450929, "epoch": 5432} {"train_loss": -27.195409774780273, "global_step": 450930, "epoch": 5432} {"train_loss": -27.096277236938477, "global_step": 450931, "epoch": 5432} {"train_loss": -26.83333396911621, "global_step": 450932, "epoch": 5432} {"train_loss": -27.059064865112305, "global_step": 450933, "epoch": 5432} {"train_loss": -27.16457176208496, "global_step": 450934, "epoch": 5432} {"train_loss": -27.07566261291504, "global_step": 450935, "epoch": 5432} {"train_loss": -27.0992374420166, "global_step": 450936, "epoch": 5432} {"train_loss": -27.389440536499023, "global_step": 450937, "epoch": 5432} {"train_loss": -26.874062572617127, "global_step": 450938, "epoch": 5432, "val_loss": 6549338.0} {"train_loss": -25.88411521911621, "global_step": 450939, "epoch": 5433} {"train_loss": -26.618276596069336, "global_step": 450940, "epoch": 5433} {"train_loss": -26.81601905822754, "global_step": 450941, "epoch": 5433} {"train_loss": -26.332813262939453, "global_step": 450942, "epoch": 5433} {"train_loss": -26.727956771850586, "global_step": 450943, "epoch": 5433} {"train_loss": -26.9218807220459, "global_step": 450944, "epoch": 5433} {"train_loss": -26.433746337890625, "global_step": 450945, "epoch": 5433} {"train_loss": -26.844297409057617, "global_step": 450946, "epoch": 5433} {"train_loss": -26.600332260131836, "global_step": 450947, "epoch": 5433} {"train_loss": -26.913862228393555, "global_step": 450948, "epoch": 5433} {"train_loss": -26.85511589050293, "global_step": 450949, "epoch": 5433} {"train_loss": -26.80287742614746, "global_step": 450950, "epoch": 5433} {"train_loss": -27.36408042907715, "global_step": 450951, "epoch": 5433} {"train_loss": -27.028614044189453, "global_step": 450952, "epoch": 5433} {"train_loss": -26.931482315063477, "global_step": 450953, "epoch": 5433} {"train_loss": -26.913068771362305, "global_step": 450954, "epoch": 5433} {"train_loss": -27.15559959411621, "global_step": 450955, "epoch": 5433} {"train_loss": -26.615076065063477, "global_step": 450956, "epoch": 5433} {"train_loss": -26.938379287719727, "global_step": 450957, "epoch": 5433} {"train_loss": -26.89841079711914, "global_step": 450958, "epoch": 5433} {"train_loss": -26.967947006225586, "global_step": 450959, "epoch": 5433} {"train_loss": -27.1843318939209, "global_step": 450960, "epoch": 5433} {"train_loss": -26.87933921813965, "global_step": 450961, "epoch": 5433} {"train_loss": -27.028345108032227, "global_step": 450962, "epoch": 5433} {"train_loss": -26.846576690673828, "global_step": 450963, "epoch": 5433} {"train_loss": -26.876157760620117, "global_step": 450964, "epoch": 5433} {"train_loss": -26.876562118530273, "global_step": 450965, "epoch": 5433} {"train_loss": -26.92026710510254, "global_step": 450966, "epoch": 5433} {"train_loss": -27.37587547302246, "global_step": 450967, "epoch": 5433} {"train_loss": -27.34222412109375, "global_step": 450968, "epoch": 5433} {"train_loss": -26.92512321472168, "global_step": 450969, "epoch": 5433} {"train_loss": -26.788742065429688, "global_step": 450970, "epoch": 5433} {"train_loss": -27.235639572143555, "global_step": 450971, "epoch": 5433} {"train_loss": -27.0108585357666, "global_step": 450972, "epoch": 5433} {"train_loss": -26.631689071655273, "global_step": 450973, "epoch": 5433} {"train_loss": -26.91629981994629, "global_step": 450974, "epoch": 5433} {"train_loss": -27.0939884185791, "global_step": 450975, "epoch": 5433} {"train_loss": -27.421344757080078, "global_step": 450976, "epoch": 5433} {"train_loss": -27.024404525756836, "global_step": 450977, "epoch": 5433} {"train_loss": -27.029220581054688, "global_step": 450978, "epoch": 5433} {"train_loss": -26.8699951171875, "global_step": 450979, "epoch": 5433} {"train_loss": -27.498172760009766, "global_step": 450980, "epoch": 5433} {"train_loss": -27.0258846282959, "global_step": 450981, "epoch": 5433} {"train_loss": -27.042388916015625, "global_step": 450982, "epoch": 5433} {"train_loss": -26.918241500854492, "global_step": 450983, "epoch": 5433} {"train_loss": -27.0708065032959, "global_step": 450984, "epoch": 5433} {"train_loss": -27.2030029296875, "global_step": 450985, "epoch": 5433} {"train_loss": -27.180326461791992, "global_step": 450986, "epoch": 5433} {"train_loss": -27.268762588500977, "global_step": 450987, "epoch": 5433} {"train_loss": -27.26411247253418, "global_step": 450988, "epoch": 5433} {"train_loss": -27.251508712768555, "global_step": 450989, "epoch": 5433} {"train_loss": -27.305561065673828, "global_step": 450990, "epoch": 5433} {"train_loss": -26.918386459350586, "global_step": 450991, "epoch": 5433} {"train_loss": -27.298542022705078, "global_step": 450992, "epoch": 5433} {"train_loss": -27.242191314697266, "global_step": 450993, "epoch": 5433} {"train_loss": -27.108346939086914, "global_step": 450994, "epoch": 5433} {"train_loss": -27.130857467651367, "global_step": 450995, "epoch": 5433} {"train_loss": -27.022357940673828, "global_step": 450996, "epoch": 5433} {"train_loss": -27.157733917236328, "global_step": 450997, "epoch": 5433} {"train_loss": -27.30994987487793, "global_step": 450998, "epoch": 5433} {"train_loss": -26.77689552307129, "global_step": 450999, "epoch": 5433} {"train_loss": -27.235015869140625, "global_step": 451000, "epoch": 5433} {"train_loss": -26.906665802001953, "global_step": 451001, "epoch": 5433} {"train_loss": -26.861051559448242, "global_step": 451002, "epoch": 5433} {"train_loss": -26.924652099609375, "global_step": 451003, "epoch": 5433} {"train_loss": -27.156818389892578, "global_step": 451004, "epoch": 5433} {"train_loss": -27.156620025634766, "global_step": 451005, "epoch": 5433} {"train_loss": -27.24753189086914, "global_step": 451006, "epoch": 5433} {"train_loss": -26.796649932861328, "global_step": 451007, "epoch": 5433} {"train_loss": -26.879287719726562, "global_step": 451008, "epoch": 5433} {"train_loss": -27.288232803344727, "global_step": 451009, "epoch": 5433} {"train_loss": -26.938318252563477, "global_step": 451010, "epoch": 5433} {"train_loss": -26.808307647705078, "global_step": 451011, "epoch": 5433} {"train_loss": -27.132543563842773, "global_step": 451012, "epoch": 5433} {"train_loss": -27.36859703063965, "global_step": 451013, "epoch": 5433} {"train_loss": -27.18287467956543, "global_step": 451014, "epoch": 5433} {"train_loss": -27.183887481689453, "global_step": 451015, "epoch": 5433} {"train_loss": -26.187719345092773, "global_step": 451016, "epoch": 5433} {"train_loss": -26.5125675201416, "global_step": 451017, "epoch": 5433} {"train_loss": -27.107431411743164, "global_step": 451018, "epoch": 5433} {"train_loss": -27.100610733032227, "global_step": 451019, "epoch": 5433} {"train_loss": -26.614892959594727, "global_step": 451020, "epoch": 5433} {"train_loss": -26.99762840730598, "global_step": 451021, "epoch": 5433, "val_loss": 6557251.5} {"train_loss": -24.594987869262695, "global_step": 451022, "epoch": 5434} {"train_loss": -26.44740104675293, "global_step": 451023, "epoch": 5434} {"train_loss": -25.51791763305664, "global_step": 451024, "epoch": 5434} {"train_loss": -26.965646743774414, "global_step": 451025, "epoch": 5434} {"train_loss": -25.7988224029541, "global_step": 451026, "epoch": 5434} {"train_loss": -26.150197982788086, "global_step": 451027, "epoch": 5434} {"train_loss": -26.084625244140625, "global_step": 451028, "epoch": 5434} {"train_loss": -26.264484405517578, "global_step": 451029, "epoch": 5434} {"train_loss": -26.812671661376953, "global_step": 451030, "epoch": 5434} {"train_loss": -26.342443466186523, "global_step": 451031, "epoch": 5434} {"train_loss": -26.242612838745117, "global_step": 451032, "epoch": 5434} {"train_loss": -26.570764541625977, "global_step": 451033, "epoch": 5434} {"train_loss": -26.467132568359375, "global_step": 451034, "epoch": 5434} {"train_loss": -26.778844833374023, "global_step": 451035, "epoch": 5434} {"train_loss": -26.3866024017334, "global_step": 451036, "epoch": 5434} {"train_loss": -26.499616622924805, "global_step": 451037, "epoch": 5434} {"train_loss": -26.4783878326416, "global_step": 451038, "epoch": 5434} {"train_loss": -26.593536376953125, "global_step": 451039, "epoch": 5434} {"train_loss": -26.376794815063477, "global_step": 451040, "epoch": 5434} {"train_loss": -26.63776206970215, "global_step": 451041, "epoch": 5434} {"train_loss": -27.004730224609375, "global_step": 451042, "epoch": 5434} {"train_loss": -26.461868286132812, "global_step": 451043, "epoch": 5434} {"train_loss": -26.376453399658203, "global_step": 451044, "epoch": 5434} {"train_loss": -27.080387115478516, "global_step": 451045, "epoch": 5434} {"train_loss": -26.788236618041992, "global_step": 451046, "epoch": 5434} {"train_loss": -26.520566940307617, "global_step": 451047, "epoch": 5434} {"train_loss": -26.9093017578125, "global_step": 451048, "epoch": 5434} {"train_loss": -26.53460693359375, "global_step": 451049, "epoch": 5434} {"train_loss": -26.955078125, "global_step": 451050, "epoch": 5434} {"train_loss": -26.60390281677246, "global_step": 451051, "epoch": 5434} {"train_loss": -26.96002769470215, "global_step": 451052, "epoch": 5434} {"train_loss": -26.7976131439209, "global_step": 451053, "epoch": 5434} {"train_loss": -26.775867462158203, "global_step": 451054, "epoch": 5434} {"train_loss": -26.65777587890625, "global_step": 451055, "epoch": 5434} {"train_loss": -27.103851318359375, "global_step": 451056, "epoch": 5434} {"train_loss": -26.9471492767334, "global_step": 451057, "epoch": 5434} {"train_loss": -26.963062286376953, "global_step": 451058, "epoch": 5434} {"train_loss": -27.2724666595459, "global_step": 451059, "epoch": 5434} {"train_loss": -27.07220458984375, "global_step": 451060, "epoch": 5434} {"train_loss": -27.244766235351562, "global_step": 451061, "epoch": 5434} {"train_loss": -27.125085830688477, "global_step": 451062, "epoch": 5434} {"train_loss": -26.992767333984375, "global_step": 451063, "epoch": 5434} {"train_loss": -27.03948402404785, "global_step": 451064, "epoch": 5434} {"train_loss": -26.963184356689453, "global_step": 451065, "epoch": 5434} {"train_loss": -27.164255142211914, "global_step": 451066, "epoch": 5434} {"train_loss": -27.046833038330078, "global_step": 451067, "epoch": 5434} {"train_loss": -27.30474281311035, "global_step": 451068, "epoch": 5434} {"train_loss": -27.050748825073242, "global_step": 451069, "epoch": 5434} {"train_loss": -27.156757354736328, "global_step": 451070, "epoch": 5434} {"train_loss": -26.87822914123535, "global_step": 451071, "epoch": 5434} {"train_loss": -27.487720489501953, "global_step": 451072, "epoch": 5434} {"train_loss": -27.76658058166504, "global_step": 451073, "epoch": 5434} {"train_loss": -26.287582397460938, "global_step": 451074, "epoch": 5434} {"train_loss": -26.2401123046875, "global_step": 451075, "epoch": 5434} {"train_loss": -25.91298484802246, "global_step": 451076, "epoch": 5434} {"train_loss": -26.72840690612793, "global_step": 451077, "epoch": 5434} {"train_loss": -26.934385299682617, "global_step": 451078, "epoch": 5434} {"train_loss": -26.91135597229004, "global_step": 451079, "epoch": 5434} {"train_loss": -27.201719284057617, "global_step": 451080, "epoch": 5434} {"train_loss": -26.66643714904785, "global_step": 451081, "epoch": 5434} {"train_loss": -27.072519302368164, "global_step": 451082, "epoch": 5434} {"train_loss": -26.953174591064453, "global_step": 451083, "epoch": 5434} {"train_loss": -27.180072784423828, "global_step": 451084, "epoch": 5434} {"train_loss": -27.11146354675293, "global_step": 451085, "epoch": 5434} {"train_loss": -26.78399085998535, "global_step": 451086, "epoch": 5434} {"train_loss": -26.852624893188477, "global_step": 451087, "epoch": 5434} {"train_loss": -26.821866989135742, "global_step": 451088, "epoch": 5434} {"train_loss": -26.85955810546875, "global_step": 451089, "epoch": 5434} {"train_loss": -27.23858070373535, "global_step": 451090, "epoch": 5434} {"train_loss": -27.046411514282227, "global_step": 451091, "epoch": 5434} {"train_loss": -27.0367488861084, "global_step": 451092, "epoch": 5434} {"train_loss": -27.1221866607666, "global_step": 451093, "epoch": 5434} {"train_loss": -27.001203536987305, "global_step": 451094, "epoch": 5434} {"train_loss": -26.864093780517578, "global_step": 451095, "epoch": 5434} {"train_loss": -26.842376708984375, "global_step": 451096, "epoch": 5434} {"train_loss": -26.869064331054688, "global_step": 451097, "epoch": 5434} {"train_loss": -26.760034561157227, "global_step": 451098, "epoch": 5434} {"train_loss": -27.295698165893555, "global_step": 451099, "epoch": 5434} {"train_loss": -26.921009063720703, "global_step": 451100, "epoch": 5434} {"train_loss": -26.807287216186523, "global_step": 451101, "epoch": 5434} {"train_loss": -27.049604415893555, "global_step": 451102, "epoch": 5434} {"train_loss": -27.55283546447754, "global_step": 451103, "epoch": 5434} {"train_loss": -26.79669623777091, "global_step": 451104, "epoch": 5434, "val_loss": 6435351.0} {"train_loss": -26.623727798461914, "global_step": 451105, "epoch": 5435} {"train_loss": -26.40708351135254, "global_step": 451106, "epoch": 5435} {"train_loss": -26.608753204345703, "global_step": 451107, "epoch": 5435} {"train_loss": -26.429990768432617, "global_step": 451108, "epoch": 5435} {"train_loss": -27.079580307006836, "global_step": 451109, "epoch": 5435} {"train_loss": -26.117706298828125, "global_step": 451110, "epoch": 5435} {"train_loss": -26.426660537719727, "global_step": 451111, "epoch": 5435} {"train_loss": -26.61736488342285, "global_step": 451112, "epoch": 5435} {"train_loss": -26.496423721313477, "global_step": 451113, "epoch": 5435} {"train_loss": -26.546354293823242, "global_step": 451114, "epoch": 5435} {"train_loss": -26.5142822265625, "global_step": 451115, "epoch": 5435} {"train_loss": -27.10013771057129, "global_step": 451116, "epoch": 5435} {"train_loss": -26.94171142578125, "global_step": 451117, "epoch": 5435} {"train_loss": -26.97544288635254, "global_step": 451118, "epoch": 5435} {"train_loss": -26.67132568359375, "global_step": 451119, "epoch": 5435} {"train_loss": -26.531269073486328, "global_step": 451120, "epoch": 5435} {"train_loss": -26.537927627563477, "global_step": 451121, "epoch": 5435} {"train_loss": -27.149887084960938, "global_step": 451122, "epoch": 5435} {"train_loss": -26.88506507873535, "global_step": 451123, "epoch": 5435} {"train_loss": -26.948511123657227, "global_step": 451124, "epoch": 5435} {"train_loss": -26.794666290283203, "global_step": 451125, "epoch": 5435} {"train_loss": -26.719146728515625, "global_step": 451126, "epoch": 5435} {"train_loss": -26.9625244140625, "global_step": 451127, "epoch": 5435} {"train_loss": -26.893939971923828, "global_step": 451128, "epoch": 5435} {"train_loss": -26.698551177978516, "global_step": 451129, "epoch": 5435} {"train_loss": -26.672758102416992, "global_step": 451130, "epoch": 5435} {"train_loss": -26.842315673828125, "global_step": 451131, "epoch": 5435} {"train_loss": -26.928735733032227, "global_step": 451132, "epoch": 5435} {"train_loss": -27.134321212768555, "global_step": 451133, "epoch": 5435} {"train_loss": -27.457258224487305, "global_step": 451134, "epoch": 5435} {"train_loss": -27.041181564331055, "global_step": 451135, "epoch": 5435} {"train_loss": -26.83431053161621, "global_step": 451136, "epoch": 5435} {"train_loss": -27.223052978515625, "global_step": 451137, "epoch": 5435} {"train_loss": -26.92486572265625, "global_step": 451138, "epoch": 5435} {"train_loss": -27.297229766845703, "global_step": 451139, "epoch": 5435} {"train_loss": -27.16303825378418, "global_step": 451140, "epoch": 5435} {"train_loss": -27.122161865234375, "global_step": 451141, "epoch": 5435} {"train_loss": -26.954639434814453, "global_step": 451142, "epoch": 5435} {"train_loss": -27.170246124267578, "global_step": 451143, "epoch": 5435} {"train_loss": -27.001020431518555, "global_step": 451144, "epoch": 5435} {"train_loss": -27.3989315032959, "global_step": 451145, "epoch": 5435} {"train_loss": -27.225168228149414, "global_step": 451146, "epoch": 5435} {"train_loss": -27.10194969177246, "global_step": 451147, "epoch": 5435} {"train_loss": -26.969955444335938, "global_step": 451148, "epoch": 5435} {"train_loss": -27.006366729736328, "global_step": 451149, "epoch": 5435} {"train_loss": -27.078643798828125, "global_step": 451150, "epoch": 5435} {"train_loss": -27.02242088317871, "global_step": 451151, "epoch": 5435} {"train_loss": -26.933862686157227, "global_step": 451152, "epoch": 5435} {"train_loss": -26.687885284423828, "global_step": 451153, "epoch": 5435} {"train_loss": -26.129596710205078, "global_step": 451154, "epoch": 5435} {"train_loss": -26.461349487304688, "global_step": 451155, "epoch": 5435} {"train_loss": -26.66814613342285, "global_step": 451156, "epoch": 5435} {"train_loss": -26.605276107788086, "global_step": 451157, "epoch": 5435} {"train_loss": -26.9858455657959, "global_step": 451158, "epoch": 5435} {"train_loss": -26.76102638244629, "global_step": 451159, "epoch": 5435} {"train_loss": -26.592390060424805, "global_step": 451160, "epoch": 5435} {"train_loss": -27.146167755126953, "global_step": 451161, "epoch": 5435} {"train_loss": -26.911712646484375, "global_step": 451162, "epoch": 5435} {"train_loss": -26.904926300048828, "global_step": 451163, "epoch": 5435} {"train_loss": -26.911462783813477, "global_step": 451164, "epoch": 5435} {"train_loss": -26.751867294311523, "global_step": 451165, "epoch": 5435} {"train_loss": -26.879425048828125, "global_step": 451166, "epoch": 5435} {"train_loss": -27.02589225769043, "global_step": 451167, "epoch": 5435} {"train_loss": -27.133075714111328, "global_step": 451168, "epoch": 5435} {"train_loss": -26.890121459960938, "global_step": 451169, "epoch": 5435} {"train_loss": -26.569171905517578, "global_step": 451170, "epoch": 5435} {"train_loss": -26.978473663330078, "global_step": 451171, "epoch": 5435} {"train_loss": -26.772418975830078, "global_step": 451172, "epoch": 5435} {"train_loss": -26.704309463500977, "global_step": 451173, "epoch": 5435} {"train_loss": -27.070556640625, "global_step": 451174, "epoch": 5435} {"train_loss": -26.80067253112793, "global_step": 451175, "epoch": 5435} {"train_loss": -26.79298210144043, "global_step": 451176, "epoch": 5435} {"train_loss": -26.947280883789062, "global_step": 451177, "epoch": 5435} {"train_loss": -26.909381866455078, "global_step": 451178, "epoch": 5435} {"train_loss": -26.746503829956055, "global_step": 451179, "epoch": 5435} {"train_loss": -26.86819839477539, "global_step": 451180, "epoch": 5435} {"train_loss": -27.34629249572754, "global_step": 451181, "epoch": 5435} {"train_loss": -26.831674575805664, "global_step": 451182, "epoch": 5435} {"train_loss": -27.235563278198242, "global_step": 451183, "epoch": 5435} {"train_loss": -26.704160690307617, "global_step": 451184, "epoch": 5435} {"train_loss": -26.923139572143555, "global_step": 451185, "epoch": 5435} {"train_loss": -26.99526023864746, "global_step": 451186, "epoch": 5435} {"train_loss": -26.85792309404856, "global_step": 451187, "epoch": 5435, "val_loss": 6459690.0} {"train_loss": -26.776700973510742, "global_step": 451188, "epoch": 5436} {"train_loss": -26.849477767944336, "global_step": 451189, "epoch": 5436} {"train_loss": -26.662397384643555, "global_step": 451190, "epoch": 5436} {"train_loss": -27.20216178894043, "global_step": 451191, "epoch": 5436} {"train_loss": -26.596832275390625, "global_step": 451192, "epoch": 5436} {"train_loss": -26.49689292907715, "global_step": 451193, "epoch": 5436} {"train_loss": -26.70863151550293, "global_step": 451194, "epoch": 5436} {"train_loss": -27.03669548034668, "global_step": 451195, "epoch": 5436} {"train_loss": -26.837005615234375, "global_step": 451196, "epoch": 5436} {"train_loss": -26.56918716430664, "global_step": 451197, "epoch": 5436} {"train_loss": -26.78321647644043, "global_step": 451198, "epoch": 5436} {"train_loss": -26.58733558654785, "global_step": 451199, "epoch": 5436} {"train_loss": -26.86349868774414, "global_step": 451200, "epoch": 5436} {"train_loss": -27.025312423706055, "global_step": 451201, "epoch": 5436} {"train_loss": -26.383569717407227, "global_step": 451202, "epoch": 5436} {"train_loss": -27.139373779296875, "global_step": 451203, "epoch": 5436} {"train_loss": -27.004602432250977, "global_step": 451204, "epoch": 5436} {"train_loss": -27.105030059814453, "global_step": 451205, "epoch": 5436} {"train_loss": -26.95221519470215, "global_step": 451206, "epoch": 5436} {"train_loss": -27.263517379760742, "global_step": 451207, "epoch": 5436} {"train_loss": -27.416364669799805, "global_step": 451208, "epoch": 5436} {"train_loss": -26.887731552124023, "global_step": 451209, "epoch": 5436} {"train_loss": -27.055530548095703, "global_step": 451210, "epoch": 5436} {"train_loss": -26.920148849487305, "global_step": 451211, "epoch": 5436} {"train_loss": -27.295608520507812, "global_step": 451212, "epoch": 5436} {"train_loss": -27.243200302124023, "global_step": 451213, "epoch": 5436} {"train_loss": -27.04010581970215, "global_step": 451214, "epoch": 5436} {"train_loss": -27.386199951171875, "global_step": 451215, "epoch": 5436} {"train_loss": -27.287677764892578, "global_step": 451216, "epoch": 5436} {"train_loss": -27.204328536987305, "global_step": 451217, "epoch": 5436} {"train_loss": -27.105712890625, "global_step": 451218, "epoch": 5436} {"train_loss": -27.282855987548828, "global_step": 451219, "epoch": 5436} {"train_loss": -27.254491806030273, "global_step": 451220, "epoch": 5436} {"train_loss": -27.319263458251953, "global_step": 451221, "epoch": 5436} {"train_loss": -26.7694034576416, "global_step": 451222, "epoch": 5436} {"train_loss": -26.929513931274414, "global_step": 451223, "epoch": 5436} {"train_loss": -26.906904220581055, "global_step": 451224, "epoch": 5436} {"train_loss": -27.095783233642578, "global_step": 451225, "epoch": 5436} {"train_loss": -26.931659698486328, "global_step": 451226, "epoch": 5436} {"train_loss": -27.2363224029541, "global_step": 451227, "epoch": 5436} {"train_loss": -27.137174606323242, "global_step": 451228, "epoch": 5436} {"train_loss": -26.891864776611328, "global_step": 451229, "epoch": 5436} {"train_loss": -27.07969093322754, "global_step": 451230, "epoch": 5436} {"train_loss": -27.391042709350586, "global_step": 451231, "epoch": 5436} {"train_loss": -27.2327823638916, "global_step": 451232, "epoch": 5436} {"train_loss": -27.138391494750977, "global_step": 451233, "epoch": 5436} {"train_loss": -27.3642578125, "global_step": 451234, "epoch": 5436} {"train_loss": -27.232803344726562, "global_step": 451235, "epoch": 5436} {"train_loss": -26.95173454284668, "global_step": 451236, "epoch": 5436} {"train_loss": -27.19358253479004, "global_step": 451237, "epoch": 5436} {"train_loss": -27.27106285095215, "global_step": 451238, "epoch": 5436} {"train_loss": -27.048505783081055, "global_step": 451239, "epoch": 5436} {"train_loss": -27.20772361755371, "global_step": 451240, "epoch": 5436} {"train_loss": -27.257434844970703, "global_step": 451241, "epoch": 5436} {"train_loss": -27.051977157592773, "global_step": 451242, "epoch": 5436} {"train_loss": -27.031579971313477, "global_step": 451243, "epoch": 5436} {"train_loss": -26.876972198486328, "global_step": 451244, "epoch": 5436} {"train_loss": -27.161178588867188, "global_step": 451245, "epoch": 5436} {"train_loss": -26.87890625, "global_step": 451246, "epoch": 5436} {"train_loss": -27.08526611328125, "global_step": 451247, "epoch": 5436} {"train_loss": -27.16153907775879, "global_step": 451248, "epoch": 5436} {"train_loss": -27.229711532592773, "global_step": 451249, "epoch": 5436} {"train_loss": -26.8530330657959, "global_step": 451250, "epoch": 5436} {"train_loss": -27.212890625, "global_step": 451251, "epoch": 5436} {"train_loss": -26.839969635009766, "global_step": 451252, "epoch": 5436} {"train_loss": -27.062543869018555, "global_step": 451253, "epoch": 5436} {"train_loss": -27.380569458007812, "global_step": 451254, "epoch": 5436} {"train_loss": -27.062698364257812, "global_step": 451255, "epoch": 5436} {"train_loss": -26.797903060913086, "global_step": 451256, "epoch": 5436} {"train_loss": -27.014678955078125, "global_step": 451257, "epoch": 5436} {"train_loss": -26.874908447265625, "global_step": 451258, "epoch": 5436} {"train_loss": -26.844701766967773, "global_step": 451259, "epoch": 5436} {"train_loss": -26.911773681640625, "global_step": 451260, "epoch": 5436} {"train_loss": -26.784564971923828, "global_step": 451261, "epoch": 5436} {"train_loss": -27.135156631469727, "global_step": 451262, "epoch": 5436} {"train_loss": -26.937788009643555, "global_step": 451263, "epoch": 5436} {"train_loss": -26.95635986328125, "global_step": 451264, "epoch": 5436} {"train_loss": -26.85870361328125, "global_step": 451265, "epoch": 5436} {"train_loss": -27.518041610717773, "global_step": 451266, "epoch": 5436} {"train_loss": -27.665929794311523, "global_step": 451267, "epoch": 5436} {"train_loss": -27.04172134399414, "global_step": 451268, "epoch": 5436} {"train_loss": -27.10316276550293, "global_step": 451269, "epoch": 5436} {"train_loss": -27.02902414712561, "global_step": 451270, "epoch": 5436, "val_loss": 6423047.0} {"train_loss": -25.54157066345215, "global_step": 451271, "epoch": 5437} {"train_loss": -25.455490112304688, "global_step": 451272, "epoch": 5437} {"train_loss": -24.91365623474121, "global_step": 451273, "epoch": 5437} {"train_loss": -25.43001365661621, "global_step": 451274, "epoch": 5437} {"train_loss": -25.177663803100586, "global_step": 451275, "epoch": 5437} {"train_loss": -25.529630661010742, "global_step": 451276, "epoch": 5437} {"train_loss": -24.629657745361328, "global_step": 451277, "epoch": 5437} {"train_loss": -26.279935836791992, "global_step": 451278, "epoch": 5437} {"train_loss": -25.04131507873535, "global_step": 451279, "epoch": 5437} {"train_loss": -26.053028106689453, "global_step": 451280, "epoch": 5437} {"train_loss": -26.285877227783203, "global_step": 451281, "epoch": 5437} {"train_loss": -26.48151969909668, "global_step": 451282, "epoch": 5437} {"train_loss": -26.29627799987793, "global_step": 451283, "epoch": 5437} {"train_loss": -25.806934356689453, "global_step": 451284, "epoch": 5437} {"train_loss": -25.906635284423828, "global_step": 451285, "epoch": 5437} {"train_loss": -26.321619033813477, "global_step": 451286, "epoch": 5437} {"train_loss": -26.190954208374023, "global_step": 451287, "epoch": 5437} {"train_loss": -26.441925048828125, "global_step": 451288, "epoch": 5437} {"train_loss": -26.201154708862305, "global_step": 451289, "epoch": 5437} {"train_loss": -26.133075714111328, "global_step": 451290, "epoch": 5437} {"train_loss": -26.370588302612305, "global_step": 451291, "epoch": 5437} {"train_loss": -26.772409439086914, "global_step": 451292, "epoch": 5437} {"train_loss": -26.45163917541504, "global_step": 451293, "epoch": 5437} {"train_loss": -26.5017032623291, "global_step": 451294, "epoch": 5437} {"train_loss": -26.673315048217773, "global_step": 451295, "epoch": 5437} {"train_loss": -26.83154296875, "global_step": 451296, "epoch": 5437} {"train_loss": -26.755895614624023, "global_step": 451297, "epoch": 5437} {"train_loss": -26.87515640258789, "global_step": 451298, "epoch": 5437} {"train_loss": -26.81561279296875, "global_step": 451299, "epoch": 5437} {"train_loss": -26.94514274597168, "global_step": 451300, "epoch": 5437} {"train_loss": -26.658939361572266, "global_step": 451301, "epoch": 5437} {"train_loss": -26.800207138061523, "global_step": 451302, "epoch": 5437} {"train_loss": -26.540058135986328, "global_step": 451303, "epoch": 5437} {"train_loss": -27.136795043945312, "global_step": 451304, "epoch": 5437} {"train_loss": -26.675827026367188, "global_step": 451305, "epoch": 5437} {"train_loss": -27.197858810424805, "global_step": 451306, "epoch": 5437} {"train_loss": -27.102264404296875, "global_step": 451307, "epoch": 5437} {"train_loss": -26.557764053344727, "global_step": 451308, "epoch": 5437} {"train_loss": -26.759342193603516, "global_step": 451309, "epoch": 5437} {"train_loss": -27.165075302124023, "global_step": 451310, "epoch": 5437} {"train_loss": -26.927114486694336, "global_step": 451311, "epoch": 5437} {"train_loss": -27.09412956237793, "global_step": 451312, "epoch": 5437} {"train_loss": -27.1550350189209, "global_step": 451313, "epoch": 5437} {"train_loss": -27.490585327148438, "global_step": 451314, "epoch": 5437} {"train_loss": -27.08289909362793, "global_step": 451315, "epoch": 5437} {"train_loss": -27.070499420166016, "global_step": 451316, "epoch": 5437} {"train_loss": -27.18951988220215, "global_step": 451317, "epoch": 5437} {"train_loss": -26.92013931274414, "global_step": 451318, "epoch": 5437} {"train_loss": -27.184370040893555, "global_step": 451319, "epoch": 5437} {"train_loss": -26.922992706298828, "global_step": 451320, "epoch": 5437} {"train_loss": -27.099689483642578, "global_step": 451321, "epoch": 5437} {"train_loss": -27.1523494720459, "global_step": 451322, "epoch": 5437} {"train_loss": -27.1684627532959, "global_step": 451323, "epoch": 5437} {"train_loss": -27.155792236328125, "global_step": 451324, "epoch": 5437} {"train_loss": -27.102636337280273, "global_step": 451325, "epoch": 5437} {"train_loss": -27.083282470703125, "global_step": 451326, "epoch": 5437} {"train_loss": -27.050384521484375, "global_step": 451327, "epoch": 5437} {"train_loss": -27.57669448852539, "global_step": 451328, "epoch": 5437} {"train_loss": -27.409372329711914, "global_step": 451329, "epoch": 5437} {"train_loss": -27.4141788482666, "global_step": 451330, "epoch": 5437} {"train_loss": -27.28333854675293, "global_step": 451331, "epoch": 5437} {"train_loss": -27.2858829498291, "global_step": 451332, "epoch": 5437} {"train_loss": -27.296920776367188, "global_step": 451333, "epoch": 5437} {"train_loss": -27.26788330078125, "global_step": 451334, "epoch": 5437} {"train_loss": -26.998945236206055, "global_step": 451335, "epoch": 5437} {"train_loss": -26.584564208984375, "global_step": 451336, "epoch": 5437} {"train_loss": -26.318029403686523, "global_step": 451337, "epoch": 5437} {"train_loss": -26.39019203186035, "global_step": 451338, "epoch": 5437} {"train_loss": -26.63307762145996, "global_step": 451339, "epoch": 5437} {"train_loss": -26.565793991088867, "global_step": 451340, "epoch": 5437} {"train_loss": -25.852588653564453, "global_step": 451341, "epoch": 5437} {"train_loss": -25.88697624206543, "global_step": 451342, "epoch": 5437} {"train_loss": -26.682947158813477, "global_step": 451343, "epoch": 5437} {"train_loss": -26.603500366210938, "global_step": 451344, "epoch": 5437} {"train_loss": -26.643171310424805, "global_step": 451345, "epoch": 5437} {"train_loss": -26.897872924804688, "global_step": 451346, "epoch": 5437} {"train_loss": -26.6173152923584, "global_step": 451347, "epoch": 5437} {"train_loss": -26.587158203125, "global_step": 451348, "epoch": 5437} {"train_loss": -27.302627563476562, "global_step": 451349, "epoch": 5437} {"train_loss": -26.74971580505371, "global_step": 451350, "epoch": 5437} {"train_loss": -26.96412467956543, "global_step": 451351, "epoch": 5437} {"train_loss": -26.796768188476562, "global_step": 451352, "epoch": 5437} {"train_loss": -26.621622683053992, "global_step": 451353, "epoch": 5437, "val_loss": 6564945.5} {"train_loss": -26.42388916015625, "global_step": 451354, "epoch": 5438} {"train_loss": -25.366270065307617, "global_step": 451355, "epoch": 5438} {"train_loss": -25.828760147094727, "global_step": 451356, "epoch": 5438} {"train_loss": -25.275684356689453, "global_step": 451357, "epoch": 5438} {"train_loss": -26.259082794189453, "global_step": 451358, "epoch": 5438} {"train_loss": -26.28531265258789, "global_step": 451359, "epoch": 5438} {"train_loss": -26.257476806640625, "global_step": 451360, "epoch": 5438} {"train_loss": -26.537311553955078, "global_step": 451361, "epoch": 5438} {"train_loss": -26.647418975830078, "global_step": 451362, "epoch": 5438} {"train_loss": -26.365615844726562, "global_step": 451363, "epoch": 5438} {"train_loss": -26.5567626953125, "global_step": 451364, "epoch": 5438} {"train_loss": -26.788305282592773, "global_step": 451365, "epoch": 5438} {"train_loss": -26.270490646362305, "global_step": 451366, "epoch": 5438} {"train_loss": -26.32451820373535, "global_step": 451367, "epoch": 5438} {"train_loss": -26.978010177612305, "global_step": 451368, "epoch": 5438} {"train_loss": -26.65167808532715, "global_step": 451369, "epoch": 5438} {"train_loss": -26.456069946289062, "global_step": 451370, "epoch": 5438} {"train_loss": -26.6021671295166, "global_step": 451371, "epoch": 5438} {"train_loss": -26.4492130279541, "global_step": 451372, "epoch": 5438} {"train_loss": -26.853759765625, "global_step": 451373, "epoch": 5438} {"train_loss": -26.652551651000977, "global_step": 451374, "epoch": 5438} {"train_loss": -26.85215187072754, "global_step": 451375, "epoch": 5438} {"train_loss": -26.845840454101562, "global_step": 451376, "epoch": 5438} {"train_loss": -26.69573974609375, "global_step": 451377, "epoch": 5438} {"train_loss": -27.11097526550293, "global_step": 451378, "epoch": 5438} {"train_loss": -26.82073974609375, "global_step": 451379, "epoch": 5438} {"train_loss": -27.14008903503418, "global_step": 451380, "epoch": 5438} {"train_loss": -26.683008193969727, "global_step": 451381, "epoch": 5438} {"train_loss": -27.15362548828125, "global_step": 451382, "epoch": 5438} {"train_loss": -26.896045684814453, "global_step": 451383, "epoch": 5438} {"train_loss": -27.105594635009766, "global_step": 451384, "epoch": 5438} {"train_loss": -27.2094669342041, "global_step": 451385, "epoch": 5438} {"train_loss": -27.24163246154785, "global_step": 451386, "epoch": 5438} {"train_loss": -26.912221908569336, "global_step": 451387, "epoch": 5438} {"train_loss": -27.086719512939453, "global_step": 451388, "epoch": 5438} {"train_loss": -26.88221549987793, "global_step": 451389, "epoch": 5438} {"train_loss": -27.307220458984375, "global_step": 451390, "epoch": 5438} {"train_loss": -27.16497230529785, "global_step": 451391, "epoch": 5438} {"train_loss": -27.047271728515625, "global_step": 451392, "epoch": 5438} {"train_loss": -27.360944747924805, "global_step": 451393, "epoch": 5438} {"train_loss": -27.05295753479004, "global_step": 451394, "epoch": 5438} {"train_loss": -26.69239616394043, "global_step": 451395, "epoch": 5438} {"train_loss": -26.651123046875, "global_step": 451396, "epoch": 5438} {"train_loss": -27.075109481811523, "global_step": 451397, "epoch": 5438} {"train_loss": -27.112680435180664, "global_step": 451398, "epoch": 5438} {"train_loss": -27.2203369140625, "global_step": 451399, "epoch": 5438} {"train_loss": -27.41385269165039, "global_step": 451400, "epoch": 5438} {"train_loss": -27.0277042388916, "global_step": 451401, "epoch": 5438} {"train_loss": -26.711523056030273, "global_step": 451402, "epoch": 5438} {"train_loss": -27.225143432617188, "global_step": 451403, "epoch": 5438} {"train_loss": -26.6832275390625, "global_step": 451404, "epoch": 5438} {"train_loss": -26.55585289001465, "global_step": 451405, "epoch": 5438} {"train_loss": -26.773035049438477, "global_step": 451406, "epoch": 5438} {"train_loss": -26.690759658813477, "global_step": 451407, "epoch": 5438} {"train_loss": -26.638147354125977, "global_step": 451408, "epoch": 5438} {"train_loss": -27.15097427368164, "global_step": 451409, "epoch": 5438} {"train_loss": -27.07405662536621, "global_step": 451410, "epoch": 5438} {"train_loss": -27.277801513671875, "global_step": 451411, "epoch": 5438} {"train_loss": -26.91352653503418, "global_step": 451412, "epoch": 5438} {"train_loss": -26.944019317626953, "global_step": 451413, "epoch": 5438} {"train_loss": -27.060321807861328, "global_step": 451414, "epoch": 5438} {"train_loss": -27.042692184448242, "global_step": 451415, "epoch": 5438} {"train_loss": -26.933683395385742, "global_step": 451416, "epoch": 5438} {"train_loss": -27.224218368530273, "global_step": 451417, "epoch": 5438} {"train_loss": -27.090503692626953, "global_step": 451418, "epoch": 5438} {"train_loss": -26.8610782623291, "global_step": 451419, "epoch": 5438} {"train_loss": -26.772567749023438, "global_step": 451420, "epoch": 5438} {"train_loss": -27.1456298828125, "global_step": 451421, "epoch": 5438} {"train_loss": -26.719619750976562, "global_step": 451422, "epoch": 5438} {"train_loss": -27.135089874267578, "global_step": 451423, "epoch": 5438} {"train_loss": -27.225980758666992, "global_step": 451424, "epoch": 5438} {"train_loss": -27.094030380249023, "global_step": 451425, "epoch": 5438} {"train_loss": -27.086139678955078, "global_step": 451426, "epoch": 5438} {"train_loss": -27.290708541870117, "global_step": 451427, "epoch": 5438} {"train_loss": -27.093671798706055, "global_step": 451428, "epoch": 5438} {"train_loss": -27.22283363342285, "global_step": 451429, "epoch": 5438} {"train_loss": -27.3831729888916, "global_step": 451430, "epoch": 5438} {"train_loss": -26.781299591064453, "global_step": 451431, "epoch": 5438} {"train_loss": -27.029621124267578, "global_step": 451432, "epoch": 5438} {"train_loss": -27.411924362182617, "global_step": 451433, "epoch": 5438} {"train_loss": -26.921045303344727, "global_step": 451434, "epoch": 5438} {"train_loss": -26.889911651611328, "global_step": 451435, "epoch": 5438} {"train_loss": -26.860352159982703, "global_step": 451436, "epoch": 5438, "val_loss": 6495986.5} {"train_loss": -26.321094512939453, "global_step": 451437, "epoch": 5439} {"train_loss": -26.594013214111328, "global_step": 451438, "epoch": 5439} {"train_loss": -26.507577896118164, "global_step": 451439, "epoch": 5439} {"train_loss": -26.819982528686523, "global_step": 451440, "epoch": 5439} {"train_loss": -26.59726333618164, "global_step": 451441, "epoch": 5439} {"train_loss": -26.058765411376953, "global_step": 451442, "epoch": 5439} {"train_loss": -26.235687255859375, "global_step": 451443, "epoch": 5439} {"train_loss": -26.527570724487305, "global_step": 451444, "epoch": 5439} {"train_loss": -26.75172233581543, "global_step": 451445, "epoch": 5439} {"train_loss": -26.400684356689453, "global_step": 451446, "epoch": 5439} {"train_loss": -27.096704483032227, "global_step": 451447, "epoch": 5439} {"train_loss": -27.0284366607666, "global_step": 451448, "epoch": 5439} {"train_loss": -26.858108520507812, "global_step": 451449, "epoch": 5439} {"train_loss": -27.173110961914062, "global_step": 451450, "epoch": 5439} {"train_loss": -26.911664962768555, "global_step": 451451, "epoch": 5439} {"train_loss": -26.854333877563477, "global_step": 451452, "epoch": 5439} {"train_loss": -26.64984703063965, "global_step": 451453, "epoch": 5439} {"train_loss": -26.7618350982666, "global_step": 451454, "epoch": 5439} {"train_loss": -26.618091583251953, "global_step": 451455, "epoch": 5439} {"train_loss": -26.578338623046875, "global_step": 451456, "epoch": 5439} {"train_loss": -27.077880859375, "global_step": 451457, "epoch": 5439} {"train_loss": -26.79816246032715, "global_step": 451458, "epoch": 5439} {"train_loss": -26.941898345947266, "global_step": 451459, "epoch": 5439} {"train_loss": -26.892148971557617, "global_step": 451460, "epoch": 5439} {"train_loss": -26.959379196166992, "global_step": 451461, "epoch": 5439} {"train_loss": -26.602375030517578, "global_step": 451462, "epoch": 5439} {"train_loss": -27.006067276000977, "global_step": 451463, "epoch": 5439} {"train_loss": -27.183279037475586, "global_step": 451464, "epoch": 5439} {"train_loss": -26.81241226196289, "global_step": 451465, "epoch": 5439} {"train_loss": -27.05708885192871, "global_step": 451466, "epoch": 5439} {"train_loss": -26.593780517578125, "global_step": 451467, "epoch": 5439} {"train_loss": -26.96942138671875, "global_step": 451468, "epoch": 5439} {"train_loss": -27.427270889282227, "global_step": 451469, "epoch": 5439} {"train_loss": -26.940439224243164, "global_step": 451470, "epoch": 5439} {"train_loss": -27.312223434448242, "global_step": 451471, "epoch": 5439} {"train_loss": -27.106861114501953, "global_step": 451472, "epoch": 5439} {"train_loss": -26.768579483032227, "global_step": 451473, "epoch": 5439} {"train_loss": -27.018102645874023, "global_step": 451474, "epoch": 5439} {"train_loss": -27.043649673461914, "global_step": 451475, "epoch": 5439} {"train_loss": -27.334442138671875, "global_step": 451476, "epoch": 5439} {"train_loss": -26.98794937133789, "global_step": 451477, "epoch": 5439} {"train_loss": -27.239105224609375, "global_step": 451478, "epoch": 5439} {"train_loss": -26.986541748046875, "global_step": 451479, "epoch": 5439} {"train_loss": -27.014820098876953, "global_step": 451480, "epoch": 5439} {"train_loss": -26.976551055908203, "global_step": 451481, "epoch": 5439} {"train_loss": -27.329090118408203, "global_step": 451482, "epoch": 5439} {"train_loss": -27.311328887939453, "global_step": 451483, "epoch": 5439} {"train_loss": -26.97931480407715, "global_step": 451484, "epoch": 5439} {"train_loss": -27.195907592773438, "global_step": 451485, "epoch": 5439} {"train_loss": -27.188840866088867, "global_step": 451486, "epoch": 5439} {"train_loss": -26.985137939453125, "global_step": 451487, "epoch": 5439} {"train_loss": -27.219812393188477, "global_step": 451488, "epoch": 5439} {"train_loss": -27.212692260742188, "global_step": 451489, "epoch": 5439} {"train_loss": -26.815143585205078, "global_step": 451490, "epoch": 5439} {"train_loss": -27.2099609375, "global_step": 451491, "epoch": 5439} {"train_loss": -26.833826065063477, "global_step": 451492, "epoch": 5439} {"train_loss": -27.378149032592773, "global_step": 451493, "epoch": 5439} {"train_loss": -27.207569122314453, "global_step": 451494, "epoch": 5439} {"train_loss": -27.395660400390625, "global_step": 451495, "epoch": 5439} {"train_loss": -27.241662979125977, "global_step": 451496, "epoch": 5439} {"train_loss": -27.140527725219727, "global_step": 451497, "epoch": 5439} {"train_loss": -26.8136043548584, "global_step": 451498, "epoch": 5439} {"train_loss": -26.610015869140625, "global_step": 451499, "epoch": 5439} {"train_loss": -26.691253662109375, "global_step": 451500, "epoch": 5439} {"train_loss": -26.99479103088379, "global_step": 451501, "epoch": 5439} {"train_loss": -26.661224365234375, "global_step": 451502, "epoch": 5439} {"train_loss": -27.092559814453125, "global_step": 451503, "epoch": 5439} {"train_loss": -27.108001708984375, "global_step": 451504, "epoch": 5439} {"train_loss": -26.788053512573242, "global_step": 451505, "epoch": 5439} {"train_loss": -26.856618881225586, "global_step": 451506, "epoch": 5439} {"train_loss": -26.630212783813477, "global_step": 451507, "epoch": 5439} {"train_loss": -27.012073516845703, "global_step": 451508, "epoch": 5439} {"train_loss": -26.5778751373291, "global_step": 451509, "epoch": 5439} {"train_loss": -26.902807235717773, "global_step": 451510, "epoch": 5439} {"train_loss": -26.842809677124023, "global_step": 451511, "epoch": 5439} {"train_loss": -26.816190719604492, "global_step": 451512, "epoch": 5439} {"train_loss": -26.657968521118164, "global_step": 451513, "epoch": 5439} {"train_loss": -26.836217880249023, "global_step": 451514, "epoch": 5439} {"train_loss": -27.03030776977539, "global_step": 451515, "epoch": 5439} {"train_loss": -27.179548263549805, "global_step": 451516, "epoch": 5439} {"train_loss": -26.975278854370117, "global_step": 451517, "epoch": 5439} {"train_loss": -26.722217559814453, "global_step": 451518, "epoch": 5439} {"train_loss": -26.909769839551075, "global_step": 451519, "epoch": 5439, "val_loss": 6552622.5} {"train_loss": -27.095703125, "global_step": 451520, "epoch": 5440} {"train_loss": -26.8521785736084, "global_step": 451521, "epoch": 5440} {"train_loss": -26.415658950805664, "global_step": 451522, "epoch": 5440} {"train_loss": -26.20941162109375, "global_step": 451523, "epoch": 5440} {"train_loss": -26.609167098999023, "global_step": 451524, "epoch": 5440} {"train_loss": -26.184473037719727, "global_step": 451525, "epoch": 5440} {"train_loss": -27.103302001953125, "global_step": 451526, "epoch": 5440} {"train_loss": -26.944808959960938, "global_step": 451527, "epoch": 5440} {"train_loss": -26.382781982421875, "global_step": 451528, "epoch": 5440} {"train_loss": -26.70929527282715, "global_step": 451529, "epoch": 5440} {"train_loss": -27.04140281677246, "global_step": 451530, "epoch": 5440} {"train_loss": -27.193567276000977, "global_step": 451531, "epoch": 5440} {"train_loss": -26.749258041381836, "global_step": 451532, "epoch": 5440} {"train_loss": -26.86493492126465, "global_step": 451533, "epoch": 5440} {"train_loss": -26.672590255737305, "global_step": 451534, "epoch": 5440} {"train_loss": -27.22711753845215, "global_step": 451535, "epoch": 5440} {"train_loss": -27.001489639282227, "global_step": 451536, "epoch": 5440} {"train_loss": -26.79778480529785, "global_step": 451537, "epoch": 5440} {"train_loss": -27.023162841796875, "global_step": 451538, "epoch": 5440} {"train_loss": -27.05322265625, "global_step": 451539, "epoch": 5440} {"train_loss": -27.191404342651367, "global_step": 451540, "epoch": 5440} {"train_loss": -27.294879913330078, "global_step": 451541, "epoch": 5440} {"train_loss": -27.205718994140625, "global_step": 451542, "epoch": 5440} {"train_loss": -27.071500778198242, "global_step": 451543, "epoch": 5440} {"train_loss": -27.174802780151367, "global_step": 451544, "epoch": 5440} {"train_loss": -27.156347274780273, "global_step": 451545, "epoch": 5440} {"train_loss": -27.192243576049805, "global_step": 451546, "epoch": 5440} {"train_loss": -27.26519203186035, "global_step": 451547, "epoch": 5440} {"train_loss": -26.676565170288086, "global_step": 451548, "epoch": 5440} {"train_loss": -26.75909996032715, "global_step": 451549, "epoch": 5440} {"train_loss": -26.972761154174805, "global_step": 451550, "epoch": 5440} {"train_loss": -27.34305191040039, "global_step": 451551, "epoch": 5440} {"train_loss": -26.812408447265625, "global_step": 451552, "epoch": 5440} {"train_loss": -27.233230590820312, "global_step": 451553, "epoch": 5440} {"train_loss": -27.3173770904541, "global_step": 451554, "epoch": 5440} {"train_loss": -27.216760635375977, "global_step": 451555, "epoch": 5440} {"train_loss": -27.465139389038086, "global_step": 451556, "epoch": 5440} {"train_loss": -27.715757369995117, "global_step": 451557, "epoch": 5440} {"train_loss": -27.365631103515625, "global_step": 451558, "epoch": 5440} {"train_loss": -27.255956649780273, "global_step": 451559, "epoch": 5440} {"train_loss": -27.240201950073242, "global_step": 451560, "epoch": 5440} {"train_loss": -27.376739501953125, "global_step": 451561, "epoch": 5440} {"train_loss": -27.350778579711914, "global_step": 451562, "epoch": 5440} {"train_loss": -27.04401969909668, "global_step": 451563, "epoch": 5440} {"train_loss": -27.3621826171875, "global_step": 451564, "epoch": 5440} {"train_loss": -27.32000160217285, "global_step": 451565, "epoch": 5440} {"train_loss": -27.3571720123291, "global_step": 451566, "epoch": 5440} {"train_loss": -27.434839248657227, "global_step": 451567, "epoch": 5440} {"train_loss": -27.40338134765625, "global_step": 451568, "epoch": 5440} {"train_loss": -27.2017879486084, "global_step": 451569, "epoch": 5440} {"train_loss": -27.27115249633789, "global_step": 451570, "epoch": 5440} {"train_loss": -26.936965942382812, "global_step": 451571, "epoch": 5440} {"train_loss": -27.283254623413086, "global_step": 451572, "epoch": 5440} {"train_loss": -26.912023544311523, "global_step": 451573, "epoch": 5440} {"train_loss": -26.7099666595459, "global_step": 451574, "epoch": 5440} {"train_loss": -26.674402236938477, "global_step": 451575, "epoch": 5440} {"train_loss": -26.225866317749023, "global_step": 451576, "epoch": 5440} {"train_loss": -26.168500900268555, "global_step": 451577, "epoch": 5440} {"train_loss": -26.247480392456055, "global_step": 451578, "epoch": 5440} {"train_loss": -26.065698623657227, "global_step": 451579, "epoch": 5440} {"train_loss": -26.533935546875, "global_step": 451580, "epoch": 5440} {"train_loss": -27.007648468017578, "global_step": 451581, "epoch": 5440} {"train_loss": -26.41364860534668, "global_step": 451582, "epoch": 5440} {"train_loss": -26.28211784362793, "global_step": 451583, "epoch": 5440} {"train_loss": -26.336669921875, "global_step": 451584, "epoch": 5440} {"train_loss": -25.907556533813477, "global_step": 451585, "epoch": 5440} {"train_loss": -26.360998153686523, "global_step": 451586, "epoch": 5440} {"train_loss": -26.5933895111084, "global_step": 451587, "epoch": 5440} {"train_loss": -26.760574340820312, "global_step": 451588, "epoch": 5440} {"train_loss": -26.65949821472168, "global_step": 451589, "epoch": 5440} {"train_loss": -26.82693862915039, "global_step": 451590, "epoch": 5440} {"train_loss": -26.806310653686523, "global_step": 451591, "epoch": 5440} {"train_loss": -26.98262596130371, "global_step": 451592, "epoch": 5440} {"train_loss": -27.141286849975586, "global_step": 451593, "epoch": 5440} {"train_loss": -27.102563858032227, "global_step": 451594, "epoch": 5440} {"train_loss": -26.75374412536621, "global_step": 451595, "epoch": 5440} {"train_loss": -26.7680721282959, "global_step": 451596, "epoch": 5440} {"train_loss": -26.695581436157227, "global_step": 451597, "epoch": 5440} {"train_loss": -27.0689697265625, "global_step": 451598, "epoch": 5440} {"train_loss": -26.973133087158203, "global_step": 451599, "epoch": 5440} {"train_loss": -27.128122329711914, "global_step": 451600, "epoch": 5440} {"train_loss": -27.0715274810791, "global_step": 451601, "epoch": 5440} {"train_loss": -26.92722242424287, "global_step": 451602, "epoch": 5440, "val_loss": 6503028.0} {"train_loss": -26.523956298828125, "global_step": 451603, "epoch": 5441} {"train_loss": -26.759021759033203, "global_step": 451604, "epoch": 5441} {"train_loss": -26.251941680908203, "global_step": 451605, "epoch": 5441} {"train_loss": -26.459659576416016, "global_step": 451606, "epoch": 5441} {"train_loss": -26.53985023498535, "global_step": 451607, "epoch": 5441} {"train_loss": -26.635961532592773, "global_step": 451608, "epoch": 5441} {"train_loss": -26.689132690429688, "global_step": 451609, "epoch": 5441} {"train_loss": -26.25848960876465, "global_step": 451610, "epoch": 5441} {"train_loss": -26.491846084594727, "global_step": 451611, "epoch": 5441} {"train_loss": -26.661375045776367, "global_step": 451612, "epoch": 5441} {"train_loss": -26.922550201416016, "global_step": 451613, "epoch": 5441} {"train_loss": -27.142261505126953, "global_step": 451614, "epoch": 5441} {"train_loss": -26.9058780670166, "global_step": 451615, "epoch": 5441} {"train_loss": -26.934757232666016, "global_step": 451616, "epoch": 5441} {"train_loss": -27.052038192749023, "global_step": 451617, "epoch": 5441} {"train_loss": -27.288818359375, "global_step": 451618, "epoch": 5441} {"train_loss": -26.8088321685791, "global_step": 451619, "epoch": 5441} {"train_loss": -26.715932846069336, "global_step": 451620, "epoch": 5441} {"train_loss": -26.9400691986084, "global_step": 451621, "epoch": 5441} {"train_loss": -26.86328125, "global_step": 451622, "epoch": 5441} {"train_loss": -27.376571655273438, "global_step": 451623, "epoch": 5441} {"train_loss": -26.996362686157227, "global_step": 451624, "epoch": 5441} {"train_loss": -26.84885025024414, "global_step": 451625, "epoch": 5441} {"train_loss": -27.63065528869629, "global_step": 451626, "epoch": 5441} {"train_loss": -26.543933868408203, "global_step": 451627, "epoch": 5441} {"train_loss": -26.795211791992188, "global_step": 451628, "epoch": 5441} {"train_loss": -26.720996856689453, "global_step": 451629, "epoch": 5441} {"train_loss": -27.038908004760742, "global_step": 451630, "epoch": 5441} {"train_loss": -27.02678871154785, "global_step": 451631, "epoch": 5441} {"train_loss": -27.384546279907227, "global_step": 451632, "epoch": 5441} {"train_loss": -27.455280303955078, "global_step": 451633, "epoch": 5441} {"train_loss": -27.15569496154785, "global_step": 451634, "epoch": 5441} {"train_loss": -27.075021743774414, "global_step": 451635, "epoch": 5441} {"train_loss": -27.54176139831543, "global_step": 451636, "epoch": 5441} {"train_loss": -26.926733016967773, "global_step": 451637, "epoch": 5441} {"train_loss": -27.28590202331543, "global_step": 451638, "epoch": 5441} {"train_loss": -27.471302032470703, "global_step": 451639, "epoch": 5441} {"train_loss": -27.168481826782227, "global_step": 451640, "epoch": 5441} {"train_loss": -26.97760009765625, "global_step": 451641, "epoch": 5441} {"train_loss": -26.862369537353516, "global_step": 451642, "epoch": 5441} {"train_loss": -27.140888214111328, "global_step": 451643, "epoch": 5441} {"train_loss": -27.403966903686523, "global_step": 451644, "epoch": 5441} {"train_loss": -27.303302764892578, "global_step": 451645, "epoch": 5441} {"train_loss": -27.214160919189453, "global_step": 451646, "epoch": 5441} {"train_loss": -27.228952407836914, "global_step": 451647, "epoch": 5441} {"train_loss": -27.162200927734375, "global_step": 451648, "epoch": 5441} {"train_loss": -27.005537033081055, "global_step": 451649, "epoch": 5441} {"train_loss": -27.137775421142578, "global_step": 451650, "epoch": 5441} {"train_loss": -26.99370765686035, "global_step": 451651, "epoch": 5441} {"train_loss": -27.3016300201416, "global_step": 451652, "epoch": 5441} {"train_loss": -26.958593368530273, "global_step": 451653, "epoch": 5441} {"train_loss": -27.15180015563965, "global_step": 451654, "epoch": 5441} {"train_loss": -27.253692626953125, "global_step": 451655, "epoch": 5441} {"train_loss": -27.176538467407227, "global_step": 451656, "epoch": 5441} {"train_loss": -27.213703155517578, "global_step": 451657, "epoch": 5441} {"train_loss": -27.05649757385254, "global_step": 451658, "epoch": 5441} {"train_loss": -26.902587890625, "global_step": 451659, "epoch": 5441} {"train_loss": -27.6181583404541, "global_step": 451660, "epoch": 5441} {"train_loss": -27.092458724975586, "global_step": 451661, "epoch": 5441} {"train_loss": -27.29730796813965, "global_step": 451662, "epoch": 5441} {"train_loss": -26.848005294799805, "global_step": 451663, "epoch": 5441} {"train_loss": -26.642667770385742, "global_step": 451664, "epoch": 5441} {"train_loss": -26.199522018432617, "global_step": 451665, "epoch": 5441} {"train_loss": -25.895124435424805, "global_step": 451666, "epoch": 5441} {"train_loss": -25.54511260986328, "global_step": 451667, "epoch": 5441} {"train_loss": -26.298505783081055, "global_step": 451668, "epoch": 5441} {"train_loss": -26.85054588317871, "global_step": 451669, "epoch": 5441} {"train_loss": -26.718725204467773, "global_step": 451670, "epoch": 5441} {"train_loss": -26.794281005859375, "global_step": 451671, "epoch": 5441} {"train_loss": -27.009260177612305, "global_step": 451672, "epoch": 5441} {"train_loss": -26.460315704345703, "global_step": 451673, "epoch": 5441} {"train_loss": -27.083770751953125, "global_step": 451674, "epoch": 5441} {"train_loss": -26.98215675354004, "global_step": 451675, "epoch": 5441} {"train_loss": -26.61309814453125, "global_step": 451676, "epoch": 5441} {"train_loss": -27.38067054748535, "global_step": 451677, "epoch": 5441} {"train_loss": -26.729888916015625, "global_step": 451678, "epoch": 5441} {"train_loss": -27.48651123046875, "global_step": 451679, "epoch": 5441} {"train_loss": -26.77725601196289, "global_step": 451680, "epoch": 5441} {"train_loss": -27.042097091674805, "global_step": 451681, "epoch": 5441} {"train_loss": -26.87837028503418, "global_step": 451682, "epoch": 5441} {"train_loss": -26.8233585357666, "global_step": 451683, "epoch": 5441} {"train_loss": -27.208677291870117, "global_step": 451684, "epoch": 5441} {"train_loss": -26.927987018263483, "global_step": 451685, "epoch": 5441, "val_loss": 6487728.0} {"train_loss": -27.031747817993164, "global_step": 451686, "epoch": 5442} {"train_loss": -26.853490829467773, "global_step": 451687, "epoch": 5442} {"train_loss": -26.55759620666504, "global_step": 451688, "epoch": 5442} {"train_loss": -26.940753936767578, "global_step": 451689, "epoch": 5442} {"train_loss": -26.870824813842773, "global_step": 451690, "epoch": 5442} {"train_loss": -27.074909210205078, "global_step": 451691, "epoch": 5442} {"train_loss": -27.033178329467773, "global_step": 451692, "epoch": 5442} {"train_loss": -26.770401000976562, "global_step": 451693, "epoch": 5442} {"train_loss": -26.895444869995117, "global_step": 451694, "epoch": 5442} {"train_loss": -26.802534103393555, "global_step": 451695, "epoch": 5442} {"train_loss": -27.082950592041016, "global_step": 451696, "epoch": 5442} {"train_loss": -26.887683868408203, "global_step": 451697, "epoch": 5442} {"train_loss": -27.189870834350586, "global_step": 451698, "epoch": 5442} {"train_loss": -27.128986358642578, "global_step": 451699, "epoch": 5442} {"train_loss": -27.07600975036621, "global_step": 451700, "epoch": 5442} {"train_loss": -26.997833251953125, "global_step": 451701, "epoch": 5442} {"train_loss": -27.263748168945312, "global_step": 451702, "epoch": 5442} {"train_loss": -26.9951229095459, "global_step": 451703, "epoch": 5442} {"train_loss": -27.30270767211914, "global_step": 451704, "epoch": 5442} {"train_loss": -27.054187774658203, "global_step": 451705, "epoch": 5442} {"train_loss": -26.666833877563477, "global_step": 451706, "epoch": 5442} {"train_loss": -26.870962142944336, "global_step": 451707, "epoch": 5442} {"train_loss": -26.990772247314453, "global_step": 451708, "epoch": 5442} {"train_loss": -27.145959854125977, "global_step": 451709, "epoch": 5442} {"train_loss": -26.886579513549805, "global_step": 451710, "epoch": 5442} {"train_loss": -27.35116958618164, "global_step": 451711, "epoch": 5442} {"train_loss": -27.240814208984375, "global_step": 451712, "epoch": 5442} {"train_loss": -27.20387840270996, "global_step": 451713, "epoch": 5442} {"train_loss": -27.30707359313965, "global_step": 451714, "epoch": 5442} {"train_loss": -27.202009201049805, "global_step": 451715, "epoch": 5442} {"train_loss": -27.003393173217773, "global_step": 451716, "epoch": 5442} {"train_loss": -27.22637939453125, "global_step": 451717, "epoch": 5442} {"train_loss": -26.87568473815918, "global_step": 451718, "epoch": 5442} {"train_loss": -27.053510665893555, "global_step": 451719, "epoch": 5442} {"train_loss": -27.72367286682129, "global_step": 451720, "epoch": 5442} {"train_loss": -27.2471981048584, "global_step": 451721, "epoch": 5442} {"train_loss": -26.964624404907227, "global_step": 451722, "epoch": 5442} {"train_loss": -27.253576278686523, "global_step": 451723, "epoch": 5442} {"train_loss": -27.171630859375, "global_step": 451724, "epoch": 5442} {"train_loss": -26.907255172729492, "global_step": 451725, "epoch": 5442} {"train_loss": -26.915647506713867, "global_step": 451726, "epoch": 5442} {"train_loss": -27.447345733642578, "global_step": 451727, "epoch": 5442} {"train_loss": -27.571918487548828, "global_step": 451728, "epoch": 5442} {"train_loss": -27.430219650268555, "global_step": 451729, "epoch": 5442} {"train_loss": -27.53763771057129, "global_step": 451730, "epoch": 5442} {"train_loss": -27.448698043823242, "global_step": 451731, "epoch": 5442} {"train_loss": -27.2331600189209, "global_step": 451732, "epoch": 5442} {"train_loss": -27.22138786315918, "global_step": 451733, "epoch": 5442} {"train_loss": -26.69696044921875, "global_step": 451734, "epoch": 5442} {"train_loss": -27.093347549438477, "global_step": 451735, "epoch": 5442} {"train_loss": -26.42951011657715, "global_step": 451736, "epoch": 5442} {"train_loss": -25.93474769592285, "global_step": 451737, "epoch": 5442} {"train_loss": -26.598770141601562, "global_step": 451738, "epoch": 5442} {"train_loss": -26.91299819946289, "global_step": 451739, "epoch": 5442} {"train_loss": -26.01418113708496, "global_step": 451740, "epoch": 5442} {"train_loss": -26.47125816345215, "global_step": 451741, "epoch": 5442} {"train_loss": -26.303197860717773, "global_step": 451742, "epoch": 5442} {"train_loss": -26.886016845703125, "global_step": 451743, "epoch": 5442} {"train_loss": -26.557580947875977, "global_step": 451744, "epoch": 5442} {"train_loss": -26.486780166625977, "global_step": 451745, "epoch": 5442} {"train_loss": -26.6517333984375, "global_step": 451746, "epoch": 5442} {"train_loss": -26.887937545776367, "global_step": 451747, "epoch": 5442} {"train_loss": -26.615314483642578, "global_step": 451748, "epoch": 5442} {"train_loss": -26.993200302124023, "global_step": 451749, "epoch": 5442} {"train_loss": -26.815576553344727, "global_step": 451750, "epoch": 5442} {"train_loss": -26.653553009033203, "global_step": 451751, "epoch": 5442} {"train_loss": -26.481786727905273, "global_step": 451752, "epoch": 5442} {"train_loss": -26.861902236938477, "global_step": 451753, "epoch": 5442} {"train_loss": -26.822851181030273, "global_step": 451754, "epoch": 5442} {"train_loss": -26.57480239868164, "global_step": 451755, "epoch": 5442} {"train_loss": -26.935144424438477, "global_step": 451756, "epoch": 5442} {"train_loss": -27.018402099609375, "global_step": 451757, "epoch": 5442} {"train_loss": -26.647018432617188, "global_step": 451758, "epoch": 5442} {"train_loss": -26.49464225769043, "global_step": 451759, "epoch": 5442} {"train_loss": -26.879703521728516, "global_step": 451760, "epoch": 5442} {"train_loss": -26.37274169921875, "global_step": 451761, "epoch": 5442} {"train_loss": -26.684980392456055, "global_step": 451762, "epoch": 5442} {"train_loss": -26.606531143188477, "global_step": 451763, "epoch": 5442} {"train_loss": -27.04220962524414, "global_step": 451764, "epoch": 5442} {"train_loss": -26.920446395874023, "global_step": 451765, "epoch": 5442} {"train_loss": -27.12577247619629, "global_step": 451766, "epoch": 5442} {"train_loss": -26.88753318786621, "global_step": 451767, "epoch": 5442} {"train_loss": -26.93998520632824, "global_step": 451768, "epoch": 5442, "val_loss": 6524593.5} {"train_loss": -27.083709716796875, "global_step": 451769, "epoch": 5443} {"train_loss": -26.583637237548828, "global_step": 451770, "epoch": 5443} {"train_loss": -27.0273380279541, "global_step": 451771, "epoch": 5443} {"train_loss": -26.156763076782227, "global_step": 451772, "epoch": 5443} {"train_loss": -26.518878936767578, "global_step": 451773, "epoch": 5443} {"train_loss": -27.163318634033203, "global_step": 451774, "epoch": 5443} {"train_loss": -26.4483642578125, "global_step": 451775, "epoch": 5443} {"train_loss": -26.934629440307617, "global_step": 451776, "epoch": 5443} {"train_loss": -26.94257164001465, "global_step": 451777, "epoch": 5443} {"train_loss": -26.825674057006836, "global_step": 451778, "epoch": 5443} {"train_loss": -26.783475875854492, "global_step": 451779, "epoch": 5443} {"train_loss": -26.837316513061523, "global_step": 451780, "epoch": 5443} {"train_loss": -27.13117027282715, "global_step": 451781, "epoch": 5443} {"train_loss": -26.848493576049805, "global_step": 451782, "epoch": 5443} {"train_loss": -27.199462890625, "global_step": 451783, "epoch": 5443} {"train_loss": -27.114425659179688, "global_step": 451784, "epoch": 5443} {"train_loss": -27.366281509399414, "global_step": 451785, "epoch": 5443} {"train_loss": -26.828161239624023, "global_step": 451786, "epoch": 5443} {"train_loss": -27.074304580688477, "global_step": 451787, "epoch": 5443} {"train_loss": -27.35249137878418, "global_step": 451788, "epoch": 5443} {"train_loss": -26.760589599609375, "global_step": 451789, "epoch": 5443} {"train_loss": -27.35698890686035, "global_step": 451790, "epoch": 5443} {"train_loss": -26.71551513671875, "global_step": 451791, "epoch": 5443} {"train_loss": -26.88181495666504, "global_step": 451792, "epoch": 5443} {"train_loss": -27.16889762878418, "global_step": 451793, "epoch": 5443} {"train_loss": -27.143386840820312, "global_step": 451794, "epoch": 5443} {"train_loss": -27.32166862487793, "global_step": 451795, "epoch": 5443} {"train_loss": -27.101526260375977, "global_step": 451796, "epoch": 5443} {"train_loss": -27.251190185546875, "global_step": 451797, "epoch": 5443} {"train_loss": -26.848907470703125, "global_step": 451798, "epoch": 5443} {"train_loss": -27.152917861938477, "global_step": 451799, "epoch": 5443} {"train_loss": -27.111328125, "global_step": 451800, "epoch": 5443} {"train_loss": -27.011823654174805, "global_step": 451801, "epoch": 5443} {"train_loss": -27.241958618164062, "global_step": 451802, "epoch": 5443} {"train_loss": -27.013235092163086, "global_step": 451803, "epoch": 5443} {"train_loss": -26.7119083404541, "global_step": 451804, "epoch": 5443} {"train_loss": -27.138004302978516, "global_step": 451805, "epoch": 5443} {"train_loss": -27.232181549072266, "global_step": 451806, "epoch": 5443} {"train_loss": -27.618457794189453, "global_step": 451807, "epoch": 5443} {"train_loss": -27.33978271484375, "global_step": 451808, "epoch": 5443} {"train_loss": -27.12415885925293, "global_step": 451809, "epoch": 5443} {"train_loss": -27.026935577392578, "global_step": 451810, "epoch": 5443} {"train_loss": -27.36208152770996, "global_step": 451811, "epoch": 5443} {"train_loss": -27.76739501953125, "global_step": 451812, "epoch": 5443} {"train_loss": -27.28104591369629, "global_step": 451813, "epoch": 5443} {"train_loss": -26.905338287353516, "global_step": 451814, "epoch": 5443} {"train_loss": -27.298309326171875, "global_step": 451815, "epoch": 5443} {"train_loss": -27.171722412109375, "global_step": 451816, "epoch": 5443} {"train_loss": -27.259130477905273, "global_step": 451817, "epoch": 5443} {"train_loss": -27.215717315673828, "global_step": 451818, "epoch": 5443} {"train_loss": -27.196744918823242, "global_step": 451819, "epoch": 5443} {"train_loss": -27.5244197845459, "global_step": 451820, "epoch": 5443} {"train_loss": -27.075483322143555, "global_step": 451821, "epoch": 5443} {"train_loss": -27.187280654907227, "global_step": 451822, "epoch": 5443} {"train_loss": -27.180465698242188, "global_step": 451823, "epoch": 5443} {"train_loss": -26.996606826782227, "global_step": 451824, "epoch": 5443} {"train_loss": -26.945032119750977, "global_step": 451825, "epoch": 5443} {"train_loss": -27.10932731628418, "global_step": 451826, "epoch": 5443} {"train_loss": -27.199111938476562, "global_step": 451827, "epoch": 5443} {"train_loss": -26.935510635375977, "global_step": 451828, "epoch": 5443} {"train_loss": -26.729984283447266, "global_step": 451829, "epoch": 5443} {"train_loss": -25.900129318237305, "global_step": 451830, "epoch": 5443} {"train_loss": -25.096426010131836, "global_step": 451831, "epoch": 5443} {"train_loss": -25.221952438354492, "global_step": 451832, "epoch": 5443} {"train_loss": -26.760629653930664, "global_step": 451833, "epoch": 5443} {"train_loss": -25.750186920166016, "global_step": 451834, "epoch": 5443} {"train_loss": -26.5023193359375, "global_step": 451835, "epoch": 5443} {"train_loss": -26.5471248626709, "global_step": 451836, "epoch": 5443} {"train_loss": -26.758508682250977, "global_step": 451837, "epoch": 5443} {"train_loss": -26.61134910583496, "global_step": 451838, "epoch": 5443} {"train_loss": -27.237747192382812, "global_step": 451839, "epoch": 5443} {"train_loss": -26.749799728393555, "global_step": 451840, "epoch": 5443} {"train_loss": -26.873456954956055, "global_step": 451841, "epoch": 5443} {"train_loss": -26.6458683013916, "global_step": 451842, "epoch": 5443} {"train_loss": -26.24267578125, "global_step": 451843, "epoch": 5443} {"train_loss": -26.828693389892578, "global_step": 451844, "epoch": 5443} {"train_loss": -26.56568717956543, "global_step": 451845, "epoch": 5443} {"train_loss": -26.68177604675293, "global_step": 451846, "epoch": 5443} {"train_loss": -26.784025192260742, "global_step": 451847, "epoch": 5443} {"train_loss": -26.477054595947266, "global_step": 451848, "epoch": 5443} {"train_loss": -26.648822784423828, "global_step": 451849, "epoch": 5443} {"train_loss": -26.734922409057617, "global_step": 451850, "epoch": 5443} {"train_loss": -26.91023224520396, "global_step": 451851, "epoch": 5443, "val_loss": 6503761.5} {"train_loss": -25.456260681152344, "global_step": 451852, "epoch": 5444} {"train_loss": -26.19038200378418, "global_step": 451853, "epoch": 5444} {"train_loss": -25.67354393005371, "global_step": 451854, "epoch": 5444} {"train_loss": -25.2414493560791, "global_step": 451855, "epoch": 5444} {"train_loss": -26.126474380493164, "global_step": 451856, "epoch": 5444} {"train_loss": -25.228984832763672, "global_step": 451857, "epoch": 5444} {"train_loss": -26.260791778564453, "global_step": 451858, "epoch": 5444} {"train_loss": -25.797040939331055, "global_step": 451859, "epoch": 5444} {"train_loss": -26.1361141204834, "global_step": 451860, "epoch": 5444} {"train_loss": -25.9965877532959, "global_step": 451861, "epoch": 5444} {"train_loss": -26.363492965698242, "global_step": 451862, "epoch": 5444} {"train_loss": -26.471506118774414, "global_step": 451863, "epoch": 5444} {"train_loss": -26.237689971923828, "global_step": 451864, "epoch": 5444} {"train_loss": -26.381006240844727, "global_step": 451865, "epoch": 5444} {"train_loss": -26.740554809570312, "global_step": 451866, "epoch": 5444} {"train_loss": -26.55269432067871, "global_step": 451867, "epoch": 5444} {"train_loss": -26.62424659729004, "global_step": 451868, "epoch": 5444} {"train_loss": -26.37554359436035, "global_step": 451869, "epoch": 5444} {"train_loss": -26.586400985717773, "global_step": 451870, "epoch": 5444} {"train_loss": -26.6312255859375, "global_step": 451871, "epoch": 5444} {"train_loss": -26.201038360595703, "global_step": 451872, "epoch": 5444} {"train_loss": -26.821752548217773, "global_step": 451873, "epoch": 5444} {"train_loss": -26.7708797454834, "global_step": 451874, "epoch": 5444} {"train_loss": -26.46551513671875, "global_step": 451875, "epoch": 5444} {"train_loss": -26.596393585205078, "global_step": 451876, "epoch": 5444} {"train_loss": -26.761075973510742, "global_step": 451877, "epoch": 5444} {"train_loss": -26.865949630737305, "global_step": 451878, "epoch": 5444} {"train_loss": -26.689680099487305, "global_step": 451879, "epoch": 5444} {"train_loss": -26.768573760986328, "global_step": 451880, "epoch": 5444} {"train_loss": -27.122577667236328, "global_step": 451881, "epoch": 5444} {"train_loss": -26.944814682006836, "global_step": 451882, "epoch": 5444} {"train_loss": -26.871259689331055, "global_step": 451883, "epoch": 5444} {"train_loss": -26.968902587890625, "global_step": 451884, "epoch": 5444} {"train_loss": -26.980518341064453, "global_step": 451885, "epoch": 5444} {"train_loss": -27.020334243774414, "global_step": 451886, "epoch": 5444} {"train_loss": -26.9129581451416, "global_step": 451887, "epoch": 5444} {"train_loss": -26.936262130737305, "global_step": 451888, "epoch": 5444} {"train_loss": -27.20346450805664, "global_step": 451889, "epoch": 5444} {"train_loss": -26.9210147857666, "global_step": 451890, "epoch": 5444} {"train_loss": -27.234235763549805, "global_step": 451891, "epoch": 5444} {"train_loss": -27.036331176757812, "global_step": 451892, "epoch": 5444} {"train_loss": -27.194278717041016, "global_step": 451893, "epoch": 5444} {"train_loss": -27.07470703125, "global_step": 451894, "epoch": 5444} {"train_loss": -27.078027725219727, "global_step": 451895, "epoch": 5444} {"train_loss": -26.89320182800293, "global_step": 451896, "epoch": 5444} {"train_loss": -26.848011016845703, "global_step": 451897, "epoch": 5444} {"train_loss": -27.045684814453125, "global_step": 451898, "epoch": 5444} {"train_loss": -27.170835494995117, "global_step": 451899, "epoch": 5444} {"train_loss": -27.292150497436523, "global_step": 451900, "epoch": 5444} {"train_loss": -26.881444931030273, "global_step": 451901, "epoch": 5444} {"train_loss": -27.319639205932617, "global_step": 451902, "epoch": 5444} {"train_loss": -27.45369529724121, "global_step": 451903, "epoch": 5444} {"train_loss": -27.208532333374023, "global_step": 451904, "epoch": 5444} {"train_loss": -27.022541046142578, "global_step": 451905, "epoch": 5444} {"train_loss": -27.46268081665039, "global_step": 451906, "epoch": 5444} {"train_loss": -27.020832061767578, "global_step": 451907, "epoch": 5444} {"train_loss": -27.485517501831055, "global_step": 451908, "epoch": 5444} {"train_loss": -26.881534576416016, "global_step": 451909, "epoch": 5444} {"train_loss": -26.8404598236084, "global_step": 451910, "epoch": 5444} {"train_loss": -26.579587936401367, "global_step": 451911, "epoch": 5444} {"train_loss": -26.94605827331543, "global_step": 451912, "epoch": 5444} {"train_loss": -27.541173934936523, "global_step": 451913, "epoch": 5444} {"train_loss": -27.18763542175293, "global_step": 451914, "epoch": 5444} {"train_loss": -26.69587516784668, "global_step": 451915, "epoch": 5444} {"train_loss": -26.43558120727539, "global_step": 451916, "epoch": 5444} {"train_loss": -26.99652671813965, "global_step": 451917, "epoch": 5444} {"train_loss": -26.754281997680664, "global_step": 451918, "epoch": 5444} {"train_loss": -26.62717628479004, "global_step": 451919, "epoch": 5444} {"train_loss": -27.319538116455078, "global_step": 451920, "epoch": 5444} {"train_loss": -27.1412296295166, "global_step": 451921, "epoch": 5444} {"train_loss": -26.88973045349121, "global_step": 451922, "epoch": 5444} {"train_loss": -26.86542320251465, "global_step": 451923, "epoch": 5444} {"train_loss": -26.797231674194336, "global_step": 451924, "epoch": 5444} {"train_loss": -27.47406005859375, "global_step": 451925, "epoch": 5444} {"train_loss": -27.38075065612793, "global_step": 451926, "epoch": 5444} {"train_loss": -26.7290096282959, "global_step": 451927, "epoch": 5444} {"train_loss": -27.260395050048828, "global_step": 451928, "epoch": 5444} {"train_loss": -27.21051597595215, "global_step": 451929, "epoch": 5444} {"train_loss": -27.008344650268555, "global_step": 451930, "epoch": 5444} {"train_loss": -26.721099853515625, "global_step": 451931, "epoch": 5444} {"train_loss": -27.279829025268555, "global_step": 451932, "epoch": 5444} {"train_loss": -27.262348175048828, "global_step": 451933, "epoch": 5444} {"train_loss": -26.788411450673298, "global_step": 451934, "epoch": 5444, "val_loss": 6481776.0} {"train_loss": -27.17629051208496, "global_step": 451935, "epoch": 5445} {"train_loss": -26.380538940429688, "global_step": 451936, "epoch": 5445} {"train_loss": -26.717309951782227, "global_step": 451937, "epoch": 5445} {"train_loss": -26.641942977905273, "global_step": 451938, "epoch": 5445} {"train_loss": -26.959949493408203, "global_step": 451939, "epoch": 5445} {"train_loss": -26.931501388549805, "global_step": 451940, "epoch": 5445} {"train_loss": -26.88702392578125, "global_step": 451941, "epoch": 5445} {"train_loss": -26.540807723999023, "global_step": 451942, "epoch": 5445} {"train_loss": -26.8314151763916, "global_step": 451943, "epoch": 5445} {"train_loss": -26.83403968811035, "global_step": 451944, "epoch": 5445} {"train_loss": -26.66495704650879, "global_step": 451945, "epoch": 5445} {"train_loss": -27.08723258972168, "global_step": 451946, "epoch": 5445} {"train_loss": -26.72458839416504, "global_step": 451947, "epoch": 5445} {"train_loss": -26.990137100219727, "global_step": 451948, "epoch": 5445} {"train_loss": -26.933393478393555, "global_step": 451949, "epoch": 5445} {"train_loss": -26.597074508666992, "global_step": 451950, "epoch": 5445} {"train_loss": -26.760833740234375, "global_step": 451951, "epoch": 5445} {"train_loss": -27.059967041015625, "global_step": 451952, "epoch": 5445} {"train_loss": -27.25860023498535, "global_step": 451953, "epoch": 5445} {"train_loss": -27.086835861206055, "global_step": 451954, "epoch": 5445} {"train_loss": -27.39238929748535, "global_step": 451955, "epoch": 5445} {"train_loss": -27.041940689086914, "global_step": 451956, "epoch": 5445} {"train_loss": -26.92328453063965, "global_step": 451957, "epoch": 5445} {"train_loss": -26.907068252563477, "global_step": 451958, "epoch": 5445} {"train_loss": -26.82008171081543, "global_step": 451959, "epoch": 5445} {"train_loss": -27.144412994384766, "global_step": 451960, "epoch": 5445} {"train_loss": -27.226770401000977, "global_step": 451961, "epoch": 5445} {"train_loss": -27.35845947265625, "global_step": 451962, "epoch": 5445} {"train_loss": -27.249265670776367, "global_step": 451963, "epoch": 5445} {"train_loss": -27.17988395690918, "global_step": 451964, "epoch": 5445} {"train_loss": -27.345905303955078, "global_step": 451965, "epoch": 5445} {"train_loss": -27.279821395874023, "global_step": 451966, "epoch": 5445} {"train_loss": -27.13822364807129, "global_step": 451967, "epoch": 5445} {"train_loss": -27.161645889282227, "global_step": 451968, "epoch": 5445} {"train_loss": -27.0297908782959, "global_step": 451969, "epoch": 5445} {"train_loss": -27.238819122314453, "global_step": 451970, "epoch": 5445} {"train_loss": -27.23455238342285, "global_step": 451971, "epoch": 5445} {"train_loss": -27.174829483032227, "global_step": 451972, "epoch": 5445} {"train_loss": -27.01283073425293, "global_step": 451973, "epoch": 5445} {"train_loss": -27.509387969970703, "global_step": 451974, "epoch": 5445} {"train_loss": -27.191030502319336, "global_step": 451975, "epoch": 5445} {"train_loss": -27.375043869018555, "global_step": 451976, "epoch": 5445} {"train_loss": -27.28348731994629, "global_step": 451977, "epoch": 5445} {"train_loss": -27.11756706237793, "global_step": 451978, "epoch": 5445} {"train_loss": -26.94964027404785, "global_step": 451979, "epoch": 5445} {"train_loss": -27.225311279296875, "global_step": 451980, "epoch": 5445} {"train_loss": -26.97967529296875, "global_step": 451981, "epoch": 5445} {"train_loss": -27.240005493164062, "global_step": 451982, "epoch": 5445} {"train_loss": -27.456079483032227, "global_step": 451983, "epoch": 5445} {"train_loss": -27.142261505126953, "global_step": 451984, "epoch": 5445} {"train_loss": -27.113483428955078, "global_step": 451985, "epoch": 5445} {"train_loss": -27.13006019592285, "global_step": 451986, "epoch": 5445} {"train_loss": -27.147968292236328, "global_step": 451987, "epoch": 5445} {"train_loss": -27.338043212890625, "global_step": 451988, "epoch": 5445} {"train_loss": -26.840845108032227, "global_step": 451989, "epoch": 5445} {"train_loss": -27.126245498657227, "global_step": 451990, "epoch": 5445} {"train_loss": -27.15186882019043, "global_step": 451991, "epoch": 5445} {"train_loss": -27.010421752929688, "global_step": 451992, "epoch": 5445} {"train_loss": -27.511938095092773, "global_step": 451993, "epoch": 5445} {"train_loss": -26.913755416870117, "global_step": 451994, "epoch": 5445} {"train_loss": -27.150556564331055, "global_step": 451995, "epoch": 5445} {"train_loss": -27.37733268737793, "global_step": 451996, "epoch": 5445} {"train_loss": -27.029645919799805, "global_step": 451997, "epoch": 5445} {"train_loss": -27.124425888061523, "global_step": 451998, "epoch": 5445} {"train_loss": -27.417272567749023, "global_step": 451999, "epoch": 5445} {"train_loss": -27.0384521484375, "global_step": 452000, "epoch": 5445} {"train_loss": -27.2178897857666, "global_step": 452001, "epoch": 5445} {"train_loss": -27.122812271118164, "global_step": 452002, "epoch": 5445} {"train_loss": -27.167804718017578, "global_step": 452003, "epoch": 5445} {"train_loss": -26.94466209411621, "global_step": 452004, "epoch": 5445} {"train_loss": -27.2523193359375, "global_step": 452005, "epoch": 5445} {"train_loss": -27.5721435546875, "global_step": 452006, "epoch": 5445} {"train_loss": -27.042236328125, "global_step": 452007, "epoch": 5445} {"train_loss": -26.999486923217773, "global_step": 452008, "epoch": 5445} {"train_loss": -27.199405670166016, "global_step": 452009, "epoch": 5445} {"train_loss": -27.054431915283203, "global_step": 452010, "epoch": 5445} {"train_loss": -27.19675636291504, "global_step": 452011, "epoch": 5445} {"train_loss": -27.14999771118164, "global_step": 452012, "epoch": 5445} {"train_loss": -26.967899322509766, "global_step": 452013, "epoch": 5445} {"train_loss": -27.120779037475586, "global_step": 452014, "epoch": 5445} {"train_loss": -27.223474502563477, "global_step": 452015, "epoch": 5445} {"train_loss": -27.01559829711914, "global_step": 452016, "epoch": 5445} {"train_loss": -27.077039649687617, "global_step": 452017, "epoch": 5445, "val_loss": 6550380.0} {"train_loss": -26.546680450439453, "global_step": 452018, "epoch": 5446} {"train_loss": -26.194616317749023, "global_step": 452019, "epoch": 5446} {"train_loss": -25.78065299987793, "global_step": 452020, "epoch": 5446} {"train_loss": -26.6064453125, "global_step": 452021, "epoch": 5446} {"train_loss": -26.042316436767578, "global_step": 452022, "epoch": 5446} {"train_loss": -26.068357467651367, "global_step": 452023, "epoch": 5446} {"train_loss": -26.318750381469727, "global_step": 452024, "epoch": 5446} {"train_loss": -26.078237533569336, "global_step": 452025, "epoch": 5446} {"train_loss": -27.15999412536621, "global_step": 452026, "epoch": 5446} {"train_loss": -26.91119384765625, "global_step": 452027, "epoch": 5446} {"train_loss": -26.557233810424805, "global_step": 452028, "epoch": 5446} {"train_loss": -26.860797882080078, "global_step": 452029, "epoch": 5446} {"train_loss": -26.961034774780273, "global_step": 452030, "epoch": 5446} {"train_loss": -26.882612228393555, "global_step": 452031, "epoch": 5446} {"train_loss": -27.22800636291504, "global_step": 452032, "epoch": 5446} {"train_loss": -26.84000015258789, "global_step": 452033, "epoch": 5446} {"train_loss": -26.65805435180664, "global_step": 452034, "epoch": 5446} {"train_loss": -27.221357345581055, "global_step": 452035, "epoch": 5446} {"train_loss": -26.98321533203125, "global_step": 452036, "epoch": 5446} {"train_loss": -27.187726974487305, "global_step": 452037, "epoch": 5446} {"train_loss": -26.914642333984375, "global_step": 452038, "epoch": 5446} {"train_loss": -27.0866756439209, "global_step": 452039, "epoch": 5446} {"train_loss": -26.876163482666016, "global_step": 452040, "epoch": 5446} {"train_loss": -27.14802360534668, "global_step": 452041, "epoch": 5446} {"train_loss": -26.908578872680664, "global_step": 452042, "epoch": 5446} {"train_loss": -27.0770206451416, "global_step": 452043, "epoch": 5446} {"train_loss": -27.148584365844727, "global_step": 452044, "epoch": 5446} {"train_loss": -27.14276695251465, "global_step": 452045, "epoch": 5446} {"train_loss": -26.773365020751953, "global_step": 452046, "epoch": 5446} {"train_loss": -27.012842178344727, "global_step": 452047, "epoch": 5446} {"train_loss": -27.084720611572266, "global_step": 452048, "epoch": 5446} {"train_loss": -27.501270294189453, "global_step": 452049, "epoch": 5446} {"train_loss": -26.832273483276367, "global_step": 452050, "epoch": 5446} {"train_loss": -26.513870239257812, "global_step": 452051, "epoch": 5446} {"train_loss": -26.83349609375, "global_step": 452052, "epoch": 5446} {"train_loss": -27.24969482421875, "global_step": 452053, "epoch": 5446} {"train_loss": -27.053091049194336, "global_step": 452054, "epoch": 5446} {"train_loss": -26.8504581451416, "global_step": 452055, "epoch": 5446} {"train_loss": -26.690771102905273, "global_step": 452056, "epoch": 5446} {"train_loss": -27.472320556640625, "global_step": 452057, "epoch": 5446} {"train_loss": -26.916980743408203, "global_step": 452058, "epoch": 5446} {"train_loss": -26.87371826171875, "global_step": 452059, "epoch": 5446} {"train_loss": -27.066675186157227, "global_step": 452060, "epoch": 5446} {"train_loss": -26.948423385620117, "global_step": 452061, "epoch": 5446} {"train_loss": -27.174304962158203, "global_step": 452062, "epoch": 5446} {"train_loss": -27.263341903686523, "global_step": 452063, "epoch": 5446} {"train_loss": -27.438032150268555, "global_step": 452064, "epoch": 5446} {"train_loss": -26.790924072265625, "global_step": 452065, "epoch": 5446} {"train_loss": -27.112049102783203, "global_step": 452066, "epoch": 5446} {"train_loss": -26.8248233795166, "global_step": 452067, "epoch": 5446} {"train_loss": -26.926130294799805, "global_step": 452068, "epoch": 5446} {"train_loss": -26.920063018798828, "global_step": 452069, "epoch": 5446} {"train_loss": -27.005945205688477, "global_step": 452070, "epoch": 5446} {"train_loss": -27.138427734375, "global_step": 452071, "epoch": 5446} {"train_loss": -26.913848876953125, "global_step": 452072, "epoch": 5446} {"train_loss": -27.01752281188965, "global_step": 452073, "epoch": 5446} {"train_loss": -26.8316650390625, "global_step": 452074, "epoch": 5446} {"train_loss": -26.898160934448242, "global_step": 452075, "epoch": 5446} {"train_loss": -27.165613174438477, "global_step": 452076, "epoch": 5446} {"train_loss": -26.969852447509766, "global_step": 452077, "epoch": 5446} {"train_loss": -27.250335693359375, "global_step": 452078, "epoch": 5446} {"train_loss": -26.94577980041504, "global_step": 452079, "epoch": 5446} {"train_loss": -26.803028106689453, "global_step": 452080, "epoch": 5446} {"train_loss": -26.96663475036621, "global_step": 452081, "epoch": 5446} {"train_loss": -26.969388961791992, "global_step": 452082, "epoch": 5446} {"train_loss": -27.278024673461914, "global_step": 452083, "epoch": 5446} {"train_loss": -26.829212188720703, "global_step": 452084, "epoch": 5446} {"train_loss": -26.60161781311035, "global_step": 452085, "epoch": 5446} {"train_loss": -27.077392578125, "global_step": 452086, "epoch": 5446} {"train_loss": -26.9411678314209, "global_step": 452087, "epoch": 5446} {"train_loss": -27.021894454956055, "global_step": 452088, "epoch": 5446} {"train_loss": -26.89277458190918, "global_step": 452089, "epoch": 5446} {"train_loss": -27.67399024963379, "global_step": 452090, "epoch": 5446} {"train_loss": -27.132251739501953, "global_step": 452091, "epoch": 5446} {"train_loss": -26.999975204467773, "global_step": 452092, "epoch": 5446} {"train_loss": -26.895002365112305, "global_step": 452093, "epoch": 5446} {"train_loss": -26.957626342773438, "global_step": 452094, "epoch": 5446} {"train_loss": -27.126611709594727, "global_step": 452095, "epoch": 5446} {"train_loss": -26.942472457885742, "global_step": 452096, "epoch": 5446} {"train_loss": -27.03664207458496, "global_step": 452097, "epoch": 5446} {"train_loss": -27.012426376342773, "global_step": 452098, "epoch": 5446} {"train_loss": -27.219562530517578, "global_step": 452099, "epoch": 5446} {"train_loss": -26.92601948473827, "global_step": 452100, "epoch": 5446, "val_loss": 6509348.0} {"train_loss": -26.392087936401367, "global_step": 452101, "epoch": 5447} {"train_loss": -26.669382095336914, "global_step": 452102, "epoch": 5447} {"train_loss": -26.834741592407227, "global_step": 452103, "epoch": 5447} {"train_loss": -26.389387130737305, "global_step": 452104, "epoch": 5447} {"train_loss": -26.63209342956543, "global_step": 452105, "epoch": 5447} {"train_loss": -26.8361759185791, "global_step": 452106, "epoch": 5447} {"train_loss": -26.68690299987793, "global_step": 452107, "epoch": 5447} {"train_loss": -26.808393478393555, "global_step": 452108, "epoch": 5447} {"train_loss": -26.864126205444336, "global_step": 452109, "epoch": 5447} {"train_loss": -26.94580078125, "global_step": 452110, "epoch": 5447} {"train_loss": -26.717029571533203, "global_step": 452111, "epoch": 5447} {"train_loss": -26.933507919311523, "global_step": 452112, "epoch": 5447} {"train_loss": -26.861066818237305, "global_step": 452113, "epoch": 5447} {"train_loss": -26.601362228393555, "global_step": 452114, "epoch": 5447} {"train_loss": -27.040924072265625, "global_step": 452115, "epoch": 5447} {"train_loss": -26.84994888305664, "global_step": 452116, "epoch": 5447} {"train_loss": -26.778717041015625, "global_step": 452117, "epoch": 5447} {"train_loss": -27.323862075805664, "global_step": 452118, "epoch": 5447} {"train_loss": -26.7083740234375, "global_step": 452119, "epoch": 5447} {"train_loss": -26.725488662719727, "global_step": 452120, "epoch": 5447} {"train_loss": -26.953771591186523, "global_step": 452121, "epoch": 5447} {"train_loss": -26.837024688720703, "global_step": 452122, "epoch": 5447} {"train_loss": -27.335187911987305, "global_step": 452123, "epoch": 5447} {"train_loss": -26.629810333251953, "global_step": 452124, "epoch": 5447} {"train_loss": -26.67313003540039, "global_step": 452125, "epoch": 5447} {"train_loss": -27.2059268951416, "global_step": 452126, "epoch": 5447} {"train_loss": -26.95315933227539, "global_step": 452127, "epoch": 5447} {"train_loss": -26.885242462158203, "global_step": 452128, "epoch": 5447} {"train_loss": -26.78755760192871, "global_step": 452129, "epoch": 5447} {"train_loss": -26.821069717407227, "global_step": 452130, "epoch": 5447} {"train_loss": -26.983768463134766, "global_step": 452131, "epoch": 5447} {"train_loss": -26.38551139831543, "global_step": 452132, "epoch": 5447} {"train_loss": -26.741220474243164, "global_step": 452133, "epoch": 5447} {"train_loss": -26.872114181518555, "global_step": 452134, "epoch": 5447} {"train_loss": -26.85184669494629, "global_step": 452135, "epoch": 5447} {"train_loss": -26.719934463500977, "global_step": 452136, "epoch": 5447} {"train_loss": -26.851469039916992, "global_step": 452137, "epoch": 5447} {"train_loss": -26.92292594909668, "global_step": 452138, "epoch": 5447} {"train_loss": -27.154890060424805, "global_step": 452139, "epoch": 5447} {"train_loss": -27.13691520690918, "global_step": 452140, "epoch": 5447} {"train_loss": -26.994766235351562, "global_step": 452141, "epoch": 5447} {"train_loss": -26.873563766479492, "global_step": 452142, "epoch": 5447} {"train_loss": -27.401355743408203, "global_step": 452143, "epoch": 5447} {"train_loss": -26.763595581054688, "global_step": 452144, "epoch": 5447} {"train_loss": -26.9652156829834, "global_step": 452145, "epoch": 5447} {"train_loss": -27.040557861328125, "global_step": 452146, "epoch": 5447} {"train_loss": -27.241857528686523, "global_step": 452147, "epoch": 5447} {"train_loss": -26.985034942626953, "global_step": 452148, "epoch": 5447} {"train_loss": -26.988788604736328, "global_step": 452149, "epoch": 5447} {"train_loss": -27.257413864135742, "global_step": 452150, "epoch": 5447} {"train_loss": -27.403533935546875, "global_step": 452151, "epoch": 5447} {"train_loss": -27.15655517578125, "global_step": 452152, "epoch": 5447} {"train_loss": -27.526447296142578, "global_step": 452153, "epoch": 5447} {"train_loss": -27.30340003967285, "global_step": 452154, "epoch": 5447} {"train_loss": -27.061054229736328, "global_step": 452155, "epoch": 5447} {"train_loss": -27.180265426635742, "global_step": 452156, "epoch": 5447} {"train_loss": -26.88239097595215, "global_step": 452157, "epoch": 5447} {"train_loss": -27.118452072143555, "global_step": 452158, "epoch": 5447} {"train_loss": -27.30640983581543, "global_step": 452159, "epoch": 5447} {"train_loss": -27.149274826049805, "global_step": 452160, "epoch": 5447} {"train_loss": -27.001794815063477, "global_step": 452161, "epoch": 5447} {"train_loss": -27.298131942749023, "global_step": 452162, "epoch": 5447} {"train_loss": -27.116430282592773, "global_step": 452163, "epoch": 5447} {"train_loss": -27.20806884765625, "global_step": 452164, "epoch": 5447} {"train_loss": -27.362030029296875, "global_step": 452165, "epoch": 5447} {"train_loss": -27.189193725585938, "global_step": 452166, "epoch": 5447} {"train_loss": -27.159351348876953, "global_step": 452167, "epoch": 5447} {"train_loss": -26.895063400268555, "global_step": 452168, "epoch": 5447} {"train_loss": -26.928314208984375, "global_step": 452169, "epoch": 5447} {"train_loss": -26.922595977783203, "global_step": 452170, "epoch": 5447} {"train_loss": -26.872690200805664, "global_step": 452171, "epoch": 5447} {"train_loss": -26.819822311401367, "global_step": 452172, "epoch": 5447} {"train_loss": -27.0517578125, "global_step": 452173, "epoch": 5447} {"train_loss": -27.057342529296875, "global_step": 452174, "epoch": 5447} {"train_loss": -27.278656005859375, "global_step": 452175, "epoch": 5447} {"train_loss": -26.416040420532227, "global_step": 452176, "epoch": 5447} {"train_loss": -26.42657470703125, "global_step": 452177, "epoch": 5447} {"train_loss": -26.3237247467041, "global_step": 452178, "epoch": 5447} {"train_loss": -26.882551193237305, "global_step": 452179, "epoch": 5447} {"train_loss": -26.581586837768555, "global_step": 452180, "epoch": 5447} {"train_loss": -27.229684829711914, "global_step": 452181, "epoch": 5447} {"train_loss": -26.89080810546875, "global_step": 452182, "epoch": 5447} {"train_loss": -26.94157451032156, "global_step": 452183, "epoch": 5447, "val_loss": 6485893.0} {"train_loss": -26.57568359375, "global_step": 452184, "epoch": 5448} {"train_loss": -26.63228416442871, "global_step": 452185, "epoch": 5448} {"train_loss": -25.756635665893555, "global_step": 452186, "epoch": 5448} {"train_loss": -26.493886947631836, "global_step": 452187, "epoch": 5448} {"train_loss": -26.802753448486328, "global_step": 452188, "epoch": 5448} {"train_loss": -26.479969024658203, "global_step": 452189, "epoch": 5448} {"train_loss": -26.590864181518555, "global_step": 452190, "epoch": 5448} {"train_loss": -27.04281997680664, "global_step": 452191, "epoch": 5448} {"train_loss": -26.511499404907227, "global_step": 452192, "epoch": 5448} {"train_loss": -26.776803970336914, "global_step": 452193, "epoch": 5448} {"train_loss": -26.235675811767578, "global_step": 452194, "epoch": 5448} {"train_loss": -26.649185180664062, "global_step": 452195, "epoch": 5448} {"train_loss": -26.70216178894043, "global_step": 452196, "epoch": 5448} {"train_loss": -26.663000106811523, "global_step": 452197, "epoch": 5448} {"train_loss": -27.157217025756836, "global_step": 452198, "epoch": 5448} {"train_loss": -26.71375846862793, "global_step": 452199, "epoch": 5448} {"train_loss": -27.089313507080078, "global_step": 452200, "epoch": 5448} {"train_loss": -26.850488662719727, "global_step": 452201, "epoch": 5448} {"train_loss": -27.05925941467285, "global_step": 452202, "epoch": 5448} {"train_loss": -26.9243106842041, "global_step": 452203, "epoch": 5448} {"train_loss": -27.26384925842285, "global_step": 452204, "epoch": 5448} {"train_loss": -27.016836166381836, "global_step": 452205, "epoch": 5448} {"train_loss": -26.97855567932129, "global_step": 452206, "epoch": 5448} {"train_loss": -26.631376266479492, "global_step": 452207, "epoch": 5448} {"train_loss": -27.432104110717773, "global_step": 452208, "epoch": 5448} {"train_loss": -27.016651153564453, "global_step": 452209, "epoch": 5448} {"train_loss": -26.79840660095215, "global_step": 452210, "epoch": 5448} {"train_loss": -27.15216636657715, "global_step": 452211, "epoch": 5448} {"train_loss": -27.01836585998535, "global_step": 452212, "epoch": 5448} {"train_loss": -27.13667106628418, "global_step": 452213, "epoch": 5448} {"train_loss": -27.236663818359375, "global_step": 452214, "epoch": 5448} {"train_loss": -27.003814697265625, "global_step": 452215, "epoch": 5448} {"train_loss": -27.2748966217041, "global_step": 452216, "epoch": 5448} {"train_loss": -27.134485244750977, "global_step": 452217, "epoch": 5448} {"train_loss": -27.029541015625, "global_step": 452218, "epoch": 5448} {"train_loss": -27.022375106811523, "global_step": 452219, "epoch": 5448} {"train_loss": -27.443225860595703, "global_step": 452220, "epoch": 5448} {"train_loss": -26.9698486328125, "global_step": 452221, "epoch": 5448} {"train_loss": -27.198041915893555, "global_step": 452222, "epoch": 5448} {"train_loss": -26.996850967407227, "global_step": 452223, "epoch": 5448} {"train_loss": -26.84393310546875, "global_step": 452224, "epoch": 5448} {"train_loss": -27.029926300048828, "global_step": 452225, "epoch": 5448} {"train_loss": -27.283727645874023, "global_step": 452226, "epoch": 5448} {"train_loss": -27.381128311157227, "global_step": 452227, "epoch": 5448} {"train_loss": -27.395959854125977, "global_step": 452228, "epoch": 5448} {"train_loss": -27.20574378967285, "global_step": 452229, "epoch": 5448} {"train_loss": -27.330533981323242, "global_step": 452230, "epoch": 5448} {"train_loss": -26.94771385192871, "global_step": 452231, "epoch": 5448} {"train_loss": -26.99281120300293, "global_step": 452232, "epoch": 5448} {"train_loss": -27.13783073425293, "global_step": 452233, "epoch": 5448} {"train_loss": -27.21644401550293, "global_step": 452234, "epoch": 5448} {"train_loss": -26.961231231689453, "global_step": 452235, "epoch": 5448} {"train_loss": -27.256757736206055, "global_step": 452236, "epoch": 5448} {"train_loss": -27.1928653717041, "global_step": 452237, "epoch": 5448} {"train_loss": -27.356525421142578, "global_step": 452238, "epoch": 5448} {"train_loss": -27.41464614868164, "global_step": 452239, "epoch": 5448} {"train_loss": -27.1023006439209, "global_step": 452240, "epoch": 5448} {"train_loss": -26.84994888305664, "global_step": 452241, "epoch": 5448} {"train_loss": -26.958463668823242, "global_step": 452242, "epoch": 5448} {"train_loss": -26.56257438659668, "global_step": 452243, "epoch": 5448} {"train_loss": -25.90608024597168, "global_step": 452244, "epoch": 5448} {"train_loss": -26.801990509033203, "global_step": 452245, "epoch": 5448} {"train_loss": -26.97855567932129, "global_step": 452246, "epoch": 5448} {"train_loss": -26.789371490478516, "global_step": 452247, "epoch": 5448} {"train_loss": -26.617895126342773, "global_step": 452248, "epoch": 5448} {"train_loss": -26.765268325805664, "global_step": 452249, "epoch": 5448} {"train_loss": -26.83489418029785, "global_step": 452250, "epoch": 5448} {"train_loss": -26.50188636779785, "global_step": 452251, "epoch": 5448} {"train_loss": -26.832014083862305, "global_step": 452252, "epoch": 5448} {"train_loss": -26.644672393798828, "global_step": 452253, "epoch": 5448} {"train_loss": -26.783849716186523, "global_step": 452254, "epoch": 5448} {"train_loss": -26.780303955078125, "global_step": 452255, "epoch": 5448} {"train_loss": -26.894454956054688, "global_step": 452256, "epoch": 5448} {"train_loss": -27.089475631713867, "global_step": 452257, "epoch": 5448} {"train_loss": -26.540882110595703, "global_step": 452258, "epoch": 5448} {"train_loss": -27.09915542602539, "global_step": 452259, "epoch": 5448} {"train_loss": -26.840787887573242, "global_step": 452260, "epoch": 5448} {"train_loss": -27.010364532470703, "global_step": 452261, "epoch": 5448} {"train_loss": -26.588748931884766, "global_step": 452262, "epoch": 5448} {"train_loss": -27.066946029663086, "global_step": 452263, "epoch": 5448} {"train_loss": -26.988309860229492, "global_step": 452264, "epoch": 5448} {"train_loss": -26.82728385925293, "global_step": 452265, "epoch": 5448} {"train_loss": -26.93967612392931, "global_step": 452266, "epoch": 5448, "val_loss": 6467321.0} {"train_loss": -26.210668563842773, "global_step": 452267, "epoch": 5449} {"train_loss": -26.700077056884766, "global_step": 452268, "epoch": 5449} {"train_loss": -26.39533805847168, "global_step": 452269, "epoch": 5449} {"train_loss": -26.472370147705078, "global_step": 452270, "epoch": 5449} {"train_loss": -26.70576286315918, "global_step": 452271, "epoch": 5449} {"train_loss": -26.71319580078125, "global_step": 452272, "epoch": 5449} {"train_loss": -26.576208114624023, "global_step": 452273, "epoch": 5449} {"train_loss": -26.578672409057617, "global_step": 452274, "epoch": 5449} {"train_loss": -26.86174964904785, "global_step": 452275, "epoch": 5449} {"train_loss": -26.667245864868164, "global_step": 452276, "epoch": 5449} {"train_loss": -26.559900283813477, "global_step": 452277, "epoch": 5449} {"train_loss": -26.715625762939453, "global_step": 452278, "epoch": 5449} {"train_loss": -27.035058975219727, "global_step": 452279, "epoch": 5449} {"train_loss": -27.029111862182617, "global_step": 452280, "epoch": 5449} {"train_loss": -26.726648330688477, "global_step": 452281, "epoch": 5449} {"train_loss": -26.852258682250977, "global_step": 452282, "epoch": 5449} {"train_loss": -26.930906295776367, "global_step": 452283, "epoch": 5449} {"train_loss": -26.679346084594727, "global_step": 452284, "epoch": 5449} {"train_loss": -26.839771270751953, "global_step": 452285, "epoch": 5449} {"train_loss": -27.033924102783203, "global_step": 452286, "epoch": 5449} {"train_loss": -27.0593318939209, "global_step": 452287, "epoch": 5449} {"train_loss": -27.042346954345703, "global_step": 452288, "epoch": 5449} {"train_loss": -26.81157875061035, "global_step": 452289, "epoch": 5449} {"train_loss": -26.7861385345459, "global_step": 452290, "epoch": 5449} {"train_loss": -26.869802474975586, "global_step": 452291, "epoch": 5449} {"train_loss": -26.749902725219727, "global_step": 452292, "epoch": 5449} {"train_loss": -27.010150909423828, "global_step": 452293, "epoch": 5449} {"train_loss": -26.81837272644043, "global_step": 452294, "epoch": 5449} {"train_loss": -26.744464874267578, "global_step": 452295, "epoch": 5449} {"train_loss": -26.98396873474121, "global_step": 452296, "epoch": 5449} {"train_loss": -26.829336166381836, "global_step": 452297, "epoch": 5449} {"train_loss": -27.067609786987305, "global_step": 452298, "epoch": 5449} {"train_loss": -27.22273063659668, "global_step": 452299, "epoch": 5449} {"train_loss": -26.817052841186523, "global_step": 452300, "epoch": 5449} {"train_loss": -26.811206817626953, "global_step": 452301, "epoch": 5449} {"train_loss": -27.123245239257812, "global_step": 452302, "epoch": 5449} {"train_loss": -26.9111270904541, "global_step": 452303, "epoch": 5449} {"train_loss": -26.685577392578125, "global_step": 452304, "epoch": 5449} {"train_loss": -26.73798942565918, "global_step": 452305, "epoch": 5449} {"train_loss": -26.848485946655273, "global_step": 452306, "epoch": 5449} {"train_loss": -26.89226722717285, "global_step": 452307, "epoch": 5449} {"train_loss": -26.84299659729004, "global_step": 452308, "epoch": 5449} {"train_loss": -27.148237228393555, "global_step": 452309, "epoch": 5449} {"train_loss": -27.54543113708496, "global_step": 452310, "epoch": 5449} {"train_loss": -26.666044235229492, "global_step": 452311, "epoch": 5449} {"train_loss": -27.158918380737305, "global_step": 452312, "epoch": 5449} {"train_loss": -26.788257598876953, "global_step": 452313, "epoch": 5449} {"train_loss": -27.147062301635742, "global_step": 452314, "epoch": 5449} {"train_loss": -27.16094398498535, "global_step": 452315, "epoch": 5449} {"train_loss": -27.11492347717285, "global_step": 452316, "epoch": 5449} {"train_loss": -26.84284019470215, "global_step": 452317, "epoch": 5449} {"train_loss": -27.11493492126465, "global_step": 452318, "epoch": 5449} {"train_loss": -27.201345443725586, "global_step": 452319, "epoch": 5449} {"train_loss": -27.050580978393555, "global_step": 452320, "epoch": 5449} {"train_loss": -26.899539947509766, "global_step": 452321, "epoch": 5449} {"train_loss": -27.0476131439209, "global_step": 452322, "epoch": 5449} {"train_loss": -27.430280685424805, "global_step": 452323, "epoch": 5449} {"train_loss": -27.38274574279785, "global_step": 452324, "epoch": 5449} {"train_loss": -27.513534545898438, "global_step": 452325, "epoch": 5449} {"train_loss": -27.4929256439209, "global_step": 452326, "epoch": 5449} {"train_loss": -27.039295196533203, "global_step": 452327, "epoch": 5449} {"train_loss": -27.2617130279541, "global_step": 452328, "epoch": 5449} {"train_loss": -26.665002822875977, "global_step": 452329, "epoch": 5449} {"train_loss": -26.9818058013916, "global_step": 452330, "epoch": 5449} {"train_loss": -26.931821823120117, "global_step": 452331, "epoch": 5449} {"train_loss": -27.36345863342285, "global_step": 452332, "epoch": 5449} {"train_loss": -27.16744041442871, "global_step": 452333, "epoch": 5449} {"train_loss": -27.18928337097168, "global_step": 452334, "epoch": 5449} {"train_loss": -27.200641632080078, "global_step": 452335, "epoch": 5449} {"train_loss": -27.49128532409668, "global_step": 452336, "epoch": 5449} {"train_loss": -27.561431884765625, "global_step": 452337, "epoch": 5449} {"train_loss": -27.237354278564453, "global_step": 452338, "epoch": 5449} {"train_loss": -27.634765625, "global_step": 452339, "epoch": 5449} {"train_loss": -26.975940704345703, "global_step": 452340, "epoch": 5449} {"train_loss": -27.046239852905273, "global_step": 452341, "epoch": 5449} {"train_loss": -27.025449752807617, "global_step": 452342, "epoch": 5449} {"train_loss": -27.53912353515625, "global_step": 452343, "epoch": 5449} {"train_loss": -27.33749771118164, "global_step": 452344, "epoch": 5449} {"train_loss": -27.46957778930664, "global_step": 452345, "epoch": 5449} {"train_loss": -27.53055763244629, "global_step": 452346, "epoch": 5449} {"train_loss": -26.99383544921875, "global_step": 452347, "epoch": 5449} {"train_loss": -27.147924423217773, "global_step": 452348, "epoch": 5449} {"train_loss": -26.993352568293194, "global_step": 452349, "epoch": 5449, "val_loss": 6615271.5} {"train_loss": -26.93170166015625, "global_step": 452350, "epoch": 5450} {"train_loss": -26.150558471679688, "global_step": 452351, "epoch": 5450} {"train_loss": -26.009057998657227, "global_step": 452352, "epoch": 5450} {"train_loss": -25.74517822265625, "global_step": 452353, "epoch": 5450} {"train_loss": -25.88227653503418, "global_step": 452354, "epoch": 5450} {"train_loss": -26.437036514282227, "global_step": 452355, "epoch": 5450} {"train_loss": -26.44459342956543, "global_step": 452356, "epoch": 5450} {"train_loss": -26.51995277404785, "global_step": 452357, "epoch": 5450} {"train_loss": -26.02947998046875, "global_step": 452358, "epoch": 5450} {"train_loss": -25.218460083007812, "global_step": 452359, "epoch": 5450} {"train_loss": -26.389490127563477, "global_step": 452360, "epoch": 5450} {"train_loss": -26.517621994018555, "global_step": 452361, "epoch": 5450} {"train_loss": -26.226139068603516, "global_step": 452362, "epoch": 5450} {"train_loss": -26.60489273071289, "global_step": 452363, "epoch": 5450} {"train_loss": -26.648910522460938, "global_step": 452364, "epoch": 5450} {"train_loss": -26.20051383972168, "global_step": 452365, "epoch": 5450} {"train_loss": -26.8192081451416, "global_step": 452366, "epoch": 5450} {"train_loss": -26.47199058532715, "global_step": 452367, "epoch": 5450} {"train_loss": -26.18659019470215, "global_step": 452368, "epoch": 5450} {"train_loss": -26.601215362548828, "global_step": 452369, "epoch": 5450} {"train_loss": -26.413328170776367, "global_step": 452370, "epoch": 5450} {"train_loss": -26.570005416870117, "global_step": 452371, "epoch": 5450} {"train_loss": -27.14396095275879, "global_step": 452372, "epoch": 5450} {"train_loss": -26.644519805908203, "global_step": 452373, "epoch": 5450} {"train_loss": -26.7863712310791, "global_step": 452374, "epoch": 5450} {"train_loss": -26.941450119018555, "global_step": 452375, "epoch": 5450} {"train_loss": -26.660043716430664, "global_step": 452376, "epoch": 5450} {"train_loss": -26.835784912109375, "global_step": 452377, "epoch": 5450} {"train_loss": -26.7149600982666, "global_step": 452378, "epoch": 5450} {"train_loss": -26.6353816986084, "global_step": 452379, "epoch": 5450} {"train_loss": -26.734750747680664, "global_step": 452380, "epoch": 5450} {"train_loss": -27.223102569580078, "global_step": 452381, "epoch": 5450} {"train_loss": -27.187030792236328, "global_step": 452382, "epoch": 5450} {"train_loss": -26.932825088500977, "global_step": 452383, "epoch": 5450} {"train_loss": -26.727872848510742, "global_step": 452384, "epoch": 5450} {"train_loss": -26.907867431640625, "global_step": 452385, "epoch": 5450} {"train_loss": -27.303485870361328, "global_step": 452386, "epoch": 5450} {"train_loss": -27.134002685546875, "global_step": 452387, "epoch": 5450} {"train_loss": -27.114765167236328, "global_step": 452388, "epoch": 5450} {"train_loss": -27.04644203186035, "global_step": 452389, "epoch": 5450} {"train_loss": -27.211181640625, "global_step": 452390, "epoch": 5450} {"train_loss": -26.990158081054688, "global_step": 452391, "epoch": 5450} {"train_loss": -27.245258331298828, "global_step": 452392, "epoch": 5450} {"train_loss": -27.08497428894043, "global_step": 452393, "epoch": 5450} {"train_loss": -27.391815185546875, "global_step": 452394, "epoch": 5450} {"train_loss": -27.528348922729492, "global_step": 452395, "epoch": 5450} {"train_loss": -26.929746627807617, "global_step": 452396, "epoch": 5450} {"train_loss": -26.908361434936523, "global_step": 452397, "epoch": 5450} {"train_loss": -27.271137237548828, "global_step": 452398, "epoch": 5450} {"train_loss": -27.17475700378418, "global_step": 452399, "epoch": 5450} {"train_loss": -27.21333885192871, "global_step": 452400, "epoch": 5450} {"train_loss": -27.408069610595703, "global_step": 452401, "epoch": 5450} {"train_loss": -27.595630645751953, "global_step": 452402, "epoch": 5450} {"train_loss": -27.460031509399414, "global_step": 452403, "epoch": 5450} {"train_loss": -27.178226470947266, "global_step": 452404, "epoch": 5450} {"train_loss": -27.109045028686523, "global_step": 452405, "epoch": 5450} {"train_loss": -27.53472328186035, "global_step": 452406, "epoch": 5450} {"train_loss": -27.218530654907227, "global_step": 452407, "epoch": 5450} {"train_loss": -27.516803741455078, "global_step": 452408, "epoch": 5450} {"train_loss": -27.07075309753418, "global_step": 452409, "epoch": 5450} {"train_loss": -27.302814483642578, "global_step": 452410, "epoch": 5450} {"train_loss": -27.394575119018555, "global_step": 452411, "epoch": 5450} {"train_loss": -27.2705020904541, "global_step": 452412, "epoch": 5450} {"train_loss": -27.511220932006836, "global_step": 452413, "epoch": 5450} {"train_loss": -27.017505645751953, "global_step": 452414, "epoch": 5450} {"train_loss": -26.9539852142334, "global_step": 452415, "epoch": 5450} {"train_loss": -26.520055770874023, "global_step": 452416, "epoch": 5450} {"train_loss": -26.730295181274414, "global_step": 452417, "epoch": 5450} {"train_loss": -27.2384033203125, "global_step": 452418, "epoch": 5450} {"train_loss": -27.06538200378418, "global_step": 452419, "epoch": 5450} {"train_loss": -26.92978286743164, "global_step": 452420, "epoch": 5450} {"train_loss": -26.670032501220703, "global_step": 452421, "epoch": 5450} {"train_loss": -26.371137619018555, "global_step": 452422, "epoch": 5450} {"train_loss": -26.84766960144043, "global_step": 452423, "epoch": 5450} {"train_loss": -27.194604873657227, "global_step": 452424, "epoch": 5450} {"train_loss": -26.791635513305664, "global_step": 452425, "epoch": 5450} {"train_loss": -26.461584091186523, "global_step": 452426, "epoch": 5450} {"train_loss": -27.012195587158203, "global_step": 452427, "epoch": 5450} {"train_loss": -26.938552856445312, "global_step": 452428, "epoch": 5450} {"train_loss": -26.72613525390625, "global_step": 452429, "epoch": 5450} {"train_loss": -26.86173439025879, "global_step": 452430, "epoch": 5450} {"train_loss": -26.654224395751953, "global_step": 452431, "epoch": 5450} {"train_loss": -26.835547987237035, "global_step": 452432, "epoch": 5450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6575441.5} {"train_loss": -25.816757202148438, "global_step": 452433, "epoch": 5451} {"train_loss": -25.111061096191406, "global_step": 452434, "epoch": 5451} {"train_loss": -26.170795440673828, "global_step": 452435, "epoch": 5451} {"train_loss": -25.813007354736328, "global_step": 452436, "epoch": 5451} {"train_loss": -26.215103149414062, "global_step": 452437, "epoch": 5451} {"train_loss": -25.60317039489746, "global_step": 452438, "epoch": 5451} {"train_loss": -25.83765983581543, "global_step": 452439, "epoch": 5451} {"train_loss": -26.3984317779541, "global_step": 452440, "epoch": 5451} {"train_loss": -25.63882827758789, "global_step": 452441, "epoch": 5451} {"train_loss": -26.095884323120117, "global_step": 452442, "epoch": 5451} {"train_loss": -26.16373062133789, "global_step": 452443, "epoch": 5451} {"train_loss": -26.19841957092285, "global_step": 452444, "epoch": 5451} {"train_loss": -26.058063507080078, "global_step": 452445, "epoch": 5451} {"train_loss": -25.889013290405273, "global_step": 452446, "epoch": 5451} {"train_loss": -26.433063507080078, "global_step": 452447, "epoch": 5451} {"train_loss": -25.95633316040039, "global_step": 452448, "epoch": 5451} {"train_loss": -26.246185302734375, "global_step": 452449, "epoch": 5451} {"train_loss": -26.30152702331543, "global_step": 452450, "epoch": 5451} {"train_loss": -26.275686264038086, "global_step": 452451, "epoch": 5451} {"train_loss": -26.337594985961914, "global_step": 452452, "epoch": 5451} {"train_loss": -26.459354400634766, "global_step": 452453, "epoch": 5451} {"train_loss": -26.48298454284668, "global_step": 452454, "epoch": 5451} {"train_loss": -26.708337783813477, "global_step": 452455, "epoch": 5451} {"train_loss": -26.436002731323242, "global_step": 452456, "epoch": 5451} {"train_loss": -26.86359214782715, "global_step": 452457, "epoch": 5451} {"train_loss": -26.781208038330078, "global_step": 452458, "epoch": 5451} {"train_loss": -26.572540283203125, "global_step": 452459, "epoch": 5451} {"train_loss": -26.580060958862305, "global_step": 452460, "epoch": 5451} {"train_loss": -26.744348526000977, "global_step": 452461, "epoch": 5451} {"train_loss": -26.507659912109375, "global_step": 452462, "epoch": 5451} {"train_loss": -27.135114669799805, "global_step": 452463, "epoch": 5451} {"train_loss": -26.767505645751953, "global_step": 452464, "epoch": 5451} {"train_loss": -26.682592391967773, "global_step": 452465, "epoch": 5451} {"train_loss": -26.8875732421875, "global_step": 452466, "epoch": 5451} {"train_loss": -26.85235023498535, "global_step": 452467, "epoch": 5451} {"train_loss": -26.798675537109375, "global_step": 452468, "epoch": 5451} {"train_loss": -27.118072509765625, "global_step": 452469, "epoch": 5451} {"train_loss": -26.833765029907227, "global_step": 452470, "epoch": 5451} {"train_loss": -26.940134048461914, "global_step": 452471, "epoch": 5451} {"train_loss": -26.858539581298828, "global_step": 452472, "epoch": 5451} {"train_loss": -27.0006160736084, "global_step": 452473, "epoch": 5451} {"train_loss": -26.90472984313965, "global_step": 452474, "epoch": 5451} {"train_loss": -27.198068618774414, "global_step": 452475, "epoch": 5451} {"train_loss": -27.479162216186523, "global_step": 452476, "epoch": 5451} {"train_loss": -27.247867584228516, "global_step": 452477, "epoch": 5451} {"train_loss": -27.046249389648438, "global_step": 452478, "epoch": 5451} {"train_loss": -27.003952026367188, "global_step": 452479, "epoch": 5451} {"train_loss": -27.028976440429688, "global_step": 452480, "epoch": 5451} {"train_loss": -27.263904571533203, "global_step": 452481, "epoch": 5451} {"train_loss": -27.044803619384766, "global_step": 452482, "epoch": 5451} {"train_loss": -27.138843536376953, "global_step": 452483, "epoch": 5451} {"train_loss": -27.257497787475586, "global_step": 452484, "epoch": 5451} {"train_loss": -27.509923934936523, "global_step": 452485, "epoch": 5451} {"train_loss": -27.269912719726562, "global_step": 452486, "epoch": 5451} {"train_loss": -27.18928337097168, "global_step": 452487, "epoch": 5451} {"train_loss": -27.133527755737305, "global_step": 452488, "epoch": 5451} {"train_loss": -26.86566734313965, "global_step": 452489, "epoch": 5451} {"train_loss": -27.498132705688477, "global_step": 452490, "epoch": 5451} {"train_loss": -27.112985610961914, "global_step": 452491, "epoch": 5451} {"train_loss": -26.90268898010254, "global_step": 452492, "epoch": 5451} {"train_loss": -27.135923385620117, "global_step": 452493, "epoch": 5451} {"train_loss": -27.0422306060791, "global_step": 452494, "epoch": 5451} {"train_loss": -27.289081573486328, "global_step": 452495, "epoch": 5451} {"train_loss": -27.237585067749023, "global_step": 452496, "epoch": 5451} {"train_loss": -26.984939575195312, "global_step": 452497, "epoch": 5451} {"train_loss": -27.23660659790039, "global_step": 452498, "epoch": 5451} {"train_loss": -27.31103515625, "global_step": 452499, "epoch": 5451} {"train_loss": -27.078351974487305, "global_step": 452500, "epoch": 5451} {"train_loss": -26.96430778503418, "global_step": 452501, "epoch": 5451} {"train_loss": -26.756799697875977, "global_step": 452502, "epoch": 5451} {"train_loss": -26.786725997924805, "global_step": 452503, "epoch": 5451} {"train_loss": -27.22279167175293, "global_step": 452504, "epoch": 5451} {"train_loss": -27.176679611206055, "global_step": 452505, "epoch": 5451} {"train_loss": -26.858306884765625, "global_step": 452506, "epoch": 5451} {"train_loss": -26.787988662719727, "global_step": 452507, "epoch": 5451} {"train_loss": -27.2364444732666, "global_step": 452508, "epoch": 5451} {"train_loss": -27.189950942993164, "global_step": 452509, "epoch": 5451} {"train_loss": -26.878376007080078, "global_step": 452510, "epoch": 5451} {"train_loss": -26.580413818359375, "global_step": 452511, "epoch": 5451} {"train_loss": -26.963720321655273, "global_step": 452512, "epoch": 5451} {"train_loss": -27.305646896362305, "global_step": 452513, "epoch": 5451} {"train_loss": -27.057153701782227, "global_step": 452514, "epoch": 5451} {"train_loss": -26.753017402557006, "global_step": 452515, "epoch": 5451, "val_loss": 6568298.0} {"train_loss": -26.446287155151367, "global_step": 452516, "epoch": 5452} {"train_loss": -26.48348045349121, "global_step": 452517, "epoch": 5452} {"train_loss": -26.534414291381836, "global_step": 452518, "epoch": 5452} {"train_loss": -26.751846313476562, "global_step": 452519, "epoch": 5452} {"train_loss": -26.372318267822266, "global_step": 452520, "epoch": 5452} {"train_loss": -27.12646484375, "global_step": 452521, "epoch": 5452} {"train_loss": -26.311481475830078, "global_step": 452522, "epoch": 5452} {"train_loss": -26.702747344970703, "global_step": 452523, "epoch": 5452} {"train_loss": -27.01812171936035, "global_step": 452524, "epoch": 5452} {"train_loss": -26.957305908203125, "global_step": 452525, "epoch": 5452} {"train_loss": -26.920684814453125, "global_step": 452526, "epoch": 5452} {"train_loss": -26.52350425720215, "global_step": 452527, "epoch": 5452} {"train_loss": -27.027557373046875, "global_step": 452528, "epoch": 5452} {"train_loss": -27.1792049407959, "global_step": 452529, "epoch": 5452} {"train_loss": -27.103933334350586, "global_step": 452530, "epoch": 5452} {"train_loss": -26.95903968811035, "global_step": 452531, "epoch": 5452} {"train_loss": -26.97574806213379, "global_step": 452532, "epoch": 5452} {"train_loss": -27.204147338867188, "global_step": 452533, "epoch": 5452} {"train_loss": -27.21962547302246, "global_step": 452534, "epoch": 5452} {"train_loss": -27.34029197692871, "global_step": 452535, "epoch": 5452} {"train_loss": -26.7895450592041, "global_step": 452536, "epoch": 5452} {"train_loss": -27.066314697265625, "global_step": 452537, "epoch": 5452} {"train_loss": -27.128116607666016, "global_step": 452538, "epoch": 5452} {"train_loss": -27.202680587768555, "global_step": 452539, "epoch": 5452} {"train_loss": -26.925596237182617, "global_step": 452540, "epoch": 5452} {"train_loss": -27.042724609375, "global_step": 452541, "epoch": 5452} {"train_loss": -27.152362823486328, "global_step": 452542, "epoch": 5452} {"train_loss": -27.561996459960938, "global_step": 452543, "epoch": 5452} {"train_loss": -27.398889541625977, "global_step": 452544, "epoch": 5452} {"train_loss": -27.408863067626953, "global_step": 452545, "epoch": 5452} {"train_loss": -26.984281539916992, "global_step": 452546, "epoch": 5452} {"train_loss": -27.091596603393555, "global_step": 452547, "epoch": 5452} {"train_loss": -27.104917526245117, "global_step": 452548, "epoch": 5452} {"train_loss": -26.920907974243164, "global_step": 452549, "epoch": 5452} {"train_loss": -27.056406021118164, "global_step": 452550, "epoch": 5452} {"train_loss": -26.94085121154785, "global_step": 452551, "epoch": 5452} {"train_loss": -26.35201072692871, "global_step": 452552, "epoch": 5452} {"train_loss": -26.444395065307617, "global_step": 452553, "epoch": 5452} {"train_loss": -25.396089553833008, "global_step": 452554, "epoch": 5452} {"train_loss": -25.615942001342773, "global_step": 452555, "epoch": 5452} {"train_loss": -26.846012115478516, "global_step": 452556, "epoch": 5452} {"train_loss": -26.318729400634766, "global_step": 452557, "epoch": 5452} {"train_loss": -26.210752487182617, "global_step": 452558, "epoch": 5452} {"train_loss": -27.142169952392578, "global_step": 452559, "epoch": 5452} {"train_loss": -27.027328491210938, "global_step": 452560, "epoch": 5452} {"train_loss": -27.1377010345459, "global_step": 452561, "epoch": 5452} {"train_loss": -26.903278350830078, "global_step": 452562, "epoch": 5452} {"train_loss": -26.844518661499023, "global_step": 452563, "epoch": 5452} {"train_loss": -27.136138916015625, "global_step": 452564, "epoch": 5452} {"train_loss": -27.203908920288086, "global_step": 452565, "epoch": 5452} {"train_loss": -26.7291259765625, "global_step": 452566, "epoch": 5452} {"train_loss": -27.1219425201416, "global_step": 452567, "epoch": 5452} {"train_loss": -26.72870445251465, "global_step": 452568, "epoch": 5452} {"train_loss": -26.949798583984375, "global_step": 452569, "epoch": 5452} {"train_loss": -26.573883056640625, "global_step": 452570, "epoch": 5452} {"train_loss": -27.117822647094727, "global_step": 452571, "epoch": 5452} {"train_loss": -27.273832321166992, "global_step": 452572, "epoch": 5452} {"train_loss": -27.048831939697266, "global_step": 452573, "epoch": 5452} {"train_loss": -27.096887588500977, "global_step": 452574, "epoch": 5452} {"train_loss": -26.898386001586914, "global_step": 452575, "epoch": 5452} {"train_loss": -27.1430721282959, "global_step": 452576, "epoch": 5452} {"train_loss": -26.98858642578125, "global_step": 452577, "epoch": 5452} {"train_loss": -26.965784072875977, "global_step": 452578, "epoch": 5452} {"train_loss": -26.7286434173584, "global_step": 452579, "epoch": 5452} {"train_loss": -27.268951416015625, "global_step": 452580, "epoch": 5452} {"train_loss": -26.921619415283203, "global_step": 452581, "epoch": 5452} {"train_loss": -27.182287216186523, "global_step": 452582, "epoch": 5452} {"train_loss": -26.95252799987793, "global_step": 452583, "epoch": 5452} {"train_loss": -27.01824378967285, "global_step": 452584, "epoch": 5452} {"train_loss": -26.9847469329834, "global_step": 452585, "epoch": 5452} {"train_loss": -26.958515167236328, "global_step": 452586, "epoch": 5452} {"train_loss": -27.05475425720215, "global_step": 452587, "epoch": 5452} {"train_loss": -26.89729118347168, "global_step": 452588, "epoch": 5452} {"train_loss": -26.84344482421875, "global_step": 452589, "epoch": 5452} {"train_loss": -26.950281143188477, "global_step": 452590, "epoch": 5452} {"train_loss": -27.34967613220215, "global_step": 452591, "epoch": 5452} {"train_loss": -27.36724281311035, "global_step": 452592, "epoch": 5452} {"train_loss": -27.315515518188477, "global_step": 452593, "epoch": 5452} {"train_loss": -27.348896026611328, "global_step": 452594, "epoch": 5452} {"train_loss": -27.531604766845703, "global_step": 452595, "epoch": 5452} {"train_loss": -27.139245986938477, "global_step": 452596, "epoch": 5452} {"train_loss": -27.24920082092285, "global_step": 452597, "epoch": 5452} {"train_loss": -26.947049979703973, "global_step": 452598, "epoch": 5452, "val_loss": 6667229.0} {"train_loss": -26.563135147094727, "global_step": 452599, "epoch": 5453} {"train_loss": -26.732934951782227, "global_step": 452600, "epoch": 5453} {"train_loss": -26.48042869567871, "global_step": 452601, "epoch": 5453} {"train_loss": -26.26841163635254, "global_step": 452602, "epoch": 5453} {"train_loss": -26.31631851196289, "global_step": 452603, "epoch": 5453} {"train_loss": -26.63559341430664, "global_step": 452604, "epoch": 5453} {"train_loss": -26.119281768798828, "global_step": 452605, "epoch": 5453} {"train_loss": -27.019567489624023, "global_step": 452606, "epoch": 5453} {"train_loss": -27.120391845703125, "global_step": 452607, "epoch": 5453} {"train_loss": -26.61870765686035, "global_step": 452608, "epoch": 5453} {"train_loss": -26.99468994140625, "global_step": 452609, "epoch": 5453} {"train_loss": -26.519208908081055, "global_step": 452610, "epoch": 5453} {"train_loss": -26.6701602935791, "global_step": 452611, "epoch": 5453} {"train_loss": -26.74625015258789, "global_step": 452612, "epoch": 5453} {"train_loss": -26.77716636657715, "global_step": 452613, "epoch": 5453} {"train_loss": -26.591644287109375, "global_step": 452614, "epoch": 5453} {"train_loss": -27.11322593688965, "global_step": 452615, "epoch": 5453} {"train_loss": -26.9571533203125, "global_step": 452616, "epoch": 5453} {"train_loss": -26.79351234436035, "global_step": 452617, "epoch": 5453} {"train_loss": -26.975635528564453, "global_step": 452618, "epoch": 5453} {"train_loss": -26.830366134643555, "global_step": 452619, "epoch": 5453} {"train_loss": -26.888174057006836, "global_step": 452620, "epoch": 5453} {"train_loss": -27.48188591003418, "global_step": 452621, "epoch": 5453} {"train_loss": -26.775678634643555, "global_step": 452622, "epoch": 5453} {"train_loss": -27.299243927001953, "global_step": 452623, "epoch": 5453} {"train_loss": -27.140838623046875, "global_step": 452624, "epoch": 5453} {"train_loss": -26.9404354095459, "global_step": 452625, "epoch": 5453} {"train_loss": -27.263288497924805, "global_step": 452626, "epoch": 5453} {"train_loss": -27.30816650390625, "global_step": 452627, "epoch": 5453} {"train_loss": -26.979467391967773, "global_step": 452628, "epoch": 5453} {"train_loss": -27.067121505737305, "global_step": 452629, "epoch": 5453} {"train_loss": -26.965545654296875, "global_step": 452630, "epoch": 5453} {"train_loss": -27.019826889038086, "global_step": 452631, "epoch": 5453} {"train_loss": -27.39862632751465, "global_step": 452632, "epoch": 5453} {"train_loss": -26.9820613861084, "global_step": 452633, "epoch": 5453} {"train_loss": -27.16192626953125, "global_step": 452634, "epoch": 5453} {"train_loss": -27.04713249206543, "global_step": 452635, "epoch": 5453} {"train_loss": -27.185688018798828, "global_step": 452636, "epoch": 5453} {"train_loss": -27.055585861206055, "global_step": 452637, "epoch": 5453} {"train_loss": -27.303943634033203, "global_step": 452638, "epoch": 5453} {"train_loss": -27.11738395690918, "global_step": 452639, "epoch": 5453} {"train_loss": -27.298608779907227, "global_step": 452640, "epoch": 5453} {"train_loss": -27.165231704711914, "global_step": 452641, "epoch": 5453} {"train_loss": -27.219955444335938, "global_step": 452642, "epoch": 5453} {"train_loss": -27.018613815307617, "global_step": 452643, "epoch": 5453} {"train_loss": -27.2028865814209, "global_step": 452644, "epoch": 5453} {"train_loss": -27.33820152282715, "global_step": 452645, "epoch": 5453} {"train_loss": -26.93869972229004, "global_step": 452646, "epoch": 5453} {"train_loss": -27.12190055847168, "global_step": 452647, "epoch": 5453} {"train_loss": -26.954320907592773, "global_step": 452648, "epoch": 5453} {"train_loss": -26.979846954345703, "global_step": 452649, "epoch": 5453} {"train_loss": -27.150421142578125, "global_step": 452650, "epoch": 5453} {"train_loss": -27.715124130249023, "global_step": 452651, "epoch": 5453} {"train_loss": -27.266565322875977, "global_step": 452652, "epoch": 5453} {"train_loss": -27.450641632080078, "global_step": 452653, "epoch": 5453} {"train_loss": -27.077651977539062, "global_step": 452654, "epoch": 5453} {"train_loss": -27.093799591064453, "global_step": 452655, "epoch": 5453} {"train_loss": -27.0069522857666, "global_step": 452656, "epoch": 5453} {"train_loss": -26.64484214782715, "global_step": 452657, "epoch": 5453} {"train_loss": -26.980609893798828, "global_step": 452658, "epoch": 5453} {"train_loss": -25.967334747314453, "global_step": 452659, "epoch": 5453} {"train_loss": -26.593908309936523, "global_step": 452660, "epoch": 5453} {"train_loss": -26.946338653564453, "global_step": 452661, "epoch": 5453} {"train_loss": -26.438007354736328, "global_step": 452662, "epoch": 5453} {"train_loss": -26.785314559936523, "global_step": 452663, "epoch": 5453} {"train_loss": -26.27997398376465, "global_step": 452664, "epoch": 5453} {"train_loss": -26.400800704956055, "global_step": 452665, "epoch": 5453} {"train_loss": -26.563983917236328, "global_step": 452666, "epoch": 5453} {"train_loss": -26.92408561706543, "global_step": 452667, "epoch": 5453} {"train_loss": -26.55055809020996, "global_step": 452668, "epoch": 5453} {"train_loss": -26.7799072265625, "global_step": 452669, "epoch": 5453} {"train_loss": -26.537097930908203, "global_step": 452670, "epoch": 5453} {"train_loss": -25.91163444519043, "global_step": 452671, "epoch": 5453} {"train_loss": -26.91025733947754, "global_step": 452672, "epoch": 5453} {"train_loss": -26.55087661743164, "global_step": 452673, "epoch": 5453} {"train_loss": -27.107831954956055, "global_step": 452674, "epoch": 5453} {"train_loss": -27.029544830322266, "global_step": 452675, "epoch": 5453} {"train_loss": -26.726886749267578, "global_step": 452676, "epoch": 5453} {"train_loss": -26.704858779907227, "global_step": 452677, "epoch": 5453} {"train_loss": -26.96539306640625, "global_step": 452678, "epoch": 5453} {"train_loss": -26.80645179748535, "global_step": 452679, "epoch": 5453} {"train_loss": -26.728519439697266, "global_step": 452680, "epoch": 5453} {"train_loss": -26.88852510107569, "global_step": 452681, "epoch": 5453, "val_loss": 6477380.0} {"train_loss": -25.503555297851562, "global_step": 452682, "epoch": 5454} {"train_loss": -25.035512924194336, "global_step": 452683, "epoch": 5454} {"train_loss": -25.60340690612793, "global_step": 452684, "epoch": 5454} {"train_loss": -25.105443954467773, "global_step": 452685, "epoch": 5454} {"train_loss": -24.748472213745117, "global_step": 452686, "epoch": 5454} {"train_loss": -26.081104278564453, "global_step": 452687, "epoch": 5454} {"train_loss": -25.528425216674805, "global_step": 452688, "epoch": 5454} {"train_loss": -25.655826568603516, "global_step": 452689, "epoch": 5454} {"train_loss": -25.0631160736084, "global_step": 452690, "epoch": 5454} {"train_loss": -26.081531524658203, "global_step": 452691, "epoch": 5454} {"train_loss": -25.52687644958496, "global_step": 452692, "epoch": 5454} {"train_loss": -26.009504318237305, "global_step": 452693, "epoch": 5454} {"train_loss": -26.143163681030273, "global_step": 452694, "epoch": 5454} {"train_loss": -25.987207412719727, "global_step": 452695, "epoch": 5454} {"train_loss": -26.00628662109375, "global_step": 452696, "epoch": 5454} {"train_loss": -26.293781280517578, "global_step": 452697, "epoch": 5454} {"train_loss": -26.176258087158203, "global_step": 452698, "epoch": 5454} {"train_loss": -26.210205078125, "global_step": 452699, "epoch": 5454} {"train_loss": -25.97821617126465, "global_step": 452700, "epoch": 5454} {"train_loss": -25.897275924682617, "global_step": 452701, "epoch": 5454} {"train_loss": -26.729032516479492, "global_step": 452702, "epoch": 5454} {"train_loss": -26.35446548461914, "global_step": 452703, "epoch": 5454} {"train_loss": -26.46199607849121, "global_step": 452704, "epoch": 5454} {"train_loss": -26.637527465820312, "global_step": 452705, "epoch": 5454} {"train_loss": -26.5578556060791, "global_step": 452706, "epoch": 5454} {"train_loss": -26.715131759643555, "global_step": 452707, "epoch": 5454} {"train_loss": -26.693140029907227, "global_step": 452708, "epoch": 5454} {"train_loss": -26.556549072265625, "global_step": 452709, "epoch": 5454} {"train_loss": -26.672208786010742, "global_step": 452710, "epoch": 5454} {"train_loss": -26.572607040405273, "global_step": 452711, "epoch": 5454} {"train_loss": -26.75420570373535, "global_step": 452712, "epoch": 5454} {"train_loss": -26.8529109954834, "global_step": 452713, "epoch": 5454} {"train_loss": -26.871997833251953, "global_step": 452714, "epoch": 5454} {"train_loss": -26.72686195373535, "global_step": 452715, "epoch": 5454} {"train_loss": -26.853429794311523, "global_step": 452716, "epoch": 5454} {"train_loss": -26.82639503479004, "global_step": 452717, "epoch": 5454} {"train_loss": -26.874923706054688, "global_step": 452718, "epoch": 5454} {"train_loss": -26.632980346679688, "global_step": 452719, "epoch": 5454} {"train_loss": -26.886240005493164, "global_step": 452720, "epoch": 5454} {"train_loss": -27.017454147338867, "global_step": 452721, "epoch": 5454} {"train_loss": -27.193613052368164, "global_step": 452722, "epoch": 5454} {"train_loss": -27.0924015045166, "global_step": 452723, "epoch": 5454} {"train_loss": -26.905517578125, "global_step": 452724, "epoch": 5454} {"train_loss": -26.89593505859375, "global_step": 452725, "epoch": 5454} {"train_loss": -27.346572875976562, "global_step": 452726, "epoch": 5454} {"train_loss": -26.968664169311523, "global_step": 452727, "epoch": 5454} {"train_loss": -27.028522491455078, "global_step": 452728, "epoch": 5454} {"train_loss": -27.2778377532959, "global_step": 452729, "epoch": 5454} {"train_loss": -27.249271392822266, "global_step": 452730, "epoch": 5454} {"train_loss": -27.05232810974121, "global_step": 452731, "epoch": 5454} {"train_loss": -27.246679306030273, "global_step": 452732, "epoch": 5454} {"train_loss": -27.08051872253418, "global_step": 452733, "epoch": 5454} {"train_loss": -27.086862564086914, "global_step": 452734, "epoch": 5454} {"train_loss": -27.093341827392578, "global_step": 452735, "epoch": 5454} {"train_loss": -27.17766761779785, "global_step": 452736, "epoch": 5454} {"train_loss": -27.051416397094727, "global_step": 452737, "epoch": 5454} {"train_loss": -26.976093292236328, "global_step": 452738, "epoch": 5454} {"train_loss": -26.954980850219727, "global_step": 452739, "epoch": 5454} {"train_loss": -26.9295711517334, "global_step": 452740, "epoch": 5454} {"train_loss": -26.988744735717773, "global_step": 452741, "epoch": 5454} {"train_loss": -27.413623809814453, "global_step": 452742, "epoch": 5454} {"train_loss": -27.298084259033203, "global_step": 452743, "epoch": 5454} {"train_loss": -27.0042724609375, "global_step": 452744, "epoch": 5454} {"train_loss": -27.154956817626953, "global_step": 452745, "epoch": 5454} {"train_loss": -27.36334800720215, "global_step": 452746, "epoch": 5454} {"train_loss": -27.04506492614746, "global_step": 452747, "epoch": 5454} {"train_loss": -27.072904586791992, "global_step": 452748, "epoch": 5454} {"train_loss": -27.5101318359375, "global_step": 452749, "epoch": 5454} {"train_loss": -26.9149169921875, "global_step": 452750, "epoch": 5454} {"train_loss": -27.202606201171875, "global_step": 452751, "epoch": 5454} {"train_loss": -27.02638053894043, "global_step": 452752, "epoch": 5454} {"train_loss": -27.219451904296875, "global_step": 452753, "epoch": 5454} {"train_loss": -27.384368896484375, "global_step": 452754, "epoch": 5454} {"train_loss": -27.14320182800293, "global_step": 452755, "epoch": 5454} {"train_loss": -27.50600242614746, "global_step": 452756, "epoch": 5454} {"train_loss": -27.067529678344727, "global_step": 452757, "epoch": 5454} {"train_loss": -27.405908584594727, "global_step": 452758, "epoch": 5454} {"train_loss": -26.988651275634766, "global_step": 452759, "epoch": 5454} {"train_loss": -27.115966796875, "global_step": 452760, "epoch": 5454} {"train_loss": -26.716516494750977, "global_step": 452761, "epoch": 5454} {"train_loss": -27.15777015686035, "global_step": 452762, "epoch": 5454} {"train_loss": -26.90314292907715, "global_step": 452763, "epoch": 5454} {"train_loss": -26.68383010036974, "global_step": 452764, "epoch": 5454, "val_loss": 6535389.5} {"train_loss": -26.09454345703125, "global_step": 452765, "epoch": 5455} {"train_loss": -26.150827407836914, "global_step": 452766, "epoch": 5455} {"train_loss": -25.780637741088867, "global_step": 452767, "epoch": 5455} {"train_loss": -25.60566520690918, "global_step": 452768, "epoch": 5455} {"train_loss": -26.04425621032715, "global_step": 452769, "epoch": 5455} {"train_loss": -25.708410263061523, "global_step": 452770, "epoch": 5455} {"train_loss": -25.95635414123535, "global_step": 452771, "epoch": 5455} {"train_loss": -26.609821319580078, "global_step": 452772, "epoch": 5455} {"train_loss": -26.29351234436035, "global_step": 452773, "epoch": 5455} {"train_loss": -26.448211669921875, "global_step": 452774, "epoch": 5455} {"train_loss": -26.45429801940918, "global_step": 452775, "epoch": 5455} {"train_loss": -26.681232452392578, "global_step": 452776, "epoch": 5455} {"train_loss": -26.436359405517578, "global_step": 452777, "epoch": 5455} {"train_loss": -26.249120712280273, "global_step": 452778, "epoch": 5455} {"train_loss": -26.608413696289062, "global_step": 452779, "epoch": 5455} {"train_loss": -26.944799423217773, "global_step": 452780, "epoch": 5455} {"train_loss": -26.740747451782227, "global_step": 452781, "epoch": 5455} {"train_loss": -26.692609786987305, "global_step": 452782, "epoch": 5455} {"train_loss": -26.294178009033203, "global_step": 452783, "epoch": 5455} {"train_loss": -26.9901123046875, "global_step": 452784, "epoch": 5455} {"train_loss": -26.82337760925293, "global_step": 452785, "epoch": 5455} {"train_loss": -26.908178329467773, "global_step": 452786, "epoch": 5455} {"train_loss": -26.85894775390625, "global_step": 452787, "epoch": 5455} {"train_loss": -27.181074142456055, "global_step": 452788, "epoch": 5455} {"train_loss": -27.091733932495117, "global_step": 452789, "epoch": 5455} {"train_loss": -27.390302658081055, "global_step": 452790, "epoch": 5455} {"train_loss": -27.003345489501953, "global_step": 452791, "epoch": 5455} {"train_loss": -26.8938045501709, "global_step": 452792, "epoch": 5455} {"train_loss": -27.14509391784668, "global_step": 452793, "epoch": 5455} {"train_loss": -26.984039306640625, "global_step": 452794, "epoch": 5455} {"train_loss": -27.019744873046875, "global_step": 452795, "epoch": 5455} {"train_loss": -27.297895431518555, "global_step": 452796, "epoch": 5455} {"train_loss": -27.131742477416992, "global_step": 452797, "epoch": 5455} {"train_loss": -26.862354278564453, "global_step": 452798, "epoch": 5455} {"train_loss": -27.198047637939453, "global_step": 452799, "epoch": 5455} {"train_loss": -26.93206787109375, "global_step": 452800, "epoch": 5455} {"train_loss": -26.97543716430664, "global_step": 452801, "epoch": 5455} {"train_loss": -27.275373458862305, "global_step": 452802, "epoch": 5455} {"train_loss": -27.108102798461914, "global_step": 452803, "epoch": 5455} {"train_loss": -27.426549911499023, "global_step": 452804, "epoch": 5455} {"train_loss": -26.941999435424805, "global_step": 452805, "epoch": 5455} {"train_loss": -27.15033531188965, "global_step": 452806, "epoch": 5455} {"train_loss": -27.126907348632812, "global_step": 452807, "epoch": 5455} {"train_loss": -27.498411178588867, "global_step": 452808, "epoch": 5455} {"train_loss": -26.9503116607666, "global_step": 452809, "epoch": 5455} {"train_loss": -27.239959716796875, "global_step": 452810, "epoch": 5455} {"train_loss": -27.1666202545166, "global_step": 452811, "epoch": 5455} {"train_loss": -27.354894638061523, "global_step": 452812, "epoch": 5455} {"train_loss": -27.230680465698242, "global_step": 452813, "epoch": 5455} {"train_loss": -27.422515869140625, "global_step": 452814, "epoch": 5455} {"train_loss": -27.478839874267578, "global_step": 452815, "epoch": 5455} {"train_loss": -27.23874855041504, "global_step": 452816, "epoch": 5455} {"train_loss": -27.439085006713867, "global_step": 452817, "epoch": 5455} {"train_loss": -26.77613639831543, "global_step": 452818, "epoch": 5455} {"train_loss": -27.77033042907715, "global_step": 452819, "epoch": 5455} {"train_loss": -27.33724021911621, "global_step": 452820, "epoch": 5455} {"train_loss": -27.395767211914062, "global_step": 452821, "epoch": 5455} {"train_loss": -27.21868324279785, "global_step": 452822, "epoch": 5455} {"train_loss": -27.54920768737793, "global_step": 452823, "epoch": 5455} {"train_loss": -27.04951286315918, "global_step": 452824, "epoch": 5455} {"train_loss": -27.581684112548828, "global_step": 452825, "epoch": 5455} {"train_loss": -27.172964096069336, "global_step": 452826, "epoch": 5455} {"train_loss": -26.9674129486084, "global_step": 452827, "epoch": 5455} {"train_loss": -26.374725341796875, "global_step": 452828, "epoch": 5455} {"train_loss": -25.163541793823242, "global_step": 452829, "epoch": 5455} {"train_loss": -24.032087326049805, "global_step": 452830, "epoch": 5455} {"train_loss": -24.41912269592285, "global_step": 452831, "epoch": 5455} {"train_loss": -25.903553009033203, "global_step": 452832, "epoch": 5455} {"train_loss": -25.4637451171875, "global_step": 452833, "epoch": 5455} {"train_loss": -25.902231216430664, "global_step": 452834, "epoch": 5455} {"train_loss": -26.08127784729004, "global_step": 452835, "epoch": 5455} {"train_loss": -26.03350257873535, "global_step": 452836, "epoch": 5455} {"train_loss": -26.175806045532227, "global_step": 452837, "epoch": 5455} {"train_loss": -26.19085121154785, "global_step": 452838, "epoch": 5455} {"train_loss": -26.261518478393555, "global_step": 452839, "epoch": 5455} {"train_loss": -26.736175537109375, "global_step": 452840, "epoch": 5455} {"train_loss": -25.939971923828125, "global_step": 452841, "epoch": 5455} {"train_loss": -26.525434494018555, "global_step": 452842, "epoch": 5455} {"train_loss": -26.218006134033203, "global_step": 452843, "epoch": 5455} {"train_loss": -26.120019912719727, "global_step": 452844, "epoch": 5455} {"train_loss": -26.430484771728516, "global_step": 452845, "epoch": 5455} {"train_loss": -26.51954460144043, "global_step": 452846, "epoch": 5455} {"train_loss": -26.68775629710002, "global_step": 452847, "epoch": 5455, "val_loss": 6360173.0} {"train_loss": -25.982925415039062, "global_step": 452848, "epoch": 5456} {"train_loss": -24.90071678161621, "global_step": 452849, "epoch": 5456} {"train_loss": -25.931562423706055, "global_step": 452850, "epoch": 5456} {"train_loss": -25.649429321289062, "global_step": 452851, "epoch": 5456} {"train_loss": -25.830652236938477, "global_step": 452852, "epoch": 5456} {"train_loss": -25.904178619384766, "global_step": 452853, "epoch": 5456} {"train_loss": -26.250844955444336, "global_step": 452854, "epoch": 5456} {"train_loss": -26.170461654663086, "global_step": 452855, "epoch": 5456} {"train_loss": -26.550077438354492, "global_step": 452856, "epoch": 5456} {"train_loss": -26.137800216674805, "global_step": 452857, "epoch": 5456} {"train_loss": -26.217803955078125, "global_step": 452858, "epoch": 5456} {"train_loss": -26.39240837097168, "global_step": 452859, "epoch": 5456} {"train_loss": -26.37467384338379, "global_step": 452860, "epoch": 5456} {"train_loss": -26.558685302734375, "global_step": 452861, "epoch": 5456} {"train_loss": -26.21021842956543, "global_step": 452862, "epoch": 5456} {"train_loss": -26.396686553955078, "global_step": 452863, "epoch": 5456} {"train_loss": -26.45132827758789, "global_step": 452864, "epoch": 5456} {"train_loss": -26.406248092651367, "global_step": 452865, "epoch": 5456} {"train_loss": -26.85466957092285, "global_step": 452866, "epoch": 5456} {"train_loss": -26.360082626342773, "global_step": 452867, "epoch": 5456} {"train_loss": -26.885034561157227, "global_step": 452868, "epoch": 5456} {"train_loss": -26.305830001831055, "global_step": 452869, "epoch": 5456} {"train_loss": -27.054183959960938, "global_step": 452870, "epoch": 5456} {"train_loss": -26.169485092163086, "global_step": 452871, "epoch": 5456} {"train_loss": -27.161930084228516, "global_step": 452872, "epoch": 5456} {"train_loss": -26.69137954711914, "global_step": 452873, "epoch": 5456} {"train_loss": -26.79119300842285, "global_step": 452874, "epoch": 5456} {"train_loss": -26.919885635375977, "global_step": 452875, "epoch": 5456} {"train_loss": -26.774795532226562, "global_step": 452876, "epoch": 5456} {"train_loss": -26.925861358642578, "global_step": 452877, "epoch": 5456} {"train_loss": -26.921361923217773, "global_step": 452878, "epoch": 5456} {"train_loss": -27.002893447875977, "global_step": 452879, "epoch": 5456} {"train_loss": -26.845630645751953, "global_step": 452880, "epoch": 5456} {"train_loss": -26.82813835144043, "global_step": 452881, "epoch": 5456} {"train_loss": -27.05536460876465, "global_step": 452882, "epoch": 5456} {"train_loss": -26.86948585510254, "global_step": 452883, "epoch": 5456} {"train_loss": -27.108007431030273, "global_step": 452884, "epoch": 5456} {"train_loss": -27.276752471923828, "global_step": 452885, "epoch": 5456} {"train_loss": -27.239965438842773, "global_step": 452886, "epoch": 5456} {"train_loss": -27.02152442932129, "global_step": 452887, "epoch": 5456} {"train_loss": -27.242572784423828, "global_step": 452888, "epoch": 5456} {"train_loss": -26.7473087310791, "global_step": 452889, "epoch": 5456} {"train_loss": -27.00290298461914, "global_step": 452890, "epoch": 5456} {"train_loss": -27.068220138549805, "global_step": 452891, "epoch": 5456} {"train_loss": -27.04364585876465, "global_step": 452892, "epoch": 5456} {"train_loss": -27.113874435424805, "global_step": 452893, "epoch": 5456} {"train_loss": -26.865264892578125, "global_step": 452894, "epoch": 5456} {"train_loss": -27.074329376220703, "global_step": 452895, "epoch": 5456} {"train_loss": -27.38972282409668, "global_step": 452896, "epoch": 5456} {"train_loss": -27.450414657592773, "global_step": 452897, "epoch": 5456} {"train_loss": -26.986114501953125, "global_step": 452898, "epoch": 5456} {"train_loss": -27.222253799438477, "global_step": 452899, "epoch": 5456} {"train_loss": -27.372812271118164, "global_step": 452900, "epoch": 5456} {"train_loss": -26.994421005249023, "global_step": 452901, "epoch": 5456} {"train_loss": -27.2635498046875, "global_step": 452902, "epoch": 5456} {"train_loss": -27.120527267456055, "global_step": 452903, "epoch": 5456} {"train_loss": -27.517826080322266, "global_step": 452904, "epoch": 5456} {"train_loss": -27.1689395904541, "global_step": 452905, "epoch": 5456} {"train_loss": -27.123504638671875, "global_step": 452906, "epoch": 5456} {"train_loss": -26.981128692626953, "global_step": 452907, "epoch": 5456} {"train_loss": -27.123184204101562, "global_step": 452908, "epoch": 5456} {"train_loss": -27.167306900024414, "global_step": 452909, "epoch": 5456} {"train_loss": -27.093902587890625, "global_step": 452910, "epoch": 5456} {"train_loss": -27.371545791625977, "global_step": 452911, "epoch": 5456} {"train_loss": -27.298187255859375, "global_step": 452912, "epoch": 5456} {"train_loss": -27.17612075805664, "global_step": 452913, "epoch": 5456} {"train_loss": -27.065963745117188, "global_step": 452914, "epoch": 5456} {"train_loss": -27.5025577545166, "global_step": 452915, "epoch": 5456} {"train_loss": -27.149005889892578, "global_step": 452916, "epoch": 5456} {"train_loss": -27.516559600830078, "global_step": 452917, "epoch": 5456} {"train_loss": -27.013391494750977, "global_step": 452918, "epoch": 5456} {"train_loss": -27.03683853149414, "global_step": 452919, "epoch": 5456} {"train_loss": -27.37649917602539, "global_step": 452920, "epoch": 5456} {"train_loss": -27.40937614440918, "global_step": 452921, "epoch": 5456} {"train_loss": -26.942941665649414, "global_step": 452922, "epoch": 5456} {"train_loss": -27.0263671875, "global_step": 452923, "epoch": 5456} {"train_loss": -26.911020278930664, "global_step": 452924, "epoch": 5456} {"train_loss": -26.809890747070312, "global_step": 452925, "epoch": 5456} {"train_loss": -26.96640396118164, "global_step": 452926, "epoch": 5456} {"train_loss": -27.229053497314453, "global_step": 452927, "epoch": 5456} {"train_loss": -26.996551513671875, "global_step": 452928, "epoch": 5456} {"train_loss": -27.116743087768555, "global_step": 452929, "epoch": 5456} {"train_loss": -26.860076674495836, "global_step": 452930, "epoch": 5456, "val_loss": 6707014.0} {"train_loss": -27.10175895690918, "global_step": 452931, "epoch": 5457} {"train_loss": -26.50758934020996, "global_step": 452932, "epoch": 5457} {"train_loss": -26.530561447143555, "global_step": 452933, "epoch": 5457} {"train_loss": -26.674360275268555, "global_step": 452934, "epoch": 5457} {"train_loss": -26.41147232055664, "global_step": 452935, "epoch": 5457} {"train_loss": -26.880834579467773, "global_step": 452936, "epoch": 5457} {"train_loss": -26.667165756225586, "global_step": 452937, "epoch": 5457} {"train_loss": -26.907068252563477, "global_step": 452938, "epoch": 5457} {"train_loss": -26.90232276916504, "global_step": 452939, "epoch": 5457} {"train_loss": -26.87115478515625, "global_step": 452940, "epoch": 5457} {"train_loss": -26.769184112548828, "global_step": 452941, "epoch": 5457} {"train_loss": -26.891469955444336, "global_step": 452942, "epoch": 5457} {"train_loss": -27.04107093811035, "global_step": 452943, "epoch": 5457} {"train_loss": -27.018442153930664, "global_step": 452944, "epoch": 5457} {"train_loss": -26.921255111694336, "global_step": 452945, "epoch": 5457} {"train_loss": -26.791248321533203, "global_step": 452946, "epoch": 5457} {"train_loss": -26.841358184814453, "global_step": 452947, "epoch": 5457} {"train_loss": -26.695892333984375, "global_step": 452948, "epoch": 5457} {"train_loss": -27.137338638305664, "global_step": 452949, "epoch": 5457} {"train_loss": -27.28602409362793, "global_step": 452950, "epoch": 5457} {"train_loss": -27.428186416625977, "global_step": 452951, "epoch": 5457} {"train_loss": -26.883222579956055, "global_step": 452952, "epoch": 5457} {"train_loss": -27.3632755279541, "global_step": 452953, "epoch": 5457} {"train_loss": -27.1552791595459, "global_step": 452954, "epoch": 5457} {"train_loss": -27.0257511138916, "global_step": 452955, "epoch": 5457} {"train_loss": -27.103321075439453, "global_step": 452956, "epoch": 5457} {"train_loss": -27.15924644470215, "global_step": 452957, "epoch": 5457} {"train_loss": -27.39790153503418, "global_step": 452958, "epoch": 5457} {"train_loss": -27.464223861694336, "global_step": 452959, "epoch": 5457} {"train_loss": -27.2399959564209, "global_step": 452960, "epoch": 5457} {"train_loss": -27.372364044189453, "global_step": 452961, "epoch": 5457} {"train_loss": -27.284521102905273, "global_step": 452962, "epoch": 5457} {"train_loss": -27.15936851501465, "global_step": 452963, "epoch": 5457} {"train_loss": -27.2069091796875, "global_step": 452964, "epoch": 5457} {"train_loss": -27.471601486206055, "global_step": 452965, "epoch": 5457} {"train_loss": -26.80940055847168, "global_step": 452966, "epoch": 5457} {"train_loss": -26.34380531311035, "global_step": 452967, "epoch": 5457} {"train_loss": -26.856388092041016, "global_step": 452968, "epoch": 5457} {"train_loss": -27.043365478515625, "global_step": 452969, "epoch": 5457} {"train_loss": -27.3351993560791, "global_step": 452970, "epoch": 5457} {"train_loss": -27.19220542907715, "global_step": 452971, "epoch": 5457} {"train_loss": -27.112863540649414, "global_step": 452972, "epoch": 5457} {"train_loss": -27.13956069946289, "global_step": 452973, "epoch": 5457} {"train_loss": -27.576791763305664, "global_step": 452974, "epoch": 5457} {"train_loss": -27.085432052612305, "global_step": 452975, "epoch": 5457} {"train_loss": -27.407957077026367, "global_step": 452976, "epoch": 5457} {"train_loss": -27.099958419799805, "global_step": 452977, "epoch": 5457} {"train_loss": -26.817102432250977, "global_step": 452978, "epoch": 5457} {"train_loss": -27.45424461364746, "global_step": 452979, "epoch": 5457} {"train_loss": -27.362995147705078, "global_step": 452980, "epoch": 5457} {"train_loss": -27.399755477905273, "global_step": 452981, "epoch": 5457} {"train_loss": -26.894577026367188, "global_step": 452982, "epoch": 5457} {"train_loss": -27.263219833374023, "global_step": 452983, "epoch": 5457} {"train_loss": -27.219297409057617, "global_step": 452984, "epoch": 5457} {"train_loss": -27.33491325378418, "global_step": 452985, "epoch": 5457} {"train_loss": -27.250661849975586, "global_step": 452986, "epoch": 5457} {"train_loss": -26.66499137878418, "global_step": 452987, "epoch": 5457} {"train_loss": -26.84160804748535, "global_step": 452988, "epoch": 5457} {"train_loss": -26.890329360961914, "global_step": 452989, "epoch": 5457} {"train_loss": -26.996780395507812, "global_step": 452990, "epoch": 5457} {"train_loss": -27.01263999938965, "global_step": 452991, "epoch": 5457} {"train_loss": -27.022607803344727, "global_step": 452992, "epoch": 5457} {"train_loss": -26.82782554626465, "global_step": 452993, "epoch": 5457} {"train_loss": -27.032855987548828, "global_step": 452994, "epoch": 5457} {"train_loss": -26.870527267456055, "global_step": 452995, "epoch": 5457} {"train_loss": -27.224109649658203, "global_step": 452996, "epoch": 5457} {"train_loss": -26.527135848999023, "global_step": 452997, "epoch": 5457} {"train_loss": -27.296361923217773, "global_step": 452998, "epoch": 5457} {"train_loss": -27.272735595703125, "global_step": 452999, "epoch": 5457} {"train_loss": -27.19464111328125, "global_step": 453000, "epoch": 5457} {"train_loss": -26.952192306518555, "global_step": 453001, "epoch": 5457} {"train_loss": -27.361169815063477, "global_step": 453002, "epoch": 5457} {"train_loss": -27.0788631439209, "global_step": 453003, "epoch": 5457} {"train_loss": -26.64827537536621, "global_step": 453004, "epoch": 5457} {"train_loss": -27.483121871948242, "global_step": 453005, "epoch": 5457} {"train_loss": -27.078479766845703, "global_step": 453006, "epoch": 5457} {"train_loss": -26.934106826782227, "global_step": 453007, "epoch": 5457} {"train_loss": -27.167591094970703, "global_step": 453008, "epoch": 5457} {"train_loss": -26.90592384338379, "global_step": 453009, "epoch": 5457} {"train_loss": -27.03647804260254, "global_step": 453010, "epoch": 5457} {"train_loss": -27.240478515625, "global_step": 453011, "epoch": 5457} {"train_loss": -26.857324600219727, "global_step": 453012, "epoch": 5457} {"train_loss": -27.047474849654968, "global_step": 453013, "epoch": 5457, "val_loss": 6658085.0} {"train_loss": -27.123823165893555, "global_step": 453014, "epoch": 5458} {"train_loss": -27.038618087768555, "global_step": 453015, "epoch": 5458} {"train_loss": -26.70674705505371, "global_step": 453016, "epoch": 5458} {"train_loss": -26.81751823425293, "global_step": 453017, "epoch": 5458} {"train_loss": -26.76154136657715, "global_step": 453018, "epoch": 5458} {"train_loss": -26.405609130859375, "global_step": 453019, "epoch": 5458} {"train_loss": -26.876096725463867, "global_step": 453020, "epoch": 5458} {"train_loss": -26.654254913330078, "global_step": 453021, "epoch": 5458} {"train_loss": -26.646453857421875, "global_step": 453022, "epoch": 5458} {"train_loss": -26.661035537719727, "global_step": 453023, "epoch": 5458} {"train_loss": -26.372161865234375, "global_step": 453024, "epoch": 5458} {"train_loss": -26.56263542175293, "global_step": 453025, "epoch": 5458} {"train_loss": -26.670520782470703, "global_step": 453026, "epoch": 5458} {"train_loss": -26.421417236328125, "global_step": 453027, "epoch": 5458} {"train_loss": -26.704666137695312, "global_step": 453028, "epoch": 5458} {"train_loss": -26.661828994750977, "global_step": 453029, "epoch": 5458} {"train_loss": -26.513916015625, "global_step": 453030, "epoch": 5458} {"train_loss": -26.70731544494629, "global_step": 453031, "epoch": 5458} {"train_loss": -26.932031631469727, "global_step": 453032, "epoch": 5458} {"train_loss": -26.893781661987305, "global_step": 453033, "epoch": 5458} {"train_loss": -26.73233985900879, "global_step": 453034, "epoch": 5458} {"train_loss": -26.97797203063965, "global_step": 453035, "epoch": 5458} {"train_loss": -27.122400283813477, "global_step": 453036, "epoch": 5458} {"train_loss": -26.97820472717285, "global_step": 453037, "epoch": 5458} {"train_loss": -26.982101440429688, "global_step": 453038, "epoch": 5458} {"train_loss": -27.243818283081055, "global_step": 453039, "epoch": 5458} {"train_loss": -27.188587188720703, "global_step": 453040, "epoch": 5458} {"train_loss": -27.559797286987305, "global_step": 453041, "epoch": 5458} {"train_loss": -26.986852645874023, "global_step": 453042, "epoch": 5458} {"train_loss": -26.829782485961914, "global_step": 453043, "epoch": 5458} {"train_loss": -26.955713272094727, "global_step": 453044, "epoch": 5458} {"train_loss": -26.51369285583496, "global_step": 453045, "epoch": 5458} {"train_loss": -26.9895076751709, "global_step": 453046, "epoch": 5458} {"train_loss": -27.029874801635742, "global_step": 453047, "epoch": 5458} {"train_loss": -27.29347038269043, "global_step": 453048, "epoch": 5458} {"train_loss": -27.238494873046875, "global_step": 453049, "epoch": 5458} {"train_loss": -26.7199764251709, "global_step": 453050, "epoch": 5458} {"train_loss": -26.665525436401367, "global_step": 453051, "epoch": 5458} {"train_loss": -26.5860595703125, "global_step": 453052, "epoch": 5458} {"train_loss": -26.481412887573242, "global_step": 453053, "epoch": 5458} {"train_loss": -27.032318115234375, "global_step": 453054, "epoch": 5458} {"train_loss": -27.05952262878418, "global_step": 453055, "epoch": 5458} {"train_loss": -26.56667137145996, "global_step": 453056, "epoch": 5458} {"train_loss": -27.268537521362305, "global_step": 453057, "epoch": 5458} {"train_loss": -26.796918869018555, "global_step": 453058, "epoch": 5458} {"train_loss": -26.962491989135742, "global_step": 453059, "epoch": 5458} {"train_loss": -26.933374404907227, "global_step": 453060, "epoch": 5458} {"train_loss": -26.958362579345703, "global_step": 453061, "epoch": 5458} {"train_loss": -26.9489688873291, "global_step": 453062, "epoch": 5458} {"train_loss": -26.979894638061523, "global_step": 453063, "epoch": 5458} {"train_loss": -27.37323570251465, "global_step": 453064, "epoch": 5458} {"train_loss": -26.782962799072266, "global_step": 453065, "epoch": 5458} {"train_loss": -26.899396896362305, "global_step": 453066, "epoch": 5458} {"train_loss": -26.701398849487305, "global_step": 453067, "epoch": 5458} {"train_loss": -26.74897575378418, "global_step": 453068, "epoch": 5458} {"train_loss": -26.9468936920166, "global_step": 453069, "epoch": 5458} {"train_loss": -26.587543487548828, "global_step": 453070, "epoch": 5458} {"train_loss": -26.861486434936523, "global_step": 453071, "epoch": 5458} {"train_loss": -27.1322078704834, "global_step": 453072, "epoch": 5458} {"train_loss": -27.112716674804688, "global_step": 453073, "epoch": 5458} {"train_loss": -27.021320343017578, "global_step": 453074, "epoch": 5458} {"train_loss": -27.079360961914062, "global_step": 453075, "epoch": 5458} {"train_loss": -27.121967315673828, "global_step": 453076, "epoch": 5458} {"train_loss": -27.131162643432617, "global_step": 453077, "epoch": 5458} {"train_loss": -27.284521102905273, "global_step": 453078, "epoch": 5458} {"train_loss": -27.220685958862305, "global_step": 453079, "epoch": 5458} {"train_loss": -27.177051544189453, "global_step": 453080, "epoch": 5458} {"train_loss": -27.00290298461914, "global_step": 453081, "epoch": 5458} {"train_loss": -27.4339656829834, "global_step": 453082, "epoch": 5458} {"train_loss": -26.76735496520996, "global_step": 453083, "epoch": 5458} {"train_loss": -27.18079948425293, "global_step": 453084, "epoch": 5458} {"train_loss": -26.970443725585938, "global_step": 453085, "epoch": 5458} {"train_loss": -27.01380729675293, "global_step": 453086, "epoch": 5458} {"train_loss": -26.923627853393555, "global_step": 453087, "epoch": 5458} {"train_loss": -26.893604278564453, "global_step": 453088, "epoch": 5458} {"train_loss": -27.025897979736328, "global_step": 453089, "epoch": 5458} {"train_loss": -27.13160514831543, "global_step": 453090, "epoch": 5458} {"train_loss": -26.87664222717285, "global_step": 453091, "epoch": 5458} {"train_loss": -27.044458389282227, "global_step": 453092, "epoch": 5458} {"train_loss": -27.027074813842773, "global_step": 453093, "epoch": 5458} {"train_loss": -27.47220230102539, "global_step": 453094, "epoch": 5458} {"train_loss": -27.022052764892578, "global_step": 453095, "epoch": 5458} {"train_loss": -26.924236918070232, "global_step": 453096, "epoch": 5458, "val_loss": 6670524.0} {"train_loss": -26.609283447265625, "global_step": 453097, "epoch": 5459} {"train_loss": -26.41634178161621, "global_step": 453098, "epoch": 5459} {"train_loss": -26.589258193969727, "global_step": 453099, "epoch": 5459} {"train_loss": -26.92352294921875, "global_step": 453100, "epoch": 5459} {"train_loss": -26.508453369140625, "global_step": 453101, "epoch": 5459} {"train_loss": -26.582746505737305, "global_step": 453102, "epoch": 5459} {"train_loss": -26.682235717773438, "global_step": 453103, "epoch": 5459} {"train_loss": -26.48981285095215, "global_step": 453104, "epoch": 5459} {"train_loss": -26.982999801635742, "global_step": 453105, "epoch": 5459} {"train_loss": -27.122522354125977, "global_step": 453106, "epoch": 5459} {"train_loss": -27.196340560913086, "global_step": 453107, "epoch": 5459} {"train_loss": -27.10300064086914, "global_step": 453108, "epoch": 5459} {"train_loss": -26.98382568359375, "global_step": 453109, "epoch": 5459} {"train_loss": -27.078536987304688, "global_step": 453110, "epoch": 5459} {"train_loss": -26.95134925842285, "global_step": 453111, "epoch": 5459} {"train_loss": -26.789722442626953, "global_step": 453112, "epoch": 5459} {"train_loss": -27.26661491394043, "global_step": 453113, "epoch": 5459} {"train_loss": -27.068876266479492, "global_step": 453114, "epoch": 5459} {"train_loss": -26.96066665649414, "global_step": 453115, "epoch": 5459} {"train_loss": -26.861719131469727, "global_step": 453116, "epoch": 5459} {"train_loss": -27.19882583618164, "global_step": 453117, "epoch": 5459} {"train_loss": -27.11903190612793, "global_step": 453118, "epoch": 5459} {"train_loss": -27.19636344909668, "global_step": 453119, "epoch": 5459} {"train_loss": -27.07050132751465, "global_step": 453120, "epoch": 5459} {"train_loss": -27.1118106842041, "global_step": 453121, "epoch": 5459} {"train_loss": -27.41226577758789, "global_step": 453122, "epoch": 5459} {"train_loss": -27.429296493530273, "global_step": 453123, "epoch": 5459} {"train_loss": -27.479185104370117, "global_step": 453124, "epoch": 5459} {"train_loss": -27.31379508972168, "global_step": 453125, "epoch": 5459} {"train_loss": -27.177398681640625, "global_step": 453126, "epoch": 5459} {"train_loss": -27.225387573242188, "global_step": 453127, "epoch": 5459} {"train_loss": -27.463729858398438, "global_step": 453128, "epoch": 5459} {"train_loss": -27.23109245300293, "global_step": 453129, "epoch": 5459} {"train_loss": -27.13551139831543, "global_step": 453130, "epoch": 5459} {"train_loss": -26.791513442993164, "global_step": 453131, "epoch": 5459} {"train_loss": -27.167041778564453, "global_step": 453132, "epoch": 5459} {"train_loss": -27.022296905517578, "global_step": 453133, "epoch": 5459} {"train_loss": -27.341638565063477, "global_step": 453134, "epoch": 5459} {"train_loss": -27.093923568725586, "global_step": 453135, "epoch": 5459} {"train_loss": -27.231658935546875, "global_step": 453136, "epoch": 5459} {"train_loss": -26.917434692382812, "global_step": 453137, "epoch": 5459} {"train_loss": -27.23190689086914, "global_step": 453138, "epoch": 5459} {"train_loss": -27.125715255737305, "global_step": 453139, "epoch": 5459} {"train_loss": -27.11237907409668, "global_step": 453140, "epoch": 5459} {"train_loss": -26.693374633789062, "global_step": 453141, "epoch": 5459} {"train_loss": -27.112506866455078, "global_step": 453142, "epoch": 5459} {"train_loss": -27.39657974243164, "global_step": 453143, "epoch": 5459} {"train_loss": -26.679412841796875, "global_step": 453144, "epoch": 5459} {"train_loss": -26.920185089111328, "global_step": 453145, "epoch": 5459} {"train_loss": -27.047651290893555, "global_step": 453146, "epoch": 5459} {"train_loss": -27.3277530670166, "global_step": 453147, "epoch": 5459} {"train_loss": -27.084585189819336, "global_step": 453148, "epoch": 5459} {"train_loss": -27.484542846679688, "global_step": 453149, "epoch": 5459} {"train_loss": -27.0545654296875, "global_step": 453150, "epoch": 5459} {"train_loss": -26.669300079345703, "global_step": 453151, "epoch": 5459} {"train_loss": -27.148874282836914, "global_step": 453152, "epoch": 5459} {"train_loss": -27.135528564453125, "global_step": 453153, "epoch": 5459} {"train_loss": -27.192068099975586, "global_step": 453154, "epoch": 5459} {"train_loss": -27.275365829467773, "global_step": 453155, "epoch": 5459} {"train_loss": -27.016666412353516, "global_step": 453156, "epoch": 5459} {"train_loss": -27.00200843811035, "global_step": 453157, "epoch": 5459} {"train_loss": -27.05853843688965, "global_step": 453158, "epoch": 5459} {"train_loss": -27.41474723815918, "global_step": 453159, "epoch": 5459} {"train_loss": -27.17909049987793, "global_step": 453160, "epoch": 5459} {"train_loss": -26.961034774780273, "global_step": 453161, "epoch": 5459} {"train_loss": -27.47700309753418, "global_step": 453162, "epoch": 5459} {"train_loss": -27.375934600830078, "global_step": 453163, "epoch": 5459} {"train_loss": -27.144012451171875, "global_step": 453164, "epoch": 5459} {"train_loss": -27.212833404541016, "global_step": 453165, "epoch": 5459} {"train_loss": -27.282148361206055, "global_step": 453166, "epoch": 5459} {"train_loss": -26.865888595581055, "global_step": 453167, "epoch": 5459} {"train_loss": -27.030317306518555, "global_step": 453168, "epoch": 5459} {"train_loss": -27.1629695892334, "global_step": 453169, "epoch": 5459} {"train_loss": -26.99445152282715, "global_step": 453170, "epoch": 5459} {"train_loss": -26.95577049255371, "global_step": 453171, "epoch": 5459} {"train_loss": -26.600492477416992, "global_step": 453172, "epoch": 5459} {"train_loss": -26.49811363220215, "global_step": 453173, "epoch": 5459} {"train_loss": -26.583005905151367, "global_step": 453174, "epoch": 5459} {"train_loss": -26.6058292388916, "global_step": 453175, "epoch": 5459} {"train_loss": -26.927831649780273, "global_step": 453176, "epoch": 5459} {"train_loss": -26.63348388671875, "global_step": 453177, "epoch": 5459} {"train_loss": -26.746723175048828, "global_step": 453178, "epoch": 5459} {"train_loss": -27.04656564183982, "global_step": 453179, "epoch": 5459, "val_loss": 6763726.0} {"train_loss": -25.112401962280273, "global_step": 453180, "epoch": 5460} {"train_loss": -25.996850967407227, "global_step": 453181, "epoch": 5460} {"train_loss": -25.078420639038086, "global_step": 453182, "epoch": 5460} {"train_loss": -25.95660972595215, "global_step": 453183, "epoch": 5460} {"train_loss": -25.854969024658203, "global_step": 453184, "epoch": 5460} {"train_loss": -25.98166847229004, "global_step": 453185, "epoch": 5460} {"train_loss": -26.155012130737305, "global_step": 453186, "epoch": 5460} {"train_loss": -25.739004135131836, "global_step": 453187, "epoch": 5460} {"train_loss": -26.49981117248535, "global_step": 453188, "epoch": 5460} {"train_loss": -25.813974380493164, "global_step": 453189, "epoch": 5460} {"train_loss": -26.4005184173584, "global_step": 453190, "epoch": 5460} {"train_loss": -26.582595825195312, "global_step": 453191, "epoch": 5460} {"train_loss": -26.514636993408203, "global_step": 453192, "epoch": 5460} {"train_loss": -26.360883712768555, "global_step": 453193, "epoch": 5460} {"train_loss": -26.4841365814209, "global_step": 453194, "epoch": 5460} {"train_loss": -26.296463012695312, "global_step": 453195, "epoch": 5460} {"train_loss": -26.195831298828125, "global_step": 453196, "epoch": 5460} {"train_loss": -26.663557052612305, "global_step": 453197, "epoch": 5460} {"train_loss": -26.346044540405273, "global_step": 453198, "epoch": 5460} {"train_loss": -26.3364200592041, "global_step": 453199, "epoch": 5460} {"train_loss": -26.287092208862305, "global_step": 453200, "epoch": 5460} {"train_loss": -26.501928329467773, "global_step": 453201, "epoch": 5460} {"train_loss": -26.764989852905273, "global_step": 453202, "epoch": 5460} {"train_loss": -26.490711212158203, "global_step": 453203, "epoch": 5460} {"train_loss": -26.490514755249023, "global_step": 453204, "epoch": 5460} {"train_loss": -26.387311935424805, "global_step": 453205, "epoch": 5460} {"train_loss": -26.432968139648438, "global_step": 453206, "epoch": 5460} {"train_loss": -26.573883056640625, "global_step": 453207, "epoch": 5460} {"train_loss": -26.53803825378418, "global_step": 453208, "epoch": 5460} {"train_loss": -26.70819664001465, "global_step": 453209, "epoch": 5460} {"train_loss": -26.42242431640625, "global_step": 453210, "epoch": 5460} {"train_loss": -26.751813888549805, "global_step": 453211, "epoch": 5460} {"train_loss": -26.950952529907227, "global_step": 453212, "epoch": 5460} {"train_loss": -27.125354766845703, "global_step": 453213, "epoch": 5460} {"train_loss": -26.852575302124023, "global_step": 453214, "epoch": 5460} {"train_loss": -26.75434684753418, "global_step": 453215, "epoch": 5460} {"train_loss": -26.732940673828125, "global_step": 453216, "epoch": 5460} {"train_loss": -26.921789169311523, "global_step": 453217, "epoch": 5460} {"train_loss": -27.18186378479004, "global_step": 453218, "epoch": 5460} {"train_loss": -27.2786865234375, "global_step": 453219, "epoch": 5460} {"train_loss": -27.180139541625977, "global_step": 453220, "epoch": 5460} {"train_loss": -27.078332901000977, "global_step": 453221, "epoch": 5460} {"train_loss": -27.335224151611328, "global_step": 453222, "epoch": 5460} {"train_loss": -27.382787704467773, "global_step": 453223, "epoch": 5460} {"train_loss": -27.416181564331055, "global_step": 453224, "epoch": 5460} {"train_loss": -27.194421768188477, "global_step": 453225, "epoch": 5460} {"train_loss": -26.862573623657227, "global_step": 453226, "epoch": 5460} {"train_loss": -27.425769805908203, "global_step": 453227, "epoch": 5460} {"train_loss": -26.984619140625, "global_step": 453228, "epoch": 5460} {"train_loss": -27.23297119140625, "global_step": 453229, "epoch": 5460} {"train_loss": -26.983579635620117, "global_step": 453230, "epoch": 5460} {"train_loss": -27.352954864501953, "global_step": 453231, "epoch": 5460} {"train_loss": -27.358001708984375, "global_step": 453232, "epoch": 5460} {"train_loss": -27.438657760620117, "global_step": 453233, "epoch": 5460} {"train_loss": -27.435510635375977, "global_step": 453234, "epoch": 5460} {"train_loss": -27.433034896850586, "global_step": 453235, "epoch": 5460} {"train_loss": -27.01344108581543, "global_step": 453236, "epoch": 5460} {"train_loss": -27.1396541595459, "global_step": 453237, "epoch": 5460} {"train_loss": -27.107885360717773, "global_step": 453238, "epoch": 5460} {"train_loss": -27.287220001220703, "global_step": 453239, "epoch": 5460} {"train_loss": -27.034452438354492, "global_step": 453240, "epoch": 5460} {"train_loss": -27.320287704467773, "global_step": 453241, "epoch": 5460} {"train_loss": -27.286100387573242, "global_step": 453242, "epoch": 5460} {"train_loss": -27.1314697265625, "global_step": 453243, "epoch": 5460} {"train_loss": -26.957014083862305, "global_step": 453244, "epoch": 5460} {"train_loss": -27.104084014892578, "global_step": 453245, "epoch": 5460} {"train_loss": -26.72075843811035, "global_step": 453246, "epoch": 5460} {"train_loss": -26.46742057800293, "global_step": 453247, "epoch": 5460} {"train_loss": -25.872156143188477, "global_step": 453248, "epoch": 5460} {"train_loss": -25.98990821838379, "global_step": 453249, "epoch": 5460} {"train_loss": -26.90357780456543, "global_step": 453250, "epoch": 5460} {"train_loss": -27.0498104095459, "global_step": 453251, "epoch": 5460} {"train_loss": -26.77754020690918, "global_step": 453252, "epoch": 5460} {"train_loss": -27.342187881469727, "global_step": 453253, "epoch": 5460} {"train_loss": -26.964263916015625, "global_step": 453254, "epoch": 5460} {"train_loss": -27.1436767578125, "global_step": 453255, "epoch": 5460} {"train_loss": -27.259775161743164, "global_step": 453256, "epoch": 5460} {"train_loss": -27.131616592407227, "global_step": 453257, "epoch": 5460} {"train_loss": -27.00986099243164, "global_step": 453258, "epoch": 5460} {"train_loss": -26.984912872314453, "global_step": 453259, "epoch": 5460} {"train_loss": -27.09730339050293, "global_step": 453260, "epoch": 5460} {"train_loss": -27.025732040405273, "global_step": 453261, "epoch": 5460} {"train_loss": -26.733093445559582, "global_step": 453262, "epoch": 5460, "val_loss": 6701810.0} {"train_loss": -23.517663955688477, "global_step": 453263, "epoch": 5461} {"train_loss": -24.367002487182617, "global_step": 453264, "epoch": 5461} {"train_loss": -25.060317993164062, "global_step": 453265, "epoch": 5461} {"train_loss": -24.783588409423828, "global_step": 453266, "epoch": 5461} {"train_loss": -25.5364933013916, "global_step": 453267, "epoch": 5461} {"train_loss": -24.73439598083496, "global_step": 453268, "epoch": 5461} {"train_loss": -25.50847053527832, "global_step": 453269, "epoch": 5461} {"train_loss": -25.613174438476562, "global_step": 453270, "epoch": 5461} {"train_loss": -25.258304595947266, "global_step": 453271, "epoch": 5461} {"train_loss": -26.204792022705078, "global_step": 453272, "epoch": 5461} {"train_loss": -25.747303009033203, "global_step": 453273, "epoch": 5461} {"train_loss": -25.4596004486084, "global_step": 453274, "epoch": 5461} {"train_loss": -25.896203994750977, "global_step": 453275, "epoch": 5461} {"train_loss": -26.0900821685791, "global_step": 453276, "epoch": 5461} {"train_loss": -26.278472900390625, "global_step": 453277, "epoch": 5461} {"train_loss": -26.1671142578125, "global_step": 453278, "epoch": 5461} {"train_loss": -25.683515548706055, "global_step": 453279, "epoch": 5461} {"train_loss": -26.232879638671875, "global_step": 453280, "epoch": 5461} {"train_loss": -26.4642276763916, "global_step": 453281, "epoch": 5461} {"train_loss": -26.63661003112793, "global_step": 453282, "epoch": 5461} {"train_loss": -26.406848907470703, "global_step": 453283, "epoch": 5461} {"train_loss": -26.38515281677246, "global_step": 453284, "epoch": 5461} {"train_loss": -26.443994522094727, "global_step": 453285, "epoch": 5461} {"train_loss": -26.53975486755371, "global_step": 453286, "epoch": 5461} {"train_loss": -26.58253288269043, "global_step": 453287, "epoch": 5461} {"train_loss": -26.601160049438477, "global_step": 453288, "epoch": 5461} {"train_loss": -26.673053741455078, "global_step": 453289, "epoch": 5461} {"train_loss": -27.19061279296875, "global_step": 453290, "epoch": 5461} {"train_loss": -26.927602767944336, "global_step": 453291, "epoch": 5461} {"train_loss": -27.091825485229492, "global_step": 453292, "epoch": 5461} {"train_loss": -26.696990966796875, "global_step": 453293, "epoch": 5461} {"train_loss": -26.79837417602539, "global_step": 453294, "epoch": 5461} {"train_loss": -26.753034591674805, "global_step": 453295, "epoch": 5461} {"train_loss": -26.909021377563477, "global_step": 453296, "epoch": 5461} {"train_loss": -26.663314819335938, "global_step": 453297, "epoch": 5461} {"train_loss": -26.766626358032227, "global_step": 453298, "epoch": 5461} {"train_loss": -26.77278709411621, "global_step": 453299, "epoch": 5461} {"train_loss": -27.11285972595215, "global_step": 453300, "epoch": 5461} {"train_loss": -27.0948486328125, "global_step": 453301, "epoch": 5461} {"train_loss": -26.894824981689453, "global_step": 453302, "epoch": 5461} {"train_loss": -26.753894805908203, "global_step": 453303, "epoch": 5461} {"train_loss": -27.19940757751465, "global_step": 453304, "epoch": 5461} {"train_loss": -27.01044273376465, "global_step": 453305, "epoch": 5461} {"train_loss": -26.801923751831055, "global_step": 453306, "epoch": 5461} {"train_loss": -27.182775497436523, "global_step": 453307, "epoch": 5461} {"train_loss": -27.00992202758789, "global_step": 453308, "epoch": 5461} {"train_loss": -27.202392578125, "global_step": 453309, "epoch": 5461} {"train_loss": -26.73902702331543, "global_step": 453310, "epoch": 5461} {"train_loss": -26.871124267578125, "global_step": 453311, "epoch": 5461} {"train_loss": -27.17131996154785, "global_step": 453312, "epoch": 5461} {"train_loss": -27.0188045501709, "global_step": 453313, "epoch": 5461} {"train_loss": -26.723779678344727, "global_step": 453314, "epoch": 5461} {"train_loss": -27.1922550201416, "global_step": 453315, "epoch": 5461} {"train_loss": -26.820356369018555, "global_step": 453316, "epoch": 5461} {"train_loss": -27.078372955322266, "global_step": 453317, "epoch": 5461} {"train_loss": -26.572656631469727, "global_step": 453318, "epoch": 5461} {"train_loss": -27.0279541015625, "global_step": 453319, "epoch": 5461} {"train_loss": -26.943832397460938, "global_step": 453320, "epoch": 5461} {"train_loss": -27.35672950744629, "global_step": 453321, "epoch": 5461} {"train_loss": -26.751855850219727, "global_step": 453322, "epoch": 5461} {"train_loss": -26.894210815429688, "global_step": 453323, "epoch": 5461} {"train_loss": -26.982614517211914, "global_step": 453324, "epoch": 5461} {"train_loss": -26.90237808227539, "global_step": 453325, "epoch": 5461} {"train_loss": -27.200525283813477, "global_step": 453326, "epoch": 5461} {"train_loss": -26.56568717956543, "global_step": 453327, "epoch": 5461} {"train_loss": -26.565793991088867, "global_step": 453328, "epoch": 5461} {"train_loss": -27.234567642211914, "global_step": 453329, "epoch": 5461} {"train_loss": -26.135324478149414, "global_step": 453330, "epoch": 5461} {"train_loss": -27.035551071166992, "global_step": 453331, "epoch": 5461} {"train_loss": -26.278324127197266, "global_step": 453332, "epoch": 5461} {"train_loss": -26.594892501831055, "global_step": 453333, "epoch": 5461} {"train_loss": -26.51923179626465, "global_step": 453334, "epoch": 5461} {"train_loss": -26.982145309448242, "global_step": 453335, "epoch": 5461} {"train_loss": -26.925779342651367, "global_step": 453336, "epoch": 5461} {"train_loss": -26.8695068359375, "global_step": 453337, "epoch": 5461} {"train_loss": -26.914148330688477, "global_step": 453338, "epoch": 5461} {"train_loss": -26.93683433532715, "global_step": 453339, "epoch": 5461} {"train_loss": -26.89200210571289, "global_step": 453340, "epoch": 5461} {"train_loss": -27.114294052124023, "global_step": 453341, "epoch": 5461} {"train_loss": -26.85100746154785, "global_step": 453342, "epoch": 5461} {"train_loss": -27.120849609375, "global_step": 453343, "epoch": 5461} {"train_loss": -27.2410831451416, "global_step": 453344, "epoch": 5461} {"train_loss": -26.56943716485816, "global_step": 453345, "epoch": 5461, "val_loss": 6692150.5} {"train_loss": -27.094207763671875, "global_step": 453346, "epoch": 5462} {"train_loss": -26.793867111206055, "global_step": 453347, "epoch": 5462} {"train_loss": -27.012317657470703, "global_step": 453348, "epoch": 5462} {"train_loss": -26.834930419921875, "global_step": 453349, "epoch": 5462} {"train_loss": -26.633508682250977, "global_step": 453350, "epoch": 5462} {"train_loss": -26.81385612487793, "global_step": 453351, "epoch": 5462} {"train_loss": -27.02263832092285, "global_step": 453352, "epoch": 5462} {"train_loss": -26.915119171142578, "global_step": 453353, "epoch": 5462} {"train_loss": -26.733734130859375, "global_step": 453354, "epoch": 5462} {"train_loss": -26.931604385375977, "global_step": 453355, "epoch": 5462} {"train_loss": -27.085142135620117, "global_step": 453356, "epoch": 5462} {"train_loss": -27.04477882385254, "global_step": 453357, "epoch": 5462} {"train_loss": -27.259918212890625, "global_step": 453358, "epoch": 5462} {"train_loss": -26.687408447265625, "global_step": 453359, "epoch": 5462} {"train_loss": -27.1405029296875, "global_step": 453360, "epoch": 5462} {"train_loss": -26.683942794799805, "global_step": 453361, "epoch": 5462} {"train_loss": -27.22112464904785, "global_step": 453362, "epoch": 5462} {"train_loss": -26.871448516845703, "global_step": 453363, "epoch": 5462} {"train_loss": -26.876754760742188, "global_step": 453364, "epoch": 5462} {"train_loss": -27.330724716186523, "global_step": 453365, "epoch": 5462} {"train_loss": -27.1030216217041, "global_step": 453366, "epoch": 5462} {"train_loss": -26.945728302001953, "global_step": 453367, "epoch": 5462} {"train_loss": -27.223438262939453, "global_step": 453368, "epoch": 5462} {"train_loss": -27.04543113708496, "global_step": 453369, "epoch": 5462} {"train_loss": -27.014179229736328, "global_step": 453370, "epoch": 5462} {"train_loss": -26.863651275634766, "global_step": 453371, "epoch": 5462} {"train_loss": -27.18186378479004, "global_step": 453372, "epoch": 5462} {"train_loss": -27.164899826049805, "global_step": 453373, "epoch": 5462} {"train_loss": -27.00141716003418, "global_step": 453374, "epoch": 5462} {"train_loss": -27.346866607666016, "global_step": 453375, "epoch": 5462} {"train_loss": -27.05091667175293, "global_step": 453376, "epoch": 5462} {"train_loss": -27.13094139099121, "global_step": 453377, "epoch": 5462} {"train_loss": -27.104150772094727, "global_step": 453378, "epoch": 5462} {"train_loss": -27.35247802734375, "global_step": 453379, "epoch": 5462} {"train_loss": -27.100528717041016, "global_step": 453380, "epoch": 5462} {"train_loss": -27.621503829956055, "global_step": 453381, "epoch": 5462} {"train_loss": -27.19234275817871, "global_step": 453382, "epoch": 5462} {"train_loss": -27.143741607666016, "global_step": 453383, "epoch": 5462} {"train_loss": -27.27186393737793, "global_step": 453384, "epoch": 5462} {"train_loss": -27.290136337280273, "global_step": 453385, "epoch": 5462} {"train_loss": -27.30683708190918, "global_step": 453386, "epoch": 5462} {"train_loss": -27.25480079650879, "global_step": 453387, "epoch": 5462} {"train_loss": -27.48078727722168, "global_step": 453388, "epoch": 5462} {"train_loss": -26.912500381469727, "global_step": 453389, "epoch": 5462} {"train_loss": -27.188831329345703, "global_step": 453390, "epoch": 5462} {"train_loss": -27.144277572631836, "global_step": 453391, "epoch": 5462} {"train_loss": -27.03993797302246, "global_step": 453392, "epoch": 5462} {"train_loss": -27.0189151763916, "global_step": 453393, "epoch": 5462} {"train_loss": -27.27032470703125, "global_step": 453394, "epoch": 5462} {"train_loss": -27.066925048828125, "global_step": 453395, "epoch": 5462} {"train_loss": -26.586200714111328, "global_step": 453396, "epoch": 5462} {"train_loss": -26.682727813720703, "global_step": 453397, "epoch": 5462} {"train_loss": -27.045684814453125, "global_step": 453398, "epoch": 5462} {"train_loss": -27.372915267944336, "global_step": 453399, "epoch": 5462} {"train_loss": -26.75591468811035, "global_step": 453400, "epoch": 5462} {"train_loss": -27.22307777404785, "global_step": 453401, "epoch": 5462} {"train_loss": -27.082548141479492, "global_step": 453402, "epoch": 5462} {"train_loss": -26.975229263305664, "global_step": 453403, "epoch": 5462} {"train_loss": -27.108081817626953, "global_step": 453404, "epoch": 5462} {"train_loss": -27.044326782226562, "global_step": 453405, "epoch": 5462} {"train_loss": -26.932037353515625, "global_step": 453406, "epoch": 5462} {"train_loss": -27.221206665039062, "global_step": 453407, "epoch": 5462} {"train_loss": -26.457569122314453, "global_step": 453408, "epoch": 5462} {"train_loss": -26.700429916381836, "global_step": 453409, "epoch": 5462} {"train_loss": -26.780858993530273, "global_step": 453410, "epoch": 5462} {"train_loss": -27.125934600830078, "global_step": 453411, "epoch": 5462} {"train_loss": -26.932987213134766, "global_step": 453412, "epoch": 5462} {"train_loss": -26.60931396484375, "global_step": 453413, "epoch": 5462} {"train_loss": -26.949697494506836, "global_step": 453414, "epoch": 5462} {"train_loss": -27.339950561523438, "global_step": 453415, "epoch": 5462} {"train_loss": -26.981281280517578, "global_step": 453416, "epoch": 5462} {"train_loss": -27.164356231689453, "global_step": 453417, "epoch": 5462} {"train_loss": -26.77858543395996, "global_step": 453418, "epoch": 5462} {"train_loss": -26.6890811920166, "global_step": 453419, "epoch": 5462} {"train_loss": -27.35297203063965, "global_step": 453420, "epoch": 5462} {"train_loss": -26.903900146484375, "global_step": 453421, "epoch": 5462} {"train_loss": -27.04532241821289, "global_step": 453422, "epoch": 5462} {"train_loss": -27.396686553955078, "global_step": 453423, "epoch": 5462} {"train_loss": -27.471654891967773, "global_step": 453424, "epoch": 5462} {"train_loss": -27.198827743530273, "global_step": 453425, "epoch": 5462} {"train_loss": -27.084875106811523, "global_step": 453426, "epoch": 5462} {"train_loss": -27.311716079711914, "global_step": 453427, "epoch": 5462} {"train_loss": -27.056145886340772, "global_step": 453428, "epoch": 5462, "val_loss": 6618836.0} {"train_loss": -26.32407569885254, "global_step": 453429, "epoch": 5463} {"train_loss": -26.006803512573242, "global_step": 453430, "epoch": 5463} {"train_loss": -25.663421630859375, "global_step": 453431, "epoch": 5463} {"train_loss": -25.80512809753418, "global_step": 453432, "epoch": 5463} {"train_loss": -26.381372451782227, "global_step": 453433, "epoch": 5463} {"train_loss": -26.07374382019043, "global_step": 453434, "epoch": 5463} {"train_loss": -26.8858585357666, "global_step": 453435, "epoch": 5463} {"train_loss": -26.59590721130371, "global_step": 453436, "epoch": 5463} {"train_loss": -26.510669708251953, "global_step": 453437, "epoch": 5463} {"train_loss": -26.529157638549805, "global_step": 453438, "epoch": 5463} {"train_loss": -26.315717697143555, "global_step": 453439, "epoch": 5463} {"train_loss": -26.5313777923584, "global_step": 453440, "epoch": 5463} {"train_loss": -26.324399948120117, "global_step": 453441, "epoch": 5463} {"train_loss": -26.872772216796875, "global_step": 453442, "epoch": 5463} {"train_loss": -26.660907745361328, "global_step": 453443, "epoch": 5463} {"train_loss": -26.296051025390625, "global_step": 453444, "epoch": 5463} {"train_loss": -26.514541625976562, "global_step": 453445, "epoch": 5463} {"train_loss": -26.785049438476562, "global_step": 453446, "epoch": 5463} {"train_loss": -26.778610229492188, "global_step": 453447, "epoch": 5463} {"train_loss": -26.44292640686035, "global_step": 453448, "epoch": 5463} {"train_loss": -26.773496627807617, "global_step": 453449, "epoch": 5463} {"train_loss": -26.947357177734375, "global_step": 453450, "epoch": 5463} {"train_loss": -26.89565086364746, "global_step": 453451, "epoch": 5463} {"train_loss": -26.89247703552246, "global_step": 453452, "epoch": 5463} {"train_loss": -27.145349502563477, "global_step": 453453, "epoch": 5463} {"train_loss": -27.197717666625977, "global_step": 453454, "epoch": 5463} {"train_loss": -27.21272087097168, "global_step": 453455, "epoch": 5463} {"train_loss": -26.887521743774414, "global_step": 453456, "epoch": 5463} {"train_loss": -27.00676918029785, "global_step": 453457, "epoch": 5463} {"train_loss": -27.185821533203125, "global_step": 453458, "epoch": 5463} {"train_loss": -26.768712997436523, "global_step": 453459, "epoch": 5463} {"train_loss": -27.22817039489746, "global_step": 453460, "epoch": 5463} {"train_loss": -26.946386337280273, "global_step": 453461, "epoch": 5463} {"train_loss": -27.118698120117188, "global_step": 453462, "epoch": 5463} {"train_loss": -27.053363800048828, "global_step": 453463, "epoch": 5463} {"train_loss": -26.978973388671875, "global_step": 453464, "epoch": 5463} {"train_loss": -27.5882568359375, "global_step": 453465, "epoch": 5463} {"train_loss": -26.8115177154541, "global_step": 453466, "epoch": 5463} {"train_loss": -26.848974227905273, "global_step": 453467, "epoch": 5463} {"train_loss": -26.950164794921875, "global_step": 453468, "epoch": 5463} {"train_loss": -26.712757110595703, "global_step": 453469, "epoch": 5463} {"train_loss": -26.78118324279785, "global_step": 453470, "epoch": 5463} {"train_loss": -26.683216094970703, "global_step": 453471, "epoch": 5463} {"train_loss": -26.627216339111328, "global_step": 453472, "epoch": 5463} {"train_loss": -26.965686798095703, "global_step": 453473, "epoch": 5463} {"train_loss": -27.148534774780273, "global_step": 453474, "epoch": 5463} {"train_loss": -27.161666870117188, "global_step": 453475, "epoch": 5463} {"train_loss": -27.165088653564453, "global_step": 453476, "epoch": 5463} {"train_loss": -26.8726863861084, "global_step": 453477, "epoch": 5463} {"train_loss": -27.060245513916016, "global_step": 453478, "epoch": 5463} {"train_loss": -27.25044822692871, "global_step": 453479, "epoch": 5463} {"train_loss": -27.324615478515625, "global_step": 453480, "epoch": 5463} {"train_loss": -26.886173248291016, "global_step": 453481, "epoch": 5463} {"train_loss": -27.03897476196289, "global_step": 453482, "epoch": 5463} {"train_loss": -27.179126739501953, "global_step": 453483, "epoch": 5463} {"train_loss": -26.722150802612305, "global_step": 453484, "epoch": 5463} {"train_loss": -27.358509063720703, "global_step": 453485, "epoch": 5463} {"train_loss": -27.28557777404785, "global_step": 453486, "epoch": 5463} {"train_loss": -27.286706924438477, "global_step": 453487, "epoch": 5463} {"train_loss": -26.92896842956543, "global_step": 453488, "epoch": 5463} {"train_loss": -27.22224998474121, "global_step": 453489, "epoch": 5463} {"train_loss": -26.757665634155273, "global_step": 453490, "epoch": 5463} {"train_loss": -27.297544479370117, "global_step": 453491, "epoch": 5463} {"train_loss": -27.10088539123535, "global_step": 453492, "epoch": 5463} {"train_loss": -27.1213436126709, "global_step": 453493, "epoch": 5463} {"train_loss": -27.336389541625977, "global_step": 453494, "epoch": 5463} {"train_loss": -27.430282592773438, "global_step": 453495, "epoch": 5463} {"train_loss": -26.79827880859375, "global_step": 453496, "epoch": 5463} {"train_loss": -27.2672061920166, "global_step": 453497, "epoch": 5463} {"train_loss": -27.09391212463379, "global_step": 453498, "epoch": 5463} {"train_loss": -27.369409561157227, "global_step": 453499, "epoch": 5463} {"train_loss": -27.49114990234375, "global_step": 453500, "epoch": 5463} {"train_loss": -27.230504989624023, "global_step": 453501, "epoch": 5463} {"train_loss": -27.0277099609375, "global_step": 453502, "epoch": 5463} {"train_loss": -26.537668228149414, "global_step": 453503, "epoch": 5463} {"train_loss": -27.069135665893555, "global_step": 453504, "epoch": 5463} {"train_loss": -26.971765518188477, "global_step": 453505, "epoch": 5463} {"train_loss": -27.426227569580078, "global_step": 453506, "epoch": 5463} {"train_loss": -27.276676177978516, "global_step": 453507, "epoch": 5463} {"train_loss": -27.44611930847168, "global_step": 453508, "epoch": 5463} {"train_loss": -27.090478897094727, "global_step": 453509, "epoch": 5463} {"train_loss": -27.064855575561523, "global_step": 453510, "epoch": 5463} {"train_loss": -26.910793442323982, "global_step": 453511, "epoch": 5463, "val_loss": 6698804.0} {"train_loss": -26.851856231689453, "global_step": 453512, "epoch": 5464} {"train_loss": -26.778583526611328, "global_step": 453513, "epoch": 5464} {"train_loss": -26.749130249023438, "global_step": 453514, "epoch": 5464} {"train_loss": -27.053876876831055, "global_step": 453515, "epoch": 5464} {"train_loss": -26.77791404724121, "global_step": 453516, "epoch": 5464} {"train_loss": -27.11908531188965, "global_step": 453517, "epoch": 5464} {"train_loss": -26.771499633789062, "global_step": 453518, "epoch": 5464} {"train_loss": -26.87652015686035, "global_step": 453519, "epoch": 5464} {"train_loss": -27.357898712158203, "global_step": 453520, "epoch": 5464} {"train_loss": -27.415037155151367, "global_step": 453521, "epoch": 5464} {"train_loss": -26.696643829345703, "global_step": 453522, "epoch": 5464} {"train_loss": -27.002582550048828, "global_step": 453523, "epoch": 5464} {"train_loss": -27.369543075561523, "global_step": 453524, "epoch": 5464} {"train_loss": -26.598600387573242, "global_step": 453525, "epoch": 5464} {"train_loss": -26.906614303588867, "global_step": 453526, "epoch": 5464} {"train_loss": -27.011520385742188, "global_step": 453527, "epoch": 5464} {"train_loss": -27.25005531311035, "global_step": 453528, "epoch": 5464} {"train_loss": -26.79620933532715, "global_step": 453529, "epoch": 5464} {"train_loss": -27.443317413330078, "global_step": 453530, "epoch": 5464} {"train_loss": -27.24871826171875, "global_step": 453531, "epoch": 5464} {"train_loss": -27.212448120117188, "global_step": 453532, "epoch": 5464} {"train_loss": -26.99736976623535, "global_step": 453533, "epoch": 5464} {"train_loss": -27.1022891998291, "global_step": 453534, "epoch": 5464} {"train_loss": -26.991437911987305, "global_step": 453535, "epoch": 5464} {"train_loss": -26.723907470703125, "global_step": 453536, "epoch": 5464} {"train_loss": -26.676828384399414, "global_step": 453537, "epoch": 5464} {"train_loss": -27.069995880126953, "global_step": 453538, "epoch": 5464} {"train_loss": -26.608579635620117, "global_step": 453539, "epoch": 5464} {"train_loss": -26.86858558654785, "global_step": 453540, "epoch": 5464} {"train_loss": -26.999359130859375, "global_step": 453541, "epoch": 5464} {"train_loss": -27.19618034362793, "global_step": 453542, "epoch": 5464} {"train_loss": -26.7033634185791, "global_step": 453543, "epoch": 5464} {"train_loss": -27.058338165283203, "global_step": 453544, "epoch": 5464} {"train_loss": -26.652179718017578, "global_step": 453545, "epoch": 5464} {"train_loss": -27.1466064453125, "global_step": 453546, "epoch": 5464} {"train_loss": -26.627073287963867, "global_step": 453547, "epoch": 5464} {"train_loss": -26.5816593170166, "global_step": 453548, "epoch": 5464} {"train_loss": -26.444660186767578, "global_step": 453549, "epoch": 5464} {"train_loss": -27.26656150817871, "global_step": 453550, "epoch": 5464} {"train_loss": -27.078596115112305, "global_step": 453551, "epoch": 5464} {"train_loss": -26.71728515625, "global_step": 453552, "epoch": 5464} {"train_loss": -26.864538192749023, "global_step": 453553, "epoch": 5464} {"train_loss": -27.310590744018555, "global_step": 453554, "epoch": 5464} {"train_loss": -27.266651153564453, "global_step": 453555, "epoch": 5464} {"train_loss": -26.753087997436523, "global_step": 453556, "epoch": 5464} {"train_loss": -26.9390811920166, "global_step": 453557, "epoch": 5464} {"train_loss": -27.114797592163086, "global_step": 453558, "epoch": 5464} {"train_loss": -26.646936416625977, "global_step": 453559, "epoch": 5464} {"train_loss": -27.2756290435791, "global_step": 453560, "epoch": 5464} {"train_loss": -27.101652145385742, "global_step": 453561, "epoch": 5464} {"train_loss": -27.096649169921875, "global_step": 453562, "epoch": 5464} {"train_loss": -27.011316299438477, "global_step": 453563, "epoch": 5464} {"train_loss": -27.24708366394043, "global_step": 453564, "epoch": 5464} {"train_loss": -26.635150909423828, "global_step": 453565, "epoch": 5464} {"train_loss": -27.591922760009766, "global_step": 453566, "epoch": 5464} {"train_loss": -27.514118194580078, "global_step": 453567, "epoch": 5464} {"train_loss": -27.052845001220703, "global_step": 453568, "epoch": 5464} {"train_loss": -26.98078727722168, "global_step": 453569, "epoch": 5464} {"train_loss": -27.00921630859375, "global_step": 453570, "epoch": 5464} {"train_loss": -27.350549697875977, "global_step": 453571, "epoch": 5464} {"train_loss": -27.050458908081055, "global_step": 453572, "epoch": 5464} {"train_loss": -27.22902488708496, "global_step": 453573, "epoch": 5464} {"train_loss": -27.455982208251953, "global_step": 453574, "epoch": 5464} {"train_loss": -26.927997589111328, "global_step": 453575, "epoch": 5464} {"train_loss": -27.06331443786621, "global_step": 453576, "epoch": 5464} {"train_loss": -27.018878936767578, "global_step": 453577, "epoch": 5464} {"train_loss": -27.012853622436523, "global_step": 453578, "epoch": 5464} {"train_loss": -27.174833297729492, "global_step": 453579, "epoch": 5464} {"train_loss": -27.005613327026367, "global_step": 453580, "epoch": 5464} {"train_loss": -27.329065322875977, "global_step": 453581, "epoch": 5464} {"train_loss": -26.903486251831055, "global_step": 453582, "epoch": 5464} {"train_loss": -27.07254409790039, "global_step": 453583, "epoch": 5464} {"train_loss": -27.055402755737305, "global_step": 453584, "epoch": 5464} {"train_loss": -26.725818634033203, "global_step": 453585, "epoch": 5464} {"train_loss": -26.93975830078125, "global_step": 453586, "epoch": 5464} {"train_loss": -26.86414909362793, "global_step": 453587, "epoch": 5464} {"train_loss": -27.22198486328125, "global_step": 453588, "epoch": 5464} {"train_loss": -27.22743034362793, "global_step": 453589, "epoch": 5464} {"train_loss": -27.051288604736328, "global_step": 453590, "epoch": 5464} {"train_loss": -27.316131591796875, "global_step": 453591, "epoch": 5464} {"train_loss": -27.20127296447754, "global_step": 453592, "epoch": 5464} {"train_loss": -27.024280548095703, "global_step": 453593, "epoch": 5464} {"train_loss": -27.005220849829985, "global_step": 453594, "epoch": 5464, "val_loss": 6723742.0} {"train_loss": -26.564315795898438, "global_step": 453595, "epoch": 5465} {"train_loss": -26.912872314453125, "global_step": 453596, "epoch": 5465} {"train_loss": -26.87693214416504, "global_step": 453597, "epoch": 5465} {"train_loss": -26.816965103149414, "global_step": 453598, "epoch": 5465} {"train_loss": -26.707448959350586, "global_step": 453599, "epoch": 5465} {"train_loss": -27.04072380065918, "global_step": 453600, "epoch": 5465} {"train_loss": -26.871551513671875, "global_step": 453601, "epoch": 5465} {"train_loss": -26.818174362182617, "global_step": 453602, "epoch": 5465} {"train_loss": -26.7613468170166, "global_step": 453603, "epoch": 5465} {"train_loss": -26.94272804260254, "global_step": 453604, "epoch": 5465} {"train_loss": -26.935644149780273, "global_step": 453605, "epoch": 5465} {"train_loss": -27.12346839904785, "global_step": 453606, "epoch": 5465} {"train_loss": -26.69339942932129, "global_step": 453607, "epoch": 5465} {"train_loss": -27.037464141845703, "global_step": 453608, "epoch": 5465} {"train_loss": -27.016271591186523, "global_step": 453609, "epoch": 5465} {"train_loss": -26.996732711791992, "global_step": 453610, "epoch": 5465} {"train_loss": -26.835514068603516, "global_step": 453611, "epoch": 5465} {"train_loss": -26.653106689453125, "global_step": 453612, "epoch": 5465} {"train_loss": -26.986255645751953, "global_step": 453613, "epoch": 5465} {"train_loss": -26.688339233398438, "global_step": 453614, "epoch": 5465} {"train_loss": -27.234851837158203, "global_step": 453615, "epoch": 5465} {"train_loss": -26.948450088500977, "global_step": 453616, "epoch": 5465} {"train_loss": -26.90732765197754, "global_step": 453617, "epoch": 5465} {"train_loss": -27.30091667175293, "global_step": 453618, "epoch": 5465} {"train_loss": -27.227502822875977, "global_step": 453619, "epoch": 5465} {"train_loss": -27.189395904541016, "global_step": 453620, "epoch": 5465} {"train_loss": -27.079605102539062, "global_step": 453621, "epoch": 5465} {"train_loss": -26.31028175354004, "global_step": 453622, "epoch": 5465} {"train_loss": -27.02312660217285, "global_step": 453623, "epoch": 5465} {"train_loss": -27.12312889099121, "global_step": 453624, "epoch": 5465} {"train_loss": -27.133405685424805, "global_step": 453625, "epoch": 5465} {"train_loss": -27.1588134765625, "global_step": 453626, "epoch": 5465} {"train_loss": -26.97548484802246, "global_step": 453627, "epoch": 5465} {"train_loss": -26.758405685424805, "global_step": 453628, "epoch": 5465} {"train_loss": -27.02658462524414, "global_step": 453629, "epoch": 5465} {"train_loss": -27.41324806213379, "global_step": 453630, "epoch": 5465} {"train_loss": -26.866321563720703, "global_step": 453631, "epoch": 5465} {"train_loss": -26.851083755493164, "global_step": 453632, "epoch": 5465} {"train_loss": -27.28873062133789, "global_step": 453633, "epoch": 5465} {"train_loss": -27.2773380279541, "global_step": 453634, "epoch": 5465} {"train_loss": -26.9244441986084, "global_step": 453635, "epoch": 5465} {"train_loss": -26.57490348815918, "global_step": 453636, "epoch": 5465} {"train_loss": -27.09244155883789, "global_step": 453637, "epoch": 5465} {"train_loss": -26.61465835571289, "global_step": 453638, "epoch": 5465} {"train_loss": -27.21767234802246, "global_step": 453639, "epoch": 5465} {"train_loss": -27.12725257873535, "global_step": 453640, "epoch": 5465} {"train_loss": -26.879724502563477, "global_step": 453641, "epoch": 5465} {"train_loss": -27.05743408203125, "global_step": 453642, "epoch": 5465} {"train_loss": -27.27020835876465, "global_step": 453643, "epoch": 5465} {"train_loss": -26.878437042236328, "global_step": 453644, "epoch": 5465} {"train_loss": -27.217992782592773, "global_step": 453645, "epoch": 5465} {"train_loss": -26.905181884765625, "global_step": 453646, "epoch": 5465} {"train_loss": -27.139440536499023, "global_step": 453647, "epoch": 5465} {"train_loss": -27.36444664001465, "global_step": 453648, "epoch": 5465} {"train_loss": -26.624128341674805, "global_step": 453649, "epoch": 5465} {"train_loss": -27.037235260009766, "global_step": 453650, "epoch": 5465} {"train_loss": -26.954755783081055, "global_step": 453651, "epoch": 5465} {"train_loss": -27.038232803344727, "global_step": 453652, "epoch": 5465} {"train_loss": -27.042768478393555, "global_step": 453653, "epoch": 5465} {"train_loss": -27.07264518737793, "global_step": 453654, "epoch": 5465} {"train_loss": -26.93778419494629, "global_step": 453655, "epoch": 5465} {"train_loss": -27.17717933654785, "global_step": 453656, "epoch": 5465} {"train_loss": -27.398162841796875, "global_step": 453657, "epoch": 5465} {"train_loss": -26.8796443939209, "global_step": 453658, "epoch": 5465} {"train_loss": -26.746795654296875, "global_step": 453659, "epoch": 5465} {"train_loss": -26.5992431640625, "global_step": 453660, "epoch": 5465} {"train_loss": -26.87868309020996, "global_step": 453661, "epoch": 5465} {"train_loss": -27.16788673400879, "global_step": 453662, "epoch": 5465} {"train_loss": -26.90701675415039, "global_step": 453663, "epoch": 5465} {"train_loss": -26.662017822265625, "global_step": 453664, "epoch": 5465} {"train_loss": -27.146560668945312, "global_step": 453665, "epoch": 5465} {"train_loss": -27.305410385131836, "global_step": 453666, "epoch": 5465} {"train_loss": -27.258026123046875, "global_step": 453667, "epoch": 5465} {"train_loss": -27.05014991760254, "global_step": 453668, "epoch": 5465} {"train_loss": -27.0050048828125, "global_step": 453669, "epoch": 5465} {"train_loss": -27.24806022644043, "global_step": 453670, "epoch": 5465} {"train_loss": -26.308795928955078, "global_step": 453671, "epoch": 5465} {"train_loss": -26.99152946472168, "global_step": 453672, "epoch": 5465} {"train_loss": -26.85416030883789, "global_step": 453673, "epoch": 5465} {"train_loss": -27.17827796936035, "global_step": 453674, "epoch": 5465} {"train_loss": -27.084186553955078, "global_step": 453675, "epoch": 5465} {"train_loss": -26.615097045898438, "global_step": 453676, "epoch": 5465} {"train_loss": -26.989141119531837, "global_step": 453677, "epoch": 5465, "val_loss": 6673626.0} {"train_loss": -26.15150260925293, "global_step": 453678, "epoch": 5466} {"train_loss": -26.899368286132812, "global_step": 453679, "epoch": 5466} {"train_loss": -26.232404708862305, "global_step": 453680, "epoch": 5466} {"train_loss": -26.48981285095215, "global_step": 453681, "epoch": 5466} {"train_loss": -25.86847496032715, "global_step": 453682, "epoch": 5466} {"train_loss": -26.088788986206055, "global_step": 453683, "epoch": 5466} {"train_loss": -26.527734756469727, "global_step": 453684, "epoch": 5466} {"train_loss": -26.3026180267334, "global_step": 453685, "epoch": 5466} {"train_loss": -26.1649112701416, "global_step": 453686, "epoch": 5466} {"train_loss": -26.5001163482666, "global_step": 453687, "epoch": 5466} {"train_loss": -26.608488082885742, "global_step": 453688, "epoch": 5466} {"train_loss": -26.388168334960938, "global_step": 453689, "epoch": 5466} {"train_loss": -26.549524307250977, "global_step": 453690, "epoch": 5466} {"train_loss": -26.616979598999023, "global_step": 453691, "epoch": 5466} {"train_loss": -26.370569229125977, "global_step": 453692, "epoch": 5466} {"train_loss": -26.734607696533203, "global_step": 453693, "epoch": 5466} {"train_loss": -26.8757381439209, "global_step": 453694, "epoch": 5466} {"train_loss": -27.118078231811523, "global_step": 453695, "epoch": 5466} {"train_loss": -26.837982177734375, "global_step": 453696, "epoch": 5466} {"train_loss": -26.799047470092773, "global_step": 453697, "epoch": 5466} {"train_loss": -26.80430030822754, "global_step": 453698, "epoch": 5466} {"train_loss": -26.762338638305664, "global_step": 453699, "epoch": 5466} {"train_loss": -26.970199584960938, "global_step": 453700, "epoch": 5466} {"train_loss": -27.007715225219727, "global_step": 453701, "epoch": 5466} {"train_loss": -27.149240493774414, "global_step": 453702, "epoch": 5466} {"train_loss": -26.832935333251953, "global_step": 453703, "epoch": 5466} {"train_loss": -26.969593048095703, "global_step": 453704, "epoch": 5466} {"train_loss": -27.03290367126465, "global_step": 453705, "epoch": 5466} {"train_loss": -26.941064834594727, "global_step": 453706, "epoch": 5466} {"train_loss": -27.299728393554688, "global_step": 453707, "epoch": 5466} {"train_loss": -26.85259437561035, "global_step": 453708, "epoch": 5466} {"train_loss": -27.117584228515625, "global_step": 453709, "epoch": 5466} {"train_loss": -27.00396156311035, "global_step": 453710, "epoch": 5466} {"train_loss": -26.7683162689209, "global_step": 453711, "epoch": 5466} {"train_loss": -26.992202758789062, "global_step": 453712, "epoch": 5466} {"train_loss": -27.181928634643555, "global_step": 453713, "epoch": 5466} {"train_loss": -27.151233673095703, "global_step": 453714, "epoch": 5466} {"train_loss": -26.803546905517578, "global_step": 453715, "epoch": 5466} {"train_loss": -27.133527755737305, "global_step": 453716, "epoch": 5466} {"train_loss": -27.359455108642578, "global_step": 453717, "epoch": 5466} {"train_loss": -27.09517478942871, "global_step": 453718, "epoch": 5466} {"train_loss": -27.25189781188965, "global_step": 453719, "epoch": 5466} {"train_loss": -27.095489501953125, "global_step": 453720, "epoch": 5466} {"train_loss": -27.0983943939209, "global_step": 453721, "epoch": 5466} {"train_loss": -26.893512725830078, "global_step": 453722, "epoch": 5466} {"train_loss": -27.10483741760254, "global_step": 453723, "epoch": 5466} {"train_loss": -27.236087799072266, "global_step": 453724, "epoch": 5466} {"train_loss": -27.2135009765625, "global_step": 453725, "epoch": 5466} {"train_loss": -26.397785186767578, "global_step": 453726, "epoch": 5466} {"train_loss": -26.815656661987305, "global_step": 453727, "epoch": 5466} {"train_loss": -27.45269203186035, "global_step": 453728, "epoch": 5466} {"train_loss": -26.86871910095215, "global_step": 453729, "epoch": 5466} {"train_loss": -26.28647232055664, "global_step": 453730, "epoch": 5466} {"train_loss": -26.873945236206055, "global_step": 453731, "epoch": 5466} {"train_loss": -26.879621505737305, "global_step": 453732, "epoch": 5466} {"train_loss": -27.023853302001953, "global_step": 453733, "epoch": 5466} {"train_loss": -26.909626007080078, "global_step": 453734, "epoch": 5466} {"train_loss": -26.41151237487793, "global_step": 453735, "epoch": 5466} {"train_loss": -26.980133056640625, "global_step": 453736, "epoch": 5466} {"train_loss": -26.753503799438477, "global_step": 453737, "epoch": 5466} {"train_loss": -26.811695098876953, "global_step": 453738, "epoch": 5466} {"train_loss": -27.3509464263916, "global_step": 453739, "epoch": 5466} {"train_loss": -26.986942291259766, "global_step": 453740, "epoch": 5466} {"train_loss": -27.221921920776367, "global_step": 453741, "epoch": 5466} {"train_loss": -26.81892204284668, "global_step": 453742, "epoch": 5466} {"train_loss": -27.290164947509766, "global_step": 453743, "epoch": 5466} {"train_loss": -27.18603515625, "global_step": 453744, "epoch": 5466} {"train_loss": -27.413110733032227, "global_step": 453745, "epoch": 5466} {"train_loss": -27.044559478759766, "global_step": 453746, "epoch": 5466} {"train_loss": -27.223175048828125, "global_step": 453747, "epoch": 5466} {"train_loss": -27.10426902770996, "global_step": 453748, "epoch": 5466} {"train_loss": -27.018041610717773, "global_step": 453749, "epoch": 5466} {"train_loss": -27.003437042236328, "global_step": 453750, "epoch": 5466} {"train_loss": -27.182889938354492, "global_step": 453751, "epoch": 5466} {"train_loss": -27.09104347229004, "global_step": 453752, "epoch": 5466} {"train_loss": -27.0743408203125, "global_step": 453753, "epoch": 5466} {"train_loss": -27.384140014648438, "global_step": 453754, "epoch": 5466} {"train_loss": -27.518091201782227, "global_step": 453755, "epoch": 5466} {"train_loss": -27.43379783630371, "global_step": 453756, "epoch": 5466} {"train_loss": -27.187274932861328, "global_step": 453757, "epoch": 5466} {"train_loss": -27.17669677734375, "global_step": 453758, "epoch": 5466} {"train_loss": -27.005578994750977, "global_step": 453759, "epoch": 5466} {"train_loss": -26.905276861535498, "global_step": 453760, "epoch": 5466, "val_loss": 6646265.0} {"train_loss": -26.730268478393555, "global_step": 453761, "epoch": 5467} {"train_loss": -26.647424697875977, "global_step": 453762, "epoch": 5467} {"train_loss": -26.588525772094727, "global_step": 453763, "epoch": 5467} {"train_loss": -26.25721549987793, "global_step": 453764, "epoch": 5467} {"train_loss": -26.708271026611328, "global_step": 453765, "epoch": 5467} {"train_loss": -26.543106079101562, "global_step": 453766, "epoch": 5467} {"train_loss": -26.458398818969727, "global_step": 453767, "epoch": 5467} {"train_loss": -26.97491455078125, "global_step": 453768, "epoch": 5467} {"train_loss": -26.60760498046875, "global_step": 453769, "epoch": 5467} {"train_loss": -26.622589111328125, "global_step": 453770, "epoch": 5467} {"train_loss": -27.090951919555664, "global_step": 453771, "epoch": 5467} {"train_loss": -26.994220733642578, "global_step": 453772, "epoch": 5467} {"train_loss": -26.711322784423828, "global_step": 453773, "epoch": 5467} {"train_loss": -26.973407745361328, "global_step": 453774, "epoch": 5467} {"train_loss": -26.836286544799805, "global_step": 453775, "epoch": 5467} {"train_loss": -27.150800704956055, "global_step": 453776, "epoch": 5467} {"train_loss": -26.96186637878418, "global_step": 453777, "epoch": 5467} {"train_loss": -26.969852447509766, "global_step": 453778, "epoch": 5467} {"train_loss": -27.195987701416016, "global_step": 453779, "epoch": 5467} {"train_loss": -26.879491806030273, "global_step": 453780, "epoch": 5467} {"train_loss": -26.430511474609375, "global_step": 453781, "epoch": 5467} {"train_loss": -26.643630981445312, "global_step": 453782, "epoch": 5467} {"train_loss": -27.177600860595703, "global_step": 453783, "epoch": 5467} {"train_loss": -26.6697998046875, "global_step": 453784, "epoch": 5467} {"train_loss": -26.5559139251709, "global_step": 453785, "epoch": 5467} {"train_loss": -26.800952911376953, "global_step": 453786, "epoch": 5467} {"train_loss": -26.935338973999023, "global_step": 453787, "epoch": 5467} {"train_loss": -26.86054039001465, "global_step": 453788, "epoch": 5467} {"train_loss": -27.176706314086914, "global_step": 453789, "epoch": 5467} {"train_loss": -27.0571346282959, "global_step": 453790, "epoch": 5467} {"train_loss": -26.996198654174805, "global_step": 453791, "epoch": 5467} {"train_loss": -26.75516128540039, "global_step": 453792, "epoch": 5467} {"train_loss": -26.805133819580078, "global_step": 453793, "epoch": 5467} {"train_loss": -27.14417839050293, "global_step": 453794, "epoch": 5467} {"train_loss": -26.971710205078125, "global_step": 453795, "epoch": 5467} {"train_loss": -26.968000411987305, "global_step": 453796, "epoch": 5467} {"train_loss": -26.864856719970703, "global_step": 453797, "epoch": 5467} {"train_loss": -27.281524658203125, "global_step": 453798, "epoch": 5467} {"train_loss": -27.357763290405273, "global_step": 453799, "epoch": 5467} {"train_loss": -27.239233016967773, "global_step": 453800, "epoch": 5467} {"train_loss": -27.365100860595703, "global_step": 453801, "epoch": 5467} {"train_loss": -27.06686782836914, "global_step": 453802, "epoch": 5467} {"train_loss": -27.21356773376465, "global_step": 453803, "epoch": 5467} {"train_loss": -27.17951774597168, "global_step": 453804, "epoch": 5467} {"train_loss": -26.922460556030273, "global_step": 453805, "epoch": 5467} {"train_loss": -26.799854278564453, "global_step": 453806, "epoch": 5467} {"train_loss": -27.063634872436523, "global_step": 453807, "epoch": 5467} {"train_loss": -26.973865509033203, "global_step": 453808, "epoch": 5467} {"train_loss": -27.028573989868164, "global_step": 453809, "epoch": 5467} {"train_loss": -27.301450729370117, "global_step": 453810, "epoch": 5467} {"train_loss": -27.16387367248535, "global_step": 453811, "epoch": 5467} {"train_loss": -27.057113647460938, "global_step": 453812, "epoch": 5467} {"train_loss": -27.21822166442871, "global_step": 453813, "epoch": 5467} {"train_loss": -27.1434268951416, "global_step": 453814, "epoch": 5467} {"train_loss": -27.010541915893555, "global_step": 453815, "epoch": 5467} {"train_loss": -27.311437606811523, "global_step": 453816, "epoch": 5467} {"train_loss": -26.85102653503418, "global_step": 453817, "epoch": 5467} {"train_loss": -26.869190216064453, "global_step": 453818, "epoch": 5467} {"train_loss": -26.30253028869629, "global_step": 453819, "epoch": 5467} {"train_loss": -26.643171310424805, "global_step": 453820, "epoch": 5467} {"train_loss": -27.086414337158203, "global_step": 453821, "epoch": 5467} {"train_loss": -26.840253829956055, "global_step": 453822, "epoch": 5467} {"train_loss": -26.934558868408203, "global_step": 453823, "epoch": 5467} {"train_loss": -26.89935302734375, "global_step": 453824, "epoch": 5467} {"train_loss": -26.72559928894043, "global_step": 453825, "epoch": 5467} {"train_loss": -27.10320472717285, "global_step": 453826, "epoch": 5467} {"train_loss": -27.381439208984375, "global_step": 453827, "epoch": 5467} {"train_loss": -26.61195182800293, "global_step": 453828, "epoch": 5467} {"train_loss": -26.8347225189209, "global_step": 453829, "epoch": 5467} {"train_loss": -26.933679580688477, "global_step": 453830, "epoch": 5467} {"train_loss": -27.00649070739746, "global_step": 453831, "epoch": 5467} {"train_loss": -27.053028106689453, "global_step": 453832, "epoch": 5467} {"train_loss": -26.835901260375977, "global_step": 453833, "epoch": 5467} {"train_loss": -27.233198165893555, "global_step": 453834, "epoch": 5467} {"train_loss": -26.898923873901367, "global_step": 453835, "epoch": 5467} {"train_loss": -27.286664962768555, "global_step": 453836, "epoch": 5467} {"train_loss": -27.100675582885742, "global_step": 453837, "epoch": 5467} {"train_loss": -27.325246810913086, "global_step": 453838, "epoch": 5467} {"train_loss": -26.7729549407959, "global_step": 453839, "epoch": 5467} {"train_loss": -27.23381996154785, "global_step": 453840, "epoch": 5467} {"train_loss": -27.29794692993164, "global_step": 453841, "epoch": 5467} {"train_loss": -27.18878173828125, "global_step": 453842, "epoch": 5467} {"train_loss": -26.942192514258696, "global_step": 453843, "epoch": 5467, "val_loss": 6638622.0} {"train_loss": -26.557575225830078, "global_step": 453844, "epoch": 5468} {"train_loss": -26.534116744995117, "global_step": 453845, "epoch": 5468} {"train_loss": -26.939401626586914, "global_step": 453846, "epoch": 5468} {"train_loss": -26.730615615844727, "global_step": 453847, "epoch": 5468} {"train_loss": -26.465482711791992, "global_step": 453848, "epoch": 5468} {"train_loss": -26.50531578063965, "global_step": 453849, "epoch": 5468} {"train_loss": -26.737836837768555, "global_step": 453850, "epoch": 5468} {"train_loss": -26.969745635986328, "global_step": 453851, "epoch": 5468} {"train_loss": -26.62764549255371, "global_step": 453852, "epoch": 5468} {"train_loss": -26.685216903686523, "global_step": 453853, "epoch": 5468} {"train_loss": -26.3565616607666, "global_step": 453854, "epoch": 5468} {"train_loss": -26.9149112701416, "global_step": 453855, "epoch": 5468} {"train_loss": -26.50713539123535, "global_step": 453856, "epoch": 5468} {"train_loss": -27.143543243408203, "global_step": 453857, "epoch": 5468} {"train_loss": -26.958303451538086, "global_step": 453858, "epoch": 5468} {"train_loss": -26.87461280822754, "global_step": 453859, "epoch": 5468} {"train_loss": -26.803287506103516, "global_step": 453860, "epoch": 5468} {"train_loss": -26.915510177612305, "global_step": 453861, "epoch": 5468} {"train_loss": -26.72456932067871, "global_step": 453862, "epoch": 5468} {"train_loss": -26.767683029174805, "global_step": 453863, "epoch": 5468} {"train_loss": -26.888996124267578, "global_step": 453864, "epoch": 5468} {"train_loss": -26.99995231628418, "global_step": 453865, "epoch": 5468} {"train_loss": -26.938932418823242, "global_step": 453866, "epoch": 5468} {"train_loss": -27.077869415283203, "global_step": 453867, "epoch": 5468} {"train_loss": -27.213171005249023, "global_step": 453868, "epoch": 5468} {"train_loss": -26.8134822845459, "global_step": 453869, "epoch": 5468} {"train_loss": -27.005598068237305, "global_step": 453870, "epoch": 5468} {"train_loss": -27.319894790649414, "global_step": 453871, "epoch": 5468} {"train_loss": -27.123275756835938, "global_step": 453872, "epoch": 5468} {"train_loss": -26.778289794921875, "global_step": 453873, "epoch": 5468} {"train_loss": -27.15789222717285, "global_step": 453874, "epoch": 5468} {"train_loss": -27.094263076782227, "global_step": 453875, "epoch": 5468} {"train_loss": -26.84293556213379, "global_step": 453876, "epoch": 5468} {"train_loss": -27.41420555114746, "global_step": 453877, "epoch": 5468} {"train_loss": -27.359994888305664, "global_step": 453878, "epoch": 5468} {"train_loss": -27.270238876342773, "global_step": 453879, "epoch": 5468} {"train_loss": -26.992218017578125, "global_step": 453880, "epoch": 5468} {"train_loss": -26.93232536315918, "global_step": 453881, "epoch": 5468} {"train_loss": -27.06778335571289, "global_step": 453882, "epoch": 5468} {"train_loss": -26.778528213500977, "global_step": 453883, "epoch": 5468} {"train_loss": -27.00896644592285, "global_step": 453884, "epoch": 5468} {"train_loss": -27.1314754486084, "global_step": 453885, "epoch": 5468} {"train_loss": -26.888141632080078, "global_step": 453886, "epoch": 5468} {"train_loss": -27.329757690429688, "global_step": 453887, "epoch": 5468} {"train_loss": -27.305700302124023, "global_step": 453888, "epoch": 5468} {"train_loss": -27.13212013244629, "global_step": 453889, "epoch": 5468} {"train_loss": -27.132526397705078, "global_step": 453890, "epoch": 5468} {"train_loss": -27.222320556640625, "global_step": 453891, "epoch": 5468} {"train_loss": -26.909460067749023, "global_step": 453892, "epoch": 5468} {"train_loss": -27.146345138549805, "global_step": 453893, "epoch": 5468} {"train_loss": -27.173145294189453, "global_step": 453894, "epoch": 5468} {"train_loss": -27.0502872467041, "global_step": 453895, "epoch": 5468} {"train_loss": -27.189672470092773, "global_step": 453896, "epoch": 5468} {"train_loss": -26.955707550048828, "global_step": 453897, "epoch": 5468} {"train_loss": -27.36041831970215, "global_step": 453898, "epoch": 5468} {"train_loss": -27.0964298248291, "global_step": 453899, "epoch": 5468} {"train_loss": -26.87244987487793, "global_step": 453900, "epoch": 5468} {"train_loss": -27.46723747253418, "global_step": 453901, "epoch": 5468} {"train_loss": -26.71173095703125, "global_step": 453902, "epoch": 5468} {"train_loss": -27.103897094726562, "global_step": 453903, "epoch": 5468} {"train_loss": -26.874069213867188, "global_step": 453904, "epoch": 5468} {"train_loss": -26.479787826538086, "global_step": 453905, "epoch": 5468} {"train_loss": -25.9704532623291, "global_step": 453906, "epoch": 5468} {"train_loss": -25.742712020874023, "global_step": 453907, "epoch": 5468} {"train_loss": -26.059484481811523, "global_step": 453908, "epoch": 5468} {"train_loss": -26.980209350585938, "global_step": 453909, "epoch": 5468} {"train_loss": -26.357269287109375, "global_step": 453910, "epoch": 5468} {"train_loss": -26.642980575561523, "global_step": 453911, "epoch": 5468} {"train_loss": -26.909931182861328, "global_step": 453912, "epoch": 5468} {"train_loss": -26.796920776367188, "global_step": 453913, "epoch": 5468} {"train_loss": -26.542163848876953, "global_step": 453914, "epoch": 5468} {"train_loss": -26.935760498046875, "global_step": 453915, "epoch": 5468} {"train_loss": -26.559782028198242, "global_step": 453916, "epoch": 5468} {"train_loss": -26.529218673706055, "global_step": 453917, "epoch": 5468} {"train_loss": -26.456159591674805, "global_step": 453918, "epoch": 5468} {"train_loss": -26.5050048828125, "global_step": 453919, "epoch": 5468} {"train_loss": -26.613622665405273, "global_step": 453920, "epoch": 5468} {"train_loss": -26.644468307495117, "global_step": 453921, "epoch": 5468} {"train_loss": -26.644556045532227, "global_step": 453922, "epoch": 5468} {"train_loss": -26.958606719970703, "global_step": 453923, "epoch": 5468} {"train_loss": -26.7203311920166, "global_step": 453924, "epoch": 5468} {"train_loss": -26.621780395507812, "global_step": 453925, "epoch": 5468} {"train_loss": -26.868448923869305, "global_step": 453926, "epoch": 5468, "val_loss": 6605152.5} {"train_loss": -26.543420791625977, "global_step": 453927, "epoch": 5469} {"train_loss": -26.055988311767578, "global_step": 453928, "epoch": 5469} {"train_loss": -26.490070343017578, "global_step": 453929, "epoch": 5469} {"train_loss": -26.2213134765625, "global_step": 453930, "epoch": 5469} {"train_loss": -26.46211051940918, "global_step": 453931, "epoch": 5469} {"train_loss": -26.347797393798828, "global_step": 453932, "epoch": 5469} {"train_loss": -26.9024715423584, "global_step": 453933, "epoch": 5469} {"train_loss": -26.564355850219727, "global_step": 453934, "epoch": 5469} {"train_loss": -26.632230758666992, "global_step": 453935, "epoch": 5469} {"train_loss": -27.0913143157959, "global_step": 453936, "epoch": 5469} {"train_loss": -27.201536178588867, "global_step": 453937, "epoch": 5469} {"train_loss": -26.478071212768555, "global_step": 453938, "epoch": 5469} {"train_loss": -26.71333122253418, "global_step": 453939, "epoch": 5469} {"train_loss": -26.829986572265625, "global_step": 453940, "epoch": 5469} {"train_loss": -26.547815322875977, "global_step": 453941, "epoch": 5469} {"train_loss": -27.061445236206055, "global_step": 453942, "epoch": 5469} {"train_loss": -26.719106674194336, "global_step": 453943, "epoch": 5469} {"train_loss": -27.342939376831055, "global_step": 453944, "epoch": 5469} {"train_loss": -27.004980087280273, "global_step": 453945, "epoch": 5469} {"train_loss": -26.913305282592773, "global_step": 453946, "epoch": 5469} {"train_loss": -26.90283203125, "global_step": 453947, "epoch": 5469} {"train_loss": -26.81741714477539, "global_step": 453948, "epoch": 5469} {"train_loss": -26.767621994018555, "global_step": 453949, "epoch": 5469} {"train_loss": -27.137073516845703, "global_step": 453950, "epoch": 5469} {"train_loss": -27.137882232666016, "global_step": 453951, "epoch": 5469} {"train_loss": -27.353271484375, "global_step": 453952, "epoch": 5469} {"train_loss": -27.280658721923828, "global_step": 453953, "epoch": 5469} {"train_loss": -27.027191162109375, "global_step": 453954, "epoch": 5469} {"train_loss": -26.866540908813477, "global_step": 453955, "epoch": 5469} {"train_loss": -27.309045791625977, "global_step": 453956, "epoch": 5469} {"train_loss": -26.72663688659668, "global_step": 453957, "epoch": 5469} {"train_loss": -26.599597930908203, "global_step": 453958, "epoch": 5469} {"train_loss": -27.066452026367188, "global_step": 453959, "epoch": 5469} {"train_loss": -27.15740394592285, "global_step": 453960, "epoch": 5469} {"train_loss": -27.589752197265625, "global_step": 453961, "epoch": 5469} {"train_loss": -27.226764678955078, "global_step": 453962, "epoch": 5469} {"train_loss": -27.169281005859375, "global_step": 453963, "epoch": 5469} {"train_loss": -26.952123641967773, "global_step": 453964, "epoch": 5469} {"train_loss": -27.293354034423828, "global_step": 453965, "epoch": 5469} {"train_loss": -26.648038864135742, "global_step": 453966, "epoch": 5469} {"train_loss": -27.152149200439453, "global_step": 453967, "epoch": 5469} {"train_loss": -27.02007484436035, "global_step": 453968, "epoch": 5469} {"train_loss": -26.965219497680664, "global_step": 453969, "epoch": 5469} {"train_loss": -27.30305290222168, "global_step": 453970, "epoch": 5469} {"train_loss": -27.219518661499023, "global_step": 453971, "epoch": 5469} {"train_loss": -26.93057632446289, "global_step": 453972, "epoch": 5469} {"train_loss": -27.2642765045166, "global_step": 453973, "epoch": 5469} {"train_loss": -27.019025802612305, "global_step": 453974, "epoch": 5469} {"train_loss": -27.663930892944336, "global_step": 453975, "epoch": 5469} {"train_loss": -27.339569091796875, "global_step": 453976, "epoch": 5469} {"train_loss": -26.908979415893555, "global_step": 453977, "epoch": 5469} {"train_loss": -27.11665153503418, "global_step": 453978, "epoch": 5469} {"train_loss": -27.094314575195312, "global_step": 453979, "epoch": 5469} {"train_loss": -27.374027252197266, "global_step": 453980, "epoch": 5469} {"train_loss": -26.95554542541504, "global_step": 453981, "epoch": 5469} {"train_loss": -27.08045768737793, "global_step": 453982, "epoch": 5469} {"train_loss": -27.003026962280273, "global_step": 453983, "epoch": 5469} {"train_loss": -27.23456382751465, "global_step": 453984, "epoch": 5469} {"train_loss": -26.944639205932617, "global_step": 453985, "epoch": 5469} {"train_loss": -27.29119300842285, "global_step": 453986, "epoch": 5469} {"train_loss": -27.12006950378418, "global_step": 453987, "epoch": 5469} {"train_loss": -27.163299560546875, "global_step": 453988, "epoch": 5469} {"train_loss": -27.3939266204834, "global_step": 453989, "epoch": 5469} {"train_loss": -27.19170570373535, "global_step": 453990, "epoch": 5469} {"train_loss": -27.23603630065918, "global_step": 453991, "epoch": 5469} {"train_loss": -27.0046329498291, "global_step": 453992, "epoch": 5469} {"train_loss": -27.064716339111328, "global_step": 453993, "epoch": 5469} {"train_loss": -27.422658920288086, "global_step": 453994, "epoch": 5469} {"train_loss": -27.21785545349121, "global_step": 453995, "epoch": 5469} {"train_loss": -26.894697189331055, "global_step": 453996, "epoch": 5469} {"train_loss": -26.984464645385742, "global_step": 453997, "epoch": 5469} {"train_loss": -26.97464942932129, "global_step": 453998, "epoch": 5469} {"train_loss": -27.35284423828125, "global_step": 453999, "epoch": 5469} {"train_loss": -27.086669921875, "global_step": 454000, "epoch": 5469} {"train_loss": -26.99262046813965, "global_step": 454001, "epoch": 5469} {"train_loss": -26.691558837890625, "global_step": 454002, "epoch": 5469} {"train_loss": -27.323957443237305, "global_step": 454003, "epoch": 5469} {"train_loss": -27.13800048828125, "global_step": 454004, "epoch": 5469} {"train_loss": -27.0654296875, "global_step": 454005, "epoch": 5469} {"train_loss": -27.5611515045166, "global_step": 454006, "epoch": 5469} {"train_loss": -26.950544357299805, "global_step": 454007, "epoch": 5469} {"train_loss": -27.5838680267334, "global_step": 454008, "epoch": 5469} {"train_loss": -27.017043377979693, "global_step": 454009, "epoch": 5469, "val_loss": 6632762.0} {"train_loss": -25.933969497680664, "global_step": 454010, "epoch": 5470} {"train_loss": -26.358144760131836, "global_step": 454011, "epoch": 5470} {"train_loss": -26.11383628845215, "global_step": 454012, "epoch": 5470} {"train_loss": -25.451698303222656, "global_step": 454013, "epoch": 5470} {"train_loss": -25.445926666259766, "global_step": 454014, "epoch": 5470} {"train_loss": -25.676584243774414, "global_step": 454015, "epoch": 5470} {"train_loss": -25.16357421875, "global_step": 454016, "epoch": 5470} {"train_loss": -26.3179988861084, "global_step": 454017, "epoch": 5470} {"train_loss": -26.164981842041016, "global_step": 454018, "epoch": 5470} {"train_loss": -25.852689743041992, "global_step": 454019, "epoch": 5470} {"train_loss": -26.441883087158203, "global_step": 454020, "epoch": 5470} {"train_loss": -26.304513931274414, "global_step": 454021, "epoch": 5470} {"train_loss": -25.685516357421875, "global_step": 454022, "epoch": 5470} {"train_loss": -26.06760597229004, "global_step": 454023, "epoch": 5470} {"train_loss": -26.467023849487305, "global_step": 454024, "epoch": 5470} {"train_loss": -26.11480712890625, "global_step": 454025, "epoch": 5470} {"train_loss": -26.80242347717285, "global_step": 454026, "epoch": 5470} {"train_loss": -26.423242568969727, "global_step": 454027, "epoch": 5470} {"train_loss": -26.39680290222168, "global_step": 454028, "epoch": 5470} {"train_loss": -26.682453155517578, "global_step": 454029, "epoch": 5470} {"train_loss": -26.471038818359375, "global_step": 454030, "epoch": 5470} {"train_loss": -26.41541862487793, "global_step": 454031, "epoch": 5470} {"train_loss": -26.601903915405273, "global_step": 454032, "epoch": 5470} {"train_loss": -26.9417667388916, "global_step": 454033, "epoch": 5470} {"train_loss": -26.906967163085938, "global_step": 454034, "epoch": 5470} {"train_loss": -26.429113388061523, "global_step": 454035, "epoch": 5470} {"train_loss": -26.510595321655273, "global_step": 454036, "epoch": 5470} {"train_loss": -26.915266036987305, "global_step": 454037, "epoch": 5470} {"train_loss": -26.579809188842773, "global_step": 454038, "epoch": 5470} {"train_loss": -26.997055053710938, "global_step": 454039, "epoch": 5470} {"train_loss": -27.0843448638916, "global_step": 454040, "epoch": 5470} {"train_loss": -26.71876335144043, "global_step": 454041, "epoch": 5470} {"train_loss": -26.709943771362305, "global_step": 454042, "epoch": 5470} {"train_loss": -26.995502471923828, "global_step": 454043, "epoch": 5470} {"train_loss": -26.652524948120117, "global_step": 454044, "epoch": 5470} {"train_loss": -26.854171752929688, "global_step": 454045, "epoch": 5470} {"train_loss": -26.812164306640625, "global_step": 454046, "epoch": 5470} {"train_loss": -26.71124839782715, "global_step": 454047, "epoch": 5470} {"train_loss": -26.650686264038086, "global_step": 454048, "epoch": 5470} {"train_loss": -27.206268310546875, "global_step": 454049, "epoch": 5470} {"train_loss": -26.904321670532227, "global_step": 454050, "epoch": 5470} {"train_loss": -26.673358917236328, "global_step": 454051, "epoch": 5470} {"train_loss": -26.888715744018555, "global_step": 454052, "epoch": 5470} {"train_loss": -27.136199951171875, "global_step": 454053, "epoch": 5470} {"train_loss": -26.910400390625, "global_step": 454054, "epoch": 5470} {"train_loss": -27.0860652923584, "global_step": 454055, "epoch": 5470} {"train_loss": -26.764066696166992, "global_step": 454056, "epoch": 5470} {"train_loss": -27.100805282592773, "global_step": 454057, "epoch": 5470} {"train_loss": -26.992496490478516, "global_step": 454058, "epoch": 5470} {"train_loss": -27.056640625, "global_step": 454059, "epoch": 5470} {"train_loss": -27.50200843811035, "global_step": 454060, "epoch": 5470} {"train_loss": -27.50380516052246, "global_step": 454061, "epoch": 5470} {"train_loss": -27.149320602416992, "global_step": 454062, "epoch": 5470} {"train_loss": -27.319915771484375, "global_step": 454063, "epoch": 5470} {"train_loss": -27.039249420166016, "global_step": 454064, "epoch": 5470} {"train_loss": -27.23084831237793, "global_step": 454065, "epoch": 5470} {"train_loss": -27.458602905273438, "global_step": 454066, "epoch": 5470} {"train_loss": -27.3463077545166, "global_step": 454067, "epoch": 5470} {"train_loss": -27.344446182250977, "global_step": 454068, "epoch": 5470} {"train_loss": -27.541690826416016, "global_step": 454069, "epoch": 5470} {"train_loss": -27.17084312438965, "global_step": 454070, "epoch": 5470} {"train_loss": -27.438501358032227, "global_step": 454071, "epoch": 5470} {"train_loss": -27.292505264282227, "global_step": 454072, "epoch": 5470} {"train_loss": -27.075244903564453, "global_step": 454073, "epoch": 5470} {"train_loss": -27.503131866455078, "global_step": 454074, "epoch": 5470} {"train_loss": -26.97865867614746, "global_step": 454075, "epoch": 5470} {"train_loss": -27.15540885925293, "global_step": 454076, "epoch": 5470} {"train_loss": -27.321508407592773, "global_step": 454077, "epoch": 5470} {"train_loss": -27.272912979125977, "global_step": 454078, "epoch": 5470} {"train_loss": -26.89792823791504, "global_step": 454079, "epoch": 5470} {"train_loss": -27.078937530517578, "global_step": 454080, "epoch": 5470} {"train_loss": -27.0114803314209, "global_step": 454081, "epoch": 5470} {"train_loss": -27.03150749206543, "global_step": 454082, "epoch": 5470} {"train_loss": -27.16399574279785, "global_step": 454083, "epoch": 5470} {"train_loss": -27.125574111938477, "global_step": 454084, "epoch": 5470} {"train_loss": -26.728864669799805, "global_step": 454085, "epoch": 5470} {"train_loss": -26.982526779174805, "global_step": 454086, "epoch": 5470} {"train_loss": -27.080942153930664, "global_step": 454087, "epoch": 5470} {"train_loss": -27.233274459838867, "global_step": 454088, "epoch": 5470} {"train_loss": -26.80353355407715, "global_step": 454089, "epoch": 5470} {"train_loss": -27.024789810180664, "global_step": 454090, "epoch": 5470} {"train_loss": -26.641218185424805, "global_step": 454091, "epoch": 5470} {"train_loss": -26.77914568889572, "global_step": 454092, "epoch": 5470, "val_loss": 6592090.0} {"train_loss": -25.979202270507812, "global_step": 454093, "epoch": 5471} {"train_loss": -26.073776245117188, "global_step": 454094, "epoch": 5471} {"train_loss": -26.230789184570312, "global_step": 454095, "epoch": 5471} {"train_loss": -26.462921142578125, "global_step": 454096, "epoch": 5471} {"train_loss": -26.37821388244629, "global_step": 454097, "epoch": 5471} {"train_loss": -26.472965240478516, "global_step": 454098, "epoch": 5471} {"train_loss": -26.20289421081543, "global_step": 454099, "epoch": 5471} {"train_loss": -26.52198600769043, "global_step": 454100, "epoch": 5471} {"train_loss": -26.382001876831055, "global_step": 454101, "epoch": 5471} {"train_loss": -26.671722412109375, "global_step": 454102, "epoch": 5471} {"train_loss": -26.263702392578125, "global_step": 454103, "epoch": 5471} {"train_loss": -26.59309959411621, "global_step": 454104, "epoch": 5471} {"train_loss": -26.48318862915039, "global_step": 454105, "epoch": 5471} {"train_loss": -26.61038589477539, "global_step": 454106, "epoch": 5471} {"train_loss": -26.77741813659668, "global_step": 454107, "epoch": 5471} {"train_loss": -26.600439071655273, "global_step": 454108, "epoch": 5471} {"train_loss": -26.43706703186035, "global_step": 454109, "epoch": 5471} {"train_loss": -26.6505126953125, "global_step": 454110, "epoch": 5471} {"train_loss": -26.88348960876465, "global_step": 454111, "epoch": 5471} {"train_loss": -26.714338302612305, "global_step": 454112, "epoch": 5471} {"train_loss": -26.854114532470703, "global_step": 454113, "epoch": 5471} {"train_loss": -26.707616806030273, "global_step": 454114, "epoch": 5471} {"train_loss": -26.611845016479492, "global_step": 454115, "epoch": 5471} {"train_loss": -26.8684139251709, "global_step": 454116, "epoch": 5471} {"train_loss": -26.8609561920166, "global_step": 454117, "epoch": 5471} {"train_loss": -26.79766845703125, "global_step": 454118, "epoch": 5471} {"train_loss": -26.703596115112305, "global_step": 454119, "epoch": 5471} {"train_loss": -26.785917282104492, "global_step": 454120, "epoch": 5471} {"train_loss": -27.2022705078125, "global_step": 454121, "epoch": 5471} {"train_loss": -26.872150421142578, "global_step": 454122, "epoch": 5471} {"train_loss": -26.79591178894043, "global_step": 454123, "epoch": 5471} {"train_loss": -26.926305770874023, "global_step": 454124, "epoch": 5471} {"train_loss": -27.334646224975586, "global_step": 454125, "epoch": 5471} {"train_loss": -27.18733024597168, "global_step": 454126, "epoch": 5471} {"train_loss": -27.118467330932617, "global_step": 454127, "epoch": 5471} {"train_loss": -27.05897331237793, "global_step": 454128, "epoch": 5471} {"train_loss": -27.306188583374023, "global_step": 454129, "epoch": 5471} {"train_loss": -27.061979293823242, "global_step": 454130, "epoch": 5471} {"train_loss": -27.481847763061523, "global_step": 454131, "epoch": 5471} {"train_loss": -27.43903160095215, "global_step": 454132, "epoch": 5471} {"train_loss": -27.392196655273438, "global_step": 454133, "epoch": 5471} {"train_loss": -27.12575340270996, "global_step": 454134, "epoch": 5471} {"train_loss": -27.510730743408203, "global_step": 454135, "epoch": 5471} {"train_loss": -27.213830947875977, "global_step": 454136, "epoch": 5471} {"train_loss": -27.1728458404541, "global_step": 454137, "epoch": 5471} {"train_loss": -27.369909286499023, "global_step": 454138, "epoch": 5471} {"train_loss": -27.093677520751953, "global_step": 454139, "epoch": 5471} {"train_loss": -27.059741973876953, "global_step": 454140, "epoch": 5471} {"train_loss": -27.078495025634766, "global_step": 454141, "epoch": 5471} {"train_loss": -27.0582275390625, "global_step": 454142, "epoch": 5471} {"train_loss": -26.85065269470215, "global_step": 454143, "epoch": 5471} {"train_loss": -25.61907386779785, "global_step": 454144, "epoch": 5471} {"train_loss": -25.18717384338379, "global_step": 454145, "epoch": 5471} {"train_loss": -25.60615348815918, "global_step": 454146, "epoch": 5471} {"train_loss": -26.2661190032959, "global_step": 454147, "epoch": 5471} {"train_loss": -26.878808975219727, "global_step": 454148, "epoch": 5471} {"train_loss": -26.4606990814209, "global_step": 454149, "epoch": 5471} {"train_loss": -26.234716415405273, "global_step": 454150, "epoch": 5471} {"train_loss": -26.588855743408203, "global_step": 454151, "epoch": 5471} {"train_loss": -26.270523071289062, "global_step": 454152, "epoch": 5471} {"train_loss": -26.97955894470215, "global_step": 454153, "epoch": 5471} {"train_loss": -26.380451202392578, "global_step": 454154, "epoch": 5471} {"train_loss": -26.676847457885742, "global_step": 454155, "epoch": 5471} {"train_loss": -26.850357055664062, "global_step": 454156, "epoch": 5471} {"train_loss": -26.53289222717285, "global_step": 454157, "epoch": 5471} {"train_loss": -27.0098934173584, "global_step": 454158, "epoch": 5471} {"train_loss": -26.781177520751953, "global_step": 454159, "epoch": 5471} {"train_loss": -26.705463409423828, "global_step": 454160, "epoch": 5471} {"train_loss": -26.607196807861328, "global_step": 454161, "epoch": 5471} {"train_loss": -26.514081954956055, "global_step": 454162, "epoch": 5471} {"train_loss": -26.939233779907227, "global_step": 454163, "epoch": 5471} {"train_loss": -27.305908203125, "global_step": 454164, "epoch": 5471} {"train_loss": -26.94459342956543, "global_step": 454165, "epoch": 5471} {"train_loss": -26.80877113342285, "global_step": 454166, "epoch": 5471} {"train_loss": -27.264719009399414, "global_step": 454167, "epoch": 5471} {"train_loss": -26.772214889526367, "global_step": 454168, "epoch": 5471} {"train_loss": -26.779739379882812, "global_step": 454169, "epoch": 5471} {"train_loss": -26.889448165893555, "global_step": 454170, "epoch": 5471} {"train_loss": -26.814573287963867, "global_step": 454171, "epoch": 5471} {"train_loss": -27.032611846923828, "global_step": 454172, "epoch": 5471} {"train_loss": -27.379392623901367, "global_step": 454173, "epoch": 5471} {"train_loss": -27.21339225769043, "global_step": 454174, "epoch": 5471} {"train_loss": -26.768256359789746, "global_step": 454175, "epoch": 5471, "val_loss": 6565347.0} {"train_loss": -26.90692138671875, "global_step": 454176, "epoch": 5472} {"train_loss": -27.31986427307129, "global_step": 454177, "epoch": 5472} {"train_loss": -26.674640655517578, "global_step": 454178, "epoch": 5472} {"train_loss": -27.382831573486328, "global_step": 454179, "epoch": 5472} {"train_loss": -26.78338623046875, "global_step": 454180, "epoch": 5472} {"train_loss": -26.963958740234375, "global_step": 454181, "epoch": 5472} {"train_loss": -27.084257125854492, "global_step": 454182, "epoch": 5472} {"train_loss": -27.22355079650879, "global_step": 454183, "epoch": 5472} {"train_loss": -26.5156192779541, "global_step": 454184, "epoch": 5472} {"train_loss": -27.326446533203125, "global_step": 454185, "epoch": 5472} {"train_loss": -26.966894149780273, "global_step": 454186, "epoch": 5472} {"train_loss": -27.061019897460938, "global_step": 454187, "epoch": 5472} {"train_loss": -27.060216903686523, "global_step": 454188, "epoch": 5472} {"train_loss": -27.1352481842041, "global_step": 454189, "epoch": 5472} {"train_loss": -26.925220489501953, "global_step": 454190, "epoch": 5472} {"train_loss": -27.05093765258789, "global_step": 454191, "epoch": 5472} {"train_loss": -26.956989288330078, "global_step": 454192, "epoch": 5472} {"train_loss": -27.153417587280273, "global_step": 454193, "epoch": 5472} {"train_loss": -26.921493530273438, "global_step": 454194, "epoch": 5472} {"train_loss": -27.109800338745117, "global_step": 454195, "epoch": 5472} {"train_loss": -27.07565689086914, "global_step": 454196, "epoch": 5472} {"train_loss": -26.924551010131836, "global_step": 454197, "epoch": 5472} {"train_loss": -27.02482032775879, "global_step": 454198, "epoch": 5472} {"train_loss": -27.159948348999023, "global_step": 454199, "epoch": 5472} {"train_loss": -27.287656784057617, "global_step": 454200, "epoch": 5472} {"train_loss": -26.93397331237793, "global_step": 454201, "epoch": 5472} {"train_loss": -27.442358016967773, "global_step": 454202, "epoch": 5472} {"train_loss": -27.32502555847168, "global_step": 454203, "epoch": 5472} {"train_loss": -27.381988525390625, "global_step": 454204, "epoch": 5472} {"train_loss": -27.38262367248535, "global_step": 454205, "epoch": 5472} {"train_loss": -27.4741153717041, "global_step": 454206, "epoch": 5472} {"train_loss": -27.319381713867188, "global_step": 454207, "epoch": 5472} {"train_loss": -27.458234786987305, "global_step": 454208, "epoch": 5472} {"train_loss": -26.91733169555664, "global_step": 454209, "epoch": 5472} {"train_loss": -27.22149085998535, "global_step": 454210, "epoch": 5472} {"train_loss": -27.058197021484375, "global_step": 454211, "epoch": 5472} {"train_loss": -27.178924560546875, "global_step": 454212, "epoch": 5472} {"train_loss": -26.74237632751465, "global_step": 454213, "epoch": 5472} {"train_loss": -27.28669548034668, "global_step": 454214, "epoch": 5472} {"train_loss": -27.081762313842773, "global_step": 454215, "epoch": 5472} {"train_loss": -26.8964786529541, "global_step": 454216, "epoch": 5472} {"train_loss": -26.891347885131836, "global_step": 454217, "epoch": 5472} {"train_loss": -27.025487899780273, "global_step": 454218, "epoch": 5472} {"train_loss": -27.562225341796875, "global_step": 454219, "epoch": 5472} {"train_loss": -26.78525733947754, "global_step": 454220, "epoch": 5472} {"train_loss": -27.239429473876953, "global_step": 454221, "epoch": 5472} {"train_loss": -26.983219146728516, "global_step": 454222, "epoch": 5472} {"train_loss": -27.267187118530273, "global_step": 454223, "epoch": 5472} {"train_loss": -26.957983016967773, "global_step": 454224, "epoch": 5472} {"train_loss": -26.649097442626953, "global_step": 454225, "epoch": 5472} {"train_loss": -27.28712272644043, "global_step": 454226, "epoch": 5472} {"train_loss": -26.990161895751953, "global_step": 454227, "epoch": 5472} {"train_loss": -26.91663932800293, "global_step": 454228, "epoch": 5472} {"train_loss": -26.632556915283203, "global_step": 454229, "epoch": 5472} {"train_loss": -26.975788116455078, "global_step": 454230, "epoch": 5472} {"train_loss": -27.061344146728516, "global_step": 454231, "epoch": 5472} {"train_loss": -26.32929039001465, "global_step": 454232, "epoch": 5472} {"train_loss": -27.1927433013916, "global_step": 454233, "epoch": 5472} {"train_loss": -27.119626998901367, "global_step": 454234, "epoch": 5472} {"train_loss": -27.043439865112305, "global_step": 454235, "epoch": 5472} {"train_loss": -26.956756591796875, "global_step": 454236, "epoch": 5472} {"train_loss": -27.17803955078125, "global_step": 454237, "epoch": 5472} {"train_loss": -27.35392189025879, "global_step": 454238, "epoch": 5472} {"train_loss": -26.9383544921875, "global_step": 454239, "epoch": 5472} {"train_loss": -26.940237045288086, "global_step": 454240, "epoch": 5472} {"train_loss": -26.66152000427246, "global_step": 454241, "epoch": 5472} {"train_loss": -27.05692481994629, "global_step": 454242, "epoch": 5472} {"train_loss": -26.878034591674805, "global_step": 454243, "epoch": 5472} {"train_loss": -26.83216667175293, "global_step": 454244, "epoch": 5472} {"train_loss": -27.070804595947266, "global_step": 454245, "epoch": 5472} {"train_loss": -27.33277702331543, "global_step": 454246, "epoch": 5472} {"train_loss": -26.7443904876709, "global_step": 454247, "epoch": 5472} {"train_loss": -27.200254440307617, "global_step": 454248, "epoch": 5472} {"train_loss": -27.463394165039062, "global_step": 454249, "epoch": 5472} {"train_loss": -27.22254753112793, "global_step": 454250, "epoch": 5472} {"train_loss": -27.541015625, "global_step": 454251, "epoch": 5472} {"train_loss": -26.558837890625, "global_step": 454252, "epoch": 5472} {"train_loss": -27.31117057800293, "global_step": 454253, "epoch": 5472} {"train_loss": -27.16962242126465, "global_step": 454254, "epoch": 5472} {"train_loss": -27.340600967407227, "global_step": 454255, "epoch": 5472} {"train_loss": -27.376562118530273, "global_step": 454256, "epoch": 5472} {"train_loss": -27.35565185546875, "global_step": 454257, "epoch": 5472} {"train_loss": -27.088891799191394, "global_step": 454258, "epoch": 5472, "val_loss": 6546531.0} {"train_loss": -27.494688034057617, "global_step": 454259, "epoch": 5473} {"train_loss": -26.830392837524414, "global_step": 454260, "epoch": 5473} {"train_loss": -26.805500030517578, "global_step": 454261, "epoch": 5473} {"train_loss": -26.84111976623535, "global_step": 454262, "epoch": 5473} {"train_loss": -26.649139404296875, "global_step": 454263, "epoch": 5473} {"train_loss": -27.084863662719727, "global_step": 454264, "epoch": 5473} {"train_loss": -26.827930450439453, "global_step": 454265, "epoch": 5473} {"train_loss": -26.51239585876465, "global_step": 454266, "epoch": 5473} {"train_loss": -26.83902931213379, "global_step": 454267, "epoch": 5473} {"train_loss": -26.658872604370117, "global_step": 454268, "epoch": 5473} {"train_loss": -26.364704132080078, "global_step": 454269, "epoch": 5473} {"train_loss": -26.776742935180664, "global_step": 454270, "epoch": 5473} {"train_loss": -26.91924476623535, "global_step": 454271, "epoch": 5473} {"train_loss": -26.692590713500977, "global_step": 454272, "epoch": 5473} {"train_loss": -27.16572380065918, "global_step": 454273, "epoch": 5473} {"train_loss": -26.92890739440918, "global_step": 454274, "epoch": 5473} {"train_loss": -27.212024688720703, "global_step": 454275, "epoch": 5473} {"train_loss": -26.866901397705078, "global_step": 454276, "epoch": 5473} {"train_loss": -26.775480270385742, "global_step": 454277, "epoch": 5473} {"train_loss": -26.653345108032227, "global_step": 454278, "epoch": 5473} {"train_loss": -26.879404067993164, "global_step": 454279, "epoch": 5473} {"train_loss": -26.979032516479492, "global_step": 454280, "epoch": 5473} {"train_loss": -26.780309677124023, "global_step": 454281, "epoch": 5473} {"train_loss": -27.163959503173828, "global_step": 454282, "epoch": 5473} {"train_loss": -26.93511962890625, "global_step": 454283, "epoch": 5473} {"train_loss": -27.171789169311523, "global_step": 454284, "epoch": 5473} {"train_loss": -27.042768478393555, "global_step": 454285, "epoch": 5473} {"train_loss": -27.033130645751953, "global_step": 454286, "epoch": 5473} {"train_loss": -27.443958282470703, "global_step": 454287, "epoch": 5473} {"train_loss": -27.204696655273438, "global_step": 454288, "epoch": 5473} {"train_loss": -27.0357608795166, "global_step": 454289, "epoch": 5473} {"train_loss": -26.975357055664062, "global_step": 454290, "epoch": 5473} {"train_loss": -27.28733253479004, "global_step": 454291, "epoch": 5473} {"train_loss": -27.17304801940918, "global_step": 454292, "epoch": 5473} {"train_loss": -27.38204002380371, "global_step": 454293, "epoch": 5473} {"train_loss": -27.005573272705078, "global_step": 454294, "epoch": 5473} {"train_loss": -27.084455490112305, "global_step": 454295, "epoch": 5473} {"train_loss": -27.607288360595703, "global_step": 454296, "epoch": 5473} {"train_loss": -27.16583824157715, "global_step": 454297, "epoch": 5473} {"train_loss": -27.094913482666016, "global_step": 454298, "epoch": 5473} {"train_loss": -27.121564865112305, "global_step": 454299, "epoch": 5473} {"train_loss": -27.184406280517578, "global_step": 454300, "epoch": 5473} {"train_loss": -26.996923446655273, "global_step": 454301, "epoch": 5473} {"train_loss": -27.422758102416992, "global_step": 454302, "epoch": 5473} {"train_loss": -27.080734252929688, "global_step": 454303, "epoch": 5473} {"train_loss": -27.246261596679688, "global_step": 454304, "epoch": 5473} {"train_loss": -27.11456871032715, "global_step": 454305, "epoch": 5473} {"train_loss": -27.27713394165039, "global_step": 454306, "epoch": 5473} {"train_loss": -27.226947784423828, "global_step": 454307, "epoch": 5473} {"train_loss": -27.253049850463867, "global_step": 454308, "epoch": 5473} {"train_loss": -27.150976181030273, "global_step": 454309, "epoch": 5473} {"train_loss": -27.078845977783203, "global_step": 454310, "epoch": 5473} {"train_loss": -27.12830924987793, "global_step": 454311, "epoch": 5473} {"train_loss": -27.157026290893555, "global_step": 454312, "epoch": 5473} {"train_loss": -26.574365615844727, "global_step": 454313, "epoch": 5473} {"train_loss": -26.267688751220703, "global_step": 454314, "epoch": 5473} {"train_loss": -26.651647567749023, "global_step": 454315, "epoch": 5473} {"train_loss": -26.713470458984375, "global_step": 454316, "epoch": 5473} {"train_loss": -26.99104118347168, "global_step": 454317, "epoch": 5473} {"train_loss": -26.649866104125977, "global_step": 454318, "epoch": 5473} {"train_loss": -27.27095603942871, "global_step": 454319, "epoch": 5473} {"train_loss": -27.190778732299805, "global_step": 454320, "epoch": 5473} {"train_loss": -26.952117919921875, "global_step": 454321, "epoch": 5473} {"train_loss": -26.43512535095215, "global_step": 454322, "epoch": 5473} {"train_loss": -26.488815307617188, "global_step": 454323, "epoch": 5473} {"train_loss": -26.674680709838867, "global_step": 454324, "epoch": 5473} {"train_loss": -27.145429611206055, "global_step": 454325, "epoch": 5473} {"train_loss": -26.994977951049805, "global_step": 454326, "epoch": 5473} {"train_loss": -26.962955474853516, "global_step": 454327, "epoch": 5473} {"train_loss": -26.95570182800293, "global_step": 454328, "epoch": 5473} {"train_loss": -27.283893585205078, "global_step": 454329, "epoch": 5473} {"train_loss": -27.368627548217773, "global_step": 454330, "epoch": 5473} {"train_loss": -26.829328536987305, "global_step": 454331, "epoch": 5473} {"train_loss": -27.217208862304688, "global_step": 454332, "epoch": 5473} {"train_loss": -27.35919189453125, "global_step": 454333, "epoch": 5473} {"train_loss": -27.023731231689453, "global_step": 454334, "epoch": 5473} {"train_loss": -27.144062042236328, "global_step": 454335, "epoch": 5473} {"train_loss": -26.767196655273438, "global_step": 454336, "epoch": 5473} {"train_loss": -26.996036529541016, "global_step": 454337, "epoch": 5473} {"train_loss": -26.95440101623535, "global_step": 454338, "epoch": 5473} {"train_loss": -26.90291404724121, "global_step": 454339, "epoch": 5473} {"train_loss": -27.23244285583496, "global_step": 454340, "epoch": 5473} {"train_loss": -27.00521096838526, "global_step": 454341, "epoch": 5473, "val_loss": 6555974.5} {"train_loss": -26.7070369720459, "global_step": 454342, "epoch": 5474} {"train_loss": -26.20943260192871, "global_step": 454343, "epoch": 5474} {"train_loss": -27.088598251342773, "global_step": 454344, "epoch": 5474} {"train_loss": -27.307636260986328, "global_step": 454345, "epoch": 5474} {"train_loss": -26.82757568359375, "global_step": 454346, "epoch": 5474} {"train_loss": -26.976943969726562, "global_step": 454347, "epoch": 5474} {"train_loss": -26.459213256835938, "global_step": 454348, "epoch": 5474} {"train_loss": -27.168081283569336, "global_step": 454349, "epoch": 5474} {"train_loss": -26.824207305908203, "global_step": 454350, "epoch": 5474} {"train_loss": -26.90601921081543, "global_step": 454351, "epoch": 5474} {"train_loss": -26.84174156188965, "global_step": 454352, "epoch": 5474} {"train_loss": -26.826522827148438, "global_step": 454353, "epoch": 5474} {"train_loss": -26.566984176635742, "global_step": 454354, "epoch": 5474} {"train_loss": -26.796140670776367, "global_step": 454355, "epoch": 5474} {"train_loss": -27.02497673034668, "global_step": 454356, "epoch": 5474} {"train_loss": -26.33234214782715, "global_step": 454357, "epoch": 5474} {"train_loss": -26.859222412109375, "global_step": 454358, "epoch": 5474} {"train_loss": -26.52688980102539, "global_step": 454359, "epoch": 5474} {"train_loss": -26.888534545898438, "global_step": 454360, "epoch": 5474} {"train_loss": -26.6387996673584, "global_step": 454361, "epoch": 5474} {"train_loss": -26.843524932861328, "global_step": 454362, "epoch": 5474} {"train_loss": -26.742216110229492, "global_step": 454363, "epoch": 5474} {"train_loss": -26.47553825378418, "global_step": 454364, "epoch": 5474} {"train_loss": -26.913373947143555, "global_step": 454365, "epoch": 5474} {"train_loss": -26.898990631103516, "global_step": 454366, "epoch": 5474} {"train_loss": -26.843219757080078, "global_step": 454367, "epoch": 5474} {"train_loss": -26.76837730407715, "global_step": 454368, "epoch": 5474} {"train_loss": -27.166269302368164, "global_step": 454369, "epoch": 5474} {"train_loss": -26.9609317779541, "global_step": 454370, "epoch": 5474} {"train_loss": -26.767431259155273, "global_step": 454371, "epoch": 5474} {"train_loss": -27.1462345123291, "global_step": 454372, "epoch": 5474} {"train_loss": -27.046422958374023, "global_step": 454373, "epoch": 5474} {"train_loss": -26.834945678710938, "global_step": 454374, "epoch": 5474} {"train_loss": -26.849164962768555, "global_step": 454375, "epoch": 5474} {"train_loss": -26.812332153320312, "global_step": 454376, "epoch": 5474} {"train_loss": -26.961557388305664, "global_step": 454377, "epoch": 5474} {"train_loss": -26.953699111938477, "global_step": 454378, "epoch": 5474} {"train_loss": -27.044824600219727, "global_step": 454379, "epoch": 5474} {"train_loss": -27.087697982788086, "global_step": 454380, "epoch": 5474} {"train_loss": -26.8983097076416, "global_step": 454381, "epoch": 5474} {"train_loss": -27.0970401763916, "global_step": 454382, "epoch": 5474} {"train_loss": -27.094070434570312, "global_step": 454383, "epoch": 5474} {"train_loss": -27.09844970703125, "global_step": 454384, "epoch": 5474} {"train_loss": -26.693029403686523, "global_step": 454385, "epoch": 5474} {"train_loss": -27.19476890563965, "global_step": 454386, "epoch": 5474} {"train_loss": -27.148365020751953, "global_step": 454387, "epoch": 5474} {"train_loss": -27.03974723815918, "global_step": 454388, "epoch": 5474} {"train_loss": -27.261249542236328, "global_step": 454389, "epoch": 5474} {"train_loss": -27.421396255493164, "global_step": 454390, "epoch": 5474} {"train_loss": -27.35112953186035, "global_step": 454391, "epoch": 5474} {"train_loss": -27.27113151550293, "global_step": 454392, "epoch": 5474} {"train_loss": -27.04493522644043, "global_step": 454393, "epoch": 5474} {"train_loss": -26.94061279296875, "global_step": 454394, "epoch": 5474} {"train_loss": -27.184316635131836, "global_step": 454395, "epoch": 5474} {"train_loss": -27.261463165283203, "global_step": 454396, "epoch": 5474} {"train_loss": -26.855152130126953, "global_step": 454397, "epoch": 5474} {"train_loss": -26.402612686157227, "global_step": 454398, "epoch": 5474} {"train_loss": -26.28053092956543, "global_step": 454399, "epoch": 5474} {"train_loss": -26.660200119018555, "global_step": 454400, "epoch": 5474} {"train_loss": -27.06927490234375, "global_step": 454401, "epoch": 5474} {"train_loss": -26.556421279907227, "global_step": 454402, "epoch": 5474} {"train_loss": -26.711530685424805, "global_step": 454403, "epoch": 5474} {"train_loss": -26.711721420288086, "global_step": 454404, "epoch": 5474} {"train_loss": -27.06739616394043, "global_step": 454405, "epoch": 5474} {"train_loss": -26.495452880859375, "global_step": 454406, "epoch": 5474} {"train_loss": -27.179441452026367, "global_step": 454407, "epoch": 5474} {"train_loss": -26.7299747467041, "global_step": 454408, "epoch": 5474} {"train_loss": -26.752599716186523, "global_step": 454409, "epoch": 5474} {"train_loss": -27.04292869567871, "global_step": 454410, "epoch": 5474} {"train_loss": -27.338098526000977, "global_step": 454411, "epoch": 5474} {"train_loss": -27.230789184570312, "global_step": 454412, "epoch": 5474} {"train_loss": -27.24810218811035, "global_step": 454413, "epoch": 5474} {"train_loss": -27.10395622253418, "global_step": 454414, "epoch": 5474} {"train_loss": -26.723438262939453, "global_step": 454415, "epoch": 5474} {"train_loss": -26.608154296875, "global_step": 454416, "epoch": 5474} {"train_loss": -26.796432495117188, "global_step": 454417, "epoch": 5474} {"train_loss": -27.272924423217773, "global_step": 454418, "epoch": 5474} {"train_loss": -26.509723663330078, "global_step": 454419, "epoch": 5474} {"train_loss": -27.00603675842285, "global_step": 454420, "epoch": 5474} {"train_loss": -26.416311264038086, "global_step": 454421, "epoch": 5474} {"train_loss": -27.068750381469727, "global_step": 454422, "epoch": 5474} {"train_loss": -26.693212509155273, "global_step": 454423, "epoch": 5474} {"train_loss": -26.890120724597608, "global_step": 454424, "epoch": 5474, "val_loss": 6503165.0} {"train_loss": -26.370298385620117, "global_step": 454425, "epoch": 5475} {"train_loss": -26.45256996154785, "global_step": 454426, "epoch": 5475} {"train_loss": -26.3155574798584, "global_step": 454427, "epoch": 5475} {"train_loss": -25.937213897705078, "global_step": 454428, "epoch": 5475} {"train_loss": -26.343420028686523, "global_step": 454429, "epoch": 5475} {"train_loss": -26.301095962524414, "global_step": 454430, "epoch": 5475} {"train_loss": -26.887130737304688, "global_step": 454431, "epoch": 5475} {"train_loss": -26.58441162109375, "global_step": 454432, "epoch": 5475} {"train_loss": -26.45930290222168, "global_step": 454433, "epoch": 5475} {"train_loss": -26.538908004760742, "global_step": 454434, "epoch": 5475} {"train_loss": -26.897573471069336, "global_step": 454435, "epoch": 5475} {"train_loss": -26.81048011779785, "global_step": 454436, "epoch": 5475} {"train_loss": -26.84501075744629, "global_step": 454437, "epoch": 5475} {"train_loss": -26.75800895690918, "global_step": 454438, "epoch": 5475} {"train_loss": -26.595300674438477, "global_step": 454439, "epoch": 5475} {"train_loss": -26.731475830078125, "global_step": 454440, "epoch": 5475} {"train_loss": -26.746850967407227, "global_step": 454441, "epoch": 5475} {"train_loss": -26.59869384765625, "global_step": 454442, "epoch": 5475} {"train_loss": -26.991437911987305, "global_step": 454443, "epoch": 5475} {"train_loss": -26.85955238342285, "global_step": 454444, "epoch": 5475} {"train_loss": -26.739221572875977, "global_step": 454445, "epoch": 5475} {"train_loss": -26.85529136657715, "global_step": 454446, "epoch": 5475} {"train_loss": -27.08017921447754, "global_step": 454447, "epoch": 5475} {"train_loss": -27.30167007446289, "global_step": 454448, "epoch": 5475} {"train_loss": -26.845794677734375, "global_step": 454449, "epoch": 5475} {"train_loss": -27.224618911743164, "global_step": 454450, "epoch": 5475} {"train_loss": -27.040090560913086, "global_step": 454451, "epoch": 5475} {"train_loss": -26.715778350830078, "global_step": 454452, "epoch": 5475} {"train_loss": -27.073286056518555, "global_step": 454453, "epoch": 5475} {"train_loss": -26.97877311706543, "global_step": 454454, "epoch": 5475} {"train_loss": -27.0106258392334, "global_step": 454455, "epoch": 5475} {"train_loss": -27.0137996673584, "global_step": 454456, "epoch": 5475} {"train_loss": -26.77875328063965, "global_step": 454457, "epoch": 5475} {"train_loss": -27.079710006713867, "global_step": 454458, "epoch": 5475} {"train_loss": -26.737035751342773, "global_step": 454459, "epoch": 5475} {"train_loss": -27.3067684173584, "global_step": 454460, "epoch": 5475} {"train_loss": -26.986358642578125, "global_step": 454461, "epoch": 5475} {"train_loss": -27.229604721069336, "global_step": 454462, "epoch": 5475} {"train_loss": -27.00431251525879, "global_step": 454463, "epoch": 5475} {"train_loss": -26.908008575439453, "global_step": 454464, "epoch": 5475} {"train_loss": -27.250165939331055, "global_step": 454465, "epoch": 5475} {"train_loss": -27.480802536010742, "global_step": 454466, "epoch": 5475} {"train_loss": -26.866846084594727, "global_step": 454467, "epoch": 5475} {"train_loss": -27.416467666625977, "global_step": 454468, "epoch": 5475} {"train_loss": -27.163745880126953, "global_step": 454469, "epoch": 5475} {"train_loss": -26.98219108581543, "global_step": 454470, "epoch": 5475} {"train_loss": -27.333972930908203, "global_step": 454471, "epoch": 5475} {"train_loss": -27.514448165893555, "global_step": 454472, "epoch": 5475} {"train_loss": -26.954477310180664, "global_step": 454473, "epoch": 5475} {"train_loss": -27.273096084594727, "global_step": 454474, "epoch": 5475} {"train_loss": -27.04994010925293, "global_step": 454475, "epoch": 5475} {"train_loss": -27.028247833251953, "global_step": 454476, "epoch": 5475} {"train_loss": -27.148605346679688, "global_step": 454477, "epoch": 5475} {"train_loss": -26.63913917541504, "global_step": 454478, "epoch": 5475} {"train_loss": -27.131437301635742, "global_step": 454479, "epoch": 5475} {"train_loss": -27.16840171813965, "global_step": 454480, "epoch": 5475} {"train_loss": -27.2818603515625, "global_step": 454481, "epoch": 5475} {"train_loss": -26.926959991455078, "global_step": 454482, "epoch": 5475} {"train_loss": -26.675613403320312, "global_step": 454483, "epoch": 5475} {"train_loss": -26.688827514648438, "global_step": 454484, "epoch": 5475} {"train_loss": -26.800195693969727, "global_step": 454485, "epoch": 5475} {"train_loss": -26.271060943603516, "global_step": 454486, "epoch": 5475} {"train_loss": -24.772499084472656, "global_step": 454487, "epoch": 5475} {"train_loss": -23.83196449279785, "global_step": 454488, "epoch": 5475} {"train_loss": -25.018835067749023, "global_step": 454489, "epoch": 5475} {"train_loss": -26.50103759765625, "global_step": 454490, "epoch": 5475} {"train_loss": -25.889739990234375, "global_step": 454491, "epoch": 5475} {"train_loss": -25.7065372467041, "global_step": 454492, "epoch": 5475} {"train_loss": -26.385364532470703, "global_step": 454493, "epoch": 5475} {"train_loss": -25.916812896728516, "global_step": 454494, "epoch": 5475} {"train_loss": -26.17043113708496, "global_step": 454495, "epoch": 5475} {"train_loss": -26.363279342651367, "global_step": 454496, "epoch": 5475} {"train_loss": -26.482263565063477, "global_step": 454497, "epoch": 5475} {"train_loss": -26.614877700805664, "global_step": 454498, "epoch": 5475} {"train_loss": -26.376174926757812, "global_step": 454499, "epoch": 5475} {"train_loss": -26.473398208618164, "global_step": 454500, "epoch": 5475} {"train_loss": -26.52910804748535, "global_step": 454501, "epoch": 5475} {"train_loss": -26.3305606842041, "global_step": 454502, "epoch": 5475} {"train_loss": -26.661325454711914, "global_step": 454503, "epoch": 5475} {"train_loss": -26.58625602722168, "global_step": 454504, "epoch": 5475} {"train_loss": -26.67119789123535, "global_step": 454505, "epoch": 5475} {"train_loss": -26.7600040435791, "global_step": 454506, "epoch": 5475} {"train_loss": -26.692501803478564, "global_step": 454507, "epoch": 5475, "val_loss": 6709926.5} {"train_loss": -26.069318771362305, "global_step": 454508, "epoch": 5476} {"train_loss": -26.389667510986328, "global_step": 454509, "epoch": 5476} {"train_loss": -26.39753532409668, "global_step": 454510, "epoch": 5476} {"train_loss": -26.684839248657227, "global_step": 454511, "epoch": 5476} {"train_loss": -26.29499626159668, "global_step": 454512, "epoch": 5476} {"train_loss": -26.266925811767578, "global_step": 454513, "epoch": 5476} {"train_loss": -26.2895450592041, "global_step": 454514, "epoch": 5476} {"train_loss": -26.43050193786621, "global_step": 454515, "epoch": 5476} {"train_loss": -26.387039184570312, "global_step": 454516, "epoch": 5476} {"train_loss": -26.15239906311035, "global_step": 454517, "epoch": 5476} {"train_loss": -26.47523307800293, "global_step": 454518, "epoch": 5476} {"train_loss": -26.698511123657227, "global_step": 454519, "epoch": 5476} {"train_loss": -26.547224044799805, "global_step": 454520, "epoch": 5476} {"train_loss": -26.993005752563477, "global_step": 454521, "epoch": 5476} {"train_loss": -26.68723487854004, "global_step": 454522, "epoch": 5476} {"train_loss": -27.159198760986328, "global_step": 454523, "epoch": 5476} {"train_loss": -26.787221908569336, "global_step": 454524, "epoch": 5476} {"train_loss": -26.86185073852539, "global_step": 454525, "epoch": 5476} {"train_loss": -27.029211044311523, "global_step": 454526, "epoch": 5476} {"train_loss": -27.0046443939209, "global_step": 454527, "epoch": 5476} {"train_loss": -26.945819854736328, "global_step": 454528, "epoch": 5476} {"train_loss": -26.776611328125, "global_step": 454529, "epoch": 5476} {"train_loss": -27.3547306060791, "global_step": 454530, "epoch": 5476} {"train_loss": -27.228681564331055, "global_step": 454531, "epoch": 5476} {"train_loss": -27.41290283203125, "global_step": 454532, "epoch": 5476} {"train_loss": -27.18781089782715, "global_step": 454533, "epoch": 5476} {"train_loss": -27.04512596130371, "global_step": 454534, "epoch": 5476} {"train_loss": -27.1721134185791, "global_step": 454535, "epoch": 5476} {"train_loss": -27.002323150634766, "global_step": 454536, "epoch": 5476} {"train_loss": -27.29798698425293, "global_step": 454537, "epoch": 5476} {"train_loss": -27.302661895751953, "global_step": 454538, "epoch": 5476} {"train_loss": -27.012109756469727, "global_step": 454539, "epoch": 5476} {"train_loss": -27.267276763916016, "global_step": 454540, "epoch": 5476} {"train_loss": -27.152652740478516, "global_step": 454541, "epoch": 5476} {"train_loss": -27.350446701049805, "global_step": 454542, "epoch": 5476} {"train_loss": -27.218830108642578, "global_step": 454543, "epoch": 5476} {"train_loss": -27.430419921875, "global_step": 454544, "epoch": 5476} {"train_loss": -26.991872787475586, "global_step": 454545, "epoch": 5476} {"train_loss": -27.0214786529541, "global_step": 454546, "epoch": 5476} {"train_loss": -27.20291519165039, "global_step": 454547, "epoch": 5476} {"train_loss": -27.16495704650879, "global_step": 454548, "epoch": 5476} {"train_loss": -27.275171279907227, "global_step": 454549, "epoch": 5476} {"train_loss": -26.975210189819336, "global_step": 454550, "epoch": 5476} {"train_loss": -26.92848014831543, "global_step": 454551, "epoch": 5476} {"train_loss": -27.330469131469727, "global_step": 454552, "epoch": 5476} {"train_loss": -27.138202667236328, "global_step": 454553, "epoch": 5476} {"train_loss": -26.74667739868164, "global_step": 454554, "epoch": 5476} {"train_loss": -26.523679733276367, "global_step": 454555, "epoch": 5476} {"train_loss": -27.26790428161621, "global_step": 454556, "epoch": 5476} {"train_loss": -26.651172637939453, "global_step": 454557, "epoch": 5476} {"train_loss": -27.195281982421875, "global_step": 454558, "epoch": 5476} {"train_loss": -27.018112182617188, "global_step": 454559, "epoch": 5476} {"train_loss": -26.78156852722168, "global_step": 454560, "epoch": 5476} {"train_loss": -26.89691734313965, "global_step": 454561, "epoch": 5476} {"train_loss": -26.988880157470703, "global_step": 454562, "epoch": 5476} {"train_loss": -26.949066162109375, "global_step": 454563, "epoch": 5476} {"train_loss": -27.399145126342773, "global_step": 454564, "epoch": 5476} {"train_loss": -26.9962215423584, "global_step": 454565, "epoch": 5476} {"train_loss": -27.501691818237305, "global_step": 454566, "epoch": 5476} {"train_loss": -26.978540420532227, "global_step": 454567, "epoch": 5476} {"train_loss": -26.840667724609375, "global_step": 454568, "epoch": 5476} {"train_loss": -26.763961791992188, "global_step": 454569, "epoch": 5476} {"train_loss": -26.920211791992188, "global_step": 454570, "epoch": 5476} {"train_loss": -27.0239315032959, "global_step": 454571, "epoch": 5476} {"train_loss": -27.39508628845215, "global_step": 454572, "epoch": 5476} {"train_loss": -26.724470138549805, "global_step": 454573, "epoch": 5476} {"train_loss": -27.034467697143555, "global_step": 454574, "epoch": 5476} {"train_loss": -27.305801391601562, "global_step": 454575, "epoch": 5476} {"train_loss": -27.0909481048584, "global_step": 454576, "epoch": 5476} {"train_loss": -27.103010177612305, "global_step": 454577, "epoch": 5476} {"train_loss": -27.249713897705078, "global_step": 454578, "epoch": 5476} {"train_loss": -27.245899200439453, "global_step": 454579, "epoch": 5476} {"train_loss": -27.29168128967285, "global_step": 454580, "epoch": 5476} {"train_loss": -27.3159122467041, "global_step": 454581, "epoch": 5476} {"train_loss": -27.217981338500977, "global_step": 454582, "epoch": 5476} {"train_loss": -26.8779354095459, "global_step": 454583, "epoch": 5476} {"train_loss": -27.014463424682617, "global_step": 454584, "epoch": 5476} {"train_loss": -27.135589599609375, "global_step": 454585, "epoch": 5476} {"train_loss": -27.0998592376709, "global_step": 454586, "epoch": 5476} {"train_loss": -27.009552001953125, "global_step": 454587, "epoch": 5476} {"train_loss": -27.518102645874023, "global_step": 454588, "epoch": 5476} {"train_loss": -27.225839614868164, "global_step": 454589, "epoch": 5476} {"train_loss": -26.983185503856244, "global_step": 454590, "epoch": 5476, "val_loss": 6571336.5} {"train_loss": -25.678449630737305, "global_step": 454591, "epoch": 5477} {"train_loss": -25.302459716796875, "global_step": 454592, "epoch": 5477} {"train_loss": -26.83259391784668, "global_step": 454593, "epoch": 5477} {"train_loss": -26.251968383789062, "global_step": 454594, "epoch": 5477} {"train_loss": -26.030920028686523, "global_step": 454595, "epoch": 5477} {"train_loss": -26.48402976989746, "global_step": 454596, "epoch": 5477} {"train_loss": -26.307825088500977, "global_step": 454597, "epoch": 5477} {"train_loss": -26.571744918823242, "global_step": 454598, "epoch": 5477} {"train_loss": -26.015546798706055, "global_step": 454599, "epoch": 5477} {"train_loss": -26.847204208374023, "global_step": 454600, "epoch": 5477} {"train_loss": -26.22260093688965, "global_step": 454601, "epoch": 5477} {"train_loss": -26.675495147705078, "global_step": 454602, "epoch": 5477} {"train_loss": -26.30445671081543, "global_step": 454603, "epoch": 5477} {"train_loss": -26.6495418548584, "global_step": 454604, "epoch": 5477} {"train_loss": -26.69575309753418, "global_step": 454605, "epoch": 5477} {"train_loss": -26.536575317382812, "global_step": 454606, "epoch": 5477} {"train_loss": -26.84808921813965, "global_step": 454607, "epoch": 5477} {"train_loss": -26.419843673706055, "global_step": 454608, "epoch": 5477} {"train_loss": -26.816720962524414, "global_step": 454609, "epoch": 5477} {"train_loss": -26.753772735595703, "global_step": 454610, "epoch": 5477} {"train_loss": -26.6673526763916, "global_step": 454611, "epoch": 5477} {"train_loss": -26.422901153564453, "global_step": 454612, "epoch": 5477} {"train_loss": -26.806127548217773, "global_step": 454613, "epoch": 5477} {"train_loss": -26.645751953125, "global_step": 454614, "epoch": 5477} {"train_loss": -26.551538467407227, "global_step": 454615, "epoch": 5477} {"train_loss": -26.718753814697266, "global_step": 454616, "epoch": 5477} {"train_loss": -26.684797286987305, "global_step": 454617, "epoch": 5477} {"train_loss": -26.75349235534668, "global_step": 454618, "epoch": 5477} {"train_loss": -26.443389892578125, "global_step": 454619, "epoch": 5477} {"train_loss": -26.825687408447266, "global_step": 454620, "epoch": 5477} {"train_loss": -26.81890296936035, "global_step": 454621, "epoch": 5477} {"train_loss": -27.12091636657715, "global_step": 454622, "epoch": 5477} {"train_loss": -27.030078887939453, "global_step": 454623, "epoch": 5477} {"train_loss": -26.957916259765625, "global_step": 454624, "epoch": 5477} {"train_loss": -27.385818481445312, "global_step": 454625, "epoch": 5477} {"train_loss": -27.14804458618164, "global_step": 454626, "epoch": 5477} {"train_loss": -26.9194393157959, "global_step": 454627, "epoch": 5477} {"train_loss": -26.81133460998535, "global_step": 454628, "epoch": 5477} {"train_loss": -27.238162994384766, "global_step": 454629, "epoch": 5477} {"train_loss": -27.295698165893555, "global_step": 454630, "epoch": 5477} {"train_loss": -27.051733016967773, "global_step": 454631, "epoch": 5477} {"train_loss": -27.140745162963867, "global_step": 454632, "epoch": 5477} {"train_loss": -26.944660186767578, "global_step": 454633, "epoch": 5477} {"train_loss": -26.98465347290039, "global_step": 454634, "epoch": 5477} {"train_loss": -26.598337173461914, "global_step": 454635, "epoch": 5477} {"train_loss": -27.168903350830078, "global_step": 454636, "epoch": 5477} {"train_loss": -27.34527015686035, "global_step": 454637, "epoch": 5477} {"train_loss": -27.188678741455078, "global_step": 454638, "epoch": 5477} {"train_loss": -26.787336349487305, "global_step": 454639, "epoch": 5477} {"train_loss": -27.00569725036621, "global_step": 454640, "epoch": 5477} {"train_loss": -27.299518585205078, "global_step": 454641, "epoch": 5477} {"train_loss": -27.464879989624023, "global_step": 454642, "epoch": 5477} {"train_loss": -27.11311149597168, "global_step": 454643, "epoch": 5477} {"train_loss": -27.011219024658203, "global_step": 454644, "epoch": 5477} {"train_loss": -26.99686050415039, "global_step": 454645, "epoch": 5477} {"train_loss": -27.468128204345703, "global_step": 454646, "epoch": 5477} {"train_loss": -27.59111976623535, "global_step": 454647, "epoch": 5477} {"train_loss": -27.195220947265625, "global_step": 454648, "epoch": 5477} {"train_loss": -27.062658309936523, "global_step": 454649, "epoch": 5477} {"train_loss": -27.10187339782715, "global_step": 454650, "epoch": 5477} {"train_loss": -26.989551544189453, "global_step": 454651, "epoch": 5477} {"train_loss": -27.03071403503418, "global_step": 454652, "epoch": 5477} {"train_loss": -27.048242568969727, "global_step": 454653, "epoch": 5477} {"train_loss": -26.948959350585938, "global_step": 454654, "epoch": 5477} {"train_loss": -27.17618751525879, "global_step": 454655, "epoch": 5477} {"train_loss": -27.282438278198242, "global_step": 454656, "epoch": 5477} {"train_loss": -27.333066940307617, "global_step": 454657, "epoch": 5477} {"train_loss": -27.055749893188477, "global_step": 454658, "epoch": 5477} {"train_loss": -27.123559951782227, "global_step": 454659, "epoch": 5477} {"train_loss": -27.036502838134766, "global_step": 454660, "epoch": 5477} {"train_loss": -27.050642013549805, "global_step": 454661, "epoch": 5477} {"train_loss": -27.46487808227539, "global_step": 454662, "epoch": 5477} {"train_loss": -27.076858520507812, "global_step": 454663, "epoch": 5477} {"train_loss": -27.254911422729492, "global_step": 454664, "epoch": 5477} {"train_loss": -26.997943878173828, "global_step": 454665, "epoch": 5477} {"train_loss": -27.3358154296875, "global_step": 454666, "epoch": 5477} {"train_loss": -27.19646644592285, "global_step": 454667, "epoch": 5477} {"train_loss": -26.865264892578125, "global_step": 454668, "epoch": 5477} {"train_loss": -26.953046798706055, "global_step": 454669, "epoch": 5477} {"train_loss": -27.035558700561523, "global_step": 454670, "epoch": 5477} {"train_loss": -26.892927169799805, "global_step": 454671, "epoch": 5477} {"train_loss": -26.87079429626465, "global_step": 454672, "epoch": 5477} {"train_loss": -26.87125238165798, "global_step": 454673, "epoch": 5477, "val_loss": 6538680.0} {"train_loss": -26.70301628112793, "global_step": 454674, "epoch": 5478} {"train_loss": -26.021543502807617, "global_step": 454675, "epoch": 5478} {"train_loss": -26.42051124572754, "global_step": 454676, "epoch": 5478} {"train_loss": -26.318714141845703, "global_step": 454677, "epoch": 5478} {"train_loss": -26.301624298095703, "global_step": 454678, "epoch": 5478} {"train_loss": -26.41815185546875, "global_step": 454679, "epoch": 5478} {"train_loss": -26.53786277770996, "global_step": 454680, "epoch": 5478} {"train_loss": -26.57465934753418, "global_step": 454681, "epoch": 5478} {"train_loss": -26.4280948638916, "global_step": 454682, "epoch": 5478} {"train_loss": -26.539106369018555, "global_step": 454683, "epoch": 5478} {"train_loss": -26.179784774780273, "global_step": 454684, "epoch": 5478} {"train_loss": -26.65286636352539, "global_step": 454685, "epoch": 5478} {"train_loss": -26.796457290649414, "global_step": 454686, "epoch": 5478} {"train_loss": -26.90009880065918, "global_step": 454687, "epoch": 5478} {"train_loss": -26.611356735229492, "global_step": 454688, "epoch": 5478} {"train_loss": -26.886892318725586, "global_step": 454689, "epoch": 5478} {"train_loss": -27.044281005859375, "global_step": 454690, "epoch": 5478} {"train_loss": -26.78733253479004, "global_step": 454691, "epoch": 5478} {"train_loss": -26.811853408813477, "global_step": 454692, "epoch": 5478} {"train_loss": -26.592254638671875, "global_step": 454693, "epoch": 5478} {"train_loss": -27.14215660095215, "global_step": 454694, "epoch": 5478} {"train_loss": -26.724349975585938, "global_step": 454695, "epoch": 5478} {"train_loss": -27.126943588256836, "global_step": 454696, "epoch": 5478} {"train_loss": -27.200925827026367, "global_step": 454697, "epoch": 5478} {"train_loss": -27.132360458374023, "global_step": 454698, "epoch": 5478} {"train_loss": -27.457462310791016, "global_step": 454699, "epoch": 5478} {"train_loss": -27.08656883239746, "global_step": 454700, "epoch": 5478} {"train_loss": -26.917333602905273, "global_step": 454701, "epoch": 5478} {"train_loss": -27.0128173828125, "global_step": 454702, "epoch": 5478} {"train_loss": -27.215301513671875, "global_step": 454703, "epoch": 5478} {"train_loss": -26.65594482421875, "global_step": 454704, "epoch": 5478} {"train_loss": -27.536115646362305, "global_step": 454705, "epoch": 5478} {"train_loss": -27.10200309753418, "global_step": 454706, "epoch": 5478} {"train_loss": -27.293415069580078, "global_step": 454707, "epoch": 5478} {"train_loss": -26.844135284423828, "global_step": 454708, "epoch": 5478} {"train_loss": -27.017684936523438, "global_step": 454709, "epoch": 5478} {"train_loss": -27.148670196533203, "global_step": 454710, "epoch": 5478} {"train_loss": -27.245649337768555, "global_step": 454711, "epoch": 5478} {"train_loss": -26.79152488708496, "global_step": 454712, "epoch": 5478} {"train_loss": -27.14606285095215, "global_step": 454713, "epoch": 5478} {"train_loss": -27.400014877319336, "global_step": 454714, "epoch": 5478} {"train_loss": -27.211206436157227, "global_step": 454715, "epoch": 5478} {"train_loss": -27.120147705078125, "global_step": 454716, "epoch": 5478} {"train_loss": -27.467151641845703, "global_step": 454717, "epoch": 5478} {"train_loss": -27.10125160217285, "global_step": 454718, "epoch": 5478} {"train_loss": -27.13458824157715, "global_step": 454719, "epoch": 5478} {"train_loss": -27.439359664916992, "global_step": 454720, "epoch": 5478} {"train_loss": -27.174274444580078, "global_step": 454721, "epoch": 5478} {"train_loss": -26.920520782470703, "global_step": 454722, "epoch": 5478} {"train_loss": -27.085851669311523, "global_step": 454723, "epoch": 5478} {"train_loss": -27.4625186920166, "global_step": 454724, "epoch": 5478} {"train_loss": -27.161884307861328, "global_step": 454725, "epoch": 5478} {"train_loss": -27.01668357849121, "global_step": 454726, "epoch": 5478} {"train_loss": -27.24078369140625, "global_step": 454727, "epoch": 5478} {"train_loss": -27.358800888061523, "global_step": 454728, "epoch": 5478} {"train_loss": -27.29180908203125, "global_step": 454729, "epoch": 5478} {"train_loss": -27.51613426208496, "global_step": 454730, "epoch": 5478} {"train_loss": -26.983875274658203, "global_step": 454731, "epoch": 5478} {"train_loss": -27.19893455505371, "global_step": 454732, "epoch": 5478} {"train_loss": -27.047937393188477, "global_step": 454733, "epoch": 5478} {"train_loss": -27.337936401367188, "global_step": 454734, "epoch": 5478} {"train_loss": -26.7871150970459, "global_step": 454735, "epoch": 5478} {"train_loss": -27.352325439453125, "global_step": 454736, "epoch": 5478} {"train_loss": -26.75088882446289, "global_step": 454737, "epoch": 5478} {"train_loss": -27.235198974609375, "global_step": 454738, "epoch": 5478} {"train_loss": -27.29829216003418, "global_step": 454739, "epoch": 5478} {"train_loss": -27.1302547454834, "global_step": 454740, "epoch": 5478} {"train_loss": -27.345975875854492, "global_step": 454741, "epoch": 5478} {"train_loss": -27.036874771118164, "global_step": 454742, "epoch": 5478} {"train_loss": -26.83296012878418, "global_step": 454743, "epoch": 5478} {"train_loss": -26.6890811920166, "global_step": 454744, "epoch": 5478} {"train_loss": -26.547260284423828, "global_step": 454745, "epoch": 5478} {"train_loss": -26.790699005126953, "global_step": 454746, "epoch": 5478} {"train_loss": -27.088895797729492, "global_step": 454747, "epoch": 5478} {"train_loss": -27.07839012145996, "global_step": 454748, "epoch": 5478} {"train_loss": -26.839603424072266, "global_step": 454749, "epoch": 5478} {"train_loss": -26.79849624633789, "global_step": 454750, "epoch": 5478} {"train_loss": -26.76801109313965, "global_step": 454751, "epoch": 5478} {"train_loss": -27.01152992248535, "global_step": 454752, "epoch": 5478} {"train_loss": -26.23274040222168, "global_step": 454753, "epoch": 5478} {"train_loss": -27.419296264648438, "global_step": 454754, "epoch": 5478} {"train_loss": -27.045591354370117, "global_step": 454755, "epoch": 5478} {"train_loss": -26.96560030098421, "global_step": 454756, "epoch": 5478, "val_loss": 6611447.5} {"train_loss": -25.594263076782227, "global_step": 454757, "epoch": 5479} {"train_loss": -25.81882667541504, "global_step": 454758, "epoch": 5479} {"train_loss": -25.971670150756836, "global_step": 454759, "epoch": 5479} {"train_loss": -25.698659896850586, "global_step": 454760, "epoch": 5479} {"train_loss": -25.617528915405273, "global_step": 454761, "epoch": 5479} {"train_loss": -25.75974464416504, "global_step": 454762, "epoch": 5479} {"train_loss": -26.655847549438477, "global_step": 454763, "epoch": 5479} {"train_loss": -26.732763290405273, "global_step": 454764, "epoch": 5479} {"train_loss": -26.9902400970459, "global_step": 454765, "epoch": 5479} {"train_loss": -26.209348678588867, "global_step": 454766, "epoch": 5479} {"train_loss": -26.07429313659668, "global_step": 454767, "epoch": 5479} {"train_loss": -26.75217056274414, "global_step": 454768, "epoch": 5479} {"train_loss": -26.347049713134766, "global_step": 454769, "epoch": 5479} {"train_loss": -26.38234519958496, "global_step": 454770, "epoch": 5479} {"train_loss": -26.390390396118164, "global_step": 454771, "epoch": 5479} {"train_loss": -26.4226131439209, "global_step": 454772, "epoch": 5479} {"train_loss": -26.656570434570312, "global_step": 454773, "epoch": 5479} {"train_loss": -26.92041015625, "global_step": 454774, "epoch": 5479} {"train_loss": -26.942157745361328, "global_step": 454775, "epoch": 5479} {"train_loss": -26.557188034057617, "global_step": 454776, "epoch": 5479} {"train_loss": -26.479267120361328, "global_step": 454777, "epoch": 5479} {"train_loss": -26.761478424072266, "global_step": 454778, "epoch": 5479} {"train_loss": -26.92306900024414, "global_step": 454779, "epoch": 5479} {"train_loss": -26.6229248046875, "global_step": 454780, "epoch": 5479} {"train_loss": -26.797199249267578, "global_step": 454781, "epoch": 5479} {"train_loss": -26.82871437072754, "global_step": 454782, "epoch": 5479} {"train_loss": -27.08473777770996, "global_step": 454783, "epoch": 5479} {"train_loss": -26.840051651000977, "global_step": 454784, "epoch": 5479} {"train_loss": -26.7698974609375, "global_step": 454785, "epoch": 5479} {"train_loss": -27.039386749267578, "global_step": 454786, "epoch": 5479} {"train_loss": -26.809850692749023, "global_step": 454787, "epoch": 5479} {"train_loss": -27.080841064453125, "global_step": 454788, "epoch": 5479} {"train_loss": -27.30963706970215, "global_step": 454789, "epoch": 5479} {"train_loss": -27.11358070373535, "global_step": 454790, "epoch": 5479} {"train_loss": -27.00539207458496, "global_step": 454791, "epoch": 5479} {"train_loss": -27.241907119750977, "global_step": 454792, "epoch": 5479} {"train_loss": -27.19046974182129, "global_step": 454793, "epoch": 5479} {"train_loss": -26.875696182250977, "global_step": 454794, "epoch": 5479} {"train_loss": -26.866140365600586, "global_step": 454795, "epoch": 5479} {"train_loss": -27.258047103881836, "global_step": 454796, "epoch": 5479} {"train_loss": -27.25339698791504, "global_step": 454797, "epoch": 5479} {"train_loss": -27.32623863220215, "global_step": 454798, "epoch": 5479} {"train_loss": -27.320688247680664, "global_step": 454799, "epoch": 5479} {"train_loss": -27.328516006469727, "global_step": 454800, "epoch": 5479} {"train_loss": -27.21113395690918, "global_step": 454801, "epoch": 5479} {"train_loss": -27.243274688720703, "global_step": 454802, "epoch": 5479} {"train_loss": -26.79952049255371, "global_step": 454803, "epoch": 5479} {"train_loss": -26.93326187133789, "global_step": 454804, "epoch": 5479} {"train_loss": -27.379520416259766, "global_step": 454805, "epoch": 5479} {"train_loss": -27.248987197875977, "global_step": 454806, "epoch": 5479} {"train_loss": -26.923131942749023, "global_step": 454807, "epoch": 5479} {"train_loss": -27.213796615600586, "global_step": 454808, "epoch": 5479} {"train_loss": -27.244892120361328, "global_step": 454809, "epoch": 5479} {"train_loss": -27.21742057800293, "global_step": 454810, "epoch": 5479} {"train_loss": -27.035306930541992, "global_step": 454811, "epoch": 5479} {"train_loss": -27.15175437927246, "global_step": 454812, "epoch": 5479} {"train_loss": -26.6931209564209, "global_step": 454813, "epoch": 5479} {"train_loss": -26.869037628173828, "global_step": 454814, "epoch": 5479} {"train_loss": -27.46589469909668, "global_step": 454815, "epoch": 5479} {"train_loss": -27.431976318359375, "global_step": 454816, "epoch": 5479} {"train_loss": -27.368436813354492, "global_step": 454817, "epoch": 5479} {"train_loss": -26.837116241455078, "global_step": 454818, "epoch": 5479} {"train_loss": -27.636091232299805, "global_step": 454819, "epoch": 5479} {"train_loss": -27.23919105529785, "global_step": 454820, "epoch": 5479} {"train_loss": -27.128812789916992, "global_step": 454821, "epoch": 5479} {"train_loss": -26.97747230529785, "global_step": 454822, "epoch": 5479} {"train_loss": -27.13753318786621, "global_step": 454823, "epoch": 5479} {"train_loss": -27.167865753173828, "global_step": 454824, "epoch": 5479} {"train_loss": -27.085529327392578, "global_step": 454825, "epoch": 5479} {"train_loss": -27.375873565673828, "global_step": 454826, "epoch": 5479} {"train_loss": -27.56937026977539, "global_step": 454827, "epoch": 5479} {"train_loss": -27.298053741455078, "global_step": 454828, "epoch": 5479} {"train_loss": -27.009740829467773, "global_step": 454829, "epoch": 5479} {"train_loss": -27.31064796447754, "global_step": 454830, "epoch": 5479} {"train_loss": -27.24092674255371, "global_step": 454831, "epoch": 5479} {"train_loss": -27.13722038269043, "global_step": 454832, "epoch": 5479} {"train_loss": -27.285552978515625, "global_step": 454833, "epoch": 5479} {"train_loss": -27.036142349243164, "global_step": 454834, "epoch": 5479} {"train_loss": -27.079084396362305, "global_step": 454835, "epoch": 5479} {"train_loss": -27.182241439819336, "global_step": 454836, "epoch": 5479} {"train_loss": -27.48603630065918, "global_step": 454837, "epoch": 5479} {"train_loss": -27.341291427612305, "global_step": 454838, "epoch": 5479} {"train_loss": -26.911589725908026, "global_step": 454839, "epoch": 5479, "val_loss": 6782213.0} {"train_loss": -26.086389541625977, "global_step": 454840, "epoch": 5480} {"train_loss": -25.9510498046875, "global_step": 454841, "epoch": 5480} {"train_loss": -25.691434860229492, "global_step": 454842, "epoch": 5480} {"train_loss": -23.5233097076416, "global_step": 454843, "epoch": 5480} {"train_loss": -24.442691802978516, "global_step": 454844, "epoch": 5480} {"train_loss": -26.33197593688965, "global_step": 454845, "epoch": 5480} {"train_loss": -25.76063346862793, "global_step": 454846, "epoch": 5480} {"train_loss": -25.95881462097168, "global_step": 454847, "epoch": 5480} {"train_loss": -26.463163375854492, "global_step": 454848, "epoch": 5480} {"train_loss": -26.167932510375977, "global_step": 454849, "epoch": 5480} {"train_loss": -26.311349868774414, "global_step": 454850, "epoch": 5480} {"train_loss": -26.420455932617188, "global_step": 454851, "epoch": 5480} {"train_loss": -26.219614028930664, "global_step": 454852, "epoch": 5480} {"train_loss": -26.387556076049805, "global_step": 454853, "epoch": 5480} {"train_loss": -26.42042350769043, "global_step": 454854, "epoch": 5480} {"train_loss": -26.709264755249023, "global_step": 454855, "epoch": 5480} {"train_loss": -26.24287223815918, "global_step": 454856, "epoch": 5480} {"train_loss": -26.844547271728516, "global_step": 454857, "epoch": 5480} {"train_loss": -26.188695907592773, "global_step": 454858, "epoch": 5480} {"train_loss": -26.824777603149414, "global_step": 454859, "epoch": 5480} {"train_loss": -26.474288940429688, "global_step": 454860, "epoch": 5480} {"train_loss": -27.08095359802246, "global_step": 454861, "epoch": 5480} {"train_loss": -26.6608829498291, "global_step": 454862, "epoch": 5480} {"train_loss": -26.63209342956543, "global_step": 454863, "epoch": 5480} {"train_loss": -26.5277156829834, "global_step": 454864, "epoch": 5480} {"train_loss": -26.916601181030273, "global_step": 454865, "epoch": 5480} {"train_loss": -26.861663818359375, "global_step": 454866, "epoch": 5480} {"train_loss": -26.468046188354492, "global_step": 454867, "epoch": 5480} {"train_loss": -27.026655197143555, "global_step": 454868, "epoch": 5480} {"train_loss": -27.19000244140625, "global_step": 454869, "epoch": 5480} {"train_loss": -26.706222534179688, "global_step": 454870, "epoch": 5480} {"train_loss": -26.689626693725586, "global_step": 454871, "epoch": 5480} {"train_loss": -26.75632667541504, "global_step": 454872, "epoch": 5480} {"train_loss": -26.89794921875, "global_step": 454873, "epoch": 5480} {"train_loss": -26.84907341003418, "global_step": 454874, "epoch": 5480} {"train_loss": -27.0296688079834, "global_step": 454875, "epoch": 5480} {"train_loss": -26.75990104675293, "global_step": 454876, "epoch": 5480} {"train_loss": -27.048770904541016, "global_step": 454877, "epoch": 5480} {"train_loss": -26.77735710144043, "global_step": 454878, "epoch": 5480} {"train_loss": -26.43958854675293, "global_step": 454879, "epoch": 5480} {"train_loss": -26.45857048034668, "global_step": 454880, "epoch": 5480} {"train_loss": -27.19476318359375, "global_step": 454881, "epoch": 5480} {"train_loss": -26.815717697143555, "global_step": 454882, "epoch": 5480} {"train_loss": -26.546375274658203, "global_step": 454883, "epoch": 5480} {"train_loss": -26.999725341796875, "global_step": 454884, "epoch": 5480} {"train_loss": -26.643417358398438, "global_step": 454885, "epoch": 5480} {"train_loss": -27.23681640625, "global_step": 454886, "epoch": 5480} {"train_loss": -26.7692813873291, "global_step": 454887, "epoch": 5480} {"train_loss": -26.832538604736328, "global_step": 454888, "epoch": 5480} {"train_loss": -27.048858642578125, "global_step": 454889, "epoch": 5480} {"train_loss": -26.75907325744629, "global_step": 454890, "epoch": 5480} {"train_loss": -27.118896484375, "global_step": 454891, "epoch": 5480} {"train_loss": -26.809005737304688, "global_step": 454892, "epoch": 5480} {"train_loss": -26.906652450561523, "global_step": 454893, "epoch": 5480} {"train_loss": -26.908985137939453, "global_step": 454894, "epoch": 5480} {"train_loss": -27.25579261779785, "global_step": 454895, "epoch": 5480} {"train_loss": -27.08893394470215, "global_step": 454896, "epoch": 5480} {"train_loss": -27.098861694335938, "global_step": 454897, "epoch": 5480} {"train_loss": -27.086034774780273, "global_step": 454898, "epoch": 5480} {"train_loss": -26.753061294555664, "global_step": 454899, "epoch": 5480} {"train_loss": -27.138715744018555, "global_step": 454900, "epoch": 5480} {"train_loss": -27.132923126220703, "global_step": 454901, "epoch": 5480} {"train_loss": -26.91883659362793, "global_step": 454902, "epoch": 5480} {"train_loss": -27.188608169555664, "global_step": 454903, "epoch": 5480} {"train_loss": -27.235395431518555, "global_step": 454904, "epoch": 5480} {"train_loss": -27.06052589416504, "global_step": 454905, "epoch": 5480} {"train_loss": -26.995330810546875, "global_step": 454906, "epoch": 5480} {"train_loss": -27.226301193237305, "global_step": 454907, "epoch": 5480} {"train_loss": -27.133825302124023, "global_step": 454908, "epoch": 5480} {"train_loss": -26.965185165405273, "global_step": 454909, "epoch": 5480} {"train_loss": -26.960025787353516, "global_step": 454910, "epoch": 5480} {"train_loss": -27.307891845703125, "global_step": 454911, "epoch": 5480} {"train_loss": -27.20796012878418, "global_step": 454912, "epoch": 5480} {"train_loss": -26.970556259155273, "global_step": 454913, "epoch": 5480} {"train_loss": -27.195266723632812, "global_step": 454914, "epoch": 5480} {"train_loss": -27.27852439880371, "global_step": 454915, "epoch": 5480} {"train_loss": -26.9609375, "global_step": 454916, "epoch": 5480} {"train_loss": -27.129148483276367, "global_step": 454917, "epoch": 5480} {"train_loss": -27.119199752807617, "global_step": 454918, "epoch": 5480} {"train_loss": -27.051410675048828, "global_step": 454919, "epoch": 5480} {"train_loss": -27.098968505859375, "global_step": 454920, "epoch": 5480} {"train_loss": -27.60004234313965, "global_step": 454921, "epoch": 5480} {"train_loss": -26.752436327647015, "global_step": 454922, "epoch": 5480, "val_loss": 6619916.0} {"train_loss": -26.758102416992188, "global_step": 454923, "epoch": 5481} {"train_loss": -27.065961837768555, "global_step": 454924, "epoch": 5481} {"train_loss": -26.762210845947266, "global_step": 454925, "epoch": 5481} {"train_loss": -26.809223175048828, "global_step": 454926, "epoch": 5481} {"train_loss": -26.73639488220215, "global_step": 454927, "epoch": 5481} {"train_loss": -26.419523239135742, "global_step": 454928, "epoch": 5481} {"train_loss": -26.971582412719727, "global_step": 454929, "epoch": 5481} {"train_loss": -26.7969970703125, "global_step": 454930, "epoch": 5481} {"train_loss": -26.55109977722168, "global_step": 454931, "epoch": 5481} {"train_loss": -27.173181533813477, "global_step": 454932, "epoch": 5481} {"train_loss": -26.702550888061523, "global_step": 454933, "epoch": 5481} {"train_loss": -27.126911163330078, "global_step": 454934, "epoch": 5481} {"train_loss": -26.715600967407227, "global_step": 454935, "epoch": 5481} {"train_loss": -27.106674194335938, "global_step": 454936, "epoch": 5481} {"train_loss": -26.90998649597168, "global_step": 454937, "epoch": 5481} {"train_loss": -27.262357711791992, "global_step": 454938, "epoch": 5481} {"train_loss": -26.63685417175293, "global_step": 454939, "epoch": 5481} {"train_loss": -26.80327796936035, "global_step": 454940, "epoch": 5481} {"train_loss": -27.099811553955078, "global_step": 454941, "epoch": 5481} {"train_loss": -27.163715362548828, "global_step": 454942, "epoch": 5481} {"train_loss": -27.223005294799805, "global_step": 454943, "epoch": 5481} {"train_loss": -27.038745880126953, "global_step": 454944, "epoch": 5481} {"train_loss": -26.868488311767578, "global_step": 454945, "epoch": 5481} {"train_loss": -26.662992477416992, "global_step": 454946, "epoch": 5481} {"train_loss": -27.157855987548828, "global_step": 454947, "epoch": 5481} {"train_loss": -27.06243324279785, "global_step": 454948, "epoch": 5481} {"train_loss": -26.952972412109375, "global_step": 454949, "epoch": 5481} {"train_loss": -27.305526733398438, "global_step": 454950, "epoch": 5481} {"train_loss": -27.135160446166992, "global_step": 454951, "epoch": 5481} {"train_loss": -26.73529052734375, "global_step": 454952, "epoch": 5481} {"train_loss": -26.780012130737305, "global_step": 454953, "epoch": 5481} {"train_loss": -27.613739013671875, "global_step": 454954, "epoch": 5481} {"train_loss": -27.0142822265625, "global_step": 454955, "epoch": 5481} {"train_loss": -27.05457878112793, "global_step": 454956, "epoch": 5481} {"train_loss": -27.21782875061035, "global_step": 454957, "epoch": 5481} {"train_loss": -27.264692306518555, "global_step": 454958, "epoch": 5481} {"train_loss": -27.174667358398438, "global_step": 454959, "epoch": 5481} {"train_loss": -27.137948989868164, "global_step": 454960, "epoch": 5481} {"train_loss": -27.2541561126709, "global_step": 454961, "epoch": 5481} {"train_loss": -27.039838790893555, "global_step": 454962, "epoch": 5481} {"train_loss": -27.41362953186035, "global_step": 454963, "epoch": 5481} {"train_loss": -27.158954620361328, "global_step": 454964, "epoch": 5481} {"train_loss": -27.086578369140625, "global_step": 454965, "epoch": 5481} {"train_loss": -27.174997329711914, "global_step": 454966, "epoch": 5481} {"train_loss": -27.31450843811035, "global_step": 454967, "epoch": 5481} {"train_loss": -27.502912521362305, "global_step": 454968, "epoch": 5481} {"train_loss": -27.155807495117188, "global_step": 454969, "epoch": 5481} {"train_loss": -27.718765258789062, "global_step": 454970, "epoch": 5481} {"train_loss": -27.367624282836914, "global_step": 454971, "epoch": 5481} {"train_loss": -27.59925651550293, "global_step": 454972, "epoch": 5481} {"train_loss": -26.933090209960938, "global_step": 454973, "epoch": 5481} {"train_loss": -27.014739990234375, "global_step": 454974, "epoch": 5481} {"train_loss": -27.008787155151367, "global_step": 454975, "epoch": 5481} {"train_loss": -26.4228458404541, "global_step": 454976, "epoch": 5481} {"train_loss": -25.7242431640625, "global_step": 454977, "epoch": 5481} {"train_loss": -25.744550704956055, "global_step": 454978, "epoch": 5481} {"train_loss": -27.122480392456055, "global_step": 454979, "epoch": 5481} {"train_loss": -26.899871826171875, "global_step": 454980, "epoch": 5481} {"train_loss": -26.818069458007812, "global_step": 454981, "epoch": 5481} {"train_loss": -26.896411895751953, "global_step": 454982, "epoch": 5481} {"train_loss": -26.811481475830078, "global_step": 454983, "epoch": 5481} {"train_loss": -27.20975112915039, "global_step": 454984, "epoch": 5481} {"train_loss": -26.9627685546875, "global_step": 454985, "epoch": 5481} {"train_loss": -26.838134765625, "global_step": 454986, "epoch": 5481} {"train_loss": -27.028905868530273, "global_step": 454987, "epoch": 5481} {"train_loss": -27.071218490600586, "global_step": 454988, "epoch": 5481} {"train_loss": -26.847272872924805, "global_step": 454989, "epoch": 5481} {"train_loss": -26.91058921813965, "global_step": 454990, "epoch": 5481} {"train_loss": -26.923017501831055, "global_step": 454991, "epoch": 5481} {"train_loss": -26.962034225463867, "global_step": 454992, "epoch": 5481} {"train_loss": -27.145751953125, "global_step": 454993, "epoch": 5481} {"train_loss": -26.98225212097168, "global_step": 454994, "epoch": 5481} {"train_loss": -27.04920768737793, "global_step": 454995, "epoch": 5481} {"train_loss": -26.9751033782959, "global_step": 454996, "epoch": 5481} {"train_loss": -27.260202407836914, "global_step": 454997, "epoch": 5481} {"train_loss": -26.76202392578125, "global_step": 454998, "epoch": 5481} {"train_loss": -26.901880264282227, "global_step": 454999, "epoch": 5481} {"train_loss": -27.09928321838379, "global_step": 455000, "epoch": 5481} {"train_loss": -26.758127212524414, "global_step": 455001, "epoch": 5481} {"train_loss": -27.225370407104492, "global_step": 455002, "epoch": 5481} {"train_loss": -27.27347755432129, "global_step": 455003, "epoch": 5481} {"train_loss": -26.893232345581055, "global_step": 455004, "epoch": 5481} {"train_loss": -26.985889618655285, "global_step": 455005, "epoch": 5481, "val_loss": 6527235.0} {"train_loss": -26.738866806030273, "global_step": 455006, "epoch": 5482} {"train_loss": -26.428918838500977, "global_step": 455007, "epoch": 5482} {"train_loss": -26.659204483032227, "global_step": 455008, "epoch": 5482} {"train_loss": -26.726530075073242, "global_step": 455009, "epoch": 5482} {"train_loss": -26.82526969909668, "global_step": 455010, "epoch": 5482} {"train_loss": -26.816253662109375, "global_step": 455011, "epoch": 5482} {"train_loss": -26.624502182006836, "global_step": 455012, "epoch": 5482} {"train_loss": -26.8231258392334, "global_step": 455013, "epoch": 5482} {"train_loss": -27.00446891784668, "global_step": 455014, "epoch": 5482} {"train_loss": -27.054224014282227, "global_step": 455015, "epoch": 5482} {"train_loss": -27.360065460205078, "global_step": 455016, "epoch": 5482} {"train_loss": -27.1178035736084, "global_step": 455017, "epoch": 5482} {"train_loss": -26.694293975830078, "global_step": 455018, "epoch": 5482} {"train_loss": -27.074071884155273, "global_step": 455019, "epoch": 5482} {"train_loss": -26.9337158203125, "global_step": 455020, "epoch": 5482} {"train_loss": -27.318918228149414, "global_step": 455021, "epoch": 5482} {"train_loss": -27.088123321533203, "global_step": 455022, "epoch": 5482} {"train_loss": -26.657398223876953, "global_step": 455023, "epoch": 5482} {"train_loss": -26.762603759765625, "global_step": 455024, "epoch": 5482} {"train_loss": -26.93436050415039, "global_step": 455025, "epoch": 5482} {"train_loss": -27.355697631835938, "global_step": 455026, "epoch": 5482} {"train_loss": -26.414798736572266, "global_step": 455027, "epoch": 5482} {"train_loss": -26.550098419189453, "global_step": 455028, "epoch": 5482} {"train_loss": -27.03290367126465, "global_step": 455029, "epoch": 5482} {"train_loss": -26.07240867614746, "global_step": 455030, "epoch": 5482} {"train_loss": -26.498205184936523, "global_step": 455031, "epoch": 5482} {"train_loss": -25.910627365112305, "global_step": 455032, "epoch": 5482} {"train_loss": -26.522220611572266, "global_step": 455033, "epoch": 5482} {"train_loss": -26.08588218688965, "global_step": 455034, "epoch": 5482} {"train_loss": -26.63739585876465, "global_step": 455035, "epoch": 5482} {"train_loss": -25.936120986938477, "global_step": 455036, "epoch": 5482} {"train_loss": -26.883991241455078, "global_step": 455037, "epoch": 5482} {"train_loss": -26.6629695892334, "global_step": 455038, "epoch": 5482} {"train_loss": -26.724618911743164, "global_step": 455039, "epoch": 5482} {"train_loss": -26.661157608032227, "global_step": 455040, "epoch": 5482} {"train_loss": -26.563613891601562, "global_step": 455041, "epoch": 5482} {"train_loss": -26.57230567932129, "global_step": 455042, "epoch": 5482} {"train_loss": -26.552600860595703, "global_step": 455043, "epoch": 5482} {"train_loss": -26.378726959228516, "global_step": 455044, "epoch": 5482} {"train_loss": -27.298070907592773, "global_step": 455045, "epoch": 5482} {"train_loss": -26.826913833618164, "global_step": 455046, "epoch": 5482} {"train_loss": -26.951948165893555, "global_step": 455047, "epoch": 5482} {"train_loss": -26.801437377929688, "global_step": 455048, "epoch": 5482} {"train_loss": -26.8432559967041, "global_step": 455049, "epoch": 5482} {"train_loss": -27.07358741760254, "global_step": 455050, "epoch": 5482} {"train_loss": -26.64444351196289, "global_step": 455051, "epoch": 5482} {"train_loss": -26.762832641601562, "global_step": 455052, "epoch": 5482} {"train_loss": -27.187564849853516, "global_step": 455053, "epoch": 5482} {"train_loss": -27.248876571655273, "global_step": 455054, "epoch": 5482} {"train_loss": -27.209680557250977, "global_step": 455055, "epoch": 5482} {"train_loss": -26.871234893798828, "global_step": 455056, "epoch": 5482} {"train_loss": -26.835554122924805, "global_step": 455057, "epoch": 5482} {"train_loss": -27.152118682861328, "global_step": 455058, "epoch": 5482} {"train_loss": -27.07392692565918, "global_step": 455059, "epoch": 5482} {"train_loss": -27.35028648376465, "global_step": 455060, "epoch": 5482} {"train_loss": -27.252134323120117, "global_step": 455061, "epoch": 5482} {"train_loss": -26.930587768554688, "global_step": 455062, "epoch": 5482} {"train_loss": -27.21013832092285, "global_step": 455063, "epoch": 5482} {"train_loss": -27.449934005737305, "global_step": 455064, "epoch": 5482} {"train_loss": -27.273406982421875, "global_step": 455065, "epoch": 5482} {"train_loss": -27.11322021484375, "global_step": 455066, "epoch": 5482} {"train_loss": -27.178638458251953, "global_step": 455067, "epoch": 5482} {"train_loss": -27.053571701049805, "global_step": 455068, "epoch": 5482} {"train_loss": -27.005285263061523, "global_step": 455069, "epoch": 5482} {"train_loss": -27.300159454345703, "global_step": 455070, "epoch": 5482} {"train_loss": -27.13589859008789, "global_step": 455071, "epoch": 5482} {"train_loss": -27.29191017150879, "global_step": 455072, "epoch": 5482} {"train_loss": -27.19264030456543, "global_step": 455073, "epoch": 5482} {"train_loss": -27.10993003845215, "global_step": 455074, "epoch": 5482} {"train_loss": -27.252582550048828, "global_step": 455075, "epoch": 5482} {"train_loss": -26.690465927124023, "global_step": 455076, "epoch": 5482} {"train_loss": -27.482131958007812, "global_step": 455077, "epoch": 5482} {"train_loss": -27.2557430267334, "global_step": 455078, "epoch": 5482} {"train_loss": -27.279285430908203, "global_step": 455079, "epoch": 5482} {"train_loss": -27.286977767944336, "global_step": 455080, "epoch": 5482} {"train_loss": -27.1302433013916, "global_step": 455081, "epoch": 5482} {"train_loss": -27.270078659057617, "global_step": 455082, "epoch": 5482} {"train_loss": -27.13800621032715, "global_step": 455083, "epoch": 5482} {"train_loss": -26.986051559448242, "global_step": 455084, "epoch": 5482} {"train_loss": -26.65781593322754, "global_step": 455085, "epoch": 5482} {"train_loss": -26.808002471923828, "global_step": 455086, "epoch": 5482} {"train_loss": -27.13461685180664, "global_step": 455087, "epoch": 5482} {"train_loss": -26.908912038228596, "global_step": 455088, "epoch": 5482, "val_loss": 6565539.5} {"train_loss": -26.07575035095215, "global_step": 455089, "epoch": 5483} {"train_loss": -25.88081932067871, "global_step": 455090, "epoch": 5483} {"train_loss": -26.866662979125977, "global_step": 455091, "epoch": 5483} {"train_loss": -26.495223999023438, "global_step": 455092, "epoch": 5483} {"train_loss": -26.156232833862305, "global_step": 455093, "epoch": 5483} {"train_loss": -27.007246017456055, "global_step": 455094, "epoch": 5483} {"train_loss": -26.807239532470703, "global_step": 455095, "epoch": 5483} {"train_loss": -26.683734893798828, "global_step": 455096, "epoch": 5483} {"train_loss": -26.529438018798828, "global_step": 455097, "epoch": 5483} {"train_loss": -26.932086944580078, "global_step": 455098, "epoch": 5483} {"train_loss": -26.81589698791504, "global_step": 455099, "epoch": 5483} {"train_loss": -26.667572021484375, "global_step": 455100, "epoch": 5483} {"train_loss": -26.761112213134766, "global_step": 455101, "epoch": 5483} {"train_loss": -26.602216720581055, "global_step": 455102, "epoch": 5483} {"train_loss": -26.76651382446289, "global_step": 455103, "epoch": 5483} {"train_loss": -26.85873794555664, "global_step": 455104, "epoch": 5483} {"train_loss": -26.867645263671875, "global_step": 455105, "epoch": 5483} {"train_loss": -26.66181755065918, "global_step": 455106, "epoch": 5483} {"train_loss": -26.780115127563477, "global_step": 455107, "epoch": 5483} {"train_loss": -26.7943058013916, "global_step": 455108, "epoch": 5483} {"train_loss": -26.92158317565918, "global_step": 455109, "epoch": 5483} {"train_loss": -26.652944564819336, "global_step": 455110, "epoch": 5483} {"train_loss": -27.01665687561035, "global_step": 455111, "epoch": 5483} {"train_loss": -26.960769653320312, "global_step": 455112, "epoch": 5483} {"train_loss": -26.942407608032227, "global_step": 455113, "epoch": 5483} {"train_loss": -27.302907943725586, "global_step": 455114, "epoch": 5483} {"train_loss": -27.03607749938965, "global_step": 455115, "epoch": 5483} {"train_loss": -26.743793487548828, "global_step": 455116, "epoch": 5483} {"train_loss": -27.155065536499023, "global_step": 455117, "epoch": 5483} {"train_loss": -26.973861694335938, "global_step": 455118, "epoch": 5483} {"train_loss": -26.720983505249023, "global_step": 455119, "epoch": 5483} {"train_loss": -26.818082809448242, "global_step": 455120, "epoch": 5483} {"train_loss": -27.085554122924805, "global_step": 455121, "epoch": 5483} {"train_loss": -27.255762100219727, "global_step": 455122, "epoch": 5483} {"train_loss": -27.02557373046875, "global_step": 455123, "epoch": 5483} {"train_loss": -27.017398834228516, "global_step": 455124, "epoch": 5483} {"train_loss": -26.95363426208496, "global_step": 455125, "epoch": 5483} {"train_loss": -27.1350040435791, "global_step": 455126, "epoch": 5483} {"train_loss": -26.89820671081543, "global_step": 455127, "epoch": 5483} {"train_loss": -27.046247482299805, "global_step": 455128, "epoch": 5483} {"train_loss": -27.167627334594727, "global_step": 455129, "epoch": 5483} {"train_loss": -27.1726016998291, "global_step": 455130, "epoch": 5483} {"train_loss": -27.339340209960938, "global_step": 455131, "epoch": 5483} {"train_loss": -27.079252243041992, "global_step": 455132, "epoch": 5483} {"train_loss": -27.017187118530273, "global_step": 455133, "epoch": 5483} {"train_loss": -27.2578067779541, "global_step": 455134, "epoch": 5483} {"train_loss": -27.025501251220703, "global_step": 455135, "epoch": 5483} {"train_loss": -27.1010684967041, "global_step": 455136, "epoch": 5483} {"train_loss": -27.33027458190918, "global_step": 455137, "epoch": 5483} {"train_loss": -27.26025390625, "global_step": 455138, "epoch": 5483} {"train_loss": -26.977224349975586, "global_step": 455139, "epoch": 5483} {"train_loss": -27.349618911743164, "global_step": 455140, "epoch": 5483} {"train_loss": -27.090967178344727, "global_step": 455141, "epoch": 5483} {"train_loss": -27.00153160095215, "global_step": 455142, "epoch": 5483} {"train_loss": -27.41351890563965, "global_step": 455143, "epoch": 5483} {"train_loss": -27.034292221069336, "global_step": 455144, "epoch": 5483} {"train_loss": -27.089330673217773, "global_step": 455145, "epoch": 5483} {"train_loss": -26.653696060180664, "global_step": 455146, "epoch": 5483} {"train_loss": -27.16387367248535, "global_step": 455147, "epoch": 5483} {"train_loss": -26.979238510131836, "global_step": 455148, "epoch": 5483} {"train_loss": -26.941495895385742, "global_step": 455149, "epoch": 5483} {"train_loss": -27.0851993560791, "global_step": 455150, "epoch": 5483} {"train_loss": -27.0057315826416, "global_step": 455151, "epoch": 5483} {"train_loss": -26.938100814819336, "global_step": 455152, "epoch": 5483} {"train_loss": -27.478239059448242, "global_step": 455153, "epoch": 5483} {"train_loss": -27.039121627807617, "global_step": 455154, "epoch": 5483} {"train_loss": -27.3333683013916, "global_step": 455155, "epoch": 5483} {"train_loss": -26.969806671142578, "global_step": 455156, "epoch": 5483} {"train_loss": -27.704740524291992, "global_step": 455157, "epoch": 5483} {"train_loss": -27.185455322265625, "global_step": 455158, "epoch": 5483} {"train_loss": -26.795740127563477, "global_step": 455159, "epoch": 5483} {"train_loss": -27.363134384155273, "global_step": 455160, "epoch": 5483} {"train_loss": -27.086841583251953, "global_step": 455161, "epoch": 5483} {"train_loss": -26.90729331970215, "global_step": 455162, "epoch": 5483} {"train_loss": -26.504377365112305, "global_step": 455163, "epoch": 5483} {"train_loss": -27.3885555267334, "global_step": 455164, "epoch": 5483} {"train_loss": -26.951303482055664, "global_step": 455165, "epoch": 5483} {"train_loss": -27.006576538085938, "global_step": 455166, "epoch": 5483} {"train_loss": -26.68891716003418, "global_step": 455167, "epoch": 5483} {"train_loss": -27.282175064086914, "global_step": 455168, "epoch": 5483} {"train_loss": -26.5759334564209, "global_step": 455169, "epoch": 5483} {"train_loss": -27.160785675048828, "global_step": 455170, "epoch": 5483} {"train_loss": -26.968994209565313, "global_step": 455171, "epoch": 5483, "val_loss": 6609834.0} {"train_loss": -25.690006256103516, "global_step": 455172, "epoch": 5484} {"train_loss": -25.987401962280273, "global_step": 455173, "epoch": 5484} {"train_loss": -26.2998046875, "global_step": 455174, "epoch": 5484} {"train_loss": -25.81780433654785, "global_step": 455175, "epoch": 5484} {"train_loss": -26.59193992614746, "global_step": 455176, "epoch": 5484} {"train_loss": -26.039093017578125, "global_step": 455177, "epoch": 5484} {"train_loss": -26.42864418029785, "global_step": 455178, "epoch": 5484} {"train_loss": -26.368194580078125, "global_step": 455179, "epoch": 5484} {"train_loss": -26.350366592407227, "global_step": 455180, "epoch": 5484} {"train_loss": -26.34290885925293, "global_step": 455181, "epoch": 5484} {"train_loss": -26.602270126342773, "global_step": 455182, "epoch": 5484} {"train_loss": -26.429655075073242, "global_step": 455183, "epoch": 5484} {"train_loss": -26.587020874023438, "global_step": 455184, "epoch": 5484} {"train_loss": -26.74127197265625, "global_step": 455185, "epoch": 5484} {"train_loss": -26.198780059814453, "global_step": 455186, "epoch": 5484} {"train_loss": -26.688785552978516, "global_step": 455187, "epoch": 5484} {"train_loss": -26.875226974487305, "global_step": 455188, "epoch": 5484} {"train_loss": -26.6684627532959, "global_step": 455189, "epoch": 5484} {"train_loss": -26.719507217407227, "global_step": 455190, "epoch": 5484} {"train_loss": -26.660017013549805, "global_step": 455191, "epoch": 5484} {"train_loss": -26.79163932800293, "global_step": 455192, "epoch": 5484} {"train_loss": -26.69679069519043, "global_step": 455193, "epoch": 5484} {"train_loss": -26.77862548828125, "global_step": 455194, "epoch": 5484} {"train_loss": -26.610143661499023, "global_step": 455195, "epoch": 5484} {"train_loss": -26.893096923828125, "global_step": 455196, "epoch": 5484} {"train_loss": -27.0841064453125, "global_step": 455197, "epoch": 5484} {"train_loss": -27.06138038635254, "global_step": 455198, "epoch": 5484} {"train_loss": -26.821210861206055, "global_step": 455199, "epoch": 5484} {"train_loss": -27.137109756469727, "global_step": 455200, "epoch": 5484} {"train_loss": -26.43548583984375, "global_step": 455201, "epoch": 5484} {"train_loss": -27.078479766845703, "global_step": 455202, "epoch": 5484} {"train_loss": -26.884424209594727, "global_step": 455203, "epoch": 5484} {"train_loss": -26.991291046142578, "global_step": 455204, "epoch": 5484} {"train_loss": -26.996152877807617, "global_step": 455205, "epoch": 5484} {"train_loss": -27.175159454345703, "global_step": 455206, "epoch": 5484} {"train_loss": -26.679365158081055, "global_step": 455207, "epoch": 5484} {"train_loss": -26.834918975830078, "global_step": 455208, "epoch": 5484} {"train_loss": -27.041833877563477, "global_step": 455209, "epoch": 5484} {"train_loss": -27.1589412689209, "global_step": 455210, "epoch": 5484} {"train_loss": -26.863555908203125, "global_step": 455211, "epoch": 5484} {"train_loss": -27.207538604736328, "global_step": 455212, "epoch": 5484} {"train_loss": -26.86956214904785, "global_step": 455213, "epoch": 5484} {"train_loss": -26.823551177978516, "global_step": 455214, "epoch": 5484} {"train_loss": -27.145437240600586, "global_step": 455215, "epoch": 5484} {"train_loss": -27.484130859375, "global_step": 455216, "epoch": 5484} {"train_loss": -27.420700073242188, "global_step": 455217, "epoch": 5484} {"train_loss": -27.021194458007812, "global_step": 455218, "epoch": 5484} {"train_loss": -26.789947509765625, "global_step": 455219, "epoch": 5484} {"train_loss": -27.329282760620117, "global_step": 455220, "epoch": 5484} {"train_loss": -26.80853271484375, "global_step": 455221, "epoch": 5484} {"train_loss": -27.045801162719727, "global_step": 455222, "epoch": 5484} {"train_loss": -27.1777286529541, "global_step": 455223, "epoch": 5484} {"train_loss": -27.114490509033203, "global_step": 455224, "epoch": 5484} {"train_loss": -27.254758834838867, "global_step": 455225, "epoch": 5484} {"train_loss": -27.65852165222168, "global_step": 455226, "epoch": 5484} {"train_loss": -27.211408615112305, "global_step": 455227, "epoch": 5484} {"train_loss": -27.010717391967773, "global_step": 455228, "epoch": 5484} {"train_loss": -26.67352867126465, "global_step": 455229, "epoch": 5484} {"train_loss": -26.939786911010742, "global_step": 455230, "epoch": 5484} {"train_loss": -26.887128829956055, "global_step": 455231, "epoch": 5484} {"train_loss": -26.84064292907715, "global_step": 455232, "epoch": 5484} {"train_loss": -26.106740951538086, "global_step": 455233, "epoch": 5484} {"train_loss": -25.946142196655273, "global_step": 455234, "epoch": 5484} {"train_loss": -26.92530632019043, "global_step": 455235, "epoch": 5484} {"train_loss": -26.871469497680664, "global_step": 455236, "epoch": 5484} {"train_loss": -26.249216079711914, "global_step": 455237, "epoch": 5484} {"train_loss": -26.683515548706055, "global_step": 455238, "epoch": 5484} {"train_loss": -26.927331924438477, "global_step": 455239, "epoch": 5484} {"train_loss": -27.189468383789062, "global_step": 455240, "epoch": 5484} {"train_loss": -26.622970581054688, "global_step": 455241, "epoch": 5484} {"train_loss": -26.56658935546875, "global_step": 455242, "epoch": 5484} {"train_loss": -26.91470718383789, "global_step": 455243, "epoch": 5484} {"train_loss": -26.797712326049805, "global_step": 455244, "epoch": 5484} {"train_loss": -26.552310943603516, "global_step": 455245, "epoch": 5484} {"train_loss": -26.90481948852539, "global_step": 455246, "epoch": 5484} {"train_loss": -26.84381675720215, "global_step": 455247, "epoch": 5484} {"train_loss": -26.859113693237305, "global_step": 455248, "epoch": 5484} {"train_loss": -26.7781982421875, "global_step": 455249, "epoch": 5484} {"train_loss": -26.972986221313477, "global_step": 455250, "epoch": 5484} {"train_loss": -27.055810928344727, "global_step": 455251, "epoch": 5484} {"train_loss": -26.953840255737305, "global_step": 455252, "epoch": 5484} {"train_loss": -27.198957443237305, "global_step": 455253, "epoch": 5484} {"train_loss": -26.79677751839879, "global_step": 455254, "epoch": 5484, "val_loss": 6601426.0} {"train_loss": -26.770751953125, "global_step": 455255, "epoch": 5485} {"train_loss": -26.734268188476562, "global_step": 455256, "epoch": 5485} {"train_loss": -26.98651695251465, "global_step": 455257, "epoch": 5485} {"train_loss": -26.554931640625, "global_step": 455258, "epoch": 5485} {"train_loss": -26.735095977783203, "global_step": 455259, "epoch": 5485} {"train_loss": -26.80385398864746, "global_step": 455260, "epoch": 5485} {"train_loss": -26.973615646362305, "global_step": 455261, "epoch": 5485} {"train_loss": -26.612401962280273, "global_step": 455262, "epoch": 5485} {"train_loss": -26.8692684173584, "global_step": 455263, "epoch": 5485} {"train_loss": -26.36842155456543, "global_step": 455264, "epoch": 5485} {"train_loss": -26.738666534423828, "global_step": 455265, "epoch": 5485} {"train_loss": -26.96455192565918, "global_step": 455266, "epoch": 5485} {"train_loss": -27.175504684448242, "global_step": 455267, "epoch": 5485} {"train_loss": -26.797840118408203, "global_step": 455268, "epoch": 5485} {"train_loss": -26.848724365234375, "global_step": 455269, "epoch": 5485} {"train_loss": -27.00876235961914, "global_step": 455270, "epoch": 5485} {"train_loss": -26.97565269470215, "global_step": 455271, "epoch": 5485} {"train_loss": -27.396671295166016, "global_step": 455272, "epoch": 5485} {"train_loss": -26.776172637939453, "global_step": 455273, "epoch": 5485} {"train_loss": -27.488744735717773, "global_step": 455274, "epoch": 5485} {"train_loss": -27.050146102905273, "global_step": 455275, "epoch": 5485} {"train_loss": -27.461057662963867, "global_step": 455276, "epoch": 5485} {"train_loss": -26.88818359375, "global_step": 455277, "epoch": 5485} {"train_loss": -27.17376136779785, "global_step": 455278, "epoch": 5485} {"train_loss": -27.364307403564453, "global_step": 455279, "epoch": 5485} {"train_loss": -26.9999942779541, "global_step": 455280, "epoch": 5485} {"train_loss": -26.902606964111328, "global_step": 455281, "epoch": 5485} {"train_loss": -26.852201461791992, "global_step": 455282, "epoch": 5485} {"train_loss": -26.802831649780273, "global_step": 455283, "epoch": 5485} {"train_loss": -27.11512565612793, "global_step": 455284, "epoch": 5485} {"train_loss": -27.033447265625, "global_step": 455285, "epoch": 5485} {"train_loss": -26.93195152282715, "global_step": 455286, "epoch": 5485} {"train_loss": -27.400434494018555, "global_step": 455287, "epoch": 5485} {"train_loss": -27.396169662475586, "global_step": 455288, "epoch": 5485} {"train_loss": -27.056833267211914, "global_step": 455289, "epoch": 5485} {"train_loss": -26.869720458984375, "global_step": 455290, "epoch": 5485} {"train_loss": -27.535261154174805, "global_step": 455291, "epoch": 5485} {"train_loss": -27.000049591064453, "global_step": 455292, "epoch": 5485} {"train_loss": -26.874988555908203, "global_step": 455293, "epoch": 5485} {"train_loss": -27.17573356628418, "global_step": 455294, "epoch": 5485} {"train_loss": -27.474660873413086, "global_step": 455295, "epoch": 5485} {"train_loss": -27.390735626220703, "global_step": 455296, "epoch": 5485} {"train_loss": -26.954254150390625, "global_step": 455297, "epoch": 5485} {"train_loss": -27.261035919189453, "global_step": 455298, "epoch": 5485} {"train_loss": -27.385923385620117, "global_step": 455299, "epoch": 5485} {"train_loss": -27.42913818359375, "global_step": 455300, "epoch": 5485} {"train_loss": -27.08334732055664, "global_step": 455301, "epoch": 5485} {"train_loss": -27.51360511779785, "global_step": 455302, "epoch": 5485} {"train_loss": -27.373640060424805, "global_step": 455303, "epoch": 5485} {"train_loss": -27.461181640625, "global_step": 455304, "epoch": 5485} {"train_loss": -27.343069076538086, "global_step": 455305, "epoch": 5485} {"train_loss": -27.3658390045166, "global_step": 455306, "epoch": 5485} {"train_loss": -26.949111938476562, "global_step": 455307, "epoch": 5485} {"train_loss": -27.266681671142578, "global_step": 455308, "epoch": 5485} {"train_loss": -26.972427368164062, "global_step": 455309, "epoch": 5485} {"train_loss": -27.16719627380371, "global_step": 455310, "epoch": 5485} {"train_loss": -26.821548461914062, "global_step": 455311, "epoch": 5485} {"train_loss": -27.126850128173828, "global_step": 455312, "epoch": 5485} {"train_loss": -27.067529678344727, "global_step": 455313, "epoch": 5485} {"train_loss": -27.187658309936523, "global_step": 455314, "epoch": 5485} {"train_loss": -27.288360595703125, "global_step": 455315, "epoch": 5485} {"train_loss": -26.70477294921875, "global_step": 455316, "epoch": 5485} {"train_loss": -26.554752349853516, "global_step": 455317, "epoch": 5485} {"train_loss": -26.278329849243164, "global_step": 455318, "epoch": 5485} {"train_loss": -27.150068283081055, "global_step": 455319, "epoch": 5485} {"train_loss": -26.987171173095703, "global_step": 455320, "epoch": 5485} {"train_loss": -26.303625106811523, "global_step": 455321, "epoch": 5485} {"train_loss": -26.672815322875977, "global_step": 455322, "epoch": 5485} {"train_loss": -27.12814712524414, "global_step": 455323, "epoch": 5485} {"train_loss": -26.54365348815918, "global_step": 455324, "epoch": 5485} {"train_loss": -26.409149169921875, "global_step": 455325, "epoch": 5485} {"train_loss": -26.454797744750977, "global_step": 455326, "epoch": 5485} {"train_loss": -26.75677490234375, "global_step": 455327, "epoch": 5485} {"train_loss": -26.83381462097168, "global_step": 455328, "epoch": 5485} {"train_loss": -27.023595809936523, "global_step": 455329, "epoch": 5485} {"train_loss": -26.595407485961914, "global_step": 455330, "epoch": 5485} {"train_loss": -26.647382736206055, "global_step": 455331, "epoch": 5485} {"train_loss": -26.91718864440918, "global_step": 455332, "epoch": 5485} {"train_loss": -26.945310592651367, "global_step": 455333, "epoch": 5485} {"train_loss": -26.86049461364746, "global_step": 455334, "epoch": 5485} {"train_loss": -26.921253204345703, "global_step": 455335, "epoch": 5485} {"train_loss": -26.9746150970459, "global_step": 455336, "epoch": 5485} {"train_loss": -26.988618551966656, "global_step": 455337, "epoch": 5485, "val_loss": 6587455.0} {"train_loss": -26.039478302001953, "global_step": 455338, "epoch": 5486} {"train_loss": -26.40091323852539, "global_step": 455339, "epoch": 5486} {"train_loss": -26.39286231994629, "global_step": 455340, "epoch": 5486} {"train_loss": -26.41956901550293, "global_step": 455341, "epoch": 5486} {"train_loss": -26.563989639282227, "global_step": 455342, "epoch": 5486} {"train_loss": -26.79844093322754, "global_step": 455343, "epoch": 5486} {"train_loss": -26.839872360229492, "global_step": 455344, "epoch": 5486} {"train_loss": -26.67473793029785, "global_step": 455345, "epoch": 5486} {"train_loss": -27.141223907470703, "global_step": 455346, "epoch": 5486} {"train_loss": -26.773130416870117, "global_step": 455347, "epoch": 5486} {"train_loss": -26.9693546295166, "global_step": 455348, "epoch": 5486} {"train_loss": -26.513097763061523, "global_step": 455349, "epoch": 5486} {"train_loss": -26.568384170532227, "global_step": 455350, "epoch": 5486} {"train_loss": -26.958892822265625, "global_step": 455351, "epoch": 5486} {"train_loss": -26.555591583251953, "global_step": 455352, "epoch": 5486} {"train_loss": -27.099634170532227, "global_step": 455353, "epoch": 5486} {"train_loss": -26.733234405517578, "global_step": 455354, "epoch": 5486} {"train_loss": -26.760663986206055, "global_step": 455355, "epoch": 5486} {"train_loss": -27.302642822265625, "global_step": 455356, "epoch": 5486} {"train_loss": -27.12992286682129, "global_step": 455357, "epoch": 5486} {"train_loss": -27.2008113861084, "global_step": 455358, "epoch": 5486} {"train_loss": -27.089645385742188, "global_step": 455359, "epoch": 5486} {"train_loss": -27.473541259765625, "global_step": 455360, "epoch": 5486} {"train_loss": -27.000329971313477, "global_step": 455361, "epoch": 5486} {"train_loss": -26.800161361694336, "global_step": 455362, "epoch": 5486} {"train_loss": -26.972003936767578, "global_step": 455363, "epoch": 5486} {"train_loss": -27.121570587158203, "global_step": 455364, "epoch": 5486} {"train_loss": -27.21198844909668, "global_step": 455365, "epoch": 5486} {"train_loss": -27.34681510925293, "global_step": 455366, "epoch": 5486} {"train_loss": -26.987268447875977, "global_step": 455367, "epoch": 5486} {"train_loss": -26.83624267578125, "global_step": 455368, "epoch": 5486} {"train_loss": -27.227039337158203, "global_step": 455369, "epoch": 5486} {"train_loss": -27.067535400390625, "global_step": 455370, "epoch": 5486} {"train_loss": -27.224639892578125, "global_step": 455371, "epoch": 5486} {"train_loss": -27.14765739440918, "global_step": 455372, "epoch": 5486} {"train_loss": -27.303083419799805, "global_step": 455373, "epoch": 5486} {"train_loss": -27.193988800048828, "global_step": 455374, "epoch": 5486} {"train_loss": -27.050931930541992, "global_step": 455375, "epoch": 5486} {"train_loss": -27.200109481811523, "global_step": 455376, "epoch": 5486} {"train_loss": -26.96198081970215, "global_step": 455377, "epoch": 5486} {"train_loss": -26.794845581054688, "global_step": 455378, "epoch": 5486} {"train_loss": -26.535581588745117, "global_step": 455379, "epoch": 5486} {"train_loss": -26.518701553344727, "global_step": 455380, "epoch": 5486} {"train_loss": -27.05148696899414, "global_step": 455381, "epoch": 5486} {"train_loss": -26.951581954956055, "global_step": 455382, "epoch": 5486} {"train_loss": -26.892364501953125, "global_step": 455383, "epoch": 5486} {"train_loss": -27.027006149291992, "global_step": 455384, "epoch": 5486} {"train_loss": -27.11423683166504, "global_step": 455385, "epoch": 5486} {"train_loss": -27.1262149810791, "global_step": 455386, "epoch": 5486} {"train_loss": -27.2514705657959, "global_step": 455387, "epoch": 5486} {"train_loss": -26.79097557067871, "global_step": 455388, "epoch": 5486} {"train_loss": -27.144773483276367, "global_step": 455389, "epoch": 5486} {"train_loss": -27.122949600219727, "global_step": 455390, "epoch": 5486} {"train_loss": -27.428802490234375, "global_step": 455391, "epoch": 5486} {"train_loss": -26.854084014892578, "global_step": 455392, "epoch": 5486} {"train_loss": -27.255361557006836, "global_step": 455393, "epoch": 5486} {"train_loss": -27.021215438842773, "global_step": 455394, "epoch": 5486} {"train_loss": -27.219974517822266, "global_step": 455395, "epoch": 5486} {"train_loss": -27.461807250976562, "global_step": 455396, "epoch": 5486} {"train_loss": -27.3118839263916, "global_step": 455397, "epoch": 5486} {"train_loss": -27.14101219177246, "global_step": 455398, "epoch": 5486} {"train_loss": -27.16106605529785, "global_step": 455399, "epoch": 5486} {"train_loss": -26.930856704711914, "global_step": 455400, "epoch": 5486} {"train_loss": -27.539011001586914, "global_step": 455401, "epoch": 5486} {"train_loss": -26.934009552001953, "global_step": 455402, "epoch": 5486} {"train_loss": -27.012460708618164, "global_step": 455403, "epoch": 5486} {"train_loss": -27.0828857421875, "global_step": 455404, "epoch": 5486} {"train_loss": -27.44727897644043, "global_step": 455405, "epoch": 5486} {"train_loss": -27.192432403564453, "global_step": 455406, "epoch": 5486} {"train_loss": -27.26410484313965, "global_step": 455407, "epoch": 5486} {"train_loss": -27.2488956451416, "global_step": 455408, "epoch": 5486} {"train_loss": -27.117273330688477, "global_step": 455409, "epoch": 5486} {"train_loss": -27.5902042388916, "global_step": 455410, "epoch": 5486} {"train_loss": -27.32218360900879, "global_step": 455411, "epoch": 5486} {"train_loss": -26.908323287963867, "global_step": 455412, "epoch": 5486} {"train_loss": -26.8810977935791, "global_step": 455413, "epoch": 5486} {"train_loss": -26.86688804626465, "global_step": 455414, "epoch": 5486} {"train_loss": -27.432693481445312, "global_step": 455415, "epoch": 5486} {"train_loss": -27.233789443969727, "global_step": 455416, "epoch": 5486} {"train_loss": -27.45161247253418, "global_step": 455417, "epoch": 5486} {"train_loss": -26.75385856628418, "global_step": 455418, "epoch": 5486} {"train_loss": -27.326513290405273, "global_step": 455419, "epoch": 5486} {"train_loss": -27.028635990188782, "global_step": 455420, "epoch": 5486, "val_loss": 6702298.0} {"train_loss": -26.772674560546875, "global_step": 455421, "epoch": 5487} {"train_loss": -26.242034912109375, "global_step": 455422, "epoch": 5487} {"train_loss": -26.01969337463379, "global_step": 455423, "epoch": 5487} {"train_loss": -26.421960830688477, "global_step": 455424, "epoch": 5487} {"train_loss": -26.740985870361328, "global_step": 455425, "epoch": 5487} {"train_loss": -26.76993751525879, "global_step": 455426, "epoch": 5487} {"train_loss": -26.619897842407227, "global_step": 455427, "epoch": 5487} {"train_loss": -26.318811416625977, "global_step": 455428, "epoch": 5487} {"train_loss": -27.158288955688477, "global_step": 455429, "epoch": 5487} {"train_loss": -26.409381866455078, "global_step": 455430, "epoch": 5487} {"train_loss": -26.494232177734375, "global_step": 455431, "epoch": 5487} {"train_loss": -26.343778610229492, "global_step": 455432, "epoch": 5487} {"train_loss": -27.04731559753418, "global_step": 455433, "epoch": 5487} {"train_loss": -26.85542106628418, "global_step": 455434, "epoch": 5487} {"train_loss": -27.194921493530273, "global_step": 455435, "epoch": 5487} {"train_loss": -26.9130916595459, "global_step": 455436, "epoch": 5487} {"train_loss": -27.209070205688477, "global_step": 455437, "epoch": 5487} {"train_loss": -26.358442306518555, "global_step": 455438, "epoch": 5487} {"train_loss": -27.072721481323242, "global_step": 455439, "epoch": 5487} {"train_loss": -26.53303337097168, "global_step": 455440, "epoch": 5487} {"train_loss": -27.3023624420166, "global_step": 455441, "epoch": 5487} {"train_loss": -27.13518714904785, "global_step": 455442, "epoch": 5487} {"train_loss": -26.6697998046875, "global_step": 455443, "epoch": 5487} {"train_loss": -26.600040435791016, "global_step": 455444, "epoch": 5487} {"train_loss": -26.95631980895996, "global_step": 455445, "epoch": 5487} {"train_loss": -27.17447853088379, "global_step": 455446, "epoch": 5487} {"train_loss": -26.793970108032227, "global_step": 455447, "epoch": 5487} {"train_loss": -27.382892608642578, "global_step": 455448, "epoch": 5487} {"train_loss": -27.075239181518555, "global_step": 455449, "epoch": 5487} {"train_loss": -26.980222702026367, "global_step": 455450, "epoch": 5487} {"train_loss": -26.481006622314453, "global_step": 455451, "epoch": 5487} {"train_loss": -27.035324096679688, "global_step": 455452, "epoch": 5487} {"train_loss": -27.1291561126709, "global_step": 455453, "epoch": 5487} {"train_loss": -27.251638412475586, "global_step": 455454, "epoch": 5487} {"train_loss": -26.962970733642578, "global_step": 455455, "epoch": 5487} {"train_loss": -27.05372428894043, "global_step": 455456, "epoch": 5487} {"train_loss": -26.886646270751953, "global_step": 455457, "epoch": 5487} {"train_loss": -26.826704025268555, "global_step": 455458, "epoch": 5487} {"train_loss": -26.985361099243164, "global_step": 455459, "epoch": 5487} {"train_loss": -26.956113815307617, "global_step": 455460, "epoch": 5487} {"train_loss": -27.342260360717773, "global_step": 455461, "epoch": 5487} {"train_loss": -26.96661376953125, "global_step": 455462, "epoch": 5487} {"train_loss": -27.33966636657715, "global_step": 455463, "epoch": 5487} {"train_loss": -27.275989532470703, "global_step": 455464, "epoch": 5487} {"train_loss": -27.146442413330078, "global_step": 455465, "epoch": 5487} {"train_loss": -27.076345443725586, "global_step": 455466, "epoch": 5487} {"train_loss": -27.203855514526367, "global_step": 455467, "epoch": 5487} {"train_loss": -27.44227409362793, "global_step": 455468, "epoch": 5487} {"train_loss": -27.489242553710938, "global_step": 455469, "epoch": 5487} {"train_loss": -27.28639793395996, "global_step": 455470, "epoch": 5487} {"train_loss": -27.273038864135742, "global_step": 455471, "epoch": 5487} {"train_loss": -27.372482299804688, "global_step": 455472, "epoch": 5487} {"train_loss": -27.16167640686035, "global_step": 455473, "epoch": 5487} {"train_loss": -26.73447608947754, "global_step": 455474, "epoch": 5487} {"train_loss": -27.214162826538086, "global_step": 455475, "epoch": 5487} {"train_loss": -27.261213302612305, "global_step": 455476, "epoch": 5487} {"train_loss": -26.937952041625977, "global_step": 455477, "epoch": 5487} {"train_loss": -27.11455726623535, "global_step": 455478, "epoch": 5487} {"train_loss": -26.717041015625, "global_step": 455479, "epoch": 5487} {"train_loss": -27.319263458251953, "global_step": 455480, "epoch": 5487} {"train_loss": -27.14656639099121, "global_step": 455481, "epoch": 5487} {"train_loss": -27.14763832092285, "global_step": 455482, "epoch": 5487} {"train_loss": -27.32623291015625, "global_step": 455483, "epoch": 5487} {"train_loss": -26.881591796875, "global_step": 455484, "epoch": 5487} {"train_loss": -27.10503578186035, "global_step": 455485, "epoch": 5487} {"train_loss": -26.387975692749023, "global_step": 455486, "epoch": 5487} {"train_loss": -26.79803466796875, "global_step": 455487, "epoch": 5487} {"train_loss": -27.126773834228516, "global_step": 455488, "epoch": 5487} {"train_loss": -26.503326416015625, "global_step": 455489, "epoch": 5487} {"train_loss": -26.964139938354492, "global_step": 455490, "epoch": 5487} {"train_loss": -27.1290225982666, "global_step": 455491, "epoch": 5487} {"train_loss": -27.249618530273438, "global_step": 455492, "epoch": 5487} {"train_loss": -26.687524795532227, "global_step": 455493, "epoch": 5487} {"train_loss": -26.604766845703125, "global_step": 455494, "epoch": 5487} {"train_loss": -27.10683250427246, "global_step": 455495, "epoch": 5487} {"train_loss": -27.12049674987793, "global_step": 455496, "epoch": 5487} {"train_loss": -27.15093994140625, "global_step": 455497, "epoch": 5487} {"train_loss": -26.98565101623535, "global_step": 455498, "epoch": 5487} {"train_loss": -27.281335830688477, "global_step": 455499, "epoch": 5487} {"train_loss": -27.071508407592773, "global_step": 455500, "epoch": 5487} {"train_loss": -27.2581844329834, "global_step": 455501, "epoch": 5487} {"train_loss": -27.12664222717285, "global_step": 455502, "epoch": 5487} {"train_loss": -26.974207475960974, "global_step": 455503, "epoch": 5487, "val_loss": 6597259.0} {"train_loss": -26.366113662719727, "global_step": 455504, "epoch": 5488} {"train_loss": -26.001312255859375, "global_step": 455505, "epoch": 5488} {"train_loss": -26.233051300048828, "global_step": 455506, "epoch": 5488} {"train_loss": -26.0574951171875, "global_step": 455507, "epoch": 5488} {"train_loss": -26.265111923217773, "global_step": 455508, "epoch": 5488} {"train_loss": -26.50967788696289, "global_step": 455509, "epoch": 5488} {"train_loss": -26.377721786499023, "global_step": 455510, "epoch": 5488} {"train_loss": -26.53985595703125, "global_step": 455511, "epoch": 5488} {"train_loss": -26.582502365112305, "global_step": 455512, "epoch": 5488} {"train_loss": -26.543720245361328, "global_step": 455513, "epoch": 5488} {"train_loss": -26.6525821685791, "global_step": 455514, "epoch": 5488} {"train_loss": -26.99492835998535, "global_step": 455515, "epoch": 5488} {"train_loss": -26.2052059173584, "global_step": 455516, "epoch": 5488} {"train_loss": -26.6920108795166, "global_step": 455517, "epoch": 5488} {"train_loss": -26.796497344970703, "global_step": 455518, "epoch": 5488} {"train_loss": -26.642026901245117, "global_step": 455519, "epoch": 5488} {"train_loss": -26.565534591674805, "global_step": 455520, "epoch": 5488} {"train_loss": -27.033353805541992, "global_step": 455521, "epoch": 5488} {"train_loss": -26.89143180847168, "global_step": 455522, "epoch": 5488} {"train_loss": -26.740921020507812, "global_step": 455523, "epoch": 5488} {"train_loss": -26.78032875061035, "global_step": 455524, "epoch": 5488} {"train_loss": -27.114606857299805, "global_step": 455525, "epoch": 5488} {"train_loss": -26.821304321289062, "global_step": 455526, "epoch": 5488} {"train_loss": -26.772968292236328, "global_step": 455527, "epoch": 5488} {"train_loss": -26.686120986938477, "global_step": 455528, "epoch": 5488} {"train_loss": -26.7904109954834, "global_step": 455529, "epoch": 5488} {"train_loss": -27.13443374633789, "global_step": 455530, "epoch": 5488} {"train_loss": -27.20212173461914, "global_step": 455531, "epoch": 5488} {"train_loss": -26.79933738708496, "global_step": 455532, "epoch": 5488} {"train_loss": -26.943561553955078, "global_step": 455533, "epoch": 5488} {"train_loss": -26.95849609375, "global_step": 455534, "epoch": 5488} {"train_loss": -27.09404945373535, "global_step": 455535, "epoch": 5488} {"train_loss": -26.954572677612305, "global_step": 455536, "epoch": 5488} {"train_loss": -27.282169342041016, "global_step": 455537, "epoch": 5488} {"train_loss": -27.188467025756836, "global_step": 455538, "epoch": 5488} {"train_loss": -27.249561309814453, "global_step": 455539, "epoch": 5488} {"train_loss": -27.403043746948242, "global_step": 455540, "epoch": 5488} {"train_loss": -27.338987350463867, "global_step": 455541, "epoch": 5488} {"train_loss": -27.060626983642578, "global_step": 455542, "epoch": 5488} {"train_loss": -27.6218318939209, "global_step": 455543, "epoch": 5488} {"train_loss": -27.148462295532227, "global_step": 455544, "epoch": 5488} {"train_loss": -26.762720108032227, "global_step": 455545, "epoch": 5488} {"train_loss": -27.186269760131836, "global_step": 455546, "epoch": 5488} {"train_loss": -27.084552764892578, "global_step": 455547, "epoch": 5488} {"train_loss": -27.01409912109375, "global_step": 455548, "epoch": 5488} {"train_loss": -27.333478927612305, "global_step": 455549, "epoch": 5488} {"train_loss": -27.27011489868164, "global_step": 455550, "epoch": 5488} {"train_loss": -27.25864601135254, "global_step": 455551, "epoch": 5488} {"train_loss": -27.42351722717285, "global_step": 455552, "epoch": 5488} {"train_loss": -27.05316734313965, "global_step": 455553, "epoch": 5488} {"train_loss": -27.463586807250977, "global_step": 455554, "epoch": 5488} {"train_loss": -27.13210105895996, "global_step": 455555, "epoch": 5488} {"train_loss": -27.29803466796875, "global_step": 455556, "epoch": 5488} {"train_loss": -27.170169830322266, "global_step": 455557, "epoch": 5488} {"train_loss": -27.508529663085938, "global_step": 455558, "epoch": 5488} {"train_loss": -27.137165069580078, "global_step": 455559, "epoch": 5488} {"train_loss": -26.811664581298828, "global_step": 455560, "epoch": 5488} {"train_loss": -27.03925132751465, "global_step": 455561, "epoch": 5488} {"train_loss": -27.278310775756836, "global_step": 455562, "epoch": 5488} {"train_loss": -26.96978187561035, "global_step": 455563, "epoch": 5488} {"train_loss": -26.951995849609375, "global_step": 455564, "epoch": 5488} {"train_loss": -27.2224178314209, "global_step": 455565, "epoch": 5488} {"train_loss": -27.0292911529541, "global_step": 455566, "epoch": 5488} {"train_loss": -27.072418212890625, "global_step": 455567, "epoch": 5488} {"train_loss": -27.134748458862305, "global_step": 455568, "epoch": 5488} {"train_loss": -27.518569946289062, "global_step": 455569, "epoch": 5488} {"train_loss": -26.986438751220703, "global_step": 455570, "epoch": 5488} {"train_loss": -26.924772262573242, "global_step": 455571, "epoch": 5488} {"train_loss": -26.991931915283203, "global_step": 455572, "epoch": 5488} {"train_loss": -27.380218505859375, "global_step": 455573, "epoch": 5488} {"train_loss": -27.328937530517578, "global_step": 455574, "epoch": 5488} {"train_loss": -27.261808395385742, "global_step": 455575, "epoch": 5488} {"train_loss": -27.006574630737305, "global_step": 455576, "epoch": 5488} {"train_loss": -26.912158966064453, "global_step": 455577, "epoch": 5488} {"train_loss": -27.158735275268555, "global_step": 455578, "epoch": 5488} {"train_loss": -26.845539093017578, "global_step": 455579, "epoch": 5488} {"train_loss": -27.01679039001465, "global_step": 455580, "epoch": 5488} {"train_loss": -26.965585708618164, "global_step": 455581, "epoch": 5488} {"train_loss": -27.43642234802246, "global_step": 455582, "epoch": 5488} {"train_loss": -27.023345947265625, "global_step": 455583, "epoch": 5488} {"train_loss": -26.910018920898438, "global_step": 455584, "epoch": 5488} {"train_loss": -27.421512603759766, "global_step": 455585, "epoch": 5488} {"train_loss": -26.97245147429317, "global_step": 455586, "epoch": 5488, "val_loss": 6627274.0} {"train_loss": -25.9351806640625, "global_step": 455587, "epoch": 5489} {"train_loss": -26.064804077148438, "global_step": 455588, "epoch": 5489} {"train_loss": -26.94935417175293, "global_step": 455589, "epoch": 5489} {"train_loss": -26.233306884765625, "global_step": 455590, "epoch": 5489} {"train_loss": -26.881372451782227, "global_step": 455591, "epoch": 5489} {"train_loss": -26.76898765563965, "global_step": 455592, "epoch": 5489} {"train_loss": -26.670303344726562, "global_step": 455593, "epoch": 5489} {"train_loss": -26.6340389251709, "global_step": 455594, "epoch": 5489} {"train_loss": -26.535367965698242, "global_step": 455595, "epoch": 5489} {"train_loss": -26.41168785095215, "global_step": 455596, "epoch": 5489} {"train_loss": -26.737003326416016, "global_step": 455597, "epoch": 5489} {"train_loss": -26.298995971679688, "global_step": 455598, "epoch": 5489} {"train_loss": -26.46567153930664, "global_step": 455599, "epoch": 5489} {"train_loss": -26.632755279541016, "global_step": 455600, "epoch": 5489} {"train_loss": -27.21746826171875, "global_step": 455601, "epoch": 5489} {"train_loss": -26.8331356048584, "global_step": 455602, "epoch": 5489} {"train_loss": -27.099903106689453, "global_step": 455603, "epoch": 5489} {"train_loss": -26.65943717956543, "global_step": 455604, "epoch": 5489} {"train_loss": -26.86992835998535, "global_step": 455605, "epoch": 5489} {"train_loss": -26.821699142456055, "global_step": 455606, "epoch": 5489} {"train_loss": -26.877887725830078, "global_step": 455607, "epoch": 5489} {"train_loss": -26.457117080688477, "global_step": 455608, "epoch": 5489} {"train_loss": -26.73197364807129, "global_step": 455609, "epoch": 5489} {"train_loss": -26.675405502319336, "global_step": 455610, "epoch": 5489} {"train_loss": -26.8043155670166, "global_step": 455611, "epoch": 5489} {"train_loss": -26.9783992767334, "global_step": 455612, "epoch": 5489} {"train_loss": -26.57972526550293, "global_step": 455613, "epoch": 5489} {"train_loss": -26.9401798248291, "global_step": 455614, "epoch": 5489} {"train_loss": -26.962636947631836, "global_step": 455615, "epoch": 5489} {"train_loss": -27.280935287475586, "global_step": 455616, "epoch": 5489} {"train_loss": -27.1217098236084, "global_step": 455617, "epoch": 5489} {"train_loss": -26.64786720275879, "global_step": 455618, "epoch": 5489} {"train_loss": -26.871692657470703, "global_step": 455619, "epoch": 5489} {"train_loss": -26.821325302124023, "global_step": 455620, "epoch": 5489} {"train_loss": -27.261646270751953, "global_step": 455621, "epoch": 5489} {"train_loss": -27.396209716796875, "global_step": 455622, "epoch": 5489} {"train_loss": -26.934911727905273, "global_step": 455623, "epoch": 5489} {"train_loss": -27.30856704711914, "global_step": 455624, "epoch": 5489} {"train_loss": -26.87757682800293, "global_step": 455625, "epoch": 5489} {"train_loss": -27.334354400634766, "global_step": 455626, "epoch": 5489} {"train_loss": -27.19953727722168, "global_step": 455627, "epoch": 5489} {"train_loss": -27.234304428100586, "global_step": 455628, "epoch": 5489} {"train_loss": -27.055612564086914, "global_step": 455629, "epoch": 5489} {"train_loss": -27.436445236206055, "global_step": 455630, "epoch": 5489} {"train_loss": -27.221725463867188, "global_step": 455631, "epoch": 5489} {"train_loss": -27.553491592407227, "global_step": 455632, "epoch": 5489} {"train_loss": -26.95148277282715, "global_step": 455633, "epoch": 5489} {"train_loss": -27.304655075073242, "global_step": 455634, "epoch": 5489} {"train_loss": -26.83868980407715, "global_step": 455635, "epoch": 5489} {"train_loss": -26.855566024780273, "global_step": 455636, "epoch": 5489} {"train_loss": -27.11420249938965, "global_step": 455637, "epoch": 5489} {"train_loss": -27.319608688354492, "global_step": 455638, "epoch": 5489} {"train_loss": -27.018329620361328, "global_step": 455639, "epoch": 5489} {"train_loss": -27.343109130859375, "global_step": 455640, "epoch": 5489} {"train_loss": -27.41947364807129, "global_step": 455641, "epoch": 5489} {"train_loss": -27.179061889648438, "global_step": 455642, "epoch": 5489} {"train_loss": -26.76519203186035, "global_step": 455643, "epoch": 5489} {"train_loss": -27.281797409057617, "global_step": 455644, "epoch": 5489} {"train_loss": -26.566755294799805, "global_step": 455645, "epoch": 5489} {"train_loss": -26.84319496154785, "global_step": 455646, "epoch": 5489} {"train_loss": -27.087860107421875, "global_step": 455647, "epoch": 5489} {"train_loss": -27.29705810546875, "global_step": 455648, "epoch": 5489} {"train_loss": -26.93524742126465, "global_step": 455649, "epoch": 5489} {"train_loss": -27.085851669311523, "global_step": 455650, "epoch": 5489} {"train_loss": -27.12211036682129, "global_step": 455651, "epoch": 5489} {"train_loss": -26.716388702392578, "global_step": 455652, "epoch": 5489} {"train_loss": -26.882165908813477, "global_step": 455653, "epoch": 5489} {"train_loss": -26.894399642944336, "global_step": 455654, "epoch": 5489} {"train_loss": -26.653913497924805, "global_step": 455655, "epoch": 5489} {"train_loss": -26.936948776245117, "global_step": 455656, "epoch": 5489} {"train_loss": -26.965787887573242, "global_step": 455657, "epoch": 5489} {"train_loss": -26.8886661529541, "global_step": 455658, "epoch": 5489} {"train_loss": -26.6044921875, "global_step": 455659, "epoch": 5489} {"train_loss": -26.772382736206055, "global_step": 455660, "epoch": 5489} {"train_loss": -26.992176055908203, "global_step": 455661, "epoch": 5489} {"train_loss": -27.19947624206543, "global_step": 455662, "epoch": 5489} {"train_loss": -26.817419052124023, "global_step": 455663, "epoch": 5489} {"train_loss": -26.97517204284668, "global_step": 455664, "epoch": 5489} {"train_loss": -26.938894271850586, "global_step": 455665, "epoch": 5489} {"train_loss": -27.10601234436035, "global_step": 455666, "epoch": 5489} {"train_loss": -26.90591812133789, "global_step": 455667, "epoch": 5489} {"train_loss": -27.152685165405273, "global_step": 455668, "epoch": 5489} {"train_loss": -26.929425756615327, "global_step": 455669, "epoch": 5489, "val_loss": 6483205.0} {"train_loss": -26.423124313354492, "global_step": 455670, "epoch": 5490} {"train_loss": -26.175668716430664, "global_step": 455671, "epoch": 5490} {"train_loss": -26.698328018188477, "global_step": 455672, "epoch": 5490} {"train_loss": -26.390628814697266, "global_step": 455673, "epoch": 5490} {"train_loss": -26.279870986938477, "global_step": 455674, "epoch": 5490} {"train_loss": -26.547021865844727, "global_step": 455675, "epoch": 5490} {"train_loss": -26.296964645385742, "global_step": 455676, "epoch": 5490} {"train_loss": -26.67795181274414, "global_step": 455677, "epoch": 5490} {"train_loss": -27.009119033813477, "global_step": 455678, "epoch": 5490} {"train_loss": -26.91517448425293, "global_step": 455679, "epoch": 5490} {"train_loss": -26.748441696166992, "global_step": 455680, "epoch": 5490} {"train_loss": -26.644927978515625, "global_step": 455681, "epoch": 5490} {"train_loss": -26.685922622680664, "global_step": 455682, "epoch": 5490} {"train_loss": -26.6278076171875, "global_step": 455683, "epoch": 5490} {"train_loss": -27.172748565673828, "global_step": 455684, "epoch": 5490} {"train_loss": -26.88958740234375, "global_step": 455685, "epoch": 5490} {"train_loss": -26.856037139892578, "global_step": 455686, "epoch": 5490} {"train_loss": -27.076330184936523, "global_step": 455687, "epoch": 5490} {"train_loss": -26.867841720581055, "global_step": 455688, "epoch": 5490} {"train_loss": -27.08941650390625, "global_step": 455689, "epoch": 5490} {"train_loss": -27.1004638671875, "global_step": 455690, "epoch": 5490} {"train_loss": -27.01263427734375, "global_step": 455691, "epoch": 5490} {"train_loss": -26.847782135009766, "global_step": 455692, "epoch": 5490} {"train_loss": -27.24091148376465, "global_step": 455693, "epoch": 5490} {"train_loss": -27.07171630859375, "global_step": 455694, "epoch": 5490} {"train_loss": -27.321979522705078, "global_step": 455695, "epoch": 5490} {"train_loss": -27.27033042907715, "global_step": 455696, "epoch": 5490} {"train_loss": -27.20130729675293, "global_step": 455697, "epoch": 5490} {"train_loss": -27.270532608032227, "global_step": 455698, "epoch": 5490} {"train_loss": -27.347400665283203, "global_step": 455699, "epoch": 5490} {"train_loss": -26.83734703063965, "global_step": 455700, "epoch": 5490} {"train_loss": -27.028213500976562, "global_step": 455701, "epoch": 5490} {"train_loss": -27.12836265563965, "global_step": 455702, "epoch": 5490} {"train_loss": -27.217859268188477, "global_step": 455703, "epoch": 5490} {"train_loss": -27.152063369750977, "global_step": 455704, "epoch": 5490} {"train_loss": -27.465240478515625, "global_step": 455705, "epoch": 5490} {"train_loss": -27.03203773498535, "global_step": 455706, "epoch": 5490} {"train_loss": -27.312788009643555, "global_step": 455707, "epoch": 5490} {"train_loss": -27.501184463500977, "global_step": 455708, "epoch": 5490} {"train_loss": -27.219879150390625, "global_step": 455709, "epoch": 5490} {"train_loss": -27.179534912109375, "global_step": 455710, "epoch": 5490} {"train_loss": -26.79438591003418, "global_step": 455711, "epoch": 5490} {"train_loss": -26.677967071533203, "global_step": 455712, "epoch": 5490} {"train_loss": -27.29146385192871, "global_step": 455713, "epoch": 5490} {"train_loss": -27.42042350769043, "global_step": 455714, "epoch": 5490} {"train_loss": -27.214181900024414, "global_step": 455715, "epoch": 5490} {"train_loss": -27.365589141845703, "global_step": 455716, "epoch": 5490} {"train_loss": -27.153705596923828, "global_step": 455717, "epoch": 5490} {"train_loss": -26.73964500427246, "global_step": 455718, "epoch": 5490} {"train_loss": -26.805362701416016, "global_step": 455719, "epoch": 5490} {"train_loss": -26.580169677734375, "global_step": 455720, "epoch": 5490} {"train_loss": -26.55470848083496, "global_step": 455721, "epoch": 5490} {"train_loss": -26.33888053894043, "global_step": 455722, "epoch": 5490} {"train_loss": -26.486602783203125, "global_step": 455723, "epoch": 5490} {"train_loss": -26.40003776550293, "global_step": 455724, "epoch": 5490} {"train_loss": -26.943639755249023, "global_step": 455725, "epoch": 5490} {"train_loss": -26.87051773071289, "global_step": 455726, "epoch": 5490} {"train_loss": -26.411548614501953, "global_step": 455727, "epoch": 5490} {"train_loss": -26.745697021484375, "global_step": 455728, "epoch": 5490} {"train_loss": -26.805200576782227, "global_step": 455729, "epoch": 5490} {"train_loss": -26.844852447509766, "global_step": 455730, "epoch": 5490} {"train_loss": -27.031558990478516, "global_step": 455731, "epoch": 5490} {"train_loss": -26.917993545532227, "global_step": 455732, "epoch": 5490} {"train_loss": -27.08257484436035, "global_step": 455733, "epoch": 5490} {"train_loss": -26.906253814697266, "global_step": 455734, "epoch": 5490} {"train_loss": -27.221912384033203, "global_step": 455735, "epoch": 5490} {"train_loss": -27.058664321899414, "global_step": 455736, "epoch": 5490} {"train_loss": -27.0063419342041, "global_step": 455737, "epoch": 5490} {"train_loss": -27.066944122314453, "global_step": 455738, "epoch": 5490} {"train_loss": -27.133975982666016, "global_step": 455739, "epoch": 5490} {"train_loss": -27.086355209350586, "global_step": 455740, "epoch": 5490} {"train_loss": -27.268238067626953, "global_step": 455741, "epoch": 5490} {"train_loss": -27.059207916259766, "global_step": 455742, "epoch": 5490} {"train_loss": -27.35247802734375, "global_step": 455743, "epoch": 5490} {"train_loss": -27.180356979370117, "global_step": 455744, "epoch": 5490} {"train_loss": -26.97536277770996, "global_step": 455745, "epoch": 5490} {"train_loss": -26.95114517211914, "global_step": 455746, "epoch": 5490} {"train_loss": -27.0411319732666, "global_step": 455747, "epoch": 5490} {"train_loss": -27.10210609436035, "global_step": 455748, "epoch": 5490} {"train_loss": -27.091806411743164, "global_step": 455749, "epoch": 5490} {"train_loss": -27.331113815307617, "global_step": 455750, "epoch": 5490} {"train_loss": -27.25904655456543, "global_step": 455751, "epoch": 5490} {"train_loss": -26.96330750706684, "global_step": 455752, "epoch": 5490, "val_loss": 6529018.0} {"train_loss": -26.886478424072266, "global_step": 455753, "epoch": 5491} {"train_loss": -27.179880142211914, "global_step": 455754, "epoch": 5491} {"train_loss": -26.58319091796875, "global_step": 455755, "epoch": 5491} {"train_loss": -27.141767501831055, "global_step": 455756, "epoch": 5491} {"train_loss": -27.064350128173828, "global_step": 455757, "epoch": 5491} {"train_loss": -27.012680053710938, "global_step": 455758, "epoch": 5491} {"train_loss": -27.07941246032715, "global_step": 455759, "epoch": 5491} {"train_loss": -27.259260177612305, "global_step": 455760, "epoch": 5491} {"train_loss": -27.135080337524414, "global_step": 455761, "epoch": 5491} {"train_loss": -27.073415756225586, "global_step": 455762, "epoch": 5491} {"train_loss": -27.063642501831055, "global_step": 455763, "epoch": 5491} {"train_loss": -27.23560905456543, "global_step": 455764, "epoch": 5491} {"train_loss": -26.886823654174805, "global_step": 455765, "epoch": 5491} {"train_loss": -27.3727970123291, "global_step": 455766, "epoch": 5491} {"train_loss": -27.186033248901367, "global_step": 455767, "epoch": 5491} {"train_loss": -27.139379501342773, "global_step": 455768, "epoch": 5491} {"train_loss": -27.347076416015625, "global_step": 455769, "epoch": 5491} {"train_loss": -27.14031982421875, "global_step": 455770, "epoch": 5491} {"train_loss": -26.9139461517334, "global_step": 455771, "epoch": 5491} {"train_loss": -27.173994064331055, "global_step": 455772, "epoch": 5491} {"train_loss": -26.878997802734375, "global_step": 455773, "epoch": 5491} {"train_loss": -27.18354606628418, "global_step": 455774, "epoch": 5491} {"train_loss": -27.199848175048828, "global_step": 455775, "epoch": 5491} {"train_loss": -26.905963897705078, "global_step": 455776, "epoch": 5491} {"train_loss": -26.814544677734375, "global_step": 455777, "epoch": 5491} {"train_loss": -26.98915672302246, "global_step": 455778, "epoch": 5491} {"train_loss": -26.999555587768555, "global_step": 455779, "epoch": 5491} {"train_loss": -27.250782012939453, "global_step": 455780, "epoch": 5491} {"train_loss": -27.10748291015625, "global_step": 455781, "epoch": 5491} {"train_loss": -27.31300926208496, "global_step": 455782, "epoch": 5491} {"train_loss": -27.11298179626465, "global_step": 455783, "epoch": 5491} {"train_loss": -27.274961471557617, "global_step": 455784, "epoch": 5491} {"train_loss": -27.20086669921875, "global_step": 455785, "epoch": 5491} {"train_loss": -26.963642120361328, "global_step": 455786, "epoch": 5491} {"train_loss": -27.201507568359375, "global_step": 455787, "epoch": 5491} {"train_loss": -26.938861846923828, "global_step": 455788, "epoch": 5491} {"train_loss": -27.152545928955078, "global_step": 455789, "epoch": 5491} {"train_loss": -27.16465187072754, "global_step": 455790, "epoch": 5491} {"train_loss": -26.89759635925293, "global_step": 455791, "epoch": 5491} {"train_loss": -27.140167236328125, "global_step": 455792, "epoch": 5491} {"train_loss": -27.4066219329834, "global_step": 455793, "epoch": 5491} {"train_loss": -27.373310089111328, "global_step": 455794, "epoch": 5491} {"train_loss": -27.174545288085938, "global_step": 455795, "epoch": 5491} {"train_loss": -27.16163444519043, "global_step": 455796, "epoch": 5491} {"train_loss": -27.246713638305664, "global_step": 455797, "epoch": 5491} {"train_loss": -27.05182456970215, "global_step": 455798, "epoch": 5491} {"train_loss": -26.870325088500977, "global_step": 455799, "epoch": 5491} {"train_loss": -27.292251586914062, "global_step": 455800, "epoch": 5491} {"train_loss": -26.915292739868164, "global_step": 455801, "epoch": 5491} {"train_loss": -27.00311279296875, "global_step": 455802, "epoch": 5491} {"train_loss": -26.900604248046875, "global_step": 455803, "epoch": 5491} {"train_loss": -26.867279052734375, "global_step": 455804, "epoch": 5491} {"train_loss": -27.117446899414062, "global_step": 455805, "epoch": 5491} {"train_loss": -27.026432037353516, "global_step": 455806, "epoch": 5491} {"train_loss": -26.9188232421875, "global_step": 455807, "epoch": 5491} {"train_loss": -27.40925407409668, "global_step": 455808, "epoch": 5491} {"train_loss": -26.892969131469727, "global_step": 455809, "epoch": 5491} {"train_loss": -26.981428146362305, "global_step": 455810, "epoch": 5491} {"train_loss": -26.361448287963867, "global_step": 455811, "epoch": 5491} {"train_loss": -26.8392333984375, "global_step": 455812, "epoch": 5491} {"train_loss": -26.909666061401367, "global_step": 455813, "epoch": 5491} {"train_loss": -26.74519157409668, "global_step": 455814, "epoch": 5491} {"train_loss": -26.88897132873535, "global_step": 455815, "epoch": 5491} {"train_loss": -26.758581161499023, "global_step": 455816, "epoch": 5491} {"train_loss": -26.725431442260742, "global_step": 455817, "epoch": 5491} {"train_loss": -27.066892623901367, "global_step": 455818, "epoch": 5491} {"train_loss": -26.8880672454834, "global_step": 455819, "epoch": 5491} {"train_loss": -26.939956665039062, "global_step": 455820, "epoch": 5491} {"train_loss": -27.214786529541016, "global_step": 455821, "epoch": 5491} {"train_loss": -26.951007843017578, "global_step": 455822, "epoch": 5491} {"train_loss": -26.67740821838379, "global_step": 455823, "epoch": 5491} {"train_loss": -27.134180068969727, "global_step": 455824, "epoch": 5491} {"train_loss": -27.122802734375, "global_step": 455825, "epoch": 5491} {"train_loss": -27.29902458190918, "global_step": 455826, "epoch": 5491} {"train_loss": -27.080005645751953, "global_step": 455827, "epoch": 5491} {"train_loss": -27.191619873046875, "global_step": 455828, "epoch": 5491} {"train_loss": -27.0449275970459, "global_step": 455829, "epoch": 5491} {"train_loss": -26.96504783630371, "global_step": 455830, "epoch": 5491} {"train_loss": -27.0714168548584, "global_step": 455831, "epoch": 5491} {"train_loss": -27.332447052001953, "global_step": 455832, "epoch": 5491} {"train_loss": -26.829397201538086, "global_step": 455833, "epoch": 5491} {"train_loss": -27.222742080688477, "global_step": 455834, "epoch": 5491} {"train_loss": -27.042065792773144, "global_step": 455835, "epoch": 5491, "val_loss": 6590733.0} {"train_loss": -26.890838623046875, "global_step": 455836, "epoch": 5492} {"train_loss": -26.45111656188965, "global_step": 455837, "epoch": 5492} {"train_loss": -26.999225616455078, "global_step": 455838, "epoch": 5492} {"train_loss": -26.976123809814453, "global_step": 455839, "epoch": 5492} {"train_loss": -26.856109619140625, "global_step": 455840, "epoch": 5492} {"train_loss": -26.74000358581543, "global_step": 455841, "epoch": 5492} {"train_loss": -27.082233428955078, "global_step": 455842, "epoch": 5492} {"train_loss": -26.884973526000977, "global_step": 455843, "epoch": 5492} {"train_loss": -26.9970645904541, "global_step": 455844, "epoch": 5492} {"train_loss": -26.89841079711914, "global_step": 455845, "epoch": 5492} {"train_loss": -26.871747970581055, "global_step": 455846, "epoch": 5492} {"train_loss": -27.432281494140625, "global_step": 455847, "epoch": 5492} {"train_loss": -27.094327926635742, "global_step": 455848, "epoch": 5492} {"train_loss": -26.700971603393555, "global_step": 455849, "epoch": 5492} {"train_loss": -27.196197509765625, "global_step": 455850, "epoch": 5492} {"train_loss": -27.15159034729004, "global_step": 455851, "epoch": 5492} {"train_loss": -27.422094345092773, "global_step": 455852, "epoch": 5492} {"train_loss": -27.121198654174805, "global_step": 455853, "epoch": 5492} {"train_loss": -27.278884887695312, "global_step": 455854, "epoch": 5492} {"train_loss": -27.304534912109375, "global_step": 455855, "epoch": 5492} {"train_loss": -26.944730758666992, "global_step": 455856, "epoch": 5492} {"train_loss": -27.15101432800293, "global_step": 455857, "epoch": 5492} {"train_loss": -26.84807777404785, "global_step": 455858, "epoch": 5492} {"train_loss": -27.121835708618164, "global_step": 455859, "epoch": 5492} {"train_loss": -27.299823760986328, "global_step": 455860, "epoch": 5492} {"train_loss": -27.522329330444336, "global_step": 455861, "epoch": 5492} {"train_loss": -27.320953369140625, "global_step": 455862, "epoch": 5492} {"train_loss": -27.145450592041016, "global_step": 455863, "epoch": 5492} {"train_loss": -27.225269317626953, "global_step": 455864, "epoch": 5492} {"train_loss": -27.121183395385742, "global_step": 455865, "epoch": 5492} {"train_loss": -27.315351486206055, "global_step": 455866, "epoch": 5492} {"train_loss": -27.34015464782715, "global_step": 455867, "epoch": 5492} {"train_loss": -27.3193416595459, "global_step": 455868, "epoch": 5492} {"train_loss": -27.21645164489746, "global_step": 455869, "epoch": 5492} {"train_loss": -27.245269775390625, "global_step": 455870, "epoch": 5492} {"train_loss": -27.053180694580078, "global_step": 455871, "epoch": 5492} {"train_loss": -27.512725830078125, "global_step": 455872, "epoch": 5492} {"train_loss": -27.211652755737305, "global_step": 455873, "epoch": 5492} {"train_loss": -27.333383560180664, "global_step": 455874, "epoch": 5492} {"train_loss": -27.133167266845703, "global_step": 455875, "epoch": 5492} {"train_loss": -27.116479873657227, "global_step": 455876, "epoch": 5492} {"train_loss": -26.9238224029541, "global_step": 455877, "epoch": 5492} {"train_loss": -27.443191528320312, "global_step": 455878, "epoch": 5492} {"train_loss": -27.012176513671875, "global_step": 455879, "epoch": 5492} {"train_loss": -26.990203857421875, "global_step": 455880, "epoch": 5492} {"train_loss": -27.261194229125977, "global_step": 455881, "epoch": 5492} {"train_loss": -26.222936630249023, "global_step": 455882, "epoch": 5492} {"train_loss": -26.796573638916016, "global_step": 455883, "epoch": 5492} {"train_loss": -26.74009132385254, "global_step": 455884, "epoch": 5492} {"train_loss": -27.168664932250977, "global_step": 455885, "epoch": 5492} {"train_loss": -27.2561092376709, "global_step": 455886, "epoch": 5492} {"train_loss": -27.209745407104492, "global_step": 455887, "epoch": 5492} {"train_loss": -27.33939552307129, "global_step": 455888, "epoch": 5492} {"train_loss": -27.20479393005371, "global_step": 455889, "epoch": 5492} {"train_loss": -27.19685173034668, "global_step": 455890, "epoch": 5492} {"train_loss": -27.386178970336914, "global_step": 455891, "epoch": 5492} {"train_loss": -27.296308517456055, "global_step": 455892, "epoch": 5492} {"train_loss": -27.57806396484375, "global_step": 455893, "epoch": 5492} {"train_loss": -27.128759384155273, "global_step": 455894, "epoch": 5492} {"train_loss": -27.232770919799805, "global_step": 455895, "epoch": 5492} {"train_loss": -27.086645126342773, "global_step": 455896, "epoch": 5492} {"train_loss": -27.084314346313477, "global_step": 455897, "epoch": 5492} {"train_loss": -27.10085105895996, "global_step": 455898, "epoch": 5492} {"train_loss": -26.53035545349121, "global_step": 455899, "epoch": 5492} {"train_loss": -26.360387802124023, "global_step": 455900, "epoch": 5492} {"train_loss": -26.129194259643555, "global_step": 455901, "epoch": 5492} {"train_loss": -26.602502822875977, "global_step": 455902, "epoch": 5492} {"train_loss": -26.793197631835938, "global_step": 455903, "epoch": 5492} {"train_loss": -26.437253952026367, "global_step": 455904, "epoch": 5492} {"train_loss": -26.748687744140625, "global_step": 455905, "epoch": 5492} {"train_loss": -26.356794357299805, "global_step": 455906, "epoch": 5492} {"train_loss": -26.716598510742188, "global_step": 455907, "epoch": 5492} {"train_loss": -26.247467041015625, "global_step": 455908, "epoch": 5492} {"train_loss": -26.934823989868164, "global_step": 455909, "epoch": 5492} {"train_loss": -26.792789459228516, "global_step": 455910, "epoch": 5492} {"train_loss": -27.06366539001465, "global_step": 455911, "epoch": 5492} {"train_loss": -26.742786407470703, "global_step": 455912, "epoch": 5492} {"train_loss": -26.79345703125, "global_step": 455913, "epoch": 5492} {"train_loss": -26.73554039001465, "global_step": 455914, "epoch": 5492} {"train_loss": -26.9887638092041, "global_step": 455915, "epoch": 5492} {"train_loss": -27.154987335205078, "global_step": 455916, "epoch": 5492} {"train_loss": -26.798934936523438, "global_step": 455917, "epoch": 5492} {"train_loss": -27.012535830578173, "global_step": 455918, "epoch": 5492, "val_loss": 6614356.0} {"train_loss": -25.745893478393555, "global_step": 455919, "epoch": 5493} {"train_loss": -25.322702407836914, "global_step": 455920, "epoch": 5493} {"train_loss": -25.611499786376953, "global_step": 455921, "epoch": 5493} {"train_loss": -26.400989532470703, "global_step": 455922, "epoch": 5493} {"train_loss": -25.691272735595703, "global_step": 455923, "epoch": 5493} {"train_loss": -26.472217559814453, "global_step": 455924, "epoch": 5493} {"train_loss": -26.505563735961914, "global_step": 455925, "epoch": 5493} {"train_loss": -26.16145896911621, "global_step": 455926, "epoch": 5493} {"train_loss": -26.206634521484375, "global_step": 455927, "epoch": 5493} {"train_loss": -26.19209098815918, "global_step": 455928, "epoch": 5493} {"train_loss": -26.8038272857666, "global_step": 455929, "epoch": 5493} {"train_loss": -26.193456649780273, "global_step": 455930, "epoch": 5493} {"train_loss": -26.519012451171875, "global_step": 455931, "epoch": 5493} {"train_loss": -26.500818252563477, "global_step": 455932, "epoch": 5493} {"train_loss": -26.54176139831543, "global_step": 455933, "epoch": 5493} {"train_loss": -26.216230392456055, "global_step": 455934, "epoch": 5493} {"train_loss": -26.667810440063477, "global_step": 455935, "epoch": 5493} {"train_loss": -26.4306583404541, "global_step": 455936, "epoch": 5493} {"train_loss": -26.5142822265625, "global_step": 455937, "epoch": 5493} {"train_loss": -26.5858211517334, "global_step": 455938, "epoch": 5493} {"train_loss": -27.010095596313477, "global_step": 455939, "epoch": 5493} {"train_loss": -26.625049591064453, "global_step": 455940, "epoch": 5493} {"train_loss": -26.901676177978516, "global_step": 455941, "epoch": 5493} {"train_loss": -26.934722900390625, "global_step": 455942, "epoch": 5493} {"train_loss": -26.88739013671875, "global_step": 455943, "epoch": 5493} {"train_loss": -27.16997718811035, "global_step": 455944, "epoch": 5493} {"train_loss": -27.085798263549805, "global_step": 455945, "epoch": 5493} {"train_loss": -26.683338165283203, "global_step": 455946, "epoch": 5493} {"train_loss": -27.215784072875977, "global_step": 455947, "epoch": 5493} {"train_loss": -26.6992130279541, "global_step": 455948, "epoch": 5493} {"train_loss": -27.01752281188965, "global_step": 455949, "epoch": 5493} {"train_loss": -26.8375244140625, "global_step": 455950, "epoch": 5493} {"train_loss": -27.296369552612305, "global_step": 455951, "epoch": 5493} {"train_loss": -26.995468139648438, "global_step": 455952, "epoch": 5493} {"train_loss": -27.326257705688477, "global_step": 455953, "epoch": 5493} {"train_loss": -27.17231559753418, "global_step": 455954, "epoch": 5493} {"train_loss": -27.045190811157227, "global_step": 455955, "epoch": 5493} {"train_loss": -27.32527732849121, "global_step": 455956, "epoch": 5493} {"train_loss": -27.23514175415039, "global_step": 455957, "epoch": 5493} {"train_loss": -26.745935440063477, "global_step": 455958, "epoch": 5493} {"train_loss": -27.228071212768555, "global_step": 455959, "epoch": 5493} {"train_loss": -27.174072265625, "global_step": 455960, "epoch": 5493} {"train_loss": -27.022130966186523, "global_step": 455961, "epoch": 5493} {"train_loss": -27.030729293823242, "global_step": 455962, "epoch": 5493} {"train_loss": -27.224029541015625, "global_step": 455963, "epoch": 5493} {"train_loss": -27.64206314086914, "global_step": 455964, "epoch": 5493} {"train_loss": -27.212430953979492, "global_step": 455965, "epoch": 5493} {"train_loss": -27.439945220947266, "global_step": 455966, "epoch": 5493} {"train_loss": -27.3673152923584, "global_step": 455967, "epoch": 5493} {"train_loss": -27.26797866821289, "global_step": 455968, "epoch": 5493} {"train_loss": -27.296344757080078, "global_step": 455969, "epoch": 5493} {"train_loss": -27.328886032104492, "global_step": 455970, "epoch": 5493} {"train_loss": -27.618762969970703, "global_step": 455971, "epoch": 5493} {"train_loss": -27.10751724243164, "global_step": 455972, "epoch": 5493} {"train_loss": -27.236974716186523, "global_step": 455973, "epoch": 5493} {"train_loss": -27.2486515045166, "global_step": 455974, "epoch": 5493} {"train_loss": -27.422998428344727, "global_step": 455975, "epoch": 5493} {"train_loss": -27.352283477783203, "global_step": 455976, "epoch": 5493} {"train_loss": -27.30695152282715, "global_step": 455977, "epoch": 5493} {"train_loss": -27.454946517944336, "global_step": 455978, "epoch": 5493} {"train_loss": -27.39374351501465, "global_step": 455979, "epoch": 5493} {"train_loss": -27.00581169128418, "global_step": 455980, "epoch": 5493} {"train_loss": -27.429798126220703, "global_step": 455981, "epoch": 5493} {"train_loss": -27.23676109313965, "global_step": 455982, "epoch": 5493} {"train_loss": -27.072738647460938, "global_step": 455983, "epoch": 5493} {"train_loss": -27.272216796875, "global_step": 455984, "epoch": 5493} {"train_loss": -27.371429443359375, "global_step": 455985, "epoch": 5493} {"train_loss": -27.2374267578125, "global_step": 455986, "epoch": 5493} {"train_loss": -27.126096725463867, "global_step": 455987, "epoch": 5493} {"train_loss": -26.972501754760742, "global_step": 455988, "epoch": 5493} {"train_loss": -26.9910831451416, "global_step": 455989, "epoch": 5493} {"train_loss": -27.251983642578125, "global_step": 455990, "epoch": 5493} {"train_loss": -26.90752601623535, "global_step": 455991, "epoch": 5493} {"train_loss": -27.062814712524414, "global_step": 455992, "epoch": 5493} {"train_loss": -26.6948184967041, "global_step": 455993, "epoch": 5493} {"train_loss": -27.18533706665039, "global_step": 455994, "epoch": 5493} {"train_loss": -27.088184356689453, "global_step": 455995, "epoch": 5493} {"train_loss": -26.464746475219727, "global_step": 455996, "epoch": 5493} {"train_loss": -27.21142578125, "global_step": 455997, "epoch": 5493} {"train_loss": -27.141101837158203, "global_step": 455998, "epoch": 5493} {"train_loss": -27.24312400817871, "global_step": 455999, "epoch": 5493} {"train_loss": -27.195905685424805, "global_step": 456000, "epoch": 5493} {"train_loss": -26.93817844161068, "global_step": 456001, "epoch": 5493, "val_loss": 6624523.0} {"train_loss": -26.268991470336914, "global_step": 456002, "epoch": 5494} {"train_loss": -26.395288467407227, "global_step": 456003, "epoch": 5494} {"train_loss": -26.466466903686523, "global_step": 456004, "epoch": 5494} {"train_loss": -26.244922637939453, "global_step": 456005, "epoch": 5494} {"train_loss": -26.114673614501953, "global_step": 456006, "epoch": 5494} {"train_loss": -26.266508102416992, "global_step": 456007, "epoch": 5494} {"train_loss": -26.287561416625977, "global_step": 456008, "epoch": 5494} {"train_loss": -26.4890079498291, "global_step": 456009, "epoch": 5494} {"train_loss": -26.481470108032227, "global_step": 456010, "epoch": 5494} {"train_loss": -26.80915641784668, "global_step": 456011, "epoch": 5494} {"train_loss": -26.259241104125977, "global_step": 456012, "epoch": 5494} {"train_loss": -26.978567123413086, "global_step": 456013, "epoch": 5494} {"train_loss": -26.509765625, "global_step": 456014, "epoch": 5494} {"train_loss": -26.911848068237305, "global_step": 456015, "epoch": 5494} {"train_loss": -26.931432723999023, "global_step": 456016, "epoch": 5494} {"train_loss": -26.63392448425293, "global_step": 456017, "epoch": 5494} {"train_loss": -26.977636337280273, "global_step": 456018, "epoch": 5494} {"train_loss": -26.573209762573242, "global_step": 456019, "epoch": 5494} {"train_loss": -27.0739688873291, "global_step": 456020, "epoch": 5494} {"train_loss": -27.119449615478516, "global_step": 456021, "epoch": 5494} {"train_loss": -26.850971221923828, "global_step": 456022, "epoch": 5494} {"train_loss": -26.99903678894043, "global_step": 456023, "epoch": 5494} {"train_loss": -26.779325485229492, "global_step": 456024, "epoch": 5494} {"train_loss": -27.04095458984375, "global_step": 456025, "epoch": 5494} {"train_loss": -27.112030029296875, "global_step": 456026, "epoch": 5494} {"train_loss": -26.890653610229492, "global_step": 456027, "epoch": 5494} {"train_loss": -27.241397857666016, "global_step": 456028, "epoch": 5494} {"train_loss": -27.151304244995117, "global_step": 456029, "epoch": 5494} {"train_loss": -27.19294548034668, "global_step": 456030, "epoch": 5494} {"train_loss": -27.2122745513916, "global_step": 456031, "epoch": 5494} {"train_loss": -27.314844131469727, "global_step": 456032, "epoch": 5494} {"train_loss": -27.0283145904541, "global_step": 456033, "epoch": 5494} {"train_loss": -27.000696182250977, "global_step": 456034, "epoch": 5494} {"train_loss": -27.017303466796875, "global_step": 456035, "epoch": 5494} {"train_loss": -27.141210556030273, "global_step": 456036, "epoch": 5494} {"train_loss": -27.283838272094727, "global_step": 456037, "epoch": 5494} {"train_loss": -27.386301040649414, "global_step": 456038, "epoch": 5494} {"train_loss": -27.117237091064453, "global_step": 456039, "epoch": 5494} {"train_loss": -26.902307510375977, "global_step": 456040, "epoch": 5494} {"train_loss": -26.881818771362305, "global_step": 456041, "epoch": 5494} {"train_loss": -27.22258949279785, "global_step": 456042, "epoch": 5494} {"train_loss": -27.39825439453125, "global_step": 456043, "epoch": 5494} {"train_loss": -27.06679344177246, "global_step": 456044, "epoch": 5494} {"train_loss": -26.803298950195312, "global_step": 456045, "epoch": 5494} {"train_loss": -27.37983512878418, "global_step": 456046, "epoch": 5494} {"train_loss": -26.835309982299805, "global_step": 456047, "epoch": 5494} {"train_loss": -27.408157348632812, "global_step": 456048, "epoch": 5494} {"train_loss": -27.03901481628418, "global_step": 456049, "epoch": 5494} {"train_loss": -26.64508056640625, "global_step": 456050, "epoch": 5494} {"train_loss": -26.93865966796875, "global_step": 456051, "epoch": 5494} {"train_loss": -27.224735260009766, "global_step": 456052, "epoch": 5494} {"train_loss": -27.50553321838379, "global_step": 456053, "epoch": 5494} {"train_loss": -27.14697265625, "global_step": 456054, "epoch": 5494} {"train_loss": -27.23954200744629, "global_step": 456055, "epoch": 5494} {"train_loss": -27.089139938354492, "global_step": 456056, "epoch": 5494} {"train_loss": -27.13530921936035, "global_step": 456057, "epoch": 5494} {"train_loss": -27.17496109008789, "global_step": 456058, "epoch": 5494} {"train_loss": -27.104969024658203, "global_step": 456059, "epoch": 5494} {"train_loss": -26.630023956298828, "global_step": 456060, "epoch": 5494} {"train_loss": -26.71600341796875, "global_step": 456061, "epoch": 5494} {"train_loss": -26.101545333862305, "global_step": 456062, "epoch": 5494} {"train_loss": -26.098535537719727, "global_step": 456063, "epoch": 5494} {"train_loss": -26.76789665222168, "global_step": 456064, "epoch": 5494} {"train_loss": -27.058347702026367, "global_step": 456065, "epoch": 5494} {"train_loss": -26.02923583984375, "global_step": 456066, "epoch": 5494} {"train_loss": -26.463232040405273, "global_step": 456067, "epoch": 5494} {"train_loss": -27.286035537719727, "global_step": 456068, "epoch": 5494} {"train_loss": -26.78424644470215, "global_step": 456069, "epoch": 5494} {"train_loss": -27.35965919494629, "global_step": 456070, "epoch": 5494} {"train_loss": -26.57039451599121, "global_step": 456071, "epoch": 5494} {"train_loss": -27.05096435546875, "global_step": 456072, "epoch": 5494} {"train_loss": -26.705860137939453, "global_step": 456073, "epoch": 5494} {"train_loss": -27.28138542175293, "global_step": 456074, "epoch": 5494} {"train_loss": -26.946813583374023, "global_step": 456075, "epoch": 5494} {"train_loss": -27.11370277404785, "global_step": 456076, "epoch": 5494} {"train_loss": -26.872533798217773, "global_step": 456077, "epoch": 5494} {"train_loss": -27.105615615844727, "global_step": 456078, "epoch": 5494} {"train_loss": -26.93145751953125, "global_step": 456079, "epoch": 5494} {"train_loss": -27.30463981628418, "global_step": 456080, "epoch": 5494} {"train_loss": -27.16169548034668, "global_step": 456081, "epoch": 5494} {"train_loss": -27.141006469726562, "global_step": 456082, "epoch": 5494} {"train_loss": -27.650711059570312, "global_step": 456083, "epoch": 5494} {"train_loss": -26.926139188100056, "global_step": 456084, "epoch": 5494, "val_loss": 6674650.5} {"train_loss": -26.216312408447266, "global_step": 456085, "epoch": 5495} {"train_loss": -25.937231063842773, "global_step": 456086, "epoch": 5495} {"train_loss": -25.815046310424805, "global_step": 456087, "epoch": 5495} {"train_loss": -25.954511642456055, "global_step": 456088, "epoch": 5495} {"train_loss": -26.5640926361084, "global_step": 456089, "epoch": 5495} {"train_loss": -26.0799560546875, "global_step": 456090, "epoch": 5495} {"train_loss": -26.02164649963379, "global_step": 456091, "epoch": 5495} {"train_loss": -26.415098190307617, "global_step": 456092, "epoch": 5495} {"train_loss": -26.825693130493164, "global_step": 456093, "epoch": 5495} {"train_loss": -26.28997802734375, "global_step": 456094, "epoch": 5495} {"train_loss": -26.513036727905273, "global_step": 456095, "epoch": 5495} {"train_loss": -26.596288681030273, "global_step": 456096, "epoch": 5495} {"train_loss": -26.650741577148438, "global_step": 456097, "epoch": 5495} {"train_loss": -26.82367515563965, "global_step": 456098, "epoch": 5495} {"train_loss": -26.383100509643555, "global_step": 456099, "epoch": 5495} {"train_loss": -26.543752670288086, "global_step": 456100, "epoch": 5495} {"train_loss": -26.73953628540039, "global_step": 456101, "epoch": 5495} {"train_loss": -26.728918075561523, "global_step": 456102, "epoch": 5495} {"train_loss": -26.611169815063477, "global_step": 456103, "epoch": 5495} {"train_loss": -26.986774444580078, "global_step": 456104, "epoch": 5495} {"train_loss": -26.843408584594727, "global_step": 456105, "epoch": 5495} {"train_loss": -26.7442626953125, "global_step": 456106, "epoch": 5495} {"train_loss": -26.96406364440918, "global_step": 456107, "epoch": 5495} {"train_loss": -26.93996238708496, "global_step": 456108, "epoch": 5495} {"train_loss": -26.997976303100586, "global_step": 456109, "epoch": 5495} {"train_loss": -26.7491397857666, "global_step": 456110, "epoch": 5495} {"train_loss": -27.084924697875977, "global_step": 456111, "epoch": 5495} {"train_loss": -26.79339027404785, "global_step": 456112, "epoch": 5495} {"train_loss": -27.028528213500977, "global_step": 456113, "epoch": 5495} {"train_loss": -26.889495849609375, "global_step": 456114, "epoch": 5495} {"train_loss": -26.8919677734375, "global_step": 456115, "epoch": 5495} {"train_loss": -26.636762619018555, "global_step": 456116, "epoch": 5495} {"train_loss": -27.073759078979492, "global_step": 456117, "epoch": 5495} {"train_loss": -27.09893226623535, "global_step": 456118, "epoch": 5495} {"train_loss": -27.0030574798584, "global_step": 456119, "epoch": 5495} {"train_loss": -27.32280921936035, "global_step": 456120, "epoch": 5495} {"train_loss": -26.982419967651367, "global_step": 456121, "epoch": 5495} {"train_loss": -27.47235679626465, "global_step": 456122, "epoch": 5495} {"train_loss": -27.20767593383789, "global_step": 456123, "epoch": 5495} {"train_loss": -27.363683700561523, "global_step": 456124, "epoch": 5495} {"train_loss": -27.153610229492188, "global_step": 456125, "epoch": 5495} {"train_loss": -27.196151733398438, "global_step": 456126, "epoch": 5495} {"train_loss": -27.069503784179688, "global_step": 456127, "epoch": 5495} {"train_loss": -26.941089630126953, "global_step": 456128, "epoch": 5495} {"train_loss": -27.07232666015625, "global_step": 456129, "epoch": 5495} {"train_loss": -26.702009201049805, "global_step": 456130, "epoch": 5495} {"train_loss": -26.171560287475586, "global_step": 456131, "epoch": 5495} {"train_loss": -26.605283737182617, "global_step": 456132, "epoch": 5495} {"train_loss": -26.88117790222168, "global_step": 456133, "epoch": 5495} {"train_loss": -27.028961181640625, "global_step": 456134, "epoch": 5495} {"train_loss": -26.97782325744629, "global_step": 456135, "epoch": 5495} {"train_loss": -26.895959854125977, "global_step": 456136, "epoch": 5495} {"train_loss": -27.129297256469727, "global_step": 456137, "epoch": 5495} {"train_loss": -26.738510131835938, "global_step": 456138, "epoch": 5495} {"train_loss": -27.271392822265625, "global_step": 456139, "epoch": 5495} {"train_loss": -27.066726684570312, "global_step": 456140, "epoch": 5495} {"train_loss": -27.035140991210938, "global_step": 456141, "epoch": 5495} {"train_loss": -27.43277359008789, "global_step": 456142, "epoch": 5495} {"train_loss": -27.4134464263916, "global_step": 456143, "epoch": 5495} {"train_loss": -27.295806884765625, "global_step": 456144, "epoch": 5495} {"train_loss": -26.667724609375, "global_step": 456145, "epoch": 5495} {"train_loss": -27.053579330444336, "global_step": 456146, "epoch": 5495} {"train_loss": -26.576257705688477, "global_step": 456147, "epoch": 5495} {"train_loss": -26.851850509643555, "global_step": 456148, "epoch": 5495} {"train_loss": -26.615758895874023, "global_step": 456149, "epoch": 5495} {"train_loss": -27.154882431030273, "global_step": 456150, "epoch": 5495} {"train_loss": -26.869094848632812, "global_step": 456151, "epoch": 5495} {"train_loss": -27.016260147094727, "global_step": 456152, "epoch": 5495} {"train_loss": -27.142578125, "global_step": 456153, "epoch": 5495} {"train_loss": -27.2487735748291, "global_step": 456154, "epoch": 5495} {"train_loss": -27.428518295288086, "global_step": 456155, "epoch": 5495} {"train_loss": -27.05267333984375, "global_step": 456156, "epoch": 5495} {"train_loss": -27.178232192993164, "global_step": 456157, "epoch": 5495} {"train_loss": -27.60601234436035, "global_step": 456158, "epoch": 5495} {"train_loss": -26.774702072143555, "global_step": 456159, "epoch": 5495} {"train_loss": -26.823347091674805, "global_step": 456160, "epoch": 5495} {"train_loss": -26.96363639831543, "global_step": 456161, "epoch": 5495} {"train_loss": -27.251596450805664, "global_step": 456162, "epoch": 5495} {"train_loss": -27.046838760375977, "global_step": 456163, "epoch": 5495} {"train_loss": -27.412214279174805, "global_step": 456164, "epoch": 5495} {"train_loss": -27.078662872314453, "global_step": 456165, "epoch": 5495} {"train_loss": -26.81268310546875, "global_step": 456166, "epoch": 5495} {"train_loss": -26.876707329807513, "global_step": 456167, "epoch": 5495, "val_loss": 6619060.0} {"train_loss": -26.62824058532715, "global_step": 456168, "epoch": 5496} {"train_loss": -26.643299102783203, "global_step": 456169, "epoch": 5496} {"train_loss": -27.092151641845703, "global_step": 456170, "epoch": 5496} {"train_loss": -26.677305221557617, "global_step": 456171, "epoch": 5496} {"train_loss": -26.808761596679688, "global_step": 456172, "epoch": 5496} {"train_loss": -26.504911422729492, "global_step": 456173, "epoch": 5496} {"train_loss": -26.93928337097168, "global_step": 456174, "epoch": 5496} {"train_loss": -26.527606964111328, "global_step": 456175, "epoch": 5496} {"train_loss": -26.5555477142334, "global_step": 456176, "epoch": 5496} {"train_loss": -27.059080123901367, "global_step": 456177, "epoch": 5496} {"train_loss": -26.942060470581055, "global_step": 456178, "epoch": 5496} {"train_loss": -27.164335250854492, "global_step": 456179, "epoch": 5496} {"train_loss": -26.769916534423828, "global_step": 456180, "epoch": 5496} {"train_loss": -26.646854400634766, "global_step": 456181, "epoch": 5496} {"train_loss": -26.65069007873535, "global_step": 456182, "epoch": 5496} {"train_loss": -27.089651107788086, "global_step": 456183, "epoch": 5496} {"train_loss": -26.958585739135742, "global_step": 456184, "epoch": 5496} {"train_loss": -26.7166748046875, "global_step": 456185, "epoch": 5496} {"train_loss": -27.074676513671875, "global_step": 456186, "epoch": 5496} {"train_loss": -26.943655014038086, "global_step": 456187, "epoch": 5496} {"train_loss": -26.930845260620117, "global_step": 456188, "epoch": 5496} {"train_loss": -27.46906089782715, "global_step": 456189, "epoch": 5496} {"train_loss": -26.892791748046875, "global_step": 456190, "epoch": 5496} {"train_loss": -27.087289810180664, "global_step": 456191, "epoch": 5496} {"train_loss": -26.93128776550293, "global_step": 456192, "epoch": 5496} {"train_loss": -27.088266372680664, "global_step": 456193, "epoch": 5496} {"train_loss": -26.866958618164062, "global_step": 456194, "epoch": 5496} {"train_loss": -27.037031173706055, "global_step": 456195, "epoch": 5496} {"train_loss": -27.009418487548828, "global_step": 456196, "epoch": 5496} {"train_loss": -27.043701171875, "global_step": 456197, "epoch": 5496} {"train_loss": -27.270910263061523, "global_step": 456198, "epoch": 5496} {"train_loss": -27.050870895385742, "global_step": 456199, "epoch": 5496} {"train_loss": -26.964670181274414, "global_step": 456200, "epoch": 5496} {"train_loss": -27.353565216064453, "global_step": 456201, "epoch": 5496} {"train_loss": -26.96210289001465, "global_step": 456202, "epoch": 5496} {"train_loss": -27.4497013092041, "global_step": 456203, "epoch": 5496} {"train_loss": -27.115615844726562, "global_step": 456204, "epoch": 5496} {"train_loss": -27.440290451049805, "global_step": 456205, "epoch": 5496} {"train_loss": -27.182600021362305, "global_step": 456206, "epoch": 5496} {"train_loss": -27.19525718688965, "global_step": 456207, "epoch": 5496} {"train_loss": -26.985980987548828, "global_step": 456208, "epoch": 5496} {"train_loss": -27.2136287689209, "global_step": 456209, "epoch": 5496} {"train_loss": -27.336252212524414, "global_step": 456210, "epoch": 5496} {"train_loss": -27.100744247436523, "global_step": 456211, "epoch": 5496} {"train_loss": -27.31524658203125, "global_step": 456212, "epoch": 5496} {"train_loss": -27.231918334960938, "global_step": 456213, "epoch": 5496} {"train_loss": -27.245899200439453, "global_step": 456214, "epoch": 5496} {"train_loss": -27.014541625976562, "global_step": 456215, "epoch": 5496} {"train_loss": -27.29128074645996, "global_step": 456216, "epoch": 5496} {"train_loss": -27.397689819335938, "global_step": 456217, "epoch": 5496} {"train_loss": -27.1697940826416, "global_step": 456218, "epoch": 5496} {"train_loss": -27.040054321289062, "global_step": 456219, "epoch": 5496} {"train_loss": -27.16812515258789, "global_step": 456220, "epoch": 5496} {"train_loss": -27.639179229736328, "global_step": 456221, "epoch": 5496} {"train_loss": -27.425251007080078, "global_step": 456222, "epoch": 5496} {"train_loss": -26.83062171936035, "global_step": 456223, "epoch": 5496} {"train_loss": -26.875959396362305, "global_step": 456224, "epoch": 5496} {"train_loss": -26.977081298828125, "global_step": 456225, "epoch": 5496} {"train_loss": -27.2008056640625, "global_step": 456226, "epoch": 5496} {"train_loss": -27.050745010375977, "global_step": 456227, "epoch": 5496} {"train_loss": -27.270660400390625, "global_step": 456228, "epoch": 5496} {"train_loss": -27.312320709228516, "global_step": 456229, "epoch": 5496} {"train_loss": -27.07087516784668, "global_step": 456230, "epoch": 5496} {"train_loss": -27.016748428344727, "global_step": 456231, "epoch": 5496} {"train_loss": -27.267181396484375, "global_step": 456232, "epoch": 5496} {"train_loss": -27.46417236328125, "global_step": 456233, "epoch": 5496} {"train_loss": -27.273956298828125, "global_step": 456234, "epoch": 5496} {"train_loss": -27.071491241455078, "global_step": 456235, "epoch": 5496} {"train_loss": -27.219152450561523, "global_step": 456236, "epoch": 5496} {"train_loss": -27.48126220703125, "global_step": 456237, "epoch": 5496} {"train_loss": -27.400747299194336, "global_step": 456238, "epoch": 5496} {"train_loss": -26.89084815979004, "global_step": 456239, "epoch": 5496} {"train_loss": -26.619226455688477, "global_step": 456240, "epoch": 5496} {"train_loss": -27.11924171447754, "global_step": 456241, "epoch": 5496} {"train_loss": -26.904010772705078, "global_step": 456242, "epoch": 5496} {"train_loss": -27.27430534362793, "global_step": 456243, "epoch": 5496} {"train_loss": -26.548913955688477, "global_step": 456244, "epoch": 5496} {"train_loss": -27.102161407470703, "global_step": 456245, "epoch": 5496} {"train_loss": -27.23508071899414, "global_step": 456246, "epoch": 5496} {"train_loss": -27.064794540405273, "global_step": 456247, "epoch": 5496} {"train_loss": -27.117145538330078, "global_step": 456248, "epoch": 5496} {"train_loss": -27.167530059814453, "global_step": 456249, "epoch": 5496} {"train_loss": -27.06147191610681, "global_step": 456250, "epoch": 5496, "val_loss": 6607771.5} {"train_loss": -25.74887466430664, "global_step": 456251, "epoch": 5497} {"train_loss": -25.876834869384766, "global_step": 456252, "epoch": 5497} {"train_loss": -26.015399932861328, "global_step": 456253, "epoch": 5497} {"train_loss": -23.499155044555664, "global_step": 456254, "epoch": 5497} {"train_loss": -25.551504135131836, "global_step": 456255, "epoch": 5497} {"train_loss": -26.318445205688477, "global_step": 456256, "epoch": 5497} {"train_loss": -24.995969772338867, "global_step": 456257, "epoch": 5497} {"train_loss": -25.999420166015625, "global_step": 456258, "epoch": 5497} {"train_loss": -26.337549209594727, "global_step": 456259, "epoch": 5497} {"train_loss": -26.03852653503418, "global_step": 456260, "epoch": 5497} {"train_loss": -26.26995849609375, "global_step": 456261, "epoch": 5497} {"train_loss": -26.33380126953125, "global_step": 456262, "epoch": 5497} {"train_loss": -26.350858688354492, "global_step": 456263, "epoch": 5497} {"train_loss": -26.10724449157715, "global_step": 456264, "epoch": 5497} {"train_loss": -26.50408363342285, "global_step": 456265, "epoch": 5497} {"train_loss": -26.41672134399414, "global_step": 456266, "epoch": 5497} {"train_loss": -26.304611206054688, "global_step": 456267, "epoch": 5497} {"train_loss": -26.575708389282227, "global_step": 456268, "epoch": 5497} {"train_loss": -26.600454330444336, "global_step": 456269, "epoch": 5497} {"train_loss": -26.74365234375, "global_step": 456270, "epoch": 5497} {"train_loss": -26.28779411315918, "global_step": 456271, "epoch": 5497} {"train_loss": -26.66574478149414, "global_step": 456272, "epoch": 5497} {"train_loss": -26.70745849609375, "global_step": 456273, "epoch": 5497} {"train_loss": -26.38128662109375, "global_step": 456274, "epoch": 5497} {"train_loss": -25.935407638549805, "global_step": 456275, "epoch": 5497} {"train_loss": -26.67848777770996, "global_step": 456276, "epoch": 5497} {"train_loss": -26.86345863342285, "global_step": 456277, "epoch": 5497} {"train_loss": -26.35172462463379, "global_step": 456278, "epoch": 5497} {"train_loss": -26.935529708862305, "global_step": 456279, "epoch": 5497} {"train_loss": -26.296802520751953, "global_step": 456280, "epoch": 5497} {"train_loss": -26.9210147857666, "global_step": 456281, "epoch": 5497} {"train_loss": -26.709440231323242, "global_step": 456282, "epoch": 5497} {"train_loss": -26.929264068603516, "global_step": 456283, "epoch": 5497} {"train_loss": -27.039569854736328, "global_step": 456284, "epoch": 5497} {"train_loss": -26.965240478515625, "global_step": 456285, "epoch": 5497} {"train_loss": -26.75482177734375, "global_step": 456286, "epoch": 5497} {"train_loss": -27.18387794494629, "global_step": 456287, "epoch": 5497} {"train_loss": -27.070514678955078, "global_step": 456288, "epoch": 5497} {"train_loss": -26.965734481811523, "global_step": 456289, "epoch": 5497} {"train_loss": -27.574432373046875, "global_step": 456290, "epoch": 5497} {"train_loss": -27.151782989501953, "global_step": 456291, "epoch": 5497} {"train_loss": -26.881738662719727, "global_step": 456292, "epoch": 5497} {"train_loss": -27.286890029907227, "global_step": 456293, "epoch": 5497} {"train_loss": -27.244861602783203, "global_step": 456294, "epoch": 5497} {"train_loss": -26.93092918395996, "global_step": 456295, "epoch": 5497} {"train_loss": -27.068716049194336, "global_step": 456296, "epoch": 5497} {"train_loss": -27.398422241210938, "global_step": 456297, "epoch": 5497} {"train_loss": -27.07721519470215, "global_step": 456298, "epoch": 5497} {"train_loss": -27.2646484375, "global_step": 456299, "epoch": 5497} {"train_loss": -27.45929527282715, "global_step": 456300, "epoch": 5497} {"train_loss": -27.452634811401367, "global_step": 456301, "epoch": 5497} {"train_loss": -26.93603515625, "global_step": 456302, "epoch": 5497} {"train_loss": -27.108915328979492, "global_step": 456303, "epoch": 5497} {"train_loss": -27.197071075439453, "global_step": 456304, "epoch": 5497} {"train_loss": -27.56587028503418, "global_step": 456305, "epoch": 5497} {"train_loss": -27.665197372436523, "global_step": 456306, "epoch": 5497} {"train_loss": -27.01053237915039, "global_step": 456307, "epoch": 5497} {"train_loss": -27.612655639648438, "global_step": 456308, "epoch": 5497} {"train_loss": -27.25193214416504, "global_step": 456309, "epoch": 5497} {"train_loss": -27.170621871948242, "global_step": 456310, "epoch": 5497} {"train_loss": -27.3833065032959, "global_step": 456311, "epoch": 5497} {"train_loss": -26.872644424438477, "global_step": 456312, "epoch": 5497} {"train_loss": -26.74077796936035, "global_step": 456313, "epoch": 5497} {"train_loss": -26.65227699279785, "global_step": 456314, "epoch": 5497} {"train_loss": -26.664175033569336, "global_step": 456315, "epoch": 5497} {"train_loss": -27.2153263092041, "global_step": 456316, "epoch": 5497} {"train_loss": -26.82184410095215, "global_step": 456317, "epoch": 5497} {"train_loss": -27.448347091674805, "global_step": 456318, "epoch": 5497} {"train_loss": -26.8668155670166, "global_step": 456319, "epoch": 5497} {"train_loss": -26.4660701751709, "global_step": 456320, "epoch": 5497} {"train_loss": -26.626596450805664, "global_step": 456321, "epoch": 5497} {"train_loss": -26.864887237548828, "global_step": 456322, "epoch": 5497} {"train_loss": -27.12259864807129, "global_step": 456323, "epoch": 5497} {"train_loss": -26.83522605895996, "global_step": 456324, "epoch": 5497} {"train_loss": -27.203466415405273, "global_step": 456325, "epoch": 5497} {"train_loss": -26.973478317260742, "global_step": 456326, "epoch": 5497} {"train_loss": -27.169031143188477, "global_step": 456327, "epoch": 5497} {"train_loss": -27.488616943359375, "global_step": 456328, "epoch": 5497} {"train_loss": -27.259408950805664, "global_step": 456329, "epoch": 5497} {"train_loss": -27.240650177001953, "global_step": 456330, "epoch": 5497} {"train_loss": -26.992902755737305, "global_step": 456331, "epoch": 5497} {"train_loss": -27.046293258666992, "global_step": 456332, "epoch": 5497} {"train_loss": -26.77483616105045, "global_step": 456333, "epoch": 5497, "val_loss": 6596222.5} {"train_loss": -26.955503463745117, "global_step": 456334, "epoch": 5498} {"train_loss": -26.221948623657227, "global_step": 456335, "epoch": 5498} {"train_loss": -26.365156173706055, "global_step": 456336, "epoch": 5498} {"train_loss": -26.5037841796875, "global_step": 456337, "epoch": 5498} {"train_loss": -26.330127716064453, "global_step": 456338, "epoch": 5498} {"train_loss": -26.381336212158203, "global_step": 456339, "epoch": 5498} {"train_loss": -26.16460609436035, "global_step": 456340, "epoch": 5498} {"train_loss": -26.468252182006836, "global_step": 456341, "epoch": 5498} {"train_loss": -26.812427520751953, "global_step": 456342, "epoch": 5498} {"train_loss": -27.05474281311035, "global_step": 456343, "epoch": 5498} {"train_loss": -26.834203720092773, "global_step": 456344, "epoch": 5498} {"train_loss": -26.595300674438477, "global_step": 456345, "epoch": 5498} {"train_loss": -26.619352340698242, "global_step": 456346, "epoch": 5498} {"train_loss": -27.3066349029541, "global_step": 456347, "epoch": 5498} {"train_loss": -27.22491455078125, "global_step": 456348, "epoch": 5498} {"train_loss": -27.342329025268555, "global_step": 456349, "epoch": 5498} {"train_loss": -26.765546798706055, "global_step": 456350, "epoch": 5498} {"train_loss": -26.86677360534668, "global_step": 456351, "epoch": 5498} {"train_loss": -27.27310562133789, "global_step": 456352, "epoch": 5498} {"train_loss": -26.823684692382812, "global_step": 456353, "epoch": 5498} {"train_loss": -27.1934814453125, "global_step": 456354, "epoch": 5498} {"train_loss": -27.173608779907227, "global_step": 456355, "epoch": 5498} {"train_loss": -27.031824111938477, "global_step": 456356, "epoch": 5498} {"train_loss": -27.140668869018555, "global_step": 456357, "epoch": 5498} {"train_loss": -27.1872501373291, "global_step": 456358, "epoch": 5498} {"train_loss": -27.235401153564453, "global_step": 456359, "epoch": 5498} {"train_loss": -26.582731246948242, "global_step": 456360, "epoch": 5498} {"train_loss": -27.11809730529785, "global_step": 456361, "epoch": 5498} {"train_loss": -27.46034049987793, "global_step": 456362, "epoch": 5498} {"train_loss": -26.99395179748535, "global_step": 456363, "epoch": 5498} {"train_loss": -27.29810905456543, "global_step": 456364, "epoch": 5498} {"train_loss": -27.022802352905273, "global_step": 456365, "epoch": 5498} {"train_loss": -27.006637573242188, "global_step": 456366, "epoch": 5498} {"train_loss": -26.895193099975586, "global_step": 456367, "epoch": 5498} {"train_loss": -26.52924919128418, "global_step": 456368, "epoch": 5498} {"train_loss": -26.35400390625, "global_step": 456369, "epoch": 5498} {"train_loss": -26.509565353393555, "global_step": 456370, "epoch": 5498} {"train_loss": -26.75341796875, "global_step": 456371, "epoch": 5498} {"train_loss": -27.193586349487305, "global_step": 456372, "epoch": 5498} {"train_loss": -27.03046226501465, "global_step": 456373, "epoch": 5498} {"train_loss": -27.142969131469727, "global_step": 456374, "epoch": 5498} {"train_loss": -26.9090576171875, "global_step": 456375, "epoch": 5498} {"train_loss": -26.96120262145996, "global_step": 456376, "epoch": 5498} {"train_loss": -26.86979103088379, "global_step": 456377, "epoch": 5498} {"train_loss": -27.43084144592285, "global_step": 456378, "epoch": 5498} {"train_loss": -27.204328536987305, "global_step": 456379, "epoch": 5498} {"train_loss": -26.965845108032227, "global_step": 456380, "epoch": 5498} {"train_loss": -27.399433135986328, "global_step": 456381, "epoch": 5498} {"train_loss": -26.88840103149414, "global_step": 456382, "epoch": 5498} {"train_loss": -27.19495964050293, "global_step": 456383, "epoch": 5498} {"train_loss": -26.878223419189453, "global_step": 456384, "epoch": 5498} {"train_loss": -26.93035316467285, "global_step": 456385, "epoch": 5498} {"train_loss": -26.98872184753418, "global_step": 456386, "epoch": 5498} {"train_loss": -27.086624145507812, "global_step": 456387, "epoch": 5498} {"train_loss": -26.8153133392334, "global_step": 456388, "epoch": 5498} {"train_loss": -27.009057998657227, "global_step": 456389, "epoch": 5498} {"train_loss": -27.046133041381836, "global_step": 456390, "epoch": 5498} {"train_loss": -27.121810913085938, "global_step": 456391, "epoch": 5498} {"train_loss": -27.173559188842773, "global_step": 456392, "epoch": 5498} {"train_loss": -27.073171615600586, "global_step": 456393, "epoch": 5498} {"train_loss": -26.611236572265625, "global_step": 456394, "epoch": 5498} {"train_loss": -27.302398681640625, "global_step": 456395, "epoch": 5498} {"train_loss": -27.17229652404785, "global_step": 456396, "epoch": 5498} {"train_loss": -27.3308048248291, "global_step": 456397, "epoch": 5498} {"train_loss": -27.47490882873535, "global_step": 456398, "epoch": 5498} {"train_loss": -27.240697860717773, "global_step": 456399, "epoch": 5498} {"train_loss": -26.994543075561523, "global_step": 456400, "epoch": 5498} {"train_loss": -27.13532066345215, "global_step": 456401, "epoch": 5498} {"train_loss": -27.32221794128418, "global_step": 456402, "epoch": 5498} {"train_loss": -27.093738555908203, "global_step": 456403, "epoch": 5498} {"train_loss": -26.873916625976562, "global_step": 456404, "epoch": 5498} {"train_loss": -27.544830322265625, "global_step": 456405, "epoch": 5498} {"train_loss": -27.104719161987305, "global_step": 456406, "epoch": 5498} {"train_loss": -27.12469482421875, "global_step": 456407, "epoch": 5498} {"train_loss": -26.92317008972168, "global_step": 456408, "epoch": 5498} {"train_loss": -26.77625846862793, "global_step": 456409, "epoch": 5498} {"train_loss": -27.08350944519043, "global_step": 456410, "epoch": 5498} {"train_loss": -27.082910537719727, "global_step": 456411, "epoch": 5498} {"train_loss": -27.2508544921875, "global_step": 456412, "epoch": 5498} {"train_loss": -26.8682918548584, "global_step": 456413, "epoch": 5498} {"train_loss": -27.29815673828125, "global_step": 456414, "epoch": 5498} {"train_loss": -27.403406143188477, "global_step": 456415, "epoch": 5498} {"train_loss": -26.994799763323314, "global_step": 456416, "epoch": 5498, "val_loss": 6610980.0} {"train_loss": -26.351118087768555, "global_step": 456417, "epoch": 5499} {"train_loss": -26.43839454650879, "global_step": 456418, "epoch": 5499} {"train_loss": -26.555845260620117, "global_step": 456419, "epoch": 5499} {"train_loss": -26.165678024291992, "global_step": 456420, "epoch": 5499} {"train_loss": -26.12186050415039, "global_step": 456421, "epoch": 5499} {"train_loss": -26.009857177734375, "global_step": 456422, "epoch": 5499} {"train_loss": -26.47666358947754, "global_step": 456423, "epoch": 5499} {"train_loss": -26.485837936401367, "global_step": 456424, "epoch": 5499} {"train_loss": -26.65974235534668, "global_step": 456425, "epoch": 5499} {"train_loss": -26.739980697631836, "global_step": 456426, "epoch": 5499} {"train_loss": -26.43470573425293, "global_step": 456427, "epoch": 5499} {"train_loss": -26.77235221862793, "global_step": 456428, "epoch": 5499} {"train_loss": -26.748218536376953, "global_step": 456429, "epoch": 5499} {"train_loss": -27.045923233032227, "global_step": 456430, "epoch": 5499} {"train_loss": -26.877355575561523, "global_step": 456431, "epoch": 5499} {"train_loss": -26.74822425842285, "global_step": 456432, "epoch": 5499} {"train_loss": -27.103302001953125, "global_step": 456433, "epoch": 5499} {"train_loss": -26.8599853515625, "global_step": 456434, "epoch": 5499} {"train_loss": -26.776142120361328, "global_step": 456435, "epoch": 5499} {"train_loss": -26.81890296936035, "global_step": 456436, "epoch": 5499} {"train_loss": -27.221654891967773, "global_step": 456437, "epoch": 5499} {"train_loss": -26.855268478393555, "global_step": 456438, "epoch": 5499} {"train_loss": -27.0084228515625, "global_step": 456439, "epoch": 5499} {"train_loss": -26.81012535095215, "global_step": 456440, "epoch": 5499} {"train_loss": -26.667490005493164, "global_step": 456441, "epoch": 5499} {"train_loss": -27.36203956604004, "global_step": 456442, "epoch": 5499} {"train_loss": -26.716156005859375, "global_step": 456443, "epoch": 5499} {"train_loss": -26.932453155517578, "global_step": 456444, "epoch": 5499} {"train_loss": -26.867948532104492, "global_step": 456445, "epoch": 5499} {"train_loss": -26.82230567932129, "global_step": 456446, "epoch": 5499} {"train_loss": -27.295663833618164, "global_step": 456447, "epoch": 5499} {"train_loss": -27.062341690063477, "global_step": 456448, "epoch": 5499} {"train_loss": -26.83685302734375, "global_step": 456449, "epoch": 5499} {"train_loss": -27.34160804748535, "global_step": 456450, "epoch": 5499} {"train_loss": -27.018035888671875, "global_step": 456451, "epoch": 5499} {"train_loss": -27.039640426635742, "global_step": 456452, "epoch": 5499} {"train_loss": -27.19466209411621, "global_step": 456453, "epoch": 5499} {"train_loss": -26.73280143737793, "global_step": 456454, "epoch": 5499} {"train_loss": -27.155858993530273, "global_step": 456455, "epoch": 5499} {"train_loss": -27.11212158203125, "global_step": 456456, "epoch": 5499} {"train_loss": -26.975086212158203, "global_step": 456457, "epoch": 5499} {"train_loss": -27.21115493774414, "global_step": 456458, "epoch": 5499} {"train_loss": -26.879825592041016, "global_step": 456459, "epoch": 5499} {"train_loss": -26.7939395904541, "global_step": 456460, "epoch": 5499} {"train_loss": -27.1583309173584, "global_step": 456461, "epoch": 5499} {"train_loss": -27.115324020385742, "global_step": 456462, "epoch": 5499} {"train_loss": -27.29315757751465, "global_step": 456463, "epoch": 5499} {"train_loss": -27.096643447875977, "global_step": 456464, "epoch": 5499} {"train_loss": -27.129133224487305, "global_step": 456465, "epoch": 5499} {"train_loss": -27.245580673217773, "global_step": 456466, "epoch": 5499} {"train_loss": -26.98707389831543, "global_step": 456467, "epoch": 5499} {"train_loss": -27.450754165649414, "global_step": 456468, "epoch": 5499} {"train_loss": -27.0706844329834, "global_step": 456469, "epoch": 5499} {"train_loss": -26.937788009643555, "global_step": 456470, "epoch": 5499} {"train_loss": -27.36311149597168, "global_step": 456471, "epoch": 5499} {"train_loss": -27.33935546875, "global_step": 456472, "epoch": 5499} {"train_loss": -27.553375244140625, "global_step": 456473, "epoch": 5499} {"train_loss": -27.41656494140625, "global_step": 456474, "epoch": 5499} {"train_loss": -27.5882568359375, "global_step": 456475, "epoch": 5499} {"train_loss": -27.38306999206543, "global_step": 456476, "epoch": 5499} {"train_loss": -27.222522735595703, "global_step": 456477, "epoch": 5499} {"train_loss": -27.195505142211914, "global_step": 456478, "epoch": 5499} {"train_loss": -26.971628189086914, "global_step": 456479, "epoch": 5499} {"train_loss": -26.979663848876953, "global_step": 456480, "epoch": 5499} {"train_loss": -26.92254638671875, "global_step": 456481, "epoch": 5499} {"train_loss": -27.026151657104492, "global_step": 456482, "epoch": 5499} {"train_loss": -27.521581649780273, "global_step": 456483, "epoch": 5499} {"train_loss": -27.23187828063965, "global_step": 456484, "epoch": 5499} {"train_loss": -27.057086944580078, "global_step": 456485, "epoch": 5499} {"train_loss": -27.417524337768555, "global_step": 456486, "epoch": 5499} {"train_loss": -27.141637802124023, "global_step": 456487, "epoch": 5499} {"train_loss": -27.308746337890625, "global_step": 456488, "epoch": 5499} {"train_loss": -27.020221710205078, "global_step": 456489, "epoch": 5499} {"train_loss": -27.207691192626953, "global_step": 456490, "epoch": 5499} {"train_loss": -27.498519897460938, "global_step": 456491, "epoch": 5499} {"train_loss": -27.07736587524414, "global_step": 456492, "epoch": 5499} {"train_loss": -27.06195640563965, "global_step": 456493, "epoch": 5499} {"train_loss": -27.057788848876953, "global_step": 456494, "epoch": 5499} {"train_loss": -26.66981315612793, "global_step": 456495, "epoch": 5499} {"train_loss": -27.215452194213867, "global_step": 456496, "epoch": 5499} {"train_loss": -26.98395347595215, "global_step": 456497, "epoch": 5499} {"train_loss": -27.284353256225586, "global_step": 456498, "epoch": 5499} {"train_loss": -26.996239122137965, "global_step": 456499, "epoch": 5499, "val_loss": 6591209.5} {"train_loss": -26.44269371032715, "global_step": 456500, "epoch": 5500} {"train_loss": -24.92574119567871, "global_step": 456501, "epoch": 5500} {"train_loss": -24.307144165039062, "global_step": 456502, "epoch": 5500} {"train_loss": -26.314559936523438, "global_step": 456503, "epoch": 5500} {"train_loss": -25.199127197265625, "global_step": 456504, "epoch": 5500} {"train_loss": -25.7181453704834, "global_step": 456505, "epoch": 5500} {"train_loss": -26.190505981445312, "global_step": 456506, "epoch": 5500} {"train_loss": -26.05060386657715, "global_step": 456507, "epoch": 5500} {"train_loss": -26.124921798706055, "global_step": 456508, "epoch": 5500} {"train_loss": -26.345224380493164, "global_step": 456509, "epoch": 5500} {"train_loss": -26.48554801940918, "global_step": 456510, "epoch": 5500} {"train_loss": -26.54962158203125, "global_step": 456511, "epoch": 5500} {"train_loss": -26.133752822875977, "global_step": 456512, "epoch": 5500} {"train_loss": -26.316486358642578, "global_step": 456513, "epoch": 5500} {"train_loss": -26.60755729675293, "global_step": 456514, "epoch": 5500} {"train_loss": -26.051471710205078, "global_step": 456515, "epoch": 5500} {"train_loss": -26.37883949279785, "global_step": 456516, "epoch": 5500} {"train_loss": -26.66261863708496, "global_step": 456517, "epoch": 5500} {"train_loss": -26.75356101989746, "global_step": 456518, "epoch": 5500} {"train_loss": -26.697711944580078, "global_step": 456519, "epoch": 5500} {"train_loss": -26.309982299804688, "global_step": 456520, "epoch": 5500} {"train_loss": -26.67988395690918, "global_step": 456521, "epoch": 5500} {"train_loss": -26.48723793029785, "global_step": 456522, "epoch": 5500} {"train_loss": -26.823211669921875, "global_step": 456523, "epoch": 5500} {"train_loss": -26.48831558227539, "global_step": 456524, "epoch": 5500} {"train_loss": -27.012231826782227, "global_step": 456525, "epoch": 5500} {"train_loss": -26.6149845123291, "global_step": 456526, "epoch": 5500} {"train_loss": -27.007080078125, "global_step": 456527, "epoch": 5500} {"train_loss": -26.865381240844727, "global_step": 456528, "epoch": 5500} {"train_loss": -26.672407150268555, "global_step": 456529, "epoch": 5500} {"train_loss": -27.256391525268555, "global_step": 456530, "epoch": 5500} {"train_loss": -27.07742691040039, "global_step": 456531, "epoch": 5500} {"train_loss": -26.871423721313477, "global_step": 456532, "epoch": 5500} {"train_loss": -27.1098575592041, "global_step": 456533, "epoch": 5500} {"train_loss": -26.688459396362305, "global_step": 456534, "epoch": 5500} {"train_loss": -26.99371337890625, "global_step": 456535, "epoch": 5500} {"train_loss": -27.209735870361328, "global_step": 456536, "epoch": 5500} {"train_loss": -27.225183486938477, "global_step": 456537, "epoch": 5500} {"train_loss": -26.812814712524414, "global_step": 456538, "epoch": 5500} {"train_loss": -27.602781295776367, "global_step": 456539, "epoch": 5500} {"train_loss": -27.211780548095703, "global_step": 456540, "epoch": 5500} {"train_loss": -26.949201583862305, "global_step": 456541, "epoch": 5500} {"train_loss": -27.101531982421875, "global_step": 456542, "epoch": 5500} {"train_loss": -27.355310440063477, "global_step": 456543, "epoch": 5500} {"train_loss": -27.028966903686523, "global_step": 456544, "epoch": 5500} {"train_loss": -27.365686416625977, "global_step": 456545, "epoch": 5500} {"train_loss": -27.063140869140625, "global_step": 456546, "epoch": 5500} {"train_loss": -27.446685791015625, "global_step": 456547, "epoch": 5500} {"train_loss": -27.18522071838379, "global_step": 456548, "epoch": 5500} {"train_loss": -27.576740264892578, "global_step": 456549, "epoch": 5500} {"train_loss": -27.271604537963867, "global_step": 456550, "epoch": 5500} {"train_loss": -27.376855850219727, "global_step": 456551, "epoch": 5500} {"train_loss": -27.066679000854492, "global_step": 456552, "epoch": 5500} {"train_loss": -27.158090591430664, "global_step": 456553, "epoch": 5500} {"train_loss": -27.410266876220703, "global_step": 456554, "epoch": 5500} {"train_loss": -27.287988662719727, "global_step": 456555, "epoch": 5500} {"train_loss": -26.850696563720703, "global_step": 456556, "epoch": 5500} {"train_loss": -27.0302677154541, "global_step": 456557, "epoch": 5500} {"train_loss": -26.756855010986328, "global_step": 456558, "epoch": 5500} {"train_loss": -27.25848960876465, "global_step": 456559, "epoch": 5500} {"train_loss": -27.37285804748535, "global_step": 456560, "epoch": 5500} {"train_loss": -27.229772567749023, "global_step": 456561, "epoch": 5500} {"train_loss": -27.298385620117188, "global_step": 456562, "epoch": 5500} {"train_loss": -26.90878677368164, "global_step": 456563, "epoch": 5500} {"train_loss": -27.122961044311523, "global_step": 456564, "epoch": 5500} {"train_loss": -26.74338150024414, "global_step": 456565, "epoch": 5500} {"train_loss": -26.9041805267334, "global_step": 456566, "epoch": 5500} {"train_loss": -27.36554527282715, "global_step": 456567, "epoch": 5500} {"train_loss": -26.571136474609375, "global_step": 456568, "epoch": 5500} {"train_loss": -26.95699119567871, "global_step": 456569, "epoch": 5500} {"train_loss": -26.85991859436035, "global_step": 456570, "epoch": 5500} {"train_loss": -27.068342208862305, "global_step": 456571, "epoch": 5500} {"train_loss": -27.02419090270996, "global_step": 456572, "epoch": 5500} {"train_loss": -26.697973251342773, "global_step": 456573, "epoch": 5500} {"train_loss": -26.851194381713867, "global_step": 456574, "epoch": 5500} {"train_loss": -26.934728622436523, "global_step": 456575, "epoch": 5500} {"train_loss": -27.035505294799805, "global_step": 456576, "epoch": 5500} {"train_loss": -27.035608291625977, "global_step": 456577, "epoch": 5500} {"train_loss": -27.191232681274414, "global_step": 456578, "epoch": 5500} {"train_loss": -27.25069236755371, "global_step": 456579, "epoch": 5500} {"train_loss": -26.92694664001465, "global_step": 456580, "epoch": 5500} {"train_loss": -26.87568473815918, "global_step": 456581, "epoch": 5500} {"train_loss": -26.80843396933682, "global_step": 456582, "epoch": 5500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6638435.0} {"train_loss": -26.319738388061523, "global_step": 456583, "epoch": 5501} {"train_loss": -23.910261154174805, "global_step": 456584, "epoch": 5501} {"train_loss": -20.96414566040039, "global_step": 456585, "epoch": 5501} {"train_loss": -25.048616409301758, "global_step": 456586, "epoch": 5501} {"train_loss": -25.513397216796875, "global_step": 456587, "epoch": 5501} {"train_loss": -24.88498306274414, "global_step": 456588, "epoch": 5501} {"train_loss": -24.82204818725586, "global_step": 456589, "epoch": 5501} {"train_loss": -25.104618072509766, "global_step": 456590, "epoch": 5501} {"train_loss": -25.454221725463867, "global_step": 456591, "epoch": 5501} {"train_loss": -25.792219161987305, "global_step": 456592, "epoch": 5501} {"train_loss": -25.746885299682617, "global_step": 456593, "epoch": 5501} {"train_loss": -25.729475021362305, "global_step": 456594, "epoch": 5501} {"train_loss": -26.102163314819336, "global_step": 456595, "epoch": 5501} {"train_loss": -26.147369384765625, "global_step": 456596, "epoch": 5501} {"train_loss": -25.983627319335938, "global_step": 456597, "epoch": 5501} {"train_loss": -26.010345458984375, "global_step": 456598, "epoch": 5501} {"train_loss": -26.180419921875, "global_step": 456599, "epoch": 5501} {"train_loss": -26.164047241210938, "global_step": 456600, "epoch": 5501} {"train_loss": -26.183237075805664, "global_step": 456601, "epoch": 5501} {"train_loss": -25.8908634185791, "global_step": 456602, "epoch": 5501} {"train_loss": -26.51655387878418, "global_step": 456603, "epoch": 5501} {"train_loss": -26.111600875854492, "global_step": 456604, "epoch": 5501} {"train_loss": -26.312835693359375, "global_step": 456605, "epoch": 5501} {"train_loss": -26.22757339477539, "global_step": 456606, "epoch": 5501} {"train_loss": -26.443256378173828, "global_step": 456607, "epoch": 5501} {"train_loss": -26.58343505859375, "global_step": 456608, "epoch": 5501} {"train_loss": -26.43120765686035, "global_step": 456609, "epoch": 5501} {"train_loss": -26.804401397705078, "global_step": 456610, "epoch": 5501} {"train_loss": -26.71062660217285, "global_step": 456611, "epoch": 5501} {"train_loss": -26.953052520751953, "global_step": 456612, "epoch": 5501} {"train_loss": -26.83685874938965, "global_step": 456613, "epoch": 5501} {"train_loss": -26.744775772094727, "global_step": 456614, "epoch": 5501} {"train_loss": -26.5976619720459, "global_step": 456615, "epoch": 5501} {"train_loss": -26.732437133789062, "global_step": 456616, "epoch": 5501} {"train_loss": -26.85969352722168, "global_step": 456617, "epoch": 5501} {"train_loss": -26.955657958984375, "global_step": 456618, "epoch": 5501} {"train_loss": -27.005456924438477, "global_step": 456619, "epoch": 5501} {"train_loss": -26.484872817993164, "global_step": 456620, "epoch": 5501} {"train_loss": -26.56586265563965, "global_step": 456621, "epoch": 5501} {"train_loss": -26.922834396362305, "global_step": 456622, "epoch": 5501} {"train_loss": -26.68873405456543, "global_step": 456623, "epoch": 5501} {"train_loss": -26.925918579101562, "global_step": 456624, "epoch": 5501} {"train_loss": -26.639942169189453, "global_step": 456625, "epoch": 5501} {"train_loss": -26.9742431640625, "global_step": 456626, "epoch": 5501} {"train_loss": -27.208581924438477, "global_step": 456627, "epoch": 5501} {"train_loss": -26.883071899414062, "global_step": 456628, "epoch": 5501} {"train_loss": -26.9410400390625, "global_step": 456629, "epoch": 5501} {"train_loss": -26.762714385986328, "global_step": 456630, "epoch": 5501} {"train_loss": -26.977466583251953, "global_step": 456631, "epoch": 5501} {"train_loss": -27.081266403198242, "global_step": 456632, "epoch": 5501} {"train_loss": -27.258407592773438, "global_step": 456633, "epoch": 5501} {"train_loss": -26.836410522460938, "global_step": 456634, "epoch": 5501} {"train_loss": -27.236982345581055, "global_step": 456635, "epoch": 5501} {"train_loss": -27.253015518188477, "global_step": 456636, "epoch": 5501} {"train_loss": -26.956323623657227, "global_step": 456637, "epoch": 5501} {"train_loss": -27.252063751220703, "global_step": 456638, "epoch": 5501} {"train_loss": -26.975311279296875, "global_step": 456639, "epoch": 5501} {"train_loss": -27.3499698638916, "global_step": 456640, "epoch": 5501} {"train_loss": -27.26035499572754, "global_step": 456641, "epoch": 5501} {"train_loss": -27.045385360717773, "global_step": 456642, "epoch": 5501} {"train_loss": -27.323522567749023, "global_step": 456643, "epoch": 5501} {"train_loss": -27.121915817260742, "global_step": 456644, "epoch": 5501} {"train_loss": -27.151809692382812, "global_step": 456645, "epoch": 5501} {"train_loss": -27.317951202392578, "global_step": 456646, "epoch": 5501} {"train_loss": -27.1037540435791, "global_step": 456647, "epoch": 5501} {"train_loss": -27.291913986206055, "global_step": 456648, "epoch": 5501} {"train_loss": -27.391172409057617, "global_step": 456649, "epoch": 5501} {"train_loss": -27.196325302124023, "global_step": 456650, "epoch": 5501} {"train_loss": -27.039487838745117, "global_step": 456651, "epoch": 5501} {"train_loss": -27.25079345703125, "global_step": 456652, "epoch": 5501} {"train_loss": -27.455448150634766, "global_step": 456653, "epoch": 5501} {"train_loss": -27.419469833374023, "global_step": 456654, "epoch": 5501} {"train_loss": -27.516942977905273, "global_step": 456655, "epoch": 5501} {"train_loss": -26.82586669921875, "global_step": 456656, "epoch": 5501} {"train_loss": -27.105255126953125, "global_step": 456657, "epoch": 5501} {"train_loss": -27.174484252929688, "global_step": 456658, "epoch": 5501} {"train_loss": -26.843875885009766, "global_step": 456659, "epoch": 5501} {"train_loss": -27.198801040649414, "global_step": 456660, "epoch": 5501} {"train_loss": -27.063385009765625, "global_step": 456661, "epoch": 5501} {"train_loss": -27.072256088256836, "global_step": 456662, "epoch": 5501} {"train_loss": -27.418256759643555, "global_step": 456663, "epoch": 5501} {"train_loss": -27.37131690979004, "global_step": 456664, "epoch": 5501} {"train_loss": -26.602547634078796, "global_step": 456665, "epoch": 5501, "val_loss": 6559210.0} {"train_loss": -25.77284049987793, "global_step": 456666, "epoch": 5502} {"train_loss": -26.766036987304688, "global_step": 456667, "epoch": 5502} {"train_loss": -26.62687110900879, "global_step": 456668, "epoch": 5502} {"train_loss": -26.774038314819336, "global_step": 456669, "epoch": 5502} {"train_loss": -26.234607696533203, "global_step": 456670, "epoch": 5502} {"train_loss": -26.965662002563477, "global_step": 456671, "epoch": 5502} {"train_loss": -26.99561882019043, "global_step": 456672, "epoch": 5502} {"train_loss": -26.382831573486328, "global_step": 456673, "epoch": 5502} {"train_loss": -26.907873153686523, "global_step": 456674, "epoch": 5502} {"train_loss": -26.7557430267334, "global_step": 456675, "epoch": 5502} {"train_loss": -26.500085830688477, "global_step": 456676, "epoch": 5502} {"train_loss": -26.73360252380371, "global_step": 456677, "epoch": 5502} {"train_loss": -26.894575119018555, "global_step": 456678, "epoch": 5502} {"train_loss": -26.725656509399414, "global_step": 456679, "epoch": 5502} {"train_loss": -26.755517959594727, "global_step": 456680, "epoch": 5502} {"train_loss": -27.15223503112793, "global_step": 456681, "epoch": 5502} {"train_loss": -26.820295333862305, "global_step": 456682, "epoch": 5502} {"train_loss": -26.93256187438965, "global_step": 456683, "epoch": 5502} {"train_loss": -26.976531982421875, "global_step": 456684, "epoch": 5502} {"train_loss": -26.737104415893555, "global_step": 456685, "epoch": 5502} {"train_loss": -27.020593643188477, "global_step": 456686, "epoch": 5502} {"train_loss": -26.888959884643555, "global_step": 456687, "epoch": 5502} {"train_loss": -26.820226669311523, "global_step": 456688, "epoch": 5502} {"train_loss": -26.97816276550293, "global_step": 456689, "epoch": 5502} {"train_loss": -27.07672119140625, "global_step": 456690, "epoch": 5502} {"train_loss": -26.63580322265625, "global_step": 456691, "epoch": 5502} {"train_loss": -26.85867691040039, "global_step": 456692, "epoch": 5502} {"train_loss": -27.0820369720459, "global_step": 456693, "epoch": 5502} {"train_loss": -26.835010528564453, "global_step": 456694, "epoch": 5502} {"train_loss": -26.981382369995117, "global_step": 456695, "epoch": 5502} {"train_loss": -27.226806640625, "global_step": 456696, "epoch": 5502} {"train_loss": -26.739683151245117, "global_step": 456697, "epoch": 5502} {"train_loss": -27.177112579345703, "global_step": 456698, "epoch": 5502} {"train_loss": -27.35894775390625, "global_step": 456699, "epoch": 5502} {"train_loss": -27.505041122436523, "global_step": 456700, "epoch": 5502} {"train_loss": -27.39104652404785, "global_step": 456701, "epoch": 5502} {"train_loss": -26.970422744750977, "global_step": 456702, "epoch": 5502} {"train_loss": -27.434537887573242, "global_step": 456703, "epoch": 5502} {"train_loss": -27.2992000579834, "global_step": 456704, "epoch": 5502} {"train_loss": -27.25263786315918, "global_step": 456705, "epoch": 5502} {"train_loss": -27.4385929107666, "global_step": 456706, "epoch": 5502} {"train_loss": -27.14306640625, "global_step": 456707, "epoch": 5502} {"train_loss": -27.220020294189453, "global_step": 456708, "epoch": 5502} {"train_loss": -26.80311393737793, "global_step": 456709, "epoch": 5502} {"train_loss": -26.9561824798584, "global_step": 456710, "epoch": 5502} {"train_loss": -27.08684730529785, "global_step": 456711, "epoch": 5502} {"train_loss": -27.010883331298828, "global_step": 456712, "epoch": 5502} {"train_loss": -27.237262725830078, "global_step": 456713, "epoch": 5502} {"train_loss": -27.065820693969727, "global_step": 456714, "epoch": 5502} {"train_loss": -27.23337173461914, "global_step": 456715, "epoch": 5502} {"train_loss": -26.684682846069336, "global_step": 456716, "epoch": 5502} {"train_loss": -27.081762313842773, "global_step": 456717, "epoch": 5502} {"train_loss": -27.053298950195312, "global_step": 456718, "epoch": 5502} {"train_loss": -27.419645309448242, "global_step": 456719, "epoch": 5502} {"train_loss": -27.092329025268555, "global_step": 456720, "epoch": 5502} {"train_loss": -27.33066177368164, "global_step": 456721, "epoch": 5502} {"train_loss": -27.274682998657227, "global_step": 456722, "epoch": 5502} {"train_loss": -27.285024642944336, "global_step": 456723, "epoch": 5502} {"train_loss": -27.157276153564453, "global_step": 456724, "epoch": 5502} {"train_loss": -27.023374557495117, "global_step": 456725, "epoch": 5502} {"train_loss": -27.20966148376465, "global_step": 456726, "epoch": 5502} {"train_loss": -27.049436569213867, "global_step": 456727, "epoch": 5502} {"train_loss": -27.2291316986084, "global_step": 456728, "epoch": 5502} {"train_loss": -26.88270378112793, "global_step": 456729, "epoch": 5502} {"train_loss": -27.18280601501465, "global_step": 456730, "epoch": 5502} {"train_loss": -26.981969833374023, "global_step": 456731, "epoch": 5502} {"train_loss": -27.12929344177246, "global_step": 456732, "epoch": 5502} {"train_loss": -27.06231117248535, "global_step": 456733, "epoch": 5502} {"train_loss": -27.653928756713867, "global_step": 456734, "epoch": 5502} {"train_loss": -27.28069496154785, "global_step": 456735, "epoch": 5502} {"train_loss": -27.07102394104004, "global_step": 456736, "epoch": 5502} {"train_loss": -26.823522567749023, "global_step": 456737, "epoch": 5502} {"train_loss": -27.146589279174805, "global_step": 456738, "epoch": 5502} {"train_loss": -26.95625114440918, "global_step": 456739, "epoch": 5502} {"train_loss": -26.928024291992188, "global_step": 456740, "epoch": 5502} {"train_loss": -26.97052574157715, "global_step": 456741, "epoch": 5502} {"train_loss": -26.93259620666504, "global_step": 456742, "epoch": 5502} {"train_loss": -27.169143676757812, "global_step": 456743, "epoch": 5502} {"train_loss": -27.3779354095459, "global_step": 456744, "epoch": 5502} {"train_loss": -27.339588165283203, "global_step": 456745, "epoch": 5502} {"train_loss": -26.985687255859375, "global_step": 456746, "epoch": 5502} {"train_loss": -26.86311149597168, "global_step": 456747, "epoch": 5502} {"train_loss": -27.016690978084704, "global_step": 456748, "epoch": 5502, "val_loss": 6590598.0} {"train_loss": -26.532758712768555, "global_step": 456749, "epoch": 5503} {"train_loss": -26.920215606689453, "global_step": 456750, "epoch": 5503} {"train_loss": -26.20716667175293, "global_step": 456751, "epoch": 5503} {"train_loss": -26.246234893798828, "global_step": 456752, "epoch": 5503} {"train_loss": -26.4929256439209, "global_step": 456753, "epoch": 5503} {"train_loss": -26.6190128326416, "global_step": 456754, "epoch": 5503} {"train_loss": -26.1780948638916, "global_step": 456755, "epoch": 5503} {"train_loss": -26.14283561706543, "global_step": 456756, "epoch": 5503} {"train_loss": -27.326032638549805, "global_step": 456757, "epoch": 5503} {"train_loss": -26.2509708404541, "global_step": 456758, "epoch": 5503} {"train_loss": -26.545822143554688, "global_step": 456759, "epoch": 5503} {"train_loss": -26.694395065307617, "global_step": 456760, "epoch": 5503} {"train_loss": -26.684812545776367, "global_step": 456761, "epoch": 5503} {"train_loss": -26.51594352722168, "global_step": 456762, "epoch": 5503} {"train_loss": -26.520675659179688, "global_step": 456763, "epoch": 5503} {"train_loss": -27.052412033081055, "global_step": 456764, "epoch": 5503} {"train_loss": -27.04802894592285, "global_step": 456765, "epoch": 5503} {"train_loss": -26.89463233947754, "global_step": 456766, "epoch": 5503} {"train_loss": -26.582849502563477, "global_step": 456767, "epoch": 5503} {"train_loss": -26.745752334594727, "global_step": 456768, "epoch": 5503} {"train_loss": -26.97216796875, "global_step": 456769, "epoch": 5503} {"train_loss": -26.5025577545166, "global_step": 456770, "epoch": 5503} {"train_loss": -26.582183837890625, "global_step": 456771, "epoch": 5503} {"train_loss": -27.20771598815918, "global_step": 456772, "epoch": 5503} {"train_loss": -26.756345748901367, "global_step": 456773, "epoch": 5503} {"train_loss": -26.94679832458496, "global_step": 456774, "epoch": 5503} {"train_loss": -26.592016220092773, "global_step": 456775, "epoch": 5503} {"train_loss": -26.55897331237793, "global_step": 456776, "epoch": 5503} {"train_loss": -27.244428634643555, "global_step": 456777, "epoch": 5503} {"train_loss": -27.188634872436523, "global_step": 456778, "epoch": 5503} {"train_loss": -27.052148818969727, "global_step": 456779, "epoch": 5503} {"train_loss": -26.81768226623535, "global_step": 456780, "epoch": 5503} {"train_loss": -27.2044734954834, "global_step": 456781, "epoch": 5503} {"train_loss": -26.782819747924805, "global_step": 456782, "epoch": 5503} {"train_loss": -27.067676544189453, "global_step": 456783, "epoch": 5503} {"train_loss": -26.627878189086914, "global_step": 456784, "epoch": 5503} {"train_loss": -27.05714225769043, "global_step": 456785, "epoch": 5503} {"train_loss": -26.97881507873535, "global_step": 456786, "epoch": 5503} {"train_loss": -27.034521102905273, "global_step": 456787, "epoch": 5503} {"train_loss": -26.95659828186035, "global_step": 456788, "epoch": 5503} {"train_loss": -27.145267486572266, "global_step": 456789, "epoch": 5503} {"train_loss": -27.272409439086914, "global_step": 456790, "epoch": 5503} {"train_loss": -27.069257736206055, "global_step": 456791, "epoch": 5503} {"train_loss": -27.30533790588379, "global_step": 456792, "epoch": 5503} {"train_loss": -27.233978271484375, "global_step": 456793, "epoch": 5503} {"train_loss": -27.26711082458496, "global_step": 456794, "epoch": 5503} {"train_loss": -27.189340591430664, "global_step": 456795, "epoch": 5503} {"train_loss": -27.296802520751953, "global_step": 456796, "epoch": 5503} {"train_loss": -27.56133460998535, "global_step": 456797, "epoch": 5503} {"train_loss": -27.38351821899414, "global_step": 456798, "epoch": 5503} {"train_loss": -27.30586051940918, "global_step": 456799, "epoch": 5503} {"train_loss": -27.035085678100586, "global_step": 456800, "epoch": 5503} {"train_loss": -27.185529708862305, "global_step": 456801, "epoch": 5503} {"train_loss": -27.128803253173828, "global_step": 456802, "epoch": 5503} {"train_loss": -27.037755966186523, "global_step": 456803, "epoch": 5503} {"train_loss": -26.93406105041504, "global_step": 456804, "epoch": 5503} {"train_loss": -26.913013458251953, "global_step": 456805, "epoch": 5503} {"train_loss": -26.712860107421875, "global_step": 456806, "epoch": 5503} {"train_loss": -27.26319694519043, "global_step": 456807, "epoch": 5503} {"train_loss": -27.047327041625977, "global_step": 456808, "epoch": 5503} {"train_loss": -26.958295822143555, "global_step": 456809, "epoch": 5503} {"train_loss": -26.963224411010742, "global_step": 456810, "epoch": 5503} {"train_loss": -27.102569580078125, "global_step": 456811, "epoch": 5503} {"train_loss": -27.288782119750977, "global_step": 456812, "epoch": 5503} {"train_loss": -26.638370513916016, "global_step": 456813, "epoch": 5503} {"train_loss": -27.258136749267578, "global_step": 456814, "epoch": 5503} {"train_loss": -27.366132736206055, "global_step": 456815, "epoch": 5503} {"train_loss": -27.0126953125, "global_step": 456816, "epoch": 5503} {"train_loss": -26.76492691040039, "global_step": 456817, "epoch": 5503} {"train_loss": -27.3945255279541, "global_step": 456818, "epoch": 5503} {"train_loss": -26.840560913085938, "global_step": 456819, "epoch": 5503} {"train_loss": -26.928064346313477, "global_step": 456820, "epoch": 5503} {"train_loss": -27.000524520874023, "global_step": 456821, "epoch": 5503} {"train_loss": -26.133426666259766, "global_step": 456822, "epoch": 5503} {"train_loss": -26.729185104370117, "global_step": 456823, "epoch": 5503} {"train_loss": -26.9547176361084, "global_step": 456824, "epoch": 5503} {"train_loss": -26.649274826049805, "global_step": 456825, "epoch": 5503} {"train_loss": -26.393339157104492, "global_step": 456826, "epoch": 5503} {"train_loss": -27.202072143554688, "global_step": 456827, "epoch": 5503} {"train_loss": -26.599863052368164, "global_step": 456828, "epoch": 5503} {"train_loss": -26.846128463745117, "global_step": 456829, "epoch": 5503} {"train_loss": -27.027379989624023, "global_step": 456830, "epoch": 5503} {"train_loss": -26.904545680586114, "global_step": 456831, "epoch": 5503, "val_loss": 6577627.0} {"train_loss": -26.47117042541504, "global_step": 456832, "epoch": 5504} {"train_loss": -26.129064559936523, "global_step": 456833, "epoch": 5504} {"train_loss": -26.558185577392578, "global_step": 456834, "epoch": 5504} {"train_loss": -27.199087142944336, "global_step": 456835, "epoch": 5504} {"train_loss": -26.02583122253418, "global_step": 456836, "epoch": 5504} {"train_loss": -26.32828140258789, "global_step": 456837, "epoch": 5504} {"train_loss": -26.512989044189453, "global_step": 456838, "epoch": 5504} {"train_loss": -26.713214874267578, "global_step": 456839, "epoch": 5504} {"train_loss": -26.597000122070312, "global_step": 456840, "epoch": 5504} {"train_loss": -26.810678482055664, "global_step": 456841, "epoch": 5504} {"train_loss": -26.754230499267578, "global_step": 456842, "epoch": 5504} {"train_loss": -26.870275497436523, "global_step": 456843, "epoch": 5504} {"train_loss": -26.521438598632812, "global_step": 456844, "epoch": 5504} {"train_loss": -26.6978816986084, "global_step": 456845, "epoch": 5504} {"train_loss": -26.906728744506836, "global_step": 456846, "epoch": 5504} {"train_loss": -26.8371524810791, "global_step": 456847, "epoch": 5504} {"train_loss": -26.975814819335938, "global_step": 456848, "epoch": 5504} {"train_loss": -26.611852645874023, "global_step": 456849, "epoch": 5504} {"train_loss": -26.672046661376953, "global_step": 456850, "epoch": 5504} {"train_loss": -27.13264274597168, "global_step": 456851, "epoch": 5504} {"train_loss": -27.237218856811523, "global_step": 456852, "epoch": 5504} {"train_loss": -26.87557029724121, "global_step": 456853, "epoch": 5504} {"train_loss": -26.988920211791992, "global_step": 456854, "epoch": 5504} {"train_loss": -26.786884307861328, "global_step": 456855, "epoch": 5504} {"train_loss": -26.43634605407715, "global_step": 456856, "epoch": 5504} {"train_loss": -26.670392990112305, "global_step": 456857, "epoch": 5504} {"train_loss": -27.247913360595703, "global_step": 456858, "epoch": 5504} {"train_loss": -26.73053550720215, "global_step": 456859, "epoch": 5504} {"train_loss": -26.928049087524414, "global_step": 456860, "epoch": 5504} {"train_loss": -26.8581600189209, "global_step": 456861, "epoch": 5504} {"train_loss": -27.202228546142578, "global_step": 456862, "epoch": 5504} {"train_loss": -27.23944091796875, "global_step": 456863, "epoch": 5504} {"train_loss": -26.95948600769043, "global_step": 456864, "epoch": 5504} {"train_loss": -26.806379318237305, "global_step": 456865, "epoch": 5504} {"train_loss": -27.086713790893555, "global_step": 456866, "epoch": 5504} {"train_loss": -27.128026962280273, "global_step": 456867, "epoch": 5504} {"train_loss": -26.795825958251953, "global_step": 456868, "epoch": 5504} {"train_loss": -26.906530380249023, "global_step": 456869, "epoch": 5504} {"train_loss": -27.263071060180664, "global_step": 456870, "epoch": 5504} {"train_loss": -27.093414306640625, "global_step": 456871, "epoch": 5504} {"train_loss": -27.076696395874023, "global_step": 456872, "epoch": 5504} {"train_loss": -27.141321182250977, "global_step": 456873, "epoch": 5504} {"train_loss": -27.16851806640625, "global_step": 456874, "epoch": 5504} {"train_loss": -27.2857666015625, "global_step": 456875, "epoch": 5504} {"train_loss": -27.308618545532227, "global_step": 456876, "epoch": 5504} {"train_loss": -27.017364501953125, "global_step": 456877, "epoch": 5504} {"train_loss": -26.943347930908203, "global_step": 456878, "epoch": 5504} {"train_loss": -27.275562286376953, "global_step": 456879, "epoch": 5504} {"train_loss": -26.899656295776367, "global_step": 456880, "epoch": 5504} {"train_loss": -27.127004623413086, "global_step": 456881, "epoch": 5504} {"train_loss": -27.173185348510742, "global_step": 456882, "epoch": 5504} {"train_loss": -27.476465225219727, "global_step": 456883, "epoch": 5504} {"train_loss": -27.457122802734375, "global_step": 456884, "epoch": 5504} {"train_loss": -27.090381622314453, "global_step": 456885, "epoch": 5504} {"train_loss": -27.203189849853516, "global_step": 456886, "epoch": 5504} {"train_loss": -27.5639591217041, "global_step": 456887, "epoch": 5504} {"train_loss": -27.707242965698242, "global_step": 456888, "epoch": 5504} {"train_loss": -27.378061294555664, "global_step": 456889, "epoch": 5504} {"train_loss": -27.428180694580078, "global_step": 456890, "epoch": 5504} {"train_loss": -27.266284942626953, "global_step": 456891, "epoch": 5504} {"train_loss": -27.28604507446289, "global_step": 456892, "epoch": 5504} {"train_loss": -26.98758888244629, "global_step": 456893, "epoch": 5504} {"train_loss": -27.054040908813477, "global_step": 456894, "epoch": 5504} {"train_loss": -26.795896530151367, "global_step": 456895, "epoch": 5504} {"train_loss": -27.282581329345703, "global_step": 456896, "epoch": 5504} {"train_loss": -27.420312881469727, "global_step": 456897, "epoch": 5504} {"train_loss": -27.399749755859375, "global_step": 456898, "epoch": 5504} {"train_loss": -27.15165138244629, "global_step": 456899, "epoch": 5504} {"train_loss": -27.400365829467773, "global_step": 456900, "epoch": 5504} {"train_loss": -27.214263916015625, "global_step": 456901, "epoch": 5504} {"train_loss": -26.952442169189453, "global_step": 456902, "epoch": 5504} {"train_loss": -27.24323844909668, "global_step": 456903, "epoch": 5504} {"train_loss": -27.361801147460938, "global_step": 456904, "epoch": 5504} {"train_loss": -26.908279418945312, "global_step": 456905, "epoch": 5504} {"train_loss": -26.97730827331543, "global_step": 456906, "epoch": 5504} {"train_loss": -27.080881118774414, "global_step": 456907, "epoch": 5504} {"train_loss": -27.137775421142578, "global_step": 456908, "epoch": 5504} {"train_loss": -26.905027389526367, "global_step": 456909, "epoch": 5504} {"train_loss": -27.066436767578125, "global_step": 456910, "epoch": 5504} {"train_loss": -26.745344161987305, "global_step": 456911, "epoch": 5504} {"train_loss": -27.542850494384766, "global_step": 456912, "epoch": 5504} {"train_loss": -27.15424156188965, "global_step": 456913, "epoch": 5504} {"train_loss": -26.99720807822354, "global_step": 456914, "epoch": 5504, "val_loss": 6563272.0} {"train_loss": -26.31707763671875, "global_step": 456915, "epoch": 5505} {"train_loss": -25.366262435913086, "global_step": 456916, "epoch": 5505} {"train_loss": -25.942413330078125, "global_step": 456917, "epoch": 5505} {"train_loss": -25.966175079345703, "global_step": 456918, "epoch": 5505} {"train_loss": -25.657001495361328, "global_step": 456919, "epoch": 5505} {"train_loss": -26.659814834594727, "global_step": 456920, "epoch": 5505} {"train_loss": -25.951154708862305, "global_step": 456921, "epoch": 5505} {"train_loss": -26.3924617767334, "global_step": 456922, "epoch": 5505} {"train_loss": -25.85230827331543, "global_step": 456923, "epoch": 5505} {"train_loss": -26.7747802734375, "global_step": 456924, "epoch": 5505} {"train_loss": -26.207605361938477, "global_step": 456925, "epoch": 5505} {"train_loss": -26.529748916625977, "global_step": 456926, "epoch": 5505} {"train_loss": -26.76517677307129, "global_step": 456927, "epoch": 5505} {"train_loss": -26.71306800842285, "global_step": 456928, "epoch": 5505} {"train_loss": -26.786102294921875, "global_step": 456929, "epoch": 5505} {"train_loss": -26.725473403930664, "global_step": 456930, "epoch": 5505} {"train_loss": -26.545669555664062, "global_step": 456931, "epoch": 5505} {"train_loss": -27.06929588317871, "global_step": 456932, "epoch": 5505} {"train_loss": -26.96211051940918, "global_step": 456933, "epoch": 5505} {"train_loss": -26.545734405517578, "global_step": 456934, "epoch": 5505} {"train_loss": -26.909399032592773, "global_step": 456935, "epoch": 5505} {"train_loss": -26.836759567260742, "global_step": 456936, "epoch": 5505} {"train_loss": -26.91936683654785, "global_step": 456937, "epoch": 5505} {"train_loss": -26.767059326171875, "global_step": 456938, "epoch": 5505} {"train_loss": -27.034414291381836, "global_step": 456939, "epoch": 5505} {"train_loss": -26.6408634185791, "global_step": 456940, "epoch": 5505} {"train_loss": -26.85206413269043, "global_step": 456941, "epoch": 5505} {"train_loss": -27.083389282226562, "global_step": 456942, "epoch": 5505} {"train_loss": -26.94828224182129, "global_step": 456943, "epoch": 5505} {"train_loss": -26.632001876831055, "global_step": 456944, "epoch": 5505} {"train_loss": -27.515180587768555, "global_step": 456945, "epoch": 5505} {"train_loss": -26.654315948486328, "global_step": 456946, "epoch": 5505} {"train_loss": -26.813934326171875, "global_step": 456947, "epoch": 5505} {"train_loss": -27.24152946472168, "global_step": 456948, "epoch": 5505} {"train_loss": -26.96290397644043, "global_step": 456949, "epoch": 5505} {"train_loss": -26.88484001159668, "global_step": 456950, "epoch": 5505} {"train_loss": -27.140466690063477, "global_step": 456951, "epoch": 5505} {"train_loss": -26.915658950805664, "global_step": 456952, "epoch": 5505} {"train_loss": -27.168542861938477, "global_step": 456953, "epoch": 5505} {"train_loss": -27.111982345581055, "global_step": 456954, "epoch": 5505} {"train_loss": -26.65774917602539, "global_step": 456955, "epoch": 5505} {"train_loss": -27.447372436523438, "global_step": 456956, "epoch": 5505} {"train_loss": -26.886215209960938, "global_step": 456957, "epoch": 5505} {"train_loss": -27.058679580688477, "global_step": 456958, "epoch": 5505} {"train_loss": -26.743961334228516, "global_step": 456959, "epoch": 5505} {"train_loss": -27.038745880126953, "global_step": 456960, "epoch": 5505} {"train_loss": -27.16266441345215, "global_step": 456961, "epoch": 5505} {"train_loss": -26.883398056030273, "global_step": 456962, "epoch": 5505} {"train_loss": -26.946002960205078, "global_step": 456963, "epoch": 5505} {"train_loss": -27.246784210205078, "global_step": 456964, "epoch": 5505} {"train_loss": -26.81025505065918, "global_step": 456965, "epoch": 5505} {"train_loss": -27.044021606445312, "global_step": 456966, "epoch": 5505} {"train_loss": -27.391942977905273, "global_step": 456967, "epoch": 5505} {"train_loss": -26.932004928588867, "global_step": 456968, "epoch": 5505} {"train_loss": -27.04204750061035, "global_step": 456969, "epoch": 5505} {"train_loss": -26.812580108642578, "global_step": 456970, "epoch": 5505} {"train_loss": -26.875152587890625, "global_step": 456971, "epoch": 5505} {"train_loss": -27.319595336914062, "global_step": 456972, "epoch": 5505} {"train_loss": -27.033100128173828, "global_step": 456973, "epoch": 5505} {"train_loss": -27.068429946899414, "global_step": 456974, "epoch": 5505} {"train_loss": -27.12037467956543, "global_step": 456975, "epoch": 5505} {"train_loss": -27.113513946533203, "global_step": 456976, "epoch": 5505} {"train_loss": -27.079877853393555, "global_step": 456977, "epoch": 5505} {"train_loss": -27.173391342163086, "global_step": 456978, "epoch": 5505} {"train_loss": -27.291250228881836, "global_step": 456979, "epoch": 5505} {"train_loss": -26.911710739135742, "global_step": 456980, "epoch": 5505} {"train_loss": -27.446075439453125, "global_step": 456981, "epoch": 5505} {"train_loss": -27.18048095703125, "global_step": 456982, "epoch": 5505} {"train_loss": -27.12238121032715, "global_step": 456983, "epoch": 5505} {"train_loss": -27.565753936767578, "global_step": 456984, "epoch": 5505} {"train_loss": -27.09854507446289, "global_step": 456985, "epoch": 5505} {"train_loss": -27.176931381225586, "global_step": 456986, "epoch": 5505} {"train_loss": -26.999256134033203, "global_step": 456987, "epoch": 5505} {"train_loss": -27.311986923217773, "global_step": 456988, "epoch": 5505} {"train_loss": -27.170867919921875, "global_step": 456989, "epoch": 5505} {"train_loss": -27.416519165039062, "global_step": 456990, "epoch": 5505} {"train_loss": -27.223358154296875, "global_step": 456991, "epoch": 5505} {"train_loss": -27.446125030517578, "global_step": 456992, "epoch": 5505} {"train_loss": -27.534347534179688, "global_step": 456993, "epoch": 5505} {"train_loss": -27.4184513092041, "global_step": 456994, "epoch": 5505} {"train_loss": -27.675931930541992, "global_step": 456995, "epoch": 5505} {"train_loss": -27.55401611328125, "global_step": 456996, "epoch": 5505} {"train_loss": -26.924624753285602, "global_step": 456997, "epoch": 5505, "val_loss": 6506895.5} {"train_loss": -26.565933227539062, "global_step": 456998, "epoch": 5506} {"train_loss": -26.271728515625, "global_step": 456999, "epoch": 5506} {"train_loss": -26.35762596130371, "global_step": 457000, "epoch": 5506} {"train_loss": -26.47591209411621, "global_step": 457001, "epoch": 5506} {"train_loss": -26.332294464111328, "global_step": 457002, "epoch": 5506} {"train_loss": -26.300140380859375, "global_step": 457003, "epoch": 5506} {"train_loss": -27.057043075561523, "global_step": 457004, "epoch": 5506} {"train_loss": -26.967443466186523, "global_step": 457005, "epoch": 5506} {"train_loss": -26.547943115234375, "global_step": 457006, "epoch": 5506} {"train_loss": -26.71042823791504, "global_step": 457007, "epoch": 5506} {"train_loss": -26.45783805847168, "global_step": 457008, "epoch": 5506} {"train_loss": -26.99271011352539, "global_step": 457009, "epoch": 5506} {"train_loss": -26.93751335144043, "global_step": 457010, "epoch": 5506} {"train_loss": -26.91680908203125, "global_step": 457011, "epoch": 5506} {"train_loss": -26.6794490814209, "global_step": 457012, "epoch": 5506} {"train_loss": -27.165363311767578, "global_step": 457013, "epoch": 5506} {"train_loss": -27.15447998046875, "global_step": 457014, "epoch": 5506} {"train_loss": -26.91546058654785, "global_step": 457015, "epoch": 5506} {"train_loss": -26.670225143432617, "global_step": 457016, "epoch": 5506} {"train_loss": -26.8264217376709, "global_step": 457017, "epoch": 5506} {"train_loss": -26.790380477905273, "global_step": 457018, "epoch": 5506} {"train_loss": -26.7008056640625, "global_step": 457019, "epoch": 5506} {"train_loss": -27.2083740234375, "global_step": 457020, "epoch": 5506} {"train_loss": -27.264942169189453, "global_step": 457021, "epoch": 5506} {"train_loss": -26.7818546295166, "global_step": 457022, "epoch": 5506} {"train_loss": -26.87461280822754, "global_step": 457023, "epoch": 5506} {"train_loss": -27.144262313842773, "global_step": 457024, "epoch": 5506} {"train_loss": -26.765201568603516, "global_step": 457025, "epoch": 5506} {"train_loss": -26.953344345092773, "global_step": 457026, "epoch": 5506} {"train_loss": -27.18684959411621, "global_step": 457027, "epoch": 5506} {"train_loss": -26.935392379760742, "global_step": 457028, "epoch": 5506} {"train_loss": -27.16204261779785, "global_step": 457029, "epoch": 5506} {"train_loss": -27.213354110717773, "global_step": 457030, "epoch": 5506} {"train_loss": -27.042478561401367, "global_step": 457031, "epoch": 5506} {"train_loss": -27.126123428344727, "global_step": 457032, "epoch": 5506} {"train_loss": -27.12923240661621, "global_step": 457033, "epoch": 5506} {"train_loss": -27.178945541381836, "global_step": 457034, "epoch": 5506} {"train_loss": -27.2933292388916, "global_step": 457035, "epoch": 5506} {"train_loss": -27.102375030517578, "global_step": 457036, "epoch": 5506} {"train_loss": -27.022968292236328, "global_step": 457037, "epoch": 5506} {"train_loss": -27.110187530517578, "global_step": 457038, "epoch": 5506} {"train_loss": -27.419097900390625, "global_step": 457039, "epoch": 5506} {"train_loss": -27.407987594604492, "global_step": 457040, "epoch": 5506} {"train_loss": -26.86305046081543, "global_step": 457041, "epoch": 5506} {"train_loss": -27.403066635131836, "global_step": 457042, "epoch": 5506} {"train_loss": -27.366809844970703, "global_step": 457043, "epoch": 5506} {"train_loss": -27.011672973632812, "global_step": 457044, "epoch": 5506} {"train_loss": -27.2904109954834, "global_step": 457045, "epoch": 5506} {"train_loss": -26.948078155517578, "global_step": 457046, "epoch": 5506} {"train_loss": -27.34681510925293, "global_step": 457047, "epoch": 5506} {"train_loss": -26.943531036376953, "global_step": 457048, "epoch": 5506} {"train_loss": -27.383996963500977, "global_step": 457049, "epoch": 5506} {"train_loss": -27.14668083190918, "global_step": 457050, "epoch": 5506} {"train_loss": -26.59222412109375, "global_step": 457051, "epoch": 5506} {"train_loss": -26.812458038330078, "global_step": 457052, "epoch": 5506} {"train_loss": -27.1060733795166, "global_step": 457053, "epoch": 5506} {"train_loss": -26.400115966796875, "global_step": 457054, "epoch": 5506} {"train_loss": -26.9539737701416, "global_step": 457055, "epoch": 5506} {"train_loss": -27.2119197845459, "global_step": 457056, "epoch": 5506} {"train_loss": -27.101343154907227, "global_step": 457057, "epoch": 5506} {"train_loss": -26.957406997680664, "global_step": 457058, "epoch": 5506} {"train_loss": -26.88071060180664, "global_step": 457059, "epoch": 5506} {"train_loss": -26.556110382080078, "global_step": 457060, "epoch": 5506} {"train_loss": -27.206134796142578, "global_step": 457061, "epoch": 5506} {"train_loss": -27.0687198638916, "global_step": 457062, "epoch": 5506} {"train_loss": -26.844268798828125, "global_step": 457063, "epoch": 5506} {"train_loss": -26.963592529296875, "global_step": 457064, "epoch": 5506} {"train_loss": -27.04412841796875, "global_step": 457065, "epoch": 5506} {"train_loss": -27.362945556640625, "global_step": 457066, "epoch": 5506} {"train_loss": -27.56125259399414, "global_step": 457067, "epoch": 5506} {"train_loss": -27.431806564331055, "global_step": 457068, "epoch": 5506} {"train_loss": -27.423721313476562, "global_step": 457069, "epoch": 5506} {"train_loss": -27.142749786376953, "global_step": 457070, "epoch": 5506} {"train_loss": -27.029052734375, "global_step": 457071, "epoch": 5506} {"train_loss": -26.77504539489746, "global_step": 457072, "epoch": 5506} {"train_loss": -27.300079345703125, "global_step": 457073, "epoch": 5506} {"train_loss": -27.44036293029785, "global_step": 457074, "epoch": 5506} {"train_loss": -26.912378311157227, "global_step": 457075, "epoch": 5506} {"train_loss": -27.496673583984375, "global_step": 457076, "epoch": 5506} {"train_loss": -27.59689712524414, "global_step": 457077, "epoch": 5506} {"train_loss": -26.862762451171875, "global_step": 457078, "epoch": 5506} {"train_loss": -27.328771591186523, "global_step": 457079, "epoch": 5506} {"train_loss": -26.993597421301416, "global_step": 457080, "epoch": 5506, "val_loss": 6474897.0} {"train_loss": -26.245092391967773, "global_step": 457081, "epoch": 5507} {"train_loss": -25.584630966186523, "global_step": 457082, "epoch": 5507} {"train_loss": -24.389768600463867, "global_step": 457083, "epoch": 5507} {"train_loss": -26.16472816467285, "global_step": 457084, "epoch": 5507} {"train_loss": -25.997175216674805, "global_step": 457085, "epoch": 5507} {"train_loss": -26.120193481445312, "global_step": 457086, "epoch": 5507} {"train_loss": -25.868244171142578, "global_step": 457087, "epoch": 5507} {"train_loss": -26.29931640625, "global_step": 457088, "epoch": 5507} {"train_loss": -26.066089630126953, "global_step": 457089, "epoch": 5507} {"train_loss": -26.43940544128418, "global_step": 457090, "epoch": 5507} {"train_loss": -26.349536895751953, "global_step": 457091, "epoch": 5507} {"train_loss": -26.968067169189453, "global_step": 457092, "epoch": 5507} {"train_loss": -26.69483757019043, "global_step": 457093, "epoch": 5507} {"train_loss": -26.67426872253418, "global_step": 457094, "epoch": 5507} {"train_loss": -26.762744903564453, "global_step": 457095, "epoch": 5507} {"train_loss": -26.72128677368164, "global_step": 457096, "epoch": 5507} {"train_loss": -26.765310287475586, "global_step": 457097, "epoch": 5507} {"train_loss": -26.735706329345703, "global_step": 457098, "epoch": 5507} {"train_loss": -26.81659507751465, "global_step": 457099, "epoch": 5507} {"train_loss": -26.97265625, "global_step": 457100, "epoch": 5507} {"train_loss": -26.483205795288086, "global_step": 457101, "epoch": 5507} {"train_loss": -26.884265899658203, "global_step": 457102, "epoch": 5507} {"train_loss": -26.831256866455078, "global_step": 457103, "epoch": 5507} {"train_loss": -26.543588638305664, "global_step": 457104, "epoch": 5507} {"train_loss": -26.498640060424805, "global_step": 457105, "epoch": 5507} {"train_loss": -27.011524200439453, "global_step": 457106, "epoch": 5507} {"train_loss": -26.442956924438477, "global_step": 457107, "epoch": 5507} {"train_loss": -26.830347061157227, "global_step": 457108, "epoch": 5507} {"train_loss": -26.951536178588867, "global_step": 457109, "epoch": 5507} {"train_loss": -27.159738540649414, "global_step": 457110, "epoch": 5507} {"train_loss": -26.84058952331543, "global_step": 457111, "epoch": 5507} {"train_loss": -26.83161735534668, "global_step": 457112, "epoch": 5507} {"train_loss": -26.952594757080078, "global_step": 457113, "epoch": 5507} {"train_loss": -27.183507919311523, "global_step": 457114, "epoch": 5507} {"train_loss": -27.065282821655273, "global_step": 457115, "epoch": 5507} {"train_loss": -27.36408042907715, "global_step": 457116, "epoch": 5507} {"train_loss": -26.9765567779541, "global_step": 457117, "epoch": 5507} {"train_loss": -26.86695671081543, "global_step": 457118, "epoch": 5507} {"train_loss": -26.89984130859375, "global_step": 457119, "epoch": 5507} {"train_loss": -27.070068359375, "global_step": 457120, "epoch": 5507} {"train_loss": -27.18464469909668, "global_step": 457121, "epoch": 5507} {"train_loss": -27.309656143188477, "global_step": 457122, "epoch": 5507} {"train_loss": -27.008655548095703, "global_step": 457123, "epoch": 5507} {"train_loss": -26.837629318237305, "global_step": 457124, "epoch": 5507} {"train_loss": -27.442859649658203, "global_step": 457125, "epoch": 5507} {"train_loss": -27.449079513549805, "global_step": 457126, "epoch": 5507} {"train_loss": -27.35699462890625, "global_step": 457127, "epoch": 5507} {"train_loss": -27.296300888061523, "global_step": 457128, "epoch": 5507} {"train_loss": -27.224842071533203, "global_step": 457129, "epoch": 5507} {"train_loss": -27.274250030517578, "global_step": 457130, "epoch": 5507} {"train_loss": -27.1757869720459, "global_step": 457131, "epoch": 5507} {"train_loss": -27.098447799682617, "global_step": 457132, "epoch": 5507} {"train_loss": -27.34669303894043, "global_step": 457133, "epoch": 5507} {"train_loss": -27.38115882873535, "global_step": 457134, "epoch": 5507} {"train_loss": -27.442228317260742, "global_step": 457135, "epoch": 5507} {"train_loss": -27.57892417907715, "global_step": 457136, "epoch": 5507} {"train_loss": -27.275171279907227, "global_step": 457137, "epoch": 5507} {"train_loss": -27.29075050354004, "global_step": 457138, "epoch": 5507} {"train_loss": -27.29103660583496, "global_step": 457139, "epoch": 5507} {"train_loss": -27.143659591674805, "global_step": 457140, "epoch": 5507} {"train_loss": -27.23748207092285, "global_step": 457141, "epoch": 5507} {"train_loss": -27.344898223876953, "global_step": 457142, "epoch": 5507} {"train_loss": -27.026350021362305, "global_step": 457143, "epoch": 5507} {"train_loss": -27.24836540222168, "global_step": 457144, "epoch": 5507} {"train_loss": -26.96785545349121, "global_step": 457145, "epoch": 5507} {"train_loss": -26.866239547729492, "global_step": 457146, "epoch": 5507} {"train_loss": -26.70517921447754, "global_step": 457147, "epoch": 5507} {"train_loss": -26.7745304107666, "global_step": 457148, "epoch": 5507} {"train_loss": -27.226850509643555, "global_step": 457149, "epoch": 5507} {"train_loss": -26.683744430541992, "global_step": 457150, "epoch": 5507} {"train_loss": -26.967920303344727, "global_step": 457151, "epoch": 5507} {"train_loss": -27.285490036010742, "global_step": 457152, "epoch": 5507} {"train_loss": -27.150415420532227, "global_step": 457153, "epoch": 5507} {"train_loss": -26.832983016967773, "global_step": 457154, "epoch": 5507} {"train_loss": -26.452512741088867, "global_step": 457155, "epoch": 5507} {"train_loss": -26.864521026611328, "global_step": 457156, "epoch": 5507} {"train_loss": -27.25446891784668, "global_step": 457157, "epoch": 5507} {"train_loss": -27.633808135986328, "global_step": 457158, "epoch": 5507} {"train_loss": -26.686019897460938, "global_step": 457159, "epoch": 5507} {"train_loss": -27.19051170349121, "global_step": 457160, "epoch": 5507} {"train_loss": -27.049795150756836, "global_step": 457161, "epoch": 5507} {"train_loss": -26.923551559448242, "global_step": 457162, "epoch": 5507} {"train_loss": -26.889823132250683, "global_step": 457163, "epoch": 5507, "val_loss": 6526247.0} {"train_loss": -26.354602813720703, "global_step": 457164, "epoch": 5508} {"train_loss": -25.499557495117188, "global_step": 457165, "epoch": 5508} {"train_loss": -26.101316452026367, "global_step": 457166, "epoch": 5508} {"train_loss": -26.61005973815918, "global_step": 457167, "epoch": 5508} {"train_loss": -26.406661987304688, "global_step": 457168, "epoch": 5508} {"train_loss": -26.5794620513916, "global_step": 457169, "epoch": 5508} {"train_loss": -26.531391143798828, "global_step": 457170, "epoch": 5508} {"train_loss": -26.6066951751709, "global_step": 457171, "epoch": 5508} {"train_loss": -26.482263565063477, "global_step": 457172, "epoch": 5508} {"train_loss": -26.755355834960938, "global_step": 457173, "epoch": 5508} {"train_loss": -26.7753963470459, "global_step": 457174, "epoch": 5508} {"train_loss": -26.511083602905273, "global_step": 457175, "epoch": 5508} {"train_loss": -26.579071044921875, "global_step": 457176, "epoch": 5508} {"train_loss": -26.927417755126953, "global_step": 457177, "epoch": 5508} {"train_loss": -26.87432861328125, "global_step": 457178, "epoch": 5508} {"train_loss": -26.766141891479492, "global_step": 457179, "epoch": 5508} {"train_loss": -26.78724479675293, "global_step": 457180, "epoch": 5508} {"train_loss": -26.84601402282715, "global_step": 457181, "epoch": 5508} {"train_loss": -26.978382110595703, "global_step": 457182, "epoch": 5508} {"train_loss": -26.81937599182129, "global_step": 457183, "epoch": 5508} {"train_loss": -26.827932357788086, "global_step": 457184, "epoch": 5508} {"train_loss": -27.244531631469727, "global_step": 457185, "epoch": 5508} {"train_loss": -26.86983299255371, "global_step": 457186, "epoch": 5508} {"train_loss": -26.831775665283203, "global_step": 457187, "epoch": 5508} {"train_loss": -26.98406410217285, "global_step": 457188, "epoch": 5508} {"train_loss": -26.651105880737305, "global_step": 457189, "epoch": 5508} {"train_loss": -27.180469512939453, "global_step": 457190, "epoch": 5508} {"train_loss": -26.8752498626709, "global_step": 457191, "epoch": 5508} {"train_loss": -26.95781898498535, "global_step": 457192, "epoch": 5508} {"train_loss": -27.164691925048828, "global_step": 457193, "epoch": 5508} {"train_loss": -27.093774795532227, "global_step": 457194, "epoch": 5508} {"train_loss": -26.87080192565918, "global_step": 457195, "epoch": 5508} {"train_loss": -27.36431884765625, "global_step": 457196, "epoch": 5508} {"train_loss": -26.834501266479492, "global_step": 457197, "epoch": 5508} {"train_loss": -27.257131576538086, "global_step": 457198, "epoch": 5508} {"train_loss": -26.897485733032227, "global_step": 457199, "epoch": 5508} {"train_loss": -27.317758560180664, "global_step": 457200, "epoch": 5508} {"train_loss": -27.210163116455078, "global_step": 457201, "epoch": 5508} {"train_loss": -27.096057891845703, "global_step": 457202, "epoch": 5508} {"train_loss": -26.883392333984375, "global_step": 457203, "epoch": 5508} {"train_loss": -27.183881759643555, "global_step": 457204, "epoch": 5508} {"train_loss": -26.921390533447266, "global_step": 457205, "epoch": 5508} {"train_loss": -27.3458251953125, "global_step": 457206, "epoch": 5508} {"train_loss": -26.939178466796875, "global_step": 457207, "epoch": 5508} {"train_loss": -27.22173500061035, "global_step": 457208, "epoch": 5508} {"train_loss": -27.030853271484375, "global_step": 457209, "epoch": 5508} {"train_loss": -26.7404842376709, "global_step": 457210, "epoch": 5508} {"train_loss": -26.90130043029785, "global_step": 457211, "epoch": 5508} {"train_loss": -26.752721786499023, "global_step": 457212, "epoch": 5508} {"train_loss": -27.0227108001709, "global_step": 457213, "epoch": 5508} {"train_loss": -27.351369857788086, "global_step": 457214, "epoch": 5508} {"train_loss": -27.526830673217773, "global_step": 457215, "epoch": 5508} {"train_loss": -27.25933837890625, "global_step": 457216, "epoch": 5508} {"train_loss": -27.273181915283203, "global_step": 457217, "epoch": 5508} {"train_loss": -27.086896896362305, "global_step": 457218, "epoch": 5508} {"train_loss": -27.323862075805664, "global_step": 457219, "epoch": 5508} {"train_loss": -27.385272979736328, "global_step": 457220, "epoch": 5508} {"train_loss": -27.053913116455078, "global_step": 457221, "epoch": 5508} {"train_loss": -27.194549560546875, "global_step": 457222, "epoch": 5508} {"train_loss": -27.3646240234375, "global_step": 457223, "epoch": 5508} {"train_loss": -27.281574249267578, "global_step": 457224, "epoch": 5508} {"train_loss": -26.96766471862793, "global_step": 457225, "epoch": 5508} {"train_loss": -27.188079833984375, "global_step": 457226, "epoch": 5508} {"train_loss": -27.297168731689453, "global_step": 457227, "epoch": 5508} {"train_loss": -26.90549087524414, "global_step": 457228, "epoch": 5508} {"train_loss": -27.38800048828125, "global_step": 457229, "epoch": 5508} {"train_loss": -27.129392623901367, "global_step": 457230, "epoch": 5508} {"train_loss": -27.257471084594727, "global_step": 457231, "epoch": 5508} {"train_loss": -26.872812271118164, "global_step": 457232, "epoch": 5508} {"train_loss": -27.255496978759766, "global_step": 457233, "epoch": 5508} {"train_loss": -27.20441246032715, "global_step": 457234, "epoch": 5508} {"train_loss": -27.12247085571289, "global_step": 457235, "epoch": 5508} {"train_loss": -27.110212326049805, "global_step": 457236, "epoch": 5508} {"train_loss": -27.417510986328125, "global_step": 457237, "epoch": 5508} {"train_loss": -27.12102699279785, "global_step": 457238, "epoch": 5508} {"train_loss": -27.282257080078125, "global_step": 457239, "epoch": 5508} {"train_loss": -27.19721031188965, "global_step": 457240, "epoch": 5508} {"train_loss": -26.99127769470215, "global_step": 457241, "epoch": 5508} {"train_loss": -27.06888198852539, "global_step": 457242, "epoch": 5508} {"train_loss": -26.8617000579834, "global_step": 457243, "epoch": 5508} {"train_loss": -26.96736717224121, "global_step": 457244, "epoch": 5508} {"train_loss": -26.603940963745117, "global_step": 457245, "epoch": 5508} {"train_loss": -26.9765109326466, "global_step": 457246, "epoch": 5508, "val_loss": 6487375.0} {"train_loss": -25.918975830078125, "global_step": 457247, "epoch": 5509} {"train_loss": -26.011716842651367, "global_step": 457248, "epoch": 5509} {"train_loss": -25.753631591796875, "global_step": 457249, "epoch": 5509} {"train_loss": -26.026227951049805, "global_step": 457250, "epoch": 5509} {"train_loss": -26.097137451171875, "global_step": 457251, "epoch": 5509} {"train_loss": -26.549325942993164, "global_step": 457252, "epoch": 5509} {"train_loss": -26.220550537109375, "global_step": 457253, "epoch": 5509} {"train_loss": -26.273849487304688, "global_step": 457254, "epoch": 5509} {"train_loss": -26.26045036315918, "global_step": 457255, "epoch": 5509} {"train_loss": -26.717670440673828, "global_step": 457256, "epoch": 5509} {"train_loss": -26.32366943359375, "global_step": 457257, "epoch": 5509} {"train_loss": -26.955265045166016, "global_step": 457258, "epoch": 5509} {"train_loss": -26.527063369750977, "global_step": 457259, "epoch": 5509} {"train_loss": -26.57581901550293, "global_step": 457260, "epoch": 5509} {"train_loss": -26.77530860900879, "global_step": 457261, "epoch": 5509} {"train_loss": -26.899194717407227, "global_step": 457262, "epoch": 5509} {"train_loss": -26.89325523376465, "global_step": 457263, "epoch": 5509} {"train_loss": -26.796100616455078, "global_step": 457264, "epoch": 5509} {"train_loss": -26.84857749938965, "global_step": 457265, "epoch": 5509} {"train_loss": -26.80784034729004, "global_step": 457266, "epoch": 5509} {"train_loss": -26.87158203125, "global_step": 457267, "epoch": 5509} {"train_loss": -26.979482650756836, "global_step": 457268, "epoch": 5509} {"train_loss": -27.183347702026367, "global_step": 457269, "epoch": 5509} {"train_loss": -26.820972442626953, "global_step": 457270, "epoch": 5509} {"train_loss": -26.963531494140625, "global_step": 457271, "epoch": 5509} {"train_loss": -27.02762222290039, "global_step": 457272, "epoch": 5509} {"train_loss": -26.90472412109375, "global_step": 457273, "epoch": 5509} {"train_loss": -27.261829376220703, "global_step": 457274, "epoch": 5509} {"train_loss": -27.176193237304688, "global_step": 457275, "epoch": 5509} {"train_loss": -27.17779541015625, "global_step": 457276, "epoch": 5509} {"train_loss": -27.026269912719727, "global_step": 457277, "epoch": 5509} {"train_loss": -27.23849868774414, "global_step": 457278, "epoch": 5509} {"train_loss": -26.628589630126953, "global_step": 457279, "epoch": 5509} {"train_loss": -27.02249526977539, "global_step": 457280, "epoch": 5509} {"train_loss": -27.202911376953125, "global_step": 457281, "epoch": 5509} {"train_loss": -27.100004196166992, "global_step": 457282, "epoch": 5509} {"train_loss": -26.993824005126953, "global_step": 457283, "epoch": 5509} {"train_loss": -27.697864532470703, "global_step": 457284, "epoch": 5509} {"train_loss": -26.96622657775879, "global_step": 457285, "epoch": 5509} {"train_loss": -27.012256622314453, "global_step": 457286, "epoch": 5509} {"train_loss": -27.35957145690918, "global_step": 457287, "epoch": 5509} {"train_loss": -26.819549560546875, "global_step": 457288, "epoch": 5509} {"train_loss": -27.340641021728516, "global_step": 457289, "epoch": 5509} {"train_loss": -26.679752349853516, "global_step": 457290, "epoch": 5509} {"train_loss": -26.82004737854004, "global_step": 457291, "epoch": 5509} {"train_loss": -27.230060577392578, "global_step": 457292, "epoch": 5509} {"train_loss": -27.211994171142578, "global_step": 457293, "epoch": 5509} {"train_loss": -26.935638427734375, "global_step": 457294, "epoch": 5509} {"train_loss": -27.175628662109375, "global_step": 457295, "epoch": 5509} {"train_loss": -27.171939849853516, "global_step": 457296, "epoch": 5509} {"train_loss": -26.510602951049805, "global_step": 457297, "epoch": 5509} {"train_loss": -26.99555778503418, "global_step": 457298, "epoch": 5509} {"train_loss": -27.347986221313477, "global_step": 457299, "epoch": 5509} {"train_loss": -27.097869873046875, "global_step": 457300, "epoch": 5509} {"train_loss": -26.728565216064453, "global_step": 457301, "epoch": 5509} {"train_loss": -27.220727920532227, "global_step": 457302, "epoch": 5509} {"train_loss": -27.468463897705078, "global_step": 457303, "epoch": 5509} {"train_loss": -26.72939109802246, "global_step": 457304, "epoch": 5509} {"train_loss": -27.252492904663086, "global_step": 457305, "epoch": 5509} {"train_loss": -26.959625244140625, "global_step": 457306, "epoch": 5509} {"train_loss": -27.175329208374023, "global_step": 457307, "epoch": 5509} {"train_loss": -27.129657745361328, "global_step": 457308, "epoch": 5509} {"train_loss": -27.166004180908203, "global_step": 457309, "epoch": 5509} {"train_loss": -27.253507614135742, "global_step": 457310, "epoch": 5509} {"train_loss": -27.198211669921875, "global_step": 457311, "epoch": 5509} {"train_loss": -27.355838775634766, "global_step": 457312, "epoch": 5509} {"train_loss": -27.19532585144043, "global_step": 457313, "epoch": 5509} {"train_loss": -27.401823043823242, "global_step": 457314, "epoch": 5509} {"train_loss": -27.327505111694336, "global_step": 457315, "epoch": 5509} {"train_loss": -27.41718101501465, "global_step": 457316, "epoch": 5509} {"train_loss": -26.92481803894043, "global_step": 457317, "epoch": 5509} {"train_loss": -27.4300594329834, "global_step": 457318, "epoch": 5509} {"train_loss": -27.06244468688965, "global_step": 457319, "epoch": 5509} {"train_loss": -27.1246395111084, "global_step": 457320, "epoch": 5509} {"train_loss": -27.223031997680664, "global_step": 457321, "epoch": 5509} {"train_loss": -27.370391845703125, "global_step": 457322, "epoch": 5509} {"train_loss": -26.951297760009766, "global_step": 457323, "epoch": 5509} {"train_loss": -27.08881950378418, "global_step": 457324, "epoch": 5509} {"train_loss": -27.004934310913086, "global_step": 457325, "epoch": 5509} {"train_loss": -26.127731323242188, "global_step": 457326, "epoch": 5509} {"train_loss": -26.484455108642578, "global_step": 457327, "epoch": 5509} {"train_loss": -27.144378662109375, "global_step": 457328, "epoch": 5509} {"train_loss": -26.93182039835367, "global_step": 457329, "epoch": 5509, "val_loss": 6552970.0} {"train_loss": -25.288732528686523, "global_step": 457330, "epoch": 5510} {"train_loss": -25.652822494506836, "global_step": 457331, "epoch": 5510} {"train_loss": -26.245798110961914, "global_step": 457332, "epoch": 5510} {"train_loss": -25.623748779296875, "global_step": 457333, "epoch": 5510} {"train_loss": -25.530986785888672, "global_step": 457334, "epoch": 5510} {"train_loss": -26.32132911682129, "global_step": 457335, "epoch": 5510} {"train_loss": -25.919736862182617, "global_step": 457336, "epoch": 5510} {"train_loss": -26.260854721069336, "global_step": 457337, "epoch": 5510} {"train_loss": -26.428638458251953, "global_step": 457338, "epoch": 5510} {"train_loss": -26.150543212890625, "global_step": 457339, "epoch": 5510} {"train_loss": -26.6143856048584, "global_step": 457340, "epoch": 5510} {"train_loss": -26.314359664916992, "global_step": 457341, "epoch": 5510} {"train_loss": -26.036884307861328, "global_step": 457342, "epoch": 5510} {"train_loss": -26.57952880859375, "global_step": 457343, "epoch": 5510} {"train_loss": -26.092742919921875, "global_step": 457344, "epoch": 5510} {"train_loss": -26.040151596069336, "global_step": 457345, "epoch": 5510} {"train_loss": -26.602344512939453, "global_step": 457346, "epoch": 5510} {"train_loss": -26.330270767211914, "global_step": 457347, "epoch": 5510} {"train_loss": -27.1787166595459, "global_step": 457348, "epoch": 5510} {"train_loss": -26.34535026550293, "global_step": 457349, "epoch": 5510} {"train_loss": -26.669803619384766, "global_step": 457350, "epoch": 5510} {"train_loss": -26.42328453063965, "global_step": 457351, "epoch": 5510} {"train_loss": -26.799680709838867, "global_step": 457352, "epoch": 5510} {"train_loss": -26.860830307006836, "global_step": 457353, "epoch": 5510} {"train_loss": -26.71319007873535, "global_step": 457354, "epoch": 5510} {"train_loss": -26.815587997436523, "global_step": 457355, "epoch": 5510} {"train_loss": -26.96339225769043, "global_step": 457356, "epoch": 5510} {"train_loss": -26.759363174438477, "global_step": 457357, "epoch": 5510} {"train_loss": -26.937519073486328, "global_step": 457358, "epoch": 5510} {"train_loss": -26.95039176940918, "global_step": 457359, "epoch": 5510} {"train_loss": -26.855487823486328, "global_step": 457360, "epoch": 5510} {"train_loss": -27.229236602783203, "global_step": 457361, "epoch": 5510} {"train_loss": -26.96482276916504, "global_step": 457362, "epoch": 5510} {"train_loss": -26.984939575195312, "global_step": 457363, "epoch": 5510} {"train_loss": -26.75508689880371, "global_step": 457364, "epoch": 5510} {"train_loss": -26.937253952026367, "global_step": 457365, "epoch": 5510} {"train_loss": -27.158559799194336, "global_step": 457366, "epoch": 5510} {"train_loss": -27.162277221679688, "global_step": 457367, "epoch": 5510} {"train_loss": -27.263931274414062, "global_step": 457368, "epoch": 5510} {"train_loss": -27.410419464111328, "global_step": 457369, "epoch": 5510} {"train_loss": -26.94307518005371, "global_step": 457370, "epoch": 5510} {"train_loss": -27.222009658813477, "global_step": 457371, "epoch": 5510} {"train_loss": -27.30653190612793, "global_step": 457372, "epoch": 5510} {"train_loss": -26.90846061706543, "global_step": 457373, "epoch": 5510} {"train_loss": -27.411209106445312, "global_step": 457374, "epoch": 5510} {"train_loss": -27.483922958374023, "global_step": 457375, "epoch": 5510} {"train_loss": -27.4266300201416, "global_step": 457376, "epoch": 5510} {"train_loss": -27.37969970703125, "global_step": 457377, "epoch": 5510} {"train_loss": -27.421377182006836, "global_step": 457378, "epoch": 5510} {"train_loss": -27.070087432861328, "global_step": 457379, "epoch": 5510} {"train_loss": -27.652917861938477, "global_step": 457380, "epoch": 5510} {"train_loss": -27.49945068359375, "global_step": 457381, "epoch": 5510} {"train_loss": -27.13287925720215, "global_step": 457382, "epoch": 5510} {"train_loss": -27.568103790283203, "global_step": 457383, "epoch": 5510} {"train_loss": -27.404340744018555, "global_step": 457384, "epoch": 5510} {"train_loss": -27.41632080078125, "global_step": 457385, "epoch": 5510} {"train_loss": -27.481611251831055, "global_step": 457386, "epoch": 5510} {"train_loss": -27.2232723236084, "global_step": 457387, "epoch": 5510} {"train_loss": -27.211084365844727, "global_step": 457388, "epoch": 5510} {"train_loss": -27.366540908813477, "global_step": 457389, "epoch": 5510} {"train_loss": -27.578170776367188, "global_step": 457390, "epoch": 5510} {"train_loss": -27.625089645385742, "global_step": 457391, "epoch": 5510} {"train_loss": -27.2265682220459, "global_step": 457392, "epoch": 5510} {"train_loss": -26.5408935546875, "global_step": 457393, "epoch": 5510} {"train_loss": -26.240802764892578, "global_step": 457394, "epoch": 5510} {"train_loss": -25.9144229888916, "global_step": 457395, "epoch": 5510} {"train_loss": -26.449609756469727, "global_step": 457396, "epoch": 5510} {"train_loss": -26.13129234313965, "global_step": 457397, "epoch": 5510} {"train_loss": -25.64057731628418, "global_step": 457398, "epoch": 5510} {"train_loss": -26.527729034423828, "global_step": 457399, "epoch": 5510} {"train_loss": -26.758838653564453, "global_step": 457400, "epoch": 5510} {"train_loss": -26.7979679107666, "global_step": 457401, "epoch": 5510} {"train_loss": -26.73443031311035, "global_step": 457402, "epoch": 5510} {"train_loss": -26.744937896728516, "global_step": 457403, "epoch": 5510} {"train_loss": -26.97248649597168, "global_step": 457404, "epoch": 5510} {"train_loss": -26.82554054260254, "global_step": 457405, "epoch": 5510} {"train_loss": -26.894821166992188, "global_step": 457406, "epoch": 5510} {"train_loss": -26.694421768188477, "global_step": 457407, "epoch": 5510} {"train_loss": -26.83198356628418, "global_step": 457408, "epoch": 5510} {"train_loss": -27.01165199279785, "global_step": 457409, "epoch": 5510} {"train_loss": -27.200769424438477, "global_step": 457410, "epoch": 5510} {"train_loss": -26.7586727142334, "global_step": 457411, "epoch": 5510} {"train_loss": -26.7947980811797, "global_step": 457412, "epoch": 5510, "val_loss": 6525812.0} {"train_loss": -26.832197189331055, "global_step": 457413, "epoch": 5511} {"train_loss": -26.433090209960938, "global_step": 457414, "epoch": 5511} {"train_loss": -26.666006088256836, "global_step": 457415, "epoch": 5511} {"train_loss": -26.937103271484375, "global_step": 457416, "epoch": 5511} {"train_loss": -26.651111602783203, "global_step": 457417, "epoch": 5511} {"train_loss": -26.58759880065918, "global_step": 457418, "epoch": 5511} {"train_loss": -26.74887466430664, "global_step": 457419, "epoch": 5511} {"train_loss": -26.99640464782715, "global_step": 457420, "epoch": 5511} {"train_loss": -26.686872482299805, "global_step": 457421, "epoch": 5511} {"train_loss": -26.775775909423828, "global_step": 457422, "epoch": 5511} {"train_loss": -26.683521270751953, "global_step": 457423, "epoch": 5511} {"train_loss": -26.897069931030273, "global_step": 457424, "epoch": 5511} {"train_loss": -26.61244773864746, "global_step": 457425, "epoch": 5511} {"train_loss": -27.0531005859375, "global_step": 457426, "epoch": 5511} {"train_loss": -27.019439697265625, "global_step": 457427, "epoch": 5511} {"train_loss": -27.32050132751465, "global_step": 457428, "epoch": 5511} {"train_loss": -27.35877799987793, "global_step": 457429, "epoch": 5511} {"train_loss": -26.782758712768555, "global_step": 457430, "epoch": 5511} {"train_loss": -26.69978904724121, "global_step": 457431, "epoch": 5511} {"train_loss": -27.065759658813477, "global_step": 457432, "epoch": 5511} {"train_loss": -27.145349502563477, "global_step": 457433, "epoch": 5511} {"train_loss": -27.0532169342041, "global_step": 457434, "epoch": 5511} {"train_loss": -27.371671676635742, "global_step": 457435, "epoch": 5511} {"train_loss": -27.2677059173584, "global_step": 457436, "epoch": 5511} {"train_loss": -26.859790802001953, "global_step": 457437, "epoch": 5511} {"train_loss": -27.26441764831543, "global_step": 457438, "epoch": 5511} {"train_loss": -26.97084617614746, "global_step": 457439, "epoch": 5511} {"train_loss": -26.828433990478516, "global_step": 457440, "epoch": 5511} {"train_loss": -27.39267349243164, "global_step": 457441, "epoch": 5511} {"train_loss": -27.41708755493164, "global_step": 457442, "epoch": 5511} {"train_loss": -26.954608917236328, "global_step": 457443, "epoch": 5511} {"train_loss": -27.29117774963379, "global_step": 457444, "epoch": 5511} {"train_loss": -27.0716495513916, "global_step": 457445, "epoch": 5511} {"train_loss": -27.3367862701416, "global_step": 457446, "epoch": 5511} {"train_loss": -27.44110679626465, "global_step": 457447, "epoch": 5511} {"train_loss": -26.98837661743164, "global_step": 457448, "epoch": 5511} {"train_loss": -27.126489639282227, "global_step": 457449, "epoch": 5511} {"train_loss": -26.813003540039062, "global_step": 457450, "epoch": 5511} {"train_loss": -26.846601486206055, "global_step": 457451, "epoch": 5511} {"train_loss": -27.051834106445312, "global_step": 457452, "epoch": 5511} {"train_loss": -27.038761138916016, "global_step": 457453, "epoch": 5511} {"train_loss": -26.952396392822266, "global_step": 457454, "epoch": 5511} {"train_loss": -27.058074951171875, "global_step": 457455, "epoch": 5511} {"train_loss": -26.708515167236328, "global_step": 457456, "epoch": 5511} {"train_loss": -27.2485294342041, "global_step": 457457, "epoch": 5511} {"train_loss": -26.8410701751709, "global_step": 457458, "epoch": 5511} {"train_loss": -27.359729766845703, "global_step": 457459, "epoch": 5511} {"train_loss": -27.29774284362793, "global_step": 457460, "epoch": 5511} {"train_loss": -27.084821701049805, "global_step": 457461, "epoch": 5511} {"train_loss": -26.995014190673828, "global_step": 457462, "epoch": 5511} {"train_loss": -26.72222900390625, "global_step": 457463, "epoch": 5511} {"train_loss": -27.10477066040039, "global_step": 457464, "epoch": 5511} {"train_loss": -27.297901153564453, "global_step": 457465, "epoch": 5511} {"train_loss": -26.846866607666016, "global_step": 457466, "epoch": 5511} {"train_loss": -26.528900146484375, "global_step": 457467, "epoch": 5511} {"train_loss": -27.0051326751709, "global_step": 457468, "epoch": 5511} {"train_loss": -26.758569717407227, "global_step": 457469, "epoch": 5511} {"train_loss": -26.19426918029785, "global_step": 457470, "epoch": 5511} {"train_loss": -26.126174926757812, "global_step": 457471, "epoch": 5511} {"train_loss": -26.62220573425293, "global_step": 457472, "epoch": 5511} {"train_loss": -27.11895179748535, "global_step": 457473, "epoch": 5511} {"train_loss": -26.13327980041504, "global_step": 457474, "epoch": 5511} {"train_loss": -26.666624069213867, "global_step": 457475, "epoch": 5511} {"train_loss": -26.555456161499023, "global_step": 457476, "epoch": 5511} {"train_loss": -26.423059463500977, "global_step": 457477, "epoch": 5511} {"train_loss": -26.307300567626953, "global_step": 457478, "epoch": 5511} {"train_loss": -26.937475204467773, "global_step": 457479, "epoch": 5511} {"train_loss": -26.59445571899414, "global_step": 457480, "epoch": 5511} {"train_loss": -26.29803466796875, "global_step": 457481, "epoch": 5511} {"train_loss": -27.392536163330078, "global_step": 457482, "epoch": 5511} {"train_loss": -26.167667388916016, "global_step": 457483, "epoch": 5511} {"train_loss": -27.050634384155273, "global_step": 457484, "epoch": 5511} {"train_loss": -26.742847442626953, "global_step": 457485, "epoch": 5511} {"train_loss": -26.919809341430664, "global_step": 457486, "epoch": 5511} {"train_loss": -27.12529945373535, "global_step": 457487, "epoch": 5511} {"train_loss": -26.81475830078125, "global_step": 457488, "epoch": 5511} {"train_loss": -26.949167251586914, "global_step": 457489, "epoch": 5511} {"train_loss": -27.19091796875, "global_step": 457490, "epoch": 5511} {"train_loss": -26.885046005249023, "global_step": 457491, "epoch": 5511} {"train_loss": -26.6616153717041, "global_step": 457492, "epoch": 5511} {"train_loss": -26.714557647705078, "global_step": 457493, "epoch": 5511} {"train_loss": -27.294076919555664, "global_step": 457494, "epoch": 5511} {"train_loss": -26.903220326067455, "global_step": 457495, "epoch": 5511, "val_loss": 6469887.0} {"train_loss": -26.621564865112305, "global_step": 457496, "epoch": 5512} {"train_loss": -27.085615158081055, "global_step": 457497, "epoch": 5512} {"train_loss": -26.462167739868164, "global_step": 457498, "epoch": 5512} {"train_loss": -26.7248477935791, "global_step": 457499, "epoch": 5512} {"train_loss": -26.89845085144043, "global_step": 457500, "epoch": 5512} {"train_loss": -26.93348503112793, "global_step": 457501, "epoch": 5512} {"train_loss": -26.978443145751953, "global_step": 457502, "epoch": 5512} {"train_loss": -26.768848419189453, "global_step": 457503, "epoch": 5512} {"train_loss": -27.014745712280273, "global_step": 457504, "epoch": 5512} {"train_loss": -26.8478946685791, "global_step": 457505, "epoch": 5512} {"train_loss": -26.934783935546875, "global_step": 457506, "epoch": 5512} {"train_loss": -27.109085083007812, "global_step": 457507, "epoch": 5512} {"train_loss": -27.18324851989746, "global_step": 457508, "epoch": 5512} {"train_loss": -27.313074111938477, "global_step": 457509, "epoch": 5512} {"train_loss": -27.180923461914062, "global_step": 457510, "epoch": 5512} {"train_loss": -27.23890495300293, "global_step": 457511, "epoch": 5512} {"train_loss": -26.90667724609375, "global_step": 457512, "epoch": 5512} {"train_loss": -26.728118896484375, "global_step": 457513, "epoch": 5512} {"train_loss": -26.89371681213379, "global_step": 457514, "epoch": 5512} {"train_loss": -26.8856258392334, "global_step": 457515, "epoch": 5512} {"train_loss": -27.47991943359375, "global_step": 457516, "epoch": 5512} {"train_loss": -27.17889404296875, "global_step": 457517, "epoch": 5512} {"train_loss": -27.43195152282715, "global_step": 457518, "epoch": 5512} {"train_loss": -27.16888999938965, "global_step": 457519, "epoch": 5512} {"train_loss": -27.37162208557129, "global_step": 457520, "epoch": 5512} {"train_loss": -27.305816650390625, "global_step": 457521, "epoch": 5512} {"train_loss": -27.492013931274414, "global_step": 457522, "epoch": 5512} {"train_loss": -27.123559951782227, "global_step": 457523, "epoch": 5512} {"train_loss": -27.06158447265625, "global_step": 457524, "epoch": 5512} {"train_loss": -27.298053741455078, "global_step": 457525, "epoch": 5512} {"train_loss": -26.978845596313477, "global_step": 457526, "epoch": 5512} {"train_loss": -27.19647789001465, "global_step": 457527, "epoch": 5512} {"train_loss": -27.25336265563965, "global_step": 457528, "epoch": 5512} {"train_loss": -27.55338478088379, "global_step": 457529, "epoch": 5512} {"train_loss": -27.273761749267578, "global_step": 457530, "epoch": 5512} {"train_loss": -27.306127548217773, "global_step": 457531, "epoch": 5512} {"train_loss": -27.11268424987793, "global_step": 457532, "epoch": 5512} {"train_loss": -27.0459041595459, "global_step": 457533, "epoch": 5512} {"train_loss": -26.875946044921875, "global_step": 457534, "epoch": 5512} {"train_loss": -26.626195907592773, "global_step": 457535, "epoch": 5512} {"train_loss": -26.98679542541504, "global_step": 457536, "epoch": 5512} {"train_loss": -27.106603622436523, "global_step": 457537, "epoch": 5512} {"train_loss": -27.30885887145996, "global_step": 457538, "epoch": 5512} {"train_loss": -26.962453842163086, "global_step": 457539, "epoch": 5512} {"train_loss": -27.011693954467773, "global_step": 457540, "epoch": 5512} {"train_loss": -27.37653923034668, "global_step": 457541, "epoch": 5512} {"train_loss": -27.001358032226562, "global_step": 457542, "epoch": 5512} {"train_loss": -27.28663444519043, "global_step": 457543, "epoch": 5512} {"train_loss": -27.17042350769043, "global_step": 457544, "epoch": 5512} {"train_loss": -27.375049591064453, "global_step": 457545, "epoch": 5512} {"train_loss": -27.24149513244629, "global_step": 457546, "epoch": 5512} {"train_loss": -27.08892250061035, "global_step": 457547, "epoch": 5512} {"train_loss": -27.193740844726562, "global_step": 457548, "epoch": 5512} {"train_loss": -27.408124923706055, "global_step": 457549, "epoch": 5512} {"train_loss": -27.280126571655273, "global_step": 457550, "epoch": 5512} {"train_loss": -27.202011108398438, "global_step": 457551, "epoch": 5512} {"train_loss": -26.804349899291992, "global_step": 457552, "epoch": 5512} {"train_loss": -27.467519760131836, "global_step": 457553, "epoch": 5512} {"train_loss": -27.434844970703125, "global_step": 457554, "epoch": 5512} {"train_loss": -27.326587677001953, "global_step": 457555, "epoch": 5512} {"train_loss": -27.529462814331055, "global_step": 457556, "epoch": 5512} {"train_loss": -26.90289878845215, "global_step": 457557, "epoch": 5512} {"train_loss": -27.167383193969727, "global_step": 457558, "epoch": 5512} {"train_loss": -26.7050724029541, "global_step": 457559, "epoch": 5512} {"train_loss": -26.99018669128418, "global_step": 457560, "epoch": 5512} {"train_loss": -26.9613037109375, "global_step": 457561, "epoch": 5512} {"train_loss": -27.14832878112793, "global_step": 457562, "epoch": 5512} {"train_loss": -27.150632858276367, "global_step": 457563, "epoch": 5512} {"train_loss": -27.088764190673828, "global_step": 457564, "epoch": 5512} {"train_loss": -26.91615104675293, "global_step": 457565, "epoch": 5512} {"train_loss": -26.920446395874023, "global_step": 457566, "epoch": 5512} {"train_loss": -27.089252471923828, "global_step": 457567, "epoch": 5512} {"train_loss": -26.46834373474121, "global_step": 457568, "epoch": 5512} {"train_loss": -26.88437843322754, "global_step": 457569, "epoch": 5512} {"train_loss": -26.791990280151367, "global_step": 457570, "epoch": 5512} {"train_loss": -27.277597427368164, "global_step": 457571, "epoch": 5512} {"train_loss": -26.849721908569336, "global_step": 457572, "epoch": 5512} {"train_loss": -26.421585083007812, "global_step": 457573, "epoch": 5512} {"train_loss": -26.489547729492188, "global_step": 457574, "epoch": 5512} {"train_loss": -27.333715438842773, "global_step": 457575, "epoch": 5512} {"train_loss": -26.704538345336914, "global_step": 457576, "epoch": 5512} {"train_loss": -26.615081787109375, "global_step": 457577, "epoch": 5512} {"train_loss": -27.0508746641228, "global_step": 457578, "epoch": 5512, "val_loss": 6515833.0} {"train_loss": -27.01112174987793, "global_step": 457579, "epoch": 5513} {"train_loss": -26.37237548828125, "global_step": 457580, "epoch": 5513} {"train_loss": -26.581289291381836, "global_step": 457581, "epoch": 5513} {"train_loss": -26.852243423461914, "global_step": 457582, "epoch": 5513} {"train_loss": -26.672107696533203, "global_step": 457583, "epoch": 5513} {"train_loss": -26.596515655517578, "global_step": 457584, "epoch": 5513} {"train_loss": -26.887821197509766, "global_step": 457585, "epoch": 5513} {"train_loss": -26.719284057617188, "global_step": 457586, "epoch": 5513} {"train_loss": -27.047765731811523, "global_step": 457587, "epoch": 5513} {"train_loss": -26.973896026611328, "global_step": 457588, "epoch": 5513} {"train_loss": -26.763830184936523, "global_step": 457589, "epoch": 5513} {"train_loss": -26.806188583374023, "global_step": 457590, "epoch": 5513} {"train_loss": -26.538267135620117, "global_step": 457591, "epoch": 5513} {"train_loss": -26.924942016601562, "global_step": 457592, "epoch": 5513} {"train_loss": -27.000837326049805, "global_step": 457593, "epoch": 5513} {"train_loss": -26.993305206298828, "global_step": 457594, "epoch": 5513} {"train_loss": -26.776121139526367, "global_step": 457595, "epoch": 5513} {"train_loss": -26.814594268798828, "global_step": 457596, "epoch": 5513} {"train_loss": -26.7049503326416, "global_step": 457597, "epoch": 5513} {"train_loss": -26.995153427124023, "global_step": 457598, "epoch": 5513} {"train_loss": -26.932729721069336, "global_step": 457599, "epoch": 5513} {"train_loss": -26.859561920166016, "global_step": 457600, "epoch": 5513} {"train_loss": -26.815093994140625, "global_step": 457601, "epoch": 5513} {"train_loss": -27.229175567626953, "global_step": 457602, "epoch": 5513} {"train_loss": -26.59498405456543, "global_step": 457603, "epoch": 5513} {"train_loss": -26.8753662109375, "global_step": 457604, "epoch": 5513} {"train_loss": -27.2067928314209, "global_step": 457605, "epoch": 5513} {"train_loss": -27.031204223632812, "global_step": 457606, "epoch": 5513} {"train_loss": -27.195199966430664, "global_step": 457607, "epoch": 5513} {"train_loss": -27.52558708190918, "global_step": 457608, "epoch": 5513} {"train_loss": -26.878799438476562, "global_step": 457609, "epoch": 5513} {"train_loss": -27.084930419921875, "global_step": 457610, "epoch": 5513} {"train_loss": -27.2746639251709, "global_step": 457611, "epoch": 5513} {"train_loss": -27.22108268737793, "global_step": 457612, "epoch": 5513} {"train_loss": -26.936613082885742, "global_step": 457613, "epoch": 5513} {"train_loss": -27.520048141479492, "global_step": 457614, "epoch": 5513} {"train_loss": -27.100378036499023, "global_step": 457615, "epoch": 5513} {"train_loss": -27.100616455078125, "global_step": 457616, "epoch": 5513} {"train_loss": -26.949026107788086, "global_step": 457617, "epoch": 5513} {"train_loss": -27.16086769104004, "global_step": 457618, "epoch": 5513} {"train_loss": -27.2301082611084, "global_step": 457619, "epoch": 5513} {"train_loss": -27.523908615112305, "global_step": 457620, "epoch": 5513} {"train_loss": -27.337635040283203, "global_step": 457621, "epoch": 5513} {"train_loss": -27.34099769592285, "global_step": 457622, "epoch": 5513} {"train_loss": -26.855199813842773, "global_step": 457623, "epoch": 5513} {"train_loss": -27.309833526611328, "global_step": 457624, "epoch": 5513} {"train_loss": -27.576032638549805, "global_step": 457625, "epoch": 5513} {"train_loss": -27.085311889648438, "global_step": 457626, "epoch": 5513} {"train_loss": -27.068653106689453, "global_step": 457627, "epoch": 5513} {"train_loss": -27.29490089416504, "global_step": 457628, "epoch": 5513} {"train_loss": -26.77646255493164, "global_step": 457629, "epoch": 5513} {"train_loss": -27.2838134765625, "global_step": 457630, "epoch": 5513} {"train_loss": -26.914077758789062, "global_step": 457631, "epoch": 5513} {"train_loss": -27.01205825805664, "global_step": 457632, "epoch": 5513} {"train_loss": -27.456928253173828, "global_step": 457633, "epoch": 5513} {"train_loss": -27.054946899414062, "global_step": 457634, "epoch": 5513} {"train_loss": -26.791242599487305, "global_step": 457635, "epoch": 5513} {"train_loss": -27.35166358947754, "global_step": 457636, "epoch": 5513} {"train_loss": -27.44780921936035, "global_step": 457637, "epoch": 5513} {"train_loss": -27.307220458984375, "global_step": 457638, "epoch": 5513} {"train_loss": -27.108428955078125, "global_step": 457639, "epoch": 5513} {"train_loss": -26.570697784423828, "global_step": 457640, "epoch": 5513} {"train_loss": -26.829511642456055, "global_step": 457641, "epoch": 5513} {"train_loss": -27.398639678955078, "global_step": 457642, "epoch": 5513} {"train_loss": -27.161230087280273, "global_step": 457643, "epoch": 5513} {"train_loss": -26.87601661682129, "global_step": 457644, "epoch": 5513} {"train_loss": -26.903852462768555, "global_step": 457645, "epoch": 5513} {"train_loss": -26.699756622314453, "global_step": 457646, "epoch": 5513} {"train_loss": -26.819650650024414, "global_step": 457647, "epoch": 5513} {"train_loss": -26.651676177978516, "global_step": 457648, "epoch": 5513} {"train_loss": -26.7028865814209, "global_step": 457649, "epoch": 5513} {"train_loss": -26.6641902923584, "global_step": 457650, "epoch": 5513} {"train_loss": -27.305341720581055, "global_step": 457651, "epoch": 5513} {"train_loss": -26.87379264831543, "global_step": 457652, "epoch": 5513} {"train_loss": -26.96027183532715, "global_step": 457653, "epoch": 5513} {"train_loss": -27.194595336914062, "global_step": 457654, "epoch": 5513} {"train_loss": -26.957000732421875, "global_step": 457655, "epoch": 5513} {"train_loss": -27.108856201171875, "global_step": 457656, "epoch": 5513} {"train_loss": -27.17146873474121, "global_step": 457657, "epoch": 5513} {"train_loss": -27.577381134033203, "global_step": 457658, "epoch": 5513} {"train_loss": -27.116291046142578, "global_step": 457659, "epoch": 5513} {"train_loss": -27.287397384643555, "global_step": 457660, "epoch": 5513} {"train_loss": -27.027829802179912, "global_step": 457661, "epoch": 5513, "val_loss": 6532877.5} {"train_loss": -26.454181671142578, "global_step": 457662, "epoch": 5514} {"train_loss": -26.16141700744629, "global_step": 457663, "epoch": 5514} {"train_loss": -26.268386840820312, "global_step": 457664, "epoch": 5514} {"train_loss": -26.958847045898438, "global_step": 457665, "epoch": 5514} {"train_loss": -26.020002365112305, "global_step": 457666, "epoch": 5514} {"train_loss": -26.36501121520996, "global_step": 457667, "epoch": 5514} {"train_loss": -26.929651260375977, "global_step": 457668, "epoch": 5514} {"train_loss": -26.3428955078125, "global_step": 457669, "epoch": 5514} {"train_loss": -26.43756103515625, "global_step": 457670, "epoch": 5514} {"train_loss": -27.0405216217041, "global_step": 457671, "epoch": 5514} {"train_loss": -26.835845947265625, "global_step": 457672, "epoch": 5514} {"train_loss": -26.567996978759766, "global_step": 457673, "epoch": 5514} {"train_loss": -26.7197322845459, "global_step": 457674, "epoch": 5514} {"train_loss": -26.80328369140625, "global_step": 457675, "epoch": 5514} {"train_loss": -26.649953842163086, "global_step": 457676, "epoch": 5514} {"train_loss": -26.74189567565918, "global_step": 457677, "epoch": 5514} {"train_loss": -26.8494930267334, "global_step": 457678, "epoch": 5514} {"train_loss": -26.657583236694336, "global_step": 457679, "epoch": 5514} {"train_loss": -27.108386993408203, "global_step": 457680, "epoch": 5514} {"train_loss": -27.044599533081055, "global_step": 457681, "epoch": 5514} {"train_loss": -27.326196670532227, "global_step": 457682, "epoch": 5514} {"train_loss": -26.91194725036621, "global_step": 457683, "epoch": 5514} {"train_loss": -26.993955612182617, "global_step": 457684, "epoch": 5514} {"train_loss": -26.9824161529541, "global_step": 457685, "epoch": 5514} {"train_loss": -27.051538467407227, "global_step": 457686, "epoch": 5514} {"train_loss": -26.92616081237793, "global_step": 457687, "epoch": 5514} {"train_loss": -27.177112579345703, "global_step": 457688, "epoch": 5514} {"train_loss": -26.588932037353516, "global_step": 457689, "epoch": 5514} {"train_loss": -27.26384925842285, "global_step": 457690, "epoch": 5514} {"train_loss": -27.39912223815918, "global_step": 457691, "epoch": 5514} {"train_loss": -27.168533325195312, "global_step": 457692, "epoch": 5514} {"train_loss": -27.050617218017578, "global_step": 457693, "epoch": 5514} {"train_loss": -27.208593368530273, "global_step": 457694, "epoch": 5514} {"train_loss": -27.608922958374023, "global_step": 457695, "epoch": 5514} {"train_loss": -26.978906631469727, "global_step": 457696, "epoch": 5514} {"train_loss": -27.16794776916504, "global_step": 457697, "epoch": 5514} {"train_loss": -27.153919219970703, "global_step": 457698, "epoch": 5514} {"train_loss": -27.376209259033203, "global_step": 457699, "epoch": 5514} {"train_loss": -27.288166046142578, "global_step": 457700, "epoch": 5514} {"train_loss": -27.10808753967285, "global_step": 457701, "epoch": 5514} {"train_loss": -27.10430335998535, "global_step": 457702, "epoch": 5514} {"train_loss": -27.4935245513916, "global_step": 457703, "epoch": 5514} {"train_loss": -27.489511489868164, "global_step": 457704, "epoch": 5514} {"train_loss": -27.559011459350586, "global_step": 457705, "epoch": 5514} {"train_loss": -26.871353149414062, "global_step": 457706, "epoch": 5514} {"train_loss": -27.408893585205078, "global_step": 457707, "epoch": 5514} {"train_loss": -27.194202423095703, "global_step": 457708, "epoch": 5514} {"train_loss": -27.001453399658203, "global_step": 457709, "epoch": 5514} {"train_loss": -27.15349769592285, "global_step": 457710, "epoch": 5514} {"train_loss": -27.005706787109375, "global_step": 457711, "epoch": 5514} {"train_loss": -27.46599769592285, "global_step": 457712, "epoch": 5514} {"train_loss": -26.562549591064453, "global_step": 457713, "epoch": 5514} {"train_loss": -27.64863395690918, "global_step": 457714, "epoch": 5514} {"train_loss": -27.534229278564453, "global_step": 457715, "epoch": 5514} {"train_loss": -27.075653076171875, "global_step": 457716, "epoch": 5514} {"train_loss": -27.266881942749023, "global_step": 457717, "epoch": 5514} {"train_loss": -27.124862670898438, "global_step": 457718, "epoch": 5514} {"train_loss": -26.998579025268555, "global_step": 457719, "epoch": 5514} {"train_loss": -26.666589736938477, "global_step": 457720, "epoch": 5514} {"train_loss": -27.33700942993164, "global_step": 457721, "epoch": 5514} {"train_loss": -27.034107208251953, "global_step": 457722, "epoch": 5514} {"train_loss": -27.024551391601562, "global_step": 457723, "epoch": 5514} {"train_loss": -27.070785522460938, "global_step": 457724, "epoch": 5514} {"train_loss": -27.14717674255371, "global_step": 457725, "epoch": 5514} {"train_loss": -26.841711044311523, "global_step": 457726, "epoch": 5514} {"train_loss": -27.295612335205078, "global_step": 457727, "epoch": 5514} {"train_loss": -27.165454864501953, "global_step": 457728, "epoch": 5514} {"train_loss": -27.17667007446289, "global_step": 457729, "epoch": 5514} {"train_loss": -27.163314819335938, "global_step": 457730, "epoch": 5514} {"train_loss": -27.298688888549805, "global_step": 457731, "epoch": 5514} {"train_loss": -27.25593376159668, "global_step": 457732, "epoch": 5514} {"train_loss": -27.347381591796875, "global_step": 457733, "epoch": 5514} {"train_loss": -27.251575469970703, "global_step": 457734, "epoch": 5514} {"train_loss": -27.126672744750977, "global_step": 457735, "epoch": 5514} {"train_loss": -27.016998291015625, "global_step": 457736, "epoch": 5514} {"train_loss": -27.370107650756836, "global_step": 457737, "epoch": 5514} {"train_loss": -27.0496883392334, "global_step": 457738, "epoch": 5514} {"train_loss": -26.995838165283203, "global_step": 457739, "epoch": 5514} {"train_loss": -27.03680419921875, "global_step": 457740, "epoch": 5514} {"train_loss": -27.310184478759766, "global_step": 457741, "epoch": 5514} {"train_loss": -27.07037353515625, "global_step": 457742, "epoch": 5514} {"train_loss": -26.998010635375977, "global_step": 457743, "epoch": 5514} {"train_loss": -27.04595430213285, "global_step": 457744, "epoch": 5514, "val_loss": 6533136.0} {"train_loss": -26.864826202392578, "global_step": 457745, "epoch": 5515} {"train_loss": -27.144262313842773, "global_step": 457746, "epoch": 5515} {"train_loss": -27.037521362304688, "global_step": 457747, "epoch": 5515} {"train_loss": -26.988656997680664, "global_step": 457748, "epoch": 5515} {"train_loss": -26.85019874572754, "global_step": 457749, "epoch": 5515} {"train_loss": -26.83466148376465, "global_step": 457750, "epoch": 5515} {"train_loss": -26.923131942749023, "global_step": 457751, "epoch": 5515} {"train_loss": -27.20405387878418, "global_step": 457752, "epoch": 5515} {"train_loss": -26.67368507385254, "global_step": 457753, "epoch": 5515} {"train_loss": -26.512786865234375, "global_step": 457754, "epoch": 5515} {"train_loss": -26.7308406829834, "global_step": 457755, "epoch": 5515} {"train_loss": -26.94952964782715, "global_step": 457756, "epoch": 5515} {"train_loss": -27.117202758789062, "global_step": 457757, "epoch": 5515} {"train_loss": -27.093969345092773, "global_step": 457758, "epoch": 5515} {"train_loss": -27.237823486328125, "global_step": 457759, "epoch": 5515} {"train_loss": -26.994672775268555, "global_step": 457760, "epoch": 5515} {"train_loss": -27.441181182861328, "global_step": 457761, "epoch": 5515} {"train_loss": -26.945159912109375, "global_step": 457762, "epoch": 5515} {"train_loss": -26.635583877563477, "global_step": 457763, "epoch": 5515} {"train_loss": -26.78773307800293, "global_step": 457764, "epoch": 5515} {"train_loss": -26.82288932800293, "global_step": 457765, "epoch": 5515} {"train_loss": -27.273727416992188, "global_step": 457766, "epoch": 5515} {"train_loss": -27.054380416870117, "global_step": 457767, "epoch": 5515} {"train_loss": -27.010059356689453, "global_step": 457768, "epoch": 5515} {"train_loss": -26.942209243774414, "global_step": 457769, "epoch": 5515} {"train_loss": -26.898956298828125, "global_step": 457770, "epoch": 5515} {"train_loss": -26.6507625579834, "global_step": 457771, "epoch": 5515} {"train_loss": -26.95989990234375, "global_step": 457772, "epoch": 5515} {"train_loss": -26.937402725219727, "global_step": 457773, "epoch": 5515} {"train_loss": -26.853124618530273, "global_step": 457774, "epoch": 5515} {"train_loss": -26.887311935424805, "global_step": 457775, "epoch": 5515} {"train_loss": -27.151172637939453, "global_step": 457776, "epoch": 5515} {"train_loss": -26.896936416625977, "global_step": 457777, "epoch": 5515} {"train_loss": -26.972885131835938, "global_step": 457778, "epoch": 5515} {"train_loss": -27.04937171936035, "global_step": 457779, "epoch": 5515} {"train_loss": -27.181076049804688, "global_step": 457780, "epoch": 5515} {"train_loss": -27.123449325561523, "global_step": 457781, "epoch": 5515} {"train_loss": -27.27678871154785, "global_step": 457782, "epoch": 5515} {"train_loss": -26.973127365112305, "global_step": 457783, "epoch": 5515} {"train_loss": -27.15394401550293, "global_step": 457784, "epoch": 5515} {"train_loss": -27.38836669921875, "global_step": 457785, "epoch": 5515} {"train_loss": -27.162311553955078, "global_step": 457786, "epoch": 5515} {"train_loss": -27.24002456665039, "global_step": 457787, "epoch": 5515} {"train_loss": -27.25921058654785, "global_step": 457788, "epoch": 5515} {"train_loss": -27.341114044189453, "global_step": 457789, "epoch": 5515} {"train_loss": -27.5709285736084, "global_step": 457790, "epoch": 5515} {"train_loss": -27.249582290649414, "global_step": 457791, "epoch": 5515} {"train_loss": -27.329299926757812, "global_step": 457792, "epoch": 5515} {"train_loss": -26.66135597229004, "global_step": 457793, "epoch": 5515} {"train_loss": -27.26411247253418, "global_step": 457794, "epoch": 5515} {"train_loss": -27.2467098236084, "global_step": 457795, "epoch": 5515} {"train_loss": -27.173908233642578, "global_step": 457796, "epoch": 5515} {"train_loss": -27.042499542236328, "global_step": 457797, "epoch": 5515} {"train_loss": -27.316442489624023, "global_step": 457798, "epoch": 5515} {"train_loss": -27.191608428955078, "global_step": 457799, "epoch": 5515} {"train_loss": -26.87640953063965, "global_step": 457800, "epoch": 5515} {"train_loss": -26.792682647705078, "global_step": 457801, "epoch": 5515} {"train_loss": -26.515527725219727, "global_step": 457802, "epoch": 5515} {"train_loss": -26.81221580505371, "global_step": 457803, "epoch": 5515} {"train_loss": -26.684406280517578, "global_step": 457804, "epoch": 5515} {"train_loss": -27.276464462280273, "global_step": 457805, "epoch": 5515} {"train_loss": -26.34737205505371, "global_step": 457806, "epoch": 5515} {"train_loss": -26.593372344970703, "global_step": 457807, "epoch": 5515} {"train_loss": -27.035568237304688, "global_step": 457808, "epoch": 5515} {"train_loss": -26.71906852722168, "global_step": 457809, "epoch": 5515} {"train_loss": -26.54608154296875, "global_step": 457810, "epoch": 5515} {"train_loss": -27.13093376159668, "global_step": 457811, "epoch": 5515} {"train_loss": -26.37468910217285, "global_step": 457812, "epoch": 5515} {"train_loss": -27.097768783569336, "global_step": 457813, "epoch": 5515} {"train_loss": -26.858978271484375, "global_step": 457814, "epoch": 5515} {"train_loss": -26.928802490234375, "global_step": 457815, "epoch": 5515} {"train_loss": -26.991291046142578, "global_step": 457816, "epoch": 5515} {"train_loss": -27.13877296447754, "global_step": 457817, "epoch": 5515} {"train_loss": -27.243947982788086, "global_step": 457818, "epoch": 5515} {"train_loss": -27.024250030517578, "global_step": 457819, "epoch": 5515} {"train_loss": -27.105798721313477, "global_step": 457820, "epoch": 5515} {"train_loss": -27.2221622467041, "global_step": 457821, "epoch": 5515} {"train_loss": -27.053680419921875, "global_step": 457822, "epoch": 5515} {"train_loss": -27.212753295898438, "global_step": 457823, "epoch": 5515} {"train_loss": -27.085580825805664, "global_step": 457824, "epoch": 5515} {"train_loss": -27.167028427124023, "global_step": 457825, "epoch": 5515} {"train_loss": -27.132543563842773, "global_step": 457826, "epoch": 5515} {"train_loss": -27.009052552372577, "global_step": 457827, "epoch": 5515, "val_loss": 6515239.0} {"train_loss": -27.3067684173584, "global_step": 457828, "epoch": 5516} {"train_loss": -26.580625534057617, "global_step": 457829, "epoch": 5516} {"train_loss": -26.780057907104492, "global_step": 457830, "epoch": 5516} {"train_loss": -27.038625717163086, "global_step": 457831, "epoch": 5516} {"train_loss": -26.549985885620117, "global_step": 457832, "epoch": 5516} {"train_loss": -27.047168731689453, "global_step": 457833, "epoch": 5516} {"train_loss": -26.475143432617188, "global_step": 457834, "epoch": 5516} {"train_loss": -26.334426879882812, "global_step": 457835, "epoch": 5516} {"train_loss": -27.219648361206055, "global_step": 457836, "epoch": 5516} {"train_loss": -27.09263038635254, "global_step": 457837, "epoch": 5516} {"train_loss": -26.801435470581055, "global_step": 457838, "epoch": 5516} {"train_loss": -26.784107208251953, "global_step": 457839, "epoch": 5516} {"train_loss": -26.940946578979492, "global_step": 457840, "epoch": 5516} {"train_loss": -27.307729721069336, "global_step": 457841, "epoch": 5516} {"train_loss": -27.20273780822754, "global_step": 457842, "epoch": 5516} {"train_loss": -26.850757598876953, "global_step": 457843, "epoch": 5516} {"train_loss": -27.279300689697266, "global_step": 457844, "epoch": 5516} {"train_loss": -26.878408432006836, "global_step": 457845, "epoch": 5516} {"train_loss": -27.1110782623291, "global_step": 457846, "epoch": 5516} {"train_loss": -26.75429344177246, "global_step": 457847, "epoch": 5516} {"train_loss": -27.1365909576416, "global_step": 457848, "epoch": 5516} {"train_loss": -27.041669845581055, "global_step": 457849, "epoch": 5516} {"train_loss": -27.033239364624023, "global_step": 457850, "epoch": 5516} {"train_loss": -27.394256591796875, "global_step": 457851, "epoch": 5516} {"train_loss": -27.285064697265625, "global_step": 457852, "epoch": 5516} {"train_loss": -26.92913818359375, "global_step": 457853, "epoch": 5516} {"train_loss": -26.99928092956543, "global_step": 457854, "epoch": 5516} {"train_loss": -27.058197021484375, "global_step": 457855, "epoch": 5516} {"train_loss": -26.962997436523438, "global_step": 457856, "epoch": 5516} {"train_loss": -27.069753646850586, "global_step": 457857, "epoch": 5516} {"train_loss": -26.863534927368164, "global_step": 457858, "epoch": 5516} {"train_loss": -27.0322208404541, "global_step": 457859, "epoch": 5516} {"train_loss": -27.485925674438477, "global_step": 457860, "epoch": 5516} {"train_loss": -26.572782516479492, "global_step": 457861, "epoch": 5516} {"train_loss": -26.696542739868164, "global_step": 457862, "epoch": 5516} {"train_loss": -27.353696823120117, "global_step": 457863, "epoch": 5516} {"train_loss": -27.32744789123535, "global_step": 457864, "epoch": 5516} {"train_loss": -27.07500648498535, "global_step": 457865, "epoch": 5516} {"train_loss": -27.004362106323242, "global_step": 457866, "epoch": 5516} {"train_loss": -26.8966121673584, "global_step": 457867, "epoch": 5516} {"train_loss": -27.208993911743164, "global_step": 457868, "epoch": 5516} {"train_loss": -27.14163589477539, "global_step": 457869, "epoch": 5516} {"train_loss": -27.132287979125977, "global_step": 457870, "epoch": 5516} {"train_loss": -27.038000106811523, "global_step": 457871, "epoch": 5516} {"train_loss": -26.8853759765625, "global_step": 457872, "epoch": 5516} {"train_loss": -26.889617919921875, "global_step": 457873, "epoch": 5516} {"train_loss": -27.300678253173828, "global_step": 457874, "epoch": 5516} {"train_loss": -27.084943771362305, "global_step": 457875, "epoch": 5516} {"train_loss": -27.169784545898438, "global_step": 457876, "epoch": 5516} {"train_loss": -27.0495548248291, "global_step": 457877, "epoch": 5516} {"train_loss": -27.07843017578125, "global_step": 457878, "epoch": 5516} {"train_loss": -27.10371971130371, "global_step": 457879, "epoch": 5516} {"train_loss": -27.086761474609375, "global_step": 457880, "epoch": 5516} {"train_loss": -27.163055419921875, "global_step": 457881, "epoch": 5516} {"train_loss": -27.417890548706055, "global_step": 457882, "epoch": 5516} {"train_loss": -27.525800704956055, "global_step": 457883, "epoch": 5516} {"train_loss": -27.38919448852539, "global_step": 457884, "epoch": 5516} {"train_loss": -27.13228416442871, "global_step": 457885, "epoch": 5516} {"train_loss": -27.113025665283203, "global_step": 457886, "epoch": 5516} {"train_loss": -27.502216339111328, "global_step": 457887, "epoch": 5516} {"train_loss": -27.035810470581055, "global_step": 457888, "epoch": 5516} {"train_loss": -27.056900024414062, "global_step": 457889, "epoch": 5516} {"train_loss": -27.12255859375, "global_step": 457890, "epoch": 5516} {"train_loss": -27.012115478515625, "global_step": 457891, "epoch": 5516} {"train_loss": -27.093149185180664, "global_step": 457892, "epoch": 5516} {"train_loss": -27.267454147338867, "global_step": 457893, "epoch": 5516} {"train_loss": -27.494129180908203, "global_step": 457894, "epoch": 5516} {"train_loss": -26.768468856811523, "global_step": 457895, "epoch": 5516} {"train_loss": -27.294538497924805, "global_step": 457896, "epoch": 5516} {"train_loss": -27.220630645751953, "global_step": 457897, "epoch": 5516} {"train_loss": -27.2119140625, "global_step": 457898, "epoch": 5516} {"train_loss": -26.818939208984375, "global_step": 457899, "epoch": 5516} {"train_loss": -27.17616081237793, "global_step": 457900, "epoch": 5516} {"train_loss": -26.904569625854492, "global_step": 457901, "epoch": 5516} {"train_loss": -27.01118278503418, "global_step": 457902, "epoch": 5516} {"train_loss": -27.39523696899414, "global_step": 457903, "epoch": 5516} {"train_loss": -27.43772315979004, "global_step": 457904, "epoch": 5516} {"train_loss": -27.08485221862793, "global_step": 457905, "epoch": 5516} {"train_loss": -26.99773597717285, "global_step": 457906, "epoch": 5516} {"train_loss": -27.007984161376953, "global_step": 457907, "epoch": 5516} {"train_loss": -27.1054630279541, "global_step": 457908, "epoch": 5516} {"train_loss": -27.3704776763916, "global_step": 457909, "epoch": 5516} {"train_loss": -27.052947009902404, "global_step": 457910, "epoch": 5516, "val_loss": 6540818.0} {"train_loss": -27.0247745513916, "global_step": 457911, "epoch": 5517} {"train_loss": -26.68535804748535, "global_step": 457912, "epoch": 5517} {"train_loss": -26.57195472717285, "global_step": 457913, "epoch": 5517} {"train_loss": -26.8470458984375, "global_step": 457914, "epoch": 5517} {"train_loss": -26.379491806030273, "global_step": 457915, "epoch": 5517} {"train_loss": -26.616479873657227, "global_step": 457916, "epoch": 5517} {"train_loss": -26.280750274658203, "global_step": 457917, "epoch": 5517} {"train_loss": -26.737241744995117, "global_step": 457918, "epoch": 5517} {"train_loss": -26.767990112304688, "global_step": 457919, "epoch": 5517} {"train_loss": -26.175567626953125, "global_step": 457920, "epoch": 5517} {"train_loss": -26.307498931884766, "global_step": 457921, "epoch": 5517} {"train_loss": -26.640073776245117, "global_step": 457922, "epoch": 5517} {"train_loss": -26.637680053710938, "global_step": 457923, "epoch": 5517} {"train_loss": -26.3678035736084, "global_step": 457924, "epoch": 5517} {"train_loss": -26.863021850585938, "global_step": 457925, "epoch": 5517} {"train_loss": -26.995136260986328, "global_step": 457926, "epoch": 5517} {"train_loss": -26.81682777404785, "global_step": 457927, "epoch": 5517} {"train_loss": -26.90655517578125, "global_step": 457928, "epoch": 5517} {"train_loss": -26.9986572265625, "global_step": 457929, "epoch": 5517} {"train_loss": -27.095325469970703, "global_step": 457930, "epoch": 5517} {"train_loss": -27.094663619995117, "global_step": 457931, "epoch": 5517} {"train_loss": -26.628820419311523, "global_step": 457932, "epoch": 5517} {"train_loss": -26.819915771484375, "global_step": 457933, "epoch": 5517} {"train_loss": -26.885272979736328, "global_step": 457934, "epoch": 5517} {"train_loss": -26.92169761657715, "global_step": 457935, "epoch": 5517} {"train_loss": -27.019113540649414, "global_step": 457936, "epoch": 5517} {"train_loss": -26.741418838500977, "global_step": 457937, "epoch": 5517} {"train_loss": -27.327056884765625, "global_step": 457938, "epoch": 5517} {"train_loss": -27.1854305267334, "global_step": 457939, "epoch": 5517} {"train_loss": -27.22719383239746, "global_step": 457940, "epoch": 5517} {"train_loss": -27.2623291015625, "global_step": 457941, "epoch": 5517} {"train_loss": -27.268325805664062, "global_step": 457942, "epoch": 5517} {"train_loss": -26.903980255126953, "global_step": 457943, "epoch": 5517} {"train_loss": -27.575607299804688, "global_step": 457944, "epoch": 5517} {"train_loss": -27.241992950439453, "global_step": 457945, "epoch": 5517} {"train_loss": -27.405115127563477, "global_step": 457946, "epoch": 5517} {"train_loss": -27.133426666259766, "global_step": 457947, "epoch": 5517} {"train_loss": -27.44208335876465, "global_step": 457948, "epoch": 5517} {"train_loss": -27.31147575378418, "global_step": 457949, "epoch": 5517} {"train_loss": -27.12495231628418, "global_step": 457950, "epoch": 5517} {"train_loss": -27.295148849487305, "global_step": 457951, "epoch": 5517} {"train_loss": -27.156707763671875, "global_step": 457952, "epoch": 5517} {"train_loss": -27.308008193969727, "global_step": 457953, "epoch": 5517} {"train_loss": -27.54901123046875, "global_step": 457954, "epoch": 5517} {"train_loss": -27.439634323120117, "global_step": 457955, "epoch": 5517} {"train_loss": -27.12836265563965, "global_step": 457956, "epoch": 5517} {"train_loss": -27.15156364440918, "global_step": 457957, "epoch": 5517} {"train_loss": -27.340208053588867, "global_step": 457958, "epoch": 5517} {"train_loss": -27.209457397460938, "global_step": 457959, "epoch": 5517} {"train_loss": -27.563796997070312, "global_step": 457960, "epoch": 5517} {"train_loss": -27.595487594604492, "global_step": 457961, "epoch": 5517} {"train_loss": -26.927183151245117, "global_step": 457962, "epoch": 5517} {"train_loss": -27.141559600830078, "global_step": 457963, "epoch": 5517} {"train_loss": -26.835174560546875, "global_step": 457964, "epoch": 5517} {"train_loss": -26.59736442565918, "global_step": 457965, "epoch": 5517} {"train_loss": -26.712228775024414, "global_step": 457966, "epoch": 5517} {"train_loss": -26.558984756469727, "global_step": 457967, "epoch": 5517} {"train_loss": -26.97662925720215, "global_step": 457968, "epoch": 5517} {"train_loss": -27.36004066467285, "global_step": 457969, "epoch": 5517} {"train_loss": -27.001239776611328, "global_step": 457970, "epoch": 5517} {"train_loss": -26.432117462158203, "global_step": 457971, "epoch": 5517} {"train_loss": -25.9664306640625, "global_step": 457972, "epoch": 5517} {"train_loss": -25.357791900634766, "global_step": 457973, "epoch": 5517} {"train_loss": -26.5966854095459, "global_step": 457974, "epoch": 5517} {"train_loss": -27.033737182617188, "global_step": 457975, "epoch": 5517} {"train_loss": -26.137948989868164, "global_step": 457976, "epoch": 5517} {"train_loss": -26.505895614624023, "global_step": 457977, "epoch": 5517} {"train_loss": -26.713581085205078, "global_step": 457978, "epoch": 5517} {"train_loss": -26.261356353759766, "global_step": 457979, "epoch": 5517} {"train_loss": -26.708927154541016, "global_step": 457980, "epoch": 5517} {"train_loss": -26.37861442565918, "global_step": 457981, "epoch": 5517} {"train_loss": -26.830244064331055, "global_step": 457982, "epoch": 5517} {"train_loss": -26.991025924682617, "global_step": 457983, "epoch": 5517} {"train_loss": -26.53094482421875, "global_step": 457984, "epoch": 5517} {"train_loss": -26.784849166870117, "global_step": 457985, "epoch": 5517} {"train_loss": -26.629627227783203, "global_step": 457986, "epoch": 5517} {"train_loss": -27.02149772644043, "global_step": 457987, "epoch": 5517} {"train_loss": -26.707843780517578, "global_step": 457988, "epoch": 5517} {"train_loss": -27.102039337158203, "global_step": 457989, "epoch": 5517} {"train_loss": -26.794336318969727, "global_step": 457990, "epoch": 5517} {"train_loss": -26.703638076782227, "global_step": 457991, "epoch": 5517} {"train_loss": -26.99281120300293, "global_step": 457992, "epoch": 5517} {"train_loss": -26.879463655402862, "global_step": 457993, "epoch": 5517, "val_loss": 6576564.5} {"train_loss": -26.90105628967285, "global_step": 457994, "epoch": 5518} {"train_loss": -26.773420333862305, "global_step": 457995, "epoch": 5518} {"train_loss": -26.63105583190918, "global_step": 457996, "epoch": 5518} {"train_loss": -27.337356567382812, "global_step": 457997, "epoch": 5518} {"train_loss": -26.73866081237793, "global_step": 457998, "epoch": 5518} {"train_loss": -27.024595260620117, "global_step": 457999, "epoch": 5518} {"train_loss": -26.62031364440918, "global_step": 458000, "epoch": 5518} {"train_loss": -26.803363800048828, "global_step": 458001, "epoch": 5518} {"train_loss": -26.954030990600586, "global_step": 458002, "epoch": 5518} {"train_loss": -26.948678970336914, "global_step": 458003, "epoch": 5518} {"train_loss": -26.8758487701416, "global_step": 458004, "epoch": 5518} {"train_loss": -26.928531646728516, "global_step": 458005, "epoch": 5518} {"train_loss": -26.952848434448242, "global_step": 458006, "epoch": 5518} {"train_loss": -26.569955825805664, "global_step": 458007, "epoch": 5518} {"train_loss": -27.242584228515625, "global_step": 458008, "epoch": 5518} {"train_loss": -26.710309982299805, "global_step": 458009, "epoch": 5518} {"train_loss": -26.952056884765625, "global_step": 458010, "epoch": 5518} {"train_loss": -26.73895835876465, "global_step": 458011, "epoch": 5518} {"train_loss": -27.21649169921875, "global_step": 458012, "epoch": 5518} {"train_loss": -26.93988037109375, "global_step": 458013, "epoch": 5518} {"train_loss": -26.959796905517578, "global_step": 458014, "epoch": 5518} {"train_loss": -26.953012466430664, "global_step": 458015, "epoch": 5518} {"train_loss": -27.141515731811523, "global_step": 458016, "epoch": 5518} {"train_loss": -26.68896484375, "global_step": 458017, "epoch": 5518} {"train_loss": -27.17238426208496, "global_step": 458018, "epoch": 5518} {"train_loss": -27.288894653320312, "global_step": 458019, "epoch": 5518} {"train_loss": -26.85087013244629, "global_step": 458020, "epoch": 5518} {"train_loss": -26.847631454467773, "global_step": 458021, "epoch": 5518} {"train_loss": -27.44898796081543, "global_step": 458022, "epoch": 5518} {"train_loss": -27.03809928894043, "global_step": 458023, "epoch": 5518} {"train_loss": -27.1700439453125, "global_step": 458024, "epoch": 5518} {"train_loss": -27.043195724487305, "global_step": 458025, "epoch": 5518} {"train_loss": -27.39090919494629, "global_step": 458026, "epoch": 5518} {"train_loss": -27.218137741088867, "global_step": 458027, "epoch": 5518} {"train_loss": -27.4257869720459, "global_step": 458028, "epoch": 5518} {"train_loss": -27.33154296875, "global_step": 458029, "epoch": 5518} {"train_loss": -27.227697372436523, "global_step": 458030, "epoch": 5518} {"train_loss": -27.125762939453125, "global_step": 458031, "epoch": 5518} {"train_loss": -27.00738525390625, "global_step": 458032, "epoch": 5518} {"train_loss": -27.230854034423828, "global_step": 458033, "epoch": 5518} {"train_loss": -27.017133712768555, "global_step": 458034, "epoch": 5518} {"train_loss": -27.286584854125977, "global_step": 458035, "epoch": 5518} {"train_loss": -27.051029205322266, "global_step": 458036, "epoch": 5518} {"train_loss": -27.39223289489746, "global_step": 458037, "epoch": 5518} {"train_loss": -26.578954696655273, "global_step": 458038, "epoch": 5518} {"train_loss": -27.013385772705078, "global_step": 458039, "epoch": 5518} {"train_loss": -27.03058433532715, "global_step": 458040, "epoch": 5518} {"train_loss": -27.110265731811523, "global_step": 458041, "epoch": 5518} {"train_loss": -27.175384521484375, "global_step": 458042, "epoch": 5518} {"train_loss": -27.267438888549805, "global_step": 458043, "epoch": 5518} {"train_loss": -27.240802764892578, "global_step": 458044, "epoch": 5518} {"train_loss": -27.594457626342773, "global_step": 458045, "epoch": 5518} {"train_loss": -27.216400146484375, "global_step": 458046, "epoch": 5518} {"train_loss": -27.053573608398438, "global_step": 458047, "epoch": 5518} {"train_loss": -27.306570053100586, "global_step": 458048, "epoch": 5518} {"train_loss": -27.48798942565918, "global_step": 458049, "epoch": 5518} {"train_loss": -27.087055206298828, "global_step": 458050, "epoch": 5518} {"train_loss": -27.290307998657227, "global_step": 458051, "epoch": 5518} {"train_loss": -27.14777946472168, "global_step": 458052, "epoch": 5518} {"train_loss": -26.68637466430664, "global_step": 458053, "epoch": 5518} {"train_loss": -26.889352798461914, "global_step": 458054, "epoch": 5518} {"train_loss": -27.38100242614746, "global_step": 458055, "epoch": 5518} {"train_loss": -26.896780014038086, "global_step": 458056, "epoch": 5518} {"train_loss": -26.65238380432129, "global_step": 458057, "epoch": 5518} {"train_loss": -27.045068740844727, "global_step": 458058, "epoch": 5518} {"train_loss": -26.942373275756836, "global_step": 458059, "epoch": 5518} {"train_loss": -27.018421173095703, "global_step": 458060, "epoch": 5518} {"train_loss": -26.849048614501953, "global_step": 458061, "epoch": 5518} {"train_loss": -26.85878562927246, "global_step": 458062, "epoch": 5518} {"train_loss": -26.697071075439453, "global_step": 458063, "epoch": 5518} {"train_loss": -27.064054489135742, "global_step": 458064, "epoch": 5518} {"train_loss": -27.23935317993164, "global_step": 458065, "epoch": 5518} {"train_loss": -26.704986572265625, "global_step": 458066, "epoch": 5518} {"train_loss": -26.612958908081055, "global_step": 458067, "epoch": 5518} {"train_loss": -27.401639938354492, "global_step": 458068, "epoch": 5518} {"train_loss": -26.5518798828125, "global_step": 458069, "epoch": 5518} {"train_loss": -27.412845611572266, "global_step": 458070, "epoch": 5518} {"train_loss": -27.139575958251953, "global_step": 458071, "epoch": 5518} {"train_loss": -27.384565353393555, "global_step": 458072, "epoch": 5518} {"train_loss": -27.242298126220703, "global_step": 458073, "epoch": 5518} {"train_loss": -27.37190055847168, "global_step": 458074, "epoch": 5518} {"train_loss": -27.069904327392578, "global_step": 458075, "epoch": 5518} {"train_loss": -27.039820291909827, "global_step": 458076, "epoch": 5518, "val_loss": 6567800.5} {"train_loss": -25.984338760375977, "global_step": 458077, "epoch": 5519} {"train_loss": -24.559566497802734, "global_step": 458078, "epoch": 5519} {"train_loss": -24.87190055847168, "global_step": 458079, "epoch": 5519} {"train_loss": -25.759540557861328, "global_step": 458080, "epoch": 5519} {"train_loss": -25.917627334594727, "global_step": 458081, "epoch": 5519} {"train_loss": -26.205392837524414, "global_step": 458082, "epoch": 5519} {"train_loss": -26.0987491607666, "global_step": 458083, "epoch": 5519} {"train_loss": -26.597925186157227, "global_step": 458084, "epoch": 5519} {"train_loss": -26.28995132446289, "global_step": 458085, "epoch": 5519} {"train_loss": -26.858551025390625, "global_step": 458086, "epoch": 5519} {"train_loss": -26.48404884338379, "global_step": 458087, "epoch": 5519} {"train_loss": -26.48654556274414, "global_step": 458088, "epoch": 5519} {"train_loss": -26.855484008789062, "global_step": 458089, "epoch": 5519} {"train_loss": -26.690210342407227, "global_step": 458090, "epoch": 5519} {"train_loss": -26.671857833862305, "global_step": 458091, "epoch": 5519} {"train_loss": -26.59638786315918, "global_step": 458092, "epoch": 5519} {"train_loss": -26.63332176208496, "global_step": 458093, "epoch": 5519} {"train_loss": -26.664350509643555, "global_step": 458094, "epoch": 5519} {"train_loss": -26.81412696838379, "global_step": 458095, "epoch": 5519} {"train_loss": -26.4730224609375, "global_step": 458096, "epoch": 5519} {"train_loss": -26.93532371520996, "global_step": 458097, "epoch": 5519} {"train_loss": -27.000741958618164, "global_step": 458098, "epoch": 5519} {"train_loss": -26.986835479736328, "global_step": 458099, "epoch": 5519} {"train_loss": -26.7220401763916, "global_step": 458100, "epoch": 5519} {"train_loss": -26.797521591186523, "global_step": 458101, "epoch": 5519} {"train_loss": -26.71353530883789, "global_step": 458102, "epoch": 5519} {"train_loss": -26.73624610900879, "global_step": 458103, "epoch": 5519} {"train_loss": -27.040082931518555, "global_step": 458104, "epoch": 5519} {"train_loss": -27.185998916625977, "global_step": 458105, "epoch": 5519} {"train_loss": -27.074262619018555, "global_step": 458106, "epoch": 5519} {"train_loss": -27.110227584838867, "global_step": 458107, "epoch": 5519} {"train_loss": -26.93833351135254, "global_step": 458108, "epoch": 5519} {"train_loss": -26.720722198486328, "global_step": 458109, "epoch": 5519} {"train_loss": -27.022642135620117, "global_step": 458110, "epoch": 5519} {"train_loss": -27.257902145385742, "global_step": 458111, "epoch": 5519} {"train_loss": -27.227813720703125, "global_step": 458112, "epoch": 5519} {"train_loss": -26.990442276000977, "global_step": 458113, "epoch": 5519} {"train_loss": -27.123876571655273, "global_step": 458114, "epoch": 5519} {"train_loss": -26.9939022064209, "global_step": 458115, "epoch": 5519} {"train_loss": -26.677453994750977, "global_step": 458116, "epoch": 5519} {"train_loss": -26.973440170288086, "global_step": 458117, "epoch": 5519} {"train_loss": -26.812641143798828, "global_step": 458118, "epoch": 5519} {"train_loss": -27.2524471282959, "global_step": 458119, "epoch": 5519} {"train_loss": -27.013086318969727, "global_step": 458120, "epoch": 5519} {"train_loss": -26.678363800048828, "global_step": 458121, "epoch": 5519} {"train_loss": -26.745824813842773, "global_step": 458122, "epoch": 5519} {"train_loss": -26.436182022094727, "global_step": 458123, "epoch": 5519} {"train_loss": -26.940174102783203, "global_step": 458124, "epoch": 5519} {"train_loss": -27.034467697143555, "global_step": 458125, "epoch": 5519} {"train_loss": -27.061203002929688, "global_step": 458126, "epoch": 5519} {"train_loss": -26.762176513671875, "global_step": 458127, "epoch": 5519} {"train_loss": -26.587182998657227, "global_step": 458128, "epoch": 5519} {"train_loss": -26.905181884765625, "global_step": 458129, "epoch": 5519} {"train_loss": -27.05377769470215, "global_step": 458130, "epoch": 5519} {"train_loss": -27.136194229125977, "global_step": 458131, "epoch": 5519} {"train_loss": -27.032922744750977, "global_step": 458132, "epoch": 5519} {"train_loss": -26.834604263305664, "global_step": 458133, "epoch": 5519} {"train_loss": -27.294376373291016, "global_step": 458134, "epoch": 5519} {"train_loss": -27.038705825805664, "global_step": 458135, "epoch": 5519} {"train_loss": -27.431608200073242, "global_step": 458136, "epoch": 5519} {"train_loss": -26.913482666015625, "global_step": 458137, "epoch": 5519} {"train_loss": -27.343061447143555, "global_step": 458138, "epoch": 5519} {"train_loss": -26.93902587890625, "global_step": 458139, "epoch": 5519} {"train_loss": -27.46352195739746, "global_step": 458140, "epoch": 5519} {"train_loss": -26.94752311706543, "global_step": 458141, "epoch": 5519} {"train_loss": -27.22674560546875, "global_step": 458142, "epoch": 5519} {"train_loss": -26.746667861938477, "global_step": 458143, "epoch": 5519} {"train_loss": -26.6834774017334, "global_step": 458144, "epoch": 5519} {"train_loss": -27.07163429260254, "global_step": 458145, "epoch": 5519} {"train_loss": -27.073373794555664, "global_step": 458146, "epoch": 5519} {"train_loss": -27.257001876831055, "global_step": 458147, "epoch": 5519} {"train_loss": -27.101587295532227, "global_step": 458148, "epoch": 5519} {"train_loss": -26.910734176635742, "global_step": 458149, "epoch": 5519} {"train_loss": -27.532285690307617, "global_step": 458150, "epoch": 5519} {"train_loss": -27.301183700561523, "global_step": 458151, "epoch": 5519} {"train_loss": -27.208389282226562, "global_step": 458152, "epoch": 5519} {"train_loss": -27.20426368713379, "global_step": 458153, "epoch": 5519} {"train_loss": -27.203800201416016, "global_step": 458154, "epoch": 5519} {"train_loss": -27.49103355407715, "global_step": 458155, "epoch": 5519} {"train_loss": -27.018463134765625, "global_step": 458156, "epoch": 5519} {"train_loss": -27.253324508666992, "global_step": 458157, "epoch": 5519} {"train_loss": -27.327360153198242, "global_step": 458158, "epoch": 5519} {"train_loss": -26.83555892576654, "global_step": 458159, "epoch": 5519, "val_loss": 6575321.5} {"train_loss": -26.7216854095459, "global_step": 458160, "epoch": 5520} {"train_loss": -26.54612159729004, "global_step": 458161, "epoch": 5520} {"train_loss": -26.867462158203125, "global_step": 458162, "epoch": 5520} {"train_loss": -26.589487075805664, "global_step": 458163, "epoch": 5520} {"train_loss": -26.59235954284668, "global_step": 458164, "epoch": 5520} {"train_loss": -25.9833927154541, "global_step": 458165, "epoch": 5520} {"train_loss": -26.409561157226562, "global_step": 458166, "epoch": 5520} {"train_loss": -26.150304794311523, "global_step": 458167, "epoch": 5520} {"train_loss": -26.26165771484375, "global_step": 458168, "epoch": 5520} {"train_loss": -26.4279842376709, "global_step": 458169, "epoch": 5520} {"train_loss": -26.73480224609375, "global_step": 458170, "epoch": 5520} {"train_loss": -26.74738883972168, "global_step": 458171, "epoch": 5520} {"train_loss": -26.377582550048828, "global_step": 458172, "epoch": 5520} {"train_loss": -26.83278465270996, "global_step": 458173, "epoch": 5520} {"train_loss": -27.00078773498535, "global_step": 458174, "epoch": 5520} {"train_loss": -26.724552154541016, "global_step": 458175, "epoch": 5520} {"train_loss": -26.78400230407715, "global_step": 458176, "epoch": 5520} {"train_loss": -26.799909591674805, "global_step": 458177, "epoch": 5520} {"train_loss": -26.841527938842773, "global_step": 458178, "epoch": 5520} {"train_loss": -27.23390007019043, "global_step": 458179, "epoch": 5520} {"train_loss": -26.694196701049805, "global_step": 458180, "epoch": 5520} {"train_loss": -26.766408920288086, "global_step": 458181, "epoch": 5520} {"train_loss": -26.767974853515625, "global_step": 458182, "epoch": 5520} {"train_loss": -26.821802139282227, "global_step": 458183, "epoch": 5520} {"train_loss": -26.968982696533203, "global_step": 458184, "epoch": 5520} {"train_loss": -26.712705612182617, "global_step": 458185, "epoch": 5520} {"train_loss": -27.337987899780273, "global_step": 458186, "epoch": 5520} {"train_loss": -27.103626251220703, "global_step": 458187, "epoch": 5520} {"train_loss": -27.107633590698242, "global_step": 458188, "epoch": 5520} {"train_loss": -27.004514694213867, "global_step": 458189, "epoch": 5520} {"train_loss": -26.91619300842285, "global_step": 458190, "epoch": 5520} {"train_loss": -27.389591217041016, "global_step": 458191, "epoch": 5520} {"train_loss": -27.150854110717773, "global_step": 458192, "epoch": 5520} {"train_loss": -27.05990982055664, "global_step": 458193, "epoch": 5520} {"train_loss": -27.345539093017578, "global_step": 458194, "epoch": 5520} {"train_loss": -27.62000846862793, "global_step": 458195, "epoch": 5520} {"train_loss": -27.12061882019043, "global_step": 458196, "epoch": 5520} {"train_loss": -27.304962158203125, "global_step": 458197, "epoch": 5520} {"train_loss": -27.406265258789062, "global_step": 458198, "epoch": 5520} {"train_loss": -27.211654663085938, "global_step": 458199, "epoch": 5520} {"train_loss": -27.5343074798584, "global_step": 458200, "epoch": 5520} {"train_loss": -27.11846923828125, "global_step": 458201, "epoch": 5520} {"train_loss": -27.5489559173584, "global_step": 458202, "epoch": 5520} {"train_loss": -27.125635147094727, "global_step": 458203, "epoch": 5520} {"train_loss": -27.497156143188477, "global_step": 458204, "epoch": 5520} {"train_loss": -27.341278076171875, "global_step": 458205, "epoch": 5520} {"train_loss": -27.22047233581543, "global_step": 458206, "epoch": 5520} {"train_loss": -27.204797744750977, "global_step": 458207, "epoch": 5520} {"train_loss": -27.370065689086914, "global_step": 458208, "epoch": 5520} {"train_loss": -27.293676376342773, "global_step": 458209, "epoch": 5520} {"train_loss": -27.134977340698242, "global_step": 458210, "epoch": 5520} {"train_loss": -27.5930233001709, "global_step": 458211, "epoch": 5520} {"train_loss": -27.5086727142334, "global_step": 458212, "epoch": 5520} {"train_loss": -27.481937408447266, "global_step": 458213, "epoch": 5520} {"train_loss": -27.349807739257812, "global_step": 458214, "epoch": 5520} {"train_loss": -27.29384422302246, "global_step": 458215, "epoch": 5520} {"train_loss": -26.65359878540039, "global_step": 458216, "epoch": 5520} {"train_loss": -25.450647354125977, "global_step": 458217, "epoch": 5520} {"train_loss": -23.472951889038086, "global_step": 458218, "epoch": 5520} {"train_loss": -24.463743209838867, "global_step": 458219, "epoch": 5520} {"train_loss": -25.366727828979492, "global_step": 458220, "epoch": 5520} {"train_loss": -25.73396110534668, "global_step": 458221, "epoch": 5520} {"train_loss": -25.47193717956543, "global_step": 458222, "epoch": 5520} {"train_loss": -25.97149085998535, "global_step": 458223, "epoch": 5520} {"train_loss": -25.635282516479492, "global_step": 458224, "epoch": 5520} {"train_loss": -26.11612319946289, "global_step": 458225, "epoch": 5520} {"train_loss": -25.968677520751953, "global_step": 458226, "epoch": 5520} {"train_loss": -26.661523818969727, "global_step": 458227, "epoch": 5520} {"train_loss": -26.30217933654785, "global_step": 458228, "epoch": 5520} {"train_loss": -26.01193618774414, "global_step": 458229, "epoch": 5520} {"train_loss": -26.493982315063477, "global_step": 458230, "epoch": 5520} {"train_loss": -26.786527633666992, "global_step": 458231, "epoch": 5520} {"train_loss": -26.098047256469727, "global_step": 458232, "epoch": 5520} {"train_loss": -26.5435848236084, "global_step": 458233, "epoch": 5520} {"train_loss": -26.944425582885742, "global_step": 458234, "epoch": 5520} {"train_loss": -26.359777450561523, "global_step": 458235, "epoch": 5520} {"train_loss": -26.817707061767578, "global_step": 458236, "epoch": 5520} {"train_loss": -26.726003646850586, "global_step": 458237, "epoch": 5520} {"train_loss": -26.4866943359375, "global_step": 458238, "epoch": 5520} {"train_loss": -26.539579391479492, "global_step": 458239, "epoch": 5520} {"train_loss": -27.028039932250977, "global_step": 458240, "epoch": 5520} {"train_loss": -26.125324249267578, "global_step": 458241, "epoch": 5520} {"train_loss": -26.7158254830234, "global_step": 458242, "epoch": 5520, "val_loss": 6566015.0} {"train_loss": -26.58559226989746, "global_step": 458243, "epoch": 5521} {"train_loss": -26.562280654907227, "global_step": 458244, "epoch": 5521} {"train_loss": -26.511566162109375, "global_step": 458245, "epoch": 5521} {"train_loss": -26.86683464050293, "global_step": 458246, "epoch": 5521} {"train_loss": -26.856054306030273, "global_step": 458247, "epoch": 5521} {"train_loss": -26.7281551361084, "global_step": 458248, "epoch": 5521} {"train_loss": -26.809736251831055, "global_step": 458249, "epoch": 5521} {"train_loss": -26.52606773376465, "global_step": 458250, "epoch": 5521} {"train_loss": -26.739465713500977, "global_step": 458251, "epoch": 5521} {"train_loss": -26.8017578125, "global_step": 458252, "epoch": 5521} {"train_loss": -26.879568099975586, "global_step": 458253, "epoch": 5521} {"train_loss": -27.021982192993164, "global_step": 458254, "epoch": 5521} {"train_loss": -27.078155517578125, "global_step": 458255, "epoch": 5521} {"train_loss": -27.0816650390625, "global_step": 458256, "epoch": 5521} {"train_loss": -26.530731201171875, "global_step": 458257, "epoch": 5521} {"train_loss": -26.85491371154785, "global_step": 458258, "epoch": 5521} {"train_loss": -26.824493408203125, "global_step": 458259, "epoch": 5521} {"train_loss": -27.16360855102539, "global_step": 458260, "epoch": 5521} {"train_loss": -27.40642738342285, "global_step": 458261, "epoch": 5521} {"train_loss": -27.15582847595215, "global_step": 458262, "epoch": 5521} {"train_loss": -27.005029678344727, "global_step": 458263, "epoch": 5521} {"train_loss": -26.79620933532715, "global_step": 458264, "epoch": 5521} {"train_loss": -27.447357177734375, "global_step": 458265, "epoch": 5521} {"train_loss": -27.179391860961914, "global_step": 458266, "epoch": 5521} {"train_loss": -27.380456924438477, "global_step": 458267, "epoch": 5521} {"train_loss": -27.514434814453125, "global_step": 458268, "epoch": 5521} {"train_loss": -26.79298210144043, "global_step": 458269, "epoch": 5521} {"train_loss": -27.06467628479004, "global_step": 458270, "epoch": 5521} {"train_loss": -27.34259605407715, "global_step": 458271, "epoch": 5521} {"train_loss": -27.217878341674805, "global_step": 458272, "epoch": 5521} {"train_loss": -27.107831954956055, "global_step": 458273, "epoch": 5521} {"train_loss": -27.18609046936035, "global_step": 458274, "epoch": 5521} {"train_loss": -27.18763542175293, "global_step": 458275, "epoch": 5521} {"train_loss": -27.430875778198242, "global_step": 458276, "epoch": 5521} {"train_loss": -27.356470108032227, "global_step": 458277, "epoch": 5521} {"train_loss": -27.07419776916504, "global_step": 458278, "epoch": 5521} {"train_loss": -27.2593936920166, "global_step": 458279, "epoch": 5521} {"train_loss": -27.865802764892578, "global_step": 458280, "epoch": 5521} {"train_loss": -26.912616729736328, "global_step": 458281, "epoch": 5521} {"train_loss": -26.877613067626953, "global_step": 458282, "epoch": 5521} {"train_loss": -27.41773796081543, "global_step": 458283, "epoch": 5521} {"train_loss": -27.29795265197754, "global_step": 458284, "epoch": 5521} {"train_loss": -27.096784591674805, "global_step": 458285, "epoch": 5521} {"train_loss": -27.293203353881836, "global_step": 458286, "epoch": 5521} {"train_loss": -27.167938232421875, "global_step": 458287, "epoch": 5521} {"train_loss": -27.181167602539062, "global_step": 458288, "epoch": 5521} {"train_loss": -27.283950805664062, "global_step": 458289, "epoch": 5521} {"train_loss": -27.1617488861084, "global_step": 458290, "epoch": 5521} {"train_loss": -27.152545928955078, "global_step": 458291, "epoch": 5521} {"train_loss": -26.7519474029541, "global_step": 458292, "epoch": 5521} {"train_loss": -27.1282958984375, "global_step": 458293, "epoch": 5521} {"train_loss": -27.339502334594727, "global_step": 458294, "epoch": 5521} {"train_loss": -27.1859188079834, "global_step": 458295, "epoch": 5521} {"train_loss": -27.104780197143555, "global_step": 458296, "epoch": 5521} {"train_loss": -27.122974395751953, "global_step": 458297, "epoch": 5521} {"train_loss": -27.146575927734375, "global_step": 458298, "epoch": 5521} {"train_loss": -27.166873931884766, "global_step": 458299, "epoch": 5521} {"train_loss": -27.406652450561523, "global_step": 458300, "epoch": 5521} {"train_loss": -27.310184478759766, "global_step": 458301, "epoch": 5521} {"train_loss": -27.45591163635254, "global_step": 458302, "epoch": 5521} {"train_loss": -27.682464599609375, "global_step": 458303, "epoch": 5521} {"train_loss": -27.163583755493164, "global_step": 458304, "epoch": 5521} {"train_loss": -27.056726455688477, "global_step": 458305, "epoch": 5521} {"train_loss": -26.936767578125, "global_step": 458306, "epoch": 5521} {"train_loss": -26.85821533203125, "global_step": 458307, "epoch": 5521} {"train_loss": -27.11665153503418, "global_step": 458308, "epoch": 5521} {"train_loss": -27.339466094970703, "global_step": 458309, "epoch": 5521} {"train_loss": -27.13710594177246, "global_step": 458310, "epoch": 5521} {"train_loss": -27.25369644165039, "global_step": 458311, "epoch": 5521} {"train_loss": -27.042957305908203, "global_step": 458312, "epoch": 5521} {"train_loss": -26.923675537109375, "global_step": 458313, "epoch": 5521} {"train_loss": -26.957275390625, "global_step": 458314, "epoch": 5521} {"train_loss": -26.861957550048828, "global_step": 458315, "epoch": 5521} {"train_loss": -26.912805557250977, "global_step": 458316, "epoch": 5521} {"train_loss": -26.48589515686035, "global_step": 458317, "epoch": 5521} {"train_loss": -27.522796630859375, "global_step": 458318, "epoch": 5521} {"train_loss": -27.04994010925293, "global_step": 458319, "epoch": 5521} {"train_loss": -26.819900512695312, "global_step": 458320, "epoch": 5521} {"train_loss": -27.115009307861328, "global_step": 458321, "epoch": 5521} {"train_loss": -26.857507705688477, "global_step": 458322, "epoch": 5521} {"train_loss": -26.798471450805664, "global_step": 458323, "epoch": 5521} {"train_loss": -27.017309188842773, "global_step": 458324, "epoch": 5521} {"train_loss": -27.06548768928252, "global_step": 458325, "epoch": 5521, "val_loss": 6495292.5} {"train_loss": -25.400156021118164, "global_step": 458326, "epoch": 5522} {"train_loss": -26.3737735748291, "global_step": 458327, "epoch": 5522} {"train_loss": -26.68731117248535, "global_step": 458328, "epoch": 5522} {"train_loss": -25.63093376159668, "global_step": 458329, "epoch": 5522} {"train_loss": -26.649580001831055, "global_step": 458330, "epoch": 5522} {"train_loss": -26.706466674804688, "global_step": 458331, "epoch": 5522} {"train_loss": -26.990076065063477, "global_step": 458332, "epoch": 5522} {"train_loss": -26.423925399780273, "global_step": 458333, "epoch": 5522} {"train_loss": -27.017166137695312, "global_step": 458334, "epoch": 5522} {"train_loss": -26.548694610595703, "global_step": 458335, "epoch": 5522} {"train_loss": -26.791458129882812, "global_step": 458336, "epoch": 5522} {"train_loss": -26.49867057800293, "global_step": 458337, "epoch": 5522} {"train_loss": -26.6462345123291, "global_step": 458338, "epoch": 5522} {"train_loss": -26.46949577331543, "global_step": 458339, "epoch": 5522} {"train_loss": -26.955678939819336, "global_step": 458340, "epoch": 5522} {"train_loss": -26.798328399658203, "global_step": 458341, "epoch": 5522} {"train_loss": -27.062335968017578, "global_step": 458342, "epoch": 5522} {"train_loss": -26.721027374267578, "global_step": 458343, "epoch": 5522} {"train_loss": -26.82881736755371, "global_step": 458344, "epoch": 5522} {"train_loss": -26.9182186126709, "global_step": 458345, "epoch": 5522} {"train_loss": -26.873666763305664, "global_step": 458346, "epoch": 5522} {"train_loss": -26.8845157623291, "global_step": 458347, "epoch": 5522} {"train_loss": -26.767438888549805, "global_step": 458348, "epoch": 5522} {"train_loss": -26.902494430541992, "global_step": 458349, "epoch": 5522} {"train_loss": -26.985692977905273, "global_step": 458350, "epoch": 5522} {"train_loss": -27.473779678344727, "global_step": 458351, "epoch": 5522} {"train_loss": -27.33888053894043, "global_step": 458352, "epoch": 5522} {"train_loss": -27.2842960357666, "global_step": 458353, "epoch": 5522} {"train_loss": -27.09246826171875, "global_step": 458354, "epoch": 5522} {"train_loss": -27.032642364501953, "global_step": 458355, "epoch": 5522} {"train_loss": -26.95302391052246, "global_step": 458356, "epoch": 5522} {"train_loss": -27.331085205078125, "global_step": 458357, "epoch": 5522} {"train_loss": -26.95062255859375, "global_step": 458358, "epoch": 5522} {"train_loss": -27.221466064453125, "global_step": 458359, "epoch": 5522} {"train_loss": -27.075122833251953, "global_step": 458360, "epoch": 5522} {"train_loss": -26.991498947143555, "global_step": 458361, "epoch": 5522} {"train_loss": -27.418914794921875, "global_step": 458362, "epoch": 5522} {"train_loss": -27.300003051757812, "global_step": 458363, "epoch": 5522} {"train_loss": -27.3298397064209, "global_step": 458364, "epoch": 5522} {"train_loss": -27.247705459594727, "global_step": 458365, "epoch": 5522} {"train_loss": -27.413238525390625, "global_step": 458366, "epoch": 5522} {"train_loss": -27.410181045532227, "global_step": 458367, "epoch": 5522} {"train_loss": -26.988569259643555, "global_step": 458368, "epoch": 5522} {"train_loss": -27.247018814086914, "global_step": 458369, "epoch": 5522} {"train_loss": -27.081140518188477, "global_step": 458370, "epoch": 5522} {"train_loss": -27.321683883666992, "global_step": 458371, "epoch": 5522} {"train_loss": -27.412275314331055, "global_step": 458372, "epoch": 5522} {"train_loss": -26.97381019592285, "global_step": 458373, "epoch": 5522} {"train_loss": -27.18902015686035, "global_step": 458374, "epoch": 5522} {"train_loss": -27.2208194732666, "global_step": 458375, "epoch": 5522} {"train_loss": -27.18807029724121, "global_step": 458376, "epoch": 5522} {"train_loss": -27.45285415649414, "global_step": 458377, "epoch": 5522} {"train_loss": -27.4735107421875, "global_step": 458378, "epoch": 5522} {"train_loss": -27.323156356811523, "global_step": 458379, "epoch": 5522} {"train_loss": -27.42291259765625, "global_step": 458380, "epoch": 5522} {"train_loss": -27.025501251220703, "global_step": 458381, "epoch": 5522} {"train_loss": -26.975830078125, "global_step": 458382, "epoch": 5522} {"train_loss": -27.516681671142578, "global_step": 458383, "epoch": 5522} {"train_loss": -27.153671264648438, "global_step": 458384, "epoch": 5522} {"train_loss": -27.23663330078125, "global_step": 458385, "epoch": 5522} {"train_loss": -27.428998947143555, "global_step": 458386, "epoch": 5522} {"train_loss": -27.02276039123535, "global_step": 458387, "epoch": 5522} {"train_loss": -27.149261474609375, "global_step": 458388, "epoch": 5522} {"train_loss": -27.3631649017334, "global_step": 458389, "epoch": 5522} {"train_loss": -26.841964721679688, "global_step": 458390, "epoch": 5522} {"train_loss": -27.01045799255371, "global_step": 458391, "epoch": 5522} {"train_loss": -27.125946044921875, "global_step": 458392, "epoch": 5522} {"train_loss": -27.656030654907227, "global_step": 458393, "epoch": 5522} {"train_loss": -27.112823486328125, "global_step": 458394, "epoch": 5522} {"train_loss": -26.810895919799805, "global_step": 458395, "epoch": 5522} {"train_loss": -26.893192291259766, "global_step": 458396, "epoch": 5522} {"train_loss": -26.78458595275879, "global_step": 458397, "epoch": 5522} {"train_loss": -26.650739669799805, "global_step": 458398, "epoch": 5522} {"train_loss": -26.809778213500977, "global_step": 458399, "epoch": 5522} {"train_loss": -27.258544921875, "global_step": 458400, "epoch": 5522} {"train_loss": -27.231338500976562, "global_step": 458401, "epoch": 5522} {"train_loss": -26.970182418823242, "global_step": 458402, "epoch": 5522} {"train_loss": -27.31867027282715, "global_step": 458403, "epoch": 5522} {"train_loss": -27.25813102722168, "global_step": 458404, "epoch": 5522} {"train_loss": -27.302038192749023, "global_step": 458405, "epoch": 5522} {"train_loss": -27.1365909576416, "global_step": 458406, "epoch": 5522} {"train_loss": -26.913497924804688, "global_step": 458407, "epoch": 5522} {"train_loss": -27.01909460504371, "global_step": 458408, "epoch": 5522, "val_loss": 6467715.0} {"train_loss": -25.593856811523438, "global_step": 458409, "epoch": 5523} {"train_loss": -25.682437896728516, "global_step": 458410, "epoch": 5523} {"train_loss": -26.529172897338867, "global_step": 458411, "epoch": 5523} {"train_loss": -26.336179733276367, "global_step": 458412, "epoch": 5523} {"train_loss": -26.22553062438965, "global_step": 458413, "epoch": 5523} {"train_loss": -26.502893447875977, "global_step": 458414, "epoch": 5523} {"train_loss": -25.999372482299805, "global_step": 458415, "epoch": 5523} {"train_loss": -26.749221801757812, "global_step": 458416, "epoch": 5523} {"train_loss": -26.265039443969727, "global_step": 458417, "epoch": 5523} {"train_loss": -26.2010555267334, "global_step": 458418, "epoch": 5523} {"train_loss": -26.877283096313477, "global_step": 458419, "epoch": 5523} {"train_loss": -26.097890853881836, "global_step": 458420, "epoch": 5523} {"train_loss": -26.510114669799805, "global_step": 458421, "epoch": 5523} {"train_loss": -26.5587158203125, "global_step": 458422, "epoch": 5523} {"train_loss": -26.14246940612793, "global_step": 458423, "epoch": 5523} {"train_loss": -26.78500747680664, "global_step": 458424, "epoch": 5523} {"train_loss": -26.756879806518555, "global_step": 458425, "epoch": 5523} {"train_loss": -26.413095474243164, "global_step": 458426, "epoch": 5523} {"train_loss": -26.850149154663086, "global_step": 458427, "epoch": 5523} {"train_loss": -26.766117095947266, "global_step": 458428, "epoch": 5523} {"train_loss": -26.730640411376953, "global_step": 458429, "epoch": 5523} {"train_loss": -26.978071212768555, "global_step": 458430, "epoch": 5523} {"train_loss": -26.736297607421875, "global_step": 458431, "epoch": 5523} {"train_loss": -26.676258087158203, "global_step": 458432, "epoch": 5523} {"train_loss": -26.654361724853516, "global_step": 458433, "epoch": 5523} {"train_loss": -26.887521743774414, "global_step": 458434, "epoch": 5523} {"train_loss": -26.883398056030273, "global_step": 458435, "epoch": 5523} {"train_loss": -26.73554801940918, "global_step": 458436, "epoch": 5523} {"train_loss": -27.23660659790039, "global_step": 458437, "epoch": 5523} {"train_loss": -27.189916610717773, "global_step": 458438, "epoch": 5523} {"train_loss": -27.035171508789062, "global_step": 458439, "epoch": 5523} {"train_loss": -27.301605224609375, "global_step": 458440, "epoch": 5523} {"train_loss": -26.775060653686523, "global_step": 458441, "epoch": 5523} {"train_loss": -27.142993927001953, "global_step": 458442, "epoch": 5523} {"train_loss": -26.939212799072266, "global_step": 458443, "epoch": 5523} {"train_loss": -27.005008697509766, "global_step": 458444, "epoch": 5523} {"train_loss": -26.976308822631836, "global_step": 458445, "epoch": 5523} {"train_loss": -27.036972045898438, "global_step": 458446, "epoch": 5523} {"train_loss": -27.238367080688477, "global_step": 458447, "epoch": 5523} {"train_loss": -27.098865509033203, "global_step": 458448, "epoch": 5523} {"train_loss": -27.190332412719727, "global_step": 458449, "epoch": 5523} {"train_loss": -27.062841415405273, "global_step": 458450, "epoch": 5523} {"train_loss": -27.039398193359375, "global_step": 458451, "epoch": 5523} {"train_loss": -26.90093994140625, "global_step": 458452, "epoch": 5523} {"train_loss": -27.190763473510742, "global_step": 458453, "epoch": 5523} {"train_loss": -27.14700698852539, "global_step": 458454, "epoch": 5523} {"train_loss": -27.204299926757812, "global_step": 458455, "epoch": 5523} {"train_loss": -27.194677352905273, "global_step": 458456, "epoch": 5523} {"train_loss": -27.412067413330078, "global_step": 458457, "epoch": 5523} {"train_loss": -27.781219482421875, "global_step": 458458, "epoch": 5523} {"train_loss": -27.480085372924805, "global_step": 458459, "epoch": 5523} {"train_loss": -27.3074951171875, "global_step": 458460, "epoch": 5523} {"train_loss": -27.508691787719727, "global_step": 458461, "epoch": 5523} {"train_loss": -27.23508071899414, "global_step": 458462, "epoch": 5523} {"train_loss": -27.128976821899414, "global_step": 458463, "epoch": 5523} {"train_loss": -27.04876708984375, "global_step": 458464, "epoch": 5523} {"train_loss": -27.099485397338867, "global_step": 458465, "epoch": 5523} {"train_loss": -27.283710479736328, "global_step": 458466, "epoch": 5523} {"train_loss": -27.238080978393555, "global_step": 458467, "epoch": 5523} {"train_loss": -27.664846420288086, "global_step": 458468, "epoch": 5523} {"train_loss": -27.153371810913086, "global_step": 458469, "epoch": 5523} {"train_loss": -27.266870498657227, "global_step": 458470, "epoch": 5523} {"train_loss": -27.162473678588867, "global_step": 458471, "epoch": 5523} {"train_loss": -27.189924240112305, "global_step": 458472, "epoch": 5523} {"train_loss": -27.3144588470459, "global_step": 458473, "epoch": 5523} {"train_loss": -26.997303009033203, "global_step": 458474, "epoch": 5523} {"train_loss": -27.416181564331055, "global_step": 458475, "epoch": 5523} {"train_loss": -27.333242416381836, "global_step": 458476, "epoch": 5523} {"train_loss": -27.544050216674805, "global_step": 458477, "epoch": 5523} {"train_loss": -27.35284996032715, "global_step": 458478, "epoch": 5523} {"train_loss": -27.5821590423584, "global_step": 458479, "epoch": 5523} {"train_loss": -26.851133346557617, "global_step": 458480, "epoch": 5523} {"train_loss": -26.994760513305664, "global_step": 458481, "epoch": 5523} {"train_loss": -27.147388458251953, "global_step": 458482, "epoch": 5523} {"train_loss": -27.108667373657227, "global_step": 458483, "epoch": 5523} {"train_loss": -27.212316513061523, "global_step": 458484, "epoch": 5523} {"train_loss": -27.163049697875977, "global_step": 458485, "epoch": 5523} {"train_loss": -27.184309005737305, "global_step": 458486, "epoch": 5523} {"train_loss": -26.765466690063477, "global_step": 458487, "epoch": 5523} {"train_loss": -26.86444664001465, "global_step": 458488, "epoch": 5523} {"train_loss": -27.5033016204834, "global_step": 458489, "epoch": 5523} {"train_loss": -26.879384994506836, "global_step": 458490, "epoch": 5523} {"train_loss": -26.9382215293057, "global_step": 458491, "epoch": 5523, "val_loss": 6564993.5} {"train_loss": -24.073135375976562, "global_step": 458492, "epoch": 5524} {"train_loss": -24.64088249206543, "global_step": 458493, "epoch": 5524} {"train_loss": -26.60247802734375, "global_step": 458494, "epoch": 5524} {"train_loss": -25.25484275817871, "global_step": 458495, "epoch": 5524} {"train_loss": -26.431127548217773, "global_step": 458496, "epoch": 5524} {"train_loss": -25.278194427490234, "global_step": 458497, "epoch": 5524} {"train_loss": -26.125152587890625, "global_step": 458498, "epoch": 5524} {"train_loss": -25.91895866394043, "global_step": 458499, "epoch": 5524} {"train_loss": -25.52309226989746, "global_step": 458500, "epoch": 5524} {"train_loss": -25.942276000976562, "global_step": 458501, "epoch": 5524} {"train_loss": -25.52054786682129, "global_step": 458502, "epoch": 5524} {"train_loss": -26.325092315673828, "global_step": 458503, "epoch": 5524} {"train_loss": -25.979650497436523, "global_step": 458504, "epoch": 5524} {"train_loss": -26.63922691345215, "global_step": 458505, "epoch": 5524} {"train_loss": -26.27936363220215, "global_step": 458506, "epoch": 5524} {"train_loss": -26.552539825439453, "global_step": 458507, "epoch": 5524} {"train_loss": -26.461881637573242, "global_step": 458508, "epoch": 5524} {"train_loss": -26.328161239624023, "global_step": 458509, "epoch": 5524} {"train_loss": -26.318649291992188, "global_step": 458510, "epoch": 5524} {"train_loss": -26.384571075439453, "global_step": 458511, "epoch": 5524} {"train_loss": -26.40262222290039, "global_step": 458512, "epoch": 5524} {"train_loss": -26.62635612487793, "global_step": 458513, "epoch": 5524} {"train_loss": -26.496158599853516, "global_step": 458514, "epoch": 5524} {"train_loss": -26.626447677612305, "global_step": 458515, "epoch": 5524} {"train_loss": -26.2513484954834, "global_step": 458516, "epoch": 5524} {"train_loss": -26.6357364654541, "global_step": 458517, "epoch": 5524} {"train_loss": -26.81096839904785, "global_step": 458518, "epoch": 5524} {"train_loss": -26.93390464782715, "global_step": 458519, "epoch": 5524} {"train_loss": -26.71892738342285, "global_step": 458520, "epoch": 5524} {"train_loss": -26.63117790222168, "global_step": 458521, "epoch": 5524} {"train_loss": -26.375268936157227, "global_step": 458522, "epoch": 5524} {"train_loss": -26.778791427612305, "global_step": 458523, "epoch": 5524} {"train_loss": -26.774106979370117, "global_step": 458524, "epoch": 5524} {"train_loss": -26.391132354736328, "global_step": 458525, "epoch": 5524} {"train_loss": -26.804859161376953, "global_step": 458526, "epoch": 5524} {"train_loss": -26.985904693603516, "global_step": 458527, "epoch": 5524} {"train_loss": -27.12172508239746, "global_step": 458528, "epoch": 5524} {"train_loss": -26.751697540283203, "global_step": 458529, "epoch": 5524} {"train_loss": -27.090229034423828, "global_step": 458530, "epoch": 5524} {"train_loss": -27.066251754760742, "global_step": 458531, "epoch": 5524} {"train_loss": -26.737112045288086, "global_step": 458532, "epoch": 5524} {"train_loss": -27.024145126342773, "global_step": 458533, "epoch": 5524} {"train_loss": -27.313451766967773, "global_step": 458534, "epoch": 5524} {"train_loss": -26.837072372436523, "global_step": 458535, "epoch": 5524} {"train_loss": -26.997589111328125, "global_step": 458536, "epoch": 5524} {"train_loss": -27.110692977905273, "global_step": 458537, "epoch": 5524} {"train_loss": -26.97590446472168, "global_step": 458538, "epoch": 5524} {"train_loss": -27.23858070373535, "global_step": 458539, "epoch": 5524} {"train_loss": -27.365863800048828, "global_step": 458540, "epoch": 5524} {"train_loss": -27.114465713500977, "global_step": 458541, "epoch": 5524} {"train_loss": -26.73909568786621, "global_step": 458542, "epoch": 5524} {"train_loss": -26.7867488861084, "global_step": 458543, "epoch": 5524} {"train_loss": -27.333898544311523, "global_step": 458544, "epoch": 5524} {"train_loss": -27.362146377563477, "global_step": 458545, "epoch": 5524} {"train_loss": -27.018274307250977, "global_step": 458546, "epoch": 5524} {"train_loss": -27.13397789001465, "global_step": 458547, "epoch": 5524} {"train_loss": -27.063756942749023, "global_step": 458548, "epoch": 5524} {"train_loss": -27.379928588867188, "global_step": 458549, "epoch": 5524} {"train_loss": -27.306013107299805, "global_step": 458550, "epoch": 5524} {"train_loss": -27.387451171875, "global_step": 458551, "epoch": 5524} {"train_loss": -27.146162033081055, "global_step": 458552, "epoch": 5524} {"train_loss": -27.26606559753418, "global_step": 458553, "epoch": 5524} {"train_loss": -27.181949615478516, "global_step": 458554, "epoch": 5524} {"train_loss": -27.133853912353516, "global_step": 458555, "epoch": 5524} {"train_loss": -27.195158004760742, "global_step": 458556, "epoch": 5524} {"train_loss": -26.855106353759766, "global_step": 458557, "epoch": 5524} {"train_loss": -27.045307159423828, "global_step": 458558, "epoch": 5524} {"train_loss": -27.179502487182617, "global_step": 458559, "epoch": 5524} {"train_loss": -27.30807876586914, "global_step": 458560, "epoch": 5524} {"train_loss": -27.301427841186523, "global_step": 458561, "epoch": 5524} {"train_loss": -26.864643096923828, "global_step": 458562, "epoch": 5524} {"train_loss": -27.17131996154785, "global_step": 458563, "epoch": 5524} {"train_loss": -27.091522216796875, "global_step": 458564, "epoch": 5524} {"train_loss": -27.051542282104492, "global_step": 458565, "epoch": 5524} {"train_loss": -26.96612548828125, "global_step": 458566, "epoch": 5524} {"train_loss": -26.995386123657227, "global_step": 458567, "epoch": 5524} {"train_loss": -27.517847061157227, "global_step": 458568, "epoch": 5524} {"train_loss": -27.24775505065918, "global_step": 458569, "epoch": 5524} {"train_loss": -27.034509658813477, "global_step": 458570, "epoch": 5524} {"train_loss": -27.440576553344727, "global_step": 458571, "epoch": 5524} {"train_loss": -26.95849609375, "global_step": 458572, "epoch": 5524} {"train_loss": -27.159637451171875, "global_step": 458573, "epoch": 5524} {"train_loss": -26.718477364046027, "global_step": 458574, "epoch": 5524, "val_loss": 6385685.0} {"train_loss": -25.854703903198242, "global_step": 458575, "epoch": 5525} {"train_loss": -26.2694034576416, "global_step": 458576, "epoch": 5525} {"train_loss": -26.2652587890625, "global_step": 458577, "epoch": 5525} {"train_loss": -26.705554962158203, "global_step": 458578, "epoch": 5525} {"train_loss": -26.138822555541992, "global_step": 458579, "epoch": 5525} {"train_loss": -25.794153213500977, "global_step": 458580, "epoch": 5525} {"train_loss": -26.453750610351562, "global_step": 458581, "epoch": 5525} {"train_loss": -26.319120407104492, "global_step": 458582, "epoch": 5525} {"train_loss": -25.946027755737305, "global_step": 458583, "epoch": 5525} {"train_loss": -26.588516235351562, "global_step": 458584, "epoch": 5525} {"train_loss": -26.458234786987305, "global_step": 458585, "epoch": 5525} {"train_loss": -26.356292724609375, "global_step": 458586, "epoch": 5525} {"train_loss": -26.77192497253418, "global_step": 458587, "epoch": 5525} {"train_loss": -25.806493759155273, "global_step": 458588, "epoch": 5525} {"train_loss": -27.010711669921875, "global_step": 458589, "epoch": 5525} {"train_loss": -26.379003524780273, "global_step": 458590, "epoch": 5525} {"train_loss": -26.61200523376465, "global_step": 458591, "epoch": 5525} {"train_loss": -26.5628662109375, "global_step": 458592, "epoch": 5525} {"train_loss": -26.230321884155273, "global_step": 458593, "epoch": 5525} {"train_loss": -26.9040470123291, "global_step": 458594, "epoch": 5525} {"train_loss": -26.448949813842773, "global_step": 458595, "epoch": 5525} {"train_loss": -26.62360191345215, "global_step": 458596, "epoch": 5525} {"train_loss": -26.631071090698242, "global_step": 458597, "epoch": 5525} {"train_loss": -26.566572189331055, "global_step": 458598, "epoch": 5525} {"train_loss": -27.29517936706543, "global_step": 458599, "epoch": 5525} {"train_loss": -26.63287925720215, "global_step": 458600, "epoch": 5525} {"train_loss": -26.885089874267578, "global_step": 458601, "epoch": 5525} {"train_loss": -26.449615478515625, "global_step": 458602, "epoch": 5525} {"train_loss": -26.878345489501953, "global_step": 458603, "epoch": 5525} {"train_loss": -26.6375789642334, "global_step": 458604, "epoch": 5525} {"train_loss": -26.900089263916016, "global_step": 458605, "epoch": 5525} {"train_loss": -26.74321937561035, "global_step": 458606, "epoch": 5525} {"train_loss": -27.07779884338379, "global_step": 458607, "epoch": 5525} {"train_loss": -27.10980224609375, "global_step": 458608, "epoch": 5525} {"train_loss": -26.66242027282715, "global_step": 458609, "epoch": 5525} {"train_loss": -26.94970703125, "global_step": 458610, "epoch": 5525} {"train_loss": -27.035398483276367, "global_step": 458611, "epoch": 5525} {"train_loss": -27.264148712158203, "global_step": 458612, "epoch": 5525} {"train_loss": -26.914020538330078, "global_step": 458613, "epoch": 5525} {"train_loss": -27.203149795532227, "global_step": 458614, "epoch": 5525} {"train_loss": -27.198780059814453, "global_step": 458615, "epoch": 5525} {"train_loss": -27.004865646362305, "global_step": 458616, "epoch": 5525} {"train_loss": -27.187183380126953, "global_step": 458617, "epoch": 5525} {"train_loss": -27.3468017578125, "global_step": 458618, "epoch": 5525} {"train_loss": -26.98883056640625, "global_step": 458619, "epoch": 5525} {"train_loss": -27.20869255065918, "global_step": 458620, "epoch": 5525} {"train_loss": -27.289173126220703, "global_step": 458621, "epoch": 5525} {"train_loss": -27.139684677124023, "global_step": 458622, "epoch": 5525} {"train_loss": -27.00435447692871, "global_step": 458623, "epoch": 5525} {"train_loss": -27.2878475189209, "global_step": 458624, "epoch": 5525} {"train_loss": -27.287511825561523, "global_step": 458625, "epoch": 5525} {"train_loss": -27.15205955505371, "global_step": 458626, "epoch": 5525} {"train_loss": -27.357141494750977, "global_step": 458627, "epoch": 5525} {"train_loss": -27.030054092407227, "global_step": 458628, "epoch": 5525} {"train_loss": -27.293725967407227, "global_step": 458629, "epoch": 5525} {"train_loss": -27.13681983947754, "global_step": 458630, "epoch": 5525} {"train_loss": -27.160018920898438, "global_step": 458631, "epoch": 5525} {"train_loss": -27.01362419128418, "global_step": 458632, "epoch": 5525} {"train_loss": -26.843576431274414, "global_step": 458633, "epoch": 5525} {"train_loss": -27.2576961517334, "global_step": 458634, "epoch": 5525} {"train_loss": -27.260183334350586, "global_step": 458635, "epoch": 5525} {"train_loss": -27.10687828063965, "global_step": 458636, "epoch": 5525} {"train_loss": -27.259347915649414, "global_step": 458637, "epoch": 5525} {"train_loss": -27.145694732666016, "global_step": 458638, "epoch": 5525} {"train_loss": -27.363744735717773, "global_step": 458639, "epoch": 5525} {"train_loss": -26.92583656311035, "global_step": 458640, "epoch": 5525} {"train_loss": -27.5340518951416, "global_step": 458641, "epoch": 5525} {"train_loss": -27.122013092041016, "global_step": 458642, "epoch": 5525} {"train_loss": -27.4080867767334, "global_step": 458643, "epoch": 5525} {"train_loss": -27.437896728515625, "global_step": 458644, "epoch": 5525} {"train_loss": -27.163007736206055, "global_step": 458645, "epoch": 5525} {"train_loss": -27.2221622467041, "global_step": 458646, "epoch": 5525} {"train_loss": -27.02842140197754, "global_step": 458647, "epoch": 5525} {"train_loss": -27.303176879882812, "global_step": 458648, "epoch": 5525} {"train_loss": -26.874744415283203, "global_step": 458649, "epoch": 5525} {"train_loss": -27.361713409423828, "global_step": 458650, "epoch": 5525} {"train_loss": -27.1083984375, "global_step": 458651, "epoch": 5525} {"train_loss": -27.481582641601562, "global_step": 458652, "epoch": 5525} {"train_loss": -27.328012466430664, "global_step": 458653, "epoch": 5525} {"train_loss": -27.293859481811523, "global_step": 458654, "epoch": 5525} {"train_loss": -27.39784049987793, "global_step": 458655, "epoch": 5525} {"train_loss": -27.5367488861084, "global_step": 458656, "epoch": 5525} {"train_loss": -26.918768595500165, "global_step": 458657, "epoch": 5525, "val_loss": 6394353.0} {"train_loss": -27.11671257019043, "global_step": 458658, "epoch": 5526} {"train_loss": -26.441293716430664, "global_step": 458659, "epoch": 5526} {"train_loss": -26.676895141601562, "global_step": 458660, "epoch": 5526} {"train_loss": -26.83036231994629, "global_step": 458661, "epoch": 5526} {"train_loss": -26.67425537109375, "global_step": 458662, "epoch": 5526} {"train_loss": -26.163305282592773, "global_step": 458663, "epoch": 5526} {"train_loss": -26.532575607299805, "global_step": 458664, "epoch": 5526} {"train_loss": -26.831985473632812, "global_step": 458665, "epoch": 5526} {"train_loss": -26.675373077392578, "global_step": 458666, "epoch": 5526} {"train_loss": -26.532316207885742, "global_step": 458667, "epoch": 5526} {"train_loss": -27.03986930847168, "global_step": 458668, "epoch": 5526} {"train_loss": -26.792388916015625, "global_step": 458669, "epoch": 5526} {"train_loss": -26.498538970947266, "global_step": 458670, "epoch": 5526} {"train_loss": -26.761844635009766, "global_step": 458671, "epoch": 5526} {"train_loss": -26.581567764282227, "global_step": 458672, "epoch": 5526} {"train_loss": -26.748254776000977, "global_step": 458673, "epoch": 5526} {"train_loss": -27.08746337890625, "global_step": 458674, "epoch": 5526} {"train_loss": -26.92286491394043, "global_step": 458675, "epoch": 5526} {"train_loss": -26.87790870666504, "global_step": 458676, "epoch": 5526} {"train_loss": -27.087244033813477, "global_step": 458677, "epoch": 5526} {"train_loss": -26.728595733642578, "global_step": 458678, "epoch": 5526} {"train_loss": -27.007659912109375, "global_step": 458679, "epoch": 5526} {"train_loss": -26.884937286376953, "global_step": 458680, "epoch": 5526} {"train_loss": -26.76877784729004, "global_step": 458681, "epoch": 5526} {"train_loss": -26.719623565673828, "global_step": 458682, "epoch": 5526} {"train_loss": -27.280813217163086, "global_step": 458683, "epoch": 5526} {"train_loss": -27.04560661315918, "global_step": 458684, "epoch": 5526} {"train_loss": -26.90077018737793, "global_step": 458685, "epoch": 5526} {"train_loss": -26.771337509155273, "global_step": 458686, "epoch": 5526} {"train_loss": -26.73134422302246, "global_step": 458687, "epoch": 5526} {"train_loss": -27.344282150268555, "global_step": 458688, "epoch": 5526} {"train_loss": -27.052276611328125, "global_step": 458689, "epoch": 5526} {"train_loss": -27.013458251953125, "global_step": 458690, "epoch": 5526} {"train_loss": -26.975086212158203, "global_step": 458691, "epoch": 5526} {"train_loss": -27.221786499023438, "global_step": 458692, "epoch": 5526} {"train_loss": -27.307910919189453, "global_step": 458693, "epoch": 5526} {"train_loss": -27.09065055847168, "global_step": 458694, "epoch": 5526} {"train_loss": -26.797046661376953, "global_step": 458695, "epoch": 5526} {"train_loss": -27.646610260009766, "global_step": 458696, "epoch": 5526} {"train_loss": -27.154062271118164, "global_step": 458697, "epoch": 5526} {"train_loss": -27.236093521118164, "global_step": 458698, "epoch": 5526} {"train_loss": -27.48651695251465, "global_step": 458699, "epoch": 5526} {"train_loss": -27.073993682861328, "global_step": 458700, "epoch": 5526} {"train_loss": -27.22784423828125, "global_step": 458701, "epoch": 5526} {"train_loss": -27.305063247680664, "global_step": 458702, "epoch": 5526} {"train_loss": -27.154150009155273, "global_step": 458703, "epoch": 5526} {"train_loss": -27.064945220947266, "global_step": 458704, "epoch": 5526} {"train_loss": -26.955869674682617, "global_step": 458705, "epoch": 5526} {"train_loss": -27.364049911499023, "global_step": 458706, "epoch": 5526} {"train_loss": -26.875608444213867, "global_step": 458707, "epoch": 5526} {"train_loss": -27.056554794311523, "global_step": 458708, "epoch": 5526} {"train_loss": -27.376850128173828, "global_step": 458709, "epoch": 5526} {"train_loss": -27.330881118774414, "global_step": 458710, "epoch": 5526} {"train_loss": -27.185504913330078, "global_step": 458711, "epoch": 5526} {"train_loss": -27.346200942993164, "global_step": 458712, "epoch": 5526} {"train_loss": -27.4304256439209, "global_step": 458713, "epoch": 5526} {"train_loss": -27.206684112548828, "global_step": 458714, "epoch": 5526} {"train_loss": -26.592870712280273, "global_step": 458715, "epoch": 5526} {"train_loss": -27.29041862487793, "global_step": 458716, "epoch": 5526} {"train_loss": -27.0935001373291, "global_step": 458717, "epoch": 5526} {"train_loss": -27.19760513305664, "global_step": 458718, "epoch": 5526} {"train_loss": -26.6434326171875, "global_step": 458719, "epoch": 5526} {"train_loss": -27.05364990234375, "global_step": 458720, "epoch": 5526} {"train_loss": -27.37255859375, "global_step": 458721, "epoch": 5526} {"train_loss": -26.997394561767578, "global_step": 458722, "epoch": 5526} {"train_loss": -27.06451416015625, "global_step": 458723, "epoch": 5526} {"train_loss": -27.312055587768555, "global_step": 458724, "epoch": 5526} {"train_loss": -27.074499130249023, "global_step": 458725, "epoch": 5526} {"train_loss": -27.542545318603516, "global_step": 458726, "epoch": 5526} {"train_loss": -27.387176513671875, "global_step": 458727, "epoch": 5526} {"train_loss": -27.295623779296875, "global_step": 458728, "epoch": 5526} {"train_loss": -27.141284942626953, "global_step": 458729, "epoch": 5526} {"train_loss": -27.422317504882812, "global_step": 458730, "epoch": 5526} {"train_loss": -27.06733512878418, "global_step": 458731, "epoch": 5526} {"train_loss": -27.313894271850586, "global_step": 458732, "epoch": 5526} {"train_loss": -27.045454025268555, "global_step": 458733, "epoch": 5526} {"train_loss": -27.5747013092041, "global_step": 458734, "epoch": 5526} {"train_loss": -27.351520538330078, "global_step": 458735, "epoch": 5526} {"train_loss": -27.237567901611328, "global_step": 458736, "epoch": 5526} {"train_loss": -27.338062286376953, "global_step": 458737, "epoch": 5526} {"train_loss": -27.13673210144043, "global_step": 458738, "epoch": 5526} {"train_loss": -27.190893173217773, "global_step": 458739, "epoch": 5526} {"train_loss": -27.02433606802699, "global_step": 458740, "epoch": 5526, "val_loss": 6340893.0} {"train_loss": -24.813663482666016, "global_step": 458741, "epoch": 5527} {"train_loss": -24.728893280029297, "global_step": 458742, "epoch": 5527} {"train_loss": -26.678558349609375, "global_step": 458743, "epoch": 5527} {"train_loss": -26.189069747924805, "global_step": 458744, "epoch": 5527} {"train_loss": -26.484304428100586, "global_step": 458745, "epoch": 5527} {"train_loss": -25.89491081237793, "global_step": 458746, "epoch": 5527} {"train_loss": -26.22175407409668, "global_step": 458747, "epoch": 5527} {"train_loss": -26.81656837463379, "global_step": 458748, "epoch": 5527} {"train_loss": -26.435583114624023, "global_step": 458749, "epoch": 5527} {"train_loss": -26.566614151000977, "global_step": 458750, "epoch": 5527} {"train_loss": -26.363019943237305, "global_step": 458751, "epoch": 5527} {"train_loss": -26.523664474487305, "global_step": 458752, "epoch": 5527} {"train_loss": -26.373075485229492, "global_step": 458753, "epoch": 5527} {"train_loss": -26.327367782592773, "global_step": 458754, "epoch": 5527} {"train_loss": -26.794713973999023, "global_step": 458755, "epoch": 5527} {"train_loss": -26.152652740478516, "global_step": 458756, "epoch": 5527} {"train_loss": -26.909162521362305, "global_step": 458757, "epoch": 5527} {"train_loss": -26.637073516845703, "global_step": 458758, "epoch": 5527} {"train_loss": -26.616424560546875, "global_step": 458759, "epoch": 5527} {"train_loss": -26.678083419799805, "global_step": 458760, "epoch": 5527} {"train_loss": -26.743499755859375, "global_step": 458761, "epoch": 5527} {"train_loss": -26.81389808654785, "global_step": 458762, "epoch": 5527} {"train_loss": -26.976593017578125, "global_step": 458763, "epoch": 5527} {"train_loss": -26.98932456970215, "global_step": 458764, "epoch": 5527} {"train_loss": -27.05756187438965, "global_step": 458765, "epoch": 5527} {"train_loss": -26.779876708984375, "global_step": 458766, "epoch": 5527} {"train_loss": -26.9443302154541, "global_step": 458767, "epoch": 5527} {"train_loss": -26.58591651916504, "global_step": 458768, "epoch": 5527} {"train_loss": -27.0670223236084, "global_step": 458769, "epoch": 5527} {"train_loss": -26.890546798706055, "global_step": 458770, "epoch": 5527} {"train_loss": -26.65498161315918, "global_step": 458771, "epoch": 5527} {"train_loss": -26.695035934448242, "global_step": 458772, "epoch": 5527} {"train_loss": -27.058774948120117, "global_step": 458773, "epoch": 5527} {"train_loss": -27.220050811767578, "global_step": 458774, "epoch": 5527} {"train_loss": -27.229801177978516, "global_step": 458775, "epoch": 5527} {"train_loss": -27.38934898376465, "global_step": 458776, "epoch": 5527} {"train_loss": -27.15823745727539, "global_step": 458777, "epoch": 5527} {"train_loss": -27.223987579345703, "global_step": 458778, "epoch": 5527} {"train_loss": -26.977155685424805, "global_step": 458779, "epoch": 5527} {"train_loss": -27.140775680541992, "global_step": 458780, "epoch": 5527} {"train_loss": -26.9466495513916, "global_step": 458781, "epoch": 5527} {"train_loss": -27.2591609954834, "global_step": 458782, "epoch": 5527} {"train_loss": -27.304019927978516, "global_step": 458783, "epoch": 5527} {"train_loss": -27.560598373413086, "global_step": 458784, "epoch": 5527} {"train_loss": -27.326587677001953, "global_step": 458785, "epoch": 5527} {"train_loss": -27.054935455322266, "global_step": 458786, "epoch": 5527} {"train_loss": -27.241907119750977, "global_step": 458787, "epoch": 5527} {"train_loss": -27.634449005126953, "global_step": 458788, "epoch": 5527} {"train_loss": -26.92426109313965, "global_step": 458789, "epoch": 5527} {"train_loss": -27.085830688476562, "global_step": 458790, "epoch": 5527} {"train_loss": -27.338153839111328, "global_step": 458791, "epoch": 5527} {"train_loss": -27.17764663696289, "global_step": 458792, "epoch": 5527} {"train_loss": -26.8969783782959, "global_step": 458793, "epoch": 5527} {"train_loss": -26.833072662353516, "global_step": 458794, "epoch": 5527} {"train_loss": -26.993213653564453, "global_step": 458795, "epoch": 5527} {"train_loss": -27.009756088256836, "global_step": 458796, "epoch": 5527} {"train_loss": -26.72920036315918, "global_step": 458797, "epoch": 5527} {"train_loss": -26.87080192565918, "global_step": 458798, "epoch": 5527} {"train_loss": -27.047388076782227, "global_step": 458799, "epoch": 5527} {"train_loss": -26.893314361572266, "global_step": 458800, "epoch": 5527} {"train_loss": -26.786136627197266, "global_step": 458801, "epoch": 5527} {"train_loss": -27.115345001220703, "global_step": 458802, "epoch": 5527} {"train_loss": -27.453657150268555, "global_step": 458803, "epoch": 5527} {"train_loss": -26.69367790222168, "global_step": 458804, "epoch": 5527} {"train_loss": -26.70271873474121, "global_step": 458805, "epoch": 5527} {"train_loss": -26.8881778717041, "global_step": 458806, "epoch": 5527} {"train_loss": -27.42755126953125, "global_step": 458807, "epoch": 5527} {"train_loss": -27.051786422729492, "global_step": 458808, "epoch": 5527} {"train_loss": -27.155654907226562, "global_step": 458809, "epoch": 5527} {"train_loss": -26.915943145751953, "global_step": 458810, "epoch": 5527} {"train_loss": -26.710071563720703, "global_step": 458811, "epoch": 5527} {"train_loss": -26.986480712890625, "global_step": 458812, "epoch": 5527} {"train_loss": -26.9493408203125, "global_step": 458813, "epoch": 5527} {"train_loss": -27.1638126373291, "global_step": 458814, "epoch": 5527} {"train_loss": -27.1081485748291, "global_step": 458815, "epoch": 5527} {"train_loss": -27.139667510986328, "global_step": 458816, "epoch": 5527} {"train_loss": -27.042652130126953, "global_step": 458817, "epoch": 5527} {"train_loss": -26.979177474975586, "global_step": 458818, "epoch": 5527} {"train_loss": -27.40606689453125, "global_step": 458819, "epoch": 5527} {"train_loss": -27.07378578186035, "global_step": 458820, "epoch": 5527} {"train_loss": -26.8018856048584, "global_step": 458821, "epoch": 5527} {"train_loss": -27.054523468017578, "global_step": 458822, "epoch": 5527} {"train_loss": -26.874423888792474, "global_step": 458823, "epoch": 5527, "val_loss": 6423433.0} {"train_loss": -22.870487213134766, "global_step": 458824, "epoch": 5528} {"train_loss": -25.124540328979492, "global_step": 458825, "epoch": 5528} {"train_loss": -25.021514892578125, "global_step": 458826, "epoch": 5528} {"train_loss": -25.334585189819336, "global_step": 458827, "epoch": 5528} {"train_loss": -24.829788208007812, "global_step": 458828, "epoch": 5528} {"train_loss": -25.20796012878418, "global_step": 458829, "epoch": 5528} {"train_loss": -26.168561935424805, "global_step": 458830, "epoch": 5528} {"train_loss": -24.940460205078125, "global_step": 458831, "epoch": 5528} {"train_loss": -25.722497940063477, "global_step": 458832, "epoch": 5528} {"train_loss": -26.149099349975586, "global_step": 458833, "epoch": 5528} {"train_loss": -25.7896785736084, "global_step": 458834, "epoch": 5528} {"train_loss": -25.787099838256836, "global_step": 458835, "epoch": 5528} {"train_loss": -26.09165382385254, "global_step": 458836, "epoch": 5528} {"train_loss": -26.29371452331543, "global_step": 458837, "epoch": 5528} {"train_loss": -26.478036880493164, "global_step": 458838, "epoch": 5528} {"train_loss": -26.504907608032227, "global_step": 458839, "epoch": 5528} {"train_loss": -26.683197021484375, "global_step": 458840, "epoch": 5528} {"train_loss": -26.388641357421875, "global_step": 458841, "epoch": 5528} {"train_loss": -26.46929359436035, "global_step": 458842, "epoch": 5528} {"train_loss": -26.53204345703125, "global_step": 458843, "epoch": 5528} {"train_loss": -26.455060958862305, "global_step": 458844, "epoch": 5528} {"train_loss": -26.6308650970459, "global_step": 458845, "epoch": 5528} {"train_loss": -26.4366397857666, "global_step": 458846, "epoch": 5528} {"train_loss": -26.57557487487793, "global_step": 458847, "epoch": 5528} {"train_loss": -26.47108268737793, "global_step": 458848, "epoch": 5528} {"train_loss": -26.97031021118164, "global_step": 458849, "epoch": 5528} {"train_loss": -26.3972110748291, "global_step": 458850, "epoch": 5528} {"train_loss": -26.25599479675293, "global_step": 458851, "epoch": 5528} {"train_loss": -26.69598960876465, "global_step": 458852, "epoch": 5528} {"train_loss": -26.93232536315918, "global_step": 458853, "epoch": 5528} {"train_loss": -26.926523208618164, "global_step": 458854, "epoch": 5528} {"train_loss": -26.85540771484375, "global_step": 458855, "epoch": 5528} {"train_loss": -26.823816299438477, "global_step": 458856, "epoch": 5528} {"train_loss": -26.808828353881836, "global_step": 458857, "epoch": 5528} {"train_loss": -27.005828857421875, "global_step": 458858, "epoch": 5528} {"train_loss": -26.88407325744629, "global_step": 458859, "epoch": 5528} {"train_loss": -27.377775192260742, "global_step": 458860, "epoch": 5528} {"train_loss": -27.176156997680664, "global_step": 458861, "epoch": 5528} {"train_loss": -26.85820960998535, "global_step": 458862, "epoch": 5528} {"train_loss": -27.118518829345703, "global_step": 458863, "epoch": 5528} {"train_loss": -26.8332576751709, "global_step": 458864, "epoch": 5528} {"train_loss": -27.22942543029785, "global_step": 458865, "epoch": 5528} {"train_loss": -27.420270919799805, "global_step": 458866, "epoch": 5528} {"train_loss": -27.059574127197266, "global_step": 458867, "epoch": 5528} {"train_loss": -27.40639305114746, "global_step": 458868, "epoch": 5528} {"train_loss": -26.839441299438477, "global_step": 458869, "epoch": 5528} {"train_loss": -26.970001220703125, "global_step": 458870, "epoch": 5528} {"train_loss": -27.097461700439453, "global_step": 458871, "epoch": 5528} {"train_loss": -27.034326553344727, "global_step": 458872, "epoch": 5528} {"train_loss": -27.170862197875977, "global_step": 458873, "epoch": 5528} {"train_loss": -26.803625106811523, "global_step": 458874, "epoch": 5528} {"train_loss": -27.161457061767578, "global_step": 458875, "epoch": 5528} {"train_loss": -27.491058349609375, "global_step": 458876, "epoch": 5528} {"train_loss": -26.91248893737793, "global_step": 458877, "epoch": 5528} {"train_loss": -27.031179428100586, "global_step": 458878, "epoch": 5528} {"train_loss": -27.212507247924805, "global_step": 458879, "epoch": 5528} {"train_loss": -27.145389556884766, "global_step": 458880, "epoch": 5528} {"train_loss": -27.026416778564453, "global_step": 458881, "epoch": 5528} {"train_loss": -27.149600982666016, "global_step": 458882, "epoch": 5528} {"train_loss": -26.877777099609375, "global_step": 458883, "epoch": 5528} {"train_loss": -26.958227157592773, "global_step": 458884, "epoch": 5528} {"train_loss": -26.959030151367188, "global_step": 458885, "epoch": 5528} {"train_loss": -27.44144630432129, "global_step": 458886, "epoch": 5528} {"train_loss": -27.536691665649414, "global_step": 458887, "epoch": 5528} {"train_loss": -27.067174911499023, "global_step": 458888, "epoch": 5528} {"train_loss": -27.118112564086914, "global_step": 458889, "epoch": 5528} {"train_loss": -27.44925880432129, "global_step": 458890, "epoch": 5528} {"train_loss": -27.268285751342773, "global_step": 458891, "epoch": 5528} {"train_loss": -27.18731689453125, "global_step": 458892, "epoch": 5528} {"train_loss": -27.233325958251953, "global_step": 458893, "epoch": 5528} {"train_loss": -27.326276779174805, "global_step": 458894, "epoch": 5528} {"train_loss": -27.504261016845703, "global_step": 458895, "epoch": 5528} {"train_loss": -27.609312057495117, "global_step": 458896, "epoch": 5528} {"train_loss": -27.212690353393555, "global_step": 458897, "epoch": 5528} {"train_loss": -27.296051025390625, "global_step": 458898, "epoch": 5528} {"train_loss": -27.208526611328125, "global_step": 458899, "epoch": 5528} {"train_loss": -27.080509185791016, "global_step": 458900, "epoch": 5528} {"train_loss": -27.3166446685791, "global_step": 458901, "epoch": 5528} {"train_loss": -27.033645629882812, "global_step": 458902, "epoch": 5528} {"train_loss": -27.36541748046875, "global_step": 458903, "epoch": 5528} {"train_loss": -27.2546329498291, "global_step": 458904, "epoch": 5528} {"train_loss": -27.408035278320312, "global_step": 458905, "epoch": 5528} {"train_loss": -26.72759437561035, "global_step": 458906, "epoch": 5528, "val_loss": 6436042.0} {"train_loss": -26.950485229492188, "global_step": 458907, "epoch": 5529} {"train_loss": -26.680831909179688, "global_step": 458908, "epoch": 5529} {"train_loss": -26.185598373413086, "global_step": 458909, "epoch": 5529} {"train_loss": -25.84295082092285, "global_step": 458910, "epoch": 5529} {"train_loss": -26.543676376342773, "global_step": 458911, "epoch": 5529} {"train_loss": -26.765039443969727, "global_step": 458912, "epoch": 5529} {"train_loss": -26.951507568359375, "global_step": 458913, "epoch": 5529} {"train_loss": -26.83636474609375, "global_step": 458914, "epoch": 5529} {"train_loss": -27.067005157470703, "global_step": 458915, "epoch": 5529} {"train_loss": -26.924243927001953, "global_step": 458916, "epoch": 5529} {"train_loss": -26.935102462768555, "global_step": 458917, "epoch": 5529} {"train_loss": -26.80278968811035, "global_step": 458918, "epoch": 5529} {"train_loss": -26.644262313842773, "global_step": 458919, "epoch": 5529} {"train_loss": -26.873245239257812, "global_step": 458920, "epoch": 5529} {"train_loss": -27.142385482788086, "global_step": 458921, "epoch": 5529} {"train_loss": -27.032733917236328, "global_step": 458922, "epoch": 5529} {"train_loss": -27.095014572143555, "global_step": 458923, "epoch": 5529} {"train_loss": -27.12758445739746, "global_step": 458924, "epoch": 5529} {"train_loss": -27.11968421936035, "global_step": 458925, "epoch": 5529} {"train_loss": -26.97515296936035, "global_step": 458926, "epoch": 5529} {"train_loss": -26.799551010131836, "global_step": 458927, "epoch": 5529} {"train_loss": -27.40616798400879, "global_step": 458928, "epoch": 5529} {"train_loss": -27.0835018157959, "global_step": 458929, "epoch": 5529} {"train_loss": -26.65883445739746, "global_step": 458930, "epoch": 5529} {"train_loss": -26.860998153686523, "global_step": 458931, "epoch": 5529} {"train_loss": -27.043323516845703, "global_step": 458932, "epoch": 5529} {"train_loss": -26.9456787109375, "global_step": 458933, "epoch": 5529} {"train_loss": -26.725299835205078, "global_step": 458934, "epoch": 5529} {"train_loss": -26.803665161132812, "global_step": 458935, "epoch": 5529} {"train_loss": -26.69296646118164, "global_step": 458936, "epoch": 5529} {"train_loss": -27.208332061767578, "global_step": 458937, "epoch": 5529} {"train_loss": -27.048660278320312, "global_step": 458938, "epoch": 5529} {"train_loss": -26.709959030151367, "global_step": 458939, "epoch": 5529} {"train_loss": -26.85371208190918, "global_step": 458940, "epoch": 5529} {"train_loss": -27.389698028564453, "global_step": 458941, "epoch": 5529} {"train_loss": -26.90985679626465, "global_step": 458942, "epoch": 5529} {"train_loss": -27.083539962768555, "global_step": 458943, "epoch": 5529} {"train_loss": -27.556293487548828, "global_step": 458944, "epoch": 5529} {"train_loss": -27.244464874267578, "global_step": 458945, "epoch": 5529} {"train_loss": -26.877628326416016, "global_step": 458946, "epoch": 5529} {"train_loss": -26.70086097717285, "global_step": 458947, "epoch": 5529} {"train_loss": -27.3341007232666, "global_step": 458948, "epoch": 5529} {"train_loss": -27.012292861938477, "global_step": 458949, "epoch": 5529} {"train_loss": -26.976804733276367, "global_step": 458950, "epoch": 5529} {"train_loss": -27.048627853393555, "global_step": 458951, "epoch": 5529} {"train_loss": -26.8927059173584, "global_step": 458952, "epoch": 5529} {"train_loss": -27.392292022705078, "global_step": 458953, "epoch": 5529} {"train_loss": -27.454004287719727, "global_step": 458954, "epoch": 5529} {"train_loss": -27.20350456237793, "global_step": 458955, "epoch": 5529} {"train_loss": -27.25984001159668, "global_step": 458956, "epoch": 5529} {"train_loss": -27.18013572692871, "global_step": 458957, "epoch": 5529} {"train_loss": -27.304636001586914, "global_step": 458958, "epoch": 5529} {"train_loss": -27.214359283447266, "global_step": 458959, "epoch": 5529} {"train_loss": -27.2794189453125, "global_step": 458960, "epoch": 5529} {"train_loss": -27.517623901367188, "global_step": 458961, "epoch": 5529} {"train_loss": -27.260746002197266, "global_step": 458962, "epoch": 5529} {"train_loss": -27.235828399658203, "global_step": 458963, "epoch": 5529} {"train_loss": -27.35200309753418, "global_step": 458964, "epoch": 5529} {"train_loss": -27.360050201416016, "global_step": 458965, "epoch": 5529} {"train_loss": -27.295379638671875, "global_step": 458966, "epoch": 5529} {"train_loss": -26.988849639892578, "global_step": 458967, "epoch": 5529} {"train_loss": -27.3266544342041, "global_step": 458968, "epoch": 5529} {"train_loss": -27.160634994506836, "global_step": 458969, "epoch": 5529} {"train_loss": -27.181665420532227, "global_step": 458970, "epoch": 5529} {"train_loss": -27.335264205932617, "global_step": 458971, "epoch": 5529} {"train_loss": -27.500839233398438, "global_step": 458972, "epoch": 5529} {"train_loss": -27.137739181518555, "global_step": 458973, "epoch": 5529} {"train_loss": -27.039228439331055, "global_step": 458974, "epoch": 5529} {"train_loss": -26.909912109375, "global_step": 458975, "epoch": 5529} {"train_loss": -26.89919090270996, "global_step": 458976, "epoch": 5529} {"train_loss": -27.56012535095215, "global_step": 458977, "epoch": 5529} {"train_loss": -27.444305419921875, "global_step": 458978, "epoch": 5529} {"train_loss": -27.578189849853516, "global_step": 458979, "epoch": 5529} {"train_loss": -27.48752212524414, "global_step": 458980, "epoch": 5529} {"train_loss": -27.369892120361328, "global_step": 458981, "epoch": 5529} {"train_loss": -27.2634220123291, "global_step": 458982, "epoch": 5529} {"train_loss": -27.022436141967773, "global_step": 458983, "epoch": 5529} {"train_loss": -27.251386642456055, "global_step": 458984, "epoch": 5529} {"train_loss": -27.06696128845215, "global_step": 458985, "epoch": 5529} {"train_loss": -27.36090087890625, "global_step": 458986, "epoch": 5529} {"train_loss": -27.418027877807617, "global_step": 458987, "epoch": 5529} {"train_loss": -27.1353816986084, "global_step": 458988, "epoch": 5529} {"train_loss": -27.07959848426911, "global_step": 458989, "epoch": 5529, "val_loss": 6399251.5} {"train_loss": -26.276138305664062, "global_step": 458990, "epoch": 5530} {"train_loss": -26.08390235900879, "global_step": 458991, "epoch": 5530} {"train_loss": -26.50725746154785, "global_step": 458992, "epoch": 5530} {"train_loss": -25.740201950073242, "global_step": 458993, "epoch": 5530} {"train_loss": -26.06743812561035, "global_step": 458994, "epoch": 5530} {"train_loss": -26.376462936401367, "global_step": 458995, "epoch": 5530} {"train_loss": -26.28806495666504, "global_step": 458996, "epoch": 5530} {"train_loss": -26.996118545532227, "global_step": 458997, "epoch": 5530} {"train_loss": -26.4856014251709, "global_step": 458998, "epoch": 5530} {"train_loss": -26.356901168823242, "global_step": 458999, "epoch": 5530} {"train_loss": -26.072101593017578, "global_step": 459000, "epoch": 5530} {"train_loss": -26.32843017578125, "global_step": 459001, "epoch": 5530} {"train_loss": -26.159900665283203, "global_step": 459002, "epoch": 5530} {"train_loss": -26.231836318969727, "global_step": 459003, "epoch": 5530} {"train_loss": -26.041595458984375, "global_step": 459004, "epoch": 5530} {"train_loss": -26.61948585510254, "global_step": 459005, "epoch": 5530} {"train_loss": -26.068500518798828, "global_step": 459006, "epoch": 5530} {"train_loss": -26.624982833862305, "global_step": 459007, "epoch": 5530} {"train_loss": -26.487451553344727, "global_step": 459008, "epoch": 5530} {"train_loss": -26.76802635192871, "global_step": 459009, "epoch": 5530} {"train_loss": -26.6865234375, "global_step": 459010, "epoch": 5530} {"train_loss": -26.35025405883789, "global_step": 459011, "epoch": 5530} {"train_loss": -26.911224365234375, "global_step": 459012, "epoch": 5530} {"train_loss": -26.4708194732666, "global_step": 459013, "epoch": 5530} {"train_loss": -26.57217788696289, "global_step": 459014, "epoch": 5530} {"train_loss": -26.239343643188477, "global_step": 459015, "epoch": 5530} {"train_loss": -26.876007080078125, "global_step": 459016, "epoch": 5530} {"train_loss": -26.450735092163086, "global_step": 459017, "epoch": 5530} {"train_loss": -26.913166046142578, "global_step": 459018, "epoch": 5530} {"train_loss": -26.802600860595703, "global_step": 459019, "epoch": 5530} {"train_loss": -26.584213256835938, "global_step": 459020, "epoch": 5530} {"train_loss": -26.881921768188477, "global_step": 459021, "epoch": 5530} {"train_loss": -26.757919311523438, "global_step": 459022, "epoch": 5530} {"train_loss": -27.226581573486328, "global_step": 459023, "epoch": 5530} {"train_loss": -26.75294303894043, "global_step": 459024, "epoch": 5530} {"train_loss": -26.924945831298828, "global_step": 459025, "epoch": 5530} {"train_loss": -27.082275390625, "global_step": 459026, "epoch": 5530} {"train_loss": -27.118005752563477, "global_step": 459027, "epoch": 5530} {"train_loss": -27.19594383239746, "global_step": 459028, "epoch": 5530} {"train_loss": -27.283538818359375, "global_step": 459029, "epoch": 5530} {"train_loss": -27.15289306640625, "global_step": 459030, "epoch": 5530} {"train_loss": -27.513864517211914, "global_step": 459031, "epoch": 5530} {"train_loss": -26.848485946655273, "global_step": 459032, "epoch": 5530} {"train_loss": -27.190420150756836, "global_step": 459033, "epoch": 5530} {"train_loss": -27.250720977783203, "global_step": 459034, "epoch": 5530} {"train_loss": -27.2128963470459, "global_step": 459035, "epoch": 5530} {"train_loss": -26.925464630126953, "global_step": 459036, "epoch": 5530} {"train_loss": -27.11908531188965, "global_step": 459037, "epoch": 5530} {"train_loss": -27.3118896484375, "global_step": 459038, "epoch": 5530} {"train_loss": -26.9969425201416, "global_step": 459039, "epoch": 5530} {"train_loss": -26.8638916015625, "global_step": 459040, "epoch": 5530} {"train_loss": -26.865827560424805, "global_step": 459041, "epoch": 5530} {"train_loss": -27.462217330932617, "global_step": 459042, "epoch": 5530} {"train_loss": -27.3590087890625, "global_step": 459043, "epoch": 5530} {"train_loss": -26.792572021484375, "global_step": 459044, "epoch": 5530} {"train_loss": -26.801807403564453, "global_step": 459045, "epoch": 5530} {"train_loss": -27.593225479125977, "global_step": 459046, "epoch": 5530} {"train_loss": -27.49163246154785, "global_step": 459047, "epoch": 5530} {"train_loss": -27.016559600830078, "global_step": 459048, "epoch": 5530} {"train_loss": -27.405981063842773, "global_step": 459049, "epoch": 5530} {"train_loss": -27.3465576171875, "global_step": 459050, "epoch": 5530} {"train_loss": -27.272306442260742, "global_step": 459051, "epoch": 5530} {"train_loss": -27.442564010620117, "global_step": 459052, "epoch": 5530} {"train_loss": -27.378372192382812, "global_step": 459053, "epoch": 5530} {"train_loss": -27.2663516998291, "global_step": 459054, "epoch": 5530} {"train_loss": -26.9140625, "global_step": 459055, "epoch": 5530} {"train_loss": -27.23343849182129, "global_step": 459056, "epoch": 5530} {"train_loss": -27.422834396362305, "global_step": 459057, "epoch": 5530} {"train_loss": -27.23529624938965, "global_step": 459058, "epoch": 5530} {"train_loss": -27.372976303100586, "global_step": 459059, "epoch": 5530} {"train_loss": -27.3409481048584, "global_step": 459060, "epoch": 5530} {"train_loss": -27.325180053710938, "global_step": 459061, "epoch": 5530} {"train_loss": -26.981094360351562, "global_step": 459062, "epoch": 5530} {"train_loss": -26.917404174804688, "global_step": 459063, "epoch": 5530} {"train_loss": -27.170385360717773, "global_step": 459064, "epoch": 5530} {"train_loss": -26.683319091796875, "global_step": 459065, "epoch": 5530} {"train_loss": -26.928632736206055, "global_step": 459066, "epoch": 5530} {"train_loss": -26.847827911376953, "global_step": 459067, "epoch": 5530} {"train_loss": -27.207921981811523, "global_step": 459068, "epoch": 5530} {"train_loss": -26.7774658203125, "global_step": 459069, "epoch": 5530} {"train_loss": -26.6041202545166, "global_step": 459070, "epoch": 5530} {"train_loss": -26.58623695373535, "global_step": 459071, "epoch": 5530} {"train_loss": -26.849244404988116, "global_step": 459072, "epoch": 5530, "val_loss": 6463391.0} {"train_loss": -25.566192626953125, "global_step": 459073, "epoch": 5531} {"train_loss": -24.738386154174805, "global_step": 459074, "epoch": 5531} {"train_loss": -24.851106643676758, "global_step": 459075, "epoch": 5531} {"train_loss": -25.669437408447266, "global_step": 459076, "epoch": 5531} {"train_loss": -25.74991798400879, "global_step": 459077, "epoch": 5531} {"train_loss": -26.033950805664062, "global_step": 459078, "epoch": 5531} {"train_loss": -26.694128036499023, "global_step": 459079, "epoch": 5531} {"train_loss": -26.12580680847168, "global_step": 459080, "epoch": 5531} {"train_loss": -26.585834503173828, "global_step": 459081, "epoch": 5531} {"train_loss": -26.330078125, "global_step": 459082, "epoch": 5531} {"train_loss": -26.079364776611328, "global_step": 459083, "epoch": 5531} {"train_loss": -26.483753204345703, "global_step": 459084, "epoch": 5531} {"train_loss": -26.612829208374023, "global_step": 459085, "epoch": 5531} {"train_loss": -26.2857608795166, "global_step": 459086, "epoch": 5531} {"train_loss": -26.401525497436523, "global_step": 459087, "epoch": 5531} {"train_loss": -26.45706558227539, "global_step": 459088, "epoch": 5531} {"train_loss": -26.469812393188477, "global_step": 459089, "epoch": 5531} {"train_loss": -26.532861709594727, "global_step": 459090, "epoch": 5531} {"train_loss": -26.784467697143555, "global_step": 459091, "epoch": 5531} {"train_loss": -26.645858764648438, "global_step": 459092, "epoch": 5531} {"train_loss": -26.714466094970703, "global_step": 459093, "epoch": 5531} {"train_loss": -26.684656143188477, "global_step": 459094, "epoch": 5531} {"train_loss": -26.753070831298828, "global_step": 459095, "epoch": 5531} {"train_loss": -27.159717559814453, "global_step": 459096, "epoch": 5531} {"train_loss": -27.035215377807617, "global_step": 459097, "epoch": 5531} {"train_loss": -26.747882843017578, "global_step": 459098, "epoch": 5531} {"train_loss": -26.8453369140625, "global_step": 459099, "epoch": 5531} {"train_loss": -26.81995964050293, "global_step": 459100, "epoch": 5531} {"train_loss": -26.866254806518555, "global_step": 459101, "epoch": 5531} {"train_loss": -27.035367965698242, "global_step": 459102, "epoch": 5531} {"train_loss": -26.84964942932129, "global_step": 459103, "epoch": 5531} {"train_loss": -26.701919555664062, "global_step": 459104, "epoch": 5531} {"train_loss": -26.82460594177246, "global_step": 459105, "epoch": 5531} {"train_loss": -26.8143310546875, "global_step": 459106, "epoch": 5531} {"train_loss": -27.116422653198242, "global_step": 459107, "epoch": 5531} {"train_loss": -27.094608306884766, "global_step": 459108, "epoch": 5531} {"train_loss": -26.904682159423828, "global_step": 459109, "epoch": 5531} {"train_loss": -27.284589767456055, "global_step": 459110, "epoch": 5531} {"train_loss": -27.12580680847168, "global_step": 459111, "epoch": 5531} {"train_loss": -27.06049919128418, "global_step": 459112, "epoch": 5531} {"train_loss": -26.7603816986084, "global_step": 459113, "epoch": 5531} {"train_loss": -27.513473510742188, "global_step": 459114, "epoch": 5531} {"train_loss": -26.845983505249023, "global_step": 459115, "epoch": 5531} {"train_loss": -26.86724853515625, "global_step": 459116, "epoch": 5531} {"train_loss": -27.558237075805664, "global_step": 459117, "epoch": 5531} {"train_loss": -26.796056747436523, "global_step": 459118, "epoch": 5531} {"train_loss": -27.138294219970703, "global_step": 459119, "epoch": 5531} {"train_loss": -26.83696937561035, "global_step": 459120, "epoch": 5531} {"train_loss": -26.6849365234375, "global_step": 459121, "epoch": 5531} {"train_loss": -27.41054344177246, "global_step": 459122, "epoch": 5531} {"train_loss": -26.8956298828125, "global_step": 459123, "epoch": 5531} {"train_loss": -27.045190811157227, "global_step": 459124, "epoch": 5531} {"train_loss": -26.919296264648438, "global_step": 459125, "epoch": 5531} {"train_loss": -27.112445831298828, "global_step": 459126, "epoch": 5531} {"train_loss": -27.20794105529785, "global_step": 459127, "epoch": 5531} {"train_loss": -27.063526153564453, "global_step": 459128, "epoch": 5531} {"train_loss": -27.15774917602539, "global_step": 459129, "epoch": 5531} {"train_loss": -27.245344161987305, "global_step": 459130, "epoch": 5531} {"train_loss": -27.201841354370117, "global_step": 459131, "epoch": 5531} {"train_loss": -27.357940673828125, "global_step": 459132, "epoch": 5531} {"train_loss": -27.256132125854492, "global_step": 459133, "epoch": 5531} {"train_loss": -27.128131866455078, "global_step": 459134, "epoch": 5531} {"train_loss": -27.088977813720703, "global_step": 459135, "epoch": 5531} {"train_loss": -27.062061309814453, "global_step": 459136, "epoch": 5531} {"train_loss": -27.270177841186523, "global_step": 459137, "epoch": 5531} {"train_loss": -26.990055084228516, "global_step": 459138, "epoch": 5531} {"train_loss": -27.05179786682129, "global_step": 459139, "epoch": 5531} {"train_loss": -27.264081954956055, "global_step": 459140, "epoch": 5531} {"train_loss": -27.37264060974121, "global_step": 459141, "epoch": 5531} {"train_loss": -27.523529052734375, "global_step": 459142, "epoch": 5531} {"train_loss": -27.10918617248535, "global_step": 459143, "epoch": 5531} {"train_loss": -27.524372100830078, "global_step": 459144, "epoch": 5531} {"train_loss": -27.24683952331543, "global_step": 459145, "epoch": 5531} {"train_loss": -27.42347526550293, "global_step": 459146, "epoch": 5531} {"train_loss": -27.063207626342773, "global_step": 459147, "epoch": 5531} {"train_loss": -27.37359619140625, "global_step": 459148, "epoch": 5531} {"train_loss": -27.359298706054688, "global_step": 459149, "epoch": 5531} {"train_loss": -27.36911392211914, "global_step": 459150, "epoch": 5531} {"train_loss": -27.26788330078125, "global_step": 459151, "epoch": 5531} {"train_loss": -27.202306747436523, "global_step": 459152, "epoch": 5531} {"train_loss": -27.43001365661621, "global_step": 459153, "epoch": 5531} {"train_loss": -27.628360748291016, "global_step": 459154, "epoch": 5531} {"train_loss": -26.87430781628712, "global_step": 459155, "epoch": 5531, "val_loss": 6412856.0} {"train_loss": -26.133432388305664, "global_step": 459156, "epoch": 5532} {"train_loss": -26.534292221069336, "global_step": 459157, "epoch": 5532} {"train_loss": -26.126239776611328, "global_step": 459158, "epoch": 5532} {"train_loss": -25.957468032836914, "global_step": 459159, "epoch": 5532} {"train_loss": -26.23578453063965, "global_step": 459160, "epoch": 5532} {"train_loss": -26.973358154296875, "global_step": 459161, "epoch": 5532} {"train_loss": -26.7354679107666, "global_step": 459162, "epoch": 5532} {"train_loss": -26.60776710510254, "global_step": 459163, "epoch": 5532} {"train_loss": -26.704092025756836, "global_step": 459164, "epoch": 5532} {"train_loss": -25.849401473999023, "global_step": 459165, "epoch": 5532} {"train_loss": -26.621179580688477, "global_step": 459166, "epoch": 5532} {"train_loss": -27.070098876953125, "global_step": 459167, "epoch": 5532} {"train_loss": -26.770105361938477, "global_step": 459168, "epoch": 5532} {"train_loss": -26.58662986755371, "global_step": 459169, "epoch": 5532} {"train_loss": -27.016828536987305, "global_step": 459170, "epoch": 5532} {"train_loss": -26.650104522705078, "global_step": 459171, "epoch": 5532} {"train_loss": -26.53321647644043, "global_step": 459172, "epoch": 5532} {"train_loss": -26.769079208374023, "global_step": 459173, "epoch": 5532} {"train_loss": -26.930587768554688, "global_step": 459174, "epoch": 5532} {"train_loss": -27.336023330688477, "global_step": 459175, "epoch": 5532} {"train_loss": -26.79827880859375, "global_step": 459176, "epoch": 5532} {"train_loss": -26.9439640045166, "global_step": 459177, "epoch": 5532} {"train_loss": -26.467260360717773, "global_step": 459178, "epoch": 5532} {"train_loss": -27.050580978393555, "global_step": 459179, "epoch": 5532} {"train_loss": -27.036584854125977, "global_step": 459180, "epoch": 5532} {"train_loss": -27.18109703063965, "global_step": 459181, "epoch": 5532} {"train_loss": -27.22886085510254, "global_step": 459182, "epoch": 5532} {"train_loss": -26.923791885375977, "global_step": 459183, "epoch": 5532} {"train_loss": -27.13462257385254, "global_step": 459184, "epoch": 5532} {"train_loss": -27.0941219329834, "global_step": 459185, "epoch": 5532} {"train_loss": -26.5888729095459, "global_step": 459186, "epoch": 5532} {"train_loss": -27.032394409179688, "global_step": 459187, "epoch": 5532} {"train_loss": -27.149810791015625, "global_step": 459188, "epoch": 5532} {"train_loss": -26.93170166015625, "global_step": 459189, "epoch": 5532} {"train_loss": -27.084796905517578, "global_step": 459190, "epoch": 5532} {"train_loss": -27.225431442260742, "global_step": 459191, "epoch": 5532} {"train_loss": -27.149856567382812, "global_step": 459192, "epoch": 5532} {"train_loss": -27.136127471923828, "global_step": 459193, "epoch": 5532} {"train_loss": -27.2852783203125, "global_step": 459194, "epoch": 5532} {"train_loss": -27.353979110717773, "global_step": 459195, "epoch": 5532} {"train_loss": -27.329700469970703, "global_step": 459196, "epoch": 5532} {"train_loss": -27.217565536499023, "global_step": 459197, "epoch": 5532} {"train_loss": -27.21760368347168, "global_step": 459198, "epoch": 5532} {"train_loss": -27.045934677124023, "global_step": 459199, "epoch": 5532} {"train_loss": -27.28101921081543, "global_step": 459200, "epoch": 5532} {"train_loss": -27.076330184936523, "global_step": 459201, "epoch": 5532} {"train_loss": -27.235477447509766, "global_step": 459202, "epoch": 5532} {"train_loss": -27.570661544799805, "global_step": 459203, "epoch": 5532} {"train_loss": -26.884414672851562, "global_step": 459204, "epoch": 5532} {"train_loss": -27.53217124938965, "global_step": 459205, "epoch": 5532} {"train_loss": -27.49546241760254, "global_step": 459206, "epoch": 5532} {"train_loss": -27.26392936706543, "global_step": 459207, "epoch": 5532} {"train_loss": -27.440099716186523, "global_step": 459208, "epoch": 5532} {"train_loss": -27.34295082092285, "global_step": 459209, "epoch": 5532} {"train_loss": -27.3927059173584, "global_step": 459210, "epoch": 5532} {"train_loss": -27.12456703186035, "global_step": 459211, "epoch": 5532} {"train_loss": -27.321338653564453, "global_step": 459212, "epoch": 5532} {"train_loss": -27.324506759643555, "global_step": 459213, "epoch": 5532} {"train_loss": -27.210668563842773, "global_step": 459214, "epoch": 5532} {"train_loss": -27.179922103881836, "global_step": 459215, "epoch": 5532} {"train_loss": -27.242435455322266, "global_step": 459216, "epoch": 5532} {"train_loss": -27.1679744720459, "global_step": 459217, "epoch": 5532} {"train_loss": -26.966093063354492, "global_step": 459218, "epoch": 5532} {"train_loss": -27.244586944580078, "global_step": 459219, "epoch": 5532} {"train_loss": -27.489133834838867, "global_step": 459220, "epoch": 5532} {"train_loss": -27.166339874267578, "global_step": 459221, "epoch": 5532} {"train_loss": -27.239225387573242, "global_step": 459222, "epoch": 5532} {"train_loss": -27.207279205322266, "global_step": 459223, "epoch": 5532} {"train_loss": -27.701526641845703, "global_step": 459224, "epoch": 5532} {"train_loss": -26.968032836914062, "global_step": 459225, "epoch": 5532} {"train_loss": -27.083044052124023, "global_step": 459226, "epoch": 5532} {"train_loss": -27.2198429107666, "global_step": 459227, "epoch": 5532} {"train_loss": -27.461103439331055, "global_step": 459228, "epoch": 5532} {"train_loss": -27.333852767944336, "global_step": 459229, "epoch": 5532} {"train_loss": -27.382080078125, "global_step": 459230, "epoch": 5532} {"train_loss": -27.143341064453125, "global_step": 459231, "epoch": 5532} {"train_loss": -27.374256134033203, "global_step": 459232, "epoch": 5532} {"train_loss": -27.353086471557617, "global_step": 459233, "epoch": 5532} {"train_loss": -27.30328941345215, "global_step": 459234, "epoch": 5532} {"train_loss": -27.097415924072266, "global_step": 459235, "epoch": 5532} {"train_loss": -27.436254501342773, "global_step": 459236, "epoch": 5532} {"train_loss": -27.106693267822266, "global_step": 459237, "epoch": 5532} {"train_loss": -27.059423055993506, "global_step": 459238, "epoch": 5532, "val_loss": 6510514.0} {"train_loss": -26.619598388671875, "global_step": 459239, "epoch": 5533} {"train_loss": -26.406824111938477, "global_step": 459240, "epoch": 5533} {"train_loss": -26.405792236328125, "global_step": 459241, "epoch": 5533} {"train_loss": -26.614978790283203, "global_step": 459242, "epoch": 5533} {"train_loss": -26.35198974609375, "global_step": 459243, "epoch": 5533} {"train_loss": -25.711048126220703, "global_step": 459244, "epoch": 5533} {"train_loss": -25.767627716064453, "global_step": 459245, "epoch": 5533} {"train_loss": -25.964832305908203, "global_step": 459246, "epoch": 5533} {"train_loss": -26.3472900390625, "global_step": 459247, "epoch": 5533} {"train_loss": -26.038623809814453, "global_step": 459248, "epoch": 5533} {"train_loss": -26.526769638061523, "global_step": 459249, "epoch": 5533} {"train_loss": -26.40522575378418, "global_step": 459250, "epoch": 5533} {"train_loss": -26.140974044799805, "global_step": 459251, "epoch": 5533} {"train_loss": -25.93794059753418, "global_step": 459252, "epoch": 5533} {"train_loss": -26.243947982788086, "global_step": 459253, "epoch": 5533} {"train_loss": -26.161975860595703, "global_step": 459254, "epoch": 5533} {"train_loss": -26.449254989624023, "global_step": 459255, "epoch": 5533} {"train_loss": -26.61069679260254, "global_step": 459256, "epoch": 5533} {"train_loss": -26.31562614440918, "global_step": 459257, "epoch": 5533} {"train_loss": -26.59473991394043, "global_step": 459258, "epoch": 5533} {"train_loss": -26.891956329345703, "global_step": 459259, "epoch": 5533} {"train_loss": -26.118057250976562, "global_step": 459260, "epoch": 5533} {"train_loss": -26.78732681274414, "global_step": 459261, "epoch": 5533} {"train_loss": -26.179025650024414, "global_step": 459262, "epoch": 5533} {"train_loss": -26.962207794189453, "global_step": 459263, "epoch": 5533} {"train_loss": -26.529438018798828, "global_step": 459264, "epoch": 5533} {"train_loss": -26.487777709960938, "global_step": 459265, "epoch": 5533} {"train_loss": -26.901636123657227, "global_step": 459266, "epoch": 5533} {"train_loss": -26.436492919921875, "global_step": 459267, "epoch": 5533} {"train_loss": -27.052845001220703, "global_step": 459268, "epoch": 5533} {"train_loss": -26.925989151000977, "global_step": 459269, "epoch": 5533} {"train_loss": -26.550107955932617, "global_step": 459270, "epoch": 5533} {"train_loss": -26.560672760009766, "global_step": 459271, "epoch": 5533} {"train_loss": -26.916309356689453, "global_step": 459272, "epoch": 5533} {"train_loss": -26.966333389282227, "global_step": 459273, "epoch": 5533} {"train_loss": -27.036237716674805, "global_step": 459274, "epoch": 5533} {"train_loss": -26.762815475463867, "global_step": 459275, "epoch": 5533} {"train_loss": -26.73902702331543, "global_step": 459276, "epoch": 5533} {"train_loss": -26.884336471557617, "global_step": 459277, "epoch": 5533} {"train_loss": -27.030988693237305, "global_step": 459278, "epoch": 5533} {"train_loss": -27.12372398376465, "global_step": 459279, "epoch": 5533} {"train_loss": -27.018396377563477, "global_step": 459280, "epoch": 5533} {"train_loss": -27.483312606811523, "global_step": 459281, "epoch": 5533} {"train_loss": -26.851516723632812, "global_step": 459282, "epoch": 5533} {"train_loss": -26.99363136291504, "global_step": 459283, "epoch": 5533} {"train_loss": -27.167194366455078, "global_step": 459284, "epoch": 5533} {"train_loss": -26.879180908203125, "global_step": 459285, "epoch": 5533} {"train_loss": -27.053247451782227, "global_step": 459286, "epoch": 5533} {"train_loss": -27.244415283203125, "global_step": 459287, "epoch": 5533} {"train_loss": -27.58672523498535, "global_step": 459288, "epoch": 5533} {"train_loss": -27.140180587768555, "global_step": 459289, "epoch": 5533} {"train_loss": -27.527240753173828, "global_step": 459290, "epoch": 5533} {"train_loss": -27.195905685424805, "global_step": 459291, "epoch": 5533} {"train_loss": -27.124784469604492, "global_step": 459292, "epoch": 5533} {"train_loss": -26.957868576049805, "global_step": 459293, "epoch": 5533} {"train_loss": -27.210844039916992, "global_step": 459294, "epoch": 5533} {"train_loss": -27.214353561401367, "global_step": 459295, "epoch": 5533} {"train_loss": -27.430591583251953, "global_step": 459296, "epoch": 5533} {"train_loss": -27.047138214111328, "global_step": 459297, "epoch": 5533} {"train_loss": -27.0379695892334, "global_step": 459298, "epoch": 5533} {"train_loss": -27.2114315032959, "global_step": 459299, "epoch": 5533} {"train_loss": -27.243391036987305, "global_step": 459300, "epoch": 5533} {"train_loss": -27.21953773498535, "global_step": 459301, "epoch": 5533} {"train_loss": -26.992414474487305, "global_step": 459302, "epoch": 5533} {"train_loss": -26.985319137573242, "global_step": 459303, "epoch": 5533} {"train_loss": -26.938343048095703, "global_step": 459304, "epoch": 5533} {"train_loss": -27.003620147705078, "global_step": 459305, "epoch": 5533} {"train_loss": -26.985279083251953, "global_step": 459306, "epoch": 5533} {"train_loss": -27.224140167236328, "global_step": 459307, "epoch": 5533} {"train_loss": -27.0073299407959, "global_step": 459308, "epoch": 5533} {"train_loss": -27.122848510742188, "global_step": 459309, "epoch": 5533} {"train_loss": -27.29804039001465, "global_step": 459310, "epoch": 5533} {"train_loss": -27.185016632080078, "global_step": 459311, "epoch": 5533} {"train_loss": -26.865753173828125, "global_step": 459312, "epoch": 5533} {"train_loss": -26.80609130859375, "global_step": 459313, "epoch": 5533} {"train_loss": -27.012821197509766, "global_step": 459314, "epoch": 5533} {"train_loss": -26.996601104736328, "global_step": 459315, "epoch": 5533} {"train_loss": -27.357913970947266, "global_step": 459316, "epoch": 5533} {"train_loss": -27.31390380859375, "global_step": 459317, "epoch": 5533} {"train_loss": -27.10379981994629, "global_step": 459318, "epoch": 5533} {"train_loss": -27.348602294921875, "global_step": 459319, "epoch": 5533} {"train_loss": -26.9893798828125, "global_step": 459320, "epoch": 5533} {"train_loss": -26.81901552590979, "global_step": 459321, "epoch": 5533, "val_loss": 6432042.0} {"train_loss": -25.32573699951172, "global_step": 459322, "epoch": 5534} {"train_loss": -24.439151763916016, "global_step": 459323, "epoch": 5534} {"train_loss": -24.736066818237305, "global_step": 459324, "epoch": 5534} {"train_loss": -25.860095977783203, "global_step": 459325, "epoch": 5534} {"train_loss": -25.32268714904785, "global_step": 459326, "epoch": 5534} {"train_loss": -26.249347686767578, "global_step": 459327, "epoch": 5534} {"train_loss": -25.382970809936523, "global_step": 459328, "epoch": 5534} {"train_loss": -26.3972225189209, "global_step": 459329, "epoch": 5534} {"train_loss": -25.83817481994629, "global_step": 459330, "epoch": 5534} {"train_loss": -25.62060546875, "global_step": 459331, "epoch": 5534} {"train_loss": -26.207128524780273, "global_step": 459332, "epoch": 5534} {"train_loss": -26.109039306640625, "global_step": 459333, "epoch": 5534} {"train_loss": -26.10420799255371, "global_step": 459334, "epoch": 5534} {"train_loss": -26.032880783081055, "global_step": 459335, "epoch": 5534} {"train_loss": -26.025665283203125, "global_step": 459336, "epoch": 5534} {"train_loss": -26.226049423217773, "global_step": 459337, "epoch": 5534} {"train_loss": -26.32720947265625, "global_step": 459338, "epoch": 5534} {"train_loss": -26.3652286529541, "global_step": 459339, "epoch": 5534} {"train_loss": -26.66376304626465, "global_step": 459340, "epoch": 5534} {"train_loss": -26.12030601501465, "global_step": 459341, "epoch": 5534} {"train_loss": -26.70027732849121, "global_step": 459342, "epoch": 5534} {"train_loss": -26.18311882019043, "global_step": 459343, "epoch": 5534} {"train_loss": -26.83279800415039, "global_step": 459344, "epoch": 5534} {"train_loss": -25.993194580078125, "global_step": 459345, "epoch": 5534} {"train_loss": -26.64154052734375, "global_step": 459346, "epoch": 5534} {"train_loss": -26.338550567626953, "global_step": 459347, "epoch": 5534} {"train_loss": -26.91438102722168, "global_step": 459348, "epoch": 5534} {"train_loss": -26.881305694580078, "global_step": 459349, "epoch": 5534} {"train_loss": -26.7276554107666, "global_step": 459350, "epoch": 5534} {"train_loss": -27.027359008789062, "global_step": 459351, "epoch": 5534} {"train_loss": -26.960126876831055, "global_step": 459352, "epoch": 5534} {"train_loss": -26.75937843322754, "global_step": 459353, "epoch": 5534} {"train_loss": -26.61688232421875, "global_step": 459354, "epoch": 5534} {"train_loss": -26.290515899658203, "global_step": 459355, "epoch": 5534} {"train_loss": -26.690088272094727, "global_step": 459356, "epoch": 5534} {"train_loss": -27.06052017211914, "global_step": 459357, "epoch": 5534} {"train_loss": -26.969654083251953, "global_step": 459358, "epoch": 5534} {"train_loss": -27.067636489868164, "global_step": 459359, "epoch": 5534} {"train_loss": -26.5636043548584, "global_step": 459360, "epoch": 5534} {"train_loss": -26.672067642211914, "global_step": 459361, "epoch": 5534} {"train_loss": -26.956979751586914, "global_step": 459362, "epoch": 5534} {"train_loss": -27.01984214782715, "global_step": 459363, "epoch": 5534} {"train_loss": -26.75374412536621, "global_step": 459364, "epoch": 5534} {"train_loss": -27.04560661315918, "global_step": 459365, "epoch": 5534} {"train_loss": -26.857284545898438, "global_step": 459366, "epoch": 5534} {"train_loss": -26.996564865112305, "global_step": 459367, "epoch": 5534} {"train_loss": -27.007171630859375, "global_step": 459368, "epoch": 5534} {"train_loss": -26.845489501953125, "global_step": 459369, "epoch": 5534} {"train_loss": -26.993844985961914, "global_step": 459370, "epoch": 5534} {"train_loss": -26.90594482421875, "global_step": 459371, "epoch": 5534} {"train_loss": -27.108530044555664, "global_step": 459372, "epoch": 5534} {"train_loss": -27.267873764038086, "global_step": 459373, "epoch": 5534} {"train_loss": -27.277774810791016, "global_step": 459374, "epoch": 5534} {"train_loss": -27.1339168548584, "global_step": 459375, "epoch": 5534} {"train_loss": -27.492084503173828, "global_step": 459376, "epoch": 5534} {"train_loss": -26.664697647094727, "global_step": 459377, "epoch": 5534} {"train_loss": -27.004552841186523, "global_step": 459378, "epoch": 5534} {"train_loss": -26.982519149780273, "global_step": 459379, "epoch": 5534} {"train_loss": -27.468219757080078, "global_step": 459380, "epoch": 5534} {"train_loss": -27.17168617248535, "global_step": 459381, "epoch": 5534} {"train_loss": -26.74468994140625, "global_step": 459382, "epoch": 5534} {"train_loss": -27.28395652770996, "global_step": 459383, "epoch": 5534} {"train_loss": -27.166702270507812, "global_step": 459384, "epoch": 5534} {"train_loss": -27.418256759643555, "global_step": 459385, "epoch": 5534} {"train_loss": -27.275070190429688, "global_step": 459386, "epoch": 5534} {"train_loss": -27.35674476623535, "global_step": 459387, "epoch": 5534} {"train_loss": -27.19598960876465, "global_step": 459388, "epoch": 5534} {"train_loss": -27.294775009155273, "global_step": 459389, "epoch": 5534} {"train_loss": -27.146902084350586, "global_step": 459390, "epoch": 5534} {"train_loss": -27.25531005859375, "global_step": 459391, "epoch": 5534} {"train_loss": -27.2181453704834, "global_step": 459392, "epoch": 5534} {"train_loss": -26.671524047851562, "global_step": 459393, "epoch": 5534} {"train_loss": -26.981916427612305, "global_step": 459394, "epoch": 5534} {"train_loss": -26.8126220703125, "global_step": 459395, "epoch": 5534} {"train_loss": -27.084619522094727, "global_step": 459396, "epoch": 5534} {"train_loss": -27.143163681030273, "global_step": 459397, "epoch": 5534} {"train_loss": -27.143924713134766, "global_step": 459398, "epoch": 5534} {"train_loss": -26.975881576538086, "global_step": 459399, "epoch": 5534} {"train_loss": -26.9564151763916, "global_step": 459400, "epoch": 5534} {"train_loss": -26.993499755859375, "global_step": 459401, "epoch": 5534} {"train_loss": -27.226654052734375, "global_step": 459402, "epoch": 5534} {"train_loss": -27.61802101135254, "global_step": 459403, "epoch": 5534} {"train_loss": -26.70782544239458, "global_step": 459404, "epoch": 5534, "val_loss": 6423678.0} {"train_loss": -26.25244140625, "global_step": 459405, "epoch": 5535} {"train_loss": -26.406360626220703, "global_step": 459406, "epoch": 5535} {"train_loss": -26.533050537109375, "global_step": 459407, "epoch": 5535} {"train_loss": -26.863061904907227, "global_step": 459408, "epoch": 5535} {"train_loss": -26.68031883239746, "global_step": 459409, "epoch": 5535} {"train_loss": -26.963836669921875, "global_step": 459410, "epoch": 5535} {"train_loss": -26.819141387939453, "global_step": 459411, "epoch": 5535} {"train_loss": -26.680471420288086, "global_step": 459412, "epoch": 5535} {"train_loss": -26.74676513671875, "global_step": 459413, "epoch": 5535} {"train_loss": -26.704669952392578, "global_step": 459414, "epoch": 5535} {"train_loss": -26.72186851501465, "global_step": 459415, "epoch": 5535} {"train_loss": -26.724002838134766, "global_step": 459416, "epoch": 5535} {"train_loss": -26.519962310791016, "global_step": 459417, "epoch": 5535} {"train_loss": -26.99774742126465, "global_step": 459418, "epoch": 5535} {"train_loss": -27.017120361328125, "global_step": 459419, "epoch": 5535} {"train_loss": -27.02375602722168, "global_step": 459420, "epoch": 5535} {"train_loss": -27.034093856811523, "global_step": 459421, "epoch": 5535} {"train_loss": -27.107770919799805, "global_step": 459422, "epoch": 5535} {"train_loss": -27.010456085205078, "global_step": 459423, "epoch": 5535} {"train_loss": -27.462133407592773, "global_step": 459424, "epoch": 5535} {"train_loss": -27.15252685546875, "global_step": 459425, "epoch": 5535} {"train_loss": -27.654499053955078, "global_step": 459426, "epoch": 5535} {"train_loss": -27.34816551208496, "global_step": 459427, "epoch": 5535} {"train_loss": -26.913742065429688, "global_step": 459428, "epoch": 5535} {"train_loss": -27.0344295501709, "global_step": 459429, "epoch": 5535} {"train_loss": -26.978607177734375, "global_step": 459430, "epoch": 5535} {"train_loss": -27.324804306030273, "global_step": 459431, "epoch": 5535} {"train_loss": -27.02225112915039, "global_step": 459432, "epoch": 5535} {"train_loss": -27.094776153564453, "global_step": 459433, "epoch": 5535} {"train_loss": -27.149316787719727, "global_step": 459434, "epoch": 5535} {"train_loss": -27.15923500061035, "global_step": 459435, "epoch": 5535} {"train_loss": -27.130807876586914, "global_step": 459436, "epoch": 5535} {"train_loss": -27.188465118408203, "global_step": 459437, "epoch": 5535} {"train_loss": -26.98309326171875, "global_step": 459438, "epoch": 5535} {"train_loss": -27.30810546875, "global_step": 459439, "epoch": 5535} {"train_loss": -27.0798282623291, "global_step": 459440, "epoch": 5535} {"train_loss": -27.136615753173828, "global_step": 459441, "epoch": 5535} {"train_loss": -27.1451416015625, "global_step": 459442, "epoch": 5535} {"train_loss": -27.22516441345215, "global_step": 459443, "epoch": 5535} {"train_loss": -27.250818252563477, "global_step": 459444, "epoch": 5535} {"train_loss": -27.176794052124023, "global_step": 459445, "epoch": 5535} {"train_loss": -27.3846378326416, "global_step": 459446, "epoch": 5535} {"train_loss": -27.36066246032715, "global_step": 459447, "epoch": 5535} {"train_loss": -27.22039794921875, "global_step": 459448, "epoch": 5535} {"train_loss": -27.132965087890625, "global_step": 459449, "epoch": 5535} {"train_loss": -27.4495792388916, "global_step": 459450, "epoch": 5535} {"train_loss": -27.140884399414062, "global_step": 459451, "epoch": 5535} {"train_loss": -27.457050323486328, "global_step": 459452, "epoch": 5535} {"train_loss": -27.0248966217041, "global_step": 459453, "epoch": 5535} {"train_loss": -27.262601852416992, "global_step": 459454, "epoch": 5535} {"train_loss": -27.16135025024414, "global_step": 459455, "epoch": 5535} {"train_loss": -26.9454402923584, "global_step": 459456, "epoch": 5535} {"train_loss": -26.473529815673828, "global_step": 459457, "epoch": 5535} {"train_loss": -25.898244857788086, "global_step": 459458, "epoch": 5535} {"train_loss": -26.05596923828125, "global_step": 459459, "epoch": 5535} {"train_loss": -27.055261611938477, "global_step": 459460, "epoch": 5535} {"train_loss": -26.67648696899414, "global_step": 459461, "epoch": 5535} {"train_loss": -26.651386260986328, "global_step": 459462, "epoch": 5535} {"train_loss": -27.161291122436523, "global_step": 459463, "epoch": 5535} {"train_loss": -26.900074005126953, "global_step": 459464, "epoch": 5535} {"train_loss": -26.99726676940918, "global_step": 459465, "epoch": 5535} {"train_loss": -26.968555450439453, "global_step": 459466, "epoch": 5535} {"train_loss": -27.234243392944336, "global_step": 459467, "epoch": 5535} {"train_loss": -26.967309951782227, "global_step": 459468, "epoch": 5535} {"train_loss": -27.009342193603516, "global_step": 459469, "epoch": 5535} {"train_loss": -27.12581443786621, "global_step": 459470, "epoch": 5535} {"train_loss": -27.003320693969727, "global_step": 459471, "epoch": 5535} {"train_loss": -26.75348472595215, "global_step": 459472, "epoch": 5535} {"train_loss": -27.182830810546875, "global_step": 459473, "epoch": 5535} {"train_loss": -27.024662017822266, "global_step": 459474, "epoch": 5535} {"train_loss": -27.11139488220215, "global_step": 459475, "epoch": 5535} {"train_loss": -26.57392692565918, "global_step": 459476, "epoch": 5535} {"train_loss": -26.692060470581055, "global_step": 459477, "epoch": 5535} {"train_loss": -27.31461524963379, "global_step": 459478, "epoch": 5535} {"train_loss": -27.143171310424805, "global_step": 459479, "epoch": 5535} {"train_loss": -27.42105484008789, "global_step": 459480, "epoch": 5535} {"train_loss": -27.161130905151367, "global_step": 459481, "epoch": 5535} {"train_loss": -27.03806495666504, "global_step": 459482, "epoch": 5535} {"train_loss": -26.8743839263916, "global_step": 459483, "epoch": 5535} {"train_loss": -27.144994735717773, "global_step": 459484, "epoch": 5535} {"train_loss": -27.223983764648438, "global_step": 459485, "epoch": 5535} {"train_loss": -27.522367477416992, "global_step": 459486, "epoch": 5535} {"train_loss": -27.019591113170947, "global_step": 459487, "epoch": 5535, "val_loss": 6419994.0} {"train_loss": -26.402851104736328, "global_step": 459488, "epoch": 5536} {"train_loss": -26.308130264282227, "global_step": 459489, "epoch": 5536} {"train_loss": -26.052356719970703, "global_step": 459490, "epoch": 5536} {"train_loss": -26.5787410736084, "global_step": 459491, "epoch": 5536} {"train_loss": -26.967365264892578, "global_step": 459492, "epoch": 5536} {"train_loss": -26.474323272705078, "global_step": 459493, "epoch": 5536} {"train_loss": -26.553634643554688, "global_step": 459494, "epoch": 5536} {"train_loss": -26.510374069213867, "global_step": 459495, "epoch": 5536} {"train_loss": -26.52902603149414, "global_step": 459496, "epoch": 5536} {"train_loss": -26.64434814453125, "global_step": 459497, "epoch": 5536} {"train_loss": -26.578781127929688, "global_step": 459498, "epoch": 5536} {"train_loss": -26.775344848632812, "global_step": 459499, "epoch": 5536} {"train_loss": -26.762861251831055, "global_step": 459500, "epoch": 5536} {"train_loss": -26.80866813659668, "global_step": 459501, "epoch": 5536} {"train_loss": -26.498584747314453, "global_step": 459502, "epoch": 5536} {"train_loss": -26.733993530273438, "global_step": 459503, "epoch": 5536} {"train_loss": -27.106576919555664, "global_step": 459504, "epoch": 5536} {"train_loss": -26.6437931060791, "global_step": 459505, "epoch": 5536} {"train_loss": -26.854324340820312, "global_step": 459506, "epoch": 5536} {"train_loss": -26.906391143798828, "global_step": 459507, "epoch": 5536} {"train_loss": -26.81430435180664, "global_step": 459508, "epoch": 5536} {"train_loss": -26.7351131439209, "global_step": 459509, "epoch": 5536} {"train_loss": -26.58673667907715, "global_step": 459510, "epoch": 5536} {"train_loss": -26.768625259399414, "global_step": 459511, "epoch": 5536} {"train_loss": -26.751123428344727, "global_step": 459512, "epoch": 5536} {"train_loss": -26.877344131469727, "global_step": 459513, "epoch": 5536} {"train_loss": -27.073532104492188, "global_step": 459514, "epoch": 5536} {"train_loss": -26.718433380126953, "global_step": 459515, "epoch": 5536} {"train_loss": -27.40718650817871, "global_step": 459516, "epoch": 5536} {"train_loss": -27.095300674438477, "global_step": 459517, "epoch": 5536} {"train_loss": -26.74366569519043, "global_step": 459518, "epoch": 5536} {"train_loss": -27.01141929626465, "global_step": 459519, "epoch": 5536} {"train_loss": -27.046924591064453, "global_step": 459520, "epoch": 5536} {"train_loss": -27.001373291015625, "global_step": 459521, "epoch": 5536} {"train_loss": -27.056476593017578, "global_step": 459522, "epoch": 5536} {"train_loss": -27.202075958251953, "global_step": 459523, "epoch": 5536} {"train_loss": -26.79755210876465, "global_step": 459524, "epoch": 5536} {"train_loss": -26.990819931030273, "global_step": 459525, "epoch": 5536} {"train_loss": -27.11714744567871, "global_step": 459526, "epoch": 5536} {"train_loss": -27.26605796813965, "global_step": 459527, "epoch": 5536} {"train_loss": -27.107114791870117, "global_step": 459528, "epoch": 5536} {"train_loss": -27.201868057250977, "global_step": 459529, "epoch": 5536} {"train_loss": -27.07306480407715, "global_step": 459530, "epoch": 5536} {"train_loss": -27.27680015563965, "global_step": 459531, "epoch": 5536} {"train_loss": -27.4368896484375, "global_step": 459532, "epoch": 5536} {"train_loss": -26.729780197143555, "global_step": 459533, "epoch": 5536} {"train_loss": -27.397979736328125, "global_step": 459534, "epoch": 5536} {"train_loss": -27.214956283569336, "global_step": 459535, "epoch": 5536} {"train_loss": -27.45436668395996, "global_step": 459536, "epoch": 5536} {"train_loss": -27.106714248657227, "global_step": 459537, "epoch": 5536} {"train_loss": -26.887420654296875, "global_step": 459538, "epoch": 5536} {"train_loss": -27.246509552001953, "global_step": 459539, "epoch": 5536} {"train_loss": -27.36871337890625, "global_step": 459540, "epoch": 5536} {"train_loss": -27.041767120361328, "global_step": 459541, "epoch": 5536} {"train_loss": -27.267669677734375, "global_step": 459542, "epoch": 5536} {"train_loss": -27.314477920532227, "global_step": 459543, "epoch": 5536} {"train_loss": -26.95054054260254, "global_step": 459544, "epoch": 5536} {"train_loss": -27.54215431213379, "global_step": 459545, "epoch": 5536} {"train_loss": -27.283483505249023, "global_step": 459546, "epoch": 5536} {"train_loss": -27.29705238342285, "global_step": 459547, "epoch": 5536} {"train_loss": -26.62982749938965, "global_step": 459548, "epoch": 5536} {"train_loss": -27.272613525390625, "global_step": 459549, "epoch": 5536} {"train_loss": -27.24297523498535, "global_step": 459550, "epoch": 5536} {"train_loss": -27.35791015625, "global_step": 459551, "epoch": 5536} {"train_loss": -27.244476318359375, "global_step": 459552, "epoch": 5536} {"train_loss": -27.25575065612793, "global_step": 459553, "epoch": 5536} {"train_loss": -27.057743072509766, "global_step": 459554, "epoch": 5536} {"train_loss": -27.52485466003418, "global_step": 459555, "epoch": 5536} {"train_loss": -27.411962509155273, "global_step": 459556, "epoch": 5536} {"train_loss": -27.5992488861084, "global_step": 459557, "epoch": 5536} {"train_loss": -27.446081161499023, "global_step": 459558, "epoch": 5536} {"train_loss": -27.187744140625, "global_step": 459559, "epoch": 5536} {"train_loss": -27.123600006103516, "global_step": 459560, "epoch": 5536} {"train_loss": -27.3558349609375, "global_step": 459561, "epoch": 5536} {"train_loss": -27.506576538085938, "global_step": 459562, "epoch": 5536} {"train_loss": -27.506031036376953, "global_step": 459563, "epoch": 5536} {"train_loss": -27.37751579284668, "global_step": 459564, "epoch": 5536} {"train_loss": -26.757400512695312, "global_step": 459565, "epoch": 5536} {"train_loss": -27.1142578125, "global_step": 459566, "epoch": 5536} {"train_loss": -27.322599411010742, "global_step": 459567, "epoch": 5536} {"train_loss": -26.865991592407227, "global_step": 459568, "epoch": 5536} {"train_loss": -27.37298011779785, "global_step": 459569, "epoch": 5536} {"train_loss": -27.009613335850727, "global_step": 459570, "epoch": 5536, "val_loss": 6384634.0} {"train_loss": -27.00172233581543, "global_step": 459571, "epoch": 5537} {"train_loss": -26.702905654907227, "global_step": 459572, "epoch": 5537} {"train_loss": -26.919912338256836, "global_step": 459573, "epoch": 5537} {"train_loss": -26.904834747314453, "global_step": 459574, "epoch": 5537} {"train_loss": -26.581174850463867, "global_step": 459575, "epoch": 5537} {"train_loss": -26.90216064453125, "global_step": 459576, "epoch": 5537} {"train_loss": -26.280797958374023, "global_step": 459577, "epoch": 5537} {"train_loss": -26.580432891845703, "global_step": 459578, "epoch": 5537} {"train_loss": -26.52015495300293, "global_step": 459579, "epoch": 5537} {"train_loss": -26.578907012939453, "global_step": 459580, "epoch": 5537} {"train_loss": -26.725034713745117, "global_step": 459581, "epoch": 5537} {"train_loss": -27.022069931030273, "global_step": 459582, "epoch": 5537} {"train_loss": -27.087194442749023, "global_step": 459583, "epoch": 5537} {"train_loss": -26.604536056518555, "global_step": 459584, "epoch": 5537} {"train_loss": -26.9188175201416, "global_step": 459585, "epoch": 5537} {"train_loss": -26.91464614868164, "global_step": 459586, "epoch": 5537} {"train_loss": -26.762678146362305, "global_step": 459587, "epoch": 5537} {"train_loss": -26.90805435180664, "global_step": 459588, "epoch": 5537} {"train_loss": -27.104028701782227, "global_step": 459589, "epoch": 5537} {"train_loss": -26.996824264526367, "global_step": 459590, "epoch": 5537} {"train_loss": -26.940576553344727, "global_step": 459591, "epoch": 5537} {"train_loss": -27.106138229370117, "global_step": 459592, "epoch": 5537} {"train_loss": -27.1374454498291, "global_step": 459593, "epoch": 5537} {"train_loss": -26.984619140625, "global_step": 459594, "epoch": 5537} {"train_loss": -26.662412643432617, "global_step": 459595, "epoch": 5537} {"train_loss": -26.953351974487305, "global_step": 459596, "epoch": 5537} {"train_loss": -27.114673614501953, "global_step": 459597, "epoch": 5537} {"train_loss": -27.08990478515625, "global_step": 459598, "epoch": 5537} {"train_loss": -26.82465934753418, "global_step": 459599, "epoch": 5537} {"train_loss": -26.95987892150879, "global_step": 459600, "epoch": 5537} {"train_loss": -26.876047134399414, "global_step": 459601, "epoch": 5537} {"train_loss": -26.844696044921875, "global_step": 459602, "epoch": 5537} {"train_loss": -26.873016357421875, "global_step": 459603, "epoch": 5537} {"train_loss": -27.047887802124023, "global_step": 459604, "epoch": 5537} {"train_loss": -27.160078048706055, "global_step": 459605, "epoch": 5537} {"train_loss": -26.874723434448242, "global_step": 459606, "epoch": 5537} {"train_loss": -27.392133712768555, "global_step": 459607, "epoch": 5537} {"train_loss": -27.064523696899414, "global_step": 459608, "epoch": 5537} {"train_loss": -26.94277000427246, "global_step": 459609, "epoch": 5537} {"train_loss": -27.30832862854004, "global_step": 459610, "epoch": 5537} {"train_loss": -27.193601608276367, "global_step": 459611, "epoch": 5537} {"train_loss": -27.06618309020996, "global_step": 459612, "epoch": 5537} {"train_loss": -27.20404624938965, "global_step": 459613, "epoch": 5537} {"train_loss": -26.7695369720459, "global_step": 459614, "epoch": 5537} {"train_loss": -27.119400024414062, "global_step": 459615, "epoch": 5537} {"train_loss": -27.30230140686035, "global_step": 459616, "epoch": 5537} {"train_loss": -27.047229766845703, "global_step": 459617, "epoch": 5537} {"train_loss": -26.929367065429688, "global_step": 459618, "epoch": 5537} {"train_loss": -27.375837326049805, "global_step": 459619, "epoch": 5537} {"train_loss": -27.02459716796875, "global_step": 459620, "epoch": 5537} {"train_loss": -27.042104721069336, "global_step": 459621, "epoch": 5537} {"train_loss": -26.9814395904541, "global_step": 459622, "epoch": 5537} {"train_loss": -26.932117462158203, "global_step": 459623, "epoch": 5537} {"train_loss": -27.105737686157227, "global_step": 459624, "epoch": 5537} {"train_loss": -27.03254508972168, "global_step": 459625, "epoch": 5537} {"train_loss": -27.244998931884766, "global_step": 459626, "epoch": 5537} {"train_loss": -27.277124404907227, "global_step": 459627, "epoch": 5537} {"train_loss": -27.279809951782227, "global_step": 459628, "epoch": 5537} {"train_loss": -26.9969425201416, "global_step": 459629, "epoch": 5537} {"train_loss": -27.14456558227539, "global_step": 459630, "epoch": 5537} {"train_loss": -26.605173110961914, "global_step": 459631, "epoch": 5537} {"train_loss": -27.05018424987793, "global_step": 459632, "epoch": 5537} {"train_loss": -27.053525924682617, "global_step": 459633, "epoch": 5537} {"train_loss": -27.120283126831055, "global_step": 459634, "epoch": 5537} {"train_loss": -27.202960968017578, "global_step": 459635, "epoch": 5537} {"train_loss": -26.77239990234375, "global_step": 459636, "epoch": 5537} {"train_loss": -26.886083602905273, "global_step": 459637, "epoch": 5537} {"train_loss": -27.126529693603516, "global_step": 459638, "epoch": 5537} {"train_loss": -26.770599365234375, "global_step": 459639, "epoch": 5537} {"train_loss": -27.198293685913086, "global_step": 459640, "epoch": 5537} {"train_loss": -26.83145523071289, "global_step": 459641, "epoch": 5537} {"train_loss": -27.256839752197266, "global_step": 459642, "epoch": 5537} {"train_loss": -27.496551513671875, "global_step": 459643, "epoch": 5537} {"train_loss": -27.129663467407227, "global_step": 459644, "epoch": 5537} {"train_loss": -27.24611473083496, "global_step": 459645, "epoch": 5537} {"train_loss": -26.9193058013916, "global_step": 459646, "epoch": 5537} {"train_loss": -27.499774932861328, "global_step": 459647, "epoch": 5537} {"train_loss": -26.8250789642334, "global_step": 459648, "epoch": 5537} {"train_loss": -27.120832443237305, "global_step": 459649, "epoch": 5537} {"train_loss": -26.931299209594727, "global_step": 459650, "epoch": 5537} {"train_loss": -27.178274154663086, "global_step": 459651, "epoch": 5537} {"train_loss": -26.738178253173828, "global_step": 459652, "epoch": 5537} {"train_loss": -26.99826109552958, "global_step": 459653, "epoch": 5537, "val_loss": 6395671.0} {"train_loss": -26.86166763305664, "global_step": 459654, "epoch": 5538} {"train_loss": -25.89173698425293, "global_step": 459655, "epoch": 5538} {"train_loss": -26.47174072265625, "global_step": 459656, "epoch": 5538} {"train_loss": -26.657663345336914, "global_step": 459657, "epoch": 5538} {"train_loss": -26.06121826171875, "global_step": 459658, "epoch": 5538} {"train_loss": -26.415632247924805, "global_step": 459659, "epoch": 5538} {"train_loss": -26.496244430541992, "global_step": 459660, "epoch": 5538} {"train_loss": -26.6908016204834, "global_step": 459661, "epoch": 5538} {"train_loss": -26.660175323486328, "global_step": 459662, "epoch": 5538} {"train_loss": -26.985366821289062, "global_step": 459663, "epoch": 5538} {"train_loss": -27.101184844970703, "global_step": 459664, "epoch": 5538} {"train_loss": -26.7025203704834, "global_step": 459665, "epoch": 5538} {"train_loss": -27.14020347595215, "global_step": 459666, "epoch": 5538} {"train_loss": -26.509246826171875, "global_step": 459667, "epoch": 5538} {"train_loss": -27.01806640625, "global_step": 459668, "epoch": 5538} {"train_loss": -26.98272132873535, "global_step": 459669, "epoch": 5538} {"train_loss": -27.05438232421875, "global_step": 459670, "epoch": 5538} {"train_loss": -27.059171676635742, "global_step": 459671, "epoch": 5538} {"train_loss": -26.836502075195312, "global_step": 459672, "epoch": 5538} {"train_loss": -26.496557235717773, "global_step": 459673, "epoch": 5538} {"train_loss": -26.832971572875977, "global_step": 459674, "epoch": 5538} {"train_loss": -26.450885772705078, "global_step": 459675, "epoch": 5538} {"train_loss": -27.241943359375, "global_step": 459676, "epoch": 5538} {"train_loss": -26.747760772705078, "global_step": 459677, "epoch": 5538} {"train_loss": -26.9016056060791, "global_step": 459678, "epoch": 5538} {"train_loss": -26.965702056884766, "global_step": 459679, "epoch": 5538} {"train_loss": -26.806777954101562, "global_step": 459680, "epoch": 5538} {"train_loss": -26.95380973815918, "global_step": 459681, "epoch": 5538} {"train_loss": -27.08930015563965, "global_step": 459682, "epoch": 5538} {"train_loss": -27.10064697265625, "global_step": 459683, "epoch": 5538} {"train_loss": -27.120319366455078, "global_step": 459684, "epoch": 5538} {"train_loss": -26.853498458862305, "global_step": 459685, "epoch": 5538} {"train_loss": -26.591299057006836, "global_step": 459686, "epoch": 5538} {"train_loss": -26.70838737487793, "global_step": 459687, "epoch": 5538} {"train_loss": -27.164997100830078, "global_step": 459688, "epoch": 5538} {"train_loss": -27.3173828125, "global_step": 459689, "epoch": 5538} {"train_loss": -26.950841903686523, "global_step": 459690, "epoch": 5538} {"train_loss": -27.287403106689453, "global_step": 459691, "epoch": 5538} {"train_loss": -26.70781898498535, "global_step": 459692, "epoch": 5538} {"train_loss": -27.150421142578125, "global_step": 459693, "epoch": 5538} {"train_loss": -27.206533432006836, "global_step": 459694, "epoch": 5538} {"train_loss": -27.117467880249023, "global_step": 459695, "epoch": 5538} {"train_loss": -26.759695053100586, "global_step": 459696, "epoch": 5538} {"train_loss": -27.26215171813965, "global_step": 459697, "epoch": 5538} {"train_loss": -27.296661376953125, "global_step": 459698, "epoch": 5538} {"train_loss": -26.510953903198242, "global_step": 459699, "epoch": 5538} {"train_loss": -27.21930503845215, "global_step": 459700, "epoch": 5538} {"train_loss": -27.222517013549805, "global_step": 459701, "epoch": 5538} {"train_loss": -26.84492301940918, "global_step": 459702, "epoch": 5538} {"train_loss": -26.936613082885742, "global_step": 459703, "epoch": 5538} {"train_loss": -27.261951446533203, "global_step": 459704, "epoch": 5538} {"train_loss": -27.024137496948242, "global_step": 459705, "epoch": 5538} {"train_loss": -27.102651596069336, "global_step": 459706, "epoch": 5538} {"train_loss": -27.1011962890625, "global_step": 459707, "epoch": 5538} {"train_loss": -27.11337661743164, "global_step": 459708, "epoch": 5538} {"train_loss": -27.22980308532715, "global_step": 459709, "epoch": 5538} {"train_loss": -27.371673583984375, "global_step": 459710, "epoch": 5538} {"train_loss": -27.15972900390625, "global_step": 459711, "epoch": 5538} {"train_loss": -27.063690185546875, "global_step": 459712, "epoch": 5538} {"train_loss": -26.730539321899414, "global_step": 459713, "epoch": 5538} {"train_loss": -27.3167781829834, "global_step": 459714, "epoch": 5538} {"train_loss": -27.268346786499023, "global_step": 459715, "epoch": 5538} {"train_loss": -27.20728874206543, "global_step": 459716, "epoch": 5538} {"train_loss": -27.486539840698242, "global_step": 459717, "epoch": 5538} {"train_loss": -27.40809440612793, "global_step": 459718, "epoch": 5538} {"train_loss": -27.739614486694336, "global_step": 459719, "epoch": 5538} {"train_loss": -27.07560157775879, "global_step": 459720, "epoch": 5538} {"train_loss": -27.1009578704834, "global_step": 459721, "epoch": 5538} {"train_loss": -27.294940948486328, "global_step": 459722, "epoch": 5538} {"train_loss": -27.459890365600586, "global_step": 459723, "epoch": 5538} {"train_loss": -26.965421676635742, "global_step": 459724, "epoch": 5538} {"train_loss": -27.27834129333496, "global_step": 459725, "epoch": 5538} {"train_loss": -27.023115158081055, "global_step": 459726, "epoch": 5538} {"train_loss": -25.832813262939453, "global_step": 459727, "epoch": 5538} {"train_loss": -24.909887313842773, "global_step": 459728, "epoch": 5538} {"train_loss": -24.71927833557129, "global_step": 459729, "epoch": 5538} {"train_loss": -24.657209396362305, "global_step": 459730, "epoch": 5538} {"train_loss": -26.197647094726562, "global_step": 459731, "epoch": 5538} {"train_loss": -25.864309310913086, "global_step": 459732, "epoch": 5538} {"train_loss": -26.083454132080078, "global_step": 459733, "epoch": 5538} {"train_loss": -26.24513816833496, "global_step": 459734, "epoch": 5538} {"train_loss": -26.163564682006836, "global_step": 459735, "epoch": 5538} {"train_loss": -26.827855604240693, "global_step": 459736, "epoch": 5538, "val_loss": 6486780.0} {"train_loss": -25.732837677001953, "global_step": 459737, "epoch": 5539} {"train_loss": -24.867765426635742, "global_step": 459738, "epoch": 5539} {"train_loss": -26.334997177124023, "global_step": 459739, "epoch": 5539} {"train_loss": -25.524057388305664, "global_step": 459740, "epoch": 5539} {"train_loss": -25.54840660095215, "global_step": 459741, "epoch": 5539} {"train_loss": -25.98516273498535, "global_step": 459742, "epoch": 5539} {"train_loss": -25.86989402770996, "global_step": 459743, "epoch": 5539} {"train_loss": -26.3155517578125, "global_step": 459744, "epoch": 5539} {"train_loss": -26.214508056640625, "global_step": 459745, "epoch": 5539} {"train_loss": -25.56873893737793, "global_step": 459746, "epoch": 5539} {"train_loss": -26.47320556640625, "global_step": 459747, "epoch": 5539} {"train_loss": -26.0494441986084, "global_step": 459748, "epoch": 5539} {"train_loss": -26.459365844726562, "global_step": 459749, "epoch": 5539} {"train_loss": -26.370466232299805, "global_step": 459750, "epoch": 5539} {"train_loss": -26.50275230407715, "global_step": 459751, "epoch": 5539} {"train_loss": -26.159732818603516, "global_step": 459752, "epoch": 5539} {"train_loss": -26.301244735717773, "global_step": 459753, "epoch": 5539} {"train_loss": -26.34037208557129, "global_step": 459754, "epoch": 5539} {"train_loss": -26.480640411376953, "global_step": 459755, "epoch": 5539} {"train_loss": -26.48927116394043, "global_step": 459756, "epoch": 5539} {"train_loss": -26.29277992248535, "global_step": 459757, "epoch": 5539} {"train_loss": -26.44016456604004, "global_step": 459758, "epoch": 5539} {"train_loss": -26.60419273376465, "global_step": 459759, "epoch": 5539} {"train_loss": -26.708044052124023, "global_step": 459760, "epoch": 5539} {"train_loss": -26.626605987548828, "global_step": 459761, "epoch": 5539} {"train_loss": -26.533987045288086, "global_step": 459762, "epoch": 5539} {"train_loss": -26.916519165039062, "global_step": 459763, "epoch": 5539} {"train_loss": -26.906757354736328, "global_step": 459764, "epoch": 5539} {"train_loss": -26.75453758239746, "global_step": 459765, "epoch": 5539} {"train_loss": -26.62652015686035, "global_step": 459766, "epoch": 5539} {"train_loss": -26.816242218017578, "global_step": 459767, "epoch": 5539} {"train_loss": -27.211400985717773, "global_step": 459768, "epoch": 5539} {"train_loss": -27.06925392150879, "global_step": 459769, "epoch": 5539} {"train_loss": -26.944990158081055, "global_step": 459770, "epoch": 5539} {"train_loss": -26.80842399597168, "global_step": 459771, "epoch": 5539} {"train_loss": -27.16535758972168, "global_step": 459772, "epoch": 5539} {"train_loss": -27.03875160217285, "global_step": 459773, "epoch": 5539} {"train_loss": -27.34539794921875, "global_step": 459774, "epoch": 5539} {"train_loss": -27.28315544128418, "global_step": 459775, "epoch": 5539} {"train_loss": -27.186965942382812, "global_step": 459776, "epoch": 5539} {"train_loss": -27.239835739135742, "global_step": 459777, "epoch": 5539} {"train_loss": -27.35288429260254, "global_step": 459778, "epoch": 5539} {"train_loss": -26.951139450073242, "global_step": 459779, "epoch": 5539} {"train_loss": -27.04087257385254, "global_step": 459780, "epoch": 5539} {"train_loss": -27.175642013549805, "global_step": 459781, "epoch": 5539} {"train_loss": -26.927030563354492, "global_step": 459782, "epoch": 5539} {"train_loss": -27.0604190826416, "global_step": 459783, "epoch": 5539} {"train_loss": -27.448530197143555, "global_step": 459784, "epoch": 5539} {"train_loss": -27.381488800048828, "global_step": 459785, "epoch": 5539} {"train_loss": -27.06427574157715, "global_step": 459786, "epoch": 5539} {"train_loss": -26.975976943969727, "global_step": 459787, "epoch": 5539} {"train_loss": -27.354053497314453, "global_step": 459788, "epoch": 5539} {"train_loss": -27.021467208862305, "global_step": 459789, "epoch": 5539} {"train_loss": -27.225934982299805, "global_step": 459790, "epoch": 5539} {"train_loss": -27.696903228759766, "global_step": 459791, "epoch": 5539} {"train_loss": -27.356842041015625, "global_step": 459792, "epoch": 5539} {"train_loss": -27.506799697875977, "global_step": 459793, "epoch": 5539} {"train_loss": -27.45391273498535, "global_step": 459794, "epoch": 5539} {"train_loss": -27.123981475830078, "global_step": 459795, "epoch": 5539} {"train_loss": -27.449787139892578, "global_step": 459796, "epoch": 5539} {"train_loss": -27.30914306640625, "global_step": 459797, "epoch": 5539} {"train_loss": -27.50620460510254, "global_step": 459798, "epoch": 5539} {"train_loss": -27.34681510925293, "global_step": 459799, "epoch": 5539} {"train_loss": -27.176462173461914, "global_step": 459800, "epoch": 5539} {"train_loss": -27.026214599609375, "global_step": 459801, "epoch": 5539} {"train_loss": -26.946121215820312, "global_step": 459802, "epoch": 5539} {"train_loss": -26.959909439086914, "global_step": 459803, "epoch": 5539} {"train_loss": -27.02777099609375, "global_step": 459804, "epoch": 5539} {"train_loss": -26.7155818939209, "global_step": 459805, "epoch": 5539} {"train_loss": -27.28717041015625, "global_step": 459806, "epoch": 5539} {"train_loss": -27.00958824157715, "global_step": 459807, "epoch": 5539} {"train_loss": -27.034414291381836, "global_step": 459808, "epoch": 5539} {"train_loss": -27.2744083404541, "global_step": 459809, "epoch": 5539} {"train_loss": -27.602426528930664, "global_step": 459810, "epoch": 5539} {"train_loss": -27.186246871948242, "global_step": 459811, "epoch": 5539} {"train_loss": -27.324853897094727, "global_step": 459812, "epoch": 5539} {"train_loss": -27.27240562438965, "global_step": 459813, "epoch": 5539} {"train_loss": -27.040918350219727, "global_step": 459814, "epoch": 5539} {"train_loss": -27.231470108032227, "global_step": 459815, "epoch": 5539} {"train_loss": -27.162641525268555, "global_step": 459816, "epoch": 5539} {"train_loss": -26.481489181518555, "global_step": 459817, "epoch": 5539} {"train_loss": -26.467634201049805, "global_step": 459818, "epoch": 5539} {"train_loss": -26.805230129195984, "global_step": 459819, "epoch": 5539, "val_loss": 6276242.0} {"train_loss": -23.99777603149414, "global_step": 459820, "epoch": 5540} {"train_loss": -24.402860641479492, "global_step": 459821, "epoch": 5540} {"train_loss": -25.21054458618164, "global_step": 459822, "epoch": 5540} {"train_loss": -23.684406280517578, "global_step": 459823, "epoch": 5540} {"train_loss": -25.750715255737305, "global_step": 459824, "epoch": 5540} {"train_loss": -24.650190353393555, "global_step": 459825, "epoch": 5540} {"train_loss": -25.510051727294922, "global_step": 459826, "epoch": 5540} {"train_loss": -25.349761962890625, "global_step": 459827, "epoch": 5540} {"train_loss": -25.352832794189453, "global_step": 459828, "epoch": 5540} {"train_loss": -25.576892852783203, "global_step": 459829, "epoch": 5540} {"train_loss": -26.285146713256836, "global_step": 459830, "epoch": 5540} {"train_loss": -25.588741302490234, "global_step": 459831, "epoch": 5540} {"train_loss": -26.152667999267578, "global_step": 459832, "epoch": 5540} {"train_loss": -26.106033325195312, "global_step": 459833, "epoch": 5540} {"train_loss": -26.131235122680664, "global_step": 459834, "epoch": 5540} {"train_loss": -25.769128799438477, "global_step": 459835, "epoch": 5540} {"train_loss": -26.0164852142334, "global_step": 459836, "epoch": 5540} {"train_loss": -26.085973739624023, "global_step": 459837, "epoch": 5540} {"train_loss": -26.198348999023438, "global_step": 459838, "epoch": 5540} {"train_loss": -26.568511962890625, "global_step": 459839, "epoch": 5540} {"train_loss": -26.195819854736328, "global_step": 459840, "epoch": 5540} {"train_loss": -26.66291618347168, "global_step": 459841, "epoch": 5540} {"train_loss": -26.378192901611328, "global_step": 459842, "epoch": 5540} {"train_loss": -26.155736923217773, "global_step": 459843, "epoch": 5540} {"train_loss": -26.685077667236328, "global_step": 459844, "epoch": 5540} {"train_loss": -26.436237335205078, "global_step": 459845, "epoch": 5540} {"train_loss": -26.77741050720215, "global_step": 459846, "epoch": 5540} {"train_loss": -26.85308837890625, "global_step": 459847, "epoch": 5540} {"train_loss": -26.784757614135742, "global_step": 459848, "epoch": 5540} {"train_loss": -26.4432373046875, "global_step": 459849, "epoch": 5540} {"train_loss": -26.639602661132812, "global_step": 459850, "epoch": 5540} {"train_loss": -26.982208251953125, "global_step": 459851, "epoch": 5540} {"train_loss": -26.731969833374023, "global_step": 459852, "epoch": 5540} {"train_loss": -27.093128204345703, "global_step": 459853, "epoch": 5540} {"train_loss": -26.915246963500977, "global_step": 459854, "epoch": 5540} {"train_loss": -27.1888484954834, "global_step": 459855, "epoch": 5540} {"train_loss": -26.90423011779785, "global_step": 459856, "epoch": 5540} {"train_loss": -26.965200424194336, "global_step": 459857, "epoch": 5540} {"train_loss": -26.896595001220703, "global_step": 459858, "epoch": 5540} {"train_loss": -26.995975494384766, "global_step": 459859, "epoch": 5540} {"train_loss": -27.240177154541016, "global_step": 459860, "epoch": 5540} {"train_loss": -26.66522789001465, "global_step": 459861, "epoch": 5540} {"train_loss": -27.415430068969727, "global_step": 459862, "epoch": 5540} {"train_loss": -26.931806564331055, "global_step": 459863, "epoch": 5540} {"train_loss": -26.68958854675293, "global_step": 459864, "epoch": 5540} {"train_loss": -27.018415451049805, "global_step": 459865, "epoch": 5540} {"train_loss": -27.010324478149414, "global_step": 459866, "epoch": 5540} {"train_loss": -27.1628475189209, "global_step": 459867, "epoch": 5540} {"train_loss": -27.120161056518555, "global_step": 459868, "epoch": 5540} {"train_loss": -27.13578224182129, "global_step": 459869, "epoch": 5540} {"train_loss": -27.016357421875, "global_step": 459870, "epoch": 5540} {"train_loss": -27.391254425048828, "global_step": 459871, "epoch": 5540} {"train_loss": -27.368322372436523, "global_step": 459872, "epoch": 5540} {"train_loss": -27.24057960510254, "global_step": 459873, "epoch": 5540} {"train_loss": -27.337514877319336, "global_step": 459874, "epoch": 5540} {"train_loss": -26.625951766967773, "global_step": 459875, "epoch": 5540} {"train_loss": -27.091602325439453, "global_step": 459876, "epoch": 5540} {"train_loss": -26.778650283813477, "global_step": 459877, "epoch": 5540} {"train_loss": -26.702070236206055, "global_step": 459878, "epoch": 5540} {"train_loss": -26.902883529663086, "global_step": 459879, "epoch": 5540} {"train_loss": -26.295316696166992, "global_step": 459880, "epoch": 5540} {"train_loss": -26.492956161499023, "global_step": 459881, "epoch": 5540} {"train_loss": -26.498640060424805, "global_step": 459882, "epoch": 5540} {"train_loss": -27.27324867248535, "global_step": 459883, "epoch": 5540} {"train_loss": -26.7457332611084, "global_step": 459884, "epoch": 5540} {"train_loss": -26.872501373291016, "global_step": 459885, "epoch": 5540} {"train_loss": -26.886749267578125, "global_step": 459886, "epoch": 5540} {"train_loss": -26.82977294921875, "global_step": 459887, "epoch": 5540} {"train_loss": -26.967191696166992, "global_step": 459888, "epoch": 5540} {"train_loss": -27.283884048461914, "global_step": 459889, "epoch": 5540} {"train_loss": -26.9716739654541, "global_step": 459890, "epoch": 5540} {"train_loss": -26.977731704711914, "global_step": 459891, "epoch": 5540} {"train_loss": -27.18194580078125, "global_step": 459892, "epoch": 5540} {"train_loss": -26.85881996154785, "global_step": 459893, "epoch": 5540} {"train_loss": -27.102380752563477, "global_step": 459894, "epoch": 5540} {"train_loss": -27.087549209594727, "global_step": 459895, "epoch": 5540} {"train_loss": -27.20725440979004, "global_step": 459896, "epoch": 5540} {"train_loss": -27.292722702026367, "global_step": 459897, "epoch": 5540} {"train_loss": -27.144018173217773, "global_step": 459898, "epoch": 5540} {"train_loss": -27.211023330688477, "global_step": 459899, "epoch": 5540} {"train_loss": -26.82318115234375, "global_step": 459900, "epoch": 5540} {"train_loss": -27.075397491455078, "global_step": 459901, "epoch": 5540} {"train_loss": -26.586519218352905, "global_step": 459902, "epoch": 5540, "val_loss": 6649033.0} {"train_loss": -24.17607307434082, "global_step": 459903, "epoch": 5541} {"train_loss": -26.47504997253418, "global_step": 459904, "epoch": 5541} {"train_loss": -25.03525161743164, "global_step": 459905, "epoch": 5541} {"train_loss": -26.60453224182129, "global_step": 459906, "epoch": 5541} {"train_loss": -25.719648361206055, "global_step": 459907, "epoch": 5541} {"train_loss": -25.922348022460938, "global_step": 459908, "epoch": 5541} {"train_loss": -26.617151260375977, "global_step": 459909, "epoch": 5541} {"train_loss": -26.34500503540039, "global_step": 459910, "epoch": 5541} {"train_loss": -26.200531005859375, "global_step": 459911, "epoch": 5541} {"train_loss": -26.932891845703125, "global_step": 459912, "epoch": 5541} {"train_loss": -26.59720230102539, "global_step": 459913, "epoch": 5541} {"train_loss": -26.715747833251953, "global_step": 459914, "epoch": 5541} {"train_loss": -26.572729110717773, "global_step": 459915, "epoch": 5541} {"train_loss": -26.45722007751465, "global_step": 459916, "epoch": 5541} {"train_loss": -26.906492233276367, "global_step": 459917, "epoch": 5541} {"train_loss": -26.908544540405273, "global_step": 459918, "epoch": 5541} {"train_loss": -26.540143966674805, "global_step": 459919, "epoch": 5541} {"train_loss": -26.457883834838867, "global_step": 459920, "epoch": 5541} {"train_loss": -26.341825485229492, "global_step": 459921, "epoch": 5541} {"train_loss": -26.69160270690918, "global_step": 459922, "epoch": 5541} {"train_loss": -26.467594146728516, "global_step": 459923, "epoch": 5541} {"train_loss": -26.954055786132812, "global_step": 459924, "epoch": 5541} {"train_loss": -27.05655860900879, "global_step": 459925, "epoch": 5541} {"train_loss": -27.05600929260254, "global_step": 459926, "epoch": 5541} {"train_loss": -26.913105010986328, "global_step": 459927, "epoch": 5541} {"train_loss": -26.825010299682617, "global_step": 459928, "epoch": 5541} {"train_loss": -26.818918228149414, "global_step": 459929, "epoch": 5541} {"train_loss": -26.5976505279541, "global_step": 459930, "epoch": 5541} {"train_loss": -26.87249755859375, "global_step": 459931, "epoch": 5541} {"train_loss": -27.13886833190918, "global_step": 459932, "epoch": 5541} {"train_loss": -26.99822998046875, "global_step": 459933, "epoch": 5541} {"train_loss": -27.4654483795166, "global_step": 459934, "epoch": 5541} {"train_loss": -26.952075958251953, "global_step": 459935, "epoch": 5541} {"train_loss": -26.654279708862305, "global_step": 459936, "epoch": 5541} {"train_loss": -26.677148818969727, "global_step": 459937, "epoch": 5541} {"train_loss": -26.857885360717773, "global_step": 459938, "epoch": 5541} {"train_loss": -26.907438278198242, "global_step": 459939, "epoch": 5541} {"train_loss": -26.812543869018555, "global_step": 459940, "epoch": 5541} {"train_loss": -26.768314361572266, "global_step": 459941, "epoch": 5541} {"train_loss": -27.114429473876953, "global_step": 459942, "epoch": 5541} {"train_loss": -27.186323165893555, "global_step": 459943, "epoch": 5541} {"train_loss": -26.803146362304688, "global_step": 459944, "epoch": 5541} {"train_loss": -26.72395896911621, "global_step": 459945, "epoch": 5541} {"train_loss": -26.7939510345459, "global_step": 459946, "epoch": 5541} {"train_loss": -27.79786491394043, "global_step": 459947, "epoch": 5541} {"train_loss": -27.14884376525879, "global_step": 459948, "epoch": 5541} {"train_loss": -26.661279678344727, "global_step": 459949, "epoch": 5541} {"train_loss": -26.881622314453125, "global_step": 459950, "epoch": 5541} {"train_loss": -27.012170791625977, "global_step": 459951, "epoch": 5541} {"train_loss": -27.052932739257812, "global_step": 459952, "epoch": 5541} {"train_loss": -27.1181583404541, "global_step": 459953, "epoch": 5541} {"train_loss": -26.97989273071289, "global_step": 459954, "epoch": 5541} {"train_loss": -27.052576065063477, "global_step": 459955, "epoch": 5541} {"train_loss": -26.8824405670166, "global_step": 459956, "epoch": 5541} {"train_loss": -26.987485885620117, "global_step": 459957, "epoch": 5541} {"train_loss": -27.089162826538086, "global_step": 459958, "epoch": 5541} {"train_loss": -27.079517364501953, "global_step": 459959, "epoch": 5541} {"train_loss": -26.861112594604492, "global_step": 459960, "epoch": 5541} {"train_loss": -27.0693416595459, "global_step": 459961, "epoch": 5541} {"train_loss": -26.9340877532959, "global_step": 459962, "epoch": 5541} {"train_loss": -27.064605712890625, "global_step": 459963, "epoch": 5541} {"train_loss": -27.128808975219727, "global_step": 459964, "epoch": 5541} {"train_loss": -27.00398063659668, "global_step": 459965, "epoch": 5541} {"train_loss": -27.162368774414062, "global_step": 459966, "epoch": 5541} {"train_loss": -27.17432975769043, "global_step": 459967, "epoch": 5541} {"train_loss": -27.304052352905273, "global_step": 459968, "epoch": 5541} {"train_loss": -26.912433624267578, "global_step": 459969, "epoch": 5541} {"train_loss": -27.039915084838867, "global_step": 459970, "epoch": 5541} {"train_loss": -27.203115463256836, "global_step": 459971, "epoch": 5541} {"train_loss": -27.471460342407227, "global_step": 459972, "epoch": 5541} {"train_loss": -27.71832847595215, "global_step": 459973, "epoch": 5541} {"train_loss": -27.325122833251953, "global_step": 459974, "epoch": 5541} {"train_loss": -27.205936431884766, "global_step": 459975, "epoch": 5541} {"train_loss": -27.310224533081055, "global_step": 459976, "epoch": 5541} {"train_loss": -27.1613712310791, "global_step": 459977, "epoch": 5541} {"train_loss": -27.177305221557617, "global_step": 459978, "epoch": 5541} {"train_loss": -27.552770614624023, "global_step": 459979, "epoch": 5541} {"train_loss": -27.36566162109375, "global_step": 459980, "epoch": 5541} {"train_loss": -27.472883224487305, "global_step": 459981, "epoch": 5541} {"train_loss": -27.217742919921875, "global_step": 459982, "epoch": 5541} {"train_loss": -27.043481826782227, "global_step": 459983, "epoch": 5541} {"train_loss": -27.08819580078125, "global_step": 459984, "epoch": 5541} {"train_loss": -26.869595631059394, "global_step": 459985, "epoch": 5541, "val_loss": 6659204.0} {"train_loss": -26.203754425048828, "global_step": 459986, "epoch": 5542} {"train_loss": -25.988937377929688, "global_step": 459987, "epoch": 5542} {"train_loss": -25.899877548217773, "global_step": 459988, "epoch": 5542} {"train_loss": -27.059467315673828, "global_step": 459989, "epoch": 5542} {"train_loss": -26.412229537963867, "global_step": 459990, "epoch": 5542} {"train_loss": -26.044416427612305, "global_step": 459991, "epoch": 5542} {"train_loss": -25.269454956054688, "global_step": 459992, "epoch": 5542} {"train_loss": -25.657934188842773, "global_step": 459993, "epoch": 5542} {"train_loss": -26.91084861755371, "global_step": 459994, "epoch": 5542} {"train_loss": -26.263463973999023, "global_step": 459995, "epoch": 5542} {"train_loss": -26.555601119995117, "global_step": 459996, "epoch": 5542} {"train_loss": -26.639333724975586, "global_step": 459997, "epoch": 5542} {"train_loss": -26.385812759399414, "global_step": 459998, "epoch": 5542} {"train_loss": -27.11468505859375, "global_step": 459999, "epoch": 5542} {"train_loss": -26.829029083251953, "global_step": 460000, "epoch": 5542} {"train_loss": -26.818674087524414, "global_step": 460001, "epoch": 5542} {"train_loss": -26.6407527923584, "global_step": 460002, "epoch": 5542} {"train_loss": -26.914871215820312, "global_step": 460003, "epoch": 5542} {"train_loss": -26.901111602783203, "global_step": 460004, "epoch": 5542} {"train_loss": -26.901037216186523, "global_step": 460005, "epoch": 5542} {"train_loss": -27.104787826538086, "global_step": 460006, "epoch": 5542} {"train_loss": -26.76896095275879, "global_step": 460007, "epoch": 5542} {"train_loss": -27.21427345275879, "global_step": 460008, "epoch": 5542} {"train_loss": -26.94980812072754, "global_step": 460009, "epoch": 5542} {"train_loss": -27.151227951049805, "global_step": 460010, "epoch": 5542} {"train_loss": -26.801538467407227, "global_step": 460011, "epoch": 5542} {"train_loss": -27.025100708007812, "global_step": 460012, "epoch": 5542} {"train_loss": -27.072778701782227, "global_step": 460013, "epoch": 5542} {"train_loss": -26.78312110900879, "global_step": 460014, "epoch": 5542} {"train_loss": -27.238828659057617, "global_step": 460015, "epoch": 5542} {"train_loss": -27.092132568359375, "global_step": 460016, "epoch": 5542} {"train_loss": -27.4110050201416, "global_step": 460017, "epoch": 5542} {"train_loss": -27.360931396484375, "global_step": 460018, "epoch": 5542} {"train_loss": -26.840076446533203, "global_step": 460019, "epoch": 5542} {"train_loss": -27.14930534362793, "global_step": 460020, "epoch": 5542} {"train_loss": -26.84164810180664, "global_step": 460021, "epoch": 5542} {"train_loss": -27.445362091064453, "global_step": 460022, "epoch": 5542} {"train_loss": -27.056320190429688, "global_step": 460023, "epoch": 5542} {"train_loss": -27.11720085144043, "global_step": 460024, "epoch": 5542} {"train_loss": -27.140600204467773, "global_step": 460025, "epoch": 5542} {"train_loss": -27.527484893798828, "global_step": 460026, "epoch": 5542} {"train_loss": -27.29962158203125, "global_step": 460027, "epoch": 5542} {"train_loss": -27.166345596313477, "global_step": 460028, "epoch": 5542} {"train_loss": -27.368850708007812, "global_step": 460029, "epoch": 5542} {"train_loss": -27.3841609954834, "global_step": 460030, "epoch": 5542} {"train_loss": -27.0570011138916, "global_step": 460031, "epoch": 5542} {"train_loss": -27.213443756103516, "global_step": 460032, "epoch": 5542} {"train_loss": -27.52772331237793, "global_step": 460033, "epoch": 5542} {"train_loss": -27.451452255249023, "global_step": 460034, "epoch": 5542} {"train_loss": -27.263080596923828, "global_step": 460035, "epoch": 5542} {"train_loss": -27.313156127929688, "global_step": 460036, "epoch": 5542} {"train_loss": -26.8828182220459, "global_step": 460037, "epoch": 5542} {"train_loss": -26.855932235717773, "global_step": 460038, "epoch": 5542} {"train_loss": -27.211191177368164, "global_step": 460039, "epoch": 5542} {"train_loss": -27.0301513671875, "global_step": 460040, "epoch": 5542} {"train_loss": -26.783111572265625, "global_step": 460041, "epoch": 5542} {"train_loss": -26.90865135192871, "global_step": 460042, "epoch": 5542} {"train_loss": -26.998071670532227, "global_step": 460043, "epoch": 5542} {"train_loss": -27.435108184814453, "global_step": 460044, "epoch": 5542} {"train_loss": -27.093793869018555, "global_step": 460045, "epoch": 5542} {"train_loss": -27.166767120361328, "global_step": 460046, "epoch": 5542} {"train_loss": -27.692548751831055, "global_step": 460047, "epoch": 5542} {"train_loss": -27.171255111694336, "global_step": 460048, "epoch": 5542} {"train_loss": -27.29792594909668, "global_step": 460049, "epoch": 5542} {"train_loss": -26.82550621032715, "global_step": 460050, "epoch": 5542} {"train_loss": -27.331445693969727, "global_step": 460051, "epoch": 5542} {"train_loss": -27.21729850769043, "global_step": 460052, "epoch": 5542} {"train_loss": -27.452661514282227, "global_step": 460053, "epoch": 5542} {"train_loss": -27.219263076782227, "global_step": 460054, "epoch": 5542} {"train_loss": -27.0982608795166, "global_step": 460055, "epoch": 5542} {"train_loss": -26.860986709594727, "global_step": 460056, "epoch": 5542} {"train_loss": -26.871753692626953, "global_step": 460057, "epoch": 5542} {"train_loss": -27.10849380493164, "global_step": 460058, "epoch": 5542} {"train_loss": -27.374364852905273, "global_step": 460059, "epoch": 5542} {"train_loss": -27.075193405151367, "global_step": 460060, "epoch": 5542} {"train_loss": -27.121809005737305, "global_step": 460061, "epoch": 5542} {"train_loss": -26.719919204711914, "global_step": 460062, "epoch": 5542} {"train_loss": -26.979663848876953, "global_step": 460063, "epoch": 5542} {"train_loss": -27.533288955688477, "global_step": 460064, "epoch": 5542} {"train_loss": -27.299484252929688, "global_step": 460065, "epoch": 5542} {"train_loss": -26.650497436523438, "global_step": 460066, "epoch": 5542} {"train_loss": -26.5556640625, "global_step": 460067, "epoch": 5542} {"train_loss": -26.964050545749895, "global_step": 460068, "epoch": 5542, "val_loss": 6693623.0} {"train_loss": -26.950788497924805, "global_step": 460069, "epoch": 5543} {"train_loss": -26.498477935791016, "global_step": 460070, "epoch": 5543} {"train_loss": -27.429410934448242, "global_step": 460071, "epoch": 5543} {"train_loss": -26.485218048095703, "global_step": 460072, "epoch": 5543} {"train_loss": -26.796613693237305, "global_step": 460073, "epoch": 5543} {"train_loss": -26.705556869506836, "global_step": 460074, "epoch": 5543} {"train_loss": -26.73101234436035, "global_step": 460075, "epoch": 5543} {"train_loss": -27.011533737182617, "global_step": 460076, "epoch": 5543} {"train_loss": -26.9030818939209, "global_step": 460077, "epoch": 5543} {"train_loss": -26.464313507080078, "global_step": 460078, "epoch": 5543} {"train_loss": -27.149322509765625, "global_step": 460079, "epoch": 5543} {"train_loss": -26.546558380126953, "global_step": 460080, "epoch": 5543} {"train_loss": -26.71128273010254, "global_step": 460081, "epoch": 5543} {"train_loss": -26.86802101135254, "global_step": 460082, "epoch": 5543} {"train_loss": -26.8879337310791, "global_step": 460083, "epoch": 5543} {"train_loss": -26.7965145111084, "global_step": 460084, "epoch": 5543} {"train_loss": -26.902158737182617, "global_step": 460085, "epoch": 5543} {"train_loss": -27.428037643432617, "global_step": 460086, "epoch": 5543} {"train_loss": -26.803726196289062, "global_step": 460087, "epoch": 5543} {"train_loss": -26.778623580932617, "global_step": 460088, "epoch": 5543} {"train_loss": -27.38351821899414, "global_step": 460089, "epoch": 5543} {"train_loss": -27.084379196166992, "global_step": 460090, "epoch": 5543} {"train_loss": -26.81341552734375, "global_step": 460091, "epoch": 5543} {"train_loss": -26.97391700744629, "global_step": 460092, "epoch": 5543} {"train_loss": -27.015363693237305, "global_step": 460093, "epoch": 5543} {"train_loss": -26.77829933166504, "global_step": 460094, "epoch": 5543} {"train_loss": -27.172473907470703, "global_step": 460095, "epoch": 5543} {"train_loss": -27.260950088500977, "global_step": 460096, "epoch": 5543} {"train_loss": -27.198354721069336, "global_step": 460097, "epoch": 5543} {"train_loss": -26.82672119140625, "global_step": 460098, "epoch": 5543} {"train_loss": -26.579206466674805, "global_step": 460099, "epoch": 5543} {"train_loss": -26.984481811523438, "global_step": 460100, "epoch": 5543} {"train_loss": -27.15382194519043, "global_step": 460101, "epoch": 5543} {"train_loss": -26.988880157470703, "global_step": 460102, "epoch": 5543} {"train_loss": -27.02834129333496, "global_step": 460103, "epoch": 5543} {"train_loss": -27.25247573852539, "global_step": 460104, "epoch": 5543} {"train_loss": -27.02137565612793, "global_step": 460105, "epoch": 5543} {"train_loss": -27.0263671875, "global_step": 460106, "epoch": 5543} {"train_loss": -27.233423233032227, "global_step": 460107, "epoch": 5543} {"train_loss": -27.12298011779785, "global_step": 460108, "epoch": 5543} {"train_loss": -26.91770362854004, "global_step": 460109, "epoch": 5543} {"train_loss": -27.107873916625977, "global_step": 460110, "epoch": 5543} {"train_loss": -27.68195915222168, "global_step": 460111, "epoch": 5543} {"train_loss": -27.333219528198242, "global_step": 460112, "epoch": 5543} {"train_loss": -27.03009033203125, "global_step": 460113, "epoch": 5543} {"train_loss": -27.096420288085938, "global_step": 460114, "epoch": 5543} {"train_loss": -27.084030151367188, "global_step": 460115, "epoch": 5543} {"train_loss": -27.26767349243164, "global_step": 460116, "epoch": 5543} {"train_loss": -27.531469345092773, "global_step": 460117, "epoch": 5543} {"train_loss": -27.4622859954834, "global_step": 460118, "epoch": 5543} {"train_loss": -27.37019157409668, "global_step": 460119, "epoch": 5543} {"train_loss": -27.410797119140625, "global_step": 460120, "epoch": 5543} {"train_loss": -27.36910057067871, "global_step": 460121, "epoch": 5543} {"train_loss": -26.798192977905273, "global_step": 460122, "epoch": 5543} {"train_loss": -27.140501022338867, "global_step": 460123, "epoch": 5543} {"train_loss": -27.4378604888916, "global_step": 460124, "epoch": 5543} {"train_loss": -27.011951446533203, "global_step": 460125, "epoch": 5543} {"train_loss": -26.920185089111328, "global_step": 460126, "epoch": 5543} {"train_loss": -26.780012130737305, "global_step": 460127, "epoch": 5543} {"train_loss": -26.922101974487305, "global_step": 460128, "epoch": 5543} {"train_loss": -27.032230377197266, "global_step": 460129, "epoch": 5543} {"train_loss": -27.126434326171875, "global_step": 460130, "epoch": 5543} {"train_loss": -26.95111083984375, "global_step": 460131, "epoch": 5543} {"train_loss": -26.9700927734375, "global_step": 460132, "epoch": 5543} {"train_loss": -26.94024658203125, "global_step": 460133, "epoch": 5543} {"train_loss": -27.242996215820312, "global_step": 460134, "epoch": 5543} {"train_loss": -27.073566436767578, "global_step": 460135, "epoch": 5543} {"train_loss": -27.173368453979492, "global_step": 460136, "epoch": 5543} {"train_loss": -27.238183975219727, "global_step": 460137, "epoch": 5543} {"train_loss": -27.6989803314209, "global_step": 460138, "epoch": 5543} {"train_loss": -27.164525985717773, "global_step": 460139, "epoch": 5543} {"train_loss": -27.297794342041016, "global_step": 460140, "epoch": 5543} {"train_loss": -27.10298728942871, "global_step": 460141, "epoch": 5543} {"train_loss": -27.036975860595703, "global_step": 460142, "epoch": 5543} {"train_loss": -27.629236221313477, "global_step": 460143, "epoch": 5543} {"train_loss": -27.069599151611328, "global_step": 460144, "epoch": 5543} {"train_loss": -27.28550148010254, "global_step": 460145, "epoch": 5543} {"train_loss": -27.25360679626465, "global_step": 460146, "epoch": 5543} {"train_loss": -27.23076820373535, "global_step": 460147, "epoch": 5543} {"train_loss": -26.941150665283203, "global_step": 460148, "epoch": 5543} {"train_loss": -27.357105255126953, "global_step": 460149, "epoch": 5543} {"train_loss": -27.435022354125977, "global_step": 460150, "epoch": 5543} {"train_loss": -27.07215752659074, "global_step": 460151, "epoch": 5543, "val_loss": 6616087.0} {"train_loss": -26.312536239624023, "global_step": 460152, "epoch": 5544} {"train_loss": -26.165210723876953, "global_step": 460153, "epoch": 5544} {"train_loss": -26.183746337890625, "global_step": 460154, "epoch": 5544} {"train_loss": -26.7960262298584, "global_step": 460155, "epoch": 5544} {"train_loss": -27.35590934753418, "global_step": 460156, "epoch": 5544} {"train_loss": -26.648544311523438, "global_step": 460157, "epoch": 5544} {"train_loss": -26.74713706970215, "global_step": 460158, "epoch": 5544} {"train_loss": -26.8154239654541, "global_step": 460159, "epoch": 5544} {"train_loss": -26.89230728149414, "global_step": 460160, "epoch": 5544} {"train_loss": -26.700727462768555, "global_step": 460161, "epoch": 5544} {"train_loss": -26.81875991821289, "global_step": 460162, "epoch": 5544} {"train_loss": -27.077131271362305, "global_step": 460163, "epoch": 5544} {"train_loss": -27.166961669921875, "global_step": 460164, "epoch": 5544} {"train_loss": -26.9138126373291, "global_step": 460165, "epoch": 5544} {"train_loss": -27.051910400390625, "global_step": 460166, "epoch": 5544} {"train_loss": -27.079309463500977, "global_step": 460167, "epoch": 5544} {"train_loss": -27.054798126220703, "global_step": 460168, "epoch": 5544} {"train_loss": -27.334503173828125, "global_step": 460169, "epoch": 5544} {"train_loss": -27.01844596862793, "global_step": 460170, "epoch": 5544} {"train_loss": -26.992752075195312, "global_step": 460171, "epoch": 5544} {"train_loss": -26.922779083251953, "global_step": 460172, "epoch": 5544} {"train_loss": -27.07723045349121, "global_step": 460173, "epoch": 5544} {"train_loss": -26.906408309936523, "global_step": 460174, "epoch": 5544} {"train_loss": -27.195331573486328, "global_step": 460175, "epoch": 5544} {"train_loss": -27.3435115814209, "global_step": 460176, "epoch": 5544} {"train_loss": -27.13787269592285, "global_step": 460177, "epoch": 5544} {"train_loss": -27.28740882873535, "global_step": 460178, "epoch": 5544} {"train_loss": -27.09638023376465, "global_step": 460179, "epoch": 5544} {"train_loss": -26.94944190979004, "global_step": 460180, "epoch": 5544} {"train_loss": -27.039031982421875, "global_step": 460181, "epoch": 5544} {"train_loss": -27.1484432220459, "global_step": 460182, "epoch": 5544} {"train_loss": -27.19287109375, "global_step": 460183, "epoch": 5544} {"train_loss": -26.97760581970215, "global_step": 460184, "epoch": 5544} {"train_loss": -27.366819381713867, "global_step": 460185, "epoch": 5544} {"train_loss": -27.207334518432617, "global_step": 460186, "epoch": 5544} {"train_loss": -26.947416305541992, "global_step": 460187, "epoch": 5544} {"train_loss": -27.378568649291992, "global_step": 460188, "epoch": 5544} {"train_loss": -27.392850875854492, "global_step": 460189, "epoch": 5544} {"train_loss": -26.966161727905273, "global_step": 460190, "epoch": 5544} {"train_loss": -27.224210739135742, "global_step": 460191, "epoch": 5544} {"train_loss": -27.028776168823242, "global_step": 460192, "epoch": 5544} {"train_loss": -27.350961685180664, "global_step": 460193, "epoch": 5544} {"train_loss": -26.74432945251465, "global_step": 460194, "epoch": 5544} {"train_loss": -27.051008224487305, "global_step": 460195, "epoch": 5544} {"train_loss": -27.239866256713867, "global_step": 460196, "epoch": 5544} {"train_loss": -27.433332443237305, "global_step": 460197, "epoch": 5544} {"train_loss": -26.856201171875, "global_step": 460198, "epoch": 5544} {"train_loss": -27.29074478149414, "global_step": 460199, "epoch": 5544} {"train_loss": -27.17877769470215, "global_step": 460200, "epoch": 5544} {"train_loss": -27.222814559936523, "global_step": 460201, "epoch": 5544} {"train_loss": -26.780963897705078, "global_step": 460202, "epoch": 5544} {"train_loss": -27.38124656677246, "global_step": 460203, "epoch": 5544} {"train_loss": -27.497241973876953, "global_step": 460204, "epoch": 5544} {"train_loss": -27.136962890625, "global_step": 460205, "epoch": 5544} {"train_loss": -27.105884552001953, "global_step": 460206, "epoch": 5544} {"train_loss": -27.352880477905273, "global_step": 460207, "epoch": 5544} {"train_loss": -27.346603393554688, "global_step": 460208, "epoch": 5544} {"train_loss": -27.155664443969727, "global_step": 460209, "epoch": 5544} {"train_loss": -26.604068756103516, "global_step": 460210, "epoch": 5544} {"train_loss": -26.773752212524414, "global_step": 460211, "epoch": 5544} {"train_loss": -27.176969528198242, "global_step": 460212, "epoch": 5544} {"train_loss": -26.632461547851562, "global_step": 460213, "epoch": 5544} {"train_loss": -26.90094566345215, "global_step": 460214, "epoch": 5544} {"train_loss": -27.006134033203125, "global_step": 460215, "epoch": 5544} {"train_loss": -26.968473434448242, "global_step": 460216, "epoch": 5544} {"train_loss": -27.2028865814209, "global_step": 460217, "epoch": 5544} {"train_loss": -27.313934326171875, "global_step": 460218, "epoch": 5544} {"train_loss": -27.161649703979492, "global_step": 460219, "epoch": 5544} {"train_loss": -27.23578453063965, "global_step": 460220, "epoch": 5544} {"train_loss": -27.18695068359375, "global_step": 460221, "epoch": 5544} {"train_loss": -26.949430465698242, "global_step": 460222, "epoch": 5544} {"train_loss": -27.223377227783203, "global_step": 460223, "epoch": 5544} {"train_loss": -27.345199584960938, "global_step": 460224, "epoch": 5544} {"train_loss": -27.140607833862305, "global_step": 460225, "epoch": 5544} {"train_loss": -27.1533145904541, "global_step": 460226, "epoch": 5544} {"train_loss": -27.05254554748535, "global_step": 460227, "epoch": 5544} {"train_loss": -27.152612686157227, "global_step": 460228, "epoch": 5544} {"train_loss": -27.282989501953125, "global_step": 460229, "epoch": 5544} {"train_loss": -27.21368408203125, "global_step": 460230, "epoch": 5544} {"train_loss": -26.94223976135254, "global_step": 460231, "epoch": 5544} {"train_loss": -27.27033805847168, "global_step": 460232, "epoch": 5544} {"train_loss": -27.074726104736328, "global_step": 460233, "epoch": 5544} {"train_loss": -27.058807671788227, "global_step": 460234, "epoch": 5544, "val_loss": 6571119.0} {"train_loss": -26.988311767578125, "global_step": 460235, "epoch": 5545} {"train_loss": -26.995649337768555, "global_step": 460236, "epoch": 5545} {"train_loss": -26.98944664001465, "global_step": 460237, "epoch": 5545} {"train_loss": -26.55177116394043, "global_step": 460238, "epoch": 5545} {"train_loss": -27.101978302001953, "global_step": 460239, "epoch": 5545} {"train_loss": -26.963544845581055, "global_step": 460240, "epoch": 5545} {"train_loss": -27.033910751342773, "global_step": 460241, "epoch": 5545} {"train_loss": -26.773014068603516, "global_step": 460242, "epoch": 5545} {"train_loss": -27.031787872314453, "global_step": 460243, "epoch": 5545} {"train_loss": -26.906904220581055, "global_step": 460244, "epoch": 5545} {"train_loss": -26.990875244140625, "global_step": 460245, "epoch": 5545} {"train_loss": -27.407180786132812, "global_step": 460246, "epoch": 5545} {"train_loss": -26.90016746520996, "global_step": 460247, "epoch": 5545} {"train_loss": -26.712858200073242, "global_step": 460248, "epoch": 5545} {"train_loss": -27.38667869567871, "global_step": 460249, "epoch": 5545} {"train_loss": -27.2891845703125, "global_step": 460250, "epoch": 5545} {"train_loss": -27.096179962158203, "global_step": 460251, "epoch": 5545} {"train_loss": -27.066608428955078, "global_step": 460252, "epoch": 5545} {"train_loss": -27.3471736907959, "global_step": 460253, "epoch": 5545} {"train_loss": -27.008697509765625, "global_step": 460254, "epoch": 5545} {"train_loss": -26.987049102783203, "global_step": 460255, "epoch": 5545} {"train_loss": -27.35407066345215, "global_step": 460256, "epoch": 5545} {"train_loss": -27.048171997070312, "global_step": 460257, "epoch": 5545} {"train_loss": -27.11492919921875, "global_step": 460258, "epoch": 5545} {"train_loss": -27.119720458984375, "global_step": 460259, "epoch": 5545} {"train_loss": -27.148279190063477, "global_step": 460260, "epoch": 5545} {"train_loss": -27.37190055847168, "global_step": 460261, "epoch": 5545} {"train_loss": -27.046716690063477, "global_step": 460262, "epoch": 5545} {"train_loss": -26.9085636138916, "global_step": 460263, "epoch": 5545} {"train_loss": -27.356952667236328, "global_step": 460264, "epoch": 5545} {"train_loss": -27.241785049438477, "global_step": 460265, "epoch": 5545} {"train_loss": -27.2960205078125, "global_step": 460266, "epoch": 5545} {"train_loss": -26.89163589477539, "global_step": 460267, "epoch": 5545} {"train_loss": -27.68975257873535, "global_step": 460268, "epoch": 5545} {"train_loss": -27.265125274658203, "global_step": 460269, "epoch": 5545} {"train_loss": -27.042469024658203, "global_step": 460270, "epoch": 5545} {"train_loss": -27.386499404907227, "global_step": 460271, "epoch": 5545} {"train_loss": -27.2055721282959, "global_step": 460272, "epoch": 5545} {"train_loss": -26.95473289489746, "global_step": 460273, "epoch": 5545} {"train_loss": -26.828214645385742, "global_step": 460274, "epoch": 5545} {"train_loss": -27.201587677001953, "global_step": 460275, "epoch": 5545} {"train_loss": -27.33064842224121, "global_step": 460276, "epoch": 5545} {"train_loss": -26.933801651000977, "global_step": 460277, "epoch": 5545} {"train_loss": -27.15455436706543, "global_step": 460278, "epoch": 5545} {"train_loss": -27.39246940612793, "global_step": 460279, "epoch": 5545} {"train_loss": -26.88117027282715, "global_step": 460280, "epoch": 5545} {"train_loss": -26.973257064819336, "global_step": 460281, "epoch": 5545} {"train_loss": -26.8122615814209, "global_step": 460282, "epoch": 5545} {"train_loss": -26.7298641204834, "global_step": 460283, "epoch": 5545} {"train_loss": -27.514820098876953, "global_step": 460284, "epoch": 5545} {"train_loss": -27.07320213317871, "global_step": 460285, "epoch": 5545} {"train_loss": -26.842309951782227, "global_step": 460286, "epoch": 5545} {"train_loss": -26.78192138671875, "global_step": 460287, "epoch": 5545} {"train_loss": -26.421222686767578, "global_step": 460288, "epoch": 5545} {"train_loss": -27.053739547729492, "global_step": 460289, "epoch": 5545} {"train_loss": -26.980304718017578, "global_step": 460290, "epoch": 5545} {"train_loss": -26.173431396484375, "global_step": 460291, "epoch": 5545} {"train_loss": -26.310699462890625, "global_step": 460292, "epoch": 5545} {"train_loss": -27.145551681518555, "global_step": 460293, "epoch": 5545} {"train_loss": -26.868322372436523, "global_step": 460294, "epoch": 5545} {"train_loss": -26.824981689453125, "global_step": 460295, "epoch": 5545} {"train_loss": -26.9592227935791, "global_step": 460296, "epoch": 5545} {"train_loss": -27.143646240234375, "global_step": 460297, "epoch": 5545} {"train_loss": -26.75331687927246, "global_step": 460298, "epoch": 5545} {"train_loss": -27.16776466369629, "global_step": 460299, "epoch": 5545} {"train_loss": -26.81540298461914, "global_step": 460300, "epoch": 5545} {"train_loss": -27.015857696533203, "global_step": 460301, "epoch": 5545} {"train_loss": -27.467788696289062, "global_step": 460302, "epoch": 5545} {"train_loss": -26.959638595581055, "global_step": 460303, "epoch": 5545} {"train_loss": -27.251310348510742, "global_step": 460304, "epoch": 5545} {"train_loss": -27.46657371520996, "global_step": 460305, "epoch": 5545} {"train_loss": -27.14043617248535, "global_step": 460306, "epoch": 5545} {"train_loss": -27.2235164642334, "global_step": 460307, "epoch": 5545} {"train_loss": -26.834802627563477, "global_step": 460308, "epoch": 5545} {"train_loss": -27.34779167175293, "global_step": 460309, "epoch": 5545} {"train_loss": -26.910120010375977, "global_step": 460310, "epoch": 5545} {"train_loss": -26.94662857055664, "global_step": 460311, "epoch": 5545} {"train_loss": -27.162031173706055, "global_step": 460312, "epoch": 5545} {"train_loss": -27.0758113861084, "global_step": 460313, "epoch": 5545} {"train_loss": -26.538251876831055, "global_step": 460314, "epoch": 5545} {"train_loss": -26.9946346282959, "global_step": 460315, "epoch": 5545} {"train_loss": -26.79281997680664, "global_step": 460316, "epoch": 5545} {"train_loss": -27.040945673563396, "global_step": 460317, "epoch": 5545, "val_loss": 6638387.0} {"train_loss": -26.37344741821289, "global_step": 460318, "epoch": 5546} {"train_loss": -26.918848037719727, "global_step": 460319, "epoch": 5546} {"train_loss": -26.03301429748535, "global_step": 460320, "epoch": 5546} {"train_loss": -26.535003662109375, "global_step": 460321, "epoch": 5546} {"train_loss": -27.095279693603516, "global_step": 460322, "epoch": 5546} {"train_loss": -26.437042236328125, "global_step": 460323, "epoch": 5546} {"train_loss": -26.1507568359375, "global_step": 460324, "epoch": 5546} {"train_loss": -26.078855514526367, "global_step": 460325, "epoch": 5546} {"train_loss": -26.8404483795166, "global_step": 460326, "epoch": 5546} {"train_loss": -26.447553634643555, "global_step": 460327, "epoch": 5546} {"train_loss": -26.38117027282715, "global_step": 460328, "epoch": 5546} {"train_loss": -26.542104721069336, "global_step": 460329, "epoch": 5546} {"train_loss": -26.049362182617188, "global_step": 460330, "epoch": 5546} {"train_loss": -26.708906173706055, "global_step": 460331, "epoch": 5546} {"train_loss": -26.96625328063965, "global_step": 460332, "epoch": 5546} {"train_loss": -26.589643478393555, "global_step": 460333, "epoch": 5546} {"train_loss": -27.02900505065918, "global_step": 460334, "epoch": 5546} {"train_loss": -26.835250854492188, "global_step": 460335, "epoch": 5546} {"train_loss": -26.82805824279785, "global_step": 460336, "epoch": 5546} {"train_loss": -26.532751083374023, "global_step": 460337, "epoch": 5546} {"train_loss": -27.115991592407227, "global_step": 460338, "epoch": 5546} {"train_loss": -26.80975914001465, "global_step": 460339, "epoch": 5546} {"train_loss": -26.95804786682129, "global_step": 460340, "epoch": 5546} {"train_loss": -26.877973556518555, "global_step": 460341, "epoch": 5546} {"train_loss": -26.8776912689209, "global_step": 460342, "epoch": 5546} {"train_loss": -26.93903160095215, "global_step": 460343, "epoch": 5546} {"train_loss": -26.783842086791992, "global_step": 460344, "epoch": 5546} {"train_loss": -27.216527938842773, "global_step": 460345, "epoch": 5546} {"train_loss": -26.87982177734375, "global_step": 460346, "epoch": 5546} {"train_loss": -26.913984298706055, "global_step": 460347, "epoch": 5546} {"train_loss": -27.100751876831055, "global_step": 460348, "epoch": 5546} {"train_loss": -26.665679931640625, "global_step": 460349, "epoch": 5546} {"train_loss": -26.887527465820312, "global_step": 460350, "epoch": 5546} {"train_loss": -26.832727432250977, "global_step": 460351, "epoch": 5546} {"train_loss": -27.157001495361328, "global_step": 460352, "epoch": 5546} {"train_loss": -26.981382369995117, "global_step": 460353, "epoch": 5546} {"train_loss": -26.6112060546875, "global_step": 460354, "epoch": 5546} {"train_loss": -27.024499893188477, "global_step": 460355, "epoch": 5546} {"train_loss": -27.15769386291504, "global_step": 460356, "epoch": 5546} {"train_loss": -27.272974014282227, "global_step": 460357, "epoch": 5546} {"train_loss": -27.315628051757812, "global_step": 460358, "epoch": 5546} {"train_loss": -27.119924545288086, "global_step": 460359, "epoch": 5546} {"train_loss": -27.124298095703125, "global_step": 460360, "epoch": 5546} {"train_loss": -27.213031768798828, "global_step": 460361, "epoch": 5546} {"train_loss": -27.330549240112305, "global_step": 460362, "epoch": 5546} {"train_loss": -27.069610595703125, "global_step": 460363, "epoch": 5546} {"train_loss": -27.5408992767334, "global_step": 460364, "epoch": 5546} {"train_loss": -27.120288848876953, "global_step": 460365, "epoch": 5546} {"train_loss": -27.406713485717773, "global_step": 460366, "epoch": 5546} {"train_loss": -27.3707218170166, "global_step": 460367, "epoch": 5546} {"train_loss": -27.113561630249023, "global_step": 460368, "epoch": 5546} {"train_loss": -26.83441162109375, "global_step": 460369, "epoch": 5546} {"train_loss": -27.212194442749023, "global_step": 460370, "epoch": 5546} {"train_loss": -27.459436416625977, "global_step": 460371, "epoch": 5546} {"train_loss": -27.335952758789062, "global_step": 460372, "epoch": 5546} {"train_loss": -27.527118682861328, "global_step": 460373, "epoch": 5546} {"train_loss": -27.0056209564209, "global_step": 460374, "epoch": 5546} {"train_loss": -27.31317710876465, "global_step": 460375, "epoch": 5546} {"train_loss": -27.437713623046875, "global_step": 460376, "epoch": 5546} {"train_loss": -26.975906372070312, "global_step": 460377, "epoch": 5546} {"train_loss": -26.932031631469727, "global_step": 460378, "epoch": 5546} {"train_loss": -27.4283390045166, "global_step": 460379, "epoch": 5546} {"train_loss": -27.182287216186523, "global_step": 460380, "epoch": 5546} {"train_loss": -27.266376495361328, "global_step": 460381, "epoch": 5546} {"train_loss": -27.399560928344727, "global_step": 460382, "epoch": 5546} {"train_loss": -26.91572380065918, "global_step": 460383, "epoch": 5546} {"train_loss": -27.090978622436523, "global_step": 460384, "epoch": 5546} {"train_loss": -27.15907096862793, "global_step": 460385, "epoch": 5546} {"train_loss": -27.468652725219727, "global_step": 460386, "epoch": 5546} {"train_loss": -26.800024032592773, "global_step": 460387, "epoch": 5546} {"train_loss": -27.32732582092285, "global_step": 460388, "epoch": 5546} {"train_loss": -26.810556411743164, "global_step": 460389, "epoch": 5546} {"train_loss": -26.505970001220703, "global_step": 460390, "epoch": 5546} {"train_loss": -26.06587028503418, "global_step": 460391, "epoch": 5546} {"train_loss": -26.617231369018555, "global_step": 460392, "epoch": 5546} {"train_loss": -27.162174224853516, "global_step": 460393, "epoch": 5546} {"train_loss": -27.153478622436523, "global_step": 460394, "epoch": 5546} {"train_loss": -26.47393798828125, "global_step": 460395, "epoch": 5546} {"train_loss": -27.014881134033203, "global_step": 460396, "epoch": 5546} {"train_loss": -26.743017196655273, "global_step": 460397, "epoch": 5546} {"train_loss": -27.091999053955078, "global_step": 460398, "epoch": 5546} {"train_loss": -27.322690963745117, "global_step": 460399, "epoch": 5546} {"train_loss": -26.931318903543865, "global_step": 460400, "epoch": 5546, "val_loss": 6644063.5} {"train_loss": -25.693159103393555, "global_step": 460401, "epoch": 5547} {"train_loss": -25.674152374267578, "global_step": 460402, "epoch": 5547} {"train_loss": -25.329015731811523, "global_step": 460403, "epoch": 5547} {"train_loss": -25.604772567749023, "global_step": 460404, "epoch": 5547} {"train_loss": -26.10686683654785, "global_step": 460405, "epoch": 5547} {"train_loss": -25.34662628173828, "global_step": 460406, "epoch": 5547} {"train_loss": -26.614309310913086, "global_step": 460407, "epoch": 5547} {"train_loss": -26.606603622436523, "global_step": 460408, "epoch": 5547} {"train_loss": -26.412809371948242, "global_step": 460409, "epoch": 5547} {"train_loss": -26.45782470703125, "global_step": 460410, "epoch": 5547} {"train_loss": -26.50690269470215, "global_step": 460411, "epoch": 5547} {"train_loss": -26.755308151245117, "global_step": 460412, "epoch": 5547} {"train_loss": -27.120466232299805, "global_step": 460413, "epoch": 5547} {"train_loss": -26.531946182250977, "global_step": 460414, "epoch": 5547} {"train_loss": -26.62353515625, "global_step": 460415, "epoch": 5547} {"train_loss": -26.463998794555664, "global_step": 460416, "epoch": 5547} {"train_loss": -26.76523208618164, "global_step": 460417, "epoch": 5547} {"train_loss": -26.869983673095703, "global_step": 460418, "epoch": 5547} {"train_loss": -26.982772827148438, "global_step": 460419, "epoch": 5547} {"train_loss": -26.741357803344727, "global_step": 460420, "epoch": 5547} {"train_loss": -26.76283836364746, "global_step": 460421, "epoch": 5547} {"train_loss": -26.618610382080078, "global_step": 460422, "epoch": 5547} {"train_loss": -27.224157333374023, "global_step": 460423, "epoch": 5547} {"train_loss": -26.712726593017578, "global_step": 460424, "epoch": 5547} {"train_loss": -26.772891998291016, "global_step": 460425, "epoch": 5547} {"train_loss": -26.866613388061523, "global_step": 460426, "epoch": 5547} {"train_loss": -26.97382164001465, "global_step": 460427, "epoch": 5547} {"train_loss": -27.311614990234375, "global_step": 460428, "epoch": 5547} {"train_loss": -26.673343658447266, "global_step": 460429, "epoch": 5547} {"train_loss": -27.131610870361328, "global_step": 460430, "epoch": 5547} {"train_loss": -27.127038955688477, "global_step": 460431, "epoch": 5547} {"train_loss": -27.023406982421875, "global_step": 460432, "epoch": 5547} {"train_loss": -27.2051944732666, "global_step": 460433, "epoch": 5547} {"train_loss": -27.033056259155273, "global_step": 460434, "epoch": 5547} {"train_loss": -26.894851684570312, "global_step": 460435, "epoch": 5547} {"train_loss": -27.23734474182129, "global_step": 460436, "epoch": 5547} {"train_loss": -26.946210861206055, "global_step": 460437, "epoch": 5547} {"train_loss": -27.289575576782227, "global_step": 460438, "epoch": 5547} {"train_loss": -27.4686279296875, "global_step": 460439, "epoch": 5547} {"train_loss": -27.24539566040039, "global_step": 460440, "epoch": 5547} {"train_loss": -26.909198760986328, "global_step": 460441, "epoch": 5547} {"train_loss": -27.6726016998291, "global_step": 460442, "epoch": 5547} {"train_loss": -27.175445556640625, "global_step": 460443, "epoch": 5547} {"train_loss": -27.2791805267334, "global_step": 460444, "epoch": 5547} {"train_loss": -27.265295028686523, "global_step": 460445, "epoch": 5547} {"train_loss": -27.086698532104492, "global_step": 460446, "epoch": 5547} {"train_loss": -27.379547119140625, "global_step": 460447, "epoch": 5547} {"train_loss": -27.08184242248535, "global_step": 460448, "epoch": 5547} {"train_loss": -26.918222427368164, "global_step": 460449, "epoch": 5547} {"train_loss": -27.3712100982666, "global_step": 460450, "epoch": 5547} {"train_loss": -27.34429931640625, "global_step": 460451, "epoch": 5547} {"train_loss": -27.123046875, "global_step": 460452, "epoch": 5547} {"train_loss": -27.090900421142578, "global_step": 460453, "epoch": 5547} {"train_loss": -27.360212326049805, "global_step": 460454, "epoch": 5547} {"train_loss": -26.963926315307617, "global_step": 460455, "epoch": 5547} {"train_loss": -27.194021224975586, "global_step": 460456, "epoch": 5547} {"train_loss": -27.51654052734375, "global_step": 460457, "epoch": 5547} {"train_loss": -27.14371109008789, "global_step": 460458, "epoch": 5547} {"train_loss": -27.051956176757812, "global_step": 460459, "epoch": 5547} {"train_loss": -26.76962661743164, "global_step": 460460, "epoch": 5547} {"train_loss": -26.543109893798828, "global_step": 460461, "epoch": 5547} {"train_loss": -26.6685848236084, "global_step": 460462, "epoch": 5547} {"train_loss": -26.390884399414062, "global_step": 460463, "epoch": 5547} {"train_loss": -26.830524444580078, "global_step": 460464, "epoch": 5547} {"train_loss": -27.160566329956055, "global_step": 460465, "epoch": 5547} {"train_loss": -26.933805465698242, "global_step": 460466, "epoch": 5547} {"train_loss": -27.0928955078125, "global_step": 460467, "epoch": 5547} {"train_loss": -26.9468994140625, "global_step": 460468, "epoch": 5547} {"train_loss": -26.96760368347168, "global_step": 460469, "epoch": 5547} {"train_loss": -27.240177154541016, "global_step": 460470, "epoch": 5547} {"train_loss": -27.038869857788086, "global_step": 460471, "epoch": 5547} {"train_loss": -26.48993492126465, "global_step": 460472, "epoch": 5547} {"train_loss": -26.570037841796875, "global_step": 460473, "epoch": 5547} {"train_loss": -26.57574462890625, "global_step": 460474, "epoch": 5547} {"train_loss": -26.793201446533203, "global_step": 460475, "epoch": 5547} {"train_loss": -26.905622482299805, "global_step": 460476, "epoch": 5547} {"train_loss": -26.91916275024414, "global_step": 460477, "epoch": 5547} {"train_loss": -26.465824127197266, "global_step": 460478, "epoch": 5547} {"train_loss": -27.174854278564453, "global_step": 460479, "epoch": 5547} {"train_loss": -27.00396156311035, "global_step": 460480, "epoch": 5547} {"train_loss": -26.631872177124023, "global_step": 460481, "epoch": 5547} {"train_loss": -26.74668312072754, "global_step": 460482, "epoch": 5547} {"train_loss": -26.850198263145355, "global_step": 460483, "epoch": 5547, "val_loss": 6691391.0} {"train_loss": -25.6546688079834, "global_step": 460484, "epoch": 5548} {"train_loss": -26.130298614501953, "global_step": 460485, "epoch": 5548} {"train_loss": -25.900604248046875, "global_step": 460486, "epoch": 5548} {"train_loss": -26.262914657592773, "global_step": 460487, "epoch": 5548} {"train_loss": -26.084823608398438, "global_step": 460488, "epoch": 5548} {"train_loss": -26.406970977783203, "global_step": 460489, "epoch": 5548} {"train_loss": -26.27410316467285, "global_step": 460490, "epoch": 5548} {"train_loss": -26.407007217407227, "global_step": 460491, "epoch": 5548} {"train_loss": -26.576223373413086, "global_step": 460492, "epoch": 5548} {"train_loss": -26.348358154296875, "global_step": 460493, "epoch": 5548} {"train_loss": -26.538293838500977, "global_step": 460494, "epoch": 5548} {"train_loss": -26.245849609375, "global_step": 460495, "epoch": 5548} {"train_loss": -26.807861328125, "global_step": 460496, "epoch": 5548} {"train_loss": -26.234649658203125, "global_step": 460497, "epoch": 5548} {"train_loss": -26.283445358276367, "global_step": 460498, "epoch": 5548} {"train_loss": -26.22540855407715, "global_step": 460499, "epoch": 5548} {"train_loss": -26.4991397857666, "global_step": 460500, "epoch": 5548} {"train_loss": -26.463581085205078, "global_step": 460501, "epoch": 5548} {"train_loss": -26.53037452697754, "global_step": 460502, "epoch": 5548} {"train_loss": -26.54729652404785, "global_step": 460503, "epoch": 5548} {"train_loss": -26.848562240600586, "global_step": 460504, "epoch": 5548} {"train_loss": -26.56544303894043, "global_step": 460505, "epoch": 5548} {"train_loss": -26.7335262298584, "global_step": 460506, "epoch": 5548} {"train_loss": -26.491804122924805, "global_step": 460507, "epoch": 5548} {"train_loss": -27.00685691833496, "global_step": 460508, "epoch": 5548} {"train_loss": -26.90815544128418, "global_step": 460509, "epoch": 5548} {"train_loss": -26.66358757019043, "global_step": 460510, "epoch": 5548} {"train_loss": -26.774885177612305, "global_step": 460511, "epoch": 5548} {"train_loss": -26.95928955078125, "global_step": 460512, "epoch": 5548} {"train_loss": -26.80632972717285, "global_step": 460513, "epoch": 5548} {"train_loss": -26.80401039123535, "global_step": 460514, "epoch": 5548} {"train_loss": -26.867231369018555, "global_step": 460515, "epoch": 5548} {"train_loss": -27.108139038085938, "global_step": 460516, "epoch": 5548} {"train_loss": -27.052892684936523, "global_step": 460517, "epoch": 5548} {"train_loss": -27.0910587310791, "global_step": 460518, "epoch": 5548} {"train_loss": -27.061033248901367, "global_step": 460519, "epoch": 5548} {"train_loss": -26.577289581298828, "global_step": 460520, "epoch": 5548} {"train_loss": -26.957935333251953, "global_step": 460521, "epoch": 5548} {"train_loss": -27.068506240844727, "global_step": 460522, "epoch": 5548} {"train_loss": -26.815027236938477, "global_step": 460523, "epoch": 5548} {"train_loss": -27.357391357421875, "global_step": 460524, "epoch": 5548} {"train_loss": -27.206573486328125, "global_step": 460525, "epoch": 5548} {"train_loss": -27.239959716796875, "global_step": 460526, "epoch": 5548} {"train_loss": -27.23126220703125, "global_step": 460527, "epoch": 5548} {"train_loss": -27.317235946655273, "global_step": 460528, "epoch": 5548} {"train_loss": -27.303390502929688, "global_step": 460529, "epoch": 5548} {"train_loss": -27.059900283813477, "global_step": 460530, "epoch": 5548} {"train_loss": -27.628198623657227, "global_step": 460531, "epoch": 5548} {"train_loss": -27.427017211914062, "global_step": 460532, "epoch": 5548} {"train_loss": -26.878555297851562, "global_step": 460533, "epoch": 5548} {"train_loss": -27.14198112487793, "global_step": 460534, "epoch": 5548} {"train_loss": -27.381107330322266, "global_step": 460535, "epoch": 5548} {"train_loss": -27.137113571166992, "global_step": 460536, "epoch": 5548} {"train_loss": -26.977975845336914, "global_step": 460537, "epoch": 5548} {"train_loss": -27.47527503967285, "global_step": 460538, "epoch": 5548} {"train_loss": -27.404077529907227, "global_step": 460539, "epoch": 5548} {"train_loss": -27.6440372467041, "global_step": 460540, "epoch": 5548} {"train_loss": -27.370349884033203, "global_step": 460541, "epoch": 5548} {"train_loss": -27.307117462158203, "global_step": 460542, "epoch": 5548} {"train_loss": -27.95556640625, "global_step": 460543, "epoch": 5548} {"train_loss": -27.297224044799805, "global_step": 460544, "epoch": 5548} {"train_loss": -27.55619239807129, "global_step": 460545, "epoch": 5548} {"train_loss": -26.669889450073242, "global_step": 460546, "epoch": 5548} {"train_loss": -27.21982765197754, "global_step": 460547, "epoch": 5548} {"train_loss": -26.955686569213867, "global_step": 460548, "epoch": 5548} {"train_loss": -27.272735595703125, "global_step": 460549, "epoch": 5548} {"train_loss": -27.191442489624023, "global_step": 460550, "epoch": 5548} {"train_loss": -27.081735610961914, "global_step": 460551, "epoch": 5548} {"train_loss": -26.97243309020996, "global_step": 460552, "epoch": 5548} {"train_loss": -27.3040828704834, "global_step": 460553, "epoch": 5548} {"train_loss": -26.862396240234375, "global_step": 460554, "epoch": 5548} {"train_loss": -27.394453048706055, "global_step": 460555, "epoch": 5548} {"train_loss": -27.7696475982666, "global_step": 460556, "epoch": 5548} {"train_loss": -27.187650680541992, "global_step": 460557, "epoch": 5548} {"train_loss": -26.862869262695312, "global_step": 460558, "epoch": 5548} {"train_loss": -27.056921005249023, "global_step": 460559, "epoch": 5548} {"train_loss": -26.863540649414062, "global_step": 460560, "epoch": 5548} {"train_loss": -26.788543701171875, "global_step": 460561, "epoch": 5548} {"train_loss": -26.250335693359375, "global_step": 460562, "epoch": 5548} {"train_loss": -26.268461227416992, "global_step": 460563, "epoch": 5548} {"train_loss": -26.024616241455078, "global_step": 460564, "epoch": 5548} {"train_loss": -26.9649715423584, "global_step": 460565, "epoch": 5548} {"train_loss": -26.87311684941671, "global_step": 460566, "epoch": 5548, "val_loss": 6673955.5} {"train_loss": -24.913965225219727, "global_step": 460567, "epoch": 5549} {"train_loss": -24.24744987487793, "global_step": 460568, "epoch": 5549} {"train_loss": -24.397907257080078, "global_step": 460569, "epoch": 5549} {"train_loss": -25.83791160583496, "global_step": 460570, "epoch": 5549} {"train_loss": -25.37727928161621, "global_step": 460571, "epoch": 5549} {"train_loss": -25.169219970703125, "global_step": 460572, "epoch": 5549} {"train_loss": -25.890851974487305, "global_step": 460573, "epoch": 5549} {"train_loss": -25.448774337768555, "global_step": 460574, "epoch": 5549} {"train_loss": -26.115863800048828, "global_step": 460575, "epoch": 5549} {"train_loss": -26.208898544311523, "global_step": 460576, "epoch": 5549} {"train_loss": -26.399677276611328, "global_step": 460577, "epoch": 5549} {"train_loss": -25.329744338989258, "global_step": 460578, "epoch": 5549} {"train_loss": -26.217004776000977, "global_step": 460579, "epoch": 5549} {"train_loss": -26.263174057006836, "global_step": 460580, "epoch": 5549} {"train_loss": -26.06146812438965, "global_step": 460581, "epoch": 5549} {"train_loss": -26.089527130126953, "global_step": 460582, "epoch": 5549} {"train_loss": -26.2639217376709, "global_step": 460583, "epoch": 5549} {"train_loss": -26.461278915405273, "global_step": 460584, "epoch": 5549} {"train_loss": -26.33966636657715, "global_step": 460585, "epoch": 5549} {"train_loss": -26.502084732055664, "global_step": 460586, "epoch": 5549} {"train_loss": -26.873676300048828, "global_step": 460587, "epoch": 5549} {"train_loss": -26.53070068359375, "global_step": 460588, "epoch": 5549} {"train_loss": -26.42405128479004, "global_step": 460589, "epoch": 5549} {"train_loss": -26.8673038482666, "global_step": 460590, "epoch": 5549} {"train_loss": -27.15622901916504, "global_step": 460591, "epoch": 5549} {"train_loss": -26.547607421875, "global_step": 460592, "epoch": 5549} {"train_loss": -26.90579605102539, "global_step": 460593, "epoch": 5549} {"train_loss": -26.36629295349121, "global_step": 460594, "epoch": 5549} {"train_loss": -26.7633113861084, "global_step": 460595, "epoch": 5549} {"train_loss": -26.770307540893555, "global_step": 460596, "epoch": 5549} {"train_loss": -26.666015625, "global_step": 460597, "epoch": 5549} {"train_loss": -26.416278839111328, "global_step": 460598, "epoch": 5549} {"train_loss": -27.094501495361328, "global_step": 460599, "epoch": 5549} {"train_loss": -26.5433292388916, "global_step": 460600, "epoch": 5549} {"train_loss": -26.696386337280273, "global_step": 460601, "epoch": 5549} {"train_loss": -27.130908966064453, "global_step": 460602, "epoch": 5549} {"train_loss": -26.699689865112305, "global_step": 460603, "epoch": 5549} {"train_loss": -27.101364135742188, "global_step": 460604, "epoch": 5549} {"train_loss": -27.241958618164062, "global_step": 460605, "epoch": 5549} {"train_loss": -26.972858428955078, "global_step": 460606, "epoch": 5549} {"train_loss": -27.076013565063477, "global_step": 460607, "epoch": 5549} {"train_loss": -27.001672744750977, "global_step": 460608, "epoch": 5549} {"train_loss": -27.319263458251953, "global_step": 460609, "epoch": 5549} {"train_loss": -26.74671745300293, "global_step": 460610, "epoch": 5549} {"train_loss": -27.175058364868164, "global_step": 460611, "epoch": 5549} {"train_loss": -26.88495445251465, "global_step": 460612, "epoch": 5549} {"train_loss": -26.84610939025879, "global_step": 460613, "epoch": 5549} {"train_loss": -26.802942276000977, "global_step": 460614, "epoch": 5549} {"train_loss": -27.060932159423828, "global_step": 460615, "epoch": 5549} {"train_loss": -26.950946807861328, "global_step": 460616, "epoch": 5549} {"train_loss": -27.46746253967285, "global_step": 460617, "epoch": 5549} {"train_loss": -27.303686141967773, "global_step": 460618, "epoch": 5549} {"train_loss": -27.263416290283203, "global_step": 460619, "epoch": 5549} {"train_loss": -26.783191680908203, "global_step": 460620, "epoch": 5549} {"train_loss": -27.100650787353516, "global_step": 460621, "epoch": 5549} {"train_loss": -27.09598731994629, "global_step": 460622, "epoch": 5549} {"train_loss": -27.691757202148438, "global_step": 460623, "epoch": 5549} {"train_loss": -27.379125595092773, "global_step": 460624, "epoch": 5549} {"train_loss": -27.225629806518555, "global_step": 460625, "epoch": 5549} {"train_loss": -27.005605697631836, "global_step": 460626, "epoch": 5549} {"train_loss": -27.604694366455078, "global_step": 460627, "epoch": 5549} {"train_loss": -27.031827926635742, "global_step": 460628, "epoch": 5549} {"train_loss": -27.217910766601562, "global_step": 460629, "epoch": 5549} {"train_loss": -26.8996639251709, "global_step": 460630, "epoch": 5549} {"train_loss": -26.89202308654785, "global_step": 460631, "epoch": 5549} {"train_loss": -26.974628448486328, "global_step": 460632, "epoch": 5549} {"train_loss": -27.235843658447266, "global_step": 460633, "epoch": 5549} {"train_loss": -27.048749923706055, "global_step": 460634, "epoch": 5549} {"train_loss": -26.919797897338867, "global_step": 460635, "epoch": 5549} {"train_loss": -27.42927360534668, "global_step": 460636, "epoch": 5549} {"train_loss": -26.806018829345703, "global_step": 460637, "epoch": 5549} {"train_loss": -27.209365844726562, "global_step": 460638, "epoch": 5549} {"train_loss": -27.299116134643555, "global_step": 460639, "epoch": 5549} {"train_loss": -27.18180274963379, "global_step": 460640, "epoch": 5549} {"train_loss": -27.0875186920166, "global_step": 460641, "epoch": 5549} {"train_loss": -27.136615753173828, "global_step": 460642, "epoch": 5549} {"train_loss": -26.960205078125, "global_step": 460643, "epoch": 5549} {"train_loss": -26.89859390258789, "global_step": 460644, "epoch": 5549} {"train_loss": -27.14862632751465, "global_step": 460645, "epoch": 5549} {"train_loss": -27.226354598999023, "global_step": 460646, "epoch": 5549} {"train_loss": -27.130691528320312, "global_step": 460647, "epoch": 5549} {"train_loss": -27.38895606994629, "global_step": 460648, "epoch": 5549} {"train_loss": -26.71055747801999, "global_step": 460649, "epoch": 5549, "val_loss": 6543045.5} {"train_loss": -26.342987060546875, "global_step": 460650, "epoch": 5550} {"train_loss": -26.57400894165039, "global_step": 460651, "epoch": 5550} {"train_loss": -26.632749557495117, "global_step": 460652, "epoch": 5550} {"train_loss": -26.404388427734375, "global_step": 460653, "epoch": 5550} {"train_loss": -26.270639419555664, "global_step": 460654, "epoch": 5550} {"train_loss": -26.089624404907227, "global_step": 460655, "epoch": 5550} {"train_loss": -26.895462036132812, "global_step": 460656, "epoch": 5550} {"train_loss": -26.50905418395996, "global_step": 460657, "epoch": 5550} {"train_loss": -26.211761474609375, "global_step": 460658, "epoch": 5550} {"train_loss": -26.518774032592773, "global_step": 460659, "epoch": 5550} {"train_loss": -26.658903121948242, "global_step": 460660, "epoch": 5550} {"train_loss": -26.08892822265625, "global_step": 460661, "epoch": 5550} {"train_loss": -26.672534942626953, "global_step": 460662, "epoch": 5550} {"train_loss": -26.578786849975586, "global_step": 460663, "epoch": 5550} {"train_loss": -27.092334747314453, "global_step": 460664, "epoch": 5550} {"train_loss": -26.746143341064453, "global_step": 460665, "epoch": 5550} {"train_loss": -26.642658233642578, "global_step": 460666, "epoch": 5550} {"train_loss": -26.489225387573242, "global_step": 460667, "epoch": 5550} {"train_loss": -26.551435470581055, "global_step": 460668, "epoch": 5550} {"train_loss": -26.81068229675293, "global_step": 460669, "epoch": 5550} {"train_loss": -26.835596084594727, "global_step": 460670, "epoch": 5550} {"train_loss": -26.834524154663086, "global_step": 460671, "epoch": 5550} {"train_loss": -26.8033504486084, "global_step": 460672, "epoch": 5550} {"train_loss": -26.502517700195312, "global_step": 460673, "epoch": 5550} {"train_loss": -27.05392837524414, "global_step": 460674, "epoch": 5550} {"train_loss": -26.654325485229492, "global_step": 460675, "epoch": 5550} {"train_loss": -26.56878662109375, "global_step": 460676, "epoch": 5550} {"train_loss": -26.549325942993164, "global_step": 460677, "epoch": 5550} {"train_loss": -27.071792602539062, "global_step": 460678, "epoch": 5550} {"train_loss": -26.92921257019043, "global_step": 460679, "epoch": 5550} {"train_loss": -26.81953239440918, "global_step": 460680, "epoch": 5550} {"train_loss": -27.119062423706055, "global_step": 460681, "epoch": 5550} {"train_loss": -27.196516036987305, "global_step": 460682, "epoch": 5550} {"train_loss": -27.128870010375977, "global_step": 460683, "epoch": 5550} {"train_loss": -27.181364059448242, "global_step": 460684, "epoch": 5550} {"train_loss": -27.349584579467773, "global_step": 460685, "epoch": 5550} {"train_loss": -27.122333526611328, "global_step": 460686, "epoch": 5550} {"train_loss": -26.9478816986084, "global_step": 460687, "epoch": 5550} {"train_loss": -26.660541534423828, "global_step": 460688, "epoch": 5550} {"train_loss": -26.85908317565918, "global_step": 460689, "epoch": 5550} {"train_loss": -27.070737838745117, "global_step": 460690, "epoch": 5550} {"train_loss": -26.908405303955078, "global_step": 460691, "epoch": 5550} {"train_loss": -27.33078384399414, "global_step": 460692, "epoch": 5550} {"train_loss": -26.841110229492188, "global_step": 460693, "epoch": 5550} {"train_loss": -27.52768325805664, "global_step": 460694, "epoch": 5550} {"train_loss": -27.380462646484375, "global_step": 460695, "epoch": 5550} {"train_loss": -27.19362449645996, "global_step": 460696, "epoch": 5550} {"train_loss": -26.96927261352539, "global_step": 460697, "epoch": 5550} {"train_loss": -27.223852157592773, "global_step": 460698, "epoch": 5550} {"train_loss": -27.07002830505371, "global_step": 460699, "epoch": 5550} {"train_loss": -27.2112979888916, "global_step": 460700, "epoch": 5550} {"train_loss": -27.34514808654785, "global_step": 460701, "epoch": 5550} {"train_loss": -27.08060073852539, "global_step": 460702, "epoch": 5550} {"train_loss": -26.9082088470459, "global_step": 460703, "epoch": 5550} {"train_loss": -27.242645263671875, "global_step": 460704, "epoch": 5550} {"train_loss": -27.144079208374023, "global_step": 460705, "epoch": 5550} {"train_loss": -27.037763595581055, "global_step": 460706, "epoch": 5550} {"train_loss": -27.20232582092285, "global_step": 460707, "epoch": 5550} {"train_loss": -27.36591148376465, "global_step": 460708, "epoch": 5550} {"train_loss": -27.256025314331055, "global_step": 460709, "epoch": 5550} {"train_loss": -27.400909423828125, "global_step": 460710, "epoch": 5550} {"train_loss": -26.91335105895996, "global_step": 460711, "epoch": 5550} {"train_loss": -27.127582550048828, "global_step": 460712, "epoch": 5550} {"train_loss": -26.9903621673584, "global_step": 460713, "epoch": 5550} {"train_loss": -26.798574447631836, "global_step": 460714, "epoch": 5550} {"train_loss": -26.73689842224121, "global_step": 460715, "epoch": 5550} {"train_loss": -26.72296714782715, "global_step": 460716, "epoch": 5550} {"train_loss": -26.807514190673828, "global_step": 460717, "epoch": 5550} {"train_loss": -27.020898818969727, "global_step": 460718, "epoch": 5550} {"train_loss": -26.93918800354004, "global_step": 460719, "epoch": 5550} {"train_loss": -26.713285446166992, "global_step": 460720, "epoch": 5550} {"train_loss": -26.997900009155273, "global_step": 460721, "epoch": 5550} {"train_loss": -27.231021881103516, "global_step": 460722, "epoch": 5550} {"train_loss": -26.9094181060791, "global_step": 460723, "epoch": 5550} {"train_loss": -27.410770416259766, "global_step": 460724, "epoch": 5550} {"train_loss": -27.0113582611084, "global_step": 460725, "epoch": 5550} {"train_loss": -26.93159294128418, "global_step": 460726, "epoch": 5550} {"train_loss": -27.466344833374023, "global_step": 460727, "epoch": 5550} {"train_loss": -27.1657772064209, "global_step": 460728, "epoch": 5550} {"train_loss": -27.32341957092285, "global_step": 460729, "epoch": 5550} {"train_loss": -27.25762367248535, "global_step": 460730, "epoch": 5550} {"train_loss": -26.96864128112793, "global_step": 460731, "epoch": 5550} {"train_loss": -26.907541504825453, "global_step": 460732, "epoch": 5550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8181818181818182, "val_loss": 6579049.0} {"train_loss": -26.88916015625, "global_step": 460733, "epoch": 5551} {"train_loss": -26.761016845703125, "global_step": 460734, "epoch": 5551} {"train_loss": -26.578369140625, "global_step": 460735, "epoch": 5551} {"train_loss": -26.927200317382812, "global_step": 460736, "epoch": 5551} {"train_loss": -26.811731338500977, "global_step": 460737, "epoch": 5551} {"train_loss": -26.615758895874023, "global_step": 460738, "epoch": 5551} {"train_loss": -26.940444946289062, "global_step": 460739, "epoch": 5551} {"train_loss": -27.242603302001953, "global_step": 460740, "epoch": 5551} {"train_loss": -27.2485408782959, "global_step": 460741, "epoch": 5551} {"train_loss": -26.898529052734375, "global_step": 460742, "epoch": 5551} {"train_loss": -26.882568359375, "global_step": 460743, "epoch": 5551} {"train_loss": -27.064117431640625, "global_step": 460744, "epoch": 5551} {"train_loss": -26.905893325805664, "global_step": 460745, "epoch": 5551} {"train_loss": -26.977279663085938, "global_step": 460746, "epoch": 5551} {"train_loss": -27.13172721862793, "global_step": 460747, "epoch": 5551} {"train_loss": -26.993595123291016, "global_step": 460748, "epoch": 5551} {"train_loss": -27.4951114654541, "global_step": 460749, "epoch": 5551} {"train_loss": -27.0577449798584, "global_step": 460750, "epoch": 5551} {"train_loss": -27.077865600585938, "global_step": 460751, "epoch": 5551} {"train_loss": -27.228551864624023, "global_step": 460752, "epoch": 5551} {"train_loss": -27.173864364624023, "global_step": 460753, "epoch": 5551} {"train_loss": -26.969064712524414, "global_step": 460754, "epoch": 5551} {"train_loss": -26.953800201416016, "global_step": 460755, "epoch": 5551} {"train_loss": -27.26995849609375, "global_step": 460756, "epoch": 5551} {"train_loss": -27.27675437927246, "global_step": 460757, "epoch": 5551} {"train_loss": -27.143972396850586, "global_step": 460758, "epoch": 5551} {"train_loss": -27.160541534423828, "global_step": 460759, "epoch": 5551} {"train_loss": -27.569232940673828, "global_step": 460760, "epoch": 5551} {"train_loss": -27.33578872680664, "global_step": 460761, "epoch": 5551} {"train_loss": -27.3715877532959, "global_step": 460762, "epoch": 5551} {"train_loss": -27.34574317932129, "global_step": 460763, "epoch": 5551} {"train_loss": -27.39081382751465, "global_step": 460764, "epoch": 5551} {"train_loss": -27.049951553344727, "global_step": 460765, "epoch": 5551} {"train_loss": -27.17838478088379, "global_step": 460766, "epoch": 5551} {"train_loss": -27.23219108581543, "global_step": 460767, "epoch": 5551} {"train_loss": -27.086669921875, "global_step": 460768, "epoch": 5551} {"train_loss": -27.58455467224121, "global_step": 460769, "epoch": 5551} {"train_loss": -27.133563995361328, "global_step": 460770, "epoch": 5551} {"train_loss": -27.234769821166992, "global_step": 460771, "epoch": 5551} {"train_loss": -27.49774169921875, "global_step": 460772, "epoch": 5551} {"train_loss": -27.2072811126709, "global_step": 460773, "epoch": 5551} {"train_loss": -26.939054489135742, "global_step": 460774, "epoch": 5551} {"train_loss": -27.011615753173828, "global_step": 460775, "epoch": 5551} {"train_loss": -27.5344181060791, "global_step": 460776, "epoch": 5551} {"train_loss": -27.39204216003418, "global_step": 460777, "epoch": 5551} {"train_loss": -26.9349422454834, "global_step": 460778, "epoch": 5551} {"train_loss": -27.055927276611328, "global_step": 460779, "epoch": 5551} {"train_loss": -26.849353790283203, "global_step": 460780, "epoch": 5551} {"train_loss": -26.6732120513916, "global_step": 460781, "epoch": 5551} {"train_loss": -26.176197052001953, "global_step": 460782, "epoch": 5551} {"train_loss": -26.1719913482666, "global_step": 460783, "epoch": 5551} {"train_loss": -26.19965171813965, "global_step": 460784, "epoch": 5551} {"train_loss": -26.72125244140625, "global_step": 460785, "epoch": 5551} {"train_loss": -26.8902530670166, "global_step": 460786, "epoch": 5551} {"train_loss": -26.23398780822754, "global_step": 460787, "epoch": 5551} {"train_loss": -26.644855499267578, "global_step": 460788, "epoch": 5551} {"train_loss": -27.01826286315918, "global_step": 460789, "epoch": 5551} {"train_loss": -27.176233291625977, "global_step": 460790, "epoch": 5551} {"train_loss": -26.871875762939453, "global_step": 460791, "epoch": 5551} {"train_loss": -27.08737564086914, "global_step": 460792, "epoch": 5551} {"train_loss": -27.250730514526367, "global_step": 460793, "epoch": 5551} {"train_loss": -27.56477928161621, "global_step": 460794, "epoch": 5551} {"train_loss": -27.00678825378418, "global_step": 460795, "epoch": 5551} {"train_loss": -26.825942993164062, "global_step": 460796, "epoch": 5551} {"train_loss": -26.920276641845703, "global_step": 460797, "epoch": 5551} {"train_loss": -26.889209747314453, "global_step": 460798, "epoch": 5551} {"train_loss": -27.17884635925293, "global_step": 460799, "epoch": 5551} {"train_loss": -27.153783798217773, "global_step": 460800, "epoch": 5551} {"train_loss": -26.944808959960938, "global_step": 460801, "epoch": 5551} {"train_loss": -27.123395919799805, "global_step": 460802, "epoch": 5551} {"train_loss": -27.095930099487305, "global_step": 460803, "epoch": 5551} {"train_loss": -27.1080265045166, "global_step": 460804, "epoch": 5551} {"train_loss": -26.9702091217041, "global_step": 460805, "epoch": 5551} {"train_loss": -27.066970825195312, "global_step": 460806, "epoch": 5551} {"train_loss": -27.187652587890625, "global_step": 460807, "epoch": 5551} {"train_loss": -26.776647567749023, "global_step": 460808, "epoch": 5551} {"train_loss": -27.152921676635742, "global_step": 460809, "epoch": 5551} {"train_loss": -27.082014083862305, "global_step": 460810, "epoch": 5551} {"train_loss": -27.419015884399414, "global_step": 460811, "epoch": 5551} {"train_loss": -27.303449630737305, "global_step": 460812, "epoch": 5551} {"train_loss": -27.414356231689453, "global_step": 460813, "epoch": 5551} {"train_loss": -27.37324333190918, "global_step": 460814, "epoch": 5551} {"train_loss": -27.056329060749835, "global_step": 460815, "epoch": 5551, "val_loss": 6560359.5} {"train_loss": -26.597095489501953, "global_step": 460816, "epoch": 5552} {"train_loss": -27.244787216186523, "global_step": 460817, "epoch": 5552} {"train_loss": -26.971439361572266, "global_step": 460818, "epoch": 5552} {"train_loss": -27.121381759643555, "global_step": 460819, "epoch": 5552} {"train_loss": -26.63691520690918, "global_step": 460820, "epoch": 5552} {"train_loss": -26.63056755065918, "global_step": 460821, "epoch": 5552} {"train_loss": -26.939428329467773, "global_step": 460822, "epoch": 5552} {"train_loss": -27.14935302734375, "global_step": 460823, "epoch": 5552} {"train_loss": -26.90891456604004, "global_step": 460824, "epoch": 5552} {"train_loss": -26.93779945373535, "global_step": 460825, "epoch": 5552} {"train_loss": -26.879011154174805, "global_step": 460826, "epoch": 5552} {"train_loss": -26.9412899017334, "global_step": 460827, "epoch": 5552} {"train_loss": -26.950061798095703, "global_step": 460828, "epoch": 5552} {"train_loss": -27.058069229125977, "global_step": 460829, "epoch": 5552} {"train_loss": -27.138671875, "global_step": 460830, "epoch": 5552} {"train_loss": -27.02131462097168, "global_step": 460831, "epoch": 5552} {"train_loss": -26.76002311706543, "global_step": 460832, "epoch": 5552} {"train_loss": -27.077741622924805, "global_step": 460833, "epoch": 5552} {"train_loss": -27.259366989135742, "global_step": 460834, "epoch": 5552} {"train_loss": -27.074935913085938, "global_step": 460835, "epoch": 5552} {"train_loss": -26.825942993164062, "global_step": 460836, "epoch": 5552} {"train_loss": -27.120651245117188, "global_step": 460837, "epoch": 5552} {"train_loss": -27.083372116088867, "global_step": 460838, "epoch": 5552} {"train_loss": -26.871597290039062, "global_step": 460839, "epoch": 5552} {"train_loss": -27.0114803314209, "global_step": 460840, "epoch": 5552} {"train_loss": -27.270355224609375, "global_step": 460841, "epoch": 5552} {"train_loss": -26.348325729370117, "global_step": 460842, "epoch": 5552} {"train_loss": -26.918622970581055, "global_step": 460843, "epoch": 5552} {"train_loss": -27.108203887939453, "global_step": 460844, "epoch": 5552} {"train_loss": -26.94399070739746, "global_step": 460845, "epoch": 5552} {"train_loss": -26.7391414642334, "global_step": 460846, "epoch": 5552} {"train_loss": -27.108137130737305, "global_step": 460847, "epoch": 5552} {"train_loss": -26.8828125, "global_step": 460848, "epoch": 5552} {"train_loss": -27.19817543029785, "global_step": 460849, "epoch": 5552} {"train_loss": -27.08782958984375, "global_step": 460850, "epoch": 5552} {"train_loss": -26.67302894592285, "global_step": 460851, "epoch": 5552} {"train_loss": -27.246124267578125, "global_step": 460852, "epoch": 5552} {"train_loss": -27.109262466430664, "global_step": 460853, "epoch": 5552} {"train_loss": -26.864871978759766, "global_step": 460854, "epoch": 5552} {"train_loss": -27.152759552001953, "global_step": 460855, "epoch": 5552} {"train_loss": -27.021804809570312, "global_step": 460856, "epoch": 5552} {"train_loss": -27.142044067382812, "global_step": 460857, "epoch": 5552} {"train_loss": -27.313983917236328, "global_step": 460858, "epoch": 5552} {"train_loss": -26.820209503173828, "global_step": 460859, "epoch": 5552} {"train_loss": -27.388254165649414, "global_step": 460860, "epoch": 5552} {"train_loss": -26.891468048095703, "global_step": 460861, "epoch": 5552} {"train_loss": -26.592426300048828, "global_step": 460862, "epoch": 5552} {"train_loss": -27.075345993041992, "global_step": 460863, "epoch": 5552} {"train_loss": -27.026615142822266, "global_step": 460864, "epoch": 5552} {"train_loss": -26.588287353515625, "global_step": 460865, "epoch": 5552} {"train_loss": -27.268096923828125, "global_step": 460866, "epoch": 5552} {"train_loss": -27.0510311126709, "global_step": 460867, "epoch": 5552} {"train_loss": -26.623889923095703, "global_step": 460868, "epoch": 5552} {"train_loss": -26.980573654174805, "global_step": 460869, "epoch": 5552} {"train_loss": -26.84016227722168, "global_step": 460870, "epoch": 5552} {"train_loss": -27.28316307067871, "global_step": 460871, "epoch": 5552} {"train_loss": -26.948898315429688, "global_step": 460872, "epoch": 5552} {"train_loss": -26.8583927154541, "global_step": 460873, "epoch": 5552} {"train_loss": -26.665964126586914, "global_step": 460874, "epoch": 5552} {"train_loss": -27.153661727905273, "global_step": 460875, "epoch": 5552} {"train_loss": -26.98163414001465, "global_step": 460876, "epoch": 5552} {"train_loss": -26.985082626342773, "global_step": 460877, "epoch": 5552} {"train_loss": -26.958724975585938, "global_step": 460878, "epoch": 5552} {"train_loss": -27.252582550048828, "global_step": 460879, "epoch": 5552} {"train_loss": -27.03577995300293, "global_step": 460880, "epoch": 5552} {"train_loss": -26.94297218322754, "global_step": 460881, "epoch": 5552} {"train_loss": -26.850976943969727, "global_step": 460882, "epoch": 5552} {"train_loss": -27.279972076416016, "global_step": 460883, "epoch": 5552} {"train_loss": -26.668460845947266, "global_step": 460884, "epoch": 5552} {"train_loss": -26.971527099609375, "global_step": 460885, "epoch": 5552} {"train_loss": -27.226760864257812, "global_step": 460886, "epoch": 5552} {"train_loss": -27.10087013244629, "global_step": 460887, "epoch": 5552} {"train_loss": -26.95194435119629, "global_step": 460888, "epoch": 5552} {"train_loss": -26.632064819335938, "global_step": 460889, "epoch": 5552} {"train_loss": -26.73162841796875, "global_step": 460890, "epoch": 5552} {"train_loss": -26.652191162109375, "global_step": 460891, "epoch": 5552} {"train_loss": -27.076568603515625, "global_step": 460892, "epoch": 5552} {"train_loss": -26.772754669189453, "global_step": 460893, "epoch": 5552} {"train_loss": -27.277454376220703, "global_step": 460894, "epoch": 5552} {"train_loss": -27.087848663330078, "global_step": 460895, "epoch": 5552} {"train_loss": -26.96125602722168, "global_step": 460896, "epoch": 5552} {"train_loss": -27.066572189331055, "global_step": 460897, "epoch": 5552} {"train_loss": -26.986407360398626, "global_step": 460898, "epoch": 5552, "val_loss": 6478870.0} {"train_loss": -26.362646102905273, "global_step": 460899, "epoch": 5553} {"train_loss": -26.788793563842773, "global_step": 460900, "epoch": 5553} {"train_loss": -26.24476432800293, "global_step": 460901, "epoch": 5553} {"train_loss": -26.186216354370117, "global_step": 460902, "epoch": 5553} {"train_loss": -27.305749893188477, "global_step": 460903, "epoch": 5553} {"train_loss": -26.83038330078125, "global_step": 460904, "epoch": 5553} {"train_loss": -26.64052391052246, "global_step": 460905, "epoch": 5553} {"train_loss": -26.7340030670166, "global_step": 460906, "epoch": 5553} {"train_loss": -26.712814331054688, "global_step": 460907, "epoch": 5553} {"train_loss": -26.410175323486328, "global_step": 460908, "epoch": 5553} {"train_loss": -26.55055046081543, "global_step": 460909, "epoch": 5553} {"train_loss": -26.21270751953125, "global_step": 460910, "epoch": 5553} {"train_loss": -26.476499557495117, "global_step": 460911, "epoch": 5553} {"train_loss": -26.780786514282227, "global_step": 460912, "epoch": 5553} {"train_loss": -26.62640953063965, "global_step": 460913, "epoch": 5553} {"train_loss": -26.55230712890625, "global_step": 460914, "epoch": 5553} {"train_loss": -26.926034927368164, "global_step": 460915, "epoch": 5553} {"train_loss": -27.05368423461914, "global_step": 460916, "epoch": 5553} {"train_loss": -26.44025230407715, "global_step": 460917, "epoch": 5553} {"train_loss": -26.916339874267578, "global_step": 460918, "epoch": 5553} {"train_loss": -26.970426559448242, "global_step": 460919, "epoch": 5553} {"train_loss": -26.79734230041504, "global_step": 460920, "epoch": 5553} {"train_loss": -26.708984375, "global_step": 460921, "epoch": 5553} {"train_loss": -27.066852569580078, "global_step": 460922, "epoch": 5553} {"train_loss": -27.056760787963867, "global_step": 460923, "epoch": 5553} {"train_loss": -26.562793731689453, "global_step": 460924, "epoch": 5553} {"train_loss": -27.05449867248535, "global_step": 460925, "epoch": 5553} {"train_loss": -27.124042510986328, "global_step": 460926, "epoch": 5553} {"train_loss": -26.91451072692871, "global_step": 460927, "epoch": 5553} {"train_loss": -27.319629669189453, "global_step": 460928, "epoch": 5553} {"train_loss": -26.7690486907959, "global_step": 460929, "epoch": 5553} {"train_loss": -26.929712295532227, "global_step": 460930, "epoch": 5553} {"train_loss": -27.422033309936523, "global_step": 460931, "epoch": 5553} {"train_loss": -26.996179580688477, "global_step": 460932, "epoch": 5553} {"train_loss": -27.040449142456055, "global_step": 460933, "epoch": 5553} {"train_loss": -27.20920181274414, "global_step": 460934, "epoch": 5553} {"train_loss": -27.265539169311523, "global_step": 460935, "epoch": 5553} {"train_loss": -27.15089988708496, "global_step": 460936, "epoch": 5553} {"train_loss": -26.824350357055664, "global_step": 460937, "epoch": 5553} {"train_loss": -26.885299682617188, "global_step": 460938, "epoch": 5553} {"train_loss": -27.294509887695312, "global_step": 460939, "epoch": 5553} {"train_loss": -26.971166610717773, "global_step": 460940, "epoch": 5553} {"train_loss": -27.191593170166016, "global_step": 460941, "epoch": 5553} {"train_loss": -27.43073081970215, "global_step": 460942, "epoch": 5553} {"train_loss": -27.102279663085938, "global_step": 460943, "epoch": 5553} {"train_loss": -27.276321411132812, "global_step": 460944, "epoch": 5553} {"train_loss": -27.43000602722168, "global_step": 460945, "epoch": 5553} {"train_loss": -27.12574577331543, "global_step": 460946, "epoch": 5553} {"train_loss": -26.89362144470215, "global_step": 460947, "epoch": 5553} {"train_loss": -26.867368698120117, "global_step": 460948, "epoch": 5553} {"train_loss": -27.30414390563965, "global_step": 460949, "epoch": 5553} {"train_loss": -27.354196548461914, "global_step": 460950, "epoch": 5553} {"train_loss": -27.303302764892578, "global_step": 460951, "epoch": 5553} {"train_loss": -27.3642578125, "global_step": 460952, "epoch": 5553} {"train_loss": -26.8035831451416, "global_step": 460953, "epoch": 5553} {"train_loss": -27.13934898376465, "global_step": 460954, "epoch": 5553} {"train_loss": -26.930862426757812, "global_step": 460955, "epoch": 5553} {"train_loss": -27.32050132751465, "global_step": 460956, "epoch": 5553} {"train_loss": -26.8271427154541, "global_step": 460957, "epoch": 5553} {"train_loss": -26.934301376342773, "global_step": 460958, "epoch": 5553} {"train_loss": -26.86672019958496, "global_step": 460959, "epoch": 5553} {"train_loss": -27.166791915893555, "global_step": 460960, "epoch": 5553} {"train_loss": -26.801177978515625, "global_step": 460961, "epoch": 5553} {"train_loss": -27.357040405273438, "global_step": 460962, "epoch": 5553} {"train_loss": -27.265228271484375, "global_step": 460963, "epoch": 5553} {"train_loss": -27.26422119140625, "global_step": 460964, "epoch": 5553} {"train_loss": -27.301822662353516, "global_step": 460965, "epoch": 5553} {"train_loss": -27.040231704711914, "global_step": 460966, "epoch": 5553} {"train_loss": -27.21742057800293, "global_step": 460967, "epoch": 5553} {"train_loss": -27.22675132751465, "global_step": 460968, "epoch": 5553} {"train_loss": -26.903594970703125, "global_step": 460969, "epoch": 5553} {"train_loss": -27.265607833862305, "global_step": 460970, "epoch": 5553} {"train_loss": -27.055517196655273, "global_step": 460971, "epoch": 5553} {"train_loss": -26.964569091796875, "global_step": 460972, "epoch": 5553} {"train_loss": -26.8690128326416, "global_step": 460973, "epoch": 5553} {"train_loss": -27.256986618041992, "global_step": 460974, "epoch": 5553} {"train_loss": -27.144134521484375, "global_step": 460975, "epoch": 5553} {"train_loss": -27.11896324157715, "global_step": 460976, "epoch": 5553} {"train_loss": -27.123126983642578, "global_step": 460977, "epoch": 5553} {"train_loss": -27.098066329956055, "global_step": 460978, "epoch": 5553} {"train_loss": -27.065174102783203, "global_step": 460979, "epoch": 5553} {"train_loss": -27.363800048828125, "global_step": 460980, "epoch": 5553} {"train_loss": -26.979117933526098, "global_step": 460981, "epoch": 5553, "val_loss": 6544021.0} {"train_loss": -26.26531410217285, "global_step": 460982, "epoch": 5554} {"train_loss": -26.22417640686035, "global_step": 460983, "epoch": 5554} {"train_loss": -26.717992782592773, "global_step": 460984, "epoch": 5554} {"train_loss": -25.639440536499023, "global_step": 460985, "epoch": 5554} {"train_loss": -26.340879440307617, "global_step": 460986, "epoch": 5554} {"train_loss": -26.319345474243164, "global_step": 460987, "epoch": 5554} {"train_loss": -26.259790420532227, "global_step": 460988, "epoch": 5554} {"train_loss": -26.799924850463867, "global_step": 460989, "epoch": 5554} {"train_loss": -26.611616134643555, "global_step": 460990, "epoch": 5554} {"train_loss": -27.243499755859375, "global_step": 460991, "epoch": 5554} {"train_loss": -26.820749282836914, "global_step": 460992, "epoch": 5554} {"train_loss": -26.755849838256836, "global_step": 460993, "epoch": 5554} {"train_loss": -26.724897384643555, "global_step": 460994, "epoch": 5554} {"train_loss": -26.55103874206543, "global_step": 460995, "epoch": 5554} {"train_loss": -26.957815170288086, "global_step": 460996, "epoch": 5554} {"train_loss": -27.110733032226562, "global_step": 460997, "epoch": 5554} {"train_loss": -27.079315185546875, "global_step": 460998, "epoch": 5554} {"train_loss": -26.855915069580078, "global_step": 460999, "epoch": 5554} {"train_loss": -27.06572914123535, "global_step": 461000, "epoch": 5554} {"train_loss": -26.70094108581543, "global_step": 461001, "epoch": 5554} {"train_loss": -26.935577392578125, "global_step": 461002, "epoch": 5554} {"train_loss": -26.7657527923584, "global_step": 461003, "epoch": 5554} {"train_loss": -26.76995849609375, "global_step": 461004, "epoch": 5554} {"train_loss": -27.369226455688477, "global_step": 461005, "epoch": 5554} {"train_loss": -27.022974014282227, "global_step": 461006, "epoch": 5554} {"train_loss": -27.181577682495117, "global_step": 461007, "epoch": 5554} {"train_loss": -27.17127799987793, "global_step": 461008, "epoch": 5554} {"train_loss": -27.21242332458496, "global_step": 461009, "epoch": 5554} {"train_loss": -27.00788688659668, "global_step": 461010, "epoch": 5554} {"train_loss": -26.863752365112305, "global_step": 461011, "epoch": 5554} {"train_loss": -26.8934383392334, "global_step": 461012, "epoch": 5554} {"train_loss": -27.190717697143555, "global_step": 461013, "epoch": 5554} {"train_loss": -27.530359268188477, "global_step": 461014, "epoch": 5554} {"train_loss": -27.416614532470703, "global_step": 461015, "epoch": 5554} {"train_loss": -27.54510498046875, "global_step": 461016, "epoch": 5554} {"train_loss": -27.19144630432129, "global_step": 461017, "epoch": 5554} {"train_loss": -27.372495651245117, "global_step": 461018, "epoch": 5554} {"train_loss": -27.2927188873291, "global_step": 461019, "epoch": 5554} {"train_loss": -27.16031837463379, "global_step": 461020, "epoch": 5554} {"train_loss": -27.5835018157959, "global_step": 461021, "epoch": 5554} {"train_loss": -26.718046188354492, "global_step": 461022, "epoch": 5554} {"train_loss": -27.400007247924805, "global_step": 461023, "epoch": 5554} {"train_loss": -27.040021896362305, "global_step": 461024, "epoch": 5554} {"train_loss": -27.215307235717773, "global_step": 461025, "epoch": 5554} {"train_loss": -27.25689125061035, "global_step": 461026, "epoch": 5554} {"train_loss": -27.1390323638916, "global_step": 461027, "epoch": 5554} {"train_loss": -27.21295166015625, "global_step": 461028, "epoch": 5554} {"train_loss": -27.441024780273438, "global_step": 461029, "epoch": 5554} {"train_loss": -27.613515853881836, "global_step": 461030, "epoch": 5554} {"train_loss": -27.053083419799805, "global_step": 461031, "epoch": 5554} {"train_loss": -27.10187339782715, "global_step": 461032, "epoch": 5554} {"train_loss": -26.994098663330078, "global_step": 461033, "epoch": 5554} {"train_loss": -27.201568603515625, "global_step": 461034, "epoch": 5554} {"train_loss": -27.159671783447266, "global_step": 461035, "epoch": 5554} {"train_loss": -26.76148796081543, "global_step": 461036, "epoch": 5554} {"train_loss": -26.437458038330078, "global_step": 461037, "epoch": 5554} {"train_loss": -25.34694480895996, "global_step": 461038, "epoch": 5554} {"train_loss": -24.845796585083008, "global_step": 461039, "epoch": 5554} {"train_loss": -25.740360260009766, "global_step": 461040, "epoch": 5554} {"train_loss": -25.95077896118164, "global_step": 461041, "epoch": 5554} {"train_loss": -26.48429298400879, "global_step": 461042, "epoch": 5554} {"train_loss": -26.40618324279785, "global_step": 461043, "epoch": 5554} {"train_loss": -26.314905166625977, "global_step": 461044, "epoch": 5554} {"train_loss": -26.8831787109375, "global_step": 461045, "epoch": 5554} {"train_loss": -26.447723388671875, "global_step": 461046, "epoch": 5554} {"train_loss": -26.5931396484375, "global_step": 461047, "epoch": 5554} {"train_loss": -27.12981605529785, "global_step": 461048, "epoch": 5554} {"train_loss": -26.467557907104492, "global_step": 461049, "epoch": 5554} {"train_loss": -27.156904220581055, "global_step": 461050, "epoch": 5554} {"train_loss": -27.044239044189453, "global_step": 461051, "epoch": 5554} {"train_loss": -27.12738609313965, "global_step": 461052, "epoch": 5554} {"train_loss": -27.014135360717773, "global_step": 461053, "epoch": 5554} {"train_loss": -26.712696075439453, "global_step": 461054, "epoch": 5554} {"train_loss": -27.158666610717773, "global_step": 461055, "epoch": 5554} {"train_loss": -26.99470329284668, "global_step": 461056, "epoch": 5554} {"train_loss": -27.11250877380371, "global_step": 461057, "epoch": 5554} {"train_loss": -26.79974365234375, "global_step": 461058, "epoch": 5554} {"train_loss": -26.906570434570312, "global_step": 461059, "epoch": 5554} {"train_loss": -27.086334228515625, "global_step": 461060, "epoch": 5554} {"train_loss": -27.13397216796875, "global_step": 461061, "epoch": 5554} {"train_loss": -27.091934204101562, "global_step": 461062, "epoch": 5554} {"train_loss": -27.100107192993164, "global_step": 461063, "epoch": 5554} {"train_loss": -26.88355397603598, "global_step": 461064, "epoch": 5554, "val_loss": 6560434.0} {"train_loss": -27.032617568969727, "global_step": 461065, "epoch": 5555} {"train_loss": -27.09619140625, "global_step": 461066, "epoch": 5555} {"train_loss": -27.109683990478516, "global_step": 461067, "epoch": 5555} {"train_loss": -27.022497177124023, "global_step": 461068, "epoch": 5555} {"train_loss": -27.087696075439453, "global_step": 461069, "epoch": 5555} {"train_loss": -27.164291381835938, "global_step": 461070, "epoch": 5555} {"train_loss": -27.159269332885742, "global_step": 461071, "epoch": 5555} {"train_loss": -27.034473419189453, "global_step": 461072, "epoch": 5555} {"train_loss": -27.05328941345215, "global_step": 461073, "epoch": 5555} {"train_loss": -26.903722763061523, "global_step": 461074, "epoch": 5555} {"train_loss": -27.100614547729492, "global_step": 461075, "epoch": 5555} {"train_loss": -27.28765296936035, "global_step": 461076, "epoch": 5555} {"train_loss": -27.302459716796875, "global_step": 461077, "epoch": 5555} {"train_loss": -27.073856353759766, "global_step": 461078, "epoch": 5555} {"train_loss": -27.27511978149414, "global_step": 461079, "epoch": 5555} {"train_loss": -27.12086296081543, "global_step": 461080, "epoch": 5555} {"train_loss": -27.264480590820312, "global_step": 461081, "epoch": 5555} {"train_loss": -27.272125244140625, "global_step": 461082, "epoch": 5555} {"train_loss": -26.88165283203125, "global_step": 461083, "epoch": 5555} {"train_loss": -27.054319381713867, "global_step": 461084, "epoch": 5555} {"train_loss": -27.153793334960938, "global_step": 461085, "epoch": 5555} {"train_loss": -27.0133056640625, "global_step": 461086, "epoch": 5555} {"train_loss": -27.117767333984375, "global_step": 461087, "epoch": 5555} {"train_loss": -27.2454891204834, "global_step": 461088, "epoch": 5555} {"train_loss": -27.35272789001465, "global_step": 461089, "epoch": 5555} {"train_loss": -27.555255889892578, "global_step": 461090, "epoch": 5555} {"train_loss": -27.392704010009766, "global_step": 461091, "epoch": 5555} {"train_loss": -27.320465087890625, "global_step": 461092, "epoch": 5555} {"train_loss": -27.40028190612793, "global_step": 461093, "epoch": 5555} {"train_loss": -27.051557540893555, "global_step": 461094, "epoch": 5555} {"train_loss": -27.387479782104492, "global_step": 461095, "epoch": 5555} {"train_loss": -26.746896743774414, "global_step": 461096, "epoch": 5555} {"train_loss": -26.904834747314453, "global_step": 461097, "epoch": 5555} {"train_loss": -26.283843994140625, "global_step": 461098, "epoch": 5555} {"train_loss": -26.32228660583496, "global_step": 461099, "epoch": 5555} {"train_loss": -26.956317901611328, "global_step": 461100, "epoch": 5555} {"train_loss": -27.14866065979004, "global_step": 461101, "epoch": 5555} {"train_loss": -27.08624267578125, "global_step": 461102, "epoch": 5555} {"train_loss": -26.8602237701416, "global_step": 461103, "epoch": 5555} {"train_loss": -26.80158805847168, "global_step": 461104, "epoch": 5555} {"train_loss": -27.16473388671875, "global_step": 461105, "epoch": 5555} {"train_loss": -27.372365951538086, "global_step": 461106, "epoch": 5555} {"train_loss": -27.265100479125977, "global_step": 461107, "epoch": 5555} {"train_loss": -27.123437881469727, "global_step": 461108, "epoch": 5555} {"train_loss": -27.14568519592285, "global_step": 461109, "epoch": 5555} {"train_loss": -27.067428588867188, "global_step": 461110, "epoch": 5555} {"train_loss": -26.861835479736328, "global_step": 461111, "epoch": 5555} {"train_loss": -26.517541885375977, "global_step": 461112, "epoch": 5555} {"train_loss": -26.65577507019043, "global_step": 461113, "epoch": 5555} {"train_loss": -26.91379165649414, "global_step": 461114, "epoch": 5555} {"train_loss": -27.03423500061035, "global_step": 461115, "epoch": 5555} {"train_loss": -27.243268966674805, "global_step": 461116, "epoch": 5555} {"train_loss": -27.31182289123535, "global_step": 461117, "epoch": 5555} {"train_loss": -27.45757484436035, "global_step": 461118, "epoch": 5555} {"train_loss": -26.739368438720703, "global_step": 461119, "epoch": 5555} {"train_loss": -27.08426284790039, "global_step": 461120, "epoch": 5555} {"train_loss": -26.9823055267334, "global_step": 461121, "epoch": 5555} {"train_loss": -27.068222045898438, "global_step": 461122, "epoch": 5555} {"train_loss": -26.926191329956055, "global_step": 461123, "epoch": 5555} {"train_loss": -26.89471435546875, "global_step": 461124, "epoch": 5555} {"train_loss": -27.10153579711914, "global_step": 461125, "epoch": 5555} {"train_loss": -27.174768447875977, "global_step": 461126, "epoch": 5555} {"train_loss": -27.133554458618164, "global_step": 461127, "epoch": 5555} {"train_loss": -27.01637077331543, "global_step": 461128, "epoch": 5555} {"train_loss": -27.31793212890625, "global_step": 461129, "epoch": 5555} {"train_loss": -27.00250816345215, "global_step": 461130, "epoch": 5555} {"train_loss": -27.122201919555664, "global_step": 461131, "epoch": 5555} {"train_loss": -27.264257431030273, "global_step": 461132, "epoch": 5555} {"train_loss": -27.014652252197266, "global_step": 461133, "epoch": 5555} {"train_loss": -26.768903732299805, "global_step": 461134, "epoch": 5555} {"train_loss": -26.794485092163086, "global_step": 461135, "epoch": 5555} {"train_loss": -26.880462646484375, "global_step": 461136, "epoch": 5555} {"train_loss": -27.018238067626953, "global_step": 461137, "epoch": 5555} {"train_loss": -27.15118980407715, "global_step": 461138, "epoch": 5555} {"train_loss": -26.497455596923828, "global_step": 461139, "epoch": 5555} {"train_loss": -26.69154167175293, "global_step": 461140, "epoch": 5555} {"train_loss": -26.4464168548584, "global_step": 461141, "epoch": 5555} {"train_loss": -26.816335678100586, "global_step": 461142, "epoch": 5555} {"train_loss": -27.066619873046875, "global_step": 461143, "epoch": 5555} {"train_loss": -26.821699142456055, "global_step": 461144, "epoch": 5555} {"train_loss": -26.885305404663086, "global_step": 461145, "epoch": 5555} {"train_loss": -26.767719268798828, "global_step": 461146, "epoch": 5555} {"train_loss": -27.053652545055712, "global_step": 461147, "epoch": 5555, "val_loss": 6479003.0} {"train_loss": -25.944379806518555, "global_step": 461148, "epoch": 5556} {"train_loss": -25.948455810546875, "global_step": 461149, "epoch": 5556} {"train_loss": -26.40386962890625, "global_step": 461150, "epoch": 5556} {"train_loss": -26.393423080444336, "global_step": 461151, "epoch": 5556} {"train_loss": -26.264862060546875, "global_step": 461152, "epoch": 5556} {"train_loss": -26.909635543823242, "global_step": 461153, "epoch": 5556} {"train_loss": -26.129261016845703, "global_step": 461154, "epoch": 5556} {"train_loss": -26.41326904296875, "global_step": 461155, "epoch": 5556} {"train_loss": -26.586029052734375, "global_step": 461156, "epoch": 5556} {"train_loss": -26.485855102539062, "global_step": 461157, "epoch": 5556} {"train_loss": -26.37676429748535, "global_step": 461158, "epoch": 5556} {"train_loss": -26.41814613342285, "global_step": 461159, "epoch": 5556} {"train_loss": -26.595014572143555, "global_step": 461160, "epoch": 5556} {"train_loss": -26.675817489624023, "global_step": 461161, "epoch": 5556} {"train_loss": -26.850889205932617, "global_step": 461162, "epoch": 5556} {"train_loss": -26.49790382385254, "global_step": 461163, "epoch": 5556} {"train_loss": -26.984283447265625, "global_step": 461164, "epoch": 5556} {"train_loss": -26.647119522094727, "global_step": 461165, "epoch": 5556} {"train_loss": -26.536725997924805, "global_step": 461166, "epoch": 5556} {"train_loss": -26.78672218322754, "global_step": 461167, "epoch": 5556} {"train_loss": -27.35883903503418, "global_step": 461168, "epoch": 5556} {"train_loss": -26.98420524597168, "global_step": 461169, "epoch": 5556} {"train_loss": -26.85711669921875, "global_step": 461170, "epoch": 5556} {"train_loss": -27.14851188659668, "global_step": 461171, "epoch": 5556} {"train_loss": -26.853759765625, "global_step": 461172, "epoch": 5556} {"train_loss": -27.098682403564453, "global_step": 461173, "epoch": 5556} {"train_loss": -27.019336700439453, "global_step": 461174, "epoch": 5556} {"train_loss": -27.01299476623535, "global_step": 461175, "epoch": 5556} {"train_loss": -27.30060386657715, "global_step": 461176, "epoch": 5556} {"train_loss": -27.035810470581055, "global_step": 461177, "epoch": 5556} {"train_loss": -27.159997940063477, "global_step": 461178, "epoch": 5556} {"train_loss": -27.15846061706543, "global_step": 461179, "epoch": 5556} {"train_loss": -27.02210807800293, "global_step": 461180, "epoch": 5556} {"train_loss": -27.208837509155273, "global_step": 461181, "epoch": 5556} {"train_loss": -27.109968185424805, "global_step": 461182, "epoch": 5556} {"train_loss": -27.355316162109375, "global_step": 461183, "epoch": 5556} {"train_loss": -27.597082138061523, "global_step": 461184, "epoch": 5556} {"train_loss": -26.9757080078125, "global_step": 461185, "epoch": 5556} {"train_loss": -27.159631729125977, "global_step": 461186, "epoch": 5556} {"train_loss": -27.191259384155273, "global_step": 461187, "epoch": 5556} {"train_loss": -27.280858993530273, "global_step": 461188, "epoch": 5556} {"train_loss": -27.235523223876953, "global_step": 461189, "epoch": 5556} {"train_loss": -27.331029891967773, "global_step": 461190, "epoch": 5556} {"train_loss": -27.24262046813965, "global_step": 461191, "epoch": 5556} {"train_loss": -27.027313232421875, "global_step": 461192, "epoch": 5556} {"train_loss": -27.268075942993164, "global_step": 461193, "epoch": 5556} {"train_loss": -26.955663681030273, "global_step": 461194, "epoch": 5556} {"train_loss": -27.15655517578125, "global_step": 461195, "epoch": 5556} {"train_loss": -27.0843448638916, "global_step": 461196, "epoch": 5556} {"train_loss": -27.495758056640625, "global_step": 461197, "epoch": 5556} {"train_loss": -27.200483322143555, "global_step": 461198, "epoch": 5556} {"train_loss": -27.376632690429688, "global_step": 461199, "epoch": 5556} {"train_loss": -27.18694496154785, "global_step": 461200, "epoch": 5556} {"train_loss": -27.5174503326416, "global_step": 461201, "epoch": 5556} {"train_loss": -27.01958656311035, "global_step": 461202, "epoch": 5556} {"train_loss": -27.59134292602539, "global_step": 461203, "epoch": 5556} {"train_loss": -27.554121017456055, "global_step": 461204, "epoch": 5556} {"train_loss": -27.25482749938965, "global_step": 461205, "epoch": 5556} {"train_loss": -27.519901275634766, "global_step": 461206, "epoch": 5556} {"train_loss": -27.623273849487305, "global_step": 461207, "epoch": 5556} {"train_loss": -27.23752784729004, "global_step": 461208, "epoch": 5556} {"train_loss": -27.530048370361328, "global_step": 461209, "epoch": 5556} {"train_loss": -27.119321823120117, "global_step": 461210, "epoch": 5556} {"train_loss": -27.271203994750977, "global_step": 461211, "epoch": 5556} {"train_loss": -27.106000900268555, "global_step": 461212, "epoch": 5556} {"train_loss": -27.37929344177246, "global_step": 461213, "epoch": 5556} {"train_loss": -27.356464385986328, "global_step": 461214, "epoch": 5556} {"train_loss": -27.07452964782715, "global_step": 461215, "epoch": 5556} {"train_loss": -26.70551872253418, "global_step": 461216, "epoch": 5556} {"train_loss": -26.697345733642578, "global_step": 461217, "epoch": 5556} {"train_loss": -27.256637573242188, "global_step": 461218, "epoch": 5556} {"train_loss": -26.794086456298828, "global_step": 461219, "epoch": 5556} {"train_loss": -27.302261352539062, "global_step": 461220, "epoch": 5556} {"train_loss": -27.326114654541016, "global_step": 461221, "epoch": 5556} {"train_loss": -27.330602645874023, "global_step": 461222, "epoch": 5556} {"train_loss": -26.92811393737793, "global_step": 461223, "epoch": 5556} {"train_loss": -27.06927490234375, "global_step": 461224, "epoch": 5556} {"train_loss": -27.1337947845459, "global_step": 461225, "epoch": 5556} {"train_loss": -27.10918617248535, "global_step": 461226, "epoch": 5556} {"train_loss": -27.0800724029541, "global_step": 461227, "epoch": 5556} {"train_loss": -27.068021774291992, "global_step": 461228, "epoch": 5556} {"train_loss": -27.0344295501709, "global_step": 461229, "epoch": 5556} {"train_loss": -27.0276572445789, "global_step": 461230, "epoch": 5556, "val_loss": 6596147.0} {"train_loss": -27.08768653869629, "global_step": 461231, "epoch": 5557} {"train_loss": -26.434438705444336, "global_step": 461232, "epoch": 5557} {"train_loss": -26.983448028564453, "global_step": 461233, "epoch": 5557} {"train_loss": -26.478681564331055, "global_step": 461234, "epoch": 5557} {"train_loss": -26.375030517578125, "global_step": 461235, "epoch": 5557} {"train_loss": -26.47896385192871, "global_step": 461236, "epoch": 5557} {"train_loss": -26.740070343017578, "global_step": 461237, "epoch": 5557} {"train_loss": -26.840925216674805, "global_step": 461238, "epoch": 5557} {"train_loss": -26.967344284057617, "global_step": 461239, "epoch": 5557} {"train_loss": -26.882110595703125, "global_step": 461240, "epoch": 5557} {"train_loss": -27.015146255493164, "global_step": 461241, "epoch": 5557} {"train_loss": -27.25263786315918, "global_step": 461242, "epoch": 5557} {"train_loss": -26.77297019958496, "global_step": 461243, "epoch": 5557} {"train_loss": -27.233835220336914, "global_step": 461244, "epoch": 5557} {"train_loss": -26.9326229095459, "global_step": 461245, "epoch": 5557} {"train_loss": -26.477859497070312, "global_step": 461246, "epoch": 5557} {"train_loss": -26.592809677124023, "global_step": 461247, "epoch": 5557} {"train_loss": -26.794952392578125, "global_step": 461248, "epoch": 5557} {"train_loss": -27.028905868530273, "global_step": 461249, "epoch": 5557} {"train_loss": -27.14470863342285, "global_step": 461250, "epoch": 5557} {"train_loss": -27.307327270507812, "global_step": 461251, "epoch": 5557} {"train_loss": -26.770751953125, "global_step": 461252, "epoch": 5557} {"train_loss": -26.877851486206055, "global_step": 461253, "epoch": 5557} {"train_loss": -26.587915420532227, "global_step": 461254, "epoch": 5557} {"train_loss": -27.3976993560791, "global_step": 461255, "epoch": 5557} {"train_loss": -27.000696182250977, "global_step": 461256, "epoch": 5557} {"train_loss": -26.8601131439209, "global_step": 461257, "epoch": 5557} {"train_loss": -27.03651237487793, "global_step": 461258, "epoch": 5557} {"train_loss": -26.67873191833496, "global_step": 461259, "epoch": 5557} {"train_loss": -27.25873374938965, "global_step": 461260, "epoch": 5557} {"train_loss": -26.993606567382812, "global_step": 461261, "epoch": 5557} {"train_loss": -27.07818603515625, "global_step": 461262, "epoch": 5557} {"train_loss": -27.335241317749023, "global_step": 461263, "epoch": 5557} {"train_loss": -27.105670928955078, "global_step": 461264, "epoch": 5557} {"train_loss": -27.246200561523438, "global_step": 461265, "epoch": 5557} {"train_loss": -26.985754013061523, "global_step": 461266, "epoch": 5557} {"train_loss": -27.263031005859375, "global_step": 461267, "epoch": 5557} {"train_loss": -27.57425308227539, "global_step": 461268, "epoch": 5557} {"train_loss": -27.52644157409668, "global_step": 461269, "epoch": 5557} {"train_loss": -27.365615844726562, "global_step": 461270, "epoch": 5557} {"train_loss": -27.19707679748535, "global_step": 461271, "epoch": 5557} {"train_loss": -27.639606475830078, "global_step": 461272, "epoch": 5557} {"train_loss": -27.199085235595703, "global_step": 461273, "epoch": 5557} {"train_loss": -27.57642936706543, "global_step": 461274, "epoch": 5557} {"train_loss": -27.261417388916016, "global_step": 461275, "epoch": 5557} {"train_loss": -27.083499908447266, "global_step": 461276, "epoch": 5557} {"train_loss": -27.017736434936523, "global_step": 461277, "epoch": 5557} {"train_loss": -27.10261344909668, "global_step": 461278, "epoch": 5557} {"train_loss": -27.074888229370117, "global_step": 461279, "epoch": 5557} {"train_loss": -27.183979034423828, "global_step": 461280, "epoch": 5557} {"train_loss": -27.115447998046875, "global_step": 461281, "epoch": 5557} {"train_loss": -27.096704483032227, "global_step": 461282, "epoch": 5557} {"train_loss": -27.584308624267578, "global_step": 461283, "epoch": 5557} {"train_loss": -27.176767349243164, "global_step": 461284, "epoch": 5557} {"train_loss": -27.418277740478516, "global_step": 461285, "epoch": 5557} {"train_loss": -27.479694366455078, "global_step": 461286, "epoch": 5557} {"train_loss": -27.293853759765625, "global_step": 461287, "epoch": 5557} {"train_loss": -26.81195640563965, "global_step": 461288, "epoch": 5557} {"train_loss": -27.52326011657715, "global_step": 461289, "epoch": 5557} {"train_loss": -26.8011531829834, "global_step": 461290, "epoch": 5557} {"train_loss": -27.030353546142578, "global_step": 461291, "epoch": 5557} {"train_loss": -26.690107345581055, "global_step": 461292, "epoch": 5557} {"train_loss": -26.770263671875, "global_step": 461293, "epoch": 5557} {"train_loss": -27.41599464416504, "global_step": 461294, "epoch": 5557} {"train_loss": -26.812253952026367, "global_step": 461295, "epoch": 5557} {"train_loss": -27.161014556884766, "global_step": 461296, "epoch": 5557} {"train_loss": -26.746557235717773, "global_step": 461297, "epoch": 5557} {"train_loss": -27.06947898864746, "global_step": 461298, "epoch": 5557} {"train_loss": -26.652414321899414, "global_step": 461299, "epoch": 5557} {"train_loss": -27.048553466796875, "global_step": 461300, "epoch": 5557} {"train_loss": -26.58356285095215, "global_step": 461301, "epoch": 5557} {"train_loss": -26.60221290588379, "global_step": 461302, "epoch": 5557} {"train_loss": -26.64400291442871, "global_step": 461303, "epoch": 5557} {"train_loss": -27.0642032623291, "global_step": 461304, "epoch": 5557} {"train_loss": -26.89444923400879, "global_step": 461305, "epoch": 5557} {"train_loss": -26.761234283447266, "global_step": 461306, "epoch": 5557} {"train_loss": -27.173919677734375, "global_step": 461307, "epoch": 5557} {"train_loss": -26.88641929626465, "global_step": 461308, "epoch": 5557} {"train_loss": -26.792505264282227, "global_step": 461309, "epoch": 5557} {"train_loss": -27.155120849609375, "global_step": 461310, "epoch": 5557} {"train_loss": -27.347009658813477, "global_step": 461311, "epoch": 5557} {"train_loss": -27.075719833374023, "global_step": 461312, "epoch": 5557} {"train_loss": -27.04381894490805, "global_step": 461313, "epoch": 5557, "val_loss": 6542998.0} {"train_loss": -26.215595245361328, "global_step": 461314, "epoch": 5558} {"train_loss": -26.496814727783203, "global_step": 461315, "epoch": 5558} {"train_loss": -26.231552124023438, "global_step": 461316, "epoch": 5558} {"train_loss": -26.47519874572754, "global_step": 461317, "epoch": 5558} {"train_loss": -26.499547958374023, "global_step": 461318, "epoch": 5558} {"train_loss": -26.277353286743164, "global_step": 461319, "epoch": 5558} {"train_loss": -26.712854385375977, "global_step": 461320, "epoch": 5558} {"train_loss": -25.98431396484375, "global_step": 461321, "epoch": 5558} {"train_loss": -26.69906997680664, "global_step": 461322, "epoch": 5558} {"train_loss": -26.461713790893555, "global_step": 461323, "epoch": 5558} {"train_loss": -27.0858097076416, "global_step": 461324, "epoch": 5558} {"train_loss": -26.709259033203125, "global_step": 461325, "epoch": 5558} {"train_loss": -27.218738555908203, "global_step": 461326, "epoch": 5558} {"train_loss": -26.629138946533203, "global_step": 461327, "epoch": 5558} {"train_loss": -27.048070907592773, "global_step": 461328, "epoch": 5558} {"train_loss": -26.564416885375977, "global_step": 461329, "epoch": 5558} {"train_loss": -26.84402847290039, "global_step": 461330, "epoch": 5558} {"train_loss": -26.63852310180664, "global_step": 461331, "epoch": 5558} {"train_loss": -26.682830810546875, "global_step": 461332, "epoch": 5558} {"train_loss": -26.500104904174805, "global_step": 461333, "epoch": 5558} {"train_loss": -26.989246368408203, "global_step": 461334, "epoch": 5558} {"train_loss": -26.717670440673828, "global_step": 461335, "epoch": 5558} {"train_loss": -26.746816635131836, "global_step": 461336, "epoch": 5558} {"train_loss": -27.186670303344727, "global_step": 461337, "epoch": 5558} {"train_loss": -26.825124740600586, "global_step": 461338, "epoch": 5558} {"train_loss": -27.361801147460938, "global_step": 461339, "epoch": 5558} {"train_loss": -26.815881729125977, "global_step": 461340, "epoch": 5558} {"train_loss": -27.248432159423828, "global_step": 461341, "epoch": 5558} {"train_loss": -26.7365779876709, "global_step": 461342, "epoch": 5558} {"train_loss": -26.568105697631836, "global_step": 461343, "epoch": 5558} {"train_loss": -27.06644630432129, "global_step": 461344, "epoch": 5558} {"train_loss": -26.896686553955078, "global_step": 461345, "epoch": 5558} {"train_loss": -26.919424057006836, "global_step": 461346, "epoch": 5558} {"train_loss": -26.958698272705078, "global_step": 461347, "epoch": 5558} {"train_loss": -26.803558349609375, "global_step": 461348, "epoch": 5558} {"train_loss": -26.809667587280273, "global_step": 461349, "epoch": 5558} {"train_loss": -27.217878341674805, "global_step": 461350, "epoch": 5558} {"train_loss": -27.061038970947266, "global_step": 461351, "epoch": 5558} {"train_loss": -27.379413604736328, "global_step": 461352, "epoch": 5558} {"train_loss": -27.05726432800293, "global_step": 461353, "epoch": 5558} {"train_loss": -26.9677791595459, "global_step": 461354, "epoch": 5558} {"train_loss": -27.194311141967773, "global_step": 461355, "epoch": 5558} {"train_loss": -26.929828643798828, "global_step": 461356, "epoch": 5558} {"train_loss": -27.178180694580078, "global_step": 461357, "epoch": 5558} {"train_loss": -27.1431941986084, "global_step": 461358, "epoch": 5558} {"train_loss": -26.983983993530273, "global_step": 461359, "epoch": 5558} {"train_loss": -27.238134384155273, "global_step": 461360, "epoch": 5558} {"train_loss": -27.392932891845703, "global_step": 461361, "epoch": 5558} {"train_loss": -27.20441246032715, "global_step": 461362, "epoch": 5558} {"train_loss": -27.37677001953125, "global_step": 461363, "epoch": 5558} {"train_loss": -27.17579460144043, "global_step": 461364, "epoch": 5558} {"train_loss": -26.989410400390625, "global_step": 461365, "epoch": 5558} {"train_loss": -27.330961227416992, "global_step": 461366, "epoch": 5558} {"train_loss": -26.882129669189453, "global_step": 461367, "epoch": 5558} {"train_loss": -26.98760414123535, "global_step": 461368, "epoch": 5558} {"train_loss": -26.727802276611328, "global_step": 461369, "epoch": 5558} {"train_loss": -26.70478630065918, "global_step": 461370, "epoch": 5558} {"train_loss": -26.811111450195312, "global_step": 461371, "epoch": 5558} {"train_loss": -26.833078384399414, "global_step": 461372, "epoch": 5558} {"train_loss": -27.00188636779785, "global_step": 461373, "epoch": 5558} {"train_loss": -26.924192428588867, "global_step": 461374, "epoch": 5558} {"train_loss": -27.030460357666016, "global_step": 461375, "epoch": 5558} {"train_loss": -26.950834274291992, "global_step": 461376, "epoch": 5558} {"train_loss": -26.917226791381836, "global_step": 461377, "epoch": 5558} {"train_loss": -27.04087257385254, "global_step": 461378, "epoch": 5558} {"train_loss": -26.72198486328125, "global_step": 461379, "epoch": 5558} {"train_loss": -27.045337677001953, "global_step": 461380, "epoch": 5558} {"train_loss": -26.580575942993164, "global_step": 461381, "epoch": 5558} {"train_loss": -27.171466827392578, "global_step": 461382, "epoch": 5558} {"train_loss": -27.054107666015625, "global_step": 461383, "epoch": 5558} {"train_loss": -26.93147850036621, "global_step": 461384, "epoch": 5558} {"train_loss": -27.23577308654785, "global_step": 461385, "epoch": 5558} {"train_loss": -27.118438720703125, "global_step": 461386, "epoch": 5558} {"train_loss": -27.255569458007812, "global_step": 461387, "epoch": 5558} {"train_loss": -26.939056396484375, "global_step": 461388, "epoch": 5558} {"train_loss": -26.885847091674805, "global_step": 461389, "epoch": 5558} {"train_loss": -27.092355728149414, "global_step": 461390, "epoch": 5558} {"train_loss": -27.399002075195312, "global_step": 461391, "epoch": 5558} {"train_loss": -26.981184005737305, "global_step": 461392, "epoch": 5558} {"train_loss": -27.24375343322754, "global_step": 461393, "epoch": 5558} {"train_loss": -27.276655197143555, "global_step": 461394, "epoch": 5558} {"train_loss": -27.242063522338867, "global_step": 461395, "epoch": 5558} {"train_loss": -26.906396957765143, "global_step": 461396, "epoch": 5558, "val_loss": 6618179.0} {"train_loss": -26.302860260009766, "global_step": 461397, "epoch": 5559} {"train_loss": -26.30209732055664, "global_step": 461398, "epoch": 5559} {"train_loss": -26.366621017456055, "global_step": 461399, "epoch": 5559} {"train_loss": -26.326562881469727, "global_step": 461400, "epoch": 5559} {"train_loss": -26.221893310546875, "global_step": 461401, "epoch": 5559} {"train_loss": -26.414505004882812, "global_step": 461402, "epoch": 5559} {"train_loss": -26.03850746154785, "global_step": 461403, "epoch": 5559} {"train_loss": -26.736133575439453, "global_step": 461404, "epoch": 5559} {"train_loss": -26.395679473876953, "global_step": 461405, "epoch": 5559} {"train_loss": -26.440261840820312, "global_step": 461406, "epoch": 5559} {"train_loss": -26.505908966064453, "global_step": 461407, "epoch": 5559} {"train_loss": -26.749902725219727, "global_step": 461408, "epoch": 5559} {"train_loss": -26.347997665405273, "global_step": 461409, "epoch": 5559} {"train_loss": -26.323532104492188, "global_step": 461410, "epoch": 5559} {"train_loss": -26.891416549682617, "global_step": 461411, "epoch": 5559} {"train_loss": -27.007312774658203, "global_step": 461412, "epoch": 5559} {"train_loss": -27.188800811767578, "global_step": 461413, "epoch": 5559} {"train_loss": -26.85816764831543, "global_step": 461414, "epoch": 5559} {"train_loss": -26.781269073486328, "global_step": 461415, "epoch": 5559} {"train_loss": -26.778783798217773, "global_step": 461416, "epoch": 5559} {"train_loss": -26.819732666015625, "global_step": 461417, "epoch": 5559} {"train_loss": -27.136444091796875, "global_step": 461418, "epoch": 5559} {"train_loss": -26.47696876525879, "global_step": 461419, "epoch": 5559} {"train_loss": -26.78496742248535, "global_step": 461420, "epoch": 5559} {"train_loss": -26.614850997924805, "global_step": 461421, "epoch": 5559} {"train_loss": -26.959537506103516, "global_step": 461422, "epoch": 5559} {"train_loss": -27.078800201416016, "global_step": 461423, "epoch": 5559} {"train_loss": -27.1507625579834, "global_step": 461424, "epoch": 5559} {"train_loss": -27.118824005126953, "global_step": 461425, "epoch": 5559} {"train_loss": -26.618452072143555, "global_step": 461426, "epoch": 5559} {"train_loss": -27.08335304260254, "global_step": 461427, "epoch": 5559} {"train_loss": -27.357425689697266, "global_step": 461428, "epoch": 5559} {"train_loss": -27.18342399597168, "global_step": 461429, "epoch": 5559} {"train_loss": -26.955066680908203, "global_step": 461430, "epoch": 5559} {"train_loss": -27.19593620300293, "global_step": 461431, "epoch": 5559} {"train_loss": -27.09271240234375, "global_step": 461432, "epoch": 5559} {"train_loss": -27.13580894470215, "global_step": 461433, "epoch": 5559} {"train_loss": -27.010000228881836, "global_step": 461434, "epoch": 5559} {"train_loss": -27.284997940063477, "global_step": 461435, "epoch": 5559} {"train_loss": -26.934249877929688, "global_step": 461436, "epoch": 5559} {"train_loss": -27.318740844726562, "global_step": 461437, "epoch": 5559} {"train_loss": -27.3330020904541, "global_step": 461438, "epoch": 5559} {"train_loss": -27.45026969909668, "global_step": 461439, "epoch": 5559} {"train_loss": -27.20265007019043, "global_step": 461440, "epoch": 5559} {"train_loss": -27.311792373657227, "global_step": 461441, "epoch": 5559} {"train_loss": -27.331640243530273, "global_step": 461442, "epoch": 5559} {"train_loss": -27.202106475830078, "global_step": 461443, "epoch": 5559} {"train_loss": -27.264551162719727, "global_step": 461444, "epoch": 5559} {"train_loss": -27.39032554626465, "global_step": 461445, "epoch": 5559} {"train_loss": -27.41377067565918, "global_step": 461446, "epoch": 5559} {"train_loss": -27.744586944580078, "global_step": 461447, "epoch": 5559} {"train_loss": -27.102802276611328, "global_step": 461448, "epoch": 5559} {"train_loss": -27.3393497467041, "global_step": 461449, "epoch": 5559} {"train_loss": -27.371173858642578, "global_step": 461450, "epoch": 5559} {"train_loss": -27.605274200439453, "global_step": 461451, "epoch": 5559} {"train_loss": -27.293960571289062, "global_step": 461452, "epoch": 5559} {"train_loss": -27.10233497619629, "global_step": 461453, "epoch": 5559} {"train_loss": -27.4567928314209, "global_step": 461454, "epoch": 5559} {"train_loss": -27.479583740234375, "global_step": 461455, "epoch": 5559} {"train_loss": -27.202533721923828, "global_step": 461456, "epoch": 5559} {"train_loss": -27.450780868530273, "global_step": 461457, "epoch": 5559} {"train_loss": -27.142072677612305, "global_step": 461458, "epoch": 5559} {"train_loss": -26.73013687133789, "global_step": 461459, "epoch": 5559} {"train_loss": -26.2109432220459, "global_step": 461460, "epoch": 5559} {"train_loss": -24.92745018005371, "global_step": 461461, "epoch": 5559} {"train_loss": -24.821081161499023, "global_step": 461462, "epoch": 5559} {"train_loss": -25.53231430053711, "global_step": 461463, "epoch": 5559} {"train_loss": -26.432729721069336, "global_step": 461464, "epoch": 5559} {"train_loss": -26.2548770904541, "global_step": 461465, "epoch": 5559} {"train_loss": -25.684656143188477, "global_step": 461466, "epoch": 5559} {"train_loss": -26.433988571166992, "global_step": 461467, "epoch": 5559} {"train_loss": -25.783557891845703, "global_step": 461468, "epoch": 5559} {"train_loss": -26.619068145751953, "global_step": 461469, "epoch": 5559} {"train_loss": -26.13718032836914, "global_step": 461470, "epoch": 5559} {"train_loss": -26.284597396850586, "global_step": 461471, "epoch": 5559} {"train_loss": -26.537078857421875, "global_step": 461472, "epoch": 5559} {"train_loss": -26.140701293945312, "global_step": 461473, "epoch": 5559} {"train_loss": -26.448535919189453, "global_step": 461474, "epoch": 5559} {"train_loss": -26.456790924072266, "global_step": 461475, "epoch": 5559} {"train_loss": -26.561908721923828, "global_step": 461476, "epoch": 5559} {"train_loss": -26.6319637298584, "global_step": 461477, "epoch": 5559} {"train_loss": -26.446887969970703, "global_step": 461478, "epoch": 5559} {"train_loss": -26.79269287385136, "global_step": 461479, "epoch": 5559, "val_loss": 6534194.5} {"train_loss": -26.280242919921875, "global_step": 461480, "epoch": 5560} {"train_loss": -26.481922149658203, "global_step": 461481, "epoch": 5560} {"train_loss": -26.347665786743164, "global_step": 461482, "epoch": 5560} {"train_loss": -26.7005615234375, "global_step": 461483, "epoch": 5560} {"train_loss": -26.37822914123535, "global_step": 461484, "epoch": 5560} {"train_loss": -26.419904708862305, "global_step": 461485, "epoch": 5560} {"train_loss": -26.487661361694336, "global_step": 461486, "epoch": 5560} {"train_loss": -26.823551177978516, "global_step": 461487, "epoch": 5560} {"train_loss": -26.459537506103516, "global_step": 461488, "epoch": 5560} {"train_loss": -26.786657333374023, "global_step": 461489, "epoch": 5560} {"train_loss": -26.81858253479004, "global_step": 461490, "epoch": 5560} {"train_loss": -26.82659912109375, "global_step": 461491, "epoch": 5560} {"train_loss": -26.4948673248291, "global_step": 461492, "epoch": 5560} {"train_loss": -26.610794067382812, "global_step": 461493, "epoch": 5560} {"train_loss": -26.851999282836914, "global_step": 461494, "epoch": 5560} {"train_loss": -26.667211532592773, "global_step": 461495, "epoch": 5560} {"train_loss": -27.06001091003418, "global_step": 461496, "epoch": 5560} {"train_loss": -26.648834228515625, "global_step": 461497, "epoch": 5560} {"train_loss": -26.992919921875, "global_step": 461498, "epoch": 5560} {"train_loss": -26.992856979370117, "global_step": 461499, "epoch": 5560} {"train_loss": -27.023107528686523, "global_step": 461500, "epoch": 5560} {"train_loss": -26.880155563354492, "global_step": 461501, "epoch": 5560} {"train_loss": -27.426172256469727, "global_step": 461502, "epoch": 5560} {"train_loss": -27.438968658447266, "global_step": 461503, "epoch": 5560} {"train_loss": -27.163013458251953, "global_step": 461504, "epoch": 5560} {"train_loss": -27.049457550048828, "global_step": 461505, "epoch": 5560} {"train_loss": -26.929733276367188, "global_step": 461506, "epoch": 5560} {"train_loss": -26.867597579956055, "global_step": 461507, "epoch": 5560} {"train_loss": -27.183324813842773, "global_step": 461508, "epoch": 5560} {"train_loss": -26.805150985717773, "global_step": 461509, "epoch": 5560} {"train_loss": -27.013959884643555, "global_step": 461510, "epoch": 5560} {"train_loss": -27.338354110717773, "global_step": 461511, "epoch": 5560} {"train_loss": -27.193256378173828, "global_step": 461512, "epoch": 5560} {"train_loss": -27.063770294189453, "global_step": 461513, "epoch": 5560} {"train_loss": -27.284442901611328, "global_step": 461514, "epoch": 5560} {"train_loss": -27.548465728759766, "global_step": 461515, "epoch": 5560} {"train_loss": -27.131628036499023, "global_step": 461516, "epoch": 5560} {"train_loss": -27.038999557495117, "global_step": 461517, "epoch": 5560} {"train_loss": -27.218921661376953, "global_step": 461518, "epoch": 5560} {"train_loss": -27.03763198852539, "global_step": 461519, "epoch": 5560} {"train_loss": -26.788557052612305, "global_step": 461520, "epoch": 5560} {"train_loss": -27.0752010345459, "global_step": 461521, "epoch": 5560} {"train_loss": -26.863943099975586, "global_step": 461522, "epoch": 5560} {"train_loss": -26.961471557617188, "global_step": 461523, "epoch": 5560} {"train_loss": -27.204633712768555, "global_step": 461524, "epoch": 5560} {"train_loss": -27.31422233581543, "global_step": 461525, "epoch": 5560} {"train_loss": -27.165542602539062, "global_step": 461526, "epoch": 5560} {"train_loss": -27.253833770751953, "global_step": 461527, "epoch": 5560} {"train_loss": -27.05873680114746, "global_step": 461528, "epoch": 5560} {"train_loss": -26.702468872070312, "global_step": 461529, "epoch": 5560} {"train_loss": -26.9971981048584, "global_step": 461530, "epoch": 5560} {"train_loss": -27.422760009765625, "global_step": 461531, "epoch": 5560} {"train_loss": -27.194049835205078, "global_step": 461532, "epoch": 5560} {"train_loss": -26.820356369018555, "global_step": 461533, "epoch": 5560} {"train_loss": -27.216028213500977, "global_step": 461534, "epoch": 5560} {"train_loss": -27.271215438842773, "global_step": 461535, "epoch": 5560} {"train_loss": -26.682580947875977, "global_step": 461536, "epoch": 5560} {"train_loss": -26.955093383789062, "global_step": 461537, "epoch": 5560} {"train_loss": -27.040176391601562, "global_step": 461538, "epoch": 5560} {"train_loss": -27.340728759765625, "global_step": 461539, "epoch": 5560} {"train_loss": -26.938268661499023, "global_step": 461540, "epoch": 5560} {"train_loss": -27.2144832611084, "global_step": 461541, "epoch": 5560} {"train_loss": -27.065582275390625, "global_step": 461542, "epoch": 5560} {"train_loss": -27.103078842163086, "global_step": 461543, "epoch": 5560} {"train_loss": -27.181385040283203, "global_step": 461544, "epoch": 5560} {"train_loss": -27.18387794494629, "global_step": 461545, "epoch": 5560} {"train_loss": -26.67388916015625, "global_step": 461546, "epoch": 5560} {"train_loss": -27.388036727905273, "global_step": 461547, "epoch": 5560} {"train_loss": -26.92779541015625, "global_step": 461548, "epoch": 5560} {"train_loss": -27.085285186767578, "global_step": 461549, "epoch": 5560} {"train_loss": -27.765045166015625, "global_step": 461550, "epoch": 5560} {"train_loss": -27.2347354888916, "global_step": 461551, "epoch": 5560} {"train_loss": -26.989486694335938, "global_step": 461552, "epoch": 5560} {"train_loss": -27.133808135986328, "global_step": 461553, "epoch": 5560} {"train_loss": -27.181949615478516, "global_step": 461554, "epoch": 5560} {"train_loss": -27.117441177368164, "global_step": 461555, "epoch": 5560} {"train_loss": -27.156253814697266, "global_step": 461556, "epoch": 5560} {"train_loss": -26.99026870727539, "global_step": 461557, "epoch": 5560} {"train_loss": -27.010425567626953, "global_step": 461558, "epoch": 5560} {"train_loss": -27.3416805267334, "global_step": 461559, "epoch": 5560} {"train_loss": -27.15376853942871, "global_step": 461560, "epoch": 5560} {"train_loss": -26.830982208251953, "global_step": 461561, "epoch": 5560} {"train_loss": -27.002373247261506, "global_step": 461562, "epoch": 5560, "val_loss": 6537658.0} {"train_loss": -25.427371978759766, "global_step": 461563, "epoch": 5561} {"train_loss": -25.5517520904541, "global_step": 461564, "epoch": 5561} {"train_loss": -25.8173828125, "global_step": 461565, "epoch": 5561} {"train_loss": -25.910770416259766, "global_step": 461566, "epoch": 5561} {"train_loss": -25.713476181030273, "global_step": 461567, "epoch": 5561} {"train_loss": -25.93012809753418, "global_step": 461568, "epoch": 5561} {"train_loss": -26.2944393157959, "global_step": 461569, "epoch": 5561} {"train_loss": -26.19715690612793, "global_step": 461570, "epoch": 5561} {"train_loss": -26.503223419189453, "global_step": 461571, "epoch": 5561} {"train_loss": -26.3599796295166, "global_step": 461572, "epoch": 5561} {"train_loss": -26.22942543029785, "global_step": 461573, "epoch": 5561} {"train_loss": -26.56427001953125, "global_step": 461574, "epoch": 5561} {"train_loss": -26.709630966186523, "global_step": 461575, "epoch": 5561} {"train_loss": -26.782880783081055, "global_step": 461576, "epoch": 5561} {"train_loss": -26.513202667236328, "global_step": 461577, "epoch": 5561} {"train_loss": -27.012237548828125, "global_step": 461578, "epoch": 5561} {"train_loss": -26.45985221862793, "global_step": 461579, "epoch": 5561} {"train_loss": -26.626373291015625, "global_step": 461580, "epoch": 5561} {"train_loss": -26.71671485900879, "global_step": 461581, "epoch": 5561} {"train_loss": -26.815343856811523, "global_step": 461582, "epoch": 5561} {"train_loss": -26.635955810546875, "global_step": 461583, "epoch": 5561} {"train_loss": -26.594898223876953, "global_step": 461584, "epoch": 5561} {"train_loss": -26.883041381835938, "global_step": 461585, "epoch": 5561} {"train_loss": -26.723169326782227, "global_step": 461586, "epoch": 5561} {"train_loss": -26.76835060119629, "global_step": 461587, "epoch": 5561} {"train_loss": -27.0495548248291, "global_step": 461588, "epoch": 5561} {"train_loss": -26.82590675354004, "global_step": 461589, "epoch": 5561} {"train_loss": -26.701757431030273, "global_step": 461590, "epoch": 5561} {"train_loss": -26.798816680908203, "global_step": 461591, "epoch": 5561} {"train_loss": -27.29573631286621, "global_step": 461592, "epoch": 5561} {"train_loss": -27.22315788269043, "global_step": 461593, "epoch": 5561} {"train_loss": -27.06073570251465, "global_step": 461594, "epoch": 5561} {"train_loss": -26.988555908203125, "global_step": 461595, "epoch": 5561} {"train_loss": -26.986968994140625, "global_step": 461596, "epoch": 5561} {"train_loss": -27.1312198638916, "global_step": 461597, "epoch": 5561} {"train_loss": -27.038803100585938, "global_step": 461598, "epoch": 5561} {"train_loss": -27.299591064453125, "global_step": 461599, "epoch": 5561} {"train_loss": -27.13271141052246, "global_step": 461600, "epoch": 5561} {"train_loss": -27.332666397094727, "global_step": 461601, "epoch": 5561} {"train_loss": -27.002960205078125, "global_step": 461602, "epoch": 5561} {"train_loss": -27.241918563842773, "global_step": 461603, "epoch": 5561} {"train_loss": -26.97238540649414, "global_step": 461604, "epoch": 5561} {"train_loss": -27.157012939453125, "global_step": 461605, "epoch": 5561} {"train_loss": -27.091938018798828, "global_step": 461606, "epoch": 5561} {"train_loss": -27.47357177734375, "global_step": 461607, "epoch": 5561} {"train_loss": -27.561920166015625, "global_step": 461608, "epoch": 5561} {"train_loss": -27.033355712890625, "global_step": 461609, "epoch": 5561} {"train_loss": -27.353317260742188, "global_step": 461610, "epoch": 5561} {"train_loss": -27.198291778564453, "global_step": 461611, "epoch": 5561} {"train_loss": -27.252151489257812, "global_step": 461612, "epoch": 5561} {"train_loss": -27.32809829711914, "global_step": 461613, "epoch": 5561} {"train_loss": -27.3116455078125, "global_step": 461614, "epoch": 5561} {"train_loss": -27.35383415222168, "global_step": 461615, "epoch": 5561} {"train_loss": -27.369626998901367, "global_step": 461616, "epoch": 5561} {"train_loss": -27.321929931640625, "global_step": 461617, "epoch": 5561} {"train_loss": -27.492618560791016, "global_step": 461618, "epoch": 5561} {"train_loss": -27.188440322875977, "global_step": 461619, "epoch": 5561} {"train_loss": -27.200525283813477, "global_step": 461620, "epoch": 5561} {"train_loss": -27.289804458618164, "global_step": 461621, "epoch": 5561} {"train_loss": -27.039264678955078, "global_step": 461622, "epoch": 5561} {"train_loss": -27.101703643798828, "global_step": 461623, "epoch": 5561} {"train_loss": -27.47161865234375, "global_step": 461624, "epoch": 5561} {"train_loss": -27.407949447631836, "global_step": 461625, "epoch": 5561} {"train_loss": -27.076236724853516, "global_step": 461626, "epoch": 5561} {"train_loss": -27.342248916625977, "global_step": 461627, "epoch": 5561} {"train_loss": -27.52303123474121, "global_step": 461628, "epoch": 5561} {"train_loss": -27.351825714111328, "global_step": 461629, "epoch": 5561} {"train_loss": -27.219818115234375, "global_step": 461630, "epoch": 5561} {"train_loss": -27.329614639282227, "global_step": 461631, "epoch": 5561} {"train_loss": -26.9363956451416, "global_step": 461632, "epoch": 5561} {"train_loss": -26.572265625, "global_step": 461633, "epoch": 5561} {"train_loss": -27.165115356445312, "global_step": 461634, "epoch": 5561} {"train_loss": -27.217609405517578, "global_step": 461635, "epoch": 5561} {"train_loss": -27.122838973999023, "global_step": 461636, "epoch": 5561} {"train_loss": -26.95929527282715, "global_step": 461637, "epoch": 5561} {"train_loss": -27.138900756835938, "global_step": 461638, "epoch": 5561} {"train_loss": -27.539030075073242, "global_step": 461639, "epoch": 5561} {"train_loss": -27.31739616394043, "global_step": 461640, "epoch": 5561} {"train_loss": -26.95304298400879, "global_step": 461641, "epoch": 5561} {"train_loss": -27.260120391845703, "global_step": 461642, "epoch": 5561} {"train_loss": -27.310083389282227, "global_step": 461643, "epoch": 5561} {"train_loss": -26.914899826049805, "global_step": 461644, "epoch": 5561} {"train_loss": -26.938499726444842, "global_step": 461645, "epoch": 5561, "val_loss": 6547691.0} {"train_loss": -26.41395378112793, "global_step": 461646, "epoch": 5562} {"train_loss": -26.155475616455078, "global_step": 461647, "epoch": 5562} {"train_loss": -26.283924102783203, "global_step": 461648, "epoch": 5562} {"train_loss": -26.861658096313477, "global_step": 461649, "epoch": 5562} {"train_loss": -26.902830123901367, "global_step": 461650, "epoch": 5562} {"train_loss": -26.63288688659668, "global_step": 461651, "epoch": 5562} {"train_loss": -26.91204261779785, "global_step": 461652, "epoch": 5562} {"train_loss": -26.65618324279785, "global_step": 461653, "epoch": 5562} {"train_loss": -26.176965713500977, "global_step": 461654, "epoch": 5562} {"train_loss": -26.213537216186523, "global_step": 461655, "epoch": 5562} {"train_loss": -27.087345123291016, "global_step": 461656, "epoch": 5562} {"train_loss": -27.0941104888916, "global_step": 461657, "epoch": 5562} {"train_loss": -26.608427047729492, "global_step": 461658, "epoch": 5562} {"train_loss": -27.2069034576416, "global_step": 461659, "epoch": 5562} {"train_loss": -26.748300552368164, "global_step": 461660, "epoch": 5562} {"train_loss": -26.88718032836914, "global_step": 461661, "epoch": 5562} {"train_loss": -26.980661392211914, "global_step": 461662, "epoch": 5562} {"train_loss": -26.734390258789062, "global_step": 461663, "epoch": 5562} {"train_loss": -27.260351181030273, "global_step": 461664, "epoch": 5562} {"train_loss": -26.952377319335938, "global_step": 461665, "epoch": 5562} {"train_loss": -27.02044677734375, "global_step": 461666, "epoch": 5562} {"train_loss": -26.972827911376953, "global_step": 461667, "epoch": 5562} {"train_loss": -26.845870971679688, "global_step": 461668, "epoch": 5562} {"train_loss": -26.955936431884766, "global_step": 461669, "epoch": 5562} {"train_loss": -27.162683486938477, "global_step": 461670, "epoch": 5562} {"train_loss": -26.857397079467773, "global_step": 461671, "epoch": 5562} {"train_loss": -27.313947677612305, "global_step": 461672, "epoch": 5562} {"train_loss": -26.9657039642334, "global_step": 461673, "epoch": 5562} {"train_loss": -27.278959274291992, "global_step": 461674, "epoch": 5562} {"train_loss": -26.801315307617188, "global_step": 461675, "epoch": 5562} {"train_loss": -27.018213272094727, "global_step": 461676, "epoch": 5562} {"train_loss": -27.214981079101562, "global_step": 461677, "epoch": 5562} {"train_loss": -27.46241569519043, "global_step": 461678, "epoch": 5562} {"train_loss": -27.338037490844727, "global_step": 461679, "epoch": 5562} {"train_loss": -27.082595825195312, "global_step": 461680, "epoch": 5562} {"train_loss": -27.183881759643555, "global_step": 461681, "epoch": 5562} {"train_loss": -27.60413932800293, "global_step": 461682, "epoch": 5562} {"train_loss": -27.419021606445312, "global_step": 461683, "epoch": 5562} {"train_loss": -27.102060317993164, "global_step": 461684, "epoch": 5562} {"train_loss": -27.40418815612793, "global_step": 461685, "epoch": 5562} {"train_loss": -27.503711700439453, "global_step": 461686, "epoch": 5562} {"train_loss": -27.274932861328125, "global_step": 461687, "epoch": 5562} {"train_loss": -26.970746994018555, "global_step": 461688, "epoch": 5562} {"train_loss": -27.694000244140625, "global_step": 461689, "epoch": 5562} {"train_loss": -27.341693878173828, "global_step": 461690, "epoch": 5562} {"train_loss": -27.56085205078125, "global_step": 461691, "epoch": 5562} {"train_loss": -27.155536651611328, "global_step": 461692, "epoch": 5562} {"train_loss": -27.694416046142578, "global_step": 461693, "epoch": 5562} {"train_loss": -27.14252281188965, "global_step": 461694, "epoch": 5562} {"train_loss": -27.394489288330078, "global_step": 461695, "epoch": 5562} {"train_loss": -27.6268310546875, "global_step": 461696, "epoch": 5562} {"train_loss": -27.523818969726562, "global_step": 461697, "epoch": 5562} {"train_loss": -27.57112693786621, "global_step": 461698, "epoch": 5562} {"train_loss": -26.981342315673828, "global_step": 461699, "epoch": 5562} {"train_loss": -27.550146102905273, "global_step": 461700, "epoch": 5562} {"train_loss": -27.007049560546875, "global_step": 461701, "epoch": 5562} {"train_loss": -26.875574111938477, "global_step": 461702, "epoch": 5562} {"train_loss": -26.818634033203125, "global_step": 461703, "epoch": 5562} {"train_loss": -26.861907958984375, "global_step": 461704, "epoch": 5562} {"train_loss": -26.660314559936523, "global_step": 461705, "epoch": 5562} {"train_loss": -27.142126083374023, "global_step": 461706, "epoch": 5562} {"train_loss": -27.311817169189453, "global_step": 461707, "epoch": 5562} {"train_loss": -27.34309196472168, "global_step": 461708, "epoch": 5562} {"train_loss": -26.813404083251953, "global_step": 461709, "epoch": 5562} {"train_loss": -27.073556900024414, "global_step": 461710, "epoch": 5562} {"train_loss": -27.111928939819336, "global_step": 461711, "epoch": 5562} {"train_loss": -26.65193748474121, "global_step": 461712, "epoch": 5562} {"train_loss": -26.962982177734375, "global_step": 461713, "epoch": 5562} {"train_loss": -26.80454444885254, "global_step": 461714, "epoch": 5562} {"train_loss": -27.0672664642334, "global_step": 461715, "epoch": 5562} {"train_loss": -26.990209579467773, "global_step": 461716, "epoch": 5562} {"train_loss": -26.925779342651367, "global_step": 461717, "epoch": 5562} {"train_loss": -27.15711784362793, "global_step": 461718, "epoch": 5562} {"train_loss": -26.95123291015625, "global_step": 461719, "epoch": 5562} {"train_loss": -26.669416427612305, "global_step": 461720, "epoch": 5562} {"train_loss": -27.116348266601562, "global_step": 461721, "epoch": 5562} {"train_loss": -27.081968307495117, "global_step": 461722, "epoch": 5562} {"train_loss": -26.984155654907227, "global_step": 461723, "epoch": 5562} {"train_loss": -26.567602157592773, "global_step": 461724, "epoch": 5562} {"train_loss": -27.460819244384766, "global_step": 461725, "epoch": 5562} {"train_loss": -27.01348876953125, "global_step": 461726, "epoch": 5562} {"train_loss": -27.346166610717773, "global_step": 461727, "epoch": 5562} {"train_loss": -27.04863143828978, "global_step": 461728, "epoch": 5562, "val_loss": 6551119.0} {"train_loss": -26.108245849609375, "global_step": 461729, "epoch": 5563} {"train_loss": -26.111108779907227, "global_step": 461730, "epoch": 5563} {"train_loss": -26.690448760986328, "global_step": 461731, "epoch": 5563} {"train_loss": -26.24976921081543, "global_step": 461732, "epoch": 5563} {"train_loss": -26.758514404296875, "global_step": 461733, "epoch": 5563} {"train_loss": -25.92608070373535, "global_step": 461734, "epoch": 5563} {"train_loss": -25.8856143951416, "global_step": 461735, "epoch": 5563} {"train_loss": -26.472558975219727, "global_step": 461736, "epoch": 5563} {"train_loss": -26.26605796813965, "global_step": 461737, "epoch": 5563} {"train_loss": -26.751707077026367, "global_step": 461738, "epoch": 5563} {"train_loss": -26.3111572265625, "global_step": 461739, "epoch": 5563} {"train_loss": -26.47403907775879, "global_step": 461740, "epoch": 5563} {"train_loss": -26.974964141845703, "global_step": 461741, "epoch": 5563} {"train_loss": -26.238168716430664, "global_step": 461742, "epoch": 5563} {"train_loss": -26.71219253540039, "global_step": 461743, "epoch": 5563} {"train_loss": -26.18890380859375, "global_step": 461744, "epoch": 5563} {"train_loss": -26.6037540435791, "global_step": 461745, "epoch": 5563} {"train_loss": -26.440805435180664, "global_step": 461746, "epoch": 5563} {"train_loss": -26.51572036743164, "global_step": 461747, "epoch": 5563} {"train_loss": -26.78998374938965, "global_step": 461748, "epoch": 5563} {"train_loss": -26.6431827545166, "global_step": 461749, "epoch": 5563} {"train_loss": -27.018878936767578, "global_step": 461750, "epoch": 5563} {"train_loss": -26.924909591674805, "global_step": 461751, "epoch": 5563} {"train_loss": -26.663156509399414, "global_step": 461752, "epoch": 5563} {"train_loss": -26.90350341796875, "global_step": 461753, "epoch": 5563} {"train_loss": -26.876300811767578, "global_step": 461754, "epoch": 5563} {"train_loss": -27.23560905456543, "global_step": 461755, "epoch": 5563} {"train_loss": -26.805011749267578, "global_step": 461756, "epoch": 5563} {"train_loss": -27.147022247314453, "global_step": 461757, "epoch": 5563} {"train_loss": -26.631855010986328, "global_step": 461758, "epoch": 5563} {"train_loss": -26.755496978759766, "global_step": 461759, "epoch": 5563} {"train_loss": -26.98883628845215, "global_step": 461760, "epoch": 5563} {"train_loss": -26.9920654296875, "global_step": 461761, "epoch": 5563} {"train_loss": -27.553693771362305, "global_step": 461762, "epoch": 5563} {"train_loss": -27.443103790283203, "global_step": 461763, "epoch": 5563} {"train_loss": -26.938501358032227, "global_step": 461764, "epoch": 5563} {"train_loss": -26.998870849609375, "global_step": 461765, "epoch": 5563} {"train_loss": -27.111093521118164, "global_step": 461766, "epoch": 5563} {"train_loss": -27.119369506835938, "global_step": 461767, "epoch": 5563} {"train_loss": -27.085453033447266, "global_step": 461768, "epoch": 5563} {"train_loss": -27.292287826538086, "global_step": 461769, "epoch": 5563} {"train_loss": -27.19951820373535, "global_step": 461770, "epoch": 5563} {"train_loss": -27.046152114868164, "global_step": 461771, "epoch": 5563} {"train_loss": -27.118915557861328, "global_step": 461772, "epoch": 5563} {"train_loss": -27.132349014282227, "global_step": 461773, "epoch": 5563} {"train_loss": -27.19426918029785, "global_step": 461774, "epoch": 5563} {"train_loss": -27.551685333251953, "global_step": 461775, "epoch": 5563} {"train_loss": -27.5936222076416, "global_step": 461776, "epoch": 5563} {"train_loss": -27.27058219909668, "global_step": 461777, "epoch": 5563} {"train_loss": -27.334760665893555, "global_step": 461778, "epoch": 5563} {"train_loss": -27.510778427124023, "global_step": 461779, "epoch": 5563} {"train_loss": -27.2645263671875, "global_step": 461780, "epoch": 5563} {"train_loss": -27.40482521057129, "global_step": 461781, "epoch": 5563} {"train_loss": -27.239990234375, "global_step": 461782, "epoch": 5563} {"train_loss": -26.98543357849121, "global_step": 461783, "epoch": 5563} {"train_loss": -26.81330680847168, "global_step": 461784, "epoch": 5563} {"train_loss": -26.5655517578125, "global_step": 461785, "epoch": 5563} {"train_loss": -26.767969131469727, "global_step": 461786, "epoch": 5563} {"train_loss": -26.51385498046875, "global_step": 461787, "epoch": 5563} {"train_loss": -26.843082427978516, "global_step": 461788, "epoch": 5563} {"train_loss": -27.03849220275879, "global_step": 461789, "epoch": 5563} {"train_loss": -26.29107666015625, "global_step": 461790, "epoch": 5563} {"train_loss": -26.889556884765625, "global_step": 461791, "epoch": 5563} {"train_loss": -27.155414581298828, "global_step": 461792, "epoch": 5563} {"train_loss": -26.56121253967285, "global_step": 461793, "epoch": 5563} {"train_loss": -26.9600772857666, "global_step": 461794, "epoch": 5563} {"train_loss": -27.147693634033203, "global_step": 461795, "epoch": 5563} {"train_loss": -26.84522819519043, "global_step": 461796, "epoch": 5563} {"train_loss": -26.898910522460938, "global_step": 461797, "epoch": 5563} {"train_loss": -27.032827377319336, "global_step": 461798, "epoch": 5563} {"train_loss": -27.12113380432129, "global_step": 461799, "epoch": 5563} {"train_loss": -26.8632755279541, "global_step": 461800, "epoch": 5563} {"train_loss": -26.89546775817871, "global_step": 461801, "epoch": 5563} {"train_loss": -27.218505859375, "global_step": 461802, "epoch": 5563} {"train_loss": -27.171051025390625, "global_step": 461803, "epoch": 5563} {"train_loss": -27.263071060180664, "global_step": 461804, "epoch": 5563} {"train_loss": -27.00240135192871, "global_step": 461805, "epoch": 5563} {"train_loss": -27.262500762939453, "global_step": 461806, "epoch": 5563} {"train_loss": -27.112943649291992, "global_step": 461807, "epoch": 5563} {"train_loss": -26.7408390045166, "global_step": 461808, "epoch": 5563} {"train_loss": -27.15250015258789, "global_step": 461809, "epoch": 5563} {"train_loss": -26.765460968017578, "global_step": 461810, "epoch": 5563} {"train_loss": -26.86035294130624, "global_step": 461811, "epoch": 5563, "val_loss": 6606884.0} {"train_loss": -26.75345802307129, "global_step": 461812, "epoch": 5564} {"train_loss": -26.6796817779541, "global_step": 461813, "epoch": 5564} {"train_loss": -26.84315299987793, "global_step": 461814, "epoch": 5564} {"train_loss": -26.415369033813477, "global_step": 461815, "epoch": 5564} {"train_loss": -26.98231315612793, "global_step": 461816, "epoch": 5564} {"train_loss": -26.54644775390625, "global_step": 461817, "epoch": 5564} {"train_loss": -27.058353424072266, "global_step": 461818, "epoch": 5564} {"train_loss": -26.957685470581055, "global_step": 461819, "epoch": 5564} {"train_loss": -27.003662109375, "global_step": 461820, "epoch": 5564} {"train_loss": -27.170984268188477, "global_step": 461821, "epoch": 5564} {"train_loss": -27.27311134338379, "global_step": 461822, "epoch": 5564} {"train_loss": -27.389188766479492, "global_step": 461823, "epoch": 5564} {"train_loss": -27.072660446166992, "global_step": 461824, "epoch": 5564} {"train_loss": -26.954269409179688, "global_step": 461825, "epoch": 5564} {"train_loss": -26.992919921875, "global_step": 461826, "epoch": 5564} {"train_loss": -27.066564559936523, "global_step": 461827, "epoch": 5564} {"train_loss": -26.89277458190918, "global_step": 461828, "epoch": 5564} {"train_loss": -26.843313217163086, "global_step": 461829, "epoch": 5564} {"train_loss": -27.156198501586914, "global_step": 461830, "epoch": 5564} {"train_loss": -27.33524513244629, "global_step": 461831, "epoch": 5564} {"train_loss": -26.976865768432617, "global_step": 461832, "epoch": 5564} {"train_loss": -27.1837158203125, "global_step": 461833, "epoch": 5564} {"train_loss": -26.933256149291992, "global_step": 461834, "epoch": 5564} {"train_loss": -27.095346450805664, "global_step": 461835, "epoch": 5564} {"train_loss": -27.18061637878418, "global_step": 461836, "epoch": 5564} {"train_loss": -27.200958251953125, "global_step": 461837, "epoch": 5564} {"train_loss": -26.99567222595215, "global_step": 461838, "epoch": 5564} {"train_loss": -26.979202270507812, "global_step": 461839, "epoch": 5564} {"train_loss": -26.8148250579834, "global_step": 461840, "epoch": 5564} {"train_loss": -27.214603424072266, "global_step": 461841, "epoch": 5564} {"train_loss": -27.361303329467773, "global_step": 461842, "epoch": 5564} {"train_loss": -27.02545166015625, "global_step": 461843, "epoch": 5564} {"train_loss": -27.02570915222168, "global_step": 461844, "epoch": 5564} {"train_loss": -27.169296264648438, "global_step": 461845, "epoch": 5564} {"train_loss": -27.18842124938965, "global_step": 461846, "epoch": 5564} {"train_loss": -27.29542350769043, "global_step": 461847, "epoch": 5564} {"train_loss": -27.446008682250977, "global_step": 461848, "epoch": 5564} {"train_loss": -27.086902618408203, "global_step": 461849, "epoch": 5564} {"train_loss": -27.221784591674805, "global_step": 461850, "epoch": 5564} {"train_loss": -26.945281982421875, "global_step": 461851, "epoch": 5564} {"train_loss": -27.25530433654785, "global_step": 461852, "epoch": 5564} {"train_loss": -27.273284912109375, "global_step": 461853, "epoch": 5564} {"train_loss": -27.316486358642578, "global_step": 461854, "epoch": 5564} {"train_loss": -27.03986930847168, "global_step": 461855, "epoch": 5564} {"train_loss": -27.07305908203125, "global_step": 461856, "epoch": 5564} {"train_loss": -27.19305992126465, "global_step": 461857, "epoch": 5564} {"train_loss": -26.990741729736328, "global_step": 461858, "epoch": 5564} {"train_loss": -27.319578170776367, "global_step": 461859, "epoch": 5564} {"train_loss": -27.109907150268555, "global_step": 461860, "epoch": 5564} {"train_loss": -27.15213966369629, "global_step": 461861, "epoch": 5564} {"train_loss": -27.321210861206055, "global_step": 461862, "epoch": 5564} {"train_loss": -27.2727108001709, "global_step": 461863, "epoch": 5564} {"train_loss": -27.166898727416992, "global_step": 461864, "epoch": 5564} {"train_loss": -27.226545333862305, "global_step": 461865, "epoch": 5564} {"train_loss": -26.99615478515625, "global_step": 461866, "epoch": 5564} {"train_loss": -27.357873916625977, "global_step": 461867, "epoch": 5564} {"train_loss": -27.039005279541016, "global_step": 461868, "epoch": 5564} {"train_loss": -27.491464614868164, "global_step": 461869, "epoch": 5564} {"train_loss": -27.512039184570312, "global_step": 461870, "epoch": 5564} {"train_loss": -26.970783233642578, "global_step": 461871, "epoch": 5564} {"train_loss": -27.1825008392334, "global_step": 461872, "epoch": 5564} {"train_loss": -27.015024185180664, "global_step": 461873, "epoch": 5564} {"train_loss": -27.173059463500977, "global_step": 461874, "epoch": 5564} {"train_loss": -27.51222038269043, "global_step": 461875, "epoch": 5564} {"train_loss": -27.4727840423584, "global_step": 461876, "epoch": 5564} {"train_loss": -26.970233917236328, "global_step": 461877, "epoch": 5564} {"train_loss": -27.276264190673828, "global_step": 461878, "epoch": 5564} {"train_loss": -26.7802791595459, "global_step": 461879, "epoch": 5564} {"train_loss": -27.250228881835938, "global_step": 461880, "epoch": 5564} {"train_loss": -27.1202392578125, "global_step": 461881, "epoch": 5564} {"train_loss": -27.115280151367188, "global_step": 461882, "epoch": 5564} {"train_loss": -27.200498580932617, "global_step": 461883, "epoch": 5564} {"train_loss": -26.966482162475586, "global_step": 461884, "epoch": 5564} {"train_loss": -27.24798583984375, "global_step": 461885, "epoch": 5564} {"train_loss": -27.266721725463867, "global_step": 461886, "epoch": 5564} {"train_loss": -26.90101432800293, "global_step": 461887, "epoch": 5564} {"train_loss": -27.181884765625, "global_step": 461888, "epoch": 5564} {"train_loss": -27.005842208862305, "global_step": 461889, "epoch": 5564} {"train_loss": -26.78631591796875, "global_step": 461890, "epoch": 5564} {"train_loss": -27.1057071685791, "global_step": 461891, "epoch": 5564} {"train_loss": -27.369489669799805, "global_step": 461892, "epoch": 5564} {"train_loss": -27.173696517944336, "global_step": 461893, "epoch": 5564} {"train_loss": -27.1232188121382, "global_step": 461894, "epoch": 5564, "val_loss": 6667497.0} {"train_loss": -26.58154296875, "global_step": 461895, "epoch": 5565} {"train_loss": -25.685821533203125, "global_step": 461896, "epoch": 5565} {"train_loss": -26.314359664916992, "global_step": 461897, "epoch": 5565} {"train_loss": -26.6414852142334, "global_step": 461898, "epoch": 5565} {"train_loss": -25.366233825683594, "global_step": 461899, "epoch": 5565} {"train_loss": -25.389862060546875, "global_step": 461900, "epoch": 5565} {"train_loss": -26.62615966796875, "global_step": 461901, "epoch": 5565} {"train_loss": -26.338613510131836, "global_step": 461902, "epoch": 5565} {"train_loss": -26.2711181640625, "global_step": 461903, "epoch": 5565} {"train_loss": -26.060077667236328, "global_step": 461904, "epoch": 5565} {"train_loss": -25.951391220092773, "global_step": 461905, "epoch": 5565} {"train_loss": -26.492353439331055, "global_step": 461906, "epoch": 5565} {"train_loss": -26.476795196533203, "global_step": 461907, "epoch": 5565} {"train_loss": -26.644428253173828, "global_step": 461908, "epoch": 5565} {"train_loss": -26.465152740478516, "global_step": 461909, "epoch": 5565} {"train_loss": -26.7667236328125, "global_step": 461910, "epoch": 5565} {"train_loss": -26.561542510986328, "global_step": 461911, "epoch": 5565} {"train_loss": -26.551166534423828, "global_step": 461912, "epoch": 5565} {"train_loss": -26.915393829345703, "global_step": 461913, "epoch": 5565} {"train_loss": -26.527393341064453, "global_step": 461914, "epoch": 5565} {"train_loss": -26.887165069580078, "global_step": 461915, "epoch": 5565} {"train_loss": -26.627582550048828, "global_step": 461916, "epoch": 5565} {"train_loss": -26.804962158203125, "global_step": 461917, "epoch": 5565} {"train_loss": -26.88111686706543, "global_step": 461918, "epoch": 5565} {"train_loss": -26.823755264282227, "global_step": 461919, "epoch": 5565} {"train_loss": -26.919553756713867, "global_step": 461920, "epoch": 5565} {"train_loss": -26.93281364440918, "global_step": 461921, "epoch": 5565} {"train_loss": -26.7401065826416, "global_step": 461922, "epoch": 5565} {"train_loss": -26.78090476989746, "global_step": 461923, "epoch": 5565} {"train_loss": -26.779083251953125, "global_step": 461924, "epoch": 5565} {"train_loss": -26.77947998046875, "global_step": 461925, "epoch": 5565} {"train_loss": -27.07341957092285, "global_step": 461926, "epoch": 5565} {"train_loss": -26.832656860351562, "global_step": 461927, "epoch": 5565} {"train_loss": -27.024389266967773, "global_step": 461928, "epoch": 5565} {"train_loss": -27.0095157623291, "global_step": 461929, "epoch": 5565} {"train_loss": -27.037384033203125, "global_step": 461930, "epoch": 5565} {"train_loss": -27.28455924987793, "global_step": 461931, "epoch": 5565} {"train_loss": -27.2469425201416, "global_step": 461932, "epoch": 5565} {"train_loss": -26.825651168823242, "global_step": 461933, "epoch": 5565} {"train_loss": -27.26202392578125, "global_step": 461934, "epoch": 5565} {"train_loss": -27.32453727722168, "global_step": 461935, "epoch": 5565} {"train_loss": -27.185834884643555, "global_step": 461936, "epoch": 5565} {"train_loss": -27.110626220703125, "global_step": 461937, "epoch": 5565} {"train_loss": -27.028654098510742, "global_step": 461938, "epoch": 5565} {"train_loss": -27.373937606811523, "global_step": 461939, "epoch": 5565} {"train_loss": -27.218252182006836, "global_step": 461940, "epoch": 5565} {"train_loss": -27.303640365600586, "global_step": 461941, "epoch": 5565} {"train_loss": -27.21693992614746, "global_step": 461942, "epoch": 5565} {"train_loss": -27.251855850219727, "global_step": 461943, "epoch": 5565} {"train_loss": -26.990436553955078, "global_step": 461944, "epoch": 5565} {"train_loss": -27.315093994140625, "global_step": 461945, "epoch": 5565} {"train_loss": -27.225940704345703, "global_step": 461946, "epoch": 5565} {"train_loss": -27.472864151000977, "global_step": 461947, "epoch": 5565} {"train_loss": -26.793506622314453, "global_step": 461948, "epoch": 5565} {"train_loss": -27.135086059570312, "global_step": 461949, "epoch": 5565} {"train_loss": -27.26539421081543, "global_step": 461950, "epoch": 5565} {"train_loss": -27.245895385742188, "global_step": 461951, "epoch": 5565} {"train_loss": -27.120697021484375, "global_step": 461952, "epoch": 5565} {"train_loss": -26.910932540893555, "global_step": 461953, "epoch": 5565} {"train_loss": -27.452224731445312, "global_step": 461954, "epoch": 5565} {"train_loss": -26.995752334594727, "global_step": 461955, "epoch": 5565} {"train_loss": -27.487768173217773, "global_step": 461956, "epoch": 5565} {"train_loss": -27.060302734375, "global_step": 461957, "epoch": 5565} {"train_loss": -27.378437042236328, "global_step": 461958, "epoch": 5565} {"train_loss": -27.020246505737305, "global_step": 461959, "epoch": 5565} {"train_loss": -27.284320831298828, "global_step": 461960, "epoch": 5565} {"train_loss": -27.58265495300293, "global_step": 461961, "epoch": 5565} {"train_loss": -27.046567916870117, "global_step": 461962, "epoch": 5565} {"train_loss": -26.948163986206055, "global_step": 461963, "epoch": 5565} {"train_loss": -26.96121597290039, "global_step": 461964, "epoch": 5565} {"train_loss": -27.357131958007812, "global_step": 461965, "epoch": 5565} {"train_loss": -27.026288986206055, "global_step": 461966, "epoch": 5565} {"train_loss": -27.175024032592773, "global_step": 461967, "epoch": 5565} {"train_loss": -27.308523178100586, "global_step": 461968, "epoch": 5565} {"train_loss": -26.980030059814453, "global_step": 461969, "epoch": 5565} {"train_loss": -27.204694747924805, "global_step": 461970, "epoch": 5565} {"train_loss": -27.4741268157959, "global_step": 461971, "epoch": 5565} {"train_loss": -27.03352165222168, "global_step": 461972, "epoch": 5565} {"train_loss": -26.581457138061523, "global_step": 461973, "epoch": 5565} {"train_loss": -27.58684730529785, "global_step": 461974, "epoch": 5565} {"train_loss": -27.211145401000977, "global_step": 461975, "epoch": 5565} {"train_loss": -26.77069091796875, "global_step": 461976, "epoch": 5565} {"train_loss": -26.88873405916145, "global_step": 461977, "epoch": 5565, "val_loss": 6528610.0} {"train_loss": -25.18670654296875, "global_step": 461978, "epoch": 5566} {"train_loss": -25.665042877197266, "global_step": 461979, "epoch": 5566} {"train_loss": -25.63532829284668, "global_step": 461980, "epoch": 5566} {"train_loss": -25.964008331298828, "global_step": 461981, "epoch": 5566} {"train_loss": -26.678638458251953, "global_step": 461982, "epoch": 5566} {"train_loss": -25.719532012939453, "global_step": 461983, "epoch": 5566} {"train_loss": -26.407529830932617, "global_step": 461984, "epoch": 5566} {"train_loss": -26.330717086791992, "global_step": 461985, "epoch": 5566} {"train_loss": -26.504709243774414, "global_step": 461986, "epoch": 5566} {"train_loss": -26.710912704467773, "global_step": 461987, "epoch": 5566} {"train_loss": -26.511077880859375, "global_step": 461988, "epoch": 5566} {"train_loss": -26.226409912109375, "global_step": 461989, "epoch": 5566} {"train_loss": -26.144567489624023, "global_step": 461990, "epoch": 5566} {"train_loss": -26.317968368530273, "global_step": 461991, "epoch": 5566} {"train_loss": -26.906909942626953, "global_step": 461992, "epoch": 5566} {"train_loss": -26.510456085205078, "global_step": 461993, "epoch": 5566} {"train_loss": -26.364532470703125, "global_step": 461994, "epoch": 5566} {"train_loss": -26.68433952331543, "global_step": 461995, "epoch": 5566} {"train_loss": -26.865575790405273, "global_step": 461996, "epoch": 5566} {"train_loss": -26.848926544189453, "global_step": 461997, "epoch": 5566} {"train_loss": -26.66692543029785, "global_step": 461998, "epoch": 5566} {"train_loss": -27.129056930541992, "global_step": 461999, "epoch": 5566} {"train_loss": -26.659320831298828, "global_step": 462000, "epoch": 5566} {"train_loss": -26.837417602539062, "global_step": 462001, "epoch": 5566} {"train_loss": -26.801565170288086, "global_step": 462002, "epoch": 5566} {"train_loss": -27.02528190612793, "global_step": 462003, "epoch": 5566} {"train_loss": -26.771406173706055, "global_step": 462004, "epoch": 5566} {"train_loss": -27.131977081298828, "global_step": 462005, "epoch": 5566} {"train_loss": -26.981338500976562, "global_step": 462006, "epoch": 5566} {"train_loss": -26.82716178894043, "global_step": 462007, "epoch": 5566} {"train_loss": -27.093032836914062, "global_step": 462008, "epoch": 5566} {"train_loss": -26.912601470947266, "global_step": 462009, "epoch": 5566} {"train_loss": -27.0472354888916, "global_step": 462010, "epoch": 5566} {"train_loss": -26.77308464050293, "global_step": 462011, "epoch": 5566} {"train_loss": -26.7498722076416, "global_step": 462012, "epoch": 5566} {"train_loss": -27.095983505249023, "global_step": 462013, "epoch": 5566} {"train_loss": -26.68668556213379, "global_step": 462014, "epoch": 5566} {"train_loss": -26.956329345703125, "global_step": 462015, "epoch": 5566} {"train_loss": -26.932703018188477, "global_step": 462016, "epoch": 5566} {"train_loss": -27.51222801208496, "global_step": 462017, "epoch": 5566} {"train_loss": -27.26700782775879, "global_step": 462018, "epoch": 5566} {"train_loss": -26.823083877563477, "global_step": 462019, "epoch": 5566} {"train_loss": -27.04168701171875, "global_step": 462020, "epoch": 5566} {"train_loss": -27.32283592224121, "global_step": 462021, "epoch": 5566} {"train_loss": -27.369043350219727, "global_step": 462022, "epoch": 5566} {"train_loss": -27.16974449157715, "global_step": 462023, "epoch": 5566} {"train_loss": -27.073486328125, "global_step": 462024, "epoch": 5566} {"train_loss": -26.960046768188477, "global_step": 462025, "epoch": 5566} {"train_loss": -26.80810546875, "global_step": 462026, "epoch": 5566} {"train_loss": -27.28742027282715, "global_step": 462027, "epoch": 5566} {"train_loss": -27.04412269592285, "global_step": 462028, "epoch": 5566} {"train_loss": -26.986083984375, "global_step": 462029, "epoch": 5566} {"train_loss": -27.114856719970703, "global_step": 462030, "epoch": 5566} {"train_loss": -27.005460739135742, "global_step": 462031, "epoch": 5566} {"train_loss": -27.09701919555664, "global_step": 462032, "epoch": 5566} {"train_loss": -27.517169952392578, "global_step": 462033, "epoch": 5566} {"train_loss": -27.174406051635742, "global_step": 462034, "epoch": 5566} {"train_loss": -27.180448532104492, "global_step": 462035, "epoch": 5566} {"train_loss": -26.758285522460938, "global_step": 462036, "epoch": 5566} {"train_loss": -27.029712677001953, "global_step": 462037, "epoch": 5566} {"train_loss": -27.56511878967285, "global_step": 462038, "epoch": 5566} {"train_loss": -26.91248893737793, "global_step": 462039, "epoch": 5566} {"train_loss": -27.28958511352539, "global_step": 462040, "epoch": 5566} {"train_loss": -27.30449867248535, "global_step": 462041, "epoch": 5566} {"train_loss": -27.181562423706055, "global_step": 462042, "epoch": 5566} {"train_loss": -26.99297523498535, "global_step": 462043, "epoch": 5566} {"train_loss": -26.9916934967041, "global_step": 462044, "epoch": 5566} {"train_loss": -27.334991455078125, "global_step": 462045, "epoch": 5566} {"train_loss": -26.889211654663086, "global_step": 462046, "epoch": 5566} {"train_loss": -26.86614418029785, "global_step": 462047, "epoch": 5566} {"train_loss": -27.335485458374023, "global_step": 462048, "epoch": 5566} {"train_loss": -27.088409423828125, "global_step": 462049, "epoch": 5566} {"train_loss": -26.9849910736084, "global_step": 462050, "epoch": 5566} {"train_loss": -26.94596290588379, "global_step": 462051, "epoch": 5566} {"train_loss": -26.93928337097168, "global_step": 462052, "epoch": 5566} {"train_loss": -26.914228439331055, "global_step": 462053, "epoch": 5566} {"train_loss": -26.930328369140625, "global_step": 462054, "epoch": 5566} {"train_loss": -26.876184463500977, "global_step": 462055, "epoch": 5566} {"train_loss": -27.04249382019043, "global_step": 462056, "epoch": 5566} {"train_loss": -26.779495239257812, "global_step": 462057, "epoch": 5566} {"train_loss": -26.839902877807617, "global_step": 462058, "epoch": 5566} {"train_loss": -26.779224395751953, "global_step": 462059, "epoch": 5566} {"train_loss": -26.839073893535566, "global_step": 462060, "epoch": 5566, "val_loss": 6529363.0} {"train_loss": -26.98856544494629, "global_step": 462061, "epoch": 5567} {"train_loss": -26.926794052124023, "global_step": 462062, "epoch": 5567} {"train_loss": -27.291152954101562, "global_step": 462063, "epoch": 5567} {"train_loss": -27.268461227416992, "global_step": 462064, "epoch": 5567} {"train_loss": -26.869062423706055, "global_step": 462065, "epoch": 5567} {"train_loss": -27.067035675048828, "global_step": 462066, "epoch": 5567} {"train_loss": -27.118314743041992, "global_step": 462067, "epoch": 5567} {"train_loss": -27.266393661499023, "global_step": 462068, "epoch": 5567} {"train_loss": -27.0382022857666, "global_step": 462069, "epoch": 5567} {"train_loss": -26.64944839477539, "global_step": 462070, "epoch": 5567} {"train_loss": -26.58363151550293, "global_step": 462071, "epoch": 5567} {"train_loss": -27.036630630493164, "global_step": 462072, "epoch": 5567} {"train_loss": -27.019269943237305, "global_step": 462073, "epoch": 5567} {"train_loss": -26.8754825592041, "global_step": 462074, "epoch": 5567} {"train_loss": -26.77070426940918, "global_step": 462075, "epoch": 5567} {"train_loss": -26.36785888671875, "global_step": 462076, "epoch": 5567} {"train_loss": -26.327594757080078, "global_step": 462077, "epoch": 5567} {"train_loss": -26.869171142578125, "global_step": 462078, "epoch": 5567} {"train_loss": -26.79473304748535, "global_step": 462079, "epoch": 5567} {"train_loss": -26.686756134033203, "global_step": 462080, "epoch": 5567} {"train_loss": -26.75608253479004, "global_step": 462081, "epoch": 5567} {"train_loss": -26.43902015686035, "global_step": 462082, "epoch": 5567} {"train_loss": -26.299692153930664, "global_step": 462083, "epoch": 5567} {"train_loss": -26.8271484375, "global_step": 462084, "epoch": 5567} {"train_loss": -26.42474365234375, "global_step": 462085, "epoch": 5567} {"train_loss": -26.879770278930664, "global_step": 462086, "epoch": 5567} {"train_loss": -26.46327018737793, "global_step": 462087, "epoch": 5567} {"train_loss": -26.429584503173828, "global_step": 462088, "epoch": 5567} {"train_loss": -26.76584815979004, "global_step": 462089, "epoch": 5567} {"train_loss": -26.73260498046875, "global_step": 462090, "epoch": 5567} {"train_loss": -26.685840606689453, "global_step": 462091, "epoch": 5567} {"train_loss": -27.250335693359375, "global_step": 462092, "epoch": 5567} {"train_loss": -26.4138240814209, "global_step": 462093, "epoch": 5567} {"train_loss": -26.83820915222168, "global_step": 462094, "epoch": 5567} {"train_loss": -26.84771156311035, "global_step": 462095, "epoch": 5567} {"train_loss": -27.476675033569336, "global_step": 462096, "epoch": 5567} {"train_loss": -27.002655029296875, "global_step": 462097, "epoch": 5567} {"train_loss": -26.624597549438477, "global_step": 462098, "epoch": 5567} {"train_loss": -26.970483779907227, "global_step": 462099, "epoch": 5567} {"train_loss": -27.17807960510254, "global_step": 462100, "epoch": 5567} {"train_loss": -27.148014068603516, "global_step": 462101, "epoch": 5567} {"train_loss": -27.345312118530273, "global_step": 462102, "epoch": 5567} {"train_loss": -26.621530532836914, "global_step": 462103, "epoch": 5567} {"train_loss": -26.83969497680664, "global_step": 462104, "epoch": 5567} {"train_loss": -26.99873161315918, "global_step": 462105, "epoch": 5567} {"train_loss": -27.204452514648438, "global_step": 462106, "epoch": 5567} {"train_loss": -27.1434383392334, "global_step": 462107, "epoch": 5567} {"train_loss": -27.130420684814453, "global_step": 462108, "epoch": 5567} {"train_loss": -27.12359619140625, "global_step": 462109, "epoch": 5567} {"train_loss": -27.4787654876709, "global_step": 462110, "epoch": 5567} {"train_loss": -26.836652755737305, "global_step": 462111, "epoch": 5567} {"train_loss": -27.301542282104492, "global_step": 462112, "epoch": 5567} {"train_loss": -27.169769287109375, "global_step": 462113, "epoch": 5567} {"train_loss": -27.46604347229004, "global_step": 462114, "epoch": 5567} {"train_loss": -27.3038272857666, "global_step": 462115, "epoch": 5567} {"train_loss": -27.268308639526367, "global_step": 462116, "epoch": 5567} {"train_loss": -27.680830001831055, "global_step": 462117, "epoch": 5567} {"train_loss": -27.053693771362305, "global_step": 462118, "epoch": 5567} {"train_loss": -27.413175582885742, "global_step": 462119, "epoch": 5567} {"train_loss": -27.037158966064453, "global_step": 462120, "epoch": 5567} {"train_loss": -27.42673110961914, "global_step": 462121, "epoch": 5567} {"train_loss": -27.03541374206543, "global_step": 462122, "epoch": 5567} {"train_loss": -27.422636032104492, "global_step": 462123, "epoch": 5567} {"train_loss": -27.337629318237305, "global_step": 462124, "epoch": 5567} {"train_loss": -27.142126083374023, "global_step": 462125, "epoch": 5567} {"train_loss": -27.152368545532227, "global_step": 462126, "epoch": 5567} {"train_loss": -27.224782943725586, "global_step": 462127, "epoch": 5567} {"train_loss": -27.3699951171875, "global_step": 462128, "epoch": 5567} {"train_loss": -27.19244384765625, "global_step": 462129, "epoch": 5567} {"train_loss": -27.034093856811523, "global_step": 462130, "epoch": 5567} {"train_loss": -27.41827392578125, "global_step": 462131, "epoch": 5567} {"train_loss": -27.449499130249023, "global_step": 462132, "epoch": 5567} {"train_loss": -27.00398063659668, "global_step": 462133, "epoch": 5567} {"train_loss": -27.041229248046875, "global_step": 462134, "epoch": 5567} {"train_loss": -27.07450294494629, "global_step": 462135, "epoch": 5567} {"train_loss": -26.817060470581055, "global_step": 462136, "epoch": 5567} {"train_loss": -27.102771759033203, "global_step": 462137, "epoch": 5567} {"train_loss": -26.3044490814209, "global_step": 462138, "epoch": 5567} {"train_loss": -26.447635650634766, "global_step": 462139, "epoch": 5567} {"train_loss": -27.5109920501709, "global_step": 462140, "epoch": 5567} {"train_loss": -26.3646297454834, "global_step": 462141, "epoch": 5567} {"train_loss": -26.559247970581055, "global_step": 462142, "epoch": 5567} {"train_loss": -26.98710404821189, "global_step": 462143, "epoch": 5567, "val_loss": 6592689.0} {"train_loss": -26.27418327331543, "global_step": 462144, "epoch": 5568} {"train_loss": -26.72193717956543, "global_step": 462145, "epoch": 5568} {"train_loss": -26.160816192626953, "global_step": 462146, "epoch": 5568} {"train_loss": -26.889719009399414, "global_step": 462147, "epoch": 5568} {"train_loss": -26.57455825805664, "global_step": 462148, "epoch": 5568} {"train_loss": -26.57398796081543, "global_step": 462149, "epoch": 5568} {"train_loss": -26.45509147644043, "global_step": 462150, "epoch": 5568} {"train_loss": -26.89935302734375, "global_step": 462151, "epoch": 5568} {"train_loss": -26.24675941467285, "global_step": 462152, "epoch": 5568} {"train_loss": -26.341520309448242, "global_step": 462153, "epoch": 5568} {"train_loss": -26.388723373413086, "global_step": 462154, "epoch": 5568} {"train_loss": -26.787107467651367, "global_step": 462155, "epoch": 5568} {"train_loss": -26.754932403564453, "global_step": 462156, "epoch": 5568} {"train_loss": -26.5221004486084, "global_step": 462157, "epoch": 5568} {"train_loss": -26.51478385925293, "global_step": 462158, "epoch": 5568} {"train_loss": -27.02713966369629, "global_step": 462159, "epoch": 5568} {"train_loss": -26.68720817565918, "global_step": 462160, "epoch": 5568} {"train_loss": -26.680185317993164, "global_step": 462161, "epoch": 5568} {"train_loss": -26.388416290283203, "global_step": 462162, "epoch": 5568} {"train_loss": -26.85393714904785, "global_step": 462163, "epoch": 5568} {"train_loss": -26.758167266845703, "global_step": 462164, "epoch": 5568} {"train_loss": -27.12564468383789, "global_step": 462165, "epoch": 5568} {"train_loss": -26.74078369140625, "global_step": 462166, "epoch": 5568} {"train_loss": -26.942853927612305, "global_step": 462167, "epoch": 5568} {"train_loss": -26.926239013671875, "global_step": 462168, "epoch": 5568} {"train_loss": -26.90174674987793, "global_step": 462169, "epoch": 5568} {"train_loss": -27.22371482849121, "global_step": 462170, "epoch": 5568} {"train_loss": -27.195837020874023, "global_step": 462171, "epoch": 5568} {"train_loss": -27.187829971313477, "global_step": 462172, "epoch": 5568} {"train_loss": -26.822906494140625, "global_step": 462173, "epoch": 5568} {"train_loss": -27.261280059814453, "global_step": 462174, "epoch": 5568} {"train_loss": -27.21270751953125, "global_step": 462175, "epoch": 5568} {"train_loss": -26.959131240844727, "global_step": 462176, "epoch": 5568} {"train_loss": -27.3199520111084, "global_step": 462177, "epoch": 5568} {"train_loss": -27.264068603515625, "global_step": 462178, "epoch": 5568} {"train_loss": -27.316944122314453, "global_step": 462179, "epoch": 5568} {"train_loss": -27.4539737701416, "global_step": 462180, "epoch": 5568} {"train_loss": -27.123334884643555, "global_step": 462181, "epoch": 5568} {"train_loss": -27.023237228393555, "global_step": 462182, "epoch": 5568} {"train_loss": -27.17081642150879, "global_step": 462183, "epoch": 5568} {"train_loss": -27.082372665405273, "global_step": 462184, "epoch": 5568} {"train_loss": -27.19304847717285, "global_step": 462185, "epoch": 5568} {"train_loss": -26.876941680908203, "global_step": 462186, "epoch": 5568} {"train_loss": -27.47246742248535, "global_step": 462187, "epoch": 5568} {"train_loss": -27.49871253967285, "global_step": 462188, "epoch": 5568} {"train_loss": -27.0693416595459, "global_step": 462189, "epoch": 5568} {"train_loss": -27.262374877929688, "global_step": 462190, "epoch": 5568} {"train_loss": -27.002817153930664, "global_step": 462191, "epoch": 5568} {"train_loss": -27.3897705078125, "global_step": 462192, "epoch": 5568} {"train_loss": -27.343307495117188, "global_step": 462193, "epoch": 5568} {"train_loss": -26.837289810180664, "global_step": 462194, "epoch": 5568} {"train_loss": -27.1015682220459, "global_step": 462195, "epoch": 5568} {"train_loss": -26.723928451538086, "global_step": 462196, "epoch": 5568} {"train_loss": -26.9289608001709, "global_step": 462197, "epoch": 5568} {"train_loss": -27.125293731689453, "global_step": 462198, "epoch": 5568} {"train_loss": -27.025562286376953, "global_step": 462199, "epoch": 5568} {"train_loss": -26.99130630493164, "global_step": 462200, "epoch": 5568} {"train_loss": -27.18918800354004, "global_step": 462201, "epoch": 5568} {"train_loss": -26.702478408813477, "global_step": 462202, "epoch": 5568} {"train_loss": -27.0810489654541, "global_step": 462203, "epoch": 5568} {"train_loss": -27.411457061767578, "global_step": 462204, "epoch": 5568} {"train_loss": -26.582788467407227, "global_step": 462205, "epoch": 5568} {"train_loss": -27.036039352416992, "global_step": 462206, "epoch": 5568} {"train_loss": -26.82929801940918, "global_step": 462207, "epoch": 5568} {"train_loss": -27.192468643188477, "global_step": 462208, "epoch": 5568} {"train_loss": -27.180679321289062, "global_step": 462209, "epoch": 5568} {"train_loss": -27.324575424194336, "global_step": 462210, "epoch": 5568} {"train_loss": -27.291425704956055, "global_step": 462211, "epoch": 5568} {"train_loss": -26.805830001831055, "global_step": 462212, "epoch": 5568} {"train_loss": -27.093372344970703, "global_step": 462213, "epoch": 5568} {"train_loss": -27.43973731994629, "global_step": 462214, "epoch": 5568} {"train_loss": -27.12415885925293, "global_step": 462215, "epoch": 5568} {"train_loss": -27.125967025756836, "global_step": 462216, "epoch": 5568} {"train_loss": -27.123132705688477, "global_step": 462217, "epoch": 5568} {"train_loss": -27.103605270385742, "global_step": 462218, "epoch": 5568} {"train_loss": -27.5057430267334, "global_step": 462219, "epoch": 5568} {"train_loss": -27.392614364624023, "global_step": 462220, "epoch": 5568} {"train_loss": -27.206573486328125, "global_step": 462221, "epoch": 5568} {"train_loss": -27.05437660217285, "global_step": 462222, "epoch": 5568} {"train_loss": -27.53348159790039, "global_step": 462223, "epoch": 5568} {"train_loss": -27.05900001525879, "global_step": 462224, "epoch": 5568} {"train_loss": -27.061420440673828, "global_step": 462225, "epoch": 5568} {"train_loss": -26.996208443699114, "global_step": 462226, "epoch": 5568, "val_loss": 6485818.0} {"train_loss": -25.99151039123535, "global_step": 462227, "epoch": 5569} {"train_loss": -25.360214233398438, "global_step": 462228, "epoch": 5569} {"train_loss": -25.22121238708496, "global_step": 462229, "epoch": 5569} {"train_loss": -26.410526275634766, "global_step": 462230, "epoch": 5569} {"train_loss": -26.197362899780273, "global_step": 462231, "epoch": 5569} {"train_loss": -25.859960556030273, "global_step": 462232, "epoch": 5569} {"train_loss": -26.23687171936035, "global_step": 462233, "epoch": 5569} {"train_loss": -25.998655319213867, "global_step": 462234, "epoch": 5569} {"train_loss": -26.392004013061523, "global_step": 462235, "epoch": 5569} {"train_loss": -26.5577335357666, "global_step": 462236, "epoch": 5569} {"train_loss": -26.493337631225586, "global_step": 462237, "epoch": 5569} {"train_loss": -26.340612411499023, "global_step": 462238, "epoch": 5569} {"train_loss": -26.54237937927246, "global_step": 462239, "epoch": 5569} {"train_loss": -26.350629806518555, "global_step": 462240, "epoch": 5569} {"train_loss": -26.521230697631836, "global_step": 462241, "epoch": 5569} {"train_loss": -26.70914649963379, "global_step": 462242, "epoch": 5569} {"train_loss": -26.51362419128418, "global_step": 462243, "epoch": 5569} {"train_loss": -26.866546630859375, "global_step": 462244, "epoch": 5569} {"train_loss": -26.575727462768555, "global_step": 462245, "epoch": 5569} {"train_loss": -26.715951919555664, "global_step": 462246, "epoch": 5569} {"train_loss": -26.53753662109375, "global_step": 462247, "epoch": 5569} {"train_loss": -26.54559898376465, "global_step": 462248, "epoch": 5569} {"train_loss": -26.880817413330078, "global_step": 462249, "epoch": 5569} {"train_loss": -26.805023193359375, "global_step": 462250, "epoch": 5569} {"train_loss": -26.46546745300293, "global_step": 462251, "epoch": 5569} {"train_loss": -27.065353393554688, "global_step": 462252, "epoch": 5569} {"train_loss": -26.637760162353516, "global_step": 462253, "epoch": 5569} {"train_loss": -26.72650146484375, "global_step": 462254, "epoch": 5569} {"train_loss": -26.75030517578125, "global_step": 462255, "epoch": 5569} {"train_loss": -26.78032875061035, "global_step": 462256, "epoch": 5569} {"train_loss": -26.793354034423828, "global_step": 462257, "epoch": 5569} {"train_loss": -27.410120010375977, "global_step": 462258, "epoch": 5569} {"train_loss": -26.973859786987305, "global_step": 462259, "epoch": 5569} {"train_loss": -26.626020431518555, "global_step": 462260, "epoch": 5569} {"train_loss": -27.339202880859375, "global_step": 462261, "epoch": 5569} {"train_loss": -26.952070236206055, "global_step": 462262, "epoch": 5569} {"train_loss": -27.127450942993164, "global_step": 462263, "epoch": 5569} {"train_loss": -26.90165138244629, "global_step": 462264, "epoch": 5569} {"train_loss": -27.123477935791016, "global_step": 462265, "epoch": 5569} {"train_loss": -27.19112205505371, "global_step": 462266, "epoch": 5569} {"train_loss": -27.197980880737305, "global_step": 462267, "epoch": 5569} {"train_loss": -27.332807540893555, "global_step": 462268, "epoch": 5569} {"train_loss": -26.99773597717285, "global_step": 462269, "epoch": 5569} {"train_loss": -27.295719146728516, "global_step": 462270, "epoch": 5569} {"train_loss": -27.068944931030273, "global_step": 462271, "epoch": 5569} {"train_loss": -27.170318603515625, "global_step": 462272, "epoch": 5569} {"train_loss": -27.34893226623535, "global_step": 462273, "epoch": 5569} {"train_loss": -27.07834243774414, "global_step": 462274, "epoch": 5569} {"train_loss": -27.474878311157227, "global_step": 462275, "epoch": 5569} {"train_loss": -27.22944450378418, "global_step": 462276, "epoch": 5569} {"train_loss": -27.1647891998291, "global_step": 462277, "epoch": 5569} {"train_loss": -27.375289916992188, "global_step": 462278, "epoch": 5569} {"train_loss": -27.24169921875, "global_step": 462279, "epoch": 5569} {"train_loss": -27.52143669128418, "global_step": 462280, "epoch": 5569} {"train_loss": -27.114765167236328, "global_step": 462281, "epoch": 5569} {"train_loss": -26.888996124267578, "global_step": 462282, "epoch": 5569} {"train_loss": -27.129718780517578, "global_step": 462283, "epoch": 5569} {"train_loss": -26.918445587158203, "global_step": 462284, "epoch": 5569} {"train_loss": -27.786863327026367, "global_step": 462285, "epoch": 5569} {"train_loss": -27.132038116455078, "global_step": 462286, "epoch": 5569} {"train_loss": -27.36262321472168, "global_step": 462287, "epoch": 5569} {"train_loss": -27.467029571533203, "global_step": 462288, "epoch": 5569} {"train_loss": -27.172643661499023, "global_step": 462289, "epoch": 5569} {"train_loss": -27.729175567626953, "global_step": 462290, "epoch": 5569} {"train_loss": -27.676462173461914, "global_step": 462291, "epoch": 5569} {"train_loss": -27.180133819580078, "global_step": 462292, "epoch": 5569} {"train_loss": -27.358642578125, "global_step": 462293, "epoch": 5569} {"train_loss": -27.431875228881836, "global_step": 462294, "epoch": 5569} {"train_loss": -27.743371963500977, "global_step": 462295, "epoch": 5569} {"train_loss": -27.34261131286621, "global_step": 462296, "epoch": 5569} {"train_loss": -27.521154403686523, "global_step": 462297, "epoch": 5569} {"train_loss": -27.360071182250977, "global_step": 462298, "epoch": 5569} {"train_loss": -27.22663688659668, "global_step": 462299, "epoch": 5569} {"train_loss": -27.039997100830078, "global_step": 462300, "epoch": 5569} {"train_loss": -27.071247100830078, "global_step": 462301, "epoch": 5569} {"train_loss": -26.97359275817871, "global_step": 462302, "epoch": 5569} {"train_loss": -27.21162986755371, "global_step": 462303, "epoch": 5569} {"train_loss": -26.68219566345215, "global_step": 462304, "epoch": 5569} {"train_loss": -26.900909423828125, "global_step": 462305, "epoch": 5569} {"train_loss": -27.1906795501709, "global_step": 462306, "epoch": 5569} {"train_loss": -26.965662002563477, "global_step": 462307, "epoch": 5569} {"train_loss": -27.22088050842285, "global_step": 462308, "epoch": 5569} {"train_loss": -26.92385344907462, "global_step": 462309, "epoch": 5569, "val_loss": 6577587.0} {"train_loss": -25.817975997924805, "global_step": 462310, "epoch": 5570} {"train_loss": -25.49307632446289, "global_step": 462311, "epoch": 5570} {"train_loss": -26.316797256469727, "global_step": 462312, "epoch": 5570} {"train_loss": -26.182153701782227, "global_step": 462313, "epoch": 5570} {"train_loss": -26.3253231048584, "global_step": 462314, "epoch": 5570} {"train_loss": -25.985021591186523, "global_step": 462315, "epoch": 5570} {"train_loss": -26.357030868530273, "global_step": 462316, "epoch": 5570} {"train_loss": -26.25782585144043, "global_step": 462317, "epoch": 5570} {"train_loss": -26.143503189086914, "global_step": 462318, "epoch": 5570} {"train_loss": -26.28212547302246, "global_step": 462319, "epoch": 5570} {"train_loss": -26.795547485351562, "global_step": 462320, "epoch": 5570} {"train_loss": -26.354690551757812, "global_step": 462321, "epoch": 5570} {"train_loss": -26.147083282470703, "global_step": 462322, "epoch": 5570} {"train_loss": -25.7841796875, "global_step": 462323, "epoch": 5570} {"train_loss": -26.647388458251953, "global_step": 462324, "epoch": 5570} {"train_loss": -26.979772567749023, "global_step": 462325, "epoch": 5570} {"train_loss": -26.506418228149414, "global_step": 462326, "epoch": 5570} {"train_loss": -26.675668716430664, "global_step": 462327, "epoch": 5570} {"train_loss": -26.65519142150879, "global_step": 462328, "epoch": 5570} {"train_loss": -26.706323623657227, "global_step": 462329, "epoch": 5570} {"train_loss": -26.691852569580078, "global_step": 462330, "epoch": 5570} {"train_loss": -26.724609375, "global_step": 462331, "epoch": 5570} {"train_loss": -27.037078857421875, "global_step": 462332, "epoch": 5570} {"train_loss": -27.1720027923584, "global_step": 462333, "epoch": 5570} {"train_loss": -27.139251708984375, "global_step": 462334, "epoch": 5570} {"train_loss": -27.363739013671875, "global_step": 462335, "epoch": 5570} {"train_loss": -27.113208770751953, "global_step": 462336, "epoch": 5570} {"train_loss": -26.533527374267578, "global_step": 462337, "epoch": 5570} {"train_loss": -26.71245765686035, "global_step": 462338, "epoch": 5570} {"train_loss": -26.893529891967773, "global_step": 462339, "epoch": 5570} {"train_loss": -27.2711181640625, "global_step": 462340, "epoch": 5570} {"train_loss": -26.77727699279785, "global_step": 462341, "epoch": 5570} {"train_loss": -27.282278060913086, "global_step": 462342, "epoch": 5570} {"train_loss": -26.829938888549805, "global_step": 462343, "epoch": 5570} {"train_loss": -27.204076766967773, "global_step": 462344, "epoch": 5570} {"train_loss": -27.207239151000977, "global_step": 462345, "epoch": 5570} {"train_loss": -27.370141983032227, "global_step": 462346, "epoch": 5570} {"train_loss": -27.179800033569336, "global_step": 462347, "epoch": 5570} {"train_loss": -27.058958053588867, "global_step": 462348, "epoch": 5570} {"train_loss": -27.328657150268555, "global_step": 462349, "epoch": 5570} {"train_loss": -27.31620216369629, "global_step": 462350, "epoch": 5570} {"train_loss": -27.163623809814453, "global_step": 462351, "epoch": 5570} {"train_loss": -27.422149658203125, "global_step": 462352, "epoch": 5570} {"train_loss": -27.305063247680664, "global_step": 462353, "epoch": 5570} {"train_loss": -27.214391708374023, "global_step": 462354, "epoch": 5570} {"train_loss": -27.25067138671875, "global_step": 462355, "epoch": 5570} {"train_loss": -27.190555572509766, "global_step": 462356, "epoch": 5570} {"train_loss": -26.880722045898438, "global_step": 462357, "epoch": 5570} {"train_loss": -27.4742431640625, "global_step": 462358, "epoch": 5570} {"train_loss": -27.243558883666992, "global_step": 462359, "epoch": 5570} {"train_loss": -27.1136474609375, "global_step": 462360, "epoch": 5570} {"train_loss": -27.08633804321289, "global_step": 462361, "epoch": 5570} {"train_loss": -27.213438034057617, "global_step": 462362, "epoch": 5570} {"train_loss": -27.413618087768555, "global_step": 462363, "epoch": 5570} {"train_loss": -27.074453353881836, "global_step": 462364, "epoch": 5570} {"train_loss": -27.119190216064453, "global_step": 462365, "epoch": 5570} {"train_loss": -27.26666831970215, "global_step": 462366, "epoch": 5570} {"train_loss": -27.462827682495117, "global_step": 462367, "epoch": 5570} {"train_loss": -27.12750816345215, "global_step": 462368, "epoch": 5570} {"train_loss": -27.388158798217773, "global_step": 462369, "epoch": 5570} {"train_loss": -27.411548614501953, "global_step": 462370, "epoch": 5570} {"train_loss": -27.35243797302246, "global_step": 462371, "epoch": 5570} {"train_loss": -26.973669052124023, "global_step": 462372, "epoch": 5570} {"train_loss": -27.165983200073242, "global_step": 462373, "epoch": 5570} {"train_loss": -27.731693267822266, "global_step": 462374, "epoch": 5570} {"train_loss": -27.220670700073242, "global_step": 462375, "epoch": 5570} {"train_loss": -27.377124786376953, "global_step": 462376, "epoch": 5570} {"train_loss": -27.187055587768555, "global_step": 462377, "epoch": 5570} {"train_loss": -27.271215438842773, "global_step": 462378, "epoch": 5570} {"train_loss": -27.171070098876953, "global_step": 462379, "epoch": 5570} {"train_loss": -27.297956466674805, "global_step": 462380, "epoch": 5570} {"train_loss": -27.055648803710938, "global_step": 462381, "epoch": 5570} {"train_loss": -26.706724166870117, "global_step": 462382, "epoch": 5570} {"train_loss": -26.60693359375, "global_step": 462383, "epoch": 5570} {"train_loss": -27.0594482421875, "global_step": 462384, "epoch": 5570} {"train_loss": -27.58274269104004, "global_step": 462385, "epoch": 5570} {"train_loss": -26.518299102783203, "global_step": 462386, "epoch": 5570} {"train_loss": -26.6849308013916, "global_step": 462387, "epoch": 5570} {"train_loss": -26.797910690307617, "global_step": 462388, "epoch": 5570} {"train_loss": -26.996723175048828, "global_step": 462389, "epoch": 5570} {"train_loss": -27.1109619140625, "global_step": 462390, "epoch": 5570} {"train_loss": -27.1450138092041, "global_step": 462391, "epoch": 5570} {"train_loss": -26.935317947203856, "global_step": 462392, "epoch": 5570, "val_loss": 6508830.0} {"train_loss": -26.521289825439453, "global_step": 462393, "epoch": 5571} {"train_loss": -25.92282485961914, "global_step": 462394, "epoch": 5571} {"train_loss": -26.620431900024414, "global_step": 462395, "epoch": 5571} {"train_loss": -26.856164932250977, "global_step": 462396, "epoch": 5571} {"train_loss": -26.587726593017578, "global_step": 462397, "epoch": 5571} {"train_loss": -26.886157989501953, "global_step": 462398, "epoch": 5571} {"train_loss": -26.556028366088867, "global_step": 462399, "epoch": 5571} {"train_loss": -27.067718505859375, "global_step": 462400, "epoch": 5571} {"train_loss": -26.6337833404541, "global_step": 462401, "epoch": 5571} {"train_loss": -26.7220516204834, "global_step": 462402, "epoch": 5571} {"train_loss": -27.230947494506836, "global_step": 462403, "epoch": 5571} {"train_loss": -26.623260498046875, "global_step": 462404, "epoch": 5571} {"train_loss": -26.97662353515625, "global_step": 462405, "epoch": 5571} {"train_loss": -26.9958553314209, "global_step": 462406, "epoch": 5571} {"train_loss": -26.92035484313965, "global_step": 462407, "epoch": 5571} {"train_loss": -26.99427604675293, "global_step": 462408, "epoch": 5571} {"train_loss": -26.962900161743164, "global_step": 462409, "epoch": 5571} {"train_loss": -26.99853515625, "global_step": 462410, "epoch": 5571} {"train_loss": -27.268346786499023, "global_step": 462411, "epoch": 5571} {"train_loss": -27.297765731811523, "global_step": 462412, "epoch": 5571} {"train_loss": -26.980504989624023, "global_step": 462413, "epoch": 5571} {"train_loss": -26.99922752380371, "global_step": 462414, "epoch": 5571} {"train_loss": -26.985382080078125, "global_step": 462415, "epoch": 5571} {"train_loss": -26.986785888671875, "global_step": 462416, "epoch": 5571} {"train_loss": -26.938276290893555, "global_step": 462417, "epoch": 5571} {"train_loss": -27.55312156677246, "global_step": 462418, "epoch": 5571} {"train_loss": -26.506988525390625, "global_step": 462419, "epoch": 5571} {"train_loss": -27.1694393157959, "global_step": 462420, "epoch": 5571} {"train_loss": -27.132909774780273, "global_step": 462421, "epoch": 5571} {"train_loss": -27.453771591186523, "global_step": 462422, "epoch": 5571} {"train_loss": -27.508087158203125, "global_step": 462423, "epoch": 5571} {"train_loss": -27.258651733398438, "global_step": 462424, "epoch": 5571} {"train_loss": -27.25214958190918, "global_step": 462425, "epoch": 5571} {"train_loss": -27.236469268798828, "global_step": 462426, "epoch": 5571} {"train_loss": -27.278076171875, "global_step": 462427, "epoch": 5571} {"train_loss": -27.01079750061035, "global_step": 462428, "epoch": 5571} {"train_loss": -27.108346939086914, "global_step": 462429, "epoch": 5571} {"train_loss": -27.316564559936523, "global_step": 462430, "epoch": 5571} {"train_loss": -27.107425689697266, "global_step": 462431, "epoch": 5571} {"train_loss": -26.937671661376953, "global_step": 462432, "epoch": 5571} {"train_loss": -27.4172306060791, "global_step": 462433, "epoch": 5571} {"train_loss": -27.569263458251953, "global_step": 462434, "epoch": 5571} {"train_loss": -27.530902862548828, "global_step": 462435, "epoch": 5571} {"train_loss": -27.365253448486328, "global_step": 462436, "epoch": 5571} {"train_loss": -27.033771514892578, "global_step": 462437, "epoch": 5571} {"train_loss": -27.32571792602539, "global_step": 462438, "epoch": 5571} {"train_loss": -27.369287490844727, "global_step": 462439, "epoch": 5571} {"train_loss": -27.206933975219727, "global_step": 462440, "epoch": 5571} {"train_loss": -27.018117904663086, "global_step": 462441, "epoch": 5571} {"train_loss": -27.413415908813477, "global_step": 462442, "epoch": 5571} {"train_loss": -27.651565551757812, "global_step": 462443, "epoch": 5571} {"train_loss": -27.246826171875, "global_step": 462444, "epoch": 5571} {"train_loss": -27.070556640625, "global_step": 462445, "epoch": 5571} {"train_loss": -27.37379264831543, "global_step": 462446, "epoch": 5571} {"train_loss": -27.409765243530273, "global_step": 462447, "epoch": 5571} {"train_loss": -27.116724014282227, "global_step": 462448, "epoch": 5571} {"train_loss": -27.17626953125, "global_step": 462449, "epoch": 5571} {"train_loss": -27.365671157836914, "global_step": 462450, "epoch": 5571} {"train_loss": -27.105213165283203, "global_step": 462451, "epoch": 5571} {"train_loss": -27.0659236907959, "global_step": 462452, "epoch": 5571} {"train_loss": -27.418554306030273, "global_step": 462453, "epoch": 5571} {"train_loss": -27.228891372680664, "global_step": 462454, "epoch": 5571} {"train_loss": -27.242481231689453, "global_step": 462455, "epoch": 5571} {"train_loss": -27.4450626373291, "global_step": 462456, "epoch": 5571} {"train_loss": -27.288745880126953, "global_step": 462457, "epoch": 5571} {"train_loss": -27.412006378173828, "global_step": 462458, "epoch": 5571} {"train_loss": -27.150684356689453, "global_step": 462459, "epoch": 5571} {"train_loss": -27.29282569885254, "global_step": 462460, "epoch": 5571} {"train_loss": -26.945459365844727, "global_step": 462461, "epoch": 5571} {"train_loss": -27.250263214111328, "global_step": 462462, "epoch": 5571} {"train_loss": -27.385101318359375, "global_step": 462463, "epoch": 5571} {"train_loss": -26.88802146911621, "global_step": 462464, "epoch": 5571} {"train_loss": -27.396299362182617, "global_step": 462465, "epoch": 5571} {"train_loss": -27.091663360595703, "global_step": 462466, "epoch": 5571} {"train_loss": -27.308319091796875, "global_step": 462467, "epoch": 5571} {"train_loss": -27.171951293945312, "global_step": 462468, "epoch": 5571} {"train_loss": -27.170995712280273, "global_step": 462469, "epoch": 5571} {"train_loss": -27.087142944335938, "global_step": 462470, "epoch": 5571} {"train_loss": -27.352161407470703, "global_step": 462471, "epoch": 5571} {"train_loss": -27.38515281677246, "global_step": 462472, "epoch": 5571} {"train_loss": -27.2376651763916, "global_step": 462473, "epoch": 5571} {"train_loss": -27.11945915222168, "global_step": 462474, "epoch": 5571} {"train_loss": -27.132285796016095, "global_step": 462475, "epoch": 5571, "val_loss": 6506995.0} {"train_loss": -26.301441192626953, "global_step": 462476, "epoch": 5572} {"train_loss": -25.144861221313477, "global_step": 462477, "epoch": 5572} {"train_loss": -24.9398193359375, "global_step": 462478, "epoch": 5572} {"train_loss": -25.444671630859375, "global_step": 462479, "epoch": 5572} {"train_loss": -25.733585357666016, "global_step": 462480, "epoch": 5572} {"train_loss": -25.576810836791992, "global_step": 462481, "epoch": 5572} {"train_loss": -26.22884178161621, "global_step": 462482, "epoch": 5572} {"train_loss": -26.389362335205078, "global_step": 462483, "epoch": 5572} {"train_loss": -26.597585678100586, "global_step": 462484, "epoch": 5572} {"train_loss": -26.67792320251465, "global_step": 462485, "epoch": 5572} {"train_loss": -26.502038955688477, "global_step": 462486, "epoch": 5572} {"train_loss": -26.69355583190918, "global_step": 462487, "epoch": 5572} {"train_loss": -25.979528427124023, "global_step": 462488, "epoch": 5572} {"train_loss": -26.59563636779785, "global_step": 462489, "epoch": 5572} {"train_loss": -26.39534568786621, "global_step": 462490, "epoch": 5572} {"train_loss": -26.382192611694336, "global_step": 462491, "epoch": 5572} {"train_loss": -26.60770034790039, "global_step": 462492, "epoch": 5572} {"train_loss": -26.81157875061035, "global_step": 462493, "epoch": 5572} {"train_loss": -26.90093994140625, "global_step": 462494, "epoch": 5572} {"train_loss": -26.82537841796875, "global_step": 462495, "epoch": 5572} {"train_loss": -26.546802520751953, "global_step": 462496, "epoch": 5572} {"train_loss": -26.702285766601562, "global_step": 462497, "epoch": 5572} {"train_loss": -26.9758243560791, "global_step": 462498, "epoch": 5572} {"train_loss": -26.868549346923828, "global_step": 462499, "epoch": 5572} {"train_loss": -26.83229637145996, "global_step": 462500, "epoch": 5572} {"train_loss": -27.1856746673584, "global_step": 462501, "epoch": 5572} {"train_loss": -26.91057777404785, "global_step": 462502, "epoch": 5572} {"train_loss": -26.841205596923828, "global_step": 462503, "epoch": 5572} {"train_loss": -26.88564109802246, "global_step": 462504, "epoch": 5572} {"train_loss": -26.746152877807617, "global_step": 462505, "epoch": 5572} {"train_loss": -27.026687622070312, "global_step": 462506, "epoch": 5572} {"train_loss": -26.625106811523438, "global_step": 462507, "epoch": 5572} {"train_loss": -26.8841609954834, "global_step": 462508, "epoch": 5572} {"train_loss": -27.57295036315918, "global_step": 462509, "epoch": 5572} {"train_loss": -27.057147979736328, "global_step": 462510, "epoch": 5572} {"train_loss": -27.06328773498535, "global_step": 462511, "epoch": 5572} {"train_loss": -27.35493278503418, "global_step": 462512, "epoch": 5572} {"train_loss": -27.2850284576416, "global_step": 462513, "epoch": 5572} {"train_loss": -26.882917404174805, "global_step": 462514, "epoch": 5572} {"train_loss": -26.90559959411621, "global_step": 462515, "epoch": 5572} {"train_loss": -27.09650993347168, "global_step": 462516, "epoch": 5572} {"train_loss": -26.870071411132812, "global_step": 462517, "epoch": 5572} {"train_loss": -27.15097427368164, "global_step": 462518, "epoch": 5572} {"train_loss": -27.320600509643555, "global_step": 462519, "epoch": 5572} {"train_loss": -27.326223373413086, "global_step": 462520, "epoch": 5572} {"train_loss": -27.329282760620117, "global_step": 462521, "epoch": 5572} {"train_loss": -27.465784072875977, "global_step": 462522, "epoch": 5572} {"train_loss": -27.14337158203125, "global_step": 462523, "epoch": 5572} {"train_loss": -27.422143936157227, "global_step": 462524, "epoch": 5572} {"train_loss": -27.208744049072266, "global_step": 462525, "epoch": 5572} {"train_loss": -27.06968116760254, "global_step": 462526, "epoch": 5572} {"train_loss": -26.832910537719727, "global_step": 462527, "epoch": 5572} {"train_loss": -27.325353622436523, "global_step": 462528, "epoch": 5572} {"train_loss": -27.1949520111084, "global_step": 462529, "epoch": 5572} {"train_loss": -27.26426124572754, "global_step": 462530, "epoch": 5572} {"train_loss": -27.144628524780273, "global_step": 462531, "epoch": 5572} {"train_loss": -27.197473526000977, "global_step": 462532, "epoch": 5572} {"train_loss": -27.286731719970703, "global_step": 462533, "epoch": 5572} {"train_loss": -27.456256866455078, "global_step": 462534, "epoch": 5572} {"train_loss": -27.015487670898438, "global_step": 462535, "epoch": 5572} {"train_loss": -27.42919921875, "global_step": 462536, "epoch": 5572} {"train_loss": -27.432113647460938, "global_step": 462537, "epoch": 5572} {"train_loss": -27.346067428588867, "global_step": 462538, "epoch": 5572} {"train_loss": -27.061376571655273, "global_step": 462539, "epoch": 5572} {"train_loss": -27.305158615112305, "global_step": 462540, "epoch": 5572} {"train_loss": -26.949121475219727, "global_step": 462541, "epoch": 5572} {"train_loss": -27.24297523498535, "global_step": 462542, "epoch": 5572} {"train_loss": -27.20503044128418, "global_step": 462543, "epoch": 5572} {"train_loss": -27.385290145874023, "global_step": 462544, "epoch": 5572} {"train_loss": -27.577392578125, "global_step": 462545, "epoch": 5572} {"train_loss": -26.87281608581543, "global_step": 462546, "epoch": 5572} {"train_loss": -27.313302993774414, "global_step": 462547, "epoch": 5572} {"train_loss": -27.650671005249023, "global_step": 462548, "epoch": 5572} {"train_loss": -27.23646354675293, "global_step": 462549, "epoch": 5572} {"train_loss": -27.03496742248535, "global_step": 462550, "epoch": 5572} {"train_loss": -27.441547393798828, "global_step": 462551, "epoch": 5572} {"train_loss": -27.403003692626953, "global_step": 462552, "epoch": 5572} {"train_loss": -27.329544067382812, "global_step": 462553, "epoch": 5572} {"train_loss": -27.1865234375, "global_step": 462554, "epoch": 5572} {"train_loss": -27.158681869506836, "global_step": 462555, "epoch": 5572} {"train_loss": -27.466581344604492, "global_step": 462556, "epoch": 5572} {"train_loss": -27.7166805267334, "global_step": 462557, "epoch": 5572} {"train_loss": -26.950727600649177, "global_step": 462558, "epoch": 5572, "val_loss": 6521522.0} {"train_loss": -26.764759063720703, "global_step": 462559, "epoch": 5573} {"train_loss": -25.446807861328125, "global_step": 462560, "epoch": 5573} {"train_loss": -25.094160079956055, "global_step": 462561, "epoch": 5573} {"train_loss": -24.365680694580078, "global_step": 462562, "epoch": 5573} {"train_loss": -25.617090225219727, "global_step": 462563, "epoch": 5573} {"train_loss": -26.2806339263916, "global_step": 462564, "epoch": 5573} {"train_loss": -26.0771541595459, "global_step": 462565, "epoch": 5573} {"train_loss": -26.576175689697266, "global_step": 462566, "epoch": 5573} {"train_loss": -25.873645782470703, "global_step": 462567, "epoch": 5573} {"train_loss": -26.11952018737793, "global_step": 462568, "epoch": 5573} {"train_loss": -26.320581436157227, "global_step": 462569, "epoch": 5573} {"train_loss": -26.28839683532715, "global_step": 462570, "epoch": 5573} {"train_loss": -26.625492095947266, "global_step": 462571, "epoch": 5573} {"train_loss": -26.667835235595703, "global_step": 462572, "epoch": 5573} {"train_loss": -26.428380966186523, "global_step": 462573, "epoch": 5573} {"train_loss": -26.891523361206055, "global_step": 462574, "epoch": 5573} {"train_loss": -26.9271183013916, "global_step": 462575, "epoch": 5573} {"train_loss": -26.62946128845215, "global_step": 462576, "epoch": 5573} {"train_loss": -26.941009521484375, "global_step": 462577, "epoch": 5573} {"train_loss": -26.884002685546875, "global_step": 462578, "epoch": 5573} {"train_loss": -26.858057022094727, "global_step": 462579, "epoch": 5573} {"train_loss": -27.241140365600586, "global_step": 462580, "epoch": 5573} {"train_loss": -27.0936222076416, "global_step": 462581, "epoch": 5573} {"train_loss": -26.805572509765625, "global_step": 462582, "epoch": 5573} {"train_loss": -26.919116973876953, "global_step": 462583, "epoch": 5573} {"train_loss": -27.365222930908203, "global_step": 462584, "epoch": 5573} {"train_loss": -27.240339279174805, "global_step": 462585, "epoch": 5573} {"train_loss": -27.150541305541992, "global_step": 462586, "epoch": 5573} {"train_loss": -26.856046676635742, "global_step": 462587, "epoch": 5573} {"train_loss": -27.184757232666016, "global_step": 462588, "epoch": 5573} {"train_loss": -26.970474243164062, "global_step": 462589, "epoch": 5573} {"train_loss": -27.0045223236084, "global_step": 462590, "epoch": 5573} {"train_loss": -27.364303588867188, "global_step": 462591, "epoch": 5573} {"train_loss": -26.908811569213867, "global_step": 462592, "epoch": 5573} {"train_loss": -27.0567569732666, "global_step": 462593, "epoch": 5573} {"train_loss": -27.10367774963379, "global_step": 462594, "epoch": 5573} {"train_loss": -26.824583053588867, "global_step": 462595, "epoch": 5573} {"train_loss": -27.462839126586914, "global_step": 462596, "epoch": 5573} {"train_loss": -27.172727584838867, "global_step": 462597, "epoch": 5573} {"train_loss": -27.350265502929688, "global_step": 462598, "epoch": 5573} {"train_loss": -27.285552978515625, "global_step": 462599, "epoch": 5573} {"train_loss": -27.257404327392578, "global_step": 462600, "epoch": 5573} {"train_loss": -27.364301681518555, "global_step": 462601, "epoch": 5573} {"train_loss": -27.081884384155273, "global_step": 462602, "epoch": 5573} {"train_loss": -27.203886032104492, "global_step": 462603, "epoch": 5573} {"train_loss": -27.49831199645996, "global_step": 462604, "epoch": 5573} {"train_loss": -27.123432159423828, "global_step": 462605, "epoch": 5573} {"train_loss": -27.511075973510742, "global_step": 462606, "epoch": 5573} {"train_loss": -27.353979110717773, "global_step": 462607, "epoch": 5573} {"train_loss": -27.751068115234375, "global_step": 462608, "epoch": 5573} {"train_loss": -27.1929931640625, "global_step": 462609, "epoch": 5573} {"train_loss": -27.1352596282959, "global_step": 462610, "epoch": 5573} {"train_loss": -26.91552734375, "global_step": 462611, "epoch": 5573} {"train_loss": -27.169015884399414, "global_step": 462612, "epoch": 5573} {"train_loss": -27.0262508392334, "global_step": 462613, "epoch": 5573} {"train_loss": -27.196508407592773, "global_step": 462614, "epoch": 5573} {"train_loss": -26.977880477905273, "global_step": 462615, "epoch": 5573} {"train_loss": -26.83905029296875, "global_step": 462616, "epoch": 5573} {"train_loss": -26.949771881103516, "global_step": 462617, "epoch": 5573} {"train_loss": -27.489057540893555, "global_step": 462618, "epoch": 5573} {"train_loss": -27.376413345336914, "global_step": 462619, "epoch": 5573} {"train_loss": -27.429529190063477, "global_step": 462620, "epoch": 5573} {"train_loss": -27.141904830932617, "global_step": 462621, "epoch": 5573} {"train_loss": -27.154714584350586, "global_step": 462622, "epoch": 5573} {"train_loss": -27.29828453063965, "global_step": 462623, "epoch": 5573} {"train_loss": -26.735883712768555, "global_step": 462624, "epoch": 5573} {"train_loss": -27.240039825439453, "global_step": 462625, "epoch": 5573} {"train_loss": -26.750534057617188, "global_step": 462626, "epoch": 5573} {"train_loss": -26.74006462097168, "global_step": 462627, "epoch": 5573} {"train_loss": -27.22764015197754, "global_step": 462628, "epoch": 5573} {"train_loss": -27.311132431030273, "global_step": 462629, "epoch": 5573} {"train_loss": -27.087726593017578, "global_step": 462630, "epoch": 5573} {"train_loss": -27.56635856628418, "global_step": 462631, "epoch": 5573} {"train_loss": -27.051599502563477, "global_step": 462632, "epoch": 5573} {"train_loss": -27.259000778198242, "global_step": 462633, "epoch": 5573} {"train_loss": -27.088647842407227, "global_step": 462634, "epoch": 5573} {"train_loss": -27.181283950805664, "global_step": 462635, "epoch": 5573} {"train_loss": -26.997594833374023, "global_step": 462636, "epoch": 5573} {"train_loss": -27.671533584594727, "global_step": 462637, "epoch": 5573} {"train_loss": -27.34222984313965, "global_step": 462638, "epoch": 5573} {"train_loss": -27.28383445739746, "global_step": 462639, "epoch": 5573} {"train_loss": -26.831144332885742, "global_step": 462640, "epoch": 5573} {"train_loss": -26.928493132074195, "global_step": 462641, "epoch": 5573, "val_loss": 6474979.0} {"train_loss": -26.88324546813965, "global_step": 462642, "epoch": 5574} {"train_loss": -26.343053817749023, "global_step": 462643, "epoch": 5574} {"train_loss": -26.43545913696289, "global_step": 462644, "epoch": 5574} {"train_loss": -26.616559982299805, "global_step": 462645, "epoch": 5574} {"train_loss": -26.27924156188965, "global_step": 462646, "epoch": 5574} {"train_loss": -26.311811447143555, "global_step": 462647, "epoch": 5574} {"train_loss": -26.792572021484375, "global_step": 462648, "epoch": 5574} {"train_loss": -26.67791748046875, "global_step": 462649, "epoch": 5574} {"train_loss": -26.614709854125977, "global_step": 462650, "epoch": 5574} {"train_loss": -26.89821434020996, "global_step": 462651, "epoch": 5574} {"train_loss": -26.575489044189453, "global_step": 462652, "epoch": 5574} {"train_loss": -27.080698013305664, "global_step": 462653, "epoch": 5574} {"train_loss": -27.064374923706055, "global_step": 462654, "epoch": 5574} {"train_loss": -26.91791343688965, "global_step": 462655, "epoch": 5574} {"train_loss": -26.792667388916016, "global_step": 462656, "epoch": 5574} {"train_loss": -27.28925132751465, "global_step": 462657, "epoch": 5574} {"train_loss": -26.526660919189453, "global_step": 462658, "epoch": 5574} {"train_loss": -26.811737060546875, "global_step": 462659, "epoch": 5574} {"train_loss": -27.290891647338867, "global_step": 462660, "epoch": 5574} {"train_loss": -27.101682662963867, "global_step": 462661, "epoch": 5574} {"train_loss": -27.106664657592773, "global_step": 462662, "epoch": 5574} {"train_loss": -26.486164093017578, "global_step": 462663, "epoch": 5574} {"train_loss": -27.13455581665039, "global_step": 462664, "epoch": 5574} {"train_loss": -27.175031661987305, "global_step": 462665, "epoch": 5574} {"train_loss": -27.223129272460938, "global_step": 462666, "epoch": 5574} {"train_loss": -27.075347900390625, "global_step": 462667, "epoch": 5574} {"train_loss": -26.9773006439209, "global_step": 462668, "epoch": 5574} {"train_loss": -26.792760848999023, "global_step": 462669, "epoch": 5574} {"train_loss": -27.1308536529541, "global_step": 462670, "epoch": 5574} {"train_loss": -27.058340072631836, "global_step": 462671, "epoch": 5574} {"train_loss": -27.174448013305664, "global_step": 462672, "epoch": 5574} {"train_loss": -27.146997451782227, "global_step": 462673, "epoch": 5574} {"train_loss": -27.508426666259766, "global_step": 462674, "epoch": 5574} {"train_loss": -27.205463409423828, "global_step": 462675, "epoch": 5574} {"train_loss": -27.011585235595703, "global_step": 462676, "epoch": 5574} {"train_loss": -27.30560302734375, "global_step": 462677, "epoch": 5574} {"train_loss": -27.1767578125, "global_step": 462678, "epoch": 5574} {"train_loss": -27.221532821655273, "global_step": 462679, "epoch": 5574} {"train_loss": -26.915807723999023, "global_step": 462680, "epoch": 5574} {"train_loss": -27.186187744140625, "global_step": 462681, "epoch": 5574} {"train_loss": -27.208221435546875, "global_step": 462682, "epoch": 5574} {"train_loss": -27.40305519104004, "global_step": 462683, "epoch": 5574} {"train_loss": -27.189544677734375, "global_step": 462684, "epoch": 5574} {"train_loss": -26.91111183166504, "global_step": 462685, "epoch": 5574} {"train_loss": -27.259937286376953, "global_step": 462686, "epoch": 5574} {"train_loss": -27.26582908630371, "global_step": 462687, "epoch": 5574} {"train_loss": -27.094388961791992, "global_step": 462688, "epoch": 5574} {"train_loss": -27.549854278564453, "global_step": 462689, "epoch": 5574} {"train_loss": -27.110666275024414, "global_step": 462690, "epoch": 5574} {"train_loss": -27.306440353393555, "global_step": 462691, "epoch": 5574} {"train_loss": -27.250080108642578, "global_step": 462692, "epoch": 5574} {"train_loss": -27.428503036499023, "global_step": 462693, "epoch": 5574} {"train_loss": -27.249710083007812, "global_step": 462694, "epoch": 5574} {"train_loss": -27.805328369140625, "global_step": 462695, "epoch": 5574} {"train_loss": -27.14825439453125, "global_step": 462696, "epoch": 5574} {"train_loss": -27.152814865112305, "global_step": 462697, "epoch": 5574} {"train_loss": -27.046131134033203, "global_step": 462698, "epoch": 5574} {"train_loss": -27.16773796081543, "global_step": 462699, "epoch": 5574} {"train_loss": -27.62458610534668, "global_step": 462700, "epoch": 5574} {"train_loss": -27.145673751831055, "global_step": 462701, "epoch": 5574} {"train_loss": -26.677417755126953, "global_step": 462702, "epoch": 5574} {"train_loss": -27.410017013549805, "global_step": 462703, "epoch": 5574} {"train_loss": -26.831323623657227, "global_step": 462704, "epoch": 5574} {"train_loss": -26.89935302734375, "global_step": 462705, "epoch": 5574} {"train_loss": -26.704648971557617, "global_step": 462706, "epoch": 5574} {"train_loss": -26.740951538085938, "global_step": 462707, "epoch": 5574} {"train_loss": -26.723485946655273, "global_step": 462708, "epoch": 5574} {"train_loss": -27.04957389831543, "global_step": 462709, "epoch": 5574} {"train_loss": -26.960474014282227, "global_step": 462710, "epoch": 5574} {"train_loss": -26.820148468017578, "global_step": 462711, "epoch": 5574} {"train_loss": -26.79608726501465, "global_step": 462712, "epoch": 5574} {"train_loss": -26.837827682495117, "global_step": 462713, "epoch": 5574} {"train_loss": -27.15638542175293, "global_step": 462714, "epoch": 5574} {"train_loss": -27.227460861206055, "global_step": 462715, "epoch": 5574} {"train_loss": -27.089567184448242, "global_step": 462716, "epoch": 5574} {"train_loss": -26.788999557495117, "global_step": 462717, "epoch": 5574} {"train_loss": -27.394155502319336, "global_step": 462718, "epoch": 5574} {"train_loss": -26.302947998046875, "global_step": 462719, "epoch": 5574} {"train_loss": -26.66635513305664, "global_step": 462720, "epoch": 5574} {"train_loss": -26.932897567749023, "global_step": 462721, "epoch": 5574} {"train_loss": -26.70295524597168, "global_step": 462722, "epoch": 5574} {"train_loss": -26.828144073486328, "global_step": 462723, "epoch": 5574} {"train_loss": -27.003921141107398, "global_step": 462724, "epoch": 5574, "val_loss": 6624771.0} {"train_loss": -26.49519157409668, "global_step": 462725, "epoch": 5575} {"train_loss": -25.277286529541016, "global_step": 462726, "epoch": 5575} {"train_loss": -26.059141159057617, "global_step": 462727, "epoch": 5575} {"train_loss": -27.039297103881836, "global_step": 462728, "epoch": 5575} {"train_loss": -26.3193302154541, "global_step": 462729, "epoch": 5575} {"train_loss": -26.11187171936035, "global_step": 462730, "epoch": 5575} {"train_loss": -27.10276222229004, "global_step": 462731, "epoch": 5575} {"train_loss": -26.145368576049805, "global_step": 462732, "epoch": 5575} {"train_loss": -26.8596248626709, "global_step": 462733, "epoch": 5575} {"train_loss": -27.050445556640625, "global_step": 462734, "epoch": 5575} {"train_loss": -26.603256225585938, "global_step": 462735, "epoch": 5575} {"train_loss": -26.639806747436523, "global_step": 462736, "epoch": 5575} {"train_loss": -27.150205612182617, "global_step": 462737, "epoch": 5575} {"train_loss": -27.0229434967041, "global_step": 462738, "epoch": 5575} {"train_loss": -26.778034210205078, "global_step": 462739, "epoch": 5575} {"train_loss": -26.578622817993164, "global_step": 462740, "epoch": 5575} {"train_loss": -26.969762802124023, "global_step": 462741, "epoch": 5575} {"train_loss": -26.940820693969727, "global_step": 462742, "epoch": 5575} {"train_loss": -27.35004234313965, "global_step": 462743, "epoch": 5575} {"train_loss": -26.7504825592041, "global_step": 462744, "epoch": 5575} {"train_loss": -27.017187118530273, "global_step": 462745, "epoch": 5575} {"train_loss": -27.058521270751953, "global_step": 462746, "epoch": 5575} {"train_loss": -27.256467819213867, "global_step": 462747, "epoch": 5575} {"train_loss": -27.187597274780273, "global_step": 462748, "epoch": 5575} {"train_loss": -27.326932907104492, "global_step": 462749, "epoch": 5575} {"train_loss": -26.828840255737305, "global_step": 462750, "epoch": 5575} {"train_loss": -26.948278427124023, "global_step": 462751, "epoch": 5575} {"train_loss": -27.249616622924805, "global_step": 462752, "epoch": 5575} {"train_loss": -27.189184188842773, "global_step": 462753, "epoch": 5575} {"train_loss": -26.925207138061523, "global_step": 462754, "epoch": 5575} {"train_loss": -27.237234115600586, "global_step": 462755, "epoch": 5575} {"train_loss": -27.069549560546875, "global_step": 462756, "epoch": 5575} {"train_loss": -27.547992706298828, "global_step": 462757, "epoch": 5575} {"train_loss": -27.365787506103516, "global_step": 462758, "epoch": 5575} {"train_loss": -27.06050682067871, "global_step": 462759, "epoch": 5575} {"train_loss": -27.007368087768555, "global_step": 462760, "epoch": 5575} {"train_loss": -27.26690673828125, "global_step": 462761, "epoch": 5575} {"train_loss": -27.317138671875, "global_step": 462762, "epoch": 5575} {"train_loss": -27.3472843170166, "global_step": 462763, "epoch": 5575} {"train_loss": -27.334753036499023, "global_step": 462764, "epoch": 5575} {"train_loss": -27.271203994750977, "global_step": 462765, "epoch": 5575} {"train_loss": -27.445758819580078, "global_step": 462766, "epoch": 5575} {"train_loss": -26.980621337890625, "global_step": 462767, "epoch": 5575} {"train_loss": -27.17661476135254, "global_step": 462768, "epoch": 5575} {"train_loss": -26.861785888671875, "global_step": 462769, "epoch": 5575} {"train_loss": -26.94318962097168, "global_step": 462770, "epoch": 5575} {"train_loss": -27.216474533081055, "global_step": 462771, "epoch": 5575} {"train_loss": -27.35499382019043, "global_step": 462772, "epoch": 5575} {"train_loss": -26.5145206451416, "global_step": 462773, "epoch": 5575} {"train_loss": -27.108701705932617, "global_step": 462774, "epoch": 5575} {"train_loss": -26.87396812438965, "global_step": 462775, "epoch": 5575} {"train_loss": -27.390058517456055, "global_step": 462776, "epoch": 5575} {"train_loss": -26.957685470581055, "global_step": 462777, "epoch": 5575} {"train_loss": -27.159208297729492, "global_step": 462778, "epoch": 5575} {"train_loss": -26.8464298248291, "global_step": 462779, "epoch": 5575} {"train_loss": -26.940275192260742, "global_step": 462780, "epoch": 5575} {"train_loss": -27.254993438720703, "global_step": 462781, "epoch": 5575} {"train_loss": -27.236846923828125, "global_step": 462782, "epoch": 5575} {"train_loss": -26.898656845092773, "global_step": 462783, "epoch": 5575} {"train_loss": -27.4111328125, "global_step": 462784, "epoch": 5575} {"train_loss": -27.005176544189453, "global_step": 462785, "epoch": 5575} {"train_loss": -27.06720542907715, "global_step": 462786, "epoch": 5575} {"train_loss": -27.13368034362793, "global_step": 462787, "epoch": 5575} {"train_loss": -27.26911735534668, "global_step": 462788, "epoch": 5575} {"train_loss": -26.845752716064453, "global_step": 462789, "epoch": 5575} {"train_loss": -27.591283798217773, "global_step": 462790, "epoch": 5575} {"train_loss": -27.129602432250977, "global_step": 462791, "epoch": 5575} {"train_loss": -27.596698760986328, "global_step": 462792, "epoch": 5575} {"train_loss": -27.172260284423828, "global_step": 462793, "epoch": 5575} {"train_loss": -27.321409225463867, "global_step": 462794, "epoch": 5575} {"train_loss": -27.143884658813477, "global_step": 462795, "epoch": 5575} {"train_loss": -27.269887924194336, "global_step": 462796, "epoch": 5575} {"train_loss": -27.366107940673828, "global_step": 462797, "epoch": 5575} {"train_loss": -27.017072677612305, "global_step": 462798, "epoch": 5575} {"train_loss": -27.112812042236328, "global_step": 462799, "epoch": 5575} {"train_loss": -27.232481002807617, "global_step": 462800, "epoch": 5575} {"train_loss": -27.06076431274414, "global_step": 462801, "epoch": 5575} {"train_loss": -27.28092384338379, "global_step": 462802, "epoch": 5575} {"train_loss": -27.022348403930664, "global_step": 462803, "epoch": 5575} {"train_loss": -27.225439071655273, "global_step": 462804, "epoch": 5575} {"train_loss": -27.30791664123535, "global_step": 462805, "epoch": 5575} {"train_loss": -26.985082626342773, "global_step": 462806, "epoch": 5575} {"train_loss": -27.056028756750635, "global_step": 462807, "epoch": 5575, "val_loss": 6556109.0} {"train_loss": -27.268232345581055, "global_step": 462808, "epoch": 5576} {"train_loss": -27.002155303955078, "global_step": 462809, "epoch": 5576} {"train_loss": -26.987802505493164, "global_step": 462810, "epoch": 5576} {"train_loss": -27.365192413330078, "global_step": 462811, "epoch": 5576} {"train_loss": -26.91547203063965, "global_step": 462812, "epoch": 5576} {"train_loss": -26.319456100463867, "global_step": 462813, "epoch": 5576} {"train_loss": -26.42923927307129, "global_step": 462814, "epoch": 5576} {"train_loss": -26.432636260986328, "global_step": 462815, "epoch": 5576} {"train_loss": -26.278440475463867, "global_step": 462816, "epoch": 5576} {"train_loss": -26.914554595947266, "global_step": 462817, "epoch": 5576} {"train_loss": -26.80000114440918, "global_step": 462818, "epoch": 5576} {"train_loss": -26.530288696289062, "global_step": 462819, "epoch": 5576} {"train_loss": -26.8410701751709, "global_step": 462820, "epoch": 5576} {"train_loss": -26.800907135009766, "global_step": 462821, "epoch": 5576} {"train_loss": -27.02642822265625, "global_step": 462822, "epoch": 5576} {"train_loss": -26.71756362915039, "global_step": 462823, "epoch": 5576} {"train_loss": -27.3929500579834, "global_step": 462824, "epoch": 5576} {"train_loss": -26.545948028564453, "global_step": 462825, "epoch": 5576} {"train_loss": -27.494550704956055, "global_step": 462826, "epoch": 5576} {"train_loss": -26.95781898498535, "global_step": 462827, "epoch": 5576} {"train_loss": -27.319238662719727, "global_step": 462828, "epoch": 5576} {"train_loss": -26.861331939697266, "global_step": 462829, "epoch": 5576} {"train_loss": -26.9473876953125, "global_step": 462830, "epoch": 5576} {"train_loss": -27.373876571655273, "global_step": 462831, "epoch": 5576} {"train_loss": -26.592254638671875, "global_step": 462832, "epoch": 5576} {"train_loss": -26.974721908569336, "global_step": 462833, "epoch": 5576} {"train_loss": -27.21528434753418, "global_step": 462834, "epoch": 5576} {"train_loss": -27.11191177368164, "global_step": 462835, "epoch": 5576} {"train_loss": -27.10100746154785, "global_step": 462836, "epoch": 5576} {"train_loss": -26.62354850769043, "global_step": 462837, "epoch": 5576} {"train_loss": -26.98435401916504, "global_step": 462838, "epoch": 5576} {"train_loss": -26.996999740600586, "global_step": 462839, "epoch": 5576} {"train_loss": -26.768146514892578, "global_step": 462840, "epoch": 5576} {"train_loss": -27.08957290649414, "global_step": 462841, "epoch": 5576} {"train_loss": -27.5470027923584, "global_step": 462842, "epoch": 5576} {"train_loss": -26.993040084838867, "global_step": 462843, "epoch": 5576} {"train_loss": -26.889087677001953, "global_step": 462844, "epoch": 5576} {"train_loss": -27.074813842773438, "global_step": 462845, "epoch": 5576} {"train_loss": -27.757543563842773, "global_step": 462846, "epoch": 5576} {"train_loss": -27.142248153686523, "global_step": 462847, "epoch": 5576} {"train_loss": -26.987598419189453, "global_step": 462848, "epoch": 5576} {"train_loss": -27.327634811401367, "global_step": 462849, "epoch": 5576} {"train_loss": -27.046106338500977, "global_step": 462850, "epoch": 5576} {"train_loss": -27.5297908782959, "global_step": 462851, "epoch": 5576} {"train_loss": -27.002561569213867, "global_step": 462852, "epoch": 5576} {"train_loss": -26.988422393798828, "global_step": 462853, "epoch": 5576} {"train_loss": -27.499231338500977, "global_step": 462854, "epoch": 5576} {"train_loss": -27.299341201782227, "global_step": 462855, "epoch": 5576} {"train_loss": -27.049413681030273, "global_step": 462856, "epoch": 5576} {"train_loss": -27.015308380126953, "global_step": 462857, "epoch": 5576} {"train_loss": -27.648244857788086, "global_step": 462858, "epoch": 5576} {"train_loss": -27.263879776000977, "global_step": 462859, "epoch": 5576} {"train_loss": -27.32781410217285, "global_step": 462860, "epoch": 5576} {"train_loss": -27.065176010131836, "global_step": 462861, "epoch": 5576} {"train_loss": -26.95111656188965, "global_step": 462862, "epoch": 5576} {"train_loss": -27.163297653198242, "global_step": 462863, "epoch": 5576} {"train_loss": -27.361799240112305, "global_step": 462864, "epoch": 5576} {"train_loss": -27.13222312927246, "global_step": 462865, "epoch": 5576} {"train_loss": -27.098230361938477, "global_step": 462866, "epoch": 5576} {"train_loss": -27.356435775756836, "global_step": 462867, "epoch": 5576} {"train_loss": -27.104455947875977, "global_step": 462868, "epoch": 5576} {"train_loss": -27.229211807250977, "global_step": 462869, "epoch": 5576} {"train_loss": -27.132129669189453, "global_step": 462870, "epoch": 5576} {"train_loss": -26.96351432800293, "global_step": 462871, "epoch": 5576} {"train_loss": -27.242389678955078, "global_step": 462872, "epoch": 5576} {"train_loss": -27.03546714782715, "global_step": 462873, "epoch": 5576} {"train_loss": -27.050764083862305, "global_step": 462874, "epoch": 5576} {"train_loss": -26.629430770874023, "global_step": 462875, "epoch": 5576} {"train_loss": -27.18207359313965, "global_step": 462876, "epoch": 5576} {"train_loss": -26.649322509765625, "global_step": 462877, "epoch": 5576} {"train_loss": -26.823383331298828, "global_step": 462878, "epoch": 5576} {"train_loss": -26.83656883239746, "global_step": 462879, "epoch": 5576} {"train_loss": -26.945999145507812, "global_step": 462880, "epoch": 5576} {"train_loss": -27.31528663635254, "global_step": 462881, "epoch": 5576} {"train_loss": -27.482513427734375, "global_step": 462882, "epoch": 5576} {"train_loss": -27.175222396850586, "global_step": 462883, "epoch": 5576} {"train_loss": -27.244754791259766, "global_step": 462884, "epoch": 5576} {"train_loss": -27.460601806640625, "global_step": 462885, "epoch": 5576} {"train_loss": -26.958032608032227, "global_step": 462886, "epoch": 5576} {"train_loss": -26.8167724609375, "global_step": 462887, "epoch": 5576} {"train_loss": -26.997400283813477, "global_step": 462888, "epoch": 5576} {"train_loss": -27.243106842041016, "global_step": 462889, "epoch": 5576} {"train_loss": -27.044954552707903, "global_step": 462890, "epoch": 5576, "val_loss": 6566670.0} {"train_loss": -26.132104873657227, "global_step": 462891, "epoch": 5577} {"train_loss": -25.557607650756836, "global_step": 462892, "epoch": 5577} {"train_loss": -25.82254981994629, "global_step": 462893, "epoch": 5577} {"train_loss": -25.91172218322754, "global_step": 462894, "epoch": 5577} {"train_loss": -25.667591094970703, "global_step": 462895, "epoch": 5577} {"train_loss": -26.2071475982666, "global_step": 462896, "epoch": 5577} {"train_loss": -25.87333106994629, "global_step": 462897, "epoch": 5577} {"train_loss": -26.1181697845459, "global_step": 462898, "epoch": 5577} {"train_loss": -26.060644149780273, "global_step": 462899, "epoch": 5577} {"train_loss": -25.34714698791504, "global_step": 462900, "epoch": 5577} {"train_loss": -26.543066024780273, "global_step": 462901, "epoch": 5577} {"train_loss": -26.22003746032715, "global_step": 462902, "epoch": 5577} {"train_loss": -26.39048194885254, "global_step": 462903, "epoch": 5577} {"train_loss": -26.226003646850586, "global_step": 462904, "epoch": 5577} {"train_loss": -26.46002769470215, "global_step": 462905, "epoch": 5577} {"train_loss": -26.50575065612793, "global_step": 462906, "epoch": 5577} {"train_loss": -26.546640396118164, "global_step": 462907, "epoch": 5577} {"train_loss": -26.379810333251953, "global_step": 462908, "epoch": 5577} {"train_loss": -26.6346492767334, "global_step": 462909, "epoch": 5577} {"train_loss": -26.5645751953125, "global_step": 462910, "epoch": 5577} {"train_loss": -26.470855712890625, "global_step": 462911, "epoch": 5577} {"train_loss": -26.86494255065918, "global_step": 462912, "epoch": 5577} {"train_loss": -26.764408111572266, "global_step": 462913, "epoch": 5577} {"train_loss": -26.70747947692871, "global_step": 462914, "epoch": 5577} {"train_loss": -26.907302856445312, "global_step": 462915, "epoch": 5577} {"train_loss": -26.695785522460938, "global_step": 462916, "epoch": 5577} {"train_loss": -26.777387619018555, "global_step": 462917, "epoch": 5577} {"train_loss": -26.69190788269043, "global_step": 462918, "epoch": 5577} {"train_loss": -26.880964279174805, "global_step": 462919, "epoch": 5577} {"train_loss": -26.77369499206543, "global_step": 462920, "epoch": 5577} {"train_loss": -26.973066329956055, "global_step": 462921, "epoch": 5577} {"train_loss": -27.096710205078125, "global_step": 462922, "epoch": 5577} {"train_loss": -27.084503173828125, "global_step": 462923, "epoch": 5577} {"train_loss": -27.03323745727539, "global_step": 462924, "epoch": 5577} {"train_loss": -26.644498825073242, "global_step": 462925, "epoch": 5577} {"train_loss": -27.0599422454834, "global_step": 462926, "epoch": 5577} {"train_loss": -26.887067794799805, "global_step": 462927, "epoch": 5577} {"train_loss": -26.860565185546875, "global_step": 462928, "epoch": 5577} {"train_loss": -26.80278968811035, "global_step": 462929, "epoch": 5577} {"train_loss": -26.73394775390625, "global_step": 462930, "epoch": 5577} {"train_loss": -27.190353393554688, "global_step": 462931, "epoch": 5577} {"train_loss": -27.288455963134766, "global_step": 462932, "epoch": 5577} {"train_loss": -27.007648468017578, "global_step": 462933, "epoch": 5577} {"train_loss": -27.1474552154541, "global_step": 462934, "epoch": 5577} {"train_loss": -26.634811401367188, "global_step": 462935, "epoch": 5577} {"train_loss": -27.035078048706055, "global_step": 462936, "epoch": 5577} {"train_loss": -27.044103622436523, "global_step": 462937, "epoch": 5577} {"train_loss": -27.087188720703125, "global_step": 462938, "epoch": 5577} {"train_loss": -26.9523868560791, "global_step": 462939, "epoch": 5577} {"train_loss": -27.156309127807617, "global_step": 462940, "epoch": 5577} {"train_loss": -27.40212059020996, "global_step": 462941, "epoch": 5577} {"train_loss": -27.350095748901367, "global_step": 462942, "epoch": 5577} {"train_loss": -27.18824577331543, "global_step": 462943, "epoch": 5577} {"train_loss": -27.561298370361328, "global_step": 462944, "epoch": 5577} {"train_loss": -27.353240966796875, "global_step": 462945, "epoch": 5577} {"train_loss": -27.16107749938965, "global_step": 462946, "epoch": 5577} {"train_loss": -27.027786254882812, "global_step": 462947, "epoch": 5577} {"train_loss": -27.28922462463379, "global_step": 462948, "epoch": 5577} {"train_loss": -27.867544174194336, "global_step": 462949, "epoch": 5577} {"train_loss": -27.1355037689209, "global_step": 462950, "epoch": 5577} {"train_loss": -27.430423736572266, "global_step": 462951, "epoch": 5577} {"train_loss": -27.035364151000977, "global_step": 462952, "epoch": 5577} {"train_loss": -27.803552627563477, "global_step": 462953, "epoch": 5577} {"train_loss": -26.786365509033203, "global_step": 462954, "epoch": 5577} {"train_loss": -27.345914840698242, "global_step": 462955, "epoch": 5577} {"train_loss": -26.98879051208496, "global_step": 462956, "epoch": 5577} {"train_loss": -27.182836532592773, "global_step": 462957, "epoch": 5577} {"train_loss": -26.641483306884766, "global_step": 462958, "epoch": 5577} {"train_loss": -26.282629013061523, "global_step": 462959, "epoch": 5577} {"train_loss": -26.81585693359375, "global_step": 462960, "epoch": 5577} {"train_loss": -26.549665451049805, "global_step": 462961, "epoch": 5577} {"train_loss": -27.20484733581543, "global_step": 462962, "epoch": 5577} {"train_loss": -26.955530166625977, "global_step": 462963, "epoch": 5577} {"train_loss": -27.158493041992188, "global_step": 462964, "epoch": 5577} {"train_loss": -26.916610717773438, "global_step": 462965, "epoch": 5577} {"train_loss": -26.681537628173828, "global_step": 462966, "epoch": 5577} {"train_loss": -27.524982452392578, "global_step": 462967, "epoch": 5577} {"train_loss": -27.24216651916504, "global_step": 462968, "epoch": 5577} {"train_loss": -27.1856746673584, "global_step": 462969, "epoch": 5577} {"train_loss": -27.070907592773438, "global_step": 462970, "epoch": 5577} {"train_loss": -26.883697509765625, "global_step": 462971, "epoch": 5577} {"train_loss": -26.956113815307617, "global_step": 462972, "epoch": 5577} {"train_loss": -26.79250271349068, "global_step": 462973, "epoch": 5577, "val_loss": 6503129.5} {"train_loss": -25.386137008666992, "global_step": 462974, "epoch": 5578} {"train_loss": -25.993703842163086, "global_step": 462975, "epoch": 5578} {"train_loss": -25.82309341430664, "global_step": 462976, "epoch": 5578} {"train_loss": -25.12286949157715, "global_step": 462977, "epoch": 5578} {"train_loss": -26.082555770874023, "global_step": 462978, "epoch": 5578} {"train_loss": -25.276477813720703, "global_step": 462979, "epoch": 5578} {"train_loss": -26.36091423034668, "global_step": 462980, "epoch": 5578} {"train_loss": -25.545011520385742, "global_step": 462981, "epoch": 5578} {"train_loss": -26.29573631286621, "global_step": 462982, "epoch": 5578} {"train_loss": -26.19241714477539, "global_step": 462983, "epoch": 5578} {"train_loss": -26.220783233642578, "global_step": 462984, "epoch": 5578} {"train_loss": -26.38502311706543, "global_step": 462985, "epoch": 5578} {"train_loss": -26.05120849609375, "global_step": 462986, "epoch": 5578} {"train_loss": -26.4456729888916, "global_step": 462987, "epoch": 5578} {"train_loss": -26.16773796081543, "global_step": 462988, "epoch": 5578} {"train_loss": -26.57159996032715, "global_step": 462989, "epoch": 5578} {"train_loss": -26.711332321166992, "global_step": 462990, "epoch": 5578} {"train_loss": -26.342313766479492, "global_step": 462991, "epoch": 5578} {"train_loss": -26.487873077392578, "global_step": 462992, "epoch": 5578} {"train_loss": -26.482452392578125, "global_step": 462993, "epoch": 5578} {"train_loss": -26.753366470336914, "global_step": 462994, "epoch": 5578} {"train_loss": -26.372608184814453, "global_step": 462995, "epoch": 5578} {"train_loss": -26.756195068359375, "global_step": 462996, "epoch": 5578} {"train_loss": -26.812650680541992, "global_step": 462997, "epoch": 5578} {"train_loss": -27.01041030883789, "global_step": 462998, "epoch": 5578} {"train_loss": -26.88785171508789, "global_step": 462999, "epoch": 5578} {"train_loss": -27.008392333984375, "global_step": 463000, "epoch": 5578} {"train_loss": -26.524335861206055, "global_step": 463001, "epoch": 5578} {"train_loss": -26.797943115234375, "global_step": 463002, "epoch": 5578} {"train_loss": -26.8406925201416, "global_step": 463003, "epoch": 5578} {"train_loss": -26.845294952392578, "global_step": 463004, "epoch": 5578} {"train_loss": -26.92852210998535, "global_step": 463005, "epoch": 5578} {"train_loss": -26.650070190429688, "global_step": 463006, "epoch": 5578} {"train_loss": -26.678756713867188, "global_step": 463007, "epoch": 5578} {"train_loss": -26.58782386779785, "global_step": 463008, "epoch": 5578} {"train_loss": -26.93995475769043, "global_step": 463009, "epoch": 5578} {"train_loss": -26.846933364868164, "global_step": 463010, "epoch": 5578} {"train_loss": -26.755252838134766, "global_step": 463011, "epoch": 5578} {"train_loss": -27.05901527404785, "global_step": 463012, "epoch": 5578} {"train_loss": -27.0585880279541, "global_step": 463013, "epoch": 5578} {"train_loss": -27.423364639282227, "global_step": 463014, "epoch": 5578} {"train_loss": -26.726913452148438, "global_step": 463015, "epoch": 5578} {"train_loss": -27.007923126220703, "global_step": 463016, "epoch": 5578} {"train_loss": -27.021413803100586, "global_step": 463017, "epoch": 5578} {"train_loss": -27.252639770507812, "global_step": 463018, "epoch": 5578} {"train_loss": -27.037397384643555, "global_step": 463019, "epoch": 5578} {"train_loss": -26.837377548217773, "global_step": 463020, "epoch": 5578} {"train_loss": -27.063446044921875, "global_step": 463021, "epoch": 5578} {"train_loss": -26.994413375854492, "global_step": 463022, "epoch": 5578} {"train_loss": -27.351398468017578, "global_step": 463023, "epoch": 5578} {"train_loss": -27.31061363220215, "global_step": 463024, "epoch": 5578} {"train_loss": -27.43179702758789, "global_step": 463025, "epoch": 5578} {"train_loss": -27.121763229370117, "global_step": 463026, "epoch": 5578} {"train_loss": -27.2396240234375, "global_step": 463027, "epoch": 5578} {"train_loss": -27.5831241607666, "global_step": 463028, "epoch": 5578} {"train_loss": -27.514179229736328, "global_step": 463029, "epoch": 5578} {"train_loss": -27.03541374206543, "global_step": 463030, "epoch": 5578} {"train_loss": -27.095426559448242, "global_step": 463031, "epoch": 5578} {"train_loss": -27.143402099609375, "global_step": 463032, "epoch": 5578} {"train_loss": -27.1591796875, "global_step": 463033, "epoch": 5578} {"train_loss": -27.0582218170166, "global_step": 463034, "epoch": 5578} {"train_loss": -27.279205322265625, "global_step": 463035, "epoch": 5578} {"train_loss": -27.035736083984375, "global_step": 463036, "epoch": 5578} {"train_loss": -27.000263214111328, "global_step": 463037, "epoch": 5578} {"train_loss": -27.32257652282715, "global_step": 463038, "epoch": 5578} {"train_loss": -27.761655807495117, "global_step": 463039, "epoch": 5578} {"train_loss": -27.14609718322754, "global_step": 463040, "epoch": 5578} {"train_loss": -27.39483070373535, "global_step": 463041, "epoch": 5578} {"train_loss": -26.883197784423828, "global_step": 463042, "epoch": 5578} {"train_loss": -27.4841251373291, "global_step": 463043, "epoch": 5578} {"train_loss": -27.43231201171875, "global_step": 463044, "epoch": 5578} {"train_loss": -27.3352108001709, "global_step": 463045, "epoch": 5578} {"train_loss": -27.169172286987305, "global_step": 463046, "epoch": 5578} {"train_loss": -27.16920280456543, "global_step": 463047, "epoch": 5578} {"train_loss": -27.31502342224121, "global_step": 463048, "epoch": 5578} {"train_loss": -27.60110855102539, "global_step": 463049, "epoch": 5578} {"train_loss": -26.686431884765625, "global_step": 463050, "epoch": 5578} {"train_loss": -27.50408363342285, "global_step": 463051, "epoch": 5578} {"train_loss": -27.1395263671875, "global_step": 463052, "epoch": 5578} {"train_loss": -27.262237548828125, "global_step": 463053, "epoch": 5578} {"train_loss": -27.591772079467773, "global_step": 463054, "epoch": 5578} {"train_loss": -27.117868423461914, "global_step": 463055, "epoch": 5578} {"train_loss": -26.853648381060864, "global_step": 463056, "epoch": 5578, "val_loss": 6634413.0} {"train_loss": -27.1900634765625, "global_step": 463057, "epoch": 5579} {"train_loss": -26.46074867248535, "global_step": 463058, "epoch": 5579} {"train_loss": -24.914426803588867, "global_step": 463059, "epoch": 5579} {"train_loss": -23.884536743164062, "global_step": 463060, "epoch": 5579} {"train_loss": -25.746234893798828, "global_step": 463061, "epoch": 5579} {"train_loss": -26.37066650390625, "global_step": 463062, "epoch": 5579} {"train_loss": -25.8389949798584, "global_step": 463063, "epoch": 5579} {"train_loss": -25.39542007446289, "global_step": 463064, "epoch": 5579} {"train_loss": -26.556486129760742, "global_step": 463065, "epoch": 5579} {"train_loss": -25.828649520874023, "global_step": 463066, "epoch": 5579} {"train_loss": -26.187463760375977, "global_step": 463067, "epoch": 5579} {"train_loss": -25.95440673828125, "global_step": 463068, "epoch": 5579} {"train_loss": -26.864837646484375, "global_step": 463069, "epoch": 5579} {"train_loss": -26.11358070373535, "global_step": 463070, "epoch": 5579} {"train_loss": -26.259084701538086, "global_step": 463071, "epoch": 5579} {"train_loss": -26.382644653320312, "global_step": 463072, "epoch": 5579} {"train_loss": -26.07578468322754, "global_step": 463073, "epoch": 5579} {"train_loss": -26.60096549987793, "global_step": 463074, "epoch": 5579} {"train_loss": -26.5264892578125, "global_step": 463075, "epoch": 5579} {"train_loss": -26.24616050720215, "global_step": 463076, "epoch": 5579} {"train_loss": -26.643558502197266, "global_step": 463077, "epoch": 5579} {"train_loss": -26.63490867614746, "global_step": 463078, "epoch": 5579} {"train_loss": -26.735456466674805, "global_step": 463079, "epoch": 5579} {"train_loss": -25.979450225830078, "global_step": 463080, "epoch": 5579} {"train_loss": -26.321401596069336, "global_step": 463081, "epoch": 5579} {"train_loss": -26.52119255065918, "global_step": 463082, "epoch": 5579} {"train_loss": -26.546100616455078, "global_step": 463083, "epoch": 5579} {"train_loss": -26.87961769104004, "global_step": 463084, "epoch": 5579} {"train_loss": -26.743667602539062, "global_step": 463085, "epoch": 5579} {"train_loss": -26.804351806640625, "global_step": 463086, "epoch": 5579} {"train_loss": -26.595508575439453, "global_step": 463087, "epoch": 5579} {"train_loss": -26.68765640258789, "global_step": 463088, "epoch": 5579} {"train_loss": -27.1313533782959, "global_step": 463089, "epoch": 5579} {"train_loss": -26.88205337524414, "global_step": 463090, "epoch": 5579} {"train_loss": -27.158132553100586, "global_step": 463091, "epoch": 5579} {"train_loss": -26.784006118774414, "global_step": 463092, "epoch": 5579} {"train_loss": -27.034616470336914, "global_step": 463093, "epoch": 5579} {"train_loss": -27.0567569732666, "global_step": 463094, "epoch": 5579} {"train_loss": -26.51228141784668, "global_step": 463095, "epoch": 5579} {"train_loss": -26.754810333251953, "global_step": 463096, "epoch": 5579} {"train_loss": -26.769506454467773, "global_step": 463097, "epoch": 5579} {"train_loss": -27.111862182617188, "global_step": 463098, "epoch": 5579} {"train_loss": -27.2066707611084, "global_step": 463099, "epoch": 5579} {"train_loss": -26.945154190063477, "global_step": 463100, "epoch": 5579} {"train_loss": -27.3751163482666, "global_step": 463101, "epoch": 5579} {"train_loss": -26.977773666381836, "global_step": 463102, "epoch": 5579} {"train_loss": -27.15754508972168, "global_step": 463103, "epoch": 5579} {"train_loss": -27.310546875, "global_step": 463104, "epoch": 5579} {"train_loss": -27.014606475830078, "global_step": 463105, "epoch": 5579} {"train_loss": -27.14481544494629, "global_step": 463106, "epoch": 5579} {"train_loss": -27.06117057800293, "global_step": 463107, "epoch": 5579} {"train_loss": -26.799657821655273, "global_step": 463108, "epoch": 5579} {"train_loss": -27.544910430908203, "global_step": 463109, "epoch": 5579} {"train_loss": -27.29694175720215, "global_step": 463110, "epoch": 5579} {"train_loss": -27.198095321655273, "global_step": 463111, "epoch": 5579} {"train_loss": -26.844501495361328, "global_step": 463112, "epoch": 5579} {"train_loss": -27.001178741455078, "global_step": 463113, "epoch": 5579} {"train_loss": -27.2342472076416, "global_step": 463114, "epoch": 5579} {"train_loss": -27.256200790405273, "global_step": 463115, "epoch": 5579} {"train_loss": -27.37762451171875, "global_step": 463116, "epoch": 5579} {"train_loss": -27.177343368530273, "global_step": 463117, "epoch": 5579} {"train_loss": -27.760019302368164, "global_step": 463118, "epoch": 5579} {"train_loss": -27.23097801208496, "global_step": 463119, "epoch": 5579} {"train_loss": -27.227237701416016, "global_step": 463120, "epoch": 5579} {"train_loss": -27.27949333190918, "global_step": 463121, "epoch": 5579} {"train_loss": -27.285369873046875, "global_step": 463122, "epoch": 5579} {"train_loss": -26.844318389892578, "global_step": 463123, "epoch": 5579} {"train_loss": -26.8752384185791, "global_step": 463124, "epoch": 5579} {"train_loss": -26.717248916625977, "global_step": 463125, "epoch": 5579} {"train_loss": -27.39093589782715, "global_step": 463126, "epoch": 5579} {"train_loss": -27.138294219970703, "global_step": 463127, "epoch": 5579} {"train_loss": -26.997900009155273, "global_step": 463128, "epoch": 5579} {"train_loss": -27.042560577392578, "global_step": 463129, "epoch": 5579} {"train_loss": -27.258840560913086, "global_step": 463130, "epoch": 5579} {"train_loss": -27.046972274780273, "global_step": 463131, "epoch": 5579} {"train_loss": -27.25446128845215, "global_step": 463132, "epoch": 5579} {"train_loss": -27.027942657470703, "global_step": 463133, "epoch": 5579} {"train_loss": -27.23076820373535, "global_step": 463134, "epoch": 5579} {"train_loss": -27.243432998657227, "global_step": 463135, "epoch": 5579} {"train_loss": -27.21002197265625, "global_step": 463136, "epoch": 5579} {"train_loss": -27.080347061157227, "global_step": 463137, "epoch": 5579} {"train_loss": -27.079486846923828, "global_step": 463138, "epoch": 5579} {"train_loss": -26.765789169863044, "global_step": 463139, "epoch": 5579, "val_loss": 6634747.5} {"train_loss": -26.877643585205078, "global_step": 463140, "epoch": 5580} {"train_loss": -26.498321533203125, "global_step": 463141, "epoch": 5580} {"train_loss": -26.85527992248535, "global_step": 463142, "epoch": 5580} {"train_loss": -26.604978561401367, "global_step": 463143, "epoch": 5580} {"train_loss": -26.535785675048828, "global_step": 463144, "epoch": 5580} {"train_loss": -26.4278621673584, "global_step": 463145, "epoch": 5580} {"train_loss": -26.46380043029785, "global_step": 463146, "epoch": 5580} {"train_loss": -26.664167404174805, "global_step": 463147, "epoch": 5580} {"train_loss": -26.512250900268555, "global_step": 463148, "epoch": 5580} {"train_loss": -27.065845489501953, "global_step": 463149, "epoch": 5580} {"train_loss": -26.9000244140625, "global_step": 463150, "epoch": 5580} {"train_loss": -27.21921730041504, "global_step": 463151, "epoch": 5580} {"train_loss": -26.91632652282715, "global_step": 463152, "epoch": 5580} {"train_loss": -26.995635986328125, "global_step": 463153, "epoch": 5580} {"train_loss": -27.092641830444336, "global_step": 463154, "epoch": 5580} {"train_loss": -26.835554122924805, "global_step": 463155, "epoch": 5580} {"train_loss": -26.770654678344727, "global_step": 463156, "epoch": 5580} {"train_loss": -27.1333065032959, "global_step": 463157, "epoch": 5580} {"train_loss": -27.405038833618164, "global_step": 463158, "epoch": 5580} {"train_loss": -26.947662353515625, "global_step": 463159, "epoch": 5580} {"train_loss": -27.530149459838867, "global_step": 463160, "epoch": 5580} {"train_loss": -27.031097412109375, "global_step": 463161, "epoch": 5580} {"train_loss": -26.952558517456055, "global_step": 463162, "epoch": 5580} {"train_loss": -27.139404296875, "global_step": 463163, "epoch": 5580} {"train_loss": -27.00507926940918, "global_step": 463164, "epoch": 5580} {"train_loss": -27.072057723999023, "global_step": 463165, "epoch": 5580} {"train_loss": -27.030994415283203, "global_step": 463166, "epoch": 5580} {"train_loss": -27.010656356811523, "global_step": 463167, "epoch": 5580} {"train_loss": -27.100006103515625, "global_step": 463168, "epoch": 5580} {"train_loss": -27.020578384399414, "global_step": 463169, "epoch": 5580} {"train_loss": -27.112009048461914, "global_step": 463170, "epoch": 5580} {"train_loss": -27.28423500061035, "global_step": 463171, "epoch": 5580} {"train_loss": -27.172876358032227, "global_step": 463172, "epoch": 5580} {"train_loss": -27.086454391479492, "global_step": 463173, "epoch": 5580} {"train_loss": -27.21856689453125, "global_step": 463174, "epoch": 5580} {"train_loss": -27.31088638305664, "global_step": 463175, "epoch": 5580} {"train_loss": -26.867162704467773, "global_step": 463176, "epoch": 5580} {"train_loss": -27.24853515625, "global_step": 463177, "epoch": 5580} {"train_loss": -26.725263595581055, "global_step": 463178, "epoch": 5580} {"train_loss": -27.020233154296875, "global_step": 463179, "epoch": 5580} {"train_loss": -27.231321334838867, "global_step": 463180, "epoch": 5580} {"train_loss": -27.366195678710938, "global_step": 463181, "epoch": 5580} {"train_loss": -27.144559860229492, "global_step": 463182, "epoch": 5580} {"train_loss": -27.10273551940918, "global_step": 463183, "epoch": 5580} {"train_loss": -27.59160804748535, "global_step": 463184, "epoch": 5580} {"train_loss": -27.638410568237305, "global_step": 463185, "epoch": 5580} {"train_loss": -27.263944625854492, "global_step": 463186, "epoch": 5580} {"train_loss": -27.34442138671875, "global_step": 463187, "epoch": 5580} {"train_loss": -27.428022384643555, "global_step": 463188, "epoch": 5580} {"train_loss": -27.081787109375, "global_step": 463189, "epoch": 5580} {"train_loss": -27.220172882080078, "global_step": 463190, "epoch": 5580} {"train_loss": -27.45692253112793, "global_step": 463191, "epoch": 5580} {"train_loss": -27.4749755859375, "global_step": 463192, "epoch": 5580} {"train_loss": -27.141204833984375, "global_step": 463193, "epoch": 5580} {"train_loss": -27.010385513305664, "global_step": 463194, "epoch": 5580} {"train_loss": -26.966724395751953, "global_step": 463195, "epoch": 5580} {"train_loss": -27.017480850219727, "global_step": 463196, "epoch": 5580} {"train_loss": -27.046985626220703, "global_step": 463197, "epoch": 5580} {"train_loss": -26.889789581298828, "global_step": 463198, "epoch": 5580} {"train_loss": -26.795822143554688, "global_step": 463199, "epoch": 5580} {"train_loss": -27.123693466186523, "global_step": 463200, "epoch": 5580} {"train_loss": -27.498586654663086, "global_step": 463201, "epoch": 5580} {"train_loss": -26.920612335205078, "global_step": 463202, "epoch": 5580} {"train_loss": -26.639333724975586, "global_step": 463203, "epoch": 5580} {"train_loss": -26.905176162719727, "global_step": 463204, "epoch": 5580} {"train_loss": -27.03639030456543, "global_step": 463205, "epoch": 5580} {"train_loss": -26.97564697265625, "global_step": 463206, "epoch": 5580} {"train_loss": -27.14747428894043, "global_step": 463207, "epoch": 5580} {"train_loss": -27.232269287109375, "global_step": 463208, "epoch": 5580} {"train_loss": -27.095922470092773, "global_step": 463209, "epoch": 5580} {"train_loss": -27.203794479370117, "global_step": 463210, "epoch": 5580} {"train_loss": -27.1617488861084, "global_step": 463211, "epoch": 5580} {"train_loss": -27.321008682250977, "global_step": 463212, "epoch": 5580} {"train_loss": -27.257282257080078, "global_step": 463213, "epoch": 5580} {"train_loss": -27.299917221069336, "global_step": 463214, "epoch": 5580} {"train_loss": -27.1595401763916, "global_step": 463215, "epoch": 5580} {"train_loss": -27.412206649780273, "global_step": 463216, "epoch": 5580} {"train_loss": -27.357694625854492, "global_step": 463217, "epoch": 5580} {"train_loss": -26.912073135375977, "global_step": 463218, "epoch": 5580} {"train_loss": -27.362634658813477, "global_step": 463219, "epoch": 5580} {"train_loss": -27.51637077331543, "global_step": 463220, "epoch": 5580} {"train_loss": -27.48681640625, "global_step": 463221, "epoch": 5580} {"train_loss": -27.098538525133247, "global_step": 463222, "epoch": 5580, "val_loss": 6580343.0} {"train_loss": -26.749616622924805, "global_step": 463223, "epoch": 5581} {"train_loss": -27.066614151000977, "global_step": 463224, "epoch": 5581} {"train_loss": -27.076923370361328, "global_step": 463225, "epoch": 5581} {"train_loss": -26.683019638061523, "global_step": 463226, "epoch": 5581} {"train_loss": -26.792423248291016, "global_step": 463227, "epoch": 5581} {"train_loss": -26.97230339050293, "global_step": 463228, "epoch": 5581} {"train_loss": -27.109888076782227, "global_step": 463229, "epoch": 5581} {"train_loss": -27.145910263061523, "global_step": 463230, "epoch": 5581} {"train_loss": -26.912336349487305, "global_step": 463231, "epoch": 5581} {"train_loss": -26.961450576782227, "global_step": 463232, "epoch": 5581} {"train_loss": -27.131193161010742, "global_step": 463233, "epoch": 5581} {"train_loss": -26.8786678314209, "global_step": 463234, "epoch": 5581} {"train_loss": -27.0900821685791, "global_step": 463235, "epoch": 5581} {"train_loss": -26.934301376342773, "global_step": 463236, "epoch": 5581} {"train_loss": -27.472930908203125, "global_step": 463237, "epoch": 5581} {"train_loss": -27.21454429626465, "global_step": 463238, "epoch": 5581} {"train_loss": -27.515676498413086, "global_step": 463239, "epoch": 5581} {"train_loss": -27.121389389038086, "global_step": 463240, "epoch": 5581} {"train_loss": -27.025985717773438, "global_step": 463241, "epoch": 5581} {"train_loss": -26.750202178955078, "global_step": 463242, "epoch": 5581} {"train_loss": -27.403554916381836, "global_step": 463243, "epoch": 5581} {"train_loss": -27.173315048217773, "global_step": 463244, "epoch": 5581} {"train_loss": -26.84988784790039, "global_step": 463245, "epoch": 5581} {"train_loss": -26.815900802612305, "global_step": 463246, "epoch": 5581} {"train_loss": -27.063520431518555, "global_step": 463247, "epoch": 5581} {"train_loss": -27.11897087097168, "global_step": 463248, "epoch": 5581} {"train_loss": -27.247533798217773, "global_step": 463249, "epoch": 5581} {"train_loss": -27.58050537109375, "global_step": 463250, "epoch": 5581} {"train_loss": -27.227888107299805, "global_step": 463251, "epoch": 5581} {"train_loss": -27.0798397064209, "global_step": 463252, "epoch": 5581} {"train_loss": -26.968961715698242, "global_step": 463253, "epoch": 5581} {"train_loss": -27.1297664642334, "global_step": 463254, "epoch": 5581} {"train_loss": -27.131662368774414, "global_step": 463255, "epoch": 5581} {"train_loss": -27.429672241210938, "global_step": 463256, "epoch": 5581} {"train_loss": -26.855823516845703, "global_step": 463257, "epoch": 5581} {"train_loss": -26.8349609375, "global_step": 463258, "epoch": 5581} {"train_loss": -27.265766143798828, "global_step": 463259, "epoch": 5581} {"train_loss": -27.230249404907227, "global_step": 463260, "epoch": 5581} {"train_loss": -26.938526153564453, "global_step": 463261, "epoch": 5581} {"train_loss": -27.465234756469727, "global_step": 463262, "epoch": 5581} {"train_loss": -27.440881729125977, "global_step": 463263, "epoch": 5581} {"train_loss": -26.712308883666992, "global_step": 463264, "epoch": 5581} {"train_loss": -27.21490478515625, "global_step": 463265, "epoch": 5581} {"train_loss": -27.31595802307129, "global_step": 463266, "epoch": 5581} {"train_loss": -27.276025772094727, "global_step": 463267, "epoch": 5581} {"train_loss": -27.403852462768555, "global_step": 463268, "epoch": 5581} {"train_loss": -27.095502853393555, "global_step": 463269, "epoch": 5581} {"train_loss": -27.37847900390625, "global_step": 463270, "epoch": 5581} {"train_loss": -27.346954345703125, "global_step": 463271, "epoch": 5581} {"train_loss": -27.071508407592773, "global_step": 463272, "epoch": 5581} {"train_loss": -27.28297233581543, "global_step": 463273, "epoch": 5581} {"train_loss": -27.39984130859375, "global_step": 463274, "epoch": 5581} {"train_loss": -27.35426902770996, "global_step": 463275, "epoch": 5581} {"train_loss": -27.167463302612305, "global_step": 463276, "epoch": 5581} {"train_loss": -27.143463134765625, "global_step": 463277, "epoch": 5581} {"train_loss": -27.111658096313477, "global_step": 463278, "epoch": 5581} {"train_loss": -27.247705459594727, "global_step": 463279, "epoch": 5581} {"train_loss": -26.8795108795166, "global_step": 463280, "epoch": 5581} {"train_loss": -27.417083740234375, "global_step": 463281, "epoch": 5581} {"train_loss": -27.359943389892578, "global_step": 463282, "epoch": 5581} {"train_loss": -27.203083038330078, "global_step": 463283, "epoch": 5581} {"train_loss": -26.881423950195312, "global_step": 463284, "epoch": 5581} {"train_loss": -27.186471939086914, "global_step": 463285, "epoch": 5581} {"train_loss": -26.98052406311035, "global_step": 463286, "epoch": 5581} {"train_loss": -27.15757179260254, "global_step": 463287, "epoch": 5581} {"train_loss": -27.04463005065918, "global_step": 463288, "epoch": 5581} {"train_loss": -27.31674575805664, "global_step": 463289, "epoch": 5581} {"train_loss": -27.2497501373291, "global_step": 463290, "epoch": 5581} {"train_loss": -27.336273193359375, "global_step": 463291, "epoch": 5581} {"train_loss": -27.390247344970703, "global_step": 463292, "epoch": 5581} {"train_loss": -27.214221954345703, "global_step": 463293, "epoch": 5581} {"train_loss": -27.25410270690918, "global_step": 463294, "epoch": 5581} {"train_loss": -27.392047882080078, "global_step": 463295, "epoch": 5581} {"train_loss": -27.46742057800293, "global_step": 463296, "epoch": 5581} {"train_loss": -27.55387306213379, "global_step": 463297, "epoch": 5581} {"train_loss": -26.98150634765625, "global_step": 463298, "epoch": 5581} {"train_loss": -27.29877281188965, "global_step": 463299, "epoch": 5581} {"train_loss": -26.974267959594727, "global_step": 463300, "epoch": 5581} {"train_loss": -27.27863883972168, "global_step": 463301, "epoch": 5581} {"train_loss": -27.180591583251953, "global_step": 463302, "epoch": 5581} {"train_loss": -27.546369552612305, "global_step": 463303, "epoch": 5581} {"train_loss": -27.212522506713867, "global_step": 463304, "epoch": 5581} {"train_loss": -27.154454794274756, "global_step": 463305, "epoch": 5581, "val_loss": 6595623.0} {"train_loss": -26.48432731628418, "global_step": 463306, "epoch": 5582} {"train_loss": -26.138120651245117, "global_step": 463307, "epoch": 5582} {"train_loss": -26.800662994384766, "global_step": 463308, "epoch": 5582} {"train_loss": -26.652685165405273, "global_step": 463309, "epoch": 5582} {"train_loss": -26.1308536529541, "global_step": 463310, "epoch": 5582} {"train_loss": -27.088626861572266, "global_step": 463311, "epoch": 5582} {"train_loss": -26.673818588256836, "global_step": 463312, "epoch": 5582} {"train_loss": -26.847431182861328, "global_step": 463313, "epoch": 5582} {"train_loss": -26.898853302001953, "global_step": 463314, "epoch": 5582} {"train_loss": -26.82721519470215, "global_step": 463315, "epoch": 5582} {"train_loss": -26.594690322875977, "global_step": 463316, "epoch": 5582} {"train_loss": -27.117895126342773, "global_step": 463317, "epoch": 5582} {"train_loss": -26.739215850830078, "global_step": 463318, "epoch": 5582} {"train_loss": -26.926679611206055, "global_step": 463319, "epoch": 5582} {"train_loss": -26.65238380432129, "global_step": 463320, "epoch": 5582} {"train_loss": -26.62060546875, "global_step": 463321, "epoch": 5582} {"train_loss": -26.959396362304688, "global_step": 463322, "epoch": 5582} {"train_loss": -26.701688766479492, "global_step": 463323, "epoch": 5582} {"train_loss": -27.042367935180664, "global_step": 463324, "epoch": 5582} {"train_loss": -26.606733322143555, "global_step": 463325, "epoch": 5582} {"train_loss": -27.04615592956543, "global_step": 463326, "epoch": 5582} {"train_loss": -27.003477096557617, "global_step": 463327, "epoch": 5582} {"train_loss": -26.633359909057617, "global_step": 463328, "epoch": 5582} {"train_loss": -26.838403701782227, "global_step": 463329, "epoch": 5582} {"train_loss": -27.38058853149414, "global_step": 463330, "epoch": 5582} {"train_loss": -27.20393180847168, "global_step": 463331, "epoch": 5582} {"train_loss": -27.102903366088867, "global_step": 463332, "epoch": 5582} {"train_loss": -27.158187866210938, "global_step": 463333, "epoch": 5582} {"train_loss": -26.852771759033203, "global_step": 463334, "epoch": 5582} {"train_loss": -27.128820419311523, "global_step": 463335, "epoch": 5582} {"train_loss": -27.08710289001465, "global_step": 463336, "epoch": 5582} {"train_loss": -27.447555541992188, "global_step": 463337, "epoch": 5582} {"train_loss": -27.0850772857666, "global_step": 463338, "epoch": 5582} {"train_loss": -27.413288116455078, "global_step": 463339, "epoch": 5582} {"train_loss": -27.07857322692871, "global_step": 463340, "epoch": 5582} {"train_loss": -27.447467803955078, "global_step": 463341, "epoch": 5582} {"train_loss": -26.91883659362793, "global_step": 463342, "epoch": 5582} {"train_loss": -27.273569107055664, "global_step": 463343, "epoch": 5582} {"train_loss": -27.177770614624023, "global_step": 463344, "epoch": 5582} {"train_loss": -27.445724487304688, "global_step": 463345, "epoch": 5582} {"train_loss": -27.596012115478516, "global_step": 463346, "epoch": 5582} {"train_loss": -27.235315322875977, "global_step": 463347, "epoch": 5582} {"train_loss": -27.28125, "global_step": 463348, "epoch": 5582} {"train_loss": -26.8526611328125, "global_step": 463349, "epoch": 5582} {"train_loss": -27.291967391967773, "global_step": 463350, "epoch": 5582} {"train_loss": -26.941787719726562, "global_step": 463351, "epoch": 5582} {"train_loss": -26.562414169311523, "global_step": 463352, "epoch": 5582} {"train_loss": -26.721454620361328, "global_step": 463353, "epoch": 5582} {"train_loss": -27.028974533081055, "global_step": 463354, "epoch": 5582} {"train_loss": -27.112384796142578, "global_step": 463355, "epoch": 5582} {"train_loss": -26.353763580322266, "global_step": 463356, "epoch": 5582} {"train_loss": -26.464374542236328, "global_step": 463357, "epoch": 5582} {"train_loss": -26.63770866394043, "global_step": 463358, "epoch": 5582} {"train_loss": -27.070066452026367, "global_step": 463359, "epoch": 5582} {"train_loss": -26.357999801635742, "global_step": 463360, "epoch": 5582} {"train_loss": -27.130151748657227, "global_step": 463361, "epoch": 5582} {"train_loss": -27.236047744750977, "global_step": 463362, "epoch": 5582} {"train_loss": -26.673322677612305, "global_step": 463363, "epoch": 5582} {"train_loss": -27.031539916992188, "global_step": 463364, "epoch": 5582} {"train_loss": -27.12833023071289, "global_step": 463365, "epoch": 5582} {"train_loss": -26.619977951049805, "global_step": 463366, "epoch": 5582} {"train_loss": -26.86866569519043, "global_step": 463367, "epoch": 5582} {"train_loss": -26.733144760131836, "global_step": 463368, "epoch": 5582} {"train_loss": -27.082447052001953, "global_step": 463369, "epoch": 5582} {"train_loss": -26.944793701171875, "global_step": 463370, "epoch": 5582} {"train_loss": -27.04926872253418, "global_step": 463371, "epoch": 5582} {"train_loss": -27.018667221069336, "global_step": 463372, "epoch": 5582} {"train_loss": -27.2132568359375, "global_step": 463373, "epoch": 5582} {"train_loss": -27.444019317626953, "global_step": 463374, "epoch": 5582} {"train_loss": -27.246286392211914, "global_step": 463375, "epoch": 5582} {"train_loss": -27.198827743530273, "global_step": 463376, "epoch": 5582} {"train_loss": -27.111127853393555, "global_step": 463377, "epoch": 5582} {"train_loss": -27.24830436706543, "global_step": 463378, "epoch": 5582} {"train_loss": -26.904132843017578, "global_step": 463379, "epoch": 5582} {"train_loss": -27.410200119018555, "global_step": 463380, "epoch": 5582} {"train_loss": -27.140121459960938, "global_step": 463381, "epoch": 5582} {"train_loss": -27.3532657623291, "global_step": 463382, "epoch": 5582} {"train_loss": -27.325803756713867, "global_step": 463383, "epoch": 5582} {"train_loss": -27.033109664916992, "global_step": 463384, "epoch": 5582} {"train_loss": -27.115446090698242, "global_step": 463385, "epoch": 5582} {"train_loss": -26.962339401245117, "global_step": 463386, "epoch": 5582} {"train_loss": -27.130903244018555, "global_step": 463387, "epoch": 5582} {"train_loss": -26.95916077027838, "global_step": 463388, "epoch": 5582, "val_loss": 6596445.0} {"train_loss": -25.516660690307617, "global_step": 463389, "epoch": 5583} {"train_loss": -26.152002334594727, "global_step": 463390, "epoch": 5583} {"train_loss": -26.727869033813477, "global_step": 463391, "epoch": 5583} {"train_loss": -26.480436325073242, "global_step": 463392, "epoch": 5583} {"train_loss": -26.41953468322754, "global_step": 463393, "epoch": 5583} {"train_loss": -26.988000869750977, "global_step": 463394, "epoch": 5583} {"train_loss": -26.60883140563965, "global_step": 463395, "epoch": 5583} {"train_loss": -26.836761474609375, "global_step": 463396, "epoch": 5583} {"train_loss": -26.727697372436523, "global_step": 463397, "epoch": 5583} {"train_loss": -26.767282485961914, "global_step": 463398, "epoch": 5583} {"train_loss": -26.45186424255371, "global_step": 463399, "epoch": 5583} {"train_loss": -26.658172607421875, "global_step": 463400, "epoch": 5583} {"train_loss": -26.86897087097168, "global_step": 463401, "epoch": 5583} {"train_loss": -27.057086944580078, "global_step": 463402, "epoch": 5583} {"train_loss": -27.039005279541016, "global_step": 463403, "epoch": 5583} {"train_loss": -26.468765258789062, "global_step": 463404, "epoch": 5583} {"train_loss": -26.8673152923584, "global_step": 463405, "epoch": 5583} {"train_loss": -27.094079971313477, "global_step": 463406, "epoch": 5583} {"train_loss": -26.87713050842285, "global_step": 463407, "epoch": 5583} {"train_loss": -26.978418350219727, "global_step": 463408, "epoch": 5583} {"train_loss": -27.01905632019043, "global_step": 463409, "epoch": 5583} {"train_loss": -26.977853775024414, "global_step": 463410, "epoch": 5583} {"train_loss": -26.958608627319336, "global_step": 463411, "epoch": 5583} {"train_loss": -27.112207412719727, "global_step": 463412, "epoch": 5583} {"train_loss": -27.061084747314453, "global_step": 463413, "epoch": 5583} {"train_loss": -27.01220703125, "global_step": 463414, "epoch": 5583} {"train_loss": -27.0606689453125, "global_step": 463415, "epoch": 5583} {"train_loss": -26.968793869018555, "global_step": 463416, "epoch": 5583} {"train_loss": -27.0510311126709, "global_step": 463417, "epoch": 5583} {"train_loss": -26.65594482421875, "global_step": 463418, "epoch": 5583} {"train_loss": -26.992162704467773, "global_step": 463419, "epoch": 5583} {"train_loss": -27.1823787689209, "global_step": 463420, "epoch": 5583} {"train_loss": -27.258405685424805, "global_step": 463421, "epoch": 5583} {"train_loss": -26.859739303588867, "global_step": 463422, "epoch": 5583} {"train_loss": -27.111083984375, "global_step": 463423, "epoch": 5583} {"train_loss": -27.002721786499023, "global_step": 463424, "epoch": 5583} {"train_loss": -27.100866317749023, "global_step": 463425, "epoch": 5583} {"train_loss": -27.46231460571289, "global_step": 463426, "epoch": 5583} {"train_loss": -26.89238929748535, "global_step": 463427, "epoch": 5583} {"train_loss": -27.598264694213867, "global_step": 463428, "epoch": 5583} {"train_loss": -27.431432723999023, "global_step": 463429, "epoch": 5583} {"train_loss": -27.069427490234375, "global_step": 463430, "epoch": 5583} {"train_loss": -27.093372344970703, "global_step": 463431, "epoch": 5583} {"train_loss": -27.272932052612305, "global_step": 463432, "epoch": 5583} {"train_loss": -27.38230323791504, "global_step": 463433, "epoch": 5583} {"train_loss": -27.386091232299805, "global_step": 463434, "epoch": 5583} {"train_loss": -26.962997436523438, "global_step": 463435, "epoch": 5583} {"train_loss": -27.362396240234375, "global_step": 463436, "epoch": 5583} {"train_loss": -27.292821884155273, "global_step": 463437, "epoch": 5583} {"train_loss": -27.61936378479004, "global_step": 463438, "epoch": 5583} {"train_loss": -26.958181381225586, "global_step": 463439, "epoch": 5583} {"train_loss": -27.429609298706055, "global_step": 463440, "epoch": 5583} {"train_loss": -27.360509872436523, "global_step": 463441, "epoch": 5583} {"train_loss": -27.11604118347168, "global_step": 463442, "epoch": 5583} {"train_loss": -27.670059204101562, "global_step": 463443, "epoch": 5583} {"train_loss": -27.28775405883789, "global_step": 463444, "epoch": 5583} {"train_loss": -27.12061882019043, "global_step": 463445, "epoch": 5583} {"train_loss": -27.37116813659668, "global_step": 463446, "epoch": 5583} {"train_loss": -27.154638290405273, "global_step": 463447, "epoch": 5583} {"train_loss": -27.48431968688965, "global_step": 463448, "epoch": 5583} {"train_loss": -27.38575553894043, "global_step": 463449, "epoch": 5583} {"train_loss": -27.058759689331055, "global_step": 463450, "epoch": 5583} {"train_loss": -27.225229263305664, "global_step": 463451, "epoch": 5583} {"train_loss": -27.391040802001953, "global_step": 463452, "epoch": 5583} {"train_loss": -27.584537506103516, "global_step": 463453, "epoch": 5583} {"train_loss": -26.910205841064453, "global_step": 463454, "epoch": 5583} {"train_loss": -26.315092086791992, "global_step": 463455, "epoch": 5583} {"train_loss": -26.497900009155273, "global_step": 463456, "epoch": 5583} {"train_loss": -26.64239501953125, "global_step": 463457, "epoch": 5583} {"train_loss": -26.725086212158203, "global_step": 463458, "epoch": 5583} {"train_loss": -27.13861083984375, "global_step": 463459, "epoch": 5583} {"train_loss": -26.9638614654541, "global_step": 463460, "epoch": 5583} {"train_loss": -26.18425941467285, "global_step": 463461, "epoch": 5583} {"train_loss": -26.978742599487305, "global_step": 463462, "epoch": 5583} {"train_loss": -26.97494888305664, "global_step": 463463, "epoch": 5583} {"train_loss": -26.72141456604004, "global_step": 463464, "epoch": 5583} {"train_loss": -26.99896240234375, "global_step": 463465, "epoch": 5583} {"train_loss": -26.87395668029785, "global_step": 463466, "epoch": 5583} {"train_loss": -27.234466552734375, "global_step": 463467, "epoch": 5583} {"train_loss": -27.189489364624023, "global_step": 463468, "epoch": 5583} {"train_loss": -26.62091636657715, "global_step": 463469, "epoch": 5583} {"train_loss": -26.9687557220459, "global_step": 463470, "epoch": 5583} {"train_loss": -26.99233615829284, "global_step": 463471, "epoch": 5583, "val_loss": 6604212.0} {"train_loss": -26.75583267211914, "global_step": 463472, "epoch": 5584} {"train_loss": -26.388320922851562, "global_step": 463473, "epoch": 5584} {"train_loss": -26.87909507751465, "global_step": 463474, "epoch": 5584} {"train_loss": -26.514368057250977, "global_step": 463475, "epoch": 5584} {"train_loss": -26.39898109436035, "global_step": 463476, "epoch": 5584} {"train_loss": -26.635269165039062, "global_step": 463477, "epoch": 5584} {"train_loss": -26.60285758972168, "global_step": 463478, "epoch": 5584} {"train_loss": -26.679553985595703, "global_step": 463479, "epoch": 5584} {"train_loss": -26.75446891784668, "global_step": 463480, "epoch": 5584} {"train_loss": -26.753305435180664, "global_step": 463481, "epoch": 5584} {"train_loss": -26.851530075073242, "global_step": 463482, "epoch": 5584} {"train_loss": -26.874242782592773, "global_step": 463483, "epoch": 5584} {"train_loss": -26.88559341430664, "global_step": 463484, "epoch": 5584} {"train_loss": -26.527145385742188, "global_step": 463485, "epoch": 5584} {"train_loss": -26.985794067382812, "global_step": 463486, "epoch": 5584} {"train_loss": -27.008588790893555, "global_step": 463487, "epoch": 5584} {"train_loss": -27.161365509033203, "global_step": 463488, "epoch": 5584} {"train_loss": -27.22964859008789, "global_step": 463489, "epoch": 5584} {"train_loss": -26.857685089111328, "global_step": 463490, "epoch": 5584} {"train_loss": -26.876611709594727, "global_step": 463491, "epoch": 5584} {"train_loss": -26.85529136657715, "global_step": 463492, "epoch": 5584} {"train_loss": -26.935449600219727, "global_step": 463493, "epoch": 5584} {"train_loss": -27.24123191833496, "global_step": 463494, "epoch": 5584} {"train_loss": -27.575952529907227, "global_step": 463495, "epoch": 5584} {"train_loss": -26.716352462768555, "global_step": 463496, "epoch": 5584} {"train_loss": -26.789295196533203, "global_step": 463497, "epoch": 5584} {"train_loss": -26.959033966064453, "global_step": 463498, "epoch": 5584} {"train_loss": -27.29044532775879, "global_step": 463499, "epoch": 5584} {"train_loss": -26.98042106628418, "global_step": 463500, "epoch": 5584} {"train_loss": -27.080976486206055, "global_step": 463501, "epoch": 5584} {"train_loss": -27.157135009765625, "global_step": 463502, "epoch": 5584} {"train_loss": -27.18280601501465, "global_step": 463503, "epoch": 5584} {"train_loss": -27.23713493347168, "global_step": 463504, "epoch": 5584} {"train_loss": -26.918272018432617, "global_step": 463505, "epoch": 5584} {"train_loss": -27.187992095947266, "global_step": 463506, "epoch": 5584} {"train_loss": -27.718603134155273, "global_step": 463507, "epoch": 5584} {"train_loss": -27.319232940673828, "global_step": 463508, "epoch": 5584} {"train_loss": -27.5877628326416, "global_step": 463509, "epoch": 5584} {"train_loss": -27.120731353759766, "global_step": 463510, "epoch": 5584} {"train_loss": -27.421838760375977, "global_step": 463511, "epoch": 5584} {"train_loss": -27.184219360351562, "global_step": 463512, "epoch": 5584} {"train_loss": -26.945911407470703, "global_step": 463513, "epoch": 5584} {"train_loss": -27.15900993347168, "global_step": 463514, "epoch": 5584} {"train_loss": -27.5205135345459, "global_step": 463515, "epoch": 5584} {"train_loss": -26.93951416015625, "global_step": 463516, "epoch": 5584} {"train_loss": -27.108877182006836, "global_step": 463517, "epoch": 5584} {"train_loss": -27.513769149780273, "global_step": 463518, "epoch": 5584} {"train_loss": -27.608549118041992, "global_step": 463519, "epoch": 5584} {"train_loss": -27.749780654907227, "global_step": 463520, "epoch": 5584} {"train_loss": -26.52870750427246, "global_step": 463521, "epoch": 5584} {"train_loss": -27.070362091064453, "global_step": 463522, "epoch": 5584} {"train_loss": -27.373498916625977, "global_step": 463523, "epoch": 5584} {"train_loss": -27.36252784729004, "global_step": 463524, "epoch": 5584} {"train_loss": -27.03193473815918, "global_step": 463525, "epoch": 5584} {"train_loss": -27.37758445739746, "global_step": 463526, "epoch": 5584} {"train_loss": -26.7248477935791, "global_step": 463527, "epoch": 5584} {"train_loss": -26.780668258666992, "global_step": 463528, "epoch": 5584} {"train_loss": -26.050683975219727, "global_step": 463529, "epoch": 5584} {"train_loss": -25.753986358642578, "global_step": 463530, "epoch": 5584} {"train_loss": -26.96042251586914, "global_step": 463531, "epoch": 5584} {"train_loss": -27.074148178100586, "global_step": 463532, "epoch": 5584} {"train_loss": -26.83906364440918, "global_step": 463533, "epoch": 5584} {"train_loss": -27.187469482421875, "global_step": 463534, "epoch": 5584} {"train_loss": -26.60200309753418, "global_step": 463535, "epoch": 5584} {"train_loss": -26.690332412719727, "global_step": 463536, "epoch": 5584} {"train_loss": -26.477685928344727, "global_step": 463537, "epoch": 5584} {"train_loss": -26.859878540039062, "global_step": 463538, "epoch": 5584} {"train_loss": -26.756467819213867, "global_step": 463539, "epoch": 5584} {"train_loss": -27.048215866088867, "global_step": 463540, "epoch": 5584} {"train_loss": -26.705921173095703, "global_step": 463541, "epoch": 5584} {"train_loss": -27.26543617248535, "global_step": 463542, "epoch": 5584} {"train_loss": -26.851835250854492, "global_step": 463543, "epoch": 5584} {"train_loss": -27.082456588745117, "global_step": 463544, "epoch": 5584} {"train_loss": -27.040815353393555, "global_step": 463545, "epoch": 5584} {"train_loss": -26.957489013671875, "global_step": 463546, "epoch": 5584} {"train_loss": -27.119110107421875, "global_step": 463547, "epoch": 5584} {"train_loss": -26.944814682006836, "global_step": 463548, "epoch": 5584} {"train_loss": -27.0369815826416, "global_step": 463549, "epoch": 5584} {"train_loss": -26.824064254760742, "global_step": 463550, "epoch": 5584} {"train_loss": -26.81854820251465, "global_step": 463551, "epoch": 5584} {"train_loss": -27.13531494140625, "global_step": 463552, "epoch": 5584} {"train_loss": -27.051471710205078, "global_step": 463553, "epoch": 5584} {"train_loss": -26.972724937530884, "global_step": 463554, "epoch": 5584, "val_loss": 6543511.5} {"train_loss": -26.829242706298828, "global_step": 463555, "epoch": 5585} {"train_loss": -27.040979385375977, "global_step": 463556, "epoch": 5585} {"train_loss": -27.09893798828125, "global_step": 463557, "epoch": 5585} {"train_loss": -26.270355224609375, "global_step": 463558, "epoch": 5585} {"train_loss": -26.731225967407227, "global_step": 463559, "epoch": 5585} {"train_loss": -26.9671688079834, "global_step": 463560, "epoch": 5585} {"train_loss": -27.443374633789062, "global_step": 463561, "epoch": 5585} {"train_loss": -26.830041885375977, "global_step": 463562, "epoch": 5585} {"train_loss": -27.64151382446289, "global_step": 463563, "epoch": 5585} {"train_loss": -27.62080192565918, "global_step": 463564, "epoch": 5585} {"train_loss": -26.82282066345215, "global_step": 463565, "epoch": 5585} {"train_loss": -27.1337947845459, "global_step": 463566, "epoch": 5585} {"train_loss": -27.106088638305664, "global_step": 463567, "epoch": 5585} {"train_loss": -27.2415714263916, "global_step": 463568, "epoch": 5585} {"train_loss": -26.973058700561523, "global_step": 463569, "epoch": 5585} {"train_loss": -27.499164581298828, "global_step": 463570, "epoch": 5585} {"train_loss": -27.165802001953125, "global_step": 463571, "epoch": 5585} {"train_loss": -27.364017486572266, "global_step": 463572, "epoch": 5585} {"train_loss": -27.227386474609375, "global_step": 463573, "epoch": 5585} {"train_loss": -27.265180587768555, "global_step": 463574, "epoch": 5585} {"train_loss": -27.292041778564453, "global_step": 463575, "epoch": 5585} {"train_loss": -27.48465347290039, "global_step": 463576, "epoch": 5585} {"train_loss": -27.185232162475586, "global_step": 463577, "epoch": 5585} {"train_loss": -26.98834800720215, "global_step": 463578, "epoch": 5585} {"train_loss": -27.11093521118164, "global_step": 463579, "epoch": 5585} {"train_loss": -27.278676986694336, "global_step": 463580, "epoch": 5585} {"train_loss": -27.37656593322754, "global_step": 463581, "epoch": 5585} {"train_loss": -27.343244552612305, "global_step": 463582, "epoch": 5585} {"train_loss": -27.0754451751709, "global_step": 463583, "epoch": 5585} {"train_loss": -27.350854873657227, "global_step": 463584, "epoch": 5585} {"train_loss": -27.458654403686523, "global_step": 463585, "epoch": 5585} {"train_loss": -27.17799186706543, "global_step": 463586, "epoch": 5585} {"train_loss": -27.552188873291016, "global_step": 463587, "epoch": 5585} {"train_loss": -27.114171981811523, "global_step": 463588, "epoch": 5585} {"train_loss": -27.103429794311523, "global_step": 463589, "epoch": 5585} {"train_loss": -27.205310821533203, "global_step": 463590, "epoch": 5585} {"train_loss": -26.875843048095703, "global_step": 463591, "epoch": 5585} {"train_loss": -27.551605224609375, "global_step": 463592, "epoch": 5585} {"train_loss": -27.54421043395996, "global_step": 463593, "epoch": 5585} {"train_loss": -27.17051124572754, "global_step": 463594, "epoch": 5585} {"train_loss": -26.925006866455078, "global_step": 463595, "epoch": 5585} {"train_loss": -27.489370346069336, "global_step": 463596, "epoch": 5585} {"train_loss": -27.164403915405273, "global_step": 463597, "epoch": 5585} {"train_loss": -27.043704986572266, "global_step": 463598, "epoch": 5585} {"train_loss": -27.11818504333496, "global_step": 463599, "epoch": 5585} {"train_loss": -26.95460319519043, "global_step": 463600, "epoch": 5585} {"train_loss": -27.380285263061523, "global_step": 463601, "epoch": 5585} {"train_loss": -26.86322593688965, "global_step": 463602, "epoch": 5585} {"train_loss": -27.30182456970215, "global_step": 463603, "epoch": 5585} {"train_loss": -27.337799072265625, "global_step": 463604, "epoch": 5585} {"train_loss": -27.1383056640625, "global_step": 463605, "epoch": 5585} {"train_loss": -27.33502197265625, "global_step": 463606, "epoch": 5585} {"train_loss": -27.241409301757812, "global_step": 463607, "epoch": 5585} {"train_loss": -27.213275909423828, "global_step": 463608, "epoch": 5585} {"train_loss": -27.366718292236328, "global_step": 463609, "epoch": 5585} {"train_loss": -26.819089889526367, "global_step": 463610, "epoch": 5585} {"train_loss": -27.1038761138916, "global_step": 463611, "epoch": 5585} {"train_loss": -27.142004013061523, "global_step": 463612, "epoch": 5585} {"train_loss": -27.11195945739746, "global_step": 463613, "epoch": 5585} {"train_loss": -27.454547882080078, "global_step": 463614, "epoch": 5585} {"train_loss": -27.61746597290039, "global_step": 463615, "epoch": 5585} {"train_loss": -27.17152214050293, "global_step": 463616, "epoch": 5585} {"train_loss": -27.23728370666504, "global_step": 463617, "epoch": 5585} {"train_loss": -27.42097282409668, "global_step": 463618, "epoch": 5585} {"train_loss": -27.187976837158203, "global_step": 463619, "epoch": 5585} {"train_loss": -27.391565322875977, "global_step": 463620, "epoch": 5585} {"train_loss": -27.29231071472168, "global_step": 463621, "epoch": 5585} {"train_loss": -27.46244239807129, "global_step": 463622, "epoch": 5585} {"train_loss": -27.01816749572754, "global_step": 463623, "epoch": 5585} {"train_loss": -27.338476181030273, "global_step": 463624, "epoch": 5585} {"train_loss": -27.4727840423584, "global_step": 463625, "epoch": 5585} {"train_loss": -27.058019638061523, "global_step": 463626, "epoch": 5585} {"train_loss": -27.0700740814209, "global_step": 463627, "epoch": 5585} {"train_loss": -27.322219848632812, "global_step": 463628, "epoch": 5585} {"train_loss": -27.44782829284668, "global_step": 463629, "epoch": 5585} {"train_loss": -27.256803512573242, "global_step": 463630, "epoch": 5585} {"train_loss": -26.677404403686523, "global_step": 463631, "epoch": 5585} {"train_loss": -26.823902130126953, "global_step": 463632, "epoch": 5585} {"train_loss": -25.99164390563965, "global_step": 463633, "epoch": 5585} {"train_loss": -26.422443389892578, "global_step": 463634, "epoch": 5585} {"train_loss": -26.966964721679688, "global_step": 463635, "epoch": 5585} {"train_loss": -26.613666534423828, "global_step": 463636, "epoch": 5585} {"train_loss": -27.16415409869458, "global_step": 463637, "epoch": 5585, "val_loss": 6562684.0} {"train_loss": -25.587543487548828, "global_step": 463638, "epoch": 5586} {"train_loss": -26.167560577392578, "global_step": 463639, "epoch": 5586} {"train_loss": -25.530384063720703, "global_step": 463640, "epoch": 5586} {"train_loss": -26.164871215820312, "global_step": 463641, "epoch": 5586} {"train_loss": -26.62508201599121, "global_step": 463642, "epoch": 5586} {"train_loss": -26.164875030517578, "global_step": 463643, "epoch": 5586} {"train_loss": -26.279815673828125, "global_step": 463644, "epoch": 5586} {"train_loss": -26.262897491455078, "global_step": 463645, "epoch": 5586} {"train_loss": -26.139684677124023, "global_step": 463646, "epoch": 5586} {"train_loss": -26.985254287719727, "global_step": 463647, "epoch": 5586} {"train_loss": -26.387943267822266, "global_step": 463648, "epoch": 5586} {"train_loss": -26.96602439880371, "global_step": 463649, "epoch": 5586} {"train_loss": -26.35323143005371, "global_step": 463650, "epoch": 5586} {"train_loss": -26.742401123046875, "global_step": 463651, "epoch": 5586} {"train_loss": -26.594757080078125, "global_step": 463652, "epoch": 5586} {"train_loss": -26.88865089416504, "global_step": 463653, "epoch": 5586} {"train_loss": -26.641483306884766, "global_step": 463654, "epoch": 5586} {"train_loss": -26.261322021484375, "global_step": 463655, "epoch": 5586} {"train_loss": -26.29835319519043, "global_step": 463656, "epoch": 5586} {"train_loss": -26.8067684173584, "global_step": 463657, "epoch": 5586} {"train_loss": -26.9560546875, "global_step": 463658, "epoch": 5586} {"train_loss": -26.771535873413086, "global_step": 463659, "epoch": 5586} {"train_loss": -26.74456214904785, "global_step": 463660, "epoch": 5586} {"train_loss": -26.60650062561035, "global_step": 463661, "epoch": 5586} {"train_loss": -27.036712646484375, "global_step": 463662, "epoch": 5586} {"train_loss": -26.714853286743164, "global_step": 463663, "epoch": 5586} {"train_loss": -26.791486740112305, "global_step": 463664, "epoch": 5586} {"train_loss": -26.950510025024414, "global_step": 463665, "epoch": 5586} {"train_loss": -27.049291610717773, "global_step": 463666, "epoch": 5586} {"train_loss": -26.896472930908203, "global_step": 463667, "epoch": 5586} {"train_loss": -26.887741088867188, "global_step": 463668, "epoch": 5586} {"train_loss": -27.176069259643555, "global_step": 463669, "epoch": 5586} {"train_loss": -27.089670181274414, "global_step": 463670, "epoch": 5586} {"train_loss": -26.66558265686035, "global_step": 463671, "epoch": 5586} {"train_loss": -26.777175903320312, "global_step": 463672, "epoch": 5586} {"train_loss": -27.347211837768555, "global_step": 463673, "epoch": 5586} {"train_loss": -27.326215744018555, "global_step": 463674, "epoch": 5586} {"train_loss": -26.688201904296875, "global_step": 463675, "epoch": 5586} {"train_loss": -27.241193771362305, "global_step": 463676, "epoch": 5586} {"train_loss": -26.668188095092773, "global_step": 463677, "epoch": 5586} {"train_loss": -26.947845458984375, "global_step": 463678, "epoch": 5586} {"train_loss": -27.49039077758789, "global_step": 463679, "epoch": 5586} {"train_loss": -27.402212142944336, "global_step": 463680, "epoch": 5586} {"train_loss": -27.232852935791016, "global_step": 463681, "epoch": 5586} {"train_loss": -27.216760635375977, "global_step": 463682, "epoch": 5586} {"train_loss": -27.075742721557617, "global_step": 463683, "epoch": 5586} {"train_loss": -27.381681442260742, "global_step": 463684, "epoch": 5586} {"train_loss": -26.996862411499023, "global_step": 463685, "epoch": 5586} {"train_loss": -27.44257164001465, "global_step": 463686, "epoch": 5586} {"train_loss": -27.096227645874023, "global_step": 463687, "epoch": 5586} {"train_loss": -27.561620712280273, "global_step": 463688, "epoch": 5586} {"train_loss": -27.5241756439209, "global_step": 463689, "epoch": 5586} {"train_loss": -27.196746826171875, "global_step": 463690, "epoch": 5586} {"train_loss": -27.422163009643555, "global_step": 463691, "epoch": 5586} {"train_loss": -27.231801986694336, "global_step": 463692, "epoch": 5586} {"train_loss": -27.03937339782715, "global_step": 463693, "epoch": 5586} {"train_loss": -27.053308486938477, "global_step": 463694, "epoch": 5586} {"train_loss": -27.50178337097168, "global_step": 463695, "epoch": 5586} {"train_loss": -27.150196075439453, "global_step": 463696, "epoch": 5586} {"train_loss": -27.289052963256836, "global_step": 463697, "epoch": 5586} {"train_loss": -27.24586296081543, "global_step": 463698, "epoch": 5586} {"train_loss": -27.2874698638916, "global_step": 463699, "epoch": 5586} {"train_loss": -27.409244537353516, "global_step": 463700, "epoch": 5586} {"train_loss": -27.61359977722168, "global_step": 463701, "epoch": 5586} {"train_loss": -27.04135513305664, "global_step": 463702, "epoch": 5586} {"train_loss": -26.600873947143555, "global_step": 463703, "epoch": 5586} {"train_loss": -26.94034767150879, "global_step": 463704, "epoch": 5586} {"train_loss": -26.248493194580078, "global_step": 463705, "epoch": 5586} {"train_loss": -25.723474502563477, "global_step": 463706, "epoch": 5586} {"train_loss": -26.404346466064453, "global_step": 463707, "epoch": 5586} {"train_loss": -26.781797409057617, "global_step": 463708, "epoch": 5586} {"train_loss": -26.264694213867188, "global_step": 463709, "epoch": 5586} {"train_loss": -26.270618438720703, "global_step": 463710, "epoch": 5586} {"train_loss": -26.501205444335938, "global_step": 463711, "epoch": 5586} {"train_loss": -26.559600830078125, "global_step": 463712, "epoch": 5586} {"train_loss": -26.152175903320312, "global_step": 463713, "epoch": 5586} {"train_loss": -26.946491241455078, "global_step": 463714, "epoch": 5586} {"train_loss": -26.077463150024414, "global_step": 463715, "epoch": 5586} {"train_loss": -26.623533248901367, "global_step": 463716, "epoch": 5586} {"train_loss": -26.594831466674805, "global_step": 463717, "epoch": 5586} {"train_loss": -26.40619468688965, "global_step": 463718, "epoch": 5586} {"train_loss": -26.551349639892578, "global_step": 463719, "epoch": 5586} {"train_loss": -26.822285778551215, "global_step": 463720, "epoch": 5586, "val_loss": 6487775.5} {"train_loss": -25.372976303100586, "global_step": 463721, "epoch": 5587} {"train_loss": -25.96968650817871, "global_step": 463722, "epoch": 5587} {"train_loss": -26.51519203186035, "global_step": 463723, "epoch": 5587} {"train_loss": -25.904333114624023, "global_step": 463724, "epoch": 5587} {"train_loss": -25.651493072509766, "global_step": 463725, "epoch": 5587} {"train_loss": -26.495960235595703, "global_step": 463726, "epoch": 5587} {"train_loss": -26.314050674438477, "global_step": 463727, "epoch": 5587} {"train_loss": -26.219873428344727, "global_step": 463728, "epoch": 5587} {"train_loss": -26.775955200195312, "global_step": 463729, "epoch": 5587} {"train_loss": -26.164936065673828, "global_step": 463730, "epoch": 5587} {"train_loss": -26.51327896118164, "global_step": 463731, "epoch": 5587} {"train_loss": -26.72222900390625, "global_step": 463732, "epoch": 5587} {"train_loss": -26.355731964111328, "global_step": 463733, "epoch": 5587} {"train_loss": -26.5856990814209, "global_step": 463734, "epoch": 5587} {"train_loss": -26.7164306640625, "global_step": 463735, "epoch": 5587} {"train_loss": -26.556055068969727, "global_step": 463736, "epoch": 5587} {"train_loss": -26.361743927001953, "global_step": 463737, "epoch": 5587} {"train_loss": -26.196950912475586, "global_step": 463738, "epoch": 5587} {"train_loss": -26.483173370361328, "global_step": 463739, "epoch": 5587} {"train_loss": -26.741199493408203, "global_step": 463740, "epoch": 5587} {"train_loss": -26.90647315979004, "global_step": 463741, "epoch": 5587} {"train_loss": -26.673093795776367, "global_step": 463742, "epoch": 5587} {"train_loss": -26.252914428710938, "global_step": 463743, "epoch": 5587} {"train_loss": -26.286951065063477, "global_step": 463744, "epoch": 5587} {"train_loss": -26.86931800842285, "global_step": 463745, "epoch": 5587} {"train_loss": -26.93949317932129, "global_step": 463746, "epoch": 5587} {"train_loss": -26.752782821655273, "global_step": 463747, "epoch": 5587} {"train_loss": -26.775861740112305, "global_step": 463748, "epoch": 5587} {"train_loss": -27.015451431274414, "global_step": 463749, "epoch": 5587} {"train_loss": -27.317047119140625, "global_step": 463750, "epoch": 5587} {"train_loss": -26.42477798461914, "global_step": 463751, "epoch": 5587} {"train_loss": -27.197998046875, "global_step": 463752, "epoch": 5587} {"train_loss": -27.204090118408203, "global_step": 463753, "epoch": 5587} {"train_loss": -26.9180965423584, "global_step": 463754, "epoch": 5587} {"train_loss": -27.06744956970215, "global_step": 463755, "epoch": 5587} {"train_loss": -27.045730590820312, "global_step": 463756, "epoch": 5587} {"train_loss": -27.184173583984375, "global_step": 463757, "epoch": 5587} {"train_loss": -26.92233657836914, "global_step": 463758, "epoch": 5587} {"train_loss": -26.579391479492188, "global_step": 463759, "epoch": 5587} {"train_loss": -27.315160751342773, "global_step": 463760, "epoch": 5587} {"train_loss": -26.7716121673584, "global_step": 463761, "epoch": 5587} {"train_loss": -27.281494140625, "global_step": 463762, "epoch": 5587} {"train_loss": -27.360456466674805, "global_step": 463763, "epoch": 5587} {"train_loss": -27.2864990234375, "global_step": 463764, "epoch": 5587} {"train_loss": -27.3557071685791, "global_step": 463765, "epoch": 5587} {"train_loss": -27.13239097595215, "global_step": 463766, "epoch": 5587} {"train_loss": -27.458227157592773, "global_step": 463767, "epoch": 5587} {"train_loss": -27.178308486938477, "global_step": 463768, "epoch": 5587} {"train_loss": -27.248559951782227, "global_step": 463769, "epoch": 5587} {"train_loss": -26.714155197143555, "global_step": 463770, "epoch": 5587} {"train_loss": -26.90886878967285, "global_step": 463771, "epoch": 5587} {"train_loss": -26.141027450561523, "global_step": 463772, "epoch": 5587} {"train_loss": -25.625411987304688, "global_step": 463773, "epoch": 5587} {"train_loss": -26.427587509155273, "global_step": 463774, "epoch": 5587} {"train_loss": -27.351789474487305, "global_step": 463775, "epoch": 5587} {"train_loss": -26.46296501159668, "global_step": 463776, "epoch": 5587} {"train_loss": -27.027936935424805, "global_step": 463777, "epoch": 5587} {"train_loss": -26.97802734375, "global_step": 463778, "epoch": 5587} {"train_loss": -26.98003578186035, "global_step": 463779, "epoch": 5587} {"train_loss": -26.547388076782227, "global_step": 463780, "epoch": 5587} {"train_loss": -27.06327247619629, "global_step": 463781, "epoch": 5587} {"train_loss": -26.999542236328125, "global_step": 463782, "epoch": 5587} {"train_loss": -26.997220993041992, "global_step": 463783, "epoch": 5587} {"train_loss": -27.08430290222168, "global_step": 463784, "epoch": 5587} {"train_loss": -26.89774513244629, "global_step": 463785, "epoch": 5587} {"train_loss": -26.73805809020996, "global_step": 463786, "epoch": 5587} {"train_loss": -27.239171981811523, "global_step": 463787, "epoch": 5587} {"train_loss": -26.969446182250977, "global_step": 463788, "epoch": 5587} {"train_loss": -26.783863067626953, "global_step": 463789, "epoch": 5587} {"train_loss": -26.89385986328125, "global_step": 463790, "epoch": 5587} {"train_loss": -26.764673233032227, "global_step": 463791, "epoch": 5587} {"train_loss": -27.271270751953125, "global_step": 463792, "epoch": 5587} {"train_loss": -27.10618019104004, "global_step": 463793, "epoch": 5587} {"train_loss": -27.20596694946289, "global_step": 463794, "epoch": 5587} {"train_loss": -27.325475692749023, "global_step": 463795, "epoch": 5587} {"train_loss": -27.0611515045166, "global_step": 463796, "epoch": 5587} {"train_loss": -27.429534912109375, "global_step": 463797, "epoch": 5587} {"train_loss": -26.958087921142578, "global_step": 463798, "epoch": 5587} {"train_loss": -27.307722091674805, "global_step": 463799, "epoch": 5587} {"train_loss": -27.14948844909668, "global_step": 463800, "epoch": 5587} {"train_loss": -26.825061798095703, "global_step": 463801, "epoch": 5587} {"train_loss": -27.49030113220215, "global_step": 463802, "epoch": 5587} {"train_loss": -26.826193154576313, "global_step": 463803, "epoch": 5587, "val_loss": 6554516.0} {"train_loss": -27.02264404296875, "global_step": 463804, "epoch": 5588} {"train_loss": -26.93021011352539, "global_step": 463805, "epoch": 5588} {"train_loss": -26.61284828186035, "global_step": 463806, "epoch": 5588} {"train_loss": -26.69525146484375, "global_step": 463807, "epoch": 5588} {"train_loss": -26.76954460144043, "global_step": 463808, "epoch": 5588} {"train_loss": -26.647418975830078, "global_step": 463809, "epoch": 5588} {"train_loss": -26.92658805847168, "global_step": 463810, "epoch": 5588} {"train_loss": -27.207590103149414, "global_step": 463811, "epoch": 5588} {"train_loss": -27.00343132019043, "global_step": 463812, "epoch": 5588} {"train_loss": -27.22150230407715, "global_step": 463813, "epoch": 5588} {"train_loss": -27.728153228759766, "global_step": 463814, "epoch": 5588} {"train_loss": -27.3397159576416, "global_step": 463815, "epoch": 5588} {"train_loss": -26.886335372924805, "global_step": 463816, "epoch": 5588} {"train_loss": -27.303119659423828, "global_step": 463817, "epoch": 5588} {"train_loss": -27.282262802124023, "global_step": 463818, "epoch": 5588} {"train_loss": -27.10468101501465, "global_step": 463819, "epoch": 5588} {"train_loss": -26.861865997314453, "global_step": 463820, "epoch": 5588} {"train_loss": -27.152196884155273, "global_step": 463821, "epoch": 5588} {"train_loss": -27.1177978515625, "global_step": 463822, "epoch": 5588} {"train_loss": -27.508071899414062, "global_step": 463823, "epoch": 5588} {"train_loss": -27.1002197265625, "global_step": 463824, "epoch": 5588} {"train_loss": -27.570215225219727, "global_step": 463825, "epoch": 5588} {"train_loss": -27.061670303344727, "global_step": 463826, "epoch": 5588} {"train_loss": -26.954648971557617, "global_step": 463827, "epoch": 5588} {"train_loss": -27.45220375061035, "global_step": 463828, "epoch": 5588} {"train_loss": -27.14179801940918, "global_step": 463829, "epoch": 5588} {"train_loss": -26.89349937438965, "global_step": 463830, "epoch": 5588} {"train_loss": -26.918725967407227, "global_step": 463831, "epoch": 5588} {"train_loss": -27.13177490234375, "global_step": 463832, "epoch": 5588} {"train_loss": -26.7130069732666, "global_step": 463833, "epoch": 5588} {"train_loss": -26.951068878173828, "global_step": 463834, "epoch": 5588} {"train_loss": -27.160877227783203, "global_step": 463835, "epoch": 5588} {"train_loss": -26.987192153930664, "global_step": 463836, "epoch": 5588} {"train_loss": -26.973901748657227, "global_step": 463837, "epoch": 5588} {"train_loss": -27.23373794555664, "global_step": 463838, "epoch": 5588} {"train_loss": -27.31625747680664, "global_step": 463839, "epoch": 5588} {"train_loss": -27.12885093688965, "global_step": 463840, "epoch": 5588} {"train_loss": -27.328100204467773, "global_step": 463841, "epoch": 5588} {"train_loss": -27.208526611328125, "global_step": 463842, "epoch": 5588} {"train_loss": -27.247501373291016, "global_step": 463843, "epoch": 5588} {"train_loss": -26.977502822875977, "global_step": 463844, "epoch": 5588} {"train_loss": -27.277301788330078, "global_step": 463845, "epoch": 5588} {"train_loss": -26.967737197875977, "global_step": 463846, "epoch": 5588} {"train_loss": -27.197589874267578, "global_step": 463847, "epoch": 5588} {"train_loss": -26.747058868408203, "global_step": 463848, "epoch": 5588} {"train_loss": -27.47682762145996, "global_step": 463849, "epoch": 5588} {"train_loss": -27.027677536010742, "global_step": 463850, "epoch": 5588} {"train_loss": -27.500295639038086, "global_step": 463851, "epoch": 5588} {"train_loss": -27.367345809936523, "global_step": 463852, "epoch": 5588} {"train_loss": -27.33677101135254, "global_step": 463853, "epoch": 5588} {"train_loss": -27.309253692626953, "global_step": 463854, "epoch": 5588} {"train_loss": -27.188756942749023, "global_step": 463855, "epoch": 5588} {"train_loss": -27.170368194580078, "global_step": 463856, "epoch": 5588} {"train_loss": -27.07574462890625, "global_step": 463857, "epoch": 5588} {"train_loss": -26.907312393188477, "global_step": 463858, "epoch": 5588} {"train_loss": -27.166793823242188, "global_step": 463859, "epoch": 5588} {"train_loss": -27.003528594970703, "global_step": 463860, "epoch": 5588} {"train_loss": -27.21441650390625, "global_step": 463861, "epoch": 5588} {"train_loss": -27.422855377197266, "global_step": 463862, "epoch": 5588} {"train_loss": -26.865930557250977, "global_step": 463863, "epoch": 5588} {"train_loss": -27.46869468688965, "global_step": 463864, "epoch": 5588} {"train_loss": -26.867868423461914, "global_step": 463865, "epoch": 5588} {"train_loss": -26.616357803344727, "global_step": 463866, "epoch": 5588} {"train_loss": -26.562458038330078, "global_step": 463867, "epoch": 5588} {"train_loss": -27.169788360595703, "global_step": 463868, "epoch": 5588} {"train_loss": -26.990814208984375, "global_step": 463869, "epoch": 5588} {"train_loss": -27.030786514282227, "global_step": 463870, "epoch": 5588} {"train_loss": -27.17597007751465, "global_step": 463871, "epoch": 5588} {"train_loss": -27.04477882385254, "global_step": 463872, "epoch": 5588} {"train_loss": -27.02567481994629, "global_step": 463873, "epoch": 5588} {"train_loss": -27.226438522338867, "global_step": 463874, "epoch": 5588} {"train_loss": -26.896936416625977, "global_step": 463875, "epoch": 5588} {"train_loss": -26.989408493041992, "global_step": 463876, "epoch": 5588} {"train_loss": -26.85770034790039, "global_step": 463877, "epoch": 5588} {"train_loss": -26.631641387939453, "global_step": 463878, "epoch": 5588} {"train_loss": -26.813074111938477, "global_step": 463879, "epoch": 5588} {"train_loss": -26.710580825805664, "global_step": 463880, "epoch": 5588} {"train_loss": -26.753326416015625, "global_step": 463881, "epoch": 5588} {"train_loss": -26.6545352935791, "global_step": 463882, "epoch": 5588} {"train_loss": -26.743322372436523, "global_step": 463883, "epoch": 5588} {"train_loss": -26.847436904907227, "global_step": 463884, "epoch": 5588} {"train_loss": -26.752277374267578, "global_step": 463885, "epoch": 5588} {"train_loss": -27.063208890248493, "global_step": 463886, "epoch": 5588, "val_loss": 6581953.0} {"train_loss": -26.19379234313965, "global_step": 463887, "epoch": 5589} {"train_loss": -26.360980987548828, "global_step": 463888, "epoch": 5589} {"train_loss": -26.67327880859375, "global_step": 463889, "epoch": 5589} {"train_loss": -26.8100643157959, "global_step": 463890, "epoch": 5589} {"train_loss": -26.381824493408203, "global_step": 463891, "epoch": 5589} {"train_loss": -26.426259994506836, "global_step": 463892, "epoch": 5589} {"train_loss": -26.68505859375, "global_step": 463893, "epoch": 5589} {"train_loss": -26.20794677734375, "global_step": 463894, "epoch": 5589} {"train_loss": -26.672887802124023, "global_step": 463895, "epoch": 5589} {"train_loss": -26.20941734313965, "global_step": 463896, "epoch": 5589} {"train_loss": -26.602127075195312, "global_step": 463897, "epoch": 5589} {"train_loss": -26.23786735534668, "global_step": 463898, "epoch": 5589} {"train_loss": -26.204559326171875, "global_step": 463899, "epoch": 5589} {"train_loss": -26.72577476501465, "global_step": 463900, "epoch": 5589} {"train_loss": -26.782621383666992, "global_step": 463901, "epoch": 5589} {"train_loss": -26.619953155517578, "global_step": 463902, "epoch": 5589} {"train_loss": -26.543472290039062, "global_step": 463903, "epoch": 5589} {"train_loss": -26.88614845275879, "global_step": 463904, "epoch": 5589} {"train_loss": -26.7702693939209, "global_step": 463905, "epoch": 5589} {"train_loss": -26.551258087158203, "global_step": 463906, "epoch": 5589} {"train_loss": -26.753660202026367, "global_step": 463907, "epoch": 5589} {"train_loss": -26.746662139892578, "global_step": 463908, "epoch": 5589} {"train_loss": -26.9215030670166, "global_step": 463909, "epoch": 5589} {"train_loss": -26.86004638671875, "global_step": 463910, "epoch": 5589} {"train_loss": -27.060022354125977, "global_step": 463911, "epoch": 5589} {"train_loss": -26.826099395751953, "global_step": 463912, "epoch": 5589} {"train_loss": -27.322118759155273, "global_step": 463913, "epoch": 5589} {"train_loss": -27.13580322265625, "global_step": 463914, "epoch": 5589} {"train_loss": -27.0382022857666, "global_step": 463915, "epoch": 5589} {"train_loss": -26.959686279296875, "global_step": 463916, "epoch": 5589} {"train_loss": -26.657917022705078, "global_step": 463917, "epoch": 5589} {"train_loss": -27.24769401550293, "global_step": 463918, "epoch": 5589} {"train_loss": -27.203832626342773, "global_step": 463919, "epoch": 5589} {"train_loss": -27.011709213256836, "global_step": 463920, "epoch": 5589} {"train_loss": -27.247303009033203, "global_step": 463921, "epoch": 5589} {"train_loss": -27.10112953186035, "global_step": 463922, "epoch": 5589} {"train_loss": -27.008909225463867, "global_step": 463923, "epoch": 5589} {"train_loss": -27.17206382751465, "global_step": 463924, "epoch": 5589} {"train_loss": -27.173315048217773, "global_step": 463925, "epoch": 5589} {"train_loss": -27.17181968688965, "global_step": 463926, "epoch": 5589} {"train_loss": -26.897733688354492, "global_step": 463927, "epoch": 5589} {"train_loss": -27.27094841003418, "global_step": 463928, "epoch": 5589} {"train_loss": -27.61203956604004, "global_step": 463929, "epoch": 5589} {"train_loss": -27.343175888061523, "global_step": 463930, "epoch": 5589} {"train_loss": -27.413040161132812, "global_step": 463931, "epoch": 5589} {"train_loss": -27.667509078979492, "global_step": 463932, "epoch": 5589} {"train_loss": -27.082014083862305, "global_step": 463933, "epoch": 5589} {"train_loss": -27.23074722290039, "global_step": 463934, "epoch": 5589} {"train_loss": -27.24163818359375, "global_step": 463935, "epoch": 5589} {"train_loss": -27.043630599975586, "global_step": 463936, "epoch": 5589} {"train_loss": -27.312849044799805, "global_step": 463937, "epoch": 5589} {"train_loss": -27.079456329345703, "global_step": 463938, "epoch": 5589} {"train_loss": -27.328149795532227, "global_step": 463939, "epoch": 5589} {"train_loss": -27.4040470123291, "global_step": 463940, "epoch": 5589} {"train_loss": -27.453882217407227, "global_step": 463941, "epoch": 5589} {"train_loss": -26.901748657226562, "global_step": 463942, "epoch": 5589} {"train_loss": -26.810977935791016, "global_step": 463943, "epoch": 5589} {"train_loss": -27.047399520874023, "global_step": 463944, "epoch": 5589} {"train_loss": -27.33527183532715, "global_step": 463945, "epoch": 5589} {"train_loss": -26.78583335876465, "global_step": 463946, "epoch": 5589} {"train_loss": -27.228076934814453, "global_step": 463947, "epoch": 5589} {"train_loss": -27.17722511291504, "global_step": 463948, "epoch": 5589} {"train_loss": -27.34457778930664, "global_step": 463949, "epoch": 5589} {"train_loss": -26.94158363342285, "global_step": 463950, "epoch": 5589} {"train_loss": -26.943387985229492, "global_step": 463951, "epoch": 5589} {"train_loss": -27.20879554748535, "global_step": 463952, "epoch": 5589} {"train_loss": -27.065536499023438, "global_step": 463953, "epoch": 5589} {"train_loss": -26.9800968170166, "global_step": 463954, "epoch": 5589} {"train_loss": -27.097074508666992, "global_step": 463955, "epoch": 5589} {"train_loss": -26.777807235717773, "global_step": 463956, "epoch": 5589} {"train_loss": -26.490812301635742, "global_step": 463957, "epoch": 5589} {"train_loss": -26.78717613220215, "global_step": 463958, "epoch": 5589} {"train_loss": -26.886478424072266, "global_step": 463959, "epoch": 5589} {"train_loss": -26.70526123046875, "global_step": 463960, "epoch": 5589} {"train_loss": -27.367618560791016, "global_step": 463961, "epoch": 5589} {"train_loss": -26.831785202026367, "global_step": 463962, "epoch": 5589} {"train_loss": -27.10170555114746, "global_step": 463963, "epoch": 5589} {"train_loss": -27.0184383392334, "global_step": 463964, "epoch": 5589} {"train_loss": -27.447158813476562, "global_step": 463965, "epoch": 5589} {"train_loss": -27.265869140625, "global_step": 463966, "epoch": 5589} {"train_loss": -27.079553604125977, "global_step": 463967, "epoch": 5589} {"train_loss": -27.11189079284668, "global_step": 463968, "epoch": 5589} {"train_loss": -26.96102135439953, "global_step": 463969, "epoch": 5589, "val_loss": 6552890.0} {"train_loss": -23.285507202148438, "global_step": 463970, "epoch": 5590} {"train_loss": -22.096166610717773, "global_step": 463971, "epoch": 5590} {"train_loss": -24.976346969604492, "global_step": 463972, "epoch": 5590} {"train_loss": -25.243915557861328, "global_step": 463973, "epoch": 5590} {"train_loss": -24.393596649169922, "global_step": 463974, "epoch": 5590} {"train_loss": -26.188512802124023, "global_step": 463975, "epoch": 5590} {"train_loss": -25.39470863342285, "global_step": 463976, "epoch": 5590} {"train_loss": -25.9776554107666, "global_step": 463977, "epoch": 5590} {"train_loss": -25.325428009033203, "global_step": 463978, "epoch": 5590} {"train_loss": -26.366302490234375, "global_step": 463979, "epoch": 5590} {"train_loss": -25.76214027404785, "global_step": 463980, "epoch": 5590} {"train_loss": -25.67276954650879, "global_step": 463981, "epoch": 5590} {"train_loss": -26.478857040405273, "global_step": 463982, "epoch": 5590} {"train_loss": -26.037511825561523, "global_step": 463983, "epoch": 5590} {"train_loss": -25.70941162109375, "global_step": 463984, "epoch": 5590} {"train_loss": -26.167577743530273, "global_step": 463985, "epoch": 5590} {"train_loss": -26.076190948486328, "global_step": 463986, "epoch": 5590} {"train_loss": -26.02498435974121, "global_step": 463987, "epoch": 5590} {"train_loss": -26.48233985900879, "global_step": 463988, "epoch": 5590} {"train_loss": -26.02157974243164, "global_step": 463989, "epoch": 5590} {"train_loss": -26.290021896362305, "global_step": 463990, "epoch": 5590} {"train_loss": -26.401721954345703, "global_step": 463991, "epoch": 5590} {"train_loss": -26.421316146850586, "global_step": 463992, "epoch": 5590} {"train_loss": -26.488800048828125, "global_step": 463993, "epoch": 5590} {"train_loss": -26.525165557861328, "global_step": 463994, "epoch": 5590} {"train_loss": -26.33473014831543, "global_step": 463995, "epoch": 5590} {"train_loss": -26.634723663330078, "global_step": 463996, "epoch": 5590} {"train_loss": -26.30971336364746, "global_step": 463997, "epoch": 5590} {"train_loss": -26.178312301635742, "global_step": 463998, "epoch": 5590} {"train_loss": -27.22064781188965, "global_step": 463999, "epoch": 5590} {"train_loss": -26.408788681030273, "global_step": 464000, "epoch": 5590} {"train_loss": -26.90513038635254, "global_step": 464001, "epoch": 5590} {"train_loss": -26.64803123474121, "global_step": 464002, "epoch": 5590} {"train_loss": -27.039291381835938, "global_step": 464003, "epoch": 5590} {"train_loss": -26.648208618164062, "global_step": 464004, "epoch": 5590} {"train_loss": -26.997594833374023, "global_step": 464005, "epoch": 5590} {"train_loss": -26.565786361694336, "global_step": 464006, "epoch": 5590} {"train_loss": -26.961109161376953, "global_step": 464007, "epoch": 5590} {"train_loss": -26.977258682250977, "global_step": 464008, "epoch": 5590} {"train_loss": -26.831073760986328, "global_step": 464009, "epoch": 5590} {"train_loss": -27.3121337890625, "global_step": 464010, "epoch": 5590} {"train_loss": -26.70932960510254, "global_step": 464011, "epoch": 5590} {"train_loss": -27.07370948791504, "global_step": 464012, "epoch": 5590} {"train_loss": -27.27998161315918, "global_step": 464013, "epoch": 5590} {"train_loss": -27.289228439331055, "global_step": 464014, "epoch": 5590} {"train_loss": -26.979177474975586, "global_step": 464015, "epoch": 5590} {"train_loss": -27.214252471923828, "global_step": 464016, "epoch": 5590} {"train_loss": -27.0368595123291, "global_step": 464017, "epoch": 5590} {"train_loss": -27.155195236206055, "global_step": 464018, "epoch": 5590} {"train_loss": -27.01678466796875, "global_step": 464019, "epoch": 5590} {"train_loss": -27.39044761657715, "global_step": 464020, "epoch": 5590} {"train_loss": -26.799673080444336, "global_step": 464021, "epoch": 5590} {"train_loss": -27.524988174438477, "global_step": 464022, "epoch": 5590} {"train_loss": -26.91316032409668, "global_step": 464023, "epoch": 5590} {"train_loss": -27.739490509033203, "global_step": 464024, "epoch": 5590} {"train_loss": -27.08574867248535, "global_step": 464025, "epoch": 5590} {"train_loss": -27.39043617248535, "global_step": 464026, "epoch": 5590} {"train_loss": -26.945911407470703, "global_step": 464027, "epoch": 5590} {"train_loss": -27.441564559936523, "global_step": 464028, "epoch": 5590} {"train_loss": -27.489233016967773, "global_step": 464029, "epoch": 5590} {"train_loss": -27.429859161376953, "global_step": 464030, "epoch": 5590} {"train_loss": -27.281286239624023, "global_step": 464031, "epoch": 5590} {"train_loss": -27.09231948852539, "global_step": 464032, "epoch": 5590} {"train_loss": -27.459020614624023, "global_step": 464033, "epoch": 5590} {"train_loss": -27.367780685424805, "global_step": 464034, "epoch": 5590} {"train_loss": -26.94630241394043, "global_step": 464035, "epoch": 5590} {"train_loss": -27.07499122619629, "global_step": 464036, "epoch": 5590} {"train_loss": -26.69001579284668, "global_step": 464037, "epoch": 5590} {"train_loss": -27.378870010375977, "global_step": 464038, "epoch": 5590} {"train_loss": -27.472143173217773, "global_step": 464039, "epoch": 5590} {"train_loss": -26.781213760375977, "global_step": 464040, "epoch": 5590} {"train_loss": -26.977807998657227, "global_step": 464041, "epoch": 5590} {"train_loss": -27.3885440826416, "global_step": 464042, "epoch": 5590} {"train_loss": -27.099613189697266, "global_step": 464043, "epoch": 5590} {"train_loss": -27.4373836517334, "global_step": 464044, "epoch": 5590} {"train_loss": -27.157958984375, "global_step": 464045, "epoch": 5590} {"train_loss": -26.862552642822266, "global_step": 464046, "epoch": 5590} {"train_loss": -26.77016258239746, "global_step": 464047, "epoch": 5590} {"train_loss": -26.95979881286621, "global_step": 464048, "epoch": 5590} {"train_loss": -27.456745147705078, "global_step": 464049, "epoch": 5590} {"train_loss": -27.39760398864746, "global_step": 464050, "epoch": 5590} {"train_loss": -27.157629013061523, "global_step": 464051, "epoch": 5590} {"train_loss": -26.626712040728833, "global_step": 464052, "epoch": 5590, "val_loss": 6686642.0} {"train_loss": -26.4708194732666, "global_step": 464053, "epoch": 5591} {"train_loss": -26.49213218688965, "global_step": 464054, "epoch": 5591} {"train_loss": -26.957712173461914, "global_step": 464055, "epoch": 5591} {"train_loss": -26.81084632873535, "global_step": 464056, "epoch": 5591} {"train_loss": -26.580158233642578, "global_step": 464057, "epoch": 5591} {"train_loss": -26.66046142578125, "global_step": 464058, "epoch": 5591} {"train_loss": -26.77301597595215, "global_step": 464059, "epoch": 5591} {"train_loss": -26.90276527404785, "global_step": 464060, "epoch": 5591} {"train_loss": -26.743438720703125, "global_step": 464061, "epoch": 5591} {"train_loss": -26.66985511779785, "global_step": 464062, "epoch": 5591} {"train_loss": -26.533889770507812, "global_step": 464063, "epoch": 5591} {"train_loss": -26.581647872924805, "global_step": 464064, "epoch": 5591} {"train_loss": -26.843551635742188, "global_step": 464065, "epoch": 5591} {"train_loss": -26.493820190429688, "global_step": 464066, "epoch": 5591} {"train_loss": -26.512067794799805, "global_step": 464067, "epoch": 5591} {"train_loss": -27.27571678161621, "global_step": 464068, "epoch": 5591} {"train_loss": -26.836034774780273, "global_step": 464069, "epoch": 5591} {"train_loss": -27.00337028503418, "global_step": 464070, "epoch": 5591} {"train_loss": -26.830322265625, "global_step": 464071, "epoch": 5591} {"train_loss": -26.481836318969727, "global_step": 464072, "epoch": 5591} {"train_loss": -26.747207641601562, "global_step": 464073, "epoch": 5591} {"train_loss": -27.042280197143555, "global_step": 464074, "epoch": 5591} {"train_loss": -26.396554946899414, "global_step": 464075, "epoch": 5591} {"train_loss": -27.52474021911621, "global_step": 464076, "epoch": 5591} {"train_loss": -27.037134170532227, "global_step": 464077, "epoch": 5591} {"train_loss": -26.880512237548828, "global_step": 464078, "epoch": 5591} {"train_loss": -27.06243324279785, "global_step": 464079, "epoch": 5591} {"train_loss": -27.055988311767578, "global_step": 464080, "epoch": 5591} {"train_loss": -27.263004302978516, "global_step": 464081, "epoch": 5591} {"train_loss": -27.595783233642578, "global_step": 464082, "epoch": 5591} {"train_loss": -27.453577041625977, "global_step": 464083, "epoch": 5591} {"train_loss": -27.269006729125977, "global_step": 464084, "epoch": 5591} {"train_loss": -27.121915817260742, "global_step": 464085, "epoch": 5591} {"train_loss": -27.57354736328125, "global_step": 464086, "epoch": 5591} {"train_loss": -26.823867797851562, "global_step": 464087, "epoch": 5591} {"train_loss": -27.1627140045166, "global_step": 464088, "epoch": 5591} {"train_loss": -27.4559268951416, "global_step": 464089, "epoch": 5591} {"train_loss": -27.040664672851562, "global_step": 464090, "epoch": 5591} {"train_loss": -26.773847579956055, "global_step": 464091, "epoch": 5591} {"train_loss": -27.38812255859375, "global_step": 464092, "epoch": 5591} {"train_loss": -27.2138671875, "global_step": 464093, "epoch": 5591} {"train_loss": -27.373035430908203, "global_step": 464094, "epoch": 5591} {"train_loss": -27.177682876586914, "global_step": 464095, "epoch": 5591} {"train_loss": -27.060657501220703, "global_step": 464096, "epoch": 5591} {"train_loss": -26.961185455322266, "global_step": 464097, "epoch": 5591} {"train_loss": -27.07411766052246, "global_step": 464098, "epoch": 5591} {"train_loss": -27.31365394592285, "global_step": 464099, "epoch": 5591} {"train_loss": -27.3511962890625, "global_step": 464100, "epoch": 5591} {"train_loss": -27.2791690826416, "global_step": 464101, "epoch": 5591} {"train_loss": -27.47577476501465, "global_step": 464102, "epoch": 5591} {"train_loss": -26.976587295532227, "global_step": 464103, "epoch": 5591} {"train_loss": -27.210737228393555, "global_step": 464104, "epoch": 5591} {"train_loss": -27.214218139648438, "global_step": 464105, "epoch": 5591} {"train_loss": -27.049245834350586, "global_step": 464106, "epoch": 5591} {"train_loss": -27.10845375061035, "global_step": 464107, "epoch": 5591} {"train_loss": -27.44331169128418, "global_step": 464108, "epoch": 5591} {"train_loss": -26.96900749206543, "global_step": 464109, "epoch": 5591} {"train_loss": -27.19318962097168, "global_step": 464110, "epoch": 5591} {"train_loss": -27.23013687133789, "global_step": 464111, "epoch": 5591} {"train_loss": -27.152130126953125, "global_step": 464112, "epoch": 5591} {"train_loss": -27.201318740844727, "global_step": 464113, "epoch": 5591} {"train_loss": -27.051855087280273, "global_step": 464114, "epoch": 5591} {"train_loss": -27.0518741607666, "global_step": 464115, "epoch": 5591} {"train_loss": -27.321531295776367, "global_step": 464116, "epoch": 5591} {"train_loss": -27.493207931518555, "global_step": 464117, "epoch": 5591} {"train_loss": -27.226776123046875, "global_step": 464118, "epoch": 5591} {"train_loss": -27.344863891601562, "global_step": 464119, "epoch": 5591} {"train_loss": -27.066370010375977, "global_step": 464120, "epoch": 5591} {"train_loss": -27.253442764282227, "global_step": 464121, "epoch": 5591} {"train_loss": -27.543058395385742, "global_step": 464122, "epoch": 5591} {"train_loss": -27.048389434814453, "global_step": 464123, "epoch": 5591} {"train_loss": -27.445648193359375, "global_step": 464124, "epoch": 5591} {"train_loss": -27.139911651611328, "global_step": 464125, "epoch": 5591} {"train_loss": -27.26558494567871, "global_step": 464126, "epoch": 5591} {"train_loss": -27.371564865112305, "global_step": 464127, "epoch": 5591} {"train_loss": -27.198495864868164, "global_step": 464128, "epoch": 5591} {"train_loss": -27.387348175048828, "global_step": 464129, "epoch": 5591} {"train_loss": -27.15338706970215, "global_step": 464130, "epoch": 5591} {"train_loss": -27.32293128967285, "global_step": 464131, "epoch": 5591} {"train_loss": -26.91119384765625, "global_step": 464132, "epoch": 5591} {"train_loss": -27.31207275390625, "global_step": 464133, "epoch": 5591} {"train_loss": -27.13815689086914, "global_step": 464134, "epoch": 5591} {"train_loss": -27.08401852343456, "global_step": 464135, "epoch": 5591, "val_loss": 6641171.0} {"train_loss": -26.97980308532715, "global_step": 464136, "epoch": 5592} {"train_loss": -25.93303871154785, "global_step": 464137, "epoch": 5592} {"train_loss": -25.037137985229492, "global_step": 464138, "epoch": 5592} {"train_loss": -25.796598434448242, "global_step": 464139, "epoch": 5592} {"train_loss": -26.724761962890625, "global_step": 464140, "epoch": 5592} {"train_loss": -26.66910743713379, "global_step": 464141, "epoch": 5592} {"train_loss": -26.35987663269043, "global_step": 464142, "epoch": 5592} {"train_loss": -26.99509048461914, "global_step": 464143, "epoch": 5592} {"train_loss": -27.050384521484375, "global_step": 464144, "epoch": 5592} {"train_loss": -26.769550323486328, "global_step": 464145, "epoch": 5592} {"train_loss": -26.451200485229492, "global_step": 464146, "epoch": 5592} {"train_loss": -27.239572525024414, "global_step": 464147, "epoch": 5592} {"train_loss": -26.919675827026367, "global_step": 464148, "epoch": 5592} {"train_loss": -26.855274200439453, "global_step": 464149, "epoch": 5592} {"train_loss": -27.094465255737305, "global_step": 464150, "epoch": 5592} {"train_loss": -26.255273818969727, "global_step": 464151, "epoch": 5592} {"train_loss": -27.14093017578125, "global_step": 464152, "epoch": 5592} {"train_loss": -26.732421875, "global_step": 464153, "epoch": 5592} {"train_loss": -26.976104736328125, "global_step": 464154, "epoch": 5592} {"train_loss": -26.8674373626709, "global_step": 464155, "epoch": 5592} {"train_loss": -27.007125854492188, "global_step": 464156, "epoch": 5592} {"train_loss": -26.8732967376709, "global_step": 464157, "epoch": 5592} {"train_loss": -26.767292022705078, "global_step": 464158, "epoch": 5592} {"train_loss": -26.794464111328125, "global_step": 464159, "epoch": 5592} {"train_loss": -27.10112953186035, "global_step": 464160, "epoch": 5592} {"train_loss": -27.101903915405273, "global_step": 464161, "epoch": 5592} {"train_loss": -26.954946517944336, "global_step": 464162, "epoch": 5592} {"train_loss": -27.10333251953125, "global_step": 464163, "epoch": 5592} {"train_loss": -26.964929580688477, "global_step": 464164, "epoch": 5592} {"train_loss": -26.900054931640625, "global_step": 464165, "epoch": 5592} {"train_loss": -27.075178146362305, "global_step": 464166, "epoch": 5592} {"train_loss": -27.04075050354004, "global_step": 464167, "epoch": 5592} {"train_loss": -27.073413848876953, "global_step": 464168, "epoch": 5592} {"train_loss": -27.05756187438965, "global_step": 464169, "epoch": 5592} {"train_loss": -27.206897735595703, "global_step": 464170, "epoch": 5592} {"train_loss": -27.239171981811523, "global_step": 464171, "epoch": 5592} {"train_loss": -26.850086212158203, "global_step": 464172, "epoch": 5592} {"train_loss": -27.25823402404785, "global_step": 464173, "epoch": 5592} {"train_loss": -27.056549072265625, "global_step": 464174, "epoch": 5592} {"train_loss": -27.174585342407227, "global_step": 464175, "epoch": 5592} {"train_loss": -27.541532516479492, "global_step": 464176, "epoch": 5592} {"train_loss": -27.18535804748535, "global_step": 464177, "epoch": 5592} {"train_loss": -27.566797256469727, "global_step": 464178, "epoch": 5592} {"train_loss": -27.25941276550293, "global_step": 464179, "epoch": 5592} {"train_loss": -27.373279571533203, "global_step": 464180, "epoch": 5592} {"train_loss": -27.385345458984375, "global_step": 464181, "epoch": 5592} {"train_loss": -27.246734619140625, "global_step": 464182, "epoch": 5592} {"train_loss": -26.90755271911621, "global_step": 464183, "epoch": 5592} {"train_loss": -27.278034210205078, "global_step": 464184, "epoch": 5592} {"train_loss": -27.230945587158203, "global_step": 464185, "epoch": 5592} {"train_loss": -27.553543090820312, "global_step": 464186, "epoch": 5592} {"train_loss": -27.292163848876953, "global_step": 464187, "epoch": 5592} {"train_loss": -27.582473754882812, "global_step": 464188, "epoch": 5592} {"train_loss": -27.239398956298828, "global_step": 464189, "epoch": 5592} {"train_loss": -27.354766845703125, "global_step": 464190, "epoch": 5592} {"train_loss": -27.37750816345215, "global_step": 464191, "epoch": 5592} {"train_loss": -27.1788272857666, "global_step": 464192, "epoch": 5592} {"train_loss": -27.512542724609375, "global_step": 464193, "epoch": 5592} {"train_loss": -27.5026912689209, "global_step": 464194, "epoch": 5592} {"train_loss": -27.346302032470703, "global_step": 464195, "epoch": 5592} {"train_loss": -27.200788497924805, "global_step": 464196, "epoch": 5592} {"train_loss": -27.45002555847168, "global_step": 464197, "epoch": 5592} {"train_loss": -27.43735694885254, "global_step": 464198, "epoch": 5592} {"train_loss": -27.396474838256836, "global_step": 464199, "epoch": 5592} {"train_loss": -27.068296432495117, "global_step": 464200, "epoch": 5592} {"train_loss": -27.350311279296875, "global_step": 464201, "epoch": 5592} {"train_loss": -27.392053604125977, "global_step": 464202, "epoch": 5592} {"train_loss": -27.155542373657227, "global_step": 464203, "epoch": 5592} {"train_loss": -27.374740600585938, "global_step": 464204, "epoch": 5592} {"train_loss": -27.474380493164062, "global_step": 464205, "epoch": 5592} {"train_loss": -27.005537033081055, "global_step": 464206, "epoch": 5592} {"train_loss": -26.60630226135254, "global_step": 464207, "epoch": 5592} {"train_loss": -26.088682174682617, "global_step": 464208, "epoch": 5592} {"train_loss": -25.827356338500977, "global_step": 464209, "epoch": 5592} {"train_loss": -26.29029655456543, "global_step": 464210, "epoch": 5592} {"train_loss": -26.6217041015625, "global_step": 464211, "epoch": 5592} {"train_loss": -26.874860763549805, "global_step": 464212, "epoch": 5592} {"train_loss": -26.64289665222168, "global_step": 464213, "epoch": 5592} {"train_loss": -27.041919708251953, "global_step": 464214, "epoch": 5592} {"train_loss": -26.78374671936035, "global_step": 464215, "epoch": 5592} {"train_loss": -26.995532989501953, "global_step": 464216, "epoch": 5592} {"train_loss": -26.865381240844727, "global_step": 464217, "epoch": 5592} {"train_loss": -26.98069953918457, "global_step": 464218, "epoch": 5592, "val_loss": 6450072.0} {"train_loss": -26.797229766845703, "global_step": 464219, "epoch": 5593} {"train_loss": -26.516284942626953, "global_step": 464220, "epoch": 5593} {"train_loss": -25.921911239624023, "global_step": 464221, "epoch": 5593} {"train_loss": -26.7652530670166, "global_step": 464222, "epoch": 5593} {"train_loss": -26.056379318237305, "global_step": 464223, "epoch": 5593} {"train_loss": -26.247968673706055, "global_step": 464224, "epoch": 5593} {"train_loss": -26.680036544799805, "global_step": 464225, "epoch": 5593} {"train_loss": -26.42545509338379, "global_step": 464226, "epoch": 5593} {"train_loss": -26.42718505859375, "global_step": 464227, "epoch": 5593} {"train_loss": -26.986494064331055, "global_step": 464228, "epoch": 5593} {"train_loss": -26.77339744567871, "global_step": 464229, "epoch": 5593} {"train_loss": -26.8967227935791, "global_step": 464230, "epoch": 5593} {"train_loss": -26.64109230041504, "global_step": 464231, "epoch": 5593} {"train_loss": -26.42152214050293, "global_step": 464232, "epoch": 5593} {"train_loss": -26.547239303588867, "global_step": 464233, "epoch": 5593} {"train_loss": -26.809473037719727, "global_step": 464234, "epoch": 5593} {"train_loss": -26.935544967651367, "global_step": 464235, "epoch": 5593} {"train_loss": -26.738428115844727, "global_step": 464236, "epoch": 5593} {"train_loss": -26.789289474487305, "global_step": 464237, "epoch": 5593} {"train_loss": -27.007099151611328, "global_step": 464238, "epoch": 5593} {"train_loss": -27.116910934448242, "global_step": 464239, "epoch": 5593} {"train_loss": -27.1319637298584, "global_step": 464240, "epoch": 5593} {"train_loss": -26.72258949279785, "global_step": 464241, "epoch": 5593} {"train_loss": -27.050878524780273, "global_step": 464242, "epoch": 5593} {"train_loss": -26.91042137145996, "global_step": 464243, "epoch": 5593} {"train_loss": -27.07217788696289, "global_step": 464244, "epoch": 5593} {"train_loss": -26.543750762939453, "global_step": 464245, "epoch": 5593} {"train_loss": -27.01373863220215, "global_step": 464246, "epoch": 5593} {"train_loss": -26.915576934814453, "global_step": 464247, "epoch": 5593} {"train_loss": -27.018299102783203, "global_step": 464248, "epoch": 5593} {"train_loss": -27.205554962158203, "global_step": 464249, "epoch": 5593} {"train_loss": -26.898717880249023, "global_step": 464250, "epoch": 5593} {"train_loss": -26.865234375, "global_step": 464251, "epoch": 5593} {"train_loss": -27.092803955078125, "global_step": 464252, "epoch": 5593} {"train_loss": -26.731958389282227, "global_step": 464253, "epoch": 5593} {"train_loss": -27.010089874267578, "global_step": 464254, "epoch": 5593} {"train_loss": -27.270294189453125, "global_step": 464255, "epoch": 5593} {"train_loss": -26.90940284729004, "global_step": 464256, "epoch": 5593} {"train_loss": -27.399465560913086, "global_step": 464257, "epoch": 5593} {"train_loss": -27.234207153320312, "global_step": 464258, "epoch": 5593} {"train_loss": -27.37982177734375, "global_step": 464259, "epoch": 5593} {"train_loss": -27.097318649291992, "global_step": 464260, "epoch": 5593} {"train_loss": -27.12415885925293, "global_step": 464261, "epoch": 5593} {"train_loss": -27.25290298461914, "global_step": 464262, "epoch": 5593} {"train_loss": -27.132043838500977, "global_step": 464263, "epoch": 5593} {"train_loss": -27.43707847595215, "global_step": 464264, "epoch": 5593} {"train_loss": -27.401477813720703, "global_step": 464265, "epoch": 5593} {"train_loss": -27.139957427978516, "global_step": 464266, "epoch": 5593} {"train_loss": -27.090784072875977, "global_step": 464267, "epoch": 5593} {"train_loss": -27.168371200561523, "global_step": 464268, "epoch": 5593} {"train_loss": -27.23959732055664, "global_step": 464269, "epoch": 5593} {"train_loss": -27.537683486938477, "global_step": 464270, "epoch": 5593} {"train_loss": -26.971948623657227, "global_step": 464271, "epoch": 5593} {"train_loss": -27.166067123413086, "global_step": 464272, "epoch": 5593} {"train_loss": -27.10980796813965, "global_step": 464273, "epoch": 5593} {"train_loss": -27.09942626953125, "global_step": 464274, "epoch": 5593} {"train_loss": -27.392059326171875, "global_step": 464275, "epoch": 5593} {"train_loss": -26.855762481689453, "global_step": 464276, "epoch": 5593} {"train_loss": -27.084455490112305, "global_step": 464277, "epoch": 5593} {"train_loss": -26.688161849975586, "global_step": 464278, "epoch": 5593} {"train_loss": -27.085275650024414, "global_step": 464279, "epoch": 5593} {"train_loss": -27.20160484313965, "global_step": 464280, "epoch": 5593} {"train_loss": -27.073598861694336, "global_step": 464281, "epoch": 5593} {"train_loss": -26.670379638671875, "global_step": 464282, "epoch": 5593} {"train_loss": -27.120893478393555, "global_step": 464283, "epoch": 5593} {"train_loss": -26.930099487304688, "global_step": 464284, "epoch": 5593} {"train_loss": -27.264362335205078, "global_step": 464285, "epoch": 5593} {"train_loss": -27.177204132080078, "global_step": 464286, "epoch": 5593} {"train_loss": -26.907123565673828, "global_step": 464287, "epoch": 5593} {"train_loss": -27.03156089782715, "global_step": 464288, "epoch": 5593} {"train_loss": -26.80682945251465, "global_step": 464289, "epoch": 5593} {"train_loss": -27.035449981689453, "global_step": 464290, "epoch": 5593} {"train_loss": -27.28501319885254, "global_step": 464291, "epoch": 5593} {"train_loss": -26.890832901000977, "global_step": 464292, "epoch": 5593} {"train_loss": -27.107873916625977, "global_step": 464293, "epoch": 5593} {"train_loss": -27.108779907226562, "global_step": 464294, "epoch": 5593} {"train_loss": -26.842391967773438, "global_step": 464295, "epoch": 5593} {"train_loss": -27.254947662353516, "global_step": 464296, "epoch": 5593} {"train_loss": -27.14129638671875, "global_step": 464297, "epoch": 5593} {"train_loss": -27.225116729736328, "global_step": 464298, "epoch": 5593} {"train_loss": -27.3476505279541, "global_step": 464299, "epoch": 5593} {"train_loss": -27.040390014648438, "global_step": 464300, "epoch": 5593} {"train_loss": -26.975495097148848, "global_step": 464301, "epoch": 5593, "val_loss": 6505040.0} {"train_loss": -26.793689727783203, "global_step": 464302, "epoch": 5594} {"train_loss": -26.824304580688477, "global_step": 464303, "epoch": 5594} {"train_loss": -26.574268341064453, "global_step": 464304, "epoch": 5594} {"train_loss": -26.66066551208496, "global_step": 464305, "epoch": 5594} {"train_loss": -26.698862075805664, "global_step": 464306, "epoch": 5594} {"train_loss": -26.929340362548828, "global_step": 464307, "epoch": 5594} {"train_loss": -26.4083309173584, "global_step": 464308, "epoch": 5594} {"train_loss": -26.36749839782715, "global_step": 464309, "epoch": 5594} {"train_loss": -26.616186141967773, "global_step": 464310, "epoch": 5594} {"train_loss": -26.5653076171875, "global_step": 464311, "epoch": 5594} {"train_loss": -26.36920738220215, "global_step": 464312, "epoch": 5594} {"train_loss": -26.258060455322266, "global_step": 464313, "epoch": 5594} {"train_loss": -27.050403594970703, "global_step": 464314, "epoch": 5594} {"train_loss": -26.71620750427246, "global_step": 464315, "epoch": 5594} {"train_loss": -27.111957550048828, "global_step": 464316, "epoch": 5594} {"train_loss": -26.90826416015625, "global_step": 464317, "epoch": 5594} {"train_loss": -26.85609245300293, "global_step": 464318, "epoch": 5594} {"train_loss": -27.253705978393555, "global_step": 464319, "epoch": 5594} {"train_loss": -26.739599227905273, "global_step": 464320, "epoch": 5594} {"train_loss": -27.103952407836914, "global_step": 464321, "epoch": 5594} {"train_loss": -27.044843673706055, "global_step": 464322, "epoch": 5594} {"train_loss": -27.012317657470703, "global_step": 464323, "epoch": 5594} {"train_loss": -27.12281608581543, "global_step": 464324, "epoch": 5594} {"train_loss": -27.06414794921875, "global_step": 464325, "epoch": 5594} {"train_loss": -27.05750846862793, "global_step": 464326, "epoch": 5594} {"train_loss": -27.042234420776367, "global_step": 464327, "epoch": 5594} {"train_loss": -26.990476608276367, "global_step": 464328, "epoch": 5594} {"train_loss": -27.13789176940918, "global_step": 464329, "epoch": 5594} {"train_loss": -26.88178062438965, "global_step": 464330, "epoch": 5594} {"train_loss": -27.141088485717773, "global_step": 464331, "epoch": 5594} {"train_loss": -27.180877685546875, "global_step": 464332, "epoch": 5594} {"train_loss": -27.02533531188965, "global_step": 464333, "epoch": 5594} {"train_loss": -27.1917724609375, "global_step": 464334, "epoch": 5594} {"train_loss": -27.072412490844727, "global_step": 464335, "epoch": 5594} {"train_loss": -27.313220977783203, "global_step": 464336, "epoch": 5594} {"train_loss": -27.17548179626465, "global_step": 464337, "epoch": 5594} {"train_loss": -26.910192489624023, "global_step": 464338, "epoch": 5594} {"train_loss": -27.430139541625977, "global_step": 464339, "epoch": 5594} {"train_loss": -27.45892333984375, "global_step": 464340, "epoch": 5594} {"train_loss": -27.238727569580078, "global_step": 464341, "epoch": 5594} {"train_loss": -27.37123680114746, "global_step": 464342, "epoch": 5594} {"train_loss": -27.3155574798584, "global_step": 464343, "epoch": 5594} {"train_loss": -27.330799102783203, "global_step": 464344, "epoch": 5594} {"train_loss": -27.301025390625, "global_step": 464345, "epoch": 5594} {"train_loss": -27.401941299438477, "global_step": 464346, "epoch": 5594} {"train_loss": -27.353565216064453, "global_step": 464347, "epoch": 5594} {"train_loss": -27.59833335876465, "global_step": 464348, "epoch": 5594} {"train_loss": -27.159238815307617, "global_step": 464349, "epoch": 5594} {"train_loss": -27.23262596130371, "global_step": 464350, "epoch": 5594} {"train_loss": -27.14885902404785, "global_step": 464351, "epoch": 5594} {"train_loss": -27.505084991455078, "global_step": 464352, "epoch": 5594} {"train_loss": -27.727436065673828, "global_step": 464353, "epoch": 5594} {"train_loss": -27.288455963134766, "global_step": 464354, "epoch": 5594} {"train_loss": -27.645404815673828, "global_step": 464355, "epoch": 5594} {"train_loss": -27.46955680847168, "global_step": 464356, "epoch": 5594} {"train_loss": -27.404279708862305, "global_step": 464357, "epoch": 5594} {"train_loss": -27.25827407836914, "global_step": 464358, "epoch": 5594} {"train_loss": -27.23920249938965, "global_step": 464359, "epoch": 5594} {"train_loss": -27.332355499267578, "global_step": 464360, "epoch": 5594} {"train_loss": -27.158594131469727, "global_step": 464361, "epoch": 5594} {"train_loss": -27.162763595581055, "global_step": 464362, "epoch": 5594} {"train_loss": -26.22820472717285, "global_step": 464363, "epoch": 5594} {"train_loss": -25.672765731811523, "global_step": 464364, "epoch": 5594} {"train_loss": -25.99863624572754, "global_step": 464365, "epoch": 5594} {"train_loss": -26.958703994750977, "global_step": 464366, "epoch": 5594} {"train_loss": -26.503467559814453, "global_step": 464367, "epoch": 5594} {"train_loss": -26.84205436706543, "global_step": 464368, "epoch": 5594} {"train_loss": -26.535388946533203, "global_step": 464369, "epoch": 5594} {"train_loss": -26.74262809753418, "global_step": 464370, "epoch": 5594} {"train_loss": -27.068241119384766, "global_step": 464371, "epoch": 5594} {"train_loss": -26.942203521728516, "global_step": 464372, "epoch": 5594} {"train_loss": -26.936697006225586, "global_step": 464373, "epoch": 5594} {"train_loss": -26.645217895507812, "global_step": 464374, "epoch": 5594} {"train_loss": -26.76972007751465, "global_step": 464375, "epoch": 5594} {"train_loss": -27.15412712097168, "global_step": 464376, "epoch": 5594} {"train_loss": -27.044418334960938, "global_step": 464377, "epoch": 5594} {"train_loss": -26.86347007751465, "global_step": 464378, "epoch": 5594} {"train_loss": -26.801244735717773, "global_step": 464379, "epoch": 5594} {"train_loss": -26.511579513549805, "global_step": 464380, "epoch": 5594} {"train_loss": -26.75629997253418, "global_step": 464381, "epoch": 5594} {"train_loss": -26.964202880859375, "global_step": 464382, "epoch": 5594} {"train_loss": -27.034818649291992, "global_step": 464383, "epoch": 5594} {"train_loss": -26.990536724228456, "global_step": 464384, "epoch": 5594, "val_loss": 6443984.5} {"train_loss": -26.77826499938965, "global_step": 464385, "epoch": 5595} {"train_loss": -26.6325740814209, "global_step": 464386, "epoch": 5595} {"train_loss": -26.687366485595703, "global_step": 464387, "epoch": 5595} {"train_loss": -26.91180992126465, "global_step": 464388, "epoch": 5595} {"train_loss": -26.504430770874023, "global_step": 464389, "epoch": 5595} {"train_loss": -27.02388572692871, "global_step": 464390, "epoch": 5595} {"train_loss": -26.6664981842041, "global_step": 464391, "epoch": 5595} {"train_loss": -26.72539710998535, "global_step": 464392, "epoch": 5595} {"train_loss": -26.62324333190918, "global_step": 464393, "epoch": 5595} {"train_loss": -26.816516876220703, "global_step": 464394, "epoch": 5595} {"train_loss": -26.70108985900879, "global_step": 464395, "epoch": 5595} {"train_loss": -26.86616325378418, "global_step": 464396, "epoch": 5595} {"train_loss": -26.773813247680664, "global_step": 464397, "epoch": 5595} {"train_loss": -26.803632736206055, "global_step": 464398, "epoch": 5595} {"train_loss": -27.433359146118164, "global_step": 464399, "epoch": 5595} {"train_loss": -27.08888816833496, "global_step": 464400, "epoch": 5595} {"train_loss": -26.852624893188477, "global_step": 464401, "epoch": 5595} {"train_loss": -26.99993324279785, "global_step": 464402, "epoch": 5595} {"train_loss": -27.122406005859375, "global_step": 464403, "epoch": 5595} {"train_loss": -26.80832862854004, "global_step": 464404, "epoch": 5595} {"train_loss": -27.00172233581543, "global_step": 464405, "epoch": 5595} {"train_loss": -26.930973052978516, "global_step": 464406, "epoch": 5595} {"train_loss": -27.583051681518555, "global_step": 464407, "epoch": 5595} {"train_loss": -27.198593139648438, "global_step": 464408, "epoch": 5595} {"train_loss": -27.031848907470703, "global_step": 464409, "epoch": 5595} {"train_loss": -27.256317138671875, "global_step": 464410, "epoch": 5595} {"train_loss": -27.074527740478516, "global_step": 464411, "epoch": 5595} {"train_loss": -26.829792022705078, "global_step": 464412, "epoch": 5595} {"train_loss": -26.951452255249023, "global_step": 464413, "epoch": 5595} {"train_loss": -26.863798141479492, "global_step": 464414, "epoch": 5595} {"train_loss": -27.248762130737305, "global_step": 464415, "epoch": 5595} {"train_loss": -27.20924949645996, "global_step": 464416, "epoch": 5595} {"train_loss": -27.1409912109375, "global_step": 464417, "epoch": 5595} {"train_loss": -27.75382423400879, "global_step": 464418, "epoch": 5595} {"train_loss": -27.310693740844727, "global_step": 464419, "epoch": 5595} {"train_loss": -27.106672286987305, "global_step": 464420, "epoch": 5595} {"train_loss": -27.18536376953125, "global_step": 464421, "epoch": 5595} {"train_loss": -27.232263565063477, "global_step": 464422, "epoch": 5595} {"train_loss": -27.36520767211914, "global_step": 464423, "epoch": 5595} {"train_loss": -27.208871841430664, "global_step": 464424, "epoch": 5595} {"train_loss": -26.941925048828125, "global_step": 464425, "epoch": 5595} {"train_loss": -27.366138458251953, "global_step": 464426, "epoch": 5595} {"train_loss": -27.404386520385742, "global_step": 464427, "epoch": 5595} {"train_loss": -27.285429000854492, "global_step": 464428, "epoch": 5595} {"train_loss": -27.265522003173828, "global_step": 464429, "epoch": 5595} {"train_loss": -27.503009796142578, "global_step": 464430, "epoch": 5595} {"train_loss": -27.423328399658203, "global_step": 464431, "epoch": 5595} {"train_loss": -27.49281883239746, "global_step": 464432, "epoch": 5595} {"train_loss": -27.20684242248535, "global_step": 464433, "epoch": 5595} {"train_loss": -27.44422721862793, "global_step": 464434, "epoch": 5595} {"train_loss": -27.346282958984375, "global_step": 464435, "epoch": 5595} {"train_loss": -27.230676651000977, "global_step": 464436, "epoch": 5595} {"train_loss": -27.186100006103516, "global_step": 464437, "epoch": 5595} {"train_loss": -26.99371910095215, "global_step": 464438, "epoch": 5595} {"train_loss": -27.168975830078125, "global_step": 464439, "epoch": 5595} {"train_loss": -27.23274040222168, "global_step": 464440, "epoch": 5595} {"train_loss": -26.911344528198242, "global_step": 464441, "epoch": 5595} {"train_loss": -26.809961318969727, "global_step": 464442, "epoch": 5595} {"train_loss": -27.300878524780273, "global_step": 464443, "epoch": 5595} {"train_loss": -27.264728546142578, "global_step": 464444, "epoch": 5595} {"train_loss": -27.3792667388916, "global_step": 464445, "epoch": 5595} {"train_loss": -27.337060928344727, "global_step": 464446, "epoch": 5595} {"train_loss": -27.268701553344727, "global_step": 464447, "epoch": 5595} {"train_loss": -27.105499267578125, "global_step": 464448, "epoch": 5595} {"train_loss": -27.05299186706543, "global_step": 464449, "epoch": 5595} {"train_loss": -27.223901748657227, "global_step": 464450, "epoch": 5595} {"train_loss": -27.373754501342773, "global_step": 464451, "epoch": 5595} {"train_loss": -27.151906967163086, "global_step": 464452, "epoch": 5595} {"train_loss": -26.7554988861084, "global_step": 464453, "epoch": 5595} {"train_loss": -26.9789981842041, "global_step": 464454, "epoch": 5595} {"train_loss": -27.450916290283203, "global_step": 464455, "epoch": 5595} {"train_loss": -26.8331298828125, "global_step": 464456, "epoch": 5595} {"train_loss": -26.67660903930664, "global_step": 464457, "epoch": 5595} {"train_loss": -26.608417510986328, "global_step": 464458, "epoch": 5595} {"train_loss": -26.621829986572266, "global_step": 464459, "epoch": 5595} {"train_loss": -27.25385093688965, "global_step": 464460, "epoch": 5595} {"train_loss": -26.673093795776367, "global_step": 464461, "epoch": 5595} {"train_loss": -27.231220245361328, "global_step": 464462, "epoch": 5595} {"train_loss": -26.82415199279785, "global_step": 464463, "epoch": 5595} {"train_loss": -26.69032859802246, "global_step": 464464, "epoch": 5595} {"train_loss": -26.980188369750977, "global_step": 464465, "epoch": 5595} {"train_loss": -26.924291610717773, "global_step": 464466, "epoch": 5595} {"train_loss": -27.059293517147204, "global_step": 464467, "epoch": 5595, "val_loss": 6512461.0} {"train_loss": -26.138036727905273, "global_step": 464468, "epoch": 5596} {"train_loss": -26.42658042907715, "global_step": 464469, "epoch": 5596} {"train_loss": -26.784896850585938, "global_step": 464470, "epoch": 5596} {"train_loss": -26.1142635345459, "global_step": 464471, "epoch": 5596} {"train_loss": -26.92677116394043, "global_step": 464472, "epoch": 5596} {"train_loss": -26.220117568969727, "global_step": 464473, "epoch": 5596} {"train_loss": -26.791275024414062, "global_step": 464474, "epoch": 5596} {"train_loss": -26.42340087890625, "global_step": 464475, "epoch": 5596} {"train_loss": -26.57281494140625, "global_step": 464476, "epoch": 5596} {"train_loss": -26.727554321289062, "global_step": 464477, "epoch": 5596} {"train_loss": -26.69287109375, "global_step": 464478, "epoch": 5596} {"train_loss": -26.5062255859375, "global_step": 464479, "epoch": 5596} {"train_loss": -26.936552047729492, "global_step": 464480, "epoch": 5596} {"train_loss": -26.727025985717773, "global_step": 464481, "epoch": 5596} {"train_loss": -26.91033363342285, "global_step": 464482, "epoch": 5596} {"train_loss": -26.555343627929688, "global_step": 464483, "epoch": 5596} {"train_loss": -26.878934860229492, "global_step": 464484, "epoch": 5596} {"train_loss": -26.993757247924805, "global_step": 464485, "epoch": 5596} {"train_loss": -27.01413917541504, "global_step": 464486, "epoch": 5596} {"train_loss": -26.794809341430664, "global_step": 464487, "epoch": 5596} {"train_loss": -26.728933334350586, "global_step": 464488, "epoch": 5596} {"train_loss": -26.7769775390625, "global_step": 464489, "epoch": 5596} {"train_loss": -26.994855880737305, "global_step": 464490, "epoch": 5596} {"train_loss": -27.166065216064453, "global_step": 464491, "epoch": 5596} {"train_loss": -27.17567253112793, "global_step": 464492, "epoch": 5596} {"train_loss": -27.0063533782959, "global_step": 464493, "epoch": 5596} {"train_loss": -26.904321670532227, "global_step": 464494, "epoch": 5596} {"train_loss": -26.98257827758789, "global_step": 464495, "epoch": 5596} {"train_loss": -26.92769432067871, "global_step": 464496, "epoch": 5596} {"train_loss": -27.131610870361328, "global_step": 464497, "epoch": 5596} {"train_loss": -27.303237915039062, "global_step": 464498, "epoch": 5596} {"train_loss": -27.169513702392578, "global_step": 464499, "epoch": 5596} {"train_loss": -26.62042236328125, "global_step": 464500, "epoch": 5596} {"train_loss": -26.92359733581543, "global_step": 464501, "epoch": 5596} {"train_loss": -26.860198974609375, "global_step": 464502, "epoch": 5596} {"train_loss": -27.142181396484375, "global_step": 464503, "epoch": 5596} {"train_loss": -26.90311622619629, "global_step": 464504, "epoch": 5596} {"train_loss": -27.046003341674805, "global_step": 464505, "epoch": 5596} {"train_loss": -27.119892120361328, "global_step": 464506, "epoch": 5596} {"train_loss": -27.017343521118164, "global_step": 464507, "epoch": 5596} {"train_loss": -27.021596908569336, "global_step": 464508, "epoch": 5596} {"train_loss": -27.258344650268555, "global_step": 464509, "epoch": 5596} {"train_loss": -27.613300323486328, "global_step": 464510, "epoch": 5596} {"train_loss": -27.402679443359375, "global_step": 464511, "epoch": 5596} {"train_loss": -27.037839889526367, "global_step": 464512, "epoch": 5596} {"train_loss": -27.327239990234375, "global_step": 464513, "epoch": 5596} {"train_loss": -26.969968795776367, "global_step": 464514, "epoch": 5596} {"train_loss": -27.33076286315918, "global_step": 464515, "epoch": 5596} {"train_loss": -26.857995986938477, "global_step": 464516, "epoch": 5596} {"train_loss": -27.21221923828125, "global_step": 464517, "epoch": 5596} {"train_loss": -27.565759658813477, "global_step": 464518, "epoch": 5596} {"train_loss": -27.127904891967773, "global_step": 464519, "epoch": 5596} {"train_loss": -27.693220138549805, "global_step": 464520, "epoch": 5596} {"train_loss": -27.316186904907227, "global_step": 464521, "epoch": 5596} {"train_loss": -26.905181884765625, "global_step": 464522, "epoch": 5596} {"train_loss": -27.50457191467285, "global_step": 464523, "epoch": 5596} {"train_loss": -27.386611938476562, "global_step": 464524, "epoch": 5596} {"train_loss": -27.62269401550293, "global_step": 464525, "epoch": 5596} {"train_loss": -27.0546817779541, "global_step": 464526, "epoch": 5596} {"train_loss": -27.414478302001953, "global_step": 464527, "epoch": 5596} {"train_loss": -27.4886417388916, "global_step": 464528, "epoch": 5596} {"train_loss": -27.438739776611328, "global_step": 464529, "epoch": 5596} {"train_loss": -27.54741859436035, "global_step": 464530, "epoch": 5596} {"train_loss": -27.25423240661621, "global_step": 464531, "epoch": 5596} {"train_loss": -26.983423233032227, "global_step": 464532, "epoch": 5596} {"train_loss": -27.129419326782227, "global_step": 464533, "epoch": 5596} {"train_loss": -27.178693771362305, "global_step": 464534, "epoch": 5596} {"train_loss": -27.412485122680664, "global_step": 464535, "epoch": 5596} {"train_loss": -27.012418746948242, "global_step": 464536, "epoch": 5596} {"train_loss": -27.118146896362305, "global_step": 464537, "epoch": 5596} {"train_loss": -27.323749542236328, "global_step": 464538, "epoch": 5596} {"train_loss": -27.549413681030273, "global_step": 464539, "epoch": 5596} {"train_loss": -27.530420303344727, "global_step": 464540, "epoch": 5596} {"train_loss": -26.709381103515625, "global_step": 464541, "epoch": 5596} {"train_loss": -26.893386840820312, "global_step": 464542, "epoch": 5596} {"train_loss": -27.115692138671875, "global_step": 464543, "epoch": 5596} {"train_loss": -27.14459800720215, "global_step": 464544, "epoch": 5596} {"train_loss": -27.19601821899414, "global_step": 464545, "epoch": 5596} {"train_loss": -27.13857078552246, "global_step": 464546, "epoch": 5596} {"train_loss": -26.541839599609375, "global_step": 464547, "epoch": 5596} {"train_loss": -26.988849639892578, "global_step": 464548, "epoch": 5596} {"train_loss": -26.859603881835938, "global_step": 464549, "epoch": 5596} {"train_loss": -27.024189799664967, "global_step": 464550, "epoch": 5596, "val_loss": 6583038.0} {"train_loss": -26.310855865478516, "global_step": 464551, "epoch": 5597} {"train_loss": -26.193592071533203, "global_step": 464552, "epoch": 5597} {"train_loss": -26.10853385925293, "global_step": 464553, "epoch": 5597} {"train_loss": -26.336347579956055, "global_step": 464554, "epoch": 5597} {"train_loss": -26.708032608032227, "global_step": 464555, "epoch": 5597} {"train_loss": -26.537384033203125, "global_step": 464556, "epoch": 5597} {"train_loss": -26.08127212524414, "global_step": 464557, "epoch": 5597} {"train_loss": -26.28162956237793, "global_step": 464558, "epoch": 5597} {"train_loss": -26.463647842407227, "global_step": 464559, "epoch": 5597} {"train_loss": -26.3259334564209, "global_step": 464560, "epoch": 5597} {"train_loss": -26.327224731445312, "global_step": 464561, "epoch": 5597} {"train_loss": -26.565765380859375, "global_step": 464562, "epoch": 5597} {"train_loss": -26.4332275390625, "global_step": 464563, "epoch": 5597} {"train_loss": -26.622724533081055, "global_step": 464564, "epoch": 5597} {"train_loss": -26.262792587280273, "global_step": 464565, "epoch": 5597} {"train_loss": -26.306869506835938, "global_step": 464566, "epoch": 5597} {"train_loss": -26.724689483642578, "global_step": 464567, "epoch": 5597} {"train_loss": -26.715909957885742, "global_step": 464568, "epoch": 5597} {"train_loss": -26.7507381439209, "global_step": 464569, "epoch": 5597} {"train_loss": -26.57496452331543, "global_step": 464570, "epoch": 5597} {"train_loss": -26.689451217651367, "global_step": 464571, "epoch": 5597} {"train_loss": -26.473926544189453, "global_step": 464572, "epoch": 5597} {"train_loss": -26.93128776550293, "global_step": 464573, "epoch": 5597} {"train_loss": -27.14899253845215, "global_step": 464574, "epoch": 5597} {"train_loss": -27.102554321289062, "global_step": 464575, "epoch": 5597} {"train_loss": -26.82343864440918, "global_step": 464576, "epoch": 5597} {"train_loss": -26.7968807220459, "global_step": 464577, "epoch": 5597} {"train_loss": -27.18459129333496, "global_step": 464578, "epoch": 5597} {"train_loss": -26.986759185791016, "global_step": 464579, "epoch": 5597} {"train_loss": -27.152143478393555, "global_step": 464580, "epoch": 5597} {"train_loss": -27.13043212890625, "global_step": 464581, "epoch": 5597} {"train_loss": -27.119403839111328, "global_step": 464582, "epoch": 5597} {"train_loss": -26.657806396484375, "global_step": 464583, "epoch": 5597} {"train_loss": -26.96271324157715, "global_step": 464584, "epoch": 5597} {"train_loss": -27.26521110534668, "global_step": 464585, "epoch": 5597} {"train_loss": -27.31171226501465, "global_step": 464586, "epoch": 5597} {"train_loss": -26.920917510986328, "global_step": 464587, "epoch": 5597} {"train_loss": -27.0667781829834, "global_step": 464588, "epoch": 5597} {"train_loss": -27.169702529907227, "global_step": 464589, "epoch": 5597} {"train_loss": -27.144140243530273, "global_step": 464590, "epoch": 5597} {"train_loss": -27.290353775024414, "global_step": 464591, "epoch": 5597} {"train_loss": -27.021286010742188, "global_step": 464592, "epoch": 5597} {"train_loss": -27.368316650390625, "global_step": 464593, "epoch": 5597} {"train_loss": -27.25331687927246, "global_step": 464594, "epoch": 5597} {"train_loss": -27.268606185913086, "global_step": 464595, "epoch": 5597} {"train_loss": -27.287809371948242, "global_step": 464596, "epoch": 5597} {"train_loss": -27.03657341003418, "global_step": 464597, "epoch": 5597} {"train_loss": -27.2564640045166, "global_step": 464598, "epoch": 5597} {"train_loss": -27.428640365600586, "global_step": 464599, "epoch": 5597} {"train_loss": -27.03861427307129, "global_step": 464600, "epoch": 5597} {"train_loss": -27.39109230041504, "global_step": 464601, "epoch": 5597} {"train_loss": -27.57857322692871, "global_step": 464602, "epoch": 5597} {"train_loss": -27.609222412109375, "global_step": 464603, "epoch": 5597} {"train_loss": -27.561542510986328, "global_step": 464604, "epoch": 5597} {"train_loss": -27.310697555541992, "global_step": 464605, "epoch": 5597} {"train_loss": -27.420642852783203, "global_step": 464606, "epoch": 5597} {"train_loss": -27.1814022064209, "global_step": 464607, "epoch": 5597} {"train_loss": -27.060504913330078, "global_step": 464608, "epoch": 5597} {"train_loss": -27.187788009643555, "global_step": 464609, "epoch": 5597} {"train_loss": -27.5447940826416, "global_step": 464610, "epoch": 5597} {"train_loss": -27.55868911743164, "global_step": 464611, "epoch": 5597} {"train_loss": -27.355390548706055, "global_step": 464612, "epoch": 5597} {"train_loss": -26.651824951171875, "global_step": 464613, "epoch": 5597} {"train_loss": -26.32948112487793, "global_step": 464614, "epoch": 5597} {"train_loss": -26.433059692382812, "global_step": 464615, "epoch": 5597} {"train_loss": -26.71466064453125, "global_step": 464616, "epoch": 5597} {"train_loss": -27.4965763092041, "global_step": 464617, "epoch": 5597} {"train_loss": -26.90007972717285, "global_step": 464618, "epoch": 5597} {"train_loss": -27.08258628845215, "global_step": 464619, "epoch": 5597} {"train_loss": -26.416854858398438, "global_step": 464620, "epoch": 5597} {"train_loss": -27.030899047851562, "global_step": 464621, "epoch": 5597} {"train_loss": -27.013050079345703, "global_step": 464622, "epoch": 5597} {"train_loss": -26.76740837097168, "global_step": 464623, "epoch": 5597} {"train_loss": -26.903675079345703, "global_step": 464624, "epoch": 5597} {"train_loss": -26.78765296936035, "global_step": 464625, "epoch": 5597} {"train_loss": -26.853382110595703, "global_step": 464626, "epoch": 5597} {"train_loss": -26.679792404174805, "global_step": 464627, "epoch": 5597} {"train_loss": -26.73162841796875, "global_step": 464628, "epoch": 5597} {"train_loss": -26.49098777770996, "global_step": 464629, "epoch": 5597} {"train_loss": -26.691303253173828, "global_step": 464630, "epoch": 5597} {"train_loss": -26.553787231445312, "global_step": 464631, "epoch": 5597} {"train_loss": -26.621673583984375, "global_step": 464632, "epoch": 5597} {"train_loss": -26.898177227341986, "global_step": 464633, "epoch": 5597, "val_loss": 6653246.0} {"train_loss": -26.8989200592041, "global_step": 464634, "epoch": 5598} {"train_loss": -26.68953514099121, "global_step": 464635, "epoch": 5598} {"train_loss": -26.851398468017578, "global_step": 464636, "epoch": 5598} {"train_loss": -26.374908447265625, "global_step": 464637, "epoch": 5598} {"train_loss": -26.767484664916992, "global_step": 464638, "epoch": 5598} {"train_loss": -26.52849769592285, "global_step": 464639, "epoch": 5598} {"train_loss": -26.621356964111328, "global_step": 464640, "epoch": 5598} {"train_loss": -26.89143943786621, "global_step": 464641, "epoch": 5598} {"train_loss": -26.792301177978516, "global_step": 464642, "epoch": 5598} {"train_loss": -26.904438018798828, "global_step": 464643, "epoch": 5598} {"train_loss": -27.0102481842041, "global_step": 464644, "epoch": 5598} {"train_loss": -26.686094284057617, "global_step": 464645, "epoch": 5598} {"train_loss": -27.210763931274414, "global_step": 464646, "epoch": 5598} {"train_loss": -26.854907989501953, "global_step": 464647, "epoch": 5598} {"train_loss": -26.786535263061523, "global_step": 464648, "epoch": 5598} {"train_loss": -26.580108642578125, "global_step": 464649, "epoch": 5598} {"train_loss": -26.63748550415039, "global_step": 464650, "epoch": 5598} {"train_loss": -26.688833236694336, "global_step": 464651, "epoch": 5598} {"train_loss": -27.13397216796875, "global_step": 464652, "epoch": 5598} {"train_loss": -26.954557418823242, "global_step": 464653, "epoch": 5598} {"train_loss": -26.764179229736328, "global_step": 464654, "epoch": 5598} {"train_loss": -26.95783042907715, "global_step": 464655, "epoch": 5598} {"train_loss": -27.257238388061523, "global_step": 464656, "epoch": 5598} {"train_loss": -27.16070556640625, "global_step": 464657, "epoch": 5598} {"train_loss": -27.1012020111084, "global_step": 464658, "epoch": 5598} {"train_loss": -27.00261878967285, "global_step": 464659, "epoch": 5598} {"train_loss": -27.313180923461914, "global_step": 464660, "epoch": 5598} {"train_loss": -27.106006622314453, "global_step": 464661, "epoch": 5598} {"train_loss": -27.293054580688477, "global_step": 464662, "epoch": 5598} {"train_loss": -27.0591983795166, "global_step": 464663, "epoch": 5598} {"train_loss": -26.96980094909668, "global_step": 464664, "epoch": 5598} {"train_loss": -27.065078735351562, "global_step": 464665, "epoch": 5598} {"train_loss": -27.53496742248535, "global_step": 464666, "epoch": 5598} {"train_loss": -27.13079833984375, "global_step": 464667, "epoch": 5598} {"train_loss": -26.96933364868164, "global_step": 464668, "epoch": 5598} {"train_loss": -27.248205184936523, "global_step": 464669, "epoch": 5598} {"train_loss": -27.29119873046875, "global_step": 464670, "epoch": 5598} {"train_loss": -27.58688735961914, "global_step": 464671, "epoch": 5598} {"train_loss": -27.04001235961914, "global_step": 464672, "epoch": 5598} {"train_loss": -27.4799747467041, "global_step": 464673, "epoch": 5598} {"train_loss": -27.379133224487305, "global_step": 464674, "epoch": 5598} {"train_loss": -26.99268913269043, "global_step": 464675, "epoch": 5598} {"train_loss": -27.093881607055664, "global_step": 464676, "epoch": 5598} {"train_loss": -27.606719970703125, "global_step": 464677, "epoch": 5598} {"train_loss": -27.11100196838379, "global_step": 464678, "epoch": 5598} {"train_loss": -27.307126998901367, "global_step": 464679, "epoch": 5598} {"train_loss": -27.785017013549805, "global_step": 464680, "epoch": 5598} {"train_loss": -27.316791534423828, "global_step": 464681, "epoch": 5598} {"train_loss": -27.055967330932617, "global_step": 464682, "epoch": 5598} {"train_loss": -26.970722198486328, "global_step": 464683, "epoch": 5598} {"train_loss": -27.176244735717773, "global_step": 464684, "epoch": 5598} {"train_loss": -27.056640625, "global_step": 464685, "epoch": 5598} {"train_loss": -27.340106964111328, "global_step": 464686, "epoch": 5598} {"train_loss": -27.158863067626953, "global_step": 464687, "epoch": 5598} {"train_loss": -27.436614990234375, "global_step": 464688, "epoch": 5598} {"train_loss": -27.518798828125, "global_step": 464689, "epoch": 5598} {"train_loss": -26.99734878540039, "global_step": 464690, "epoch": 5598} {"train_loss": -27.132421493530273, "global_step": 464691, "epoch": 5598} {"train_loss": -27.137842178344727, "global_step": 464692, "epoch": 5598} {"train_loss": -27.123859405517578, "global_step": 464693, "epoch": 5598} {"train_loss": -27.213459014892578, "global_step": 464694, "epoch": 5598} {"train_loss": -27.38300895690918, "global_step": 464695, "epoch": 5598} {"train_loss": -26.9884033203125, "global_step": 464696, "epoch": 5598} {"train_loss": -27.250158309936523, "global_step": 464697, "epoch": 5598} {"train_loss": -27.33262062072754, "global_step": 464698, "epoch": 5598} {"train_loss": -27.327411651611328, "global_step": 464699, "epoch": 5598} {"train_loss": -27.298797607421875, "global_step": 464700, "epoch": 5598} {"train_loss": -27.227575302124023, "global_step": 464701, "epoch": 5598} {"train_loss": -27.511077880859375, "global_step": 464702, "epoch": 5598} {"train_loss": -27.24683952331543, "global_step": 464703, "epoch": 5598} {"train_loss": -27.729557037353516, "global_step": 464704, "epoch": 5598} {"train_loss": -27.6899356842041, "global_step": 464705, "epoch": 5598} {"train_loss": -27.80426025390625, "global_step": 464706, "epoch": 5598} {"train_loss": -27.440534591674805, "global_step": 464707, "epoch": 5598} {"train_loss": -27.230060577392578, "global_step": 464708, "epoch": 5598} {"train_loss": -27.143207550048828, "global_step": 464709, "epoch": 5598} {"train_loss": -27.02836036682129, "global_step": 464710, "epoch": 5598} {"train_loss": -27.071563720703125, "global_step": 464711, "epoch": 5598} {"train_loss": -26.651288986206055, "global_step": 464712, "epoch": 5598} {"train_loss": -25.85725212097168, "global_step": 464713, "epoch": 5598} {"train_loss": -26.701467514038086, "global_step": 464714, "epoch": 5598} {"train_loss": -26.3855037689209, "global_step": 464715, "epoch": 5598} {"train_loss": -27.069218486188404, "global_step": 464716, "epoch": 5598, "val_loss": 6594371.0} {"train_loss": -21.807382583618164, "global_step": 464717, "epoch": 5599} {"train_loss": -23.078073501586914, "global_step": 464718, "epoch": 5599} {"train_loss": -25.32867431640625, "global_step": 464719, "epoch": 5599} {"train_loss": -24.412166595458984, "global_step": 464720, "epoch": 5599} {"train_loss": -24.8045711517334, "global_step": 464721, "epoch": 5599} {"train_loss": -24.966073989868164, "global_step": 464722, "epoch": 5599} {"train_loss": -24.990095138549805, "global_step": 464723, "epoch": 5599} {"train_loss": -25.85548210144043, "global_step": 464724, "epoch": 5599} {"train_loss": -26.337055206298828, "global_step": 464725, "epoch": 5599} {"train_loss": -25.62978172302246, "global_step": 464726, "epoch": 5599} {"train_loss": -25.564077377319336, "global_step": 464727, "epoch": 5599} {"train_loss": -26.245834350585938, "global_step": 464728, "epoch": 5599} {"train_loss": -25.537931442260742, "global_step": 464729, "epoch": 5599} {"train_loss": -25.891706466674805, "global_step": 464730, "epoch": 5599} {"train_loss": -25.83783531188965, "global_step": 464731, "epoch": 5599} {"train_loss": -26.008092880249023, "global_step": 464732, "epoch": 5599} {"train_loss": -26.075153350830078, "global_step": 464733, "epoch": 5599} {"train_loss": -26.12813377380371, "global_step": 464734, "epoch": 5599} {"train_loss": -26.38563346862793, "global_step": 464735, "epoch": 5599} {"train_loss": -25.65888023376465, "global_step": 464736, "epoch": 5599} {"train_loss": -26.473264694213867, "global_step": 464737, "epoch": 5599} {"train_loss": -26.544677734375, "global_step": 464738, "epoch": 5599} {"train_loss": -26.366331100463867, "global_step": 464739, "epoch": 5599} {"train_loss": -26.666677474975586, "global_step": 464740, "epoch": 5599} {"train_loss": -26.511016845703125, "global_step": 464741, "epoch": 5599} {"train_loss": -25.98640251159668, "global_step": 464742, "epoch": 5599} {"train_loss": -26.457996368408203, "global_step": 464743, "epoch": 5599} {"train_loss": -26.301746368408203, "global_step": 464744, "epoch": 5599} {"train_loss": -26.2901611328125, "global_step": 464745, "epoch": 5599} {"train_loss": -26.525619506835938, "global_step": 464746, "epoch": 5599} {"train_loss": -26.47784423828125, "global_step": 464747, "epoch": 5599} {"train_loss": -26.713109970092773, "global_step": 464748, "epoch": 5599} {"train_loss": -26.43794059753418, "global_step": 464749, "epoch": 5599} {"train_loss": -26.6827335357666, "global_step": 464750, "epoch": 5599} {"train_loss": -26.461822509765625, "global_step": 464751, "epoch": 5599} {"train_loss": -26.558027267456055, "global_step": 464752, "epoch": 5599} {"train_loss": -26.438512802124023, "global_step": 464753, "epoch": 5599} {"train_loss": -26.670583724975586, "global_step": 464754, "epoch": 5599} {"train_loss": -27.0051326751709, "global_step": 464755, "epoch": 5599} {"train_loss": -27.19412612915039, "global_step": 464756, "epoch": 5599} {"train_loss": -26.851598739624023, "global_step": 464757, "epoch": 5599} {"train_loss": -26.97024917602539, "global_step": 464758, "epoch": 5599} {"train_loss": -26.9371337890625, "global_step": 464759, "epoch": 5599} {"train_loss": -26.7762393951416, "global_step": 464760, "epoch": 5599} {"train_loss": -27.037887573242188, "global_step": 464761, "epoch": 5599} {"train_loss": -26.934497833251953, "global_step": 464762, "epoch": 5599} {"train_loss": -26.65650749206543, "global_step": 464763, "epoch": 5599} {"train_loss": -26.98416519165039, "global_step": 464764, "epoch": 5599} {"train_loss": -26.682697296142578, "global_step": 464765, "epoch": 5599} {"train_loss": -26.884464263916016, "global_step": 464766, "epoch": 5599} {"train_loss": -27.030405044555664, "global_step": 464767, "epoch": 5599} {"train_loss": -26.923368453979492, "global_step": 464768, "epoch": 5599} {"train_loss": -27.115619659423828, "global_step": 464769, "epoch": 5599} {"train_loss": -26.816694259643555, "global_step": 464770, "epoch": 5599} {"train_loss": -26.95516014099121, "global_step": 464771, "epoch": 5599} {"train_loss": -27.39417839050293, "global_step": 464772, "epoch": 5599} {"train_loss": -27.198705673217773, "global_step": 464773, "epoch": 5599} {"train_loss": -26.916173934936523, "global_step": 464774, "epoch": 5599} {"train_loss": -26.832483291625977, "global_step": 464775, "epoch": 5599} {"train_loss": -26.833642959594727, "global_step": 464776, "epoch": 5599} {"train_loss": -27.045562744140625, "global_step": 464777, "epoch": 5599} {"train_loss": -27.133777618408203, "global_step": 464778, "epoch": 5599} {"train_loss": -26.88567543029785, "global_step": 464779, "epoch": 5599} {"train_loss": -27.170454025268555, "global_step": 464780, "epoch": 5599} {"train_loss": -26.894107818603516, "global_step": 464781, "epoch": 5599} {"train_loss": -27.427000045776367, "global_step": 464782, "epoch": 5599} {"train_loss": -26.591032028198242, "global_step": 464783, "epoch": 5599} {"train_loss": -26.21449851989746, "global_step": 464784, "epoch": 5599} {"train_loss": -26.54705238342285, "global_step": 464785, "epoch": 5599} {"train_loss": -26.724218368530273, "global_step": 464786, "epoch": 5599} {"train_loss": -26.86456871032715, "global_step": 464787, "epoch": 5599} {"train_loss": -26.452604293823242, "global_step": 464788, "epoch": 5599} {"train_loss": -26.639875411987305, "global_step": 464789, "epoch": 5599} {"train_loss": -27.057138442993164, "global_step": 464790, "epoch": 5599} {"train_loss": -27.094053268432617, "global_step": 464791, "epoch": 5599} {"train_loss": -27.084217071533203, "global_step": 464792, "epoch": 5599} {"train_loss": -26.72657585144043, "global_step": 464793, "epoch": 5599} {"train_loss": -27.28944206237793, "global_step": 464794, "epoch": 5599} {"train_loss": -26.688705444335938, "global_step": 464795, "epoch": 5599} {"train_loss": -27.14398193359375, "global_step": 464796, "epoch": 5599} {"train_loss": -26.94793128967285, "global_step": 464797, "epoch": 5599} {"train_loss": -27.10248374938965, "global_step": 464798, "epoch": 5599} {"train_loss": -26.44771557543651, "global_step": 464799, "epoch": 5599, "val_loss": 6700179.0} {"train_loss": -26.1726016998291, "global_step": 464800, "epoch": 5600} {"train_loss": -26.766803741455078, "global_step": 464801, "epoch": 5600} {"train_loss": -26.967987060546875, "global_step": 464802, "epoch": 5600} {"train_loss": -26.5659122467041, "global_step": 464803, "epoch": 5600} {"train_loss": -26.63815689086914, "global_step": 464804, "epoch": 5600} {"train_loss": -26.637006759643555, "global_step": 464805, "epoch": 5600} {"train_loss": -26.881738662719727, "global_step": 464806, "epoch": 5600} {"train_loss": -26.907865524291992, "global_step": 464807, "epoch": 5600} {"train_loss": -26.664270401000977, "global_step": 464808, "epoch": 5600} {"train_loss": -26.614704132080078, "global_step": 464809, "epoch": 5600} {"train_loss": -26.84344482421875, "global_step": 464810, "epoch": 5600} {"train_loss": -26.980976104736328, "global_step": 464811, "epoch": 5600} {"train_loss": -26.852603912353516, "global_step": 464812, "epoch": 5600} {"train_loss": -27.054059982299805, "global_step": 464813, "epoch": 5600} {"train_loss": -26.9365234375, "global_step": 464814, "epoch": 5600} {"train_loss": -26.920698165893555, "global_step": 464815, "epoch": 5600} {"train_loss": -26.946063995361328, "global_step": 464816, "epoch": 5600} {"train_loss": -26.8642635345459, "global_step": 464817, "epoch": 5600} {"train_loss": -27.10821533203125, "global_step": 464818, "epoch": 5600} {"train_loss": -26.94422721862793, "global_step": 464819, "epoch": 5600} {"train_loss": -26.729904174804688, "global_step": 464820, "epoch": 5600} {"train_loss": -26.959497451782227, "global_step": 464821, "epoch": 5600} {"train_loss": -27.34126091003418, "global_step": 464822, "epoch": 5600} {"train_loss": -26.840307235717773, "global_step": 464823, "epoch": 5600} {"train_loss": -27.217620849609375, "global_step": 464824, "epoch": 5600} {"train_loss": -27.380420684814453, "global_step": 464825, "epoch": 5600} {"train_loss": -26.66546630859375, "global_step": 464826, "epoch": 5600} {"train_loss": -27.185409545898438, "global_step": 464827, "epoch": 5600} {"train_loss": -27.17963218688965, "global_step": 464828, "epoch": 5600} {"train_loss": -27.00510025024414, "global_step": 464829, "epoch": 5600} {"train_loss": -27.4242000579834, "global_step": 464830, "epoch": 5600} {"train_loss": -27.383453369140625, "global_step": 464831, "epoch": 5600} {"train_loss": -27.27027702331543, "global_step": 464832, "epoch": 5600} {"train_loss": -27.241491317749023, "global_step": 464833, "epoch": 5600} {"train_loss": -27.329504013061523, "global_step": 464834, "epoch": 5600} {"train_loss": -27.400909423828125, "global_step": 464835, "epoch": 5600} {"train_loss": -27.35297966003418, "global_step": 464836, "epoch": 5600} {"train_loss": -27.14371109008789, "global_step": 464837, "epoch": 5600} {"train_loss": -27.304025650024414, "global_step": 464838, "epoch": 5600} {"train_loss": -27.110143661499023, "global_step": 464839, "epoch": 5600} {"train_loss": -27.25360107421875, "global_step": 464840, "epoch": 5600} {"train_loss": -27.040420532226562, "global_step": 464841, "epoch": 5600} {"train_loss": -27.25543785095215, "global_step": 464842, "epoch": 5600} {"train_loss": -27.219144821166992, "global_step": 464843, "epoch": 5600} {"train_loss": -27.19892692565918, "global_step": 464844, "epoch": 5600} {"train_loss": -27.75929832458496, "global_step": 464845, "epoch": 5600} {"train_loss": -27.260425567626953, "global_step": 464846, "epoch": 5600} {"train_loss": -27.3734188079834, "global_step": 464847, "epoch": 5600} {"train_loss": -27.071279525756836, "global_step": 464848, "epoch": 5600} {"train_loss": -27.12896156311035, "global_step": 464849, "epoch": 5600} {"train_loss": -27.010272979736328, "global_step": 464850, "epoch": 5600} {"train_loss": -27.410974502563477, "global_step": 464851, "epoch": 5600} {"train_loss": -27.0967960357666, "global_step": 464852, "epoch": 5600} {"train_loss": -27.185129165649414, "global_step": 464853, "epoch": 5600} {"train_loss": -26.80295181274414, "global_step": 464854, "epoch": 5600} {"train_loss": -27.04522705078125, "global_step": 464855, "epoch": 5600} {"train_loss": -27.38519859313965, "global_step": 464856, "epoch": 5600} {"train_loss": -27.334918975830078, "global_step": 464857, "epoch": 5600} {"train_loss": -27.205785751342773, "global_step": 464858, "epoch": 5600} {"train_loss": -27.378889083862305, "global_step": 464859, "epoch": 5600} {"train_loss": -27.057880401611328, "global_step": 464860, "epoch": 5600} {"train_loss": -27.462682723999023, "global_step": 464861, "epoch": 5600} {"train_loss": -26.921955108642578, "global_step": 464862, "epoch": 5600} {"train_loss": -27.374042510986328, "global_step": 464863, "epoch": 5600} {"train_loss": -27.095417022705078, "global_step": 464864, "epoch": 5600} {"train_loss": -27.14535903930664, "global_step": 464865, "epoch": 5600} {"train_loss": -27.244794845581055, "global_step": 464866, "epoch": 5600} {"train_loss": -27.013334274291992, "global_step": 464867, "epoch": 5600} {"train_loss": -27.615339279174805, "global_step": 464868, "epoch": 5600} {"train_loss": -27.199594497680664, "global_step": 464869, "epoch": 5600} {"train_loss": -26.881805419921875, "global_step": 464870, "epoch": 5600} {"train_loss": -27.290576934814453, "global_step": 464871, "epoch": 5600} {"train_loss": -26.9578857421875, "global_step": 464872, "epoch": 5600} {"train_loss": -27.519506454467773, "global_step": 464873, "epoch": 5600} {"train_loss": -26.922277450561523, "global_step": 464874, "epoch": 5600} {"train_loss": -27.5445499420166, "global_step": 464875, "epoch": 5600} {"train_loss": -26.790563583374023, "global_step": 464876, "epoch": 5600} {"train_loss": -27.154590606689453, "global_step": 464877, "epoch": 5600} {"train_loss": -26.781707763671875, "global_step": 464878, "epoch": 5600} {"train_loss": -27.283527374267578, "global_step": 464879, "epoch": 5600} {"train_loss": -26.86199378967285, "global_step": 464880, "epoch": 5600} {"train_loss": -27.20133399963379, "global_step": 464881, "epoch": 5600} {"train_loss": -27.10071867058076, "global_step": 464882, "epoch": 5600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6532077.0} {"train_loss": -26.354658126831055, "global_step": 464883, "epoch": 5601} {"train_loss": -26.40220069885254, "global_step": 464884, "epoch": 5601} {"train_loss": -25.90923500061035, "global_step": 464885, "epoch": 5601} {"train_loss": -26.473730087280273, "global_step": 464886, "epoch": 5601} {"train_loss": -26.622909545898438, "global_step": 464887, "epoch": 5601} {"train_loss": -27.179431915283203, "global_step": 464888, "epoch": 5601} {"train_loss": -26.67817497253418, "global_step": 464889, "epoch": 5601} {"train_loss": -26.991270065307617, "global_step": 464890, "epoch": 5601} {"train_loss": -27.00296401977539, "global_step": 464891, "epoch": 5601} {"train_loss": -26.71856117248535, "global_step": 464892, "epoch": 5601} {"train_loss": -27.123510360717773, "global_step": 464893, "epoch": 5601} {"train_loss": -26.824554443359375, "global_step": 464894, "epoch": 5601} {"train_loss": -26.933332443237305, "global_step": 464895, "epoch": 5601} {"train_loss": -26.70943260192871, "global_step": 464896, "epoch": 5601} {"train_loss": -26.923898696899414, "global_step": 464897, "epoch": 5601} {"train_loss": -27.01191520690918, "global_step": 464898, "epoch": 5601} {"train_loss": -27.02670669555664, "global_step": 464899, "epoch": 5601} {"train_loss": -26.691970825195312, "global_step": 464900, "epoch": 5601} {"train_loss": -27.20823097229004, "global_step": 464901, "epoch": 5601} {"train_loss": -26.927316665649414, "global_step": 464902, "epoch": 5601} {"train_loss": -27.65033531188965, "global_step": 464903, "epoch": 5601} {"train_loss": -27.175390243530273, "global_step": 464904, "epoch": 5601} {"train_loss": -26.864416122436523, "global_step": 464905, "epoch": 5601} {"train_loss": -27.005756378173828, "global_step": 464906, "epoch": 5601} {"train_loss": -27.068540573120117, "global_step": 464907, "epoch": 5601} {"train_loss": -26.860721588134766, "global_step": 464908, "epoch": 5601} {"train_loss": -26.928634643554688, "global_step": 464909, "epoch": 5601} {"train_loss": -26.997695922851562, "global_step": 464910, "epoch": 5601} {"train_loss": -27.198963165283203, "global_step": 464911, "epoch": 5601} {"train_loss": -27.117502212524414, "global_step": 464912, "epoch": 5601} {"train_loss": -27.253332138061523, "global_step": 464913, "epoch": 5601} {"train_loss": -27.119359970092773, "global_step": 464914, "epoch": 5601} {"train_loss": -27.19508171081543, "global_step": 464915, "epoch": 5601} {"train_loss": -27.28334617614746, "global_step": 464916, "epoch": 5601} {"train_loss": -27.244115829467773, "global_step": 464917, "epoch": 5601} {"train_loss": -27.46695327758789, "global_step": 464918, "epoch": 5601} {"train_loss": -27.5794620513916, "global_step": 464919, "epoch": 5601} {"train_loss": -26.995691299438477, "global_step": 464920, "epoch": 5601} {"train_loss": -27.084692001342773, "global_step": 464921, "epoch": 5601} {"train_loss": -27.474267959594727, "global_step": 464922, "epoch": 5601} {"train_loss": -27.50990104675293, "global_step": 464923, "epoch": 5601} {"train_loss": -27.261152267456055, "global_step": 464924, "epoch": 5601} {"train_loss": -27.526782989501953, "global_step": 464925, "epoch": 5601} {"train_loss": -27.319229125976562, "global_step": 464926, "epoch": 5601} {"train_loss": -27.28822135925293, "global_step": 464927, "epoch": 5601} {"train_loss": -27.216720581054688, "global_step": 464928, "epoch": 5601} {"train_loss": -27.31943702697754, "global_step": 464929, "epoch": 5601} {"train_loss": -27.074079513549805, "global_step": 464930, "epoch": 5601} {"train_loss": -27.131607055664062, "global_step": 464931, "epoch": 5601} {"train_loss": -27.3282470703125, "global_step": 464932, "epoch": 5601} {"train_loss": -27.561243057250977, "global_step": 464933, "epoch": 5601} {"train_loss": -27.563434600830078, "global_step": 464934, "epoch": 5601} {"train_loss": -27.225976943969727, "global_step": 464935, "epoch": 5601} {"train_loss": -27.26716423034668, "global_step": 464936, "epoch": 5601} {"train_loss": -27.0468807220459, "global_step": 464937, "epoch": 5601} {"train_loss": -27.193313598632812, "global_step": 464938, "epoch": 5601} {"train_loss": -27.36237144470215, "global_step": 464939, "epoch": 5601} {"train_loss": -27.419687271118164, "global_step": 464940, "epoch": 5601} {"train_loss": -27.27237319946289, "global_step": 464941, "epoch": 5601} {"train_loss": -27.629831314086914, "global_step": 464942, "epoch": 5601} {"train_loss": -27.41241455078125, "global_step": 464943, "epoch": 5601} {"train_loss": -27.555097579956055, "global_step": 464944, "epoch": 5601} {"train_loss": -27.526981353759766, "global_step": 464945, "epoch": 5601} {"train_loss": -27.18842887878418, "global_step": 464946, "epoch": 5601} {"train_loss": -27.22648048400879, "global_step": 464947, "epoch": 5601} {"train_loss": -27.29770851135254, "global_step": 464948, "epoch": 5601} {"train_loss": -27.2464599609375, "global_step": 464949, "epoch": 5601} {"train_loss": -27.030792236328125, "global_step": 464950, "epoch": 5601} {"train_loss": -27.240270614624023, "global_step": 464951, "epoch": 5601} {"train_loss": -27.22596549987793, "global_step": 464952, "epoch": 5601} {"train_loss": -27.100690841674805, "global_step": 464953, "epoch": 5601} {"train_loss": -27.3804874420166, "global_step": 464954, "epoch": 5601} {"train_loss": -27.295429229736328, "global_step": 464955, "epoch": 5601} {"train_loss": -27.37897300720215, "global_step": 464956, "epoch": 5601} {"train_loss": -27.37823486328125, "global_step": 464957, "epoch": 5601} {"train_loss": -27.431318283081055, "global_step": 464958, "epoch": 5601} {"train_loss": -27.0280704498291, "global_step": 464959, "epoch": 5601} {"train_loss": -27.302316665649414, "global_step": 464960, "epoch": 5601} {"train_loss": -27.00994873046875, "global_step": 464961, "epoch": 5601} {"train_loss": -27.446836471557617, "global_step": 464962, "epoch": 5601} {"train_loss": -27.2418155670166, "global_step": 464963, "epoch": 5601} {"train_loss": -27.069843292236328, "global_step": 464964, "epoch": 5601} {"train_loss": -27.150668868099352, "global_step": 464965, "epoch": 5601, "val_loss": 6632967.0} {"train_loss": -25.329452514648438, "global_step": 464966, "epoch": 5602} {"train_loss": -24.739208221435547, "global_step": 464967, "epoch": 5602} {"train_loss": -26.164228439331055, "global_step": 464968, "epoch": 5602} {"train_loss": -25.5086669921875, "global_step": 464969, "epoch": 5602} {"train_loss": -25.759540557861328, "global_step": 464970, "epoch": 5602} {"train_loss": -26.10918617248535, "global_step": 464971, "epoch": 5602} {"train_loss": -26.040063858032227, "global_step": 464972, "epoch": 5602} {"train_loss": -26.289350509643555, "global_step": 464973, "epoch": 5602} {"train_loss": -25.790042877197266, "global_step": 464974, "epoch": 5602} {"train_loss": -26.663944244384766, "global_step": 464975, "epoch": 5602} {"train_loss": -26.02727699279785, "global_step": 464976, "epoch": 5602} {"train_loss": -26.41997718811035, "global_step": 464977, "epoch": 5602} {"train_loss": -26.328245162963867, "global_step": 464978, "epoch": 5602} {"train_loss": -26.29119300842285, "global_step": 464979, "epoch": 5602} {"train_loss": -26.361957550048828, "global_step": 464980, "epoch": 5602} {"train_loss": -26.563644409179688, "global_step": 464981, "epoch": 5602} {"train_loss": -26.527481079101562, "global_step": 464982, "epoch": 5602} {"train_loss": -26.643299102783203, "global_step": 464983, "epoch": 5602} {"train_loss": -26.60943031311035, "global_step": 464984, "epoch": 5602} {"train_loss": -26.651554107666016, "global_step": 464985, "epoch": 5602} {"train_loss": -26.496103286743164, "global_step": 464986, "epoch": 5602} {"train_loss": -26.75705337524414, "global_step": 464987, "epoch": 5602} {"train_loss": -26.92596435546875, "global_step": 464988, "epoch": 5602} {"train_loss": -26.52796745300293, "global_step": 464989, "epoch": 5602} {"train_loss": -26.806243896484375, "global_step": 464990, "epoch": 5602} {"train_loss": -27.15708351135254, "global_step": 464991, "epoch": 5602} {"train_loss": -27.12615966796875, "global_step": 464992, "epoch": 5602} {"train_loss": -26.555688858032227, "global_step": 464993, "epoch": 5602} {"train_loss": -26.582265853881836, "global_step": 464994, "epoch": 5602} {"train_loss": -26.694156646728516, "global_step": 464995, "epoch": 5602} {"train_loss": -26.825687408447266, "global_step": 464996, "epoch": 5602} {"train_loss": -27.078815460205078, "global_step": 464997, "epoch": 5602} {"train_loss": -27.431934356689453, "global_step": 464998, "epoch": 5602} {"train_loss": -27.17510414123535, "global_step": 464999, "epoch": 5602} {"train_loss": -27.193622589111328, "global_step": 465000, "epoch": 5602} {"train_loss": -27.059980392456055, "global_step": 465001, "epoch": 5602} {"train_loss": -27.17549705505371, "global_step": 465002, "epoch": 5602} {"train_loss": -27.25127601623535, "global_step": 465003, "epoch": 5602} {"train_loss": -27.118696212768555, "global_step": 465004, "epoch": 5602} {"train_loss": -27.301349639892578, "global_step": 465005, "epoch": 5602} {"train_loss": -27.2039737701416, "global_step": 465006, "epoch": 5602} {"train_loss": -27.228296279907227, "global_step": 465007, "epoch": 5602} {"train_loss": -27.299055099487305, "global_step": 465008, "epoch": 5602} {"train_loss": -27.315093994140625, "global_step": 465009, "epoch": 5602} {"train_loss": -27.238508224487305, "global_step": 465010, "epoch": 5602} {"train_loss": -27.38362693786621, "global_step": 465011, "epoch": 5602} {"train_loss": -27.518911361694336, "global_step": 465012, "epoch": 5602} {"train_loss": -27.46748924255371, "global_step": 465013, "epoch": 5602} {"train_loss": -27.050134658813477, "global_step": 465014, "epoch": 5602} {"train_loss": -27.091449737548828, "global_step": 465015, "epoch": 5602} {"train_loss": -27.317325592041016, "global_step": 465016, "epoch": 5602} {"train_loss": -27.137548446655273, "global_step": 465017, "epoch": 5602} {"train_loss": -27.23798179626465, "global_step": 465018, "epoch": 5602} {"train_loss": -27.019550323486328, "global_step": 465019, "epoch": 5602} {"train_loss": -27.160207748413086, "global_step": 465020, "epoch": 5602} {"train_loss": -27.192514419555664, "global_step": 465021, "epoch": 5602} {"train_loss": -27.061893463134766, "global_step": 465022, "epoch": 5602} {"train_loss": -27.088211059570312, "global_step": 465023, "epoch": 5602} {"train_loss": -27.43630027770996, "global_step": 465024, "epoch": 5602} {"train_loss": -27.23428726196289, "global_step": 465025, "epoch": 5602} {"train_loss": -27.348764419555664, "global_step": 465026, "epoch": 5602} {"train_loss": -27.524322509765625, "global_step": 465027, "epoch": 5602} {"train_loss": -27.43625259399414, "global_step": 465028, "epoch": 5602} {"train_loss": -27.59279441833496, "global_step": 465029, "epoch": 5602} {"train_loss": -26.87373924255371, "global_step": 465030, "epoch": 5602} {"train_loss": -27.074392318725586, "global_step": 465031, "epoch": 5602} {"train_loss": -27.2330265045166, "global_step": 465032, "epoch": 5602} {"train_loss": -27.27655029296875, "global_step": 465033, "epoch": 5602} {"train_loss": -27.256011962890625, "global_step": 465034, "epoch": 5602} {"train_loss": -27.2811279296875, "global_step": 465035, "epoch": 5602} {"train_loss": -27.067047119140625, "global_step": 465036, "epoch": 5602} {"train_loss": -27.1568546295166, "global_step": 465037, "epoch": 5602} {"train_loss": -27.326623916625977, "global_step": 465038, "epoch": 5602} {"train_loss": -26.79571533203125, "global_step": 465039, "epoch": 5602} {"train_loss": -26.73710060119629, "global_step": 465040, "epoch": 5602} {"train_loss": -27.178180694580078, "global_step": 465041, "epoch": 5602} {"train_loss": -27.293792724609375, "global_step": 465042, "epoch": 5602} {"train_loss": -27.500080108642578, "global_step": 465043, "epoch": 5602} {"train_loss": -27.251264572143555, "global_step": 465044, "epoch": 5602} {"train_loss": -27.089872360229492, "global_step": 465045, "epoch": 5602} {"train_loss": -27.137542724609375, "global_step": 465046, "epoch": 5602} {"train_loss": -27.3915958404541, "global_step": 465047, "epoch": 5602} {"train_loss": -26.909205723957843, "global_step": 465048, "epoch": 5602, "val_loss": 6630998.0} {"train_loss": -27.221399307250977, "global_step": 465049, "epoch": 5603} {"train_loss": -26.7957706451416, "global_step": 465050, "epoch": 5603} {"train_loss": -26.989160537719727, "global_step": 465051, "epoch": 5603} {"train_loss": -26.762100219726562, "global_step": 465052, "epoch": 5603} {"train_loss": -27.13605308532715, "global_step": 465053, "epoch": 5603} {"train_loss": -26.80755043029785, "global_step": 465054, "epoch": 5603} {"train_loss": -26.517908096313477, "global_step": 465055, "epoch": 5603} {"train_loss": -26.09065055847168, "global_step": 465056, "epoch": 5603} {"train_loss": -26.66042137145996, "global_step": 465057, "epoch": 5603} {"train_loss": -26.916305541992188, "global_step": 465058, "epoch": 5603} {"train_loss": -26.502180099487305, "global_step": 465059, "epoch": 5603} {"train_loss": -26.77972984313965, "global_step": 465060, "epoch": 5603} {"train_loss": -27.1182861328125, "global_step": 465061, "epoch": 5603} {"train_loss": -26.324127197265625, "global_step": 465062, "epoch": 5603} {"train_loss": -27.094451904296875, "global_step": 465063, "epoch": 5603} {"train_loss": -26.543842315673828, "global_step": 465064, "epoch": 5603} {"train_loss": -26.970808029174805, "global_step": 465065, "epoch": 5603} {"train_loss": -27.016067504882812, "global_step": 465066, "epoch": 5603} {"train_loss": -26.994403839111328, "global_step": 465067, "epoch": 5603} {"train_loss": -27.1002254486084, "global_step": 465068, "epoch": 5603} {"train_loss": -27.20167350769043, "global_step": 465069, "epoch": 5603} {"train_loss": -26.84083366394043, "global_step": 465070, "epoch": 5603} {"train_loss": -27.05476951599121, "global_step": 465071, "epoch": 5603} {"train_loss": -27.057470321655273, "global_step": 465072, "epoch": 5603} {"train_loss": -27.087575912475586, "global_step": 465073, "epoch": 5603} {"train_loss": -27.060461044311523, "global_step": 465074, "epoch": 5603} {"train_loss": -26.93682289123535, "global_step": 465075, "epoch": 5603} {"train_loss": -27.314184188842773, "global_step": 465076, "epoch": 5603} {"train_loss": -27.08321189880371, "global_step": 465077, "epoch": 5603} {"train_loss": -27.147008895874023, "global_step": 465078, "epoch": 5603} {"train_loss": -27.195478439331055, "global_step": 465079, "epoch": 5603} {"train_loss": -27.14995765686035, "global_step": 465080, "epoch": 5603} {"train_loss": -27.083234786987305, "global_step": 465081, "epoch": 5603} {"train_loss": -27.09112548828125, "global_step": 465082, "epoch": 5603} {"train_loss": -27.26346206665039, "global_step": 465083, "epoch": 5603} {"train_loss": -27.144437789916992, "global_step": 465084, "epoch": 5603} {"train_loss": -27.200483322143555, "global_step": 465085, "epoch": 5603} {"train_loss": -27.1700496673584, "global_step": 465086, "epoch": 5603} {"train_loss": -26.909778594970703, "global_step": 465087, "epoch": 5603} {"train_loss": -27.20194435119629, "global_step": 465088, "epoch": 5603} {"train_loss": -27.115842819213867, "global_step": 465089, "epoch": 5603} {"train_loss": -27.148914337158203, "global_step": 465090, "epoch": 5603} {"train_loss": -27.278949737548828, "global_step": 465091, "epoch": 5603} {"train_loss": -27.155561447143555, "global_step": 465092, "epoch": 5603} {"train_loss": -27.556562423706055, "global_step": 465093, "epoch": 5603} {"train_loss": -27.162296295166016, "global_step": 465094, "epoch": 5603} {"train_loss": -27.231983184814453, "global_step": 465095, "epoch": 5603} {"train_loss": -27.4052791595459, "global_step": 465096, "epoch": 5603} {"train_loss": -26.87565040588379, "global_step": 465097, "epoch": 5603} {"train_loss": -27.04132080078125, "global_step": 465098, "epoch": 5603} {"train_loss": -27.463855743408203, "global_step": 465099, "epoch": 5603} {"train_loss": -27.20699119567871, "global_step": 465100, "epoch": 5603} {"train_loss": -27.282190322875977, "global_step": 465101, "epoch": 5603} {"train_loss": -27.0991153717041, "global_step": 465102, "epoch": 5603} {"train_loss": -26.749225616455078, "global_step": 465103, "epoch": 5603} {"train_loss": -26.97711753845215, "global_step": 465104, "epoch": 5603} {"train_loss": -27.111881256103516, "global_step": 465105, "epoch": 5603} {"train_loss": -27.098825454711914, "global_step": 465106, "epoch": 5603} {"train_loss": -26.737747192382812, "global_step": 465107, "epoch": 5603} {"train_loss": -26.90479850769043, "global_step": 465108, "epoch": 5603} {"train_loss": -26.933027267456055, "global_step": 465109, "epoch": 5603} {"train_loss": -26.954349517822266, "global_step": 465110, "epoch": 5603} {"train_loss": -26.993478775024414, "global_step": 465111, "epoch": 5603} {"train_loss": -27.03379249572754, "global_step": 465112, "epoch": 5603} {"train_loss": -27.294172286987305, "global_step": 465113, "epoch": 5603} {"train_loss": -26.74649429321289, "global_step": 465114, "epoch": 5603} {"train_loss": -27.140308380126953, "global_step": 465115, "epoch": 5603} {"train_loss": -27.409320831298828, "global_step": 465116, "epoch": 5603} {"train_loss": -27.11712074279785, "global_step": 465117, "epoch": 5603} {"train_loss": -27.30426025390625, "global_step": 465118, "epoch": 5603} {"train_loss": -27.2705078125, "global_step": 465119, "epoch": 5603} {"train_loss": -27.64565086364746, "global_step": 465120, "epoch": 5603} {"train_loss": -27.18079948425293, "global_step": 465121, "epoch": 5603} {"train_loss": -27.320898056030273, "global_step": 465122, "epoch": 5603} {"train_loss": -27.103271484375, "global_step": 465123, "epoch": 5603} {"train_loss": -27.73921775817871, "global_step": 465124, "epoch": 5603} {"train_loss": -27.334226608276367, "global_step": 465125, "epoch": 5603} {"train_loss": -27.349340438842773, "global_step": 465126, "epoch": 5603} {"train_loss": -27.44990348815918, "global_step": 465127, "epoch": 5603} {"train_loss": -27.548969268798828, "global_step": 465128, "epoch": 5603} {"train_loss": -27.15485954284668, "global_step": 465129, "epoch": 5603} {"train_loss": -27.2945499420166, "global_step": 465130, "epoch": 5603} {"train_loss": -27.083482098866657, "global_step": 465131, "epoch": 5603, "val_loss": 6580698.0} {"train_loss": -26.802976608276367, "global_step": 465132, "epoch": 5604} {"train_loss": -26.634464263916016, "global_step": 465133, "epoch": 5604} {"train_loss": -27.264368057250977, "global_step": 465134, "epoch": 5604} {"train_loss": -26.9893798828125, "global_step": 465135, "epoch": 5604} {"train_loss": -26.866498947143555, "global_step": 465136, "epoch": 5604} {"train_loss": -27.140735626220703, "global_step": 465137, "epoch": 5604} {"train_loss": -26.76580238342285, "global_step": 465138, "epoch": 5604} {"train_loss": -27.22722816467285, "global_step": 465139, "epoch": 5604} {"train_loss": -26.969266891479492, "global_step": 465140, "epoch": 5604} {"train_loss": -27.246789932250977, "global_step": 465141, "epoch": 5604} {"train_loss": -27.24464988708496, "global_step": 465142, "epoch": 5604} {"train_loss": -27.014789581298828, "global_step": 465143, "epoch": 5604} {"train_loss": -26.960269927978516, "global_step": 465144, "epoch": 5604} {"train_loss": -27.151025772094727, "global_step": 465145, "epoch": 5604} {"train_loss": -27.211957931518555, "global_step": 465146, "epoch": 5604} {"train_loss": -27.0982608795166, "global_step": 465147, "epoch": 5604} {"train_loss": -26.947240829467773, "global_step": 465148, "epoch": 5604} {"train_loss": -27.09113121032715, "global_step": 465149, "epoch": 5604} {"train_loss": -26.964191436767578, "global_step": 465150, "epoch": 5604} {"train_loss": -26.765233993530273, "global_step": 465151, "epoch": 5604} {"train_loss": -27.35182762145996, "global_step": 465152, "epoch": 5604} {"train_loss": -27.10391616821289, "global_step": 465153, "epoch": 5604} {"train_loss": -26.988447189331055, "global_step": 465154, "epoch": 5604} {"train_loss": -27.119226455688477, "global_step": 465155, "epoch": 5604} {"train_loss": -26.8277587890625, "global_step": 465156, "epoch": 5604} {"train_loss": -26.838977813720703, "global_step": 465157, "epoch": 5604} {"train_loss": -27.162872314453125, "global_step": 465158, "epoch": 5604} {"train_loss": -27.057865142822266, "global_step": 465159, "epoch": 5604} {"train_loss": -27.010648727416992, "global_step": 465160, "epoch": 5604} {"train_loss": -27.53061866760254, "global_step": 465161, "epoch": 5604} {"train_loss": -27.588367462158203, "global_step": 465162, "epoch": 5604} {"train_loss": -27.400144577026367, "global_step": 465163, "epoch": 5604} {"train_loss": -27.43474769592285, "global_step": 465164, "epoch": 5604} {"train_loss": -26.965734481811523, "global_step": 465165, "epoch": 5604} {"train_loss": -27.244831085205078, "global_step": 465166, "epoch": 5604} {"train_loss": -27.397790908813477, "global_step": 465167, "epoch": 5604} {"train_loss": -27.314306259155273, "global_step": 465168, "epoch": 5604} {"train_loss": -27.323286056518555, "global_step": 465169, "epoch": 5604} {"train_loss": -27.29145622253418, "global_step": 465170, "epoch": 5604} {"train_loss": -27.4339599609375, "global_step": 465171, "epoch": 5604} {"train_loss": -27.158552169799805, "global_step": 465172, "epoch": 5604} {"train_loss": -27.2559871673584, "global_step": 465173, "epoch": 5604} {"train_loss": -26.92463493347168, "global_step": 465174, "epoch": 5604} {"train_loss": -26.945234298706055, "global_step": 465175, "epoch": 5604} {"train_loss": -26.963184356689453, "global_step": 465176, "epoch": 5604} {"train_loss": -26.90399742126465, "global_step": 465177, "epoch": 5604} {"train_loss": -27.381134033203125, "global_step": 465178, "epoch": 5604} {"train_loss": -26.991270065307617, "global_step": 465179, "epoch": 5604} {"train_loss": -27.38795280456543, "global_step": 465180, "epoch": 5604} {"train_loss": -27.37493324279785, "global_step": 465181, "epoch": 5604} {"train_loss": -27.305822372436523, "global_step": 465182, "epoch": 5604} {"train_loss": -26.74224853515625, "global_step": 465183, "epoch": 5604} {"train_loss": -27.17011070251465, "global_step": 465184, "epoch": 5604} {"train_loss": -27.09698486328125, "global_step": 465185, "epoch": 5604} {"train_loss": -26.91451072692871, "global_step": 465186, "epoch": 5604} {"train_loss": -27.02008056640625, "global_step": 465187, "epoch": 5604} {"train_loss": -27.161304473876953, "global_step": 465188, "epoch": 5604} {"train_loss": -27.055402755737305, "global_step": 465189, "epoch": 5604} {"train_loss": -27.240909576416016, "global_step": 465190, "epoch": 5604} {"train_loss": -26.83845329284668, "global_step": 465191, "epoch": 5604} {"train_loss": -27.096851348876953, "global_step": 465192, "epoch": 5604} {"train_loss": -27.45521354675293, "global_step": 465193, "epoch": 5604} {"train_loss": -27.066381454467773, "global_step": 465194, "epoch": 5604} {"train_loss": -27.002588272094727, "global_step": 465195, "epoch": 5604} {"train_loss": -27.341428756713867, "global_step": 465196, "epoch": 5604} {"train_loss": -27.233381271362305, "global_step": 465197, "epoch": 5604} {"train_loss": -26.977405548095703, "global_step": 465198, "epoch": 5604} {"train_loss": -27.1408748626709, "global_step": 465199, "epoch": 5604} {"train_loss": -27.441669464111328, "global_step": 465200, "epoch": 5604} {"train_loss": -27.415319442749023, "global_step": 465201, "epoch": 5604} {"train_loss": -27.192138671875, "global_step": 465202, "epoch": 5604} {"train_loss": -27.451242446899414, "global_step": 465203, "epoch": 5604} {"train_loss": -27.350055694580078, "global_step": 465204, "epoch": 5604} {"train_loss": -27.237043380737305, "global_step": 465205, "epoch": 5604} {"train_loss": -27.227102279663086, "global_step": 465206, "epoch": 5604} {"train_loss": -27.441579818725586, "global_step": 465207, "epoch": 5604} {"train_loss": -27.05519676208496, "global_step": 465208, "epoch": 5604} {"train_loss": -27.314563751220703, "global_step": 465209, "epoch": 5604} {"train_loss": -27.448068618774414, "global_step": 465210, "epoch": 5604} {"train_loss": -27.18757438659668, "global_step": 465211, "epoch": 5604} {"train_loss": -27.500629425048828, "global_step": 465212, "epoch": 5604} {"train_loss": -27.289459228515625, "global_step": 465213, "epoch": 5604} {"train_loss": -27.164536372724786, "global_step": 465214, "epoch": 5604, "val_loss": 6602827.0} {"train_loss": -26.182373046875, "global_step": 465215, "epoch": 5605} {"train_loss": -25.30431365966797, "global_step": 465216, "epoch": 5605} {"train_loss": -25.496801376342773, "global_step": 465217, "epoch": 5605} {"train_loss": -26.508682250976562, "global_step": 465218, "epoch": 5605} {"train_loss": -26.677616119384766, "global_step": 465219, "epoch": 5605} {"train_loss": -26.379377365112305, "global_step": 465220, "epoch": 5605} {"train_loss": -26.904468536376953, "global_step": 465221, "epoch": 5605} {"train_loss": -26.34571647644043, "global_step": 465222, "epoch": 5605} {"train_loss": -26.804059982299805, "global_step": 465223, "epoch": 5605} {"train_loss": -26.376911163330078, "global_step": 465224, "epoch": 5605} {"train_loss": -26.7440185546875, "global_step": 465225, "epoch": 5605} {"train_loss": -26.860105514526367, "global_step": 465226, "epoch": 5605} {"train_loss": -26.744958877563477, "global_step": 465227, "epoch": 5605} {"train_loss": -27.089685440063477, "global_step": 465228, "epoch": 5605} {"train_loss": -26.423904418945312, "global_step": 465229, "epoch": 5605} {"train_loss": -27.18304443359375, "global_step": 465230, "epoch": 5605} {"train_loss": -26.885757446289062, "global_step": 465231, "epoch": 5605} {"train_loss": -27.066736221313477, "global_step": 465232, "epoch": 5605} {"train_loss": -27.0865535736084, "global_step": 465233, "epoch": 5605} {"train_loss": -27.229324340820312, "global_step": 465234, "epoch": 5605} {"train_loss": -27.03110694885254, "global_step": 465235, "epoch": 5605} {"train_loss": -27.200214385986328, "global_step": 465236, "epoch": 5605} {"train_loss": -26.699024200439453, "global_step": 465237, "epoch": 5605} {"train_loss": -26.9658260345459, "global_step": 465238, "epoch": 5605} {"train_loss": -27.066375732421875, "global_step": 465239, "epoch": 5605} {"train_loss": -27.391504287719727, "global_step": 465240, "epoch": 5605} {"train_loss": -27.28369140625, "global_step": 465241, "epoch": 5605} {"train_loss": -27.305566787719727, "global_step": 465242, "epoch": 5605} {"train_loss": -27.0791072845459, "global_step": 465243, "epoch": 5605} {"train_loss": -27.22416114807129, "global_step": 465244, "epoch": 5605} {"train_loss": -27.1982421875, "global_step": 465245, "epoch": 5605} {"train_loss": -27.163166046142578, "global_step": 465246, "epoch": 5605} {"train_loss": -26.892902374267578, "global_step": 465247, "epoch": 5605} {"train_loss": -27.111066818237305, "global_step": 465248, "epoch": 5605} {"train_loss": -26.750869750976562, "global_step": 465249, "epoch": 5605} {"train_loss": -26.79640007019043, "global_step": 465250, "epoch": 5605} {"train_loss": -27.198827743530273, "global_step": 465251, "epoch": 5605} {"train_loss": -26.88445472717285, "global_step": 465252, "epoch": 5605} {"train_loss": -26.79031753540039, "global_step": 465253, "epoch": 5605} {"train_loss": -27.119892120361328, "global_step": 465254, "epoch": 5605} {"train_loss": -27.00229835510254, "global_step": 465255, "epoch": 5605} {"train_loss": -26.94512367248535, "global_step": 465256, "epoch": 5605} {"train_loss": -26.89017105102539, "global_step": 465257, "epoch": 5605} {"train_loss": -26.83356285095215, "global_step": 465258, "epoch": 5605} {"train_loss": -27.19317054748535, "global_step": 465259, "epoch": 5605} {"train_loss": -27.084548950195312, "global_step": 465260, "epoch": 5605} {"train_loss": -27.274396896362305, "global_step": 465261, "epoch": 5605} {"train_loss": -26.8228702545166, "global_step": 465262, "epoch": 5605} {"train_loss": -27.366636276245117, "global_step": 465263, "epoch": 5605} {"train_loss": -26.991134643554688, "global_step": 465264, "epoch": 5605} {"train_loss": -27.114267349243164, "global_step": 465265, "epoch": 5605} {"train_loss": -26.90884780883789, "global_step": 465266, "epoch": 5605} {"train_loss": -27.254459381103516, "global_step": 465267, "epoch": 5605} {"train_loss": -27.070510864257812, "global_step": 465268, "epoch": 5605} {"train_loss": -27.1793155670166, "global_step": 465269, "epoch": 5605} {"train_loss": -27.253217697143555, "global_step": 465270, "epoch": 5605} {"train_loss": -26.818653106689453, "global_step": 465271, "epoch": 5605} {"train_loss": -27.294553756713867, "global_step": 465272, "epoch": 5605} {"train_loss": -27.26894187927246, "global_step": 465273, "epoch": 5605} {"train_loss": -27.276350021362305, "global_step": 465274, "epoch": 5605} {"train_loss": -27.079824447631836, "global_step": 465275, "epoch": 5605} {"train_loss": -27.152441024780273, "global_step": 465276, "epoch": 5605} {"train_loss": -27.508127212524414, "global_step": 465277, "epoch": 5605} {"train_loss": -27.280487060546875, "global_step": 465278, "epoch": 5605} {"train_loss": -27.1573429107666, "global_step": 465279, "epoch": 5605} {"train_loss": -26.5421199798584, "global_step": 465280, "epoch": 5605} {"train_loss": -27.452749252319336, "global_step": 465281, "epoch": 5605} {"train_loss": -27.136743545532227, "global_step": 465282, "epoch": 5605} {"train_loss": -27.003355026245117, "global_step": 465283, "epoch": 5605} {"train_loss": -27.026296615600586, "global_step": 465284, "epoch": 5605} {"train_loss": -27.2233829498291, "global_step": 465285, "epoch": 5605} {"train_loss": -27.3685359954834, "global_step": 465286, "epoch": 5605} {"train_loss": -27.280893325805664, "global_step": 465287, "epoch": 5605} {"train_loss": -27.245746612548828, "global_step": 465288, "epoch": 5605} {"train_loss": -27.688207626342773, "global_step": 465289, "epoch": 5605} {"train_loss": -27.530303955078125, "global_step": 465290, "epoch": 5605} {"train_loss": -27.457040786743164, "global_step": 465291, "epoch": 5605} {"train_loss": -27.520374298095703, "global_step": 465292, "epoch": 5605} {"train_loss": -27.208728790283203, "global_step": 465293, "epoch": 5605} {"train_loss": -27.3568172454834, "global_step": 465294, "epoch": 5605} {"train_loss": -27.199527740478516, "global_step": 465295, "epoch": 5605} {"train_loss": -27.00160789489746, "global_step": 465296, "epoch": 5605} {"train_loss": -27.006789379809277, "global_step": 465297, "epoch": 5605, "val_loss": 6605143.0} {"train_loss": -26.560047149658203, "global_step": 465298, "epoch": 5606} {"train_loss": -26.844314575195312, "global_step": 465299, "epoch": 5606} {"train_loss": -26.646011352539062, "global_step": 465300, "epoch": 5606} {"train_loss": -27.042627334594727, "global_step": 465301, "epoch": 5606} {"train_loss": -25.720962524414062, "global_step": 465302, "epoch": 5606} {"train_loss": -25.295141220092773, "global_step": 465303, "epoch": 5606} {"train_loss": -24.8482723236084, "global_step": 465304, "epoch": 5606} {"train_loss": -27.18352699279785, "global_step": 465305, "epoch": 5606} {"train_loss": -26.6783504486084, "global_step": 465306, "epoch": 5606} {"train_loss": -26.750812530517578, "global_step": 465307, "epoch": 5606} {"train_loss": -26.58420753479004, "global_step": 465308, "epoch": 5606} {"train_loss": -26.435779571533203, "global_step": 465309, "epoch": 5606} {"train_loss": -26.658802032470703, "global_step": 465310, "epoch": 5606} {"train_loss": -26.46310806274414, "global_step": 465311, "epoch": 5606} {"train_loss": -26.656452178955078, "global_step": 465312, "epoch": 5606} {"train_loss": -26.437591552734375, "global_step": 465313, "epoch": 5606} {"train_loss": -27.062793731689453, "global_step": 465314, "epoch": 5606} {"train_loss": -26.431140899658203, "global_step": 465315, "epoch": 5606} {"train_loss": -26.192758560180664, "global_step": 465316, "epoch": 5606} {"train_loss": -26.9312744140625, "global_step": 465317, "epoch": 5606} {"train_loss": -26.714801788330078, "global_step": 465318, "epoch": 5606} {"train_loss": -26.719573974609375, "global_step": 465319, "epoch": 5606} {"train_loss": -26.845998764038086, "global_step": 465320, "epoch": 5606} {"train_loss": -26.929529190063477, "global_step": 465321, "epoch": 5606} {"train_loss": -26.902074813842773, "global_step": 465322, "epoch": 5606} {"train_loss": -26.74578857421875, "global_step": 465323, "epoch": 5606} {"train_loss": -27.112348556518555, "global_step": 465324, "epoch": 5606} {"train_loss": -26.922155380249023, "global_step": 465325, "epoch": 5606} {"train_loss": -26.88413429260254, "global_step": 465326, "epoch": 5606} {"train_loss": -26.990331649780273, "global_step": 465327, "epoch": 5606} {"train_loss": -27.382352828979492, "global_step": 465328, "epoch": 5606} {"train_loss": -26.87247657775879, "global_step": 465329, "epoch": 5606} {"train_loss": -26.79202651977539, "global_step": 465330, "epoch": 5606} {"train_loss": -26.71630859375, "global_step": 465331, "epoch": 5606} {"train_loss": -27.21026039123535, "global_step": 465332, "epoch": 5606} {"train_loss": -26.958662033081055, "global_step": 465333, "epoch": 5606} {"train_loss": -27.489856719970703, "global_step": 465334, "epoch": 5606} {"train_loss": -27.125152587890625, "global_step": 465335, "epoch": 5606} {"train_loss": -27.261322021484375, "global_step": 465336, "epoch": 5606} {"train_loss": -27.192678451538086, "global_step": 465337, "epoch": 5606} {"train_loss": -27.43267250061035, "global_step": 465338, "epoch": 5606} {"train_loss": -27.177692413330078, "global_step": 465339, "epoch": 5606} {"train_loss": -27.437835693359375, "global_step": 465340, "epoch": 5606} {"train_loss": -27.03022575378418, "global_step": 465341, "epoch": 5606} {"train_loss": -27.20975685119629, "global_step": 465342, "epoch": 5606} {"train_loss": -27.496383666992188, "global_step": 465343, "epoch": 5606} {"train_loss": -27.056257247924805, "global_step": 465344, "epoch": 5606} {"train_loss": -27.27432632446289, "global_step": 465345, "epoch": 5606} {"train_loss": -26.99257469177246, "global_step": 465346, "epoch": 5606} {"train_loss": -26.953454971313477, "global_step": 465347, "epoch": 5606} {"train_loss": -27.127832412719727, "global_step": 465348, "epoch": 5606} {"train_loss": -27.00214195251465, "global_step": 465349, "epoch": 5606} {"train_loss": -26.8623104095459, "global_step": 465350, "epoch": 5606} {"train_loss": -27.074359893798828, "global_step": 465351, "epoch": 5606} {"train_loss": -27.1284236907959, "global_step": 465352, "epoch": 5606} {"train_loss": -27.059961318969727, "global_step": 465353, "epoch": 5606} {"train_loss": -27.307331085205078, "global_step": 465354, "epoch": 5606} {"train_loss": -26.9101619720459, "global_step": 465355, "epoch": 5606} {"train_loss": -26.9274845123291, "global_step": 465356, "epoch": 5606} {"train_loss": -26.987903594970703, "global_step": 465357, "epoch": 5606} {"train_loss": -26.84967613220215, "global_step": 465358, "epoch": 5606} {"train_loss": -27.196273803710938, "global_step": 465359, "epoch": 5606} {"train_loss": -27.274518966674805, "global_step": 465360, "epoch": 5606} {"train_loss": -26.7877197265625, "global_step": 465361, "epoch": 5606} {"train_loss": -26.97865104675293, "global_step": 465362, "epoch": 5606} {"train_loss": -26.642520904541016, "global_step": 465363, "epoch": 5606} {"train_loss": -26.833454132080078, "global_step": 465364, "epoch": 5606} {"train_loss": -26.895217895507812, "global_step": 465365, "epoch": 5606} {"train_loss": -27.22623634338379, "global_step": 465366, "epoch": 5606} {"train_loss": -26.916025161743164, "global_step": 465367, "epoch": 5606} {"train_loss": -27.316373825073242, "global_step": 465368, "epoch": 5606} {"train_loss": -27.00612449645996, "global_step": 465369, "epoch": 5606} {"train_loss": -27.125385284423828, "global_step": 465370, "epoch": 5606} {"train_loss": -26.537500381469727, "global_step": 465371, "epoch": 5606} {"train_loss": -27.271991729736328, "global_step": 465372, "epoch": 5606} {"train_loss": -26.970563888549805, "global_step": 465373, "epoch": 5606} {"train_loss": -27.213409423828125, "global_step": 465374, "epoch": 5606} {"train_loss": -26.84844970703125, "global_step": 465375, "epoch": 5606} {"train_loss": -26.673994064331055, "global_step": 465376, "epoch": 5606} {"train_loss": -26.94770622253418, "global_step": 465377, "epoch": 5606} {"train_loss": -26.84669303894043, "global_step": 465378, "epoch": 5606} {"train_loss": -26.9926815032959, "global_step": 465379, "epoch": 5606} {"train_loss": -26.879343676279827, "global_step": 465380, "epoch": 5606, "val_loss": 6574987.0} {"train_loss": -26.543548583984375, "global_step": 465381, "epoch": 5607} {"train_loss": -26.770843505859375, "global_step": 465382, "epoch": 5607} {"train_loss": -26.838354110717773, "global_step": 465383, "epoch": 5607} {"train_loss": -26.560415267944336, "global_step": 465384, "epoch": 5607} {"train_loss": -26.70928382873535, "global_step": 465385, "epoch": 5607} {"train_loss": -27.220457077026367, "global_step": 465386, "epoch": 5607} {"train_loss": -26.5617618560791, "global_step": 465387, "epoch": 5607} {"train_loss": -26.699201583862305, "global_step": 465388, "epoch": 5607} {"train_loss": -26.99506950378418, "global_step": 465389, "epoch": 5607} {"train_loss": -26.72320556640625, "global_step": 465390, "epoch": 5607} {"train_loss": -26.84760093688965, "global_step": 465391, "epoch": 5607} {"train_loss": -27.07195472717285, "global_step": 465392, "epoch": 5607} {"train_loss": -26.961851119995117, "global_step": 465393, "epoch": 5607} {"train_loss": -26.529687881469727, "global_step": 465394, "epoch": 5607} {"train_loss": -27.085205078125, "global_step": 465395, "epoch": 5607} {"train_loss": -27.021717071533203, "global_step": 465396, "epoch": 5607} {"train_loss": -26.6853084564209, "global_step": 465397, "epoch": 5607} {"train_loss": -27.0064697265625, "global_step": 465398, "epoch": 5607} {"train_loss": -27.1600341796875, "global_step": 465399, "epoch": 5607} {"train_loss": -26.885364532470703, "global_step": 465400, "epoch": 5607} {"train_loss": -26.708789825439453, "global_step": 465401, "epoch": 5607} {"train_loss": -26.985952377319336, "global_step": 465402, "epoch": 5607} {"train_loss": -27.040185928344727, "global_step": 465403, "epoch": 5607} {"train_loss": -26.981897354125977, "global_step": 465404, "epoch": 5607} {"train_loss": -27.40030860900879, "global_step": 465405, "epoch": 5607} {"train_loss": -27.16388511657715, "global_step": 465406, "epoch": 5607} {"train_loss": -26.865686416625977, "global_step": 465407, "epoch": 5607} {"train_loss": -27.266223907470703, "global_step": 465408, "epoch": 5607} {"train_loss": -27.13913345336914, "global_step": 465409, "epoch": 5607} {"train_loss": -27.1402530670166, "global_step": 465410, "epoch": 5607} {"train_loss": -27.081501007080078, "global_step": 465411, "epoch": 5607} {"train_loss": -27.467294692993164, "global_step": 465412, "epoch": 5607} {"train_loss": -26.93310546875, "global_step": 465413, "epoch": 5607} {"train_loss": -27.470947265625, "global_step": 465414, "epoch": 5607} {"train_loss": -27.272552490234375, "global_step": 465415, "epoch": 5607} {"train_loss": -27.13973045349121, "global_step": 465416, "epoch": 5607} {"train_loss": -27.21526527404785, "global_step": 465417, "epoch": 5607} {"train_loss": -26.937992095947266, "global_step": 465418, "epoch": 5607} {"train_loss": -27.014123916625977, "global_step": 465419, "epoch": 5607} {"train_loss": -27.429672241210938, "global_step": 465420, "epoch": 5607} {"train_loss": -27.01091957092285, "global_step": 465421, "epoch": 5607} {"train_loss": -26.966373443603516, "global_step": 465422, "epoch": 5607} {"train_loss": -27.78310203552246, "global_step": 465423, "epoch": 5607} {"train_loss": -27.771991729736328, "global_step": 465424, "epoch": 5607} {"train_loss": -26.86813735961914, "global_step": 465425, "epoch": 5607} {"train_loss": -26.999515533447266, "global_step": 465426, "epoch": 5607} {"train_loss": -27.144306182861328, "global_step": 465427, "epoch": 5607} {"train_loss": -27.192407608032227, "global_step": 465428, "epoch": 5607} {"train_loss": -27.227991104125977, "global_step": 465429, "epoch": 5607} {"train_loss": -26.915515899658203, "global_step": 465430, "epoch": 5607} {"train_loss": -27.106027603149414, "global_step": 465431, "epoch": 5607} {"train_loss": -27.24830436706543, "global_step": 465432, "epoch": 5607} {"train_loss": -27.482471466064453, "global_step": 465433, "epoch": 5607} {"train_loss": -27.327234268188477, "global_step": 465434, "epoch": 5607} {"train_loss": -27.42487907409668, "global_step": 465435, "epoch": 5607} {"train_loss": -27.10139274597168, "global_step": 465436, "epoch": 5607} {"train_loss": -27.397384643554688, "global_step": 465437, "epoch": 5607} {"train_loss": -27.70224380493164, "global_step": 465438, "epoch": 5607} {"train_loss": -27.167394638061523, "global_step": 465439, "epoch": 5607} {"train_loss": -27.309919357299805, "global_step": 465440, "epoch": 5607} {"train_loss": -26.808563232421875, "global_step": 465441, "epoch": 5607} {"train_loss": -26.692975997924805, "global_step": 465442, "epoch": 5607} {"train_loss": -26.11677360534668, "global_step": 465443, "epoch": 5607} {"train_loss": -26.35337257385254, "global_step": 465444, "epoch": 5607} {"train_loss": -27.008991241455078, "global_step": 465445, "epoch": 5607} {"train_loss": -27.167312622070312, "global_step": 465446, "epoch": 5607} {"train_loss": -27.114425659179688, "global_step": 465447, "epoch": 5607} {"train_loss": -27.357580184936523, "global_step": 465448, "epoch": 5607} {"train_loss": -26.974721908569336, "global_step": 465449, "epoch": 5607} {"train_loss": -27.528705596923828, "global_step": 465450, "epoch": 5607} {"train_loss": -27.038726806640625, "global_step": 465451, "epoch": 5607} {"train_loss": -27.381072998046875, "global_step": 465452, "epoch": 5607} {"train_loss": -26.677371978759766, "global_step": 465453, "epoch": 5607} {"train_loss": -27.316848754882812, "global_step": 465454, "epoch": 5607} {"train_loss": -27.177709579467773, "global_step": 465455, "epoch": 5607} {"train_loss": -26.694812774658203, "global_step": 465456, "epoch": 5607} {"train_loss": -26.411874771118164, "global_step": 465457, "epoch": 5607} {"train_loss": -26.575178146362305, "global_step": 465458, "epoch": 5607} {"train_loss": -26.199996948242188, "global_step": 465459, "epoch": 5607} {"train_loss": -26.923751831054688, "global_step": 465460, "epoch": 5607} {"train_loss": -26.676483154296875, "global_step": 465461, "epoch": 5607} {"train_loss": -26.515960693359375, "global_step": 465462, "epoch": 5607} {"train_loss": -27.00520793501153, "global_step": 465463, "epoch": 5607, "val_loss": 6573958.0} {"train_loss": -25.86948013305664, "global_step": 465464, "epoch": 5608} {"train_loss": -26.08908462524414, "global_step": 465465, "epoch": 5608} {"train_loss": -26.4677734375, "global_step": 465466, "epoch": 5608} {"train_loss": -26.457355499267578, "global_step": 465467, "epoch": 5608} {"train_loss": -26.19880485534668, "global_step": 465468, "epoch": 5608} {"train_loss": -25.534883499145508, "global_step": 465469, "epoch": 5608} {"train_loss": -26.533849716186523, "global_step": 465470, "epoch": 5608} {"train_loss": -26.49655532836914, "global_step": 465471, "epoch": 5608} {"train_loss": -26.704364776611328, "global_step": 465472, "epoch": 5608} {"train_loss": -26.453882217407227, "global_step": 465473, "epoch": 5608} {"train_loss": -26.31485366821289, "global_step": 465474, "epoch": 5608} {"train_loss": -26.524478912353516, "global_step": 465475, "epoch": 5608} {"train_loss": -26.810087203979492, "global_step": 465476, "epoch": 5608} {"train_loss": -26.3648681640625, "global_step": 465477, "epoch": 5608} {"train_loss": -26.52088737487793, "global_step": 465478, "epoch": 5608} {"train_loss": -26.495513916015625, "global_step": 465479, "epoch": 5608} {"train_loss": -26.269941329956055, "global_step": 465480, "epoch": 5608} {"train_loss": -26.465301513671875, "global_step": 465481, "epoch": 5608} {"train_loss": -26.533227920532227, "global_step": 465482, "epoch": 5608} {"train_loss": -26.828535079956055, "global_step": 465483, "epoch": 5608} {"train_loss": -26.879499435424805, "global_step": 465484, "epoch": 5608} {"train_loss": -26.59950065612793, "global_step": 465485, "epoch": 5608} {"train_loss": -27.193647384643555, "global_step": 465486, "epoch": 5608} {"train_loss": -26.8387508392334, "global_step": 465487, "epoch": 5608} {"train_loss": -27.002134323120117, "global_step": 465488, "epoch": 5608} {"train_loss": -26.7352352142334, "global_step": 465489, "epoch": 5608} {"train_loss": -26.605260848999023, "global_step": 465490, "epoch": 5608} {"train_loss": -26.952009201049805, "global_step": 465491, "epoch": 5608} {"train_loss": -26.88763999938965, "global_step": 465492, "epoch": 5608} {"train_loss": -26.790836334228516, "global_step": 465493, "epoch": 5608} {"train_loss": -27.048267364501953, "global_step": 465494, "epoch": 5608} {"train_loss": -27.137937545776367, "global_step": 465495, "epoch": 5608} {"train_loss": -27.26653480529785, "global_step": 465496, "epoch": 5608} {"train_loss": -26.62013053894043, "global_step": 465497, "epoch": 5608} {"train_loss": -26.988388061523438, "global_step": 465498, "epoch": 5608} {"train_loss": -27.124862670898438, "global_step": 465499, "epoch": 5608} {"train_loss": -26.977054595947266, "global_step": 465500, "epoch": 5608} {"train_loss": -27.285505294799805, "global_step": 465501, "epoch": 5608} {"train_loss": -26.973941802978516, "global_step": 465502, "epoch": 5608} {"train_loss": -27.518695831298828, "global_step": 465503, "epoch": 5608} {"train_loss": -27.050825119018555, "global_step": 465504, "epoch": 5608} {"train_loss": -27.179296493530273, "global_step": 465505, "epoch": 5608} {"train_loss": -27.31611442565918, "global_step": 465506, "epoch": 5608} {"train_loss": -27.06501579284668, "global_step": 465507, "epoch": 5608} {"train_loss": -27.1762638092041, "global_step": 465508, "epoch": 5608} {"train_loss": -27.067590713500977, "global_step": 465509, "epoch": 5608} {"train_loss": -27.126983642578125, "global_step": 465510, "epoch": 5608} {"train_loss": -27.311283111572266, "global_step": 465511, "epoch": 5608} {"train_loss": -27.54129409790039, "global_step": 465512, "epoch": 5608} {"train_loss": -27.48927116394043, "global_step": 465513, "epoch": 5608} {"train_loss": -27.078588485717773, "global_step": 465514, "epoch": 5608} {"train_loss": -27.23284339904785, "global_step": 465515, "epoch": 5608} {"train_loss": -27.318296432495117, "global_step": 465516, "epoch": 5608} {"train_loss": -27.242639541625977, "global_step": 465517, "epoch": 5608} {"train_loss": -27.047719955444336, "global_step": 465518, "epoch": 5608} {"train_loss": -27.37055778503418, "global_step": 465519, "epoch": 5608} {"train_loss": -27.1169376373291, "global_step": 465520, "epoch": 5608} {"train_loss": -27.66204833984375, "global_step": 465521, "epoch": 5608} {"train_loss": -27.169294357299805, "global_step": 465522, "epoch": 5608} {"train_loss": -27.17392349243164, "global_step": 465523, "epoch": 5608} {"train_loss": -27.43914222717285, "global_step": 465524, "epoch": 5608} {"train_loss": -27.17047119140625, "global_step": 465525, "epoch": 5608} {"train_loss": -27.07257080078125, "global_step": 465526, "epoch": 5608} {"train_loss": -27.07525634765625, "global_step": 465527, "epoch": 5608} {"train_loss": -27.26555824279785, "global_step": 465528, "epoch": 5608} {"train_loss": -27.254735946655273, "global_step": 465529, "epoch": 5608} {"train_loss": -27.16974449157715, "global_step": 465530, "epoch": 5608} {"train_loss": -27.269201278686523, "global_step": 465531, "epoch": 5608} {"train_loss": -27.199951171875, "global_step": 465532, "epoch": 5608} {"train_loss": -27.331708908081055, "global_step": 465533, "epoch": 5608} {"train_loss": -27.170515060424805, "global_step": 465534, "epoch": 5608} {"train_loss": -27.20664405822754, "global_step": 465535, "epoch": 5608} {"train_loss": -27.047224044799805, "global_step": 465536, "epoch": 5608} {"train_loss": -27.085168838500977, "global_step": 465537, "epoch": 5608} {"train_loss": -27.262496948242188, "global_step": 465538, "epoch": 5608} {"train_loss": -27.4747371673584, "global_step": 465539, "epoch": 5608} {"train_loss": -27.17348289489746, "global_step": 465540, "epoch": 5608} {"train_loss": -27.532611846923828, "global_step": 465541, "epoch": 5608} {"train_loss": -27.125049591064453, "global_step": 465542, "epoch": 5608} {"train_loss": -26.938589096069336, "global_step": 465543, "epoch": 5608} {"train_loss": -26.924274444580078, "global_step": 465544, "epoch": 5608} {"train_loss": -27.075742721557617, "global_step": 465545, "epoch": 5608} {"train_loss": -26.966105472610657, "global_step": 465546, "epoch": 5608, "val_loss": 6590001.0} {"train_loss": -26.732257843017578, "global_step": 465547, "epoch": 5609} {"train_loss": -26.558576583862305, "global_step": 465548, "epoch": 5609} {"train_loss": -25.767566680908203, "global_step": 465549, "epoch": 5609} {"train_loss": -26.39908218383789, "global_step": 465550, "epoch": 5609} {"train_loss": -26.863073348999023, "global_step": 465551, "epoch": 5609} {"train_loss": -25.80938148498535, "global_step": 465552, "epoch": 5609} {"train_loss": -26.665136337280273, "global_step": 465553, "epoch": 5609} {"train_loss": -26.33755874633789, "global_step": 465554, "epoch": 5609} {"train_loss": -26.537214279174805, "global_step": 465555, "epoch": 5609} {"train_loss": -26.728628158569336, "global_step": 465556, "epoch": 5609} {"train_loss": -26.697940826416016, "global_step": 465557, "epoch": 5609} {"train_loss": -27.11835289001465, "global_step": 465558, "epoch": 5609} {"train_loss": -26.688093185424805, "global_step": 465559, "epoch": 5609} {"train_loss": -27.0288143157959, "global_step": 465560, "epoch": 5609} {"train_loss": -26.953962326049805, "global_step": 465561, "epoch": 5609} {"train_loss": -27.10706901550293, "global_step": 465562, "epoch": 5609} {"train_loss": -26.977033615112305, "global_step": 465563, "epoch": 5609} {"train_loss": -27.0482234954834, "global_step": 465564, "epoch": 5609} {"train_loss": -26.78394889831543, "global_step": 465565, "epoch": 5609} {"train_loss": -27.147632598876953, "global_step": 465566, "epoch": 5609} {"train_loss": -27.020673751831055, "global_step": 465567, "epoch": 5609} {"train_loss": -26.8764705657959, "global_step": 465568, "epoch": 5609} {"train_loss": -26.87885856628418, "global_step": 465569, "epoch": 5609} {"train_loss": -27.001819610595703, "global_step": 465570, "epoch": 5609} {"train_loss": -27.369083404541016, "global_step": 465571, "epoch": 5609} {"train_loss": -26.9893741607666, "global_step": 465572, "epoch": 5609} {"train_loss": -27.003015518188477, "global_step": 465573, "epoch": 5609} {"train_loss": -27.454206466674805, "global_step": 465574, "epoch": 5609} {"train_loss": -27.12408447265625, "global_step": 465575, "epoch": 5609} {"train_loss": -27.486902236938477, "global_step": 465576, "epoch": 5609} {"train_loss": -27.12567138671875, "global_step": 465577, "epoch": 5609} {"train_loss": -27.40207290649414, "global_step": 465578, "epoch": 5609} {"train_loss": -27.1391658782959, "global_step": 465579, "epoch": 5609} {"train_loss": -27.131855010986328, "global_step": 465580, "epoch": 5609} {"train_loss": -27.23664665222168, "global_step": 465581, "epoch": 5609} {"train_loss": -27.17087745666504, "global_step": 465582, "epoch": 5609} {"train_loss": -27.366369247436523, "global_step": 465583, "epoch": 5609} {"train_loss": -27.166824340820312, "global_step": 465584, "epoch": 5609} {"train_loss": -27.099023818969727, "global_step": 465585, "epoch": 5609} {"train_loss": -27.124799728393555, "global_step": 465586, "epoch": 5609} {"train_loss": -27.330270767211914, "global_step": 465587, "epoch": 5609} {"train_loss": -27.213987350463867, "global_step": 465588, "epoch": 5609} {"train_loss": -26.799427032470703, "global_step": 465589, "epoch": 5609} {"train_loss": -26.6722412109375, "global_step": 465590, "epoch": 5609} {"train_loss": -27.448522567749023, "global_step": 465591, "epoch": 5609} {"train_loss": -26.8232479095459, "global_step": 465592, "epoch": 5609} {"train_loss": -26.72528076171875, "global_step": 465593, "epoch": 5609} {"train_loss": -27.158981323242188, "global_step": 465594, "epoch": 5609} {"train_loss": -27.16851806640625, "global_step": 465595, "epoch": 5609} {"train_loss": -26.842111587524414, "global_step": 465596, "epoch": 5609} {"train_loss": -26.93593406677246, "global_step": 465597, "epoch": 5609} {"train_loss": -27.313459396362305, "global_step": 465598, "epoch": 5609} {"train_loss": -27.143468856811523, "global_step": 465599, "epoch": 5609} {"train_loss": -27.10318946838379, "global_step": 465600, "epoch": 5609} {"train_loss": -26.966955184936523, "global_step": 465601, "epoch": 5609} {"train_loss": -27.539539337158203, "global_step": 465602, "epoch": 5609} {"train_loss": -27.151315689086914, "global_step": 465603, "epoch": 5609} {"train_loss": -27.377660751342773, "global_step": 465604, "epoch": 5609} {"train_loss": -26.5618953704834, "global_step": 465605, "epoch": 5609} {"train_loss": -26.7648983001709, "global_step": 465606, "epoch": 5609} {"train_loss": -26.776941299438477, "global_step": 465607, "epoch": 5609} {"train_loss": -27.0723876953125, "global_step": 465608, "epoch": 5609} {"train_loss": -27.032062530517578, "global_step": 465609, "epoch": 5609} {"train_loss": -27.11328125, "global_step": 465610, "epoch": 5609} {"train_loss": -26.761198043823242, "global_step": 465611, "epoch": 5609} {"train_loss": -27.0892276763916, "global_step": 465612, "epoch": 5609} {"train_loss": -27.140625, "global_step": 465613, "epoch": 5609} {"train_loss": -27.05230140686035, "global_step": 465614, "epoch": 5609} {"train_loss": -27.203216552734375, "global_step": 465615, "epoch": 5609} {"train_loss": -26.939401626586914, "global_step": 465616, "epoch": 5609} {"train_loss": -27.121295928955078, "global_step": 465617, "epoch": 5609} {"train_loss": -27.396467208862305, "global_step": 465618, "epoch": 5609} {"train_loss": -27.223224639892578, "global_step": 465619, "epoch": 5609} {"train_loss": -27.01420021057129, "global_step": 465620, "epoch": 5609} {"train_loss": -27.395002365112305, "global_step": 465621, "epoch": 5609} {"train_loss": -26.76495361328125, "global_step": 465622, "epoch": 5609} {"train_loss": -27.207672119140625, "global_step": 465623, "epoch": 5609} {"train_loss": -26.977502822875977, "global_step": 465624, "epoch": 5609} {"train_loss": -27.27213478088379, "global_step": 465625, "epoch": 5609} {"train_loss": -27.482086181640625, "global_step": 465626, "epoch": 5609} {"train_loss": -27.663013458251953, "global_step": 465627, "epoch": 5609} {"train_loss": -27.388837814331055, "global_step": 465628, "epoch": 5609} {"train_loss": -27.013528157429523, "global_step": 465629, "epoch": 5609, "val_loss": 6596461.0} {"train_loss": -26.922195434570312, "global_step": 465630, "epoch": 5610} {"train_loss": -27.076862335205078, "global_step": 465631, "epoch": 5610} {"train_loss": -26.6140079498291, "global_step": 465632, "epoch": 5610} {"train_loss": -26.377063751220703, "global_step": 465633, "epoch": 5610} {"train_loss": -26.826557159423828, "global_step": 465634, "epoch": 5610} {"train_loss": -26.705259323120117, "global_step": 465635, "epoch": 5610} {"train_loss": -26.59686279296875, "global_step": 465636, "epoch": 5610} {"train_loss": -26.38545799255371, "global_step": 465637, "epoch": 5610} {"train_loss": -26.753345489501953, "global_step": 465638, "epoch": 5610} {"train_loss": -26.763586044311523, "global_step": 465639, "epoch": 5610} {"train_loss": -26.710912704467773, "global_step": 465640, "epoch": 5610} {"train_loss": -26.674041748046875, "global_step": 465641, "epoch": 5610} {"train_loss": -26.618993759155273, "global_step": 465642, "epoch": 5610} {"train_loss": -27.1359920501709, "global_step": 465643, "epoch": 5610} {"train_loss": -26.9980411529541, "global_step": 465644, "epoch": 5610} {"train_loss": -26.342376708984375, "global_step": 465645, "epoch": 5610} {"train_loss": -26.66259765625, "global_step": 465646, "epoch": 5610} {"train_loss": -26.651325225830078, "global_step": 465647, "epoch": 5610} {"train_loss": -26.826093673706055, "global_step": 465648, "epoch": 5610} {"train_loss": -26.81804847717285, "global_step": 465649, "epoch": 5610} {"train_loss": -26.54816246032715, "global_step": 465650, "epoch": 5610} {"train_loss": -26.615219116210938, "global_step": 465651, "epoch": 5610} {"train_loss": -27.295270919799805, "global_step": 465652, "epoch": 5610} {"train_loss": -26.87074089050293, "global_step": 465653, "epoch": 5610} {"train_loss": -27.08790397644043, "global_step": 465654, "epoch": 5610} {"train_loss": -27.15155601501465, "global_step": 465655, "epoch": 5610} {"train_loss": -26.957761764526367, "global_step": 465656, "epoch": 5610} {"train_loss": -26.938385009765625, "global_step": 465657, "epoch": 5610} {"train_loss": -26.897632598876953, "global_step": 465658, "epoch": 5610} {"train_loss": -26.97292137145996, "global_step": 465659, "epoch": 5610} {"train_loss": -27.343236923217773, "global_step": 465660, "epoch": 5610} {"train_loss": -27.082773208618164, "global_step": 465661, "epoch": 5610} {"train_loss": -27.201929092407227, "global_step": 465662, "epoch": 5610} {"train_loss": -26.52363395690918, "global_step": 465663, "epoch": 5610} {"train_loss": -26.882415771484375, "global_step": 465664, "epoch": 5610} {"train_loss": -26.648202896118164, "global_step": 465665, "epoch": 5610} {"train_loss": -27.047433853149414, "global_step": 465666, "epoch": 5610} {"train_loss": -27.265979766845703, "global_step": 465667, "epoch": 5610} {"train_loss": -26.88300132751465, "global_step": 465668, "epoch": 5610} {"train_loss": -27.12556266784668, "global_step": 465669, "epoch": 5610} {"train_loss": -27.014394760131836, "global_step": 465670, "epoch": 5610} {"train_loss": -27.19011878967285, "global_step": 465671, "epoch": 5610} {"train_loss": -27.357288360595703, "global_step": 465672, "epoch": 5610} {"train_loss": -26.966968536376953, "global_step": 465673, "epoch": 5610} {"train_loss": -26.986175537109375, "global_step": 465674, "epoch": 5610} {"train_loss": -26.884723663330078, "global_step": 465675, "epoch": 5610} {"train_loss": -27.380817413330078, "global_step": 465676, "epoch": 5610} {"train_loss": -27.2626895904541, "global_step": 465677, "epoch": 5610} {"train_loss": -27.41335105895996, "global_step": 465678, "epoch": 5610} {"train_loss": -27.048614501953125, "global_step": 465679, "epoch": 5610} {"train_loss": -27.053552627563477, "global_step": 465680, "epoch": 5610} {"train_loss": -27.180683135986328, "global_step": 465681, "epoch": 5610} {"train_loss": -27.711042404174805, "global_step": 465682, "epoch": 5610} {"train_loss": -27.38612174987793, "global_step": 465683, "epoch": 5610} {"train_loss": -27.173114776611328, "global_step": 465684, "epoch": 5610} {"train_loss": -27.337921142578125, "global_step": 465685, "epoch": 5610} {"train_loss": -27.44424819946289, "global_step": 465686, "epoch": 5610} {"train_loss": -27.462472915649414, "global_step": 465687, "epoch": 5610} {"train_loss": -27.021808624267578, "global_step": 465688, "epoch": 5610} {"train_loss": -27.57777976989746, "global_step": 465689, "epoch": 5610} {"train_loss": -27.285221099853516, "global_step": 465690, "epoch": 5610} {"train_loss": -27.142044067382812, "global_step": 465691, "epoch": 5610} {"train_loss": -27.496225357055664, "global_step": 465692, "epoch": 5610} {"train_loss": -27.315839767456055, "global_step": 465693, "epoch": 5610} {"train_loss": -27.62371253967285, "global_step": 465694, "epoch": 5610} {"train_loss": -27.43881607055664, "global_step": 465695, "epoch": 5610} {"train_loss": -27.3177433013916, "global_step": 465696, "epoch": 5610} {"train_loss": -27.26673698425293, "global_step": 465697, "epoch": 5610} {"train_loss": -27.3828067779541, "global_step": 465698, "epoch": 5610} {"train_loss": -26.916858673095703, "global_step": 465699, "epoch": 5610} {"train_loss": -27.213186264038086, "global_step": 465700, "epoch": 5610} {"train_loss": -26.631824493408203, "global_step": 465701, "epoch": 5610} {"train_loss": -26.032175064086914, "global_step": 465702, "epoch": 5610} {"train_loss": -25.322265625, "global_step": 465703, "epoch": 5610} {"train_loss": -24.864429473876953, "global_step": 465704, "epoch": 5610} {"train_loss": -27.062488555908203, "global_step": 465705, "epoch": 5610} {"train_loss": -26.4473819732666, "global_step": 465706, "epoch": 5610} {"train_loss": -26.557462692260742, "global_step": 465707, "epoch": 5610} {"train_loss": -26.453052520751953, "global_step": 465708, "epoch": 5610} {"train_loss": -26.584806442260742, "global_step": 465709, "epoch": 5610} {"train_loss": -26.35157585144043, "global_step": 465710, "epoch": 5610} {"train_loss": -27.295679092407227, "global_step": 465711, "epoch": 5610} {"train_loss": -26.91685212376606, "global_step": 465712, "epoch": 5610, "val_loss": 6506527.0} {"train_loss": -26.686376571655273, "global_step": 465713, "epoch": 5611} {"train_loss": -25.962677001953125, "global_step": 465714, "epoch": 5611} {"train_loss": -26.35404396057129, "global_step": 465715, "epoch": 5611} {"train_loss": -26.528051376342773, "global_step": 465716, "epoch": 5611} {"train_loss": -25.915084838867188, "global_step": 465717, "epoch": 5611} {"train_loss": -26.420780181884766, "global_step": 465718, "epoch": 5611} {"train_loss": -26.608896255493164, "global_step": 465719, "epoch": 5611} {"train_loss": -26.552356719970703, "global_step": 465720, "epoch": 5611} {"train_loss": -26.247888565063477, "global_step": 465721, "epoch": 5611} {"train_loss": -26.327512741088867, "global_step": 465722, "epoch": 5611} {"train_loss": -26.211164474487305, "global_step": 465723, "epoch": 5611} {"train_loss": -26.288572311401367, "global_step": 465724, "epoch": 5611} {"train_loss": -26.195453643798828, "global_step": 465725, "epoch": 5611} {"train_loss": -26.599966049194336, "global_step": 465726, "epoch": 5611} {"train_loss": -26.911657333374023, "global_step": 465727, "epoch": 5611} {"train_loss": -26.747116088867188, "global_step": 465728, "epoch": 5611} {"train_loss": -26.44342041015625, "global_step": 465729, "epoch": 5611} {"train_loss": -27.226964950561523, "global_step": 465730, "epoch": 5611} {"train_loss": -26.81247329711914, "global_step": 465731, "epoch": 5611} {"train_loss": -26.713769912719727, "global_step": 465732, "epoch": 5611} {"train_loss": -26.861618041992188, "global_step": 465733, "epoch": 5611} {"train_loss": -26.9346866607666, "global_step": 465734, "epoch": 5611} {"train_loss": -26.891754150390625, "global_step": 465735, "epoch": 5611} {"train_loss": -26.7921142578125, "global_step": 465736, "epoch": 5611} {"train_loss": -26.809728622436523, "global_step": 465737, "epoch": 5611} {"train_loss": -26.92726707458496, "global_step": 465738, "epoch": 5611} {"train_loss": -27.0755615234375, "global_step": 465739, "epoch": 5611} {"train_loss": -27.108469009399414, "global_step": 465740, "epoch": 5611} {"train_loss": -26.82948875427246, "global_step": 465741, "epoch": 5611} {"train_loss": -27.09418296813965, "global_step": 465742, "epoch": 5611} {"train_loss": -27.089757919311523, "global_step": 465743, "epoch": 5611} {"train_loss": -27.024524688720703, "global_step": 465744, "epoch": 5611} {"train_loss": -27.108320236206055, "global_step": 465745, "epoch": 5611} {"train_loss": -27.10440444946289, "global_step": 465746, "epoch": 5611} {"train_loss": -27.353912353515625, "global_step": 465747, "epoch": 5611} {"train_loss": -26.93080711364746, "global_step": 465748, "epoch": 5611} {"train_loss": -27.229352951049805, "global_step": 465749, "epoch": 5611} {"train_loss": -27.024463653564453, "global_step": 465750, "epoch": 5611} {"train_loss": -27.477497100830078, "global_step": 465751, "epoch": 5611} {"train_loss": -26.999731063842773, "global_step": 465752, "epoch": 5611} {"train_loss": -27.1994571685791, "global_step": 465753, "epoch": 5611} {"train_loss": -27.139196395874023, "global_step": 465754, "epoch": 5611} {"train_loss": -26.798675537109375, "global_step": 465755, "epoch": 5611} {"train_loss": -27.1485595703125, "global_step": 465756, "epoch": 5611} {"train_loss": -27.32000160217285, "global_step": 465757, "epoch": 5611} {"train_loss": -26.937515258789062, "global_step": 465758, "epoch": 5611} {"train_loss": -27.359060287475586, "global_step": 465759, "epoch": 5611} {"train_loss": -27.603057861328125, "global_step": 465760, "epoch": 5611} {"train_loss": -27.51166343688965, "global_step": 465761, "epoch": 5611} {"train_loss": -27.12432861328125, "global_step": 465762, "epoch": 5611} {"train_loss": -27.473947525024414, "global_step": 465763, "epoch": 5611} {"train_loss": -27.40961265563965, "global_step": 465764, "epoch": 5611} {"train_loss": -27.433683395385742, "global_step": 465765, "epoch": 5611} {"train_loss": -27.22767448425293, "global_step": 465766, "epoch": 5611} {"train_loss": -27.191198348999023, "global_step": 465767, "epoch": 5611} {"train_loss": -27.363788604736328, "global_step": 465768, "epoch": 5611} {"train_loss": -27.41946792602539, "global_step": 465769, "epoch": 5611} {"train_loss": -27.022418975830078, "global_step": 465770, "epoch": 5611} {"train_loss": -27.477476119995117, "global_step": 465771, "epoch": 5611} {"train_loss": -27.401885986328125, "global_step": 465772, "epoch": 5611} {"train_loss": -27.572851181030273, "global_step": 465773, "epoch": 5611} {"train_loss": -27.326248168945312, "global_step": 465774, "epoch": 5611} {"train_loss": -27.563512802124023, "global_step": 465775, "epoch": 5611} {"train_loss": -26.7943115234375, "global_step": 465776, "epoch": 5611} {"train_loss": -27.193206787109375, "global_step": 465777, "epoch": 5611} {"train_loss": -27.190814971923828, "global_step": 465778, "epoch": 5611} {"train_loss": -27.512073516845703, "global_step": 465779, "epoch": 5611} {"train_loss": -27.333572387695312, "global_step": 465780, "epoch": 5611} {"train_loss": -27.425521850585938, "global_step": 465781, "epoch": 5611} {"train_loss": -27.199743270874023, "global_step": 465782, "epoch": 5611} {"train_loss": -26.875431060791016, "global_step": 465783, "epoch": 5611} {"train_loss": -27.900800704956055, "global_step": 465784, "epoch": 5611} {"train_loss": -27.202865600585938, "global_step": 465785, "epoch": 5611} {"train_loss": -27.12489128112793, "global_step": 465786, "epoch": 5611} {"train_loss": -26.93670654296875, "global_step": 465787, "epoch": 5611} {"train_loss": -27.078460693359375, "global_step": 465788, "epoch": 5611} {"train_loss": -27.368566513061523, "global_step": 465789, "epoch": 5611} {"train_loss": -27.346439361572266, "global_step": 465790, "epoch": 5611} {"train_loss": -27.322546005249023, "global_step": 465791, "epoch": 5611} {"train_loss": -26.77338981628418, "global_step": 465792, "epoch": 5611} {"train_loss": -26.7376651763916, "global_step": 465793, "epoch": 5611} {"train_loss": -26.961645126342773, "global_step": 465794, "epoch": 5611} {"train_loss": -26.998937032308923, "global_step": 465795, "epoch": 5611, "val_loss": 6551854.0} {"train_loss": -25.63007926940918, "global_step": 465796, "epoch": 5612} {"train_loss": -25.29974365234375, "global_step": 465797, "epoch": 5612} {"train_loss": -26.14206314086914, "global_step": 465798, "epoch": 5612} {"train_loss": -25.481969833374023, "global_step": 465799, "epoch": 5612} {"train_loss": -26.214563369750977, "global_step": 465800, "epoch": 5612} {"train_loss": -26.239288330078125, "global_step": 465801, "epoch": 5612} {"train_loss": -25.987903594970703, "global_step": 465802, "epoch": 5612} {"train_loss": -26.507028579711914, "global_step": 465803, "epoch": 5612} {"train_loss": -26.373300552368164, "global_step": 465804, "epoch": 5612} {"train_loss": -26.257959365844727, "global_step": 465805, "epoch": 5612} {"train_loss": -26.39706802368164, "global_step": 465806, "epoch": 5612} {"train_loss": -26.52252197265625, "global_step": 465807, "epoch": 5612} {"train_loss": -26.32782554626465, "global_step": 465808, "epoch": 5612} {"train_loss": -26.76079750061035, "global_step": 465809, "epoch": 5612} {"train_loss": -26.881677627563477, "global_step": 465810, "epoch": 5612} {"train_loss": -26.668720245361328, "global_step": 465811, "epoch": 5612} {"train_loss": -26.55702018737793, "global_step": 465812, "epoch": 5612} {"train_loss": -27.02433204650879, "global_step": 465813, "epoch": 5612} {"train_loss": -26.762378692626953, "global_step": 465814, "epoch": 5612} {"train_loss": -26.766321182250977, "global_step": 465815, "epoch": 5612} {"train_loss": -26.678003311157227, "global_step": 465816, "epoch": 5612} {"train_loss": -26.88239097595215, "global_step": 465817, "epoch": 5612} {"train_loss": -27.008163452148438, "global_step": 465818, "epoch": 5612} {"train_loss": -26.79085350036621, "global_step": 465819, "epoch": 5612} {"train_loss": -27.092451095581055, "global_step": 465820, "epoch": 5612} {"train_loss": -26.813501358032227, "global_step": 465821, "epoch": 5612} {"train_loss": -27.22263526916504, "global_step": 465822, "epoch": 5612} {"train_loss": -27.036279678344727, "global_step": 465823, "epoch": 5612} {"train_loss": -27.201129913330078, "global_step": 465824, "epoch": 5612} {"train_loss": -26.908283233642578, "global_step": 465825, "epoch": 5612} {"train_loss": -27.458581924438477, "global_step": 465826, "epoch": 5612} {"train_loss": -27.261640548706055, "global_step": 465827, "epoch": 5612} {"train_loss": -26.85066795349121, "global_step": 465828, "epoch": 5612} {"train_loss": -27.161380767822266, "global_step": 465829, "epoch": 5612} {"train_loss": -27.265811920166016, "global_step": 465830, "epoch": 5612} {"train_loss": -27.555810928344727, "global_step": 465831, "epoch": 5612} {"train_loss": -27.0765438079834, "global_step": 465832, "epoch": 5612} {"train_loss": -27.628339767456055, "global_step": 465833, "epoch": 5612} {"train_loss": -27.387287139892578, "global_step": 465834, "epoch": 5612} {"train_loss": -27.072412490844727, "global_step": 465835, "epoch": 5612} {"train_loss": -27.358972549438477, "global_step": 465836, "epoch": 5612} {"train_loss": -27.178607940673828, "global_step": 465837, "epoch": 5612} {"train_loss": -27.212167739868164, "global_step": 465838, "epoch": 5612} {"train_loss": -27.484594345092773, "global_step": 465839, "epoch": 5612} {"train_loss": -27.493738174438477, "global_step": 465840, "epoch": 5612} {"train_loss": -27.214975357055664, "global_step": 465841, "epoch": 5612} {"train_loss": -27.128698348999023, "global_step": 465842, "epoch": 5612} {"train_loss": -26.9619197845459, "global_step": 465843, "epoch": 5612} {"train_loss": -27.227161407470703, "global_step": 465844, "epoch": 5612} {"train_loss": -26.837554931640625, "global_step": 465845, "epoch": 5612} {"train_loss": -26.365955352783203, "global_step": 465846, "epoch": 5612} {"train_loss": -27.511932373046875, "global_step": 465847, "epoch": 5612} {"train_loss": -27.179443359375, "global_step": 465848, "epoch": 5612} {"train_loss": -27.028303146362305, "global_step": 465849, "epoch": 5612} {"train_loss": -27.183740615844727, "global_step": 465850, "epoch": 5612} {"train_loss": -27.33107566833496, "global_step": 465851, "epoch": 5612} {"train_loss": -27.298828125, "global_step": 465852, "epoch": 5612} {"train_loss": -27.00013542175293, "global_step": 465853, "epoch": 5612} {"train_loss": -27.225727081298828, "global_step": 465854, "epoch": 5612} {"train_loss": -26.881677627563477, "global_step": 465855, "epoch": 5612} {"train_loss": -27.443174362182617, "global_step": 465856, "epoch": 5612} {"train_loss": -26.836612701416016, "global_step": 465857, "epoch": 5612} {"train_loss": -26.738672256469727, "global_step": 465858, "epoch": 5612} {"train_loss": -26.561185836791992, "global_step": 465859, "epoch": 5612} {"train_loss": -26.314453125, "global_step": 465860, "epoch": 5612} {"train_loss": -26.363754272460938, "global_step": 465861, "epoch": 5612} {"train_loss": -27.016443252563477, "global_step": 465862, "epoch": 5612} {"train_loss": -26.550312042236328, "global_step": 465863, "epoch": 5612} {"train_loss": -26.946874618530273, "global_step": 465864, "epoch": 5612} {"train_loss": -27.008350372314453, "global_step": 465865, "epoch": 5612} {"train_loss": -26.67840576171875, "global_step": 465866, "epoch": 5612} {"train_loss": -27.326932907104492, "global_step": 465867, "epoch": 5612} {"train_loss": -26.49043083190918, "global_step": 465868, "epoch": 5612} {"train_loss": -27.144750595092773, "global_step": 465869, "epoch": 5612} {"train_loss": -26.994123458862305, "global_step": 465870, "epoch": 5612} {"train_loss": -26.953357696533203, "global_step": 465871, "epoch": 5612} {"train_loss": -26.87032127380371, "global_step": 465872, "epoch": 5612} {"train_loss": -26.881357192993164, "global_step": 465873, "epoch": 5612} {"train_loss": -27.127655029296875, "global_step": 465874, "epoch": 5612} {"train_loss": -27.027402877807617, "global_step": 465875, "epoch": 5612} {"train_loss": -27.315027236938477, "global_step": 465876, "epoch": 5612} {"train_loss": -27.033329010009766, "global_step": 465877, "epoch": 5612} {"train_loss": -26.87429972729051, "global_step": 465878, "epoch": 5612, "val_loss": 6600351.0} {"train_loss": -27.132715225219727, "global_step": 465879, "epoch": 5613} {"train_loss": -26.911090850830078, "global_step": 465880, "epoch": 5613} {"train_loss": -27.2688045501709, "global_step": 465881, "epoch": 5613} {"train_loss": -27.168798446655273, "global_step": 465882, "epoch": 5613} {"train_loss": -26.608030319213867, "global_step": 465883, "epoch": 5613} {"train_loss": -26.891218185424805, "global_step": 465884, "epoch": 5613} {"train_loss": -26.74786376953125, "global_step": 465885, "epoch": 5613} {"train_loss": -26.81330680847168, "global_step": 465886, "epoch": 5613} {"train_loss": -27.465330123901367, "global_step": 465887, "epoch": 5613} {"train_loss": -27.157438278198242, "global_step": 465888, "epoch": 5613} {"train_loss": -27.270496368408203, "global_step": 465889, "epoch": 5613} {"train_loss": -26.94040298461914, "global_step": 465890, "epoch": 5613} {"train_loss": -26.992353439331055, "global_step": 465891, "epoch": 5613} {"train_loss": -27.23927116394043, "global_step": 465892, "epoch": 5613} {"train_loss": -27.45680809020996, "global_step": 465893, "epoch": 5613} {"train_loss": -27.17824363708496, "global_step": 465894, "epoch": 5613} {"train_loss": -27.284408569335938, "global_step": 465895, "epoch": 5613} {"train_loss": -27.14179801940918, "global_step": 465896, "epoch": 5613} {"train_loss": -27.332300186157227, "global_step": 465897, "epoch": 5613} {"train_loss": -27.42396354675293, "global_step": 465898, "epoch": 5613} {"train_loss": -27.0849552154541, "global_step": 465899, "epoch": 5613} {"train_loss": -26.85858726501465, "global_step": 465900, "epoch": 5613} {"train_loss": -26.861143112182617, "global_step": 465901, "epoch": 5613} {"train_loss": -27.286893844604492, "global_step": 465902, "epoch": 5613} {"train_loss": -26.963302612304688, "global_step": 465903, "epoch": 5613} {"train_loss": -27.247482299804688, "global_step": 465904, "epoch": 5613} {"train_loss": -27.123632431030273, "global_step": 465905, "epoch": 5613} {"train_loss": -27.17598533630371, "global_step": 465906, "epoch": 5613} {"train_loss": -26.90662956237793, "global_step": 465907, "epoch": 5613} {"train_loss": -26.778751373291016, "global_step": 465908, "epoch": 5613} {"train_loss": -27.333337783813477, "global_step": 465909, "epoch": 5613} {"train_loss": -27.008182525634766, "global_step": 465910, "epoch": 5613} {"train_loss": -27.153095245361328, "global_step": 465911, "epoch": 5613} {"train_loss": -26.560760498046875, "global_step": 465912, "epoch": 5613} {"train_loss": -27.046924591064453, "global_step": 465913, "epoch": 5613} {"train_loss": -27.1705322265625, "global_step": 465914, "epoch": 5613} {"train_loss": -26.8704833984375, "global_step": 465915, "epoch": 5613} {"train_loss": -27.204071044921875, "global_step": 465916, "epoch": 5613} {"train_loss": -27.0833797454834, "global_step": 465917, "epoch": 5613} {"train_loss": -27.07598304748535, "global_step": 465918, "epoch": 5613} {"train_loss": -26.831226348876953, "global_step": 465919, "epoch": 5613} {"train_loss": -27.203022003173828, "global_step": 465920, "epoch": 5613} {"train_loss": -27.047657012939453, "global_step": 465921, "epoch": 5613} {"train_loss": -27.18397331237793, "global_step": 465922, "epoch": 5613} {"train_loss": -27.316938400268555, "global_step": 465923, "epoch": 5613} {"train_loss": -27.096954345703125, "global_step": 465924, "epoch": 5613} {"train_loss": -27.23261070251465, "global_step": 465925, "epoch": 5613} {"train_loss": -27.133289337158203, "global_step": 465926, "epoch": 5613} {"train_loss": -27.19819450378418, "global_step": 465927, "epoch": 5613} {"train_loss": -27.393545150756836, "global_step": 465928, "epoch": 5613} {"train_loss": -27.058887481689453, "global_step": 465929, "epoch": 5613} {"train_loss": -27.192230224609375, "global_step": 465930, "epoch": 5613} {"train_loss": -26.90923500061035, "global_step": 465931, "epoch": 5613} {"train_loss": -27.051288604736328, "global_step": 465932, "epoch": 5613} {"train_loss": -27.30122947692871, "global_step": 465933, "epoch": 5613} {"train_loss": -27.07160758972168, "global_step": 465934, "epoch": 5613} {"train_loss": -26.8931827545166, "global_step": 465935, "epoch": 5613} {"train_loss": -27.08143424987793, "global_step": 465936, "epoch": 5613} {"train_loss": -27.025909423828125, "global_step": 465937, "epoch": 5613} {"train_loss": -27.270414352416992, "global_step": 465938, "epoch": 5613} {"train_loss": -27.319379806518555, "global_step": 465939, "epoch": 5613} {"train_loss": -26.96845817565918, "global_step": 465940, "epoch": 5613} {"train_loss": -26.7908992767334, "global_step": 465941, "epoch": 5613} {"train_loss": -26.999975204467773, "global_step": 465942, "epoch": 5613} {"train_loss": -27.191526412963867, "global_step": 465943, "epoch": 5613} {"train_loss": -27.464941024780273, "global_step": 465944, "epoch": 5613} {"train_loss": -26.684402465820312, "global_step": 465945, "epoch": 5613} {"train_loss": -27.341754913330078, "global_step": 465946, "epoch": 5613} {"train_loss": -27.187284469604492, "global_step": 465947, "epoch": 5613} {"train_loss": -27.452356338500977, "global_step": 465948, "epoch": 5613} {"train_loss": -27.19913673400879, "global_step": 465949, "epoch": 5613} {"train_loss": -27.397626876831055, "global_step": 465950, "epoch": 5613} {"train_loss": -27.260522842407227, "global_step": 465951, "epoch": 5613} {"train_loss": -27.448415756225586, "global_step": 465952, "epoch": 5613} {"train_loss": -26.95880126953125, "global_step": 465953, "epoch": 5613} {"train_loss": -27.31721305847168, "global_step": 465954, "epoch": 5613} {"train_loss": -26.75424575805664, "global_step": 465955, "epoch": 5613} {"train_loss": -26.9462947845459, "global_step": 465956, "epoch": 5613} {"train_loss": -27.468652725219727, "global_step": 465957, "epoch": 5613} {"train_loss": -27.092212677001953, "global_step": 465958, "epoch": 5613} {"train_loss": -26.966217041015625, "global_step": 465959, "epoch": 5613} {"train_loss": -26.789188385009766, "global_step": 465960, "epoch": 5613} {"train_loss": -27.119910389544017, "global_step": 465961, "epoch": 5613, "val_loss": 6567329.0} {"train_loss": -25.666711807250977, "global_step": 465962, "epoch": 5614} {"train_loss": -25.261343002319336, "global_step": 465963, "epoch": 5614} {"train_loss": -26.024869918823242, "global_step": 465964, "epoch": 5614} {"train_loss": -26.172815322875977, "global_step": 465965, "epoch": 5614} {"train_loss": -26.55829429626465, "global_step": 465966, "epoch": 5614} {"train_loss": -26.629316329956055, "global_step": 465967, "epoch": 5614} {"train_loss": -26.54559326171875, "global_step": 465968, "epoch": 5614} {"train_loss": -26.511762619018555, "global_step": 465969, "epoch": 5614} {"train_loss": -26.32177734375, "global_step": 465970, "epoch": 5614} {"train_loss": -26.572046279907227, "global_step": 465971, "epoch": 5614} {"train_loss": -26.58770179748535, "global_step": 465972, "epoch": 5614} {"train_loss": -26.59136962890625, "global_step": 465973, "epoch": 5614} {"train_loss": -26.62869644165039, "global_step": 465974, "epoch": 5614} {"train_loss": -26.525659561157227, "global_step": 465975, "epoch": 5614} {"train_loss": -26.90118980407715, "global_step": 465976, "epoch": 5614} {"train_loss": -26.74399757385254, "global_step": 465977, "epoch": 5614} {"train_loss": -26.460865020751953, "global_step": 465978, "epoch": 5614} {"train_loss": -26.973651885986328, "global_step": 465979, "epoch": 5614} {"train_loss": -26.67425537109375, "global_step": 465980, "epoch": 5614} {"train_loss": -26.672372817993164, "global_step": 465981, "epoch": 5614} {"train_loss": -26.698089599609375, "global_step": 465982, "epoch": 5614} {"train_loss": -27.048242568969727, "global_step": 465983, "epoch": 5614} {"train_loss": -26.759668350219727, "global_step": 465984, "epoch": 5614} {"train_loss": -26.93926429748535, "global_step": 465985, "epoch": 5614} {"train_loss": -27.0054931640625, "global_step": 465986, "epoch": 5614} {"train_loss": -27.05378532409668, "global_step": 465987, "epoch": 5614} {"train_loss": -26.91843032836914, "global_step": 465988, "epoch": 5614} {"train_loss": -26.9691219329834, "global_step": 465989, "epoch": 5614} {"train_loss": -26.8784236907959, "global_step": 465990, "epoch": 5614} {"train_loss": -27.203550338745117, "global_step": 465991, "epoch": 5614} {"train_loss": -27.610326766967773, "global_step": 465992, "epoch": 5614} {"train_loss": -27.05305290222168, "global_step": 465993, "epoch": 5614} {"train_loss": -27.342300415039062, "global_step": 465994, "epoch": 5614} {"train_loss": -27.119970321655273, "global_step": 465995, "epoch": 5614} {"train_loss": -27.011133193969727, "global_step": 465996, "epoch": 5614} {"train_loss": -27.055139541625977, "global_step": 465997, "epoch": 5614} {"train_loss": -27.23370933532715, "global_step": 465998, "epoch": 5614} {"train_loss": -27.027013778686523, "global_step": 465999, "epoch": 5614} {"train_loss": -27.016010284423828, "global_step": 466000, "epoch": 5614} {"train_loss": -27.146820068359375, "global_step": 466001, "epoch": 5614} {"train_loss": -27.07606315612793, "global_step": 466002, "epoch": 5614} {"train_loss": -26.90277671813965, "global_step": 466003, "epoch": 5614} {"train_loss": -27.034543991088867, "global_step": 466004, "epoch": 5614} {"train_loss": -27.28726577758789, "global_step": 466005, "epoch": 5614} {"train_loss": -27.1650390625, "global_step": 466006, "epoch": 5614} {"train_loss": -27.27849769592285, "global_step": 466007, "epoch": 5614} {"train_loss": -27.178308486938477, "global_step": 466008, "epoch": 5614} {"train_loss": -27.480863571166992, "global_step": 466009, "epoch": 5614} {"train_loss": -27.364294052124023, "global_step": 466010, "epoch": 5614} {"train_loss": -27.132165908813477, "global_step": 466011, "epoch": 5614} {"train_loss": -26.9234676361084, "global_step": 466012, "epoch": 5614} {"train_loss": -27.29853630065918, "global_step": 466013, "epoch": 5614} {"train_loss": -27.210474014282227, "global_step": 466014, "epoch": 5614} {"train_loss": -27.147321701049805, "global_step": 466015, "epoch": 5614} {"train_loss": -26.986347198486328, "global_step": 466016, "epoch": 5614} {"train_loss": -27.411041259765625, "global_step": 466017, "epoch": 5614} {"train_loss": -27.409061431884766, "global_step": 466018, "epoch": 5614} {"train_loss": -26.862594604492188, "global_step": 466019, "epoch": 5614} {"train_loss": -27.266263961791992, "global_step": 466020, "epoch": 5614} {"train_loss": -27.37421989440918, "global_step": 466021, "epoch": 5614} {"train_loss": -27.224353790283203, "global_step": 466022, "epoch": 5614} {"train_loss": -27.10975456237793, "global_step": 466023, "epoch": 5614} {"train_loss": -27.47305679321289, "global_step": 466024, "epoch": 5614} {"train_loss": -27.36419105529785, "global_step": 466025, "epoch": 5614} {"train_loss": -27.155899047851562, "global_step": 466026, "epoch": 5614} {"train_loss": -26.904096603393555, "global_step": 466027, "epoch": 5614} {"train_loss": -27.382415771484375, "global_step": 466028, "epoch": 5614} {"train_loss": -27.52278709411621, "global_step": 466029, "epoch": 5614} {"train_loss": -27.375640869140625, "global_step": 466030, "epoch": 5614} {"train_loss": -27.3721981048584, "global_step": 466031, "epoch": 5614} {"train_loss": -27.009765625, "global_step": 466032, "epoch": 5614} {"train_loss": -27.296117782592773, "global_step": 466033, "epoch": 5614} {"train_loss": -27.131977081298828, "global_step": 466034, "epoch": 5614} {"train_loss": -27.156980514526367, "global_step": 466035, "epoch": 5614} {"train_loss": -27.0513916015625, "global_step": 466036, "epoch": 5614} {"train_loss": -26.8204402923584, "global_step": 466037, "epoch": 5614} {"train_loss": -27.233240127563477, "global_step": 466038, "epoch": 5614} {"train_loss": -27.508466720581055, "global_step": 466039, "epoch": 5614} {"train_loss": -26.745206832885742, "global_step": 466040, "epoch": 5614} {"train_loss": -26.843978881835938, "global_step": 466041, "epoch": 5614} {"train_loss": -27.696897506713867, "global_step": 466042, "epoch": 5614} {"train_loss": -27.142797470092773, "global_step": 466043, "epoch": 5614} {"train_loss": -26.963351605886437, "global_step": 466044, "epoch": 5614, "val_loss": 6510340.5} {"train_loss": -26.33637809753418, "global_step": 466045, "epoch": 5615} {"train_loss": -26.309680938720703, "global_step": 466046, "epoch": 5615} {"train_loss": -26.536100387573242, "global_step": 466047, "epoch": 5615} {"train_loss": -26.4072265625, "global_step": 466048, "epoch": 5615} {"train_loss": -26.362720489501953, "global_step": 466049, "epoch": 5615} {"train_loss": -26.65797233581543, "global_step": 466050, "epoch": 5615} {"train_loss": -26.499425888061523, "global_step": 466051, "epoch": 5615} {"train_loss": -26.679977416992188, "global_step": 466052, "epoch": 5615} {"train_loss": -26.835371017456055, "global_step": 466053, "epoch": 5615} {"train_loss": -26.97467613220215, "global_step": 466054, "epoch": 5615} {"train_loss": -26.702228546142578, "global_step": 466055, "epoch": 5615} {"train_loss": -26.9698486328125, "global_step": 466056, "epoch": 5615} {"train_loss": -27.058826446533203, "global_step": 466057, "epoch": 5615} {"train_loss": -26.830810546875, "global_step": 466058, "epoch": 5615} {"train_loss": -26.421772003173828, "global_step": 466059, "epoch": 5615} {"train_loss": -26.921340942382812, "global_step": 466060, "epoch": 5615} {"train_loss": -26.825958251953125, "global_step": 466061, "epoch": 5615} {"train_loss": -27.25484275817871, "global_step": 466062, "epoch": 5615} {"train_loss": -26.713184356689453, "global_step": 466063, "epoch": 5615} {"train_loss": -27.041004180908203, "global_step": 466064, "epoch": 5615} {"train_loss": -27.016096115112305, "global_step": 466065, "epoch": 5615} {"train_loss": -27.19411277770996, "global_step": 466066, "epoch": 5615} {"train_loss": -26.705036163330078, "global_step": 466067, "epoch": 5615} {"train_loss": -26.986188888549805, "global_step": 466068, "epoch": 5615} {"train_loss": -26.656339645385742, "global_step": 466069, "epoch": 5615} {"train_loss": -27.32008171081543, "global_step": 466070, "epoch": 5615} {"train_loss": -27.3021297454834, "global_step": 466071, "epoch": 5615} {"train_loss": -27.153589248657227, "global_step": 466072, "epoch": 5615} {"train_loss": -26.8772029876709, "global_step": 466073, "epoch": 5615} {"train_loss": -27.40826988220215, "global_step": 466074, "epoch": 5615} {"train_loss": -26.971027374267578, "global_step": 466075, "epoch": 5615} {"train_loss": -27.100324630737305, "global_step": 466076, "epoch": 5615} {"train_loss": -27.037704467773438, "global_step": 466077, "epoch": 5615} {"train_loss": -27.356613159179688, "global_step": 466078, "epoch": 5615} {"train_loss": -27.337890625, "global_step": 466079, "epoch": 5615} {"train_loss": -27.22589683532715, "global_step": 466080, "epoch": 5615} {"train_loss": -27.552541732788086, "global_step": 466081, "epoch": 5615} {"train_loss": -27.41228675842285, "global_step": 466082, "epoch": 5615} {"train_loss": -27.219696044921875, "global_step": 466083, "epoch": 5615} {"train_loss": -27.408533096313477, "global_step": 466084, "epoch": 5615} {"train_loss": -27.219196319580078, "global_step": 466085, "epoch": 5615} {"train_loss": -27.516983032226562, "global_step": 466086, "epoch": 5615} {"train_loss": -27.26827049255371, "global_step": 466087, "epoch": 5615} {"train_loss": -27.270877838134766, "global_step": 466088, "epoch": 5615} {"train_loss": -27.368778228759766, "global_step": 466089, "epoch": 5615} {"train_loss": -27.14564323425293, "global_step": 466090, "epoch": 5615} {"train_loss": -27.077667236328125, "global_step": 466091, "epoch": 5615} {"train_loss": -26.88347816467285, "global_step": 466092, "epoch": 5615} {"train_loss": -27.0822811126709, "global_step": 466093, "epoch": 5615} {"train_loss": -27.575422286987305, "global_step": 466094, "epoch": 5615} {"train_loss": -26.936674118041992, "global_step": 466095, "epoch": 5615} {"train_loss": -27.142242431640625, "global_step": 466096, "epoch": 5615} {"train_loss": -26.982421875, "global_step": 466097, "epoch": 5615} {"train_loss": -27.07602310180664, "global_step": 466098, "epoch": 5615} {"train_loss": -27.289093017578125, "global_step": 466099, "epoch": 5615} {"train_loss": -27.044614791870117, "global_step": 466100, "epoch": 5615} {"train_loss": -27.12748146057129, "global_step": 466101, "epoch": 5615} {"train_loss": -27.172094345092773, "global_step": 466102, "epoch": 5615} {"train_loss": -27.352252960205078, "global_step": 466103, "epoch": 5615} {"train_loss": -27.422088623046875, "global_step": 466104, "epoch": 5615} {"train_loss": -27.237905502319336, "global_step": 466105, "epoch": 5615} {"train_loss": -27.27046775817871, "global_step": 466106, "epoch": 5615} {"train_loss": -27.357547760009766, "global_step": 466107, "epoch": 5615} {"train_loss": -27.52435874938965, "global_step": 466108, "epoch": 5615} {"train_loss": -27.585790634155273, "global_step": 466109, "epoch": 5615} {"train_loss": -27.487707138061523, "global_step": 466110, "epoch": 5615} {"train_loss": -27.190576553344727, "global_step": 466111, "epoch": 5615} {"train_loss": -27.434635162353516, "global_step": 466112, "epoch": 5615} {"train_loss": -27.1838436126709, "global_step": 466113, "epoch": 5615} {"train_loss": -26.867359161376953, "global_step": 466114, "epoch": 5615} {"train_loss": -26.526325225830078, "global_step": 466115, "epoch": 5615} {"train_loss": -25.76595115661621, "global_step": 466116, "epoch": 5615} {"train_loss": -26.497119903564453, "global_step": 466117, "epoch": 5615} {"train_loss": -26.383869171142578, "global_step": 466118, "epoch": 5615} {"train_loss": -25.45777702331543, "global_step": 466119, "epoch": 5615} {"train_loss": -26.17306900024414, "global_step": 466120, "epoch": 5615} {"train_loss": -26.762948989868164, "global_step": 466121, "epoch": 5615} {"train_loss": -26.10904884338379, "global_step": 466122, "epoch": 5615} {"train_loss": -26.5594425201416, "global_step": 466123, "epoch": 5615} {"train_loss": -26.787382125854492, "global_step": 466124, "epoch": 5615} {"train_loss": -26.2604923248291, "global_step": 466125, "epoch": 5615} {"train_loss": -26.2885799407959, "global_step": 466126, "epoch": 5615} {"train_loss": -26.976198839854046, "global_step": 466127, "epoch": 5615, "val_loss": 6450674.5} {"train_loss": -25.482038497924805, "global_step": 466128, "epoch": 5616} {"train_loss": -26.49757957458496, "global_step": 466129, "epoch": 5616} {"train_loss": -25.66568946838379, "global_step": 466130, "epoch": 5616} {"train_loss": -26.377416610717773, "global_step": 466131, "epoch": 5616} {"train_loss": -25.68536949157715, "global_step": 466132, "epoch": 5616} {"train_loss": -26.190460205078125, "global_step": 466133, "epoch": 5616} {"train_loss": -25.711069107055664, "global_step": 466134, "epoch": 5616} {"train_loss": -26.481855392456055, "global_step": 466135, "epoch": 5616} {"train_loss": -26.306900024414062, "global_step": 466136, "epoch": 5616} {"train_loss": -25.962621688842773, "global_step": 466137, "epoch": 5616} {"train_loss": -26.1745662689209, "global_step": 466138, "epoch": 5616} {"train_loss": -26.492874145507812, "global_step": 466139, "epoch": 5616} {"train_loss": -26.437788009643555, "global_step": 466140, "epoch": 5616} {"train_loss": -26.535205841064453, "global_step": 466141, "epoch": 5616} {"train_loss": -26.61220359802246, "global_step": 466142, "epoch": 5616} {"train_loss": -26.482770919799805, "global_step": 466143, "epoch": 5616} {"train_loss": -26.447946548461914, "global_step": 466144, "epoch": 5616} {"train_loss": -26.56403923034668, "global_step": 466145, "epoch": 5616} {"train_loss": -26.895017623901367, "global_step": 466146, "epoch": 5616} {"train_loss": -26.39898681640625, "global_step": 466147, "epoch": 5616} {"train_loss": -26.426956176757812, "global_step": 466148, "epoch": 5616} {"train_loss": -26.703954696655273, "global_step": 466149, "epoch": 5616} {"train_loss": -26.52747917175293, "global_step": 466150, "epoch": 5616} {"train_loss": -26.818714141845703, "global_step": 466151, "epoch": 5616} {"train_loss": -26.825468063354492, "global_step": 466152, "epoch": 5616} {"train_loss": -26.820585250854492, "global_step": 466153, "epoch": 5616} {"train_loss": -26.680572509765625, "global_step": 466154, "epoch": 5616} {"train_loss": -27.037839889526367, "global_step": 466155, "epoch": 5616} {"train_loss": -26.793258666992188, "global_step": 466156, "epoch": 5616} {"train_loss": -26.71474266052246, "global_step": 466157, "epoch": 5616} {"train_loss": -26.748767852783203, "global_step": 466158, "epoch": 5616} {"train_loss": -27.053619384765625, "global_step": 466159, "epoch": 5616} {"train_loss": -27.385461807250977, "global_step": 466160, "epoch": 5616} {"train_loss": -27.168500900268555, "global_step": 466161, "epoch": 5616} {"train_loss": -27.37689208984375, "global_step": 466162, "epoch": 5616} {"train_loss": -26.974512100219727, "global_step": 466163, "epoch": 5616} {"train_loss": -26.964630126953125, "global_step": 466164, "epoch": 5616} {"train_loss": -27.31267738342285, "global_step": 466165, "epoch": 5616} {"train_loss": -26.8481388092041, "global_step": 466166, "epoch": 5616} {"train_loss": -26.995405197143555, "global_step": 466167, "epoch": 5616} {"train_loss": -27.1734676361084, "global_step": 466168, "epoch": 5616} {"train_loss": -26.98829460144043, "global_step": 466169, "epoch": 5616} {"train_loss": -26.972126007080078, "global_step": 466170, "epoch": 5616} {"train_loss": -27.077198028564453, "global_step": 466171, "epoch": 5616} {"train_loss": -27.07061767578125, "global_step": 466172, "epoch": 5616} {"train_loss": -27.121549606323242, "global_step": 466173, "epoch": 5616} {"train_loss": -27.50357437133789, "global_step": 466174, "epoch": 5616} {"train_loss": -27.332305908203125, "global_step": 466175, "epoch": 5616} {"train_loss": -27.355207443237305, "global_step": 466176, "epoch": 5616} {"train_loss": -26.95831871032715, "global_step": 466177, "epoch": 5616} {"train_loss": -27.119979858398438, "global_step": 466178, "epoch": 5616} {"train_loss": -27.17732048034668, "global_step": 466179, "epoch": 5616} {"train_loss": -27.417158126831055, "global_step": 466180, "epoch": 5616} {"train_loss": -27.06330680847168, "global_step": 466181, "epoch": 5616} {"train_loss": -27.130483627319336, "global_step": 466182, "epoch": 5616} {"train_loss": -27.953718185424805, "global_step": 466183, "epoch": 5616} {"train_loss": -27.27308464050293, "global_step": 466184, "epoch": 5616} {"train_loss": -27.359619140625, "global_step": 466185, "epoch": 5616} {"train_loss": -27.780426025390625, "global_step": 466186, "epoch": 5616} {"train_loss": -27.181543350219727, "global_step": 466187, "epoch": 5616} {"train_loss": -27.461618423461914, "global_step": 466188, "epoch": 5616} {"train_loss": -27.59198570251465, "global_step": 466189, "epoch": 5616} {"train_loss": -27.567167282104492, "global_step": 466190, "epoch": 5616} {"train_loss": -27.283437728881836, "global_step": 466191, "epoch": 5616} {"train_loss": -27.436447143554688, "global_step": 466192, "epoch": 5616} {"train_loss": -27.05719566345215, "global_step": 466193, "epoch": 5616} {"train_loss": -27.259260177612305, "global_step": 466194, "epoch": 5616} {"train_loss": -26.60589599609375, "global_step": 466195, "epoch": 5616} {"train_loss": -26.660242080688477, "global_step": 466196, "epoch": 5616} {"train_loss": -26.977598190307617, "global_step": 466197, "epoch": 5616} {"train_loss": -26.318456649780273, "global_step": 466198, "epoch": 5616} {"train_loss": -26.860904693603516, "global_step": 466199, "epoch": 5616} {"train_loss": -26.892765045166016, "global_step": 466200, "epoch": 5616} {"train_loss": -27.383392333984375, "global_step": 466201, "epoch": 5616} {"train_loss": -26.556421279907227, "global_step": 466202, "epoch": 5616} {"train_loss": -27.132980346679688, "global_step": 466203, "epoch": 5616} {"train_loss": -27.00079345703125, "global_step": 466204, "epoch": 5616} {"train_loss": -26.954498291015625, "global_step": 466205, "epoch": 5616} {"train_loss": -27.074268341064453, "global_step": 466206, "epoch": 5616} {"train_loss": -26.9118709564209, "global_step": 466207, "epoch": 5616} {"train_loss": -26.75416374206543, "global_step": 466208, "epoch": 5616} {"train_loss": -26.874755859375, "global_step": 466209, "epoch": 5616} {"train_loss": -26.862684755440217, "global_step": 466210, "epoch": 5616, "val_loss": 6598684.0} {"train_loss": -26.761550903320312, "global_step": 466211, "epoch": 5617} {"train_loss": -26.088510513305664, "global_step": 466212, "epoch": 5617} {"train_loss": -26.299070358276367, "global_step": 466213, "epoch": 5617} {"train_loss": -26.112964630126953, "global_step": 466214, "epoch": 5617} {"train_loss": -26.4841251373291, "global_step": 466215, "epoch": 5617} {"train_loss": -25.84503746032715, "global_step": 466216, "epoch": 5617} {"train_loss": -26.488330841064453, "global_step": 466217, "epoch": 5617} {"train_loss": -26.591604232788086, "global_step": 466218, "epoch": 5617} {"train_loss": -26.464065551757812, "global_step": 466219, "epoch": 5617} {"train_loss": -26.587905883789062, "global_step": 466220, "epoch": 5617} {"train_loss": -26.817352294921875, "global_step": 466221, "epoch": 5617} {"train_loss": -26.045215606689453, "global_step": 466222, "epoch": 5617} {"train_loss": -26.667932510375977, "global_step": 466223, "epoch": 5617} {"train_loss": -26.52301597595215, "global_step": 466224, "epoch": 5617} {"train_loss": -26.2987117767334, "global_step": 466225, "epoch": 5617} {"train_loss": -26.87576675415039, "global_step": 466226, "epoch": 5617} {"train_loss": -26.720417022705078, "global_step": 466227, "epoch": 5617} {"train_loss": -26.753894805908203, "global_step": 466228, "epoch": 5617} {"train_loss": -26.639524459838867, "global_step": 466229, "epoch": 5617} {"train_loss": -26.422653198242188, "global_step": 466230, "epoch": 5617} {"train_loss": -26.657154083251953, "global_step": 466231, "epoch": 5617} {"train_loss": -26.806076049804688, "global_step": 466232, "epoch": 5617} {"train_loss": -26.887739181518555, "global_step": 466233, "epoch": 5617} {"train_loss": -26.946521759033203, "global_step": 466234, "epoch": 5617} {"train_loss": -26.72621726989746, "global_step": 466235, "epoch": 5617} {"train_loss": -26.95635414123535, "global_step": 466236, "epoch": 5617} {"train_loss": -26.875207901000977, "global_step": 466237, "epoch": 5617} {"train_loss": -26.69427490234375, "global_step": 466238, "epoch": 5617} {"train_loss": -26.633258819580078, "global_step": 466239, "epoch": 5617} {"train_loss": -26.88789939880371, "global_step": 466240, "epoch": 5617} {"train_loss": -26.913593292236328, "global_step": 466241, "epoch": 5617} {"train_loss": -26.940046310424805, "global_step": 466242, "epoch": 5617} {"train_loss": -27.44541358947754, "global_step": 466243, "epoch": 5617} {"train_loss": -27.007131576538086, "global_step": 466244, "epoch": 5617} {"train_loss": -26.970930099487305, "global_step": 466245, "epoch": 5617} {"train_loss": -27.197416305541992, "global_step": 466246, "epoch": 5617} {"train_loss": -27.35110855102539, "global_step": 466247, "epoch": 5617} {"train_loss": -26.919702529907227, "global_step": 466248, "epoch": 5617} {"train_loss": -27.019275665283203, "global_step": 466249, "epoch": 5617} {"train_loss": -27.1331844329834, "global_step": 466250, "epoch": 5617} {"train_loss": -27.093738555908203, "global_step": 466251, "epoch": 5617} {"train_loss": -27.28287696838379, "global_step": 466252, "epoch": 5617} {"train_loss": -27.11213493347168, "global_step": 466253, "epoch": 5617} {"train_loss": -27.000280380249023, "global_step": 466254, "epoch": 5617} {"train_loss": -27.315509796142578, "global_step": 466255, "epoch": 5617} {"train_loss": -27.6534366607666, "global_step": 466256, "epoch": 5617} {"train_loss": -27.511804580688477, "global_step": 466257, "epoch": 5617} {"train_loss": -27.13296890258789, "global_step": 466258, "epoch": 5617} {"train_loss": -27.449155807495117, "global_step": 466259, "epoch": 5617} {"train_loss": -27.20185661315918, "global_step": 466260, "epoch": 5617} {"train_loss": -27.40286636352539, "global_step": 466261, "epoch": 5617} {"train_loss": -26.911142349243164, "global_step": 466262, "epoch": 5617} {"train_loss": -27.1320858001709, "global_step": 466263, "epoch": 5617} {"train_loss": -27.26279640197754, "global_step": 466264, "epoch": 5617} {"train_loss": -26.93814468383789, "global_step": 466265, "epoch": 5617} {"train_loss": -27.439062118530273, "global_step": 466266, "epoch": 5617} {"train_loss": -27.358917236328125, "global_step": 466267, "epoch": 5617} {"train_loss": -27.230823516845703, "global_step": 466268, "epoch": 5617} {"train_loss": -27.1192626953125, "global_step": 466269, "epoch": 5617} {"train_loss": -27.247400283813477, "global_step": 466270, "epoch": 5617} {"train_loss": -27.123748779296875, "global_step": 466271, "epoch": 5617} {"train_loss": -27.48188591003418, "global_step": 466272, "epoch": 5617} {"train_loss": -26.92779541015625, "global_step": 466273, "epoch": 5617} {"train_loss": -27.058399200439453, "global_step": 466274, "epoch": 5617} {"train_loss": -27.09971046447754, "global_step": 466275, "epoch": 5617} {"train_loss": -27.151586532592773, "global_step": 466276, "epoch": 5617} {"train_loss": -27.190805435180664, "global_step": 466277, "epoch": 5617} {"train_loss": -27.101886749267578, "global_step": 466278, "epoch": 5617} {"train_loss": -27.2300968170166, "global_step": 466279, "epoch": 5617} {"train_loss": -27.6922550201416, "global_step": 466280, "epoch": 5617} {"train_loss": -27.035123825073242, "global_step": 466281, "epoch": 5617} {"train_loss": -27.1307315826416, "global_step": 466282, "epoch": 5617} {"train_loss": -27.121374130249023, "global_step": 466283, "epoch": 5617} {"train_loss": -27.26234245300293, "global_step": 466284, "epoch": 5617} {"train_loss": -27.289087295532227, "global_step": 466285, "epoch": 5617} {"train_loss": -27.17830467224121, "global_step": 466286, "epoch": 5617} {"train_loss": -27.69500160217285, "global_step": 466287, "epoch": 5617} {"train_loss": -27.148462295532227, "global_step": 466288, "epoch": 5617} {"train_loss": -27.371885299682617, "global_step": 466289, "epoch": 5617} {"train_loss": -27.36576271057129, "global_step": 466290, "epoch": 5617} {"train_loss": -27.111743927001953, "global_step": 466291, "epoch": 5617} {"train_loss": -27.61884117126465, "global_step": 466292, "epoch": 5617} {"train_loss": -26.989209186599915, "global_step": 466293, "epoch": 5617, "val_loss": 6492175.5} {"train_loss": -26.8367919921875, "global_step": 466294, "epoch": 5618} {"train_loss": -26.535633087158203, "global_step": 466295, "epoch": 5618} {"train_loss": -26.31766128540039, "global_step": 466296, "epoch": 5618} {"train_loss": -26.67730712890625, "global_step": 466297, "epoch": 5618} {"train_loss": -25.883398056030273, "global_step": 466298, "epoch": 5618} {"train_loss": -26.724634170532227, "global_step": 466299, "epoch": 5618} {"train_loss": -26.907026290893555, "global_step": 466300, "epoch": 5618} {"train_loss": -26.896106719970703, "global_step": 466301, "epoch": 5618} {"train_loss": -26.92157554626465, "global_step": 466302, "epoch": 5618} {"train_loss": -26.663421630859375, "global_step": 466303, "epoch": 5618} {"train_loss": -26.876760482788086, "global_step": 466304, "epoch": 5618} {"train_loss": -27.072101593017578, "global_step": 466305, "epoch": 5618} {"train_loss": -26.581899642944336, "global_step": 466306, "epoch": 5618} {"train_loss": -27.321638107299805, "global_step": 466307, "epoch": 5618} {"train_loss": -26.982990264892578, "global_step": 466308, "epoch": 5618} {"train_loss": -27.291975021362305, "global_step": 466309, "epoch": 5618} {"train_loss": -26.68061637878418, "global_step": 466310, "epoch": 5618} {"train_loss": -26.844512939453125, "global_step": 466311, "epoch": 5618} {"train_loss": -27.07978630065918, "global_step": 466312, "epoch": 5618} {"train_loss": -27.350128173828125, "global_step": 466313, "epoch": 5618} {"train_loss": -27.094655990600586, "global_step": 466314, "epoch": 5618} {"train_loss": -27.433340072631836, "global_step": 466315, "epoch": 5618} {"train_loss": -27.247663497924805, "global_step": 466316, "epoch": 5618} {"train_loss": -27.132770538330078, "global_step": 466317, "epoch": 5618} {"train_loss": -27.201313018798828, "global_step": 466318, "epoch": 5618} {"train_loss": -27.071847915649414, "global_step": 466319, "epoch": 5618} {"train_loss": -27.1004695892334, "global_step": 466320, "epoch": 5618} {"train_loss": -27.21087074279785, "global_step": 466321, "epoch": 5618} {"train_loss": -27.36324119567871, "global_step": 466322, "epoch": 5618} {"train_loss": -27.4267635345459, "global_step": 466323, "epoch": 5618} {"train_loss": -27.033857345581055, "global_step": 466324, "epoch": 5618} {"train_loss": -27.113431930541992, "global_step": 466325, "epoch": 5618} {"train_loss": -27.294178009033203, "global_step": 466326, "epoch": 5618} {"train_loss": -27.587751388549805, "global_step": 466327, "epoch": 5618} {"train_loss": -26.76630210876465, "global_step": 466328, "epoch": 5618} {"train_loss": -27.330183029174805, "global_step": 466329, "epoch": 5618} {"train_loss": -26.793432235717773, "global_step": 466330, "epoch": 5618} {"train_loss": -27.321889877319336, "global_step": 466331, "epoch": 5618} {"train_loss": -27.53675651550293, "global_step": 466332, "epoch": 5618} {"train_loss": -27.076108932495117, "global_step": 466333, "epoch": 5618} {"train_loss": -27.34991455078125, "global_step": 466334, "epoch": 5618} {"train_loss": -26.98710060119629, "global_step": 466335, "epoch": 5618} {"train_loss": -27.062759399414062, "global_step": 466336, "epoch": 5618} {"train_loss": -27.813201904296875, "global_step": 466337, "epoch": 5618} {"train_loss": -27.116531372070312, "global_step": 466338, "epoch": 5618} {"train_loss": -27.41932487487793, "global_step": 466339, "epoch": 5618} {"train_loss": -27.42822265625, "global_step": 466340, "epoch": 5618} {"train_loss": -26.917020797729492, "global_step": 466341, "epoch": 5618} {"train_loss": -27.223180770874023, "global_step": 466342, "epoch": 5618} {"train_loss": -27.03604507446289, "global_step": 466343, "epoch": 5618} {"train_loss": -27.463916778564453, "global_step": 466344, "epoch": 5618} {"train_loss": -27.620702743530273, "global_step": 466345, "epoch": 5618} {"train_loss": -27.127836227416992, "global_step": 466346, "epoch": 5618} {"train_loss": -26.822860717773438, "global_step": 466347, "epoch": 5618} {"train_loss": -27.384546279907227, "global_step": 466348, "epoch": 5618} {"train_loss": -27.0789737701416, "global_step": 466349, "epoch": 5618} {"train_loss": -27.363122940063477, "global_step": 466350, "epoch": 5618} {"train_loss": -27.3909969329834, "global_step": 466351, "epoch": 5618} {"train_loss": -27.401086807250977, "global_step": 466352, "epoch": 5618} {"train_loss": -27.507476806640625, "global_step": 466353, "epoch": 5618} {"train_loss": -27.064252853393555, "global_step": 466354, "epoch": 5618} {"train_loss": -27.246530532836914, "global_step": 466355, "epoch": 5618} {"train_loss": -27.27095603942871, "global_step": 466356, "epoch": 5618} {"train_loss": -27.2080020904541, "global_step": 466357, "epoch": 5618} {"train_loss": -26.929370880126953, "global_step": 466358, "epoch": 5618} {"train_loss": -27.055042266845703, "global_step": 466359, "epoch": 5618} {"train_loss": -27.07526969909668, "global_step": 466360, "epoch": 5618} {"train_loss": -26.98439598083496, "global_step": 466361, "epoch": 5618} {"train_loss": -27.162809371948242, "global_step": 466362, "epoch": 5618} {"train_loss": -26.828527450561523, "global_step": 466363, "epoch": 5618} {"train_loss": -27.78374671936035, "global_step": 466364, "epoch": 5618} {"train_loss": -26.957340240478516, "global_step": 466365, "epoch": 5618} {"train_loss": -27.11866569519043, "global_step": 466366, "epoch": 5618} {"train_loss": -27.267242431640625, "global_step": 466367, "epoch": 5618} {"train_loss": -27.66303062438965, "global_step": 466368, "epoch": 5618} {"train_loss": -27.021387100219727, "global_step": 466369, "epoch": 5618} {"train_loss": -27.116397857666016, "global_step": 466370, "epoch": 5618} {"train_loss": -27.22251319885254, "global_step": 466371, "epoch": 5618} {"train_loss": -27.342252731323242, "global_step": 466372, "epoch": 5618} {"train_loss": -26.899280548095703, "global_step": 466373, "epoch": 5618} {"train_loss": -27.72113609313965, "global_step": 466374, "epoch": 5618} {"train_loss": -27.149560928344727, "global_step": 466375, "epoch": 5618} {"train_loss": -27.117140482707196, "global_step": 466376, "epoch": 5618, "val_loss": 6596179.0} {"train_loss": -26.39234733581543, "global_step": 466377, "epoch": 5619} {"train_loss": -26.56560707092285, "global_step": 466378, "epoch": 5619} {"train_loss": -26.180438995361328, "global_step": 466379, "epoch": 5619} {"train_loss": -26.674524307250977, "global_step": 466380, "epoch": 5619} {"train_loss": -26.34975242614746, "global_step": 466381, "epoch": 5619} {"train_loss": -26.42391014099121, "global_step": 466382, "epoch": 5619} {"train_loss": -26.4960880279541, "global_step": 466383, "epoch": 5619} {"train_loss": -26.900442123413086, "global_step": 466384, "epoch": 5619} {"train_loss": -26.316028594970703, "global_step": 466385, "epoch": 5619} {"train_loss": -26.875715255737305, "global_step": 466386, "epoch": 5619} {"train_loss": -26.586240768432617, "global_step": 466387, "epoch": 5619} {"train_loss": -26.997833251953125, "global_step": 466388, "epoch": 5619} {"train_loss": -26.316802978515625, "global_step": 466389, "epoch": 5619} {"train_loss": -27.56317138671875, "global_step": 466390, "epoch": 5619} {"train_loss": -26.820127487182617, "global_step": 466391, "epoch": 5619} {"train_loss": -26.924646377563477, "global_step": 466392, "epoch": 5619} {"train_loss": -26.742944717407227, "global_step": 466393, "epoch": 5619} {"train_loss": -26.78667640686035, "global_step": 466394, "epoch": 5619} {"train_loss": -26.725988388061523, "global_step": 466395, "epoch": 5619} {"train_loss": -27.0374755859375, "global_step": 466396, "epoch": 5619} {"train_loss": -26.835906982421875, "global_step": 466397, "epoch": 5619} {"train_loss": -26.805707931518555, "global_step": 466398, "epoch": 5619} {"train_loss": -27.119482040405273, "global_step": 466399, "epoch": 5619} {"train_loss": -26.758642196655273, "global_step": 466400, "epoch": 5619} {"train_loss": -27.215911865234375, "global_step": 466401, "epoch": 5619} {"train_loss": -27.051034927368164, "global_step": 466402, "epoch": 5619} {"train_loss": -27.29532814025879, "global_step": 466403, "epoch": 5619} {"train_loss": -26.96125602722168, "global_step": 466404, "epoch": 5619} {"train_loss": -27.191864013671875, "global_step": 466405, "epoch": 5619} {"train_loss": -26.964269638061523, "global_step": 466406, "epoch": 5619} {"train_loss": -27.265710830688477, "global_step": 466407, "epoch": 5619} {"train_loss": -26.77507972717285, "global_step": 466408, "epoch": 5619} {"train_loss": -27.153736114501953, "global_step": 466409, "epoch": 5619} {"train_loss": -27.351791381835938, "global_step": 466410, "epoch": 5619} {"train_loss": -27.509235382080078, "global_step": 466411, "epoch": 5619} {"train_loss": -26.90889549255371, "global_step": 466412, "epoch": 5619} {"train_loss": -27.21400260925293, "global_step": 466413, "epoch": 5619} {"train_loss": -27.2103214263916, "global_step": 466414, "epoch": 5619} {"train_loss": -27.232013702392578, "global_step": 466415, "epoch": 5619} {"train_loss": -26.90028190612793, "global_step": 466416, "epoch": 5619} {"train_loss": -26.681737899780273, "global_step": 466417, "epoch": 5619} {"train_loss": -27.214797973632812, "global_step": 466418, "epoch": 5619} {"train_loss": -27.189456939697266, "global_step": 466419, "epoch": 5619} {"train_loss": -26.74169921875, "global_step": 466420, "epoch": 5619} {"train_loss": -27.137292861938477, "global_step": 466421, "epoch": 5619} {"train_loss": -27.076642990112305, "global_step": 466422, "epoch": 5619} {"train_loss": -27.0777530670166, "global_step": 466423, "epoch": 5619} {"train_loss": -27.318872451782227, "global_step": 466424, "epoch": 5619} {"train_loss": -27.348464965820312, "global_step": 466425, "epoch": 5619} {"train_loss": -27.221288681030273, "global_step": 466426, "epoch": 5619} {"train_loss": -27.119129180908203, "global_step": 466427, "epoch": 5619} {"train_loss": -27.183752059936523, "global_step": 466428, "epoch": 5619} {"train_loss": -27.07439613342285, "global_step": 466429, "epoch": 5619} {"train_loss": -27.275876998901367, "global_step": 466430, "epoch": 5619} {"train_loss": -27.0974063873291, "global_step": 466431, "epoch": 5619} {"train_loss": -27.330860137939453, "global_step": 466432, "epoch": 5619} {"train_loss": -27.185205459594727, "global_step": 466433, "epoch": 5619} {"train_loss": -27.221607208251953, "global_step": 466434, "epoch": 5619} {"train_loss": -27.59942054748535, "global_step": 466435, "epoch": 5619} {"train_loss": -27.425220489501953, "global_step": 466436, "epoch": 5619} {"train_loss": -27.75699234008789, "global_step": 466437, "epoch": 5619} {"train_loss": -27.46039390563965, "global_step": 466438, "epoch": 5619} {"train_loss": -27.12982177734375, "global_step": 466439, "epoch": 5619} {"train_loss": -27.420700073242188, "global_step": 466440, "epoch": 5619} {"train_loss": -27.444971084594727, "global_step": 466441, "epoch": 5619} {"train_loss": -27.58448600769043, "global_step": 466442, "epoch": 5619} {"train_loss": -27.4886474609375, "global_step": 466443, "epoch": 5619} {"train_loss": -27.26954460144043, "global_step": 466444, "epoch": 5619} {"train_loss": -27.699731826782227, "global_step": 466445, "epoch": 5619} {"train_loss": -27.50025749206543, "global_step": 466446, "epoch": 5619} {"train_loss": -27.858810424804688, "global_step": 466447, "epoch": 5619} {"train_loss": -27.28921890258789, "global_step": 466448, "epoch": 5619} {"train_loss": -27.4097843170166, "global_step": 466449, "epoch": 5619} {"train_loss": -27.40234375, "global_step": 466450, "epoch": 5619} {"train_loss": -27.636703491210938, "global_step": 466451, "epoch": 5619} {"train_loss": -27.095495223999023, "global_step": 466452, "epoch": 5619} {"train_loss": -27.559057235717773, "global_step": 466453, "epoch": 5619} {"train_loss": -27.404829025268555, "global_step": 466454, "epoch": 5619} {"train_loss": -26.982572555541992, "global_step": 466455, "epoch": 5619} {"train_loss": -27.040847778320312, "global_step": 466456, "epoch": 5619} {"train_loss": -26.6981201171875, "global_step": 466457, "epoch": 5619} {"train_loss": -25.611047744750977, "global_step": 466458, "epoch": 5619} {"train_loss": -27.044253567615186, "global_step": 466459, "epoch": 5619, "val_loss": 6559655.0} {"train_loss": -23.143165588378906, "global_step": 466460, "epoch": 5620} {"train_loss": -23.739328384399414, "global_step": 466461, "epoch": 5620} {"train_loss": -23.909595489501953, "global_step": 466462, "epoch": 5620} {"train_loss": -23.985034942626953, "global_step": 466463, "epoch": 5620} {"train_loss": -24.442092895507812, "global_step": 466464, "epoch": 5620} {"train_loss": -25.119443893432617, "global_step": 466465, "epoch": 5620} {"train_loss": -25.32511329650879, "global_step": 466466, "epoch": 5620} {"train_loss": -24.838903427124023, "global_step": 466467, "epoch": 5620} {"train_loss": -25.05515480041504, "global_step": 466468, "epoch": 5620} {"train_loss": -25.327213287353516, "global_step": 466469, "epoch": 5620} {"train_loss": -25.74458122253418, "global_step": 466470, "epoch": 5620} {"train_loss": -25.076597213745117, "global_step": 466471, "epoch": 5620} {"train_loss": -25.509796142578125, "global_step": 466472, "epoch": 5620} {"train_loss": -25.425308227539062, "global_step": 466473, "epoch": 5620} {"train_loss": -25.3387508392334, "global_step": 466474, "epoch": 5620} {"train_loss": -25.529056549072266, "global_step": 466475, "epoch": 5620} {"train_loss": -25.977277755737305, "global_step": 466476, "epoch": 5620} {"train_loss": -25.473005294799805, "global_step": 466477, "epoch": 5620} {"train_loss": -25.73341178894043, "global_step": 466478, "epoch": 5620} {"train_loss": -25.82642936706543, "global_step": 466479, "epoch": 5620} {"train_loss": -25.980762481689453, "global_step": 466480, "epoch": 5620} {"train_loss": -26.405729293823242, "global_step": 466481, "epoch": 5620} {"train_loss": -25.78705406188965, "global_step": 466482, "epoch": 5620} {"train_loss": -25.898828506469727, "global_step": 466483, "epoch": 5620} {"train_loss": -26.131000518798828, "global_step": 466484, "epoch": 5620} {"train_loss": -26.315458297729492, "global_step": 466485, "epoch": 5620} {"train_loss": -25.702789306640625, "global_step": 466486, "epoch": 5620} {"train_loss": -26.14101219177246, "global_step": 466487, "epoch": 5620} {"train_loss": -26.60986328125, "global_step": 466488, "epoch": 5620} {"train_loss": -26.514392852783203, "global_step": 466489, "epoch": 5620} {"train_loss": -26.33274269104004, "global_step": 466490, "epoch": 5620} {"train_loss": -26.408145904541016, "global_step": 466491, "epoch": 5620} {"train_loss": -26.641141891479492, "global_step": 466492, "epoch": 5620} {"train_loss": -26.641218185424805, "global_step": 466493, "epoch": 5620} {"train_loss": -26.76283073425293, "global_step": 466494, "epoch": 5620} {"train_loss": -26.62395668029785, "global_step": 466495, "epoch": 5620} {"train_loss": -26.828344345092773, "global_step": 466496, "epoch": 5620} {"train_loss": -26.701385498046875, "global_step": 466497, "epoch": 5620} {"train_loss": -26.612268447875977, "global_step": 466498, "epoch": 5620} {"train_loss": -26.616418838500977, "global_step": 466499, "epoch": 5620} {"train_loss": -26.69264030456543, "global_step": 466500, "epoch": 5620} {"train_loss": -26.907958984375, "global_step": 466501, "epoch": 5620} {"train_loss": -27.07663345336914, "global_step": 466502, "epoch": 5620} {"train_loss": -26.822851181030273, "global_step": 466503, "epoch": 5620} {"train_loss": -26.86397361755371, "global_step": 466504, "epoch": 5620} {"train_loss": -26.83298683166504, "global_step": 466505, "epoch": 5620} {"train_loss": -26.76959228515625, "global_step": 466506, "epoch": 5620} {"train_loss": -26.917911529541016, "global_step": 466507, "epoch": 5620} {"train_loss": -26.742450714111328, "global_step": 466508, "epoch": 5620} {"train_loss": -26.89423942565918, "global_step": 466509, "epoch": 5620} {"train_loss": -27.080312728881836, "global_step": 466510, "epoch": 5620} {"train_loss": -27.13014030456543, "global_step": 466511, "epoch": 5620} {"train_loss": -27.071210861206055, "global_step": 466512, "epoch": 5620} {"train_loss": -27.203083038330078, "global_step": 466513, "epoch": 5620} {"train_loss": -27.326772689819336, "global_step": 466514, "epoch": 5620} {"train_loss": -27.038623809814453, "global_step": 466515, "epoch": 5620} {"train_loss": -26.96870231628418, "global_step": 466516, "epoch": 5620} {"train_loss": -26.915882110595703, "global_step": 466517, "epoch": 5620} {"train_loss": -27.57806968688965, "global_step": 466518, "epoch": 5620} {"train_loss": -27.22831153869629, "global_step": 466519, "epoch": 5620} {"train_loss": -26.838048934936523, "global_step": 466520, "epoch": 5620} {"train_loss": -27.054975509643555, "global_step": 466521, "epoch": 5620} {"train_loss": -27.282947540283203, "global_step": 466522, "epoch": 5620} {"train_loss": -27.617908477783203, "global_step": 466523, "epoch": 5620} {"train_loss": -27.121957778930664, "global_step": 466524, "epoch": 5620} {"train_loss": -27.09699058532715, "global_step": 466525, "epoch": 5620} {"train_loss": -27.07319450378418, "global_step": 466526, "epoch": 5620} {"train_loss": -27.27899169921875, "global_step": 466527, "epoch": 5620} {"train_loss": -27.34848976135254, "global_step": 466528, "epoch": 5620} {"train_loss": -26.848119735717773, "global_step": 466529, "epoch": 5620} {"train_loss": -27.14985466003418, "global_step": 466530, "epoch": 5620} {"train_loss": -26.754566192626953, "global_step": 466531, "epoch": 5620} {"train_loss": -27.105024337768555, "global_step": 466532, "epoch": 5620} {"train_loss": -27.917194366455078, "global_step": 466533, "epoch": 5620} {"train_loss": -27.597623825073242, "global_step": 466534, "epoch": 5620} {"train_loss": -27.03036880493164, "global_step": 466535, "epoch": 5620} {"train_loss": -27.246862411499023, "global_step": 466536, "epoch": 5620} {"train_loss": -27.025800704956055, "global_step": 466537, "epoch": 5620} {"train_loss": -26.84002113342285, "global_step": 466538, "epoch": 5620} {"train_loss": -27.239282608032227, "global_step": 466539, "epoch": 5620} {"train_loss": -27.47285270690918, "global_step": 466540, "epoch": 5620} {"train_loss": -27.25861930847168, "global_step": 466541, "epoch": 5620} {"train_loss": -26.427143602486115, "global_step": 466542, "epoch": 5620, "val_loss": 6553085.0} {"train_loss": -27.01969337463379, "global_step": 466543, "epoch": 5621} {"train_loss": -26.956268310546875, "global_step": 466544, "epoch": 5621} {"train_loss": -26.676910400390625, "global_step": 466545, "epoch": 5621} {"train_loss": -27.029499053955078, "global_step": 466546, "epoch": 5621} {"train_loss": -26.738229751586914, "global_step": 466547, "epoch": 5621} {"train_loss": -27.077924728393555, "global_step": 466548, "epoch": 5621} {"train_loss": -27.224639892578125, "global_step": 466549, "epoch": 5621} {"train_loss": -26.523761749267578, "global_step": 466550, "epoch": 5621} {"train_loss": -26.728946685791016, "global_step": 466551, "epoch": 5621} {"train_loss": -27.151777267456055, "global_step": 466552, "epoch": 5621} {"train_loss": -26.987472534179688, "global_step": 466553, "epoch": 5621} {"train_loss": -27.088703155517578, "global_step": 466554, "epoch": 5621} {"train_loss": -26.79933738708496, "global_step": 466555, "epoch": 5621} {"train_loss": -26.900365829467773, "global_step": 466556, "epoch": 5621} {"train_loss": -27.015851974487305, "global_step": 466557, "epoch": 5621} {"train_loss": -27.359960556030273, "global_step": 466558, "epoch": 5621} {"train_loss": -27.199554443359375, "global_step": 466559, "epoch": 5621} {"train_loss": -27.220844268798828, "global_step": 466560, "epoch": 5621} {"train_loss": -27.390836715698242, "global_step": 466561, "epoch": 5621} {"train_loss": -27.279443740844727, "global_step": 466562, "epoch": 5621} {"train_loss": -27.389387130737305, "global_step": 466563, "epoch": 5621} {"train_loss": -27.086536407470703, "global_step": 466564, "epoch": 5621} {"train_loss": -26.932661056518555, "global_step": 466565, "epoch": 5621} {"train_loss": -27.211477279663086, "global_step": 466566, "epoch": 5621} {"train_loss": -27.143280029296875, "global_step": 466567, "epoch": 5621} {"train_loss": -27.43853759765625, "global_step": 466568, "epoch": 5621} {"train_loss": -27.416101455688477, "global_step": 466569, "epoch": 5621} {"train_loss": -27.4320068359375, "global_step": 466570, "epoch": 5621} {"train_loss": -27.0795841217041, "global_step": 466571, "epoch": 5621} {"train_loss": -27.170822143554688, "global_step": 466572, "epoch": 5621} {"train_loss": -26.83091163635254, "global_step": 466573, "epoch": 5621} {"train_loss": -27.23211097717285, "global_step": 466574, "epoch": 5621} {"train_loss": -27.817596435546875, "global_step": 466575, "epoch": 5621} {"train_loss": -27.307214736938477, "global_step": 466576, "epoch": 5621} {"train_loss": -27.56076431274414, "global_step": 466577, "epoch": 5621} {"train_loss": -27.093189239501953, "global_step": 466578, "epoch": 5621} {"train_loss": -27.4069766998291, "global_step": 466579, "epoch": 5621} {"train_loss": -27.2031307220459, "global_step": 466580, "epoch": 5621} {"train_loss": -27.40650749206543, "global_step": 466581, "epoch": 5621} {"train_loss": -26.654052734375, "global_step": 466582, "epoch": 5621} {"train_loss": -26.9290714263916, "global_step": 466583, "epoch": 5621} {"train_loss": -26.935712814331055, "global_step": 466584, "epoch": 5621} {"train_loss": -26.76845359802246, "global_step": 466585, "epoch": 5621} {"train_loss": -26.430999755859375, "global_step": 466586, "epoch": 5621} {"train_loss": -26.3538875579834, "global_step": 466587, "epoch": 5621} {"train_loss": -26.745410919189453, "global_step": 466588, "epoch": 5621} {"train_loss": -27.358795166015625, "global_step": 466589, "epoch": 5621} {"train_loss": -26.7497501373291, "global_step": 466590, "epoch": 5621} {"train_loss": -27.261816024780273, "global_step": 466591, "epoch": 5621} {"train_loss": -27.070093154907227, "global_step": 466592, "epoch": 5621} {"train_loss": -27.24285316467285, "global_step": 466593, "epoch": 5621} {"train_loss": -27.352624893188477, "global_step": 466594, "epoch": 5621} {"train_loss": -27.018726348876953, "global_step": 466595, "epoch": 5621} {"train_loss": -27.082204818725586, "global_step": 466596, "epoch": 5621} {"train_loss": -27.260950088500977, "global_step": 466597, "epoch": 5621} {"train_loss": -27.123682022094727, "global_step": 466598, "epoch": 5621} {"train_loss": -26.781774520874023, "global_step": 466599, "epoch": 5621} {"train_loss": -27.191747665405273, "global_step": 466600, "epoch": 5621} {"train_loss": -27.422861099243164, "global_step": 466601, "epoch": 5621} {"train_loss": -26.61138343811035, "global_step": 466602, "epoch": 5621} {"train_loss": -27.28485679626465, "global_step": 466603, "epoch": 5621} {"train_loss": -27.367345809936523, "global_step": 466604, "epoch": 5621} {"train_loss": -26.82850456237793, "global_step": 466605, "epoch": 5621} {"train_loss": -27.083032608032227, "global_step": 466606, "epoch": 5621} {"train_loss": -27.09307861328125, "global_step": 466607, "epoch": 5621} {"train_loss": -26.972753524780273, "global_step": 466608, "epoch": 5621} {"train_loss": -27.35548210144043, "global_step": 466609, "epoch": 5621} {"train_loss": -27.29102897644043, "global_step": 466610, "epoch": 5621} {"train_loss": -27.155353546142578, "global_step": 466611, "epoch": 5621} {"train_loss": -27.304046630859375, "global_step": 466612, "epoch": 5621} {"train_loss": -27.015247344970703, "global_step": 466613, "epoch": 5621} {"train_loss": -27.22291374206543, "global_step": 466614, "epoch": 5621} {"train_loss": -27.014190673828125, "global_step": 466615, "epoch": 5621} {"train_loss": -26.984899520874023, "global_step": 466616, "epoch": 5621} {"train_loss": -27.228906631469727, "global_step": 466617, "epoch": 5621} {"train_loss": -26.969030380249023, "global_step": 466618, "epoch": 5621} {"train_loss": -27.215396881103516, "global_step": 466619, "epoch": 5621} {"train_loss": -27.05842399597168, "global_step": 466620, "epoch": 5621} {"train_loss": -27.34510612487793, "global_step": 466621, "epoch": 5621} {"train_loss": -27.081220626831055, "global_step": 466622, "epoch": 5621} {"train_loss": -27.2259464263916, "global_step": 466623, "epoch": 5621} {"train_loss": -27.335805892944336, "global_step": 466624, "epoch": 5621} {"train_loss": -27.118551966655684, "global_step": 466625, "epoch": 5621, "val_loss": 6541373.0} {"train_loss": -26.628314971923828, "global_step": 466626, "epoch": 5622} {"train_loss": -26.54107093811035, "global_step": 466627, "epoch": 5622} {"train_loss": -26.77446937561035, "global_step": 466628, "epoch": 5622} {"train_loss": -26.675832748413086, "global_step": 466629, "epoch": 5622} {"train_loss": -26.641876220703125, "global_step": 466630, "epoch": 5622} {"train_loss": -27.18915367126465, "global_step": 466631, "epoch": 5622} {"train_loss": -26.548192977905273, "global_step": 466632, "epoch": 5622} {"train_loss": -26.44109535217285, "global_step": 466633, "epoch": 5622} {"train_loss": -26.651700973510742, "global_step": 466634, "epoch": 5622} {"train_loss": -27.0092716217041, "global_step": 466635, "epoch": 5622} {"train_loss": -26.539350509643555, "global_step": 466636, "epoch": 5622} {"train_loss": -26.140003204345703, "global_step": 466637, "epoch": 5622} {"train_loss": -25.85988426208496, "global_step": 466638, "epoch": 5622} {"train_loss": -26.419025421142578, "global_step": 466639, "epoch": 5622} {"train_loss": -26.641443252563477, "global_step": 466640, "epoch": 5622} {"train_loss": -26.693546295166016, "global_step": 466641, "epoch": 5622} {"train_loss": -26.828649520874023, "global_step": 466642, "epoch": 5622} {"train_loss": -26.518726348876953, "global_step": 466643, "epoch": 5622} {"train_loss": -26.872705459594727, "global_step": 466644, "epoch": 5622} {"train_loss": -26.803424835205078, "global_step": 466645, "epoch": 5622} {"train_loss": -26.517597198486328, "global_step": 466646, "epoch": 5622} {"train_loss": -26.721893310546875, "global_step": 466647, "epoch": 5622} {"train_loss": -26.981307983398438, "global_step": 466648, "epoch": 5622} {"train_loss": -26.719928741455078, "global_step": 466649, "epoch": 5622} {"train_loss": -27.118497848510742, "global_step": 466650, "epoch": 5622} {"train_loss": -26.92928123474121, "global_step": 466651, "epoch": 5622} {"train_loss": -27.126367568969727, "global_step": 466652, "epoch": 5622} {"train_loss": -27.075769424438477, "global_step": 466653, "epoch": 5622} {"train_loss": -27.104825973510742, "global_step": 466654, "epoch": 5622} {"train_loss": -27.128738403320312, "global_step": 466655, "epoch": 5622} {"train_loss": -26.976303100585938, "global_step": 466656, "epoch": 5622} {"train_loss": -26.9830265045166, "global_step": 466657, "epoch": 5622} {"train_loss": -27.262527465820312, "global_step": 466658, "epoch": 5622} {"train_loss": -27.103546142578125, "global_step": 466659, "epoch": 5622} {"train_loss": -26.900598526000977, "global_step": 466660, "epoch": 5622} {"train_loss": -27.118061065673828, "global_step": 466661, "epoch": 5622} {"train_loss": -27.522825241088867, "global_step": 466662, "epoch": 5622} {"train_loss": -27.378164291381836, "global_step": 466663, "epoch": 5622} {"train_loss": -27.403263092041016, "global_step": 466664, "epoch": 5622} {"train_loss": -27.22458267211914, "global_step": 466665, "epoch": 5622} {"train_loss": -27.070993423461914, "global_step": 466666, "epoch": 5622} {"train_loss": -27.204999923706055, "global_step": 466667, "epoch": 5622} {"train_loss": -27.13812828063965, "global_step": 466668, "epoch": 5622} {"train_loss": -27.49286460876465, "global_step": 466669, "epoch": 5622} {"train_loss": -27.46969985961914, "global_step": 466670, "epoch": 5622} {"train_loss": -27.362817764282227, "global_step": 466671, "epoch": 5622} {"train_loss": -27.430776596069336, "global_step": 466672, "epoch": 5622} {"train_loss": -27.290842056274414, "global_step": 466673, "epoch": 5622} {"train_loss": -27.207473754882812, "global_step": 466674, "epoch": 5622} {"train_loss": -27.153051376342773, "global_step": 466675, "epoch": 5622} {"train_loss": -27.467426300048828, "global_step": 466676, "epoch": 5622} {"train_loss": -27.196252822875977, "global_step": 466677, "epoch": 5622} {"train_loss": -27.22211265563965, "global_step": 466678, "epoch": 5622} {"train_loss": -27.2624454498291, "global_step": 466679, "epoch": 5622} {"train_loss": -27.497461318969727, "global_step": 466680, "epoch": 5622} {"train_loss": -27.518224716186523, "global_step": 466681, "epoch": 5622} {"train_loss": -27.40846061706543, "global_step": 466682, "epoch": 5622} {"train_loss": -27.740076065063477, "global_step": 466683, "epoch": 5622} {"train_loss": -27.204120635986328, "global_step": 466684, "epoch": 5622} {"train_loss": -27.309228897094727, "global_step": 466685, "epoch": 5622} {"train_loss": -27.171796798706055, "global_step": 466686, "epoch": 5622} {"train_loss": -26.842670440673828, "global_step": 466687, "epoch": 5622} {"train_loss": -26.33493995666504, "global_step": 466688, "epoch": 5622} {"train_loss": -26.653722763061523, "global_step": 466689, "epoch": 5622} {"train_loss": -26.782148361206055, "global_step": 466690, "epoch": 5622} {"train_loss": -27.25343132019043, "global_step": 466691, "epoch": 5622} {"train_loss": -27.115222930908203, "global_step": 466692, "epoch": 5622} {"train_loss": -26.695270538330078, "global_step": 466693, "epoch": 5622} {"train_loss": -27.297367095947266, "global_step": 466694, "epoch": 5622} {"train_loss": -27.103727340698242, "global_step": 466695, "epoch": 5622} {"train_loss": -27.097980499267578, "global_step": 466696, "epoch": 5622} {"train_loss": -27.25634765625, "global_step": 466697, "epoch": 5622} {"train_loss": -26.980606079101562, "global_step": 466698, "epoch": 5622} {"train_loss": -27.0169734954834, "global_step": 466699, "epoch": 5622} {"train_loss": -27.3041934967041, "global_step": 466700, "epoch": 5622} {"train_loss": -27.29859733581543, "global_step": 466701, "epoch": 5622} {"train_loss": -26.88283348083496, "global_step": 466702, "epoch": 5622} {"train_loss": -26.98394203186035, "global_step": 466703, "epoch": 5622} {"train_loss": -27.042743682861328, "global_step": 466704, "epoch": 5622} {"train_loss": -27.321680068969727, "global_step": 466705, "epoch": 5622} {"train_loss": -27.05560302734375, "global_step": 466706, "epoch": 5622} {"train_loss": -27.120264053344727, "global_step": 466707, "epoch": 5622} {"train_loss": -27.023804538221246, "global_step": 466708, "epoch": 5622, "val_loss": 6557107.5} {"train_loss": -26.53436279296875, "global_step": 466709, "epoch": 5623} {"train_loss": -26.634979248046875, "global_step": 466710, "epoch": 5623} {"train_loss": -26.09682273864746, "global_step": 466711, "epoch": 5623} {"train_loss": -26.60896873474121, "global_step": 466712, "epoch": 5623} {"train_loss": -26.767471313476562, "global_step": 466713, "epoch": 5623} {"train_loss": -26.55483055114746, "global_step": 466714, "epoch": 5623} {"train_loss": -26.68391227722168, "global_step": 466715, "epoch": 5623} {"train_loss": -27.04274559020996, "global_step": 466716, "epoch": 5623} {"train_loss": -26.451557159423828, "global_step": 466717, "epoch": 5623} {"train_loss": -26.681501388549805, "global_step": 466718, "epoch": 5623} {"train_loss": -26.710052490234375, "global_step": 466719, "epoch": 5623} {"train_loss": -26.79762077331543, "global_step": 466720, "epoch": 5623} {"train_loss": -27.06662368774414, "global_step": 466721, "epoch": 5623} {"train_loss": -26.480310440063477, "global_step": 466722, "epoch": 5623} {"train_loss": -26.660009384155273, "global_step": 466723, "epoch": 5623} {"train_loss": -27.182819366455078, "global_step": 466724, "epoch": 5623} {"train_loss": -26.869693756103516, "global_step": 466725, "epoch": 5623} {"train_loss": -26.99347496032715, "global_step": 466726, "epoch": 5623} {"train_loss": -27.09564208984375, "global_step": 466727, "epoch": 5623} {"train_loss": -26.937402725219727, "global_step": 466728, "epoch": 5623} {"train_loss": -26.97736930847168, "global_step": 466729, "epoch": 5623} {"train_loss": -27.150043487548828, "global_step": 466730, "epoch": 5623} {"train_loss": -27.048294067382812, "global_step": 466731, "epoch": 5623} {"train_loss": -27.070138931274414, "global_step": 466732, "epoch": 5623} {"train_loss": -27.069507598876953, "global_step": 466733, "epoch": 5623} {"train_loss": -27.13275718688965, "global_step": 466734, "epoch": 5623} {"train_loss": -26.83546257019043, "global_step": 466735, "epoch": 5623} {"train_loss": -27.0667781829834, "global_step": 466736, "epoch": 5623} {"train_loss": -27.2784423828125, "global_step": 466737, "epoch": 5623} {"train_loss": -27.384252548217773, "global_step": 466738, "epoch": 5623} {"train_loss": -26.758411407470703, "global_step": 466739, "epoch": 5623} {"train_loss": -27.183923721313477, "global_step": 466740, "epoch": 5623} {"train_loss": -27.621414184570312, "global_step": 466741, "epoch": 5623} {"train_loss": -27.083715438842773, "global_step": 466742, "epoch": 5623} {"train_loss": -26.7736759185791, "global_step": 466743, "epoch": 5623} {"train_loss": -26.781904220581055, "global_step": 466744, "epoch": 5623} {"train_loss": -27.339094161987305, "global_step": 466745, "epoch": 5623} {"train_loss": -26.82342529296875, "global_step": 466746, "epoch": 5623} {"train_loss": -27.232587814331055, "global_step": 466747, "epoch": 5623} {"train_loss": -27.468475341796875, "global_step": 466748, "epoch": 5623} {"train_loss": -27.034555435180664, "global_step": 466749, "epoch": 5623} {"train_loss": -27.07232093811035, "global_step": 466750, "epoch": 5623} {"train_loss": -26.99506187438965, "global_step": 466751, "epoch": 5623} {"train_loss": -27.66228675842285, "global_step": 466752, "epoch": 5623} {"train_loss": -27.444385528564453, "global_step": 466753, "epoch": 5623} {"train_loss": -27.28436851501465, "global_step": 466754, "epoch": 5623} {"train_loss": -27.096527099609375, "global_step": 466755, "epoch": 5623} {"train_loss": -27.262311935424805, "global_step": 466756, "epoch": 5623} {"train_loss": -27.132537841796875, "global_step": 466757, "epoch": 5623} {"train_loss": -26.933324813842773, "global_step": 466758, "epoch": 5623} {"train_loss": -27.288293838500977, "global_step": 466759, "epoch": 5623} {"train_loss": -27.457569122314453, "global_step": 466760, "epoch": 5623} {"train_loss": -27.415252685546875, "global_step": 466761, "epoch": 5623} {"train_loss": -27.696842193603516, "global_step": 466762, "epoch": 5623} {"train_loss": -26.991201400756836, "global_step": 466763, "epoch": 5623} {"train_loss": -27.4105167388916, "global_step": 466764, "epoch": 5623} {"train_loss": -27.233728408813477, "global_step": 466765, "epoch": 5623} {"train_loss": -27.532926559448242, "global_step": 466766, "epoch": 5623} {"train_loss": -27.228473663330078, "global_step": 466767, "epoch": 5623} {"train_loss": -27.47602653503418, "global_step": 466768, "epoch": 5623} {"train_loss": -27.1606502532959, "global_step": 466769, "epoch": 5623} {"train_loss": -27.42093849182129, "global_step": 466770, "epoch": 5623} {"train_loss": -27.733633041381836, "global_step": 466771, "epoch": 5623} {"train_loss": -27.342870712280273, "global_step": 466772, "epoch": 5623} {"train_loss": -27.358129501342773, "global_step": 466773, "epoch": 5623} {"train_loss": -27.33686637878418, "global_step": 466774, "epoch": 5623} {"train_loss": -27.21940040588379, "global_step": 466775, "epoch": 5623} {"train_loss": -27.117284774780273, "global_step": 466776, "epoch": 5623} {"train_loss": -27.172555923461914, "global_step": 466777, "epoch": 5623} {"train_loss": -27.35686683654785, "global_step": 466778, "epoch": 5623} {"train_loss": -27.765729904174805, "global_step": 466779, "epoch": 5623} {"train_loss": -27.08550453186035, "global_step": 466780, "epoch": 5623} {"train_loss": -27.15273094177246, "global_step": 466781, "epoch": 5623} {"train_loss": -27.001270294189453, "global_step": 466782, "epoch": 5623} {"train_loss": -27.002613067626953, "global_step": 466783, "epoch": 5623} {"train_loss": -26.896320343017578, "global_step": 466784, "epoch": 5623} {"train_loss": -27.39950942993164, "global_step": 466785, "epoch": 5623} {"train_loss": -27.102951049804688, "global_step": 466786, "epoch": 5623} {"train_loss": -27.048419952392578, "global_step": 466787, "epoch": 5623} {"train_loss": -27.023839950561523, "global_step": 466788, "epoch": 5623} {"train_loss": -26.85895347595215, "global_step": 466789, "epoch": 5623} {"train_loss": -27.127424240112305, "global_step": 466790, "epoch": 5623} {"train_loss": -27.094600011067218, "global_step": 466791, "epoch": 5623, "val_loss": 6476415.0} {"train_loss": -25.336862564086914, "global_step": 466792, "epoch": 5624} {"train_loss": -24.29695701599121, "global_step": 466793, "epoch": 5624} {"train_loss": -25.100309371948242, "global_step": 466794, "epoch": 5624} {"train_loss": -25.1903076171875, "global_step": 466795, "epoch": 5624} {"train_loss": -25.51006507873535, "global_step": 466796, "epoch": 5624} {"train_loss": -24.434911727905273, "global_step": 466797, "epoch": 5624} {"train_loss": -25.067304611206055, "global_step": 466798, "epoch": 5624} {"train_loss": -26.169116973876953, "global_step": 466799, "epoch": 5624} {"train_loss": -25.631153106689453, "global_step": 466800, "epoch": 5624} {"train_loss": -25.94158935546875, "global_step": 466801, "epoch": 5624} {"train_loss": -25.904958724975586, "global_step": 466802, "epoch": 5624} {"train_loss": -26.352706909179688, "global_step": 466803, "epoch": 5624} {"train_loss": -26.143054962158203, "global_step": 466804, "epoch": 5624} {"train_loss": -26.61846923828125, "global_step": 466805, "epoch": 5624} {"train_loss": -26.273862838745117, "global_step": 466806, "epoch": 5624} {"train_loss": -26.540191650390625, "global_step": 466807, "epoch": 5624} {"train_loss": -26.000913619995117, "global_step": 466808, "epoch": 5624} {"train_loss": -26.174026489257812, "global_step": 466809, "epoch": 5624} {"train_loss": -26.938812255859375, "global_step": 466810, "epoch": 5624} {"train_loss": -26.417953491210938, "global_step": 466811, "epoch": 5624} {"train_loss": -26.51141357421875, "global_step": 466812, "epoch": 5624} {"train_loss": -26.622827529907227, "global_step": 466813, "epoch": 5624} {"train_loss": -26.7187557220459, "global_step": 466814, "epoch": 5624} {"train_loss": -26.765615463256836, "global_step": 466815, "epoch": 5624} {"train_loss": -26.71451187133789, "global_step": 466816, "epoch": 5624} {"train_loss": -26.78034019470215, "global_step": 466817, "epoch": 5624} {"train_loss": -26.89545249938965, "global_step": 466818, "epoch": 5624} {"train_loss": -26.97607421875, "global_step": 466819, "epoch": 5624} {"train_loss": -26.967554092407227, "global_step": 466820, "epoch": 5624} {"train_loss": -26.306554794311523, "global_step": 466821, "epoch": 5624} {"train_loss": -26.851852416992188, "global_step": 466822, "epoch": 5624} {"train_loss": -26.618452072143555, "global_step": 466823, "epoch": 5624} {"train_loss": -27.403030395507812, "global_step": 466824, "epoch": 5624} {"train_loss": -26.502609252929688, "global_step": 466825, "epoch": 5624} {"train_loss": -26.903844833374023, "global_step": 466826, "epoch": 5624} {"train_loss": -26.60150718688965, "global_step": 466827, "epoch": 5624} {"train_loss": -27.091571807861328, "global_step": 466828, "epoch": 5624} {"train_loss": -27.17457389831543, "global_step": 466829, "epoch": 5624} {"train_loss": -27.179489135742188, "global_step": 466830, "epoch": 5624} {"train_loss": -27.009077072143555, "global_step": 466831, "epoch": 5624} {"train_loss": -27.390705108642578, "global_step": 466832, "epoch": 5624} {"train_loss": -27.078519821166992, "global_step": 466833, "epoch": 5624} {"train_loss": -27.091176986694336, "global_step": 466834, "epoch": 5624} {"train_loss": -27.07037353515625, "global_step": 466835, "epoch": 5624} {"train_loss": -27.351572036743164, "global_step": 466836, "epoch": 5624} {"train_loss": -26.932025909423828, "global_step": 466837, "epoch": 5624} {"train_loss": -27.17634391784668, "global_step": 466838, "epoch": 5624} {"train_loss": -27.18767738342285, "global_step": 466839, "epoch": 5624} {"train_loss": -27.802322387695312, "global_step": 466840, "epoch": 5624} {"train_loss": -26.971647262573242, "global_step": 466841, "epoch": 5624} {"train_loss": -27.600751876831055, "global_step": 466842, "epoch": 5624} {"train_loss": -27.355701446533203, "global_step": 466843, "epoch": 5624} {"train_loss": -27.71083641052246, "global_step": 466844, "epoch": 5624} {"train_loss": -27.190420150756836, "global_step": 466845, "epoch": 5624} {"train_loss": -27.297224044799805, "global_step": 466846, "epoch": 5624} {"train_loss": -27.504077911376953, "global_step": 466847, "epoch": 5624} {"train_loss": -27.355688095092773, "global_step": 466848, "epoch": 5624} {"train_loss": -27.386686325073242, "global_step": 466849, "epoch": 5624} {"train_loss": -27.3375186920166, "global_step": 466850, "epoch": 5624} {"train_loss": -27.325788497924805, "global_step": 466851, "epoch": 5624} {"train_loss": -27.435565948486328, "global_step": 466852, "epoch": 5624} {"train_loss": -27.177610397338867, "global_step": 466853, "epoch": 5624} {"train_loss": -27.5178165435791, "global_step": 466854, "epoch": 5624} {"train_loss": -27.459821701049805, "global_step": 466855, "epoch": 5624} {"train_loss": -27.458463668823242, "global_step": 466856, "epoch": 5624} {"train_loss": -27.521108627319336, "global_step": 466857, "epoch": 5624} {"train_loss": -27.292438507080078, "global_step": 466858, "epoch": 5624} {"train_loss": -27.5408935546875, "global_step": 466859, "epoch": 5624} {"train_loss": -27.381885528564453, "global_step": 466860, "epoch": 5624} {"train_loss": -27.15289878845215, "global_step": 466861, "epoch": 5624} {"train_loss": -27.26119041442871, "global_step": 466862, "epoch": 5624} {"train_loss": -27.166418075561523, "global_step": 466863, "epoch": 5624} {"train_loss": -27.442350387573242, "global_step": 466864, "epoch": 5624} {"train_loss": -27.409442901611328, "global_step": 466865, "epoch": 5624} {"train_loss": -27.2806396484375, "global_step": 466866, "epoch": 5624} {"train_loss": -27.069608688354492, "global_step": 466867, "epoch": 5624} {"train_loss": -27.242666244506836, "global_step": 466868, "epoch": 5624} {"train_loss": -26.760534286499023, "global_step": 466869, "epoch": 5624} {"train_loss": -27.24192237854004, "global_step": 466870, "epoch": 5624} {"train_loss": -27.244230270385742, "global_step": 466871, "epoch": 5624} {"train_loss": -27.025711059570312, "global_step": 466872, "epoch": 5624} {"train_loss": -26.96656608581543, "global_step": 466873, "epoch": 5624} {"train_loss": -26.81237358644784, "global_step": 466874, "epoch": 5624, "val_loss": 6532414.0} {"train_loss": -26.85498046875, "global_step": 466875, "epoch": 5625} {"train_loss": -26.156661987304688, "global_step": 466876, "epoch": 5625} {"train_loss": -25.736194610595703, "global_step": 466877, "epoch": 5625} {"train_loss": -25.323270797729492, "global_step": 466878, "epoch": 5625} {"train_loss": -24.727622985839844, "global_step": 466879, "epoch": 5625} {"train_loss": -26.209075927734375, "global_step": 466880, "epoch": 5625} {"train_loss": -26.112939834594727, "global_step": 466881, "epoch": 5625} {"train_loss": -26.002267837524414, "global_step": 466882, "epoch": 5625} {"train_loss": -26.33448600769043, "global_step": 466883, "epoch": 5625} {"train_loss": -26.42197608947754, "global_step": 466884, "epoch": 5625} {"train_loss": -26.100122451782227, "global_step": 466885, "epoch": 5625} {"train_loss": -26.302112579345703, "global_step": 466886, "epoch": 5625} {"train_loss": -26.623205184936523, "global_step": 466887, "epoch": 5625} {"train_loss": -26.088275909423828, "global_step": 466888, "epoch": 5625} {"train_loss": -26.509033203125, "global_step": 466889, "epoch": 5625} {"train_loss": -26.287067413330078, "global_step": 466890, "epoch": 5625} {"train_loss": -26.481597900390625, "global_step": 466891, "epoch": 5625} {"train_loss": -26.644744873046875, "global_step": 466892, "epoch": 5625} {"train_loss": -26.69135856628418, "global_step": 466893, "epoch": 5625} {"train_loss": -26.301685333251953, "global_step": 466894, "epoch": 5625} {"train_loss": -26.844131469726562, "global_step": 466895, "epoch": 5625} {"train_loss": -26.557540893554688, "global_step": 466896, "epoch": 5625} {"train_loss": -26.462635040283203, "global_step": 466897, "epoch": 5625} {"train_loss": -26.449853897094727, "global_step": 466898, "epoch": 5625} {"train_loss": -26.705236434936523, "global_step": 466899, "epoch": 5625} {"train_loss": -26.427066802978516, "global_step": 466900, "epoch": 5625} {"train_loss": -26.3985652923584, "global_step": 466901, "epoch": 5625} {"train_loss": -26.715429306030273, "global_step": 466902, "epoch": 5625} {"train_loss": -26.99090003967285, "global_step": 466903, "epoch": 5625} {"train_loss": -26.679006576538086, "global_step": 466904, "epoch": 5625} {"train_loss": -26.6379337310791, "global_step": 466905, "epoch": 5625} {"train_loss": -26.885868072509766, "global_step": 466906, "epoch": 5625} {"train_loss": -26.70619010925293, "global_step": 466907, "epoch": 5625} {"train_loss": -26.813873291015625, "global_step": 466908, "epoch": 5625} {"train_loss": -26.82716178894043, "global_step": 466909, "epoch": 5625} {"train_loss": -26.716175079345703, "global_step": 466910, "epoch": 5625} {"train_loss": -26.83452796936035, "global_step": 466911, "epoch": 5625} {"train_loss": -26.9034366607666, "global_step": 466912, "epoch": 5625} {"train_loss": -26.983722686767578, "global_step": 466913, "epoch": 5625} {"train_loss": -27.261188507080078, "global_step": 466914, "epoch": 5625} {"train_loss": -26.90290641784668, "global_step": 466915, "epoch": 5625} {"train_loss": -27.27936363220215, "global_step": 466916, "epoch": 5625} {"train_loss": -26.739948272705078, "global_step": 466917, "epoch": 5625} {"train_loss": -27.000207901000977, "global_step": 466918, "epoch": 5625} {"train_loss": -27.20709228515625, "global_step": 466919, "epoch": 5625} {"train_loss": -26.8998966217041, "global_step": 466920, "epoch": 5625} {"train_loss": -27.2305850982666, "global_step": 466921, "epoch": 5625} {"train_loss": -26.936254501342773, "global_step": 466922, "epoch": 5625} {"train_loss": -27.137754440307617, "global_step": 466923, "epoch": 5625} {"train_loss": -27.350061416625977, "global_step": 466924, "epoch": 5625} {"train_loss": -27.303964614868164, "global_step": 466925, "epoch": 5625} {"train_loss": -27.380224227905273, "global_step": 466926, "epoch": 5625} {"train_loss": -27.17462158203125, "global_step": 466927, "epoch": 5625} {"train_loss": -27.435277938842773, "global_step": 466928, "epoch": 5625} {"train_loss": -27.3426456451416, "global_step": 466929, "epoch": 5625} {"train_loss": -27.0394344329834, "global_step": 466930, "epoch": 5625} {"train_loss": -27.197927474975586, "global_step": 466931, "epoch": 5625} {"train_loss": -27.390356063842773, "global_step": 466932, "epoch": 5625} {"train_loss": -27.296539306640625, "global_step": 466933, "epoch": 5625} {"train_loss": -27.470584869384766, "global_step": 466934, "epoch": 5625} {"train_loss": -27.27300453186035, "global_step": 466935, "epoch": 5625} {"train_loss": -27.26706886291504, "global_step": 466936, "epoch": 5625} {"train_loss": -27.27109718322754, "global_step": 466937, "epoch": 5625} {"train_loss": -27.2335205078125, "global_step": 466938, "epoch": 5625} {"train_loss": -27.38836097717285, "global_step": 466939, "epoch": 5625} {"train_loss": -27.12470054626465, "global_step": 466940, "epoch": 5625} {"train_loss": -27.432723999023438, "global_step": 466941, "epoch": 5625} {"train_loss": -27.49872398376465, "global_step": 466942, "epoch": 5625} {"train_loss": -27.213714599609375, "global_step": 466943, "epoch": 5625} {"train_loss": -27.313404083251953, "global_step": 466944, "epoch": 5625} {"train_loss": -27.432453155517578, "global_step": 466945, "epoch": 5625} {"train_loss": -27.20342445373535, "global_step": 466946, "epoch": 5625} {"train_loss": -27.329730987548828, "global_step": 466947, "epoch": 5625} {"train_loss": -27.397668838500977, "global_step": 466948, "epoch": 5625} {"train_loss": -26.85400390625, "global_step": 466949, "epoch": 5625} {"train_loss": -27.595685958862305, "global_step": 466950, "epoch": 5625} {"train_loss": -27.231054306030273, "global_step": 466951, "epoch": 5625} {"train_loss": -27.101245880126953, "global_step": 466952, "epoch": 5625} {"train_loss": -27.20624351501465, "global_step": 466953, "epoch": 5625} {"train_loss": -27.251605987548828, "global_step": 466954, "epoch": 5625} {"train_loss": -27.220067977905273, "global_step": 466955, "epoch": 5625} {"train_loss": -26.872760772705078, "global_step": 466956, "epoch": 5625} {"train_loss": -26.845453561070453, "global_step": 466957, "epoch": 5625, "val_loss": 6458695.5} {"train_loss": -26.130468368530273, "global_step": 466958, "epoch": 5626} {"train_loss": -26.296289443969727, "global_step": 466959, "epoch": 5626} {"train_loss": -26.725915908813477, "global_step": 466960, "epoch": 5626} {"train_loss": -26.247098922729492, "global_step": 466961, "epoch": 5626} {"train_loss": -26.44921875, "global_step": 466962, "epoch": 5626} {"train_loss": -26.502105712890625, "global_step": 466963, "epoch": 5626} {"train_loss": -26.956689834594727, "global_step": 466964, "epoch": 5626} {"train_loss": -26.369068145751953, "global_step": 466965, "epoch": 5626} {"train_loss": -26.42035484313965, "global_step": 466966, "epoch": 5626} {"train_loss": -26.753416061401367, "global_step": 466967, "epoch": 5626} {"train_loss": -26.595792770385742, "global_step": 466968, "epoch": 5626} {"train_loss": -26.859907150268555, "global_step": 466969, "epoch": 5626} {"train_loss": -26.48578453063965, "global_step": 466970, "epoch": 5626} {"train_loss": -26.663009643554688, "global_step": 466971, "epoch": 5626} {"train_loss": -26.576772689819336, "global_step": 466972, "epoch": 5626} {"train_loss": -26.525379180908203, "global_step": 466973, "epoch": 5626} {"train_loss": -26.9101619720459, "global_step": 466974, "epoch": 5626} {"train_loss": -26.622211456298828, "global_step": 466975, "epoch": 5626} {"train_loss": -26.98920249938965, "global_step": 466976, "epoch": 5626} {"train_loss": -26.661975860595703, "global_step": 466977, "epoch": 5626} {"train_loss": -26.91156578063965, "global_step": 466978, "epoch": 5626} {"train_loss": -27.105239868164062, "global_step": 466979, "epoch": 5626} {"train_loss": -27.00360107421875, "global_step": 466980, "epoch": 5626} {"train_loss": -27.311965942382812, "global_step": 466981, "epoch": 5626} {"train_loss": -27.21449851989746, "global_step": 466982, "epoch": 5626} {"train_loss": -26.967121124267578, "global_step": 466983, "epoch": 5626} {"train_loss": -27.12993812561035, "global_step": 466984, "epoch": 5626} {"train_loss": -26.89888572692871, "global_step": 466985, "epoch": 5626} {"train_loss": -27.044530868530273, "global_step": 466986, "epoch": 5626} {"train_loss": -27.211963653564453, "global_step": 466987, "epoch": 5626} {"train_loss": -27.1404972076416, "global_step": 466988, "epoch": 5626} {"train_loss": -27.156253814697266, "global_step": 466989, "epoch": 5626} {"train_loss": -27.090137481689453, "global_step": 466990, "epoch": 5626} {"train_loss": -27.167692184448242, "global_step": 466991, "epoch": 5626} {"train_loss": -27.266340255737305, "global_step": 466992, "epoch": 5626} {"train_loss": -27.121198654174805, "global_step": 466993, "epoch": 5626} {"train_loss": -27.34163475036621, "global_step": 466994, "epoch": 5626} {"train_loss": -26.632938385009766, "global_step": 466995, "epoch": 5626} {"train_loss": -27.207014083862305, "global_step": 466996, "epoch": 5626} {"train_loss": -27.040307998657227, "global_step": 466997, "epoch": 5626} {"train_loss": -27.231252670288086, "global_step": 466998, "epoch": 5626} {"train_loss": -27.525999069213867, "global_step": 466999, "epoch": 5626} {"train_loss": -27.071247100830078, "global_step": 467000, "epoch": 5626} {"train_loss": -26.98870277404785, "global_step": 467001, "epoch": 5626} {"train_loss": -27.33803367614746, "global_step": 467002, "epoch": 5626} {"train_loss": -27.248815536499023, "global_step": 467003, "epoch": 5626} {"train_loss": -27.20415687561035, "global_step": 467004, "epoch": 5626} {"train_loss": -27.345703125, "global_step": 467005, "epoch": 5626} {"train_loss": -27.61231803894043, "global_step": 467006, "epoch": 5626} {"train_loss": -27.41128921508789, "global_step": 467007, "epoch": 5626} {"train_loss": -27.225849151611328, "global_step": 467008, "epoch": 5626} {"train_loss": -27.284826278686523, "global_step": 467009, "epoch": 5626} {"train_loss": -27.435626983642578, "global_step": 467010, "epoch": 5626} {"train_loss": -27.644012451171875, "global_step": 467011, "epoch": 5626} {"train_loss": -27.600284576416016, "global_step": 467012, "epoch": 5626} {"train_loss": -27.045562744140625, "global_step": 467013, "epoch": 5626} {"train_loss": -27.270227432250977, "global_step": 467014, "epoch": 5626} {"train_loss": -26.636280059814453, "global_step": 467015, "epoch": 5626} {"train_loss": -26.597198486328125, "global_step": 467016, "epoch": 5626} {"train_loss": -26.085412979125977, "global_step": 467017, "epoch": 5626} {"train_loss": -26.911956787109375, "global_step": 467018, "epoch": 5626} {"train_loss": -27.310300827026367, "global_step": 467019, "epoch": 5626} {"train_loss": -26.91072654724121, "global_step": 467020, "epoch": 5626} {"train_loss": -27.011184692382812, "global_step": 467021, "epoch": 5626} {"train_loss": -27.398853302001953, "global_step": 467022, "epoch": 5626} {"train_loss": -26.933643341064453, "global_step": 467023, "epoch": 5626} {"train_loss": -26.95684242248535, "global_step": 467024, "epoch": 5626} {"train_loss": -27.53740882873535, "global_step": 467025, "epoch": 5626} {"train_loss": -27.202451705932617, "global_step": 467026, "epoch": 5626} {"train_loss": -27.334192276000977, "global_step": 467027, "epoch": 5626} {"train_loss": -27.2407169342041, "global_step": 467028, "epoch": 5626} {"train_loss": -27.143722534179688, "global_step": 467029, "epoch": 5626} {"train_loss": -27.32693862915039, "global_step": 467030, "epoch": 5626} {"train_loss": -26.9995059967041, "global_step": 467031, "epoch": 5626} {"train_loss": -27.3437442779541, "global_step": 467032, "epoch": 5626} {"train_loss": -27.000513076782227, "global_step": 467033, "epoch": 5626} {"train_loss": -27.120248794555664, "global_step": 467034, "epoch": 5626} {"train_loss": -27.500228881835938, "global_step": 467035, "epoch": 5626} {"train_loss": -27.659643173217773, "global_step": 467036, "epoch": 5626} {"train_loss": -27.452899932861328, "global_step": 467037, "epoch": 5626} {"train_loss": -27.062036514282227, "global_step": 467038, "epoch": 5626} {"train_loss": -27.117206573486328, "global_step": 467039, "epoch": 5626} {"train_loss": -27.036464392420758, "global_step": 467040, "epoch": 5626, "val_loss": 6472636.0} {"train_loss": -27.244327545166016, "global_step": 467041, "epoch": 5627} {"train_loss": -26.671222686767578, "global_step": 467042, "epoch": 5627} {"train_loss": -26.851028442382812, "global_step": 467043, "epoch": 5627} {"train_loss": -27.16485023498535, "global_step": 467044, "epoch": 5627} {"train_loss": -27.152002334594727, "global_step": 467045, "epoch": 5627} {"train_loss": -26.594934463500977, "global_step": 467046, "epoch": 5627} {"train_loss": -27.062301635742188, "global_step": 467047, "epoch": 5627} {"train_loss": -27.07454490661621, "global_step": 467048, "epoch": 5627} {"train_loss": -27.029266357421875, "global_step": 467049, "epoch": 5627} {"train_loss": -27.09744644165039, "global_step": 467050, "epoch": 5627} {"train_loss": -26.282928466796875, "global_step": 467051, "epoch": 5627} {"train_loss": -26.101659774780273, "global_step": 467052, "epoch": 5627} {"train_loss": -26.6767635345459, "global_step": 467053, "epoch": 5627} {"train_loss": -26.856897354125977, "global_step": 467054, "epoch": 5627} {"train_loss": -26.707473754882812, "global_step": 467055, "epoch": 5627} {"train_loss": -26.781213760375977, "global_step": 467056, "epoch": 5627} {"train_loss": -27.066181182861328, "global_step": 467057, "epoch": 5627} {"train_loss": -26.7187557220459, "global_step": 467058, "epoch": 5627} {"train_loss": -26.677637100219727, "global_step": 467059, "epoch": 5627} {"train_loss": -27.1175479888916, "global_step": 467060, "epoch": 5627} {"train_loss": -26.935226440429688, "global_step": 467061, "epoch": 5627} {"train_loss": -27.055362701416016, "global_step": 467062, "epoch": 5627} {"train_loss": -26.663129806518555, "global_step": 467063, "epoch": 5627} {"train_loss": -27.22748374938965, "global_step": 467064, "epoch": 5627} {"train_loss": -26.85626220703125, "global_step": 467065, "epoch": 5627} {"train_loss": -27.297210693359375, "global_step": 467066, "epoch": 5627} {"train_loss": -26.98709487915039, "global_step": 467067, "epoch": 5627} {"train_loss": -27.436120986938477, "global_step": 467068, "epoch": 5627} {"train_loss": -26.852039337158203, "global_step": 467069, "epoch": 5627} {"train_loss": -27.28910255432129, "global_step": 467070, "epoch": 5627} {"train_loss": -27.30304527282715, "global_step": 467071, "epoch": 5627} {"train_loss": -26.938474655151367, "global_step": 467072, "epoch": 5627} {"train_loss": -26.940351486206055, "global_step": 467073, "epoch": 5627} {"train_loss": -26.9716854095459, "global_step": 467074, "epoch": 5627} {"train_loss": -27.036081314086914, "global_step": 467075, "epoch": 5627} {"train_loss": -27.019245147705078, "global_step": 467076, "epoch": 5627} {"train_loss": -27.588048934936523, "global_step": 467077, "epoch": 5627} {"train_loss": -27.0050048828125, "global_step": 467078, "epoch": 5627} {"train_loss": -27.134902954101562, "global_step": 467079, "epoch": 5627} {"train_loss": -27.271203994750977, "global_step": 467080, "epoch": 5627} {"train_loss": -27.10170555114746, "global_step": 467081, "epoch": 5627} {"train_loss": -27.256391525268555, "global_step": 467082, "epoch": 5627} {"train_loss": -27.3934326171875, "global_step": 467083, "epoch": 5627} {"train_loss": -27.22785758972168, "global_step": 467084, "epoch": 5627} {"train_loss": -26.749547958374023, "global_step": 467085, "epoch": 5627} {"train_loss": -26.931589126586914, "global_step": 467086, "epoch": 5627} {"train_loss": -27.095779418945312, "global_step": 467087, "epoch": 5627} {"train_loss": -26.958242416381836, "global_step": 467088, "epoch": 5627} {"train_loss": -27.445199966430664, "global_step": 467089, "epoch": 5627} {"train_loss": -26.9423828125, "global_step": 467090, "epoch": 5627} {"train_loss": -27.226972579956055, "global_step": 467091, "epoch": 5627} {"train_loss": -26.804792404174805, "global_step": 467092, "epoch": 5627} {"train_loss": -26.18086814880371, "global_step": 467093, "epoch": 5627} {"train_loss": -26.21490478515625, "global_step": 467094, "epoch": 5627} {"train_loss": -27.005102157592773, "global_step": 467095, "epoch": 5627} {"train_loss": -26.663114547729492, "global_step": 467096, "epoch": 5627} {"train_loss": -26.532251358032227, "global_step": 467097, "epoch": 5627} {"train_loss": -27.159820556640625, "global_step": 467098, "epoch": 5627} {"train_loss": -26.792844772338867, "global_step": 467099, "epoch": 5627} {"train_loss": -27.058027267456055, "global_step": 467100, "epoch": 5627} {"train_loss": -26.917621612548828, "global_step": 467101, "epoch": 5627} {"train_loss": -26.879688262939453, "global_step": 467102, "epoch": 5627} {"train_loss": -27.16412353515625, "global_step": 467103, "epoch": 5627} {"train_loss": -26.651578903198242, "global_step": 467104, "epoch": 5627} {"train_loss": -27.408842086791992, "global_step": 467105, "epoch": 5627} {"train_loss": -27.434925079345703, "global_step": 467106, "epoch": 5627} {"train_loss": -26.643354415893555, "global_step": 467107, "epoch": 5627} {"train_loss": -27.27032470703125, "global_step": 467108, "epoch": 5627} {"train_loss": -27.256872177124023, "global_step": 467109, "epoch": 5627} {"train_loss": -27.092138290405273, "global_step": 467110, "epoch": 5627} {"train_loss": -27.120813369750977, "global_step": 467111, "epoch": 5627} {"train_loss": -27.241565704345703, "global_step": 467112, "epoch": 5627} {"train_loss": -26.946802139282227, "global_step": 467113, "epoch": 5627} {"train_loss": -27.32480812072754, "global_step": 467114, "epoch": 5627} {"train_loss": -27.049413681030273, "global_step": 467115, "epoch": 5627} {"train_loss": -26.911787033081055, "global_step": 467116, "epoch": 5627} {"train_loss": -27.007055282592773, "global_step": 467117, "epoch": 5627} {"train_loss": -27.200275421142578, "global_step": 467118, "epoch": 5627} {"train_loss": -27.280054092407227, "global_step": 467119, "epoch": 5627} {"train_loss": -27.00725746154785, "global_step": 467120, "epoch": 5627} {"train_loss": -26.8255615234375, "global_step": 467121, "epoch": 5627} {"train_loss": -26.83159828186035, "global_step": 467122, "epoch": 5627} {"train_loss": -26.984523405511695, "global_step": 467123, "epoch": 5627, "val_loss": 6559417.0} {"train_loss": -27.1009578704834, "global_step": 467124, "epoch": 5628} {"train_loss": -26.874420166015625, "global_step": 467125, "epoch": 5628} {"train_loss": -26.561315536499023, "global_step": 467126, "epoch": 5628} {"train_loss": -27.008359909057617, "global_step": 467127, "epoch": 5628} {"train_loss": -27.106306076049805, "global_step": 467128, "epoch": 5628} {"train_loss": -26.52496910095215, "global_step": 467129, "epoch": 5628} {"train_loss": -26.826770782470703, "global_step": 467130, "epoch": 5628} {"train_loss": -26.702672958374023, "global_step": 467131, "epoch": 5628} {"train_loss": -27.0303955078125, "global_step": 467132, "epoch": 5628} {"train_loss": -27.469099044799805, "global_step": 467133, "epoch": 5628} {"train_loss": -27.09119987487793, "global_step": 467134, "epoch": 5628} {"train_loss": -26.442859649658203, "global_step": 467135, "epoch": 5628} {"train_loss": -27.410175323486328, "global_step": 467136, "epoch": 5628} {"train_loss": -27.324054718017578, "global_step": 467137, "epoch": 5628} {"train_loss": -27.10572624206543, "global_step": 467138, "epoch": 5628} {"train_loss": -27.304752349853516, "global_step": 467139, "epoch": 5628} {"train_loss": -27.143009185791016, "global_step": 467140, "epoch": 5628} {"train_loss": -26.9043025970459, "global_step": 467141, "epoch": 5628} {"train_loss": -27.220325469970703, "global_step": 467142, "epoch": 5628} {"train_loss": -26.946664810180664, "global_step": 467143, "epoch": 5628} {"train_loss": -27.178808212280273, "global_step": 467144, "epoch": 5628} {"train_loss": -27.27039909362793, "global_step": 467145, "epoch": 5628} {"train_loss": -27.410425186157227, "global_step": 467146, "epoch": 5628} {"train_loss": -27.0992374420166, "global_step": 467147, "epoch": 5628} {"train_loss": -26.912466049194336, "global_step": 467148, "epoch": 5628} {"train_loss": -27.446237564086914, "global_step": 467149, "epoch": 5628} {"train_loss": -26.971240997314453, "global_step": 467150, "epoch": 5628} {"train_loss": -27.2281551361084, "global_step": 467151, "epoch": 5628} {"train_loss": -27.45035743713379, "global_step": 467152, "epoch": 5628} {"train_loss": -26.994476318359375, "global_step": 467153, "epoch": 5628} {"train_loss": -27.277801513671875, "global_step": 467154, "epoch": 5628} {"train_loss": -27.231374740600586, "global_step": 467155, "epoch": 5628} {"train_loss": -26.90528678894043, "global_step": 467156, "epoch": 5628} {"train_loss": -27.056137084960938, "global_step": 467157, "epoch": 5628} {"train_loss": -27.227415084838867, "global_step": 467158, "epoch": 5628} {"train_loss": -26.92789077758789, "global_step": 467159, "epoch": 5628} {"train_loss": -27.017541885375977, "global_step": 467160, "epoch": 5628} {"train_loss": -27.2770938873291, "global_step": 467161, "epoch": 5628} {"train_loss": -26.83762550354004, "global_step": 467162, "epoch": 5628} {"train_loss": -26.39661979675293, "global_step": 467163, "epoch": 5628} {"train_loss": -27.050155639648438, "global_step": 467164, "epoch": 5628} {"train_loss": -27.18177604675293, "global_step": 467165, "epoch": 5628} {"train_loss": -27.025577545166016, "global_step": 467166, "epoch": 5628} {"train_loss": -27.20849609375, "global_step": 467167, "epoch": 5628} {"train_loss": -27.17994499206543, "global_step": 467168, "epoch": 5628} {"train_loss": -27.301252365112305, "global_step": 467169, "epoch": 5628} {"train_loss": -26.731063842773438, "global_step": 467170, "epoch": 5628} {"train_loss": -26.927106857299805, "global_step": 467171, "epoch": 5628} {"train_loss": -26.902099609375, "global_step": 467172, "epoch": 5628} {"train_loss": -27.031705856323242, "global_step": 467173, "epoch": 5628} {"train_loss": -26.970855712890625, "global_step": 467174, "epoch": 5628} {"train_loss": -27.3132381439209, "global_step": 467175, "epoch": 5628} {"train_loss": -26.9058895111084, "global_step": 467176, "epoch": 5628} {"train_loss": -27.350839614868164, "global_step": 467177, "epoch": 5628} {"train_loss": -26.89984130859375, "global_step": 467178, "epoch": 5628} {"train_loss": -27.50738525390625, "global_step": 467179, "epoch": 5628} {"train_loss": -26.605209350585938, "global_step": 467180, "epoch": 5628} {"train_loss": -27.57220458984375, "global_step": 467181, "epoch": 5628} {"train_loss": -27.210920333862305, "global_step": 467182, "epoch": 5628} {"train_loss": -26.936681747436523, "global_step": 467183, "epoch": 5628} {"train_loss": -27.158618927001953, "global_step": 467184, "epoch": 5628} {"train_loss": -27.26499366760254, "global_step": 467185, "epoch": 5628} {"train_loss": -27.2374267578125, "global_step": 467186, "epoch": 5628} {"train_loss": -27.26845359802246, "global_step": 467187, "epoch": 5628} {"train_loss": -27.33856773376465, "global_step": 467188, "epoch": 5628} {"train_loss": -27.376983642578125, "global_step": 467189, "epoch": 5628} {"train_loss": -27.483627319335938, "global_step": 467190, "epoch": 5628} {"train_loss": -27.361820220947266, "global_step": 467191, "epoch": 5628} {"train_loss": -27.383398056030273, "global_step": 467192, "epoch": 5628} {"train_loss": -27.410429000854492, "global_step": 467193, "epoch": 5628} {"train_loss": -27.119237899780273, "global_step": 467194, "epoch": 5628} {"train_loss": -27.22456932067871, "global_step": 467195, "epoch": 5628} {"train_loss": -25.9693603515625, "global_step": 467196, "epoch": 5628} {"train_loss": -25.520200729370117, "global_step": 467197, "epoch": 5628} {"train_loss": -24.068294525146484, "global_step": 467198, "epoch": 5628} {"train_loss": -24.32270622253418, "global_step": 467199, "epoch": 5628} {"train_loss": -26.6680965423584, "global_step": 467200, "epoch": 5628} {"train_loss": -24.9084415435791, "global_step": 467201, "epoch": 5628} {"train_loss": -25.648828506469727, "global_step": 467202, "epoch": 5628} {"train_loss": -25.660831451416016, "global_step": 467203, "epoch": 5628} {"train_loss": -26.121856689453125, "global_step": 467204, "epoch": 5628} {"train_loss": -26.46355628967285, "global_step": 467205, "epoch": 5628} {"train_loss": -26.894859382905157, "global_step": 467206, "epoch": 5628, "val_loss": 6446882.0} {"train_loss": -25.57538414001465, "global_step": 467207, "epoch": 5629} {"train_loss": -26.1141414642334, "global_step": 467208, "epoch": 5629} {"train_loss": -25.654829025268555, "global_step": 467209, "epoch": 5629} {"train_loss": -25.473207473754883, "global_step": 467210, "epoch": 5629} {"train_loss": -25.82736587524414, "global_step": 467211, "epoch": 5629} {"train_loss": -25.26349639892578, "global_step": 467212, "epoch": 5629} {"train_loss": -25.090621948242188, "global_step": 467213, "epoch": 5629} {"train_loss": -25.972858428955078, "global_step": 467214, "epoch": 5629} {"train_loss": -25.840383529663086, "global_step": 467215, "epoch": 5629} {"train_loss": -26.402435302734375, "global_step": 467216, "epoch": 5629} {"train_loss": -26.29534339904785, "global_step": 467217, "epoch": 5629} {"train_loss": -25.928466796875, "global_step": 467218, "epoch": 5629} {"train_loss": -25.678808212280273, "global_step": 467219, "epoch": 5629} {"train_loss": -26.370624542236328, "global_step": 467220, "epoch": 5629} {"train_loss": -26.2416934967041, "global_step": 467221, "epoch": 5629} {"train_loss": -26.69451332092285, "global_step": 467222, "epoch": 5629} {"train_loss": -26.1235408782959, "global_step": 467223, "epoch": 5629} {"train_loss": -26.662382125854492, "global_step": 467224, "epoch": 5629} {"train_loss": -26.495458602905273, "global_step": 467225, "epoch": 5629} {"train_loss": -26.56697654724121, "global_step": 467226, "epoch": 5629} {"train_loss": -26.5806827545166, "global_step": 467227, "epoch": 5629} {"train_loss": -26.4171199798584, "global_step": 467228, "epoch": 5629} {"train_loss": -26.340559005737305, "global_step": 467229, "epoch": 5629} {"train_loss": -26.453210830688477, "global_step": 467230, "epoch": 5629} {"train_loss": -26.423309326171875, "global_step": 467231, "epoch": 5629} {"train_loss": -26.58180046081543, "global_step": 467232, "epoch": 5629} {"train_loss": -26.57899284362793, "global_step": 467233, "epoch": 5629} {"train_loss": -26.658527374267578, "global_step": 467234, "epoch": 5629} {"train_loss": -27.06959342956543, "global_step": 467235, "epoch": 5629} {"train_loss": -26.603302001953125, "global_step": 467236, "epoch": 5629} {"train_loss": -26.770004272460938, "global_step": 467237, "epoch": 5629} {"train_loss": -26.9102783203125, "global_step": 467238, "epoch": 5629} {"train_loss": -26.735437393188477, "global_step": 467239, "epoch": 5629} {"train_loss": -26.710163116455078, "global_step": 467240, "epoch": 5629} {"train_loss": -26.8170223236084, "global_step": 467241, "epoch": 5629} {"train_loss": -26.842782974243164, "global_step": 467242, "epoch": 5629} {"train_loss": -26.77361488342285, "global_step": 467243, "epoch": 5629} {"train_loss": -27.13530921936035, "global_step": 467244, "epoch": 5629} {"train_loss": -27.16237449645996, "global_step": 467245, "epoch": 5629} {"train_loss": -27.192243576049805, "global_step": 467246, "epoch": 5629} {"train_loss": -27.165510177612305, "global_step": 467247, "epoch": 5629} {"train_loss": -26.857053756713867, "global_step": 467248, "epoch": 5629} {"train_loss": -27.09986686706543, "global_step": 467249, "epoch": 5629} {"train_loss": -27.3070011138916, "global_step": 467250, "epoch": 5629} {"train_loss": -27.0866641998291, "global_step": 467251, "epoch": 5629} {"train_loss": -27.134021759033203, "global_step": 467252, "epoch": 5629} {"train_loss": -27.155323028564453, "global_step": 467253, "epoch": 5629} {"train_loss": -26.940343856811523, "global_step": 467254, "epoch": 5629} {"train_loss": -27.023990631103516, "global_step": 467255, "epoch": 5629} {"train_loss": -26.740951538085938, "global_step": 467256, "epoch": 5629} {"train_loss": -27.056350708007812, "global_step": 467257, "epoch": 5629} {"train_loss": -26.92683219909668, "global_step": 467258, "epoch": 5629} {"train_loss": -26.803720474243164, "global_step": 467259, "epoch": 5629} {"train_loss": -27.31890296936035, "global_step": 467260, "epoch": 5629} {"train_loss": -27.178586959838867, "global_step": 467261, "epoch": 5629} {"train_loss": -27.158288955688477, "global_step": 467262, "epoch": 5629} {"train_loss": -26.795806884765625, "global_step": 467263, "epoch": 5629} {"train_loss": -27.60407829284668, "global_step": 467264, "epoch": 5629} {"train_loss": -27.282516479492188, "global_step": 467265, "epoch": 5629} {"train_loss": -27.0567684173584, "global_step": 467266, "epoch": 5629} {"train_loss": -27.106557846069336, "global_step": 467267, "epoch": 5629} {"train_loss": -26.987995147705078, "global_step": 467268, "epoch": 5629} {"train_loss": -26.87613868713379, "global_step": 467269, "epoch": 5629} {"train_loss": -27.196746826171875, "global_step": 467270, "epoch": 5629} {"train_loss": -26.8900089263916, "global_step": 467271, "epoch": 5629} {"train_loss": -27.193098068237305, "global_step": 467272, "epoch": 5629} {"train_loss": -27.040267944335938, "global_step": 467273, "epoch": 5629} {"train_loss": -27.09697914123535, "global_step": 467274, "epoch": 5629} {"train_loss": -27.2115478515625, "global_step": 467275, "epoch": 5629} {"train_loss": -27.136016845703125, "global_step": 467276, "epoch": 5629} {"train_loss": -27.070209503173828, "global_step": 467277, "epoch": 5629} {"train_loss": -27.105905532836914, "global_step": 467278, "epoch": 5629} {"train_loss": -27.355772018432617, "global_step": 467279, "epoch": 5629} {"train_loss": -27.449600219726562, "global_step": 467280, "epoch": 5629} {"train_loss": -27.535608291625977, "global_step": 467281, "epoch": 5629} {"train_loss": -27.641143798828125, "global_step": 467282, "epoch": 5629} {"train_loss": -27.24773597717285, "global_step": 467283, "epoch": 5629} {"train_loss": -26.9024715423584, "global_step": 467284, "epoch": 5629} {"train_loss": -27.344680786132812, "global_step": 467285, "epoch": 5629} {"train_loss": -27.19793701171875, "global_step": 467286, "epoch": 5629} {"train_loss": -27.4753360748291, "global_step": 467287, "epoch": 5629} {"train_loss": -27.200620651245117, "global_step": 467288, "epoch": 5629} {"train_loss": -26.779657731573266, "global_step": 467289, "epoch": 5629, "val_loss": 6496960.0} {"train_loss": -26.98245620727539, "global_step": 467290, "epoch": 5630} {"train_loss": -26.845163345336914, "global_step": 467291, "epoch": 5630} {"train_loss": -26.6889705657959, "global_step": 467292, "epoch": 5630} {"train_loss": -26.58819007873535, "global_step": 467293, "epoch": 5630} {"train_loss": -26.72016716003418, "global_step": 467294, "epoch": 5630} {"train_loss": -26.868331909179688, "global_step": 467295, "epoch": 5630} {"train_loss": -26.36543846130371, "global_step": 467296, "epoch": 5630} {"train_loss": -26.43505859375, "global_step": 467297, "epoch": 5630} {"train_loss": -26.2935791015625, "global_step": 467298, "epoch": 5630} {"train_loss": -26.225971221923828, "global_step": 467299, "epoch": 5630} {"train_loss": -26.769262313842773, "global_step": 467300, "epoch": 5630} {"train_loss": -26.710596084594727, "global_step": 467301, "epoch": 5630} {"train_loss": -26.686725616455078, "global_step": 467302, "epoch": 5630} {"train_loss": -26.640851974487305, "global_step": 467303, "epoch": 5630} {"train_loss": -26.879108428955078, "global_step": 467304, "epoch": 5630} {"train_loss": -27.04450798034668, "global_step": 467305, "epoch": 5630} {"train_loss": -27.0543270111084, "global_step": 467306, "epoch": 5630} {"train_loss": -27.234216690063477, "global_step": 467307, "epoch": 5630} {"train_loss": -26.98772621154785, "global_step": 467308, "epoch": 5630} {"train_loss": -27.18271827697754, "global_step": 467309, "epoch": 5630} {"train_loss": -27.006256103515625, "global_step": 467310, "epoch": 5630} {"train_loss": -27.455402374267578, "global_step": 467311, "epoch": 5630} {"train_loss": -27.5743350982666, "global_step": 467312, "epoch": 5630} {"train_loss": -27.05517578125, "global_step": 467313, "epoch": 5630} {"train_loss": -27.440082550048828, "global_step": 467314, "epoch": 5630} {"train_loss": -26.963300704956055, "global_step": 467315, "epoch": 5630} {"train_loss": -27.381513595581055, "global_step": 467316, "epoch": 5630} {"train_loss": -26.90122413635254, "global_step": 467317, "epoch": 5630} {"train_loss": -27.190753936767578, "global_step": 467318, "epoch": 5630} {"train_loss": -26.922040939331055, "global_step": 467319, "epoch": 5630} {"train_loss": -27.28777503967285, "global_step": 467320, "epoch": 5630} {"train_loss": -27.276870727539062, "global_step": 467321, "epoch": 5630} {"train_loss": -26.8243465423584, "global_step": 467322, "epoch": 5630} {"train_loss": -27.08241081237793, "global_step": 467323, "epoch": 5630} {"train_loss": -27.111465454101562, "global_step": 467324, "epoch": 5630} {"train_loss": -27.452484130859375, "global_step": 467325, "epoch": 5630} {"train_loss": -27.10589599609375, "global_step": 467326, "epoch": 5630} {"train_loss": -27.337055206298828, "global_step": 467327, "epoch": 5630} {"train_loss": -27.12175941467285, "global_step": 467328, "epoch": 5630} {"train_loss": -26.858051300048828, "global_step": 467329, "epoch": 5630} {"train_loss": -26.981420516967773, "global_step": 467330, "epoch": 5630} {"train_loss": -26.83575439453125, "global_step": 467331, "epoch": 5630} {"train_loss": -26.786169052124023, "global_step": 467332, "epoch": 5630} {"train_loss": -25.886322021484375, "global_step": 467333, "epoch": 5630} {"train_loss": -26.707746505737305, "global_step": 467334, "epoch": 5630} {"train_loss": -27.0706729888916, "global_step": 467335, "epoch": 5630} {"train_loss": -27.040740966796875, "global_step": 467336, "epoch": 5630} {"train_loss": -26.63360023498535, "global_step": 467337, "epoch": 5630} {"train_loss": -27.010547637939453, "global_step": 467338, "epoch": 5630} {"train_loss": -26.831653594970703, "global_step": 467339, "epoch": 5630} {"train_loss": -26.936731338500977, "global_step": 467340, "epoch": 5630} {"train_loss": -27.096038818359375, "global_step": 467341, "epoch": 5630} {"train_loss": -27.064313888549805, "global_step": 467342, "epoch": 5630} {"train_loss": -26.957998275756836, "global_step": 467343, "epoch": 5630} {"train_loss": -27.05829429626465, "global_step": 467344, "epoch": 5630} {"train_loss": -27.35981559753418, "global_step": 467345, "epoch": 5630} {"train_loss": -26.88657569885254, "global_step": 467346, "epoch": 5630} {"train_loss": -26.927213668823242, "global_step": 467347, "epoch": 5630} {"train_loss": -26.832324981689453, "global_step": 467348, "epoch": 5630} {"train_loss": -27.163654327392578, "global_step": 467349, "epoch": 5630} {"train_loss": -27.198720932006836, "global_step": 467350, "epoch": 5630} {"train_loss": -27.055994033813477, "global_step": 467351, "epoch": 5630} {"train_loss": -27.08436393737793, "global_step": 467352, "epoch": 5630} {"train_loss": -26.6763973236084, "global_step": 467353, "epoch": 5630} {"train_loss": -26.88465690612793, "global_step": 467354, "epoch": 5630} {"train_loss": -27.350799560546875, "global_step": 467355, "epoch": 5630} {"train_loss": -27.200366973876953, "global_step": 467356, "epoch": 5630} {"train_loss": -27.029096603393555, "global_step": 467357, "epoch": 5630} {"train_loss": -26.9038143157959, "global_step": 467358, "epoch": 5630} {"train_loss": -27.117887496948242, "global_step": 467359, "epoch": 5630} {"train_loss": -27.157119750976562, "global_step": 467360, "epoch": 5630} {"train_loss": -27.161664962768555, "global_step": 467361, "epoch": 5630} {"train_loss": -27.09120750427246, "global_step": 467362, "epoch": 5630} {"train_loss": -27.10320472717285, "global_step": 467363, "epoch": 5630} {"train_loss": -27.398080825805664, "global_step": 467364, "epoch": 5630} {"train_loss": -27.44087028503418, "global_step": 467365, "epoch": 5630} {"train_loss": -27.183059692382812, "global_step": 467366, "epoch": 5630} {"train_loss": -27.52311134338379, "global_step": 467367, "epoch": 5630} {"train_loss": -27.25071144104004, "global_step": 467368, "epoch": 5630} {"train_loss": -27.517637252807617, "global_step": 467369, "epoch": 5630} {"train_loss": -27.043798446655273, "global_step": 467370, "epoch": 5630} {"train_loss": -27.085432052612305, "global_step": 467371, "epoch": 5630} {"train_loss": -26.992961791624506, "global_step": 467372, "epoch": 5630, "val_loss": 6462405.5} {"train_loss": -27.2216796875, "global_step": 467373, "epoch": 5631} {"train_loss": -26.899658203125, "global_step": 467374, "epoch": 5631} {"train_loss": -26.70686149597168, "global_step": 467375, "epoch": 5631} {"train_loss": -26.97854995727539, "global_step": 467376, "epoch": 5631} {"train_loss": -27.0908145904541, "global_step": 467377, "epoch": 5631} {"train_loss": -27.060260772705078, "global_step": 467378, "epoch": 5631} {"train_loss": -27.08221435546875, "global_step": 467379, "epoch": 5631} {"train_loss": -27.131391525268555, "global_step": 467380, "epoch": 5631} {"train_loss": -27.024585723876953, "global_step": 467381, "epoch": 5631} {"train_loss": -27.096420288085938, "global_step": 467382, "epoch": 5631} {"train_loss": -27.252283096313477, "global_step": 467383, "epoch": 5631} {"train_loss": -27.545917510986328, "global_step": 467384, "epoch": 5631} {"train_loss": -27.308191299438477, "global_step": 467385, "epoch": 5631} {"train_loss": -27.2109375, "global_step": 467386, "epoch": 5631} {"train_loss": -27.183073043823242, "global_step": 467387, "epoch": 5631} {"train_loss": -27.131261825561523, "global_step": 467388, "epoch": 5631} {"train_loss": -27.370031356811523, "global_step": 467389, "epoch": 5631} {"train_loss": -27.564285278320312, "global_step": 467390, "epoch": 5631} {"train_loss": -27.75937271118164, "global_step": 467391, "epoch": 5631} {"train_loss": -27.274280548095703, "global_step": 467392, "epoch": 5631} {"train_loss": -27.206501007080078, "global_step": 467393, "epoch": 5631} {"train_loss": -27.65839195251465, "global_step": 467394, "epoch": 5631} {"train_loss": -27.113706588745117, "global_step": 467395, "epoch": 5631} {"train_loss": -27.16206932067871, "global_step": 467396, "epoch": 5631} {"train_loss": -27.315814971923828, "global_step": 467397, "epoch": 5631} {"train_loss": -27.439672470092773, "global_step": 467398, "epoch": 5631} {"train_loss": -27.052978515625, "global_step": 467399, "epoch": 5631} {"train_loss": -27.352514266967773, "global_step": 467400, "epoch": 5631} {"train_loss": -26.782541275024414, "global_step": 467401, "epoch": 5631} {"train_loss": -27.217309951782227, "global_step": 467402, "epoch": 5631} {"train_loss": -27.49714469909668, "global_step": 467403, "epoch": 5631} {"train_loss": -27.37818717956543, "global_step": 467404, "epoch": 5631} {"train_loss": -27.1977596282959, "global_step": 467405, "epoch": 5631} {"train_loss": -27.28804588317871, "global_step": 467406, "epoch": 5631} {"train_loss": -27.127552032470703, "global_step": 467407, "epoch": 5631} {"train_loss": -26.109542846679688, "global_step": 467408, "epoch": 5631} {"train_loss": -26.3004150390625, "global_step": 467409, "epoch": 5631} {"train_loss": -26.014917373657227, "global_step": 467410, "epoch": 5631} {"train_loss": -27.09515953063965, "global_step": 467411, "epoch": 5631} {"train_loss": -26.718414306640625, "global_step": 467412, "epoch": 5631} {"train_loss": -26.665464401245117, "global_step": 467413, "epoch": 5631} {"train_loss": -26.749927520751953, "global_step": 467414, "epoch": 5631} {"train_loss": -26.96109962463379, "global_step": 467415, "epoch": 5631} {"train_loss": -26.794605255126953, "global_step": 467416, "epoch": 5631} {"train_loss": -26.805423736572266, "global_step": 467417, "epoch": 5631} {"train_loss": -26.976240158081055, "global_step": 467418, "epoch": 5631} {"train_loss": -27.121566772460938, "global_step": 467419, "epoch": 5631} {"train_loss": -26.88789176940918, "global_step": 467420, "epoch": 5631} {"train_loss": -26.948715209960938, "global_step": 467421, "epoch": 5631} {"train_loss": -27.047353744506836, "global_step": 467422, "epoch": 5631} {"train_loss": -27.14375114440918, "global_step": 467423, "epoch": 5631} {"train_loss": -27.08062171936035, "global_step": 467424, "epoch": 5631} {"train_loss": -26.84815788269043, "global_step": 467425, "epoch": 5631} {"train_loss": -26.866052627563477, "global_step": 467426, "epoch": 5631} {"train_loss": -27.31089210510254, "global_step": 467427, "epoch": 5631} {"train_loss": -27.007095336914062, "global_step": 467428, "epoch": 5631} {"train_loss": -27.11264991760254, "global_step": 467429, "epoch": 5631} {"train_loss": -26.931665420532227, "global_step": 467430, "epoch": 5631} {"train_loss": -27.216211318969727, "global_step": 467431, "epoch": 5631} {"train_loss": -27.32648277282715, "global_step": 467432, "epoch": 5631} {"train_loss": -27.331634521484375, "global_step": 467433, "epoch": 5631} {"train_loss": -27.312030792236328, "global_step": 467434, "epoch": 5631} {"train_loss": -27.11777114868164, "global_step": 467435, "epoch": 5631} {"train_loss": -27.322357177734375, "global_step": 467436, "epoch": 5631} {"train_loss": -27.189777374267578, "global_step": 467437, "epoch": 5631} {"train_loss": -26.964101791381836, "global_step": 467438, "epoch": 5631} {"train_loss": -27.230024337768555, "global_step": 467439, "epoch": 5631} {"train_loss": -27.245391845703125, "global_step": 467440, "epoch": 5631} {"train_loss": -27.346210479736328, "global_step": 467441, "epoch": 5631} {"train_loss": -27.48603630065918, "global_step": 467442, "epoch": 5631} {"train_loss": -27.8206844329834, "global_step": 467443, "epoch": 5631} {"train_loss": -27.18994140625, "global_step": 467444, "epoch": 5631} {"train_loss": -27.1578369140625, "global_step": 467445, "epoch": 5631} {"train_loss": -27.297658920288086, "global_step": 467446, "epoch": 5631} {"train_loss": -26.881330490112305, "global_step": 467447, "epoch": 5631} {"train_loss": -27.269811630249023, "global_step": 467448, "epoch": 5631} {"train_loss": -27.408100128173828, "global_step": 467449, "epoch": 5631} {"train_loss": -27.367877960205078, "global_step": 467450, "epoch": 5631} {"train_loss": -27.283218383789062, "global_step": 467451, "epoch": 5631} {"train_loss": -26.783517837524414, "global_step": 467452, "epoch": 5631} {"train_loss": -27.399280548095703, "global_step": 467453, "epoch": 5631} {"train_loss": -27.21233558654785, "global_step": 467454, "epoch": 5631} {"train_loss": -27.11732062374253, "global_step": 467455, "epoch": 5631, "val_loss": 6456472.0} {"train_loss": -26.728662490844727, "global_step": 467456, "epoch": 5632} {"train_loss": -26.646915435791016, "global_step": 467457, "epoch": 5632} {"train_loss": -26.974124908447266, "global_step": 467458, "epoch": 5632} {"train_loss": -26.705617904663086, "global_step": 467459, "epoch": 5632} {"train_loss": -26.472858428955078, "global_step": 467460, "epoch": 5632} {"train_loss": -27.000141143798828, "global_step": 467461, "epoch": 5632} {"train_loss": -27.35847282409668, "global_step": 467462, "epoch": 5632} {"train_loss": -26.961286544799805, "global_step": 467463, "epoch": 5632} {"train_loss": -27.110645294189453, "global_step": 467464, "epoch": 5632} {"train_loss": -26.726282119750977, "global_step": 467465, "epoch": 5632} {"train_loss": -27.006006240844727, "global_step": 467466, "epoch": 5632} {"train_loss": -27.09734535217285, "global_step": 467467, "epoch": 5632} {"train_loss": -26.423343658447266, "global_step": 467468, "epoch": 5632} {"train_loss": -26.966684341430664, "global_step": 467469, "epoch": 5632} {"train_loss": -26.9899845123291, "global_step": 467470, "epoch": 5632} {"train_loss": -26.54931640625, "global_step": 467471, "epoch": 5632} {"train_loss": -26.754087448120117, "global_step": 467472, "epoch": 5632} {"train_loss": -27.048452377319336, "global_step": 467473, "epoch": 5632} {"train_loss": -26.542158126831055, "global_step": 467474, "epoch": 5632} {"train_loss": -26.6585693359375, "global_step": 467475, "epoch": 5632} {"train_loss": -26.63431739807129, "global_step": 467476, "epoch": 5632} {"train_loss": -26.81330680847168, "global_step": 467477, "epoch": 5632} {"train_loss": -26.51896095275879, "global_step": 467478, "epoch": 5632} {"train_loss": -26.75587272644043, "global_step": 467479, "epoch": 5632} {"train_loss": -26.810956954956055, "global_step": 467480, "epoch": 5632} {"train_loss": -26.932966232299805, "global_step": 467481, "epoch": 5632} {"train_loss": -27.267248153686523, "global_step": 467482, "epoch": 5632} {"train_loss": -27.129230499267578, "global_step": 467483, "epoch": 5632} {"train_loss": -27.11318016052246, "global_step": 467484, "epoch": 5632} {"train_loss": -27.106414794921875, "global_step": 467485, "epoch": 5632} {"train_loss": -27.268497467041016, "global_step": 467486, "epoch": 5632} {"train_loss": -27.07246971130371, "global_step": 467487, "epoch": 5632} {"train_loss": -27.17573356628418, "global_step": 467488, "epoch": 5632} {"train_loss": -27.0855770111084, "global_step": 467489, "epoch": 5632} {"train_loss": -27.180261611938477, "global_step": 467490, "epoch": 5632} {"train_loss": -27.378021240234375, "global_step": 467491, "epoch": 5632} {"train_loss": -26.93828773498535, "global_step": 467492, "epoch": 5632} {"train_loss": -27.305997848510742, "global_step": 467493, "epoch": 5632} {"train_loss": -27.0083065032959, "global_step": 467494, "epoch": 5632} {"train_loss": -27.4409122467041, "global_step": 467495, "epoch": 5632} {"train_loss": -27.024648666381836, "global_step": 467496, "epoch": 5632} {"train_loss": -27.10831642150879, "global_step": 467497, "epoch": 5632} {"train_loss": -27.416595458984375, "global_step": 467498, "epoch": 5632} {"train_loss": -27.219379425048828, "global_step": 467499, "epoch": 5632} {"train_loss": -27.365636825561523, "global_step": 467500, "epoch": 5632} {"train_loss": -27.47686195373535, "global_step": 467501, "epoch": 5632} {"train_loss": -27.300567626953125, "global_step": 467502, "epoch": 5632} {"train_loss": -27.233423233032227, "global_step": 467503, "epoch": 5632} {"train_loss": -27.52349853515625, "global_step": 467504, "epoch": 5632} {"train_loss": -27.356098175048828, "global_step": 467505, "epoch": 5632} {"train_loss": -27.194522857666016, "global_step": 467506, "epoch": 5632} {"train_loss": -27.432159423828125, "global_step": 467507, "epoch": 5632} {"train_loss": -27.56386375427246, "global_step": 467508, "epoch": 5632} {"train_loss": -27.654525756835938, "global_step": 467509, "epoch": 5632} {"train_loss": -26.93855094909668, "global_step": 467510, "epoch": 5632} {"train_loss": -27.4619083404541, "global_step": 467511, "epoch": 5632} {"train_loss": -27.35259437561035, "global_step": 467512, "epoch": 5632} {"train_loss": -27.45037841796875, "global_step": 467513, "epoch": 5632} {"train_loss": -27.16472816467285, "global_step": 467514, "epoch": 5632} {"train_loss": -27.3237361907959, "global_step": 467515, "epoch": 5632} {"train_loss": -27.01091957092285, "global_step": 467516, "epoch": 5632} {"train_loss": -27.319137573242188, "global_step": 467517, "epoch": 5632} {"train_loss": -27.566497802734375, "global_step": 467518, "epoch": 5632} {"train_loss": -27.346811294555664, "global_step": 467519, "epoch": 5632} {"train_loss": -27.455556869506836, "global_step": 467520, "epoch": 5632} {"train_loss": -27.002277374267578, "global_step": 467521, "epoch": 5632} {"train_loss": -27.259933471679688, "global_step": 467522, "epoch": 5632} {"train_loss": -27.023284912109375, "global_step": 467523, "epoch": 5632} {"train_loss": -26.935352325439453, "global_step": 467524, "epoch": 5632} {"train_loss": -26.95179557800293, "global_step": 467525, "epoch": 5632} {"train_loss": -27.356924057006836, "global_step": 467526, "epoch": 5632} {"train_loss": -26.94989013671875, "global_step": 467527, "epoch": 5632} {"train_loss": -27.21271324157715, "global_step": 467528, "epoch": 5632} {"train_loss": -26.96256446838379, "global_step": 467529, "epoch": 5632} {"train_loss": -27.355222702026367, "global_step": 467530, "epoch": 5632} {"train_loss": -27.24112892150879, "global_step": 467531, "epoch": 5632} {"train_loss": -27.003156661987305, "global_step": 467532, "epoch": 5632} {"train_loss": -27.048547744750977, "global_step": 467533, "epoch": 5632} {"train_loss": -26.798620223999023, "global_step": 467534, "epoch": 5632} {"train_loss": -27.252832412719727, "global_step": 467535, "epoch": 5632} {"train_loss": -27.103778839111328, "global_step": 467536, "epoch": 5632} {"train_loss": -26.832956314086914, "global_step": 467537, "epoch": 5632} {"train_loss": -27.10520424900285, "global_step": 467538, "epoch": 5632, "val_loss": 6521147.0} {"train_loss": -26.223119735717773, "global_step": 467539, "epoch": 5633} {"train_loss": -26.342456817626953, "global_step": 467540, "epoch": 5633} {"train_loss": -25.973011016845703, "global_step": 467541, "epoch": 5633} {"train_loss": -26.60500144958496, "global_step": 467542, "epoch": 5633} {"train_loss": -26.60024070739746, "global_step": 467543, "epoch": 5633} {"train_loss": -26.8175048828125, "global_step": 467544, "epoch": 5633} {"train_loss": -26.47075843811035, "global_step": 467545, "epoch": 5633} {"train_loss": -26.428434371948242, "global_step": 467546, "epoch": 5633} {"train_loss": -27.01593589782715, "global_step": 467547, "epoch": 5633} {"train_loss": -26.838851928710938, "global_step": 467548, "epoch": 5633} {"train_loss": -26.564910888671875, "global_step": 467549, "epoch": 5633} {"train_loss": -26.572406768798828, "global_step": 467550, "epoch": 5633} {"train_loss": -27.0949649810791, "global_step": 467551, "epoch": 5633} {"train_loss": -26.1059513092041, "global_step": 467552, "epoch": 5633} {"train_loss": -26.826370239257812, "global_step": 467553, "epoch": 5633} {"train_loss": -27.195852279663086, "global_step": 467554, "epoch": 5633} {"train_loss": -26.680830001831055, "global_step": 467555, "epoch": 5633} {"train_loss": -26.910703659057617, "global_step": 467556, "epoch": 5633} {"train_loss": -27.0192928314209, "global_step": 467557, "epoch": 5633} {"train_loss": -27.327070236206055, "global_step": 467558, "epoch": 5633} {"train_loss": -27.172760009765625, "global_step": 467559, "epoch": 5633} {"train_loss": -27.293354034423828, "global_step": 467560, "epoch": 5633} {"train_loss": -26.97101402282715, "global_step": 467561, "epoch": 5633} {"train_loss": -27.125864028930664, "global_step": 467562, "epoch": 5633} {"train_loss": -27.187747955322266, "global_step": 467563, "epoch": 5633} {"train_loss": -26.75144386291504, "global_step": 467564, "epoch": 5633} {"train_loss": -27.03508949279785, "global_step": 467565, "epoch": 5633} {"train_loss": -27.234174728393555, "global_step": 467566, "epoch": 5633} {"train_loss": -27.179601669311523, "global_step": 467567, "epoch": 5633} {"train_loss": -27.0827693939209, "global_step": 467568, "epoch": 5633} {"train_loss": -27.27363395690918, "global_step": 467569, "epoch": 5633} {"train_loss": -27.15955924987793, "global_step": 467570, "epoch": 5633} {"train_loss": -27.29166603088379, "global_step": 467571, "epoch": 5633} {"train_loss": -27.233617782592773, "global_step": 467572, "epoch": 5633} {"train_loss": -27.276142120361328, "global_step": 467573, "epoch": 5633} {"train_loss": -27.05633544921875, "global_step": 467574, "epoch": 5633} {"train_loss": -27.213592529296875, "global_step": 467575, "epoch": 5633} {"train_loss": -27.250431060791016, "global_step": 467576, "epoch": 5633} {"train_loss": -27.45315933227539, "global_step": 467577, "epoch": 5633} {"train_loss": -26.8839054107666, "global_step": 467578, "epoch": 5633} {"train_loss": -27.186939239501953, "global_step": 467579, "epoch": 5633} {"train_loss": -26.9151611328125, "global_step": 467580, "epoch": 5633} {"train_loss": -27.234893798828125, "global_step": 467581, "epoch": 5633} {"train_loss": -26.9342041015625, "global_step": 467582, "epoch": 5633} {"train_loss": -27.015527725219727, "global_step": 467583, "epoch": 5633} {"train_loss": -27.382190704345703, "global_step": 467584, "epoch": 5633} {"train_loss": -27.412694931030273, "global_step": 467585, "epoch": 5633} {"train_loss": -27.37152671813965, "global_step": 467586, "epoch": 5633} {"train_loss": -27.609241485595703, "global_step": 467587, "epoch": 5633} {"train_loss": -26.953466415405273, "global_step": 467588, "epoch": 5633} {"train_loss": -27.576648712158203, "global_step": 467589, "epoch": 5633} {"train_loss": -27.279926300048828, "global_step": 467590, "epoch": 5633} {"train_loss": -27.4742431640625, "global_step": 467591, "epoch": 5633} {"train_loss": -27.245267868041992, "global_step": 467592, "epoch": 5633} {"train_loss": -27.341537475585938, "global_step": 467593, "epoch": 5633} {"train_loss": -26.947574615478516, "global_step": 467594, "epoch": 5633} {"train_loss": -27.30121421813965, "global_step": 467595, "epoch": 5633} {"train_loss": -27.18257713317871, "global_step": 467596, "epoch": 5633} {"train_loss": -27.582971572875977, "global_step": 467597, "epoch": 5633} {"train_loss": -27.260665893554688, "global_step": 467598, "epoch": 5633} {"train_loss": -27.042226791381836, "global_step": 467599, "epoch": 5633} {"train_loss": -27.124658584594727, "global_step": 467600, "epoch": 5633} {"train_loss": -27.535058975219727, "global_step": 467601, "epoch": 5633} {"train_loss": -27.30450439453125, "global_step": 467602, "epoch": 5633} {"train_loss": -26.953149795532227, "global_step": 467603, "epoch": 5633} {"train_loss": -26.8785400390625, "global_step": 467604, "epoch": 5633} {"train_loss": -27.114370346069336, "global_step": 467605, "epoch": 5633} {"train_loss": -27.292816162109375, "global_step": 467606, "epoch": 5633} {"train_loss": -27.046436309814453, "global_step": 467607, "epoch": 5633} {"train_loss": -26.775068283081055, "global_step": 467608, "epoch": 5633} {"train_loss": -26.84087562561035, "global_step": 467609, "epoch": 5633} {"train_loss": -26.940113067626953, "global_step": 467610, "epoch": 5633} {"train_loss": -27.098876953125, "global_step": 467611, "epoch": 5633} {"train_loss": -27.096281051635742, "global_step": 467612, "epoch": 5633} {"train_loss": -26.9083309173584, "global_step": 467613, "epoch": 5633} {"train_loss": -26.71304702758789, "global_step": 467614, "epoch": 5633} {"train_loss": -27.04196548461914, "global_step": 467615, "epoch": 5633} {"train_loss": -27.118579864501953, "global_step": 467616, "epoch": 5633} {"train_loss": -26.49081802368164, "global_step": 467617, "epoch": 5633} {"train_loss": -26.420713424682617, "global_step": 467618, "epoch": 5633} {"train_loss": -26.56963539123535, "global_step": 467619, "epoch": 5633} {"train_loss": -27.103103637695312, "global_step": 467620, "epoch": 5633} {"train_loss": -27.017099679234516, "global_step": 467621, "epoch": 5633, "val_loss": 6446323.0} {"train_loss": -25.54859733581543, "global_step": 467622, "epoch": 5634} {"train_loss": -26.242938995361328, "global_step": 467623, "epoch": 5634} {"train_loss": -25.794225692749023, "global_step": 467624, "epoch": 5634} {"train_loss": -25.6097412109375, "global_step": 467625, "epoch": 5634} {"train_loss": -25.925748825073242, "global_step": 467626, "epoch": 5634} {"train_loss": -25.89737892150879, "global_step": 467627, "epoch": 5634} {"train_loss": -25.720197677612305, "global_step": 467628, "epoch": 5634} {"train_loss": -26.338979721069336, "global_step": 467629, "epoch": 5634} {"train_loss": -25.94254493713379, "global_step": 467630, "epoch": 5634} {"train_loss": -26.4608154296875, "global_step": 467631, "epoch": 5634} {"train_loss": -26.16193962097168, "global_step": 467632, "epoch": 5634} {"train_loss": -26.281335830688477, "global_step": 467633, "epoch": 5634} {"train_loss": -25.914289474487305, "global_step": 467634, "epoch": 5634} {"train_loss": -26.446624755859375, "global_step": 467635, "epoch": 5634} {"train_loss": -26.386388778686523, "global_step": 467636, "epoch": 5634} {"train_loss": -26.2380428314209, "global_step": 467637, "epoch": 5634} {"train_loss": -26.044103622436523, "global_step": 467638, "epoch": 5634} {"train_loss": -26.471044540405273, "global_step": 467639, "epoch": 5634} {"train_loss": -26.30234146118164, "global_step": 467640, "epoch": 5634} {"train_loss": -26.7570858001709, "global_step": 467641, "epoch": 5634} {"train_loss": -26.48484230041504, "global_step": 467642, "epoch": 5634} {"train_loss": -26.541400909423828, "global_step": 467643, "epoch": 5634} {"train_loss": -26.52625846862793, "global_step": 467644, "epoch": 5634} {"train_loss": -26.859272003173828, "global_step": 467645, "epoch": 5634} {"train_loss": -26.60626220703125, "global_step": 467646, "epoch": 5634} {"train_loss": -26.599767684936523, "global_step": 467647, "epoch": 5634} {"train_loss": -26.634204864501953, "global_step": 467648, "epoch": 5634} {"train_loss": -26.933950424194336, "global_step": 467649, "epoch": 5634} {"train_loss": -27.076452255249023, "global_step": 467650, "epoch": 5634} {"train_loss": -27.075428009033203, "global_step": 467651, "epoch": 5634} {"train_loss": -26.802566528320312, "global_step": 467652, "epoch": 5634} {"train_loss": -26.89630699157715, "global_step": 467653, "epoch": 5634} {"train_loss": -26.888763427734375, "global_step": 467654, "epoch": 5634} {"train_loss": -26.88675880432129, "global_step": 467655, "epoch": 5634} {"train_loss": -27.0009822845459, "global_step": 467656, "epoch": 5634} {"train_loss": -26.79843521118164, "global_step": 467657, "epoch": 5634} {"train_loss": -27.343774795532227, "global_step": 467658, "epoch": 5634} {"train_loss": -26.7188663482666, "global_step": 467659, "epoch": 5634} {"train_loss": -27.081960678100586, "global_step": 467660, "epoch": 5634} {"train_loss": -27.20136070251465, "global_step": 467661, "epoch": 5634} {"train_loss": -26.96270179748535, "global_step": 467662, "epoch": 5634} {"train_loss": -27.178983688354492, "global_step": 467663, "epoch": 5634} {"train_loss": -26.692914962768555, "global_step": 467664, "epoch": 5634} {"train_loss": -27.197629928588867, "global_step": 467665, "epoch": 5634} {"train_loss": -27.109588623046875, "global_step": 467666, "epoch": 5634} {"train_loss": -27.417266845703125, "global_step": 467667, "epoch": 5634} {"train_loss": -27.10857582092285, "global_step": 467668, "epoch": 5634} {"train_loss": -27.754846572875977, "global_step": 467669, "epoch": 5634} {"train_loss": -26.9533748626709, "global_step": 467670, "epoch": 5634} {"train_loss": -27.460102081298828, "global_step": 467671, "epoch": 5634} {"train_loss": -26.99236488342285, "global_step": 467672, "epoch": 5634} {"train_loss": -26.964338302612305, "global_step": 467673, "epoch": 5634} {"train_loss": -26.98196792602539, "global_step": 467674, "epoch": 5634} {"train_loss": -27.129465103149414, "global_step": 467675, "epoch": 5634} {"train_loss": -27.038904190063477, "global_step": 467676, "epoch": 5634} {"train_loss": -27.261661529541016, "global_step": 467677, "epoch": 5634} {"train_loss": -27.225858688354492, "global_step": 467678, "epoch": 5634} {"train_loss": -27.478681564331055, "global_step": 467679, "epoch": 5634} {"train_loss": -27.197607040405273, "global_step": 467680, "epoch": 5634} {"train_loss": -27.093210220336914, "global_step": 467681, "epoch": 5634} {"train_loss": -27.607202529907227, "global_step": 467682, "epoch": 5634} {"train_loss": -27.2047119140625, "global_step": 467683, "epoch": 5634} {"train_loss": -27.094877243041992, "global_step": 467684, "epoch": 5634} {"train_loss": -26.897241592407227, "global_step": 467685, "epoch": 5634} {"train_loss": -27.14979362487793, "global_step": 467686, "epoch": 5634} {"train_loss": -27.052831649780273, "global_step": 467687, "epoch": 5634} {"train_loss": -27.420124053955078, "global_step": 467688, "epoch": 5634} {"train_loss": -27.425983428955078, "global_step": 467689, "epoch": 5634} {"train_loss": -27.219314575195312, "global_step": 467690, "epoch": 5634} {"train_loss": -27.226516723632812, "global_step": 467691, "epoch": 5634} {"train_loss": -27.01727294921875, "global_step": 467692, "epoch": 5634} {"train_loss": -27.415023803710938, "global_step": 467693, "epoch": 5634} {"train_loss": -27.272083282470703, "global_step": 467694, "epoch": 5634} {"train_loss": -27.337894439697266, "global_step": 467695, "epoch": 5634} {"train_loss": -27.33578872680664, "global_step": 467696, "epoch": 5634} {"train_loss": -27.180160522460938, "global_step": 467697, "epoch": 5634} {"train_loss": -27.394811630249023, "global_step": 467698, "epoch": 5634} {"train_loss": -26.972614288330078, "global_step": 467699, "epoch": 5634} {"train_loss": -27.123315811157227, "global_step": 467700, "epoch": 5634} {"train_loss": -26.984949111938477, "global_step": 467701, "epoch": 5634} {"train_loss": -27.0440616607666, "global_step": 467702, "epoch": 5634} {"train_loss": -27.275609970092773, "global_step": 467703, "epoch": 5634} {"train_loss": -26.84168431845056, "global_step": 467704, "epoch": 5634, "val_loss": 6664503.0} {"train_loss": -25.93825340270996, "global_step": 467705, "epoch": 5635} {"train_loss": -24.94917869567871, "global_step": 467706, "epoch": 5635} {"train_loss": -25.271886825561523, "global_step": 467707, "epoch": 5635} {"train_loss": -26.509490966796875, "global_step": 467708, "epoch": 5635} {"train_loss": -26.562829971313477, "global_step": 467709, "epoch": 5635} {"train_loss": -25.849660873413086, "global_step": 467710, "epoch": 5635} {"train_loss": -26.365880966186523, "global_step": 467711, "epoch": 5635} {"train_loss": -26.571720123291016, "global_step": 467712, "epoch": 5635} {"train_loss": -26.606403350830078, "global_step": 467713, "epoch": 5635} {"train_loss": -26.41969108581543, "global_step": 467714, "epoch": 5635} {"train_loss": -26.265913009643555, "global_step": 467715, "epoch": 5635} {"train_loss": -26.75440788269043, "global_step": 467716, "epoch": 5635} {"train_loss": -26.61577796936035, "global_step": 467717, "epoch": 5635} {"train_loss": -26.907758712768555, "global_step": 467718, "epoch": 5635} {"train_loss": -26.51641273498535, "global_step": 467719, "epoch": 5635} {"train_loss": -26.969772338867188, "global_step": 467720, "epoch": 5635} {"train_loss": -26.940353393554688, "global_step": 467721, "epoch": 5635} {"train_loss": -26.879505157470703, "global_step": 467722, "epoch": 5635} {"train_loss": -26.869638442993164, "global_step": 467723, "epoch": 5635} {"train_loss": -26.72395133972168, "global_step": 467724, "epoch": 5635} {"train_loss": -26.76759147644043, "global_step": 467725, "epoch": 5635} {"train_loss": -26.787092208862305, "global_step": 467726, "epoch": 5635} {"train_loss": -26.77276611328125, "global_step": 467727, "epoch": 5635} {"train_loss": -27.01116943359375, "global_step": 467728, "epoch": 5635} {"train_loss": -27.237417221069336, "global_step": 467729, "epoch": 5635} {"train_loss": -26.85666847229004, "global_step": 467730, "epoch": 5635} {"train_loss": -27.0445556640625, "global_step": 467731, "epoch": 5635} {"train_loss": -26.886377334594727, "global_step": 467732, "epoch": 5635} {"train_loss": -27.152631759643555, "global_step": 467733, "epoch": 5635} {"train_loss": -26.949127197265625, "global_step": 467734, "epoch": 5635} {"train_loss": -27.44742202758789, "global_step": 467735, "epoch": 5635} {"train_loss": -27.22468376159668, "global_step": 467736, "epoch": 5635} {"train_loss": -26.94648551940918, "global_step": 467737, "epoch": 5635} {"train_loss": -27.30171012878418, "global_step": 467738, "epoch": 5635} {"train_loss": -27.061948776245117, "global_step": 467739, "epoch": 5635} {"train_loss": -27.706830978393555, "global_step": 467740, "epoch": 5635} {"train_loss": -27.375263214111328, "global_step": 467741, "epoch": 5635} {"train_loss": -26.855493545532227, "global_step": 467742, "epoch": 5635} {"train_loss": -27.310733795166016, "global_step": 467743, "epoch": 5635} {"train_loss": -27.070417404174805, "global_step": 467744, "epoch": 5635} {"train_loss": -27.15943717956543, "global_step": 467745, "epoch": 5635} {"train_loss": -27.467514038085938, "global_step": 467746, "epoch": 5635} {"train_loss": -27.09528923034668, "global_step": 467747, "epoch": 5635} {"train_loss": -27.302261352539062, "global_step": 467748, "epoch": 5635} {"train_loss": -26.891523361206055, "global_step": 467749, "epoch": 5635} {"train_loss": -27.364883422851562, "global_step": 467750, "epoch": 5635} {"train_loss": -27.161163330078125, "global_step": 467751, "epoch": 5635} {"train_loss": -27.108083724975586, "global_step": 467752, "epoch": 5635} {"train_loss": -27.499343872070312, "global_step": 467753, "epoch": 5635} {"train_loss": -27.12518882751465, "global_step": 467754, "epoch": 5635} {"train_loss": -27.304584503173828, "global_step": 467755, "epoch": 5635} {"train_loss": -27.742740631103516, "global_step": 467756, "epoch": 5635} {"train_loss": -27.38726806640625, "global_step": 467757, "epoch": 5635} {"train_loss": -27.038496017456055, "global_step": 467758, "epoch": 5635} {"train_loss": -27.064741134643555, "global_step": 467759, "epoch": 5635} {"train_loss": -27.057371139526367, "global_step": 467760, "epoch": 5635} {"train_loss": -27.287893295288086, "global_step": 467761, "epoch": 5635} {"train_loss": -26.819211959838867, "global_step": 467762, "epoch": 5635} {"train_loss": -26.811811447143555, "global_step": 467763, "epoch": 5635} {"train_loss": -27.060888290405273, "global_step": 467764, "epoch": 5635} {"train_loss": -26.845056533813477, "global_step": 467765, "epoch": 5635} {"train_loss": -27.257551193237305, "global_step": 467766, "epoch": 5635} {"train_loss": -27.362707138061523, "global_step": 467767, "epoch": 5635} {"train_loss": -27.06511878967285, "global_step": 467768, "epoch": 5635} {"train_loss": -27.088071823120117, "global_step": 467769, "epoch": 5635} {"train_loss": -27.428180694580078, "global_step": 467770, "epoch": 5635} {"train_loss": -27.39361572265625, "global_step": 467771, "epoch": 5635} {"train_loss": -27.63516616821289, "global_step": 467772, "epoch": 5635} {"train_loss": -27.33442497253418, "global_step": 467773, "epoch": 5635} {"train_loss": -27.230533599853516, "global_step": 467774, "epoch": 5635} {"train_loss": -27.234424591064453, "global_step": 467775, "epoch": 5635} {"train_loss": -27.313634872436523, "global_step": 467776, "epoch": 5635} {"train_loss": -27.592639923095703, "global_step": 467777, "epoch": 5635} {"train_loss": -27.315656661987305, "global_step": 467778, "epoch": 5635} {"train_loss": -27.265607833862305, "global_step": 467779, "epoch": 5635} {"train_loss": -27.425628662109375, "global_step": 467780, "epoch": 5635} {"train_loss": -27.2559814453125, "global_step": 467781, "epoch": 5635} {"train_loss": -27.453266143798828, "global_step": 467782, "epoch": 5635} {"train_loss": -27.447742462158203, "global_step": 467783, "epoch": 5635} {"train_loss": -27.430877685546875, "global_step": 467784, "epoch": 5635} {"train_loss": -27.263931274414062, "global_step": 467785, "epoch": 5635} {"train_loss": -27.372739791870117, "global_step": 467786, "epoch": 5635} {"train_loss": -27.00272463603192, "global_step": 467787, "epoch": 5635, "val_loss": 6578609.0} {"train_loss": -27.382766723632812, "global_step": 467788, "epoch": 5636} {"train_loss": -26.147130966186523, "global_step": 467789, "epoch": 5636} {"train_loss": -26.005918502807617, "global_step": 467790, "epoch": 5636} {"train_loss": -26.258344650268555, "global_step": 467791, "epoch": 5636} {"train_loss": -26.35261344909668, "global_step": 467792, "epoch": 5636} {"train_loss": -25.38669776916504, "global_step": 467793, "epoch": 5636} {"train_loss": -22.894224166870117, "global_step": 467794, "epoch": 5636} {"train_loss": -23.68625259399414, "global_step": 467795, "epoch": 5636} {"train_loss": -26.258014678955078, "global_step": 467796, "epoch": 5636} {"train_loss": -24.970251083374023, "global_step": 467797, "epoch": 5636} {"train_loss": -25.81495475769043, "global_step": 467798, "epoch": 5636} {"train_loss": -26.51837730407715, "global_step": 467799, "epoch": 5636} {"train_loss": -25.924365997314453, "global_step": 467800, "epoch": 5636} {"train_loss": -25.854902267456055, "global_step": 467801, "epoch": 5636} {"train_loss": -26.366308212280273, "global_step": 467802, "epoch": 5636} {"train_loss": -26.723556518554688, "global_step": 467803, "epoch": 5636} {"train_loss": -26.270551681518555, "global_step": 467804, "epoch": 5636} {"train_loss": -26.5622615814209, "global_step": 467805, "epoch": 5636} {"train_loss": -26.300268173217773, "global_step": 467806, "epoch": 5636} {"train_loss": -26.287214279174805, "global_step": 467807, "epoch": 5636} {"train_loss": -26.45039176940918, "global_step": 467808, "epoch": 5636} {"train_loss": -26.8502197265625, "global_step": 467809, "epoch": 5636} {"train_loss": -26.4476261138916, "global_step": 467810, "epoch": 5636} {"train_loss": -26.823373794555664, "global_step": 467811, "epoch": 5636} {"train_loss": -26.5311336517334, "global_step": 467812, "epoch": 5636} {"train_loss": -26.46268081665039, "global_step": 467813, "epoch": 5636} {"train_loss": -26.87091064453125, "global_step": 467814, "epoch": 5636} {"train_loss": -26.400196075439453, "global_step": 467815, "epoch": 5636} {"train_loss": -27.005704879760742, "global_step": 467816, "epoch": 5636} {"train_loss": -26.669397354125977, "global_step": 467817, "epoch": 5636} {"train_loss": -26.838459014892578, "global_step": 467818, "epoch": 5636} {"train_loss": -26.91986656188965, "global_step": 467819, "epoch": 5636} {"train_loss": -27.116565704345703, "global_step": 467820, "epoch": 5636} {"train_loss": -26.78863525390625, "global_step": 467821, "epoch": 5636} {"train_loss": -27.10504722595215, "global_step": 467822, "epoch": 5636} {"train_loss": -27.065649032592773, "global_step": 467823, "epoch": 5636} {"train_loss": -27.24057388305664, "global_step": 467824, "epoch": 5636} {"train_loss": -27.075891494750977, "global_step": 467825, "epoch": 5636} {"train_loss": -26.894132614135742, "global_step": 467826, "epoch": 5636} {"train_loss": -27.180908203125, "global_step": 467827, "epoch": 5636} {"train_loss": -26.9979248046875, "global_step": 467828, "epoch": 5636} {"train_loss": -26.878599166870117, "global_step": 467829, "epoch": 5636} {"train_loss": -27.291406631469727, "global_step": 467830, "epoch": 5636} {"train_loss": -26.91180419921875, "global_step": 467831, "epoch": 5636} {"train_loss": -27.19801139831543, "global_step": 467832, "epoch": 5636} {"train_loss": -27.127002716064453, "global_step": 467833, "epoch": 5636} {"train_loss": -27.3072452545166, "global_step": 467834, "epoch": 5636} {"train_loss": -27.03915786743164, "global_step": 467835, "epoch": 5636} {"train_loss": -27.17083740234375, "global_step": 467836, "epoch": 5636} {"train_loss": -27.054258346557617, "global_step": 467837, "epoch": 5636} {"train_loss": -27.425308227539062, "global_step": 467838, "epoch": 5636} {"train_loss": -27.586328506469727, "global_step": 467839, "epoch": 5636} {"train_loss": -27.126386642456055, "global_step": 467840, "epoch": 5636} {"train_loss": -27.268936157226562, "global_step": 467841, "epoch": 5636} {"train_loss": -27.492420196533203, "global_step": 467842, "epoch": 5636} {"train_loss": -27.243642807006836, "global_step": 467843, "epoch": 5636} {"train_loss": -27.124448776245117, "global_step": 467844, "epoch": 5636} {"train_loss": -27.538854598999023, "global_step": 467845, "epoch": 5636} {"train_loss": -27.08393669128418, "global_step": 467846, "epoch": 5636} {"train_loss": -27.28829002380371, "global_step": 467847, "epoch": 5636} {"train_loss": -27.417621612548828, "global_step": 467848, "epoch": 5636} {"train_loss": -27.281030654907227, "global_step": 467849, "epoch": 5636} {"train_loss": -27.34177017211914, "global_step": 467850, "epoch": 5636} {"train_loss": -27.54054069519043, "global_step": 467851, "epoch": 5636} {"train_loss": -27.35024070739746, "global_step": 467852, "epoch": 5636} {"train_loss": -27.329980850219727, "global_step": 467853, "epoch": 5636} {"train_loss": -27.45088005065918, "global_step": 467854, "epoch": 5636} {"train_loss": -27.022159576416016, "global_step": 467855, "epoch": 5636} {"train_loss": -26.842981338500977, "global_step": 467856, "epoch": 5636} {"train_loss": -26.81003761291504, "global_step": 467857, "epoch": 5636} {"train_loss": -27.294158935546875, "global_step": 467858, "epoch": 5636} {"train_loss": -27.431821823120117, "global_step": 467859, "epoch": 5636} {"train_loss": -27.168766021728516, "global_step": 467860, "epoch": 5636} {"train_loss": -27.509958267211914, "global_step": 467861, "epoch": 5636} {"train_loss": -26.890213012695312, "global_step": 467862, "epoch": 5636} {"train_loss": -26.8420467376709, "global_step": 467863, "epoch": 5636} {"train_loss": -26.962661743164062, "global_step": 467864, "epoch": 5636} {"train_loss": -26.5577392578125, "global_step": 467865, "epoch": 5636} {"train_loss": -26.80006217956543, "global_step": 467866, "epoch": 5636} {"train_loss": -27.18648338317871, "global_step": 467867, "epoch": 5636} {"train_loss": -26.868452072143555, "global_step": 467868, "epoch": 5636} {"train_loss": -27.057058334350586, "global_step": 467869, "epoch": 5636} {"train_loss": -26.77899783490652, "global_step": 467870, "epoch": 5636, "val_loss": 6666900.0} {"train_loss": -26.45172691345215, "global_step": 467871, "epoch": 5637} {"train_loss": -27.12493324279785, "global_step": 467872, "epoch": 5637} {"train_loss": -26.67609214782715, "global_step": 467873, "epoch": 5637} {"train_loss": -26.907367706298828, "global_step": 467874, "epoch": 5637} {"train_loss": -26.815244674682617, "global_step": 467875, "epoch": 5637} {"train_loss": -26.42438316345215, "global_step": 467876, "epoch": 5637} {"train_loss": -26.92188835144043, "global_step": 467877, "epoch": 5637} {"train_loss": -27.090734481811523, "global_step": 467878, "epoch": 5637} {"train_loss": -27.09346580505371, "global_step": 467879, "epoch": 5637} {"train_loss": -26.791492462158203, "global_step": 467880, "epoch": 5637} {"train_loss": -26.648778915405273, "global_step": 467881, "epoch": 5637} {"train_loss": -26.686050415039062, "global_step": 467882, "epoch": 5637} {"train_loss": -26.902875900268555, "global_step": 467883, "epoch": 5637} {"train_loss": -27.0114688873291, "global_step": 467884, "epoch": 5637} {"train_loss": -26.815155029296875, "global_step": 467885, "epoch": 5637} {"train_loss": -27.0211238861084, "global_step": 467886, "epoch": 5637} {"train_loss": -26.73499870300293, "global_step": 467887, "epoch": 5637} {"train_loss": -26.993270874023438, "global_step": 467888, "epoch": 5637} {"train_loss": -26.787189483642578, "global_step": 467889, "epoch": 5637} {"train_loss": -26.976537704467773, "global_step": 467890, "epoch": 5637} {"train_loss": -26.90240478515625, "global_step": 467891, "epoch": 5637} {"train_loss": -27.214765548706055, "global_step": 467892, "epoch": 5637} {"train_loss": -27.011249542236328, "global_step": 467893, "epoch": 5637} {"train_loss": -26.79656982421875, "global_step": 467894, "epoch": 5637} {"train_loss": -26.977558135986328, "global_step": 467895, "epoch": 5637} {"train_loss": -27.200946807861328, "global_step": 467896, "epoch": 5637} {"train_loss": -27.05964469909668, "global_step": 467897, "epoch": 5637} {"train_loss": -27.152225494384766, "global_step": 467898, "epoch": 5637} {"train_loss": -26.894739151000977, "global_step": 467899, "epoch": 5637} {"train_loss": -27.042144775390625, "global_step": 467900, "epoch": 5637} {"train_loss": -27.113483428955078, "global_step": 467901, "epoch": 5637} {"train_loss": -27.44547462463379, "global_step": 467902, "epoch": 5637} {"train_loss": -27.036649703979492, "global_step": 467903, "epoch": 5637} {"train_loss": -26.95501136779785, "global_step": 467904, "epoch": 5637} {"train_loss": -26.896696090698242, "global_step": 467905, "epoch": 5637} {"train_loss": -27.312610626220703, "global_step": 467906, "epoch": 5637} {"train_loss": -26.9379825592041, "global_step": 467907, "epoch": 5637} {"train_loss": -27.190235137939453, "global_step": 467908, "epoch": 5637} {"train_loss": -27.094701766967773, "global_step": 467909, "epoch": 5637} {"train_loss": -27.31410026550293, "global_step": 467910, "epoch": 5637} {"train_loss": -27.203821182250977, "global_step": 467911, "epoch": 5637} {"train_loss": -27.018203735351562, "global_step": 467912, "epoch": 5637} {"train_loss": -27.068756103515625, "global_step": 467913, "epoch": 5637} {"train_loss": -27.24199867248535, "global_step": 467914, "epoch": 5637} {"train_loss": -27.03389549255371, "global_step": 467915, "epoch": 5637} {"train_loss": -27.529890060424805, "global_step": 467916, "epoch": 5637} {"train_loss": -27.1491641998291, "global_step": 467917, "epoch": 5637} {"train_loss": -27.174169540405273, "global_step": 467918, "epoch": 5637} {"train_loss": -27.200489044189453, "global_step": 467919, "epoch": 5637} {"train_loss": -27.48621940612793, "global_step": 467920, "epoch": 5637} {"train_loss": -27.291608810424805, "global_step": 467921, "epoch": 5637} {"train_loss": -27.29022216796875, "global_step": 467922, "epoch": 5637} {"train_loss": -27.400222778320312, "global_step": 467923, "epoch": 5637} {"train_loss": -27.295703887939453, "global_step": 467924, "epoch": 5637} {"train_loss": -26.581409454345703, "global_step": 467925, "epoch": 5637} {"train_loss": -26.705846786499023, "global_step": 467926, "epoch": 5637} {"train_loss": -25.92083168029785, "global_step": 467927, "epoch": 5637} {"train_loss": -26.806289672851562, "global_step": 467928, "epoch": 5637} {"train_loss": -27.562414169311523, "global_step": 467929, "epoch": 5637} {"train_loss": -26.512039184570312, "global_step": 467930, "epoch": 5637} {"train_loss": -27.0900821685791, "global_step": 467931, "epoch": 5637} {"train_loss": -26.837549209594727, "global_step": 467932, "epoch": 5637} {"train_loss": -27.466413497924805, "global_step": 467933, "epoch": 5637} {"train_loss": -27.106672286987305, "global_step": 467934, "epoch": 5637} {"train_loss": -27.295886993408203, "global_step": 467935, "epoch": 5637} {"train_loss": -27.06207275390625, "global_step": 467936, "epoch": 5637} {"train_loss": -27.137399673461914, "global_step": 467937, "epoch": 5637} {"train_loss": -26.972518920898438, "global_step": 467938, "epoch": 5637} {"train_loss": -27.273862838745117, "global_step": 467939, "epoch": 5637} {"train_loss": -27.204242706298828, "global_step": 467940, "epoch": 5637} {"train_loss": -27.039777755737305, "global_step": 467941, "epoch": 5637} {"train_loss": -26.88330078125, "global_step": 467942, "epoch": 5637} {"train_loss": -27.305585861206055, "global_step": 467943, "epoch": 5637} {"train_loss": -27.165603637695312, "global_step": 467944, "epoch": 5637} {"train_loss": -26.904035568237305, "global_step": 467945, "epoch": 5637} {"train_loss": -26.873538970947266, "global_step": 467946, "epoch": 5637} {"train_loss": -27.20358657836914, "global_step": 467947, "epoch": 5637} {"train_loss": -26.794775009155273, "global_step": 467948, "epoch": 5637} {"train_loss": -27.46510887145996, "global_step": 467949, "epoch": 5637} {"train_loss": -26.804636001586914, "global_step": 467950, "epoch": 5637} {"train_loss": -26.903045654296875, "global_step": 467951, "epoch": 5637} {"train_loss": -27.397735595703125, "global_step": 467952, "epoch": 5637} {"train_loss": -27.020466080631117, "global_step": 467953, "epoch": 5637, "val_loss": 6737316.0} {"train_loss": -26.877470016479492, "global_step": 467954, "epoch": 5638} {"train_loss": -25.86530876159668, "global_step": 467955, "epoch": 5638} {"train_loss": -26.194232940673828, "global_step": 467956, "epoch": 5638} {"train_loss": -26.753570556640625, "global_step": 467957, "epoch": 5638} {"train_loss": -26.52504539489746, "global_step": 467958, "epoch": 5638} {"train_loss": -26.541425704956055, "global_step": 467959, "epoch": 5638} {"train_loss": -26.428852081298828, "global_step": 467960, "epoch": 5638} {"train_loss": -26.785322189331055, "global_step": 467961, "epoch": 5638} {"train_loss": -26.5828857421875, "global_step": 467962, "epoch": 5638} {"train_loss": -27.20745277404785, "global_step": 467963, "epoch": 5638} {"train_loss": -26.637113571166992, "global_step": 467964, "epoch": 5638} {"train_loss": -26.694442749023438, "global_step": 467965, "epoch": 5638} {"train_loss": -26.548480987548828, "global_step": 467966, "epoch": 5638} {"train_loss": -26.862409591674805, "global_step": 467967, "epoch": 5638} {"train_loss": -27.164777755737305, "global_step": 467968, "epoch": 5638} {"train_loss": -26.87992286682129, "global_step": 467969, "epoch": 5638} {"train_loss": -26.641876220703125, "global_step": 467970, "epoch": 5638} {"train_loss": -27.09775733947754, "global_step": 467971, "epoch": 5638} {"train_loss": -26.85821533203125, "global_step": 467972, "epoch": 5638} {"train_loss": -26.738611221313477, "global_step": 467973, "epoch": 5638} {"train_loss": -26.538427352905273, "global_step": 467974, "epoch": 5638} {"train_loss": -26.759435653686523, "global_step": 467975, "epoch": 5638} {"train_loss": -26.47939109802246, "global_step": 467976, "epoch": 5638} {"train_loss": -26.358850479125977, "global_step": 467977, "epoch": 5638} {"train_loss": -26.750839233398438, "global_step": 467978, "epoch": 5638} {"train_loss": -26.4345645904541, "global_step": 467979, "epoch": 5638} {"train_loss": -26.93698501586914, "global_step": 467980, "epoch": 5638} {"train_loss": -26.998193740844727, "global_step": 467981, "epoch": 5638} {"train_loss": -26.98540687561035, "global_step": 467982, "epoch": 5638} {"train_loss": -26.99012565612793, "global_step": 467983, "epoch": 5638} {"train_loss": -26.87080192565918, "global_step": 467984, "epoch": 5638} {"train_loss": -27.2200927734375, "global_step": 467985, "epoch": 5638} {"train_loss": -26.94060707092285, "global_step": 467986, "epoch": 5638} {"train_loss": -26.812429428100586, "global_step": 467987, "epoch": 5638} {"train_loss": -26.949228286743164, "global_step": 467988, "epoch": 5638} {"train_loss": -26.819351196289062, "global_step": 467989, "epoch": 5638} {"train_loss": -27.172149658203125, "global_step": 467990, "epoch": 5638} {"train_loss": -27.430774688720703, "global_step": 467991, "epoch": 5638} {"train_loss": -27.39509391784668, "global_step": 467992, "epoch": 5638} {"train_loss": -27.166662216186523, "global_step": 467993, "epoch": 5638} {"train_loss": -26.904632568359375, "global_step": 467994, "epoch": 5638} {"train_loss": -27.340320587158203, "global_step": 467995, "epoch": 5638} {"train_loss": -27.117685317993164, "global_step": 467996, "epoch": 5638} {"train_loss": -27.246137619018555, "global_step": 467997, "epoch": 5638} {"train_loss": -27.435285568237305, "global_step": 467998, "epoch": 5638} {"train_loss": -27.37871742248535, "global_step": 467999, "epoch": 5638} {"train_loss": -27.1589298248291, "global_step": 468000, "epoch": 5638} {"train_loss": -27.45310401916504, "global_step": 468001, "epoch": 5638} {"train_loss": -27.0489444732666, "global_step": 468002, "epoch": 5638} {"train_loss": -27.682098388671875, "global_step": 468003, "epoch": 5638} {"train_loss": -26.910247802734375, "global_step": 468004, "epoch": 5638} {"train_loss": -27.005273818969727, "global_step": 468005, "epoch": 5638} {"train_loss": -27.051645278930664, "global_step": 468006, "epoch": 5638} {"train_loss": -27.187475204467773, "global_step": 468007, "epoch": 5638} {"train_loss": -27.346282958984375, "global_step": 468008, "epoch": 5638} {"train_loss": -27.425397872924805, "global_step": 468009, "epoch": 5638} {"train_loss": -27.307605743408203, "global_step": 468010, "epoch": 5638} {"train_loss": -26.99468994140625, "global_step": 468011, "epoch": 5638} {"train_loss": -27.310077667236328, "global_step": 468012, "epoch": 5638} {"train_loss": -27.360578536987305, "global_step": 468013, "epoch": 5638} {"train_loss": -27.2978458404541, "global_step": 468014, "epoch": 5638} {"train_loss": -27.122114181518555, "global_step": 468015, "epoch": 5638} {"train_loss": -27.561933517456055, "global_step": 468016, "epoch": 5638} {"train_loss": -27.36033058166504, "global_step": 468017, "epoch": 5638} {"train_loss": -27.55781364440918, "global_step": 468018, "epoch": 5638} {"train_loss": -27.357797622680664, "global_step": 468019, "epoch": 5638} {"train_loss": -27.02728843688965, "global_step": 468020, "epoch": 5638} {"train_loss": -27.200469970703125, "global_step": 468021, "epoch": 5638} {"train_loss": -27.31357765197754, "global_step": 468022, "epoch": 5638} {"train_loss": -27.099790573120117, "global_step": 468023, "epoch": 5638} {"train_loss": -27.568359375, "global_step": 468024, "epoch": 5638} {"train_loss": -27.076690673828125, "global_step": 468025, "epoch": 5638} {"train_loss": -26.8405704498291, "global_step": 468026, "epoch": 5638} {"train_loss": -26.946090698242188, "global_step": 468027, "epoch": 5638} {"train_loss": -27.15989112854004, "global_step": 468028, "epoch": 5638} {"train_loss": -26.767805099487305, "global_step": 468029, "epoch": 5638} {"train_loss": -27.147748947143555, "global_step": 468030, "epoch": 5638} {"train_loss": -26.727869033813477, "global_step": 468031, "epoch": 5638} {"train_loss": -27.040922164916992, "global_step": 468032, "epoch": 5638} {"train_loss": -27.173603057861328, "global_step": 468033, "epoch": 5638} {"train_loss": -27.513051986694336, "global_step": 468034, "epoch": 5638} {"train_loss": -27.4542236328125, "global_step": 468035, "epoch": 5638} {"train_loss": -27.010186321764106, "global_step": 468036, "epoch": 5638, "val_loss": 6688393.0} {"train_loss": -26.840946197509766, "global_step": 468037, "epoch": 5639} {"train_loss": -26.4689884185791, "global_step": 468038, "epoch": 5639} {"train_loss": -26.64698600769043, "global_step": 468039, "epoch": 5639} {"train_loss": -26.703710556030273, "global_step": 468040, "epoch": 5639} {"train_loss": -26.738248825073242, "global_step": 468041, "epoch": 5639} {"train_loss": -26.909460067749023, "global_step": 468042, "epoch": 5639} {"train_loss": -26.759641647338867, "global_step": 468043, "epoch": 5639} {"train_loss": -26.437793731689453, "global_step": 468044, "epoch": 5639} {"train_loss": -27.174646377563477, "global_step": 468045, "epoch": 5639} {"train_loss": -27.0502986907959, "global_step": 468046, "epoch": 5639} {"train_loss": -26.6993465423584, "global_step": 468047, "epoch": 5639} {"train_loss": -26.778491973876953, "global_step": 468048, "epoch": 5639} {"train_loss": -26.926666259765625, "global_step": 468049, "epoch": 5639} {"train_loss": -26.768939971923828, "global_step": 468050, "epoch": 5639} {"train_loss": -27.11231803894043, "global_step": 468051, "epoch": 5639} {"train_loss": -27.128894805908203, "global_step": 468052, "epoch": 5639} {"train_loss": -27.05415153503418, "global_step": 468053, "epoch": 5639} {"train_loss": -27.127792358398438, "global_step": 468054, "epoch": 5639} {"train_loss": -27.176239013671875, "global_step": 468055, "epoch": 5639} {"train_loss": -27.07903480529785, "global_step": 468056, "epoch": 5639} {"train_loss": -26.965993881225586, "global_step": 468057, "epoch": 5639} {"train_loss": -27.176929473876953, "global_step": 468058, "epoch": 5639} {"train_loss": -26.947147369384766, "global_step": 468059, "epoch": 5639} {"train_loss": -27.125675201416016, "global_step": 468060, "epoch": 5639} {"train_loss": -27.082550048828125, "global_step": 468061, "epoch": 5639} {"train_loss": -27.20462417602539, "global_step": 468062, "epoch": 5639} {"train_loss": -27.289962768554688, "global_step": 468063, "epoch": 5639} {"train_loss": -27.266876220703125, "global_step": 468064, "epoch": 5639} {"train_loss": -27.444334030151367, "global_step": 468065, "epoch": 5639} {"train_loss": -27.4033203125, "global_step": 468066, "epoch": 5639} {"train_loss": -26.991186141967773, "global_step": 468067, "epoch": 5639} {"train_loss": -27.214242935180664, "global_step": 468068, "epoch": 5639} {"train_loss": -27.322345733642578, "global_step": 468069, "epoch": 5639} {"train_loss": -27.435718536376953, "global_step": 468070, "epoch": 5639} {"train_loss": -27.164331436157227, "global_step": 468071, "epoch": 5639} {"train_loss": -27.174285888671875, "global_step": 468072, "epoch": 5639} {"train_loss": -27.47412109375, "global_step": 468073, "epoch": 5639} {"train_loss": -27.46194839477539, "global_step": 468074, "epoch": 5639} {"train_loss": -27.08741569519043, "global_step": 468075, "epoch": 5639} {"train_loss": -27.64674186706543, "global_step": 468076, "epoch": 5639} {"train_loss": -27.305959701538086, "global_step": 468077, "epoch": 5639} {"train_loss": -27.056751251220703, "global_step": 468078, "epoch": 5639} {"train_loss": -27.364349365234375, "global_step": 468079, "epoch": 5639} {"train_loss": -27.37900161743164, "global_step": 468080, "epoch": 5639} {"train_loss": -27.615087509155273, "global_step": 468081, "epoch": 5639} {"train_loss": -27.157739639282227, "global_step": 468082, "epoch": 5639} {"train_loss": -27.2080078125, "global_step": 468083, "epoch": 5639} {"train_loss": -27.314794540405273, "global_step": 468084, "epoch": 5639} {"train_loss": -27.11309242248535, "global_step": 468085, "epoch": 5639} {"train_loss": -27.57199478149414, "global_step": 468086, "epoch": 5639} {"train_loss": -27.404321670532227, "global_step": 468087, "epoch": 5639} {"train_loss": -27.387632369995117, "global_step": 468088, "epoch": 5639} {"train_loss": -27.112085342407227, "global_step": 468089, "epoch": 5639} {"train_loss": -27.616113662719727, "global_step": 468090, "epoch": 5639} {"train_loss": -27.157068252563477, "global_step": 468091, "epoch": 5639} {"train_loss": -27.042617797851562, "global_step": 468092, "epoch": 5639} {"train_loss": -26.6850528717041, "global_step": 468093, "epoch": 5639} {"train_loss": -27.030263900756836, "global_step": 468094, "epoch": 5639} {"train_loss": -26.602130889892578, "global_step": 468095, "epoch": 5639} {"train_loss": -26.931961059570312, "global_step": 468096, "epoch": 5639} {"train_loss": -27.02455711364746, "global_step": 468097, "epoch": 5639} {"train_loss": -27.457441329956055, "global_step": 468098, "epoch": 5639} {"train_loss": -26.924732208251953, "global_step": 468099, "epoch": 5639} {"train_loss": -27.209272384643555, "global_step": 468100, "epoch": 5639} {"train_loss": -27.246423721313477, "global_step": 468101, "epoch": 5639} {"train_loss": -27.21229362487793, "global_step": 468102, "epoch": 5639} {"train_loss": -27.568145751953125, "global_step": 468103, "epoch": 5639} {"train_loss": -27.007062911987305, "global_step": 468104, "epoch": 5639} {"train_loss": -27.01600456237793, "global_step": 468105, "epoch": 5639} {"train_loss": -27.2164306640625, "global_step": 468106, "epoch": 5639} {"train_loss": -27.159448623657227, "global_step": 468107, "epoch": 5639} {"train_loss": -27.074010848999023, "global_step": 468108, "epoch": 5639} {"train_loss": -26.649255752563477, "global_step": 468109, "epoch": 5639} {"train_loss": -27.088043212890625, "global_step": 468110, "epoch": 5639} {"train_loss": -27.2792911529541, "global_step": 468111, "epoch": 5639} {"train_loss": -27.115522384643555, "global_step": 468112, "epoch": 5639} {"train_loss": -27.31772232055664, "global_step": 468113, "epoch": 5639} {"train_loss": -27.55573081970215, "global_step": 468114, "epoch": 5639} {"train_loss": -27.632535934448242, "global_step": 468115, "epoch": 5639} {"train_loss": -27.367889404296875, "global_step": 468116, "epoch": 5639} {"train_loss": -27.283172607421875, "global_step": 468117, "epoch": 5639} {"train_loss": -27.44129753112793, "global_step": 468118, "epoch": 5639} {"train_loss": -27.150054380118128, "global_step": 468119, "epoch": 5639, "val_loss": 6605085.5} {"train_loss": -26.410043716430664, "global_step": 468120, "epoch": 5640} {"train_loss": -25.330272674560547, "global_step": 468121, "epoch": 5640} {"train_loss": -25.87477684020996, "global_step": 468122, "epoch": 5640} {"train_loss": -26.262451171875, "global_step": 468123, "epoch": 5640} {"train_loss": -26.553327560424805, "global_step": 468124, "epoch": 5640} {"train_loss": -25.258230209350586, "global_step": 468125, "epoch": 5640} {"train_loss": -25.222639083862305, "global_step": 468126, "epoch": 5640} {"train_loss": -26.187768936157227, "global_step": 468127, "epoch": 5640} {"train_loss": -25.73041343688965, "global_step": 468128, "epoch": 5640} {"train_loss": -26.784393310546875, "global_step": 468129, "epoch": 5640} {"train_loss": -26.0478458404541, "global_step": 468130, "epoch": 5640} {"train_loss": -26.956302642822266, "global_step": 468131, "epoch": 5640} {"train_loss": -25.999074935913086, "global_step": 468132, "epoch": 5640} {"train_loss": -26.0816593170166, "global_step": 468133, "epoch": 5640} {"train_loss": -26.712976455688477, "global_step": 468134, "epoch": 5640} {"train_loss": -26.422576904296875, "global_step": 468135, "epoch": 5640} {"train_loss": -26.134485244750977, "global_step": 468136, "epoch": 5640} {"train_loss": -26.690824508666992, "global_step": 468137, "epoch": 5640} {"train_loss": -26.55789566040039, "global_step": 468138, "epoch": 5640} {"train_loss": -26.53534507751465, "global_step": 468139, "epoch": 5640} {"train_loss": -26.8454532623291, "global_step": 468140, "epoch": 5640} {"train_loss": -26.666446685791016, "global_step": 468141, "epoch": 5640} {"train_loss": -26.864858627319336, "global_step": 468142, "epoch": 5640} {"train_loss": -26.63911247253418, "global_step": 468143, "epoch": 5640} {"train_loss": -26.83294105529785, "global_step": 468144, "epoch": 5640} {"train_loss": -26.742345809936523, "global_step": 468145, "epoch": 5640} {"train_loss": -26.82192039489746, "global_step": 468146, "epoch": 5640} {"train_loss": -26.954294204711914, "global_step": 468147, "epoch": 5640} {"train_loss": -26.656421661376953, "global_step": 468148, "epoch": 5640} {"train_loss": -26.950428009033203, "global_step": 468149, "epoch": 5640} {"train_loss": -26.9183292388916, "global_step": 468150, "epoch": 5640} {"train_loss": -26.722808837890625, "global_step": 468151, "epoch": 5640} {"train_loss": -27.179168701171875, "global_step": 468152, "epoch": 5640} {"train_loss": -27.698484420776367, "global_step": 468153, "epoch": 5640} {"train_loss": -27.05402946472168, "global_step": 468154, "epoch": 5640} {"train_loss": -26.883386611938477, "global_step": 468155, "epoch": 5640} {"train_loss": -27.02362060546875, "global_step": 468156, "epoch": 5640} {"train_loss": -27.093780517578125, "global_step": 468157, "epoch": 5640} {"train_loss": -27.293201446533203, "global_step": 468158, "epoch": 5640} {"train_loss": -27.124555587768555, "global_step": 468159, "epoch": 5640} {"train_loss": -27.35321044921875, "global_step": 468160, "epoch": 5640} {"train_loss": -27.073774337768555, "global_step": 468161, "epoch": 5640} {"train_loss": -27.30157470703125, "global_step": 468162, "epoch": 5640} {"train_loss": -26.963464736938477, "global_step": 468163, "epoch": 5640} {"train_loss": -27.40186882019043, "global_step": 468164, "epoch": 5640} {"train_loss": -27.39423179626465, "global_step": 468165, "epoch": 5640} {"train_loss": -27.092294692993164, "global_step": 468166, "epoch": 5640} {"train_loss": -27.260761260986328, "global_step": 468167, "epoch": 5640} {"train_loss": -27.113712310791016, "global_step": 468168, "epoch": 5640} {"train_loss": -27.362838745117188, "global_step": 468169, "epoch": 5640} {"train_loss": -26.871780395507812, "global_step": 468170, "epoch": 5640} {"train_loss": -27.502634048461914, "global_step": 468171, "epoch": 5640} {"train_loss": -27.54324722290039, "global_step": 468172, "epoch": 5640} {"train_loss": -27.064340591430664, "global_step": 468173, "epoch": 5640} {"train_loss": -27.31841468811035, "global_step": 468174, "epoch": 5640} {"train_loss": -27.515583038330078, "global_step": 468175, "epoch": 5640} {"train_loss": -27.00235366821289, "global_step": 468176, "epoch": 5640} {"train_loss": -27.283918380737305, "global_step": 468177, "epoch": 5640} {"train_loss": -27.199750900268555, "global_step": 468178, "epoch": 5640} {"train_loss": -27.433725357055664, "global_step": 468179, "epoch": 5640} {"train_loss": -27.297378540039062, "global_step": 468180, "epoch": 5640} {"train_loss": -27.22247314453125, "global_step": 468181, "epoch": 5640} {"train_loss": -27.42047691345215, "global_step": 468182, "epoch": 5640} {"train_loss": -27.185611724853516, "global_step": 468183, "epoch": 5640} {"train_loss": -27.228485107421875, "global_step": 468184, "epoch": 5640} {"train_loss": -27.33916664123535, "global_step": 468185, "epoch": 5640} {"train_loss": -27.1391658782959, "global_step": 468186, "epoch": 5640} {"train_loss": -27.12482261657715, "global_step": 468187, "epoch": 5640} {"train_loss": -26.905414581298828, "global_step": 468188, "epoch": 5640} {"train_loss": -27.284500122070312, "global_step": 468189, "epoch": 5640} {"train_loss": -27.187185287475586, "global_step": 468190, "epoch": 5640} {"train_loss": -27.30317497253418, "global_step": 468191, "epoch": 5640} {"train_loss": -27.207351684570312, "global_step": 468192, "epoch": 5640} {"train_loss": -27.58732032775879, "global_step": 468193, "epoch": 5640} {"train_loss": -27.4818172454834, "global_step": 468194, "epoch": 5640} {"train_loss": -27.097457885742188, "global_step": 468195, "epoch": 5640} {"train_loss": -26.68036460876465, "global_step": 468196, "epoch": 5640} {"train_loss": -27.1337947845459, "global_step": 468197, "epoch": 5640} {"train_loss": -27.609375, "global_step": 468198, "epoch": 5640} {"train_loss": -27.114261627197266, "global_step": 468199, "epoch": 5640} {"train_loss": -27.40415382385254, "global_step": 468200, "epoch": 5640} {"train_loss": -27.733152389526367, "global_step": 468201, "epoch": 5640} {"train_loss": -26.928229757102137, "global_step": 468202, "epoch": 5640, "val_loss": 6695343.5} {"train_loss": -26.049392700195312, "global_step": 468203, "epoch": 5641} {"train_loss": -25.661727905273438, "global_step": 468204, "epoch": 5641} {"train_loss": -26.71573829650879, "global_step": 468205, "epoch": 5641} {"train_loss": -26.2387638092041, "global_step": 468206, "epoch": 5641} {"train_loss": -26.489416122436523, "global_step": 468207, "epoch": 5641} {"train_loss": -26.219318389892578, "global_step": 468208, "epoch": 5641} {"train_loss": -26.6878662109375, "global_step": 468209, "epoch": 5641} {"train_loss": -26.2999267578125, "global_step": 468210, "epoch": 5641} {"train_loss": -26.683786392211914, "global_step": 468211, "epoch": 5641} {"train_loss": -26.637481689453125, "global_step": 468212, "epoch": 5641} {"train_loss": -27.059844970703125, "global_step": 468213, "epoch": 5641} {"train_loss": -26.421003341674805, "global_step": 468214, "epoch": 5641} {"train_loss": -26.664289474487305, "global_step": 468215, "epoch": 5641} {"train_loss": -26.435367584228516, "global_step": 468216, "epoch": 5641} {"train_loss": -26.532880783081055, "global_step": 468217, "epoch": 5641} {"train_loss": -26.786062240600586, "global_step": 468218, "epoch": 5641} {"train_loss": -26.806400299072266, "global_step": 468219, "epoch": 5641} {"train_loss": -26.784626007080078, "global_step": 468220, "epoch": 5641} {"train_loss": -26.608142852783203, "global_step": 468221, "epoch": 5641} {"train_loss": -26.96851921081543, "global_step": 468222, "epoch": 5641} {"train_loss": -26.706830978393555, "global_step": 468223, "epoch": 5641} {"train_loss": -26.722660064697266, "global_step": 468224, "epoch": 5641} {"train_loss": -26.986448287963867, "global_step": 468225, "epoch": 5641} {"train_loss": -26.829833984375, "global_step": 468226, "epoch": 5641} {"train_loss": -26.854557037353516, "global_step": 468227, "epoch": 5641} {"train_loss": -26.779447555541992, "global_step": 468228, "epoch": 5641} {"train_loss": -27.176366806030273, "global_step": 468229, "epoch": 5641} {"train_loss": -26.898664474487305, "global_step": 468230, "epoch": 5641} {"train_loss": -27.184213638305664, "global_step": 468231, "epoch": 5641} {"train_loss": -27.08144187927246, "global_step": 468232, "epoch": 5641} {"train_loss": -27.057294845581055, "global_step": 468233, "epoch": 5641} {"train_loss": -27.178430557250977, "global_step": 468234, "epoch": 5641} {"train_loss": -27.36419105529785, "global_step": 468235, "epoch": 5641} {"train_loss": -27.085988998413086, "global_step": 468236, "epoch": 5641} {"train_loss": -27.13007926940918, "global_step": 468237, "epoch": 5641} {"train_loss": -27.207263946533203, "global_step": 468238, "epoch": 5641} {"train_loss": -27.09987449645996, "global_step": 468239, "epoch": 5641} {"train_loss": -27.477643966674805, "global_step": 468240, "epoch": 5641} {"train_loss": -27.086450576782227, "global_step": 468241, "epoch": 5641} {"train_loss": -26.855804443359375, "global_step": 468242, "epoch": 5641} {"train_loss": -27.21640968322754, "global_step": 468243, "epoch": 5641} {"train_loss": -27.494184494018555, "global_step": 468244, "epoch": 5641} {"train_loss": -27.072256088256836, "global_step": 468245, "epoch": 5641} {"train_loss": -27.620315551757812, "global_step": 468246, "epoch": 5641} {"train_loss": -27.38775634765625, "global_step": 468247, "epoch": 5641} {"train_loss": -27.425405502319336, "global_step": 468248, "epoch": 5641} {"train_loss": -27.4019718170166, "global_step": 468249, "epoch": 5641} {"train_loss": -27.290374755859375, "global_step": 468250, "epoch": 5641} {"train_loss": -27.543792724609375, "global_step": 468251, "epoch": 5641} {"train_loss": -27.526304244995117, "global_step": 468252, "epoch": 5641} {"train_loss": -27.449472427368164, "global_step": 468253, "epoch": 5641} {"train_loss": -27.293066024780273, "global_step": 468254, "epoch": 5641} {"train_loss": -27.187509536743164, "global_step": 468255, "epoch": 5641} {"train_loss": -27.388168334960938, "global_step": 468256, "epoch": 5641} {"train_loss": -27.109342575073242, "global_step": 468257, "epoch": 5641} {"train_loss": -27.387144088745117, "global_step": 468258, "epoch": 5641} {"train_loss": -27.42037010192871, "global_step": 468259, "epoch": 5641} {"train_loss": -27.685012817382812, "global_step": 468260, "epoch": 5641} {"train_loss": -27.233509063720703, "global_step": 468261, "epoch": 5641} {"train_loss": -26.87346839904785, "global_step": 468262, "epoch": 5641} {"train_loss": -27.074176788330078, "global_step": 468263, "epoch": 5641} {"train_loss": -27.397138595581055, "global_step": 468264, "epoch": 5641} {"train_loss": -26.970111846923828, "global_step": 468265, "epoch": 5641} {"train_loss": -26.876129150390625, "global_step": 468266, "epoch": 5641} {"train_loss": -27.126056671142578, "global_step": 468267, "epoch": 5641} {"train_loss": -27.46979331970215, "global_step": 468268, "epoch": 5641} {"train_loss": -27.880292892456055, "global_step": 468269, "epoch": 5641} {"train_loss": -27.404733657836914, "global_step": 468270, "epoch": 5641} {"train_loss": -27.364187240600586, "global_step": 468271, "epoch": 5641} {"train_loss": -27.053274154663086, "global_step": 468272, "epoch": 5641} {"train_loss": -27.726154327392578, "global_step": 468273, "epoch": 5641} {"train_loss": -27.358606338500977, "global_step": 468274, "epoch": 5641} {"train_loss": -27.68851661682129, "global_step": 468275, "epoch": 5641} {"train_loss": -27.341480255126953, "global_step": 468276, "epoch": 5641} {"train_loss": -27.240060806274414, "global_step": 468277, "epoch": 5641} {"train_loss": -27.387958526611328, "global_step": 468278, "epoch": 5641} {"train_loss": -27.377944946289062, "global_step": 468279, "epoch": 5641} {"train_loss": -27.36629295349121, "global_step": 468280, "epoch": 5641} {"train_loss": -27.431079864501953, "global_step": 468281, "epoch": 5641} {"train_loss": -27.45941162109375, "global_step": 468282, "epoch": 5641} {"train_loss": -27.421707153320312, "global_step": 468283, "epoch": 5641} {"train_loss": -27.447473526000977, "global_step": 468284, "epoch": 5641} {"train_loss": -27.073552418904132, "global_step": 468285, "epoch": 5641, "val_loss": 6570048.0} {"train_loss": -26.456985473632812, "global_step": 468286, "epoch": 5642} {"train_loss": -25.965164184570312, "global_step": 468287, "epoch": 5642} {"train_loss": -25.988306045532227, "global_step": 468288, "epoch": 5642} {"train_loss": -26.80049705505371, "global_step": 468289, "epoch": 5642} {"train_loss": -26.551843643188477, "global_step": 468290, "epoch": 5642} {"train_loss": -26.787534713745117, "global_step": 468291, "epoch": 5642} {"train_loss": -26.63693618774414, "global_step": 468292, "epoch": 5642} {"train_loss": -26.493871688842773, "global_step": 468293, "epoch": 5642} {"train_loss": -26.842864990234375, "global_step": 468294, "epoch": 5642} {"train_loss": -26.944522857666016, "global_step": 468295, "epoch": 5642} {"train_loss": -27.08448600769043, "global_step": 468296, "epoch": 5642} {"train_loss": -26.587451934814453, "global_step": 468297, "epoch": 5642} {"train_loss": -27.273059844970703, "global_step": 468298, "epoch": 5642} {"train_loss": -26.579954147338867, "global_step": 468299, "epoch": 5642} {"train_loss": -27.122333526611328, "global_step": 468300, "epoch": 5642} {"train_loss": -26.81546974182129, "global_step": 468301, "epoch": 5642} {"train_loss": -26.963171005249023, "global_step": 468302, "epoch": 5642} {"train_loss": -26.84307289123535, "global_step": 468303, "epoch": 5642} {"train_loss": -27.18757438659668, "global_step": 468304, "epoch": 5642} {"train_loss": -27.3045597076416, "global_step": 468305, "epoch": 5642} {"train_loss": -26.97084617614746, "global_step": 468306, "epoch": 5642} {"train_loss": -27.005048751831055, "global_step": 468307, "epoch": 5642} {"train_loss": -26.982955932617188, "global_step": 468308, "epoch": 5642} {"train_loss": -27.20778465270996, "global_step": 468309, "epoch": 5642} {"train_loss": -27.616849899291992, "global_step": 468310, "epoch": 5642} {"train_loss": -27.0319881439209, "global_step": 468311, "epoch": 5642} {"train_loss": -27.08916664123535, "global_step": 468312, "epoch": 5642} {"train_loss": -27.00048828125, "global_step": 468313, "epoch": 5642} {"train_loss": -27.161340713500977, "global_step": 468314, "epoch": 5642} {"train_loss": -27.118154525756836, "global_step": 468315, "epoch": 5642} {"train_loss": -27.587400436401367, "global_step": 468316, "epoch": 5642} {"train_loss": -27.01211929321289, "global_step": 468317, "epoch": 5642} {"train_loss": -27.142087936401367, "global_step": 468318, "epoch": 5642} {"train_loss": -27.058761596679688, "global_step": 468319, "epoch": 5642} {"train_loss": -26.970056533813477, "global_step": 468320, "epoch": 5642} {"train_loss": -27.271717071533203, "global_step": 468321, "epoch": 5642} {"train_loss": -27.35110855102539, "global_step": 468322, "epoch": 5642} {"train_loss": -27.50360679626465, "global_step": 468323, "epoch": 5642} {"train_loss": -27.184864044189453, "global_step": 468324, "epoch": 5642} {"train_loss": -27.50583267211914, "global_step": 468325, "epoch": 5642} {"train_loss": -27.188627243041992, "global_step": 468326, "epoch": 5642} {"train_loss": -27.45989990234375, "global_step": 468327, "epoch": 5642} {"train_loss": -26.970218658447266, "global_step": 468328, "epoch": 5642} {"train_loss": -27.5587215423584, "global_step": 468329, "epoch": 5642} {"train_loss": -27.744131088256836, "global_step": 468330, "epoch": 5642} {"train_loss": -27.062885284423828, "global_step": 468331, "epoch": 5642} {"train_loss": -27.52827262878418, "global_step": 468332, "epoch": 5642} {"train_loss": -26.659042358398438, "global_step": 468333, "epoch": 5642} {"train_loss": -25.75531005859375, "global_step": 468334, "epoch": 5642} {"train_loss": -25.11256980895996, "global_step": 468335, "epoch": 5642} {"train_loss": -26.359567642211914, "global_step": 468336, "epoch": 5642} {"train_loss": -26.88104820251465, "global_step": 468337, "epoch": 5642} {"train_loss": -26.61478614807129, "global_step": 468338, "epoch": 5642} {"train_loss": -27.19260597229004, "global_step": 468339, "epoch": 5642} {"train_loss": -26.569766998291016, "global_step": 468340, "epoch": 5642} {"train_loss": -27.119726181030273, "global_step": 468341, "epoch": 5642} {"train_loss": -26.89862632751465, "global_step": 468342, "epoch": 5642} {"train_loss": -27.147668838500977, "global_step": 468343, "epoch": 5642} {"train_loss": -27.418561935424805, "global_step": 468344, "epoch": 5642} {"train_loss": -26.817462921142578, "global_step": 468345, "epoch": 5642} {"train_loss": -27.3292179107666, "global_step": 468346, "epoch": 5642} {"train_loss": -26.901477813720703, "global_step": 468347, "epoch": 5642} {"train_loss": -26.988779067993164, "global_step": 468348, "epoch": 5642} {"train_loss": -26.821002960205078, "global_step": 468349, "epoch": 5642} {"train_loss": -27.186004638671875, "global_step": 468350, "epoch": 5642} {"train_loss": -27.24274253845215, "global_step": 468351, "epoch": 5642} {"train_loss": -26.976842880249023, "global_step": 468352, "epoch": 5642} {"train_loss": -27.10249900817871, "global_step": 468353, "epoch": 5642} {"train_loss": -27.16400718688965, "global_step": 468354, "epoch": 5642} {"train_loss": -26.857797622680664, "global_step": 468355, "epoch": 5642} {"train_loss": -27.1009464263916, "global_step": 468356, "epoch": 5642} {"train_loss": -27.622602462768555, "global_step": 468357, "epoch": 5642} {"train_loss": -27.031967163085938, "global_step": 468358, "epoch": 5642} {"train_loss": -27.461538314819336, "global_step": 468359, "epoch": 5642} {"train_loss": -27.512439727783203, "global_step": 468360, "epoch": 5642} {"train_loss": -27.204797744750977, "global_step": 468361, "epoch": 5642} {"train_loss": -27.269922256469727, "global_step": 468362, "epoch": 5642} {"train_loss": -27.119232177734375, "global_step": 468363, "epoch": 5642} {"train_loss": -27.122451782226562, "global_step": 468364, "epoch": 5642} {"train_loss": -26.77094841003418, "global_step": 468365, "epoch": 5642} {"train_loss": -26.83184814453125, "global_step": 468366, "epoch": 5642} {"train_loss": -26.681760787963867, "global_step": 468367, "epoch": 5642} {"train_loss": -26.969069768147296, "global_step": 468368, "epoch": 5642, "val_loss": 6699493.0} {"train_loss": -26.556875228881836, "global_step": 468369, "epoch": 5643} {"train_loss": -25.90431785583496, "global_step": 468370, "epoch": 5643} {"train_loss": -26.705890655517578, "global_step": 468371, "epoch": 5643} {"train_loss": -26.42987060546875, "global_step": 468372, "epoch": 5643} {"train_loss": -26.40757179260254, "global_step": 468373, "epoch": 5643} {"train_loss": -25.9876708984375, "global_step": 468374, "epoch": 5643} {"train_loss": -25.42869758605957, "global_step": 468375, "epoch": 5643} {"train_loss": -26.63533592224121, "global_step": 468376, "epoch": 5643} {"train_loss": -26.5403995513916, "global_step": 468377, "epoch": 5643} {"train_loss": -26.20541763305664, "global_step": 468378, "epoch": 5643} {"train_loss": -26.60511589050293, "global_step": 468379, "epoch": 5643} {"train_loss": -26.334091186523438, "global_step": 468380, "epoch": 5643} {"train_loss": -26.455041885375977, "global_step": 468381, "epoch": 5643} {"train_loss": -26.60395622253418, "global_step": 468382, "epoch": 5643} {"train_loss": -26.553466796875, "global_step": 468383, "epoch": 5643} {"train_loss": -26.784698486328125, "global_step": 468384, "epoch": 5643} {"train_loss": -26.81086540222168, "global_step": 468385, "epoch": 5643} {"train_loss": -26.848154067993164, "global_step": 468386, "epoch": 5643} {"train_loss": -26.664899826049805, "global_step": 468387, "epoch": 5643} {"train_loss": -26.718076705932617, "global_step": 468388, "epoch": 5643} {"train_loss": -26.4594783782959, "global_step": 468389, "epoch": 5643} {"train_loss": -26.771778106689453, "global_step": 468390, "epoch": 5643} {"train_loss": -26.864477157592773, "global_step": 468391, "epoch": 5643} {"train_loss": -26.41702651977539, "global_step": 468392, "epoch": 5643} {"train_loss": -26.966161727905273, "global_step": 468393, "epoch": 5643} {"train_loss": -26.986419677734375, "global_step": 468394, "epoch": 5643} {"train_loss": -27.03350257873535, "global_step": 468395, "epoch": 5643} {"train_loss": -27.307056427001953, "global_step": 468396, "epoch": 5643} {"train_loss": -27.0134334564209, "global_step": 468397, "epoch": 5643} {"train_loss": -27.12965202331543, "global_step": 468398, "epoch": 5643} {"train_loss": -26.949094772338867, "global_step": 468399, "epoch": 5643} {"train_loss": -26.694440841674805, "global_step": 468400, "epoch": 5643} {"train_loss": -27.394895553588867, "global_step": 468401, "epoch": 5643} {"train_loss": -27.182886123657227, "global_step": 468402, "epoch": 5643} {"train_loss": -26.68642234802246, "global_step": 468403, "epoch": 5643} {"train_loss": -27.258569717407227, "global_step": 468404, "epoch": 5643} {"train_loss": -27.149246215820312, "global_step": 468405, "epoch": 5643} {"train_loss": -27.1114444732666, "global_step": 468406, "epoch": 5643} {"train_loss": -27.324039459228516, "global_step": 468407, "epoch": 5643} {"train_loss": -27.3929386138916, "global_step": 468408, "epoch": 5643} {"train_loss": -27.1061954498291, "global_step": 468409, "epoch": 5643} {"train_loss": -27.041685104370117, "global_step": 468410, "epoch": 5643} {"train_loss": -27.385122299194336, "global_step": 468411, "epoch": 5643} {"train_loss": -27.23799705505371, "global_step": 468412, "epoch": 5643} {"train_loss": -27.095609664916992, "global_step": 468413, "epoch": 5643} {"train_loss": -26.81618309020996, "global_step": 468414, "epoch": 5643} {"train_loss": -27.100341796875, "global_step": 468415, "epoch": 5643} {"train_loss": -26.820188522338867, "global_step": 468416, "epoch": 5643} {"train_loss": -27.245182037353516, "global_step": 468417, "epoch": 5643} {"train_loss": -27.195043563842773, "global_step": 468418, "epoch": 5643} {"train_loss": -27.386199951171875, "global_step": 468419, "epoch": 5643} {"train_loss": -27.278528213500977, "global_step": 468420, "epoch": 5643} {"train_loss": -27.29237174987793, "global_step": 468421, "epoch": 5643} {"train_loss": -27.4791259765625, "global_step": 468422, "epoch": 5643} {"train_loss": -27.233041763305664, "global_step": 468423, "epoch": 5643} {"train_loss": -27.208459854125977, "global_step": 468424, "epoch": 5643} {"train_loss": -27.317792892456055, "global_step": 468425, "epoch": 5643} {"train_loss": -27.35706901550293, "global_step": 468426, "epoch": 5643} {"train_loss": -27.637128829956055, "global_step": 468427, "epoch": 5643} {"train_loss": -27.17298698425293, "global_step": 468428, "epoch": 5643} {"train_loss": -27.18999671936035, "global_step": 468429, "epoch": 5643} {"train_loss": -27.330289840698242, "global_step": 468430, "epoch": 5643} {"train_loss": -27.177640914916992, "global_step": 468431, "epoch": 5643} {"train_loss": -27.212284088134766, "global_step": 468432, "epoch": 5643} {"train_loss": -27.38300895690918, "global_step": 468433, "epoch": 5643} {"train_loss": -27.29117202758789, "global_step": 468434, "epoch": 5643} {"train_loss": -27.326379776000977, "global_step": 468435, "epoch": 5643} {"train_loss": -27.438114166259766, "global_step": 468436, "epoch": 5643} {"train_loss": -27.200885772705078, "global_step": 468437, "epoch": 5643} {"train_loss": -27.404699325561523, "global_step": 468438, "epoch": 5643} {"train_loss": -27.31184196472168, "global_step": 468439, "epoch": 5643} {"train_loss": -27.45322608947754, "global_step": 468440, "epoch": 5643} {"train_loss": -27.4462947845459, "global_step": 468441, "epoch": 5643} {"train_loss": -27.29550552368164, "global_step": 468442, "epoch": 5643} {"train_loss": -27.345548629760742, "global_step": 468443, "epoch": 5643} {"train_loss": -27.549957275390625, "global_step": 468444, "epoch": 5643} {"train_loss": -26.922658920288086, "global_step": 468445, "epoch": 5643} {"train_loss": -27.508813858032227, "global_step": 468446, "epoch": 5643} {"train_loss": -27.588031768798828, "global_step": 468447, "epoch": 5643} {"train_loss": -27.54876136779785, "global_step": 468448, "epoch": 5643} {"train_loss": -27.35554313659668, "global_step": 468449, "epoch": 5643} {"train_loss": -27.33808708190918, "global_step": 468450, "epoch": 5643} {"train_loss": -27.03296397105757, "global_step": 468451, "epoch": 5643, "val_loss": 6589239.0} {"train_loss": -26.269712448120117, "global_step": 468452, "epoch": 5644} {"train_loss": -25.231033325195312, "global_step": 468453, "epoch": 5644} {"train_loss": -23.455677032470703, "global_step": 468454, "epoch": 5644} {"train_loss": -23.291547775268555, "global_step": 468455, "epoch": 5644} {"train_loss": -25.191686630249023, "global_step": 468456, "epoch": 5644} {"train_loss": -25.593303680419922, "global_step": 468457, "epoch": 5644} {"train_loss": -25.300901412963867, "global_step": 468458, "epoch": 5644} {"train_loss": -25.993452072143555, "global_step": 468459, "epoch": 5644} {"train_loss": -25.962848663330078, "global_step": 468460, "epoch": 5644} {"train_loss": -25.620389938354492, "global_step": 468461, "epoch": 5644} {"train_loss": -26.068159103393555, "global_step": 468462, "epoch": 5644} {"train_loss": -25.850936889648438, "global_step": 468463, "epoch": 5644} {"train_loss": -26.311079025268555, "global_step": 468464, "epoch": 5644} {"train_loss": -26.178674697875977, "global_step": 468465, "epoch": 5644} {"train_loss": -26.529653549194336, "global_step": 468466, "epoch": 5644} {"train_loss": -25.90732192993164, "global_step": 468467, "epoch": 5644} {"train_loss": -26.431623458862305, "global_step": 468468, "epoch": 5644} {"train_loss": -26.191648483276367, "global_step": 468469, "epoch": 5644} {"train_loss": -26.334524154663086, "global_step": 468470, "epoch": 5644} {"train_loss": -26.562164306640625, "global_step": 468471, "epoch": 5644} {"train_loss": -26.3750057220459, "global_step": 468472, "epoch": 5644} {"train_loss": -26.605859756469727, "global_step": 468473, "epoch": 5644} {"train_loss": -26.815689086914062, "global_step": 468474, "epoch": 5644} {"train_loss": -26.602079391479492, "global_step": 468475, "epoch": 5644} {"train_loss": -26.69394874572754, "global_step": 468476, "epoch": 5644} {"train_loss": -26.630756378173828, "global_step": 468477, "epoch": 5644} {"train_loss": -26.519678115844727, "global_step": 468478, "epoch": 5644} {"train_loss": -26.48388671875, "global_step": 468479, "epoch": 5644} {"train_loss": -26.608739852905273, "global_step": 468480, "epoch": 5644} {"train_loss": -26.8140926361084, "global_step": 468481, "epoch": 5644} {"train_loss": -26.85019874572754, "global_step": 468482, "epoch": 5644} {"train_loss": -27.069055557250977, "global_step": 468483, "epoch": 5644} {"train_loss": -26.593463897705078, "global_step": 468484, "epoch": 5644} {"train_loss": -27.097034454345703, "global_step": 468485, "epoch": 5644} {"train_loss": -26.63091468811035, "global_step": 468486, "epoch": 5644} {"train_loss": -26.93121337890625, "global_step": 468487, "epoch": 5644} {"train_loss": -27.04361915588379, "global_step": 468488, "epoch": 5644} {"train_loss": -27.112695693969727, "global_step": 468489, "epoch": 5644} {"train_loss": -27.192035675048828, "global_step": 468490, "epoch": 5644} {"train_loss": -26.947702407836914, "global_step": 468491, "epoch": 5644} {"train_loss": -27.15020179748535, "global_step": 468492, "epoch": 5644} {"train_loss": -27.157520294189453, "global_step": 468493, "epoch": 5644} {"train_loss": -26.923492431640625, "global_step": 468494, "epoch": 5644} {"train_loss": -27.149885177612305, "global_step": 468495, "epoch": 5644} {"train_loss": -27.1810302734375, "global_step": 468496, "epoch": 5644} {"train_loss": -27.199682235717773, "global_step": 468497, "epoch": 5644} {"train_loss": -27.477075576782227, "global_step": 468498, "epoch": 5644} {"train_loss": -27.369733810424805, "global_step": 468499, "epoch": 5644} {"train_loss": -27.009702682495117, "global_step": 468500, "epoch": 5644} {"train_loss": -27.36565589904785, "global_step": 468501, "epoch": 5644} {"train_loss": -27.32098388671875, "global_step": 468502, "epoch": 5644} {"train_loss": -27.36954116821289, "global_step": 468503, "epoch": 5644} {"train_loss": -27.628936767578125, "global_step": 468504, "epoch": 5644} {"train_loss": -27.33612060546875, "global_step": 468505, "epoch": 5644} {"train_loss": -27.486541748046875, "global_step": 468506, "epoch": 5644} {"train_loss": -27.711883544921875, "global_step": 468507, "epoch": 5644} {"train_loss": -27.301801681518555, "global_step": 468508, "epoch": 5644} {"train_loss": -27.316940307617188, "global_step": 468509, "epoch": 5644} {"train_loss": -27.473154067993164, "global_step": 468510, "epoch": 5644} {"train_loss": -27.5447998046875, "global_step": 468511, "epoch": 5644} {"train_loss": -27.14348793029785, "global_step": 468512, "epoch": 5644} {"train_loss": -27.07163429260254, "global_step": 468513, "epoch": 5644} {"train_loss": -27.205646514892578, "global_step": 468514, "epoch": 5644} {"train_loss": -27.33405876159668, "global_step": 468515, "epoch": 5644} {"train_loss": -27.290441513061523, "global_step": 468516, "epoch": 5644} {"train_loss": -27.21918296813965, "global_step": 468517, "epoch": 5644} {"train_loss": -26.834272384643555, "global_step": 468518, "epoch": 5644} {"train_loss": -26.93391990661621, "global_step": 468519, "epoch": 5644} {"train_loss": -27.09210777282715, "global_step": 468520, "epoch": 5644} {"train_loss": -26.96575355529785, "global_step": 468521, "epoch": 5644} {"train_loss": -27.58247184753418, "global_step": 468522, "epoch": 5644} {"train_loss": -27.04213523864746, "global_step": 468523, "epoch": 5644} {"train_loss": -26.87799644470215, "global_step": 468524, "epoch": 5644} {"train_loss": -27.564258575439453, "global_step": 468525, "epoch": 5644} {"train_loss": -27.196704864501953, "global_step": 468526, "epoch": 5644} {"train_loss": -27.241180419921875, "global_step": 468527, "epoch": 5644} {"train_loss": -27.561323165893555, "global_step": 468528, "epoch": 5644} {"train_loss": -27.789459228515625, "global_step": 468529, "epoch": 5644} {"train_loss": -27.229673385620117, "global_step": 468530, "epoch": 5644} {"train_loss": -27.16579246520996, "global_step": 468531, "epoch": 5644} {"train_loss": -27.159442901611328, "global_step": 468532, "epoch": 5644} {"train_loss": -27.316144943237305, "global_step": 468533, "epoch": 5644} {"train_loss": -26.771035504628376, "global_step": 468534, "epoch": 5644, "val_loss": 6667369.5} {"train_loss": -26.97201919555664, "global_step": 468535, "epoch": 5645} {"train_loss": -26.53310203552246, "global_step": 468536, "epoch": 5645} {"train_loss": -27.109766006469727, "global_step": 468537, "epoch": 5645} {"train_loss": -27.211172103881836, "global_step": 468538, "epoch": 5645} {"train_loss": -26.85532569885254, "global_step": 468539, "epoch": 5645} {"train_loss": -26.886005401611328, "global_step": 468540, "epoch": 5645} {"train_loss": -26.929580688476562, "global_step": 468541, "epoch": 5645} {"train_loss": -27.10474967956543, "global_step": 468542, "epoch": 5645} {"train_loss": -27.183395385742188, "global_step": 468543, "epoch": 5645} {"train_loss": -26.689847946166992, "global_step": 468544, "epoch": 5645} {"train_loss": -27.484893798828125, "global_step": 468545, "epoch": 5645} {"train_loss": -26.8054256439209, "global_step": 468546, "epoch": 5645} {"train_loss": -27.417036056518555, "global_step": 468547, "epoch": 5645} {"train_loss": -26.8974666595459, "global_step": 468548, "epoch": 5645} {"train_loss": -26.880252838134766, "global_step": 468549, "epoch": 5645} {"train_loss": -27.19001579284668, "global_step": 468550, "epoch": 5645} {"train_loss": -27.348876953125, "global_step": 468551, "epoch": 5645} {"train_loss": -26.877552032470703, "global_step": 468552, "epoch": 5645} {"train_loss": -26.92498779296875, "global_step": 468553, "epoch": 5645} {"train_loss": -27.22952651977539, "global_step": 468554, "epoch": 5645} {"train_loss": -27.18202781677246, "global_step": 468555, "epoch": 5645} {"train_loss": -27.103254318237305, "global_step": 468556, "epoch": 5645} {"train_loss": -27.099103927612305, "global_step": 468557, "epoch": 5645} {"train_loss": -27.482572555541992, "global_step": 468558, "epoch": 5645} {"train_loss": -26.732776641845703, "global_step": 468559, "epoch": 5645} {"train_loss": -27.216333389282227, "global_step": 468560, "epoch": 5645} {"train_loss": -27.28901481628418, "global_step": 468561, "epoch": 5645} {"train_loss": -26.975406646728516, "global_step": 468562, "epoch": 5645} {"train_loss": -26.920486450195312, "global_step": 468563, "epoch": 5645} {"train_loss": -27.31597328186035, "global_step": 468564, "epoch": 5645} {"train_loss": -27.22620964050293, "global_step": 468565, "epoch": 5645} {"train_loss": -26.978986740112305, "global_step": 468566, "epoch": 5645} {"train_loss": -26.81467628479004, "global_step": 468567, "epoch": 5645} {"train_loss": -27.125946044921875, "global_step": 468568, "epoch": 5645} {"train_loss": -27.201562881469727, "global_step": 468569, "epoch": 5645} {"train_loss": -27.1801815032959, "global_step": 468570, "epoch": 5645} {"train_loss": -27.520679473876953, "global_step": 468571, "epoch": 5645} {"train_loss": -26.998779296875, "global_step": 468572, "epoch": 5645} {"train_loss": -27.06696128845215, "global_step": 468573, "epoch": 5645} {"train_loss": -27.173120498657227, "global_step": 468574, "epoch": 5645} {"train_loss": -27.1535587310791, "global_step": 468575, "epoch": 5645} {"train_loss": -27.30183982849121, "global_step": 468576, "epoch": 5645} {"train_loss": -27.434736251831055, "global_step": 468577, "epoch": 5645} {"train_loss": -27.551654815673828, "global_step": 468578, "epoch": 5645} {"train_loss": -27.398527145385742, "global_step": 468579, "epoch": 5645} {"train_loss": -27.52496910095215, "global_step": 468580, "epoch": 5645} {"train_loss": -27.63486099243164, "global_step": 468581, "epoch": 5645} {"train_loss": -27.46945571899414, "global_step": 468582, "epoch": 5645} {"train_loss": -27.35112953186035, "global_step": 468583, "epoch": 5645} {"train_loss": -26.919981002807617, "global_step": 468584, "epoch": 5645} {"train_loss": -27.184309005737305, "global_step": 468585, "epoch": 5645} {"train_loss": -27.5327091217041, "global_step": 468586, "epoch": 5645} {"train_loss": -27.452219009399414, "global_step": 468587, "epoch": 5645} {"train_loss": -27.902099609375, "global_step": 468588, "epoch": 5645} {"train_loss": -27.159961700439453, "global_step": 468589, "epoch": 5645} {"train_loss": -27.2139949798584, "global_step": 468590, "epoch": 5645} {"train_loss": -27.22654151916504, "global_step": 468591, "epoch": 5645} {"train_loss": -27.117755889892578, "global_step": 468592, "epoch": 5645} {"train_loss": -26.908843994140625, "global_step": 468593, "epoch": 5645} {"train_loss": -27.215063095092773, "global_step": 468594, "epoch": 5645} {"train_loss": -27.80299186706543, "global_step": 468595, "epoch": 5645} {"train_loss": -26.907346725463867, "global_step": 468596, "epoch": 5645} {"train_loss": -26.7322940826416, "global_step": 468597, "epoch": 5645} {"train_loss": -27.134952545166016, "global_step": 468598, "epoch": 5645} {"train_loss": -27.176471710205078, "global_step": 468599, "epoch": 5645} {"train_loss": -26.99665641784668, "global_step": 468600, "epoch": 5645} {"train_loss": -26.8018856048584, "global_step": 468601, "epoch": 5645} {"train_loss": -26.57172203063965, "global_step": 468602, "epoch": 5645} {"train_loss": -27.092496871948242, "global_step": 468603, "epoch": 5645} {"train_loss": -27.25282859802246, "global_step": 468604, "epoch": 5645} {"train_loss": -27.210819244384766, "global_step": 468605, "epoch": 5645} {"train_loss": -27.557714462280273, "global_step": 468606, "epoch": 5645} {"train_loss": -27.090757369995117, "global_step": 468607, "epoch": 5645} {"train_loss": -26.756744384765625, "global_step": 468608, "epoch": 5645} {"train_loss": -27.26289176940918, "global_step": 468609, "epoch": 5645} {"train_loss": -27.3780574798584, "global_step": 468610, "epoch": 5645} {"train_loss": -27.00433921813965, "global_step": 468611, "epoch": 5645} {"train_loss": -27.232608795166016, "global_step": 468612, "epoch": 5645} {"train_loss": -27.323352813720703, "global_step": 468613, "epoch": 5645} {"train_loss": -27.0566349029541, "global_step": 468614, "epoch": 5645} {"train_loss": -27.197973251342773, "global_step": 468615, "epoch": 5645} {"train_loss": -27.25324058532715, "global_step": 468616, "epoch": 5645} {"train_loss": -27.17360508011048, "global_step": 468617, "epoch": 5645, "val_loss": 6601680.0} {"train_loss": -25.0275821685791, "global_step": 468618, "epoch": 5646} {"train_loss": -25.670408248901367, "global_step": 468619, "epoch": 5646} {"train_loss": -25.54657745361328, "global_step": 468620, "epoch": 5646} {"train_loss": -25.878080368041992, "global_step": 468621, "epoch": 5646} {"train_loss": -25.761993408203125, "global_step": 468622, "epoch": 5646} {"train_loss": -26.37611198425293, "global_step": 468623, "epoch": 5646} {"train_loss": -25.892841339111328, "global_step": 468624, "epoch": 5646} {"train_loss": -26.036035537719727, "global_step": 468625, "epoch": 5646} {"train_loss": -25.995702743530273, "global_step": 468626, "epoch": 5646} {"train_loss": -26.350339889526367, "global_step": 468627, "epoch": 5646} {"train_loss": -26.3394775390625, "global_step": 468628, "epoch": 5646} {"train_loss": -26.489288330078125, "global_step": 468629, "epoch": 5646} {"train_loss": -26.320478439331055, "global_step": 468630, "epoch": 5646} {"train_loss": -26.3524227142334, "global_step": 468631, "epoch": 5646} {"train_loss": -26.676685333251953, "global_step": 468632, "epoch": 5646} {"train_loss": -26.6561336517334, "global_step": 468633, "epoch": 5646} {"train_loss": -26.479684829711914, "global_step": 468634, "epoch": 5646} {"train_loss": -26.612655639648438, "global_step": 468635, "epoch": 5646} {"train_loss": -26.972436904907227, "global_step": 468636, "epoch": 5646} {"train_loss": -26.973295211791992, "global_step": 468637, "epoch": 5646} {"train_loss": -26.58197021484375, "global_step": 468638, "epoch": 5646} {"train_loss": -26.54513931274414, "global_step": 468639, "epoch": 5646} {"train_loss": -26.719446182250977, "global_step": 468640, "epoch": 5646} {"train_loss": -26.671558380126953, "global_step": 468641, "epoch": 5646} {"train_loss": -26.5440616607666, "global_step": 468642, "epoch": 5646} {"train_loss": -26.473676681518555, "global_step": 468643, "epoch": 5646} {"train_loss": -27.03372573852539, "global_step": 468644, "epoch": 5646} {"train_loss": -26.619434356689453, "global_step": 468645, "epoch": 5646} {"train_loss": -26.738727569580078, "global_step": 468646, "epoch": 5646} {"train_loss": -26.816925048828125, "global_step": 468647, "epoch": 5646} {"train_loss": -26.40769386291504, "global_step": 468648, "epoch": 5646} {"train_loss": -26.808124542236328, "global_step": 468649, "epoch": 5646} {"train_loss": -26.883380889892578, "global_step": 468650, "epoch": 5646} {"train_loss": -26.89469337463379, "global_step": 468651, "epoch": 5646} {"train_loss": -27.381763458251953, "global_step": 468652, "epoch": 5646} {"train_loss": -27.122419357299805, "global_step": 468653, "epoch": 5646} {"train_loss": -27.27975845336914, "global_step": 468654, "epoch": 5646} {"train_loss": -26.911890029907227, "global_step": 468655, "epoch": 5646} {"train_loss": -27.16078758239746, "global_step": 468656, "epoch": 5646} {"train_loss": -27.22138023376465, "global_step": 468657, "epoch": 5646} {"train_loss": -27.226776123046875, "global_step": 468658, "epoch": 5646} {"train_loss": -27.06990623474121, "global_step": 468659, "epoch": 5646} {"train_loss": -27.3587646484375, "global_step": 468660, "epoch": 5646} {"train_loss": -27.128284454345703, "global_step": 468661, "epoch": 5646} {"train_loss": -27.323841094970703, "global_step": 468662, "epoch": 5646} {"train_loss": -27.045988082885742, "global_step": 468663, "epoch": 5646} {"train_loss": -26.99940299987793, "global_step": 468664, "epoch": 5646} {"train_loss": -27.04804039001465, "global_step": 468665, "epoch": 5646} {"train_loss": -27.148054122924805, "global_step": 468666, "epoch": 5646} {"train_loss": -27.404264450073242, "global_step": 468667, "epoch": 5646} {"train_loss": -27.571533203125, "global_step": 468668, "epoch": 5646} {"train_loss": -27.342008590698242, "global_step": 468669, "epoch": 5646} {"train_loss": -26.756567001342773, "global_step": 468670, "epoch": 5646} {"train_loss": -27.015722274780273, "global_step": 468671, "epoch": 5646} {"train_loss": -27.391632080078125, "global_step": 468672, "epoch": 5646} {"train_loss": -27.080280303955078, "global_step": 468673, "epoch": 5646} {"train_loss": -26.88237953186035, "global_step": 468674, "epoch": 5646} {"train_loss": -27.316701889038086, "global_step": 468675, "epoch": 5646} {"train_loss": -27.118925094604492, "global_step": 468676, "epoch": 5646} {"train_loss": -27.14601707458496, "global_step": 468677, "epoch": 5646} {"train_loss": -27.227323532104492, "global_step": 468678, "epoch": 5646} {"train_loss": -27.424762725830078, "global_step": 468679, "epoch": 5646} {"train_loss": -27.102466583251953, "global_step": 468680, "epoch": 5646} {"train_loss": -27.334339141845703, "global_step": 468681, "epoch": 5646} {"train_loss": -27.40229606628418, "global_step": 468682, "epoch": 5646} {"train_loss": -27.468656539916992, "global_step": 468683, "epoch": 5646} {"train_loss": -27.384519577026367, "global_step": 468684, "epoch": 5646} {"train_loss": -27.44635009765625, "global_step": 468685, "epoch": 5646} {"train_loss": -27.161264419555664, "global_step": 468686, "epoch": 5646} {"train_loss": -27.613895416259766, "global_step": 468687, "epoch": 5646} {"train_loss": -27.4121150970459, "global_step": 468688, "epoch": 5646} {"train_loss": -27.443286895751953, "global_step": 468689, "epoch": 5646} {"train_loss": -27.311676025390625, "global_step": 468690, "epoch": 5646} {"train_loss": -27.407733917236328, "global_step": 468691, "epoch": 5646} {"train_loss": -27.55646324157715, "global_step": 468692, "epoch": 5646} {"train_loss": -27.413537979125977, "global_step": 468693, "epoch": 5646} {"train_loss": -27.046283721923828, "global_step": 468694, "epoch": 5646} {"train_loss": -27.25946044921875, "global_step": 468695, "epoch": 5646} {"train_loss": -27.06983757019043, "global_step": 468696, "epoch": 5646} {"train_loss": -27.08597755432129, "global_step": 468697, "epoch": 5646} {"train_loss": -27.066986083984375, "global_step": 468698, "epoch": 5646} {"train_loss": -27.0538272857666, "global_step": 468699, "epoch": 5646} {"train_loss": -26.89559566543763, "global_step": 468700, "epoch": 5646, "val_loss": 6814640.0} {"train_loss": -26.375823974609375, "global_step": 468701, "epoch": 5647} {"train_loss": -26.8874454498291, "global_step": 468702, "epoch": 5647} {"train_loss": -26.426807403564453, "global_step": 468703, "epoch": 5647} {"train_loss": -26.42854118347168, "global_step": 468704, "epoch": 5647} {"train_loss": -26.26584243774414, "global_step": 468705, "epoch": 5647} {"train_loss": -26.91425132751465, "global_step": 468706, "epoch": 5647} {"train_loss": -26.741413116455078, "global_step": 468707, "epoch": 5647} {"train_loss": -26.270965576171875, "global_step": 468708, "epoch": 5647} {"train_loss": -26.537433624267578, "global_step": 468709, "epoch": 5647} {"train_loss": -26.684377670288086, "global_step": 468710, "epoch": 5647} {"train_loss": -27.346664428710938, "global_step": 468711, "epoch": 5647} {"train_loss": -26.444549560546875, "global_step": 468712, "epoch": 5647} {"train_loss": -27.02887535095215, "global_step": 468713, "epoch": 5647} {"train_loss": -26.726327896118164, "global_step": 468714, "epoch": 5647} {"train_loss": -27.033172607421875, "global_step": 468715, "epoch": 5647} {"train_loss": -26.794464111328125, "global_step": 468716, "epoch": 5647} {"train_loss": -26.7103271484375, "global_step": 468717, "epoch": 5647} {"train_loss": -26.948226928710938, "global_step": 468718, "epoch": 5647} {"train_loss": -27.045398712158203, "global_step": 468719, "epoch": 5647} {"train_loss": -26.974699020385742, "global_step": 468720, "epoch": 5647} {"train_loss": -27.038679122924805, "global_step": 468721, "epoch": 5647} {"train_loss": -27.2244873046875, "global_step": 468722, "epoch": 5647} {"train_loss": -27.398386001586914, "global_step": 468723, "epoch": 5647} {"train_loss": -27.015216827392578, "global_step": 468724, "epoch": 5647} {"train_loss": -27.1185245513916, "global_step": 468725, "epoch": 5647} {"train_loss": -27.02228355407715, "global_step": 468726, "epoch": 5647} {"train_loss": -27.512500762939453, "global_step": 468727, "epoch": 5647} {"train_loss": -27.27023696899414, "global_step": 468728, "epoch": 5647} {"train_loss": -27.0047607421875, "global_step": 468729, "epoch": 5647} {"train_loss": -27.40458106994629, "global_step": 468730, "epoch": 5647} {"train_loss": -27.119977951049805, "global_step": 468731, "epoch": 5647} {"train_loss": -27.042722702026367, "global_step": 468732, "epoch": 5647} {"train_loss": -26.914936065673828, "global_step": 468733, "epoch": 5647} {"train_loss": -27.552316665649414, "global_step": 468734, "epoch": 5647} {"train_loss": -27.576108932495117, "global_step": 468735, "epoch": 5647} {"train_loss": -27.180023193359375, "global_step": 468736, "epoch": 5647} {"train_loss": -27.536823272705078, "global_step": 468737, "epoch": 5647} {"train_loss": -27.248144149780273, "global_step": 468738, "epoch": 5647} {"train_loss": -26.6180362701416, "global_step": 468739, "epoch": 5647} {"train_loss": -27.27361488342285, "global_step": 468740, "epoch": 5647} {"train_loss": -27.421218872070312, "global_step": 468741, "epoch": 5647} {"train_loss": -27.30856704711914, "global_step": 468742, "epoch": 5647} {"train_loss": -27.045948028564453, "global_step": 468743, "epoch": 5647} {"train_loss": -27.4655818939209, "global_step": 468744, "epoch": 5647} {"train_loss": -26.945880889892578, "global_step": 468745, "epoch": 5647} {"train_loss": -27.234649658203125, "global_step": 468746, "epoch": 5647} {"train_loss": -27.49186134338379, "global_step": 468747, "epoch": 5647} {"train_loss": -27.31787109375, "global_step": 468748, "epoch": 5647} {"train_loss": -27.22281837463379, "global_step": 468749, "epoch": 5647} {"train_loss": -27.202600479125977, "global_step": 468750, "epoch": 5647} {"train_loss": -27.266132354736328, "global_step": 468751, "epoch": 5647} {"train_loss": -27.040185928344727, "global_step": 468752, "epoch": 5647} {"train_loss": -26.85916519165039, "global_step": 468753, "epoch": 5647} {"train_loss": -26.93427085876465, "global_step": 468754, "epoch": 5647} {"train_loss": -26.79781150817871, "global_step": 468755, "epoch": 5647} {"train_loss": -27.543243408203125, "global_step": 468756, "epoch": 5647} {"train_loss": -27.530658721923828, "global_step": 468757, "epoch": 5647} {"train_loss": -27.202001571655273, "global_step": 468758, "epoch": 5647} {"train_loss": -27.109729766845703, "global_step": 468759, "epoch": 5647} {"train_loss": -27.24820899963379, "global_step": 468760, "epoch": 5647} {"train_loss": -27.611286163330078, "global_step": 468761, "epoch": 5647} {"train_loss": -27.30079460144043, "global_step": 468762, "epoch": 5647} {"train_loss": -26.85694694519043, "global_step": 468763, "epoch": 5647} {"train_loss": -27.270124435424805, "global_step": 468764, "epoch": 5647} {"train_loss": -27.31430435180664, "global_step": 468765, "epoch": 5647} {"train_loss": -27.351987838745117, "global_step": 468766, "epoch": 5647} {"train_loss": -26.932775497436523, "global_step": 468767, "epoch": 5647} {"train_loss": -27.2198486328125, "global_step": 468768, "epoch": 5647} {"train_loss": -26.826004028320312, "global_step": 468769, "epoch": 5647} {"train_loss": -27.504438400268555, "global_step": 468770, "epoch": 5647} {"train_loss": -26.987457275390625, "global_step": 468771, "epoch": 5647} {"train_loss": -27.237104415893555, "global_step": 468772, "epoch": 5647} {"train_loss": -27.267383575439453, "global_step": 468773, "epoch": 5647} {"train_loss": -27.333459854125977, "global_step": 468774, "epoch": 5647} {"train_loss": -27.028213500976562, "global_step": 468775, "epoch": 5647} {"train_loss": -27.160022735595703, "global_step": 468776, "epoch": 5647} {"train_loss": -27.462656021118164, "global_step": 468777, "epoch": 5647} {"train_loss": -26.922866821289062, "global_step": 468778, "epoch": 5647} {"train_loss": -26.778701782226562, "global_step": 468779, "epoch": 5647} {"train_loss": -27.09602165222168, "global_step": 468780, "epoch": 5647} {"train_loss": -26.591293334960938, "global_step": 468781, "epoch": 5647} {"train_loss": -26.752288818359375, "global_step": 468782, "epoch": 5647} {"train_loss": -27.07873868367758, "global_step": 468783, "epoch": 5647, "val_loss": 6743718.0} {"train_loss": -26.255857467651367, "global_step": 468784, "epoch": 5648} {"train_loss": -25.70429801940918, "global_step": 468785, "epoch": 5648} {"train_loss": -26.0241756439209, "global_step": 468786, "epoch": 5648} {"train_loss": -26.3682804107666, "global_step": 468787, "epoch": 5648} {"train_loss": -26.47905921936035, "global_step": 468788, "epoch": 5648} {"train_loss": -26.506208419799805, "global_step": 468789, "epoch": 5648} {"train_loss": -26.482206344604492, "global_step": 468790, "epoch": 5648} {"train_loss": -26.036407470703125, "global_step": 468791, "epoch": 5648} {"train_loss": -26.574604034423828, "global_step": 468792, "epoch": 5648} {"train_loss": -26.45546531677246, "global_step": 468793, "epoch": 5648} {"train_loss": -26.6654052734375, "global_step": 468794, "epoch": 5648} {"train_loss": -26.8264217376709, "global_step": 468795, "epoch": 5648} {"train_loss": -26.32477378845215, "global_step": 468796, "epoch": 5648} {"train_loss": -26.722936630249023, "global_step": 468797, "epoch": 5648} {"train_loss": -26.358600616455078, "global_step": 468798, "epoch": 5648} {"train_loss": -26.58555030822754, "global_step": 468799, "epoch": 5648} {"train_loss": -27.082990646362305, "global_step": 468800, "epoch": 5648} {"train_loss": -26.923627853393555, "global_step": 468801, "epoch": 5648} {"train_loss": -26.82499122619629, "global_step": 468802, "epoch": 5648} {"train_loss": -27.094654083251953, "global_step": 468803, "epoch": 5648} {"train_loss": -27.116901397705078, "global_step": 468804, "epoch": 5648} {"train_loss": -27.263269424438477, "global_step": 468805, "epoch": 5648} {"train_loss": -27.22768211364746, "global_step": 468806, "epoch": 5648} {"train_loss": -26.9432430267334, "global_step": 468807, "epoch": 5648} {"train_loss": -26.907745361328125, "global_step": 468808, "epoch": 5648} {"train_loss": -27.030323028564453, "global_step": 468809, "epoch": 5648} {"train_loss": -27.225019454956055, "global_step": 468810, "epoch": 5648} {"train_loss": -27.10768699645996, "global_step": 468811, "epoch": 5648} {"train_loss": -27.481271743774414, "global_step": 468812, "epoch": 5648} {"train_loss": -27.33198356628418, "global_step": 468813, "epoch": 5648} {"train_loss": -27.695484161376953, "global_step": 468814, "epoch": 5648} {"train_loss": -27.102771759033203, "global_step": 468815, "epoch": 5648} {"train_loss": -27.407424926757812, "global_step": 468816, "epoch": 5648} {"train_loss": -26.943500518798828, "global_step": 468817, "epoch": 5648} {"train_loss": -27.217853546142578, "global_step": 468818, "epoch": 5648} {"train_loss": -27.418760299682617, "global_step": 468819, "epoch": 5648} {"train_loss": -27.395734786987305, "global_step": 468820, "epoch": 5648} {"train_loss": -27.599903106689453, "global_step": 468821, "epoch": 5648} {"train_loss": -27.336990356445312, "global_step": 468822, "epoch": 5648} {"train_loss": -27.5429744720459, "global_step": 468823, "epoch": 5648} {"train_loss": -27.06165885925293, "global_step": 468824, "epoch": 5648} {"train_loss": -27.337970733642578, "global_step": 468825, "epoch": 5648} {"train_loss": -27.416706085205078, "global_step": 468826, "epoch": 5648} {"train_loss": -27.20838737487793, "global_step": 468827, "epoch": 5648} {"train_loss": -27.147815704345703, "global_step": 468828, "epoch": 5648} {"train_loss": -27.484146118164062, "global_step": 468829, "epoch": 5648} {"train_loss": -26.97412109375, "global_step": 468830, "epoch": 5648} {"train_loss": -27.215200424194336, "global_step": 468831, "epoch": 5648} {"train_loss": -26.962299346923828, "global_step": 468832, "epoch": 5648} {"train_loss": -27.225357055664062, "global_step": 468833, "epoch": 5648} {"train_loss": -27.083404541015625, "global_step": 468834, "epoch": 5648} {"train_loss": -27.2073917388916, "global_step": 468835, "epoch": 5648} {"train_loss": -27.327856063842773, "global_step": 468836, "epoch": 5648} {"train_loss": -27.192358016967773, "global_step": 468837, "epoch": 5648} {"train_loss": -27.042236328125, "global_step": 468838, "epoch": 5648} {"train_loss": -26.898666381835938, "global_step": 468839, "epoch": 5648} {"train_loss": -27.26936912536621, "global_step": 468840, "epoch": 5648} {"train_loss": -27.27210807800293, "global_step": 468841, "epoch": 5648} {"train_loss": -27.28633689880371, "global_step": 468842, "epoch": 5648} {"train_loss": -27.02008056640625, "global_step": 468843, "epoch": 5648} {"train_loss": -27.128925323486328, "global_step": 468844, "epoch": 5648} {"train_loss": -26.967878341674805, "global_step": 468845, "epoch": 5648} {"train_loss": -26.893512725830078, "global_step": 468846, "epoch": 5648} {"train_loss": -27.517724990844727, "global_step": 468847, "epoch": 5648} {"train_loss": -26.918201446533203, "global_step": 468848, "epoch": 5648} {"train_loss": -27.112369537353516, "global_step": 468849, "epoch": 5648} {"train_loss": -27.477954864501953, "global_step": 468850, "epoch": 5648} {"train_loss": -26.94415283203125, "global_step": 468851, "epoch": 5648} {"train_loss": -27.06925392150879, "global_step": 468852, "epoch": 5648} {"train_loss": -27.2353572845459, "global_step": 468853, "epoch": 5648} {"train_loss": -27.53621482849121, "global_step": 468854, "epoch": 5648} {"train_loss": -26.909921646118164, "global_step": 468855, "epoch": 5648} {"train_loss": -26.708948135375977, "global_step": 468856, "epoch": 5648} {"train_loss": -26.56342887878418, "global_step": 468857, "epoch": 5648} {"train_loss": -26.87290382385254, "global_step": 468858, "epoch": 5648} {"train_loss": -26.80157470703125, "global_step": 468859, "epoch": 5648} {"train_loss": -27.448957443237305, "global_step": 468860, "epoch": 5648} {"train_loss": -26.370941162109375, "global_step": 468861, "epoch": 5648} {"train_loss": -26.221343994140625, "global_step": 468862, "epoch": 5648} {"train_loss": -26.54627799987793, "global_step": 468863, "epoch": 5648} {"train_loss": -27.17060661315918, "global_step": 468864, "epoch": 5648} {"train_loss": -26.98195457458496, "global_step": 468865, "epoch": 5648} {"train_loss": -26.975390836416956, "global_step": 468866, "epoch": 5648, "val_loss": 6722872.5} {"train_loss": -26.7493839263916, "global_step": 468867, "epoch": 5649} {"train_loss": -26.370946884155273, "global_step": 468868, "epoch": 5649} {"train_loss": -27.083463668823242, "global_step": 468869, "epoch": 5649} {"train_loss": -26.272663116455078, "global_step": 468870, "epoch": 5649} {"train_loss": -26.81143569946289, "global_step": 468871, "epoch": 5649} {"train_loss": -26.068164825439453, "global_step": 468872, "epoch": 5649} {"train_loss": -26.984771728515625, "global_step": 468873, "epoch": 5649} {"train_loss": -26.7983455657959, "global_step": 468874, "epoch": 5649} {"train_loss": -26.69672966003418, "global_step": 468875, "epoch": 5649} {"train_loss": -26.6663875579834, "global_step": 468876, "epoch": 5649} {"train_loss": -27.042287826538086, "global_step": 468877, "epoch": 5649} {"train_loss": -26.85808753967285, "global_step": 468878, "epoch": 5649} {"train_loss": -26.921300888061523, "global_step": 468879, "epoch": 5649} {"train_loss": -26.674549102783203, "global_step": 468880, "epoch": 5649} {"train_loss": -26.501651763916016, "global_step": 468881, "epoch": 5649} {"train_loss": -26.896081924438477, "global_step": 468882, "epoch": 5649} {"train_loss": -26.850194931030273, "global_step": 468883, "epoch": 5649} {"train_loss": -26.9672794342041, "global_step": 468884, "epoch": 5649} {"train_loss": -26.9844970703125, "global_step": 468885, "epoch": 5649} {"train_loss": -26.954181671142578, "global_step": 468886, "epoch": 5649} {"train_loss": -27.041833877563477, "global_step": 468887, "epoch": 5649} {"train_loss": -26.847692489624023, "global_step": 468888, "epoch": 5649} {"train_loss": -27.1229248046875, "global_step": 468889, "epoch": 5649} {"train_loss": -27.021421432495117, "global_step": 468890, "epoch": 5649} {"train_loss": -26.990497589111328, "global_step": 468891, "epoch": 5649} {"train_loss": -27.210407257080078, "global_step": 468892, "epoch": 5649} {"train_loss": -27.056360244750977, "global_step": 468893, "epoch": 5649} {"train_loss": -27.424652099609375, "global_step": 468894, "epoch": 5649} {"train_loss": -27.331867218017578, "global_step": 468895, "epoch": 5649} {"train_loss": -26.697650909423828, "global_step": 468896, "epoch": 5649} {"train_loss": -27.143014907836914, "global_step": 468897, "epoch": 5649} {"train_loss": -26.9649715423584, "global_step": 468898, "epoch": 5649} {"train_loss": -26.751911163330078, "global_step": 468899, "epoch": 5649} {"train_loss": -27.275205612182617, "global_step": 468900, "epoch": 5649} {"train_loss": -26.83314323425293, "global_step": 468901, "epoch": 5649} {"train_loss": -27.279693603515625, "global_step": 468902, "epoch": 5649} {"train_loss": -26.793292999267578, "global_step": 468903, "epoch": 5649} {"train_loss": -27.10068702697754, "global_step": 468904, "epoch": 5649} {"train_loss": -27.091909408569336, "global_step": 468905, "epoch": 5649} {"train_loss": -26.95670509338379, "global_step": 468906, "epoch": 5649} {"train_loss": -26.557641983032227, "global_step": 468907, "epoch": 5649} {"train_loss": -26.654315948486328, "global_step": 468908, "epoch": 5649} {"train_loss": -26.873783111572266, "global_step": 468909, "epoch": 5649} {"train_loss": -26.80914306640625, "global_step": 468910, "epoch": 5649} {"train_loss": -27.2525577545166, "global_step": 468911, "epoch": 5649} {"train_loss": -27.05367088317871, "global_step": 468912, "epoch": 5649} {"train_loss": -27.4752140045166, "global_step": 468913, "epoch": 5649} {"train_loss": -26.850194931030273, "global_step": 468914, "epoch": 5649} {"train_loss": -27.21213150024414, "global_step": 468915, "epoch": 5649} {"train_loss": -26.991535186767578, "global_step": 468916, "epoch": 5649} {"train_loss": -27.27728843688965, "global_step": 468917, "epoch": 5649} {"train_loss": -26.741912841796875, "global_step": 468918, "epoch": 5649} {"train_loss": -27.431570053100586, "global_step": 468919, "epoch": 5649} {"train_loss": -26.766998291015625, "global_step": 468920, "epoch": 5649} {"train_loss": -27.409503936767578, "global_step": 468921, "epoch": 5649} {"train_loss": -27.15813636779785, "global_step": 468922, "epoch": 5649} {"train_loss": -27.50678062438965, "global_step": 468923, "epoch": 5649} {"train_loss": -26.8330020904541, "global_step": 468924, "epoch": 5649} {"train_loss": -27.127866744995117, "global_step": 468925, "epoch": 5649} {"train_loss": -26.962787628173828, "global_step": 468926, "epoch": 5649} {"train_loss": -26.89691162109375, "global_step": 468927, "epoch": 5649} {"train_loss": -27.35047721862793, "global_step": 468928, "epoch": 5649} {"train_loss": -27.158727645874023, "global_step": 468929, "epoch": 5649} {"train_loss": -27.191205978393555, "global_step": 468930, "epoch": 5649} {"train_loss": -27.285558700561523, "global_step": 468931, "epoch": 5649} {"train_loss": -27.58681297302246, "global_step": 468932, "epoch": 5649} {"train_loss": -27.147735595703125, "global_step": 468933, "epoch": 5649} {"train_loss": -27.023324966430664, "global_step": 468934, "epoch": 5649} {"train_loss": -27.381128311157227, "global_step": 468935, "epoch": 5649} {"train_loss": -27.12451171875, "global_step": 468936, "epoch": 5649} {"train_loss": -27.118864059448242, "global_step": 468937, "epoch": 5649} {"train_loss": -27.447790145874023, "global_step": 468938, "epoch": 5649} {"train_loss": -27.056814193725586, "global_step": 468939, "epoch": 5649} {"train_loss": -27.658523559570312, "global_step": 468940, "epoch": 5649} {"train_loss": -27.355548858642578, "global_step": 468941, "epoch": 5649} {"train_loss": -27.3818359375, "global_step": 468942, "epoch": 5649} {"train_loss": -27.336963653564453, "global_step": 468943, "epoch": 5649} {"train_loss": -27.47736930847168, "global_step": 468944, "epoch": 5649} {"train_loss": -27.358495712280273, "global_step": 468945, "epoch": 5649} {"train_loss": -27.40717124938965, "global_step": 468946, "epoch": 5649} {"train_loss": -27.431379318237305, "global_step": 468947, "epoch": 5649} {"train_loss": -27.354013442993164, "global_step": 468948, "epoch": 5649} {"train_loss": -27.05441888556423, "global_step": 468949, "epoch": 5649, "val_loss": 6637676.0} {"train_loss": -27.402877807617188, "global_step": 468950, "epoch": 5650} {"train_loss": -27.510583877563477, "global_step": 468951, "epoch": 5650} {"train_loss": -26.855091094970703, "global_step": 468952, "epoch": 5650} {"train_loss": -27.162261962890625, "global_step": 468953, "epoch": 5650} {"train_loss": -26.539758682250977, "global_step": 468954, "epoch": 5650} {"train_loss": -26.6500301361084, "global_step": 468955, "epoch": 5650} {"train_loss": -26.766803741455078, "global_step": 468956, "epoch": 5650} {"train_loss": -27.078216552734375, "global_step": 468957, "epoch": 5650} {"train_loss": -27.094114303588867, "global_step": 468958, "epoch": 5650} {"train_loss": -27.095001220703125, "global_step": 468959, "epoch": 5650} {"train_loss": -26.7866268157959, "global_step": 468960, "epoch": 5650} {"train_loss": -26.40949058532715, "global_step": 468961, "epoch": 5650} {"train_loss": -27.121732711791992, "global_step": 468962, "epoch": 5650} {"train_loss": -27.712255477905273, "global_step": 468963, "epoch": 5650} {"train_loss": -27.42329216003418, "global_step": 468964, "epoch": 5650} {"train_loss": -27.282550811767578, "global_step": 468965, "epoch": 5650} {"train_loss": -27.190027236938477, "global_step": 468966, "epoch": 5650} {"train_loss": -27.0262393951416, "global_step": 468967, "epoch": 5650} {"train_loss": -27.226877212524414, "global_step": 468968, "epoch": 5650} {"train_loss": -27.36004638671875, "global_step": 468969, "epoch": 5650} {"train_loss": -26.938241958618164, "global_step": 468970, "epoch": 5650} {"train_loss": -26.927412033081055, "global_step": 468971, "epoch": 5650} {"train_loss": -27.44769287109375, "global_step": 468972, "epoch": 5650} {"train_loss": -27.506269454956055, "global_step": 468973, "epoch": 5650} {"train_loss": -27.366134643554688, "global_step": 468974, "epoch": 5650} {"train_loss": -26.929922103881836, "global_step": 468975, "epoch": 5650} {"train_loss": -27.362390518188477, "global_step": 468976, "epoch": 5650} {"train_loss": -27.561309814453125, "global_step": 468977, "epoch": 5650} {"train_loss": -27.356678009033203, "global_step": 468978, "epoch": 5650} {"train_loss": -27.044275283813477, "global_step": 468979, "epoch": 5650} {"train_loss": -27.005029678344727, "global_step": 468980, "epoch": 5650} {"train_loss": -27.13905143737793, "global_step": 468981, "epoch": 5650} {"train_loss": -26.992523193359375, "global_step": 468982, "epoch": 5650} {"train_loss": -27.428876876831055, "global_step": 468983, "epoch": 5650} {"train_loss": -27.166034698486328, "global_step": 468984, "epoch": 5650} {"train_loss": -27.38873863220215, "global_step": 468985, "epoch": 5650} {"train_loss": -27.209253311157227, "global_step": 468986, "epoch": 5650} {"train_loss": -27.510534286499023, "global_step": 468987, "epoch": 5650} {"train_loss": -27.295154571533203, "global_step": 468988, "epoch": 5650} {"train_loss": -26.937376022338867, "global_step": 468989, "epoch": 5650} {"train_loss": -27.153539657592773, "global_step": 468990, "epoch": 5650} {"train_loss": -27.545745849609375, "global_step": 468991, "epoch": 5650} {"train_loss": -27.680179595947266, "global_step": 468992, "epoch": 5650} {"train_loss": -26.603891372680664, "global_step": 468993, "epoch": 5650} {"train_loss": -27.430465698242188, "global_step": 468994, "epoch": 5650} {"train_loss": -27.293256759643555, "global_step": 468995, "epoch": 5650} {"train_loss": -26.811933517456055, "global_step": 468996, "epoch": 5650} {"train_loss": -27.018329620361328, "global_step": 468997, "epoch": 5650} {"train_loss": -27.143346786499023, "global_step": 468998, "epoch": 5650} {"train_loss": -27.114713668823242, "global_step": 468999, "epoch": 5650} {"train_loss": -27.488067626953125, "global_step": 469000, "epoch": 5650} {"train_loss": -27.087228775024414, "global_step": 469001, "epoch": 5650} {"train_loss": -27.097705841064453, "global_step": 469002, "epoch": 5650} {"train_loss": -27.136627197265625, "global_step": 469003, "epoch": 5650} {"train_loss": -27.0281925201416, "global_step": 469004, "epoch": 5650} {"train_loss": -27.489484786987305, "global_step": 469005, "epoch": 5650} {"train_loss": -27.241958618164062, "global_step": 469006, "epoch": 5650} {"train_loss": -27.372028350830078, "global_step": 469007, "epoch": 5650} {"train_loss": -27.318286895751953, "global_step": 469008, "epoch": 5650} {"train_loss": -27.00489616394043, "global_step": 469009, "epoch": 5650} {"train_loss": -27.348581314086914, "global_step": 469010, "epoch": 5650} {"train_loss": -27.184045791625977, "global_step": 469011, "epoch": 5650} {"train_loss": -27.32586669921875, "global_step": 469012, "epoch": 5650} {"train_loss": -27.129247665405273, "global_step": 469013, "epoch": 5650} {"train_loss": -27.385440826416016, "global_step": 469014, "epoch": 5650} {"train_loss": -27.280790328979492, "global_step": 469015, "epoch": 5650} {"train_loss": -27.007858276367188, "global_step": 469016, "epoch": 5650} {"train_loss": -27.06922721862793, "global_step": 469017, "epoch": 5650} {"train_loss": -27.311145782470703, "global_step": 469018, "epoch": 5650} {"train_loss": -27.36859703063965, "global_step": 469019, "epoch": 5650} {"train_loss": -27.392980575561523, "global_step": 469020, "epoch": 5650} {"train_loss": -27.370288848876953, "global_step": 469021, "epoch": 5650} {"train_loss": -27.322961807250977, "global_step": 469022, "epoch": 5650} {"train_loss": -26.95863151550293, "global_step": 469023, "epoch": 5650} {"train_loss": -27.05130958557129, "global_step": 469024, "epoch": 5650} {"train_loss": -27.163110733032227, "global_step": 469025, "epoch": 5650} {"train_loss": -27.484888076782227, "global_step": 469026, "epoch": 5650} {"train_loss": -26.817419052124023, "global_step": 469027, "epoch": 5650} {"train_loss": -26.959104537963867, "global_step": 469028, "epoch": 5650} {"train_loss": -26.986835479736328, "global_step": 469029, "epoch": 5650} {"train_loss": -27.07568359375, "global_step": 469030, "epoch": 5650} {"train_loss": -26.996286392211914, "global_step": 469031, "epoch": 5650} {"train_loss": -27.160330393228186, "global_step": 469032, "epoch": 5650, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6661057.5} {"train_loss": -26.922266006469727, "global_step": 469033, "epoch": 5651} {"train_loss": -26.01228904724121, "global_step": 469034, "epoch": 5651} {"train_loss": -25.8602352142334, "global_step": 469035, "epoch": 5651} {"train_loss": -25.879348754882812, "global_step": 469036, "epoch": 5651} {"train_loss": -25.634628295898438, "global_step": 469037, "epoch": 5651} {"train_loss": -26.368392944335938, "global_step": 469038, "epoch": 5651} {"train_loss": -25.758710861206055, "global_step": 469039, "epoch": 5651} {"train_loss": -26.570356369018555, "global_step": 469040, "epoch": 5651} {"train_loss": -26.370487213134766, "global_step": 469041, "epoch": 5651} {"train_loss": -25.81591796875, "global_step": 469042, "epoch": 5651} {"train_loss": -26.462284088134766, "global_step": 469043, "epoch": 5651} {"train_loss": -25.61404800415039, "global_step": 469044, "epoch": 5651} {"train_loss": -26.691495895385742, "global_step": 469045, "epoch": 5651} {"train_loss": -26.501855850219727, "global_step": 469046, "epoch": 5651} {"train_loss": -26.262292861938477, "global_step": 469047, "epoch": 5651} {"train_loss": -26.351154327392578, "global_step": 469048, "epoch": 5651} {"train_loss": -26.269750595092773, "global_step": 469049, "epoch": 5651} {"train_loss": -26.5678768157959, "global_step": 469050, "epoch": 5651} {"train_loss": -27.138669967651367, "global_step": 469051, "epoch": 5651} {"train_loss": -26.691450119018555, "global_step": 469052, "epoch": 5651} {"train_loss": -26.777023315429688, "global_step": 469053, "epoch": 5651} {"train_loss": -26.7952938079834, "global_step": 469054, "epoch": 5651} {"train_loss": -26.590808868408203, "global_step": 469055, "epoch": 5651} {"train_loss": -26.768787384033203, "global_step": 469056, "epoch": 5651} {"train_loss": -26.658344268798828, "global_step": 469057, "epoch": 5651} {"train_loss": -26.8278865814209, "global_step": 469058, "epoch": 5651} {"train_loss": -26.825647354125977, "global_step": 469059, "epoch": 5651} {"train_loss": -26.858327865600586, "global_step": 469060, "epoch": 5651} {"train_loss": -26.808469772338867, "global_step": 469061, "epoch": 5651} {"train_loss": -27.053638458251953, "global_step": 469062, "epoch": 5651} {"train_loss": -27.388843536376953, "global_step": 469063, "epoch": 5651} {"train_loss": -27.059356689453125, "global_step": 469064, "epoch": 5651} {"train_loss": -27.227813720703125, "global_step": 469065, "epoch": 5651} {"train_loss": -26.925336837768555, "global_step": 469066, "epoch": 5651} {"train_loss": -27.016691207885742, "global_step": 469067, "epoch": 5651} {"train_loss": -27.243921279907227, "global_step": 469068, "epoch": 5651} {"train_loss": -26.816818237304688, "global_step": 469069, "epoch": 5651} {"train_loss": -27.264352798461914, "global_step": 469070, "epoch": 5651} {"train_loss": -27.368457794189453, "global_step": 469071, "epoch": 5651} {"train_loss": -27.38054847717285, "global_step": 469072, "epoch": 5651} {"train_loss": -27.22566032409668, "global_step": 469073, "epoch": 5651} {"train_loss": -27.211713790893555, "global_step": 469074, "epoch": 5651} {"train_loss": -27.0562686920166, "global_step": 469075, "epoch": 5651} {"train_loss": -27.10629653930664, "global_step": 469076, "epoch": 5651} {"train_loss": -26.76007080078125, "global_step": 469077, "epoch": 5651} {"train_loss": -27.220306396484375, "global_step": 469078, "epoch": 5651} {"train_loss": -27.091840744018555, "global_step": 469079, "epoch": 5651} {"train_loss": -26.977767944335938, "global_step": 469080, "epoch": 5651} {"train_loss": -27.434890747070312, "global_step": 469081, "epoch": 5651} {"train_loss": -27.037302017211914, "global_step": 469082, "epoch": 5651} {"train_loss": -26.998493194580078, "global_step": 469083, "epoch": 5651} {"train_loss": -26.655195236206055, "global_step": 469084, "epoch": 5651} {"train_loss": -27.33453941345215, "global_step": 469085, "epoch": 5651} {"train_loss": -26.96491813659668, "global_step": 469086, "epoch": 5651} {"train_loss": -27.052967071533203, "global_step": 469087, "epoch": 5651} {"train_loss": -26.905994415283203, "global_step": 469088, "epoch": 5651} {"train_loss": -27.33888053894043, "global_step": 469089, "epoch": 5651} {"train_loss": -27.11371421813965, "global_step": 469090, "epoch": 5651} {"train_loss": -27.264514923095703, "global_step": 469091, "epoch": 5651} {"train_loss": -27.181318283081055, "global_step": 469092, "epoch": 5651} {"train_loss": -27.112884521484375, "global_step": 469093, "epoch": 5651} {"train_loss": -26.95363426208496, "global_step": 469094, "epoch": 5651} {"train_loss": -27.31758689880371, "global_step": 469095, "epoch": 5651} {"train_loss": -27.323095321655273, "global_step": 469096, "epoch": 5651} {"train_loss": -26.960119247436523, "global_step": 469097, "epoch": 5651} {"train_loss": -27.52239990234375, "global_step": 469098, "epoch": 5651} {"train_loss": -27.1251277923584, "global_step": 469099, "epoch": 5651} {"train_loss": -27.044111251831055, "global_step": 469100, "epoch": 5651} {"train_loss": -27.190893173217773, "global_step": 469101, "epoch": 5651} {"train_loss": -27.444488525390625, "global_step": 469102, "epoch": 5651} {"train_loss": -27.380905151367188, "global_step": 469103, "epoch": 5651} {"train_loss": -27.181116104125977, "global_step": 469104, "epoch": 5651} {"train_loss": -27.107431411743164, "global_step": 469105, "epoch": 5651} {"train_loss": -27.14130973815918, "global_step": 469106, "epoch": 5651} {"train_loss": -27.57634925842285, "global_step": 469107, "epoch": 5651} {"train_loss": -27.479019165039062, "global_step": 469108, "epoch": 5651} {"train_loss": -27.31100845336914, "global_step": 469109, "epoch": 5651} {"train_loss": -27.452558517456055, "global_step": 469110, "epoch": 5651} {"train_loss": -27.515338897705078, "global_step": 469111, "epoch": 5651} {"train_loss": -27.473424911499023, "global_step": 469112, "epoch": 5651} {"train_loss": -27.4237060546875, "global_step": 469113, "epoch": 5651} {"train_loss": -27.151020050048828, "global_step": 469114, "epoch": 5651} {"train_loss": -26.935222074209925, "global_step": 469115, "epoch": 5651, "val_loss": 6711644.0} {"train_loss": -26.77911376953125, "global_step": 469116, "epoch": 5652} {"train_loss": -26.777555465698242, "global_step": 469117, "epoch": 5652} {"train_loss": -26.608642578125, "global_step": 469118, "epoch": 5652} {"train_loss": -26.712982177734375, "global_step": 469119, "epoch": 5652} {"train_loss": -26.88028335571289, "global_step": 469120, "epoch": 5652} {"train_loss": -27.150110244750977, "global_step": 469121, "epoch": 5652} {"train_loss": -26.93287467956543, "global_step": 469122, "epoch": 5652} {"train_loss": -26.889667510986328, "global_step": 469123, "epoch": 5652} {"train_loss": -25.786848068237305, "global_step": 469124, "epoch": 5652} {"train_loss": -25.842554092407227, "global_step": 469125, "epoch": 5652} {"train_loss": -26.621973037719727, "global_step": 469126, "epoch": 5652} {"train_loss": -26.529342651367188, "global_step": 469127, "epoch": 5652} {"train_loss": -26.264972686767578, "global_step": 469128, "epoch": 5652} {"train_loss": -26.88300895690918, "global_step": 469129, "epoch": 5652} {"train_loss": -26.352392196655273, "global_step": 469130, "epoch": 5652} {"train_loss": -26.83917808532715, "global_step": 469131, "epoch": 5652} {"train_loss": -26.802114486694336, "global_step": 469132, "epoch": 5652} {"train_loss": -26.4918270111084, "global_step": 469133, "epoch": 5652} {"train_loss": -27.082910537719727, "global_step": 469134, "epoch": 5652} {"train_loss": -26.780393600463867, "global_step": 469135, "epoch": 5652} {"train_loss": -26.8402156829834, "global_step": 469136, "epoch": 5652} {"train_loss": -27.388111114501953, "global_step": 469137, "epoch": 5652} {"train_loss": -26.780359268188477, "global_step": 469138, "epoch": 5652} {"train_loss": -26.93973731994629, "global_step": 469139, "epoch": 5652} {"train_loss": -27.091089248657227, "global_step": 469140, "epoch": 5652} {"train_loss": -26.42637062072754, "global_step": 469141, "epoch": 5652} {"train_loss": -27.231159210205078, "global_step": 469142, "epoch": 5652} {"train_loss": -26.66053581237793, "global_step": 469143, "epoch": 5652} {"train_loss": -27.202016830444336, "global_step": 469144, "epoch": 5652} {"train_loss": -26.614965438842773, "global_step": 469145, "epoch": 5652} {"train_loss": -27.026081085205078, "global_step": 469146, "epoch": 5652} {"train_loss": -27.000152587890625, "global_step": 469147, "epoch": 5652} {"train_loss": -27.373859405517578, "global_step": 469148, "epoch": 5652} {"train_loss": -26.988727569580078, "global_step": 469149, "epoch": 5652} {"train_loss": -26.917469024658203, "global_step": 469150, "epoch": 5652} {"train_loss": -27.034942626953125, "global_step": 469151, "epoch": 5652} {"train_loss": -26.900293350219727, "global_step": 469152, "epoch": 5652} {"train_loss": -27.44337272644043, "global_step": 469153, "epoch": 5652} {"train_loss": -27.731332778930664, "global_step": 469154, "epoch": 5652} {"train_loss": -27.09259605407715, "global_step": 469155, "epoch": 5652} {"train_loss": -27.140522003173828, "global_step": 469156, "epoch": 5652} {"train_loss": -27.331735610961914, "global_step": 469157, "epoch": 5652} {"train_loss": -27.14689064025879, "global_step": 469158, "epoch": 5652} {"train_loss": -26.716047286987305, "global_step": 469159, "epoch": 5652} {"train_loss": -26.044906616210938, "global_step": 469160, "epoch": 5652} {"train_loss": -25.220144271850586, "global_step": 469161, "epoch": 5652} {"train_loss": -25.84321403503418, "global_step": 469162, "epoch": 5652} {"train_loss": -26.912458419799805, "global_step": 469163, "epoch": 5652} {"train_loss": -26.551115036010742, "global_step": 469164, "epoch": 5652} {"train_loss": -27.013914108276367, "global_step": 469165, "epoch": 5652} {"train_loss": -26.778644561767578, "global_step": 469166, "epoch": 5652} {"train_loss": -27.584823608398438, "global_step": 469167, "epoch": 5652} {"train_loss": -26.830917358398438, "global_step": 469168, "epoch": 5652} {"train_loss": -26.449909210205078, "global_step": 469169, "epoch": 5652} {"train_loss": -27.006824493408203, "global_step": 469170, "epoch": 5652} {"train_loss": -26.8160400390625, "global_step": 469171, "epoch": 5652} {"train_loss": -26.899450302124023, "global_step": 469172, "epoch": 5652} {"train_loss": -26.977365493774414, "global_step": 469173, "epoch": 5652} {"train_loss": -26.801355361938477, "global_step": 469174, "epoch": 5652} {"train_loss": -27.088058471679688, "global_step": 469175, "epoch": 5652} {"train_loss": -26.876745223999023, "global_step": 469176, "epoch": 5652} {"train_loss": -27.057592391967773, "global_step": 469177, "epoch": 5652} {"train_loss": -27.271041870117188, "global_step": 469178, "epoch": 5652} {"train_loss": -27.236865997314453, "global_step": 469179, "epoch": 5652} {"train_loss": -27.28750991821289, "global_step": 469180, "epoch": 5652} {"train_loss": -26.970489501953125, "global_step": 469181, "epoch": 5652} {"train_loss": -27.084796905517578, "global_step": 469182, "epoch": 5652} {"train_loss": -26.70916175842285, "global_step": 469183, "epoch": 5652} {"train_loss": -27.109210968017578, "global_step": 469184, "epoch": 5652} {"train_loss": -26.93886375427246, "global_step": 469185, "epoch": 5652} {"train_loss": -27.212427139282227, "global_step": 469186, "epoch": 5652} {"train_loss": -27.316669464111328, "global_step": 469187, "epoch": 5652} {"train_loss": -26.6529483795166, "global_step": 469188, "epoch": 5652} {"train_loss": -27.00349235534668, "global_step": 469189, "epoch": 5652} {"train_loss": -26.92642593383789, "global_step": 469190, "epoch": 5652} {"train_loss": -27.049169540405273, "global_step": 469191, "epoch": 5652} {"train_loss": -27.033044815063477, "global_step": 469192, "epoch": 5652} {"train_loss": -26.913360595703125, "global_step": 469193, "epoch": 5652} {"train_loss": -26.874500274658203, "global_step": 469194, "epoch": 5652} {"train_loss": -27.100341796875, "global_step": 469195, "epoch": 5652} {"train_loss": -26.989065170288086, "global_step": 469196, "epoch": 5652} {"train_loss": -27.039453506469727, "global_step": 469197, "epoch": 5652} {"train_loss": -26.866781326661627, "global_step": 469198, "epoch": 5652, "val_loss": 6678485.0} {"train_loss": -26.928735733032227, "global_step": 469199, "epoch": 5653} {"train_loss": -27.068445205688477, "global_step": 469200, "epoch": 5653} {"train_loss": -26.9007625579834, "global_step": 469201, "epoch": 5653} {"train_loss": -27.1279239654541, "global_step": 469202, "epoch": 5653} {"train_loss": -26.884632110595703, "global_step": 469203, "epoch": 5653} {"train_loss": -27.0478572845459, "global_step": 469204, "epoch": 5653} {"train_loss": -26.609546661376953, "global_step": 469205, "epoch": 5653} {"train_loss": -26.913129806518555, "global_step": 469206, "epoch": 5653} {"train_loss": -26.851318359375, "global_step": 469207, "epoch": 5653} {"train_loss": -26.6699275970459, "global_step": 469208, "epoch": 5653} {"train_loss": -27.471179962158203, "global_step": 469209, "epoch": 5653} {"train_loss": -26.74546241760254, "global_step": 469210, "epoch": 5653} {"train_loss": -26.96925163269043, "global_step": 469211, "epoch": 5653} {"train_loss": -26.73819923400879, "global_step": 469212, "epoch": 5653} {"train_loss": -26.850324630737305, "global_step": 469213, "epoch": 5653} {"train_loss": -26.781402587890625, "global_step": 469214, "epoch": 5653} {"train_loss": -26.807214736938477, "global_step": 469215, "epoch": 5653} {"train_loss": -27.013044357299805, "global_step": 469216, "epoch": 5653} {"train_loss": -27.348127365112305, "global_step": 469217, "epoch": 5653} {"train_loss": -27.1004695892334, "global_step": 469218, "epoch": 5653} {"train_loss": -27.15228271484375, "global_step": 469219, "epoch": 5653} {"train_loss": -26.9102725982666, "global_step": 469220, "epoch": 5653} {"train_loss": -27.125410079956055, "global_step": 469221, "epoch": 5653} {"train_loss": -27.014373779296875, "global_step": 469222, "epoch": 5653} {"train_loss": -26.569721221923828, "global_step": 469223, "epoch": 5653} {"train_loss": -27.034759521484375, "global_step": 469224, "epoch": 5653} {"train_loss": -27.114545822143555, "global_step": 469225, "epoch": 5653} {"train_loss": -26.87491226196289, "global_step": 469226, "epoch": 5653} {"train_loss": -26.644155502319336, "global_step": 469227, "epoch": 5653} {"train_loss": -27.22159194946289, "global_step": 469228, "epoch": 5653} {"train_loss": -27.08619499206543, "global_step": 469229, "epoch": 5653} {"train_loss": -26.824573516845703, "global_step": 469230, "epoch": 5653} {"train_loss": -27.048498153686523, "global_step": 469231, "epoch": 5653} {"train_loss": -27.076141357421875, "global_step": 469232, "epoch": 5653} {"train_loss": -27.3623046875, "global_step": 469233, "epoch": 5653} {"train_loss": -27.187671661376953, "global_step": 469234, "epoch": 5653} {"train_loss": -26.969717025756836, "global_step": 469235, "epoch": 5653} {"train_loss": -27.111433029174805, "global_step": 469236, "epoch": 5653} {"train_loss": -27.265399932861328, "global_step": 469237, "epoch": 5653} {"train_loss": -27.116256713867188, "global_step": 469238, "epoch": 5653} {"train_loss": -27.165557861328125, "global_step": 469239, "epoch": 5653} {"train_loss": -27.238672256469727, "global_step": 469240, "epoch": 5653} {"train_loss": -27.030776977539062, "global_step": 469241, "epoch": 5653} {"train_loss": -27.299835205078125, "global_step": 469242, "epoch": 5653} {"train_loss": -27.35126304626465, "global_step": 469243, "epoch": 5653} {"train_loss": -27.074920654296875, "global_step": 469244, "epoch": 5653} {"train_loss": -26.954191207885742, "global_step": 469245, "epoch": 5653} {"train_loss": -27.26692008972168, "global_step": 469246, "epoch": 5653} {"train_loss": -27.250492095947266, "global_step": 469247, "epoch": 5653} {"train_loss": -27.193790435791016, "global_step": 469248, "epoch": 5653} {"train_loss": -27.454450607299805, "global_step": 469249, "epoch": 5653} {"train_loss": -27.458179473876953, "global_step": 469250, "epoch": 5653} {"train_loss": -27.36260414123535, "global_step": 469251, "epoch": 5653} {"train_loss": -26.99372673034668, "global_step": 469252, "epoch": 5653} {"train_loss": -27.153915405273438, "global_step": 469253, "epoch": 5653} {"train_loss": -27.517683029174805, "global_step": 469254, "epoch": 5653} {"train_loss": -27.222654342651367, "global_step": 469255, "epoch": 5653} {"train_loss": -27.299264907836914, "global_step": 469256, "epoch": 5653} {"train_loss": -27.273670196533203, "global_step": 469257, "epoch": 5653} {"train_loss": -27.18641471862793, "global_step": 469258, "epoch": 5653} {"train_loss": -27.264312744140625, "global_step": 469259, "epoch": 5653} {"train_loss": -27.449787139892578, "global_step": 469260, "epoch": 5653} {"train_loss": -27.309921264648438, "global_step": 469261, "epoch": 5653} {"train_loss": -27.04998207092285, "global_step": 469262, "epoch": 5653} {"train_loss": -27.151519775390625, "global_step": 469263, "epoch": 5653} {"train_loss": -26.999719619750977, "global_step": 469264, "epoch": 5653} {"train_loss": -27.5992488861084, "global_step": 469265, "epoch": 5653} {"train_loss": -27.407611846923828, "global_step": 469266, "epoch": 5653} {"train_loss": -27.831146240234375, "global_step": 469267, "epoch": 5653} {"train_loss": -27.246448516845703, "global_step": 469268, "epoch": 5653} {"train_loss": -27.26287269592285, "global_step": 469269, "epoch": 5653} {"train_loss": -27.321134567260742, "global_step": 469270, "epoch": 5653} {"train_loss": -27.112869262695312, "global_step": 469271, "epoch": 5653} {"train_loss": -27.315887451171875, "global_step": 469272, "epoch": 5653} {"train_loss": -27.04153823852539, "global_step": 469273, "epoch": 5653} {"train_loss": -27.12717056274414, "global_step": 469274, "epoch": 5653} {"train_loss": -27.37337303161621, "global_step": 469275, "epoch": 5653} {"train_loss": -27.164831161499023, "global_step": 469276, "epoch": 5653} {"train_loss": -27.069299697875977, "global_step": 469277, "epoch": 5653} {"train_loss": -27.323694229125977, "global_step": 469278, "epoch": 5653} {"train_loss": -27.372228622436523, "global_step": 469279, "epoch": 5653} {"train_loss": -27.16656494140625, "global_step": 469280, "epoch": 5653} {"train_loss": -27.125660632030073, "global_step": 469281, "epoch": 5653, "val_loss": 6538403.5} {"train_loss": -25.89243507385254, "global_step": 469282, "epoch": 5654} {"train_loss": -26.757740020751953, "global_step": 469283, "epoch": 5654} {"train_loss": -26.835580825805664, "global_step": 469284, "epoch": 5654} {"train_loss": -27.0815372467041, "global_step": 469285, "epoch": 5654} {"train_loss": -26.564233779907227, "global_step": 469286, "epoch": 5654} {"train_loss": -26.532751083374023, "global_step": 469287, "epoch": 5654} {"train_loss": -26.665979385375977, "global_step": 469288, "epoch": 5654} {"train_loss": -26.377897262573242, "global_step": 469289, "epoch": 5654} {"train_loss": -26.940107345581055, "global_step": 469290, "epoch": 5654} {"train_loss": -26.607563018798828, "global_step": 469291, "epoch": 5654} {"train_loss": -26.79123878479004, "global_step": 469292, "epoch": 5654} {"train_loss": -26.971128463745117, "global_step": 469293, "epoch": 5654} {"train_loss": -26.449951171875, "global_step": 469294, "epoch": 5654} {"train_loss": -27.02947998046875, "global_step": 469295, "epoch": 5654} {"train_loss": -27.16748046875, "global_step": 469296, "epoch": 5654} {"train_loss": -27.1010799407959, "global_step": 469297, "epoch": 5654} {"train_loss": -27.022018432617188, "global_step": 469298, "epoch": 5654} {"train_loss": -27.0322265625, "global_step": 469299, "epoch": 5654} {"train_loss": -26.998157501220703, "global_step": 469300, "epoch": 5654} {"train_loss": -27.16546058654785, "global_step": 469301, "epoch": 5654} {"train_loss": -27.0148983001709, "global_step": 469302, "epoch": 5654} {"train_loss": -26.791324615478516, "global_step": 469303, "epoch": 5654} {"train_loss": -27.076623916625977, "global_step": 469304, "epoch": 5654} {"train_loss": -26.804401397705078, "global_step": 469305, "epoch": 5654} {"train_loss": -27.483884811401367, "global_step": 469306, "epoch": 5654} {"train_loss": -26.982776641845703, "global_step": 469307, "epoch": 5654} {"train_loss": -27.496789932250977, "global_step": 469308, "epoch": 5654} {"train_loss": -27.25214958190918, "global_step": 469309, "epoch": 5654} {"train_loss": -27.30750846862793, "global_step": 469310, "epoch": 5654} {"train_loss": -27.10917091369629, "global_step": 469311, "epoch": 5654} {"train_loss": -26.92350196838379, "global_step": 469312, "epoch": 5654} {"train_loss": -27.008777618408203, "global_step": 469313, "epoch": 5654} {"train_loss": -26.93393898010254, "global_step": 469314, "epoch": 5654} {"train_loss": -27.26140785217285, "global_step": 469315, "epoch": 5654} {"train_loss": -27.57269859313965, "global_step": 469316, "epoch": 5654} {"train_loss": -27.411890029907227, "global_step": 469317, "epoch": 5654} {"train_loss": -27.4445858001709, "global_step": 469318, "epoch": 5654} {"train_loss": -27.112396240234375, "global_step": 469319, "epoch": 5654} {"train_loss": -27.506315231323242, "global_step": 469320, "epoch": 5654} {"train_loss": -27.19752311706543, "global_step": 469321, "epoch": 5654} {"train_loss": -27.081907272338867, "global_step": 469322, "epoch": 5654} {"train_loss": -26.72287368774414, "global_step": 469323, "epoch": 5654} {"train_loss": -27.170644760131836, "global_step": 469324, "epoch": 5654} {"train_loss": -27.265655517578125, "global_step": 469325, "epoch": 5654} {"train_loss": -27.02874183654785, "global_step": 469326, "epoch": 5654} {"train_loss": -27.238393783569336, "global_step": 469327, "epoch": 5654} {"train_loss": -26.957611083984375, "global_step": 469328, "epoch": 5654} {"train_loss": -27.660160064697266, "global_step": 469329, "epoch": 5654} {"train_loss": -27.593297958374023, "global_step": 469330, "epoch": 5654} {"train_loss": -27.263629913330078, "global_step": 469331, "epoch": 5654} {"train_loss": -27.532392501831055, "global_step": 469332, "epoch": 5654} {"train_loss": -27.127241134643555, "global_step": 469333, "epoch": 5654} {"train_loss": -26.581134796142578, "global_step": 469334, "epoch": 5654} {"train_loss": -26.870397567749023, "global_step": 469335, "epoch": 5654} {"train_loss": -26.776935577392578, "global_step": 469336, "epoch": 5654} {"train_loss": -26.878332138061523, "global_step": 469337, "epoch": 5654} {"train_loss": -27.478418350219727, "global_step": 469338, "epoch": 5654} {"train_loss": -27.1471004486084, "global_step": 469339, "epoch": 5654} {"train_loss": -27.436786651611328, "global_step": 469340, "epoch": 5654} {"train_loss": -27.317047119140625, "global_step": 469341, "epoch": 5654} {"train_loss": -26.894880294799805, "global_step": 469342, "epoch": 5654} {"train_loss": -27.09467124938965, "global_step": 469343, "epoch": 5654} {"train_loss": -27.1462345123291, "global_step": 469344, "epoch": 5654} {"train_loss": -27.257339477539062, "global_step": 469345, "epoch": 5654} {"train_loss": -27.233137130737305, "global_step": 469346, "epoch": 5654} {"train_loss": -27.0932674407959, "global_step": 469347, "epoch": 5654} {"train_loss": -26.6223087310791, "global_step": 469348, "epoch": 5654} {"train_loss": -27.229467391967773, "global_step": 469349, "epoch": 5654} {"train_loss": -27.13641357421875, "global_step": 469350, "epoch": 5654} {"train_loss": -26.45263671875, "global_step": 469351, "epoch": 5654} {"train_loss": -26.402313232421875, "global_step": 469352, "epoch": 5654} {"train_loss": -27.149032592773438, "global_step": 469353, "epoch": 5654} {"train_loss": -27.088476181030273, "global_step": 469354, "epoch": 5654} {"train_loss": -26.582813262939453, "global_step": 469355, "epoch": 5654} {"train_loss": -26.890954971313477, "global_step": 469356, "epoch": 5654} {"train_loss": -27.4104061126709, "global_step": 469357, "epoch": 5654} {"train_loss": -26.71054458618164, "global_step": 469358, "epoch": 5654} {"train_loss": -27.014373779296875, "global_step": 469359, "epoch": 5654} {"train_loss": -27.10150718688965, "global_step": 469360, "epoch": 5654} {"train_loss": -26.55756187438965, "global_step": 469361, "epoch": 5654} {"train_loss": -26.72311782836914, "global_step": 469362, "epoch": 5654} {"train_loss": -26.837766647338867, "global_step": 469363, "epoch": 5654} {"train_loss": -27.022200228220008, "global_step": 469364, "epoch": 5654, "val_loss": 6674719.5} {"train_loss": -26.8309383392334, "global_step": 469365, "epoch": 5655} {"train_loss": -26.433094024658203, "global_step": 469366, "epoch": 5655} {"train_loss": -26.148603439331055, "global_step": 469367, "epoch": 5655} {"train_loss": -26.62910270690918, "global_step": 469368, "epoch": 5655} {"train_loss": -26.203369140625, "global_step": 469369, "epoch": 5655} {"train_loss": -26.380136489868164, "global_step": 469370, "epoch": 5655} {"train_loss": -26.791975021362305, "global_step": 469371, "epoch": 5655} {"train_loss": -26.91912269592285, "global_step": 469372, "epoch": 5655} {"train_loss": -27.1177978515625, "global_step": 469373, "epoch": 5655} {"train_loss": -26.949359893798828, "global_step": 469374, "epoch": 5655} {"train_loss": -27.0031681060791, "global_step": 469375, "epoch": 5655} {"train_loss": -27.04608726501465, "global_step": 469376, "epoch": 5655} {"train_loss": -27.00933837890625, "global_step": 469377, "epoch": 5655} {"train_loss": -27.27193260192871, "global_step": 469378, "epoch": 5655} {"train_loss": -27.25301170349121, "global_step": 469379, "epoch": 5655} {"train_loss": -27.10091209411621, "global_step": 469380, "epoch": 5655} {"train_loss": -27.108713150024414, "global_step": 469381, "epoch": 5655} {"train_loss": -27.3160343170166, "global_step": 469382, "epoch": 5655} {"train_loss": -27.29182243347168, "global_step": 469383, "epoch": 5655} {"train_loss": -27.192474365234375, "global_step": 469384, "epoch": 5655} {"train_loss": -27.35418128967285, "global_step": 469385, "epoch": 5655} {"train_loss": -27.188196182250977, "global_step": 469386, "epoch": 5655} {"train_loss": -27.249420166015625, "global_step": 469387, "epoch": 5655} {"train_loss": -26.935840606689453, "global_step": 469388, "epoch": 5655} {"train_loss": -27.331708908081055, "global_step": 469389, "epoch": 5655} {"train_loss": -27.58981704711914, "global_step": 469390, "epoch": 5655} {"train_loss": -27.283435821533203, "global_step": 469391, "epoch": 5655} {"train_loss": -26.898313522338867, "global_step": 469392, "epoch": 5655} {"train_loss": -27.2020263671875, "global_step": 469393, "epoch": 5655} {"train_loss": -27.394025802612305, "global_step": 469394, "epoch": 5655} {"train_loss": -27.408370971679688, "global_step": 469395, "epoch": 5655} {"train_loss": -27.3337459564209, "global_step": 469396, "epoch": 5655} {"train_loss": -27.103666305541992, "global_step": 469397, "epoch": 5655} {"train_loss": -27.232559204101562, "global_step": 469398, "epoch": 5655} {"train_loss": -27.570337295532227, "global_step": 469399, "epoch": 5655} {"train_loss": -27.4417724609375, "global_step": 469400, "epoch": 5655} {"train_loss": -27.4147891998291, "global_step": 469401, "epoch": 5655} {"train_loss": -27.55939292907715, "global_step": 469402, "epoch": 5655} {"train_loss": -27.549283981323242, "global_step": 469403, "epoch": 5655} {"train_loss": -26.934223175048828, "global_step": 469404, "epoch": 5655} {"train_loss": -27.161413192749023, "global_step": 469405, "epoch": 5655} {"train_loss": -27.35406494140625, "global_step": 469406, "epoch": 5655} {"train_loss": -27.25581169128418, "global_step": 469407, "epoch": 5655} {"train_loss": -27.337787628173828, "global_step": 469408, "epoch": 5655} {"train_loss": -27.322797775268555, "global_step": 469409, "epoch": 5655} {"train_loss": -27.117340087890625, "global_step": 469410, "epoch": 5655} {"train_loss": -27.068750381469727, "global_step": 469411, "epoch": 5655} {"train_loss": -27.0322208404541, "global_step": 469412, "epoch": 5655} {"train_loss": -27.211685180664062, "global_step": 469413, "epoch": 5655} {"train_loss": -26.9995059967041, "global_step": 469414, "epoch": 5655} {"train_loss": -27.20432472229004, "global_step": 469415, "epoch": 5655} {"train_loss": -27.36686134338379, "global_step": 469416, "epoch": 5655} {"train_loss": -27.383615493774414, "global_step": 469417, "epoch": 5655} {"train_loss": -27.076889038085938, "global_step": 469418, "epoch": 5655} {"train_loss": -27.111722946166992, "global_step": 469419, "epoch": 5655} {"train_loss": -26.950531005859375, "global_step": 469420, "epoch": 5655} {"train_loss": -27.1464786529541, "global_step": 469421, "epoch": 5655} {"train_loss": -27.268939971923828, "global_step": 469422, "epoch": 5655} {"train_loss": -27.435867309570312, "global_step": 469423, "epoch": 5655} {"train_loss": -27.324193954467773, "global_step": 469424, "epoch": 5655} {"train_loss": -27.216577529907227, "global_step": 469425, "epoch": 5655} {"train_loss": -27.23958396911621, "global_step": 469426, "epoch": 5655} {"train_loss": -27.05841064453125, "global_step": 469427, "epoch": 5655} {"train_loss": -27.380369186401367, "global_step": 469428, "epoch": 5655} {"train_loss": -27.450326919555664, "global_step": 469429, "epoch": 5655} {"train_loss": -27.199005126953125, "global_step": 469430, "epoch": 5655} {"train_loss": -26.903305053710938, "global_step": 469431, "epoch": 5655} {"train_loss": -27.032629013061523, "global_step": 469432, "epoch": 5655} {"train_loss": -26.94281578063965, "global_step": 469433, "epoch": 5655} {"train_loss": -27.40464210510254, "global_step": 469434, "epoch": 5655} {"train_loss": -26.95701026916504, "global_step": 469435, "epoch": 5655} {"train_loss": -26.77947425842285, "global_step": 469436, "epoch": 5655} {"train_loss": -26.95887565612793, "global_step": 469437, "epoch": 5655} {"train_loss": -27.385950088500977, "global_step": 469438, "epoch": 5655} {"train_loss": -27.383787155151367, "global_step": 469439, "epoch": 5655} {"train_loss": -27.3818302154541, "global_step": 469440, "epoch": 5655} {"train_loss": -27.176599502563477, "global_step": 469441, "epoch": 5655} {"train_loss": -27.252721786499023, "global_step": 469442, "epoch": 5655} {"train_loss": -27.50555992126465, "global_step": 469443, "epoch": 5655} {"train_loss": -27.42513084411621, "global_step": 469444, "epoch": 5655} {"train_loss": -26.98443603515625, "global_step": 469445, "epoch": 5655} {"train_loss": -26.976476669311523, "global_step": 469446, "epoch": 5655} {"train_loss": -27.13784367205149, "global_step": 469447, "epoch": 5655, "val_loss": 6690335.5} {"train_loss": -26.76519775390625, "global_step": 469448, "epoch": 5656} {"train_loss": -26.518890380859375, "global_step": 469449, "epoch": 5656} {"train_loss": -26.0894718170166, "global_step": 469450, "epoch": 5656} {"train_loss": -26.13154411315918, "global_step": 469451, "epoch": 5656} {"train_loss": -27.15069580078125, "global_step": 469452, "epoch": 5656} {"train_loss": -26.739118576049805, "global_step": 469453, "epoch": 5656} {"train_loss": -26.942808151245117, "global_step": 469454, "epoch": 5656} {"train_loss": -26.94837760925293, "global_step": 469455, "epoch": 5656} {"train_loss": -26.64886474609375, "global_step": 469456, "epoch": 5656} {"train_loss": -26.585180282592773, "global_step": 469457, "epoch": 5656} {"train_loss": -26.6488094329834, "global_step": 469458, "epoch": 5656} {"train_loss": -26.9908504486084, "global_step": 469459, "epoch": 5656} {"train_loss": -26.979217529296875, "global_step": 469460, "epoch": 5656} {"train_loss": -26.705097198486328, "global_step": 469461, "epoch": 5656} {"train_loss": -27.015853881835938, "global_step": 469462, "epoch": 5656} {"train_loss": -26.849079132080078, "global_step": 469463, "epoch": 5656} {"train_loss": -27.137250900268555, "global_step": 469464, "epoch": 5656} {"train_loss": -27.090662002563477, "global_step": 469465, "epoch": 5656} {"train_loss": -27.12628173828125, "global_step": 469466, "epoch": 5656} {"train_loss": -27.05781364440918, "global_step": 469467, "epoch": 5656} {"train_loss": -26.92365837097168, "global_step": 469468, "epoch": 5656} {"train_loss": -26.9161376953125, "global_step": 469469, "epoch": 5656} {"train_loss": -27.189178466796875, "global_step": 469470, "epoch": 5656} {"train_loss": -26.814483642578125, "global_step": 469471, "epoch": 5656} {"train_loss": -27.448211669921875, "global_step": 469472, "epoch": 5656} {"train_loss": -27.371713638305664, "global_step": 469473, "epoch": 5656} {"train_loss": -27.1102237701416, "global_step": 469474, "epoch": 5656} {"train_loss": -27.35047721862793, "global_step": 469475, "epoch": 5656} {"train_loss": -27.348663330078125, "global_step": 469476, "epoch": 5656} {"train_loss": -27.207319259643555, "global_step": 469477, "epoch": 5656} {"train_loss": -27.08790397644043, "global_step": 469478, "epoch": 5656} {"train_loss": -27.08255958557129, "global_step": 469479, "epoch": 5656} {"train_loss": -27.207122802734375, "global_step": 469480, "epoch": 5656} {"train_loss": -26.967626571655273, "global_step": 469481, "epoch": 5656} {"train_loss": -27.0201473236084, "global_step": 469482, "epoch": 5656} {"train_loss": -27.124242782592773, "global_step": 469483, "epoch": 5656} {"train_loss": -26.883441925048828, "global_step": 469484, "epoch": 5656} {"train_loss": -27.205896377563477, "global_step": 469485, "epoch": 5656} {"train_loss": -27.26788330078125, "global_step": 469486, "epoch": 5656} {"train_loss": -27.2523136138916, "global_step": 469487, "epoch": 5656} {"train_loss": -26.982995986938477, "global_step": 469488, "epoch": 5656} {"train_loss": -27.510114669799805, "global_step": 469489, "epoch": 5656} {"train_loss": -27.037973403930664, "global_step": 469490, "epoch": 5656} {"train_loss": -27.293142318725586, "global_step": 469491, "epoch": 5656} {"train_loss": -27.451934814453125, "global_step": 469492, "epoch": 5656} {"train_loss": -26.923389434814453, "global_step": 469493, "epoch": 5656} {"train_loss": -27.29831314086914, "global_step": 469494, "epoch": 5656} {"train_loss": -27.433835983276367, "global_step": 469495, "epoch": 5656} {"train_loss": -27.145776748657227, "global_step": 469496, "epoch": 5656} {"train_loss": -26.941650390625, "global_step": 469497, "epoch": 5656} {"train_loss": -26.785078048706055, "global_step": 469498, "epoch": 5656} {"train_loss": -27.075565338134766, "global_step": 469499, "epoch": 5656} {"train_loss": -27.02583885192871, "global_step": 469500, "epoch": 5656} {"train_loss": -27.086652755737305, "global_step": 469501, "epoch": 5656} {"train_loss": -26.974287033081055, "global_step": 469502, "epoch": 5656} {"train_loss": -27.094003677368164, "global_step": 469503, "epoch": 5656} {"train_loss": -27.15802574157715, "global_step": 469504, "epoch": 5656} {"train_loss": -27.006332397460938, "global_step": 469505, "epoch": 5656} {"train_loss": -26.44525146484375, "global_step": 469506, "epoch": 5656} {"train_loss": -27.096731185913086, "global_step": 469507, "epoch": 5656} {"train_loss": -27.49397850036621, "global_step": 469508, "epoch": 5656} {"train_loss": -26.861026763916016, "global_step": 469509, "epoch": 5656} {"train_loss": -26.746856689453125, "global_step": 469510, "epoch": 5656} {"train_loss": -27.635334014892578, "global_step": 469511, "epoch": 5656} {"train_loss": -26.933225631713867, "global_step": 469512, "epoch": 5656} {"train_loss": -26.886770248413086, "global_step": 469513, "epoch": 5656} {"train_loss": -27.325902938842773, "global_step": 469514, "epoch": 5656} {"train_loss": -26.96884536743164, "global_step": 469515, "epoch": 5656} {"train_loss": -27.159656524658203, "global_step": 469516, "epoch": 5656} {"train_loss": -27.0683536529541, "global_step": 469517, "epoch": 5656} {"train_loss": -27.333072662353516, "global_step": 469518, "epoch": 5656} {"train_loss": -26.933130264282227, "global_step": 469519, "epoch": 5656} {"train_loss": -27.48341178894043, "global_step": 469520, "epoch": 5656} {"train_loss": -27.281299591064453, "global_step": 469521, "epoch": 5656} {"train_loss": -26.984516143798828, "global_step": 469522, "epoch": 5656} {"train_loss": -26.866758346557617, "global_step": 469523, "epoch": 5656} {"train_loss": -27.00067138671875, "global_step": 469524, "epoch": 5656} {"train_loss": -27.15363883972168, "global_step": 469525, "epoch": 5656} {"train_loss": -27.059326171875, "global_step": 469526, "epoch": 5656} {"train_loss": -27.302936553955078, "global_step": 469527, "epoch": 5656} {"train_loss": -26.70908546447754, "global_step": 469528, "epoch": 5656} {"train_loss": -27.385663986206055, "global_step": 469529, "epoch": 5656} {"train_loss": -27.042172489396062, "global_step": 469530, "epoch": 5656, "val_loss": 6728431.5} {"train_loss": -26.67670249938965, "global_step": 469531, "epoch": 5657} {"train_loss": -26.64900779724121, "global_step": 469532, "epoch": 5657} {"train_loss": -26.72406578063965, "global_step": 469533, "epoch": 5657} {"train_loss": -26.50044059753418, "global_step": 469534, "epoch": 5657} {"train_loss": -26.333011627197266, "global_step": 469535, "epoch": 5657} {"train_loss": -26.565338134765625, "global_step": 469536, "epoch": 5657} {"train_loss": -26.65180778503418, "global_step": 469537, "epoch": 5657} {"train_loss": -26.468717575073242, "global_step": 469538, "epoch": 5657} {"train_loss": -26.623371124267578, "global_step": 469539, "epoch": 5657} {"train_loss": -26.649463653564453, "global_step": 469540, "epoch": 5657} {"train_loss": -26.347537994384766, "global_step": 469541, "epoch": 5657} {"train_loss": -26.528430938720703, "global_step": 469542, "epoch": 5657} {"train_loss": -26.932514190673828, "global_step": 469543, "epoch": 5657} {"train_loss": -26.751794815063477, "global_step": 469544, "epoch": 5657} {"train_loss": -27.213232040405273, "global_step": 469545, "epoch": 5657} {"train_loss": -26.291732788085938, "global_step": 469546, "epoch": 5657} {"train_loss": -26.594446182250977, "global_step": 469547, "epoch": 5657} {"train_loss": -27.115934371948242, "global_step": 469548, "epoch": 5657} {"train_loss": -27.037195205688477, "global_step": 469549, "epoch": 5657} {"train_loss": -27.187612533569336, "global_step": 469550, "epoch": 5657} {"train_loss": -26.589282989501953, "global_step": 469551, "epoch": 5657} {"train_loss": -27.297964096069336, "global_step": 469552, "epoch": 5657} {"train_loss": -26.875356674194336, "global_step": 469553, "epoch": 5657} {"train_loss": -26.955541610717773, "global_step": 469554, "epoch": 5657} {"train_loss": -27.136194229125977, "global_step": 469555, "epoch": 5657} {"train_loss": -26.811359405517578, "global_step": 469556, "epoch": 5657} {"train_loss": -26.788715362548828, "global_step": 469557, "epoch": 5657} {"train_loss": -27.31549644470215, "global_step": 469558, "epoch": 5657} {"train_loss": -27.25459861755371, "global_step": 469559, "epoch": 5657} {"train_loss": -27.205474853515625, "global_step": 469560, "epoch": 5657} {"train_loss": -27.253263473510742, "global_step": 469561, "epoch": 5657} {"train_loss": -27.474414825439453, "global_step": 469562, "epoch": 5657} {"train_loss": -26.99686050415039, "global_step": 469563, "epoch": 5657} {"train_loss": -27.707233428955078, "global_step": 469564, "epoch": 5657} {"train_loss": -27.472980499267578, "global_step": 469565, "epoch": 5657} {"train_loss": -27.114103317260742, "global_step": 469566, "epoch": 5657} {"train_loss": -26.945287704467773, "global_step": 469567, "epoch": 5657} {"train_loss": -27.260412216186523, "global_step": 469568, "epoch": 5657} {"train_loss": -26.975666046142578, "global_step": 469569, "epoch": 5657} {"train_loss": -27.14156150817871, "global_step": 469570, "epoch": 5657} {"train_loss": -27.456003189086914, "global_step": 469571, "epoch": 5657} {"train_loss": -27.307538986206055, "global_step": 469572, "epoch": 5657} {"train_loss": -27.229833602905273, "global_step": 469573, "epoch": 5657} {"train_loss": -26.963027954101562, "global_step": 469574, "epoch": 5657} {"train_loss": -27.153348922729492, "global_step": 469575, "epoch": 5657} {"train_loss": -27.301740646362305, "global_step": 469576, "epoch": 5657} {"train_loss": -27.318140029907227, "global_step": 469577, "epoch": 5657} {"train_loss": -27.175521850585938, "global_step": 469578, "epoch": 5657} {"train_loss": -27.658905029296875, "global_step": 469579, "epoch": 5657} {"train_loss": -27.101285934448242, "global_step": 469580, "epoch": 5657} {"train_loss": -26.816099166870117, "global_step": 469581, "epoch": 5657} {"train_loss": -27.121496200561523, "global_step": 469582, "epoch": 5657} {"train_loss": -27.236677169799805, "global_step": 469583, "epoch": 5657} {"train_loss": -27.243581771850586, "global_step": 469584, "epoch": 5657} {"train_loss": -26.841760635375977, "global_step": 469585, "epoch": 5657} {"train_loss": -27.296350479125977, "global_step": 469586, "epoch": 5657} {"train_loss": -27.228137969970703, "global_step": 469587, "epoch": 5657} {"train_loss": -26.782562255859375, "global_step": 469588, "epoch": 5657} {"train_loss": -26.866430282592773, "global_step": 469589, "epoch": 5657} {"train_loss": -26.91080665588379, "global_step": 469590, "epoch": 5657} {"train_loss": -27.376941680908203, "global_step": 469591, "epoch": 5657} {"train_loss": -26.488067626953125, "global_step": 469592, "epoch": 5657} {"train_loss": -26.876012802124023, "global_step": 469593, "epoch": 5657} {"train_loss": -27.033618927001953, "global_step": 469594, "epoch": 5657} {"train_loss": -26.69452476501465, "global_step": 469595, "epoch": 5657} {"train_loss": -27.201313018798828, "global_step": 469596, "epoch": 5657} {"train_loss": -27.26422691345215, "global_step": 469597, "epoch": 5657} {"train_loss": -27.117605209350586, "global_step": 469598, "epoch": 5657} {"train_loss": -27.21955680847168, "global_step": 469599, "epoch": 5657} {"train_loss": -27.045053482055664, "global_step": 469600, "epoch": 5657} {"train_loss": -27.085840225219727, "global_step": 469601, "epoch": 5657} {"train_loss": -27.085493087768555, "global_step": 469602, "epoch": 5657} {"train_loss": -27.1002254486084, "global_step": 469603, "epoch": 5657} {"train_loss": -27.2611141204834, "global_step": 469604, "epoch": 5657} {"train_loss": -27.13553237915039, "global_step": 469605, "epoch": 5657} {"train_loss": -27.48062515258789, "global_step": 469606, "epoch": 5657} {"train_loss": -26.960956573486328, "global_step": 469607, "epoch": 5657} {"train_loss": -27.233633041381836, "global_step": 469608, "epoch": 5657} {"train_loss": -27.3533935546875, "global_step": 469609, "epoch": 5657} {"train_loss": -27.3790225982666, "global_step": 469610, "epoch": 5657} {"train_loss": -27.268951416015625, "global_step": 469611, "epoch": 5657} {"train_loss": -26.954193115234375, "global_step": 469612, "epoch": 5657} {"train_loss": -27.014861876706043, "global_step": 469613, "epoch": 5657, "val_loss": 6701263.0} {"train_loss": -25.946996688842773, "global_step": 469614, "epoch": 5658} {"train_loss": -27.063566207885742, "global_step": 469615, "epoch": 5658} {"train_loss": -26.594013214111328, "global_step": 469616, "epoch": 5658} {"train_loss": -26.55267906188965, "global_step": 469617, "epoch": 5658} {"train_loss": -26.774688720703125, "global_step": 469618, "epoch": 5658} {"train_loss": -26.70465087890625, "global_step": 469619, "epoch": 5658} {"train_loss": -26.844242095947266, "global_step": 469620, "epoch": 5658} {"train_loss": -27.031538009643555, "global_step": 469621, "epoch": 5658} {"train_loss": -26.88008689880371, "global_step": 469622, "epoch": 5658} {"train_loss": -27.06926918029785, "global_step": 469623, "epoch": 5658} {"train_loss": -27.11333656311035, "global_step": 469624, "epoch": 5658} {"train_loss": -27.440977096557617, "global_step": 469625, "epoch": 5658} {"train_loss": -27.21449851989746, "global_step": 469626, "epoch": 5658} {"train_loss": -26.616342544555664, "global_step": 469627, "epoch": 5658} {"train_loss": -26.862106323242188, "global_step": 469628, "epoch": 5658} {"train_loss": -27.042526245117188, "global_step": 469629, "epoch": 5658} {"train_loss": -26.826818466186523, "global_step": 469630, "epoch": 5658} {"train_loss": -26.744672775268555, "global_step": 469631, "epoch": 5658} {"train_loss": -26.864965438842773, "global_step": 469632, "epoch": 5658} {"train_loss": -26.81817054748535, "global_step": 469633, "epoch": 5658} {"train_loss": -27.042234420776367, "global_step": 469634, "epoch": 5658} {"train_loss": -27.077259063720703, "global_step": 469635, "epoch": 5658} {"train_loss": -27.23174476623535, "global_step": 469636, "epoch": 5658} {"train_loss": -26.943389892578125, "global_step": 469637, "epoch": 5658} {"train_loss": -26.943023681640625, "global_step": 469638, "epoch": 5658} {"train_loss": -26.939544677734375, "global_step": 469639, "epoch": 5658} {"train_loss": -26.916303634643555, "global_step": 469640, "epoch": 5658} {"train_loss": -26.84986686706543, "global_step": 469641, "epoch": 5658} {"train_loss": -26.933576583862305, "global_step": 469642, "epoch": 5658} {"train_loss": -26.973928451538086, "global_step": 469643, "epoch": 5658} {"train_loss": -27.06548500061035, "global_step": 469644, "epoch": 5658} {"train_loss": -26.760456085205078, "global_step": 469645, "epoch": 5658} {"train_loss": -27.20023536682129, "global_step": 469646, "epoch": 5658} {"train_loss": -27.150033950805664, "global_step": 469647, "epoch": 5658} {"train_loss": -26.909162521362305, "global_step": 469648, "epoch": 5658} {"train_loss": -26.949865341186523, "global_step": 469649, "epoch": 5658} {"train_loss": -27.066675186157227, "global_step": 469650, "epoch": 5658} {"train_loss": -27.477102279663086, "global_step": 469651, "epoch": 5658} {"train_loss": -27.056751251220703, "global_step": 469652, "epoch": 5658} {"train_loss": -27.371707916259766, "global_step": 469653, "epoch": 5658} {"train_loss": -27.613874435424805, "global_step": 469654, "epoch": 5658} {"train_loss": -27.329679489135742, "global_step": 469655, "epoch": 5658} {"train_loss": -27.596179962158203, "global_step": 469656, "epoch": 5658} {"train_loss": -27.120100021362305, "global_step": 469657, "epoch": 5658} {"train_loss": -27.429113388061523, "global_step": 469658, "epoch": 5658} {"train_loss": -27.552017211914062, "global_step": 469659, "epoch": 5658} {"train_loss": -27.310346603393555, "global_step": 469660, "epoch": 5658} {"train_loss": -27.414846420288086, "global_step": 469661, "epoch": 5658} {"train_loss": -26.928146362304688, "global_step": 469662, "epoch": 5658} {"train_loss": -27.879148483276367, "global_step": 469663, "epoch": 5658} {"train_loss": -27.26323890686035, "global_step": 469664, "epoch": 5658} {"train_loss": -27.082916259765625, "global_step": 469665, "epoch": 5658} {"train_loss": -27.365386962890625, "global_step": 469666, "epoch": 5658} {"train_loss": -26.912363052368164, "global_step": 469667, "epoch": 5658} {"train_loss": -27.30829429626465, "global_step": 469668, "epoch": 5658} {"train_loss": -27.16281509399414, "global_step": 469669, "epoch": 5658} {"train_loss": -27.25190544128418, "global_step": 469670, "epoch": 5658} {"train_loss": -27.218708038330078, "global_step": 469671, "epoch": 5658} {"train_loss": -27.234832763671875, "global_step": 469672, "epoch": 5658} {"train_loss": -27.62079429626465, "global_step": 469673, "epoch": 5658} {"train_loss": -27.089263916015625, "global_step": 469674, "epoch": 5658} {"train_loss": -27.39749526977539, "global_step": 469675, "epoch": 5658} {"train_loss": -27.159570693969727, "global_step": 469676, "epoch": 5658} {"train_loss": -27.32339859008789, "global_step": 469677, "epoch": 5658} {"train_loss": -27.405948638916016, "global_step": 469678, "epoch": 5658} {"train_loss": -27.806665420532227, "global_step": 469679, "epoch": 5658} {"train_loss": -27.195728302001953, "global_step": 469680, "epoch": 5658} {"train_loss": -27.1212100982666, "global_step": 469681, "epoch": 5658} {"train_loss": -27.082921981811523, "global_step": 469682, "epoch": 5658} {"train_loss": -27.2457218170166, "global_step": 469683, "epoch": 5658} {"train_loss": -27.159976959228516, "global_step": 469684, "epoch": 5658} {"train_loss": -27.404788970947266, "global_step": 469685, "epoch": 5658} {"train_loss": -27.233596801757812, "global_step": 469686, "epoch": 5658} {"train_loss": -27.07899284362793, "global_step": 469687, "epoch": 5658} {"train_loss": -27.454029083251953, "global_step": 469688, "epoch": 5658} {"train_loss": -27.524866104125977, "global_step": 469689, "epoch": 5658} {"train_loss": -26.792707443237305, "global_step": 469690, "epoch": 5658} {"train_loss": -26.852685928344727, "global_step": 469691, "epoch": 5658} {"train_loss": -26.936344146728516, "global_step": 469692, "epoch": 5658} {"train_loss": -26.82083511352539, "global_step": 469693, "epoch": 5658} {"train_loss": -27.047788619995117, "global_step": 469694, "epoch": 5658} {"train_loss": -27.20355796813965, "global_step": 469695, "epoch": 5658} {"train_loss": -27.103232877800263, "global_step": 469696, "epoch": 5658, "val_loss": 6639884.0} {"train_loss": -26.398681640625, "global_step": 469697, "epoch": 5659} {"train_loss": -26.811017990112305, "global_step": 469698, "epoch": 5659} {"train_loss": -26.80219841003418, "global_step": 469699, "epoch": 5659} {"train_loss": -26.473783493041992, "global_step": 469700, "epoch": 5659} {"train_loss": -25.971851348876953, "global_step": 469701, "epoch": 5659} {"train_loss": -26.895206451416016, "global_step": 469702, "epoch": 5659} {"train_loss": -26.528186798095703, "global_step": 469703, "epoch": 5659} {"train_loss": -26.385595321655273, "global_step": 469704, "epoch": 5659} {"train_loss": -26.802854537963867, "global_step": 469705, "epoch": 5659} {"train_loss": -26.046283721923828, "global_step": 469706, "epoch": 5659} {"train_loss": -26.632431030273438, "global_step": 469707, "epoch": 5659} {"train_loss": -26.7495059967041, "global_step": 469708, "epoch": 5659} {"train_loss": -26.326007843017578, "global_step": 469709, "epoch": 5659} {"train_loss": -26.45350456237793, "global_step": 469710, "epoch": 5659} {"train_loss": -26.845916748046875, "global_step": 469711, "epoch": 5659} {"train_loss": -26.982797622680664, "global_step": 469712, "epoch": 5659} {"train_loss": -26.74016761779785, "global_step": 469713, "epoch": 5659} {"train_loss": -26.292646408081055, "global_step": 469714, "epoch": 5659} {"train_loss": -26.9899845123291, "global_step": 469715, "epoch": 5659} {"train_loss": -26.740686416625977, "global_step": 469716, "epoch": 5659} {"train_loss": -26.85841178894043, "global_step": 469717, "epoch": 5659} {"train_loss": -26.53309440612793, "global_step": 469718, "epoch": 5659} {"train_loss": -26.733678817749023, "global_step": 469719, "epoch": 5659} {"train_loss": -26.966073989868164, "global_step": 469720, "epoch": 5659} {"train_loss": -27.02347755432129, "global_step": 469721, "epoch": 5659} {"train_loss": -27.052997589111328, "global_step": 469722, "epoch": 5659} {"train_loss": -27.248889923095703, "global_step": 469723, "epoch": 5659} {"train_loss": -26.819488525390625, "global_step": 469724, "epoch": 5659} {"train_loss": -26.79402732849121, "global_step": 469725, "epoch": 5659} {"train_loss": -27.230520248413086, "global_step": 469726, "epoch": 5659} {"train_loss": -26.88629722595215, "global_step": 469727, "epoch": 5659} {"train_loss": -27.014434814453125, "global_step": 469728, "epoch": 5659} {"train_loss": -26.808923721313477, "global_step": 469729, "epoch": 5659} {"train_loss": -26.942235946655273, "global_step": 469730, "epoch": 5659} {"train_loss": -26.698575973510742, "global_step": 469731, "epoch": 5659} {"train_loss": -27.110214233398438, "global_step": 469732, "epoch": 5659} {"train_loss": -27.31537437438965, "global_step": 469733, "epoch": 5659} {"train_loss": -27.516225814819336, "global_step": 469734, "epoch": 5659} {"train_loss": -27.100027084350586, "global_step": 469735, "epoch": 5659} {"train_loss": -27.272430419921875, "global_step": 469736, "epoch": 5659} {"train_loss": -27.2601375579834, "global_step": 469737, "epoch": 5659} {"train_loss": -26.849218368530273, "global_step": 469738, "epoch": 5659} {"train_loss": -26.969945907592773, "global_step": 469739, "epoch": 5659} {"train_loss": -27.310840606689453, "global_step": 469740, "epoch": 5659} {"train_loss": -27.2369441986084, "global_step": 469741, "epoch": 5659} {"train_loss": -27.260473251342773, "global_step": 469742, "epoch": 5659} {"train_loss": -27.310346603393555, "global_step": 469743, "epoch": 5659} {"train_loss": -27.10235595703125, "global_step": 469744, "epoch": 5659} {"train_loss": -27.413175582885742, "global_step": 469745, "epoch": 5659} {"train_loss": -27.47171401977539, "global_step": 469746, "epoch": 5659} {"train_loss": -27.4891300201416, "global_step": 469747, "epoch": 5659} {"train_loss": -27.505146026611328, "global_step": 469748, "epoch": 5659} {"train_loss": -27.546415328979492, "global_step": 469749, "epoch": 5659} {"train_loss": -27.79220962524414, "global_step": 469750, "epoch": 5659} {"train_loss": -27.551639556884766, "global_step": 469751, "epoch": 5659} {"train_loss": -27.655370712280273, "global_step": 469752, "epoch": 5659} {"train_loss": -27.302536010742188, "global_step": 469753, "epoch": 5659} {"train_loss": -27.498676300048828, "global_step": 469754, "epoch": 5659} {"train_loss": -27.43625259399414, "global_step": 469755, "epoch": 5659} {"train_loss": -27.165491104125977, "global_step": 469756, "epoch": 5659} {"train_loss": -27.4881591796875, "global_step": 469757, "epoch": 5659} {"train_loss": -26.97992515563965, "global_step": 469758, "epoch": 5659} {"train_loss": -27.07315444946289, "global_step": 469759, "epoch": 5659} {"train_loss": -27.131635665893555, "global_step": 469760, "epoch": 5659} {"train_loss": -26.997623443603516, "global_step": 469761, "epoch": 5659} {"train_loss": -27.278711318969727, "global_step": 469762, "epoch": 5659} {"train_loss": -27.42011833190918, "global_step": 469763, "epoch": 5659} {"train_loss": -26.941192626953125, "global_step": 469764, "epoch": 5659} {"train_loss": -27.35648536682129, "global_step": 469765, "epoch": 5659} {"train_loss": -27.023040771484375, "global_step": 469766, "epoch": 5659} {"train_loss": -27.43159294128418, "global_step": 469767, "epoch": 5659} {"train_loss": -27.084985733032227, "global_step": 469768, "epoch": 5659} {"train_loss": -27.050674438476562, "global_step": 469769, "epoch": 5659} {"train_loss": -27.24430274963379, "global_step": 469770, "epoch": 5659} {"train_loss": -26.828495025634766, "global_step": 469771, "epoch": 5659} {"train_loss": -27.1948184967041, "global_step": 469772, "epoch": 5659} {"train_loss": -26.5576229095459, "global_step": 469773, "epoch": 5659} {"train_loss": -26.358325958251953, "global_step": 469774, "epoch": 5659} {"train_loss": -25.394723892211914, "global_step": 469775, "epoch": 5659} {"train_loss": -25.117361068725586, "global_step": 469776, "epoch": 5659} {"train_loss": -26.48935317993164, "global_step": 469777, "epoch": 5659} {"train_loss": -25.8745174407959, "global_step": 469778, "epoch": 5659} {"train_loss": -26.924756337361163, "global_step": 469779, "epoch": 5659, "val_loss": 6644357.0} {"train_loss": -26.40177345275879, "global_step": 469780, "epoch": 5660} {"train_loss": -26.28065299987793, "global_step": 469781, "epoch": 5660} {"train_loss": -26.251676559448242, "global_step": 469782, "epoch": 5660} {"train_loss": -25.679794311523438, "global_step": 469783, "epoch": 5660} {"train_loss": -26.031949996948242, "global_step": 469784, "epoch": 5660} {"train_loss": -26.129352569580078, "global_step": 469785, "epoch": 5660} {"train_loss": -25.740991592407227, "global_step": 469786, "epoch": 5660} {"train_loss": -26.031482696533203, "global_step": 469787, "epoch": 5660} {"train_loss": -26.297073364257812, "global_step": 469788, "epoch": 5660} {"train_loss": -26.012975692749023, "global_step": 469789, "epoch": 5660} {"train_loss": -26.16757583618164, "global_step": 469790, "epoch": 5660} {"train_loss": -26.240283966064453, "global_step": 469791, "epoch": 5660} {"train_loss": -26.497339248657227, "global_step": 469792, "epoch": 5660} {"train_loss": -26.36562156677246, "global_step": 469793, "epoch": 5660} {"train_loss": -26.564010620117188, "global_step": 469794, "epoch": 5660} {"train_loss": -26.426090240478516, "global_step": 469795, "epoch": 5660} {"train_loss": -26.675540924072266, "global_step": 469796, "epoch": 5660} {"train_loss": -26.84697914123535, "global_step": 469797, "epoch": 5660} {"train_loss": -26.493513107299805, "global_step": 469798, "epoch": 5660} {"train_loss": -26.520431518554688, "global_step": 469799, "epoch": 5660} {"train_loss": -26.876306533813477, "global_step": 469800, "epoch": 5660} {"train_loss": -27.131223678588867, "global_step": 469801, "epoch": 5660} {"train_loss": -27.017929077148438, "global_step": 469802, "epoch": 5660} {"train_loss": -26.76920509338379, "global_step": 469803, "epoch": 5660} {"train_loss": -26.626062393188477, "global_step": 469804, "epoch": 5660} {"train_loss": -26.384801864624023, "global_step": 469805, "epoch": 5660} {"train_loss": -26.921009063720703, "global_step": 469806, "epoch": 5660} {"train_loss": -26.875844955444336, "global_step": 469807, "epoch": 5660} {"train_loss": -26.663034439086914, "global_step": 469808, "epoch": 5660} {"train_loss": -27.110198974609375, "global_step": 469809, "epoch": 5660} {"train_loss": -26.95344352722168, "global_step": 469810, "epoch": 5660} {"train_loss": -27.21937370300293, "global_step": 469811, "epoch": 5660} {"train_loss": -27.27766990661621, "global_step": 469812, "epoch": 5660} {"train_loss": -27.09821128845215, "global_step": 469813, "epoch": 5660} {"train_loss": -27.178308486938477, "global_step": 469814, "epoch": 5660} {"train_loss": -27.028135299682617, "global_step": 469815, "epoch": 5660} {"train_loss": -26.778196334838867, "global_step": 469816, "epoch": 5660} {"train_loss": -26.890295028686523, "global_step": 469817, "epoch": 5660} {"train_loss": -27.335678100585938, "global_step": 469818, "epoch": 5660} {"train_loss": -27.059833526611328, "global_step": 469819, "epoch": 5660} {"train_loss": -27.3546085357666, "global_step": 469820, "epoch": 5660} {"train_loss": -27.097036361694336, "global_step": 469821, "epoch": 5660} {"train_loss": -27.1553897857666, "global_step": 469822, "epoch": 5660} {"train_loss": -27.148427963256836, "global_step": 469823, "epoch": 5660} {"train_loss": -27.3135986328125, "global_step": 469824, "epoch": 5660} {"train_loss": -27.16261863708496, "global_step": 469825, "epoch": 5660} {"train_loss": -27.4117431640625, "global_step": 469826, "epoch": 5660} {"train_loss": -27.469404220581055, "global_step": 469827, "epoch": 5660} {"train_loss": -27.4923038482666, "global_step": 469828, "epoch": 5660} {"train_loss": -26.882434844970703, "global_step": 469829, "epoch": 5660} {"train_loss": -27.0982723236084, "global_step": 469830, "epoch": 5660} {"train_loss": -26.837614059448242, "global_step": 469831, "epoch": 5660} {"train_loss": -26.6649169921875, "global_step": 469832, "epoch": 5660} {"train_loss": -26.668079376220703, "global_step": 469833, "epoch": 5660} {"train_loss": -27.2404842376709, "global_step": 469834, "epoch": 5660} {"train_loss": -27.07659339904785, "global_step": 469835, "epoch": 5660} {"train_loss": -26.5031795501709, "global_step": 469836, "epoch": 5660} {"train_loss": -26.682174682617188, "global_step": 469837, "epoch": 5660} {"train_loss": -26.884429931640625, "global_step": 469838, "epoch": 5660} {"train_loss": -27.17486572265625, "global_step": 469839, "epoch": 5660} {"train_loss": -26.95538330078125, "global_step": 469840, "epoch": 5660} {"train_loss": -27.08857536315918, "global_step": 469841, "epoch": 5660} {"train_loss": -27.1785888671875, "global_step": 469842, "epoch": 5660} {"train_loss": -27.291534423828125, "global_step": 469843, "epoch": 5660} {"train_loss": -27.34384536743164, "global_step": 469844, "epoch": 5660} {"train_loss": -27.722259521484375, "global_step": 469845, "epoch": 5660} {"train_loss": -27.2093448638916, "global_step": 469846, "epoch": 5660} {"train_loss": -26.889123916625977, "global_step": 469847, "epoch": 5660} {"train_loss": -27.412439346313477, "global_step": 469848, "epoch": 5660} {"train_loss": -27.4741268157959, "global_step": 469849, "epoch": 5660} {"train_loss": -27.32926368713379, "global_step": 469850, "epoch": 5660} {"train_loss": -27.264404296875, "global_step": 469851, "epoch": 5660} {"train_loss": -27.292984008789062, "global_step": 469852, "epoch": 5660} {"train_loss": -27.153949737548828, "global_step": 469853, "epoch": 5660} {"train_loss": -27.592670440673828, "global_step": 469854, "epoch": 5660} {"train_loss": -27.659988403320312, "global_step": 469855, "epoch": 5660} {"train_loss": -27.452829360961914, "global_step": 469856, "epoch": 5660} {"train_loss": -27.41269302368164, "global_step": 469857, "epoch": 5660} {"train_loss": -27.716449737548828, "global_step": 469858, "epoch": 5660} {"train_loss": -27.62278175354004, "global_step": 469859, "epoch": 5660} {"train_loss": -27.640003204345703, "global_step": 469860, "epoch": 5660} {"train_loss": -27.351150512695312, "global_step": 469861, "epoch": 5660} {"train_loss": -26.92395403298987, "global_step": 469862, "epoch": 5660, "val_loss": 6667249.0} {"train_loss": -26.814163208007812, "global_step": 469863, "epoch": 5661} {"train_loss": -27.483259201049805, "global_step": 469864, "epoch": 5661} {"train_loss": -27.231992721557617, "global_step": 469865, "epoch": 5661} {"train_loss": -27.092212677001953, "global_step": 469866, "epoch": 5661} {"train_loss": -27.006567001342773, "global_step": 469867, "epoch": 5661} {"train_loss": -27.145095825195312, "global_step": 469868, "epoch": 5661} {"train_loss": -26.72065544128418, "global_step": 469869, "epoch": 5661} {"train_loss": -26.894514083862305, "global_step": 469870, "epoch": 5661} {"train_loss": -27.157087326049805, "global_step": 469871, "epoch": 5661} {"train_loss": -26.83652114868164, "global_step": 469872, "epoch": 5661} {"train_loss": -27.490142822265625, "global_step": 469873, "epoch": 5661} {"train_loss": -27.276269912719727, "global_step": 469874, "epoch": 5661} {"train_loss": -26.942203521728516, "global_step": 469875, "epoch": 5661} {"train_loss": -26.907154083251953, "global_step": 469876, "epoch": 5661} {"train_loss": -26.877126693725586, "global_step": 469877, "epoch": 5661} {"train_loss": -26.91875648498535, "global_step": 469878, "epoch": 5661} {"train_loss": -27.026111602783203, "global_step": 469879, "epoch": 5661} {"train_loss": -26.96504783630371, "global_step": 469880, "epoch": 5661} {"train_loss": -27.106250762939453, "global_step": 469881, "epoch": 5661} {"train_loss": -26.69727897644043, "global_step": 469882, "epoch": 5661} {"train_loss": -27.38777732849121, "global_step": 469883, "epoch": 5661} {"train_loss": -26.923643112182617, "global_step": 469884, "epoch": 5661} {"train_loss": -26.430448532104492, "global_step": 469885, "epoch": 5661} {"train_loss": -26.737655639648438, "global_step": 469886, "epoch": 5661} {"train_loss": -26.97857666015625, "global_step": 469887, "epoch": 5661} {"train_loss": -26.70676040649414, "global_step": 469888, "epoch": 5661} {"train_loss": -26.996967315673828, "global_step": 469889, "epoch": 5661} {"train_loss": -26.79396629333496, "global_step": 469890, "epoch": 5661} {"train_loss": -26.859312057495117, "global_step": 469891, "epoch": 5661} {"train_loss": -27.073505401611328, "global_step": 469892, "epoch": 5661} {"train_loss": -27.320886611938477, "global_step": 469893, "epoch": 5661} {"train_loss": -26.93592643737793, "global_step": 469894, "epoch": 5661} {"train_loss": -27.153656005859375, "global_step": 469895, "epoch": 5661} {"train_loss": -27.235990524291992, "global_step": 469896, "epoch": 5661} {"train_loss": -26.627227783203125, "global_step": 469897, "epoch": 5661} {"train_loss": -27.098901748657227, "global_step": 469898, "epoch": 5661} {"train_loss": -26.89373207092285, "global_step": 469899, "epoch": 5661} {"train_loss": -26.742856979370117, "global_step": 469900, "epoch": 5661} {"train_loss": -26.940631866455078, "global_step": 469901, "epoch": 5661} {"train_loss": -26.989044189453125, "global_step": 469902, "epoch": 5661} {"train_loss": -27.138757705688477, "global_step": 469903, "epoch": 5661} {"train_loss": -27.345600128173828, "global_step": 469904, "epoch": 5661} {"train_loss": -26.729040145874023, "global_step": 469905, "epoch": 5661} {"train_loss": -27.00811767578125, "global_step": 469906, "epoch": 5661} {"train_loss": -26.828214645385742, "global_step": 469907, "epoch": 5661} {"train_loss": -27.014184951782227, "global_step": 469908, "epoch": 5661} {"train_loss": -27.252180099487305, "global_step": 469909, "epoch": 5661} {"train_loss": -27.11341667175293, "global_step": 469910, "epoch": 5661} {"train_loss": -27.015033721923828, "global_step": 469911, "epoch": 5661} {"train_loss": -27.143705368041992, "global_step": 469912, "epoch": 5661} {"train_loss": -27.397445678710938, "global_step": 469913, "epoch": 5661} {"train_loss": -27.397998809814453, "global_step": 469914, "epoch": 5661} {"train_loss": -27.417163848876953, "global_step": 469915, "epoch": 5661} {"train_loss": -27.137680053710938, "global_step": 469916, "epoch": 5661} {"train_loss": -26.997638702392578, "global_step": 469917, "epoch": 5661} {"train_loss": -27.184310913085938, "global_step": 469918, "epoch": 5661} {"train_loss": -27.022382736206055, "global_step": 469919, "epoch": 5661} {"train_loss": -27.09858512878418, "global_step": 469920, "epoch": 5661} {"train_loss": -26.942731857299805, "global_step": 469921, "epoch": 5661} {"train_loss": -27.3826904296875, "global_step": 469922, "epoch": 5661} {"train_loss": -27.42803955078125, "global_step": 469923, "epoch": 5661} {"train_loss": -27.143407821655273, "global_step": 469924, "epoch": 5661} {"train_loss": -27.41298484802246, "global_step": 469925, "epoch": 5661} {"train_loss": -27.59364891052246, "global_step": 469926, "epoch": 5661} {"train_loss": -27.289844512939453, "global_step": 469927, "epoch": 5661} {"train_loss": -27.160629272460938, "global_step": 469928, "epoch": 5661} {"train_loss": -27.674108505249023, "global_step": 469929, "epoch": 5661} {"train_loss": -27.173004150390625, "global_step": 469930, "epoch": 5661} {"train_loss": -27.267370223999023, "global_step": 469931, "epoch": 5661} {"train_loss": -27.506799697875977, "global_step": 469932, "epoch": 5661} {"train_loss": -27.494190216064453, "global_step": 469933, "epoch": 5661} {"train_loss": -27.439550399780273, "global_step": 469934, "epoch": 5661} {"train_loss": -27.246610641479492, "global_step": 469935, "epoch": 5661} {"train_loss": -27.1816349029541, "global_step": 469936, "epoch": 5661} {"train_loss": -27.318023681640625, "global_step": 469937, "epoch": 5661} {"train_loss": -27.435199737548828, "global_step": 469938, "epoch": 5661} {"train_loss": -27.390960693359375, "global_step": 469939, "epoch": 5661} {"train_loss": -27.1855411529541, "global_step": 469940, "epoch": 5661} {"train_loss": -26.9709529876709, "global_step": 469941, "epoch": 5661} {"train_loss": -27.09659194946289, "global_step": 469942, "epoch": 5661} {"train_loss": -26.918216705322266, "global_step": 469943, "epoch": 5661} {"train_loss": -27.404438018798828, "global_step": 469944, "epoch": 5661} {"train_loss": -27.112580218947077, "global_step": 469945, "epoch": 5661, "val_loss": 6729408.5} {"train_loss": -26.440439224243164, "global_step": 469946, "epoch": 5662} {"train_loss": -26.32297706604004, "global_step": 469947, "epoch": 5662} {"train_loss": -27.05072021484375, "global_step": 469948, "epoch": 5662} {"train_loss": -26.711103439331055, "global_step": 469949, "epoch": 5662} {"train_loss": -27.417348861694336, "global_step": 469950, "epoch": 5662} {"train_loss": -26.514678955078125, "global_step": 469951, "epoch": 5662} {"train_loss": -26.128446578979492, "global_step": 469952, "epoch": 5662} {"train_loss": -26.217422485351562, "global_step": 469953, "epoch": 5662} {"train_loss": -26.451202392578125, "global_step": 469954, "epoch": 5662} {"train_loss": -27.3123722076416, "global_step": 469955, "epoch": 5662} {"train_loss": -26.177106857299805, "global_step": 469956, "epoch": 5662} {"train_loss": -26.946441650390625, "global_step": 469957, "epoch": 5662} {"train_loss": -26.59437370300293, "global_step": 469958, "epoch": 5662} {"train_loss": -26.531330108642578, "global_step": 469959, "epoch": 5662} {"train_loss": -26.7817440032959, "global_step": 469960, "epoch": 5662} {"train_loss": -27.026708602905273, "global_step": 469961, "epoch": 5662} {"train_loss": -26.935102462768555, "global_step": 469962, "epoch": 5662} {"train_loss": -27.04902458190918, "global_step": 469963, "epoch": 5662} {"train_loss": -26.8411922454834, "global_step": 469964, "epoch": 5662} {"train_loss": -27.077768325805664, "global_step": 469965, "epoch": 5662} {"train_loss": -27.0689754486084, "global_step": 469966, "epoch": 5662} {"train_loss": -27.089750289916992, "global_step": 469967, "epoch": 5662} {"train_loss": -26.798627853393555, "global_step": 469968, "epoch": 5662} {"train_loss": -27.184085845947266, "global_step": 469969, "epoch": 5662} {"train_loss": -26.990182876586914, "global_step": 469970, "epoch": 5662} {"train_loss": -27.243505477905273, "global_step": 469971, "epoch": 5662} {"train_loss": -27.156005859375, "global_step": 469972, "epoch": 5662} {"train_loss": -26.824804306030273, "global_step": 469973, "epoch": 5662} {"train_loss": -27.13941764831543, "global_step": 469974, "epoch": 5662} {"train_loss": -26.997726440429688, "global_step": 469975, "epoch": 5662} {"train_loss": -27.35125160217285, "global_step": 469976, "epoch": 5662} {"train_loss": -27.134668350219727, "global_step": 469977, "epoch": 5662} {"train_loss": -27.107929229736328, "global_step": 469978, "epoch": 5662} {"train_loss": -26.80864906311035, "global_step": 469979, "epoch": 5662} {"train_loss": -27.187047958374023, "global_step": 469980, "epoch": 5662} {"train_loss": -26.985137939453125, "global_step": 469981, "epoch": 5662} {"train_loss": -27.512975692749023, "global_step": 469982, "epoch": 5662} {"train_loss": -26.944578170776367, "global_step": 469983, "epoch": 5662} {"train_loss": -27.222822189331055, "global_step": 469984, "epoch": 5662} {"train_loss": -27.407255172729492, "global_step": 469985, "epoch": 5662} {"train_loss": -27.4200439453125, "global_step": 469986, "epoch": 5662} {"train_loss": -26.945215225219727, "global_step": 469987, "epoch": 5662} {"train_loss": -27.404600143432617, "global_step": 469988, "epoch": 5662} {"train_loss": -27.260242462158203, "global_step": 469989, "epoch": 5662} {"train_loss": -27.469526290893555, "global_step": 469990, "epoch": 5662} {"train_loss": -27.363739013671875, "global_step": 469991, "epoch": 5662} {"train_loss": -27.355640411376953, "global_step": 469992, "epoch": 5662} {"train_loss": -27.13435173034668, "global_step": 469993, "epoch": 5662} {"train_loss": -27.365880966186523, "global_step": 469994, "epoch": 5662} {"train_loss": -26.787206649780273, "global_step": 469995, "epoch": 5662} {"train_loss": -26.716337203979492, "global_step": 469996, "epoch": 5662} {"train_loss": -26.797595977783203, "global_step": 469997, "epoch": 5662} {"train_loss": -26.84626579284668, "global_step": 469998, "epoch": 5662} {"train_loss": -27.399505615234375, "global_step": 469999, "epoch": 5662} {"train_loss": -27.404951095581055, "global_step": 470000, "epoch": 5662} {"train_loss": -26.60883903503418, "global_step": 470001, "epoch": 5662} {"train_loss": -27.141864776611328, "global_step": 470002, "epoch": 5662} {"train_loss": -27.251007080078125, "global_step": 470003, "epoch": 5662} {"train_loss": -26.947574615478516, "global_step": 470004, "epoch": 5662} {"train_loss": -27.22535514831543, "global_step": 470005, "epoch": 5662} {"train_loss": -27.2323055267334, "global_step": 470006, "epoch": 5662} {"train_loss": -26.985700607299805, "global_step": 470007, "epoch": 5662} {"train_loss": -27.488428115844727, "global_step": 470008, "epoch": 5662} {"train_loss": -27.30632972717285, "global_step": 470009, "epoch": 5662} {"train_loss": -27.3126220703125, "global_step": 470010, "epoch": 5662} {"train_loss": -27.373579025268555, "global_step": 470011, "epoch": 5662} {"train_loss": -27.205347061157227, "global_step": 470012, "epoch": 5662} {"train_loss": -26.962966918945312, "global_step": 470013, "epoch": 5662} {"train_loss": -27.45460319519043, "global_step": 470014, "epoch": 5662} {"train_loss": -27.6486873626709, "global_step": 470015, "epoch": 5662} {"train_loss": -27.26130485534668, "global_step": 470016, "epoch": 5662} {"train_loss": -27.429418563842773, "global_step": 470017, "epoch": 5662} {"train_loss": -27.09375, "global_step": 470018, "epoch": 5662} {"train_loss": -27.223052978515625, "global_step": 470019, "epoch": 5662} {"train_loss": -26.750476837158203, "global_step": 470020, "epoch": 5662} {"train_loss": -26.571027755737305, "global_step": 470021, "epoch": 5662} {"train_loss": -26.93531608581543, "global_step": 470022, "epoch": 5662} {"train_loss": -26.8028564453125, "global_step": 470023, "epoch": 5662} {"train_loss": -27.012680053710938, "global_step": 470024, "epoch": 5662} {"train_loss": -27.113805770874023, "global_step": 470025, "epoch": 5662} {"train_loss": -27.00896644592285, "global_step": 470026, "epoch": 5662} {"train_loss": -27.078781127929688, "global_step": 470027, "epoch": 5662} {"train_loss": -27.028062751494257, "global_step": 470028, "epoch": 5662, "val_loss": 6777617.0} {"train_loss": -26.3489990234375, "global_step": 470029, "epoch": 5663} {"train_loss": -26.48164176940918, "global_step": 470030, "epoch": 5663} {"train_loss": -25.851444244384766, "global_step": 470031, "epoch": 5663} {"train_loss": -26.525760650634766, "global_step": 470032, "epoch": 5663} {"train_loss": -25.699539184570312, "global_step": 470033, "epoch": 5663} {"train_loss": -25.960235595703125, "global_step": 470034, "epoch": 5663} {"train_loss": -26.459070205688477, "global_step": 470035, "epoch": 5663} {"train_loss": -25.743640899658203, "global_step": 470036, "epoch": 5663} {"train_loss": -26.101531982421875, "global_step": 470037, "epoch": 5663} {"train_loss": -25.953842163085938, "global_step": 470038, "epoch": 5663} {"train_loss": -26.007938385009766, "global_step": 470039, "epoch": 5663} {"train_loss": -26.50083351135254, "global_step": 470040, "epoch": 5663} {"train_loss": -26.1959171295166, "global_step": 470041, "epoch": 5663} {"train_loss": -26.722814559936523, "global_step": 470042, "epoch": 5663} {"train_loss": -26.346887588500977, "global_step": 470043, "epoch": 5663} {"train_loss": -26.607181549072266, "global_step": 470044, "epoch": 5663} {"train_loss": -27.013158798217773, "global_step": 470045, "epoch": 5663} {"train_loss": -26.8714599609375, "global_step": 470046, "epoch": 5663} {"train_loss": -26.913122177124023, "global_step": 470047, "epoch": 5663} {"train_loss": -26.476516723632812, "global_step": 470048, "epoch": 5663} {"train_loss": -26.810108184814453, "global_step": 470049, "epoch": 5663} {"train_loss": -27.282934188842773, "global_step": 470050, "epoch": 5663} {"train_loss": -26.86838722229004, "global_step": 470051, "epoch": 5663} {"train_loss": -26.737043380737305, "global_step": 470052, "epoch": 5663} {"train_loss": -26.702163696289062, "global_step": 470053, "epoch": 5663} {"train_loss": -27.05240249633789, "global_step": 470054, "epoch": 5663} {"train_loss": -27.18003273010254, "global_step": 470055, "epoch": 5663} {"train_loss": -27.01166343688965, "global_step": 470056, "epoch": 5663} {"train_loss": -26.69574546813965, "global_step": 470057, "epoch": 5663} {"train_loss": -26.95481300354004, "global_step": 470058, "epoch": 5663} {"train_loss": -26.57988929748535, "global_step": 470059, "epoch": 5663} {"train_loss": -27.01322364807129, "global_step": 470060, "epoch": 5663} {"train_loss": -27.046802520751953, "global_step": 470061, "epoch": 5663} {"train_loss": -27.048673629760742, "global_step": 470062, "epoch": 5663} {"train_loss": -27.041015625, "global_step": 470063, "epoch": 5663} {"train_loss": -26.977819442749023, "global_step": 470064, "epoch": 5663} {"train_loss": -27.29010009765625, "global_step": 470065, "epoch": 5663} {"train_loss": -27.4405574798584, "global_step": 470066, "epoch": 5663} {"train_loss": -27.10666847229004, "global_step": 470067, "epoch": 5663} {"train_loss": -27.61421775817871, "global_step": 470068, "epoch": 5663} {"train_loss": -27.23895263671875, "global_step": 470069, "epoch": 5663} {"train_loss": -27.10938835144043, "global_step": 470070, "epoch": 5663} {"train_loss": -27.42698097229004, "global_step": 470071, "epoch": 5663} {"train_loss": -27.407697677612305, "global_step": 470072, "epoch": 5663} {"train_loss": -27.280187606811523, "global_step": 470073, "epoch": 5663} {"train_loss": -27.488019943237305, "global_step": 470074, "epoch": 5663} {"train_loss": -27.59370994567871, "global_step": 470075, "epoch": 5663} {"train_loss": -27.17140769958496, "global_step": 470076, "epoch": 5663} {"train_loss": -26.962860107421875, "global_step": 470077, "epoch": 5663} {"train_loss": -27.405176162719727, "global_step": 470078, "epoch": 5663} {"train_loss": -27.206201553344727, "global_step": 470079, "epoch": 5663} {"train_loss": -27.370351791381836, "global_step": 470080, "epoch": 5663} {"train_loss": -27.503751754760742, "global_step": 470081, "epoch": 5663} {"train_loss": -27.34889030456543, "global_step": 470082, "epoch": 5663} {"train_loss": -27.504735946655273, "global_step": 470083, "epoch": 5663} {"train_loss": -27.002593994140625, "global_step": 470084, "epoch": 5663} {"train_loss": -27.46870231628418, "global_step": 470085, "epoch": 5663} {"train_loss": -27.071874618530273, "global_step": 470086, "epoch": 5663} {"train_loss": -27.394094467163086, "global_step": 470087, "epoch": 5663} {"train_loss": -27.113727569580078, "global_step": 470088, "epoch": 5663} {"train_loss": -27.0428466796875, "global_step": 470089, "epoch": 5663} {"train_loss": -26.975326538085938, "global_step": 470090, "epoch": 5663} {"train_loss": -27.65935707092285, "global_step": 470091, "epoch": 5663} {"train_loss": -26.7685604095459, "global_step": 470092, "epoch": 5663} {"train_loss": -27.1873836517334, "global_step": 470093, "epoch": 5663} {"train_loss": -26.918807983398438, "global_step": 470094, "epoch": 5663} {"train_loss": -26.5008544921875, "global_step": 470095, "epoch": 5663} {"train_loss": -26.862939834594727, "global_step": 470096, "epoch": 5663} {"train_loss": -26.802753448486328, "global_step": 470097, "epoch": 5663} {"train_loss": -27.396326065063477, "global_step": 470098, "epoch": 5663} {"train_loss": -27.04400634765625, "global_step": 470099, "epoch": 5663} {"train_loss": -27.141983032226562, "global_step": 470100, "epoch": 5663} {"train_loss": -26.905399322509766, "global_step": 470101, "epoch": 5663} {"train_loss": -26.95905113220215, "global_step": 470102, "epoch": 5663} {"train_loss": -27.03423500061035, "global_step": 470103, "epoch": 5663} {"train_loss": -27.13838005065918, "global_step": 470104, "epoch": 5663} {"train_loss": -26.9956111907959, "global_step": 470105, "epoch": 5663} {"train_loss": -26.709470748901367, "global_step": 470106, "epoch": 5663} {"train_loss": -27.12738609313965, "global_step": 470107, "epoch": 5663} {"train_loss": -27.054296493530273, "global_step": 470108, "epoch": 5663} {"train_loss": -26.814550399780273, "global_step": 470109, "epoch": 5663} {"train_loss": -27.009504318237305, "global_step": 470110, "epoch": 5663} {"train_loss": -26.91477423978139, "global_step": 470111, "epoch": 5663, "val_loss": 6740058.0} {"train_loss": -26.076913833618164, "global_step": 470112, "epoch": 5664} {"train_loss": -26.1921443939209, "global_step": 470113, "epoch": 5664} {"train_loss": -26.937530517578125, "global_step": 470114, "epoch": 5664} {"train_loss": -26.331409454345703, "global_step": 470115, "epoch": 5664} {"train_loss": -26.263019561767578, "global_step": 470116, "epoch": 5664} {"train_loss": -26.52153968811035, "global_step": 470117, "epoch": 5664} {"train_loss": -26.530481338500977, "global_step": 470118, "epoch": 5664} {"train_loss": -26.426931381225586, "global_step": 470119, "epoch": 5664} {"train_loss": -26.654844284057617, "global_step": 470120, "epoch": 5664} {"train_loss": -26.019678115844727, "global_step": 470121, "epoch": 5664} {"train_loss": -26.516706466674805, "global_step": 470122, "epoch": 5664} {"train_loss": -26.5128231048584, "global_step": 470123, "epoch": 5664} {"train_loss": -26.863910675048828, "global_step": 470124, "epoch": 5664} {"train_loss": -26.4373779296875, "global_step": 470125, "epoch": 5664} {"train_loss": -26.754491806030273, "global_step": 470126, "epoch": 5664} {"train_loss": -26.45330810546875, "global_step": 470127, "epoch": 5664} {"train_loss": -26.925657272338867, "global_step": 470128, "epoch": 5664} {"train_loss": -26.723169326782227, "global_step": 470129, "epoch": 5664} {"train_loss": -26.62171745300293, "global_step": 470130, "epoch": 5664} {"train_loss": -26.50516128540039, "global_step": 470131, "epoch": 5664} {"train_loss": -27.01832389831543, "global_step": 470132, "epoch": 5664} {"train_loss": -26.645374298095703, "global_step": 470133, "epoch": 5664} {"train_loss": -27.051111221313477, "global_step": 470134, "epoch": 5664} {"train_loss": -27.077457427978516, "global_step": 470135, "epoch": 5664} {"train_loss": -26.983625411987305, "global_step": 470136, "epoch": 5664} {"train_loss": -27.140644073486328, "global_step": 470137, "epoch": 5664} {"train_loss": -27.391637802124023, "global_step": 470138, "epoch": 5664} {"train_loss": -26.9706974029541, "global_step": 470139, "epoch": 5664} {"train_loss": -27.27703857421875, "global_step": 470140, "epoch": 5664} {"train_loss": -27.1417179107666, "global_step": 470141, "epoch": 5664} {"train_loss": -27.049463272094727, "global_step": 470142, "epoch": 5664} {"train_loss": -27.246063232421875, "global_step": 470143, "epoch": 5664} {"train_loss": -27.1864070892334, "global_step": 470144, "epoch": 5664} {"train_loss": -27.69037437438965, "global_step": 470145, "epoch": 5664} {"train_loss": -27.387481689453125, "global_step": 470146, "epoch": 5664} {"train_loss": -27.24696159362793, "global_step": 470147, "epoch": 5664} {"train_loss": -27.239633560180664, "global_step": 470148, "epoch": 5664} {"train_loss": -27.317365646362305, "global_step": 470149, "epoch": 5664} {"train_loss": -27.5731143951416, "global_step": 470150, "epoch": 5664} {"train_loss": -27.675647735595703, "global_step": 470151, "epoch": 5664} {"train_loss": -27.270050048828125, "global_step": 470152, "epoch": 5664} {"train_loss": -27.393033981323242, "global_step": 470153, "epoch": 5664} {"train_loss": -27.579519271850586, "global_step": 470154, "epoch": 5664} {"train_loss": -27.386383056640625, "global_step": 470155, "epoch": 5664} {"train_loss": -27.610166549682617, "global_step": 470156, "epoch": 5664} {"train_loss": -27.339277267456055, "global_step": 470157, "epoch": 5664} {"train_loss": -27.509967803955078, "global_step": 470158, "epoch": 5664} {"train_loss": -27.464004516601562, "global_step": 470159, "epoch": 5664} {"train_loss": -26.89997673034668, "global_step": 470160, "epoch": 5664} {"train_loss": -27.178586959838867, "global_step": 470161, "epoch": 5664} {"train_loss": -27.270450592041016, "global_step": 470162, "epoch": 5664} {"train_loss": -26.870330810546875, "global_step": 470163, "epoch": 5664} {"train_loss": -27.458356857299805, "global_step": 470164, "epoch": 5664} {"train_loss": -27.373022079467773, "global_step": 470165, "epoch": 5664} {"train_loss": -27.287784576416016, "global_step": 470166, "epoch": 5664} {"train_loss": -27.404184341430664, "global_step": 470167, "epoch": 5664} {"train_loss": -26.974695205688477, "global_step": 470168, "epoch": 5664} {"train_loss": -27.460590362548828, "global_step": 470169, "epoch": 5664} {"train_loss": -27.618072509765625, "global_step": 470170, "epoch": 5664} {"train_loss": -27.386383056640625, "global_step": 470171, "epoch": 5664} {"train_loss": -27.50128173828125, "global_step": 470172, "epoch": 5664} {"train_loss": -27.54483413696289, "global_step": 470173, "epoch": 5664} {"train_loss": -27.456501007080078, "global_step": 470174, "epoch": 5664} {"train_loss": -27.038679122924805, "global_step": 470175, "epoch": 5664} {"train_loss": -27.264123916625977, "global_step": 470176, "epoch": 5664} {"train_loss": -27.482690811157227, "global_step": 470177, "epoch": 5664} {"train_loss": -27.357696533203125, "global_step": 470178, "epoch": 5664} {"train_loss": -27.303958892822266, "global_step": 470179, "epoch": 5664} {"train_loss": -27.327655792236328, "global_step": 470180, "epoch": 5664} {"train_loss": -27.5178165435791, "global_step": 470181, "epoch": 5664} {"train_loss": -26.982574462890625, "global_step": 470182, "epoch": 5664} {"train_loss": -26.33392333984375, "global_step": 470183, "epoch": 5664} {"train_loss": -26.392730712890625, "global_step": 470184, "epoch": 5664} {"train_loss": -26.9577693939209, "global_step": 470185, "epoch": 5664} {"train_loss": -27.1204833984375, "global_step": 470186, "epoch": 5664} {"train_loss": -27.13715934753418, "global_step": 470187, "epoch": 5664} {"train_loss": -27.1044864654541, "global_step": 470188, "epoch": 5664} {"train_loss": -26.822021484375, "global_step": 470189, "epoch": 5664} {"train_loss": -27.276514053344727, "global_step": 470190, "epoch": 5664} {"train_loss": -27.732419967651367, "global_step": 470191, "epoch": 5664} {"train_loss": -27.1074161529541, "global_step": 470192, "epoch": 5664} {"train_loss": -27.170339584350586, "global_step": 470193, "epoch": 5664} {"train_loss": -27.061989290168487, "global_step": 470194, "epoch": 5664, "val_loss": 6710010.0} {"train_loss": -26.977766036987305, "global_step": 470195, "epoch": 5665} {"train_loss": -27.084150314331055, "global_step": 470196, "epoch": 5665} {"train_loss": -26.973682403564453, "global_step": 470197, "epoch": 5665} {"train_loss": -26.82136344909668, "global_step": 470198, "epoch": 5665} {"train_loss": -26.628103256225586, "global_step": 470199, "epoch": 5665} {"train_loss": -26.416784286499023, "global_step": 470200, "epoch": 5665} {"train_loss": -26.61431884765625, "global_step": 470201, "epoch": 5665} {"train_loss": -26.83841323852539, "global_step": 470202, "epoch": 5665} {"train_loss": -26.960973739624023, "global_step": 470203, "epoch": 5665} {"train_loss": -26.64121437072754, "global_step": 470204, "epoch": 5665} {"train_loss": -27.113422393798828, "global_step": 470205, "epoch": 5665} {"train_loss": -26.712844848632812, "global_step": 470206, "epoch": 5665} {"train_loss": -26.76873207092285, "global_step": 470207, "epoch": 5665} {"train_loss": -27.008142471313477, "global_step": 470208, "epoch": 5665} {"train_loss": -27.0736141204834, "global_step": 470209, "epoch": 5665} {"train_loss": -27.23358154296875, "global_step": 470210, "epoch": 5665} {"train_loss": -27.041425704956055, "global_step": 470211, "epoch": 5665} {"train_loss": -26.9210147857666, "global_step": 470212, "epoch": 5665} {"train_loss": -27.082721710205078, "global_step": 470213, "epoch": 5665} {"train_loss": -27.321426391601562, "global_step": 470214, "epoch": 5665} {"train_loss": -27.31424331665039, "global_step": 470215, "epoch": 5665} {"train_loss": -26.953205108642578, "global_step": 470216, "epoch": 5665} {"train_loss": -27.251392364501953, "global_step": 470217, "epoch": 5665} {"train_loss": -26.741657257080078, "global_step": 470218, "epoch": 5665} {"train_loss": -27.083356857299805, "global_step": 470219, "epoch": 5665} {"train_loss": -26.784387588500977, "global_step": 470220, "epoch": 5665} {"train_loss": -27.314472198486328, "global_step": 470221, "epoch": 5665} {"train_loss": -27.15606117248535, "global_step": 470222, "epoch": 5665} {"train_loss": -26.874134063720703, "global_step": 470223, "epoch": 5665} {"train_loss": -27.04217529296875, "global_step": 470224, "epoch": 5665} {"train_loss": -26.9622802734375, "global_step": 470225, "epoch": 5665} {"train_loss": -26.579618453979492, "global_step": 470226, "epoch": 5665} {"train_loss": -26.845386505126953, "global_step": 470227, "epoch": 5665} {"train_loss": -27.027097702026367, "global_step": 470228, "epoch": 5665} {"train_loss": -26.684406280517578, "global_step": 470229, "epoch": 5665} {"train_loss": -27.132904052734375, "global_step": 470230, "epoch": 5665} {"train_loss": -27.2243709564209, "global_step": 470231, "epoch": 5665} {"train_loss": -26.486013412475586, "global_step": 470232, "epoch": 5665} {"train_loss": -27.207386016845703, "global_step": 470233, "epoch": 5665} {"train_loss": -26.645795822143555, "global_step": 470234, "epoch": 5665} {"train_loss": -26.357025146484375, "global_step": 470235, "epoch": 5665} {"train_loss": -26.79244041442871, "global_step": 470236, "epoch": 5665} {"train_loss": -27.398609161376953, "global_step": 470237, "epoch": 5665} {"train_loss": -26.7233829498291, "global_step": 470238, "epoch": 5665} {"train_loss": -26.86423683166504, "global_step": 470239, "epoch": 5665} {"train_loss": -26.569860458374023, "global_step": 470240, "epoch": 5665} {"train_loss": -27.31216812133789, "global_step": 470241, "epoch": 5665} {"train_loss": -26.949081420898438, "global_step": 470242, "epoch": 5665} {"train_loss": -27.0120792388916, "global_step": 470243, "epoch": 5665} {"train_loss": -26.995731353759766, "global_step": 470244, "epoch": 5665} {"train_loss": -27.42343521118164, "global_step": 470245, "epoch": 5665} {"train_loss": -27.37958335876465, "global_step": 470246, "epoch": 5665} {"train_loss": -27.184513092041016, "global_step": 470247, "epoch": 5665} {"train_loss": -27.385513305664062, "global_step": 470248, "epoch": 5665} {"train_loss": -26.976139068603516, "global_step": 470249, "epoch": 5665} {"train_loss": -27.06787109375, "global_step": 470250, "epoch": 5665} {"train_loss": -26.976186752319336, "global_step": 470251, "epoch": 5665} {"train_loss": -27.379684448242188, "global_step": 470252, "epoch": 5665} {"train_loss": -26.72366714477539, "global_step": 470253, "epoch": 5665} {"train_loss": -27.137571334838867, "global_step": 470254, "epoch": 5665} {"train_loss": -27.354124069213867, "global_step": 470255, "epoch": 5665} {"train_loss": -27.4335994720459, "global_step": 470256, "epoch": 5665} {"train_loss": -27.08148765563965, "global_step": 470257, "epoch": 5665} {"train_loss": -26.7990665435791, "global_step": 470258, "epoch": 5665} {"train_loss": -27.5928897857666, "global_step": 470259, "epoch": 5665} {"train_loss": -26.8873291015625, "global_step": 470260, "epoch": 5665} {"train_loss": -27.55280876159668, "global_step": 470261, "epoch": 5665} {"train_loss": -27.62274169921875, "global_step": 470262, "epoch": 5665} {"train_loss": -27.294797897338867, "global_step": 470263, "epoch": 5665} {"train_loss": -27.66031265258789, "global_step": 470264, "epoch": 5665} {"train_loss": -27.3107967376709, "global_step": 470265, "epoch": 5665} {"train_loss": -27.409128189086914, "global_step": 470266, "epoch": 5665} {"train_loss": -27.41914176940918, "global_step": 470267, "epoch": 5665} {"train_loss": -27.269987106323242, "global_step": 470268, "epoch": 5665} {"train_loss": -27.66107749938965, "global_step": 470269, "epoch": 5665} {"train_loss": -26.89149284362793, "global_step": 470270, "epoch": 5665} {"train_loss": -27.80177879333496, "global_step": 470271, "epoch": 5665} {"train_loss": -27.194799423217773, "global_step": 470272, "epoch": 5665} {"train_loss": -27.235517501831055, "global_step": 470273, "epoch": 5665} {"train_loss": -27.19571876525879, "global_step": 470274, "epoch": 5665} {"train_loss": -27.0779972076416, "global_step": 470275, "epoch": 5665} {"train_loss": -27.063032150268555, "global_step": 470276, "epoch": 5665} {"train_loss": -27.086528984897107, "global_step": 470277, "epoch": 5665, "val_loss": 6676195.0} {"train_loss": -25.986297607421875, "global_step": 470278, "epoch": 5666} {"train_loss": -26.113386154174805, "global_step": 470279, "epoch": 5666} {"train_loss": -26.295211791992188, "global_step": 470280, "epoch": 5666} {"train_loss": -26.411848068237305, "global_step": 470281, "epoch": 5666} {"train_loss": -25.911518096923828, "global_step": 470282, "epoch": 5666} {"train_loss": -26.529211044311523, "global_step": 470283, "epoch": 5666} {"train_loss": -26.73087501525879, "global_step": 470284, "epoch": 5666} {"train_loss": -25.90912437438965, "global_step": 470285, "epoch": 5666} {"train_loss": -26.402145385742188, "global_step": 470286, "epoch": 5666} {"train_loss": -26.27083396911621, "global_step": 470287, "epoch": 5666} {"train_loss": -26.911218643188477, "global_step": 470288, "epoch": 5666} {"train_loss": -26.41228675842285, "global_step": 470289, "epoch": 5666} {"train_loss": -26.414337158203125, "global_step": 470290, "epoch": 5666} {"train_loss": -26.2911319732666, "global_step": 470291, "epoch": 5666} {"train_loss": -26.661270141601562, "global_step": 470292, "epoch": 5666} {"train_loss": -26.648649215698242, "global_step": 470293, "epoch": 5666} {"train_loss": -26.669742584228516, "global_step": 470294, "epoch": 5666} {"train_loss": -26.506162643432617, "global_step": 470295, "epoch": 5666} {"train_loss": -26.531309127807617, "global_step": 470296, "epoch": 5666} {"train_loss": -26.892398834228516, "global_step": 470297, "epoch": 5666} {"train_loss": -26.697065353393555, "global_step": 470298, "epoch": 5666} {"train_loss": -26.541845321655273, "global_step": 470299, "epoch": 5666} {"train_loss": -27.091938018798828, "global_step": 470300, "epoch": 5666} {"train_loss": -26.528823852539062, "global_step": 470301, "epoch": 5666} {"train_loss": -26.886646270751953, "global_step": 470302, "epoch": 5666} {"train_loss": -26.838987350463867, "global_step": 470303, "epoch": 5666} {"train_loss": -27.0015811920166, "global_step": 470304, "epoch": 5666} {"train_loss": -26.822336196899414, "global_step": 470305, "epoch": 5666} {"train_loss": -27.005170822143555, "global_step": 470306, "epoch": 5666} {"train_loss": -27.503503799438477, "global_step": 470307, "epoch": 5666} {"train_loss": -26.91773796081543, "global_step": 470308, "epoch": 5666} {"train_loss": -27.2757511138916, "global_step": 470309, "epoch": 5666} {"train_loss": -26.71693229675293, "global_step": 470310, "epoch": 5666} {"train_loss": -27.0416259765625, "global_step": 470311, "epoch": 5666} {"train_loss": -26.835851669311523, "global_step": 470312, "epoch": 5666} {"train_loss": -27.2696590423584, "global_step": 470313, "epoch": 5666} {"train_loss": -27.16546058654785, "global_step": 470314, "epoch": 5666} {"train_loss": -27.320932388305664, "global_step": 470315, "epoch": 5666} {"train_loss": -27.30169105529785, "global_step": 470316, "epoch": 5666} {"train_loss": -27.36753273010254, "global_step": 470317, "epoch": 5666} {"train_loss": -27.173629760742188, "global_step": 470318, "epoch": 5666} {"train_loss": -27.316137313842773, "global_step": 470319, "epoch": 5666} {"train_loss": -27.278532028198242, "global_step": 470320, "epoch": 5666} {"train_loss": -27.54917335510254, "global_step": 470321, "epoch": 5666} {"train_loss": -27.38136863708496, "global_step": 470322, "epoch": 5666} {"train_loss": -27.14190101623535, "global_step": 470323, "epoch": 5666} {"train_loss": -27.362201690673828, "global_step": 470324, "epoch": 5666} {"train_loss": -27.34641456604004, "global_step": 470325, "epoch": 5666} {"train_loss": -27.37690544128418, "global_step": 470326, "epoch": 5666} {"train_loss": -27.546300888061523, "global_step": 470327, "epoch": 5666} {"train_loss": -27.39484977722168, "global_step": 470328, "epoch": 5666} {"train_loss": -27.72808837890625, "global_step": 470329, "epoch": 5666} {"train_loss": -27.417224884033203, "global_step": 470330, "epoch": 5666} {"train_loss": -27.67877769470215, "global_step": 470331, "epoch": 5666} {"train_loss": -27.194250106811523, "global_step": 470332, "epoch": 5666} {"train_loss": -27.443347930908203, "global_step": 470333, "epoch": 5666} {"train_loss": -27.329925537109375, "global_step": 470334, "epoch": 5666} {"train_loss": -27.170560836791992, "global_step": 470335, "epoch": 5666} {"train_loss": -27.493494033813477, "global_step": 470336, "epoch": 5666} {"train_loss": -27.207075119018555, "global_step": 470337, "epoch": 5666} {"train_loss": -27.51889419555664, "global_step": 470338, "epoch": 5666} {"train_loss": -27.439590454101562, "global_step": 470339, "epoch": 5666} {"train_loss": -27.097003936767578, "global_step": 470340, "epoch": 5666} {"train_loss": -27.137235641479492, "global_step": 470341, "epoch": 5666} {"train_loss": -27.4016056060791, "global_step": 470342, "epoch": 5666} {"train_loss": -27.104999542236328, "global_step": 470343, "epoch": 5666} {"train_loss": -27.226293563842773, "global_step": 470344, "epoch": 5666} {"train_loss": -26.83930015563965, "global_step": 470345, "epoch": 5666} {"train_loss": -26.4518985748291, "global_step": 470346, "epoch": 5666} {"train_loss": -26.22064781188965, "global_step": 470347, "epoch": 5666} {"train_loss": -27.00998878479004, "global_step": 470348, "epoch": 5666} {"train_loss": -27.30047035217285, "global_step": 470349, "epoch": 5666} {"train_loss": -27.545785903930664, "global_step": 470350, "epoch": 5666} {"train_loss": -27.055124282836914, "global_step": 470351, "epoch": 5666} {"train_loss": -27.139633178710938, "global_step": 470352, "epoch": 5666} {"train_loss": -27.949359893798828, "global_step": 470353, "epoch": 5666} {"train_loss": -26.993976593017578, "global_step": 470354, "epoch": 5666} {"train_loss": -26.93250846862793, "global_step": 470355, "epoch": 5666} {"train_loss": -27.101511001586914, "global_step": 470356, "epoch": 5666} {"train_loss": -27.20990562438965, "global_step": 470357, "epoch": 5666} {"train_loss": -26.806127548217773, "global_step": 470358, "epoch": 5666} {"train_loss": -26.702001571655273, "global_step": 470359, "epoch": 5666} {"train_loss": -26.997569325458574, "global_step": 470360, "epoch": 5666, "val_loss": 6746828.0} {"train_loss": -25.60993766784668, "global_step": 470361, "epoch": 5667} {"train_loss": -26.267120361328125, "global_step": 470362, "epoch": 5667} {"train_loss": -26.50848960876465, "global_step": 470363, "epoch": 5667} {"train_loss": -26.301847457885742, "global_step": 470364, "epoch": 5667} {"train_loss": -26.08990478515625, "global_step": 470365, "epoch": 5667} {"train_loss": -26.804555892944336, "global_step": 470366, "epoch": 5667} {"train_loss": -26.33906364440918, "global_step": 470367, "epoch": 5667} {"train_loss": -26.659717559814453, "global_step": 470368, "epoch": 5667} {"train_loss": -26.54737663269043, "global_step": 470369, "epoch": 5667} {"train_loss": -26.42762565612793, "global_step": 470370, "epoch": 5667} {"train_loss": -26.648950576782227, "global_step": 470371, "epoch": 5667} {"train_loss": -26.371326446533203, "global_step": 470372, "epoch": 5667} {"train_loss": -26.457202911376953, "global_step": 470373, "epoch": 5667} {"train_loss": -26.8096866607666, "global_step": 470374, "epoch": 5667} {"train_loss": -26.225919723510742, "global_step": 470375, "epoch": 5667} {"train_loss": -26.705289840698242, "global_step": 470376, "epoch": 5667} {"train_loss": -26.678266525268555, "global_step": 470377, "epoch": 5667} {"train_loss": -26.870447158813477, "global_step": 470378, "epoch": 5667} {"train_loss": -26.530780792236328, "global_step": 470379, "epoch": 5667} {"train_loss": -27.186124801635742, "global_step": 470380, "epoch": 5667} {"train_loss": -27.006383895874023, "global_step": 470381, "epoch": 5667} {"train_loss": -26.914432525634766, "global_step": 470382, "epoch": 5667} {"train_loss": -26.984399795532227, "global_step": 470383, "epoch": 5667} {"train_loss": -26.659391403198242, "global_step": 470384, "epoch": 5667} {"train_loss": -27.12200927734375, "global_step": 470385, "epoch": 5667} {"train_loss": -27.07610511779785, "global_step": 470386, "epoch": 5667} {"train_loss": -27.310327529907227, "global_step": 470387, "epoch": 5667} {"train_loss": -27.024587631225586, "global_step": 470388, "epoch": 5667} {"train_loss": -27.231420516967773, "global_step": 470389, "epoch": 5667} {"train_loss": -27.223779678344727, "global_step": 470390, "epoch": 5667} {"train_loss": -27.104877471923828, "global_step": 470391, "epoch": 5667} {"train_loss": -26.755834579467773, "global_step": 470392, "epoch": 5667} {"train_loss": -27.024343490600586, "global_step": 470393, "epoch": 5667} {"train_loss": -27.083581924438477, "global_step": 470394, "epoch": 5667} {"train_loss": -26.975828170776367, "global_step": 470395, "epoch": 5667} {"train_loss": -27.499866485595703, "global_step": 470396, "epoch": 5667} {"train_loss": -27.199981689453125, "global_step": 470397, "epoch": 5667} {"train_loss": -27.07663917541504, "global_step": 470398, "epoch": 5667} {"train_loss": -27.23383903503418, "global_step": 470399, "epoch": 5667} {"train_loss": -27.218801498413086, "global_step": 470400, "epoch": 5667} {"train_loss": -27.379812240600586, "global_step": 470401, "epoch": 5667} {"train_loss": -27.40303611755371, "global_step": 470402, "epoch": 5667} {"train_loss": -27.197473526000977, "global_step": 470403, "epoch": 5667} {"train_loss": -27.368078231811523, "global_step": 470404, "epoch": 5667} {"train_loss": -27.378332138061523, "global_step": 470405, "epoch": 5667} {"train_loss": -27.14764404296875, "global_step": 470406, "epoch": 5667} {"train_loss": -26.7784366607666, "global_step": 470407, "epoch": 5667} {"train_loss": -27.34604835510254, "global_step": 470408, "epoch": 5667} {"train_loss": -27.278757095336914, "global_step": 470409, "epoch": 5667} {"train_loss": -27.398462295532227, "global_step": 470410, "epoch": 5667} {"train_loss": -27.16253089904785, "global_step": 470411, "epoch": 5667} {"train_loss": -27.5220890045166, "global_step": 470412, "epoch": 5667} {"train_loss": -27.514789581298828, "global_step": 470413, "epoch": 5667} {"train_loss": -27.412582397460938, "global_step": 470414, "epoch": 5667} {"train_loss": -26.826374053955078, "global_step": 470415, "epoch": 5667} {"train_loss": -27.007776260375977, "global_step": 470416, "epoch": 5667} {"train_loss": -27.21087074279785, "global_step": 470417, "epoch": 5667} {"train_loss": -27.226490020751953, "global_step": 470418, "epoch": 5667} {"train_loss": -26.9227237701416, "global_step": 470419, "epoch": 5667} {"train_loss": -27.372766494750977, "global_step": 470420, "epoch": 5667} {"train_loss": -27.40631675720215, "global_step": 470421, "epoch": 5667} {"train_loss": -27.358625411987305, "global_step": 470422, "epoch": 5667} {"train_loss": -27.360212326049805, "global_step": 470423, "epoch": 5667} {"train_loss": -27.373443603515625, "global_step": 470424, "epoch": 5667} {"train_loss": -27.10455894470215, "global_step": 470425, "epoch": 5667} {"train_loss": -27.078876495361328, "global_step": 470426, "epoch": 5667} {"train_loss": -27.501935958862305, "global_step": 470427, "epoch": 5667} {"train_loss": -27.54549217224121, "global_step": 470428, "epoch": 5667} {"train_loss": -27.2735595703125, "global_step": 470429, "epoch": 5667} {"train_loss": -27.286619186401367, "global_step": 470430, "epoch": 5667} {"train_loss": -27.135955810546875, "global_step": 470431, "epoch": 5667} {"train_loss": -27.3651065826416, "global_step": 470432, "epoch": 5667} {"train_loss": -27.141204833984375, "global_step": 470433, "epoch": 5667} {"train_loss": -26.920629501342773, "global_step": 470434, "epoch": 5667} {"train_loss": -27.22462272644043, "global_step": 470435, "epoch": 5667} {"train_loss": -27.255964279174805, "global_step": 470436, "epoch": 5667} {"train_loss": -27.469512939453125, "global_step": 470437, "epoch": 5667} {"train_loss": -27.177881240844727, "global_step": 470438, "epoch": 5667} {"train_loss": -26.773181915283203, "global_step": 470439, "epoch": 5667} {"train_loss": -26.949079513549805, "global_step": 470440, "epoch": 5667} {"train_loss": -26.828588485717773, "global_step": 470441, "epoch": 5667} {"train_loss": -27.159107208251953, "global_step": 470442, "epoch": 5667} {"train_loss": -26.99870794365205, "global_step": 470443, "epoch": 5667, "val_loss": 6740890.5} {"train_loss": -26.463537216186523, "global_step": 470444, "epoch": 5668} {"train_loss": -26.24420166015625, "global_step": 470445, "epoch": 5668} {"train_loss": -26.103626251220703, "global_step": 470446, "epoch": 5668} {"train_loss": -27.218957901000977, "global_step": 470447, "epoch": 5668} {"train_loss": -26.619354248046875, "global_step": 470448, "epoch": 5668} {"train_loss": -26.843351364135742, "global_step": 470449, "epoch": 5668} {"train_loss": -27.180578231811523, "global_step": 470450, "epoch": 5668} {"train_loss": -26.187305450439453, "global_step": 470451, "epoch": 5668} {"train_loss": -26.894821166992188, "global_step": 470452, "epoch": 5668} {"train_loss": -27.14121437072754, "global_step": 470453, "epoch": 5668} {"train_loss": -27.047666549682617, "global_step": 470454, "epoch": 5668} {"train_loss": -27.359695434570312, "global_step": 470455, "epoch": 5668} {"train_loss": -26.739791870117188, "global_step": 470456, "epoch": 5668} {"train_loss": -26.683349609375, "global_step": 470457, "epoch": 5668} {"train_loss": -27.241474151611328, "global_step": 470458, "epoch": 5668} {"train_loss": -27.18568229675293, "global_step": 470459, "epoch": 5668} {"train_loss": -27.211139678955078, "global_step": 470460, "epoch": 5668} {"train_loss": -26.878652572631836, "global_step": 470461, "epoch": 5668} {"train_loss": -26.865873336791992, "global_step": 470462, "epoch": 5668} {"train_loss": -27.509647369384766, "global_step": 470463, "epoch": 5668} {"train_loss": -27.485074996948242, "global_step": 470464, "epoch": 5668} {"train_loss": -27.286697387695312, "global_step": 470465, "epoch": 5668} {"train_loss": -27.252044677734375, "global_step": 470466, "epoch": 5668} {"train_loss": -27.36737632751465, "global_step": 470467, "epoch": 5668} {"train_loss": -27.227386474609375, "global_step": 470468, "epoch": 5668} {"train_loss": -27.35304069519043, "global_step": 470469, "epoch": 5668} {"train_loss": -27.287805557250977, "global_step": 470470, "epoch": 5668} {"train_loss": -27.21109390258789, "global_step": 470471, "epoch": 5668} {"train_loss": -27.304672241210938, "global_step": 470472, "epoch": 5668} {"train_loss": -26.989023208618164, "global_step": 470473, "epoch": 5668} {"train_loss": -27.052112579345703, "global_step": 470474, "epoch": 5668} {"train_loss": -27.183673858642578, "global_step": 470475, "epoch": 5668} {"train_loss": -27.110340118408203, "global_step": 470476, "epoch": 5668} {"train_loss": -27.02958106994629, "global_step": 470477, "epoch": 5668} {"train_loss": -26.832738876342773, "global_step": 470478, "epoch": 5668} {"train_loss": -27.4180965423584, "global_step": 470479, "epoch": 5668} {"train_loss": -27.643402099609375, "global_step": 470480, "epoch": 5668} {"train_loss": -27.036245346069336, "global_step": 470481, "epoch": 5668} {"train_loss": -27.15998649597168, "global_step": 470482, "epoch": 5668} {"train_loss": -27.21803092956543, "global_step": 470483, "epoch": 5668} {"train_loss": -27.487945556640625, "global_step": 470484, "epoch": 5668} {"train_loss": -27.26055908203125, "global_step": 470485, "epoch": 5668} {"train_loss": -27.485565185546875, "global_step": 470486, "epoch": 5668} {"train_loss": -27.559728622436523, "global_step": 470487, "epoch": 5668} {"train_loss": -27.337858200073242, "global_step": 470488, "epoch": 5668} {"train_loss": -27.644947052001953, "global_step": 470489, "epoch": 5668} {"train_loss": -27.547895431518555, "global_step": 470490, "epoch": 5668} {"train_loss": -27.354324340820312, "global_step": 470491, "epoch": 5668} {"train_loss": -27.311872482299805, "global_step": 470492, "epoch": 5668} {"train_loss": -27.276273727416992, "global_step": 470493, "epoch": 5668} {"train_loss": -27.509016036987305, "global_step": 470494, "epoch": 5668} {"train_loss": -27.36273193359375, "global_step": 470495, "epoch": 5668} {"train_loss": -27.177814483642578, "global_step": 470496, "epoch": 5668} {"train_loss": -27.18422508239746, "global_step": 470497, "epoch": 5668} {"train_loss": -27.367130279541016, "global_step": 470498, "epoch": 5668} {"train_loss": -27.193395614624023, "global_step": 470499, "epoch": 5668} {"train_loss": -27.53285026550293, "global_step": 470500, "epoch": 5668} {"train_loss": -27.284040451049805, "global_step": 470501, "epoch": 5668} {"train_loss": -27.179723739624023, "global_step": 470502, "epoch": 5668} {"train_loss": -27.549570083618164, "global_step": 470503, "epoch": 5668} {"train_loss": -27.323556900024414, "global_step": 470504, "epoch": 5668} {"train_loss": -27.378637313842773, "global_step": 470505, "epoch": 5668} {"train_loss": -26.527013778686523, "global_step": 470506, "epoch": 5668} {"train_loss": -26.807693481445312, "global_step": 470507, "epoch": 5668} {"train_loss": -27.071090698242188, "global_step": 470508, "epoch": 5668} {"train_loss": -27.1943302154541, "global_step": 470509, "epoch": 5668} {"train_loss": -27.23957633972168, "global_step": 470510, "epoch": 5668} {"train_loss": -27.543094635009766, "global_step": 470511, "epoch": 5668} {"train_loss": -27.596948623657227, "global_step": 470512, "epoch": 5668} {"train_loss": -26.81174087524414, "global_step": 470513, "epoch": 5668} {"train_loss": -27.2436466217041, "global_step": 470514, "epoch": 5668} {"train_loss": -26.58265495300293, "global_step": 470515, "epoch": 5668} {"train_loss": -26.971271514892578, "global_step": 470516, "epoch": 5668} {"train_loss": -27.060815811157227, "global_step": 470517, "epoch": 5668} {"train_loss": -27.257720947265625, "global_step": 470518, "epoch": 5668} {"train_loss": -26.70502281188965, "global_step": 470519, "epoch": 5668} {"train_loss": -26.8037052154541, "global_step": 470520, "epoch": 5668} {"train_loss": -27.192306518554688, "global_step": 470521, "epoch": 5668} {"train_loss": -26.88058853149414, "global_step": 470522, "epoch": 5668} {"train_loss": -26.956485748291016, "global_step": 470523, "epoch": 5668} {"train_loss": -27.025156021118164, "global_step": 470524, "epoch": 5668} {"train_loss": -27.052520751953125, "global_step": 470525, "epoch": 5668} {"train_loss": -27.11784369687, "global_step": 470526, "epoch": 5668, "val_loss": 6649137.0} {"train_loss": -26.103437423706055, "global_step": 470527, "epoch": 5669} {"train_loss": -25.704587936401367, "global_step": 470528, "epoch": 5669} {"train_loss": -26.482389450073242, "global_step": 470529, "epoch": 5669} {"train_loss": -25.46551513671875, "global_step": 470530, "epoch": 5669} {"train_loss": -26.43726921081543, "global_step": 470531, "epoch": 5669} {"train_loss": -25.692840576171875, "global_step": 470532, "epoch": 5669} {"train_loss": -26.551151275634766, "global_step": 470533, "epoch": 5669} {"train_loss": -26.42474937438965, "global_step": 470534, "epoch": 5669} {"train_loss": -26.33196449279785, "global_step": 470535, "epoch": 5669} {"train_loss": -26.476530075073242, "global_step": 470536, "epoch": 5669} {"train_loss": -27.001867294311523, "global_step": 470537, "epoch": 5669} {"train_loss": -26.630762100219727, "global_step": 470538, "epoch": 5669} {"train_loss": -26.765607833862305, "global_step": 470539, "epoch": 5669} {"train_loss": -26.46210289001465, "global_step": 470540, "epoch": 5669} {"train_loss": -26.433496475219727, "global_step": 470541, "epoch": 5669} {"train_loss": -26.88874626159668, "global_step": 470542, "epoch": 5669} {"train_loss": -26.8516788482666, "global_step": 470543, "epoch": 5669} {"train_loss": -26.767658233642578, "global_step": 470544, "epoch": 5669} {"train_loss": -26.48137855529785, "global_step": 470545, "epoch": 5669} {"train_loss": -26.942163467407227, "global_step": 470546, "epoch": 5669} {"train_loss": -26.81715202331543, "global_step": 470547, "epoch": 5669} {"train_loss": -27.00504493713379, "global_step": 470548, "epoch": 5669} {"train_loss": -27.397964477539062, "global_step": 470549, "epoch": 5669} {"train_loss": -26.67864418029785, "global_step": 470550, "epoch": 5669} {"train_loss": -26.778730392456055, "global_step": 470551, "epoch": 5669} {"train_loss": -27.377002716064453, "global_step": 470552, "epoch": 5669} {"train_loss": -27.184951782226562, "global_step": 470553, "epoch": 5669} {"train_loss": -27.030242919921875, "global_step": 470554, "epoch": 5669} {"train_loss": -26.738264083862305, "global_step": 470555, "epoch": 5669} {"train_loss": -27.165393829345703, "global_step": 470556, "epoch": 5669} {"train_loss": -27.27728843688965, "global_step": 470557, "epoch": 5669} {"train_loss": -27.192230224609375, "global_step": 470558, "epoch": 5669} {"train_loss": -26.83087158203125, "global_step": 470559, "epoch": 5669} {"train_loss": -26.986753463745117, "global_step": 470560, "epoch": 5669} {"train_loss": -27.433242797851562, "global_step": 470561, "epoch": 5669} {"train_loss": -26.89214515686035, "global_step": 470562, "epoch": 5669} {"train_loss": -27.10767936706543, "global_step": 470563, "epoch": 5669} {"train_loss": -27.111196517944336, "global_step": 470564, "epoch": 5669} {"train_loss": -27.030881881713867, "global_step": 470565, "epoch": 5669} {"train_loss": -27.417282104492188, "global_step": 470566, "epoch": 5669} {"train_loss": -27.270078659057617, "global_step": 470567, "epoch": 5669} {"train_loss": -26.9442195892334, "global_step": 470568, "epoch": 5669} {"train_loss": -27.376096725463867, "global_step": 470569, "epoch": 5669} {"train_loss": -27.06574821472168, "global_step": 470570, "epoch": 5669} {"train_loss": -27.22488784790039, "global_step": 470571, "epoch": 5669} {"train_loss": -27.23992919921875, "global_step": 470572, "epoch": 5669} {"train_loss": -27.157638549804688, "global_step": 470573, "epoch": 5669} {"train_loss": -27.43580436706543, "global_step": 470574, "epoch": 5669} {"train_loss": -27.31244468688965, "global_step": 470575, "epoch": 5669} {"train_loss": -27.296741485595703, "global_step": 470576, "epoch": 5669} {"train_loss": -27.011747360229492, "global_step": 470577, "epoch": 5669} {"train_loss": -27.142120361328125, "global_step": 470578, "epoch": 5669} {"train_loss": -27.245359420776367, "global_step": 470579, "epoch": 5669} {"train_loss": -26.917734146118164, "global_step": 470580, "epoch": 5669} {"train_loss": -27.350116729736328, "global_step": 470581, "epoch": 5669} {"train_loss": -27.18330955505371, "global_step": 470582, "epoch": 5669} {"train_loss": -27.288166046142578, "global_step": 470583, "epoch": 5669} {"train_loss": -27.130346298217773, "global_step": 470584, "epoch": 5669} {"train_loss": -27.422592163085938, "global_step": 470585, "epoch": 5669} {"train_loss": -27.36004638671875, "global_step": 470586, "epoch": 5669} {"train_loss": -27.274494171142578, "global_step": 470587, "epoch": 5669} {"train_loss": -27.3830509185791, "global_step": 470588, "epoch": 5669} {"train_loss": -27.27151870727539, "global_step": 470589, "epoch": 5669} {"train_loss": -27.493188858032227, "global_step": 470590, "epoch": 5669} {"train_loss": -27.243179321289062, "global_step": 470591, "epoch": 5669} {"train_loss": -27.2722110748291, "global_step": 470592, "epoch": 5669} {"train_loss": -27.47397232055664, "global_step": 470593, "epoch": 5669} {"train_loss": -27.532907485961914, "global_step": 470594, "epoch": 5669} {"train_loss": -27.052127838134766, "global_step": 470595, "epoch": 5669} {"train_loss": -27.417577743530273, "global_step": 470596, "epoch": 5669} {"train_loss": -27.391626358032227, "global_step": 470597, "epoch": 5669} {"train_loss": -27.48179054260254, "global_step": 470598, "epoch": 5669} {"train_loss": -27.245508193969727, "global_step": 470599, "epoch": 5669} {"train_loss": -27.092954635620117, "global_step": 470600, "epoch": 5669} {"train_loss": -27.331892013549805, "global_step": 470601, "epoch": 5669} {"train_loss": -27.620691299438477, "global_step": 470602, "epoch": 5669} {"train_loss": -27.373388290405273, "global_step": 470603, "epoch": 5669} {"train_loss": -27.29170036315918, "global_step": 470604, "epoch": 5669} {"train_loss": -27.200963973999023, "global_step": 470605, "epoch": 5669} {"train_loss": -27.2078914642334, "global_step": 470606, "epoch": 5669} {"train_loss": -27.206863403320312, "global_step": 470607, "epoch": 5669} {"train_loss": -27.25311279296875, "global_step": 470608, "epoch": 5669} {"train_loss": -27.02735307992223, "global_step": 470609, "epoch": 5669, "val_loss": 6740718.0} {"train_loss": -26.540403366088867, "global_step": 470610, "epoch": 5670} {"train_loss": -26.38155174255371, "global_step": 470611, "epoch": 5670} {"train_loss": -25.689626693725586, "global_step": 470612, "epoch": 5670} {"train_loss": -25.546918869018555, "global_step": 470613, "epoch": 5670} {"train_loss": -25.8848819732666, "global_step": 470614, "epoch": 5670} {"train_loss": -26.78498649597168, "global_step": 470615, "epoch": 5670} {"train_loss": -27.02001953125, "global_step": 470616, "epoch": 5670} {"train_loss": -26.68621253967285, "global_step": 470617, "epoch": 5670} {"train_loss": -26.650897979736328, "global_step": 470618, "epoch": 5670} {"train_loss": -27.108963012695312, "global_step": 470619, "epoch": 5670} {"train_loss": -26.4096622467041, "global_step": 470620, "epoch": 5670} {"train_loss": -26.93958854675293, "global_step": 470621, "epoch": 5670} {"train_loss": -27.153839111328125, "global_step": 470622, "epoch": 5670} {"train_loss": -26.92799949645996, "global_step": 470623, "epoch": 5670} {"train_loss": -26.902191162109375, "global_step": 470624, "epoch": 5670} {"train_loss": -27.09869956970215, "global_step": 470625, "epoch": 5670} {"train_loss": -27.072011947631836, "global_step": 470626, "epoch": 5670} {"train_loss": -26.95794105529785, "global_step": 470627, "epoch": 5670} {"train_loss": -27.306318283081055, "global_step": 470628, "epoch": 5670} {"train_loss": -27.038732528686523, "global_step": 470629, "epoch": 5670} {"train_loss": -26.717451095581055, "global_step": 470630, "epoch": 5670} {"train_loss": -27.136701583862305, "global_step": 470631, "epoch": 5670} {"train_loss": -27.136356353759766, "global_step": 470632, "epoch": 5670} {"train_loss": -27.115507125854492, "global_step": 470633, "epoch": 5670} {"train_loss": -27.14594841003418, "global_step": 470634, "epoch": 5670} {"train_loss": -27.14521598815918, "global_step": 470635, "epoch": 5670} {"train_loss": -26.945627212524414, "global_step": 470636, "epoch": 5670} {"train_loss": -27.02984046936035, "global_step": 470637, "epoch": 5670} {"train_loss": -27.263065338134766, "global_step": 470638, "epoch": 5670} {"train_loss": -27.421802520751953, "global_step": 470639, "epoch": 5670} {"train_loss": -27.390485763549805, "global_step": 470640, "epoch": 5670} {"train_loss": -26.936124801635742, "global_step": 470641, "epoch": 5670} {"train_loss": -27.166173934936523, "global_step": 470642, "epoch": 5670} {"train_loss": -27.400318145751953, "global_step": 470643, "epoch": 5670} {"train_loss": -27.129425048828125, "global_step": 470644, "epoch": 5670} {"train_loss": -27.760852813720703, "global_step": 470645, "epoch": 5670} {"train_loss": -27.464990615844727, "global_step": 470646, "epoch": 5670} {"train_loss": -27.037504196166992, "global_step": 470647, "epoch": 5670} {"train_loss": -27.326251983642578, "global_step": 470648, "epoch": 5670} {"train_loss": -27.202051162719727, "global_step": 470649, "epoch": 5670} {"train_loss": -27.2518367767334, "global_step": 470650, "epoch": 5670} {"train_loss": -27.557538986206055, "global_step": 470651, "epoch": 5670} {"train_loss": -27.2324275970459, "global_step": 470652, "epoch": 5670} {"train_loss": -27.23084831237793, "global_step": 470653, "epoch": 5670} {"train_loss": -27.118900299072266, "global_step": 470654, "epoch": 5670} {"train_loss": -27.204675674438477, "global_step": 470655, "epoch": 5670} {"train_loss": -27.409814834594727, "global_step": 470656, "epoch": 5670} {"train_loss": -27.2244873046875, "global_step": 470657, "epoch": 5670} {"train_loss": -27.043012619018555, "global_step": 470658, "epoch": 5670} {"train_loss": -26.670072555541992, "global_step": 470659, "epoch": 5670} {"train_loss": -27.286054611206055, "global_step": 470660, "epoch": 5670} {"train_loss": -27.41000747680664, "global_step": 470661, "epoch": 5670} {"train_loss": -26.96484375, "global_step": 470662, "epoch": 5670} {"train_loss": -26.392786026000977, "global_step": 470663, "epoch": 5670} {"train_loss": -26.40822410583496, "global_step": 470664, "epoch": 5670} {"train_loss": -26.92475700378418, "global_step": 470665, "epoch": 5670} {"train_loss": -27.362350463867188, "global_step": 470666, "epoch": 5670} {"train_loss": -27.140182495117188, "global_step": 470667, "epoch": 5670} {"train_loss": -26.570661544799805, "global_step": 470668, "epoch": 5670} {"train_loss": -27.29544448852539, "global_step": 470669, "epoch": 5670} {"train_loss": -26.65229606628418, "global_step": 470670, "epoch": 5670} {"train_loss": -27.550352096557617, "global_step": 470671, "epoch": 5670} {"train_loss": -27.178354263305664, "global_step": 470672, "epoch": 5670} {"train_loss": -27.364505767822266, "global_step": 470673, "epoch": 5670} {"train_loss": -27.605731964111328, "global_step": 470674, "epoch": 5670} {"train_loss": -27.239099502563477, "global_step": 470675, "epoch": 5670} {"train_loss": -27.2933349609375, "global_step": 470676, "epoch": 5670} {"train_loss": -26.988433837890625, "global_step": 470677, "epoch": 5670} {"train_loss": -27.213056564331055, "global_step": 470678, "epoch": 5670} {"train_loss": -27.094404220581055, "global_step": 470679, "epoch": 5670} {"train_loss": -27.264135360717773, "global_step": 470680, "epoch": 5670} {"train_loss": -27.451812744140625, "global_step": 470681, "epoch": 5670} {"train_loss": -27.142698287963867, "global_step": 470682, "epoch": 5670} {"train_loss": -27.440229415893555, "global_step": 470683, "epoch": 5670} {"train_loss": -27.162580490112305, "global_step": 470684, "epoch": 5670} {"train_loss": -27.326833724975586, "global_step": 470685, "epoch": 5670} {"train_loss": -27.073530197143555, "global_step": 470686, "epoch": 5670} {"train_loss": -27.381811141967773, "global_step": 470687, "epoch": 5670} {"train_loss": -26.7432861328125, "global_step": 470688, "epoch": 5670} {"train_loss": -27.240270614624023, "global_step": 470689, "epoch": 5670} {"train_loss": -27.3428955078125, "global_step": 470690, "epoch": 5670} {"train_loss": -27.212614059448242, "global_step": 470691, "epoch": 5670} {"train_loss": -27.06908692509295, "global_step": 470692, "epoch": 5670, "val_loss": 6684608.0} {"train_loss": -26.712696075439453, "global_step": 470693, "epoch": 5671} {"train_loss": -25.88822364807129, "global_step": 470694, "epoch": 5671} {"train_loss": -25.104150772094727, "global_step": 470695, "epoch": 5671} {"train_loss": -26.093347549438477, "global_step": 470696, "epoch": 5671} {"train_loss": -26.69867515563965, "global_step": 470697, "epoch": 5671} {"train_loss": -26.1651554107666, "global_step": 470698, "epoch": 5671} {"train_loss": -26.6622314453125, "global_step": 470699, "epoch": 5671} {"train_loss": -26.577014923095703, "global_step": 470700, "epoch": 5671} {"train_loss": -26.42329216003418, "global_step": 470701, "epoch": 5671} {"train_loss": -26.69874382019043, "global_step": 470702, "epoch": 5671} {"train_loss": -26.62192726135254, "global_step": 470703, "epoch": 5671} {"train_loss": -27.116735458374023, "global_step": 470704, "epoch": 5671} {"train_loss": -26.728219985961914, "global_step": 470705, "epoch": 5671} {"train_loss": -26.62247085571289, "global_step": 470706, "epoch": 5671} {"train_loss": -26.55775260925293, "global_step": 470707, "epoch": 5671} {"train_loss": -26.547574996948242, "global_step": 470708, "epoch": 5671} {"train_loss": -26.541339874267578, "global_step": 470709, "epoch": 5671} {"train_loss": -26.931838989257812, "global_step": 470710, "epoch": 5671} {"train_loss": -26.660266876220703, "global_step": 470711, "epoch": 5671} {"train_loss": -27.3043155670166, "global_step": 470712, "epoch": 5671} {"train_loss": -27.213104248046875, "global_step": 470713, "epoch": 5671} {"train_loss": -26.788198471069336, "global_step": 470714, "epoch": 5671} {"train_loss": -26.784467697143555, "global_step": 470715, "epoch": 5671} {"train_loss": -26.99849510192871, "global_step": 470716, "epoch": 5671} {"train_loss": -27.207839965820312, "global_step": 470717, "epoch": 5671} {"train_loss": -26.546615600585938, "global_step": 470718, "epoch": 5671} {"train_loss": -26.67911148071289, "global_step": 470719, "epoch": 5671} {"train_loss": -26.86246109008789, "global_step": 470720, "epoch": 5671} {"train_loss": -26.97779655456543, "global_step": 470721, "epoch": 5671} {"train_loss": -26.841230392456055, "global_step": 470722, "epoch": 5671} {"train_loss": -27.248340606689453, "global_step": 470723, "epoch": 5671} {"train_loss": -27.107221603393555, "global_step": 470724, "epoch": 5671} {"train_loss": -26.96445083618164, "global_step": 470725, "epoch": 5671} {"train_loss": -27.415395736694336, "global_step": 470726, "epoch": 5671} {"train_loss": -27.3137149810791, "global_step": 470727, "epoch": 5671} {"train_loss": -27.173126220703125, "global_step": 470728, "epoch": 5671} {"train_loss": -27.3099422454834, "global_step": 470729, "epoch": 5671} {"train_loss": -27.074426651000977, "global_step": 470730, "epoch": 5671} {"train_loss": -27.213605880737305, "global_step": 470731, "epoch": 5671} {"train_loss": -27.287702560424805, "global_step": 470732, "epoch": 5671} {"train_loss": -27.34791374206543, "global_step": 470733, "epoch": 5671} {"train_loss": -27.3630313873291, "global_step": 470734, "epoch": 5671} {"train_loss": -27.20849609375, "global_step": 470735, "epoch": 5671} {"train_loss": -26.994043350219727, "global_step": 470736, "epoch": 5671} {"train_loss": -27.35761070251465, "global_step": 470737, "epoch": 5671} {"train_loss": -27.24407958984375, "global_step": 470738, "epoch": 5671} {"train_loss": -26.85590171813965, "global_step": 470739, "epoch": 5671} {"train_loss": -27.59644889831543, "global_step": 470740, "epoch": 5671} {"train_loss": -27.274282455444336, "global_step": 470741, "epoch": 5671} {"train_loss": -27.321258544921875, "global_step": 470742, "epoch": 5671} {"train_loss": -26.9457950592041, "global_step": 470743, "epoch": 5671} {"train_loss": -27.057464599609375, "global_step": 470744, "epoch": 5671} {"train_loss": -27.105060577392578, "global_step": 470745, "epoch": 5671} {"train_loss": -27.396512985229492, "global_step": 470746, "epoch": 5671} {"train_loss": -27.360218048095703, "global_step": 470747, "epoch": 5671} {"train_loss": -27.362897872924805, "global_step": 470748, "epoch": 5671} {"train_loss": -27.2916259765625, "global_step": 470749, "epoch": 5671} {"train_loss": -27.494953155517578, "global_step": 470750, "epoch": 5671} {"train_loss": -27.191497802734375, "global_step": 470751, "epoch": 5671} {"train_loss": -27.428823471069336, "global_step": 470752, "epoch": 5671} {"train_loss": -27.216690063476562, "global_step": 470753, "epoch": 5671} {"train_loss": -27.60481834411621, "global_step": 470754, "epoch": 5671} {"train_loss": -27.05890464782715, "global_step": 470755, "epoch": 5671} {"train_loss": -27.509174346923828, "global_step": 470756, "epoch": 5671} {"train_loss": -27.38486099243164, "global_step": 470757, "epoch": 5671} {"train_loss": -27.732709884643555, "global_step": 470758, "epoch": 5671} {"train_loss": -27.08331871032715, "global_step": 470759, "epoch": 5671} {"train_loss": -27.56581687927246, "global_step": 470760, "epoch": 5671} {"train_loss": -27.49309730529785, "global_step": 470761, "epoch": 5671} {"train_loss": -27.206745147705078, "global_step": 470762, "epoch": 5671} {"train_loss": -27.253131866455078, "global_step": 470763, "epoch": 5671} {"train_loss": -27.060842514038086, "global_step": 470764, "epoch": 5671} {"train_loss": -26.82574462890625, "global_step": 470765, "epoch": 5671} {"train_loss": -26.502988815307617, "global_step": 470766, "epoch": 5671} {"train_loss": -26.588300704956055, "global_step": 470767, "epoch": 5671} {"train_loss": -26.170873641967773, "global_step": 470768, "epoch": 5671} {"train_loss": -26.800750732421875, "global_step": 470769, "epoch": 5671} {"train_loss": -27.051252365112305, "global_step": 470770, "epoch": 5671} {"train_loss": -26.45145034790039, "global_step": 470771, "epoch": 5671} {"train_loss": -26.881956100463867, "global_step": 470772, "epoch": 5671} {"train_loss": -26.841938018798828, "global_step": 470773, "epoch": 5671} {"train_loss": -27.087711334228516, "global_step": 470774, "epoch": 5671} {"train_loss": -26.98083162882242, "global_step": 470775, "epoch": 5671, "val_loss": 6752068.5} {"train_loss": -26.565174102783203, "global_step": 470776, "epoch": 5672} {"train_loss": -26.581918716430664, "global_step": 470777, "epoch": 5672} {"train_loss": -26.45119285583496, "global_step": 470778, "epoch": 5672} {"train_loss": -26.417282104492188, "global_step": 470779, "epoch": 5672} {"train_loss": -26.978071212768555, "global_step": 470780, "epoch": 5672} {"train_loss": -26.374603271484375, "global_step": 470781, "epoch": 5672} {"train_loss": -26.69428825378418, "global_step": 470782, "epoch": 5672} {"train_loss": -26.668806076049805, "global_step": 470783, "epoch": 5672} {"train_loss": -26.308029174804688, "global_step": 470784, "epoch": 5672} {"train_loss": -26.389698028564453, "global_step": 470785, "epoch": 5672} {"train_loss": -26.62091636657715, "global_step": 470786, "epoch": 5672} {"train_loss": -26.543415069580078, "global_step": 470787, "epoch": 5672} {"train_loss": -26.915424346923828, "global_step": 470788, "epoch": 5672} {"train_loss": -26.822418212890625, "global_step": 470789, "epoch": 5672} {"train_loss": -26.751789093017578, "global_step": 470790, "epoch": 5672} {"train_loss": -27.013015747070312, "global_step": 470791, "epoch": 5672} {"train_loss": -26.92500114440918, "global_step": 470792, "epoch": 5672} {"train_loss": -27.1085147857666, "global_step": 470793, "epoch": 5672} {"train_loss": -27.069990158081055, "global_step": 470794, "epoch": 5672} {"train_loss": -27.128040313720703, "global_step": 470795, "epoch": 5672} {"train_loss": -27.08795166015625, "global_step": 470796, "epoch": 5672} {"train_loss": -26.9635009765625, "global_step": 470797, "epoch": 5672} {"train_loss": -26.97296714782715, "global_step": 470798, "epoch": 5672} {"train_loss": -27.3314266204834, "global_step": 470799, "epoch": 5672} {"train_loss": -27.549854278564453, "global_step": 470800, "epoch": 5672} {"train_loss": -27.183349609375, "global_step": 470801, "epoch": 5672} {"train_loss": -26.729736328125, "global_step": 470802, "epoch": 5672} {"train_loss": -27.089136123657227, "global_step": 470803, "epoch": 5672} {"train_loss": -27.409528732299805, "global_step": 470804, "epoch": 5672} {"train_loss": -26.818151473999023, "global_step": 470805, "epoch": 5672} {"train_loss": -27.351871490478516, "global_step": 470806, "epoch": 5672} {"train_loss": -27.024829864501953, "global_step": 470807, "epoch": 5672} {"train_loss": -27.30918312072754, "global_step": 470808, "epoch": 5672} {"train_loss": -27.34809684753418, "global_step": 470809, "epoch": 5672} {"train_loss": -27.300809860229492, "global_step": 470810, "epoch": 5672} {"train_loss": -27.292722702026367, "global_step": 470811, "epoch": 5672} {"train_loss": -27.46893310546875, "global_step": 470812, "epoch": 5672} {"train_loss": -27.287256240844727, "global_step": 470813, "epoch": 5672} {"train_loss": -27.297210693359375, "global_step": 470814, "epoch": 5672} {"train_loss": -27.20940589904785, "global_step": 470815, "epoch": 5672} {"train_loss": -27.074462890625, "global_step": 470816, "epoch": 5672} {"train_loss": -26.825647354125977, "global_step": 470817, "epoch": 5672} {"train_loss": -26.80388832092285, "global_step": 470818, "epoch": 5672} {"train_loss": -27.431318283081055, "global_step": 470819, "epoch": 5672} {"train_loss": -27.62567138671875, "global_step": 470820, "epoch": 5672} {"train_loss": -27.147199630737305, "global_step": 470821, "epoch": 5672} {"train_loss": -27.3192138671875, "global_step": 470822, "epoch": 5672} {"train_loss": -27.191741943359375, "global_step": 470823, "epoch": 5672} {"train_loss": -27.402013778686523, "global_step": 470824, "epoch": 5672} {"train_loss": -27.403467178344727, "global_step": 470825, "epoch": 5672} {"train_loss": -27.409692764282227, "global_step": 470826, "epoch": 5672} {"train_loss": -27.223834991455078, "global_step": 470827, "epoch": 5672} {"train_loss": -26.828332901000977, "global_step": 470828, "epoch": 5672} {"train_loss": -27.457477569580078, "global_step": 470829, "epoch": 5672} {"train_loss": -27.256067276000977, "global_step": 470830, "epoch": 5672} {"train_loss": -27.10625648498535, "global_step": 470831, "epoch": 5672} {"train_loss": -27.31476402282715, "global_step": 470832, "epoch": 5672} {"train_loss": -27.218585968017578, "global_step": 470833, "epoch": 5672} {"train_loss": -27.477582931518555, "global_step": 470834, "epoch": 5672} {"train_loss": -26.804981231689453, "global_step": 470835, "epoch": 5672} {"train_loss": -27.38404655456543, "global_step": 470836, "epoch": 5672} {"train_loss": -27.234060287475586, "global_step": 470837, "epoch": 5672} {"train_loss": -27.26470375061035, "global_step": 470838, "epoch": 5672} {"train_loss": -27.105762481689453, "global_step": 470839, "epoch": 5672} {"train_loss": -27.51752281188965, "global_step": 470840, "epoch": 5672} {"train_loss": -27.22894287109375, "global_step": 470841, "epoch": 5672} {"train_loss": -27.24366569519043, "global_step": 470842, "epoch": 5672} {"train_loss": -27.094587326049805, "global_step": 470843, "epoch": 5672} {"train_loss": -27.096494674682617, "global_step": 470844, "epoch": 5672} {"train_loss": -27.186023712158203, "global_step": 470845, "epoch": 5672} {"train_loss": -27.100629806518555, "global_step": 470846, "epoch": 5672} {"train_loss": -27.1800479888916, "global_step": 470847, "epoch": 5672} {"train_loss": -27.621475219726562, "global_step": 470848, "epoch": 5672} {"train_loss": -27.26508140563965, "global_step": 470849, "epoch": 5672} {"train_loss": -27.293781280517578, "global_step": 470850, "epoch": 5672} {"train_loss": -27.03350257873535, "global_step": 470851, "epoch": 5672} {"train_loss": -26.821643829345703, "global_step": 470852, "epoch": 5672} {"train_loss": -26.946197509765625, "global_step": 470853, "epoch": 5672} {"train_loss": -27.367551803588867, "global_step": 470854, "epoch": 5672} {"train_loss": -27.367319107055664, "global_step": 470855, "epoch": 5672} {"train_loss": -27.46833610534668, "global_step": 470856, "epoch": 5672} {"train_loss": -27.089893341064453, "global_step": 470857, "epoch": 5672} {"train_loss": -27.076980544860106, "global_step": 470858, "epoch": 5672, "val_loss": 6645182.5} {"train_loss": -26.6622257232666, "global_step": 470859, "epoch": 5673} {"train_loss": -26.39263916015625, "global_step": 470860, "epoch": 5673} {"train_loss": -26.76104736328125, "global_step": 470861, "epoch": 5673} {"train_loss": -26.9311466217041, "global_step": 470862, "epoch": 5673} {"train_loss": -27.37753677368164, "global_step": 470863, "epoch": 5673} {"train_loss": -26.76787757873535, "global_step": 470864, "epoch": 5673} {"train_loss": -27.317853927612305, "global_step": 470865, "epoch": 5673} {"train_loss": -26.836816787719727, "global_step": 470866, "epoch": 5673} {"train_loss": -27.356489181518555, "global_step": 470867, "epoch": 5673} {"train_loss": -26.761213302612305, "global_step": 470868, "epoch": 5673} {"train_loss": -26.59144401550293, "global_step": 470869, "epoch": 5673} {"train_loss": -26.95713233947754, "global_step": 470870, "epoch": 5673} {"train_loss": -27.31648063659668, "global_step": 470871, "epoch": 5673} {"train_loss": -27.027212142944336, "global_step": 470872, "epoch": 5673} {"train_loss": -26.898635864257812, "global_step": 470873, "epoch": 5673} {"train_loss": -27.152774810791016, "global_step": 470874, "epoch": 5673} {"train_loss": -27.281723022460938, "global_step": 470875, "epoch": 5673} {"train_loss": -27.130353927612305, "global_step": 470876, "epoch": 5673} {"train_loss": -26.744779586791992, "global_step": 470877, "epoch": 5673} {"train_loss": -27.264942169189453, "global_step": 470878, "epoch": 5673} {"train_loss": -27.063861846923828, "global_step": 470879, "epoch": 5673} {"train_loss": -27.01422691345215, "global_step": 470880, "epoch": 5673} {"train_loss": -27.02485466003418, "global_step": 470881, "epoch": 5673} {"train_loss": -27.23036766052246, "global_step": 470882, "epoch": 5673} {"train_loss": -26.92103385925293, "global_step": 470883, "epoch": 5673} {"train_loss": -27.091184616088867, "global_step": 470884, "epoch": 5673} {"train_loss": -27.042957305908203, "global_step": 470885, "epoch": 5673} {"train_loss": -27.090131759643555, "global_step": 470886, "epoch": 5673} {"train_loss": -27.1892147064209, "global_step": 470887, "epoch": 5673} {"train_loss": -26.83814811706543, "global_step": 470888, "epoch": 5673} {"train_loss": -27.094024658203125, "global_step": 470889, "epoch": 5673} {"train_loss": -26.930700302124023, "global_step": 470890, "epoch": 5673} {"train_loss": -27.526687622070312, "global_step": 470891, "epoch": 5673} {"train_loss": -27.161945343017578, "global_step": 470892, "epoch": 5673} {"train_loss": -27.555255889892578, "global_step": 470893, "epoch": 5673} {"train_loss": -27.684911727905273, "global_step": 470894, "epoch": 5673} {"train_loss": -27.45708656311035, "global_step": 470895, "epoch": 5673} {"train_loss": -27.21904945373535, "global_step": 470896, "epoch": 5673} {"train_loss": -27.092748641967773, "global_step": 470897, "epoch": 5673} {"train_loss": -27.754770278930664, "global_step": 470898, "epoch": 5673} {"train_loss": -27.370946884155273, "global_step": 470899, "epoch": 5673} {"train_loss": -27.28070640563965, "global_step": 470900, "epoch": 5673} {"train_loss": -27.3494815826416, "global_step": 470901, "epoch": 5673} {"train_loss": -26.902969360351562, "global_step": 470902, "epoch": 5673} {"train_loss": -26.202173233032227, "global_step": 470903, "epoch": 5673} {"train_loss": -26.245502471923828, "global_step": 470904, "epoch": 5673} {"train_loss": -27.089834213256836, "global_step": 470905, "epoch": 5673} {"train_loss": -27.203954696655273, "global_step": 470906, "epoch": 5673} {"train_loss": -26.666624069213867, "global_step": 470907, "epoch": 5673} {"train_loss": -27.191370010375977, "global_step": 470908, "epoch": 5673} {"train_loss": -27.014789581298828, "global_step": 470909, "epoch": 5673} {"train_loss": -27.315595626831055, "global_step": 470910, "epoch": 5673} {"train_loss": -27.255203247070312, "global_step": 470911, "epoch": 5673} {"train_loss": -27.181699752807617, "global_step": 470912, "epoch": 5673} {"train_loss": -27.01605796813965, "global_step": 470913, "epoch": 5673} {"train_loss": -27.376697540283203, "global_step": 470914, "epoch": 5673} {"train_loss": -27.151594161987305, "global_step": 470915, "epoch": 5673} {"train_loss": -26.99031639099121, "global_step": 470916, "epoch": 5673} {"train_loss": -27.23914909362793, "global_step": 470917, "epoch": 5673} {"train_loss": -27.013248443603516, "global_step": 470918, "epoch": 5673} {"train_loss": -27.202289581298828, "global_step": 470919, "epoch": 5673} {"train_loss": -26.885303497314453, "global_step": 470920, "epoch": 5673} {"train_loss": -26.742267608642578, "global_step": 470921, "epoch": 5673} {"train_loss": -27.096975326538086, "global_step": 470922, "epoch": 5673} {"train_loss": -26.79315757751465, "global_step": 470923, "epoch": 5673} {"train_loss": -26.979894638061523, "global_step": 470924, "epoch": 5673} {"train_loss": -27.0211238861084, "global_step": 470925, "epoch": 5673} {"train_loss": -27.015167236328125, "global_step": 470926, "epoch": 5673} {"train_loss": -26.532855987548828, "global_step": 470927, "epoch": 5673} {"train_loss": -26.63416862487793, "global_step": 470928, "epoch": 5673} {"train_loss": -25.986133575439453, "global_step": 470929, "epoch": 5673} {"train_loss": -25.74755859375, "global_step": 470930, "epoch": 5673} {"train_loss": -26.968463897705078, "global_step": 470931, "epoch": 5673} {"train_loss": -26.633350372314453, "global_step": 470932, "epoch": 5673} {"train_loss": -26.442228317260742, "global_step": 470933, "epoch": 5673} {"train_loss": -27.054309844970703, "global_step": 470934, "epoch": 5673} {"train_loss": -26.4164981842041, "global_step": 470935, "epoch": 5673} {"train_loss": -26.919225692749023, "global_step": 470936, "epoch": 5673} {"train_loss": -26.63226890563965, "global_step": 470937, "epoch": 5673} {"train_loss": -26.527746200561523, "global_step": 470938, "epoch": 5673} {"train_loss": -26.80283546447754, "global_step": 470939, "epoch": 5673} {"train_loss": -26.5118465423584, "global_step": 470940, "epoch": 5673} {"train_loss": -26.979465507599244, "global_step": 470941, "epoch": 5673, "val_loss": 6705722.0} {"train_loss": -26.426664352416992, "global_step": 470942, "epoch": 5674} {"train_loss": -26.473281860351562, "global_step": 470943, "epoch": 5674} {"train_loss": -26.2512149810791, "global_step": 470944, "epoch": 5674} {"train_loss": -26.56428337097168, "global_step": 470945, "epoch": 5674} {"train_loss": -26.481184005737305, "global_step": 470946, "epoch": 5674} {"train_loss": -25.874820709228516, "global_step": 470947, "epoch": 5674} {"train_loss": -26.50288963317871, "global_step": 470948, "epoch": 5674} {"train_loss": -25.319839477539062, "global_step": 470949, "epoch": 5674} {"train_loss": -26.281539916992188, "global_step": 470950, "epoch": 5674} {"train_loss": -26.457151412963867, "global_step": 470951, "epoch": 5674} {"train_loss": -26.07990074157715, "global_step": 470952, "epoch": 5674} {"train_loss": -26.428543090820312, "global_step": 470953, "epoch": 5674} {"train_loss": -26.490833282470703, "global_step": 470954, "epoch": 5674} {"train_loss": -26.590917587280273, "global_step": 470955, "epoch": 5674} {"train_loss": -26.90960121154785, "global_step": 470956, "epoch": 5674} {"train_loss": -26.538501739501953, "global_step": 470957, "epoch": 5674} {"train_loss": -26.60444450378418, "global_step": 470958, "epoch": 5674} {"train_loss": -26.59754753112793, "global_step": 470959, "epoch": 5674} {"train_loss": -26.716339111328125, "global_step": 470960, "epoch": 5674} {"train_loss": -26.9018497467041, "global_step": 470961, "epoch": 5674} {"train_loss": -26.632190704345703, "global_step": 470962, "epoch": 5674} {"train_loss": -26.552204132080078, "global_step": 470963, "epoch": 5674} {"train_loss": -26.77685546875, "global_step": 470964, "epoch": 5674} {"train_loss": -26.900848388671875, "global_step": 470965, "epoch": 5674} {"train_loss": -26.9066104888916, "global_step": 470966, "epoch": 5674} {"train_loss": -27.004364013671875, "global_step": 470967, "epoch": 5674} {"train_loss": -26.696842193603516, "global_step": 470968, "epoch": 5674} {"train_loss": -26.860504150390625, "global_step": 470969, "epoch": 5674} {"train_loss": -26.819889068603516, "global_step": 470970, "epoch": 5674} {"train_loss": -27.179767608642578, "global_step": 470971, "epoch": 5674} {"train_loss": -26.963638305664062, "global_step": 470972, "epoch": 5674} {"train_loss": -26.96115493774414, "global_step": 470973, "epoch": 5674} {"train_loss": -26.948383331298828, "global_step": 470974, "epoch": 5674} {"train_loss": -27.245223999023438, "global_step": 470975, "epoch": 5674} {"train_loss": -27.13534927368164, "global_step": 470976, "epoch": 5674} {"train_loss": -27.297149658203125, "global_step": 470977, "epoch": 5674} {"train_loss": -27.37346839904785, "global_step": 470978, "epoch": 5674} {"train_loss": -27.189306259155273, "global_step": 470979, "epoch": 5674} {"train_loss": -27.412748336791992, "global_step": 470980, "epoch": 5674} {"train_loss": -27.25406265258789, "global_step": 470981, "epoch": 5674} {"train_loss": -27.424671173095703, "global_step": 470982, "epoch": 5674} {"train_loss": -27.158536911010742, "global_step": 470983, "epoch": 5674} {"train_loss": -27.38568115234375, "global_step": 470984, "epoch": 5674} {"train_loss": -26.955915451049805, "global_step": 470985, "epoch": 5674} {"train_loss": -26.74625015258789, "global_step": 470986, "epoch": 5674} {"train_loss": -27.3507022857666, "global_step": 470987, "epoch": 5674} {"train_loss": -27.078596115112305, "global_step": 470988, "epoch": 5674} {"train_loss": -27.598913192749023, "global_step": 470989, "epoch": 5674} {"train_loss": -27.379047393798828, "global_step": 470990, "epoch": 5674} {"train_loss": -27.453718185424805, "global_step": 470991, "epoch": 5674} {"train_loss": -27.373794555664062, "global_step": 470992, "epoch": 5674} {"train_loss": -26.893705368041992, "global_step": 470993, "epoch": 5674} {"train_loss": -27.612035751342773, "global_step": 470994, "epoch": 5674} {"train_loss": -27.10733413696289, "global_step": 470995, "epoch": 5674} {"train_loss": -27.249845504760742, "global_step": 470996, "epoch": 5674} {"train_loss": -27.10647964477539, "global_step": 470997, "epoch": 5674} {"train_loss": -27.08046531677246, "global_step": 470998, "epoch": 5674} {"train_loss": -27.548791885375977, "global_step": 470999, "epoch": 5674} {"train_loss": -27.325910568237305, "global_step": 471000, "epoch": 5674} {"train_loss": -27.300769805908203, "global_step": 471001, "epoch": 5674} {"train_loss": -27.542743682861328, "global_step": 471002, "epoch": 5674} {"train_loss": -27.341882705688477, "global_step": 471003, "epoch": 5674} {"train_loss": -27.569665908813477, "global_step": 471004, "epoch": 5674} {"train_loss": -27.018802642822266, "global_step": 471005, "epoch": 5674} {"train_loss": -27.676477432250977, "global_step": 471006, "epoch": 5674} {"train_loss": -27.391498565673828, "global_step": 471007, "epoch": 5674} {"train_loss": -27.51372718811035, "global_step": 471008, "epoch": 5674} {"train_loss": -27.35371208190918, "global_step": 471009, "epoch": 5674} {"train_loss": -27.753082275390625, "global_step": 471010, "epoch": 5674} {"train_loss": -27.224695205688477, "global_step": 471011, "epoch": 5674} {"train_loss": -27.475767135620117, "global_step": 471012, "epoch": 5674} {"train_loss": -27.310504913330078, "global_step": 471013, "epoch": 5674} {"train_loss": -27.650671005249023, "global_step": 471014, "epoch": 5674} {"train_loss": -27.278791427612305, "global_step": 471015, "epoch": 5674} {"train_loss": -27.27874183654785, "global_step": 471016, "epoch": 5674} {"train_loss": -27.622486114501953, "global_step": 471017, "epoch": 5674} {"train_loss": -27.36566162109375, "global_step": 471018, "epoch": 5674} {"train_loss": -27.455188751220703, "global_step": 471019, "epoch": 5674} {"train_loss": -27.419401168823242, "global_step": 471020, "epoch": 5674} {"train_loss": -27.34394645690918, "global_step": 471021, "epoch": 5674} {"train_loss": -27.481414794921875, "global_step": 471022, "epoch": 5674} {"train_loss": -27.352985382080078, "global_step": 471023, "epoch": 5674} {"train_loss": -27.062808806637683, "global_step": 471024, "epoch": 5674, "val_loss": 6710717.0} {"train_loss": -26.544754028320312, "global_step": 471025, "epoch": 5675} {"train_loss": -26.4834041595459, "global_step": 471026, "epoch": 5675} {"train_loss": -26.826618194580078, "global_step": 471027, "epoch": 5675} {"train_loss": -26.53436279296875, "global_step": 471028, "epoch": 5675} {"train_loss": -26.703519821166992, "global_step": 471029, "epoch": 5675} {"train_loss": -26.68218421936035, "global_step": 471030, "epoch": 5675} {"train_loss": -26.77783203125, "global_step": 471031, "epoch": 5675} {"train_loss": -26.21109962463379, "global_step": 471032, "epoch": 5675} {"train_loss": -26.211505889892578, "global_step": 471033, "epoch": 5675} {"train_loss": -26.379169464111328, "global_step": 471034, "epoch": 5675} {"train_loss": -27.167306900024414, "global_step": 471035, "epoch": 5675} {"train_loss": -26.425588607788086, "global_step": 471036, "epoch": 5675} {"train_loss": -25.79140281677246, "global_step": 471037, "epoch": 5675} {"train_loss": -26.445066452026367, "global_step": 471038, "epoch": 5675} {"train_loss": -26.952890396118164, "global_step": 471039, "epoch": 5675} {"train_loss": -26.0974063873291, "global_step": 471040, "epoch": 5675} {"train_loss": -26.732711791992188, "global_step": 471041, "epoch": 5675} {"train_loss": -26.288599014282227, "global_step": 471042, "epoch": 5675} {"train_loss": -27.0129451751709, "global_step": 471043, "epoch": 5675} {"train_loss": -26.494464874267578, "global_step": 471044, "epoch": 5675} {"train_loss": -26.346343994140625, "global_step": 471045, "epoch": 5675} {"train_loss": -26.892805099487305, "global_step": 471046, "epoch": 5675} {"train_loss": -26.894983291625977, "global_step": 471047, "epoch": 5675} {"train_loss": -26.661863327026367, "global_step": 471048, "epoch": 5675} {"train_loss": -26.84271812438965, "global_step": 471049, "epoch": 5675} {"train_loss": -26.6320858001709, "global_step": 471050, "epoch": 5675} {"train_loss": -26.859546661376953, "global_step": 471051, "epoch": 5675} {"train_loss": -26.939054489135742, "global_step": 471052, "epoch": 5675} {"train_loss": -27.106201171875, "global_step": 471053, "epoch": 5675} {"train_loss": -27.0880069732666, "global_step": 471054, "epoch": 5675} {"train_loss": -26.675596237182617, "global_step": 471055, "epoch": 5675} {"train_loss": -26.98017692565918, "global_step": 471056, "epoch": 5675} {"train_loss": -27.0272216796875, "global_step": 471057, "epoch": 5675} {"train_loss": -26.599477767944336, "global_step": 471058, "epoch": 5675} {"train_loss": -26.87255859375, "global_step": 471059, "epoch": 5675} {"train_loss": -27.15309715270996, "global_step": 471060, "epoch": 5675} {"train_loss": -27.268503189086914, "global_step": 471061, "epoch": 5675} {"train_loss": -27.20016860961914, "global_step": 471062, "epoch": 5675} {"train_loss": -27.23170280456543, "global_step": 471063, "epoch": 5675} {"train_loss": -27.21967887878418, "global_step": 471064, "epoch": 5675} {"train_loss": -27.426855087280273, "global_step": 471065, "epoch": 5675} {"train_loss": -27.0031681060791, "global_step": 471066, "epoch": 5675} {"train_loss": -27.053348541259766, "global_step": 471067, "epoch": 5675} {"train_loss": -26.912220001220703, "global_step": 471068, "epoch": 5675} {"train_loss": -27.464536666870117, "global_step": 471069, "epoch": 5675} {"train_loss": -27.19510841369629, "global_step": 471070, "epoch": 5675} {"train_loss": -27.153432846069336, "global_step": 471071, "epoch": 5675} {"train_loss": -27.220844268798828, "global_step": 471072, "epoch": 5675} {"train_loss": -27.02469253540039, "global_step": 471073, "epoch": 5675} {"train_loss": -27.115005493164062, "global_step": 471074, "epoch": 5675} {"train_loss": -27.029508590698242, "global_step": 471075, "epoch": 5675} {"train_loss": -27.330041885375977, "global_step": 471076, "epoch": 5675} {"train_loss": -27.490514755249023, "global_step": 471077, "epoch": 5675} {"train_loss": -27.643259048461914, "global_step": 471078, "epoch": 5675} {"train_loss": -27.55974769592285, "global_step": 471079, "epoch": 5675} {"train_loss": -27.45246696472168, "global_step": 471080, "epoch": 5675} {"train_loss": -27.00831413269043, "global_step": 471081, "epoch": 5675} {"train_loss": -27.062902450561523, "global_step": 471082, "epoch": 5675} {"train_loss": -27.40247917175293, "global_step": 471083, "epoch": 5675} {"train_loss": -27.214981079101562, "global_step": 471084, "epoch": 5675} {"train_loss": -26.980024337768555, "global_step": 471085, "epoch": 5675} {"train_loss": -27.312946319580078, "global_step": 471086, "epoch": 5675} {"train_loss": -27.78643226623535, "global_step": 471087, "epoch": 5675} {"train_loss": -27.162994384765625, "global_step": 471088, "epoch": 5675} {"train_loss": -27.20931053161621, "global_step": 471089, "epoch": 5675} {"train_loss": -27.396747589111328, "global_step": 471090, "epoch": 5675} {"train_loss": -27.060068130493164, "global_step": 471091, "epoch": 5675} {"train_loss": -27.279254913330078, "global_step": 471092, "epoch": 5675} {"train_loss": -27.04288101196289, "global_step": 471093, "epoch": 5675} {"train_loss": -27.599872589111328, "global_step": 471094, "epoch": 5675} {"train_loss": -27.169214248657227, "global_step": 471095, "epoch": 5675} {"train_loss": -27.55159568786621, "global_step": 471096, "epoch": 5675} {"train_loss": -27.040771484375, "global_step": 471097, "epoch": 5675} {"train_loss": -27.163970947265625, "global_step": 471098, "epoch": 5675} {"train_loss": -27.38226318359375, "global_step": 471099, "epoch": 5675} {"train_loss": -26.725906372070312, "global_step": 471100, "epoch": 5675} {"train_loss": -27.48158073425293, "global_step": 471101, "epoch": 5675} {"train_loss": -27.280996322631836, "global_step": 471102, "epoch": 5675} {"train_loss": -27.382205963134766, "global_step": 471103, "epoch": 5675} {"train_loss": -27.781814575195312, "global_step": 471104, "epoch": 5675} {"train_loss": -27.75358009338379, "global_step": 471105, "epoch": 5675} {"train_loss": -27.483041763305664, "global_step": 471106, "epoch": 5675} {"train_loss": -27.029866115156427, "global_step": 471107, "epoch": 5675, "val_loss": 6796944.0} {"train_loss": -26.950183868408203, "global_step": 471108, "epoch": 5676} {"train_loss": -26.641874313354492, "global_step": 471109, "epoch": 5676} {"train_loss": -26.931415557861328, "global_step": 471110, "epoch": 5676} {"train_loss": -26.83393669128418, "global_step": 471111, "epoch": 5676} {"train_loss": -27.264799118041992, "global_step": 471112, "epoch": 5676} {"train_loss": -26.895910263061523, "global_step": 471113, "epoch": 5676} {"train_loss": -26.930221557617188, "global_step": 471114, "epoch": 5676} {"train_loss": -26.939661026000977, "global_step": 471115, "epoch": 5676} {"train_loss": -27.07268714904785, "global_step": 471116, "epoch": 5676} {"train_loss": -27.05584716796875, "global_step": 471117, "epoch": 5676} {"train_loss": -26.7415714263916, "global_step": 471118, "epoch": 5676} {"train_loss": -26.58929443359375, "global_step": 471119, "epoch": 5676} {"train_loss": -27.176496505737305, "global_step": 471120, "epoch": 5676} {"train_loss": -26.80757713317871, "global_step": 471121, "epoch": 5676} {"train_loss": -27.276086807250977, "global_step": 471122, "epoch": 5676} {"train_loss": -26.859479904174805, "global_step": 471123, "epoch": 5676} {"train_loss": -26.926977157592773, "global_step": 471124, "epoch": 5676} {"train_loss": -26.92168617248535, "global_step": 471125, "epoch": 5676} {"train_loss": -27.099592208862305, "global_step": 471126, "epoch": 5676} {"train_loss": -26.43967628479004, "global_step": 471127, "epoch": 5676} {"train_loss": -26.786680221557617, "global_step": 471128, "epoch": 5676} {"train_loss": -26.889419555664062, "global_step": 471129, "epoch": 5676} {"train_loss": -27.06373405456543, "global_step": 471130, "epoch": 5676} {"train_loss": -27.0255126953125, "global_step": 471131, "epoch": 5676} {"train_loss": -27.01417350769043, "global_step": 471132, "epoch": 5676} {"train_loss": -27.05879020690918, "global_step": 471133, "epoch": 5676} {"train_loss": -27.306140899658203, "global_step": 471134, "epoch": 5676} {"train_loss": -26.737823486328125, "global_step": 471135, "epoch": 5676} {"train_loss": -26.88678550720215, "global_step": 471136, "epoch": 5676} {"train_loss": -27.144058227539062, "global_step": 471137, "epoch": 5676} {"train_loss": -27.396026611328125, "global_step": 471138, "epoch": 5676} {"train_loss": -26.90667724609375, "global_step": 471139, "epoch": 5676} {"train_loss": -26.99904441833496, "global_step": 471140, "epoch": 5676} {"train_loss": -27.051513671875, "global_step": 471141, "epoch": 5676} {"train_loss": -27.031402587890625, "global_step": 471142, "epoch": 5676} {"train_loss": -27.3981876373291, "global_step": 471143, "epoch": 5676} {"train_loss": -27.164960861206055, "global_step": 471144, "epoch": 5676} {"train_loss": -27.45102882385254, "global_step": 471145, "epoch": 5676} {"train_loss": -27.192764282226562, "global_step": 471146, "epoch": 5676} {"train_loss": -27.53412437438965, "global_step": 471147, "epoch": 5676} {"train_loss": -27.20431900024414, "global_step": 471148, "epoch": 5676} {"train_loss": -27.055709838867188, "global_step": 471149, "epoch": 5676} {"train_loss": -27.26787757873535, "global_step": 471150, "epoch": 5676} {"train_loss": -27.185596466064453, "global_step": 471151, "epoch": 5676} {"train_loss": -27.21050453186035, "global_step": 471152, "epoch": 5676} {"train_loss": -27.110509872436523, "global_step": 471153, "epoch": 5676} {"train_loss": -27.22966957092285, "global_step": 471154, "epoch": 5676} {"train_loss": -27.331689834594727, "global_step": 471155, "epoch": 5676} {"train_loss": -27.35969352722168, "global_step": 471156, "epoch": 5676} {"train_loss": -27.243146896362305, "global_step": 471157, "epoch": 5676} {"train_loss": -27.080402374267578, "global_step": 471158, "epoch": 5676} {"train_loss": -27.316152572631836, "global_step": 471159, "epoch": 5676} {"train_loss": -26.979644775390625, "global_step": 471160, "epoch": 5676} {"train_loss": -26.87200927734375, "global_step": 471161, "epoch": 5676} {"train_loss": -26.851364135742188, "global_step": 471162, "epoch": 5676} {"train_loss": -26.589895248413086, "global_step": 471163, "epoch": 5676} {"train_loss": -26.8026180267334, "global_step": 471164, "epoch": 5676} {"train_loss": -26.965436935424805, "global_step": 471165, "epoch": 5676} {"train_loss": -26.848676681518555, "global_step": 471166, "epoch": 5676} {"train_loss": -27.558155059814453, "global_step": 471167, "epoch": 5676} {"train_loss": -27.363683700561523, "global_step": 471168, "epoch": 5676} {"train_loss": -27.292837142944336, "global_step": 471169, "epoch": 5676} {"train_loss": -27.127490997314453, "global_step": 471170, "epoch": 5676} {"train_loss": -26.96441650390625, "global_step": 471171, "epoch": 5676} {"train_loss": -27.484838485717773, "global_step": 471172, "epoch": 5676} {"train_loss": -27.035490036010742, "global_step": 471173, "epoch": 5676} {"train_loss": -27.343647003173828, "global_step": 471174, "epoch": 5676} {"train_loss": -27.253293991088867, "global_step": 471175, "epoch": 5676} {"train_loss": -27.189624786376953, "global_step": 471176, "epoch": 5676} {"train_loss": -27.149560928344727, "global_step": 471177, "epoch": 5676} {"train_loss": -27.216842651367188, "global_step": 471178, "epoch": 5676} {"train_loss": -27.24146842956543, "global_step": 471179, "epoch": 5676} {"train_loss": -26.939151763916016, "global_step": 471180, "epoch": 5676} {"train_loss": -27.448062896728516, "global_step": 471181, "epoch": 5676} {"train_loss": -27.266265869140625, "global_step": 471182, "epoch": 5676} {"train_loss": -27.165185928344727, "global_step": 471183, "epoch": 5676} {"train_loss": -27.4864501953125, "global_step": 471184, "epoch": 5676} {"train_loss": -27.43633460998535, "global_step": 471185, "epoch": 5676} {"train_loss": -27.350223541259766, "global_step": 471186, "epoch": 5676} {"train_loss": -27.489532470703125, "global_step": 471187, "epoch": 5676} {"train_loss": -27.1347599029541, "global_step": 471188, "epoch": 5676} {"train_loss": -27.412708282470703, "global_step": 471189, "epoch": 5676} {"train_loss": -27.103655780654357, "global_step": 471190, "epoch": 5676, "val_loss": 6691924.0} {"train_loss": -26.225086212158203, "global_step": 471191, "epoch": 5677} {"train_loss": -26.808258056640625, "global_step": 471192, "epoch": 5677} {"train_loss": -25.677154541015625, "global_step": 471193, "epoch": 5677} {"train_loss": -26.534595489501953, "global_step": 471194, "epoch": 5677} {"train_loss": -26.358007431030273, "global_step": 471195, "epoch": 5677} {"train_loss": -27.0900821685791, "global_step": 471196, "epoch": 5677} {"train_loss": -26.84170913696289, "global_step": 471197, "epoch": 5677} {"train_loss": -26.613880157470703, "global_step": 471198, "epoch": 5677} {"train_loss": -26.715585708618164, "global_step": 471199, "epoch": 5677} {"train_loss": -26.85702896118164, "global_step": 471200, "epoch": 5677} {"train_loss": -27.235937118530273, "global_step": 471201, "epoch": 5677} {"train_loss": -26.878774642944336, "global_step": 471202, "epoch": 5677} {"train_loss": -26.640125274658203, "global_step": 471203, "epoch": 5677} {"train_loss": -26.95088005065918, "global_step": 471204, "epoch": 5677} {"train_loss": -26.69434928894043, "global_step": 471205, "epoch": 5677} {"train_loss": -26.95118522644043, "global_step": 471206, "epoch": 5677} {"train_loss": -26.626264572143555, "global_step": 471207, "epoch": 5677} {"train_loss": -27.410919189453125, "global_step": 471208, "epoch": 5677} {"train_loss": -27.147275924682617, "global_step": 471209, "epoch": 5677} {"train_loss": -26.971704483032227, "global_step": 471210, "epoch": 5677} {"train_loss": -26.696258544921875, "global_step": 471211, "epoch": 5677} {"train_loss": -27.324142456054688, "global_step": 471212, "epoch": 5677} {"train_loss": -26.77459144592285, "global_step": 471213, "epoch": 5677} {"train_loss": -26.74625587463379, "global_step": 471214, "epoch": 5677} {"train_loss": -27.19986343383789, "global_step": 471215, "epoch": 5677} {"train_loss": -27.5074520111084, "global_step": 471216, "epoch": 5677} {"train_loss": -27.52985191345215, "global_step": 471217, "epoch": 5677} {"train_loss": -26.936447143554688, "global_step": 471218, "epoch": 5677} {"train_loss": -27.135913848876953, "global_step": 471219, "epoch": 5677} {"train_loss": -27.452411651611328, "global_step": 471220, "epoch": 5677} {"train_loss": -27.03126335144043, "global_step": 471221, "epoch": 5677} {"train_loss": -27.11256980895996, "global_step": 471222, "epoch": 5677} {"train_loss": -27.245126724243164, "global_step": 471223, "epoch": 5677} {"train_loss": -27.162824630737305, "global_step": 471224, "epoch": 5677} {"train_loss": -27.42291831970215, "global_step": 471225, "epoch": 5677} {"train_loss": -27.190841674804688, "global_step": 471226, "epoch": 5677} {"train_loss": -27.6981143951416, "global_step": 471227, "epoch": 5677} {"train_loss": -27.14051628112793, "global_step": 471228, "epoch": 5677} {"train_loss": -26.902023315429688, "global_step": 471229, "epoch": 5677} {"train_loss": -27.424718856811523, "global_step": 471230, "epoch": 5677} {"train_loss": -27.102109909057617, "global_step": 471231, "epoch": 5677} {"train_loss": -27.354047775268555, "global_step": 471232, "epoch": 5677} {"train_loss": -27.13404655456543, "global_step": 471233, "epoch": 5677} {"train_loss": -27.462844848632812, "global_step": 471234, "epoch": 5677} {"train_loss": -27.7188777923584, "global_step": 471235, "epoch": 5677} {"train_loss": -27.119714736938477, "global_step": 471236, "epoch": 5677} {"train_loss": -27.291296005249023, "global_step": 471237, "epoch": 5677} {"train_loss": -26.964996337890625, "global_step": 471238, "epoch": 5677} {"train_loss": -27.133085250854492, "global_step": 471239, "epoch": 5677} {"train_loss": -27.211685180664062, "global_step": 471240, "epoch": 5677} {"train_loss": -27.0830020904541, "global_step": 471241, "epoch": 5677} {"train_loss": -27.163633346557617, "global_step": 471242, "epoch": 5677} {"train_loss": -26.810712814331055, "global_step": 471243, "epoch": 5677} {"train_loss": -26.34467124938965, "global_step": 471244, "epoch": 5677} {"train_loss": -26.891681671142578, "global_step": 471245, "epoch": 5677} {"train_loss": -26.9617977142334, "global_step": 471246, "epoch": 5677} {"train_loss": -27.31256675720215, "global_step": 471247, "epoch": 5677} {"train_loss": -27.182342529296875, "global_step": 471248, "epoch": 5677} {"train_loss": -26.92963981628418, "global_step": 471249, "epoch": 5677} {"train_loss": -26.948949813842773, "global_step": 471250, "epoch": 5677} {"train_loss": -27.06817054748535, "global_step": 471251, "epoch": 5677} {"train_loss": -27.34247398376465, "global_step": 471252, "epoch": 5677} {"train_loss": -27.154455184936523, "global_step": 471253, "epoch": 5677} {"train_loss": -27.122983932495117, "global_step": 471254, "epoch": 5677} {"train_loss": -27.184051513671875, "global_step": 471255, "epoch": 5677} {"train_loss": -27.260587692260742, "global_step": 471256, "epoch": 5677} {"train_loss": -27.060117721557617, "global_step": 471257, "epoch": 5677} {"train_loss": -27.042051315307617, "global_step": 471258, "epoch": 5677} {"train_loss": -27.145490646362305, "global_step": 471259, "epoch": 5677} {"train_loss": -27.2003116607666, "global_step": 471260, "epoch": 5677} {"train_loss": -26.762451171875, "global_step": 471261, "epoch": 5677} {"train_loss": -27.28769302368164, "global_step": 471262, "epoch": 5677} {"train_loss": -27.387897491455078, "global_step": 471263, "epoch": 5677} {"train_loss": -26.996000289916992, "global_step": 471264, "epoch": 5677} {"train_loss": -27.17313003540039, "global_step": 471265, "epoch": 5677} {"train_loss": -27.261011123657227, "global_step": 471266, "epoch": 5677} {"train_loss": -27.692169189453125, "global_step": 471267, "epoch": 5677} {"train_loss": -27.623281478881836, "global_step": 471268, "epoch": 5677} {"train_loss": -27.476980209350586, "global_step": 471269, "epoch": 5677} {"train_loss": -27.229909896850586, "global_step": 471270, "epoch": 5677} {"train_loss": -27.650800704956055, "global_step": 471271, "epoch": 5677} {"train_loss": -27.259967803955078, "global_step": 471272, "epoch": 5677} {"train_loss": -27.068242544151214, "global_step": 471273, "epoch": 5677, "val_loss": 6740405.0} {"train_loss": -25.6411190032959, "global_step": 471274, "epoch": 5678} {"train_loss": -25.913816452026367, "global_step": 471275, "epoch": 5678} {"train_loss": -26.645416259765625, "global_step": 471276, "epoch": 5678} {"train_loss": -26.551620483398438, "global_step": 471277, "epoch": 5678} {"train_loss": -26.172317504882812, "global_step": 471278, "epoch": 5678} {"train_loss": -26.667144775390625, "global_step": 471279, "epoch": 5678} {"train_loss": -26.5483455657959, "global_step": 471280, "epoch": 5678} {"train_loss": -26.549108505249023, "global_step": 471281, "epoch": 5678} {"train_loss": -27.214147567749023, "global_step": 471282, "epoch": 5678} {"train_loss": -26.370410919189453, "global_step": 471283, "epoch": 5678} {"train_loss": -26.592105865478516, "global_step": 471284, "epoch": 5678} {"train_loss": -26.670156478881836, "global_step": 471285, "epoch": 5678} {"train_loss": -26.726470947265625, "global_step": 471286, "epoch": 5678} {"train_loss": -27.007709503173828, "global_step": 471287, "epoch": 5678} {"train_loss": -26.61561393737793, "global_step": 471288, "epoch": 5678} {"train_loss": -26.854379653930664, "global_step": 471289, "epoch": 5678} {"train_loss": -26.68158531188965, "global_step": 471290, "epoch": 5678} {"train_loss": -27.23872184753418, "global_step": 471291, "epoch": 5678} {"train_loss": -26.71329116821289, "global_step": 471292, "epoch": 5678} {"train_loss": -26.775938034057617, "global_step": 471293, "epoch": 5678} {"train_loss": -26.617969512939453, "global_step": 471294, "epoch": 5678} {"train_loss": -26.7876033782959, "global_step": 471295, "epoch": 5678} {"train_loss": -27.088926315307617, "global_step": 471296, "epoch": 5678} {"train_loss": -26.46792984008789, "global_step": 471297, "epoch": 5678} {"train_loss": -26.71160316467285, "global_step": 471298, "epoch": 5678} {"train_loss": -27.124465942382812, "global_step": 471299, "epoch": 5678} {"train_loss": -26.906110763549805, "global_step": 471300, "epoch": 5678} {"train_loss": -26.876373291015625, "global_step": 471301, "epoch": 5678} {"train_loss": -27.146869659423828, "global_step": 471302, "epoch": 5678} {"train_loss": -27.076574325561523, "global_step": 471303, "epoch": 5678} {"train_loss": -27.109663009643555, "global_step": 471304, "epoch": 5678} {"train_loss": -27.302326202392578, "global_step": 471305, "epoch": 5678} {"train_loss": -26.975452423095703, "global_step": 471306, "epoch": 5678} {"train_loss": -27.110319137573242, "global_step": 471307, "epoch": 5678} {"train_loss": -27.3369140625, "global_step": 471308, "epoch": 5678} {"train_loss": -27.221582412719727, "global_step": 471309, "epoch": 5678} {"train_loss": -27.23969078063965, "global_step": 471310, "epoch": 5678} {"train_loss": -27.22763442993164, "global_step": 471311, "epoch": 5678} {"train_loss": -27.5428409576416, "global_step": 471312, "epoch": 5678} {"train_loss": -26.83904457092285, "global_step": 471313, "epoch": 5678} {"train_loss": -27.6544246673584, "global_step": 471314, "epoch": 5678} {"train_loss": -27.463083267211914, "global_step": 471315, "epoch": 5678} {"train_loss": -27.712512969970703, "global_step": 471316, "epoch": 5678} {"train_loss": -27.328678131103516, "global_step": 471317, "epoch": 5678} {"train_loss": -27.013172149658203, "global_step": 471318, "epoch": 5678} {"train_loss": -27.20637321472168, "global_step": 471319, "epoch": 5678} {"train_loss": -27.103092193603516, "global_step": 471320, "epoch": 5678} {"train_loss": -27.2761173248291, "global_step": 471321, "epoch": 5678} {"train_loss": -27.534284591674805, "global_step": 471322, "epoch": 5678} {"train_loss": -27.695764541625977, "global_step": 471323, "epoch": 5678} {"train_loss": -27.12896156311035, "global_step": 471324, "epoch": 5678} {"train_loss": -27.26580810546875, "global_step": 471325, "epoch": 5678} {"train_loss": -27.217639923095703, "global_step": 471326, "epoch": 5678} {"train_loss": -27.340763092041016, "global_step": 471327, "epoch": 5678} {"train_loss": -27.3543701171875, "global_step": 471328, "epoch": 5678} {"train_loss": -27.202777862548828, "global_step": 471329, "epoch": 5678} {"train_loss": -27.227201461791992, "global_step": 471330, "epoch": 5678} {"train_loss": -27.162622451782227, "global_step": 471331, "epoch": 5678} {"train_loss": -27.708545684814453, "global_step": 471332, "epoch": 5678} {"train_loss": -27.537494659423828, "global_step": 471333, "epoch": 5678} {"train_loss": -26.986194610595703, "global_step": 471334, "epoch": 5678} {"train_loss": -27.115650177001953, "global_step": 471335, "epoch": 5678} {"train_loss": -27.131017684936523, "global_step": 471336, "epoch": 5678} {"train_loss": -27.147480010986328, "global_step": 471337, "epoch": 5678} {"train_loss": -27.323511123657227, "global_step": 471338, "epoch": 5678} {"train_loss": -27.383014678955078, "global_step": 471339, "epoch": 5678} {"train_loss": -27.233510971069336, "global_step": 471340, "epoch": 5678} {"train_loss": -27.07169532775879, "global_step": 471341, "epoch": 5678} {"train_loss": -27.138324737548828, "global_step": 471342, "epoch": 5678} {"train_loss": -27.42529296875, "global_step": 471343, "epoch": 5678} {"train_loss": -27.112070083618164, "global_step": 471344, "epoch": 5678} {"train_loss": -27.4492244720459, "global_step": 471345, "epoch": 5678} {"train_loss": -27.187143325805664, "global_step": 471346, "epoch": 5678} {"train_loss": -27.5455322265625, "global_step": 471347, "epoch": 5678} {"train_loss": -27.178180694580078, "global_step": 471348, "epoch": 5678} {"train_loss": -26.876245498657227, "global_step": 471349, "epoch": 5678} {"train_loss": -26.5275821685791, "global_step": 471350, "epoch": 5678} {"train_loss": -26.550397872924805, "global_step": 471351, "epoch": 5678} {"train_loss": -27.159631729125977, "global_step": 471352, "epoch": 5678} {"train_loss": -26.48145866394043, "global_step": 471353, "epoch": 5678} {"train_loss": -26.88640785217285, "global_step": 471354, "epoch": 5678} {"train_loss": -26.7575740814209, "global_step": 471355, "epoch": 5678} {"train_loss": -27.022571333919664, "global_step": 471356, "epoch": 5678, "val_loss": 6636996.0} {"train_loss": -26.342620849609375, "global_step": 471357, "epoch": 5679} {"train_loss": -24.618188858032227, "global_step": 471358, "epoch": 5679} {"train_loss": -25.775495529174805, "global_step": 471359, "epoch": 5679} {"train_loss": -26.2760066986084, "global_step": 471360, "epoch": 5679} {"train_loss": -25.880468368530273, "global_step": 471361, "epoch": 5679} {"train_loss": -26.10858154296875, "global_step": 471362, "epoch": 5679} {"train_loss": -25.8313045501709, "global_step": 471363, "epoch": 5679} {"train_loss": -26.3687744140625, "global_step": 471364, "epoch": 5679} {"train_loss": -25.852514266967773, "global_step": 471365, "epoch": 5679} {"train_loss": -26.01960563659668, "global_step": 471366, "epoch": 5679} {"train_loss": -26.553409576416016, "global_step": 471367, "epoch": 5679} {"train_loss": -26.345157623291016, "global_step": 471368, "epoch": 5679} {"train_loss": -26.66010093688965, "global_step": 471369, "epoch": 5679} {"train_loss": -26.453989028930664, "global_step": 471370, "epoch": 5679} {"train_loss": -26.611997604370117, "global_step": 471371, "epoch": 5679} {"train_loss": -26.647180557250977, "global_step": 471372, "epoch": 5679} {"train_loss": -26.574710845947266, "global_step": 471373, "epoch": 5679} {"train_loss": -26.60519790649414, "global_step": 471374, "epoch": 5679} {"train_loss": -26.773717880249023, "global_step": 471375, "epoch": 5679} {"train_loss": -26.256391525268555, "global_step": 471376, "epoch": 5679} {"train_loss": -26.487014770507812, "global_step": 471377, "epoch": 5679} {"train_loss": -26.364410400390625, "global_step": 471378, "epoch": 5679} {"train_loss": -26.691394805908203, "global_step": 471379, "epoch": 5679} {"train_loss": -27.061288833618164, "global_step": 471380, "epoch": 5679} {"train_loss": -26.74262809753418, "global_step": 471381, "epoch": 5679} {"train_loss": -26.718320846557617, "global_step": 471382, "epoch": 5679} {"train_loss": -26.837940216064453, "global_step": 471383, "epoch": 5679} {"train_loss": -26.83631706237793, "global_step": 471384, "epoch": 5679} {"train_loss": -27.22889518737793, "global_step": 471385, "epoch": 5679} {"train_loss": -27.089303970336914, "global_step": 471386, "epoch": 5679} {"train_loss": -27.22358512878418, "global_step": 471387, "epoch": 5679} {"train_loss": -27.122838973999023, "global_step": 471388, "epoch": 5679} {"train_loss": -27.278766632080078, "global_step": 471389, "epoch": 5679} {"train_loss": -27.213788986206055, "global_step": 471390, "epoch": 5679} {"train_loss": -27.016326904296875, "global_step": 471391, "epoch": 5679} {"train_loss": -27.465200424194336, "global_step": 471392, "epoch": 5679} {"train_loss": -27.250930786132812, "global_step": 471393, "epoch": 5679} {"train_loss": -27.076879501342773, "global_step": 471394, "epoch": 5679} {"train_loss": -26.964160919189453, "global_step": 471395, "epoch": 5679} {"train_loss": -27.472070693969727, "global_step": 471396, "epoch": 5679} {"train_loss": -27.38838768005371, "global_step": 471397, "epoch": 5679} {"train_loss": -27.38626480102539, "global_step": 471398, "epoch": 5679} {"train_loss": -27.34675407409668, "global_step": 471399, "epoch": 5679} {"train_loss": -27.549026489257812, "global_step": 471400, "epoch": 5679} {"train_loss": -26.980161666870117, "global_step": 471401, "epoch": 5679} {"train_loss": -27.352262496948242, "global_step": 471402, "epoch": 5679} {"train_loss": -27.085264205932617, "global_step": 471403, "epoch": 5679} {"train_loss": -27.051748275756836, "global_step": 471404, "epoch": 5679} {"train_loss": -27.2818546295166, "global_step": 471405, "epoch": 5679} {"train_loss": -27.3294734954834, "global_step": 471406, "epoch": 5679} {"train_loss": -27.428211212158203, "global_step": 471407, "epoch": 5679} {"train_loss": -27.380908966064453, "global_step": 471408, "epoch": 5679} {"train_loss": -27.569116592407227, "global_step": 471409, "epoch": 5679} {"train_loss": -27.209558486938477, "global_step": 471410, "epoch": 5679} {"train_loss": -27.468170166015625, "global_step": 471411, "epoch": 5679} {"train_loss": -27.0998592376709, "global_step": 471412, "epoch": 5679} {"train_loss": -27.398096084594727, "global_step": 471413, "epoch": 5679} {"train_loss": -27.575468063354492, "global_step": 471414, "epoch": 5679} {"train_loss": -26.950103759765625, "global_step": 471415, "epoch": 5679} {"train_loss": -27.352588653564453, "global_step": 471416, "epoch": 5679} {"train_loss": -27.207136154174805, "global_step": 471417, "epoch": 5679} {"train_loss": -27.209732055664062, "global_step": 471418, "epoch": 5679} {"train_loss": -27.214344024658203, "global_step": 471419, "epoch": 5679} {"train_loss": -27.11871910095215, "global_step": 471420, "epoch": 5679} {"train_loss": -27.572986602783203, "global_step": 471421, "epoch": 5679} {"train_loss": -27.4345645904541, "global_step": 471422, "epoch": 5679} {"train_loss": -27.267658233642578, "global_step": 471423, "epoch": 5679} {"train_loss": -26.728107452392578, "global_step": 471424, "epoch": 5679} {"train_loss": -27.12446403503418, "global_step": 471425, "epoch": 5679} {"train_loss": -27.293792724609375, "global_step": 471426, "epoch": 5679} {"train_loss": -27.730518341064453, "global_step": 471427, "epoch": 5679} {"train_loss": -27.080053329467773, "global_step": 471428, "epoch": 5679} {"train_loss": -26.51165771484375, "global_step": 471429, "epoch": 5679} {"train_loss": -26.886402130126953, "global_step": 471430, "epoch": 5679} {"train_loss": -27.113433837890625, "global_step": 471431, "epoch": 5679} {"train_loss": -27.076196670532227, "global_step": 471432, "epoch": 5679} {"train_loss": -27.103107452392578, "global_step": 471433, "epoch": 5679} {"train_loss": -26.860944747924805, "global_step": 471434, "epoch": 5679} {"train_loss": -27.23288345336914, "global_step": 471435, "epoch": 5679} {"train_loss": -27.245038986206055, "global_step": 471436, "epoch": 5679} {"train_loss": -27.202091217041016, "global_step": 471437, "epoch": 5679} {"train_loss": -27.10430908203125, "global_step": 471438, "epoch": 5679} {"train_loss": -26.959399096937066, "global_step": 471439, "epoch": 5679, "val_loss": 6649185.0} {"train_loss": -26.21205711364746, "global_step": 471440, "epoch": 5680} {"train_loss": -26.44454002380371, "global_step": 471441, "epoch": 5680} {"train_loss": -26.4066162109375, "global_step": 471442, "epoch": 5680} {"train_loss": -26.54355239868164, "global_step": 471443, "epoch": 5680} {"train_loss": -26.738250732421875, "global_step": 471444, "epoch": 5680} {"train_loss": -26.17293357849121, "global_step": 471445, "epoch": 5680} {"train_loss": -26.5389404296875, "global_step": 471446, "epoch": 5680} {"train_loss": -26.666976928710938, "global_step": 471447, "epoch": 5680} {"train_loss": -26.485416412353516, "global_step": 471448, "epoch": 5680} {"train_loss": -26.91925048828125, "global_step": 471449, "epoch": 5680} {"train_loss": -26.506305694580078, "global_step": 471450, "epoch": 5680} {"train_loss": -26.671588897705078, "global_step": 471451, "epoch": 5680} {"train_loss": -26.959806442260742, "global_step": 471452, "epoch": 5680} {"train_loss": -26.786945343017578, "global_step": 471453, "epoch": 5680} {"train_loss": -26.77695655822754, "global_step": 471454, "epoch": 5680} {"train_loss": -26.74989128112793, "global_step": 471455, "epoch": 5680} {"train_loss": -27.134428024291992, "global_step": 471456, "epoch": 5680} {"train_loss": -27.15872573852539, "global_step": 471457, "epoch": 5680} {"train_loss": -27.22157096862793, "global_step": 471458, "epoch": 5680} {"train_loss": -26.76044273376465, "global_step": 471459, "epoch": 5680} {"train_loss": -26.95343589782715, "global_step": 471460, "epoch": 5680} {"train_loss": -26.969390869140625, "global_step": 471461, "epoch": 5680} {"train_loss": -26.98089599609375, "global_step": 471462, "epoch": 5680} {"train_loss": -27.396392822265625, "global_step": 471463, "epoch": 5680} {"train_loss": -26.9778995513916, "global_step": 471464, "epoch": 5680} {"train_loss": -27.09929847717285, "global_step": 471465, "epoch": 5680} {"train_loss": -27.0184268951416, "global_step": 471466, "epoch": 5680} {"train_loss": -26.71744155883789, "global_step": 471467, "epoch": 5680} {"train_loss": -26.92584800720215, "global_step": 471468, "epoch": 5680} {"train_loss": -27.508886337280273, "global_step": 471469, "epoch": 5680} {"train_loss": -27.2581787109375, "global_step": 471470, "epoch": 5680} {"train_loss": -27.36272621154785, "global_step": 471471, "epoch": 5680} {"train_loss": -27.34356689453125, "global_step": 471472, "epoch": 5680} {"train_loss": -27.2553653717041, "global_step": 471473, "epoch": 5680} {"train_loss": -27.309528350830078, "global_step": 471474, "epoch": 5680} {"train_loss": -27.38258934020996, "global_step": 471475, "epoch": 5680} {"train_loss": -27.52508544921875, "global_step": 471476, "epoch": 5680} {"train_loss": -27.190221786499023, "global_step": 471477, "epoch": 5680} {"train_loss": -27.222471237182617, "global_step": 471478, "epoch": 5680} {"train_loss": -27.364276885986328, "global_step": 471479, "epoch": 5680} {"train_loss": -27.1949462890625, "global_step": 471480, "epoch": 5680} {"train_loss": -27.232959747314453, "global_step": 471481, "epoch": 5680} {"train_loss": -27.25701904296875, "global_step": 471482, "epoch": 5680} {"train_loss": -27.512983322143555, "global_step": 471483, "epoch": 5680} {"train_loss": -27.114980697631836, "global_step": 471484, "epoch": 5680} {"train_loss": -27.158979415893555, "global_step": 471485, "epoch": 5680} {"train_loss": -27.016382217407227, "global_step": 471486, "epoch": 5680} {"train_loss": -27.20594596862793, "global_step": 471487, "epoch": 5680} {"train_loss": -26.6199951171875, "global_step": 471488, "epoch": 5680} {"train_loss": -27.272724151611328, "global_step": 471489, "epoch": 5680} {"train_loss": -27.45895767211914, "global_step": 471490, "epoch": 5680} {"train_loss": -27.23665428161621, "global_step": 471491, "epoch": 5680} {"train_loss": -27.20856285095215, "global_step": 471492, "epoch": 5680} {"train_loss": -27.004297256469727, "global_step": 471493, "epoch": 5680} {"train_loss": -27.116943359375, "global_step": 471494, "epoch": 5680} {"train_loss": -27.102619171142578, "global_step": 471495, "epoch": 5680} {"train_loss": -27.406457901000977, "global_step": 471496, "epoch": 5680} {"train_loss": -26.89754295349121, "global_step": 471497, "epoch": 5680} {"train_loss": -26.578033447265625, "global_step": 471498, "epoch": 5680} {"train_loss": -27.20509910583496, "global_step": 471499, "epoch": 5680} {"train_loss": -26.9442195892334, "global_step": 471500, "epoch": 5680} {"train_loss": -27.249053955078125, "global_step": 471501, "epoch": 5680} {"train_loss": -26.792760848999023, "global_step": 471502, "epoch": 5680} {"train_loss": -26.7669677734375, "global_step": 471503, "epoch": 5680} {"train_loss": -27.016464233398438, "global_step": 471504, "epoch": 5680} {"train_loss": -27.331384658813477, "global_step": 471505, "epoch": 5680} {"train_loss": -27.256284713745117, "global_step": 471506, "epoch": 5680} {"train_loss": -27.08124351501465, "global_step": 471507, "epoch": 5680} {"train_loss": -27.272714614868164, "global_step": 471508, "epoch": 5680} {"train_loss": -27.255613327026367, "global_step": 471509, "epoch": 5680} {"train_loss": -26.882461547851562, "global_step": 471510, "epoch": 5680} {"train_loss": -26.515289306640625, "global_step": 471511, "epoch": 5680} {"train_loss": -26.827238082885742, "global_step": 471512, "epoch": 5680} {"train_loss": -27.022058486938477, "global_step": 471513, "epoch": 5680} {"train_loss": -27.07573890686035, "global_step": 471514, "epoch": 5680} {"train_loss": -27.36329460144043, "global_step": 471515, "epoch": 5680} {"train_loss": -26.772571563720703, "global_step": 471516, "epoch": 5680} {"train_loss": -27.243642807006836, "global_step": 471517, "epoch": 5680} {"train_loss": -27.315109252929688, "global_step": 471518, "epoch": 5680} {"train_loss": -27.238550186157227, "global_step": 471519, "epoch": 5680} {"train_loss": -27.0435733795166, "global_step": 471520, "epoch": 5680} {"train_loss": -26.89676284790039, "global_step": 471521, "epoch": 5680} {"train_loss": -27.001434946634685, "global_step": 471522, "epoch": 5680, "val_loss": 6685411.0} {"train_loss": -26.489587783813477, "global_step": 471523, "epoch": 5681} {"train_loss": -26.235219955444336, "global_step": 471524, "epoch": 5681} {"train_loss": -26.25669288635254, "global_step": 471525, "epoch": 5681} {"train_loss": -26.410690307617188, "global_step": 471526, "epoch": 5681} {"train_loss": -26.714807510375977, "global_step": 471527, "epoch": 5681} {"train_loss": -26.499862670898438, "global_step": 471528, "epoch": 5681} {"train_loss": -27.000638961791992, "global_step": 471529, "epoch": 5681} {"train_loss": -26.780567169189453, "global_step": 471530, "epoch": 5681} {"train_loss": -26.521581649780273, "global_step": 471531, "epoch": 5681} {"train_loss": -26.378143310546875, "global_step": 471532, "epoch": 5681} {"train_loss": -26.823514938354492, "global_step": 471533, "epoch": 5681} {"train_loss": -26.96708106994629, "global_step": 471534, "epoch": 5681} {"train_loss": -26.18364906311035, "global_step": 471535, "epoch": 5681} {"train_loss": -26.939788818359375, "global_step": 471536, "epoch": 5681} {"train_loss": -26.76605796813965, "global_step": 471537, "epoch": 5681} {"train_loss": -26.778003692626953, "global_step": 471538, "epoch": 5681} {"train_loss": -27.05994987487793, "global_step": 471539, "epoch": 5681} {"train_loss": -26.973926544189453, "global_step": 471540, "epoch": 5681} {"train_loss": -26.662322998046875, "global_step": 471541, "epoch": 5681} {"train_loss": -26.664960861206055, "global_step": 471542, "epoch": 5681} {"train_loss": -27.003280639648438, "global_step": 471543, "epoch": 5681} {"train_loss": -26.626142501831055, "global_step": 471544, "epoch": 5681} {"train_loss": -26.64069175720215, "global_step": 471545, "epoch": 5681} {"train_loss": -27.02997398376465, "global_step": 471546, "epoch": 5681} {"train_loss": -27.372943878173828, "global_step": 471547, "epoch": 5681} {"train_loss": -27.142786026000977, "global_step": 471548, "epoch": 5681} {"train_loss": -27.568084716796875, "global_step": 471549, "epoch": 5681} {"train_loss": -27.18903160095215, "global_step": 471550, "epoch": 5681} {"train_loss": -27.170459747314453, "global_step": 471551, "epoch": 5681} {"train_loss": -26.67652702331543, "global_step": 471552, "epoch": 5681} {"train_loss": -27.214887619018555, "global_step": 471553, "epoch": 5681} {"train_loss": -26.582326889038086, "global_step": 471554, "epoch": 5681} {"train_loss": -26.659759521484375, "global_step": 471555, "epoch": 5681} {"train_loss": -26.834930419921875, "global_step": 471556, "epoch": 5681} {"train_loss": -26.8569278717041, "global_step": 471557, "epoch": 5681} {"train_loss": -26.826093673706055, "global_step": 471558, "epoch": 5681} {"train_loss": -26.68310546875, "global_step": 471559, "epoch": 5681} {"train_loss": -26.901098251342773, "global_step": 471560, "epoch": 5681} {"train_loss": -27.05524253845215, "global_step": 471561, "epoch": 5681} {"train_loss": -27.11724281311035, "global_step": 471562, "epoch": 5681} {"train_loss": -27.166330337524414, "global_step": 471563, "epoch": 5681} {"train_loss": -26.98105239868164, "global_step": 471564, "epoch": 5681} {"train_loss": -27.262060165405273, "global_step": 471565, "epoch": 5681} {"train_loss": -27.48488426208496, "global_step": 471566, "epoch": 5681} {"train_loss": -27.40822410583496, "global_step": 471567, "epoch": 5681} {"train_loss": -27.1268367767334, "global_step": 471568, "epoch": 5681} {"train_loss": -26.7717227935791, "global_step": 471569, "epoch": 5681} {"train_loss": -27.133060455322266, "global_step": 471570, "epoch": 5681} {"train_loss": -27.2668399810791, "global_step": 471571, "epoch": 5681} {"train_loss": -27.24224853515625, "global_step": 471572, "epoch": 5681} {"train_loss": -27.08880043029785, "global_step": 471573, "epoch": 5681} {"train_loss": -27.274106979370117, "global_step": 471574, "epoch": 5681} {"train_loss": -27.381534576416016, "global_step": 471575, "epoch": 5681} {"train_loss": -27.364410400390625, "global_step": 471576, "epoch": 5681} {"train_loss": -27.709863662719727, "global_step": 471577, "epoch": 5681} {"train_loss": -26.982568740844727, "global_step": 471578, "epoch": 5681} {"train_loss": -27.069305419921875, "global_step": 471579, "epoch": 5681} {"train_loss": -27.201385498046875, "global_step": 471580, "epoch": 5681} {"train_loss": -27.171865463256836, "global_step": 471581, "epoch": 5681} {"train_loss": -27.11811637878418, "global_step": 471582, "epoch": 5681} {"train_loss": -27.006250381469727, "global_step": 471583, "epoch": 5681} {"train_loss": -27.411121368408203, "global_step": 471584, "epoch": 5681} {"train_loss": -27.327917098999023, "global_step": 471585, "epoch": 5681} {"train_loss": -27.177488327026367, "global_step": 471586, "epoch": 5681} {"train_loss": -27.350147247314453, "global_step": 471587, "epoch": 5681} {"train_loss": -27.038705825805664, "global_step": 471588, "epoch": 5681} {"train_loss": -27.38984489440918, "global_step": 471589, "epoch": 5681} {"train_loss": -27.5116024017334, "global_step": 471590, "epoch": 5681} {"train_loss": -27.34042739868164, "global_step": 471591, "epoch": 5681} {"train_loss": -27.36482810974121, "global_step": 471592, "epoch": 5681} {"train_loss": -27.32435417175293, "global_step": 471593, "epoch": 5681} {"train_loss": -27.386457443237305, "global_step": 471594, "epoch": 5681} {"train_loss": -27.34510612487793, "global_step": 471595, "epoch": 5681} {"train_loss": -27.204267501831055, "global_step": 471596, "epoch": 5681} {"train_loss": -27.56366539001465, "global_step": 471597, "epoch": 5681} {"train_loss": -27.216596603393555, "global_step": 471598, "epoch": 5681} {"train_loss": -27.218555450439453, "global_step": 471599, "epoch": 5681} {"train_loss": -27.191701889038086, "global_step": 471600, "epoch": 5681} {"train_loss": -27.015798568725586, "global_step": 471601, "epoch": 5681} {"train_loss": -27.147031784057617, "global_step": 471602, "epoch": 5681} {"train_loss": -27.370405197143555, "global_step": 471603, "epoch": 5681} {"train_loss": -27.62737464904785, "global_step": 471604, "epoch": 5681} {"train_loss": -27.04665227683194, "global_step": 471605, "epoch": 5681, "val_loss": 6623600.5} {"train_loss": -26.394079208374023, "global_step": 471606, "epoch": 5682} {"train_loss": -26.419538497924805, "global_step": 471607, "epoch": 5682} {"train_loss": -26.329147338867188, "global_step": 471608, "epoch": 5682} {"train_loss": -25.964664459228516, "global_step": 471609, "epoch": 5682} {"train_loss": -26.508228302001953, "global_step": 471610, "epoch": 5682} {"train_loss": -25.396493911743164, "global_step": 471611, "epoch": 5682} {"train_loss": -25.846694946289062, "global_step": 471612, "epoch": 5682} {"train_loss": -26.45404052734375, "global_step": 471613, "epoch": 5682} {"train_loss": -26.163837432861328, "global_step": 471614, "epoch": 5682} {"train_loss": -26.5858097076416, "global_step": 471615, "epoch": 5682} {"train_loss": -26.22835350036621, "global_step": 471616, "epoch": 5682} {"train_loss": -26.705001831054688, "global_step": 471617, "epoch": 5682} {"train_loss": -26.475183486938477, "global_step": 471618, "epoch": 5682} {"train_loss": -26.59846305847168, "global_step": 471619, "epoch": 5682} {"train_loss": -26.2425479888916, "global_step": 471620, "epoch": 5682} {"train_loss": -24.795806884765625, "global_step": 471621, "epoch": 5682} {"train_loss": -26.328189849853516, "global_step": 471622, "epoch": 5682} {"train_loss": -26.490705490112305, "global_step": 471623, "epoch": 5682} {"train_loss": -26.206235885620117, "global_step": 471624, "epoch": 5682} {"train_loss": -26.292627334594727, "global_step": 471625, "epoch": 5682} {"train_loss": -25.911039352416992, "global_step": 471626, "epoch": 5682} {"train_loss": -26.41973304748535, "global_step": 471627, "epoch": 5682} {"train_loss": -26.263141632080078, "global_step": 471628, "epoch": 5682} {"train_loss": -26.466815948486328, "global_step": 471629, "epoch": 5682} {"train_loss": -26.46978759765625, "global_step": 471630, "epoch": 5682} {"train_loss": -26.492910385131836, "global_step": 471631, "epoch": 5682} {"train_loss": -26.510969161987305, "global_step": 471632, "epoch": 5682} {"train_loss": -27.056934356689453, "global_step": 471633, "epoch": 5682} {"train_loss": -26.61761474609375, "global_step": 471634, "epoch": 5682} {"train_loss": -26.314844131469727, "global_step": 471635, "epoch": 5682} {"train_loss": -26.3747501373291, "global_step": 471636, "epoch": 5682} {"train_loss": -26.7025203704834, "global_step": 471637, "epoch": 5682} {"train_loss": -26.026025772094727, "global_step": 471638, "epoch": 5682} {"train_loss": -26.7967472076416, "global_step": 471639, "epoch": 5682} {"train_loss": -26.642578125, "global_step": 471640, "epoch": 5682} {"train_loss": -26.861379623413086, "global_step": 471641, "epoch": 5682} {"train_loss": -26.61279296875, "global_step": 471642, "epoch": 5682} {"train_loss": -26.605182647705078, "global_step": 471643, "epoch": 5682} {"train_loss": -27.399921417236328, "global_step": 471644, "epoch": 5682} {"train_loss": -26.835554122924805, "global_step": 471645, "epoch": 5682} {"train_loss": -26.947467803955078, "global_step": 471646, "epoch": 5682} {"train_loss": -26.9196834564209, "global_step": 471647, "epoch": 5682} {"train_loss": -26.9368896484375, "global_step": 471648, "epoch": 5682} {"train_loss": -27.299840927124023, "global_step": 471649, "epoch": 5682} {"train_loss": -27.304641723632812, "global_step": 471650, "epoch": 5682} {"train_loss": -27.004438400268555, "global_step": 471651, "epoch": 5682} {"train_loss": -27.20340919494629, "global_step": 471652, "epoch": 5682} {"train_loss": -27.155181884765625, "global_step": 471653, "epoch": 5682} {"train_loss": -27.195798873901367, "global_step": 471654, "epoch": 5682} {"train_loss": -27.295923233032227, "global_step": 471655, "epoch": 5682} {"train_loss": -27.158451080322266, "global_step": 471656, "epoch": 5682} {"train_loss": -26.901498794555664, "global_step": 471657, "epoch": 5682} {"train_loss": -27.245935440063477, "global_step": 471658, "epoch": 5682} {"train_loss": -27.05121421813965, "global_step": 471659, "epoch": 5682} {"train_loss": -27.21248435974121, "global_step": 471660, "epoch": 5682} {"train_loss": -27.200977325439453, "global_step": 471661, "epoch": 5682} {"train_loss": -27.35907554626465, "global_step": 471662, "epoch": 5682} {"train_loss": -27.645496368408203, "global_step": 471663, "epoch": 5682} {"train_loss": -27.466033935546875, "global_step": 471664, "epoch": 5682} {"train_loss": -27.438385009765625, "global_step": 471665, "epoch": 5682} {"train_loss": -27.35747718811035, "global_step": 471666, "epoch": 5682} {"train_loss": -27.822071075439453, "global_step": 471667, "epoch": 5682} {"train_loss": -27.71149253845215, "global_step": 471668, "epoch": 5682} {"train_loss": -27.374948501586914, "global_step": 471669, "epoch": 5682} {"train_loss": -27.35279655456543, "global_step": 471670, "epoch": 5682} {"train_loss": -27.242212295532227, "global_step": 471671, "epoch": 5682} {"train_loss": -27.481689453125, "global_step": 471672, "epoch": 5682} {"train_loss": -27.301618576049805, "global_step": 471673, "epoch": 5682} {"train_loss": -27.464162826538086, "global_step": 471674, "epoch": 5682} {"train_loss": -27.553258895874023, "global_step": 471675, "epoch": 5682} {"train_loss": -27.3032283782959, "global_step": 471676, "epoch": 5682} {"train_loss": -27.61703872680664, "global_step": 471677, "epoch": 5682} {"train_loss": -27.56314468383789, "global_step": 471678, "epoch": 5682} {"train_loss": -27.70050621032715, "global_step": 471679, "epoch": 5682} {"train_loss": -27.546045303344727, "global_step": 471680, "epoch": 5682} {"train_loss": -27.24171257019043, "global_step": 471681, "epoch": 5682} {"train_loss": -27.4051570892334, "global_step": 471682, "epoch": 5682} {"train_loss": -27.19464683532715, "global_step": 471683, "epoch": 5682} {"train_loss": -26.259260177612305, "global_step": 471684, "epoch": 5682} {"train_loss": -25.709869384765625, "global_step": 471685, "epoch": 5682} {"train_loss": -25.044645309448242, "global_step": 471686, "epoch": 5682} {"train_loss": -25.140661239624023, "global_step": 471687, "epoch": 5682} {"train_loss": -26.7917938921825, "global_step": 471688, "epoch": 5682, "val_loss": 6644971.5} {"train_loss": -25.099388122558594, "global_step": 471689, "epoch": 5683} {"train_loss": -24.116010665893555, "global_step": 471690, "epoch": 5683} {"train_loss": -26.02988624572754, "global_step": 471691, "epoch": 5683} {"train_loss": -25.664794921875, "global_step": 471692, "epoch": 5683} {"train_loss": -25.815784454345703, "global_step": 471693, "epoch": 5683} {"train_loss": -25.35591697692871, "global_step": 471694, "epoch": 5683} {"train_loss": -25.625263214111328, "global_step": 471695, "epoch": 5683} {"train_loss": -26.075231552124023, "global_step": 471696, "epoch": 5683} {"train_loss": -25.773412704467773, "global_step": 471697, "epoch": 5683} {"train_loss": -26.186044692993164, "global_step": 471698, "epoch": 5683} {"train_loss": -25.965192794799805, "global_step": 471699, "epoch": 5683} {"train_loss": -25.912643432617188, "global_step": 471700, "epoch": 5683} {"train_loss": -26.339431762695312, "global_step": 471701, "epoch": 5683} {"train_loss": -25.958181381225586, "global_step": 471702, "epoch": 5683} {"train_loss": -26.47785758972168, "global_step": 471703, "epoch": 5683} {"train_loss": -26.77040672302246, "global_step": 471704, "epoch": 5683} {"train_loss": -26.45265007019043, "global_step": 471705, "epoch": 5683} {"train_loss": -26.64459800720215, "global_step": 471706, "epoch": 5683} {"train_loss": -26.823400497436523, "global_step": 471707, "epoch": 5683} {"train_loss": -26.204879760742188, "global_step": 471708, "epoch": 5683} {"train_loss": -26.619186401367188, "global_step": 471709, "epoch": 5683} {"train_loss": -26.193572998046875, "global_step": 471710, "epoch": 5683} {"train_loss": -26.622949600219727, "global_step": 471711, "epoch": 5683} {"train_loss": -26.746021270751953, "global_step": 471712, "epoch": 5683} {"train_loss": -26.827192306518555, "global_step": 471713, "epoch": 5683} {"train_loss": -26.611608505249023, "global_step": 471714, "epoch": 5683} {"train_loss": -26.639312744140625, "global_step": 471715, "epoch": 5683} {"train_loss": -26.825992584228516, "global_step": 471716, "epoch": 5683} {"train_loss": -26.777740478515625, "global_step": 471717, "epoch": 5683} {"train_loss": -26.71820068359375, "global_step": 471718, "epoch": 5683} {"train_loss": -26.79714012145996, "global_step": 471719, "epoch": 5683} {"train_loss": -26.60645866394043, "global_step": 471720, "epoch": 5683} {"train_loss": -27.118030548095703, "global_step": 471721, "epoch": 5683} {"train_loss": -26.79501724243164, "global_step": 471722, "epoch": 5683} {"train_loss": -27.327117919921875, "global_step": 471723, "epoch": 5683} {"train_loss": -27.124069213867188, "global_step": 471724, "epoch": 5683} {"train_loss": -27.217432022094727, "global_step": 471725, "epoch": 5683} {"train_loss": -26.822904586791992, "global_step": 471726, "epoch": 5683} {"train_loss": -27.236906051635742, "global_step": 471727, "epoch": 5683} {"train_loss": -27.374181747436523, "global_step": 471728, "epoch": 5683} {"train_loss": -26.95549964904785, "global_step": 471729, "epoch": 5683} {"train_loss": -27.3092098236084, "global_step": 471730, "epoch": 5683} {"train_loss": -27.13873863220215, "global_step": 471731, "epoch": 5683} {"train_loss": -27.293994903564453, "global_step": 471732, "epoch": 5683} {"train_loss": -26.980609893798828, "global_step": 471733, "epoch": 5683} {"train_loss": -27.223297119140625, "global_step": 471734, "epoch": 5683} {"train_loss": -26.8458194732666, "global_step": 471735, "epoch": 5683} {"train_loss": -26.85072898864746, "global_step": 471736, "epoch": 5683} {"train_loss": -27.718505859375, "global_step": 471737, "epoch": 5683} {"train_loss": -27.468053817749023, "global_step": 471738, "epoch": 5683} {"train_loss": -27.299945831298828, "global_step": 471739, "epoch": 5683} {"train_loss": -27.040998458862305, "global_step": 471740, "epoch": 5683} {"train_loss": -26.9992618560791, "global_step": 471741, "epoch": 5683} {"train_loss": -27.11274528503418, "global_step": 471742, "epoch": 5683} {"train_loss": -27.5151309967041, "global_step": 471743, "epoch": 5683} {"train_loss": -27.137664794921875, "global_step": 471744, "epoch": 5683} {"train_loss": -27.047367095947266, "global_step": 471745, "epoch": 5683} {"train_loss": -27.100112915039062, "global_step": 471746, "epoch": 5683} {"train_loss": -27.400348663330078, "global_step": 471747, "epoch": 5683} {"train_loss": -26.98992919921875, "global_step": 471748, "epoch": 5683} {"train_loss": -27.420530319213867, "global_step": 471749, "epoch": 5683} {"train_loss": -27.01175880432129, "global_step": 471750, "epoch": 5683} {"train_loss": -27.154666900634766, "global_step": 471751, "epoch": 5683} {"train_loss": -27.304157257080078, "global_step": 471752, "epoch": 5683} {"train_loss": -27.389753341674805, "global_step": 471753, "epoch": 5683} {"train_loss": -26.953033447265625, "global_step": 471754, "epoch": 5683} {"train_loss": -27.071292877197266, "global_step": 471755, "epoch": 5683} {"train_loss": -27.2199649810791, "global_step": 471756, "epoch": 5683} {"train_loss": -27.287282943725586, "global_step": 471757, "epoch": 5683} {"train_loss": -27.140424728393555, "global_step": 471758, "epoch": 5683} {"train_loss": -27.17144775390625, "global_step": 471759, "epoch": 5683} {"train_loss": -26.868900299072266, "global_step": 471760, "epoch": 5683} {"train_loss": -26.812610626220703, "global_step": 471761, "epoch": 5683} {"train_loss": -26.298175811767578, "global_step": 471762, "epoch": 5683} {"train_loss": -26.3031005859375, "global_step": 471763, "epoch": 5683} {"train_loss": -26.770526885986328, "global_step": 471764, "epoch": 5683} {"train_loss": -26.766332626342773, "global_step": 471765, "epoch": 5683} {"train_loss": -27.142011642456055, "global_step": 471766, "epoch": 5683} {"train_loss": -26.200428009033203, "global_step": 471767, "epoch": 5683} {"train_loss": -26.809301376342773, "global_step": 471768, "epoch": 5683} {"train_loss": -27.086273193359375, "global_step": 471769, "epoch": 5683} {"train_loss": -26.878049850463867, "global_step": 471770, "epoch": 5683} {"train_loss": -26.73447896199054, "global_step": 471771, "epoch": 5683, "val_loss": 6676439.0} {"train_loss": -25.872900009155273, "global_step": 471772, "epoch": 5684} {"train_loss": -26.31865882873535, "global_step": 471773, "epoch": 5684} {"train_loss": -25.365150451660156, "global_step": 471774, "epoch": 5684} {"train_loss": -25.51320457458496, "global_step": 471775, "epoch": 5684} {"train_loss": -26.524097442626953, "global_step": 471776, "epoch": 5684} {"train_loss": -25.78902244567871, "global_step": 471777, "epoch": 5684} {"train_loss": -26.3757381439209, "global_step": 471778, "epoch": 5684} {"train_loss": -26.187082290649414, "global_step": 471779, "epoch": 5684} {"train_loss": -26.82598304748535, "global_step": 471780, "epoch": 5684} {"train_loss": -26.576013565063477, "global_step": 471781, "epoch": 5684} {"train_loss": -26.48493003845215, "global_step": 471782, "epoch": 5684} {"train_loss": -26.580472946166992, "global_step": 471783, "epoch": 5684} {"train_loss": -26.155475616455078, "global_step": 471784, "epoch": 5684} {"train_loss": -26.57834243774414, "global_step": 471785, "epoch": 5684} {"train_loss": -26.546045303344727, "global_step": 471786, "epoch": 5684} {"train_loss": -27.1843204498291, "global_step": 471787, "epoch": 5684} {"train_loss": -26.547651290893555, "global_step": 471788, "epoch": 5684} {"train_loss": -26.717798233032227, "global_step": 471789, "epoch": 5684} {"train_loss": -26.804052352905273, "global_step": 471790, "epoch": 5684} {"train_loss": -27.2423038482666, "global_step": 471791, "epoch": 5684} {"train_loss": -26.852075576782227, "global_step": 471792, "epoch": 5684} {"train_loss": -26.869794845581055, "global_step": 471793, "epoch": 5684} {"train_loss": -26.881732940673828, "global_step": 471794, "epoch": 5684} {"train_loss": -26.673160552978516, "global_step": 471795, "epoch": 5684} {"train_loss": -26.52385902404785, "global_step": 471796, "epoch": 5684} {"train_loss": -26.6627254486084, "global_step": 471797, "epoch": 5684} {"train_loss": -26.961688995361328, "global_step": 471798, "epoch": 5684} {"train_loss": -27.12721061706543, "global_step": 471799, "epoch": 5684} {"train_loss": -27.138580322265625, "global_step": 471800, "epoch": 5684} {"train_loss": -26.879135131835938, "global_step": 471801, "epoch": 5684} {"train_loss": -27.00679588317871, "global_step": 471802, "epoch": 5684} {"train_loss": -27.08139991760254, "global_step": 471803, "epoch": 5684} {"train_loss": -27.417194366455078, "global_step": 471804, "epoch": 5684} {"train_loss": -26.991003036499023, "global_step": 471805, "epoch": 5684} {"train_loss": -26.85218620300293, "global_step": 471806, "epoch": 5684} {"train_loss": -27.279516220092773, "global_step": 471807, "epoch": 5684} {"train_loss": -26.996734619140625, "global_step": 471808, "epoch": 5684} {"train_loss": -27.4491024017334, "global_step": 471809, "epoch": 5684} {"train_loss": -27.15302848815918, "global_step": 471810, "epoch": 5684} {"train_loss": -27.235553741455078, "global_step": 471811, "epoch": 5684} {"train_loss": -27.32275390625, "global_step": 471812, "epoch": 5684} {"train_loss": -27.33768653869629, "global_step": 471813, "epoch": 5684} {"train_loss": -27.5738582611084, "global_step": 471814, "epoch": 5684} {"train_loss": -27.498014450073242, "global_step": 471815, "epoch": 5684} {"train_loss": -27.534317016601562, "global_step": 471816, "epoch": 5684} {"train_loss": -27.163318634033203, "global_step": 471817, "epoch": 5684} {"train_loss": -27.668643951416016, "global_step": 471818, "epoch": 5684} {"train_loss": -27.20570182800293, "global_step": 471819, "epoch": 5684} {"train_loss": -27.292373657226562, "global_step": 471820, "epoch": 5684} {"train_loss": -27.275278091430664, "global_step": 471821, "epoch": 5684} {"train_loss": -27.01863670349121, "global_step": 471822, "epoch": 5684} {"train_loss": -27.209121704101562, "global_step": 471823, "epoch": 5684} {"train_loss": -27.34287452697754, "global_step": 471824, "epoch": 5684} {"train_loss": -27.160736083984375, "global_step": 471825, "epoch": 5684} {"train_loss": -27.242780685424805, "global_step": 471826, "epoch": 5684} {"train_loss": -27.026426315307617, "global_step": 471827, "epoch": 5684} {"train_loss": -27.254384994506836, "global_step": 471828, "epoch": 5684} {"train_loss": -26.765634536743164, "global_step": 471829, "epoch": 5684} {"train_loss": -27.594852447509766, "global_step": 471830, "epoch": 5684} {"train_loss": -27.13226318359375, "global_step": 471831, "epoch": 5684} {"train_loss": -27.17376708984375, "global_step": 471832, "epoch": 5684} {"train_loss": -27.59394645690918, "global_step": 471833, "epoch": 5684} {"train_loss": -27.479352951049805, "global_step": 471834, "epoch": 5684} {"train_loss": -27.51047134399414, "global_step": 471835, "epoch": 5684} {"train_loss": -27.27927589416504, "global_step": 471836, "epoch": 5684} {"train_loss": -27.22625160217285, "global_step": 471837, "epoch": 5684} {"train_loss": -27.551727294921875, "global_step": 471838, "epoch": 5684} {"train_loss": -27.066144943237305, "global_step": 471839, "epoch": 5684} {"train_loss": -27.40216064453125, "global_step": 471840, "epoch": 5684} {"train_loss": -26.8303165435791, "global_step": 471841, "epoch": 5684} {"train_loss": -27.589141845703125, "global_step": 471842, "epoch": 5684} {"train_loss": -27.10713768005371, "global_step": 471843, "epoch": 5684} {"train_loss": -27.143054962158203, "global_step": 471844, "epoch": 5684} {"train_loss": -27.49664878845215, "global_step": 471845, "epoch": 5684} {"train_loss": -26.79920768737793, "global_step": 471846, "epoch": 5684} {"train_loss": -27.169143676757812, "global_step": 471847, "epoch": 5684} {"train_loss": -26.74102783203125, "global_step": 471848, "epoch": 5684} {"train_loss": -27.698474884033203, "global_step": 471849, "epoch": 5684} {"train_loss": -27.34347915649414, "global_step": 471850, "epoch": 5684} {"train_loss": -27.273395538330078, "global_step": 471851, "epoch": 5684} {"train_loss": -27.363061904907227, "global_step": 471852, "epoch": 5684} {"train_loss": -27.113788604736328, "global_step": 471853, "epoch": 5684} {"train_loss": -27.00287943001253, "global_step": 471854, "epoch": 5684, "val_loss": 6629456.0} {"train_loss": -26.90506935119629, "global_step": 471855, "epoch": 5685} {"train_loss": -26.77984619140625, "global_step": 471856, "epoch": 5685} {"train_loss": -26.577320098876953, "global_step": 471857, "epoch": 5685} {"train_loss": -27.0063419342041, "global_step": 471858, "epoch": 5685} {"train_loss": -26.5109920501709, "global_step": 471859, "epoch": 5685} {"train_loss": -26.774887084960938, "global_step": 471860, "epoch": 5685} {"train_loss": -27.018651962280273, "global_step": 471861, "epoch": 5685} {"train_loss": -27.1934871673584, "global_step": 471862, "epoch": 5685} {"train_loss": -26.82477378845215, "global_step": 471863, "epoch": 5685} {"train_loss": -27.02680015563965, "global_step": 471864, "epoch": 5685} {"train_loss": -26.84126853942871, "global_step": 471865, "epoch": 5685} {"train_loss": -26.932437896728516, "global_step": 471866, "epoch": 5685} {"train_loss": -26.89167594909668, "global_step": 471867, "epoch": 5685} {"train_loss": -27.266584396362305, "global_step": 471868, "epoch": 5685} {"train_loss": -27.09088134765625, "global_step": 471869, "epoch": 5685} {"train_loss": -27.052539825439453, "global_step": 471870, "epoch": 5685} {"train_loss": -27.060226440429688, "global_step": 471871, "epoch": 5685} {"train_loss": -27.30366325378418, "global_step": 471872, "epoch": 5685} {"train_loss": -27.254993438720703, "global_step": 471873, "epoch": 5685} {"train_loss": -26.79212760925293, "global_step": 471874, "epoch": 5685} {"train_loss": -27.21282958984375, "global_step": 471875, "epoch": 5685} {"train_loss": -27.115415573120117, "global_step": 471876, "epoch": 5685} {"train_loss": -27.545703887939453, "global_step": 471877, "epoch": 5685} {"train_loss": -27.477264404296875, "global_step": 471878, "epoch": 5685} {"train_loss": -27.276647567749023, "global_step": 471879, "epoch": 5685} {"train_loss": -26.97003173828125, "global_step": 471880, "epoch": 5685} {"train_loss": -27.49420166015625, "global_step": 471881, "epoch": 5685} {"train_loss": -27.27581214904785, "global_step": 471882, "epoch": 5685} {"train_loss": -27.1798038482666, "global_step": 471883, "epoch": 5685} {"train_loss": -27.170820236206055, "global_step": 471884, "epoch": 5685} {"train_loss": -27.20853614807129, "global_step": 471885, "epoch": 5685} {"train_loss": -27.20903968811035, "global_step": 471886, "epoch": 5685} {"train_loss": -27.21409034729004, "global_step": 471887, "epoch": 5685} {"train_loss": -27.243871688842773, "global_step": 471888, "epoch": 5685} {"train_loss": -27.18214225769043, "global_step": 471889, "epoch": 5685} {"train_loss": -27.291967391967773, "global_step": 471890, "epoch": 5685} {"train_loss": -27.2416934967041, "global_step": 471891, "epoch": 5685} {"train_loss": -27.394556045532227, "global_step": 471892, "epoch": 5685} {"train_loss": -27.6602725982666, "global_step": 471893, "epoch": 5685} {"train_loss": -27.28443717956543, "global_step": 471894, "epoch": 5685} {"train_loss": -27.574567794799805, "global_step": 471895, "epoch": 5685} {"train_loss": -27.4023380279541, "global_step": 471896, "epoch": 5685} {"train_loss": -27.682470321655273, "global_step": 471897, "epoch": 5685} {"train_loss": -26.753314971923828, "global_step": 471898, "epoch": 5685} {"train_loss": -27.47859001159668, "global_step": 471899, "epoch": 5685} {"train_loss": -27.0225887298584, "global_step": 471900, "epoch": 5685} {"train_loss": -27.50105094909668, "global_step": 471901, "epoch": 5685} {"train_loss": -26.999601364135742, "global_step": 471902, "epoch": 5685} {"train_loss": -26.850341796875, "global_step": 471903, "epoch": 5685} {"train_loss": -27.448352813720703, "global_step": 471904, "epoch": 5685} {"train_loss": -27.133359909057617, "global_step": 471905, "epoch": 5685} {"train_loss": -27.053543090820312, "global_step": 471906, "epoch": 5685} {"train_loss": -27.507537841796875, "global_step": 471907, "epoch": 5685} {"train_loss": -26.82637596130371, "global_step": 471908, "epoch": 5685} {"train_loss": -27.415786743164062, "global_step": 471909, "epoch": 5685} {"train_loss": -27.41878318786621, "global_step": 471910, "epoch": 5685} {"train_loss": -26.586444854736328, "global_step": 471911, "epoch": 5685} {"train_loss": -27.634429931640625, "global_step": 471912, "epoch": 5685} {"train_loss": -27.2086238861084, "global_step": 471913, "epoch": 5685} {"train_loss": -26.987722396850586, "global_step": 471914, "epoch": 5685} {"train_loss": -27.4427490234375, "global_step": 471915, "epoch": 5685} {"train_loss": -27.188390731811523, "global_step": 471916, "epoch": 5685} {"train_loss": -27.527612686157227, "global_step": 471917, "epoch": 5685} {"train_loss": -27.43111228942871, "global_step": 471918, "epoch": 5685} {"train_loss": -27.16480827331543, "global_step": 471919, "epoch": 5685} {"train_loss": -27.196020126342773, "global_step": 471920, "epoch": 5685} {"train_loss": -27.1485652923584, "global_step": 471921, "epoch": 5685} {"train_loss": -27.064010620117188, "global_step": 471922, "epoch": 5685} {"train_loss": -27.474035263061523, "global_step": 471923, "epoch": 5685} {"train_loss": -27.395666122436523, "global_step": 471924, "epoch": 5685} {"train_loss": -27.16669273376465, "global_step": 471925, "epoch": 5685} {"train_loss": -27.55719566345215, "global_step": 471926, "epoch": 5685} {"train_loss": -27.329511642456055, "global_step": 471927, "epoch": 5685} {"train_loss": -26.858510971069336, "global_step": 471928, "epoch": 5685} {"train_loss": -27.254209518432617, "global_step": 471929, "epoch": 5685} {"train_loss": -26.95367431640625, "global_step": 471930, "epoch": 5685} {"train_loss": -27.275293350219727, "global_step": 471931, "epoch": 5685} {"train_loss": -26.721424102783203, "global_step": 471932, "epoch": 5685} {"train_loss": -26.981216430664062, "global_step": 471933, "epoch": 5685} {"train_loss": -27.246112823486328, "global_step": 471934, "epoch": 5685} {"train_loss": -26.877593994140625, "global_step": 471935, "epoch": 5685} {"train_loss": -26.97845458984375, "global_step": 471936, "epoch": 5685} {"train_loss": -27.181139199130506, "global_step": 471937, "epoch": 5685, "val_loss": 6645234.0} {"train_loss": -26.305591583251953, "global_step": 471938, "epoch": 5686} {"train_loss": -26.168109893798828, "global_step": 471939, "epoch": 5686} {"train_loss": -26.33847999572754, "global_step": 471940, "epoch": 5686} {"train_loss": -26.001834869384766, "global_step": 471941, "epoch": 5686} {"train_loss": -26.11836051940918, "global_step": 471942, "epoch": 5686} {"train_loss": -26.46546745300293, "global_step": 471943, "epoch": 5686} {"train_loss": -26.1049861907959, "global_step": 471944, "epoch": 5686} {"train_loss": -26.381763458251953, "global_step": 471945, "epoch": 5686} {"train_loss": -26.633066177368164, "global_step": 471946, "epoch": 5686} {"train_loss": -26.650182723999023, "global_step": 471947, "epoch": 5686} {"train_loss": -26.680221557617188, "global_step": 471948, "epoch": 5686} {"train_loss": -26.738996505737305, "global_step": 471949, "epoch": 5686} {"train_loss": -26.701446533203125, "global_step": 471950, "epoch": 5686} {"train_loss": -26.58725357055664, "global_step": 471951, "epoch": 5686} {"train_loss": -26.90378189086914, "global_step": 471952, "epoch": 5686} {"train_loss": -27.17945671081543, "global_step": 471953, "epoch": 5686} {"train_loss": -26.61237907409668, "global_step": 471954, "epoch": 5686} {"train_loss": -27.0419864654541, "global_step": 471955, "epoch": 5686} {"train_loss": -26.7270450592041, "global_step": 471956, "epoch": 5686} {"train_loss": -26.568603515625, "global_step": 471957, "epoch": 5686} {"train_loss": -27.030363082885742, "global_step": 471958, "epoch": 5686} {"train_loss": -26.97612953186035, "global_step": 471959, "epoch": 5686} {"train_loss": -26.983997344970703, "global_step": 471960, "epoch": 5686} {"train_loss": -26.93796157836914, "global_step": 471961, "epoch": 5686} {"train_loss": -26.807065963745117, "global_step": 471962, "epoch": 5686} {"train_loss": -26.633777618408203, "global_step": 471963, "epoch": 5686} {"train_loss": -27.061996459960938, "global_step": 471964, "epoch": 5686} {"train_loss": -26.93450355529785, "global_step": 471965, "epoch": 5686} {"train_loss": -27.062713623046875, "global_step": 471966, "epoch": 5686} {"train_loss": -26.905384063720703, "global_step": 471967, "epoch": 5686} {"train_loss": -26.997207641601562, "global_step": 471968, "epoch": 5686} {"train_loss": -27.422943115234375, "global_step": 471969, "epoch": 5686} {"train_loss": -27.64670753479004, "global_step": 471970, "epoch": 5686} {"train_loss": -26.895156860351562, "global_step": 471971, "epoch": 5686} {"train_loss": -27.23908805847168, "global_step": 471972, "epoch": 5686} {"train_loss": -27.156452178955078, "global_step": 471973, "epoch": 5686} {"train_loss": -27.56207847595215, "global_step": 471974, "epoch": 5686} {"train_loss": -27.70041847229004, "global_step": 471975, "epoch": 5686} {"train_loss": -27.25241470336914, "global_step": 471976, "epoch": 5686} {"train_loss": -27.044498443603516, "global_step": 471977, "epoch": 5686} {"train_loss": -27.250762939453125, "global_step": 471978, "epoch": 5686} {"train_loss": -27.4068546295166, "global_step": 471979, "epoch": 5686} {"train_loss": -27.072092056274414, "global_step": 471980, "epoch": 5686} {"train_loss": -27.074722290039062, "global_step": 471981, "epoch": 5686} {"train_loss": -26.898406982421875, "global_step": 471982, "epoch": 5686} {"train_loss": -26.986188888549805, "global_step": 471983, "epoch": 5686} {"train_loss": -27.399335861206055, "global_step": 471984, "epoch": 5686} {"train_loss": -27.15888023376465, "global_step": 471985, "epoch": 5686} {"train_loss": -27.333280563354492, "global_step": 471986, "epoch": 5686} {"train_loss": -27.40107536315918, "global_step": 471987, "epoch": 5686} {"train_loss": -27.108428955078125, "global_step": 471988, "epoch": 5686} {"train_loss": -27.468463897705078, "global_step": 471989, "epoch": 5686} {"train_loss": -27.3553466796875, "global_step": 471990, "epoch": 5686} {"train_loss": -27.629108428955078, "global_step": 471991, "epoch": 5686} {"train_loss": -27.32846450805664, "global_step": 471992, "epoch": 5686} {"train_loss": -27.2010555267334, "global_step": 471993, "epoch": 5686} {"train_loss": -27.4593448638916, "global_step": 471994, "epoch": 5686} {"train_loss": -27.36069107055664, "global_step": 471995, "epoch": 5686} {"train_loss": -27.396371841430664, "global_step": 471996, "epoch": 5686} {"train_loss": -27.54401206970215, "global_step": 471997, "epoch": 5686} {"train_loss": -27.428678512573242, "global_step": 471998, "epoch": 5686} {"train_loss": -27.709247589111328, "global_step": 471999, "epoch": 5686} {"train_loss": -27.002805709838867, "global_step": 472000, "epoch": 5686} {"train_loss": -27.36305046081543, "global_step": 472001, "epoch": 5686} {"train_loss": -27.536970138549805, "global_step": 472002, "epoch": 5686} {"train_loss": -27.367029190063477, "global_step": 472003, "epoch": 5686} {"train_loss": -27.552234649658203, "global_step": 472004, "epoch": 5686} {"train_loss": -27.586416244506836, "global_step": 472005, "epoch": 5686} {"train_loss": -27.37334632873535, "global_step": 472006, "epoch": 5686} {"train_loss": -27.131088256835938, "global_step": 472007, "epoch": 5686} {"train_loss": -27.365589141845703, "global_step": 472008, "epoch": 5686} {"train_loss": -27.70783805847168, "global_step": 472009, "epoch": 5686} {"train_loss": -27.22983169555664, "global_step": 472010, "epoch": 5686} {"train_loss": -27.199594497680664, "global_step": 472011, "epoch": 5686} {"train_loss": -27.546716690063477, "global_step": 472012, "epoch": 5686} {"train_loss": -27.608325958251953, "global_step": 472013, "epoch": 5686} {"train_loss": -27.111860275268555, "global_step": 472014, "epoch": 5686} {"train_loss": -27.09431266784668, "global_step": 472015, "epoch": 5686} {"train_loss": -26.140981674194336, "global_step": 472016, "epoch": 5686} {"train_loss": -25.08985710144043, "global_step": 472017, "epoch": 5686} {"train_loss": -24.748310089111328, "global_step": 472018, "epoch": 5686} {"train_loss": -24.921302795410156, "global_step": 472019, "epoch": 5686} {"train_loss": -26.98421080715685, "global_step": 472020, "epoch": 5686, "val_loss": 6708384.5} {"train_loss": -24.48566246032715, "global_step": 472021, "epoch": 5687} {"train_loss": -21.282384872436523, "global_step": 472022, "epoch": 5687} {"train_loss": -26.628009796142578, "global_step": 472023, "epoch": 5687} {"train_loss": -23.192949295043945, "global_step": 472024, "epoch": 5687} {"train_loss": -26.131793975830078, "global_step": 472025, "epoch": 5687} {"train_loss": -24.182886123657227, "global_step": 472026, "epoch": 5687} {"train_loss": -25.81129264831543, "global_step": 472027, "epoch": 5687} {"train_loss": -26.43413734436035, "global_step": 472028, "epoch": 5687} {"train_loss": -25.235366821289062, "global_step": 472029, "epoch": 5687} {"train_loss": -25.779951095581055, "global_step": 472030, "epoch": 5687} {"train_loss": -25.954809188842773, "global_step": 472031, "epoch": 5687} {"train_loss": -26.06109046936035, "global_step": 472032, "epoch": 5687} {"train_loss": -26.035139083862305, "global_step": 472033, "epoch": 5687} {"train_loss": -25.399335861206055, "global_step": 472034, "epoch": 5687} {"train_loss": -26.20330810546875, "global_step": 472035, "epoch": 5687} {"train_loss": -26.17640495300293, "global_step": 472036, "epoch": 5687} {"train_loss": -25.973608016967773, "global_step": 472037, "epoch": 5687} {"train_loss": -26.352237701416016, "global_step": 472038, "epoch": 5687} {"train_loss": -26.40101432800293, "global_step": 472039, "epoch": 5687} {"train_loss": -26.261999130249023, "global_step": 472040, "epoch": 5687} {"train_loss": -26.28032875061035, "global_step": 472041, "epoch": 5687} {"train_loss": -25.91936683654785, "global_step": 472042, "epoch": 5687} {"train_loss": -26.205732345581055, "global_step": 472043, "epoch": 5687} {"train_loss": -26.354867935180664, "global_step": 472044, "epoch": 5687} {"train_loss": -26.391977310180664, "global_step": 472045, "epoch": 5687} {"train_loss": -26.47134780883789, "global_step": 472046, "epoch": 5687} {"train_loss": -26.634252548217773, "global_step": 472047, "epoch": 5687} {"train_loss": -26.810428619384766, "global_step": 472048, "epoch": 5687} {"train_loss": -26.57802391052246, "global_step": 472049, "epoch": 5687} {"train_loss": -26.52392578125, "global_step": 472050, "epoch": 5687} {"train_loss": -26.5919189453125, "global_step": 472051, "epoch": 5687} {"train_loss": -27.214391708374023, "global_step": 472052, "epoch": 5687} {"train_loss": -26.8781681060791, "global_step": 472053, "epoch": 5687} {"train_loss": -26.88960075378418, "global_step": 472054, "epoch": 5687} {"train_loss": -26.733108520507812, "global_step": 472055, "epoch": 5687} {"train_loss": -26.777332305908203, "global_step": 472056, "epoch": 5687} {"train_loss": -26.694761276245117, "global_step": 472057, "epoch": 5687} {"train_loss": -26.623926162719727, "global_step": 472058, "epoch": 5687} {"train_loss": -26.95743179321289, "global_step": 472059, "epoch": 5687} {"train_loss": -26.968780517578125, "global_step": 472060, "epoch": 5687} {"train_loss": -26.666784286499023, "global_step": 472061, "epoch": 5687} {"train_loss": -26.606037139892578, "global_step": 472062, "epoch": 5687} {"train_loss": -26.83405876159668, "global_step": 472063, "epoch": 5687} {"train_loss": -26.787317276000977, "global_step": 472064, "epoch": 5687} {"train_loss": -26.85259437561035, "global_step": 472065, "epoch": 5687} {"train_loss": -27.334726333618164, "global_step": 472066, "epoch": 5687} {"train_loss": -27.132007598876953, "global_step": 472067, "epoch": 5687} {"train_loss": -27.277984619140625, "global_step": 472068, "epoch": 5687} {"train_loss": -26.88917350769043, "global_step": 472069, "epoch": 5687} {"train_loss": -27.420337677001953, "global_step": 472070, "epoch": 5687} {"train_loss": -27.3223876953125, "global_step": 472071, "epoch": 5687} {"train_loss": -27.198902130126953, "global_step": 472072, "epoch": 5687} {"train_loss": -27.269546508789062, "global_step": 472073, "epoch": 5687} {"train_loss": -26.935504913330078, "global_step": 472074, "epoch": 5687} {"train_loss": -27.43927574157715, "global_step": 472075, "epoch": 5687} {"train_loss": -26.5831356048584, "global_step": 472076, "epoch": 5687} {"train_loss": -27.3266658782959, "global_step": 472077, "epoch": 5687} {"train_loss": -26.859609603881836, "global_step": 472078, "epoch": 5687} {"train_loss": -27.27495765686035, "global_step": 472079, "epoch": 5687} {"train_loss": -27.18305015563965, "global_step": 472080, "epoch": 5687} {"train_loss": -26.947620391845703, "global_step": 472081, "epoch": 5687} {"train_loss": -27.160449981689453, "global_step": 472082, "epoch": 5687} {"train_loss": -27.11638832092285, "global_step": 472083, "epoch": 5687} {"train_loss": -27.40858268737793, "global_step": 472084, "epoch": 5687} {"train_loss": -27.375202178955078, "global_step": 472085, "epoch": 5687} {"train_loss": -26.69935417175293, "global_step": 472086, "epoch": 5687} {"train_loss": -27.2834529876709, "global_step": 472087, "epoch": 5687} {"train_loss": -27.599218368530273, "global_step": 472088, "epoch": 5687} {"train_loss": -26.987577438354492, "global_step": 472089, "epoch": 5687} {"train_loss": -26.6610050201416, "global_step": 472090, "epoch": 5687} {"train_loss": -26.97840690612793, "global_step": 472091, "epoch": 5687} {"train_loss": -27.490345001220703, "global_step": 472092, "epoch": 5687} {"train_loss": -26.837244033813477, "global_step": 472093, "epoch": 5687} {"train_loss": -26.688074111938477, "global_step": 472094, "epoch": 5687} {"train_loss": -27.01959228515625, "global_step": 472095, "epoch": 5687} {"train_loss": -26.813430786132812, "global_step": 472096, "epoch": 5687} {"train_loss": -26.82118034362793, "global_step": 472097, "epoch": 5687} {"train_loss": -27.131656646728516, "global_step": 472098, "epoch": 5687} {"train_loss": -26.524707794189453, "global_step": 472099, "epoch": 5687} {"train_loss": -26.86800193786621, "global_step": 472100, "epoch": 5687} {"train_loss": -27.364179611206055, "global_step": 472101, "epoch": 5687} {"train_loss": -27.207555770874023, "global_step": 472102, "epoch": 5687} {"train_loss": -26.5948125310691, "global_step": 472103, "epoch": 5687, "val_loss": 6632737.0} {"train_loss": -24.72161102294922, "global_step": 472104, "epoch": 5688} {"train_loss": -27.000152587890625, "global_step": 472105, "epoch": 5688} {"train_loss": -24.917570114135742, "global_step": 472106, "epoch": 5688} {"train_loss": -26.114810943603516, "global_step": 472107, "epoch": 5688} {"train_loss": -25.390867233276367, "global_step": 472108, "epoch": 5688} {"train_loss": -26.025318145751953, "global_step": 472109, "epoch": 5688} {"train_loss": -26.234060287475586, "global_step": 472110, "epoch": 5688} {"train_loss": -25.959131240844727, "global_step": 472111, "epoch": 5688} {"train_loss": -26.24677848815918, "global_step": 472112, "epoch": 5688} {"train_loss": -26.69144630432129, "global_step": 472113, "epoch": 5688} {"train_loss": -26.4857234954834, "global_step": 472114, "epoch": 5688} {"train_loss": -26.406652450561523, "global_step": 472115, "epoch": 5688} {"train_loss": -26.29168701171875, "global_step": 472116, "epoch": 5688} {"train_loss": -26.84943962097168, "global_step": 472117, "epoch": 5688} {"train_loss": -26.773792266845703, "global_step": 472118, "epoch": 5688} {"train_loss": -26.50510025024414, "global_step": 472119, "epoch": 5688} {"train_loss": -26.896026611328125, "global_step": 472120, "epoch": 5688} {"train_loss": -26.958547592163086, "global_step": 472121, "epoch": 5688} {"train_loss": -26.58392333984375, "global_step": 472122, "epoch": 5688} {"train_loss": -26.9280948638916, "global_step": 472123, "epoch": 5688} {"train_loss": -26.935083389282227, "global_step": 472124, "epoch": 5688} {"train_loss": -26.446420669555664, "global_step": 472125, "epoch": 5688} {"train_loss": -26.765592575073242, "global_step": 472126, "epoch": 5688} {"train_loss": -26.862653732299805, "global_step": 472127, "epoch": 5688} {"train_loss": -27.06007194519043, "global_step": 472128, "epoch": 5688} {"train_loss": -26.87583351135254, "global_step": 472129, "epoch": 5688} {"train_loss": -27.098203659057617, "global_step": 472130, "epoch": 5688} {"train_loss": -27.148406982421875, "global_step": 472131, "epoch": 5688} {"train_loss": -26.88056755065918, "global_step": 472132, "epoch": 5688} {"train_loss": -27.4272403717041, "global_step": 472133, "epoch": 5688} {"train_loss": -26.956995010375977, "global_step": 472134, "epoch": 5688} {"train_loss": -27.009490966796875, "global_step": 472135, "epoch": 5688} {"train_loss": -26.806928634643555, "global_step": 472136, "epoch": 5688} {"train_loss": -27.128507614135742, "global_step": 472137, "epoch": 5688} {"train_loss": -26.986927032470703, "global_step": 472138, "epoch": 5688} {"train_loss": -27.381921768188477, "global_step": 472139, "epoch": 5688} {"train_loss": -27.33978843688965, "global_step": 472140, "epoch": 5688} {"train_loss": -26.99152946472168, "global_step": 472141, "epoch": 5688} {"train_loss": -27.40277671813965, "global_step": 472142, "epoch": 5688} {"train_loss": -27.045270919799805, "global_step": 472143, "epoch": 5688} {"train_loss": -27.14656639099121, "global_step": 472144, "epoch": 5688} {"train_loss": -27.099700927734375, "global_step": 472145, "epoch": 5688} {"train_loss": -27.292173385620117, "global_step": 472146, "epoch": 5688} {"train_loss": -26.832616806030273, "global_step": 472147, "epoch": 5688} {"train_loss": -27.46687889099121, "global_step": 472148, "epoch": 5688} {"train_loss": -26.944046020507812, "global_step": 472149, "epoch": 5688} {"train_loss": -27.226484298706055, "global_step": 472150, "epoch": 5688} {"train_loss": -27.297107696533203, "global_step": 472151, "epoch": 5688} {"train_loss": -27.292404174804688, "global_step": 472152, "epoch": 5688} {"train_loss": -27.213964462280273, "global_step": 472153, "epoch": 5688} {"train_loss": -27.409622192382812, "global_step": 472154, "epoch": 5688} {"train_loss": -27.332651138305664, "global_step": 472155, "epoch": 5688} {"train_loss": -27.6114559173584, "global_step": 472156, "epoch": 5688} {"train_loss": -27.203094482421875, "global_step": 472157, "epoch": 5688} {"train_loss": -27.151264190673828, "global_step": 472158, "epoch": 5688} {"train_loss": -27.354516983032227, "global_step": 472159, "epoch": 5688} {"train_loss": -27.254230499267578, "global_step": 472160, "epoch": 5688} {"train_loss": -27.396955490112305, "global_step": 472161, "epoch": 5688} {"train_loss": -26.985015869140625, "global_step": 472162, "epoch": 5688} {"train_loss": -27.379621505737305, "global_step": 472163, "epoch": 5688} {"train_loss": -27.101560592651367, "global_step": 472164, "epoch": 5688} {"train_loss": -27.165130615234375, "global_step": 472165, "epoch": 5688} {"train_loss": -26.95041275024414, "global_step": 472166, "epoch": 5688} {"train_loss": -27.217090606689453, "global_step": 472167, "epoch": 5688} {"train_loss": -27.36285400390625, "global_step": 472168, "epoch": 5688} {"train_loss": -27.343524932861328, "global_step": 472169, "epoch": 5688} {"train_loss": -27.1846866607666, "global_step": 472170, "epoch": 5688} {"train_loss": -27.164966583251953, "global_step": 472171, "epoch": 5688} {"train_loss": -27.459400177001953, "global_step": 472172, "epoch": 5688} {"train_loss": -27.3526668548584, "global_step": 472173, "epoch": 5688} {"train_loss": -27.19921875, "global_step": 472174, "epoch": 5688} {"train_loss": -26.7381591796875, "global_step": 472175, "epoch": 5688} {"train_loss": -27.169605255126953, "global_step": 472176, "epoch": 5688} {"train_loss": -27.19597816467285, "global_step": 472177, "epoch": 5688} {"train_loss": -27.337081909179688, "global_step": 472178, "epoch": 5688} {"train_loss": -27.235626220703125, "global_step": 472179, "epoch": 5688} {"train_loss": -27.17732048034668, "global_step": 472180, "epoch": 5688} {"train_loss": -27.335779190063477, "global_step": 472181, "epoch": 5688} {"train_loss": -27.28005027770996, "global_step": 472182, "epoch": 5688} {"train_loss": -27.3714656829834, "global_step": 472183, "epoch": 5688} {"train_loss": -27.245336532592773, "global_step": 472184, "epoch": 5688} {"train_loss": -27.304279327392578, "global_step": 472185, "epoch": 5688} {"train_loss": -26.975340923631048, "global_step": 472186, "epoch": 5688, "val_loss": 6544631.5} {"train_loss": -27.081796646118164, "global_step": 472187, "epoch": 5689} {"train_loss": -26.92890739440918, "global_step": 472188, "epoch": 5689} {"train_loss": -27.314558029174805, "global_step": 472189, "epoch": 5689} {"train_loss": -27.228229522705078, "global_step": 472190, "epoch": 5689} {"train_loss": -27.08637046813965, "global_step": 472191, "epoch": 5689} {"train_loss": -27.18242835998535, "global_step": 472192, "epoch": 5689} {"train_loss": -27.183731079101562, "global_step": 472193, "epoch": 5689} {"train_loss": -27.458881378173828, "global_step": 472194, "epoch": 5689} {"train_loss": -27.27046012878418, "global_step": 472195, "epoch": 5689} {"train_loss": -27.584213256835938, "global_step": 472196, "epoch": 5689} {"train_loss": -27.22879981994629, "global_step": 472197, "epoch": 5689} {"train_loss": -27.277374267578125, "global_step": 472198, "epoch": 5689} {"train_loss": -27.22694206237793, "global_step": 472199, "epoch": 5689} {"train_loss": -27.115930557250977, "global_step": 472200, "epoch": 5689} {"train_loss": -27.232385635375977, "global_step": 472201, "epoch": 5689} {"train_loss": -27.13173484802246, "global_step": 472202, "epoch": 5689} {"train_loss": -26.951873779296875, "global_step": 472203, "epoch": 5689} {"train_loss": -27.27642822265625, "global_step": 472204, "epoch": 5689} {"train_loss": -27.123050689697266, "global_step": 472205, "epoch": 5689} {"train_loss": -26.55225944519043, "global_step": 472206, "epoch": 5689} {"train_loss": -27.063446044921875, "global_step": 472207, "epoch": 5689} {"train_loss": -27.220312118530273, "global_step": 472208, "epoch": 5689} {"train_loss": -27.066822052001953, "global_step": 472209, "epoch": 5689} {"train_loss": -27.349552154541016, "global_step": 472210, "epoch": 5689} {"train_loss": -27.086572647094727, "global_step": 472211, "epoch": 5689} {"train_loss": -27.304977416992188, "global_step": 472212, "epoch": 5689} {"train_loss": -27.58136558532715, "global_step": 472213, "epoch": 5689} {"train_loss": -27.683837890625, "global_step": 472214, "epoch": 5689} {"train_loss": -27.620574951171875, "global_step": 472215, "epoch": 5689} {"train_loss": -27.159265518188477, "global_step": 472216, "epoch": 5689} {"train_loss": -27.439538955688477, "global_step": 472217, "epoch": 5689} {"train_loss": -27.199674606323242, "global_step": 472218, "epoch": 5689} {"train_loss": -27.294843673706055, "global_step": 472219, "epoch": 5689} {"train_loss": -27.25105094909668, "global_step": 472220, "epoch": 5689} {"train_loss": -27.083948135375977, "global_step": 472221, "epoch": 5689} {"train_loss": -27.3486328125, "global_step": 472222, "epoch": 5689} {"train_loss": -27.276777267456055, "global_step": 472223, "epoch": 5689} {"train_loss": -27.562238693237305, "global_step": 472224, "epoch": 5689} {"train_loss": -27.325092315673828, "global_step": 472225, "epoch": 5689} {"train_loss": -27.269031524658203, "global_step": 472226, "epoch": 5689} {"train_loss": -27.1127872467041, "global_step": 472227, "epoch": 5689} {"train_loss": -27.20599937438965, "global_step": 472228, "epoch": 5689} {"train_loss": -27.56160545349121, "global_step": 472229, "epoch": 5689} {"train_loss": -26.952070236206055, "global_step": 472230, "epoch": 5689} {"train_loss": -27.02229881286621, "global_step": 472231, "epoch": 5689} {"train_loss": -27.095483779907227, "global_step": 472232, "epoch": 5689} {"train_loss": -27.4708309173584, "global_step": 472233, "epoch": 5689} {"train_loss": -27.58649253845215, "global_step": 472234, "epoch": 5689} {"train_loss": -26.947500228881836, "global_step": 472235, "epoch": 5689} {"train_loss": -26.90155601501465, "global_step": 472236, "epoch": 5689} {"train_loss": -27.486963272094727, "global_step": 472237, "epoch": 5689} {"train_loss": -27.487829208374023, "global_step": 472238, "epoch": 5689} {"train_loss": -27.439605712890625, "global_step": 472239, "epoch": 5689} {"train_loss": -27.012866973876953, "global_step": 472240, "epoch": 5689} {"train_loss": -26.732669830322266, "global_step": 472241, "epoch": 5689} {"train_loss": -26.887069702148438, "global_step": 472242, "epoch": 5689} {"train_loss": -27.147855758666992, "global_step": 472243, "epoch": 5689} {"train_loss": -27.257415771484375, "global_step": 472244, "epoch": 5689} {"train_loss": -27.024383544921875, "global_step": 472245, "epoch": 5689} {"train_loss": -27.560394287109375, "global_step": 472246, "epoch": 5689} {"train_loss": -26.8843936920166, "global_step": 472247, "epoch": 5689} {"train_loss": -27.509443283081055, "global_step": 472248, "epoch": 5689} {"train_loss": -26.953571319580078, "global_step": 472249, "epoch": 5689} {"train_loss": -27.091007232666016, "global_step": 472250, "epoch": 5689} {"train_loss": -27.015905380249023, "global_step": 472251, "epoch": 5689} {"train_loss": -27.219928741455078, "global_step": 472252, "epoch": 5689} {"train_loss": -27.333322525024414, "global_step": 472253, "epoch": 5689} {"train_loss": -27.502166748046875, "global_step": 472254, "epoch": 5689} {"train_loss": -26.80916404724121, "global_step": 472255, "epoch": 5689} {"train_loss": -27.353330612182617, "global_step": 472256, "epoch": 5689} {"train_loss": -27.288671493530273, "global_step": 472257, "epoch": 5689} {"train_loss": -27.36896324157715, "global_step": 472258, "epoch": 5689} {"train_loss": -27.653512954711914, "global_step": 472259, "epoch": 5689} {"train_loss": -27.107013702392578, "global_step": 472260, "epoch": 5689} {"train_loss": -27.249731063842773, "global_step": 472261, "epoch": 5689} {"train_loss": -27.430891036987305, "global_step": 472262, "epoch": 5689} {"train_loss": -26.97100257873535, "global_step": 472263, "epoch": 5689} {"train_loss": -27.15180778503418, "global_step": 472264, "epoch": 5689} {"train_loss": -27.304718017578125, "global_step": 472265, "epoch": 5689} {"train_loss": -27.174341201782227, "global_step": 472266, "epoch": 5689} {"train_loss": -27.30779457092285, "global_step": 472267, "epoch": 5689} {"train_loss": -27.143756866455078, "global_step": 472268, "epoch": 5689} {"train_loss": -27.23361759875194, "global_step": 472269, "epoch": 5689, "val_loss": 6514511.0} {"train_loss": -26.63245964050293, "global_step": 472270, "epoch": 5690} {"train_loss": -26.308130264282227, "global_step": 472271, "epoch": 5690} {"train_loss": -26.963037490844727, "global_step": 472272, "epoch": 5690} {"train_loss": -27.090524673461914, "global_step": 472273, "epoch": 5690} {"train_loss": -26.888168334960938, "global_step": 472274, "epoch": 5690} {"train_loss": -26.79522132873535, "global_step": 472275, "epoch": 5690} {"train_loss": -26.824848175048828, "global_step": 472276, "epoch": 5690} {"train_loss": -27.203001022338867, "global_step": 472277, "epoch": 5690} {"train_loss": -26.765857696533203, "global_step": 472278, "epoch": 5690} {"train_loss": -26.46847915649414, "global_step": 472279, "epoch": 5690} {"train_loss": -27.228052139282227, "global_step": 472280, "epoch": 5690} {"train_loss": -27.333646774291992, "global_step": 472281, "epoch": 5690} {"train_loss": -27.047683715820312, "global_step": 472282, "epoch": 5690} {"train_loss": -27.25979995727539, "global_step": 472283, "epoch": 5690} {"train_loss": -27.006406784057617, "global_step": 472284, "epoch": 5690} {"train_loss": -27.058746337890625, "global_step": 472285, "epoch": 5690} {"train_loss": -26.64788818359375, "global_step": 472286, "epoch": 5690} {"train_loss": -27.221099853515625, "global_step": 472287, "epoch": 5690} {"train_loss": -27.37415885925293, "global_step": 472288, "epoch": 5690} {"train_loss": -27.365690231323242, "global_step": 472289, "epoch": 5690} {"train_loss": -27.129505157470703, "global_step": 472290, "epoch": 5690} {"train_loss": -27.0794620513916, "global_step": 472291, "epoch": 5690} {"train_loss": -27.31952476501465, "global_step": 472292, "epoch": 5690} {"train_loss": -27.07195472717285, "global_step": 472293, "epoch": 5690} {"train_loss": -27.0555362701416, "global_step": 472294, "epoch": 5690} {"train_loss": -27.22673988342285, "global_step": 472295, "epoch": 5690} {"train_loss": -26.957233428955078, "global_step": 472296, "epoch": 5690} {"train_loss": -27.268207550048828, "global_step": 472297, "epoch": 5690} {"train_loss": -27.436878204345703, "global_step": 472298, "epoch": 5690} {"train_loss": -27.301258087158203, "global_step": 472299, "epoch": 5690} {"train_loss": -27.509916305541992, "global_step": 472300, "epoch": 5690} {"train_loss": -27.32427406311035, "global_step": 472301, "epoch": 5690} {"train_loss": -27.220319747924805, "global_step": 472302, "epoch": 5690} {"train_loss": -27.221603393554688, "global_step": 472303, "epoch": 5690} {"train_loss": -27.362897872924805, "global_step": 472304, "epoch": 5690} {"train_loss": -27.279043197631836, "global_step": 472305, "epoch": 5690} {"train_loss": -27.297277450561523, "global_step": 472306, "epoch": 5690} {"train_loss": -27.147485733032227, "global_step": 472307, "epoch": 5690} {"train_loss": -27.322906494140625, "global_step": 472308, "epoch": 5690} {"train_loss": -27.589908599853516, "global_step": 472309, "epoch": 5690} {"train_loss": -27.21439552307129, "global_step": 472310, "epoch": 5690} {"train_loss": -26.7949161529541, "global_step": 472311, "epoch": 5690} {"train_loss": -26.293027877807617, "global_step": 472312, "epoch": 5690} {"train_loss": -26.74405860900879, "global_step": 472313, "epoch": 5690} {"train_loss": -27.12994384765625, "global_step": 472314, "epoch": 5690} {"train_loss": -27.043127059936523, "global_step": 472315, "epoch": 5690} {"train_loss": -27.43147087097168, "global_step": 472316, "epoch": 5690} {"train_loss": -27.058019638061523, "global_step": 472317, "epoch": 5690} {"train_loss": -26.89893913269043, "global_step": 472318, "epoch": 5690} {"train_loss": -27.284875869750977, "global_step": 472319, "epoch": 5690} {"train_loss": -26.898950576782227, "global_step": 472320, "epoch": 5690} {"train_loss": -26.900487899780273, "global_step": 472321, "epoch": 5690} {"train_loss": -27.0451717376709, "global_step": 472322, "epoch": 5690} {"train_loss": -26.923925399780273, "global_step": 472323, "epoch": 5690} {"train_loss": -27.168079376220703, "global_step": 472324, "epoch": 5690} {"train_loss": -26.974979400634766, "global_step": 472325, "epoch": 5690} {"train_loss": -27.316272735595703, "global_step": 472326, "epoch": 5690} {"train_loss": -27.036884307861328, "global_step": 472327, "epoch": 5690} {"train_loss": -27.064504623413086, "global_step": 472328, "epoch": 5690} {"train_loss": -27.011754989624023, "global_step": 472329, "epoch": 5690} {"train_loss": -27.583715438842773, "global_step": 472330, "epoch": 5690} {"train_loss": -26.98328971862793, "global_step": 472331, "epoch": 5690} {"train_loss": -26.873449325561523, "global_step": 472332, "epoch": 5690} {"train_loss": -26.580127716064453, "global_step": 472333, "epoch": 5690} {"train_loss": -26.89314079284668, "global_step": 472334, "epoch": 5690} {"train_loss": -27.38265037536621, "global_step": 472335, "epoch": 5690} {"train_loss": -27.233869552612305, "global_step": 472336, "epoch": 5690} {"train_loss": -27.22981834411621, "global_step": 472337, "epoch": 5690} {"train_loss": -27.127206802368164, "global_step": 472338, "epoch": 5690} {"train_loss": -27.356298446655273, "global_step": 472339, "epoch": 5690} {"train_loss": -27.240680694580078, "global_step": 472340, "epoch": 5690} {"train_loss": -27.38250160217285, "global_step": 472341, "epoch": 5690} {"train_loss": -27.2096004486084, "global_step": 472342, "epoch": 5690} {"train_loss": -27.05592155456543, "global_step": 472343, "epoch": 5690} {"train_loss": -27.097034454345703, "global_step": 472344, "epoch": 5690} {"train_loss": -27.49452018737793, "global_step": 472345, "epoch": 5690} {"train_loss": -27.145999908447266, "global_step": 472346, "epoch": 5690} {"train_loss": -27.458892822265625, "global_step": 472347, "epoch": 5690} {"train_loss": -27.147104263305664, "global_step": 472348, "epoch": 5690} {"train_loss": -27.113468170166016, "global_step": 472349, "epoch": 5690} {"train_loss": -27.004669189453125, "global_step": 472350, "epoch": 5690} {"train_loss": -27.444122314453125, "global_step": 472351, "epoch": 5690} {"train_loss": -27.114983202463172, "global_step": 472352, "epoch": 5690, "val_loss": 6586968.0} {"train_loss": -26.4146728515625, "global_step": 472353, "epoch": 5691} {"train_loss": -26.167556762695312, "global_step": 472354, "epoch": 5691} {"train_loss": -26.637250900268555, "global_step": 472355, "epoch": 5691} {"train_loss": -26.308073043823242, "global_step": 472356, "epoch": 5691} {"train_loss": -26.559667587280273, "global_step": 472357, "epoch": 5691} {"train_loss": -26.873096466064453, "global_step": 472358, "epoch": 5691} {"train_loss": -26.637563705444336, "global_step": 472359, "epoch": 5691} {"train_loss": -26.66766357421875, "global_step": 472360, "epoch": 5691} {"train_loss": -26.498382568359375, "global_step": 472361, "epoch": 5691} {"train_loss": -26.84393310546875, "global_step": 472362, "epoch": 5691} {"train_loss": -27.15167236328125, "global_step": 472363, "epoch": 5691} {"train_loss": -26.504852294921875, "global_step": 472364, "epoch": 5691} {"train_loss": -26.91861915588379, "global_step": 472365, "epoch": 5691} {"train_loss": -26.518417358398438, "global_step": 472366, "epoch": 5691} {"train_loss": -27.350610733032227, "global_step": 472367, "epoch": 5691} {"train_loss": -27.09246826171875, "global_step": 472368, "epoch": 5691} {"train_loss": -26.945465087890625, "global_step": 472369, "epoch": 5691} {"train_loss": -26.591161727905273, "global_step": 472370, "epoch": 5691} {"train_loss": -26.83518409729004, "global_step": 472371, "epoch": 5691} {"train_loss": -27.096155166625977, "global_step": 472372, "epoch": 5691} {"train_loss": -26.9488525390625, "global_step": 472373, "epoch": 5691} {"train_loss": -27.125598907470703, "global_step": 472374, "epoch": 5691} {"train_loss": -27.008275985717773, "global_step": 472375, "epoch": 5691} {"train_loss": -26.78753089904785, "global_step": 472376, "epoch": 5691} {"train_loss": -27.160795211791992, "global_step": 472377, "epoch": 5691} {"train_loss": -27.086225509643555, "global_step": 472378, "epoch": 5691} {"train_loss": -27.263092041015625, "global_step": 472379, "epoch": 5691} {"train_loss": -27.063568115234375, "global_step": 472380, "epoch": 5691} {"train_loss": -27.221771240234375, "global_step": 472381, "epoch": 5691} {"train_loss": -27.13214683532715, "global_step": 472382, "epoch": 5691} {"train_loss": -27.206130981445312, "global_step": 472383, "epoch": 5691} {"train_loss": -27.02384376525879, "global_step": 472384, "epoch": 5691} {"train_loss": -27.23569679260254, "global_step": 472385, "epoch": 5691} {"train_loss": -27.013471603393555, "global_step": 472386, "epoch": 5691} {"train_loss": -27.11163330078125, "global_step": 472387, "epoch": 5691} {"train_loss": -26.983539581298828, "global_step": 472388, "epoch": 5691} {"train_loss": -27.427112579345703, "global_step": 472389, "epoch": 5691} {"train_loss": -26.951154708862305, "global_step": 472390, "epoch": 5691} {"train_loss": -27.371784210205078, "global_step": 472391, "epoch": 5691} {"train_loss": -27.5421085357666, "global_step": 472392, "epoch": 5691} {"train_loss": -27.260656356811523, "global_step": 472393, "epoch": 5691} {"train_loss": -27.228681564331055, "global_step": 472394, "epoch": 5691} {"train_loss": -27.2592716217041, "global_step": 472395, "epoch": 5691} {"train_loss": -27.2208309173584, "global_step": 472396, "epoch": 5691} {"train_loss": -27.254968643188477, "global_step": 472397, "epoch": 5691} {"train_loss": -27.202106475830078, "global_step": 472398, "epoch": 5691} {"train_loss": -27.29829978942871, "global_step": 472399, "epoch": 5691} {"train_loss": -27.414321899414062, "global_step": 472400, "epoch": 5691} {"train_loss": -27.166162490844727, "global_step": 472401, "epoch": 5691} {"train_loss": -27.160879135131836, "global_step": 472402, "epoch": 5691} {"train_loss": -26.81011962890625, "global_step": 472403, "epoch": 5691} {"train_loss": -27.325407028198242, "global_step": 472404, "epoch": 5691} {"train_loss": -27.3952693939209, "global_step": 472405, "epoch": 5691} {"train_loss": -26.804346084594727, "global_step": 472406, "epoch": 5691} {"train_loss": -27.682294845581055, "global_step": 472407, "epoch": 5691} {"train_loss": -27.171701431274414, "global_step": 472408, "epoch": 5691} {"train_loss": -27.530902862548828, "global_step": 472409, "epoch": 5691} {"train_loss": -27.515745162963867, "global_step": 472410, "epoch": 5691} {"train_loss": -27.67449951171875, "global_step": 472411, "epoch": 5691} {"train_loss": -27.065908432006836, "global_step": 472412, "epoch": 5691} {"train_loss": -27.014862060546875, "global_step": 472413, "epoch": 5691} {"train_loss": -27.100351333618164, "global_step": 472414, "epoch": 5691} {"train_loss": -26.9532527923584, "global_step": 472415, "epoch": 5691} {"train_loss": -27.014745712280273, "global_step": 472416, "epoch": 5691} {"train_loss": -27.008398056030273, "global_step": 472417, "epoch": 5691} {"train_loss": -27.0430908203125, "global_step": 472418, "epoch": 5691} {"train_loss": -27.311649322509766, "global_step": 472419, "epoch": 5691} {"train_loss": -27.183639526367188, "global_step": 472420, "epoch": 5691} {"train_loss": -27.100488662719727, "global_step": 472421, "epoch": 5691} {"train_loss": -27.005817413330078, "global_step": 472422, "epoch": 5691} {"train_loss": -27.229785919189453, "global_step": 472423, "epoch": 5691} {"train_loss": -27.3583927154541, "global_step": 472424, "epoch": 5691} {"train_loss": -27.444202423095703, "global_step": 472425, "epoch": 5691} {"train_loss": -27.245532989501953, "global_step": 472426, "epoch": 5691} {"train_loss": -27.460412979125977, "global_step": 472427, "epoch": 5691} {"train_loss": -27.313180923461914, "global_step": 472428, "epoch": 5691} {"train_loss": -27.3049259185791, "global_step": 472429, "epoch": 5691} {"train_loss": -27.330724716186523, "global_step": 472430, "epoch": 5691} {"train_loss": -27.369184494018555, "global_step": 472431, "epoch": 5691} {"train_loss": -26.951574325561523, "global_step": 472432, "epoch": 5691} {"train_loss": -27.09718132019043, "global_step": 472433, "epoch": 5691} {"train_loss": -27.05706787109375, "global_step": 472434, "epoch": 5691} {"train_loss": -27.07900274805276, "global_step": 472435, "epoch": 5691, "val_loss": 6507378.0} {"train_loss": -26.59978675842285, "global_step": 472436, "epoch": 5692} {"train_loss": -25.537973403930664, "global_step": 472437, "epoch": 5692} {"train_loss": -26.465688705444336, "global_step": 472438, "epoch": 5692} {"train_loss": -26.2192440032959, "global_step": 472439, "epoch": 5692} {"train_loss": -26.530668258666992, "global_step": 472440, "epoch": 5692} {"train_loss": -26.689716339111328, "global_step": 472441, "epoch": 5692} {"train_loss": -26.430255889892578, "global_step": 472442, "epoch": 5692} {"train_loss": -26.943212509155273, "global_step": 472443, "epoch": 5692} {"train_loss": -26.424936294555664, "global_step": 472444, "epoch": 5692} {"train_loss": -26.494293212890625, "global_step": 472445, "epoch": 5692} {"train_loss": -26.71158790588379, "global_step": 472446, "epoch": 5692} {"train_loss": -26.754383087158203, "global_step": 472447, "epoch": 5692} {"train_loss": -26.82716941833496, "global_step": 472448, "epoch": 5692} {"train_loss": -27.26120376586914, "global_step": 472449, "epoch": 5692} {"train_loss": -26.89398765563965, "global_step": 472450, "epoch": 5692} {"train_loss": -26.52473258972168, "global_step": 472451, "epoch": 5692} {"train_loss": -26.86372184753418, "global_step": 472452, "epoch": 5692} {"train_loss": -27.073593139648438, "global_step": 472453, "epoch": 5692} {"train_loss": -27.15643882751465, "global_step": 472454, "epoch": 5692} {"train_loss": -27.3962459564209, "global_step": 472455, "epoch": 5692} {"train_loss": -27.06121253967285, "global_step": 472456, "epoch": 5692} {"train_loss": -27.331701278686523, "global_step": 472457, "epoch": 5692} {"train_loss": -26.925642013549805, "global_step": 472458, "epoch": 5692} {"train_loss": -26.983396530151367, "global_step": 472459, "epoch": 5692} {"train_loss": -26.874414443969727, "global_step": 472460, "epoch": 5692} {"train_loss": -26.802661895751953, "global_step": 472461, "epoch": 5692} {"train_loss": -26.902435302734375, "global_step": 472462, "epoch": 5692} {"train_loss": -27.0028076171875, "global_step": 472463, "epoch": 5692} {"train_loss": -27.1691951751709, "global_step": 472464, "epoch": 5692} {"train_loss": -27.072851181030273, "global_step": 472465, "epoch": 5692} {"train_loss": -26.327817916870117, "global_step": 472466, "epoch": 5692} {"train_loss": -26.599096298217773, "global_step": 472467, "epoch": 5692} {"train_loss": -27.32732582092285, "global_step": 472468, "epoch": 5692} {"train_loss": -27.060033798217773, "global_step": 472469, "epoch": 5692} {"train_loss": -26.92637062072754, "global_step": 472470, "epoch": 5692} {"train_loss": -26.96173667907715, "global_step": 472471, "epoch": 5692} {"train_loss": -27.28824234008789, "global_step": 472472, "epoch": 5692} {"train_loss": -27.410938262939453, "global_step": 472473, "epoch": 5692} {"train_loss": -26.9273681640625, "global_step": 472474, "epoch": 5692} {"train_loss": -27.253681182861328, "global_step": 472475, "epoch": 5692} {"train_loss": -26.97265625, "global_step": 472476, "epoch": 5692} {"train_loss": -27.014387130737305, "global_step": 472477, "epoch": 5692} {"train_loss": -27.2226619720459, "global_step": 472478, "epoch": 5692} {"train_loss": -26.65447998046875, "global_step": 472479, "epoch": 5692} {"train_loss": -27.14324951171875, "global_step": 472480, "epoch": 5692} {"train_loss": -27.330154418945312, "global_step": 472481, "epoch": 5692} {"train_loss": -27.042463302612305, "global_step": 472482, "epoch": 5692} {"train_loss": -27.307113647460938, "global_step": 472483, "epoch": 5692} {"train_loss": -27.160680770874023, "global_step": 472484, "epoch": 5692} {"train_loss": -27.466903686523438, "global_step": 472485, "epoch": 5692} {"train_loss": -27.06879234313965, "global_step": 472486, "epoch": 5692} {"train_loss": -27.2132625579834, "global_step": 472487, "epoch": 5692} {"train_loss": -27.13227653503418, "global_step": 472488, "epoch": 5692} {"train_loss": -27.283008575439453, "global_step": 472489, "epoch": 5692} {"train_loss": -27.400299072265625, "global_step": 472490, "epoch": 5692} {"train_loss": -27.16034507751465, "global_step": 472491, "epoch": 5692} {"train_loss": -27.04743003845215, "global_step": 472492, "epoch": 5692} {"train_loss": -27.220121383666992, "global_step": 472493, "epoch": 5692} {"train_loss": -27.34064292907715, "global_step": 472494, "epoch": 5692} {"train_loss": -26.909704208374023, "global_step": 472495, "epoch": 5692} {"train_loss": -27.312002182006836, "global_step": 472496, "epoch": 5692} {"train_loss": -27.2584171295166, "global_step": 472497, "epoch": 5692} {"train_loss": -27.4888973236084, "global_step": 472498, "epoch": 5692} {"train_loss": -27.510467529296875, "global_step": 472499, "epoch": 5692} {"train_loss": -26.708913803100586, "global_step": 472500, "epoch": 5692} {"train_loss": -27.22346305847168, "global_step": 472501, "epoch": 5692} {"train_loss": -27.091785430908203, "global_step": 472502, "epoch": 5692} {"train_loss": -27.101703643798828, "global_step": 472503, "epoch": 5692} {"train_loss": -27.080961227416992, "global_step": 472504, "epoch": 5692} {"train_loss": -26.774946212768555, "global_step": 472505, "epoch": 5692} {"train_loss": -27.294464111328125, "global_step": 472506, "epoch": 5692} {"train_loss": -27.16578483581543, "global_step": 472507, "epoch": 5692} {"train_loss": -27.74907875061035, "global_step": 472508, "epoch": 5692} {"train_loss": -27.35255241394043, "global_step": 472509, "epoch": 5692} {"train_loss": -27.200220108032227, "global_step": 472510, "epoch": 5692} {"train_loss": -27.596582412719727, "global_step": 472511, "epoch": 5692} {"train_loss": -27.414813995361328, "global_step": 472512, "epoch": 5692} {"train_loss": -27.266571044921875, "global_step": 472513, "epoch": 5692} {"train_loss": -27.18819236755371, "global_step": 472514, "epoch": 5692} {"train_loss": -27.19573402404785, "global_step": 472515, "epoch": 5692} {"train_loss": -27.655414581298828, "global_step": 472516, "epoch": 5692} {"train_loss": -27.199377059936523, "global_step": 472517, "epoch": 5692} {"train_loss": -27.057696147137378, "global_step": 472518, "epoch": 5692, "val_loss": 6617295.5} {"train_loss": -26.67926025390625, "global_step": 472519, "epoch": 5693} {"train_loss": -27.07476234436035, "global_step": 472520, "epoch": 5693} {"train_loss": -26.636762619018555, "global_step": 472521, "epoch": 5693} {"train_loss": -26.708637237548828, "global_step": 472522, "epoch": 5693} {"train_loss": -26.60052490234375, "global_step": 472523, "epoch": 5693} {"train_loss": -26.871200561523438, "global_step": 472524, "epoch": 5693} {"train_loss": -26.661544799804688, "global_step": 472525, "epoch": 5693} {"train_loss": -26.490234375, "global_step": 472526, "epoch": 5693} {"train_loss": -26.67841911315918, "global_step": 472527, "epoch": 5693} {"train_loss": -27.08770179748535, "global_step": 472528, "epoch": 5693} {"train_loss": -26.53348731994629, "global_step": 472529, "epoch": 5693} {"train_loss": -27.23874282836914, "global_step": 472530, "epoch": 5693} {"train_loss": -26.919748306274414, "global_step": 472531, "epoch": 5693} {"train_loss": -27.115869522094727, "global_step": 472532, "epoch": 5693} {"train_loss": -26.91575050354004, "global_step": 472533, "epoch": 5693} {"train_loss": -27.082395553588867, "global_step": 472534, "epoch": 5693} {"train_loss": -27.126272201538086, "global_step": 472535, "epoch": 5693} {"train_loss": -26.63544273376465, "global_step": 472536, "epoch": 5693} {"train_loss": -27.15484046936035, "global_step": 472537, "epoch": 5693} {"train_loss": -26.96500015258789, "global_step": 472538, "epoch": 5693} {"train_loss": -27.3459415435791, "global_step": 472539, "epoch": 5693} {"train_loss": -26.86773109436035, "global_step": 472540, "epoch": 5693} {"train_loss": -26.98291015625, "global_step": 472541, "epoch": 5693} {"train_loss": -27.131378173828125, "global_step": 472542, "epoch": 5693} {"train_loss": -26.998764038085938, "global_step": 472543, "epoch": 5693} {"train_loss": -27.766754150390625, "global_step": 472544, "epoch": 5693} {"train_loss": -27.152511596679688, "global_step": 472545, "epoch": 5693} {"train_loss": -27.05499267578125, "global_step": 472546, "epoch": 5693} {"train_loss": -27.06830406188965, "global_step": 472547, "epoch": 5693} {"train_loss": -27.490798950195312, "global_step": 472548, "epoch": 5693} {"train_loss": -26.747211456298828, "global_step": 472549, "epoch": 5693} {"train_loss": -27.1253719329834, "global_step": 472550, "epoch": 5693} {"train_loss": -27.063501358032227, "global_step": 472551, "epoch": 5693} {"train_loss": -27.249319076538086, "global_step": 472552, "epoch": 5693} {"train_loss": -27.070770263671875, "global_step": 472553, "epoch": 5693} {"train_loss": -27.296728134155273, "global_step": 472554, "epoch": 5693} {"train_loss": -27.31575584411621, "global_step": 472555, "epoch": 5693} {"train_loss": -27.00360107421875, "global_step": 472556, "epoch": 5693} {"train_loss": -27.125293731689453, "global_step": 472557, "epoch": 5693} {"train_loss": -27.144617080688477, "global_step": 472558, "epoch": 5693} {"train_loss": -27.4050235748291, "global_step": 472559, "epoch": 5693} {"train_loss": -27.302534103393555, "global_step": 472560, "epoch": 5693} {"train_loss": -26.928796768188477, "global_step": 472561, "epoch": 5693} {"train_loss": -27.145233154296875, "global_step": 472562, "epoch": 5693} {"train_loss": -26.894262313842773, "global_step": 472563, "epoch": 5693} {"train_loss": -27.12554359436035, "global_step": 472564, "epoch": 5693} {"train_loss": -27.319494247436523, "global_step": 472565, "epoch": 5693} {"train_loss": -26.818832397460938, "global_step": 472566, "epoch": 5693} {"train_loss": -27.017948150634766, "global_step": 472567, "epoch": 5693} {"train_loss": -27.45517349243164, "global_step": 472568, "epoch": 5693} {"train_loss": -27.1097354888916, "global_step": 472569, "epoch": 5693} {"train_loss": -26.7661190032959, "global_step": 472570, "epoch": 5693} {"train_loss": -27.026391983032227, "global_step": 472571, "epoch": 5693} {"train_loss": -27.3831844329834, "global_step": 472572, "epoch": 5693} {"train_loss": -26.9495849609375, "global_step": 472573, "epoch": 5693} {"train_loss": -27.52717399597168, "global_step": 472574, "epoch": 5693} {"train_loss": -27.017608642578125, "global_step": 472575, "epoch": 5693} {"train_loss": -27.742202758789062, "global_step": 472576, "epoch": 5693} {"train_loss": -27.31818199157715, "global_step": 472577, "epoch": 5693} {"train_loss": -27.165145874023438, "global_step": 472578, "epoch": 5693} {"train_loss": -27.34575843811035, "global_step": 472579, "epoch": 5693} {"train_loss": -27.467151641845703, "global_step": 472580, "epoch": 5693} {"train_loss": -27.374494552612305, "global_step": 472581, "epoch": 5693} {"train_loss": -27.303625106811523, "global_step": 472582, "epoch": 5693} {"train_loss": -26.874286651611328, "global_step": 472583, "epoch": 5693} {"train_loss": -27.143407821655273, "global_step": 472584, "epoch": 5693} {"train_loss": -26.986255645751953, "global_step": 472585, "epoch": 5693} {"train_loss": -26.508020401000977, "global_step": 472586, "epoch": 5693} {"train_loss": -26.56915855407715, "global_step": 472587, "epoch": 5693} {"train_loss": -26.96243667602539, "global_step": 472588, "epoch": 5693} {"train_loss": -27.258695602416992, "global_step": 472589, "epoch": 5693} {"train_loss": -27.200414657592773, "global_step": 472590, "epoch": 5693} {"train_loss": -26.785327911376953, "global_step": 472591, "epoch": 5693} {"train_loss": -27.330463409423828, "global_step": 472592, "epoch": 5693} {"train_loss": -26.94843101501465, "global_step": 472593, "epoch": 5693} {"train_loss": -27.192930221557617, "global_step": 472594, "epoch": 5693} {"train_loss": -26.928625106811523, "global_step": 472595, "epoch": 5693} {"train_loss": -26.9123477935791, "global_step": 472596, "epoch": 5693} {"train_loss": -27.24762535095215, "global_step": 472597, "epoch": 5693} {"train_loss": -27.067569732666016, "global_step": 472598, "epoch": 5693} {"train_loss": -27.283899307250977, "global_step": 472599, "epoch": 5693} {"train_loss": -27.088623046875, "global_step": 472600, "epoch": 5693} {"train_loss": -27.051558873739587, "global_step": 472601, "epoch": 5693, "val_loss": 6558263.0} {"train_loss": -27.0737361907959, "global_step": 472602, "epoch": 5694} {"train_loss": -25.92584800720215, "global_step": 472603, "epoch": 5694} {"train_loss": -26.459272384643555, "global_step": 472604, "epoch": 5694} {"train_loss": -25.78082275390625, "global_step": 472605, "epoch": 5694} {"train_loss": -26.021747589111328, "global_step": 472606, "epoch": 5694} {"train_loss": -26.340848922729492, "global_step": 472607, "epoch": 5694} {"train_loss": -25.853830337524414, "global_step": 472608, "epoch": 5694} {"train_loss": -26.809375762939453, "global_step": 472609, "epoch": 5694} {"train_loss": -26.316991806030273, "global_step": 472610, "epoch": 5694} {"train_loss": -26.596017837524414, "global_step": 472611, "epoch": 5694} {"train_loss": -26.189868927001953, "global_step": 472612, "epoch": 5694} {"train_loss": -26.387954711914062, "global_step": 472613, "epoch": 5694} {"train_loss": -26.66652488708496, "global_step": 472614, "epoch": 5694} {"train_loss": -26.6878719329834, "global_step": 472615, "epoch": 5694} {"train_loss": -26.659582138061523, "global_step": 472616, "epoch": 5694} {"train_loss": -26.87591552734375, "global_step": 472617, "epoch": 5694} {"train_loss": -26.974340438842773, "global_step": 472618, "epoch": 5694} {"train_loss": -27.068517684936523, "global_step": 472619, "epoch": 5694} {"train_loss": -26.85391616821289, "global_step": 472620, "epoch": 5694} {"train_loss": -26.889734268188477, "global_step": 472621, "epoch": 5694} {"train_loss": -26.90888786315918, "global_step": 472622, "epoch": 5694} {"train_loss": -26.96335792541504, "global_step": 472623, "epoch": 5694} {"train_loss": -27.061100006103516, "global_step": 472624, "epoch": 5694} {"train_loss": -27.21323013305664, "global_step": 472625, "epoch": 5694} {"train_loss": -27.34229850769043, "global_step": 472626, "epoch": 5694} {"train_loss": -27.41064453125, "global_step": 472627, "epoch": 5694} {"train_loss": -27.198150634765625, "global_step": 472628, "epoch": 5694} {"train_loss": -27.267566680908203, "global_step": 472629, "epoch": 5694} {"train_loss": -27.1295166015625, "global_step": 472630, "epoch": 5694} {"train_loss": -27.34563636779785, "global_step": 472631, "epoch": 5694} {"train_loss": -27.2177734375, "global_step": 472632, "epoch": 5694} {"train_loss": -27.27253532409668, "global_step": 472633, "epoch": 5694} {"train_loss": -27.3138427734375, "global_step": 472634, "epoch": 5694} {"train_loss": -27.214492797851562, "global_step": 472635, "epoch": 5694} {"train_loss": -26.85428810119629, "global_step": 472636, "epoch": 5694} {"train_loss": -27.1558780670166, "global_step": 472637, "epoch": 5694} {"train_loss": -27.056503295898438, "global_step": 472638, "epoch": 5694} {"train_loss": -27.459060668945312, "global_step": 472639, "epoch": 5694} {"train_loss": -27.01387596130371, "global_step": 472640, "epoch": 5694} {"train_loss": -27.41337013244629, "global_step": 472641, "epoch": 5694} {"train_loss": -27.579864501953125, "global_step": 472642, "epoch": 5694} {"train_loss": -27.097639083862305, "global_step": 472643, "epoch": 5694} {"train_loss": -27.5383358001709, "global_step": 472644, "epoch": 5694} {"train_loss": -27.3392276763916, "global_step": 472645, "epoch": 5694} {"train_loss": -27.54194450378418, "global_step": 472646, "epoch": 5694} {"train_loss": -27.162078857421875, "global_step": 472647, "epoch": 5694} {"train_loss": -27.340240478515625, "global_step": 472648, "epoch": 5694} {"train_loss": -26.96148109436035, "global_step": 472649, "epoch": 5694} {"train_loss": -27.204267501831055, "global_step": 472650, "epoch": 5694} {"train_loss": -27.35542869567871, "global_step": 472651, "epoch": 5694} {"train_loss": -27.21543312072754, "global_step": 472652, "epoch": 5694} {"train_loss": -27.10646629333496, "global_step": 472653, "epoch": 5694} {"train_loss": -27.447011947631836, "global_step": 472654, "epoch": 5694} {"train_loss": -27.254926681518555, "global_step": 472655, "epoch": 5694} {"train_loss": -27.638647079467773, "global_step": 472656, "epoch": 5694} {"train_loss": -27.04793357849121, "global_step": 472657, "epoch": 5694} {"train_loss": -27.602447509765625, "global_step": 472658, "epoch": 5694} {"train_loss": -27.085712432861328, "global_step": 472659, "epoch": 5694} {"train_loss": -27.152698516845703, "global_step": 472660, "epoch": 5694} {"train_loss": -27.089847564697266, "global_step": 472661, "epoch": 5694} {"train_loss": -27.448883056640625, "global_step": 472662, "epoch": 5694} {"train_loss": -27.117902755737305, "global_step": 472663, "epoch": 5694} {"train_loss": -27.18808364868164, "global_step": 472664, "epoch": 5694} {"train_loss": -26.9721736907959, "global_step": 472665, "epoch": 5694} {"train_loss": -26.824111938476562, "global_step": 472666, "epoch": 5694} {"train_loss": -26.965463638305664, "global_step": 472667, "epoch": 5694} {"train_loss": -27.267425537109375, "global_step": 472668, "epoch": 5694} {"train_loss": -26.98750114440918, "global_step": 472669, "epoch": 5694} {"train_loss": -26.92244529724121, "global_step": 472670, "epoch": 5694} {"train_loss": -26.868871688842773, "global_step": 472671, "epoch": 5694} {"train_loss": -26.771100997924805, "global_step": 472672, "epoch": 5694} {"train_loss": -27.389301300048828, "global_step": 472673, "epoch": 5694} {"train_loss": -27.463394165039062, "global_step": 472674, "epoch": 5694} {"train_loss": -27.3704833984375, "global_step": 472675, "epoch": 5694} {"train_loss": -27.159826278686523, "global_step": 472676, "epoch": 5694} {"train_loss": -27.37208366394043, "global_step": 472677, "epoch": 5694} {"train_loss": -27.042261123657227, "global_step": 472678, "epoch": 5694} {"train_loss": -27.193267822265625, "global_step": 472679, "epoch": 5694} {"train_loss": -27.653493881225586, "global_step": 472680, "epoch": 5694} {"train_loss": -27.267993927001953, "global_step": 472681, "epoch": 5694} {"train_loss": -27.6827449798584, "global_step": 472682, "epoch": 5694} {"train_loss": -27.799612045288086, "global_step": 472683, "epoch": 5694} {"train_loss": -27.059936155755835, "global_step": 472684, "epoch": 5694, "val_loss": 6551812.5} {"train_loss": -27.145605087280273, "global_step": 472685, "epoch": 5695} {"train_loss": -27.03535270690918, "global_step": 472686, "epoch": 5695} {"train_loss": -27.202512741088867, "global_step": 472687, "epoch": 5695} {"train_loss": -27.381498336791992, "global_step": 472688, "epoch": 5695} {"train_loss": -26.687402725219727, "global_step": 472689, "epoch": 5695} {"train_loss": -26.8914852142334, "global_step": 472690, "epoch": 5695} {"train_loss": -27.198963165283203, "global_step": 472691, "epoch": 5695} {"train_loss": -27.11016845703125, "global_step": 472692, "epoch": 5695} {"train_loss": -27.429052352905273, "global_step": 472693, "epoch": 5695} {"train_loss": -27.37973403930664, "global_step": 472694, "epoch": 5695} {"train_loss": -26.625207901000977, "global_step": 472695, "epoch": 5695} {"train_loss": -26.895099639892578, "global_step": 472696, "epoch": 5695} {"train_loss": -26.946271896362305, "global_step": 472697, "epoch": 5695} {"train_loss": -27.04096794128418, "global_step": 472698, "epoch": 5695} {"train_loss": -26.033130645751953, "global_step": 472699, "epoch": 5695} {"train_loss": -25.464618682861328, "global_step": 472700, "epoch": 5695} {"train_loss": -26.67081642150879, "global_step": 472701, "epoch": 5695} {"train_loss": -26.961145401000977, "global_step": 472702, "epoch": 5695} {"train_loss": -26.458526611328125, "global_step": 472703, "epoch": 5695} {"train_loss": -26.675466537475586, "global_step": 472704, "epoch": 5695} {"train_loss": -26.7249755859375, "global_step": 472705, "epoch": 5695} {"train_loss": -26.95868492126465, "global_step": 472706, "epoch": 5695} {"train_loss": -27.225927352905273, "global_step": 472707, "epoch": 5695} {"train_loss": -26.847553253173828, "global_step": 472708, "epoch": 5695} {"train_loss": -26.846027374267578, "global_step": 472709, "epoch": 5695} {"train_loss": -26.65932273864746, "global_step": 472710, "epoch": 5695} {"train_loss": -27.108123779296875, "global_step": 472711, "epoch": 5695} {"train_loss": -27.282215118408203, "global_step": 472712, "epoch": 5695} {"train_loss": -27.365234375, "global_step": 472713, "epoch": 5695} {"train_loss": -27.1297607421875, "global_step": 472714, "epoch": 5695} {"train_loss": -27.492475509643555, "global_step": 472715, "epoch": 5695} {"train_loss": -26.999420166015625, "global_step": 472716, "epoch": 5695} {"train_loss": -27.35999870300293, "global_step": 472717, "epoch": 5695} {"train_loss": -27.021360397338867, "global_step": 472718, "epoch": 5695} {"train_loss": -26.972244262695312, "global_step": 472719, "epoch": 5695} {"train_loss": -27.254674911499023, "global_step": 472720, "epoch": 5695} {"train_loss": -27.1154842376709, "global_step": 472721, "epoch": 5695} {"train_loss": -27.6207332611084, "global_step": 472722, "epoch": 5695} {"train_loss": -27.201522827148438, "global_step": 472723, "epoch": 5695} {"train_loss": -27.181482315063477, "global_step": 472724, "epoch": 5695} {"train_loss": -27.62569236755371, "global_step": 472725, "epoch": 5695} {"train_loss": -27.026599884033203, "global_step": 472726, "epoch": 5695} {"train_loss": -27.22835350036621, "global_step": 472727, "epoch": 5695} {"train_loss": -27.29569435119629, "global_step": 472728, "epoch": 5695} {"train_loss": -27.191272735595703, "global_step": 472729, "epoch": 5695} {"train_loss": -27.41864013671875, "global_step": 472730, "epoch": 5695} {"train_loss": -27.527084350585938, "global_step": 472731, "epoch": 5695} {"train_loss": -27.187902450561523, "global_step": 472732, "epoch": 5695} {"train_loss": -27.613983154296875, "global_step": 472733, "epoch": 5695} {"train_loss": -27.536605834960938, "global_step": 472734, "epoch": 5695} {"train_loss": -27.214218139648438, "global_step": 472735, "epoch": 5695} {"train_loss": -27.385303497314453, "global_step": 472736, "epoch": 5695} {"train_loss": -27.336233139038086, "global_step": 472737, "epoch": 5695} {"train_loss": -27.06764793395996, "global_step": 472738, "epoch": 5695} {"train_loss": -27.377277374267578, "global_step": 472739, "epoch": 5695} {"train_loss": -27.1447811126709, "global_step": 472740, "epoch": 5695} {"train_loss": -27.361621856689453, "global_step": 472741, "epoch": 5695} {"train_loss": -27.549224853515625, "global_step": 472742, "epoch": 5695} {"train_loss": -27.576974868774414, "global_step": 472743, "epoch": 5695} {"train_loss": -27.307382583618164, "global_step": 472744, "epoch": 5695} {"train_loss": -27.303024291992188, "global_step": 472745, "epoch": 5695} {"train_loss": -27.346704483032227, "global_step": 472746, "epoch": 5695} {"train_loss": -27.1759090423584, "global_step": 472747, "epoch": 5695} {"train_loss": -27.39063835144043, "global_step": 472748, "epoch": 5695} {"train_loss": -27.6355037689209, "global_step": 472749, "epoch": 5695} {"train_loss": -27.449499130249023, "global_step": 472750, "epoch": 5695} {"train_loss": -27.124465942382812, "global_step": 472751, "epoch": 5695} {"train_loss": -27.299213409423828, "global_step": 472752, "epoch": 5695} {"train_loss": -27.183883666992188, "global_step": 472753, "epoch": 5695} {"train_loss": -27.3027400970459, "global_step": 472754, "epoch": 5695} {"train_loss": -27.28977394104004, "global_step": 472755, "epoch": 5695} {"train_loss": -27.55994987487793, "global_step": 472756, "epoch": 5695} {"train_loss": -27.45172119140625, "global_step": 472757, "epoch": 5695} {"train_loss": -27.275583267211914, "global_step": 472758, "epoch": 5695} {"train_loss": -27.156696319580078, "global_step": 472759, "epoch": 5695} {"train_loss": -27.424551010131836, "global_step": 472760, "epoch": 5695} {"train_loss": -27.35602378845215, "global_step": 472761, "epoch": 5695} {"train_loss": -27.187402725219727, "global_step": 472762, "epoch": 5695} {"train_loss": -27.39210319519043, "global_step": 472763, "epoch": 5695} {"train_loss": -27.3746337890625, "global_step": 472764, "epoch": 5695} {"train_loss": -27.434240341186523, "global_step": 472765, "epoch": 5695} {"train_loss": -26.922393798828125, "global_step": 472766, "epoch": 5695} {"train_loss": -27.16640585014619, "global_step": 472767, "epoch": 5695, "val_loss": 6632899.0} {"train_loss": -26.162342071533203, "global_step": 472768, "epoch": 5696} {"train_loss": -26.2180118560791, "global_step": 472769, "epoch": 5696} {"train_loss": -27.0477294921875, "global_step": 472770, "epoch": 5696} {"train_loss": -26.33868980407715, "global_step": 472771, "epoch": 5696} {"train_loss": -26.35663414001465, "global_step": 472772, "epoch": 5696} {"train_loss": -26.78162956237793, "global_step": 472773, "epoch": 5696} {"train_loss": -25.93470573425293, "global_step": 472774, "epoch": 5696} {"train_loss": -27.032581329345703, "global_step": 472775, "epoch": 5696} {"train_loss": -26.502012252807617, "global_step": 472776, "epoch": 5696} {"train_loss": -26.18446159362793, "global_step": 472777, "epoch": 5696} {"train_loss": -26.953699111938477, "global_step": 472778, "epoch": 5696} {"train_loss": -27.012609481811523, "global_step": 472779, "epoch": 5696} {"train_loss": -27.2324275970459, "global_step": 472780, "epoch": 5696} {"train_loss": -26.749618530273438, "global_step": 472781, "epoch": 5696} {"train_loss": -27.063220977783203, "global_step": 472782, "epoch": 5696} {"train_loss": -27.101896286010742, "global_step": 472783, "epoch": 5696} {"train_loss": -26.971393585205078, "global_step": 472784, "epoch": 5696} {"train_loss": -27.121652603149414, "global_step": 472785, "epoch": 5696} {"train_loss": -27.116113662719727, "global_step": 472786, "epoch": 5696} {"train_loss": -26.966272354125977, "global_step": 472787, "epoch": 5696} {"train_loss": -27.03775405883789, "global_step": 472788, "epoch": 5696} {"train_loss": -26.98921012878418, "global_step": 472789, "epoch": 5696} {"train_loss": -26.967960357666016, "global_step": 472790, "epoch": 5696} {"train_loss": -26.9261531829834, "global_step": 472791, "epoch": 5696} {"train_loss": -27.27191734313965, "global_step": 472792, "epoch": 5696} {"train_loss": -27.242313385009766, "global_step": 472793, "epoch": 5696} {"train_loss": -27.193435668945312, "global_step": 472794, "epoch": 5696} {"train_loss": -27.11627197265625, "global_step": 472795, "epoch": 5696} {"train_loss": -27.409643173217773, "global_step": 472796, "epoch": 5696} {"train_loss": -26.985034942626953, "global_step": 472797, "epoch": 5696} {"train_loss": -27.294286727905273, "global_step": 472798, "epoch": 5696} {"train_loss": -26.9948787689209, "global_step": 472799, "epoch": 5696} {"train_loss": -27.24106216430664, "global_step": 472800, "epoch": 5696} {"train_loss": -27.455535888671875, "global_step": 472801, "epoch": 5696} {"train_loss": -27.743545532226562, "global_step": 472802, "epoch": 5696} {"train_loss": -26.974767684936523, "global_step": 472803, "epoch": 5696} {"train_loss": -27.655902862548828, "global_step": 472804, "epoch": 5696} {"train_loss": -27.256132125854492, "global_step": 472805, "epoch": 5696} {"train_loss": -27.33466911315918, "global_step": 472806, "epoch": 5696} {"train_loss": -27.354782104492188, "global_step": 472807, "epoch": 5696} {"train_loss": -27.034467697143555, "global_step": 472808, "epoch": 5696} {"train_loss": -27.515640258789062, "global_step": 472809, "epoch": 5696} {"train_loss": -27.187585830688477, "global_step": 472810, "epoch": 5696} {"train_loss": -27.095062255859375, "global_step": 472811, "epoch": 5696} {"train_loss": -27.152795791625977, "global_step": 472812, "epoch": 5696} {"train_loss": -27.211872100830078, "global_step": 472813, "epoch": 5696} {"train_loss": -27.77717399597168, "global_step": 472814, "epoch": 5696} {"train_loss": -27.378875732421875, "global_step": 472815, "epoch": 5696} {"train_loss": -27.546966552734375, "global_step": 472816, "epoch": 5696} {"train_loss": -27.46222496032715, "global_step": 472817, "epoch": 5696} {"train_loss": -27.564023971557617, "global_step": 472818, "epoch": 5696} {"train_loss": -26.913986206054688, "global_step": 472819, "epoch": 5696} {"train_loss": -26.95771598815918, "global_step": 472820, "epoch": 5696} {"train_loss": -27.172948837280273, "global_step": 472821, "epoch": 5696} {"train_loss": -27.629566192626953, "global_step": 472822, "epoch": 5696} {"train_loss": -27.375446319580078, "global_step": 472823, "epoch": 5696} {"train_loss": -26.968664169311523, "global_step": 472824, "epoch": 5696} {"train_loss": -27.1984920501709, "global_step": 472825, "epoch": 5696} {"train_loss": -27.035856246948242, "global_step": 472826, "epoch": 5696} {"train_loss": -27.001941680908203, "global_step": 472827, "epoch": 5696} {"train_loss": -26.99073600769043, "global_step": 472828, "epoch": 5696} {"train_loss": -27.561185836791992, "global_step": 472829, "epoch": 5696} {"train_loss": -27.3176326751709, "global_step": 472830, "epoch": 5696} {"train_loss": -27.470178604125977, "global_step": 472831, "epoch": 5696} {"train_loss": -27.04621696472168, "global_step": 472832, "epoch": 5696} {"train_loss": -27.10675621032715, "global_step": 472833, "epoch": 5696} {"train_loss": -27.4086971282959, "global_step": 472834, "epoch": 5696} {"train_loss": -27.29762840270996, "global_step": 472835, "epoch": 5696} {"train_loss": -27.145526885986328, "global_step": 472836, "epoch": 5696} {"train_loss": -26.905195236206055, "global_step": 472837, "epoch": 5696} {"train_loss": -27.304004669189453, "global_step": 472838, "epoch": 5696} {"train_loss": -27.06583023071289, "global_step": 472839, "epoch": 5696} {"train_loss": -27.57675552368164, "global_step": 472840, "epoch": 5696} {"train_loss": -27.114688873291016, "global_step": 472841, "epoch": 5696} {"train_loss": -27.098546981811523, "global_step": 472842, "epoch": 5696} {"train_loss": -27.07830810546875, "global_step": 472843, "epoch": 5696} {"train_loss": -27.131006240844727, "global_step": 472844, "epoch": 5696} {"train_loss": -27.07118797302246, "global_step": 472845, "epoch": 5696} {"train_loss": -27.3142032623291, "global_step": 472846, "epoch": 5696} {"train_loss": -27.353864669799805, "global_step": 472847, "epoch": 5696} {"train_loss": -27.340225219726562, "global_step": 472848, "epoch": 5696} {"train_loss": -27.280359268188477, "global_step": 472849, "epoch": 5696} {"train_loss": -27.115960959928582, "global_step": 472850, "epoch": 5696, "val_loss": 6601026.5} {"train_loss": -26.01002311706543, "global_step": 472851, "epoch": 5697} {"train_loss": -25.355621337890625, "global_step": 472852, "epoch": 5697} {"train_loss": -26.856586456298828, "global_step": 472853, "epoch": 5697} {"train_loss": -25.881011962890625, "global_step": 472854, "epoch": 5697} {"train_loss": -27.05207633972168, "global_step": 472855, "epoch": 5697} {"train_loss": -26.243671417236328, "global_step": 472856, "epoch": 5697} {"train_loss": -26.230228424072266, "global_step": 472857, "epoch": 5697} {"train_loss": -26.14469337463379, "global_step": 472858, "epoch": 5697} {"train_loss": -26.44972038269043, "global_step": 472859, "epoch": 5697} {"train_loss": -26.735578536987305, "global_step": 472860, "epoch": 5697} {"train_loss": -26.61712074279785, "global_step": 472861, "epoch": 5697} {"train_loss": -26.5615177154541, "global_step": 472862, "epoch": 5697} {"train_loss": -26.609689712524414, "global_step": 472863, "epoch": 5697} {"train_loss": -26.28753662109375, "global_step": 472864, "epoch": 5697} {"train_loss": -26.761152267456055, "global_step": 472865, "epoch": 5697} {"train_loss": -26.404016494750977, "global_step": 472866, "epoch": 5697} {"train_loss": -26.23798179626465, "global_step": 472867, "epoch": 5697} {"train_loss": -27.005720138549805, "global_step": 472868, "epoch": 5697} {"train_loss": -26.704538345336914, "global_step": 472869, "epoch": 5697} {"train_loss": -26.67693519592285, "global_step": 472870, "epoch": 5697} {"train_loss": -26.6126651763916, "global_step": 472871, "epoch": 5697} {"train_loss": -26.767215728759766, "global_step": 472872, "epoch": 5697} {"train_loss": -26.729726791381836, "global_step": 472873, "epoch": 5697} {"train_loss": -26.76993751525879, "global_step": 472874, "epoch": 5697} {"train_loss": -26.954843521118164, "global_step": 472875, "epoch": 5697} {"train_loss": -27.126646041870117, "global_step": 472876, "epoch": 5697} {"train_loss": -27.214014053344727, "global_step": 472877, "epoch": 5697} {"train_loss": -26.7819766998291, "global_step": 472878, "epoch": 5697} {"train_loss": -27.0617618560791, "global_step": 472879, "epoch": 5697} {"train_loss": -26.879663467407227, "global_step": 472880, "epoch": 5697} {"train_loss": -27.09195899963379, "global_step": 472881, "epoch": 5697} {"train_loss": -27.1276912689209, "global_step": 472882, "epoch": 5697} {"train_loss": -26.756473541259766, "global_step": 472883, "epoch": 5697} {"train_loss": -27.175928115844727, "global_step": 472884, "epoch": 5697} {"train_loss": -27.301950454711914, "global_step": 472885, "epoch": 5697} {"train_loss": -27.212478637695312, "global_step": 472886, "epoch": 5697} {"train_loss": -26.9667911529541, "global_step": 472887, "epoch": 5697} {"train_loss": -27.107587814331055, "global_step": 472888, "epoch": 5697} {"train_loss": -27.185461044311523, "global_step": 472889, "epoch": 5697} {"train_loss": -26.700000762939453, "global_step": 472890, "epoch": 5697} {"train_loss": -27.3040771484375, "global_step": 472891, "epoch": 5697} {"train_loss": -27.617380142211914, "global_step": 472892, "epoch": 5697} {"train_loss": -27.22137451171875, "global_step": 472893, "epoch": 5697} {"train_loss": -26.903467178344727, "global_step": 472894, "epoch": 5697} {"train_loss": -26.85959243774414, "global_step": 472895, "epoch": 5697} {"train_loss": -27.42574119567871, "global_step": 472896, "epoch": 5697} {"train_loss": -26.883380889892578, "global_step": 472897, "epoch": 5697} {"train_loss": -27.397687911987305, "global_step": 472898, "epoch": 5697} {"train_loss": -27.39691734313965, "global_step": 472899, "epoch": 5697} {"train_loss": -27.235660552978516, "global_step": 472900, "epoch": 5697} {"train_loss": -27.1495418548584, "global_step": 472901, "epoch": 5697} {"train_loss": -27.113840103149414, "global_step": 472902, "epoch": 5697} {"train_loss": -26.992528915405273, "global_step": 472903, "epoch": 5697} {"train_loss": -26.985794067382812, "global_step": 472904, "epoch": 5697} {"train_loss": -26.6683406829834, "global_step": 472905, "epoch": 5697} {"train_loss": -27.386381149291992, "global_step": 472906, "epoch": 5697} {"train_loss": -27.245956420898438, "global_step": 472907, "epoch": 5697} {"train_loss": -27.205081939697266, "global_step": 472908, "epoch": 5697} {"train_loss": -27.281808853149414, "global_step": 472909, "epoch": 5697} {"train_loss": -27.524580001831055, "global_step": 472910, "epoch": 5697} {"train_loss": -27.363513946533203, "global_step": 472911, "epoch": 5697} {"train_loss": -26.828657150268555, "global_step": 472912, "epoch": 5697} {"train_loss": -27.411956787109375, "global_step": 472913, "epoch": 5697} {"train_loss": -27.454755783081055, "global_step": 472914, "epoch": 5697} {"train_loss": -27.491052627563477, "global_step": 472915, "epoch": 5697} {"train_loss": -27.308805465698242, "global_step": 472916, "epoch": 5697} {"train_loss": -27.342756271362305, "global_step": 472917, "epoch": 5697} {"train_loss": -27.000661849975586, "global_step": 472918, "epoch": 5697} {"train_loss": -27.202987670898438, "global_step": 472919, "epoch": 5697} {"train_loss": -27.445138931274414, "global_step": 472920, "epoch": 5697} {"train_loss": -27.343143463134766, "global_step": 472921, "epoch": 5697} {"train_loss": -27.484052658081055, "global_step": 472922, "epoch": 5697} {"train_loss": -27.41192054748535, "global_step": 472923, "epoch": 5697} {"train_loss": -27.2640323638916, "global_step": 472924, "epoch": 5697} {"train_loss": -27.414112091064453, "global_step": 472925, "epoch": 5697} {"train_loss": -27.62177848815918, "global_step": 472926, "epoch": 5697} {"train_loss": -27.331388473510742, "global_step": 472927, "epoch": 5697} {"train_loss": -27.68291664123535, "global_step": 472928, "epoch": 5697} {"train_loss": -27.81192970275879, "global_step": 472929, "epoch": 5697} {"train_loss": -27.219940185546875, "global_step": 472930, "epoch": 5697} {"train_loss": -27.245716094970703, "global_step": 472931, "epoch": 5697} {"train_loss": -27.298078536987305, "global_step": 472932, "epoch": 5697} {"train_loss": -26.9977482945086, "global_step": 472933, "epoch": 5697, "val_loss": 6652975.0} {"train_loss": -27.304157257080078, "global_step": 472934, "epoch": 5698} {"train_loss": -26.268573760986328, "global_step": 472935, "epoch": 5698} {"train_loss": -26.947799682617188, "global_step": 472936, "epoch": 5698} {"train_loss": -26.654006958007812, "global_step": 472937, "epoch": 5698} {"train_loss": -26.9132022857666, "global_step": 472938, "epoch": 5698} {"train_loss": -26.8079833984375, "global_step": 472939, "epoch": 5698} {"train_loss": -26.79646110534668, "global_step": 472940, "epoch": 5698} {"train_loss": -26.585126876831055, "global_step": 472941, "epoch": 5698} {"train_loss": -27.036548614501953, "global_step": 472942, "epoch": 5698} {"train_loss": -26.93250846862793, "global_step": 472943, "epoch": 5698} {"train_loss": -27.0844669342041, "global_step": 472944, "epoch": 5698} {"train_loss": -26.774396896362305, "global_step": 472945, "epoch": 5698} {"train_loss": -27.029193878173828, "global_step": 472946, "epoch": 5698} {"train_loss": -27.12849998474121, "global_step": 472947, "epoch": 5698} {"train_loss": -26.9149169921875, "global_step": 472948, "epoch": 5698} {"train_loss": -26.75856590270996, "global_step": 472949, "epoch": 5698} {"train_loss": -26.869781494140625, "global_step": 472950, "epoch": 5698} {"train_loss": -27.07278823852539, "global_step": 472951, "epoch": 5698} {"train_loss": -26.85918617248535, "global_step": 472952, "epoch": 5698} {"train_loss": -27.087406158447266, "global_step": 472953, "epoch": 5698} {"train_loss": -27.05376625061035, "global_step": 472954, "epoch": 5698} {"train_loss": -26.991174697875977, "global_step": 472955, "epoch": 5698} {"train_loss": -27.065723419189453, "global_step": 472956, "epoch": 5698} {"train_loss": -27.60440444946289, "global_step": 472957, "epoch": 5698} {"train_loss": -27.247297286987305, "global_step": 472958, "epoch": 5698} {"train_loss": -27.375030517578125, "global_step": 472959, "epoch": 5698} {"train_loss": -26.98103904724121, "global_step": 472960, "epoch": 5698} {"train_loss": -27.371301651000977, "global_step": 472961, "epoch": 5698} {"train_loss": -27.199277877807617, "global_step": 472962, "epoch": 5698} {"train_loss": -27.04587745666504, "global_step": 472963, "epoch": 5698} {"train_loss": -26.919357299804688, "global_step": 472964, "epoch": 5698} {"train_loss": -27.1837158203125, "global_step": 472965, "epoch": 5698} {"train_loss": -27.407535552978516, "global_step": 472966, "epoch": 5698} {"train_loss": -27.181669235229492, "global_step": 472967, "epoch": 5698} {"train_loss": -27.082050323486328, "global_step": 472968, "epoch": 5698} {"train_loss": -27.093408584594727, "global_step": 472969, "epoch": 5698} {"train_loss": -27.662424087524414, "global_step": 472970, "epoch": 5698} {"train_loss": -27.28461265563965, "global_step": 472971, "epoch": 5698} {"train_loss": -27.526952743530273, "global_step": 472972, "epoch": 5698} {"train_loss": -27.3328800201416, "global_step": 472973, "epoch": 5698} {"train_loss": -27.364171981811523, "global_step": 472974, "epoch": 5698} {"train_loss": -26.974750518798828, "global_step": 472975, "epoch": 5698} {"train_loss": -27.457605361938477, "global_step": 472976, "epoch": 5698} {"train_loss": -27.64023780822754, "global_step": 472977, "epoch": 5698} {"train_loss": -27.412683486938477, "global_step": 472978, "epoch": 5698} {"train_loss": -27.363325119018555, "global_step": 472979, "epoch": 5698} {"train_loss": -27.11067008972168, "global_step": 472980, "epoch": 5698} {"train_loss": -27.192670822143555, "global_step": 472981, "epoch": 5698} {"train_loss": -26.75494956970215, "global_step": 472982, "epoch": 5698} {"train_loss": -27.097644805908203, "global_step": 472983, "epoch": 5698} {"train_loss": -27.625782012939453, "global_step": 472984, "epoch": 5698} {"train_loss": -26.859060287475586, "global_step": 472985, "epoch": 5698} {"train_loss": -27.054346084594727, "global_step": 472986, "epoch": 5698} {"train_loss": -27.428647994995117, "global_step": 472987, "epoch": 5698} {"train_loss": -27.178546905517578, "global_step": 472988, "epoch": 5698} {"train_loss": -27.075693130493164, "global_step": 472989, "epoch": 5698} {"train_loss": -27.565576553344727, "global_step": 472990, "epoch": 5698} {"train_loss": -27.287214279174805, "global_step": 472991, "epoch": 5698} {"train_loss": -27.617517471313477, "global_step": 472992, "epoch": 5698} {"train_loss": -27.567041397094727, "global_step": 472993, "epoch": 5698} {"train_loss": -27.207372665405273, "global_step": 472994, "epoch": 5698} {"train_loss": -27.2021541595459, "global_step": 472995, "epoch": 5698} {"train_loss": -27.238235473632812, "global_step": 472996, "epoch": 5698} {"train_loss": -27.3039608001709, "global_step": 472997, "epoch": 5698} {"train_loss": -27.38567543029785, "global_step": 472998, "epoch": 5698} {"train_loss": -27.7083740234375, "global_step": 472999, "epoch": 5698} {"train_loss": -27.135740280151367, "global_step": 473000, "epoch": 5698} {"train_loss": -27.38580894470215, "global_step": 473001, "epoch": 5698} {"train_loss": -26.5533504486084, "global_step": 473002, "epoch": 5698} {"train_loss": -26.992298126220703, "global_step": 473003, "epoch": 5698} {"train_loss": -27.4195556640625, "global_step": 473004, "epoch": 5698} {"train_loss": -26.915342330932617, "global_step": 473005, "epoch": 5698} {"train_loss": -26.9615535736084, "global_step": 473006, "epoch": 5698} {"train_loss": -27.02685546875, "global_step": 473007, "epoch": 5698} {"train_loss": -26.724292755126953, "global_step": 473008, "epoch": 5698} {"train_loss": -26.3632755279541, "global_step": 473009, "epoch": 5698} {"train_loss": -26.819379806518555, "global_step": 473010, "epoch": 5698} {"train_loss": -27.1038875579834, "global_step": 473011, "epoch": 5698} {"train_loss": -26.564075469970703, "global_step": 473012, "epoch": 5698} {"train_loss": -27.041940689086914, "global_step": 473013, "epoch": 5698} {"train_loss": -27.15227699279785, "global_step": 473014, "epoch": 5698} {"train_loss": -27.042343139648438, "global_step": 473015, "epoch": 5698} {"train_loss": -27.10885169707149, "global_step": 473016, "epoch": 5698, "val_loss": 6571719.0} {"train_loss": -25.762414932250977, "global_step": 473017, "epoch": 5699} {"train_loss": -26.061513900756836, "global_step": 473018, "epoch": 5699} {"train_loss": -26.408689498901367, "global_step": 473019, "epoch": 5699} {"train_loss": -26.012042999267578, "global_step": 473020, "epoch": 5699} {"train_loss": -26.400724411010742, "global_step": 473021, "epoch": 5699} {"train_loss": -26.247343063354492, "global_step": 473022, "epoch": 5699} {"train_loss": -26.31550407409668, "global_step": 473023, "epoch": 5699} {"train_loss": -26.060195922851562, "global_step": 473024, "epoch": 5699} {"train_loss": -26.67352294921875, "global_step": 473025, "epoch": 5699} {"train_loss": -26.759851455688477, "global_step": 473026, "epoch": 5699} {"train_loss": -27.097599029541016, "global_step": 473027, "epoch": 5699} {"train_loss": -26.745010375976562, "global_step": 473028, "epoch": 5699} {"train_loss": -26.72823143005371, "global_step": 473029, "epoch": 5699} {"train_loss": -26.470407485961914, "global_step": 473030, "epoch": 5699} {"train_loss": -26.802448272705078, "global_step": 473031, "epoch": 5699} {"train_loss": -26.39149284362793, "global_step": 473032, "epoch": 5699} {"train_loss": -26.874359130859375, "global_step": 473033, "epoch": 5699} {"train_loss": -26.553058624267578, "global_step": 473034, "epoch": 5699} {"train_loss": -26.855545043945312, "global_step": 473035, "epoch": 5699} {"train_loss": -26.610925674438477, "global_step": 473036, "epoch": 5699} {"train_loss": -26.964710235595703, "global_step": 473037, "epoch": 5699} {"train_loss": -26.766279220581055, "global_step": 473038, "epoch": 5699} {"train_loss": -26.867694854736328, "global_step": 473039, "epoch": 5699} {"train_loss": -27.194021224975586, "global_step": 473040, "epoch": 5699} {"train_loss": -26.791345596313477, "global_step": 473041, "epoch": 5699} {"train_loss": -26.915943145751953, "global_step": 473042, "epoch": 5699} {"train_loss": -26.979650497436523, "global_step": 473043, "epoch": 5699} {"train_loss": -26.93133544921875, "global_step": 473044, "epoch": 5699} {"train_loss": -27.485736846923828, "global_step": 473045, "epoch": 5699} {"train_loss": -27.614713668823242, "global_step": 473046, "epoch": 5699} {"train_loss": -27.259674072265625, "global_step": 473047, "epoch": 5699} {"train_loss": -27.35662269592285, "global_step": 473048, "epoch": 5699} {"train_loss": -27.223068237304688, "global_step": 473049, "epoch": 5699} {"train_loss": -27.4819393157959, "global_step": 473050, "epoch": 5699} {"train_loss": -27.03449821472168, "global_step": 473051, "epoch": 5699} {"train_loss": -27.62420082092285, "global_step": 473052, "epoch": 5699} {"train_loss": -27.408910751342773, "global_step": 473053, "epoch": 5699} {"train_loss": -27.189855575561523, "global_step": 473054, "epoch": 5699} {"train_loss": -27.486801147460938, "global_step": 473055, "epoch": 5699} {"train_loss": -27.354047775268555, "global_step": 473056, "epoch": 5699} {"train_loss": -27.18219566345215, "global_step": 473057, "epoch": 5699} {"train_loss": -27.27581214904785, "global_step": 473058, "epoch": 5699} {"train_loss": -27.285688400268555, "global_step": 473059, "epoch": 5699} {"train_loss": -27.458967208862305, "global_step": 473060, "epoch": 5699} {"train_loss": -27.174833297729492, "global_step": 473061, "epoch": 5699} {"train_loss": -27.187170028686523, "global_step": 473062, "epoch": 5699} {"train_loss": -27.1966495513916, "global_step": 473063, "epoch": 5699} {"train_loss": -27.21955680847168, "global_step": 473064, "epoch": 5699} {"train_loss": -27.486536026000977, "global_step": 473065, "epoch": 5699} {"train_loss": -27.456298828125, "global_step": 473066, "epoch": 5699} {"train_loss": -27.67536735534668, "global_step": 473067, "epoch": 5699} {"train_loss": -27.60296630859375, "global_step": 473068, "epoch": 5699} {"train_loss": -27.32362937927246, "global_step": 473069, "epoch": 5699} {"train_loss": -27.43280601501465, "global_step": 473070, "epoch": 5699} {"train_loss": -27.088470458984375, "global_step": 473071, "epoch": 5699} {"train_loss": -27.074438095092773, "global_step": 473072, "epoch": 5699} {"train_loss": -26.7332763671875, "global_step": 473073, "epoch": 5699} {"train_loss": -26.289630889892578, "global_step": 473074, "epoch": 5699} {"train_loss": -26.16204261779785, "global_step": 473075, "epoch": 5699} {"train_loss": -26.96430015563965, "global_step": 473076, "epoch": 5699} {"train_loss": -26.850860595703125, "global_step": 473077, "epoch": 5699} {"train_loss": -26.476531982421875, "global_step": 473078, "epoch": 5699} {"train_loss": -27.207279205322266, "global_step": 473079, "epoch": 5699} {"train_loss": -26.63300132751465, "global_step": 473080, "epoch": 5699} {"train_loss": -26.655242919921875, "global_step": 473081, "epoch": 5699} {"train_loss": -25.881668090820312, "global_step": 473082, "epoch": 5699} {"train_loss": -25.590164184570312, "global_step": 473083, "epoch": 5699} {"train_loss": -23.370182037353516, "global_step": 473084, "epoch": 5699} {"train_loss": -24.924137115478516, "global_step": 473085, "epoch": 5699} {"train_loss": -26.271142959594727, "global_step": 473086, "epoch": 5699} {"train_loss": -25.298391342163086, "global_step": 473087, "epoch": 5699} {"train_loss": -25.755578994750977, "global_step": 473088, "epoch": 5699} {"train_loss": -26.323944091796875, "global_step": 473089, "epoch": 5699} {"train_loss": -26.171567916870117, "global_step": 473090, "epoch": 5699} {"train_loss": -26.406400680541992, "global_step": 473091, "epoch": 5699} {"train_loss": -25.9864444732666, "global_step": 473092, "epoch": 5699} {"train_loss": -26.478330612182617, "global_step": 473093, "epoch": 5699} {"train_loss": -26.04163932800293, "global_step": 473094, "epoch": 5699} {"train_loss": -26.14923667907715, "global_step": 473095, "epoch": 5699} {"train_loss": -26.149585723876953, "global_step": 473096, "epoch": 5699} {"train_loss": -25.992074966430664, "global_step": 473097, "epoch": 5699} {"train_loss": -26.42059898376465, "global_step": 473098, "epoch": 5699} {"train_loss": -26.703992590846784, "global_step": 473099, "epoch": 5699, "val_loss": 6536962.5} {"train_loss": -26.34124755859375, "global_step": 473100, "epoch": 5700} {"train_loss": -26.03106689453125, "global_step": 473101, "epoch": 5700} {"train_loss": -25.738794326782227, "global_step": 473102, "epoch": 5700} {"train_loss": -26.102155685424805, "global_step": 473103, "epoch": 5700} {"train_loss": -25.86777114868164, "global_step": 473104, "epoch": 5700} {"train_loss": -25.817636489868164, "global_step": 473105, "epoch": 5700} {"train_loss": -26.274988174438477, "global_step": 473106, "epoch": 5700} {"train_loss": -25.957763671875, "global_step": 473107, "epoch": 5700} {"train_loss": -26.441593170166016, "global_step": 473108, "epoch": 5700} {"train_loss": -26.085752487182617, "global_step": 473109, "epoch": 5700} {"train_loss": -26.396869659423828, "global_step": 473110, "epoch": 5700} {"train_loss": -26.57333755493164, "global_step": 473111, "epoch": 5700} {"train_loss": -26.255090713500977, "global_step": 473112, "epoch": 5700} {"train_loss": -26.949499130249023, "global_step": 473113, "epoch": 5700} {"train_loss": -26.6707763671875, "global_step": 473114, "epoch": 5700} {"train_loss": -26.393354415893555, "global_step": 473115, "epoch": 5700} {"train_loss": -26.502033233642578, "global_step": 473116, "epoch": 5700} {"train_loss": -26.873538970947266, "global_step": 473117, "epoch": 5700} {"train_loss": -26.873281478881836, "global_step": 473118, "epoch": 5700} {"train_loss": -26.648792266845703, "global_step": 473119, "epoch": 5700} {"train_loss": -26.911224365234375, "global_step": 473120, "epoch": 5700} {"train_loss": -27.1208438873291, "global_step": 473121, "epoch": 5700} {"train_loss": -26.743213653564453, "global_step": 473122, "epoch": 5700} {"train_loss": -26.675573348999023, "global_step": 473123, "epoch": 5700} {"train_loss": -26.702823638916016, "global_step": 473124, "epoch": 5700} {"train_loss": -26.99725341796875, "global_step": 473125, "epoch": 5700} {"train_loss": -27.045679092407227, "global_step": 473126, "epoch": 5700} {"train_loss": -26.876789093017578, "global_step": 473127, "epoch": 5700} {"train_loss": -27.0301456451416, "global_step": 473128, "epoch": 5700} {"train_loss": -27.317487716674805, "global_step": 473129, "epoch": 5700} {"train_loss": -27.184967041015625, "global_step": 473130, "epoch": 5700} {"train_loss": -27.2034969329834, "global_step": 473131, "epoch": 5700} {"train_loss": -27.05740737915039, "global_step": 473132, "epoch": 5700} {"train_loss": -27.078094482421875, "global_step": 473133, "epoch": 5700} {"train_loss": -27.335805892944336, "global_step": 473134, "epoch": 5700} {"train_loss": -27.3320369720459, "global_step": 473135, "epoch": 5700} {"train_loss": -27.136001586914062, "global_step": 473136, "epoch": 5700} {"train_loss": -27.218908309936523, "global_step": 473137, "epoch": 5700} {"train_loss": -27.2866153717041, "global_step": 473138, "epoch": 5700} {"train_loss": -27.303274154663086, "global_step": 473139, "epoch": 5700} {"train_loss": -27.52764892578125, "global_step": 473140, "epoch": 5700} {"train_loss": -27.421768188476562, "global_step": 473141, "epoch": 5700} {"train_loss": -27.318073272705078, "global_step": 473142, "epoch": 5700} {"train_loss": -27.237085342407227, "global_step": 473143, "epoch": 5700} {"train_loss": -27.376819610595703, "global_step": 473144, "epoch": 5700} {"train_loss": -27.228271484375, "global_step": 473145, "epoch": 5700} {"train_loss": -27.379743576049805, "global_step": 473146, "epoch": 5700} {"train_loss": -27.361398696899414, "global_step": 473147, "epoch": 5700} {"train_loss": -27.370580673217773, "global_step": 473148, "epoch": 5700} {"train_loss": -27.515186309814453, "global_step": 473149, "epoch": 5700} {"train_loss": -27.62104606628418, "global_step": 473150, "epoch": 5700} {"train_loss": -27.542890548706055, "global_step": 473151, "epoch": 5700} {"train_loss": -27.0533390045166, "global_step": 473152, "epoch": 5700} {"train_loss": -27.529632568359375, "global_step": 473153, "epoch": 5700} {"train_loss": -27.427534103393555, "global_step": 473154, "epoch": 5700} {"train_loss": -27.470081329345703, "global_step": 473155, "epoch": 5700} {"train_loss": -27.134366989135742, "global_step": 473156, "epoch": 5700} {"train_loss": -26.68671226501465, "global_step": 473157, "epoch": 5700} {"train_loss": -27.345813751220703, "global_step": 473158, "epoch": 5700} {"train_loss": -27.50446128845215, "global_step": 473159, "epoch": 5700} {"train_loss": -26.787267684936523, "global_step": 473160, "epoch": 5700} {"train_loss": -26.79690933227539, "global_step": 473161, "epoch": 5700} {"train_loss": -27.2755126953125, "global_step": 473162, "epoch": 5700} {"train_loss": -27.035724639892578, "global_step": 473163, "epoch": 5700} {"train_loss": -26.94097328186035, "global_step": 473164, "epoch": 5700} {"train_loss": -27.52829360961914, "global_step": 473165, "epoch": 5700} {"train_loss": -26.905548095703125, "global_step": 473166, "epoch": 5700} {"train_loss": -27.210418701171875, "global_step": 473167, "epoch": 5700} {"train_loss": -27.16493034362793, "global_step": 473168, "epoch": 5700} {"train_loss": -26.971027374267578, "global_step": 473169, "epoch": 5700} {"train_loss": -26.920141220092773, "global_step": 473170, "epoch": 5700} {"train_loss": -26.9491024017334, "global_step": 473171, "epoch": 5700} {"train_loss": -27.268285751342773, "global_step": 473172, "epoch": 5700} {"train_loss": -27.041345596313477, "global_step": 473173, "epoch": 5700} {"train_loss": -27.226409912109375, "global_step": 473174, "epoch": 5700} {"train_loss": -26.973642349243164, "global_step": 473175, "epoch": 5700} {"train_loss": -27.205820083618164, "global_step": 473176, "epoch": 5700} {"train_loss": -27.1569766998291, "global_step": 473177, "epoch": 5700} {"train_loss": -27.35621452331543, "global_step": 473178, "epoch": 5700} {"train_loss": -27.2164363861084, "global_step": 473179, "epoch": 5700} {"train_loss": -27.719745635986328, "global_step": 473180, "epoch": 5700} {"train_loss": -27.265186309814453, "global_step": 473181, "epoch": 5700} {"train_loss": -26.986245557486292, "global_step": 473182, "epoch": 5700, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6568882.0} {"train_loss": -26.866443634033203, "global_step": 473183, "epoch": 5701} {"train_loss": -26.908493041992188, "global_step": 473184, "epoch": 5701} {"train_loss": -26.909011840820312, "global_step": 473185, "epoch": 5701} {"train_loss": -27.065460205078125, "global_step": 473186, "epoch": 5701} {"train_loss": -27.220441818237305, "global_step": 473187, "epoch": 5701} {"train_loss": -26.970869064331055, "global_step": 473188, "epoch": 5701} {"train_loss": -27.072805404663086, "global_step": 473189, "epoch": 5701} {"train_loss": -27.0870304107666, "global_step": 473190, "epoch": 5701} {"train_loss": -26.52215576171875, "global_step": 473191, "epoch": 5701} {"train_loss": -27.226093292236328, "global_step": 473192, "epoch": 5701} {"train_loss": -27.717517852783203, "global_step": 473193, "epoch": 5701} {"train_loss": -27.303373336791992, "global_step": 473194, "epoch": 5701} {"train_loss": -27.245986938476562, "global_step": 473195, "epoch": 5701} {"train_loss": -27.356351852416992, "global_step": 473196, "epoch": 5701} {"train_loss": -27.187931060791016, "global_step": 473197, "epoch": 5701} {"train_loss": -27.37900733947754, "global_step": 473198, "epoch": 5701} {"train_loss": -27.40863037109375, "global_step": 473199, "epoch": 5701} {"train_loss": -27.475677490234375, "global_step": 473200, "epoch": 5701} {"train_loss": -27.300756454467773, "global_step": 473201, "epoch": 5701} {"train_loss": -27.209598541259766, "global_step": 473202, "epoch": 5701} {"train_loss": -27.319583892822266, "global_step": 473203, "epoch": 5701} {"train_loss": -27.087011337280273, "global_step": 473204, "epoch": 5701} {"train_loss": -27.218658447265625, "global_step": 473205, "epoch": 5701} {"train_loss": -27.2928466796875, "global_step": 473206, "epoch": 5701} {"train_loss": -27.295011520385742, "global_step": 473207, "epoch": 5701} {"train_loss": -27.317676544189453, "global_step": 473208, "epoch": 5701} {"train_loss": -27.411222457885742, "global_step": 473209, "epoch": 5701} {"train_loss": -27.120229721069336, "global_step": 473210, "epoch": 5701} {"train_loss": -27.56439208984375, "global_step": 473211, "epoch": 5701} {"train_loss": -27.135562896728516, "global_step": 473212, "epoch": 5701} {"train_loss": -27.150833129882812, "global_step": 473213, "epoch": 5701} {"train_loss": -27.25250816345215, "global_step": 473214, "epoch": 5701} {"train_loss": -27.433813095092773, "global_step": 473215, "epoch": 5701} {"train_loss": -27.409467697143555, "global_step": 473216, "epoch": 5701} {"train_loss": -27.44769859313965, "global_step": 473217, "epoch": 5701} {"train_loss": -27.291717529296875, "global_step": 473218, "epoch": 5701} {"train_loss": -27.516576766967773, "global_step": 473219, "epoch": 5701} {"train_loss": -27.443500518798828, "global_step": 473220, "epoch": 5701} {"train_loss": -27.542627334594727, "global_step": 473221, "epoch": 5701} {"train_loss": -27.158863067626953, "global_step": 473222, "epoch": 5701} {"train_loss": -27.301443099975586, "global_step": 473223, "epoch": 5701} {"train_loss": -27.25762939453125, "global_step": 473224, "epoch": 5701} {"train_loss": -27.24262046813965, "global_step": 473225, "epoch": 5701} {"train_loss": -27.409948348999023, "global_step": 473226, "epoch": 5701} {"train_loss": -26.989622116088867, "global_step": 473227, "epoch": 5701} {"train_loss": -27.426334381103516, "global_step": 473228, "epoch": 5701} {"train_loss": -27.120471954345703, "global_step": 473229, "epoch": 5701} {"train_loss": -27.094345092773438, "global_step": 473230, "epoch": 5701} {"train_loss": -27.563495635986328, "global_step": 473231, "epoch": 5701} {"train_loss": -27.379011154174805, "global_step": 473232, "epoch": 5701} {"train_loss": -27.44048500061035, "global_step": 473233, "epoch": 5701} {"train_loss": -27.47511863708496, "global_step": 473234, "epoch": 5701} {"train_loss": -27.157169342041016, "global_step": 473235, "epoch": 5701} {"train_loss": -27.6398868560791, "global_step": 473236, "epoch": 5701} {"train_loss": -27.45578384399414, "global_step": 473237, "epoch": 5701} {"train_loss": -27.03034019470215, "global_step": 473238, "epoch": 5701} {"train_loss": -26.55973243713379, "global_step": 473239, "epoch": 5701} {"train_loss": -26.592456817626953, "global_step": 473240, "epoch": 5701} {"train_loss": -25.855222702026367, "global_step": 473241, "epoch": 5701} {"train_loss": -26.42167091369629, "global_step": 473242, "epoch": 5701} {"train_loss": -26.76393699645996, "global_step": 473243, "epoch": 5701} {"train_loss": -26.816669464111328, "global_step": 473244, "epoch": 5701} {"train_loss": -26.6967716217041, "global_step": 473245, "epoch": 5701} {"train_loss": -26.3815975189209, "global_step": 473246, "epoch": 5701} {"train_loss": -26.354040145874023, "global_step": 473247, "epoch": 5701} {"train_loss": -26.377965927124023, "global_step": 473248, "epoch": 5701} {"train_loss": -26.1405029296875, "global_step": 473249, "epoch": 5701} {"train_loss": -27.043378829956055, "global_step": 473250, "epoch": 5701} {"train_loss": -26.052841186523438, "global_step": 473251, "epoch": 5701} {"train_loss": -26.973447799682617, "global_step": 473252, "epoch": 5701} {"train_loss": -27.016565322875977, "global_step": 473253, "epoch": 5701} {"train_loss": -26.805679321289062, "global_step": 473254, "epoch": 5701} {"train_loss": -26.930078506469727, "global_step": 473255, "epoch": 5701} {"train_loss": -27.00992202758789, "global_step": 473256, "epoch": 5701} {"train_loss": -26.762548446655273, "global_step": 473257, "epoch": 5701} {"train_loss": -26.905975341796875, "global_step": 473258, "epoch": 5701} {"train_loss": -27.291162490844727, "global_step": 473259, "epoch": 5701} {"train_loss": -26.71232032775879, "global_step": 473260, "epoch": 5701} {"train_loss": -26.9386043548584, "global_step": 473261, "epoch": 5701} {"train_loss": -26.84956169128418, "global_step": 473262, "epoch": 5701} {"train_loss": -26.845203399658203, "global_step": 473263, "epoch": 5701} {"train_loss": -26.8675594329834, "global_step": 473264, "epoch": 5701} {"train_loss": -27.081469616258, "global_step": 473265, "epoch": 5701, "val_loss": 6537141.0} {"train_loss": -26.012577056884766, "global_step": 473266, "epoch": 5702} {"train_loss": -26.210031509399414, "global_step": 473267, "epoch": 5702} {"train_loss": -26.567310333251953, "global_step": 473268, "epoch": 5702} {"train_loss": -26.303852081298828, "global_step": 473269, "epoch": 5702} {"train_loss": -26.436635971069336, "global_step": 473270, "epoch": 5702} {"train_loss": -26.248987197875977, "global_step": 473271, "epoch": 5702} {"train_loss": -26.59356689453125, "global_step": 473272, "epoch": 5702} {"train_loss": -26.913190841674805, "global_step": 473273, "epoch": 5702} {"train_loss": -26.59235954284668, "global_step": 473274, "epoch": 5702} {"train_loss": -26.64631462097168, "global_step": 473275, "epoch": 5702} {"train_loss": -26.73541259765625, "global_step": 473276, "epoch": 5702} {"train_loss": -26.858936309814453, "global_step": 473277, "epoch": 5702} {"train_loss": -26.477954864501953, "global_step": 473278, "epoch": 5702} {"train_loss": -26.847766876220703, "global_step": 473279, "epoch": 5702} {"train_loss": -26.721729278564453, "global_step": 473280, "epoch": 5702} {"train_loss": -26.8826961517334, "global_step": 473281, "epoch": 5702} {"train_loss": -26.79670524597168, "global_step": 473282, "epoch": 5702} {"train_loss": -26.9598388671875, "global_step": 473283, "epoch": 5702} {"train_loss": -26.741376876831055, "global_step": 473284, "epoch": 5702} {"train_loss": -26.6220703125, "global_step": 473285, "epoch": 5702} {"train_loss": -26.818622589111328, "global_step": 473286, "epoch": 5702} {"train_loss": -27.0323429107666, "global_step": 473287, "epoch": 5702} {"train_loss": -27.024282455444336, "global_step": 473288, "epoch": 5702} {"train_loss": -26.820417404174805, "global_step": 473289, "epoch": 5702} {"train_loss": -27.169036865234375, "global_step": 473290, "epoch": 5702} {"train_loss": -26.752859115600586, "global_step": 473291, "epoch": 5702} {"train_loss": -26.95356559753418, "global_step": 473292, "epoch": 5702} {"train_loss": -27.08526611328125, "global_step": 473293, "epoch": 5702} {"train_loss": -27.347753524780273, "global_step": 473294, "epoch": 5702} {"train_loss": -27.015588760375977, "global_step": 473295, "epoch": 5702} {"train_loss": -26.6884765625, "global_step": 473296, "epoch": 5702} {"train_loss": -27.079925537109375, "global_step": 473297, "epoch": 5702} {"train_loss": -27.449743270874023, "global_step": 473298, "epoch": 5702} {"train_loss": -27.2568302154541, "global_step": 473299, "epoch": 5702} {"train_loss": -26.918365478515625, "global_step": 473300, "epoch": 5702} {"train_loss": -27.04833984375, "global_step": 473301, "epoch": 5702} {"train_loss": -26.93696403503418, "global_step": 473302, "epoch": 5702} {"train_loss": -27.099027633666992, "global_step": 473303, "epoch": 5702} {"train_loss": -27.540903091430664, "global_step": 473304, "epoch": 5702} {"train_loss": -26.89923095703125, "global_step": 473305, "epoch": 5702} {"train_loss": -27.262380599975586, "global_step": 473306, "epoch": 5702} {"train_loss": -27.118896484375, "global_step": 473307, "epoch": 5702} {"train_loss": -27.11783218383789, "global_step": 473308, "epoch": 5702} {"train_loss": -27.24675941467285, "global_step": 473309, "epoch": 5702} {"train_loss": -27.382862091064453, "global_step": 473310, "epoch": 5702} {"train_loss": -27.036535263061523, "global_step": 473311, "epoch": 5702} {"train_loss": -27.449613571166992, "global_step": 473312, "epoch": 5702} {"train_loss": -26.86393165588379, "global_step": 473313, "epoch": 5702} {"train_loss": -27.38140296936035, "global_step": 473314, "epoch": 5702} {"train_loss": -27.16485023498535, "global_step": 473315, "epoch": 5702} {"train_loss": -27.39215087890625, "global_step": 473316, "epoch": 5702} {"train_loss": -27.1461238861084, "global_step": 473317, "epoch": 5702} {"train_loss": -27.566679000854492, "global_step": 473318, "epoch": 5702} {"train_loss": -27.027624130249023, "global_step": 473319, "epoch": 5702} {"train_loss": -27.14589500427246, "global_step": 473320, "epoch": 5702} {"train_loss": -27.12041664123535, "global_step": 473321, "epoch": 5702} {"train_loss": -27.31591796875, "global_step": 473322, "epoch": 5702} {"train_loss": -27.263452529907227, "global_step": 473323, "epoch": 5702} {"train_loss": -27.275842666625977, "global_step": 473324, "epoch": 5702} {"train_loss": -26.897932052612305, "global_step": 473325, "epoch": 5702} {"train_loss": -27.227319717407227, "global_step": 473326, "epoch": 5702} {"train_loss": -27.33489990234375, "global_step": 473327, "epoch": 5702} {"train_loss": -27.070981979370117, "global_step": 473328, "epoch": 5702} {"train_loss": -26.8570499420166, "global_step": 473329, "epoch": 5702} {"train_loss": -26.57744789123535, "global_step": 473330, "epoch": 5702} {"train_loss": -26.84743309020996, "global_step": 473331, "epoch": 5702} {"train_loss": -27.176000595092773, "global_step": 473332, "epoch": 5702} {"train_loss": -26.463043212890625, "global_step": 473333, "epoch": 5702} {"train_loss": -26.714920043945312, "global_step": 473334, "epoch": 5702} {"train_loss": -27.334508895874023, "global_step": 473335, "epoch": 5702} {"train_loss": -27.510831832885742, "global_step": 473336, "epoch": 5702} {"train_loss": -26.76533317565918, "global_step": 473337, "epoch": 5702} {"train_loss": -27.459150314331055, "global_step": 473338, "epoch": 5702} {"train_loss": -27.776792526245117, "global_step": 473339, "epoch": 5702} {"train_loss": -27.06068992614746, "global_step": 473340, "epoch": 5702} {"train_loss": -27.283557891845703, "global_step": 473341, "epoch": 5702} {"train_loss": -27.371368408203125, "global_step": 473342, "epoch": 5702} {"train_loss": -27.477909088134766, "global_step": 473343, "epoch": 5702} {"train_loss": -27.197376251220703, "global_step": 473344, "epoch": 5702} {"train_loss": -27.873767852783203, "global_step": 473345, "epoch": 5702} {"train_loss": -27.418354034423828, "global_step": 473346, "epoch": 5702} {"train_loss": -27.13385009765625, "global_step": 473347, "epoch": 5702} {"train_loss": -27.01296335243317, "global_step": 473348, "epoch": 5702, "val_loss": 6680589.5} {"train_loss": -26.84699821472168, "global_step": 473349, "epoch": 5703} {"train_loss": -26.83570671081543, "global_step": 473350, "epoch": 5703} {"train_loss": -26.9798526763916, "global_step": 473351, "epoch": 5703} {"train_loss": -27.10214614868164, "global_step": 473352, "epoch": 5703} {"train_loss": -27.032363891601562, "global_step": 473353, "epoch": 5703} {"train_loss": -26.754926681518555, "global_step": 473354, "epoch": 5703} {"train_loss": -27.06507682800293, "global_step": 473355, "epoch": 5703} {"train_loss": -27.287302017211914, "global_step": 473356, "epoch": 5703} {"train_loss": -27.122177124023438, "global_step": 473357, "epoch": 5703} {"train_loss": -27.006195068359375, "global_step": 473358, "epoch": 5703} {"train_loss": -27.466039657592773, "global_step": 473359, "epoch": 5703} {"train_loss": -26.766021728515625, "global_step": 473360, "epoch": 5703} {"train_loss": -27.42831802368164, "global_step": 473361, "epoch": 5703} {"train_loss": -27.052173614501953, "global_step": 473362, "epoch": 5703} {"train_loss": -27.306629180908203, "global_step": 473363, "epoch": 5703} {"train_loss": -27.053699493408203, "global_step": 473364, "epoch": 5703} {"train_loss": -27.417993545532227, "global_step": 473365, "epoch": 5703} {"train_loss": -27.455581665039062, "global_step": 473366, "epoch": 5703} {"train_loss": -27.41168212890625, "global_step": 473367, "epoch": 5703} {"train_loss": -27.530099868774414, "global_step": 473368, "epoch": 5703} {"train_loss": -27.505590438842773, "global_step": 473369, "epoch": 5703} {"train_loss": -27.624622344970703, "global_step": 473370, "epoch": 5703} {"train_loss": -27.241565704345703, "global_step": 473371, "epoch": 5703} {"train_loss": -27.5808162689209, "global_step": 473372, "epoch": 5703} {"train_loss": -27.484106063842773, "global_step": 473373, "epoch": 5703} {"train_loss": -27.640399932861328, "global_step": 473374, "epoch": 5703} {"train_loss": -27.24391746520996, "global_step": 473375, "epoch": 5703} {"train_loss": -27.240293502807617, "global_step": 473376, "epoch": 5703} {"train_loss": -27.439905166625977, "global_step": 473377, "epoch": 5703} {"train_loss": -27.155136108398438, "global_step": 473378, "epoch": 5703} {"train_loss": -27.299518585205078, "global_step": 473379, "epoch": 5703} {"train_loss": -27.046966552734375, "global_step": 473380, "epoch": 5703} {"train_loss": -27.064794540405273, "global_step": 473381, "epoch": 5703} {"train_loss": -27.140716552734375, "global_step": 473382, "epoch": 5703} {"train_loss": -26.835168838500977, "global_step": 473383, "epoch": 5703} {"train_loss": -26.849817276000977, "global_step": 473384, "epoch": 5703} {"train_loss": -26.96551513671875, "global_step": 473385, "epoch": 5703} {"train_loss": -27.144062042236328, "global_step": 473386, "epoch": 5703} {"train_loss": -27.150129318237305, "global_step": 473387, "epoch": 5703} {"train_loss": -26.99313735961914, "global_step": 473388, "epoch": 5703} {"train_loss": -26.942794799804688, "global_step": 473389, "epoch": 5703} {"train_loss": -27.558332443237305, "global_step": 473390, "epoch": 5703} {"train_loss": -26.892908096313477, "global_step": 473391, "epoch": 5703} {"train_loss": -26.772756576538086, "global_step": 473392, "epoch": 5703} {"train_loss": -27.201873779296875, "global_step": 473393, "epoch": 5703} {"train_loss": -26.718793869018555, "global_step": 473394, "epoch": 5703} {"train_loss": -26.6810245513916, "global_step": 473395, "epoch": 5703} {"train_loss": -27.13990592956543, "global_step": 473396, "epoch": 5703} {"train_loss": -26.9117431640625, "global_step": 473397, "epoch": 5703} {"train_loss": -27.203582763671875, "global_step": 473398, "epoch": 5703} {"train_loss": -26.878223419189453, "global_step": 473399, "epoch": 5703} {"train_loss": -27.095518112182617, "global_step": 473400, "epoch": 5703} {"train_loss": -26.9971981048584, "global_step": 473401, "epoch": 5703} {"train_loss": -26.9166259765625, "global_step": 473402, "epoch": 5703} {"train_loss": -26.954345703125, "global_step": 473403, "epoch": 5703} {"train_loss": -27.034101486206055, "global_step": 473404, "epoch": 5703} {"train_loss": -27.216705322265625, "global_step": 473405, "epoch": 5703} {"train_loss": -26.872228622436523, "global_step": 473406, "epoch": 5703} {"train_loss": -26.594263076782227, "global_step": 473407, "epoch": 5703} {"train_loss": -27.29072380065918, "global_step": 473408, "epoch": 5703} {"train_loss": -27.22995376586914, "global_step": 473409, "epoch": 5703} {"train_loss": -26.889480590820312, "global_step": 473410, "epoch": 5703} {"train_loss": -27.268096923828125, "global_step": 473411, "epoch": 5703} {"train_loss": -27.426679611206055, "global_step": 473412, "epoch": 5703} {"train_loss": -27.193866729736328, "global_step": 473413, "epoch": 5703} {"train_loss": -27.604169845581055, "global_step": 473414, "epoch": 5703} {"train_loss": -27.158605575561523, "global_step": 473415, "epoch": 5703} {"train_loss": -26.94581413269043, "global_step": 473416, "epoch": 5703} {"train_loss": -27.3217830657959, "global_step": 473417, "epoch": 5703} {"train_loss": -27.501523971557617, "global_step": 473418, "epoch": 5703} {"train_loss": -27.616453170776367, "global_step": 473419, "epoch": 5703} {"train_loss": -27.175317764282227, "global_step": 473420, "epoch": 5703} {"train_loss": -27.354902267456055, "global_step": 473421, "epoch": 5703} {"train_loss": -26.923355102539062, "global_step": 473422, "epoch": 5703} {"train_loss": -27.210840225219727, "global_step": 473423, "epoch": 5703} {"train_loss": -27.26597023010254, "global_step": 473424, "epoch": 5703} {"train_loss": -27.266122817993164, "global_step": 473425, "epoch": 5703} {"train_loss": -27.02402687072754, "global_step": 473426, "epoch": 5703} {"train_loss": -27.277374267578125, "global_step": 473427, "epoch": 5703} {"train_loss": -27.370813369750977, "global_step": 473428, "epoch": 5703} {"train_loss": -27.33941078186035, "global_step": 473429, "epoch": 5703} {"train_loss": -27.248794555664062, "global_step": 473430, "epoch": 5703} {"train_loss": -27.168427846517908, "global_step": 473431, "epoch": 5703, "val_loss": 6708005.0} {"train_loss": -26.577661514282227, "global_step": 473432, "epoch": 5704} {"train_loss": -26.490808486938477, "global_step": 473433, "epoch": 5704} {"train_loss": -26.604825973510742, "global_step": 473434, "epoch": 5704} {"train_loss": -27.0296630859375, "global_step": 473435, "epoch": 5704} {"train_loss": -26.4213924407959, "global_step": 473436, "epoch": 5704} {"train_loss": -27.503997802734375, "global_step": 473437, "epoch": 5704} {"train_loss": -27.133756637573242, "global_step": 473438, "epoch": 5704} {"train_loss": -27.296289443969727, "global_step": 473439, "epoch": 5704} {"train_loss": -27.446521759033203, "global_step": 473440, "epoch": 5704} {"train_loss": -26.949140548706055, "global_step": 473441, "epoch": 5704} {"train_loss": -27.44635581970215, "global_step": 473442, "epoch": 5704} {"train_loss": -27.24344825744629, "global_step": 473443, "epoch": 5704} {"train_loss": -27.050214767456055, "global_step": 473444, "epoch": 5704} {"train_loss": -27.111896514892578, "global_step": 473445, "epoch": 5704} {"train_loss": -27.07056999206543, "global_step": 473446, "epoch": 5704} {"train_loss": -26.99543571472168, "global_step": 473447, "epoch": 5704} {"train_loss": -27.362497329711914, "global_step": 473448, "epoch": 5704} {"train_loss": -27.58283042907715, "global_step": 473449, "epoch": 5704} {"train_loss": -27.204313278198242, "global_step": 473450, "epoch": 5704} {"train_loss": -27.27174186706543, "global_step": 473451, "epoch": 5704} {"train_loss": -27.559326171875, "global_step": 473452, "epoch": 5704} {"train_loss": -27.037500381469727, "global_step": 473453, "epoch": 5704} {"train_loss": -26.88759422302246, "global_step": 473454, "epoch": 5704} {"train_loss": -27.263050079345703, "global_step": 473455, "epoch": 5704} {"train_loss": -27.064289093017578, "global_step": 473456, "epoch": 5704} {"train_loss": -27.282489776611328, "global_step": 473457, "epoch": 5704} {"train_loss": -26.906530380249023, "global_step": 473458, "epoch": 5704} {"train_loss": -27.308889389038086, "global_step": 473459, "epoch": 5704} {"train_loss": -27.18621826171875, "global_step": 473460, "epoch": 5704} {"train_loss": -26.86054039001465, "global_step": 473461, "epoch": 5704} {"train_loss": -27.298694610595703, "global_step": 473462, "epoch": 5704} {"train_loss": -27.486371994018555, "global_step": 473463, "epoch": 5704} {"train_loss": -26.81586265563965, "global_step": 473464, "epoch": 5704} {"train_loss": -26.976032257080078, "global_step": 473465, "epoch": 5704} {"train_loss": -27.184906005859375, "global_step": 473466, "epoch": 5704} {"train_loss": -27.144458770751953, "global_step": 473467, "epoch": 5704} {"train_loss": -27.353351593017578, "global_step": 473468, "epoch": 5704} {"train_loss": -27.124509811401367, "global_step": 473469, "epoch": 5704} {"train_loss": -27.151325225830078, "global_step": 473470, "epoch": 5704} {"train_loss": -27.296911239624023, "global_step": 473471, "epoch": 5704} {"train_loss": -27.038679122924805, "global_step": 473472, "epoch": 5704} {"train_loss": -27.03962516784668, "global_step": 473473, "epoch": 5704} {"train_loss": -27.10615348815918, "global_step": 473474, "epoch": 5704} {"train_loss": -27.298974990844727, "global_step": 473475, "epoch": 5704} {"train_loss": -26.914533615112305, "global_step": 473476, "epoch": 5704} {"train_loss": -27.259918212890625, "global_step": 473477, "epoch": 5704} {"train_loss": -27.248971939086914, "global_step": 473478, "epoch": 5704} {"train_loss": -27.2221622467041, "global_step": 473479, "epoch": 5704} {"train_loss": -26.870447158813477, "global_step": 473480, "epoch": 5704} {"train_loss": -27.118244171142578, "global_step": 473481, "epoch": 5704} {"train_loss": -27.210132598876953, "global_step": 473482, "epoch": 5704} {"train_loss": -26.93218994140625, "global_step": 473483, "epoch": 5704} {"train_loss": -27.187780380249023, "global_step": 473484, "epoch": 5704} {"train_loss": -27.15952491760254, "global_step": 473485, "epoch": 5704} {"train_loss": -26.957040786743164, "global_step": 473486, "epoch": 5704} {"train_loss": -26.768817901611328, "global_step": 473487, "epoch": 5704} {"train_loss": -27.46234703063965, "global_step": 473488, "epoch": 5704} {"train_loss": -27.010351181030273, "global_step": 473489, "epoch": 5704} {"train_loss": -27.383655548095703, "global_step": 473490, "epoch": 5704} {"train_loss": -27.400720596313477, "global_step": 473491, "epoch": 5704} {"train_loss": -27.336151123046875, "global_step": 473492, "epoch": 5704} {"train_loss": -27.6027774810791, "global_step": 473493, "epoch": 5704} {"train_loss": -27.071805953979492, "global_step": 473494, "epoch": 5704} {"train_loss": -27.47886085510254, "global_step": 473495, "epoch": 5704} {"train_loss": -27.158628463745117, "global_step": 473496, "epoch": 5704} {"train_loss": -26.90015983581543, "global_step": 473497, "epoch": 5704} {"train_loss": -26.979150772094727, "global_step": 473498, "epoch": 5704} {"train_loss": -27.498809814453125, "global_step": 473499, "epoch": 5704} {"train_loss": -27.209875106811523, "global_step": 473500, "epoch": 5704} {"train_loss": -27.484134674072266, "global_step": 473501, "epoch": 5704} {"train_loss": -27.2277889251709, "global_step": 473502, "epoch": 5704} {"train_loss": -27.443517684936523, "global_step": 473503, "epoch": 5704} {"train_loss": -27.058319091796875, "global_step": 473504, "epoch": 5704} {"train_loss": -27.506261825561523, "global_step": 473505, "epoch": 5704} {"train_loss": -27.433130264282227, "global_step": 473506, "epoch": 5704} {"train_loss": -27.26885986328125, "global_step": 473507, "epoch": 5704} {"train_loss": -26.843412399291992, "global_step": 473508, "epoch": 5704} {"train_loss": -27.266569137573242, "global_step": 473509, "epoch": 5704} {"train_loss": -27.583471298217773, "global_step": 473510, "epoch": 5704} {"train_loss": -27.405838012695312, "global_step": 473511, "epoch": 5704} {"train_loss": -27.23255729675293, "global_step": 473512, "epoch": 5704} {"train_loss": -27.122516632080078, "global_step": 473513, "epoch": 5704} {"train_loss": -27.160843630871142, "global_step": 473514, "epoch": 5704, "val_loss": 6735981.0} {"train_loss": -27.220701217651367, "global_step": 473515, "epoch": 5705} {"train_loss": -27.414960861206055, "global_step": 473516, "epoch": 5705} {"train_loss": -27.1217098236084, "global_step": 473517, "epoch": 5705} {"train_loss": -27.0030517578125, "global_step": 473518, "epoch": 5705} {"train_loss": -26.73687744140625, "global_step": 473519, "epoch": 5705} {"train_loss": -26.235071182250977, "global_step": 473520, "epoch": 5705} {"train_loss": -26.276586532592773, "global_step": 473521, "epoch": 5705} {"train_loss": -26.444589614868164, "global_step": 473522, "epoch": 5705} {"train_loss": -26.691162109375, "global_step": 473523, "epoch": 5705} {"train_loss": -26.85251235961914, "global_step": 473524, "epoch": 5705} {"train_loss": -26.439666748046875, "global_step": 473525, "epoch": 5705} {"train_loss": -26.9273681640625, "global_step": 473526, "epoch": 5705} {"train_loss": -26.76698112487793, "global_step": 473527, "epoch": 5705} {"train_loss": -26.50211524963379, "global_step": 473528, "epoch": 5705} {"train_loss": -27.098358154296875, "global_step": 473529, "epoch": 5705} {"train_loss": -26.779346466064453, "global_step": 473530, "epoch": 5705} {"train_loss": -27.387100219726562, "global_step": 473531, "epoch": 5705} {"train_loss": -26.560470581054688, "global_step": 473532, "epoch": 5705} {"train_loss": -27.438024520874023, "global_step": 473533, "epoch": 5705} {"train_loss": -27.044422149658203, "global_step": 473534, "epoch": 5705} {"train_loss": -27.254384994506836, "global_step": 473535, "epoch": 5705} {"train_loss": -27.238584518432617, "global_step": 473536, "epoch": 5705} {"train_loss": -26.880542755126953, "global_step": 473537, "epoch": 5705} {"train_loss": -27.242345809936523, "global_step": 473538, "epoch": 5705} {"train_loss": -27.220373153686523, "global_step": 473539, "epoch": 5705} {"train_loss": -27.201223373413086, "global_step": 473540, "epoch": 5705} {"train_loss": -27.09821128845215, "global_step": 473541, "epoch": 5705} {"train_loss": -27.072782516479492, "global_step": 473542, "epoch": 5705} {"train_loss": -27.030561447143555, "global_step": 473543, "epoch": 5705} {"train_loss": -26.9882755279541, "global_step": 473544, "epoch": 5705} {"train_loss": -27.484821319580078, "global_step": 473545, "epoch": 5705} {"train_loss": -26.86065673828125, "global_step": 473546, "epoch": 5705} {"train_loss": -26.900482177734375, "global_step": 473547, "epoch": 5705} {"train_loss": -26.835987091064453, "global_step": 473548, "epoch": 5705} {"train_loss": -27.310575485229492, "global_step": 473549, "epoch": 5705} {"train_loss": -27.409515380859375, "global_step": 473550, "epoch": 5705} {"train_loss": -27.14796257019043, "global_step": 473551, "epoch": 5705} {"train_loss": -27.371068954467773, "global_step": 473552, "epoch": 5705} {"train_loss": -27.376617431640625, "global_step": 473553, "epoch": 5705} {"train_loss": -27.4384765625, "global_step": 473554, "epoch": 5705} {"train_loss": -27.480667114257812, "global_step": 473555, "epoch": 5705} {"train_loss": -26.967239379882812, "global_step": 473556, "epoch": 5705} {"train_loss": -27.126867294311523, "global_step": 473557, "epoch": 5705} {"train_loss": -27.37116813659668, "global_step": 473558, "epoch": 5705} {"train_loss": -27.311389923095703, "global_step": 473559, "epoch": 5705} {"train_loss": -27.675323486328125, "global_step": 473560, "epoch": 5705} {"train_loss": -27.160816192626953, "global_step": 473561, "epoch": 5705} {"train_loss": -27.615589141845703, "global_step": 473562, "epoch": 5705} {"train_loss": -27.890844345092773, "global_step": 473563, "epoch": 5705} {"train_loss": -27.525671005249023, "global_step": 473564, "epoch": 5705} {"train_loss": -27.637155532836914, "global_step": 473565, "epoch": 5705} {"train_loss": -27.480010986328125, "global_step": 473566, "epoch": 5705} {"train_loss": -27.6086368560791, "global_step": 473567, "epoch": 5705} {"train_loss": -27.158689498901367, "global_step": 473568, "epoch": 5705} {"train_loss": -27.018320083618164, "global_step": 473569, "epoch": 5705} {"train_loss": -27.408166885375977, "global_step": 473570, "epoch": 5705} {"train_loss": -27.179346084594727, "global_step": 473571, "epoch": 5705} {"train_loss": -26.554889678955078, "global_step": 473572, "epoch": 5705} {"train_loss": -26.61319923400879, "global_step": 473573, "epoch": 5705} {"train_loss": -27.110458374023438, "global_step": 473574, "epoch": 5705} {"train_loss": -26.98041343688965, "global_step": 473575, "epoch": 5705} {"train_loss": -26.991613388061523, "global_step": 473576, "epoch": 5705} {"train_loss": -27.46466064453125, "global_step": 473577, "epoch": 5705} {"train_loss": -27.167285919189453, "global_step": 473578, "epoch": 5705} {"train_loss": -27.362836837768555, "global_step": 473579, "epoch": 5705} {"train_loss": -26.996572494506836, "global_step": 473580, "epoch": 5705} {"train_loss": -27.121292114257812, "global_step": 473581, "epoch": 5705} {"train_loss": -27.047224044799805, "global_step": 473582, "epoch": 5705} {"train_loss": -27.0787296295166, "global_step": 473583, "epoch": 5705} {"train_loss": -27.024633407592773, "global_step": 473584, "epoch": 5705} {"train_loss": -27.124597549438477, "global_step": 473585, "epoch": 5705} {"train_loss": -27.20794105529785, "global_step": 473586, "epoch": 5705} {"train_loss": -27.628498077392578, "global_step": 473587, "epoch": 5705} {"train_loss": -27.090795516967773, "global_step": 473588, "epoch": 5705} {"train_loss": -27.10235595703125, "global_step": 473589, "epoch": 5705} {"train_loss": -26.944807052612305, "global_step": 473590, "epoch": 5705} {"train_loss": -27.240503311157227, "global_step": 473591, "epoch": 5705} {"train_loss": -27.003812789916992, "global_step": 473592, "epoch": 5705} {"train_loss": -27.27814292907715, "global_step": 473593, "epoch": 5705} {"train_loss": -27.73005485534668, "global_step": 473594, "epoch": 5705} {"train_loss": -27.23093032836914, "global_step": 473595, "epoch": 5705} {"train_loss": -27.291410446166992, "global_step": 473596, "epoch": 5705} {"train_loss": -27.143401065504694, "global_step": 473597, "epoch": 5705, "val_loss": 6915068.0} {"train_loss": -26.86866569519043, "global_step": 473598, "epoch": 5706} {"train_loss": -26.9484806060791, "global_step": 473599, "epoch": 5706} {"train_loss": -26.700366973876953, "global_step": 473600, "epoch": 5706} {"train_loss": -26.51410484313965, "global_step": 473601, "epoch": 5706} {"train_loss": -27.030933380126953, "global_step": 473602, "epoch": 5706} {"train_loss": -26.985105514526367, "global_step": 473603, "epoch": 5706} {"train_loss": -26.703510284423828, "global_step": 473604, "epoch": 5706} {"train_loss": -26.69855308532715, "global_step": 473605, "epoch": 5706} {"train_loss": -27.208215713500977, "global_step": 473606, "epoch": 5706} {"train_loss": -27.451696395874023, "global_step": 473607, "epoch": 5706} {"train_loss": -26.895339965820312, "global_step": 473608, "epoch": 5706} {"train_loss": -27.05196189880371, "global_step": 473609, "epoch": 5706} {"train_loss": -27.224456787109375, "global_step": 473610, "epoch": 5706} {"train_loss": -27.088647842407227, "global_step": 473611, "epoch": 5706} {"train_loss": -27.16047477722168, "global_step": 473612, "epoch": 5706} {"train_loss": -27.01517105102539, "global_step": 473613, "epoch": 5706} {"train_loss": -27.145709991455078, "global_step": 473614, "epoch": 5706} {"train_loss": -26.945255279541016, "global_step": 473615, "epoch": 5706} {"train_loss": -26.992422103881836, "global_step": 473616, "epoch": 5706} {"train_loss": -27.170202255249023, "global_step": 473617, "epoch": 5706} {"train_loss": -27.08536720275879, "global_step": 473618, "epoch": 5706} {"train_loss": -27.527368545532227, "global_step": 473619, "epoch": 5706} {"train_loss": -27.119693756103516, "global_step": 473620, "epoch": 5706} {"train_loss": -27.1668758392334, "global_step": 473621, "epoch": 5706} {"train_loss": -27.022695541381836, "global_step": 473622, "epoch": 5706} {"train_loss": -27.01836585998535, "global_step": 473623, "epoch": 5706} {"train_loss": -27.331491470336914, "global_step": 473624, "epoch": 5706} {"train_loss": -27.33819580078125, "global_step": 473625, "epoch": 5706} {"train_loss": -27.39885902404785, "global_step": 473626, "epoch": 5706} {"train_loss": -27.10150146484375, "global_step": 473627, "epoch": 5706} {"train_loss": -27.27895164489746, "global_step": 473628, "epoch": 5706} {"train_loss": -27.146148681640625, "global_step": 473629, "epoch": 5706} {"train_loss": -26.76955223083496, "global_step": 473630, "epoch": 5706} {"train_loss": -27.0737361907959, "global_step": 473631, "epoch": 5706} {"train_loss": -27.25750160217285, "global_step": 473632, "epoch": 5706} {"train_loss": -27.361753463745117, "global_step": 473633, "epoch": 5706} {"train_loss": -27.3264217376709, "global_step": 473634, "epoch": 5706} {"train_loss": -27.420459747314453, "global_step": 473635, "epoch": 5706} {"train_loss": -27.002426147460938, "global_step": 473636, "epoch": 5706} {"train_loss": -27.18644142150879, "global_step": 473637, "epoch": 5706} {"train_loss": -27.08790397644043, "global_step": 473638, "epoch": 5706} {"train_loss": -27.242048263549805, "global_step": 473639, "epoch": 5706} {"train_loss": -27.175016403198242, "global_step": 473640, "epoch": 5706} {"train_loss": -27.7716121673584, "global_step": 473641, "epoch": 5706} {"train_loss": -27.218027114868164, "global_step": 473642, "epoch": 5706} {"train_loss": -27.35481834411621, "global_step": 473643, "epoch": 5706} {"train_loss": -27.075353622436523, "global_step": 473644, "epoch": 5706} {"train_loss": -27.18929100036621, "global_step": 473645, "epoch": 5706} {"train_loss": -27.516691207885742, "global_step": 473646, "epoch": 5706} {"train_loss": -27.24629783630371, "global_step": 473647, "epoch": 5706} {"train_loss": -27.308338165283203, "global_step": 473648, "epoch": 5706} {"train_loss": -27.14340591430664, "global_step": 473649, "epoch": 5706} {"train_loss": -27.555805206298828, "global_step": 473650, "epoch": 5706} {"train_loss": -27.324005126953125, "global_step": 473651, "epoch": 5706} {"train_loss": -27.5334415435791, "global_step": 473652, "epoch": 5706} {"train_loss": -27.09307289123535, "global_step": 473653, "epoch": 5706} {"train_loss": -27.351194381713867, "global_step": 473654, "epoch": 5706} {"train_loss": -27.022357940673828, "global_step": 473655, "epoch": 5706} {"train_loss": -27.2960147857666, "global_step": 473656, "epoch": 5706} {"train_loss": -26.77052116394043, "global_step": 473657, "epoch": 5706} {"train_loss": -27.089929580688477, "global_step": 473658, "epoch": 5706} {"train_loss": -27.5216121673584, "global_step": 473659, "epoch": 5706} {"train_loss": -27.22712516784668, "global_step": 473660, "epoch": 5706} {"train_loss": -27.041568756103516, "global_step": 473661, "epoch": 5706} {"train_loss": -26.800329208374023, "global_step": 473662, "epoch": 5706} {"train_loss": -27.577383041381836, "global_step": 473663, "epoch": 5706} {"train_loss": -27.116504669189453, "global_step": 473664, "epoch": 5706} {"train_loss": -26.87383460998535, "global_step": 473665, "epoch": 5706} {"train_loss": -27.1071720123291, "global_step": 473666, "epoch": 5706} {"train_loss": -26.994028091430664, "global_step": 473667, "epoch": 5706} {"train_loss": -27.387842178344727, "global_step": 473668, "epoch": 5706} {"train_loss": -27.189929962158203, "global_step": 473669, "epoch": 5706} {"train_loss": -27.104215621948242, "global_step": 473670, "epoch": 5706} {"train_loss": -27.105688095092773, "global_step": 473671, "epoch": 5706} {"train_loss": -27.299779891967773, "global_step": 473672, "epoch": 5706} {"train_loss": -27.0922794342041, "global_step": 473673, "epoch": 5706} {"train_loss": -27.30893898010254, "global_step": 473674, "epoch": 5706} {"train_loss": -27.0213565826416, "global_step": 473675, "epoch": 5706} {"train_loss": -26.883014678955078, "global_step": 473676, "epoch": 5706} {"train_loss": -27.158960342407227, "global_step": 473677, "epoch": 5706} {"train_loss": -26.882165908813477, "global_step": 473678, "epoch": 5706} {"train_loss": -26.871042251586914, "global_step": 473679, "epoch": 5706} {"train_loss": -27.134999930140484, "global_step": 473680, "epoch": 5706, "val_loss": 6823544.0} {"train_loss": -26.779882431030273, "global_step": 473681, "epoch": 5707} {"train_loss": -26.443164825439453, "global_step": 473682, "epoch": 5707} {"train_loss": -26.81336784362793, "global_step": 473683, "epoch": 5707} {"train_loss": -26.425323486328125, "global_step": 473684, "epoch": 5707} {"train_loss": -26.696081161499023, "global_step": 473685, "epoch": 5707} {"train_loss": -26.90578269958496, "global_step": 473686, "epoch": 5707} {"train_loss": -26.632617950439453, "global_step": 473687, "epoch": 5707} {"train_loss": -26.581222534179688, "global_step": 473688, "epoch": 5707} {"train_loss": -26.845279693603516, "global_step": 473689, "epoch": 5707} {"train_loss": -26.6357421875, "global_step": 473690, "epoch": 5707} {"train_loss": -27.361494064331055, "global_step": 473691, "epoch": 5707} {"train_loss": -27.136829376220703, "global_step": 473692, "epoch": 5707} {"train_loss": -26.761825561523438, "global_step": 473693, "epoch": 5707} {"train_loss": -27.257938385009766, "global_step": 473694, "epoch": 5707} {"train_loss": -27.20134925842285, "global_step": 473695, "epoch": 5707} {"train_loss": -26.863447189331055, "global_step": 473696, "epoch": 5707} {"train_loss": -26.9945011138916, "global_step": 473697, "epoch": 5707} {"train_loss": -26.83078956604004, "global_step": 473698, "epoch": 5707} {"train_loss": -27.025787353515625, "global_step": 473699, "epoch": 5707} {"train_loss": -27.0211124420166, "global_step": 473700, "epoch": 5707} {"train_loss": -27.146255493164062, "global_step": 473701, "epoch": 5707} {"train_loss": -26.96109962463379, "global_step": 473702, "epoch": 5707} {"train_loss": -27.175928115844727, "global_step": 473703, "epoch": 5707} {"train_loss": -26.7349796295166, "global_step": 473704, "epoch": 5707} {"train_loss": -26.73431968688965, "global_step": 473705, "epoch": 5707} {"train_loss": -27.621835708618164, "global_step": 473706, "epoch": 5707} {"train_loss": -27.00042724609375, "global_step": 473707, "epoch": 5707} {"train_loss": -27.041732788085938, "global_step": 473708, "epoch": 5707} {"train_loss": -27.18349266052246, "global_step": 473709, "epoch": 5707} {"train_loss": -27.144140243530273, "global_step": 473710, "epoch": 5707} {"train_loss": -27.293054580688477, "global_step": 473711, "epoch": 5707} {"train_loss": -27.109777450561523, "global_step": 473712, "epoch": 5707} {"train_loss": -27.305261611938477, "global_step": 473713, "epoch": 5707} {"train_loss": -27.081281661987305, "global_step": 473714, "epoch": 5707} {"train_loss": -27.021604537963867, "global_step": 473715, "epoch": 5707} {"train_loss": -27.383377075195312, "global_step": 473716, "epoch": 5707} {"train_loss": -27.305423736572266, "global_step": 473717, "epoch": 5707} {"train_loss": -27.51019287109375, "global_step": 473718, "epoch": 5707} {"train_loss": -27.271575927734375, "global_step": 473719, "epoch": 5707} {"train_loss": -27.255273818969727, "global_step": 473720, "epoch": 5707} {"train_loss": -27.343402862548828, "global_step": 473721, "epoch": 5707} {"train_loss": -27.246305465698242, "global_step": 473722, "epoch": 5707} {"train_loss": -27.306507110595703, "global_step": 473723, "epoch": 5707} {"train_loss": -27.44245719909668, "global_step": 473724, "epoch": 5707} {"train_loss": -27.557409286499023, "global_step": 473725, "epoch": 5707} {"train_loss": -27.270618438720703, "global_step": 473726, "epoch": 5707} {"train_loss": -27.092960357666016, "global_step": 473727, "epoch": 5707} {"train_loss": -26.812088012695312, "global_step": 473728, "epoch": 5707} {"train_loss": -26.758010864257812, "global_step": 473729, "epoch": 5707} {"train_loss": -26.170063018798828, "global_step": 473730, "epoch": 5707} {"train_loss": -27.078826904296875, "global_step": 473731, "epoch": 5707} {"train_loss": -27.25630760192871, "global_step": 473732, "epoch": 5707} {"train_loss": -27.470197677612305, "global_step": 473733, "epoch": 5707} {"train_loss": -26.89764404296875, "global_step": 473734, "epoch": 5707} {"train_loss": -27.26888084411621, "global_step": 473735, "epoch": 5707} {"train_loss": -27.167800903320312, "global_step": 473736, "epoch": 5707} {"train_loss": -27.352069854736328, "global_step": 473737, "epoch": 5707} {"train_loss": -27.26565933227539, "global_step": 473738, "epoch": 5707} {"train_loss": -27.33888816833496, "global_step": 473739, "epoch": 5707} {"train_loss": -27.292163848876953, "global_step": 473740, "epoch": 5707} {"train_loss": -27.20061683654785, "global_step": 473741, "epoch": 5707} {"train_loss": -27.07185173034668, "global_step": 473742, "epoch": 5707} {"train_loss": -27.152362823486328, "global_step": 473743, "epoch": 5707} {"train_loss": -27.365402221679688, "global_step": 473744, "epoch": 5707} {"train_loss": -27.1275577545166, "global_step": 473745, "epoch": 5707} {"train_loss": -27.4387264251709, "global_step": 473746, "epoch": 5707} {"train_loss": -27.26584815979004, "global_step": 473747, "epoch": 5707} {"train_loss": -27.019855499267578, "global_step": 473748, "epoch": 5707} {"train_loss": -26.956220626831055, "global_step": 473749, "epoch": 5707} {"train_loss": -27.375272750854492, "global_step": 473750, "epoch": 5707} {"train_loss": -27.146596908569336, "global_step": 473751, "epoch": 5707} {"train_loss": -27.08851432800293, "global_step": 473752, "epoch": 5707} {"train_loss": -26.90189552307129, "global_step": 473753, "epoch": 5707} {"train_loss": -27.14208984375, "global_step": 473754, "epoch": 5707} {"train_loss": -27.563989639282227, "global_step": 473755, "epoch": 5707} {"train_loss": -27.101409912109375, "global_step": 473756, "epoch": 5707} {"train_loss": -26.992645263671875, "global_step": 473757, "epoch": 5707} {"train_loss": -27.214468002319336, "global_step": 473758, "epoch": 5707} {"train_loss": -27.3622989654541, "global_step": 473759, "epoch": 5707} {"train_loss": -27.292577743530273, "global_step": 473760, "epoch": 5707} {"train_loss": -27.252721786499023, "global_step": 473761, "epoch": 5707} {"train_loss": -27.046472549438477, "global_step": 473762, "epoch": 5707} {"train_loss": -27.09562673913427, "global_step": 473763, "epoch": 5707, "val_loss": 6874457.0} {"train_loss": -26.80329704284668, "global_step": 473764, "epoch": 5708} {"train_loss": -26.644184112548828, "global_step": 473765, "epoch": 5708} {"train_loss": -27.62261962890625, "global_step": 473766, "epoch": 5708} {"train_loss": -26.7767391204834, "global_step": 473767, "epoch": 5708} {"train_loss": -27.13692283630371, "global_step": 473768, "epoch": 5708} {"train_loss": -26.91871452331543, "global_step": 473769, "epoch": 5708} {"train_loss": -26.8708553314209, "global_step": 473770, "epoch": 5708} {"train_loss": -27.095661163330078, "global_step": 473771, "epoch": 5708} {"train_loss": -26.700714111328125, "global_step": 473772, "epoch": 5708} {"train_loss": -27.2175235748291, "global_step": 473773, "epoch": 5708} {"train_loss": -27.107954025268555, "global_step": 473774, "epoch": 5708} {"train_loss": -26.85211753845215, "global_step": 473775, "epoch": 5708} {"train_loss": -26.9124755859375, "global_step": 473776, "epoch": 5708} {"train_loss": -27.285276412963867, "global_step": 473777, "epoch": 5708} {"train_loss": -26.941699981689453, "global_step": 473778, "epoch": 5708} {"train_loss": -26.90532875061035, "global_step": 473779, "epoch": 5708} {"train_loss": -26.874378204345703, "global_step": 473780, "epoch": 5708} {"train_loss": -26.88929557800293, "global_step": 473781, "epoch": 5708} {"train_loss": -27.25166893005371, "global_step": 473782, "epoch": 5708} {"train_loss": -27.136581420898438, "global_step": 473783, "epoch": 5708} {"train_loss": -27.182209014892578, "global_step": 473784, "epoch": 5708} {"train_loss": -27.000091552734375, "global_step": 473785, "epoch": 5708} {"train_loss": -26.967939376831055, "global_step": 473786, "epoch": 5708} {"train_loss": -27.416593551635742, "global_step": 473787, "epoch": 5708} {"train_loss": -27.299407958984375, "global_step": 473788, "epoch": 5708} {"train_loss": -27.848134994506836, "global_step": 473789, "epoch": 5708} {"train_loss": -27.1937313079834, "global_step": 473790, "epoch": 5708} {"train_loss": -26.998762130737305, "global_step": 473791, "epoch": 5708} {"train_loss": -27.2626953125, "global_step": 473792, "epoch": 5708} {"train_loss": -27.11457633972168, "global_step": 473793, "epoch": 5708} {"train_loss": -27.188583374023438, "global_step": 473794, "epoch": 5708} {"train_loss": -27.38861656188965, "global_step": 473795, "epoch": 5708} {"train_loss": -27.37009048461914, "global_step": 473796, "epoch": 5708} {"train_loss": -27.269140243530273, "global_step": 473797, "epoch": 5708} {"train_loss": -27.2386417388916, "global_step": 473798, "epoch": 5708} {"train_loss": -26.816160202026367, "global_step": 473799, "epoch": 5708} {"train_loss": -26.6234188079834, "global_step": 473800, "epoch": 5708} {"train_loss": -27.068317413330078, "global_step": 473801, "epoch": 5708} {"train_loss": -27.418933868408203, "global_step": 473802, "epoch": 5708} {"train_loss": -27.076889038085938, "global_step": 473803, "epoch": 5708} {"train_loss": -27.0192928314209, "global_step": 473804, "epoch": 5708} {"train_loss": -27.537189483642578, "global_step": 473805, "epoch": 5708} {"train_loss": -27.19114112854004, "global_step": 473806, "epoch": 5708} {"train_loss": -27.220808029174805, "global_step": 473807, "epoch": 5708} {"train_loss": -27.18414878845215, "global_step": 473808, "epoch": 5708} {"train_loss": -27.32940673828125, "global_step": 473809, "epoch": 5708} {"train_loss": -27.521743774414062, "global_step": 473810, "epoch": 5708} {"train_loss": -27.302814483642578, "global_step": 473811, "epoch": 5708} {"train_loss": -27.113615036010742, "global_step": 473812, "epoch": 5708} {"train_loss": -27.044910430908203, "global_step": 473813, "epoch": 5708} {"train_loss": -27.164533615112305, "global_step": 473814, "epoch": 5708} {"train_loss": -27.34580421447754, "global_step": 473815, "epoch": 5708} {"train_loss": -27.598358154296875, "global_step": 473816, "epoch": 5708} {"train_loss": -27.249073028564453, "global_step": 473817, "epoch": 5708} {"train_loss": -27.268468856811523, "global_step": 473818, "epoch": 5708} {"train_loss": -27.053701400756836, "global_step": 473819, "epoch": 5708} {"train_loss": -27.27506446838379, "global_step": 473820, "epoch": 5708} {"train_loss": -27.19388771057129, "global_step": 473821, "epoch": 5708} {"train_loss": -27.17581558227539, "global_step": 473822, "epoch": 5708} {"train_loss": -27.400531768798828, "global_step": 473823, "epoch": 5708} {"train_loss": -27.219018936157227, "global_step": 473824, "epoch": 5708} {"train_loss": -27.436664581298828, "global_step": 473825, "epoch": 5708} {"train_loss": -27.003406524658203, "global_step": 473826, "epoch": 5708} {"train_loss": -26.058856964111328, "global_step": 473827, "epoch": 5708} {"train_loss": -26.18381118774414, "global_step": 473828, "epoch": 5708} {"train_loss": -26.69504737854004, "global_step": 473829, "epoch": 5708} {"train_loss": -26.54960060119629, "global_step": 473830, "epoch": 5708} {"train_loss": -26.90683937072754, "global_step": 473831, "epoch": 5708} {"train_loss": -27.260181427001953, "global_step": 473832, "epoch": 5708} {"train_loss": -26.367263793945312, "global_step": 473833, "epoch": 5708} {"train_loss": -26.732053756713867, "global_step": 473834, "epoch": 5708} {"train_loss": -27.255874633789062, "global_step": 473835, "epoch": 5708} {"train_loss": -26.720626831054688, "global_step": 473836, "epoch": 5708} {"train_loss": -26.74704933166504, "global_step": 473837, "epoch": 5708} {"train_loss": -27.296655654907227, "global_step": 473838, "epoch": 5708} {"train_loss": -26.589033126831055, "global_step": 473839, "epoch": 5708} {"train_loss": -26.49257469177246, "global_step": 473840, "epoch": 5708} {"train_loss": -26.28961753845215, "global_step": 473841, "epoch": 5708} {"train_loss": -26.988210678100586, "global_step": 473842, "epoch": 5708} {"train_loss": -26.97715187072754, "global_step": 473843, "epoch": 5708} {"train_loss": -26.887344360351562, "global_step": 473844, "epoch": 5708} {"train_loss": -27.22858238220215, "global_step": 473845, "epoch": 5708} {"train_loss": -27.048643479864282, "global_step": 473846, "epoch": 5708, "val_loss": 6795717.0} {"train_loss": -26.808069229125977, "global_step": 473847, "epoch": 5709} {"train_loss": -26.806365966796875, "global_step": 473848, "epoch": 5709} {"train_loss": -26.72731590270996, "global_step": 473849, "epoch": 5709} {"train_loss": -26.59503173828125, "global_step": 473850, "epoch": 5709} {"train_loss": -26.720632553100586, "global_step": 473851, "epoch": 5709} {"train_loss": -27.088376998901367, "global_step": 473852, "epoch": 5709} {"train_loss": -26.911361694335938, "global_step": 473853, "epoch": 5709} {"train_loss": -26.79664421081543, "global_step": 473854, "epoch": 5709} {"train_loss": -26.879980087280273, "global_step": 473855, "epoch": 5709} {"train_loss": -27.224185943603516, "global_step": 473856, "epoch": 5709} {"train_loss": -27.04530143737793, "global_step": 473857, "epoch": 5709} {"train_loss": -26.8748722076416, "global_step": 473858, "epoch": 5709} {"train_loss": -27.110910415649414, "global_step": 473859, "epoch": 5709} {"train_loss": -27.380237579345703, "global_step": 473860, "epoch": 5709} {"train_loss": -27.384353637695312, "global_step": 473861, "epoch": 5709} {"train_loss": -26.919458389282227, "global_step": 473862, "epoch": 5709} {"train_loss": -27.25007438659668, "global_step": 473863, "epoch": 5709} {"train_loss": -27.19097900390625, "global_step": 473864, "epoch": 5709} {"train_loss": -27.629138946533203, "global_step": 473865, "epoch": 5709} {"train_loss": -26.98268699645996, "global_step": 473866, "epoch": 5709} {"train_loss": -27.130407333374023, "global_step": 473867, "epoch": 5709} {"train_loss": -26.86475944519043, "global_step": 473868, "epoch": 5709} {"train_loss": -26.7005558013916, "global_step": 473869, "epoch": 5709} {"train_loss": -27.197607040405273, "global_step": 473870, "epoch": 5709} {"train_loss": -27.317401885986328, "global_step": 473871, "epoch": 5709} {"train_loss": -27.15838623046875, "global_step": 473872, "epoch": 5709} {"train_loss": -27.47821044921875, "global_step": 473873, "epoch": 5709} {"train_loss": -27.26539421081543, "global_step": 473874, "epoch": 5709} {"train_loss": -27.10395622253418, "global_step": 473875, "epoch": 5709} {"train_loss": -27.246408462524414, "global_step": 473876, "epoch": 5709} {"train_loss": -27.385290145874023, "global_step": 473877, "epoch": 5709} {"train_loss": -26.883071899414062, "global_step": 473878, "epoch": 5709} {"train_loss": -26.819889068603516, "global_step": 473879, "epoch": 5709} {"train_loss": -27.191686630249023, "global_step": 473880, "epoch": 5709} {"train_loss": -27.241979598999023, "global_step": 473881, "epoch": 5709} {"train_loss": -27.255054473876953, "global_step": 473882, "epoch": 5709} {"train_loss": -27.023468017578125, "global_step": 473883, "epoch": 5709} {"train_loss": -27.239398956298828, "global_step": 473884, "epoch": 5709} {"train_loss": -27.094329833984375, "global_step": 473885, "epoch": 5709} {"train_loss": -27.175745010375977, "global_step": 473886, "epoch": 5709} {"train_loss": -27.150190353393555, "global_step": 473887, "epoch": 5709} {"train_loss": -27.69428825378418, "global_step": 473888, "epoch": 5709} {"train_loss": -27.23041343688965, "global_step": 473889, "epoch": 5709} {"train_loss": -27.394699096679688, "global_step": 473890, "epoch": 5709} {"train_loss": -27.219999313354492, "global_step": 473891, "epoch": 5709} {"train_loss": -27.403730392456055, "global_step": 473892, "epoch": 5709} {"train_loss": -27.139554977416992, "global_step": 473893, "epoch": 5709} {"train_loss": -27.137983322143555, "global_step": 473894, "epoch": 5709} {"train_loss": -27.4542293548584, "global_step": 473895, "epoch": 5709} {"train_loss": -27.097248077392578, "global_step": 473896, "epoch": 5709} {"train_loss": -27.5112361907959, "global_step": 473897, "epoch": 5709} {"train_loss": -27.67376708984375, "global_step": 473898, "epoch": 5709} {"train_loss": -27.29730224609375, "global_step": 473899, "epoch": 5709} {"train_loss": -27.58603286743164, "global_step": 473900, "epoch": 5709} {"train_loss": -27.410802841186523, "global_step": 473901, "epoch": 5709} {"train_loss": -27.482290267944336, "global_step": 473902, "epoch": 5709} {"train_loss": -27.479923248291016, "global_step": 473903, "epoch": 5709} {"train_loss": -27.287433624267578, "global_step": 473904, "epoch": 5709} {"train_loss": -27.38639259338379, "global_step": 473905, "epoch": 5709} {"train_loss": -27.397192001342773, "global_step": 473906, "epoch": 5709} {"train_loss": -27.016324996948242, "global_step": 473907, "epoch": 5709} {"train_loss": -27.802539825439453, "global_step": 473908, "epoch": 5709} {"train_loss": -26.548538208007812, "global_step": 473909, "epoch": 5709} {"train_loss": -27.30437660217285, "global_step": 473910, "epoch": 5709} {"train_loss": -27.190631866455078, "global_step": 473911, "epoch": 5709} {"train_loss": -27.16073989868164, "global_step": 473912, "epoch": 5709} {"train_loss": -27.182565689086914, "global_step": 473913, "epoch": 5709} {"train_loss": -26.488813400268555, "global_step": 473914, "epoch": 5709} {"train_loss": -26.78187370300293, "global_step": 473915, "epoch": 5709} {"train_loss": -26.624221801757812, "global_step": 473916, "epoch": 5709} {"train_loss": -27.391218185424805, "global_step": 473917, "epoch": 5709} {"train_loss": -26.97761344909668, "global_step": 473918, "epoch": 5709} {"train_loss": -26.9119930267334, "global_step": 473919, "epoch": 5709} {"train_loss": -26.955591201782227, "global_step": 473920, "epoch": 5709} {"train_loss": -27.119421005249023, "global_step": 473921, "epoch": 5709} {"train_loss": -26.762170791625977, "global_step": 473922, "epoch": 5709} {"train_loss": -26.648340225219727, "global_step": 473923, "epoch": 5709} {"train_loss": -27.066064834594727, "global_step": 473924, "epoch": 5709} {"train_loss": -27.140928268432617, "global_step": 473925, "epoch": 5709} {"train_loss": -26.414941787719727, "global_step": 473926, "epoch": 5709} {"train_loss": -26.37485694885254, "global_step": 473927, "epoch": 5709} {"train_loss": -26.191442489624023, "global_step": 473928, "epoch": 5709} {"train_loss": -27.090778327849975, "global_step": 473929, "epoch": 5709, "val_loss": 6886955.0} {"train_loss": -26.679609298706055, "global_step": 473930, "epoch": 5710} {"train_loss": -25.881961822509766, "global_step": 473931, "epoch": 5710} {"train_loss": -25.819721221923828, "global_step": 473932, "epoch": 5710} {"train_loss": -26.533390045166016, "global_step": 473933, "epoch": 5710} {"train_loss": -26.329421997070312, "global_step": 473934, "epoch": 5710} {"train_loss": -26.59950828552246, "global_step": 473935, "epoch": 5710} {"train_loss": -26.453702926635742, "global_step": 473936, "epoch": 5710} {"train_loss": -26.195276260375977, "global_step": 473937, "epoch": 5710} {"train_loss": -26.695180892944336, "global_step": 473938, "epoch": 5710} {"train_loss": -26.641454696655273, "global_step": 473939, "epoch": 5710} {"train_loss": -27.004724502563477, "global_step": 473940, "epoch": 5710} {"train_loss": -26.845428466796875, "global_step": 473941, "epoch": 5710} {"train_loss": -26.852014541625977, "global_step": 473942, "epoch": 5710} {"train_loss": -26.753192901611328, "global_step": 473943, "epoch": 5710} {"train_loss": -26.723356246948242, "global_step": 473944, "epoch": 5710} {"train_loss": -26.78985023498535, "global_step": 473945, "epoch": 5710} {"train_loss": -27.06184959411621, "global_step": 473946, "epoch": 5710} {"train_loss": -26.7912540435791, "global_step": 473947, "epoch": 5710} {"train_loss": -26.643207550048828, "global_step": 473948, "epoch": 5710} {"train_loss": -26.412931442260742, "global_step": 473949, "epoch": 5710} {"train_loss": -27.229257583618164, "global_step": 473950, "epoch": 5710} {"train_loss": -26.681787490844727, "global_step": 473951, "epoch": 5710} {"train_loss": -26.67984390258789, "global_step": 473952, "epoch": 5710} {"train_loss": -26.876514434814453, "global_step": 473953, "epoch": 5710} {"train_loss": -26.781497955322266, "global_step": 473954, "epoch": 5710} {"train_loss": -26.932950973510742, "global_step": 473955, "epoch": 5710} {"train_loss": -26.919519424438477, "global_step": 473956, "epoch": 5710} {"train_loss": -27.021137237548828, "global_step": 473957, "epoch": 5710} {"train_loss": -27.13263511657715, "global_step": 473958, "epoch": 5710} {"train_loss": -27.050107955932617, "global_step": 473959, "epoch": 5710} {"train_loss": -26.828754425048828, "global_step": 473960, "epoch": 5710} {"train_loss": -26.712705612182617, "global_step": 473961, "epoch": 5710} {"train_loss": -26.99367332458496, "global_step": 473962, "epoch": 5710} {"train_loss": -27.375654220581055, "global_step": 473963, "epoch": 5710} {"train_loss": -26.96917724609375, "global_step": 473964, "epoch": 5710} {"train_loss": -27.19472312927246, "global_step": 473965, "epoch": 5710} {"train_loss": -27.400243759155273, "global_step": 473966, "epoch": 5710} {"train_loss": -27.240636825561523, "global_step": 473967, "epoch": 5710} {"train_loss": -27.153472900390625, "global_step": 473968, "epoch": 5710} {"train_loss": -27.49614906311035, "global_step": 473969, "epoch": 5710} {"train_loss": -27.18462562561035, "global_step": 473970, "epoch": 5710} {"train_loss": -27.4428653717041, "global_step": 473971, "epoch": 5710} {"train_loss": -27.2734317779541, "global_step": 473972, "epoch": 5710} {"train_loss": -27.251981735229492, "global_step": 473973, "epoch": 5710} {"train_loss": -27.265390396118164, "global_step": 473974, "epoch": 5710} {"train_loss": -27.42525291442871, "global_step": 473975, "epoch": 5710} {"train_loss": -27.30824851989746, "global_step": 473976, "epoch": 5710} {"train_loss": -27.329593658447266, "global_step": 473977, "epoch": 5710} {"train_loss": -27.3157958984375, "global_step": 473978, "epoch": 5710} {"train_loss": -27.074377059936523, "global_step": 473979, "epoch": 5710} {"train_loss": -27.1995906829834, "global_step": 473980, "epoch": 5710} {"train_loss": -27.471548080444336, "global_step": 473981, "epoch": 5710} {"train_loss": -27.119043350219727, "global_step": 473982, "epoch": 5710} {"train_loss": -27.238910675048828, "global_step": 473983, "epoch": 5710} {"train_loss": -27.28761100769043, "global_step": 473984, "epoch": 5710} {"train_loss": -27.431167602539062, "global_step": 473985, "epoch": 5710} {"train_loss": -27.484298706054688, "global_step": 473986, "epoch": 5710} {"train_loss": -27.447736740112305, "global_step": 473987, "epoch": 5710} {"train_loss": -26.930395126342773, "global_step": 473988, "epoch": 5710} {"train_loss": -27.61641502380371, "global_step": 473989, "epoch": 5710} {"train_loss": -27.3173770904541, "global_step": 473990, "epoch": 5710} {"train_loss": -27.055837631225586, "global_step": 473991, "epoch": 5710} {"train_loss": -27.68910026550293, "global_step": 473992, "epoch": 5710} {"train_loss": -27.46177101135254, "global_step": 473993, "epoch": 5710} {"train_loss": -27.010730743408203, "global_step": 473994, "epoch": 5710} {"train_loss": -27.191049575805664, "global_step": 473995, "epoch": 5710} {"train_loss": -27.27057456970215, "global_step": 473996, "epoch": 5710} {"train_loss": -27.254119873046875, "global_step": 473997, "epoch": 5710} {"train_loss": -27.222442626953125, "global_step": 473998, "epoch": 5710} {"train_loss": -27.289045333862305, "global_step": 473999, "epoch": 5710} {"train_loss": -27.334980010986328, "global_step": 474000, "epoch": 5710} {"train_loss": -27.071887969970703, "global_step": 474001, "epoch": 5710} {"train_loss": -27.335824966430664, "global_step": 474002, "epoch": 5710} {"train_loss": -27.24617576599121, "global_step": 474003, "epoch": 5710} {"train_loss": -27.421905517578125, "global_step": 474004, "epoch": 5710} {"train_loss": -27.3773136138916, "global_step": 474005, "epoch": 5710} {"train_loss": -27.108251571655273, "global_step": 474006, "epoch": 5710} {"train_loss": -27.180612564086914, "global_step": 474007, "epoch": 5710} {"train_loss": -26.987939834594727, "global_step": 474008, "epoch": 5710} {"train_loss": -27.4467716217041, "global_step": 474009, "epoch": 5710} {"train_loss": -27.3199405670166, "global_step": 474010, "epoch": 5710} {"train_loss": -27.36008071899414, "global_step": 474011, "epoch": 5710} {"train_loss": -27.0512523191521, "global_step": 474012, "epoch": 5710, "val_loss": 6926238.0} {"train_loss": -25.94902992248535, "global_step": 474013, "epoch": 5711} {"train_loss": -26.01093101501465, "global_step": 474014, "epoch": 5711} {"train_loss": -26.66460609436035, "global_step": 474015, "epoch": 5711} {"train_loss": -25.818008422851562, "global_step": 474016, "epoch": 5711} {"train_loss": -26.12061882019043, "global_step": 474017, "epoch": 5711} {"train_loss": -26.085330963134766, "global_step": 474018, "epoch": 5711} {"train_loss": -26.023162841796875, "global_step": 474019, "epoch": 5711} {"train_loss": -26.560529708862305, "global_step": 474020, "epoch": 5711} {"train_loss": -26.27882194519043, "global_step": 474021, "epoch": 5711} {"train_loss": -26.55411720275879, "global_step": 474022, "epoch": 5711} {"train_loss": -25.64619255065918, "global_step": 474023, "epoch": 5711} {"train_loss": -26.76297950744629, "global_step": 474024, "epoch": 5711} {"train_loss": -26.482446670532227, "global_step": 474025, "epoch": 5711} {"train_loss": -26.467620849609375, "global_step": 474026, "epoch": 5711} {"train_loss": -26.422565460205078, "global_step": 474027, "epoch": 5711} {"train_loss": -26.896686553955078, "global_step": 474028, "epoch": 5711} {"train_loss": -26.416248321533203, "global_step": 474029, "epoch": 5711} {"train_loss": -26.879077911376953, "global_step": 474030, "epoch": 5711} {"train_loss": -26.317630767822266, "global_step": 474031, "epoch": 5711} {"train_loss": -26.9953670501709, "global_step": 474032, "epoch": 5711} {"train_loss": -26.912656784057617, "global_step": 474033, "epoch": 5711} {"train_loss": -27.082080841064453, "global_step": 474034, "epoch": 5711} {"train_loss": -26.687829971313477, "global_step": 474035, "epoch": 5711} {"train_loss": -26.865026473999023, "global_step": 474036, "epoch": 5711} {"train_loss": -26.988056182861328, "global_step": 474037, "epoch": 5711} {"train_loss": -26.718170166015625, "global_step": 474038, "epoch": 5711} {"train_loss": -27.229658126831055, "global_step": 474039, "epoch": 5711} {"train_loss": -26.978479385375977, "global_step": 474040, "epoch": 5711} {"train_loss": -26.810382843017578, "global_step": 474041, "epoch": 5711} {"train_loss": -27.021570205688477, "global_step": 474042, "epoch": 5711} {"train_loss": -26.981069564819336, "global_step": 474043, "epoch": 5711} {"train_loss": -27.21442985534668, "global_step": 474044, "epoch": 5711} {"train_loss": -26.93295669555664, "global_step": 474045, "epoch": 5711} {"train_loss": -27.316837310791016, "global_step": 474046, "epoch": 5711} {"train_loss": -26.94906997680664, "global_step": 474047, "epoch": 5711} {"train_loss": -26.903553009033203, "global_step": 474048, "epoch": 5711} {"train_loss": -26.98335075378418, "global_step": 474049, "epoch": 5711} {"train_loss": -27.554367065429688, "global_step": 474050, "epoch": 5711} {"train_loss": -27.313989639282227, "global_step": 474051, "epoch": 5711} {"train_loss": -27.09912109375, "global_step": 474052, "epoch": 5711} {"train_loss": -27.11825942993164, "global_step": 474053, "epoch": 5711} {"train_loss": -27.42689323425293, "global_step": 474054, "epoch": 5711} {"train_loss": -27.315967559814453, "global_step": 474055, "epoch": 5711} {"train_loss": -27.351566314697266, "global_step": 474056, "epoch": 5711} {"train_loss": -27.446889877319336, "global_step": 474057, "epoch": 5711} {"train_loss": -27.27788734436035, "global_step": 474058, "epoch": 5711} {"train_loss": -27.183225631713867, "global_step": 474059, "epoch": 5711} {"train_loss": -27.38496208190918, "global_step": 474060, "epoch": 5711} {"train_loss": -27.458816528320312, "global_step": 474061, "epoch": 5711} {"train_loss": -27.526260375976562, "global_step": 474062, "epoch": 5711} {"train_loss": -27.154693603515625, "global_step": 474063, "epoch": 5711} {"train_loss": -27.5870361328125, "global_step": 474064, "epoch": 5711} {"train_loss": -27.657501220703125, "global_step": 474065, "epoch": 5711} {"train_loss": -27.276941299438477, "global_step": 474066, "epoch": 5711} {"train_loss": -27.221759796142578, "global_step": 474067, "epoch": 5711} {"train_loss": -27.465391159057617, "global_step": 474068, "epoch": 5711} {"train_loss": -27.134140014648438, "global_step": 474069, "epoch": 5711} {"train_loss": -27.34186363220215, "global_step": 474070, "epoch": 5711} {"train_loss": -27.340795516967773, "global_step": 474071, "epoch": 5711} {"train_loss": -26.5904483795166, "global_step": 474072, "epoch": 5711} {"train_loss": -27.363874435424805, "global_step": 474073, "epoch": 5711} {"train_loss": -27.233718872070312, "global_step": 474074, "epoch": 5711} {"train_loss": -27.44500732421875, "global_step": 474075, "epoch": 5711} {"train_loss": -27.22175407409668, "global_step": 474076, "epoch": 5711} {"train_loss": -27.549732208251953, "global_step": 474077, "epoch": 5711} {"train_loss": -27.412031173706055, "global_step": 474078, "epoch": 5711} {"train_loss": -27.520532608032227, "global_step": 474079, "epoch": 5711} {"train_loss": -26.94464111328125, "global_step": 474080, "epoch": 5711} {"train_loss": -27.193552017211914, "global_step": 474081, "epoch": 5711} {"train_loss": -27.320755004882812, "global_step": 474082, "epoch": 5711} {"train_loss": -27.383005142211914, "global_step": 474083, "epoch": 5711} {"train_loss": -27.336584091186523, "global_step": 474084, "epoch": 5711} {"train_loss": -27.337390899658203, "global_step": 474085, "epoch": 5711} {"train_loss": -27.034870147705078, "global_step": 474086, "epoch": 5711} {"train_loss": -27.305118560791016, "global_step": 474087, "epoch": 5711} {"train_loss": -27.172067642211914, "global_step": 474088, "epoch": 5711} {"train_loss": -27.477773666381836, "global_step": 474089, "epoch": 5711} {"train_loss": -27.52679443359375, "global_step": 474090, "epoch": 5711} {"train_loss": -27.518741607666016, "global_step": 474091, "epoch": 5711} {"train_loss": -26.99334716796875, "global_step": 474092, "epoch": 5711} {"train_loss": -27.055347442626953, "global_step": 474093, "epoch": 5711} {"train_loss": -26.932004928588867, "global_step": 474094, "epoch": 5711} {"train_loss": -27.011950136667274, "global_step": 474095, "epoch": 5711, "val_loss": 7004410.0} {"train_loss": -25.763391494750977, "global_step": 474096, "epoch": 5712} {"train_loss": -25.799997329711914, "global_step": 474097, "epoch": 5712} {"train_loss": -25.528539657592773, "global_step": 474098, "epoch": 5712} {"train_loss": -26.059417724609375, "global_step": 474099, "epoch": 5712} {"train_loss": -25.989282608032227, "global_step": 474100, "epoch": 5712} {"train_loss": -26.31500244140625, "global_step": 474101, "epoch": 5712} {"train_loss": -25.822370529174805, "global_step": 474102, "epoch": 5712} {"train_loss": -26.6921329498291, "global_step": 474103, "epoch": 5712} {"train_loss": -26.2768611907959, "global_step": 474104, "epoch": 5712} {"train_loss": -26.461332321166992, "global_step": 474105, "epoch": 5712} {"train_loss": -26.70587730407715, "global_step": 474106, "epoch": 5712} {"train_loss": -26.489118576049805, "global_step": 474107, "epoch": 5712} {"train_loss": -26.60392189025879, "global_step": 474108, "epoch": 5712} {"train_loss": -27.000585556030273, "global_step": 474109, "epoch": 5712} {"train_loss": -26.57668113708496, "global_step": 474110, "epoch": 5712} {"train_loss": -26.62056541442871, "global_step": 474111, "epoch": 5712} {"train_loss": -26.893268585205078, "global_step": 474112, "epoch": 5712} {"train_loss": -26.63213539123535, "global_step": 474113, "epoch": 5712} {"train_loss": -26.823881149291992, "global_step": 474114, "epoch": 5712} {"train_loss": -26.548776626586914, "global_step": 474115, "epoch": 5712} {"train_loss": -26.456899642944336, "global_step": 474116, "epoch": 5712} {"train_loss": -26.9324951171875, "global_step": 474117, "epoch": 5712} {"train_loss": -27.206104278564453, "global_step": 474118, "epoch": 5712} {"train_loss": -26.762548446655273, "global_step": 474119, "epoch": 5712} {"train_loss": -27.36704444885254, "global_step": 474120, "epoch": 5712} {"train_loss": -26.937952041625977, "global_step": 474121, "epoch": 5712} {"train_loss": -26.80594825744629, "global_step": 474122, "epoch": 5712} {"train_loss": -27.185529708862305, "global_step": 474123, "epoch": 5712} {"train_loss": -26.846973419189453, "global_step": 474124, "epoch": 5712} {"train_loss": -27.00130271911621, "global_step": 474125, "epoch": 5712} {"train_loss": -26.948963165283203, "global_step": 474126, "epoch": 5712} {"train_loss": -27.016324996948242, "global_step": 474127, "epoch": 5712} {"train_loss": -27.048757553100586, "global_step": 474128, "epoch": 5712} {"train_loss": -27.237533569335938, "global_step": 474129, "epoch": 5712} {"train_loss": -27.70441246032715, "global_step": 474130, "epoch": 5712} {"train_loss": -26.90741539001465, "global_step": 474131, "epoch": 5712} {"train_loss": -26.982221603393555, "global_step": 474132, "epoch": 5712} {"train_loss": -27.28848648071289, "global_step": 474133, "epoch": 5712} {"train_loss": -27.4558162689209, "global_step": 474134, "epoch": 5712} {"train_loss": -27.4499454498291, "global_step": 474135, "epoch": 5712} {"train_loss": -27.511072158813477, "global_step": 474136, "epoch": 5712} {"train_loss": -27.038293838500977, "global_step": 474137, "epoch": 5712} {"train_loss": -27.03852653503418, "global_step": 474138, "epoch": 5712} {"train_loss": -27.446151733398438, "global_step": 474139, "epoch": 5712} {"train_loss": -27.290231704711914, "global_step": 474140, "epoch": 5712} {"train_loss": -27.357349395751953, "global_step": 474141, "epoch": 5712} {"train_loss": -27.244159698486328, "global_step": 474142, "epoch": 5712} {"train_loss": -26.98947525024414, "global_step": 474143, "epoch": 5712} {"train_loss": -27.70464515686035, "global_step": 474144, "epoch": 5712} {"train_loss": -27.32257652282715, "global_step": 474145, "epoch": 5712} {"train_loss": -27.535919189453125, "global_step": 474146, "epoch": 5712} {"train_loss": -27.3292293548584, "global_step": 474147, "epoch": 5712} {"train_loss": -27.308103561401367, "global_step": 474148, "epoch": 5712} {"train_loss": -27.569934844970703, "global_step": 474149, "epoch": 5712} {"train_loss": -27.2965087890625, "global_step": 474150, "epoch": 5712} {"train_loss": -27.694334030151367, "global_step": 474151, "epoch": 5712} {"train_loss": -27.18067741394043, "global_step": 474152, "epoch": 5712} {"train_loss": -27.382314682006836, "global_step": 474153, "epoch": 5712} {"train_loss": -27.400999069213867, "global_step": 474154, "epoch": 5712} {"train_loss": -27.19239616394043, "global_step": 474155, "epoch": 5712} {"train_loss": -27.462514877319336, "global_step": 474156, "epoch": 5712} {"train_loss": -27.600540161132812, "global_step": 474157, "epoch": 5712} {"train_loss": -27.27457046508789, "global_step": 474158, "epoch": 5712} {"train_loss": -27.633087158203125, "global_step": 474159, "epoch": 5712} {"train_loss": -27.2553653717041, "global_step": 474160, "epoch": 5712} {"train_loss": -27.135034561157227, "global_step": 474161, "epoch": 5712} {"train_loss": -25.75522232055664, "global_step": 474162, "epoch": 5712} {"train_loss": -24.38056755065918, "global_step": 474163, "epoch": 5712} {"train_loss": -25.436817169189453, "global_step": 474164, "epoch": 5712} {"train_loss": -27.3427791595459, "global_step": 474165, "epoch": 5712} {"train_loss": -26.021366119384766, "global_step": 474166, "epoch": 5712} {"train_loss": -26.526769638061523, "global_step": 474167, "epoch": 5712} {"train_loss": -26.45880699157715, "global_step": 474168, "epoch": 5712} {"train_loss": -26.493366241455078, "global_step": 474169, "epoch": 5712} {"train_loss": -26.411767959594727, "global_step": 474170, "epoch": 5712} {"train_loss": -26.586109161376953, "global_step": 474171, "epoch": 5712} {"train_loss": -26.386621475219727, "global_step": 474172, "epoch": 5712} {"train_loss": -26.93195915222168, "global_step": 474173, "epoch": 5712} {"train_loss": -26.577978134155273, "global_step": 474174, "epoch": 5712} {"train_loss": -26.93438720703125, "global_step": 474175, "epoch": 5712} {"train_loss": -26.85603141784668, "global_step": 474176, "epoch": 5712} {"train_loss": -26.7486515045166, "global_step": 474177, "epoch": 5712} {"train_loss": -26.869156619152392, "global_step": 474178, "epoch": 5712, "val_loss": 6778759.5} {"train_loss": -24.706327438354492, "global_step": 474179, "epoch": 5713} {"train_loss": -24.99123191833496, "global_step": 474180, "epoch": 5713} {"train_loss": -25.77364158630371, "global_step": 474181, "epoch": 5713} {"train_loss": -25.807714462280273, "global_step": 474182, "epoch": 5713} {"train_loss": -26.184127807617188, "global_step": 474183, "epoch": 5713} {"train_loss": -25.915395736694336, "global_step": 474184, "epoch": 5713} {"train_loss": -26.169031143188477, "global_step": 474185, "epoch": 5713} {"train_loss": -26.5467529296875, "global_step": 474186, "epoch": 5713} {"train_loss": -26.173526763916016, "global_step": 474187, "epoch": 5713} {"train_loss": -26.564319610595703, "global_step": 474188, "epoch": 5713} {"train_loss": -26.415876388549805, "global_step": 474189, "epoch": 5713} {"train_loss": -26.215717315673828, "global_step": 474190, "epoch": 5713} {"train_loss": -26.62653923034668, "global_step": 474191, "epoch": 5713} {"train_loss": -26.53571128845215, "global_step": 474192, "epoch": 5713} {"train_loss": -26.507095336914062, "global_step": 474193, "epoch": 5713} {"train_loss": -26.556188583374023, "global_step": 474194, "epoch": 5713} {"train_loss": -26.66706657409668, "global_step": 474195, "epoch": 5713} {"train_loss": -26.6374568939209, "global_step": 474196, "epoch": 5713} {"train_loss": -26.51947593688965, "global_step": 474197, "epoch": 5713} {"train_loss": -26.825902938842773, "global_step": 474198, "epoch": 5713} {"train_loss": -26.604511260986328, "global_step": 474199, "epoch": 5713} {"train_loss": -26.563276290893555, "global_step": 474200, "epoch": 5713} {"train_loss": -26.716754913330078, "global_step": 474201, "epoch": 5713} {"train_loss": -27.370691299438477, "global_step": 474202, "epoch": 5713} {"train_loss": -27.187870025634766, "global_step": 474203, "epoch": 5713} {"train_loss": -26.70221519470215, "global_step": 474204, "epoch": 5713} {"train_loss": -26.94745445251465, "global_step": 474205, "epoch": 5713} {"train_loss": -27.06910514831543, "global_step": 474206, "epoch": 5713} {"train_loss": -27.037582397460938, "global_step": 474207, "epoch": 5713} {"train_loss": -27.11249351501465, "global_step": 474208, "epoch": 5713} {"train_loss": -26.788898468017578, "global_step": 474209, "epoch": 5713} {"train_loss": -27.0546817779541, "global_step": 474210, "epoch": 5713} {"train_loss": -26.953107833862305, "global_step": 474211, "epoch": 5713} {"train_loss": -27.128162384033203, "global_step": 474212, "epoch": 5713} {"train_loss": -27.18147850036621, "global_step": 474213, "epoch": 5713} {"train_loss": -27.237131118774414, "global_step": 474214, "epoch": 5713} {"train_loss": -27.45697021484375, "global_step": 474215, "epoch": 5713} {"train_loss": -26.948949813842773, "global_step": 474216, "epoch": 5713} {"train_loss": -27.26251220703125, "global_step": 474217, "epoch": 5713} {"train_loss": -27.40608787536621, "global_step": 474218, "epoch": 5713} {"train_loss": -27.217071533203125, "global_step": 474219, "epoch": 5713} {"train_loss": -27.2944393157959, "global_step": 474220, "epoch": 5713} {"train_loss": -27.053821563720703, "global_step": 474221, "epoch": 5713} {"train_loss": -27.33747673034668, "global_step": 474222, "epoch": 5713} {"train_loss": -27.22596549987793, "global_step": 474223, "epoch": 5713} {"train_loss": -27.369735717773438, "global_step": 474224, "epoch": 5713} {"train_loss": -27.404541015625, "global_step": 474225, "epoch": 5713} {"train_loss": -27.536121368408203, "global_step": 474226, "epoch": 5713} {"train_loss": -27.01214027404785, "global_step": 474227, "epoch": 5713} {"train_loss": -27.08819580078125, "global_step": 474228, "epoch": 5713} {"train_loss": -27.734472274780273, "global_step": 474229, "epoch": 5713} {"train_loss": -26.762897491455078, "global_step": 474230, "epoch": 5713} {"train_loss": -27.25348472595215, "global_step": 474231, "epoch": 5713} {"train_loss": -26.9180850982666, "global_step": 474232, "epoch": 5713} {"train_loss": -26.749296188354492, "global_step": 474233, "epoch": 5713} {"train_loss": -27.205947875976562, "global_step": 474234, "epoch": 5713} {"train_loss": -26.984073638916016, "global_step": 474235, "epoch": 5713} {"train_loss": -27.17213249206543, "global_step": 474236, "epoch": 5713} {"train_loss": -26.848102569580078, "global_step": 474237, "epoch": 5713} {"train_loss": -27.5627384185791, "global_step": 474238, "epoch": 5713} {"train_loss": -27.0189151763916, "global_step": 474239, "epoch": 5713} {"train_loss": -26.92136573791504, "global_step": 474240, "epoch": 5713} {"train_loss": -27.342838287353516, "global_step": 474241, "epoch": 5713} {"train_loss": -26.99614906311035, "global_step": 474242, "epoch": 5713} {"train_loss": -27.180395126342773, "global_step": 474243, "epoch": 5713} {"train_loss": -27.009862899780273, "global_step": 474244, "epoch": 5713} {"train_loss": -27.48052406311035, "global_step": 474245, "epoch": 5713} {"train_loss": -27.09467887878418, "global_step": 474246, "epoch": 5713} {"train_loss": -27.279586791992188, "global_step": 474247, "epoch": 5713} {"train_loss": -27.21204948425293, "global_step": 474248, "epoch": 5713} {"train_loss": -27.171960830688477, "global_step": 474249, "epoch": 5713} {"train_loss": -27.11370277404785, "global_step": 474250, "epoch": 5713} {"train_loss": -27.36720085144043, "global_step": 474251, "epoch": 5713} {"train_loss": -26.82154655456543, "global_step": 474252, "epoch": 5713} {"train_loss": -27.196533203125, "global_step": 474253, "epoch": 5713} {"train_loss": -27.040821075439453, "global_step": 474254, "epoch": 5713} {"train_loss": -27.05414390563965, "global_step": 474255, "epoch": 5713} {"train_loss": -26.79052734375, "global_step": 474256, "epoch": 5713} {"train_loss": -26.80338478088379, "global_step": 474257, "epoch": 5713} {"train_loss": -27.21868324279785, "global_step": 474258, "epoch": 5713} {"train_loss": -27.193410873413086, "global_step": 474259, "epoch": 5713} {"train_loss": -27.103900909423828, "global_step": 474260, "epoch": 5713} {"train_loss": -26.90700271330684, "global_step": 474261, "epoch": 5713, "val_loss": 6855261.0} {"train_loss": -26.148441314697266, "global_step": 474262, "epoch": 5714} {"train_loss": -26.367877960205078, "global_step": 474263, "epoch": 5714} {"train_loss": -26.425138473510742, "global_step": 474264, "epoch": 5714} {"train_loss": -26.605627059936523, "global_step": 474265, "epoch": 5714} {"train_loss": -26.75531005859375, "global_step": 474266, "epoch": 5714} {"train_loss": -26.121322631835938, "global_step": 474267, "epoch": 5714} {"train_loss": -26.7486515045166, "global_step": 474268, "epoch": 5714} {"train_loss": -26.392385482788086, "global_step": 474269, "epoch": 5714} {"train_loss": -26.882715225219727, "global_step": 474270, "epoch": 5714} {"train_loss": -27.199018478393555, "global_step": 474271, "epoch": 5714} {"train_loss": -26.549102783203125, "global_step": 474272, "epoch": 5714} {"train_loss": -26.496448516845703, "global_step": 474273, "epoch": 5714} {"train_loss": -26.946701049804688, "global_step": 474274, "epoch": 5714} {"train_loss": -26.856048583984375, "global_step": 474275, "epoch": 5714} {"train_loss": -27.286298751831055, "global_step": 474276, "epoch": 5714} {"train_loss": -27.027679443359375, "global_step": 474277, "epoch": 5714} {"train_loss": -27.041889190673828, "global_step": 474278, "epoch": 5714} {"train_loss": -26.93532371520996, "global_step": 474279, "epoch": 5714} {"train_loss": -27.235532760620117, "global_step": 474280, "epoch": 5714} {"train_loss": -26.83466148376465, "global_step": 474281, "epoch": 5714} {"train_loss": -27.052534103393555, "global_step": 474282, "epoch": 5714} {"train_loss": -27.068105697631836, "global_step": 474283, "epoch": 5714} {"train_loss": -27.34431266784668, "global_step": 474284, "epoch": 5714} {"train_loss": -27.032272338867188, "global_step": 474285, "epoch": 5714} {"train_loss": -26.721296310424805, "global_step": 474286, "epoch": 5714} {"train_loss": -27.155567169189453, "global_step": 474287, "epoch": 5714} {"train_loss": -27.106592178344727, "global_step": 474288, "epoch": 5714} {"train_loss": -27.228057861328125, "global_step": 474289, "epoch": 5714} {"train_loss": -27.217859268188477, "global_step": 474290, "epoch": 5714} {"train_loss": -27.37369728088379, "global_step": 474291, "epoch": 5714} {"train_loss": -27.41643714904785, "global_step": 474292, "epoch": 5714} {"train_loss": -26.873397827148438, "global_step": 474293, "epoch": 5714} {"train_loss": -27.034255981445312, "global_step": 474294, "epoch": 5714} {"train_loss": -27.239303588867188, "global_step": 474295, "epoch": 5714} {"train_loss": -26.620330810546875, "global_step": 474296, "epoch": 5714} {"train_loss": -27.1732120513916, "global_step": 474297, "epoch": 5714} {"train_loss": -27.329853057861328, "global_step": 474298, "epoch": 5714} {"train_loss": -27.1241455078125, "global_step": 474299, "epoch": 5714} {"train_loss": -26.878137588500977, "global_step": 474300, "epoch": 5714} {"train_loss": -27.053293228149414, "global_step": 474301, "epoch": 5714} {"train_loss": -27.082141876220703, "global_step": 474302, "epoch": 5714} {"train_loss": -27.08149528503418, "global_step": 474303, "epoch": 5714} {"train_loss": -27.034149169921875, "global_step": 474304, "epoch": 5714} {"train_loss": -27.33441734313965, "global_step": 474305, "epoch": 5714} {"train_loss": -27.5778865814209, "global_step": 474306, "epoch": 5714} {"train_loss": -27.19464111328125, "global_step": 474307, "epoch": 5714} {"train_loss": -27.078744888305664, "global_step": 474308, "epoch": 5714} {"train_loss": -27.730243682861328, "global_step": 474309, "epoch": 5714} {"train_loss": -27.196313858032227, "global_step": 474310, "epoch": 5714} {"train_loss": -26.917478561401367, "global_step": 474311, "epoch": 5714} {"train_loss": -26.527332305908203, "global_step": 474312, "epoch": 5714} {"train_loss": -26.833417892456055, "global_step": 474313, "epoch": 5714} {"train_loss": -26.996484756469727, "global_step": 474314, "epoch": 5714} {"train_loss": -26.982343673706055, "global_step": 474315, "epoch": 5714} {"train_loss": -27.71377944946289, "global_step": 474316, "epoch": 5714} {"train_loss": -27.191425323486328, "global_step": 474317, "epoch": 5714} {"train_loss": -27.397205352783203, "global_step": 474318, "epoch": 5714} {"train_loss": -27.3984375, "global_step": 474319, "epoch": 5714} {"train_loss": -27.178436279296875, "global_step": 474320, "epoch": 5714} {"train_loss": -27.274389266967773, "global_step": 474321, "epoch": 5714} {"train_loss": -26.983474731445312, "global_step": 474322, "epoch": 5714} {"train_loss": -26.67877197265625, "global_step": 474323, "epoch": 5714} {"train_loss": -27.351959228515625, "global_step": 474324, "epoch": 5714} {"train_loss": -27.682342529296875, "global_step": 474325, "epoch": 5714} {"train_loss": -27.145151138305664, "global_step": 474326, "epoch": 5714} {"train_loss": -27.380813598632812, "global_step": 474327, "epoch": 5714} {"train_loss": -27.15643310546875, "global_step": 474328, "epoch": 5714} {"train_loss": -27.43043327331543, "global_step": 474329, "epoch": 5714} {"train_loss": -27.163476943969727, "global_step": 474330, "epoch": 5714} {"train_loss": -27.16660499572754, "global_step": 474331, "epoch": 5714} {"train_loss": -27.075942993164062, "global_step": 474332, "epoch": 5714} {"train_loss": -27.111753463745117, "global_step": 474333, "epoch": 5714} {"train_loss": -26.96559715270996, "global_step": 474334, "epoch": 5714} {"train_loss": -26.976346969604492, "global_step": 474335, "epoch": 5714} {"train_loss": -26.890365600585938, "global_step": 474336, "epoch": 5714} {"train_loss": -26.854721069335938, "global_step": 474337, "epoch": 5714} {"train_loss": -26.98634910583496, "global_step": 474338, "epoch": 5714} {"train_loss": -27.235742568969727, "global_step": 474339, "epoch": 5714} {"train_loss": -27.041034698486328, "global_step": 474340, "epoch": 5714} {"train_loss": -27.059900283813477, "global_step": 474341, "epoch": 5714} {"train_loss": -26.942493438720703, "global_step": 474342, "epoch": 5714} {"train_loss": -27.4693660736084, "global_step": 474343, "epoch": 5714} {"train_loss": -27.049068152186383, "global_step": 474344, "epoch": 5714, "val_loss": 6805716.0} {"train_loss": -26.192462921142578, "global_step": 474345, "epoch": 5715} {"train_loss": -26.598379135131836, "global_step": 474346, "epoch": 5715} {"train_loss": -25.986846923828125, "global_step": 474347, "epoch": 5715} {"train_loss": -26.742673873901367, "global_step": 474348, "epoch": 5715} {"train_loss": -26.603113174438477, "global_step": 474349, "epoch": 5715} {"train_loss": -27.0858211517334, "global_step": 474350, "epoch": 5715} {"train_loss": -26.786596298217773, "global_step": 474351, "epoch": 5715} {"train_loss": -26.557621002197266, "global_step": 474352, "epoch": 5715} {"train_loss": -27.090484619140625, "global_step": 474353, "epoch": 5715} {"train_loss": -26.504093170166016, "global_step": 474354, "epoch": 5715} {"train_loss": -26.88651466369629, "global_step": 474355, "epoch": 5715} {"train_loss": -26.92022132873535, "global_step": 474356, "epoch": 5715} {"train_loss": -26.687744140625, "global_step": 474357, "epoch": 5715} {"train_loss": -27.07342529296875, "global_step": 474358, "epoch": 5715} {"train_loss": -26.950937271118164, "global_step": 474359, "epoch": 5715} {"train_loss": -26.78993034362793, "global_step": 474360, "epoch": 5715} {"train_loss": -27.020105361938477, "global_step": 474361, "epoch": 5715} {"train_loss": -26.845739364624023, "global_step": 474362, "epoch": 5715} {"train_loss": -27.101552963256836, "global_step": 474363, "epoch": 5715} {"train_loss": -27.065723419189453, "global_step": 474364, "epoch": 5715} {"train_loss": -26.7453556060791, "global_step": 474365, "epoch": 5715} {"train_loss": -27.403661727905273, "global_step": 474366, "epoch": 5715} {"train_loss": -26.893362045288086, "global_step": 474367, "epoch": 5715} {"train_loss": -27.106042861938477, "global_step": 474368, "epoch": 5715} {"train_loss": -27.0346622467041, "global_step": 474369, "epoch": 5715} {"train_loss": -27.13035011291504, "global_step": 474370, "epoch": 5715} {"train_loss": -27.102514266967773, "global_step": 474371, "epoch": 5715} {"train_loss": -27.430042266845703, "global_step": 474372, "epoch": 5715} {"train_loss": -26.939590454101562, "global_step": 474373, "epoch": 5715} {"train_loss": -27.462223052978516, "global_step": 474374, "epoch": 5715} {"train_loss": -27.31756591796875, "global_step": 474375, "epoch": 5715} {"train_loss": -27.344562530517578, "global_step": 474376, "epoch": 5715} {"train_loss": -27.007816314697266, "global_step": 474377, "epoch": 5715} {"train_loss": -27.093067169189453, "global_step": 474378, "epoch": 5715} {"train_loss": -27.360361099243164, "global_step": 474379, "epoch": 5715} {"train_loss": -27.270538330078125, "global_step": 474380, "epoch": 5715} {"train_loss": -27.04184341430664, "global_step": 474381, "epoch": 5715} {"train_loss": -27.462671279907227, "global_step": 474382, "epoch": 5715} {"train_loss": -27.30221939086914, "global_step": 474383, "epoch": 5715} {"train_loss": -27.3104248046875, "global_step": 474384, "epoch": 5715} {"train_loss": -27.545568466186523, "global_step": 474385, "epoch": 5715} {"train_loss": -27.63274574279785, "global_step": 474386, "epoch": 5715} {"train_loss": -27.27237319946289, "global_step": 474387, "epoch": 5715} {"train_loss": -27.441532135009766, "global_step": 474388, "epoch": 5715} {"train_loss": -27.384435653686523, "global_step": 474389, "epoch": 5715} {"train_loss": -27.21930503845215, "global_step": 474390, "epoch": 5715} {"train_loss": -27.087020874023438, "global_step": 474391, "epoch": 5715} {"train_loss": -27.18349266052246, "global_step": 474392, "epoch": 5715} {"train_loss": -27.05084228515625, "global_step": 474393, "epoch": 5715} {"train_loss": -27.44342613220215, "global_step": 474394, "epoch": 5715} {"train_loss": -27.288232803344727, "global_step": 474395, "epoch": 5715} {"train_loss": -27.030542373657227, "global_step": 474396, "epoch": 5715} {"train_loss": -27.085981369018555, "global_step": 474397, "epoch": 5715} {"train_loss": -27.231983184814453, "global_step": 474398, "epoch": 5715} {"train_loss": -27.196674346923828, "global_step": 474399, "epoch": 5715} {"train_loss": -27.21728515625, "global_step": 474400, "epoch": 5715} {"train_loss": -27.343036651611328, "global_step": 474401, "epoch": 5715} {"train_loss": -27.208297729492188, "global_step": 474402, "epoch": 5715} {"train_loss": -27.389341354370117, "global_step": 474403, "epoch": 5715} {"train_loss": -26.999958038330078, "global_step": 474404, "epoch": 5715} {"train_loss": -27.359785079956055, "global_step": 474405, "epoch": 5715} {"train_loss": -27.177282333374023, "global_step": 474406, "epoch": 5715} {"train_loss": -27.241230010986328, "global_step": 474407, "epoch": 5715} {"train_loss": -27.373823165893555, "global_step": 474408, "epoch": 5715} {"train_loss": -27.422666549682617, "global_step": 474409, "epoch": 5715} {"train_loss": -27.58613395690918, "global_step": 474410, "epoch": 5715} {"train_loss": -27.398244857788086, "global_step": 474411, "epoch": 5715} {"train_loss": -27.249692916870117, "global_step": 474412, "epoch": 5715} {"train_loss": -27.420581817626953, "global_step": 474413, "epoch": 5715} {"train_loss": -27.0167236328125, "global_step": 474414, "epoch": 5715} {"train_loss": -26.596527099609375, "global_step": 474415, "epoch": 5715} {"train_loss": -26.606769561767578, "global_step": 474416, "epoch": 5715} {"train_loss": -26.483835220336914, "global_step": 474417, "epoch": 5715} {"train_loss": -27.06110954284668, "global_step": 474418, "epoch": 5715} {"train_loss": -27.134870529174805, "global_step": 474419, "epoch": 5715} {"train_loss": -27.134435653686523, "global_step": 474420, "epoch": 5715} {"train_loss": -26.83368492126465, "global_step": 474421, "epoch": 5715} {"train_loss": -26.834686279296875, "global_step": 474422, "epoch": 5715} {"train_loss": -27.18768310546875, "global_step": 474423, "epoch": 5715} {"train_loss": -27.21284294128418, "global_step": 474424, "epoch": 5715} {"train_loss": -26.92103385925293, "global_step": 474425, "epoch": 5715} {"train_loss": -27.041400909423828, "global_step": 474426, "epoch": 5715} {"train_loss": -27.05864184735769, "global_step": 474427, "epoch": 5715, "val_loss": 6856650.0} {"train_loss": -25.430500030517578, "global_step": 474428, "epoch": 5716} {"train_loss": -24.242631912231445, "global_step": 474429, "epoch": 5716} {"train_loss": -25.955097198486328, "global_step": 474430, "epoch": 5716} {"train_loss": -26.1297550201416, "global_step": 474431, "epoch": 5716} {"train_loss": -25.822874069213867, "global_step": 474432, "epoch": 5716} {"train_loss": -26.095380783081055, "global_step": 474433, "epoch": 5716} {"train_loss": -26.070539474487305, "global_step": 474434, "epoch": 5716} {"train_loss": -25.510473251342773, "global_step": 474435, "epoch": 5716} {"train_loss": -26.454877853393555, "global_step": 474436, "epoch": 5716} {"train_loss": -25.262065887451172, "global_step": 474437, "epoch": 5716} {"train_loss": -25.911237716674805, "global_step": 474438, "epoch": 5716} {"train_loss": -26.483083724975586, "global_step": 474439, "epoch": 5716} {"train_loss": -26.3245849609375, "global_step": 474440, "epoch": 5716} {"train_loss": -26.236303329467773, "global_step": 474441, "epoch": 5716} {"train_loss": -26.3343563079834, "global_step": 474442, "epoch": 5716} {"train_loss": -26.750009536743164, "global_step": 474443, "epoch": 5716} {"train_loss": -26.170148849487305, "global_step": 474444, "epoch": 5716} {"train_loss": -26.356653213500977, "global_step": 474445, "epoch": 5716} {"train_loss": -26.224411010742188, "global_step": 474446, "epoch": 5716} {"train_loss": -26.466644287109375, "global_step": 474447, "epoch": 5716} {"train_loss": -26.628772735595703, "global_step": 474448, "epoch": 5716} {"train_loss": -26.97378921508789, "global_step": 474449, "epoch": 5716} {"train_loss": -26.522809982299805, "global_step": 474450, "epoch": 5716} {"train_loss": -26.97236442565918, "global_step": 474451, "epoch": 5716} {"train_loss": -26.989139556884766, "global_step": 474452, "epoch": 5716} {"train_loss": -26.7911319732666, "global_step": 474453, "epoch": 5716} {"train_loss": -27.332077026367188, "global_step": 474454, "epoch": 5716} {"train_loss": -26.82090187072754, "global_step": 474455, "epoch": 5716} {"train_loss": -26.716283798217773, "global_step": 474456, "epoch": 5716} {"train_loss": -27.002368927001953, "global_step": 474457, "epoch": 5716} {"train_loss": -26.763891220092773, "global_step": 474458, "epoch": 5716} {"train_loss": -26.703022003173828, "global_step": 474459, "epoch": 5716} {"train_loss": -26.949874877929688, "global_step": 474460, "epoch": 5716} {"train_loss": -27.229663848876953, "global_step": 474461, "epoch": 5716} {"train_loss": -27.159574508666992, "global_step": 474462, "epoch": 5716} {"train_loss": -27.080829620361328, "global_step": 474463, "epoch": 5716} {"train_loss": -27.248571395874023, "global_step": 474464, "epoch": 5716} {"train_loss": -27.091754913330078, "global_step": 474465, "epoch": 5716} {"train_loss": -26.674713134765625, "global_step": 474466, "epoch": 5716} {"train_loss": -27.290191650390625, "global_step": 474467, "epoch": 5716} {"train_loss": -27.5986385345459, "global_step": 474468, "epoch": 5716} {"train_loss": -27.248533248901367, "global_step": 474469, "epoch": 5716} {"train_loss": -27.003637313842773, "global_step": 474470, "epoch": 5716} {"train_loss": -27.237167358398438, "global_step": 474471, "epoch": 5716} {"train_loss": -27.049291610717773, "global_step": 474472, "epoch": 5716} {"train_loss": -27.344202041625977, "global_step": 474473, "epoch": 5716} {"train_loss": -27.232603073120117, "global_step": 474474, "epoch": 5716} {"train_loss": -27.514373779296875, "global_step": 474475, "epoch": 5716} {"train_loss": -27.147382736206055, "global_step": 474476, "epoch": 5716} {"train_loss": -26.92866325378418, "global_step": 474477, "epoch": 5716} {"train_loss": -27.551904678344727, "global_step": 474478, "epoch": 5716} {"train_loss": -27.501447677612305, "global_step": 474479, "epoch": 5716} {"train_loss": -27.02716064453125, "global_step": 474480, "epoch": 5716} {"train_loss": -26.855703353881836, "global_step": 474481, "epoch": 5716} {"train_loss": -26.56943130493164, "global_step": 474482, "epoch": 5716} {"train_loss": -27.252307891845703, "global_step": 474483, "epoch": 5716} {"train_loss": -27.38850212097168, "global_step": 474484, "epoch": 5716} {"train_loss": -27.22356605529785, "global_step": 474485, "epoch": 5716} {"train_loss": -27.085092544555664, "global_step": 474486, "epoch": 5716} {"train_loss": -27.21759605407715, "global_step": 474487, "epoch": 5716} {"train_loss": -27.493793487548828, "global_step": 474488, "epoch": 5716} {"train_loss": -27.380224227905273, "global_step": 474489, "epoch": 5716} {"train_loss": -27.04141616821289, "global_step": 474490, "epoch": 5716} {"train_loss": -27.301023483276367, "global_step": 474491, "epoch": 5716} {"train_loss": -27.822885513305664, "global_step": 474492, "epoch": 5716} {"train_loss": -27.295637130737305, "global_step": 474493, "epoch": 5716} {"train_loss": -27.02788734436035, "global_step": 474494, "epoch": 5716} {"train_loss": -27.37055015563965, "global_step": 474495, "epoch": 5716} {"train_loss": -27.399084091186523, "global_step": 474496, "epoch": 5716} {"train_loss": -26.9807071685791, "global_step": 474497, "epoch": 5716} {"train_loss": -27.626760482788086, "global_step": 474498, "epoch": 5716} {"train_loss": -27.12212562561035, "global_step": 474499, "epoch": 5716} {"train_loss": -27.51688003540039, "global_step": 474500, "epoch": 5716} {"train_loss": -27.41982078552246, "global_step": 474501, "epoch": 5716} {"train_loss": -27.320829391479492, "global_step": 474502, "epoch": 5716} {"train_loss": -27.39204216003418, "global_step": 474503, "epoch": 5716} {"train_loss": -26.9993896484375, "global_step": 474504, "epoch": 5716} {"train_loss": -27.319971084594727, "global_step": 474505, "epoch": 5716} {"train_loss": -27.1677188873291, "global_step": 474506, "epoch": 5716} {"train_loss": -27.297870635986328, "global_step": 474507, "epoch": 5716} {"train_loss": -27.178136825561523, "global_step": 474508, "epoch": 5716} {"train_loss": -27.29876708984375, "global_step": 474509, "epoch": 5716} {"train_loss": -26.880329614662262, "global_step": 474510, "epoch": 5716, "val_loss": 6826488.0} {"train_loss": -26.194305419921875, "global_step": 474511, "epoch": 5717} {"train_loss": -26.362747192382812, "global_step": 474512, "epoch": 5717} {"train_loss": -26.542394638061523, "global_step": 474513, "epoch": 5717} {"train_loss": -26.59551429748535, "global_step": 474514, "epoch": 5717} {"train_loss": -26.3529052734375, "global_step": 474515, "epoch": 5717} {"train_loss": -26.719181060791016, "global_step": 474516, "epoch": 5717} {"train_loss": -26.493383407592773, "global_step": 474517, "epoch": 5717} {"train_loss": -26.53352165222168, "global_step": 474518, "epoch": 5717} {"train_loss": -26.701486587524414, "global_step": 474519, "epoch": 5717} {"train_loss": -26.68916130065918, "global_step": 474520, "epoch": 5717} {"train_loss": -26.897809982299805, "global_step": 474521, "epoch": 5717} {"train_loss": -26.89520263671875, "global_step": 474522, "epoch": 5717} {"train_loss": -26.658655166625977, "global_step": 474523, "epoch": 5717} {"train_loss": -26.909393310546875, "global_step": 474524, "epoch": 5717} {"train_loss": -26.918222427368164, "global_step": 474525, "epoch": 5717} {"train_loss": -26.87294578552246, "global_step": 474526, "epoch": 5717} {"train_loss": -26.852951049804688, "global_step": 474527, "epoch": 5717} {"train_loss": -26.898517608642578, "global_step": 474528, "epoch": 5717} {"train_loss": -26.893497467041016, "global_step": 474529, "epoch": 5717} {"train_loss": -26.817182540893555, "global_step": 474530, "epoch": 5717} {"train_loss": -27.185598373413086, "global_step": 474531, "epoch": 5717} {"train_loss": -26.8526668548584, "global_step": 474532, "epoch": 5717} {"train_loss": -27.104684829711914, "global_step": 474533, "epoch": 5717} {"train_loss": -27.146804809570312, "global_step": 474534, "epoch": 5717} {"train_loss": -26.967254638671875, "global_step": 474535, "epoch": 5717} {"train_loss": -27.02715492248535, "global_step": 474536, "epoch": 5717} {"train_loss": -27.0123233795166, "global_step": 474537, "epoch": 5717} {"train_loss": -26.969152450561523, "global_step": 474538, "epoch": 5717} {"train_loss": -27.418298721313477, "global_step": 474539, "epoch": 5717} {"train_loss": -27.063077926635742, "global_step": 474540, "epoch": 5717} {"train_loss": -26.985294342041016, "global_step": 474541, "epoch": 5717} {"train_loss": -26.857343673706055, "global_step": 474542, "epoch": 5717} {"train_loss": -27.360097885131836, "global_step": 474543, "epoch": 5717} {"train_loss": -27.3333797454834, "global_step": 474544, "epoch": 5717} {"train_loss": -27.018585205078125, "global_step": 474545, "epoch": 5717} {"train_loss": -27.52094078063965, "global_step": 474546, "epoch": 5717} {"train_loss": -27.05495262145996, "global_step": 474547, "epoch": 5717} {"train_loss": -27.38595962524414, "global_step": 474548, "epoch": 5717} {"train_loss": -27.00571632385254, "global_step": 474549, "epoch": 5717} {"train_loss": -27.374231338500977, "global_step": 474550, "epoch": 5717} {"train_loss": -27.306507110595703, "global_step": 474551, "epoch": 5717} {"train_loss": -27.388721466064453, "global_step": 474552, "epoch": 5717} {"train_loss": -27.34811782836914, "global_step": 474553, "epoch": 5717} {"train_loss": -27.39697265625, "global_step": 474554, "epoch": 5717} {"train_loss": -27.06662940979004, "global_step": 474555, "epoch": 5717} {"train_loss": -27.558862686157227, "global_step": 474556, "epoch": 5717} {"train_loss": -26.919910430908203, "global_step": 474557, "epoch": 5717} {"train_loss": -27.345584869384766, "global_step": 474558, "epoch": 5717} {"train_loss": -27.343231201171875, "global_step": 474559, "epoch": 5717} {"train_loss": -27.390111923217773, "global_step": 474560, "epoch": 5717} {"train_loss": -27.26740074157715, "global_step": 474561, "epoch": 5717} {"train_loss": -27.49220085144043, "global_step": 474562, "epoch": 5717} {"train_loss": -27.279193878173828, "global_step": 474563, "epoch": 5717} {"train_loss": -27.329431533813477, "global_step": 474564, "epoch": 5717} {"train_loss": -27.336673736572266, "global_step": 474565, "epoch": 5717} {"train_loss": -27.289331436157227, "global_step": 474566, "epoch": 5717} {"train_loss": -27.22021484375, "global_step": 474567, "epoch": 5717} {"train_loss": -27.406631469726562, "global_step": 474568, "epoch": 5717} {"train_loss": -27.701322555541992, "global_step": 474569, "epoch": 5717} {"train_loss": -26.745813369750977, "global_step": 474570, "epoch": 5717} {"train_loss": -27.265033721923828, "global_step": 474571, "epoch": 5717} {"train_loss": -27.298614501953125, "global_step": 474572, "epoch": 5717} {"train_loss": -27.131860733032227, "global_step": 474573, "epoch": 5717} {"train_loss": -27.516103744506836, "global_step": 474574, "epoch": 5717} {"train_loss": -27.162586212158203, "global_step": 474575, "epoch": 5717} {"train_loss": -27.00412368774414, "global_step": 474576, "epoch": 5717} {"train_loss": -27.053287506103516, "global_step": 474577, "epoch": 5717} {"train_loss": -27.248804092407227, "global_step": 474578, "epoch": 5717} {"train_loss": -27.323209762573242, "global_step": 474579, "epoch": 5717} {"train_loss": -27.344635009765625, "global_step": 474580, "epoch": 5717} {"train_loss": -27.481908798217773, "global_step": 474581, "epoch": 5717} {"train_loss": -27.303552627563477, "global_step": 474582, "epoch": 5717} {"train_loss": -27.637836456298828, "global_step": 474583, "epoch": 5717} {"train_loss": -27.40228843688965, "global_step": 474584, "epoch": 5717} {"train_loss": -27.698780059814453, "global_step": 474585, "epoch": 5717} {"train_loss": -27.294687271118164, "global_step": 474586, "epoch": 5717} {"train_loss": -27.5509033203125, "global_step": 474587, "epoch": 5717} {"train_loss": -27.446813583374023, "global_step": 474588, "epoch": 5717} {"train_loss": -27.420812606811523, "global_step": 474589, "epoch": 5717} {"train_loss": -27.347970962524414, "global_step": 474590, "epoch": 5717} {"train_loss": -27.233057022094727, "global_step": 474591, "epoch": 5717} {"train_loss": -27.089618682861328, "global_step": 474592, "epoch": 5717} {"train_loss": -27.11805189661233, "global_step": 474593, "epoch": 5717, "val_loss": 6775894.0} {"train_loss": -27.00129508972168, "global_step": 474594, "epoch": 5718} {"train_loss": -26.17827796936035, "global_step": 474595, "epoch": 5718} {"train_loss": -26.986547470092773, "global_step": 474596, "epoch": 5718} {"train_loss": -26.80600929260254, "global_step": 474597, "epoch": 5718} {"train_loss": -26.665252685546875, "global_step": 474598, "epoch": 5718} {"train_loss": -26.796051025390625, "global_step": 474599, "epoch": 5718} {"train_loss": -26.882099151611328, "global_step": 474600, "epoch": 5718} {"train_loss": -26.785736083984375, "global_step": 474601, "epoch": 5718} {"train_loss": -26.596561431884766, "global_step": 474602, "epoch": 5718} {"train_loss": -27.2286434173584, "global_step": 474603, "epoch": 5718} {"train_loss": -26.83845329284668, "global_step": 474604, "epoch": 5718} {"train_loss": -26.9251651763916, "global_step": 474605, "epoch": 5718} {"train_loss": -27.038373947143555, "global_step": 474606, "epoch": 5718} {"train_loss": -26.943378448486328, "global_step": 474607, "epoch": 5718} {"train_loss": -26.664899826049805, "global_step": 474608, "epoch": 5718} {"train_loss": -27.352935791015625, "global_step": 474609, "epoch": 5718} {"train_loss": -27.2166805267334, "global_step": 474610, "epoch": 5718} {"train_loss": -26.853307723999023, "global_step": 474611, "epoch": 5718} {"train_loss": -27.43665885925293, "global_step": 474612, "epoch": 5718} {"train_loss": -27.143232345581055, "global_step": 474613, "epoch": 5718} {"train_loss": -26.67511558532715, "global_step": 474614, "epoch": 5718} {"train_loss": -27.0294246673584, "global_step": 474615, "epoch": 5718} {"train_loss": -26.67275047302246, "global_step": 474616, "epoch": 5718} {"train_loss": -26.63856315612793, "global_step": 474617, "epoch": 5718} {"train_loss": -27.23575210571289, "global_step": 474618, "epoch": 5718} {"train_loss": -27.17701530456543, "global_step": 474619, "epoch": 5718} {"train_loss": -27.337263107299805, "global_step": 474620, "epoch": 5718} {"train_loss": -26.93680191040039, "global_step": 474621, "epoch": 5718} {"train_loss": -27.396955490112305, "global_step": 474622, "epoch": 5718} {"train_loss": -27.02072525024414, "global_step": 474623, "epoch": 5718} {"train_loss": -27.600229263305664, "global_step": 474624, "epoch": 5718} {"train_loss": -27.195758819580078, "global_step": 474625, "epoch": 5718} {"train_loss": -27.25385093688965, "global_step": 474626, "epoch": 5718} {"train_loss": -27.390607833862305, "global_step": 474627, "epoch": 5718} {"train_loss": -27.45928382873535, "global_step": 474628, "epoch": 5718} {"train_loss": -27.462615966796875, "global_step": 474629, "epoch": 5718} {"train_loss": -27.356048583984375, "global_step": 474630, "epoch": 5718} {"train_loss": -27.308609008789062, "global_step": 474631, "epoch": 5718} {"train_loss": -27.45953941345215, "global_step": 474632, "epoch": 5718} {"train_loss": -27.51738929748535, "global_step": 474633, "epoch": 5718} {"train_loss": -27.419055938720703, "global_step": 474634, "epoch": 5718} {"train_loss": -27.105915069580078, "global_step": 474635, "epoch": 5718} {"train_loss": -27.75908851623535, "global_step": 474636, "epoch": 5718} {"train_loss": -27.181594848632812, "global_step": 474637, "epoch": 5718} {"train_loss": -27.433324813842773, "global_step": 474638, "epoch": 5718} {"train_loss": -27.1035099029541, "global_step": 474639, "epoch": 5718} {"train_loss": -27.23451042175293, "global_step": 474640, "epoch": 5718} {"train_loss": -27.075666427612305, "global_step": 474641, "epoch": 5718} {"train_loss": -27.327640533447266, "global_step": 474642, "epoch": 5718} {"train_loss": -27.2228946685791, "global_step": 474643, "epoch": 5718} {"train_loss": -27.514440536499023, "global_step": 474644, "epoch": 5718} {"train_loss": -27.5513858795166, "global_step": 474645, "epoch": 5718} {"train_loss": -27.426130294799805, "global_step": 474646, "epoch": 5718} {"train_loss": -27.4075870513916, "global_step": 474647, "epoch": 5718} {"train_loss": -27.043760299682617, "global_step": 474648, "epoch": 5718} {"train_loss": -27.123382568359375, "global_step": 474649, "epoch": 5718} {"train_loss": -26.606225967407227, "global_step": 474650, "epoch": 5718} {"train_loss": -26.82903480529785, "global_step": 474651, "epoch": 5718} {"train_loss": -27.20863151550293, "global_step": 474652, "epoch": 5718} {"train_loss": -27.465993881225586, "global_step": 474653, "epoch": 5718} {"train_loss": -27.27718162536621, "global_step": 474654, "epoch": 5718} {"train_loss": -27.050907135009766, "global_step": 474655, "epoch": 5718} {"train_loss": -27.158447265625, "global_step": 474656, "epoch": 5718} {"train_loss": -27.406543731689453, "global_step": 474657, "epoch": 5718} {"train_loss": -27.2889404296875, "global_step": 474658, "epoch": 5718} {"train_loss": -27.53229331970215, "global_step": 474659, "epoch": 5718} {"train_loss": -27.32428550720215, "global_step": 474660, "epoch": 5718} {"train_loss": -27.345264434814453, "global_step": 474661, "epoch": 5718} {"train_loss": -27.29815673828125, "global_step": 474662, "epoch": 5718} {"train_loss": -27.455036163330078, "global_step": 474663, "epoch": 5718} {"train_loss": -27.053564071655273, "global_step": 474664, "epoch": 5718} {"train_loss": -27.158447265625, "global_step": 474665, "epoch": 5718} {"train_loss": -27.06080436706543, "global_step": 474666, "epoch": 5718} {"train_loss": -27.311872482299805, "global_step": 474667, "epoch": 5718} {"train_loss": -27.464004516601562, "global_step": 474668, "epoch": 5718} {"train_loss": -27.51319694519043, "global_step": 474669, "epoch": 5718} {"train_loss": -27.104658126831055, "global_step": 474670, "epoch": 5718} {"train_loss": -27.658008575439453, "global_step": 474671, "epoch": 5718} {"train_loss": -27.562305450439453, "global_step": 474672, "epoch": 5718} {"train_loss": -27.241321563720703, "global_step": 474673, "epoch": 5718} {"train_loss": -26.926044464111328, "global_step": 474674, "epoch": 5718} {"train_loss": -27.364660263061523, "global_step": 474675, "epoch": 5718} {"train_loss": -27.173797952123437, "global_step": 474676, "epoch": 5718, "val_loss": 6639964.0} {"train_loss": -19.975982666015625, "global_step": 474677, "epoch": 5719} {"train_loss": -24.42542839050293, "global_step": 474678, "epoch": 5719} {"train_loss": -22.886167526245117, "global_step": 474679, "epoch": 5719} {"train_loss": -22.0975284576416, "global_step": 474680, "epoch": 5719} {"train_loss": -24.221906661987305, "global_step": 474681, "epoch": 5719} {"train_loss": -24.330053329467773, "global_step": 474682, "epoch": 5719} {"train_loss": -23.964324951171875, "global_step": 474683, "epoch": 5719} {"train_loss": -24.631942749023438, "global_step": 474684, "epoch": 5719} {"train_loss": -24.630773544311523, "global_step": 474685, "epoch": 5719} {"train_loss": -24.986753463745117, "global_step": 474686, "epoch": 5719} {"train_loss": -24.621601104736328, "global_step": 474687, "epoch": 5719} {"train_loss": -24.936893463134766, "global_step": 474688, "epoch": 5719} {"train_loss": -24.91805648803711, "global_step": 474689, "epoch": 5719} {"train_loss": -25.275047302246094, "global_step": 474690, "epoch": 5719} {"train_loss": -25.38229751586914, "global_step": 474691, "epoch": 5719} {"train_loss": -25.530635833740234, "global_step": 474692, "epoch": 5719} {"train_loss": -25.4381046295166, "global_step": 474693, "epoch": 5719} {"train_loss": -25.47760581970215, "global_step": 474694, "epoch": 5719} {"train_loss": -25.560604095458984, "global_step": 474695, "epoch": 5719} {"train_loss": -25.652118682861328, "global_step": 474696, "epoch": 5719} {"train_loss": -25.636245727539062, "global_step": 474697, "epoch": 5719} {"train_loss": -25.823373794555664, "global_step": 474698, "epoch": 5719} {"train_loss": -25.94598388671875, "global_step": 474699, "epoch": 5719} {"train_loss": -25.583417892456055, "global_step": 474700, "epoch": 5719} {"train_loss": -25.905752182006836, "global_step": 474701, "epoch": 5719} {"train_loss": -26.168609619140625, "global_step": 474702, "epoch": 5719} {"train_loss": -26.087888717651367, "global_step": 474703, "epoch": 5719} {"train_loss": -26.091217041015625, "global_step": 474704, "epoch": 5719} {"train_loss": -25.952157974243164, "global_step": 474705, "epoch": 5719} {"train_loss": -26.397119522094727, "global_step": 474706, "epoch": 5719} {"train_loss": -26.125837326049805, "global_step": 474707, "epoch": 5719} {"train_loss": -26.126020431518555, "global_step": 474708, "epoch": 5719} {"train_loss": -26.291223526000977, "global_step": 474709, "epoch": 5719} {"train_loss": -26.64165687561035, "global_step": 474710, "epoch": 5719} {"train_loss": -26.49300193786621, "global_step": 474711, "epoch": 5719} {"train_loss": -26.259992599487305, "global_step": 474712, "epoch": 5719} {"train_loss": -26.641708374023438, "global_step": 474713, "epoch": 5719} {"train_loss": -26.732044219970703, "global_step": 474714, "epoch": 5719} {"train_loss": -26.759336471557617, "global_step": 474715, "epoch": 5719} {"train_loss": -26.601520538330078, "global_step": 474716, "epoch": 5719} {"train_loss": -26.81646156311035, "global_step": 474717, "epoch": 5719} {"train_loss": -26.888681411743164, "global_step": 474718, "epoch": 5719} {"train_loss": -26.64813232421875, "global_step": 474719, "epoch": 5719} {"train_loss": -26.949567794799805, "global_step": 474720, "epoch": 5719} {"train_loss": -26.63374900817871, "global_step": 474721, "epoch": 5719} {"train_loss": -26.807462692260742, "global_step": 474722, "epoch": 5719} {"train_loss": -26.7934627532959, "global_step": 474723, "epoch": 5719} {"train_loss": -26.985929489135742, "global_step": 474724, "epoch": 5719} {"train_loss": -26.688678741455078, "global_step": 474725, "epoch": 5719} {"train_loss": -27.084745407104492, "global_step": 474726, "epoch": 5719} {"train_loss": -27.138614654541016, "global_step": 474727, "epoch": 5719} {"train_loss": -27.183637619018555, "global_step": 474728, "epoch": 5719} {"train_loss": -27.10979652404785, "global_step": 474729, "epoch": 5719} {"train_loss": -26.972333908081055, "global_step": 474730, "epoch": 5719} {"train_loss": -27.07158851623535, "global_step": 474731, "epoch": 5719} {"train_loss": -27.005355834960938, "global_step": 474732, "epoch": 5719} {"train_loss": -27.225940704345703, "global_step": 474733, "epoch": 5719} {"train_loss": -27.0428466796875, "global_step": 474734, "epoch": 5719} {"train_loss": -27.22273063659668, "global_step": 474735, "epoch": 5719} {"train_loss": -27.04543113708496, "global_step": 474736, "epoch": 5719} {"train_loss": -26.942834854125977, "global_step": 474737, "epoch": 5719} {"train_loss": -27.191247940063477, "global_step": 474738, "epoch": 5719} {"train_loss": -27.231176376342773, "global_step": 474739, "epoch": 5719} {"train_loss": -27.234634399414062, "global_step": 474740, "epoch": 5719} {"train_loss": -27.376073837280273, "global_step": 474741, "epoch": 5719} {"train_loss": -27.12163734436035, "global_step": 474742, "epoch": 5719} {"train_loss": -27.385732650756836, "global_step": 474743, "epoch": 5719} {"train_loss": -27.193988800048828, "global_step": 474744, "epoch": 5719} {"train_loss": -27.04559326171875, "global_step": 474745, "epoch": 5719} {"train_loss": -27.28525733947754, "global_step": 474746, "epoch": 5719} {"train_loss": -27.026020050048828, "global_step": 474747, "epoch": 5719} {"train_loss": -27.32488441467285, "global_step": 474748, "epoch": 5719} {"train_loss": -27.42083740234375, "global_step": 474749, "epoch": 5719} {"train_loss": -27.16266441345215, "global_step": 474750, "epoch": 5719} {"train_loss": -27.35212516784668, "global_step": 474751, "epoch": 5719} {"train_loss": -27.061298370361328, "global_step": 474752, "epoch": 5719} {"train_loss": -26.882551193237305, "global_step": 474753, "epoch": 5719} {"train_loss": -27.153371810913086, "global_step": 474754, "epoch": 5719} {"train_loss": -26.90225601196289, "global_step": 474755, "epoch": 5719} {"train_loss": -27.052610397338867, "global_step": 474756, "epoch": 5719} {"train_loss": -27.56451416015625, "global_step": 474757, "epoch": 5719} {"train_loss": -27.391494750976562, "global_step": 474758, "epoch": 5719} {"train_loss": -26.22283172607422, "global_step": 474759, "epoch": 5719, "val_loss": 6646358.5} {"train_loss": -22.478490829467773, "global_step": 474760, "epoch": 5720} {"train_loss": -23.280668258666992, "global_step": 474761, "epoch": 5720} {"train_loss": -25.507539749145508, "global_step": 474762, "epoch": 5720} {"train_loss": -24.952207565307617, "global_step": 474763, "epoch": 5720} {"train_loss": -25.7730655670166, "global_step": 474764, "epoch": 5720} {"train_loss": -24.57510757446289, "global_step": 474765, "epoch": 5720} {"train_loss": -26.19776725769043, "global_step": 474766, "epoch": 5720} {"train_loss": -25.776874542236328, "global_step": 474767, "epoch": 5720} {"train_loss": -25.480697631835938, "global_step": 474768, "epoch": 5720} {"train_loss": -26.34929847717285, "global_step": 474769, "epoch": 5720} {"train_loss": -25.513639450073242, "global_step": 474770, "epoch": 5720} {"train_loss": -25.882160186767578, "global_step": 474771, "epoch": 5720} {"train_loss": -25.971887588500977, "global_step": 474772, "epoch": 5720} {"train_loss": -26.239093780517578, "global_step": 474773, "epoch": 5720} {"train_loss": -26.296472549438477, "global_step": 474774, "epoch": 5720} {"train_loss": -26.224964141845703, "global_step": 474775, "epoch": 5720} {"train_loss": -26.29762077331543, "global_step": 474776, "epoch": 5720} {"train_loss": -26.7038631439209, "global_step": 474777, "epoch": 5720} {"train_loss": -26.369855880737305, "global_step": 474778, "epoch": 5720} {"train_loss": -26.175140380859375, "global_step": 474779, "epoch": 5720} {"train_loss": -26.105697631835938, "global_step": 474780, "epoch": 5720} {"train_loss": -26.590986251831055, "global_step": 474781, "epoch": 5720} {"train_loss": -26.819843292236328, "global_step": 474782, "epoch": 5720} {"train_loss": -26.559192657470703, "global_step": 474783, "epoch": 5720} {"train_loss": -26.585416793823242, "global_step": 474784, "epoch": 5720} {"train_loss": -26.332050323486328, "global_step": 474785, "epoch": 5720} {"train_loss": -26.5643310546875, "global_step": 474786, "epoch": 5720} {"train_loss": -26.8234920501709, "global_step": 474787, "epoch": 5720} {"train_loss": -26.61441993713379, "global_step": 474788, "epoch": 5720} {"train_loss": -26.5003604888916, "global_step": 474789, "epoch": 5720} {"train_loss": -26.344526290893555, "global_step": 474790, "epoch": 5720} {"train_loss": -26.912418365478516, "global_step": 474791, "epoch": 5720} {"train_loss": -26.669652938842773, "global_step": 474792, "epoch": 5720} {"train_loss": -27.097986221313477, "global_step": 474793, "epoch": 5720} {"train_loss": -26.413068771362305, "global_step": 474794, "epoch": 5720} {"train_loss": -27.147367477416992, "global_step": 474795, "epoch": 5720} {"train_loss": -27.088363647460938, "global_step": 474796, "epoch": 5720} {"train_loss": -26.766366958618164, "global_step": 474797, "epoch": 5720} {"train_loss": -27.013586044311523, "global_step": 474798, "epoch": 5720} {"train_loss": -27.099267959594727, "global_step": 474799, "epoch": 5720} {"train_loss": -26.74860954284668, "global_step": 474800, "epoch": 5720} {"train_loss": -26.89276123046875, "global_step": 474801, "epoch": 5720} {"train_loss": -26.98247718811035, "global_step": 474802, "epoch": 5720} {"train_loss": -27.139673233032227, "global_step": 474803, "epoch": 5720} {"train_loss": -27.146284103393555, "global_step": 474804, "epoch": 5720} {"train_loss": -27.251815795898438, "global_step": 474805, "epoch": 5720} {"train_loss": -27.4249267578125, "global_step": 474806, "epoch": 5720} {"train_loss": -27.346221923828125, "global_step": 474807, "epoch": 5720} {"train_loss": -27.140073776245117, "global_step": 474808, "epoch": 5720} {"train_loss": -27.434619903564453, "global_step": 474809, "epoch": 5720} {"train_loss": -26.86594581604004, "global_step": 474810, "epoch": 5720} {"train_loss": -27.047399520874023, "global_step": 474811, "epoch": 5720} {"train_loss": -26.975446701049805, "global_step": 474812, "epoch": 5720} {"train_loss": -27.295734405517578, "global_step": 474813, "epoch": 5720} {"train_loss": -27.113555908203125, "global_step": 474814, "epoch": 5720} {"train_loss": -27.33154296875, "global_step": 474815, "epoch": 5720} {"train_loss": -27.171125411987305, "global_step": 474816, "epoch": 5720} {"train_loss": -27.586883544921875, "global_step": 474817, "epoch": 5720} {"train_loss": -26.994293212890625, "global_step": 474818, "epoch": 5720} {"train_loss": -27.469989776611328, "global_step": 474819, "epoch": 5720} {"train_loss": -27.211572647094727, "global_step": 474820, "epoch": 5720} {"train_loss": -27.09551429748535, "global_step": 474821, "epoch": 5720} {"train_loss": -26.92621421813965, "global_step": 474822, "epoch": 5720} {"train_loss": -27.095264434814453, "global_step": 474823, "epoch": 5720} {"train_loss": -27.238601684570312, "global_step": 474824, "epoch": 5720} {"train_loss": -27.08704948425293, "global_step": 474825, "epoch": 5720} {"train_loss": -26.966306686401367, "global_step": 474826, "epoch": 5720} {"train_loss": -26.818695068359375, "global_step": 474827, "epoch": 5720} {"train_loss": -26.9438419342041, "global_step": 474828, "epoch": 5720} {"train_loss": -27.14349937438965, "global_step": 474829, "epoch": 5720} {"train_loss": -26.617109298706055, "global_step": 474830, "epoch": 5720} {"train_loss": -26.9270076751709, "global_step": 474831, "epoch": 5720} {"train_loss": -27.1683292388916, "global_step": 474832, "epoch": 5720} {"train_loss": -27.150888442993164, "global_step": 474833, "epoch": 5720} {"train_loss": -27.470579147338867, "global_step": 474834, "epoch": 5720} {"train_loss": -27.234994888305664, "global_step": 474835, "epoch": 5720} {"train_loss": -27.319250106811523, "global_step": 474836, "epoch": 5720} {"train_loss": -26.773038864135742, "global_step": 474837, "epoch": 5720} {"train_loss": -27.26474380493164, "global_step": 474838, "epoch": 5720} {"train_loss": -27.093372344970703, "global_step": 474839, "epoch": 5720} {"train_loss": -27.144174575805664, "global_step": 474840, "epoch": 5720} {"train_loss": -26.61484718322754, "global_step": 474841, "epoch": 5720} {"train_loss": -26.65046632146261, "global_step": 474842, "epoch": 5720, "val_loss": 6626952.0} {"train_loss": -27.295791625976562, "global_step": 474843, "epoch": 5721} {"train_loss": -26.635400772094727, "global_step": 474844, "epoch": 5721} {"train_loss": -26.4346981048584, "global_step": 474845, "epoch": 5721} {"train_loss": -26.250446319580078, "global_step": 474846, "epoch": 5721} {"train_loss": -26.897306442260742, "global_step": 474847, "epoch": 5721} {"train_loss": -26.83713722229004, "global_step": 474848, "epoch": 5721} {"train_loss": -26.996448516845703, "global_step": 474849, "epoch": 5721} {"train_loss": -26.950653076171875, "global_step": 474850, "epoch": 5721} {"train_loss": -26.89727783203125, "global_step": 474851, "epoch": 5721} {"train_loss": -27.02056884765625, "global_step": 474852, "epoch": 5721} {"train_loss": -26.7513484954834, "global_step": 474853, "epoch": 5721} {"train_loss": -26.771100997924805, "global_step": 474854, "epoch": 5721} {"train_loss": -26.919294357299805, "global_step": 474855, "epoch": 5721} {"train_loss": -26.97124671936035, "global_step": 474856, "epoch": 5721} {"train_loss": -26.59760093688965, "global_step": 474857, "epoch": 5721} {"train_loss": -26.8865909576416, "global_step": 474858, "epoch": 5721} {"train_loss": -27.450851440429688, "global_step": 474859, "epoch": 5721} {"train_loss": -27.056848526000977, "global_step": 474860, "epoch": 5721} {"train_loss": -27.28055763244629, "global_step": 474861, "epoch": 5721} {"train_loss": -27.06827735900879, "global_step": 474862, "epoch": 5721} {"train_loss": -27.152555465698242, "global_step": 474863, "epoch": 5721} {"train_loss": -27.145206451416016, "global_step": 474864, "epoch": 5721} {"train_loss": -26.81134033203125, "global_step": 474865, "epoch": 5721} {"train_loss": -27.620441436767578, "global_step": 474866, "epoch": 5721} {"train_loss": -27.173654556274414, "global_step": 474867, "epoch": 5721} {"train_loss": -27.165624618530273, "global_step": 474868, "epoch": 5721} {"train_loss": -27.330106735229492, "global_step": 474869, "epoch": 5721} {"train_loss": -27.30994987487793, "global_step": 474870, "epoch": 5721} {"train_loss": -27.463470458984375, "global_step": 474871, "epoch": 5721} {"train_loss": -27.381790161132812, "global_step": 474872, "epoch": 5721} {"train_loss": -27.207412719726562, "global_step": 474873, "epoch": 5721} {"train_loss": -27.12041664123535, "global_step": 474874, "epoch": 5721} {"train_loss": -27.538114547729492, "global_step": 474875, "epoch": 5721} {"train_loss": -27.3846492767334, "global_step": 474876, "epoch": 5721} {"train_loss": -27.192419052124023, "global_step": 474877, "epoch": 5721} {"train_loss": -27.345823287963867, "global_step": 474878, "epoch": 5721} {"train_loss": -27.379541397094727, "global_step": 474879, "epoch": 5721} {"train_loss": -27.321435928344727, "global_step": 474880, "epoch": 5721} {"train_loss": -27.167226791381836, "global_step": 474881, "epoch": 5721} {"train_loss": -27.194110870361328, "global_step": 474882, "epoch": 5721} {"train_loss": -27.670957565307617, "global_step": 474883, "epoch": 5721} {"train_loss": -27.548538208007812, "global_step": 474884, "epoch": 5721} {"train_loss": -27.143218994140625, "global_step": 474885, "epoch": 5721} {"train_loss": -27.348058700561523, "global_step": 474886, "epoch": 5721} {"train_loss": -27.467121124267578, "global_step": 474887, "epoch": 5721} {"train_loss": -28.002796173095703, "global_step": 474888, "epoch": 5721} {"train_loss": -27.281339645385742, "global_step": 474889, "epoch": 5721} {"train_loss": -27.547637939453125, "global_step": 474890, "epoch": 5721} {"train_loss": -27.516576766967773, "global_step": 474891, "epoch": 5721} {"train_loss": -27.517648696899414, "global_step": 474892, "epoch": 5721} {"train_loss": -27.592121124267578, "global_step": 474893, "epoch": 5721} {"train_loss": -27.444900512695312, "global_step": 474894, "epoch": 5721} {"train_loss": -27.3946475982666, "global_step": 474895, "epoch": 5721} {"train_loss": -26.270360946655273, "global_step": 474896, "epoch": 5721} {"train_loss": -25.68536376953125, "global_step": 474897, "epoch": 5721} {"train_loss": -25.437223434448242, "global_step": 474898, "epoch": 5721} {"train_loss": -26.19154167175293, "global_step": 474899, "epoch": 5721} {"train_loss": -26.818044662475586, "global_step": 474900, "epoch": 5721} {"train_loss": -26.74650001525879, "global_step": 474901, "epoch": 5721} {"train_loss": -26.58323097229004, "global_step": 474902, "epoch": 5721} {"train_loss": -26.269311904907227, "global_step": 474903, "epoch": 5721} {"train_loss": -26.848373413085938, "global_step": 474904, "epoch": 5721} {"train_loss": -27.128026962280273, "global_step": 474905, "epoch": 5721} {"train_loss": -26.426013946533203, "global_step": 474906, "epoch": 5721} {"train_loss": -26.651931762695312, "global_step": 474907, "epoch": 5721} {"train_loss": -26.670886993408203, "global_step": 474908, "epoch": 5721} {"train_loss": -26.749591827392578, "global_step": 474909, "epoch": 5721} {"train_loss": -26.599287033081055, "global_step": 474910, "epoch": 5721} {"train_loss": -26.8265438079834, "global_step": 474911, "epoch": 5721} {"train_loss": -26.735858917236328, "global_step": 474912, "epoch": 5721} {"train_loss": -26.70649528503418, "global_step": 474913, "epoch": 5721} {"train_loss": -26.88054847717285, "global_step": 474914, "epoch": 5721} {"train_loss": -26.930164337158203, "global_step": 474915, "epoch": 5721} {"train_loss": -27.205488204956055, "global_step": 474916, "epoch": 5721} {"train_loss": -26.874847412109375, "global_step": 474917, "epoch": 5721} {"train_loss": -27.38006591796875, "global_step": 474918, "epoch": 5721} {"train_loss": -26.81768226623535, "global_step": 474919, "epoch": 5721} {"train_loss": -27.09137535095215, "global_step": 474920, "epoch": 5721} {"train_loss": -27.02667236328125, "global_step": 474921, "epoch": 5721} {"train_loss": -27.156644821166992, "global_step": 474922, "epoch": 5721} {"train_loss": -27.412372589111328, "global_step": 474923, "epoch": 5721} {"train_loss": -27.138479232788086, "global_step": 474924, "epoch": 5721} {"train_loss": -27.015424176871058, "global_step": 474925, "epoch": 5721, "val_loss": 6587066.0} {"train_loss": -26.876251220703125, "global_step": 474926, "epoch": 5722} {"train_loss": -26.930089950561523, "global_step": 474927, "epoch": 5722} {"train_loss": -26.657958984375, "global_step": 474928, "epoch": 5722} {"train_loss": -26.682525634765625, "global_step": 474929, "epoch": 5722} {"train_loss": -26.590167999267578, "global_step": 474930, "epoch": 5722} {"train_loss": -27.126657485961914, "global_step": 474931, "epoch": 5722} {"train_loss": -26.95521354675293, "global_step": 474932, "epoch": 5722} {"train_loss": -26.82198143005371, "global_step": 474933, "epoch": 5722} {"train_loss": -26.67951774597168, "global_step": 474934, "epoch": 5722} {"train_loss": -27.273578643798828, "global_step": 474935, "epoch": 5722} {"train_loss": -27.040979385375977, "global_step": 474936, "epoch": 5722} {"train_loss": -26.834714889526367, "global_step": 474937, "epoch": 5722} {"train_loss": -27.290771484375, "global_step": 474938, "epoch": 5722} {"train_loss": -26.984527587890625, "global_step": 474939, "epoch": 5722} {"train_loss": -27.694379806518555, "global_step": 474940, "epoch": 5722} {"train_loss": -27.028915405273438, "global_step": 474941, "epoch": 5722} {"train_loss": -26.85638999938965, "global_step": 474942, "epoch": 5722} {"train_loss": -27.283344268798828, "global_step": 474943, "epoch": 5722} {"train_loss": -27.032306671142578, "global_step": 474944, "epoch": 5722} {"train_loss": -27.364343643188477, "global_step": 474945, "epoch": 5722} {"train_loss": -26.971704483032227, "global_step": 474946, "epoch": 5722} {"train_loss": -27.07659339904785, "global_step": 474947, "epoch": 5722} {"train_loss": -27.038328170776367, "global_step": 474948, "epoch": 5722} {"train_loss": -27.114822387695312, "global_step": 474949, "epoch": 5722} {"train_loss": -27.391321182250977, "global_step": 474950, "epoch": 5722} {"train_loss": -27.60740089416504, "global_step": 474951, "epoch": 5722} {"train_loss": -27.365493774414062, "global_step": 474952, "epoch": 5722} {"train_loss": -27.4888973236084, "global_step": 474953, "epoch": 5722} {"train_loss": -27.327285766601562, "global_step": 474954, "epoch": 5722} {"train_loss": -27.165821075439453, "global_step": 474955, "epoch": 5722} {"train_loss": -27.0533390045166, "global_step": 474956, "epoch": 5722} {"train_loss": -27.241046905517578, "global_step": 474957, "epoch": 5722} {"train_loss": -27.1807804107666, "global_step": 474958, "epoch": 5722} {"train_loss": -27.366254806518555, "global_step": 474959, "epoch": 5722} {"train_loss": -27.476795196533203, "global_step": 474960, "epoch": 5722} {"train_loss": -27.2404842376709, "global_step": 474961, "epoch": 5722} {"train_loss": -27.27678871154785, "global_step": 474962, "epoch": 5722} {"train_loss": -27.316482543945312, "global_step": 474963, "epoch": 5722} {"train_loss": -27.253589630126953, "global_step": 474964, "epoch": 5722} {"train_loss": -26.88884925842285, "global_step": 474965, "epoch": 5722} {"train_loss": -27.139087677001953, "global_step": 474966, "epoch": 5722} {"train_loss": -27.620847702026367, "global_step": 474967, "epoch": 5722} {"train_loss": -27.00037956237793, "global_step": 474968, "epoch": 5722} {"train_loss": -27.395069122314453, "global_step": 474969, "epoch": 5722} {"train_loss": -27.453388214111328, "global_step": 474970, "epoch": 5722} {"train_loss": -27.48699378967285, "global_step": 474971, "epoch": 5722} {"train_loss": -27.467243194580078, "global_step": 474972, "epoch": 5722} {"train_loss": -27.296173095703125, "global_step": 474973, "epoch": 5722} {"train_loss": -27.389755249023438, "global_step": 474974, "epoch": 5722} {"train_loss": -27.106002807617188, "global_step": 474975, "epoch": 5722} {"train_loss": -26.76485252380371, "global_step": 474976, "epoch": 5722} {"train_loss": -27.3619384765625, "global_step": 474977, "epoch": 5722} {"train_loss": -27.260629653930664, "global_step": 474978, "epoch": 5722} {"train_loss": -27.1502742767334, "global_step": 474979, "epoch": 5722} {"train_loss": -27.3833065032959, "global_step": 474980, "epoch": 5722} {"train_loss": -27.17782974243164, "global_step": 474981, "epoch": 5722} {"train_loss": -27.645538330078125, "global_step": 474982, "epoch": 5722} {"train_loss": -27.567707061767578, "global_step": 474983, "epoch": 5722} {"train_loss": -27.325300216674805, "global_step": 474984, "epoch": 5722} {"train_loss": -27.192480087280273, "global_step": 474985, "epoch": 5722} {"train_loss": -26.958465576171875, "global_step": 474986, "epoch": 5722} {"train_loss": -27.058368682861328, "global_step": 474987, "epoch": 5722} {"train_loss": -27.491621017456055, "global_step": 474988, "epoch": 5722} {"train_loss": -27.178213119506836, "global_step": 474989, "epoch": 5722} {"train_loss": -27.25596046447754, "global_step": 474990, "epoch": 5722} {"train_loss": -26.82927894592285, "global_step": 474991, "epoch": 5722} {"train_loss": -26.475339889526367, "global_step": 474992, "epoch": 5722} {"train_loss": -26.9435977935791, "global_step": 474993, "epoch": 5722} {"train_loss": -26.91571617126465, "global_step": 474994, "epoch": 5722} {"train_loss": -27.214365005493164, "global_step": 474995, "epoch": 5722} {"train_loss": -26.969348907470703, "global_step": 474996, "epoch": 5722} {"train_loss": -26.796945571899414, "global_step": 474997, "epoch": 5722} {"train_loss": -27.098031997680664, "global_step": 474998, "epoch": 5722} {"train_loss": -27.168304443359375, "global_step": 474999, "epoch": 5722} {"train_loss": -27.4719181060791, "global_step": 475000, "epoch": 5722} {"train_loss": -26.628589630126953, "global_step": 475001, "epoch": 5722} {"train_loss": -26.604080200195312, "global_step": 475002, "epoch": 5722} {"train_loss": -26.50391960144043, "global_step": 475003, "epoch": 5722} {"train_loss": -27.0853271484375, "global_step": 475004, "epoch": 5722} {"train_loss": -27.502979278564453, "global_step": 475005, "epoch": 5722} {"train_loss": -27.20123863220215, "global_step": 475006, "epoch": 5722} {"train_loss": -27.313695907592773, "global_step": 475007, "epoch": 5722} {"train_loss": -27.149257453091174, "global_step": 475008, "epoch": 5722, "val_loss": 6622562.0} {"train_loss": -26.54095458984375, "global_step": 475009, "epoch": 5723} {"train_loss": -26.804931640625, "global_step": 475010, "epoch": 5723} {"train_loss": -26.716562271118164, "global_step": 475011, "epoch": 5723} {"train_loss": -27.104536056518555, "global_step": 475012, "epoch": 5723} {"train_loss": -27.13028335571289, "global_step": 475013, "epoch": 5723} {"train_loss": -27.457595825195312, "global_step": 475014, "epoch": 5723} {"train_loss": -26.869876861572266, "global_step": 475015, "epoch": 5723} {"train_loss": -27.227338790893555, "global_step": 475016, "epoch": 5723} {"train_loss": -26.866565704345703, "global_step": 475017, "epoch": 5723} {"train_loss": -27.239171981811523, "global_step": 475018, "epoch": 5723} {"train_loss": -27.1732234954834, "global_step": 475019, "epoch": 5723} {"train_loss": -27.323444366455078, "global_step": 475020, "epoch": 5723} {"train_loss": -27.230573654174805, "global_step": 475021, "epoch": 5723} {"train_loss": -27.371856689453125, "global_step": 475022, "epoch": 5723} {"train_loss": -26.91097068786621, "global_step": 475023, "epoch": 5723} {"train_loss": -27.454992294311523, "global_step": 475024, "epoch": 5723} {"train_loss": -27.32599449157715, "global_step": 475025, "epoch": 5723} {"train_loss": -27.46632957458496, "global_step": 475026, "epoch": 5723} {"train_loss": -26.823179244995117, "global_step": 475027, "epoch": 5723} {"train_loss": -27.230947494506836, "global_step": 475028, "epoch": 5723} {"train_loss": -27.188953399658203, "global_step": 475029, "epoch": 5723} {"train_loss": -27.291345596313477, "global_step": 475030, "epoch": 5723} {"train_loss": -27.42327308654785, "global_step": 475031, "epoch": 5723} {"train_loss": -27.57122802734375, "global_step": 475032, "epoch": 5723} {"train_loss": -27.428125381469727, "global_step": 475033, "epoch": 5723} {"train_loss": -27.097803115844727, "global_step": 475034, "epoch": 5723} {"train_loss": -27.411569595336914, "global_step": 475035, "epoch": 5723} {"train_loss": -26.89090347290039, "global_step": 475036, "epoch": 5723} {"train_loss": -26.987485885620117, "global_step": 475037, "epoch": 5723} {"train_loss": -27.08744239807129, "global_step": 475038, "epoch": 5723} {"train_loss": -26.889850616455078, "global_step": 475039, "epoch": 5723} {"train_loss": -26.584182739257812, "global_step": 475040, "epoch": 5723} {"train_loss": -27.052825927734375, "global_step": 475041, "epoch": 5723} {"train_loss": -27.011646270751953, "global_step": 475042, "epoch": 5723} {"train_loss": -27.06696891784668, "global_step": 475043, "epoch": 5723} {"train_loss": -26.67616081237793, "global_step": 475044, "epoch": 5723} {"train_loss": -27.227542877197266, "global_step": 475045, "epoch": 5723} {"train_loss": -27.020612716674805, "global_step": 475046, "epoch": 5723} {"train_loss": -27.24073600769043, "global_step": 475047, "epoch": 5723} {"train_loss": -26.765100479125977, "global_step": 475048, "epoch": 5723} {"train_loss": -27.245620727539062, "global_step": 475049, "epoch": 5723} {"train_loss": -27.3566951751709, "global_step": 475050, "epoch": 5723} {"train_loss": -27.053268432617188, "global_step": 475051, "epoch": 5723} {"train_loss": -27.223623275756836, "global_step": 475052, "epoch": 5723} {"train_loss": -27.40900230407715, "global_step": 475053, "epoch": 5723} {"train_loss": -27.361221313476562, "global_step": 475054, "epoch": 5723} {"train_loss": -27.54347038269043, "global_step": 475055, "epoch": 5723} {"train_loss": -27.07329750061035, "global_step": 475056, "epoch": 5723} {"train_loss": -27.494800567626953, "global_step": 475057, "epoch": 5723} {"train_loss": -27.405118942260742, "global_step": 475058, "epoch": 5723} {"train_loss": -27.36590576171875, "global_step": 475059, "epoch": 5723} {"train_loss": -27.520679473876953, "global_step": 475060, "epoch": 5723} {"train_loss": -27.21575927734375, "global_step": 475061, "epoch": 5723} {"train_loss": -27.015949249267578, "global_step": 475062, "epoch": 5723} {"train_loss": -27.75860023498535, "global_step": 475063, "epoch": 5723} {"train_loss": -27.202428817749023, "global_step": 475064, "epoch": 5723} {"train_loss": -27.436689376831055, "global_step": 475065, "epoch": 5723} {"train_loss": -27.178136825561523, "global_step": 475066, "epoch": 5723} {"train_loss": -27.43894386291504, "global_step": 475067, "epoch": 5723} {"train_loss": -27.256811141967773, "global_step": 475068, "epoch": 5723} {"train_loss": -27.088598251342773, "global_step": 475069, "epoch": 5723} {"train_loss": -27.2840518951416, "global_step": 475070, "epoch": 5723} {"train_loss": -27.320606231689453, "global_step": 475071, "epoch": 5723} {"train_loss": -27.239887237548828, "global_step": 475072, "epoch": 5723} {"train_loss": -26.973703384399414, "global_step": 475073, "epoch": 5723} {"train_loss": -26.800317764282227, "global_step": 475074, "epoch": 5723} {"train_loss": -26.89503288269043, "global_step": 475075, "epoch": 5723} {"train_loss": -27.12830924987793, "global_step": 475076, "epoch": 5723} {"train_loss": -27.15280532836914, "global_step": 475077, "epoch": 5723} {"train_loss": -27.120132446289062, "global_step": 475078, "epoch": 5723} {"train_loss": -27.1920108795166, "global_step": 475079, "epoch": 5723} {"train_loss": -26.939228057861328, "global_step": 475080, "epoch": 5723} {"train_loss": -27.2559871673584, "global_step": 475081, "epoch": 5723} {"train_loss": -27.235437393188477, "global_step": 475082, "epoch": 5723} {"train_loss": -27.1368350982666, "global_step": 475083, "epoch": 5723} {"train_loss": -27.000410079956055, "global_step": 475084, "epoch": 5723} {"train_loss": -27.742816925048828, "global_step": 475085, "epoch": 5723} {"train_loss": -27.032657623291016, "global_step": 475086, "epoch": 5723} {"train_loss": -27.6912899017334, "global_step": 475087, "epoch": 5723} {"train_loss": -27.166223526000977, "global_step": 475088, "epoch": 5723} {"train_loss": -27.330829620361328, "global_step": 475089, "epoch": 5723} {"train_loss": -27.072362899780273, "global_step": 475090, "epoch": 5723} {"train_loss": -27.191104590174664, "global_step": 475091, "epoch": 5723, "val_loss": 6616154.0} {"train_loss": -26.752197265625, "global_step": 475092, "epoch": 5724} {"train_loss": -25.982776641845703, "global_step": 475093, "epoch": 5724} {"train_loss": -26.453765869140625, "global_step": 475094, "epoch": 5724} {"train_loss": -27.033536911010742, "global_step": 475095, "epoch": 5724} {"train_loss": -26.91727066040039, "global_step": 475096, "epoch": 5724} {"train_loss": -26.978900909423828, "global_step": 475097, "epoch": 5724} {"train_loss": -27.25336265563965, "global_step": 475098, "epoch": 5724} {"train_loss": -26.9700984954834, "global_step": 475099, "epoch": 5724} {"train_loss": -26.987537384033203, "global_step": 475100, "epoch": 5724} {"train_loss": -27.073408126831055, "global_step": 475101, "epoch": 5724} {"train_loss": -26.85530662536621, "global_step": 475102, "epoch": 5724} {"train_loss": -27.092069625854492, "global_step": 475103, "epoch": 5724} {"train_loss": -27.180194854736328, "global_step": 475104, "epoch": 5724} {"train_loss": -27.108320236206055, "global_step": 475105, "epoch": 5724} {"train_loss": -26.73744773864746, "global_step": 475106, "epoch": 5724} {"train_loss": -27.08980369567871, "global_step": 475107, "epoch": 5724} {"train_loss": -27.185338973999023, "global_step": 475108, "epoch": 5724} {"train_loss": -27.019001007080078, "global_step": 475109, "epoch": 5724} {"train_loss": -26.946786880493164, "global_step": 475110, "epoch": 5724} {"train_loss": -27.149991989135742, "global_step": 475111, "epoch": 5724} {"train_loss": -27.160757064819336, "global_step": 475112, "epoch": 5724} {"train_loss": -27.079282760620117, "global_step": 475113, "epoch": 5724} {"train_loss": -26.95135498046875, "global_step": 475114, "epoch": 5724} {"train_loss": -27.042203903198242, "global_step": 475115, "epoch": 5724} {"train_loss": -27.258779525756836, "global_step": 475116, "epoch": 5724} {"train_loss": -27.405431747436523, "global_step": 475117, "epoch": 5724} {"train_loss": -26.818267822265625, "global_step": 475118, "epoch": 5724} {"train_loss": -27.363821029663086, "global_step": 475119, "epoch": 5724} {"train_loss": -27.197134017944336, "global_step": 475120, "epoch": 5724} {"train_loss": -27.31448745727539, "global_step": 475121, "epoch": 5724} {"train_loss": -27.32242202758789, "global_step": 475122, "epoch": 5724} {"train_loss": -27.179651260375977, "global_step": 475123, "epoch": 5724} {"train_loss": -27.17951011657715, "global_step": 475124, "epoch": 5724} {"train_loss": -26.940942764282227, "global_step": 475125, "epoch": 5724} {"train_loss": -27.13239097595215, "global_step": 475126, "epoch": 5724} {"train_loss": -27.172910690307617, "global_step": 475127, "epoch": 5724} {"train_loss": -27.3460636138916, "global_step": 475128, "epoch": 5724} {"train_loss": -27.506601333618164, "global_step": 475129, "epoch": 5724} {"train_loss": -27.35112953186035, "global_step": 475130, "epoch": 5724} {"train_loss": -27.298389434814453, "global_step": 475131, "epoch": 5724} {"train_loss": -27.375335693359375, "global_step": 475132, "epoch": 5724} {"train_loss": -27.202116012573242, "global_step": 475133, "epoch": 5724} {"train_loss": -27.308115005493164, "global_step": 475134, "epoch": 5724} {"train_loss": -27.759723663330078, "global_step": 475135, "epoch": 5724} {"train_loss": -27.0268497467041, "global_step": 475136, "epoch": 5724} {"train_loss": -27.512746810913086, "global_step": 475137, "epoch": 5724} {"train_loss": -27.33009147644043, "global_step": 475138, "epoch": 5724} {"train_loss": -27.227079391479492, "global_step": 475139, "epoch": 5724} {"train_loss": -27.321746826171875, "global_step": 475140, "epoch": 5724} {"train_loss": -27.457136154174805, "global_step": 475141, "epoch": 5724} {"train_loss": -27.213708877563477, "global_step": 475142, "epoch": 5724} {"train_loss": -27.37416648864746, "global_step": 475143, "epoch": 5724} {"train_loss": -27.5775089263916, "global_step": 475144, "epoch": 5724} {"train_loss": -27.3873348236084, "global_step": 475145, "epoch": 5724} {"train_loss": -27.533727645874023, "global_step": 475146, "epoch": 5724} {"train_loss": -27.286640167236328, "global_step": 475147, "epoch": 5724} {"train_loss": -27.452985763549805, "global_step": 475148, "epoch": 5724} {"train_loss": -27.354658126831055, "global_step": 475149, "epoch": 5724} {"train_loss": -26.96797752380371, "global_step": 475150, "epoch": 5724} {"train_loss": -26.83717155456543, "global_step": 475151, "epoch": 5724} {"train_loss": -27.233631134033203, "global_step": 475152, "epoch": 5724} {"train_loss": -27.29396629333496, "global_step": 475153, "epoch": 5724} {"train_loss": -27.52437400817871, "global_step": 475154, "epoch": 5724} {"train_loss": -27.005401611328125, "global_step": 475155, "epoch": 5724} {"train_loss": -27.009328842163086, "global_step": 475156, "epoch": 5724} {"train_loss": -27.377063751220703, "global_step": 475157, "epoch": 5724} {"train_loss": -27.395797729492188, "global_step": 475158, "epoch": 5724} {"train_loss": -27.090316772460938, "global_step": 475159, "epoch": 5724} {"train_loss": -27.362659454345703, "global_step": 475160, "epoch": 5724} {"train_loss": -27.384321212768555, "global_step": 475161, "epoch": 5724} {"train_loss": -27.52570915222168, "global_step": 475162, "epoch": 5724} {"train_loss": -27.288455963134766, "global_step": 475163, "epoch": 5724} {"train_loss": -27.4759521484375, "global_step": 475164, "epoch": 5724} {"train_loss": -27.2000732421875, "global_step": 475165, "epoch": 5724} {"train_loss": -27.17938232421875, "global_step": 475166, "epoch": 5724} {"train_loss": -27.46845054626465, "global_step": 475167, "epoch": 5724} {"train_loss": -27.487436294555664, "global_step": 475168, "epoch": 5724} {"train_loss": -27.2719669342041, "global_step": 475169, "epoch": 5724} {"train_loss": -27.377714157104492, "global_step": 475170, "epoch": 5724} {"train_loss": -27.429227828979492, "global_step": 475171, "epoch": 5724} {"train_loss": -27.443592071533203, "global_step": 475172, "epoch": 5724} {"train_loss": -26.7049617767334, "global_step": 475173, "epoch": 5724} {"train_loss": -27.176831279892518, "global_step": 475174, "epoch": 5724, "val_loss": 6636313.0} {"train_loss": -26.592771530151367, "global_step": 475175, "epoch": 5725} {"train_loss": -26.898935317993164, "global_step": 475176, "epoch": 5725} {"train_loss": -26.659332275390625, "global_step": 475177, "epoch": 5725} {"train_loss": -26.989057540893555, "global_step": 475178, "epoch": 5725} {"train_loss": -27.03108787536621, "global_step": 475179, "epoch": 5725} {"train_loss": -26.762958526611328, "global_step": 475180, "epoch": 5725} {"train_loss": -26.837665557861328, "global_step": 475181, "epoch": 5725} {"train_loss": -27.12196922302246, "global_step": 475182, "epoch": 5725} {"train_loss": -27.06538200378418, "global_step": 475183, "epoch": 5725} {"train_loss": -26.990217208862305, "global_step": 475184, "epoch": 5725} {"train_loss": -26.884723663330078, "global_step": 475185, "epoch": 5725} {"train_loss": -27.034809112548828, "global_step": 475186, "epoch": 5725} {"train_loss": -26.992630004882812, "global_step": 475187, "epoch": 5725} {"train_loss": -27.294189453125, "global_step": 475188, "epoch": 5725} {"train_loss": -26.581274032592773, "global_step": 475189, "epoch": 5725} {"train_loss": -27.163299560546875, "global_step": 475190, "epoch": 5725} {"train_loss": -27.20941162109375, "global_step": 475191, "epoch": 5725} {"train_loss": -26.965286254882812, "global_step": 475192, "epoch": 5725} {"train_loss": -27.249103546142578, "global_step": 475193, "epoch": 5725} {"train_loss": -27.359500885009766, "global_step": 475194, "epoch": 5725} {"train_loss": -26.80322265625, "global_step": 475195, "epoch": 5725} {"train_loss": -27.0550594329834, "global_step": 475196, "epoch": 5725} {"train_loss": -27.432266235351562, "global_step": 475197, "epoch": 5725} {"train_loss": -26.83778190612793, "global_step": 475198, "epoch": 5725} {"train_loss": -27.236988067626953, "global_step": 475199, "epoch": 5725} {"train_loss": -27.497243881225586, "global_step": 475200, "epoch": 5725} {"train_loss": -27.2032470703125, "global_step": 475201, "epoch": 5725} {"train_loss": -27.455066680908203, "global_step": 475202, "epoch": 5725} {"train_loss": -27.354461669921875, "global_step": 475203, "epoch": 5725} {"train_loss": -27.05442237854004, "global_step": 475204, "epoch": 5725} {"train_loss": -27.438953399658203, "global_step": 475205, "epoch": 5725} {"train_loss": -27.34540367126465, "global_step": 475206, "epoch": 5725} {"train_loss": -27.0214786529541, "global_step": 475207, "epoch": 5725} {"train_loss": -27.509435653686523, "global_step": 475208, "epoch": 5725} {"train_loss": -27.267181396484375, "global_step": 475209, "epoch": 5725} {"train_loss": -27.210477828979492, "global_step": 475210, "epoch": 5725} {"train_loss": -27.58888053894043, "global_step": 475211, "epoch": 5725} {"train_loss": -27.215106964111328, "global_step": 475212, "epoch": 5725} {"train_loss": -27.628311157226562, "global_step": 475213, "epoch": 5725} {"train_loss": -27.188400268554688, "global_step": 475214, "epoch": 5725} {"train_loss": -27.110456466674805, "global_step": 475215, "epoch": 5725} {"train_loss": -27.2476749420166, "global_step": 475216, "epoch": 5725} {"train_loss": -27.3062801361084, "global_step": 475217, "epoch": 5725} {"train_loss": -27.244903564453125, "global_step": 475218, "epoch": 5725} {"train_loss": -27.06109619140625, "global_step": 475219, "epoch": 5725} {"train_loss": -27.55817985534668, "global_step": 475220, "epoch": 5725} {"train_loss": -26.993122100830078, "global_step": 475221, "epoch": 5725} {"train_loss": -26.866546630859375, "global_step": 475222, "epoch": 5725} {"train_loss": -26.718305587768555, "global_step": 475223, "epoch": 5725} {"train_loss": -27.44122886657715, "global_step": 475224, "epoch": 5725} {"train_loss": -27.125356674194336, "global_step": 475225, "epoch": 5725} {"train_loss": -27.255544662475586, "global_step": 475226, "epoch": 5725} {"train_loss": -27.033843994140625, "global_step": 475227, "epoch": 5725} {"train_loss": -27.12601089477539, "global_step": 475228, "epoch": 5725} {"train_loss": -27.132104873657227, "global_step": 475229, "epoch": 5725} {"train_loss": -27.51849937438965, "global_step": 475230, "epoch": 5725} {"train_loss": -27.568090438842773, "global_step": 475231, "epoch": 5725} {"train_loss": -27.444265365600586, "global_step": 475232, "epoch": 5725} {"train_loss": -26.885272979736328, "global_step": 475233, "epoch": 5725} {"train_loss": -27.52869987487793, "global_step": 475234, "epoch": 5725} {"train_loss": -27.316043853759766, "global_step": 475235, "epoch": 5725} {"train_loss": -27.53265380859375, "global_step": 475236, "epoch": 5725} {"train_loss": -27.35089683532715, "global_step": 475237, "epoch": 5725} {"train_loss": -27.8037109375, "global_step": 475238, "epoch": 5725} {"train_loss": -27.077848434448242, "global_step": 475239, "epoch": 5725} {"train_loss": -27.399011611938477, "global_step": 475240, "epoch": 5725} {"train_loss": -27.164636611938477, "global_step": 475241, "epoch": 5725} {"train_loss": -27.433151245117188, "global_step": 475242, "epoch": 5725} {"train_loss": -27.35737419128418, "global_step": 475243, "epoch": 5725} {"train_loss": -27.55208396911621, "global_step": 475244, "epoch": 5725} {"train_loss": -27.69011878967285, "global_step": 475245, "epoch": 5725} {"train_loss": -27.592443466186523, "global_step": 475246, "epoch": 5725} {"train_loss": -27.52558708190918, "global_step": 475247, "epoch": 5725} {"train_loss": -27.532154083251953, "global_step": 475248, "epoch": 5725} {"train_loss": -27.27815818786621, "global_step": 475249, "epoch": 5725} {"train_loss": -27.29007339477539, "global_step": 475250, "epoch": 5725} {"train_loss": -27.630146026611328, "global_step": 475251, "epoch": 5725} {"train_loss": -27.190189361572266, "global_step": 475252, "epoch": 5725} {"train_loss": -27.20747947692871, "global_step": 475253, "epoch": 5725} {"train_loss": -27.051986694335938, "global_step": 475254, "epoch": 5725} {"train_loss": -26.918048858642578, "global_step": 475255, "epoch": 5725} {"train_loss": -27.448095321655273, "global_step": 475256, "epoch": 5725} {"train_loss": -27.207111312682372, "global_step": 475257, "epoch": 5725, "val_loss": 6605005.0} {"train_loss": -27.372955322265625, "global_step": 475258, "epoch": 5726} {"train_loss": -27.166339874267578, "global_step": 475259, "epoch": 5726} {"train_loss": -27.569080352783203, "global_step": 475260, "epoch": 5726} {"train_loss": -27.11982536315918, "global_step": 475261, "epoch": 5726} {"train_loss": -27.12676429748535, "global_step": 475262, "epoch": 5726} {"train_loss": -27.093408584594727, "global_step": 475263, "epoch": 5726} {"train_loss": -27.025617599487305, "global_step": 475264, "epoch": 5726} {"train_loss": -26.765676498413086, "global_step": 475265, "epoch": 5726} {"train_loss": -27.089624404907227, "global_step": 475266, "epoch": 5726} {"train_loss": -27.098388671875, "global_step": 475267, "epoch": 5726} {"train_loss": -27.192214965820312, "global_step": 475268, "epoch": 5726} {"train_loss": -27.330169677734375, "global_step": 475269, "epoch": 5726} {"train_loss": -27.43305015563965, "global_step": 475270, "epoch": 5726} {"train_loss": -27.23777198791504, "global_step": 475271, "epoch": 5726} {"train_loss": -27.33613395690918, "global_step": 475272, "epoch": 5726} {"train_loss": -27.0444278717041, "global_step": 475273, "epoch": 5726} {"train_loss": -27.54876136779785, "global_step": 475274, "epoch": 5726} {"train_loss": -27.28130531311035, "global_step": 475275, "epoch": 5726} {"train_loss": -27.299711227416992, "global_step": 475276, "epoch": 5726} {"train_loss": -27.22177505493164, "global_step": 475277, "epoch": 5726} {"train_loss": -27.3187198638916, "global_step": 475278, "epoch": 5726} {"train_loss": -26.8950252532959, "global_step": 475279, "epoch": 5726} {"train_loss": -27.2514705657959, "global_step": 475280, "epoch": 5726} {"train_loss": -27.060705184936523, "global_step": 475281, "epoch": 5726} {"train_loss": -27.596439361572266, "global_step": 475282, "epoch": 5726} {"train_loss": -27.553678512573242, "global_step": 475283, "epoch": 5726} {"train_loss": -27.21675682067871, "global_step": 475284, "epoch": 5726} {"train_loss": -27.35833168029785, "global_step": 475285, "epoch": 5726} {"train_loss": -27.45038414001465, "global_step": 475286, "epoch": 5726} {"train_loss": -27.13386344909668, "global_step": 475287, "epoch": 5726} {"train_loss": -26.925378799438477, "global_step": 475288, "epoch": 5726} {"train_loss": -26.606769561767578, "global_step": 475289, "epoch": 5726} {"train_loss": -26.701786041259766, "global_step": 475290, "epoch": 5726} {"train_loss": -27.349695205688477, "global_step": 475291, "epoch": 5726} {"train_loss": -26.93931007385254, "global_step": 475292, "epoch": 5726} {"train_loss": -27.22515296936035, "global_step": 475293, "epoch": 5726} {"train_loss": -27.25703239440918, "global_step": 475294, "epoch": 5726} {"train_loss": -26.669757843017578, "global_step": 475295, "epoch": 5726} {"train_loss": -27.398427963256836, "global_step": 475296, "epoch": 5726} {"train_loss": -27.112024307250977, "global_step": 475297, "epoch": 5726} {"train_loss": -27.219959259033203, "global_step": 475298, "epoch": 5726} {"train_loss": -27.024930953979492, "global_step": 475299, "epoch": 5726} {"train_loss": -26.971866607666016, "global_step": 475300, "epoch": 5726} {"train_loss": -27.08585548400879, "global_step": 475301, "epoch": 5726} {"train_loss": -27.233739852905273, "global_step": 475302, "epoch": 5726} {"train_loss": -27.310428619384766, "global_step": 475303, "epoch": 5726} {"train_loss": -26.7177677154541, "global_step": 475304, "epoch": 5726} {"train_loss": -27.0318603515625, "global_step": 475305, "epoch": 5726} {"train_loss": -27.31744384765625, "global_step": 475306, "epoch": 5726} {"train_loss": -27.36420249938965, "global_step": 475307, "epoch": 5726} {"train_loss": -27.525348663330078, "global_step": 475308, "epoch": 5726} {"train_loss": -26.990758895874023, "global_step": 475309, "epoch": 5726} {"train_loss": -26.749317169189453, "global_step": 475310, "epoch": 5726} {"train_loss": -27.331729888916016, "global_step": 475311, "epoch": 5726} {"train_loss": -27.531518936157227, "global_step": 475312, "epoch": 5726} {"train_loss": -26.85406494140625, "global_step": 475313, "epoch": 5726} {"train_loss": -27.41300392150879, "global_step": 475314, "epoch": 5726} {"train_loss": -26.966215133666992, "global_step": 475315, "epoch": 5726} {"train_loss": -27.17988395690918, "global_step": 475316, "epoch": 5726} {"train_loss": -27.201923370361328, "global_step": 475317, "epoch": 5726} {"train_loss": -26.981618881225586, "global_step": 475318, "epoch": 5726} {"train_loss": -27.01936149597168, "global_step": 475319, "epoch": 5726} {"train_loss": -27.2029972076416, "global_step": 475320, "epoch": 5726} {"train_loss": -27.066919326782227, "global_step": 475321, "epoch": 5726} {"train_loss": -26.9765567779541, "global_step": 475322, "epoch": 5726} {"train_loss": -26.8509521484375, "global_step": 475323, "epoch": 5726} {"train_loss": -27.166061401367188, "global_step": 475324, "epoch": 5726} {"train_loss": -26.96466064453125, "global_step": 475325, "epoch": 5726} {"train_loss": -27.220151901245117, "global_step": 475326, "epoch": 5726} {"train_loss": -27.387189865112305, "global_step": 475327, "epoch": 5726} {"train_loss": -27.149763107299805, "global_step": 475328, "epoch": 5726} {"train_loss": -27.098546981811523, "global_step": 475329, "epoch": 5726} {"train_loss": -27.140522003173828, "global_step": 475330, "epoch": 5726} {"train_loss": -27.27174949645996, "global_step": 475331, "epoch": 5726} {"train_loss": -27.38800621032715, "global_step": 475332, "epoch": 5726} {"train_loss": -26.976598739624023, "global_step": 475333, "epoch": 5726} {"train_loss": -27.18308448791504, "global_step": 475334, "epoch": 5726} {"train_loss": -27.013351440429688, "global_step": 475335, "epoch": 5726} {"train_loss": -27.008249282836914, "global_step": 475336, "epoch": 5726} {"train_loss": -27.12569236755371, "global_step": 475337, "epoch": 5726} {"train_loss": -26.893781661987305, "global_step": 475338, "epoch": 5726} {"train_loss": -27.135847091674805, "global_step": 475339, "epoch": 5726} {"train_loss": -27.167593576821936, "global_step": 475340, "epoch": 5726, "val_loss": 6717499.0} {"train_loss": -26.464696884155273, "global_step": 475341, "epoch": 5727} {"train_loss": -25.917999267578125, "global_step": 475342, "epoch": 5727} {"train_loss": -25.778684616088867, "global_step": 475343, "epoch": 5727} {"train_loss": -25.73223876953125, "global_step": 475344, "epoch": 5727} {"train_loss": -26.22113037109375, "global_step": 475345, "epoch": 5727} {"train_loss": -26.25275993347168, "global_step": 475346, "epoch": 5727} {"train_loss": -26.006399154663086, "global_step": 475347, "epoch": 5727} {"train_loss": -26.202646255493164, "global_step": 475348, "epoch": 5727} {"train_loss": -25.822568893432617, "global_step": 475349, "epoch": 5727} {"train_loss": -26.210126876831055, "global_step": 475350, "epoch": 5727} {"train_loss": -25.806760787963867, "global_step": 475351, "epoch": 5727} {"train_loss": -26.135427474975586, "global_step": 475352, "epoch": 5727} {"train_loss": -26.047977447509766, "global_step": 475353, "epoch": 5727} {"train_loss": -26.065845489501953, "global_step": 475354, "epoch": 5727} {"train_loss": -26.5787296295166, "global_step": 475355, "epoch": 5727} {"train_loss": -26.30216407775879, "global_step": 475356, "epoch": 5727} {"train_loss": -26.585744857788086, "global_step": 475357, "epoch": 5727} {"train_loss": -26.320226669311523, "global_step": 475358, "epoch": 5727} {"train_loss": -27.080230712890625, "global_step": 475359, "epoch": 5727} {"train_loss": -26.373022079467773, "global_step": 475360, "epoch": 5727} {"train_loss": -26.48774528503418, "global_step": 475361, "epoch": 5727} {"train_loss": -26.6656436920166, "global_step": 475362, "epoch": 5727} {"train_loss": -26.888952255249023, "global_step": 475363, "epoch": 5727} {"train_loss": -26.910486221313477, "global_step": 475364, "epoch": 5727} {"train_loss": -26.89046287536621, "global_step": 475365, "epoch": 5727} {"train_loss": -26.10602378845215, "global_step": 475366, "epoch": 5727} {"train_loss": -26.794775009155273, "global_step": 475367, "epoch": 5727} {"train_loss": -27.202611923217773, "global_step": 475368, "epoch": 5727} {"train_loss": -27.212289810180664, "global_step": 475369, "epoch": 5727} {"train_loss": -26.8547420501709, "global_step": 475370, "epoch": 5727} {"train_loss": -27.04878044128418, "global_step": 475371, "epoch": 5727} {"train_loss": -27.119531631469727, "global_step": 475372, "epoch": 5727} {"train_loss": -26.912586212158203, "global_step": 475373, "epoch": 5727} {"train_loss": -26.859771728515625, "global_step": 475374, "epoch": 5727} {"train_loss": -26.974164962768555, "global_step": 475375, "epoch": 5727} {"train_loss": -27.373432159423828, "global_step": 475376, "epoch": 5727} {"train_loss": -26.886096954345703, "global_step": 475377, "epoch": 5727} {"train_loss": -27.07038688659668, "global_step": 475378, "epoch": 5727} {"train_loss": -26.895437240600586, "global_step": 475379, "epoch": 5727} {"train_loss": -27.22858238220215, "global_step": 475380, "epoch": 5727} {"train_loss": -26.824665069580078, "global_step": 475381, "epoch": 5727} {"train_loss": -27.231489181518555, "global_step": 475382, "epoch": 5727} {"train_loss": -27.075244903564453, "global_step": 475383, "epoch": 5727} {"train_loss": -27.28114128112793, "global_step": 475384, "epoch": 5727} {"train_loss": -26.876245498657227, "global_step": 475385, "epoch": 5727} {"train_loss": -27.192838668823242, "global_step": 475386, "epoch": 5727} {"train_loss": -27.08687400817871, "global_step": 475387, "epoch": 5727} {"train_loss": -27.461511611938477, "global_step": 475388, "epoch": 5727} {"train_loss": -27.349884033203125, "global_step": 475389, "epoch": 5727} {"train_loss": -27.31396484375, "global_step": 475390, "epoch": 5727} {"train_loss": -27.266571044921875, "global_step": 475391, "epoch": 5727} {"train_loss": -27.15909194946289, "global_step": 475392, "epoch": 5727} {"train_loss": -27.087512969970703, "global_step": 475393, "epoch": 5727} {"train_loss": -27.050922393798828, "global_step": 475394, "epoch": 5727} {"train_loss": -27.328516006469727, "global_step": 475395, "epoch": 5727} {"train_loss": -27.378583908081055, "global_step": 475396, "epoch": 5727} {"train_loss": -27.71807861328125, "global_step": 475397, "epoch": 5727} {"train_loss": -27.382410049438477, "global_step": 475398, "epoch": 5727} {"train_loss": -27.2768611907959, "global_step": 475399, "epoch": 5727} {"train_loss": -27.178436279296875, "global_step": 475400, "epoch": 5727} {"train_loss": -27.3406982421875, "global_step": 475401, "epoch": 5727} {"train_loss": -27.153852462768555, "global_step": 475402, "epoch": 5727} {"train_loss": -27.01624870300293, "global_step": 475403, "epoch": 5727} {"train_loss": -27.34384536743164, "global_step": 475404, "epoch": 5727} {"train_loss": -27.382898330688477, "global_step": 475405, "epoch": 5727} {"train_loss": -27.542932510375977, "global_step": 475406, "epoch": 5727} {"train_loss": -26.82813835144043, "global_step": 475407, "epoch": 5727} {"train_loss": -27.51495361328125, "global_step": 475408, "epoch": 5727} {"train_loss": -27.144824981689453, "global_step": 475409, "epoch": 5727} {"train_loss": -27.356351852416992, "global_step": 475410, "epoch": 5727} {"train_loss": -27.33254051208496, "global_step": 475411, "epoch": 5727} {"train_loss": -27.41473960876465, "global_step": 475412, "epoch": 5727} {"train_loss": -27.39093017578125, "global_step": 475413, "epoch": 5727} {"train_loss": -27.479663848876953, "global_step": 475414, "epoch": 5727} {"train_loss": -27.191375732421875, "global_step": 475415, "epoch": 5727} {"train_loss": -27.259408950805664, "global_step": 475416, "epoch": 5727} {"train_loss": -27.033411026000977, "global_step": 475417, "epoch": 5727} {"train_loss": -27.306005477905273, "global_step": 475418, "epoch": 5727} {"train_loss": -27.223608016967773, "global_step": 475419, "epoch": 5727} {"train_loss": -27.3552188873291, "global_step": 475420, "epoch": 5727} {"train_loss": -27.304859161376953, "global_step": 475421, "epoch": 5727} {"train_loss": -27.121999740600586, "global_step": 475422, "epoch": 5727} {"train_loss": -26.92365012111434, "global_step": 475423, "epoch": 5727, "val_loss": 6636036.0} {"train_loss": -26.380157470703125, "global_step": 475424, "epoch": 5728} {"train_loss": -26.511327743530273, "global_step": 475425, "epoch": 5728} {"train_loss": -26.552778244018555, "global_step": 475426, "epoch": 5728} {"train_loss": -26.088565826416016, "global_step": 475427, "epoch": 5728} {"train_loss": -26.429122924804688, "global_step": 475428, "epoch": 5728} {"train_loss": -27.07832145690918, "global_step": 475429, "epoch": 5728} {"train_loss": -26.13136100769043, "global_step": 475430, "epoch": 5728} {"train_loss": -26.609033584594727, "global_step": 475431, "epoch": 5728} {"train_loss": -26.338088989257812, "global_step": 475432, "epoch": 5728} {"train_loss": -26.670612335205078, "global_step": 475433, "epoch": 5728} {"train_loss": -26.546796798706055, "global_step": 475434, "epoch": 5728} {"train_loss": -26.804351806640625, "global_step": 475435, "epoch": 5728} {"train_loss": -26.3619384765625, "global_step": 475436, "epoch": 5728} {"train_loss": -27.113574981689453, "global_step": 475437, "epoch": 5728} {"train_loss": -26.57291603088379, "global_step": 475438, "epoch": 5728} {"train_loss": -27.222217559814453, "global_step": 475439, "epoch": 5728} {"train_loss": -26.945226669311523, "global_step": 475440, "epoch": 5728} {"train_loss": -26.838382720947266, "global_step": 475441, "epoch": 5728} {"train_loss": -26.989099502563477, "global_step": 475442, "epoch": 5728} {"train_loss": -26.60492515563965, "global_step": 475443, "epoch": 5728} {"train_loss": -27.29292106628418, "global_step": 475444, "epoch": 5728} {"train_loss": -26.751056671142578, "global_step": 475445, "epoch": 5728} {"train_loss": -27.102752685546875, "global_step": 475446, "epoch": 5728} {"train_loss": -27.00603675842285, "global_step": 475447, "epoch": 5728} {"train_loss": -26.89180564880371, "global_step": 475448, "epoch": 5728} {"train_loss": -26.887800216674805, "global_step": 475449, "epoch": 5728} {"train_loss": -26.983362197875977, "global_step": 475450, "epoch": 5728} {"train_loss": -27.43125343322754, "global_step": 475451, "epoch": 5728} {"train_loss": -27.29095458984375, "global_step": 475452, "epoch": 5728} {"train_loss": -27.228662490844727, "global_step": 475453, "epoch": 5728} {"train_loss": -27.058942794799805, "global_step": 475454, "epoch": 5728} {"train_loss": -27.430952072143555, "global_step": 475455, "epoch": 5728} {"train_loss": -27.353490829467773, "global_step": 475456, "epoch": 5728} {"train_loss": -27.424169540405273, "global_step": 475457, "epoch": 5728} {"train_loss": -27.064523696899414, "global_step": 475458, "epoch": 5728} {"train_loss": -27.287906646728516, "global_step": 475459, "epoch": 5728} {"train_loss": -27.248382568359375, "global_step": 475460, "epoch": 5728} {"train_loss": -27.356760025024414, "global_step": 475461, "epoch": 5728} {"train_loss": -27.482995986938477, "global_step": 475462, "epoch": 5728} {"train_loss": -27.394468307495117, "global_step": 475463, "epoch": 5728} {"train_loss": -27.022857666015625, "global_step": 475464, "epoch": 5728} {"train_loss": -27.37224769592285, "global_step": 475465, "epoch": 5728} {"train_loss": -27.31396484375, "global_step": 475466, "epoch": 5728} {"train_loss": -27.315793991088867, "global_step": 475467, "epoch": 5728} {"train_loss": -27.26472282409668, "global_step": 475468, "epoch": 5728} {"train_loss": -27.239471435546875, "global_step": 475469, "epoch": 5728} {"train_loss": -27.557849884033203, "global_step": 475470, "epoch": 5728} {"train_loss": -27.261022567749023, "global_step": 475471, "epoch": 5728} {"train_loss": -27.23552894592285, "global_step": 475472, "epoch": 5728} {"train_loss": -26.856908798217773, "global_step": 475473, "epoch": 5728} {"train_loss": -26.323999404907227, "global_step": 475474, "epoch": 5728} {"train_loss": -26.914413452148438, "global_step": 475475, "epoch": 5728} {"train_loss": -26.65480613708496, "global_step": 475476, "epoch": 5728} {"train_loss": -27.55372428894043, "global_step": 475477, "epoch": 5728} {"train_loss": -27.333173751831055, "global_step": 475478, "epoch": 5728} {"train_loss": -26.903980255126953, "global_step": 475479, "epoch": 5728} {"train_loss": -26.95709228515625, "global_step": 475480, "epoch": 5728} {"train_loss": -27.371627807617188, "global_step": 475481, "epoch": 5728} {"train_loss": -27.304960250854492, "global_step": 475482, "epoch": 5728} {"train_loss": -27.283857345581055, "global_step": 475483, "epoch": 5728} {"train_loss": -27.1919002532959, "global_step": 475484, "epoch": 5728} {"train_loss": -27.008115768432617, "global_step": 475485, "epoch": 5728} {"train_loss": -27.445775985717773, "global_step": 475486, "epoch": 5728} {"train_loss": -26.9241886138916, "global_step": 475487, "epoch": 5728} {"train_loss": -27.331090927124023, "global_step": 475488, "epoch": 5728} {"train_loss": -27.355993270874023, "global_step": 475489, "epoch": 5728} {"train_loss": -27.09222984313965, "global_step": 475490, "epoch": 5728} {"train_loss": -27.5837345123291, "global_step": 475491, "epoch": 5728} {"train_loss": -27.17067527770996, "global_step": 475492, "epoch": 5728} {"train_loss": -27.158727645874023, "global_step": 475493, "epoch": 5728} {"train_loss": -27.643842697143555, "global_step": 475494, "epoch": 5728} {"train_loss": -27.33436393737793, "global_step": 475495, "epoch": 5728} {"train_loss": -27.306964874267578, "global_step": 475496, "epoch": 5728} {"train_loss": -27.4736385345459, "global_step": 475497, "epoch": 5728} {"train_loss": -26.908231735229492, "global_step": 475498, "epoch": 5728} {"train_loss": -27.42431640625, "global_step": 475499, "epoch": 5728} {"train_loss": -27.32586097717285, "global_step": 475500, "epoch": 5728} {"train_loss": -26.925464630126953, "global_step": 475501, "epoch": 5728} {"train_loss": -27.263792037963867, "global_step": 475502, "epoch": 5728} {"train_loss": -27.109725952148438, "global_step": 475503, "epoch": 5728} {"train_loss": -26.840957641601562, "global_step": 475504, "epoch": 5728} {"train_loss": -26.98905372619629, "global_step": 475505, "epoch": 5728} {"train_loss": -27.065433915839137, "global_step": 475506, "epoch": 5728, "val_loss": 6626386.5} {"train_loss": -26.80203628540039, "global_step": 475507, "epoch": 5729} {"train_loss": -25.3283748626709, "global_step": 475508, "epoch": 5729} {"train_loss": -22.740968704223633, "global_step": 475509, "epoch": 5729} {"train_loss": -23.704553604125977, "global_step": 475510, "epoch": 5729} {"train_loss": -26.99686050415039, "global_step": 475511, "epoch": 5729} {"train_loss": -24.436294555664062, "global_step": 475512, "epoch": 5729} {"train_loss": -26.714893341064453, "global_step": 475513, "epoch": 5729} {"train_loss": -26.09270668029785, "global_step": 475514, "epoch": 5729} {"train_loss": -26.303030014038086, "global_step": 475515, "epoch": 5729} {"train_loss": -26.704248428344727, "global_step": 475516, "epoch": 5729} {"train_loss": -26.300251007080078, "global_step": 475517, "epoch": 5729} {"train_loss": -26.353546142578125, "global_step": 475518, "epoch": 5729} {"train_loss": -26.884923934936523, "global_step": 475519, "epoch": 5729} {"train_loss": -27.016958236694336, "global_step": 475520, "epoch": 5729} {"train_loss": -26.551589965820312, "global_step": 475521, "epoch": 5729} {"train_loss": -26.815692901611328, "global_step": 475522, "epoch": 5729} {"train_loss": -26.79754066467285, "global_step": 475523, "epoch": 5729} {"train_loss": -26.685138702392578, "global_step": 475524, "epoch": 5729} {"train_loss": -26.80268669128418, "global_step": 475525, "epoch": 5729} {"train_loss": -26.60483741760254, "global_step": 475526, "epoch": 5729} {"train_loss": -26.499128341674805, "global_step": 475527, "epoch": 5729} {"train_loss": -27.103540420532227, "global_step": 475528, "epoch": 5729} {"train_loss": -26.645008087158203, "global_step": 475529, "epoch": 5729} {"train_loss": -26.731597900390625, "global_step": 475530, "epoch": 5729} {"train_loss": -26.29469108581543, "global_step": 475531, "epoch": 5729} {"train_loss": -26.609893798828125, "global_step": 475532, "epoch": 5729} {"train_loss": -26.415771484375, "global_step": 475533, "epoch": 5729} {"train_loss": -26.995203018188477, "global_step": 475534, "epoch": 5729} {"train_loss": -26.944202423095703, "global_step": 475535, "epoch": 5729} {"train_loss": -27.16596031188965, "global_step": 475536, "epoch": 5729} {"train_loss": -27.021982192993164, "global_step": 475537, "epoch": 5729} {"train_loss": -26.7634220123291, "global_step": 475538, "epoch": 5729} {"train_loss": -27.024892807006836, "global_step": 475539, "epoch": 5729} {"train_loss": -26.55780029296875, "global_step": 475540, "epoch": 5729} {"train_loss": -27.015371322631836, "global_step": 475541, "epoch": 5729} {"train_loss": -27.068143844604492, "global_step": 475542, "epoch": 5729} {"train_loss": -27.35474967956543, "global_step": 475543, "epoch": 5729} {"train_loss": -27.30781364440918, "global_step": 475544, "epoch": 5729} {"train_loss": -26.843103408813477, "global_step": 475545, "epoch": 5729} {"train_loss": -26.993072509765625, "global_step": 475546, "epoch": 5729} {"train_loss": -26.830366134643555, "global_step": 475547, "epoch": 5729} {"train_loss": -27.114181518554688, "global_step": 475548, "epoch": 5729} {"train_loss": -27.379901885986328, "global_step": 475549, "epoch": 5729} {"train_loss": -26.86161231994629, "global_step": 475550, "epoch": 5729} {"train_loss": -26.846189498901367, "global_step": 475551, "epoch": 5729} {"train_loss": -26.950010299682617, "global_step": 475552, "epoch": 5729} {"train_loss": -27.533308029174805, "global_step": 475553, "epoch": 5729} {"train_loss": -26.86680030822754, "global_step": 475554, "epoch": 5729} {"train_loss": -27.285314559936523, "global_step": 475555, "epoch": 5729} {"train_loss": -26.879552841186523, "global_step": 475556, "epoch": 5729} {"train_loss": -26.293182373046875, "global_step": 475557, "epoch": 5729} {"train_loss": -26.497900009155273, "global_step": 475558, "epoch": 5729} {"train_loss": -26.549896240234375, "global_step": 475559, "epoch": 5729} {"train_loss": -27.08845329284668, "global_step": 475560, "epoch": 5729} {"train_loss": -26.99481773376465, "global_step": 475561, "epoch": 5729} {"train_loss": -27.467817306518555, "global_step": 475562, "epoch": 5729} {"train_loss": -27.0718994140625, "global_step": 475563, "epoch": 5729} {"train_loss": -27.005523681640625, "global_step": 475564, "epoch": 5729} {"train_loss": -27.290510177612305, "global_step": 475565, "epoch": 5729} {"train_loss": -27.434125900268555, "global_step": 475566, "epoch": 5729} {"train_loss": -27.394943237304688, "global_step": 475567, "epoch": 5729} {"train_loss": -27.68570899963379, "global_step": 475568, "epoch": 5729} {"train_loss": -27.368127822875977, "global_step": 475569, "epoch": 5729} {"train_loss": -27.343189239501953, "global_step": 475570, "epoch": 5729} {"train_loss": -27.213226318359375, "global_step": 475571, "epoch": 5729} {"train_loss": -27.251577377319336, "global_step": 475572, "epoch": 5729} {"train_loss": -27.72308921813965, "global_step": 475573, "epoch": 5729} {"train_loss": -27.17104148864746, "global_step": 475574, "epoch": 5729} {"train_loss": -27.025222778320312, "global_step": 475575, "epoch": 5729} {"train_loss": -26.953155517578125, "global_step": 475576, "epoch": 5729} {"train_loss": -27.34744644165039, "global_step": 475577, "epoch": 5729} {"train_loss": -27.441455841064453, "global_step": 475578, "epoch": 5729} {"train_loss": -27.054168701171875, "global_step": 475579, "epoch": 5729} {"train_loss": -27.419330596923828, "global_step": 475580, "epoch": 5729} {"train_loss": -27.298185348510742, "global_step": 475581, "epoch": 5729} {"train_loss": -27.38411521911621, "global_step": 475582, "epoch": 5729} {"train_loss": -27.433603286743164, "global_step": 475583, "epoch": 5729} {"train_loss": -27.158849716186523, "global_step": 475584, "epoch": 5729} {"train_loss": -27.813520431518555, "global_step": 475585, "epoch": 5729} {"train_loss": -26.9020938873291, "global_step": 475586, "epoch": 5729} {"train_loss": -27.058441162109375, "global_step": 475587, "epoch": 5729} {"train_loss": -26.57193374633789, "global_step": 475588, "epoch": 5729} {"train_loss": -26.82538533498006, "global_step": 475589, "epoch": 5729, "val_loss": 6650932.0} {"train_loss": -26.479949951171875, "global_step": 475590, "epoch": 5730} {"train_loss": -25.542160034179688, "global_step": 475591, "epoch": 5730} {"train_loss": -25.72669792175293, "global_step": 475592, "epoch": 5730} {"train_loss": -25.757831573486328, "global_step": 475593, "epoch": 5730} {"train_loss": -26.232257843017578, "global_step": 475594, "epoch": 5730} {"train_loss": -26.057998657226562, "global_step": 475595, "epoch": 5730} {"train_loss": -26.25554847717285, "global_step": 475596, "epoch": 5730} {"train_loss": -26.473480224609375, "global_step": 475597, "epoch": 5730} {"train_loss": -26.6091251373291, "global_step": 475598, "epoch": 5730} {"train_loss": -26.68523597717285, "global_step": 475599, "epoch": 5730} {"train_loss": -26.22700309753418, "global_step": 475600, "epoch": 5730} {"train_loss": -26.897214889526367, "global_step": 475601, "epoch": 5730} {"train_loss": -26.424579620361328, "global_step": 475602, "epoch": 5730} {"train_loss": -26.81467056274414, "global_step": 475603, "epoch": 5730} {"train_loss": -26.711416244506836, "global_step": 475604, "epoch": 5730} {"train_loss": -26.487060546875, "global_step": 475605, "epoch": 5730} {"train_loss": -26.8362979888916, "global_step": 475606, "epoch": 5730} {"train_loss": -26.761890411376953, "global_step": 475607, "epoch": 5730} {"train_loss": -26.88306999206543, "global_step": 475608, "epoch": 5730} {"train_loss": -26.978260040283203, "global_step": 475609, "epoch": 5730} {"train_loss": -27.030853271484375, "global_step": 475610, "epoch": 5730} {"train_loss": -26.812780380249023, "global_step": 475611, "epoch": 5730} {"train_loss": -27.051984786987305, "global_step": 475612, "epoch": 5730} {"train_loss": -26.737974166870117, "global_step": 475613, "epoch": 5730} {"train_loss": -26.9455509185791, "global_step": 475614, "epoch": 5730} {"train_loss": -26.826257705688477, "global_step": 475615, "epoch": 5730} {"train_loss": -26.748188018798828, "global_step": 475616, "epoch": 5730} {"train_loss": -26.87404441833496, "global_step": 475617, "epoch": 5730} {"train_loss": -26.89509391784668, "global_step": 475618, "epoch": 5730} {"train_loss": -26.976608276367188, "global_step": 475619, "epoch": 5730} {"train_loss": -27.256244659423828, "global_step": 475620, "epoch": 5730} {"train_loss": -27.152908325195312, "global_step": 475621, "epoch": 5730} {"train_loss": -27.087682723999023, "global_step": 475622, "epoch": 5730} {"train_loss": -27.30329704284668, "global_step": 475623, "epoch": 5730} {"train_loss": -27.127685546875, "global_step": 475624, "epoch": 5730} {"train_loss": -27.02069664001465, "global_step": 475625, "epoch": 5730} {"train_loss": -27.306211471557617, "global_step": 475626, "epoch": 5730} {"train_loss": -27.273365020751953, "global_step": 475627, "epoch": 5730} {"train_loss": -27.12837791442871, "global_step": 475628, "epoch": 5730} {"train_loss": -26.778839111328125, "global_step": 475629, "epoch": 5730} {"train_loss": -27.476865768432617, "global_step": 475630, "epoch": 5730} {"train_loss": -27.252859115600586, "global_step": 475631, "epoch": 5730} {"train_loss": -27.337360382080078, "global_step": 475632, "epoch": 5730} {"train_loss": -27.162832260131836, "global_step": 475633, "epoch": 5730} {"train_loss": -27.178442001342773, "global_step": 475634, "epoch": 5730} {"train_loss": -27.47833251953125, "global_step": 475635, "epoch": 5730} {"train_loss": -27.432193756103516, "global_step": 475636, "epoch": 5730} {"train_loss": -27.202823638916016, "global_step": 475637, "epoch": 5730} {"train_loss": -27.095972061157227, "global_step": 475638, "epoch": 5730} {"train_loss": -27.466434478759766, "global_step": 475639, "epoch": 5730} {"train_loss": -27.470020294189453, "global_step": 475640, "epoch": 5730} {"train_loss": -27.44695472717285, "global_step": 475641, "epoch": 5730} {"train_loss": -27.017240524291992, "global_step": 475642, "epoch": 5730} {"train_loss": -27.227975845336914, "global_step": 475643, "epoch": 5730} {"train_loss": -27.426801681518555, "global_step": 475644, "epoch": 5730} {"train_loss": -27.28907585144043, "global_step": 475645, "epoch": 5730} {"train_loss": -27.53020668029785, "global_step": 475646, "epoch": 5730} {"train_loss": -27.717529296875, "global_step": 475647, "epoch": 5730} {"train_loss": -27.479284286499023, "global_step": 475648, "epoch": 5730} {"train_loss": -27.248580932617188, "global_step": 475649, "epoch": 5730} {"train_loss": -27.01520347595215, "global_step": 475650, "epoch": 5730} {"train_loss": -27.17559814453125, "global_step": 475651, "epoch": 5730} {"train_loss": -27.4334659576416, "global_step": 475652, "epoch": 5730} {"train_loss": -27.37113380432129, "global_step": 475653, "epoch": 5730} {"train_loss": -27.19697380065918, "global_step": 475654, "epoch": 5730} {"train_loss": -26.986499786376953, "global_step": 475655, "epoch": 5730} {"train_loss": -27.43794822692871, "global_step": 475656, "epoch": 5730} {"train_loss": -27.026660919189453, "global_step": 475657, "epoch": 5730} {"train_loss": -27.171161651611328, "global_step": 475658, "epoch": 5730} {"train_loss": -27.668521881103516, "global_step": 475659, "epoch": 5730} {"train_loss": -27.63355827331543, "global_step": 475660, "epoch": 5730} {"train_loss": -26.9958438873291, "global_step": 475661, "epoch": 5730} {"train_loss": -27.502492904663086, "global_step": 475662, "epoch": 5730} {"train_loss": -27.493749618530273, "global_step": 475663, "epoch": 5730} {"train_loss": -27.046659469604492, "global_step": 475664, "epoch": 5730} {"train_loss": -26.749073028564453, "global_step": 475665, "epoch": 5730} {"train_loss": -27.175214767456055, "global_step": 475666, "epoch": 5730} {"train_loss": -27.45880699157715, "global_step": 475667, "epoch": 5730} {"train_loss": -27.2499942779541, "global_step": 475668, "epoch": 5730} {"train_loss": -27.537336349487305, "global_step": 475669, "epoch": 5730} {"train_loss": -27.677576065063477, "global_step": 475670, "epoch": 5730} {"train_loss": -27.228927612304688, "global_step": 475671, "epoch": 5730} {"train_loss": -27.02130322284009, "global_step": 475672, "epoch": 5730, "val_loss": 6740518.0} {"train_loss": -24.44550895690918, "global_step": 475673, "epoch": 5731} {"train_loss": -24.89181900024414, "global_step": 475674, "epoch": 5731} {"train_loss": -26.3184757232666, "global_step": 475675, "epoch": 5731} {"train_loss": -25.517335891723633, "global_step": 475676, "epoch": 5731} {"train_loss": -26.027578353881836, "global_step": 475677, "epoch": 5731} {"train_loss": -26.07547950744629, "global_step": 475678, "epoch": 5731} {"train_loss": -25.992542266845703, "global_step": 475679, "epoch": 5731} {"train_loss": -26.347684860229492, "global_step": 475680, "epoch": 5731} {"train_loss": -26.519418716430664, "global_step": 475681, "epoch": 5731} {"train_loss": -26.308435440063477, "global_step": 475682, "epoch": 5731} {"train_loss": -26.331806182861328, "global_step": 475683, "epoch": 5731} {"train_loss": -26.683378219604492, "global_step": 475684, "epoch": 5731} {"train_loss": -26.165319442749023, "global_step": 475685, "epoch": 5731} {"train_loss": -26.97845458984375, "global_step": 475686, "epoch": 5731} {"train_loss": -26.504194259643555, "global_step": 475687, "epoch": 5731} {"train_loss": -26.574743270874023, "global_step": 475688, "epoch": 5731} {"train_loss": -26.62322425842285, "global_step": 475689, "epoch": 5731} {"train_loss": -26.884918212890625, "global_step": 475690, "epoch": 5731} {"train_loss": -26.522647857666016, "global_step": 475691, "epoch": 5731} {"train_loss": -26.949934005737305, "global_step": 475692, "epoch": 5731} {"train_loss": -26.877222061157227, "global_step": 475693, "epoch": 5731} {"train_loss": -26.940692901611328, "global_step": 475694, "epoch": 5731} {"train_loss": -26.964075088500977, "global_step": 475695, "epoch": 5731} {"train_loss": -27.154691696166992, "global_step": 475696, "epoch": 5731} {"train_loss": -26.847265243530273, "global_step": 475697, "epoch": 5731} {"train_loss": -27.1075382232666, "global_step": 475698, "epoch": 5731} {"train_loss": -27.081085205078125, "global_step": 475699, "epoch": 5731} {"train_loss": -27.257322311401367, "global_step": 475700, "epoch": 5731} {"train_loss": -26.688190460205078, "global_step": 475701, "epoch": 5731} {"train_loss": -27.0218448638916, "global_step": 475702, "epoch": 5731} {"train_loss": -27.21030044555664, "global_step": 475703, "epoch": 5731} {"train_loss": -27.385498046875, "global_step": 475704, "epoch": 5731} {"train_loss": -27.43477439880371, "global_step": 475705, "epoch": 5731} {"train_loss": -27.537466049194336, "global_step": 475706, "epoch": 5731} {"train_loss": -26.97688865661621, "global_step": 475707, "epoch": 5731} {"train_loss": -27.336084365844727, "global_step": 475708, "epoch": 5731} {"train_loss": -27.3580379486084, "global_step": 475709, "epoch": 5731} {"train_loss": -26.872791290283203, "global_step": 475710, "epoch": 5731} {"train_loss": -27.120609283447266, "global_step": 475711, "epoch": 5731} {"train_loss": -27.0142879486084, "global_step": 475712, "epoch": 5731} {"train_loss": -27.6292781829834, "global_step": 475713, "epoch": 5731} {"train_loss": -27.10422706604004, "global_step": 475714, "epoch": 5731} {"train_loss": -27.33765983581543, "global_step": 475715, "epoch": 5731} {"train_loss": -27.2778377532959, "global_step": 475716, "epoch": 5731} {"train_loss": -27.248937606811523, "global_step": 475717, "epoch": 5731} {"train_loss": -27.303205490112305, "global_step": 475718, "epoch": 5731} {"train_loss": -27.146841049194336, "global_step": 475719, "epoch": 5731} {"train_loss": -27.33595085144043, "global_step": 475720, "epoch": 5731} {"train_loss": -27.611175537109375, "global_step": 475721, "epoch": 5731} {"train_loss": -27.7459716796875, "global_step": 475722, "epoch": 5731} {"train_loss": -27.3380126953125, "global_step": 475723, "epoch": 5731} {"train_loss": -27.32794189453125, "global_step": 475724, "epoch": 5731} {"train_loss": -27.523468017578125, "global_step": 475725, "epoch": 5731} {"train_loss": -27.380233764648438, "global_step": 475726, "epoch": 5731} {"train_loss": -27.319360733032227, "global_step": 475727, "epoch": 5731} {"train_loss": -27.5842227935791, "global_step": 475728, "epoch": 5731} {"train_loss": -27.10152244567871, "global_step": 475729, "epoch": 5731} {"train_loss": -27.04424476623535, "global_step": 475730, "epoch": 5731} {"train_loss": -27.6625919342041, "global_step": 475731, "epoch": 5731} {"train_loss": -27.528242111206055, "global_step": 475732, "epoch": 5731} {"train_loss": -27.15878677368164, "global_step": 475733, "epoch": 5731} {"train_loss": -26.897375106811523, "global_step": 475734, "epoch": 5731} {"train_loss": -27.2390079498291, "global_step": 475735, "epoch": 5731} {"train_loss": -26.742984771728516, "global_step": 475736, "epoch": 5731} {"train_loss": -26.865766525268555, "global_step": 475737, "epoch": 5731} {"train_loss": -27.494916915893555, "global_step": 475738, "epoch": 5731} {"train_loss": -27.411062240600586, "global_step": 475739, "epoch": 5731} {"train_loss": -27.0610294342041, "global_step": 475740, "epoch": 5731} {"train_loss": -26.675861358642578, "global_step": 475741, "epoch": 5731} {"train_loss": -27.169666290283203, "global_step": 475742, "epoch": 5731} {"train_loss": -27.407180786132812, "global_step": 475743, "epoch": 5731} {"train_loss": -27.292234420776367, "global_step": 475744, "epoch": 5731} {"train_loss": -27.6046085357666, "global_step": 475745, "epoch": 5731} {"train_loss": -27.1339111328125, "global_step": 475746, "epoch": 5731} {"train_loss": -26.920988082885742, "global_step": 475747, "epoch": 5731} {"train_loss": -27.141082763671875, "global_step": 475748, "epoch": 5731} {"train_loss": -27.372323989868164, "global_step": 475749, "epoch": 5731} {"train_loss": -27.345993041992188, "global_step": 475750, "epoch": 5731} {"train_loss": -26.93014907836914, "global_step": 475751, "epoch": 5731} {"train_loss": -27.244110107421875, "global_step": 475752, "epoch": 5731} {"train_loss": -27.493698120117188, "global_step": 475753, "epoch": 5731} {"train_loss": -27.2888126373291, "global_step": 475754, "epoch": 5731} {"train_loss": -26.97120413722762, "global_step": 475755, "epoch": 5731, "val_loss": 6631263.0} {"train_loss": -26.682022094726562, "global_step": 475756, "epoch": 5732} {"train_loss": -27.124927520751953, "global_step": 475757, "epoch": 5732} {"train_loss": -26.961151123046875, "global_step": 475758, "epoch": 5732} {"train_loss": -27.116607666015625, "global_step": 475759, "epoch": 5732} {"train_loss": -26.780431747436523, "global_step": 475760, "epoch": 5732} {"train_loss": -27.04486083984375, "global_step": 475761, "epoch": 5732} {"train_loss": -26.763431549072266, "global_step": 475762, "epoch": 5732} {"train_loss": -27.115873336791992, "global_step": 475763, "epoch": 5732} {"train_loss": -27.18195152282715, "global_step": 475764, "epoch": 5732} {"train_loss": -27.01905632019043, "global_step": 475765, "epoch": 5732} {"train_loss": -27.05225944519043, "global_step": 475766, "epoch": 5732} {"train_loss": -27.29535484313965, "global_step": 475767, "epoch": 5732} {"train_loss": -27.081445693969727, "global_step": 475768, "epoch": 5732} {"train_loss": -27.083648681640625, "global_step": 475769, "epoch": 5732} {"train_loss": -27.213550567626953, "global_step": 475770, "epoch": 5732} {"train_loss": -27.16863441467285, "global_step": 475771, "epoch": 5732} {"train_loss": -27.09833335876465, "global_step": 475772, "epoch": 5732} {"train_loss": -27.157346725463867, "global_step": 475773, "epoch": 5732} {"train_loss": -27.173572540283203, "global_step": 475774, "epoch": 5732} {"train_loss": -27.53949546813965, "global_step": 475775, "epoch": 5732} {"train_loss": -27.174560546875, "global_step": 475776, "epoch": 5732} {"train_loss": -27.230337142944336, "global_step": 475777, "epoch": 5732} {"train_loss": -27.481430053710938, "global_step": 475778, "epoch": 5732} {"train_loss": -26.90809440612793, "global_step": 475779, "epoch": 5732} {"train_loss": -27.277097702026367, "global_step": 475780, "epoch": 5732} {"train_loss": -27.52703285217285, "global_step": 475781, "epoch": 5732} {"train_loss": -27.40754508972168, "global_step": 475782, "epoch": 5732} {"train_loss": -27.339242935180664, "global_step": 475783, "epoch": 5732} {"train_loss": -27.2606258392334, "global_step": 475784, "epoch": 5732} {"train_loss": -27.61212158203125, "global_step": 475785, "epoch": 5732} {"train_loss": -27.346731185913086, "global_step": 475786, "epoch": 5732} {"train_loss": -27.65215492248535, "global_step": 475787, "epoch": 5732} {"train_loss": -27.2994441986084, "global_step": 475788, "epoch": 5732} {"train_loss": -27.47572135925293, "global_step": 475789, "epoch": 5732} {"train_loss": -27.277868270874023, "global_step": 475790, "epoch": 5732} {"train_loss": -27.34531593322754, "global_step": 475791, "epoch": 5732} {"train_loss": -27.5521297454834, "global_step": 475792, "epoch": 5732} {"train_loss": -27.249433517456055, "global_step": 475793, "epoch": 5732} {"train_loss": -27.285200119018555, "global_step": 475794, "epoch": 5732} {"train_loss": -27.099714279174805, "global_step": 475795, "epoch": 5732} {"train_loss": -27.419692993164062, "global_step": 475796, "epoch": 5732} {"train_loss": -27.596027374267578, "global_step": 475797, "epoch": 5732} {"train_loss": -27.017988204956055, "global_step": 475798, "epoch": 5732} {"train_loss": -27.372272491455078, "global_step": 475799, "epoch": 5732} {"train_loss": -27.13679313659668, "global_step": 475800, "epoch": 5732} {"train_loss": -27.027856826782227, "global_step": 475801, "epoch": 5732} {"train_loss": -27.103790283203125, "global_step": 475802, "epoch": 5732} {"train_loss": -27.7316837310791, "global_step": 475803, "epoch": 5732} {"train_loss": -27.307144165039062, "global_step": 475804, "epoch": 5732} {"train_loss": -26.979511260986328, "global_step": 475805, "epoch": 5732} {"train_loss": -26.908294677734375, "global_step": 475806, "epoch": 5732} {"train_loss": -27.218204498291016, "global_step": 475807, "epoch": 5732} {"train_loss": -27.284870147705078, "global_step": 475808, "epoch": 5732} {"train_loss": -27.70947265625, "global_step": 475809, "epoch": 5732} {"train_loss": -27.397321701049805, "global_step": 475810, "epoch": 5732} {"train_loss": -27.1458683013916, "global_step": 475811, "epoch": 5732} {"train_loss": -27.383092880249023, "global_step": 475812, "epoch": 5732} {"train_loss": -27.229150772094727, "global_step": 475813, "epoch": 5732} {"train_loss": -27.571598052978516, "global_step": 475814, "epoch": 5732} {"train_loss": -27.06683349609375, "global_step": 475815, "epoch": 5732} {"train_loss": -27.262033462524414, "global_step": 475816, "epoch": 5732} {"train_loss": -27.26483154296875, "global_step": 475817, "epoch": 5732} {"train_loss": -27.546649932861328, "global_step": 475818, "epoch": 5732} {"train_loss": -27.286788940429688, "global_step": 475819, "epoch": 5732} {"train_loss": -27.681671142578125, "global_step": 475820, "epoch": 5732} {"train_loss": -27.473398208618164, "global_step": 475821, "epoch": 5732} {"train_loss": -27.233442306518555, "global_step": 475822, "epoch": 5732} {"train_loss": -27.50176429748535, "global_step": 475823, "epoch": 5732} {"train_loss": -27.18976402282715, "global_step": 475824, "epoch": 5732} {"train_loss": -27.51338005065918, "global_step": 475825, "epoch": 5732} {"train_loss": -27.384031295776367, "global_step": 475826, "epoch": 5732} {"train_loss": -27.67167091369629, "global_step": 475827, "epoch": 5732} {"train_loss": -27.195459365844727, "global_step": 475828, "epoch": 5732} {"train_loss": -27.29903221130371, "global_step": 475829, "epoch": 5732} {"train_loss": -27.095504760742188, "global_step": 475830, "epoch": 5732} {"train_loss": -27.481298446655273, "global_step": 475831, "epoch": 5732} {"train_loss": -27.715091705322266, "global_step": 475832, "epoch": 5732} {"train_loss": -27.567670822143555, "global_step": 475833, "epoch": 5732} {"train_loss": -27.585935592651367, "global_step": 475834, "epoch": 5732} {"train_loss": -27.376962661743164, "global_step": 475835, "epoch": 5732} {"train_loss": -27.007129669189453, "global_step": 475836, "epoch": 5732} {"train_loss": -27.189651489257812, "global_step": 475837, "epoch": 5732} {"train_loss": -27.263992631291767, "global_step": 475838, "epoch": 5732, "val_loss": 6702636.0} {"train_loss": -26.85239601135254, "global_step": 475839, "epoch": 5733} {"train_loss": -26.296857833862305, "global_step": 475840, "epoch": 5733} {"train_loss": -26.582645416259766, "global_step": 475841, "epoch": 5733} {"train_loss": -26.63604736328125, "global_step": 475842, "epoch": 5733} {"train_loss": -26.29669761657715, "global_step": 475843, "epoch": 5733} {"train_loss": -26.5799617767334, "global_step": 475844, "epoch": 5733} {"train_loss": -26.918354034423828, "global_step": 475845, "epoch": 5733} {"train_loss": -27.04583740234375, "global_step": 475846, "epoch": 5733} {"train_loss": -26.639007568359375, "global_step": 475847, "epoch": 5733} {"train_loss": -26.27229881286621, "global_step": 475848, "epoch": 5733} {"train_loss": -26.91340446472168, "global_step": 475849, "epoch": 5733} {"train_loss": -26.234821319580078, "global_step": 475850, "epoch": 5733} {"train_loss": -26.690229415893555, "global_step": 475851, "epoch": 5733} {"train_loss": -27.03423500061035, "global_step": 475852, "epoch": 5733} {"train_loss": -26.782506942749023, "global_step": 475853, "epoch": 5733} {"train_loss": -26.7882022857666, "global_step": 475854, "epoch": 5733} {"train_loss": -26.76751708984375, "global_step": 475855, "epoch": 5733} {"train_loss": -27.080549240112305, "global_step": 475856, "epoch": 5733} {"train_loss": -26.892663955688477, "global_step": 475857, "epoch": 5733} {"train_loss": -27.135534286499023, "global_step": 475858, "epoch": 5733} {"train_loss": -27.086750030517578, "global_step": 475859, "epoch": 5733} {"train_loss": -26.92350196838379, "global_step": 475860, "epoch": 5733} {"train_loss": -26.950698852539062, "global_step": 475861, "epoch": 5733} {"train_loss": -26.9412841796875, "global_step": 475862, "epoch": 5733} {"train_loss": -27.110126495361328, "global_step": 475863, "epoch": 5733} {"train_loss": -27.180007934570312, "global_step": 475864, "epoch": 5733} {"train_loss": -27.173166275024414, "global_step": 475865, "epoch": 5733} {"train_loss": -26.94060707092285, "global_step": 475866, "epoch": 5733} {"train_loss": -27.042516708374023, "global_step": 475867, "epoch": 5733} {"train_loss": -27.31494140625, "global_step": 475868, "epoch": 5733} {"train_loss": -27.201568603515625, "global_step": 475869, "epoch": 5733} {"train_loss": -27.08148193359375, "global_step": 475870, "epoch": 5733} {"train_loss": -27.34807777404785, "global_step": 475871, "epoch": 5733} {"train_loss": -26.9414005279541, "global_step": 475872, "epoch": 5733} {"train_loss": -27.240610122680664, "global_step": 475873, "epoch": 5733} {"train_loss": -27.262022018432617, "global_step": 475874, "epoch": 5733} {"train_loss": -26.838361740112305, "global_step": 475875, "epoch": 5733} {"train_loss": -26.565515518188477, "global_step": 475876, "epoch": 5733} {"train_loss": -27.20057487487793, "global_step": 475877, "epoch": 5733} {"train_loss": -27.32379722595215, "global_step": 475878, "epoch": 5733} {"train_loss": -27.184341430664062, "global_step": 475879, "epoch": 5733} {"train_loss": -27.434545516967773, "global_step": 475880, "epoch": 5733} {"train_loss": -26.817228317260742, "global_step": 475881, "epoch": 5733} {"train_loss": -27.156707763671875, "global_step": 475882, "epoch": 5733} {"train_loss": -27.335126876831055, "global_step": 475883, "epoch": 5733} {"train_loss": -27.018701553344727, "global_step": 475884, "epoch": 5733} {"train_loss": -27.10358238220215, "global_step": 475885, "epoch": 5733} {"train_loss": -26.866668701171875, "global_step": 475886, "epoch": 5733} {"train_loss": -27.28647232055664, "global_step": 475887, "epoch": 5733} {"train_loss": -26.791675567626953, "global_step": 475888, "epoch": 5733} {"train_loss": -27.1995792388916, "global_step": 475889, "epoch": 5733} {"train_loss": -27.3546142578125, "global_step": 475890, "epoch": 5733} {"train_loss": -27.09454917907715, "global_step": 475891, "epoch": 5733} {"train_loss": -27.373640060424805, "global_step": 475892, "epoch": 5733} {"train_loss": -27.62562370300293, "global_step": 475893, "epoch": 5733} {"train_loss": -27.30838966369629, "global_step": 475894, "epoch": 5733} {"train_loss": -27.430774688720703, "global_step": 475895, "epoch": 5733} {"train_loss": -27.407567977905273, "global_step": 475896, "epoch": 5733} {"train_loss": -27.33404541015625, "global_step": 475897, "epoch": 5733} {"train_loss": -27.028411865234375, "global_step": 475898, "epoch": 5733} {"train_loss": -27.405012130737305, "global_step": 475899, "epoch": 5733} {"train_loss": -27.30923843383789, "global_step": 475900, "epoch": 5733} {"train_loss": -27.331283569335938, "global_step": 475901, "epoch": 5733} {"train_loss": -27.631982803344727, "global_step": 475902, "epoch": 5733} {"train_loss": -27.20820426940918, "global_step": 475903, "epoch": 5733} {"train_loss": -27.03423500061035, "global_step": 475904, "epoch": 5733} {"train_loss": -27.350860595703125, "global_step": 475905, "epoch": 5733} {"train_loss": -27.779067993164062, "global_step": 475906, "epoch": 5733} {"train_loss": -27.191991806030273, "global_step": 475907, "epoch": 5733} {"train_loss": -27.092233657836914, "global_step": 475908, "epoch": 5733} {"train_loss": -27.06534194946289, "global_step": 475909, "epoch": 5733} {"train_loss": -27.217029571533203, "global_step": 475910, "epoch": 5733} {"train_loss": -27.42121696472168, "global_step": 475911, "epoch": 5733} {"train_loss": -27.238107681274414, "global_step": 475912, "epoch": 5733} {"train_loss": -27.011341094970703, "global_step": 475913, "epoch": 5733} {"train_loss": -27.424301147460938, "global_step": 475914, "epoch": 5733} {"train_loss": -27.249893188476562, "global_step": 475915, "epoch": 5733} {"train_loss": -27.462650299072266, "global_step": 475916, "epoch": 5733} {"train_loss": -26.796533584594727, "global_step": 475917, "epoch": 5733} {"train_loss": -27.513751983642578, "global_step": 475918, "epoch": 5733} {"train_loss": -27.18915367126465, "global_step": 475919, "epoch": 5733} {"train_loss": -27.215991973876953, "global_step": 475920, "epoch": 5733} {"train_loss": -27.08199296514672, "global_step": 475921, "epoch": 5733, "val_loss": 6649084.0} {"train_loss": -26.484134674072266, "global_step": 475922, "epoch": 5734} {"train_loss": -26.306415557861328, "global_step": 475923, "epoch": 5734} {"train_loss": -25.988178253173828, "global_step": 475924, "epoch": 5734} {"train_loss": -26.77384376525879, "global_step": 475925, "epoch": 5734} {"train_loss": -25.912952423095703, "global_step": 475926, "epoch": 5734} {"train_loss": -25.50950813293457, "global_step": 475927, "epoch": 5734} {"train_loss": -26.57754898071289, "global_step": 475928, "epoch": 5734} {"train_loss": -26.300085067749023, "global_step": 475929, "epoch": 5734} {"train_loss": -26.727542877197266, "global_step": 475930, "epoch": 5734} {"train_loss": -26.515033721923828, "global_step": 475931, "epoch": 5734} {"train_loss": -26.9002742767334, "global_step": 475932, "epoch": 5734} {"train_loss": -26.516773223876953, "global_step": 475933, "epoch": 5734} {"train_loss": -26.49969482421875, "global_step": 475934, "epoch": 5734} {"train_loss": -26.584732055664062, "global_step": 475935, "epoch": 5734} {"train_loss": -26.68390464782715, "global_step": 475936, "epoch": 5734} {"train_loss": -26.871200561523438, "global_step": 475937, "epoch": 5734} {"train_loss": -26.859464645385742, "global_step": 475938, "epoch": 5734} {"train_loss": -27.004318237304688, "global_step": 475939, "epoch": 5734} {"train_loss": -26.74361228942871, "global_step": 475940, "epoch": 5734} {"train_loss": -26.720569610595703, "global_step": 475941, "epoch": 5734} {"train_loss": -26.838205337524414, "global_step": 475942, "epoch": 5734} {"train_loss": -26.421646118164062, "global_step": 475943, "epoch": 5734} {"train_loss": -27.13788414001465, "global_step": 475944, "epoch": 5734} {"train_loss": -26.188034057617188, "global_step": 475945, "epoch": 5734} {"train_loss": -26.95896339416504, "global_step": 475946, "epoch": 5734} {"train_loss": -26.730579376220703, "global_step": 475947, "epoch": 5734} {"train_loss": -27.28006935119629, "global_step": 475948, "epoch": 5734} {"train_loss": -26.981353759765625, "global_step": 475949, "epoch": 5734} {"train_loss": -27.424015045166016, "global_step": 475950, "epoch": 5734} {"train_loss": -27.41179847717285, "global_step": 475951, "epoch": 5734} {"train_loss": -27.14887809753418, "global_step": 475952, "epoch": 5734} {"train_loss": -27.208898544311523, "global_step": 475953, "epoch": 5734} {"train_loss": -27.212385177612305, "global_step": 475954, "epoch": 5734} {"train_loss": -26.75530433654785, "global_step": 475955, "epoch": 5734} {"train_loss": -26.798349380493164, "global_step": 475956, "epoch": 5734} {"train_loss": -27.497882843017578, "global_step": 475957, "epoch": 5734} {"train_loss": -27.467374801635742, "global_step": 475958, "epoch": 5734} {"train_loss": -27.3830509185791, "global_step": 475959, "epoch": 5734} {"train_loss": -27.025043487548828, "global_step": 475960, "epoch": 5734} {"train_loss": -27.375898361206055, "global_step": 475961, "epoch": 5734} {"train_loss": -27.482324600219727, "global_step": 475962, "epoch": 5734} {"train_loss": -27.174198150634766, "global_step": 475963, "epoch": 5734} {"train_loss": -27.266925811767578, "global_step": 475964, "epoch": 5734} {"train_loss": -26.904428482055664, "global_step": 475965, "epoch": 5734} {"train_loss": -27.122528076171875, "global_step": 475966, "epoch": 5734} {"train_loss": -27.21223258972168, "global_step": 475967, "epoch": 5734} {"train_loss": -27.125547409057617, "global_step": 475968, "epoch": 5734} {"train_loss": -27.676233291625977, "global_step": 475969, "epoch": 5734} {"train_loss": -27.088083267211914, "global_step": 475970, "epoch": 5734} {"train_loss": -27.300949096679688, "global_step": 475971, "epoch": 5734} {"train_loss": -27.337350845336914, "global_step": 475972, "epoch": 5734} {"train_loss": -27.044965744018555, "global_step": 475973, "epoch": 5734} {"train_loss": -27.19168472290039, "global_step": 475974, "epoch": 5734} {"train_loss": -27.38504409790039, "global_step": 475975, "epoch": 5734} {"train_loss": -27.464948654174805, "global_step": 475976, "epoch": 5734} {"train_loss": -27.1414852142334, "global_step": 475977, "epoch": 5734} {"train_loss": -27.30620765686035, "global_step": 475978, "epoch": 5734} {"train_loss": -27.528284072875977, "global_step": 475979, "epoch": 5734} {"train_loss": -27.32847023010254, "global_step": 475980, "epoch": 5734} {"train_loss": -27.458471298217773, "global_step": 475981, "epoch": 5734} {"train_loss": -27.25876808166504, "global_step": 475982, "epoch": 5734} {"train_loss": -27.36173439025879, "global_step": 475983, "epoch": 5734} {"train_loss": -27.32221794128418, "global_step": 475984, "epoch": 5734} {"train_loss": -27.537092208862305, "global_step": 475985, "epoch": 5734} {"train_loss": -27.569080352783203, "global_step": 475986, "epoch": 5734} {"train_loss": -27.49725914001465, "global_step": 475987, "epoch": 5734} {"train_loss": -27.298635482788086, "global_step": 475988, "epoch": 5734} {"train_loss": -27.441679000854492, "global_step": 475989, "epoch": 5734} {"train_loss": -27.83074378967285, "global_step": 475990, "epoch": 5734} {"train_loss": -27.626575469970703, "global_step": 475991, "epoch": 5734} {"train_loss": -27.414098739624023, "global_step": 475992, "epoch": 5734} {"train_loss": -27.469934463500977, "global_step": 475993, "epoch": 5734} {"train_loss": -27.44022560119629, "global_step": 475994, "epoch": 5734} {"train_loss": -26.8746337890625, "global_step": 475995, "epoch": 5734} {"train_loss": -26.1300106048584, "global_step": 475996, "epoch": 5734} {"train_loss": -24.96590232849121, "global_step": 475997, "epoch": 5734} {"train_loss": -25.244091033935547, "global_step": 475998, "epoch": 5734} {"train_loss": -26.482746124267578, "global_step": 475999, "epoch": 5734} {"train_loss": -26.702655792236328, "global_step": 476000, "epoch": 5734} {"train_loss": -26.350330352783203, "global_step": 476001, "epoch": 5734} {"train_loss": -26.4168701171875, "global_step": 476002, "epoch": 5734} {"train_loss": -25.812305450439453, "global_step": 476003, "epoch": 5734} {"train_loss": -26.945763944143273, "global_step": 476004, "epoch": 5734, "val_loss": 6659128.5} {"train_loss": -24.782148361206055, "global_step": 476005, "epoch": 5735} {"train_loss": -25.069358825683594, "global_step": 476006, "epoch": 5735} {"train_loss": -26.490137100219727, "global_step": 476007, "epoch": 5735} {"train_loss": -25.330053329467773, "global_step": 476008, "epoch": 5735} {"train_loss": -25.674909591674805, "global_step": 476009, "epoch": 5735} {"train_loss": -25.748071670532227, "global_step": 476010, "epoch": 5735} {"train_loss": -25.72926139831543, "global_step": 476011, "epoch": 5735} {"train_loss": -25.875959396362305, "global_step": 476012, "epoch": 5735} {"train_loss": -25.922998428344727, "global_step": 476013, "epoch": 5735} {"train_loss": -25.901899337768555, "global_step": 476014, "epoch": 5735} {"train_loss": -25.921710968017578, "global_step": 476015, "epoch": 5735} {"train_loss": -25.793201446533203, "global_step": 476016, "epoch": 5735} {"train_loss": -26.8221492767334, "global_step": 476017, "epoch": 5735} {"train_loss": -25.649982452392578, "global_step": 476018, "epoch": 5735} {"train_loss": -26.617971420288086, "global_step": 476019, "epoch": 5735} {"train_loss": -26.457061767578125, "global_step": 476020, "epoch": 5735} {"train_loss": -26.447357177734375, "global_step": 476021, "epoch": 5735} {"train_loss": -26.487295150756836, "global_step": 476022, "epoch": 5735} {"train_loss": -25.916894912719727, "global_step": 476023, "epoch": 5735} {"train_loss": -26.35504722595215, "global_step": 476024, "epoch": 5735} {"train_loss": -26.799890518188477, "global_step": 476025, "epoch": 5735} {"train_loss": -26.77692985534668, "global_step": 476026, "epoch": 5735} {"train_loss": -26.530920028686523, "global_step": 476027, "epoch": 5735} {"train_loss": -26.87332534790039, "global_step": 476028, "epoch": 5735} {"train_loss": -26.892751693725586, "global_step": 476029, "epoch": 5735} {"train_loss": -27.051395416259766, "global_step": 476030, "epoch": 5735} {"train_loss": -26.951074600219727, "global_step": 476031, "epoch": 5735} {"train_loss": -26.81033706665039, "global_step": 476032, "epoch": 5735} {"train_loss": -26.8604793548584, "global_step": 476033, "epoch": 5735} {"train_loss": -27.1540584564209, "global_step": 476034, "epoch": 5735} {"train_loss": -26.86167335510254, "global_step": 476035, "epoch": 5735} {"train_loss": -27.204349517822266, "global_step": 476036, "epoch": 5735} {"train_loss": -27.1507625579834, "global_step": 476037, "epoch": 5735} {"train_loss": -27.211332321166992, "global_step": 476038, "epoch": 5735} {"train_loss": -27.097936630249023, "global_step": 476039, "epoch": 5735} {"train_loss": -27.106338500976562, "global_step": 476040, "epoch": 5735} {"train_loss": -27.355222702026367, "global_step": 476041, "epoch": 5735} {"train_loss": -26.99696159362793, "global_step": 476042, "epoch": 5735} {"train_loss": -27.19915771484375, "global_step": 476043, "epoch": 5735} {"train_loss": -27.307546615600586, "global_step": 476044, "epoch": 5735} {"train_loss": -27.04523277282715, "global_step": 476045, "epoch": 5735} {"train_loss": -27.261295318603516, "global_step": 476046, "epoch": 5735} {"train_loss": -27.34735107421875, "global_step": 476047, "epoch": 5735} {"train_loss": -27.294605255126953, "global_step": 476048, "epoch": 5735} {"train_loss": -27.460554122924805, "global_step": 476049, "epoch": 5735} {"train_loss": -27.260465621948242, "global_step": 476050, "epoch": 5735} {"train_loss": -27.525644302368164, "global_step": 476051, "epoch": 5735} {"train_loss": -27.227537155151367, "global_step": 476052, "epoch": 5735} {"train_loss": -27.733556747436523, "global_step": 476053, "epoch": 5735} {"train_loss": -27.472822189331055, "global_step": 476054, "epoch": 5735} {"train_loss": -27.33258628845215, "global_step": 476055, "epoch": 5735} {"train_loss": -27.179656982421875, "global_step": 476056, "epoch": 5735} {"train_loss": -27.48483657836914, "global_step": 476057, "epoch": 5735} {"train_loss": -27.85639762878418, "global_step": 476058, "epoch": 5735} {"train_loss": -27.434919357299805, "global_step": 476059, "epoch": 5735} {"train_loss": -27.150959014892578, "global_step": 476060, "epoch": 5735} {"train_loss": -27.717161178588867, "global_step": 476061, "epoch": 5735} {"train_loss": -27.634998321533203, "global_step": 476062, "epoch": 5735} {"train_loss": -27.56171226501465, "global_step": 476063, "epoch": 5735} {"train_loss": -27.282651901245117, "global_step": 476064, "epoch": 5735} {"train_loss": -27.674381256103516, "global_step": 476065, "epoch": 5735} {"train_loss": -27.590015411376953, "global_step": 476066, "epoch": 5735} {"train_loss": -27.245264053344727, "global_step": 476067, "epoch": 5735} {"train_loss": -27.310327529907227, "global_step": 476068, "epoch": 5735} {"train_loss": -26.253442764282227, "global_step": 476069, "epoch": 5735} {"train_loss": -26.45668601989746, "global_step": 476070, "epoch": 5735} {"train_loss": -27.081714630126953, "global_step": 476071, "epoch": 5735} {"train_loss": -27.129413604736328, "global_step": 476072, "epoch": 5735} {"train_loss": -27.346277236938477, "global_step": 476073, "epoch": 5735} {"train_loss": -27.28643226623535, "global_step": 476074, "epoch": 5735} {"train_loss": -27.36903953552246, "global_step": 476075, "epoch": 5735} {"train_loss": -27.153003692626953, "global_step": 476076, "epoch": 5735} {"train_loss": -26.981708526611328, "global_step": 476077, "epoch": 5735} {"train_loss": -27.175037384033203, "global_step": 476078, "epoch": 5735} {"train_loss": -27.153573989868164, "global_step": 476079, "epoch": 5735} {"train_loss": -27.374841690063477, "global_step": 476080, "epoch": 5735} {"train_loss": -27.264801025390625, "global_step": 476081, "epoch": 5735} {"train_loss": -27.211761474609375, "global_step": 476082, "epoch": 5735} {"train_loss": -27.260263442993164, "global_step": 476083, "epoch": 5735} {"train_loss": -27.452482223510742, "global_step": 476084, "epoch": 5735} {"train_loss": -27.538644790649414, "global_step": 476085, "epoch": 5735} {"train_loss": -27.264251708984375, "global_step": 476086, "epoch": 5735} {"train_loss": -26.906520177082843, "global_step": 476087, "epoch": 5735, "val_loss": 6600442.0} {"train_loss": -26.790388107299805, "global_step": 476088, "epoch": 5736} {"train_loss": -26.63445472717285, "global_step": 476089, "epoch": 5736} {"train_loss": -27.21421241760254, "global_step": 476090, "epoch": 5736} {"train_loss": -26.88852310180664, "global_step": 476091, "epoch": 5736} {"train_loss": -26.821308135986328, "global_step": 476092, "epoch": 5736} {"train_loss": -26.954862594604492, "global_step": 476093, "epoch": 5736} {"train_loss": -26.697437286376953, "global_step": 476094, "epoch": 5736} {"train_loss": -26.914670944213867, "global_step": 476095, "epoch": 5736} {"train_loss": -26.93525505065918, "global_step": 476096, "epoch": 5736} {"train_loss": -26.87262535095215, "global_step": 476097, "epoch": 5736} {"train_loss": -27.044788360595703, "global_step": 476098, "epoch": 5736} {"train_loss": -26.873214721679688, "global_step": 476099, "epoch": 5736} {"train_loss": -27.160938262939453, "global_step": 476100, "epoch": 5736} {"train_loss": -27.11610984802246, "global_step": 476101, "epoch": 5736} {"train_loss": -27.042469024658203, "global_step": 476102, "epoch": 5736} {"train_loss": -26.966632843017578, "global_step": 476103, "epoch": 5736} {"train_loss": -27.487197875976562, "global_step": 476104, "epoch": 5736} {"train_loss": -26.794424057006836, "global_step": 476105, "epoch": 5736} {"train_loss": -26.397153854370117, "global_step": 476106, "epoch": 5736} {"train_loss": -26.795032501220703, "global_step": 476107, "epoch": 5736} {"train_loss": -27.185522079467773, "global_step": 476108, "epoch": 5736} {"train_loss": -27.047101974487305, "global_step": 476109, "epoch": 5736} {"train_loss": -26.944299697875977, "global_step": 476110, "epoch": 5736} {"train_loss": -26.741296768188477, "global_step": 476111, "epoch": 5736} {"train_loss": -26.653244018554688, "global_step": 476112, "epoch": 5736} {"train_loss": -27.2025203704834, "global_step": 476113, "epoch": 5736} {"train_loss": -27.315622329711914, "global_step": 476114, "epoch": 5736} {"train_loss": -27.29315185546875, "global_step": 476115, "epoch": 5736} {"train_loss": -27.539901733398438, "global_step": 476116, "epoch": 5736} {"train_loss": -26.945270538330078, "global_step": 476117, "epoch": 5736} {"train_loss": -26.857318878173828, "global_step": 476118, "epoch": 5736} {"train_loss": -27.166671752929688, "global_step": 476119, "epoch": 5736} {"train_loss": -27.436914443969727, "global_step": 476120, "epoch": 5736} {"train_loss": -26.94118309020996, "global_step": 476121, "epoch": 5736} {"train_loss": -27.241209030151367, "global_step": 476122, "epoch": 5736} {"train_loss": -27.425601959228516, "global_step": 476123, "epoch": 5736} {"train_loss": -26.76327896118164, "global_step": 476124, "epoch": 5736} {"train_loss": -27.097265243530273, "global_step": 476125, "epoch": 5736} {"train_loss": -27.070859909057617, "global_step": 476126, "epoch": 5736} {"train_loss": -27.138715744018555, "global_step": 476127, "epoch": 5736} {"train_loss": -27.355249404907227, "global_step": 476128, "epoch": 5736} {"train_loss": -27.293821334838867, "global_step": 476129, "epoch": 5736} {"train_loss": -27.12613868713379, "global_step": 476130, "epoch": 5736} {"train_loss": -26.932647705078125, "global_step": 476131, "epoch": 5736} {"train_loss": -27.61823844909668, "global_step": 476132, "epoch": 5736} {"train_loss": -27.20021629333496, "global_step": 476133, "epoch": 5736} {"train_loss": -27.26515007019043, "global_step": 476134, "epoch": 5736} {"train_loss": -26.889631271362305, "global_step": 476135, "epoch": 5736} {"train_loss": -27.651397705078125, "global_step": 476136, "epoch": 5736} {"train_loss": -27.131025314331055, "global_step": 476137, "epoch": 5736} {"train_loss": -27.31315040588379, "global_step": 476138, "epoch": 5736} {"train_loss": -27.233551025390625, "global_step": 476139, "epoch": 5736} {"train_loss": -27.574132919311523, "global_step": 476140, "epoch": 5736} {"train_loss": -27.325580596923828, "global_step": 476141, "epoch": 5736} {"train_loss": -27.062681198120117, "global_step": 476142, "epoch": 5736} {"train_loss": -27.193445205688477, "global_step": 476143, "epoch": 5736} {"train_loss": -27.47059440612793, "global_step": 476144, "epoch": 5736} {"train_loss": -26.941221237182617, "global_step": 476145, "epoch": 5736} {"train_loss": -27.367334365844727, "global_step": 476146, "epoch": 5736} {"train_loss": -27.451318740844727, "global_step": 476147, "epoch": 5736} {"train_loss": -27.167638778686523, "global_step": 476148, "epoch": 5736} {"train_loss": -27.180566787719727, "global_step": 476149, "epoch": 5736} {"train_loss": -26.812170028686523, "global_step": 476150, "epoch": 5736} {"train_loss": -27.098297119140625, "global_step": 476151, "epoch": 5736} {"train_loss": -27.42569351196289, "global_step": 476152, "epoch": 5736} {"train_loss": -27.091339111328125, "global_step": 476153, "epoch": 5736} {"train_loss": -27.1014404296875, "global_step": 476154, "epoch": 5736} {"train_loss": -26.91798210144043, "global_step": 476155, "epoch": 5736} {"train_loss": -26.857553482055664, "global_step": 476156, "epoch": 5736} {"train_loss": -26.33942222595215, "global_step": 476157, "epoch": 5736} {"train_loss": -27.004657745361328, "global_step": 476158, "epoch": 5736} {"train_loss": -27.184173583984375, "global_step": 476159, "epoch": 5736} {"train_loss": -27.304121017456055, "global_step": 476160, "epoch": 5736} {"train_loss": -27.397296905517578, "global_step": 476161, "epoch": 5736} {"train_loss": -27.335302352905273, "global_step": 476162, "epoch": 5736} {"train_loss": -27.120309829711914, "global_step": 476163, "epoch": 5736} {"train_loss": -27.161273956298828, "global_step": 476164, "epoch": 5736} {"train_loss": -27.0816593170166, "global_step": 476165, "epoch": 5736} {"train_loss": -26.975666046142578, "global_step": 476166, "epoch": 5736} {"train_loss": -27.349145889282227, "global_step": 476167, "epoch": 5736} {"train_loss": -26.844390869140625, "global_step": 476168, "epoch": 5736} {"train_loss": -27.145334243774414, "global_step": 476169, "epoch": 5736} {"train_loss": -27.097038475863904, "global_step": 476170, "epoch": 5736, "val_loss": 6627942.5} {"train_loss": -25.715970993041992, "global_step": 476171, "epoch": 5737} {"train_loss": -26.119474411010742, "global_step": 476172, "epoch": 5737} {"train_loss": -26.251989364624023, "global_step": 476173, "epoch": 5737} {"train_loss": -25.917211532592773, "global_step": 476174, "epoch": 5737} {"train_loss": -26.28486442565918, "global_step": 476175, "epoch": 5737} {"train_loss": -26.353015899658203, "global_step": 476176, "epoch": 5737} {"train_loss": -26.463361740112305, "global_step": 476177, "epoch": 5737} {"train_loss": -26.501083374023438, "global_step": 476178, "epoch": 5737} {"train_loss": -26.7302188873291, "global_step": 476179, "epoch": 5737} {"train_loss": -26.598194122314453, "global_step": 476180, "epoch": 5737} {"train_loss": -27.25126075744629, "global_step": 476181, "epoch": 5737} {"train_loss": -26.697778701782227, "global_step": 476182, "epoch": 5737} {"train_loss": -26.53887939453125, "global_step": 476183, "epoch": 5737} {"train_loss": -26.309860229492188, "global_step": 476184, "epoch": 5737} {"train_loss": -26.578750610351562, "global_step": 476185, "epoch": 5737} {"train_loss": -26.624807357788086, "global_step": 476186, "epoch": 5737} {"train_loss": -27.046772003173828, "global_step": 476187, "epoch": 5737} {"train_loss": -27.237442016601562, "global_step": 476188, "epoch": 5737} {"train_loss": -26.6805419921875, "global_step": 476189, "epoch": 5737} {"train_loss": -26.9566650390625, "global_step": 476190, "epoch": 5737} {"train_loss": -26.710229873657227, "global_step": 476191, "epoch": 5737} {"train_loss": -27.055999755859375, "global_step": 476192, "epoch": 5737} {"train_loss": -26.668140411376953, "global_step": 476193, "epoch": 5737} {"train_loss": -26.991180419921875, "global_step": 476194, "epoch": 5737} {"train_loss": -26.8583927154541, "global_step": 476195, "epoch": 5737} {"train_loss": -27.26043701171875, "global_step": 476196, "epoch": 5737} {"train_loss": -26.943984985351562, "global_step": 476197, "epoch": 5737} {"train_loss": -27.329345703125, "global_step": 476198, "epoch": 5737} {"train_loss": -27.35687828063965, "global_step": 476199, "epoch": 5737} {"train_loss": -27.225662231445312, "global_step": 476200, "epoch": 5737} {"train_loss": -27.283971786499023, "global_step": 476201, "epoch": 5737} {"train_loss": -27.0401611328125, "global_step": 476202, "epoch": 5737} {"train_loss": -27.66901969909668, "global_step": 476203, "epoch": 5737} {"train_loss": -27.065214157104492, "global_step": 476204, "epoch": 5737} {"train_loss": -27.060529708862305, "global_step": 476205, "epoch": 5737} {"train_loss": -27.203222274780273, "global_step": 476206, "epoch": 5737} {"train_loss": -27.575550079345703, "global_step": 476207, "epoch": 5737} {"train_loss": -26.87421226501465, "global_step": 476208, "epoch": 5737} {"train_loss": -26.985788345336914, "global_step": 476209, "epoch": 5737} {"train_loss": -26.958332061767578, "global_step": 476210, "epoch": 5737} {"train_loss": -27.20997428894043, "global_step": 476211, "epoch": 5737} {"train_loss": -27.493066787719727, "global_step": 476212, "epoch": 5737} {"train_loss": -27.252349853515625, "global_step": 476213, "epoch": 5737} {"train_loss": -26.987781524658203, "global_step": 476214, "epoch": 5737} {"train_loss": -27.50494956970215, "global_step": 476215, "epoch": 5737} {"train_loss": -27.250120162963867, "global_step": 476216, "epoch": 5737} {"train_loss": -27.20857048034668, "global_step": 476217, "epoch": 5737} {"train_loss": -27.569883346557617, "global_step": 476218, "epoch": 5737} {"train_loss": -27.6763916015625, "global_step": 476219, "epoch": 5737} {"train_loss": -27.2586612701416, "global_step": 476220, "epoch": 5737} {"train_loss": -27.24203872680664, "global_step": 476221, "epoch": 5737} {"train_loss": -27.207059860229492, "global_step": 476222, "epoch": 5737} {"train_loss": -27.034391403198242, "global_step": 476223, "epoch": 5737} {"train_loss": -27.113367080688477, "global_step": 476224, "epoch": 5737} {"train_loss": -27.460752487182617, "global_step": 476225, "epoch": 5737} {"train_loss": -27.524057388305664, "global_step": 476226, "epoch": 5737} {"train_loss": -27.478490829467773, "global_step": 476227, "epoch": 5737} {"train_loss": -27.209890365600586, "global_step": 476228, "epoch": 5737} {"train_loss": -27.357807159423828, "global_step": 476229, "epoch": 5737} {"train_loss": -27.442169189453125, "global_step": 476230, "epoch": 5737} {"train_loss": -27.40766716003418, "global_step": 476231, "epoch": 5737} {"train_loss": -27.139135360717773, "global_step": 476232, "epoch": 5737} {"train_loss": -27.246936798095703, "global_step": 476233, "epoch": 5737} {"train_loss": -27.50678062438965, "global_step": 476234, "epoch": 5737} {"train_loss": -27.331281661987305, "global_step": 476235, "epoch": 5737} {"train_loss": -27.76480484008789, "global_step": 476236, "epoch": 5737} {"train_loss": -27.518707275390625, "global_step": 476237, "epoch": 5737} {"train_loss": -27.35382080078125, "global_step": 476238, "epoch": 5737} {"train_loss": -27.473257064819336, "global_step": 476239, "epoch": 5737} {"train_loss": -27.171255111694336, "global_step": 476240, "epoch": 5737} {"train_loss": -27.1611328125, "global_step": 476241, "epoch": 5737} {"train_loss": -27.158430099487305, "global_step": 476242, "epoch": 5737} {"train_loss": -27.271451950073242, "global_step": 476243, "epoch": 5737} {"train_loss": -27.107135772705078, "global_step": 476244, "epoch": 5737} {"train_loss": -27.453998565673828, "global_step": 476245, "epoch": 5737} {"train_loss": -27.218963623046875, "global_step": 476246, "epoch": 5737} {"train_loss": -27.245695114135742, "global_step": 476247, "epoch": 5737} {"train_loss": -27.154296875, "global_step": 476248, "epoch": 5737} {"train_loss": -27.622303009033203, "global_step": 476249, "epoch": 5737} {"train_loss": -27.397119522094727, "global_step": 476250, "epoch": 5737} {"train_loss": -26.463260650634766, "global_step": 476251, "epoch": 5737} {"train_loss": -26.493284225463867, "global_step": 476252, "epoch": 5737} {"train_loss": -27.069113421152874, "global_step": 476253, "epoch": 5737, "val_loss": 6632949.5} {"train_loss": -25.979328155517578, "global_step": 476254, "epoch": 5738} {"train_loss": -26.289331436157227, "global_step": 476255, "epoch": 5738} {"train_loss": -25.74677848815918, "global_step": 476256, "epoch": 5738} {"train_loss": -24.616992950439453, "global_step": 476257, "epoch": 5738} {"train_loss": -26.41914939880371, "global_step": 476258, "epoch": 5738} {"train_loss": -25.656494140625, "global_step": 476259, "epoch": 5738} {"train_loss": -26.481897354125977, "global_step": 476260, "epoch": 5738} {"train_loss": -25.60527992248535, "global_step": 476261, "epoch": 5738} {"train_loss": -26.130813598632812, "global_step": 476262, "epoch": 5738} {"train_loss": -26.028501510620117, "global_step": 476263, "epoch": 5738} {"train_loss": -25.781827926635742, "global_step": 476264, "epoch": 5738} {"train_loss": -26.59433364868164, "global_step": 476265, "epoch": 5738} {"train_loss": -26.224811553955078, "global_step": 476266, "epoch": 5738} {"train_loss": -26.601499557495117, "global_step": 476267, "epoch": 5738} {"train_loss": -26.412363052368164, "global_step": 476268, "epoch": 5738} {"train_loss": -26.10190200805664, "global_step": 476269, "epoch": 5738} {"train_loss": -26.349777221679688, "global_step": 476270, "epoch": 5738} {"train_loss": -26.66522789001465, "global_step": 476271, "epoch": 5738} {"train_loss": -26.29035758972168, "global_step": 476272, "epoch": 5738} {"train_loss": -26.589862823486328, "global_step": 476273, "epoch": 5738} {"train_loss": -26.58697509765625, "global_step": 476274, "epoch": 5738} {"train_loss": -26.584375381469727, "global_step": 476275, "epoch": 5738} {"train_loss": -26.217329025268555, "global_step": 476276, "epoch": 5738} {"train_loss": -26.673852920532227, "global_step": 476277, "epoch": 5738} {"train_loss": -27.096847534179688, "global_step": 476278, "epoch": 5738} {"train_loss": -26.66873550415039, "global_step": 476279, "epoch": 5738} {"train_loss": -26.90553092956543, "global_step": 476280, "epoch": 5738} {"train_loss": -26.79302978515625, "global_step": 476281, "epoch": 5738} {"train_loss": -27.055566787719727, "global_step": 476282, "epoch": 5738} {"train_loss": -27.177490234375, "global_step": 476283, "epoch": 5738} {"train_loss": -26.9963321685791, "global_step": 476284, "epoch": 5738} {"train_loss": -27.1624755859375, "global_step": 476285, "epoch": 5738} {"train_loss": -27.096784591674805, "global_step": 476286, "epoch": 5738} {"train_loss": -27.0928955078125, "global_step": 476287, "epoch": 5738} {"train_loss": -27.369489669799805, "global_step": 476288, "epoch": 5738} {"train_loss": -26.894699096679688, "global_step": 476289, "epoch": 5738} {"train_loss": -26.645788192749023, "global_step": 476290, "epoch": 5738} {"train_loss": -27.308216094970703, "global_step": 476291, "epoch": 5738} {"train_loss": -27.330825805664062, "global_step": 476292, "epoch": 5738} {"train_loss": -27.16131019592285, "global_step": 476293, "epoch": 5738} {"train_loss": -27.247053146362305, "global_step": 476294, "epoch": 5738} {"train_loss": -27.04450035095215, "global_step": 476295, "epoch": 5738} {"train_loss": -27.132593154907227, "global_step": 476296, "epoch": 5738} {"train_loss": -27.57728385925293, "global_step": 476297, "epoch": 5738} {"train_loss": -27.19256019592285, "global_step": 476298, "epoch": 5738} {"train_loss": -27.37652587890625, "global_step": 476299, "epoch": 5738} {"train_loss": -27.21070671081543, "global_step": 476300, "epoch": 5738} {"train_loss": -27.008649826049805, "global_step": 476301, "epoch": 5738} {"train_loss": -27.31292724609375, "global_step": 476302, "epoch": 5738} {"train_loss": -26.869476318359375, "global_step": 476303, "epoch": 5738} {"train_loss": -27.398303985595703, "global_step": 476304, "epoch": 5738} {"train_loss": -27.38105583190918, "global_step": 476305, "epoch": 5738} {"train_loss": -27.278228759765625, "global_step": 476306, "epoch": 5738} {"train_loss": -27.461933135986328, "global_step": 476307, "epoch": 5738} {"train_loss": -27.50685691833496, "global_step": 476308, "epoch": 5738} {"train_loss": -27.482030868530273, "global_step": 476309, "epoch": 5738} {"train_loss": -27.331745147705078, "global_step": 476310, "epoch": 5738} {"train_loss": -27.554004669189453, "global_step": 476311, "epoch": 5738} {"train_loss": -27.274011611938477, "global_step": 476312, "epoch": 5738} {"train_loss": -27.228796005249023, "global_step": 476313, "epoch": 5738} {"train_loss": -27.248437881469727, "global_step": 476314, "epoch": 5738} {"train_loss": -27.096403121948242, "global_step": 476315, "epoch": 5738} {"train_loss": -27.4033203125, "global_step": 476316, "epoch": 5738} {"train_loss": -27.825361251831055, "global_step": 476317, "epoch": 5738} {"train_loss": -27.453916549682617, "global_step": 476318, "epoch": 5738} {"train_loss": -27.862567901611328, "global_step": 476319, "epoch": 5738} {"train_loss": -27.221420288085938, "global_step": 476320, "epoch": 5738} {"train_loss": -27.72216796875, "global_step": 476321, "epoch": 5738} {"train_loss": -27.187116622924805, "global_step": 476322, "epoch": 5738} {"train_loss": -27.18753433227539, "global_step": 476323, "epoch": 5738} {"train_loss": -27.27132225036621, "global_step": 476324, "epoch": 5738} {"train_loss": -27.212921142578125, "global_step": 476325, "epoch": 5738} {"train_loss": -27.122547149658203, "global_step": 476326, "epoch": 5738} {"train_loss": -27.237112045288086, "global_step": 476327, "epoch": 5738} {"train_loss": -26.944477081298828, "global_step": 476328, "epoch": 5738} {"train_loss": -26.1640567779541, "global_step": 476329, "epoch": 5738} {"train_loss": -26.620370864868164, "global_step": 476330, "epoch": 5738} {"train_loss": -27.075422286987305, "global_step": 476331, "epoch": 5738} {"train_loss": -27.528675079345703, "global_step": 476332, "epoch": 5738} {"train_loss": -27.03665542602539, "global_step": 476333, "epoch": 5738} {"train_loss": -26.854084014892578, "global_step": 476334, "epoch": 5738} {"train_loss": -27.333099365234375, "global_step": 476335, "epoch": 5738} {"train_loss": -26.887320139321936, "global_step": 476336, "epoch": 5738, "val_loss": 6728765.5} {"train_loss": -26.126708984375, "global_step": 476337, "epoch": 5739} {"train_loss": -26.494094848632812, "global_step": 476338, "epoch": 5739} {"train_loss": -27.039382934570312, "global_step": 476339, "epoch": 5739} {"train_loss": -26.552021026611328, "global_step": 476340, "epoch": 5739} {"train_loss": -26.96038246154785, "global_step": 476341, "epoch": 5739} {"train_loss": -27.119617462158203, "global_step": 476342, "epoch": 5739} {"train_loss": -26.393024444580078, "global_step": 476343, "epoch": 5739} {"train_loss": -27.140295028686523, "global_step": 476344, "epoch": 5739} {"train_loss": -26.672088623046875, "global_step": 476345, "epoch": 5739} {"train_loss": -26.56214714050293, "global_step": 476346, "epoch": 5739} {"train_loss": -27.00031852722168, "global_step": 476347, "epoch": 5739} {"train_loss": -26.78716468811035, "global_step": 476348, "epoch": 5739} {"train_loss": -27.022308349609375, "global_step": 476349, "epoch": 5739} {"train_loss": -27.08740234375, "global_step": 476350, "epoch": 5739} {"train_loss": -27.435760498046875, "global_step": 476351, "epoch": 5739} {"train_loss": -26.746463775634766, "global_step": 476352, "epoch": 5739} {"train_loss": -27.08443260192871, "global_step": 476353, "epoch": 5739} {"train_loss": -26.895771026611328, "global_step": 476354, "epoch": 5739} {"train_loss": -26.590198516845703, "global_step": 476355, "epoch": 5739} {"train_loss": -26.904977798461914, "global_step": 476356, "epoch": 5739} {"train_loss": -26.82248306274414, "global_step": 476357, "epoch": 5739} {"train_loss": -26.788700103759766, "global_step": 476358, "epoch": 5739} {"train_loss": -26.848867416381836, "global_step": 476359, "epoch": 5739} {"train_loss": -27.014318466186523, "global_step": 476360, "epoch": 5739} {"train_loss": -27.08930015563965, "global_step": 476361, "epoch": 5739} {"train_loss": -26.961719512939453, "global_step": 476362, "epoch": 5739} {"train_loss": -26.8966064453125, "global_step": 476363, "epoch": 5739} {"train_loss": -27.067920684814453, "global_step": 476364, "epoch": 5739} {"train_loss": -26.972253799438477, "global_step": 476365, "epoch": 5739} {"train_loss": -27.010498046875, "global_step": 476366, "epoch": 5739} {"train_loss": -27.2211856842041, "global_step": 476367, "epoch": 5739} {"train_loss": -27.310577392578125, "global_step": 476368, "epoch": 5739} {"train_loss": -26.9971981048584, "global_step": 476369, "epoch": 5739} {"train_loss": -27.23353385925293, "global_step": 476370, "epoch": 5739} {"train_loss": -27.151901245117188, "global_step": 476371, "epoch": 5739} {"train_loss": -27.245664596557617, "global_step": 476372, "epoch": 5739} {"train_loss": -27.266706466674805, "global_step": 476373, "epoch": 5739} {"train_loss": -27.289953231811523, "global_step": 476374, "epoch": 5739} {"train_loss": -27.073232650756836, "global_step": 476375, "epoch": 5739} {"train_loss": -27.643049240112305, "global_step": 476376, "epoch": 5739} {"train_loss": -27.31385612487793, "global_step": 476377, "epoch": 5739} {"train_loss": -26.91993522644043, "global_step": 476378, "epoch": 5739} {"train_loss": -27.398090362548828, "global_step": 476379, "epoch": 5739} {"train_loss": -26.840620040893555, "global_step": 476380, "epoch": 5739} {"train_loss": -27.267438888549805, "global_step": 476381, "epoch": 5739} {"train_loss": -27.35828971862793, "global_step": 476382, "epoch": 5739} {"train_loss": -27.233694076538086, "global_step": 476383, "epoch": 5739} {"train_loss": -27.166528701782227, "global_step": 476384, "epoch": 5739} {"train_loss": -27.1361026763916, "global_step": 476385, "epoch": 5739} {"train_loss": -27.356597900390625, "global_step": 476386, "epoch": 5739} {"train_loss": -27.378662109375, "global_step": 476387, "epoch": 5739} {"train_loss": -27.3531551361084, "global_step": 476388, "epoch": 5739} {"train_loss": -27.3345947265625, "global_step": 476389, "epoch": 5739} {"train_loss": -27.50166130065918, "global_step": 476390, "epoch": 5739} {"train_loss": -27.24907875061035, "global_step": 476391, "epoch": 5739} {"train_loss": -26.954626083374023, "global_step": 476392, "epoch": 5739} {"train_loss": -27.2607421875, "global_step": 476393, "epoch": 5739} {"train_loss": -26.8284854888916, "global_step": 476394, "epoch": 5739} {"train_loss": -27.14361572265625, "global_step": 476395, "epoch": 5739} {"train_loss": -27.840412139892578, "global_step": 476396, "epoch": 5739} {"train_loss": -27.663278579711914, "global_step": 476397, "epoch": 5739} {"train_loss": -27.321765899658203, "global_step": 476398, "epoch": 5739} {"train_loss": -26.88565444946289, "global_step": 476399, "epoch": 5739} {"train_loss": -27.35873794555664, "global_step": 476400, "epoch": 5739} {"train_loss": -27.478591918945312, "global_step": 476401, "epoch": 5739} {"train_loss": -27.43813133239746, "global_step": 476402, "epoch": 5739} {"train_loss": -27.32828140258789, "global_step": 476403, "epoch": 5739} {"train_loss": -26.88435173034668, "global_step": 476404, "epoch": 5739} {"train_loss": -27.542394638061523, "global_step": 476405, "epoch": 5739} {"train_loss": -27.6340389251709, "global_step": 476406, "epoch": 5739} {"train_loss": -27.298994064331055, "global_step": 476407, "epoch": 5739} {"train_loss": -27.1560001373291, "global_step": 476408, "epoch": 5739} {"train_loss": -26.97113037109375, "global_step": 476409, "epoch": 5739} {"train_loss": -27.258331298828125, "global_step": 476410, "epoch": 5739} {"train_loss": -27.055566787719727, "global_step": 476411, "epoch": 5739} {"train_loss": -27.073902130126953, "global_step": 476412, "epoch": 5739} {"train_loss": -27.303693771362305, "global_step": 476413, "epoch": 5739} {"train_loss": -27.086181640625, "global_step": 476414, "epoch": 5739} {"train_loss": -27.69412612915039, "global_step": 476415, "epoch": 5739} {"train_loss": -27.242633819580078, "global_step": 476416, "epoch": 5739} {"train_loss": -27.49151611328125, "global_step": 476417, "epoch": 5739} {"train_loss": -27.27796745300293, "global_step": 476418, "epoch": 5739} {"train_loss": -27.13055013174034, "global_step": 476419, "epoch": 5739, "val_loss": 6590530.0} {"train_loss": -26.91121482849121, "global_step": 476420, "epoch": 5740} {"train_loss": -27.043699264526367, "global_step": 476421, "epoch": 5740} {"train_loss": -26.896076202392578, "global_step": 476422, "epoch": 5740} {"train_loss": -27.30655860900879, "global_step": 476423, "epoch": 5740} {"train_loss": -26.635534286499023, "global_step": 476424, "epoch": 5740} {"train_loss": -27.263025283813477, "global_step": 476425, "epoch": 5740} {"train_loss": -27.409643173217773, "global_step": 476426, "epoch": 5740} {"train_loss": -27.16458511352539, "global_step": 476427, "epoch": 5740} {"train_loss": -27.042682647705078, "global_step": 476428, "epoch": 5740} {"train_loss": -27.053085327148438, "global_step": 476429, "epoch": 5740} {"train_loss": -27.19019889831543, "global_step": 476430, "epoch": 5740} {"train_loss": -27.242755889892578, "global_step": 476431, "epoch": 5740} {"train_loss": -27.419239044189453, "global_step": 476432, "epoch": 5740} {"train_loss": -26.99151039123535, "global_step": 476433, "epoch": 5740} {"train_loss": -26.821857452392578, "global_step": 476434, "epoch": 5740} {"train_loss": -27.53621482849121, "global_step": 476435, "epoch": 5740} {"train_loss": -27.154821395874023, "global_step": 476436, "epoch": 5740} {"train_loss": -27.326663970947266, "global_step": 476437, "epoch": 5740} {"train_loss": -27.233251571655273, "global_step": 476438, "epoch": 5740} {"train_loss": -27.05488395690918, "global_step": 476439, "epoch": 5740} {"train_loss": -27.2982120513916, "global_step": 476440, "epoch": 5740} {"train_loss": -27.17746353149414, "global_step": 476441, "epoch": 5740} {"train_loss": -27.355146408081055, "global_step": 476442, "epoch": 5740} {"train_loss": -27.37528419494629, "global_step": 476443, "epoch": 5740} {"train_loss": -27.076007843017578, "global_step": 476444, "epoch": 5740} {"train_loss": -26.718957901000977, "global_step": 476445, "epoch": 5740} {"train_loss": -27.477262496948242, "global_step": 476446, "epoch": 5740} {"train_loss": -27.42462730407715, "global_step": 476447, "epoch": 5740} {"train_loss": -27.1013240814209, "global_step": 476448, "epoch": 5740} {"train_loss": -26.68433952331543, "global_step": 476449, "epoch": 5740} {"train_loss": -27.219654083251953, "global_step": 476450, "epoch": 5740} {"train_loss": -27.38498306274414, "global_step": 476451, "epoch": 5740} {"train_loss": -27.47185707092285, "global_step": 476452, "epoch": 5740} {"train_loss": -27.398086547851562, "global_step": 476453, "epoch": 5740} {"train_loss": -27.1014404296875, "global_step": 476454, "epoch": 5740} {"train_loss": -26.860334396362305, "global_step": 476455, "epoch": 5740} {"train_loss": -27.25330924987793, "global_step": 476456, "epoch": 5740} {"train_loss": -27.278844833374023, "global_step": 476457, "epoch": 5740} {"train_loss": -27.239990234375, "global_step": 476458, "epoch": 5740} {"train_loss": -27.464874267578125, "global_step": 476459, "epoch": 5740} {"train_loss": -26.987695693969727, "global_step": 476460, "epoch": 5740} {"train_loss": -27.57415199279785, "global_step": 476461, "epoch": 5740} {"train_loss": -27.253339767456055, "global_step": 476462, "epoch": 5740} {"train_loss": -26.821775436401367, "global_step": 476463, "epoch": 5740} {"train_loss": -27.293195724487305, "global_step": 476464, "epoch": 5740} {"train_loss": -27.32793617248535, "global_step": 476465, "epoch": 5740} {"train_loss": -27.170486450195312, "global_step": 476466, "epoch": 5740} {"train_loss": -27.123144149780273, "global_step": 476467, "epoch": 5740} {"train_loss": -27.5317325592041, "global_step": 476468, "epoch": 5740} {"train_loss": -27.424779891967773, "global_step": 476469, "epoch": 5740} {"train_loss": -27.567413330078125, "global_step": 476470, "epoch": 5740} {"train_loss": -27.33286476135254, "global_step": 476471, "epoch": 5740} {"train_loss": -27.002716064453125, "global_step": 476472, "epoch": 5740} {"train_loss": -27.09159278869629, "global_step": 476473, "epoch": 5740} {"train_loss": -27.252973556518555, "global_step": 476474, "epoch": 5740} {"train_loss": -27.296873092651367, "global_step": 476475, "epoch": 5740} {"train_loss": -27.5560302734375, "global_step": 476476, "epoch": 5740} {"train_loss": -27.030797958374023, "global_step": 476477, "epoch": 5740} {"train_loss": -27.54340171813965, "global_step": 476478, "epoch": 5740} {"train_loss": -27.652191162109375, "global_step": 476479, "epoch": 5740} {"train_loss": -27.33353614807129, "global_step": 476480, "epoch": 5740} {"train_loss": -27.35288429260254, "global_step": 476481, "epoch": 5740} {"train_loss": -26.88392448425293, "global_step": 476482, "epoch": 5740} {"train_loss": -27.43060302734375, "global_step": 476483, "epoch": 5740} {"train_loss": -27.420759201049805, "global_step": 476484, "epoch": 5740} {"train_loss": -27.277191162109375, "global_step": 476485, "epoch": 5740} {"train_loss": -26.933990478515625, "global_step": 476486, "epoch": 5740} {"train_loss": -26.934614181518555, "global_step": 476487, "epoch": 5740} {"train_loss": -26.994260787963867, "global_step": 476488, "epoch": 5740} {"train_loss": -27.324832916259766, "global_step": 476489, "epoch": 5740} {"train_loss": -27.47406578063965, "global_step": 476490, "epoch": 5740} {"train_loss": -27.390323638916016, "global_step": 476491, "epoch": 5740} {"train_loss": -27.353565216064453, "global_step": 476492, "epoch": 5740} {"train_loss": -27.463438034057617, "global_step": 476493, "epoch": 5740} {"train_loss": -27.849689483642578, "global_step": 476494, "epoch": 5740} {"train_loss": -27.29630470275879, "global_step": 476495, "epoch": 5740} {"train_loss": -27.492456436157227, "global_step": 476496, "epoch": 5740} {"train_loss": -27.640119552612305, "global_step": 476497, "epoch": 5740} {"train_loss": -27.375452041625977, "global_step": 476498, "epoch": 5740} {"train_loss": -27.0540771484375, "global_step": 476499, "epoch": 5740} {"train_loss": -27.267282485961914, "global_step": 476500, "epoch": 5740} {"train_loss": -27.28594398498535, "global_step": 476501, "epoch": 5740} {"train_loss": -27.229169431939184, "global_step": 476502, "epoch": 5740, "val_loss": 6632409.0} {"train_loss": -26.395734786987305, "global_step": 476503, "epoch": 5741} {"train_loss": -26.0040340423584, "global_step": 476504, "epoch": 5741} {"train_loss": -25.654251098632812, "global_step": 476505, "epoch": 5741} {"train_loss": -26.93360710144043, "global_step": 476506, "epoch": 5741} {"train_loss": -26.371326446533203, "global_step": 476507, "epoch": 5741} {"train_loss": -26.59234619140625, "global_step": 476508, "epoch": 5741} {"train_loss": -27.124347686767578, "global_step": 476509, "epoch": 5741} {"train_loss": -26.639673233032227, "global_step": 476510, "epoch": 5741} {"train_loss": -26.455991744995117, "global_step": 476511, "epoch": 5741} {"train_loss": -27.1369571685791, "global_step": 476512, "epoch": 5741} {"train_loss": -26.777359008789062, "global_step": 476513, "epoch": 5741} {"train_loss": -26.901477813720703, "global_step": 476514, "epoch": 5741} {"train_loss": -26.412857055664062, "global_step": 476515, "epoch": 5741} {"train_loss": -26.930383682250977, "global_step": 476516, "epoch": 5741} {"train_loss": -26.841760635375977, "global_step": 476517, "epoch": 5741} {"train_loss": -26.815326690673828, "global_step": 476518, "epoch": 5741} {"train_loss": -27.179960250854492, "global_step": 476519, "epoch": 5741} {"train_loss": -26.833837509155273, "global_step": 476520, "epoch": 5741} {"train_loss": -26.857526779174805, "global_step": 476521, "epoch": 5741} {"train_loss": -27.36244010925293, "global_step": 476522, "epoch": 5741} {"train_loss": -27.056310653686523, "global_step": 476523, "epoch": 5741} {"train_loss": -26.748403549194336, "global_step": 476524, "epoch": 5741} {"train_loss": -26.95588493347168, "global_step": 476525, "epoch": 5741} {"train_loss": -26.85737419128418, "global_step": 476526, "epoch": 5741} {"train_loss": -27.409381866455078, "global_step": 476527, "epoch": 5741} {"train_loss": -26.981229782104492, "global_step": 476528, "epoch": 5741} {"train_loss": -27.243085861206055, "global_step": 476529, "epoch": 5741} {"train_loss": -26.958410263061523, "global_step": 476530, "epoch": 5741} {"train_loss": -26.967981338500977, "global_step": 476531, "epoch": 5741} {"train_loss": -27.561277389526367, "global_step": 476532, "epoch": 5741} {"train_loss": -27.11516761779785, "global_step": 476533, "epoch": 5741} {"train_loss": -27.15433120727539, "global_step": 476534, "epoch": 5741} {"train_loss": -27.26542091369629, "global_step": 476535, "epoch": 5741} {"train_loss": -26.966785430908203, "global_step": 476536, "epoch": 5741} {"train_loss": -27.691925048828125, "global_step": 476537, "epoch": 5741} {"train_loss": -26.989599227905273, "global_step": 476538, "epoch": 5741} {"train_loss": -27.521276473999023, "global_step": 476539, "epoch": 5741} {"train_loss": -27.3253116607666, "global_step": 476540, "epoch": 5741} {"train_loss": -27.496484756469727, "global_step": 476541, "epoch": 5741} {"train_loss": -27.338109970092773, "global_step": 476542, "epoch": 5741} {"train_loss": -26.93752098083496, "global_step": 476543, "epoch": 5741} {"train_loss": -27.449356079101562, "global_step": 476544, "epoch": 5741} {"train_loss": -27.73187255859375, "global_step": 476545, "epoch": 5741} {"train_loss": -26.9613094329834, "global_step": 476546, "epoch": 5741} {"train_loss": -27.090286254882812, "global_step": 476547, "epoch": 5741} {"train_loss": -27.090734481811523, "global_step": 476548, "epoch": 5741} {"train_loss": -27.151514053344727, "global_step": 476549, "epoch": 5741} {"train_loss": -27.500940322875977, "global_step": 476550, "epoch": 5741} {"train_loss": -27.339813232421875, "global_step": 476551, "epoch": 5741} {"train_loss": -27.523950576782227, "global_step": 476552, "epoch": 5741} {"train_loss": -27.410642623901367, "global_step": 476553, "epoch": 5741} {"train_loss": -27.726308822631836, "global_step": 476554, "epoch": 5741} {"train_loss": -27.668094635009766, "global_step": 476555, "epoch": 5741} {"train_loss": -27.309743881225586, "global_step": 476556, "epoch": 5741} {"train_loss": -27.5076847076416, "global_step": 476557, "epoch": 5741} {"train_loss": -27.498464584350586, "global_step": 476558, "epoch": 5741} {"train_loss": -27.3552303314209, "global_step": 476559, "epoch": 5741} {"train_loss": -27.614288330078125, "global_step": 476560, "epoch": 5741} {"train_loss": -27.136571884155273, "global_step": 476561, "epoch": 5741} {"train_loss": -27.088220596313477, "global_step": 476562, "epoch": 5741} {"train_loss": -26.8397216796875, "global_step": 476563, "epoch": 5741} {"train_loss": -26.90521240234375, "global_step": 476564, "epoch": 5741} {"train_loss": -27.336118698120117, "global_step": 476565, "epoch": 5741} {"train_loss": -26.609790802001953, "global_step": 476566, "epoch": 5741} {"train_loss": -27.176130294799805, "global_step": 476567, "epoch": 5741} {"train_loss": -27.440839767456055, "global_step": 476568, "epoch": 5741} {"train_loss": -27.170948028564453, "global_step": 476569, "epoch": 5741} {"train_loss": -27.17121696472168, "global_step": 476570, "epoch": 5741} {"train_loss": -27.530454635620117, "global_step": 476571, "epoch": 5741} {"train_loss": -27.3133544921875, "global_step": 476572, "epoch": 5741} {"train_loss": -27.30108070373535, "global_step": 476573, "epoch": 5741} {"train_loss": -27.535511016845703, "global_step": 476574, "epoch": 5741} {"train_loss": -27.328474044799805, "global_step": 476575, "epoch": 5741} {"train_loss": -27.986616134643555, "global_step": 476576, "epoch": 5741} {"train_loss": -27.464155197143555, "global_step": 476577, "epoch": 5741} {"train_loss": -27.070905685424805, "global_step": 476578, "epoch": 5741} {"train_loss": -27.3669490814209, "global_step": 476579, "epoch": 5741} {"train_loss": -27.396657943725586, "global_step": 476580, "epoch": 5741} {"train_loss": -27.202234268188477, "global_step": 476581, "epoch": 5741} {"train_loss": -27.143110275268555, "global_step": 476582, "epoch": 5741} {"train_loss": -27.937976837158203, "global_step": 476583, "epoch": 5741} {"train_loss": -27.33363151550293, "global_step": 476584, "epoch": 5741} {"train_loss": -27.147747660257732, "global_step": 476585, "epoch": 5741, "val_loss": 6737592.0} {"train_loss": -26.943912506103516, "global_step": 476586, "epoch": 5742} {"train_loss": -26.276132583618164, "global_step": 476587, "epoch": 5742} {"train_loss": -26.215917587280273, "global_step": 476588, "epoch": 5742} {"train_loss": -25.777023315429688, "global_step": 476589, "epoch": 5742} {"train_loss": -26.03608512878418, "global_step": 476590, "epoch": 5742} {"train_loss": -26.70049476623535, "global_step": 476591, "epoch": 5742} {"train_loss": -25.95588493347168, "global_step": 476592, "epoch": 5742} {"train_loss": -26.648609161376953, "global_step": 476593, "epoch": 5742} {"train_loss": -26.59515380859375, "global_step": 476594, "epoch": 5742} {"train_loss": -26.426483154296875, "global_step": 476595, "epoch": 5742} {"train_loss": -27.00929069519043, "global_step": 476596, "epoch": 5742} {"train_loss": -26.639616012573242, "global_step": 476597, "epoch": 5742} {"train_loss": -26.127426147460938, "global_step": 476598, "epoch": 5742} {"train_loss": -26.717985153198242, "global_step": 476599, "epoch": 5742} {"train_loss": -26.72187614440918, "global_step": 476600, "epoch": 5742} {"train_loss": -26.34442710876465, "global_step": 476601, "epoch": 5742} {"train_loss": -26.8856143951416, "global_step": 476602, "epoch": 5742} {"train_loss": -26.73243522644043, "global_step": 476603, "epoch": 5742} {"train_loss": -26.789478302001953, "global_step": 476604, "epoch": 5742} {"train_loss": -26.86739158630371, "global_step": 476605, "epoch": 5742} {"train_loss": -26.920522689819336, "global_step": 476606, "epoch": 5742} {"train_loss": -26.84515953063965, "global_step": 476607, "epoch": 5742} {"train_loss": -27.0203857421875, "global_step": 476608, "epoch": 5742} {"train_loss": -27.44748306274414, "global_step": 476609, "epoch": 5742} {"train_loss": -26.833524703979492, "global_step": 476610, "epoch": 5742} {"train_loss": -27.087692260742188, "global_step": 476611, "epoch": 5742} {"train_loss": -26.97818946838379, "global_step": 476612, "epoch": 5742} {"train_loss": -26.76517105102539, "global_step": 476613, "epoch": 5742} {"train_loss": -26.784406661987305, "global_step": 476614, "epoch": 5742} {"train_loss": -26.977956771850586, "global_step": 476615, "epoch": 5742} {"train_loss": -26.734619140625, "global_step": 476616, "epoch": 5742} {"train_loss": -26.658655166625977, "global_step": 476617, "epoch": 5742} {"train_loss": -26.962833404541016, "global_step": 476618, "epoch": 5742} {"train_loss": -27.21260643005371, "global_step": 476619, "epoch": 5742} {"train_loss": -27.440526962280273, "global_step": 476620, "epoch": 5742} {"train_loss": -27.051401138305664, "global_step": 476621, "epoch": 5742} {"train_loss": -26.971973419189453, "global_step": 476622, "epoch": 5742} {"train_loss": -27.227432250976562, "global_step": 476623, "epoch": 5742} {"train_loss": -26.880817413330078, "global_step": 476624, "epoch": 5742} {"train_loss": -27.42439079284668, "global_step": 476625, "epoch": 5742} {"train_loss": -27.113052368164062, "global_step": 476626, "epoch": 5742} {"train_loss": -26.7684268951416, "global_step": 476627, "epoch": 5742} {"train_loss": -26.821996688842773, "global_step": 476628, "epoch": 5742} {"train_loss": -27.180150985717773, "global_step": 476629, "epoch": 5742} {"train_loss": -27.258071899414062, "global_step": 476630, "epoch": 5742} {"train_loss": -27.290985107421875, "global_step": 476631, "epoch": 5742} {"train_loss": -27.40464210510254, "global_step": 476632, "epoch": 5742} {"train_loss": -27.218164443969727, "global_step": 476633, "epoch": 5742} {"train_loss": -27.39751625061035, "global_step": 476634, "epoch": 5742} {"train_loss": -27.252887725830078, "global_step": 476635, "epoch": 5742} {"train_loss": -27.10371208190918, "global_step": 476636, "epoch": 5742} {"train_loss": -27.412702560424805, "global_step": 476637, "epoch": 5742} {"train_loss": -26.948505401611328, "global_step": 476638, "epoch": 5742} {"train_loss": -27.476545333862305, "global_step": 476639, "epoch": 5742} {"train_loss": -27.136083602905273, "global_step": 476640, "epoch": 5742} {"train_loss": -27.415109634399414, "global_step": 476641, "epoch": 5742} {"train_loss": -27.196048736572266, "global_step": 476642, "epoch": 5742} {"train_loss": -27.289899826049805, "global_step": 476643, "epoch": 5742} {"train_loss": -27.6646785736084, "global_step": 476644, "epoch": 5742} {"train_loss": -27.361108779907227, "global_step": 476645, "epoch": 5742} {"train_loss": -27.712604522705078, "global_step": 476646, "epoch": 5742} {"train_loss": -27.10395622253418, "global_step": 476647, "epoch": 5742} {"train_loss": -27.244192123413086, "global_step": 476648, "epoch": 5742} {"train_loss": -27.2753963470459, "global_step": 476649, "epoch": 5742} {"train_loss": -27.503131866455078, "global_step": 476650, "epoch": 5742} {"train_loss": -27.100866317749023, "global_step": 476651, "epoch": 5742} {"train_loss": -27.29852294921875, "global_step": 476652, "epoch": 5742} {"train_loss": -27.637664794921875, "global_step": 476653, "epoch": 5742} {"train_loss": -27.523834228515625, "global_step": 476654, "epoch": 5742} {"train_loss": -27.22332763671875, "global_step": 476655, "epoch": 5742} {"train_loss": -27.5684871673584, "global_step": 476656, "epoch": 5742} {"train_loss": -27.252145767211914, "global_step": 476657, "epoch": 5742} {"train_loss": -27.01881217956543, "global_step": 476658, "epoch": 5742} {"train_loss": -27.4481201171875, "global_step": 476659, "epoch": 5742} {"train_loss": -27.377124786376953, "global_step": 476660, "epoch": 5742} {"train_loss": -27.203439712524414, "global_step": 476661, "epoch": 5742} {"train_loss": -27.352874755859375, "global_step": 476662, "epoch": 5742} {"train_loss": -26.892194747924805, "global_step": 476663, "epoch": 5742} {"train_loss": -27.61176872253418, "global_step": 476664, "epoch": 5742} {"train_loss": -27.167240142822266, "global_step": 476665, "epoch": 5742} {"train_loss": -27.33790397644043, "global_step": 476666, "epoch": 5742} {"train_loss": -27.292455673217773, "global_step": 476667, "epoch": 5742} {"train_loss": -27.042177889720502, "global_step": 476668, "epoch": 5742, "val_loss": 6684563.0} {"train_loss": -27.15131187438965, "global_step": 476669, "epoch": 5743} {"train_loss": -27.094343185424805, "global_step": 476670, "epoch": 5743} {"train_loss": -27.282379150390625, "global_step": 476671, "epoch": 5743} {"train_loss": -26.757587432861328, "global_step": 476672, "epoch": 5743} {"train_loss": -26.789011001586914, "global_step": 476673, "epoch": 5743} {"train_loss": -27.395965576171875, "global_step": 476674, "epoch": 5743} {"train_loss": -26.803159713745117, "global_step": 476675, "epoch": 5743} {"train_loss": -27.129907608032227, "global_step": 476676, "epoch": 5743} {"train_loss": -26.732257843017578, "global_step": 476677, "epoch": 5743} {"train_loss": -27.08418846130371, "global_step": 476678, "epoch": 5743} {"train_loss": -27.10175895690918, "global_step": 476679, "epoch": 5743} {"train_loss": -27.0349178314209, "global_step": 476680, "epoch": 5743} {"train_loss": -27.154895782470703, "global_step": 476681, "epoch": 5743} {"train_loss": -27.429412841796875, "global_step": 476682, "epoch": 5743} {"train_loss": -26.874042510986328, "global_step": 476683, "epoch": 5743} {"train_loss": -27.147424697875977, "global_step": 476684, "epoch": 5743} {"train_loss": -26.65277099609375, "global_step": 476685, "epoch": 5743} {"train_loss": -27.038116455078125, "global_step": 476686, "epoch": 5743} {"train_loss": -27.464330673217773, "global_step": 476687, "epoch": 5743} {"train_loss": -27.162647247314453, "global_step": 476688, "epoch": 5743} {"train_loss": -27.008420944213867, "global_step": 476689, "epoch": 5743} {"train_loss": -26.528234481811523, "global_step": 476690, "epoch": 5743} {"train_loss": -26.833154678344727, "global_step": 476691, "epoch": 5743} {"train_loss": -27.021081924438477, "global_step": 476692, "epoch": 5743} {"train_loss": -27.056684494018555, "global_step": 476693, "epoch": 5743} {"train_loss": -27.090717315673828, "global_step": 476694, "epoch": 5743} {"train_loss": -26.95892906188965, "global_step": 476695, "epoch": 5743} {"train_loss": -27.172712326049805, "global_step": 476696, "epoch": 5743} {"train_loss": -27.151336669921875, "global_step": 476697, "epoch": 5743} {"train_loss": -27.199127197265625, "global_step": 476698, "epoch": 5743} {"train_loss": -27.17892837524414, "global_step": 476699, "epoch": 5743} {"train_loss": -27.14691734313965, "global_step": 476700, "epoch": 5743} {"train_loss": -27.29408073425293, "global_step": 476701, "epoch": 5743} {"train_loss": -27.287878036499023, "global_step": 476702, "epoch": 5743} {"train_loss": -27.294214248657227, "global_step": 476703, "epoch": 5743} {"train_loss": -27.268346786499023, "global_step": 476704, "epoch": 5743} {"train_loss": -27.016462326049805, "global_step": 476705, "epoch": 5743} {"train_loss": -26.959842681884766, "global_step": 476706, "epoch": 5743} {"train_loss": -27.45171546936035, "global_step": 476707, "epoch": 5743} {"train_loss": -26.75554847717285, "global_step": 476708, "epoch": 5743} {"train_loss": -26.652591705322266, "global_step": 476709, "epoch": 5743} {"train_loss": -26.947341918945312, "global_step": 476710, "epoch": 5743} {"train_loss": -26.986419677734375, "global_step": 476711, "epoch": 5743} {"train_loss": -27.271442413330078, "global_step": 476712, "epoch": 5743} {"train_loss": -27.437856674194336, "global_step": 476713, "epoch": 5743} {"train_loss": -27.68155860900879, "global_step": 476714, "epoch": 5743} {"train_loss": -27.34050941467285, "global_step": 476715, "epoch": 5743} {"train_loss": -27.067296981811523, "global_step": 476716, "epoch": 5743} {"train_loss": -27.6367244720459, "global_step": 476717, "epoch": 5743} {"train_loss": -27.440153121948242, "global_step": 476718, "epoch": 5743} {"train_loss": -27.265954971313477, "global_step": 476719, "epoch": 5743} {"train_loss": -27.159170150756836, "global_step": 476720, "epoch": 5743} {"train_loss": -27.525821685791016, "global_step": 476721, "epoch": 5743} {"train_loss": -27.12473487854004, "global_step": 476722, "epoch": 5743} {"train_loss": -27.410367965698242, "global_step": 476723, "epoch": 5743} {"train_loss": -27.0756893157959, "global_step": 476724, "epoch": 5743} {"train_loss": -27.32986831665039, "global_step": 476725, "epoch": 5743} {"train_loss": -27.073816299438477, "global_step": 476726, "epoch": 5743} {"train_loss": -27.46649742126465, "global_step": 476727, "epoch": 5743} {"train_loss": -26.897748947143555, "global_step": 476728, "epoch": 5743} {"train_loss": -27.028305053710938, "global_step": 476729, "epoch": 5743} {"train_loss": -27.527624130249023, "global_step": 476730, "epoch": 5743} {"train_loss": -27.085708618164062, "global_step": 476731, "epoch": 5743} {"train_loss": -27.42499351501465, "global_step": 476732, "epoch": 5743} {"train_loss": -27.407184600830078, "global_step": 476733, "epoch": 5743} {"train_loss": -26.958951950073242, "global_step": 476734, "epoch": 5743} {"train_loss": -27.43039321899414, "global_step": 476735, "epoch": 5743} {"train_loss": -27.305988311767578, "global_step": 476736, "epoch": 5743} {"train_loss": -27.522998809814453, "global_step": 476737, "epoch": 5743} {"train_loss": -27.284696578979492, "global_step": 476738, "epoch": 5743} {"train_loss": -27.40409278869629, "global_step": 476739, "epoch": 5743} {"train_loss": -27.3707275390625, "global_step": 476740, "epoch": 5743} {"train_loss": -27.449310302734375, "global_step": 476741, "epoch": 5743} {"train_loss": -27.05634117126465, "global_step": 476742, "epoch": 5743} {"train_loss": -27.50066566467285, "global_step": 476743, "epoch": 5743} {"train_loss": -27.451208114624023, "global_step": 476744, "epoch": 5743} {"train_loss": -27.368188858032227, "global_step": 476745, "epoch": 5743} {"train_loss": -27.424768447875977, "global_step": 476746, "epoch": 5743} {"train_loss": -26.734907150268555, "global_step": 476747, "epoch": 5743} {"train_loss": -27.456281661987305, "global_step": 476748, "epoch": 5743} {"train_loss": -27.051061630249023, "global_step": 476749, "epoch": 5743} {"train_loss": -27.246183395385742, "global_step": 476750, "epoch": 5743} {"train_loss": -27.160861440451747, "global_step": 476751, "epoch": 5743, "val_loss": 6785700.5} {"train_loss": -26.775049209594727, "global_step": 476752, "epoch": 5744} {"train_loss": -26.153772354125977, "global_step": 476753, "epoch": 5744} {"train_loss": -26.262765884399414, "global_step": 476754, "epoch": 5744} {"train_loss": -26.145227432250977, "global_step": 476755, "epoch": 5744} {"train_loss": -26.932470321655273, "global_step": 476756, "epoch": 5744} {"train_loss": -26.149524688720703, "global_step": 476757, "epoch": 5744} {"train_loss": -25.853912353515625, "global_step": 476758, "epoch": 5744} {"train_loss": -27.015872955322266, "global_step": 476759, "epoch": 5744} {"train_loss": -26.824369430541992, "global_step": 476760, "epoch": 5744} {"train_loss": -26.287805557250977, "global_step": 476761, "epoch": 5744} {"train_loss": -27.039264678955078, "global_step": 476762, "epoch": 5744} {"train_loss": -26.5636043548584, "global_step": 476763, "epoch": 5744} {"train_loss": -26.787805557250977, "global_step": 476764, "epoch": 5744} {"train_loss": -26.923276901245117, "global_step": 476765, "epoch": 5744} {"train_loss": -27.2294921875, "global_step": 476766, "epoch": 5744} {"train_loss": -26.9966983795166, "global_step": 476767, "epoch": 5744} {"train_loss": -27.255298614501953, "global_step": 476768, "epoch": 5744} {"train_loss": -26.796438217163086, "global_step": 476769, "epoch": 5744} {"train_loss": -27.13788414001465, "global_step": 476770, "epoch": 5744} {"train_loss": -27.054014205932617, "global_step": 476771, "epoch": 5744} {"train_loss": -26.855627059936523, "global_step": 476772, "epoch": 5744} {"train_loss": -27.0398006439209, "global_step": 476773, "epoch": 5744} {"train_loss": -27.284154891967773, "global_step": 476774, "epoch": 5744} {"train_loss": -27.094099044799805, "global_step": 476775, "epoch": 5744} {"train_loss": -27.230670928955078, "global_step": 476776, "epoch": 5744} {"train_loss": -27.695560455322266, "global_step": 476777, "epoch": 5744} {"train_loss": -26.800119400024414, "global_step": 476778, "epoch": 5744} {"train_loss": -27.28778076171875, "global_step": 476779, "epoch": 5744} {"train_loss": -27.084980010986328, "global_step": 476780, "epoch": 5744} {"train_loss": -27.09710121154785, "global_step": 476781, "epoch": 5744} {"train_loss": -26.869827270507812, "global_step": 476782, "epoch": 5744} {"train_loss": -27.065778732299805, "global_step": 476783, "epoch": 5744} {"train_loss": -26.970300674438477, "global_step": 476784, "epoch": 5744} {"train_loss": -26.989288330078125, "global_step": 476785, "epoch": 5744} {"train_loss": -27.185598373413086, "global_step": 476786, "epoch": 5744} {"train_loss": -27.0726375579834, "global_step": 476787, "epoch": 5744} {"train_loss": -26.86311149597168, "global_step": 476788, "epoch": 5744} {"train_loss": -27.354511260986328, "global_step": 476789, "epoch": 5744} {"train_loss": -27.014982223510742, "global_step": 476790, "epoch": 5744} {"train_loss": -27.176427841186523, "global_step": 476791, "epoch": 5744} {"train_loss": -27.215194702148438, "global_step": 476792, "epoch": 5744} {"train_loss": -27.522851943969727, "global_step": 476793, "epoch": 5744} {"train_loss": -27.231107711791992, "global_step": 476794, "epoch": 5744} {"train_loss": -27.118539810180664, "global_step": 476795, "epoch": 5744} {"train_loss": -27.427881240844727, "global_step": 476796, "epoch": 5744} {"train_loss": -27.315710067749023, "global_step": 476797, "epoch": 5744} {"train_loss": -27.012104034423828, "global_step": 476798, "epoch": 5744} {"train_loss": -27.31959342956543, "global_step": 476799, "epoch": 5744} {"train_loss": -27.30256462097168, "global_step": 476800, "epoch": 5744} {"train_loss": -27.402759552001953, "global_step": 476801, "epoch": 5744} {"train_loss": -27.06097412109375, "global_step": 476802, "epoch": 5744} {"train_loss": -27.312088012695312, "global_step": 476803, "epoch": 5744} {"train_loss": -27.62869644165039, "global_step": 476804, "epoch": 5744} {"train_loss": -27.1370849609375, "global_step": 476805, "epoch": 5744} {"train_loss": -27.30377769470215, "global_step": 476806, "epoch": 5744} {"train_loss": -27.487546920776367, "global_step": 476807, "epoch": 5744} {"train_loss": -27.18938636779785, "global_step": 476808, "epoch": 5744} {"train_loss": -27.318273544311523, "global_step": 476809, "epoch": 5744} {"train_loss": -27.539596557617188, "global_step": 476810, "epoch": 5744} {"train_loss": -27.538986206054688, "global_step": 476811, "epoch": 5744} {"train_loss": -27.288671493530273, "global_step": 476812, "epoch": 5744} {"train_loss": -27.494308471679688, "global_step": 476813, "epoch": 5744} {"train_loss": -27.168048858642578, "global_step": 476814, "epoch": 5744} {"train_loss": -27.51376724243164, "global_step": 476815, "epoch": 5744} {"train_loss": -27.357519149780273, "global_step": 476816, "epoch": 5744} {"train_loss": -27.299192428588867, "global_step": 476817, "epoch": 5744} {"train_loss": -27.510007858276367, "global_step": 476818, "epoch": 5744} {"train_loss": -27.298389434814453, "global_step": 476819, "epoch": 5744} {"train_loss": -27.17958641052246, "global_step": 476820, "epoch": 5744} {"train_loss": -27.22625160217285, "global_step": 476821, "epoch": 5744} {"train_loss": -27.114501953125, "global_step": 476822, "epoch": 5744} {"train_loss": -27.242218017578125, "global_step": 476823, "epoch": 5744} {"train_loss": -27.227460861206055, "global_step": 476824, "epoch": 5744} {"train_loss": -27.20088005065918, "global_step": 476825, "epoch": 5744} {"train_loss": -27.522974014282227, "global_step": 476826, "epoch": 5744} {"train_loss": -27.570539474487305, "global_step": 476827, "epoch": 5744} {"train_loss": -27.452604293823242, "global_step": 476828, "epoch": 5744} {"train_loss": -27.60101890563965, "global_step": 476829, "epoch": 5744} {"train_loss": -27.05682945251465, "global_step": 476830, "epoch": 5744} {"train_loss": -27.79794692993164, "global_step": 476831, "epoch": 5744} {"train_loss": -27.78497886657715, "global_step": 476832, "epoch": 5744} {"train_loss": -27.38197135925293, "global_step": 476833, "epoch": 5744} {"train_loss": -27.13547862868711, "global_step": 476834, "epoch": 5744, "val_loss": 6698725.0} {"train_loss": -26.64338493347168, "global_step": 476835, "epoch": 5745} {"train_loss": -27.116809844970703, "global_step": 476836, "epoch": 5745} {"train_loss": -26.1478328704834, "global_step": 476837, "epoch": 5745} {"train_loss": -26.651504516601562, "global_step": 476838, "epoch": 5745} {"train_loss": -26.775272369384766, "global_step": 476839, "epoch": 5745} {"train_loss": -27.05097770690918, "global_step": 476840, "epoch": 5745} {"train_loss": -25.931222915649414, "global_step": 476841, "epoch": 5745} {"train_loss": -26.774641036987305, "global_step": 476842, "epoch": 5745} {"train_loss": -26.222702026367188, "global_step": 476843, "epoch": 5745} {"train_loss": -26.58981704711914, "global_step": 476844, "epoch": 5745} {"train_loss": -27.0812931060791, "global_step": 476845, "epoch": 5745} {"train_loss": -26.965763092041016, "global_step": 476846, "epoch": 5745} {"train_loss": -26.841323852539062, "global_step": 476847, "epoch": 5745} {"train_loss": -27.22698402404785, "global_step": 476848, "epoch": 5745} {"train_loss": -27.062849044799805, "global_step": 476849, "epoch": 5745} {"train_loss": -27.03214454650879, "global_step": 476850, "epoch": 5745} {"train_loss": -27.235986709594727, "global_step": 476851, "epoch": 5745} {"train_loss": -27.136062622070312, "global_step": 476852, "epoch": 5745} {"train_loss": -26.974512100219727, "global_step": 476853, "epoch": 5745} {"train_loss": -27.079864501953125, "global_step": 476854, "epoch": 5745} {"train_loss": -27.154016494750977, "global_step": 476855, "epoch": 5745} {"train_loss": -27.0157413482666, "global_step": 476856, "epoch": 5745} {"train_loss": -27.337390899658203, "global_step": 476857, "epoch": 5745} {"train_loss": -27.075963973999023, "global_step": 476858, "epoch": 5745} {"train_loss": -27.039569854736328, "global_step": 476859, "epoch": 5745} {"train_loss": -27.037317276000977, "global_step": 476860, "epoch": 5745} {"train_loss": -27.352060317993164, "global_step": 476861, "epoch": 5745} {"train_loss": -27.35113525390625, "global_step": 476862, "epoch": 5745} {"train_loss": -26.944772720336914, "global_step": 476863, "epoch": 5745} {"train_loss": -27.585113525390625, "global_step": 476864, "epoch": 5745} {"train_loss": -27.08086585998535, "global_step": 476865, "epoch": 5745} {"train_loss": -26.97818374633789, "global_step": 476866, "epoch": 5745} {"train_loss": -27.337045669555664, "global_step": 476867, "epoch": 5745} {"train_loss": -27.42816162109375, "global_step": 476868, "epoch": 5745} {"train_loss": -27.007898330688477, "global_step": 476869, "epoch": 5745} {"train_loss": -27.13324546813965, "global_step": 476870, "epoch": 5745} {"train_loss": -27.205310821533203, "global_step": 476871, "epoch": 5745} {"train_loss": -27.636510848999023, "global_step": 476872, "epoch": 5745} {"train_loss": -27.153583526611328, "global_step": 476873, "epoch": 5745} {"train_loss": -27.173471450805664, "global_step": 476874, "epoch": 5745} {"train_loss": -27.316701889038086, "global_step": 476875, "epoch": 5745} {"train_loss": -27.627843856811523, "global_step": 476876, "epoch": 5745} {"train_loss": -27.1734561920166, "global_step": 476877, "epoch": 5745} {"train_loss": -27.36353874206543, "global_step": 476878, "epoch": 5745} {"train_loss": -27.81903648376465, "global_step": 476879, "epoch": 5745} {"train_loss": -27.740036010742188, "global_step": 476880, "epoch": 5745} {"train_loss": -27.592504501342773, "global_step": 476881, "epoch": 5745} {"train_loss": -27.68134117126465, "global_step": 476882, "epoch": 5745} {"train_loss": -27.540014266967773, "global_step": 476883, "epoch": 5745} {"train_loss": -27.239013671875, "global_step": 476884, "epoch": 5745} {"train_loss": -26.74184226989746, "global_step": 476885, "epoch": 5745} {"train_loss": -26.890771865844727, "global_step": 476886, "epoch": 5745} {"train_loss": -27.265735626220703, "global_step": 476887, "epoch": 5745} {"train_loss": -27.457935333251953, "global_step": 476888, "epoch": 5745} {"train_loss": -27.143054962158203, "global_step": 476889, "epoch": 5745} {"train_loss": -27.134550094604492, "global_step": 476890, "epoch": 5745} {"train_loss": -26.789758682250977, "global_step": 476891, "epoch": 5745} {"train_loss": -26.21406364440918, "global_step": 476892, "epoch": 5745} {"train_loss": -25.8281307220459, "global_step": 476893, "epoch": 5745} {"train_loss": -25.66778564453125, "global_step": 476894, "epoch": 5745} {"train_loss": -27.4278564453125, "global_step": 476895, "epoch": 5745} {"train_loss": -26.338245391845703, "global_step": 476896, "epoch": 5745} {"train_loss": -25.897266387939453, "global_step": 476897, "epoch": 5745} {"train_loss": -27.023212432861328, "global_step": 476898, "epoch": 5745} {"train_loss": -26.3719539642334, "global_step": 476899, "epoch": 5745} {"train_loss": -27.397907257080078, "global_step": 476900, "epoch": 5745} {"train_loss": -26.544836044311523, "global_step": 476901, "epoch": 5745} {"train_loss": -26.84384536743164, "global_step": 476902, "epoch": 5745} {"train_loss": -26.710073471069336, "global_step": 476903, "epoch": 5745} {"train_loss": -26.28330421447754, "global_step": 476904, "epoch": 5745} {"train_loss": -27.015796661376953, "global_step": 476905, "epoch": 5745} {"train_loss": -26.72881507873535, "global_step": 476906, "epoch": 5745} {"train_loss": -27.263916015625, "global_step": 476907, "epoch": 5745} {"train_loss": -26.86751365661621, "global_step": 476908, "epoch": 5745} {"train_loss": -26.93988609313965, "global_step": 476909, "epoch": 5745} {"train_loss": -27.537561416625977, "global_step": 476910, "epoch": 5745} {"train_loss": -26.565305709838867, "global_step": 476911, "epoch": 5745} {"train_loss": -27.015966415405273, "global_step": 476912, "epoch": 5745} {"train_loss": -27.332263946533203, "global_step": 476913, "epoch": 5745} {"train_loss": -26.973844528198242, "global_step": 476914, "epoch": 5745} {"train_loss": -26.834264755249023, "global_step": 476915, "epoch": 5745} {"train_loss": -26.771991729736328, "global_step": 476916, "epoch": 5745} {"train_loss": -27.011251817266626, "global_step": 476917, "epoch": 5745, "val_loss": 6600155.0} {"train_loss": -26.81374168395996, "global_step": 476918, "epoch": 5746} {"train_loss": -26.987567901611328, "global_step": 476919, "epoch": 5746} {"train_loss": -26.97648048400879, "global_step": 476920, "epoch": 5746} {"train_loss": -26.939716339111328, "global_step": 476921, "epoch": 5746} {"train_loss": -26.939725875854492, "global_step": 476922, "epoch": 5746} {"train_loss": -26.410999298095703, "global_step": 476923, "epoch": 5746} {"train_loss": -26.935400009155273, "global_step": 476924, "epoch": 5746} {"train_loss": -26.575428009033203, "global_step": 476925, "epoch": 5746} {"train_loss": -26.503095626831055, "global_step": 476926, "epoch": 5746} {"train_loss": -27.124469757080078, "global_step": 476927, "epoch": 5746} {"train_loss": -26.762380599975586, "global_step": 476928, "epoch": 5746} {"train_loss": -26.71965980529785, "global_step": 476929, "epoch": 5746} {"train_loss": -27.099002838134766, "global_step": 476930, "epoch": 5746} {"train_loss": -26.752429962158203, "global_step": 476931, "epoch": 5746} {"train_loss": -26.967161178588867, "global_step": 476932, "epoch": 5746} {"train_loss": -27.052473068237305, "global_step": 476933, "epoch": 5746} {"train_loss": -26.9899959564209, "global_step": 476934, "epoch": 5746} {"train_loss": -27.080169677734375, "global_step": 476935, "epoch": 5746} {"train_loss": -27.17233657836914, "global_step": 476936, "epoch": 5746} {"train_loss": -27.118330001831055, "global_step": 476937, "epoch": 5746} {"train_loss": -27.367950439453125, "global_step": 476938, "epoch": 5746} {"train_loss": -27.303497314453125, "global_step": 476939, "epoch": 5746} {"train_loss": -27.193464279174805, "global_step": 476940, "epoch": 5746} {"train_loss": -26.62946128845215, "global_step": 476941, "epoch": 5746} {"train_loss": -27.13134765625, "global_step": 476942, "epoch": 5746} {"train_loss": -27.055530548095703, "global_step": 476943, "epoch": 5746} {"train_loss": -27.229772567749023, "global_step": 476944, "epoch": 5746} {"train_loss": -27.225439071655273, "global_step": 476945, "epoch": 5746} {"train_loss": -26.887571334838867, "global_step": 476946, "epoch": 5746} {"train_loss": -27.276782989501953, "global_step": 476947, "epoch": 5746} {"train_loss": -27.511743545532227, "global_step": 476948, "epoch": 5746} {"train_loss": -27.142425537109375, "global_step": 476949, "epoch": 5746} {"train_loss": -27.430912017822266, "global_step": 476950, "epoch": 5746} {"train_loss": -27.090545654296875, "global_step": 476951, "epoch": 5746} {"train_loss": -26.980539321899414, "global_step": 476952, "epoch": 5746} {"train_loss": -27.280029296875, "global_step": 476953, "epoch": 5746} {"train_loss": -27.10626792907715, "global_step": 476954, "epoch": 5746} {"train_loss": -27.195907592773438, "global_step": 476955, "epoch": 5746} {"train_loss": -27.1606502532959, "global_step": 476956, "epoch": 5746} {"train_loss": -27.148456573486328, "global_step": 476957, "epoch": 5746} {"train_loss": -27.482269287109375, "global_step": 476958, "epoch": 5746} {"train_loss": -27.13771629333496, "global_step": 476959, "epoch": 5746} {"train_loss": -27.463071823120117, "global_step": 476960, "epoch": 5746} {"train_loss": -27.403745651245117, "global_step": 476961, "epoch": 5746} {"train_loss": -27.215045928955078, "global_step": 476962, "epoch": 5746} {"train_loss": -26.95556640625, "global_step": 476963, "epoch": 5746} {"train_loss": -27.13868522644043, "global_step": 476964, "epoch": 5746} {"train_loss": -26.702123641967773, "global_step": 476965, "epoch": 5746} {"train_loss": -26.593368530273438, "global_step": 476966, "epoch": 5746} {"train_loss": -26.50446128845215, "global_step": 476967, "epoch": 5746} {"train_loss": -26.796405792236328, "global_step": 476968, "epoch": 5746} {"train_loss": -26.8184871673584, "global_step": 476969, "epoch": 5746} {"train_loss": -27.26654052734375, "global_step": 476970, "epoch": 5746} {"train_loss": -26.56394386291504, "global_step": 476971, "epoch": 5746} {"train_loss": -26.94019889831543, "global_step": 476972, "epoch": 5746} {"train_loss": -27.262664794921875, "global_step": 476973, "epoch": 5746} {"train_loss": -27.019216537475586, "global_step": 476974, "epoch": 5746} {"train_loss": -26.7812557220459, "global_step": 476975, "epoch": 5746} {"train_loss": -27.269567489624023, "global_step": 476976, "epoch": 5746} {"train_loss": -27.299631118774414, "global_step": 476977, "epoch": 5746} {"train_loss": -27.357168197631836, "global_step": 476978, "epoch": 5746} {"train_loss": -27.255346298217773, "global_step": 476979, "epoch": 5746} {"train_loss": -27.232013702392578, "global_step": 476980, "epoch": 5746} {"train_loss": -27.166915893554688, "global_step": 476981, "epoch": 5746} {"train_loss": -27.326955795288086, "global_step": 476982, "epoch": 5746} {"train_loss": -27.6138916015625, "global_step": 476983, "epoch": 5746} {"train_loss": -27.502735137939453, "global_step": 476984, "epoch": 5746} {"train_loss": -26.85481071472168, "global_step": 476985, "epoch": 5746} {"train_loss": -27.146448135375977, "global_step": 476986, "epoch": 5746} {"train_loss": -27.191953659057617, "global_step": 476987, "epoch": 5746} {"train_loss": -27.285669326782227, "global_step": 476988, "epoch": 5746} {"train_loss": -27.135059356689453, "global_step": 476989, "epoch": 5746} {"train_loss": -27.363340377807617, "global_step": 476990, "epoch": 5746} {"train_loss": -27.010791778564453, "global_step": 476991, "epoch": 5746} {"train_loss": -27.152692794799805, "global_step": 476992, "epoch": 5746} {"train_loss": -27.078195571899414, "global_step": 476993, "epoch": 5746} {"train_loss": -27.15028190612793, "global_step": 476994, "epoch": 5746} {"train_loss": -27.5717716217041, "global_step": 476995, "epoch": 5746} {"train_loss": -27.5846004486084, "global_step": 476996, "epoch": 5746} {"train_loss": -27.090986251831055, "global_step": 476997, "epoch": 5746} {"train_loss": -27.263019561767578, "global_step": 476998, "epoch": 5746} {"train_loss": -26.977197647094727, "global_step": 476999, "epoch": 5746} {"train_loss": -27.095959973622517, "global_step": 477000, "epoch": 5746, "val_loss": 6583064.0} {"train_loss": -27.157806396484375, "global_step": 477001, "epoch": 5747} {"train_loss": -25.865339279174805, "global_step": 477002, "epoch": 5747} {"train_loss": -26.559574127197266, "global_step": 477003, "epoch": 5747} {"train_loss": -27.073205947875977, "global_step": 477004, "epoch": 5747} {"train_loss": -25.629613876342773, "global_step": 477005, "epoch": 5747} {"train_loss": -26.6227970123291, "global_step": 477006, "epoch": 5747} {"train_loss": -26.565093994140625, "global_step": 477007, "epoch": 5747} {"train_loss": -26.645349502563477, "global_step": 477008, "epoch": 5747} {"train_loss": -26.7623233795166, "global_step": 477009, "epoch": 5747} {"train_loss": -26.727014541625977, "global_step": 477010, "epoch": 5747} {"train_loss": -26.9631290435791, "global_step": 477011, "epoch": 5747} {"train_loss": -27.096282958984375, "global_step": 477012, "epoch": 5747} {"train_loss": -26.903120040893555, "global_step": 477013, "epoch": 5747} {"train_loss": -26.796649932861328, "global_step": 477014, "epoch": 5747} {"train_loss": -26.663930892944336, "global_step": 477015, "epoch": 5747} {"train_loss": -27.171356201171875, "global_step": 477016, "epoch": 5747} {"train_loss": -26.66813087463379, "global_step": 477017, "epoch": 5747} {"train_loss": -27.203317642211914, "global_step": 477018, "epoch": 5747} {"train_loss": -27.046804428100586, "global_step": 477019, "epoch": 5747} {"train_loss": -26.82303810119629, "global_step": 477020, "epoch": 5747} {"train_loss": -26.96380043029785, "global_step": 477021, "epoch": 5747} {"train_loss": -26.733997344970703, "global_step": 477022, "epoch": 5747} {"train_loss": -26.70387077331543, "global_step": 477023, "epoch": 5747} {"train_loss": -26.719348907470703, "global_step": 477024, "epoch": 5747} {"train_loss": -27.345966339111328, "global_step": 477025, "epoch": 5747} {"train_loss": -27.190948486328125, "global_step": 477026, "epoch": 5747} {"train_loss": -27.565771102905273, "global_step": 477027, "epoch": 5747} {"train_loss": -27.109603881835938, "global_step": 477028, "epoch": 5747} {"train_loss": -26.752429962158203, "global_step": 477029, "epoch": 5747} {"train_loss": -27.398801803588867, "global_step": 477030, "epoch": 5747} {"train_loss": -27.1176815032959, "global_step": 477031, "epoch": 5747} {"train_loss": -27.15740394592285, "global_step": 477032, "epoch": 5747} {"train_loss": -26.768173217773438, "global_step": 477033, "epoch": 5747} {"train_loss": -27.088703155517578, "global_step": 477034, "epoch": 5747} {"train_loss": -27.004987716674805, "global_step": 477035, "epoch": 5747} {"train_loss": -27.405439376831055, "global_step": 477036, "epoch": 5747} {"train_loss": -27.23638343811035, "global_step": 477037, "epoch": 5747} {"train_loss": -27.45867919921875, "global_step": 477038, "epoch": 5747} {"train_loss": -27.10548210144043, "global_step": 477039, "epoch": 5747} {"train_loss": -27.1230411529541, "global_step": 477040, "epoch": 5747} {"train_loss": -27.400562286376953, "global_step": 477041, "epoch": 5747} {"train_loss": -26.99236488342285, "global_step": 477042, "epoch": 5747} {"train_loss": -27.385534286499023, "global_step": 477043, "epoch": 5747} {"train_loss": -27.300573348999023, "global_step": 477044, "epoch": 5747} {"train_loss": -27.657201766967773, "global_step": 477045, "epoch": 5747} {"train_loss": -27.19524574279785, "global_step": 477046, "epoch": 5747} {"train_loss": -27.538251876831055, "global_step": 477047, "epoch": 5747} {"train_loss": -27.097509384155273, "global_step": 477048, "epoch": 5747} {"train_loss": -27.412927627563477, "global_step": 477049, "epoch": 5747} {"train_loss": -27.81296157836914, "global_step": 477050, "epoch": 5747} {"train_loss": -27.417861938476562, "global_step": 477051, "epoch": 5747} {"train_loss": -27.05875587463379, "global_step": 477052, "epoch": 5747} {"train_loss": -27.1811580657959, "global_step": 477053, "epoch": 5747} {"train_loss": -27.255422592163086, "global_step": 477054, "epoch": 5747} {"train_loss": -27.300241470336914, "global_step": 477055, "epoch": 5747} {"train_loss": -27.0606746673584, "global_step": 477056, "epoch": 5747} {"train_loss": -27.427698135375977, "global_step": 477057, "epoch": 5747} {"train_loss": -27.17970848083496, "global_step": 477058, "epoch": 5747} {"train_loss": -27.24782371520996, "global_step": 477059, "epoch": 5747} {"train_loss": -27.01962661743164, "global_step": 477060, "epoch": 5747} {"train_loss": -27.3682804107666, "global_step": 477061, "epoch": 5747} {"train_loss": -27.285818099975586, "global_step": 477062, "epoch": 5747} {"train_loss": -27.124425888061523, "global_step": 477063, "epoch": 5747} {"train_loss": -27.4259090423584, "global_step": 477064, "epoch": 5747} {"train_loss": -26.72421646118164, "global_step": 477065, "epoch": 5747} {"train_loss": -27.566587448120117, "global_step": 477066, "epoch": 5747} {"train_loss": -26.873075485229492, "global_step": 477067, "epoch": 5747} {"train_loss": -27.175107955932617, "global_step": 477068, "epoch": 5747} {"train_loss": -27.318143844604492, "global_step": 477069, "epoch": 5747} {"train_loss": -27.210575103759766, "global_step": 477070, "epoch": 5747} {"train_loss": -26.971160888671875, "global_step": 477071, "epoch": 5747} {"train_loss": -26.95546531677246, "global_step": 477072, "epoch": 5747} {"train_loss": -27.102203369140625, "global_step": 477073, "epoch": 5747} {"train_loss": -27.658252716064453, "global_step": 477074, "epoch": 5747} {"train_loss": -27.216175079345703, "global_step": 477075, "epoch": 5747} {"train_loss": -27.323532104492188, "global_step": 477076, "epoch": 5747} {"train_loss": -27.355443954467773, "global_step": 477077, "epoch": 5747} {"train_loss": -27.243152618408203, "global_step": 477078, "epoch": 5747} {"train_loss": -27.10633659362793, "global_step": 477079, "epoch": 5747} {"train_loss": -27.554462432861328, "global_step": 477080, "epoch": 5747} {"train_loss": -27.172651290893555, "global_step": 477081, "epoch": 5747} {"train_loss": -27.224369049072266, "global_step": 477082, "epoch": 5747} {"train_loss": -27.09762003335608, "global_step": 477083, "epoch": 5747, "val_loss": 6625547.5} {"train_loss": -26.36427879333496, "global_step": 477084, "epoch": 5748} {"train_loss": -25.483003616333008, "global_step": 477085, "epoch": 5748} {"train_loss": -26.46640396118164, "global_step": 477086, "epoch": 5748} {"train_loss": -26.93487548828125, "global_step": 477087, "epoch": 5748} {"train_loss": -26.273420333862305, "global_step": 477088, "epoch": 5748} {"train_loss": -26.526519775390625, "global_step": 477089, "epoch": 5748} {"train_loss": -26.52492332458496, "global_step": 477090, "epoch": 5748} {"train_loss": -26.445337295532227, "global_step": 477091, "epoch": 5748} {"train_loss": -26.684141159057617, "global_step": 477092, "epoch": 5748} {"train_loss": -26.69160270690918, "global_step": 477093, "epoch": 5748} {"train_loss": -26.9426326751709, "global_step": 477094, "epoch": 5748} {"train_loss": -27.09876823425293, "global_step": 477095, "epoch": 5748} {"train_loss": -26.727746963500977, "global_step": 477096, "epoch": 5748} {"train_loss": -26.86371421813965, "global_step": 477097, "epoch": 5748} {"train_loss": -27.06122398376465, "global_step": 477098, "epoch": 5748} {"train_loss": -26.312702178955078, "global_step": 477099, "epoch": 5748} {"train_loss": -26.927509307861328, "global_step": 477100, "epoch": 5748} {"train_loss": -26.747562408447266, "global_step": 477101, "epoch": 5748} {"train_loss": -26.910511016845703, "global_step": 477102, "epoch": 5748} {"train_loss": -27.137928009033203, "global_step": 477103, "epoch": 5748} {"train_loss": -26.74277114868164, "global_step": 477104, "epoch": 5748} {"train_loss": -27.137683868408203, "global_step": 477105, "epoch": 5748} {"train_loss": -26.907827377319336, "global_step": 477106, "epoch": 5748} {"train_loss": -27.200002670288086, "global_step": 477107, "epoch": 5748} {"train_loss": -27.26002311706543, "global_step": 477108, "epoch": 5748} {"train_loss": -27.0195369720459, "global_step": 477109, "epoch": 5748} {"train_loss": -27.127628326416016, "global_step": 477110, "epoch": 5748} {"train_loss": -27.244647979736328, "global_step": 477111, "epoch": 5748} {"train_loss": -27.110326766967773, "global_step": 477112, "epoch": 5748} {"train_loss": -27.38093376159668, "global_step": 477113, "epoch": 5748} {"train_loss": -27.365270614624023, "global_step": 477114, "epoch": 5748} {"train_loss": -27.231586456298828, "global_step": 477115, "epoch": 5748} {"train_loss": -26.99936866760254, "global_step": 477116, "epoch": 5748} {"train_loss": -27.146087646484375, "global_step": 477117, "epoch": 5748} {"train_loss": -27.173940658569336, "global_step": 477118, "epoch": 5748} {"train_loss": -27.4273681640625, "global_step": 477119, "epoch": 5748} {"train_loss": -27.388608932495117, "global_step": 477120, "epoch": 5748} {"train_loss": -27.448562622070312, "global_step": 477121, "epoch": 5748} {"train_loss": -27.3956241607666, "global_step": 477122, "epoch": 5748} {"train_loss": -27.239871978759766, "global_step": 477123, "epoch": 5748} {"train_loss": -27.337848663330078, "global_step": 477124, "epoch": 5748} {"train_loss": -27.2335262298584, "global_step": 477125, "epoch": 5748} {"train_loss": -27.77029800415039, "global_step": 477126, "epoch": 5748} {"train_loss": -27.26875877380371, "global_step": 477127, "epoch": 5748} {"train_loss": -27.3868350982666, "global_step": 477128, "epoch": 5748} {"train_loss": -26.9882869720459, "global_step": 477129, "epoch": 5748} {"train_loss": -27.287933349609375, "global_step": 477130, "epoch": 5748} {"train_loss": -27.7154541015625, "global_step": 477131, "epoch": 5748} {"train_loss": -27.280139923095703, "global_step": 477132, "epoch": 5748} {"train_loss": -27.246305465698242, "global_step": 477133, "epoch": 5748} {"train_loss": -27.244348526000977, "global_step": 477134, "epoch": 5748} {"train_loss": -27.00669288635254, "global_step": 477135, "epoch": 5748} {"train_loss": -27.362268447875977, "global_step": 477136, "epoch": 5748} {"train_loss": -27.308094024658203, "global_step": 477137, "epoch": 5748} {"train_loss": -27.144739151000977, "global_step": 477138, "epoch": 5748} {"train_loss": -27.294042587280273, "global_step": 477139, "epoch": 5748} {"train_loss": -27.18586540222168, "global_step": 477140, "epoch": 5748} {"train_loss": -27.449462890625, "global_step": 477141, "epoch": 5748} {"train_loss": -27.036413192749023, "global_step": 477142, "epoch": 5748} {"train_loss": -27.178329467773438, "global_step": 477143, "epoch": 5748} {"train_loss": -27.222578048706055, "global_step": 477144, "epoch": 5748} {"train_loss": -26.536340713500977, "global_step": 477145, "epoch": 5748} {"train_loss": -26.719648361206055, "global_step": 477146, "epoch": 5748} {"train_loss": -26.915924072265625, "global_step": 477147, "epoch": 5748} {"train_loss": -26.970624923706055, "global_step": 477148, "epoch": 5748} {"train_loss": -26.95769691467285, "global_step": 477149, "epoch": 5748} {"train_loss": -27.29420280456543, "global_step": 477150, "epoch": 5748} {"train_loss": -27.062397003173828, "global_step": 477151, "epoch": 5748} {"train_loss": -26.942554473876953, "global_step": 477152, "epoch": 5748} {"train_loss": -26.957202911376953, "global_step": 477153, "epoch": 5748} {"train_loss": -27.144855499267578, "global_step": 477154, "epoch": 5748} {"train_loss": -27.38739013671875, "global_step": 477155, "epoch": 5748} {"train_loss": -27.262561798095703, "global_step": 477156, "epoch": 5748} {"train_loss": -26.88209342956543, "global_step": 477157, "epoch": 5748} {"train_loss": -27.0023193359375, "global_step": 477158, "epoch": 5748} {"train_loss": -27.08863639831543, "global_step": 477159, "epoch": 5748} {"train_loss": -27.008121490478516, "global_step": 477160, "epoch": 5748} {"train_loss": -26.85420036315918, "global_step": 477161, "epoch": 5748} {"train_loss": -27.280176162719727, "global_step": 477162, "epoch": 5748} {"train_loss": -27.038990020751953, "global_step": 477163, "epoch": 5748} {"train_loss": -27.38263511657715, "global_step": 477164, "epoch": 5748} {"train_loss": -27.189136505126953, "global_step": 477165, "epoch": 5748} {"train_loss": -27.043528752154614, "global_step": 477166, "epoch": 5748, "val_loss": 6608459.0} {"train_loss": -26.9681339263916, "global_step": 477167, "epoch": 5749} {"train_loss": -26.835474014282227, "global_step": 477168, "epoch": 5749} {"train_loss": -26.71930503845215, "global_step": 477169, "epoch": 5749} {"train_loss": -26.814102172851562, "global_step": 477170, "epoch": 5749} {"train_loss": -26.78437614440918, "global_step": 477171, "epoch": 5749} {"train_loss": -26.730375289916992, "global_step": 477172, "epoch": 5749} {"train_loss": -26.970746994018555, "global_step": 477173, "epoch": 5749} {"train_loss": -26.997909545898438, "global_step": 477174, "epoch": 5749} {"train_loss": -26.826147079467773, "global_step": 477175, "epoch": 5749} {"train_loss": -27.02125358581543, "global_step": 477176, "epoch": 5749} {"train_loss": -27.1563720703125, "global_step": 477177, "epoch": 5749} {"train_loss": -27.233814239501953, "global_step": 477178, "epoch": 5749} {"train_loss": -26.924610137939453, "global_step": 477179, "epoch": 5749} {"train_loss": -27.09698486328125, "global_step": 477180, "epoch": 5749} {"train_loss": -26.81520652770996, "global_step": 477181, "epoch": 5749} {"train_loss": -27.421356201171875, "global_step": 477182, "epoch": 5749} {"train_loss": -27.285558700561523, "global_step": 477183, "epoch": 5749} {"train_loss": -27.003253936767578, "global_step": 477184, "epoch": 5749} {"train_loss": -27.223737716674805, "global_step": 477185, "epoch": 5749} {"train_loss": -27.3775691986084, "global_step": 477186, "epoch": 5749} {"train_loss": -27.497222900390625, "global_step": 477187, "epoch": 5749} {"train_loss": -27.35320472717285, "global_step": 477188, "epoch": 5749} {"train_loss": -27.23666763305664, "global_step": 477189, "epoch": 5749} {"train_loss": -27.259750366210938, "global_step": 477190, "epoch": 5749} {"train_loss": -27.247243881225586, "global_step": 477191, "epoch": 5749} {"train_loss": -27.305150985717773, "global_step": 477192, "epoch": 5749} {"train_loss": -27.652484893798828, "global_step": 477193, "epoch": 5749} {"train_loss": -27.05494499206543, "global_step": 477194, "epoch": 5749} {"train_loss": -27.006444931030273, "global_step": 477195, "epoch": 5749} {"train_loss": -27.57343101501465, "global_step": 477196, "epoch": 5749} {"train_loss": -27.159408569335938, "global_step": 477197, "epoch": 5749} {"train_loss": -27.021509170532227, "global_step": 477198, "epoch": 5749} {"train_loss": -27.262720108032227, "global_step": 477199, "epoch": 5749} {"train_loss": -27.67494010925293, "global_step": 477200, "epoch": 5749} {"train_loss": -27.17242431640625, "global_step": 477201, "epoch": 5749} {"train_loss": -26.948205947875977, "global_step": 477202, "epoch": 5749} {"train_loss": -27.03327751159668, "global_step": 477203, "epoch": 5749} {"train_loss": -27.272109985351562, "global_step": 477204, "epoch": 5749} {"train_loss": -27.5344295501709, "global_step": 477205, "epoch": 5749} {"train_loss": -27.200836181640625, "global_step": 477206, "epoch": 5749} {"train_loss": -27.005146026611328, "global_step": 477207, "epoch": 5749} {"train_loss": -27.15247917175293, "global_step": 477208, "epoch": 5749} {"train_loss": -27.22085952758789, "global_step": 477209, "epoch": 5749} {"train_loss": -27.393945693969727, "global_step": 477210, "epoch": 5749} {"train_loss": -27.265338897705078, "global_step": 477211, "epoch": 5749} {"train_loss": -27.094327926635742, "global_step": 477212, "epoch": 5749} {"train_loss": -26.99335289001465, "global_step": 477213, "epoch": 5749} {"train_loss": -27.255329132080078, "global_step": 477214, "epoch": 5749} {"train_loss": -27.1740779876709, "global_step": 477215, "epoch": 5749} {"train_loss": -27.438337326049805, "global_step": 477216, "epoch": 5749} {"train_loss": -27.24118423461914, "global_step": 477217, "epoch": 5749} {"train_loss": -26.865503311157227, "global_step": 477218, "epoch": 5749} {"train_loss": -27.54071044921875, "global_step": 477219, "epoch": 5749} {"train_loss": -27.11713981628418, "global_step": 477220, "epoch": 5749} {"train_loss": -27.145421981811523, "global_step": 477221, "epoch": 5749} {"train_loss": -27.309295654296875, "global_step": 477222, "epoch": 5749} {"train_loss": -27.63111686706543, "global_step": 477223, "epoch": 5749} {"train_loss": -26.91364097595215, "global_step": 477224, "epoch": 5749} {"train_loss": -27.508136749267578, "global_step": 477225, "epoch": 5749} {"train_loss": -27.444950103759766, "global_step": 477226, "epoch": 5749} {"train_loss": -27.294214248657227, "global_step": 477227, "epoch": 5749} {"train_loss": -27.270299911499023, "global_step": 477228, "epoch": 5749} {"train_loss": -26.96368980407715, "global_step": 477229, "epoch": 5749} {"train_loss": -26.884572982788086, "global_step": 477230, "epoch": 5749} {"train_loss": -27.0743465423584, "global_step": 477231, "epoch": 5749} {"train_loss": -27.34992027282715, "global_step": 477232, "epoch": 5749} {"train_loss": -27.075063705444336, "global_step": 477233, "epoch": 5749} {"train_loss": -26.996713638305664, "global_step": 477234, "epoch": 5749} {"train_loss": -27.077224731445312, "global_step": 477235, "epoch": 5749} {"train_loss": -27.298954010009766, "global_step": 477236, "epoch": 5749} {"train_loss": -26.81607437133789, "global_step": 477237, "epoch": 5749} {"train_loss": -26.984785079956055, "global_step": 477238, "epoch": 5749} {"train_loss": -26.74293327331543, "global_step": 477239, "epoch": 5749} {"train_loss": -26.969654083251953, "global_step": 477240, "epoch": 5749} {"train_loss": -26.878726959228516, "global_step": 477241, "epoch": 5749} {"train_loss": -27.001943588256836, "global_step": 477242, "epoch": 5749} {"train_loss": -27.412221908569336, "global_step": 477243, "epoch": 5749} {"train_loss": -27.275562286376953, "global_step": 477244, "epoch": 5749} {"train_loss": -27.04736328125, "global_step": 477245, "epoch": 5749} {"train_loss": -27.1279239654541, "global_step": 477246, "epoch": 5749} {"train_loss": -27.086339950561523, "global_step": 477247, "epoch": 5749} {"train_loss": -27.143787384033203, "global_step": 477248, "epoch": 5749} {"train_loss": -27.14045329266284, "global_step": 477249, "epoch": 5749, "val_loss": 6602182.0} {"train_loss": -27.029813766479492, "global_step": 477250, "epoch": 5750} {"train_loss": -26.702075958251953, "global_step": 477251, "epoch": 5750} {"train_loss": -26.98762321472168, "global_step": 477252, "epoch": 5750} {"train_loss": -26.417041778564453, "global_step": 477253, "epoch": 5750} {"train_loss": -26.73358154296875, "global_step": 477254, "epoch": 5750} {"train_loss": -26.693410873413086, "global_step": 477255, "epoch": 5750} {"train_loss": -27.22509765625, "global_step": 477256, "epoch": 5750} {"train_loss": -26.968358993530273, "global_step": 477257, "epoch": 5750} {"train_loss": -27.05014419555664, "global_step": 477258, "epoch": 5750} {"train_loss": -27.04066276550293, "global_step": 477259, "epoch": 5750} {"train_loss": -27.01191520690918, "global_step": 477260, "epoch": 5750} {"train_loss": -26.811975479125977, "global_step": 477261, "epoch": 5750} {"train_loss": -27.033151626586914, "global_step": 477262, "epoch": 5750} {"train_loss": -26.964996337890625, "global_step": 477263, "epoch": 5750} {"train_loss": -26.87137794494629, "global_step": 477264, "epoch": 5750} {"train_loss": -27.39243507385254, "global_step": 477265, "epoch": 5750} {"train_loss": -27.00025749206543, "global_step": 477266, "epoch": 5750} {"train_loss": -27.107868194580078, "global_step": 477267, "epoch": 5750} {"train_loss": -27.03374671936035, "global_step": 477268, "epoch": 5750} {"train_loss": -26.976150512695312, "global_step": 477269, "epoch": 5750} {"train_loss": -27.075103759765625, "global_step": 477270, "epoch": 5750} {"train_loss": -27.126745223999023, "global_step": 477271, "epoch": 5750} {"train_loss": -27.304773330688477, "global_step": 477272, "epoch": 5750} {"train_loss": -26.84860610961914, "global_step": 477273, "epoch": 5750} {"train_loss": -27.21956443786621, "global_step": 477274, "epoch": 5750} {"train_loss": -27.377042770385742, "global_step": 477275, "epoch": 5750} {"train_loss": -27.418142318725586, "global_step": 477276, "epoch": 5750} {"train_loss": -26.97071647644043, "global_step": 477277, "epoch": 5750} {"train_loss": -26.907941818237305, "global_step": 477278, "epoch": 5750} {"train_loss": -27.49627113342285, "global_step": 477279, "epoch": 5750} {"train_loss": -27.013809204101562, "global_step": 477280, "epoch": 5750} {"train_loss": -27.47653579711914, "global_step": 477281, "epoch": 5750} {"train_loss": -27.479093551635742, "global_step": 477282, "epoch": 5750} {"train_loss": -27.27277946472168, "global_step": 477283, "epoch": 5750} {"train_loss": -27.33551025390625, "global_step": 477284, "epoch": 5750} {"train_loss": -27.54715919494629, "global_step": 477285, "epoch": 5750} {"train_loss": -27.737689971923828, "global_step": 477286, "epoch": 5750} {"train_loss": -27.342544555664062, "global_step": 477287, "epoch": 5750} {"train_loss": -27.15809440612793, "global_step": 477288, "epoch": 5750} {"train_loss": -27.050561904907227, "global_step": 477289, "epoch": 5750} {"train_loss": -27.4984130859375, "global_step": 477290, "epoch": 5750} {"train_loss": -27.016759872436523, "global_step": 477291, "epoch": 5750} {"train_loss": -27.248977661132812, "global_step": 477292, "epoch": 5750} {"train_loss": -27.385181427001953, "global_step": 477293, "epoch": 5750} {"train_loss": -27.33662223815918, "global_step": 477294, "epoch": 5750} {"train_loss": -27.606382369995117, "global_step": 477295, "epoch": 5750} {"train_loss": -27.1214656829834, "global_step": 477296, "epoch": 5750} {"train_loss": -27.4732666015625, "global_step": 477297, "epoch": 5750} {"train_loss": -27.1407527923584, "global_step": 477298, "epoch": 5750} {"train_loss": -27.675506591796875, "global_step": 477299, "epoch": 5750} {"train_loss": -27.694751739501953, "global_step": 477300, "epoch": 5750} {"train_loss": -27.15806007385254, "global_step": 477301, "epoch": 5750} {"train_loss": -27.153289794921875, "global_step": 477302, "epoch": 5750} {"train_loss": -27.427108764648438, "global_step": 477303, "epoch": 5750} {"train_loss": -27.520248413085938, "global_step": 477304, "epoch": 5750} {"train_loss": -27.647476196289062, "global_step": 477305, "epoch": 5750} {"train_loss": -27.170495986938477, "global_step": 477306, "epoch": 5750} {"train_loss": -26.65779685974121, "global_step": 477307, "epoch": 5750} {"train_loss": -27.0654296875, "global_step": 477308, "epoch": 5750} {"train_loss": -27.106403350830078, "global_step": 477309, "epoch": 5750} {"train_loss": -27.25174331665039, "global_step": 477310, "epoch": 5750} {"train_loss": -26.578723907470703, "global_step": 477311, "epoch": 5750} {"train_loss": -27.121877670288086, "global_step": 477312, "epoch": 5750} {"train_loss": -26.9886531829834, "global_step": 477313, "epoch": 5750} {"train_loss": -27.234601974487305, "global_step": 477314, "epoch": 5750} {"train_loss": -27.558191299438477, "global_step": 477315, "epoch": 5750} {"train_loss": -27.223602294921875, "global_step": 477316, "epoch": 5750} {"train_loss": -27.323034286499023, "global_step": 477317, "epoch": 5750} {"train_loss": -27.144458770751953, "global_step": 477318, "epoch": 5750} {"train_loss": -27.13551902770996, "global_step": 477319, "epoch": 5750} {"train_loss": -27.18817138671875, "global_step": 477320, "epoch": 5750} {"train_loss": -27.16584587097168, "global_step": 477321, "epoch": 5750} {"train_loss": -27.503662109375, "global_step": 477322, "epoch": 5750} {"train_loss": -27.402957916259766, "global_step": 477323, "epoch": 5750} {"train_loss": -27.01951026916504, "global_step": 477324, "epoch": 5750} {"train_loss": -26.93060874938965, "global_step": 477325, "epoch": 5750} {"train_loss": -26.962127685546875, "global_step": 477326, "epoch": 5750} {"train_loss": -27.12666130065918, "global_step": 477327, "epoch": 5750} {"train_loss": -27.06825065612793, "global_step": 477328, "epoch": 5750} {"train_loss": -27.42106056213379, "global_step": 477329, "epoch": 5750} {"train_loss": -26.84305763244629, "global_step": 477330, "epoch": 5750} {"train_loss": -26.8581485748291, "global_step": 477331, "epoch": 5750} {"train_loss": -27.162390191871, "global_step": 477332, "epoch": 5750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6741252.0} {"train_loss": -26.680816650390625, "global_step": 477333, "epoch": 5751} {"train_loss": -26.567529678344727, "global_step": 477334, "epoch": 5751} {"train_loss": -26.7607479095459, "global_step": 477335, "epoch": 5751} {"train_loss": -26.5277042388916, "global_step": 477336, "epoch": 5751} {"train_loss": -26.870336532592773, "global_step": 477337, "epoch": 5751} {"train_loss": -26.905263900756836, "global_step": 477338, "epoch": 5751} {"train_loss": -27.303668975830078, "global_step": 477339, "epoch": 5751} {"train_loss": -26.758087158203125, "global_step": 477340, "epoch": 5751} {"train_loss": -27.058349609375, "global_step": 477341, "epoch": 5751} {"train_loss": -26.5452880859375, "global_step": 477342, "epoch": 5751} {"train_loss": -27.19426918029785, "global_step": 477343, "epoch": 5751} {"train_loss": -26.720502853393555, "global_step": 477344, "epoch": 5751} {"train_loss": -27.31269645690918, "global_step": 477345, "epoch": 5751} {"train_loss": -26.96967124938965, "global_step": 477346, "epoch": 5751} {"train_loss": -26.911224365234375, "global_step": 477347, "epoch": 5751} {"train_loss": -26.5955810546875, "global_step": 477348, "epoch": 5751} {"train_loss": -26.696735382080078, "global_step": 477349, "epoch": 5751} {"train_loss": -27.100479125976562, "global_step": 477350, "epoch": 5751} {"train_loss": -27.255813598632812, "global_step": 477351, "epoch": 5751} {"train_loss": -26.965423583984375, "global_step": 477352, "epoch": 5751} {"train_loss": -27.25537109375, "global_step": 477353, "epoch": 5751} {"train_loss": -27.413171768188477, "global_step": 477354, "epoch": 5751} {"train_loss": -27.238977432250977, "global_step": 477355, "epoch": 5751} {"train_loss": -27.172163009643555, "global_step": 477356, "epoch": 5751} {"train_loss": -27.280359268188477, "global_step": 477357, "epoch": 5751} {"train_loss": -27.12212562561035, "global_step": 477358, "epoch": 5751} {"train_loss": -27.438135147094727, "global_step": 477359, "epoch": 5751} {"train_loss": -27.274274826049805, "global_step": 477360, "epoch": 5751} {"train_loss": -27.208637237548828, "global_step": 477361, "epoch": 5751} {"train_loss": -27.020166397094727, "global_step": 477362, "epoch": 5751} {"train_loss": -27.3424129486084, "global_step": 477363, "epoch": 5751} {"train_loss": -27.47224998474121, "global_step": 477364, "epoch": 5751} {"train_loss": -27.30265235900879, "global_step": 477365, "epoch": 5751} {"train_loss": -27.433429718017578, "global_step": 477366, "epoch": 5751} {"train_loss": -27.222158432006836, "global_step": 477367, "epoch": 5751} {"train_loss": -27.252288818359375, "global_step": 477368, "epoch": 5751} {"train_loss": -27.46657371520996, "global_step": 477369, "epoch": 5751} {"train_loss": -27.46347999572754, "global_step": 477370, "epoch": 5751} {"train_loss": -27.26848793029785, "global_step": 477371, "epoch": 5751} {"train_loss": -27.517541885375977, "global_step": 477372, "epoch": 5751} {"train_loss": -27.486148834228516, "global_step": 477373, "epoch": 5751} {"train_loss": -27.387495040893555, "global_step": 477374, "epoch": 5751} {"train_loss": -27.21034049987793, "global_step": 477375, "epoch": 5751} {"train_loss": -27.2331600189209, "global_step": 477376, "epoch": 5751} {"train_loss": -27.720518112182617, "global_step": 477377, "epoch": 5751} {"train_loss": -27.330663681030273, "global_step": 477378, "epoch": 5751} {"train_loss": -27.328598022460938, "global_step": 477379, "epoch": 5751} {"train_loss": -27.209182739257812, "global_step": 477380, "epoch": 5751} {"train_loss": -26.9285831451416, "global_step": 477381, "epoch": 5751} {"train_loss": -27.553171157836914, "global_step": 477382, "epoch": 5751} {"train_loss": -27.325855255126953, "global_step": 477383, "epoch": 5751} {"train_loss": -27.2062931060791, "global_step": 477384, "epoch": 5751} {"train_loss": -27.380847930908203, "global_step": 477385, "epoch": 5751} {"train_loss": -27.02076530456543, "global_step": 477386, "epoch": 5751} {"train_loss": -27.53165626525879, "global_step": 477387, "epoch": 5751} {"train_loss": -27.09553337097168, "global_step": 477388, "epoch": 5751} {"train_loss": -27.229581832885742, "global_step": 477389, "epoch": 5751} {"train_loss": -27.26129150390625, "global_step": 477390, "epoch": 5751} {"train_loss": -27.527109146118164, "global_step": 477391, "epoch": 5751} {"train_loss": -27.3624324798584, "global_step": 477392, "epoch": 5751} {"train_loss": -27.503042221069336, "global_step": 477393, "epoch": 5751} {"train_loss": -27.342823028564453, "global_step": 477394, "epoch": 5751} {"train_loss": -27.183837890625, "global_step": 477395, "epoch": 5751} {"train_loss": -27.04591178894043, "global_step": 477396, "epoch": 5751} {"train_loss": -27.03077507019043, "global_step": 477397, "epoch": 5751} {"train_loss": -26.30707359313965, "global_step": 477398, "epoch": 5751} {"train_loss": -25.58107566833496, "global_step": 477399, "epoch": 5751} {"train_loss": -26.30330467224121, "global_step": 477400, "epoch": 5751} {"train_loss": -27.054868698120117, "global_step": 477401, "epoch": 5751} {"train_loss": -26.590986251831055, "global_step": 477402, "epoch": 5751} {"train_loss": -26.687442779541016, "global_step": 477403, "epoch": 5751} {"train_loss": -26.470243453979492, "global_step": 477404, "epoch": 5751} {"train_loss": -26.15168571472168, "global_step": 477405, "epoch": 5751} {"train_loss": -27.092422485351562, "global_step": 477406, "epoch": 5751} {"train_loss": -26.46589469909668, "global_step": 477407, "epoch": 5751} {"train_loss": -26.481565475463867, "global_step": 477408, "epoch": 5751} {"train_loss": -27.23248863220215, "global_step": 477409, "epoch": 5751} {"train_loss": -26.88422966003418, "global_step": 477410, "epoch": 5751} {"train_loss": -26.76405143737793, "global_step": 477411, "epoch": 5751} {"train_loss": -26.877416610717773, "global_step": 477412, "epoch": 5751} {"train_loss": -27.500625610351562, "global_step": 477413, "epoch": 5751} {"train_loss": -27.145734786987305, "global_step": 477414, "epoch": 5751} {"train_loss": -27.05762727576566, "global_step": 477415, "epoch": 5751, "val_loss": 6704662.0} {"train_loss": -27.228912353515625, "global_step": 477416, "epoch": 5752} {"train_loss": -26.734586715698242, "global_step": 477417, "epoch": 5752} {"train_loss": -26.91753578186035, "global_step": 477418, "epoch": 5752} {"train_loss": -27.072284698486328, "global_step": 477419, "epoch": 5752} {"train_loss": -26.87501335144043, "global_step": 477420, "epoch": 5752} {"train_loss": -27.32855796813965, "global_step": 477421, "epoch": 5752} {"train_loss": -27.15683937072754, "global_step": 477422, "epoch": 5752} {"train_loss": -27.073522567749023, "global_step": 477423, "epoch": 5752} {"train_loss": -26.85554313659668, "global_step": 477424, "epoch": 5752} {"train_loss": -27.1419677734375, "global_step": 477425, "epoch": 5752} {"train_loss": -26.798297882080078, "global_step": 477426, "epoch": 5752} {"train_loss": -26.67934226989746, "global_step": 477427, "epoch": 5752} {"train_loss": -26.975706100463867, "global_step": 477428, "epoch": 5752} {"train_loss": -26.74365234375, "global_step": 477429, "epoch": 5752} {"train_loss": -27.39422607421875, "global_step": 477430, "epoch": 5752} {"train_loss": -27.442663192749023, "global_step": 477431, "epoch": 5752} {"train_loss": -26.95303726196289, "global_step": 477432, "epoch": 5752} {"train_loss": -27.227100372314453, "global_step": 477433, "epoch": 5752} {"train_loss": -27.06277847290039, "global_step": 477434, "epoch": 5752} {"train_loss": -27.401599884033203, "global_step": 477435, "epoch": 5752} {"train_loss": -27.1892032623291, "global_step": 477436, "epoch": 5752} {"train_loss": -26.710920333862305, "global_step": 477437, "epoch": 5752} {"train_loss": -27.363101959228516, "global_step": 477438, "epoch": 5752} {"train_loss": -26.9654541015625, "global_step": 477439, "epoch": 5752} {"train_loss": -27.374195098876953, "global_step": 477440, "epoch": 5752} {"train_loss": -26.972198486328125, "global_step": 477441, "epoch": 5752} {"train_loss": -27.219324111938477, "global_step": 477442, "epoch": 5752} {"train_loss": -27.175018310546875, "global_step": 477443, "epoch": 5752} {"train_loss": -27.300369262695312, "global_step": 477444, "epoch": 5752} {"train_loss": -26.99216651916504, "global_step": 477445, "epoch": 5752} {"train_loss": -27.480106353759766, "global_step": 477446, "epoch": 5752} {"train_loss": -27.157983779907227, "global_step": 477447, "epoch": 5752} {"train_loss": -27.62800407409668, "global_step": 477448, "epoch": 5752} {"train_loss": -27.308380126953125, "global_step": 477449, "epoch": 5752} {"train_loss": -27.639142990112305, "global_step": 477450, "epoch": 5752} {"train_loss": -27.542835235595703, "global_step": 477451, "epoch": 5752} {"train_loss": -27.538427352905273, "global_step": 477452, "epoch": 5752} {"train_loss": -27.270505905151367, "global_step": 477453, "epoch": 5752} {"train_loss": -27.629348754882812, "global_step": 477454, "epoch": 5752} {"train_loss": -27.355213165283203, "global_step": 477455, "epoch": 5752} {"train_loss": -27.253767013549805, "global_step": 477456, "epoch": 5752} {"train_loss": -27.208967208862305, "global_step": 477457, "epoch": 5752} {"train_loss": -27.52263832092285, "global_step": 477458, "epoch": 5752} {"train_loss": -27.12592124938965, "global_step": 477459, "epoch": 5752} {"train_loss": -27.545515060424805, "global_step": 477460, "epoch": 5752} {"train_loss": -27.46514320373535, "global_step": 477461, "epoch": 5752} {"train_loss": -27.46039390563965, "global_step": 477462, "epoch": 5752} {"train_loss": -27.34433937072754, "global_step": 477463, "epoch": 5752} {"train_loss": -27.53093910217285, "global_step": 477464, "epoch": 5752} {"train_loss": -27.0726375579834, "global_step": 477465, "epoch": 5752} {"train_loss": -27.2125186920166, "global_step": 477466, "epoch": 5752} {"train_loss": -27.03938102722168, "global_step": 477467, "epoch": 5752} {"train_loss": -26.242752075195312, "global_step": 477468, "epoch": 5752} {"train_loss": -27.242151260375977, "global_step": 477469, "epoch": 5752} {"train_loss": -26.627344131469727, "global_step": 477470, "epoch": 5752} {"train_loss": -27.323537826538086, "global_step": 477471, "epoch": 5752} {"train_loss": -27.195514678955078, "global_step": 477472, "epoch": 5752} {"train_loss": -26.611587524414062, "global_step": 477473, "epoch": 5752} {"train_loss": -27.13360023498535, "global_step": 477474, "epoch": 5752} {"train_loss": -26.930959701538086, "global_step": 477475, "epoch": 5752} {"train_loss": -27.24649429321289, "global_step": 477476, "epoch": 5752} {"train_loss": -26.78067398071289, "global_step": 477477, "epoch": 5752} {"train_loss": -27.2997989654541, "global_step": 477478, "epoch": 5752} {"train_loss": -27.220111846923828, "global_step": 477479, "epoch": 5752} {"train_loss": -27.41278076171875, "global_step": 477480, "epoch": 5752} {"train_loss": -27.044092178344727, "global_step": 477481, "epoch": 5752} {"train_loss": -26.911237716674805, "global_step": 477482, "epoch": 5752} {"train_loss": -27.1554012298584, "global_step": 477483, "epoch": 5752} {"train_loss": -27.020044326782227, "global_step": 477484, "epoch": 5752} {"train_loss": -26.899494171142578, "global_step": 477485, "epoch": 5752} {"train_loss": -27.36530113220215, "global_step": 477486, "epoch": 5752} {"train_loss": -26.808380126953125, "global_step": 477487, "epoch": 5752} {"train_loss": -26.9084529876709, "global_step": 477488, "epoch": 5752} {"train_loss": -27.22419548034668, "global_step": 477489, "epoch": 5752} {"train_loss": -26.787988662719727, "global_step": 477490, "epoch": 5752} {"train_loss": -27.0987606048584, "global_step": 477491, "epoch": 5752} {"train_loss": -27.1772518157959, "global_step": 477492, "epoch": 5752} {"train_loss": -27.027515411376953, "global_step": 477493, "epoch": 5752} {"train_loss": -27.245405197143555, "global_step": 477494, "epoch": 5752} {"train_loss": -27.081418991088867, "global_step": 477495, "epoch": 5752} {"train_loss": -27.115650177001953, "global_step": 477496, "epoch": 5752} {"train_loss": -26.860021591186523, "global_step": 477497, "epoch": 5752} {"train_loss": -27.138258256107928, "global_step": 477498, "epoch": 5752, "val_loss": 6650734.0} {"train_loss": -26.934858322143555, "global_step": 477499, "epoch": 5753} {"train_loss": -26.5480899810791, "global_step": 477500, "epoch": 5753} {"train_loss": -26.71274757385254, "global_step": 477501, "epoch": 5753} {"train_loss": -26.622623443603516, "global_step": 477502, "epoch": 5753} {"train_loss": -26.94952964782715, "global_step": 477503, "epoch": 5753} {"train_loss": -26.27491569519043, "global_step": 477504, "epoch": 5753} {"train_loss": -26.845701217651367, "global_step": 477505, "epoch": 5753} {"train_loss": -27.076480865478516, "global_step": 477506, "epoch": 5753} {"train_loss": -26.477359771728516, "global_step": 477507, "epoch": 5753} {"train_loss": -27.123865127563477, "global_step": 477508, "epoch": 5753} {"train_loss": -27.078588485717773, "global_step": 477509, "epoch": 5753} {"train_loss": -26.902738571166992, "global_step": 477510, "epoch": 5753} {"train_loss": -26.697961807250977, "global_step": 477511, "epoch": 5753} {"train_loss": -26.662647247314453, "global_step": 477512, "epoch": 5753} {"train_loss": -26.786529541015625, "global_step": 477513, "epoch": 5753} {"train_loss": -26.368228912353516, "global_step": 477514, "epoch": 5753} {"train_loss": -26.970718383789062, "global_step": 477515, "epoch": 5753} {"train_loss": -26.72867202758789, "global_step": 477516, "epoch": 5753} {"train_loss": -27.203144073486328, "global_step": 477517, "epoch": 5753} {"train_loss": -26.964691162109375, "global_step": 477518, "epoch": 5753} {"train_loss": -26.727209091186523, "global_step": 477519, "epoch": 5753} {"train_loss": -26.609130859375, "global_step": 477520, "epoch": 5753} {"train_loss": -27.15203285217285, "global_step": 477521, "epoch": 5753} {"train_loss": -27.200397491455078, "global_step": 477522, "epoch": 5753} {"train_loss": -27.218027114868164, "global_step": 477523, "epoch": 5753} {"train_loss": -27.301916122436523, "global_step": 477524, "epoch": 5753} {"train_loss": -26.940353393554688, "global_step": 477525, "epoch": 5753} {"train_loss": -27.293684005737305, "global_step": 477526, "epoch": 5753} {"train_loss": -27.13032341003418, "global_step": 477527, "epoch": 5753} {"train_loss": -27.537830352783203, "global_step": 477528, "epoch": 5753} {"train_loss": -27.087751388549805, "global_step": 477529, "epoch": 5753} {"train_loss": -27.210163116455078, "global_step": 477530, "epoch": 5753} {"train_loss": -27.446258544921875, "global_step": 477531, "epoch": 5753} {"train_loss": -27.126636505126953, "global_step": 477532, "epoch": 5753} {"train_loss": -27.18787956237793, "global_step": 477533, "epoch": 5753} {"train_loss": -27.08588981628418, "global_step": 477534, "epoch": 5753} {"train_loss": -27.40061378479004, "global_step": 477535, "epoch": 5753} {"train_loss": -27.481143951416016, "global_step": 477536, "epoch": 5753} {"train_loss": -27.665802001953125, "global_step": 477537, "epoch": 5753} {"train_loss": -27.576353073120117, "global_step": 477538, "epoch": 5753} {"train_loss": -27.318708419799805, "global_step": 477539, "epoch": 5753} {"train_loss": -27.2714900970459, "global_step": 477540, "epoch": 5753} {"train_loss": -27.522016525268555, "global_step": 477541, "epoch": 5753} {"train_loss": -27.706762313842773, "global_step": 477542, "epoch": 5753} {"train_loss": -27.48308753967285, "global_step": 477543, "epoch": 5753} {"train_loss": -27.24542808532715, "global_step": 477544, "epoch": 5753} {"train_loss": -26.807886123657227, "global_step": 477545, "epoch": 5753} {"train_loss": -27.578786849975586, "global_step": 477546, "epoch": 5753} {"train_loss": -27.300500869750977, "global_step": 477547, "epoch": 5753} {"train_loss": -27.420270919799805, "global_step": 477548, "epoch": 5753} {"train_loss": -26.766332626342773, "global_step": 477549, "epoch": 5753} {"train_loss": -26.4810733795166, "global_step": 477550, "epoch": 5753} {"train_loss": -26.713062286376953, "global_step": 477551, "epoch": 5753} {"train_loss": -27.02118492126465, "global_step": 477552, "epoch": 5753} {"train_loss": -27.2469482421875, "global_step": 477553, "epoch": 5753} {"train_loss": -26.671857833862305, "global_step": 477554, "epoch": 5753} {"train_loss": -27.38349723815918, "global_step": 477555, "epoch": 5753} {"train_loss": -26.872663497924805, "global_step": 477556, "epoch": 5753} {"train_loss": -27.1881103515625, "global_step": 477557, "epoch": 5753} {"train_loss": -27.178747177124023, "global_step": 477558, "epoch": 5753} {"train_loss": -27.046661376953125, "global_step": 477559, "epoch": 5753} {"train_loss": -26.715505599975586, "global_step": 477560, "epoch": 5753} {"train_loss": -27.107275009155273, "global_step": 477561, "epoch": 5753} {"train_loss": -26.920949935913086, "global_step": 477562, "epoch": 5753} {"train_loss": -26.923410415649414, "global_step": 477563, "epoch": 5753} {"train_loss": -27.3507022857666, "global_step": 477564, "epoch": 5753} {"train_loss": -27.026382446289062, "global_step": 477565, "epoch": 5753} {"train_loss": -27.11749839782715, "global_step": 477566, "epoch": 5753} {"train_loss": -26.788461685180664, "global_step": 477567, "epoch": 5753} {"train_loss": -27.255178451538086, "global_step": 477568, "epoch": 5753} {"train_loss": -27.03826332092285, "global_step": 477569, "epoch": 5753} {"train_loss": -27.483356475830078, "global_step": 477570, "epoch": 5753} {"train_loss": -27.043487548828125, "global_step": 477571, "epoch": 5753} {"train_loss": -27.135974884033203, "global_step": 477572, "epoch": 5753} {"train_loss": -26.915637969970703, "global_step": 477573, "epoch": 5753} {"train_loss": -27.287322998046875, "global_step": 477574, "epoch": 5753} {"train_loss": -26.933340072631836, "global_step": 477575, "epoch": 5753} {"train_loss": -27.181503295898438, "global_step": 477576, "epoch": 5753} {"train_loss": -26.751020431518555, "global_step": 477577, "epoch": 5753} {"train_loss": -27.301156997680664, "global_step": 477578, "epoch": 5753} {"train_loss": -26.926862716674805, "global_step": 477579, "epoch": 5753} {"train_loss": -27.13055992126465, "global_step": 477580, "epoch": 5753} {"train_loss": -27.060561352465527, "global_step": 477581, "epoch": 5753, "val_loss": 6639906.0} {"train_loss": -26.629180908203125, "global_step": 477582, "epoch": 5754} {"train_loss": -26.257238388061523, "global_step": 477583, "epoch": 5754} {"train_loss": -26.60444450378418, "global_step": 477584, "epoch": 5754} {"train_loss": -27.096948623657227, "global_step": 477585, "epoch": 5754} {"train_loss": -26.691818237304688, "global_step": 477586, "epoch": 5754} {"train_loss": -26.27874755859375, "global_step": 477587, "epoch": 5754} {"train_loss": -26.56781005859375, "global_step": 477588, "epoch": 5754} {"train_loss": -26.768842697143555, "global_step": 477589, "epoch": 5754} {"train_loss": -26.694538116455078, "global_step": 477590, "epoch": 5754} {"train_loss": -26.725339889526367, "global_step": 477591, "epoch": 5754} {"train_loss": -26.785253524780273, "global_step": 477592, "epoch": 5754} {"train_loss": -26.34624671936035, "global_step": 477593, "epoch": 5754} {"train_loss": -26.688007354736328, "global_step": 477594, "epoch": 5754} {"train_loss": -26.8803653717041, "global_step": 477595, "epoch": 5754} {"train_loss": -27.01808738708496, "global_step": 477596, "epoch": 5754} {"train_loss": -26.679428100585938, "global_step": 477597, "epoch": 5754} {"train_loss": -26.90334129333496, "global_step": 477598, "epoch": 5754} {"train_loss": -26.3240966796875, "global_step": 477599, "epoch": 5754} {"train_loss": -26.892181396484375, "global_step": 477600, "epoch": 5754} {"train_loss": -27.171777725219727, "global_step": 477601, "epoch": 5754} {"train_loss": -27.044458389282227, "global_step": 477602, "epoch": 5754} {"train_loss": -27.367029190063477, "global_step": 477603, "epoch": 5754} {"train_loss": -27.010669708251953, "global_step": 477604, "epoch": 5754} {"train_loss": -27.018041610717773, "global_step": 477605, "epoch": 5754} {"train_loss": -27.25421714782715, "global_step": 477606, "epoch": 5754} {"train_loss": -26.951025009155273, "global_step": 477607, "epoch": 5754} {"train_loss": -27.25282096862793, "global_step": 477608, "epoch": 5754} {"train_loss": -27.031702041625977, "global_step": 477609, "epoch": 5754} {"train_loss": -27.478246688842773, "global_step": 477610, "epoch": 5754} {"train_loss": -27.617691040039062, "global_step": 477611, "epoch": 5754} {"train_loss": -27.180740356445312, "global_step": 477612, "epoch": 5754} {"train_loss": -26.936939239501953, "global_step": 477613, "epoch": 5754} {"train_loss": -27.17010498046875, "global_step": 477614, "epoch": 5754} {"train_loss": -27.0456485748291, "global_step": 477615, "epoch": 5754} {"train_loss": -27.327234268188477, "global_step": 477616, "epoch": 5754} {"train_loss": -27.10822105407715, "global_step": 477617, "epoch": 5754} {"train_loss": -27.227542877197266, "global_step": 477618, "epoch": 5754} {"train_loss": -27.36231803894043, "global_step": 477619, "epoch": 5754} {"train_loss": -27.36277198791504, "global_step": 477620, "epoch": 5754} {"train_loss": -26.843097686767578, "global_step": 477621, "epoch": 5754} {"train_loss": -27.251733779907227, "global_step": 477622, "epoch": 5754} {"train_loss": -27.30254554748535, "global_step": 477623, "epoch": 5754} {"train_loss": -27.224960327148438, "global_step": 477624, "epoch": 5754} {"train_loss": -26.930715560913086, "global_step": 477625, "epoch": 5754} {"train_loss": -27.547210693359375, "global_step": 477626, "epoch": 5754} {"train_loss": -26.9580135345459, "global_step": 477627, "epoch": 5754} {"train_loss": -27.085508346557617, "global_step": 477628, "epoch": 5754} {"train_loss": -27.23703384399414, "global_step": 477629, "epoch": 5754} {"train_loss": -27.55982780456543, "global_step": 477630, "epoch": 5754} {"train_loss": -27.28252601623535, "global_step": 477631, "epoch": 5754} {"train_loss": -27.753721237182617, "global_step": 477632, "epoch": 5754} {"train_loss": -27.5965633392334, "global_step": 477633, "epoch": 5754} {"train_loss": -27.432682037353516, "global_step": 477634, "epoch": 5754} {"train_loss": -27.792648315429688, "global_step": 477635, "epoch": 5754} {"train_loss": -27.43023109436035, "global_step": 477636, "epoch": 5754} {"train_loss": -27.37814712524414, "global_step": 477637, "epoch": 5754} {"train_loss": -27.48158073425293, "global_step": 477638, "epoch": 5754} {"train_loss": -27.133895874023438, "global_step": 477639, "epoch": 5754} {"train_loss": -27.203506469726562, "global_step": 477640, "epoch": 5754} {"train_loss": -27.18482780456543, "global_step": 477641, "epoch": 5754} {"train_loss": -27.532865524291992, "global_step": 477642, "epoch": 5754} {"train_loss": -27.4702091217041, "global_step": 477643, "epoch": 5754} {"train_loss": -27.093297958374023, "global_step": 477644, "epoch": 5754} {"train_loss": -26.996240615844727, "global_step": 477645, "epoch": 5754} {"train_loss": -27.3107967376709, "global_step": 477646, "epoch": 5754} {"train_loss": -27.275436401367188, "global_step": 477647, "epoch": 5754} {"train_loss": -27.012420654296875, "global_step": 477648, "epoch": 5754} {"train_loss": -27.352828979492188, "global_step": 477649, "epoch": 5754} {"train_loss": -27.520339965820312, "global_step": 477650, "epoch": 5754} {"train_loss": -27.358539581298828, "global_step": 477651, "epoch": 5754} {"train_loss": -27.56787109375, "global_step": 477652, "epoch": 5754} {"train_loss": -27.337980270385742, "global_step": 477653, "epoch": 5754} {"train_loss": -27.203901290893555, "global_step": 477654, "epoch": 5754} {"train_loss": -27.5750732421875, "global_step": 477655, "epoch": 5754} {"train_loss": -27.16607093811035, "global_step": 477656, "epoch": 5754} {"train_loss": -27.5175838470459, "global_step": 477657, "epoch": 5754} {"train_loss": -26.80832290649414, "global_step": 477658, "epoch": 5754} {"train_loss": -27.186847686767578, "global_step": 477659, "epoch": 5754} {"train_loss": -27.436574935913086, "global_step": 477660, "epoch": 5754} {"train_loss": -26.699420928955078, "global_step": 477661, "epoch": 5754} {"train_loss": -26.832189559936523, "global_step": 477662, "epoch": 5754} {"train_loss": -27.0251522064209, "global_step": 477663, "epoch": 5754} {"train_loss": -27.113217710012414, "global_step": 477664, "epoch": 5754, "val_loss": 6649325.0} {"train_loss": -26.06241226196289, "global_step": 477665, "epoch": 5755} {"train_loss": -24.78754234313965, "global_step": 477666, "epoch": 5755} {"train_loss": -26.356266021728516, "global_step": 477667, "epoch": 5755} {"train_loss": -25.926273345947266, "global_step": 477668, "epoch": 5755} {"train_loss": -26.331201553344727, "global_step": 477669, "epoch": 5755} {"train_loss": -26.157861709594727, "global_step": 477670, "epoch": 5755} {"train_loss": -26.1580753326416, "global_step": 477671, "epoch": 5755} {"train_loss": -26.602462768554688, "global_step": 477672, "epoch": 5755} {"train_loss": -26.21087646484375, "global_step": 477673, "epoch": 5755} {"train_loss": -27.05084800720215, "global_step": 477674, "epoch": 5755} {"train_loss": -26.5104923248291, "global_step": 477675, "epoch": 5755} {"train_loss": -26.523828506469727, "global_step": 477676, "epoch": 5755} {"train_loss": -26.927499771118164, "global_step": 477677, "epoch": 5755} {"train_loss": -26.42254066467285, "global_step": 477678, "epoch": 5755} {"train_loss": -26.745595932006836, "global_step": 477679, "epoch": 5755} {"train_loss": -26.626874923706055, "global_step": 477680, "epoch": 5755} {"train_loss": -26.7971248626709, "global_step": 477681, "epoch": 5755} {"train_loss": -26.879444122314453, "global_step": 477682, "epoch": 5755} {"train_loss": -26.64501953125, "global_step": 477683, "epoch": 5755} {"train_loss": -27.404144287109375, "global_step": 477684, "epoch": 5755} {"train_loss": -26.846038818359375, "global_step": 477685, "epoch": 5755} {"train_loss": -26.798608779907227, "global_step": 477686, "epoch": 5755} {"train_loss": -26.878528594970703, "global_step": 477687, "epoch": 5755} {"train_loss": -27.11834144592285, "global_step": 477688, "epoch": 5755} {"train_loss": -27.207223892211914, "global_step": 477689, "epoch": 5755} {"train_loss": -26.86036491394043, "global_step": 477690, "epoch": 5755} {"train_loss": -26.907611846923828, "global_step": 477691, "epoch": 5755} {"train_loss": -27.329870223999023, "global_step": 477692, "epoch": 5755} {"train_loss": -27.0958251953125, "global_step": 477693, "epoch": 5755} {"train_loss": -26.8994140625, "global_step": 477694, "epoch": 5755} {"train_loss": -27.204614639282227, "global_step": 477695, "epoch": 5755} {"train_loss": -27.136098861694336, "global_step": 477696, "epoch": 5755} {"train_loss": -27.062713623046875, "global_step": 477697, "epoch": 5755} {"train_loss": -27.300445556640625, "global_step": 477698, "epoch": 5755} {"train_loss": -27.184833526611328, "global_step": 477699, "epoch": 5755} {"train_loss": -27.168136596679688, "global_step": 477700, "epoch": 5755} {"train_loss": -27.114673614501953, "global_step": 477701, "epoch": 5755} {"train_loss": -27.209318161010742, "global_step": 477702, "epoch": 5755} {"train_loss": -27.165454864501953, "global_step": 477703, "epoch": 5755} {"train_loss": -27.038990020751953, "global_step": 477704, "epoch": 5755} {"train_loss": -27.56442642211914, "global_step": 477705, "epoch": 5755} {"train_loss": -26.782697677612305, "global_step": 477706, "epoch": 5755} {"train_loss": -27.457061767578125, "global_step": 477707, "epoch": 5755} {"train_loss": -26.97639274597168, "global_step": 477708, "epoch": 5755} {"train_loss": -27.318429946899414, "global_step": 477709, "epoch": 5755} {"train_loss": -27.055627822875977, "global_step": 477710, "epoch": 5755} {"train_loss": -27.26189613342285, "global_step": 477711, "epoch": 5755} {"train_loss": -27.182565689086914, "global_step": 477712, "epoch": 5755} {"train_loss": -27.307601928710938, "global_step": 477713, "epoch": 5755} {"train_loss": -27.409238815307617, "global_step": 477714, "epoch": 5755} {"train_loss": -27.513818740844727, "global_step": 477715, "epoch": 5755} {"train_loss": -27.428573608398438, "global_step": 477716, "epoch": 5755} {"train_loss": -27.27906608581543, "global_step": 477717, "epoch": 5755} {"train_loss": -27.358327865600586, "global_step": 477718, "epoch": 5755} {"train_loss": -27.49318504333496, "global_step": 477719, "epoch": 5755} {"train_loss": -27.38134765625, "global_step": 477720, "epoch": 5755} {"train_loss": -27.095813751220703, "global_step": 477721, "epoch": 5755} {"train_loss": -26.781335830688477, "global_step": 477722, "epoch": 5755} {"train_loss": -27.681318283081055, "global_step": 477723, "epoch": 5755} {"train_loss": -27.33837890625, "global_step": 477724, "epoch": 5755} {"train_loss": -27.6673641204834, "global_step": 477725, "epoch": 5755} {"train_loss": -27.327512741088867, "global_step": 477726, "epoch": 5755} {"train_loss": -26.919204711914062, "global_step": 477727, "epoch": 5755} {"train_loss": -27.2298526763916, "global_step": 477728, "epoch": 5755} {"train_loss": -27.66267967224121, "global_step": 477729, "epoch": 5755} {"train_loss": -27.3762149810791, "global_step": 477730, "epoch": 5755} {"train_loss": -27.51222038269043, "global_step": 477731, "epoch": 5755} {"train_loss": -27.6424503326416, "global_step": 477732, "epoch": 5755} {"train_loss": -27.175907135009766, "global_step": 477733, "epoch": 5755} {"train_loss": -26.79926872253418, "global_step": 477734, "epoch": 5755} {"train_loss": -27.22475242614746, "global_step": 477735, "epoch": 5755} {"train_loss": -27.16663932800293, "global_step": 477736, "epoch": 5755} {"train_loss": -27.335111618041992, "global_step": 477737, "epoch": 5755} {"train_loss": -26.976720809936523, "global_step": 477738, "epoch": 5755} {"train_loss": -27.0604305267334, "global_step": 477739, "epoch": 5755} {"train_loss": -27.159704208374023, "global_step": 477740, "epoch": 5755} {"train_loss": -27.76846694946289, "global_step": 477741, "epoch": 5755} {"train_loss": -27.386808395385742, "global_step": 477742, "epoch": 5755} {"train_loss": -27.190750122070312, "global_step": 477743, "epoch": 5755} {"train_loss": -27.209136962890625, "global_step": 477744, "epoch": 5755} {"train_loss": -27.4549503326416, "global_step": 477745, "epoch": 5755} {"train_loss": -27.388153076171875, "global_step": 477746, "epoch": 5755} {"train_loss": -27.04002885933382, "global_step": 477747, "epoch": 5755, "val_loss": 6747983.0} {"train_loss": -24.482643127441406, "global_step": 477748, "epoch": 5756} {"train_loss": -23.50851821899414, "global_step": 477749, "epoch": 5756} {"train_loss": -21.979551315307617, "global_step": 477750, "epoch": 5756} {"train_loss": -24.61709976196289, "global_step": 477751, "epoch": 5756} {"train_loss": -25.238615036010742, "global_step": 477752, "epoch": 5756} {"train_loss": -24.259355545043945, "global_step": 477753, "epoch": 5756} {"train_loss": -25.192142486572266, "global_step": 477754, "epoch": 5756} {"train_loss": -24.911094665527344, "global_step": 477755, "epoch": 5756} {"train_loss": -25.084558486938477, "global_step": 477756, "epoch": 5756} {"train_loss": -25.148529052734375, "global_step": 477757, "epoch": 5756} {"train_loss": -24.898706436157227, "global_step": 477758, "epoch": 5756} {"train_loss": -25.32733726501465, "global_step": 477759, "epoch": 5756} {"train_loss": -25.55989646911621, "global_step": 477760, "epoch": 5756} {"train_loss": -25.402679443359375, "global_step": 477761, "epoch": 5756} {"train_loss": -26.035480499267578, "global_step": 477762, "epoch": 5756} {"train_loss": -25.60735511779785, "global_step": 477763, "epoch": 5756} {"train_loss": -25.858932495117188, "global_step": 477764, "epoch": 5756} {"train_loss": -26.285375595092773, "global_step": 477765, "epoch": 5756} {"train_loss": -25.905658721923828, "global_step": 477766, "epoch": 5756} {"train_loss": -26.3182430267334, "global_step": 477767, "epoch": 5756} {"train_loss": -25.9507999420166, "global_step": 477768, "epoch": 5756} {"train_loss": -26.0589599609375, "global_step": 477769, "epoch": 5756} {"train_loss": -26.070409774780273, "global_step": 477770, "epoch": 5756} {"train_loss": -26.29035758972168, "global_step": 477771, "epoch": 5756} {"train_loss": -26.259748458862305, "global_step": 477772, "epoch": 5756} {"train_loss": -26.511648178100586, "global_step": 477773, "epoch": 5756} {"train_loss": -26.30527687072754, "global_step": 477774, "epoch": 5756} {"train_loss": -26.22022819519043, "global_step": 477775, "epoch": 5756} {"train_loss": -26.617902755737305, "global_step": 477776, "epoch": 5756} {"train_loss": -26.634775161743164, "global_step": 477777, "epoch": 5756} {"train_loss": -26.2586669921875, "global_step": 477778, "epoch": 5756} {"train_loss": -26.642383575439453, "global_step": 477779, "epoch": 5756} {"train_loss": -26.40437889099121, "global_step": 477780, "epoch": 5756} {"train_loss": -26.711984634399414, "global_step": 477781, "epoch": 5756} {"train_loss": -26.516101837158203, "global_step": 477782, "epoch": 5756} {"train_loss": -26.780195236206055, "global_step": 477783, "epoch": 5756} {"train_loss": -26.55164909362793, "global_step": 477784, "epoch": 5756} {"train_loss": -26.584348678588867, "global_step": 477785, "epoch": 5756} {"train_loss": -26.585901260375977, "global_step": 477786, "epoch": 5756} {"train_loss": -26.965681076049805, "global_step": 477787, "epoch": 5756} {"train_loss": -27.00056266784668, "global_step": 477788, "epoch": 5756} {"train_loss": -26.849872589111328, "global_step": 477789, "epoch": 5756} {"train_loss": -26.72751235961914, "global_step": 477790, "epoch": 5756} {"train_loss": -27.11277198791504, "global_step": 477791, "epoch": 5756} {"train_loss": -26.6430721282959, "global_step": 477792, "epoch": 5756} {"train_loss": -26.812524795532227, "global_step": 477793, "epoch": 5756} {"train_loss": -27.116825103759766, "global_step": 477794, "epoch": 5756} {"train_loss": -27.0781307220459, "global_step": 477795, "epoch": 5756} {"train_loss": -27.19062614440918, "global_step": 477796, "epoch": 5756} {"train_loss": -27.256559371948242, "global_step": 477797, "epoch": 5756} {"train_loss": -27.52787208557129, "global_step": 477798, "epoch": 5756} {"train_loss": -26.961729049682617, "global_step": 477799, "epoch": 5756} {"train_loss": -27.245153427124023, "global_step": 477800, "epoch": 5756} {"train_loss": -26.755908966064453, "global_step": 477801, "epoch": 5756} {"train_loss": -27.185083389282227, "global_step": 477802, "epoch": 5756} {"train_loss": -27.393848419189453, "global_step": 477803, "epoch": 5756} {"train_loss": -26.899433135986328, "global_step": 477804, "epoch": 5756} {"train_loss": -27.41034507751465, "global_step": 477805, "epoch": 5756} {"train_loss": -27.35587501525879, "global_step": 477806, "epoch": 5756} {"train_loss": -26.737258911132812, "global_step": 477807, "epoch": 5756} {"train_loss": -26.87993812561035, "global_step": 477808, "epoch": 5756} {"train_loss": -27.114337921142578, "global_step": 477809, "epoch": 5756} {"train_loss": -27.064380645751953, "global_step": 477810, "epoch": 5756} {"train_loss": -27.50333023071289, "global_step": 477811, "epoch": 5756} {"train_loss": -27.372724533081055, "global_step": 477812, "epoch": 5756} {"train_loss": -27.640161514282227, "global_step": 477813, "epoch": 5756} {"train_loss": -27.431350708007812, "global_step": 477814, "epoch": 5756} {"train_loss": -27.288801193237305, "global_step": 477815, "epoch": 5756} {"train_loss": -27.62103843688965, "global_step": 477816, "epoch": 5756} {"train_loss": -27.012195587158203, "global_step": 477817, "epoch": 5756} {"train_loss": -26.942625045776367, "global_step": 477818, "epoch": 5756} {"train_loss": -27.214399337768555, "global_step": 477819, "epoch": 5756} {"train_loss": -27.09101676940918, "global_step": 477820, "epoch": 5756} {"train_loss": -27.360300064086914, "global_step": 477821, "epoch": 5756} {"train_loss": -27.565967559814453, "global_step": 477822, "epoch": 5756} {"train_loss": -27.269702911376953, "global_step": 477823, "epoch": 5756} {"train_loss": -27.598896026611328, "global_step": 477824, "epoch": 5756} {"train_loss": -27.5560302734375, "global_step": 477825, "epoch": 5756} {"train_loss": -27.181543350219727, "global_step": 477826, "epoch": 5756} {"train_loss": -27.108057022094727, "global_step": 477827, "epoch": 5756} {"train_loss": -27.410978317260742, "global_step": 477828, "epoch": 5756} {"train_loss": -27.0606746673584, "global_step": 477829, "epoch": 5756} {"train_loss": -26.503280731568854, "global_step": 477830, "epoch": 5756, "val_loss": 6640910.0} {"train_loss": -26.906152725219727, "global_step": 477831, "epoch": 5757} {"train_loss": -26.801532745361328, "global_step": 477832, "epoch": 5757} {"train_loss": -26.84160804748535, "global_step": 477833, "epoch": 5757} {"train_loss": -26.79509925842285, "global_step": 477834, "epoch": 5757} {"train_loss": -26.604429244995117, "global_step": 477835, "epoch": 5757} {"train_loss": -26.32185935974121, "global_step": 477836, "epoch": 5757} {"train_loss": -27.111907958984375, "global_step": 477837, "epoch": 5757} {"train_loss": -26.9218692779541, "global_step": 477838, "epoch": 5757} {"train_loss": -27.21942138671875, "global_step": 477839, "epoch": 5757} {"train_loss": -26.98597526550293, "global_step": 477840, "epoch": 5757} {"train_loss": -27.04584312438965, "global_step": 477841, "epoch": 5757} {"train_loss": -27.38995361328125, "global_step": 477842, "epoch": 5757} {"train_loss": -27.25733757019043, "global_step": 477843, "epoch": 5757} {"train_loss": -26.837793350219727, "global_step": 477844, "epoch": 5757} {"train_loss": -27.155048370361328, "global_step": 477845, "epoch": 5757} {"train_loss": -27.3638916015625, "global_step": 477846, "epoch": 5757} {"train_loss": -27.548248291015625, "global_step": 477847, "epoch": 5757} {"train_loss": -27.405752182006836, "global_step": 477848, "epoch": 5757} {"train_loss": -27.387842178344727, "global_step": 477849, "epoch": 5757} {"train_loss": -27.39631462097168, "global_step": 477850, "epoch": 5757} {"train_loss": -26.962162017822266, "global_step": 477851, "epoch": 5757} {"train_loss": -26.96498680114746, "global_step": 477852, "epoch": 5757} {"train_loss": -27.426862716674805, "global_step": 477853, "epoch": 5757} {"train_loss": -27.14948844909668, "global_step": 477854, "epoch": 5757} {"train_loss": -27.4074649810791, "global_step": 477855, "epoch": 5757} {"train_loss": -27.146530151367188, "global_step": 477856, "epoch": 5757} {"train_loss": -27.027021408081055, "global_step": 477857, "epoch": 5757} {"train_loss": -26.962173461914062, "global_step": 477858, "epoch": 5757} {"train_loss": -26.79376220703125, "global_step": 477859, "epoch": 5757} {"train_loss": -27.368350982666016, "global_step": 477860, "epoch": 5757} {"train_loss": -26.983779907226562, "global_step": 477861, "epoch": 5757} {"train_loss": -27.2587947845459, "global_step": 477862, "epoch": 5757} {"train_loss": -27.277692794799805, "global_step": 477863, "epoch": 5757} {"train_loss": -27.34746742248535, "global_step": 477864, "epoch": 5757} {"train_loss": -27.51043128967285, "global_step": 477865, "epoch": 5757} {"train_loss": -27.366559982299805, "global_step": 477866, "epoch": 5757} {"train_loss": -27.16041374206543, "global_step": 477867, "epoch": 5757} {"train_loss": -27.310087203979492, "global_step": 477868, "epoch": 5757} {"train_loss": -27.227262496948242, "global_step": 477869, "epoch": 5757} {"train_loss": -27.6780948638916, "global_step": 477870, "epoch": 5757} {"train_loss": -27.182714462280273, "global_step": 477871, "epoch": 5757} {"train_loss": -27.672855377197266, "global_step": 477872, "epoch": 5757} {"train_loss": -27.1448974609375, "global_step": 477873, "epoch": 5757} {"train_loss": -27.485509872436523, "global_step": 477874, "epoch": 5757} {"train_loss": -27.48713493347168, "global_step": 477875, "epoch": 5757} {"train_loss": -27.293996810913086, "global_step": 477876, "epoch": 5757} {"train_loss": -27.40180015563965, "global_step": 477877, "epoch": 5757} {"train_loss": -27.404455184936523, "global_step": 477878, "epoch": 5757} {"train_loss": -27.417724609375, "global_step": 477879, "epoch": 5757} {"train_loss": -27.398595809936523, "global_step": 477880, "epoch": 5757} {"train_loss": -27.47796058654785, "global_step": 477881, "epoch": 5757} {"train_loss": -27.20987892150879, "global_step": 477882, "epoch": 5757} {"train_loss": -27.313556671142578, "global_step": 477883, "epoch": 5757} {"train_loss": -27.2590274810791, "global_step": 477884, "epoch": 5757} {"train_loss": -27.239450454711914, "global_step": 477885, "epoch": 5757} {"train_loss": -27.469633102416992, "global_step": 477886, "epoch": 5757} {"train_loss": -27.589813232421875, "global_step": 477887, "epoch": 5757} {"train_loss": -27.63006591796875, "global_step": 477888, "epoch": 5757} {"train_loss": -27.23703956604004, "global_step": 477889, "epoch": 5757} {"train_loss": -27.86341667175293, "global_step": 477890, "epoch": 5757} {"train_loss": -27.156452178955078, "global_step": 477891, "epoch": 5757} {"train_loss": -27.085412979125977, "global_step": 477892, "epoch": 5757} {"train_loss": -27.217153549194336, "global_step": 477893, "epoch": 5757} {"train_loss": -27.32608985900879, "global_step": 477894, "epoch": 5757} {"train_loss": -27.652236938476562, "global_step": 477895, "epoch": 5757} {"train_loss": -27.395187377929688, "global_step": 477896, "epoch": 5757} {"train_loss": -27.126697540283203, "global_step": 477897, "epoch": 5757} {"train_loss": -26.901687622070312, "global_step": 477898, "epoch": 5757} {"train_loss": -26.943683624267578, "global_step": 477899, "epoch": 5757} {"train_loss": -27.41552734375, "global_step": 477900, "epoch": 5757} {"train_loss": -26.996540069580078, "global_step": 477901, "epoch": 5757} {"train_loss": -26.757343292236328, "global_step": 477902, "epoch": 5757} {"train_loss": -26.981220245361328, "global_step": 477903, "epoch": 5757} {"train_loss": -27.218704223632812, "global_step": 477904, "epoch": 5757} {"train_loss": -27.029254913330078, "global_step": 477905, "epoch": 5757} {"train_loss": -26.860986709594727, "global_step": 477906, "epoch": 5757} {"train_loss": -27.239606857299805, "global_step": 477907, "epoch": 5757} {"train_loss": -27.336389541625977, "global_step": 477908, "epoch": 5757} {"train_loss": -27.0062313079834, "global_step": 477909, "epoch": 5757} {"train_loss": -27.2452335357666, "global_step": 477910, "epoch": 5757} {"train_loss": -26.693830490112305, "global_step": 477911, "epoch": 5757} {"train_loss": -27.298269271850586, "global_step": 477912, "epoch": 5757} {"train_loss": -27.19328326489552, "global_step": 477913, "epoch": 5757, "val_loss": 6484238.0} {"train_loss": -24.910945892333984, "global_step": 477914, "epoch": 5758} {"train_loss": -24.508872985839844, "global_step": 477915, "epoch": 5758} {"train_loss": -26.051828384399414, "global_step": 477916, "epoch": 5758} {"train_loss": -24.849689483642578, "global_step": 477917, "epoch": 5758} {"train_loss": -25.154775619506836, "global_step": 477918, "epoch": 5758} {"train_loss": -26.679950714111328, "global_step": 477919, "epoch": 5758} {"train_loss": -25.98272705078125, "global_step": 477920, "epoch": 5758} {"train_loss": -25.537948608398438, "global_step": 477921, "epoch": 5758} {"train_loss": -25.71003532409668, "global_step": 477922, "epoch": 5758} {"train_loss": -25.946826934814453, "global_step": 477923, "epoch": 5758} {"train_loss": -26.19365882873535, "global_step": 477924, "epoch": 5758} {"train_loss": -26.322616577148438, "global_step": 477925, "epoch": 5758} {"train_loss": -26.41868019104004, "global_step": 477926, "epoch": 5758} {"train_loss": -25.717580795288086, "global_step": 477927, "epoch": 5758} {"train_loss": -26.336597442626953, "global_step": 477928, "epoch": 5758} {"train_loss": -26.290143966674805, "global_step": 477929, "epoch": 5758} {"train_loss": -26.613311767578125, "global_step": 477930, "epoch": 5758} {"train_loss": -26.357685089111328, "global_step": 477931, "epoch": 5758} {"train_loss": -26.39837646484375, "global_step": 477932, "epoch": 5758} {"train_loss": -26.03376579284668, "global_step": 477933, "epoch": 5758} {"train_loss": -26.560791015625, "global_step": 477934, "epoch": 5758} {"train_loss": -26.540159225463867, "global_step": 477935, "epoch": 5758} {"train_loss": -26.944501876831055, "global_step": 477936, "epoch": 5758} {"train_loss": -26.469358444213867, "global_step": 477937, "epoch": 5758} {"train_loss": -26.227582931518555, "global_step": 477938, "epoch": 5758} {"train_loss": -26.909748077392578, "global_step": 477939, "epoch": 5758} {"train_loss": -26.7314510345459, "global_step": 477940, "epoch": 5758} {"train_loss": -26.872909545898438, "global_step": 477941, "epoch": 5758} {"train_loss": -26.433002471923828, "global_step": 477942, "epoch": 5758} {"train_loss": -27.199981689453125, "global_step": 477943, "epoch": 5758} {"train_loss": -26.480215072631836, "global_step": 477944, "epoch": 5758} {"train_loss": -27.10820960998535, "global_step": 477945, "epoch": 5758} {"train_loss": -26.97247314453125, "global_step": 477946, "epoch": 5758} {"train_loss": -27.033660888671875, "global_step": 477947, "epoch": 5758} {"train_loss": -26.856048583984375, "global_step": 477948, "epoch": 5758} {"train_loss": -26.82566261291504, "global_step": 477949, "epoch": 5758} {"train_loss": -26.896757125854492, "global_step": 477950, "epoch": 5758} {"train_loss": -26.752676010131836, "global_step": 477951, "epoch": 5758} {"train_loss": -27.491186141967773, "global_step": 477952, "epoch": 5758} {"train_loss": -26.9595947265625, "global_step": 477953, "epoch": 5758} {"train_loss": -26.785720825195312, "global_step": 477954, "epoch": 5758} {"train_loss": -27.122167587280273, "global_step": 477955, "epoch": 5758} {"train_loss": -27.088214874267578, "global_step": 477956, "epoch": 5758} {"train_loss": -26.978092193603516, "global_step": 477957, "epoch": 5758} {"train_loss": -27.169971466064453, "global_step": 477958, "epoch": 5758} {"train_loss": -26.963336944580078, "global_step": 477959, "epoch": 5758} {"train_loss": -26.917560577392578, "global_step": 477960, "epoch": 5758} {"train_loss": -27.026477813720703, "global_step": 477961, "epoch": 5758} {"train_loss": -26.933094024658203, "global_step": 477962, "epoch": 5758} {"train_loss": -27.502655029296875, "global_step": 477963, "epoch": 5758} {"train_loss": -27.3593692779541, "global_step": 477964, "epoch": 5758} {"train_loss": -27.008380889892578, "global_step": 477965, "epoch": 5758} {"train_loss": -27.17950439453125, "global_step": 477966, "epoch": 5758} {"train_loss": -27.423206329345703, "global_step": 477967, "epoch": 5758} {"train_loss": -27.227651596069336, "global_step": 477968, "epoch": 5758} {"train_loss": -27.3826847076416, "global_step": 477969, "epoch": 5758} {"train_loss": -27.230466842651367, "global_step": 477970, "epoch": 5758} {"train_loss": -27.426239013671875, "global_step": 477971, "epoch": 5758} {"train_loss": -26.98297691345215, "global_step": 477972, "epoch": 5758} {"train_loss": -26.972196578979492, "global_step": 477973, "epoch": 5758} {"train_loss": -27.049673080444336, "global_step": 477974, "epoch": 5758} {"train_loss": -27.643402099609375, "global_step": 477975, "epoch": 5758} {"train_loss": -26.855133056640625, "global_step": 477976, "epoch": 5758} {"train_loss": -26.8678035736084, "global_step": 477977, "epoch": 5758} {"train_loss": -27.393463134765625, "global_step": 477978, "epoch": 5758} {"train_loss": -26.91696548461914, "global_step": 477979, "epoch": 5758} {"train_loss": -27.1154842376709, "global_step": 477980, "epoch": 5758} {"train_loss": -26.8795166015625, "global_step": 477981, "epoch": 5758} {"train_loss": -26.6959228515625, "global_step": 477982, "epoch": 5758} {"train_loss": -26.98707389831543, "global_step": 477983, "epoch": 5758} {"train_loss": -27.164031982421875, "global_step": 477984, "epoch": 5758} {"train_loss": -26.766775131225586, "global_step": 477985, "epoch": 5758} {"train_loss": -27.106260299682617, "global_step": 477986, "epoch": 5758} {"train_loss": -27.02204704284668, "global_step": 477987, "epoch": 5758} {"train_loss": -26.92584800720215, "global_step": 477988, "epoch": 5758} {"train_loss": -27.562841415405273, "global_step": 477989, "epoch": 5758} {"train_loss": -26.852081298828125, "global_step": 477990, "epoch": 5758} {"train_loss": -27.21685791015625, "global_step": 477991, "epoch": 5758} {"train_loss": -27.20212745666504, "global_step": 477992, "epoch": 5758} {"train_loss": -26.927631378173828, "global_step": 477993, "epoch": 5758} {"train_loss": -27.154611587524414, "global_step": 477994, "epoch": 5758} {"train_loss": -26.97771644592285, "global_step": 477995, "epoch": 5758} {"train_loss": -26.745646534195867, "global_step": 477996, "epoch": 5758, "val_loss": 6613277.0} {"train_loss": -26.687475204467773, "global_step": 477997, "epoch": 5759} {"train_loss": -27.061954498291016, "global_step": 477998, "epoch": 5759} {"train_loss": -26.99983787536621, "global_step": 477999, "epoch": 5759} {"train_loss": -27.067235946655273, "global_step": 478000, "epoch": 5759} {"train_loss": -27.161649703979492, "global_step": 478001, "epoch": 5759} {"train_loss": -26.97364616394043, "global_step": 478002, "epoch": 5759} {"train_loss": -27.119430541992188, "global_step": 478003, "epoch": 5759} {"train_loss": -27.208984375, "global_step": 478004, "epoch": 5759} {"train_loss": -26.858179092407227, "global_step": 478005, "epoch": 5759} {"train_loss": -27.228900909423828, "global_step": 478006, "epoch": 5759} {"train_loss": -27.014575958251953, "global_step": 478007, "epoch": 5759} {"train_loss": -27.0018367767334, "global_step": 478008, "epoch": 5759} {"train_loss": -26.997156143188477, "global_step": 478009, "epoch": 5759} {"train_loss": -27.150623321533203, "global_step": 478010, "epoch": 5759} {"train_loss": -27.081226348876953, "global_step": 478011, "epoch": 5759} {"train_loss": -26.905622482299805, "global_step": 478012, "epoch": 5759} {"train_loss": -26.859033584594727, "global_step": 478013, "epoch": 5759} {"train_loss": -27.346622467041016, "global_step": 478014, "epoch": 5759} {"train_loss": -26.93929100036621, "global_step": 478015, "epoch": 5759} {"train_loss": -27.471487045288086, "global_step": 478016, "epoch": 5759} {"train_loss": -27.11329460144043, "global_step": 478017, "epoch": 5759} {"train_loss": -27.567291259765625, "global_step": 478018, "epoch": 5759} {"train_loss": -27.299732208251953, "global_step": 478019, "epoch": 5759} {"train_loss": -27.17938232421875, "global_step": 478020, "epoch": 5759} {"train_loss": -27.30194091796875, "global_step": 478021, "epoch": 5759} {"train_loss": -27.328100204467773, "global_step": 478022, "epoch": 5759} {"train_loss": -27.274398803710938, "global_step": 478023, "epoch": 5759} {"train_loss": -27.35309410095215, "global_step": 478024, "epoch": 5759} {"train_loss": -27.21506690979004, "global_step": 478025, "epoch": 5759} {"train_loss": -27.358566284179688, "global_step": 478026, "epoch": 5759} {"train_loss": -27.198490142822266, "global_step": 478027, "epoch": 5759} {"train_loss": -27.366186141967773, "global_step": 478028, "epoch": 5759} {"train_loss": -27.327619552612305, "global_step": 478029, "epoch": 5759} {"train_loss": -27.493680953979492, "global_step": 478030, "epoch": 5759} {"train_loss": -27.45936393737793, "global_step": 478031, "epoch": 5759} {"train_loss": -27.113981246948242, "global_step": 478032, "epoch": 5759} {"train_loss": -27.120697021484375, "global_step": 478033, "epoch": 5759} {"train_loss": -27.37635612487793, "global_step": 478034, "epoch": 5759} {"train_loss": -27.44135856628418, "global_step": 478035, "epoch": 5759} {"train_loss": -27.485919952392578, "global_step": 478036, "epoch": 5759} {"train_loss": -27.169504165649414, "global_step": 478037, "epoch": 5759} {"train_loss": -27.089710235595703, "global_step": 478038, "epoch": 5759} {"train_loss": -27.45796012878418, "global_step": 478039, "epoch": 5759} {"train_loss": -27.304645538330078, "global_step": 478040, "epoch": 5759} {"train_loss": -27.627872467041016, "global_step": 478041, "epoch": 5759} {"train_loss": -27.0689697265625, "global_step": 478042, "epoch": 5759} {"train_loss": -26.898847579956055, "global_step": 478043, "epoch": 5759} {"train_loss": -27.3684024810791, "global_step": 478044, "epoch": 5759} {"train_loss": -27.127090454101562, "global_step": 478045, "epoch": 5759} {"train_loss": -27.114309310913086, "global_step": 478046, "epoch": 5759} {"train_loss": -27.0398006439209, "global_step": 478047, "epoch": 5759} {"train_loss": -27.118871688842773, "global_step": 478048, "epoch": 5759} {"train_loss": -27.198644638061523, "global_step": 478049, "epoch": 5759} {"train_loss": -27.382673263549805, "global_step": 478050, "epoch": 5759} {"train_loss": -27.168588638305664, "global_step": 478051, "epoch": 5759} {"train_loss": -27.432453155517578, "global_step": 478052, "epoch": 5759} {"train_loss": -26.838733673095703, "global_step": 478053, "epoch": 5759} {"train_loss": -27.102344512939453, "global_step": 478054, "epoch": 5759} {"train_loss": -26.328369140625, "global_step": 478055, "epoch": 5759} {"train_loss": -27.41631507873535, "global_step": 478056, "epoch": 5759} {"train_loss": -27.532745361328125, "global_step": 478057, "epoch": 5759} {"train_loss": -27.04922866821289, "global_step": 478058, "epoch": 5759} {"train_loss": -27.216995239257812, "global_step": 478059, "epoch": 5759} {"train_loss": -27.398176193237305, "global_step": 478060, "epoch": 5759} {"train_loss": -27.108367919921875, "global_step": 478061, "epoch": 5759} {"train_loss": -27.160175323486328, "global_step": 478062, "epoch": 5759} {"train_loss": -27.17362403869629, "global_step": 478063, "epoch": 5759} {"train_loss": -27.307947158813477, "global_step": 478064, "epoch": 5759} {"train_loss": -27.263992309570312, "global_step": 478065, "epoch": 5759} {"train_loss": -27.578521728515625, "global_step": 478066, "epoch": 5759} {"train_loss": -27.138792037963867, "global_step": 478067, "epoch": 5759} {"train_loss": -27.3643856048584, "global_step": 478068, "epoch": 5759} {"train_loss": -27.471521377563477, "global_step": 478069, "epoch": 5759} {"train_loss": -27.538196563720703, "global_step": 478070, "epoch": 5759} {"train_loss": -27.30438232421875, "global_step": 478071, "epoch": 5759} {"train_loss": -27.52936363220215, "global_step": 478072, "epoch": 5759} {"train_loss": -27.13266944885254, "global_step": 478073, "epoch": 5759} {"train_loss": -27.37287712097168, "global_step": 478074, "epoch": 5759} {"train_loss": -27.258581161499023, "global_step": 478075, "epoch": 5759} {"train_loss": -27.71626091003418, "global_step": 478076, "epoch": 5759} {"train_loss": -27.394697189331055, "global_step": 478077, "epoch": 5759} {"train_loss": -27.082178115844727, "global_step": 478078, "epoch": 5759} {"train_loss": -27.208052531782403, "global_step": 478079, "epoch": 5759, "val_loss": 6445371.0} {"train_loss": -25.923810958862305, "global_step": 478080, "epoch": 5760} {"train_loss": -25.955890655517578, "global_step": 478081, "epoch": 5760} {"train_loss": -25.873886108398438, "global_step": 478082, "epoch": 5760} {"train_loss": -26.0229434967041, "global_step": 478083, "epoch": 5760} {"train_loss": -26.01222801208496, "global_step": 478084, "epoch": 5760} {"train_loss": -25.22317123413086, "global_step": 478085, "epoch": 5760} {"train_loss": -25.8526668548584, "global_step": 478086, "epoch": 5760} {"train_loss": -25.758203506469727, "global_step": 478087, "epoch": 5760} {"train_loss": -26.61905860900879, "global_step": 478088, "epoch": 5760} {"train_loss": -26.292770385742188, "global_step": 478089, "epoch": 5760} {"train_loss": -26.553882598876953, "global_step": 478090, "epoch": 5760} {"train_loss": -26.59307861328125, "global_step": 478091, "epoch": 5760} {"train_loss": -26.400415420532227, "global_step": 478092, "epoch": 5760} {"train_loss": -26.32197380065918, "global_step": 478093, "epoch": 5760} {"train_loss": -26.355493545532227, "global_step": 478094, "epoch": 5760} {"train_loss": -26.46897315979004, "global_step": 478095, "epoch": 5760} {"train_loss": -26.715280532836914, "global_step": 478096, "epoch": 5760} {"train_loss": -26.57014274597168, "global_step": 478097, "epoch": 5760} {"train_loss": -26.71518898010254, "global_step": 478098, "epoch": 5760} {"train_loss": -26.5516414642334, "global_step": 478099, "epoch": 5760} {"train_loss": -26.545392990112305, "global_step": 478100, "epoch": 5760} {"train_loss": -26.810626983642578, "global_step": 478101, "epoch": 5760} {"train_loss": -26.652088165283203, "global_step": 478102, "epoch": 5760} {"train_loss": -26.770984649658203, "global_step": 478103, "epoch": 5760} {"train_loss": -27.113183975219727, "global_step": 478104, "epoch": 5760} {"train_loss": -26.703601837158203, "global_step": 478105, "epoch": 5760} {"train_loss": -27.096969604492188, "global_step": 478106, "epoch": 5760} {"train_loss": -26.73244285583496, "global_step": 478107, "epoch": 5760} {"train_loss": -27.287551879882812, "global_step": 478108, "epoch": 5760} {"train_loss": -27.250829696655273, "global_step": 478109, "epoch": 5760} {"train_loss": -27.232343673706055, "global_step": 478110, "epoch": 5760} {"train_loss": -27.18709373474121, "global_step": 478111, "epoch": 5760} {"train_loss": -27.26856803894043, "global_step": 478112, "epoch": 5760} {"train_loss": -27.14414405822754, "global_step": 478113, "epoch": 5760} {"train_loss": -26.928253173828125, "global_step": 478114, "epoch": 5760} {"train_loss": -27.05704116821289, "global_step": 478115, "epoch": 5760} {"train_loss": -27.035968780517578, "global_step": 478116, "epoch": 5760} {"train_loss": -27.376001358032227, "global_step": 478117, "epoch": 5760} {"train_loss": -27.3331356048584, "global_step": 478118, "epoch": 5760} {"train_loss": -27.5100154876709, "global_step": 478119, "epoch": 5760} {"train_loss": -27.21380043029785, "global_step": 478120, "epoch": 5760} {"train_loss": -27.183740615844727, "global_step": 478121, "epoch": 5760} {"train_loss": -27.184728622436523, "global_step": 478122, "epoch": 5760} {"train_loss": -27.09645652770996, "global_step": 478123, "epoch": 5760} {"train_loss": -27.339818954467773, "global_step": 478124, "epoch": 5760} {"train_loss": -26.9300594329834, "global_step": 478125, "epoch": 5760} {"train_loss": -27.349613189697266, "global_step": 478126, "epoch": 5760} {"train_loss": -27.0801944732666, "global_step": 478127, "epoch": 5760} {"train_loss": -27.253116607666016, "global_step": 478128, "epoch": 5760} {"train_loss": -27.34357261657715, "global_step": 478129, "epoch": 5760} {"train_loss": -27.115436553955078, "global_step": 478130, "epoch": 5760} {"train_loss": -27.107898712158203, "global_step": 478131, "epoch": 5760} {"train_loss": -27.31511878967285, "global_step": 478132, "epoch": 5760} {"train_loss": -27.278629302978516, "global_step": 478133, "epoch": 5760} {"train_loss": -27.36431312561035, "global_step": 478134, "epoch": 5760} {"train_loss": -27.582555770874023, "global_step": 478135, "epoch": 5760} {"train_loss": -27.31683921813965, "global_step": 478136, "epoch": 5760} {"train_loss": -27.045886993408203, "global_step": 478137, "epoch": 5760} {"train_loss": -27.34539794921875, "global_step": 478138, "epoch": 5760} {"train_loss": -27.14521598815918, "global_step": 478139, "epoch": 5760} {"train_loss": -27.08321189880371, "global_step": 478140, "epoch": 5760} {"train_loss": -27.4493350982666, "global_step": 478141, "epoch": 5760} {"train_loss": -27.48362159729004, "global_step": 478142, "epoch": 5760} {"train_loss": -27.375043869018555, "global_step": 478143, "epoch": 5760} {"train_loss": -27.152652740478516, "global_step": 478144, "epoch": 5760} {"train_loss": -27.367019653320312, "global_step": 478145, "epoch": 5760} {"train_loss": -26.781787872314453, "global_step": 478146, "epoch": 5760} {"train_loss": -26.715930938720703, "global_step": 478147, "epoch": 5760} {"train_loss": -26.948699951171875, "global_step": 478148, "epoch": 5760} {"train_loss": -26.983015060424805, "global_step": 478149, "epoch": 5760} {"train_loss": -27.0196533203125, "global_step": 478150, "epoch": 5760} {"train_loss": -26.97541618347168, "global_step": 478151, "epoch": 5760} {"train_loss": -27.193567276000977, "global_step": 478152, "epoch": 5760} {"train_loss": -27.2640323638916, "global_step": 478153, "epoch": 5760} {"train_loss": -26.650129318237305, "global_step": 478154, "epoch": 5760} {"train_loss": -27.21462059020996, "global_step": 478155, "epoch": 5760} {"train_loss": -27.18438720703125, "global_step": 478156, "epoch": 5760} {"train_loss": -26.899137496948242, "global_step": 478157, "epoch": 5760} {"train_loss": -27.121536254882812, "global_step": 478158, "epoch": 5760} {"train_loss": -27.189208984375, "global_step": 478159, "epoch": 5760} {"train_loss": -26.750463485717773, "global_step": 478160, "epoch": 5760} {"train_loss": -27.4268856048584, "global_step": 478161, "epoch": 5760} {"train_loss": -26.91385112900332, "global_step": 478162, "epoch": 5760, "val_loss": 6614304.0} {"train_loss": -26.601499557495117, "global_step": 478163, "epoch": 5761} {"train_loss": -26.81930923461914, "global_step": 478164, "epoch": 5761} {"train_loss": -26.40704345703125, "global_step": 478165, "epoch": 5761} {"train_loss": -26.76936149597168, "global_step": 478166, "epoch": 5761} {"train_loss": -26.490558624267578, "global_step": 478167, "epoch": 5761} {"train_loss": -26.853118896484375, "global_step": 478168, "epoch": 5761} {"train_loss": -26.593664169311523, "global_step": 478169, "epoch": 5761} {"train_loss": -27.01325035095215, "global_step": 478170, "epoch": 5761} {"train_loss": -26.911197662353516, "global_step": 478171, "epoch": 5761} {"train_loss": -26.611982345581055, "global_step": 478172, "epoch": 5761} {"train_loss": -27.280054092407227, "global_step": 478173, "epoch": 5761} {"train_loss": -26.80915641784668, "global_step": 478174, "epoch": 5761} {"train_loss": -27.089035034179688, "global_step": 478175, "epoch": 5761} {"train_loss": -26.850271224975586, "global_step": 478176, "epoch": 5761} {"train_loss": -27.081073760986328, "global_step": 478177, "epoch": 5761} {"train_loss": -27.07972526550293, "global_step": 478178, "epoch": 5761} {"train_loss": -27.29121971130371, "global_step": 478179, "epoch": 5761} {"train_loss": -27.369892120361328, "global_step": 478180, "epoch": 5761} {"train_loss": -27.398990631103516, "global_step": 478181, "epoch": 5761} {"train_loss": -27.03092384338379, "global_step": 478182, "epoch": 5761} {"train_loss": -26.855981826782227, "global_step": 478183, "epoch": 5761} {"train_loss": -27.16064453125, "global_step": 478184, "epoch": 5761} {"train_loss": -26.878026962280273, "global_step": 478185, "epoch": 5761} {"train_loss": -27.4572811126709, "global_step": 478186, "epoch": 5761} {"train_loss": -27.2305908203125, "global_step": 478187, "epoch": 5761} {"train_loss": -27.720417022705078, "global_step": 478188, "epoch": 5761} {"train_loss": -27.154470443725586, "global_step": 478189, "epoch": 5761} {"train_loss": -27.29719352722168, "global_step": 478190, "epoch": 5761} {"train_loss": -27.146162033081055, "global_step": 478191, "epoch": 5761} {"train_loss": -27.389677047729492, "global_step": 478192, "epoch": 5761} {"train_loss": -27.46646499633789, "global_step": 478193, "epoch": 5761} {"train_loss": -27.3620662689209, "global_step": 478194, "epoch": 5761} {"train_loss": -27.508127212524414, "global_step": 478195, "epoch": 5761} {"train_loss": -27.389013290405273, "global_step": 478196, "epoch": 5761} {"train_loss": -27.151248931884766, "global_step": 478197, "epoch": 5761} {"train_loss": -27.197463989257812, "global_step": 478198, "epoch": 5761} {"train_loss": -27.392358779907227, "global_step": 478199, "epoch": 5761} {"train_loss": -27.2828426361084, "global_step": 478200, "epoch": 5761} {"train_loss": -27.307783126831055, "global_step": 478201, "epoch": 5761} {"train_loss": -26.88772964477539, "global_step": 478202, "epoch": 5761} {"train_loss": -27.511865615844727, "global_step": 478203, "epoch": 5761} {"train_loss": -27.004657745361328, "global_step": 478204, "epoch": 5761} {"train_loss": -27.44223976135254, "global_step": 478205, "epoch": 5761} {"train_loss": -27.62818717956543, "global_step": 478206, "epoch": 5761} {"train_loss": -27.264968872070312, "global_step": 478207, "epoch": 5761} {"train_loss": -27.848737716674805, "global_step": 478208, "epoch": 5761} {"train_loss": -27.34210777282715, "global_step": 478209, "epoch": 5761} {"train_loss": -27.595050811767578, "global_step": 478210, "epoch": 5761} {"train_loss": -26.968786239624023, "global_step": 478211, "epoch": 5761} {"train_loss": -26.928308486938477, "global_step": 478212, "epoch": 5761} {"train_loss": -27.215890884399414, "global_step": 478213, "epoch": 5761} {"train_loss": -27.139219284057617, "global_step": 478214, "epoch": 5761} {"train_loss": -27.50177574157715, "global_step": 478215, "epoch": 5761} {"train_loss": -27.24578857421875, "global_step": 478216, "epoch": 5761} {"train_loss": -26.88306999206543, "global_step": 478217, "epoch": 5761} {"train_loss": -27.02853775024414, "global_step": 478218, "epoch": 5761} {"train_loss": -26.643386840820312, "global_step": 478219, "epoch": 5761} {"train_loss": -27.0018367767334, "global_step": 478220, "epoch": 5761} {"train_loss": -27.124958038330078, "global_step": 478221, "epoch": 5761} {"train_loss": -27.1844539642334, "global_step": 478222, "epoch": 5761} {"train_loss": -27.064865112304688, "global_step": 478223, "epoch": 5761} {"train_loss": -27.49297523498535, "global_step": 478224, "epoch": 5761} {"train_loss": -26.916202545166016, "global_step": 478225, "epoch": 5761} {"train_loss": -27.065988540649414, "global_step": 478226, "epoch": 5761} {"train_loss": -27.003965377807617, "global_step": 478227, "epoch": 5761} {"train_loss": -26.930456161499023, "global_step": 478228, "epoch": 5761} {"train_loss": -27.128652572631836, "global_step": 478229, "epoch": 5761} {"train_loss": -27.539813995361328, "global_step": 478230, "epoch": 5761} {"train_loss": -27.459671020507812, "global_step": 478231, "epoch": 5761} {"train_loss": -27.261749267578125, "global_step": 478232, "epoch": 5761} {"train_loss": -27.012487411499023, "global_step": 478233, "epoch": 5761} {"train_loss": -27.08673095703125, "global_step": 478234, "epoch": 5761} {"train_loss": -27.5468807220459, "global_step": 478235, "epoch": 5761} {"train_loss": -27.15643310546875, "global_step": 478236, "epoch": 5761} {"train_loss": -27.406503677368164, "global_step": 478237, "epoch": 5761} {"train_loss": -27.324583053588867, "global_step": 478238, "epoch": 5761} {"train_loss": -27.533079147338867, "global_step": 478239, "epoch": 5761} {"train_loss": -27.262924194335938, "global_step": 478240, "epoch": 5761} {"train_loss": -27.496702194213867, "global_step": 478241, "epoch": 5761} {"train_loss": -27.648096084594727, "global_step": 478242, "epoch": 5761} {"train_loss": -27.608417510986328, "global_step": 478243, "epoch": 5761} {"train_loss": -27.282880783081055, "global_step": 478244, "epoch": 5761} {"train_loss": -27.170394001236883, "global_step": 478245, "epoch": 5761, "val_loss": 6646732.0} {"train_loss": -26.009328842163086, "global_step": 478246, "epoch": 5762} {"train_loss": -26.47559928894043, "global_step": 478247, "epoch": 5762} {"train_loss": -27.413406372070312, "global_step": 478248, "epoch": 5762} {"train_loss": -26.00882911682129, "global_step": 478249, "epoch": 5762} {"train_loss": -26.71510124206543, "global_step": 478250, "epoch": 5762} {"train_loss": -26.316696166992188, "global_step": 478251, "epoch": 5762} {"train_loss": -26.758752822875977, "global_step": 478252, "epoch": 5762} {"train_loss": -26.412668228149414, "global_step": 478253, "epoch": 5762} {"train_loss": -26.995954513549805, "global_step": 478254, "epoch": 5762} {"train_loss": -27.133459091186523, "global_step": 478255, "epoch": 5762} {"train_loss": -26.483083724975586, "global_step": 478256, "epoch": 5762} {"train_loss": -26.86029624938965, "global_step": 478257, "epoch": 5762} {"train_loss": -26.835758209228516, "global_step": 478258, "epoch": 5762} {"train_loss": -26.887548446655273, "global_step": 478259, "epoch": 5762} {"train_loss": -26.43159294128418, "global_step": 478260, "epoch": 5762} {"train_loss": -27.086688995361328, "global_step": 478261, "epoch": 5762} {"train_loss": -27.06806755065918, "global_step": 478262, "epoch": 5762} {"train_loss": -27.31697654724121, "global_step": 478263, "epoch": 5762} {"train_loss": -27.065771102905273, "global_step": 478264, "epoch": 5762} {"train_loss": -26.83920669555664, "global_step": 478265, "epoch": 5762} {"train_loss": -27.04709243774414, "global_step": 478266, "epoch": 5762} {"train_loss": -27.065649032592773, "global_step": 478267, "epoch": 5762} {"train_loss": -27.197010040283203, "global_step": 478268, "epoch": 5762} {"train_loss": -27.08439064025879, "global_step": 478269, "epoch": 5762} {"train_loss": -27.237646102905273, "global_step": 478270, "epoch": 5762} {"train_loss": -27.05327796936035, "global_step": 478271, "epoch": 5762} {"train_loss": -27.166446685791016, "global_step": 478272, "epoch": 5762} {"train_loss": -27.286874771118164, "global_step": 478273, "epoch": 5762} {"train_loss": -26.6914119720459, "global_step": 478274, "epoch": 5762} {"train_loss": -26.833768844604492, "global_step": 478275, "epoch": 5762} {"train_loss": -26.761960983276367, "global_step": 478276, "epoch": 5762} {"train_loss": -27.2416934967041, "global_step": 478277, "epoch": 5762} {"train_loss": -26.8608341217041, "global_step": 478278, "epoch": 5762} {"train_loss": -27.346288681030273, "global_step": 478279, "epoch": 5762} {"train_loss": -27.260059356689453, "global_step": 478280, "epoch": 5762} {"train_loss": -26.78089714050293, "global_step": 478281, "epoch": 5762} {"train_loss": -27.49675941467285, "global_step": 478282, "epoch": 5762} {"train_loss": -27.399673461914062, "global_step": 478283, "epoch": 5762} {"train_loss": -26.852279663085938, "global_step": 478284, "epoch": 5762} {"train_loss": -27.42340087890625, "global_step": 478285, "epoch": 5762} {"train_loss": -27.141386032104492, "global_step": 478286, "epoch": 5762} {"train_loss": -27.428014755249023, "global_step": 478287, "epoch": 5762} {"train_loss": -27.27638053894043, "global_step": 478288, "epoch": 5762} {"train_loss": -27.195112228393555, "global_step": 478289, "epoch": 5762} {"train_loss": -26.888574600219727, "global_step": 478290, "epoch": 5762} {"train_loss": -27.340469360351562, "global_step": 478291, "epoch": 5762} {"train_loss": -27.32383155822754, "global_step": 478292, "epoch": 5762} {"train_loss": -27.286609649658203, "global_step": 478293, "epoch": 5762} {"train_loss": -27.019994735717773, "global_step": 478294, "epoch": 5762} {"train_loss": -27.510629653930664, "global_step": 478295, "epoch": 5762} {"train_loss": -27.17038917541504, "global_step": 478296, "epoch": 5762} {"train_loss": -27.200897216796875, "global_step": 478297, "epoch": 5762} {"train_loss": -27.527362823486328, "global_step": 478298, "epoch": 5762} {"train_loss": -27.577260971069336, "global_step": 478299, "epoch": 5762} {"train_loss": -26.944921493530273, "global_step": 478300, "epoch": 5762} {"train_loss": -27.479223251342773, "global_step": 478301, "epoch": 5762} {"train_loss": -27.477527618408203, "global_step": 478302, "epoch": 5762} {"train_loss": -27.151763916015625, "global_step": 478303, "epoch": 5762} {"train_loss": -27.495939254760742, "global_step": 478304, "epoch": 5762} {"train_loss": -27.14504051208496, "global_step": 478305, "epoch": 5762} {"train_loss": -27.51273536682129, "global_step": 478306, "epoch": 5762} {"train_loss": -26.651092529296875, "global_step": 478307, "epoch": 5762} {"train_loss": -26.965295791625977, "global_step": 478308, "epoch": 5762} {"train_loss": -27.079191207885742, "global_step": 478309, "epoch": 5762} {"train_loss": -27.2575740814209, "global_step": 478310, "epoch": 5762} {"train_loss": -27.374893188476562, "global_step": 478311, "epoch": 5762} {"train_loss": -26.834985733032227, "global_step": 478312, "epoch": 5762} {"train_loss": -27.12640380859375, "global_step": 478313, "epoch": 5762} {"train_loss": -27.092931747436523, "global_step": 478314, "epoch": 5762} {"train_loss": -27.361318588256836, "global_step": 478315, "epoch": 5762} {"train_loss": -27.042606353759766, "global_step": 478316, "epoch": 5762} {"train_loss": -26.9455509185791, "global_step": 478317, "epoch": 5762} {"train_loss": -27.101964950561523, "global_step": 478318, "epoch": 5762} {"train_loss": -26.98386001586914, "global_step": 478319, "epoch": 5762} {"train_loss": -27.324377059936523, "global_step": 478320, "epoch": 5762} {"train_loss": -27.14310646057129, "global_step": 478321, "epoch": 5762} {"train_loss": -27.54066276550293, "global_step": 478322, "epoch": 5762} {"train_loss": -27.39841651916504, "global_step": 478323, "epoch": 5762} {"train_loss": -27.382598876953125, "global_step": 478324, "epoch": 5762} {"train_loss": -27.65057373046875, "global_step": 478325, "epoch": 5762} {"train_loss": -27.420820236206055, "global_step": 478326, "epoch": 5762} {"train_loss": -27.41387367248535, "global_step": 478327, "epoch": 5762} {"train_loss": -27.11391653497535, "global_step": 478328, "epoch": 5762, "val_loss": 6615822.0} {"train_loss": -26.422277450561523, "global_step": 478329, "epoch": 5763} {"train_loss": -25.282485961914062, "global_step": 478330, "epoch": 5763} {"train_loss": -25.623579025268555, "global_step": 478331, "epoch": 5763} {"train_loss": -26.921567916870117, "global_step": 478332, "epoch": 5763} {"train_loss": -26.439483642578125, "global_step": 478333, "epoch": 5763} {"train_loss": -26.40116310119629, "global_step": 478334, "epoch": 5763} {"train_loss": -27.11565589904785, "global_step": 478335, "epoch": 5763} {"train_loss": -26.438032150268555, "global_step": 478336, "epoch": 5763} {"train_loss": -26.626789093017578, "global_step": 478337, "epoch": 5763} {"train_loss": -26.257802963256836, "global_step": 478338, "epoch": 5763} {"train_loss": -26.644184112548828, "global_step": 478339, "epoch": 5763} {"train_loss": -26.340408325195312, "global_step": 478340, "epoch": 5763} {"train_loss": -26.97637367248535, "global_step": 478341, "epoch": 5763} {"train_loss": -26.539274215698242, "global_step": 478342, "epoch": 5763} {"train_loss": -27.126815795898438, "global_step": 478343, "epoch": 5763} {"train_loss": -26.88813591003418, "global_step": 478344, "epoch": 5763} {"train_loss": -26.56719970703125, "global_step": 478345, "epoch": 5763} {"train_loss": -26.62824821472168, "global_step": 478346, "epoch": 5763} {"train_loss": -26.362043380737305, "global_step": 478347, "epoch": 5763} {"train_loss": -26.74332046508789, "global_step": 478348, "epoch": 5763} {"train_loss": -26.83734130859375, "global_step": 478349, "epoch": 5763} {"train_loss": -26.219099044799805, "global_step": 478350, "epoch": 5763} {"train_loss": -26.887908935546875, "global_step": 478351, "epoch": 5763} {"train_loss": -27.145414352416992, "global_step": 478352, "epoch": 5763} {"train_loss": -26.905120849609375, "global_step": 478353, "epoch": 5763} {"train_loss": -27.0403995513916, "global_step": 478354, "epoch": 5763} {"train_loss": -27.09827995300293, "global_step": 478355, "epoch": 5763} {"train_loss": -27.313419342041016, "global_step": 478356, "epoch": 5763} {"train_loss": -27.31341552734375, "global_step": 478357, "epoch": 5763} {"train_loss": -27.456745147705078, "global_step": 478358, "epoch": 5763} {"train_loss": -27.228742599487305, "global_step": 478359, "epoch": 5763} {"train_loss": -27.375930786132812, "global_step": 478360, "epoch": 5763} {"train_loss": -27.386062622070312, "global_step": 478361, "epoch": 5763} {"train_loss": -27.18250846862793, "global_step": 478362, "epoch": 5763} {"train_loss": -27.418380737304688, "global_step": 478363, "epoch": 5763} {"train_loss": -27.2369327545166, "global_step": 478364, "epoch": 5763} {"train_loss": -26.873743057250977, "global_step": 478365, "epoch": 5763} {"train_loss": -27.434833526611328, "global_step": 478366, "epoch": 5763} {"train_loss": -27.30769920349121, "global_step": 478367, "epoch": 5763} {"train_loss": -27.2535343170166, "global_step": 478368, "epoch": 5763} {"train_loss": -27.19893455505371, "global_step": 478369, "epoch": 5763} {"train_loss": -27.097867965698242, "global_step": 478370, "epoch": 5763} {"train_loss": -27.2852783203125, "global_step": 478371, "epoch": 5763} {"train_loss": -27.090070724487305, "global_step": 478372, "epoch": 5763} {"train_loss": -27.044309616088867, "global_step": 478373, "epoch": 5763} {"train_loss": -27.767383575439453, "global_step": 478374, "epoch": 5763} {"train_loss": -27.412328720092773, "global_step": 478375, "epoch": 5763} {"train_loss": -27.369693756103516, "global_step": 478376, "epoch": 5763} {"train_loss": -27.41495704650879, "global_step": 478377, "epoch": 5763} {"train_loss": -27.607685089111328, "global_step": 478378, "epoch": 5763} {"train_loss": -27.354156494140625, "global_step": 478379, "epoch": 5763} {"train_loss": -27.23932456970215, "global_step": 478380, "epoch": 5763} {"train_loss": -27.350427627563477, "global_step": 478381, "epoch": 5763} {"train_loss": -27.255117416381836, "global_step": 478382, "epoch": 5763} {"train_loss": -27.241352081298828, "global_step": 478383, "epoch": 5763} {"train_loss": -27.3237247467041, "global_step": 478384, "epoch": 5763} {"train_loss": -27.33405113220215, "global_step": 478385, "epoch": 5763} {"train_loss": -27.171527862548828, "global_step": 478386, "epoch": 5763} {"train_loss": -27.106531143188477, "global_step": 478387, "epoch": 5763} {"train_loss": -27.122095108032227, "global_step": 478388, "epoch": 5763} {"train_loss": -27.43265724182129, "global_step": 478389, "epoch": 5763} {"train_loss": -27.40497398376465, "global_step": 478390, "epoch": 5763} {"train_loss": -27.335407257080078, "global_step": 478391, "epoch": 5763} {"train_loss": -27.263837814331055, "global_step": 478392, "epoch": 5763} {"train_loss": -27.73756217956543, "global_step": 478393, "epoch": 5763} {"train_loss": -26.883106231689453, "global_step": 478394, "epoch": 5763} {"train_loss": -27.359785079956055, "global_step": 478395, "epoch": 5763} {"train_loss": -27.405303955078125, "global_step": 478396, "epoch": 5763} {"train_loss": -27.103322982788086, "global_step": 478397, "epoch": 5763} {"train_loss": -27.635290145874023, "global_step": 478398, "epoch": 5763} {"train_loss": -27.488088607788086, "global_step": 478399, "epoch": 5763} {"train_loss": -27.662267684936523, "global_step": 478400, "epoch": 5763} {"train_loss": -27.463287353515625, "global_step": 478401, "epoch": 5763} {"train_loss": -27.826025009155273, "global_step": 478402, "epoch": 5763} {"train_loss": -27.752399444580078, "global_step": 478403, "epoch": 5763} {"train_loss": -27.66547203063965, "global_step": 478404, "epoch": 5763} {"train_loss": -27.25300407409668, "global_step": 478405, "epoch": 5763} {"train_loss": -27.29804039001465, "global_step": 478406, "epoch": 5763} {"train_loss": -27.406110763549805, "global_step": 478407, "epoch": 5763} {"train_loss": -27.606901168823242, "global_step": 478408, "epoch": 5763} {"train_loss": -27.447866439819336, "global_step": 478409, "epoch": 5763} {"train_loss": -27.863386154174805, "global_step": 478410, "epoch": 5763} {"train_loss": -27.09209591509348, "global_step": 478411, "epoch": 5763, "val_loss": 6670182.0} {"train_loss": -26.854400634765625, "global_step": 478412, "epoch": 5764} {"train_loss": -27.210575103759766, "global_step": 478413, "epoch": 5764} {"train_loss": -27.3122501373291, "global_step": 478414, "epoch": 5764} {"train_loss": -27.005599975585938, "global_step": 478415, "epoch": 5764} {"train_loss": -26.50040626525879, "global_step": 478416, "epoch": 5764} {"train_loss": -27.1488094329834, "global_step": 478417, "epoch": 5764} {"train_loss": -27.047433853149414, "global_step": 478418, "epoch": 5764} {"train_loss": -27.536733627319336, "global_step": 478419, "epoch": 5764} {"train_loss": -26.679412841796875, "global_step": 478420, "epoch": 5764} {"train_loss": -26.773778915405273, "global_step": 478421, "epoch": 5764} {"train_loss": -26.88026237487793, "global_step": 478422, "epoch": 5764} {"train_loss": -26.734277725219727, "global_step": 478423, "epoch": 5764} {"train_loss": -27.3421573638916, "global_step": 478424, "epoch": 5764} {"train_loss": -27.114904403686523, "global_step": 478425, "epoch": 5764} {"train_loss": -26.763952255249023, "global_step": 478426, "epoch": 5764} {"train_loss": -27.126510620117188, "global_step": 478427, "epoch": 5764} {"train_loss": -27.2730770111084, "global_step": 478428, "epoch": 5764} {"train_loss": -26.799585342407227, "global_step": 478429, "epoch": 5764} {"train_loss": -26.07207679748535, "global_step": 478430, "epoch": 5764} {"train_loss": -27.146625518798828, "global_step": 478431, "epoch": 5764} {"train_loss": -27.112075805664062, "global_step": 478432, "epoch": 5764} {"train_loss": -26.988025665283203, "global_step": 478433, "epoch": 5764} {"train_loss": -27.055801391601562, "global_step": 478434, "epoch": 5764} {"train_loss": -26.812204360961914, "global_step": 478435, "epoch": 5764} {"train_loss": -27.369626998901367, "global_step": 478436, "epoch": 5764} {"train_loss": -27.064512252807617, "global_step": 478437, "epoch": 5764} {"train_loss": -27.558237075805664, "global_step": 478438, "epoch": 5764} {"train_loss": -27.130285263061523, "global_step": 478439, "epoch": 5764} {"train_loss": -26.714298248291016, "global_step": 478440, "epoch": 5764} {"train_loss": -27.110021591186523, "global_step": 478441, "epoch": 5764} {"train_loss": -27.306884765625, "global_step": 478442, "epoch": 5764} {"train_loss": -26.914138793945312, "global_step": 478443, "epoch": 5764} {"train_loss": -27.077314376831055, "global_step": 478444, "epoch": 5764} {"train_loss": -26.67681884765625, "global_step": 478445, "epoch": 5764} {"train_loss": -27.215173721313477, "global_step": 478446, "epoch": 5764} {"train_loss": -27.5047664642334, "global_step": 478447, "epoch": 5764} {"train_loss": -26.993921279907227, "global_step": 478448, "epoch": 5764} {"train_loss": -27.076826095581055, "global_step": 478449, "epoch": 5764} {"train_loss": -27.14653968811035, "global_step": 478450, "epoch": 5764} {"train_loss": -26.95709800720215, "global_step": 478451, "epoch": 5764} {"train_loss": -27.094953536987305, "global_step": 478452, "epoch": 5764} {"train_loss": -27.142044067382812, "global_step": 478453, "epoch": 5764} {"train_loss": -27.140661239624023, "global_step": 478454, "epoch": 5764} {"train_loss": -27.101612091064453, "global_step": 478455, "epoch": 5764} {"train_loss": -27.349145889282227, "global_step": 478456, "epoch": 5764} {"train_loss": -27.34574317932129, "global_step": 478457, "epoch": 5764} {"train_loss": -27.30048179626465, "global_step": 478458, "epoch": 5764} {"train_loss": -27.118377685546875, "global_step": 478459, "epoch": 5764} {"train_loss": -27.638376235961914, "global_step": 478460, "epoch": 5764} {"train_loss": -27.289798736572266, "global_step": 478461, "epoch": 5764} {"train_loss": -27.15093994140625, "global_step": 478462, "epoch": 5764} {"train_loss": -27.434356689453125, "global_step": 478463, "epoch": 5764} {"train_loss": -27.697561264038086, "global_step": 478464, "epoch": 5764} {"train_loss": -27.3272762298584, "global_step": 478465, "epoch": 5764} {"train_loss": -27.331897735595703, "global_step": 478466, "epoch": 5764} {"train_loss": -27.020593643188477, "global_step": 478467, "epoch": 5764} {"train_loss": -27.427642822265625, "global_step": 478468, "epoch": 5764} {"train_loss": -27.314380645751953, "global_step": 478469, "epoch": 5764} {"train_loss": -27.2720947265625, "global_step": 478470, "epoch": 5764} {"train_loss": -27.162092208862305, "global_step": 478471, "epoch": 5764} {"train_loss": -27.444854736328125, "global_step": 478472, "epoch": 5764} {"train_loss": -27.3792781829834, "global_step": 478473, "epoch": 5764} {"train_loss": -27.470930099487305, "global_step": 478474, "epoch": 5764} {"train_loss": -27.13409996032715, "global_step": 478475, "epoch": 5764} {"train_loss": -27.383325576782227, "global_step": 478476, "epoch": 5764} {"train_loss": -27.19355583190918, "global_step": 478477, "epoch": 5764} {"train_loss": -27.54248046875, "global_step": 478478, "epoch": 5764} {"train_loss": -27.467639923095703, "global_step": 478479, "epoch": 5764} {"train_loss": -27.413232803344727, "global_step": 478480, "epoch": 5764} {"train_loss": -27.79804039001465, "global_step": 478481, "epoch": 5764} {"train_loss": -27.20037269592285, "global_step": 478482, "epoch": 5764} {"train_loss": -27.377395629882812, "global_step": 478483, "epoch": 5764} {"train_loss": -27.66413688659668, "global_step": 478484, "epoch": 5764} {"train_loss": -27.380353927612305, "global_step": 478485, "epoch": 5764} {"train_loss": -27.15447998046875, "global_step": 478486, "epoch": 5764} {"train_loss": -27.095617294311523, "global_step": 478487, "epoch": 5764} {"train_loss": -27.7030086517334, "global_step": 478488, "epoch": 5764} {"train_loss": -26.980941772460938, "global_step": 478489, "epoch": 5764} {"train_loss": -26.215869903564453, "global_step": 478490, "epoch": 5764} {"train_loss": -25.902830123901367, "global_step": 478491, "epoch": 5764} {"train_loss": -26.570749282836914, "global_step": 478492, "epoch": 5764} {"train_loss": -26.487442016601562, "global_step": 478493, "epoch": 5764} {"train_loss": -27.133141850850667, "global_step": 478494, "epoch": 5764, "val_loss": 6591685.0} {"train_loss": -26.4239501953125, "global_step": 478495, "epoch": 5765} {"train_loss": -25.69671058654785, "global_step": 478496, "epoch": 5765} {"train_loss": -26.639328002929688, "global_step": 478497, "epoch": 5765} {"train_loss": -26.556432723999023, "global_step": 478498, "epoch": 5765} {"train_loss": -26.157270431518555, "global_step": 478499, "epoch": 5765} {"train_loss": -26.74964714050293, "global_step": 478500, "epoch": 5765} {"train_loss": -26.300220489501953, "global_step": 478501, "epoch": 5765} {"train_loss": -26.805225372314453, "global_step": 478502, "epoch": 5765} {"train_loss": -26.709033966064453, "global_step": 478503, "epoch": 5765} {"train_loss": -26.936176300048828, "global_step": 478504, "epoch": 5765} {"train_loss": -26.4393367767334, "global_step": 478505, "epoch": 5765} {"train_loss": -26.743453979492188, "global_step": 478506, "epoch": 5765} {"train_loss": -26.662296295166016, "global_step": 478507, "epoch": 5765} {"train_loss": -26.667715072631836, "global_step": 478508, "epoch": 5765} {"train_loss": -26.547653198242188, "global_step": 478509, "epoch": 5765} {"train_loss": -26.95891761779785, "global_step": 478510, "epoch": 5765} {"train_loss": -26.654117584228516, "global_step": 478511, "epoch": 5765} {"train_loss": -26.7956600189209, "global_step": 478512, "epoch": 5765} {"train_loss": -27.204938888549805, "global_step": 478513, "epoch": 5765} {"train_loss": -26.91635513305664, "global_step": 478514, "epoch": 5765} {"train_loss": -27.253376007080078, "global_step": 478515, "epoch": 5765} {"train_loss": -26.55373191833496, "global_step": 478516, "epoch": 5765} {"train_loss": -27.263568878173828, "global_step": 478517, "epoch": 5765} {"train_loss": -27.043277740478516, "global_step": 478518, "epoch": 5765} {"train_loss": -27.000354766845703, "global_step": 478519, "epoch": 5765} {"train_loss": -26.779226303100586, "global_step": 478520, "epoch": 5765} {"train_loss": -27.251636505126953, "global_step": 478521, "epoch": 5765} {"train_loss": -27.087987899780273, "global_step": 478522, "epoch": 5765} {"train_loss": -27.1428279876709, "global_step": 478523, "epoch": 5765} {"train_loss": -27.24172019958496, "global_step": 478524, "epoch": 5765} {"train_loss": -26.947406768798828, "global_step": 478525, "epoch": 5765} {"train_loss": -27.17643165588379, "global_step": 478526, "epoch": 5765} {"train_loss": -27.532712936401367, "global_step": 478527, "epoch": 5765} {"train_loss": -27.211517333984375, "global_step": 478528, "epoch": 5765} {"train_loss": -27.059192657470703, "global_step": 478529, "epoch": 5765} {"train_loss": -27.251758575439453, "global_step": 478530, "epoch": 5765} {"train_loss": -27.3658447265625, "global_step": 478531, "epoch": 5765} {"train_loss": -27.4368896484375, "global_step": 478532, "epoch": 5765} {"train_loss": -27.214567184448242, "global_step": 478533, "epoch": 5765} {"train_loss": -27.040830612182617, "global_step": 478534, "epoch": 5765} {"train_loss": -27.312463760375977, "global_step": 478535, "epoch": 5765} {"train_loss": -27.18818473815918, "global_step": 478536, "epoch": 5765} {"train_loss": -27.021930694580078, "global_step": 478537, "epoch": 5765} {"train_loss": -27.28376579284668, "global_step": 478538, "epoch": 5765} {"train_loss": -27.293603897094727, "global_step": 478539, "epoch": 5765} {"train_loss": -27.417776107788086, "global_step": 478540, "epoch": 5765} {"train_loss": -27.213560104370117, "global_step": 478541, "epoch": 5765} {"train_loss": -27.220975875854492, "global_step": 478542, "epoch": 5765} {"train_loss": -27.4848575592041, "global_step": 478543, "epoch": 5765} {"train_loss": -27.301959991455078, "global_step": 478544, "epoch": 5765} {"train_loss": -27.44902992248535, "global_step": 478545, "epoch": 5765} {"train_loss": -27.464109420776367, "global_step": 478546, "epoch": 5765} {"train_loss": -27.513158798217773, "global_step": 478547, "epoch": 5765} {"train_loss": -27.533069610595703, "global_step": 478548, "epoch": 5765} {"train_loss": -27.252185821533203, "global_step": 478549, "epoch": 5765} {"train_loss": -27.4396915435791, "global_step": 478550, "epoch": 5765} {"train_loss": -27.39377784729004, "global_step": 478551, "epoch": 5765} {"train_loss": -27.662809371948242, "global_step": 478552, "epoch": 5765} {"train_loss": -27.204864501953125, "global_step": 478553, "epoch": 5765} {"train_loss": -27.135679244995117, "global_step": 478554, "epoch": 5765} {"train_loss": -27.060504913330078, "global_step": 478555, "epoch": 5765} {"train_loss": -27.287805557250977, "global_step": 478556, "epoch": 5765} {"train_loss": -27.307565689086914, "global_step": 478557, "epoch": 5765} {"train_loss": -27.152297973632812, "global_step": 478558, "epoch": 5765} {"train_loss": -27.314664840698242, "global_step": 478559, "epoch": 5765} {"train_loss": -27.232152938842773, "global_step": 478560, "epoch": 5765} {"train_loss": -27.27237892150879, "global_step": 478561, "epoch": 5765} {"train_loss": -27.216333389282227, "global_step": 478562, "epoch": 5765} {"train_loss": -27.243810653686523, "global_step": 478563, "epoch": 5765} {"train_loss": -27.027563095092773, "global_step": 478564, "epoch": 5765} {"train_loss": -27.16205406188965, "global_step": 478565, "epoch": 5765} {"train_loss": -27.491910934448242, "global_step": 478566, "epoch": 5765} {"train_loss": -27.448352813720703, "global_step": 478567, "epoch": 5765} {"train_loss": -27.17371940612793, "global_step": 478568, "epoch": 5765} {"train_loss": -27.55051040649414, "global_step": 478569, "epoch": 5765} {"train_loss": -27.292011260986328, "global_step": 478570, "epoch": 5765} {"train_loss": -27.27484130859375, "global_step": 478571, "epoch": 5765} {"train_loss": -27.37890625, "global_step": 478572, "epoch": 5765} {"train_loss": -27.006616592407227, "global_step": 478573, "epoch": 5765} {"train_loss": -27.155797958374023, "global_step": 478574, "epoch": 5765} {"train_loss": -27.214313507080078, "global_step": 478575, "epoch": 5765} {"train_loss": -27.26333999633789, "global_step": 478576, "epoch": 5765} {"train_loss": -27.093129514211633, "global_step": 478577, "epoch": 5765, "val_loss": 6529537.0} {"train_loss": -25.441144943237305, "global_step": 478578, "epoch": 5766} {"train_loss": -24.708112716674805, "global_step": 478579, "epoch": 5766} {"train_loss": -26.8008975982666, "global_step": 478580, "epoch": 5766} {"train_loss": -26.70881462097168, "global_step": 478581, "epoch": 5766} {"train_loss": -25.727354049682617, "global_step": 478582, "epoch": 5766} {"train_loss": -26.227161407470703, "global_step": 478583, "epoch": 5766} {"train_loss": -26.771039962768555, "global_step": 478584, "epoch": 5766} {"train_loss": -26.336124420166016, "global_step": 478585, "epoch": 5766} {"train_loss": -26.122364044189453, "global_step": 478586, "epoch": 5766} {"train_loss": -26.286462783813477, "global_step": 478587, "epoch": 5766} {"train_loss": -26.764490127563477, "global_step": 478588, "epoch": 5766} {"train_loss": -25.880701065063477, "global_step": 478589, "epoch": 5766} {"train_loss": -26.87127685546875, "global_step": 478590, "epoch": 5766} {"train_loss": -26.220932006835938, "global_step": 478591, "epoch": 5766} {"train_loss": -26.808507919311523, "global_step": 478592, "epoch": 5766} {"train_loss": -26.734745025634766, "global_step": 478593, "epoch": 5766} {"train_loss": -26.639984130859375, "global_step": 478594, "epoch": 5766} {"train_loss": -26.971576690673828, "global_step": 478595, "epoch": 5766} {"train_loss": -26.96253776550293, "global_step": 478596, "epoch": 5766} {"train_loss": -26.718063354492188, "global_step": 478597, "epoch": 5766} {"train_loss": -26.633026123046875, "global_step": 478598, "epoch": 5766} {"train_loss": -26.987512588500977, "global_step": 478599, "epoch": 5766} {"train_loss": -26.716739654541016, "global_step": 478600, "epoch": 5766} {"train_loss": -26.712345123291016, "global_step": 478601, "epoch": 5766} {"train_loss": -27.221912384033203, "global_step": 478602, "epoch": 5766} {"train_loss": -26.832111358642578, "global_step": 478603, "epoch": 5766} {"train_loss": -26.82366371154785, "global_step": 478604, "epoch": 5766} {"train_loss": -27.144750595092773, "global_step": 478605, "epoch": 5766} {"train_loss": -27.213409423828125, "global_step": 478606, "epoch": 5766} {"train_loss": -26.95127296447754, "global_step": 478607, "epoch": 5766} {"train_loss": -27.086950302124023, "global_step": 478608, "epoch": 5766} {"train_loss": -26.83704948425293, "global_step": 478609, "epoch": 5766} {"train_loss": -27.007028579711914, "global_step": 478610, "epoch": 5766} {"train_loss": -27.321918487548828, "global_step": 478611, "epoch": 5766} {"train_loss": -26.9481258392334, "global_step": 478612, "epoch": 5766} {"train_loss": -27.533023834228516, "global_step": 478613, "epoch": 5766} {"train_loss": -27.262451171875, "global_step": 478614, "epoch": 5766} {"train_loss": -27.239587783813477, "global_step": 478615, "epoch": 5766} {"train_loss": -26.97749137878418, "global_step": 478616, "epoch": 5766} {"train_loss": -27.425201416015625, "global_step": 478617, "epoch": 5766} {"train_loss": -27.1704044342041, "global_step": 478618, "epoch": 5766} {"train_loss": -26.881994247436523, "global_step": 478619, "epoch": 5766} {"train_loss": -27.45072364807129, "global_step": 478620, "epoch": 5766} {"train_loss": -27.526229858398438, "global_step": 478621, "epoch": 5766} {"train_loss": -27.500778198242188, "global_step": 478622, "epoch": 5766} {"train_loss": -26.950719833374023, "global_step": 478623, "epoch": 5766} {"train_loss": -27.264806747436523, "global_step": 478624, "epoch": 5766} {"train_loss": -27.18073844909668, "global_step": 478625, "epoch": 5766} {"train_loss": -27.638696670532227, "global_step": 478626, "epoch": 5766} {"train_loss": -27.24640464782715, "global_step": 478627, "epoch": 5766} {"train_loss": -27.181970596313477, "global_step": 478628, "epoch": 5766} {"train_loss": -27.122955322265625, "global_step": 478629, "epoch": 5766} {"train_loss": -27.377836227416992, "global_step": 478630, "epoch": 5766} {"train_loss": -27.33570671081543, "global_step": 478631, "epoch": 5766} {"train_loss": -27.594253540039062, "global_step": 478632, "epoch": 5766} {"train_loss": -27.27052116394043, "global_step": 478633, "epoch": 5766} {"train_loss": -27.174962997436523, "global_step": 478634, "epoch": 5766} {"train_loss": -27.62066078186035, "global_step": 478635, "epoch": 5766} {"train_loss": -26.939899444580078, "global_step": 478636, "epoch": 5766} {"train_loss": -27.37745475769043, "global_step": 478637, "epoch": 5766} {"train_loss": -26.98322105407715, "global_step": 478638, "epoch": 5766} {"train_loss": -26.8073673248291, "global_step": 478639, "epoch": 5766} {"train_loss": -26.886932373046875, "global_step": 478640, "epoch": 5766} {"train_loss": -26.468835830688477, "global_step": 478641, "epoch": 5766} {"train_loss": -27.038959503173828, "global_step": 478642, "epoch": 5766} {"train_loss": -27.4697208404541, "global_step": 478643, "epoch": 5766} {"train_loss": -26.999765396118164, "global_step": 478644, "epoch": 5766} {"train_loss": -26.911916732788086, "global_step": 478645, "epoch": 5766} {"train_loss": -27.461017608642578, "global_step": 478646, "epoch": 5766} {"train_loss": -27.256500244140625, "global_step": 478647, "epoch": 5766} {"train_loss": -27.336828231811523, "global_step": 478648, "epoch": 5766} {"train_loss": -27.75091552734375, "global_step": 478649, "epoch": 5766} {"train_loss": -27.037921905517578, "global_step": 478650, "epoch": 5766} {"train_loss": -27.399789810180664, "global_step": 478651, "epoch": 5766} {"train_loss": -27.0076847076416, "global_step": 478652, "epoch": 5766} {"train_loss": -27.433740615844727, "global_step": 478653, "epoch": 5766} {"train_loss": -27.451374053955078, "global_step": 478654, "epoch": 5766} {"train_loss": -26.986297607421875, "global_step": 478655, "epoch": 5766} {"train_loss": -27.314435958862305, "global_step": 478656, "epoch": 5766} {"train_loss": -27.45623779296875, "global_step": 478657, "epoch": 5766} {"train_loss": -27.077146530151367, "global_step": 478658, "epoch": 5766} {"train_loss": -27.501388549804688, "global_step": 478659, "epoch": 5766} {"train_loss": -26.98051298670022, "global_step": 478660, "epoch": 5766, "val_loss": 6520835.0} {"train_loss": -26.782928466796875, "global_step": 478661, "epoch": 5767} {"train_loss": -25.756717681884766, "global_step": 478662, "epoch": 5767} {"train_loss": -24.368555068969727, "global_step": 478663, "epoch": 5767} {"train_loss": -23.229604721069336, "global_step": 478664, "epoch": 5767} {"train_loss": -24.585498809814453, "global_step": 478665, "epoch": 5767} {"train_loss": -26.609479904174805, "global_step": 478666, "epoch": 5767} {"train_loss": -25.062454223632812, "global_step": 478667, "epoch": 5767} {"train_loss": -26.2141170501709, "global_step": 478668, "epoch": 5767} {"train_loss": -26.100955963134766, "global_step": 478669, "epoch": 5767} {"train_loss": -25.88868522644043, "global_step": 478670, "epoch": 5767} {"train_loss": -26.418628692626953, "global_step": 478671, "epoch": 5767} {"train_loss": -26.563169479370117, "global_step": 478672, "epoch": 5767} {"train_loss": -26.30170249938965, "global_step": 478673, "epoch": 5767} {"train_loss": -26.6401309967041, "global_step": 478674, "epoch": 5767} {"train_loss": -26.28669548034668, "global_step": 478675, "epoch": 5767} {"train_loss": -26.569080352783203, "global_step": 478676, "epoch": 5767} {"train_loss": -26.68159294128418, "global_step": 478677, "epoch": 5767} {"train_loss": -26.646787643432617, "global_step": 478678, "epoch": 5767} {"train_loss": -26.688220977783203, "global_step": 478679, "epoch": 5767} {"train_loss": -26.708017349243164, "global_step": 478680, "epoch": 5767} {"train_loss": -26.152494430541992, "global_step": 478681, "epoch": 5767} {"train_loss": -26.682697296142578, "global_step": 478682, "epoch": 5767} {"train_loss": -26.962873458862305, "global_step": 478683, "epoch": 5767} {"train_loss": -26.515167236328125, "global_step": 478684, "epoch": 5767} {"train_loss": -26.961273193359375, "global_step": 478685, "epoch": 5767} {"train_loss": -26.637725830078125, "global_step": 478686, "epoch": 5767} {"train_loss": -26.662397384643555, "global_step": 478687, "epoch": 5767} {"train_loss": -26.945892333984375, "global_step": 478688, "epoch": 5767} {"train_loss": -26.4837589263916, "global_step": 478689, "epoch": 5767} {"train_loss": -27.108352661132812, "global_step": 478690, "epoch": 5767} {"train_loss": -26.767724990844727, "global_step": 478691, "epoch": 5767} {"train_loss": -26.793832778930664, "global_step": 478692, "epoch": 5767} {"train_loss": -27.2121524810791, "global_step": 478693, "epoch": 5767} {"train_loss": -27.28948974609375, "global_step": 478694, "epoch": 5767} {"train_loss": -27.21604347229004, "global_step": 478695, "epoch": 5767} {"train_loss": -27.140287399291992, "global_step": 478696, "epoch": 5767} {"train_loss": -26.986114501953125, "global_step": 478697, "epoch": 5767} {"train_loss": -26.91839599609375, "global_step": 478698, "epoch": 5767} {"train_loss": -26.983198165893555, "global_step": 478699, "epoch": 5767} {"train_loss": -27.295032501220703, "global_step": 478700, "epoch": 5767} {"train_loss": -26.928537368774414, "global_step": 478701, "epoch": 5767} {"train_loss": -27.318403244018555, "global_step": 478702, "epoch": 5767} {"train_loss": -27.213775634765625, "global_step": 478703, "epoch": 5767} {"train_loss": -27.31818962097168, "global_step": 478704, "epoch": 5767} {"train_loss": -27.1842041015625, "global_step": 478705, "epoch": 5767} {"train_loss": -26.92573356628418, "global_step": 478706, "epoch": 5767} {"train_loss": -27.0738582611084, "global_step": 478707, "epoch": 5767} {"train_loss": -26.876754760742188, "global_step": 478708, "epoch": 5767} {"train_loss": -27.758625030517578, "global_step": 478709, "epoch": 5767} {"train_loss": -27.410430908203125, "global_step": 478710, "epoch": 5767} {"train_loss": -27.57142448425293, "global_step": 478711, "epoch": 5767} {"train_loss": -27.448144912719727, "global_step": 478712, "epoch": 5767} {"train_loss": -27.307703018188477, "global_step": 478713, "epoch": 5767} {"train_loss": -27.467737197875977, "global_step": 478714, "epoch": 5767} {"train_loss": -27.48566246032715, "global_step": 478715, "epoch": 5767} {"train_loss": -27.371997833251953, "global_step": 478716, "epoch": 5767} {"train_loss": -27.338336944580078, "global_step": 478717, "epoch": 5767} {"train_loss": -27.4940128326416, "global_step": 478718, "epoch": 5767} {"train_loss": -27.175458908081055, "global_step": 478719, "epoch": 5767} {"train_loss": -27.4843807220459, "global_step": 478720, "epoch": 5767} {"train_loss": -27.13356590270996, "global_step": 478721, "epoch": 5767} {"train_loss": -27.451818466186523, "global_step": 478722, "epoch": 5767} {"train_loss": -27.10267448425293, "global_step": 478723, "epoch": 5767} {"train_loss": -27.200414657592773, "global_step": 478724, "epoch": 5767} {"train_loss": -27.010847091674805, "global_step": 478725, "epoch": 5767} {"train_loss": -27.265140533447266, "global_step": 478726, "epoch": 5767} {"train_loss": -27.273681640625, "global_step": 478727, "epoch": 5767} {"train_loss": -27.469839096069336, "global_step": 478728, "epoch": 5767} {"train_loss": -27.070392608642578, "global_step": 478729, "epoch": 5767} {"train_loss": -27.532506942749023, "global_step": 478730, "epoch": 5767} {"train_loss": -27.32538414001465, "global_step": 478731, "epoch": 5767} {"train_loss": -27.442276000976562, "global_step": 478732, "epoch": 5767} {"train_loss": -27.55911636352539, "global_step": 478733, "epoch": 5767} {"train_loss": -27.435150146484375, "global_step": 478734, "epoch": 5767} {"train_loss": -26.984033584594727, "global_step": 478735, "epoch": 5767} {"train_loss": -27.197006225585938, "global_step": 478736, "epoch": 5767} {"train_loss": -27.248693466186523, "global_step": 478737, "epoch": 5767} {"train_loss": -27.696247100830078, "global_step": 478738, "epoch": 5767} {"train_loss": -26.971393585205078, "global_step": 478739, "epoch": 5767} {"train_loss": -27.4633846282959, "global_step": 478740, "epoch": 5767} {"train_loss": -27.320539474487305, "global_step": 478741, "epoch": 5767} {"train_loss": -27.49976921081543, "global_step": 478742, "epoch": 5767} {"train_loss": -26.883957483682288, "global_step": 478743, "epoch": 5767, "val_loss": 6610360.0} {"train_loss": -27.176496505737305, "global_step": 478744, "epoch": 5768} {"train_loss": -27.206592559814453, "global_step": 478745, "epoch": 5768} {"train_loss": -27.229291915893555, "global_step": 478746, "epoch": 5768} {"train_loss": -27.596832275390625, "global_step": 478747, "epoch": 5768} {"train_loss": -27.28069496154785, "global_step": 478748, "epoch": 5768} {"train_loss": -27.346633911132812, "global_step": 478749, "epoch": 5768} {"train_loss": -27.762487411499023, "global_step": 478750, "epoch": 5768} {"train_loss": -27.19013786315918, "global_step": 478751, "epoch": 5768} {"train_loss": -26.883020401000977, "global_step": 478752, "epoch": 5768} {"train_loss": -27.039337158203125, "global_step": 478753, "epoch": 5768} {"train_loss": -27.488468170166016, "global_step": 478754, "epoch": 5768} {"train_loss": -27.24171257019043, "global_step": 478755, "epoch": 5768} {"train_loss": -26.995946884155273, "global_step": 478756, "epoch": 5768} {"train_loss": -27.013019561767578, "global_step": 478757, "epoch": 5768} {"train_loss": -26.825946807861328, "global_step": 478758, "epoch": 5768} {"train_loss": -27.2186279296875, "global_step": 478759, "epoch": 5768} {"train_loss": -27.585601806640625, "global_step": 478760, "epoch": 5768} {"train_loss": -26.86774253845215, "global_step": 478761, "epoch": 5768} {"train_loss": -26.96430778503418, "global_step": 478762, "epoch": 5768} {"train_loss": -27.635929107666016, "global_step": 478763, "epoch": 5768} {"train_loss": -27.038175582885742, "global_step": 478764, "epoch": 5768} {"train_loss": -27.58349609375, "global_step": 478765, "epoch": 5768} {"train_loss": -27.308679580688477, "global_step": 478766, "epoch": 5768} {"train_loss": -27.056812286376953, "global_step": 478767, "epoch": 5768} {"train_loss": -27.4603271484375, "global_step": 478768, "epoch": 5768} {"train_loss": -27.60601806640625, "global_step": 478769, "epoch": 5768} {"train_loss": -27.441925048828125, "global_step": 478770, "epoch": 5768} {"train_loss": -26.921659469604492, "global_step": 478771, "epoch": 5768} {"train_loss": -27.433088302612305, "global_step": 478772, "epoch": 5768} {"train_loss": -27.2824649810791, "global_step": 478773, "epoch": 5768} {"train_loss": -27.21503257751465, "global_step": 478774, "epoch": 5768} {"train_loss": -27.565221786499023, "global_step": 478775, "epoch": 5768} {"train_loss": -27.39127540588379, "global_step": 478776, "epoch": 5768} {"train_loss": -27.268253326416016, "global_step": 478777, "epoch": 5768} {"train_loss": -27.350149154663086, "global_step": 478778, "epoch": 5768} {"train_loss": -27.147693634033203, "global_step": 478779, "epoch": 5768} {"train_loss": -27.63932228088379, "global_step": 478780, "epoch": 5768} {"train_loss": -27.49370765686035, "global_step": 478781, "epoch": 5768} {"train_loss": -27.46600341796875, "global_step": 478782, "epoch": 5768} {"train_loss": -27.285247802734375, "global_step": 478783, "epoch": 5768} {"train_loss": -27.29339599609375, "global_step": 478784, "epoch": 5768} {"train_loss": -27.392507553100586, "global_step": 478785, "epoch": 5768} {"train_loss": -27.47245216369629, "global_step": 478786, "epoch": 5768} {"train_loss": -27.26372718811035, "global_step": 478787, "epoch": 5768} {"train_loss": -27.39472007751465, "global_step": 478788, "epoch": 5768} {"train_loss": -26.837202072143555, "global_step": 478789, "epoch": 5768} {"train_loss": -26.946741104125977, "global_step": 478790, "epoch": 5768} {"train_loss": -27.44723892211914, "global_step": 478791, "epoch": 5768} {"train_loss": -27.155242919921875, "global_step": 478792, "epoch": 5768} {"train_loss": -26.659467697143555, "global_step": 478793, "epoch": 5768} {"train_loss": -26.996267318725586, "global_step": 478794, "epoch": 5768} {"train_loss": -26.46311378479004, "global_step": 478795, "epoch": 5768} {"train_loss": -26.97482681274414, "global_step": 478796, "epoch": 5768} {"train_loss": -26.9720458984375, "global_step": 478797, "epoch": 5768} {"train_loss": -26.668420791625977, "global_step": 478798, "epoch": 5768} {"train_loss": -26.92951774597168, "global_step": 478799, "epoch": 5768} {"train_loss": -26.93499183654785, "global_step": 478800, "epoch": 5768} {"train_loss": -26.70477867126465, "global_step": 478801, "epoch": 5768} {"train_loss": -27.43385887145996, "global_step": 478802, "epoch": 5768} {"train_loss": -26.5754451751709, "global_step": 478803, "epoch": 5768} {"train_loss": -26.742456436157227, "global_step": 478804, "epoch": 5768} {"train_loss": -27.27423095703125, "global_step": 478805, "epoch": 5768} {"train_loss": -26.75282096862793, "global_step": 478806, "epoch": 5768} {"train_loss": -27.32588768005371, "global_step": 478807, "epoch": 5768} {"train_loss": -26.988208770751953, "global_step": 478808, "epoch": 5768} {"train_loss": -27.040205001831055, "global_step": 478809, "epoch": 5768} {"train_loss": -27.066492080688477, "global_step": 478810, "epoch": 5768} {"train_loss": -27.240020751953125, "global_step": 478811, "epoch": 5768} {"train_loss": -27.122787475585938, "global_step": 478812, "epoch": 5768} {"train_loss": -27.304235458374023, "global_step": 478813, "epoch": 5768} {"train_loss": -27.3908634185791, "global_step": 478814, "epoch": 5768} {"train_loss": -27.216064453125, "global_step": 478815, "epoch": 5768} {"train_loss": -27.29783058166504, "global_step": 478816, "epoch": 5768} {"train_loss": -27.39784812927246, "global_step": 478817, "epoch": 5768} {"train_loss": -27.3232479095459, "global_step": 478818, "epoch": 5768} {"train_loss": -27.315860748291016, "global_step": 478819, "epoch": 5768} {"train_loss": -27.1690673828125, "global_step": 478820, "epoch": 5768} {"train_loss": -27.412765502929688, "global_step": 478821, "epoch": 5768} {"train_loss": -27.262998580932617, "global_step": 478822, "epoch": 5768} {"train_loss": -27.521625518798828, "global_step": 478823, "epoch": 5768} {"train_loss": -27.327672958374023, "global_step": 478824, "epoch": 5768} {"train_loss": -27.349334716796875, "global_step": 478825, "epoch": 5768} {"train_loss": -27.209235639457244, "global_step": 478826, "epoch": 5768, "val_loss": 6573316.0} {"train_loss": -26.47610855102539, "global_step": 478827, "epoch": 5769} {"train_loss": -26.04414176940918, "global_step": 478828, "epoch": 5769} {"train_loss": -27.022974014282227, "global_step": 478829, "epoch": 5769} {"train_loss": -26.61142921447754, "global_step": 478830, "epoch": 5769} {"train_loss": -26.591949462890625, "global_step": 478831, "epoch": 5769} {"train_loss": -26.593067169189453, "global_step": 478832, "epoch": 5769} {"train_loss": -26.6126651763916, "global_step": 478833, "epoch": 5769} {"train_loss": -26.90105628967285, "global_step": 478834, "epoch": 5769} {"train_loss": -26.95633316040039, "global_step": 478835, "epoch": 5769} {"train_loss": -27.34541893005371, "global_step": 478836, "epoch": 5769} {"train_loss": -26.8311824798584, "global_step": 478837, "epoch": 5769} {"train_loss": -26.9552001953125, "global_step": 478838, "epoch": 5769} {"train_loss": -27.161407470703125, "global_step": 478839, "epoch": 5769} {"train_loss": -26.9208984375, "global_step": 478840, "epoch": 5769} {"train_loss": -26.844669342041016, "global_step": 478841, "epoch": 5769} {"train_loss": -27.02484703063965, "global_step": 478842, "epoch": 5769} {"train_loss": -26.807260513305664, "global_step": 478843, "epoch": 5769} {"train_loss": -26.976606369018555, "global_step": 478844, "epoch": 5769} {"train_loss": -26.972806930541992, "global_step": 478845, "epoch": 5769} {"train_loss": -26.919692993164062, "global_step": 478846, "epoch": 5769} {"train_loss": -27.108322143554688, "global_step": 478847, "epoch": 5769} {"train_loss": -26.905065536499023, "global_step": 478848, "epoch": 5769} {"train_loss": -26.970937728881836, "global_step": 478849, "epoch": 5769} {"train_loss": -27.40117835998535, "global_step": 478850, "epoch": 5769} {"train_loss": -26.81422233581543, "global_step": 478851, "epoch": 5769} {"train_loss": -27.279401779174805, "global_step": 478852, "epoch": 5769} {"train_loss": -27.03679847717285, "global_step": 478853, "epoch": 5769} {"train_loss": -26.7281494140625, "global_step": 478854, "epoch": 5769} {"train_loss": -27.083450317382812, "global_step": 478855, "epoch": 5769} {"train_loss": -27.204593658447266, "global_step": 478856, "epoch": 5769} {"train_loss": -27.26948356628418, "global_step": 478857, "epoch": 5769} {"train_loss": -27.122838973999023, "global_step": 478858, "epoch": 5769} {"train_loss": -27.207366943359375, "global_step": 478859, "epoch": 5769} {"train_loss": -27.135915756225586, "global_step": 478860, "epoch": 5769} {"train_loss": -27.36713981628418, "global_step": 478861, "epoch": 5769} {"train_loss": -27.402587890625, "global_step": 478862, "epoch": 5769} {"train_loss": -27.18779945373535, "global_step": 478863, "epoch": 5769} {"train_loss": -27.44923210144043, "global_step": 478864, "epoch": 5769} {"train_loss": -27.300382614135742, "global_step": 478865, "epoch": 5769} {"train_loss": -27.073455810546875, "global_step": 478866, "epoch": 5769} {"train_loss": -27.703771591186523, "global_step": 478867, "epoch": 5769} {"train_loss": -26.849096298217773, "global_step": 478868, "epoch": 5769} {"train_loss": -27.358854293823242, "global_step": 478869, "epoch": 5769} {"train_loss": -27.318103790283203, "global_step": 478870, "epoch": 5769} {"train_loss": -27.34051513671875, "global_step": 478871, "epoch": 5769} {"train_loss": -27.410846710205078, "global_step": 478872, "epoch": 5769} {"train_loss": -27.464420318603516, "global_step": 478873, "epoch": 5769} {"train_loss": -27.21247673034668, "global_step": 478874, "epoch": 5769} {"train_loss": -27.62787437438965, "global_step": 478875, "epoch": 5769} {"train_loss": -27.186429977416992, "global_step": 478876, "epoch": 5769} {"train_loss": -27.228330612182617, "global_step": 478877, "epoch": 5769} {"train_loss": -27.368452072143555, "global_step": 478878, "epoch": 5769} {"train_loss": -26.98493003845215, "global_step": 478879, "epoch": 5769} {"train_loss": -27.271041870117188, "global_step": 478880, "epoch": 5769} {"train_loss": -26.838211059570312, "global_step": 478881, "epoch": 5769} {"train_loss": -26.571151733398438, "global_step": 478882, "epoch": 5769} {"train_loss": -26.942977905273438, "global_step": 478883, "epoch": 5769} {"train_loss": -26.912878036499023, "global_step": 478884, "epoch": 5769} {"train_loss": -26.655792236328125, "global_step": 478885, "epoch": 5769} {"train_loss": -27.11005973815918, "global_step": 478886, "epoch": 5769} {"train_loss": -27.206531524658203, "global_step": 478887, "epoch": 5769} {"train_loss": -26.81983757019043, "global_step": 478888, "epoch": 5769} {"train_loss": -26.822473526000977, "global_step": 478889, "epoch": 5769} {"train_loss": -26.850406646728516, "global_step": 478890, "epoch": 5769} {"train_loss": -27.46394157409668, "global_step": 478891, "epoch": 5769} {"train_loss": -27.413183212280273, "global_step": 478892, "epoch": 5769} {"train_loss": -26.790369033813477, "global_step": 478893, "epoch": 5769} {"train_loss": -27.047393798828125, "global_step": 478894, "epoch": 5769} {"train_loss": -26.98251724243164, "global_step": 478895, "epoch": 5769} {"train_loss": -27.17963218688965, "global_step": 478896, "epoch": 5769} {"train_loss": -27.226842880249023, "global_step": 478897, "epoch": 5769} {"train_loss": -27.222436904907227, "global_step": 478898, "epoch": 5769} {"train_loss": -27.412261962890625, "global_step": 478899, "epoch": 5769} {"train_loss": -26.7915096282959, "global_step": 478900, "epoch": 5769} {"train_loss": -26.73908042907715, "global_step": 478901, "epoch": 5769} {"train_loss": -27.44422721862793, "global_step": 478902, "epoch": 5769} {"train_loss": -27.145435333251953, "global_step": 478903, "epoch": 5769} {"train_loss": -27.162250518798828, "global_step": 478904, "epoch": 5769} {"train_loss": -27.165180206298828, "global_step": 478905, "epoch": 5769} {"train_loss": -27.155517578125, "global_step": 478906, "epoch": 5769} {"train_loss": -27.298925399780273, "global_step": 478907, "epoch": 5769} {"train_loss": -27.420812606811523, "global_step": 478908, "epoch": 5769} {"train_loss": -27.0933253276779, "global_step": 478909, "epoch": 5769, "val_loss": 6617896.0} {"train_loss": -26.90095329284668, "global_step": 478910, "epoch": 5770} {"train_loss": -26.66580581665039, "global_step": 478911, "epoch": 5770} {"train_loss": -26.982452392578125, "global_step": 478912, "epoch": 5770} {"train_loss": -26.42780113220215, "global_step": 478913, "epoch": 5770} {"train_loss": -27.196523666381836, "global_step": 478914, "epoch": 5770} {"train_loss": -26.707138061523438, "global_step": 478915, "epoch": 5770} {"train_loss": -27.01997184753418, "global_step": 478916, "epoch": 5770} {"train_loss": -26.880634307861328, "global_step": 478917, "epoch": 5770} {"train_loss": -26.81674575805664, "global_step": 478918, "epoch": 5770} {"train_loss": -26.562381744384766, "global_step": 478919, "epoch": 5770} {"train_loss": -27.080184936523438, "global_step": 478920, "epoch": 5770} {"train_loss": -26.807050704956055, "global_step": 478921, "epoch": 5770} {"train_loss": -27.791748046875, "global_step": 478922, "epoch": 5770} {"train_loss": -26.796178817749023, "global_step": 478923, "epoch": 5770} {"train_loss": -27.326343536376953, "global_step": 478924, "epoch": 5770} {"train_loss": -26.868371963500977, "global_step": 478925, "epoch": 5770} {"train_loss": -26.735076904296875, "global_step": 478926, "epoch": 5770} {"train_loss": -27.12421226501465, "global_step": 478927, "epoch": 5770} {"train_loss": -26.916152954101562, "global_step": 478928, "epoch": 5770} {"train_loss": -27.082483291625977, "global_step": 478929, "epoch": 5770} {"train_loss": -27.070539474487305, "global_step": 478930, "epoch": 5770} {"train_loss": -26.870222091674805, "global_step": 478931, "epoch": 5770} {"train_loss": -27.447309494018555, "global_step": 478932, "epoch": 5770} {"train_loss": -27.410058975219727, "global_step": 478933, "epoch": 5770} {"train_loss": -27.440750122070312, "global_step": 478934, "epoch": 5770} {"train_loss": -27.7766056060791, "global_step": 478935, "epoch": 5770} {"train_loss": -27.1428165435791, "global_step": 478936, "epoch": 5770} {"train_loss": -27.127622604370117, "global_step": 478937, "epoch": 5770} {"train_loss": -27.473974227905273, "global_step": 478938, "epoch": 5770} {"train_loss": -27.133405685424805, "global_step": 478939, "epoch": 5770} {"train_loss": -27.568918228149414, "global_step": 478940, "epoch": 5770} {"train_loss": -26.93246841430664, "global_step": 478941, "epoch": 5770} {"train_loss": -27.31525993347168, "global_step": 478942, "epoch": 5770} {"train_loss": -27.405166625976562, "global_step": 478943, "epoch": 5770} {"train_loss": -27.402307510375977, "global_step": 478944, "epoch": 5770} {"train_loss": -27.38832664489746, "global_step": 478945, "epoch": 5770} {"train_loss": -27.563159942626953, "global_step": 478946, "epoch": 5770} {"train_loss": -27.2366943359375, "global_step": 478947, "epoch": 5770} {"train_loss": -27.44107437133789, "global_step": 478948, "epoch": 5770} {"train_loss": -27.726200103759766, "global_step": 478949, "epoch": 5770} {"train_loss": -27.264785766601562, "global_step": 478950, "epoch": 5770} {"train_loss": -27.440881729125977, "global_step": 478951, "epoch": 5770} {"train_loss": -27.754547119140625, "global_step": 478952, "epoch": 5770} {"train_loss": -27.104196548461914, "global_step": 478953, "epoch": 5770} {"train_loss": -27.0203800201416, "global_step": 478954, "epoch": 5770} {"train_loss": -27.494327545166016, "global_step": 478955, "epoch": 5770} {"train_loss": -27.081588745117188, "global_step": 478956, "epoch": 5770} {"train_loss": -27.625959396362305, "global_step": 478957, "epoch": 5770} {"train_loss": -27.398340225219727, "global_step": 478958, "epoch": 5770} {"train_loss": -27.311716079711914, "global_step": 478959, "epoch": 5770} {"train_loss": -27.659955978393555, "global_step": 478960, "epoch": 5770} {"train_loss": -27.547636032104492, "global_step": 478961, "epoch": 5770} {"train_loss": -27.337125778198242, "global_step": 478962, "epoch": 5770} {"train_loss": -27.357385635375977, "global_step": 478963, "epoch": 5770} {"train_loss": -27.596954345703125, "global_step": 478964, "epoch": 5770} {"train_loss": -27.46864891052246, "global_step": 478965, "epoch": 5770} {"train_loss": -26.91303062438965, "global_step": 478966, "epoch": 5770} {"train_loss": -26.876422882080078, "global_step": 478967, "epoch": 5770} {"train_loss": -26.626916885375977, "global_step": 478968, "epoch": 5770} {"train_loss": -26.59918785095215, "global_step": 478969, "epoch": 5770} {"train_loss": -27.219913482666016, "global_step": 478970, "epoch": 5770} {"train_loss": -27.14668083190918, "global_step": 478971, "epoch": 5770} {"train_loss": -26.6650333404541, "global_step": 478972, "epoch": 5770} {"train_loss": -26.893341064453125, "global_step": 478973, "epoch": 5770} {"train_loss": -26.94254493713379, "global_step": 478974, "epoch": 5770} {"train_loss": -27.218952178955078, "global_step": 478975, "epoch": 5770} {"train_loss": -26.577733993530273, "global_step": 478976, "epoch": 5770} {"train_loss": -26.96573829650879, "global_step": 478977, "epoch": 5770} {"train_loss": -26.696094512939453, "global_step": 478978, "epoch": 5770} {"train_loss": -26.758686065673828, "global_step": 478979, "epoch": 5770} {"train_loss": -27.336149215698242, "global_step": 478980, "epoch": 5770} {"train_loss": -26.854827880859375, "global_step": 478981, "epoch": 5770} {"train_loss": -26.579742431640625, "global_step": 478982, "epoch": 5770} {"train_loss": -27.203641891479492, "global_step": 478983, "epoch": 5770} {"train_loss": -27.301549911499023, "global_step": 478984, "epoch": 5770} {"train_loss": -26.81903076171875, "global_step": 478985, "epoch": 5770} {"train_loss": -26.89898681640625, "global_step": 478986, "epoch": 5770} {"train_loss": -26.870405197143555, "global_step": 478987, "epoch": 5770} {"train_loss": -27.210071563720703, "global_step": 478988, "epoch": 5770} {"train_loss": -27.264551162719727, "global_step": 478989, "epoch": 5770} {"train_loss": -27.239124298095703, "global_step": 478990, "epoch": 5770} {"train_loss": -26.76951026916504, "global_step": 478991, "epoch": 5770} {"train_loss": -27.12219651923122, "global_step": 478992, "epoch": 5770, "val_loss": 6575940.5} {"train_loss": -27.098886489868164, "global_step": 478993, "epoch": 5771} {"train_loss": -26.941064834594727, "global_step": 478994, "epoch": 5771} {"train_loss": -27.175012588500977, "global_step": 478995, "epoch": 5771} {"train_loss": -26.9345703125, "global_step": 478996, "epoch": 5771} {"train_loss": -27.34364128112793, "global_step": 478997, "epoch": 5771} {"train_loss": -26.888671875, "global_step": 478998, "epoch": 5771} {"train_loss": -27.179738998413086, "global_step": 478999, "epoch": 5771} {"train_loss": -27.015966415405273, "global_step": 479000, "epoch": 5771} {"train_loss": -26.911279678344727, "global_step": 479001, "epoch": 5771} {"train_loss": -27.176025390625, "global_step": 479002, "epoch": 5771} {"train_loss": -26.927167892456055, "global_step": 479003, "epoch": 5771} {"train_loss": -27.200891494750977, "global_step": 479004, "epoch": 5771} {"train_loss": -27.619970321655273, "global_step": 479005, "epoch": 5771} {"train_loss": -27.258832931518555, "global_step": 479006, "epoch": 5771} {"train_loss": -27.42034339904785, "global_step": 479007, "epoch": 5771} {"train_loss": -27.56451416015625, "global_step": 479008, "epoch": 5771} {"train_loss": -27.66546630859375, "global_step": 479009, "epoch": 5771} {"train_loss": -27.17266845703125, "global_step": 479010, "epoch": 5771} {"train_loss": -27.322845458984375, "global_step": 479011, "epoch": 5771} {"train_loss": -26.8791446685791, "global_step": 479012, "epoch": 5771} {"train_loss": -27.100183486938477, "global_step": 479013, "epoch": 5771} {"train_loss": -27.10419273376465, "global_step": 479014, "epoch": 5771} {"train_loss": -27.2952823638916, "global_step": 479015, "epoch": 5771} {"train_loss": -27.150501251220703, "global_step": 479016, "epoch": 5771} {"train_loss": -27.314420700073242, "global_step": 479017, "epoch": 5771} {"train_loss": -27.223310470581055, "global_step": 479018, "epoch": 5771} {"train_loss": -27.464557647705078, "global_step": 479019, "epoch": 5771} {"train_loss": -27.354703903198242, "global_step": 479020, "epoch": 5771} {"train_loss": -27.415754318237305, "global_step": 479021, "epoch": 5771} {"train_loss": -27.410877227783203, "global_step": 479022, "epoch": 5771} {"train_loss": -27.382312774658203, "global_step": 479023, "epoch": 5771} {"train_loss": -27.219806671142578, "global_step": 479024, "epoch": 5771} {"train_loss": -26.724578857421875, "global_step": 479025, "epoch": 5771} {"train_loss": -27.49372673034668, "global_step": 479026, "epoch": 5771} {"train_loss": -27.16090965270996, "global_step": 479027, "epoch": 5771} {"train_loss": -27.06426429748535, "global_step": 479028, "epoch": 5771} {"train_loss": -27.1335391998291, "global_step": 479029, "epoch": 5771} {"train_loss": -26.96449089050293, "global_step": 479030, "epoch": 5771} {"train_loss": -27.2447509765625, "global_step": 479031, "epoch": 5771} {"train_loss": -27.260013580322266, "global_step": 479032, "epoch": 5771} {"train_loss": -27.317846298217773, "global_step": 479033, "epoch": 5771} {"train_loss": -27.446125030517578, "global_step": 479034, "epoch": 5771} {"train_loss": -27.558542251586914, "global_step": 479035, "epoch": 5771} {"train_loss": -27.153491973876953, "global_step": 479036, "epoch": 5771} {"train_loss": -27.048879623413086, "global_step": 479037, "epoch": 5771} {"train_loss": -27.576679229736328, "global_step": 479038, "epoch": 5771} {"train_loss": -27.33477210998535, "global_step": 479039, "epoch": 5771} {"train_loss": -27.173141479492188, "global_step": 479040, "epoch": 5771} {"train_loss": -27.261152267456055, "global_step": 479041, "epoch": 5771} {"train_loss": -27.280166625976562, "global_step": 479042, "epoch": 5771} {"train_loss": -27.290502548217773, "global_step": 479043, "epoch": 5771} {"train_loss": -27.054487228393555, "global_step": 479044, "epoch": 5771} {"train_loss": -27.26426124572754, "global_step": 479045, "epoch": 5771} {"train_loss": -27.397079467773438, "global_step": 479046, "epoch": 5771} {"train_loss": -27.40815544128418, "global_step": 479047, "epoch": 5771} {"train_loss": -27.622888565063477, "global_step": 479048, "epoch": 5771} {"train_loss": -26.989744186401367, "global_step": 479049, "epoch": 5771} {"train_loss": -27.4138126373291, "global_step": 479050, "epoch": 5771} {"train_loss": -26.9702205657959, "global_step": 479051, "epoch": 5771} {"train_loss": -27.304187774658203, "global_step": 479052, "epoch": 5771} {"train_loss": -27.625518798828125, "global_step": 479053, "epoch": 5771} {"train_loss": -27.428668975830078, "global_step": 479054, "epoch": 5771} {"train_loss": -27.645727157592773, "global_step": 479055, "epoch": 5771} {"train_loss": -27.612167358398438, "global_step": 479056, "epoch": 5771} {"train_loss": -27.55437660217285, "global_step": 479057, "epoch": 5771} {"train_loss": -27.543384552001953, "global_step": 479058, "epoch": 5771} {"train_loss": -27.460662841796875, "global_step": 479059, "epoch": 5771} {"train_loss": -27.11115074157715, "global_step": 479060, "epoch": 5771} {"train_loss": -27.278858184814453, "global_step": 479061, "epoch": 5771} {"train_loss": -27.15424919128418, "global_step": 479062, "epoch": 5771} {"train_loss": -27.382129669189453, "global_step": 479063, "epoch": 5771} {"train_loss": -27.5562686920166, "global_step": 479064, "epoch": 5771} {"train_loss": -27.291669845581055, "global_step": 479065, "epoch": 5771} {"train_loss": -27.172178268432617, "global_step": 479066, "epoch": 5771} {"train_loss": -27.257226943969727, "global_step": 479067, "epoch": 5771} {"train_loss": -27.369348526000977, "global_step": 479068, "epoch": 5771} {"train_loss": -27.029956817626953, "global_step": 479069, "epoch": 5771} {"train_loss": -27.259077072143555, "global_step": 479070, "epoch": 5771} {"train_loss": -27.440448760986328, "global_step": 479071, "epoch": 5771} {"train_loss": -27.197162628173828, "global_step": 479072, "epoch": 5771} {"train_loss": -27.40712547302246, "global_step": 479073, "epoch": 5771} {"train_loss": -27.45554542541504, "global_step": 479074, "epoch": 5771} {"train_loss": -27.26847754329084, "global_step": 479075, "epoch": 5771, "val_loss": 6598164.5} {"train_loss": -26.470849990844727, "global_step": 479076, "epoch": 5772} {"train_loss": -26.241580963134766, "global_step": 479077, "epoch": 5772} {"train_loss": -26.881305694580078, "global_step": 479078, "epoch": 5772} {"train_loss": -27.052526473999023, "global_step": 479079, "epoch": 5772} {"train_loss": -27.0895938873291, "global_step": 479080, "epoch": 5772} {"train_loss": -26.92122459411621, "global_step": 479081, "epoch": 5772} {"train_loss": -27.35623550415039, "global_step": 479082, "epoch": 5772} {"train_loss": -26.93218421936035, "global_step": 479083, "epoch": 5772} {"train_loss": -27.11236572265625, "global_step": 479084, "epoch": 5772} {"train_loss": -26.976409912109375, "global_step": 479085, "epoch": 5772} {"train_loss": -26.619993209838867, "global_step": 479086, "epoch": 5772} {"train_loss": -26.856781005859375, "global_step": 479087, "epoch": 5772} {"train_loss": -27.07086181640625, "global_step": 479088, "epoch": 5772} {"train_loss": -27.306671142578125, "global_step": 479089, "epoch": 5772} {"train_loss": -26.589099884033203, "global_step": 479090, "epoch": 5772} {"train_loss": -27.149017333984375, "global_step": 479091, "epoch": 5772} {"train_loss": -27.43421745300293, "global_step": 479092, "epoch": 5772} {"train_loss": -26.949426651000977, "global_step": 479093, "epoch": 5772} {"train_loss": -26.807697296142578, "global_step": 479094, "epoch": 5772} {"train_loss": -26.73990249633789, "global_step": 479095, "epoch": 5772} {"train_loss": -27.035247802734375, "global_step": 479096, "epoch": 5772} {"train_loss": -27.004735946655273, "global_step": 479097, "epoch": 5772} {"train_loss": -27.022876739501953, "global_step": 479098, "epoch": 5772} {"train_loss": -27.09803581237793, "global_step": 479099, "epoch": 5772} {"train_loss": -27.173969268798828, "global_step": 479100, "epoch": 5772} {"train_loss": -27.05806541442871, "global_step": 479101, "epoch": 5772} {"train_loss": -26.862003326416016, "global_step": 479102, "epoch": 5772} {"train_loss": -27.263168334960938, "global_step": 479103, "epoch": 5772} {"train_loss": -27.213830947875977, "global_step": 479104, "epoch": 5772} {"train_loss": -27.185993194580078, "global_step": 479105, "epoch": 5772} {"train_loss": -27.40097999572754, "global_step": 479106, "epoch": 5772} {"train_loss": -27.53981590270996, "global_step": 479107, "epoch": 5772} {"train_loss": -27.373876571655273, "global_step": 479108, "epoch": 5772} {"train_loss": -27.138463973999023, "global_step": 479109, "epoch": 5772} {"train_loss": -27.477827072143555, "global_step": 479110, "epoch": 5772} {"train_loss": -27.330427169799805, "global_step": 479111, "epoch": 5772} {"train_loss": -27.263166427612305, "global_step": 479112, "epoch": 5772} {"train_loss": -27.765899658203125, "global_step": 479113, "epoch": 5772} {"train_loss": -27.010648727416992, "global_step": 479114, "epoch": 5772} {"train_loss": -27.259185791015625, "global_step": 479115, "epoch": 5772} {"train_loss": -27.094186782836914, "global_step": 479116, "epoch": 5772} {"train_loss": -27.465991973876953, "global_step": 479117, "epoch": 5772} {"train_loss": -27.234851837158203, "global_step": 479118, "epoch": 5772} {"train_loss": -27.386798858642578, "global_step": 479119, "epoch": 5772} {"train_loss": -27.5289306640625, "global_step": 479120, "epoch": 5772} {"train_loss": -27.329212188720703, "global_step": 479121, "epoch": 5772} {"train_loss": -27.817413330078125, "global_step": 479122, "epoch": 5772} {"train_loss": -27.70720863342285, "global_step": 479123, "epoch": 5772} {"train_loss": -27.50326919555664, "global_step": 479124, "epoch": 5772} {"train_loss": -27.215576171875, "global_step": 479125, "epoch": 5772} {"train_loss": -27.18784523010254, "global_step": 479126, "epoch": 5772} {"train_loss": -27.488672256469727, "global_step": 479127, "epoch": 5772} {"train_loss": -27.428546905517578, "global_step": 479128, "epoch": 5772} {"train_loss": -26.93714714050293, "global_step": 479129, "epoch": 5772} {"train_loss": -27.628040313720703, "global_step": 479130, "epoch": 5772} {"train_loss": -27.715423583984375, "global_step": 479131, "epoch": 5772} {"train_loss": -27.46815299987793, "global_step": 479132, "epoch": 5772} {"train_loss": -27.301618576049805, "global_step": 479133, "epoch": 5772} {"train_loss": -27.633771896362305, "global_step": 479134, "epoch": 5772} {"train_loss": -27.511341094970703, "global_step": 479135, "epoch": 5772} {"train_loss": -27.36783790588379, "global_step": 479136, "epoch": 5772} {"train_loss": -27.023681640625, "global_step": 479137, "epoch": 5772} {"train_loss": -26.3092041015625, "global_step": 479138, "epoch": 5772} {"train_loss": -26.419769287109375, "global_step": 479139, "epoch": 5772} {"train_loss": -26.9449520111084, "global_step": 479140, "epoch": 5772} {"train_loss": -26.39478874206543, "global_step": 479141, "epoch": 5772} {"train_loss": -26.759876251220703, "global_step": 479142, "epoch": 5772} {"train_loss": -26.934019088745117, "global_step": 479143, "epoch": 5772} {"train_loss": -26.88852882385254, "global_step": 479144, "epoch": 5772} {"train_loss": -26.963987350463867, "global_step": 479145, "epoch": 5772} {"train_loss": -26.87748146057129, "global_step": 479146, "epoch": 5772} {"train_loss": -26.82867431640625, "global_step": 479147, "epoch": 5772} {"train_loss": -27.085355758666992, "global_step": 479148, "epoch": 5772} {"train_loss": -26.892934799194336, "global_step": 479149, "epoch": 5772} {"train_loss": -27.20074462890625, "global_step": 479150, "epoch": 5772} {"train_loss": -26.985919952392578, "global_step": 479151, "epoch": 5772} {"train_loss": -27.484487533569336, "global_step": 479152, "epoch": 5772} {"train_loss": -26.63887596130371, "global_step": 479153, "epoch": 5772} {"train_loss": -27.222925186157227, "global_step": 479154, "epoch": 5772} {"train_loss": -27.09315299987793, "global_step": 479155, "epoch": 5772} {"train_loss": -26.924100875854492, "global_step": 479156, "epoch": 5772} {"train_loss": -26.994281768798828, "global_step": 479157, "epoch": 5772} {"train_loss": -27.114920213998083, "global_step": 479158, "epoch": 5772, "val_loss": 6593502.0} {"train_loss": -26.970203399658203, "global_step": 479159, "epoch": 5773} {"train_loss": -27.4083251953125, "global_step": 479160, "epoch": 5773} {"train_loss": -27.451251983642578, "global_step": 479161, "epoch": 5773} {"train_loss": -26.579883575439453, "global_step": 479162, "epoch": 5773} {"train_loss": -26.853992462158203, "global_step": 479163, "epoch": 5773} {"train_loss": -26.431875228881836, "global_step": 479164, "epoch": 5773} {"train_loss": -27.16413688659668, "global_step": 479165, "epoch": 5773} {"train_loss": -27.105182647705078, "global_step": 479166, "epoch": 5773} {"train_loss": -26.846708297729492, "global_step": 479167, "epoch": 5773} {"train_loss": -27.0375919342041, "global_step": 479168, "epoch": 5773} {"train_loss": -27.060302734375, "global_step": 479169, "epoch": 5773} {"train_loss": -27.033044815063477, "global_step": 479170, "epoch": 5773} {"train_loss": -26.931562423706055, "global_step": 479171, "epoch": 5773} {"train_loss": -27.26643180847168, "global_step": 479172, "epoch": 5773} {"train_loss": -26.782377243041992, "global_step": 479173, "epoch": 5773} {"train_loss": -26.955310821533203, "global_step": 479174, "epoch": 5773} {"train_loss": -27.327878952026367, "global_step": 479175, "epoch": 5773} {"train_loss": -27.1368408203125, "global_step": 479176, "epoch": 5773} {"train_loss": -26.754117965698242, "global_step": 479177, "epoch": 5773} {"train_loss": -27.527896881103516, "global_step": 479178, "epoch": 5773} {"train_loss": -27.172876358032227, "global_step": 479179, "epoch": 5773} {"train_loss": -27.240446090698242, "global_step": 479180, "epoch": 5773} {"train_loss": -27.61590576171875, "global_step": 479181, "epoch": 5773} {"train_loss": -27.515893936157227, "global_step": 479182, "epoch": 5773} {"train_loss": -27.300220489501953, "global_step": 479183, "epoch": 5773} {"train_loss": -27.530841827392578, "global_step": 479184, "epoch": 5773} {"train_loss": -27.1156005859375, "global_step": 479185, "epoch": 5773} {"train_loss": -27.413406372070312, "global_step": 479186, "epoch": 5773} {"train_loss": -27.454147338867188, "global_step": 479187, "epoch": 5773} {"train_loss": -27.237539291381836, "global_step": 479188, "epoch": 5773} {"train_loss": -27.142425537109375, "global_step": 479189, "epoch": 5773} {"train_loss": -27.40204429626465, "global_step": 479190, "epoch": 5773} {"train_loss": -27.28968620300293, "global_step": 479191, "epoch": 5773} {"train_loss": -27.415191650390625, "global_step": 479192, "epoch": 5773} {"train_loss": -27.487274169921875, "global_step": 479193, "epoch": 5773} {"train_loss": -27.3327693939209, "global_step": 479194, "epoch": 5773} {"train_loss": -27.31434440612793, "global_step": 479195, "epoch": 5773} {"train_loss": -27.201953887939453, "global_step": 479196, "epoch": 5773} {"train_loss": -27.17426109313965, "global_step": 479197, "epoch": 5773} {"train_loss": -27.305891036987305, "global_step": 479198, "epoch": 5773} {"train_loss": -27.1401424407959, "global_step": 479199, "epoch": 5773} {"train_loss": -26.803403854370117, "global_step": 479200, "epoch": 5773} {"train_loss": -26.62031364440918, "global_step": 479201, "epoch": 5773} {"train_loss": -25.476903915405273, "global_step": 479202, "epoch": 5773} {"train_loss": -26.4681453704834, "global_step": 479203, "epoch": 5773} {"train_loss": -27.098636627197266, "global_step": 479204, "epoch": 5773} {"train_loss": -26.932397842407227, "global_step": 479205, "epoch": 5773} {"train_loss": -26.601409912109375, "global_step": 479206, "epoch": 5773} {"train_loss": -27.019119262695312, "global_step": 479207, "epoch": 5773} {"train_loss": -26.93958854675293, "global_step": 479208, "epoch": 5773} {"train_loss": -26.789682388305664, "global_step": 479209, "epoch": 5773} {"train_loss": -26.592206954956055, "global_step": 479210, "epoch": 5773} {"train_loss": -27.236486434936523, "global_step": 479211, "epoch": 5773} {"train_loss": -27.103137969970703, "global_step": 479212, "epoch": 5773} {"train_loss": -27.449167251586914, "global_step": 479213, "epoch": 5773} {"train_loss": -27.403356552124023, "global_step": 479214, "epoch": 5773} {"train_loss": -26.95951271057129, "global_step": 479215, "epoch": 5773} {"train_loss": -27.328235626220703, "global_step": 479216, "epoch": 5773} {"train_loss": -27.265600204467773, "global_step": 479217, "epoch": 5773} {"train_loss": -27.28439712524414, "global_step": 479218, "epoch": 5773} {"train_loss": -26.96231460571289, "global_step": 479219, "epoch": 5773} {"train_loss": -27.0523681640625, "global_step": 479220, "epoch": 5773} {"train_loss": -27.043079376220703, "global_step": 479221, "epoch": 5773} {"train_loss": -27.28157615661621, "global_step": 479222, "epoch": 5773} {"train_loss": -27.3516902923584, "global_step": 479223, "epoch": 5773} {"train_loss": -27.37808609008789, "global_step": 479224, "epoch": 5773} {"train_loss": -27.38612937927246, "global_step": 479225, "epoch": 5773} {"train_loss": -27.120975494384766, "global_step": 479226, "epoch": 5773} {"train_loss": -26.95924949645996, "global_step": 479227, "epoch": 5773} {"train_loss": -27.404773712158203, "global_step": 479228, "epoch": 5773} {"train_loss": -27.27573013305664, "global_step": 479229, "epoch": 5773} {"train_loss": -27.300037384033203, "global_step": 479230, "epoch": 5773} {"train_loss": -27.198822021484375, "global_step": 479231, "epoch": 5773} {"train_loss": -27.664352416992188, "global_step": 479232, "epoch": 5773} {"train_loss": -27.27422523498535, "global_step": 479233, "epoch": 5773} {"train_loss": -27.312585830688477, "global_step": 479234, "epoch": 5773} {"train_loss": -27.237600326538086, "global_step": 479235, "epoch": 5773} {"train_loss": -27.227140426635742, "global_step": 479236, "epoch": 5773} {"train_loss": -27.274438858032227, "global_step": 479237, "epoch": 5773} {"train_loss": -27.1295166015625, "global_step": 479238, "epoch": 5773} {"train_loss": -27.846837997436523, "global_step": 479239, "epoch": 5773} {"train_loss": -27.5396728515625, "global_step": 479240, "epoch": 5773} {"train_loss": -27.12734488981316, "global_step": 479241, "epoch": 5773, "val_loss": 6599983.0} {"train_loss": -24.130382537841797, "global_step": 479242, "epoch": 5774} {"train_loss": -20.766944885253906, "global_step": 479243, "epoch": 5774} {"train_loss": -25.30985450744629, "global_step": 479244, "epoch": 5774} {"train_loss": -24.696630477905273, "global_step": 479245, "epoch": 5774} {"train_loss": -26.36771583557129, "global_step": 479246, "epoch": 5774} {"train_loss": -24.868148803710938, "global_step": 479247, "epoch": 5774} {"train_loss": -25.740482330322266, "global_step": 479248, "epoch": 5774} {"train_loss": -25.761743545532227, "global_step": 479249, "epoch": 5774} {"train_loss": -25.52692222595215, "global_step": 479250, "epoch": 5774} {"train_loss": -26.453420639038086, "global_step": 479251, "epoch": 5774} {"train_loss": -26.228357315063477, "global_step": 479252, "epoch": 5774} {"train_loss": -25.76243019104004, "global_step": 479253, "epoch": 5774} {"train_loss": -26.06925392150879, "global_step": 479254, "epoch": 5774} {"train_loss": -26.5405330657959, "global_step": 479255, "epoch": 5774} {"train_loss": -26.1336727142334, "global_step": 479256, "epoch": 5774} {"train_loss": -26.368167877197266, "global_step": 479257, "epoch": 5774} {"train_loss": -26.412017822265625, "global_step": 479258, "epoch": 5774} {"train_loss": -26.164398193359375, "global_step": 479259, "epoch": 5774} {"train_loss": -26.702600479125977, "global_step": 479260, "epoch": 5774} {"train_loss": -26.13028907775879, "global_step": 479261, "epoch": 5774} {"train_loss": -26.102828979492188, "global_step": 479262, "epoch": 5774} {"train_loss": -26.460235595703125, "global_step": 479263, "epoch": 5774} {"train_loss": -26.43361473083496, "global_step": 479264, "epoch": 5774} {"train_loss": -26.557218551635742, "global_step": 479265, "epoch": 5774} {"train_loss": -26.367095947265625, "global_step": 479266, "epoch": 5774} {"train_loss": -26.758975982666016, "global_step": 479267, "epoch": 5774} {"train_loss": -26.672155380249023, "global_step": 479268, "epoch": 5774} {"train_loss": -26.71540641784668, "global_step": 479269, "epoch": 5774} {"train_loss": -26.7410888671875, "global_step": 479270, "epoch": 5774} {"train_loss": -26.762067794799805, "global_step": 479271, "epoch": 5774} {"train_loss": -26.493467330932617, "global_step": 479272, "epoch": 5774} {"train_loss": -27.214750289916992, "global_step": 479273, "epoch": 5774} {"train_loss": -26.585458755493164, "global_step": 479274, "epoch": 5774} {"train_loss": -27.02225685119629, "global_step": 479275, "epoch": 5774} {"train_loss": -26.885534286499023, "global_step": 479276, "epoch": 5774} {"train_loss": -26.5532283782959, "global_step": 479277, "epoch": 5774} {"train_loss": -26.830631256103516, "global_step": 479278, "epoch": 5774} {"train_loss": -27.100330352783203, "global_step": 479279, "epoch": 5774} {"train_loss": -26.910993576049805, "global_step": 479280, "epoch": 5774} {"train_loss": -27.16621971130371, "global_step": 479281, "epoch": 5774} {"train_loss": -27.321203231811523, "global_step": 479282, "epoch": 5774} {"train_loss": -26.962934494018555, "global_step": 479283, "epoch": 5774} {"train_loss": -27.07020378112793, "global_step": 479284, "epoch": 5774} {"train_loss": -27.304187774658203, "global_step": 479285, "epoch": 5774} {"train_loss": -27.29939842224121, "global_step": 479286, "epoch": 5774} {"train_loss": -27.098007202148438, "global_step": 479287, "epoch": 5774} {"train_loss": -26.585195541381836, "global_step": 479288, "epoch": 5774} {"train_loss": -27.027128219604492, "global_step": 479289, "epoch": 5774} {"train_loss": -27.157453536987305, "global_step": 479290, "epoch": 5774} {"train_loss": -27.423542022705078, "global_step": 479291, "epoch": 5774} {"train_loss": -27.478544235229492, "global_step": 479292, "epoch": 5774} {"train_loss": -27.313215255737305, "global_step": 479293, "epoch": 5774} {"train_loss": -27.13165283203125, "global_step": 479294, "epoch": 5774} {"train_loss": -27.125385284423828, "global_step": 479295, "epoch": 5774} {"train_loss": -27.236957550048828, "global_step": 479296, "epoch": 5774} {"train_loss": -27.367902755737305, "global_step": 479297, "epoch": 5774} {"train_loss": -27.274810791015625, "global_step": 479298, "epoch": 5774} {"train_loss": -27.38004493713379, "global_step": 479299, "epoch": 5774} {"train_loss": -27.66139030456543, "global_step": 479300, "epoch": 5774} {"train_loss": -27.33390235900879, "global_step": 479301, "epoch": 5774} {"train_loss": -27.131895065307617, "global_step": 479302, "epoch": 5774} {"train_loss": -27.383630752563477, "global_step": 479303, "epoch": 5774} {"train_loss": -27.122512817382812, "global_step": 479304, "epoch": 5774} {"train_loss": -27.437158584594727, "global_step": 479305, "epoch": 5774} {"train_loss": -27.49639320373535, "global_step": 479306, "epoch": 5774} {"train_loss": -27.180282592773438, "global_step": 479307, "epoch": 5774} {"train_loss": -27.3021297454834, "global_step": 479308, "epoch": 5774} {"train_loss": -27.429147720336914, "global_step": 479309, "epoch": 5774} {"train_loss": -26.92984962463379, "global_step": 479310, "epoch": 5774} {"train_loss": -27.433618545532227, "global_step": 479311, "epoch": 5774} {"train_loss": -27.2131290435791, "global_step": 479312, "epoch": 5774} {"train_loss": -26.90654945373535, "global_step": 479313, "epoch": 5774} {"train_loss": -27.03140640258789, "global_step": 479314, "epoch": 5774} {"train_loss": -26.79193687438965, "global_step": 479315, "epoch": 5774} {"train_loss": -27.167633056640625, "global_step": 479316, "epoch": 5774} {"train_loss": -26.825910568237305, "global_step": 479317, "epoch": 5774} {"train_loss": -26.78326988220215, "global_step": 479318, "epoch": 5774} {"train_loss": -27.41066551208496, "global_step": 479319, "epoch": 5774} {"train_loss": -27.009328842163086, "global_step": 479320, "epoch": 5774} {"train_loss": -26.989913940429688, "global_step": 479321, "epoch": 5774} {"train_loss": -26.550077438354492, "global_step": 479322, "epoch": 5774} {"train_loss": -26.50088882446289, "global_step": 479323, "epoch": 5774} {"train_loss": -26.67604979549546, "global_step": 479324, "epoch": 5774, "val_loss": 6483589.0} {"train_loss": -25.753820419311523, "global_step": 479325, "epoch": 5775} {"train_loss": -26.02105712890625, "global_step": 479326, "epoch": 5775} {"train_loss": -26.802967071533203, "global_step": 479327, "epoch": 5775} {"train_loss": -26.28325843811035, "global_step": 479328, "epoch": 5775} {"train_loss": -26.49324607849121, "global_step": 479329, "epoch": 5775} {"train_loss": -26.36029624938965, "global_step": 479330, "epoch": 5775} {"train_loss": -26.2542724609375, "global_step": 479331, "epoch": 5775} {"train_loss": -26.849271774291992, "global_step": 479332, "epoch": 5775} {"train_loss": -26.503141403198242, "global_step": 479333, "epoch": 5775} {"train_loss": -26.669931411743164, "global_step": 479334, "epoch": 5775} {"train_loss": -27.036895751953125, "global_step": 479335, "epoch": 5775} {"train_loss": -26.742761611938477, "global_step": 479336, "epoch": 5775} {"train_loss": -26.876440048217773, "global_step": 479337, "epoch": 5775} {"train_loss": -26.58125114440918, "global_step": 479338, "epoch": 5775} {"train_loss": -26.821577072143555, "global_step": 479339, "epoch": 5775} {"train_loss": -27.049335479736328, "global_step": 479340, "epoch": 5775} {"train_loss": -26.688093185424805, "global_step": 479341, "epoch": 5775} {"train_loss": -26.980712890625, "global_step": 479342, "epoch": 5775} {"train_loss": -26.817487716674805, "global_step": 479343, "epoch": 5775} {"train_loss": -27.122329711914062, "global_step": 479344, "epoch": 5775} {"train_loss": -26.9641056060791, "global_step": 479345, "epoch": 5775} {"train_loss": -27.00668716430664, "global_step": 479346, "epoch": 5775} {"train_loss": -27.046161651611328, "global_step": 479347, "epoch": 5775} {"train_loss": -27.048757553100586, "global_step": 479348, "epoch": 5775} {"train_loss": -27.174421310424805, "global_step": 479349, "epoch": 5775} {"train_loss": -27.281463623046875, "global_step": 479350, "epoch": 5775} {"train_loss": -27.10076904296875, "global_step": 479351, "epoch": 5775} {"train_loss": -27.382736206054688, "global_step": 479352, "epoch": 5775} {"train_loss": -27.3129825592041, "global_step": 479353, "epoch": 5775} {"train_loss": -27.20644187927246, "global_step": 479354, "epoch": 5775} {"train_loss": -27.14179039001465, "global_step": 479355, "epoch": 5775} {"train_loss": -27.21589469909668, "global_step": 479356, "epoch": 5775} {"train_loss": -27.195114135742188, "global_step": 479357, "epoch": 5775} {"train_loss": -27.0761661529541, "global_step": 479358, "epoch": 5775} {"train_loss": -27.479965209960938, "global_step": 479359, "epoch": 5775} {"train_loss": -27.722028732299805, "global_step": 479360, "epoch": 5775} {"train_loss": -27.423749923706055, "global_step": 479361, "epoch": 5775} {"train_loss": -27.181365966796875, "global_step": 479362, "epoch": 5775} {"train_loss": -27.609119415283203, "global_step": 479363, "epoch": 5775} {"train_loss": -27.39375114440918, "global_step": 479364, "epoch": 5775} {"train_loss": -27.17547035217285, "global_step": 479365, "epoch": 5775} {"train_loss": -27.481983184814453, "global_step": 479366, "epoch": 5775} {"train_loss": -27.352405548095703, "global_step": 479367, "epoch": 5775} {"train_loss": -27.278528213500977, "global_step": 479368, "epoch": 5775} {"train_loss": -27.127939224243164, "global_step": 479369, "epoch": 5775} {"train_loss": -27.110504150390625, "global_step": 479370, "epoch": 5775} {"train_loss": -26.828659057617188, "global_step": 479371, "epoch": 5775} {"train_loss": -26.521284103393555, "global_step": 479372, "epoch": 5775} {"train_loss": -26.332550048828125, "global_step": 479373, "epoch": 5775} {"train_loss": -26.093048095703125, "global_step": 479374, "epoch": 5775} {"train_loss": -26.857961654663086, "global_step": 479375, "epoch": 5775} {"train_loss": -27.076156616210938, "global_step": 479376, "epoch": 5775} {"train_loss": -27.005706787109375, "global_step": 479377, "epoch": 5775} {"train_loss": -27.456302642822266, "global_step": 479378, "epoch": 5775} {"train_loss": -27.272201538085938, "global_step": 479379, "epoch": 5775} {"train_loss": -27.184860229492188, "global_step": 479380, "epoch": 5775} {"train_loss": -27.03333854675293, "global_step": 479381, "epoch": 5775} {"train_loss": -26.832305908203125, "global_step": 479382, "epoch": 5775} {"train_loss": -27.379735946655273, "global_step": 479383, "epoch": 5775} {"train_loss": -27.29912757873535, "global_step": 479384, "epoch": 5775} {"train_loss": -27.03223991394043, "global_step": 479385, "epoch": 5775} {"train_loss": -27.17413902282715, "global_step": 479386, "epoch": 5775} {"train_loss": -26.797353744506836, "global_step": 479387, "epoch": 5775} {"train_loss": -27.14410972595215, "global_step": 479388, "epoch": 5775} {"train_loss": -27.104642868041992, "global_step": 479389, "epoch": 5775} {"train_loss": -26.984724044799805, "global_step": 479390, "epoch": 5775} {"train_loss": -27.744953155517578, "global_step": 479391, "epoch": 5775} {"train_loss": -27.2590389251709, "global_step": 479392, "epoch": 5775} {"train_loss": -27.369831085205078, "global_step": 479393, "epoch": 5775} {"train_loss": -27.329679489135742, "global_step": 479394, "epoch": 5775} {"train_loss": -27.137372970581055, "global_step": 479395, "epoch": 5775} {"train_loss": -27.263219833374023, "global_step": 479396, "epoch": 5775} {"train_loss": -27.11158561706543, "global_step": 479397, "epoch": 5775} {"train_loss": -27.148618698120117, "global_step": 479398, "epoch": 5775} {"train_loss": -27.49409294128418, "global_step": 479399, "epoch": 5775} {"train_loss": -27.585065841674805, "global_step": 479400, "epoch": 5775} {"train_loss": -27.19037437438965, "global_step": 479401, "epoch": 5775} {"train_loss": -27.411640167236328, "global_step": 479402, "epoch": 5775} {"train_loss": -27.388242721557617, "global_step": 479403, "epoch": 5775} {"train_loss": -27.27994155883789, "global_step": 479404, "epoch": 5775} {"train_loss": -26.968557357788086, "global_step": 479405, "epoch": 5775} {"train_loss": -27.205352783203125, "global_step": 479406, "epoch": 5775} {"train_loss": -27.053702411881414, "global_step": 479407, "epoch": 5775, "val_loss": 6583160.5} {"train_loss": -26.947729110717773, "global_step": 479408, "epoch": 5776} {"train_loss": -26.565906524658203, "global_step": 479409, "epoch": 5776} {"train_loss": -26.990644454956055, "global_step": 479410, "epoch": 5776} {"train_loss": -26.909521102905273, "global_step": 479411, "epoch": 5776} {"train_loss": -27.273038864135742, "global_step": 479412, "epoch": 5776} {"train_loss": -26.938806533813477, "global_step": 479413, "epoch": 5776} {"train_loss": -27.2513427734375, "global_step": 479414, "epoch": 5776} {"train_loss": -27.118515014648438, "global_step": 479415, "epoch": 5776} {"train_loss": -26.845922470092773, "global_step": 479416, "epoch": 5776} {"train_loss": -27.26948356628418, "global_step": 479417, "epoch": 5776} {"train_loss": -27.151792526245117, "global_step": 479418, "epoch": 5776} {"train_loss": -27.19240379333496, "global_step": 479419, "epoch": 5776} {"train_loss": -27.124114990234375, "global_step": 479420, "epoch": 5776} {"train_loss": -26.766407012939453, "global_step": 479421, "epoch": 5776} {"train_loss": -27.183515548706055, "global_step": 479422, "epoch": 5776} {"train_loss": -27.00337028503418, "global_step": 479423, "epoch": 5776} {"train_loss": -27.26279640197754, "global_step": 479424, "epoch": 5776} {"train_loss": -27.162261962890625, "global_step": 479425, "epoch": 5776} {"train_loss": -26.956327438354492, "global_step": 479426, "epoch": 5776} {"train_loss": -27.279651641845703, "global_step": 479427, "epoch": 5776} {"train_loss": -27.2464599609375, "global_step": 479428, "epoch": 5776} {"train_loss": -27.001550674438477, "global_step": 479429, "epoch": 5776} {"train_loss": -27.13128662109375, "global_step": 479430, "epoch": 5776} {"train_loss": -27.12973403930664, "global_step": 479431, "epoch": 5776} {"train_loss": -27.5971622467041, "global_step": 479432, "epoch": 5776} {"train_loss": -27.017486572265625, "global_step": 479433, "epoch": 5776} {"train_loss": -26.985559463500977, "global_step": 479434, "epoch": 5776} {"train_loss": -26.831289291381836, "global_step": 479435, "epoch": 5776} {"train_loss": -26.825651168823242, "global_step": 479436, "epoch": 5776} {"train_loss": -27.312122344970703, "global_step": 479437, "epoch": 5776} {"train_loss": -26.935840606689453, "global_step": 479438, "epoch": 5776} {"train_loss": -26.938608169555664, "global_step": 479439, "epoch": 5776} {"train_loss": -27.31145668029785, "global_step": 479440, "epoch": 5776} {"train_loss": -26.855636596679688, "global_step": 479441, "epoch": 5776} {"train_loss": -27.6002140045166, "global_step": 479442, "epoch": 5776} {"train_loss": -26.92274284362793, "global_step": 479443, "epoch": 5776} {"train_loss": -26.738977432250977, "global_step": 479444, "epoch": 5776} {"train_loss": -27.303922653198242, "global_step": 479445, "epoch": 5776} {"train_loss": -26.851978302001953, "global_step": 479446, "epoch": 5776} {"train_loss": -27.089874267578125, "global_step": 479447, "epoch": 5776} {"train_loss": -26.90220069885254, "global_step": 479448, "epoch": 5776} {"train_loss": -26.703445434570312, "global_step": 479449, "epoch": 5776} {"train_loss": -27.426061630249023, "global_step": 479450, "epoch": 5776} {"train_loss": -27.342126846313477, "global_step": 479451, "epoch": 5776} {"train_loss": -26.998075485229492, "global_step": 479452, "epoch": 5776} {"train_loss": -27.230304718017578, "global_step": 479453, "epoch": 5776} {"train_loss": -27.540302276611328, "global_step": 479454, "epoch": 5776} {"train_loss": -27.21705436706543, "global_step": 479455, "epoch": 5776} {"train_loss": -27.1866397857666, "global_step": 479456, "epoch": 5776} {"train_loss": -27.1732120513916, "global_step": 479457, "epoch": 5776} {"train_loss": -26.8032169342041, "global_step": 479458, "epoch": 5776} {"train_loss": -27.19276237487793, "global_step": 479459, "epoch": 5776} {"train_loss": -27.170074462890625, "global_step": 479460, "epoch": 5776} {"train_loss": -27.103803634643555, "global_step": 479461, "epoch": 5776} {"train_loss": -27.002899169921875, "global_step": 479462, "epoch": 5776} {"train_loss": -27.48512840270996, "global_step": 479463, "epoch": 5776} {"train_loss": -27.34065055847168, "global_step": 479464, "epoch": 5776} {"train_loss": -27.296567916870117, "global_step": 479465, "epoch": 5776} {"train_loss": -27.57368278503418, "global_step": 479466, "epoch": 5776} {"train_loss": -26.94402503967285, "global_step": 479467, "epoch": 5776} {"train_loss": -27.76459312438965, "global_step": 479468, "epoch": 5776} {"train_loss": -27.234058380126953, "global_step": 479469, "epoch": 5776} {"train_loss": -27.25983238220215, "global_step": 479470, "epoch": 5776} {"train_loss": -27.31683349609375, "global_step": 479471, "epoch": 5776} {"train_loss": -27.244583129882812, "global_step": 479472, "epoch": 5776} {"train_loss": -27.103015899658203, "global_step": 479473, "epoch": 5776} {"train_loss": -27.120874404907227, "global_step": 479474, "epoch": 5776} {"train_loss": -26.889148712158203, "global_step": 479475, "epoch": 5776} {"train_loss": -27.168399810791016, "global_step": 479476, "epoch": 5776} {"train_loss": -27.21211814880371, "global_step": 479477, "epoch": 5776} {"train_loss": -27.494367599487305, "global_step": 479478, "epoch": 5776} {"train_loss": -27.335281372070312, "global_step": 479479, "epoch": 5776} {"train_loss": -27.369321823120117, "global_step": 479480, "epoch": 5776} {"train_loss": -27.3399715423584, "global_step": 479481, "epoch": 5776} {"train_loss": -27.264591217041016, "global_step": 479482, "epoch": 5776} {"train_loss": -26.964096069335938, "global_step": 479483, "epoch": 5776} {"train_loss": -27.264753341674805, "global_step": 479484, "epoch": 5776} {"train_loss": -27.57708740234375, "global_step": 479485, "epoch": 5776} {"train_loss": -27.230945587158203, "global_step": 479486, "epoch": 5776} {"train_loss": -27.37725257873535, "global_step": 479487, "epoch": 5776} {"train_loss": -26.932209014892578, "global_step": 479488, "epoch": 5776} {"train_loss": -27.119543075561523, "global_step": 479489, "epoch": 5776} {"train_loss": -27.130593426256294, "global_step": 479490, "epoch": 5776, "val_loss": 6540813.0} {"train_loss": -26.867773056030273, "global_step": 479491, "epoch": 5777} {"train_loss": -26.531763076782227, "global_step": 479492, "epoch": 5777} {"train_loss": -26.565717697143555, "global_step": 479493, "epoch": 5777} {"train_loss": -26.171955108642578, "global_step": 479494, "epoch": 5777} {"train_loss": -26.39190101623535, "global_step": 479495, "epoch": 5777} {"train_loss": -26.08017921447754, "global_step": 479496, "epoch": 5777} {"train_loss": -26.384084701538086, "global_step": 479497, "epoch": 5777} {"train_loss": -26.709115982055664, "global_step": 479498, "epoch": 5777} {"train_loss": -25.941390991210938, "global_step": 479499, "epoch": 5777} {"train_loss": -26.464813232421875, "global_step": 479500, "epoch": 5777} {"train_loss": -26.529748916625977, "global_step": 479501, "epoch": 5777} {"train_loss": -26.6641845703125, "global_step": 479502, "epoch": 5777} {"train_loss": -26.82452964782715, "global_step": 479503, "epoch": 5777} {"train_loss": -26.15594482421875, "global_step": 479504, "epoch": 5777} {"train_loss": -26.7064151763916, "global_step": 479505, "epoch": 5777} {"train_loss": -26.610620498657227, "global_step": 479506, "epoch": 5777} {"train_loss": -26.71625328063965, "global_step": 479507, "epoch": 5777} {"train_loss": -26.845870971679688, "global_step": 479508, "epoch": 5777} {"train_loss": -26.750898361206055, "global_step": 479509, "epoch": 5777} {"train_loss": -27.074054718017578, "global_step": 479510, "epoch": 5777} {"train_loss": -26.560821533203125, "global_step": 479511, "epoch": 5777} {"train_loss": -26.598388671875, "global_step": 479512, "epoch": 5777} {"train_loss": -27.06196403503418, "global_step": 479513, "epoch": 5777} {"train_loss": -26.829639434814453, "global_step": 479514, "epoch": 5777} {"train_loss": -27.33636474609375, "global_step": 479515, "epoch": 5777} {"train_loss": -26.766071319580078, "global_step": 479516, "epoch": 5777} {"train_loss": -26.770029067993164, "global_step": 479517, "epoch": 5777} {"train_loss": -27.02931022644043, "global_step": 479518, "epoch": 5777} {"train_loss": -27.15105628967285, "global_step": 479519, "epoch": 5777} {"train_loss": -27.285425186157227, "global_step": 479520, "epoch": 5777} {"train_loss": -27.27729606628418, "global_step": 479521, "epoch": 5777} {"train_loss": -27.318700790405273, "global_step": 479522, "epoch": 5777} {"train_loss": -26.87586784362793, "global_step": 479523, "epoch": 5777} {"train_loss": -27.131383895874023, "global_step": 479524, "epoch": 5777} {"train_loss": -27.127954483032227, "global_step": 479525, "epoch": 5777} {"train_loss": -27.273984909057617, "global_step": 479526, "epoch": 5777} {"train_loss": -27.335952758789062, "global_step": 479527, "epoch": 5777} {"train_loss": -27.24513053894043, "global_step": 479528, "epoch": 5777} {"train_loss": -27.33680534362793, "global_step": 479529, "epoch": 5777} {"train_loss": -27.16718101501465, "global_step": 479530, "epoch": 5777} {"train_loss": -27.680755615234375, "global_step": 479531, "epoch": 5777} {"train_loss": -27.477426528930664, "global_step": 479532, "epoch": 5777} {"train_loss": -27.322711944580078, "global_step": 479533, "epoch": 5777} {"train_loss": -27.099470138549805, "global_step": 479534, "epoch": 5777} {"train_loss": -27.28728675842285, "global_step": 479535, "epoch": 5777} {"train_loss": -27.2835693359375, "global_step": 479536, "epoch": 5777} {"train_loss": -27.223438262939453, "global_step": 479537, "epoch": 5777} {"train_loss": -27.4941463470459, "global_step": 479538, "epoch": 5777} {"train_loss": -27.401554107666016, "global_step": 479539, "epoch": 5777} {"train_loss": -27.31490135192871, "global_step": 479540, "epoch": 5777} {"train_loss": -27.420154571533203, "global_step": 479541, "epoch": 5777} {"train_loss": -27.337854385375977, "global_step": 479542, "epoch": 5777} {"train_loss": -27.236547470092773, "global_step": 479543, "epoch": 5777} {"train_loss": -27.028451919555664, "global_step": 479544, "epoch": 5777} {"train_loss": -27.274145126342773, "global_step": 479545, "epoch": 5777} {"train_loss": -27.68743324279785, "global_step": 479546, "epoch": 5777} {"train_loss": -27.497507095336914, "global_step": 479547, "epoch": 5777} {"train_loss": -27.34902000427246, "global_step": 479548, "epoch": 5777} {"train_loss": -27.325292587280273, "global_step": 479549, "epoch": 5777} {"train_loss": -27.308637619018555, "global_step": 479550, "epoch": 5777} {"train_loss": -27.31536293029785, "global_step": 479551, "epoch": 5777} {"train_loss": -27.193328857421875, "global_step": 479552, "epoch": 5777} {"train_loss": -27.338552474975586, "global_step": 479553, "epoch": 5777} {"train_loss": -27.221099853515625, "global_step": 479554, "epoch": 5777} {"train_loss": -27.251953125, "global_step": 479555, "epoch": 5777} {"train_loss": -27.094501495361328, "global_step": 479556, "epoch": 5777} {"train_loss": -27.265607833862305, "global_step": 479557, "epoch": 5777} {"train_loss": -27.346820831298828, "global_step": 479558, "epoch": 5777} {"train_loss": -27.54119300842285, "global_step": 479559, "epoch": 5777} {"train_loss": -27.497241973876953, "global_step": 479560, "epoch": 5777} {"train_loss": -27.25537109375, "global_step": 479561, "epoch": 5777} {"train_loss": -27.163501739501953, "global_step": 479562, "epoch": 5777} {"train_loss": -27.178409576416016, "global_step": 479563, "epoch": 5777} {"train_loss": -27.119922637939453, "global_step": 479564, "epoch": 5777} {"train_loss": -27.096057891845703, "global_step": 479565, "epoch": 5777} {"train_loss": -26.992956161499023, "global_step": 479566, "epoch": 5777} {"train_loss": -27.42026138305664, "global_step": 479567, "epoch": 5777} {"train_loss": -27.335779190063477, "global_step": 479568, "epoch": 5777} {"train_loss": -27.08745765686035, "global_step": 479569, "epoch": 5777} {"train_loss": -27.1259765625, "global_step": 479570, "epoch": 5777} {"train_loss": -26.741621017456055, "global_step": 479571, "epoch": 5777} {"train_loss": -27.086523056030273, "global_step": 479572, "epoch": 5777} {"train_loss": -27.070833367037487, "global_step": 479573, "epoch": 5777, "val_loss": 6594856.0} {"train_loss": -26.955175399780273, "global_step": 479574, "epoch": 5778} {"train_loss": -26.14166831970215, "global_step": 479575, "epoch": 5778} {"train_loss": -26.621274948120117, "global_step": 479576, "epoch": 5778} {"train_loss": -26.737279891967773, "global_step": 479577, "epoch": 5778} {"train_loss": -26.670917510986328, "global_step": 479578, "epoch": 5778} {"train_loss": -27.00971794128418, "global_step": 479579, "epoch": 5778} {"train_loss": -25.925146102905273, "global_step": 479580, "epoch": 5778} {"train_loss": -26.900833129882812, "global_step": 479581, "epoch": 5778} {"train_loss": -26.38201332092285, "global_step": 479582, "epoch": 5778} {"train_loss": -26.830175399780273, "global_step": 479583, "epoch": 5778} {"train_loss": -26.83254051208496, "global_step": 479584, "epoch": 5778} {"train_loss": -26.745227813720703, "global_step": 479585, "epoch": 5778} {"train_loss": -26.9102783203125, "global_step": 479586, "epoch": 5778} {"train_loss": -27.006561279296875, "global_step": 479587, "epoch": 5778} {"train_loss": -27.111618041992188, "global_step": 479588, "epoch": 5778} {"train_loss": -26.895627975463867, "global_step": 479589, "epoch": 5778} {"train_loss": -26.995370864868164, "global_step": 479590, "epoch": 5778} {"train_loss": -26.563074111938477, "global_step": 479591, "epoch": 5778} {"train_loss": -26.886199951171875, "global_step": 479592, "epoch": 5778} {"train_loss": -26.824247360229492, "global_step": 479593, "epoch": 5778} {"train_loss": -26.950836181640625, "global_step": 479594, "epoch": 5778} {"train_loss": -27.092273712158203, "global_step": 479595, "epoch": 5778} {"train_loss": -26.80844497680664, "global_step": 479596, "epoch": 5778} {"train_loss": -27.02033805847168, "global_step": 479597, "epoch": 5778} {"train_loss": -27.27789306640625, "global_step": 479598, "epoch": 5778} {"train_loss": -27.37294578552246, "global_step": 479599, "epoch": 5778} {"train_loss": -27.03059959411621, "global_step": 479600, "epoch": 5778} {"train_loss": -27.503204345703125, "global_step": 479601, "epoch": 5778} {"train_loss": -27.02546501159668, "global_step": 479602, "epoch": 5778} {"train_loss": -27.08991813659668, "global_step": 479603, "epoch": 5778} {"train_loss": -27.161401748657227, "global_step": 479604, "epoch": 5778} {"train_loss": -27.17287254333496, "global_step": 479605, "epoch": 5778} {"train_loss": -27.510395050048828, "global_step": 479606, "epoch": 5778} {"train_loss": -27.141101837158203, "global_step": 479607, "epoch": 5778} {"train_loss": -27.24872398376465, "global_step": 479608, "epoch": 5778} {"train_loss": -27.083642959594727, "global_step": 479609, "epoch": 5778} {"train_loss": -27.67066764831543, "global_step": 479610, "epoch": 5778} {"train_loss": -27.2479248046875, "global_step": 479611, "epoch": 5778} {"train_loss": -27.4494686126709, "global_step": 479612, "epoch": 5778} {"train_loss": -27.4663143157959, "global_step": 479613, "epoch": 5778} {"train_loss": -27.097320556640625, "global_step": 479614, "epoch": 5778} {"train_loss": -27.23223304748535, "global_step": 479615, "epoch": 5778} {"train_loss": -27.413223266601562, "global_step": 479616, "epoch": 5778} {"train_loss": -27.5125675201416, "global_step": 479617, "epoch": 5778} {"train_loss": -27.686981201171875, "global_step": 479618, "epoch": 5778} {"train_loss": -27.516820907592773, "global_step": 479619, "epoch": 5778} {"train_loss": -27.21250343322754, "global_step": 479620, "epoch": 5778} {"train_loss": -27.121667861938477, "global_step": 479621, "epoch": 5778} {"train_loss": -27.005823135375977, "global_step": 479622, "epoch": 5778} {"train_loss": -27.325037002563477, "global_step": 479623, "epoch": 5778} {"train_loss": -27.13287925720215, "global_step": 479624, "epoch": 5778} {"train_loss": -27.189001083374023, "global_step": 479625, "epoch": 5778} {"train_loss": -27.483732223510742, "global_step": 479626, "epoch": 5778} {"train_loss": -27.442768096923828, "global_step": 479627, "epoch": 5778} {"train_loss": -27.296247482299805, "global_step": 479628, "epoch": 5778} {"train_loss": -27.10491943359375, "global_step": 479629, "epoch": 5778} {"train_loss": -27.674560546875, "global_step": 479630, "epoch": 5778} {"train_loss": -27.328842163085938, "global_step": 479631, "epoch": 5778} {"train_loss": -27.074695587158203, "global_step": 479632, "epoch": 5778} {"train_loss": -27.500959396362305, "global_step": 479633, "epoch": 5778} {"train_loss": -27.598791122436523, "global_step": 479634, "epoch": 5778} {"train_loss": -27.20631217956543, "global_step": 479635, "epoch": 5778} {"train_loss": -27.412139892578125, "global_step": 479636, "epoch": 5778} {"train_loss": -27.58194351196289, "global_step": 479637, "epoch": 5778} {"train_loss": -27.6475887298584, "global_step": 479638, "epoch": 5778} {"train_loss": -27.4378604888916, "global_step": 479639, "epoch": 5778} {"train_loss": -27.604333877563477, "global_step": 479640, "epoch": 5778} {"train_loss": -27.24129295349121, "global_step": 479641, "epoch": 5778} {"train_loss": -27.4782772064209, "global_step": 479642, "epoch": 5778} {"train_loss": -27.294843673706055, "global_step": 479643, "epoch": 5778} {"train_loss": -27.726917266845703, "global_step": 479644, "epoch": 5778} {"train_loss": -27.41410255432129, "global_step": 479645, "epoch": 5778} {"train_loss": -27.3387451171875, "global_step": 479646, "epoch": 5778} {"train_loss": -27.924116134643555, "global_step": 479647, "epoch": 5778} {"train_loss": -27.224075317382812, "global_step": 479648, "epoch": 5778} {"train_loss": -26.789838790893555, "global_step": 479649, "epoch": 5778} {"train_loss": -25.793655395507812, "global_step": 479650, "epoch": 5778} {"train_loss": -22.65860939025879, "global_step": 479651, "epoch": 5778} {"train_loss": -23.345855712890625, "global_step": 479652, "epoch": 5778} {"train_loss": -26.500463485717773, "global_step": 479653, "epoch": 5778} {"train_loss": -26.166412353515625, "global_step": 479654, "epoch": 5778} {"train_loss": -26.159320831298828, "global_step": 479655, "epoch": 5778} {"train_loss": -27.018117284200276, "global_step": 479656, "epoch": 5778, "val_loss": 6594777.5} {"train_loss": -26.235763549804688, "global_step": 479657, "epoch": 5779} {"train_loss": -25.528350830078125, "global_step": 479658, "epoch": 5779} {"train_loss": -25.632080078125, "global_step": 479659, "epoch": 5779} {"train_loss": -26.314441680908203, "global_step": 479660, "epoch": 5779} {"train_loss": -25.516530990600586, "global_step": 479661, "epoch": 5779} {"train_loss": -26.321149826049805, "global_step": 479662, "epoch": 5779} {"train_loss": -26.38014030456543, "global_step": 479663, "epoch": 5779} {"train_loss": -26.178253173828125, "global_step": 479664, "epoch": 5779} {"train_loss": -26.20843505859375, "global_step": 479665, "epoch": 5779} {"train_loss": -26.3122501373291, "global_step": 479666, "epoch": 5779} {"train_loss": -26.204137802124023, "global_step": 479667, "epoch": 5779} {"train_loss": -26.292448043823242, "global_step": 479668, "epoch": 5779} {"train_loss": -26.597951889038086, "global_step": 479669, "epoch": 5779} {"train_loss": -26.56754493713379, "global_step": 479670, "epoch": 5779} {"train_loss": -26.46613121032715, "global_step": 479671, "epoch": 5779} {"train_loss": -26.500812530517578, "global_step": 479672, "epoch": 5779} {"train_loss": -26.820707321166992, "global_step": 479673, "epoch": 5779} {"train_loss": -26.49745750427246, "global_step": 479674, "epoch": 5779} {"train_loss": -26.350820541381836, "global_step": 479675, "epoch": 5779} {"train_loss": -26.722028732299805, "global_step": 479676, "epoch": 5779} {"train_loss": -26.426898956298828, "global_step": 479677, "epoch": 5779} {"train_loss": -26.845081329345703, "global_step": 479678, "epoch": 5779} {"train_loss": -27.003942489624023, "global_step": 479679, "epoch": 5779} {"train_loss": -26.889114379882812, "global_step": 479680, "epoch": 5779} {"train_loss": -26.72102928161621, "global_step": 479681, "epoch": 5779} {"train_loss": -26.984766006469727, "global_step": 479682, "epoch": 5779} {"train_loss": -27.291934967041016, "global_step": 479683, "epoch": 5779} {"train_loss": -27.226850509643555, "global_step": 479684, "epoch": 5779} {"train_loss": -27.0758056640625, "global_step": 479685, "epoch": 5779} {"train_loss": -27.136335372924805, "global_step": 479686, "epoch": 5779} {"train_loss": -26.6102294921875, "global_step": 479687, "epoch": 5779} {"train_loss": -26.797897338867188, "global_step": 479688, "epoch": 5779} {"train_loss": -26.919403076171875, "global_step": 479689, "epoch": 5779} {"train_loss": -26.884735107421875, "global_step": 479690, "epoch": 5779} {"train_loss": -27.046178817749023, "global_step": 479691, "epoch": 5779} {"train_loss": -27.322650909423828, "global_step": 479692, "epoch": 5779} {"train_loss": -27.171483993530273, "global_step": 479693, "epoch": 5779} {"train_loss": -26.93751335144043, "global_step": 479694, "epoch": 5779} {"train_loss": -27.2152042388916, "global_step": 479695, "epoch": 5779} {"train_loss": -27.266754150390625, "global_step": 479696, "epoch": 5779} {"train_loss": -27.29279899597168, "global_step": 479697, "epoch": 5779} {"train_loss": -26.941680908203125, "global_step": 479698, "epoch": 5779} {"train_loss": -27.357812881469727, "global_step": 479699, "epoch": 5779} {"train_loss": -27.0342960357666, "global_step": 479700, "epoch": 5779} {"train_loss": -26.97541618347168, "global_step": 479701, "epoch": 5779} {"train_loss": -27.206918716430664, "global_step": 479702, "epoch": 5779} {"train_loss": -27.23687744140625, "global_step": 479703, "epoch": 5779} {"train_loss": -27.216955184936523, "global_step": 479704, "epoch": 5779} {"train_loss": -27.28777503967285, "global_step": 479705, "epoch": 5779} {"train_loss": -27.00227165222168, "global_step": 479706, "epoch": 5779} {"train_loss": -27.171422958374023, "global_step": 479707, "epoch": 5779} {"train_loss": -27.15787696838379, "global_step": 479708, "epoch": 5779} {"train_loss": -26.945478439331055, "global_step": 479709, "epoch": 5779} {"train_loss": -27.32697105407715, "global_step": 479710, "epoch": 5779} {"train_loss": -27.231470108032227, "global_step": 479711, "epoch": 5779} {"train_loss": -27.668386459350586, "global_step": 479712, "epoch": 5779} {"train_loss": -27.5037841796875, "global_step": 479713, "epoch": 5779} {"train_loss": -27.36689567565918, "global_step": 479714, "epoch": 5779} {"train_loss": -27.09061050415039, "global_step": 479715, "epoch": 5779} {"train_loss": -27.155670166015625, "global_step": 479716, "epoch": 5779} {"train_loss": -27.206562042236328, "global_step": 479717, "epoch": 5779} {"train_loss": -26.929533004760742, "global_step": 479718, "epoch": 5779} {"train_loss": -26.901962280273438, "global_step": 479719, "epoch": 5779} {"train_loss": -26.807321548461914, "global_step": 479720, "epoch": 5779} {"train_loss": -27.23213005065918, "global_step": 479721, "epoch": 5779} {"train_loss": -27.522626876831055, "global_step": 479722, "epoch": 5779} {"train_loss": -27.507627487182617, "global_step": 479723, "epoch": 5779} {"train_loss": -27.194665908813477, "global_step": 479724, "epoch": 5779} {"train_loss": -26.9000244140625, "global_step": 479725, "epoch": 5779} {"train_loss": -27.5015811920166, "global_step": 479726, "epoch": 5779} {"train_loss": -27.19049072265625, "global_step": 479727, "epoch": 5779} {"train_loss": -27.526752471923828, "global_step": 479728, "epoch": 5779} {"train_loss": -27.5175838470459, "global_step": 479729, "epoch": 5779} {"train_loss": -27.6844482421875, "global_step": 479730, "epoch": 5779} {"train_loss": -27.281326293945312, "global_step": 479731, "epoch": 5779} {"train_loss": -26.92291259765625, "global_step": 479732, "epoch": 5779} {"train_loss": -27.425582885742188, "global_step": 479733, "epoch": 5779} {"train_loss": -27.05983543395996, "global_step": 479734, "epoch": 5779} {"train_loss": -26.937036514282227, "global_step": 479735, "epoch": 5779} {"train_loss": -27.29896354675293, "global_step": 479736, "epoch": 5779} {"train_loss": -27.438251495361328, "global_step": 479737, "epoch": 5779} {"train_loss": -27.309606552124023, "global_step": 479738, "epoch": 5779} {"train_loss": -26.965764907469232, "global_step": 479739, "epoch": 5779, "val_loss": 6768246.0} {"train_loss": -23.271093368530273, "global_step": 479740, "epoch": 5780} {"train_loss": -24.37342071533203, "global_step": 479741, "epoch": 5780} {"train_loss": -25.38470458984375, "global_step": 479742, "epoch": 5780} {"train_loss": -24.38490867614746, "global_step": 479743, "epoch": 5780} {"train_loss": -24.517248153686523, "global_step": 479744, "epoch": 5780} {"train_loss": -24.93914222717285, "global_step": 479745, "epoch": 5780} {"train_loss": -24.34908676147461, "global_step": 479746, "epoch": 5780} {"train_loss": -25.666828155517578, "global_step": 479747, "epoch": 5780} {"train_loss": -24.729841232299805, "global_step": 479748, "epoch": 5780} {"train_loss": -25.73975944519043, "global_step": 479749, "epoch": 5780} {"train_loss": -25.827558517456055, "global_step": 479750, "epoch": 5780} {"train_loss": -25.57441520690918, "global_step": 479751, "epoch": 5780} {"train_loss": -25.955778121948242, "global_step": 479752, "epoch": 5780} {"train_loss": -25.8061466217041, "global_step": 479753, "epoch": 5780} {"train_loss": -25.830915451049805, "global_step": 479754, "epoch": 5780} {"train_loss": -25.74094581604004, "global_step": 479755, "epoch": 5780} {"train_loss": -25.95245933532715, "global_step": 479756, "epoch": 5780} {"train_loss": -25.94394302368164, "global_step": 479757, "epoch": 5780} {"train_loss": -26.120441436767578, "global_step": 479758, "epoch": 5780} {"train_loss": -26.16424560546875, "global_step": 479759, "epoch": 5780} {"train_loss": -25.84392738342285, "global_step": 479760, "epoch": 5780} {"train_loss": -25.90293312072754, "global_step": 479761, "epoch": 5780} {"train_loss": -26.181177139282227, "global_step": 479762, "epoch": 5780} {"train_loss": -26.459991455078125, "global_step": 479763, "epoch": 5780} {"train_loss": -26.305395126342773, "global_step": 479764, "epoch": 5780} {"train_loss": -26.24627113342285, "global_step": 479765, "epoch": 5780} {"train_loss": -26.46599769592285, "global_step": 479766, "epoch": 5780} {"train_loss": -26.277002334594727, "global_step": 479767, "epoch": 5780} {"train_loss": -26.501916885375977, "global_step": 479768, "epoch": 5780} {"train_loss": -26.663183212280273, "global_step": 479769, "epoch": 5780} {"train_loss": -26.68885612487793, "global_step": 479770, "epoch": 5780} {"train_loss": -26.816650390625, "global_step": 479771, "epoch": 5780} {"train_loss": -26.737085342407227, "global_step": 479772, "epoch": 5780} {"train_loss": -26.949188232421875, "global_step": 479773, "epoch": 5780} {"train_loss": -26.70887565612793, "global_step": 479774, "epoch": 5780} {"train_loss": -26.977468490600586, "global_step": 479775, "epoch": 5780} {"train_loss": -26.833227157592773, "global_step": 479776, "epoch": 5780} {"train_loss": -27.12054443359375, "global_step": 479777, "epoch": 5780} {"train_loss": -27.230548858642578, "global_step": 479778, "epoch": 5780} {"train_loss": -27.03175163269043, "global_step": 479779, "epoch": 5780} {"train_loss": -27.144819259643555, "global_step": 479780, "epoch": 5780} {"train_loss": -27.14800453186035, "global_step": 479781, "epoch": 5780} {"train_loss": -27.257770538330078, "global_step": 479782, "epoch": 5780} {"train_loss": -27.269926071166992, "global_step": 479783, "epoch": 5780} {"train_loss": -27.038110733032227, "global_step": 479784, "epoch": 5780} {"train_loss": -27.49131202697754, "global_step": 479785, "epoch": 5780} {"train_loss": -27.079059600830078, "global_step": 479786, "epoch": 5780} {"train_loss": -27.22266960144043, "global_step": 479787, "epoch": 5780} {"train_loss": -27.177356719970703, "global_step": 479788, "epoch": 5780} {"train_loss": -27.260000228881836, "global_step": 479789, "epoch": 5780} {"train_loss": -27.166156768798828, "global_step": 479790, "epoch": 5780} {"train_loss": -27.492170333862305, "global_step": 479791, "epoch": 5780} {"train_loss": -27.488019943237305, "global_step": 479792, "epoch": 5780} {"train_loss": -27.32374382019043, "global_step": 479793, "epoch": 5780} {"train_loss": -27.08390235900879, "global_step": 479794, "epoch": 5780} {"train_loss": -27.458545684814453, "global_step": 479795, "epoch": 5780} {"train_loss": -26.98318862915039, "global_step": 479796, "epoch": 5780} {"train_loss": -27.105854034423828, "global_step": 479797, "epoch": 5780} {"train_loss": -27.533315658569336, "global_step": 479798, "epoch": 5780} {"train_loss": -27.52594566345215, "global_step": 479799, "epoch": 5780} {"train_loss": -27.39777946472168, "global_step": 479800, "epoch": 5780} {"train_loss": -27.150426864624023, "global_step": 479801, "epoch": 5780} {"train_loss": -27.343128204345703, "global_step": 479802, "epoch": 5780} {"train_loss": -27.5924129486084, "global_step": 479803, "epoch": 5780} {"train_loss": -27.378284454345703, "global_step": 479804, "epoch": 5780} {"train_loss": -27.61854362487793, "global_step": 479805, "epoch": 5780} {"train_loss": -27.42535400390625, "global_step": 479806, "epoch": 5780} {"train_loss": -27.569446563720703, "global_step": 479807, "epoch": 5780} {"train_loss": -27.45814323425293, "global_step": 479808, "epoch": 5780} {"train_loss": -27.33251953125, "global_step": 479809, "epoch": 5780} {"train_loss": -27.399763107299805, "global_step": 479810, "epoch": 5780} {"train_loss": -27.479328155517578, "global_step": 479811, "epoch": 5780} {"train_loss": -27.6600284576416, "global_step": 479812, "epoch": 5780} {"train_loss": -27.556686401367188, "global_step": 479813, "epoch": 5780} {"train_loss": -27.353830337524414, "global_step": 479814, "epoch": 5780} {"train_loss": -27.271469116210938, "global_step": 479815, "epoch": 5780} {"train_loss": -27.72296142578125, "global_step": 479816, "epoch": 5780} {"train_loss": -27.635757446289062, "global_step": 479817, "epoch": 5780} {"train_loss": -27.169570922851562, "global_step": 479818, "epoch": 5780} {"train_loss": -27.471637725830078, "global_step": 479819, "epoch": 5780} {"train_loss": -27.390705108642578, "global_step": 479820, "epoch": 5780} {"train_loss": -27.641393661499023, "global_step": 479821, "epoch": 5780} {"train_loss": -26.66980072389166, "global_step": 479822, "epoch": 5780, "val_loss": 6603185.5} {"train_loss": -23.26129150390625, "global_step": 479823, "epoch": 5781} {"train_loss": -16.39354705810547, "global_step": 479824, "epoch": 5781} {"train_loss": -23.437597274780273, "global_step": 479825, "epoch": 5781} {"train_loss": -24.766935348510742, "global_step": 479826, "epoch": 5781} {"train_loss": -25.785825729370117, "global_step": 479827, "epoch": 5781} {"train_loss": -24.77339744567871, "global_step": 479828, "epoch": 5781} {"train_loss": -26.080896377563477, "global_step": 479829, "epoch": 5781} {"train_loss": -25.906265258789062, "global_step": 479830, "epoch": 5781} {"train_loss": -25.891693115234375, "global_step": 479831, "epoch": 5781} {"train_loss": -25.89375114440918, "global_step": 479832, "epoch": 5781} {"train_loss": -26.241962432861328, "global_step": 479833, "epoch": 5781} {"train_loss": -25.919281005859375, "global_step": 479834, "epoch": 5781} {"train_loss": -25.698720932006836, "global_step": 479835, "epoch": 5781} {"train_loss": -26.179712295532227, "global_step": 479836, "epoch": 5781} {"train_loss": -25.983306884765625, "global_step": 479837, "epoch": 5781} {"train_loss": -26.320392608642578, "global_step": 479838, "epoch": 5781} {"train_loss": -26.42424964904785, "global_step": 479839, "epoch": 5781} {"train_loss": -26.348926544189453, "global_step": 479840, "epoch": 5781} {"train_loss": -26.375043869018555, "global_step": 479841, "epoch": 5781} {"train_loss": -26.390735626220703, "global_step": 479842, "epoch": 5781} {"train_loss": -26.6727237701416, "global_step": 479843, "epoch": 5781} {"train_loss": -26.15996742248535, "global_step": 479844, "epoch": 5781} {"train_loss": -26.552099227905273, "global_step": 479845, "epoch": 5781} {"train_loss": -26.479333877563477, "global_step": 479846, "epoch": 5781} {"train_loss": -26.615869522094727, "global_step": 479847, "epoch": 5781} {"train_loss": -26.54656982421875, "global_step": 479848, "epoch": 5781} {"train_loss": -26.488386154174805, "global_step": 479849, "epoch": 5781} {"train_loss": -26.362329483032227, "global_step": 479850, "epoch": 5781} {"train_loss": -26.708906173706055, "global_step": 479851, "epoch": 5781} {"train_loss": -26.616779327392578, "global_step": 479852, "epoch": 5781} {"train_loss": -26.84442710876465, "global_step": 479853, "epoch": 5781} {"train_loss": -27.256078720092773, "global_step": 479854, "epoch": 5781} {"train_loss": -26.889606475830078, "global_step": 479855, "epoch": 5781} {"train_loss": -26.849430084228516, "global_step": 479856, "epoch": 5781} {"train_loss": -26.95977210998535, "global_step": 479857, "epoch": 5781} {"train_loss": -26.7209415435791, "global_step": 479858, "epoch": 5781} {"train_loss": -26.666259765625, "global_step": 479859, "epoch": 5781} {"train_loss": -26.880334854125977, "global_step": 479860, "epoch": 5781} {"train_loss": -27.00226402282715, "global_step": 479861, "epoch": 5781} {"train_loss": -26.74506187438965, "global_step": 479862, "epoch": 5781} {"train_loss": -26.851882934570312, "global_step": 479863, "epoch": 5781} {"train_loss": -26.79559898376465, "global_step": 479864, "epoch": 5781} {"train_loss": -27.092275619506836, "global_step": 479865, "epoch": 5781} {"train_loss": -27.141773223876953, "global_step": 479866, "epoch": 5781} {"train_loss": -27.10382652282715, "global_step": 479867, "epoch": 5781} {"train_loss": -27.005014419555664, "global_step": 479868, "epoch": 5781} {"train_loss": -27.07478904724121, "global_step": 479869, "epoch": 5781} {"train_loss": -27.257471084594727, "global_step": 479870, "epoch": 5781} {"train_loss": -27.131895065307617, "global_step": 479871, "epoch": 5781} {"train_loss": -27.24411964416504, "global_step": 479872, "epoch": 5781} {"train_loss": -27.479660034179688, "global_step": 479873, "epoch": 5781} {"train_loss": -27.229705810546875, "global_step": 479874, "epoch": 5781} {"train_loss": -26.980810165405273, "global_step": 479875, "epoch": 5781} {"train_loss": -27.449987411499023, "global_step": 479876, "epoch": 5781} {"train_loss": -27.365814208984375, "global_step": 479877, "epoch": 5781} {"train_loss": -27.73286247253418, "global_step": 479878, "epoch": 5781} {"train_loss": -27.057798385620117, "global_step": 479879, "epoch": 5781} {"train_loss": -27.460285186767578, "global_step": 479880, "epoch": 5781} {"train_loss": -27.117101669311523, "global_step": 479881, "epoch": 5781} {"train_loss": -27.240026473999023, "global_step": 479882, "epoch": 5781} {"train_loss": -27.304044723510742, "global_step": 479883, "epoch": 5781} {"train_loss": -27.34797477722168, "global_step": 479884, "epoch": 5781} {"train_loss": -27.178668975830078, "global_step": 479885, "epoch": 5781} {"train_loss": -27.295801162719727, "global_step": 479886, "epoch": 5781} {"train_loss": -26.954233169555664, "global_step": 479887, "epoch": 5781} {"train_loss": -27.560205459594727, "global_step": 479888, "epoch": 5781} {"train_loss": -27.2522029876709, "global_step": 479889, "epoch": 5781} {"train_loss": -27.20204734802246, "global_step": 479890, "epoch": 5781} {"train_loss": -26.996580123901367, "global_step": 479891, "epoch": 5781} {"train_loss": -27.3042049407959, "global_step": 479892, "epoch": 5781} {"train_loss": -27.30848503112793, "global_step": 479893, "epoch": 5781} {"train_loss": -27.3155517578125, "global_step": 479894, "epoch": 5781} {"train_loss": -26.89350700378418, "global_step": 479895, "epoch": 5781} {"train_loss": -26.800809860229492, "global_step": 479896, "epoch": 5781} {"train_loss": -27.014188766479492, "global_step": 479897, "epoch": 5781} {"train_loss": -27.3034610748291, "global_step": 479898, "epoch": 5781} {"train_loss": -27.329282760620117, "global_step": 479899, "epoch": 5781} {"train_loss": -27.108686447143555, "global_step": 479900, "epoch": 5781} {"train_loss": -27.431058883666992, "global_step": 479901, "epoch": 5781} {"train_loss": -27.418838500976562, "global_step": 479902, "epoch": 5781} {"train_loss": -26.80682945251465, "global_step": 479903, "epoch": 5781} {"train_loss": -27.293210983276367, "global_step": 479904, "epoch": 5781} {"train_loss": -26.59499729110534, "global_step": 479905, "epoch": 5781, "val_loss": 6601355.0} {"train_loss": -26.452402114868164, "global_step": 479906, "epoch": 5782} {"train_loss": -26.863449096679688, "global_step": 479907, "epoch": 5782} {"train_loss": -26.6535701751709, "global_step": 479908, "epoch": 5782} {"train_loss": -27.128713607788086, "global_step": 479909, "epoch": 5782} {"train_loss": -26.744421005249023, "global_step": 479910, "epoch": 5782} {"train_loss": -26.916990280151367, "global_step": 479911, "epoch": 5782} {"train_loss": -26.7536563873291, "global_step": 479912, "epoch": 5782} {"train_loss": -26.89447593688965, "global_step": 479913, "epoch": 5782} {"train_loss": -26.665271759033203, "global_step": 479914, "epoch": 5782} {"train_loss": -27.043853759765625, "global_step": 479915, "epoch": 5782} {"train_loss": -26.852537155151367, "global_step": 479916, "epoch": 5782} {"train_loss": -27.067066192626953, "global_step": 479917, "epoch": 5782} {"train_loss": -26.9769344329834, "global_step": 479918, "epoch": 5782} {"train_loss": -27.0242919921875, "global_step": 479919, "epoch": 5782} {"train_loss": -27.164941787719727, "global_step": 479920, "epoch": 5782} {"train_loss": -27.22507667541504, "global_step": 479921, "epoch": 5782} {"train_loss": -26.864582061767578, "global_step": 479922, "epoch": 5782} {"train_loss": -27.183332443237305, "global_step": 479923, "epoch": 5782} {"train_loss": -26.442249298095703, "global_step": 479924, "epoch": 5782} {"train_loss": -27.078201293945312, "global_step": 479925, "epoch": 5782} {"train_loss": -26.561386108398438, "global_step": 479926, "epoch": 5782} {"train_loss": -27.107589721679688, "global_step": 479927, "epoch": 5782} {"train_loss": -26.82332420349121, "global_step": 479928, "epoch": 5782} {"train_loss": -27.000768661499023, "global_step": 479929, "epoch": 5782} {"train_loss": -26.733234405517578, "global_step": 479930, "epoch": 5782} {"train_loss": -27.242944717407227, "global_step": 479931, "epoch": 5782} {"train_loss": -26.858036041259766, "global_step": 479932, "epoch": 5782} {"train_loss": -26.969562530517578, "global_step": 479933, "epoch": 5782} {"train_loss": -27.122900009155273, "global_step": 479934, "epoch": 5782} {"train_loss": -27.24320411682129, "global_step": 479935, "epoch": 5782} {"train_loss": -27.18857765197754, "global_step": 479936, "epoch": 5782} {"train_loss": -27.072452545166016, "global_step": 479937, "epoch": 5782} {"train_loss": -27.212024688720703, "global_step": 479938, "epoch": 5782} {"train_loss": -27.227148056030273, "global_step": 479939, "epoch": 5782} {"train_loss": -26.915246963500977, "global_step": 479940, "epoch": 5782} {"train_loss": -26.900150299072266, "global_step": 479941, "epoch": 5782} {"train_loss": -27.6333065032959, "global_step": 479942, "epoch": 5782} {"train_loss": -27.432798385620117, "global_step": 479943, "epoch": 5782} {"train_loss": -27.147048950195312, "global_step": 479944, "epoch": 5782} {"train_loss": -27.018207550048828, "global_step": 479945, "epoch": 5782} {"train_loss": -27.53510093688965, "global_step": 479946, "epoch": 5782} {"train_loss": -27.704559326171875, "global_step": 479947, "epoch": 5782} {"train_loss": -27.490568161010742, "global_step": 479948, "epoch": 5782} {"train_loss": -27.3670711517334, "global_step": 479949, "epoch": 5782} {"train_loss": -27.055387496948242, "global_step": 479950, "epoch": 5782} {"train_loss": -27.384138107299805, "global_step": 479951, "epoch": 5782} {"train_loss": -27.28681755065918, "global_step": 479952, "epoch": 5782} {"train_loss": -27.15995216369629, "global_step": 479953, "epoch": 5782} {"train_loss": -27.827865600585938, "global_step": 479954, "epoch": 5782} {"train_loss": -27.7061767578125, "global_step": 479955, "epoch": 5782} {"train_loss": -27.119140625, "global_step": 479956, "epoch": 5782} {"train_loss": -27.29214859008789, "global_step": 479957, "epoch": 5782} {"train_loss": -27.36639404296875, "global_step": 479958, "epoch": 5782} {"train_loss": -27.284900665283203, "global_step": 479959, "epoch": 5782} {"train_loss": -27.539289474487305, "global_step": 479960, "epoch": 5782} {"train_loss": -27.259023666381836, "global_step": 479961, "epoch": 5782} {"train_loss": -27.458532333374023, "global_step": 479962, "epoch": 5782} {"train_loss": -27.69434928894043, "global_step": 479963, "epoch": 5782} {"train_loss": -27.058759689331055, "global_step": 479964, "epoch": 5782} {"train_loss": -27.332693099975586, "global_step": 479965, "epoch": 5782} {"train_loss": -27.3917236328125, "global_step": 479966, "epoch": 5782} {"train_loss": -27.536264419555664, "global_step": 479967, "epoch": 5782} {"train_loss": -27.32074546813965, "global_step": 479968, "epoch": 5782} {"train_loss": -27.44498062133789, "global_step": 479969, "epoch": 5782} {"train_loss": -26.940567016601562, "global_step": 479970, "epoch": 5782} {"train_loss": -27.476715087890625, "global_step": 479971, "epoch": 5782} {"train_loss": -27.560504913330078, "global_step": 479972, "epoch": 5782} {"train_loss": -27.234846115112305, "global_step": 479973, "epoch": 5782} {"train_loss": -27.66050148010254, "global_step": 479974, "epoch": 5782} {"train_loss": -27.58477783203125, "global_step": 479975, "epoch": 5782} {"train_loss": -27.461877822875977, "global_step": 479976, "epoch": 5782} {"train_loss": -27.481525421142578, "global_step": 479977, "epoch": 5782} {"train_loss": -27.215576171875, "global_step": 479978, "epoch": 5782} {"train_loss": -27.272510528564453, "global_step": 479979, "epoch": 5782} {"train_loss": -27.118499755859375, "global_step": 479980, "epoch": 5782} {"train_loss": -27.285810470581055, "global_step": 479981, "epoch": 5782} {"train_loss": -27.547378540039062, "global_step": 479982, "epoch": 5782} {"train_loss": -27.3111515045166, "global_step": 479983, "epoch": 5782} {"train_loss": -27.650623321533203, "global_step": 479984, "epoch": 5782} {"train_loss": -27.184406280517578, "global_step": 479985, "epoch": 5782} {"train_loss": -27.050445556640625, "global_step": 479986, "epoch": 5782} {"train_loss": -26.861738204956055, "global_step": 479987, "epoch": 5782} {"train_loss": -27.190080458859363, "global_step": 479988, "epoch": 5782, "val_loss": 6623568.0} {"train_loss": -26.584421157836914, "global_step": 479989, "epoch": 5783} {"train_loss": -25.329355239868164, "global_step": 479990, "epoch": 5783} {"train_loss": -25.541975021362305, "global_step": 479991, "epoch": 5783} {"train_loss": -26.81438636779785, "global_step": 479992, "epoch": 5783} {"train_loss": -26.783218383789062, "global_step": 479993, "epoch": 5783} {"train_loss": -26.08454704284668, "global_step": 479994, "epoch": 5783} {"train_loss": -26.65680503845215, "global_step": 479995, "epoch": 5783} {"train_loss": -26.64674186706543, "global_step": 479996, "epoch": 5783} {"train_loss": -26.4896240234375, "global_step": 479997, "epoch": 5783} {"train_loss": -26.99485206604004, "global_step": 479998, "epoch": 5783} {"train_loss": -26.751922607421875, "global_step": 479999, "epoch": 5783} {"train_loss": -26.620222091674805, "global_step": 480000, "epoch": 5783} {"train_loss": -27.219324111938477, "global_step": 480001, "epoch": 5783} {"train_loss": -26.712705612182617, "global_step": 480002, "epoch": 5783} {"train_loss": -26.672550201416016, "global_step": 480003, "epoch": 5783} {"train_loss": -27.29949951171875, "global_step": 480004, "epoch": 5783} {"train_loss": -26.852191925048828, "global_step": 480005, "epoch": 5783} {"train_loss": -26.97585105895996, "global_step": 480006, "epoch": 5783} {"train_loss": -26.726285934448242, "global_step": 480007, "epoch": 5783} {"train_loss": -27.31416130065918, "global_step": 480008, "epoch": 5783} {"train_loss": -27.070226669311523, "global_step": 480009, "epoch": 5783} {"train_loss": -27.0018253326416, "global_step": 480010, "epoch": 5783} {"train_loss": -27.215795516967773, "global_step": 480011, "epoch": 5783} {"train_loss": -26.880903244018555, "global_step": 480012, "epoch": 5783} {"train_loss": -27.00690269470215, "global_step": 480013, "epoch": 5783} {"train_loss": -26.993972778320312, "global_step": 480014, "epoch": 5783} {"train_loss": -27.594186782836914, "global_step": 480015, "epoch": 5783} {"train_loss": -26.985309600830078, "global_step": 480016, "epoch": 5783} {"train_loss": -27.21527099609375, "global_step": 480017, "epoch": 5783} {"train_loss": -27.1392822265625, "global_step": 480018, "epoch": 5783} {"train_loss": -27.03718376159668, "global_step": 480019, "epoch": 5783} {"train_loss": -27.411218643188477, "global_step": 480020, "epoch": 5783} {"train_loss": -27.136011123657227, "global_step": 480021, "epoch": 5783} {"train_loss": -27.163938522338867, "global_step": 480022, "epoch": 5783} {"train_loss": -27.039480209350586, "global_step": 480023, "epoch": 5783} {"train_loss": -27.013593673706055, "global_step": 480024, "epoch": 5783} {"train_loss": -27.691761016845703, "global_step": 480025, "epoch": 5783} {"train_loss": -27.198888778686523, "global_step": 480026, "epoch": 5783} {"train_loss": -27.290119171142578, "global_step": 480027, "epoch": 5783} {"train_loss": -27.347686767578125, "global_step": 480028, "epoch": 5783} {"train_loss": -27.177045822143555, "global_step": 480029, "epoch": 5783} {"train_loss": -27.102773666381836, "global_step": 480030, "epoch": 5783} {"train_loss": -27.455459594726562, "global_step": 480031, "epoch": 5783} {"train_loss": -27.225126266479492, "global_step": 480032, "epoch": 5783} {"train_loss": -27.430999755859375, "global_step": 480033, "epoch": 5783} {"train_loss": -27.363483428955078, "global_step": 480034, "epoch": 5783} {"train_loss": -26.92487144470215, "global_step": 480035, "epoch": 5783} {"train_loss": -27.118173599243164, "global_step": 480036, "epoch": 5783} {"train_loss": -27.214786529541016, "global_step": 480037, "epoch": 5783} {"train_loss": -27.24116325378418, "global_step": 480038, "epoch": 5783} {"train_loss": -27.753400802612305, "global_step": 480039, "epoch": 5783} {"train_loss": -27.34064292907715, "global_step": 480040, "epoch": 5783} {"train_loss": -27.39156150817871, "global_step": 480041, "epoch": 5783} {"train_loss": -27.54451560974121, "global_step": 480042, "epoch": 5783} {"train_loss": -27.436416625976562, "global_step": 480043, "epoch": 5783} {"train_loss": -27.6463623046875, "global_step": 480044, "epoch": 5783} {"train_loss": -27.45401382446289, "global_step": 480045, "epoch": 5783} {"train_loss": -27.46087646484375, "global_step": 480046, "epoch": 5783} {"train_loss": -27.294559478759766, "global_step": 480047, "epoch": 5783} {"train_loss": -27.751419067382812, "global_step": 480048, "epoch": 5783} {"train_loss": -27.655689239501953, "global_step": 480049, "epoch": 5783} {"train_loss": -27.704059600830078, "global_step": 480050, "epoch": 5783} {"train_loss": -27.203983306884766, "global_step": 480051, "epoch": 5783} {"train_loss": -27.458316802978516, "global_step": 480052, "epoch": 5783} {"train_loss": -27.37299919128418, "global_step": 480053, "epoch": 5783} {"train_loss": -27.555957794189453, "global_step": 480054, "epoch": 5783} {"train_loss": -27.801862716674805, "global_step": 480055, "epoch": 5783} {"train_loss": -27.453601837158203, "global_step": 480056, "epoch": 5783} {"train_loss": -27.444217681884766, "global_step": 480057, "epoch": 5783} {"train_loss": -26.69708251953125, "global_step": 480058, "epoch": 5783} {"train_loss": -26.665542602539062, "global_step": 480059, "epoch": 5783} {"train_loss": -26.144744873046875, "global_step": 480060, "epoch": 5783} {"train_loss": -25.834875106811523, "global_step": 480061, "epoch": 5783} {"train_loss": -26.70582389831543, "global_step": 480062, "epoch": 5783} {"train_loss": -27.290815353393555, "global_step": 480063, "epoch": 5783} {"train_loss": -26.881765365600586, "global_step": 480064, "epoch": 5783} {"train_loss": -27.2050724029541, "global_step": 480065, "epoch": 5783} {"train_loss": -26.89597511291504, "global_step": 480066, "epoch": 5783} {"train_loss": -26.82755470275879, "global_step": 480067, "epoch": 5783} {"train_loss": -26.62909507751465, "global_step": 480068, "epoch": 5783} {"train_loss": -27.37396812438965, "global_step": 480069, "epoch": 5783} {"train_loss": -27.282575607299805, "global_step": 480070, "epoch": 5783} {"train_loss": -27.075273398893426, "global_step": 480071, "epoch": 5783, "val_loss": 6611375.0} {"train_loss": -26.517419815063477, "global_step": 480072, "epoch": 5784} {"train_loss": -26.66080665588379, "global_step": 480073, "epoch": 5784} {"train_loss": -26.773725509643555, "global_step": 480074, "epoch": 5784} {"train_loss": -26.6355037689209, "global_step": 480075, "epoch": 5784} {"train_loss": -26.033254623413086, "global_step": 480076, "epoch": 5784} {"train_loss": -27.142292022705078, "global_step": 480077, "epoch": 5784} {"train_loss": -27.283132553100586, "global_step": 480078, "epoch": 5784} {"train_loss": -26.559900283813477, "global_step": 480079, "epoch": 5784} {"train_loss": -26.741291046142578, "global_step": 480080, "epoch": 5784} {"train_loss": -26.8062744140625, "global_step": 480081, "epoch": 5784} {"train_loss": -26.91611099243164, "global_step": 480082, "epoch": 5784} {"train_loss": -27.035104751586914, "global_step": 480083, "epoch": 5784} {"train_loss": -26.649188995361328, "global_step": 480084, "epoch": 5784} {"train_loss": -27.09242820739746, "global_step": 480085, "epoch": 5784} {"train_loss": -26.63248634338379, "global_step": 480086, "epoch": 5784} {"train_loss": -27.593494415283203, "global_step": 480087, "epoch": 5784} {"train_loss": -26.961843490600586, "global_step": 480088, "epoch": 5784} {"train_loss": -27.402679443359375, "global_step": 480089, "epoch": 5784} {"train_loss": -27.51324462890625, "global_step": 480090, "epoch": 5784} {"train_loss": -26.788604736328125, "global_step": 480091, "epoch": 5784} {"train_loss": -27.37369728088379, "global_step": 480092, "epoch": 5784} {"train_loss": -27.44476890563965, "global_step": 480093, "epoch": 5784} {"train_loss": -27.319854736328125, "global_step": 480094, "epoch": 5784} {"train_loss": -26.99014663696289, "global_step": 480095, "epoch": 5784} {"train_loss": -26.856985092163086, "global_step": 480096, "epoch": 5784} {"train_loss": -27.180265426635742, "global_step": 480097, "epoch": 5784} {"train_loss": -27.245264053344727, "global_step": 480098, "epoch": 5784} {"train_loss": -27.44856834411621, "global_step": 480099, "epoch": 5784} {"train_loss": -27.246723175048828, "global_step": 480100, "epoch": 5784} {"train_loss": -27.506616592407227, "global_step": 480101, "epoch": 5784} {"train_loss": -27.462604522705078, "global_step": 480102, "epoch": 5784} {"train_loss": -27.38413429260254, "global_step": 480103, "epoch": 5784} {"train_loss": -27.782682418823242, "global_step": 480104, "epoch": 5784} {"train_loss": -27.18340492248535, "global_step": 480105, "epoch": 5784} {"train_loss": -27.199682235717773, "global_step": 480106, "epoch": 5784} {"train_loss": -27.48463249206543, "global_step": 480107, "epoch": 5784} {"train_loss": -27.111066818237305, "global_step": 480108, "epoch": 5784} {"train_loss": -27.028024673461914, "global_step": 480109, "epoch": 5784} {"train_loss": -27.24384880065918, "global_step": 480110, "epoch": 5784} {"train_loss": -27.100854873657227, "global_step": 480111, "epoch": 5784} {"train_loss": -27.354948043823242, "global_step": 480112, "epoch": 5784} {"train_loss": -27.105703353881836, "global_step": 480113, "epoch": 5784} {"train_loss": -27.428451538085938, "global_step": 480114, "epoch": 5784} {"train_loss": -27.273839950561523, "global_step": 480115, "epoch": 5784} {"train_loss": -27.353912353515625, "global_step": 480116, "epoch": 5784} {"train_loss": -27.65181541442871, "global_step": 480117, "epoch": 5784} {"train_loss": -27.490873336791992, "global_step": 480118, "epoch": 5784} {"train_loss": -27.520008087158203, "global_step": 480119, "epoch": 5784} {"train_loss": -27.529653549194336, "global_step": 480120, "epoch": 5784} {"train_loss": -27.693708419799805, "global_step": 480121, "epoch": 5784} {"train_loss": -27.548892974853516, "global_step": 480122, "epoch": 5784} {"train_loss": -27.53045082092285, "global_step": 480123, "epoch": 5784} {"train_loss": -27.330671310424805, "global_step": 480124, "epoch": 5784} {"train_loss": -27.4409236907959, "global_step": 480125, "epoch": 5784} {"train_loss": -27.629638671875, "global_step": 480126, "epoch": 5784} {"train_loss": -27.327163696289062, "global_step": 480127, "epoch": 5784} {"train_loss": -27.2912654876709, "global_step": 480128, "epoch": 5784} {"train_loss": -27.336423873901367, "global_step": 480129, "epoch": 5784} {"train_loss": -27.593557357788086, "global_step": 480130, "epoch": 5784} {"train_loss": -27.4483699798584, "global_step": 480131, "epoch": 5784} {"train_loss": -27.293058395385742, "global_step": 480132, "epoch": 5784} {"train_loss": -27.30756187438965, "global_step": 480133, "epoch": 5784} {"train_loss": -26.82321548461914, "global_step": 480134, "epoch": 5784} {"train_loss": -26.9124755859375, "global_step": 480135, "epoch": 5784} {"train_loss": -26.98480796813965, "global_step": 480136, "epoch": 5784} {"train_loss": -27.144453048706055, "global_step": 480137, "epoch": 5784} {"train_loss": -26.945693969726562, "global_step": 480138, "epoch": 5784} {"train_loss": -27.155750274658203, "global_step": 480139, "epoch": 5784} {"train_loss": -27.335309982299805, "global_step": 480140, "epoch": 5784} {"train_loss": -27.775815963745117, "global_step": 480141, "epoch": 5784} {"train_loss": -27.372577667236328, "global_step": 480142, "epoch": 5784} {"train_loss": -26.6995792388916, "global_step": 480143, "epoch": 5784} {"train_loss": -27.208148956298828, "global_step": 480144, "epoch": 5784} {"train_loss": -27.063373565673828, "global_step": 480145, "epoch": 5784} {"train_loss": -26.98701286315918, "global_step": 480146, "epoch": 5784} {"train_loss": -27.28388023376465, "global_step": 480147, "epoch": 5784} {"train_loss": -27.49688148498535, "global_step": 480148, "epoch": 5784} {"train_loss": -26.95460319519043, "global_step": 480149, "epoch": 5784} {"train_loss": -27.17801284790039, "global_step": 480150, "epoch": 5784} {"train_loss": -27.18892478942871, "global_step": 480151, "epoch": 5784} {"train_loss": -27.363758087158203, "global_step": 480152, "epoch": 5784} {"train_loss": -27.64569091796875, "global_step": 480153, "epoch": 5784} {"train_loss": -27.20509979523808, "global_step": 480154, "epoch": 5784, "val_loss": 6637212.0} {"train_loss": -26.963348388671875, "global_step": 480155, "epoch": 5785} {"train_loss": -26.4290828704834, "global_step": 480156, "epoch": 5785} {"train_loss": -26.985523223876953, "global_step": 480157, "epoch": 5785} {"train_loss": -26.826562881469727, "global_step": 480158, "epoch": 5785} {"train_loss": -26.97175407409668, "global_step": 480159, "epoch": 5785} {"train_loss": -26.89691162109375, "global_step": 480160, "epoch": 5785} {"train_loss": -26.948516845703125, "global_step": 480161, "epoch": 5785} {"train_loss": -27.016651153564453, "global_step": 480162, "epoch": 5785} {"train_loss": -26.97688102722168, "global_step": 480163, "epoch": 5785} {"train_loss": -26.9630184173584, "global_step": 480164, "epoch": 5785} {"train_loss": -27.225509643554688, "global_step": 480165, "epoch": 5785} {"train_loss": -27.00996208190918, "global_step": 480166, "epoch": 5785} {"train_loss": -26.4798526763916, "global_step": 480167, "epoch": 5785} {"train_loss": -27.04305076599121, "global_step": 480168, "epoch": 5785} {"train_loss": -27.160314559936523, "global_step": 480169, "epoch": 5785} {"train_loss": -26.72584342956543, "global_step": 480170, "epoch": 5785} {"train_loss": -27.329986572265625, "global_step": 480171, "epoch": 5785} {"train_loss": -27.202838897705078, "global_step": 480172, "epoch": 5785} {"train_loss": -27.57724380493164, "global_step": 480173, "epoch": 5785} {"train_loss": -27.244977951049805, "global_step": 480174, "epoch": 5785} {"train_loss": -27.127553939819336, "global_step": 480175, "epoch": 5785} {"train_loss": -27.293909072875977, "global_step": 480176, "epoch": 5785} {"train_loss": -27.420673370361328, "global_step": 480177, "epoch": 5785} {"train_loss": -26.924591064453125, "global_step": 480178, "epoch": 5785} {"train_loss": -27.353452682495117, "global_step": 480179, "epoch": 5785} {"train_loss": -27.406370162963867, "global_step": 480180, "epoch": 5785} {"train_loss": -26.792898178100586, "global_step": 480181, "epoch": 5785} {"train_loss": -27.46253776550293, "global_step": 480182, "epoch": 5785} {"train_loss": -27.463336944580078, "global_step": 480183, "epoch": 5785} {"train_loss": -27.191808700561523, "global_step": 480184, "epoch": 5785} {"train_loss": -27.49542808532715, "global_step": 480185, "epoch": 5785} {"train_loss": -27.230981826782227, "global_step": 480186, "epoch": 5785} {"train_loss": -27.40595054626465, "global_step": 480187, "epoch": 5785} {"train_loss": -27.258615493774414, "global_step": 480188, "epoch": 5785} {"train_loss": -27.601423263549805, "global_step": 480189, "epoch": 5785} {"train_loss": -27.450101852416992, "global_step": 480190, "epoch": 5785} {"train_loss": -27.40949058532715, "global_step": 480191, "epoch": 5785} {"train_loss": -27.49732780456543, "global_step": 480192, "epoch": 5785} {"train_loss": -27.45633888244629, "global_step": 480193, "epoch": 5785} {"train_loss": -27.666955947875977, "global_step": 480194, "epoch": 5785} {"train_loss": -27.31904411315918, "global_step": 480195, "epoch": 5785} {"train_loss": -27.60093116760254, "global_step": 480196, "epoch": 5785} {"train_loss": -27.017377853393555, "global_step": 480197, "epoch": 5785} {"train_loss": -27.29631996154785, "global_step": 480198, "epoch": 5785} {"train_loss": -27.21702003479004, "global_step": 480199, "epoch": 5785} {"train_loss": -27.41802406311035, "global_step": 480200, "epoch": 5785} {"train_loss": -27.6314697265625, "global_step": 480201, "epoch": 5785} {"train_loss": -27.19964599609375, "global_step": 480202, "epoch": 5785} {"train_loss": -27.322818756103516, "global_step": 480203, "epoch": 5785} {"train_loss": -27.4145450592041, "global_step": 480204, "epoch": 5785} {"train_loss": -27.27680778503418, "global_step": 480205, "epoch": 5785} {"train_loss": -27.48943519592285, "global_step": 480206, "epoch": 5785} {"train_loss": -27.55032730102539, "global_step": 480207, "epoch": 5785} {"train_loss": -27.29731559753418, "global_step": 480208, "epoch": 5785} {"train_loss": -27.171762466430664, "global_step": 480209, "epoch": 5785} {"train_loss": -27.41400718688965, "global_step": 480210, "epoch": 5785} {"train_loss": -27.316659927368164, "global_step": 480211, "epoch": 5785} {"train_loss": -27.25653076171875, "global_step": 480212, "epoch": 5785} {"train_loss": -27.274831771850586, "global_step": 480213, "epoch": 5785} {"train_loss": -27.439746856689453, "global_step": 480214, "epoch": 5785} {"train_loss": -27.789413452148438, "global_step": 480215, "epoch": 5785} {"train_loss": -27.14487075805664, "global_step": 480216, "epoch": 5785} {"train_loss": -27.186304092407227, "global_step": 480217, "epoch": 5785} {"train_loss": -26.938383102416992, "global_step": 480218, "epoch": 5785} {"train_loss": -27.447275161743164, "global_step": 480219, "epoch": 5785} {"train_loss": -27.3935546875, "global_step": 480220, "epoch": 5785} {"train_loss": -27.26837730407715, "global_step": 480221, "epoch": 5785} {"train_loss": -27.15972328186035, "global_step": 480222, "epoch": 5785} {"train_loss": -27.400915145874023, "global_step": 480223, "epoch": 5785} {"train_loss": -27.3113956451416, "global_step": 480224, "epoch": 5785} {"train_loss": -27.459497451782227, "global_step": 480225, "epoch": 5785} {"train_loss": -27.61324119567871, "global_step": 480226, "epoch": 5785} {"train_loss": -27.4578800201416, "global_step": 480227, "epoch": 5785} {"train_loss": -27.38336753845215, "global_step": 480228, "epoch": 5785} {"train_loss": -27.595977783203125, "global_step": 480229, "epoch": 5785} {"train_loss": -27.25502586364746, "global_step": 480230, "epoch": 5785} {"train_loss": -27.203577041625977, "global_step": 480231, "epoch": 5785} {"train_loss": -27.46677589416504, "global_step": 480232, "epoch": 5785} {"train_loss": -27.2835636138916, "global_step": 480233, "epoch": 5785} {"train_loss": -27.016712188720703, "global_step": 480234, "epoch": 5785} {"train_loss": -27.23665428161621, "global_step": 480235, "epoch": 5785} {"train_loss": -27.13543701171875, "global_step": 480236, "epoch": 5785} {"train_loss": -27.262215258127235, "global_step": 480237, "epoch": 5785, "val_loss": 6630625.5} {"train_loss": -26.552474975585938, "global_step": 480238, "epoch": 5786} {"train_loss": -25.82110023498535, "global_step": 480239, "epoch": 5786} {"train_loss": -25.855016708374023, "global_step": 480240, "epoch": 5786} {"train_loss": -26.719385147094727, "global_step": 480241, "epoch": 5786} {"train_loss": -26.028501510620117, "global_step": 480242, "epoch": 5786} {"train_loss": -26.622678756713867, "global_step": 480243, "epoch": 5786} {"train_loss": -26.475168228149414, "global_step": 480244, "epoch": 5786} {"train_loss": -26.493112564086914, "global_step": 480245, "epoch": 5786} {"train_loss": -26.59797477722168, "global_step": 480246, "epoch": 5786} {"train_loss": -26.427143096923828, "global_step": 480247, "epoch": 5786} {"train_loss": -26.844831466674805, "global_step": 480248, "epoch": 5786} {"train_loss": -26.662214279174805, "global_step": 480249, "epoch": 5786} {"train_loss": -26.87544822692871, "global_step": 480250, "epoch": 5786} {"train_loss": -27.000106811523438, "global_step": 480251, "epoch": 5786} {"train_loss": -26.759687423706055, "global_step": 480252, "epoch": 5786} {"train_loss": -26.79062843322754, "global_step": 480253, "epoch": 5786} {"train_loss": -27.017902374267578, "global_step": 480254, "epoch": 5786} {"train_loss": -26.99355125427246, "global_step": 480255, "epoch": 5786} {"train_loss": -26.951013565063477, "global_step": 480256, "epoch": 5786} {"train_loss": -27.048940658569336, "global_step": 480257, "epoch": 5786} {"train_loss": -27.234907150268555, "global_step": 480258, "epoch": 5786} {"train_loss": -26.921674728393555, "global_step": 480259, "epoch": 5786} {"train_loss": -27.216266632080078, "global_step": 480260, "epoch": 5786} {"train_loss": -27.083667755126953, "global_step": 480261, "epoch": 5786} {"train_loss": -27.116439819335938, "global_step": 480262, "epoch": 5786} {"train_loss": -27.504453659057617, "global_step": 480263, "epoch": 5786} {"train_loss": -27.253759384155273, "global_step": 480264, "epoch": 5786} {"train_loss": -27.056781768798828, "global_step": 480265, "epoch": 5786} {"train_loss": -27.195892333984375, "global_step": 480266, "epoch": 5786} {"train_loss": -27.08212661743164, "global_step": 480267, "epoch": 5786} {"train_loss": -27.010602951049805, "global_step": 480268, "epoch": 5786} {"train_loss": -27.152847290039062, "global_step": 480269, "epoch": 5786} {"train_loss": -27.090911865234375, "global_step": 480270, "epoch": 5786} {"train_loss": -26.703893661499023, "global_step": 480271, "epoch": 5786} {"train_loss": -26.99543571472168, "global_step": 480272, "epoch": 5786} {"train_loss": -27.147253036499023, "global_step": 480273, "epoch": 5786} {"train_loss": -27.063617706298828, "global_step": 480274, "epoch": 5786} {"train_loss": -27.13884925842285, "global_step": 480275, "epoch": 5786} {"train_loss": -27.304162979125977, "global_step": 480276, "epoch": 5786} {"train_loss": -27.225082397460938, "global_step": 480277, "epoch": 5786} {"train_loss": -27.086017608642578, "global_step": 480278, "epoch": 5786} {"train_loss": -26.75055503845215, "global_step": 480279, "epoch": 5786} {"train_loss": -27.102188110351562, "global_step": 480280, "epoch": 5786} {"train_loss": -27.609058380126953, "global_step": 480281, "epoch": 5786} {"train_loss": -27.14961051940918, "global_step": 480282, "epoch": 5786} {"train_loss": -27.201642990112305, "global_step": 480283, "epoch": 5786} {"train_loss": -27.601551055908203, "global_step": 480284, "epoch": 5786} {"train_loss": -26.85150718688965, "global_step": 480285, "epoch": 5786} {"train_loss": -26.760791778564453, "global_step": 480286, "epoch": 5786} {"train_loss": -27.406949996948242, "global_step": 480287, "epoch": 5786} {"train_loss": -27.299774169921875, "global_step": 480288, "epoch": 5786} {"train_loss": -27.21979331970215, "global_step": 480289, "epoch": 5786} {"train_loss": -27.331857681274414, "global_step": 480290, "epoch": 5786} {"train_loss": -27.71253776550293, "global_step": 480291, "epoch": 5786} {"train_loss": -27.36334228515625, "global_step": 480292, "epoch": 5786} {"train_loss": -26.918542861938477, "global_step": 480293, "epoch": 5786} {"train_loss": -27.229293823242188, "global_step": 480294, "epoch": 5786} {"train_loss": -27.109647750854492, "global_step": 480295, "epoch": 5786} {"train_loss": -27.407917022705078, "global_step": 480296, "epoch": 5786} {"train_loss": -27.325687408447266, "global_step": 480297, "epoch": 5786} {"train_loss": -26.906179428100586, "global_step": 480298, "epoch": 5786} {"train_loss": -27.426166534423828, "global_step": 480299, "epoch": 5786} {"train_loss": -26.964452743530273, "global_step": 480300, "epoch": 5786} {"train_loss": -27.35137939453125, "global_step": 480301, "epoch": 5786} {"train_loss": -27.378767013549805, "global_step": 480302, "epoch": 5786} {"train_loss": -27.554346084594727, "global_step": 480303, "epoch": 5786} {"train_loss": -27.047943115234375, "global_step": 480304, "epoch": 5786} {"train_loss": -26.892248153686523, "global_step": 480305, "epoch": 5786} {"train_loss": -26.959136962890625, "global_step": 480306, "epoch": 5786} {"train_loss": -27.2462158203125, "global_step": 480307, "epoch": 5786} {"train_loss": -27.17898941040039, "global_step": 480308, "epoch": 5786} {"train_loss": -27.479001998901367, "global_step": 480309, "epoch": 5786} {"train_loss": -27.39666175842285, "global_step": 480310, "epoch": 5786} {"train_loss": -27.01490592956543, "global_step": 480311, "epoch": 5786} {"train_loss": -27.585575103759766, "global_step": 480312, "epoch": 5786} {"train_loss": -27.243513107299805, "global_step": 480313, "epoch": 5786} {"train_loss": -27.18916130065918, "global_step": 480314, "epoch": 5786} {"train_loss": -27.36798095703125, "global_step": 480315, "epoch": 5786} {"train_loss": -27.31622314453125, "global_step": 480316, "epoch": 5786} {"train_loss": -27.431913375854492, "global_step": 480317, "epoch": 5786} {"train_loss": -27.513477325439453, "global_step": 480318, "epoch": 5786} {"train_loss": -27.141788482666016, "global_step": 480319, "epoch": 5786} {"train_loss": -27.055255361350184, "global_step": 480320, "epoch": 5786, "val_loss": 6590195.5} {"train_loss": -27.1527099609375, "global_step": 480321, "epoch": 5787} {"train_loss": -27.3677921295166, "global_step": 480322, "epoch": 5787} {"train_loss": -27.202136993408203, "global_step": 480323, "epoch": 5787} {"train_loss": -26.80877113342285, "global_step": 480324, "epoch": 5787} {"train_loss": -26.82976722717285, "global_step": 480325, "epoch": 5787} {"train_loss": -26.665857315063477, "global_step": 480326, "epoch": 5787} {"train_loss": -26.830493927001953, "global_step": 480327, "epoch": 5787} {"train_loss": -27.542341232299805, "global_step": 480328, "epoch": 5787} {"train_loss": -26.972156524658203, "global_step": 480329, "epoch": 5787} {"train_loss": -27.20876121520996, "global_step": 480330, "epoch": 5787} {"train_loss": -27.249658584594727, "global_step": 480331, "epoch": 5787} {"train_loss": -27.386646270751953, "global_step": 480332, "epoch": 5787} {"train_loss": -26.62384605407715, "global_step": 480333, "epoch": 5787} {"train_loss": -26.8631591796875, "global_step": 480334, "epoch": 5787} {"train_loss": -27.16009521484375, "global_step": 480335, "epoch": 5787} {"train_loss": -27.517919540405273, "global_step": 480336, "epoch": 5787} {"train_loss": -27.079193115234375, "global_step": 480337, "epoch": 5787} {"train_loss": -27.314605712890625, "global_step": 480338, "epoch": 5787} {"train_loss": -27.029998779296875, "global_step": 480339, "epoch": 5787} {"train_loss": -27.222583770751953, "global_step": 480340, "epoch": 5787} {"train_loss": -26.742660522460938, "global_step": 480341, "epoch": 5787} {"train_loss": -27.02166175842285, "global_step": 480342, "epoch": 5787} {"train_loss": -26.456470489501953, "global_step": 480343, "epoch": 5787} {"train_loss": -27.186416625976562, "global_step": 480344, "epoch": 5787} {"train_loss": -26.715505599975586, "global_step": 480345, "epoch": 5787} {"train_loss": -27.0161075592041, "global_step": 480346, "epoch": 5787} {"train_loss": -27.36212158203125, "global_step": 480347, "epoch": 5787} {"train_loss": -26.73858070373535, "global_step": 480348, "epoch": 5787} {"train_loss": -27.374317169189453, "global_step": 480349, "epoch": 5787} {"train_loss": -27.160205841064453, "global_step": 480350, "epoch": 5787} {"train_loss": -27.239614486694336, "global_step": 480351, "epoch": 5787} {"train_loss": -27.069305419921875, "global_step": 480352, "epoch": 5787} {"train_loss": -27.432722091674805, "global_step": 480353, "epoch": 5787} {"train_loss": -27.174692153930664, "global_step": 480354, "epoch": 5787} {"train_loss": -27.108184814453125, "global_step": 480355, "epoch": 5787} {"train_loss": -27.29905128479004, "global_step": 480356, "epoch": 5787} {"train_loss": -27.195531845092773, "global_step": 480357, "epoch": 5787} {"train_loss": -27.490158081054688, "global_step": 480358, "epoch": 5787} {"train_loss": -27.405378341674805, "global_step": 480359, "epoch": 5787} {"train_loss": -27.41180992126465, "global_step": 480360, "epoch": 5787} {"train_loss": -26.89861488342285, "global_step": 480361, "epoch": 5787} {"train_loss": -27.321542739868164, "global_step": 480362, "epoch": 5787} {"train_loss": -26.984359741210938, "global_step": 480363, "epoch": 5787} {"train_loss": -27.1859188079834, "global_step": 480364, "epoch": 5787} {"train_loss": -27.26459312438965, "global_step": 480365, "epoch": 5787} {"train_loss": -27.3311710357666, "global_step": 480366, "epoch": 5787} {"train_loss": -27.150390625, "global_step": 480367, "epoch": 5787} {"train_loss": -27.3797664642334, "global_step": 480368, "epoch": 5787} {"train_loss": -27.016077041625977, "global_step": 480369, "epoch": 5787} {"train_loss": -27.567548751831055, "global_step": 480370, "epoch": 5787} {"train_loss": -27.17561149597168, "global_step": 480371, "epoch": 5787} {"train_loss": -26.930078506469727, "global_step": 480372, "epoch": 5787} {"train_loss": -27.303449630737305, "global_step": 480373, "epoch": 5787} {"train_loss": -26.971466064453125, "global_step": 480374, "epoch": 5787} {"train_loss": -27.17514991760254, "global_step": 480375, "epoch": 5787} {"train_loss": -27.2697811126709, "global_step": 480376, "epoch": 5787} {"train_loss": -26.922529220581055, "global_step": 480377, "epoch": 5787} {"train_loss": -27.6575870513916, "global_step": 480378, "epoch": 5787} {"train_loss": -27.430816650390625, "global_step": 480379, "epoch": 5787} {"train_loss": -27.54804039001465, "global_step": 480380, "epoch": 5787} {"train_loss": -27.514362335205078, "global_step": 480381, "epoch": 5787} {"train_loss": -27.782934188842773, "global_step": 480382, "epoch": 5787} {"train_loss": -27.567188262939453, "global_step": 480383, "epoch": 5787} {"train_loss": -27.474206924438477, "global_step": 480384, "epoch": 5787} {"train_loss": -28.123626708984375, "global_step": 480385, "epoch": 5787} {"train_loss": -27.718158721923828, "global_step": 480386, "epoch": 5787} {"train_loss": -27.372705459594727, "global_step": 480387, "epoch": 5787} {"train_loss": -27.300338745117188, "global_step": 480388, "epoch": 5787} {"train_loss": -27.651609420776367, "global_step": 480389, "epoch": 5787} {"train_loss": -27.515039443969727, "global_step": 480390, "epoch": 5787} {"train_loss": -27.627216339111328, "global_step": 480391, "epoch": 5787} {"train_loss": -27.358488082885742, "global_step": 480392, "epoch": 5787} {"train_loss": -27.489582061767578, "global_step": 480393, "epoch": 5787} {"train_loss": -27.373266220092773, "global_step": 480394, "epoch": 5787} {"train_loss": -27.51654052734375, "global_step": 480395, "epoch": 5787} {"train_loss": -27.23811149597168, "global_step": 480396, "epoch": 5787} {"train_loss": -27.31879997253418, "global_step": 480397, "epoch": 5787} {"train_loss": -27.350238800048828, "global_step": 480398, "epoch": 5787} {"train_loss": -27.489301681518555, "global_step": 480399, "epoch": 5787} {"train_loss": -27.3049259185791, "global_step": 480400, "epoch": 5787} {"train_loss": -27.242727279663086, "global_step": 480401, "epoch": 5787} {"train_loss": -27.291532516479492, "global_step": 480402, "epoch": 5787} {"train_loss": -27.225827412432935, "global_step": 480403, "epoch": 5787, "val_loss": 6516127.0} {"train_loss": -26.888639450073242, "global_step": 480404, "epoch": 5788} {"train_loss": -25.966367721557617, "global_step": 480405, "epoch": 5788} {"train_loss": -26.546695709228516, "global_step": 480406, "epoch": 5788} {"train_loss": -26.452743530273438, "global_step": 480407, "epoch": 5788} {"train_loss": -26.284515380859375, "global_step": 480408, "epoch": 5788} {"train_loss": -26.964929580688477, "global_step": 480409, "epoch": 5788} {"train_loss": -27.133529663085938, "global_step": 480410, "epoch": 5788} {"train_loss": -26.5101318359375, "global_step": 480411, "epoch": 5788} {"train_loss": -26.3753662109375, "global_step": 480412, "epoch": 5788} {"train_loss": -26.360519409179688, "global_step": 480413, "epoch": 5788} {"train_loss": -26.205768585205078, "global_step": 480414, "epoch": 5788} {"train_loss": -25.925098419189453, "global_step": 480415, "epoch": 5788} {"train_loss": -26.484272003173828, "global_step": 480416, "epoch": 5788} {"train_loss": -26.690881729125977, "global_step": 480417, "epoch": 5788} {"train_loss": -27.187301635742188, "global_step": 480418, "epoch": 5788} {"train_loss": -26.62456703186035, "global_step": 480419, "epoch": 5788} {"train_loss": -27.137348175048828, "global_step": 480420, "epoch": 5788} {"train_loss": -26.703367233276367, "global_step": 480421, "epoch": 5788} {"train_loss": -26.939868927001953, "global_step": 480422, "epoch": 5788} {"train_loss": -27.411945343017578, "global_step": 480423, "epoch": 5788} {"train_loss": -26.812713623046875, "global_step": 480424, "epoch": 5788} {"train_loss": -27.081506729125977, "global_step": 480425, "epoch": 5788} {"train_loss": -27.077489852905273, "global_step": 480426, "epoch": 5788} {"train_loss": -27.077905654907227, "global_step": 480427, "epoch": 5788} {"train_loss": -27.189558029174805, "global_step": 480428, "epoch": 5788} {"train_loss": -27.00099754333496, "global_step": 480429, "epoch": 5788} {"train_loss": -27.339075088500977, "global_step": 480430, "epoch": 5788} {"train_loss": -26.946496963500977, "global_step": 480431, "epoch": 5788} {"train_loss": -27.295379638671875, "global_step": 480432, "epoch": 5788} {"train_loss": -27.236249923706055, "global_step": 480433, "epoch": 5788} {"train_loss": -27.59039306640625, "global_step": 480434, "epoch": 5788} {"train_loss": -27.186437606811523, "global_step": 480435, "epoch": 5788} {"train_loss": -27.198362350463867, "global_step": 480436, "epoch": 5788} {"train_loss": -27.51995849609375, "global_step": 480437, "epoch": 5788} {"train_loss": -27.552997589111328, "global_step": 480438, "epoch": 5788} {"train_loss": -27.459671020507812, "global_step": 480439, "epoch": 5788} {"train_loss": -27.51898765563965, "global_step": 480440, "epoch": 5788} {"train_loss": -27.642581939697266, "global_step": 480441, "epoch": 5788} {"train_loss": -27.3803768157959, "global_step": 480442, "epoch": 5788} {"train_loss": -27.39971351623535, "global_step": 480443, "epoch": 5788} {"train_loss": -27.209638595581055, "global_step": 480444, "epoch": 5788} {"train_loss": -27.2553653717041, "global_step": 480445, "epoch": 5788} {"train_loss": -27.397464752197266, "global_step": 480446, "epoch": 5788} {"train_loss": -27.3173770904541, "global_step": 480447, "epoch": 5788} {"train_loss": -27.134143829345703, "global_step": 480448, "epoch": 5788} {"train_loss": -27.219022750854492, "global_step": 480449, "epoch": 5788} {"train_loss": -27.21265983581543, "global_step": 480450, "epoch": 5788} {"train_loss": -27.740690231323242, "global_step": 480451, "epoch": 5788} {"train_loss": -27.408294677734375, "global_step": 480452, "epoch": 5788} {"train_loss": -27.63640785217285, "global_step": 480453, "epoch": 5788} {"train_loss": -27.455198287963867, "global_step": 480454, "epoch": 5788} {"train_loss": -26.94524574279785, "global_step": 480455, "epoch": 5788} {"train_loss": -27.549713134765625, "global_step": 480456, "epoch": 5788} {"train_loss": -27.41753578186035, "global_step": 480457, "epoch": 5788} {"train_loss": -27.337427139282227, "global_step": 480458, "epoch": 5788} {"train_loss": -27.12703514099121, "global_step": 480459, "epoch": 5788} {"train_loss": -27.411497116088867, "global_step": 480460, "epoch": 5788} {"train_loss": -28.092731475830078, "global_step": 480461, "epoch": 5788} {"train_loss": -27.31782341003418, "global_step": 480462, "epoch": 5788} {"train_loss": -27.552087783813477, "global_step": 480463, "epoch": 5788} {"train_loss": -27.381820678710938, "global_step": 480464, "epoch": 5788} {"train_loss": -27.7595272064209, "global_step": 480465, "epoch": 5788} {"train_loss": -27.23843765258789, "global_step": 480466, "epoch": 5788} {"train_loss": -27.324888229370117, "global_step": 480467, "epoch": 5788} {"train_loss": -27.134429931640625, "global_step": 480468, "epoch": 5788} {"train_loss": -27.495681762695312, "global_step": 480469, "epoch": 5788} {"train_loss": -27.2401065826416, "global_step": 480470, "epoch": 5788} {"train_loss": -26.89657974243164, "global_step": 480471, "epoch": 5788} {"train_loss": -27.184783935546875, "global_step": 480472, "epoch": 5788} {"train_loss": -27.590988159179688, "global_step": 480473, "epoch": 5788} {"train_loss": -27.363645553588867, "global_step": 480474, "epoch": 5788} {"train_loss": -27.274795532226562, "global_step": 480475, "epoch": 5788} {"train_loss": -27.38787841796875, "global_step": 480476, "epoch": 5788} {"train_loss": -26.9788761138916, "global_step": 480477, "epoch": 5788} {"train_loss": -27.24799156188965, "global_step": 480478, "epoch": 5788} {"train_loss": -26.813180923461914, "global_step": 480479, "epoch": 5788} {"train_loss": -26.42783546447754, "global_step": 480480, "epoch": 5788} {"train_loss": -26.09513282775879, "global_step": 480481, "epoch": 5788} {"train_loss": -25.2661075592041, "global_step": 480482, "epoch": 5788} {"train_loss": -26.385061264038086, "global_step": 480483, "epoch": 5788} {"train_loss": -27.057981491088867, "global_step": 480484, "epoch": 5788} {"train_loss": -26.39859390258789, "global_step": 480485, "epoch": 5788} {"train_loss": -27.056853903345313, "global_step": 480486, "epoch": 5788, "val_loss": 6523467.5} {"train_loss": -26.1655330657959, "global_step": 480487, "epoch": 5789} {"train_loss": -25.89576530456543, "global_step": 480488, "epoch": 5789} {"train_loss": -26.950483322143555, "global_step": 480489, "epoch": 5789} {"train_loss": -26.084430694580078, "global_step": 480490, "epoch": 5789} {"train_loss": -26.899938583374023, "global_step": 480491, "epoch": 5789} {"train_loss": -26.721120834350586, "global_step": 480492, "epoch": 5789} {"train_loss": -26.625707626342773, "global_step": 480493, "epoch": 5789} {"train_loss": -26.59522819519043, "global_step": 480494, "epoch": 5789} {"train_loss": -26.539718627929688, "global_step": 480495, "epoch": 5789} {"train_loss": -26.6976375579834, "global_step": 480496, "epoch": 5789} {"train_loss": -26.70379066467285, "global_step": 480497, "epoch": 5789} {"train_loss": -26.53021812438965, "global_step": 480498, "epoch": 5789} {"train_loss": -27.090255737304688, "global_step": 480499, "epoch": 5789} {"train_loss": -26.75941276550293, "global_step": 480500, "epoch": 5789} {"train_loss": -26.974365234375, "global_step": 480501, "epoch": 5789} {"train_loss": -27.013822555541992, "global_step": 480502, "epoch": 5789} {"train_loss": -26.95746421813965, "global_step": 480503, "epoch": 5789} {"train_loss": -26.9778995513916, "global_step": 480504, "epoch": 5789} {"train_loss": -26.917739868164062, "global_step": 480505, "epoch": 5789} {"train_loss": -26.8536434173584, "global_step": 480506, "epoch": 5789} {"train_loss": -27.24995231628418, "global_step": 480507, "epoch": 5789} {"train_loss": -26.82976722717285, "global_step": 480508, "epoch": 5789} {"train_loss": -26.88643455505371, "global_step": 480509, "epoch": 5789} {"train_loss": -27.11249351501465, "global_step": 480510, "epoch": 5789} {"train_loss": -26.927215576171875, "global_step": 480511, "epoch": 5789} {"train_loss": -27.074310302734375, "global_step": 480512, "epoch": 5789} {"train_loss": -26.824487686157227, "global_step": 480513, "epoch": 5789} {"train_loss": -27.365949630737305, "global_step": 480514, "epoch": 5789} {"train_loss": -26.996036529541016, "global_step": 480515, "epoch": 5789} {"train_loss": -27.080310821533203, "global_step": 480516, "epoch": 5789} {"train_loss": -26.937606811523438, "global_step": 480517, "epoch": 5789} {"train_loss": -27.342920303344727, "global_step": 480518, "epoch": 5789} {"train_loss": -27.037012100219727, "global_step": 480519, "epoch": 5789} {"train_loss": -27.298715591430664, "global_step": 480520, "epoch": 5789} {"train_loss": -27.32039451599121, "global_step": 480521, "epoch": 5789} {"train_loss": -27.562606811523438, "global_step": 480522, "epoch": 5789} {"train_loss": -27.06715202331543, "global_step": 480523, "epoch": 5789} {"train_loss": -27.321853637695312, "global_step": 480524, "epoch": 5789} {"train_loss": -27.502904891967773, "global_step": 480525, "epoch": 5789} {"train_loss": -27.13175392150879, "global_step": 480526, "epoch": 5789} {"train_loss": -27.704242706298828, "global_step": 480527, "epoch": 5789} {"train_loss": -27.201557159423828, "global_step": 480528, "epoch": 5789} {"train_loss": -27.495512008666992, "global_step": 480529, "epoch": 5789} {"train_loss": -27.126428604125977, "global_step": 480530, "epoch": 5789} {"train_loss": -27.5926570892334, "global_step": 480531, "epoch": 5789} {"train_loss": -27.448272705078125, "global_step": 480532, "epoch": 5789} {"train_loss": -27.547760009765625, "global_step": 480533, "epoch": 5789} {"train_loss": -27.084400177001953, "global_step": 480534, "epoch": 5789} {"train_loss": -27.694440841674805, "global_step": 480535, "epoch": 5789} {"train_loss": -27.17533302307129, "global_step": 480536, "epoch": 5789} {"train_loss": -27.700769424438477, "global_step": 480537, "epoch": 5789} {"train_loss": -27.4057674407959, "global_step": 480538, "epoch": 5789} {"train_loss": -27.46270179748535, "global_step": 480539, "epoch": 5789} {"train_loss": -27.42437171936035, "global_step": 480540, "epoch": 5789} {"train_loss": -27.498022079467773, "global_step": 480541, "epoch": 5789} {"train_loss": -26.992521286010742, "global_step": 480542, "epoch": 5789} {"train_loss": -27.492725372314453, "global_step": 480543, "epoch": 5789} {"train_loss": -27.514270782470703, "global_step": 480544, "epoch": 5789} {"train_loss": -27.20928382873535, "global_step": 480545, "epoch": 5789} {"train_loss": -27.199573516845703, "global_step": 480546, "epoch": 5789} {"train_loss": -27.42767906188965, "global_step": 480547, "epoch": 5789} {"train_loss": -27.608301162719727, "global_step": 480548, "epoch": 5789} {"train_loss": -27.175180435180664, "global_step": 480549, "epoch": 5789} {"train_loss": -27.75825309753418, "global_step": 480550, "epoch": 5789} {"train_loss": -27.106037139892578, "global_step": 480551, "epoch": 5789} {"train_loss": -27.433624267578125, "global_step": 480552, "epoch": 5789} {"train_loss": -27.384485244750977, "global_step": 480553, "epoch": 5789} {"train_loss": -27.52913475036621, "global_step": 480554, "epoch": 5789} {"train_loss": -27.203556060791016, "global_step": 480555, "epoch": 5789} {"train_loss": -27.262348175048828, "global_step": 480556, "epoch": 5789} {"train_loss": -27.472217559814453, "global_step": 480557, "epoch": 5789} {"train_loss": -27.881229400634766, "global_step": 480558, "epoch": 5789} {"train_loss": -27.440204620361328, "global_step": 480559, "epoch": 5789} {"train_loss": -27.076358795166016, "global_step": 480560, "epoch": 5789} {"train_loss": -27.24738883972168, "global_step": 480561, "epoch": 5789} {"train_loss": -27.414243698120117, "global_step": 480562, "epoch": 5789} {"train_loss": -26.959522247314453, "global_step": 480563, "epoch": 5789} {"train_loss": -27.358190536499023, "global_step": 480564, "epoch": 5789} {"train_loss": -26.98244285583496, "global_step": 480565, "epoch": 5789} {"train_loss": -27.350645065307617, "global_step": 480566, "epoch": 5789} {"train_loss": -27.095966339111328, "global_step": 480567, "epoch": 5789} {"train_loss": -26.768461227416992, "global_step": 480568, "epoch": 5789} {"train_loss": -27.134595089648144, "global_step": 480569, "epoch": 5789, "val_loss": 6585342.0} {"train_loss": -25.7004451751709, "global_step": 480570, "epoch": 5790} {"train_loss": -25.43568229675293, "global_step": 480571, "epoch": 5790} {"train_loss": -26.329015731811523, "global_step": 480572, "epoch": 5790} {"train_loss": -26.305862426757812, "global_step": 480573, "epoch": 5790} {"train_loss": -26.58935546875, "global_step": 480574, "epoch": 5790} {"train_loss": -26.140853881835938, "global_step": 480575, "epoch": 5790} {"train_loss": -26.689786911010742, "global_step": 480576, "epoch": 5790} {"train_loss": -26.813886642456055, "global_step": 480577, "epoch": 5790} {"train_loss": -26.964731216430664, "global_step": 480578, "epoch": 5790} {"train_loss": -27.091211318969727, "global_step": 480579, "epoch": 5790} {"train_loss": -26.863983154296875, "global_step": 480580, "epoch": 5790} {"train_loss": -27.141080856323242, "global_step": 480581, "epoch": 5790} {"train_loss": -27.407285690307617, "global_step": 480582, "epoch": 5790} {"train_loss": -27.161069869995117, "global_step": 480583, "epoch": 5790} {"train_loss": -26.610889434814453, "global_step": 480584, "epoch": 5790} {"train_loss": -26.962997436523438, "global_step": 480585, "epoch": 5790} {"train_loss": -26.99220085144043, "global_step": 480586, "epoch": 5790} {"train_loss": -27.177892684936523, "global_step": 480587, "epoch": 5790} {"train_loss": -27.0701961517334, "global_step": 480588, "epoch": 5790} {"train_loss": -26.82539176940918, "global_step": 480589, "epoch": 5790} {"train_loss": -27.11117935180664, "global_step": 480590, "epoch": 5790} {"train_loss": -27.092605590820312, "global_step": 480591, "epoch": 5790} {"train_loss": -26.8741397857666, "global_step": 480592, "epoch": 5790} {"train_loss": -26.961755752563477, "global_step": 480593, "epoch": 5790} {"train_loss": -27.150543212890625, "global_step": 480594, "epoch": 5790} {"train_loss": -27.00465202331543, "global_step": 480595, "epoch": 5790} {"train_loss": -26.999189376831055, "global_step": 480596, "epoch": 5790} {"train_loss": -27.48272132873535, "global_step": 480597, "epoch": 5790} {"train_loss": -27.139297485351562, "global_step": 480598, "epoch": 5790} {"train_loss": -26.886499404907227, "global_step": 480599, "epoch": 5790} {"train_loss": -27.6365909576416, "global_step": 480600, "epoch": 5790} {"train_loss": -27.2363338470459, "global_step": 480601, "epoch": 5790} {"train_loss": -27.407958984375, "global_step": 480602, "epoch": 5790} {"train_loss": -27.23707389831543, "global_step": 480603, "epoch": 5790} {"train_loss": -27.2227783203125, "global_step": 480604, "epoch": 5790} {"train_loss": -27.45209312438965, "global_step": 480605, "epoch": 5790} {"train_loss": -27.371850967407227, "global_step": 480606, "epoch": 5790} {"train_loss": -27.370893478393555, "global_step": 480607, "epoch": 5790} {"train_loss": -27.355823516845703, "global_step": 480608, "epoch": 5790} {"train_loss": -27.175312042236328, "global_step": 480609, "epoch": 5790} {"train_loss": -27.162189483642578, "global_step": 480610, "epoch": 5790} {"train_loss": -27.203916549682617, "global_step": 480611, "epoch": 5790} {"train_loss": -27.272504806518555, "global_step": 480612, "epoch": 5790} {"train_loss": -27.687891006469727, "global_step": 480613, "epoch": 5790} {"train_loss": -27.71241569519043, "global_step": 480614, "epoch": 5790} {"train_loss": -27.271686553955078, "global_step": 480615, "epoch": 5790} {"train_loss": -27.21919059753418, "global_step": 480616, "epoch": 5790} {"train_loss": -27.440616607666016, "global_step": 480617, "epoch": 5790} {"train_loss": -27.299646377563477, "global_step": 480618, "epoch": 5790} {"train_loss": -27.40591812133789, "global_step": 480619, "epoch": 5790} {"train_loss": -27.494543075561523, "global_step": 480620, "epoch": 5790} {"train_loss": -27.363950729370117, "global_step": 480621, "epoch": 5790} {"train_loss": -27.308469772338867, "global_step": 480622, "epoch": 5790} {"train_loss": -27.2269287109375, "global_step": 480623, "epoch": 5790} {"train_loss": -27.587987899780273, "global_step": 480624, "epoch": 5790} {"train_loss": -26.91175651550293, "global_step": 480625, "epoch": 5790} {"train_loss": -27.01136589050293, "global_step": 480626, "epoch": 5790} {"train_loss": -27.690921783447266, "global_step": 480627, "epoch": 5790} {"train_loss": -27.381214141845703, "global_step": 480628, "epoch": 5790} {"train_loss": -27.602462768554688, "global_step": 480629, "epoch": 5790} {"train_loss": -27.584375381469727, "global_step": 480630, "epoch": 5790} {"train_loss": -27.327051162719727, "global_step": 480631, "epoch": 5790} {"train_loss": -27.252765655517578, "global_step": 480632, "epoch": 5790} {"train_loss": -27.3498477935791, "global_step": 480633, "epoch": 5790} {"train_loss": -27.575809478759766, "global_step": 480634, "epoch": 5790} {"train_loss": -27.892688751220703, "global_step": 480635, "epoch": 5790} {"train_loss": -27.414325714111328, "global_step": 480636, "epoch": 5790} {"train_loss": -27.261280059814453, "global_step": 480637, "epoch": 5790} {"train_loss": -27.50489616394043, "global_step": 480638, "epoch": 5790} {"train_loss": -27.493894577026367, "global_step": 480639, "epoch": 5790} {"train_loss": -27.489608764648438, "global_step": 480640, "epoch": 5790} {"train_loss": -27.342023849487305, "global_step": 480641, "epoch": 5790} {"train_loss": -27.66693687438965, "global_step": 480642, "epoch": 5790} {"train_loss": -27.283496856689453, "global_step": 480643, "epoch": 5790} {"train_loss": -27.3448429107666, "global_step": 480644, "epoch": 5790} {"train_loss": -27.443037033081055, "global_step": 480645, "epoch": 5790} {"train_loss": -27.27032470703125, "global_step": 480646, "epoch": 5790} {"train_loss": -27.310693740844727, "global_step": 480647, "epoch": 5790} {"train_loss": -27.53424072265625, "global_step": 480648, "epoch": 5790} {"train_loss": -27.436359405517578, "global_step": 480649, "epoch": 5790} {"train_loss": -27.67693519592285, "global_step": 480650, "epoch": 5790} {"train_loss": -27.155364990234375, "global_step": 480651, "epoch": 5790} {"train_loss": -27.189062761973187, "global_step": 480652, "epoch": 5790, "val_loss": 6594919.0} {"train_loss": -26.97784423828125, "global_step": 480653, "epoch": 5791} {"train_loss": -26.21900749206543, "global_step": 480654, "epoch": 5791} {"train_loss": -26.32108497619629, "global_step": 480655, "epoch": 5791} {"train_loss": -25.825424194335938, "global_step": 480656, "epoch": 5791} {"train_loss": -25.999914169311523, "global_step": 480657, "epoch": 5791} {"train_loss": -27.148578643798828, "global_step": 480658, "epoch": 5791} {"train_loss": -26.619842529296875, "global_step": 480659, "epoch": 5791} {"train_loss": -26.6989803314209, "global_step": 480660, "epoch": 5791} {"train_loss": -26.555713653564453, "global_step": 480661, "epoch": 5791} {"train_loss": -27.158706665039062, "global_step": 480662, "epoch": 5791} {"train_loss": -26.29188346862793, "global_step": 480663, "epoch": 5791} {"train_loss": -26.785175323486328, "global_step": 480664, "epoch": 5791} {"train_loss": -26.6292724609375, "global_step": 480665, "epoch": 5791} {"train_loss": -26.510828018188477, "global_step": 480666, "epoch": 5791} {"train_loss": -26.537885665893555, "global_step": 480667, "epoch": 5791} {"train_loss": -26.612995147705078, "global_step": 480668, "epoch": 5791} {"train_loss": -26.8104305267334, "global_step": 480669, "epoch": 5791} {"train_loss": -26.318241119384766, "global_step": 480670, "epoch": 5791} {"train_loss": -26.948974609375, "global_step": 480671, "epoch": 5791} {"train_loss": -26.9910888671875, "global_step": 480672, "epoch": 5791} {"train_loss": -26.642919540405273, "global_step": 480673, "epoch": 5791} {"train_loss": -27.207324981689453, "global_step": 480674, "epoch": 5791} {"train_loss": -27.107635498046875, "global_step": 480675, "epoch": 5791} {"train_loss": -26.924421310424805, "global_step": 480676, "epoch": 5791} {"train_loss": -26.591833114624023, "global_step": 480677, "epoch": 5791} {"train_loss": -26.777820587158203, "global_step": 480678, "epoch": 5791} {"train_loss": -27.279478073120117, "global_step": 480679, "epoch": 5791} {"train_loss": -27.035202026367188, "global_step": 480680, "epoch": 5791} {"train_loss": -27.15923500061035, "global_step": 480681, "epoch": 5791} {"train_loss": -27.03264808654785, "global_step": 480682, "epoch": 5791} {"train_loss": -27.486164093017578, "global_step": 480683, "epoch": 5791} {"train_loss": -27.044952392578125, "global_step": 480684, "epoch": 5791} {"train_loss": -27.246763229370117, "global_step": 480685, "epoch": 5791} {"train_loss": -27.190542221069336, "global_step": 480686, "epoch": 5791} {"train_loss": -27.09286880493164, "global_step": 480687, "epoch": 5791} {"train_loss": -27.485761642456055, "global_step": 480688, "epoch": 5791} {"train_loss": -27.32794189453125, "global_step": 480689, "epoch": 5791} {"train_loss": -27.341657638549805, "global_step": 480690, "epoch": 5791} {"train_loss": -27.2008056640625, "global_step": 480691, "epoch": 5791} {"train_loss": -27.173282623291016, "global_step": 480692, "epoch": 5791} {"train_loss": -27.4538631439209, "global_step": 480693, "epoch": 5791} {"train_loss": -27.371564865112305, "global_step": 480694, "epoch": 5791} {"train_loss": -27.700300216674805, "global_step": 480695, "epoch": 5791} {"train_loss": -27.395374298095703, "global_step": 480696, "epoch": 5791} {"train_loss": -27.38275718688965, "global_step": 480697, "epoch": 5791} {"train_loss": -27.495208740234375, "global_step": 480698, "epoch": 5791} {"train_loss": -27.555463790893555, "global_step": 480699, "epoch": 5791} {"train_loss": -27.212270736694336, "global_step": 480700, "epoch": 5791} {"train_loss": -27.129322052001953, "global_step": 480701, "epoch": 5791} {"train_loss": -27.503726959228516, "global_step": 480702, "epoch": 5791} {"train_loss": -27.455793380737305, "global_step": 480703, "epoch": 5791} {"train_loss": -27.39484214782715, "global_step": 480704, "epoch": 5791} {"train_loss": -27.635086059570312, "global_step": 480705, "epoch": 5791} {"train_loss": -27.83119010925293, "global_step": 480706, "epoch": 5791} {"train_loss": -27.57301139831543, "global_step": 480707, "epoch": 5791} {"train_loss": -27.398883819580078, "global_step": 480708, "epoch": 5791} {"train_loss": -27.4899845123291, "global_step": 480709, "epoch": 5791} {"train_loss": -27.72492790222168, "global_step": 480710, "epoch": 5791} {"train_loss": -27.575681686401367, "global_step": 480711, "epoch": 5791} {"train_loss": -27.551197052001953, "global_step": 480712, "epoch": 5791} {"train_loss": -27.438486099243164, "global_step": 480713, "epoch": 5791} {"train_loss": -27.560972213745117, "global_step": 480714, "epoch": 5791} {"train_loss": -27.39618492126465, "global_step": 480715, "epoch": 5791} {"train_loss": -27.421863555908203, "global_step": 480716, "epoch": 5791} {"train_loss": -27.449310302734375, "global_step": 480717, "epoch": 5791} {"train_loss": -27.6048583984375, "global_step": 480718, "epoch": 5791} {"train_loss": -27.717350006103516, "global_step": 480719, "epoch": 5791} {"train_loss": -27.503156661987305, "global_step": 480720, "epoch": 5791} {"train_loss": -27.22918128967285, "global_step": 480721, "epoch": 5791} {"train_loss": -27.284610748291016, "global_step": 480722, "epoch": 5791} {"train_loss": -27.280654907226562, "global_step": 480723, "epoch": 5791} {"train_loss": -27.197616577148438, "global_step": 480724, "epoch": 5791} {"train_loss": -27.075408935546875, "global_step": 480725, "epoch": 5791} {"train_loss": -27.31304359436035, "global_step": 480726, "epoch": 5791} {"train_loss": -26.876752853393555, "global_step": 480727, "epoch": 5791} {"train_loss": -26.46929931640625, "global_step": 480728, "epoch": 5791} {"train_loss": -26.612375259399414, "global_step": 480729, "epoch": 5791} {"train_loss": -26.823348999023438, "global_step": 480730, "epoch": 5791} {"train_loss": -26.60750389099121, "global_step": 480731, "epoch": 5791} {"train_loss": -26.835187911987305, "global_step": 480732, "epoch": 5791} {"train_loss": -26.128870010375977, "global_step": 480733, "epoch": 5791} {"train_loss": -26.57843017578125, "global_step": 480734, "epoch": 5791} {"train_loss": -27.096246811280768, "global_step": 480735, "epoch": 5791, "val_loss": 6574470.0} {"train_loss": -25.545183181762695, "global_step": 480736, "epoch": 5792} {"train_loss": -24.50897216796875, "global_step": 480737, "epoch": 5792} {"train_loss": -26.383893966674805, "global_step": 480738, "epoch": 5792} {"train_loss": -25.85994529724121, "global_step": 480739, "epoch": 5792} {"train_loss": -25.775293350219727, "global_step": 480740, "epoch": 5792} {"train_loss": -26.5225887298584, "global_step": 480741, "epoch": 5792} {"train_loss": -26.216781616210938, "global_step": 480742, "epoch": 5792} {"train_loss": -26.722888946533203, "global_step": 480743, "epoch": 5792} {"train_loss": -26.242752075195312, "global_step": 480744, "epoch": 5792} {"train_loss": -26.751026153564453, "global_step": 480745, "epoch": 5792} {"train_loss": -26.325820922851562, "global_step": 480746, "epoch": 5792} {"train_loss": -26.546356201171875, "global_step": 480747, "epoch": 5792} {"train_loss": -26.341588973999023, "global_step": 480748, "epoch": 5792} {"train_loss": -26.41864013671875, "global_step": 480749, "epoch": 5792} {"train_loss": -26.6080322265625, "global_step": 480750, "epoch": 5792} {"train_loss": -26.383214950561523, "global_step": 480751, "epoch": 5792} {"train_loss": -26.793182373046875, "global_step": 480752, "epoch": 5792} {"train_loss": -26.401580810546875, "global_step": 480753, "epoch": 5792} {"train_loss": -26.509414672851562, "global_step": 480754, "epoch": 5792} {"train_loss": -26.83424186706543, "global_step": 480755, "epoch": 5792} {"train_loss": -26.4738826751709, "global_step": 480756, "epoch": 5792} {"train_loss": -26.75821876525879, "global_step": 480757, "epoch": 5792} {"train_loss": -26.945709228515625, "global_step": 480758, "epoch": 5792} {"train_loss": -26.902557373046875, "global_step": 480759, "epoch": 5792} {"train_loss": -26.87359619140625, "global_step": 480760, "epoch": 5792} {"train_loss": -27.03853416442871, "global_step": 480761, "epoch": 5792} {"train_loss": -26.974822998046875, "global_step": 480762, "epoch": 5792} {"train_loss": -27.265125274658203, "global_step": 480763, "epoch": 5792} {"train_loss": -27.11211585998535, "global_step": 480764, "epoch": 5792} {"train_loss": -26.91065788269043, "global_step": 480765, "epoch": 5792} {"train_loss": -26.833118438720703, "global_step": 480766, "epoch": 5792} {"train_loss": -27.13128089904785, "global_step": 480767, "epoch": 5792} {"train_loss": -27.148792266845703, "global_step": 480768, "epoch": 5792} {"train_loss": -26.890775680541992, "global_step": 480769, "epoch": 5792} {"train_loss": -26.932239532470703, "global_step": 480770, "epoch": 5792} {"train_loss": -27.378528594970703, "global_step": 480771, "epoch": 5792} {"train_loss": -27.42005729675293, "global_step": 480772, "epoch": 5792} {"train_loss": -27.0696964263916, "global_step": 480773, "epoch": 5792} {"train_loss": -27.197553634643555, "global_step": 480774, "epoch": 5792} {"train_loss": -27.175373077392578, "global_step": 480775, "epoch": 5792} {"train_loss": -27.272809982299805, "global_step": 480776, "epoch": 5792} {"train_loss": -27.0827579498291, "global_step": 480777, "epoch": 5792} {"train_loss": -27.325469970703125, "global_step": 480778, "epoch": 5792} {"train_loss": -26.856555938720703, "global_step": 480779, "epoch": 5792} {"train_loss": -27.202116012573242, "global_step": 480780, "epoch": 5792} {"train_loss": -26.968839645385742, "global_step": 480781, "epoch": 5792} {"train_loss": -27.654895782470703, "global_step": 480782, "epoch": 5792} {"train_loss": -27.200027465820312, "global_step": 480783, "epoch": 5792} {"train_loss": -27.36989402770996, "global_step": 480784, "epoch": 5792} {"train_loss": -27.30902671813965, "global_step": 480785, "epoch": 5792} {"train_loss": -26.857751846313477, "global_step": 480786, "epoch": 5792} {"train_loss": -27.234262466430664, "global_step": 480787, "epoch": 5792} {"train_loss": -27.53727149963379, "global_step": 480788, "epoch": 5792} {"train_loss": -27.330575942993164, "global_step": 480789, "epoch": 5792} {"train_loss": -27.4993839263916, "global_step": 480790, "epoch": 5792} {"train_loss": -27.526447296142578, "global_step": 480791, "epoch": 5792} {"train_loss": -27.096271514892578, "global_step": 480792, "epoch": 5792} {"train_loss": -27.272680282592773, "global_step": 480793, "epoch": 5792} {"train_loss": -27.692642211914062, "global_step": 480794, "epoch": 5792} {"train_loss": -27.499868392944336, "global_step": 480795, "epoch": 5792} {"train_loss": -27.303991317749023, "global_step": 480796, "epoch": 5792} {"train_loss": -27.624866485595703, "global_step": 480797, "epoch": 5792} {"train_loss": -27.5305118560791, "global_step": 480798, "epoch": 5792} {"train_loss": -27.534635543823242, "global_step": 480799, "epoch": 5792} {"train_loss": -27.337055206298828, "global_step": 480800, "epoch": 5792} {"train_loss": -27.2625675201416, "global_step": 480801, "epoch": 5792} {"train_loss": -27.420074462890625, "global_step": 480802, "epoch": 5792} {"train_loss": -26.932287216186523, "global_step": 480803, "epoch": 5792} {"train_loss": -27.051898956298828, "global_step": 480804, "epoch": 5792} {"train_loss": -27.699359893798828, "global_step": 480805, "epoch": 5792} {"train_loss": -27.556482315063477, "global_step": 480806, "epoch": 5792} {"train_loss": -27.259292602539062, "global_step": 480807, "epoch": 5792} {"train_loss": -27.53297233581543, "global_step": 480808, "epoch": 5792} {"train_loss": -27.48708152770996, "global_step": 480809, "epoch": 5792} {"train_loss": -27.07763671875, "global_step": 480810, "epoch": 5792} {"train_loss": -27.338415145874023, "global_step": 480811, "epoch": 5792} {"train_loss": -27.135053634643555, "global_step": 480812, "epoch": 5792} {"train_loss": -27.64822769165039, "global_step": 480813, "epoch": 5792} {"train_loss": -26.856342315673828, "global_step": 480814, "epoch": 5792} {"train_loss": -26.968292236328125, "global_step": 480815, "epoch": 5792} {"train_loss": -27.060293197631836, "global_step": 480816, "epoch": 5792} {"train_loss": -27.291858673095703, "global_step": 480817, "epoch": 5792} {"train_loss": -26.98543472749641, "global_step": 480818, "epoch": 5792, "val_loss": 6529911.5} {"train_loss": -26.2763729095459, "global_step": 480819, "epoch": 5793} {"train_loss": -24.965635299682617, "global_step": 480820, "epoch": 5793} {"train_loss": -25.004596710205078, "global_step": 480821, "epoch": 5793} {"train_loss": -25.7296199798584, "global_step": 480822, "epoch": 5793} {"train_loss": -26.533105850219727, "global_step": 480823, "epoch": 5793} {"train_loss": -25.97920799255371, "global_step": 480824, "epoch": 5793} {"train_loss": -26.279443740844727, "global_step": 480825, "epoch": 5793} {"train_loss": -26.740217208862305, "global_step": 480826, "epoch": 5793} {"train_loss": -26.71363639831543, "global_step": 480827, "epoch": 5793} {"train_loss": -26.602569580078125, "global_step": 480828, "epoch": 5793} {"train_loss": -26.557758331298828, "global_step": 480829, "epoch": 5793} {"train_loss": -26.58856201171875, "global_step": 480830, "epoch": 5793} {"train_loss": -26.780683517456055, "global_step": 480831, "epoch": 5793} {"train_loss": -26.743513107299805, "global_step": 480832, "epoch": 5793} {"train_loss": -26.623077392578125, "global_step": 480833, "epoch": 5793} {"train_loss": -26.833967208862305, "global_step": 480834, "epoch": 5793} {"train_loss": -26.72588539123535, "global_step": 480835, "epoch": 5793} {"train_loss": -26.433835983276367, "global_step": 480836, "epoch": 5793} {"train_loss": -26.61712074279785, "global_step": 480837, "epoch": 5793} {"train_loss": -26.737085342407227, "global_step": 480838, "epoch": 5793} {"train_loss": -26.8192195892334, "global_step": 480839, "epoch": 5793} {"train_loss": -26.550796508789062, "global_step": 480840, "epoch": 5793} {"train_loss": -26.950414657592773, "global_step": 480841, "epoch": 5793} {"train_loss": -26.71919059753418, "global_step": 480842, "epoch": 5793} {"train_loss": -26.925216674804688, "global_step": 480843, "epoch": 5793} {"train_loss": -27.274938583374023, "global_step": 480844, "epoch": 5793} {"train_loss": -27.05010414123535, "global_step": 480845, "epoch": 5793} {"train_loss": -27.100849151611328, "global_step": 480846, "epoch": 5793} {"train_loss": -27.310155868530273, "global_step": 480847, "epoch": 5793} {"train_loss": -27.1445369720459, "global_step": 480848, "epoch": 5793} {"train_loss": -26.896575927734375, "global_step": 480849, "epoch": 5793} {"train_loss": -27.52631187438965, "global_step": 480850, "epoch": 5793} {"train_loss": -26.87326431274414, "global_step": 480851, "epoch": 5793} {"train_loss": -27.202392578125, "global_step": 480852, "epoch": 5793} {"train_loss": -27.035663604736328, "global_step": 480853, "epoch": 5793} {"train_loss": -27.22245216369629, "global_step": 480854, "epoch": 5793} {"train_loss": -27.15118980407715, "global_step": 480855, "epoch": 5793} {"train_loss": -27.456953048706055, "global_step": 480856, "epoch": 5793} {"train_loss": -27.692096710205078, "global_step": 480857, "epoch": 5793} {"train_loss": -27.19325065612793, "global_step": 480858, "epoch": 5793} {"train_loss": -27.413419723510742, "global_step": 480859, "epoch": 5793} {"train_loss": -27.700048446655273, "global_step": 480860, "epoch": 5793} {"train_loss": -27.645965576171875, "global_step": 480861, "epoch": 5793} {"train_loss": -27.662939071655273, "global_step": 480862, "epoch": 5793} {"train_loss": -27.542036056518555, "global_step": 480863, "epoch": 5793} {"train_loss": -27.046613693237305, "global_step": 480864, "epoch": 5793} {"train_loss": -27.693979263305664, "global_step": 480865, "epoch": 5793} {"train_loss": -27.91725730895996, "global_step": 480866, "epoch": 5793} {"train_loss": -27.419897079467773, "global_step": 480867, "epoch": 5793} {"train_loss": -27.360462188720703, "global_step": 480868, "epoch": 5793} {"train_loss": -27.750171661376953, "global_step": 480869, "epoch": 5793} {"train_loss": -27.448328018188477, "global_step": 480870, "epoch": 5793} {"train_loss": -27.408649444580078, "global_step": 480871, "epoch": 5793} {"train_loss": -27.253812789916992, "global_step": 480872, "epoch": 5793} {"train_loss": -27.22587013244629, "global_step": 480873, "epoch": 5793} {"train_loss": -27.504724502563477, "global_step": 480874, "epoch": 5793} {"train_loss": -27.508481979370117, "global_step": 480875, "epoch": 5793} {"train_loss": -27.297473907470703, "global_step": 480876, "epoch": 5793} {"train_loss": -27.065210342407227, "global_step": 480877, "epoch": 5793} {"train_loss": -27.295740127563477, "global_step": 480878, "epoch": 5793} {"train_loss": -27.314664840698242, "global_step": 480879, "epoch": 5793} {"train_loss": -27.558156967163086, "global_step": 480880, "epoch": 5793} {"train_loss": -27.284881591796875, "global_step": 480881, "epoch": 5793} {"train_loss": -26.968402862548828, "global_step": 480882, "epoch": 5793} {"train_loss": -27.439197540283203, "global_step": 480883, "epoch": 5793} {"train_loss": -27.456436157226562, "global_step": 480884, "epoch": 5793} {"train_loss": -26.94251823425293, "global_step": 480885, "epoch": 5793} {"train_loss": -27.641376495361328, "global_step": 480886, "epoch": 5793} {"train_loss": -27.365692138671875, "global_step": 480887, "epoch": 5793} {"train_loss": -27.2578067779541, "global_step": 480888, "epoch": 5793} {"train_loss": -27.40142822265625, "global_step": 480889, "epoch": 5793} {"train_loss": -27.156991958618164, "global_step": 480890, "epoch": 5793} {"train_loss": -27.34749412536621, "global_step": 480891, "epoch": 5793} {"train_loss": -27.21229362487793, "global_step": 480892, "epoch": 5793} {"train_loss": -27.693490982055664, "global_step": 480893, "epoch": 5793} {"train_loss": -27.396188735961914, "global_step": 480894, "epoch": 5793} {"train_loss": -27.1949405670166, "global_step": 480895, "epoch": 5793} {"train_loss": -26.719274520874023, "global_step": 480896, "epoch": 5793} {"train_loss": -27.151630401611328, "global_step": 480897, "epoch": 5793} {"train_loss": -27.316791534423828, "global_step": 480898, "epoch": 5793} {"train_loss": -27.211313247680664, "global_step": 480899, "epoch": 5793} {"train_loss": -27.339466094970703, "global_step": 480900, "epoch": 5793} {"train_loss": -27.054161554359528, "global_step": 480901, "epoch": 5793, "val_loss": 6565789.0} {"train_loss": -27.068161010742188, "global_step": 480902, "epoch": 5794} {"train_loss": -26.59430503845215, "global_step": 480903, "epoch": 5794} {"train_loss": -26.5556583404541, "global_step": 480904, "epoch": 5794} {"train_loss": -26.598669052124023, "global_step": 480905, "epoch": 5794} {"train_loss": -26.620059967041016, "global_step": 480906, "epoch": 5794} {"train_loss": -26.57390785217285, "global_step": 480907, "epoch": 5794} {"train_loss": -26.410232543945312, "global_step": 480908, "epoch": 5794} {"train_loss": -27.230894088745117, "global_step": 480909, "epoch": 5794} {"train_loss": -26.980545043945312, "global_step": 480910, "epoch": 5794} {"train_loss": -26.751697540283203, "global_step": 480911, "epoch": 5794} {"train_loss": -27.204559326171875, "global_step": 480912, "epoch": 5794} {"train_loss": -27.104246139526367, "global_step": 480913, "epoch": 5794} {"train_loss": -27.079792022705078, "global_step": 480914, "epoch": 5794} {"train_loss": -26.754093170166016, "global_step": 480915, "epoch": 5794} {"train_loss": -27.297149658203125, "global_step": 480916, "epoch": 5794} {"train_loss": -26.984678268432617, "global_step": 480917, "epoch": 5794} {"train_loss": -26.872161865234375, "global_step": 480918, "epoch": 5794} {"train_loss": -27.05378532409668, "global_step": 480919, "epoch": 5794} {"train_loss": -26.895429611206055, "global_step": 480920, "epoch": 5794} {"train_loss": -27.4954891204834, "global_step": 480921, "epoch": 5794} {"train_loss": -27.27170753479004, "global_step": 480922, "epoch": 5794} {"train_loss": -27.49469566345215, "global_step": 480923, "epoch": 5794} {"train_loss": -27.35687255859375, "global_step": 480924, "epoch": 5794} {"train_loss": -27.41682243347168, "global_step": 480925, "epoch": 5794} {"train_loss": -26.97247886657715, "global_step": 480926, "epoch": 5794} {"train_loss": -27.528589248657227, "global_step": 480927, "epoch": 5794} {"train_loss": -27.353803634643555, "global_step": 480928, "epoch": 5794} {"train_loss": -27.465307235717773, "global_step": 480929, "epoch": 5794} {"train_loss": -27.387420654296875, "global_step": 480930, "epoch": 5794} {"train_loss": -27.43744468688965, "global_step": 480931, "epoch": 5794} {"train_loss": -27.602680206298828, "global_step": 480932, "epoch": 5794} {"train_loss": -27.366933822631836, "global_step": 480933, "epoch": 5794} {"train_loss": -27.237714767456055, "global_step": 480934, "epoch": 5794} {"train_loss": -27.01950454711914, "global_step": 480935, "epoch": 5794} {"train_loss": -27.140979766845703, "global_step": 480936, "epoch": 5794} {"train_loss": -27.257360458374023, "global_step": 480937, "epoch": 5794} {"train_loss": -27.55994987487793, "global_step": 480938, "epoch": 5794} {"train_loss": -27.702035903930664, "global_step": 480939, "epoch": 5794} {"train_loss": -27.3797607421875, "global_step": 480940, "epoch": 5794} {"train_loss": -27.281692504882812, "global_step": 480941, "epoch": 5794} {"train_loss": -27.261432647705078, "global_step": 480942, "epoch": 5794} {"train_loss": -27.59779167175293, "global_step": 480943, "epoch": 5794} {"train_loss": -27.56256675720215, "global_step": 480944, "epoch": 5794} {"train_loss": -27.295181274414062, "global_step": 480945, "epoch": 5794} {"train_loss": -26.959142684936523, "global_step": 480946, "epoch": 5794} {"train_loss": -26.94095802307129, "global_step": 480947, "epoch": 5794} {"train_loss": -27.304738998413086, "global_step": 480948, "epoch": 5794} {"train_loss": -27.265644073486328, "global_step": 480949, "epoch": 5794} {"train_loss": -27.260156631469727, "global_step": 480950, "epoch": 5794} {"train_loss": -27.428613662719727, "global_step": 480951, "epoch": 5794} {"train_loss": -27.12505531311035, "global_step": 480952, "epoch": 5794} {"train_loss": -27.5170841217041, "global_step": 480953, "epoch": 5794} {"train_loss": -27.541034698486328, "global_step": 480954, "epoch": 5794} {"train_loss": -27.0889892578125, "global_step": 480955, "epoch": 5794} {"train_loss": -27.46479606628418, "global_step": 480956, "epoch": 5794} {"train_loss": -27.26410484313965, "global_step": 480957, "epoch": 5794} {"train_loss": -27.17494773864746, "global_step": 480958, "epoch": 5794} {"train_loss": -27.4229736328125, "global_step": 480959, "epoch": 5794} {"train_loss": -27.32330894470215, "global_step": 480960, "epoch": 5794} {"train_loss": -27.34735679626465, "global_step": 480961, "epoch": 5794} {"train_loss": -27.413000106811523, "global_step": 480962, "epoch": 5794} {"train_loss": -27.083337783813477, "global_step": 480963, "epoch": 5794} {"train_loss": -27.618087768554688, "global_step": 480964, "epoch": 5794} {"train_loss": -27.308002471923828, "global_step": 480965, "epoch": 5794} {"train_loss": -27.280054092407227, "global_step": 480966, "epoch": 5794} {"train_loss": -27.282678604125977, "global_step": 480967, "epoch": 5794} {"train_loss": -27.40555191040039, "global_step": 480968, "epoch": 5794} {"train_loss": -27.41951560974121, "global_step": 480969, "epoch": 5794} {"train_loss": -27.572900772094727, "global_step": 480970, "epoch": 5794} {"train_loss": -27.341358184814453, "global_step": 480971, "epoch": 5794} {"train_loss": -27.33893394470215, "global_step": 480972, "epoch": 5794} {"train_loss": -27.379331588745117, "global_step": 480973, "epoch": 5794} {"train_loss": -27.57183837890625, "global_step": 480974, "epoch": 5794} {"train_loss": -27.24268913269043, "global_step": 480975, "epoch": 5794} {"train_loss": -27.476837158203125, "global_step": 480976, "epoch": 5794} {"train_loss": -27.191389083862305, "global_step": 480977, "epoch": 5794} {"train_loss": -27.031829833984375, "global_step": 480978, "epoch": 5794} {"train_loss": -27.3974552154541, "global_step": 480979, "epoch": 5794} {"train_loss": -27.402341842651367, "global_step": 480980, "epoch": 5794} {"train_loss": -27.383859634399414, "global_step": 480981, "epoch": 5794} {"train_loss": -27.109960556030273, "global_step": 480982, "epoch": 5794} {"train_loss": -27.46112632751465, "global_step": 480983, "epoch": 5794} {"train_loss": -27.258607542658428, "global_step": 480984, "epoch": 5794, "val_loss": 6601344.5} {"train_loss": -25.45458984375, "global_step": 480985, "epoch": 5795} {"train_loss": -25.562204360961914, "global_step": 480986, "epoch": 5795} {"train_loss": -25.05433464050293, "global_step": 480987, "epoch": 5795} {"train_loss": -26.673114776611328, "global_step": 480988, "epoch": 5795} {"train_loss": -25.783430099487305, "global_step": 480989, "epoch": 5795} {"train_loss": -25.998188018798828, "global_step": 480990, "epoch": 5795} {"train_loss": -26.694849014282227, "global_step": 480991, "epoch": 5795} {"train_loss": -26.554391860961914, "global_step": 480992, "epoch": 5795} {"train_loss": -26.345861434936523, "global_step": 480993, "epoch": 5795} {"train_loss": -26.525928497314453, "global_step": 480994, "epoch": 5795} {"train_loss": -26.653181076049805, "global_step": 480995, "epoch": 5795} {"train_loss": -26.262739181518555, "global_step": 480996, "epoch": 5795} {"train_loss": -26.633548736572266, "global_step": 480997, "epoch": 5795} {"train_loss": -26.6201229095459, "global_step": 480998, "epoch": 5795} {"train_loss": -26.26222801208496, "global_step": 480999, "epoch": 5795} {"train_loss": -26.705957412719727, "global_step": 481000, "epoch": 5795} {"train_loss": -26.649221420288086, "global_step": 481001, "epoch": 5795} {"train_loss": -26.7213191986084, "global_step": 481002, "epoch": 5795} {"train_loss": -26.776050567626953, "global_step": 481003, "epoch": 5795} {"train_loss": -26.94423484802246, "global_step": 481004, "epoch": 5795} {"train_loss": -26.700559616088867, "global_step": 481005, "epoch": 5795} {"train_loss": -26.592559814453125, "global_step": 481006, "epoch": 5795} {"train_loss": -27.156604766845703, "global_step": 481007, "epoch": 5795} {"train_loss": -27.00210952758789, "global_step": 481008, "epoch": 5795} {"train_loss": -26.70180320739746, "global_step": 481009, "epoch": 5795} {"train_loss": -26.85151481628418, "global_step": 481010, "epoch": 5795} {"train_loss": -26.927509307861328, "global_step": 481011, "epoch": 5795} {"train_loss": -26.912466049194336, "global_step": 481012, "epoch": 5795} {"train_loss": -26.96637535095215, "global_step": 481013, "epoch": 5795} {"train_loss": -26.589502334594727, "global_step": 481014, "epoch": 5795} {"train_loss": -27.10016441345215, "global_step": 481015, "epoch": 5795} {"train_loss": -27.155670166015625, "global_step": 481016, "epoch": 5795} {"train_loss": -27.242706298828125, "global_step": 481017, "epoch": 5795} {"train_loss": -27.211978912353516, "global_step": 481018, "epoch": 5795} {"train_loss": -27.235095977783203, "global_step": 481019, "epoch": 5795} {"train_loss": -27.150650024414062, "global_step": 481020, "epoch": 5795} {"train_loss": -27.040149688720703, "global_step": 481021, "epoch": 5795} {"train_loss": -27.3640193939209, "global_step": 481022, "epoch": 5795} {"train_loss": -27.233118057250977, "global_step": 481023, "epoch": 5795} {"train_loss": -27.06780433654785, "global_step": 481024, "epoch": 5795} {"train_loss": -27.197891235351562, "global_step": 481025, "epoch": 5795} {"train_loss": -27.335254669189453, "global_step": 481026, "epoch": 5795} {"train_loss": -27.051971435546875, "global_step": 481027, "epoch": 5795} {"train_loss": -27.670703887939453, "global_step": 481028, "epoch": 5795} {"train_loss": -27.283960342407227, "global_step": 481029, "epoch": 5795} {"train_loss": -27.576690673828125, "global_step": 481030, "epoch": 5795} {"train_loss": -27.487783432006836, "global_step": 481031, "epoch": 5795} {"train_loss": -26.86750602722168, "global_step": 481032, "epoch": 5795} {"train_loss": -27.325519561767578, "global_step": 481033, "epoch": 5795} {"train_loss": -27.37922477722168, "global_step": 481034, "epoch": 5795} {"train_loss": -27.645751953125, "global_step": 481035, "epoch": 5795} {"train_loss": -27.200353622436523, "global_step": 481036, "epoch": 5795} {"train_loss": -27.617223739624023, "global_step": 481037, "epoch": 5795} {"train_loss": -27.633264541625977, "global_step": 481038, "epoch": 5795} {"train_loss": -27.487775802612305, "global_step": 481039, "epoch": 5795} {"train_loss": -27.5244083404541, "global_step": 481040, "epoch": 5795} {"train_loss": -27.937971115112305, "global_step": 481041, "epoch": 5795} {"train_loss": -27.42642593383789, "global_step": 481042, "epoch": 5795} {"train_loss": -27.691633224487305, "global_step": 481043, "epoch": 5795} {"train_loss": -27.242847442626953, "global_step": 481044, "epoch": 5795} {"train_loss": -27.615324020385742, "global_step": 481045, "epoch": 5795} {"train_loss": -27.161237716674805, "global_step": 481046, "epoch": 5795} {"train_loss": -27.491369247436523, "global_step": 481047, "epoch": 5795} {"train_loss": -27.740833282470703, "global_step": 481048, "epoch": 5795} {"train_loss": -27.480173110961914, "global_step": 481049, "epoch": 5795} {"train_loss": -27.2948055267334, "global_step": 481050, "epoch": 5795} {"train_loss": -27.314136505126953, "global_step": 481051, "epoch": 5795} {"train_loss": -27.298980712890625, "global_step": 481052, "epoch": 5795} {"train_loss": -27.888635635375977, "global_step": 481053, "epoch": 5795} {"train_loss": -27.373952865600586, "global_step": 481054, "epoch": 5795} {"train_loss": -27.382282257080078, "global_step": 481055, "epoch": 5795} {"train_loss": -27.805471420288086, "global_step": 481056, "epoch": 5795} {"train_loss": -27.1424617767334, "global_step": 481057, "epoch": 5795} {"train_loss": -27.118982315063477, "global_step": 481058, "epoch": 5795} {"train_loss": -26.549726486206055, "global_step": 481059, "epoch": 5795} {"train_loss": -26.193511962890625, "global_step": 481060, "epoch": 5795} {"train_loss": -25.280563354492188, "global_step": 481061, "epoch": 5795} {"train_loss": -25.843921661376953, "global_step": 481062, "epoch": 5795} {"train_loss": -26.997167587280273, "global_step": 481063, "epoch": 5795} {"train_loss": -26.43667984008789, "global_step": 481064, "epoch": 5795} {"train_loss": -26.444448471069336, "global_step": 481065, "epoch": 5795} {"train_loss": -27.025287628173828, "global_step": 481066, "epoch": 5795} {"train_loss": -26.95256359605904, "global_step": 481067, "epoch": 5795, "val_loss": 6519004.0} {"train_loss": -25.780908584594727, "global_step": 481068, "epoch": 5796} {"train_loss": -26.28862953186035, "global_step": 481069, "epoch": 5796} {"train_loss": -26.602176666259766, "global_step": 481070, "epoch": 5796} {"train_loss": -26.0882625579834, "global_step": 481071, "epoch": 5796} {"train_loss": -26.832242965698242, "global_step": 481072, "epoch": 5796} {"train_loss": -26.16008949279785, "global_step": 481073, "epoch": 5796} {"train_loss": -26.4674015045166, "global_step": 481074, "epoch": 5796} {"train_loss": -26.507099151611328, "global_step": 481075, "epoch": 5796} {"train_loss": -26.180078506469727, "global_step": 481076, "epoch": 5796} {"train_loss": -26.200345993041992, "global_step": 481077, "epoch": 5796} {"train_loss": -26.433979034423828, "global_step": 481078, "epoch": 5796} {"train_loss": -26.671239852905273, "global_step": 481079, "epoch": 5796} {"train_loss": -26.374074935913086, "global_step": 481080, "epoch": 5796} {"train_loss": -26.400541305541992, "global_step": 481081, "epoch": 5796} {"train_loss": -26.927106857299805, "global_step": 481082, "epoch": 5796} {"train_loss": -26.54726219177246, "global_step": 481083, "epoch": 5796} {"train_loss": -26.867055892944336, "global_step": 481084, "epoch": 5796} {"train_loss": -26.684202194213867, "global_step": 481085, "epoch": 5796} {"train_loss": -26.703161239624023, "global_step": 481086, "epoch": 5796} {"train_loss": -26.593130111694336, "global_step": 481087, "epoch": 5796} {"train_loss": -27.137964248657227, "global_step": 481088, "epoch": 5796} {"train_loss": -26.923898696899414, "global_step": 481089, "epoch": 5796} {"train_loss": -26.764835357666016, "global_step": 481090, "epoch": 5796} {"train_loss": -26.955951690673828, "global_step": 481091, "epoch": 5796} {"train_loss": -26.796798706054688, "global_step": 481092, "epoch": 5796} {"train_loss": -27.476364135742188, "global_step": 481093, "epoch": 5796} {"train_loss": -26.98740005493164, "global_step": 481094, "epoch": 5796} {"train_loss": -27.002527236938477, "global_step": 481095, "epoch": 5796} {"train_loss": -27.271284103393555, "global_step": 481096, "epoch": 5796} {"train_loss": -26.78763198852539, "global_step": 481097, "epoch": 5796} {"train_loss": -26.95271110534668, "global_step": 481098, "epoch": 5796} {"train_loss": -26.953815460205078, "global_step": 481099, "epoch": 5796} {"train_loss": -26.79450035095215, "global_step": 481100, "epoch": 5796} {"train_loss": -27.084409713745117, "global_step": 481101, "epoch": 5796} {"train_loss": -27.16876220703125, "global_step": 481102, "epoch": 5796} {"train_loss": -26.856122970581055, "global_step": 481103, "epoch": 5796} {"train_loss": -27.294178009033203, "global_step": 481104, "epoch": 5796} {"train_loss": -27.2242374420166, "global_step": 481105, "epoch": 5796} {"train_loss": -27.418973922729492, "global_step": 481106, "epoch": 5796} {"train_loss": -27.654525756835938, "global_step": 481107, "epoch": 5796} {"train_loss": -27.15913963317871, "global_step": 481108, "epoch": 5796} {"train_loss": -27.215734481811523, "global_step": 481109, "epoch": 5796} {"train_loss": -27.22613525390625, "global_step": 481110, "epoch": 5796} {"train_loss": -27.55072021484375, "global_step": 481111, "epoch": 5796} {"train_loss": -27.255634307861328, "global_step": 481112, "epoch": 5796} {"train_loss": -27.32370376586914, "global_step": 481113, "epoch": 5796} {"train_loss": -27.517749786376953, "global_step": 481114, "epoch": 5796} {"train_loss": -27.902368545532227, "global_step": 481115, "epoch": 5796} {"train_loss": -27.345584869384766, "global_step": 481116, "epoch": 5796} {"train_loss": -27.41019058227539, "global_step": 481117, "epoch": 5796} {"train_loss": -27.455890655517578, "global_step": 481118, "epoch": 5796} {"train_loss": -27.6476993560791, "global_step": 481119, "epoch": 5796} {"train_loss": -27.554290771484375, "global_step": 481120, "epoch": 5796} {"train_loss": -27.496692657470703, "global_step": 481121, "epoch": 5796} {"train_loss": -27.406885147094727, "global_step": 481122, "epoch": 5796} {"train_loss": -27.51869773864746, "global_step": 481123, "epoch": 5796} {"train_loss": -27.435102462768555, "global_step": 481124, "epoch": 5796} {"train_loss": -26.915735244750977, "global_step": 481125, "epoch": 5796} {"train_loss": -27.347700119018555, "global_step": 481126, "epoch": 5796} {"train_loss": -27.54265785217285, "global_step": 481127, "epoch": 5796} {"train_loss": -27.393024444580078, "global_step": 481128, "epoch": 5796} {"train_loss": -27.67702293395996, "global_step": 481129, "epoch": 5796} {"train_loss": -27.138071060180664, "global_step": 481130, "epoch": 5796} {"train_loss": -27.328754425048828, "global_step": 481131, "epoch": 5796} {"train_loss": -27.735044479370117, "global_step": 481132, "epoch": 5796} {"train_loss": -27.4041805267334, "global_step": 481133, "epoch": 5796} {"train_loss": -27.489795684814453, "global_step": 481134, "epoch": 5796} {"train_loss": -27.0888671875, "global_step": 481135, "epoch": 5796} {"train_loss": -27.662097930908203, "global_step": 481136, "epoch": 5796} {"train_loss": -27.57417106628418, "global_step": 481137, "epoch": 5796} {"train_loss": -27.443084716796875, "global_step": 481138, "epoch": 5796} {"train_loss": -27.12263298034668, "global_step": 481139, "epoch": 5796} {"train_loss": -27.057310104370117, "global_step": 481140, "epoch": 5796} {"train_loss": -26.88482666015625, "global_step": 481141, "epoch": 5796} {"train_loss": -27.36964225769043, "global_step": 481142, "epoch": 5796} {"train_loss": -27.33877944946289, "global_step": 481143, "epoch": 5796} {"train_loss": -27.3953914642334, "global_step": 481144, "epoch": 5796} {"train_loss": -27.4344425201416, "global_step": 481145, "epoch": 5796} {"train_loss": -27.453088760375977, "global_step": 481146, "epoch": 5796} {"train_loss": -27.42942237854004, "global_step": 481147, "epoch": 5796} {"train_loss": -27.447072982788086, "global_step": 481148, "epoch": 5796} {"train_loss": -27.476537704467773, "global_step": 481149, "epoch": 5796} {"train_loss": -27.092941973582807, "global_step": 481150, "epoch": 5796, "val_loss": 6487777.5} {"train_loss": -27.119678497314453, "global_step": 481151, "epoch": 5797} {"train_loss": -26.729543685913086, "global_step": 481152, "epoch": 5797} {"train_loss": -27.005781173706055, "global_step": 481153, "epoch": 5797} {"train_loss": -26.7132511138916, "global_step": 481154, "epoch": 5797} {"train_loss": -26.875253677368164, "global_step": 481155, "epoch": 5797} {"train_loss": -26.92745018005371, "global_step": 481156, "epoch": 5797} {"train_loss": -27.15675163269043, "global_step": 481157, "epoch": 5797} {"train_loss": -26.930511474609375, "global_step": 481158, "epoch": 5797} {"train_loss": -26.910903930664062, "global_step": 481159, "epoch": 5797} {"train_loss": -26.94732666015625, "global_step": 481160, "epoch": 5797} {"train_loss": -27.102819442749023, "global_step": 481161, "epoch": 5797} {"train_loss": -26.825265884399414, "global_step": 481162, "epoch": 5797} {"train_loss": -26.900726318359375, "global_step": 481163, "epoch": 5797} {"train_loss": -27.266189575195312, "global_step": 481164, "epoch": 5797} {"train_loss": -26.850482940673828, "global_step": 481165, "epoch": 5797} {"train_loss": -27.21161460876465, "global_step": 481166, "epoch": 5797} {"train_loss": -27.455961227416992, "global_step": 481167, "epoch": 5797} {"train_loss": -26.66294288635254, "global_step": 481168, "epoch": 5797} {"train_loss": -26.887937545776367, "global_step": 481169, "epoch": 5797} {"train_loss": -26.57309913635254, "global_step": 481170, "epoch": 5797} {"train_loss": -27.09174156188965, "global_step": 481171, "epoch": 5797} {"train_loss": -27.194929122924805, "global_step": 481172, "epoch": 5797} {"train_loss": -26.974563598632812, "global_step": 481173, "epoch": 5797} {"train_loss": -26.957660675048828, "global_step": 481174, "epoch": 5797} {"train_loss": -27.07547950744629, "global_step": 481175, "epoch": 5797} {"train_loss": -27.224048614501953, "global_step": 481176, "epoch": 5797} {"train_loss": -27.1048641204834, "global_step": 481177, "epoch": 5797} {"train_loss": -26.838150024414062, "global_step": 481178, "epoch": 5797} {"train_loss": -26.447355270385742, "global_step": 481179, "epoch": 5797} {"train_loss": -26.831418991088867, "global_step": 481180, "epoch": 5797} {"train_loss": -27.180768966674805, "global_step": 481181, "epoch": 5797} {"train_loss": -27.24995994567871, "global_step": 481182, "epoch": 5797} {"train_loss": -26.97108268737793, "global_step": 481183, "epoch": 5797} {"train_loss": -27.27186393737793, "global_step": 481184, "epoch": 5797} {"train_loss": -26.72650146484375, "global_step": 481185, "epoch": 5797} {"train_loss": -27.14792823791504, "global_step": 481186, "epoch": 5797} {"train_loss": -27.08466911315918, "global_step": 481187, "epoch": 5797} {"train_loss": -27.149250030517578, "global_step": 481188, "epoch": 5797} {"train_loss": -27.196943283081055, "global_step": 481189, "epoch": 5797} {"train_loss": -27.02888298034668, "global_step": 481190, "epoch": 5797} {"train_loss": -27.175092697143555, "global_step": 481191, "epoch": 5797} {"train_loss": -26.95734214782715, "global_step": 481192, "epoch": 5797} {"train_loss": -27.302764892578125, "global_step": 481193, "epoch": 5797} {"train_loss": -27.5164794921875, "global_step": 481194, "epoch": 5797} {"train_loss": -27.495838165283203, "global_step": 481195, "epoch": 5797} {"train_loss": -27.21075439453125, "global_step": 481196, "epoch": 5797} {"train_loss": -27.433303833007812, "global_step": 481197, "epoch": 5797} {"train_loss": -27.26832389831543, "global_step": 481198, "epoch": 5797} {"train_loss": -27.544666290283203, "global_step": 481199, "epoch": 5797} {"train_loss": -27.34975242614746, "global_step": 481200, "epoch": 5797} {"train_loss": -27.16421890258789, "global_step": 481201, "epoch": 5797} {"train_loss": -27.4857234954834, "global_step": 481202, "epoch": 5797} {"train_loss": -27.3968563079834, "global_step": 481203, "epoch": 5797} {"train_loss": -27.23923110961914, "global_step": 481204, "epoch": 5797} {"train_loss": -27.62725257873535, "global_step": 481205, "epoch": 5797} {"train_loss": -27.739171981811523, "global_step": 481206, "epoch": 5797} {"train_loss": -27.374755859375, "global_step": 481207, "epoch": 5797} {"train_loss": -27.330541610717773, "global_step": 481208, "epoch": 5797} {"train_loss": -27.60165786743164, "global_step": 481209, "epoch": 5797} {"train_loss": -27.33454704284668, "global_step": 481210, "epoch": 5797} {"train_loss": -27.295888900756836, "global_step": 481211, "epoch": 5797} {"train_loss": -27.669031143188477, "global_step": 481212, "epoch": 5797} {"train_loss": -27.19782829284668, "global_step": 481213, "epoch": 5797} {"train_loss": -27.42352867126465, "global_step": 481214, "epoch": 5797} {"train_loss": -27.20766258239746, "global_step": 481215, "epoch": 5797} {"train_loss": -27.228118896484375, "global_step": 481216, "epoch": 5797} {"train_loss": -27.173742294311523, "global_step": 481217, "epoch": 5797} {"train_loss": -26.962173461914062, "global_step": 481218, "epoch": 5797} {"train_loss": -27.37213706970215, "global_step": 481219, "epoch": 5797} {"train_loss": -26.861682891845703, "global_step": 481220, "epoch": 5797} {"train_loss": -26.96075439453125, "global_step": 481221, "epoch": 5797} {"train_loss": -26.764419555664062, "global_step": 481222, "epoch": 5797} {"train_loss": -26.81925392150879, "global_step": 481223, "epoch": 5797} {"train_loss": -27.411909103393555, "global_step": 481224, "epoch": 5797} {"train_loss": -27.0821590423584, "global_step": 481225, "epoch": 5797} {"train_loss": -26.63083839416504, "global_step": 481226, "epoch": 5797} {"train_loss": -26.961780548095703, "global_step": 481227, "epoch": 5797} {"train_loss": -27.53253173828125, "global_step": 481228, "epoch": 5797} {"train_loss": -27.30242347717285, "global_step": 481229, "epoch": 5797} {"train_loss": -26.859228134155273, "global_step": 481230, "epoch": 5797} {"train_loss": -27.137319564819336, "global_step": 481231, "epoch": 5797} {"train_loss": -27.33441162109375, "global_step": 481232, "epoch": 5797} {"train_loss": -27.135768568659405, "global_step": 481233, "epoch": 5797, "val_loss": 6526718.0} {"train_loss": -25.97699546813965, "global_step": 481234, "epoch": 5798} {"train_loss": -25.658166885375977, "global_step": 481235, "epoch": 5798} {"train_loss": -26.326770782470703, "global_step": 481236, "epoch": 5798} {"train_loss": -26.26386070251465, "global_step": 481237, "epoch": 5798} {"train_loss": -26.531147003173828, "global_step": 481238, "epoch": 5798} {"train_loss": -25.842618942260742, "global_step": 481239, "epoch": 5798} {"train_loss": -26.483179092407227, "global_step": 481240, "epoch": 5798} {"train_loss": -26.120832443237305, "global_step": 481241, "epoch": 5798} {"train_loss": -26.92414665222168, "global_step": 481242, "epoch": 5798} {"train_loss": -26.571887969970703, "global_step": 481243, "epoch": 5798} {"train_loss": -26.35302734375, "global_step": 481244, "epoch": 5798} {"train_loss": -26.3927001953125, "global_step": 481245, "epoch": 5798} {"train_loss": -26.867431640625, "global_step": 481246, "epoch": 5798} {"train_loss": -26.523670196533203, "global_step": 481247, "epoch": 5798} {"train_loss": -26.51030921936035, "global_step": 481248, "epoch": 5798} {"train_loss": -26.66366958618164, "global_step": 481249, "epoch": 5798} {"train_loss": -26.4864444732666, "global_step": 481250, "epoch": 5798} {"train_loss": -26.741809844970703, "global_step": 481251, "epoch": 5798} {"train_loss": -26.763233184814453, "global_step": 481252, "epoch": 5798} {"train_loss": -26.5496883392334, "global_step": 481253, "epoch": 5798} {"train_loss": -26.907928466796875, "global_step": 481254, "epoch": 5798} {"train_loss": -27.3439998626709, "global_step": 481255, "epoch": 5798} {"train_loss": -26.798084259033203, "global_step": 481256, "epoch": 5798} {"train_loss": -27.02980613708496, "global_step": 481257, "epoch": 5798} {"train_loss": -27.004526138305664, "global_step": 481258, "epoch": 5798} {"train_loss": -27.460622787475586, "global_step": 481259, "epoch": 5798} {"train_loss": -26.84661865234375, "global_step": 481260, "epoch": 5798} {"train_loss": -27.174413681030273, "global_step": 481261, "epoch": 5798} {"train_loss": -26.952184677124023, "global_step": 481262, "epoch": 5798} {"train_loss": -27.260278701782227, "global_step": 481263, "epoch": 5798} {"train_loss": -27.0579833984375, "global_step": 481264, "epoch": 5798} {"train_loss": -27.051227569580078, "global_step": 481265, "epoch": 5798} {"train_loss": -26.858518600463867, "global_step": 481266, "epoch": 5798} {"train_loss": -27.25286865234375, "global_step": 481267, "epoch": 5798} {"train_loss": -27.12171745300293, "global_step": 481268, "epoch": 5798} {"train_loss": -26.934513092041016, "global_step": 481269, "epoch": 5798} {"train_loss": -27.018171310424805, "global_step": 481270, "epoch": 5798} {"train_loss": -27.076618194580078, "global_step": 481271, "epoch": 5798} {"train_loss": -27.118087768554688, "global_step": 481272, "epoch": 5798} {"train_loss": -27.4588623046875, "global_step": 481273, "epoch": 5798} {"train_loss": -27.25433349609375, "global_step": 481274, "epoch": 5798} {"train_loss": -27.433929443359375, "global_step": 481275, "epoch": 5798} {"train_loss": -27.19125747680664, "global_step": 481276, "epoch": 5798} {"train_loss": -27.260358810424805, "global_step": 481277, "epoch": 5798} {"train_loss": -27.399930953979492, "global_step": 481278, "epoch": 5798} {"train_loss": -27.67938232421875, "global_step": 481279, "epoch": 5798} {"train_loss": -27.222766876220703, "global_step": 481280, "epoch": 5798} {"train_loss": -27.42156982421875, "global_step": 481281, "epoch": 5798} {"train_loss": -27.152746200561523, "global_step": 481282, "epoch": 5798} {"train_loss": -27.078937530517578, "global_step": 481283, "epoch": 5798} {"train_loss": -27.40506362915039, "global_step": 481284, "epoch": 5798} {"train_loss": -26.982751846313477, "global_step": 481285, "epoch": 5798} {"train_loss": -27.2028751373291, "global_step": 481286, "epoch": 5798} {"train_loss": -27.373212814331055, "global_step": 481287, "epoch": 5798} {"train_loss": -27.46189308166504, "global_step": 481288, "epoch": 5798} {"train_loss": -26.940200805664062, "global_step": 481289, "epoch": 5798} {"train_loss": -27.83564567565918, "global_step": 481290, "epoch": 5798} {"train_loss": -27.289936065673828, "global_step": 481291, "epoch": 5798} {"train_loss": -27.28028678894043, "global_step": 481292, "epoch": 5798} {"train_loss": -27.607751846313477, "global_step": 481293, "epoch": 5798} {"train_loss": -27.741378784179688, "global_step": 481294, "epoch": 5798} {"train_loss": -27.664594650268555, "global_step": 481295, "epoch": 5798} {"train_loss": -27.25568962097168, "global_step": 481296, "epoch": 5798} {"train_loss": -26.561004638671875, "global_step": 481297, "epoch": 5798} {"train_loss": -27.139923095703125, "global_step": 481298, "epoch": 5798} {"train_loss": -27.57537841796875, "global_step": 481299, "epoch": 5798} {"train_loss": -27.4287052154541, "global_step": 481300, "epoch": 5798} {"train_loss": -27.46356773376465, "global_step": 481301, "epoch": 5798} {"train_loss": -27.43854331970215, "global_step": 481302, "epoch": 5798} {"train_loss": -26.93995475769043, "global_step": 481303, "epoch": 5798} {"train_loss": -27.1768856048584, "global_step": 481304, "epoch": 5798} {"train_loss": -27.25796890258789, "global_step": 481305, "epoch": 5798} {"train_loss": -27.204938888549805, "global_step": 481306, "epoch": 5798} {"train_loss": -26.96343421936035, "global_step": 481307, "epoch": 5798} {"train_loss": -27.492223739624023, "global_step": 481308, "epoch": 5798} {"train_loss": -27.21258544921875, "global_step": 481309, "epoch": 5798} {"train_loss": -26.884845733642578, "global_step": 481310, "epoch": 5798} {"train_loss": -27.137136459350586, "global_step": 481311, "epoch": 5798} {"train_loss": -27.19428825378418, "global_step": 481312, "epoch": 5798} {"train_loss": -26.826919555664062, "global_step": 481313, "epoch": 5798} {"train_loss": -27.453332901000977, "global_step": 481314, "epoch": 5798} {"train_loss": -26.5883731842041, "global_step": 481315, "epoch": 5798} {"train_loss": -27.029918555753778, "global_step": 481316, "epoch": 5798, "val_loss": 6553905.0} {"train_loss": -24.253747940063477, "global_step": 481317, "epoch": 5799} {"train_loss": -24.10343360900879, "global_step": 481318, "epoch": 5799} {"train_loss": -25.05906105041504, "global_step": 481319, "epoch": 5799} {"train_loss": -24.947763442993164, "global_step": 481320, "epoch": 5799} {"train_loss": -24.890565872192383, "global_step": 481321, "epoch": 5799} {"train_loss": -25.2507381439209, "global_step": 481322, "epoch": 5799} {"train_loss": -25.788482666015625, "global_step": 481323, "epoch": 5799} {"train_loss": -25.883407592773438, "global_step": 481324, "epoch": 5799} {"train_loss": -26.36159324645996, "global_step": 481325, "epoch": 5799} {"train_loss": -25.903100967407227, "global_step": 481326, "epoch": 5799} {"train_loss": -26.17145347595215, "global_step": 481327, "epoch": 5799} {"train_loss": -26.010263442993164, "global_step": 481328, "epoch": 5799} {"train_loss": -26.217517852783203, "global_step": 481329, "epoch": 5799} {"train_loss": -26.211271286010742, "global_step": 481330, "epoch": 5799} {"train_loss": -26.25421714782715, "global_step": 481331, "epoch": 5799} {"train_loss": -26.55311393737793, "global_step": 481332, "epoch": 5799} {"train_loss": -26.735715866088867, "global_step": 481333, "epoch": 5799} {"train_loss": -26.4882755279541, "global_step": 481334, "epoch": 5799} {"train_loss": -26.35736083984375, "global_step": 481335, "epoch": 5799} {"train_loss": -26.757131576538086, "global_step": 481336, "epoch": 5799} {"train_loss": -26.202762603759766, "global_step": 481337, "epoch": 5799} {"train_loss": -26.70167350769043, "global_step": 481338, "epoch": 5799} {"train_loss": -26.753881454467773, "global_step": 481339, "epoch": 5799} {"train_loss": -26.868940353393555, "global_step": 481340, "epoch": 5799} {"train_loss": -26.519453048706055, "global_step": 481341, "epoch": 5799} {"train_loss": -26.8450984954834, "global_step": 481342, "epoch": 5799} {"train_loss": -27.036279678344727, "global_step": 481343, "epoch": 5799} {"train_loss": -26.92879295349121, "global_step": 481344, "epoch": 5799} {"train_loss": -26.86764907836914, "global_step": 481345, "epoch": 5799} {"train_loss": -26.871692657470703, "global_step": 481346, "epoch": 5799} {"train_loss": -27.175189971923828, "global_step": 481347, "epoch": 5799} {"train_loss": -27.208703994750977, "global_step": 481348, "epoch": 5799} {"train_loss": -27.090124130249023, "global_step": 481349, "epoch": 5799} {"train_loss": -26.720380783081055, "global_step": 481350, "epoch": 5799} {"train_loss": -26.82342529296875, "global_step": 481351, "epoch": 5799} {"train_loss": -27.086294174194336, "global_step": 481352, "epoch": 5799} {"train_loss": -27.004566192626953, "global_step": 481353, "epoch": 5799} {"train_loss": -27.123640060424805, "global_step": 481354, "epoch": 5799} {"train_loss": -27.287128448486328, "global_step": 481355, "epoch": 5799} {"train_loss": -27.116682052612305, "global_step": 481356, "epoch": 5799} {"train_loss": -27.1456298828125, "global_step": 481357, "epoch": 5799} {"train_loss": -26.952436447143555, "global_step": 481358, "epoch": 5799} {"train_loss": -26.90620231628418, "global_step": 481359, "epoch": 5799} {"train_loss": -26.947052001953125, "global_step": 481360, "epoch": 5799} {"train_loss": -27.283649444580078, "global_step": 481361, "epoch": 5799} {"train_loss": -27.128347396850586, "global_step": 481362, "epoch": 5799} {"train_loss": -27.130834579467773, "global_step": 481363, "epoch": 5799} {"train_loss": -27.501544952392578, "global_step": 481364, "epoch": 5799} {"train_loss": -27.360265731811523, "global_step": 481365, "epoch": 5799} {"train_loss": -27.03411865234375, "global_step": 481366, "epoch": 5799} {"train_loss": -27.380252838134766, "global_step": 481367, "epoch": 5799} {"train_loss": -27.60881996154785, "global_step": 481368, "epoch": 5799} {"train_loss": -27.50592613220215, "global_step": 481369, "epoch": 5799} {"train_loss": -27.42950439453125, "global_step": 481370, "epoch": 5799} {"train_loss": -27.578693389892578, "global_step": 481371, "epoch": 5799} {"train_loss": -27.323749542236328, "global_step": 481372, "epoch": 5799} {"train_loss": -27.08332633972168, "global_step": 481373, "epoch": 5799} {"train_loss": -27.461111068725586, "global_step": 481374, "epoch": 5799} {"train_loss": -27.222747802734375, "global_step": 481375, "epoch": 5799} {"train_loss": -26.959136962890625, "global_step": 481376, "epoch": 5799} {"train_loss": -27.50347328186035, "global_step": 481377, "epoch": 5799} {"train_loss": -27.28716468811035, "global_step": 481378, "epoch": 5799} {"train_loss": -27.545215606689453, "global_step": 481379, "epoch": 5799} {"train_loss": -27.019479751586914, "global_step": 481380, "epoch": 5799} {"train_loss": -27.605188369750977, "global_step": 481381, "epoch": 5799} {"train_loss": -27.3062686920166, "global_step": 481382, "epoch": 5799} {"train_loss": -27.57851219177246, "global_step": 481383, "epoch": 5799} {"train_loss": -27.316064834594727, "global_step": 481384, "epoch": 5799} {"train_loss": -27.41609001159668, "global_step": 481385, "epoch": 5799} {"train_loss": -27.367462158203125, "global_step": 481386, "epoch": 5799} {"train_loss": -26.959613800048828, "global_step": 481387, "epoch": 5799} {"train_loss": -27.103967666625977, "global_step": 481388, "epoch": 5799} {"train_loss": -26.53580093383789, "global_step": 481389, "epoch": 5799} {"train_loss": -26.2537784576416, "global_step": 481390, "epoch": 5799} {"train_loss": -26.678796768188477, "global_step": 481391, "epoch": 5799} {"train_loss": -27.122297286987305, "global_step": 481392, "epoch": 5799} {"train_loss": -26.152023315429688, "global_step": 481393, "epoch": 5799} {"train_loss": -25.95172119140625, "global_step": 481394, "epoch": 5799} {"train_loss": -26.718732833862305, "global_step": 481395, "epoch": 5799} {"train_loss": -26.81308937072754, "global_step": 481396, "epoch": 5799} {"train_loss": -26.89129638671875, "global_step": 481397, "epoch": 5799} {"train_loss": -26.87302017211914, "global_step": 481398, "epoch": 5799} {"train_loss": -26.741369408297253, "global_step": 481399, "epoch": 5799, "val_loss": 6692821.0} {"train_loss": -26.433334350585938, "global_step": 481400, "epoch": 5800} {"train_loss": -24.725263595581055, "global_step": 481401, "epoch": 5800} {"train_loss": -26.083011627197266, "global_step": 481402, "epoch": 5800} {"train_loss": -25.801233291625977, "global_step": 481403, "epoch": 5800} {"train_loss": -25.96731948852539, "global_step": 481404, "epoch": 5800} {"train_loss": -25.255189895629883, "global_step": 481405, "epoch": 5800} {"train_loss": -26.869293212890625, "global_step": 481406, "epoch": 5800} {"train_loss": -25.8001766204834, "global_step": 481407, "epoch": 5800} {"train_loss": -26.331457138061523, "global_step": 481408, "epoch": 5800} {"train_loss": -26.35731315612793, "global_step": 481409, "epoch": 5800} {"train_loss": -26.25652503967285, "global_step": 481410, "epoch": 5800} {"train_loss": -26.6584529876709, "global_step": 481411, "epoch": 5800} {"train_loss": -26.313343048095703, "global_step": 481412, "epoch": 5800} {"train_loss": -26.702383041381836, "global_step": 481413, "epoch": 5800} {"train_loss": -26.9057674407959, "global_step": 481414, "epoch": 5800} {"train_loss": -26.468000411987305, "global_step": 481415, "epoch": 5800} {"train_loss": -26.274524688720703, "global_step": 481416, "epoch": 5800} {"train_loss": -26.516393661499023, "global_step": 481417, "epoch": 5800} {"train_loss": -26.872577667236328, "global_step": 481418, "epoch": 5800} {"train_loss": -26.092554092407227, "global_step": 481419, "epoch": 5800} {"train_loss": -26.94366455078125, "global_step": 481420, "epoch": 5800} {"train_loss": -27.176023483276367, "global_step": 481421, "epoch": 5800} {"train_loss": -26.90874671936035, "global_step": 481422, "epoch": 5800} {"train_loss": -26.603744506835938, "global_step": 481423, "epoch": 5800} {"train_loss": -27.0169734954834, "global_step": 481424, "epoch": 5800} {"train_loss": -26.93277931213379, "global_step": 481425, "epoch": 5800} {"train_loss": -26.8840389251709, "global_step": 481426, "epoch": 5800} {"train_loss": -26.78667640686035, "global_step": 481427, "epoch": 5800} {"train_loss": -26.792709350585938, "global_step": 481428, "epoch": 5800} {"train_loss": -26.904264450073242, "global_step": 481429, "epoch": 5800} {"train_loss": -27.369415283203125, "global_step": 481430, "epoch": 5800} {"train_loss": -27.2342586517334, "global_step": 481431, "epoch": 5800} {"train_loss": -27.08609962463379, "global_step": 481432, "epoch": 5800} {"train_loss": -27.1677188873291, "global_step": 481433, "epoch": 5800} {"train_loss": -26.86285400390625, "global_step": 481434, "epoch": 5800} {"train_loss": -27.54754638671875, "global_step": 481435, "epoch": 5800} {"train_loss": -27.204654693603516, "global_step": 481436, "epoch": 5800} {"train_loss": -26.91981315612793, "global_step": 481437, "epoch": 5800} {"train_loss": -27.1973876953125, "global_step": 481438, "epoch": 5800} {"train_loss": -27.1746768951416, "global_step": 481439, "epoch": 5800} {"train_loss": -27.230161666870117, "global_step": 481440, "epoch": 5800} {"train_loss": -27.13028907775879, "global_step": 481441, "epoch": 5800} {"train_loss": -27.13934326171875, "global_step": 481442, "epoch": 5800} {"train_loss": -27.0836124420166, "global_step": 481443, "epoch": 5800} {"train_loss": -27.083520889282227, "global_step": 481444, "epoch": 5800} {"train_loss": -27.489850997924805, "global_step": 481445, "epoch": 5800} {"train_loss": -27.414594650268555, "global_step": 481446, "epoch": 5800} {"train_loss": -27.272062301635742, "global_step": 481447, "epoch": 5800} {"train_loss": -27.589506149291992, "global_step": 481448, "epoch": 5800} {"train_loss": -27.04052734375, "global_step": 481449, "epoch": 5800} {"train_loss": -27.39643669128418, "global_step": 481450, "epoch": 5800} {"train_loss": -27.244665145874023, "global_step": 481451, "epoch": 5800} {"train_loss": -27.634815216064453, "global_step": 481452, "epoch": 5800} {"train_loss": -27.372541427612305, "global_step": 481453, "epoch": 5800} {"train_loss": -27.2631778717041, "global_step": 481454, "epoch": 5800} {"train_loss": -27.584686279296875, "global_step": 481455, "epoch": 5800} {"train_loss": -27.327802658081055, "global_step": 481456, "epoch": 5800} {"train_loss": -27.49700927734375, "global_step": 481457, "epoch": 5800} {"train_loss": -27.36785316467285, "global_step": 481458, "epoch": 5800} {"train_loss": -27.137720108032227, "global_step": 481459, "epoch": 5800} {"train_loss": -27.837528228759766, "global_step": 481460, "epoch": 5800} {"train_loss": -27.326826095581055, "global_step": 481461, "epoch": 5800} {"train_loss": -27.281423568725586, "global_step": 481462, "epoch": 5800} {"train_loss": -27.8389892578125, "global_step": 481463, "epoch": 5800} {"train_loss": -27.003753662109375, "global_step": 481464, "epoch": 5800} {"train_loss": -27.135589599609375, "global_step": 481465, "epoch": 5800} {"train_loss": -27.543231964111328, "global_step": 481466, "epoch": 5800} {"train_loss": -27.17803955078125, "global_step": 481467, "epoch": 5800} {"train_loss": -27.59891128540039, "global_step": 481468, "epoch": 5800} {"train_loss": -27.348615646362305, "global_step": 481469, "epoch": 5800} {"train_loss": -27.133670806884766, "global_step": 481470, "epoch": 5800} {"train_loss": -27.055150985717773, "global_step": 481471, "epoch": 5800} {"train_loss": -27.346179962158203, "global_step": 481472, "epoch": 5800} {"train_loss": -27.32295799255371, "global_step": 481473, "epoch": 5800} {"train_loss": -27.016529083251953, "global_step": 481474, "epoch": 5800} {"train_loss": -27.126554489135742, "global_step": 481475, "epoch": 5800} {"train_loss": -27.129499435424805, "global_step": 481476, "epoch": 5800} {"train_loss": -26.953039169311523, "global_step": 481477, "epoch": 5800} {"train_loss": -27.337020874023438, "global_step": 481478, "epoch": 5800} {"train_loss": -27.193958282470703, "global_step": 481479, "epoch": 5800} {"train_loss": -27.29231071472168, "global_step": 481480, "epoch": 5800} {"train_loss": -27.442981719970703, "global_step": 481481, "epoch": 5800} {"train_loss": -26.98126163252865, "global_step": 481482, "epoch": 5800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6632626.5} {"train_loss": -26.931934356689453, "global_step": 481483, "epoch": 5801} {"train_loss": -26.401968002319336, "global_step": 481484, "epoch": 5801} {"train_loss": -26.863311767578125, "global_step": 481485, "epoch": 5801} {"train_loss": -26.3916015625, "global_step": 481486, "epoch": 5801} {"train_loss": -26.808637619018555, "global_step": 481487, "epoch": 5801} {"train_loss": -26.701190948486328, "global_step": 481488, "epoch": 5801} {"train_loss": -26.63245964050293, "global_step": 481489, "epoch": 5801} {"train_loss": -26.850854873657227, "global_step": 481490, "epoch": 5801} {"train_loss": -27.010944366455078, "global_step": 481491, "epoch": 5801} {"train_loss": -27.26153564453125, "global_step": 481492, "epoch": 5801} {"train_loss": -26.795917510986328, "global_step": 481493, "epoch": 5801} {"train_loss": -26.59406852722168, "global_step": 481494, "epoch": 5801} {"train_loss": -26.647424697875977, "global_step": 481495, "epoch": 5801} {"train_loss": -26.95269203186035, "global_step": 481496, "epoch": 5801} {"train_loss": -26.945270538330078, "global_step": 481497, "epoch": 5801} {"train_loss": -26.553564071655273, "global_step": 481498, "epoch": 5801} {"train_loss": -26.313032150268555, "global_step": 481499, "epoch": 5801} {"train_loss": -26.82477378845215, "global_step": 481500, "epoch": 5801} {"train_loss": -27.05112648010254, "global_step": 481501, "epoch": 5801} {"train_loss": -26.63233757019043, "global_step": 481502, "epoch": 5801} {"train_loss": -26.996658325195312, "global_step": 481503, "epoch": 5801} {"train_loss": -27.248804092407227, "global_step": 481504, "epoch": 5801} {"train_loss": -26.880094528198242, "global_step": 481505, "epoch": 5801} {"train_loss": -26.7603759765625, "global_step": 481506, "epoch": 5801} {"train_loss": -26.4830379486084, "global_step": 481507, "epoch": 5801} {"train_loss": -26.978931427001953, "global_step": 481508, "epoch": 5801} {"train_loss": -26.829345703125, "global_step": 481509, "epoch": 5801} {"train_loss": -27.362131118774414, "global_step": 481510, "epoch": 5801} {"train_loss": -27.103422164916992, "global_step": 481511, "epoch": 5801} {"train_loss": -27.386062622070312, "global_step": 481512, "epoch": 5801} {"train_loss": -27.15216064453125, "global_step": 481513, "epoch": 5801} {"train_loss": -27.394886016845703, "global_step": 481514, "epoch": 5801} {"train_loss": -27.505834579467773, "global_step": 481515, "epoch": 5801} {"train_loss": -27.406782150268555, "global_step": 481516, "epoch": 5801} {"train_loss": -27.56998062133789, "global_step": 481517, "epoch": 5801} {"train_loss": -27.26295280456543, "global_step": 481518, "epoch": 5801} {"train_loss": -27.302541732788086, "global_step": 481519, "epoch": 5801} {"train_loss": -27.341650009155273, "global_step": 481520, "epoch": 5801} {"train_loss": -27.251087188720703, "global_step": 481521, "epoch": 5801} {"train_loss": -27.604475021362305, "global_step": 481522, "epoch": 5801} {"train_loss": -27.4300594329834, "global_step": 481523, "epoch": 5801} {"train_loss": -27.360143661499023, "global_step": 481524, "epoch": 5801} {"train_loss": -27.360864639282227, "global_step": 481525, "epoch": 5801} {"train_loss": -27.366592407226562, "global_step": 481526, "epoch": 5801} {"train_loss": -27.656085968017578, "global_step": 481527, "epoch": 5801} {"train_loss": -27.8575439453125, "global_step": 481528, "epoch": 5801} {"train_loss": -27.521026611328125, "global_step": 481529, "epoch": 5801} {"train_loss": -27.05647087097168, "global_step": 481530, "epoch": 5801} {"train_loss": -26.929845809936523, "global_step": 481531, "epoch": 5801} {"train_loss": -27.242456436157227, "global_step": 481532, "epoch": 5801} {"train_loss": -27.669824600219727, "global_step": 481533, "epoch": 5801} {"train_loss": -27.546667098999023, "global_step": 481534, "epoch": 5801} {"train_loss": -27.267547607421875, "global_step": 481535, "epoch": 5801} {"train_loss": -27.584762573242188, "global_step": 481536, "epoch": 5801} {"train_loss": -26.869827270507812, "global_step": 481537, "epoch": 5801} {"train_loss": -26.660877227783203, "global_step": 481538, "epoch": 5801} {"train_loss": -27.089651107788086, "global_step": 481539, "epoch": 5801} {"train_loss": -27.3750057220459, "global_step": 481540, "epoch": 5801} {"train_loss": -27.228757858276367, "global_step": 481541, "epoch": 5801} {"train_loss": -27.35202980041504, "global_step": 481542, "epoch": 5801} {"train_loss": -27.573699951171875, "global_step": 481543, "epoch": 5801} {"train_loss": -27.21656608581543, "global_step": 481544, "epoch": 5801} {"train_loss": -27.269821166992188, "global_step": 481545, "epoch": 5801} {"train_loss": -27.15386390686035, "global_step": 481546, "epoch": 5801} {"train_loss": -27.363296508789062, "global_step": 481547, "epoch": 5801} {"train_loss": -27.560056686401367, "global_step": 481548, "epoch": 5801} {"train_loss": -27.300031661987305, "global_step": 481549, "epoch": 5801} {"train_loss": -27.361835479736328, "global_step": 481550, "epoch": 5801} {"train_loss": -27.72273826599121, "global_step": 481551, "epoch": 5801} {"train_loss": -27.43937110900879, "global_step": 481552, "epoch": 5801} {"train_loss": -27.288532257080078, "global_step": 481553, "epoch": 5801} {"train_loss": -27.72715187072754, "global_step": 481554, "epoch": 5801} {"train_loss": -27.647785186767578, "global_step": 481555, "epoch": 5801} {"train_loss": -27.536457061767578, "global_step": 481556, "epoch": 5801} {"train_loss": -27.472320556640625, "global_step": 481557, "epoch": 5801} {"train_loss": -27.444299697875977, "global_step": 481558, "epoch": 5801} {"train_loss": -27.426694869995117, "global_step": 481559, "epoch": 5801} {"train_loss": -27.412260055541992, "global_step": 481560, "epoch": 5801} {"train_loss": -27.29473304748535, "global_step": 481561, "epoch": 5801} {"train_loss": -27.251117706298828, "global_step": 481562, "epoch": 5801} {"train_loss": -27.000890731811523, "global_step": 481563, "epoch": 5801} {"train_loss": -27.352624893188477, "global_step": 481564, "epoch": 5801} {"train_loss": -27.168694323804004, "global_step": 481565, "epoch": 5801, "val_loss": 6741640.5} {"train_loss": -26.314367294311523, "global_step": 481566, "epoch": 5802} {"train_loss": -26.492694854736328, "global_step": 481567, "epoch": 5802} {"train_loss": -25.829797744750977, "global_step": 481568, "epoch": 5802} {"train_loss": -25.532625198364258, "global_step": 481569, "epoch": 5802} {"train_loss": -25.74653434753418, "global_step": 481570, "epoch": 5802} {"train_loss": -26.67050552368164, "global_step": 481571, "epoch": 5802} {"train_loss": -26.5394229888916, "global_step": 481572, "epoch": 5802} {"train_loss": -26.46272087097168, "global_step": 481573, "epoch": 5802} {"train_loss": -26.337812423706055, "global_step": 481574, "epoch": 5802} {"train_loss": -25.874094009399414, "global_step": 481575, "epoch": 5802} {"train_loss": -26.78858757019043, "global_step": 481576, "epoch": 5802} {"train_loss": -26.267614364624023, "global_step": 481577, "epoch": 5802} {"train_loss": -26.62919044494629, "global_step": 481578, "epoch": 5802} {"train_loss": -27.087793350219727, "global_step": 481579, "epoch": 5802} {"train_loss": -27.235254287719727, "global_step": 481580, "epoch": 5802} {"train_loss": -26.843957901000977, "global_step": 481581, "epoch": 5802} {"train_loss": -26.682966232299805, "global_step": 481582, "epoch": 5802} {"train_loss": -26.2744140625, "global_step": 481583, "epoch": 5802} {"train_loss": -26.717700958251953, "global_step": 481584, "epoch": 5802} {"train_loss": -26.99554443359375, "global_step": 481585, "epoch": 5802} {"train_loss": -26.950336456298828, "global_step": 481586, "epoch": 5802} {"train_loss": -27.24356460571289, "global_step": 481587, "epoch": 5802} {"train_loss": -26.868215560913086, "global_step": 481588, "epoch": 5802} {"train_loss": -27.109586715698242, "global_step": 481589, "epoch": 5802} {"train_loss": -27.20795249938965, "global_step": 481590, "epoch": 5802} {"train_loss": -26.876516342163086, "global_step": 481591, "epoch": 5802} {"train_loss": -27.143680572509766, "global_step": 481592, "epoch": 5802} {"train_loss": -27.19904136657715, "global_step": 481593, "epoch": 5802} {"train_loss": -26.986392974853516, "global_step": 481594, "epoch": 5802} {"train_loss": -27.088260650634766, "global_step": 481595, "epoch": 5802} {"train_loss": -27.430419921875, "global_step": 481596, "epoch": 5802} {"train_loss": -27.219120025634766, "global_step": 481597, "epoch": 5802} {"train_loss": -27.20877456665039, "global_step": 481598, "epoch": 5802} {"train_loss": -26.9152774810791, "global_step": 481599, "epoch": 5802} {"train_loss": -26.984949111938477, "global_step": 481600, "epoch": 5802} {"train_loss": -27.265167236328125, "global_step": 481601, "epoch": 5802} {"train_loss": -27.201902389526367, "global_step": 481602, "epoch": 5802} {"train_loss": -27.463123321533203, "global_step": 481603, "epoch": 5802} {"train_loss": -27.612394332885742, "global_step": 481604, "epoch": 5802} {"train_loss": -27.2819881439209, "global_step": 481605, "epoch": 5802} {"train_loss": -27.54094886779785, "global_step": 481606, "epoch": 5802} {"train_loss": -27.087726593017578, "global_step": 481607, "epoch": 5802} {"train_loss": -27.373403549194336, "global_step": 481608, "epoch": 5802} {"train_loss": -27.008609771728516, "global_step": 481609, "epoch": 5802} {"train_loss": -27.430252075195312, "global_step": 481610, "epoch": 5802} {"train_loss": -27.293304443359375, "global_step": 481611, "epoch": 5802} {"train_loss": -27.029157638549805, "global_step": 481612, "epoch": 5802} {"train_loss": -27.287616729736328, "global_step": 481613, "epoch": 5802} {"train_loss": -26.786182403564453, "global_step": 481614, "epoch": 5802} {"train_loss": -26.992130279541016, "global_step": 481615, "epoch": 5802} {"train_loss": -27.262426376342773, "global_step": 481616, "epoch": 5802} {"train_loss": -26.922393798828125, "global_step": 481617, "epoch": 5802} {"train_loss": -26.95542335510254, "global_step": 481618, "epoch": 5802} {"train_loss": -27.46243667602539, "global_step": 481619, "epoch": 5802} {"train_loss": -27.14637565612793, "global_step": 481620, "epoch": 5802} {"train_loss": -27.46619987487793, "global_step": 481621, "epoch": 5802} {"train_loss": -27.2941837310791, "global_step": 481622, "epoch": 5802} {"train_loss": -27.028579711914062, "global_step": 481623, "epoch": 5802} {"train_loss": -27.65168571472168, "global_step": 481624, "epoch": 5802} {"train_loss": -26.683517456054688, "global_step": 481625, "epoch": 5802} {"train_loss": -27.113035202026367, "global_step": 481626, "epoch": 5802} {"train_loss": -27.24018669128418, "global_step": 481627, "epoch": 5802} {"train_loss": -27.215192794799805, "global_step": 481628, "epoch": 5802} {"train_loss": -27.044599533081055, "global_step": 481629, "epoch": 5802} {"train_loss": -27.753808975219727, "global_step": 481630, "epoch": 5802} {"train_loss": -27.169782638549805, "global_step": 481631, "epoch": 5802} {"train_loss": -26.9255428314209, "global_step": 481632, "epoch": 5802} {"train_loss": -27.025848388671875, "global_step": 481633, "epoch": 5802} {"train_loss": -27.195219039916992, "global_step": 481634, "epoch": 5802} {"train_loss": -27.413711547851562, "global_step": 481635, "epoch": 5802} {"train_loss": -27.0340633392334, "global_step": 481636, "epoch": 5802} {"train_loss": -27.171743392944336, "global_step": 481637, "epoch": 5802} {"train_loss": -27.079639434814453, "global_step": 481638, "epoch": 5802} {"train_loss": -27.117238998413086, "global_step": 481639, "epoch": 5802} {"train_loss": -27.540082931518555, "global_step": 481640, "epoch": 5802} {"train_loss": -26.959177017211914, "global_step": 481641, "epoch": 5802} {"train_loss": -27.173095703125, "global_step": 481642, "epoch": 5802} {"train_loss": -27.096832275390625, "global_step": 481643, "epoch": 5802} {"train_loss": -27.330276489257812, "global_step": 481644, "epoch": 5802} {"train_loss": -26.9659423828125, "global_step": 481645, "epoch": 5802} {"train_loss": -27.061201095581055, "global_step": 481646, "epoch": 5802} {"train_loss": -27.251447677612305, "global_step": 481647, "epoch": 5802} {"train_loss": -27.01584197814206, "global_step": 481648, "epoch": 5802, "val_loss": 6664241.0} {"train_loss": -26.34027099609375, "global_step": 481649, "epoch": 5803} {"train_loss": -26.53302574157715, "global_step": 481650, "epoch": 5803} {"train_loss": -26.2645206451416, "global_step": 481651, "epoch": 5803} {"train_loss": -26.47712516784668, "global_step": 481652, "epoch": 5803} {"train_loss": -26.52678871154785, "global_step": 481653, "epoch": 5803} {"train_loss": -26.682432174682617, "global_step": 481654, "epoch": 5803} {"train_loss": -26.516925811767578, "global_step": 481655, "epoch": 5803} {"train_loss": -26.77179527282715, "global_step": 481656, "epoch": 5803} {"train_loss": -26.616607666015625, "global_step": 481657, "epoch": 5803} {"train_loss": -27.186620712280273, "global_step": 481658, "epoch": 5803} {"train_loss": -27.1164493560791, "global_step": 481659, "epoch": 5803} {"train_loss": -26.63596534729004, "global_step": 481660, "epoch": 5803} {"train_loss": -27.152099609375, "global_step": 481661, "epoch": 5803} {"train_loss": -27.2842960357666, "global_step": 481662, "epoch": 5803} {"train_loss": -26.534351348876953, "global_step": 481663, "epoch": 5803} {"train_loss": -27.334247589111328, "global_step": 481664, "epoch": 5803} {"train_loss": -27.19464111328125, "global_step": 481665, "epoch": 5803} {"train_loss": -26.95436668395996, "global_step": 481666, "epoch": 5803} {"train_loss": -27.348535537719727, "global_step": 481667, "epoch": 5803} {"train_loss": -27.128759384155273, "global_step": 481668, "epoch": 5803} {"train_loss": -27.062213897705078, "global_step": 481669, "epoch": 5803} {"train_loss": -27.242923736572266, "global_step": 481670, "epoch": 5803} {"train_loss": -27.523792266845703, "global_step": 481671, "epoch": 5803} {"train_loss": -27.33099937438965, "global_step": 481672, "epoch": 5803} {"train_loss": -27.47005271911621, "global_step": 481673, "epoch": 5803} {"train_loss": -27.286588668823242, "global_step": 481674, "epoch": 5803} {"train_loss": -27.438663482666016, "global_step": 481675, "epoch": 5803} {"train_loss": -27.365442276000977, "global_step": 481676, "epoch": 5803} {"train_loss": -27.18051528930664, "global_step": 481677, "epoch": 5803} {"train_loss": -27.28558349609375, "global_step": 481678, "epoch": 5803} {"train_loss": -27.282779693603516, "global_step": 481679, "epoch": 5803} {"train_loss": -27.39371681213379, "global_step": 481680, "epoch": 5803} {"train_loss": -27.402502059936523, "global_step": 481681, "epoch": 5803} {"train_loss": -27.47625160217285, "global_step": 481682, "epoch": 5803} {"train_loss": -27.04029655456543, "global_step": 481683, "epoch": 5803} {"train_loss": -27.150190353393555, "global_step": 481684, "epoch": 5803} {"train_loss": -27.10431480407715, "global_step": 481685, "epoch": 5803} {"train_loss": -27.400175094604492, "global_step": 481686, "epoch": 5803} {"train_loss": -27.342788696289062, "global_step": 481687, "epoch": 5803} {"train_loss": -27.171606063842773, "global_step": 481688, "epoch": 5803} {"train_loss": -27.51173973083496, "global_step": 481689, "epoch": 5803} {"train_loss": -28.004667282104492, "global_step": 481690, "epoch": 5803} {"train_loss": -27.53021812438965, "global_step": 481691, "epoch": 5803} {"train_loss": -27.205352783203125, "global_step": 481692, "epoch": 5803} {"train_loss": -27.155115127563477, "global_step": 481693, "epoch": 5803} {"train_loss": -27.54035758972168, "global_step": 481694, "epoch": 5803} {"train_loss": -27.27566909790039, "global_step": 481695, "epoch": 5803} {"train_loss": -27.192716598510742, "global_step": 481696, "epoch": 5803} {"train_loss": -27.37798500061035, "global_step": 481697, "epoch": 5803} {"train_loss": -27.56640625, "global_step": 481698, "epoch": 5803} {"train_loss": -27.275699615478516, "global_step": 481699, "epoch": 5803} {"train_loss": -27.267414093017578, "global_step": 481700, "epoch": 5803} {"train_loss": -27.366682052612305, "global_step": 481701, "epoch": 5803} {"train_loss": -27.36250114440918, "global_step": 481702, "epoch": 5803} {"train_loss": -27.38869285583496, "global_step": 481703, "epoch": 5803} {"train_loss": -27.19817543029785, "global_step": 481704, "epoch": 5803} {"train_loss": -27.255456924438477, "global_step": 481705, "epoch": 5803} {"train_loss": -26.928647994995117, "global_step": 481706, "epoch": 5803} {"train_loss": -27.549219131469727, "global_step": 481707, "epoch": 5803} {"train_loss": -27.052148818969727, "global_step": 481708, "epoch": 5803} {"train_loss": -27.426239013671875, "global_step": 481709, "epoch": 5803} {"train_loss": -27.09592628479004, "global_step": 481710, "epoch": 5803} {"train_loss": -27.614110946655273, "global_step": 481711, "epoch": 5803} {"train_loss": -27.1220760345459, "global_step": 481712, "epoch": 5803} {"train_loss": -27.241811752319336, "global_step": 481713, "epoch": 5803} {"train_loss": -27.20045280456543, "global_step": 481714, "epoch": 5803} {"train_loss": -27.1412410736084, "global_step": 481715, "epoch": 5803} {"train_loss": -27.188400268554688, "global_step": 481716, "epoch": 5803} {"train_loss": -27.15296745300293, "global_step": 481717, "epoch": 5803} {"train_loss": -27.165327072143555, "global_step": 481718, "epoch": 5803} {"train_loss": -26.964200973510742, "global_step": 481719, "epoch": 5803} {"train_loss": -27.580902099609375, "global_step": 481720, "epoch": 5803} {"train_loss": -27.2457332611084, "global_step": 481721, "epoch": 5803} {"train_loss": -27.175342559814453, "global_step": 481722, "epoch": 5803} {"train_loss": -27.607702255249023, "global_step": 481723, "epoch": 5803} {"train_loss": -27.164966583251953, "global_step": 481724, "epoch": 5803} {"train_loss": -27.317459106445312, "global_step": 481725, "epoch": 5803} {"train_loss": -27.470544815063477, "global_step": 481726, "epoch": 5803} {"train_loss": -26.983264923095703, "global_step": 481727, "epoch": 5803} {"train_loss": -27.213468551635742, "global_step": 481728, "epoch": 5803} {"train_loss": -27.091644287109375, "global_step": 481729, "epoch": 5803} {"train_loss": -27.41986656188965, "global_step": 481730, "epoch": 5803} {"train_loss": -27.198217231107044, "global_step": 481731, "epoch": 5803, "val_loss": 6627798.0} {"train_loss": -26.566137313842773, "global_step": 481732, "epoch": 5804} {"train_loss": -26.597869873046875, "global_step": 481733, "epoch": 5804} {"train_loss": -26.710798263549805, "global_step": 481734, "epoch": 5804} {"train_loss": -26.90846061706543, "global_step": 481735, "epoch": 5804} {"train_loss": -26.67389488220215, "global_step": 481736, "epoch": 5804} {"train_loss": -26.181955337524414, "global_step": 481737, "epoch": 5804} {"train_loss": -27.056640625, "global_step": 481738, "epoch": 5804} {"train_loss": -26.980627059936523, "global_step": 481739, "epoch": 5804} {"train_loss": -26.641998291015625, "global_step": 481740, "epoch": 5804} {"train_loss": -26.45692253112793, "global_step": 481741, "epoch": 5804} {"train_loss": -26.450345993041992, "global_step": 481742, "epoch": 5804} {"train_loss": -26.619009017944336, "global_step": 481743, "epoch": 5804} {"train_loss": -26.780399322509766, "global_step": 481744, "epoch": 5804} {"train_loss": -27.1641902923584, "global_step": 481745, "epoch": 5804} {"train_loss": -26.58570671081543, "global_step": 481746, "epoch": 5804} {"train_loss": -26.967382431030273, "global_step": 481747, "epoch": 5804} {"train_loss": -26.748321533203125, "global_step": 481748, "epoch": 5804} {"train_loss": -27.023412704467773, "global_step": 481749, "epoch": 5804} {"train_loss": -26.870527267456055, "global_step": 481750, "epoch": 5804} {"train_loss": -26.843921661376953, "global_step": 481751, "epoch": 5804} {"train_loss": -26.977197647094727, "global_step": 481752, "epoch": 5804} {"train_loss": -26.832406997680664, "global_step": 481753, "epoch": 5804} {"train_loss": -27.222768783569336, "global_step": 481754, "epoch": 5804} {"train_loss": -27.30869483947754, "global_step": 481755, "epoch": 5804} {"train_loss": -27.19319725036621, "global_step": 481756, "epoch": 5804} {"train_loss": -26.7509708404541, "global_step": 481757, "epoch": 5804} {"train_loss": -27.4063720703125, "global_step": 481758, "epoch": 5804} {"train_loss": -27.256839752197266, "global_step": 481759, "epoch": 5804} {"train_loss": -27.26857566833496, "global_step": 481760, "epoch": 5804} {"train_loss": -27.229236602783203, "global_step": 481761, "epoch": 5804} {"train_loss": -26.94292640686035, "global_step": 481762, "epoch": 5804} {"train_loss": -27.054004669189453, "global_step": 481763, "epoch": 5804} {"train_loss": -27.4278621673584, "global_step": 481764, "epoch": 5804} {"train_loss": -27.134296417236328, "global_step": 481765, "epoch": 5804} {"train_loss": -27.28326988220215, "global_step": 481766, "epoch": 5804} {"train_loss": -27.623676300048828, "global_step": 481767, "epoch": 5804} {"train_loss": -26.918201446533203, "global_step": 481768, "epoch": 5804} {"train_loss": -27.267087936401367, "global_step": 481769, "epoch": 5804} {"train_loss": -26.96868324279785, "global_step": 481770, "epoch": 5804} {"train_loss": -27.37483024597168, "global_step": 481771, "epoch": 5804} {"train_loss": -26.994903564453125, "global_step": 481772, "epoch": 5804} {"train_loss": -27.354883193969727, "global_step": 481773, "epoch": 5804} {"train_loss": -27.556432723999023, "global_step": 481774, "epoch": 5804} {"train_loss": -27.411054611206055, "global_step": 481775, "epoch": 5804} {"train_loss": -27.32598304748535, "global_step": 481776, "epoch": 5804} {"train_loss": -27.2094669342041, "global_step": 481777, "epoch": 5804} {"train_loss": -27.280481338500977, "global_step": 481778, "epoch": 5804} {"train_loss": -27.54176139831543, "global_step": 481779, "epoch": 5804} {"train_loss": -27.397085189819336, "global_step": 481780, "epoch": 5804} {"train_loss": -27.311532974243164, "global_step": 481781, "epoch": 5804} {"train_loss": -27.552143096923828, "global_step": 481782, "epoch": 5804} {"train_loss": -27.380203247070312, "global_step": 481783, "epoch": 5804} {"train_loss": -27.588623046875, "global_step": 481784, "epoch": 5804} {"train_loss": -27.54703712463379, "global_step": 481785, "epoch": 5804} {"train_loss": -27.33363914489746, "global_step": 481786, "epoch": 5804} {"train_loss": -27.863128662109375, "global_step": 481787, "epoch": 5804} {"train_loss": -27.399566650390625, "global_step": 481788, "epoch": 5804} {"train_loss": -27.543127059936523, "global_step": 481789, "epoch": 5804} {"train_loss": -27.522857666015625, "global_step": 481790, "epoch": 5804} {"train_loss": -27.232318878173828, "global_step": 481791, "epoch": 5804} {"train_loss": -27.41456413269043, "global_step": 481792, "epoch": 5804} {"train_loss": -27.370229721069336, "global_step": 481793, "epoch": 5804} {"train_loss": -27.50152015686035, "global_step": 481794, "epoch": 5804} {"train_loss": -27.059064865112305, "global_step": 481795, "epoch": 5804} {"train_loss": -27.52280044555664, "global_step": 481796, "epoch": 5804} {"train_loss": -27.592016220092773, "global_step": 481797, "epoch": 5804} {"train_loss": -27.32520866394043, "global_step": 481798, "epoch": 5804} {"train_loss": -27.406421661376953, "global_step": 481799, "epoch": 5804} {"train_loss": -27.560277938842773, "global_step": 481800, "epoch": 5804} {"train_loss": -27.147064208984375, "global_step": 481801, "epoch": 5804} {"train_loss": -27.688199996948242, "global_step": 481802, "epoch": 5804} {"train_loss": -27.308069229125977, "global_step": 481803, "epoch": 5804} {"train_loss": -27.45338249206543, "global_step": 481804, "epoch": 5804} {"train_loss": -27.11294937133789, "global_step": 481805, "epoch": 5804} {"train_loss": -27.367095947265625, "global_step": 481806, "epoch": 5804} {"train_loss": -27.341556549072266, "global_step": 481807, "epoch": 5804} {"train_loss": -27.623254776000977, "global_step": 481808, "epoch": 5804} {"train_loss": -27.26262855529785, "global_step": 481809, "epoch": 5804} {"train_loss": -27.149280548095703, "global_step": 481810, "epoch": 5804} {"train_loss": -27.111906051635742, "global_step": 481811, "epoch": 5804} {"train_loss": -27.383020401000977, "global_step": 481812, "epoch": 5804} {"train_loss": -27.424238204956055, "global_step": 481813, "epoch": 5804} {"train_loss": -27.197557058679052, "global_step": 481814, "epoch": 5804, "val_loss": 6610326.0} {"train_loss": -26.98444175720215, "global_step": 481815, "epoch": 5805} {"train_loss": -26.699024200439453, "global_step": 481816, "epoch": 5805} {"train_loss": -26.86646842956543, "global_step": 481817, "epoch": 5805} {"train_loss": -26.911657333374023, "global_step": 481818, "epoch": 5805} {"train_loss": -26.7659912109375, "global_step": 481819, "epoch": 5805} {"train_loss": -26.723346710205078, "global_step": 481820, "epoch": 5805} {"train_loss": -27.12575340270996, "global_step": 481821, "epoch": 5805} {"train_loss": -26.601215362548828, "global_step": 481822, "epoch": 5805} {"train_loss": -27.12232780456543, "global_step": 481823, "epoch": 5805} {"train_loss": -26.816938400268555, "global_step": 481824, "epoch": 5805} {"train_loss": -26.94600486755371, "global_step": 481825, "epoch": 5805} {"train_loss": -26.753149032592773, "global_step": 481826, "epoch": 5805} {"train_loss": -27.0506534576416, "global_step": 481827, "epoch": 5805} {"train_loss": -26.971942901611328, "global_step": 481828, "epoch": 5805} {"train_loss": -26.839649200439453, "global_step": 481829, "epoch": 5805} {"train_loss": -27.0992374420166, "global_step": 481830, "epoch": 5805} {"train_loss": -26.847692489624023, "global_step": 481831, "epoch": 5805} {"train_loss": -27.480581283569336, "global_step": 481832, "epoch": 5805} {"train_loss": -26.76393699645996, "global_step": 481833, "epoch": 5805} {"train_loss": -27.318408966064453, "global_step": 481834, "epoch": 5805} {"train_loss": -27.27137565612793, "global_step": 481835, "epoch": 5805} {"train_loss": -27.3544864654541, "global_step": 481836, "epoch": 5805} {"train_loss": -27.35162353515625, "global_step": 481837, "epoch": 5805} {"train_loss": -27.564044952392578, "global_step": 481838, "epoch": 5805} {"train_loss": -27.628494262695312, "global_step": 481839, "epoch": 5805} {"train_loss": -26.991865158081055, "global_step": 481840, "epoch": 5805} {"train_loss": -27.28094482421875, "global_step": 481841, "epoch": 5805} {"train_loss": -27.25282096862793, "global_step": 481842, "epoch": 5805} {"train_loss": -27.35310173034668, "global_step": 481843, "epoch": 5805} {"train_loss": -27.0430965423584, "global_step": 481844, "epoch": 5805} {"train_loss": -26.8718318939209, "global_step": 481845, "epoch": 5805} {"train_loss": -27.20444679260254, "global_step": 481846, "epoch": 5805} {"train_loss": -27.097997665405273, "global_step": 481847, "epoch": 5805} {"train_loss": -27.30816078186035, "global_step": 481848, "epoch": 5805} {"train_loss": -27.166112899780273, "global_step": 481849, "epoch": 5805} {"train_loss": -27.69180679321289, "global_step": 481850, "epoch": 5805} {"train_loss": -27.0665283203125, "global_step": 481851, "epoch": 5805} {"train_loss": -27.452489852905273, "global_step": 481852, "epoch": 5805} {"train_loss": -27.5156307220459, "global_step": 481853, "epoch": 5805} {"train_loss": -27.396697998046875, "global_step": 481854, "epoch": 5805} {"train_loss": -26.954299926757812, "global_step": 481855, "epoch": 5805} {"train_loss": -27.384973526000977, "global_step": 481856, "epoch": 5805} {"train_loss": -27.62544059753418, "global_step": 481857, "epoch": 5805} {"train_loss": -27.38482093811035, "global_step": 481858, "epoch": 5805} {"train_loss": -27.384063720703125, "global_step": 481859, "epoch": 5805} {"train_loss": -27.730670928955078, "global_step": 481860, "epoch": 5805} {"train_loss": -27.210336685180664, "global_step": 481861, "epoch": 5805} {"train_loss": -27.320539474487305, "global_step": 481862, "epoch": 5805} {"train_loss": -27.597064971923828, "global_step": 481863, "epoch": 5805} {"train_loss": -27.494653701782227, "global_step": 481864, "epoch": 5805} {"train_loss": -27.517690658569336, "global_step": 481865, "epoch": 5805} {"train_loss": -27.29180335998535, "global_step": 481866, "epoch": 5805} {"train_loss": -27.525236129760742, "global_step": 481867, "epoch": 5805} {"train_loss": -27.364837646484375, "global_step": 481868, "epoch": 5805} {"train_loss": -27.67901611328125, "global_step": 481869, "epoch": 5805} {"train_loss": -27.27605628967285, "global_step": 481870, "epoch": 5805} {"train_loss": -27.5334529876709, "global_step": 481871, "epoch": 5805} {"train_loss": -27.49309730529785, "global_step": 481872, "epoch": 5805} {"train_loss": -27.622663497924805, "global_step": 481873, "epoch": 5805} {"train_loss": -27.213342666625977, "global_step": 481874, "epoch": 5805} {"train_loss": -27.54789161682129, "global_step": 481875, "epoch": 5805} {"train_loss": -27.363859176635742, "global_step": 481876, "epoch": 5805} {"train_loss": -27.36519432067871, "global_step": 481877, "epoch": 5805} {"train_loss": -27.06813621520996, "global_step": 481878, "epoch": 5805} {"train_loss": -26.967575073242188, "global_step": 481879, "epoch": 5805} {"train_loss": -27.489032745361328, "global_step": 481880, "epoch": 5805} {"train_loss": -27.690515518188477, "global_step": 481881, "epoch": 5805} {"train_loss": -27.52776527404785, "global_step": 481882, "epoch": 5805} {"train_loss": -27.278980255126953, "global_step": 481883, "epoch": 5805} {"train_loss": -26.883031845092773, "global_step": 481884, "epoch": 5805} {"train_loss": -27.284799575805664, "global_step": 481885, "epoch": 5805} {"train_loss": -27.270954132080078, "global_step": 481886, "epoch": 5805} {"train_loss": -27.459884643554688, "global_step": 481887, "epoch": 5805} {"train_loss": -27.553424835205078, "global_step": 481888, "epoch": 5805} {"train_loss": -27.147058486938477, "global_step": 481889, "epoch": 5805} {"train_loss": -27.486570358276367, "global_step": 481890, "epoch": 5805} {"train_loss": -27.445560455322266, "global_step": 481891, "epoch": 5805} {"train_loss": -27.371936798095703, "global_step": 481892, "epoch": 5805} {"train_loss": -27.190481185913086, "global_step": 481893, "epoch": 5805} {"train_loss": -27.312402725219727, "global_step": 481894, "epoch": 5805} {"train_loss": -27.179601669311523, "global_step": 481895, "epoch": 5805} {"train_loss": -27.336933135986328, "global_step": 481896, "epoch": 5805} {"train_loss": -27.247176825282086, "global_step": 481897, "epoch": 5805, "val_loss": 6654973.0} {"train_loss": -25.194276809692383, "global_step": 481898, "epoch": 5806} {"train_loss": -24.88240623474121, "global_step": 481899, "epoch": 5806} {"train_loss": -24.67148780822754, "global_step": 481900, "epoch": 5806} {"train_loss": -24.343042373657227, "global_step": 481901, "epoch": 5806} {"train_loss": -25.58428955078125, "global_step": 481902, "epoch": 5806} {"train_loss": -25.157577514648438, "global_step": 481903, "epoch": 5806} {"train_loss": -25.9290828704834, "global_step": 481904, "epoch": 5806} {"train_loss": -25.130022048950195, "global_step": 481905, "epoch": 5806} {"train_loss": -25.775634765625, "global_step": 481906, "epoch": 5806} {"train_loss": -25.739521026611328, "global_step": 481907, "epoch": 5806} {"train_loss": -25.658248901367188, "global_step": 481908, "epoch": 5806} {"train_loss": -25.640457153320312, "global_step": 481909, "epoch": 5806} {"train_loss": -25.95444107055664, "global_step": 481910, "epoch": 5806} {"train_loss": -26.044843673706055, "global_step": 481911, "epoch": 5806} {"train_loss": -26.030729293823242, "global_step": 481912, "epoch": 5806} {"train_loss": -25.882495880126953, "global_step": 481913, "epoch": 5806} {"train_loss": -26.438962936401367, "global_step": 481914, "epoch": 5806} {"train_loss": -26.034345626831055, "global_step": 481915, "epoch": 5806} {"train_loss": -26.339344024658203, "global_step": 481916, "epoch": 5806} {"train_loss": -25.912988662719727, "global_step": 481917, "epoch": 5806} {"train_loss": -26.440526962280273, "global_step": 481918, "epoch": 5806} {"train_loss": -26.3826961517334, "global_step": 481919, "epoch": 5806} {"train_loss": -26.31537437438965, "global_step": 481920, "epoch": 5806} {"train_loss": -26.362045288085938, "global_step": 481921, "epoch": 5806} {"train_loss": -26.78118896484375, "global_step": 481922, "epoch": 5806} {"train_loss": -26.41455078125, "global_step": 481923, "epoch": 5806} {"train_loss": -26.451780319213867, "global_step": 481924, "epoch": 5806} {"train_loss": -26.849166870117188, "global_step": 481925, "epoch": 5806} {"train_loss": -26.5728702545166, "global_step": 481926, "epoch": 5806} {"train_loss": -26.728164672851562, "global_step": 481927, "epoch": 5806} {"train_loss": -26.81952476501465, "global_step": 481928, "epoch": 5806} {"train_loss": -26.836889266967773, "global_step": 481929, "epoch": 5806} {"train_loss": -26.536481857299805, "global_step": 481930, "epoch": 5806} {"train_loss": -27.027393341064453, "global_step": 481931, "epoch": 5806} {"train_loss": -27.0223445892334, "global_step": 481932, "epoch": 5806} {"train_loss": -26.934751510620117, "global_step": 481933, "epoch": 5806} {"train_loss": -26.922531127929688, "global_step": 481934, "epoch": 5806} {"train_loss": -26.85467529296875, "global_step": 481935, "epoch": 5806} {"train_loss": -26.944433212280273, "global_step": 481936, "epoch": 5806} {"train_loss": -27.11578941345215, "global_step": 481937, "epoch": 5806} {"train_loss": -27.28423500061035, "global_step": 481938, "epoch": 5806} {"train_loss": -27.276540756225586, "global_step": 481939, "epoch": 5806} {"train_loss": -27.246923446655273, "global_step": 481940, "epoch": 5806} {"train_loss": -26.877731323242188, "global_step": 481941, "epoch": 5806} {"train_loss": -27.223438262939453, "global_step": 481942, "epoch": 5806} {"train_loss": -27.151321411132812, "global_step": 481943, "epoch": 5806} {"train_loss": -27.72242546081543, "global_step": 481944, "epoch": 5806} {"train_loss": -27.312219619750977, "global_step": 481945, "epoch": 5806} {"train_loss": -27.010435104370117, "global_step": 481946, "epoch": 5806} {"train_loss": -27.444366455078125, "global_step": 481947, "epoch": 5806} {"train_loss": -26.80938720703125, "global_step": 481948, "epoch": 5806} {"train_loss": -26.882471084594727, "global_step": 481949, "epoch": 5806} {"train_loss": -27.32956886291504, "global_step": 481950, "epoch": 5806} {"train_loss": -27.00125503540039, "global_step": 481951, "epoch": 5806} {"train_loss": -27.566425323486328, "global_step": 481952, "epoch": 5806} {"train_loss": -27.045774459838867, "global_step": 481953, "epoch": 5806} {"train_loss": -27.1326904296875, "global_step": 481954, "epoch": 5806} {"train_loss": -27.363754272460938, "global_step": 481955, "epoch": 5806} {"train_loss": -27.5029296875, "global_step": 481956, "epoch": 5806} {"train_loss": -27.388248443603516, "global_step": 481957, "epoch": 5806} {"train_loss": -27.0074462890625, "global_step": 481958, "epoch": 5806} {"train_loss": -27.239364624023438, "global_step": 481959, "epoch": 5806} {"train_loss": -27.274744033813477, "global_step": 481960, "epoch": 5806} {"train_loss": -27.147235870361328, "global_step": 481961, "epoch": 5806} {"train_loss": -27.45929527282715, "global_step": 481962, "epoch": 5806} {"train_loss": -27.032489776611328, "global_step": 481963, "epoch": 5806} {"train_loss": -27.1485652923584, "global_step": 481964, "epoch": 5806} {"train_loss": -27.110647201538086, "global_step": 481965, "epoch": 5806} {"train_loss": -27.017364501953125, "global_step": 481966, "epoch": 5806} {"train_loss": -27.6987247467041, "global_step": 481967, "epoch": 5806} {"train_loss": -27.201623916625977, "global_step": 481968, "epoch": 5806} {"train_loss": -27.406042098999023, "global_step": 481969, "epoch": 5806} {"train_loss": -27.664508819580078, "global_step": 481970, "epoch": 5806} {"train_loss": -27.577802658081055, "global_step": 481971, "epoch": 5806} {"train_loss": -27.44626235961914, "global_step": 481972, "epoch": 5806} {"train_loss": -27.563825607299805, "global_step": 481973, "epoch": 5806} {"train_loss": -27.653385162353516, "global_step": 481974, "epoch": 5806} {"train_loss": -27.13789176940918, "global_step": 481975, "epoch": 5806} {"train_loss": -27.359411239624023, "global_step": 481976, "epoch": 5806} {"train_loss": -27.605804443359375, "global_step": 481977, "epoch": 5806} {"train_loss": -27.4609317779541, "global_step": 481978, "epoch": 5806} {"train_loss": -27.396240234375, "global_step": 481979, "epoch": 5806} {"train_loss": -26.755764765911792, "global_step": 481980, "epoch": 5806, "val_loss": 6581034.5} {"train_loss": -26.440113067626953, "global_step": 481981, "epoch": 5807} {"train_loss": -26.706892013549805, "global_step": 481982, "epoch": 5807} {"train_loss": -26.907474517822266, "global_step": 481983, "epoch": 5807} {"train_loss": -27.295001983642578, "global_step": 481984, "epoch": 5807} {"train_loss": -26.520273208618164, "global_step": 481985, "epoch": 5807} {"train_loss": -26.690078735351562, "global_step": 481986, "epoch": 5807} {"train_loss": -26.791473388671875, "global_step": 481987, "epoch": 5807} {"train_loss": -26.209613800048828, "global_step": 481988, "epoch": 5807} {"train_loss": -26.870512008666992, "global_step": 481989, "epoch": 5807} {"train_loss": -26.769062042236328, "global_step": 481990, "epoch": 5807} {"train_loss": -26.382495880126953, "global_step": 481991, "epoch": 5807} {"train_loss": -26.73367691040039, "global_step": 481992, "epoch": 5807} {"train_loss": -26.450353622436523, "global_step": 481993, "epoch": 5807} {"train_loss": -26.9102783203125, "global_step": 481994, "epoch": 5807} {"train_loss": -26.75198745727539, "global_step": 481995, "epoch": 5807} {"train_loss": -26.99053382873535, "global_step": 481996, "epoch": 5807} {"train_loss": -26.61798667907715, "global_step": 481997, "epoch": 5807} {"train_loss": -27.049835205078125, "global_step": 481998, "epoch": 5807} {"train_loss": -26.9642333984375, "global_step": 481999, "epoch": 5807} {"train_loss": -27.02808952331543, "global_step": 482000, "epoch": 5807} {"train_loss": -27.212390899658203, "global_step": 482001, "epoch": 5807} {"train_loss": -26.928455352783203, "global_step": 482002, "epoch": 5807} {"train_loss": -27.30887222290039, "global_step": 482003, "epoch": 5807} {"train_loss": -27.1117000579834, "global_step": 482004, "epoch": 5807} {"train_loss": -27.471296310424805, "global_step": 482005, "epoch": 5807} {"train_loss": -27.129804611206055, "global_step": 482006, "epoch": 5807} {"train_loss": -27.395116806030273, "global_step": 482007, "epoch": 5807} {"train_loss": -26.883092880249023, "global_step": 482008, "epoch": 5807} {"train_loss": -27.186819076538086, "global_step": 482009, "epoch": 5807} {"train_loss": -27.42104148864746, "global_step": 482010, "epoch": 5807} {"train_loss": -27.29656410217285, "global_step": 482011, "epoch": 5807} {"train_loss": -27.42548942565918, "global_step": 482012, "epoch": 5807} {"train_loss": -27.53481101989746, "global_step": 482013, "epoch": 5807} {"train_loss": -27.280445098876953, "global_step": 482014, "epoch": 5807} {"train_loss": -27.35906410217285, "global_step": 482015, "epoch": 5807} {"train_loss": -27.2633056640625, "global_step": 482016, "epoch": 5807} {"train_loss": -27.0246639251709, "global_step": 482017, "epoch": 5807} {"train_loss": -27.126386642456055, "global_step": 482018, "epoch": 5807} {"train_loss": -27.434350967407227, "global_step": 482019, "epoch": 5807} {"train_loss": -27.190155029296875, "global_step": 482020, "epoch": 5807} {"train_loss": -27.788928985595703, "global_step": 482021, "epoch": 5807} {"train_loss": -27.4132137298584, "global_step": 482022, "epoch": 5807} {"train_loss": -27.18048667907715, "global_step": 482023, "epoch": 5807} {"train_loss": -27.562726974487305, "global_step": 482024, "epoch": 5807} {"train_loss": -27.104736328125, "global_step": 482025, "epoch": 5807} {"train_loss": -26.950735092163086, "global_step": 482026, "epoch": 5807} {"train_loss": -27.470901489257812, "global_step": 482027, "epoch": 5807} {"train_loss": -27.577545166015625, "global_step": 482028, "epoch": 5807} {"train_loss": -27.07401466369629, "global_step": 482029, "epoch": 5807} {"train_loss": -27.257251739501953, "global_step": 482030, "epoch": 5807} {"train_loss": -27.4064884185791, "global_step": 482031, "epoch": 5807} {"train_loss": -26.954883575439453, "global_step": 482032, "epoch": 5807} {"train_loss": -27.359689712524414, "global_step": 482033, "epoch": 5807} {"train_loss": -27.240936279296875, "global_step": 482034, "epoch": 5807} {"train_loss": -27.67219352722168, "global_step": 482035, "epoch": 5807} {"train_loss": -27.188451766967773, "global_step": 482036, "epoch": 5807} {"train_loss": -27.13020133972168, "global_step": 482037, "epoch": 5807} {"train_loss": -27.528974533081055, "global_step": 482038, "epoch": 5807} {"train_loss": -27.230152130126953, "global_step": 482039, "epoch": 5807} {"train_loss": -26.93096351623535, "global_step": 482040, "epoch": 5807} {"train_loss": -26.861011505126953, "global_step": 482041, "epoch": 5807} {"train_loss": -27.081872940063477, "global_step": 482042, "epoch": 5807} {"train_loss": -26.827978134155273, "global_step": 482043, "epoch": 5807} {"train_loss": -27.056381225585938, "global_step": 482044, "epoch": 5807} {"train_loss": -27.046127319335938, "global_step": 482045, "epoch": 5807} {"train_loss": -27.199359893798828, "global_step": 482046, "epoch": 5807} {"train_loss": -27.276548385620117, "global_step": 482047, "epoch": 5807} {"train_loss": -27.225372314453125, "global_step": 482048, "epoch": 5807} {"train_loss": -27.142553329467773, "global_step": 482049, "epoch": 5807} {"train_loss": -27.513168334960938, "global_step": 482050, "epoch": 5807} {"train_loss": -27.674793243408203, "global_step": 482051, "epoch": 5807} {"train_loss": -26.836074829101562, "global_step": 482052, "epoch": 5807} {"train_loss": -27.052488327026367, "global_step": 482053, "epoch": 5807} {"train_loss": -27.2420597076416, "global_step": 482054, "epoch": 5807} {"train_loss": -26.576709747314453, "global_step": 482055, "epoch": 5807} {"train_loss": -27.413742065429688, "global_step": 482056, "epoch": 5807} {"train_loss": -26.897241592407227, "global_step": 482057, "epoch": 5807} {"train_loss": -27.06081199645996, "global_step": 482058, "epoch": 5807} {"train_loss": -26.909337997436523, "global_step": 482059, "epoch": 5807} {"train_loss": -27.110193252563477, "global_step": 482060, "epoch": 5807} {"train_loss": -27.21599769592285, "global_step": 482061, "epoch": 5807} {"train_loss": -26.794342041015625, "global_step": 482062, "epoch": 5807} {"train_loss": -27.085691383086054, "global_step": 482063, "epoch": 5807, "val_loss": 6593712.0} {"train_loss": -26.82036781311035, "global_step": 482064, "epoch": 5808} {"train_loss": -26.666467666625977, "global_step": 482065, "epoch": 5808} {"train_loss": -26.840621948242188, "global_step": 482066, "epoch": 5808} {"train_loss": -26.895505905151367, "global_step": 482067, "epoch": 5808} {"train_loss": -26.565704345703125, "global_step": 482068, "epoch": 5808} {"train_loss": -27.041845321655273, "global_step": 482069, "epoch": 5808} {"train_loss": -27.009695053100586, "global_step": 482070, "epoch": 5808} {"train_loss": -27.229658126831055, "global_step": 482071, "epoch": 5808} {"train_loss": -26.93458366394043, "global_step": 482072, "epoch": 5808} {"train_loss": -27.290252685546875, "global_step": 482073, "epoch": 5808} {"train_loss": -27.390771865844727, "global_step": 482074, "epoch": 5808} {"train_loss": -27.22601318359375, "global_step": 482075, "epoch": 5808} {"train_loss": -27.473905563354492, "global_step": 482076, "epoch": 5808} {"train_loss": -27.282175064086914, "global_step": 482077, "epoch": 5808} {"train_loss": -27.137327194213867, "global_step": 482078, "epoch": 5808} {"train_loss": -27.399356842041016, "global_step": 482079, "epoch": 5808} {"train_loss": -27.2285213470459, "global_step": 482080, "epoch": 5808} {"train_loss": -27.304187774658203, "global_step": 482081, "epoch": 5808} {"train_loss": -27.315799713134766, "global_step": 482082, "epoch": 5808} {"train_loss": -27.26954460144043, "global_step": 482083, "epoch": 5808} {"train_loss": -27.111501693725586, "global_step": 482084, "epoch": 5808} {"train_loss": -27.191211700439453, "global_step": 482085, "epoch": 5808} {"train_loss": -27.172958374023438, "global_step": 482086, "epoch": 5808} {"train_loss": -26.91143798828125, "global_step": 482087, "epoch": 5808} {"train_loss": -26.827442169189453, "global_step": 482088, "epoch": 5808} {"train_loss": -27.2121524810791, "global_step": 482089, "epoch": 5808} {"train_loss": -27.090734481811523, "global_step": 482090, "epoch": 5808} {"train_loss": -27.12959098815918, "global_step": 482091, "epoch": 5808} {"train_loss": -26.845754623413086, "global_step": 482092, "epoch": 5808} {"train_loss": -27.028669357299805, "global_step": 482093, "epoch": 5808} {"train_loss": -27.78619384765625, "global_step": 482094, "epoch": 5808} {"train_loss": -27.429489135742188, "global_step": 482095, "epoch": 5808} {"train_loss": -27.185260772705078, "global_step": 482096, "epoch": 5808} {"train_loss": -27.076908111572266, "global_step": 482097, "epoch": 5808} {"train_loss": -27.07364273071289, "global_step": 482098, "epoch": 5808} {"train_loss": -26.96750259399414, "global_step": 482099, "epoch": 5808} {"train_loss": -27.672399520874023, "global_step": 482100, "epoch": 5808} {"train_loss": -27.286306381225586, "global_step": 482101, "epoch": 5808} {"train_loss": -27.1635799407959, "global_step": 482102, "epoch": 5808} {"train_loss": -27.384817123413086, "global_step": 482103, "epoch": 5808} {"train_loss": -27.4351806640625, "global_step": 482104, "epoch": 5808} {"train_loss": -27.767322540283203, "global_step": 482105, "epoch": 5808} {"train_loss": -27.162094116210938, "global_step": 482106, "epoch": 5808} {"train_loss": -27.2333927154541, "global_step": 482107, "epoch": 5808} {"train_loss": -27.49469566345215, "global_step": 482108, "epoch": 5808} {"train_loss": -27.465778350830078, "global_step": 482109, "epoch": 5808} {"train_loss": -27.797407150268555, "global_step": 482110, "epoch": 5808} {"train_loss": -27.109039306640625, "global_step": 482111, "epoch": 5808} {"train_loss": -27.18521499633789, "global_step": 482112, "epoch": 5808} {"train_loss": -27.33432960510254, "global_step": 482113, "epoch": 5808} {"train_loss": -27.31538200378418, "global_step": 482114, "epoch": 5808} {"train_loss": -27.019189834594727, "global_step": 482115, "epoch": 5808} {"train_loss": -27.53204345703125, "global_step": 482116, "epoch": 5808} {"train_loss": -26.996936798095703, "global_step": 482117, "epoch": 5808} {"train_loss": -27.030920028686523, "global_step": 482118, "epoch": 5808} {"train_loss": -27.156835556030273, "global_step": 482119, "epoch": 5808} {"train_loss": -26.963464736938477, "global_step": 482120, "epoch": 5808} {"train_loss": -27.656070709228516, "global_step": 482121, "epoch": 5808} {"train_loss": -27.29082679748535, "global_step": 482122, "epoch": 5808} {"train_loss": -27.449832916259766, "global_step": 482123, "epoch": 5808} {"train_loss": -27.783954620361328, "global_step": 482124, "epoch": 5808} {"train_loss": -27.373987197875977, "global_step": 482125, "epoch": 5808} {"train_loss": -27.572967529296875, "global_step": 482126, "epoch": 5808} {"train_loss": -27.49750328063965, "global_step": 482127, "epoch": 5808} {"train_loss": -27.267324447631836, "global_step": 482128, "epoch": 5808} {"train_loss": -27.543079376220703, "global_step": 482129, "epoch": 5808} {"train_loss": -27.192615509033203, "global_step": 482130, "epoch": 5808} {"train_loss": -27.152435302734375, "global_step": 482131, "epoch": 5808} {"train_loss": -27.123336791992188, "global_step": 482132, "epoch": 5808} {"train_loss": -26.618244171142578, "global_step": 482133, "epoch": 5808} {"train_loss": -26.72941017150879, "global_step": 482134, "epoch": 5808} {"train_loss": -27.068527221679688, "global_step": 482135, "epoch": 5808} {"train_loss": -27.2756290435791, "global_step": 482136, "epoch": 5808} {"train_loss": -27.3375301361084, "global_step": 482137, "epoch": 5808} {"train_loss": -26.70184898376465, "global_step": 482138, "epoch": 5808} {"train_loss": -26.92555809020996, "global_step": 482139, "epoch": 5808} {"train_loss": -26.852094650268555, "global_step": 482140, "epoch": 5808} {"train_loss": -27.3544979095459, "global_step": 482141, "epoch": 5808} {"train_loss": -27.278766632080078, "global_step": 482142, "epoch": 5808} {"train_loss": -27.2496280670166, "global_step": 482143, "epoch": 5808} {"train_loss": -27.38671875, "global_step": 482144, "epoch": 5808} {"train_loss": -27.397003173828125, "global_step": 482145, "epoch": 5808} {"train_loss": -27.208799821784698, "global_step": 482146, "epoch": 5808, "val_loss": 6571798.0} {"train_loss": -27.1478328704834, "global_step": 482147, "epoch": 5809} {"train_loss": -27.09950828552246, "global_step": 482148, "epoch": 5809} {"train_loss": -26.644901275634766, "global_step": 482149, "epoch": 5809} {"train_loss": -27.377084732055664, "global_step": 482150, "epoch": 5809} {"train_loss": -27.051258087158203, "global_step": 482151, "epoch": 5809} {"train_loss": -27.136682510375977, "global_step": 482152, "epoch": 5809} {"train_loss": -26.95973014831543, "global_step": 482153, "epoch": 5809} {"train_loss": -27.371234893798828, "global_step": 482154, "epoch": 5809} {"train_loss": -27.19845962524414, "global_step": 482155, "epoch": 5809} {"train_loss": -26.96876335144043, "global_step": 482156, "epoch": 5809} {"train_loss": -27.08094596862793, "global_step": 482157, "epoch": 5809} {"train_loss": -27.274267196655273, "global_step": 482158, "epoch": 5809} {"train_loss": -26.949899673461914, "global_step": 482159, "epoch": 5809} {"train_loss": -26.6944580078125, "global_step": 482160, "epoch": 5809} {"train_loss": -27.2126522064209, "global_step": 482161, "epoch": 5809} {"train_loss": -27.11505699157715, "global_step": 482162, "epoch": 5809} {"train_loss": -27.332483291625977, "global_step": 482163, "epoch": 5809} {"train_loss": -27.147022247314453, "global_step": 482164, "epoch": 5809} {"train_loss": -27.21192741394043, "global_step": 482165, "epoch": 5809} {"train_loss": -27.25775146484375, "global_step": 482166, "epoch": 5809} {"train_loss": -27.19806480407715, "global_step": 482167, "epoch": 5809} {"train_loss": -27.39180564880371, "global_step": 482168, "epoch": 5809} {"train_loss": -27.002466201782227, "global_step": 482169, "epoch": 5809} {"train_loss": -27.094852447509766, "global_step": 482170, "epoch": 5809} {"train_loss": -27.278913497924805, "global_step": 482171, "epoch": 5809} {"train_loss": -27.1412296295166, "global_step": 482172, "epoch": 5809} {"train_loss": -27.086301803588867, "global_step": 482173, "epoch": 5809} {"train_loss": -27.169240951538086, "global_step": 482174, "epoch": 5809} {"train_loss": -27.214752197265625, "global_step": 482175, "epoch": 5809} {"train_loss": -27.263132095336914, "global_step": 482176, "epoch": 5809} {"train_loss": -27.154592514038086, "global_step": 482177, "epoch": 5809} {"train_loss": -27.404605865478516, "global_step": 482178, "epoch": 5809} {"train_loss": -27.914142608642578, "global_step": 482179, "epoch": 5809} {"train_loss": -27.73223876953125, "global_step": 482180, "epoch": 5809} {"train_loss": -27.501256942749023, "global_step": 482181, "epoch": 5809} {"train_loss": -27.33259391784668, "global_step": 482182, "epoch": 5809} {"train_loss": -27.162811279296875, "global_step": 482183, "epoch": 5809} {"train_loss": -27.454666137695312, "global_step": 482184, "epoch": 5809} {"train_loss": -27.49252700805664, "global_step": 482185, "epoch": 5809} {"train_loss": -27.7745304107666, "global_step": 482186, "epoch": 5809} {"train_loss": -27.08437156677246, "global_step": 482187, "epoch": 5809} {"train_loss": -27.9440975189209, "global_step": 482188, "epoch": 5809} {"train_loss": -27.19677734375, "global_step": 482189, "epoch": 5809} {"train_loss": -26.793283462524414, "global_step": 482190, "epoch": 5809} {"train_loss": -27.057464599609375, "global_step": 482191, "epoch": 5809} {"train_loss": -27.105010986328125, "global_step": 482192, "epoch": 5809} {"train_loss": -27.0176944732666, "global_step": 482193, "epoch": 5809} {"train_loss": -27.165807723999023, "global_step": 482194, "epoch": 5809} {"train_loss": -27.110082626342773, "global_step": 482195, "epoch": 5809} {"train_loss": -26.860980987548828, "global_step": 482196, "epoch": 5809} {"train_loss": -27.166717529296875, "global_step": 482197, "epoch": 5809} {"train_loss": -27.122045516967773, "global_step": 482198, "epoch": 5809} {"train_loss": -27.3764591217041, "global_step": 482199, "epoch": 5809} {"train_loss": -27.103412628173828, "global_step": 482200, "epoch": 5809} {"train_loss": -27.205127716064453, "global_step": 482201, "epoch": 5809} {"train_loss": -27.27924919128418, "global_step": 482202, "epoch": 5809} {"train_loss": -27.168655395507812, "global_step": 482203, "epoch": 5809} {"train_loss": -27.563486099243164, "global_step": 482204, "epoch": 5809} {"train_loss": -27.300779342651367, "global_step": 482205, "epoch": 5809} {"train_loss": -27.07795524597168, "global_step": 482206, "epoch": 5809} {"train_loss": -27.463821411132812, "global_step": 482207, "epoch": 5809} {"train_loss": -27.61000633239746, "global_step": 482208, "epoch": 5809} {"train_loss": -27.18207359313965, "global_step": 482209, "epoch": 5809} {"train_loss": -27.1391658782959, "global_step": 482210, "epoch": 5809} {"train_loss": -27.085540771484375, "global_step": 482211, "epoch": 5809} {"train_loss": -27.208398818969727, "global_step": 482212, "epoch": 5809} {"train_loss": -27.455078125, "global_step": 482213, "epoch": 5809} {"train_loss": -27.493261337280273, "global_step": 482214, "epoch": 5809} {"train_loss": -27.433263778686523, "global_step": 482215, "epoch": 5809} {"train_loss": -27.398773193359375, "global_step": 482216, "epoch": 5809} {"train_loss": -27.688873291015625, "global_step": 482217, "epoch": 5809} {"train_loss": -27.48245620727539, "global_step": 482218, "epoch": 5809} {"train_loss": -27.368207931518555, "global_step": 482219, "epoch": 5809} {"train_loss": -27.40470314025879, "global_step": 482220, "epoch": 5809} {"train_loss": -26.915441513061523, "global_step": 482221, "epoch": 5809} {"train_loss": -27.56037712097168, "global_step": 482222, "epoch": 5809} {"train_loss": -27.334980010986328, "global_step": 482223, "epoch": 5809} {"train_loss": -27.261091232299805, "global_step": 482224, "epoch": 5809} {"train_loss": -27.338468551635742, "global_step": 482225, "epoch": 5809} {"train_loss": -27.37921142578125, "global_step": 482226, "epoch": 5809} {"train_loss": -27.438074111938477, "global_step": 482227, "epoch": 5809} {"train_loss": -27.229650497436523, "global_step": 482228, "epoch": 5809} {"train_loss": -27.26739026264972, "global_step": 482229, "epoch": 5809, "val_loss": 6672623.0} {"train_loss": -26.514739990234375, "global_step": 482230, "epoch": 5810} {"train_loss": -26.510446548461914, "global_step": 482231, "epoch": 5810} {"train_loss": -26.459579467773438, "global_step": 482232, "epoch": 5810} {"train_loss": -26.104108810424805, "global_step": 482233, "epoch": 5810} {"train_loss": -27.284381866455078, "global_step": 482234, "epoch": 5810} {"train_loss": -26.679706573486328, "global_step": 482235, "epoch": 5810} {"train_loss": -26.724628448486328, "global_step": 482236, "epoch": 5810} {"train_loss": -26.694936752319336, "global_step": 482237, "epoch": 5810} {"train_loss": -26.11248207092285, "global_step": 482238, "epoch": 5810} {"train_loss": -26.652515411376953, "global_step": 482239, "epoch": 5810} {"train_loss": -26.328405380249023, "global_step": 482240, "epoch": 5810} {"train_loss": -26.567474365234375, "global_step": 482241, "epoch": 5810} {"train_loss": -26.641462326049805, "global_step": 482242, "epoch": 5810} {"train_loss": -26.832178115844727, "global_step": 482243, "epoch": 5810} {"train_loss": -26.59278678894043, "global_step": 482244, "epoch": 5810} {"train_loss": -26.48798942565918, "global_step": 482245, "epoch": 5810} {"train_loss": -26.7738037109375, "global_step": 482246, "epoch": 5810} {"train_loss": -26.74955177307129, "global_step": 482247, "epoch": 5810} {"train_loss": -27.258893966674805, "global_step": 482248, "epoch": 5810} {"train_loss": -26.819555282592773, "global_step": 482249, "epoch": 5810} {"train_loss": -26.96693229675293, "global_step": 482250, "epoch": 5810} {"train_loss": -26.949796676635742, "global_step": 482251, "epoch": 5810} {"train_loss": -26.9672908782959, "global_step": 482252, "epoch": 5810} {"train_loss": -26.924163818359375, "global_step": 482253, "epoch": 5810} {"train_loss": -27.02686882019043, "global_step": 482254, "epoch": 5810} {"train_loss": -26.9378604888916, "global_step": 482255, "epoch": 5810} {"train_loss": -26.971689224243164, "global_step": 482256, "epoch": 5810} {"train_loss": -27.182798385620117, "global_step": 482257, "epoch": 5810} {"train_loss": -26.897907257080078, "global_step": 482258, "epoch": 5810} {"train_loss": -27.079076766967773, "global_step": 482259, "epoch": 5810} {"train_loss": -27.105375289916992, "global_step": 482260, "epoch": 5810} {"train_loss": -26.9542179107666, "global_step": 482261, "epoch": 5810} {"train_loss": -27.440397262573242, "global_step": 482262, "epoch": 5810} {"train_loss": -27.213781356811523, "global_step": 482263, "epoch": 5810} {"train_loss": -27.160993576049805, "global_step": 482264, "epoch": 5810} {"train_loss": -27.235055923461914, "global_step": 482265, "epoch": 5810} {"train_loss": -27.378171920776367, "global_step": 482266, "epoch": 5810} {"train_loss": -27.223913192749023, "global_step": 482267, "epoch": 5810} {"train_loss": -27.143447875976562, "global_step": 482268, "epoch": 5810} {"train_loss": -27.314661026000977, "global_step": 482269, "epoch": 5810} {"train_loss": -27.221220016479492, "global_step": 482270, "epoch": 5810} {"train_loss": -27.09067153930664, "global_step": 482271, "epoch": 5810} {"train_loss": -27.043914794921875, "global_step": 482272, "epoch": 5810} {"train_loss": -27.00420570373535, "global_step": 482273, "epoch": 5810} {"train_loss": -27.37095069885254, "global_step": 482274, "epoch": 5810} {"train_loss": -27.740575790405273, "global_step": 482275, "epoch": 5810} {"train_loss": -27.223892211914062, "global_step": 482276, "epoch": 5810} {"train_loss": -26.924890518188477, "global_step": 482277, "epoch": 5810} {"train_loss": -27.020832061767578, "global_step": 482278, "epoch": 5810} {"train_loss": -27.09821891784668, "global_step": 482279, "epoch": 5810} {"train_loss": -26.88338279724121, "global_step": 482280, "epoch": 5810} {"train_loss": -27.488178253173828, "global_step": 482281, "epoch": 5810} {"train_loss": -27.121570587158203, "global_step": 482282, "epoch": 5810} {"train_loss": -27.59220314025879, "global_step": 482283, "epoch": 5810} {"train_loss": -27.4824161529541, "global_step": 482284, "epoch": 5810} {"train_loss": -27.08180809020996, "global_step": 482285, "epoch": 5810} {"train_loss": -27.379247665405273, "global_step": 482286, "epoch": 5810} {"train_loss": -27.320648193359375, "global_step": 482287, "epoch": 5810} {"train_loss": -27.1539249420166, "global_step": 482288, "epoch": 5810} {"train_loss": -27.139236450195312, "global_step": 482289, "epoch": 5810} {"train_loss": -27.184415817260742, "global_step": 482290, "epoch": 5810} {"train_loss": -26.324914932250977, "global_step": 482291, "epoch": 5810} {"train_loss": -26.351591110229492, "global_step": 482292, "epoch": 5810} {"train_loss": -26.27979850769043, "global_step": 482293, "epoch": 5810} {"train_loss": -27.279767990112305, "global_step": 482294, "epoch": 5810} {"train_loss": -27.5909481048584, "global_step": 482295, "epoch": 5810} {"train_loss": -26.8360538482666, "global_step": 482296, "epoch": 5810} {"train_loss": -26.61310386657715, "global_step": 482297, "epoch": 5810} {"train_loss": -27.3448543548584, "global_step": 482298, "epoch": 5810} {"train_loss": -27.185022354125977, "global_step": 482299, "epoch": 5810} {"train_loss": -27.58982276916504, "global_step": 482300, "epoch": 5810} {"train_loss": -26.927576065063477, "global_step": 482301, "epoch": 5810} {"train_loss": -27.412641525268555, "global_step": 482302, "epoch": 5810} {"train_loss": -27.248416900634766, "global_step": 482303, "epoch": 5810} {"train_loss": -27.74234390258789, "global_step": 482304, "epoch": 5810} {"train_loss": -27.456439971923828, "global_step": 482305, "epoch": 5810} {"train_loss": -27.06087303161621, "global_step": 482306, "epoch": 5810} {"train_loss": -27.754507064819336, "global_step": 482307, "epoch": 5810} {"train_loss": -27.002111434936523, "global_step": 482308, "epoch": 5810} {"train_loss": -27.47889518737793, "global_step": 482309, "epoch": 5810} {"train_loss": -27.22755241394043, "global_step": 482310, "epoch": 5810} {"train_loss": -27.317291259765625, "global_step": 482311, "epoch": 5810} {"train_loss": -27.027094369911286, "global_step": 482312, "epoch": 5810, "val_loss": 6595841.0} {"train_loss": -27.15399742126465, "global_step": 482313, "epoch": 5811} {"train_loss": -27.0751953125, "global_step": 482314, "epoch": 5811} {"train_loss": -26.536096572875977, "global_step": 482315, "epoch": 5811} {"train_loss": -27.484411239624023, "global_step": 482316, "epoch": 5811} {"train_loss": -26.76336097717285, "global_step": 482317, "epoch": 5811} {"train_loss": -26.629587173461914, "global_step": 482318, "epoch": 5811} {"train_loss": -26.36427879333496, "global_step": 482319, "epoch": 5811} {"train_loss": -26.171802520751953, "global_step": 482320, "epoch": 5811} {"train_loss": -26.428747177124023, "global_step": 482321, "epoch": 5811} {"train_loss": -27.04204750061035, "global_step": 482322, "epoch": 5811} {"train_loss": -26.753662109375, "global_step": 482323, "epoch": 5811} {"train_loss": -25.618682861328125, "global_step": 482324, "epoch": 5811} {"train_loss": -26.664472579956055, "global_step": 482325, "epoch": 5811} {"train_loss": -26.299421310424805, "global_step": 482326, "epoch": 5811} {"train_loss": -26.405675888061523, "global_step": 482327, "epoch": 5811} {"train_loss": -27.224218368530273, "global_step": 482328, "epoch": 5811} {"train_loss": -26.939746856689453, "global_step": 482329, "epoch": 5811} {"train_loss": -26.693784713745117, "global_step": 482330, "epoch": 5811} {"train_loss": -27.398618698120117, "global_step": 482331, "epoch": 5811} {"train_loss": -26.76352882385254, "global_step": 482332, "epoch": 5811} {"train_loss": -26.845590591430664, "global_step": 482333, "epoch": 5811} {"train_loss": -26.951507568359375, "global_step": 482334, "epoch": 5811} {"train_loss": -26.7384090423584, "global_step": 482335, "epoch": 5811} {"train_loss": -27.016637802124023, "global_step": 482336, "epoch": 5811} {"train_loss": -27.1092586517334, "global_step": 482337, "epoch": 5811} {"train_loss": -27.0985107421875, "global_step": 482338, "epoch": 5811} {"train_loss": -26.91587257385254, "global_step": 482339, "epoch": 5811} {"train_loss": -27.382360458374023, "global_step": 482340, "epoch": 5811} {"train_loss": -27.277790069580078, "global_step": 482341, "epoch": 5811} {"train_loss": -26.990949630737305, "global_step": 482342, "epoch": 5811} {"train_loss": -26.900793075561523, "global_step": 482343, "epoch": 5811} {"train_loss": -27.193822860717773, "global_step": 482344, "epoch": 5811} {"train_loss": -27.310876846313477, "global_step": 482345, "epoch": 5811} {"train_loss": -27.536945343017578, "global_step": 482346, "epoch": 5811} {"train_loss": -27.3284912109375, "global_step": 482347, "epoch": 5811} {"train_loss": -27.020238876342773, "global_step": 482348, "epoch": 5811} {"train_loss": -27.162702560424805, "global_step": 482349, "epoch": 5811} {"train_loss": -27.06298828125, "global_step": 482350, "epoch": 5811} {"train_loss": -27.244993209838867, "global_step": 482351, "epoch": 5811} {"train_loss": -27.354568481445312, "global_step": 482352, "epoch": 5811} {"train_loss": -27.239521026611328, "global_step": 482353, "epoch": 5811} {"train_loss": -27.345355987548828, "global_step": 482354, "epoch": 5811} {"train_loss": -27.38595962524414, "global_step": 482355, "epoch": 5811} {"train_loss": -27.5411376953125, "global_step": 482356, "epoch": 5811} {"train_loss": -27.233535766601562, "global_step": 482357, "epoch": 5811} {"train_loss": -26.96408462524414, "global_step": 482358, "epoch": 5811} {"train_loss": -27.076276779174805, "global_step": 482359, "epoch": 5811} {"train_loss": -27.146167755126953, "global_step": 482360, "epoch": 5811} {"train_loss": -27.3948974609375, "global_step": 482361, "epoch": 5811} {"train_loss": -27.12849235534668, "global_step": 482362, "epoch": 5811} {"train_loss": -27.160558700561523, "global_step": 482363, "epoch": 5811} {"train_loss": -27.082883834838867, "global_step": 482364, "epoch": 5811} {"train_loss": -27.319849014282227, "global_step": 482365, "epoch": 5811} {"train_loss": -27.501867294311523, "global_step": 482366, "epoch": 5811} {"train_loss": -27.27345085144043, "global_step": 482367, "epoch": 5811} {"train_loss": -27.436262130737305, "global_step": 482368, "epoch": 5811} {"train_loss": -27.091657638549805, "global_step": 482369, "epoch": 5811} {"train_loss": -27.156980514526367, "global_step": 482370, "epoch": 5811} {"train_loss": -27.073413848876953, "global_step": 482371, "epoch": 5811} {"train_loss": -26.752979278564453, "global_step": 482372, "epoch": 5811} {"train_loss": -27.07183837890625, "global_step": 482373, "epoch": 5811} {"train_loss": -27.18545913696289, "global_step": 482374, "epoch": 5811} {"train_loss": -27.353437423706055, "global_step": 482375, "epoch": 5811} {"train_loss": -27.397504806518555, "global_step": 482376, "epoch": 5811} {"train_loss": -27.185623168945312, "global_step": 482377, "epoch": 5811} {"train_loss": -27.62063980102539, "global_step": 482378, "epoch": 5811} {"train_loss": -27.725915908813477, "global_step": 482379, "epoch": 5811} {"train_loss": -27.387866973876953, "global_step": 482380, "epoch": 5811} {"train_loss": -27.44367790222168, "global_step": 482381, "epoch": 5811} {"train_loss": -26.999622344970703, "global_step": 482382, "epoch": 5811} {"train_loss": -27.164993286132812, "global_step": 482383, "epoch": 5811} {"train_loss": -27.23956871032715, "global_step": 482384, "epoch": 5811} {"train_loss": -27.377866744995117, "global_step": 482385, "epoch": 5811} {"train_loss": -27.40985107421875, "global_step": 482386, "epoch": 5811} {"train_loss": -26.811965942382812, "global_step": 482387, "epoch": 5811} {"train_loss": -27.316267013549805, "global_step": 482388, "epoch": 5811} {"train_loss": -27.0696964263916, "global_step": 482389, "epoch": 5811} {"train_loss": -27.460498809814453, "global_step": 482390, "epoch": 5811} {"train_loss": -27.582983016967773, "global_step": 482391, "epoch": 5811} {"train_loss": -27.60151481628418, "global_step": 482392, "epoch": 5811} {"train_loss": -27.077362060546875, "global_step": 482393, "epoch": 5811} {"train_loss": -27.059829711914062, "global_step": 482394, "epoch": 5811} {"train_loss": -27.0906609914389, "global_step": 482395, "epoch": 5811, "val_loss": 6680264.5} {"train_loss": -27.267425537109375, "global_step": 482396, "epoch": 5812} {"train_loss": -27.03931999206543, "global_step": 482397, "epoch": 5812} {"train_loss": -26.63311767578125, "global_step": 482398, "epoch": 5812} {"train_loss": -26.940872192382812, "global_step": 482399, "epoch": 5812} {"train_loss": -27.421911239624023, "global_step": 482400, "epoch": 5812} {"train_loss": -26.50433921813965, "global_step": 482401, "epoch": 5812} {"train_loss": -26.945505142211914, "global_step": 482402, "epoch": 5812} {"train_loss": -26.790130615234375, "global_step": 482403, "epoch": 5812} {"train_loss": -27.429956436157227, "global_step": 482404, "epoch": 5812} {"train_loss": -26.988040924072266, "global_step": 482405, "epoch": 5812} {"train_loss": -26.817489624023438, "global_step": 482406, "epoch": 5812} {"train_loss": -26.88014030456543, "global_step": 482407, "epoch": 5812} {"train_loss": -27.37880516052246, "global_step": 482408, "epoch": 5812} {"train_loss": -27.284353256225586, "global_step": 482409, "epoch": 5812} {"train_loss": -27.401418685913086, "global_step": 482410, "epoch": 5812} {"train_loss": -27.228071212768555, "global_step": 482411, "epoch": 5812} {"train_loss": -27.32916259765625, "global_step": 482412, "epoch": 5812} {"train_loss": -27.410511016845703, "global_step": 482413, "epoch": 5812} {"train_loss": -27.112930297851562, "global_step": 482414, "epoch": 5812} {"train_loss": -27.10316276550293, "global_step": 482415, "epoch": 5812} {"train_loss": -26.7348690032959, "global_step": 482416, "epoch": 5812} {"train_loss": -27.390625, "global_step": 482417, "epoch": 5812} {"train_loss": -27.15058708190918, "global_step": 482418, "epoch": 5812} {"train_loss": -27.697052001953125, "global_step": 482419, "epoch": 5812} {"train_loss": -27.419986724853516, "global_step": 482420, "epoch": 5812} {"train_loss": -27.383737564086914, "global_step": 482421, "epoch": 5812} {"train_loss": -27.40252113342285, "global_step": 482422, "epoch": 5812} {"train_loss": -27.483631134033203, "global_step": 482423, "epoch": 5812} {"train_loss": -27.15203857421875, "global_step": 482424, "epoch": 5812} {"train_loss": -27.551502227783203, "global_step": 482425, "epoch": 5812} {"train_loss": -27.50532341003418, "global_step": 482426, "epoch": 5812} {"train_loss": -27.45830726623535, "global_step": 482427, "epoch": 5812} {"train_loss": -27.350055694580078, "global_step": 482428, "epoch": 5812} {"train_loss": -27.580801010131836, "global_step": 482429, "epoch": 5812} {"train_loss": -27.368627548217773, "global_step": 482430, "epoch": 5812} {"train_loss": -27.426715850830078, "global_step": 482431, "epoch": 5812} {"train_loss": -27.6866455078125, "global_step": 482432, "epoch": 5812} {"train_loss": -27.610492706298828, "global_step": 482433, "epoch": 5812} {"train_loss": -27.468503952026367, "global_step": 482434, "epoch": 5812} {"train_loss": -27.644763946533203, "global_step": 482435, "epoch": 5812} {"train_loss": -27.540563583374023, "global_step": 482436, "epoch": 5812} {"train_loss": -27.324243545532227, "global_step": 482437, "epoch": 5812} {"train_loss": -27.975168228149414, "global_step": 482438, "epoch": 5812} {"train_loss": -26.925662994384766, "global_step": 482439, "epoch": 5812} {"train_loss": -27.372913360595703, "global_step": 482440, "epoch": 5812} {"train_loss": -27.5980167388916, "global_step": 482441, "epoch": 5812} {"train_loss": -27.5366268157959, "global_step": 482442, "epoch": 5812} {"train_loss": -27.5181884765625, "global_step": 482443, "epoch": 5812} {"train_loss": -27.0443058013916, "global_step": 482444, "epoch": 5812} {"train_loss": -27.497156143188477, "global_step": 482445, "epoch": 5812} {"train_loss": -27.357776641845703, "global_step": 482446, "epoch": 5812} {"train_loss": -26.937702178955078, "global_step": 482447, "epoch": 5812} {"train_loss": -27.564435958862305, "global_step": 482448, "epoch": 5812} {"train_loss": -27.328161239624023, "global_step": 482449, "epoch": 5812} {"train_loss": -26.877912521362305, "global_step": 482450, "epoch": 5812} {"train_loss": -27.155500411987305, "global_step": 482451, "epoch": 5812} {"train_loss": -27.15931510925293, "global_step": 482452, "epoch": 5812} {"train_loss": -27.725116729736328, "global_step": 482453, "epoch": 5812} {"train_loss": -27.13340187072754, "global_step": 482454, "epoch": 5812} {"train_loss": -27.048389434814453, "global_step": 482455, "epoch": 5812} {"train_loss": -27.362564086914062, "global_step": 482456, "epoch": 5812} {"train_loss": -27.529621124267578, "global_step": 482457, "epoch": 5812} {"train_loss": -27.131336212158203, "global_step": 482458, "epoch": 5812} {"train_loss": -27.112905502319336, "global_step": 482459, "epoch": 5812} {"train_loss": -27.363439559936523, "global_step": 482460, "epoch": 5812} {"train_loss": -27.196460723876953, "global_step": 482461, "epoch": 5812} {"train_loss": -27.554859161376953, "global_step": 482462, "epoch": 5812} {"train_loss": -27.007150650024414, "global_step": 482463, "epoch": 5812} {"train_loss": -26.965490341186523, "global_step": 482464, "epoch": 5812} {"train_loss": -26.880111694335938, "global_step": 482465, "epoch": 5812} {"train_loss": -27.214075088500977, "global_step": 482466, "epoch": 5812} {"train_loss": -27.562658309936523, "global_step": 482467, "epoch": 5812} {"train_loss": -27.186908721923828, "global_step": 482468, "epoch": 5812} {"train_loss": -27.21319007873535, "global_step": 482469, "epoch": 5812} {"train_loss": -26.672672271728516, "global_step": 482470, "epoch": 5812} {"train_loss": -26.88079261779785, "global_step": 482471, "epoch": 5812} {"train_loss": -26.827484130859375, "global_step": 482472, "epoch": 5812} {"train_loss": -27.298547744750977, "global_step": 482473, "epoch": 5812} {"train_loss": -26.587244033813477, "global_step": 482474, "epoch": 5812} {"train_loss": -27.1982364654541, "global_step": 482475, "epoch": 5812} {"train_loss": -27.2332820892334, "global_step": 482476, "epoch": 5812} {"train_loss": -27.285449981689453, "global_step": 482477, "epoch": 5812} {"train_loss": -27.226522974221105, "global_step": 482478, "epoch": 5812, "val_loss": 6692336.5} {"train_loss": -25.590269088745117, "global_step": 482479, "epoch": 5813} {"train_loss": -26.42962074279785, "global_step": 482480, "epoch": 5813} {"train_loss": -26.3442325592041, "global_step": 482481, "epoch": 5813} {"train_loss": -26.335229873657227, "global_step": 482482, "epoch": 5813} {"train_loss": -26.316864013671875, "global_step": 482483, "epoch": 5813} {"train_loss": -26.702518463134766, "global_step": 482484, "epoch": 5813} {"train_loss": -26.5393009185791, "global_step": 482485, "epoch": 5813} {"train_loss": -26.721601486206055, "global_step": 482486, "epoch": 5813} {"train_loss": -27.043365478515625, "global_step": 482487, "epoch": 5813} {"train_loss": -26.10633659362793, "global_step": 482488, "epoch": 5813} {"train_loss": -26.5894718170166, "global_step": 482489, "epoch": 5813} {"train_loss": -26.743345260620117, "global_step": 482490, "epoch": 5813} {"train_loss": -26.918292999267578, "global_step": 482491, "epoch": 5813} {"train_loss": -26.875125885009766, "global_step": 482492, "epoch": 5813} {"train_loss": -26.750513076782227, "global_step": 482493, "epoch": 5813} {"train_loss": -26.78363037109375, "global_step": 482494, "epoch": 5813} {"train_loss": -26.619140625, "global_step": 482495, "epoch": 5813} {"train_loss": -26.6361141204834, "global_step": 482496, "epoch": 5813} {"train_loss": -27.020177841186523, "global_step": 482497, "epoch": 5813} {"train_loss": -27.135574340820312, "global_step": 482498, "epoch": 5813} {"train_loss": -27.03456687927246, "global_step": 482499, "epoch": 5813} {"train_loss": -27.01532554626465, "global_step": 482500, "epoch": 5813} {"train_loss": -27.17775535583496, "global_step": 482501, "epoch": 5813} {"train_loss": -27.048871994018555, "global_step": 482502, "epoch": 5813} {"train_loss": -27.347461700439453, "global_step": 482503, "epoch": 5813} {"train_loss": -27.233510971069336, "global_step": 482504, "epoch": 5813} {"train_loss": -27.584070205688477, "global_step": 482505, "epoch": 5813} {"train_loss": -27.255664825439453, "global_step": 482506, "epoch": 5813} {"train_loss": -27.183643341064453, "global_step": 482507, "epoch": 5813} {"train_loss": -27.347564697265625, "global_step": 482508, "epoch": 5813} {"train_loss": -27.082260131835938, "global_step": 482509, "epoch": 5813} {"train_loss": -27.34528923034668, "global_step": 482510, "epoch": 5813} {"train_loss": -27.520261764526367, "global_step": 482511, "epoch": 5813} {"train_loss": -27.104785919189453, "global_step": 482512, "epoch": 5813} {"train_loss": -26.87824058532715, "global_step": 482513, "epoch": 5813} {"train_loss": -27.427936553955078, "global_step": 482514, "epoch": 5813} {"train_loss": -27.685592651367188, "global_step": 482515, "epoch": 5813} {"train_loss": -27.179962158203125, "global_step": 482516, "epoch": 5813} {"train_loss": -27.474353790283203, "global_step": 482517, "epoch": 5813} {"train_loss": -27.307464599609375, "global_step": 482518, "epoch": 5813} {"train_loss": -27.32611656188965, "global_step": 482519, "epoch": 5813} {"train_loss": -27.27860450744629, "global_step": 482520, "epoch": 5813} {"train_loss": -27.390653610229492, "global_step": 482521, "epoch": 5813} {"train_loss": -27.39944839477539, "global_step": 482522, "epoch": 5813} {"train_loss": -27.280912399291992, "global_step": 482523, "epoch": 5813} {"train_loss": -27.699188232421875, "global_step": 482524, "epoch": 5813} {"train_loss": -27.32486915588379, "global_step": 482525, "epoch": 5813} {"train_loss": -27.927967071533203, "global_step": 482526, "epoch": 5813} {"train_loss": -27.371082305908203, "global_step": 482527, "epoch": 5813} {"train_loss": -27.284687042236328, "global_step": 482528, "epoch": 5813} {"train_loss": -27.111408233642578, "global_step": 482529, "epoch": 5813} {"train_loss": -27.332000732421875, "global_step": 482530, "epoch": 5813} {"train_loss": -27.56166648864746, "global_step": 482531, "epoch": 5813} {"train_loss": -27.765363693237305, "global_step": 482532, "epoch": 5813} {"train_loss": -27.388355255126953, "global_step": 482533, "epoch": 5813} {"train_loss": -27.322553634643555, "global_step": 482534, "epoch": 5813} {"train_loss": -27.42597007751465, "global_step": 482535, "epoch": 5813} {"train_loss": -27.30887794494629, "global_step": 482536, "epoch": 5813} {"train_loss": -27.023733139038086, "global_step": 482537, "epoch": 5813} {"train_loss": -27.667123794555664, "global_step": 482538, "epoch": 5813} {"train_loss": -27.385669708251953, "global_step": 482539, "epoch": 5813} {"train_loss": -27.243244171142578, "global_step": 482540, "epoch": 5813} {"train_loss": -27.6218318939209, "global_step": 482541, "epoch": 5813} {"train_loss": -27.588733673095703, "global_step": 482542, "epoch": 5813} {"train_loss": -27.317493438720703, "global_step": 482543, "epoch": 5813} {"train_loss": -27.152219772338867, "global_step": 482544, "epoch": 5813} {"train_loss": -27.3599853515625, "global_step": 482545, "epoch": 5813} {"train_loss": -27.206836700439453, "global_step": 482546, "epoch": 5813} {"train_loss": -27.523462295532227, "global_step": 482547, "epoch": 5813} {"train_loss": -27.50848388671875, "global_step": 482548, "epoch": 5813} {"train_loss": -27.1824951171875, "global_step": 482549, "epoch": 5813} {"train_loss": -27.2310733795166, "global_step": 482550, "epoch": 5813} {"train_loss": -27.3907413482666, "global_step": 482551, "epoch": 5813} {"train_loss": -27.60914421081543, "global_step": 482552, "epoch": 5813} {"train_loss": -27.492572784423828, "global_step": 482553, "epoch": 5813} {"train_loss": -27.169580459594727, "global_step": 482554, "epoch": 5813} {"train_loss": -26.74665641784668, "global_step": 482555, "epoch": 5813} {"train_loss": -27.112869262695312, "global_step": 482556, "epoch": 5813} {"train_loss": -27.137939453125, "global_step": 482557, "epoch": 5813} {"train_loss": -27.230619430541992, "global_step": 482558, "epoch": 5813} {"train_loss": -26.925695419311523, "global_step": 482559, "epoch": 5813} {"train_loss": -27.142080307006836, "global_step": 482560, "epoch": 5813} {"train_loss": -27.118121526327478, "global_step": 482561, "epoch": 5813, "val_loss": 6685878.0} {"train_loss": -26.449268341064453, "global_step": 482562, "epoch": 5814} {"train_loss": -25.51544189453125, "global_step": 482563, "epoch": 5814} {"train_loss": -25.978256225585938, "global_step": 482564, "epoch": 5814} {"train_loss": -25.382570266723633, "global_step": 482565, "epoch": 5814} {"train_loss": -24.8571834564209, "global_step": 482566, "epoch": 5814} {"train_loss": -26.378137588500977, "global_step": 482567, "epoch": 5814} {"train_loss": -25.881778717041016, "global_step": 482568, "epoch": 5814} {"train_loss": -26.171432495117188, "global_step": 482569, "epoch": 5814} {"train_loss": -26.646875381469727, "global_step": 482570, "epoch": 5814} {"train_loss": -25.93964195251465, "global_step": 482571, "epoch": 5814} {"train_loss": -26.627304077148438, "global_step": 482572, "epoch": 5814} {"train_loss": -25.905364990234375, "global_step": 482573, "epoch": 5814} {"train_loss": -26.956268310546875, "global_step": 482574, "epoch": 5814} {"train_loss": -26.665842056274414, "global_step": 482575, "epoch": 5814} {"train_loss": -26.67072105407715, "global_step": 482576, "epoch": 5814} {"train_loss": -27.01141929626465, "global_step": 482577, "epoch": 5814} {"train_loss": -26.243896484375, "global_step": 482578, "epoch": 5814} {"train_loss": -26.5075626373291, "global_step": 482579, "epoch": 5814} {"train_loss": -26.536596298217773, "global_step": 482580, "epoch": 5814} {"train_loss": -26.37514305114746, "global_step": 482581, "epoch": 5814} {"train_loss": -26.850849151611328, "global_step": 482582, "epoch": 5814} {"train_loss": -26.682056427001953, "global_step": 482583, "epoch": 5814} {"train_loss": -26.703100204467773, "global_step": 482584, "epoch": 5814} {"train_loss": -26.86264419555664, "global_step": 482585, "epoch": 5814} {"train_loss": -27.09539222717285, "global_step": 482586, "epoch": 5814} {"train_loss": -26.883630752563477, "global_step": 482587, "epoch": 5814} {"train_loss": -26.850982666015625, "global_step": 482588, "epoch": 5814} {"train_loss": -27.180917739868164, "global_step": 482589, "epoch": 5814} {"train_loss": -27.0851993560791, "global_step": 482590, "epoch": 5814} {"train_loss": -27.02277946472168, "global_step": 482591, "epoch": 5814} {"train_loss": -27.232091903686523, "global_step": 482592, "epoch": 5814} {"train_loss": -26.892484664916992, "global_step": 482593, "epoch": 5814} {"train_loss": -27.063018798828125, "global_step": 482594, "epoch": 5814} {"train_loss": -27.000463485717773, "global_step": 482595, "epoch": 5814} {"train_loss": -27.56085205078125, "global_step": 482596, "epoch": 5814} {"train_loss": -27.211212158203125, "global_step": 482597, "epoch": 5814} {"train_loss": -27.50409507751465, "global_step": 482598, "epoch": 5814} {"train_loss": -27.200613021850586, "global_step": 482599, "epoch": 5814} {"train_loss": -27.121906280517578, "global_step": 482600, "epoch": 5814} {"train_loss": -27.304931640625, "global_step": 482601, "epoch": 5814} {"train_loss": -26.824377059936523, "global_step": 482602, "epoch": 5814} {"train_loss": -27.46897315979004, "global_step": 482603, "epoch": 5814} {"train_loss": -27.39772605895996, "global_step": 482604, "epoch": 5814} {"train_loss": -27.228246688842773, "global_step": 482605, "epoch": 5814} {"train_loss": -27.421253204345703, "global_step": 482606, "epoch": 5814} {"train_loss": -27.251331329345703, "global_step": 482607, "epoch": 5814} {"train_loss": -27.64875602722168, "global_step": 482608, "epoch": 5814} {"train_loss": -27.372344970703125, "global_step": 482609, "epoch": 5814} {"train_loss": -27.280014038085938, "global_step": 482610, "epoch": 5814} {"train_loss": -27.518997192382812, "global_step": 482611, "epoch": 5814} {"train_loss": -27.849945068359375, "global_step": 482612, "epoch": 5814} {"train_loss": -27.270658493041992, "global_step": 482613, "epoch": 5814} {"train_loss": -27.352508544921875, "global_step": 482614, "epoch": 5814} {"train_loss": -27.00001335144043, "global_step": 482615, "epoch": 5814} {"train_loss": -26.873111724853516, "global_step": 482616, "epoch": 5814} {"train_loss": -27.249677658081055, "global_step": 482617, "epoch": 5814} {"train_loss": -27.20758056640625, "global_step": 482618, "epoch": 5814} {"train_loss": -27.561904907226562, "global_step": 482619, "epoch": 5814} {"train_loss": -27.342618942260742, "global_step": 482620, "epoch": 5814} {"train_loss": -27.130878448486328, "global_step": 482621, "epoch": 5814} {"train_loss": -27.426258087158203, "global_step": 482622, "epoch": 5814} {"train_loss": -27.1331787109375, "global_step": 482623, "epoch": 5814} {"train_loss": -26.886987686157227, "global_step": 482624, "epoch": 5814} {"train_loss": -27.070035934448242, "global_step": 482625, "epoch": 5814} {"train_loss": -27.041372299194336, "global_step": 482626, "epoch": 5814} {"train_loss": -27.442276000976562, "global_step": 482627, "epoch": 5814} {"train_loss": -27.0130672454834, "global_step": 482628, "epoch": 5814} {"train_loss": -27.056562423706055, "global_step": 482629, "epoch": 5814} {"train_loss": -27.105554580688477, "global_step": 482630, "epoch": 5814} {"train_loss": -27.08302116394043, "global_step": 482631, "epoch": 5814} {"train_loss": -27.328262329101562, "global_step": 482632, "epoch": 5814} {"train_loss": -27.180830001831055, "global_step": 482633, "epoch": 5814} {"train_loss": -27.018396377563477, "global_step": 482634, "epoch": 5814} {"train_loss": -27.243925094604492, "global_step": 482635, "epoch": 5814} {"train_loss": -27.307458877563477, "global_step": 482636, "epoch": 5814} {"train_loss": -27.277679443359375, "global_step": 482637, "epoch": 5814} {"train_loss": -27.33408546447754, "global_step": 482638, "epoch": 5814} {"train_loss": -27.067724227905273, "global_step": 482639, "epoch": 5814} {"train_loss": -27.527862548828125, "global_step": 482640, "epoch": 5814} {"train_loss": -27.250732421875, "global_step": 482641, "epoch": 5814} {"train_loss": -27.22059440612793, "global_step": 482642, "epoch": 5814} {"train_loss": -27.257394790649414, "global_step": 482643, "epoch": 5814} {"train_loss": -26.9797145429864, "global_step": 482644, "epoch": 5814, "val_loss": 6640243.5} {"train_loss": -26.94046974182129, "global_step": 482645, "epoch": 5815} {"train_loss": -27.1380672454834, "global_step": 482646, "epoch": 5815} {"train_loss": -27.09514808654785, "global_step": 482647, "epoch": 5815} {"train_loss": -27.166873931884766, "global_step": 482648, "epoch": 5815} {"train_loss": -27.27008056640625, "global_step": 482649, "epoch": 5815} {"train_loss": -26.913745880126953, "global_step": 482650, "epoch": 5815} {"train_loss": -27.17133903503418, "global_step": 482651, "epoch": 5815} {"train_loss": -27.04302406311035, "global_step": 482652, "epoch": 5815} {"train_loss": -27.501678466796875, "global_step": 482653, "epoch": 5815} {"train_loss": -27.296100616455078, "global_step": 482654, "epoch": 5815} {"train_loss": -27.146963119506836, "global_step": 482655, "epoch": 5815} {"train_loss": -27.098865509033203, "global_step": 482656, "epoch": 5815} {"train_loss": -27.139163970947266, "global_step": 482657, "epoch": 5815} {"train_loss": -26.974151611328125, "global_step": 482658, "epoch": 5815} {"train_loss": -27.797657012939453, "global_step": 482659, "epoch": 5815} {"train_loss": -27.50555992126465, "global_step": 482660, "epoch": 5815} {"train_loss": -27.14276123046875, "global_step": 482661, "epoch": 5815} {"train_loss": -27.126296997070312, "global_step": 482662, "epoch": 5815} {"train_loss": -26.99928092956543, "global_step": 482663, "epoch": 5815} {"train_loss": -27.437475204467773, "global_step": 482664, "epoch": 5815} {"train_loss": -27.4571590423584, "global_step": 482665, "epoch": 5815} {"train_loss": -27.309097290039062, "global_step": 482666, "epoch": 5815} {"train_loss": -27.17829704284668, "global_step": 482667, "epoch": 5815} {"train_loss": -27.076780319213867, "global_step": 482668, "epoch": 5815} {"train_loss": -27.4327335357666, "global_step": 482669, "epoch": 5815} {"train_loss": -27.034881591796875, "global_step": 482670, "epoch": 5815} {"train_loss": -27.267812728881836, "global_step": 482671, "epoch": 5815} {"train_loss": -26.92598533630371, "global_step": 482672, "epoch": 5815} {"train_loss": -26.950231552124023, "global_step": 482673, "epoch": 5815} {"train_loss": -26.138601303100586, "global_step": 482674, "epoch": 5815} {"train_loss": -26.58597183227539, "global_step": 482675, "epoch": 5815} {"train_loss": -27.433698654174805, "global_step": 482676, "epoch": 5815} {"train_loss": -26.479475021362305, "global_step": 482677, "epoch": 5815} {"train_loss": -27.007810592651367, "global_step": 482678, "epoch": 5815} {"train_loss": -27.287006378173828, "global_step": 482679, "epoch": 5815} {"train_loss": -26.93427848815918, "global_step": 482680, "epoch": 5815} {"train_loss": -27.293216705322266, "global_step": 482681, "epoch": 5815} {"train_loss": -27.012378692626953, "global_step": 482682, "epoch": 5815} {"train_loss": -27.491321563720703, "global_step": 482683, "epoch": 5815} {"train_loss": -27.146467208862305, "global_step": 482684, "epoch": 5815} {"train_loss": -26.817907333374023, "global_step": 482685, "epoch": 5815} {"train_loss": -27.375762939453125, "global_step": 482686, "epoch": 5815} {"train_loss": -27.428430557250977, "global_step": 482687, "epoch": 5815} {"train_loss": -26.912805557250977, "global_step": 482688, "epoch": 5815} {"train_loss": -27.40863609313965, "global_step": 482689, "epoch": 5815} {"train_loss": -27.319610595703125, "global_step": 482690, "epoch": 5815} {"train_loss": -27.295499801635742, "global_step": 482691, "epoch": 5815} {"train_loss": -27.233612060546875, "global_step": 482692, "epoch": 5815} {"train_loss": -26.869070053100586, "global_step": 482693, "epoch": 5815} {"train_loss": -27.053464889526367, "global_step": 482694, "epoch": 5815} {"train_loss": -27.482513427734375, "global_step": 482695, "epoch": 5815} {"train_loss": -27.37798500061035, "global_step": 482696, "epoch": 5815} {"train_loss": -27.538604736328125, "global_step": 482697, "epoch": 5815} {"train_loss": -27.30032730102539, "global_step": 482698, "epoch": 5815} {"train_loss": -27.429859161376953, "global_step": 482699, "epoch": 5815} {"train_loss": -27.243194580078125, "global_step": 482700, "epoch": 5815} {"train_loss": -27.226285934448242, "global_step": 482701, "epoch": 5815} {"train_loss": -27.39471435546875, "global_step": 482702, "epoch": 5815} {"train_loss": -26.887420654296875, "global_step": 482703, "epoch": 5815} {"train_loss": -27.429584503173828, "global_step": 482704, "epoch": 5815} {"train_loss": -27.73810386657715, "global_step": 482705, "epoch": 5815} {"train_loss": -27.331832885742188, "global_step": 482706, "epoch": 5815} {"train_loss": -27.397741317749023, "global_step": 482707, "epoch": 5815} {"train_loss": -27.406721115112305, "global_step": 482708, "epoch": 5815} {"train_loss": -27.4593448638916, "global_step": 482709, "epoch": 5815} {"train_loss": -27.341955184936523, "global_step": 482710, "epoch": 5815} {"train_loss": -27.15266227722168, "global_step": 482711, "epoch": 5815} {"train_loss": -27.236982345581055, "global_step": 482712, "epoch": 5815} {"train_loss": -26.97781753540039, "global_step": 482713, "epoch": 5815} {"train_loss": -27.050580978393555, "global_step": 482714, "epoch": 5815} {"train_loss": -27.221267700195312, "global_step": 482715, "epoch": 5815} {"train_loss": -27.044525146484375, "global_step": 482716, "epoch": 5815} {"train_loss": -27.59848976135254, "global_step": 482717, "epoch": 5815} {"train_loss": -26.920761108398438, "global_step": 482718, "epoch": 5815} {"train_loss": -27.584375381469727, "global_step": 482719, "epoch": 5815} {"train_loss": -27.630701065063477, "global_step": 482720, "epoch": 5815} {"train_loss": -27.284826278686523, "global_step": 482721, "epoch": 5815} {"train_loss": -27.37835693359375, "global_step": 482722, "epoch": 5815} {"train_loss": -27.659320831298828, "global_step": 482723, "epoch": 5815} {"train_loss": -27.1666259765625, "global_step": 482724, "epoch": 5815} {"train_loss": -27.58697509765625, "global_step": 482725, "epoch": 5815} {"train_loss": -27.23151969909668, "global_step": 482726, "epoch": 5815} {"train_loss": -27.220274798841363, "global_step": 482727, "epoch": 5815, "val_loss": 6713706.0} {"train_loss": -26.850305557250977, "global_step": 482728, "epoch": 5816} {"train_loss": -26.496389389038086, "global_step": 482729, "epoch": 5816} {"train_loss": -26.902212142944336, "global_step": 482730, "epoch": 5816} {"train_loss": -26.714813232421875, "global_step": 482731, "epoch": 5816} {"train_loss": -26.930761337280273, "global_step": 482732, "epoch": 5816} {"train_loss": -26.842992782592773, "global_step": 482733, "epoch": 5816} {"train_loss": -26.8114070892334, "global_step": 482734, "epoch": 5816} {"train_loss": -27.12409019470215, "global_step": 482735, "epoch": 5816} {"train_loss": -27.0170955657959, "global_step": 482736, "epoch": 5816} {"train_loss": -26.699514389038086, "global_step": 482737, "epoch": 5816} {"train_loss": -27.010175704956055, "global_step": 482738, "epoch": 5816} {"train_loss": -27.19440269470215, "global_step": 482739, "epoch": 5816} {"train_loss": -27.396228790283203, "global_step": 482740, "epoch": 5816} {"train_loss": -27.413366317749023, "global_step": 482741, "epoch": 5816} {"train_loss": -26.981475830078125, "global_step": 482742, "epoch": 5816} {"train_loss": -27.3812313079834, "global_step": 482743, "epoch": 5816} {"train_loss": -27.218738555908203, "global_step": 482744, "epoch": 5816} {"train_loss": -27.11725425720215, "global_step": 482745, "epoch": 5816} {"train_loss": -26.8151912689209, "global_step": 482746, "epoch": 5816} {"train_loss": -27.012449264526367, "global_step": 482747, "epoch": 5816} {"train_loss": -27.298925399780273, "global_step": 482748, "epoch": 5816} {"train_loss": -27.167638778686523, "global_step": 482749, "epoch": 5816} {"train_loss": -27.169546127319336, "global_step": 482750, "epoch": 5816} {"train_loss": -27.20916748046875, "global_step": 482751, "epoch": 5816} {"train_loss": -27.324506759643555, "global_step": 482752, "epoch": 5816} {"train_loss": -27.13129234313965, "global_step": 482753, "epoch": 5816} {"train_loss": -27.231443405151367, "global_step": 482754, "epoch": 5816} {"train_loss": -27.011987686157227, "global_step": 482755, "epoch": 5816} {"train_loss": -27.17462730407715, "global_step": 482756, "epoch": 5816} {"train_loss": -27.37189292907715, "global_step": 482757, "epoch": 5816} {"train_loss": -27.464590072631836, "global_step": 482758, "epoch": 5816} {"train_loss": -27.107009887695312, "global_step": 482759, "epoch": 5816} {"train_loss": -27.160764694213867, "global_step": 482760, "epoch": 5816} {"train_loss": -27.4395809173584, "global_step": 482761, "epoch": 5816} {"train_loss": -27.532140731811523, "global_step": 482762, "epoch": 5816} {"train_loss": -27.652490615844727, "global_step": 482763, "epoch": 5816} {"train_loss": -27.416318893432617, "global_step": 482764, "epoch": 5816} {"train_loss": -27.4691219329834, "global_step": 482765, "epoch": 5816} {"train_loss": -27.556995391845703, "global_step": 482766, "epoch": 5816} {"train_loss": -27.47272300720215, "global_step": 482767, "epoch": 5816} {"train_loss": -27.28229331970215, "global_step": 482768, "epoch": 5816} {"train_loss": -27.246091842651367, "global_step": 482769, "epoch": 5816} {"train_loss": -27.522632598876953, "global_step": 482770, "epoch": 5816} {"train_loss": -27.6702880859375, "global_step": 482771, "epoch": 5816} {"train_loss": -27.034719467163086, "global_step": 482772, "epoch": 5816} {"train_loss": -26.791486740112305, "global_step": 482773, "epoch": 5816} {"train_loss": -26.451398849487305, "global_step": 482774, "epoch": 5816} {"train_loss": -26.56406021118164, "global_step": 482775, "epoch": 5816} {"train_loss": -27.354705810546875, "global_step": 482776, "epoch": 5816} {"train_loss": -27.36878776550293, "global_step": 482777, "epoch": 5816} {"train_loss": -26.48115348815918, "global_step": 482778, "epoch": 5816} {"train_loss": -26.4873046875, "global_step": 482779, "epoch": 5816} {"train_loss": -26.3961181640625, "global_step": 482780, "epoch": 5816} {"train_loss": -27.34259605407715, "global_step": 482781, "epoch": 5816} {"train_loss": -26.876373291015625, "global_step": 482782, "epoch": 5816} {"train_loss": -27.285755157470703, "global_step": 482783, "epoch": 5816} {"train_loss": -26.96430778503418, "global_step": 482784, "epoch": 5816} {"train_loss": -27.154836654663086, "global_step": 482785, "epoch": 5816} {"train_loss": -26.915119171142578, "global_step": 482786, "epoch": 5816} {"train_loss": -26.925678253173828, "global_step": 482787, "epoch": 5816} {"train_loss": -27.19186782836914, "global_step": 482788, "epoch": 5816} {"train_loss": -26.876829147338867, "global_step": 482789, "epoch": 5816} {"train_loss": -27.576391220092773, "global_step": 482790, "epoch": 5816} {"train_loss": -26.85499382019043, "global_step": 482791, "epoch": 5816} {"train_loss": -27.46599769592285, "global_step": 482792, "epoch": 5816} {"train_loss": -26.904239654541016, "global_step": 482793, "epoch": 5816} {"train_loss": -27.149978637695312, "global_step": 482794, "epoch": 5816} {"train_loss": -27.316686630249023, "global_step": 482795, "epoch": 5816} {"train_loss": -27.219213485717773, "global_step": 482796, "epoch": 5816} {"train_loss": -26.80262565612793, "global_step": 482797, "epoch": 5816} {"train_loss": -27.271350860595703, "global_step": 482798, "epoch": 5816} {"train_loss": -27.306760787963867, "global_step": 482799, "epoch": 5816} {"train_loss": -27.27699089050293, "global_step": 482800, "epoch": 5816} {"train_loss": -27.127395629882812, "global_step": 482801, "epoch": 5816} {"train_loss": -27.219846725463867, "global_step": 482802, "epoch": 5816} {"train_loss": -27.4231014251709, "global_step": 482803, "epoch": 5816} {"train_loss": -27.269102096557617, "global_step": 482804, "epoch": 5816} {"train_loss": -27.093469619750977, "global_step": 482805, "epoch": 5816} {"train_loss": -26.98517417907715, "global_step": 482806, "epoch": 5816} {"train_loss": -27.6147518157959, "global_step": 482807, "epoch": 5816} {"train_loss": -27.336151123046875, "global_step": 482808, "epoch": 5816} {"train_loss": -27.58136558532715, "global_step": 482809, "epoch": 5816} {"train_loss": -27.14099001597209, "global_step": 482810, "epoch": 5816, "val_loss": 6600043.0} {"train_loss": -26.975622177124023, "global_step": 482811, "epoch": 5817} {"train_loss": -27.16071128845215, "global_step": 482812, "epoch": 5817} {"train_loss": -27.21424674987793, "global_step": 482813, "epoch": 5817} {"train_loss": -27.1168155670166, "global_step": 482814, "epoch": 5817} {"train_loss": -27.015207290649414, "global_step": 482815, "epoch": 5817} {"train_loss": -27.12558937072754, "global_step": 482816, "epoch": 5817} {"train_loss": -27.053699493408203, "global_step": 482817, "epoch": 5817} {"train_loss": -26.848133087158203, "global_step": 482818, "epoch": 5817} {"train_loss": -27.579084396362305, "global_step": 482819, "epoch": 5817} {"train_loss": -27.198108673095703, "global_step": 482820, "epoch": 5817} {"train_loss": -27.609403610229492, "global_step": 482821, "epoch": 5817} {"train_loss": -27.46368408203125, "global_step": 482822, "epoch": 5817} {"train_loss": -27.35212516784668, "global_step": 482823, "epoch": 5817} {"train_loss": -27.12847900390625, "global_step": 482824, "epoch": 5817} {"train_loss": -27.41629981994629, "global_step": 482825, "epoch": 5817} {"train_loss": -27.125696182250977, "global_step": 482826, "epoch": 5817} {"train_loss": -27.64910316467285, "global_step": 482827, "epoch": 5817} {"train_loss": -27.235998153686523, "global_step": 482828, "epoch": 5817} {"train_loss": -27.438568115234375, "global_step": 482829, "epoch": 5817} {"train_loss": -27.21941566467285, "global_step": 482830, "epoch": 5817} {"train_loss": -27.38417625427246, "global_step": 482831, "epoch": 5817} {"train_loss": -27.091632843017578, "global_step": 482832, "epoch": 5817} {"train_loss": -27.317846298217773, "global_step": 482833, "epoch": 5817} {"train_loss": -27.10992431640625, "global_step": 482834, "epoch": 5817} {"train_loss": -27.180484771728516, "global_step": 482835, "epoch": 5817} {"train_loss": -27.213459014892578, "global_step": 482836, "epoch": 5817} {"train_loss": -27.162372589111328, "global_step": 482837, "epoch": 5817} {"train_loss": -26.974231719970703, "global_step": 482838, "epoch": 5817} {"train_loss": -27.278717041015625, "global_step": 482839, "epoch": 5817} {"train_loss": -27.4276123046875, "global_step": 482840, "epoch": 5817} {"train_loss": -27.001195907592773, "global_step": 482841, "epoch": 5817} {"train_loss": -27.199161529541016, "global_step": 482842, "epoch": 5817} {"train_loss": -26.565515518188477, "global_step": 482843, "epoch": 5817} {"train_loss": -27.27105712890625, "global_step": 482844, "epoch": 5817} {"train_loss": -27.1418514251709, "global_step": 482845, "epoch": 5817} {"train_loss": -26.87970542907715, "global_step": 482846, "epoch": 5817} {"train_loss": -26.2969970703125, "global_step": 482847, "epoch": 5817} {"train_loss": -26.919178009033203, "global_step": 482848, "epoch": 5817} {"train_loss": -26.842771530151367, "global_step": 482849, "epoch": 5817} {"train_loss": -26.284849166870117, "global_step": 482850, "epoch": 5817} {"train_loss": -26.623762130737305, "global_step": 482851, "epoch": 5817} {"train_loss": -26.795013427734375, "global_step": 482852, "epoch": 5817} {"train_loss": -26.933629989624023, "global_step": 482853, "epoch": 5817} {"train_loss": -26.74567222595215, "global_step": 482854, "epoch": 5817} {"train_loss": -26.81402587890625, "global_step": 482855, "epoch": 5817} {"train_loss": -26.777790069580078, "global_step": 482856, "epoch": 5817} {"train_loss": -27.483551025390625, "global_step": 482857, "epoch": 5817} {"train_loss": -26.788421630859375, "global_step": 482858, "epoch": 5817} {"train_loss": -27.142993927001953, "global_step": 482859, "epoch": 5817} {"train_loss": -27.07171058654785, "global_step": 482860, "epoch": 5817} {"train_loss": -26.94025230407715, "global_step": 482861, "epoch": 5817} {"train_loss": -27.478418350219727, "global_step": 482862, "epoch": 5817} {"train_loss": -27.070133209228516, "global_step": 482863, "epoch": 5817} {"train_loss": -27.084918975830078, "global_step": 482864, "epoch": 5817} {"train_loss": -27.3089542388916, "global_step": 482865, "epoch": 5817} {"train_loss": -27.409103393554688, "global_step": 482866, "epoch": 5817} {"train_loss": -27.094970703125, "global_step": 482867, "epoch": 5817} {"train_loss": -27.234954833984375, "global_step": 482868, "epoch": 5817} {"train_loss": -26.7841854095459, "global_step": 482869, "epoch": 5817} {"train_loss": -27.018346786499023, "global_step": 482870, "epoch": 5817} {"train_loss": -27.229480743408203, "global_step": 482871, "epoch": 5817} {"train_loss": -27.34029197692871, "global_step": 482872, "epoch": 5817} {"train_loss": -27.255706787109375, "global_step": 482873, "epoch": 5817} {"train_loss": -27.243749618530273, "global_step": 482874, "epoch": 5817} {"train_loss": -26.840429306030273, "global_step": 482875, "epoch": 5817} {"train_loss": -27.41098403930664, "global_step": 482876, "epoch": 5817} {"train_loss": -27.362619400024414, "global_step": 482877, "epoch": 5817} {"train_loss": -27.204675674438477, "global_step": 482878, "epoch": 5817} {"train_loss": -27.434600830078125, "global_step": 482879, "epoch": 5817} {"train_loss": -27.506261825561523, "global_step": 482880, "epoch": 5817} {"train_loss": -27.45662498474121, "global_step": 482881, "epoch": 5817} {"train_loss": -27.381071090698242, "global_step": 482882, "epoch": 5817} {"train_loss": -27.569477081298828, "global_step": 482883, "epoch": 5817} {"train_loss": -27.011749267578125, "global_step": 482884, "epoch": 5817} {"train_loss": -27.396595001220703, "global_step": 482885, "epoch": 5817} {"train_loss": -27.24879264831543, "global_step": 482886, "epoch": 5817} {"train_loss": -27.544178009033203, "global_step": 482887, "epoch": 5817} {"train_loss": -27.90091323852539, "global_step": 482888, "epoch": 5817} {"train_loss": -27.253076553344727, "global_step": 482889, "epoch": 5817} {"train_loss": -27.1392822265625, "global_step": 482890, "epoch": 5817} {"train_loss": -27.066150665283203, "global_step": 482891, "epoch": 5817} {"train_loss": -27.127099990844727, "global_step": 482892, "epoch": 5817} {"train_loss": -27.170296427715254, "global_step": 482893, "epoch": 5817, "val_loss": 6700234.0} {"train_loss": -26.837726593017578, "global_step": 482894, "epoch": 5818} {"train_loss": -27.0396728515625, "global_step": 482895, "epoch": 5818} {"train_loss": -27.006261825561523, "global_step": 482896, "epoch": 5818} {"train_loss": -27.007339477539062, "global_step": 482897, "epoch": 5818} {"train_loss": -26.597681045532227, "global_step": 482898, "epoch": 5818} {"train_loss": -26.558740615844727, "global_step": 482899, "epoch": 5818} {"train_loss": -26.7363224029541, "global_step": 482900, "epoch": 5818} {"train_loss": -26.881879806518555, "global_step": 482901, "epoch": 5818} {"train_loss": -27.06638526916504, "global_step": 482902, "epoch": 5818} {"train_loss": -27.109878540039062, "global_step": 482903, "epoch": 5818} {"train_loss": -27.103397369384766, "global_step": 482904, "epoch": 5818} {"train_loss": -27.048633575439453, "global_step": 482905, "epoch": 5818} {"train_loss": -27.164825439453125, "global_step": 482906, "epoch": 5818} {"train_loss": -27.12135124206543, "global_step": 482907, "epoch": 5818} {"train_loss": -27.10569190979004, "global_step": 482908, "epoch": 5818} {"train_loss": -27.368932723999023, "global_step": 482909, "epoch": 5818} {"train_loss": -27.2594051361084, "global_step": 482910, "epoch": 5818} {"train_loss": -27.542831420898438, "global_step": 482911, "epoch": 5818} {"train_loss": -27.3353328704834, "global_step": 482912, "epoch": 5818} {"train_loss": -27.184921264648438, "global_step": 482913, "epoch": 5818} {"train_loss": -27.00031852722168, "global_step": 482914, "epoch": 5818} {"train_loss": -27.61469841003418, "global_step": 482915, "epoch": 5818} {"train_loss": -27.24200439453125, "global_step": 482916, "epoch": 5818} {"train_loss": -26.9674015045166, "global_step": 482917, "epoch": 5818} {"train_loss": -27.444721221923828, "global_step": 482918, "epoch": 5818} {"train_loss": -27.29486083984375, "global_step": 482919, "epoch": 5818} {"train_loss": -26.70082664489746, "global_step": 482920, "epoch": 5818} {"train_loss": -26.9818172454834, "global_step": 482921, "epoch": 5818} {"train_loss": -27.094114303588867, "global_step": 482922, "epoch": 5818} {"train_loss": -27.208845138549805, "global_step": 482923, "epoch": 5818} {"train_loss": -27.11572265625, "global_step": 482924, "epoch": 5818} {"train_loss": -27.02398109436035, "global_step": 482925, "epoch": 5818} {"train_loss": -27.36551856994629, "global_step": 482926, "epoch": 5818} {"train_loss": -27.355545043945312, "global_step": 482927, "epoch": 5818} {"train_loss": -26.863462448120117, "global_step": 482928, "epoch": 5818} {"train_loss": -27.471105575561523, "global_step": 482929, "epoch": 5818} {"train_loss": -27.341094970703125, "global_step": 482930, "epoch": 5818} {"train_loss": -26.857990264892578, "global_step": 482931, "epoch": 5818} {"train_loss": -27.443145751953125, "global_step": 482932, "epoch": 5818} {"train_loss": -27.190536499023438, "global_step": 482933, "epoch": 5818} {"train_loss": -27.369140625, "global_step": 482934, "epoch": 5818} {"train_loss": -27.395193099975586, "global_step": 482935, "epoch": 5818} {"train_loss": -27.380537033081055, "global_step": 482936, "epoch": 5818} {"train_loss": -27.2563419342041, "global_step": 482937, "epoch": 5818} {"train_loss": -27.270078659057617, "global_step": 482938, "epoch": 5818} {"train_loss": -27.504837036132812, "global_step": 482939, "epoch": 5818} {"train_loss": -27.155105590820312, "global_step": 482940, "epoch": 5818} {"train_loss": -27.31158447265625, "global_step": 482941, "epoch": 5818} {"train_loss": -27.321853637695312, "global_step": 482942, "epoch": 5818} {"train_loss": -26.814807891845703, "global_step": 482943, "epoch": 5818} {"train_loss": -26.056045532226562, "global_step": 482944, "epoch": 5818} {"train_loss": -25.6794490814209, "global_step": 482945, "epoch": 5818} {"train_loss": -26.39638328552246, "global_step": 482946, "epoch": 5818} {"train_loss": -27.21368408203125, "global_step": 482947, "epoch": 5818} {"train_loss": -26.69855308532715, "global_step": 482948, "epoch": 5818} {"train_loss": -26.703113555908203, "global_step": 482949, "epoch": 5818} {"train_loss": -27.13051414489746, "global_step": 482950, "epoch": 5818} {"train_loss": -27.328296661376953, "global_step": 482951, "epoch": 5818} {"train_loss": -26.770465850830078, "global_step": 482952, "epoch": 5818} {"train_loss": -26.8550968170166, "global_step": 482953, "epoch": 5818} {"train_loss": -27.170654296875, "global_step": 482954, "epoch": 5818} {"train_loss": -27.22802734375, "global_step": 482955, "epoch": 5818} {"train_loss": -26.7255802154541, "global_step": 482956, "epoch": 5818} {"train_loss": -27.27254295349121, "global_step": 482957, "epoch": 5818} {"train_loss": -27.089792251586914, "global_step": 482958, "epoch": 5818} {"train_loss": -26.8747615814209, "global_step": 482959, "epoch": 5818} {"train_loss": -26.889738082885742, "global_step": 482960, "epoch": 5818} {"train_loss": -27.11590576171875, "global_step": 482961, "epoch": 5818} {"train_loss": -27.189105987548828, "global_step": 482962, "epoch": 5818} {"train_loss": -27.049835205078125, "global_step": 482963, "epoch": 5818} {"train_loss": -27.143774032592773, "global_step": 482964, "epoch": 5818} {"train_loss": -27.23121452331543, "global_step": 482965, "epoch": 5818} {"train_loss": -27.6152400970459, "global_step": 482966, "epoch": 5818} {"train_loss": -27.302282333374023, "global_step": 482967, "epoch": 5818} {"train_loss": -27.277027130126953, "global_step": 482968, "epoch": 5818} {"train_loss": -27.2954158782959, "global_step": 482969, "epoch": 5818} {"train_loss": -27.23115348815918, "global_step": 482970, "epoch": 5818} {"train_loss": -27.153100967407227, "global_step": 482971, "epoch": 5818} {"train_loss": -27.577213287353516, "global_step": 482972, "epoch": 5818} {"train_loss": -26.979248046875, "global_step": 482973, "epoch": 5818} {"train_loss": -27.0661678314209, "global_step": 482974, "epoch": 5818} {"train_loss": -27.27276039123535, "global_step": 482975, "epoch": 5818} {"train_loss": -27.09818532093462, "global_step": 482976, "epoch": 5818, "val_loss": 6575610.0} {"train_loss": -26.463468551635742, "global_step": 482977, "epoch": 5819} {"train_loss": -26.295303344726562, "global_step": 482978, "epoch": 5819} {"train_loss": -26.472867965698242, "global_step": 482979, "epoch": 5819} {"train_loss": -26.790380477905273, "global_step": 482980, "epoch": 5819} {"train_loss": -26.9223575592041, "global_step": 482981, "epoch": 5819} {"train_loss": -26.681493759155273, "global_step": 482982, "epoch": 5819} {"train_loss": -27.036457061767578, "global_step": 482983, "epoch": 5819} {"train_loss": -27.115787506103516, "global_step": 482984, "epoch": 5819} {"train_loss": -26.862524032592773, "global_step": 482985, "epoch": 5819} {"train_loss": -27.379316329956055, "global_step": 482986, "epoch": 5819} {"train_loss": -27.015661239624023, "global_step": 482987, "epoch": 5819} {"train_loss": -26.906030654907227, "global_step": 482988, "epoch": 5819} {"train_loss": -27.153329849243164, "global_step": 482989, "epoch": 5819} {"train_loss": -27.0726318359375, "global_step": 482990, "epoch": 5819} {"train_loss": -26.5683650970459, "global_step": 482991, "epoch": 5819} {"train_loss": -27.095056533813477, "global_step": 482992, "epoch": 5819} {"train_loss": -26.637739181518555, "global_step": 482993, "epoch": 5819} {"train_loss": -27.279998779296875, "global_step": 482994, "epoch": 5819} {"train_loss": -27.269378662109375, "global_step": 482995, "epoch": 5819} {"train_loss": -27.405731201171875, "global_step": 482996, "epoch": 5819} {"train_loss": -27.391651153564453, "global_step": 482997, "epoch": 5819} {"train_loss": -27.092432022094727, "global_step": 482998, "epoch": 5819} {"train_loss": -27.1816349029541, "global_step": 482999, "epoch": 5819} {"train_loss": -26.89422035217285, "global_step": 483000, "epoch": 5819} {"train_loss": -27.334320068359375, "global_step": 483001, "epoch": 5819} {"train_loss": -27.10849380493164, "global_step": 483002, "epoch": 5819} {"train_loss": -26.90107536315918, "global_step": 483003, "epoch": 5819} {"train_loss": -27.115036010742188, "global_step": 483004, "epoch": 5819} {"train_loss": -27.457721710205078, "global_step": 483005, "epoch": 5819} {"train_loss": -27.30953025817871, "global_step": 483006, "epoch": 5819} {"train_loss": -27.66045570373535, "global_step": 483007, "epoch": 5819} {"train_loss": -27.493865966796875, "global_step": 483008, "epoch": 5819} {"train_loss": -27.637441635131836, "global_step": 483009, "epoch": 5819} {"train_loss": -27.058568954467773, "global_step": 483010, "epoch": 5819} {"train_loss": -27.41330909729004, "global_step": 483011, "epoch": 5819} {"train_loss": -27.28278923034668, "global_step": 483012, "epoch": 5819} {"train_loss": -27.128005981445312, "global_step": 483013, "epoch": 5819} {"train_loss": -27.3206844329834, "global_step": 483014, "epoch": 5819} {"train_loss": -27.490148544311523, "global_step": 483015, "epoch": 5819} {"train_loss": -27.350894927978516, "global_step": 483016, "epoch": 5819} {"train_loss": -27.438705444335938, "global_step": 483017, "epoch": 5819} {"train_loss": -27.52195167541504, "global_step": 483018, "epoch": 5819} {"train_loss": -27.48212242126465, "global_step": 483019, "epoch": 5819} {"train_loss": -27.099658966064453, "global_step": 483020, "epoch": 5819} {"train_loss": -27.45473289489746, "global_step": 483021, "epoch": 5819} {"train_loss": -27.360925674438477, "global_step": 483022, "epoch": 5819} {"train_loss": -27.541677474975586, "global_step": 483023, "epoch": 5819} {"train_loss": -27.73542594909668, "global_step": 483024, "epoch": 5819} {"train_loss": -27.588821411132812, "global_step": 483025, "epoch": 5819} {"train_loss": -27.36492919921875, "global_step": 483026, "epoch": 5819} {"train_loss": -26.89944839477539, "global_step": 483027, "epoch": 5819} {"train_loss": -27.649961471557617, "global_step": 483028, "epoch": 5819} {"train_loss": -27.59535789489746, "global_step": 483029, "epoch": 5819} {"train_loss": -27.454755783081055, "global_step": 483030, "epoch": 5819} {"train_loss": -27.428741455078125, "global_step": 483031, "epoch": 5819} {"train_loss": -27.749914169311523, "global_step": 483032, "epoch": 5819} {"train_loss": -27.515960693359375, "global_step": 483033, "epoch": 5819} {"train_loss": -27.152667999267578, "global_step": 483034, "epoch": 5819} {"train_loss": -27.485004425048828, "global_step": 483035, "epoch": 5819} {"train_loss": -27.394018173217773, "global_step": 483036, "epoch": 5819} {"train_loss": -27.43196678161621, "global_step": 483037, "epoch": 5819} {"train_loss": -27.536346435546875, "global_step": 483038, "epoch": 5819} {"train_loss": -27.3665771484375, "global_step": 483039, "epoch": 5819} {"train_loss": -27.34781837463379, "global_step": 483040, "epoch": 5819} {"train_loss": -27.20318603515625, "global_step": 483041, "epoch": 5819} {"train_loss": -27.256017684936523, "global_step": 483042, "epoch": 5819} {"train_loss": -27.2702693939209, "global_step": 483043, "epoch": 5819} {"train_loss": -27.120447158813477, "global_step": 483044, "epoch": 5819} {"train_loss": -26.84427833557129, "global_step": 483045, "epoch": 5819} {"train_loss": -26.68031120300293, "global_step": 483046, "epoch": 5819} {"train_loss": -26.422561645507812, "global_step": 483047, "epoch": 5819} {"train_loss": -26.551809310913086, "global_step": 483048, "epoch": 5819} {"train_loss": -26.966093063354492, "global_step": 483049, "epoch": 5819} {"train_loss": -26.849584579467773, "global_step": 483050, "epoch": 5819} {"train_loss": -27.12604331970215, "global_step": 483051, "epoch": 5819} {"train_loss": -26.491987228393555, "global_step": 483052, "epoch": 5819} {"train_loss": -26.976667404174805, "global_step": 483053, "epoch": 5819} {"train_loss": -26.988046646118164, "global_step": 483054, "epoch": 5819} {"train_loss": -26.897964477539062, "global_step": 483055, "epoch": 5819} {"train_loss": -27.0274600982666, "global_step": 483056, "epoch": 5819} {"train_loss": -27.27583885192871, "global_step": 483057, "epoch": 5819} {"train_loss": -26.876026153564453, "global_step": 483058, "epoch": 5819} {"train_loss": -27.17856944899961, "global_step": 483059, "epoch": 5819, "val_loss": 6451056.0} {"train_loss": -26.520221710205078, "global_step": 483060, "epoch": 5820} {"train_loss": -26.686798095703125, "global_step": 483061, "epoch": 5820} {"train_loss": -26.309843063354492, "global_step": 483062, "epoch": 5820} {"train_loss": -27.0497989654541, "global_step": 483063, "epoch": 5820} {"train_loss": -26.426156997680664, "global_step": 483064, "epoch": 5820} {"train_loss": -26.815343856811523, "global_step": 483065, "epoch": 5820} {"train_loss": -26.514892578125, "global_step": 483066, "epoch": 5820} {"train_loss": -27.292556762695312, "global_step": 483067, "epoch": 5820} {"train_loss": -26.632232666015625, "global_step": 483068, "epoch": 5820} {"train_loss": -26.723615646362305, "global_step": 483069, "epoch": 5820} {"train_loss": -26.916168212890625, "global_step": 483070, "epoch": 5820} {"train_loss": -27.07966423034668, "global_step": 483071, "epoch": 5820} {"train_loss": -27.289411544799805, "global_step": 483072, "epoch": 5820} {"train_loss": -26.97444725036621, "global_step": 483073, "epoch": 5820} {"train_loss": -26.899927139282227, "global_step": 483074, "epoch": 5820} {"train_loss": -26.902307510375977, "global_step": 483075, "epoch": 5820} {"train_loss": -27.023218154907227, "global_step": 483076, "epoch": 5820} {"train_loss": -26.9739990234375, "global_step": 483077, "epoch": 5820} {"train_loss": -27.174240112304688, "global_step": 483078, "epoch": 5820} {"train_loss": -27.13014793395996, "global_step": 483079, "epoch": 5820} {"train_loss": -27.049713134765625, "global_step": 483080, "epoch": 5820} {"train_loss": -27.090871810913086, "global_step": 483081, "epoch": 5820} {"train_loss": -27.211322784423828, "global_step": 483082, "epoch": 5820} {"train_loss": -27.10169792175293, "global_step": 483083, "epoch": 5820} {"train_loss": -27.076459884643555, "global_step": 483084, "epoch": 5820} {"train_loss": -27.13852310180664, "global_step": 483085, "epoch": 5820} {"train_loss": -27.24603271484375, "global_step": 483086, "epoch": 5820} {"train_loss": -27.286331176757812, "global_step": 483087, "epoch": 5820} {"train_loss": -27.063251495361328, "global_step": 483088, "epoch": 5820} {"train_loss": -27.083820343017578, "global_step": 483089, "epoch": 5820} {"train_loss": -27.302106857299805, "global_step": 483090, "epoch": 5820} {"train_loss": -27.390094757080078, "global_step": 483091, "epoch": 5820} {"train_loss": -27.458728790283203, "global_step": 483092, "epoch": 5820} {"train_loss": -27.613422393798828, "global_step": 483093, "epoch": 5820} {"train_loss": -27.67549705505371, "global_step": 483094, "epoch": 5820} {"train_loss": -27.266088485717773, "global_step": 483095, "epoch": 5820} {"train_loss": -27.464048385620117, "global_step": 483096, "epoch": 5820} {"train_loss": -27.570281982421875, "global_step": 483097, "epoch": 5820} {"train_loss": -27.609479904174805, "global_step": 483098, "epoch": 5820} {"train_loss": -27.863025665283203, "global_step": 483099, "epoch": 5820} {"train_loss": -27.42331886291504, "global_step": 483100, "epoch": 5820} {"train_loss": -27.4622745513916, "global_step": 483101, "epoch": 5820} {"train_loss": -27.515777587890625, "global_step": 483102, "epoch": 5820} {"train_loss": -27.34522819519043, "global_step": 483103, "epoch": 5820} {"train_loss": -27.72369956970215, "global_step": 483104, "epoch": 5820} {"train_loss": -27.4461669921875, "global_step": 483105, "epoch": 5820} {"train_loss": -27.788808822631836, "global_step": 483106, "epoch": 5820} {"train_loss": -27.365570068359375, "global_step": 483107, "epoch": 5820} {"train_loss": -27.614294052124023, "global_step": 483108, "epoch": 5820} {"train_loss": -27.15297508239746, "global_step": 483109, "epoch": 5820} {"train_loss": -27.212324142456055, "global_step": 483110, "epoch": 5820} {"train_loss": -27.062009811401367, "global_step": 483111, "epoch": 5820} {"train_loss": -27.186023712158203, "global_step": 483112, "epoch": 5820} {"train_loss": -26.685409545898438, "global_step": 483113, "epoch": 5820} {"train_loss": -26.9000301361084, "global_step": 483114, "epoch": 5820} {"train_loss": -27.008045196533203, "global_step": 483115, "epoch": 5820} {"train_loss": -27.1175594329834, "global_step": 483116, "epoch": 5820} {"train_loss": -26.747608184814453, "global_step": 483117, "epoch": 5820} {"train_loss": -26.521650314331055, "global_step": 483118, "epoch": 5820} {"train_loss": -26.818267822265625, "global_step": 483119, "epoch": 5820} {"train_loss": -27.203433990478516, "global_step": 483120, "epoch": 5820} {"train_loss": -26.748615264892578, "global_step": 483121, "epoch": 5820} {"train_loss": -26.51645278930664, "global_step": 483122, "epoch": 5820} {"train_loss": -27.3324031829834, "global_step": 483123, "epoch": 5820} {"train_loss": -27.115514755249023, "global_step": 483124, "epoch": 5820} {"train_loss": -26.84006118774414, "global_step": 483125, "epoch": 5820} {"train_loss": -27.18776512145996, "global_step": 483126, "epoch": 5820} {"train_loss": -27.0789737701416, "global_step": 483127, "epoch": 5820} {"train_loss": -27.126718521118164, "global_step": 483128, "epoch": 5820} {"train_loss": -26.775684356689453, "global_step": 483129, "epoch": 5820} {"train_loss": -27.149078369140625, "global_step": 483130, "epoch": 5820} {"train_loss": -27.20011329650879, "global_step": 483131, "epoch": 5820} {"train_loss": -27.33930778503418, "global_step": 483132, "epoch": 5820} {"train_loss": -27.16864585876465, "global_step": 483133, "epoch": 5820} {"train_loss": -27.012479782104492, "global_step": 483134, "epoch": 5820} {"train_loss": -27.16682243347168, "global_step": 483135, "epoch": 5820} {"train_loss": -27.29884910583496, "global_step": 483136, "epoch": 5820} {"train_loss": -27.365283966064453, "global_step": 483137, "epoch": 5820} {"train_loss": -27.239017486572266, "global_step": 483138, "epoch": 5820} {"train_loss": -27.103086471557617, "global_step": 483139, "epoch": 5820} {"train_loss": -27.25852394104004, "global_step": 483140, "epoch": 5820} {"train_loss": -27.03116798400879, "global_step": 483141, "epoch": 5820} {"train_loss": -27.12631623141737, "global_step": 483142, "epoch": 5820, "val_loss": 6592824.0} {"train_loss": -24.807266235351562, "global_step": 483143, "epoch": 5821} {"train_loss": -25.02830696105957, "global_step": 483144, "epoch": 5821} {"train_loss": -25.907461166381836, "global_step": 483145, "epoch": 5821} {"train_loss": -26.425128936767578, "global_step": 483146, "epoch": 5821} {"train_loss": -25.475976943969727, "global_step": 483147, "epoch": 5821} {"train_loss": -26.364526748657227, "global_step": 483148, "epoch": 5821} {"train_loss": -25.998334884643555, "global_step": 483149, "epoch": 5821} {"train_loss": -26.8258113861084, "global_step": 483150, "epoch": 5821} {"train_loss": -26.22279167175293, "global_step": 483151, "epoch": 5821} {"train_loss": -26.558883666992188, "global_step": 483152, "epoch": 5821} {"train_loss": -26.516422271728516, "global_step": 483153, "epoch": 5821} {"train_loss": -26.6785945892334, "global_step": 483154, "epoch": 5821} {"train_loss": -26.76513671875, "global_step": 483155, "epoch": 5821} {"train_loss": -26.783832550048828, "global_step": 483156, "epoch": 5821} {"train_loss": -26.699304580688477, "global_step": 483157, "epoch": 5821} {"train_loss": -26.60918617248535, "global_step": 483158, "epoch": 5821} {"train_loss": -26.39558982849121, "global_step": 483159, "epoch": 5821} {"train_loss": -27.1878719329834, "global_step": 483160, "epoch": 5821} {"train_loss": -26.526504516601562, "global_step": 483161, "epoch": 5821} {"train_loss": -26.997695922851562, "global_step": 483162, "epoch": 5821} {"train_loss": -27.061811447143555, "global_step": 483163, "epoch": 5821} {"train_loss": -27.034513473510742, "global_step": 483164, "epoch": 5821} {"train_loss": -27.043243408203125, "global_step": 483165, "epoch": 5821} {"train_loss": -26.914743423461914, "global_step": 483166, "epoch": 5821} {"train_loss": -27.01666259765625, "global_step": 483167, "epoch": 5821} {"train_loss": -27.18282127380371, "global_step": 483168, "epoch": 5821} {"train_loss": -26.950281143188477, "global_step": 483169, "epoch": 5821} {"train_loss": -26.93536949157715, "global_step": 483170, "epoch": 5821} {"train_loss": -27.0302734375, "global_step": 483171, "epoch": 5821} {"train_loss": -26.976749420166016, "global_step": 483172, "epoch": 5821} {"train_loss": -26.952268600463867, "global_step": 483173, "epoch": 5821} {"train_loss": -26.818923950195312, "global_step": 483174, "epoch": 5821} {"train_loss": -27.098356246948242, "global_step": 483175, "epoch": 5821} {"train_loss": -26.898523330688477, "global_step": 483176, "epoch": 5821} {"train_loss": -27.12543296813965, "global_step": 483177, "epoch": 5821} {"train_loss": -27.021472930908203, "global_step": 483178, "epoch": 5821} {"train_loss": -27.038818359375, "global_step": 483179, "epoch": 5821} {"train_loss": -27.44012451171875, "global_step": 483180, "epoch": 5821} {"train_loss": -27.181188583374023, "global_step": 483181, "epoch": 5821} {"train_loss": -27.35554313659668, "global_step": 483182, "epoch": 5821} {"train_loss": -27.113306045532227, "global_step": 483183, "epoch": 5821} {"train_loss": -26.794879913330078, "global_step": 483184, "epoch": 5821} {"train_loss": -27.577184677124023, "global_step": 483185, "epoch": 5821} {"train_loss": -27.458967208862305, "global_step": 483186, "epoch": 5821} {"train_loss": -27.31477165222168, "global_step": 483187, "epoch": 5821} {"train_loss": -27.393890380859375, "global_step": 483188, "epoch": 5821} {"train_loss": -27.55655860900879, "global_step": 483189, "epoch": 5821} {"train_loss": -27.0758056640625, "global_step": 483190, "epoch": 5821} {"train_loss": -27.416675567626953, "global_step": 483191, "epoch": 5821} {"train_loss": -27.19513511657715, "global_step": 483192, "epoch": 5821} {"train_loss": -27.581104278564453, "global_step": 483193, "epoch": 5821} {"train_loss": -27.227787017822266, "global_step": 483194, "epoch": 5821} {"train_loss": -26.97352409362793, "global_step": 483195, "epoch": 5821} {"train_loss": -27.55824089050293, "global_step": 483196, "epoch": 5821} {"train_loss": -27.402490615844727, "global_step": 483197, "epoch": 5821} {"train_loss": -27.598529815673828, "global_step": 483198, "epoch": 5821} {"train_loss": -27.338287353515625, "global_step": 483199, "epoch": 5821} {"train_loss": -27.52994728088379, "global_step": 483200, "epoch": 5821} {"train_loss": -27.12753677368164, "global_step": 483201, "epoch": 5821} {"train_loss": -27.419034957885742, "global_step": 483202, "epoch": 5821} {"train_loss": -27.5030460357666, "global_step": 483203, "epoch": 5821} {"train_loss": -27.35030174255371, "global_step": 483204, "epoch": 5821} {"train_loss": -27.141637802124023, "global_step": 483205, "epoch": 5821} {"train_loss": -27.429859161376953, "global_step": 483206, "epoch": 5821} {"train_loss": -27.173303604125977, "global_step": 483207, "epoch": 5821} {"train_loss": -27.526357650756836, "global_step": 483208, "epoch": 5821} {"train_loss": -27.244556427001953, "global_step": 483209, "epoch": 5821} {"train_loss": -27.326038360595703, "global_step": 483210, "epoch": 5821} {"train_loss": -27.101123809814453, "global_step": 483211, "epoch": 5821} {"train_loss": -27.57387351989746, "global_step": 483212, "epoch": 5821} {"train_loss": -27.647083282470703, "global_step": 483213, "epoch": 5821} {"train_loss": -26.973485946655273, "global_step": 483214, "epoch": 5821} {"train_loss": -26.93495750427246, "global_step": 483215, "epoch": 5821} {"train_loss": -26.677963256835938, "global_step": 483216, "epoch": 5821} {"train_loss": -27.37404441833496, "global_step": 483217, "epoch": 5821} {"train_loss": -27.253305435180664, "global_step": 483218, "epoch": 5821} {"train_loss": -26.103092193603516, "global_step": 483219, "epoch": 5821} {"train_loss": -26.202795028686523, "global_step": 483220, "epoch": 5821} {"train_loss": -27.293302536010742, "global_step": 483221, "epoch": 5821} {"train_loss": -27.095300674438477, "global_step": 483222, "epoch": 5821} {"train_loss": -25.937179565429688, "global_step": 483223, "epoch": 5821} {"train_loss": -27.3802547454834, "global_step": 483224, "epoch": 5821} {"train_loss": -26.946483887821795, "global_step": 483225, "epoch": 5821, "val_loss": 6582176.0} {"train_loss": -25.692249298095703, "global_step": 483226, "epoch": 5822} {"train_loss": -25.59282112121582, "global_step": 483227, "epoch": 5822} {"train_loss": -25.602558135986328, "global_step": 483228, "epoch": 5822} {"train_loss": -26.116485595703125, "global_step": 483229, "epoch": 5822} {"train_loss": -25.919279098510742, "global_step": 483230, "epoch": 5822} {"train_loss": -26.12359619140625, "global_step": 483231, "epoch": 5822} {"train_loss": -25.902942657470703, "global_step": 483232, "epoch": 5822} {"train_loss": -26.33283042907715, "global_step": 483233, "epoch": 5822} {"train_loss": -26.4009952545166, "global_step": 483234, "epoch": 5822} {"train_loss": -26.515960693359375, "global_step": 483235, "epoch": 5822} {"train_loss": -25.952356338500977, "global_step": 483236, "epoch": 5822} {"train_loss": -26.35382080078125, "global_step": 483237, "epoch": 5822} {"train_loss": -26.527997970581055, "global_step": 483238, "epoch": 5822} {"train_loss": -26.433923721313477, "global_step": 483239, "epoch": 5822} {"train_loss": -25.967987060546875, "global_step": 483240, "epoch": 5822} {"train_loss": -26.32404899597168, "global_step": 483241, "epoch": 5822} {"train_loss": -26.089704513549805, "global_step": 483242, "epoch": 5822} {"train_loss": -26.452070236206055, "global_step": 483243, "epoch": 5822} {"train_loss": -26.814807891845703, "global_step": 483244, "epoch": 5822} {"train_loss": -26.35638999938965, "global_step": 483245, "epoch": 5822} {"train_loss": -27.008808135986328, "global_step": 483246, "epoch": 5822} {"train_loss": -26.5279598236084, "global_step": 483247, "epoch": 5822} {"train_loss": -26.9542179107666, "global_step": 483248, "epoch": 5822} {"train_loss": -26.661212921142578, "global_step": 483249, "epoch": 5822} {"train_loss": -26.725814819335938, "global_step": 483250, "epoch": 5822} {"train_loss": -27.042898178100586, "global_step": 483251, "epoch": 5822} {"train_loss": -26.941822052001953, "global_step": 483252, "epoch": 5822} {"train_loss": -26.484180450439453, "global_step": 483253, "epoch": 5822} {"train_loss": -26.964609146118164, "global_step": 483254, "epoch": 5822} {"train_loss": -26.748926162719727, "global_step": 483255, "epoch": 5822} {"train_loss": -27.135955810546875, "global_step": 483256, "epoch": 5822} {"train_loss": -26.6905574798584, "global_step": 483257, "epoch": 5822} {"train_loss": -27.241931915283203, "global_step": 483258, "epoch": 5822} {"train_loss": -27.378326416015625, "global_step": 483259, "epoch": 5822} {"train_loss": -26.798673629760742, "global_step": 483260, "epoch": 5822} {"train_loss": -26.822769165039062, "global_step": 483261, "epoch": 5822} {"train_loss": -27.02522087097168, "global_step": 483262, "epoch": 5822} {"train_loss": -26.95672035217285, "global_step": 483263, "epoch": 5822} {"train_loss": -27.371625900268555, "global_step": 483264, "epoch": 5822} {"train_loss": -27.238122940063477, "global_step": 483265, "epoch": 5822} {"train_loss": -27.125165939331055, "global_step": 483266, "epoch": 5822} {"train_loss": -27.260522842407227, "global_step": 483267, "epoch": 5822} {"train_loss": -27.50309181213379, "global_step": 483268, "epoch": 5822} {"train_loss": -27.099218368530273, "global_step": 483269, "epoch": 5822} {"train_loss": -27.29296875, "global_step": 483270, "epoch": 5822} {"train_loss": -27.42310905456543, "global_step": 483271, "epoch": 5822} {"train_loss": -27.22544288635254, "global_step": 483272, "epoch": 5822} {"train_loss": -27.61478042602539, "global_step": 483273, "epoch": 5822} {"train_loss": -27.208845138549805, "global_step": 483274, "epoch": 5822} {"train_loss": -27.273237228393555, "global_step": 483275, "epoch": 5822} {"train_loss": -27.1959171295166, "global_step": 483276, "epoch": 5822} {"train_loss": -26.982013702392578, "global_step": 483277, "epoch": 5822} {"train_loss": -27.315038681030273, "global_step": 483278, "epoch": 5822} {"train_loss": -26.881763458251953, "global_step": 483279, "epoch": 5822} {"train_loss": -27.2818546295166, "global_step": 483280, "epoch": 5822} {"train_loss": -27.253881454467773, "global_step": 483281, "epoch": 5822} {"train_loss": -27.620206832885742, "global_step": 483282, "epoch": 5822} {"train_loss": -27.354522705078125, "global_step": 483283, "epoch": 5822} {"train_loss": -27.703657150268555, "global_step": 483284, "epoch": 5822} {"train_loss": -27.574621200561523, "global_step": 483285, "epoch": 5822} {"train_loss": -27.412673950195312, "global_step": 483286, "epoch": 5822} {"train_loss": -27.43208122253418, "global_step": 483287, "epoch": 5822} {"train_loss": -27.315149307250977, "global_step": 483288, "epoch": 5822} {"train_loss": -26.638174057006836, "global_step": 483289, "epoch": 5822} {"train_loss": -27.643814086914062, "global_step": 483290, "epoch": 5822} {"train_loss": -27.286029815673828, "global_step": 483291, "epoch": 5822} {"train_loss": -27.66994285583496, "global_step": 483292, "epoch": 5822} {"train_loss": -27.646869659423828, "global_step": 483293, "epoch": 5822} {"train_loss": -27.28761100769043, "global_step": 483294, "epoch": 5822} {"train_loss": -27.391889572143555, "global_step": 483295, "epoch": 5822} {"train_loss": -27.501401901245117, "global_step": 483296, "epoch": 5822} {"train_loss": -27.328596115112305, "global_step": 483297, "epoch": 5822} {"train_loss": -27.1776065826416, "global_step": 483298, "epoch": 5822} {"train_loss": -27.839929580688477, "global_step": 483299, "epoch": 5822} {"train_loss": -27.42976188659668, "global_step": 483300, "epoch": 5822} {"train_loss": -27.37430191040039, "global_step": 483301, "epoch": 5822} {"train_loss": -27.45022964477539, "global_step": 483302, "epoch": 5822} {"train_loss": -27.193302154541016, "global_step": 483303, "epoch": 5822} {"train_loss": -27.48583984375, "global_step": 483304, "epoch": 5822} {"train_loss": -27.402185440063477, "global_step": 483305, "epoch": 5822} {"train_loss": -27.64117431640625, "global_step": 483306, "epoch": 5822} {"train_loss": -26.920673370361328, "global_step": 483307, "epoch": 5822} {"train_loss": -26.964511917298097, "global_step": 483308, "epoch": 5822, "val_loss": 6636820.0} {"train_loss": -27.018512725830078, "global_step": 483309, "epoch": 5823} {"train_loss": -26.815643310546875, "global_step": 483310, "epoch": 5823} {"train_loss": -26.753192901611328, "global_step": 483311, "epoch": 5823} {"train_loss": -27.275821685791016, "global_step": 483312, "epoch": 5823} {"train_loss": -26.500585556030273, "global_step": 483313, "epoch": 5823} {"train_loss": -26.323705673217773, "global_step": 483314, "epoch": 5823} {"train_loss": -26.47968101501465, "global_step": 483315, "epoch": 5823} {"train_loss": -26.499542236328125, "global_step": 483316, "epoch": 5823} {"train_loss": -26.802480697631836, "global_step": 483317, "epoch": 5823} {"train_loss": -26.650821685791016, "global_step": 483318, "epoch": 5823} {"train_loss": -26.980426788330078, "global_step": 483319, "epoch": 5823} {"train_loss": -26.9224910736084, "global_step": 483320, "epoch": 5823} {"train_loss": -27.118249893188477, "global_step": 483321, "epoch": 5823} {"train_loss": -26.924270629882812, "global_step": 483322, "epoch": 5823} {"train_loss": -27.06463623046875, "global_step": 483323, "epoch": 5823} {"train_loss": -26.591617584228516, "global_step": 483324, "epoch": 5823} {"train_loss": -26.80695915222168, "global_step": 483325, "epoch": 5823} {"train_loss": -26.876514434814453, "global_step": 483326, "epoch": 5823} {"train_loss": -26.69198989868164, "global_step": 483327, "epoch": 5823} {"train_loss": -26.664886474609375, "global_step": 483328, "epoch": 5823} {"train_loss": -26.692611694335938, "global_step": 483329, "epoch": 5823} {"train_loss": -27.245325088500977, "global_step": 483330, "epoch": 5823} {"train_loss": -27.245044708251953, "global_step": 483331, "epoch": 5823} {"train_loss": -26.93289566040039, "global_step": 483332, "epoch": 5823} {"train_loss": -26.922399520874023, "global_step": 483333, "epoch": 5823} {"train_loss": -27.074365615844727, "global_step": 483334, "epoch": 5823} {"train_loss": -27.300954818725586, "global_step": 483335, "epoch": 5823} {"train_loss": -27.393970489501953, "global_step": 483336, "epoch": 5823} {"train_loss": -27.100507736206055, "global_step": 483337, "epoch": 5823} {"train_loss": -27.104841232299805, "global_step": 483338, "epoch": 5823} {"train_loss": -27.005294799804688, "global_step": 483339, "epoch": 5823} {"train_loss": -27.5317325592041, "global_step": 483340, "epoch": 5823} {"train_loss": -26.8413143157959, "global_step": 483341, "epoch": 5823} {"train_loss": -27.595975875854492, "global_step": 483342, "epoch": 5823} {"train_loss": -27.152912139892578, "global_step": 483343, "epoch": 5823} {"train_loss": -27.5345401763916, "global_step": 483344, "epoch": 5823} {"train_loss": -27.3934326171875, "global_step": 483345, "epoch": 5823} {"train_loss": -27.132080078125, "global_step": 483346, "epoch": 5823} {"train_loss": -27.061100006103516, "global_step": 483347, "epoch": 5823} {"train_loss": -27.59247398376465, "global_step": 483348, "epoch": 5823} {"train_loss": -27.453033447265625, "global_step": 483349, "epoch": 5823} {"train_loss": -27.319005966186523, "global_step": 483350, "epoch": 5823} {"train_loss": -27.035852432250977, "global_step": 483351, "epoch": 5823} {"train_loss": -27.6572208404541, "global_step": 483352, "epoch": 5823} {"train_loss": -27.726806640625, "global_step": 483353, "epoch": 5823} {"train_loss": -27.8597354888916, "global_step": 483354, "epoch": 5823} {"train_loss": -27.468576431274414, "global_step": 483355, "epoch": 5823} {"train_loss": -27.382080078125, "global_step": 483356, "epoch": 5823} {"train_loss": -27.61286735534668, "global_step": 483357, "epoch": 5823} {"train_loss": -27.7685546875, "global_step": 483358, "epoch": 5823} {"train_loss": -27.50628089904785, "global_step": 483359, "epoch": 5823} {"train_loss": -27.30875587463379, "global_step": 483360, "epoch": 5823} {"train_loss": -27.5390682220459, "global_step": 483361, "epoch": 5823} {"train_loss": -27.223377227783203, "global_step": 483362, "epoch": 5823} {"train_loss": -27.53627586364746, "global_step": 483363, "epoch": 5823} {"train_loss": -27.400339126586914, "global_step": 483364, "epoch": 5823} {"train_loss": -27.50009536743164, "global_step": 483365, "epoch": 5823} {"train_loss": -27.880481719970703, "global_step": 483366, "epoch": 5823} {"train_loss": -27.51373291015625, "global_step": 483367, "epoch": 5823} {"train_loss": -26.76799964904785, "global_step": 483368, "epoch": 5823} {"train_loss": -25.954193115234375, "global_step": 483369, "epoch": 5823} {"train_loss": -27.241214752197266, "global_step": 483370, "epoch": 5823} {"train_loss": -26.81538200378418, "global_step": 483371, "epoch": 5823} {"train_loss": -27.14991569519043, "global_step": 483372, "epoch": 5823} {"train_loss": -27.04599380493164, "global_step": 483373, "epoch": 5823} {"train_loss": -26.832809448242188, "global_step": 483374, "epoch": 5823} {"train_loss": -26.999494552612305, "global_step": 483375, "epoch": 5823} {"train_loss": -26.987812042236328, "global_step": 483376, "epoch": 5823} {"train_loss": -27.148944854736328, "global_step": 483377, "epoch": 5823} {"train_loss": -26.951416015625, "global_step": 483378, "epoch": 5823} {"train_loss": -27.225482940673828, "global_step": 483379, "epoch": 5823} {"train_loss": -27.180585861206055, "global_step": 483380, "epoch": 5823} {"train_loss": -26.724624633789062, "global_step": 483381, "epoch": 5823} {"train_loss": -26.354711532592773, "global_step": 483382, "epoch": 5823} {"train_loss": -26.052099227905273, "global_step": 483383, "epoch": 5823} {"train_loss": -26.490209579467773, "global_step": 483384, "epoch": 5823} {"train_loss": -26.88091468811035, "global_step": 483385, "epoch": 5823} {"train_loss": -27.326385498046875, "global_step": 483386, "epoch": 5823} {"train_loss": -26.952463150024414, "global_step": 483387, "epoch": 5823} {"train_loss": -26.807409286499023, "global_step": 483388, "epoch": 5823} {"train_loss": -26.949377059936523, "global_step": 483389, "epoch": 5823} {"train_loss": -26.898962020874023, "global_step": 483390, "epoch": 5823} {"train_loss": -27.08969095528844, "global_step": 483391, "epoch": 5823, "val_loss": 6576773.0} {"train_loss": -27.20597267150879, "global_step": 483392, "epoch": 5824} {"train_loss": -27.05219078063965, "global_step": 483393, "epoch": 5824} {"train_loss": -26.68039894104004, "global_step": 483394, "epoch": 5824} {"train_loss": -26.743579864501953, "global_step": 483395, "epoch": 5824} {"train_loss": -27.01239585876465, "global_step": 483396, "epoch": 5824} {"train_loss": -27.139184951782227, "global_step": 483397, "epoch": 5824} {"train_loss": -26.9248046875, "global_step": 483398, "epoch": 5824} {"train_loss": -27.24994468688965, "global_step": 483399, "epoch": 5824} {"train_loss": -27.268728256225586, "global_step": 483400, "epoch": 5824} {"train_loss": -27.015668869018555, "global_step": 483401, "epoch": 5824} {"train_loss": -27.127965927124023, "global_step": 483402, "epoch": 5824} {"train_loss": -26.829193115234375, "global_step": 483403, "epoch": 5824} {"train_loss": -26.82834243774414, "global_step": 483404, "epoch": 5824} {"train_loss": -26.946369171142578, "global_step": 483405, "epoch": 5824} {"train_loss": -26.9124813079834, "global_step": 483406, "epoch": 5824} {"train_loss": -27.508569717407227, "global_step": 483407, "epoch": 5824} {"train_loss": -27.17889976501465, "global_step": 483408, "epoch": 5824} {"train_loss": -26.8529052734375, "global_step": 483409, "epoch": 5824} {"train_loss": -27.399198532104492, "global_step": 483410, "epoch": 5824} {"train_loss": -26.938344955444336, "global_step": 483411, "epoch": 5824} {"train_loss": -27.072778701782227, "global_step": 483412, "epoch": 5824} {"train_loss": -27.148208618164062, "global_step": 483413, "epoch": 5824} {"train_loss": -27.23516273498535, "global_step": 483414, "epoch": 5824} {"train_loss": -27.38467788696289, "global_step": 483415, "epoch": 5824} {"train_loss": -27.2174072265625, "global_step": 483416, "epoch": 5824} {"train_loss": -27.321134567260742, "global_step": 483417, "epoch": 5824} {"train_loss": -27.477569580078125, "global_step": 483418, "epoch": 5824} {"train_loss": -27.356616973876953, "global_step": 483419, "epoch": 5824} {"train_loss": -27.317480087280273, "global_step": 483420, "epoch": 5824} {"train_loss": -27.445592880249023, "global_step": 483421, "epoch": 5824} {"train_loss": -27.18483543395996, "global_step": 483422, "epoch": 5824} {"train_loss": -27.201034545898438, "global_step": 483423, "epoch": 5824} {"train_loss": -27.264759063720703, "global_step": 483424, "epoch": 5824} {"train_loss": -27.372304916381836, "global_step": 483425, "epoch": 5824} {"train_loss": -26.995182037353516, "global_step": 483426, "epoch": 5824} {"train_loss": -27.79120445251465, "global_step": 483427, "epoch": 5824} {"train_loss": -27.32391929626465, "global_step": 483428, "epoch": 5824} {"train_loss": -27.353422164916992, "global_step": 483429, "epoch": 5824} {"train_loss": -27.636621475219727, "global_step": 483430, "epoch": 5824} {"train_loss": -27.505224227905273, "global_step": 483431, "epoch": 5824} {"train_loss": -27.18060302734375, "global_step": 483432, "epoch": 5824} {"train_loss": -27.3272647857666, "global_step": 483433, "epoch": 5824} {"train_loss": -27.367273330688477, "global_step": 483434, "epoch": 5824} {"train_loss": -27.46498680114746, "global_step": 483435, "epoch": 5824} {"train_loss": -27.558490753173828, "global_step": 483436, "epoch": 5824} {"train_loss": -27.398529052734375, "global_step": 483437, "epoch": 5824} {"train_loss": -27.2342586517334, "global_step": 483438, "epoch": 5824} {"train_loss": -27.759679794311523, "global_step": 483439, "epoch": 5824} {"train_loss": -27.161865234375, "global_step": 483440, "epoch": 5824} {"train_loss": -27.20069694519043, "global_step": 483441, "epoch": 5824} {"train_loss": -27.34063720703125, "global_step": 483442, "epoch": 5824} {"train_loss": -27.500946044921875, "global_step": 483443, "epoch": 5824} {"train_loss": -27.822097778320312, "global_step": 483444, "epoch": 5824} {"train_loss": -27.30364418029785, "global_step": 483445, "epoch": 5824} {"train_loss": -27.283248901367188, "global_step": 483446, "epoch": 5824} {"train_loss": -27.6051082611084, "global_step": 483447, "epoch": 5824} {"train_loss": -27.209060668945312, "global_step": 483448, "epoch": 5824} {"train_loss": -27.112085342407227, "global_step": 483449, "epoch": 5824} {"train_loss": -27.17838478088379, "global_step": 483450, "epoch": 5824} {"train_loss": -27.3686466217041, "global_step": 483451, "epoch": 5824} {"train_loss": -27.470001220703125, "global_step": 483452, "epoch": 5824} {"train_loss": -27.18015480041504, "global_step": 483453, "epoch": 5824} {"train_loss": -27.417478561401367, "global_step": 483454, "epoch": 5824} {"train_loss": -27.165449142456055, "global_step": 483455, "epoch": 5824} {"train_loss": -27.2066593170166, "global_step": 483456, "epoch": 5824} {"train_loss": -27.195199966430664, "global_step": 483457, "epoch": 5824} {"train_loss": -27.732763290405273, "global_step": 483458, "epoch": 5824} {"train_loss": -27.285221099853516, "global_step": 483459, "epoch": 5824} {"train_loss": -27.83554458618164, "global_step": 483460, "epoch": 5824} {"train_loss": -27.57918357849121, "global_step": 483461, "epoch": 5824} {"train_loss": -27.2376708984375, "global_step": 483462, "epoch": 5824} {"train_loss": -27.332914352416992, "global_step": 483463, "epoch": 5824} {"train_loss": -27.40627098083496, "global_step": 483464, "epoch": 5824} {"train_loss": -27.082462310791016, "global_step": 483465, "epoch": 5824} {"train_loss": -27.423608779907227, "global_step": 483466, "epoch": 5824} {"train_loss": -27.471694946289062, "global_step": 483467, "epoch": 5824} {"train_loss": -27.257848739624023, "global_step": 483468, "epoch": 5824} {"train_loss": -27.178503036499023, "global_step": 483469, "epoch": 5824} {"train_loss": -26.70374870300293, "global_step": 483470, "epoch": 5824} {"train_loss": -26.848358154296875, "global_step": 483471, "epoch": 5824} {"train_loss": -27.091602325439453, "global_step": 483472, "epoch": 5824} {"train_loss": -27.754058837890625, "global_step": 483473, "epoch": 5824} {"train_loss": -27.266268167151026, "global_step": 483474, "epoch": 5824, "val_loss": 6563960.0} {"train_loss": -25.26669692993164, "global_step": 483475, "epoch": 5825} {"train_loss": -24.492704391479492, "global_step": 483476, "epoch": 5825} {"train_loss": -26.833057403564453, "global_step": 483477, "epoch": 5825} {"train_loss": -26.373998641967773, "global_step": 483478, "epoch": 5825} {"train_loss": -25.622833251953125, "global_step": 483479, "epoch": 5825} {"train_loss": -26.111059188842773, "global_step": 483480, "epoch": 5825} {"train_loss": -26.047616958618164, "global_step": 483481, "epoch": 5825} {"train_loss": -26.6826114654541, "global_step": 483482, "epoch": 5825} {"train_loss": -26.298498153686523, "global_step": 483483, "epoch": 5825} {"train_loss": -27.083423614501953, "global_step": 483484, "epoch": 5825} {"train_loss": -26.626001358032227, "global_step": 483485, "epoch": 5825} {"train_loss": -26.90829849243164, "global_step": 483486, "epoch": 5825} {"train_loss": -27.06316566467285, "global_step": 483487, "epoch": 5825} {"train_loss": -26.577978134155273, "global_step": 483488, "epoch": 5825} {"train_loss": -26.62299156188965, "global_step": 483489, "epoch": 5825} {"train_loss": -26.85895347595215, "global_step": 483490, "epoch": 5825} {"train_loss": -27.150115966796875, "global_step": 483491, "epoch": 5825} {"train_loss": -26.986265182495117, "global_step": 483492, "epoch": 5825} {"train_loss": -26.766956329345703, "global_step": 483493, "epoch": 5825} {"train_loss": -27.083959579467773, "global_step": 483494, "epoch": 5825} {"train_loss": -26.896392822265625, "global_step": 483495, "epoch": 5825} {"train_loss": -26.81947898864746, "global_step": 483496, "epoch": 5825} {"train_loss": -26.7425537109375, "global_step": 483497, "epoch": 5825} {"train_loss": -26.9617862701416, "global_step": 483498, "epoch": 5825} {"train_loss": -27.15513038635254, "global_step": 483499, "epoch": 5825} {"train_loss": -26.93379020690918, "global_step": 483500, "epoch": 5825} {"train_loss": -27.161787033081055, "global_step": 483501, "epoch": 5825} {"train_loss": -27.13679313659668, "global_step": 483502, "epoch": 5825} {"train_loss": -27.092605590820312, "global_step": 483503, "epoch": 5825} {"train_loss": -27.399829864501953, "global_step": 483504, "epoch": 5825} {"train_loss": -27.281036376953125, "global_step": 483505, "epoch": 5825} {"train_loss": -26.983991622924805, "global_step": 483506, "epoch": 5825} {"train_loss": -27.035978317260742, "global_step": 483507, "epoch": 5825} {"train_loss": -26.991683959960938, "global_step": 483508, "epoch": 5825} {"train_loss": -27.181196212768555, "global_step": 483509, "epoch": 5825} {"train_loss": -27.016468048095703, "global_step": 483510, "epoch": 5825} {"train_loss": -27.481292724609375, "global_step": 483511, "epoch": 5825} {"train_loss": -27.418933868408203, "global_step": 483512, "epoch": 5825} {"train_loss": -27.564411163330078, "global_step": 483513, "epoch": 5825} {"train_loss": -27.315027236938477, "global_step": 483514, "epoch": 5825} {"train_loss": -27.34686279296875, "global_step": 483515, "epoch": 5825} {"train_loss": -27.071674346923828, "global_step": 483516, "epoch": 5825} {"train_loss": -26.431798934936523, "global_step": 483517, "epoch": 5825} {"train_loss": -27.142642974853516, "global_step": 483518, "epoch": 5825} {"train_loss": -27.564594268798828, "global_step": 483519, "epoch": 5825} {"train_loss": -27.345685958862305, "global_step": 483520, "epoch": 5825} {"train_loss": -27.608001708984375, "global_step": 483521, "epoch": 5825} {"train_loss": -27.157983779907227, "global_step": 483522, "epoch": 5825} {"train_loss": -27.293176651000977, "global_step": 483523, "epoch": 5825} {"train_loss": -27.473127365112305, "global_step": 483524, "epoch": 5825} {"train_loss": -27.30478858947754, "global_step": 483525, "epoch": 5825} {"train_loss": -27.47674560546875, "global_step": 483526, "epoch": 5825} {"train_loss": -26.93910026550293, "global_step": 483527, "epoch": 5825} {"train_loss": -27.1793155670166, "global_step": 483528, "epoch": 5825} {"train_loss": -27.296314239501953, "global_step": 483529, "epoch": 5825} {"train_loss": -27.343658447265625, "global_step": 483530, "epoch": 5825} {"train_loss": -27.077360153198242, "global_step": 483531, "epoch": 5825} {"train_loss": -26.839136123657227, "global_step": 483532, "epoch": 5825} {"train_loss": -27.165739059448242, "global_step": 483533, "epoch": 5825} {"train_loss": -27.384140014648438, "global_step": 483534, "epoch": 5825} {"train_loss": -27.3891658782959, "global_step": 483535, "epoch": 5825} {"train_loss": -27.001195907592773, "global_step": 483536, "epoch": 5825} {"train_loss": -26.968481063842773, "global_step": 483537, "epoch": 5825} {"train_loss": -27.240222930908203, "global_step": 483538, "epoch": 5825} {"train_loss": -27.7612247467041, "global_step": 483539, "epoch": 5825} {"train_loss": -27.682159423828125, "global_step": 483540, "epoch": 5825} {"train_loss": -27.58075523376465, "global_step": 483541, "epoch": 5825} {"train_loss": -27.32763671875, "global_step": 483542, "epoch": 5825} {"train_loss": -27.423376083374023, "global_step": 483543, "epoch": 5825} {"train_loss": -27.1324462890625, "global_step": 483544, "epoch": 5825} {"train_loss": -26.9713134765625, "global_step": 483545, "epoch": 5825} {"train_loss": -27.310733795166016, "global_step": 483546, "epoch": 5825} {"train_loss": -27.364795684814453, "global_step": 483547, "epoch": 5825} {"train_loss": -27.05889892578125, "global_step": 483548, "epoch": 5825} {"train_loss": -26.92603874206543, "global_step": 483549, "epoch": 5825} {"train_loss": -27.194711685180664, "global_step": 483550, "epoch": 5825} {"train_loss": -27.117206573486328, "global_step": 483551, "epoch": 5825} {"train_loss": -27.575143814086914, "global_step": 483552, "epoch": 5825} {"train_loss": -27.259496688842773, "global_step": 483553, "epoch": 5825} {"train_loss": -26.417388916015625, "global_step": 483554, "epoch": 5825} {"train_loss": -26.853784561157227, "global_step": 483555, "epoch": 5825} {"train_loss": -27.237812042236328, "global_step": 483556, "epoch": 5825} {"train_loss": -27.019577026367188, "global_step": 483557, "epoch": 5825, "val_loss": 6596917.0} {"train_loss": -26.64446449279785, "global_step": 483558, "epoch": 5826} {"train_loss": -26.824018478393555, "global_step": 483559, "epoch": 5826} {"train_loss": -26.082319259643555, "global_step": 483560, "epoch": 5826} {"train_loss": -26.8688907623291, "global_step": 483561, "epoch": 5826} {"train_loss": -26.571142196655273, "global_step": 483562, "epoch": 5826} {"train_loss": -26.595661163330078, "global_step": 483563, "epoch": 5826} {"train_loss": -26.632848739624023, "global_step": 483564, "epoch": 5826} {"train_loss": -26.497785568237305, "global_step": 483565, "epoch": 5826} {"train_loss": -26.977975845336914, "global_step": 483566, "epoch": 5826} {"train_loss": -26.39972496032715, "global_step": 483567, "epoch": 5826} {"train_loss": -27.00654411315918, "global_step": 483568, "epoch": 5826} {"train_loss": -26.787418365478516, "global_step": 483569, "epoch": 5826} {"train_loss": -26.721479415893555, "global_step": 483570, "epoch": 5826} {"train_loss": -26.77808952331543, "global_step": 483571, "epoch": 5826} {"train_loss": -26.790374755859375, "global_step": 483572, "epoch": 5826} {"train_loss": -26.9681453704834, "global_step": 483573, "epoch": 5826} {"train_loss": -26.75284194946289, "global_step": 483574, "epoch": 5826} {"train_loss": -27.35279655456543, "global_step": 483575, "epoch": 5826} {"train_loss": -26.837553024291992, "global_step": 483576, "epoch": 5826} {"train_loss": -26.871265411376953, "global_step": 483577, "epoch": 5826} {"train_loss": -27.1163272857666, "global_step": 483578, "epoch": 5826} {"train_loss": -27.156024932861328, "global_step": 483579, "epoch": 5826} {"train_loss": -26.94368553161621, "global_step": 483580, "epoch": 5826} {"train_loss": -27.197675704956055, "global_step": 483581, "epoch": 5826} {"train_loss": -27.19940757751465, "global_step": 483582, "epoch": 5826} {"train_loss": -27.26643943786621, "global_step": 483583, "epoch": 5826} {"train_loss": -27.010587692260742, "global_step": 483584, "epoch": 5826} {"train_loss": -26.92279052734375, "global_step": 483585, "epoch": 5826} {"train_loss": -27.115270614624023, "global_step": 483586, "epoch": 5826} {"train_loss": -27.46844482421875, "global_step": 483587, "epoch": 5826} {"train_loss": -27.35927391052246, "global_step": 483588, "epoch": 5826} {"train_loss": -27.251855850219727, "global_step": 483589, "epoch": 5826} {"train_loss": -27.27579689025879, "global_step": 483590, "epoch": 5826} {"train_loss": -27.176733016967773, "global_step": 483591, "epoch": 5826} {"train_loss": -27.420654296875, "global_step": 483592, "epoch": 5826} {"train_loss": -27.299421310424805, "global_step": 483593, "epoch": 5826} {"train_loss": -27.564350128173828, "global_step": 483594, "epoch": 5826} {"train_loss": -27.73784828186035, "global_step": 483595, "epoch": 5826} {"train_loss": -27.956140518188477, "global_step": 483596, "epoch": 5826} {"train_loss": -27.433691024780273, "global_step": 483597, "epoch": 5826} {"train_loss": -27.490583419799805, "global_step": 483598, "epoch": 5826} {"train_loss": -27.404693603515625, "global_step": 483599, "epoch": 5826} {"train_loss": -27.129413604736328, "global_step": 483600, "epoch": 5826} {"train_loss": -27.59735679626465, "global_step": 483601, "epoch": 5826} {"train_loss": -27.528095245361328, "global_step": 483602, "epoch": 5826} {"train_loss": -27.450393676757812, "global_step": 483603, "epoch": 5826} {"train_loss": -27.778844833374023, "global_step": 483604, "epoch": 5826} {"train_loss": -27.773483276367188, "global_step": 483605, "epoch": 5826} {"train_loss": -27.168594360351562, "global_step": 483606, "epoch": 5826} {"train_loss": -27.314746856689453, "global_step": 483607, "epoch": 5826} {"train_loss": -27.15818214416504, "global_step": 483608, "epoch": 5826} {"train_loss": -27.493200302124023, "global_step": 483609, "epoch": 5826} {"train_loss": -27.280487060546875, "global_step": 483610, "epoch": 5826} {"train_loss": -27.14630126953125, "global_step": 483611, "epoch": 5826} {"train_loss": -27.520294189453125, "global_step": 483612, "epoch": 5826} {"train_loss": -27.2886905670166, "global_step": 483613, "epoch": 5826} {"train_loss": -26.96241569519043, "global_step": 483614, "epoch": 5826} {"train_loss": -26.49945640563965, "global_step": 483615, "epoch": 5826} {"train_loss": -26.97818374633789, "global_step": 483616, "epoch": 5826} {"train_loss": -27.645612716674805, "global_step": 483617, "epoch": 5826} {"train_loss": -27.11899757385254, "global_step": 483618, "epoch": 5826} {"train_loss": -26.661191940307617, "global_step": 483619, "epoch": 5826} {"train_loss": -26.41480827331543, "global_step": 483620, "epoch": 5826} {"train_loss": -27.182470321655273, "global_step": 483621, "epoch": 5826} {"train_loss": -27.552600860595703, "global_step": 483622, "epoch": 5826} {"train_loss": -27.1520938873291, "global_step": 483623, "epoch": 5826} {"train_loss": -27.27685546875, "global_step": 483624, "epoch": 5826} {"train_loss": -27.473215103149414, "global_step": 483625, "epoch": 5826} {"train_loss": -27.127622604370117, "global_step": 483626, "epoch": 5826} {"train_loss": -27.022491455078125, "global_step": 483627, "epoch": 5826} {"train_loss": -27.255767822265625, "global_step": 483628, "epoch": 5826} {"train_loss": -26.965795516967773, "global_step": 483629, "epoch": 5826} {"train_loss": -26.9091739654541, "global_step": 483630, "epoch": 5826} {"train_loss": -27.281116485595703, "global_step": 483631, "epoch": 5826} {"train_loss": -27.111867904663086, "global_step": 483632, "epoch": 5826} {"train_loss": -27.307037353515625, "global_step": 483633, "epoch": 5826} {"train_loss": -27.041004180908203, "global_step": 483634, "epoch": 5826} {"train_loss": -27.313587188720703, "global_step": 483635, "epoch": 5826} {"train_loss": -27.405908584594727, "global_step": 483636, "epoch": 5826} {"train_loss": -27.17494010925293, "global_step": 483637, "epoch": 5826} {"train_loss": -27.17178726196289, "global_step": 483638, "epoch": 5826} {"train_loss": -27.045551300048828, "global_step": 483639, "epoch": 5826} {"train_loss": -27.12731085627912, "global_step": 483640, "epoch": 5826, "val_loss": 6493476.5} {"train_loss": -27.119436264038086, "global_step": 483641, "epoch": 5827} {"train_loss": -26.7136287689209, "global_step": 483642, "epoch": 5827} {"train_loss": -27.090442657470703, "global_step": 483643, "epoch": 5827} {"train_loss": -26.872995376586914, "global_step": 483644, "epoch": 5827} {"train_loss": -26.597335815429688, "global_step": 483645, "epoch": 5827} {"train_loss": -26.87127113342285, "global_step": 483646, "epoch": 5827} {"train_loss": -27.031885147094727, "global_step": 483647, "epoch": 5827} {"train_loss": -26.972503662109375, "global_step": 483648, "epoch": 5827} {"train_loss": -27.063140869140625, "global_step": 483649, "epoch": 5827} {"train_loss": -26.654815673828125, "global_step": 483650, "epoch": 5827} {"train_loss": -27.452545166015625, "global_step": 483651, "epoch": 5827} {"train_loss": -27.185705184936523, "global_step": 483652, "epoch": 5827} {"train_loss": -27.032957077026367, "global_step": 483653, "epoch": 5827} {"train_loss": -27.193281173706055, "global_step": 483654, "epoch": 5827} {"train_loss": -27.1619815826416, "global_step": 483655, "epoch": 5827} {"train_loss": -27.528295516967773, "global_step": 483656, "epoch": 5827} {"train_loss": -27.204999923706055, "global_step": 483657, "epoch": 5827} {"train_loss": -27.14272117614746, "global_step": 483658, "epoch": 5827} {"train_loss": -27.104644775390625, "global_step": 483659, "epoch": 5827} {"train_loss": -27.274377822875977, "global_step": 483660, "epoch": 5827} {"train_loss": -26.99136734008789, "global_step": 483661, "epoch": 5827} {"train_loss": -27.185232162475586, "global_step": 483662, "epoch": 5827} {"train_loss": -27.400165557861328, "global_step": 483663, "epoch": 5827} {"train_loss": -27.305896759033203, "global_step": 483664, "epoch": 5827} {"train_loss": -27.286102294921875, "global_step": 483665, "epoch": 5827} {"train_loss": -27.67572021484375, "global_step": 483666, "epoch": 5827} {"train_loss": -27.84010124206543, "global_step": 483667, "epoch": 5827} {"train_loss": -26.864133834838867, "global_step": 483668, "epoch": 5827} {"train_loss": -27.330331802368164, "global_step": 483669, "epoch": 5827} {"train_loss": -27.47554588317871, "global_step": 483670, "epoch": 5827} {"train_loss": -27.3453311920166, "global_step": 483671, "epoch": 5827} {"train_loss": -27.461902618408203, "global_step": 483672, "epoch": 5827} {"train_loss": -27.59693717956543, "global_step": 483673, "epoch": 5827} {"train_loss": -27.773056030273438, "global_step": 483674, "epoch": 5827} {"train_loss": -27.354658126831055, "global_step": 483675, "epoch": 5827} {"train_loss": -27.165058135986328, "global_step": 483676, "epoch": 5827} {"train_loss": -27.20232582092285, "global_step": 483677, "epoch": 5827} {"train_loss": -27.345624923706055, "global_step": 483678, "epoch": 5827} {"train_loss": -27.280309677124023, "global_step": 483679, "epoch": 5827} {"train_loss": -27.752073287963867, "global_step": 483680, "epoch": 5827} {"train_loss": -27.498334884643555, "global_step": 483681, "epoch": 5827} {"train_loss": -27.51291847229004, "global_step": 483682, "epoch": 5827} {"train_loss": -27.517927169799805, "global_step": 483683, "epoch": 5827} {"train_loss": -27.163990020751953, "global_step": 483684, "epoch": 5827} {"train_loss": -27.805334091186523, "global_step": 483685, "epoch": 5827} {"train_loss": -27.390106201171875, "global_step": 483686, "epoch": 5827} {"train_loss": -27.402069091796875, "global_step": 483687, "epoch": 5827} {"train_loss": -27.53925895690918, "global_step": 483688, "epoch": 5827} {"train_loss": -27.122150421142578, "global_step": 483689, "epoch": 5827} {"train_loss": -27.581298828125, "global_step": 483690, "epoch": 5827} {"train_loss": -27.028043746948242, "global_step": 483691, "epoch": 5827} {"train_loss": -27.15272331237793, "global_step": 483692, "epoch": 5827} {"train_loss": -27.01899528503418, "global_step": 483693, "epoch": 5827} {"train_loss": -27.04412269592285, "global_step": 483694, "epoch": 5827} {"train_loss": -27.20197105407715, "global_step": 483695, "epoch": 5827} {"train_loss": -27.061267852783203, "global_step": 483696, "epoch": 5827} {"train_loss": -27.529510498046875, "global_step": 483697, "epoch": 5827} {"train_loss": -27.217761993408203, "global_step": 483698, "epoch": 5827} {"train_loss": -27.7335262298584, "global_step": 483699, "epoch": 5827} {"train_loss": -27.17122459411621, "global_step": 483700, "epoch": 5827} {"train_loss": -27.627832412719727, "global_step": 483701, "epoch": 5827} {"train_loss": -27.38983726501465, "global_step": 483702, "epoch": 5827} {"train_loss": -27.835302352905273, "global_step": 483703, "epoch": 5827} {"train_loss": -27.68584632873535, "global_step": 483704, "epoch": 5827} {"train_loss": -27.29670524597168, "global_step": 483705, "epoch": 5827} {"train_loss": -26.950286865234375, "global_step": 483706, "epoch": 5827} {"train_loss": -27.886260986328125, "global_step": 483707, "epoch": 5827} {"train_loss": -27.262723922729492, "global_step": 483708, "epoch": 5827} {"train_loss": -27.396228790283203, "global_step": 483709, "epoch": 5827} {"train_loss": -27.363189697265625, "global_step": 483710, "epoch": 5827} {"train_loss": -27.49220848083496, "global_step": 483711, "epoch": 5827} {"train_loss": -27.168066024780273, "global_step": 483712, "epoch": 5827} {"train_loss": -26.966480255126953, "global_step": 483713, "epoch": 5827} {"train_loss": -26.64802360534668, "global_step": 483714, "epoch": 5827} {"train_loss": -27.19556999206543, "global_step": 483715, "epoch": 5827} {"train_loss": -26.805801391601562, "global_step": 483716, "epoch": 5827} {"train_loss": -26.412839889526367, "global_step": 483717, "epoch": 5827} {"train_loss": -25.731657028198242, "global_step": 483718, "epoch": 5827} {"train_loss": -27.233366012573242, "global_step": 483719, "epoch": 5827} {"train_loss": -27.033737182617188, "global_step": 483720, "epoch": 5827} {"train_loss": -26.504627227783203, "global_step": 483721, "epoch": 5827} {"train_loss": -27.330575942993164, "global_step": 483722, "epoch": 5827} {"train_loss": -27.23008626914886, "global_step": 483723, "epoch": 5827, "val_loss": 6515003.0} {"train_loss": -27.015625, "global_step": 483724, "epoch": 5828} {"train_loss": -26.309600830078125, "global_step": 483725, "epoch": 5828} {"train_loss": -26.399564743041992, "global_step": 483726, "epoch": 5828} {"train_loss": -26.7734317779541, "global_step": 483727, "epoch": 5828} {"train_loss": -26.649627685546875, "global_step": 483728, "epoch": 5828} {"train_loss": -26.8822021484375, "global_step": 483729, "epoch": 5828} {"train_loss": -26.405920028686523, "global_step": 483730, "epoch": 5828} {"train_loss": -26.637754440307617, "global_step": 483731, "epoch": 5828} {"train_loss": -26.308225631713867, "global_step": 483732, "epoch": 5828} {"train_loss": -26.4696102142334, "global_step": 483733, "epoch": 5828} {"train_loss": -26.536361694335938, "global_step": 483734, "epoch": 5828} {"train_loss": -26.37982177734375, "global_step": 483735, "epoch": 5828} {"train_loss": -26.974111557006836, "global_step": 483736, "epoch": 5828} {"train_loss": -26.877439498901367, "global_step": 483737, "epoch": 5828} {"train_loss": -26.989927291870117, "global_step": 483738, "epoch": 5828} {"train_loss": -26.556127548217773, "global_step": 483739, "epoch": 5828} {"train_loss": -26.7767333984375, "global_step": 483740, "epoch": 5828} {"train_loss": -27.048370361328125, "global_step": 483741, "epoch": 5828} {"train_loss": -26.60161781311035, "global_step": 483742, "epoch": 5828} {"train_loss": -27.100418090820312, "global_step": 483743, "epoch": 5828} {"train_loss": -26.838428497314453, "global_step": 483744, "epoch": 5828} {"train_loss": -26.9316349029541, "global_step": 483745, "epoch": 5828} {"train_loss": -27.108922958374023, "global_step": 483746, "epoch": 5828} {"train_loss": -26.968036651611328, "global_step": 483747, "epoch": 5828} {"train_loss": -26.977834701538086, "global_step": 483748, "epoch": 5828} {"train_loss": -26.824115753173828, "global_step": 483749, "epoch": 5828} {"train_loss": -27.18134880065918, "global_step": 483750, "epoch": 5828} {"train_loss": -27.520709991455078, "global_step": 483751, "epoch": 5828} {"train_loss": -27.357091903686523, "global_step": 483752, "epoch": 5828} {"train_loss": -26.938873291015625, "global_step": 483753, "epoch": 5828} {"train_loss": -27.147138595581055, "global_step": 483754, "epoch": 5828} {"train_loss": -27.466842651367188, "global_step": 483755, "epoch": 5828} {"train_loss": -27.371564865112305, "global_step": 483756, "epoch": 5828} {"train_loss": -27.34393310546875, "global_step": 483757, "epoch": 5828} {"train_loss": -27.058013916015625, "global_step": 483758, "epoch": 5828} {"train_loss": -27.864484786987305, "global_step": 483759, "epoch": 5828} {"train_loss": -27.119037628173828, "global_step": 483760, "epoch": 5828} {"train_loss": -27.454801559448242, "global_step": 483761, "epoch": 5828} {"train_loss": -27.312503814697266, "global_step": 483762, "epoch": 5828} {"train_loss": -27.4038143157959, "global_step": 483763, "epoch": 5828} {"train_loss": -27.7205867767334, "global_step": 483764, "epoch": 5828} {"train_loss": -27.299604415893555, "global_step": 483765, "epoch": 5828} {"train_loss": -27.525793075561523, "global_step": 483766, "epoch": 5828} {"train_loss": -27.824857711791992, "global_step": 483767, "epoch": 5828} {"train_loss": -27.32602310180664, "global_step": 483768, "epoch": 5828} {"train_loss": -27.6680908203125, "global_step": 483769, "epoch": 5828} {"train_loss": -27.452451705932617, "global_step": 483770, "epoch": 5828} {"train_loss": -27.49741554260254, "global_step": 483771, "epoch": 5828} {"train_loss": -27.21759605407715, "global_step": 483772, "epoch": 5828} {"train_loss": -27.208087921142578, "global_step": 483773, "epoch": 5828} {"train_loss": -27.547119140625, "global_step": 483774, "epoch": 5828} {"train_loss": -27.660160064697266, "global_step": 483775, "epoch": 5828} {"train_loss": -27.3641300201416, "global_step": 483776, "epoch": 5828} {"train_loss": -27.381011962890625, "global_step": 483777, "epoch": 5828} {"train_loss": -27.279409408569336, "global_step": 483778, "epoch": 5828} {"train_loss": -27.4620418548584, "global_step": 483779, "epoch": 5828} {"train_loss": -27.2692813873291, "global_step": 483780, "epoch": 5828} {"train_loss": -27.17880630493164, "global_step": 483781, "epoch": 5828} {"train_loss": -27.668859481811523, "global_step": 483782, "epoch": 5828} {"train_loss": -27.697534561157227, "global_step": 483783, "epoch": 5828} {"train_loss": -27.0119571685791, "global_step": 483784, "epoch": 5828} {"train_loss": -26.91876792907715, "global_step": 483785, "epoch": 5828} {"train_loss": -26.933216094970703, "global_step": 483786, "epoch": 5828} {"train_loss": -27.464933395385742, "global_step": 483787, "epoch": 5828} {"train_loss": -26.91517448425293, "global_step": 483788, "epoch": 5828} {"train_loss": -27.422000885009766, "global_step": 483789, "epoch": 5828} {"train_loss": -27.429279327392578, "global_step": 483790, "epoch": 5828} {"train_loss": -27.557910919189453, "global_step": 483791, "epoch": 5828} {"train_loss": -27.010894775390625, "global_step": 483792, "epoch": 5828} {"train_loss": -27.0146541595459, "global_step": 483793, "epoch": 5828} {"train_loss": -27.578418731689453, "global_step": 483794, "epoch": 5828} {"train_loss": -27.025842666625977, "global_step": 483795, "epoch": 5828} {"train_loss": -27.352697372436523, "global_step": 483796, "epoch": 5828} {"train_loss": -27.175067901611328, "global_step": 483797, "epoch": 5828} {"train_loss": -26.81331443786621, "global_step": 483798, "epoch": 5828} {"train_loss": -27.175535202026367, "global_step": 483799, "epoch": 5828} {"train_loss": -27.216922760009766, "global_step": 483800, "epoch": 5828} {"train_loss": -27.32940673828125, "global_step": 483801, "epoch": 5828} {"train_loss": -26.828466415405273, "global_step": 483802, "epoch": 5828} {"train_loss": -26.976831436157227, "global_step": 483803, "epoch": 5828} {"train_loss": -27.33424949645996, "global_step": 483804, "epoch": 5828} {"train_loss": -27.130224227905273, "global_step": 483805, "epoch": 5828} {"train_loss": -27.131494338253894, "global_step": 483806, "epoch": 5828, "val_loss": 6536285.0} {"train_loss": -26.975839614868164, "global_step": 483807, "epoch": 5829} {"train_loss": -26.66802406311035, "global_step": 483808, "epoch": 5829} {"train_loss": -27.187788009643555, "global_step": 483809, "epoch": 5829} {"train_loss": -27.08563804626465, "global_step": 483810, "epoch": 5829} {"train_loss": -26.784839630126953, "global_step": 483811, "epoch": 5829} {"train_loss": -26.66779899597168, "global_step": 483812, "epoch": 5829} {"train_loss": -26.760290145874023, "global_step": 483813, "epoch": 5829} {"train_loss": -26.609628677368164, "global_step": 483814, "epoch": 5829} {"train_loss": -26.992115020751953, "global_step": 483815, "epoch": 5829} {"train_loss": -26.76633071899414, "global_step": 483816, "epoch": 5829} {"train_loss": -26.77869987487793, "global_step": 483817, "epoch": 5829} {"train_loss": -26.620023727416992, "global_step": 483818, "epoch": 5829} {"train_loss": -27.3614501953125, "global_step": 483819, "epoch": 5829} {"train_loss": -26.78323745727539, "global_step": 483820, "epoch": 5829} {"train_loss": -26.965795516967773, "global_step": 483821, "epoch": 5829} {"train_loss": -27.050451278686523, "global_step": 483822, "epoch": 5829} {"train_loss": -26.803726196289062, "global_step": 483823, "epoch": 5829} {"train_loss": -27.008920669555664, "global_step": 483824, "epoch": 5829} {"train_loss": -27.23443603515625, "global_step": 483825, "epoch": 5829} {"train_loss": -27.01222038269043, "global_step": 483826, "epoch": 5829} {"train_loss": -27.288244247436523, "global_step": 483827, "epoch": 5829} {"train_loss": -27.1578311920166, "global_step": 483828, "epoch": 5829} {"train_loss": -27.346210479736328, "global_step": 483829, "epoch": 5829} {"train_loss": -27.453378677368164, "global_step": 483830, "epoch": 5829} {"train_loss": -27.166156768798828, "global_step": 483831, "epoch": 5829} {"train_loss": -27.28814697265625, "global_step": 483832, "epoch": 5829} {"train_loss": -26.959211349487305, "global_step": 483833, "epoch": 5829} {"train_loss": -27.49163246154785, "global_step": 483834, "epoch": 5829} {"train_loss": -27.03692054748535, "global_step": 483835, "epoch": 5829} {"train_loss": -27.1635684967041, "global_step": 483836, "epoch": 5829} {"train_loss": -27.046905517578125, "global_step": 483837, "epoch": 5829} {"train_loss": -27.403202056884766, "global_step": 483838, "epoch": 5829} {"train_loss": -27.0677490234375, "global_step": 483839, "epoch": 5829} {"train_loss": -27.0589656829834, "global_step": 483840, "epoch": 5829} {"train_loss": -27.23434829711914, "global_step": 483841, "epoch": 5829} {"train_loss": -27.429960250854492, "global_step": 483842, "epoch": 5829} {"train_loss": -27.288251876831055, "global_step": 483843, "epoch": 5829} {"train_loss": -27.471771240234375, "global_step": 483844, "epoch": 5829} {"train_loss": -27.149744033813477, "global_step": 483845, "epoch": 5829} {"train_loss": -27.664554595947266, "global_step": 483846, "epoch": 5829} {"train_loss": -27.403034210205078, "global_step": 483847, "epoch": 5829} {"train_loss": -27.15095329284668, "global_step": 483848, "epoch": 5829} {"train_loss": -27.577665328979492, "global_step": 483849, "epoch": 5829} {"train_loss": -27.516162872314453, "global_step": 483850, "epoch": 5829} {"train_loss": -27.538711547851562, "global_step": 483851, "epoch": 5829} {"train_loss": -27.30293083190918, "global_step": 483852, "epoch": 5829} {"train_loss": -27.479028701782227, "global_step": 483853, "epoch": 5829} {"train_loss": -27.834714889526367, "global_step": 483854, "epoch": 5829} {"train_loss": -27.535797119140625, "global_step": 483855, "epoch": 5829} {"train_loss": -27.24957275390625, "global_step": 483856, "epoch": 5829} {"train_loss": -27.5225772857666, "global_step": 483857, "epoch": 5829} {"train_loss": -27.454015731811523, "global_step": 483858, "epoch": 5829} {"train_loss": -27.454004287719727, "global_step": 483859, "epoch": 5829} {"train_loss": -26.948400497436523, "global_step": 483860, "epoch": 5829} {"train_loss": -27.070770263671875, "global_step": 483861, "epoch": 5829} {"train_loss": -26.66292381286621, "global_step": 483862, "epoch": 5829} {"train_loss": -26.16781997680664, "global_step": 483863, "epoch": 5829} {"train_loss": -27.02126121520996, "global_step": 483864, "epoch": 5829} {"train_loss": -27.26763343811035, "global_step": 483865, "epoch": 5829} {"train_loss": -26.908796310424805, "global_step": 483866, "epoch": 5829} {"train_loss": -26.182086944580078, "global_step": 483867, "epoch": 5829} {"train_loss": -26.897974014282227, "global_step": 483868, "epoch": 5829} {"train_loss": -26.94666862487793, "global_step": 483869, "epoch": 5829} {"train_loss": -27.134906768798828, "global_step": 483870, "epoch": 5829} {"train_loss": -26.822553634643555, "global_step": 483871, "epoch": 5829} {"train_loss": -27.41509437561035, "global_step": 483872, "epoch": 5829} {"train_loss": -27.109121322631836, "global_step": 483873, "epoch": 5829} {"train_loss": -26.9116153717041, "global_step": 483874, "epoch": 5829} {"train_loss": -27.186304092407227, "global_step": 483875, "epoch": 5829} {"train_loss": -27.25251579284668, "global_step": 483876, "epoch": 5829} {"train_loss": -27.2618465423584, "global_step": 483877, "epoch": 5829} {"train_loss": -27.147043228149414, "global_step": 483878, "epoch": 5829} {"train_loss": -27.38728141784668, "global_step": 483879, "epoch": 5829} {"train_loss": -27.24407386779785, "global_step": 483880, "epoch": 5829} {"train_loss": -26.941577911376953, "global_step": 483881, "epoch": 5829} {"train_loss": -27.404794692993164, "global_step": 483882, "epoch": 5829} {"train_loss": -27.465713500976562, "global_step": 483883, "epoch": 5829} {"train_loss": -27.386266708374023, "global_step": 483884, "epoch": 5829} {"train_loss": -27.330564498901367, "global_step": 483885, "epoch": 5829} {"train_loss": -27.010419845581055, "global_step": 483886, "epoch": 5829} {"train_loss": -27.56546974182129, "global_step": 483887, "epoch": 5829} {"train_loss": -27.398670196533203, "global_step": 483888, "epoch": 5829} {"train_loss": -27.160258189741388, "global_step": 483889, "epoch": 5829, "val_loss": 6500753.0} {"train_loss": -26.6484375, "global_step": 483890, "epoch": 5830} {"train_loss": -26.709054946899414, "global_step": 483891, "epoch": 5830} {"train_loss": -27.194372177124023, "global_step": 483892, "epoch": 5830} {"train_loss": -26.65571403503418, "global_step": 483893, "epoch": 5830} {"train_loss": -26.7760066986084, "global_step": 483894, "epoch": 5830} {"train_loss": -26.56864356994629, "global_step": 483895, "epoch": 5830} {"train_loss": -26.724262237548828, "global_step": 483896, "epoch": 5830} {"train_loss": -26.728851318359375, "global_step": 483897, "epoch": 5830} {"train_loss": -26.985858917236328, "global_step": 483898, "epoch": 5830} {"train_loss": -26.6320743560791, "global_step": 483899, "epoch": 5830} {"train_loss": -26.771448135375977, "global_step": 483900, "epoch": 5830} {"train_loss": -26.51513671875, "global_step": 483901, "epoch": 5830} {"train_loss": -26.955280303955078, "global_step": 483902, "epoch": 5830} {"train_loss": -26.614700317382812, "global_step": 483903, "epoch": 5830} {"train_loss": -26.698104858398438, "global_step": 483904, "epoch": 5830} {"train_loss": -27.035619735717773, "global_step": 483905, "epoch": 5830} {"train_loss": -27.012319564819336, "global_step": 483906, "epoch": 5830} {"train_loss": -27.36978530883789, "global_step": 483907, "epoch": 5830} {"train_loss": -27.2015323638916, "global_step": 483908, "epoch": 5830} {"train_loss": -26.9936580657959, "global_step": 483909, "epoch": 5830} {"train_loss": -27.105009078979492, "global_step": 483910, "epoch": 5830} {"train_loss": -27.073713302612305, "global_step": 483911, "epoch": 5830} {"train_loss": -26.837148666381836, "global_step": 483912, "epoch": 5830} {"train_loss": -27.184293746948242, "global_step": 483913, "epoch": 5830} {"train_loss": -26.932483673095703, "global_step": 483914, "epoch": 5830} {"train_loss": -27.2063045501709, "global_step": 483915, "epoch": 5830} {"train_loss": -27.108789443969727, "global_step": 483916, "epoch": 5830} {"train_loss": -27.197275161743164, "global_step": 483917, "epoch": 5830} {"train_loss": -26.743011474609375, "global_step": 483918, "epoch": 5830} {"train_loss": -27.14164161682129, "global_step": 483919, "epoch": 5830} {"train_loss": -27.5975284576416, "global_step": 483920, "epoch": 5830} {"train_loss": -27.395605087280273, "global_step": 483921, "epoch": 5830} {"train_loss": -27.324018478393555, "global_step": 483922, "epoch": 5830} {"train_loss": -27.36578941345215, "global_step": 483923, "epoch": 5830} {"train_loss": -27.033405303955078, "global_step": 483924, "epoch": 5830} {"train_loss": -27.555419921875, "global_step": 483925, "epoch": 5830} {"train_loss": -27.507108688354492, "global_step": 483926, "epoch": 5830} {"train_loss": -27.290475845336914, "global_step": 483927, "epoch": 5830} {"train_loss": -27.604536056518555, "global_step": 483928, "epoch": 5830} {"train_loss": -27.54463005065918, "global_step": 483929, "epoch": 5830} {"train_loss": -27.712005615234375, "global_step": 483930, "epoch": 5830} {"train_loss": -27.4439640045166, "global_step": 483931, "epoch": 5830} {"train_loss": -27.449481964111328, "global_step": 483932, "epoch": 5830} {"train_loss": -27.565698623657227, "global_step": 483933, "epoch": 5830} {"train_loss": -27.173114776611328, "global_step": 483934, "epoch": 5830} {"train_loss": -27.324636459350586, "global_step": 483935, "epoch": 5830} {"train_loss": -27.56732177734375, "global_step": 483936, "epoch": 5830} {"train_loss": -27.204883575439453, "global_step": 483937, "epoch": 5830} {"train_loss": -27.22332191467285, "global_step": 483938, "epoch": 5830} {"train_loss": -27.47760009765625, "global_step": 483939, "epoch": 5830} {"train_loss": -27.389623641967773, "global_step": 483940, "epoch": 5830} {"train_loss": -27.466333389282227, "global_step": 483941, "epoch": 5830} {"train_loss": -27.219974517822266, "global_step": 483942, "epoch": 5830} {"train_loss": -27.485401153564453, "global_step": 483943, "epoch": 5830} {"train_loss": -27.86333656311035, "global_step": 483944, "epoch": 5830} {"train_loss": -27.769845962524414, "global_step": 483945, "epoch": 5830} {"train_loss": -27.4997615814209, "global_step": 483946, "epoch": 5830} {"train_loss": -27.061750411987305, "global_step": 483947, "epoch": 5830} {"train_loss": -26.93265151977539, "global_step": 483948, "epoch": 5830} {"train_loss": -26.823017120361328, "global_step": 483949, "epoch": 5830} {"train_loss": -27.026464462280273, "global_step": 483950, "epoch": 5830} {"train_loss": -27.370529174804688, "global_step": 483951, "epoch": 5830} {"train_loss": -27.348224639892578, "global_step": 483952, "epoch": 5830} {"train_loss": -26.827102661132812, "global_step": 483953, "epoch": 5830} {"train_loss": -26.928302764892578, "global_step": 483954, "epoch": 5830} {"train_loss": -27.287939071655273, "global_step": 483955, "epoch": 5830} {"train_loss": -27.11689567565918, "global_step": 483956, "epoch": 5830} {"train_loss": -27.01666831970215, "global_step": 483957, "epoch": 5830} {"train_loss": -27.150196075439453, "global_step": 483958, "epoch": 5830} {"train_loss": -27.285741806030273, "global_step": 483959, "epoch": 5830} {"train_loss": -27.265623092651367, "global_step": 483960, "epoch": 5830} {"train_loss": -27.123212814331055, "global_step": 483961, "epoch": 5830} {"train_loss": -27.31753921508789, "global_step": 483962, "epoch": 5830} {"train_loss": -27.181427001953125, "global_step": 483963, "epoch": 5830} {"train_loss": -27.319976806640625, "global_step": 483964, "epoch": 5830} {"train_loss": -27.221261978149414, "global_step": 483965, "epoch": 5830} {"train_loss": -26.94886589050293, "global_step": 483966, "epoch": 5830} {"train_loss": -27.2039737701416, "global_step": 483967, "epoch": 5830} {"train_loss": -27.093048095703125, "global_step": 483968, "epoch": 5830} {"train_loss": -27.24277687072754, "global_step": 483969, "epoch": 5830} {"train_loss": -27.43073081970215, "global_step": 483970, "epoch": 5830} {"train_loss": -27.41938591003418, "global_step": 483971, "epoch": 5830} {"train_loss": -27.180287096873823, "global_step": 483972, "epoch": 5830, "val_loss": 6601580.0} {"train_loss": -26.632726669311523, "global_step": 483973, "epoch": 5831} {"train_loss": -26.811704635620117, "global_step": 483974, "epoch": 5831} {"train_loss": -26.879056930541992, "global_step": 483975, "epoch": 5831} {"train_loss": -27.09064292907715, "global_step": 483976, "epoch": 5831} {"train_loss": -27.005395889282227, "global_step": 483977, "epoch": 5831} {"train_loss": -26.584980010986328, "global_step": 483978, "epoch": 5831} {"train_loss": -26.789398193359375, "global_step": 483979, "epoch": 5831} {"train_loss": -27.018964767456055, "global_step": 483980, "epoch": 5831} {"train_loss": -26.520877838134766, "global_step": 483981, "epoch": 5831} {"train_loss": -27.115936279296875, "global_step": 483982, "epoch": 5831} {"train_loss": -26.793075561523438, "global_step": 483983, "epoch": 5831} {"train_loss": -26.990819931030273, "global_step": 483984, "epoch": 5831} {"train_loss": -27.1950626373291, "global_step": 483985, "epoch": 5831} {"train_loss": -27.242923736572266, "global_step": 483986, "epoch": 5831} {"train_loss": -27.079730987548828, "global_step": 483987, "epoch": 5831} {"train_loss": -27.19403076171875, "global_step": 483988, "epoch": 5831} {"train_loss": -26.707138061523438, "global_step": 483989, "epoch": 5831} {"train_loss": -27.091764450073242, "global_step": 483990, "epoch": 5831} {"train_loss": -27.465978622436523, "global_step": 483991, "epoch": 5831} {"train_loss": -27.081335067749023, "global_step": 483992, "epoch": 5831} {"train_loss": -27.410816192626953, "global_step": 483993, "epoch": 5831} {"train_loss": -27.332685470581055, "global_step": 483994, "epoch": 5831} {"train_loss": -27.619665145874023, "global_step": 483995, "epoch": 5831} {"train_loss": -27.14871597290039, "global_step": 483996, "epoch": 5831} {"train_loss": -27.243261337280273, "global_step": 483997, "epoch": 5831} {"train_loss": -27.5802001953125, "global_step": 483998, "epoch": 5831} {"train_loss": -27.496387481689453, "global_step": 483999, "epoch": 5831} {"train_loss": -27.559473037719727, "global_step": 484000, "epoch": 5831} {"train_loss": -27.4249267578125, "global_step": 484001, "epoch": 5831} {"train_loss": -27.49146842956543, "global_step": 484002, "epoch": 5831} {"train_loss": -27.31868553161621, "global_step": 484003, "epoch": 5831} {"train_loss": -27.222848892211914, "global_step": 484004, "epoch": 5831} {"train_loss": -27.44091796875, "global_step": 484005, "epoch": 5831} {"train_loss": -27.13272476196289, "global_step": 484006, "epoch": 5831} {"train_loss": -27.13067626953125, "global_step": 484007, "epoch": 5831} {"train_loss": -26.8880615234375, "global_step": 484008, "epoch": 5831} {"train_loss": -27.58588981628418, "global_step": 484009, "epoch": 5831} {"train_loss": -27.544300079345703, "global_step": 484010, "epoch": 5831} {"train_loss": -27.238855361938477, "global_step": 484011, "epoch": 5831} {"train_loss": -27.39579200744629, "global_step": 484012, "epoch": 5831} {"train_loss": -26.891576766967773, "global_step": 484013, "epoch": 5831} {"train_loss": -27.47393226623535, "global_step": 484014, "epoch": 5831} {"train_loss": -27.344141006469727, "global_step": 484015, "epoch": 5831} {"train_loss": -27.52742576599121, "global_step": 484016, "epoch": 5831} {"train_loss": -27.3850040435791, "global_step": 484017, "epoch": 5831} {"train_loss": -27.232099533081055, "global_step": 484018, "epoch": 5831} {"train_loss": -27.05616569519043, "global_step": 484019, "epoch": 5831} {"train_loss": -27.194067001342773, "global_step": 484020, "epoch": 5831} {"train_loss": -27.757062911987305, "global_step": 484021, "epoch": 5831} {"train_loss": -27.5236759185791, "global_step": 484022, "epoch": 5831} {"train_loss": -27.948974609375, "global_step": 484023, "epoch": 5831} {"train_loss": -27.149829864501953, "global_step": 484024, "epoch": 5831} {"train_loss": -26.686262130737305, "global_step": 484025, "epoch": 5831} {"train_loss": -26.9392147064209, "global_step": 484026, "epoch": 5831} {"train_loss": -27.19091796875, "global_step": 484027, "epoch": 5831} {"train_loss": -27.2518367767334, "global_step": 484028, "epoch": 5831} {"train_loss": -27.304601669311523, "global_step": 484029, "epoch": 5831} {"train_loss": -27.348230361938477, "global_step": 484030, "epoch": 5831} {"train_loss": -27.533878326416016, "global_step": 484031, "epoch": 5831} {"train_loss": -27.352508544921875, "global_step": 484032, "epoch": 5831} {"train_loss": -27.248754501342773, "global_step": 484033, "epoch": 5831} {"train_loss": -27.113073348999023, "global_step": 484034, "epoch": 5831} {"train_loss": -27.343917846679688, "global_step": 484035, "epoch": 5831} {"train_loss": -27.47747802734375, "global_step": 484036, "epoch": 5831} {"train_loss": -27.1688289642334, "global_step": 484037, "epoch": 5831} {"train_loss": -27.25809669494629, "global_step": 484038, "epoch": 5831} {"train_loss": -27.091388702392578, "global_step": 484039, "epoch": 5831} {"train_loss": -27.014829635620117, "global_step": 484040, "epoch": 5831} {"train_loss": -26.9295654296875, "global_step": 484041, "epoch": 5831} {"train_loss": -27.183774948120117, "global_step": 484042, "epoch": 5831} {"train_loss": -27.564111709594727, "global_step": 484043, "epoch": 5831} {"train_loss": -27.24884605407715, "global_step": 484044, "epoch": 5831} {"train_loss": -27.055150985717773, "global_step": 484045, "epoch": 5831} {"train_loss": -26.589405059814453, "global_step": 484046, "epoch": 5831} {"train_loss": -26.31732177734375, "global_step": 484047, "epoch": 5831} {"train_loss": -26.766077041625977, "global_step": 484048, "epoch": 5831} {"train_loss": -27.3311824798584, "global_step": 484049, "epoch": 5831} {"train_loss": -26.75640296936035, "global_step": 484050, "epoch": 5831} {"train_loss": -27.3203125, "global_step": 484051, "epoch": 5831} {"train_loss": -26.788543701171875, "global_step": 484052, "epoch": 5831} {"train_loss": -26.86258888244629, "global_step": 484053, "epoch": 5831} {"train_loss": -27.17612648010254, "global_step": 484054, "epoch": 5831} {"train_loss": -27.17702309482069, "global_step": 484055, "epoch": 5831, "val_loss": 6483425.0} {"train_loss": -26.9808406829834, "global_step": 484056, "epoch": 5832} {"train_loss": -26.5703125, "global_step": 484057, "epoch": 5832} {"train_loss": -27.15277099609375, "global_step": 484058, "epoch": 5832} {"train_loss": -26.835676193237305, "global_step": 484059, "epoch": 5832} {"train_loss": -26.941654205322266, "global_step": 484060, "epoch": 5832} {"train_loss": -26.47108268737793, "global_step": 484061, "epoch": 5832} {"train_loss": -26.596948623657227, "global_step": 484062, "epoch": 5832} {"train_loss": -26.84846305847168, "global_step": 484063, "epoch": 5832} {"train_loss": -26.766576766967773, "global_step": 484064, "epoch": 5832} {"train_loss": -26.988378524780273, "global_step": 484065, "epoch": 5832} {"train_loss": -26.756689071655273, "global_step": 484066, "epoch": 5832} {"train_loss": -26.814477920532227, "global_step": 484067, "epoch": 5832} {"train_loss": -26.759565353393555, "global_step": 484068, "epoch": 5832} {"train_loss": -27.148202896118164, "global_step": 484069, "epoch": 5832} {"train_loss": -26.91339683532715, "global_step": 484070, "epoch": 5832} {"train_loss": -26.75684928894043, "global_step": 484071, "epoch": 5832} {"train_loss": -26.960580825805664, "global_step": 484072, "epoch": 5832} {"train_loss": -26.889068603515625, "global_step": 484073, "epoch": 5832} {"train_loss": -26.7276554107666, "global_step": 484074, "epoch": 5832} {"train_loss": -26.4884033203125, "global_step": 484075, "epoch": 5832} {"train_loss": -26.8753662109375, "global_step": 484076, "epoch": 5832} {"train_loss": -26.765701293945312, "global_step": 484077, "epoch": 5832} {"train_loss": -27.242053985595703, "global_step": 484078, "epoch": 5832} {"train_loss": -26.587522506713867, "global_step": 484079, "epoch": 5832} {"train_loss": -26.950653076171875, "global_step": 484080, "epoch": 5832} {"train_loss": -26.783472061157227, "global_step": 484081, "epoch": 5832} {"train_loss": -26.680755615234375, "global_step": 484082, "epoch": 5832} {"train_loss": -27.133031845092773, "global_step": 484083, "epoch": 5832} {"train_loss": -27.057178497314453, "global_step": 484084, "epoch": 5832} {"train_loss": -27.075180053710938, "global_step": 484085, "epoch": 5832} {"train_loss": -27.137760162353516, "global_step": 484086, "epoch": 5832} {"train_loss": -27.0188045501709, "global_step": 484087, "epoch": 5832} {"train_loss": -27.194259643554688, "global_step": 484088, "epoch": 5832} {"train_loss": -27.244306564331055, "global_step": 484089, "epoch": 5832} {"train_loss": -27.143402099609375, "global_step": 484090, "epoch": 5832} {"train_loss": -27.080738067626953, "global_step": 484091, "epoch": 5832} {"train_loss": -27.47149658203125, "global_step": 484092, "epoch": 5832} {"train_loss": -26.925485610961914, "global_step": 484093, "epoch": 5832} {"train_loss": -27.40262222290039, "global_step": 484094, "epoch": 5832} {"train_loss": -27.35017967224121, "global_step": 484095, "epoch": 5832} {"train_loss": -26.918106079101562, "global_step": 484096, "epoch": 5832} {"train_loss": -27.20131492614746, "global_step": 484097, "epoch": 5832} {"train_loss": -27.388751983642578, "global_step": 484098, "epoch": 5832} {"train_loss": -27.05142593383789, "global_step": 484099, "epoch": 5832} {"train_loss": -27.30686378479004, "global_step": 484100, "epoch": 5832} {"train_loss": -27.4492130279541, "global_step": 484101, "epoch": 5832} {"train_loss": -27.71137809753418, "global_step": 484102, "epoch": 5832} {"train_loss": -26.85114860534668, "global_step": 484103, "epoch": 5832} {"train_loss": -27.3707218170166, "global_step": 484104, "epoch": 5832} {"train_loss": -27.41897964477539, "global_step": 484105, "epoch": 5832} {"train_loss": -27.522619247436523, "global_step": 484106, "epoch": 5832} {"train_loss": -27.5212345123291, "global_step": 484107, "epoch": 5832} {"train_loss": -27.418622970581055, "global_step": 484108, "epoch": 5832} {"train_loss": -27.40082359313965, "global_step": 484109, "epoch": 5832} {"train_loss": -27.22993278503418, "global_step": 484110, "epoch": 5832} {"train_loss": -27.30217933654785, "global_step": 484111, "epoch": 5832} {"train_loss": -27.38551139831543, "global_step": 484112, "epoch": 5832} {"train_loss": -27.463327407836914, "global_step": 484113, "epoch": 5832} {"train_loss": -26.998632431030273, "global_step": 484114, "epoch": 5832} {"train_loss": -27.301422119140625, "global_step": 484115, "epoch": 5832} {"train_loss": -27.279056549072266, "global_step": 484116, "epoch": 5832} {"train_loss": -27.43023681640625, "global_step": 484117, "epoch": 5832} {"train_loss": -27.4495792388916, "global_step": 484118, "epoch": 5832} {"train_loss": -27.338260650634766, "global_step": 484119, "epoch": 5832} {"train_loss": -27.29886245727539, "global_step": 484120, "epoch": 5832} {"train_loss": -26.98203468322754, "global_step": 484121, "epoch": 5832} {"train_loss": -27.40593910217285, "global_step": 484122, "epoch": 5832} {"train_loss": -27.412988662719727, "global_step": 484123, "epoch": 5832} {"train_loss": -27.7166748046875, "global_step": 484124, "epoch": 5832} {"train_loss": -27.464508056640625, "global_step": 484125, "epoch": 5832} {"train_loss": -27.532434463500977, "global_step": 484126, "epoch": 5832} {"train_loss": -27.4049072265625, "global_step": 484127, "epoch": 5832} {"train_loss": -27.215198516845703, "global_step": 484128, "epoch": 5832} {"train_loss": -27.571279525756836, "global_step": 484129, "epoch": 5832} {"train_loss": -27.27239418029785, "global_step": 484130, "epoch": 5832} {"train_loss": -27.223194122314453, "global_step": 484131, "epoch": 5832} {"train_loss": -27.463516235351562, "global_step": 484132, "epoch": 5832} {"train_loss": -27.807676315307617, "global_step": 484133, "epoch": 5832} {"train_loss": -27.4307804107666, "global_step": 484134, "epoch": 5832} {"train_loss": -27.494632720947266, "global_step": 484135, "epoch": 5832} {"train_loss": -26.982349395751953, "global_step": 484136, "epoch": 5832} {"train_loss": -27.231708526611328, "global_step": 484137, "epoch": 5832} {"train_loss": -27.151000539940522, "global_step": 484138, "epoch": 5832, "val_loss": 6549019.0} {"train_loss": -26.08199119567871, "global_step": 484139, "epoch": 5833} {"train_loss": -26.00559425354004, "global_step": 484140, "epoch": 5833} {"train_loss": -26.686908721923828, "global_step": 484141, "epoch": 5833} {"train_loss": -26.297956466674805, "global_step": 484142, "epoch": 5833} {"train_loss": -26.5897274017334, "global_step": 484143, "epoch": 5833} {"train_loss": -26.3386287689209, "global_step": 484144, "epoch": 5833} {"train_loss": -26.126453399658203, "global_step": 484145, "epoch": 5833} {"train_loss": -26.719945907592773, "global_step": 484146, "epoch": 5833} {"train_loss": -26.398733139038086, "global_step": 484147, "epoch": 5833} {"train_loss": -26.412933349609375, "global_step": 484148, "epoch": 5833} {"train_loss": -27.122983932495117, "global_step": 484149, "epoch": 5833} {"train_loss": -26.18958854675293, "global_step": 484150, "epoch": 5833} {"train_loss": -26.511930465698242, "global_step": 484151, "epoch": 5833} {"train_loss": -26.15301513671875, "global_step": 484152, "epoch": 5833} {"train_loss": -27.176959991455078, "global_step": 484153, "epoch": 5833} {"train_loss": -27.24672508239746, "global_step": 484154, "epoch": 5833} {"train_loss": -26.818017959594727, "global_step": 484155, "epoch": 5833} {"train_loss": -27.066205978393555, "global_step": 484156, "epoch": 5833} {"train_loss": -26.1803035736084, "global_step": 484157, "epoch": 5833} {"train_loss": -27.300994873046875, "global_step": 484158, "epoch": 5833} {"train_loss": -26.995019912719727, "global_step": 484159, "epoch": 5833} {"train_loss": -26.96194839477539, "global_step": 484160, "epoch": 5833} {"train_loss": -26.73797607421875, "global_step": 484161, "epoch": 5833} {"train_loss": -27.211576461791992, "global_step": 484162, "epoch": 5833} {"train_loss": -27.176122665405273, "global_step": 484163, "epoch": 5833} {"train_loss": -27.116422653198242, "global_step": 484164, "epoch": 5833} {"train_loss": -27.0627498626709, "global_step": 484165, "epoch": 5833} {"train_loss": -27.170242309570312, "global_step": 484166, "epoch": 5833} {"train_loss": -27.086761474609375, "global_step": 484167, "epoch": 5833} {"train_loss": -26.802845001220703, "global_step": 484168, "epoch": 5833} {"train_loss": -27.250762939453125, "global_step": 484169, "epoch": 5833} {"train_loss": -26.5645694732666, "global_step": 484170, "epoch": 5833} {"train_loss": -27.09503173828125, "global_step": 484171, "epoch": 5833} {"train_loss": -27.603351593017578, "global_step": 484172, "epoch": 5833} {"train_loss": -27.48223304748535, "global_step": 484173, "epoch": 5833} {"train_loss": -27.31770896911621, "global_step": 484174, "epoch": 5833} {"train_loss": -27.350601196289062, "global_step": 484175, "epoch": 5833} {"train_loss": -27.31182289123535, "global_step": 484176, "epoch": 5833} {"train_loss": -27.26914405822754, "global_step": 484177, "epoch": 5833} {"train_loss": -27.281787872314453, "global_step": 484178, "epoch": 5833} {"train_loss": -27.144811630249023, "global_step": 484179, "epoch": 5833} {"train_loss": -27.280439376831055, "global_step": 484180, "epoch": 5833} {"train_loss": -27.4031982421875, "global_step": 484181, "epoch": 5833} {"train_loss": -27.049224853515625, "global_step": 484182, "epoch": 5833} {"train_loss": -27.38568687438965, "global_step": 484183, "epoch": 5833} {"train_loss": -26.711828231811523, "global_step": 484184, "epoch": 5833} {"train_loss": -27.329824447631836, "global_step": 484185, "epoch": 5833} {"train_loss": -27.307605743408203, "global_step": 484186, "epoch": 5833} {"train_loss": -27.572301864624023, "global_step": 484187, "epoch": 5833} {"train_loss": -27.10349464416504, "global_step": 484188, "epoch": 5833} {"train_loss": -26.75064468383789, "global_step": 484189, "epoch": 5833} {"train_loss": -27.23841667175293, "global_step": 484190, "epoch": 5833} {"train_loss": -27.141510009765625, "global_step": 484191, "epoch": 5833} {"train_loss": -27.4093017578125, "global_step": 484192, "epoch": 5833} {"train_loss": -27.301010131835938, "global_step": 484193, "epoch": 5833} {"train_loss": -27.47930908203125, "global_step": 484194, "epoch": 5833} {"train_loss": -27.385211944580078, "global_step": 484195, "epoch": 5833} {"train_loss": -27.443124771118164, "global_step": 484196, "epoch": 5833} {"train_loss": -27.376073837280273, "global_step": 484197, "epoch": 5833} {"train_loss": -27.502527236938477, "global_step": 484198, "epoch": 5833} {"train_loss": -27.293725967407227, "global_step": 484199, "epoch": 5833} {"train_loss": -27.433807373046875, "global_step": 484200, "epoch": 5833} {"train_loss": -27.167158126831055, "global_step": 484201, "epoch": 5833} {"train_loss": -26.958356857299805, "global_step": 484202, "epoch": 5833} {"train_loss": -27.06617546081543, "global_step": 484203, "epoch": 5833} {"train_loss": -26.748443603515625, "global_step": 484204, "epoch": 5833} {"train_loss": -26.828794479370117, "global_step": 484205, "epoch": 5833} {"train_loss": -27.408008575439453, "global_step": 484206, "epoch": 5833} {"train_loss": -27.304492950439453, "global_step": 484207, "epoch": 5833} {"train_loss": -27.47829246520996, "global_step": 484208, "epoch": 5833} {"train_loss": -27.46416664123535, "global_step": 484209, "epoch": 5833} {"train_loss": -26.777801513671875, "global_step": 484210, "epoch": 5833} {"train_loss": -27.69805908203125, "global_step": 484211, "epoch": 5833} {"train_loss": -27.535619735717773, "global_step": 484212, "epoch": 5833} {"train_loss": -27.168670654296875, "global_step": 484213, "epoch": 5833} {"train_loss": -27.125045776367188, "global_step": 484214, "epoch": 5833} {"train_loss": -27.631759643554688, "global_step": 484215, "epoch": 5833} {"train_loss": -27.279834747314453, "global_step": 484216, "epoch": 5833} {"train_loss": -27.3145751953125, "global_step": 484217, "epoch": 5833} {"train_loss": -27.297550201416016, "global_step": 484218, "epoch": 5833} {"train_loss": -27.104284286499023, "global_step": 484219, "epoch": 5833} {"train_loss": -27.5136661529541, "global_step": 484220, "epoch": 5833} {"train_loss": -27.071825326207172, "global_step": 484221, "epoch": 5833, "val_loss": 6545742.0} {"train_loss": -25.835824966430664, "global_step": 484222, "epoch": 5834} {"train_loss": -26.18855094909668, "global_step": 484223, "epoch": 5834} {"train_loss": -26.64967155456543, "global_step": 484224, "epoch": 5834} {"train_loss": -25.807493209838867, "global_step": 484225, "epoch": 5834} {"train_loss": -26.46681785583496, "global_step": 484226, "epoch": 5834} {"train_loss": -25.94148063659668, "global_step": 484227, "epoch": 5834} {"train_loss": -26.4688720703125, "global_step": 484228, "epoch": 5834} {"train_loss": -26.82686424255371, "global_step": 484229, "epoch": 5834} {"train_loss": -26.232406616210938, "global_step": 484230, "epoch": 5834} {"train_loss": -26.461694717407227, "global_step": 484231, "epoch": 5834} {"train_loss": -26.04233169555664, "global_step": 484232, "epoch": 5834} {"train_loss": -26.770456314086914, "global_step": 484233, "epoch": 5834} {"train_loss": -26.640012741088867, "global_step": 484234, "epoch": 5834} {"train_loss": -26.702056884765625, "global_step": 484235, "epoch": 5834} {"train_loss": -26.936792373657227, "global_step": 484236, "epoch": 5834} {"train_loss": -26.81549644470215, "global_step": 484237, "epoch": 5834} {"train_loss": -26.42022132873535, "global_step": 484238, "epoch": 5834} {"train_loss": -26.807830810546875, "global_step": 484239, "epoch": 5834} {"train_loss": -26.812158584594727, "global_step": 484240, "epoch": 5834} {"train_loss": -26.895910263061523, "global_step": 484241, "epoch": 5834} {"train_loss": -26.98789405822754, "global_step": 484242, "epoch": 5834} {"train_loss": -26.57859230041504, "global_step": 484243, "epoch": 5834} {"train_loss": -27.0612850189209, "global_step": 484244, "epoch": 5834} {"train_loss": -26.844390869140625, "global_step": 484245, "epoch": 5834} {"train_loss": -27.09024429321289, "global_step": 484246, "epoch": 5834} {"train_loss": -26.656408309936523, "global_step": 484247, "epoch": 5834} {"train_loss": -27.215499877929688, "global_step": 484248, "epoch": 5834} {"train_loss": -26.686786651611328, "global_step": 484249, "epoch": 5834} {"train_loss": -27.12981605529785, "global_step": 484250, "epoch": 5834} {"train_loss": -27.15913200378418, "global_step": 484251, "epoch": 5834} {"train_loss": -27.29656982421875, "global_step": 484252, "epoch": 5834} {"train_loss": -26.94923973083496, "global_step": 484253, "epoch": 5834} {"train_loss": -27.009057998657227, "global_step": 484254, "epoch": 5834} {"train_loss": -27.326261520385742, "global_step": 484255, "epoch": 5834} {"train_loss": -27.400182723999023, "global_step": 484256, "epoch": 5834} {"train_loss": -26.83734703063965, "global_step": 484257, "epoch": 5834} {"train_loss": -27.2631778717041, "global_step": 484258, "epoch": 5834} {"train_loss": -27.497915267944336, "global_step": 484259, "epoch": 5834} {"train_loss": -27.213653564453125, "global_step": 484260, "epoch": 5834} {"train_loss": -27.14853286743164, "global_step": 484261, "epoch": 5834} {"train_loss": -27.048505783081055, "global_step": 484262, "epoch": 5834} {"train_loss": -27.41457176208496, "global_step": 484263, "epoch": 5834} {"train_loss": -27.603103637695312, "global_step": 484264, "epoch": 5834} {"train_loss": -27.324926376342773, "global_step": 484265, "epoch": 5834} {"train_loss": -27.551288604736328, "global_step": 484266, "epoch": 5834} {"train_loss": -27.12456703186035, "global_step": 484267, "epoch": 5834} {"train_loss": -27.351531982421875, "global_step": 484268, "epoch": 5834} {"train_loss": -27.34309196472168, "global_step": 484269, "epoch": 5834} {"train_loss": -26.874242782592773, "global_step": 484270, "epoch": 5834} {"train_loss": -27.818317413330078, "global_step": 484271, "epoch": 5834} {"train_loss": -27.171829223632812, "global_step": 484272, "epoch": 5834} {"train_loss": -27.14141845703125, "global_step": 484273, "epoch": 5834} {"train_loss": -27.338287353515625, "global_step": 484274, "epoch": 5834} {"train_loss": -27.294912338256836, "global_step": 484275, "epoch": 5834} {"train_loss": -27.456823348999023, "global_step": 484276, "epoch": 5834} {"train_loss": -26.85186767578125, "global_step": 484277, "epoch": 5834} {"train_loss": -26.69257164001465, "global_step": 484278, "epoch": 5834} {"train_loss": -25.746137619018555, "global_step": 484279, "epoch": 5834} {"train_loss": -25.21078872680664, "global_step": 484280, "epoch": 5834} {"train_loss": -27.029245376586914, "global_step": 484281, "epoch": 5834} {"train_loss": -26.482940673828125, "global_step": 484282, "epoch": 5834} {"train_loss": -26.448333740234375, "global_step": 484283, "epoch": 5834} {"train_loss": -26.940998077392578, "global_step": 484284, "epoch": 5834} {"train_loss": -26.96343421936035, "global_step": 484285, "epoch": 5834} {"train_loss": -26.46714210510254, "global_step": 484286, "epoch": 5834} {"train_loss": -27.158401489257812, "global_step": 484287, "epoch": 5834} {"train_loss": -26.91486930847168, "global_step": 484288, "epoch": 5834} {"train_loss": -26.823705673217773, "global_step": 484289, "epoch": 5834} {"train_loss": -27.6702938079834, "global_step": 484290, "epoch": 5834} {"train_loss": -27.028894424438477, "global_step": 484291, "epoch": 5834} {"train_loss": -26.85066032409668, "global_step": 484292, "epoch": 5834} {"train_loss": -27.2767391204834, "global_step": 484293, "epoch": 5834} {"train_loss": -27.385944366455078, "global_step": 484294, "epoch": 5834} {"train_loss": -26.943607330322266, "global_step": 484295, "epoch": 5834} {"train_loss": -27.044815063476562, "global_step": 484296, "epoch": 5834} {"train_loss": -27.411481857299805, "global_step": 484297, "epoch": 5834} {"train_loss": -27.07935905456543, "global_step": 484298, "epoch": 5834} {"train_loss": -27.187667846679688, "global_step": 484299, "epoch": 5834} {"train_loss": -27.192956924438477, "global_step": 484300, "epoch": 5834} {"train_loss": -27.39678955078125, "global_step": 484301, "epoch": 5834} {"train_loss": -27.40232276916504, "global_step": 484302, "epoch": 5834} {"train_loss": -27.413360595703125, "global_step": 484303, "epoch": 5834} {"train_loss": -26.932095539138977, "global_step": 484304, "epoch": 5834, "val_loss": 6455206.0} {"train_loss": -26.546661376953125, "global_step": 484305, "epoch": 5835} {"train_loss": -26.61931800842285, "global_step": 484306, "epoch": 5835} {"train_loss": -26.877307891845703, "global_step": 484307, "epoch": 5835} {"train_loss": -27.10780143737793, "global_step": 484308, "epoch": 5835} {"train_loss": -26.46306800842285, "global_step": 484309, "epoch": 5835} {"train_loss": -26.304052352905273, "global_step": 484310, "epoch": 5835} {"train_loss": -26.416934967041016, "global_step": 484311, "epoch": 5835} {"train_loss": -26.774311065673828, "global_step": 484312, "epoch": 5835} {"train_loss": -27.26242446899414, "global_step": 484313, "epoch": 5835} {"train_loss": -27.02825355529785, "global_step": 484314, "epoch": 5835} {"train_loss": -26.458154678344727, "global_step": 484315, "epoch": 5835} {"train_loss": -26.792327880859375, "global_step": 484316, "epoch": 5835} {"train_loss": -26.882221221923828, "global_step": 484317, "epoch": 5835} {"train_loss": -26.737524032592773, "global_step": 484318, "epoch": 5835} {"train_loss": -26.40169334411621, "global_step": 484319, "epoch": 5835} {"train_loss": -27.04970359802246, "global_step": 484320, "epoch": 5835} {"train_loss": -26.446386337280273, "global_step": 484321, "epoch": 5835} {"train_loss": -26.62994384765625, "global_step": 484322, "epoch": 5835} {"train_loss": -26.833770751953125, "global_step": 484323, "epoch": 5835} {"train_loss": -27.025421142578125, "global_step": 484324, "epoch": 5835} {"train_loss": -26.96827507019043, "global_step": 484325, "epoch": 5835} {"train_loss": -27.007556915283203, "global_step": 484326, "epoch": 5835} {"train_loss": -26.805316925048828, "global_step": 484327, "epoch": 5835} {"train_loss": -27.29633140563965, "global_step": 484328, "epoch": 5835} {"train_loss": -26.9254150390625, "global_step": 484329, "epoch": 5835} {"train_loss": -26.8903865814209, "global_step": 484330, "epoch": 5835} {"train_loss": -27.260517120361328, "global_step": 484331, "epoch": 5835} {"train_loss": -27.297306060791016, "global_step": 484332, "epoch": 5835} {"train_loss": -27.58635902404785, "global_step": 484333, "epoch": 5835} {"train_loss": -27.210355758666992, "global_step": 484334, "epoch": 5835} {"train_loss": -27.260883331298828, "global_step": 484335, "epoch": 5835} {"train_loss": -27.143285751342773, "global_step": 484336, "epoch": 5835} {"train_loss": -27.11634635925293, "global_step": 484337, "epoch": 5835} {"train_loss": -27.619190216064453, "global_step": 484338, "epoch": 5835} {"train_loss": -27.212736129760742, "global_step": 484339, "epoch": 5835} {"train_loss": -27.62140464782715, "global_step": 484340, "epoch": 5835} {"train_loss": -27.042322158813477, "global_step": 484341, "epoch": 5835} {"train_loss": -27.83037757873535, "global_step": 484342, "epoch": 5835} {"train_loss": -27.756317138671875, "global_step": 484343, "epoch": 5835} {"train_loss": -27.474679946899414, "global_step": 484344, "epoch": 5835} {"train_loss": -27.108367919921875, "global_step": 484345, "epoch": 5835} {"train_loss": -27.694477081298828, "global_step": 484346, "epoch": 5835} {"train_loss": -27.746469497680664, "global_step": 484347, "epoch": 5835} {"train_loss": -27.725940704345703, "global_step": 484348, "epoch": 5835} {"train_loss": -27.588760375976562, "global_step": 484349, "epoch": 5835} {"train_loss": -27.243764877319336, "global_step": 484350, "epoch": 5835} {"train_loss": -27.30459976196289, "global_step": 484351, "epoch": 5835} {"train_loss": -27.3372859954834, "global_step": 484352, "epoch": 5835} {"train_loss": -27.41777992248535, "global_step": 484353, "epoch": 5835} {"train_loss": -27.58001136779785, "global_step": 484354, "epoch": 5835} {"train_loss": -27.59868812561035, "global_step": 484355, "epoch": 5835} {"train_loss": -27.265600204467773, "global_step": 484356, "epoch": 5835} {"train_loss": -27.4594669342041, "global_step": 484357, "epoch": 5835} {"train_loss": -27.685998916625977, "global_step": 484358, "epoch": 5835} {"train_loss": -27.640783309936523, "global_step": 484359, "epoch": 5835} {"train_loss": -27.507678985595703, "global_step": 484360, "epoch": 5835} {"train_loss": -27.70221519470215, "global_step": 484361, "epoch": 5835} {"train_loss": -27.32954216003418, "global_step": 484362, "epoch": 5835} {"train_loss": -27.16411781311035, "global_step": 484363, "epoch": 5835} {"train_loss": -27.5495662689209, "global_step": 484364, "epoch": 5835} {"train_loss": -27.306293487548828, "global_step": 484365, "epoch": 5835} {"train_loss": -27.005056381225586, "global_step": 484366, "epoch": 5835} {"train_loss": -26.74319839477539, "global_step": 484367, "epoch": 5835} {"train_loss": -26.5274658203125, "global_step": 484368, "epoch": 5835} {"train_loss": -26.496570587158203, "global_step": 484369, "epoch": 5835} {"train_loss": -27.11222267150879, "global_step": 484370, "epoch": 5835} {"train_loss": -27.318212509155273, "global_step": 484371, "epoch": 5835} {"train_loss": -26.19679069519043, "global_step": 484372, "epoch": 5835} {"train_loss": -26.971899032592773, "global_step": 484373, "epoch": 5835} {"train_loss": -27.356836318969727, "global_step": 484374, "epoch": 5835} {"train_loss": -27.0273380279541, "global_step": 484375, "epoch": 5835} {"train_loss": -26.90289306640625, "global_step": 484376, "epoch": 5835} {"train_loss": -26.717329025268555, "global_step": 484377, "epoch": 5835} {"train_loss": -26.648107528686523, "global_step": 484378, "epoch": 5835} {"train_loss": -27.182861328125, "global_step": 484379, "epoch": 5835} {"train_loss": -26.90777015686035, "global_step": 484380, "epoch": 5835} {"train_loss": -27.396738052368164, "global_step": 484381, "epoch": 5835} {"train_loss": -27.397968292236328, "global_step": 484382, "epoch": 5835} {"train_loss": -26.54886245727539, "global_step": 484383, "epoch": 5835} {"train_loss": -26.919580459594727, "global_step": 484384, "epoch": 5835} {"train_loss": -27.25895118713379, "global_step": 484385, "epoch": 5835} {"train_loss": -27.047809600830078, "global_step": 484386, "epoch": 5835} {"train_loss": -27.113793591418897, "global_step": 484387, "epoch": 5835, "val_loss": 6518991.5} {"train_loss": -26.66755485534668, "global_step": 484388, "epoch": 5836} {"train_loss": -26.324996948242188, "global_step": 484389, "epoch": 5836} {"train_loss": -26.76141929626465, "global_step": 484390, "epoch": 5836} {"train_loss": -26.297168731689453, "global_step": 484391, "epoch": 5836} {"train_loss": -26.561132431030273, "global_step": 484392, "epoch": 5836} {"train_loss": -27.077177047729492, "global_step": 484393, "epoch": 5836} {"train_loss": -26.41834831237793, "global_step": 484394, "epoch": 5836} {"train_loss": -26.548181533813477, "global_step": 484395, "epoch": 5836} {"train_loss": -26.665800094604492, "global_step": 484396, "epoch": 5836} {"train_loss": -26.75935173034668, "global_step": 484397, "epoch": 5836} {"train_loss": -26.678647994995117, "global_step": 484398, "epoch": 5836} {"train_loss": -26.790897369384766, "global_step": 484399, "epoch": 5836} {"train_loss": -27.035388946533203, "global_step": 484400, "epoch": 5836} {"train_loss": -26.710010528564453, "global_step": 484401, "epoch": 5836} {"train_loss": -27.444351196289062, "global_step": 484402, "epoch": 5836} {"train_loss": -26.46518898010254, "global_step": 484403, "epoch": 5836} {"train_loss": -26.993671417236328, "global_step": 484404, "epoch": 5836} {"train_loss": -26.902524948120117, "global_step": 484405, "epoch": 5836} {"train_loss": -27.285358428955078, "global_step": 484406, "epoch": 5836} {"train_loss": -27.151187896728516, "global_step": 484407, "epoch": 5836} {"train_loss": -27.3835506439209, "global_step": 484408, "epoch": 5836} {"train_loss": -27.18001365661621, "global_step": 484409, "epoch": 5836} {"train_loss": -26.944284439086914, "global_step": 484410, "epoch": 5836} {"train_loss": -26.83169937133789, "global_step": 484411, "epoch": 5836} {"train_loss": -27.15254783630371, "global_step": 484412, "epoch": 5836} {"train_loss": -27.237180709838867, "global_step": 484413, "epoch": 5836} {"train_loss": -27.169775009155273, "global_step": 484414, "epoch": 5836} {"train_loss": -27.2890567779541, "global_step": 484415, "epoch": 5836} {"train_loss": -27.220434188842773, "global_step": 484416, "epoch": 5836} {"train_loss": -26.8507022857666, "global_step": 484417, "epoch": 5836} {"train_loss": -27.423908233642578, "global_step": 484418, "epoch": 5836} {"train_loss": -27.255651473999023, "global_step": 484419, "epoch": 5836} {"train_loss": -26.95037841796875, "global_step": 484420, "epoch": 5836} {"train_loss": -27.373111724853516, "global_step": 484421, "epoch": 5836} {"train_loss": -27.380817413330078, "global_step": 484422, "epoch": 5836} {"train_loss": -27.24454689025879, "global_step": 484423, "epoch": 5836} {"train_loss": -26.86514663696289, "global_step": 484424, "epoch": 5836} {"train_loss": -27.351552963256836, "global_step": 484425, "epoch": 5836} {"train_loss": -27.36932945251465, "global_step": 484426, "epoch": 5836} {"train_loss": -27.708051681518555, "global_step": 484427, "epoch": 5836} {"train_loss": -27.282642364501953, "global_step": 484428, "epoch": 5836} {"train_loss": -27.34503173828125, "global_step": 484429, "epoch": 5836} {"train_loss": -27.37282371520996, "global_step": 484430, "epoch": 5836} {"train_loss": -27.5714168548584, "global_step": 484431, "epoch": 5836} {"train_loss": -27.18570327758789, "global_step": 484432, "epoch": 5836} {"train_loss": -27.495655059814453, "global_step": 484433, "epoch": 5836} {"train_loss": -27.153369903564453, "global_step": 484434, "epoch": 5836} {"train_loss": -27.747833251953125, "global_step": 484435, "epoch": 5836} {"train_loss": -27.628870010375977, "global_step": 484436, "epoch": 5836} {"train_loss": -27.608057022094727, "global_step": 484437, "epoch": 5836} {"train_loss": -27.494205474853516, "global_step": 484438, "epoch": 5836} {"train_loss": -27.90252113342285, "global_step": 484439, "epoch": 5836} {"train_loss": -27.276586532592773, "global_step": 484440, "epoch": 5836} {"train_loss": -27.632251739501953, "global_step": 484441, "epoch": 5836} {"train_loss": -27.202489852905273, "global_step": 484442, "epoch": 5836} {"train_loss": -27.48832130432129, "global_step": 484443, "epoch": 5836} {"train_loss": -27.2934627532959, "global_step": 484444, "epoch": 5836} {"train_loss": -27.356943130493164, "global_step": 484445, "epoch": 5836} {"train_loss": -27.57816505432129, "global_step": 484446, "epoch": 5836} {"train_loss": -27.3540096282959, "global_step": 484447, "epoch": 5836} {"train_loss": -27.547338485717773, "global_step": 484448, "epoch": 5836} {"train_loss": -27.278884887695312, "global_step": 484449, "epoch": 5836} {"train_loss": -27.291095733642578, "global_step": 484450, "epoch": 5836} {"train_loss": -27.25530433654785, "global_step": 484451, "epoch": 5836} {"train_loss": -27.01336669921875, "global_step": 484452, "epoch": 5836} {"train_loss": -27.419696807861328, "global_step": 484453, "epoch": 5836} {"train_loss": -26.517013549804688, "global_step": 484454, "epoch": 5836} {"train_loss": -27.286956787109375, "global_step": 484455, "epoch": 5836} {"train_loss": -27.310083389282227, "global_step": 484456, "epoch": 5836} {"train_loss": -27.562711715698242, "global_step": 484457, "epoch": 5836} {"train_loss": -27.590030670166016, "global_step": 484458, "epoch": 5836} {"train_loss": -27.04986000061035, "global_step": 484459, "epoch": 5836} {"train_loss": -27.25056266784668, "global_step": 484460, "epoch": 5836} {"train_loss": -27.1595516204834, "global_step": 484461, "epoch": 5836} {"train_loss": -27.151554107666016, "global_step": 484462, "epoch": 5836} {"train_loss": -27.58216667175293, "global_step": 484463, "epoch": 5836} {"train_loss": -27.230670928955078, "global_step": 484464, "epoch": 5836} {"train_loss": -27.061710357666016, "global_step": 484465, "epoch": 5836} {"train_loss": -27.179147720336914, "global_step": 484466, "epoch": 5836} {"train_loss": -27.315765380859375, "global_step": 484467, "epoch": 5836} {"train_loss": -27.262781143188477, "global_step": 484468, "epoch": 5836} {"train_loss": -26.907947540283203, "global_step": 484469, "epoch": 5836} {"train_loss": -27.191715378359138, "global_step": 484470, "epoch": 5836, "val_loss": 6464013.5} {"train_loss": -26.084304809570312, "global_step": 484471, "epoch": 5837} {"train_loss": -26.979522705078125, "global_step": 484472, "epoch": 5837} {"train_loss": -26.774158477783203, "global_step": 484473, "epoch": 5837} {"train_loss": -26.73395347595215, "global_step": 484474, "epoch": 5837} {"train_loss": -26.842870712280273, "global_step": 484475, "epoch": 5837} {"train_loss": -26.224863052368164, "global_step": 484476, "epoch": 5837} {"train_loss": -27.247541427612305, "global_step": 484477, "epoch": 5837} {"train_loss": -26.719165802001953, "global_step": 484478, "epoch": 5837} {"train_loss": -27.160297393798828, "global_step": 484479, "epoch": 5837} {"train_loss": -26.669677734375, "global_step": 484480, "epoch": 5837} {"train_loss": -26.92634391784668, "global_step": 484481, "epoch": 5837} {"train_loss": -26.791290283203125, "global_step": 484482, "epoch": 5837} {"train_loss": -26.831228256225586, "global_step": 484483, "epoch": 5837} {"train_loss": -27.05342674255371, "global_step": 484484, "epoch": 5837} {"train_loss": -27.4887638092041, "global_step": 484485, "epoch": 5837} {"train_loss": -27.106769561767578, "global_step": 484486, "epoch": 5837} {"train_loss": -27.123762130737305, "global_step": 484487, "epoch": 5837} {"train_loss": -27.306049346923828, "global_step": 484488, "epoch": 5837} {"train_loss": -27.460540771484375, "global_step": 484489, "epoch": 5837} {"train_loss": -27.15028953552246, "global_step": 484490, "epoch": 5837} {"train_loss": -26.68560791015625, "global_step": 484491, "epoch": 5837} {"train_loss": -27.207197189331055, "global_step": 484492, "epoch": 5837} {"train_loss": -26.793149948120117, "global_step": 484493, "epoch": 5837} {"train_loss": -27.151966094970703, "global_step": 484494, "epoch": 5837} {"train_loss": -27.260211944580078, "global_step": 484495, "epoch": 5837} {"train_loss": -26.987218856811523, "global_step": 484496, "epoch": 5837} {"train_loss": -27.11634635925293, "global_step": 484497, "epoch": 5837} {"train_loss": -26.913776397705078, "global_step": 484498, "epoch": 5837} {"train_loss": -27.371719360351562, "global_step": 484499, "epoch": 5837} {"train_loss": -27.435400009155273, "global_step": 484500, "epoch": 5837} {"train_loss": -27.09539794921875, "global_step": 484501, "epoch": 5837} {"train_loss": -27.364822387695312, "global_step": 484502, "epoch": 5837} {"train_loss": -27.2943172454834, "global_step": 484503, "epoch": 5837} {"train_loss": -27.49787712097168, "global_step": 484504, "epoch": 5837} {"train_loss": -27.578189849853516, "global_step": 484505, "epoch": 5837} {"train_loss": -27.115219116210938, "global_step": 484506, "epoch": 5837} {"train_loss": -27.19697380065918, "global_step": 484507, "epoch": 5837} {"train_loss": -27.535614013671875, "global_step": 484508, "epoch": 5837} {"train_loss": -27.04189109802246, "global_step": 484509, "epoch": 5837} {"train_loss": -27.15052604675293, "global_step": 484510, "epoch": 5837} {"train_loss": -27.370105743408203, "global_step": 484511, "epoch": 5837} {"train_loss": -27.264877319335938, "global_step": 484512, "epoch": 5837} {"train_loss": -27.31453514099121, "global_step": 484513, "epoch": 5837} {"train_loss": -27.331762313842773, "global_step": 484514, "epoch": 5837} {"train_loss": -27.370716094970703, "global_step": 484515, "epoch": 5837} {"train_loss": -27.423368453979492, "global_step": 484516, "epoch": 5837} {"train_loss": -27.688867568969727, "global_step": 484517, "epoch": 5837} {"train_loss": -27.617843627929688, "global_step": 484518, "epoch": 5837} {"train_loss": -27.312397003173828, "global_step": 484519, "epoch": 5837} {"train_loss": -26.932327270507812, "global_step": 484520, "epoch": 5837} {"train_loss": -27.335315704345703, "global_step": 484521, "epoch": 5837} {"train_loss": -27.509387969970703, "global_step": 484522, "epoch": 5837} {"train_loss": -27.41814613342285, "global_step": 484523, "epoch": 5837} {"train_loss": -27.23417091369629, "global_step": 484524, "epoch": 5837} {"train_loss": -27.19854164123535, "global_step": 484525, "epoch": 5837} {"train_loss": -27.096654891967773, "global_step": 484526, "epoch": 5837} {"train_loss": -27.33320426940918, "global_step": 484527, "epoch": 5837} {"train_loss": -27.777423858642578, "global_step": 484528, "epoch": 5837} {"train_loss": -27.6420955657959, "global_step": 484529, "epoch": 5837} {"train_loss": -27.047529220581055, "global_step": 484530, "epoch": 5837} {"train_loss": -27.400007247924805, "global_step": 484531, "epoch": 5837} {"train_loss": -27.464094161987305, "global_step": 484532, "epoch": 5837} {"train_loss": -27.195423126220703, "global_step": 484533, "epoch": 5837} {"train_loss": -27.333276748657227, "global_step": 484534, "epoch": 5837} {"train_loss": -27.39761734008789, "global_step": 484535, "epoch": 5837} {"train_loss": -27.256677627563477, "global_step": 484536, "epoch": 5837} {"train_loss": -27.166126251220703, "global_step": 484537, "epoch": 5837} {"train_loss": -27.323415756225586, "global_step": 484538, "epoch": 5837} {"train_loss": -27.280227661132812, "global_step": 484539, "epoch": 5837} {"train_loss": -26.669116973876953, "global_step": 484540, "epoch": 5837} {"train_loss": -26.768171310424805, "global_step": 484541, "epoch": 5837} {"train_loss": -27.131256103515625, "global_step": 484542, "epoch": 5837} {"train_loss": -26.7921199798584, "global_step": 484543, "epoch": 5837} {"train_loss": -26.715396881103516, "global_step": 484544, "epoch": 5837} {"train_loss": -27.109350204467773, "global_step": 484545, "epoch": 5837} {"train_loss": -27.203857421875, "global_step": 484546, "epoch": 5837} {"train_loss": -26.4106388092041, "global_step": 484547, "epoch": 5837} {"train_loss": -27.050451278686523, "global_step": 484548, "epoch": 5837} {"train_loss": -27.328718185424805, "global_step": 484549, "epoch": 5837} {"train_loss": -27.135486602783203, "global_step": 484550, "epoch": 5837} {"train_loss": -27.222827911376953, "global_step": 484551, "epoch": 5837} {"train_loss": -27.241485595703125, "global_step": 484552, "epoch": 5837} {"train_loss": -27.13890163007989, "global_step": 484553, "epoch": 5837, "val_loss": 6575343.0} {"train_loss": -26.93471336364746, "global_step": 484554, "epoch": 5838} {"train_loss": -26.705575942993164, "global_step": 484555, "epoch": 5838} {"train_loss": -26.9032039642334, "global_step": 484556, "epoch": 5838} {"train_loss": -26.719146728515625, "global_step": 484557, "epoch": 5838} {"train_loss": -26.99552345275879, "global_step": 484558, "epoch": 5838} {"train_loss": -26.7962703704834, "global_step": 484559, "epoch": 5838} {"train_loss": -27.0882511138916, "global_step": 484560, "epoch": 5838} {"train_loss": -27.00501823425293, "global_step": 484561, "epoch": 5838} {"train_loss": -27.086414337158203, "global_step": 484562, "epoch": 5838} {"train_loss": -27.009601593017578, "global_step": 484563, "epoch": 5838} {"train_loss": -27.021711349487305, "global_step": 484564, "epoch": 5838} {"train_loss": -27.150836944580078, "global_step": 484565, "epoch": 5838} {"train_loss": -26.96148109436035, "global_step": 484566, "epoch": 5838} {"train_loss": -26.964599609375, "global_step": 484567, "epoch": 5838} {"train_loss": -27.43352699279785, "global_step": 484568, "epoch": 5838} {"train_loss": -27.27545738220215, "global_step": 484569, "epoch": 5838} {"train_loss": -27.37740135192871, "global_step": 484570, "epoch": 5838} {"train_loss": -26.940343856811523, "global_step": 484571, "epoch": 5838} {"train_loss": -27.22199821472168, "global_step": 484572, "epoch": 5838} {"train_loss": -26.835514068603516, "global_step": 484573, "epoch": 5838} {"train_loss": -27.535449981689453, "global_step": 484574, "epoch": 5838} {"train_loss": -27.05059242248535, "global_step": 484575, "epoch": 5838} {"train_loss": -27.24881362915039, "global_step": 484576, "epoch": 5838} {"train_loss": -26.974241256713867, "global_step": 484577, "epoch": 5838} {"train_loss": -27.325397491455078, "global_step": 484578, "epoch": 5838} {"train_loss": -27.288467407226562, "global_step": 484579, "epoch": 5838} {"train_loss": -27.564477920532227, "global_step": 484580, "epoch": 5838} {"train_loss": -26.84673500061035, "global_step": 484581, "epoch": 5838} {"train_loss": -27.22600746154785, "global_step": 484582, "epoch": 5838} {"train_loss": -27.28094482421875, "global_step": 484583, "epoch": 5838} {"train_loss": -27.179534912109375, "global_step": 484584, "epoch": 5838} {"train_loss": -27.085058212280273, "global_step": 484585, "epoch": 5838} {"train_loss": -27.718841552734375, "global_step": 484586, "epoch": 5838} {"train_loss": -27.025739669799805, "global_step": 484587, "epoch": 5838} {"train_loss": -27.150836944580078, "global_step": 484588, "epoch": 5838} {"train_loss": -27.200666427612305, "global_step": 484589, "epoch": 5838} {"train_loss": -27.4134464263916, "global_step": 484590, "epoch": 5838} {"train_loss": -27.047948837280273, "global_step": 484591, "epoch": 5838} {"train_loss": -27.134382247924805, "global_step": 484592, "epoch": 5838} {"train_loss": -27.384979248046875, "global_step": 484593, "epoch": 5838} {"train_loss": -27.382787704467773, "global_step": 484594, "epoch": 5838} {"train_loss": -27.433027267456055, "global_step": 484595, "epoch": 5838} {"train_loss": -27.05970573425293, "global_step": 484596, "epoch": 5838} {"train_loss": -27.37763786315918, "global_step": 484597, "epoch": 5838} {"train_loss": -27.520832061767578, "global_step": 484598, "epoch": 5838} {"train_loss": -27.48408317565918, "global_step": 484599, "epoch": 5838} {"train_loss": -27.81178855895996, "global_step": 484600, "epoch": 5838} {"train_loss": -27.300708770751953, "global_step": 484601, "epoch": 5838} {"train_loss": -27.182281494140625, "global_step": 484602, "epoch": 5838} {"train_loss": -27.44468116760254, "global_step": 484603, "epoch": 5838} {"train_loss": -27.473968505859375, "global_step": 484604, "epoch": 5838} {"train_loss": -27.108963012695312, "global_step": 484605, "epoch": 5838} {"train_loss": -27.58612632751465, "global_step": 484606, "epoch": 5838} {"train_loss": -26.961444854736328, "global_step": 484607, "epoch": 5838} {"train_loss": -27.183698654174805, "global_step": 484608, "epoch": 5838} {"train_loss": -27.407276153564453, "global_step": 484609, "epoch": 5838} {"train_loss": -26.848928451538086, "global_step": 484610, "epoch": 5838} {"train_loss": -27.346282958984375, "global_step": 484611, "epoch": 5838} {"train_loss": -27.28466796875, "global_step": 484612, "epoch": 5838} {"train_loss": -27.659931182861328, "global_step": 484613, "epoch": 5838} {"train_loss": -27.3795166015625, "global_step": 484614, "epoch": 5838} {"train_loss": -27.0928897857666, "global_step": 484615, "epoch": 5838} {"train_loss": -27.13726234436035, "global_step": 484616, "epoch": 5838} {"train_loss": -27.2877140045166, "global_step": 484617, "epoch": 5838} {"train_loss": -26.69988441467285, "global_step": 484618, "epoch": 5838} {"train_loss": -27.3183650970459, "global_step": 484619, "epoch": 5838} {"train_loss": -27.455429077148438, "global_step": 484620, "epoch": 5838} {"train_loss": -27.630002975463867, "global_step": 484621, "epoch": 5838} {"train_loss": -27.274328231811523, "global_step": 484622, "epoch": 5838} {"train_loss": -27.5522518157959, "global_step": 484623, "epoch": 5838} {"train_loss": -27.428882598876953, "global_step": 484624, "epoch": 5838} {"train_loss": -27.38433837890625, "global_step": 484625, "epoch": 5838} {"train_loss": -27.4073543548584, "global_step": 484626, "epoch": 5838} {"train_loss": -27.550622940063477, "global_step": 484627, "epoch": 5838} {"train_loss": -27.23536491394043, "global_step": 484628, "epoch": 5838} {"train_loss": -27.619653701782227, "global_step": 484629, "epoch": 5838} {"train_loss": -27.35798454284668, "global_step": 484630, "epoch": 5838} {"train_loss": -27.50996208190918, "global_step": 484631, "epoch": 5838} {"train_loss": -27.69266700744629, "global_step": 484632, "epoch": 5838} {"train_loss": -27.362415313720703, "global_step": 484633, "epoch": 5838} {"train_loss": -27.272510528564453, "global_step": 484634, "epoch": 5838} {"train_loss": -27.166288375854492, "global_step": 484635, "epoch": 5838} {"train_loss": -27.249259305287556, "global_step": 484636, "epoch": 5838, "val_loss": 6462452.5} {"train_loss": -27.201269149780273, "global_step": 484637, "epoch": 5839} {"train_loss": -26.6752872467041, "global_step": 484638, "epoch": 5839} {"train_loss": -26.71796226501465, "global_step": 484639, "epoch": 5839} {"train_loss": -26.97002601623535, "global_step": 484640, "epoch": 5839} {"train_loss": -26.929004669189453, "global_step": 484641, "epoch": 5839} {"train_loss": -26.894699096679688, "global_step": 484642, "epoch": 5839} {"train_loss": -27.244186401367188, "global_step": 484643, "epoch": 5839} {"train_loss": -27.019575119018555, "global_step": 484644, "epoch": 5839} {"train_loss": -26.960973739624023, "global_step": 484645, "epoch": 5839} {"train_loss": -27.11939811706543, "global_step": 484646, "epoch": 5839} {"train_loss": -27.2711238861084, "global_step": 484647, "epoch": 5839} {"train_loss": -27.23127555847168, "global_step": 484648, "epoch": 5839} {"train_loss": -26.94927406311035, "global_step": 484649, "epoch": 5839} {"train_loss": -27.07000160217285, "global_step": 484650, "epoch": 5839} {"train_loss": -27.283065795898438, "global_step": 484651, "epoch": 5839} {"train_loss": -27.087223052978516, "global_step": 484652, "epoch": 5839} {"train_loss": -27.13591957092285, "global_step": 484653, "epoch": 5839} {"train_loss": -27.183185577392578, "global_step": 484654, "epoch": 5839} {"train_loss": -27.19874382019043, "global_step": 484655, "epoch": 5839} {"train_loss": -27.102277755737305, "global_step": 484656, "epoch": 5839} {"train_loss": -27.127246856689453, "global_step": 484657, "epoch": 5839} {"train_loss": -27.455900192260742, "global_step": 484658, "epoch": 5839} {"train_loss": -27.176593780517578, "global_step": 484659, "epoch": 5839} {"train_loss": -27.2789249420166, "global_step": 484660, "epoch": 5839} {"train_loss": -27.371185302734375, "global_step": 484661, "epoch": 5839} {"train_loss": -27.54445457458496, "global_step": 484662, "epoch": 5839} {"train_loss": -27.444965362548828, "global_step": 484663, "epoch": 5839} {"train_loss": -27.12152099609375, "global_step": 484664, "epoch": 5839} {"train_loss": -27.402652740478516, "global_step": 484665, "epoch": 5839} {"train_loss": -27.4595890045166, "global_step": 484666, "epoch": 5839} {"train_loss": -27.31500244140625, "global_step": 484667, "epoch": 5839} {"train_loss": -26.84205436706543, "global_step": 484668, "epoch": 5839} {"train_loss": -26.918441772460938, "global_step": 484669, "epoch": 5839} {"train_loss": -27.096548080444336, "global_step": 484670, "epoch": 5839} {"train_loss": -27.49462890625, "global_step": 484671, "epoch": 5839} {"train_loss": -27.2464656829834, "global_step": 484672, "epoch": 5839} {"train_loss": -26.9364013671875, "global_step": 484673, "epoch": 5839} {"train_loss": -27.3238525390625, "global_step": 484674, "epoch": 5839} {"train_loss": -27.354663848876953, "global_step": 484675, "epoch": 5839} {"train_loss": -27.301471710205078, "global_step": 484676, "epoch": 5839} {"train_loss": -27.1147403717041, "global_step": 484677, "epoch": 5839} {"train_loss": -27.248193740844727, "global_step": 484678, "epoch": 5839} {"train_loss": -27.554859161376953, "global_step": 484679, "epoch": 5839} {"train_loss": -27.60676383972168, "global_step": 484680, "epoch": 5839} {"train_loss": -27.314367294311523, "global_step": 484681, "epoch": 5839} {"train_loss": -27.61481285095215, "global_step": 484682, "epoch": 5839} {"train_loss": -27.218435287475586, "global_step": 484683, "epoch": 5839} {"train_loss": -27.46820640563965, "global_step": 484684, "epoch": 5839} {"train_loss": -27.390378952026367, "global_step": 484685, "epoch": 5839} {"train_loss": -27.137826919555664, "global_step": 484686, "epoch": 5839} {"train_loss": -27.088979721069336, "global_step": 484687, "epoch": 5839} {"train_loss": -27.41385841369629, "global_step": 484688, "epoch": 5839} {"train_loss": -27.810083389282227, "global_step": 484689, "epoch": 5839} {"train_loss": -27.567739486694336, "global_step": 484690, "epoch": 5839} {"train_loss": -27.499921798706055, "global_step": 484691, "epoch": 5839} {"train_loss": -27.172271728515625, "global_step": 484692, "epoch": 5839} {"train_loss": -27.27521324157715, "global_step": 484693, "epoch": 5839} {"train_loss": -27.01226806640625, "global_step": 484694, "epoch": 5839} {"train_loss": -26.601898193359375, "global_step": 484695, "epoch": 5839} {"train_loss": -26.74873161315918, "global_step": 484696, "epoch": 5839} {"train_loss": -26.762582778930664, "global_step": 484697, "epoch": 5839} {"train_loss": -25.76397132873535, "global_step": 484698, "epoch": 5839} {"train_loss": -24.81584930419922, "global_step": 484699, "epoch": 5839} {"train_loss": -26.853971481323242, "global_step": 484700, "epoch": 5839} {"train_loss": -26.127248764038086, "global_step": 484701, "epoch": 5839} {"train_loss": -26.4034481048584, "global_step": 484702, "epoch": 5839} {"train_loss": -25.761728286743164, "global_step": 484703, "epoch": 5839} {"train_loss": -26.896543502807617, "global_step": 484704, "epoch": 5839} {"train_loss": -26.37380027770996, "global_step": 484705, "epoch": 5839} {"train_loss": -26.56061363220215, "global_step": 484706, "epoch": 5839} {"train_loss": -26.784711837768555, "global_step": 484707, "epoch": 5839} {"train_loss": -26.93947410583496, "global_step": 484708, "epoch": 5839} {"train_loss": -26.78196144104004, "global_step": 484709, "epoch": 5839} {"train_loss": -26.832433700561523, "global_step": 484710, "epoch": 5839} {"train_loss": -26.906518936157227, "global_step": 484711, "epoch": 5839} {"train_loss": -26.868093490600586, "global_step": 484712, "epoch": 5839} {"train_loss": -26.780149459838867, "global_step": 484713, "epoch": 5839} {"train_loss": -26.828632354736328, "global_step": 484714, "epoch": 5839} {"train_loss": -27.175312042236328, "global_step": 484715, "epoch": 5839} {"train_loss": -26.885517120361328, "global_step": 484716, "epoch": 5839} {"train_loss": -26.836584091186523, "global_step": 484717, "epoch": 5839} {"train_loss": -27.029041290283203, "global_step": 484718, "epoch": 5839} {"train_loss": -27.057967840907086, "global_step": 484719, "epoch": 5839, "val_loss": 6496153.0} {"train_loss": -26.732858657836914, "global_step": 484720, "epoch": 5840} {"train_loss": -26.983747482299805, "global_step": 484721, "epoch": 5840} {"train_loss": -27.02446937561035, "global_step": 484722, "epoch": 5840} {"train_loss": -26.907346725463867, "global_step": 484723, "epoch": 5840} {"train_loss": -26.602575302124023, "global_step": 484724, "epoch": 5840} {"train_loss": -27.1480655670166, "global_step": 484725, "epoch": 5840} {"train_loss": -27.135440826416016, "global_step": 484726, "epoch": 5840} {"train_loss": -26.782018661499023, "global_step": 484727, "epoch": 5840} {"train_loss": -27.126134872436523, "global_step": 484728, "epoch": 5840} {"train_loss": -27.074560165405273, "global_step": 484729, "epoch": 5840} {"train_loss": -27.105178833007812, "global_step": 484730, "epoch": 5840} {"train_loss": -27.4368953704834, "global_step": 484731, "epoch": 5840} {"train_loss": -27.282257080078125, "global_step": 484732, "epoch": 5840} {"train_loss": -26.780109405517578, "global_step": 484733, "epoch": 5840} {"train_loss": -27.53879165649414, "global_step": 484734, "epoch": 5840} {"train_loss": -27.083789825439453, "global_step": 484735, "epoch": 5840} {"train_loss": -27.113971710205078, "global_step": 484736, "epoch": 5840} {"train_loss": -27.715368270874023, "global_step": 484737, "epoch": 5840} {"train_loss": -27.49995994567871, "global_step": 484738, "epoch": 5840} {"train_loss": -27.25758171081543, "global_step": 484739, "epoch": 5840} {"train_loss": -27.120630264282227, "global_step": 484740, "epoch": 5840} {"train_loss": -27.737781524658203, "global_step": 484741, "epoch": 5840} {"train_loss": -27.55194091796875, "global_step": 484742, "epoch": 5840} {"train_loss": -27.275434494018555, "global_step": 484743, "epoch": 5840} {"train_loss": -27.15117835998535, "global_step": 484744, "epoch": 5840} {"train_loss": -27.3868408203125, "global_step": 484745, "epoch": 5840} {"train_loss": -27.3800106048584, "global_step": 484746, "epoch": 5840} {"train_loss": -27.49945640563965, "global_step": 484747, "epoch": 5840} {"train_loss": -27.410511016845703, "global_step": 484748, "epoch": 5840} {"train_loss": -27.648839950561523, "global_step": 484749, "epoch": 5840} {"train_loss": -27.132978439331055, "global_step": 484750, "epoch": 5840} {"train_loss": -27.27153968811035, "global_step": 484751, "epoch": 5840} {"train_loss": -27.797210693359375, "global_step": 484752, "epoch": 5840} {"train_loss": -27.054502487182617, "global_step": 484753, "epoch": 5840} {"train_loss": -27.68446159362793, "global_step": 484754, "epoch": 5840} {"train_loss": -27.189685821533203, "global_step": 484755, "epoch": 5840} {"train_loss": -27.352787017822266, "global_step": 484756, "epoch": 5840} {"train_loss": -27.81728172302246, "global_step": 484757, "epoch": 5840} {"train_loss": -27.732868194580078, "global_step": 484758, "epoch": 5840} {"train_loss": -27.401599884033203, "global_step": 484759, "epoch": 5840} {"train_loss": -27.690204620361328, "global_step": 484760, "epoch": 5840} {"train_loss": -27.805694580078125, "global_step": 484761, "epoch": 5840} {"train_loss": -27.608997344970703, "global_step": 484762, "epoch": 5840} {"train_loss": -27.038909912109375, "global_step": 484763, "epoch": 5840} {"train_loss": -27.121326446533203, "global_step": 484764, "epoch": 5840} {"train_loss": -27.580610275268555, "global_step": 484765, "epoch": 5840} {"train_loss": -27.35174560546875, "global_step": 484766, "epoch": 5840} {"train_loss": -27.28338050842285, "global_step": 484767, "epoch": 5840} {"train_loss": -26.196990966796875, "global_step": 484768, "epoch": 5840} {"train_loss": -26.797855377197266, "global_step": 484769, "epoch": 5840} {"train_loss": -26.486413955688477, "global_step": 484770, "epoch": 5840} {"train_loss": -26.39750099182129, "global_step": 484771, "epoch": 5840} {"train_loss": -27.062763214111328, "global_step": 484772, "epoch": 5840} {"train_loss": -26.639257431030273, "global_step": 484773, "epoch": 5840} {"train_loss": -26.468183517456055, "global_step": 484774, "epoch": 5840} {"train_loss": -27.1807918548584, "global_step": 484775, "epoch": 5840} {"train_loss": -26.816648483276367, "global_step": 484776, "epoch": 5840} {"train_loss": -26.45319938659668, "global_step": 484777, "epoch": 5840} {"train_loss": -26.649002075195312, "global_step": 484778, "epoch": 5840} {"train_loss": -27.19441032409668, "global_step": 484779, "epoch": 5840} {"train_loss": -26.583877563476562, "global_step": 484780, "epoch": 5840} {"train_loss": -27.133298873901367, "global_step": 484781, "epoch": 5840} {"train_loss": -26.864566802978516, "global_step": 484782, "epoch": 5840} {"train_loss": -26.578794479370117, "global_step": 484783, "epoch": 5840} {"train_loss": -27.063053131103516, "global_step": 484784, "epoch": 5840} {"train_loss": -25.93292808532715, "global_step": 484785, "epoch": 5840} {"train_loss": -26.833545684814453, "global_step": 484786, "epoch": 5840} {"train_loss": -27.062475204467773, "global_step": 484787, "epoch": 5840} {"train_loss": -26.734949111938477, "global_step": 484788, "epoch": 5840} {"train_loss": -27.051483154296875, "global_step": 484789, "epoch": 5840} {"train_loss": -26.725439071655273, "global_step": 484790, "epoch": 5840} {"train_loss": -26.850183486938477, "global_step": 484791, "epoch": 5840} {"train_loss": -27.461578369140625, "global_step": 484792, "epoch": 5840} {"train_loss": -27.316619873046875, "global_step": 484793, "epoch": 5840} {"train_loss": -27.20208740234375, "global_step": 484794, "epoch": 5840} {"train_loss": -27.155378341674805, "global_step": 484795, "epoch": 5840} {"train_loss": -27.40058708190918, "global_step": 484796, "epoch": 5840} {"train_loss": -27.2451114654541, "global_step": 484797, "epoch": 5840} {"train_loss": -27.0078182220459, "global_step": 484798, "epoch": 5840} {"train_loss": -27.367115020751953, "global_step": 484799, "epoch": 5840} {"train_loss": -27.384305953979492, "global_step": 484800, "epoch": 5840} {"train_loss": -26.84638786315918, "global_step": 484801, "epoch": 5840} {"train_loss": -27.128567339426063, "global_step": 484802, "epoch": 5840, "val_loss": 6525627.0} {"train_loss": -26.73426628112793, "global_step": 484803, "epoch": 5841} {"train_loss": -26.467451095581055, "global_step": 484804, "epoch": 5841} {"train_loss": -27.074743270874023, "global_step": 484805, "epoch": 5841} {"train_loss": -26.309955596923828, "global_step": 484806, "epoch": 5841} {"train_loss": -27.3268985748291, "global_step": 484807, "epoch": 5841} {"train_loss": -26.572772979736328, "global_step": 484808, "epoch": 5841} {"train_loss": -26.862411499023438, "global_step": 484809, "epoch": 5841} {"train_loss": -26.7479190826416, "global_step": 484810, "epoch": 5841} {"train_loss": -26.754764556884766, "global_step": 484811, "epoch": 5841} {"train_loss": -26.745901107788086, "global_step": 484812, "epoch": 5841} {"train_loss": -26.889423370361328, "global_step": 484813, "epoch": 5841} {"train_loss": -26.6610050201416, "global_step": 484814, "epoch": 5841} {"train_loss": -26.68207359313965, "global_step": 484815, "epoch": 5841} {"train_loss": -26.87916374206543, "global_step": 484816, "epoch": 5841} {"train_loss": -27.28059196472168, "global_step": 484817, "epoch": 5841} {"train_loss": -26.991907119750977, "global_step": 484818, "epoch": 5841} {"train_loss": -26.692218780517578, "global_step": 484819, "epoch": 5841} {"train_loss": -27.101720809936523, "global_step": 484820, "epoch": 5841} {"train_loss": -27.188949584960938, "global_step": 484821, "epoch": 5841} {"train_loss": -27.207006454467773, "global_step": 484822, "epoch": 5841} {"train_loss": -27.228199005126953, "global_step": 484823, "epoch": 5841} {"train_loss": -26.88811683654785, "global_step": 484824, "epoch": 5841} {"train_loss": -27.481977462768555, "global_step": 484825, "epoch": 5841} {"train_loss": -27.101673126220703, "global_step": 484826, "epoch": 5841} {"train_loss": -27.142324447631836, "global_step": 484827, "epoch": 5841} {"train_loss": -27.149078369140625, "global_step": 484828, "epoch": 5841} {"train_loss": -27.294294357299805, "global_step": 484829, "epoch": 5841} {"train_loss": -27.088092803955078, "global_step": 484830, "epoch": 5841} {"train_loss": -27.095590591430664, "global_step": 484831, "epoch": 5841} {"train_loss": -26.968219757080078, "global_step": 484832, "epoch": 5841} {"train_loss": -27.01618003845215, "global_step": 484833, "epoch": 5841} {"train_loss": -27.00337791442871, "global_step": 484834, "epoch": 5841} {"train_loss": -27.35515785217285, "global_step": 484835, "epoch": 5841} {"train_loss": -27.189741134643555, "global_step": 484836, "epoch": 5841} {"train_loss": -27.384342193603516, "global_step": 484837, "epoch": 5841} {"train_loss": -27.42279624938965, "global_step": 484838, "epoch": 5841} {"train_loss": -27.48798942565918, "global_step": 484839, "epoch": 5841} {"train_loss": -27.63311767578125, "global_step": 484840, "epoch": 5841} {"train_loss": -27.634906768798828, "global_step": 484841, "epoch": 5841} {"train_loss": -27.502059936523438, "global_step": 484842, "epoch": 5841} {"train_loss": -27.63418960571289, "global_step": 484843, "epoch": 5841} {"train_loss": -27.23305320739746, "global_step": 484844, "epoch": 5841} {"train_loss": -27.424909591674805, "global_step": 484845, "epoch": 5841} {"train_loss": -27.245758056640625, "global_step": 484846, "epoch": 5841} {"train_loss": -27.449926376342773, "global_step": 484847, "epoch": 5841} {"train_loss": -27.179624557495117, "global_step": 484848, "epoch": 5841} {"train_loss": -27.386402130126953, "global_step": 484849, "epoch": 5841} {"train_loss": -27.352081298828125, "global_step": 484850, "epoch": 5841} {"train_loss": -27.570058822631836, "global_step": 484851, "epoch": 5841} {"train_loss": -27.052982330322266, "global_step": 484852, "epoch": 5841} {"train_loss": -27.44827651977539, "global_step": 484853, "epoch": 5841} {"train_loss": -27.063770294189453, "global_step": 484854, "epoch": 5841} {"train_loss": -27.392370223999023, "global_step": 484855, "epoch": 5841} {"train_loss": -27.649311065673828, "global_step": 484856, "epoch": 5841} {"train_loss": -27.30514907836914, "global_step": 484857, "epoch": 5841} {"train_loss": -27.641937255859375, "global_step": 484858, "epoch": 5841} {"train_loss": -27.45692253112793, "global_step": 484859, "epoch": 5841} {"train_loss": -27.4653377532959, "global_step": 484860, "epoch": 5841} {"train_loss": -27.338720321655273, "global_step": 484861, "epoch": 5841} {"train_loss": -27.34564781188965, "global_step": 484862, "epoch": 5841} {"train_loss": -27.215808868408203, "global_step": 484863, "epoch": 5841} {"train_loss": -27.7419490814209, "global_step": 484864, "epoch": 5841} {"train_loss": -27.609556198120117, "global_step": 484865, "epoch": 5841} {"train_loss": -27.44065284729004, "global_step": 484866, "epoch": 5841} {"train_loss": -27.3784122467041, "global_step": 484867, "epoch": 5841} {"train_loss": -27.426923751831055, "global_step": 484868, "epoch": 5841} {"train_loss": -27.3303279876709, "global_step": 484869, "epoch": 5841} {"train_loss": -27.4189510345459, "global_step": 484870, "epoch": 5841} {"train_loss": -27.500391006469727, "global_step": 484871, "epoch": 5841} {"train_loss": -27.4934139251709, "global_step": 484872, "epoch": 5841} {"train_loss": -27.49445152282715, "global_step": 484873, "epoch": 5841} {"train_loss": -27.81268882751465, "global_step": 484874, "epoch": 5841} {"train_loss": -27.494665145874023, "global_step": 484875, "epoch": 5841} {"train_loss": -27.352712631225586, "global_step": 484876, "epoch": 5841} {"train_loss": -27.67585563659668, "global_step": 484877, "epoch": 5841} {"train_loss": -27.536794662475586, "global_step": 484878, "epoch": 5841} {"train_loss": -27.166662216186523, "global_step": 484879, "epoch": 5841} {"train_loss": -27.082977294921875, "global_step": 484880, "epoch": 5841} {"train_loss": -27.38360023498535, "global_step": 484881, "epoch": 5841} {"train_loss": -27.465402603149414, "global_step": 484882, "epoch": 5841} {"train_loss": -26.994131088256836, "global_step": 484883, "epoch": 5841} {"train_loss": -27.93439292907715, "global_step": 484884, "epoch": 5841} {"train_loss": -27.22589007917657, "global_step": 484885, "epoch": 5841, "val_loss": 6545022.0} {"train_loss": -26.857513427734375, "global_step": 484886, "epoch": 5842} {"train_loss": -26.450702667236328, "global_step": 484887, "epoch": 5842} {"train_loss": -26.530826568603516, "global_step": 484888, "epoch": 5842} {"train_loss": -25.884357452392578, "global_step": 484889, "epoch": 5842} {"train_loss": -26.45049476623535, "global_step": 484890, "epoch": 5842} {"train_loss": -26.273447036743164, "global_step": 484891, "epoch": 5842} {"train_loss": -26.742345809936523, "global_step": 484892, "epoch": 5842} {"train_loss": -26.953399658203125, "global_step": 484893, "epoch": 5842} {"train_loss": -27.0797061920166, "global_step": 484894, "epoch": 5842} {"train_loss": -26.666799545288086, "global_step": 484895, "epoch": 5842} {"train_loss": -26.699594497680664, "global_step": 484896, "epoch": 5842} {"train_loss": -26.886035919189453, "global_step": 484897, "epoch": 5842} {"train_loss": -27.052152633666992, "global_step": 484898, "epoch": 5842} {"train_loss": -27.375579833984375, "global_step": 484899, "epoch": 5842} {"train_loss": -27.34903335571289, "global_step": 484900, "epoch": 5842} {"train_loss": -27.225250244140625, "global_step": 484901, "epoch": 5842} {"train_loss": -27.054214477539062, "global_step": 484902, "epoch": 5842} {"train_loss": -26.93793296813965, "global_step": 484903, "epoch": 5842} {"train_loss": -27.247772216796875, "global_step": 484904, "epoch": 5842} {"train_loss": -27.185256958007812, "global_step": 484905, "epoch": 5842} {"train_loss": -27.31032371520996, "global_step": 484906, "epoch": 5842} {"train_loss": -26.89924430847168, "global_step": 484907, "epoch": 5842} {"train_loss": -27.723962783813477, "global_step": 484908, "epoch": 5842} {"train_loss": -26.934507369995117, "global_step": 484909, "epoch": 5842} {"train_loss": -26.87556266784668, "global_step": 484910, "epoch": 5842} {"train_loss": -27.3394718170166, "global_step": 484911, "epoch": 5842} {"train_loss": -27.299209594726562, "global_step": 484912, "epoch": 5842} {"train_loss": -27.202014923095703, "global_step": 484913, "epoch": 5842} {"train_loss": -27.096881866455078, "global_step": 484914, "epoch": 5842} {"train_loss": -27.289093017578125, "global_step": 484915, "epoch": 5842} {"train_loss": -26.74346923828125, "global_step": 484916, "epoch": 5842} {"train_loss": -27.251651763916016, "global_step": 484917, "epoch": 5842} {"train_loss": -27.322235107421875, "global_step": 484918, "epoch": 5842} {"train_loss": -27.660165786743164, "global_step": 484919, "epoch": 5842} {"train_loss": -27.37296485900879, "global_step": 484920, "epoch": 5842} {"train_loss": -27.569854736328125, "global_step": 484921, "epoch": 5842} {"train_loss": -27.637510299682617, "global_step": 484922, "epoch": 5842} {"train_loss": -27.403879165649414, "global_step": 484923, "epoch": 5842} {"train_loss": -27.35072135925293, "global_step": 484924, "epoch": 5842} {"train_loss": -27.844579696655273, "global_step": 484925, "epoch": 5842} {"train_loss": -27.772052764892578, "global_step": 484926, "epoch": 5842} {"train_loss": -27.706165313720703, "global_step": 484927, "epoch": 5842} {"train_loss": -27.437606811523438, "global_step": 484928, "epoch": 5842} {"train_loss": -27.449554443359375, "global_step": 484929, "epoch": 5842} {"train_loss": -27.185287475585938, "global_step": 484930, "epoch": 5842} {"train_loss": -27.35910987854004, "global_step": 484931, "epoch": 5842} {"train_loss": -27.676288604736328, "global_step": 484932, "epoch": 5842} {"train_loss": -27.11817741394043, "global_step": 484933, "epoch": 5842} {"train_loss": -27.661651611328125, "global_step": 484934, "epoch": 5842} {"train_loss": -27.59824562072754, "global_step": 484935, "epoch": 5842} {"train_loss": -27.452978134155273, "global_step": 484936, "epoch": 5842} {"train_loss": -27.463144302368164, "global_step": 484937, "epoch": 5842} {"train_loss": -27.073883056640625, "global_step": 484938, "epoch": 5842} {"train_loss": -27.477949142456055, "global_step": 484939, "epoch": 5842} {"train_loss": -27.687793731689453, "global_step": 484940, "epoch": 5842} {"train_loss": -27.420988082885742, "global_step": 484941, "epoch": 5842} {"train_loss": -27.503820419311523, "global_step": 484942, "epoch": 5842} {"train_loss": -27.368505477905273, "global_step": 484943, "epoch": 5842} {"train_loss": -27.25642204284668, "global_step": 484944, "epoch": 5842} {"train_loss": -27.17832374572754, "global_step": 484945, "epoch": 5842} {"train_loss": -27.017383575439453, "global_step": 484946, "epoch": 5842} {"train_loss": -26.9771728515625, "global_step": 484947, "epoch": 5842} {"train_loss": -26.295225143432617, "global_step": 484948, "epoch": 5842} {"train_loss": -25.87810707092285, "global_step": 484949, "epoch": 5842} {"train_loss": -25.202665328979492, "global_step": 484950, "epoch": 5842} {"train_loss": -26.29522705078125, "global_step": 484951, "epoch": 5842} {"train_loss": -26.997161865234375, "global_step": 484952, "epoch": 5842} {"train_loss": -26.837940216064453, "global_step": 484953, "epoch": 5842} {"train_loss": -26.28449821472168, "global_step": 484954, "epoch": 5842} {"train_loss": -26.35908317565918, "global_step": 484955, "epoch": 5842} {"train_loss": -26.970935821533203, "global_step": 484956, "epoch": 5842} {"train_loss": -26.966434478759766, "global_step": 484957, "epoch": 5842} {"train_loss": -26.6403751373291, "global_step": 484958, "epoch": 5842} {"train_loss": -27.000885009765625, "global_step": 484959, "epoch": 5842} {"train_loss": -27.002649307250977, "global_step": 484960, "epoch": 5842} {"train_loss": -27.11971092224121, "global_step": 484961, "epoch": 5842} {"train_loss": -26.897781372070312, "global_step": 484962, "epoch": 5842} {"train_loss": -26.946044921875, "global_step": 484963, "epoch": 5842} {"train_loss": -26.876819610595703, "global_step": 484964, "epoch": 5842} {"train_loss": -26.85723304748535, "global_step": 484965, "epoch": 5842} {"train_loss": -26.84583854675293, "global_step": 484966, "epoch": 5842} {"train_loss": -27.380767822265625, "global_step": 484967, "epoch": 5842} {"train_loss": -27.063484329775154, "global_step": 484968, "epoch": 5842, "val_loss": 6452506.0} {"train_loss": -27.162612915039062, "global_step": 484969, "epoch": 5843} {"train_loss": -26.6815185546875, "global_step": 484970, "epoch": 5843} {"train_loss": -26.988056182861328, "global_step": 484971, "epoch": 5843} {"train_loss": -26.754011154174805, "global_step": 484972, "epoch": 5843} {"train_loss": -27.188352584838867, "global_step": 484973, "epoch": 5843} {"train_loss": -26.7235164642334, "global_step": 484974, "epoch": 5843} {"train_loss": -27.069650650024414, "global_step": 484975, "epoch": 5843} {"train_loss": -26.869840621948242, "global_step": 484976, "epoch": 5843} {"train_loss": -26.970422744750977, "global_step": 484977, "epoch": 5843} {"train_loss": -26.93581199645996, "global_step": 484978, "epoch": 5843} {"train_loss": -26.891590118408203, "global_step": 484979, "epoch": 5843} {"train_loss": -26.9444637298584, "global_step": 484980, "epoch": 5843} {"train_loss": -26.835647583007812, "global_step": 484981, "epoch": 5843} {"train_loss": -26.922109603881836, "global_step": 484982, "epoch": 5843} {"train_loss": -27.138574600219727, "global_step": 484983, "epoch": 5843} {"train_loss": -27.005884170532227, "global_step": 484984, "epoch": 5843} {"train_loss": -27.256032943725586, "global_step": 484985, "epoch": 5843} {"train_loss": -27.373794555664062, "global_step": 484986, "epoch": 5843} {"train_loss": -26.88340187072754, "global_step": 484987, "epoch": 5843} {"train_loss": -27.1811580657959, "global_step": 484988, "epoch": 5843} {"train_loss": -27.277257919311523, "global_step": 484989, "epoch": 5843} {"train_loss": -27.308887481689453, "global_step": 484990, "epoch": 5843} {"train_loss": -27.364517211914062, "global_step": 484991, "epoch": 5843} {"train_loss": -27.45668601989746, "global_step": 484992, "epoch": 5843} {"train_loss": -27.704259872436523, "global_step": 484993, "epoch": 5843} {"train_loss": -27.564870834350586, "global_step": 484994, "epoch": 5843} {"train_loss": -27.19756507873535, "global_step": 484995, "epoch": 5843} {"train_loss": -27.3051815032959, "global_step": 484996, "epoch": 5843} {"train_loss": -27.625635147094727, "global_step": 484997, "epoch": 5843} {"train_loss": -27.29408073425293, "global_step": 484998, "epoch": 5843} {"train_loss": -27.505590438842773, "global_step": 484999, "epoch": 5843} {"train_loss": -27.45223045349121, "global_step": 485000, "epoch": 5843} {"train_loss": -27.581439971923828, "global_step": 485001, "epoch": 5843} {"train_loss": -27.41987419128418, "global_step": 485002, "epoch": 5843} {"train_loss": -27.087690353393555, "global_step": 485003, "epoch": 5843} {"train_loss": -27.6627197265625, "global_step": 485004, "epoch": 5843} {"train_loss": -27.531064987182617, "global_step": 485005, "epoch": 5843} {"train_loss": -27.37457275390625, "global_step": 485006, "epoch": 5843} {"train_loss": -27.1982421875, "global_step": 485007, "epoch": 5843} {"train_loss": -27.3763484954834, "global_step": 485008, "epoch": 5843} {"train_loss": -27.13722038269043, "global_step": 485009, "epoch": 5843} {"train_loss": -27.440032958984375, "global_step": 485010, "epoch": 5843} {"train_loss": -27.328128814697266, "global_step": 485011, "epoch": 5843} {"train_loss": -27.285547256469727, "global_step": 485012, "epoch": 5843} {"train_loss": -27.29205894470215, "global_step": 485013, "epoch": 5843} {"train_loss": -27.403013229370117, "global_step": 485014, "epoch": 5843} {"train_loss": -27.390167236328125, "global_step": 485015, "epoch": 5843} {"train_loss": -27.35780143737793, "global_step": 485016, "epoch": 5843} {"train_loss": -27.10664176940918, "global_step": 485017, "epoch": 5843} {"train_loss": -27.298978805541992, "global_step": 485018, "epoch": 5843} {"train_loss": -26.70779800415039, "global_step": 485019, "epoch": 5843} {"train_loss": -26.715253829956055, "global_step": 485020, "epoch": 5843} {"train_loss": -26.51508140563965, "global_step": 485021, "epoch": 5843} {"train_loss": -26.57215690612793, "global_step": 485022, "epoch": 5843} {"train_loss": -27.074514389038086, "global_step": 485023, "epoch": 5843} {"train_loss": -27.174835205078125, "global_step": 485024, "epoch": 5843} {"train_loss": -27.220495223999023, "global_step": 485025, "epoch": 5843} {"train_loss": -27.085193634033203, "global_step": 485026, "epoch": 5843} {"train_loss": -26.872817993164062, "global_step": 485027, "epoch": 5843} {"train_loss": -27.3289852142334, "global_step": 485028, "epoch": 5843} {"train_loss": -27.052976608276367, "global_step": 485029, "epoch": 5843} {"train_loss": -27.00428581237793, "global_step": 485030, "epoch": 5843} {"train_loss": -27.4404354095459, "global_step": 485031, "epoch": 5843} {"train_loss": -26.9692440032959, "global_step": 485032, "epoch": 5843} {"train_loss": -27.15838623046875, "global_step": 485033, "epoch": 5843} {"train_loss": -27.389434814453125, "global_step": 485034, "epoch": 5843} {"train_loss": -27.301624298095703, "global_step": 485035, "epoch": 5843} {"train_loss": -27.597949981689453, "global_step": 485036, "epoch": 5843} {"train_loss": -27.12980079650879, "global_step": 485037, "epoch": 5843} {"train_loss": -27.205554962158203, "global_step": 485038, "epoch": 5843} {"train_loss": -26.938257217407227, "global_step": 485039, "epoch": 5843} {"train_loss": -27.51421546936035, "global_step": 485040, "epoch": 5843} {"train_loss": -27.442127227783203, "global_step": 485041, "epoch": 5843} {"train_loss": -26.792667388916016, "global_step": 485042, "epoch": 5843} {"train_loss": -27.07720375061035, "global_step": 485043, "epoch": 5843} {"train_loss": -27.498197555541992, "global_step": 485044, "epoch": 5843} {"train_loss": -27.282794952392578, "global_step": 485045, "epoch": 5843} {"train_loss": -27.416351318359375, "global_step": 485046, "epoch": 5843} {"train_loss": -27.495895385742188, "global_step": 485047, "epoch": 5843} {"train_loss": -27.414514541625977, "global_step": 485048, "epoch": 5843} {"train_loss": -27.649473190307617, "global_step": 485049, "epoch": 5843} {"train_loss": -26.854093551635742, "global_step": 485050, "epoch": 5843} {"train_loss": -27.20026252930423, "global_step": 485051, "epoch": 5843, "val_loss": 6510111.0} {"train_loss": -26.799091339111328, "global_step": 485052, "epoch": 5844} {"train_loss": -26.981887817382812, "global_step": 485053, "epoch": 5844} {"train_loss": -26.75198745727539, "global_step": 485054, "epoch": 5844} {"train_loss": -27.100631713867188, "global_step": 485055, "epoch": 5844} {"train_loss": -26.569433212280273, "global_step": 485056, "epoch": 5844} {"train_loss": -26.925811767578125, "global_step": 485057, "epoch": 5844} {"train_loss": -26.696386337280273, "global_step": 485058, "epoch": 5844} {"train_loss": -26.376876831054688, "global_step": 485059, "epoch": 5844} {"train_loss": -27.084659576416016, "global_step": 485060, "epoch": 5844} {"train_loss": -27.131977081298828, "global_step": 485061, "epoch": 5844} {"train_loss": -26.590620040893555, "global_step": 485062, "epoch": 5844} {"train_loss": -26.99483299255371, "global_step": 485063, "epoch": 5844} {"train_loss": -26.742923736572266, "global_step": 485064, "epoch": 5844} {"train_loss": -27.065786361694336, "global_step": 485065, "epoch": 5844} {"train_loss": -27.07008171081543, "global_step": 485066, "epoch": 5844} {"train_loss": -27.053796768188477, "global_step": 485067, "epoch": 5844} {"train_loss": -26.7982234954834, "global_step": 485068, "epoch": 5844} {"train_loss": -27.10767936706543, "global_step": 485069, "epoch": 5844} {"train_loss": -27.255523681640625, "global_step": 485070, "epoch": 5844} {"train_loss": -27.672229766845703, "global_step": 485071, "epoch": 5844} {"train_loss": -27.438385009765625, "global_step": 485072, "epoch": 5844} {"train_loss": -27.5053653717041, "global_step": 485073, "epoch": 5844} {"train_loss": -27.2581787109375, "global_step": 485074, "epoch": 5844} {"train_loss": -27.319629669189453, "global_step": 485075, "epoch": 5844} {"train_loss": -27.588977813720703, "global_step": 485076, "epoch": 5844} {"train_loss": -27.037979125976562, "global_step": 485077, "epoch": 5844} {"train_loss": -27.383874893188477, "global_step": 485078, "epoch": 5844} {"train_loss": -27.12529945373535, "global_step": 485079, "epoch": 5844} {"train_loss": -27.446557998657227, "global_step": 485080, "epoch": 5844} {"train_loss": -27.294586181640625, "global_step": 485081, "epoch": 5844} {"train_loss": -27.652057647705078, "global_step": 485082, "epoch": 5844} {"train_loss": -27.40236473083496, "global_step": 485083, "epoch": 5844} {"train_loss": -27.049514770507812, "global_step": 485084, "epoch": 5844} {"train_loss": -27.49846839904785, "global_step": 485085, "epoch": 5844} {"train_loss": -27.40667724609375, "global_step": 485086, "epoch": 5844} {"train_loss": -27.124481201171875, "global_step": 485087, "epoch": 5844} {"train_loss": -27.129087448120117, "global_step": 485088, "epoch": 5844} {"train_loss": -27.26034927368164, "global_step": 485089, "epoch": 5844} {"train_loss": -27.254140853881836, "global_step": 485090, "epoch": 5844} {"train_loss": -27.5824031829834, "global_step": 485091, "epoch": 5844} {"train_loss": -27.368330001831055, "global_step": 485092, "epoch": 5844} {"train_loss": -27.22102165222168, "global_step": 485093, "epoch": 5844} {"train_loss": -27.105329513549805, "global_step": 485094, "epoch": 5844} {"train_loss": -27.408416748046875, "global_step": 485095, "epoch": 5844} {"train_loss": -27.23969841003418, "global_step": 485096, "epoch": 5844} {"train_loss": -27.632831573486328, "global_step": 485097, "epoch": 5844} {"train_loss": -27.268423080444336, "global_step": 485098, "epoch": 5844} {"train_loss": -27.566755294799805, "global_step": 485099, "epoch": 5844} {"train_loss": -27.7650203704834, "global_step": 485100, "epoch": 5844} {"train_loss": -27.44907569885254, "global_step": 485101, "epoch": 5844} {"train_loss": -27.373456954956055, "global_step": 485102, "epoch": 5844} {"train_loss": -27.552814483642578, "global_step": 485103, "epoch": 5844} {"train_loss": -27.33792495727539, "global_step": 485104, "epoch": 5844} {"train_loss": -27.26851463317871, "global_step": 485105, "epoch": 5844} {"train_loss": -27.295820236206055, "global_step": 485106, "epoch": 5844} {"train_loss": -27.82733726501465, "global_step": 485107, "epoch": 5844} {"train_loss": -27.24711036682129, "global_step": 485108, "epoch": 5844} {"train_loss": -27.20781898498535, "global_step": 485109, "epoch": 5844} {"train_loss": -27.213363647460938, "global_step": 485110, "epoch": 5844} {"train_loss": -27.686185836791992, "global_step": 485111, "epoch": 5844} {"train_loss": -27.31678581237793, "global_step": 485112, "epoch": 5844} {"train_loss": -27.21201515197754, "global_step": 485113, "epoch": 5844} {"train_loss": -26.960956573486328, "global_step": 485114, "epoch": 5844} {"train_loss": -27.559192657470703, "global_step": 485115, "epoch": 5844} {"train_loss": -27.109655380249023, "global_step": 485116, "epoch": 5844} {"train_loss": -27.079303741455078, "global_step": 485117, "epoch": 5844} {"train_loss": -27.14716148376465, "global_step": 485118, "epoch": 5844} {"train_loss": -26.836429595947266, "global_step": 485119, "epoch": 5844} {"train_loss": -27.090900421142578, "global_step": 485120, "epoch": 5844} {"train_loss": -27.335540771484375, "global_step": 485121, "epoch": 5844} {"train_loss": -27.242650985717773, "global_step": 485122, "epoch": 5844} {"train_loss": -27.333784103393555, "global_step": 485123, "epoch": 5844} {"train_loss": -27.5956974029541, "global_step": 485124, "epoch": 5844} {"train_loss": -27.536325454711914, "global_step": 485125, "epoch": 5844} {"train_loss": -27.459516525268555, "global_step": 485126, "epoch": 5844} {"train_loss": -27.484220504760742, "global_step": 485127, "epoch": 5844} {"train_loss": -26.99753761291504, "global_step": 485128, "epoch": 5844} {"train_loss": -27.158044815063477, "global_step": 485129, "epoch": 5844} {"train_loss": -27.3485050201416, "global_step": 485130, "epoch": 5844} {"train_loss": -27.80726432800293, "global_step": 485131, "epoch": 5844} {"train_loss": -27.5367488861084, "global_step": 485132, "epoch": 5844} {"train_loss": -27.294055938720703, "global_step": 485133, "epoch": 5844} {"train_loss": -27.249979501747223, "global_step": 485134, "epoch": 5844, "val_loss": 6445195.5} {"train_loss": -27.071866989135742, "global_step": 485135, "epoch": 5845} {"train_loss": -26.544675827026367, "global_step": 485136, "epoch": 5845} {"train_loss": -26.07073974609375, "global_step": 485137, "epoch": 5845} {"train_loss": -25.91400146484375, "global_step": 485138, "epoch": 5845} {"train_loss": -27.125141143798828, "global_step": 485139, "epoch": 5845} {"train_loss": -26.77312660217285, "global_step": 485140, "epoch": 5845} {"train_loss": -26.239770889282227, "global_step": 485141, "epoch": 5845} {"train_loss": -27.20871925354004, "global_step": 485142, "epoch": 5845} {"train_loss": -26.252613067626953, "global_step": 485143, "epoch": 5845} {"train_loss": -27.235065460205078, "global_step": 485144, "epoch": 5845} {"train_loss": -26.929731369018555, "global_step": 485145, "epoch": 5845} {"train_loss": -27.012887954711914, "global_step": 485146, "epoch": 5845} {"train_loss": -26.728830337524414, "global_step": 485147, "epoch": 5845} {"train_loss": -26.912830352783203, "global_step": 485148, "epoch": 5845} {"train_loss": -26.791440963745117, "global_step": 485149, "epoch": 5845} {"train_loss": -26.854904174804688, "global_step": 485150, "epoch": 5845} {"train_loss": -27.134634017944336, "global_step": 485151, "epoch": 5845} {"train_loss": -27.107284545898438, "global_step": 485152, "epoch": 5845} {"train_loss": -27.322174072265625, "global_step": 485153, "epoch": 5845} {"train_loss": -27.018070220947266, "global_step": 485154, "epoch": 5845} {"train_loss": -27.28449058532715, "global_step": 485155, "epoch": 5845} {"train_loss": -27.08200454711914, "global_step": 485156, "epoch": 5845} {"train_loss": -27.179052352905273, "global_step": 485157, "epoch": 5845} {"train_loss": -26.816709518432617, "global_step": 485158, "epoch": 5845} {"train_loss": -27.44989585876465, "global_step": 485159, "epoch": 5845} {"train_loss": -26.601110458374023, "global_step": 485160, "epoch": 5845} {"train_loss": -27.043622970581055, "global_step": 485161, "epoch": 5845} {"train_loss": -26.78352165222168, "global_step": 485162, "epoch": 5845} {"train_loss": -27.43641471862793, "global_step": 485163, "epoch": 5845} {"train_loss": -27.11643409729004, "global_step": 485164, "epoch": 5845} {"train_loss": -27.1039981842041, "global_step": 485165, "epoch": 5845} {"train_loss": -26.902917861938477, "global_step": 485166, "epoch": 5845} {"train_loss": -27.1205997467041, "global_step": 485167, "epoch": 5845} {"train_loss": -27.385175704956055, "global_step": 485168, "epoch": 5845} {"train_loss": -27.463211059570312, "global_step": 485169, "epoch": 5845} {"train_loss": -27.19339370727539, "global_step": 485170, "epoch": 5845} {"train_loss": -27.42866325378418, "global_step": 485171, "epoch": 5845} {"train_loss": -27.724395751953125, "global_step": 485172, "epoch": 5845} {"train_loss": -27.599475860595703, "global_step": 485173, "epoch": 5845} {"train_loss": -27.25269889831543, "global_step": 485174, "epoch": 5845} {"train_loss": -27.32611656188965, "global_step": 485175, "epoch": 5845} {"train_loss": -27.388181686401367, "global_step": 485176, "epoch": 5845} {"train_loss": -27.4678897857666, "global_step": 485177, "epoch": 5845} {"train_loss": -27.45648193359375, "global_step": 485178, "epoch": 5845} {"train_loss": -27.25965690612793, "global_step": 485179, "epoch": 5845} {"train_loss": -27.49285888671875, "global_step": 485180, "epoch": 5845} {"train_loss": -27.35527992248535, "global_step": 485181, "epoch": 5845} {"train_loss": -26.921466827392578, "global_step": 485182, "epoch": 5845} {"train_loss": -27.425806045532227, "global_step": 485183, "epoch": 5845} {"train_loss": -27.32464599609375, "global_step": 485184, "epoch": 5845} {"train_loss": -27.69775390625, "global_step": 485185, "epoch": 5845} {"train_loss": -27.35528564453125, "global_step": 485186, "epoch": 5845} {"train_loss": -27.319629669189453, "global_step": 485187, "epoch": 5845} {"train_loss": -27.313323974609375, "global_step": 485188, "epoch": 5845} {"train_loss": -27.192642211914062, "global_step": 485189, "epoch": 5845} {"train_loss": -27.25078773498535, "global_step": 485190, "epoch": 5845} {"train_loss": -27.257299423217773, "global_step": 485191, "epoch": 5845} {"train_loss": -27.381338119506836, "global_step": 485192, "epoch": 5845} {"train_loss": -27.21944236755371, "global_step": 485193, "epoch": 5845} {"train_loss": -27.190454483032227, "global_step": 485194, "epoch": 5845} {"train_loss": -26.991168975830078, "global_step": 485195, "epoch": 5845} {"train_loss": -26.992151260375977, "global_step": 485196, "epoch": 5845} {"train_loss": -27.186569213867188, "global_step": 485197, "epoch": 5845} {"train_loss": -27.110782623291016, "global_step": 485198, "epoch": 5845} {"train_loss": -27.424386978149414, "global_step": 485199, "epoch": 5845} {"train_loss": -26.95549964904785, "global_step": 485200, "epoch": 5845} {"train_loss": -27.368993759155273, "global_step": 485201, "epoch": 5845} {"train_loss": -27.295217514038086, "global_step": 485202, "epoch": 5845} {"train_loss": -26.93094825744629, "global_step": 485203, "epoch": 5845} {"train_loss": -27.543811798095703, "global_step": 485204, "epoch": 5845} {"train_loss": -27.2923583984375, "global_step": 485205, "epoch": 5845} {"train_loss": -27.577417373657227, "global_step": 485206, "epoch": 5845} {"train_loss": -27.314865112304688, "global_step": 485207, "epoch": 5845} {"train_loss": -27.039844512939453, "global_step": 485208, "epoch": 5845} {"train_loss": -27.363067626953125, "global_step": 485209, "epoch": 5845} {"train_loss": -27.226104736328125, "global_step": 485210, "epoch": 5845} {"train_loss": -27.4066219329834, "global_step": 485211, "epoch": 5845} {"train_loss": -27.233423233032227, "global_step": 485212, "epoch": 5845} {"train_loss": -27.280704498291016, "global_step": 485213, "epoch": 5845} {"train_loss": -27.38813591003418, "global_step": 485214, "epoch": 5845} {"train_loss": -27.42298698425293, "global_step": 485215, "epoch": 5845} {"train_loss": -27.26545524597168, "global_step": 485216, "epoch": 5845} {"train_loss": -27.141206143850304, "global_step": 485217, "epoch": 5845, "val_loss": 6560953.0} {"train_loss": -26.936450958251953, "global_step": 485218, "epoch": 5846} {"train_loss": -26.018884658813477, "global_step": 485219, "epoch": 5846} {"train_loss": -26.04876708984375, "global_step": 485220, "epoch": 5846} {"train_loss": -26.725812911987305, "global_step": 485221, "epoch": 5846} {"train_loss": -26.8718204498291, "global_step": 485222, "epoch": 5846} {"train_loss": -25.973257064819336, "global_step": 485223, "epoch": 5846} {"train_loss": -26.540882110595703, "global_step": 485224, "epoch": 5846} {"train_loss": -26.814538955688477, "global_step": 485225, "epoch": 5846} {"train_loss": -27.009374618530273, "global_step": 485226, "epoch": 5846} {"train_loss": -26.857397079467773, "global_step": 485227, "epoch": 5846} {"train_loss": -26.922134399414062, "global_step": 485228, "epoch": 5846} {"train_loss": -26.644250869750977, "global_step": 485229, "epoch": 5846} {"train_loss": -26.95320701599121, "global_step": 485230, "epoch": 5846} {"train_loss": -27.016754150390625, "global_step": 485231, "epoch": 5846} {"train_loss": -27.224843978881836, "global_step": 485232, "epoch": 5846} {"train_loss": -26.979650497436523, "global_step": 485233, "epoch": 5846} {"train_loss": -26.773929595947266, "global_step": 485234, "epoch": 5846} {"train_loss": -27.2247257232666, "global_step": 485235, "epoch": 5846} {"train_loss": -26.922901153564453, "global_step": 485236, "epoch": 5846} {"train_loss": -27.068281173706055, "global_step": 485237, "epoch": 5846} {"train_loss": -27.17828369140625, "global_step": 485238, "epoch": 5846} {"train_loss": -27.143753051757812, "global_step": 485239, "epoch": 5846} {"train_loss": -27.378849029541016, "global_step": 485240, "epoch": 5846} {"train_loss": -27.04743003845215, "global_step": 485241, "epoch": 5846} {"train_loss": -27.230268478393555, "global_step": 485242, "epoch": 5846} {"train_loss": -27.439794540405273, "global_step": 485243, "epoch": 5846} {"train_loss": -27.169269561767578, "global_step": 485244, "epoch": 5846} {"train_loss": -27.06989097595215, "global_step": 485245, "epoch": 5846} {"train_loss": -27.53338050842285, "global_step": 485246, "epoch": 5846} {"train_loss": -27.271881103515625, "global_step": 485247, "epoch": 5846} {"train_loss": -27.261320114135742, "global_step": 485248, "epoch": 5846} {"train_loss": -26.962677001953125, "global_step": 485249, "epoch": 5846} {"train_loss": -27.1221866607666, "global_step": 485250, "epoch": 5846} {"train_loss": -27.568344116210938, "global_step": 485251, "epoch": 5846} {"train_loss": -27.345014572143555, "global_step": 485252, "epoch": 5846} {"train_loss": -27.558752059936523, "global_step": 485253, "epoch": 5846} {"train_loss": -27.181188583374023, "global_step": 485254, "epoch": 5846} {"train_loss": -27.425418853759766, "global_step": 485255, "epoch": 5846} {"train_loss": -27.36116600036621, "global_step": 485256, "epoch": 5846} {"train_loss": -27.869977951049805, "global_step": 485257, "epoch": 5846} {"train_loss": -27.40874671936035, "global_step": 485258, "epoch": 5846} {"train_loss": -27.4576473236084, "global_step": 485259, "epoch": 5846} {"train_loss": -27.699548721313477, "global_step": 485260, "epoch": 5846} {"train_loss": -27.252172470092773, "global_step": 485261, "epoch": 5846} {"train_loss": -27.250049591064453, "global_step": 485262, "epoch": 5846} {"train_loss": -27.22308921813965, "global_step": 485263, "epoch": 5846} {"train_loss": -27.37255859375, "global_step": 485264, "epoch": 5846} {"train_loss": -27.128034591674805, "global_step": 485265, "epoch": 5846} {"train_loss": -27.4079532623291, "global_step": 485266, "epoch": 5846} {"train_loss": -27.47544288635254, "global_step": 485267, "epoch": 5846} {"train_loss": -27.587329864501953, "global_step": 485268, "epoch": 5846} {"train_loss": -27.313291549682617, "global_step": 485269, "epoch": 5846} {"train_loss": -27.390380859375, "global_step": 485270, "epoch": 5846} {"train_loss": -27.545032501220703, "global_step": 485271, "epoch": 5846} {"train_loss": -27.238189697265625, "global_step": 485272, "epoch": 5846} {"train_loss": -27.588104248046875, "global_step": 485273, "epoch": 5846} {"train_loss": -27.507410049438477, "global_step": 485274, "epoch": 5846} {"train_loss": -27.53165626525879, "global_step": 485275, "epoch": 5846} {"train_loss": -27.41105079650879, "global_step": 485276, "epoch": 5846} {"train_loss": -27.666303634643555, "global_step": 485277, "epoch": 5846} {"train_loss": -27.282129287719727, "global_step": 485278, "epoch": 5846} {"train_loss": -27.287885665893555, "global_step": 485279, "epoch": 5846} {"train_loss": -27.217199325561523, "global_step": 485280, "epoch": 5846} {"train_loss": -27.363636016845703, "global_step": 485281, "epoch": 5846} {"train_loss": -27.370391845703125, "global_step": 485282, "epoch": 5846} {"train_loss": -26.6527099609375, "global_step": 485283, "epoch": 5846} {"train_loss": -26.942752838134766, "global_step": 485284, "epoch": 5846} {"train_loss": -26.95843505859375, "global_step": 485285, "epoch": 5846} {"train_loss": -27.253311157226562, "global_step": 485286, "epoch": 5846} {"train_loss": -26.63886070251465, "global_step": 485287, "epoch": 5846} {"train_loss": -27.277978897094727, "global_step": 485288, "epoch": 5846} {"train_loss": -27.176227569580078, "global_step": 485289, "epoch": 5846} {"train_loss": -26.714080810546875, "global_step": 485290, "epoch": 5846} {"train_loss": -27.069812774658203, "global_step": 485291, "epoch": 5846} {"train_loss": -27.633142471313477, "global_step": 485292, "epoch": 5846} {"train_loss": -27.236310958862305, "global_step": 485293, "epoch": 5846} {"train_loss": -26.889230728149414, "global_step": 485294, "epoch": 5846} {"train_loss": -27.57525634765625, "global_step": 485295, "epoch": 5846} {"train_loss": -27.297834396362305, "global_step": 485296, "epoch": 5846} {"train_loss": -27.32248878479004, "global_step": 485297, "epoch": 5846} {"train_loss": -27.4624080657959, "global_step": 485298, "epoch": 5846} {"train_loss": -27.333581924438477, "global_step": 485299, "epoch": 5846} {"train_loss": -27.17235034345144, "global_step": 485300, "epoch": 5846, "val_loss": 6583955.5} {"train_loss": -26.73609733581543, "global_step": 485301, "epoch": 5847} {"train_loss": -26.97169303894043, "global_step": 485302, "epoch": 5847} {"train_loss": -26.99798583984375, "global_step": 485303, "epoch": 5847} {"train_loss": -26.236494064331055, "global_step": 485304, "epoch": 5847} {"train_loss": -27.233936309814453, "global_step": 485305, "epoch": 5847} {"train_loss": -26.78596305847168, "global_step": 485306, "epoch": 5847} {"train_loss": -26.890811920166016, "global_step": 485307, "epoch": 5847} {"train_loss": -26.559158325195312, "global_step": 485308, "epoch": 5847} {"train_loss": -26.953826904296875, "global_step": 485309, "epoch": 5847} {"train_loss": -27.039113998413086, "global_step": 485310, "epoch": 5847} {"train_loss": -27.293928146362305, "global_step": 485311, "epoch": 5847} {"train_loss": -27.022939682006836, "global_step": 485312, "epoch": 5847} {"train_loss": -26.964969635009766, "global_step": 485313, "epoch": 5847} {"train_loss": -26.956205368041992, "global_step": 485314, "epoch": 5847} {"train_loss": -26.894210815429688, "global_step": 485315, "epoch": 5847} {"train_loss": -27.1594181060791, "global_step": 485316, "epoch": 5847} {"train_loss": -27.01007080078125, "global_step": 485317, "epoch": 5847} {"train_loss": -26.921710968017578, "global_step": 485318, "epoch": 5847} {"train_loss": -27.150869369506836, "global_step": 485319, "epoch": 5847} {"train_loss": -26.995351791381836, "global_step": 485320, "epoch": 5847} {"train_loss": -27.254377365112305, "global_step": 485321, "epoch": 5847} {"train_loss": -26.98381996154785, "global_step": 485322, "epoch": 5847} {"train_loss": -27.165760040283203, "global_step": 485323, "epoch": 5847} {"train_loss": -27.418493270874023, "global_step": 485324, "epoch": 5847} {"train_loss": -27.335363388061523, "global_step": 485325, "epoch": 5847} {"train_loss": -27.43427848815918, "global_step": 485326, "epoch": 5847} {"train_loss": -27.434436798095703, "global_step": 485327, "epoch": 5847} {"train_loss": -27.403776168823242, "global_step": 485328, "epoch": 5847} {"train_loss": -27.419870376586914, "global_step": 485329, "epoch": 5847} {"train_loss": -27.319425582885742, "global_step": 485330, "epoch": 5847} {"train_loss": -27.2750186920166, "global_step": 485331, "epoch": 5847} {"train_loss": -27.43194007873535, "global_step": 485332, "epoch": 5847} {"train_loss": -26.73517417907715, "global_step": 485333, "epoch": 5847} {"train_loss": -27.377429962158203, "global_step": 485334, "epoch": 5847} {"train_loss": -27.07666015625, "global_step": 485335, "epoch": 5847} {"train_loss": -27.521772384643555, "global_step": 485336, "epoch": 5847} {"train_loss": -27.277856826782227, "global_step": 485337, "epoch": 5847} {"train_loss": -27.15815544128418, "global_step": 485338, "epoch": 5847} {"train_loss": -27.550458908081055, "global_step": 485339, "epoch": 5847} {"train_loss": -27.44996452331543, "global_step": 485340, "epoch": 5847} {"train_loss": -27.265777587890625, "global_step": 485341, "epoch": 5847} {"train_loss": -27.014911651611328, "global_step": 485342, "epoch": 5847} {"train_loss": -27.087493896484375, "global_step": 485343, "epoch": 5847} {"train_loss": -27.263593673706055, "global_step": 485344, "epoch": 5847} {"train_loss": -27.317352294921875, "global_step": 485345, "epoch": 5847} {"train_loss": -27.446210861206055, "global_step": 485346, "epoch": 5847} {"train_loss": -27.30126953125, "global_step": 485347, "epoch": 5847} {"train_loss": -27.12452507019043, "global_step": 485348, "epoch": 5847} {"train_loss": -27.19520378112793, "global_step": 485349, "epoch": 5847} {"train_loss": -27.220640182495117, "global_step": 485350, "epoch": 5847} {"train_loss": -27.21174430847168, "global_step": 485351, "epoch": 5847} {"train_loss": -26.918277740478516, "global_step": 485352, "epoch": 5847} {"train_loss": -26.856510162353516, "global_step": 485353, "epoch": 5847} {"train_loss": -27.656253814697266, "global_step": 485354, "epoch": 5847} {"train_loss": -27.167158126831055, "global_step": 485355, "epoch": 5847} {"train_loss": -27.1373291015625, "global_step": 485356, "epoch": 5847} {"train_loss": -27.3219051361084, "global_step": 485357, "epoch": 5847} {"train_loss": -26.923847198486328, "global_step": 485358, "epoch": 5847} {"train_loss": -27.482269287109375, "global_step": 485359, "epoch": 5847} {"train_loss": -27.007490158081055, "global_step": 485360, "epoch": 5847} {"train_loss": -27.320486068725586, "global_step": 485361, "epoch": 5847} {"train_loss": -27.531280517578125, "global_step": 485362, "epoch": 5847} {"train_loss": -27.48065185546875, "global_step": 485363, "epoch": 5847} {"train_loss": -27.513671875, "global_step": 485364, "epoch": 5847} {"train_loss": -27.177717208862305, "global_step": 485365, "epoch": 5847} {"train_loss": -26.82797622680664, "global_step": 485366, "epoch": 5847} {"train_loss": -26.62916374206543, "global_step": 485367, "epoch": 5847} {"train_loss": -27.45998191833496, "global_step": 485368, "epoch": 5847} {"train_loss": -27.47930908203125, "global_step": 485369, "epoch": 5847} {"train_loss": -26.82220458984375, "global_step": 485370, "epoch": 5847} {"train_loss": -27.085657119750977, "global_step": 485371, "epoch": 5847} {"train_loss": -27.02066421508789, "global_step": 485372, "epoch": 5847} {"train_loss": -27.094226837158203, "global_step": 485373, "epoch": 5847} {"train_loss": -27.448013305664062, "global_step": 485374, "epoch": 5847} {"train_loss": -27.45570945739746, "global_step": 485375, "epoch": 5847} {"train_loss": -27.374771118164062, "global_step": 485376, "epoch": 5847} {"train_loss": -27.18082046508789, "global_step": 485377, "epoch": 5847} {"train_loss": -26.952096939086914, "global_step": 485378, "epoch": 5847} {"train_loss": -27.36844253540039, "global_step": 485379, "epoch": 5847} {"train_loss": -27.760910034179688, "global_step": 485380, "epoch": 5847} {"train_loss": -26.867706298828125, "global_step": 485381, "epoch": 5847} {"train_loss": -27.363117218017578, "global_step": 485382, "epoch": 5847} {"train_loss": -27.15878286706396, "global_step": 485383, "epoch": 5847, "val_loss": 6514077.0} {"train_loss": -26.13221549987793, "global_step": 485384, "epoch": 5848} {"train_loss": -26.6032772064209, "global_step": 485385, "epoch": 5848} {"train_loss": -26.685216903686523, "global_step": 485386, "epoch": 5848} {"train_loss": -26.605741500854492, "global_step": 485387, "epoch": 5848} {"train_loss": -26.678802490234375, "global_step": 485388, "epoch": 5848} {"train_loss": -26.519214630126953, "global_step": 485389, "epoch": 5848} {"train_loss": -26.645044326782227, "global_step": 485390, "epoch": 5848} {"train_loss": -26.37379264831543, "global_step": 485391, "epoch": 5848} {"train_loss": -26.657108306884766, "global_step": 485392, "epoch": 5848} {"train_loss": -26.72650718688965, "global_step": 485393, "epoch": 5848} {"train_loss": -26.514196395874023, "global_step": 485394, "epoch": 5848} {"train_loss": -26.692426681518555, "global_step": 485395, "epoch": 5848} {"train_loss": -26.664770126342773, "global_step": 485396, "epoch": 5848} {"train_loss": -26.9444522857666, "global_step": 485397, "epoch": 5848} {"train_loss": -27.271337509155273, "global_step": 485398, "epoch": 5848} {"train_loss": -26.980443954467773, "global_step": 485399, "epoch": 5848} {"train_loss": -26.6478271484375, "global_step": 485400, "epoch": 5848} {"train_loss": -27.17500114440918, "global_step": 485401, "epoch": 5848} {"train_loss": -27.150373458862305, "global_step": 485402, "epoch": 5848} {"train_loss": -27.2360897064209, "global_step": 485403, "epoch": 5848} {"train_loss": -27.057397842407227, "global_step": 485404, "epoch": 5848} {"train_loss": -27.331470489501953, "global_step": 485405, "epoch": 5848} {"train_loss": -27.07356834411621, "global_step": 485406, "epoch": 5848} {"train_loss": -27.421537399291992, "global_step": 485407, "epoch": 5848} {"train_loss": -27.333927154541016, "global_step": 485408, "epoch": 5848} {"train_loss": -27.195697784423828, "global_step": 485409, "epoch": 5848} {"train_loss": -27.171289443969727, "global_step": 485410, "epoch": 5848} {"train_loss": -27.468582153320312, "global_step": 485411, "epoch": 5848} {"train_loss": -27.161733627319336, "global_step": 485412, "epoch": 5848} {"train_loss": -27.343366622924805, "global_step": 485413, "epoch": 5848} {"train_loss": -27.110095977783203, "global_step": 485414, "epoch": 5848} {"train_loss": -27.329010009765625, "global_step": 485415, "epoch": 5848} {"train_loss": -27.296789169311523, "global_step": 485416, "epoch": 5848} {"train_loss": -27.111536026000977, "global_step": 485417, "epoch": 5848} {"train_loss": -27.252161026000977, "global_step": 485418, "epoch": 5848} {"train_loss": -26.956830978393555, "global_step": 485419, "epoch": 5848} {"train_loss": -27.266178131103516, "global_step": 485420, "epoch": 5848} {"train_loss": -26.789682388305664, "global_step": 485421, "epoch": 5848} {"train_loss": -27.339752197265625, "global_step": 485422, "epoch": 5848} {"train_loss": -27.282819747924805, "global_step": 485423, "epoch": 5848} {"train_loss": -27.488285064697266, "global_step": 485424, "epoch": 5848} {"train_loss": -27.063077926635742, "global_step": 485425, "epoch": 5848} {"train_loss": -27.04450035095215, "global_step": 485426, "epoch": 5848} {"train_loss": -27.521167755126953, "global_step": 485427, "epoch": 5848} {"train_loss": -27.256513595581055, "global_step": 485428, "epoch": 5848} {"train_loss": -27.382659912109375, "global_step": 485429, "epoch": 5848} {"train_loss": -27.220977783203125, "global_step": 485430, "epoch": 5848} {"train_loss": -27.240055084228516, "global_step": 485431, "epoch": 5848} {"train_loss": -27.53883171081543, "global_step": 485432, "epoch": 5848} {"train_loss": -27.2272891998291, "global_step": 485433, "epoch": 5848} {"train_loss": -26.963876724243164, "global_step": 485434, "epoch": 5848} {"train_loss": -27.278223037719727, "global_step": 485435, "epoch": 5848} {"train_loss": -27.2273006439209, "global_step": 485436, "epoch": 5848} {"train_loss": -26.9025936126709, "global_step": 485437, "epoch": 5848} {"train_loss": -26.845617294311523, "global_step": 485438, "epoch": 5848} {"train_loss": -27.457691192626953, "global_step": 485439, "epoch": 5848} {"train_loss": -27.235095977783203, "global_step": 485440, "epoch": 5848} {"train_loss": -27.358434677124023, "global_step": 485441, "epoch": 5848} {"train_loss": -26.910449981689453, "global_step": 485442, "epoch": 5848} {"train_loss": -26.999603271484375, "global_step": 485443, "epoch": 5848} {"train_loss": -27.572433471679688, "global_step": 485444, "epoch": 5848} {"train_loss": -27.309417724609375, "global_step": 485445, "epoch": 5848} {"train_loss": -27.238981246948242, "global_step": 485446, "epoch": 5848} {"train_loss": -27.20533561706543, "global_step": 485447, "epoch": 5848} {"train_loss": -27.538497924804688, "global_step": 485448, "epoch": 5848} {"train_loss": -27.396902084350586, "global_step": 485449, "epoch": 5848} {"train_loss": -27.148792266845703, "global_step": 485450, "epoch": 5848} {"train_loss": -27.535139083862305, "global_step": 485451, "epoch": 5848} {"train_loss": -27.38661003112793, "global_step": 485452, "epoch": 5848} {"train_loss": -27.260120391845703, "global_step": 485453, "epoch": 5848} {"train_loss": -27.836334228515625, "global_step": 485454, "epoch": 5848} {"train_loss": -27.16448402404785, "global_step": 485455, "epoch": 5848} {"train_loss": -27.29286003112793, "global_step": 485456, "epoch": 5848} {"train_loss": -27.090208053588867, "global_step": 485457, "epoch": 5848} {"train_loss": -27.128015518188477, "global_step": 485458, "epoch": 5848} {"train_loss": -27.419193267822266, "global_step": 485459, "epoch": 5848} {"train_loss": -27.41278648376465, "global_step": 485460, "epoch": 5848} {"train_loss": -27.34456443786621, "global_step": 485461, "epoch": 5848} {"train_loss": -27.185516357421875, "global_step": 485462, "epoch": 5848} {"train_loss": -27.471887588500977, "global_step": 485463, "epoch": 5848} {"train_loss": -27.526060104370117, "global_step": 485464, "epoch": 5848} {"train_loss": -27.044952392578125, "global_step": 485465, "epoch": 5848} {"train_loss": -27.153951415096422, "global_step": 485466, "epoch": 5848, "val_loss": 6502272.0} {"train_loss": -25.36826515197754, "global_step": 485467, "epoch": 5849} {"train_loss": -25.387958526611328, "global_step": 485468, "epoch": 5849} {"train_loss": -25.9982852935791, "global_step": 485469, "epoch": 5849} {"train_loss": -26.053119659423828, "global_step": 485470, "epoch": 5849} {"train_loss": -26.690771102905273, "global_step": 485471, "epoch": 5849} {"train_loss": -26.38526725769043, "global_step": 485472, "epoch": 5849} {"train_loss": -26.999494552612305, "global_step": 485473, "epoch": 5849} {"train_loss": -26.122379302978516, "global_step": 485474, "epoch": 5849} {"train_loss": -26.304248809814453, "global_step": 485475, "epoch": 5849} {"train_loss": -26.508087158203125, "global_step": 485476, "epoch": 5849} {"train_loss": -26.59608268737793, "global_step": 485477, "epoch": 5849} {"train_loss": -26.345544815063477, "global_step": 485478, "epoch": 5849} {"train_loss": -27.11669921875, "global_step": 485479, "epoch": 5849} {"train_loss": -26.473974227905273, "global_step": 485480, "epoch": 5849} {"train_loss": -27.07594871520996, "global_step": 485481, "epoch": 5849} {"train_loss": -26.48972511291504, "global_step": 485482, "epoch": 5849} {"train_loss": -27.13347816467285, "global_step": 485483, "epoch": 5849} {"train_loss": -26.806640625, "global_step": 485484, "epoch": 5849} {"train_loss": -27.054279327392578, "global_step": 485485, "epoch": 5849} {"train_loss": -26.801130294799805, "global_step": 485486, "epoch": 5849} {"train_loss": -26.9390869140625, "global_step": 485487, "epoch": 5849} {"train_loss": -26.660781860351562, "global_step": 485488, "epoch": 5849} {"train_loss": -27.117040634155273, "global_step": 485489, "epoch": 5849} {"train_loss": -26.92361831665039, "global_step": 485490, "epoch": 5849} {"train_loss": -27.254011154174805, "global_step": 485491, "epoch": 5849} {"train_loss": -27.159826278686523, "global_step": 485492, "epoch": 5849} {"train_loss": -27.088972091674805, "global_step": 485493, "epoch": 5849} {"train_loss": -27.1882266998291, "global_step": 485494, "epoch": 5849} {"train_loss": -27.02625846862793, "global_step": 485495, "epoch": 5849} {"train_loss": -27.428449630737305, "global_step": 485496, "epoch": 5849} {"train_loss": -27.212146759033203, "global_step": 485497, "epoch": 5849} {"train_loss": -27.101232528686523, "global_step": 485498, "epoch": 5849} {"train_loss": -27.601667404174805, "global_step": 485499, "epoch": 5849} {"train_loss": -27.3542537689209, "global_step": 485500, "epoch": 5849} {"train_loss": -27.261402130126953, "global_step": 485501, "epoch": 5849} {"train_loss": -27.272871017456055, "global_step": 485502, "epoch": 5849} {"train_loss": -27.512409210205078, "global_step": 485503, "epoch": 5849} {"train_loss": -27.775983810424805, "global_step": 485504, "epoch": 5849} {"train_loss": -27.305465698242188, "global_step": 485505, "epoch": 5849} {"train_loss": -27.253355026245117, "global_step": 485506, "epoch": 5849} {"train_loss": -27.025678634643555, "global_step": 485507, "epoch": 5849} {"train_loss": -26.87458610534668, "global_step": 485508, "epoch": 5849} {"train_loss": -27.06485939025879, "global_step": 485509, "epoch": 5849} {"train_loss": -27.142425537109375, "global_step": 485510, "epoch": 5849} {"train_loss": -27.43059730529785, "global_step": 485511, "epoch": 5849} {"train_loss": -27.05994987487793, "global_step": 485512, "epoch": 5849} {"train_loss": -27.27947425842285, "global_step": 485513, "epoch": 5849} {"train_loss": -27.293609619140625, "global_step": 485514, "epoch": 5849} {"train_loss": -27.11533546447754, "global_step": 485515, "epoch": 5849} {"train_loss": -27.6550235748291, "global_step": 485516, "epoch": 5849} {"train_loss": -27.076492309570312, "global_step": 485517, "epoch": 5849} {"train_loss": -27.41853141784668, "global_step": 485518, "epoch": 5849} {"train_loss": -27.3677978515625, "global_step": 485519, "epoch": 5849} {"train_loss": -27.63922119140625, "global_step": 485520, "epoch": 5849} {"train_loss": -27.411273956298828, "global_step": 485521, "epoch": 5849} {"train_loss": -27.618671417236328, "global_step": 485522, "epoch": 5849} {"train_loss": -27.26276206970215, "global_step": 485523, "epoch": 5849} {"train_loss": -27.163694381713867, "global_step": 485524, "epoch": 5849} {"train_loss": -27.0188045501709, "global_step": 485525, "epoch": 5849} {"train_loss": -27.167646408081055, "global_step": 485526, "epoch": 5849} {"train_loss": -27.37091064453125, "global_step": 485527, "epoch": 5849} {"train_loss": -27.47719383239746, "global_step": 485528, "epoch": 5849} {"train_loss": -26.930469512939453, "global_step": 485529, "epoch": 5849} {"train_loss": -27.79296875, "global_step": 485530, "epoch": 5849} {"train_loss": -27.10847282409668, "global_step": 485531, "epoch": 5849} {"train_loss": -27.242582321166992, "global_step": 485532, "epoch": 5849} {"train_loss": -27.425968170166016, "global_step": 485533, "epoch": 5849} {"train_loss": -27.244474411010742, "global_step": 485534, "epoch": 5849} {"train_loss": -27.374414443969727, "global_step": 485535, "epoch": 5849} {"train_loss": -27.332685470581055, "global_step": 485536, "epoch": 5849} {"train_loss": -27.349145889282227, "global_step": 485537, "epoch": 5849} {"train_loss": -27.012678146362305, "global_step": 485538, "epoch": 5849} {"train_loss": -27.445966720581055, "global_step": 485539, "epoch": 5849} {"train_loss": -27.58961296081543, "global_step": 485540, "epoch": 5849} {"train_loss": -26.801563262939453, "global_step": 485541, "epoch": 5849} {"train_loss": -27.228137969970703, "global_step": 485542, "epoch": 5849} {"train_loss": -27.18336296081543, "global_step": 485543, "epoch": 5849} {"train_loss": -27.141071319580078, "global_step": 485544, "epoch": 5849} {"train_loss": -26.929845809936523, "global_step": 485545, "epoch": 5849} {"train_loss": -26.69708251953125, "global_step": 485546, "epoch": 5849} {"train_loss": -26.85047721862793, "global_step": 485547, "epoch": 5849} {"train_loss": -27.16156578063965, "global_step": 485548, "epoch": 5849} {"train_loss": -27.06829562819148, "global_step": 485549, "epoch": 5849, "val_loss": 6551964.0} {"train_loss": -27.564666748046875, "global_step": 485550, "epoch": 5850} {"train_loss": -26.9514102935791, "global_step": 485551, "epoch": 5850} {"train_loss": -27.141040802001953, "global_step": 485552, "epoch": 5850} {"train_loss": -27.3724365234375, "global_step": 485553, "epoch": 5850} {"train_loss": -27.405353546142578, "global_step": 485554, "epoch": 5850} {"train_loss": -26.388080596923828, "global_step": 485555, "epoch": 5850} {"train_loss": -26.9632511138916, "global_step": 485556, "epoch": 5850} {"train_loss": -26.847763061523438, "global_step": 485557, "epoch": 5850} {"train_loss": -27.123779296875, "global_step": 485558, "epoch": 5850} {"train_loss": -27.22515296936035, "global_step": 485559, "epoch": 5850} {"train_loss": -26.89533805847168, "global_step": 485560, "epoch": 5850} {"train_loss": -26.995553970336914, "global_step": 485561, "epoch": 5850} {"train_loss": -27.135366439819336, "global_step": 485562, "epoch": 5850} {"train_loss": -27.10560417175293, "global_step": 485563, "epoch": 5850} {"train_loss": -26.76117515563965, "global_step": 485564, "epoch": 5850} {"train_loss": -26.944244384765625, "global_step": 485565, "epoch": 5850} {"train_loss": -27.180225372314453, "global_step": 485566, "epoch": 5850} {"train_loss": -27.511362075805664, "global_step": 485567, "epoch": 5850} {"train_loss": -27.51496696472168, "global_step": 485568, "epoch": 5850} {"train_loss": -27.420169830322266, "global_step": 485569, "epoch": 5850} {"train_loss": -27.899133682250977, "global_step": 485570, "epoch": 5850} {"train_loss": -27.0768985748291, "global_step": 485571, "epoch": 5850} {"train_loss": -27.50702476501465, "global_step": 485572, "epoch": 5850} {"train_loss": -27.233051300048828, "global_step": 485573, "epoch": 5850} {"train_loss": -27.24420738220215, "global_step": 485574, "epoch": 5850} {"train_loss": -27.52585792541504, "global_step": 485575, "epoch": 5850} {"train_loss": -27.477270126342773, "global_step": 485576, "epoch": 5850} {"train_loss": -27.26716423034668, "global_step": 485577, "epoch": 5850} {"train_loss": -27.490354537963867, "global_step": 485578, "epoch": 5850} {"train_loss": -27.260059356689453, "global_step": 485579, "epoch": 5850} {"train_loss": -27.481311798095703, "global_step": 485580, "epoch": 5850} {"train_loss": -27.09674644470215, "global_step": 485581, "epoch": 5850} {"train_loss": -27.39088249206543, "global_step": 485582, "epoch": 5850} {"train_loss": -27.2528018951416, "global_step": 485583, "epoch": 5850} {"train_loss": -27.240386962890625, "global_step": 485584, "epoch": 5850} {"train_loss": -27.07415771484375, "global_step": 485585, "epoch": 5850} {"train_loss": -27.28253746032715, "global_step": 485586, "epoch": 5850} {"train_loss": -27.13666343688965, "global_step": 485587, "epoch": 5850} {"train_loss": -27.429981231689453, "global_step": 485588, "epoch": 5850} {"train_loss": -27.367380142211914, "global_step": 485589, "epoch": 5850} {"train_loss": -27.443450927734375, "global_step": 485590, "epoch": 5850} {"train_loss": -27.40821647644043, "global_step": 485591, "epoch": 5850} {"train_loss": -27.45526123046875, "global_step": 485592, "epoch": 5850} {"train_loss": -27.172677993774414, "global_step": 485593, "epoch": 5850} {"train_loss": -27.171777725219727, "global_step": 485594, "epoch": 5850} {"train_loss": -27.1317138671875, "global_step": 485595, "epoch": 5850} {"train_loss": -27.437936782836914, "global_step": 485596, "epoch": 5850} {"train_loss": -27.082014083862305, "global_step": 485597, "epoch": 5850} {"train_loss": -27.37883949279785, "global_step": 485598, "epoch": 5850} {"train_loss": -27.209716796875, "global_step": 485599, "epoch": 5850} {"train_loss": -27.4439754486084, "global_step": 485600, "epoch": 5850} {"train_loss": -26.869550704956055, "global_step": 485601, "epoch": 5850} {"train_loss": -27.1108341217041, "global_step": 485602, "epoch": 5850} {"train_loss": -27.12749671936035, "global_step": 485603, "epoch": 5850} {"train_loss": -26.740009307861328, "global_step": 485604, "epoch": 5850} {"train_loss": -27.41672134399414, "global_step": 485605, "epoch": 5850} {"train_loss": -27.055255889892578, "global_step": 485606, "epoch": 5850} {"train_loss": -27.325489044189453, "global_step": 485607, "epoch": 5850} {"train_loss": -27.34739112854004, "global_step": 485608, "epoch": 5850} {"train_loss": -27.15772819519043, "global_step": 485609, "epoch": 5850} {"train_loss": -27.50660514831543, "global_step": 485610, "epoch": 5850} {"train_loss": -27.347553253173828, "global_step": 485611, "epoch": 5850} {"train_loss": -27.035598754882812, "global_step": 485612, "epoch": 5850} {"train_loss": -27.408737182617188, "global_step": 485613, "epoch": 5850} {"train_loss": -27.04243278503418, "global_step": 485614, "epoch": 5850} {"train_loss": -27.524580001831055, "global_step": 485615, "epoch": 5850} {"train_loss": -27.41073989868164, "global_step": 485616, "epoch": 5850} {"train_loss": -26.797714233398438, "global_step": 485617, "epoch": 5850} {"train_loss": -26.863096237182617, "global_step": 485618, "epoch": 5850} {"train_loss": -27.387006759643555, "global_step": 485619, "epoch": 5850} {"train_loss": -27.506017684936523, "global_step": 485620, "epoch": 5850} {"train_loss": -27.320783615112305, "global_step": 485621, "epoch": 5850} {"train_loss": -27.01374626159668, "global_step": 485622, "epoch": 5850} {"train_loss": -27.22381019592285, "global_step": 485623, "epoch": 5850} {"train_loss": -26.83888816833496, "global_step": 485624, "epoch": 5850} {"train_loss": -27.09339714050293, "global_step": 485625, "epoch": 5850} {"train_loss": -27.379785537719727, "global_step": 485626, "epoch": 5850} {"train_loss": -27.05449867248535, "global_step": 485627, "epoch": 5850} {"train_loss": -27.263782501220703, "global_step": 485628, "epoch": 5850} {"train_loss": -27.465412139892578, "global_step": 485629, "epoch": 5850} {"train_loss": -27.576269149780273, "global_step": 485630, "epoch": 5850} {"train_loss": -27.5802059173584, "global_step": 485631, "epoch": 5850} {"train_loss": -27.223585082823973, "global_step": 485632, "epoch": 5850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6519649.0} {"train_loss": -26.907623291015625, "global_step": 485633, "epoch": 5851} {"train_loss": -26.592344284057617, "global_step": 485634, "epoch": 5851} {"train_loss": -27.039234161376953, "global_step": 485635, "epoch": 5851} {"train_loss": -26.9066162109375, "global_step": 485636, "epoch": 5851} {"train_loss": -27.01873779296875, "global_step": 485637, "epoch": 5851} {"train_loss": -27.02961540222168, "global_step": 485638, "epoch": 5851} {"train_loss": -26.969690322875977, "global_step": 485639, "epoch": 5851} {"train_loss": -27.173017501831055, "global_step": 485640, "epoch": 5851} {"train_loss": -27.006879806518555, "global_step": 485641, "epoch": 5851} {"train_loss": -27.278400421142578, "global_step": 485642, "epoch": 5851} {"train_loss": -27.02361488342285, "global_step": 485643, "epoch": 5851} {"train_loss": -27.30940818786621, "global_step": 485644, "epoch": 5851} {"train_loss": -27.240930557250977, "global_step": 485645, "epoch": 5851} {"train_loss": -27.1611385345459, "global_step": 485646, "epoch": 5851} {"train_loss": -26.911243438720703, "global_step": 485647, "epoch": 5851} {"train_loss": -27.925195693969727, "global_step": 485648, "epoch": 5851} {"train_loss": -26.93071937561035, "global_step": 485649, "epoch": 5851} {"train_loss": -27.069793701171875, "global_step": 485650, "epoch": 5851} {"train_loss": -27.2215576171875, "global_step": 485651, "epoch": 5851} {"train_loss": -27.650257110595703, "global_step": 485652, "epoch": 5851} {"train_loss": -27.3406925201416, "global_step": 485653, "epoch": 5851} {"train_loss": -27.09026527404785, "global_step": 485654, "epoch": 5851} {"train_loss": -27.157453536987305, "global_step": 485655, "epoch": 5851} {"train_loss": -27.3725528717041, "global_step": 485656, "epoch": 5851} {"train_loss": -27.198516845703125, "global_step": 485657, "epoch": 5851} {"train_loss": -27.010915756225586, "global_step": 485658, "epoch": 5851} {"train_loss": -27.004287719726562, "global_step": 485659, "epoch": 5851} {"train_loss": -27.354175567626953, "global_step": 485660, "epoch": 5851} {"train_loss": -27.031707763671875, "global_step": 485661, "epoch": 5851} {"train_loss": -27.143905639648438, "global_step": 485662, "epoch": 5851} {"train_loss": -27.25953483581543, "global_step": 485663, "epoch": 5851} {"train_loss": -26.830286026000977, "global_step": 485664, "epoch": 5851} {"train_loss": -27.2796688079834, "global_step": 485665, "epoch": 5851} {"train_loss": -27.12628173828125, "global_step": 485666, "epoch": 5851} {"train_loss": -26.68385887145996, "global_step": 485667, "epoch": 5851} {"train_loss": -26.624662399291992, "global_step": 485668, "epoch": 5851} {"train_loss": -27.396963119506836, "global_step": 485669, "epoch": 5851} {"train_loss": -26.8708553314209, "global_step": 485670, "epoch": 5851} {"train_loss": -27.377685546875, "global_step": 485671, "epoch": 5851} {"train_loss": -27.046680450439453, "global_step": 485672, "epoch": 5851} {"train_loss": -27.00201988220215, "global_step": 485673, "epoch": 5851} {"train_loss": -27.188262939453125, "global_step": 485674, "epoch": 5851} {"train_loss": -27.197187423706055, "global_step": 485675, "epoch": 5851} {"train_loss": -27.3844051361084, "global_step": 485676, "epoch": 5851} {"train_loss": -26.785415649414062, "global_step": 485677, "epoch": 5851} {"train_loss": -27.497007369995117, "global_step": 485678, "epoch": 5851} {"train_loss": -27.530847549438477, "global_step": 485679, "epoch": 5851} {"train_loss": -27.314802169799805, "global_step": 485680, "epoch": 5851} {"train_loss": -27.536640167236328, "global_step": 485681, "epoch": 5851} {"train_loss": -27.267292022705078, "global_step": 485682, "epoch": 5851} {"train_loss": -27.04656410217285, "global_step": 485683, "epoch": 5851} {"train_loss": -27.488819122314453, "global_step": 485684, "epoch": 5851} {"train_loss": -27.5725154876709, "global_step": 485685, "epoch": 5851} {"train_loss": -27.161945343017578, "global_step": 485686, "epoch": 5851} {"train_loss": -26.89151382446289, "global_step": 485687, "epoch": 5851} {"train_loss": -27.244647979736328, "global_step": 485688, "epoch": 5851} {"train_loss": -27.131444931030273, "global_step": 485689, "epoch": 5851} {"train_loss": -27.029767990112305, "global_step": 485690, "epoch": 5851} {"train_loss": -27.7193660736084, "global_step": 485691, "epoch": 5851} {"train_loss": -27.39434814453125, "global_step": 485692, "epoch": 5851} {"train_loss": -27.18307876586914, "global_step": 485693, "epoch": 5851} {"train_loss": -27.169483184814453, "global_step": 485694, "epoch": 5851} {"train_loss": -27.215925216674805, "global_step": 485695, "epoch": 5851} {"train_loss": -27.234760284423828, "global_step": 485696, "epoch": 5851} {"train_loss": -27.322452545166016, "global_step": 485697, "epoch": 5851} {"train_loss": -27.549915313720703, "global_step": 485698, "epoch": 5851} {"train_loss": -27.512542724609375, "global_step": 485699, "epoch": 5851} {"train_loss": -27.323150634765625, "global_step": 485700, "epoch": 5851} {"train_loss": -27.456586837768555, "global_step": 485701, "epoch": 5851} {"train_loss": -27.4403133392334, "global_step": 485702, "epoch": 5851} {"train_loss": -27.70246696472168, "global_step": 485703, "epoch": 5851} {"train_loss": -27.271223068237305, "global_step": 485704, "epoch": 5851} {"train_loss": -27.478092193603516, "global_step": 485705, "epoch": 5851} {"train_loss": -27.11347007751465, "global_step": 485706, "epoch": 5851} {"train_loss": -27.65521240234375, "global_step": 485707, "epoch": 5851} {"train_loss": -27.741226196289062, "global_step": 485708, "epoch": 5851} {"train_loss": -27.24595069885254, "global_step": 485709, "epoch": 5851} {"train_loss": -27.655668258666992, "global_step": 485710, "epoch": 5851} {"train_loss": -27.390100479125977, "global_step": 485711, "epoch": 5851} {"train_loss": -27.093252182006836, "global_step": 485712, "epoch": 5851} {"train_loss": -26.471052169799805, "global_step": 485713, "epoch": 5851} {"train_loss": -27.061086654663086, "global_step": 485714, "epoch": 5851} {"train_loss": -27.219938048397204, "global_step": 485715, "epoch": 5851, "val_loss": 6419692.0} {"train_loss": -26.06515884399414, "global_step": 485716, "epoch": 5852} {"train_loss": -24.555522918701172, "global_step": 485717, "epoch": 5852} {"train_loss": -24.62990379333496, "global_step": 485718, "epoch": 5852} {"train_loss": -25.611921310424805, "global_step": 485719, "epoch": 5852} {"train_loss": -24.5637149810791, "global_step": 485720, "epoch": 5852} {"train_loss": -25.556804656982422, "global_step": 485721, "epoch": 5852} {"train_loss": -25.471548080444336, "global_step": 485722, "epoch": 5852} {"train_loss": -26.186431884765625, "global_step": 485723, "epoch": 5852} {"train_loss": -25.234371185302734, "global_step": 485724, "epoch": 5852} {"train_loss": -25.530061721801758, "global_step": 485725, "epoch": 5852} {"train_loss": -25.940359115600586, "global_step": 485726, "epoch": 5852} {"train_loss": -26.228958129882812, "global_step": 485727, "epoch": 5852} {"train_loss": -26.127979278564453, "global_step": 485728, "epoch": 5852} {"train_loss": -26.028701782226562, "global_step": 485729, "epoch": 5852} {"train_loss": -26.172719955444336, "global_step": 485730, "epoch": 5852} {"train_loss": -26.6433048248291, "global_step": 485731, "epoch": 5852} {"train_loss": -26.618276596069336, "global_step": 485732, "epoch": 5852} {"train_loss": -26.372791290283203, "global_step": 485733, "epoch": 5852} {"train_loss": -26.616941452026367, "global_step": 485734, "epoch": 5852} {"train_loss": -26.4256534576416, "global_step": 485735, "epoch": 5852} {"train_loss": -26.21820640563965, "global_step": 485736, "epoch": 5852} {"train_loss": -26.5131778717041, "global_step": 485737, "epoch": 5852} {"train_loss": -26.5841121673584, "global_step": 485738, "epoch": 5852} {"train_loss": -26.601499557495117, "global_step": 485739, "epoch": 5852} {"train_loss": -26.381006240844727, "global_step": 485740, "epoch": 5852} {"train_loss": -26.856969833374023, "global_step": 485741, "epoch": 5852} {"train_loss": -27.0327205657959, "global_step": 485742, "epoch": 5852} {"train_loss": -26.633453369140625, "global_step": 485743, "epoch": 5852} {"train_loss": -26.482507705688477, "global_step": 485744, "epoch": 5852} {"train_loss": -26.959762573242188, "global_step": 485745, "epoch": 5852} {"train_loss": -26.996017456054688, "global_step": 485746, "epoch": 5852} {"train_loss": -26.796630859375, "global_step": 485747, "epoch": 5852} {"train_loss": -26.769983291625977, "global_step": 485748, "epoch": 5852} {"train_loss": -27.07501792907715, "global_step": 485749, "epoch": 5852} {"train_loss": -27.168603897094727, "global_step": 485750, "epoch": 5852} {"train_loss": -26.886646270751953, "global_step": 485751, "epoch": 5852} {"train_loss": -27.29021644592285, "global_step": 485752, "epoch": 5852} {"train_loss": -26.98417091369629, "global_step": 485753, "epoch": 5852} {"train_loss": -27.319950103759766, "global_step": 485754, "epoch": 5852} {"train_loss": -27.06171226501465, "global_step": 485755, "epoch": 5852} {"train_loss": -26.898828506469727, "global_step": 485756, "epoch": 5852} {"train_loss": -27.19097328186035, "global_step": 485757, "epoch": 5852} {"train_loss": -27.6397762298584, "global_step": 485758, "epoch": 5852} {"train_loss": -27.4201717376709, "global_step": 485759, "epoch": 5852} {"train_loss": -27.381500244140625, "global_step": 485760, "epoch": 5852} {"train_loss": -27.5015811920166, "global_step": 485761, "epoch": 5852} {"train_loss": -27.501195907592773, "global_step": 485762, "epoch": 5852} {"train_loss": -27.191503524780273, "global_step": 485763, "epoch": 5852} {"train_loss": -27.866138458251953, "global_step": 485764, "epoch": 5852} {"train_loss": -27.21114158630371, "global_step": 485765, "epoch": 5852} {"train_loss": -27.551828384399414, "global_step": 485766, "epoch": 5852} {"train_loss": -27.2877140045166, "global_step": 485767, "epoch": 5852} {"train_loss": -27.62324333190918, "global_step": 485768, "epoch": 5852} {"train_loss": -27.57159996032715, "global_step": 485769, "epoch": 5852} {"train_loss": -27.33741569519043, "global_step": 485770, "epoch": 5852} {"train_loss": -27.550756454467773, "global_step": 485771, "epoch": 5852} {"train_loss": -27.413862228393555, "global_step": 485772, "epoch": 5852} {"train_loss": -27.296722412109375, "global_step": 485773, "epoch": 5852} {"train_loss": -27.26753044128418, "global_step": 485774, "epoch": 5852} {"train_loss": -27.310361862182617, "global_step": 485775, "epoch": 5852} {"train_loss": -27.41511344909668, "global_step": 485776, "epoch": 5852} {"train_loss": -27.639053344726562, "global_step": 485777, "epoch": 5852} {"train_loss": -27.5902156829834, "global_step": 485778, "epoch": 5852} {"train_loss": -27.351572036743164, "global_step": 485779, "epoch": 5852} {"train_loss": -27.236663818359375, "global_step": 485780, "epoch": 5852} {"train_loss": -27.355499267578125, "global_step": 485781, "epoch": 5852} {"train_loss": -27.36112403869629, "global_step": 485782, "epoch": 5852} {"train_loss": -27.246124267578125, "global_step": 485783, "epoch": 5852} {"train_loss": -27.02021598815918, "global_step": 485784, "epoch": 5852} {"train_loss": -26.92983055114746, "global_step": 485785, "epoch": 5852} {"train_loss": -27.002552032470703, "global_step": 485786, "epoch": 5852} {"train_loss": -27.366275787353516, "global_step": 485787, "epoch": 5852} {"train_loss": -27.388639450073242, "global_step": 485788, "epoch": 5852} {"train_loss": -27.393491744995117, "global_step": 485789, "epoch": 5852} {"train_loss": -27.18719482421875, "global_step": 485790, "epoch": 5852} {"train_loss": -27.238012313842773, "global_step": 485791, "epoch": 5852} {"train_loss": -27.408008575439453, "global_step": 485792, "epoch": 5852} {"train_loss": -27.068700790405273, "global_step": 485793, "epoch": 5852} {"train_loss": -27.36578941345215, "global_step": 485794, "epoch": 5852} {"train_loss": -27.454938888549805, "global_step": 485795, "epoch": 5852} {"train_loss": -27.2039737701416, "global_step": 485796, "epoch": 5852} {"train_loss": -26.79426383972168, "global_step": 485797, "epoch": 5852} {"train_loss": -26.854084635355388, "global_step": 485798, "epoch": 5852, "val_loss": 6499524.0} {"train_loss": -26.90162467956543, "global_step": 485799, "epoch": 5853} {"train_loss": -27.218292236328125, "global_step": 485800, "epoch": 5853} {"train_loss": -27.5096492767334, "global_step": 485801, "epoch": 5853} {"train_loss": -27.155029296875, "global_step": 485802, "epoch": 5853} {"train_loss": -27.169443130493164, "global_step": 485803, "epoch": 5853} {"train_loss": -26.8280029296875, "global_step": 485804, "epoch": 5853} {"train_loss": -26.966266632080078, "global_step": 485805, "epoch": 5853} {"train_loss": -27.19056510925293, "global_step": 485806, "epoch": 5853} {"train_loss": -27.279743194580078, "global_step": 485807, "epoch": 5853} {"train_loss": -26.899118423461914, "global_step": 485808, "epoch": 5853} {"train_loss": -27.069110870361328, "global_step": 485809, "epoch": 5853} {"train_loss": -27.420337677001953, "global_step": 485810, "epoch": 5853} {"train_loss": -27.19413185119629, "global_step": 485811, "epoch": 5853} {"train_loss": -26.97920036315918, "global_step": 485812, "epoch": 5853} {"train_loss": -27.319238662719727, "global_step": 485813, "epoch": 5853} {"train_loss": -27.29483985900879, "global_step": 485814, "epoch": 5853} {"train_loss": -27.501001358032227, "global_step": 485815, "epoch": 5853} {"train_loss": -27.4581298828125, "global_step": 485816, "epoch": 5853} {"train_loss": -27.524473190307617, "global_step": 485817, "epoch": 5853} {"train_loss": -27.488473892211914, "global_step": 485818, "epoch": 5853} {"train_loss": -27.539304733276367, "global_step": 485819, "epoch": 5853} {"train_loss": -27.2576847076416, "global_step": 485820, "epoch": 5853} {"train_loss": -27.42184829711914, "global_step": 485821, "epoch": 5853} {"train_loss": -27.23475456237793, "global_step": 485822, "epoch": 5853} {"train_loss": -27.55109214782715, "global_step": 485823, "epoch": 5853} {"train_loss": -27.01104736328125, "global_step": 485824, "epoch": 5853} {"train_loss": -27.522144317626953, "global_step": 485825, "epoch": 5853} {"train_loss": -27.14789390563965, "global_step": 485826, "epoch": 5853} {"train_loss": -27.758634567260742, "global_step": 485827, "epoch": 5853} {"train_loss": -27.337202072143555, "global_step": 485828, "epoch": 5853} {"train_loss": -27.004867553710938, "global_step": 485829, "epoch": 5853} {"train_loss": -27.378629684448242, "global_step": 485830, "epoch": 5853} {"train_loss": -27.3698673248291, "global_step": 485831, "epoch": 5853} {"train_loss": -27.250280380249023, "global_step": 485832, "epoch": 5853} {"train_loss": -26.692596435546875, "global_step": 485833, "epoch": 5853} {"train_loss": -27.294189453125, "global_step": 485834, "epoch": 5853} {"train_loss": -27.185041427612305, "global_step": 485835, "epoch": 5853} {"train_loss": -26.9542293548584, "global_step": 485836, "epoch": 5853} {"train_loss": -27.482532501220703, "global_step": 485837, "epoch": 5853} {"train_loss": -27.410369873046875, "global_step": 485838, "epoch": 5853} {"train_loss": -27.36493492126465, "global_step": 485839, "epoch": 5853} {"train_loss": -27.113183975219727, "global_step": 485840, "epoch": 5853} {"train_loss": -27.1818790435791, "global_step": 485841, "epoch": 5853} {"train_loss": -27.505151748657227, "global_step": 485842, "epoch": 5853} {"train_loss": -27.119115829467773, "global_step": 485843, "epoch": 5853} {"train_loss": -27.053821563720703, "global_step": 485844, "epoch": 5853} {"train_loss": -27.284963607788086, "global_step": 485845, "epoch": 5853} {"train_loss": -27.1130313873291, "global_step": 485846, "epoch": 5853} {"train_loss": -27.42864418029785, "global_step": 485847, "epoch": 5853} {"train_loss": -27.4322509765625, "global_step": 485848, "epoch": 5853} {"train_loss": -27.29743766784668, "global_step": 485849, "epoch": 5853} {"train_loss": -27.432580947875977, "global_step": 485850, "epoch": 5853} {"train_loss": -26.946481704711914, "global_step": 485851, "epoch": 5853} {"train_loss": -27.383214950561523, "global_step": 485852, "epoch": 5853} {"train_loss": -27.214136123657227, "global_step": 485853, "epoch": 5853} {"train_loss": -27.0733585357666, "global_step": 485854, "epoch": 5853} {"train_loss": -27.509845733642578, "global_step": 485855, "epoch": 5853} {"train_loss": -27.160825729370117, "global_step": 485856, "epoch": 5853} {"train_loss": -26.560766220092773, "global_step": 485857, "epoch": 5853} {"train_loss": -26.5393123626709, "global_step": 485858, "epoch": 5853} {"train_loss": -26.89239501953125, "global_step": 485859, "epoch": 5853} {"train_loss": -27.0937557220459, "global_step": 485860, "epoch": 5853} {"train_loss": -27.183923721313477, "global_step": 485861, "epoch": 5853} {"train_loss": -27.195905685424805, "global_step": 485862, "epoch": 5853} {"train_loss": -27.692066192626953, "global_step": 485863, "epoch": 5853} {"train_loss": -26.96549415588379, "global_step": 485864, "epoch": 5853} {"train_loss": -27.362096786499023, "global_step": 485865, "epoch": 5853} {"train_loss": -27.56705665588379, "global_step": 485866, "epoch": 5853} {"train_loss": -27.362356185913086, "global_step": 485867, "epoch": 5853} {"train_loss": -27.139999389648438, "global_step": 485868, "epoch": 5853} {"train_loss": -27.0557861328125, "global_step": 485869, "epoch": 5853} {"train_loss": -27.385095596313477, "global_step": 485870, "epoch": 5853} {"train_loss": -27.472509384155273, "global_step": 485871, "epoch": 5853} {"train_loss": -27.455005645751953, "global_step": 485872, "epoch": 5853} {"train_loss": -27.516637802124023, "global_step": 485873, "epoch": 5853} {"train_loss": -27.383573532104492, "global_step": 485874, "epoch": 5853} {"train_loss": -27.37483024597168, "global_step": 485875, "epoch": 5853} {"train_loss": -27.611108779907227, "global_step": 485876, "epoch": 5853} {"train_loss": -26.881793975830078, "global_step": 485877, "epoch": 5853} {"train_loss": -27.41144371032715, "global_step": 485878, "epoch": 5853} {"train_loss": -26.9359188079834, "global_step": 485879, "epoch": 5853} {"train_loss": -26.90827751159668, "global_step": 485880, "epoch": 5853} {"train_loss": -27.237159246421722, "global_step": 485881, "epoch": 5853, "val_loss": 6489537.0} {"train_loss": -25.557748794555664, "global_step": 485882, "epoch": 5854} {"train_loss": -23.61402130126953, "global_step": 485883, "epoch": 5854} {"train_loss": -25.124486923217773, "global_step": 485884, "epoch": 5854} {"train_loss": -26.889230728149414, "global_step": 485885, "epoch": 5854} {"train_loss": -25.408294677734375, "global_step": 485886, "epoch": 5854} {"train_loss": -26.574493408203125, "global_step": 485887, "epoch": 5854} {"train_loss": -25.854284286499023, "global_step": 485888, "epoch": 5854} {"train_loss": -26.324451446533203, "global_step": 485889, "epoch": 5854} {"train_loss": -26.705154418945312, "global_step": 485890, "epoch": 5854} {"train_loss": -26.401941299438477, "global_step": 485891, "epoch": 5854} {"train_loss": -26.169103622436523, "global_step": 485892, "epoch": 5854} {"train_loss": -26.364593505859375, "global_step": 485893, "epoch": 5854} {"train_loss": -26.818979263305664, "global_step": 485894, "epoch": 5854} {"train_loss": -26.687213897705078, "global_step": 485895, "epoch": 5854} {"train_loss": -26.773700714111328, "global_step": 485896, "epoch": 5854} {"train_loss": -26.759735107421875, "global_step": 485897, "epoch": 5854} {"train_loss": -26.413742065429688, "global_step": 485898, "epoch": 5854} {"train_loss": -26.54133415222168, "global_step": 485899, "epoch": 5854} {"train_loss": -26.7846736907959, "global_step": 485900, "epoch": 5854} {"train_loss": -26.626798629760742, "global_step": 485901, "epoch": 5854} {"train_loss": -26.80157470703125, "global_step": 485902, "epoch": 5854} {"train_loss": -26.887939453125, "global_step": 485903, "epoch": 5854} {"train_loss": -26.964344024658203, "global_step": 485904, "epoch": 5854} {"train_loss": -26.99200439453125, "global_step": 485905, "epoch": 5854} {"train_loss": -27.2839412689209, "global_step": 485906, "epoch": 5854} {"train_loss": -27.404062271118164, "global_step": 485907, "epoch": 5854} {"train_loss": -26.75050163269043, "global_step": 485908, "epoch": 5854} {"train_loss": -27.207502365112305, "global_step": 485909, "epoch": 5854} {"train_loss": -26.831384658813477, "global_step": 485910, "epoch": 5854} {"train_loss": -27.0957088470459, "global_step": 485911, "epoch": 5854} {"train_loss": -27.06744384765625, "global_step": 485912, "epoch": 5854} {"train_loss": -27.251874923706055, "global_step": 485913, "epoch": 5854} {"train_loss": -27.128742218017578, "global_step": 485914, "epoch": 5854} {"train_loss": -27.152191162109375, "global_step": 485915, "epoch": 5854} {"train_loss": -27.094079971313477, "global_step": 485916, "epoch": 5854} {"train_loss": -27.141401290893555, "global_step": 485917, "epoch": 5854} {"train_loss": -27.109516143798828, "global_step": 485918, "epoch": 5854} {"train_loss": -27.29485511779785, "global_step": 485919, "epoch": 5854} {"train_loss": -27.328527450561523, "global_step": 485920, "epoch": 5854} {"train_loss": -27.282196044921875, "global_step": 485921, "epoch": 5854} {"train_loss": -27.36264419555664, "global_step": 485922, "epoch": 5854} {"train_loss": -27.1763973236084, "global_step": 485923, "epoch": 5854} {"train_loss": -27.60883903503418, "global_step": 485924, "epoch": 5854} {"train_loss": -27.646947860717773, "global_step": 485925, "epoch": 5854} {"train_loss": -27.527490615844727, "global_step": 485926, "epoch": 5854} {"train_loss": -27.501800537109375, "global_step": 485927, "epoch": 5854} {"train_loss": -27.121084213256836, "global_step": 485928, "epoch": 5854} {"train_loss": -27.127567291259766, "global_step": 485929, "epoch": 5854} {"train_loss": -27.477832794189453, "global_step": 485930, "epoch": 5854} {"train_loss": -27.617919921875, "global_step": 485931, "epoch": 5854} {"train_loss": -27.273767471313477, "global_step": 485932, "epoch": 5854} {"train_loss": -27.132862091064453, "global_step": 485933, "epoch": 5854} {"train_loss": -27.42548942565918, "global_step": 485934, "epoch": 5854} {"train_loss": -27.110177993774414, "global_step": 485935, "epoch": 5854} {"train_loss": -27.543699264526367, "global_step": 485936, "epoch": 5854} {"train_loss": -27.597875595092773, "global_step": 485937, "epoch": 5854} {"train_loss": -27.254638671875, "global_step": 485938, "epoch": 5854} {"train_loss": -27.279783248901367, "global_step": 485939, "epoch": 5854} {"train_loss": -27.518156051635742, "global_step": 485940, "epoch": 5854} {"train_loss": -27.224945068359375, "global_step": 485941, "epoch": 5854} {"train_loss": -27.035400390625, "global_step": 485942, "epoch": 5854} {"train_loss": -27.396209716796875, "global_step": 485943, "epoch": 5854} {"train_loss": -27.53249168395996, "global_step": 485944, "epoch": 5854} {"train_loss": -27.16800880432129, "global_step": 485945, "epoch": 5854} {"train_loss": -26.869115829467773, "global_step": 485946, "epoch": 5854} {"train_loss": -27.3241024017334, "global_step": 485947, "epoch": 5854} {"train_loss": -27.366016387939453, "global_step": 485948, "epoch": 5854} {"train_loss": -27.168888092041016, "global_step": 485949, "epoch": 5854} {"train_loss": -27.30909538269043, "global_step": 485950, "epoch": 5854} {"train_loss": -27.348962783813477, "global_step": 485951, "epoch": 5854} {"train_loss": -27.417011260986328, "global_step": 485952, "epoch": 5854} {"train_loss": -26.851255416870117, "global_step": 485953, "epoch": 5854} {"train_loss": -27.184741973876953, "global_step": 485954, "epoch": 5854} {"train_loss": -27.045446395874023, "global_step": 485955, "epoch": 5854} {"train_loss": -27.274381637573242, "global_step": 485956, "epoch": 5854} {"train_loss": -26.545642852783203, "global_step": 485957, "epoch": 5854} {"train_loss": -27.327346801757812, "global_step": 485958, "epoch": 5854} {"train_loss": -27.015777587890625, "global_step": 485959, "epoch": 5854} {"train_loss": -27.249364852905273, "global_step": 485960, "epoch": 5854} {"train_loss": -27.13677406311035, "global_step": 485961, "epoch": 5854} {"train_loss": -27.168365478515625, "global_step": 485962, "epoch": 5854} {"train_loss": -27.130661010742188, "global_step": 485963, "epoch": 5854} {"train_loss": -26.97001700803458, "global_step": 485964, "epoch": 5854, "val_loss": 6497598.0} {"train_loss": -26.95242691040039, "global_step": 485965, "epoch": 5855} {"train_loss": -27.067249298095703, "global_step": 485966, "epoch": 5855} {"train_loss": -27.357147216796875, "global_step": 485967, "epoch": 5855} {"train_loss": -26.76859474182129, "global_step": 485968, "epoch": 5855} {"train_loss": -26.704538345336914, "global_step": 485969, "epoch": 5855} {"train_loss": -26.95819091796875, "global_step": 485970, "epoch": 5855} {"train_loss": -26.849390029907227, "global_step": 485971, "epoch": 5855} {"train_loss": -27.106496810913086, "global_step": 485972, "epoch": 5855} {"train_loss": -27.37836265563965, "global_step": 485973, "epoch": 5855} {"train_loss": -26.907184600830078, "global_step": 485974, "epoch": 5855} {"train_loss": -27.040964126586914, "global_step": 485975, "epoch": 5855} {"train_loss": -26.902448654174805, "global_step": 485976, "epoch": 5855} {"train_loss": -26.801055908203125, "global_step": 485977, "epoch": 5855} {"train_loss": -27.151493072509766, "global_step": 485978, "epoch": 5855} {"train_loss": -26.907215118408203, "global_step": 485979, "epoch": 5855} {"train_loss": -27.248754501342773, "global_step": 485980, "epoch": 5855} {"train_loss": -26.94684410095215, "global_step": 485981, "epoch": 5855} {"train_loss": -26.824872970581055, "global_step": 485982, "epoch": 5855} {"train_loss": -27.696441650390625, "global_step": 485983, "epoch": 5855} {"train_loss": -27.087621688842773, "global_step": 485984, "epoch": 5855} {"train_loss": -27.325185775756836, "global_step": 485985, "epoch": 5855} {"train_loss": -27.121633529663086, "global_step": 485986, "epoch": 5855} {"train_loss": -27.526376724243164, "global_step": 485987, "epoch": 5855} {"train_loss": -27.286014556884766, "global_step": 485988, "epoch": 5855} {"train_loss": -27.104816436767578, "global_step": 485989, "epoch": 5855} {"train_loss": -27.5399169921875, "global_step": 485990, "epoch": 5855} {"train_loss": -27.30413246154785, "global_step": 485991, "epoch": 5855} {"train_loss": -27.4459285736084, "global_step": 485992, "epoch": 5855} {"train_loss": -27.402551651000977, "global_step": 485993, "epoch": 5855} {"train_loss": -27.083433151245117, "global_step": 485994, "epoch": 5855} {"train_loss": -27.21514320373535, "global_step": 485995, "epoch": 5855} {"train_loss": -27.441526412963867, "global_step": 485996, "epoch": 5855} {"train_loss": -27.23146629333496, "global_step": 485997, "epoch": 5855} {"train_loss": -27.470739364624023, "global_step": 485998, "epoch": 5855} {"train_loss": -27.212377548217773, "global_step": 485999, "epoch": 5855} {"train_loss": -27.71832275390625, "global_step": 486000, "epoch": 5855} {"train_loss": -27.357803344726562, "global_step": 486001, "epoch": 5855} {"train_loss": -27.355127334594727, "global_step": 486002, "epoch": 5855} {"train_loss": -26.555988311767578, "global_step": 486003, "epoch": 5855} {"train_loss": -26.615020751953125, "global_step": 486004, "epoch": 5855} {"train_loss": -26.92390251159668, "global_step": 486005, "epoch": 5855} {"train_loss": -26.674646377563477, "global_step": 486006, "epoch": 5855} {"train_loss": -26.861047744750977, "global_step": 486007, "epoch": 5855} {"train_loss": -27.24407958984375, "global_step": 486008, "epoch": 5855} {"train_loss": -27.14927101135254, "global_step": 486009, "epoch": 5855} {"train_loss": -26.413116455078125, "global_step": 486010, "epoch": 5855} {"train_loss": -26.73822593688965, "global_step": 486011, "epoch": 5855} {"train_loss": -27.153074264526367, "global_step": 486012, "epoch": 5855} {"train_loss": -27.35601806640625, "global_step": 486013, "epoch": 5855} {"train_loss": -27.16438865661621, "global_step": 486014, "epoch": 5855} {"train_loss": -27.2404842376709, "global_step": 486015, "epoch": 5855} {"train_loss": -27.272077560424805, "global_step": 486016, "epoch": 5855} {"train_loss": -27.44403076171875, "global_step": 486017, "epoch": 5855} {"train_loss": -27.0893497467041, "global_step": 486018, "epoch": 5855} {"train_loss": -27.326282501220703, "global_step": 486019, "epoch": 5855} {"train_loss": -27.24729347229004, "global_step": 486020, "epoch": 5855} {"train_loss": -27.225265502929688, "global_step": 486021, "epoch": 5855} {"train_loss": -27.51873779296875, "global_step": 486022, "epoch": 5855} {"train_loss": -27.228422164916992, "global_step": 486023, "epoch": 5855} {"train_loss": -27.654016494750977, "global_step": 486024, "epoch": 5855} {"train_loss": -27.600387573242188, "global_step": 486025, "epoch": 5855} {"train_loss": -27.504108428955078, "global_step": 486026, "epoch": 5855} {"train_loss": -27.5159912109375, "global_step": 486027, "epoch": 5855} {"train_loss": -27.54300880432129, "global_step": 486028, "epoch": 5855} {"train_loss": -27.315448760986328, "global_step": 486029, "epoch": 5855} {"train_loss": -27.716033935546875, "global_step": 486030, "epoch": 5855} {"train_loss": -27.65692710876465, "global_step": 486031, "epoch": 5855} {"train_loss": -27.40077781677246, "global_step": 486032, "epoch": 5855} {"train_loss": -27.50422477722168, "global_step": 486033, "epoch": 5855} {"train_loss": -27.336780548095703, "global_step": 486034, "epoch": 5855} {"train_loss": -27.866455078125, "global_step": 486035, "epoch": 5855} {"train_loss": -27.465652465820312, "global_step": 486036, "epoch": 5855} {"train_loss": -27.401325225830078, "global_step": 486037, "epoch": 5855} {"train_loss": -27.101465225219727, "global_step": 486038, "epoch": 5855} {"train_loss": -27.1066837310791, "global_step": 486039, "epoch": 5855} {"train_loss": -27.105743408203125, "global_step": 486040, "epoch": 5855} {"train_loss": -27.172672271728516, "global_step": 486041, "epoch": 5855} {"train_loss": -27.058765411376953, "global_step": 486042, "epoch": 5855} {"train_loss": -27.06171226501465, "global_step": 486043, "epoch": 5855} {"train_loss": -27.37247085571289, "global_step": 486044, "epoch": 5855} {"train_loss": -26.32395362854004, "global_step": 486045, "epoch": 5855} {"train_loss": -26.41172218322754, "global_step": 486046, "epoch": 5855} {"train_loss": -27.176537318402026, "global_step": 486047, "epoch": 5855, "val_loss": 6482509.5} {"train_loss": -23.536733627319336, "global_step": 486048, "epoch": 5856} {"train_loss": -25.152441024780273, "global_step": 486049, "epoch": 5856} {"train_loss": -25.88260269165039, "global_step": 486050, "epoch": 5856} {"train_loss": -25.786468505859375, "global_step": 486051, "epoch": 5856} {"train_loss": -25.417814254760742, "global_step": 486052, "epoch": 5856} {"train_loss": -26.462055206298828, "global_step": 486053, "epoch": 5856} {"train_loss": -25.636701583862305, "global_step": 486054, "epoch": 5856} {"train_loss": -26.047204971313477, "global_step": 486055, "epoch": 5856} {"train_loss": -26.576648712158203, "global_step": 486056, "epoch": 5856} {"train_loss": -26.449268341064453, "global_step": 486057, "epoch": 5856} {"train_loss": -26.401357650756836, "global_step": 486058, "epoch": 5856} {"train_loss": -26.258813858032227, "global_step": 486059, "epoch": 5856} {"train_loss": -26.409748077392578, "global_step": 486060, "epoch": 5856} {"train_loss": -26.721271514892578, "global_step": 486061, "epoch": 5856} {"train_loss": -26.61102867126465, "global_step": 486062, "epoch": 5856} {"train_loss": -26.716833114624023, "global_step": 486063, "epoch": 5856} {"train_loss": -26.516727447509766, "global_step": 486064, "epoch": 5856} {"train_loss": -26.36628532409668, "global_step": 486065, "epoch": 5856} {"train_loss": -26.73065185546875, "global_step": 486066, "epoch": 5856} {"train_loss": -26.523136138916016, "global_step": 486067, "epoch": 5856} {"train_loss": -26.55280876159668, "global_step": 486068, "epoch": 5856} {"train_loss": -26.80225944519043, "global_step": 486069, "epoch": 5856} {"train_loss": -26.886343002319336, "global_step": 486070, "epoch": 5856} {"train_loss": -26.656301498413086, "global_step": 486071, "epoch": 5856} {"train_loss": -26.872182846069336, "global_step": 486072, "epoch": 5856} {"train_loss": -27.006139755249023, "global_step": 486073, "epoch": 5856} {"train_loss": -26.908355712890625, "global_step": 486074, "epoch": 5856} {"train_loss": -27.051023483276367, "global_step": 486075, "epoch": 5856} {"train_loss": -26.959707260131836, "global_step": 486076, "epoch": 5856} {"train_loss": -26.828031539916992, "global_step": 486077, "epoch": 5856} {"train_loss": -27.468297958374023, "global_step": 486078, "epoch": 5856} {"train_loss": -26.9033260345459, "global_step": 486079, "epoch": 5856} {"train_loss": -26.97706413269043, "global_step": 486080, "epoch": 5856} {"train_loss": -27.06842041015625, "global_step": 486081, "epoch": 5856} {"train_loss": -26.99432945251465, "global_step": 486082, "epoch": 5856} {"train_loss": -26.911291122436523, "global_step": 486083, "epoch": 5856} {"train_loss": -26.951507568359375, "global_step": 486084, "epoch": 5856} {"train_loss": -27.24640464782715, "global_step": 486085, "epoch": 5856} {"train_loss": -27.001789093017578, "global_step": 486086, "epoch": 5856} {"train_loss": -27.378625869750977, "global_step": 486087, "epoch": 5856} {"train_loss": -27.1938533782959, "global_step": 486088, "epoch": 5856} {"train_loss": -27.171234130859375, "global_step": 486089, "epoch": 5856} {"train_loss": -27.474227905273438, "global_step": 486090, "epoch": 5856} {"train_loss": -26.989948272705078, "global_step": 486091, "epoch": 5856} {"train_loss": -27.59726333618164, "global_step": 486092, "epoch": 5856} {"train_loss": -27.20404052734375, "global_step": 486093, "epoch": 5856} {"train_loss": -27.28436851501465, "global_step": 486094, "epoch": 5856} {"train_loss": -27.341129302978516, "global_step": 486095, "epoch": 5856} {"train_loss": -27.52555274963379, "global_step": 486096, "epoch": 5856} {"train_loss": -27.223724365234375, "global_step": 486097, "epoch": 5856} {"train_loss": -27.34769630432129, "global_step": 486098, "epoch": 5856} {"train_loss": -27.723468780517578, "global_step": 486099, "epoch": 5856} {"train_loss": -27.002294540405273, "global_step": 486100, "epoch": 5856} {"train_loss": -27.430341720581055, "global_step": 486101, "epoch": 5856} {"train_loss": -27.428197860717773, "global_step": 486102, "epoch": 5856} {"train_loss": -27.51837158203125, "global_step": 486103, "epoch": 5856} {"train_loss": -27.376392364501953, "global_step": 486104, "epoch": 5856} {"train_loss": -27.62483024597168, "global_step": 486105, "epoch": 5856} {"train_loss": -27.25726318359375, "global_step": 486106, "epoch": 5856} {"train_loss": -27.3359317779541, "global_step": 486107, "epoch": 5856} {"train_loss": -27.412717819213867, "global_step": 486108, "epoch": 5856} {"train_loss": -27.595081329345703, "global_step": 486109, "epoch": 5856} {"train_loss": -27.39458656311035, "global_step": 486110, "epoch": 5856} {"train_loss": -27.367752075195312, "global_step": 486111, "epoch": 5856} {"train_loss": -27.33111000061035, "global_step": 486112, "epoch": 5856} {"train_loss": -27.716815948486328, "global_step": 486113, "epoch": 5856} {"train_loss": -27.615070343017578, "global_step": 486114, "epoch": 5856} {"train_loss": -28.120054244995117, "global_step": 486115, "epoch": 5856} {"train_loss": -27.5750789642334, "global_step": 486116, "epoch": 5856} {"train_loss": -27.378925323486328, "global_step": 486117, "epoch": 5856} {"train_loss": -27.63164710998535, "global_step": 486118, "epoch": 5856} {"train_loss": -27.34466552734375, "global_step": 486119, "epoch": 5856} {"train_loss": -27.486780166625977, "global_step": 486120, "epoch": 5856} {"train_loss": -27.599796295166016, "global_step": 486121, "epoch": 5856} {"train_loss": -27.242938995361328, "global_step": 486122, "epoch": 5856} {"train_loss": -27.361425399780273, "global_step": 486123, "epoch": 5856} {"train_loss": -27.341461181640625, "global_step": 486124, "epoch": 5856} {"train_loss": -27.744537353515625, "global_step": 486125, "epoch": 5856} {"train_loss": -27.277191162109375, "global_step": 486126, "epoch": 5856} {"train_loss": -27.379011154174805, "global_step": 486127, "epoch": 5856} {"train_loss": -27.284088134765625, "global_step": 486128, "epoch": 5856} {"train_loss": -27.15607261657715, "global_step": 486129, "epoch": 5856} {"train_loss": -26.988457852099316, "global_step": 486130, "epoch": 5856, "val_loss": 6532722.5} {"train_loss": -26.363515853881836, "global_step": 486131, "epoch": 5857} {"train_loss": -26.08284568786621, "global_step": 486132, "epoch": 5857} {"train_loss": -26.384008407592773, "global_step": 486133, "epoch": 5857} {"train_loss": -26.903095245361328, "global_step": 486134, "epoch": 5857} {"train_loss": -26.616682052612305, "global_step": 486135, "epoch": 5857} {"train_loss": -26.943084716796875, "global_step": 486136, "epoch": 5857} {"train_loss": -27.257495880126953, "global_step": 486137, "epoch": 5857} {"train_loss": -26.959918975830078, "global_step": 486138, "epoch": 5857} {"train_loss": -27.0584716796875, "global_step": 486139, "epoch": 5857} {"train_loss": -26.69189453125, "global_step": 486140, "epoch": 5857} {"train_loss": -27.2043514251709, "global_step": 486141, "epoch": 5857} {"train_loss": -26.98677635192871, "global_step": 486142, "epoch": 5857} {"train_loss": -27.0444393157959, "global_step": 486143, "epoch": 5857} {"train_loss": -26.412429809570312, "global_step": 486144, "epoch": 5857} {"train_loss": -27.05933952331543, "global_step": 486145, "epoch": 5857} {"train_loss": -26.55712890625, "global_step": 486146, "epoch": 5857} {"train_loss": -27.1336612701416, "global_step": 486147, "epoch": 5857} {"train_loss": -27.055072784423828, "global_step": 486148, "epoch": 5857} {"train_loss": -27.1546630859375, "global_step": 486149, "epoch": 5857} {"train_loss": -26.77167320251465, "global_step": 486150, "epoch": 5857} {"train_loss": -27.38374137878418, "global_step": 486151, "epoch": 5857} {"train_loss": -27.128503799438477, "global_step": 486152, "epoch": 5857} {"train_loss": -27.40291404724121, "global_step": 486153, "epoch": 5857} {"train_loss": -27.184371948242188, "global_step": 486154, "epoch": 5857} {"train_loss": -27.179059982299805, "global_step": 486155, "epoch": 5857} {"train_loss": -27.25508689880371, "global_step": 486156, "epoch": 5857} {"train_loss": -27.131839752197266, "global_step": 486157, "epoch": 5857} {"train_loss": -27.477643966674805, "global_step": 486158, "epoch": 5857} {"train_loss": -27.25178337097168, "global_step": 486159, "epoch": 5857} {"train_loss": -27.036142349243164, "global_step": 486160, "epoch": 5857} {"train_loss": -27.045520782470703, "global_step": 486161, "epoch": 5857} {"train_loss": -26.93206214904785, "global_step": 486162, "epoch": 5857} {"train_loss": -27.227680206298828, "global_step": 486163, "epoch": 5857} {"train_loss": -27.051406860351562, "global_step": 486164, "epoch": 5857} {"train_loss": -26.846662521362305, "global_step": 486165, "epoch": 5857} {"train_loss": -27.13593864440918, "global_step": 486166, "epoch": 5857} {"train_loss": -27.480194091796875, "global_step": 486167, "epoch": 5857} {"train_loss": -27.320600509643555, "global_step": 486168, "epoch": 5857} {"train_loss": -27.68060874938965, "global_step": 486169, "epoch": 5857} {"train_loss": -27.510095596313477, "global_step": 486170, "epoch": 5857} {"train_loss": -27.415210723876953, "global_step": 486171, "epoch": 5857} {"train_loss": -27.064727783203125, "global_step": 486172, "epoch": 5857} {"train_loss": -27.50824546813965, "global_step": 486173, "epoch": 5857} {"train_loss": -27.512195587158203, "global_step": 486174, "epoch": 5857} {"train_loss": -27.40753173828125, "global_step": 486175, "epoch": 5857} {"train_loss": -27.266937255859375, "global_step": 486176, "epoch": 5857} {"train_loss": -27.353076934814453, "global_step": 486177, "epoch": 5857} {"train_loss": -27.235870361328125, "global_step": 486178, "epoch": 5857} {"train_loss": -27.22218132019043, "global_step": 486179, "epoch": 5857} {"train_loss": -27.193103790283203, "global_step": 486180, "epoch": 5857} {"train_loss": -27.26374626159668, "global_step": 486181, "epoch": 5857} {"train_loss": -27.468839645385742, "global_step": 486182, "epoch": 5857} {"train_loss": -26.8361759185791, "global_step": 486183, "epoch": 5857} {"train_loss": -27.28291130065918, "global_step": 486184, "epoch": 5857} {"train_loss": -27.425085067749023, "global_step": 486185, "epoch": 5857} {"train_loss": -27.412931442260742, "global_step": 486186, "epoch": 5857} {"train_loss": -27.491119384765625, "global_step": 486187, "epoch": 5857} {"train_loss": -27.29353141784668, "global_step": 486188, "epoch": 5857} {"train_loss": -27.37282371520996, "global_step": 486189, "epoch": 5857} {"train_loss": -27.737939834594727, "global_step": 486190, "epoch": 5857} {"train_loss": -27.33351707458496, "global_step": 486191, "epoch": 5857} {"train_loss": -27.503320693969727, "global_step": 486192, "epoch": 5857} {"train_loss": -27.246450424194336, "global_step": 486193, "epoch": 5857} {"train_loss": -27.4049015045166, "global_step": 486194, "epoch": 5857} {"train_loss": -27.317411422729492, "global_step": 486195, "epoch": 5857} {"train_loss": -27.632465362548828, "global_step": 486196, "epoch": 5857} {"train_loss": -27.566492080688477, "global_step": 486197, "epoch": 5857} {"train_loss": -27.318037033081055, "global_step": 486198, "epoch": 5857} {"train_loss": -27.64453125, "global_step": 486199, "epoch": 5857} {"train_loss": -27.368799209594727, "global_step": 486200, "epoch": 5857} {"train_loss": -27.360742568969727, "global_step": 486201, "epoch": 5857} {"train_loss": -27.414831161499023, "global_step": 486202, "epoch": 5857} {"train_loss": -27.53128433227539, "global_step": 486203, "epoch": 5857} {"train_loss": -27.624475479125977, "global_step": 486204, "epoch": 5857} {"train_loss": -27.737268447875977, "global_step": 486205, "epoch": 5857} {"train_loss": -26.783811569213867, "global_step": 486206, "epoch": 5857} {"train_loss": -26.505929946899414, "global_step": 486207, "epoch": 5857} {"train_loss": -26.202600479125977, "global_step": 486208, "epoch": 5857} {"train_loss": -27.079736709594727, "global_step": 486209, "epoch": 5857} {"train_loss": -26.841888427734375, "global_step": 486210, "epoch": 5857} {"train_loss": -26.898733139038086, "global_step": 486211, "epoch": 5857} {"train_loss": -26.75699806213379, "global_step": 486212, "epoch": 5857} {"train_loss": -27.16486167907715, "global_step": 486213, "epoch": 5857, "val_loss": 6536444.0} {"train_loss": -25.89237403869629, "global_step": 486214, "epoch": 5858} {"train_loss": -25.662275314331055, "global_step": 486215, "epoch": 5858} {"train_loss": -26.884313583374023, "global_step": 486216, "epoch": 5858} {"train_loss": -25.59047508239746, "global_step": 486217, "epoch": 5858} {"train_loss": -25.978092193603516, "global_step": 486218, "epoch": 5858} {"train_loss": -26.79559326171875, "global_step": 486219, "epoch": 5858} {"train_loss": -25.887805938720703, "global_step": 486220, "epoch": 5858} {"train_loss": -26.85223388671875, "global_step": 486221, "epoch": 5858} {"train_loss": -26.22490882873535, "global_step": 486222, "epoch": 5858} {"train_loss": -26.4334659576416, "global_step": 486223, "epoch": 5858} {"train_loss": -26.633935928344727, "global_step": 486224, "epoch": 5858} {"train_loss": -26.855606079101562, "global_step": 486225, "epoch": 5858} {"train_loss": -26.985815048217773, "global_step": 486226, "epoch": 5858} {"train_loss": -26.764204025268555, "global_step": 486227, "epoch": 5858} {"train_loss": -26.741363525390625, "global_step": 486228, "epoch": 5858} {"train_loss": -26.940322875976562, "global_step": 486229, "epoch": 5858} {"train_loss": -27.255237579345703, "global_step": 486230, "epoch": 5858} {"train_loss": -27.275609970092773, "global_step": 486231, "epoch": 5858} {"train_loss": -27.699539184570312, "global_step": 486232, "epoch": 5858} {"train_loss": -27.390079498291016, "global_step": 486233, "epoch": 5858} {"train_loss": -26.8040828704834, "global_step": 486234, "epoch": 5858} {"train_loss": -26.8358154296875, "global_step": 486235, "epoch": 5858} {"train_loss": -27.460294723510742, "global_step": 486236, "epoch": 5858} {"train_loss": -27.14052391052246, "global_step": 486237, "epoch": 5858} {"train_loss": -26.963964462280273, "global_step": 486238, "epoch": 5858} {"train_loss": -27.338220596313477, "global_step": 486239, "epoch": 5858} {"train_loss": -27.377685546875, "global_step": 486240, "epoch": 5858} {"train_loss": -27.080371856689453, "global_step": 486241, "epoch": 5858} {"train_loss": -27.12672233581543, "global_step": 486242, "epoch": 5858} {"train_loss": -27.44014549255371, "global_step": 486243, "epoch": 5858} {"train_loss": -26.92719078063965, "global_step": 486244, "epoch": 5858} {"train_loss": -27.472692489624023, "global_step": 486245, "epoch": 5858} {"train_loss": -26.92945671081543, "global_step": 486246, "epoch": 5858} {"train_loss": -27.34540367126465, "global_step": 486247, "epoch": 5858} {"train_loss": -26.930078506469727, "global_step": 486248, "epoch": 5858} {"train_loss": -27.421178817749023, "global_step": 486249, "epoch": 5858} {"train_loss": -27.38742446899414, "global_step": 486250, "epoch": 5858} {"train_loss": -27.54554557800293, "global_step": 486251, "epoch": 5858} {"train_loss": -27.5236759185791, "global_step": 486252, "epoch": 5858} {"train_loss": -27.002948760986328, "global_step": 486253, "epoch": 5858} {"train_loss": -27.17905616760254, "global_step": 486254, "epoch": 5858} {"train_loss": -27.54169273376465, "global_step": 486255, "epoch": 5858} {"train_loss": -27.380218505859375, "global_step": 486256, "epoch": 5858} {"train_loss": -27.5017147064209, "global_step": 486257, "epoch": 5858} {"train_loss": -27.42258644104004, "global_step": 486258, "epoch": 5858} {"train_loss": -27.346227645874023, "global_step": 486259, "epoch": 5858} {"train_loss": -27.097166061401367, "global_step": 486260, "epoch": 5858} {"train_loss": -27.425573348999023, "global_step": 486261, "epoch": 5858} {"train_loss": -27.199390411376953, "global_step": 486262, "epoch": 5858} {"train_loss": -27.588098526000977, "global_step": 486263, "epoch": 5858} {"train_loss": -27.6743221282959, "global_step": 486264, "epoch": 5858} {"train_loss": -27.323225021362305, "global_step": 486265, "epoch": 5858} {"train_loss": -27.064289093017578, "global_step": 486266, "epoch": 5858} {"train_loss": -27.33953285217285, "global_step": 486267, "epoch": 5858} {"train_loss": -27.38172721862793, "global_step": 486268, "epoch": 5858} {"train_loss": -27.184417724609375, "global_step": 486269, "epoch": 5858} {"train_loss": -27.112802505493164, "global_step": 486270, "epoch": 5858} {"train_loss": -27.446802139282227, "global_step": 486271, "epoch": 5858} {"train_loss": -27.46225929260254, "global_step": 486272, "epoch": 5858} {"train_loss": -27.291702270507812, "global_step": 486273, "epoch": 5858} {"train_loss": -26.99261474609375, "global_step": 486274, "epoch": 5858} {"train_loss": -27.629125595092773, "global_step": 486275, "epoch": 5858} {"train_loss": -27.510223388671875, "global_step": 486276, "epoch": 5858} {"train_loss": -27.40115737915039, "global_step": 486277, "epoch": 5858} {"train_loss": -27.30170249938965, "global_step": 486278, "epoch": 5858} {"train_loss": -27.309326171875, "global_step": 486279, "epoch": 5858} {"train_loss": -27.445783615112305, "global_step": 486280, "epoch": 5858} {"train_loss": -27.485828399658203, "global_step": 486281, "epoch": 5858} {"train_loss": -27.604862213134766, "global_step": 486282, "epoch": 5858} {"train_loss": -27.225296020507812, "global_step": 486283, "epoch": 5858} {"train_loss": -27.622411727905273, "global_step": 486284, "epoch": 5858} {"train_loss": -27.57459831237793, "global_step": 486285, "epoch": 5858} {"train_loss": -27.447528839111328, "global_step": 486286, "epoch": 5858} {"train_loss": -27.119619369506836, "global_step": 486287, "epoch": 5858} {"train_loss": -27.35812759399414, "global_step": 486288, "epoch": 5858} {"train_loss": -27.45340919494629, "global_step": 486289, "epoch": 5858} {"train_loss": -27.36671257019043, "global_step": 486290, "epoch": 5858} {"train_loss": -27.51785659790039, "global_step": 486291, "epoch": 5858} {"train_loss": -27.539154052734375, "global_step": 486292, "epoch": 5858} {"train_loss": -27.66813087463379, "global_step": 486293, "epoch": 5858} {"train_loss": -27.311431884765625, "global_step": 486294, "epoch": 5858} {"train_loss": -27.183094024658203, "global_step": 486295, "epoch": 5858} {"train_loss": -27.149406341185053, "global_step": 486296, "epoch": 5858, "val_loss": 6533218.0} {"train_loss": -26.934301376342773, "global_step": 486297, "epoch": 5859} {"train_loss": -26.94898796081543, "global_step": 486298, "epoch": 5859} {"train_loss": -26.0395450592041, "global_step": 486299, "epoch": 5859} {"train_loss": -26.542118072509766, "global_step": 486300, "epoch": 5859} {"train_loss": -26.727294921875, "global_step": 486301, "epoch": 5859} {"train_loss": -26.78875732421875, "global_step": 486302, "epoch": 5859} {"train_loss": -26.5629825592041, "global_step": 486303, "epoch": 5859} {"train_loss": -26.52335548400879, "global_step": 486304, "epoch": 5859} {"train_loss": -27.004470825195312, "global_step": 486305, "epoch": 5859} {"train_loss": -26.723066329956055, "global_step": 486306, "epoch": 5859} {"train_loss": -26.669641494750977, "global_step": 486307, "epoch": 5859} {"train_loss": -26.748615264892578, "global_step": 486308, "epoch": 5859} {"train_loss": -26.89723014831543, "global_step": 486309, "epoch": 5859} {"train_loss": -26.977319717407227, "global_step": 486310, "epoch": 5859} {"train_loss": -27.063512802124023, "global_step": 486311, "epoch": 5859} {"train_loss": -27.06380271911621, "global_step": 486312, "epoch": 5859} {"train_loss": -27.360769271850586, "global_step": 486313, "epoch": 5859} {"train_loss": -26.709381103515625, "global_step": 486314, "epoch": 5859} {"train_loss": -27.10735511779785, "global_step": 486315, "epoch": 5859} {"train_loss": -27.195419311523438, "global_step": 486316, "epoch": 5859} {"train_loss": -27.186782836914062, "global_step": 486317, "epoch": 5859} {"train_loss": -27.356098175048828, "global_step": 486318, "epoch": 5859} {"train_loss": -26.94111442565918, "global_step": 486319, "epoch": 5859} {"train_loss": -27.079090118408203, "global_step": 486320, "epoch": 5859} {"train_loss": -27.03814697265625, "global_step": 486321, "epoch": 5859} {"train_loss": -27.072269439697266, "global_step": 486322, "epoch": 5859} {"train_loss": -27.102558135986328, "global_step": 486323, "epoch": 5859} {"train_loss": -27.734851837158203, "global_step": 486324, "epoch": 5859} {"train_loss": -27.231876373291016, "global_step": 486325, "epoch": 5859} {"train_loss": -27.8619384765625, "global_step": 486326, "epoch": 5859} {"train_loss": -27.168975830078125, "global_step": 486327, "epoch": 5859} {"train_loss": -27.82830238342285, "global_step": 486328, "epoch": 5859} {"train_loss": -27.216222763061523, "global_step": 486329, "epoch": 5859} {"train_loss": -27.585895538330078, "global_step": 486330, "epoch": 5859} {"train_loss": -27.504682540893555, "global_step": 486331, "epoch": 5859} {"train_loss": -27.322229385375977, "global_step": 486332, "epoch": 5859} {"train_loss": -27.64443016052246, "global_step": 486333, "epoch": 5859} {"train_loss": -27.471389770507812, "global_step": 486334, "epoch": 5859} {"train_loss": -27.369176864624023, "global_step": 486335, "epoch": 5859} {"train_loss": -27.656835556030273, "global_step": 486336, "epoch": 5859} {"train_loss": -27.554304122924805, "global_step": 486337, "epoch": 5859} {"train_loss": -27.389484405517578, "global_step": 486338, "epoch": 5859} {"train_loss": -27.50472068786621, "global_step": 486339, "epoch": 5859} {"train_loss": -27.04096031188965, "global_step": 486340, "epoch": 5859} {"train_loss": -27.859832763671875, "global_step": 486341, "epoch": 5859} {"train_loss": -27.294885635375977, "global_step": 486342, "epoch": 5859} {"train_loss": -27.69351577758789, "global_step": 486343, "epoch": 5859} {"train_loss": -27.11163330078125, "global_step": 486344, "epoch": 5859} {"train_loss": -27.292316436767578, "global_step": 486345, "epoch": 5859} {"train_loss": -27.109827041625977, "global_step": 486346, "epoch": 5859} {"train_loss": -27.33534812927246, "global_step": 486347, "epoch": 5859} {"train_loss": -27.43537712097168, "global_step": 486348, "epoch": 5859} {"train_loss": -27.341812133789062, "global_step": 486349, "epoch": 5859} {"train_loss": -27.236722946166992, "global_step": 486350, "epoch": 5859} {"train_loss": -27.594247817993164, "global_step": 486351, "epoch": 5859} {"train_loss": -27.2386474609375, "global_step": 486352, "epoch": 5859} {"train_loss": -27.577625274658203, "global_step": 486353, "epoch": 5859} {"train_loss": -27.562482833862305, "global_step": 486354, "epoch": 5859} {"train_loss": -27.451757431030273, "global_step": 486355, "epoch": 5859} {"train_loss": -27.797870635986328, "global_step": 486356, "epoch": 5859} {"train_loss": -27.57545280456543, "global_step": 486357, "epoch": 5859} {"train_loss": -27.719573974609375, "global_step": 486358, "epoch": 5859} {"train_loss": -27.174930572509766, "global_step": 486359, "epoch": 5859} {"train_loss": -27.44998550415039, "global_step": 486360, "epoch": 5859} {"train_loss": -27.556564331054688, "global_step": 486361, "epoch": 5859} {"train_loss": -27.361316680908203, "global_step": 486362, "epoch": 5859} {"train_loss": -27.661962509155273, "global_step": 486363, "epoch": 5859} {"train_loss": -26.98090934753418, "global_step": 486364, "epoch": 5859} {"train_loss": -27.480243682861328, "global_step": 486365, "epoch": 5859} {"train_loss": -26.970075607299805, "global_step": 486366, "epoch": 5859} {"train_loss": -27.375385284423828, "global_step": 486367, "epoch": 5859} {"train_loss": -27.3991641998291, "global_step": 486368, "epoch": 5859} {"train_loss": -27.499893188476562, "global_step": 486369, "epoch": 5859} {"train_loss": -26.90677833557129, "global_step": 486370, "epoch": 5859} {"train_loss": -27.206790924072266, "global_step": 486371, "epoch": 5859} {"train_loss": -26.948474884033203, "global_step": 486372, "epoch": 5859} {"train_loss": -27.24373435974121, "global_step": 486373, "epoch": 5859} {"train_loss": -27.014257431030273, "global_step": 486374, "epoch": 5859} {"train_loss": -27.47165870666504, "global_step": 486375, "epoch": 5859} {"train_loss": -26.960372924804688, "global_step": 486376, "epoch": 5859} {"train_loss": -27.262800216674805, "global_step": 486377, "epoch": 5859} {"train_loss": -27.40423583984375, "global_step": 486378, "epoch": 5859} {"train_loss": -27.24857086733163, "global_step": 486379, "epoch": 5859, "val_loss": 6525132.0} {"train_loss": -26.875080108642578, "global_step": 486380, "epoch": 5860} {"train_loss": -26.874252319335938, "global_step": 486381, "epoch": 5860} {"train_loss": -26.68670082092285, "global_step": 486382, "epoch": 5860} {"train_loss": -26.76710319519043, "global_step": 486383, "epoch": 5860} {"train_loss": -27.198511123657227, "global_step": 486384, "epoch": 5860} {"train_loss": -26.80598258972168, "global_step": 486385, "epoch": 5860} {"train_loss": -26.739660263061523, "global_step": 486386, "epoch": 5860} {"train_loss": -26.885663986206055, "global_step": 486387, "epoch": 5860} {"train_loss": -27.129291534423828, "global_step": 486388, "epoch": 5860} {"train_loss": -26.95319175720215, "global_step": 486389, "epoch": 5860} {"train_loss": -26.98078727722168, "global_step": 486390, "epoch": 5860} {"train_loss": -27.324783325195312, "global_step": 486391, "epoch": 5860} {"train_loss": -27.28522300720215, "global_step": 486392, "epoch": 5860} {"train_loss": -27.32132911682129, "global_step": 486393, "epoch": 5860} {"train_loss": -27.189472198486328, "global_step": 486394, "epoch": 5860} {"train_loss": -27.267292022705078, "global_step": 486395, "epoch": 5860} {"train_loss": -27.09966468811035, "global_step": 486396, "epoch": 5860} {"train_loss": -27.231128692626953, "global_step": 486397, "epoch": 5860} {"train_loss": -27.15266227722168, "global_step": 486398, "epoch": 5860} {"train_loss": -27.251678466796875, "global_step": 486399, "epoch": 5860} {"train_loss": -27.28147315979004, "global_step": 486400, "epoch": 5860} {"train_loss": -27.34284782409668, "global_step": 486401, "epoch": 5860} {"train_loss": -27.130029678344727, "global_step": 486402, "epoch": 5860} {"train_loss": -27.24287986755371, "global_step": 486403, "epoch": 5860} {"train_loss": -27.4328670501709, "global_step": 486404, "epoch": 5860} {"train_loss": -27.328413009643555, "global_step": 486405, "epoch": 5860} {"train_loss": -27.417118072509766, "global_step": 486406, "epoch": 5860} {"train_loss": -26.94998550415039, "global_step": 486407, "epoch": 5860} {"train_loss": -27.23774528503418, "global_step": 486408, "epoch": 5860} {"train_loss": -27.536008834838867, "global_step": 486409, "epoch": 5860} {"train_loss": -27.24553871154785, "global_step": 486410, "epoch": 5860} {"train_loss": -27.360187530517578, "global_step": 486411, "epoch": 5860} {"train_loss": -27.22357749938965, "global_step": 486412, "epoch": 5860} {"train_loss": -27.133310317993164, "global_step": 486413, "epoch": 5860} {"train_loss": -27.38248062133789, "global_step": 486414, "epoch": 5860} {"train_loss": -26.832921981811523, "global_step": 486415, "epoch": 5860} {"train_loss": -27.323352813720703, "global_step": 486416, "epoch": 5860} {"train_loss": -27.31892967224121, "global_step": 486417, "epoch": 5860} {"train_loss": -27.21754264831543, "global_step": 486418, "epoch": 5860} {"train_loss": -27.660425186157227, "global_step": 486419, "epoch": 5860} {"train_loss": -27.376012802124023, "global_step": 486420, "epoch": 5860} {"train_loss": -27.365009307861328, "global_step": 486421, "epoch": 5860} {"train_loss": -26.955739974975586, "global_step": 486422, "epoch": 5860} {"train_loss": -27.152795791625977, "global_step": 486423, "epoch": 5860} {"train_loss": -27.25739097595215, "global_step": 486424, "epoch": 5860} {"train_loss": -27.315820693969727, "global_step": 486425, "epoch": 5860} {"train_loss": -27.337682723999023, "global_step": 486426, "epoch": 5860} {"train_loss": -27.421239852905273, "global_step": 486427, "epoch": 5860} {"train_loss": -27.721593856811523, "global_step": 486428, "epoch": 5860} {"train_loss": -27.003202438354492, "global_step": 486429, "epoch": 5860} {"train_loss": -26.650257110595703, "global_step": 486430, "epoch": 5860} {"train_loss": -27.339263916015625, "global_step": 486431, "epoch": 5860} {"train_loss": -27.51580238342285, "global_step": 486432, "epoch": 5860} {"train_loss": -27.063013076782227, "global_step": 486433, "epoch": 5860} {"train_loss": -27.548526763916016, "global_step": 486434, "epoch": 5860} {"train_loss": -27.321929931640625, "global_step": 486435, "epoch": 5860} {"train_loss": -27.5633544921875, "global_step": 486436, "epoch": 5860} {"train_loss": -27.102025985717773, "global_step": 486437, "epoch": 5860} {"train_loss": -27.674482345581055, "global_step": 486438, "epoch": 5860} {"train_loss": -27.27851676940918, "global_step": 486439, "epoch": 5860} {"train_loss": -27.42548942565918, "global_step": 486440, "epoch": 5860} {"train_loss": -27.49257469177246, "global_step": 486441, "epoch": 5860} {"train_loss": -27.580739974975586, "global_step": 486442, "epoch": 5860} {"train_loss": -27.73626136779785, "global_step": 486443, "epoch": 5860} {"train_loss": -27.625320434570312, "global_step": 486444, "epoch": 5860} {"train_loss": -27.41888427734375, "global_step": 486445, "epoch": 5860} {"train_loss": -27.681447982788086, "global_step": 486446, "epoch": 5860} {"train_loss": -27.346044540405273, "global_step": 486447, "epoch": 5860} {"train_loss": -27.135541915893555, "global_step": 486448, "epoch": 5860} {"train_loss": -26.837064743041992, "global_step": 486449, "epoch": 5860} {"train_loss": -27.620532989501953, "global_step": 486450, "epoch": 5860} {"train_loss": -27.226154327392578, "global_step": 486451, "epoch": 5860} {"train_loss": -27.25887107849121, "global_step": 486452, "epoch": 5860} {"train_loss": -27.0499324798584, "global_step": 486453, "epoch": 5860} {"train_loss": -27.1731014251709, "global_step": 486454, "epoch": 5860} {"train_loss": -27.49114990234375, "global_step": 486455, "epoch": 5860} {"train_loss": -26.955137252807617, "global_step": 486456, "epoch": 5860} {"train_loss": -27.52886390686035, "global_step": 486457, "epoch": 5860} {"train_loss": -27.187702178955078, "global_step": 486458, "epoch": 5860} {"train_loss": -27.034292221069336, "global_step": 486459, "epoch": 5860} {"train_loss": -26.988195419311523, "global_step": 486460, "epoch": 5860} {"train_loss": -27.436817169189453, "global_step": 486461, "epoch": 5860} {"train_loss": -27.247964813048583, "global_step": 486462, "epoch": 5860, "val_loss": 6481470.0} {"train_loss": -27.187490463256836, "global_step": 486463, "epoch": 5861} {"train_loss": -26.586322784423828, "global_step": 486464, "epoch": 5861} {"train_loss": -26.575448989868164, "global_step": 486465, "epoch": 5861} {"train_loss": -26.572452545166016, "global_step": 486466, "epoch": 5861} {"train_loss": -26.484663009643555, "global_step": 486467, "epoch": 5861} {"train_loss": -26.64011001586914, "global_step": 486468, "epoch": 5861} {"train_loss": -26.9410457611084, "global_step": 486469, "epoch": 5861} {"train_loss": -27.186975479125977, "global_step": 486470, "epoch": 5861} {"train_loss": -26.867935180664062, "global_step": 486471, "epoch": 5861} {"train_loss": -27.165231704711914, "global_step": 486472, "epoch": 5861} {"train_loss": -26.89259910583496, "global_step": 486473, "epoch": 5861} {"train_loss": -26.900482177734375, "global_step": 486474, "epoch": 5861} {"train_loss": -26.799396514892578, "global_step": 486475, "epoch": 5861} {"train_loss": -26.980321884155273, "global_step": 486476, "epoch": 5861} {"train_loss": -26.977930068969727, "global_step": 486477, "epoch": 5861} {"train_loss": -27.176538467407227, "global_step": 486478, "epoch": 5861} {"train_loss": -27.20088005065918, "global_step": 486479, "epoch": 5861} {"train_loss": -26.959518432617188, "global_step": 486480, "epoch": 5861} {"train_loss": -27.179412841796875, "global_step": 486481, "epoch": 5861} {"train_loss": -27.279844284057617, "global_step": 486482, "epoch": 5861} {"train_loss": -26.852148056030273, "global_step": 486483, "epoch": 5861} {"train_loss": -27.393415451049805, "global_step": 486484, "epoch": 5861} {"train_loss": -27.210342407226562, "global_step": 486485, "epoch": 5861} {"train_loss": -27.65606117248535, "global_step": 486486, "epoch": 5861} {"train_loss": -27.35845375061035, "global_step": 486487, "epoch": 5861} {"train_loss": -27.56659507751465, "global_step": 486488, "epoch": 5861} {"train_loss": -27.662744522094727, "global_step": 486489, "epoch": 5861} {"train_loss": -27.517242431640625, "global_step": 486490, "epoch": 5861} {"train_loss": -27.14353370666504, "global_step": 486491, "epoch": 5861} {"train_loss": -27.43914794921875, "global_step": 486492, "epoch": 5861} {"train_loss": -27.541980743408203, "global_step": 486493, "epoch": 5861} {"train_loss": -27.31049919128418, "global_step": 486494, "epoch": 5861} {"train_loss": -27.358062744140625, "global_step": 486495, "epoch": 5861} {"train_loss": -27.2762508392334, "global_step": 486496, "epoch": 5861} {"train_loss": -27.588520050048828, "global_step": 486497, "epoch": 5861} {"train_loss": -27.41798210144043, "global_step": 486498, "epoch": 5861} {"train_loss": -27.1865234375, "global_step": 486499, "epoch": 5861} {"train_loss": -26.96673583984375, "global_step": 486500, "epoch": 5861} {"train_loss": -26.882654190063477, "global_step": 486501, "epoch": 5861} {"train_loss": -27.7254638671875, "global_step": 486502, "epoch": 5861} {"train_loss": -27.723371505737305, "global_step": 486503, "epoch": 5861} {"train_loss": -27.35968017578125, "global_step": 486504, "epoch": 5861} {"train_loss": -27.186695098876953, "global_step": 486505, "epoch": 5861} {"train_loss": -27.322101593017578, "global_step": 486506, "epoch": 5861} {"train_loss": -27.30535888671875, "global_step": 486507, "epoch": 5861} {"train_loss": -27.415327072143555, "global_step": 486508, "epoch": 5861} {"train_loss": -27.325519561767578, "global_step": 486509, "epoch": 5861} {"train_loss": -27.494937896728516, "global_step": 486510, "epoch": 5861} {"train_loss": -27.297164916992188, "global_step": 486511, "epoch": 5861} {"train_loss": -27.856836318969727, "global_step": 486512, "epoch": 5861} {"train_loss": -27.464658737182617, "global_step": 486513, "epoch": 5861} {"train_loss": -27.3723087310791, "global_step": 486514, "epoch": 5861} {"train_loss": -27.38459587097168, "global_step": 486515, "epoch": 5861} {"train_loss": -27.22568130493164, "global_step": 486516, "epoch": 5861} {"train_loss": -27.3109188079834, "global_step": 486517, "epoch": 5861} {"train_loss": -26.623868942260742, "global_step": 486518, "epoch": 5861} {"train_loss": -26.014026641845703, "global_step": 486519, "epoch": 5861} {"train_loss": -25.945722579956055, "global_step": 486520, "epoch": 5861} {"train_loss": -26.71235466003418, "global_step": 486521, "epoch": 5861} {"train_loss": -27.0116024017334, "global_step": 486522, "epoch": 5861} {"train_loss": -27.058897018432617, "global_step": 486523, "epoch": 5861} {"train_loss": -26.990936279296875, "global_step": 486524, "epoch": 5861} {"train_loss": -26.929853439331055, "global_step": 486525, "epoch": 5861} {"train_loss": -27.0167236328125, "global_step": 486526, "epoch": 5861} {"train_loss": -26.955169677734375, "global_step": 486527, "epoch": 5861} {"train_loss": -26.805978775024414, "global_step": 486528, "epoch": 5861} {"train_loss": -26.979734420776367, "global_step": 486529, "epoch": 5861} {"train_loss": -27.394800186157227, "global_step": 486530, "epoch": 5861} {"train_loss": -26.858264923095703, "global_step": 486531, "epoch": 5861} {"train_loss": -26.768537521362305, "global_step": 486532, "epoch": 5861} {"train_loss": -26.734113693237305, "global_step": 486533, "epoch": 5861} {"train_loss": -26.939197540283203, "global_step": 486534, "epoch": 5861} {"train_loss": -27.317895889282227, "global_step": 486535, "epoch": 5861} {"train_loss": -27.431333541870117, "global_step": 486536, "epoch": 5861} {"train_loss": -27.040283203125, "global_step": 486537, "epoch": 5861} {"train_loss": -27.143014907836914, "global_step": 486538, "epoch": 5861} {"train_loss": -26.921899795532227, "global_step": 486539, "epoch": 5861} {"train_loss": -27.004962921142578, "global_step": 486540, "epoch": 5861} {"train_loss": -27.133838653564453, "global_step": 486541, "epoch": 5861} {"train_loss": -27.289779663085938, "global_step": 486542, "epoch": 5861} {"train_loss": -26.701929092407227, "global_step": 486543, "epoch": 5861} {"train_loss": -27.281827926635742, "global_step": 486544, "epoch": 5861} {"train_loss": -27.095610699021673, "global_step": 486545, "epoch": 5861, "val_loss": 6498465.0} {"train_loss": -26.001562118530273, "global_step": 486546, "epoch": 5862} {"train_loss": -26.224645614624023, "global_step": 486547, "epoch": 5862} {"train_loss": -26.448062896728516, "global_step": 486548, "epoch": 5862} {"train_loss": -26.160511016845703, "global_step": 486549, "epoch": 5862} {"train_loss": -25.969532012939453, "global_step": 486550, "epoch": 5862} {"train_loss": -26.919300079345703, "global_step": 486551, "epoch": 5862} {"train_loss": -26.784881591796875, "global_step": 486552, "epoch": 5862} {"train_loss": -26.246784210205078, "global_step": 486553, "epoch": 5862} {"train_loss": -27.141347885131836, "global_step": 486554, "epoch": 5862} {"train_loss": -26.425800323486328, "global_step": 486555, "epoch": 5862} {"train_loss": -26.62299919128418, "global_step": 486556, "epoch": 5862} {"train_loss": -26.653167724609375, "global_step": 486557, "epoch": 5862} {"train_loss": -26.891691207885742, "global_step": 486558, "epoch": 5862} {"train_loss": -26.71259880065918, "global_step": 486559, "epoch": 5862} {"train_loss": -26.761533737182617, "global_step": 486560, "epoch": 5862} {"train_loss": -26.809595108032227, "global_step": 486561, "epoch": 5862} {"train_loss": -27.009674072265625, "global_step": 486562, "epoch": 5862} {"train_loss": -26.90833854675293, "global_step": 486563, "epoch": 5862} {"train_loss": -26.968414306640625, "global_step": 486564, "epoch": 5862} {"train_loss": -26.844160079956055, "global_step": 486565, "epoch": 5862} {"train_loss": -26.857229232788086, "global_step": 486566, "epoch": 5862} {"train_loss": -27.066852569580078, "global_step": 486567, "epoch": 5862} {"train_loss": -26.883188247680664, "global_step": 486568, "epoch": 5862} {"train_loss": -27.07840347290039, "global_step": 486569, "epoch": 5862} {"train_loss": -27.218481063842773, "global_step": 486570, "epoch": 5862} {"train_loss": -27.1232967376709, "global_step": 486571, "epoch": 5862} {"train_loss": -26.958417892456055, "global_step": 486572, "epoch": 5862} {"train_loss": -27.27687644958496, "global_step": 486573, "epoch": 5862} {"train_loss": -27.27374267578125, "global_step": 486574, "epoch": 5862} {"train_loss": -27.233102798461914, "global_step": 486575, "epoch": 5862} {"train_loss": -27.060821533203125, "global_step": 486576, "epoch": 5862} {"train_loss": -27.41292381286621, "global_step": 486577, "epoch": 5862} {"train_loss": -27.259845733642578, "global_step": 486578, "epoch": 5862} {"train_loss": -27.284101486206055, "global_step": 486579, "epoch": 5862} {"train_loss": -27.190595626831055, "global_step": 486580, "epoch": 5862} {"train_loss": -27.320173263549805, "global_step": 486581, "epoch": 5862} {"train_loss": -27.15557289123535, "global_step": 486582, "epoch": 5862} {"train_loss": -27.220224380493164, "global_step": 486583, "epoch": 5862} {"train_loss": -27.564666748046875, "global_step": 486584, "epoch": 5862} {"train_loss": -27.516361236572266, "global_step": 486585, "epoch": 5862} {"train_loss": -27.12813377380371, "global_step": 486586, "epoch": 5862} {"train_loss": -27.451292037963867, "global_step": 486587, "epoch": 5862} {"train_loss": -27.32061767578125, "global_step": 486588, "epoch": 5862} {"train_loss": -27.017995834350586, "global_step": 486589, "epoch": 5862} {"train_loss": -27.22052574157715, "global_step": 486590, "epoch": 5862} {"train_loss": -27.350698471069336, "global_step": 486591, "epoch": 5862} {"train_loss": -27.4305362701416, "global_step": 486592, "epoch": 5862} {"train_loss": -27.647811889648438, "global_step": 486593, "epoch": 5862} {"train_loss": -27.545120239257812, "global_step": 486594, "epoch": 5862} {"train_loss": -27.571805953979492, "global_step": 486595, "epoch": 5862} {"train_loss": -27.694971084594727, "global_step": 486596, "epoch": 5862} {"train_loss": -27.532583236694336, "global_step": 486597, "epoch": 5862} {"train_loss": -27.554473876953125, "global_step": 486598, "epoch": 5862} {"train_loss": -27.620397567749023, "global_step": 486599, "epoch": 5862} {"train_loss": -27.66116714477539, "global_step": 486600, "epoch": 5862} {"train_loss": -27.36517333984375, "global_step": 486601, "epoch": 5862} {"train_loss": -27.40546989440918, "global_step": 486602, "epoch": 5862} {"train_loss": -27.592870712280273, "global_step": 486603, "epoch": 5862} {"train_loss": -27.46193504333496, "global_step": 486604, "epoch": 5862} {"train_loss": -27.55177879333496, "global_step": 486605, "epoch": 5862} {"train_loss": -27.849735260009766, "global_step": 486606, "epoch": 5862} {"train_loss": -27.664905548095703, "global_step": 486607, "epoch": 5862} {"train_loss": -27.63237953186035, "global_step": 486608, "epoch": 5862} {"train_loss": -27.620939254760742, "global_step": 486609, "epoch": 5862} {"train_loss": -27.54374122619629, "global_step": 486610, "epoch": 5862} {"train_loss": -27.228200912475586, "global_step": 486611, "epoch": 5862} {"train_loss": -27.614316940307617, "global_step": 486612, "epoch": 5862} {"train_loss": -27.3070011138916, "global_step": 486613, "epoch": 5862} {"train_loss": -27.312265396118164, "global_step": 486614, "epoch": 5862} {"train_loss": -27.11188316345215, "global_step": 486615, "epoch": 5862} {"train_loss": -27.239856719970703, "global_step": 486616, "epoch": 5862} {"train_loss": -27.160465240478516, "global_step": 486617, "epoch": 5862} {"train_loss": -26.526416778564453, "global_step": 486618, "epoch": 5862} {"train_loss": -26.345251083374023, "global_step": 486619, "epoch": 5862} {"train_loss": -25.153705596923828, "global_step": 486620, "epoch": 5862} {"train_loss": -25.381601333618164, "global_step": 486621, "epoch": 5862} {"train_loss": -25.842065811157227, "global_step": 486622, "epoch": 5862} {"train_loss": -26.90030860900879, "global_step": 486623, "epoch": 5862} {"train_loss": -26.617273330688477, "global_step": 486624, "epoch": 5862} {"train_loss": -26.905179977416992, "global_step": 486625, "epoch": 5862} {"train_loss": -27.123279571533203, "global_step": 486626, "epoch": 5862} {"train_loss": -27.22248649597168, "global_step": 486627, "epoch": 5862} {"train_loss": -27.04394708196801, "global_step": 486628, "epoch": 5862, "val_loss": 6555815.0} {"train_loss": -26.4103946685791, "global_step": 486629, "epoch": 5863} {"train_loss": -27.229034423828125, "global_step": 486630, "epoch": 5863} {"train_loss": -26.343280792236328, "global_step": 486631, "epoch": 5863} {"train_loss": -26.790807723999023, "global_step": 486632, "epoch": 5863} {"train_loss": -26.34747886657715, "global_step": 486633, "epoch": 5863} {"train_loss": -26.786651611328125, "global_step": 486634, "epoch": 5863} {"train_loss": -26.549001693725586, "global_step": 486635, "epoch": 5863} {"train_loss": -26.67682456970215, "global_step": 486636, "epoch": 5863} {"train_loss": -26.933795928955078, "global_step": 486637, "epoch": 5863} {"train_loss": -26.841161727905273, "global_step": 486638, "epoch": 5863} {"train_loss": -26.753253936767578, "global_step": 486639, "epoch": 5863} {"train_loss": -27.043577194213867, "global_step": 486640, "epoch": 5863} {"train_loss": -26.522855758666992, "global_step": 486641, "epoch": 5863} {"train_loss": -27.039081573486328, "global_step": 486642, "epoch": 5863} {"train_loss": -27.17823600769043, "global_step": 486643, "epoch": 5863} {"train_loss": -26.917591094970703, "global_step": 486644, "epoch": 5863} {"train_loss": -27.42865562438965, "global_step": 486645, "epoch": 5863} {"train_loss": -27.08746337890625, "global_step": 486646, "epoch": 5863} {"train_loss": -27.1123104095459, "global_step": 486647, "epoch": 5863} {"train_loss": -27.28897476196289, "global_step": 486648, "epoch": 5863} {"train_loss": -26.81422996520996, "global_step": 486649, "epoch": 5863} {"train_loss": -27.04351806640625, "global_step": 486650, "epoch": 5863} {"train_loss": -26.801755905151367, "global_step": 486651, "epoch": 5863} {"train_loss": -27.06947135925293, "global_step": 486652, "epoch": 5863} {"train_loss": -27.19991111755371, "global_step": 486653, "epoch": 5863} {"train_loss": -27.21669578552246, "global_step": 486654, "epoch": 5863} {"train_loss": -27.2054386138916, "global_step": 486655, "epoch": 5863} {"train_loss": -27.093765258789062, "global_step": 486656, "epoch": 5863} {"train_loss": -27.125141143798828, "global_step": 486657, "epoch": 5863} {"train_loss": -27.58786392211914, "global_step": 486658, "epoch": 5863} {"train_loss": -27.481067657470703, "global_step": 486659, "epoch": 5863} {"train_loss": -27.334272384643555, "global_step": 486660, "epoch": 5863} {"train_loss": -26.959745407104492, "global_step": 486661, "epoch": 5863} {"train_loss": -27.392364501953125, "global_step": 486662, "epoch": 5863} {"train_loss": -27.216657638549805, "global_step": 486663, "epoch": 5863} {"train_loss": -27.252485275268555, "global_step": 486664, "epoch": 5863} {"train_loss": -27.34473991394043, "global_step": 486665, "epoch": 5863} {"train_loss": -27.35926628112793, "global_step": 486666, "epoch": 5863} {"train_loss": -27.47812271118164, "global_step": 486667, "epoch": 5863} {"train_loss": -27.437223434448242, "global_step": 486668, "epoch": 5863} {"train_loss": -27.356210708618164, "global_step": 486669, "epoch": 5863} {"train_loss": -27.26766014099121, "global_step": 486670, "epoch": 5863} {"train_loss": -27.493820190429688, "global_step": 486671, "epoch": 5863} {"train_loss": -27.32240867614746, "global_step": 486672, "epoch": 5863} {"train_loss": -27.390771865844727, "global_step": 486673, "epoch": 5863} {"train_loss": -27.59234619140625, "global_step": 486674, "epoch": 5863} {"train_loss": -27.44331932067871, "global_step": 486675, "epoch": 5863} {"train_loss": -27.47796058654785, "global_step": 486676, "epoch": 5863} {"train_loss": -27.4537353515625, "global_step": 486677, "epoch": 5863} {"train_loss": -27.232898712158203, "global_step": 486678, "epoch": 5863} {"train_loss": -27.136798858642578, "global_step": 486679, "epoch": 5863} {"train_loss": -27.417627334594727, "global_step": 486680, "epoch": 5863} {"train_loss": -27.15866470336914, "global_step": 486681, "epoch": 5863} {"train_loss": -27.75130271911621, "global_step": 486682, "epoch": 5863} {"train_loss": -27.47075843811035, "global_step": 486683, "epoch": 5863} {"train_loss": -27.489343643188477, "global_step": 486684, "epoch": 5863} {"train_loss": -27.521955490112305, "global_step": 486685, "epoch": 5863} {"train_loss": -27.485504150390625, "global_step": 486686, "epoch": 5863} {"train_loss": -27.340478897094727, "global_step": 486687, "epoch": 5863} {"train_loss": -27.4963436126709, "global_step": 486688, "epoch": 5863} {"train_loss": -27.20762062072754, "global_step": 486689, "epoch": 5863} {"train_loss": -27.18946647644043, "global_step": 486690, "epoch": 5863} {"train_loss": -27.511152267456055, "global_step": 486691, "epoch": 5863} {"train_loss": -27.414587020874023, "global_step": 486692, "epoch": 5863} {"train_loss": -27.080219268798828, "global_step": 486693, "epoch": 5863} {"train_loss": -27.297468185424805, "global_step": 486694, "epoch": 5863} {"train_loss": -27.01612663269043, "global_step": 486695, "epoch": 5863} {"train_loss": -27.397262573242188, "global_step": 486696, "epoch": 5863} {"train_loss": -27.3295955657959, "global_step": 486697, "epoch": 5863} {"train_loss": -27.4429874420166, "global_step": 486698, "epoch": 5863} {"train_loss": -27.2156925201416, "global_step": 486699, "epoch": 5863} {"train_loss": -27.38336181640625, "global_step": 486700, "epoch": 5863} {"train_loss": -27.2248592376709, "global_step": 486701, "epoch": 5863} {"train_loss": -27.28643798828125, "global_step": 486702, "epoch": 5863} {"train_loss": -27.073766708374023, "global_step": 486703, "epoch": 5863} {"train_loss": -27.47243309020996, "global_step": 486704, "epoch": 5863} {"train_loss": -27.10957145690918, "global_step": 486705, "epoch": 5863} {"train_loss": -26.987598419189453, "global_step": 486706, "epoch": 5863} {"train_loss": -27.230756759643555, "global_step": 486707, "epoch": 5863} {"train_loss": -27.3222599029541, "global_step": 486708, "epoch": 5863} {"train_loss": -27.065027236938477, "global_step": 486709, "epoch": 5863} {"train_loss": -27.056005477905273, "global_step": 486710, "epoch": 5863} {"train_loss": -27.17783116719809, "global_step": 486711, "epoch": 5863, "val_loss": 6551369.0} {"train_loss": -26.63056755065918, "global_step": 486712, "epoch": 5864} {"train_loss": -26.341602325439453, "global_step": 486713, "epoch": 5864} {"train_loss": -26.914880752563477, "global_step": 486714, "epoch": 5864} {"train_loss": -26.9207820892334, "global_step": 486715, "epoch": 5864} {"train_loss": -26.367603302001953, "global_step": 486716, "epoch": 5864} {"train_loss": -26.9034423828125, "global_step": 486717, "epoch": 5864} {"train_loss": -27.075611114501953, "global_step": 486718, "epoch": 5864} {"train_loss": -26.701217651367188, "global_step": 486719, "epoch": 5864} {"train_loss": -26.582128524780273, "global_step": 486720, "epoch": 5864} {"train_loss": -27.261465072631836, "global_step": 486721, "epoch": 5864} {"train_loss": -26.822498321533203, "global_step": 486722, "epoch": 5864} {"train_loss": -27.067474365234375, "global_step": 486723, "epoch": 5864} {"train_loss": -27.2576847076416, "global_step": 486724, "epoch": 5864} {"train_loss": -27.47576904296875, "global_step": 486725, "epoch": 5864} {"train_loss": -27.27967643737793, "global_step": 486726, "epoch": 5864} {"train_loss": -27.174604415893555, "global_step": 486727, "epoch": 5864} {"train_loss": -27.437000274658203, "global_step": 486728, "epoch": 5864} {"train_loss": -27.41021156311035, "global_step": 486729, "epoch": 5864} {"train_loss": -27.33954429626465, "global_step": 486730, "epoch": 5864} {"train_loss": -27.19959831237793, "global_step": 486731, "epoch": 5864} {"train_loss": -27.58565330505371, "global_step": 486732, "epoch": 5864} {"train_loss": -27.29615592956543, "global_step": 486733, "epoch": 5864} {"train_loss": -27.4210147857666, "global_step": 486734, "epoch": 5864} {"train_loss": -27.351896286010742, "global_step": 486735, "epoch": 5864} {"train_loss": -27.3956241607666, "global_step": 486736, "epoch": 5864} {"train_loss": -27.611865997314453, "global_step": 486737, "epoch": 5864} {"train_loss": -27.481897354125977, "global_step": 486738, "epoch": 5864} {"train_loss": -27.291006088256836, "global_step": 486739, "epoch": 5864} {"train_loss": -27.150360107421875, "global_step": 486740, "epoch": 5864} {"train_loss": -27.360319137573242, "global_step": 486741, "epoch": 5864} {"train_loss": -27.505950927734375, "global_step": 486742, "epoch": 5864} {"train_loss": -27.34063720703125, "global_step": 486743, "epoch": 5864} {"train_loss": -27.229658126831055, "global_step": 486744, "epoch": 5864} {"train_loss": -27.000593185424805, "global_step": 486745, "epoch": 5864} {"train_loss": -27.418262481689453, "global_step": 486746, "epoch": 5864} {"train_loss": -27.285154342651367, "global_step": 486747, "epoch": 5864} {"train_loss": -27.251708984375, "global_step": 486748, "epoch": 5864} {"train_loss": -27.06751823425293, "global_step": 486749, "epoch": 5864} {"train_loss": -27.0166072845459, "global_step": 486750, "epoch": 5864} {"train_loss": -27.29075050354004, "global_step": 486751, "epoch": 5864} {"train_loss": -27.130298614501953, "global_step": 486752, "epoch": 5864} {"train_loss": -26.89369010925293, "global_step": 486753, "epoch": 5864} {"train_loss": -27.729169845581055, "global_step": 486754, "epoch": 5864} {"train_loss": -27.451858520507812, "global_step": 486755, "epoch": 5864} {"train_loss": -27.22064208984375, "global_step": 486756, "epoch": 5864} {"train_loss": -27.360517501831055, "global_step": 486757, "epoch": 5864} {"train_loss": -27.2239990234375, "global_step": 486758, "epoch": 5864} {"train_loss": -27.073047637939453, "global_step": 486759, "epoch": 5864} {"train_loss": -26.993133544921875, "global_step": 486760, "epoch": 5864} {"train_loss": -26.925779342651367, "global_step": 486761, "epoch": 5864} {"train_loss": -27.134784698486328, "global_step": 486762, "epoch": 5864} {"train_loss": -27.232675552368164, "global_step": 486763, "epoch": 5864} {"train_loss": -27.16925621032715, "global_step": 486764, "epoch": 5864} {"train_loss": -27.2562198638916, "global_step": 486765, "epoch": 5864} {"train_loss": -26.992874145507812, "global_step": 486766, "epoch": 5864} {"train_loss": -27.338092803955078, "global_step": 486767, "epoch": 5864} {"train_loss": -27.305952072143555, "global_step": 486768, "epoch": 5864} {"train_loss": -27.40692138671875, "global_step": 486769, "epoch": 5864} {"train_loss": -27.74159049987793, "global_step": 486770, "epoch": 5864} {"train_loss": -27.2684326171875, "global_step": 486771, "epoch": 5864} {"train_loss": -27.20708656311035, "global_step": 486772, "epoch": 5864} {"train_loss": -27.35052490234375, "global_step": 486773, "epoch": 5864} {"train_loss": -27.186445236206055, "global_step": 486774, "epoch": 5864} {"train_loss": -27.03468132019043, "global_step": 486775, "epoch": 5864} {"train_loss": -27.505126953125, "global_step": 486776, "epoch": 5864} {"train_loss": -27.444387435913086, "global_step": 486777, "epoch": 5864} {"train_loss": -26.953943252563477, "global_step": 486778, "epoch": 5864} {"train_loss": -27.174535751342773, "global_step": 486779, "epoch": 5864} {"train_loss": -26.65376091003418, "global_step": 486780, "epoch": 5864} {"train_loss": -26.495624542236328, "global_step": 486781, "epoch": 5864} {"train_loss": -26.375463485717773, "global_step": 486782, "epoch": 5864} {"train_loss": -27.108068466186523, "global_step": 486783, "epoch": 5864} {"train_loss": -27.3784236907959, "global_step": 486784, "epoch": 5864} {"train_loss": -27.146820068359375, "global_step": 486785, "epoch": 5864} {"train_loss": -27.133289337158203, "global_step": 486786, "epoch": 5864} {"train_loss": -26.977142333984375, "global_step": 486787, "epoch": 5864} {"train_loss": -27.15284538269043, "global_step": 486788, "epoch": 5864} {"train_loss": -27.475683212280273, "global_step": 486789, "epoch": 5864} {"train_loss": -27.200002670288086, "global_step": 486790, "epoch": 5864} {"train_loss": -27.123205184936523, "global_step": 486791, "epoch": 5864} {"train_loss": -27.510053634643555, "global_step": 486792, "epoch": 5864} {"train_loss": -27.37860679626465, "global_step": 486793, "epoch": 5864} {"train_loss": -27.155578567321044, "global_step": 486794, "epoch": 5864, "val_loss": 6544608.0} {"train_loss": -25.10977554321289, "global_step": 486795, "epoch": 5865} {"train_loss": -23.90065574645996, "global_step": 486796, "epoch": 5865} {"train_loss": -24.58682632446289, "global_step": 486797, "epoch": 5865} {"train_loss": -25.755664825439453, "global_step": 486798, "epoch": 5865} {"train_loss": -25.151235580444336, "global_step": 486799, "epoch": 5865} {"train_loss": -25.7147216796875, "global_step": 486800, "epoch": 5865} {"train_loss": -26.086151123046875, "global_step": 486801, "epoch": 5865} {"train_loss": -26.160919189453125, "global_step": 486802, "epoch": 5865} {"train_loss": -25.894987106323242, "global_step": 486803, "epoch": 5865} {"train_loss": -26.591552734375, "global_step": 486804, "epoch": 5865} {"train_loss": -26.1976261138916, "global_step": 486805, "epoch": 5865} {"train_loss": -26.44280433654785, "global_step": 486806, "epoch": 5865} {"train_loss": -26.462921142578125, "global_step": 486807, "epoch": 5865} {"train_loss": -26.442129135131836, "global_step": 486808, "epoch": 5865} {"train_loss": -26.317819595336914, "global_step": 486809, "epoch": 5865} {"train_loss": -26.59175682067871, "global_step": 486810, "epoch": 5865} {"train_loss": -26.588153839111328, "global_step": 486811, "epoch": 5865} {"train_loss": -26.578125, "global_step": 486812, "epoch": 5865} {"train_loss": -26.760456085205078, "global_step": 486813, "epoch": 5865} {"train_loss": -26.609506607055664, "global_step": 486814, "epoch": 5865} {"train_loss": -26.482908248901367, "global_step": 486815, "epoch": 5865} {"train_loss": -26.62381362915039, "global_step": 486816, "epoch": 5865} {"train_loss": -26.755765914916992, "global_step": 486817, "epoch": 5865} {"train_loss": -26.66436195373535, "global_step": 486818, "epoch": 5865} {"train_loss": -26.37519645690918, "global_step": 486819, "epoch": 5865} {"train_loss": -27.052637100219727, "global_step": 486820, "epoch": 5865} {"train_loss": -26.78899574279785, "global_step": 486821, "epoch": 5865} {"train_loss": -27.2585506439209, "global_step": 486822, "epoch": 5865} {"train_loss": -26.75361442565918, "global_step": 486823, "epoch": 5865} {"train_loss": -27.057220458984375, "global_step": 486824, "epoch": 5865} {"train_loss": -26.686649322509766, "global_step": 486825, "epoch": 5865} {"train_loss": -27.218420028686523, "global_step": 486826, "epoch": 5865} {"train_loss": -26.892919540405273, "global_step": 486827, "epoch": 5865} {"train_loss": -26.857892990112305, "global_step": 486828, "epoch": 5865} {"train_loss": -27.247278213500977, "global_step": 486829, "epoch": 5865} {"train_loss": -27.233057022094727, "global_step": 486830, "epoch": 5865} {"train_loss": -27.342910766601562, "global_step": 486831, "epoch": 5865} {"train_loss": -27.356372833251953, "global_step": 486832, "epoch": 5865} {"train_loss": -27.21384620666504, "global_step": 486833, "epoch": 5865} {"train_loss": -27.511350631713867, "global_step": 486834, "epoch": 5865} {"train_loss": -27.37513542175293, "global_step": 486835, "epoch": 5865} {"train_loss": -27.462011337280273, "global_step": 486836, "epoch": 5865} {"train_loss": -27.129810333251953, "global_step": 486837, "epoch": 5865} {"train_loss": -27.032917022705078, "global_step": 486838, "epoch": 5865} {"train_loss": -27.798095703125, "global_step": 486839, "epoch": 5865} {"train_loss": -27.127111434936523, "global_step": 486840, "epoch": 5865} {"train_loss": -27.472564697265625, "global_step": 486841, "epoch": 5865} {"train_loss": -27.212966918945312, "global_step": 486842, "epoch": 5865} {"train_loss": -27.158405303955078, "global_step": 486843, "epoch": 5865} {"train_loss": -27.307767868041992, "global_step": 486844, "epoch": 5865} {"train_loss": -27.55849266052246, "global_step": 486845, "epoch": 5865} {"train_loss": -27.377607345581055, "global_step": 486846, "epoch": 5865} {"train_loss": -27.238754272460938, "global_step": 486847, "epoch": 5865} {"train_loss": -27.23186683654785, "global_step": 486848, "epoch": 5865} {"train_loss": -27.354248046875, "global_step": 486849, "epoch": 5865} {"train_loss": -27.365646362304688, "global_step": 486850, "epoch": 5865} {"train_loss": -27.6001033782959, "global_step": 486851, "epoch": 5865} {"train_loss": -27.038129806518555, "global_step": 486852, "epoch": 5865} {"train_loss": -27.677953720092773, "global_step": 486853, "epoch": 5865} {"train_loss": -27.525365829467773, "global_step": 486854, "epoch": 5865} {"train_loss": -27.538211822509766, "global_step": 486855, "epoch": 5865} {"train_loss": -27.579578399658203, "global_step": 486856, "epoch": 5865} {"train_loss": -27.496740341186523, "global_step": 486857, "epoch": 5865} {"train_loss": -27.624637603759766, "global_step": 486858, "epoch": 5865} {"train_loss": -27.04465675354004, "global_step": 486859, "epoch": 5865} {"train_loss": -27.44761085510254, "global_step": 486860, "epoch": 5865} {"train_loss": -27.48383903503418, "global_step": 486861, "epoch": 5865} {"train_loss": -27.584863662719727, "global_step": 486862, "epoch": 5865} {"train_loss": -27.641393661499023, "global_step": 486863, "epoch": 5865} {"train_loss": -27.45562744140625, "global_step": 486864, "epoch": 5865} {"train_loss": -27.700368881225586, "global_step": 486865, "epoch": 5865} {"train_loss": -27.602075576782227, "global_step": 486866, "epoch": 5865} {"train_loss": -27.422922134399414, "global_step": 486867, "epoch": 5865} {"train_loss": -27.48615837097168, "global_step": 486868, "epoch": 5865} {"train_loss": -27.626264572143555, "global_step": 486869, "epoch": 5865} {"train_loss": -27.536962509155273, "global_step": 486870, "epoch": 5865} {"train_loss": -27.3634033203125, "global_step": 486871, "epoch": 5865} {"train_loss": -27.50385856628418, "global_step": 486872, "epoch": 5865} {"train_loss": -27.232980728149414, "global_step": 486873, "epoch": 5865} {"train_loss": -27.323089599609375, "global_step": 486874, "epoch": 5865} {"train_loss": -27.1444034576416, "global_step": 486875, "epoch": 5865} {"train_loss": -26.962430953979492, "global_step": 486876, "epoch": 5865} {"train_loss": -26.960614078016167, "global_step": 486877, "epoch": 5865, "val_loss": 6537003.0} {"train_loss": -25.159324645996094, "global_step": 486878, "epoch": 5866} {"train_loss": -25.121417999267578, "global_step": 486879, "epoch": 5866} {"train_loss": -24.933616638183594, "global_step": 486880, "epoch": 5866} {"train_loss": -25.9124755859375, "global_step": 486881, "epoch": 5866} {"train_loss": -26.62898826599121, "global_step": 486882, "epoch": 5866} {"train_loss": -25.273019790649414, "global_step": 486883, "epoch": 5866} {"train_loss": -25.149953842163086, "global_step": 486884, "epoch": 5866} {"train_loss": -26.516672134399414, "global_step": 486885, "epoch": 5866} {"train_loss": -25.790851593017578, "global_step": 486886, "epoch": 5866} {"train_loss": -26.47981071472168, "global_step": 486887, "epoch": 5866} {"train_loss": -26.28611183166504, "global_step": 486888, "epoch": 5866} {"train_loss": -26.213769912719727, "global_step": 486889, "epoch": 5866} {"train_loss": -26.48333168029785, "global_step": 486890, "epoch": 5866} {"train_loss": -26.719207763671875, "global_step": 486891, "epoch": 5866} {"train_loss": -26.667150497436523, "global_step": 486892, "epoch": 5866} {"train_loss": -26.168384552001953, "global_step": 486893, "epoch": 5866} {"train_loss": -26.561420440673828, "global_step": 486894, "epoch": 5866} {"train_loss": -26.646432876586914, "global_step": 486895, "epoch": 5866} {"train_loss": -26.68426513671875, "global_step": 486896, "epoch": 5866} {"train_loss": -26.9914608001709, "global_step": 486897, "epoch": 5866} {"train_loss": -26.435583114624023, "global_step": 486898, "epoch": 5866} {"train_loss": -26.783945083618164, "global_step": 486899, "epoch": 5866} {"train_loss": -27.200361251831055, "global_step": 486900, "epoch": 5866} {"train_loss": -26.89776039123535, "global_step": 486901, "epoch": 5866} {"train_loss": -26.806228637695312, "global_step": 486902, "epoch": 5866} {"train_loss": -26.93977165222168, "global_step": 486903, "epoch": 5866} {"train_loss": -26.929651260375977, "global_step": 486904, "epoch": 5866} {"train_loss": -26.858068466186523, "global_step": 486905, "epoch": 5866} {"train_loss": -26.5216064453125, "global_step": 486906, "epoch": 5866} {"train_loss": -26.761770248413086, "global_step": 486907, "epoch": 5866} {"train_loss": -26.65705680847168, "global_step": 486908, "epoch": 5866} {"train_loss": -27.21723747253418, "global_step": 486909, "epoch": 5866} {"train_loss": -27.41395378112793, "global_step": 486910, "epoch": 5866} {"train_loss": -27.125425338745117, "global_step": 486911, "epoch": 5866} {"train_loss": -26.940053939819336, "global_step": 486912, "epoch": 5866} {"train_loss": -27.197370529174805, "global_step": 486913, "epoch": 5866} {"train_loss": -27.174551010131836, "global_step": 486914, "epoch": 5866} {"train_loss": -27.09268569946289, "global_step": 486915, "epoch": 5866} {"train_loss": -27.04092788696289, "global_step": 486916, "epoch": 5866} {"train_loss": -27.302392959594727, "global_step": 486917, "epoch": 5866} {"train_loss": -27.60682487487793, "global_step": 486918, "epoch": 5866} {"train_loss": -27.03047752380371, "global_step": 486919, "epoch": 5866} {"train_loss": -27.090042114257812, "global_step": 486920, "epoch": 5866} {"train_loss": -27.139148712158203, "global_step": 486921, "epoch": 5866} {"train_loss": -27.32118034362793, "global_step": 486922, "epoch": 5866} {"train_loss": -27.154287338256836, "global_step": 486923, "epoch": 5866} {"train_loss": -27.51934242248535, "global_step": 486924, "epoch": 5866} {"train_loss": -27.67616081237793, "global_step": 486925, "epoch": 5866} {"train_loss": -27.482406616210938, "global_step": 486926, "epoch": 5866} {"train_loss": -27.67864990234375, "global_step": 486927, "epoch": 5866} {"train_loss": -27.613544464111328, "global_step": 486928, "epoch": 5866} {"train_loss": -27.147216796875, "global_step": 486929, "epoch": 5866} {"train_loss": -27.4947566986084, "global_step": 486930, "epoch": 5866} {"train_loss": -27.56247329711914, "global_step": 486931, "epoch": 5866} {"train_loss": -27.3392333984375, "global_step": 486932, "epoch": 5866} {"train_loss": -27.615604400634766, "global_step": 486933, "epoch": 5866} {"train_loss": -27.311996459960938, "global_step": 486934, "epoch": 5866} {"train_loss": -27.7169132232666, "global_step": 486935, "epoch": 5866} {"train_loss": -27.400638580322266, "global_step": 486936, "epoch": 5866} {"train_loss": -27.527557373046875, "global_step": 486937, "epoch": 5866} {"train_loss": -27.334020614624023, "global_step": 486938, "epoch": 5866} {"train_loss": -27.004987716674805, "global_step": 486939, "epoch": 5866} {"train_loss": -27.42732048034668, "global_step": 486940, "epoch": 5866} {"train_loss": -27.049283981323242, "global_step": 486941, "epoch": 5866} {"train_loss": -27.589111328125, "global_step": 486942, "epoch": 5866} {"train_loss": -27.38107681274414, "global_step": 486943, "epoch": 5866} {"train_loss": -27.500959396362305, "global_step": 486944, "epoch": 5866} {"train_loss": -27.54254722595215, "global_step": 486945, "epoch": 5866} {"train_loss": -27.576080322265625, "global_step": 486946, "epoch": 5866} {"train_loss": -27.222883224487305, "global_step": 486947, "epoch": 5866} {"train_loss": -27.497833251953125, "global_step": 486948, "epoch": 5866} {"train_loss": -27.119983673095703, "global_step": 486949, "epoch": 5866} {"train_loss": -27.280561447143555, "global_step": 486950, "epoch": 5866} {"train_loss": -27.677173614501953, "global_step": 486951, "epoch": 5866} {"train_loss": -27.45423698425293, "global_step": 486952, "epoch": 5866} {"train_loss": -27.45412254333496, "global_step": 486953, "epoch": 5866} {"train_loss": -27.570775985717773, "global_step": 486954, "epoch": 5866} {"train_loss": -27.61505699157715, "global_step": 486955, "epoch": 5866} {"train_loss": -26.8149356842041, "global_step": 486956, "epoch": 5866} {"train_loss": -26.11624526977539, "global_step": 486957, "epoch": 5866} {"train_loss": -27.243234634399414, "global_step": 486958, "epoch": 5866} {"train_loss": -27.51059341430664, "global_step": 486959, "epoch": 5866} {"train_loss": -26.954800203622106, "global_step": 486960, "epoch": 5866, "val_loss": 6497674.5} {"train_loss": -26.14510154724121, "global_step": 486961, "epoch": 5867} {"train_loss": -26.088531494140625, "global_step": 486962, "epoch": 5867} {"train_loss": -25.84498405456543, "global_step": 486963, "epoch": 5867} {"train_loss": -24.720788955688477, "global_step": 486964, "epoch": 5867} {"train_loss": -25.27069091796875, "global_step": 486965, "epoch": 5867} {"train_loss": -26.297353744506836, "global_step": 486966, "epoch": 5867} {"train_loss": -26.019861221313477, "global_step": 486967, "epoch": 5867} {"train_loss": -25.814273834228516, "global_step": 486968, "epoch": 5867} {"train_loss": -26.210508346557617, "global_step": 486969, "epoch": 5867} {"train_loss": -26.26954460144043, "global_step": 486970, "epoch": 5867} {"train_loss": -25.907541275024414, "global_step": 486971, "epoch": 5867} {"train_loss": -26.21244239807129, "global_step": 486972, "epoch": 5867} {"train_loss": -25.920560836791992, "global_step": 486973, "epoch": 5867} {"train_loss": -26.656232833862305, "global_step": 486974, "epoch": 5867} {"train_loss": -26.471250534057617, "global_step": 486975, "epoch": 5867} {"train_loss": -26.28609275817871, "global_step": 486976, "epoch": 5867} {"train_loss": -26.41987419128418, "global_step": 486977, "epoch": 5867} {"train_loss": -26.43718910217285, "global_step": 486978, "epoch": 5867} {"train_loss": -26.369403839111328, "global_step": 486979, "epoch": 5867} {"train_loss": -26.512670516967773, "global_step": 486980, "epoch": 5867} {"train_loss": -26.249286651611328, "global_step": 486981, "epoch": 5867} {"train_loss": -26.302474975585938, "global_step": 486982, "epoch": 5867} {"train_loss": -26.452478408813477, "global_step": 486983, "epoch": 5867} {"train_loss": -26.413450241088867, "global_step": 486984, "epoch": 5867} {"train_loss": -26.560577392578125, "global_step": 486985, "epoch": 5867} {"train_loss": -26.510406494140625, "global_step": 486986, "epoch": 5867} {"train_loss": -26.807104110717773, "global_step": 486987, "epoch": 5867} {"train_loss": -26.78261375427246, "global_step": 486988, "epoch": 5867} {"train_loss": -26.940134048461914, "global_step": 486989, "epoch": 5867} {"train_loss": -27.071857452392578, "global_step": 486990, "epoch": 5867} {"train_loss": -27.146310806274414, "global_step": 486991, "epoch": 5867} {"train_loss": -27.06732177734375, "global_step": 486992, "epoch": 5867} {"train_loss": -26.950550079345703, "global_step": 486993, "epoch": 5867} {"train_loss": -27.20672035217285, "global_step": 486994, "epoch": 5867} {"train_loss": -27.396194458007812, "global_step": 486995, "epoch": 5867} {"train_loss": -27.270376205444336, "global_step": 486996, "epoch": 5867} {"train_loss": -27.001800537109375, "global_step": 486997, "epoch": 5867} {"train_loss": -27.4158992767334, "global_step": 486998, "epoch": 5867} {"train_loss": -27.055130004882812, "global_step": 486999, "epoch": 5867} {"train_loss": -27.31459617614746, "global_step": 487000, "epoch": 5867} {"train_loss": -27.06355094909668, "global_step": 487001, "epoch": 5867} {"train_loss": -27.192462921142578, "global_step": 487002, "epoch": 5867} {"train_loss": -26.83404541015625, "global_step": 487003, "epoch": 5867} {"train_loss": -27.458160400390625, "global_step": 487004, "epoch": 5867} {"train_loss": -27.302907943725586, "global_step": 487005, "epoch": 5867} {"train_loss": -27.30179786682129, "global_step": 487006, "epoch": 5867} {"train_loss": -27.8218936920166, "global_step": 487007, "epoch": 5867} {"train_loss": -27.390884399414062, "global_step": 487008, "epoch": 5867} {"train_loss": -27.26070213317871, "global_step": 487009, "epoch": 5867} {"train_loss": -27.414209365844727, "global_step": 487010, "epoch": 5867} {"train_loss": -27.522235870361328, "global_step": 487011, "epoch": 5867} {"train_loss": -27.193857192993164, "global_step": 487012, "epoch": 5867} {"train_loss": -27.356191635131836, "global_step": 487013, "epoch": 5867} {"train_loss": -27.733423233032227, "global_step": 487014, "epoch": 5867} {"train_loss": -27.26594352722168, "global_step": 487015, "epoch": 5867} {"train_loss": -27.659839630126953, "global_step": 487016, "epoch": 5867} {"train_loss": -27.41826820373535, "global_step": 487017, "epoch": 5867} {"train_loss": -27.38905906677246, "global_step": 487018, "epoch": 5867} {"train_loss": -27.31319236755371, "global_step": 487019, "epoch": 5867} {"train_loss": -27.401208877563477, "global_step": 487020, "epoch": 5867} {"train_loss": -27.186553955078125, "global_step": 487021, "epoch": 5867} {"train_loss": -27.576810836791992, "global_step": 487022, "epoch": 5867} {"train_loss": -27.40633201599121, "global_step": 487023, "epoch": 5867} {"train_loss": -27.22035026550293, "global_step": 487024, "epoch": 5867} {"train_loss": -27.551538467407227, "global_step": 487025, "epoch": 5867} {"train_loss": -27.703290939331055, "global_step": 487026, "epoch": 5867} {"train_loss": -27.528226852416992, "global_step": 487027, "epoch": 5867} {"train_loss": -27.52597427368164, "global_step": 487028, "epoch": 5867} {"train_loss": -27.53142738342285, "global_step": 487029, "epoch": 5867} {"train_loss": -27.18184471130371, "global_step": 487030, "epoch": 5867} {"train_loss": -27.5601863861084, "global_step": 487031, "epoch": 5867} {"train_loss": -27.22247314453125, "global_step": 487032, "epoch": 5867} {"train_loss": -27.45563316345215, "global_step": 487033, "epoch": 5867} {"train_loss": -27.1799259185791, "global_step": 487034, "epoch": 5867} {"train_loss": -27.074872970581055, "global_step": 487035, "epoch": 5867} {"train_loss": -27.189889907836914, "global_step": 487036, "epoch": 5867} {"train_loss": -27.43427085876465, "global_step": 487037, "epoch": 5867} {"train_loss": -27.08843994140625, "global_step": 487038, "epoch": 5867} {"train_loss": -27.103931427001953, "global_step": 487039, "epoch": 5867} {"train_loss": -27.419544219970703, "global_step": 487040, "epoch": 5867} {"train_loss": -27.248151779174805, "global_step": 487041, "epoch": 5867} {"train_loss": -27.339111328125, "global_step": 487042, "epoch": 5867} {"train_loss": -26.94942265246288, "global_step": 487043, "epoch": 5867, "val_loss": 6558467.5} {"train_loss": -27.146530151367188, "global_step": 487044, "epoch": 5868} {"train_loss": -26.28363609313965, "global_step": 487045, "epoch": 5868} {"train_loss": -27.071874618530273, "global_step": 487046, "epoch": 5868} {"train_loss": -26.99055290222168, "global_step": 487047, "epoch": 5868} {"train_loss": -26.278675079345703, "global_step": 487048, "epoch": 5868} {"train_loss": -26.85712242126465, "global_step": 487049, "epoch": 5868} {"train_loss": -26.922107696533203, "global_step": 487050, "epoch": 5868} {"train_loss": -27.06048011779785, "global_step": 487051, "epoch": 5868} {"train_loss": -26.450183868408203, "global_step": 487052, "epoch": 5868} {"train_loss": -27.297266006469727, "global_step": 487053, "epoch": 5868} {"train_loss": -26.900592803955078, "global_step": 487054, "epoch": 5868} {"train_loss": -26.80311393737793, "global_step": 487055, "epoch": 5868} {"train_loss": -27.359176635742188, "global_step": 487056, "epoch": 5868} {"train_loss": -26.66251564025879, "global_step": 487057, "epoch": 5868} {"train_loss": -27.290332794189453, "global_step": 487058, "epoch": 5868} {"train_loss": -26.69040298461914, "global_step": 487059, "epoch": 5868} {"train_loss": -26.945642471313477, "global_step": 487060, "epoch": 5868} {"train_loss": -26.8026065826416, "global_step": 487061, "epoch": 5868} {"train_loss": -26.99883460998535, "global_step": 487062, "epoch": 5868} {"train_loss": -26.925601959228516, "global_step": 487063, "epoch": 5868} {"train_loss": -27.1464786529541, "global_step": 487064, "epoch": 5868} {"train_loss": -27.607648849487305, "global_step": 487065, "epoch": 5868} {"train_loss": -27.089252471923828, "global_step": 487066, "epoch": 5868} {"train_loss": -26.79131507873535, "global_step": 487067, "epoch": 5868} {"train_loss": -27.227060317993164, "global_step": 487068, "epoch": 5868} {"train_loss": -26.55486488342285, "global_step": 487069, "epoch": 5868} {"train_loss": -26.900129318237305, "global_step": 487070, "epoch": 5868} {"train_loss": -27.05010414123535, "global_step": 487071, "epoch": 5868} {"train_loss": -26.960651397705078, "global_step": 487072, "epoch": 5868} {"train_loss": -27.040464401245117, "global_step": 487073, "epoch": 5868} {"train_loss": -27.355606079101562, "global_step": 487074, "epoch": 5868} {"train_loss": -26.7209415435791, "global_step": 487075, "epoch": 5868} {"train_loss": -27.200170516967773, "global_step": 487076, "epoch": 5868} {"train_loss": -26.849018096923828, "global_step": 487077, "epoch": 5868} {"train_loss": -27.1336612701416, "global_step": 487078, "epoch": 5868} {"train_loss": -27.10965919494629, "global_step": 487079, "epoch": 5868} {"train_loss": -27.0577392578125, "global_step": 487080, "epoch": 5868} {"train_loss": -27.403852462768555, "global_step": 487081, "epoch": 5868} {"train_loss": -27.461652755737305, "global_step": 487082, "epoch": 5868} {"train_loss": -27.352834701538086, "global_step": 487083, "epoch": 5868} {"train_loss": -27.44378089904785, "global_step": 487084, "epoch": 5868} {"train_loss": -27.249311447143555, "global_step": 487085, "epoch": 5868} {"train_loss": -27.222692489624023, "global_step": 487086, "epoch": 5868} {"train_loss": -27.64923095703125, "global_step": 487087, "epoch": 5868} {"train_loss": -27.333663940429688, "global_step": 487088, "epoch": 5868} {"train_loss": -27.395872116088867, "global_step": 487089, "epoch": 5868} {"train_loss": -27.160938262939453, "global_step": 487090, "epoch": 5868} {"train_loss": -27.647703170776367, "global_step": 487091, "epoch": 5868} {"train_loss": -27.88492774963379, "global_step": 487092, "epoch": 5868} {"train_loss": -27.415491104125977, "global_step": 487093, "epoch": 5868} {"train_loss": -27.467060089111328, "global_step": 487094, "epoch": 5868} {"train_loss": -27.56134033203125, "global_step": 487095, "epoch": 5868} {"train_loss": -27.5080509185791, "global_step": 487096, "epoch": 5868} {"train_loss": -27.637638092041016, "global_step": 487097, "epoch": 5868} {"train_loss": -27.563648223876953, "global_step": 487098, "epoch": 5868} {"train_loss": -27.544830322265625, "global_step": 487099, "epoch": 5868} {"train_loss": -27.410003662109375, "global_step": 487100, "epoch": 5868} {"train_loss": -27.709014892578125, "global_step": 487101, "epoch": 5868} {"train_loss": -27.474111557006836, "global_step": 487102, "epoch": 5868} {"train_loss": -27.4116153717041, "global_step": 487103, "epoch": 5868} {"train_loss": -27.79621696472168, "global_step": 487104, "epoch": 5868} {"train_loss": -27.423871994018555, "global_step": 487105, "epoch": 5868} {"train_loss": -27.409168243408203, "global_step": 487106, "epoch": 5868} {"train_loss": -27.522232055664062, "global_step": 487107, "epoch": 5868} {"train_loss": -27.51226234436035, "global_step": 487108, "epoch": 5868} {"train_loss": -27.315753936767578, "global_step": 487109, "epoch": 5868} {"train_loss": -27.526351928710938, "global_step": 487110, "epoch": 5868} {"train_loss": -27.324567794799805, "global_step": 487111, "epoch": 5868} {"train_loss": -27.412214279174805, "global_step": 487112, "epoch": 5868} {"train_loss": -27.438146591186523, "global_step": 487113, "epoch": 5868} {"train_loss": -27.593292236328125, "global_step": 487114, "epoch": 5868} {"train_loss": -27.5367374420166, "global_step": 487115, "epoch": 5868} {"train_loss": -27.286060333251953, "global_step": 487116, "epoch": 5868} {"train_loss": -27.19500160217285, "global_step": 487117, "epoch": 5868} {"train_loss": -26.737201690673828, "global_step": 487118, "epoch": 5868} {"train_loss": -26.729162216186523, "global_step": 487119, "epoch": 5868} {"train_loss": -26.7916202545166, "global_step": 487120, "epoch": 5868} {"train_loss": -26.424535751342773, "global_step": 487121, "epoch": 5868} {"train_loss": -26.818212509155273, "global_step": 487122, "epoch": 5868} {"train_loss": -27.1603946685791, "global_step": 487123, "epoch": 5868} {"train_loss": -26.86429214477539, "global_step": 487124, "epoch": 5868} {"train_loss": -26.65032386779785, "global_step": 487125, "epoch": 5868} {"train_loss": -27.154064592108668, "global_step": 487126, "epoch": 5868, "val_loss": 6529397.0} {"train_loss": -26.34821128845215, "global_step": 487127, "epoch": 5869} {"train_loss": -26.899866104125977, "global_step": 487128, "epoch": 5869} {"train_loss": -26.762100219726562, "global_step": 487129, "epoch": 5869} {"train_loss": -25.879995346069336, "global_step": 487130, "epoch": 5869} {"train_loss": -26.927417755126953, "global_step": 487131, "epoch": 5869} {"train_loss": -26.703840255737305, "global_step": 487132, "epoch": 5869} {"train_loss": -26.7926082611084, "global_step": 487133, "epoch": 5869} {"train_loss": -26.782567977905273, "global_step": 487134, "epoch": 5869} {"train_loss": -26.513565063476562, "global_step": 487135, "epoch": 5869} {"train_loss": -26.597070693969727, "global_step": 487136, "epoch": 5869} {"train_loss": -26.014856338500977, "global_step": 487137, "epoch": 5869} {"train_loss": -26.918664932250977, "global_step": 487138, "epoch": 5869} {"train_loss": -26.616775512695312, "global_step": 487139, "epoch": 5869} {"train_loss": -26.62540054321289, "global_step": 487140, "epoch": 5869} {"train_loss": -26.90302085876465, "global_step": 487141, "epoch": 5869} {"train_loss": -26.835437774658203, "global_step": 487142, "epoch": 5869} {"train_loss": -26.94782066345215, "global_step": 487143, "epoch": 5869} {"train_loss": -27.030969619750977, "global_step": 487144, "epoch": 5869} {"train_loss": -26.778308868408203, "global_step": 487145, "epoch": 5869} {"train_loss": -27.115524291992188, "global_step": 487146, "epoch": 5869} {"train_loss": -27.0201358795166, "global_step": 487147, "epoch": 5869} {"train_loss": -27.295795440673828, "global_step": 487148, "epoch": 5869} {"train_loss": -26.613622665405273, "global_step": 487149, "epoch": 5869} {"train_loss": -27.149444580078125, "global_step": 487150, "epoch": 5869} {"train_loss": -27.02178382873535, "global_step": 487151, "epoch": 5869} {"train_loss": -27.281030654907227, "global_step": 487152, "epoch": 5869} {"train_loss": -26.914758682250977, "global_step": 487153, "epoch": 5869} {"train_loss": -27.048187255859375, "global_step": 487154, "epoch": 5869} {"train_loss": -27.189228057861328, "global_step": 487155, "epoch": 5869} {"train_loss": -27.336505889892578, "global_step": 487156, "epoch": 5869} {"train_loss": -27.31499671936035, "global_step": 487157, "epoch": 5869} {"train_loss": -27.3525390625, "global_step": 487158, "epoch": 5869} {"train_loss": -27.621076583862305, "global_step": 487159, "epoch": 5869} {"train_loss": -27.322586059570312, "global_step": 487160, "epoch": 5869} {"train_loss": -27.02805519104004, "global_step": 487161, "epoch": 5869} {"train_loss": -27.418054580688477, "global_step": 487162, "epoch": 5869} {"train_loss": -27.407506942749023, "global_step": 487163, "epoch": 5869} {"train_loss": -27.14544677734375, "global_step": 487164, "epoch": 5869} {"train_loss": -27.046823501586914, "global_step": 487165, "epoch": 5869} {"train_loss": -27.333967208862305, "global_step": 487166, "epoch": 5869} {"train_loss": -27.498947143554688, "global_step": 487167, "epoch": 5869} {"train_loss": -27.244342803955078, "global_step": 487168, "epoch": 5869} {"train_loss": -27.423908233642578, "global_step": 487169, "epoch": 5869} {"train_loss": -27.255390167236328, "global_step": 487170, "epoch": 5869} {"train_loss": -27.2437744140625, "global_step": 487171, "epoch": 5869} {"train_loss": -27.37139892578125, "global_step": 487172, "epoch": 5869} {"train_loss": -27.513208389282227, "global_step": 487173, "epoch": 5869} {"train_loss": -27.488189697265625, "global_step": 487174, "epoch": 5869} {"train_loss": -27.295257568359375, "global_step": 487175, "epoch": 5869} {"train_loss": -27.803211212158203, "global_step": 487176, "epoch": 5869} {"train_loss": -26.9289608001709, "global_step": 487177, "epoch": 5869} {"train_loss": -27.209625244140625, "global_step": 487178, "epoch": 5869} {"train_loss": -26.571313858032227, "global_step": 487179, "epoch": 5869} {"train_loss": -27.206329345703125, "global_step": 487180, "epoch": 5869} {"train_loss": -26.956846237182617, "global_step": 487181, "epoch": 5869} {"train_loss": -27.69085121154785, "global_step": 487182, "epoch": 5869} {"train_loss": -26.656330108642578, "global_step": 487183, "epoch": 5869} {"train_loss": -26.82480239868164, "global_step": 487184, "epoch": 5869} {"train_loss": -27.300992965698242, "global_step": 487185, "epoch": 5869} {"train_loss": -26.99338722229004, "global_step": 487186, "epoch": 5869} {"train_loss": -27.64589500427246, "global_step": 487187, "epoch": 5869} {"train_loss": -27.25282096862793, "global_step": 487188, "epoch": 5869} {"train_loss": -27.07200050354004, "global_step": 487189, "epoch": 5869} {"train_loss": -27.089614868164062, "global_step": 487190, "epoch": 5869} {"train_loss": -27.43706703186035, "global_step": 487191, "epoch": 5869} {"train_loss": -27.201868057250977, "global_step": 487192, "epoch": 5869} {"train_loss": -27.290283203125, "global_step": 487193, "epoch": 5869} {"train_loss": -27.3347110748291, "global_step": 487194, "epoch": 5869} {"train_loss": -27.52948570251465, "global_step": 487195, "epoch": 5869} {"train_loss": -27.37629508972168, "global_step": 487196, "epoch": 5869} {"train_loss": -27.265594482421875, "global_step": 487197, "epoch": 5869} {"train_loss": -27.495038986206055, "global_step": 487198, "epoch": 5869} {"train_loss": -27.53923988342285, "global_step": 487199, "epoch": 5869} {"train_loss": -27.65803337097168, "global_step": 487200, "epoch": 5869} {"train_loss": -27.37729263305664, "global_step": 487201, "epoch": 5869} {"train_loss": -27.6539363861084, "global_step": 487202, "epoch": 5869} {"train_loss": -27.415754318237305, "global_step": 487203, "epoch": 5869} {"train_loss": -27.476537704467773, "global_step": 487204, "epoch": 5869} {"train_loss": -27.297643661499023, "global_step": 487205, "epoch": 5869} {"train_loss": -27.54361915588379, "global_step": 487206, "epoch": 5869} {"train_loss": -27.58139991760254, "global_step": 487207, "epoch": 5869} {"train_loss": -27.561038970947266, "global_step": 487208, "epoch": 5869} {"train_loss": -27.14036911654185, "global_step": 487209, "epoch": 5869, "val_loss": 6612284.5} {"train_loss": -27.2532901763916, "global_step": 487210, "epoch": 5870} {"train_loss": -26.29031753540039, "global_step": 487211, "epoch": 5870} {"train_loss": -26.0801944732666, "global_step": 487212, "epoch": 5870} {"train_loss": -25.872058868408203, "global_step": 487213, "epoch": 5870} {"train_loss": -26.329809188842773, "global_step": 487214, "epoch": 5870} {"train_loss": -26.958154678344727, "global_step": 487215, "epoch": 5870} {"train_loss": -26.902875900268555, "global_step": 487216, "epoch": 5870} {"train_loss": -26.484472274780273, "global_step": 487217, "epoch": 5870} {"train_loss": -27.162185668945312, "global_step": 487218, "epoch": 5870} {"train_loss": -27.035877227783203, "global_step": 487219, "epoch": 5870} {"train_loss": -27.31439208984375, "global_step": 487220, "epoch": 5870} {"train_loss": -26.719449996948242, "global_step": 487221, "epoch": 5870} {"train_loss": -27.234333038330078, "global_step": 487222, "epoch": 5870} {"train_loss": -27.02997398376465, "global_step": 487223, "epoch": 5870} {"train_loss": -27.22273063659668, "global_step": 487224, "epoch": 5870} {"train_loss": -27.170270919799805, "global_step": 487225, "epoch": 5870} {"train_loss": -26.76303482055664, "global_step": 487226, "epoch": 5870} {"train_loss": -26.781702041625977, "global_step": 487227, "epoch": 5870} {"train_loss": -27.525787353515625, "global_step": 487228, "epoch": 5870} {"train_loss": -27.108020782470703, "global_step": 487229, "epoch": 5870} {"train_loss": -27.200597763061523, "global_step": 487230, "epoch": 5870} {"train_loss": -27.354047775268555, "global_step": 487231, "epoch": 5870} {"train_loss": -27.21150016784668, "global_step": 487232, "epoch": 5870} {"train_loss": -27.4498233795166, "global_step": 487233, "epoch": 5870} {"train_loss": -27.29799461364746, "global_step": 487234, "epoch": 5870} {"train_loss": -27.2022762298584, "global_step": 487235, "epoch": 5870} {"train_loss": -27.15151023864746, "global_step": 487236, "epoch": 5870} {"train_loss": -27.150846481323242, "global_step": 487237, "epoch": 5870} {"train_loss": -27.445581436157227, "global_step": 487238, "epoch": 5870} {"train_loss": -27.561975479125977, "global_step": 487239, "epoch": 5870} {"train_loss": -27.676427841186523, "global_step": 487240, "epoch": 5870} {"train_loss": -27.532184600830078, "global_step": 487241, "epoch": 5870} {"train_loss": -27.61822509765625, "global_step": 487242, "epoch": 5870} {"train_loss": -27.437793731689453, "global_step": 487243, "epoch": 5870} {"train_loss": -27.57398796081543, "global_step": 487244, "epoch": 5870} {"train_loss": -27.270559310913086, "global_step": 487245, "epoch": 5870} {"train_loss": -27.23000144958496, "global_step": 487246, "epoch": 5870} {"train_loss": -27.502103805541992, "global_step": 487247, "epoch": 5870} {"train_loss": -27.283781051635742, "global_step": 487248, "epoch": 5870} {"train_loss": -27.709497451782227, "global_step": 487249, "epoch": 5870} {"train_loss": -27.36869239807129, "global_step": 487250, "epoch": 5870} {"train_loss": -27.662744522094727, "global_step": 487251, "epoch": 5870} {"train_loss": -27.54973793029785, "global_step": 487252, "epoch": 5870} {"train_loss": -27.681110382080078, "global_step": 487253, "epoch": 5870} {"train_loss": -27.30914306640625, "global_step": 487254, "epoch": 5870} {"train_loss": -27.255329132080078, "global_step": 487255, "epoch": 5870} {"train_loss": -27.75872230529785, "global_step": 487256, "epoch": 5870} {"train_loss": -27.0853328704834, "global_step": 487257, "epoch": 5870} {"train_loss": -27.522363662719727, "global_step": 487258, "epoch": 5870} {"train_loss": -27.575979232788086, "global_step": 487259, "epoch": 5870} {"train_loss": -27.554916381835938, "global_step": 487260, "epoch": 5870} {"train_loss": -27.764677047729492, "global_step": 487261, "epoch": 5870} {"train_loss": -27.890470504760742, "global_step": 487262, "epoch": 5870} {"train_loss": -27.70944595336914, "global_step": 487263, "epoch": 5870} {"train_loss": -27.05596351623535, "global_step": 487264, "epoch": 5870} {"train_loss": -25.402286529541016, "global_step": 487265, "epoch": 5870} {"train_loss": -25.679960250854492, "global_step": 487266, "epoch": 5870} {"train_loss": -26.381072998046875, "global_step": 487267, "epoch": 5870} {"train_loss": -26.457977294921875, "global_step": 487268, "epoch": 5870} {"train_loss": -27.25372886657715, "global_step": 487269, "epoch": 5870} {"train_loss": -26.586353302001953, "global_step": 487270, "epoch": 5870} {"train_loss": -26.635534286499023, "global_step": 487271, "epoch": 5870} {"train_loss": -26.956750869750977, "global_step": 487272, "epoch": 5870} {"train_loss": -27.114154815673828, "global_step": 487273, "epoch": 5870} {"train_loss": -27.031478881835938, "global_step": 487274, "epoch": 5870} {"train_loss": -26.764020919799805, "global_step": 487275, "epoch": 5870} {"train_loss": -26.9616641998291, "global_step": 487276, "epoch": 5870} {"train_loss": -26.76912498474121, "global_step": 487277, "epoch": 5870} {"train_loss": -26.71308708190918, "global_step": 487278, "epoch": 5870} {"train_loss": -27.051361083984375, "global_step": 487279, "epoch": 5870} {"train_loss": -27.000593185424805, "global_step": 487280, "epoch": 5870} {"train_loss": -26.803424835205078, "global_step": 487281, "epoch": 5870} {"train_loss": -26.936079025268555, "global_step": 487282, "epoch": 5870} {"train_loss": -27.186782836914062, "global_step": 487283, "epoch": 5870} {"train_loss": -26.921844482421875, "global_step": 487284, "epoch": 5870} {"train_loss": -27.318613052368164, "global_step": 487285, "epoch": 5870} {"train_loss": -27.3304443359375, "global_step": 487286, "epoch": 5870} {"train_loss": -27.125564575195312, "global_step": 487287, "epoch": 5870} {"train_loss": -26.96323585510254, "global_step": 487288, "epoch": 5870} {"train_loss": -27.24285888671875, "global_step": 487289, "epoch": 5870} {"train_loss": -27.05609130859375, "global_step": 487290, "epoch": 5870} {"train_loss": -26.881799697875977, "global_step": 487291, "epoch": 5870} {"train_loss": -27.119891339037792, "global_step": 487292, "epoch": 5870, "val_loss": 6519112.5} {"train_loss": -27.238956451416016, "global_step": 487293, "epoch": 5871} {"train_loss": -27.0709171295166, "global_step": 487294, "epoch": 5871} {"train_loss": -26.819019317626953, "global_step": 487295, "epoch": 5871} {"train_loss": -26.795124053955078, "global_step": 487296, "epoch": 5871} {"train_loss": -27.148223876953125, "global_step": 487297, "epoch": 5871} {"train_loss": -26.717920303344727, "global_step": 487298, "epoch": 5871} {"train_loss": -27.055402755737305, "global_step": 487299, "epoch": 5871} {"train_loss": -27.136276245117188, "global_step": 487300, "epoch": 5871} {"train_loss": -26.887311935424805, "global_step": 487301, "epoch": 5871} {"train_loss": -26.742990493774414, "global_step": 487302, "epoch": 5871} {"train_loss": -26.292261123657227, "global_step": 487303, "epoch": 5871} {"train_loss": -26.912311553955078, "global_step": 487304, "epoch": 5871} {"train_loss": -26.792301177978516, "global_step": 487305, "epoch": 5871} {"train_loss": -26.654172897338867, "global_step": 487306, "epoch": 5871} {"train_loss": -27.144983291625977, "global_step": 487307, "epoch": 5871} {"train_loss": -27.564172744750977, "global_step": 487308, "epoch": 5871} {"train_loss": -26.99350357055664, "global_step": 487309, "epoch": 5871} {"train_loss": -27.388757705688477, "global_step": 487310, "epoch": 5871} {"train_loss": -27.48520278930664, "global_step": 487311, "epoch": 5871} {"train_loss": -27.032751083374023, "global_step": 487312, "epoch": 5871} {"train_loss": -27.6632080078125, "global_step": 487313, "epoch": 5871} {"train_loss": -27.662036895751953, "global_step": 487314, "epoch": 5871} {"train_loss": -27.138656616210938, "global_step": 487315, "epoch": 5871} {"train_loss": -27.069812774658203, "global_step": 487316, "epoch": 5871} {"train_loss": -27.5152645111084, "global_step": 487317, "epoch": 5871} {"train_loss": -27.072717666625977, "global_step": 487318, "epoch": 5871} {"train_loss": -27.613073348999023, "global_step": 487319, "epoch": 5871} {"train_loss": -27.06092643737793, "global_step": 487320, "epoch": 5871} {"train_loss": -26.997608184814453, "global_step": 487321, "epoch": 5871} {"train_loss": -27.00897216796875, "global_step": 487322, "epoch": 5871} {"train_loss": -27.454486846923828, "global_step": 487323, "epoch": 5871} {"train_loss": -27.510852813720703, "global_step": 487324, "epoch": 5871} {"train_loss": -26.96881675720215, "global_step": 487325, "epoch": 5871} {"train_loss": -27.375532150268555, "global_step": 487326, "epoch": 5871} {"train_loss": -27.17890739440918, "global_step": 487327, "epoch": 5871} {"train_loss": -27.40673828125, "global_step": 487328, "epoch": 5871} {"train_loss": -27.126129150390625, "global_step": 487329, "epoch": 5871} {"train_loss": -27.406177520751953, "global_step": 487330, "epoch": 5871} {"train_loss": -27.254016876220703, "global_step": 487331, "epoch": 5871} {"train_loss": -26.98882484436035, "global_step": 487332, "epoch": 5871} {"train_loss": -26.82728385925293, "global_step": 487333, "epoch": 5871} {"train_loss": -26.989831924438477, "global_step": 487334, "epoch": 5871} {"train_loss": -27.275754928588867, "global_step": 487335, "epoch": 5871} {"train_loss": -27.25284194946289, "global_step": 487336, "epoch": 5871} {"train_loss": -27.270666122436523, "global_step": 487337, "epoch": 5871} {"train_loss": -27.00925064086914, "global_step": 487338, "epoch": 5871} {"train_loss": -27.495716094970703, "global_step": 487339, "epoch": 5871} {"train_loss": -27.060522079467773, "global_step": 487340, "epoch": 5871} {"train_loss": -27.411258697509766, "global_step": 487341, "epoch": 5871} {"train_loss": -27.235265731811523, "global_step": 487342, "epoch": 5871} {"train_loss": -27.22930335998535, "global_step": 487343, "epoch": 5871} {"train_loss": -27.533777236938477, "global_step": 487344, "epoch": 5871} {"train_loss": -27.544132232666016, "global_step": 487345, "epoch": 5871} {"train_loss": -27.093738555908203, "global_step": 487346, "epoch": 5871} {"train_loss": -27.395727157592773, "global_step": 487347, "epoch": 5871} {"train_loss": -27.021024703979492, "global_step": 487348, "epoch": 5871} {"train_loss": -27.479413986206055, "global_step": 487349, "epoch": 5871} {"train_loss": -27.33106803894043, "global_step": 487350, "epoch": 5871} {"train_loss": -27.398712158203125, "global_step": 487351, "epoch": 5871} {"train_loss": -27.440216064453125, "global_step": 487352, "epoch": 5871} {"train_loss": -27.359973907470703, "global_step": 487353, "epoch": 5871} {"train_loss": -27.56894874572754, "global_step": 487354, "epoch": 5871} {"train_loss": -27.696924209594727, "global_step": 487355, "epoch": 5871} {"train_loss": -27.420934677124023, "global_step": 487356, "epoch": 5871} {"train_loss": -27.604917526245117, "global_step": 487357, "epoch": 5871} {"train_loss": -27.581729888916016, "global_step": 487358, "epoch": 5871} {"train_loss": -27.383655548095703, "global_step": 487359, "epoch": 5871} {"train_loss": -27.7446346282959, "global_step": 487360, "epoch": 5871} {"train_loss": -27.614667892456055, "global_step": 487361, "epoch": 5871} {"train_loss": -27.816495895385742, "global_step": 487362, "epoch": 5871} {"train_loss": -27.414169311523438, "global_step": 487363, "epoch": 5871} {"train_loss": -27.405536651611328, "global_step": 487364, "epoch": 5871} {"train_loss": -27.586416244506836, "global_step": 487365, "epoch": 5871} {"train_loss": -27.149961471557617, "global_step": 487366, "epoch": 5871} {"train_loss": -27.73243522644043, "global_step": 487367, "epoch": 5871} {"train_loss": -27.091711044311523, "global_step": 487368, "epoch": 5871} {"train_loss": -27.87017822265625, "global_step": 487369, "epoch": 5871} {"train_loss": -27.170705795288086, "global_step": 487370, "epoch": 5871} {"train_loss": -27.436737060546875, "global_step": 487371, "epoch": 5871} {"train_loss": -27.406814575195312, "global_step": 487372, "epoch": 5871} {"train_loss": -27.396780014038086, "global_step": 487373, "epoch": 5871} {"train_loss": -27.316394805908203, "global_step": 487374, "epoch": 5871} {"train_loss": -27.245694378772413, "global_step": 487375, "epoch": 5871, "val_loss": 6561877.0} {"train_loss": -22.769710540771484, "global_step": 487376, "epoch": 5872} {"train_loss": -20.488889694213867, "global_step": 487377, "epoch": 5872} {"train_loss": -25.216327667236328, "global_step": 487378, "epoch": 5872} {"train_loss": -22.588098526000977, "global_step": 487379, "epoch": 5872} {"train_loss": -23.907812118530273, "global_step": 487380, "epoch": 5872} {"train_loss": -24.478357315063477, "global_step": 487381, "epoch": 5872} {"train_loss": -25.47371482849121, "global_step": 487382, "epoch": 5872} {"train_loss": -25.062271118164062, "global_step": 487383, "epoch": 5872} {"train_loss": -25.561166763305664, "global_step": 487384, "epoch": 5872} {"train_loss": -25.318796157836914, "global_step": 487385, "epoch": 5872} {"train_loss": -25.700759887695312, "global_step": 487386, "epoch": 5872} {"train_loss": -25.77961540222168, "global_step": 487387, "epoch": 5872} {"train_loss": -25.576171875, "global_step": 487388, "epoch": 5872} {"train_loss": -26.00962257385254, "global_step": 487389, "epoch": 5872} {"train_loss": -25.9525089263916, "global_step": 487390, "epoch": 5872} {"train_loss": -26.08511734008789, "global_step": 487391, "epoch": 5872} {"train_loss": -25.88042640686035, "global_step": 487392, "epoch": 5872} {"train_loss": -25.706335067749023, "global_step": 487393, "epoch": 5872} {"train_loss": -25.958038330078125, "global_step": 487394, "epoch": 5872} {"train_loss": -26.13343620300293, "global_step": 487395, "epoch": 5872} {"train_loss": -26.033294677734375, "global_step": 487396, "epoch": 5872} {"train_loss": -26.0450382232666, "global_step": 487397, "epoch": 5872} {"train_loss": -26.03217124938965, "global_step": 487398, "epoch": 5872} {"train_loss": -26.333078384399414, "global_step": 487399, "epoch": 5872} {"train_loss": -26.095746994018555, "global_step": 487400, "epoch": 5872} {"train_loss": -26.25882911682129, "global_step": 487401, "epoch": 5872} {"train_loss": -26.471933364868164, "global_step": 487402, "epoch": 5872} {"train_loss": -26.563215255737305, "global_step": 487403, "epoch": 5872} {"train_loss": -26.411264419555664, "global_step": 487404, "epoch": 5872} {"train_loss": -26.47194480895996, "global_step": 487405, "epoch": 5872} {"train_loss": -26.677656173706055, "global_step": 487406, "epoch": 5872} {"train_loss": -26.75396728515625, "global_step": 487407, "epoch": 5872} {"train_loss": -26.127477645874023, "global_step": 487408, "epoch": 5872} {"train_loss": -26.881677627563477, "global_step": 487409, "epoch": 5872} {"train_loss": -26.4449405670166, "global_step": 487410, "epoch": 5872} {"train_loss": -26.866016387939453, "global_step": 487411, "epoch": 5872} {"train_loss": -26.814716339111328, "global_step": 487412, "epoch": 5872} {"train_loss": -26.60297203063965, "global_step": 487413, "epoch": 5872} {"train_loss": -26.512922286987305, "global_step": 487414, "epoch": 5872} {"train_loss": -26.989715576171875, "global_step": 487415, "epoch": 5872} {"train_loss": -27.093698501586914, "global_step": 487416, "epoch": 5872} {"train_loss": -26.827306747436523, "global_step": 487417, "epoch": 5872} {"train_loss": -27.17502784729004, "global_step": 487418, "epoch": 5872} {"train_loss": -26.84214210510254, "global_step": 487419, "epoch": 5872} {"train_loss": -26.742345809936523, "global_step": 487420, "epoch": 5872} {"train_loss": -27.017908096313477, "global_step": 487421, "epoch": 5872} {"train_loss": -27.266738891601562, "global_step": 487422, "epoch": 5872} {"train_loss": -27.2447566986084, "global_step": 487423, "epoch": 5872} {"train_loss": -26.812219619750977, "global_step": 487424, "epoch": 5872} {"train_loss": -27.01669692993164, "global_step": 487425, "epoch": 5872} {"train_loss": -26.778757095336914, "global_step": 487426, "epoch": 5872} {"train_loss": -27.393857955932617, "global_step": 487427, "epoch": 5872} {"train_loss": -27.166685104370117, "global_step": 487428, "epoch": 5872} {"train_loss": -27.3503360748291, "global_step": 487429, "epoch": 5872} {"train_loss": -26.886526107788086, "global_step": 487430, "epoch": 5872} {"train_loss": -26.873701095581055, "global_step": 487431, "epoch": 5872} {"train_loss": -27.051177978515625, "global_step": 487432, "epoch": 5872} {"train_loss": -27.26643180847168, "global_step": 487433, "epoch": 5872} {"train_loss": -27.105701446533203, "global_step": 487434, "epoch": 5872} {"train_loss": -27.312856674194336, "global_step": 487435, "epoch": 5872} {"train_loss": -27.6514949798584, "global_step": 487436, "epoch": 5872} {"train_loss": -27.346506118774414, "global_step": 487437, "epoch": 5872} {"train_loss": -27.51240348815918, "global_step": 487438, "epoch": 5872} {"train_loss": -27.28997802734375, "global_step": 487439, "epoch": 5872} {"train_loss": -27.228199005126953, "global_step": 487440, "epoch": 5872} {"train_loss": -27.286325454711914, "global_step": 487441, "epoch": 5872} {"train_loss": -27.002307891845703, "global_step": 487442, "epoch": 5872} {"train_loss": -27.249128341674805, "global_step": 487443, "epoch": 5872} {"train_loss": -27.25901222229004, "global_step": 487444, "epoch": 5872} {"train_loss": -27.30720329284668, "global_step": 487445, "epoch": 5872} {"train_loss": -27.17242431640625, "global_step": 487446, "epoch": 5872} {"train_loss": -27.227951049804688, "global_step": 487447, "epoch": 5872} {"train_loss": -27.56597328186035, "global_step": 487448, "epoch": 5872} {"train_loss": -27.229339599609375, "global_step": 487449, "epoch": 5872} {"train_loss": -26.86152458190918, "global_step": 487450, "epoch": 5872} {"train_loss": -26.81283950805664, "global_step": 487451, "epoch": 5872} {"train_loss": -27.28297233581543, "global_step": 487452, "epoch": 5872} {"train_loss": -27.308460235595703, "global_step": 487453, "epoch": 5872} {"train_loss": -26.823089599609375, "global_step": 487454, "epoch": 5872} {"train_loss": -26.96943473815918, "global_step": 487455, "epoch": 5872} {"train_loss": -27.04827880859375, "global_step": 487456, "epoch": 5872} {"train_loss": -27.20172691345215, "global_step": 487457, "epoch": 5872} {"train_loss": -26.467829531933887, "global_step": 487458, "epoch": 5872, "val_loss": 6461788.0} {"train_loss": -26.210676193237305, "global_step": 487459, "epoch": 5873} {"train_loss": -26.91301918029785, "global_step": 487460, "epoch": 5873} {"train_loss": -25.993457794189453, "global_step": 487461, "epoch": 5873} {"train_loss": -26.89436912536621, "global_step": 487462, "epoch": 5873} {"train_loss": -26.24875831604004, "global_step": 487463, "epoch": 5873} {"train_loss": -26.714513778686523, "global_step": 487464, "epoch": 5873} {"train_loss": -26.85086441040039, "global_step": 487465, "epoch": 5873} {"train_loss": -26.571813583374023, "global_step": 487466, "epoch": 5873} {"train_loss": -27.29140281677246, "global_step": 487467, "epoch": 5873} {"train_loss": -27.106231689453125, "global_step": 487468, "epoch": 5873} {"train_loss": -26.793981552124023, "global_step": 487469, "epoch": 5873} {"train_loss": -26.838714599609375, "global_step": 487470, "epoch": 5873} {"train_loss": -27.046955108642578, "global_step": 487471, "epoch": 5873} {"train_loss": -26.979846954345703, "global_step": 487472, "epoch": 5873} {"train_loss": -26.475133895874023, "global_step": 487473, "epoch": 5873} {"train_loss": -27.056018829345703, "global_step": 487474, "epoch": 5873} {"train_loss": -27.045080184936523, "global_step": 487475, "epoch": 5873} {"train_loss": -26.877710342407227, "global_step": 487476, "epoch": 5873} {"train_loss": -27.332883834838867, "global_step": 487477, "epoch": 5873} {"train_loss": -27.158414840698242, "global_step": 487478, "epoch": 5873} {"train_loss": -27.2374267578125, "global_step": 487479, "epoch": 5873} {"train_loss": -27.13370704650879, "global_step": 487480, "epoch": 5873} {"train_loss": -27.38138198852539, "global_step": 487481, "epoch": 5873} {"train_loss": -27.355255126953125, "global_step": 487482, "epoch": 5873} {"train_loss": -27.36475944519043, "global_step": 487483, "epoch": 5873} {"train_loss": -27.49442481994629, "global_step": 487484, "epoch": 5873} {"train_loss": -27.45440673828125, "global_step": 487485, "epoch": 5873} {"train_loss": -27.27225685119629, "global_step": 487486, "epoch": 5873} {"train_loss": -27.224653244018555, "global_step": 487487, "epoch": 5873} {"train_loss": -27.471593856811523, "global_step": 487488, "epoch": 5873} {"train_loss": -26.843976974487305, "global_step": 487489, "epoch": 5873} {"train_loss": -27.274587631225586, "global_step": 487490, "epoch": 5873} {"train_loss": -27.473371505737305, "global_step": 487491, "epoch": 5873} {"train_loss": -27.36297607421875, "global_step": 487492, "epoch": 5873} {"train_loss": -27.39508628845215, "global_step": 487493, "epoch": 5873} {"train_loss": -27.404504776000977, "global_step": 487494, "epoch": 5873} {"train_loss": -27.15981101989746, "global_step": 487495, "epoch": 5873} {"train_loss": -27.20960807800293, "global_step": 487496, "epoch": 5873} {"train_loss": -27.49506187438965, "global_step": 487497, "epoch": 5873} {"train_loss": -27.2871036529541, "global_step": 487498, "epoch": 5873} {"train_loss": -27.464008331298828, "global_step": 487499, "epoch": 5873} {"train_loss": -27.34687614440918, "global_step": 487500, "epoch": 5873} {"train_loss": -27.570709228515625, "global_step": 487501, "epoch": 5873} {"train_loss": -27.474340438842773, "global_step": 487502, "epoch": 5873} {"train_loss": -27.709564208984375, "global_step": 487503, "epoch": 5873} {"train_loss": -27.40802574157715, "global_step": 487504, "epoch": 5873} {"train_loss": -27.337387084960938, "global_step": 487505, "epoch": 5873} {"train_loss": -27.106374740600586, "global_step": 487506, "epoch": 5873} {"train_loss": -27.39532470703125, "global_step": 487507, "epoch": 5873} {"train_loss": -27.533416748046875, "global_step": 487508, "epoch": 5873} {"train_loss": -27.47859001159668, "global_step": 487509, "epoch": 5873} {"train_loss": -27.163476943969727, "global_step": 487510, "epoch": 5873} {"train_loss": -27.33942222595215, "global_step": 487511, "epoch": 5873} {"train_loss": -27.556482315063477, "global_step": 487512, "epoch": 5873} {"train_loss": -27.568572998046875, "global_step": 487513, "epoch": 5873} {"train_loss": -27.636157989501953, "global_step": 487514, "epoch": 5873} {"train_loss": -27.599294662475586, "global_step": 487515, "epoch": 5873} {"train_loss": -27.69537925720215, "global_step": 487516, "epoch": 5873} {"train_loss": -27.755023956298828, "global_step": 487517, "epoch": 5873} {"train_loss": -27.441343307495117, "global_step": 487518, "epoch": 5873} {"train_loss": -27.831485748291016, "global_step": 487519, "epoch": 5873} {"train_loss": -27.4554386138916, "global_step": 487520, "epoch": 5873} {"train_loss": -27.68719482421875, "global_step": 487521, "epoch": 5873} {"train_loss": -27.518049240112305, "global_step": 487522, "epoch": 5873} {"train_loss": -27.47138786315918, "global_step": 487523, "epoch": 5873} {"train_loss": -27.668249130249023, "global_step": 487524, "epoch": 5873} {"train_loss": -27.85474967956543, "global_step": 487525, "epoch": 5873} {"train_loss": -27.53358268737793, "global_step": 487526, "epoch": 5873} {"train_loss": -27.44111442565918, "global_step": 487527, "epoch": 5873} {"train_loss": -27.528095245361328, "global_step": 487528, "epoch": 5873} {"train_loss": -27.516651153564453, "global_step": 487529, "epoch": 5873} {"train_loss": -27.132619857788086, "global_step": 487530, "epoch": 5873} {"train_loss": -27.447423934936523, "global_step": 487531, "epoch": 5873} {"train_loss": -27.21262550354004, "global_step": 487532, "epoch": 5873} {"train_loss": -27.277257919311523, "global_step": 487533, "epoch": 5873} {"train_loss": -27.34026527404785, "global_step": 487534, "epoch": 5873} {"train_loss": -26.87257194519043, "global_step": 487535, "epoch": 5873} {"train_loss": -27.256885528564453, "global_step": 487536, "epoch": 5873} {"train_loss": -26.632720947265625, "global_step": 487537, "epoch": 5873} {"train_loss": -27.21999168395996, "global_step": 487538, "epoch": 5873} {"train_loss": -27.1041316986084, "global_step": 487539, "epoch": 5873} {"train_loss": -27.17890739440918, "global_step": 487540, "epoch": 5873} {"train_loss": -27.255862753075288, "global_step": 487541, "epoch": 5873, "val_loss": 6541787.0} {"train_loss": -26.603912353515625, "global_step": 487542, "epoch": 5874} {"train_loss": -26.109899520874023, "global_step": 487543, "epoch": 5874} {"train_loss": -25.933195114135742, "global_step": 487544, "epoch": 5874} {"train_loss": -25.560382843017578, "global_step": 487545, "epoch": 5874} {"train_loss": -26.959918975830078, "global_step": 487546, "epoch": 5874} {"train_loss": -26.443683624267578, "global_step": 487547, "epoch": 5874} {"train_loss": -26.57393455505371, "global_step": 487548, "epoch": 5874} {"train_loss": -26.745532989501953, "global_step": 487549, "epoch": 5874} {"train_loss": -25.97983741760254, "global_step": 487550, "epoch": 5874} {"train_loss": -26.81072425842285, "global_step": 487551, "epoch": 5874} {"train_loss": -26.117902755737305, "global_step": 487552, "epoch": 5874} {"train_loss": -26.502782821655273, "global_step": 487553, "epoch": 5874} {"train_loss": -26.807861328125, "global_step": 487554, "epoch": 5874} {"train_loss": -26.60773277282715, "global_step": 487555, "epoch": 5874} {"train_loss": -26.432159423828125, "global_step": 487556, "epoch": 5874} {"train_loss": -26.951093673706055, "global_step": 487557, "epoch": 5874} {"train_loss": -26.903207778930664, "global_step": 487558, "epoch": 5874} {"train_loss": -26.868183135986328, "global_step": 487559, "epoch": 5874} {"train_loss": -26.91739273071289, "global_step": 487560, "epoch": 5874} {"train_loss": -26.98193359375, "global_step": 487561, "epoch": 5874} {"train_loss": -27.201740264892578, "global_step": 487562, "epoch": 5874} {"train_loss": -26.678983688354492, "global_step": 487563, "epoch": 5874} {"train_loss": -26.759567260742188, "global_step": 487564, "epoch": 5874} {"train_loss": -27.243610382080078, "global_step": 487565, "epoch": 5874} {"train_loss": -27.032968521118164, "global_step": 487566, "epoch": 5874} {"train_loss": -27.022876739501953, "global_step": 487567, "epoch": 5874} {"train_loss": -27.133466720581055, "global_step": 487568, "epoch": 5874} {"train_loss": -27.35584831237793, "global_step": 487569, "epoch": 5874} {"train_loss": -27.20432472229004, "global_step": 487570, "epoch": 5874} {"train_loss": -26.871002197265625, "global_step": 487571, "epoch": 5874} {"train_loss": -27.419076919555664, "global_step": 487572, "epoch": 5874} {"train_loss": -27.098773956298828, "global_step": 487573, "epoch": 5874} {"train_loss": -27.655447006225586, "global_step": 487574, "epoch": 5874} {"train_loss": -27.077600479125977, "global_step": 487575, "epoch": 5874} {"train_loss": -27.52115249633789, "global_step": 487576, "epoch": 5874} {"train_loss": -27.463354110717773, "global_step": 487577, "epoch": 5874} {"train_loss": -27.331893920898438, "global_step": 487578, "epoch": 5874} {"train_loss": -27.327810287475586, "global_step": 487579, "epoch": 5874} {"train_loss": -27.41534996032715, "global_step": 487580, "epoch": 5874} {"train_loss": -27.4576416015625, "global_step": 487581, "epoch": 5874} {"train_loss": -27.398893356323242, "global_step": 487582, "epoch": 5874} {"train_loss": -27.492034912109375, "global_step": 487583, "epoch": 5874} {"train_loss": -27.198017120361328, "global_step": 487584, "epoch": 5874} {"train_loss": -27.434839248657227, "global_step": 487585, "epoch": 5874} {"train_loss": -27.679370880126953, "global_step": 487586, "epoch": 5874} {"train_loss": -27.335691452026367, "global_step": 487587, "epoch": 5874} {"train_loss": -27.297382354736328, "global_step": 487588, "epoch": 5874} {"train_loss": -27.017871856689453, "global_step": 487589, "epoch": 5874} {"train_loss": -27.344343185424805, "global_step": 487590, "epoch": 5874} {"train_loss": -27.3898868560791, "global_step": 487591, "epoch": 5874} {"train_loss": -27.6219539642334, "global_step": 487592, "epoch": 5874} {"train_loss": -27.298492431640625, "global_step": 487593, "epoch": 5874} {"train_loss": -27.123779296875, "global_step": 487594, "epoch": 5874} {"train_loss": -27.418481826782227, "global_step": 487595, "epoch": 5874} {"train_loss": -27.330121994018555, "global_step": 487596, "epoch": 5874} {"train_loss": -27.70570182800293, "global_step": 487597, "epoch": 5874} {"train_loss": -27.431241989135742, "global_step": 487598, "epoch": 5874} {"train_loss": -27.111520767211914, "global_step": 487599, "epoch": 5874} {"train_loss": -27.421955108642578, "global_step": 487600, "epoch": 5874} {"train_loss": -27.245832443237305, "global_step": 487601, "epoch": 5874} {"train_loss": -27.317447662353516, "global_step": 487602, "epoch": 5874} {"train_loss": -27.3021240234375, "global_step": 487603, "epoch": 5874} {"train_loss": -27.219390869140625, "global_step": 487604, "epoch": 5874} {"train_loss": -26.83785057067871, "global_step": 487605, "epoch": 5874} {"train_loss": -27.3132381439209, "global_step": 487606, "epoch": 5874} {"train_loss": -27.42439079284668, "global_step": 487607, "epoch": 5874} {"train_loss": -27.153162002563477, "global_step": 487608, "epoch": 5874} {"train_loss": -26.79387855529785, "global_step": 487609, "epoch": 5874} {"train_loss": -27.763614654541016, "global_step": 487610, "epoch": 5874} {"train_loss": -26.895837783813477, "global_step": 487611, "epoch": 5874} {"train_loss": -26.9420108795166, "global_step": 487612, "epoch": 5874} {"train_loss": -27.71725845336914, "global_step": 487613, "epoch": 5874} {"train_loss": -26.954675674438477, "global_step": 487614, "epoch": 5874} {"train_loss": -27.14051628112793, "global_step": 487615, "epoch": 5874} {"train_loss": -27.197729110717773, "global_step": 487616, "epoch": 5874} {"train_loss": -27.256677627563477, "global_step": 487617, "epoch": 5874} {"train_loss": -27.43971061706543, "global_step": 487618, "epoch": 5874} {"train_loss": -27.629850387573242, "global_step": 487619, "epoch": 5874} {"train_loss": -27.159515380859375, "global_step": 487620, "epoch": 5874} {"train_loss": -27.35220718383789, "global_step": 487621, "epoch": 5874} {"train_loss": -27.4565372467041, "global_step": 487622, "epoch": 5874} {"train_loss": -27.387487411499023, "global_step": 487623, "epoch": 5874} {"train_loss": -27.095468590058477, "global_step": 487624, "epoch": 5874, "val_loss": 6498866.0} {"train_loss": -26.25372886657715, "global_step": 487625, "epoch": 5875} {"train_loss": -26.432682037353516, "global_step": 487626, "epoch": 5875} {"train_loss": -25.696674346923828, "global_step": 487627, "epoch": 5875} {"train_loss": -26.89204216003418, "global_step": 487628, "epoch": 5875} {"train_loss": -25.908361434936523, "global_step": 487629, "epoch": 5875} {"train_loss": -26.6769962310791, "global_step": 487630, "epoch": 5875} {"train_loss": -26.171127319335938, "global_step": 487631, "epoch": 5875} {"train_loss": -26.832380294799805, "global_step": 487632, "epoch": 5875} {"train_loss": -26.524276733398438, "global_step": 487633, "epoch": 5875} {"train_loss": -27.2515926361084, "global_step": 487634, "epoch": 5875} {"train_loss": -26.920522689819336, "global_step": 487635, "epoch": 5875} {"train_loss": -27.093957901000977, "global_step": 487636, "epoch": 5875} {"train_loss": -27.241750717163086, "global_step": 487637, "epoch": 5875} {"train_loss": -26.908849716186523, "global_step": 487638, "epoch": 5875} {"train_loss": -26.79142189025879, "global_step": 487639, "epoch": 5875} {"train_loss": -26.825698852539062, "global_step": 487640, "epoch": 5875} {"train_loss": -26.92396354675293, "global_step": 487641, "epoch": 5875} {"train_loss": -27.251270294189453, "global_step": 487642, "epoch": 5875} {"train_loss": -26.666950225830078, "global_step": 487643, "epoch": 5875} {"train_loss": -26.97021484375, "global_step": 487644, "epoch": 5875} {"train_loss": -26.76910972595215, "global_step": 487645, "epoch": 5875} {"train_loss": -27.184818267822266, "global_step": 487646, "epoch": 5875} {"train_loss": -27.21209144592285, "global_step": 487647, "epoch": 5875} {"train_loss": -26.91094398498535, "global_step": 487648, "epoch": 5875} {"train_loss": -27.32008171081543, "global_step": 487649, "epoch": 5875} {"train_loss": -27.321136474609375, "global_step": 487650, "epoch": 5875} {"train_loss": -27.138906478881836, "global_step": 487651, "epoch": 5875} {"train_loss": -27.059890747070312, "global_step": 487652, "epoch": 5875} {"train_loss": -27.109302520751953, "global_step": 487653, "epoch": 5875} {"train_loss": -27.15717124938965, "global_step": 487654, "epoch": 5875} {"train_loss": -27.852649688720703, "global_step": 487655, "epoch": 5875} {"train_loss": -27.095930099487305, "global_step": 487656, "epoch": 5875} {"train_loss": -27.15374755859375, "global_step": 487657, "epoch": 5875} {"train_loss": -27.216581344604492, "global_step": 487658, "epoch": 5875} {"train_loss": -27.889301300048828, "global_step": 487659, "epoch": 5875} {"train_loss": -27.360855102539062, "global_step": 487660, "epoch": 5875} {"train_loss": -27.522354125976562, "global_step": 487661, "epoch": 5875} {"train_loss": -27.058740615844727, "global_step": 487662, "epoch": 5875} {"train_loss": -27.581079483032227, "global_step": 487663, "epoch": 5875} {"train_loss": -27.589994430541992, "global_step": 487664, "epoch": 5875} {"train_loss": -27.469648361206055, "global_step": 487665, "epoch": 5875} {"train_loss": -27.67502784729004, "global_step": 487666, "epoch": 5875} {"train_loss": -27.203998565673828, "global_step": 487667, "epoch": 5875} {"train_loss": -27.0489501953125, "global_step": 487668, "epoch": 5875} {"train_loss": -27.22943115234375, "global_step": 487669, "epoch": 5875} {"train_loss": -27.424795150756836, "global_step": 487670, "epoch": 5875} {"train_loss": -27.40457534790039, "global_step": 487671, "epoch": 5875} {"train_loss": -27.461606979370117, "global_step": 487672, "epoch": 5875} {"train_loss": -27.47340202331543, "global_step": 487673, "epoch": 5875} {"train_loss": -27.52895164489746, "global_step": 487674, "epoch": 5875} {"train_loss": -27.40095329284668, "global_step": 487675, "epoch": 5875} {"train_loss": -27.375715255737305, "global_step": 487676, "epoch": 5875} {"train_loss": -27.566791534423828, "global_step": 487677, "epoch": 5875} {"train_loss": -27.82144546508789, "global_step": 487678, "epoch": 5875} {"train_loss": -27.75697898864746, "global_step": 487679, "epoch": 5875} {"train_loss": -27.614486694335938, "global_step": 487680, "epoch": 5875} {"train_loss": -27.5668888092041, "global_step": 487681, "epoch": 5875} {"train_loss": -27.30561637878418, "global_step": 487682, "epoch": 5875} {"train_loss": -27.731725692749023, "global_step": 487683, "epoch": 5875} {"train_loss": -27.44867515563965, "global_step": 487684, "epoch": 5875} {"train_loss": -27.352643966674805, "global_step": 487685, "epoch": 5875} {"train_loss": -27.42872428894043, "global_step": 487686, "epoch": 5875} {"train_loss": -27.536605834960938, "global_step": 487687, "epoch": 5875} {"train_loss": -27.173572540283203, "global_step": 487688, "epoch": 5875} {"train_loss": -27.7882080078125, "global_step": 487689, "epoch": 5875} {"train_loss": -27.626535415649414, "global_step": 487690, "epoch": 5875} {"train_loss": -26.83941078186035, "global_step": 487691, "epoch": 5875} {"train_loss": -27.00140953063965, "global_step": 487692, "epoch": 5875} {"train_loss": -26.989593505859375, "global_step": 487693, "epoch": 5875} {"train_loss": -27.317291259765625, "global_step": 487694, "epoch": 5875} {"train_loss": -26.859882354736328, "global_step": 487695, "epoch": 5875} {"train_loss": -26.844512939453125, "global_step": 487696, "epoch": 5875} {"train_loss": -27.332616806030273, "global_step": 487697, "epoch": 5875} {"train_loss": -27.269683837890625, "global_step": 487698, "epoch": 5875} {"train_loss": -27.379901885986328, "global_step": 487699, "epoch": 5875} {"train_loss": -27.449941635131836, "global_step": 487700, "epoch": 5875} {"train_loss": -27.59977149963379, "global_step": 487701, "epoch": 5875} {"train_loss": -27.228351593017578, "global_step": 487702, "epoch": 5875} {"train_loss": -27.609683990478516, "global_step": 487703, "epoch": 5875} {"train_loss": -27.145715713500977, "global_step": 487704, "epoch": 5875} {"train_loss": -27.328323364257812, "global_step": 487705, "epoch": 5875} {"train_loss": -27.22688102722168, "global_step": 487706, "epoch": 5875} {"train_loss": -27.203603606626213, "global_step": 487707, "epoch": 5875, "val_loss": 6566880.0} {"train_loss": -26.556549072265625, "global_step": 487708, "epoch": 5876} {"train_loss": -25.96225929260254, "global_step": 487709, "epoch": 5876} {"train_loss": -26.794225692749023, "global_step": 487710, "epoch": 5876} {"train_loss": -26.63416862487793, "global_step": 487711, "epoch": 5876} {"train_loss": -26.75288200378418, "global_step": 487712, "epoch": 5876} {"train_loss": -26.851709365844727, "global_step": 487713, "epoch": 5876} {"train_loss": -27.12359046936035, "global_step": 487714, "epoch": 5876} {"train_loss": -26.95002555847168, "global_step": 487715, "epoch": 5876} {"train_loss": -26.922943115234375, "global_step": 487716, "epoch": 5876} {"train_loss": -26.919586181640625, "global_step": 487717, "epoch": 5876} {"train_loss": -27.021533966064453, "global_step": 487718, "epoch": 5876} {"train_loss": -27.115066528320312, "global_step": 487719, "epoch": 5876} {"train_loss": -26.9926815032959, "global_step": 487720, "epoch": 5876} {"train_loss": -27.002790451049805, "global_step": 487721, "epoch": 5876} {"train_loss": -27.047697067260742, "global_step": 487722, "epoch": 5876} {"train_loss": -27.19074821472168, "global_step": 487723, "epoch": 5876} {"train_loss": -27.390777587890625, "global_step": 487724, "epoch": 5876} {"train_loss": -26.841367721557617, "global_step": 487725, "epoch": 5876} {"train_loss": -27.366552352905273, "global_step": 487726, "epoch": 5876} {"train_loss": -27.18158531188965, "global_step": 487727, "epoch": 5876} {"train_loss": -27.297536849975586, "global_step": 487728, "epoch": 5876} {"train_loss": -27.58097267150879, "global_step": 487729, "epoch": 5876} {"train_loss": -27.108015060424805, "global_step": 487730, "epoch": 5876} {"train_loss": -27.142929077148438, "global_step": 487731, "epoch": 5876} {"train_loss": -27.18427848815918, "global_step": 487732, "epoch": 5876} {"train_loss": -27.44549560546875, "global_step": 487733, "epoch": 5876} {"train_loss": -26.969831466674805, "global_step": 487734, "epoch": 5876} {"train_loss": -26.990087509155273, "global_step": 487735, "epoch": 5876} {"train_loss": -27.083454132080078, "global_step": 487736, "epoch": 5876} {"train_loss": -27.5056209564209, "global_step": 487737, "epoch": 5876} {"train_loss": -27.378192901611328, "global_step": 487738, "epoch": 5876} {"train_loss": -26.89154624938965, "global_step": 487739, "epoch": 5876} {"train_loss": -27.67017936706543, "global_step": 487740, "epoch": 5876} {"train_loss": -27.239898681640625, "global_step": 487741, "epoch": 5876} {"train_loss": -27.3427677154541, "global_step": 487742, "epoch": 5876} {"train_loss": -27.660459518432617, "global_step": 487743, "epoch": 5876} {"train_loss": -27.321197509765625, "global_step": 487744, "epoch": 5876} {"train_loss": -27.464643478393555, "global_step": 487745, "epoch": 5876} {"train_loss": -26.820804595947266, "global_step": 487746, "epoch": 5876} {"train_loss": -27.1987247467041, "global_step": 487747, "epoch": 5876} {"train_loss": -27.366561889648438, "global_step": 487748, "epoch": 5876} {"train_loss": -27.184406280517578, "global_step": 487749, "epoch": 5876} {"train_loss": -27.1645450592041, "global_step": 487750, "epoch": 5876} {"train_loss": -27.221866607666016, "global_step": 487751, "epoch": 5876} {"train_loss": -27.318084716796875, "global_step": 487752, "epoch": 5876} {"train_loss": -27.124252319335938, "global_step": 487753, "epoch": 5876} {"train_loss": -27.37883949279785, "global_step": 487754, "epoch": 5876} {"train_loss": -27.65348243713379, "global_step": 487755, "epoch": 5876} {"train_loss": -27.336902618408203, "global_step": 487756, "epoch": 5876} {"train_loss": -27.440820693969727, "global_step": 487757, "epoch": 5876} {"train_loss": -27.103376388549805, "global_step": 487758, "epoch": 5876} {"train_loss": -26.7639217376709, "global_step": 487759, "epoch": 5876} {"train_loss": -27.527719497680664, "global_step": 487760, "epoch": 5876} {"train_loss": -27.15748405456543, "global_step": 487761, "epoch": 5876} {"train_loss": -26.986547470092773, "global_step": 487762, "epoch": 5876} {"train_loss": -27.21023941040039, "global_step": 487763, "epoch": 5876} {"train_loss": -27.2686767578125, "global_step": 487764, "epoch": 5876} {"train_loss": -27.154699325561523, "global_step": 487765, "epoch": 5876} {"train_loss": -27.340991973876953, "global_step": 487766, "epoch": 5876} {"train_loss": -27.03729248046875, "global_step": 487767, "epoch": 5876} {"train_loss": -27.277990341186523, "global_step": 487768, "epoch": 5876} {"train_loss": -27.26194190979004, "global_step": 487769, "epoch": 5876} {"train_loss": -26.91956901550293, "global_step": 487770, "epoch": 5876} {"train_loss": -26.302947998046875, "global_step": 487771, "epoch": 5876} {"train_loss": -26.78031349182129, "global_step": 487772, "epoch": 5876} {"train_loss": -27.2980899810791, "global_step": 487773, "epoch": 5876} {"train_loss": -27.144468307495117, "global_step": 487774, "epoch": 5876} {"train_loss": -27.01422691345215, "global_step": 487775, "epoch": 5876} {"train_loss": -27.7669677734375, "global_step": 487776, "epoch": 5876} {"train_loss": -27.418283462524414, "global_step": 487777, "epoch": 5876} {"train_loss": -27.200580596923828, "global_step": 487778, "epoch": 5876} {"train_loss": -27.612585067749023, "global_step": 487779, "epoch": 5876} {"train_loss": -27.552148818969727, "global_step": 487780, "epoch": 5876} {"train_loss": -27.515317916870117, "global_step": 487781, "epoch": 5876} {"train_loss": -27.260000228881836, "global_step": 487782, "epoch": 5876} {"train_loss": -27.462268829345703, "global_step": 487783, "epoch": 5876} {"train_loss": -27.230234146118164, "global_step": 487784, "epoch": 5876} {"train_loss": -26.931507110595703, "global_step": 487785, "epoch": 5876} {"train_loss": -27.431415557861328, "global_step": 487786, "epoch": 5876} {"train_loss": -27.787805557250977, "global_step": 487787, "epoch": 5876} {"train_loss": -27.520151138305664, "global_step": 487788, "epoch": 5876} {"train_loss": -27.38203239440918, "global_step": 487789, "epoch": 5876} {"train_loss": -27.188891583178417, "global_step": 487790, "epoch": 5876, "val_loss": 6580270.5} {"train_loss": -26.887619018554688, "global_step": 487791, "epoch": 5877} {"train_loss": -26.81971549987793, "global_step": 487792, "epoch": 5877} {"train_loss": -27.12237548828125, "global_step": 487793, "epoch": 5877} {"train_loss": -26.948068618774414, "global_step": 487794, "epoch": 5877} {"train_loss": -26.97248649597168, "global_step": 487795, "epoch": 5877} {"train_loss": -26.676538467407227, "global_step": 487796, "epoch": 5877} {"train_loss": -27.497577667236328, "global_step": 487797, "epoch": 5877} {"train_loss": -27.667984008789062, "global_step": 487798, "epoch": 5877} {"train_loss": -27.554487228393555, "global_step": 487799, "epoch": 5877} {"train_loss": -27.226221084594727, "global_step": 487800, "epoch": 5877} {"train_loss": -27.310266494750977, "global_step": 487801, "epoch": 5877} {"train_loss": -27.48585319519043, "global_step": 487802, "epoch": 5877} {"train_loss": -27.209394454956055, "global_step": 487803, "epoch": 5877} {"train_loss": -27.617834091186523, "global_step": 487804, "epoch": 5877} {"train_loss": -27.671173095703125, "global_step": 487805, "epoch": 5877} {"train_loss": -27.261077880859375, "global_step": 487806, "epoch": 5877} {"train_loss": -27.784286499023438, "global_step": 487807, "epoch": 5877} {"train_loss": -27.333402633666992, "global_step": 487808, "epoch": 5877} {"train_loss": -27.075286865234375, "global_step": 487809, "epoch": 5877} {"train_loss": -27.451251983642578, "global_step": 487810, "epoch": 5877} {"train_loss": -27.35194206237793, "global_step": 487811, "epoch": 5877} {"train_loss": -27.47444725036621, "global_step": 487812, "epoch": 5877} {"train_loss": -27.199331283569336, "global_step": 487813, "epoch": 5877} {"train_loss": -27.68219566345215, "global_step": 487814, "epoch": 5877} {"train_loss": -27.655988693237305, "global_step": 487815, "epoch": 5877} {"train_loss": -27.44141960144043, "global_step": 487816, "epoch": 5877} {"train_loss": -27.44693374633789, "global_step": 487817, "epoch": 5877} {"train_loss": -27.098957061767578, "global_step": 487818, "epoch": 5877} {"train_loss": -27.20575523376465, "global_step": 487819, "epoch": 5877} {"train_loss": -27.58624839782715, "global_step": 487820, "epoch": 5877} {"train_loss": -27.495412826538086, "global_step": 487821, "epoch": 5877} {"train_loss": -27.792255401611328, "global_step": 487822, "epoch": 5877} {"train_loss": -27.566308975219727, "global_step": 487823, "epoch": 5877} {"train_loss": -26.925809860229492, "global_step": 487824, "epoch": 5877} {"train_loss": -27.172693252563477, "global_step": 487825, "epoch": 5877} {"train_loss": -26.797895431518555, "global_step": 487826, "epoch": 5877} {"train_loss": -27.7880802154541, "global_step": 487827, "epoch": 5877} {"train_loss": -27.53639030456543, "global_step": 487828, "epoch": 5877} {"train_loss": -27.25306510925293, "global_step": 487829, "epoch": 5877} {"train_loss": -27.417638778686523, "global_step": 487830, "epoch": 5877} {"train_loss": -27.503070831298828, "global_step": 487831, "epoch": 5877} {"train_loss": -27.615558624267578, "global_step": 487832, "epoch": 5877} {"train_loss": -27.303913116455078, "global_step": 487833, "epoch": 5877} {"train_loss": -27.310394287109375, "global_step": 487834, "epoch": 5877} {"train_loss": -27.34023094177246, "global_step": 487835, "epoch": 5877} {"train_loss": -27.690521240234375, "global_step": 487836, "epoch": 5877} {"train_loss": -27.521686553955078, "global_step": 487837, "epoch": 5877} {"train_loss": -27.558277130126953, "global_step": 487838, "epoch": 5877} {"train_loss": -27.221914291381836, "global_step": 487839, "epoch": 5877} {"train_loss": -27.510717391967773, "global_step": 487840, "epoch": 5877} {"train_loss": -27.241565704345703, "global_step": 487841, "epoch": 5877} {"train_loss": -27.515588760375977, "global_step": 487842, "epoch": 5877} {"train_loss": -26.843734741210938, "global_step": 487843, "epoch": 5877} {"train_loss": -26.861295700073242, "global_step": 487844, "epoch": 5877} {"train_loss": -27.48842430114746, "global_step": 487845, "epoch": 5877} {"train_loss": -27.224655151367188, "global_step": 487846, "epoch": 5877} {"train_loss": -27.090513229370117, "global_step": 487847, "epoch": 5877} {"train_loss": -27.11040687561035, "global_step": 487848, "epoch": 5877} {"train_loss": -27.177078247070312, "global_step": 487849, "epoch": 5877} {"train_loss": -27.616565704345703, "global_step": 487850, "epoch": 5877} {"train_loss": -27.458789825439453, "global_step": 487851, "epoch": 5877} {"train_loss": -27.2947998046875, "global_step": 487852, "epoch": 5877} {"train_loss": -27.240934371948242, "global_step": 487853, "epoch": 5877} {"train_loss": -27.213272094726562, "global_step": 487854, "epoch": 5877} {"train_loss": -27.306533813476562, "global_step": 487855, "epoch": 5877} {"train_loss": -27.340436935424805, "global_step": 487856, "epoch": 5877} {"train_loss": -27.440420150756836, "global_step": 487857, "epoch": 5877} {"train_loss": -27.487049102783203, "global_step": 487858, "epoch": 5877} {"train_loss": -27.67431640625, "global_step": 487859, "epoch": 5877} {"train_loss": -27.55095863342285, "global_step": 487860, "epoch": 5877} {"train_loss": -27.19868278503418, "global_step": 487861, "epoch": 5877} {"train_loss": -27.53378677368164, "global_step": 487862, "epoch": 5877} {"train_loss": -27.0841064453125, "global_step": 487863, "epoch": 5877} {"train_loss": -27.56194496154785, "global_step": 487864, "epoch": 5877} {"train_loss": -27.431167602539062, "global_step": 487865, "epoch": 5877} {"train_loss": -27.591272354125977, "global_step": 487866, "epoch": 5877} {"train_loss": -27.599287033081055, "global_step": 487867, "epoch": 5877} {"train_loss": -27.381153106689453, "global_step": 487868, "epoch": 5877} {"train_loss": -27.36554527282715, "global_step": 487869, "epoch": 5877} {"train_loss": -27.388341903686523, "global_step": 487870, "epoch": 5877} {"train_loss": -27.616470336914062, "global_step": 487871, "epoch": 5877} {"train_loss": -27.385501861572266, "global_step": 487872, "epoch": 5877} {"train_loss": -27.35330565578966, "global_step": 487873, "epoch": 5877, "val_loss": 6614855.5} {"train_loss": -26.738601684570312, "global_step": 487874, "epoch": 5878} {"train_loss": -26.926401138305664, "global_step": 487875, "epoch": 5878} {"train_loss": -27.0095157623291, "global_step": 487876, "epoch": 5878} {"train_loss": -27.262983322143555, "global_step": 487877, "epoch": 5878} {"train_loss": -27.25005531311035, "global_step": 487878, "epoch": 5878} {"train_loss": -27.170446395874023, "global_step": 487879, "epoch": 5878} {"train_loss": -27.500680923461914, "global_step": 487880, "epoch": 5878} {"train_loss": -26.74344825744629, "global_step": 487881, "epoch": 5878} {"train_loss": -27.5996036529541, "global_step": 487882, "epoch": 5878} {"train_loss": -27.26056480407715, "global_step": 487883, "epoch": 5878} {"train_loss": -27.080917358398438, "global_step": 487884, "epoch": 5878} {"train_loss": -27.396503448486328, "global_step": 487885, "epoch": 5878} {"train_loss": -26.964405059814453, "global_step": 487886, "epoch": 5878} {"train_loss": -27.077783584594727, "global_step": 487887, "epoch": 5878} {"train_loss": -26.392423629760742, "global_step": 487888, "epoch": 5878} {"train_loss": -27.484210968017578, "global_step": 487889, "epoch": 5878} {"train_loss": -27.366546630859375, "global_step": 487890, "epoch": 5878} {"train_loss": -26.699176788330078, "global_step": 487891, "epoch": 5878} {"train_loss": -27.434728622436523, "global_step": 487892, "epoch": 5878} {"train_loss": -27.141202926635742, "global_step": 487893, "epoch": 5878} {"train_loss": -27.272262573242188, "global_step": 487894, "epoch": 5878} {"train_loss": -26.661157608032227, "global_step": 487895, "epoch": 5878} {"train_loss": -27.148635864257812, "global_step": 487896, "epoch": 5878} {"train_loss": -27.1560001373291, "global_step": 487897, "epoch": 5878} {"train_loss": -27.07703971862793, "global_step": 487898, "epoch": 5878} {"train_loss": -27.205068588256836, "global_step": 487899, "epoch": 5878} {"train_loss": -27.273773193359375, "global_step": 487900, "epoch": 5878} {"train_loss": -27.38850212097168, "global_step": 487901, "epoch": 5878} {"train_loss": -27.434850692749023, "global_step": 487902, "epoch": 5878} {"train_loss": -27.30741310119629, "global_step": 487903, "epoch": 5878} {"train_loss": -27.674610137939453, "global_step": 487904, "epoch": 5878} {"train_loss": -27.3297119140625, "global_step": 487905, "epoch": 5878} {"train_loss": -26.78108024597168, "global_step": 487906, "epoch": 5878} {"train_loss": -27.128528594970703, "global_step": 487907, "epoch": 5878} {"train_loss": -27.418975830078125, "global_step": 487908, "epoch": 5878} {"train_loss": -27.022153854370117, "global_step": 487909, "epoch": 5878} {"train_loss": -27.4002685546875, "global_step": 487910, "epoch": 5878} {"train_loss": -27.091272354125977, "global_step": 487911, "epoch": 5878} {"train_loss": -27.168109893798828, "global_step": 487912, "epoch": 5878} {"train_loss": -27.183698654174805, "global_step": 487913, "epoch": 5878} {"train_loss": -27.084028244018555, "global_step": 487914, "epoch": 5878} {"train_loss": -27.343963623046875, "global_step": 487915, "epoch": 5878} {"train_loss": -27.369726181030273, "global_step": 487916, "epoch": 5878} {"train_loss": -27.352874755859375, "global_step": 487917, "epoch": 5878} {"train_loss": -27.282644271850586, "global_step": 487918, "epoch": 5878} {"train_loss": -27.289533615112305, "global_step": 487919, "epoch": 5878} {"train_loss": -27.390966415405273, "global_step": 487920, "epoch": 5878} {"train_loss": -27.664316177368164, "global_step": 487921, "epoch": 5878} {"train_loss": -27.539997100830078, "global_step": 487922, "epoch": 5878} {"train_loss": -27.622167587280273, "global_step": 487923, "epoch": 5878} {"train_loss": -27.319076538085938, "global_step": 487924, "epoch": 5878} {"train_loss": -27.26043701171875, "global_step": 487925, "epoch": 5878} {"train_loss": -27.150665283203125, "global_step": 487926, "epoch": 5878} {"train_loss": -27.30921745300293, "global_step": 487927, "epoch": 5878} {"train_loss": -27.18010902404785, "global_step": 487928, "epoch": 5878} {"train_loss": -27.874313354492188, "global_step": 487929, "epoch": 5878} {"train_loss": -27.49879264831543, "global_step": 487930, "epoch": 5878} {"train_loss": -27.371015548706055, "global_step": 487931, "epoch": 5878} {"train_loss": -27.79245948791504, "global_step": 487932, "epoch": 5878} {"train_loss": -27.614538192749023, "global_step": 487933, "epoch": 5878} {"train_loss": -26.975244522094727, "global_step": 487934, "epoch": 5878} {"train_loss": -27.11625099182129, "global_step": 487935, "epoch": 5878} {"train_loss": -27.30611228942871, "global_step": 487936, "epoch": 5878} {"train_loss": -27.846832275390625, "global_step": 487937, "epoch": 5878} {"train_loss": -27.742141723632812, "global_step": 487938, "epoch": 5878} {"train_loss": -27.5181884765625, "global_step": 487939, "epoch": 5878} {"train_loss": -27.503080368041992, "global_step": 487940, "epoch": 5878} {"train_loss": -26.92856788635254, "global_step": 487941, "epoch": 5878} {"train_loss": -27.34186363220215, "global_step": 487942, "epoch": 5878} {"train_loss": -26.868932723999023, "global_step": 487943, "epoch": 5878} {"train_loss": -26.881540298461914, "global_step": 487944, "epoch": 5878} {"train_loss": -26.678586959838867, "global_step": 487945, "epoch": 5878} {"train_loss": -26.358505249023438, "global_step": 487946, "epoch": 5878} {"train_loss": -25.746417999267578, "global_step": 487947, "epoch": 5878} {"train_loss": -26.28608512878418, "global_step": 487948, "epoch": 5878} {"train_loss": -27.044981002807617, "global_step": 487949, "epoch": 5878} {"train_loss": -26.81756591796875, "global_step": 487950, "epoch": 5878} {"train_loss": -26.806640625, "global_step": 487951, "epoch": 5878} {"train_loss": -26.9068603515625, "global_step": 487952, "epoch": 5878} {"train_loss": -26.147628784179688, "global_step": 487953, "epoch": 5878} {"train_loss": -26.907323837280273, "global_step": 487954, "epoch": 5878} {"train_loss": -27.02585792541504, "global_step": 487955, "epoch": 5878} {"train_loss": -27.165630524417004, "global_step": 487956, "epoch": 5878, "val_loss": 6639535.0} {"train_loss": -25.571720123291016, "global_step": 487957, "epoch": 5879} {"train_loss": -26.74116325378418, "global_step": 487958, "epoch": 5879} {"train_loss": -25.836170196533203, "global_step": 487959, "epoch": 5879} {"train_loss": -25.95648765563965, "global_step": 487960, "epoch": 5879} {"train_loss": -26.06308364868164, "global_step": 487961, "epoch": 5879} {"train_loss": -26.386890411376953, "global_step": 487962, "epoch": 5879} {"train_loss": -26.091644287109375, "global_step": 487963, "epoch": 5879} {"train_loss": -26.373126983642578, "global_step": 487964, "epoch": 5879} {"train_loss": -26.330856323242188, "global_step": 487965, "epoch": 5879} {"train_loss": -25.593042373657227, "global_step": 487966, "epoch": 5879} {"train_loss": -26.226673126220703, "global_step": 487967, "epoch": 5879} {"train_loss": -26.75323486328125, "global_step": 487968, "epoch": 5879} {"train_loss": -26.53045654296875, "global_step": 487969, "epoch": 5879} {"train_loss": -26.758045196533203, "global_step": 487970, "epoch": 5879} {"train_loss": -26.281049728393555, "global_step": 487971, "epoch": 5879} {"train_loss": -26.65961265563965, "global_step": 487972, "epoch": 5879} {"train_loss": -26.39045524597168, "global_step": 487973, "epoch": 5879} {"train_loss": -26.295120239257812, "global_step": 487974, "epoch": 5879} {"train_loss": -26.937225341796875, "global_step": 487975, "epoch": 5879} {"train_loss": -26.91681480407715, "global_step": 487976, "epoch": 5879} {"train_loss": -26.99810218811035, "global_step": 487977, "epoch": 5879} {"train_loss": -26.59845542907715, "global_step": 487978, "epoch": 5879} {"train_loss": -26.55055046081543, "global_step": 487979, "epoch": 5879} {"train_loss": -26.805540084838867, "global_step": 487980, "epoch": 5879} {"train_loss": -26.81300163269043, "global_step": 487981, "epoch": 5879} {"train_loss": -27.039413452148438, "global_step": 487982, "epoch": 5879} {"train_loss": -26.918859481811523, "global_step": 487983, "epoch": 5879} {"train_loss": -26.59260368347168, "global_step": 487984, "epoch": 5879} {"train_loss": -27.233856201171875, "global_step": 487985, "epoch": 5879} {"train_loss": -26.78744888305664, "global_step": 487986, "epoch": 5879} {"train_loss": -26.897018432617188, "global_step": 487987, "epoch": 5879} {"train_loss": -26.8512020111084, "global_step": 487988, "epoch": 5879} {"train_loss": -27.271284103393555, "global_step": 487989, "epoch": 5879} {"train_loss": -27.09773063659668, "global_step": 487990, "epoch": 5879} {"train_loss": -27.340734481811523, "global_step": 487991, "epoch": 5879} {"train_loss": -27.44805908203125, "global_step": 487992, "epoch": 5879} {"train_loss": -27.3798828125, "global_step": 487993, "epoch": 5879} {"train_loss": -27.28693199157715, "global_step": 487994, "epoch": 5879} {"train_loss": -27.22830581665039, "global_step": 487995, "epoch": 5879} {"train_loss": -27.214874267578125, "global_step": 487996, "epoch": 5879} {"train_loss": -27.14802360534668, "global_step": 487997, "epoch": 5879} {"train_loss": -27.468244552612305, "global_step": 487998, "epoch": 5879} {"train_loss": -26.69941520690918, "global_step": 487999, "epoch": 5879} {"train_loss": -27.301803588867188, "global_step": 488000, "epoch": 5879} {"train_loss": -27.577423095703125, "global_step": 488001, "epoch": 5879} {"train_loss": -27.462635040283203, "global_step": 488002, "epoch": 5879} {"train_loss": -27.292768478393555, "global_step": 488003, "epoch": 5879} {"train_loss": -27.70168113708496, "global_step": 488004, "epoch": 5879} {"train_loss": -27.69231605529785, "global_step": 488005, "epoch": 5879} {"train_loss": -27.349145889282227, "global_step": 488006, "epoch": 5879} {"train_loss": -27.13820457458496, "global_step": 488007, "epoch": 5879} {"train_loss": -27.592802047729492, "global_step": 488008, "epoch": 5879} {"train_loss": -27.25788688659668, "global_step": 488009, "epoch": 5879} {"train_loss": -27.835845947265625, "global_step": 488010, "epoch": 5879} {"train_loss": -27.34710121154785, "global_step": 488011, "epoch": 5879} {"train_loss": -27.5574951171875, "global_step": 488012, "epoch": 5879} {"train_loss": -27.0467529296875, "global_step": 488013, "epoch": 5879} {"train_loss": -27.08795738220215, "global_step": 488014, "epoch": 5879} {"train_loss": -27.375823974609375, "global_step": 488015, "epoch": 5879} {"train_loss": -27.3040828704834, "global_step": 488016, "epoch": 5879} {"train_loss": -27.400793075561523, "global_step": 488017, "epoch": 5879} {"train_loss": -27.439905166625977, "global_step": 488018, "epoch": 5879} {"train_loss": -27.237375259399414, "global_step": 488019, "epoch": 5879} {"train_loss": -27.549428939819336, "global_step": 488020, "epoch": 5879} {"train_loss": -27.39227867126465, "global_step": 488021, "epoch": 5879} {"train_loss": -26.957983016967773, "global_step": 488022, "epoch": 5879} {"train_loss": -27.396459579467773, "global_step": 488023, "epoch": 5879} {"train_loss": -27.57630729675293, "global_step": 488024, "epoch": 5879} {"train_loss": -27.469345092773438, "global_step": 488025, "epoch": 5879} {"train_loss": -27.316015243530273, "global_step": 488026, "epoch": 5879} {"train_loss": -27.552032470703125, "global_step": 488027, "epoch": 5879} {"train_loss": -27.232059478759766, "global_step": 488028, "epoch": 5879} {"train_loss": -27.5914249420166, "global_step": 488029, "epoch": 5879} {"train_loss": -27.458295822143555, "global_step": 488030, "epoch": 5879} {"train_loss": -27.2619686126709, "global_step": 488031, "epoch": 5879} {"train_loss": -27.402942657470703, "global_step": 488032, "epoch": 5879} {"train_loss": -27.824880599975586, "global_step": 488033, "epoch": 5879} {"train_loss": -27.666528701782227, "global_step": 488034, "epoch": 5879} {"train_loss": -27.272003173828125, "global_step": 488035, "epoch": 5879} {"train_loss": -27.113433837890625, "global_step": 488036, "epoch": 5879} {"train_loss": -27.307355880737305, "global_step": 488037, "epoch": 5879} {"train_loss": -27.28411865234375, "global_step": 488038, "epoch": 5879} {"train_loss": -27.062774589262812, "global_step": 488039, "epoch": 5879, "val_loss": 6551771.0} {"train_loss": -26.815948486328125, "global_step": 488040, "epoch": 5880} {"train_loss": -27.0705623626709, "global_step": 488041, "epoch": 5880} {"train_loss": -27.25531578063965, "global_step": 488042, "epoch": 5880} {"train_loss": -26.959020614624023, "global_step": 488043, "epoch": 5880} {"train_loss": -27.24169921875, "global_step": 488044, "epoch": 5880} {"train_loss": -26.939558029174805, "global_step": 488045, "epoch": 5880} {"train_loss": -27.40673828125, "global_step": 488046, "epoch": 5880} {"train_loss": -27.129499435424805, "global_step": 488047, "epoch": 5880} {"train_loss": -27.179624557495117, "global_step": 488048, "epoch": 5880} {"train_loss": -26.72476577758789, "global_step": 488049, "epoch": 5880} {"train_loss": -27.1158447265625, "global_step": 488050, "epoch": 5880} {"train_loss": -27.033405303955078, "global_step": 488051, "epoch": 5880} {"train_loss": -27.30829429626465, "global_step": 488052, "epoch": 5880} {"train_loss": -27.305627822875977, "global_step": 488053, "epoch": 5880} {"train_loss": -27.12396812438965, "global_step": 488054, "epoch": 5880} {"train_loss": -27.25983238220215, "global_step": 488055, "epoch": 5880} {"train_loss": -27.151208877563477, "global_step": 488056, "epoch": 5880} {"train_loss": -26.777088165283203, "global_step": 488057, "epoch": 5880} {"train_loss": -26.7271671295166, "global_step": 488058, "epoch": 5880} {"train_loss": -27.111059188842773, "global_step": 488059, "epoch": 5880} {"train_loss": -27.28736686706543, "global_step": 488060, "epoch": 5880} {"train_loss": -27.1180477142334, "global_step": 488061, "epoch": 5880} {"train_loss": -27.473114013671875, "global_step": 488062, "epoch": 5880} {"train_loss": -26.81593132019043, "global_step": 488063, "epoch": 5880} {"train_loss": -26.887924194335938, "global_step": 488064, "epoch": 5880} {"train_loss": -27.336750030517578, "global_step": 488065, "epoch": 5880} {"train_loss": -27.045682907104492, "global_step": 488066, "epoch": 5880} {"train_loss": -27.4600830078125, "global_step": 488067, "epoch": 5880} {"train_loss": -27.30173683166504, "global_step": 488068, "epoch": 5880} {"train_loss": -27.142602920532227, "global_step": 488069, "epoch": 5880} {"train_loss": -27.143524169921875, "global_step": 488070, "epoch": 5880} {"train_loss": -27.45267677307129, "global_step": 488071, "epoch": 5880} {"train_loss": -27.533649444580078, "global_step": 488072, "epoch": 5880} {"train_loss": -26.71015739440918, "global_step": 488073, "epoch": 5880} {"train_loss": -27.605310440063477, "global_step": 488074, "epoch": 5880} {"train_loss": -26.7674617767334, "global_step": 488075, "epoch": 5880} {"train_loss": -27.13041114807129, "global_step": 488076, "epoch": 5880} {"train_loss": -27.462438583374023, "global_step": 488077, "epoch": 5880} {"train_loss": -26.82801628112793, "global_step": 488078, "epoch": 5880} {"train_loss": -27.45066261291504, "global_step": 488079, "epoch": 5880} {"train_loss": -27.374664306640625, "global_step": 488080, "epoch": 5880} {"train_loss": -27.346145629882812, "global_step": 488081, "epoch": 5880} {"train_loss": -27.532880783081055, "global_step": 488082, "epoch": 5880} {"train_loss": -27.213926315307617, "global_step": 488083, "epoch": 5880} {"train_loss": -27.15789222717285, "global_step": 488084, "epoch": 5880} {"train_loss": -27.358245849609375, "global_step": 488085, "epoch": 5880} {"train_loss": -27.215890884399414, "global_step": 488086, "epoch": 5880} {"train_loss": -27.467926025390625, "global_step": 488087, "epoch": 5880} {"train_loss": -27.354724884033203, "global_step": 488088, "epoch": 5880} {"train_loss": -27.122251510620117, "global_step": 488089, "epoch": 5880} {"train_loss": -27.471445083618164, "global_step": 488090, "epoch": 5880} {"train_loss": -27.120203018188477, "global_step": 488091, "epoch": 5880} {"train_loss": -27.52560806274414, "global_step": 488092, "epoch": 5880} {"train_loss": -27.279285430908203, "global_step": 488093, "epoch": 5880} {"train_loss": -27.38184928894043, "global_step": 488094, "epoch": 5880} {"train_loss": -27.643661499023438, "global_step": 488095, "epoch": 5880} {"train_loss": -27.3079833984375, "global_step": 488096, "epoch": 5880} {"train_loss": -27.196701049804688, "global_step": 488097, "epoch": 5880} {"train_loss": -27.332172393798828, "global_step": 488098, "epoch": 5880} {"train_loss": -27.39070701599121, "global_step": 488099, "epoch": 5880} {"train_loss": -27.614286422729492, "global_step": 488100, "epoch": 5880} {"train_loss": -27.289657592773438, "global_step": 488101, "epoch": 5880} {"train_loss": -27.567337036132812, "global_step": 488102, "epoch": 5880} {"train_loss": -27.4414119720459, "global_step": 488103, "epoch": 5880} {"train_loss": -27.45684242248535, "global_step": 488104, "epoch": 5880} {"train_loss": -27.031818389892578, "global_step": 488105, "epoch": 5880} {"train_loss": -27.4988956451416, "global_step": 488106, "epoch": 5880} {"train_loss": -27.641971588134766, "global_step": 488107, "epoch": 5880} {"train_loss": -27.191364288330078, "global_step": 488108, "epoch": 5880} {"train_loss": -27.318201065063477, "global_step": 488109, "epoch": 5880} {"train_loss": -27.172046661376953, "global_step": 488110, "epoch": 5880} {"train_loss": -27.65199089050293, "global_step": 488111, "epoch": 5880} {"train_loss": -27.621732711791992, "global_step": 488112, "epoch": 5880} {"train_loss": -27.252832412719727, "global_step": 488113, "epoch": 5880} {"train_loss": -27.082599639892578, "global_step": 488114, "epoch": 5880} {"train_loss": -27.277856826782227, "global_step": 488115, "epoch": 5880} {"train_loss": -27.506311416625977, "global_step": 488116, "epoch": 5880} {"train_loss": -27.038354873657227, "global_step": 488117, "epoch": 5880} {"train_loss": -27.52643394470215, "global_step": 488118, "epoch": 5880} {"train_loss": -27.301898956298828, "global_step": 488119, "epoch": 5880} {"train_loss": -27.3997859954834, "global_step": 488120, "epoch": 5880} {"train_loss": -27.387542724609375, "global_step": 488121, "epoch": 5880} {"train_loss": -27.25716678205743, "global_step": 488122, "epoch": 5880, "val_loss": 6551024.0} {"train_loss": -26.788684844970703, "global_step": 488123, "epoch": 5881} {"train_loss": -27.1286563873291, "global_step": 488124, "epoch": 5881} {"train_loss": -26.970727920532227, "global_step": 488125, "epoch": 5881} {"train_loss": -27.280914306640625, "global_step": 488126, "epoch": 5881} {"train_loss": -27.064664840698242, "global_step": 488127, "epoch": 5881} {"train_loss": -26.815420150756836, "global_step": 488128, "epoch": 5881} {"train_loss": -26.76679801940918, "global_step": 488129, "epoch": 5881} {"train_loss": -26.876245498657227, "global_step": 488130, "epoch": 5881} {"train_loss": -26.965845108032227, "global_step": 488131, "epoch": 5881} {"train_loss": -27.080488204956055, "global_step": 488132, "epoch": 5881} {"train_loss": -27.4401912689209, "global_step": 488133, "epoch": 5881} {"train_loss": -27.02442741394043, "global_step": 488134, "epoch": 5881} {"train_loss": -27.110624313354492, "global_step": 488135, "epoch": 5881} {"train_loss": -27.202045440673828, "global_step": 488136, "epoch": 5881} {"train_loss": -26.73004722595215, "global_step": 488137, "epoch": 5881} {"train_loss": -26.89291763305664, "global_step": 488138, "epoch": 5881} {"train_loss": -26.77532386779785, "global_step": 488139, "epoch": 5881} {"train_loss": -26.641555786132812, "global_step": 488140, "epoch": 5881} {"train_loss": -27.311330795288086, "global_step": 488141, "epoch": 5881} {"train_loss": -27.238372802734375, "global_step": 488142, "epoch": 5881} {"train_loss": -26.812122344970703, "global_step": 488143, "epoch": 5881} {"train_loss": -26.805185317993164, "global_step": 488144, "epoch": 5881} {"train_loss": -27.1575984954834, "global_step": 488145, "epoch": 5881} {"train_loss": -26.900714874267578, "global_step": 488146, "epoch": 5881} {"train_loss": -26.855798721313477, "global_step": 488147, "epoch": 5881} {"train_loss": -26.594375610351562, "global_step": 488148, "epoch": 5881} {"train_loss": -26.982717514038086, "global_step": 488149, "epoch": 5881} {"train_loss": -26.9554500579834, "global_step": 488150, "epoch": 5881} {"train_loss": -27.316192626953125, "global_step": 488151, "epoch": 5881} {"train_loss": -26.971851348876953, "global_step": 488152, "epoch": 5881} {"train_loss": -26.75751304626465, "global_step": 488153, "epoch": 5881} {"train_loss": -27.04998779296875, "global_step": 488154, "epoch": 5881} {"train_loss": -27.342390060424805, "global_step": 488155, "epoch": 5881} {"train_loss": -27.469263076782227, "global_step": 488156, "epoch": 5881} {"train_loss": -27.377588272094727, "global_step": 488157, "epoch": 5881} {"train_loss": -27.345617294311523, "global_step": 488158, "epoch": 5881} {"train_loss": -27.4388484954834, "global_step": 488159, "epoch": 5881} {"train_loss": -27.281904220581055, "global_step": 488160, "epoch": 5881} {"train_loss": -27.171049118041992, "global_step": 488161, "epoch": 5881} {"train_loss": -27.44189453125, "global_step": 488162, "epoch": 5881} {"train_loss": -27.135812759399414, "global_step": 488163, "epoch": 5881} {"train_loss": -27.462621688842773, "global_step": 488164, "epoch": 5881} {"train_loss": -27.291706085205078, "global_step": 488165, "epoch": 5881} {"train_loss": -27.476003646850586, "global_step": 488166, "epoch": 5881} {"train_loss": -27.478063583374023, "global_step": 488167, "epoch": 5881} {"train_loss": -27.0427188873291, "global_step": 488168, "epoch": 5881} {"train_loss": -27.09221839904785, "global_step": 488169, "epoch": 5881} {"train_loss": -27.4300479888916, "global_step": 488170, "epoch": 5881} {"train_loss": -27.19663429260254, "global_step": 488171, "epoch": 5881} {"train_loss": -27.630399703979492, "global_step": 488172, "epoch": 5881} {"train_loss": -27.376388549804688, "global_step": 488173, "epoch": 5881} {"train_loss": -27.17465591430664, "global_step": 488174, "epoch": 5881} {"train_loss": -27.272809982299805, "global_step": 488175, "epoch": 5881} {"train_loss": -27.44000244140625, "global_step": 488176, "epoch": 5881} {"train_loss": -27.42267417907715, "global_step": 488177, "epoch": 5881} {"train_loss": -27.14949607849121, "global_step": 488178, "epoch": 5881} {"train_loss": -27.190275192260742, "global_step": 488179, "epoch": 5881} {"train_loss": -27.267044067382812, "global_step": 488180, "epoch": 5881} {"train_loss": -27.444726943969727, "global_step": 488181, "epoch": 5881} {"train_loss": -27.38287925720215, "global_step": 488182, "epoch": 5881} {"train_loss": -27.541812896728516, "global_step": 488183, "epoch": 5881} {"train_loss": -27.417917251586914, "global_step": 488184, "epoch": 5881} {"train_loss": -27.417926788330078, "global_step": 488185, "epoch": 5881} {"train_loss": -27.662830352783203, "global_step": 488186, "epoch": 5881} {"train_loss": -27.3383846282959, "global_step": 488187, "epoch": 5881} {"train_loss": -27.2360782623291, "global_step": 488188, "epoch": 5881} {"train_loss": -27.3787899017334, "global_step": 488189, "epoch": 5881} {"train_loss": -27.511625289916992, "global_step": 488190, "epoch": 5881} {"train_loss": -27.67585563659668, "global_step": 488191, "epoch": 5881} {"train_loss": -27.44140625, "global_step": 488192, "epoch": 5881} {"train_loss": -27.4775390625, "global_step": 488193, "epoch": 5881} {"train_loss": -27.376596450805664, "global_step": 488194, "epoch": 5881} {"train_loss": -27.648914337158203, "global_step": 488195, "epoch": 5881} {"train_loss": -27.035207748413086, "global_step": 488196, "epoch": 5881} {"train_loss": -27.800262451171875, "global_step": 488197, "epoch": 5881} {"train_loss": -27.513036727905273, "global_step": 488198, "epoch": 5881} {"train_loss": -27.709766387939453, "global_step": 488199, "epoch": 5881} {"train_loss": -27.407987594604492, "global_step": 488200, "epoch": 5881} {"train_loss": -27.62904930114746, "global_step": 488201, "epoch": 5881} {"train_loss": -27.560199737548828, "global_step": 488202, "epoch": 5881} {"train_loss": -27.5305233001709, "global_step": 488203, "epoch": 5881} {"train_loss": -27.48601722717285, "global_step": 488204, "epoch": 5881} {"train_loss": -27.226388586572853, "global_step": 488205, "epoch": 5881, "val_loss": 6579071.0} {"train_loss": -27.344953536987305, "global_step": 488206, "epoch": 5882} {"train_loss": -25.86854362487793, "global_step": 488207, "epoch": 5882} {"train_loss": -25.590810775756836, "global_step": 488208, "epoch": 5882} {"train_loss": -25.903705596923828, "global_step": 488209, "epoch": 5882} {"train_loss": -26.53301429748535, "global_step": 488210, "epoch": 5882} {"train_loss": -27.44209098815918, "global_step": 488211, "epoch": 5882} {"train_loss": -26.385656356811523, "global_step": 488212, "epoch": 5882} {"train_loss": -26.945791244506836, "global_step": 488213, "epoch": 5882} {"train_loss": -27.12371826171875, "global_step": 488214, "epoch": 5882} {"train_loss": -27.030725479125977, "global_step": 488215, "epoch": 5882} {"train_loss": -27.309492111206055, "global_step": 488216, "epoch": 5882} {"train_loss": -26.975418090820312, "global_step": 488217, "epoch": 5882} {"train_loss": -27.094192504882812, "global_step": 488218, "epoch": 5882} {"train_loss": -27.117780685424805, "global_step": 488219, "epoch": 5882} {"train_loss": -26.98069190979004, "global_step": 488220, "epoch": 5882} {"train_loss": -26.949726104736328, "global_step": 488221, "epoch": 5882} {"train_loss": -27.139373779296875, "global_step": 488222, "epoch": 5882} {"train_loss": -27.432926177978516, "global_step": 488223, "epoch": 5882} {"train_loss": -27.28692054748535, "global_step": 488224, "epoch": 5882} {"train_loss": -26.95965576171875, "global_step": 488225, "epoch": 5882} {"train_loss": -27.114395141601562, "global_step": 488226, "epoch": 5882} {"train_loss": -26.940160751342773, "global_step": 488227, "epoch": 5882} {"train_loss": -27.113386154174805, "global_step": 488228, "epoch": 5882} {"train_loss": -26.924026489257812, "global_step": 488229, "epoch": 5882} {"train_loss": -27.350727081298828, "global_step": 488230, "epoch": 5882} {"train_loss": -27.307554244995117, "global_step": 488231, "epoch": 5882} {"train_loss": -27.483930587768555, "global_step": 488232, "epoch": 5882} {"train_loss": -27.5845890045166, "global_step": 488233, "epoch": 5882} {"train_loss": -27.546131134033203, "global_step": 488234, "epoch": 5882} {"train_loss": -27.14361000061035, "global_step": 488235, "epoch": 5882} {"train_loss": -27.61946678161621, "global_step": 488236, "epoch": 5882} {"train_loss": -27.287805557250977, "global_step": 488237, "epoch": 5882} {"train_loss": -27.47674560546875, "global_step": 488238, "epoch": 5882} {"train_loss": -27.32477378845215, "global_step": 488239, "epoch": 5882} {"train_loss": -27.289091110229492, "global_step": 488240, "epoch": 5882} {"train_loss": -27.741336822509766, "global_step": 488241, "epoch": 5882} {"train_loss": -27.422595977783203, "global_step": 488242, "epoch": 5882} {"train_loss": -27.3179988861084, "global_step": 488243, "epoch": 5882} {"train_loss": -27.33806800842285, "global_step": 488244, "epoch": 5882} {"train_loss": -27.429609298706055, "global_step": 488245, "epoch": 5882} {"train_loss": -27.306882858276367, "global_step": 488246, "epoch": 5882} {"train_loss": -27.35945701599121, "global_step": 488247, "epoch": 5882} {"train_loss": -27.32086181640625, "global_step": 488248, "epoch": 5882} {"train_loss": -27.485891342163086, "global_step": 488249, "epoch": 5882} {"train_loss": -27.32795524597168, "global_step": 488250, "epoch": 5882} {"train_loss": -26.990522384643555, "global_step": 488251, "epoch": 5882} {"train_loss": -27.039581298828125, "global_step": 488252, "epoch": 5882} {"train_loss": -27.251800537109375, "global_step": 488253, "epoch": 5882} {"train_loss": -27.29974365234375, "global_step": 488254, "epoch": 5882} {"train_loss": -27.466140747070312, "global_step": 488255, "epoch": 5882} {"train_loss": -27.496007919311523, "global_step": 488256, "epoch": 5882} {"train_loss": -27.613805770874023, "global_step": 488257, "epoch": 5882} {"train_loss": -27.43815040588379, "global_step": 488258, "epoch": 5882} {"train_loss": -27.507583618164062, "global_step": 488259, "epoch": 5882} {"train_loss": -27.3372859954834, "global_step": 488260, "epoch": 5882} {"train_loss": -27.20162010192871, "global_step": 488261, "epoch": 5882} {"train_loss": -27.6472225189209, "global_step": 488262, "epoch": 5882} {"train_loss": -27.638586044311523, "global_step": 488263, "epoch": 5882} {"train_loss": -27.298858642578125, "global_step": 488264, "epoch": 5882} {"train_loss": -27.270959854125977, "global_step": 488265, "epoch": 5882} {"train_loss": -27.41176414489746, "global_step": 488266, "epoch": 5882} {"train_loss": -27.861719131469727, "global_step": 488267, "epoch": 5882} {"train_loss": -27.422943115234375, "global_step": 488268, "epoch": 5882} {"train_loss": -27.41071891784668, "global_step": 488269, "epoch": 5882} {"train_loss": -27.304738998413086, "global_step": 488270, "epoch": 5882} {"train_loss": -27.358808517456055, "global_step": 488271, "epoch": 5882} {"train_loss": -27.2122745513916, "global_step": 488272, "epoch": 5882} {"train_loss": -27.541751861572266, "global_step": 488273, "epoch": 5882} {"train_loss": -27.166051864624023, "global_step": 488274, "epoch": 5882} {"train_loss": -27.114042282104492, "global_step": 488275, "epoch": 5882} {"train_loss": -27.415002822875977, "global_step": 488276, "epoch": 5882} {"train_loss": -26.8558292388916, "global_step": 488277, "epoch": 5882} {"train_loss": -27.193164825439453, "global_step": 488278, "epoch": 5882} {"train_loss": -26.860105514526367, "global_step": 488279, "epoch": 5882} {"train_loss": -27.01856803894043, "global_step": 488280, "epoch": 5882} {"train_loss": -27.37306022644043, "global_step": 488281, "epoch": 5882} {"train_loss": -26.8667049407959, "global_step": 488282, "epoch": 5882} {"train_loss": -26.761377334594727, "global_step": 488283, "epoch": 5882} {"train_loss": -27.046707153320312, "global_step": 488284, "epoch": 5882} {"train_loss": -27.462072372436523, "global_step": 488285, "epoch": 5882} {"train_loss": -26.70171546936035, "global_step": 488286, "epoch": 5882} {"train_loss": -27.414627075195312, "global_step": 488287, "epoch": 5882} {"train_loss": -27.203269613794532, "global_step": 488288, "epoch": 5882, "val_loss": 6581137.5} {"train_loss": -25.66358757019043, "global_step": 488289, "epoch": 5883} {"train_loss": -25.399438858032227, "global_step": 488290, "epoch": 5883} {"train_loss": -26.6214599609375, "global_step": 488291, "epoch": 5883} {"train_loss": -25.97403335571289, "global_step": 488292, "epoch": 5883} {"train_loss": -26.89198875427246, "global_step": 488293, "epoch": 5883} {"train_loss": -26.544858932495117, "global_step": 488294, "epoch": 5883} {"train_loss": -26.613370895385742, "global_step": 488295, "epoch": 5883} {"train_loss": -26.369848251342773, "global_step": 488296, "epoch": 5883} {"train_loss": -26.638599395751953, "global_step": 488297, "epoch": 5883} {"train_loss": -26.780902862548828, "global_step": 488298, "epoch": 5883} {"train_loss": -26.736661911010742, "global_step": 488299, "epoch": 5883} {"train_loss": -26.646574020385742, "global_step": 488300, "epoch": 5883} {"train_loss": -26.824934005737305, "global_step": 488301, "epoch": 5883} {"train_loss": -26.70600700378418, "global_step": 488302, "epoch": 5883} {"train_loss": -26.64533042907715, "global_step": 488303, "epoch": 5883} {"train_loss": -27.0025577545166, "global_step": 488304, "epoch": 5883} {"train_loss": -26.826400756835938, "global_step": 488305, "epoch": 5883} {"train_loss": -26.98761558532715, "global_step": 488306, "epoch": 5883} {"train_loss": -27.079999923706055, "global_step": 488307, "epoch": 5883} {"train_loss": -26.739099502563477, "global_step": 488308, "epoch": 5883} {"train_loss": -26.977676391601562, "global_step": 488309, "epoch": 5883} {"train_loss": -27.03413200378418, "global_step": 488310, "epoch": 5883} {"train_loss": -26.813024520874023, "global_step": 488311, "epoch": 5883} {"train_loss": -26.653249740600586, "global_step": 488312, "epoch": 5883} {"train_loss": -27.05527114868164, "global_step": 488313, "epoch": 5883} {"train_loss": -27.296833038330078, "global_step": 488314, "epoch": 5883} {"train_loss": -27.346698760986328, "global_step": 488315, "epoch": 5883} {"train_loss": -27.311100006103516, "global_step": 488316, "epoch": 5883} {"train_loss": -26.950769424438477, "global_step": 488317, "epoch": 5883} {"train_loss": -27.119678497314453, "global_step": 488318, "epoch": 5883} {"train_loss": -27.0821590423584, "global_step": 488319, "epoch": 5883} {"train_loss": -27.214258193969727, "global_step": 488320, "epoch": 5883} {"train_loss": -27.13960075378418, "global_step": 488321, "epoch": 5883} {"train_loss": -27.191974639892578, "global_step": 488322, "epoch": 5883} {"train_loss": -27.24810218811035, "global_step": 488323, "epoch": 5883} {"train_loss": -26.846891403198242, "global_step": 488324, "epoch": 5883} {"train_loss": -27.10568618774414, "global_step": 488325, "epoch": 5883} {"train_loss": -27.256885528564453, "global_step": 488326, "epoch": 5883} {"train_loss": -27.513473510742188, "global_step": 488327, "epoch": 5883} {"train_loss": -27.63912010192871, "global_step": 488328, "epoch": 5883} {"train_loss": -27.580732345581055, "global_step": 488329, "epoch": 5883} {"train_loss": -27.552167892456055, "global_step": 488330, "epoch": 5883} {"train_loss": -27.18792152404785, "global_step": 488331, "epoch": 5883} {"train_loss": -27.414854049682617, "global_step": 488332, "epoch": 5883} {"train_loss": -27.50358009338379, "global_step": 488333, "epoch": 5883} {"train_loss": -27.04669761657715, "global_step": 488334, "epoch": 5883} {"train_loss": -27.177112579345703, "global_step": 488335, "epoch": 5883} {"train_loss": -26.964696884155273, "global_step": 488336, "epoch": 5883} {"train_loss": -27.116743087768555, "global_step": 488337, "epoch": 5883} {"train_loss": -27.479360580444336, "global_step": 488338, "epoch": 5883} {"train_loss": -27.136220932006836, "global_step": 488339, "epoch": 5883} {"train_loss": -26.8647403717041, "global_step": 488340, "epoch": 5883} {"train_loss": -27.26803970336914, "global_step": 488341, "epoch": 5883} {"train_loss": -27.1529541015625, "global_step": 488342, "epoch": 5883} {"train_loss": -26.910215377807617, "global_step": 488343, "epoch": 5883} {"train_loss": -27.314847946166992, "global_step": 488344, "epoch": 5883} {"train_loss": -27.610260009765625, "global_step": 488345, "epoch": 5883} {"train_loss": -27.140836715698242, "global_step": 488346, "epoch": 5883} {"train_loss": -27.355554580688477, "global_step": 488347, "epoch": 5883} {"train_loss": -27.495426177978516, "global_step": 488348, "epoch": 5883} {"train_loss": -27.8482723236084, "global_step": 488349, "epoch": 5883} {"train_loss": -27.38538932800293, "global_step": 488350, "epoch": 5883} {"train_loss": -27.489654541015625, "global_step": 488351, "epoch": 5883} {"train_loss": -27.53713035583496, "global_step": 488352, "epoch": 5883} {"train_loss": -27.618366241455078, "global_step": 488353, "epoch": 5883} {"train_loss": -27.641605377197266, "global_step": 488354, "epoch": 5883} {"train_loss": -27.515274047851562, "global_step": 488355, "epoch": 5883} {"train_loss": -27.204633712768555, "global_step": 488356, "epoch": 5883} {"train_loss": -27.625715255737305, "global_step": 488357, "epoch": 5883} {"train_loss": -27.626712799072266, "global_step": 488358, "epoch": 5883} {"train_loss": -27.594074249267578, "global_step": 488359, "epoch": 5883} {"train_loss": -27.634809494018555, "global_step": 488360, "epoch": 5883} {"train_loss": -27.384845733642578, "global_step": 488361, "epoch": 5883} {"train_loss": -27.609161376953125, "global_step": 488362, "epoch": 5883} {"train_loss": -27.531482696533203, "global_step": 488363, "epoch": 5883} {"train_loss": -27.15899085998535, "global_step": 488364, "epoch": 5883} {"train_loss": -27.18143081665039, "global_step": 488365, "epoch": 5883} {"train_loss": -27.559890747070312, "global_step": 488366, "epoch": 5883} {"train_loss": -27.726057052612305, "global_step": 488367, "epoch": 5883} {"train_loss": -27.627607345581055, "global_step": 488368, "epoch": 5883} {"train_loss": -27.28215980529785, "global_step": 488369, "epoch": 5883} {"train_loss": -27.373138427734375, "global_step": 488370, "epoch": 5883} {"train_loss": -27.139721767011896, "global_step": 488371, "epoch": 5883, "val_loss": 6607031.0} {"train_loss": -26.437946319580078, "global_step": 488372, "epoch": 5884} {"train_loss": -26.645471572875977, "global_step": 488373, "epoch": 5884} {"train_loss": -25.470617294311523, "global_step": 488374, "epoch": 5884} {"train_loss": -26.57411003112793, "global_step": 488375, "epoch": 5884} {"train_loss": -26.60450553894043, "global_step": 488376, "epoch": 5884} {"train_loss": -26.275251388549805, "global_step": 488377, "epoch": 5884} {"train_loss": -26.348508834838867, "global_step": 488378, "epoch": 5884} {"train_loss": -27.049579620361328, "global_step": 488379, "epoch": 5884} {"train_loss": -26.726245880126953, "global_step": 488380, "epoch": 5884} {"train_loss": -26.356876373291016, "global_step": 488381, "epoch": 5884} {"train_loss": -26.829553604125977, "global_step": 488382, "epoch": 5884} {"train_loss": -26.5159912109375, "global_step": 488383, "epoch": 5884} {"train_loss": -26.901498794555664, "global_step": 488384, "epoch": 5884} {"train_loss": -26.459997177124023, "global_step": 488385, "epoch": 5884} {"train_loss": -26.09515380859375, "global_step": 488386, "epoch": 5884} {"train_loss": -26.950061798095703, "global_step": 488387, "epoch": 5884} {"train_loss": -26.693622589111328, "global_step": 488388, "epoch": 5884} {"train_loss": -26.95704460144043, "global_step": 488389, "epoch": 5884} {"train_loss": -26.832693099975586, "global_step": 488390, "epoch": 5884} {"train_loss": -26.295154571533203, "global_step": 488391, "epoch": 5884} {"train_loss": -25.901020050048828, "global_step": 488392, "epoch": 5884} {"train_loss": -27.15921401977539, "global_step": 488393, "epoch": 5884} {"train_loss": -27.082605361938477, "global_step": 488394, "epoch": 5884} {"train_loss": -26.940296173095703, "global_step": 488395, "epoch": 5884} {"train_loss": -26.75786781311035, "global_step": 488396, "epoch": 5884} {"train_loss": -26.83257484436035, "global_step": 488397, "epoch": 5884} {"train_loss": -27.286884307861328, "global_step": 488398, "epoch": 5884} {"train_loss": -27.522491455078125, "global_step": 488399, "epoch": 5884} {"train_loss": -27.42806053161621, "global_step": 488400, "epoch": 5884} {"train_loss": -27.231168746948242, "global_step": 488401, "epoch": 5884} {"train_loss": -27.269989013671875, "global_step": 488402, "epoch": 5884} {"train_loss": -27.272785186767578, "global_step": 488403, "epoch": 5884} {"train_loss": -27.515869140625, "global_step": 488404, "epoch": 5884} {"train_loss": -27.05859375, "global_step": 488405, "epoch": 5884} {"train_loss": -27.550674438476562, "global_step": 488406, "epoch": 5884} {"train_loss": -27.37984275817871, "global_step": 488407, "epoch": 5884} {"train_loss": -27.25009536743164, "global_step": 488408, "epoch": 5884} {"train_loss": -27.46577262878418, "global_step": 488409, "epoch": 5884} {"train_loss": -27.110387802124023, "global_step": 488410, "epoch": 5884} {"train_loss": -27.248010635375977, "global_step": 488411, "epoch": 5884} {"train_loss": -27.73514747619629, "global_step": 488412, "epoch": 5884} {"train_loss": -27.242691040039062, "global_step": 488413, "epoch": 5884} {"train_loss": -27.48150062561035, "global_step": 488414, "epoch": 5884} {"train_loss": -27.587921142578125, "global_step": 488415, "epoch": 5884} {"train_loss": -27.19964599609375, "global_step": 488416, "epoch": 5884} {"train_loss": -27.220029830932617, "global_step": 488417, "epoch": 5884} {"train_loss": -27.226181030273438, "global_step": 488418, "epoch": 5884} {"train_loss": -27.13827896118164, "global_step": 488419, "epoch": 5884} {"train_loss": -27.611663818359375, "global_step": 488420, "epoch": 5884} {"train_loss": -27.43025779724121, "global_step": 488421, "epoch": 5884} {"train_loss": -27.279743194580078, "global_step": 488422, "epoch": 5884} {"train_loss": -27.14552116394043, "global_step": 488423, "epoch": 5884} {"train_loss": -27.648054122924805, "global_step": 488424, "epoch": 5884} {"train_loss": -27.444183349609375, "global_step": 488425, "epoch": 5884} {"train_loss": -27.289724349975586, "global_step": 488426, "epoch": 5884} {"train_loss": -27.139739990234375, "global_step": 488427, "epoch": 5884} {"train_loss": -27.40850257873535, "global_step": 488428, "epoch": 5884} {"train_loss": -27.253143310546875, "global_step": 488429, "epoch": 5884} {"train_loss": -27.23050308227539, "global_step": 488430, "epoch": 5884} {"train_loss": -27.27894401550293, "global_step": 488431, "epoch": 5884} {"train_loss": -27.417621612548828, "global_step": 488432, "epoch": 5884} {"train_loss": -27.383594512939453, "global_step": 488433, "epoch": 5884} {"train_loss": -27.062936782836914, "global_step": 488434, "epoch": 5884} {"train_loss": -26.948944091796875, "global_step": 488435, "epoch": 5884} {"train_loss": -26.86724853515625, "global_step": 488436, "epoch": 5884} {"train_loss": -26.553709030151367, "global_step": 488437, "epoch": 5884} {"train_loss": -27.0612850189209, "global_step": 488438, "epoch": 5884} {"train_loss": -26.874927520751953, "global_step": 488439, "epoch": 5884} {"train_loss": -27.09883689880371, "global_step": 488440, "epoch": 5884} {"train_loss": -26.97442054748535, "global_step": 488441, "epoch": 5884} {"train_loss": -26.957544326782227, "global_step": 488442, "epoch": 5884} {"train_loss": -27.157575607299805, "global_step": 488443, "epoch": 5884} {"train_loss": -27.01682472229004, "global_step": 488444, "epoch": 5884} {"train_loss": -26.531728744506836, "global_step": 488445, "epoch": 5884} {"train_loss": -26.942834854125977, "global_step": 488446, "epoch": 5884} {"train_loss": -25.736997604370117, "global_step": 488447, "epoch": 5884} {"train_loss": -26.98691749572754, "global_step": 488448, "epoch": 5884} {"train_loss": -27.10150146484375, "global_step": 488449, "epoch": 5884} {"train_loss": -27.1356201171875, "global_step": 488450, "epoch": 5884} {"train_loss": -26.661619186401367, "global_step": 488451, "epoch": 5884} {"train_loss": -26.835407257080078, "global_step": 488452, "epoch": 5884} {"train_loss": -26.918928146362305, "global_step": 488453, "epoch": 5884} {"train_loss": -27.01737105128277, "global_step": 488454, "epoch": 5884, "val_loss": 6579051.5} {"train_loss": -24.352161407470703, "global_step": 488455, "epoch": 5885} {"train_loss": -25.388599395751953, "global_step": 488456, "epoch": 5885} {"train_loss": -24.812698364257812, "global_step": 488457, "epoch": 5885} {"train_loss": -25.868879318237305, "global_step": 488458, "epoch": 5885} {"train_loss": -25.267230987548828, "global_step": 488459, "epoch": 5885} {"train_loss": -26.297765731811523, "global_step": 488460, "epoch": 5885} {"train_loss": -25.429357528686523, "global_step": 488461, "epoch": 5885} {"train_loss": -25.53657341003418, "global_step": 488462, "epoch": 5885} {"train_loss": -26.128400802612305, "global_step": 488463, "epoch": 5885} {"train_loss": -25.61099624633789, "global_step": 488464, "epoch": 5885} {"train_loss": -25.97171974182129, "global_step": 488465, "epoch": 5885} {"train_loss": -26.077106475830078, "global_step": 488466, "epoch": 5885} {"train_loss": -26.070032119750977, "global_step": 488467, "epoch": 5885} {"train_loss": -26.05437660217285, "global_step": 488468, "epoch": 5885} {"train_loss": -26.253259658813477, "global_step": 488469, "epoch": 5885} {"train_loss": -26.605981826782227, "global_step": 488470, "epoch": 5885} {"train_loss": -26.632801055908203, "global_step": 488471, "epoch": 5885} {"train_loss": -26.439407348632812, "global_step": 488472, "epoch": 5885} {"train_loss": -26.565587997436523, "global_step": 488473, "epoch": 5885} {"train_loss": -26.504919052124023, "global_step": 488474, "epoch": 5885} {"train_loss": -26.48567771911621, "global_step": 488475, "epoch": 5885} {"train_loss": -26.444244384765625, "global_step": 488476, "epoch": 5885} {"train_loss": -26.541852951049805, "global_step": 488477, "epoch": 5885} {"train_loss": -26.76332664489746, "global_step": 488478, "epoch": 5885} {"train_loss": -26.722930908203125, "global_step": 488479, "epoch": 5885} {"train_loss": -26.5884952545166, "global_step": 488480, "epoch": 5885} {"train_loss": -26.822784423828125, "global_step": 488481, "epoch": 5885} {"train_loss": -26.7794132232666, "global_step": 488482, "epoch": 5885} {"train_loss": -26.735387802124023, "global_step": 488483, "epoch": 5885} {"train_loss": -26.841175079345703, "global_step": 488484, "epoch": 5885} {"train_loss": -27.143497467041016, "global_step": 488485, "epoch": 5885} {"train_loss": -27.22406578063965, "global_step": 488486, "epoch": 5885} {"train_loss": -27.026142120361328, "global_step": 488487, "epoch": 5885} {"train_loss": -27.145877838134766, "global_step": 488488, "epoch": 5885} {"train_loss": -27.051145553588867, "global_step": 488489, "epoch": 5885} {"train_loss": -27.080121994018555, "global_step": 488490, "epoch": 5885} {"train_loss": -27.100244522094727, "global_step": 488491, "epoch": 5885} {"train_loss": -27.1290225982666, "global_step": 488492, "epoch": 5885} {"train_loss": -27.31597900390625, "global_step": 488493, "epoch": 5885} {"train_loss": -27.00519371032715, "global_step": 488494, "epoch": 5885} {"train_loss": -27.313125610351562, "global_step": 488495, "epoch": 5885} {"train_loss": -27.2676944732666, "global_step": 488496, "epoch": 5885} {"train_loss": -26.723236083984375, "global_step": 488497, "epoch": 5885} {"train_loss": -26.93259048461914, "global_step": 488498, "epoch": 5885} {"train_loss": -26.900409698486328, "global_step": 488499, "epoch": 5885} {"train_loss": -27.401594161987305, "global_step": 488500, "epoch": 5885} {"train_loss": -27.196308135986328, "global_step": 488501, "epoch": 5885} {"train_loss": -27.123579025268555, "global_step": 488502, "epoch": 5885} {"train_loss": -26.85868263244629, "global_step": 488503, "epoch": 5885} {"train_loss": -27.196271896362305, "global_step": 488504, "epoch": 5885} {"train_loss": -27.033039093017578, "global_step": 488505, "epoch": 5885} {"train_loss": -27.412107467651367, "global_step": 488506, "epoch": 5885} {"train_loss": -27.408527374267578, "global_step": 488507, "epoch": 5885} {"train_loss": -26.9624080657959, "global_step": 488508, "epoch": 5885} {"train_loss": -27.19257926940918, "global_step": 488509, "epoch": 5885} {"train_loss": -27.62949562072754, "global_step": 488510, "epoch": 5885} {"train_loss": -27.266986846923828, "global_step": 488511, "epoch": 5885} {"train_loss": -27.373380661010742, "global_step": 488512, "epoch": 5885} {"train_loss": -27.429656982421875, "global_step": 488513, "epoch": 5885} {"train_loss": -27.1636905670166, "global_step": 488514, "epoch": 5885} {"train_loss": -27.495838165283203, "global_step": 488515, "epoch": 5885} {"train_loss": -27.428152084350586, "global_step": 488516, "epoch": 5885} {"train_loss": -27.439802169799805, "global_step": 488517, "epoch": 5885} {"train_loss": -27.536252975463867, "global_step": 488518, "epoch": 5885} {"train_loss": -27.601980209350586, "global_step": 488519, "epoch": 5885} {"train_loss": -27.392248153686523, "global_step": 488520, "epoch": 5885} {"train_loss": -27.122150421142578, "global_step": 488521, "epoch": 5885} {"train_loss": -27.584369659423828, "global_step": 488522, "epoch": 5885} {"train_loss": -27.380033493041992, "global_step": 488523, "epoch": 5885} {"train_loss": -27.340253829956055, "global_step": 488524, "epoch": 5885} {"train_loss": -27.913869857788086, "global_step": 488525, "epoch": 5885} {"train_loss": -27.529996871948242, "global_step": 488526, "epoch": 5885} {"train_loss": -27.10249137878418, "global_step": 488527, "epoch": 5885} {"train_loss": -27.44626808166504, "global_step": 488528, "epoch": 5885} {"train_loss": -27.3962459564209, "global_step": 488529, "epoch": 5885} {"train_loss": -27.42782974243164, "global_step": 488530, "epoch": 5885} {"train_loss": -27.31878089904785, "global_step": 488531, "epoch": 5885} {"train_loss": -27.276342391967773, "global_step": 488532, "epoch": 5885} {"train_loss": -27.413410186767578, "global_step": 488533, "epoch": 5885} {"train_loss": -27.648752212524414, "global_step": 488534, "epoch": 5885} {"train_loss": -27.239276885986328, "global_step": 488535, "epoch": 5885} {"train_loss": -27.522491455078125, "global_step": 488536, "epoch": 5885} {"train_loss": -26.86966650170016, "global_step": 488537, "epoch": 5885, "val_loss": 6562435.0} {"train_loss": -26.405349731445312, "global_step": 488538, "epoch": 5886} {"train_loss": -25.31693458557129, "global_step": 488539, "epoch": 5886} {"train_loss": -25.60272216796875, "global_step": 488540, "epoch": 5886} {"train_loss": -26.601882934570312, "global_step": 488541, "epoch": 5886} {"train_loss": -26.497404098510742, "global_step": 488542, "epoch": 5886} {"train_loss": -26.624282836914062, "global_step": 488543, "epoch": 5886} {"train_loss": -26.682111740112305, "global_step": 488544, "epoch": 5886} {"train_loss": -26.533926010131836, "global_step": 488545, "epoch": 5886} {"train_loss": -27.143823623657227, "global_step": 488546, "epoch": 5886} {"train_loss": -25.917760848999023, "global_step": 488547, "epoch": 5886} {"train_loss": -27.080062866210938, "global_step": 488548, "epoch": 5886} {"train_loss": -26.468839645385742, "global_step": 488549, "epoch": 5886} {"train_loss": -26.975208282470703, "global_step": 488550, "epoch": 5886} {"train_loss": -26.516393661499023, "global_step": 488551, "epoch": 5886} {"train_loss": -27.217041015625, "global_step": 488552, "epoch": 5886} {"train_loss": -26.905105590820312, "global_step": 488553, "epoch": 5886} {"train_loss": -26.893518447875977, "global_step": 488554, "epoch": 5886} {"train_loss": -27.321990966796875, "global_step": 488555, "epoch": 5886} {"train_loss": -27.040283203125, "global_step": 488556, "epoch": 5886} {"train_loss": -26.9011173248291, "global_step": 488557, "epoch": 5886} {"train_loss": -27.341062545776367, "global_step": 488558, "epoch": 5886} {"train_loss": -27.64509391784668, "global_step": 488559, "epoch": 5886} {"train_loss": -26.9957332611084, "global_step": 488560, "epoch": 5886} {"train_loss": -27.094770431518555, "global_step": 488561, "epoch": 5886} {"train_loss": -26.6024169921875, "global_step": 488562, "epoch": 5886} {"train_loss": -27.520978927612305, "global_step": 488563, "epoch": 5886} {"train_loss": -27.222259521484375, "global_step": 488564, "epoch": 5886} {"train_loss": -27.205305099487305, "global_step": 488565, "epoch": 5886} {"train_loss": -27.713525772094727, "global_step": 488566, "epoch": 5886} {"train_loss": -27.070392608642578, "global_step": 488567, "epoch": 5886} {"train_loss": -27.425277709960938, "global_step": 488568, "epoch": 5886} {"train_loss": -27.264514923095703, "global_step": 488569, "epoch": 5886} {"train_loss": -27.290876388549805, "global_step": 488570, "epoch": 5886} {"train_loss": -27.466611862182617, "global_step": 488571, "epoch": 5886} {"train_loss": -27.813343048095703, "global_step": 488572, "epoch": 5886} {"train_loss": -27.347675323486328, "global_step": 488573, "epoch": 5886} {"train_loss": -27.09748649597168, "global_step": 488574, "epoch": 5886} {"train_loss": -27.05864906311035, "global_step": 488575, "epoch": 5886} {"train_loss": -27.444019317626953, "global_step": 488576, "epoch": 5886} {"train_loss": -27.311368942260742, "global_step": 488577, "epoch": 5886} {"train_loss": -27.345853805541992, "global_step": 488578, "epoch": 5886} {"train_loss": -27.555822372436523, "global_step": 488579, "epoch": 5886} {"train_loss": -27.500503540039062, "global_step": 488580, "epoch": 5886} {"train_loss": -27.579269409179688, "global_step": 488581, "epoch": 5886} {"train_loss": -27.394559860229492, "global_step": 488582, "epoch": 5886} {"train_loss": -27.7856502532959, "global_step": 488583, "epoch": 5886} {"train_loss": -27.602792739868164, "global_step": 488584, "epoch": 5886} {"train_loss": -27.420429229736328, "global_step": 488585, "epoch": 5886} {"train_loss": -27.441883087158203, "global_step": 488586, "epoch": 5886} {"train_loss": -27.355295181274414, "global_step": 488587, "epoch": 5886} {"train_loss": -27.347524642944336, "global_step": 488588, "epoch": 5886} {"train_loss": -27.29861831665039, "global_step": 488589, "epoch": 5886} {"train_loss": -27.258625030517578, "global_step": 488590, "epoch": 5886} {"train_loss": -27.06036949157715, "global_step": 488591, "epoch": 5886} {"train_loss": -26.8388614654541, "global_step": 488592, "epoch": 5886} {"train_loss": -26.997241973876953, "global_step": 488593, "epoch": 5886} {"train_loss": -26.722614288330078, "global_step": 488594, "epoch": 5886} {"train_loss": -27.933053970336914, "global_step": 488595, "epoch": 5886} {"train_loss": -27.324512481689453, "global_step": 488596, "epoch": 5886} {"train_loss": -27.157901763916016, "global_step": 488597, "epoch": 5886} {"train_loss": -26.87521743774414, "global_step": 488598, "epoch": 5886} {"train_loss": -27.20208168029785, "global_step": 488599, "epoch": 5886} {"train_loss": -27.3396053314209, "global_step": 488600, "epoch": 5886} {"train_loss": -26.884679794311523, "global_step": 488601, "epoch": 5886} {"train_loss": -27.63355827331543, "global_step": 488602, "epoch": 5886} {"train_loss": -27.155256271362305, "global_step": 488603, "epoch": 5886} {"train_loss": -26.756317138671875, "global_step": 488604, "epoch": 5886} {"train_loss": -27.043991088867188, "global_step": 488605, "epoch": 5886} {"train_loss": -27.400257110595703, "global_step": 488606, "epoch": 5886} {"train_loss": -27.2922306060791, "global_step": 488607, "epoch": 5886} {"train_loss": -27.356542587280273, "global_step": 488608, "epoch": 5886} {"train_loss": -27.018695831298828, "global_step": 488609, "epoch": 5886} {"train_loss": -27.335758209228516, "global_step": 488610, "epoch": 5886} {"train_loss": -27.43061637878418, "global_step": 488611, "epoch": 5886} {"train_loss": -27.221099853515625, "global_step": 488612, "epoch": 5886} {"train_loss": -27.448657989501953, "global_step": 488613, "epoch": 5886} {"train_loss": -27.139999389648438, "global_step": 488614, "epoch": 5886} {"train_loss": -27.35931968688965, "global_step": 488615, "epoch": 5886} {"train_loss": -27.243494033813477, "global_step": 488616, "epoch": 5886} {"train_loss": -27.764142990112305, "global_step": 488617, "epoch": 5886} {"train_loss": -27.587020874023438, "global_step": 488618, "epoch": 5886} {"train_loss": -27.30647087097168, "global_step": 488619, "epoch": 5886} {"train_loss": -27.151184587593537, "global_step": 488620, "epoch": 5886, "val_loss": 6662518.0} {"train_loss": -26.738794326782227, "global_step": 488621, "epoch": 5887} {"train_loss": -26.259693145751953, "global_step": 488622, "epoch": 5887} {"train_loss": -26.738311767578125, "global_step": 488623, "epoch": 5887} {"train_loss": -26.71698570251465, "global_step": 488624, "epoch": 5887} {"train_loss": -26.45924949645996, "global_step": 488625, "epoch": 5887} {"train_loss": -26.164566040039062, "global_step": 488626, "epoch": 5887} {"train_loss": -26.1771183013916, "global_step": 488627, "epoch": 5887} {"train_loss": -26.28194236755371, "global_step": 488628, "epoch": 5887} {"train_loss": -26.624149322509766, "global_step": 488629, "epoch": 5887} {"train_loss": -26.783248901367188, "global_step": 488630, "epoch": 5887} {"train_loss": -26.461095809936523, "global_step": 488631, "epoch": 5887} {"train_loss": -26.567609786987305, "global_step": 488632, "epoch": 5887} {"train_loss": -26.581953048706055, "global_step": 488633, "epoch": 5887} {"train_loss": -26.9066219329834, "global_step": 488634, "epoch": 5887} {"train_loss": -26.518295288085938, "global_step": 488635, "epoch": 5887} {"train_loss": -26.86858558654785, "global_step": 488636, "epoch": 5887} {"train_loss": -26.450927734375, "global_step": 488637, "epoch": 5887} {"train_loss": -27.283979415893555, "global_step": 488638, "epoch": 5887} {"train_loss": -26.677326202392578, "global_step": 488639, "epoch": 5887} {"train_loss": -27.023853302001953, "global_step": 488640, "epoch": 5887} {"train_loss": -27.21661376953125, "global_step": 488641, "epoch": 5887} {"train_loss": -27.436010360717773, "global_step": 488642, "epoch": 5887} {"train_loss": -27.344257354736328, "global_step": 488643, "epoch": 5887} {"train_loss": -26.659503936767578, "global_step": 488644, "epoch": 5887} {"train_loss": -27.2275390625, "global_step": 488645, "epoch": 5887} {"train_loss": -27.063932418823242, "global_step": 488646, "epoch": 5887} {"train_loss": -26.975522994995117, "global_step": 488647, "epoch": 5887} {"train_loss": -26.753082275390625, "global_step": 488648, "epoch": 5887} {"train_loss": -27.1319522857666, "global_step": 488649, "epoch": 5887} {"train_loss": -26.850568771362305, "global_step": 488650, "epoch": 5887} {"train_loss": -27.293615341186523, "global_step": 488651, "epoch": 5887} {"train_loss": -27.185644149780273, "global_step": 488652, "epoch": 5887} {"train_loss": -27.130298614501953, "global_step": 488653, "epoch": 5887} {"train_loss": -26.889326095581055, "global_step": 488654, "epoch": 5887} {"train_loss": -27.21247673034668, "global_step": 488655, "epoch": 5887} {"train_loss": -27.387409210205078, "global_step": 488656, "epoch": 5887} {"train_loss": -27.091995239257812, "global_step": 488657, "epoch": 5887} {"train_loss": -26.86911392211914, "global_step": 488658, "epoch": 5887} {"train_loss": -27.1676025390625, "global_step": 488659, "epoch": 5887} {"train_loss": -26.947067260742188, "global_step": 488660, "epoch": 5887} {"train_loss": -27.384756088256836, "global_step": 488661, "epoch": 5887} {"train_loss": -26.806562423706055, "global_step": 488662, "epoch": 5887} {"train_loss": -27.633594512939453, "global_step": 488663, "epoch": 5887} {"train_loss": -27.3659610748291, "global_step": 488664, "epoch": 5887} {"train_loss": -27.389801025390625, "global_step": 488665, "epoch": 5887} {"train_loss": -27.22283935546875, "global_step": 488666, "epoch": 5887} {"train_loss": -27.505023956298828, "global_step": 488667, "epoch": 5887} {"train_loss": -27.6289005279541, "global_step": 488668, "epoch": 5887} {"train_loss": -27.1241397857666, "global_step": 488669, "epoch": 5887} {"train_loss": -27.314931869506836, "global_step": 488670, "epoch": 5887} {"train_loss": -27.3240909576416, "global_step": 488671, "epoch": 5887} {"train_loss": -27.344501495361328, "global_step": 488672, "epoch": 5887} {"train_loss": -27.727100372314453, "global_step": 488673, "epoch": 5887} {"train_loss": -27.502695083618164, "global_step": 488674, "epoch": 5887} {"train_loss": -27.625289916992188, "global_step": 488675, "epoch": 5887} {"train_loss": -27.490320205688477, "global_step": 488676, "epoch": 5887} {"train_loss": -27.470746994018555, "global_step": 488677, "epoch": 5887} {"train_loss": -27.833662033081055, "global_step": 488678, "epoch": 5887} {"train_loss": -27.516605377197266, "global_step": 488679, "epoch": 5887} {"train_loss": -27.661731719970703, "global_step": 488680, "epoch": 5887} {"train_loss": -27.45978355407715, "global_step": 488681, "epoch": 5887} {"train_loss": -27.23663902282715, "global_step": 488682, "epoch": 5887} {"train_loss": -27.72833251953125, "global_step": 488683, "epoch": 5887} {"train_loss": -27.799896240234375, "global_step": 488684, "epoch": 5887} {"train_loss": -27.397192001342773, "global_step": 488685, "epoch": 5887} {"train_loss": -27.7981014251709, "global_step": 488686, "epoch": 5887} {"train_loss": -27.629560470581055, "global_step": 488687, "epoch": 5887} {"train_loss": -27.75209617614746, "global_step": 488688, "epoch": 5887} {"train_loss": -27.632307052612305, "global_step": 488689, "epoch": 5887} {"train_loss": -27.43137550354004, "global_step": 488690, "epoch": 5887} {"train_loss": -27.764591217041016, "global_step": 488691, "epoch": 5887} {"train_loss": -27.550382614135742, "global_step": 488692, "epoch": 5887} {"train_loss": -27.68128776550293, "global_step": 488693, "epoch": 5887} {"train_loss": -27.865713119506836, "global_step": 488694, "epoch": 5887} {"train_loss": -27.54366111755371, "global_step": 488695, "epoch": 5887} {"train_loss": -27.451614379882812, "global_step": 488696, "epoch": 5887} {"train_loss": -27.5026798248291, "global_step": 488697, "epoch": 5887} {"train_loss": -27.4407901763916, "global_step": 488698, "epoch": 5887} {"train_loss": -27.49470329284668, "global_step": 488699, "epoch": 5887} {"train_loss": -27.50571632385254, "global_step": 488700, "epoch": 5887} {"train_loss": -27.478769302368164, "global_step": 488701, "epoch": 5887} {"train_loss": -27.669584274291992, "global_step": 488702, "epoch": 5887} {"train_loss": -27.196620412619716, "global_step": 488703, "epoch": 5887, "val_loss": 6690851.0} {"train_loss": -23.12391471862793, "global_step": 488704, "epoch": 5888} {"train_loss": -18.574323654174805, "global_step": 488705, "epoch": 5888} {"train_loss": -21.1473445892334, "global_step": 488706, "epoch": 5888} {"train_loss": -25.255643844604492, "global_step": 488707, "epoch": 5888} {"train_loss": -23.5960750579834, "global_step": 488708, "epoch": 5888} {"train_loss": -24.611366271972656, "global_step": 488709, "epoch": 5888} {"train_loss": -25.17241859436035, "global_step": 488710, "epoch": 5888} {"train_loss": -24.93142318725586, "global_step": 488711, "epoch": 5888} {"train_loss": -25.93039321899414, "global_step": 488712, "epoch": 5888} {"train_loss": -25.49143409729004, "global_step": 488713, "epoch": 5888} {"train_loss": -25.58043670654297, "global_step": 488714, "epoch": 5888} {"train_loss": -25.449872970581055, "global_step": 488715, "epoch": 5888} {"train_loss": -25.8769588470459, "global_step": 488716, "epoch": 5888} {"train_loss": -25.73829460144043, "global_step": 488717, "epoch": 5888} {"train_loss": -25.758859634399414, "global_step": 488718, "epoch": 5888} {"train_loss": -25.940759658813477, "global_step": 488719, "epoch": 5888} {"train_loss": -26.090850830078125, "global_step": 488720, "epoch": 5888} {"train_loss": -26.224822998046875, "global_step": 488721, "epoch": 5888} {"train_loss": -26.243412017822266, "global_step": 488722, "epoch": 5888} {"train_loss": -26.23748779296875, "global_step": 488723, "epoch": 5888} {"train_loss": -26.218738555908203, "global_step": 488724, "epoch": 5888} {"train_loss": -26.23145866394043, "global_step": 488725, "epoch": 5888} {"train_loss": -26.3120174407959, "global_step": 488726, "epoch": 5888} {"train_loss": -26.1093807220459, "global_step": 488727, "epoch": 5888} {"train_loss": -26.180072784423828, "global_step": 488728, "epoch": 5888} {"train_loss": -26.678543090820312, "global_step": 488729, "epoch": 5888} {"train_loss": -26.183887481689453, "global_step": 488730, "epoch": 5888} {"train_loss": -26.549543380737305, "global_step": 488731, "epoch": 5888} {"train_loss": -26.60310935974121, "global_step": 488732, "epoch": 5888} {"train_loss": -26.434011459350586, "global_step": 488733, "epoch": 5888} {"train_loss": -26.530725479125977, "global_step": 488734, "epoch": 5888} {"train_loss": -26.771137237548828, "global_step": 488735, "epoch": 5888} {"train_loss": -26.33453369140625, "global_step": 488736, "epoch": 5888} {"train_loss": -26.66499137878418, "global_step": 488737, "epoch": 5888} {"train_loss": -26.334070205688477, "global_step": 488738, "epoch": 5888} {"train_loss": -26.423297882080078, "global_step": 488739, "epoch": 5888} {"train_loss": -26.829187393188477, "global_step": 488740, "epoch": 5888} {"train_loss": -27.054931640625, "global_step": 488741, "epoch": 5888} {"train_loss": -26.524478912353516, "global_step": 488742, "epoch": 5888} {"train_loss": -26.79001235961914, "global_step": 488743, "epoch": 5888} {"train_loss": -26.881332397460938, "global_step": 488744, "epoch": 5888} {"train_loss": -26.87593650817871, "global_step": 488745, "epoch": 5888} {"train_loss": -27.228775024414062, "global_step": 488746, "epoch": 5888} {"train_loss": -26.917327880859375, "global_step": 488747, "epoch": 5888} {"train_loss": -27.238889694213867, "global_step": 488748, "epoch": 5888} {"train_loss": -26.654998779296875, "global_step": 488749, "epoch": 5888} {"train_loss": -26.587722778320312, "global_step": 488750, "epoch": 5888} {"train_loss": -26.660507202148438, "global_step": 488751, "epoch": 5888} {"train_loss": -27.26222038269043, "global_step": 488752, "epoch": 5888} {"train_loss": -26.96294593811035, "global_step": 488753, "epoch": 5888} {"train_loss": -26.570392608642578, "global_step": 488754, "epoch": 5888} {"train_loss": -27.20157814025879, "global_step": 488755, "epoch": 5888} {"train_loss": -26.829038619995117, "global_step": 488756, "epoch": 5888} {"train_loss": -27.088027954101562, "global_step": 488757, "epoch": 5888} {"train_loss": -26.817138671875, "global_step": 488758, "epoch": 5888} {"train_loss": -26.82069969177246, "global_step": 488759, "epoch": 5888} {"train_loss": -27.51288414001465, "global_step": 488760, "epoch": 5888} {"train_loss": -27.36334228515625, "global_step": 488761, "epoch": 5888} {"train_loss": -27.31134033203125, "global_step": 488762, "epoch": 5888} {"train_loss": -27.017255783081055, "global_step": 488763, "epoch": 5888} {"train_loss": -27.052154541015625, "global_step": 488764, "epoch": 5888} {"train_loss": -27.041166305541992, "global_step": 488765, "epoch": 5888} {"train_loss": -27.1453857421875, "global_step": 488766, "epoch": 5888} {"train_loss": -27.32769775390625, "global_step": 488767, "epoch": 5888} {"train_loss": -26.79097557067871, "global_step": 488768, "epoch": 5888} {"train_loss": -27.615468978881836, "global_step": 488769, "epoch": 5888} {"train_loss": -27.2627010345459, "global_step": 488770, "epoch": 5888} {"train_loss": -27.48354148864746, "global_step": 488771, "epoch": 5888} {"train_loss": -27.240665435791016, "global_step": 488772, "epoch": 5888} {"train_loss": -26.99149513244629, "global_step": 488773, "epoch": 5888} {"train_loss": -27.677778244018555, "global_step": 488774, "epoch": 5888} {"train_loss": -27.443347930908203, "global_step": 488775, "epoch": 5888} {"train_loss": -27.753387451171875, "global_step": 488776, "epoch": 5888} {"train_loss": -28.09828758239746, "global_step": 488777, "epoch": 5888} {"train_loss": -27.256275177001953, "global_step": 488778, "epoch": 5888} {"train_loss": -27.548892974853516, "global_step": 488779, "epoch": 5888} {"train_loss": -27.428009033203125, "global_step": 488780, "epoch": 5888} {"train_loss": -27.205503463745117, "global_step": 488781, "epoch": 5888} {"train_loss": -27.478836059570312, "global_step": 488782, "epoch": 5888} {"train_loss": -26.9948787689209, "global_step": 488783, "epoch": 5888} {"train_loss": -27.22418785095215, "global_step": 488784, "epoch": 5888} {"train_loss": -27.32765769958496, "global_step": 488785, "epoch": 5888} {"train_loss": -26.436808413769825, "global_step": 488786, "epoch": 5888, "val_loss": 6715116.5} {"train_loss": -26.735919952392578, "global_step": 488787, "epoch": 5889} {"train_loss": -26.44764518737793, "global_step": 488788, "epoch": 5889} {"train_loss": -27.097537994384766, "global_step": 488789, "epoch": 5889} {"train_loss": -27.083669662475586, "global_step": 488790, "epoch": 5889} {"train_loss": -26.79901695251465, "global_step": 488791, "epoch": 5889} {"train_loss": -27.190412521362305, "global_step": 488792, "epoch": 5889} {"train_loss": -26.8533992767334, "global_step": 488793, "epoch": 5889} {"train_loss": -26.712955474853516, "global_step": 488794, "epoch": 5889} {"train_loss": -27.67701530456543, "global_step": 488795, "epoch": 5889} {"train_loss": -26.895795822143555, "global_step": 488796, "epoch": 5889} {"train_loss": -27.3040828704834, "global_step": 488797, "epoch": 5889} {"train_loss": -26.90943717956543, "global_step": 488798, "epoch": 5889} {"train_loss": -27.202383041381836, "global_step": 488799, "epoch": 5889} {"train_loss": -27.246322631835938, "global_step": 488800, "epoch": 5889} {"train_loss": -27.30134391784668, "global_step": 488801, "epoch": 5889} {"train_loss": -26.580167770385742, "global_step": 488802, "epoch": 5889} {"train_loss": -27.437299728393555, "global_step": 488803, "epoch": 5889} {"train_loss": -27.063817977905273, "global_step": 488804, "epoch": 5889} {"train_loss": -27.23025894165039, "global_step": 488805, "epoch": 5889} {"train_loss": -27.25262451171875, "global_step": 488806, "epoch": 5889} {"train_loss": -27.259057998657227, "global_step": 488807, "epoch": 5889} {"train_loss": -27.299177169799805, "global_step": 488808, "epoch": 5889} {"train_loss": -27.38482666015625, "global_step": 488809, "epoch": 5889} {"train_loss": -27.25043296813965, "global_step": 488810, "epoch": 5889} {"train_loss": -27.183202743530273, "global_step": 488811, "epoch": 5889} {"train_loss": -27.098724365234375, "global_step": 488812, "epoch": 5889} {"train_loss": -27.584333419799805, "global_step": 488813, "epoch": 5889} {"train_loss": -27.280414581298828, "global_step": 488814, "epoch": 5889} {"train_loss": -27.22256851196289, "global_step": 488815, "epoch": 5889} {"train_loss": -27.300241470336914, "global_step": 488816, "epoch": 5889} {"train_loss": -27.024824142456055, "global_step": 488817, "epoch": 5889} {"train_loss": -27.539926528930664, "global_step": 488818, "epoch": 5889} {"train_loss": -27.5870418548584, "global_step": 488819, "epoch": 5889} {"train_loss": -27.342487335205078, "global_step": 488820, "epoch": 5889} {"train_loss": -27.633573532104492, "global_step": 488821, "epoch": 5889} {"train_loss": -27.641834259033203, "global_step": 488822, "epoch": 5889} {"train_loss": -27.5682373046875, "global_step": 488823, "epoch": 5889} {"train_loss": -27.21429443359375, "global_step": 488824, "epoch": 5889} {"train_loss": -27.4906005859375, "global_step": 488825, "epoch": 5889} {"train_loss": -27.371246337890625, "global_step": 488826, "epoch": 5889} {"train_loss": -27.149084091186523, "global_step": 488827, "epoch": 5889} {"train_loss": -27.198713302612305, "global_step": 488828, "epoch": 5889} {"train_loss": -27.61203956604004, "global_step": 488829, "epoch": 5889} {"train_loss": -27.208173751831055, "global_step": 488830, "epoch": 5889} {"train_loss": -27.381881713867188, "global_step": 488831, "epoch": 5889} {"train_loss": -27.54079246520996, "global_step": 488832, "epoch": 5889} {"train_loss": -27.12531089782715, "global_step": 488833, "epoch": 5889} {"train_loss": -27.434186935424805, "global_step": 488834, "epoch": 5889} {"train_loss": -27.192951202392578, "global_step": 488835, "epoch": 5889} {"train_loss": -26.992721557617188, "global_step": 488836, "epoch": 5889} {"train_loss": -27.29953384399414, "global_step": 488837, "epoch": 5889} {"train_loss": -27.402692794799805, "global_step": 488838, "epoch": 5889} {"train_loss": -27.134113311767578, "global_step": 488839, "epoch": 5889} {"train_loss": -27.4504337310791, "global_step": 488840, "epoch": 5889} {"train_loss": -27.3726749420166, "global_step": 488841, "epoch": 5889} {"train_loss": -27.38187026977539, "global_step": 488842, "epoch": 5889} {"train_loss": -27.03310203552246, "global_step": 488843, "epoch": 5889} {"train_loss": -27.500614166259766, "global_step": 488844, "epoch": 5889} {"train_loss": -27.584836959838867, "global_step": 488845, "epoch": 5889} {"train_loss": -27.43636131286621, "global_step": 488846, "epoch": 5889} {"train_loss": -27.31926918029785, "global_step": 488847, "epoch": 5889} {"train_loss": -27.394392013549805, "global_step": 488848, "epoch": 5889} {"train_loss": -27.936811447143555, "global_step": 488849, "epoch": 5889} {"train_loss": -27.33319091796875, "global_step": 488850, "epoch": 5889} {"train_loss": -27.60348892211914, "global_step": 488851, "epoch": 5889} {"train_loss": -27.3402156829834, "global_step": 488852, "epoch": 5889} {"train_loss": -27.305089950561523, "global_step": 488853, "epoch": 5889} {"train_loss": -27.14914894104004, "global_step": 488854, "epoch": 5889} {"train_loss": -27.57149314880371, "global_step": 488855, "epoch": 5889} {"train_loss": -27.494897842407227, "global_step": 488856, "epoch": 5889} {"train_loss": -27.173303604125977, "global_step": 488857, "epoch": 5889} {"train_loss": -27.33331298828125, "global_step": 488858, "epoch": 5889} {"train_loss": -27.448505401611328, "global_step": 488859, "epoch": 5889} {"train_loss": -27.4097900390625, "global_step": 488860, "epoch": 5889} {"train_loss": -27.847326278686523, "global_step": 488861, "epoch": 5889} {"train_loss": -27.093341827392578, "global_step": 488862, "epoch": 5889} {"train_loss": -27.53492546081543, "global_step": 488863, "epoch": 5889} {"train_loss": -27.143049240112305, "global_step": 488864, "epoch": 5889} {"train_loss": -27.524734497070312, "global_step": 488865, "epoch": 5889} {"train_loss": -27.28346061706543, "global_step": 488866, "epoch": 5889} {"train_loss": -27.775653839111328, "global_step": 488867, "epoch": 5889} {"train_loss": -27.582870483398438, "global_step": 488868, "epoch": 5889} {"train_loss": -27.289439442646074, "global_step": 488869, "epoch": 5889, "val_loss": 6611631.0} {"train_loss": -25.599639892578125, "global_step": 488870, "epoch": 5890} {"train_loss": -25.62131118774414, "global_step": 488871, "epoch": 5890} {"train_loss": -26.74236488342285, "global_step": 488872, "epoch": 5890} {"train_loss": -26.252399444580078, "global_step": 488873, "epoch": 5890} {"train_loss": -25.918365478515625, "global_step": 488874, "epoch": 5890} {"train_loss": -26.788198471069336, "global_step": 488875, "epoch": 5890} {"train_loss": -26.452810287475586, "global_step": 488876, "epoch": 5890} {"train_loss": -26.403980255126953, "global_step": 488877, "epoch": 5890} {"train_loss": -26.744352340698242, "global_step": 488878, "epoch": 5890} {"train_loss": -27.040395736694336, "global_step": 488879, "epoch": 5890} {"train_loss": -26.892419815063477, "global_step": 488880, "epoch": 5890} {"train_loss": -26.984607696533203, "global_step": 488881, "epoch": 5890} {"train_loss": -26.519826889038086, "global_step": 488882, "epoch": 5890} {"train_loss": -26.892541885375977, "global_step": 488883, "epoch": 5890} {"train_loss": -26.619037628173828, "global_step": 488884, "epoch": 5890} {"train_loss": -27.02577018737793, "global_step": 488885, "epoch": 5890} {"train_loss": -26.63848304748535, "global_step": 488886, "epoch": 5890} {"train_loss": -26.879138946533203, "global_step": 488887, "epoch": 5890} {"train_loss": -26.655075073242188, "global_step": 488888, "epoch": 5890} {"train_loss": -27.01922607421875, "global_step": 488889, "epoch": 5890} {"train_loss": -26.988452911376953, "global_step": 488890, "epoch": 5890} {"train_loss": -27.57806396484375, "global_step": 488891, "epoch": 5890} {"train_loss": -26.32526969909668, "global_step": 488892, "epoch": 5890} {"train_loss": -26.889169692993164, "global_step": 488893, "epoch": 5890} {"train_loss": -26.770599365234375, "global_step": 488894, "epoch": 5890} {"train_loss": -26.975324630737305, "global_step": 488895, "epoch": 5890} {"train_loss": -26.731494903564453, "global_step": 488896, "epoch": 5890} {"train_loss": -26.978683471679688, "global_step": 488897, "epoch": 5890} {"train_loss": -27.062414169311523, "global_step": 488898, "epoch": 5890} {"train_loss": -26.627363204956055, "global_step": 488899, "epoch": 5890} {"train_loss": -26.840198516845703, "global_step": 488900, "epoch": 5890} {"train_loss": -26.721445083618164, "global_step": 488901, "epoch": 5890} {"train_loss": -26.964984893798828, "global_step": 488902, "epoch": 5890} {"train_loss": -26.789342880249023, "global_step": 488903, "epoch": 5890} {"train_loss": -27.115177154541016, "global_step": 488904, "epoch": 5890} {"train_loss": -26.80926513671875, "global_step": 488905, "epoch": 5890} {"train_loss": -27.020837783813477, "global_step": 488906, "epoch": 5890} {"train_loss": -27.022064208984375, "global_step": 488907, "epoch": 5890} {"train_loss": -27.0258731842041, "global_step": 488908, "epoch": 5890} {"train_loss": -27.027923583984375, "global_step": 488909, "epoch": 5890} {"train_loss": -27.301477432250977, "global_step": 488910, "epoch": 5890} {"train_loss": -26.93417739868164, "global_step": 488911, "epoch": 5890} {"train_loss": -27.11435317993164, "global_step": 488912, "epoch": 5890} {"train_loss": -27.16547966003418, "global_step": 488913, "epoch": 5890} {"train_loss": -27.004507064819336, "global_step": 488914, "epoch": 5890} {"train_loss": -27.423480987548828, "global_step": 488915, "epoch": 5890} {"train_loss": -27.195886611938477, "global_step": 488916, "epoch": 5890} {"train_loss": -27.3452205657959, "global_step": 488917, "epoch": 5890} {"train_loss": -27.52288818359375, "global_step": 488918, "epoch": 5890} {"train_loss": -27.580078125, "global_step": 488919, "epoch": 5890} {"train_loss": -27.09608268737793, "global_step": 488920, "epoch": 5890} {"train_loss": -27.45899772644043, "global_step": 488921, "epoch": 5890} {"train_loss": -27.262866973876953, "global_step": 488922, "epoch": 5890} {"train_loss": -27.261611938476562, "global_step": 488923, "epoch": 5890} {"train_loss": -27.76862907409668, "global_step": 488924, "epoch": 5890} {"train_loss": -27.684309005737305, "global_step": 488925, "epoch": 5890} {"train_loss": -27.59498405456543, "global_step": 488926, "epoch": 5890} {"train_loss": -27.6687068939209, "global_step": 488927, "epoch": 5890} {"train_loss": -27.607934951782227, "global_step": 488928, "epoch": 5890} {"train_loss": -27.549158096313477, "global_step": 488929, "epoch": 5890} {"train_loss": -27.484167098999023, "global_step": 488930, "epoch": 5890} {"train_loss": -27.490564346313477, "global_step": 488931, "epoch": 5890} {"train_loss": -27.529943466186523, "global_step": 488932, "epoch": 5890} {"train_loss": -27.18855094909668, "global_step": 488933, "epoch": 5890} {"train_loss": -27.237899780273438, "global_step": 488934, "epoch": 5890} {"train_loss": -26.88570213317871, "global_step": 488935, "epoch": 5890} {"train_loss": -26.7021541595459, "global_step": 488936, "epoch": 5890} {"train_loss": -26.1914005279541, "global_step": 488937, "epoch": 5890} {"train_loss": -26.443052291870117, "global_step": 488938, "epoch": 5890} {"train_loss": -27.046100616455078, "global_step": 488939, "epoch": 5890} {"train_loss": -26.95148277282715, "global_step": 488940, "epoch": 5890} {"train_loss": -27.441593170166016, "global_step": 488941, "epoch": 5890} {"train_loss": -26.96506118774414, "global_step": 488942, "epoch": 5890} {"train_loss": -27.328195571899414, "global_step": 488943, "epoch": 5890} {"train_loss": -27.392805099487305, "global_step": 488944, "epoch": 5890} {"train_loss": -27.3924617767334, "global_step": 488945, "epoch": 5890} {"train_loss": -26.886676788330078, "global_step": 488946, "epoch": 5890} {"train_loss": -27.125762939453125, "global_step": 488947, "epoch": 5890} {"train_loss": -26.764251708984375, "global_step": 488948, "epoch": 5890} {"train_loss": -27.065631866455078, "global_step": 488949, "epoch": 5890} {"train_loss": -27.610029220581055, "global_step": 488950, "epoch": 5890} {"train_loss": -27.288549423217773, "global_step": 488951, "epoch": 5890} {"train_loss": -27.011631034942994, "global_step": 488952, "epoch": 5890, "val_loss": 6747987.0} {"train_loss": -27.20438003540039, "global_step": 488953, "epoch": 5891} {"train_loss": -26.93691062927246, "global_step": 488954, "epoch": 5891} {"train_loss": -27.260175704956055, "global_step": 488955, "epoch": 5891} {"train_loss": -26.75080680847168, "global_step": 488956, "epoch": 5891} {"train_loss": -26.98609733581543, "global_step": 488957, "epoch": 5891} {"train_loss": -26.997650146484375, "global_step": 488958, "epoch": 5891} {"train_loss": -27.158063888549805, "global_step": 488959, "epoch": 5891} {"train_loss": -26.867542266845703, "global_step": 488960, "epoch": 5891} {"train_loss": -26.79188346862793, "global_step": 488961, "epoch": 5891} {"train_loss": -26.907835006713867, "global_step": 488962, "epoch": 5891} {"train_loss": -26.874486923217773, "global_step": 488963, "epoch": 5891} {"train_loss": -26.99078941345215, "global_step": 488964, "epoch": 5891} {"train_loss": -27.62985610961914, "global_step": 488965, "epoch": 5891} {"train_loss": -26.76900291442871, "global_step": 488966, "epoch": 5891} {"train_loss": -27.18930435180664, "global_step": 488967, "epoch": 5891} {"train_loss": -27.233673095703125, "global_step": 488968, "epoch": 5891} {"train_loss": -27.52178955078125, "global_step": 488969, "epoch": 5891} {"train_loss": -27.17236328125, "global_step": 488970, "epoch": 5891} {"train_loss": -27.295866012573242, "global_step": 488971, "epoch": 5891} {"train_loss": -26.968921661376953, "global_step": 488972, "epoch": 5891} {"train_loss": -27.12703514099121, "global_step": 488973, "epoch": 5891} {"train_loss": -27.052778244018555, "global_step": 488974, "epoch": 5891} {"train_loss": -27.375995635986328, "global_step": 488975, "epoch": 5891} {"train_loss": -27.429407119750977, "global_step": 488976, "epoch": 5891} {"train_loss": -27.396564483642578, "global_step": 488977, "epoch": 5891} {"train_loss": -27.363250732421875, "global_step": 488978, "epoch": 5891} {"train_loss": -27.13726234436035, "global_step": 488979, "epoch": 5891} {"train_loss": -27.503387451171875, "global_step": 488980, "epoch": 5891} {"train_loss": -27.2228946685791, "global_step": 488981, "epoch": 5891} {"train_loss": -27.4760799407959, "global_step": 488982, "epoch": 5891} {"train_loss": -27.46811294555664, "global_step": 488983, "epoch": 5891} {"train_loss": -27.456472396850586, "global_step": 488984, "epoch": 5891} {"train_loss": -27.185571670532227, "global_step": 488985, "epoch": 5891} {"train_loss": -27.186325073242188, "global_step": 488986, "epoch": 5891} {"train_loss": -26.719074249267578, "global_step": 488987, "epoch": 5891} {"train_loss": -26.85199546813965, "global_step": 488988, "epoch": 5891} {"train_loss": -26.636831283569336, "global_step": 488989, "epoch": 5891} {"train_loss": -27.375518798828125, "global_step": 488990, "epoch": 5891} {"train_loss": -27.6451473236084, "global_step": 488991, "epoch": 5891} {"train_loss": -27.244104385375977, "global_step": 488992, "epoch": 5891} {"train_loss": -27.34271240234375, "global_step": 488993, "epoch": 5891} {"train_loss": -27.826496124267578, "global_step": 488994, "epoch": 5891} {"train_loss": -27.375961303710938, "global_step": 488995, "epoch": 5891} {"train_loss": -27.351425170898438, "global_step": 488996, "epoch": 5891} {"train_loss": -27.50356101989746, "global_step": 488997, "epoch": 5891} {"train_loss": -27.37847900390625, "global_step": 488998, "epoch": 5891} {"train_loss": -27.445356369018555, "global_step": 488999, "epoch": 5891} {"train_loss": -27.5200138092041, "global_step": 489000, "epoch": 5891} {"train_loss": -27.59714126586914, "global_step": 489001, "epoch": 5891} {"train_loss": -27.229413986206055, "global_step": 489002, "epoch": 5891} {"train_loss": -27.527795791625977, "global_step": 489003, "epoch": 5891} {"train_loss": -26.965011596679688, "global_step": 489004, "epoch": 5891} {"train_loss": -27.488910675048828, "global_step": 489005, "epoch": 5891} {"train_loss": -27.117704391479492, "global_step": 489006, "epoch": 5891} {"train_loss": -26.99371910095215, "global_step": 489007, "epoch": 5891} {"train_loss": -27.489459991455078, "global_step": 489008, "epoch": 5891} {"train_loss": -27.173376083374023, "global_step": 489009, "epoch": 5891} {"train_loss": -27.29058837890625, "global_step": 489010, "epoch": 5891} {"train_loss": -27.328405380249023, "global_step": 489011, "epoch": 5891} {"train_loss": -27.51761817932129, "global_step": 489012, "epoch": 5891} {"train_loss": -27.542280197143555, "global_step": 489013, "epoch": 5891} {"train_loss": -27.696935653686523, "global_step": 489014, "epoch": 5891} {"train_loss": -27.07769203186035, "global_step": 489015, "epoch": 5891} {"train_loss": -27.023244857788086, "global_step": 489016, "epoch": 5891} {"train_loss": -27.382368087768555, "global_step": 489017, "epoch": 5891} {"train_loss": -27.171384811401367, "global_step": 489018, "epoch": 5891} {"train_loss": -27.09583854675293, "global_step": 489019, "epoch": 5891} {"train_loss": -27.561594009399414, "global_step": 489020, "epoch": 5891} {"train_loss": -27.135427474975586, "global_step": 489021, "epoch": 5891} {"train_loss": -27.31683921813965, "global_step": 489022, "epoch": 5891} {"train_loss": -27.2987003326416, "global_step": 489023, "epoch": 5891} {"train_loss": -27.292572021484375, "global_step": 489024, "epoch": 5891} {"train_loss": -27.022581100463867, "global_step": 489025, "epoch": 5891} {"train_loss": -27.665943145751953, "global_step": 489026, "epoch": 5891} {"train_loss": -27.050262451171875, "global_step": 489027, "epoch": 5891} {"train_loss": -27.231359481811523, "global_step": 489028, "epoch": 5891} {"train_loss": -27.095579147338867, "global_step": 489029, "epoch": 5891} {"train_loss": -27.32358741760254, "global_step": 489030, "epoch": 5891} {"train_loss": -27.16108512878418, "global_step": 489031, "epoch": 5891} {"train_loss": -27.543893814086914, "global_step": 489032, "epoch": 5891} {"train_loss": -27.55974769592285, "global_step": 489033, "epoch": 5891} {"train_loss": -27.646276473999023, "global_step": 489034, "epoch": 5891} {"train_loss": -27.270987751972246, "global_step": 489035, "epoch": 5891, "val_loss": 6673520.0} {"train_loss": -27.14618492126465, "global_step": 489036, "epoch": 5892} {"train_loss": -27.23114013671875, "global_step": 489037, "epoch": 5892} {"train_loss": -26.858911514282227, "global_step": 489038, "epoch": 5892} {"train_loss": -26.99941062927246, "global_step": 489039, "epoch": 5892} {"train_loss": -26.770801544189453, "global_step": 489040, "epoch": 5892} {"train_loss": -27.57631492614746, "global_step": 489041, "epoch": 5892} {"train_loss": -26.902332305908203, "global_step": 489042, "epoch": 5892} {"train_loss": -27.0689640045166, "global_step": 489043, "epoch": 5892} {"train_loss": -27.3104190826416, "global_step": 489044, "epoch": 5892} {"train_loss": -27.2371883392334, "global_step": 489045, "epoch": 5892} {"train_loss": -27.061338424682617, "global_step": 489046, "epoch": 5892} {"train_loss": -27.100622177124023, "global_step": 489047, "epoch": 5892} {"train_loss": -27.61175537109375, "global_step": 489048, "epoch": 5892} {"train_loss": -27.2786808013916, "global_step": 489049, "epoch": 5892} {"train_loss": -26.90436363220215, "global_step": 489050, "epoch": 5892} {"train_loss": -27.40962028503418, "global_step": 489051, "epoch": 5892} {"train_loss": -26.95916175842285, "global_step": 489052, "epoch": 5892} {"train_loss": -27.112401962280273, "global_step": 489053, "epoch": 5892} {"train_loss": -26.97755241394043, "global_step": 489054, "epoch": 5892} {"train_loss": -26.8826847076416, "global_step": 489055, "epoch": 5892} {"train_loss": -26.73322868347168, "global_step": 489056, "epoch": 5892} {"train_loss": -26.968658447265625, "global_step": 489057, "epoch": 5892} {"train_loss": -26.79752540588379, "global_step": 489058, "epoch": 5892} {"train_loss": -27.3624210357666, "global_step": 489059, "epoch": 5892} {"train_loss": -26.87213134765625, "global_step": 489060, "epoch": 5892} {"train_loss": -27.3441219329834, "global_step": 489061, "epoch": 5892} {"train_loss": -27.402326583862305, "global_step": 489062, "epoch": 5892} {"train_loss": -27.187911987304688, "global_step": 489063, "epoch": 5892} {"train_loss": -27.29170036315918, "global_step": 489064, "epoch": 5892} {"train_loss": -27.099613189697266, "global_step": 489065, "epoch": 5892} {"train_loss": -27.260269165039062, "global_step": 489066, "epoch": 5892} {"train_loss": -27.345060348510742, "global_step": 489067, "epoch": 5892} {"train_loss": -27.3895320892334, "global_step": 489068, "epoch": 5892} {"train_loss": -27.18293571472168, "global_step": 489069, "epoch": 5892} {"train_loss": -27.354108810424805, "global_step": 489070, "epoch": 5892} {"train_loss": -27.481412887573242, "global_step": 489071, "epoch": 5892} {"train_loss": -27.377857208251953, "global_step": 489072, "epoch": 5892} {"train_loss": -27.733488082885742, "global_step": 489073, "epoch": 5892} {"train_loss": -27.46371841430664, "global_step": 489074, "epoch": 5892} {"train_loss": -27.416614532470703, "global_step": 489075, "epoch": 5892} {"train_loss": -27.56184196472168, "global_step": 489076, "epoch": 5892} {"train_loss": -27.509052276611328, "global_step": 489077, "epoch": 5892} {"train_loss": -27.011768341064453, "global_step": 489078, "epoch": 5892} {"train_loss": -27.492124557495117, "global_step": 489079, "epoch": 5892} {"train_loss": -27.432722091674805, "global_step": 489080, "epoch": 5892} {"train_loss": -27.539762496948242, "global_step": 489081, "epoch": 5892} {"train_loss": -27.495807647705078, "global_step": 489082, "epoch": 5892} {"train_loss": -27.262399673461914, "global_step": 489083, "epoch": 5892} {"train_loss": -27.307544708251953, "global_step": 489084, "epoch": 5892} {"train_loss": -27.1248836517334, "global_step": 489085, "epoch": 5892} {"train_loss": -27.724456787109375, "global_step": 489086, "epoch": 5892} {"train_loss": -27.664403915405273, "global_step": 489087, "epoch": 5892} {"train_loss": -27.315387725830078, "global_step": 489088, "epoch": 5892} {"train_loss": -27.355255126953125, "global_step": 489089, "epoch": 5892} {"train_loss": -27.344980239868164, "global_step": 489090, "epoch": 5892} {"train_loss": -27.6007137298584, "global_step": 489091, "epoch": 5892} {"train_loss": -27.237028121948242, "global_step": 489092, "epoch": 5892} {"train_loss": -27.3370304107666, "global_step": 489093, "epoch": 5892} {"train_loss": -27.5733699798584, "global_step": 489094, "epoch": 5892} {"train_loss": -27.53555679321289, "global_step": 489095, "epoch": 5892} {"train_loss": -27.588855743408203, "global_step": 489096, "epoch": 5892} {"train_loss": -27.107715606689453, "global_step": 489097, "epoch": 5892} {"train_loss": -27.47121238708496, "global_step": 489098, "epoch": 5892} {"train_loss": -27.52088737487793, "global_step": 489099, "epoch": 5892} {"train_loss": -27.416736602783203, "global_step": 489100, "epoch": 5892} {"train_loss": -27.35405921936035, "global_step": 489101, "epoch": 5892} {"train_loss": -27.58492088317871, "global_step": 489102, "epoch": 5892} {"train_loss": -27.404895782470703, "global_step": 489103, "epoch": 5892} {"train_loss": -27.36213493347168, "global_step": 489104, "epoch": 5892} {"train_loss": -27.04233169555664, "global_step": 489105, "epoch": 5892} {"train_loss": -27.191852569580078, "global_step": 489106, "epoch": 5892} {"train_loss": -26.952411651611328, "global_step": 489107, "epoch": 5892} {"train_loss": -26.97784996032715, "global_step": 489108, "epoch": 5892} {"train_loss": -27.170297622680664, "global_step": 489109, "epoch": 5892} {"train_loss": -27.068939208984375, "global_step": 489110, "epoch": 5892} {"train_loss": -27.354907989501953, "global_step": 489111, "epoch": 5892} {"train_loss": -27.583942413330078, "global_step": 489112, "epoch": 5892} {"train_loss": -27.426904678344727, "global_step": 489113, "epoch": 5892} {"train_loss": -26.990705490112305, "global_step": 489114, "epoch": 5892} {"train_loss": -27.512067794799805, "global_step": 489115, "epoch": 5892} {"train_loss": -26.9670352935791, "global_step": 489116, "epoch": 5892} {"train_loss": -27.296171188354492, "global_step": 489117, "epoch": 5892} {"train_loss": -27.25213857443936, "global_step": 489118, "epoch": 5892, "val_loss": 6625992.0} {"train_loss": -26.812055587768555, "global_step": 489119, "epoch": 5893} {"train_loss": -26.09577751159668, "global_step": 489120, "epoch": 5893} {"train_loss": -26.723447799682617, "global_step": 489121, "epoch": 5893} {"train_loss": -26.8065185546875, "global_step": 489122, "epoch": 5893} {"train_loss": -26.559188842773438, "global_step": 489123, "epoch": 5893} {"train_loss": -26.25723648071289, "global_step": 489124, "epoch": 5893} {"train_loss": -26.961008071899414, "global_step": 489125, "epoch": 5893} {"train_loss": -26.955759048461914, "global_step": 489126, "epoch": 5893} {"train_loss": -26.838998794555664, "global_step": 489127, "epoch": 5893} {"train_loss": -26.753707885742188, "global_step": 489128, "epoch": 5893} {"train_loss": -27.07187271118164, "global_step": 489129, "epoch": 5893} {"train_loss": -26.98084831237793, "global_step": 489130, "epoch": 5893} {"train_loss": -26.59864616394043, "global_step": 489131, "epoch": 5893} {"train_loss": -27.001943588256836, "global_step": 489132, "epoch": 5893} {"train_loss": -27.097028732299805, "global_step": 489133, "epoch": 5893} {"train_loss": -26.628759384155273, "global_step": 489134, "epoch": 5893} {"train_loss": -27.115039825439453, "global_step": 489135, "epoch": 5893} {"train_loss": -27.16859245300293, "global_step": 489136, "epoch": 5893} {"train_loss": -27.216962814331055, "global_step": 489137, "epoch": 5893} {"train_loss": -27.46705436706543, "global_step": 489138, "epoch": 5893} {"train_loss": -27.077289581298828, "global_step": 489139, "epoch": 5893} {"train_loss": -26.907968521118164, "global_step": 489140, "epoch": 5893} {"train_loss": -27.241018295288086, "global_step": 489141, "epoch": 5893} {"train_loss": -27.0640811920166, "global_step": 489142, "epoch": 5893} {"train_loss": -27.083887100219727, "global_step": 489143, "epoch": 5893} {"train_loss": -26.739566802978516, "global_step": 489144, "epoch": 5893} {"train_loss": -27.330429077148438, "global_step": 489145, "epoch": 5893} {"train_loss": -27.20368003845215, "global_step": 489146, "epoch": 5893} {"train_loss": -27.096845626831055, "global_step": 489147, "epoch": 5893} {"train_loss": -27.39764404296875, "global_step": 489148, "epoch": 5893} {"train_loss": -27.052505493164062, "global_step": 489149, "epoch": 5893} {"train_loss": -27.154651641845703, "global_step": 489150, "epoch": 5893} {"train_loss": -27.45147705078125, "global_step": 489151, "epoch": 5893} {"train_loss": -27.184478759765625, "global_step": 489152, "epoch": 5893} {"train_loss": -26.98316764831543, "global_step": 489153, "epoch": 5893} {"train_loss": -27.09832763671875, "global_step": 489154, "epoch": 5893} {"train_loss": -27.386037826538086, "global_step": 489155, "epoch": 5893} {"train_loss": -27.040088653564453, "global_step": 489156, "epoch": 5893} {"train_loss": -27.33088493347168, "global_step": 489157, "epoch": 5893} {"train_loss": -27.230499267578125, "global_step": 489158, "epoch": 5893} {"train_loss": -27.069910049438477, "global_step": 489159, "epoch": 5893} {"train_loss": -27.311676025390625, "global_step": 489160, "epoch": 5893} {"train_loss": -27.50172996520996, "global_step": 489161, "epoch": 5893} {"train_loss": -27.344654083251953, "global_step": 489162, "epoch": 5893} {"train_loss": -27.498096466064453, "global_step": 489163, "epoch": 5893} {"train_loss": -27.363245010375977, "global_step": 489164, "epoch": 5893} {"train_loss": -27.601272583007812, "global_step": 489165, "epoch": 5893} {"train_loss": -27.67176628112793, "global_step": 489166, "epoch": 5893} {"train_loss": -27.183374404907227, "global_step": 489167, "epoch": 5893} {"train_loss": -27.236602783203125, "global_step": 489168, "epoch": 5893} {"train_loss": -27.17933464050293, "global_step": 489169, "epoch": 5893} {"train_loss": -27.11805534362793, "global_step": 489170, "epoch": 5893} {"train_loss": -26.9472599029541, "global_step": 489171, "epoch": 5893} {"train_loss": -27.300764083862305, "global_step": 489172, "epoch": 5893} {"train_loss": -27.27030372619629, "global_step": 489173, "epoch": 5893} {"train_loss": -27.225635528564453, "global_step": 489174, "epoch": 5893} {"train_loss": -27.375244140625, "global_step": 489175, "epoch": 5893} {"train_loss": -27.547338485717773, "global_step": 489176, "epoch": 5893} {"train_loss": -27.232397079467773, "global_step": 489177, "epoch": 5893} {"train_loss": -27.59336280822754, "global_step": 489178, "epoch": 5893} {"train_loss": -27.4246768951416, "global_step": 489179, "epoch": 5893} {"train_loss": -27.409711837768555, "global_step": 489180, "epoch": 5893} {"train_loss": -27.327192306518555, "global_step": 489181, "epoch": 5893} {"train_loss": -27.7186222076416, "global_step": 489182, "epoch": 5893} {"train_loss": -27.439788818359375, "global_step": 489183, "epoch": 5893} {"train_loss": -27.56268882751465, "global_step": 489184, "epoch": 5893} {"train_loss": -27.239065170288086, "global_step": 489185, "epoch": 5893} {"train_loss": -27.40070915222168, "global_step": 489186, "epoch": 5893} {"train_loss": -27.641864776611328, "global_step": 489187, "epoch": 5893} {"train_loss": -27.275562286376953, "global_step": 489188, "epoch": 5893} {"train_loss": -27.679235458374023, "global_step": 489189, "epoch": 5893} {"train_loss": -27.337568283081055, "global_step": 489190, "epoch": 5893} {"train_loss": -26.848011016845703, "global_step": 489191, "epoch": 5893} {"train_loss": -27.176599502563477, "global_step": 489192, "epoch": 5893} {"train_loss": -27.381738662719727, "global_step": 489193, "epoch": 5893} {"train_loss": -27.038970947265625, "global_step": 489194, "epoch": 5893} {"train_loss": -27.4939022064209, "global_step": 489195, "epoch": 5893} {"train_loss": -27.216257095336914, "global_step": 489196, "epoch": 5893} {"train_loss": -26.982553482055664, "global_step": 489197, "epoch": 5893} {"train_loss": -27.442291259765625, "global_step": 489198, "epoch": 5893} {"train_loss": -27.50264549255371, "global_step": 489199, "epoch": 5893} {"train_loss": -27.3155460357666, "global_step": 489200, "epoch": 5893} {"train_loss": -27.18524128557688, "global_step": 489201, "epoch": 5893, "val_loss": 6723314.0} {"train_loss": -26.773595809936523, "global_step": 489202, "epoch": 5894} {"train_loss": -27.26673698425293, "global_step": 489203, "epoch": 5894} {"train_loss": -27.06683921813965, "global_step": 489204, "epoch": 5894} {"train_loss": -26.401641845703125, "global_step": 489205, "epoch": 5894} {"train_loss": -26.959644317626953, "global_step": 489206, "epoch": 5894} {"train_loss": -27.176345825195312, "global_step": 489207, "epoch": 5894} {"train_loss": -27.00479507446289, "global_step": 489208, "epoch": 5894} {"train_loss": -26.984006881713867, "global_step": 489209, "epoch": 5894} {"train_loss": -27.13054847717285, "global_step": 489210, "epoch": 5894} {"train_loss": -27.13605308532715, "global_step": 489211, "epoch": 5894} {"train_loss": -27.04013442993164, "global_step": 489212, "epoch": 5894} {"train_loss": -27.01447868347168, "global_step": 489213, "epoch": 5894} {"train_loss": -26.881093978881836, "global_step": 489214, "epoch": 5894} {"train_loss": -27.017322540283203, "global_step": 489215, "epoch": 5894} {"train_loss": -27.300113677978516, "global_step": 489216, "epoch": 5894} {"train_loss": -26.782596588134766, "global_step": 489217, "epoch": 5894} {"train_loss": -26.94508171081543, "global_step": 489218, "epoch": 5894} {"train_loss": -27.171873092651367, "global_step": 489219, "epoch": 5894} {"train_loss": -26.96815299987793, "global_step": 489220, "epoch": 5894} {"train_loss": -26.929855346679688, "global_step": 489221, "epoch": 5894} {"train_loss": -27.161148071289062, "global_step": 489222, "epoch": 5894} {"train_loss": -27.099578857421875, "global_step": 489223, "epoch": 5894} {"train_loss": -27.160619735717773, "global_step": 489224, "epoch": 5894} {"train_loss": -27.070117950439453, "global_step": 489225, "epoch": 5894} {"train_loss": -26.779382705688477, "global_step": 489226, "epoch": 5894} {"train_loss": -27.41887855529785, "global_step": 489227, "epoch": 5894} {"train_loss": -26.69874382019043, "global_step": 489228, "epoch": 5894} {"train_loss": -27.072650909423828, "global_step": 489229, "epoch": 5894} {"train_loss": -27.376501083374023, "global_step": 489230, "epoch": 5894} {"train_loss": -26.58930015563965, "global_step": 489231, "epoch": 5894} {"train_loss": -27.387714385986328, "global_step": 489232, "epoch": 5894} {"train_loss": -26.928258895874023, "global_step": 489233, "epoch": 5894} {"train_loss": -27.44927406311035, "global_step": 489234, "epoch": 5894} {"train_loss": -27.674243927001953, "global_step": 489235, "epoch": 5894} {"train_loss": -27.222339630126953, "global_step": 489236, "epoch": 5894} {"train_loss": -27.122236251831055, "global_step": 489237, "epoch": 5894} {"train_loss": -27.62946128845215, "global_step": 489238, "epoch": 5894} {"train_loss": -26.9074764251709, "global_step": 489239, "epoch": 5894} {"train_loss": -27.450336456298828, "global_step": 489240, "epoch": 5894} {"train_loss": -27.517724990844727, "global_step": 489241, "epoch": 5894} {"train_loss": -27.336477279663086, "global_step": 489242, "epoch": 5894} {"train_loss": -27.739282608032227, "global_step": 489243, "epoch": 5894} {"train_loss": -27.316965103149414, "global_step": 489244, "epoch": 5894} {"train_loss": -27.127201080322266, "global_step": 489245, "epoch": 5894} {"train_loss": -27.27276611328125, "global_step": 489246, "epoch": 5894} {"train_loss": -27.284894943237305, "global_step": 489247, "epoch": 5894} {"train_loss": -27.498525619506836, "global_step": 489248, "epoch": 5894} {"train_loss": -27.054229736328125, "global_step": 489249, "epoch": 5894} {"train_loss": -27.423847198486328, "global_step": 489250, "epoch": 5894} {"train_loss": -27.25801658630371, "global_step": 489251, "epoch": 5894} {"train_loss": -27.380542755126953, "global_step": 489252, "epoch": 5894} {"train_loss": -27.36968994140625, "global_step": 489253, "epoch": 5894} {"train_loss": -27.481678009033203, "global_step": 489254, "epoch": 5894} {"train_loss": -27.61272621154785, "global_step": 489255, "epoch": 5894} {"train_loss": -27.30393409729004, "global_step": 489256, "epoch": 5894} {"train_loss": -27.60637855529785, "global_step": 489257, "epoch": 5894} {"train_loss": -26.98853874206543, "global_step": 489258, "epoch": 5894} {"train_loss": -27.261127471923828, "global_step": 489259, "epoch": 5894} {"train_loss": -27.31076431274414, "global_step": 489260, "epoch": 5894} {"train_loss": -27.566003799438477, "global_step": 489261, "epoch": 5894} {"train_loss": -27.436742782592773, "global_step": 489262, "epoch": 5894} {"train_loss": -27.175107955932617, "global_step": 489263, "epoch": 5894} {"train_loss": -26.977386474609375, "global_step": 489264, "epoch": 5894} {"train_loss": -27.374073028564453, "global_step": 489265, "epoch": 5894} {"train_loss": -27.445215225219727, "global_step": 489266, "epoch": 5894} {"train_loss": -27.689298629760742, "global_step": 489267, "epoch": 5894} {"train_loss": -27.115924835205078, "global_step": 489268, "epoch": 5894} {"train_loss": -27.132354736328125, "global_step": 489269, "epoch": 5894} {"train_loss": -27.285009384155273, "global_step": 489270, "epoch": 5894} {"train_loss": -27.52082633972168, "global_step": 489271, "epoch": 5894} {"train_loss": -27.19722557067871, "global_step": 489272, "epoch": 5894} {"train_loss": -27.11248207092285, "global_step": 489273, "epoch": 5894} {"train_loss": -27.350955963134766, "global_step": 489274, "epoch": 5894} {"train_loss": -27.468591690063477, "global_step": 489275, "epoch": 5894} {"train_loss": -27.25727653503418, "global_step": 489276, "epoch": 5894} {"train_loss": -27.439289093017578, "global_step": 489277, "epoch": 5894} {"train_loss": -27.57227897644043, "global_step": 489278, "epoch": 5894} {"train_loss": -27.55707359313965, "global_step": 489279, "epoch": 5894} {"train_loss": -27.732202529907227, "global_step": 489280, "epoch": 5894} {"train_loss": -27.209369659423828, "global_step": 489281, "epoch": 5894} {"train_loss": -26.998449325561523, "global_step": 489282, "epoch": 5894} {"train_loss": -26.7985782623291, "global_step": 489283, "epoch": 5894} {"train_loss": -27.21884674623788, "global_step": 489284, "epoch": 5894, "val_loss": 6653047.0} {"train_loss": -26.639123916625977, "global_step": 489285, "epoch": 5895} {"train_loss": -27.20465087890625, "global_step": 489286, "epoch": 5895} {"train_loss": -27.186338424682617, "global_step": 489287, "epoch": 5895} {"train_loss": -26.64706802368164, "global_step": 489288, "epoch": 5895} {"train_loss": -26.669296264648438, "global_step": 489289, "epoch": 5895} {"train_loss": -25.709064483642578, "global_step": 489290, "epoch": 5895} {"train_loss": -26.498371124267578, "global_step": 489291, "epoch": 5895} {"train_loss": -27.078344345092773, "global_step": 489292, "epoch": 5895} {"train_loss": -27.1219425201416, "global_step": 489293, "epoch": 5895} {"train_loss": -27.043359756469727, "global_step": 489294, "epoch": 5895} {"train_loss": -26.773269653320312, "global_step": 489295, "epoch": 5895} {"train_loss": -27.0629940032959, "global_step": 489296, "epoch": 5895} {"train_loss": -27.112079620361328, "global_step": 489297, "epoch": 5895} {"train_loss": -27.18633460998535, "global_step": 489298, "epoch": 5895} {"train_loss": -27.298248291015625, "global_step": 489299, "epoch": 5895} {"train_loss": -27.044757843017578, "global_step": 489300, "epoch": 5895} {"train_loss": -27.226032257080078, "global_step": 489301, "epoch": 5895} {"train_loss": -27.54366111755371, "global_step": 489302, "epoch": 5895} {"train_loss": -27.05792236328125, "global_step": 489303, "epoch": 5895} {"train_loss": -27.10013771057129, "global_step": 489304, "epoch": 5895} {"train_loss": -26.796533584594727, "global_step": 489305, "epoch": 5895} {"train_loss": -26.7716121673584, "global_step": 489306, "epoch": 5895} {"train_loss": -27.1785945892334, "global_step": 489307, "epoch": 5895} {"train_loss": -27.176544189453125, "global_step": 489308, "epoch": 5895} {"train_loss": -27.501739501953125, "global_step": 489309, "epoch": 5895} {"train_loss": -26.98565101623535, "global_step": 489310, "epoch": 5895} {"train_loss": -27.109281539916992, "global_step": 489311, "epoch": 5895} {"train_loss": -27.08542823791504, "global_step": 489312, "epoch": 5895} {"train_loss": -27.258264541625977, "global_step": 489313, "epoch": 5895} {"train_loss": -27.45517921447754, "global_step": 489314, "epoch": 5895} {"train_loss": -27.02874183654785, "global_step": 489315, "epoch": 5895} {"train_loss": -27.5003604888916, "global_step": 489316, "epoch": 5895} {"train_loss": -27.26142692565918, "global_step": 489317, "epoch": 5895} {"train_loss": -27.12527847290039, "global_step": 489318, "epoch": 5895} {"train_loss": -27.4282283782959, "global_step": 489319, "epoch": 5895} {"train_loss": -27.219465255737305, "global_step": 489320, "epoch": 5895} {"train_loss": -27.14406394958496, "global_step": 489321, "epoch": 5895} {"train_loss": -27.25312614440918, "global_step": 489322, "epoch": 5895} {"train_loss": -27.44720458984375, "global_step": 489323, "epoch": 5895} {"train_loss": -27.277637481689453, "global_step": 489324, "epoch": 5895} {"train_loss": -27.577375411987305, "global_step": 489325, "epoch": 5895} {"train_loss": -27.56477165222168, "global_step": 489326, "epoch": 5895} {"train_loss": -27.164091110229492, "global_step": 489327, "epoch": 5895} {"train_loss": -27.448654174804688, "global_step": 489328, "epoch": 5895} {"train_loss": -27.295440673828125, "global_step": 489329, "epoch": 5895} {"train_loss": -27.30710792541504, "global_step": 489330, "epoch": 5895} {"train_loss": -27.339004516601562, "global_step": 489331, "epoch": 5895} {"train_loss": -27.724380493164062, "global_step": 489332, "epoch": 5895} {"train_loss": -27.16929054260254, "global_step": 489333, "epoch": 5895} {"train_loss": -27.659055709838867, "global_step": 489334, "epoch": 5895} {"train_loss": -27.181671142578125, "global_step": 489335, "epoch": 5895} {"train_loss": -27.56666374206543, "global_step": 489336, "epoch": 5895} {"train_loss": -27.617528915405273, "global_step": 489337, "epoch": 5895} {"train_loss": -27.45391845703125, "global_step": 489338, "epoch": 5895} {"train_loss": -27.290491104125977, "global_step": 489339, "epoch": 5895} {"train_loss": -27.181982040405273, "global_step": 489340, "epoch": 5895} {"train_loss": -27.437963485717773, "global_step": 489341, "epoch": 5895} {"train_loss": -26.639728546142578, "global_step": 489342, "epoch": 5895} {"train_loss": -26.317352294921875, "global_step": 489343, "epoch": 5895} {"train_loss": -26.80988883972168, "global_step": 489344, "epoch": 5895} {"train_loss": -27.07805824279785, "global_step": 489345, "epoch": 5895} {"train_loss": -26.84954261779785, "global_step": 489346, "epoch": 5895} {"train_loss": -27.234882354736328, "global_step": 489347, "epoch": 5895} {"train_loss": -26.910598754882812, "global_step": 489348, "epoch": 5895} {"train_loss": -27.030139923095703, "global_step": 489349, "epoch": 5895} {"train_loss": -26.392438888549805, "global_step": 489350, "epoch": 5895} {"train_loss": -26.981863021850586, "global_step": 489351, "epoch": 5895} {"train_loss": -26.788497924804688, "global_step": 489352, "epoch": 5895} {"train_loss": -26.974958419799805, "global_step": 489353, "epoch": 5895} {"train_loss": -27.225616455078125, "global_step": 489354, "epoch": 5895} {"train_loss": -27.201642990112305, "global_step": 489355, "epoch": 5895} {"train_loss": -27.107831954956055, "global_step": 489356, "epoch": 5895} {"train_loss": -26.84052848815918, "global_step": 489357, "epoch": 5895} {"train_loss": -27.228498458862305, "global_step": 489358, "epoch": 5895} {"train_loss": -27.126123428344727, "global_step": 489359, "epoch": 5895} {"train_loss": -27.30499267578125, "global_step": 489360, "epoch": 5895} {"train_loss": -27.04233169555664, "global_step": 489361, "epoch": 5895} {"train_loss": -27.30198097229004, "global_step": 489362, "epoch": 5895} {"train_loss": -27.17380142211914, "global_step": 489363, "epoch": 5895} {"train_loss": -27.26751708984375, "global_step": 489364, "epoch": 5895} {"train_loss": -27.043527603149414, "global_step": 489365, "epoch": 5895} {"train_loss": -27.044544219970703, "global_step": 489366, "epoch": 5895} {"train_loss": -27.113620091633624, "global_step": 489367, "epoch": 5895, "val_loss": 6674523.0} {"train_loss": -27.161848068237305, "global_step": 489368, "epoch": 5896} {"train_loss": -26.961454391479492, "global_step": 489369, "epoch": 5896} {"train_loss": -26.8409366607666, "global_step": 489370, "epoch": 5896} {"train_loss": -26.6793270111084, "global_step": 489371, "epoch": 5896} {"train_loss": -27.365631103515625, "global_step": 489372, "epoch": 5896} {"train_loss": -26.70521354675293, "global_step": 489373, "epoch": 5896} {"train_loss": -26.838184356689453, "global_step": 489374, "epoch": 5896} {"train_loss": -26.892642974853516, "global_step": 489375, "epoch": 5896} {"train_loss": -26.3018798828125, "global_step": 489376, "epoch": 5896} {"train_loss": -26.383710861206055, "global_step": 489377, "epoch": 5896} {"train_loss": -27.286142349243164, "global_step": 489378, "epoch": 5896} {"train_loss": -26.61527442932129, "global_step": 489379, "epoch": 5896} {"train_loss": -26.636993408203125, "global_step": 489380, "epoch": 5896} {"train_loss": -26.88039207458496, "global_step": 489381, "epoch": 5896} {"train_loss": -26.9534969329834, "global_step": 489382, "epoch": 5896} {"train_loss": -26.257970809936523, "global_step": 489383, "epoch": 5896} {"train_loss": -27.202478408813477, "global_step": 489384, "epoch": 5896} {"train_loss": -26.578338623046875, "global_step": 489385, "epoch": 5896} {"train_loss": -26.65448570251465, "global_step": 489386, "epoch": 5896} {"train_loss": -27.03082847595215, "global_step": 489387, "epoch": 5896} {"train_loss": -27.290082931518555, "global_step": 489388, "epoch": 5896} {"train_loss": -27.000385284423828, "global_step": 489389, "epoch": 5896} {"train_loss": -27.008161544799805, "global_step": 489390, "epoch": 5896} {"train_loss": -26.8256893157959, "global_step": 489391, "epoch": 5896} {"train_loss": -27.134912490844727, "global_step": 489392, "epoch": 5896} {"train_loss": -27.09404945373535, "global_step": 489393, "epoch": 5896} {"train_loss": -26.879276275634766, "global_step": 489394, "epoch": 5896} {"train_loss": -27.138654708862305, "global_step": 489395, "epoch": 5896} {"train_loss": -27.32232666015625, "global_step": 489396, "epoch": 5896} {"train_loss": -27.0175724029541, "global_step": 489397, "epoch": 5896} {"train_loss": -27.54058837890625, "global_step": 489398, "epoch": 5896} {"train_loss": -27.10626220703125, "global_step": 489399, "epoch": 5896} {"train_loss": -27.332733154296875, "global_step": 489400, "epoch": 5896} {"train_loss": -27.516103744506836, "global_step": 489401, "epoch": 5896} {"train_loss": -27.35502052307129, "global_step": 489402, "epoch": 5896} {"train_loss": -27.37454605102539, "global_step": 489403, "epoch": 5896} {"train_loss": -27.3072452545166, "global_step": 489404, "epoch": 5896} {"train_loss": -27.615070343017578, "global_step": 489405, "epoch": 5896} {"train_loss": -27.638214111328125, "global_step": 489406, "epoch": 5896} {"train_loss": -27.472997665405273, "global_step": 489407, "epoch": 5896} {"train_loss": -27.24306297302246, "global_step": 489408, "epoch": 5896} {"train_loss": -27.056354522705078, "global_step": 489409, "epoch": 5896} {"train_loss": -27.498661041259766, "global_step": 489410, "epoch": 5896} {"train_loss": -27.26753044128418, "global_step": 489411, "epoch": 5896} {"train_loss": -27.353107452392578, "global_step": 489412, "epoch": 5896} {"train_loss": -27.43349266052246, "global_step": 489413, "epoch": 5896} {"train_loss": -27.21284294128418, "global_step": 489414, "epoch": 5896} {"train_loss": -27.025876998901367, "global_step": 489415, "epoch": 5896} {"train_loss": -27.195398330688477, "global_step": 489416, "epoch": 5896} {"train_loss": -27.324146270751953, "global_step": 489417, "epoch": 5896} {"train_loss": -27.12631607055664, "global_step": 489418, "epoch": 5896} {"train_loss": -27.48439598083496, "global_step": 489419, "epoch": 5896} {"train_loss": -27.1595516204834, "global_step": 489420, "epoch": 5896} {"train_loss": -27.790817260742188, "global_step": 489421, "epoch": 5896} {"train_loss": -27.675079345703125, "global_step": 489422, "epoch": 5896} {"train_loss": -27.366308212280273, "global_step": 489423, "epoch": 5896} {"train_loss": -27.391626358032227, "global_step": 489424, "epoch": 5896} {"train_loss": -27.267858505249023, "global_step": 489425, "epoch": 5896} {"train_loss": -27.421966552734375, "global_step": 489426, "epoch": 5896} {"train_loss": -27.61393165588379, "global_step": 489427, "epoch": 5896} {"train_loss": -27.610107421875, "global_step": 489428, "epoch": 5896} {"train_loss": -27.43430519104004, "global_step": 489429, "epoch": 5896} {"train_loss": -27.393217086791992, "global_step": 489430, "epoch": 5896} {"train_loss": -27.36982536315918, "global_step": 489431, "epoch": 5896} {"train_loss": -27.244287490844727, "global_step": 489432, "epoch": 5896} {"train_loss": -27.558813095092773, "global_step": 489433, "epoch": 5896} {"train_loss": -27.4676456451416, "global_step": 489434, "epoch": 5896} {"train_loss": -27.959152221679688, "global_step": 489435, "epoch": 5896} {"train_loss": -27.47930908203125, "global_step": 489436, "epoch": 5896} {"train_loss": -27.392364501953125, "global_step": 489437, "epoch": 5896} {"train_loss": -27.153564453125, "global_step": 489438, "epoch": 5896} {"train_loss": -27.319950103759766, "global_step": 489439, "epoch": 5896} {"train_loss": -27.368728637695312, "global_step": 489440, "epoch": 5896} {"train_loss": -27.328815460205078, "global_step": 489441, "epoch": 5896} {"train_loss": -27.239389419555664, "global_step": 489442, "epoch": 5896} {"train_loss": -26.964691162109375, "global_step": 489443, "epoch": 5896} {"train_loss": -27.00848960876465, "global_step": 489444, "epoch": 5896} {"train_loss": -27.44501304626465, "global_step": 489445, "epoch": 5896} {"train_loss": -27.14875602722168, "global_step": 489446, "epoch": 5896} {"train_loss": -27.69400978088379, "global_step": 489447, "epoch": 5896} {"train_loss": -27.651172637939453, "global_step": 489448, "epoch": 5896} {"train_loss": -27.114227294921875, "global_step": 489449, "epoch": 5896} {"train_loss": -27.198709464934936, "global_step": 489450, "epoch": 5896, "val_loss": 6709889.0} {"train_loss": -26.4527645111084, "global_step": 489451, "epoch": 5897} {"train_loss": -24.8629150390625, "global_step": 489452, "epoch": 5897} {"train_loss": -24.641061782836914, "global_step": 489453, "epoch": 5897} {"train_loss": -26.163257598876953, "global_step": 489454, "epoch": 5897} {"train_loss": -26.2708797454834, "global_step": 489455, "epoch": 5897} {"train_loss": -25.026866912841797, "global_step": 489456, "epoch": 5897} {"train_loss": -26.282617568969727, "global_step": 489457, "epoch": 5897} {"train_loss": -26.12965202331543, "global_step": 489458, "epoch": 5897} {"train_loss": -26.181140899658203, "global_step": 489459, "epoch": 5897} {"train_loss": -26.420429229736328, "global_step": 489460, "epoch": 5897} {"train_loss": -26.21046257019043, "global_step": 489461, "epoch": 5897} {"train_loss": -26.150882720947266, "global_step": 489462, "epoch": 5897} {"train_loss": -26.382099151611328, "global_step": 489463, "epoch": 5897} {"train_loss": -26.3839111328125, "global_step": 489464, "epoch": 5897} {"train_loss": -26.329294204711914, "global_step": 489465, "epoch": 5897} {"train_loss": -26.745529174804688, "global_step": 489466, "epoch": 5897} {"train_loss": -26.486974716186523, "global_step": 489467, "epoch": 5897} {"train_loss": -26.068078994750977, "global_step": 489468, "epoch": 5897} {"train_loss": -26.706205368041992, "global_step": 489469, "epoch": 5897} {"train_loss": -26.803180694580078, "global_step": 489470, "epoch": 5897} {"train_loss": -26.625234603881836, "global_step": 489471, "epoch": 5897} {"train_loss": -26.678699493408203, "global_step": 489472, "epoch": 5897} {"train_loss": -26.755598068237305, "global_step": 489473, "epoch": 5897} {"train_loss": -26.902692794799805, "global_step": 489474, "epoch": 5897} {"train_loss": -26.64350700378418, "global_step": 489475, "epoch": 5897} {"train_loss": -26.90265464782715, "global_step": 489476, "epoch": 5897} {"train_loss": -27.277799606323242, "global_step": 489477, "epoch": 5897} {"train_loss": -27.125112533569336, "global_step": 489478, "epoch": 5897} {"train_loss": -26.985687255859375, "global_step": 489479, "epoch": 5897} {"train_loss": -26.890308380126953, "global_step": 489480, "epoch": 5897} {"train_loss": -27.02353858947754, "global_step": 489481, "epoch": 5897} {"train_loss": -27.167789459228516, "global_step": 489482, "epoch": 5897} {"train_loss": -27.11065101623535, "global_step": 489483, "epoch": 5897} {"train_loss": -27.294452667236328, "global_step": 489484, "epoch": 5897} {"train_loss": -26.95521354675293, "global_step": 489485, "epoch": 5897} {"train_loss": -27.33416175842285, "global_step": 489486, "epoch": 5897} {"train_loss": -27.148101806640625, "global_step": 489487, "epoch": 5897} {"train_loss": -27.563573837280273, "global_step": 489488, "epoch": 5897} {"train_loss": -26.9591064453125, "global_step": 489489, "epoch": 5897} {"train_loss": -27.170347213745117, "global_step": 489490, "epoch": 5897} {"train_loss": -27.441852569580078, "global_step": 489491, "epoch": 5897} {"train_loss": -27.20169448852539, "global_step": 489492, "epoch": 5897} {"train_loss": -27.192611694335938, "global_step": 489493, "epoch": 5897} {"train_loss": -27.59393882751465, "global_step": 489494, "epoch": 5897} {"train_loss": -27.533803939819336, "global_step": 489495, "epoch": 5897} {"train_loss": -26.912221908569336, "global_step": 489496, "epoch": 5897} {"train_loss": -27.40618324279785, "global_step": 489497, "epoch": 5897} {"train_loss": -27.10052490234375, "global_step": 489498, "epoch": 5897} {"train_loss": -27.525989532470703, "global_step": 489499, "epoch": 5897} {"train_loss": -27.629138946533203, "global_step": 489500, "epoch": 5897} {"train_loss": -27.289113998413086, "global_step": 489501, "epoch": 5897} {"train_loss": -27.40777015686035, "global_step": 489502, "epoch": 5897} {"train_loss": -27.67083168029785, "global_step": 489503, "epoch": 5897} {"train_loss": -27.251911163330078, "global_step": 489504, "epoch": 5897} {"train_loss": -27.617223739624023, "global_step": 489505, "epoch": 5897} {"train_loss": -27.882816314697266, "global_step": 489506, "epoch": 5897} {"train_loss": -27.614303588867188, "global_step": 489507, "epoch": 5897} {"train_loss": -27.870532989501953, "global_step": 489508, "epoch": 5897} {"train_loss": -27.534780502319336, "global_step": 489509, "epoch": 5897} {"train_loss": -27.647207260131836, "global_step": 489510, "epoch": 5897} {"train_loss": -27.653888702392578, "global_step": 489511, "epoch": 5897} {"train_loss": -27.55731773376465, "global_step": 489512, "epoch": 5897} {"train_loss": -27.648168563842773, "global_step": 489513, "epoch": 5897} {"train_loss": -27.341419219970703, "global_step": 489514, "epoch": 5897} {"train_loss": -27.117752075195312, "global_step": 489515, "epoch": 5897} {"train_loss": -26.840002059936523, "global_step": 489516, "epoch": 5897} {"train_loss": -27.312768936157227, "global_step": 489517, "epoch": 5897} {"train_loss": -27.23762321472168, "global_step": 489518, "epoch": 5897} {"train_loss": -27.3671932220459, "global_step": 489519, "epoch": 5897} {"train_loss": -27.2305908203125, "global_step": 489520, "epoch": 5897} {"train_loss": -27.12823486328125, "global_step": 489521, "epoch": 5897} {"train_loss": -27.283466339111328, "global_step": 489522, "epoch": 5897} {"train_loss": -27.7562313079834, "global_step": 489523, "epoch": 5897} {"train_loss": -27.18500328063965, "global_step": 489524, "epoch": 5897} {"train_loss": -27.285348892211914, "global_step": 489525, "epoch": 5897} {"train_loss": -27.3373966217041, "global_step": 489526, "epoch": 5897} {"train_loss": -27.4301700592041, "global_step": 489527, "epoch": 5897} {"train_loss": -27.341724395751953, "global_step": 489528, "epoch": 5897} {"train_loss": -27.493799209594727, "global_step": 489529, "epoch": 5897} {"train_loss": -27.413345336914062, "global_step": 489530, "epoch": 5897} {"train_loss": -27.332433700561523, "global_step": 489531, "epoch": 5897} {"train_loss": -27.539243698120117, "global_step": 489532, "epoch": 5897} {"train_loss": -27.00861747006336, "global_step": 489533, "epoch": 5897, "val_loss": 6762854.0} {"train_loss": -27.063337326049805, "global_step": 489534, "epoch": 5898} {"train_loss": -26.8918514251709, "global_step": 489535, "epoch": 5898} {"train_loss": -26.62613296508789, "global_step": 489536, "epoch": 5898} {"train_loss": -26.257598876953125, "global_step": 489537, "epoch": 5898} {"train_loss": -26.288135528564453, "global_step": 489538, "epoch": 5898} {"train_loss": -26.98835563659668, "global_step": 489539, "epoch": 5898} {"train_loss": -27.156295776367188, "global_step": 489540, "epoch": 5898} {"train_loss": -27.51141357421875, "global_step": 489541, "epoch": 5898} {"train_loss": -27.416595458984375, "global_step": 489542, "epoch": 5898} {"train_loss": -27.356698989868164, "global_step": 489543, "epoch": 5898} {"train_loss": -26.791183471679688, "global_step": 489544, "epoch": 5898} {"train_loss": -27.355945587158203, "global_step": 489545, "epoch": 5898} {"train_loss": -27.42396354675293, "global_step": 489546, "epoch": 5898} {"train_loss": -27.5074520111084, "global_step": 489547, "epoch": 5898} {"train_loss": -27.095361709594727, "global_step": 489548, "epoch": 5898} {"train_loss": -27.014892578125, "global_step": 489549, "epoch": 5898} {"train_loss": -27.033903121948242, "global_step": 489550, "epoch": 5898} {"train_loss": -27.25111198425293, "global_step": 489551, "epoch": 5898} {"train_loss": -27.237003326416016, "global_step": 489552, "epoch": 5898} {"train_loss": -27.412145614624023, "global_step": 489553, "epoch": 5898} {"train_loss": -27.20240592956543, "global_step": 489554, "epoch": 5898} {"train_loss": -27.369115829467773, "global_step": 489555, "epoch": 5898} {"train_loss": -27.28033447265625, "global_step": 489556, "epoch": 5898} {"train_loss": -27.778610229492188, "global_step": 489557, "epoch": 5898} {"train_loss": -27.351232528686523, "global_step": 489558, "epoch": 5898} {"train_loss": -27.437612533569336, "global_step": 489559, "epoch": 5898} {"train_loss": -27.38360023498535, "global_step": 489560, "epoch": 5898} {"train_loss": -27.543930053710938, "global_step": 489561, "epoch": 5898} {"train_loss": -26.94020652770996, "global_step": 489562, "epoch": 5898} {"train_loss": -27.3530216217041, "global_step": 489563, "epoch": 5898} {"train_loss": -27.477039337158203, "global_step": 489564, "epoch": 5898} {"train_loss": -27.797870635986328, "global_step": 489565, "epoch": 5898} {"train_loss": -27.203128814697266, "global_step": 489566, "epoch": 5898} {"train_loss": -27.35984230041504, "global_step": 489567, "epoch": 5898} {"train_loss": -27.210424423217773, "global_step": 489568, "epoch": 5898} {"train_loss": -27.442434310913086, "global_step": 489569, "epoch": 5898} {"train_loss": -27.143239974975586, "global_step": 489570, "epoch": 5898} {"train_loss": -27.39871597290039, "global_step": 489571, "epoch": 5898} {"train_loss": -27.545007705688477, "global_step": 489572, "epoch": 5898} {"train_loss": -27.553680419921875, "global_step": 489573, "epoch": 5898} {"train_loss": -27.3955020904541, "global_step": 489574, "epoch": 5898} {"train_loss": -27.09406089782715, "global_step": 489575, "epoch": 5898} {"train_loss": -26.977130889892578, "global_step": 489576, "epoch": 5898} {"train_loss": -27.13010597229004, "global_step": 489577, "epoch": 5898} {"train_loss": -27.379718780517578, "global_step": 489578, "epoch": 5898} {"train_loss": -27.55413246154785, "global_step": 489579, "epoch": 5898} {"train_loss": -27.53509521484375, "global_step": 489580, "epoch": 5898} {"train_loss": -27.150354385375977, "global_step": 489581, "epoch": 5898} {"train_loss": -27.424543380737305, "global_step": 489582, "epoch": 5898} {"train_loss": -27.804351806640625, "global_step": 489583, "epoch": 5898} {"train_loss": -27.364362716674805, "global_step": 489584, "epoch": 5898} {"train_loss": -27.279821395874023, "global_step": 489585, "epoch": 5898} {"train_loss": -27.537511825561523, "global_step": 489586, "epoch": 5898} {"train_loss": -27.42915153503418, "global_step": 489587, "epoch": 5898} {"train_loss": -27.095075607299805, "global_step": 489588, "epoch": 5898} {"train_loss": -27.087976455688477, "global_step": 489589, "epoch": 5898} {"train_loss": -27.109777450561523, "global_step": 489590, "epoch": 5898} {"train_loss": -27.366668701171875, "global_step": 489591, "epoch": 5898} {"train_loss": -26.976877212524414, "global_step": 489592, "epoch": 5898} {"train_loss": -27.219221115112305, "global_step": 489593, "epoch": 5898} {"train_loss": -26.631174087524414, "global_step": 489594, "epoch": 5898} {"train_loss": -26.92030143737793, "global_step": 489595, "epoch": 5898} {"train_loss": -27.500646591186523, "global_step": 489596, "epoch": 5898} {"train_loss": -27.172285079956055, "global_step": 489597, "epoch": 5898} {"train_loss": -27.138761520385742, "global_step": 489598, "epoch": 5898} {"train_loss": -27.304712295532227, "global_step": 489599, "epoch": 5898} {"train_loss": -27.077085494995117, "global_step": 489600, "epoch": 5898} {"train_loss": -27.022748947143555, "global_step": 489601, "epoch": 5898} {"train_loss": -27.309049606323242, "global_step": 489602, "epoch": 5898} {"train_loss": -27.4145565032959, "global_step": 489603, "epoch": 5898} {"train_loss": -27.323444366455078, "global_step": 489604, "epoch": 5898} {"train_loss": -27.740636825561523, "global_step": 489605, "epoch": 5898} {"train_loss": -27.558124542236328, "global_step": 489606, "epoch": 5898} {"train_loss": -27.23223304748535, "global_step": 489607, "epoch": 5898} {"train_loss": -27.4548282623291, "global_step": 489608, "epoch": 5898} {"train_loss": -27.412372589111328, "global_step": 489609, "epoch": 5898} {"train_loss": -27.385467529296875, "global_step": 489610, "epoch": 5898} {"train_loss": -27.652027130126953, "global_step": 489611, "epoch": 5898} {"train_loss": -27.2454891204834, "global_step": 489612, "epoch": 5898} {"train_loss": -27.440332412719727, "global_step": 489613, "epoch": 5898} {"train_loss": -27.14137077331543, "global_step": 489614, "epoch": 5898} {"train_loss": -27.34173583984375, "global_step": 489615, "epoch": 5898} {"train_loss": -27.2726769964379, "global_step": 489616, "epoch": 5898, "val_loss": 6761410.0} {"train_loss": -26.515552520751953, "global_step": 489617, "epoch": 5899} {"train_loss": -27.146682739257812, "global_step": 489618, "epoch": 5899} {"train_loss": -27.008716583251953, "global_step": 489619, "epoch": 5899} {"train_loss": -27.155359268188477, "global_step": 489620, "epoch": 5899} {"train_loss": -26.759429931640625, "global_step": 489621, "epoch": 5899} {"train_loss": -27.566238403320312, "global_step": 489622, "epoch": 5899} {"train_loss": -27.304853439331055, "global_step": 489623, "epoch": 5899} {"train_loss": -26.862272262573242, "global_step": 489624, "epoch": 5899} {"train_loss": -27.052692413330078, "global_step": 489625, "epoch": 5899} {"train_loss": -27.12424659729004, "global_step": 489626, "epoch": 5899} {"train_loss": -27.06196403503418, "global_step": 489627, "epoch": 5899} {"train_loss": -26.909931182861328, "global_step": 489628, "epoch": 5899} {"train_loss": -27.1019344329834, "global_step": 489629, "epoch": 5899} {"train_loss": -27.468175888061523, "global_step": 489630, "epoch": 5899} {"train_loss": -27.24903678894043, "global_step": 489631, "epoch": 5899} {"train_loss": -26.764135360717773, "global_step": 489632, "epoch": 5899} {"train_loss": -26.88850975036621, "global_step": 489633, "epoch": 5899} {"train_loss": -27.169790267944336, "global_step": 489634, "epoch": 5899} {"train_loss": -27.151905059814453, "global_step": 489635, "epoch": 5899} {"train_loss": -27.199182510375977, "global_step": 489636, "epoch": 5899} {"train_loss": -27.31452751159668, "global_step": 489637, "epoch": 5899} {"train_loss": -27.151269912719727, "global_step": 489638, "epoch": 5899} {"train_loss": -27.059091567993164, "global_step": 489639, "epoch": 5899} {"train_loss": -27.21624755859375, "global_step": 489640, "epoch": 5899} {"train_loss": -27.501928329467773, "global_step": 489641, "epoch": 5899} {"train_loss": -27.37641716003418, "global_step": 489642, "epoch": 5899} {"train_loss": -27.59023094177246, "global_step": 489643, "epoch": 5899} {"train_loss": -27.603443145751953, "global_step": 489644, "epoch": 5899} {"train_loss": -27.498044967651367, "global_step": 489645, "epoch": 5899} {"train_loss": -27.24810218811035, "global_step": 489646, "epoch": 5899} {"train_loss": -27.373855590820312, "global_step": 489647, "epoch": 5899} {"train_loss": -27.2293643951416, "global_step": 489648, "epoch": 5899} {"train_loss": -27.32301902770996, "global_step": 489649, "epoch": 5899} {"train_loss": -27.26605796813965, "global_step": 489650, "epoch": 5899} {"train_loss": -27.71204948425293, "global_step": 489651, "epoch": 5899} {"train_loss": -27.462797164916992, "global_step": 489652, "epoch": 5899} {"train_loss": -27.542821884155273, "global_step": 489653, "epoch": 5899} {"train_loss": -27.5614013671875, "global_step": 489654, "epoch": 5899} {"train_loss": -27.0438232421875, "global_step": 489655, "epoch": 5899} {"train_loss": -27.5443115234375, "global_step": 489656, "epoch": 5899} {"train_loss": -27.159894943237305, "global_step": 489657, "epoch": 5899} {"train_loss": -27.16655921936035, "global_step": 489658, "epoch": 5899} {"train_loss": -27.197492599487305, "global_step": 489659, "epoch": 5899} {"train_loss": -26.6055850982666, "global_step": 489660, "epoch": 5899} {"train_loss": -26.662809371948242, "global_step": 489661, "epoch": 5899} {"train_loss": -26.902658462524414, "global_step": 489662, "epoch": 5899} {"train_loss": -27.265100479125977, "global_step": 489663, "epoch": 5899} {"train_loss": -26.74814796447754, "global_step": 489664, "epoch": 5899} {"train_loss": -27.093915939331055, "global_step": 489665, "epoch": 5899} {"train_loss": -27.110437393188477, "global_step": 489666, "epoch": 5899} {"train_loss": -26.9361629486084, "global_step": 489667, "epoch": 5899} {"train_loss": -27.3941593170166, "global_step": 489668, "epoch": 5899} {"train_loss": -26.720733642578125, "global_step": 489669, "epoch": 5899} {"train_loss": -26.81435203552246, "global_step": 489670, "epoch": 5899} {"train_loss": -27.202558517456055, "global_step": 489671, "epoch": 5899} {"train_loss": -27.164752960205078, "global_step": 489672, "epoch": 5899} {"train_loss": -26.983129501342773, "global_step": 489673, "epoch": 5899} {"train_loss": -27.3828182220459, "global_step": 489674, "epoch": 5899} {"train_loss": -26.836286544799805, "global_step": 489675, "epoch": 5899} {"train_loss": -27.169538497924805, "global_step": 489676, "epoch": 5899} {"train_loss": -27.157764434814453, "global_step": 489677, "epoch": 5899} {"train_loss": -26.862384796142578, "global_step": 489678, "epoch": 5899} {"train_loss": -27.076873779296875, "global_step": 489679, "epoch": 5899} {"train_loss": -27.255319595336914, "global_step": 489680, "epoch": 5899} {"train_loss": -26.578723907470703, "global_step": 489681, "epoch": 5899} {"train_loss": -27.415267944335938, "global_step": 489682, "epoch": 5899} {"train_loss": -27.242639541625977, "global_step": 489683, "epoch": 5899} {"train_loss": -27.038488388061523, "global_step": 489684, "epoch": 5899} {"train_loss": -27.497583389282227, "global_step": 489685, "epoch": 5899} {"train_loss": -27.018884658813477, "global_step": 489686, "epoch": 5899} {"train_loss": -27.372854232788086, "global_step": 489687, "epoch": 5899} {"train_loss": -26.972766876220703, "global_step": 489688, "epoch": 5899} {"train_loss": -27.064783096313477, "global_step": 489689, "epoch": 5899} {"train_loss": -26.95778465270996, "global_step": 489690, "epoch": 5899} {"train_loss": -27.360456466674805, "global_step": 489691, "epoch": 5899} {"train_loss": -26.814863204956055, "global_step": 489692, "epoch": 5899} {"train_loss": -27.276718139648438, "global_step": 489693, "epoch": 5899} {"train_loss": -27.769235610961914, "global_step": 489694, "epoch": 5899} {"train_loss": -27.606521606445312, "global_step": 489695, "epoch": 5899} {"train_loss": -27.5584716796875, "global_step": 489696, "epoch": 5899} {"train_loss": -27.457670211791992, "global_step": 489697, "epoch": 5899} {"train_loss": -27.674802780151367, "global_step": 489698, "epoch": 5899} {"train_loss": -27.170839953135296, "global_step": 489699, "epoch": 5899, "val_loss": 6677549.5} {"train_loss": -27.141592025756836, "global_step": 489700, "epoch": 5900} {"train_loss": -26.724746704101562, "global_step": 489701, "epoch": 5900} {"train_loss": -27.049955368041992, "global_step": 489702, "epoch": 5900} {"train_loss": -26.638662338256836, "global_step": 489703, "epoch": 5900} {"train_loss": -26.52011489868164, "global_step": 489704, "epoch": 5900} {"train_loss": -26.669235229492188, "global_step": 489705, "epoch": 5900} {"train_loss": -27.164281845092773, "global_step": 489706, "epoch": 5900} {"train_loss": -27.120031356811523, "global_step": 489707, "epoch": 5900} {"train_loss": -26.608911514282227, "global_step": 489708, "epoch": 5900} {"train_loss": -26.75271987915039, "global_step": 489709, "epoch": 5900} {"train_loss": -27.2850341796875, "global_step": 489710, "epoch": 5900} {"train_loss": -26.94459342956543, "global_step": 489711, "epoch": 5900} {"train_loss": -27.119861602783203, "global_step": 489712, "epoch": 5900} {"train_loss": -27.30293083190918, "global_step": 489713, "epoch": 5900} {"train_loss": -26.97175407409668, "global_step": 489714, "epoch": 5900} {"train_loss": -27.127288818359375, "global_step": 489715, "epoch": 5900} {"train_loss": -27.346118927001953, "global_step": 489716, "epoch": 5900} {"train_loss": -27.2169132232666, "global_step": 489717, "epoch": 5900} {"train_loss": -27.325910568237305, "global_step": 489718, "epoch": 5900} {"train_loss": -27.624338150024414, "global_step": 489719, "epoch": 5900} {"train_loss": -27.542768478393555, "global_step": 489720, "epoch": 5900} {"train_loss": -27.43128776550293, "global_step": 489721, "epoch": 5900} {"train_loss": -27.166248321533203, "global_step": 489722, "epoch": 5900} {"train_loss": -27.789112091064453, "global_step": 489723, "epoch": 5900} {"train_loss": -27.627233505249023, "global_step": 489724, "epoch": 5900} {"train_loss": -27.508657455444336, "global_step": 489725, "epoch": 5900} {"train_loss": -27.270383834838867, "global_step": 489726, "epoch": 5900} {"train_loss": -27.402664184570312, "global_step": 489727, "epoch": 5900} {"train_loss": -27.35223960876465, "global_step": 489728, "epoch": 5900} {"train_loss": -27.768024444580078, "global_step": 489729, "epoch": 5900} {"train_loss": -26.97230339050293, "global_step": 489730, "epoch": 5900} {"train_loss": -27.662275314331055, "global_step": 489731, "epoch": 5900} {"train_loss": -27.4194278717041, "global_step": 489732, "epoch": 5900} {"train_loss": -27.109434127807617, "global_step": 489733, "epoch": 5900} {"train_loss": -27.332427978515625, "global_step": 489734, "epoch": 5900} {"train_loss": -27.488143920898438, "global_step": 489735, "epoch": 5900} {"train_loss": -27.610876083374023, "global_step": 489736, "epoch": 5900} {"train_loss": -27.241744995117188, "global_step": 489737, "epoch": 5900} {"train_loss": -27.533756256103516, "global_step": 489738, "epoch": 5900} {"train_loss": -27.667409896850586, "global_step": 489739, "epoch": 5900} {"train_loss": -27.497167587280273, "global_step": 489740, "epoch": 5900} {"train_loss": -27.30963134765625, "global_step": 489741, "epoch": 5900} {"train_loss": -27.16901206970215, "global_step": 489742, "epoch": 5900} {"train_loss": -27.278371810913086, "global_step": 489743, "epoch": 5900} {"train_loss": -27.315311431884766, "global_step": 489744, "epoch": 5900} {"train_loss": -27.338354110717773, "global_step": 489745, "epoch": 5900} {"train_loss": -27.364044189453125, "global_step": 489746, "epoch": 5900} {"train_loss": -27.483509063720703, "global_step": 489747, "epoch": 5900} {"train_loss": -27.3347110748291, "global_step": 489748, "epoch": 5900} {"train_loss": -27.012052536010742, "global_step": 489749, "epoch": 5900} {"train_loss": -27.30476188659668, "global_step": 489750, "epoch": 5900} {"train_loss": -26.943450927734375, "global_step": 489751, "epoch": 5900} {"train_loss": -27.389368057250977, "global_step": 489752, "epoch": 5900} {"train_loss": -27.250110626220703, "global_step": 489753, "epoch": 5900} {"train_loss": -27.61008071899414, "global_step": 489754, "epoch": 5900} {"train_loss": -27.2236270904541, "global_step": 489755, "epoch": 5900} {"train_loss": -27.244359970092773, "global_step": 489756, "epoch": 5900} {"train_loss": -27.583816528320312, "global_step": 489757, "epoch": 5900} {"train_loss": -27.161468505859375, "global_step": 489758, "epoch": 5900} {"train_loss": -27.308988571166992, "global_step": 489759, "epoch": 5900} {"train_loss": -27.720901489257812, "global_step": 489760, "epoch": 5900} {"train_loss": -27.5065975189209, "global_step": 489761, "epoch": 5900} {"train_loss": -27.431299209594727, "global_step": 489762, "epoch": 5900} {"train_loss": -27.18104362487793, "global_step": 489763, "epoch": 5900} {"train_loss": -27.5169734954834, "global_step": 489764, "epoch": 5900} {"train_loss": -27.59798240661621, "global_step": 489765, "epoch": 5900} {"train_loss": -27.559606552124023, "global_step": 489766, "epoch": 5900} {"train_loss": -27.26368522644043, "global_step": 489767, "epoch": 5900} {"train_loss": -27.75851821899414, "global_step": 489768, "epoch": 5900} {"train_loss": -27.29392433166504, "global_step": 489769, "epoch": 5900} {"train_loss": -27.53443717956543, "global_step": 489770, "epoch": 5900} {"train_loss": -26.978178024291992, "global_step": 489771, "epoch": 5900} {"train_loss": -27.654804229736328, "global_step": 489772, "epoch": 5900} {"train_loss": -27.307058334350586, "global_step": 489773, "epoch": 5900} {"train_loss": -27.30750846862793, "global_step": 489774, "epoch": 5900} {"train_loss": -27.4453182220459, "global_step": 489775, "epoch": 5900} {"train_loss": -27.419225692749023, "global_step": 489776, "epoch": 5900} {"train_loss": -27.234155654907227, "global_step": 489777, "epoch": 5900} {"train_loss": -26.863203048706055, "global_step": 489778, "epoch": 5900} {"train_loss": -27.329437255859375, "global_step": 489779, "epoch": 5900} {"train_loss": -27.6398868560791, "global_step": 489780, "epoch": 5900} {"train_loss": -27.640094757080078, "global_step": 489781, "epoch": 5900} {"train_loss": -27.290864760617175, "global_step": 489782, "epoch": 5900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8181818181818182, "val_loss": 6542576.5} {"train_loss": -24.018709182739258, "global_step": 489783, "epoch": 5901} {"train_loss": -26.28140640258789, "global_step": 489784, "epoch": 5901} {"train_loss": -25.951568603515625, "global_step": 489785, "epoch": 5901} {"train_loss": -26.226247787475586, "global_step": 489786, "epoch": 5901} {"train_loss": -26.412551879882812, "global_step": 489787, "epoch": 5901} {"train_loss": -26.363454818725586, "global_step": 489788, "epoch": 5901} {"train_loss": -26.66791343688965, "global_step": 489789, "epoch": 5901} {"train_loss": -26.727705001831055, "global_step": 489790, "epoch": 5901} {"train_loss": -26.874597549438477, "global_step": 489791, "epoch": 5901} {"train_loss": -26.7513427734375, "global_step": 489792, "epoch": 5901} {"train_loss": -26.83002281188965, "global_step": 489793, "epoch": 5901} {"train_loss": -26.955610275268555, "global_step": 489794, "epoch": 5901} {"train_loss": -26.856409072875977, "global_step": 489795, "epoch": 5901} {"train_loss": -26.982589721679688, "global_step": 489796, "epoch": 5901} {"train_loss": -26.782453536987305, "global_step": 489797, "epoch": 5901} {"train_loss": -26.8758544921875, "global_step": 489798, "epoch": 5901} {"train_loss": -26.793487548828125, "global_step": 489799, "epoch": 5901} {"train_loss": -26.883893966674805, "global_step": 489800, "epoch": 5901} {"train_loss": -27.144681930541992, "global_step": 489801, "epoch": 5901} {"train_loss": -27.151453018188477, "global_step": 489802, "epoch": 5901} {"train_loss": -27.1475887298584, "global_step": 489803, "epoch": 5901} {"train_loss": -27.2235050201416, "global_step": 489804, "epoch": 5901} {"train_loss": -27.029464721679688, "global_step": 489805, "epoch": 5901} {"train_loss": -27.409292221069336, "global_step": 489806, "epoch": 5901} {"train_loss": -27.3863525390625, "global_step": 489807, "epoch": 5901} {"train_loss": -27.119638442993164, "global_step": 489808, "epoch": 5901} {"train_loss": -27.234838485717773, "global_step": 489809, "epoch": 5901} {"train_loss": -27.085294723510742, "global_step": 489810, "epoch": 5901} {"train_loss": -27.116724014282227, "global_step": 489811, "epoch": 5901} {"train_loss": -27.272520065307617, "global_step": 489812, "epoch": 5901} {"train_loss": -27.174604415893555, "global_step": 489813, "epoch": 5901} {"train_loss": -27.105487823486328, "global_step": 489814, "epoch": 5901} {"train_loss": -27.444660186767578, "global_step": 489815, "epoch": 5901} {"train_loss": -27.335681915283203, "global_step": 489816, "epoch": 5901} {"train_loss": -27.38726234436035, "global_step": 489817, "epoch": 5901} {"train_loss": -27.200672149658203, "global_step": 489818, "epoch": 5901} {"train_loss": -26.939788818359375, "global_step": 489819, "epoch": 5901} {"train_loss": -27.120758056640625, "global_step": 489820, "epoch": 5901} {"train_loss": -27.24627685546875, "global_step": 489821, "epoch": 5901} {"train_loss": -27.056533813476562, "global_step": 489822, "epoch": 5901} {"train_loss": -27.80278968811035, "global_step": 489823, "epoch": 5901} {"train_loss": -27.2270565032959, "global_step": 489824, "epoch": 5901} {"train_loss": -26.890783309936523, "global_step": 489825, "epoch": 5901} {"train_loss": -27.420934677124023, "global_step": 489826, "epoch": 5901} {"train_loss": -27.350553512573242, "global_step": 489827, "epoch": 5901} {"train_loss": -27.295835494995117, "global_step": 489828, "epoch": 5901} {"train_loss": -27.18073844909668, "global_step": 489829, "epoch": 5901} {"train_loss": -27.021472930908203, "global_step": 489830, "epoch": 5901} {"train_loss": -27.42486000061035, "global_step": 489831, "epoch": 5901} {"train_loss": -27.247541427612305, "global_step": 489832, "epoch": 5901} {"train_loss": -27.489303588867188, "global_step": 489833, "epoch": 5901} {"train_loss": -27.517902374267578, "global_step": 489834, "epoch": 5901} {"train_loss": -27.67207145690918, "global_step": 489835, "epoch": 5901} {"train_loss": -26.991561889648438, "global_step": 489836, "epoch": 5901} {"train_loss": -27.390613555908203, "global_step": 489837, "epoch": 5901} {"train_loss": -27.344770431518555, "global_step": 489838, "epoch": 5901} {"train_loss": -27.41254997253418, "global_step": 489839, "epoch": 5901} {"train_loss": -27.470129013061523, "global_step": 489840, "epoch": 5901} {"train_loss": -27.488758087158203, "global_step": 489841, "epoch": 5901} {"train_loss": -27.25165367126465, "global_step": 489842, "epoch": 5901} {"train_loss": -27.25831413269043, "global_step": 489843, "epoch": 5901} {"train_loss": -26.891523361206055, "global_step": 489844, "epoch": 5901} {"train_loss": -26.747953414916992, "global_step": 489845, "epoch": 5901} {"train_loss": -27.061750411987305, "global_step": 489846, "epoch": 5901} {"train_loss": -26.89215660095215, "global_step": 489847, "epoch": 5901} {"train_loss": -27.393680572509766, "global_step": 489848, "epoch": 5901} {"train_loss": -27.156112670898438, "global_step": 489849, "epoch": 5901} {"train_loss": -26.911941528320312, "global_step": 489850, "epoch": 5901} {"train_loss": -26.851285934448242, "global_step": 489851, "epoch": 5901} {"train_loss": -27.25921058654785, "global_step": 489852, "epoch": 5901} {"train_loss": -27.319929122924805, "global_step": 489853, "epoch": 5901} {"train_loss": -27.26521110534668, "global_step": 489854, "epoch": 5901} {"train_loss": -27.38709831237793, "global_step": 489855, "epoch": 5901} {"train_loss": -27.159894943237305, "global_step": 489856, "epoch": 5901} {"train_loss": -27.654666900634766, "global_step": 489857, "epoch": 5901} {"train_loss": -27.683019638061523, "global_step": 489858, "epoch": 5901} {"train_loss": -27.291645050048828, "global_step": 489859, "epoch": 5901} {"train_loss": -27.505701065063477, "global_step": 489860, "epoch": 5901} {"train_loss": -27.30562400817871, "global_step": 489861, "epoch": 5901} {"train_loss": -27.39678955078125, "global_step": 489862, "epoch": 5901} {"train_loss": -27.642353057861328, "global_step": 489863, "epoch": 5901} {"train_loss": -27.220203399658203, "global_step": 489864, "epoch": 5901} {"train_loss": -27.104042328983905, "global_step": 489865, "epoch": 5901, "val_loss": 6546417.0} {"train_loss": -26.87879753112793, "global_step": 489866, "epoch": 5902} {"train_loss": -26.495691299438477, "global_step": 489867, "epoch": 5902} {"train_loss": -26.88517189025879, "global_step": 489868, "epoch": 5902} {"train_loss": -26.81146240234375, "global_step": 489869, "epoch": 5902} {"train_loss": -26.513803482055664, "global_step": 489870, "epoch": 5902} {"train_loss": -26.329452514648438, "global_step": 489871, "epoch": 5902} {"train_loss": -26.495527267456055, "global_step": 489872, "epoch": 5902} {"train_loss": -27.0190486907959, "global_step": 489873, "epoch": 5902} {"train_loss": -26.369495391845703, "global_step": 489874, "epoch": 5902} {"train_loss": -27.47589111328125, "global_step": 489875, "epoch": 5902} {"train_loss": -26.523624420166016, "global_step": 489876, "epoch": 5902} {"train_loss": -27.56854248046875, "global_step": 489877, "epoch": 5902} {"train_loss": -27.04052734375, "global_step": 489878, "epoch": 5902} {"train_loss": -26.981918334960938, "global_step": 489879, "epoch": 5902} {"train_loss": -26.800201416015625, "global_step": 489880, "epoch": 5902} {"train_loss": -26.88948631286621, "global_step": 489881, "epoch": 5902} {"train_loss": -27.10433006286621, "global_step": 489882, "epoch": 5902} {"train_loss": -27.243139266967773, "global_step": 489883, "epoch": 5902} {"train_loss": -27.274335861206055, "global_step": 489884, "epoch": 5902} {"train_loss": -26.99969482421875, "global_step": 489885, "epoch": 5902} {"train_loss": -26.97694969177246, "global_step": 489886, "epoch": 5902} {"train_loss": -27.284687042236328, "global_step": 489887, "epoch": 5902} {"train_loss": -26.99761962890625, "global_step": 489888, "epoch": 5902} {"train_loss": -27.31819725036621, "global_step": 489889, "epoch": 5902} {"train_loss": -27.169641494750977, "global_step": 489890, "epoch": 5902} {"train_loss": -27.295154571533203, "global_step": 489891, "epoch": 5902} {"train_loss": -27.370410919189453, "global_step": 489892, "epoch": 5902} {"train_loss": -27.520526885986328, "global_step": 489893, "epoch": 5902} {"train_loss": -27.473981857299805, "global_step": 489894, "epoch": 5902} {"train_loss": -27.547000885009766, "global_step": 489895, "epoch": 5902} {"train_loss": -27.447193145751953, "global_step": 489896, "epoch": 5902} {"train_loss": -27.104028701782227, "global_step": 489897, "epoch": 5902} {"train_loss": -27.291854858398438, "global_step": 489898, "epoch": 5902} {"train_loss": -27.265384674072266, "global_step": 489899, "epoch": 5902} {"train_loss": -27.81597328186035, "global_step": 489900, "epoch": 5902} {"train_loss": -27.432418823242188, "global_step": 489901, "epoch": 5902} {"train_loss": -27.640348434448242, "global_step": 489902, "epoch": 5902} {"train_loss": -27.473846435546875, "global_step": 489903, "epoch": 5902} {"train_loss": -27.416112899780273, "global_step": 489904, "epoch": 5902} {"train_loss": -27.45361328125, "global_step": 489905, "epoch": 5902} {"train_loss": -27.316638946533203, "global_step": 489906, "epoch": 5902} {"train_loss": -27.65946388244629, "global_step": 489907, "epoch": 5902} {"train_loss": -27.265609741210938, "global_step": 489908, "epoch": 5902} {"train_loss": -26.97672462463379, "global_step": 489909, "epoch": 5902} {"train_loss": -27.491315841674805, "global_step": 489910, "epoch": 5902} {"train_loss": -27.24886131286621, "global_step": 489911, "epoch": 5902} {"train_loss": -27.313419342041016, "global_step": 489912, "epoch": 5902} {"train_loss": -27.47767448425293, "global_step": 489913, "epoch": 5902} {"train_loss": -27.054834365844727, "global_step": 489914, "epoch": 5902} {"train_loss": -27.458160400390625, "global_step": 489915, "epoch": 5902} {"train_loss": -27.1495304107666, "global_step": 489916, "epoch": 5902} {"train_loss": -27.09480094909668, "global_step": 489917, "epoch": 5902} {"train_loss": -27.539167404174805, "global_step": 489918, "epoch": 5902} {"train_loss": -27.5538387298584, "global_step": 489919, "epoch": 5902} {"train_loss": -27.419931411743164, "global_step": 489920, "epoch": 5902} {"train_loss": -26.93699073791504, "global_step": 489921, "epoch": 5902} {"train_loss": -27.549835205078125, "global_step": 489922, "epoch": 5902} {"train_loss": -27.66192626953125, "global_step": 489923, "epoch": 5902} {"train_loss": -26.82145118713379, "global_step": 489924, "epoch": 5902} {"train_loss": -27.166589736938477, "global_step": 489925, "epoch": 5902} {"train_loss": -27.268360137939453, "global_step": 489926, "epoch": 5902} {"train_loss": -27.570606231689453, "global_step": 489927, "epoch": 5902} {"train_loss": -27.055017471313477, "global_step": 489928, "epoch": 5902} {"train_loss": -27.08298683166504, "global_step": 489929, "epoch": 5902} {"train_loss": -27.16120719909668, "global_step": 489930, "epoch": 5902} {"train_loss": -26.979267120361328, "global_step": 489931, "epoch": 5902} {"train_loss": -27.312597274780273, "global_step": 489932, "epoch": 5902} {"train_loss": -27.135833740234375, "global_step": 489933, "epoch": 5902} {"train_loss": -26.89930534362793, "global_step": 489934, "epoch": 5902} {"train_loss": -26.751312255859375, "global_step": 489935, "epoch": 5902} {"train_loss": -27.2969970703125, "global_step": 489936, "epoch": 5902} {"train_loss": -27.274127960205078, "global_step": 489937, "epoch": 5902} {"train_loss": -26.968408584594727, "global_step": 489938, "epoch": 5902} {"train_loss": -27.44825553894043, "global_step": 489939, "epoch": 5902} {"train_loss": -27.321069717407227, "global_step": 489940, "epoch": 5902} {"train_loss": -27.275836944580078, "global_step": 489941, "epoch": 5902} {"train_loss": -27.069177627563477, "global_step": 489942, "epoch": 5902} {"train_loss": -27.30615234375, "global_step": 489943, "epoch": 5902} {"train_loss": -27.393661499023438, "global_step": 489944, "epoch": 5902} {"train_loss": -27.444982528686523, "global_step": 489945, "epoch": 5902} {"train_loss": -27.66849708557129, "global_step": 489946, "epoch": 5902} {"train_loss": -27.435266494750977, "global_step": 489947, "epoch": 5902} {"train_loss": -27.17799708354904, "global_step": 489948, "epoch": 5902, "val_loss": 6521355.0} {"train_loss": -26.943510055541992, "global_step": 489949, "epoch": 5903} {"train_loss": -26.781415939331055, "global_step": 489950, "epoch": 5903} {"train_loss": -27.08184242248535, "global_step": 489951, "epoch": 5903} {"train_loss": -26.6309814453125, "global_step": 489952, "epoch": 5903} {"train_loss": -26.249303817749023, "global_step": 489953, "epoch": 5903} {"train_loss": -26.24673843383789, "global_step": 489954, "epoch": 5903} {"train_loss": -26.555952072143555, "global_step": 489955, "epoch": 5903} {"train_loss": -26.871612548828125, "global_step": 489956, "epoch": 5903} {"train_loss": -26.407148361206055, "global_step": 489957, "epoch": 5903} {"train_loss": -26.393030166625977, "global_step": 489958, "epoch": 5903} {"train_loss": -26.6729736328125, "global_step": 489959, "epoch": 5903} {"train_loss": -27.13226890563965, "global_step": 489960, "epoch": 5903} {"train_loss": -26.737445831298828, "global_step": 489961, "epoch": 5903} {"train_loss": -26.767566680908203, "global_step": 489962, "epoch": 5903} {"train_loss": -27.03644371032715, "global_step": 489963, "epoch": 5903} {"train_loss": -26.967187881469727, "global_step": 489964, "epoch": 5903} {"train_loss": -27.035572052001953, "global_step": 489965, "epoch": 5903} {"train_loss": -27.1157283782959, "global_step": 489966, "epoch": 5903} {"train_loss": -27.008352279663086, "global_step": 489967, "epoch": 5903} {"train_loss": -27.084577560424805, "global_step": 489968, "epoch": 5903} {"train_loss": -27.09931755065918, "global_step": 489969, "epoch": 5903} {"train_loss": -27.074554443359375, "global_step": 489970, "epoch": 5903} {"train_loss": -26.675642013549805, "global_step": 489971, "epoch": 5903} {"train_loss": -26.893125534057617, "global_step": 489972, "epoch": 5903} {"train_loss": -27.271488189697266, "global_step": 489973, "epoch": 5903} {"train_loss": -27.062055587768555, "global_step": 489974, "epoch": 5903} {"train_loss": -27.493574142456055, "global_step": 489975, "epoch": 5903} {"train_loss": -26.702611923217773, "global_step": 489976, "epoch": 5903} {"train_loss": -26.952802658081055, "global_step": 489977, "epoch": 5903} {"train_loss": -27.224994659423828, "global_step": 489978, "epoch": 5903} {"train_loss": -27.31634521484375, "global_step": 489979, "epoch": 5903} {"train_loss": -27.101099014282227, "global_step": 489980, "epoch": 5903} {"train_loss": -27.5263614654541, "global_step": 489981, "epoch": 5903} {"train_loss": -27.160810470581055, "global_step": 489982, "epoch": 5903} {"train_loss": -27.5291690826416, "global_step": 489983, "epoch": 5903} {"train_loss": -27.288137435913086, "global_step": 489984, "epoch": 5903} {"train_loss": -27.2137451171875, "global_step": 489985, "epoch": 5903} {"train_loss": -27.100421905517578, "global_step": 489986, "epoch": 5903} {"train_loss": -27.4645938873291, "global_step": 489987, "epoch": 5903} {"train_loss": -27.196012496948242, "global_step": 489988, "epoch": 5903} {"train_loss": -27.2567138671875, "global_step": 489989, "epoch": 5903} {"train_loss": -27.279001235961914, "global_step": 489990, "epoch": 5903} {"train_loss": -27.32622718811035, "global_step": 489991, "epoch": 5903} {"train_loss": -27.260786056518555, "global_step": 489992, "epoch": 5903} {"train_loss": -27.683969497680664, "global_step": 489993, "epoch": 5903} {"train_loss": -27.205184936523438, "global_step": 489994, "epoch": 5903} {"train_loss": -27.341272354125977, "global_step": 489995, "epoch": 5903} {"train_loss": -27.226043701171875, "global_step": 489996, "epoch": 5903} {"train_loss": -26.58384132385254, "global_step": 489997, "epoch": 5903} {"train_loss": -26.34126853942871, "global_step": 489998, "epoch": 5903} {"train_loss": -26.293378829956055, "global_step": 489999, "epoch": 5903} {"train_loss": -27.396825790405273, "global_step": 490000, "epoch": 5903} {"train_loss": -26.95599937438965, "global_step": 490001, "epoch": 5903} {"train_loss": -26.8306941986084, "global_step": 490002, "epoch": 5903} {"train_loss": -27.3508243560791, "global_step": 490003, "epoch": 5903} {"train_loss": -27.14002799987793, "global_step": 490004, "epoch": 5903} {"train_loss": -26.72064781188965, "global_step": 490005, "epoch": 5903} {"train_loss": -27.040929794311523, "global_step": 490006, "epoch": 5903} {"train_loss": -27.045164108276367, "global_step": 490007, "epoch": 5903} {"train_loss": -26.821578979492188, "global_step": 490008, "epoch": 5903} {"train_loss": -27.409942626953125, "global_step": 490009, "epoch": 5903} {"train_loss": -27.133310317993164, "global_step": 490010, "epoch": 5903} {"train_loss": -27.204742431640625, "global_step": 490011, "epoch": 5903} {"train_loss": -27.317365646362305, "global_step": 490012, "epoch": 5903} {"train_loss": -27.357410430908203, "global_step": 490013, "epoch": 5903} {"train_loss": -27.21599769592285, "global_step": 490014, "epoch": 5903} {"train_loss": -27.27899169921875, "global_step": 490015, "epoch": 5903} {"train_loss": -27.507116317749023, "global_step": 490016, "epoch": 5903} {"train_loss": -27.251449584960938, "global_step": 490017, "epoch": 5903} {"train_loss": -27.4742488861084, "global_step": 490018, "epoch": 5903} {"train_loss": -27.11488151550293, "global_step": 490019, "epoch": 5903} {"train_loss": -27.34502601623535, "global_step": 490020, "epoch": 5903} {"train_loss": -26.821332931518555, "global_step": 490021, "epoch": 5903} {"train_loss": -27.176898956298828, "global_step": 490022, "epoch": 5903} {"train_loss": -27.186786651611328, "global_step": 490023, "epoch": 5903} {"train_loss": -27.474607467651367, "global_step": 490024, "epoch": 5903} {"train_loss": -27.284076690673828, "global_step": 490025, "epoch": 5903} {"train_loss": -27.369277954101562, "global_step": 490026, "epoch": 5903} {"train_loss": -26.93505859375, "global_step": 490027, "epoch": 5903} {"train_loss": -27.830615997314453, "global_step": 490028, "epoch": 5903} {"train_loss": -27.221012115478516, "global_step": 490029, "epoch": 5903} {"train_loss": -27.47321128845215, "global_step": 490030, "epoch": 5903} {"train_loss": -27.080013137265862, "global_step": 490031, "epoch": 5903, "val_loss": 6568642.0} {"train_loss": -24.85689926147461, "global_step": 490032, "epoch": 5904} {"train_loss": -23.488183975219727, "global_step": 490033, "epoch": 5904} {"train_loss": -22.952741622924805, "global_step": 490034, "epoch": 5904} {"train_loss": -26.09737205505371, "global_step": 490035, "epoch": 5904} {"train_loss": -24.747852325439453, "global_step": 490036, "epoch": 5904} {"train_loss": -26.179540634155273, "global_step": 490037, "epoch": 5904} {"train_loss": -25.324485778808594, "global_step": 490038, "epoch": 5904} {"train_loss": -26.670862197875977, "global_step": 490039, "epoch": 5904} {"train_loss": -25.465909957885742, "global_step": 490040, "epoch": 5904} {"train_loss": -26.1862850189209, "global_step": 490041, "epoch": 5904} {"train_loss": -26.219907760620117, "global_step": 490042, "epoch": 5904} {"train_loss": -26.17693519592285, "global_step": 490043, "epoch": 5904} {"train_loss": -26.644987106323242, "global_step": 490044, "epoch": 5904} {"train_loss": -26.317224502563477, "global_step": 490045, "epoch": 5904} {"train_loss": -26.695859909057617, "global_step": 490046, "epoch": 5904} {"train_loss": -26.679113388061523, "global_step": 490047, "epoch": 5904} {"train_loss": -26.551166534423828, "global_step": 490048, "epoch": 5904} {"train_loss": -26.745208740234375, "global_step": 490049, "epoch": 5904} {"train_loss": -26.399702072143555, "global_step": 490050, "epoch": 5904} {"train_loss": -26.22395896911621, "global_step": 490051, "epoch": 5904} {"train_loss": -26.730838775634766, "global_step": 490052, "epoch": 5904} {"train_loss": -26.662961959838867, "global_step": 490053, "epoch": 5904} {"train_loss": -26.283246994018555, "global_step": 490054, "epoch": 5904} {"train_loss": -26.731103897094727, "global_step": 490055, "epoch": 5904} {"train_loss": -26.691247940063477, "global_step": 490056, "epoch": 5904} {"train_loss": -26.452844619750977, "global_step": 490057, "epoch": 5904} {"train_loss": -27.106992721557617, "global_step": 490058, "epoch": 5904} {"train_loss": -26.85111427307129, "global_step": 490059, "epoch": 5904} {"train_loss": -26.877187728881836, "global_step": 490060, "epoch": 5904} {"train_loss": -26.667688369750977, "global_step": 490061, "epoch": 5904} {"train_loss": -26.68403434753418, "global_step": 490062, "epoch": 5904} {"train_loss": -26.94927978515625, "global_step": 490063, "epoch": 5904} {"train_loss": -26.751928329467773, "global_step": 490064, "epoch": 5904} {"train_loss": -26.884937286376953, "global_step": 490065, "epoch": 5904} {"train_loss": -27.233203887939453, "global_step": 490066, "epoch": 5904} {"train_loss": -27.075092315673828, "global_step": 490067, "epoch": 5904} {"train_loss": -27.138568878173828, "global_step": 490068, "epoch": 5904} {"train_loss": -27.161182403564453, "global_step": 490069, "epoch": 5904} {"train_loss": -27.25553321838379, "global_step": 490070, "epoch": 5904} {"train_loss": -26.99017906188965, "global_step": 490071, "epoch": 5904} {"train_loss": -26.816431045532227, "global_step": 490072, "epoch": 5904} {"train_loss": -27.122907638549805, "global_step": 490073, "epoch": 5904} {"train_loss": -27.400238037109375, "global_step": 490074, "epoch": 5904} {"train_loss": -27.143232345581055, "global_step": 490075, "epoch": 5904} {"train_loss": -27.085912704467773, "global_step": 490076, "epoch": 5904} {"train_loss": -27.36993980407715, "global_step": 490077, "epoch": 5904} {"train_loss": -27.0662784576416, "global_step": 490078, "epoch": 5904} {"train_loss": -27.65382194519043, "global_step": 490079, "epoch": 5904} {"train_loss": -27.076812744140625, "global_step": 490080, "epoch": 5904} {"train_loss": -27.219959259033203, "global_step": 490081, "epoch": 5904} {"train_loss": -27.25465202331543, "global_step": 490082, "epoch": 5904} {"train_loss": -27.588327407836914, "global_step": 490083, "epoch": 5904} {"train_loss": -27.18109130859375, "global_step": 490084, "epoch": 5904} {"train_loss": -27.303058624267578, "global_step": 490085, "epoch": 5904} {"train_loss": -27.009765625, "global_step": 490086, "epoch": 5904} {"train_loss": -27.237394332885742, "global_step": 490087, "epoch": 5904} {"train_loss": -27.228551864624023, "global_step": 490088, "epoch": 5904} {"train_loss": -27.045480728149414, "global_step": 490089, "epoch": 5904} {"train_loss": -27.778772354125977, "global_step": 490090, "epoch": 5904} {"train_loss": -27.166797637939453, "global_step": 490091, "epoch": 5904} {"train_loss": -27.024789810180664, "global_step": 490092, "epoch": 5904} {"train_loss": -27.486358642578125, "global_step": 490093, "epoch": 5904} {"train_loss": -27.645612716674805, "global_step": 490094, "epoch": 5904} {"train_loss": -27.509225845336914, "global_step": 490095, "epoch": 5904} {"train_loss": -27.214359283447266, "global_step": 490096, "epoch": 5904} {"train_loss": -27.114105224609375, "global_step": 490097, "epoch": 5904} {"train_loss": -27.17131996154785, "global_step": 490098, "epoch": 5904} {"train_loss": -27.44219970703125, "global_step": 490099, "epoch": 5904} {"train_loss": -27.71993064880371, "global_step": 490100, "epoch": 5904} {"train_loss": -27.439590454101562, "global_step": 490101, "epoch": 5904} {"train_loss": -27.7018985748291, "global_step": 490102, "epoch": 5904} {"train_loss": -27.553939819335938, "global_step": 490103, "epoch": 5904} {"train_loss": -27.240819931030273, "global_step": 490104, "epoch": 5904} {"train_loss": -27.3245849609375, "global_step": 490105, "epoch": 5904} {"train_loss": -27.58038330078125, "global_step": 490106, "epoch": 5904} {"train_loss": -27.65215492248535, "global_step": 490107, "epoch": 5904} {"train_loss": -27.185354232788086, "global_step": 490108, "epoch": 5904} {"train_loss": -27.44496726989746, "global_step": 490109, "epoch": 5904} {"train_loss": -27.236499786376953, "global_step": 490110, "epoch": 5904} {"train_loss": -27.17705726623535, "global_step": 490111, "epoch": 5904} {"train_loss": -27.407663345336914, "global_step": 490112, "epoch": 5904} {"train_loss": -27.748807907104492, "global_step": 490113, "epoch": 5904} {"train_loss": -26.855536196605268, "global_step": 490114, "epoch": 5904, "val_loss": 6483092.0} {"train_loss": -26.858041763305664, "global_step": 490115, "epoch": 5905} {"train_loss": -26.065221786499023, "global_step": 490116, "epoch": 5905} {"train_loss": -26.688861846923828, "global_step": 490117, "epoch": 5905} {"train_loss": -26.745929718017578, "global_step": 490118, "epoch": 5905} {"train_loss": -26.963775634765625, "global_step": 490119, "epoch": 5905} {"train_loss": -26.348615646362305, "global_step": 490120, "epoch": 5905} {"train_loss": -26.963647842407227, "global_step": 490121, "epoch": 5905} {"train_loss": -27.010406494140625, "global_step": 490122, "epoch": 5905} {"train_loss": -26.878904342651367, "global_step": 490123, "epoch": 5905} {"train_loss": -27.210556030273438, "global_step": 490124, "epoch": 5905} {"train_loss": -27.092626571655273, "global_step": 490125, "epoch": 5905} {"train_loss": -27.019750595092773, "global_step": 490126, "epoch": 5905} {"train_loss": -27.106115341186523, "global_step": 490127, "epoch": 5905} {"train_loss": -26.8867244720459, "global_step": 490128, "epoch": 5905} {"train_loss": -27.023895263671875, "global_step": 490129, "epoch": 5905} {"train_loss": -27.232177734375, "global_step": 490130, "epoch": 5905} {"train_loss": -27.452077865600586, "global_step": 490131, "epoch": 5905} {"train_loss": -27.185596466064453, "global_step": 490132, "epoch": 5905} {"train_loss": -26.954267501831055, "global_step": 490133, "epoch": 5905} {"train_loss": -26.959365844726562, "global_step": 490134, "epoch": 5905} {"train_loss": -27.124038696289062, "global_step": 490135, "epoch": 5905} {"train_loss": -27.303075790405273, "global_step": 490136, "epoch": 5905} {"train_loss": -27.128559112548828, "global_step": 490137, "epoch": 5905} {"train_loss": -27.2557430267334, "global_step": 490138, "epoch": 5905} {"train_loss": -26.853254318237305, "global_step": 490139, "epoch": 5905} {"train_loss": -27.028345108032227, "global_step": 490140, "epoch": 5905} {"train_loss": -27.514144897460938, "global_step": 490141, "epoch": 5905} {"train_loss": -27.21142578125, "global_step": 490142, "epoch": 5905} {"train_loss": -27.149444580078125, "global_step": 490143, "epoch": 5905} {"train_loss": -27.420995712280273, "global_step": 490144, "epoch": 5905} {"train_loss": -27.001022338867188, "global_step": 490145, "epoch": 5905} {"train_loss": -27.32099723815918, "global_step": 490146, "epoch": 5905} {"train_loss": -27.159198760986328, "global_step": 490147, "epoch": 5905} {"train_loss": -27.73554039001465, "global_step": 490148, "epoch": 5905} {"train_loss": -27.25078773498535, "global_step": 490149, "epoch": 5905} {"train_loss": -27.5347843170166, "global_step": 490150, "epoch": 5905} {"train_loss": -27.46632194519043, "global_step": 490151, "epoch": 5905} {"train_loss": -27.378772735595703, "global_step": 490152, "epoch": 5905} {"train_loss": -27.554595947265625, "global_step": 490153, "epoch": 5905} {"train_loss": -27.4989070892334, "global_step": 490154, "epoch": 5905} {"train_loss": -26.9147891998291, "global_step": 490155, "epoch": 5905} {"train_loss": -27.32399559020996, "global_step": 490156, "epoch": 5905} {"train_loss": -27.26983642578125, "global_step": 490157, "epoch": 5905} {"train_loss": -27.700510025024414, "global_step": 490158, "epoch": 5905} {"train_loss": -27.54783058166504, "global_step": 490159, "epoch": 5905} {"train_loss": -27.387887954711914, "global_step": 490160, "epoch": 5905} {"train_loss": -27.223432540893555, "global_step": 490161, "epoch": 5905} {"train_loss": -27.555246353149414, "global_step": 490162, "epoch": 5905} {"train_loss": -27.13298988342285, "global_step": 490163, "epoch": 5905} {"train_loss": -27.31619644165039, "global_step": 490164, "epoch": 5905} {"train_loss": -27.01209831237793, "global_step": 490165, "epoch": 5905} {"train_loss": -27.48272132873535, "global_step": 490166, "epoch": 5905} {"train_loss": -27.10413932800293, "global_step": 490167, "epoch": 5905} {"train_loss": -27.292163848876953, "global_step": 490168, "epoch": 5905} {"train_loss": -27.32892417907715, "global_step": 490169, "epoch": 5905} {"train_loss": -27.5424861907959, "global_step": 490170, "epoch": 5905} {"train_loss": -27.61871337890625, "global_step": 490171, "epoch": 5905} {"train_loss": -27.255817413330078, "global_step": 490172, "epoch": 5905} {"train_loss": -27.732412338256836, "global_step": 490173, "epoch": 5905} {"train_loss": -27.519742965698242, "global_step": 490174, "epoch": 5905} {"train_loss": -27.21265983581543, "global_step": 490175, "epoch": 5905} {"train_loss": -27.27435874938965, "global_step": 490176, "epoch": 5905} {"train_loss": -27.822402954101562, "global_step": 490177, "epoch": 5905} {"train_loss": -27.089643478393555, "global_step": 490178, "epoch": 5905} {"train_loss": -27.54849624633789, "global_step": 490179, "epoch": 5905} {"train_loss": -27.5269832611084, "global_step": 490180, "epoch": 5905} {"train_loss": -27.649866104125977, "global_step": 490181, "epoch": 5905} {"train_loss": -27.626678466796875, "global_step": 490182, "epoch": 5905} {"train_loss": -27.249073028564453, "global_step": 490183, "epoch": 5905} {"train_loss": -27.440784454345703, "global_step": 490184, "epoch": 5905} {"train_loss": -27.81952476501465, "global_step": 490185, "epoch": 5905} {"train_loss": -27.30852699279785, "global_step": 490186, "epoch": 5905} {"train_loss": -27.60877799987793, "global_step": 490187, "epoch": 5905} {"train_loss": -27.54471778869629, "global_step": 490188, "epoch": 5905} {"train_loss": -27.57193374633789, "global_step": 490189, "epoch": 5905} {"train_loss": -27.334125518798828, "global_step": 490190, "epoch": 5905} {"train_loss": -27.470243453979492, "global_step": 490191, "epoch": 5905} {"train_loss": -27.291547775268555, "global_step": 490192, "epoch": 5905} {"train_loss": -27.62327003479004, "global_step": 490193, "epoch": 5905} {"train_loss": -27.021076202392578, "global_step": 490194, "epoch": 5905} {"train_loss": -27.234262466430664, "global_step": 490195, "epoch": 5905} {"train_loss": -27.42158317565918, "global_step": 490196, "epoch": 5905} {"train_loss": -27.252588547855975, "global_step": 490197, "epoch": 5905, "val_loss": 6502892.5} {"train_loss": -27.098834991455078, "global_step": 490198, "epoch": 5906} {"train_loss": -26.450031280517578, "global_step": 490199, "epoch": 5906} {"train_loss": -26.456607818603516, "global_step": 490200, "epoch": 5906} {"train_loss": -26.07224464416504, "global_step": 490201, "epoch": 5906} {"train_loss": -25.978742599487305, "global_step": 490202, "epoch": 5906} {"train_loss": -27.21404457092285, "global_step": 490203, "epoch": 5906} {"train_loss": -26.707929611206055, "global_step": 490204, "epoch": 5906} {"train_loss": -26.817197799682617, "global_step": 490205, "epoch": 5906} {"train_loss": -27.10523796081543, "global_step": 490206, "epoch": 5906} {"train_loss": -27.426788330078125, "global_step": 490207, "epoch": 5906} {"train_loss": -27.023557662963867, "global_step": 490208, "epoch": 5906} {"train_loss": -27.26605796813965, "global_step": 490209, "epoch": 5906} {"train_loss": -27.13800621032715, "global_step": 490210, "epoch": 5906} {"train_loss": -27.07073974609375, "global_step": 490211, "epoch": 5906} {"train_loss": -27.174230575561523, "global_step": 490212, "epoch": 5906} {"train_loss": -27.2554931640625, "global_step": 490213, "epoch": 5906} {"train_loss": -27.304080963134766, "global_step": 490214, "epoch": 5906} {"train_loss": -26.972061157226562, "global_step": 490215, "epoch": 5906} {"train_loss": -27.282073974609375, "global_step": 490216, "epoch": 5906} {"train_loss": -27.24845314025879, "global_step": 490217, "epoch": 5906} {"train_loss": -27.1552677154541, "global_step": 490218, "epoch": 5906} {"train_loss": -27.280725479125977, "global_step": 490219, "epoch": 5906} {"train_loss": -27.267841339111328, "global_step": 490220, "epoch": 5906} {"train_loss": -27.09470558166504, "global_step": 490221, "epoch": 5906} {"train_loss": -27.067956924438477, "global_step": 490222, "epoch": 5906} {"train_loss": -27.617116928100586, "global_step": 490223, "epoch": 5906} {"train_loss": -27.032602310180664, "global_step": 490224, "epoch": 5906} {"train_loss": -27.04789161682129, "global_step": 490225, "epoch": 5906} {"train_loss": -27.216419219970703, "global_step": 490226, "epoch": 5906} {"train_loss": -27.554243087768555, "global_step": 490227, "epoch": 5906} {"train_loss": -27.003808975219727, "global_step": 490228, "epoch": 5906} {"train_loss": -27.401844024658203, "global_step": 490229, "epoch": 5906} {"train_loss": -27.526992797851562, "global_step": 490230, "epoch": 5906} {"train_loss": -27.29200553894043, "global_step": 490231, "epoch": 5906} {"train_loss": -27.249134063720703, "global_step": 490232, "epoch": 5906} {"train_loss": -27.54266929626465, "global_step": 490233, "epoch": 5906} {"train_loss": -27.08965492248535, "global_step": 490234, "epoch": 5906} {"train_loss": -27.321374893188477, "global_step": 490235, "epoch": 5906} {"train_loss": -27.43561363220215, "global_step": 490236, "epoch": 5906} {"train_loss": -27.12433433532715, "global_step": 490237, "epoch": 5906} {"train_loss": -27.32819175720215, "global_step": 490238, "epoch": 5906} {"train_loss": -27.107099533081055, "global_step": 490239, "epoch": 5906} {"train_loss": -27.068647384643555, "global_step": 490240, "epoch": 5906} {"train_loss": -27.135913848876953, "global_step": 490241, "epoch": 5906} {"train_loss": -27.627981185913086, "global_step": 490242, "epoch": 5906} {"train_loss": -27.43023109436035, "global_step": 490243, "epoch": 5906} {"train_loss": -27.14251708984375, "global_step": 490244, "epoch": 5906} {"train_loss": -27.315509796142578, "global_step": 490245, "epoch": 5906} {"train_loss": -27.517932891845703, "global_step": 490246, "epoch": 5906} {"train_loss": -27.18526268005371, "global_step": 490247, "epoch": 5906} {"train_loss": -27.5109806060791, "global_step": 490248, "epoch": 5906} {"train_loss": -27.38514518737793, "global_step": 490249, "epoch": 5906} {"train_loss": -27.231916427612305, "global_step": 490250, "epoch": 5906} {"train_loss": -27.33222007751465, "global_step": 490251, "epoch": 5906} {"train_loss": -27.6121826171875, "global_step": 490252, "epoch": 5906} {"train_loss": -27.194427490234375, "global_step": 490253, "epoch": 5906} {"train_loss": -27.248361587524414, "global_step": 490254, "epoch": 5906} {"train_loss": -27.0383358001709, "global_step": 490255, "epoch": 5906} {"train_loss": -26.40716552734375, "global_step": 490256, "epoch": 5906} {"train_loss": -27.3363094329834, "global_step": 490257, "epoch": 5906} {"train_loss": -27.401662826538086, "global_step": 490258, "epoch": 5906} {"train_loss": -27.257495880126953, "global_step": 490259, "epoch": 5906} {"train_loss": -27.612537384033203, "global_step": 490260, "epoch": 5906} {"train_loss": -27.445104598999023, "global_step": 490261, "epoch": 5906} {"train_loss": -27.16845703125, "global_step": 490262, "epoch": 5906} {"train_loss": -27.539932250976562, "global_step": 490263, "epoch": 5906} {"train_loss": -27.063705444335938, "global_step": 490264, "epoch": 5906} {"train_loss": -26.928211212158203, "global_step": 490265, "epoch": 5906} {"train_loss": -27.303543090820312, "global_step": 490266, "epoch": 5906} {"train_loss": -27.724109649658203, "global_step": 490267, "epoch": 5906} {"train_loss": -27.425067901611328, "global_step": 490268, "epoch": 5906} {"train_loss": -27.137311935424805, "global_step": 490269, "epoch": 5906} {"train_loss": -27.300342559814453, "global_step": 490270, "epoch": 5906} {"train_loss": -27.298770904541016, "global_step": 490271, "epoch": 5906} {"train_loss": -27.283740997314453, "global_step": 490272, "epoch": 5906} {"train_loss": -27.34124755859375, "global_step": 490273, "epoch": 5906} {"train_loss": -27.421985626220703, "global_step": 490274, "epoch": 5906} {"train_loss": -27.664993286132812, "global_step": 490275, "epoch": 5906} {"train_loss": -27.263874053955078, "global_step": 490276, "epoch": 5906} {"train_loss": -27.394346237182617, "global_step": 490277, "epoch": 5906} {"train_loss": -27.362085342407227, "global_step": 490278, "epoch": 5906} {"train_loss": -27.440052032470703, "global_step": 490279, "epoch": 5906} {"train_loss": -27.209200158176653, "global_step": 490280, "epoch": 5906, "val_loss": 6518304.0} {"train_loss": -26.50990104675293, "global_step": 490281, "epoch": 5907} {"train_loss": -26.98150634765625, "global_step": 490282, "epoch": 5907} {"train_loss": -27.2037410736084, "global_step": 490283, "epoch": 5907} {"train_loss": -26.86331558227539, "global_step": 490284, "epoch": 5907} {"train_loss": -26.98551368713379, "global_step": 490285, "epoch": 5907} {"train_loss": -26.98187828063965, "global_step": 490286, "epoch": 5907} {"train_loss": -27.281539916992188, "global_step": 490287, "epoch": 5907} {"train_loss": -26.780553817749023, "global_step": 490288, "epoch": 5907} {"train_loss": -26.836837768554688, "global_step": 490289, "epoch": 5907} {"train_loss": -27.10182762145996, "global_step": 490290, "epoch": 5907} {"train_loss": -26.89938735961914, "global_step": 490291, "epoch": 5907} {"train_loss": -27.239179611206055, "global_step": 490292, "epoch": 5907} {"train_loss": -26.80448341369629, "global_step": 490293, "epoch": 5907} {"train_loss": -27.209142684936523, "global_step": 490294, "epoch": 5907} {"train_loss": -26.796966552734375, "global_step": 490295, "epoch": 5907} {"train_loss": -26.839887619018555, "global_step": 490296, "epoch": 5907} {"train_loss": -27.266332626342773, "global_step": 490297, "epoch": 5907} {"train_loss": -27.254459381103516, "global_step": 490298, "epoch": 5907} {"train_loss": -27.298980712890625, "global_step": 490299, "epoch": 5907} {"train_loss": -27.26032829284668, "global_step": 490300, "epoch": 5907} {"train_loss": -27.160388946533203, "global_step": 490301, "epoch": 5907} {"train_loss": -26.434247970581055, "global_step": 490302, "epoch": 5907} {"train_loss": -27.038990020751953, "global_step": 490303, "epoch": 5907} {"train_loss": -26.848291397094727, "global_step": 490304, "epoch": 5907} {"train_loss": -26.656850814819336, "global_step": 490305, "epoch": 5907} {"train_loss": -27.23065185546875, "global_step": 490306, "epoch": 5907} {"train_loss": -27.15351676940918, "global_step": 490307, "epoch": 5907} {"train_loss": -27.39338493347168, "global_step": 490308, "epoch": 5907} {"train_loss": -27.11604881286621, "global_step": 490309, "epoch": 5907} {"train_loss": -27.069974899291992, "global_step": 490310, "epoch": 5907} {"train_loss": -27.343509674072266, "global_step": 490311, "epoch": 5907} {"train_loss": -26.8995361328125, "global_step": 490312, "epoch": 5907} {"train_loss": -27.213491439819336, "global_step": 490313, "epoch": 5907} {"train_loss": -27.413806915283203, "global_step": 490314, "epoch": 5907} {"train_loss": -27.58290672302246, "global_step": 490315, "epoch": 5907} {"train_loss": -27.352371215820312, "global_step": 490316, "epoch": 5907} {"train_loss": -27.630512237548828, "global_step": 490317, "epoch": 5907} {"train_loss": -27.37809181213379, "global_step": 490318, "epoch": 5907} {"train_loss": -27.286090850830078, "global_step": 490319, "epoch": 5907} {"train_loss": -27.333362579345703, "global_step": 490320, "epoch": 5907} {"train_loss": -27.393436431884766, "global_step": 490321, "epoch": 5907} {"train_loss": -27.375843048095703, "global_step": 490322, "epoch": 5907} {"train_loss": -27.128543853759766, "global_step": 490323, "epoch": 5907} {"train_loss": -27.200098037719727, "global_step": 490324, "epoch": 5907} {"train_loss": -27.40616226196289, "global_step": 490325, "epoch": 5907} {"train_loss": -27.103925704956055, "global_step": 490326, "epoch": 5907} {"train_loss": -27.66961097717285, "global_step": 490327, "epoch": 5907} {"train_loss": -27.49781608581543, "global_step": 490328, "epoch": 5907} {"train_loss": -27.223779678344727, "global_step": 490329, "epoch": 5907} {"train_loss": -27.205453872680664, "global_step": 490330, "epoch": 5907} {"train_loss": -27.735944747924805, "global_step": 490331, "epoch": 5907} {"train_loss": -27.32077980041504, "global_step": 490332, "epoch": 5907} {"train_loss": -27.342138290405273, "global_step": 490333, "epoch": 5907} {"train_loss": -27.60166358947754, "global_step": 490334, "epoch": 5907} {"train_loss": -27.66925048828125, "global_step": 490335, "epoch": 5907} {"train_loss": -27.298959732055664, "global_step": 490336, "epoch": 5907} {"train_loss": -27.540573120117188, "global_step": 490337, "epoch": 5907} {"train_loss": -27.3984432220459, "global_step": 490338, "epoch": 5907} {"train_loss": -27.244647979736328, "global_step": 490339, "epoch": 5907} {"train_loss": -27.828012466430664, "global_step": 490340, "epoch": 5907} {"train_loss": -27.677753448486328, "global_step": 490341, "epoch": 5907} {"train_loss": -27.460590362548828, "global_step": 490342, "epoch": 5907} {"train_loss": -27.388696670532227, "global_step": 490343, "epoch": 5907} {"train_loss": -27.518939971923828, "global_step": 490344, "epoch": 5907} {"train_loss": -27.306386947631836, "global_step": 490345, "epoch": 5907} {"train_loss": -27.417957305908203, "global_step": 490346, "epoch": 5907} {"train_loss": -27.512128829956055, "global_step": 490347, "epoch": 5907} {"train_loss": -27.184412002563477, "global_step": 490348, "epoch": 5907} {"train_loss": -27.272186279296875, "global_step": 490349, "epoch": 5907} {"train_loss": -27.49879264831543, "global_step": 490350, "epoch": 5907} {"train_loss": -27.445545196533203, "global_step": 490351, "epoch": 5907} {"train_loss": -27.447168350219727, "global_step": 490352, "epoch": 5907} {"train_loss": -27.219472885131836, "global_step": 490353, "epoch": 5907} {"train_loss": -27.497833251953125, "global_step": 490354, "epoch": 5907} {"train_loss": -27.560827255249023, "global_step": 490355, "epoch": 5907} {"train_loss": -27.63276481628418, "global_step": 490356, "epoch": 5907} {"train_loss": -27.484643936157227, "global_step": 490357, "epoch": 5907} {"train_loss": -26.998132705688477, "global_step": 490358, "epoch": 5907} {"train_loss": -26.920148849487305, "global_step": 490359, "epoch": 5907} {"train_loss": -26.351581573486328, "global_step": 490360, "epoch": 5907} {"train_loss": -25.884801864624023, "global_step": 490361, "epoch": 5907} {"train_loss": -25.762975692749023, "global_step": 490362, "epoch": 5907} {"train_loss": -27.182818263410084, "global_step": 490363, "epoch": 5907, "val_loss": 6471694.0} {"train_loss": -23.963071823120117, "global_step": 490364, "epoch": 5908} {"train_loss": -22.681644439697266, "global_step": 490365, "epoch": 5908} {"train_loss": -25.810834884643555, "global_step": 490366, "epoch": 5908} {"train_loss": -24.710350036621094, "global_step": 490367, "epoch": 5908} {"train_loss": -25.2618465423584, "global_step": 490368, "epoch": 5908} {"train_loss": -25.45026397705078, "global_step": 490369, "epoch": 5908} {"train_loss": -25.787845611572266, "global_step": 490370, "epoch": 5908} {"train_loss": -24.848878860473633, "global_step": 490371, "epoch": 5908} {"train_loss": -26.07472038269043, "global_step": 490372, "epoch": 5908} {"train_loss": -25.627771377563477, "global_step": 490373, "epoch": 5908} {"train_loss": -25.69076919555664, "global_step": 490374, "epoch": 5908} {"train_loss": -25.948633193969727, "global_step": 490375, "epoch": 5908} {"train_loss": -25.77766227722168, "global_step": 490376, "epoch": 5908} {"train_loss": -26.62054443359375, "global_step": 490377, "epoch": 5908} {"train_loss": -25.883514404296875, "global_step": 490378, "epoch": 5908} {"train_loss": -26.40540885925293, "global_step": 490379, "epoch": 5908} {"train_loss": -26.352054595947266, "global_step": 490380, "epoch": 5908} {"train_loss": -26.587451934814453, "global_step": 490381, "epoch": 5908} {"train_loss": -26.337543487548828, "global_step": 490382, "epoch": 5908} {"train_loss": -26.299854278564453, "global_step": 490383, "epoch": 5908} {"train_loss": -26.749408721923828, "global_step": 490384, "epoch": 5908} {"train_loss": -26.381895065307617, "global_step": 490385, "epoch": 5908} {"train_loss": -26.27628517150879, "global_step": 490386, "epoch": 5908} {"train_loss": -26.47577476501465, "global_step": 490387, "epoch": 5908} {"train_loss": -26.694787979125977, "global_step": 490388, "epoch": 5908} {"train_loss": -26.886022567749023, "global_step": 490389, "epoch": 5908} {"train_loss": -26.54718017578125, "global_step": 490390, "epoch": 5908} {"train_loss": -26.677087783813477, "global_step": 490391, "epoch": 5908} {"train_loss": -27.055404663085938, "global_step": 490392, "epoch": 5908} {"train_loss": -26.88535499572754, "global_step": 490393, "epoch": 5908} {"train_loss": -26.85332679748535, "global_step": 490394, "epoch": 5908} {"train_loss": -27.164453506469727, "global_step": 490395, "epoch": 5908} {"train_loss": -26.91316032409668, "global_step": 490396, "epoch": 5908} {"train_loss": -27.440139770507812, "global_step": 490397, "epoch": 5908} {"train_loss": -27.0406494140625, "global_step": 490398, "epoch": 5908} {"train_loss": -27.168350219726562, "global_step": 490399, "epoch": 5908} {"train_loss": -27.175378799438477, "global_step": 490400, "epoch": 5908} {"train_loss": -27.286762237548828, "global_step": 490401, "epoch": 5908} {"train_loss": -27.247879028320312, "global_step": 490402, "epoch": 5908} {"train_loss": -27.20905876159668, "global_step": 490403, "epoch": 5908} {"train_loss": -27.327661514282227, "global_step": 490404, "epoch": 5908} {"train_loss": -26.828283309936523, "global_step": 490405, "epoch": 5908} {"train_loss": -27.2829532623291, "global_step": 490406, "epoch": 5908} {"train_loss": -27.009387969970703, "global_step": 490407, "epoch": 5908} {"train_loss": -27.13290786743164, "global_step": 490408, "epoch": 5908} {"train_loss": -27.1935977935791, "global_step": 490409, "epoch": 5908} {"train_loss": -27.33538246154785, "global_step": 490410, "epoch": 5908} {"train_loss": -27.33011817932129, "global_step": 490411, "epoch": 5908} {"train_loss": -26.957645416259766, "global_step": 490412, "epoch": 5908} {"train_loss": -27.534704208374023, "global_step": 490413, "epoch": 5908} {"train_loss": -27.264551162719727, "global_step": 490414, "epoch": 5908} {"train_loss": -27.273588180541992, "global_step": 490415, "epoch": 5908} {"train_loss": -27.30401611328125, "global_step": 490416, "epoch": 5908} {"train_loss": -27.714353561401367, "global_step": 490417, "epoch": 5908} {"train_loss": -27.40830421447754, "global_step": 490418, "epoch": 5908} {"train_loss": -27.658512115478516, "global_step": 490419, "epoch": 5908} {"train_loss": -27.504638671875, "global_step": 490420, "epoch": 5908} {"train_loss": -27.52581787109375, "global_step": 490421, "epoch": 5908} {"train_loss": -27.449665069580078, "global_step": 490422, "epoch": 5908} {"train_loss": -27.558029174804688, "global_step": 490423, "epoch": 5908} {"train_loss": -27.241382598876953, "global_step": 490424, "epoch": 5908} {"train_loss": -27.629154205322266, "global_step": 490425, "epoch": 5908} {"train_loss": -27.730817794799805, "global_step": 490426, "epoch": 5908} {"train_loss": -27.264240264892578, "global_step": 490427, "epoch": 5908} {"train_loss": -27.364368438720703, "global_step": 490428, "epoch": 5908} {"train_loss": -27.294116973876953, "global_step": 490429, "epoch": 5908} {"train_loss": -27.114477157592773, "global_step": 490430, "epoch": 5908} {"train_loss": -27.60126304626465, "global_step": 490431, "epoch": 5908} {"train_loss": -27.70124626159668, "global_step": 490432, "epoch": 5908} {"train_loss": -27.447559356689453, "global_step": 490433, "epoch": 5908} {"train_loss": -27.315649032592773, "global_step": 490434, "epoch": 5908} {"train_loss": -27.120656967163086, "global_step": 490435, "epoch": 5908} {"train_loss": -27.41876792907715, "global_step": 490436, "epoch": 5908} {"train_loss": -27.037433624267578, "global_step": 490437, "epoch": 5908} {"train_loss": -27.204364776611328, "global_step": 490438, "epoch": 5908} {"train_loss": -27.457040786743164, "global_step": 490439, "epoch": 5908} {"train_loss": -27.039600372314453, "global_step": 490440, "epoch": 5908} {"train_loss": -27.29524040222168, "global_step": 490441, "epoch": 5908} {"train_loss": -27.540281295776367, "global_step": 490442, "epoch": 5908} {"train_loss": -27.2101993560791, "global_step": 490443, "epoch": 5908} {"train_loss": -27.106252670288086, "global_step": 490444, "epoch": 5908} {"train_loss": -27.56694984436035, "global_step": 490445, "epoch": 5908} {"train_loss": -26.84115292652544, "global_step": 490446, "epoch": 5908, "val_loss": 6521745.0} {"train_loss": -26.708120346069336, "global_step": 490447, "epoch": 5909} {"train_loss": -26.436506271362305, "global_step": 490448, "epoch": 5909} {"train_loss": -26.34345054626465, "global_step": 490449, "epoch": 5909} {"train_loss": -26.813867568969727, "global_step": 490450, "epoch": 5909} {"train_loss": -26.768224716186523, "global_step": 490451, "epoch": 5909} {"train_loss": -27.153949737548828, "global_step": 490452, "epoch": 5909} {"train_loss": -26.985132217407227, "global_step": 490453, "epoch": 5909} {"train_loss": -26.651111602783203, "global_step": 490454, "epoch": 5909} {"train_loss": -26.984466552734375, "global_step": 490455, "epoch": 5909} {"train_loss": -26.927648544311523, "global_step": 490456, "epoch": 5909} {"train_loss": -27.212865829467773, "global_step": 490457, "epoch": 5909} {"train_loss": -26.62616539001465, "global_step": 490458, "epoch": 5909} {"train_loss": -27.434783935546875, "global_step": 490459, "epoch": 5909} {"train_loss": -26.5930233001709, "global_step": 490460, "epoch": 5909} {"train_loss": -26.980670928955078, "global_step": 490461, "epoch": 5909} {"train_loss": -27.188507080078125, "global_step": 490462, "epoch": 5909} {"train_loss": -26.962858200073242, "global_step": 490463, "epoch": 5909} {"train_loss": -27.23114013671875, "global_step": 490464, "epoch": 5909} {"train_loss": -27.265172958374023, "global_step": 490465, "epoch": 5909} {"train_loss": -27.219318389892578, "global_step": 490466, "epoch": 5909} {"train_loss": -27.428800582885742, "global_step": 490467, "epoch": 5909} {"train_loss": -27.328210830688477, "global_step": 490468, "epoch": 5909} {"train_loss": -27.327802658081055, "global_step": 490469, "epoch": 5909} {"train_loss": -27.1651668548584, "global_step": 490470, "epoch": 5909} {"train_loss": -27.2449951171875, "global_step": 490471, "epoch": 5909} {"train_loss": -27.150915145874023, "global_step": 490472, "epoch": 5909} {"train_loss": -27.063520431518555, "global_step": 490473, "epoch": 5909} {"train_loss": -26.977767944335938, "global_step": 490474, "epoch": 5909} {"train_loss": -27.5933780670166, "global_step": 490475, "epoch": 5909} {"train_loss": -27.093963623046875, "global_step": 490476, "epoch": 5909} {"train_loss": -27.320709228515625, "global_step": 490477, "epoch": 5909} {"train_loss": -27.507659912109375, "global_step": 490478, "epoch": 5909} {"train_loss": -27.3740291595459, "global_step": 490479, "epoch": 5909} {"train_loss": -27.20623207092285, "global_step": 490480, "epoch": 5909} {"train_loss": -27.46988296508789, "global_step": 490481, "epoch": 5909} {"train_loss": -27.397785186767578, "global_step": 490482, "epoch": 5909} {"train_loss": -27.514341354370117, "global_step": 490483, "epoch": 5909} {"train_loss": -27.668439865112305, "global_step": 490484, "epoch": 5909} {"train_loss": -27.039011001586914, "global_step": 490485, "epoch": 5909} {"train_loss": -27.740753173828125, "global_step": 490486, "epoch": 5909} {"train_loss": -27.928607940673828, "global_step": 490487, "epoch": 5909} {"train_loss": -27.354822158813477, "global_step": 490488, "epoch": 5909} {"train_loss": -27.4421443939209, "global_step": 490489, "epoch": 5909} {"train_loss": -27.74200439453125, "global_step": 490490, "epoch": 5909} {"train_loss": -27.78397560119629, "global_step": 490491, "epoch": 5909} {"train_loss": -27.586078643798828, "global_step": 490492, "epoch": 5909} {"train_loss": -27.44648551940918, "global_step": 490493, "epoch": 5909} {"train_loss": -27.61313819885254, "global_step": 490494, "epoch": 5909} {"train_loss": -27.699615478515625, "global_step": 490495, "epoch": 5909} {"train_loss": -27.756818771362305, "global_step": 490496, "epoch": 5909} {"train_loss": -27.73943519592285, "global_step": 490497, "epoch": 5909} {"train_loss": -27.43845558166504, "global_step": 490498, "epoch": 5909} {"train_loss": -27.387487411499023, "global_step": 490499, "epoch": 5909} {"train_loss": -27.540943145751953, "global_step": 490500, "epoch": 5909} {"train_loss": -27.016769409179688, "global_step": 490501, "epoch": 5909} {"train_loss": -27.17032241821289, "global_step": 490502, "epoch": 5909} {"train_loss": -27.36031150817871, "global_step": 490503, "epoch": 5909} {"train_loss": -27.21149253845215, "global_step": 490504, "epoch": 5909} {"train_loss": -27.35438346862793, "global_step": 490505, "epoch": 5909} {"train_loss": -27.545190811157227, "global_step": 490506, "epoch": 5909} {"train_loss": -27.489301681518555, "global_step": 490507, "epoch": 5909} {"train_loss": -26.994775772094727, "global_step": 490508, "epoch": 5909} {"train_loss": -27.221487045288086, "global_step": 490509, "epoch": 5909} {"train_loss": -27.073156356811523, "global_step": 490510, "epoch": 5909} {"train_loss": -27.2958984375, "global_step": 490511, "epoch": 5909} {"train_loss": -27.091354370117188, "global_step": 490512, "epoch": 5909} {"train_loss": -27.263269424438477, "global_step": 490513, "epoch": 5909} {"train_loss": -27.378171920776367, "global_step": 490514, "epoch": 5909} {"train_loss": -27.651508331298828, "global_step": 490515, "epoch": 5909} {"train_loss": -27.378034591674805, "global_step": 490516, "epoch": 5909} {"train_loss": -27.33601951599121, "global_step": 490517, "epoch": 5909} {"train_loss": -26.9688720703125, "global_step": 490518, "epoch": 5909} {"train_loss": -27.19817543029785, "global_step": 490519, "epoch": 5909} {"train_loss": -27.31479263305664, "global_step": 490520, "epoch": 5909} {"train_loss": -26.6928653717041, "global_step": 490521, "epoch": 5909} {"train_loss": -27.05218505859375, "global_step": 490522, "epoch": 5909} {"train_loss": -27.25619888305664, "global_step": 490523, "epoch": 5909} {"train_loss": -27.3405818939209, "global_step": 490524, "epoch": 5909} {"train_loss": -27.488813400268555, "global_step": 490525, "epoch": 5909} {"train_loss": -27.3470458984375, "global_step": 490526, "epoch": 5909} {"train_loss": -27.248519897460938, "global_step": 490527, "epoch": 5909} {"train_loss": -27.222631454467773, "global_step": 490528, "epoch": 5909} {"train_loss": -27.24904779641025, "global_step": 490529, "epoch": 5909, "val_loss": 6518521.0} {"train_loss": -26.287443161010742, "global_step": 490530, "epoch": 5910} {"train_loss": -25.806310653686523, "global_step": 490531, "epoch": 5910} {"train_loss": -26.360021591186523, "global_step": 490532, "epoch": 5910} {"train_loss": -26.81146240234375, "global_step": 490533, "epoch": 5910} {"train_loss": -26.36475944519043, "global_step": 490534, "epoch": 5910} {"train_loss": -26.923755645751953, "global_step": 490535, "epoch": 5910} {"train_loss": -27.164220809936523, "global_step": 490536, "epoch": 5910} {"train_loss": -26.907636642456055, "global_step": 490537, "epoch": 5910} {"train_loss": -26.301300048828125, "global_step": 490538, "epoch": 5910} {"train_loss": -26.653156280517578, "global_step": 490539, "epoch": 5910} {"train_loss": -26.60992431640625, "global_step": 490540, "epoch": 5910} {"train_loss": -26.816282272338867, "global_step": 490541, "epoch": 5910} {"train_loss": -26.894073486328125, "global_step": 490542, "epoch": 5910} {"train_loss": -26.525678634643555, "global_step": 490543, "epoch": 5910} {"train_loss": -26.94388771057129, "global_step": 490544, "epoch": 5910} {"train_loss": -27.298566818237305, "global_step": 490545, "epoch": 5910} {"train_loss": -27.196043014526367, "global_step": 490546, "epoch": 5910} {"train_loss": -26.69392204284668, "global_step": 490547, "epoch": 5910} {"train_loss": -27.127721786499023, "global_step": 490548, "epoch": 5910} {"train_loss": -26.8373966217041, "global_step": 490549, "epoch": 5910} {"train_loss": -26.86030387878418, "global_step": 490550, "epoch": 5910} {"train_loss": -26.745559692382812, "global_step": 490551, "epoch": 5910} {"train_loss": -27.239959716796875, "global_step": 490552, "epoch": 5910} {"train_loss": -26.96693229675293, "global_step": 490553, "epoch": 5910} {"train_loss": -27.477588653564453, "global_step": 490554, "epoch": 5910} {"train_loss": -27.50907325744629, "global_step": 490555, "epoch": 5910} {"train_loss": -27.052499771118164, "global_step": 490556, "epoch": 5910} {"train_loss": -27.033477783203125, "global_step": 490557, "epoch": 5910} {"train_loss": -27.493467330932617, "global_step": 490558, "epoch": 5910} {"train_loss": -27.503326416015625, "global_step": 490559, "epoch": 5910} {"train_loss": -27.246530532836914, "global_step": 490560, "epoch": 5910} {"train_loss": -27.719364166259766, "global_step": 490561, "epoch": 5910} {"train_loss": -27.477020263671875, "global_step": 490562, "epoch": 5910} {"train_loss": -27.53879737854004, "global_step": 490563, "epoch": 5910} {"train_loss": -27.078474044799805, "global_step": 490564, "epoch": 5910} {"train_loss": -27.44355583190918, "global_step": 490565, "epoch": 5910} {"train_loss": -26.735321044921875, "global_step": 490566, "epoch": 5910} {"train_loss": -27.619277954101562, "global_step": 490567, "epoch": 5910} {"train_loss": -27.307697296142578, "global_step": 490568, "epoch": 5910} {"train_loss": -26.864423751831055, "global_step": 490569, "epoch": 5910} {"train_loss": -27.015979766845703, "global_step": 490570, "epoch": 5910} {"train_loss": -27.29578971862793, "global_step": 490571, "epoch": 5910} {"train_loss": -27.18535804748535, "global_step": 490572, "epoch": 5910} {"train_loss": -27.04477882385254, "global_step": 490573, "epoch": 5910} {"train_loss": -26.775638580322266, "global_step": 490574, "epoch": 5910} {"train_loss": -27.30438804626465, "global_step": 490575, "epoch": 5910} {"train_loss": -27.276508331298828, "global_step": 490576, "epoch": 5910} {"train_loss": -27.107635498046875, "global_step": 490577, "epoch": 5910} {"train_loss": -27.376657485961914, "global_step": 490578, "epoch": 5910} {"train_loss": -27.3911075592041, "global_step": 490579, "epoch": 5910} {"train_loss": -27.313400268554688, "global_step": 490580, "epoch": 5910} {"train_loss": -27.215606689453125, "global_step": 490581, "epoch": 5910} {"train_loss": -27.307538986206055, "global_step": 490582, "epoch": 5910} {"train_loss": -27.078489303588867, "global_step": 490583, "epoch": 5910} {"train_loss": -27.0980281829834, "global_step": 490584, "epoch": 5910} {"train_loss": -27.21881675720215, "global_step": 490585, "epoch": 5910} {"train_loss": -27.437036514282227, "global_step": 490586, "epoch": 5910} {"train_loss": -27.34356689453125, "global_step": 490587, "epoch": 5910} {"train_loss": -27.356870651245117, "global_step": 490588, "epoch": 5910} {"train_loss": -27.221410751342773, "global_step": 490589, "epoch": 5910} {"train_loss": -27.385828018188477, "global_step": 490590, "epoch": 5910} {"train_loss": -27.27752685546875, "global_step": 490591, "epoch": 5910} {"train_loss": -27.33414077758789, "global_step": 490592, "epoch": 5910} {"train_loss": -27.37577247619629, "global_step": 490593, "epoch": 5910} {"train_loss": -27.522504806518555, "global_step": 490594, "epoch": 5910} {"train_loss": -27.842626571655273, "global_step": 490595, "epoch": 5910} {"train_loss": -27.329526901245117, "global_step": 490596, "epoch": 5910} {"train_loss": -27.44849967956543, "global_step": 490597, "epoch": 5910} {"train_loss": -27.224958419799805, "global_step": 490598, "epoch": 5910} {"train_loss": -27.261474609375, "global_step": 490599, "epoch": 5910} {"train_loss": -27.56842041015625, "global_step": 490600, "epoch": 5910} {"train_loss": -27.377355575561523, "global_step": 490601, "epoch": 5910} {"train_loss": -27.37534523010254, "global_step": 490602, "epoch": 5910} {"train_loss": -27.391992568969727, "global_step": 490603, "epoch": 5910} {"train_loss": -26.99700927734375, "global_step": 490604, "epoch": 5910} {"train_loss": -27.828596115112305, "global_step": 490605, "epoch": 5910} {"train_loss": -27.35212516784668, "global_step": 490606, "epoch": 5910} {"train_loss": -27.06166648864746, "global_step": 490607, "epoch": 5910} {"train_loss": -27.455947875976562, "global_step": 490608, "epoch": 5910} {"train_loss": -27.51828384399414, "global_step": 490609, "epoch": 5910} {"train_loss": -27.368865966796875, "global_step": 490610, "epoch": 5910} {"train_loss": -27.61492347717285, "global_step": 490611, "epoch": 5910} {"train_loss": -27.157157943909425, "global_step": 490612, "epoch": 5910, "val_loss": 6476220.5} {"train_loss": -27.47755241394043, "global_step": 490613, "epoch": 5911} {"train_loss": -26.90810203552246, "global_step": 490614, "epoch": 5911} {"train_loss": -27.21231460571289, "global_step": 490615, "epoch": 5911} {"train_loss": -26.587451934814453, "global_step": 490616, "epoch": 5911} {"train_loss": -27.467599868774414, "global_step": 490617, "epoch": 5911} {"train_loss": -26.79178810119629, "global_step": 490618, "epoch": 5911} {"train_loss": -26.907743453979492, "global_step": 490619, "epoch": 5911} {"train_loss": -27.03371238708496, "global_step": 490620, "epoch": 5911} {"train_loss": -27.131433486938477, "global_step": 490621, "epoch": 5911} {"train_loss": -26.907196044921875, "global_step": 490622, "epoch": 5911} {"train_loss": -27.013288497924805, "global_step": 490623, "epoch": 5911} {"train_loss": -27.274444580078125, "global_step": 490624, "epoch": 5911} {"train_loss": -27.546483993530273, "global_step": 490625, "epoch": 5911} {"train_loss": -27.159839630126953, "global_step": 490626, "epoch": 5911} {"train_loss": -26.952192306518555, "global_step": 490627, "epoch": 5911} {"train_loss": -27.0523624420166, "global_step": 490628, "epoch": 5911} {"train_loss": -27.335493087768555, "global_step": 490629, "epoch": 5911} {"train_loss": -27.733200073242188, "global_step": 490630, "epoch": 5911} {"train_loss": -27.083667755126953, "global_step": 490631, "epoch": 5911} {"train_loss": -27.27496910095215, "global_step": 490632, "epoch": 5911} {"train_loss": -27.269927978515625, "global_step": 490633, "epoch": 5911} {"train_loss": -27.201169967651367, "global_step": 490634, "epoch": 5911} {"train_loss": -27.133758544921875, "global_step": 490635, "epoch": 5911} {"train_loss": -27.63677406311035, "global_step": 490636, "epoch": 5911} {"train_loss": -27.148300170898438, "global_step": 490637, "epoch": 5911} {"train_loss": -27.56939697265625, "global_step": 490638, "epoch": 5911} {"train_loss": -27.0814208984375, "global_step": 490639, "epoch": 5911} {"train_loss": -27.163110733032227, "global_step": 490640, "epoch": 5911} {"train_loss": -27.250085830688477, "global_step": 490641, "epoch": 5911} {"train_loss": -27.295257568359375, "global_step": 490642, "epoch": 5911} {"train_loss": -27.166946411132812, "global_step": 490643, "epoch": 5911} {"train_loss": -27.5137939453125, "global_step": 490644, "epoch": 5911} {"train_loss": -27.4685115814209, "global_step": 490645, "epoch": 5911} {"train_loss": -27.412311553955078, "global_step": 490646, "epoch": 5911} {"train_loss": -27.444259643554688, "global_step": 490647, "epoch": 5911} {"train_loss": -27.481470108032227, "global_step": 490648, "epoch": 5911} {"train_loss": -27.45639419555664, "global_step": 490649, "epoch": 5911} {"train_loss": -27.420324325561523, "global_step": 490650, "epoch": 5911} {"train_loss": -27.080991744995117, "global_step": 490651, "epoch": 5911} {"train_loss": -27.16425895690918, "global_step": 490652, "epoch": 5911} {"train_loss": -27.4285888671875, "global_step": 490653, "epoch": 5911} {"train_loss": -27.10791015625, "global_step": 490654, "epoch": 5911} {"train_loss": -26.9495792388916, "global_step": 490655, "epoch": 5911} {"train_loss": -27.34071159362793, "global_step": 490656, "epoch": 5911} {"train_loss": -26.521337509155273, "global_step": 490657, "epoch": 5911} {"train_loss": -27.2867431640625, "global_step": 490658, "epoch": 5911} {"train_loss": -26.966588973999023, "global_step": 490659, "epoch": 5911} {"train_loss": -26.86915397644043, "global_step": 490660, "epoch": 5911} {"train_loss": -27.266952514648438, "global_step": 490661, "epoch": 5911} {"train_loss": -26.53742027282715, "global_step": 490662, "epoch": 5911} {"train_loss": -27.60750389099121, "global_step": 490663, "epoch": 5911} {"train_loss": -27.08082389831543, "global_step": 490664, "epoch": 5911} {"train_loss": -27.215362548828125, "global_step": 490665, "epoch": 5911} {"train_loss": -27.037139892578125, "global_step": 490666, "epoch": 5911} {"train_loss": -26.993764877319336, "global_step": 490667, "epoch": 5911} {"train_loss": -26.973556518554688, "global_step": 490668, "epoch": 5911} {"train_loss": -26.727563858032227, "global_step": 490669, "epoch": 5911} {"train_loss": -27.393152236938477, "global_step": 490670, "epoch": 5911} {"train_loss": -27.121021270751953, "global_step": 490671, "epoch": 5911} {"train_loss": -27.175024032592773, "global_step": 490672, "epoch": 5911} {"train_loss": -27.395587921142578, "global_step": 490673, "epoch": 5911} {"train_loss": -26.83168601989746, "global_step": 490674, "epoch": 5911} {"train_loss": -27.602399826049805, "global_step": 490675, "epoch": 5911} {"train_loss": -27.710168838500977, "global_step": 490676, "epoch": 5911} {"train_loss": -27.329381942749023, "global_step": 490677, "epoch": 5911} {"train_loss": -27.159677505493164, "global_step": 490678, "epoch": 5911} {"train_loss": -26.959537506103516, "global_step": 490679, "epoch": 5911} {"train_loss": -26.918134689331055, "global_step": 490680, "epoch": 5911} {"train_loss": -26.97425651550293, "global_step": 490681, "epoch": 5911} {"train_loss": -27.177244186401367, "global_step": 490682, "epoch": 5911} {"train_loss": -27.376855850219727, "global_step": 490683, "epoch": 5911} {"train_loss": -27.44495964050293, "global_step": 490684, "epoch": 5911} {"train_loss": -27.493249893188477, "global_step": 490685, "epoch": 5911} {"train_loss": -27.209766387939453, "global_step": 490686, "epoch": 5911} {"train_loss": -27.35695457458496, "global_step": 490687, "epoch": 5911} {"train_loss": -26.950830459594727, "global_step": 490688, "epoch": 5911} {"train_loss": -27.386011123657227, "global_step": 490689, "epoch": 5911} {"train_loss": -27.36716651916504, "global_step": 490690, "epoch": 5911} {"train_loss": -27.287145614624023, "global_step": 490691, "epoch": 5911} {"train_loss": -27.584674835205078, "global_step": 490692, "epoch": 5911} {"train_loss": -27.22820472717285, "global_step": 490693, "epoch": 5911} {"train_loss": -27.526731491088867, "global_step": 490694, "epoch": 5911} {"train_loss": -27.200297642903156, "global_step": 490695, "epoch": 5911, "val_loss": 6425706.0} {"train_loss": -27.119089126586914, "global_step": 490696, "epoch": 5912} {"train_loss": -26.770832061767578, "global_step": 490697, "epoch": 5912} {"train_loss": -26.9404354095459, "global_step": 490698, "epoch": 5912} {"train_loss": -27.03680992126465, "global_step": 490699, "epoch": 5912} {"train_loss": -26.936786651611328, "global_step": 490700, "epoch": 5912} {"train_loss": -26.937103271484375, "global_step": 490701, "epoch": 5912} {"train_loss": -26.858983993530273, "global_step": 490702, "epoch": 5912} {"train_loss": -27.18987464904785, "global_step": 490703, "epoch": 5912} {"train_loss": -26.849164962768555, "global_step": 490704, "epoch": 5912} {"train_loss": -27.082599639892578, "global_step": 490705, "epoch": 5912} {"train_loss": -27.289350509643555, "global_step": 490706, "epoch": 5912} {"train_loss": -27.375350952148438, "global_step": 490707, "epoch": 5912} {"train_loss": -26.76337242126465, "global_step": 490708, "epoch": 5912} {"train_loss": -27.064697265625, "global_step": 490709, "epoch": 5912} {"train_loss": -27.1655216217041, "global_step": 490710, "epoch": 5912} {"train_loss": -27.300302505493164, "global_step": 490711, "epoch": 5912} {"train_loss": -27.440689086914062, "global_step": 490712, "epoch": 5912} {"train_loss": -26.789892196655273, "global_step": 490713, "epoch": 5912} {"train_loss": -27.012353897094727, "global_step": 490714, "epoch": 5912} {"train_loss": -27.37104606628418, "global_step": 490715, "epoch": 5912} {"train_loss": -27.3718318939209, "global_step": 490716, "epoch": 5912} {"train_loss": -27.009876251220703, "global_step": 490717, "epoch": 5912} {"train_loss": -26.925832748413086, "global_step": 490718, "epoch": 5912} {"train_loss": -27.2552490234375, "global_step": 490719, "epoch": 5912} {"train_loss": -27.62477684020996, "global_step": 490720, "epoch": 5912} {"train_loss": -27.427154541015625, "global_step": 490721, "epoch": 5912} {"train_loss": -27.2747802734375, "global_step": 490722, "epoch": 5912} {"train_loss": -27.352527618408203, "global_step": 490723, "epoch": 5912} {"train_loss": -27.1876163482666, "global_step": 490724, "epoch": 5912} {"train_loss": -27.14581871032715, "global_step": 490725, "epoch": 5912} {"train_loss": -27.225860595703125, "global_step": 490726, "epoch": 5912} {"train_loss": -27.419401168823242, "global_step": 490727, "epoch": 5912} {"train_loss": -27.458160400390625, "global_step": 490728, "epoch": 5912} {"train_loss": -27.393964767456055, "global_step": 490729, "epoch": 5912} {"train_loss": -27.212478637695312, "global_step": 490730, "epoch": 5912} {"train_loss": -27.53309440612793, "global_step": 490731, "epoch": 5912} {"train_loss": -27.432849884033203, "global_step": 490732, "epoch": 5912} {"train_loss": -27.591846466064453, "global_step": 490733, "epoch": 5912} {"train_loss": -27.431425094604492, "global_step": 490734, "epoch": 5912} {"train_loss": -27.48359489440918, "global_step": 490735, "epoch": 5912} {"train_loss": -27.016183853149414, "global_step": 490736, "epoch": 5912} {"train_loss": -26.763214111328125, "global_step": 490737, "epoch": 5912} {"train_loss": -26.809309005737305, "global_step": 490738, "epoch": 5912} {"train_loss": -26.6761531829834, "global_step": 490739, "epoch": 5912} {"train_loss": -27.4276123046875, "global_step": 490740, "epoch": 5912} {"train_loss": -27.590274810791016, "global_step": 490741, "epoch": 5912} {"train_loss": -27.401264190673828, "global_step": 490742, "epoch": 5912} {"train_loss": -27.439916610717773, "global_step": 490743, "epoch": 5912} {"train_loss": -27.190582275390625, "global_step": 490744, "epoch": 5912} {"train_loss": -27.856311798095703, "global_step": 490745, "epoch": 5912} {"train_loss": -27.62159538269043, "global_step": 490746, "epoch": 5912} {"train_loss": -27.119287490844727, "global_step": 490747, "epoch": 5912} {"train_loss": -27.391164779663086, "global_step": 490748, "epoch": 5912} {"train_loss": -27.515607833862305, "global_step": 490749, "epoch": 5912} {"train_loss": -27.312671661376953, "global_step": 490750, "epoch": 5912} {"train_loss": -27.31209373474121, "global_step": 490751, "epoch": 5912} {"train_loss": -27.1546573638916, "global_step": 490752, "epoch": 5912} {"train_loss": -27.010456085205078, "global_step": 490753, "epoch": 5912} {"train_loss": -26.95551109313965, "global_step": 490754, "epoch": 5912} {"train_loss": -27.072296142578125, "global_step": 490755, "epoch": 5912} {"train_loss": -27.042688369750977, "global_step": 490756, "epoch": 5912} {"train_loss": -27.176401138305664, "global_step": 490757, "epoch": 5912} {"train_loss": -27.029071807861328, "global_step": 490758, "epoch": 5912} {"train_loss": -27.024572372436523, "global_step": 490759, "epoch": 5912} {"train_loss": -27.31608009338379, "global_step": 490760, "epoch": 5912} {"train_loss": -27.0822811126709, "global_step": 490761, "epoch": 5912} {"train_loss": -26.606338500976562, "global_step": 490762, "epoch": 5912} {"train_loss": -26.655981063842773, "global_step": 490763, "epoch": 5912} {"train_loss": -26.864898681640625, "global_step": 490764, "epoch": 5912} {"train_loss": -27.203306198120117, "global_step": 490765, "epoch": 5912} {"train_loss": -26.46510124206543, "global_step": 490766, "epoch": 5912} {"train_loss": -26.909896850585938, "global_step": 490767, "epoch": 5912} {"train_loss": -26.682958602905273, "global_step": 490768, "epoch": 5912} {"train_loss": -26.779911041259766, "global_step": 490769, "epoch": 5912} {"train_loss": -26.529077529907227, "global_step": 490770, "epoch": 5912} {"train_loss": -27.035024642944336, "global_step": 490771, "epoch": 5912} {"train_loss": -27.05620765686035, "global_step": 490772, "epoch": 5912} {"train_loss": -26.908910751342773, "global_step": 490773, "epoch": 5912} {"train_loss": -27.23415184020996, "global_step": 490774, "epoch": 5912} {"train_loss": -26.836444854736328, "global_step": 490775, "epoch": 5912} {"train_loss": -26.892499923706055, "global_step": 490776, "epoch": 5912} {"train_loss": -26.818628311157227, "global_step": 490777, "epoch": 5912} {"train_loss": -27.121555810951325, "global_step": 490778, "epoch": 5912, "val_loss": 6552791.0} {"train_loss": -26.839252471923828, "global_step": 490779, "epoch": 5913} {"train_loss": -26.928272247314453, "global_step": 490780, "epoch": 5913} {"train_loss": -26.722152709960938, "global_step": 490781, "epoch": 5913} {"train_loss": -26.9006290435791, "global_step": 490782, "epoch": 5913} {"train_loss": -27.140838623046875, "global_step": 490783, "epoch": 5913} {"train_loss": -27.13801383972168, "global_step": 490784, "epoch": 5913} {"train_loss": -27.08880615234375, "global_step": 490785, "epoch": 5913} {"train_loss": -26.97928237915039, "global_step": 490786, "epoch": 5913} {"train_loss": -27.1842098236084, "global_step": 490787, "epoch": 5913} {"train_loss": -27.432348251342773, "global_step": 490788, "epoch": 5913} {"train_loss": -27.154714584350586, "global_step": 490789, "epoch": 5913} {"train_loss": -27.165287017822266, "global_step": 490790, "epoch": 5913} {"train_loss": -27.001758575439453, "global_step": 490791, "epoch": 5913} {"train_loss": -27.29693031311035, "global_step": 490792, "epoch": 5913} {"train_loss": -27.49261474609375, "global_step": 490793, "epoch": 5913} {"train_loss": -27.363937377929688, "global_step": 490794, "epoch": 5913} {"train_loss": -26.836597442626953, "global_step": 490795, "epoch": 5913} {"train_loss": -26.724252700805664, "global_step": 490796, "epoch": 5913} {"train_loss": -27.372961044311523, "global_step": 490797, "epoch": 5913} {"train_loss": -27.434545516967773, "global_step": 490798, "epoch": 5913} {"train_loss": -27.013769149780273, "global_step": 490799, "epoch": 5913} {"train_loss": -27.193078994750977, "global_step": 490800, "epoch": 5913} {"train_loss": -26.96099281311035, "global_step": 490801, "epoch": 5913} {"train_loss": -27.20051383972168, "global_step": 490802, "epoch": 5913} {"train_loss": -27.20159912109375, "global_step": 490803, "epoch": 5913} {"train_loss": -27.547948837280273, "global_step": 490804, "epoch": 5913} {"train_loss": -27.202747344970703, "global_step": 490805, "epoch": 5913} {"train_loss": -27.274274826049805, "global_step": 490806, "epoch": 5913} {"train_loss": -27.53850746154785, "global_step": 490807, "epoch": 5913} {"train_loss": -27.592365264892578, "global_step": 490808, "epoch": 5913} {"train_loss": -27.560871124267578, "global_step": 490809, "epoch": 5913} {"train_loss": -27.356672286987305, "global_step": 490810, "epoch": 5913} {"train_loss": -27.555328369140625, "global_step": 490811, "epoch": 5913} {"train_loss": -27.7082576751709, "global_step": 490812, "epoch": 5913} {"train_loss": -27.923009872436523, "global_step": 490813, "epoch": 5913} {"train_loss": -27.55042839050293, "global_step": 490814, "epoch": 5913} {"train_loss": -27.253559112548828, "global_step": 490815, "epoch": 5913} {"train_loss": -27.347064971923828, "global_step": 490816, "epoch": 5913} {"train_loss": -27.5151309967041, "global_step": 490817, "epoch": 5913} {"train_loss": -27.45088005065918, "global_step": 490818, "epoch": 5913} {"train_loss": -27.264068603515625, "global_step": 490819, "epoch": 5913} {"train_loss": -27.471403121948242, "global_step": 490820, "epoch": 5913} {"train_loss": -27.884180068969727, "global_step": 490821, "epoch": 5913} {"train_loss": -27.620956420898438, "global_step": 490822, "epoch": 5913} {"train_loss": -27.699172973632812, "global_step": 490823, "epoch": 5913} {"train_loss": -27.02979850769043, "global_step": 490824, "epoch": 5913} {"train_loss": -27.3265438079834, "global_step": 490825, "epoch": 5913} {"train_loss": -27.229108810424805, "global_step": 490826, "epoch": 5913} {"train_loss": -27.583600997924805, "global_step": 490827, "epoch": 5913} {"train_loss": -27.25269889831543, "global_step": 490828, "epoch": 5913} {"train_loss": -27.03545570373535, "global_step": 490829, "epoch": 5913} {"train_loss": -27.066797256469727, "global_step": 490830, "epoch": 5913} {"train_loss": -27.32394790649414, "global_step": 490831, "epoch": 5913} {"train_loss": -27.482025146484375, "global_step": 490832, "epoch": 5913} {"train_loss": -27.120412826538086, "global_step": 490833, "epoch": 5913} {"train_loss": -26.5706729888916, "global_step": 490834, "epoch": 5913} {"train_loss": -26.38166618347168, "global_step": 490835, "epoch": 5913} {"train_loss": -27.396530151367188, "global_step": 490836, "epoch": 5913} {"train_loss": -27.099227905273438, "global_step": 490837, "epoch": 5913} {"train_loss": -27.51708984375, "global_step": 490838, "epoch": 5913} {"train_loss": -26.724685668945312, "global_step": 490839, "epoch": 5913} {"train_loss": -26.62196159362793, "global_step": 490840, "epoch": 5913} {"train_loss": -26.977575302124023, "global_step": 490841, "epoch": 5913} {"train_loss": -27.4213809967041, "global_step": 490842, "epoch": 5913} {"train_loss": -27.27338218688965, "global_step": 490843, "epoch": 5913} {"train_loss": -27.573715209960938, "global_step": 490844, "epoch": 5913} {"train_loss": -27.164688110351562, "global_step": 490845, "epoch": 5913} {"train_loss": -26.55060386657715, "global_step": 490846, "epoch": 5913} {"train_loss": -26.7625675201416, "global_step": 490847, "epoch": 5913} {"train_loss": -27.458633422851562, "global_step": 490848, "epoch": 5913} {"train_loss": -26.633859634399414, "global_step": 490849, "epoch": 5913} {"train_loss": -26.9091796875, "global_step": 490850, "epoch": 5913} {"train_loss": -27.4284610748291, "global_step": 490851, "epoch": 5913} {"train_loss": -27.068262100219727, "global_step": 490852, "epoch": 5913} {"train_loss": -27.36520767211914, "global_step": 490853, "epoch": 5913} {"train_loss": -26.776615142822266, "global_step": 490854, "epoch": 5913} {"train_loss": -27.35166358947754, "global_step": 490855, "epoch": 5913} {"train_loss": -27.76331901550293, "global_step": 490856, "epoch": 5913} {"train_loss": -27.485931396484375, "global_step": 490857, "epoch": 5913} {"train_loss": -27.09161376953125, "global_step": 490858, "epoch": 5913} {"train_loss": -27.43711280822754, "global_step": 490859, "epoch": 5913} {"train_loss": -27.28705406188965, "global_step": 490860, "epoch": 5913} {"train_loss": -27.231657625680946, "global_step": 490861, "epoch": 5913, "val_loss": 6569923.0} {"train_loss": -26.782285690307617, "global_step": 490862, "epoch": 5914} {"train_loss": -27.05925941467285, "global_step": 490863, "epoch": 5914} {"train_loss": -26.91876792907715, "global_step": 490864, "epoch": 5914} {"train_loss": -26.642240524291992, "global_step": 490865, "epoch": 5914} {"train_loss": -26.965967178344727, "global_step": 490866, "epoch": 5914} {"train_loss": -25.915266036987305, "global_step": 490867, "epoch": 5914} {"train_loss": -26.96697998046875, "global_step": 490868, "epoch": 5914} {"train_loss": -26.372175216674805, "global_step": 490869, "epoch": 5914} {"train_loss": -26.503589630126953, "global_step": 490870, "epoch": 5914} {"train_loss": -26.893945693969727, "global_step": 490871, "epoch": 5914} {"train_loss": -26.913007736206055, "global_step": 490872, "epoch": 5914} {"train_loss": -26.68238639831543, "global_step": 490873, "epoch": 5914} {"train_loss": -27.03631019592285, "global_step": 490874, "epoch": 5914} {"train_loss": -27.106903076171875, "global_step": 490875, "epoch": 5914} {"train_loss": -26.73457145690918, "global_step": 490876, "epoch": 5914} {"train_loss": -26.967679977416992, "global_step": 490877, "epoch": 5914} {"train_loss": -27.285673141479492, "global_step": 490878, "epoch": 5914} {"train_loss": -27.37824058532715, "global_step": 490879, "epoch": 5914} {"train_loss": -27.668420791625977, "global_step": 490880, "epoch": 5914} {"train_loss": -27.161102294921875, "global_step": 490881, "epoch": 5914} {"train_loss": -26.99588966369629, "global_step": 490882, "epoch": 5914} {"train_loss": -27.598468780517578, "global_step": 490883, "epoch": 5914} {"train_loss": -27.357257843017578, "global_step": 490884, "epoch": 5914} {"train_loss": -27.21923828125, "global_step": 490885, "epoch": 5914} {"train_loss": -27.044897079467773, "global_step": 490886, "epoch": 5914} {"train_loss": -27.685285568237305, "global_step": 490887, "epoch": 5914} {"train_loss": -27.549962997436523, "global_step": 490888, "epoch": 5914} {"train_loss": -27.337574005126953, "global_step": 490889, "epoch": 5914} {"train_loss": -27.45354652404785, "global_step": 490890, "epoch": 5914} {"train_loss": -27.224164962768555, "global_step": 490891, "epoch": 5914} {"train_loss": -27.503650665283203, "global_step": 490892, "epoch": 5914} {"train_loss": -27.559946060180664, "global_step": 490893, "epoch": 5914} {"train_loss": -26.909992218017578, "global_step": 490894, "epoch": 5914} {"train_loss": -27.0047664642334, "global_step": 490895, "epoch": 5914} {"train_loss": -27.245038986206055, "global_step": 490896, "epoch": 5914} {"train_loss": -27.093154907226562, "global_step": 490897, "epoch": 5914} {"train_loss": -26.934301376342773, "global_step": 490898, "epoch": 5914} {"train_loss": -27.2149715423584, "global_step": 490899, "epoch": 5914} {"train_loss": -27.51240348815918, "global_step": 490900, "epoch": 5914} {"train_loss": -27.245288848876953, "global_step": 490901, "epoch": 5914} {"train_loss": -27.33660316467285, "global_step": 490902, "epoch": 5914} {"train_loss": -27.41730308532715, "global_step": 490903, "epoch": 5914} {"train_loss": -26.899627685546875, "global_step": 490904, "epoch": 5914} {"train_loss": -27.395910263061523, "global_step": 490905, "epoch": 5914} {"train_loss": -27.1117000579834, "global_step": 490906, "epoch": 5914} {"train_loss": -27.291996002197266, "global_step": 490907, "epoch": 5914} {"train_loss": -26.958093643188477, "global_step": 490908, "epoch": 5914} {"train_loss": -26.98724365234375, "global_step": 490909, "epoch": 5914} {"train_loss": -27.441999435424805, "global_step": 490910, "epoch": 5914} {"train_loss": -27.401639938354492, "global_step": 490911, "epoch": 5914} {"train_loss": -27.487262725830078, "global_step": 490912, "epoch": 5914} {"train_loss": -27.235198974609375, "global_step": 490913, "epoch": 5914} {"train_loss": -27.434499740600586, "global_step": 490914, "epoch": 5914} {"train_loss": -27.352863311767578, "global_step": 490915, "epoch": 5914} {"train_loss": -27.516515731811523, "global_step": 490916, "epoch": 5914} {"train_loss": -27.257251739501953, "global_step": 490917, "epoch": 5914} {"train_loss": -27.5120906829834, "global_step": 490918, "epoch": 5914} {"train_loss": -27.80569839477539, "global_step": 490919, "epoch": 5914} {"train_loss": -27.128244400024414, "global_step": 490920, "epoch": 5914} {"train_loss": -27.376422882080078, "global_step": 490921, "epoch": 5914} {"train_loss": -27.330961227416992, "global_step": 490922, "epoch": 5914} {"train_loss": -26.986621856689453, "global_step": 490923, "epoch": 5914} {"train_loss": -27.297937393188477, "global_step": 490924, "epoch": 5914} {"train_loss": -27.400909423828125, "global_step": 490925, "epoch": 5914} {"train_loss": -27.325754165649414, "global_step": 490926, "epoch": 5914} {"train_loss": -27.69361686706543, "global_step": 490927, "epoch": 5914} {"train_loss": -27.15228843688965, "global_step": 490928, "epoch": 5914} {"train_loss": -27.428497314453125, "global_step": 490929, "epoch": 5914} {"train_loss": -27.253345489501953, "global_step": 490930, "epoch": 5914} {"train_loss": -27.502470016479492, "global_step": 490931, "epoch": 5914} {"train_loss": -27.168256759643555, "global_step": 490932, "epoch": 5914} {"train_loss": -27.165557861328125, "global_step": 490933, "epoch": 5914} {"train_loss": -26.853113174438477, "global_step": 490934, "epoch": 5914} {"train_loss": -27.23844337463379, "global_step": 490935, "epoch": 5914} {"train_loss": -27.79437828063965, "global_step": 490936, "epoch": 5914} {"train_loss": -27.357282638549805, "global_step": 490937, "epoch": 5914} {"train_loss": -27.307992935180664, "global_step": 490938, "epoch": 5914} {"train_loss": -27.00678062438965, "global_step": 490939, "epoch": 5914} {"train_loss": -27.061328887939453, "global_step": 490940, "epoch": 5914} {"train_loss": -26.98982048034668, "global_step": 490941, "epoch": 5914} {"train_loss": -27.356739044189453, "global_step": 490942, "epoch": 5914} {"train_loss": -27.653066635131836, "global_step": 490943, "epoch": 5914} {"train_loss": -27.201305849006378, "global_step": 490944, "epoch": 5914, "val_loss": 6508192.0} {"train_loss": -26.2587890625, "global_step": 490945, "epoch": 5915} {"train_loss": -26.83501625061035, "global_step": 490946, "epoch": 5915} {"train_loss": -26.8752498626709, "global_step": 490947, "epoch": 5915} {"train_loss": -26.4743595123291, "global_step": 490948, "epoch": 5915} {"train_loss": -26.78775978088379, "global_step": 490949, "epoch": 5915} {"train_loss": -27.175952911376953, "global_step": 490950, "epoch": 5915} {"train_loss": -27.0147647857666, "global_step": 490951, "epoch": 5915} {"train_loss": -27.12589454650879, "global_step": 490952, "epoch": 5915} {"train_loss": -26.749906539916992, "global_step": 490953, "epoch": 5915} {"train_loss": -26.890256881713867, "global_step": 490954, "epoch": 5915} {"train_loss": -26.781721115112305, "global_step": 490955, "epoch": 5915} {"train_loss": -27.4974422454834, "global_step": 490956, "epoch": 5915} {"train_loss": -27.28362464904785, "global_step": 490957, "epoch": 5915} {"train_loss": -27.49371910095215, "global_step": 490958, "epoch": 5915} {"train_loss": -27.332096099853516, "global_step": 490959, "epoch": 5915} {"train_loss": -27.493427276611328, "global_step": 490960, "epoch": 5915} {"train_loss": -26.995574951171875, "global_step": 490961, "epoch": 5915} {"train_loss": -27.20722007751465, "global_step": 490962, "epoch": 5915} {"train_loss": -27.149213790893555, "global_step": 490963, "epoch": 5915} {"train_loss": -27.261991500854492, "global_step": 490964, "epoch": 5915} {"train_loss": -27.454620361328125, "global_step": 490965, "epoch": 5915} {"train_loss": -27.708555221557617, "global_step": 490966, "epoch": 5915} {"train_loss": -27.295408248901367, "global_step": 490967, "epoch": 5915} {"train_loss": -27.476642608642578, "global_step": 490968, "epoch": 5915} {"train_loss": -27.568023681640625, "global_step": 490969, "epoch": 5915} {"train_loss": -27.41815757751465, "global_step": 490970, "epoch": 5915} {"train_loss": -27.24757957458496, "global_step": 490971, "epoch": 5915} {"train_loss": -27.203521728515625, "global_step": 490972, "epoch": 5915} {"train_loss": -27.422964096069336, "global_step": 490973, "epoch": 5915} {"train_loss": -27.288259506225586, "global_step": 490974, "epoch": 5915} {"train_loss": -27.153100967407227, "global_step": 490975, "epoch": 5915} {"train_loss": -27.581689834594727, "global_step": 490976, "epoch": 5915} {"train_loss": -27.575796127319336, "global_step": 490977, "epoch": 5915} {"train_loss": -27.447065353393555, "global_step": 490978, "epoch": 5915} {"train_loss": -27.50154685974121, "global_step": 490979, "epoch": 5915} {"train_loss": -27.41791343688965, "global_step": 490980, "epoch": 5915} {"train_loss": -27.506500244140625, "global_step": 490981, "epoch": 5915} {"train_loss": -27.378522872924805, "global_step": 490982, "epoch": 5915} {"train_loss": -27.437347412109375, "global_step": 490983, "epoch": 5915} {"train_loss": -27.07358741760254, "global_step": 490984, "epoch": 5915} {"train_loss": -27.6701717376709, "global_step": 490985, "epoch": 5915} {"train_loss": -27.402206420898438, "global_step": 490986, "epoch": 5915} {"train_loss": -27.647199630737305, "global_step": 490987, "epoch": 5915} {"train_loss": -27.549657821655273, "global_step": 490988, "epoch": 5915} {"train_loss": -26.99909019470215, "global_step": 490989, "epoch": 5915} {"train_loss": -27.451812744140625, "global_step": 490990, "epoch": 5915} {"train_loss": -27.379098892211914, "global_step": 490991, "epoch": 5915} {"train_loss": -27.367069244384766, "global_step": 490992, "epoch": 5915} {"train_loss": -27.582666397094727, "global_step": 490993, "epoch": 5915} {"train_loss": -27.313526153564453, "global_step": 490994, "epoch": 5915} {"train_loss": -26.9987735748291, "global_step": 490995, "epoch": 5915} {"train_loss": -27.457433700561523, "global_step": 490996, "epoch": 5915} {"train_loss": -27.615985870361328, "global_step": 490997, "epoch": 5915} {"train_loss": -27.437406539916992, "global_step": 490998, "epoch": 5915} {"train_loss": -27.479949951171875, "global_step": 490999, "epoch": 5915} {"train_loss": -27.328876495361328, "global_step": 491000, "epoch": 5915} {"train_loss": -27.5660457611084, "global_step": 491001, "epoch": 5915} {"train_loss": -27.366178512573242, "global_step": 491002, "epoch": 5915} {"train_loss": -27.15983009338379, "global_step": 491003, "epoch": 5915} {"train_loss": -27.128950119018555, "global_step": 491004, "epoch": 5915} {"train_loss": -27.03791618347168, "global_step": 491005, "epoch": 5915} {"train_loss": -27.57073402404785, "global_step": 491006, "epoch": 5915} {"train_loss": -27.39735221862793, "global_step": 491007, "epoch": 5915} {"train_loss": -27.588653564453125, "global_step": 491008, "epoch": 5915} {"train_loss": -27.95454216003418, "global_step": 491009, "epoch": 5915} {"train_loss": -27.301111221313477, "global_step": 491010, "epoch": 5915} {"train_loss": -27.3551082611084, "global_step": 491011, "epoch": 5915} {"train_loss": -27.63685417175293, "global_step": 491012, "epoch": 5915} {"train_loss": -27.4963436126709, "global_step": 491013, "epoch": 5915} {"train_loss": -27.42864990234375, "global_step": 491014, "epoch": 5915} {"train_loss": -27.43079948425293, "global_step": 491015, "epoch": 5915} {"train_loss": -27.176593780517578, "global_step": 491016, "epoch": 5915} {"train_loss": -27.424102783203125, "global_step": 491017, "epoch": 5915} {"train_loss": -27.562788009643555, "global_step": 491018, "epoch": 5915} {"train_loss": -27.529041290283203, "global_step": 491019, "epoch": 5915} {"train_loss": -27.533313751220703, "global_step": 491020, "epoch": 5915} {"train_loss": -27.378278732299805, "global_step": 491021, "epoch": 5915} {"train_loss": -27.28875160217285, "global_step": 491022, "epoch": 5915} {"train_loss": -27.43771743774414, "global_step": 491023, "epoch": 5915} {"train_loss": -27.515411376953125, "global_step": 491024, "epoch": 5915} {"train_loss": -27.483154296875, "global_step": 491025, "epoch": 5915} {"train_loss": -27.49991226196289, "global_step": 491026, "epoch": 5915} {"train_loss": -27.359265890466162, "global_step": 491027, "epoch": 5915, "val_loss": 6460239.5} {"train_loss": -25.542736053466797, "global_step": 491028, "epoch": 5916} {"train_loss": -25.308977127075195, "global_step": 491029, "epoch": 5916} {"train_loss": -25.35679054260254, "global_step": 491030, "epoch": 5916} {"train_loss": -25.692092895507812, "global_step": 491031, "epoch": 5916} {"train_loss": -26.529998779296875, "global_step": 491032, "epoch": 5916} {"train_loss": -25.778961181640625, "global_step": 491033, "epoch": 5916} {"train_loss": -26.32993507385254, "global_step": 491034, "epoch": 5916} {"train_loss": -26.162445068359375, "global_step": 491035, "epoch": 5916} {"train_loss": -26.31988525390625, "global_step": 491036, "epoch": 5916} {"train_loss": -26.447019577026367, "global_step": 491037, "epoch": 5916} {"train_loss": -26.11920166015625, "global_step": 491038, "epoch": 5916} {"train_loss": -26.748647689819336, "global_step": 491039, "epoch": 5916} {"train_loss": -26.65298843383789, "global_step": 491040, "epoch": 5916} {"train_loss": -26.410818099975586, "global_step": 491041, "epoch": 5916} {"train_loss": -26.471845626831055, "global_step": 491042, "epoch": 5916} {"train_loss": -26.6529483795166, "global_step": 491043, "epoch": 5916} {"train_loss": -26.62934684753418, "global_step": 491044, "epoch": 5916} {"train_loss": -26.73185157775879, "global_step": 491045, "epoch": 5916} {"train_loss": -26.803619384765625, "global_step": 491046, "epoch": 5916} {"train_loss": -26.984058380126953, "global_step": 491047, "epoch": 5916} {"train_loss": -26.831710815429688, "global_step": 491048, "epoch": 5916} {"train_loss": -27.10402488708496, "global_step": 491049, "epoch": 5916} {"train_loss": -26.762128829956055, "global_step": 491050, "epoch": 5916} {"train_loss": -26.689868927001953, "global_step": 491051, "epoch": 5916} {"train_loss": -27.00776481628418, "global_step": 491052, "epoch": 5916} {"train_loss": -27.168664932250977, "global_step": 491053, "epoch": 5916} {"train_loss": -26.859848022460938, "global_step": 491054, "epoch": 5916} {"train_loss": -27.083967208862305, "global_step": 491055, "epoch": 5916} {"train_loss": -27.081464767456055, "global_step": 491056, "epoch": 5916} {"train_loss": -27.112131118774414, "global_step": 491057, "epoch": 5916} {"train_loss": -27.3504581451416, "global_step": 491058, "epoch": 5916} {"train_loss": -27.3070125579834, "global_step": 491059, "epoch": 5916} {"train_loss": -27.068267822265625, "global_step": 491060, "epoch": 5916} {"train_loss": -27.312307357788086, "global_step": 491061, "epoch": 5916} {"train_loss": -27.055402755737305, "global_step": 491062, "epoch": 5916} {"train_loss": -26.917160034179688, "global_step": 491063, "epoch": 5916} {"train_loss": -27.465564727783203, "global_step": 491064, "epoch": 5916} {"train_loss": -27.268924713134766, "global_step": 491065, "epoch": 5916} {"train_loss": -27.512292861938477, "global_step": 491066, "epoch": 5916} {"train_loss": -27.244037628173828, "global_step": 491067, "epoch": 5916} {"train_loss": -27.76266860961914, "global_step": 491068, "epoch": 5916} {"train_loss": -27.37261390686035, "global_step": 491069, "epoch": 5916} {"train_loss": -27.38527488708496, "global_step": 491070, "epoch": 5916} {"train_loss": -27.280500411987305, "global_step": 491071, "epoch": 5916} {"train_loss": -27.489704132080078, "global_step": 491072, "epoch": 5916} {"train_loss": -27.30225944519043, "global_step": 491073, "epoch": 5916} {"train_loss": -27.51490592956543, "global_step": 491074, "epoch": 5916} {"train_loss": -27.437490463256836, "global_step": 491075, "epoch": 5916} {"train_loss": -27.485645294189453, "global_step": 491076, "epoch": 5916} {"train_loss": -27.59478187561035, "global_step": 491077, "epoch": 5916} {"train_loss": -27.871463775634766, "global_step": 491078, "epoch": 5916} {"train_loss": -27.712665557861328, "global_step": 491079, "epoch": 5916} {"train_loss": -27.518817901611328, "global_step": 491080, "epoch": 5916} {"train_loss": -27.43048667907715, "global_step": 491081, "epoch": 5916} {"train_loss": -27.714040756225586, "global_step": 491082, "epoch": 5916} {"train_loss": -27.759008407592773, "global_step": 491083, "epoch": 5916} {"train_loss": -27.58014488220215, "global_step": 491084, "epoch": 5916} {"train_loss": -27.366857528686523, "global_step": 491085, "epoch": 5916} {"train_loss": -27.267393112182617, "global_step": 491086, "epoch": 5916} {"train_loss": -27.496307373046875, "global_step": 491087, "epoch": 5916} {"train_loss": -27.754169464111328, "global_step": 491088, "epoch": 5916} {"train_loss": -27.4608211517334, "global_step": 491089, "epoch": 5916} {"train_loss": -27.354522705078125, "global_step": 491090, "epoch": 5916} {"train_loss": -26.91413688659668, "global_step": 491091, "epoch": 5916} {"train_loss": -26.45751953125, "global_step": 491092, "epoch": 5916} {"train_loss": -26.623910903930664, "global_step": 491093, "epoch": 5916} {"train_loss": -27.184350967407227, "global_step": 491094, "epoch": 5916} {"train_loss": -27.736719131469727, "global_step": 491095, "epoch": 5916} {"train_loss": -27.371057510375977, "global_step": 491096, "epoch": 5916} {"train_loss": -27.129947662353516, "global_step": 491097, "epoch": 5916} {"train_loss": -27.40667724609375, "global_step": 491098, "epoch": 5916} {"train_loss": -27.12224769592285, "global_step": 491099, "epoch": 5916} {"train_loss": -26.872303009033203, "global_step": 491100, "epoch": 5916} {"train_loss": -26.86151695251465, "global_step": 491101, "epoch": 5916} {"train_loss": -27.617568969726562, "global_step": 491102, "epoch": 5916} {"train_loss": -27.277917861938477, "global_step": 491103, "epoch": 5916} {"train_loss": -27.078210830688477, "global_step": 491104, "epoch": 5916} {"train_loss": -27.284154891967773, "global_step": 491105, "epoch": 5916} {"train_loss": -27.70802116394043, "global_step": 491106, "epoch": 5916} {"train_loss": -27.465808868408203, "global_step": 491107, "epoch": 5916} {"train_loss": -27.389856338500977, "global_step": 491108, "epoch": 5916} {"train_loss": -27.391117095947266, "global_step": 491109, "epoch": 5916} {"train_loss": -27.061295589768743, "global_step": 491110, "epoch": 5916, "val_loss": 6517756.0} {"train_loss": -26.7467041015625, "global_step": 491111, "epoch": 5917} {"train_loss": -26.472455978393555, "global_step": 491112, "epoch": 5917} {"train_loss": -26.764917373657227, "global_step": 491113, "epoch": 5917} {"train_loss": -26.413166046142578, "global_step": 491114, "epoch": 5917} {"train_loss": -26.92545509338379, "global_step": 491115, "epoch": 5917} {"train_loss": -26.90839195251465, "global_step": 491116, "epoch": 5917} {"train_loss": -26.814401626586914, "global_step": 491117, "epoch": 5917} {"train_loss": -26.855249404907227, "global_step": 491118, "epoch": 5917} {"train_loss": -27.1617374420166, "global_step": 491119, "epoch": 5917} {"train_loss": -26.781442642211914, "global_step": 491120, "epoch": 5917} {"train_loss": -27.257665634155273, "global_step": 491121, "epoch": 5917} {"train_loss": -26.82356834411621, "global_step": 491122, "epoch": 5917} {"train_loss": -26.9425106048584, "global_step": 491123, "epoch": 5917} {"train_loss": -26.94202995300293, "global_step": 491124, "epoch": 5917} {"train_loss": -27.26482582092285, "global_step": 491125, "epoch": 5917} {"train_loss": -27.123504638671875, "global_step": 491126, "epoch": 5917} {"train_loss": -27.34221839904785, "global_step": 491127, "epoch": 5917} {"train_loss": -27.152341842651367, "global_step": 491128, "epoch": 5917} {"train_loss": -27.12713050842285, "global_step": 491129, "epoch": 5917} {"train_loss": -26.935394287109375, "global_step": 491130, "epoch": 5917} {"train_loss": -27.20240592956543, "global_step": 491131, "epoch": 5917} {"train_loss": -27.155282974243164, "global_step": 491132, "epoch": 5917} {"train_loss": -27.462438583374023, "global_step": 491133, "epoch": 5917} {"train_loss": -27.29025650024414, "global_step": 491134, "epoch": 5917} {"train_loss": -27.1877498626709, "global_step": 491135, "epoch": 5917} {"train_loss": -27.289587020874023, "global_step": 491136, "epoch": 5917} {"train_loss": -27.079593658447266, "global_step": 491137, "epoch": 5917} {"train_loss": -26.93440055847168, "global_step": 491138, "epoch": 5917} {"train_loss": -27.15950584411621, "global_step": 491139, "epoch": 5917} {"train_loss": -27.245141983032227, "global_step": 491140, "epoch": 5917} {"train_loss": -27.323429107666016, "global_step": 491141, "epoch": 5917} {"train_loss": -27.26466178894043, "global_step": 491142, "epoch": 5917} {"train_loss": -27.19329261779785, "global_step": 491143, "epoch": 5917} {"train_loss": -27.32419204711914, "global_step": 491144, "epoch": 5917} {"train_loss": -27.225025177001953, "global_step": 491145, "epoch": 5917} {"train_loss": -27.53857421875, "global_step": 491146, "epoch": 5917} {"train_loss": -27.33465003967285, "global_step": 491147, "epoch": 5917} {"train_loss": -27.424707412719727, "global_step": 491148, "epoch": 5917} {"train_loss": -27.137006759643555, "global_step": 491149, "epoch": 5917} {"train_loss": -27.477054595947266, "global_step": 491150, "epoch": 5917} {"train_loss": -27.349903106689453, "global_step": 491151, "epoch": 5917} {"train_loss": -27.5030574798584, "global_step": 491152, "epoch": 5917} {"train_loss": -27.01777458190918, "global_step": 491153, "epoch": 5917} {"train_loss": -27.793262481689453, "global_step": 491154, "epoch": 5917} {"train_loss": -27.32183265686035, "global_step": 491155, "epoch": 5917} {"train_loss": -27.18282127380371, "global_step": 491156, "epoch": 5917} {"train_loss": -27.3197078704834, "global_step": 491157, "epoch": 5917} {"train_loss": -27.478322982788086, "global_step": 491158, "epoch": 5917} {"train_loss": -27.30341148376465, "global_step": 491159, "epoch": 5917} {"train_loss": -27.600305557250977, "global_step": 491160, "epoch": 5917} {"train_loss": -27.367908477783203, "global_step": 491161, "epoch": 5917} {"train_loss": -27.592554092407227, "global_step": 491162, "epoch": 5917} {"train_loss": -27.5225830078125, "global_step": 491163, "epoch": 5917} {"train_loss": -27.490543365478516, "global_step": 491164, "epoch": 5917} {"train_loss": -27.49616050720215, "global_step": 491165, "epoch": 5917} {"train_loss": -27.6212158203125, "global_step": 491166, "epoch": 5917} {"train_loss": -27.7192325592041, "global_step": 491167, "epoch": 5917} {"train_loss": -27.69207763671875, "global_step": 491168, "epoch": 5917} {"train_loss": -27.428913116455078, "global_step": 491169, "epoch": 5917} {"train_loss": -27.95993423461914, "global_step": 491170, "epoch": 5917} {"train_loss": -27.41218376159668, "global_step": 491171, "epoch": 5917} {"train_loss": -27.567737579345703, "global_step": 491172, "epoch": 5917} {"train_loss": -27.339197158813477, "global_step": 491173, "epoch": 5917} {"train_loss": -27.535247802734375, "global_step": 491174, "epoch": 5917} {"train_loss": -27.048376083374023, "global_step": 491175, "epoch": 5917} {"train_loss": -26.79745864868164, "global_step": 491176, "epoch": 5917} {"train_loss": -27.083337783813477, "global_step": 491177, "epoch": 5917} {"train_loss": -27.367639541625977, "global_step": 491178, "epoch": 5917} {"train_loss": -26.808359146118164, "global_step": 491179, "epoch": 5917} {"train_loss": -27.273151397705078, "global_step": 491180, "epoch": 5917} {"train_loss": -27.3027286529541, "global_step": 491181, "epoch": 5917} {"train_loss": -27.2614688873291, "global_step": 491182, "epoch": 5917} {"train_loss": -27.570526123046875, "global_step": 491183, "epoch": 5917} {"train_loss": -27.394149780273438, "global_step": 491184, "epoch": 5917} {"train_loss": -26.707468032836914, "global_step": 491185, "epoch": 5917} {"train_loss": -26.900577545166016, "global_step": 491186, "epoch": 5917} {"train_loss": -27.124902725219727, "global_step": 491187, "epoch": 5917} {"train_loss": -26.93015480041504, "global_step": 491188, "epoch": 5917} {"train_loss": -27.398996353149414, "global_step": 491189, "epoch": 5917} {"train_loss": -27.095672607421875, "global_step": 491190, "epoch": 5917} {"train_loss": -26.891387939453125, "global_step": 491191, "epoch": 5917} {"train_loss": -27.1124324798584, "global_step": 491192, "epoch": 5917} {"train_loss": -27.21616457743817, "global_step": 491193, "epoch": 5917, "val_loss": 6506358.0} {"train_loss": -26.851394653320312, "global_step": 491194, "epoch": 5918} {"train_loss": -26.0947265625, "global_step": 491195, "epoch": 5918} {"train_loss": -25.950551986694336, "global_step": 491196, "epoch": 5918} {"train_loss": -25.656314849853516, "global_step": 491197, "epoch": 5918} {"train_loss": -26.473615646362305, "global_step": 491198, "epoch": 5918} {"train_loss": -26.607025146484375, "global_step": 491199, "epoch": 5918} {"train_loss": -26.641996383666992, "global_step": 491200, "epoch": 5918} {"train_loss": -26.77743911743164, "global_step": 491201, "epoch": 5918} {"train_loss": -27.03802490234375, "global_step": 491202, "epoch": 5918} {"train_loss": -26.863327026367188, "global_step": 491203, "epoch": 5918} {"train_loss": -26.809192657470703, "global_step": 491204, "epoch": 5918} {"train_loss": -27.006793975830078, "global_step": 491205, "epoch": 5918} {"train_loss": -27.163818359375, "global_step": 491206, "epoch": 5918} {"train_loss": -26.893484115600586, "global_step": 491207, "epoch": 5918} {"train_loss": -27.06048583984375, "global_step": 491208, "epoch": 5918} {"train_loss": -27.12711524963379, "global_step": 491209, "epoch": 5918} {"train_loss": -27.01291847229004, "global_step": 491210, "epoch": 5918} {"train_loss": -27.512592315673828, "global_step": 491211, "epoch": 5918} {"train_loss": -26.66259765625, "global_step": 491212, "epoch": 5918} {"train_loss": -27.425439834594727, "global_step": 491213, "epoch": 5918} {"train_loss": -26.92262840270996, "global_step": 491214, "epoch": 5918} {"train_loss": -27.260498046875, "global_step": 491215, "epoch": 5918} {"train_loss": -27.174280166625977, "global_step": 491216, "epoch": 5918} {"train_loss": -27.00568962097168, "global_step": 491217, "epoch": 5918} {"train_loss": -27.2607421875, "global_step": 491218, "epoch": 5918} {"train_loss": -27.145246505737305, "global_step": 491219, "epoch": 5918} {"train_loss": -27.1729736328125, "global_step": 491220, "epoch": 5918} {"train_loss": -27.5867862701416, "global_step": 491221, "epoch": 5918} {"train_loss": -27.3696346282959, "global_step": 491222, "epoch": 5918} {"train_loss": -27.069538116455078, "global_step": 491223, "epoch": 5918} {"train_loss": -27.199079513549805, "global_step": 491224, "epoch": 5918} {"train_loss": -27.608123779296875, "global_step": 491225, "epoch": 5918} {"train_loss": -27.028608322143555, "global_step": 491226, "epoch": 5918} {"train_loss": -27.325546264648438, "global_step": 491227, "epoch": 5918} {"train_loss": -27.520254135131836, "global_step": 491228, "epoch": 5918} {"train_loss": -27.096250534057617, "global_step": 491229, "epoch": 5918} {"train_loss": -27.721723556518555, "global_step": 491230, "epoch": 5918} {"train_loss": -27.236753463745117, "global_step": 491231, "epoch": 5918} {"train_loss": -27.512487411499023, "global_step": 491232, "epoch": 5918} {"train_loss": -27.14044761657715, "global_step": 491233, "epoch": 5918} {"train_loss": -27.714502334594727, "global_step": 491234, "epoch": 5918} {"train_loss": -27.44585609436035, "global_step": 491235, "epoch": 5918} {"train_loss": -27.57398796081543, "global_step": 491236, "epoch": 5918} {"train_loss": -26.973590850830078, "global_step": 491237, "epoch": 5918} {"train_loss": -27.381784439086914, "global_step": 491238, "epoch": 5918} {"train_loss": -27.181665420532227, "global_step": 491239, "epoch": 5918} {"train_loss": -27.452560424804688, "global_step": 491240, "epoch": 5918} {"train_loss": -27.011051177978516, "global_step": 491241, "epoch": 5918} {"train_loss": -27.20261573791504, "global_step": 491242, "epoch": 5918} {"train_loss": -27.197187423706055, "global_step": 491243, "epoch": 5918} {"train_loss": -27.220325469970703, "global_step": 491244, "epoch": 5918} {"train_loss": -27.175674438476562, "global_step": 491245, "epoch": 5918} {"train_loss": -27.21355628967285, "global_step": 491246, "epoch": 5918} {"train_loss": -27.051916122436523, "global_step": 491247, "epoch": 5918} {"train_loss": -26.633987426757812, "global_step": 491248, "epoch": 5918} {"train_loss": -27.02191734313965, "global_step": 491249, "epoch": 5918} {"train_loss": -27.50507926940918, "global_step": 491250, "epoch": 5918} {"train_loss": -27.3492431640625, "global_step": 491251, "epoch": 5918} {"train_loss": -26.959253311157227, "global_step": 491252, "epoch": 5918} {"train_loss": -26.833545684814453, "global_step": 491253, "epoch": 5918} {"train_loss": -26.90223503112793, "global_step": 491254, "epoch": 5918} {"train_loss": -26.817548751831055, "global_step": 491255, "epoch": 5918} {"train_loss": -27.329076766967773, "global_step": 491256, "epoch": 5918} {"train_loss": -27.60023307800293, "global_step": 491257, "epoch": 5918} {"train_loss": -27.264535903930664, "global_step": 491258, "epoch": 5918} {"train_loss": -27.172250747680664, "global_step": 491259, "epoch": 5918} {"train_loss": -27.14312171936035, "global_step": 491260, "epoch": 5918} {"train_loss": -27.564605712890625, "global_step": 491261, "epoch": 5918} {"train_loss": -27.206090927124023, "global_step": 491262, "epoch": 5918} {"train_loss": -27.436248779296875, "global_step": 491263, "epoch": 5918} {"train_loss": -27.606382369995117, "global_step": 491264, "epoch": 5918} {"train_loss": -27.247278213500977, "global_step": 491265, "epoch": 5918} {"train_loss": -27.144094467163086, "global_step": 491266, "epoch": 5918} {"train_loss": -27.3248348236084, "global_step": 491267, "epoch": 5918} {"train_loss": -27.72157096862793, "global_step": 491268, "epoch": 5918} {"train_loss": -27.676305770874023, "global_step": 491269, "epoch": 5918} {"train_loss": -27.24336051940918, "global_step": 491270, "epoch": 5918} {"train_loss": -27.668588638305664, "global_step": 491271, "epoch": 5918} {"train_loss": -27.439599990844727, "global_step": 491272, "epoch": 5918} {"train_loss": -27.498987197875977, "global_step": 491273, "epoch": 5918} {"train_loss": -26.933135986328125, "global_step": 491274, "epoch": 5918} {"train_loss": -27.293609619140625, "global_step": 491275, "epoch": 5918} {"train_loss": -27.130619922316217, "global_step": 491276, "epoch": 5918, "val_loss": 6506794.5} {"train_loss": -26.780603408813477, "global_step": 491277, "epoch": 5919} {"train_loss": -26.737394332885742, "global_step": 491278, "epoch": 5919} {"train_loss": -26.684186935424805, "global_step": 491279, "epoch": 5919} {"train_loss": -26.942718505859375, "global_step": 491280, "epoch": 5919} {"train_loss": -27.04891014099121, "global_step": 491281, "epoch": 5919} {"train_loss": -27.39114761352539, "global_step": 491282, "epoch": 5919} {"train_loss": -26.897598266601562, "global_step": 491283, "epoch": 5919} {"train_loss": -26.761396408081055, "global_step": 491284, "epoch": 5919} {"train_loss": -27.22967529296875, "global_step": 491285, "epoch": 5919} {"train_loss": -26.883886337280273, "global_step": 491286, "epoch": 5919} {"train_loss": -26.88187026977539, "global_step": 491287, "epoch": 5919} {"train_loss": -26.930891036987305, "global_step": 491288, "epoch": 5919} {"train_loss": -27.2491512298584, "global_step": 491289, "epoch": 5919} {"train_loss": -26.93934440612793, "global_step": 491290, "epoch": 5919} {"train_loss": -27.274234771728516, "global_step": 491291, "epoch": 5919} {"train_loss": -26.93048095703125, "global_step": 491292, "epoch": 5919} {"train_loss": -26.919391632080078, "global_step": 491293, "epoch": 5919} {"train_loss": -27.416711807250977, "global_step": 491294, "epoch": 5919} {"train_loss": -27.313024520874023, "global_step": 491295, "epoch": 5919} {"train_loss": -26.760345458984375, "global_step": 491296, "epoch": 5919} {"train_loss": -27.038375854492188, "global_step": 491297, "epoch": 5919} {"train_loss": -27.099517822265625, "global_step": 491298, "epoch": 5919} {"train_loss": -26.963214874267578, "global_step": 491299, "epoch": 5919} {"train_loss": -26.951810836791992, "global_step": 491300, "epoch": 5919} {"train_loss": -27.746047973632812, "global_step": 491301, "epoch": 5919} {"train_loss": -27.2829647064209, "global_step": 491302, "epoch": 5919} {"train_loss": -27.609455108642578, "global_step": 491303, "epoch": 5919} {"train_loss": -27.390457153320312, "global_step": 491304, "epoch": 5919} {"train_loss": -27.586719512939453, "global_step": 491305, "epoch": 5919} {"train_loss": -27.2408504486084, "global_step": 491306, "epoch": 5919} {"train_loss": -27.407495498657227, "global_step": 491307, "epoch": 5919} {"train_loss": -27.118061065673828, "global_step": 491308, "epoch": 5919} {"train_loss": -27.871862411499023, "global_step": 491309, "epoch": 5919} {"train_loss": -27.542922973632812, "global_step": 491310, "epoch": 5919} {"train_loss": -27.255844116210938, "global_step": 491311, "epoch": 5919} {"train_loss": -27.34430503845215, "global_step": 491312, "epoch": 5919} {"train_loss": -27.437429428100586, "global_step": 491313, "epoch": 5919} {"train_loss": -27.247333526611328, "global_step": 491314, "epoch": 5919} {"train_loss": -27.04865837097168, "global_step": 491315, "epoch": 5919} {"train_loss": -27.3735408782959, "global_step": 491316, "epoch": 5919} {"train_loss": -27.52976417541504, "global_step": 491317, "epoch": 5919} {"train_loss": -27.55714988708496, "global_step": 491318, "epoch": 5919} {"train_loss": -27.65058708190918, "global_step": 491319, "epoch": 5919} {"train_loss": -27.60337257385254, "global_step": 491320, "epoch": 5919} {"train_loss": -27.382526397705078, "global_step": 491321, "epoch": 5919} {"train_loss": -27.699384689331055, "global_step": 491322, "epoch": 5919} {"train_loss": -27.467945098876953, "global_step": 491323, "epoch": 5919} {"train_loss": -27.611581802368164, "global_step": 491324, "epoch": 5919} {"train_loss": -27.76323890686035, "global_step": 491325, "epoch": 5919} {"train_loss": -27.621784210205078, "global_step": 491326, "epoch": 5919} {"train_loss": -27.290876388549805, "global_step": 491327, "epoch": 5919} {"train_loss": -27.4631404876709, "global_step": 491328, "epoch": 5919} {"train_loss": -27.254119873046875, "global_step": 491329, "epoch": 5919} {"train_loss": -27.672605514526367, "global_step": 491330, "epoch": 5919} {"train_loss": -27.634870529174805, "global_step": 491331, "epoch": 5919} {"train_loss": -27.2569637298584, "global_step": 491332, "epoch": 5919} {"train_loss": -27.588281631469727, "global_step": 491333, "epoch": 5919} {"train_loss": -27.194360733032227, "global_step": 491334, "epoch": 5919} {"train_loss": -27.833951950073242, "global_step": 491335, "epoch": 5919} {"train_loss": -27.3599853515625, "global_step": 491336, "epoch": 5919} {"train_loss": -27.254413604736328, "global_step": 491337, "epoch": 5919} {"train_loss": -27.392822265625, "global_step": 491338, "epoch": 5919} {"train_loss": -26.746753692626953, "global_step": 491339, "epoch": 5919} {"train_loss": -26.973331451416016, "global_step": 491340, "epoch": 5919} {"train_loss": -26.90643310546875, "global_step": 491341, "epoch": 5919} {"train_loss": -26.669769287109375, "global_step": 491342, "epoch": 5919} {"train_loss": -26.9003849029541, "global_step": 491343, "epoch": 5919} {"train_loss": -27.060651779174805, "global_step": 491344, "epoch": 5919} {"train_loss": -26.52392578125, "global_step": 491345, "epoch": 5919} {"train_loss": -26.545469284057617, "global_step": 491346, "epoch": 5919} {"train_loss": -26.441373825073242, "global_step": 491347, "epoch": 5919} {"train_loss": -26.972394943237305, "global_step": 491348, "epoch": 5919} {"train_loss": -26.748117446899414, "global_step": 491349, "epoch": 5919} {"train_loss": -26.826370239257812, "global_step": 491350, "epoch": 5919} {"train_loss": -27.154489517211914, "global_step": 491351, "epoch": 5919} {"train_loss": -26.54331398010254, "global_step": 491352, "epoch": 5919} {"train_loss": -27.202234268188477, "global_step": 491353, "epoch": 5919} {"train_loss": -27.026844024658203, "global_step": 491354, "epoch": 5919} {"train_loss": -26.92901039123535, "global_step": 491355, "epoch": 5919} {"train_loss": -27.248075485229492, "global_step": 491356, "epoch": 5919} {"train_loss": -26.6817569732666, "global_step": 491357, "epoch": 5919} {"train_loss": -27.32663917541504, "global_step": 491358, "epoch": 5919} {"train_loss": -27.168902707387165, "global_step": 491359, "epoch": 5919, "val_loss": 6453253.5} {"train_loss": -26.46698570251465, "global_step": 491360, "epoch": 5920} {"train_loss": -26.522886276245117, "global_step": 491361, "epoch": 5920} {"train_loss": -26.497344970703125, "global_step": 491362, "epoch": 5920} {"train_loss": -26.404035568237305, "global_step": 491363, "epoch": 5920} {"train_loss": -26.67962074279785, "global_step": 491364, "epoch": 5920} {"train_loss": -26.828699111938477, "global_step": 491365, "epoch": 5920} {"train_loss": -26.879037857055664, "global_step": 491366, "epoch": 5920} {"train_loss": -26.74972915649414, "global_step": 491367, "epoch": 5920} {"train_loss": -26.765583038330078, "global_step": 491368, "epoch": 5920} {"train_loss": -26.986509323120117, "global_step": 491369, "epoch": 5920} {"train_loss": -26.864398956298828, "global_step": 491370, "epoch": 5920} {"train_loss": -26.805240631103516, "global_step": 491371, "epoch": 5920} {"train_loss": -27.136213302612305, "global_step": 491372, "epoch": 5920} {"train_loss": -26.871570587158203, "global_step": 491373, "epoch": 5920} {"train_loss": -27.05181312561035, "global_step": 491374, "epoch": 5920} {"train_loss": -27.17852210998535, "global_step": 491375, "epoch": 5920} {"train_loss": -27.17913246154785, "global_step": 491376, "epoch": 5920} {"train_loss": -26.806446075439453, "global_step": 491377, "epoch": 5920} {"train_loss": -27.46518325805664, "global_step": 491378, "epoch": 5920} {"train_loss": -27.36615562438965, "global_step": 491379, "epoch": 5920} {"train_loss": -27.25372886657715, "global_step": 491380, "epoch": 5920} {"train_loss": -27.488183975219727, "global_step": 491381, "epoch": 5920} {"train_loss": -27.38116455078125, "global_step": 491382, "epoch": 5920} {"train_loss": -27.0665283203125, "global_step": 491383, "epoch": 5920} {"train_loss": -27.428497314453125, "global_step": 491384, "epoch": 5920} {"train_loss": -27.159423828125, "global_step": 491385, "epoch": 5920} {"train_loss": -27.385787963867188, "global_step": 491386, "epoch": 5920} {"train_loss": -27.34467887878418, "global_step": 491387, "epoch": 5920} {"train_loss": -27.49554443359375, "global_step": 491388, "epoch": 5920} {"train_loss": -27.022159576416016, "global_step": 491389, "epoch": 5920} {"train_loss": -27.0351505279541, "global_step": 491390, "epoch": 5920} {"train_loss": -27.374860763549805, "global_step": 491391, "epoch": 5920} {"train_loss": -27.38692283630371, "global_step": 491392, "epoch": 5920} {"train_loss": -27.45596694946289, "global_step": 491393, "epoch": 5920} {"train_loss": -27.487136840820312, "global_step": 491394, "epoch": 5920} {"train_loss": -27.652130126953125, "global_step": 491395, "epoch": 5920} {"train_loss": -27.71906089782715, "global_step": 491396, "epoch": 5920} {"train_loss": -27.650177001953125, "global_step": 491397, "epoch": 5920} {"train_loss": -27.45162010192871, "global_step": 491398, "epoch": 5920} {"train_loss": -27.531187057495117, "global_step": 491399, "epoch": 5920} {"train_loss": -27.76007652282715, "global_step": 491400, "epoch": 5920} {"train_loss": -27.361303329467773, "global_step": 491401, "epoch": 5920} {"train_loss": -26.99124526977539, "global_step": 491402, "epoch": 5920} {"train_loss": -27.600072860717773, "global_step": 491403, "epoch": 5920} {"train_loss": -27.4587459564209, "global_step": 491404, "epoch": 5920} {"train_loss": -26.935077667236328, "global_step": 491405, "epoch": 5920} {"train_loss": -27.653635025024414, "global_step": 491406, "epoch": 5920} {"train_loss": -27.510305404663086, "global_step": 491407, "epoch": 5920} {"train_loss": -27.761581420898438, "global_step": 491408, "epoch": 5920} {"train_loss": -27.420068740844727, "global_step": 491409, "epoch": 5920} {"train_loss": -27.50862693786621, "global_step": 491410, "epoch": 5920} {"train_loss": -27.5825138092041, "global_step": 491411, "epoch": 5920} {"train_loss": -27.54475975036621, "global_step": 491412, "epoch": 5920} {"train_loss": -27.39920997619629, "global_step": 491413, "epoch": 5920} {"train_loss": -27.454395294189453, "global_step": 491414, "epoch": 5920} {"train_loss": -27.5131893157959, "global_step": 491415, "epoch": 5920} {"train_loss": -27.447540283203125, "global_step": 491416, "epoch": 5920} {"train_loss": -27.822254180908203, "global_step": 491417, "epoch": 5920} {"train_loss": -27.117557525634766, "global_step": 491418, "epoch": 5920} {"train_loss": -27.355371475219727, "global_step": 491419, "epoch": 5920} {"train_loss": -27.40911293029785, "global_step": 491420, "epoch": 5920} {"train_loss": -27.252532958984375, "global_step": 491421, "epoch": 5920} {"train_loss": -27.07501220703125, "global_step": 491422, "epoch": 5920} {"train_loss": -27.08829116821289, "global_step": 491423, "epoch": 5920} {"train_loss": -26.83429527282715, "global_step": 491424, "epoch": 5920} {"train_loss": -26.877893447875977, "global_step": 491425, "epoch": 5920} {"train_loss": -27.67156982421875, "global_step": 491426, "epoch": 5920} {"train_loss": -27.677526473999023, "global_step": 491427, "epoch": 5920} {"train_loss": -27.0863037109375, "global_step": 491428, "epoch": 5920} {"train_loss": -26.860660552978516, "global_step": 491429, "epoch": 5920} {"train_loss": -27.223997116088867, "global_step": 491430, "epoch": 5920} {"train_loss": -27.1907958984375, "global_step": 491431, "epoch": 5920} {"train_loss": -27.11732292175293, "global_step": 491432, "epoch": 5920} {"train_loss": -26.95405387878418, "global_step": 491433, "epoch": 5920} {"train_loss": -27.205591201782227, "global_step": 491434, "epoch": 5920} {"train_loss": -27.337478637695312, "global_step": 491435, "epoch": 5920} {"train_loss": -27.159521102905273, "global_step": 491436, "epoch": 5920} {"train_loss": -27.013349533081055, "global_step": 491437, "epoch": 5920} {"train_loss": -27.205158233642578, "global_step": 491438, "epoch": 5920} {"train_loss": -27.20879554748535, "global_step": 491439, "epoch": 5920} {"train_loss": -27.6236515045166, "global_step": 491440, "epoch": 5920} {"train_loss": -27.049606323242188, "global_step": 491441, "epoch": 5920} {"train_loss": -27.22360983239599, "global_step": 491442, "epoch": 5920, "val_loss": 6497382.0} {"train_loss": -27.178937911987305, "global_step": 491443, "epoch": 5921} {"train_loss": -26.65217399597168, "global_step": 491444, "epoch": 5921} {"train_loss": -26.629486083984375, "global_step": 491445, "epoch": 5921} {"train_loss": -26.71893310546875, "global_step": 491446, "epoch": 5921} {"train_loss": -26.569067001342773, "global_step": 491447, "epoch": 5921} {"train_loss": -26.071533203125, "global_step": 491448, "epoch": 5921} {"train_loss": -26.24163818359375, "global_step": 491449, "epoch": 5921} {"train_loss": -26.845733642578125, "global_step": 491450, "epoch": 5921} {"train_loss": -26.465301513671875, "global_step": 491451, "epoch": 5921} {"train_loss": -26.572568893432617, "global_step": 491452, "epoch": 5921} {"train_loss": -27.057157516479492, "global_step": 491453, "epoch": 5921} {"train_loss": -27.095056533813477, "global_step": 491454, "epoch": 5921} {"train_loss": -26.480701446533203, "global_step": 491455, "epoch": 5921} {"train_loss": -27.30341911315918, "global_step": 491456, "epoch": 5921} {"train_loss": -26.965606689453125, "global_step": 491457, "epoch": 5921} {"train_loss": -27.081241607666016, "global_step": 491458, "epoch": 5921} {"train_loss": -26.73447608947754, "global_step": 491459, "epoch": 5921} {"train_loss": -27.001760482788086, "global_step": 491460, "epoch": 5921} {"train_loss": -26.900440216064453, "global_step": 491461, "epoch": 5921} {"train_loss": -27.101978302001953, "global_step": 491462, "epoch": 5921} {"train_loss": -26.917631149291992, "global_step": 491463, "epoch": 5921} {"train_loss": -26.707782745361328, "global_step": 491464, "epoch": 5921} {"train_loss": -27.160978317260742, "global_step": 491465, "epoch": 5921} {"train_loss": -27.085493087768555, "global_step": 491466, "epoch": 5921} {"train_loss": -26.853849411010742, "global_step": 491467, "epoch": 5921} {"train_loss": -27.135772705078125, "global_step": 491468, "epoch": 5921} {"train_loss": -26.971521377563477, "global_step": 491469, "epoch": 5921} {"train_loss": -27.169958114624023, "global_step": 491470, "epoch": 5921} {"train_loss": -26.82929039001465, "global_step": 491471, "epoch": 5921} {"train_loss": -27.103271484375, "global_step": 491472, "epoch": 5921} {"train_loss": -26.653589248657227, "global_step": 491473, "epoch": 5921} {"train_loss": -26.97344398498535, "global_step": 491474, "epoch": 5921} {"train_loss": -26.79229164123535, "global_step": 491475, "epoch": 5921} {"train_loss": -27.448278427124023, "global_step": 491476, "epoch": 5921} {"train_loss": -27.40531349182129, "global_step": 491477, "epoch": 5921} {"train_loss": -27.297748565673828, "global_step": 491478, "epoch": 5921} {"train_loss": -27.247116088867188, "global_step": 491479, "epoch": 5921} {"train_loss": -27.68482780456543, "global_step": 491480, "epoch": 5921} {"train_loss": -27.673315048217773, "global_step": 491481, "epoch": 5921} {"train_loss": -27.188404083251953, "global_step": 491482, "epoch": 5921} {"train_loss": -27.632522583007812, "global_step": 491483, "epoch": 5921} {"train_loss": -27.144001007080078, "global_step": 491484, "epoch": 5921} {"train_loss": -27.158044815063477, "global_step": 491485, "epoch": 5921} {"train_loss": -27.218358993530273, "global_step": 491486, "epoch": 5921} {"train_loss": -27.32698631286621, "global_step": 491487, "epoch": 5921} {"train_loss": -27.630895614624023, "global_step": 491488, "epoch": 5921} {"train_loss": -27.38087272644043, "global_step": 491489, "epoch": 5921} {"train_loss": -27.190282821655273, "global_step": 491490, "epoch": 5921} {"train_loss": -27.308584213256836, "global_step": 491491, "epoch": 5921} {"train_loss": -27.750930786132812, "global_step": 491492, "epoch": 5921} {"train_loss": -27.274763107299805, "global_step": 491493, "epoch": 5921} {"train_loss": -27.314905166625977, "global_step": 491494, "epoch": 5921} {"train_loss": -27.431493759155273, "global_step": 491495, "epoch": 5921} {"train_loss": -27.626157760620117, "global_step": 491496, "epoch": 5921} {"train_loss": -27.315427780151367, "global_step": 491497, "epoch": 5921} {"train_loss": -27.3426570892334, "global_step": 491498, "epoch": 5921} {"train_loss": -27.14666748046875, "global_step": 491499, "epoch": 5921} {"train_loss": -27.094226837158203, "global_step": 491500, "epoch": 5921} {"train_loss": -27.255807876586914, "global_step": 491501, "epoch": 5921} {"train_loss": -27.199604034423828, "global_step": 491502, "epoch": 5921} {"train_loss": -27.53816032409668, "global_step": 491503, "epoch": 5921} {"train_loss": -27.13836097717285, "global_step": 491504, "epoch": 5921} {"train_loss": -27.18463706970215, "global_step": 491505, "epoch": 5921} {"train_loss": -27.10638999938965, "global_step": 491506, "epoch": 5921} {"train_loss": -27.611738204956055, "global_step": 491507, "epoch": 5921} {"train_loss": -27.5430850982666, "global_step": 491508, "epoch": 5921} {"train_loss": -27.85773277282715, "global_step": 491509, "epoch": 5921} {"train_loss": -27.485097885131836, "global_step": 491510, "epoch": 5921} {"train_loss": -27.084314346313477, "global_step": 491511, "epoch": 5921} {"train_loss": -27.2330322265625, "global_step": 491512, "epoch": 5921} {"train_loss": -27.234344482421875, "global_step": 491513, "epoch": 5921} {"train_loss": -26.94672203063965, "global_step": 491514, "epoch": 5921} {"train_loss": -27.602783203125, "global_step": 491515, "epoch": 5921} {"train_loss": -26.8897647857666, "global_step": 491516, "epoch": 5921} {"train_loss": -27.5626163482666, "global_step": 491517, "epoch": 5921} {"train_loss": -27.3829288482666, "global_step": 491518, "epoch": 5921} {"train_loss": -27.333118438720703, "global_step": 491519, "epoch": 5921} {"train_loss": -27.295679092407227, "global_step": 491520, "epoch": 5921} {"train_loss": -27.126556396484375, "global_step": 491521, "epoch": 5921} {"train_loss": -26.974273681640625, "global_step": 491522, "epoch": 5921} {"train_loss": -27.638553619384766, "global_step": 491523, "epoch": 5921} {"train_loss": -27.34663200378418, "global_step": 491524, "epoch": 5921} {"train_loss": -27.14278508381671, "global_step": 491525, "epoch": 5921, "val_loss": 6545915.5} {"train_loss": -27.053558349609375, "global_step": 491526, "epoch": 5922} {"train_loss": -27.17103385925293, "global_step": 491527, "epoch": 5922} {"train_loss": -27.2994327545166, "global_step": 491528, "epoch": 5922} {"train_loss": -26.661895751953125, "global_step": 491529, "epoch": 5922} {"train_loss": -26.574289321899414, "global_step": 491530, "epoch": 5922} {"train_loss": -26.956939697265625, "global_step": 491531, "epoch": 5922} {"train_loss": -26.276208877563477, "global_step": 491532, "epoch": 5922} {"train_loss": -26.499677658081055, "global_step": 491533, "epoch": 5922} {"train_loss": -26.696516036987305, "global_step": 491534, "epoch": 5922} {"train_loss": -26.864797592163086, "global_step": 491535, "epoch": 5922} {"train_loss": -27.136398315429688, "global_step": 491536, "epoch": 5922} {"train_loss": -26.323795318603516, "global_step": 491537, "epoch": 5922} {"train_loss": -26.719213485717773, "global_step": 491538, "epoch": 5922} {"train_loss": -26.8942813873291, "global_step": 491539, "epoch": 5922} {"train_loss": -26.211170196533203, "global_step": 491540, "epoch": 5922} {"train_loss": -26.92084312438965, "global_step": 491541, "epoch": 5922} {"train_loss": -26.954511642456055, "global_step": 491542, "epoch": 5922} {"train_loss": -27.053695678710938, "global_step": 491543, "epoch": 5922} {"train_loss": -27.07900047302246, "global_step": 491544, "epoch": 5922} {"train_loss": -26.97450065612793, "global_step": 491545, "epoch": 5922} {"train_loss": -27.15704917907715, "global_step": 491546, "epoch": 5922} {"train_loss": -26.742074966430664, "global_step": 491547, "epoch": 5922} {"train_loss": -26.81147575378418, "global_step": 491548, "epoch": 5922} {"train_loss": -27.17706871032715, "global_step": 491549, "epoch": 5922} {"train_loss": -27.260969161987305, "global_step": 491550, "epoch": 5922} {"train_loss": -27.409467697143555, "global_step": 491551, "epoch": 5922} {"train_loss": -27.318098068237305, "global_step": 491552, "epoch": 5922} {"train_loss": -27.121984481811523, "global_step": 491553, "epoch": 5922} {"train_loss": -27.0810489654541, "global_step": 491554, "epoch": 5922} {"train_loss": -27.25994873046875, "global_step": 491555, "epoch": 5922} {"train_loss": -27.179004669189453, "global_step": 491556, "epoch": 5922} {"train_loss": -27.07037925720215, "global_step": 491557, "epoch": 5922} {"train_loss": -27.033905029296875, "global_step": 491558, "epoch": 5922} {"train_loss": -27.19205665588379, "global_step": 491559, "epoch": 5922} {"train_loss": -27.249225616455078, "global_step": 491560, "epoch": 5922} {"train_loss": -27.505971908569336, "global_step": 491561, "epoch": 5922} {"train_loss": -27.26584815979004, "global_step": 491562, "epoch": 5922} {"train_loss": -27.293012619018555, "global_step": 491563, "epoch": 5922} {"train_loss": -27.537702560424805, "global_step": 491564, "epoch": 5922} {"train_loss": -27.5498046875, "global_step": 491565, "epoch": 5922} {"train_loss": -27.654266357421875, "global_step": 491566, "epoch": 5922} {"train_loss": -27.402982711791992, "global_step": 491567, "epoch": 5922} {"train_loss": -27.45428466796875, "global_step": 491568, "epoch": 5922} {"train_loss": -27.418676376342773, "global_step": 491569, "epoch": 5922} {"train_loss": -27.630048751831055, "global_step": 491570, "epoch": 5922} {"train_loss": -27.3151798248291, "global_step": 491571, "epoch": 5922} {"train_loss": -27.6734561920166, "global_step": 491572, "epoch": 5922} {"train_loss": -27.3861026763916, "global_step": 491573, "epoch": 5922} {"train_loss": -27.38678550720215, "global_step": 491574, "epoch": 5922} {"train_loss": -27.698286056518555, "global_step": 491575, "epoch": 5922} {"train_loss": -27.699621200561523, "global_step": 491576, "epoch": 5922} {"train_loss": -27.46355628967285, "global_step": 491577, "epoch": 5922} {"train_loss": -26.97040367126465, "global_step": 491578, "epoch": 5922} {"train_loss": -27.48499870300293, "global_step": 491579, "epoch": 5922} {"train_loss": -27.33820152282715, "global_step": 491580, "epoch": 5922} {"train_loss": -27.519927978515625, "global_step": 491581, "epoch": 5922} {"train_loss": -27.387014389038086, "global_step": 491582, "epoch": 5922} {"train_loss": -27.227209091186523, "global_step": 491583, "epoch": 5922} {"train_loss": -27.581037521362305, "global_step": 491584, "epoch": 5922} {"train_loss": -27.566028594970703, "global_step": 491585, "epoch": 5922} {"train_loss": -27.510595321655273, "global_step": 491586, "epoch": 5922} {"train_loss": -27.87827491760254, "global_step": 491587, "epoch": 5922} {"train_loss": -27.070877075195312, "global_step": 491588, "epoch": 5922} {"train_loss": -26.673803329467773, "global_step": 491589, "epoch": 5922} {"train_loss": -26.8845157623291, "global_step": 491590, "epoch": 5922} {"train_loss": -26.67852783203125, "global_step": 491591, "epoch": 5922} {"train_loss": -27.058496475219727, "global_step": 491592, "epoch": 5922} {"train_loss": -27.43017578125, "global_step": 491593, "epoch": 5922} {"train_loss": -26.57077407836914, "global_step": 491594, "epoch": 5922} {"train_loss": -26.857425689697266, "global_step": 491595, "epoch": 5922} {"train_loss": -26.299152374267578, "global_step": 491596, "epoch": 5922} {"train_loss": -26.929615020751953, "global_step": 491597, "epoch": 5922} {"train_loss": -26.948694229125977, "global_step": 491598, "epoch": 5922} {"train_loss": -26.801218032836914, "global_step": 491599, "epoch": 5922} {"train_loss": -27.24932861328125, "global_step": 491600, "epoch": 5922} {"train_loss": -27.2521915435791, "global_step": 491601, "epoch": 5922} {"train_loss": -27.352035522460938, "global_step": 491602, "epoch": 5922} {"train_loss": -26.952672958374023, "global_step": 491603, "epoch": 5922} {"train_loss": -27.357995986938477, "global_step": 491604, "epoch": 5922} {"train_loss": -26.955045700073242, "global_step": 491605, "epoch": 5922} {"train_loss": -27.312744140625, "global_step": 491606, "epoch": 5922} {"train_loss": -27.210540771484375, "global_step": 491607, "epoch": 5922} {"train_loss": -27.15430388393172, "global_step": 491608, "epoch": 5922, "val_loss": 6613075.5} {"train_loss": -27.243879318237305, "global_step": 491609, "epoch": 5923} {"train_loss": -26.087987899780273, "global_step": 491610, "epoch": 5923} {"train_loss": -26.250415802001953, "global_step": 491611, "epoch": 5923} {"train_loss": -26.57916831970215, "global_step": 491612, "epoch": 5923} {"train_loss": -26.94598388671875, "global_step": 491613, "epoch": 5923} {"train_loss": -26.70159339904785, "global_step": 491614, "epoch": 5923} {"train_loss": -27.123188018798828, "global_step": 491615, "epoch": 5923} {"train_loss": -27.000574111938477, "global_step": 491616, "epoch": 5923} {"train_loss": -26.829355239868164, "global_step": 491617, "epoch": 5923} {"train_loss": -26.84043312072754, "global_step": 491618, "epoch": 5923} {"train_loss": -27.027877807617188, "global_step": 491619, "epoch": 5923} {"train_loss": -26.773611068725586, "global_step": 491620, "epoch": 5923} {"train_loss": -26.491086959838867, "global_step": 491621, "epoch": 5923} {"train_loss": -27.073822021484375, "global_step": 491622, "epoch": 5923} {"train_loss": -26.821008682250977, "global_step": 491623, "epoch": 5923} {"train_loss": -27.242279052734375, "global_step": 491624, "epoch": 5923} {"train_loss": -26.919050216674805, "global_step": 491625, "epoch": 5923} {"train_loss": -27.10552978515625, "global_step": 491626, "epoch": 5923} {"train_loss": -27.26703453063965, "global_step": 491627, "epoch": 5923} {"train_loss": -26.886205673217773, "global_step": 491628, "epoch": 5923} {"train_loss": -26.576642990112305, "global_step": 491629, "epoch": 5923} {"train_loss": -26.93031120300293, "global_step": 491630, "epoch": 5923} {"train_loss": -26.965585708618164, "global_step": 491631, "epoch": 5923} {"train_loss": -27.1857967376709, "global_step": 491632, "epoch": 5923} {"train_loss": -27.528303146362305, "global_step": 491633, "epoch": 5923} {"train_loss": -27.138507843017578, "global_step": 491634, "epoch": 5923} {"train_loss": -27.196447372436523, "global_step": 491635, "epoch": 5923} {"train_loss": -27.27894401550293, "global_step": 491636, "epoch": 5923} {"train_loss": -27.640216827392578, "global_step": 491637, "epoch": 5923} {"train_loss": -27.40142250061035, "global_step": 491638, "epoch": 5923} {"train_loss": -27.46160888671875, "global_step": 491639, "epoch": 5923} {"train_loss": -27.5858097076416, "global_step": 491640, "epoch": 5923} {"train_loss": -27.589136123657227, "global_step": 491641, "epoch": 5923} {"train_loss": -27.5135555267334, "global_step": 491642, "epoch": 5923} {"train_loss": -27.609909057617188, "global_step": 491643, "epoch": 5923} {"train_loss": -27.703222274780273, "global_step": 491644, "epoch": 5923} {"train_loss": -27.595380783081055, "global_step": 491645, "epoch": 5923} {"train_loss": -27.4691219329834, "global_step": 491646, "epoch": 5923} {"train_loss": -27.617156982421875, "global_step": 491647, "epoch": 5923} {"train_loss": -27.568342208862305, "global_step": 491648, "epoch": 5923} {"train_loss": -27.441373825073242, "global_step": 491649, "epoch": 5923} {"train_loss": -27.290124893188477, "global_step": 491650, "epoch": 5923} {"train_loss": -27.40608024597168, "global_step": 491651, "epoch": 5923} {"train_loss": -27.598718643188477, "global_step": 491652, "epoch": 5923} {"train_loss": -27.408430099487305, "global_step": 491653, "epoch": 5923} {"train_loss": -27.523340225219727, "global_step": 491654, "epoch": 5923} {"train_loss": -27.307336807250977, "global_step": 491655, "epoch": 5923} {"train_loss": -27.630237579345703, "global_step": 491656, "epoch": 5923} {"train_loss": -27.416364669799805, "global_step": 491657, "epoch": 5923} {"train_loss": -27.904226303100586, "global_step": 491658, "epoch": 5923} {"train_loss": -27.16813087463379, "global_step": 491659, "epoch": 5923} {"train_loss": -27.553197860717773, "global_step": 491660, "epoch": 5923} {"train_loss": -27.517475128173828, "global_step": 491661, "epoch": 5923} {"train_loss": -27.803054809570312, "global_step": 491662, "epoch": 5923} {"train_loss": -27.28046989440918, "global_step": 491663, "epoch": 5923} {"train_loss": -27.783777236938477, "global_step": 491664, "epoch": 5923} {"train_loss": -27.35298728942871, "global_step": 491665, "epoch": 5923} {"train_loss": -27.4599552154541, "global_step": 491666, "epoch": 5923} {"train_loss": -27.169469833374023, "global_step": 491667, "epoch": 5923} {"train_loss": -27.514936447143555, "global_step": 491668, "epoch": 5923} {"train_loss": -27.102766036987305, "global_step": 491669, "epoch": 5923} {"train_loss": -26.9820556640625, "global_step": 491670, "epoch": 5923} {"train_loss": -26.79448890686035, "global_step": 491671, "epoch": 5923} {"train_loss": -27.19276237487793, "global_step": 491672, "epoch": 5923} {"train_loss": -27.379470825195312, "global_step": 491673, "epoch": 5923} {"train_loss": -27.26504898071289, "global_step": 491674, "epoch": 5923} {"train_loss": -26.7409610748291, "global_step": 491675, "epoch": 5923} {"train_loss": -26.830093383789062, "global_step": 491676, "epoch": 5923} {"train_loss": -27.36289405822754, "global_step": 491677, "epoch": 5923} {"train_loss": -27.26776123046875, "global_step": 491678, "epoch": 5923} {"train_loss": -27.253284454345703, "global_step": 491679, "epoch": 5923} {"train_loss": -27.718902587890625, "global_step": 491680, "epoch": 5923} {"train_loss": -26.995838165283203, "global_step": 491681, "epoch": 5923} {"train_loss": -27.158910751342773, "global_step": 491682, "epoch": 5923} {"train_loss": -27.262470245361328, "global_step": 491683, "epoch": 5923} {"train_loss": -26.956567764282227, "global_step": 491684, "epoch": 5923} {"train_loss": -27.3377685546875, "global_step": 491685, "epoch": 5923} {"train_loss": -27.115442276000977, "global_step": 491686, "epoch": 5923} {"train_loss": -27.57074546813965, "global_step": 491687, "epoch": 5923} {"train_loss": -27.160343170166016, "global_step": 491688, "epoch": 5923} {"train_loss": -27.566999435424805, "global_step": 491689, "epoch": 5923} {"train_loss": -26.729917526245117, "global_step": 491690, "epoch": 5923} {"train_loss": -27.236709479826043, "global_step": 491691, "epoch": 5923, "val_loss": 6564729.5} {"train_loss": -27.038257598876953, "global_step": 491692, "epoch": 5924} {"train_loss": -27.289159774780273, "global_step": 491693, "epoch": 5924} {"train_loss": -26.765241622924805, "global_step": 491694, "epoch": 5924} {"train_loss": -27.161819458007812, "global_step": 491695, "epoch": 5924} {"train_loss": -27.300954818725586, "global_step": 491696, "epoch": 5924} {"train_loss": -27.36126708984375, "global_step": 491697, "epoch": 5924} {"train_loss": -27.136280059814453, "global_step": 491698, "epoch": 5924} {"train_loss": -27.35614013671875, "global_step": 491699, "epoch": 5924} {"train_loss": -27.367902755737305, "global_step": 491700, "epoch": 5924} {"train_loss": -26.70465660095215, "global_step": 491701, "epoch": 5924} {"train_loss": -27.36797523498535, "global_step": 491702, "epoch": 5924} {"train_loss": -27.215356826782227, "global_step": 491703, "epoch": 5924} {"train_loss": -27.20172119140625, "global_step": 491704, "epoch": 5924} {"train_loss": -27.085683822631836, "global_step": 491705, "epoch": 5924} {"train_loss": -27.394744873046875, "global_step": 491706, "epoch": 5924} {"train_loss": -27.567047119140625, "global_step": 491707, "epoch": 5924} {"train_loss": -27.52589225769043, "global_step": 491708, "epoch": 5924} {"train_loss": -27.461380004882812, "global_step": 491709, "epoch": 5924} {"train_loss": -27.676748275756836, "global_step": 491710, "epoch": 5924} {"train_loss": -27.3106746673584, "global_step": 491711, "epoch": 5924} {"train_loss": -26.9325008392334, "global_step": 491712, "epoch": 5924} {"train_loss": -27.35706901550293, "global_step": 491713, "epoch": 5924} {"train_loss": -27.176132202148438, "global_step": 491714, "epoch": 5924} {"train_loss": -27.5739688873291, "global_step": 491715, "epoch": 5924} {"train_loss": -27.075937271118164, "global_step": 491716, "epoch": 5924} {"train_loss": -27.882068634033203, "global_step": 491717, "epoch": 5924} {"train_loss": -27.47150230407715, "global_step": 491718, "epoch": 5924} {"train_loss": -27.579151153564453, "global_step": 491719, "epoch": 5924} {"train_loss": -27.30381202697754, "global_step": 491720, "epoch": 5924} {"train_loss": -27.177021026611328, "global_step": 491721, "epoch": 5924} {"train_loss": -27.560138702392578, "global_step": 491722, "epoch": 5924} {"train_loss": -27.73247718811035, "global_step": 491723, "epoch": 5924} {"train_loss": -27.414377212524414, "global_step": 491724, "epoch": 5924} {"train_loss": -27.38924217224121, "global_step": 491725, "epoch": 5924} {"train_loss": -27.3206787109375, "global_step": 491726, "epoch": 5924} {"train_loss": -27.317279815673828, "global_step": 491727, "epoch": 5924} {"train_loss": -27.5657958984375, "global_step": 491728, "epoch": 5924} {"train_loss": -27.306777954101562, "global_step": 491729, "epoch": 5924} {"train_loss": -27.948734283447266, "global_step": 491730, "epoch": 5924} {"train_loss": -27.646015167236328, "global_step": 491731, "epoch": 5924} {"train_loss": -27.748046875, "global_step": 491732, "epoch": 5924} {"train_loss": -27.238752365112305, "global_step": 491733, "epoch": 5924} {"train_loss": -26.65875244140625, "global_step": 491734, "epoch": 5924} {"train_loss": -25.484128952026367, "global_step": 491735, "epoch": 5924} {"train_loss": -24.3572940826416, "global_step": 491736, "epoch": 5924} {"train_loss": -25.225154876708984, "global_step": 491737, "epoch": 5924} {"train_loss": -25.548995971679688, "global_step": 491738, "epoch": 5924} {"train_loss": -26.438098907470703, "global_step": 491739, "epoch": 5924} {"train_loss": -25.909439086914062, "global_step": 491740, "epoch": 5924} {"train_loss": -26.53321647644043, "global_step": 491741, "epoch": 5924} {"train_loss": -26.035825729370117, "global_step": 491742, "epoch": 5924} {"train_loss": -26.90785026550293, "global_step": 491743, "epoch": 5924} {"train_loss": -26.457611083984375, "global_step": 491744, "epoch": 5924} {"train_loss": -26.6646728515625, "global_step": 491745, "epoch": 5924} {"train_loss": -26.98508644104004, "global_step": 491746, "epoch": 5924} {"train_loss": -26.58223533630371, "global_step": 491747, "epoch": 5924} {"train_loss": -26.48532485961914, "global_step": 491748, "epoch": 5924} {"train_loss": -27.289642333984375, "global_step": 491749, "epoch": 5924} {"train_loss": -26.702634811401367, "global_step": 491750, "epoch": 5924} {"train_loss": -27.041357040405273, "global_step": 491751, "epoch": 5924} {"train_loss": -26.955280303955078, "global_step": 491752, "epoch": 5924} {"train_loss": -26.81985855102539, "global_step": 491753, "epoch": 5924} {"train_loss": -27.105993270874023, "global_step": 491754, "epoch": 5924} {"train_loss": -26.96822166442871, "global_step": 491755, "epoch": 5924} {"train_loss": -26.970172882080078, "global_step": 491756, "epoch": 5924} {"train_loss": -26.947772979736328, "global_step": 491757, "epoch": 5924} {"train_loss": -26.830102920532227, "global_step": 491758, "epoch": 5924} {"train_loss": -26.964447021484375, "global_step": 491759, "epoch": 5924} {"train_loss": -26.821271896362305, "global_step": 491760, "epoch": 5924} {"train_loss": -27.447431564331055, "global_step": 491761, "epoch": 5924} {"train_loss": -27.131235122680664, "global_step": 491762, "epoch": 5924} {"train_loss": -27.25724220275879, "global_step": 491763, "epoch": 5924} {"train_loss": -27.052078247070312, "global_step": 491764, "epoch": 5924} {"train_loss": -27.08810806274414, "global_step": 491765, "epoch": 5924} {"train_loss": -26.927160263061523, "global_step": 491766, "epoch": 5924} {"train_loss": -27.0106201171875, "global_step": 491767, "epoch": 5924} {"train_loss": -27.471643447875977, "global_step": 491768, "epoch": 5924} {"train_loss": -27.38822364807129, "global_step": 491769, "epoch": 5924} {"train_loss": -27.579309463500977, "global_step": 491770, "epoch": 5924} {"train_loss": -27.51556396484375, "global_step": 491771, "epoch": 5924} {"train_loss": -27.65369987487793, "global_step": 491772, "epoch": 5924} {"train_loss": -27.47913932800293, "global_step": 491773, "epoch": 5924} {"train_loss": -27.073907760252435, "global_step": 491774, "epoch": 5924, "val_loss": 6626072.0} {"train_loss": -27.17884635925293, "global_step": 491775, "epoch": 5925} {"train_loss": -27.324487686157227, "global_step": 491776, "epoch": 5925} {"train_loss": -27.310041427612305, "global_step": 491777, "epoch": 5925} {"train_loss": -27.036518096923828, "global_step": 491778, "epoch": 5925} {"train_loss": -27.082555770874023, "global_step": 491779, "epoch": 5925} {"train_loss": -26.87057876586914, "global_step": 491780, "epoch": 5925} {"train_loss": -27.75188636779785, "global_step": 491781, "epoch": 5925} {"train_loss": -27.354389190673828, "global_step": 491782, "epoch": 5925} {"train_loss": -27.4356689453125, "global_step": 491783, "epoch": 5925} {"train_loss": -27.980016708374023, "global_step": 491784, "epoch": 5925} {"train_loss": -27.291507720947266, "global_step": 491785, "epoch": 5925} {"train_loss": -27.46051597595215, "global_step": 491786, "epoch": 5925} {"train_loss": -27.611474990844727, "global_step": 491787, "epoch": 5925} {"train_loss": -27.213403701782227, "global_step": 491788, "epoch": 5925} {"train_loss": -27.378711700439453, "global_step": 491789, "epoch": 5925} {"train_loss": -27.63535499572754, "global_step": 491790, "epoch": 5925} {"train_loss": -27.330554962158203, "global_step": 491791, "epoch": 5925} {"train_loss": -27.5068359375, "global_step": 491792, "epoch": 5925} {"train_loss": -27.24098014831543, "global_step": 491793, "epoch": 5925} {"train_loss": -27.524747848510742, "global_step": 491794, "epoch": 5925} {"train_loss": -27.57509422302246, "global_step": 491795, "epoch": 5925} {"train_loss": -27.640716552734375, "global_step": 491796, "epoch": 5925} {"train_loss": -27.283201217651367, "global_step": 491797, "epoch": 5925} {"train_loss": -27.381460189819336, "global_step": 491798, "epoch": 5925} {"train_loss": -27.325239181518555, "global_step": 491799, "epoch": 5925} {"train_loss": -27.47633171081543, "global_step": 491800, "epoch": 5925} {"train_loss": -27.504638671875, "global_step": 491801, "epoch": 5925} {"train_loss": -27.263761520385742, "global_step": 491802, "epoch": 5925} {"train_loss": -27.482818603515625, "global_step": 491803, "epoch": 5925} {"train_loss": -27.207056045532227, "global_step": 491804, "epoch": 5925} {"train_loss": -27.405649185180664, "global_step": 491805, "epoch": 5925} {"train_loss": -27.76630973815918, "global_step": 491806, "epoch": 5925} {"train_loss": -27.058279037475586, "global_step": 491807, "epoch": 5925} {"train_loss": -27.126447677612305, "global_step": 491808, "epoch": 5925} {"train_loss": -27.126007080078125, "global_step": 491809, "epoch": 5925} {"train_loss": -27.78217124938965, "global_step": 491810, "epoch": 5925} {"train_loss": -27.235300064086914, "global_step": 491811, "epoch": 5925} {"train_loss": -27.27518653869629, "global_step": 491812, "epoch": 5925} {"train_loss": -26.5556583404541, "global_step": 491813, "epoch": 5925} {"train_loss": -27.124710083007812, "global_step": 491814, "epoch": 5925} {"train_loss": -27.006677627563477, "global_step": 491815, "epoch": 5925} {"train_loss": -27.107892990112305, "global_step": 491816, "epoch": 5925} {"train_loss": -26.768102645874023, "global_step": 491817, "epoch": 5925} {"train_loss": -27.42232322692871, "global_step": 491818, "epoch": 5925} {"train_loss": -27.37501335144043, "global_step": 491819, "epoch": 5925} {"train_loss": -27.211095809936523, "global_step": 491820, "epoch": 5925} {"train_loss": -26.991125106811523, "global_step": 491821, "epoch": 5925} {"train_loss": -27.380163192749023, "global_step": 491822, "epoch": 5925} {"train_loss": -26.80661392211914, "global_step": 491823, "epoch": 5925} {"train_loss": -27.288671493530273, "global_step": 491824, "epoch": 5925} {"train_loss": -26.758275985717773, "global_step": 491825, "epoch": 5925} {"train_loss": -27.073740005493164, "global_step": 491826, "epoch": 5925} {"train_loss": -27.45587730407715, "global_step": 491827, "epoch": 5925} {"train_loss": -27.557931900024414, "global_step": 491828, "epoch": 5925} {"train_loss": -27.19174575805664, "global_step": 491829, "epoch": 5925} {"train_loss": -26.959369659423828, "global_step": 491830, "epoch": 5925} {"train_loss": -27.329559326171875, "global_step": 491831, "epoch": 5925} {"train_loss": -27.322351455688477, "global_step": 491832, "epoch": 5925} {"train_loss": -27.025110244750977, "global_step": 491833, "epoch": 5925} {"train_loss": -27.328149795532227, "global_step": 491834, "epoch": 5925} {"train_loss": -27.002431869506836, "global_step": 491835, "epoch": 5925} {"train_loss": -27.40302085876465, "global_step": 491836, "epoch": 5925} {"train_loss": -26.988393783569336, "global_step": 491837, "epoch": 5925} {"train_loss": -26.69121742248535, "global_step": 491838, "epoch": 5925} {"train_loss": -27.48267936706543, "global_step": 491839, "epoch": 5925} {"train_loss": -27.0596923828125, "global_step": 491840, "epoch": 5925} {"train_loss": -27.48451042175293, "global_step": 491841, "epoch": 5925} {"train_loss": -27.17009925842285, "global_step": 491842, "epoch": 5925} {"train_loss": -27.165197372436523, "global_step": 491843, "epoch": 5925} {"train_loss": -26.995969772338867, "global_step": 491844, "epoch": 5925} {"train_loss": -27.721765518188477, "global_step": 491845, "epoch": 5925} {"train_loss": -26.94498062133789, "global_step": 491846, "epoch": 5925} {"train_loss": -27.180618286132812, "global_step": 491847, "epoch": 5925} {"train_loss": -26.85270118713379, "global_step": 491848, "epoch": 5925} {"train_loss": -27.17359733581543, "global_step": 491849, "epoch": 5925} {"train_loss": -26.648944854736328, "global_step": 491850, "epoch": 5925} {"train_loss": -27.335046768188477, "global_step": 491851, "epoch": 5925} {"train_loss": -26.69785499572754, "global_step": 491852, "epoch": 5925} {"train_loss": -27.091894149780273, "global_step": 491853, "epoch": 5925} {"train_loss": -27.350393295288086, "global_step": 491854, "epoch": 5925} {"train_loss": -27.2379207611084, "global_step": 491855, "epoch": 5925} {"train_loss": -26.85723304748535, "global_step": 491856, "epoch": 5925} {"train_loss": -27.236890356224702, "global_step": 491857, "epoch": 5925, "val_loss": 6526262.0} {"train_loss": -26.70673179626465, "global_step": 491858, "epoch": 5926} {"train_loss": -27.2188720703125, "global_step": 491859, "epoch": 5926} {"train_loss": -26.673267364501953, "global_step": 491860, "epoch": 5926} {"train_loss": -26.94583511352539, "global_step": 491861, "epoch": 5926} {"train_loss": -26.919652938842773, "global_step": 491862, "epoch": 5926} {"train_loss": -27.118398666381836, "global_step": 491863, "epoch": 5926} {"train_loss": -27.073989868164062, "global_step": 491864, "epoch": 5926} {"train_loss": -26.760236740112305, "global_step": 491865, "epoch": 5926} {"train_loss": -27.214202880859375, "global_step": 491866, "epoch": 5926} {"train_loss": -27.12222671508789, "global_step": 491867, "epoch": 5926} {"train_loss": -27.178466796875, "global_step": 491868, "epoch": 5926} {"train_loss": -27.28253746032715, "global_step": 491869, "epoch": 5926} {"train_loss": -27.343097686767578, "global_step": 491870, "epoch": 5926} {"train_loss": -27.030303955078125, "global_step": 491871, "epoch": 5926} {"train_loss": -27.1462459564209, "global_step": 491872, "epoch": 5926} {"train_loss": -27.018142700195312, "global_step": 491873, "epoch": 5926} {"train_loss": -27.07123374938965, "global_step": 491874, "epoch": 5926} {"train_loss": -27.42902183532715, "global_step": 491875, "epoch": 5926} {"train_loss": -27.112640380859375, "global_step": 491876, "epoch": 5926} {"train_loss": -27.647266387939453, "global_step": 491877, "epoch": 5926} {"train_loss": -27.41558265686035, "global_step": 491878, "epoch": 5926} {"train_loss": -27.60331153869629, "global_step": 491879, "epoch": 5926} {"train_loss": -27.312158584594727, "global_step": 491880, "epoch": 5926} {"train_loss": -27.26093101501465, "global_step": 491881, "epoch": 5926} {"train_loss": -27.18023109436035, "global_step": 491882, "epoch": 5926} {"train_loss": -27.55653190612793, "global_step": 491883, "epoch": 5926} {"train_loss": -27.722156524658203, "global_step": 491884, "epoch": 5926} {"train_loss": -27.528675079345703, "global_step": 491885, "epoch": 5926} {"train_loss": -27.541946411132812, "global_step": 491886, "epoch": 5926} {"train_loss": -27.846113204956055, "global_step": 491887, "epoch": 5926} {"train_loss": -27.263540267944336, "global_step": 491888, "epoch": 5926} {"train_loss": -27.296844482421875, "global_step": 491889, "epoch": 5926} {"train_loss": -27.588836669921875, "global_step": 491890, "epoch": 5926} {"train_loss": -27.681781768798828, "global_step": 491891, "epoch": 5926} {"train_loss": -28.157861709594727, "global_step": 491892, "epoch": 5926} {"train_loss": -27.484668731689453, "global_step": 491893, "epoch": 5926} {"train_loss": -27.837194442749023, "global_step": 491894, "epoch": 5926} {"train_loss": -27.25571632385254, "global_step": 491895, "epoch": 5926} {"train_loss": -27.831253051757812, "global_step": 491896, "epoch": 5926} {"train_loss": -27.170093536376953, "global_step": 491897, "epoch": 5926} {"train_loss": -27.59998893737793, "global_step": 491898, "epoch": 5926} {"train_loss": -27.21209144592285, "global_step": 491899, "epoch": 5926} {"train_loss": -27.85031509399414, "global_step": 491900, "epoch": 5926} {"train_loss": -27.442594528198242, "global_step": 491901, "epoch": 5926} {"train_loss": -27.5018367767334, "global_step": 491902, "epoch": 5926} {"train_loss": -27.640674591064453, "global_step": 491903, "epoch": 5926} {"train_loss": -27.86639404296875, "global_step": 491904, "epoch": 5926} {"train_loss": -27.526777267456055, "global_step": 491905, "epoch": 5926} {"train_loss": -27.309412002563477, "global_step": 491906, "epoch": 5926} {"train_loss": -27.268054962158203, "global_step": 491907, "epoch": 5926} {"train_loss": -27.740875244140625, "global_step": 491908, "epoch": 5926} {"train_loss": -27.458648681640625, "global_step": 491909, "epoch": 5926} {"train_loss": -27.47625732421875, "global_step": 491910, "epoch": 5926} {"train_loss": -27.186368942260742, "global_step": 491911, "epoch": 5926} {"train_loss": -27.271650314331055, "global_step": 491912, "epoch": 5926} {"train_loss": -27.313928604125977, "global_step": 491913, "epoch": 5926} {"train_loss": -27.258853912353516, "global_step": 491914, "epoch": 5926} {"train_loss": -26.733795166015625, "global_step": 491915, "epoch": 5926} {"train_loss": -25.86441421508789, "global_step": 491916, "epoch": 5926} {"train_loss": -24.96988868713379, "global_step": 491917, "epoch": 5926} {"train_loss": -24.532339096069336, "global_step": 491918, "epoch": 5926} {"train_loss": -25.343814849853516, "global_step": 491919, "epoch": 5926} {"train_loss": -25.944272994995117, "global_step": 491920, "epoch": 5926} {"train_loss": -26.978925704956055, "global_step": 491921, "epoch": 5926} {"train_loss": -26.01680564880371, "global_step": 491922, "epoch": 5926} {"train_loss": -26.69028663635254, "global_step": 491923, "epoch": 5926} {"train_loss": -26.595800399780273, "global_step": 491924, "epoch": 5926} {"train_loss": -26.602008819580078, "global_step": 491925, "epoch": 5926} {"train_loss": -27.0633544921875, "global_step": 491926, "epoch": 5926} {"train_loss": -26.797199249267578, "global_step": 491927, "epoch": 5926} {"train_loss": -27.072437286376953, "global_step": 491928, "epoch": 5926} {"train_loss": -26.10931968688965, "global_step": 491929, "epoch": 5926} {"train_loss": -26.799474716186523, "global_step": 491930, "epoch": 5926} {"train_loss": -26.866113662719727, "global_step": 491931, "epoch": 5926} {"train_loss": -27.2866268157959, "global_step": 491932, "epoch": 5926} {"train_loss": -26.491376876831055, "global_step": 491933, "epoch": 5926} {"train_loss": -26.90882682800293, "global_step": 491934, "epoch": 5926} {"train_loss": -27.056859970092773, "global_step": 491935, "epoch": 5926} {"train_loss": -26.792709350585938, "global_step": 491936, "epoch": 5926} {"train_loss": -27.238367080688477, "global_step": 491937, "epoch": 5926} {"train_loss": -26.764184951782227, "global_step": 491938, "epoch": 5926} {"train_loss": -26.877399444580078, "global_step": 491939, "epoch": 5926} {"train_loss": -27.102119790502343, "global_step": 491940, "epoch": 5926, "val_loss": 6616175.5} {"train_loss": -26.65972900390625, "global_step": 491941, "epoch": 5927} {"train_loss": -26.51422119140625, "global_step": 491942, "epoch": 5927} {"train_loss": -26.742353439331055, "global_step": 491943, "epoch": 5927} {"train_loss": -26.583898544311523, "global_step": 491944, "epoch": 5927} {"train_loss": -26.484548568725586, "global_step": 491945, "epoch": 5927} {"train_loss": -26.576126098632812, "global_step": 491946, "epoch": 5927} {"train_loss": -26.776670455932617, "global_step": 491947, "epoch": 5927} {"train_loss": -26.8472843170166, "global_step": 491948, "epoch": 5927} {"train_loss": -26.7512264251709, "global_step": 491949, "epoch": 5927} {"train_loss": -26.692304611206055, "global_step": 491950, "epoch": 5927} {"train_loss": -26.765644073486328, "global_step": 491951, "epoch": 5927} {"train_loss": -26.8342342376709, "global_step": 491952, "epoch": 5927} {"train_loss": -27.01289176940918, "global_step": 491953, "epoch": 5927} {"train_loss": -26.697574615478516, "global_step": 491954, "epoch": 5927} {"train_loss": -27.07513999938965, "global_step": 491955, "epoch": 5927} {"train_loss": -27.05242347717285, "global_step": 491956, "epoch": 5927} {"train_loss": -27.119449615478516, "global_step": 491957, "epoch": 5927} {"train_loss": -26.98810386657715, "global_step": 491958, "epoch": 5927} {"train_loss": -26.93265724182129, "global_step": 491959, "epoch": 5927} {"train_loss": -26.889272689819336, "global_step": 491960, "epoch": 5927} {"train_loss": -27.276214599609375, "global_step": 491961, "epoch": 5927} {"train_loss": -27.15924072265625, "global_step": 491962, "epoch": 5927} {"train_loss": -27.000701904296875, "global_step": 491963, "epoch": 5927} {"train_loss": -27.31818199157715, "global_step": 491964, "epoch": 5927} {"train_loss": -27.188404083251953, "global_step": 491965, "epoch": 5927} {"train_loss": -27.44412612915039, "global_step": 491966, "epoch": 5927} {"train_loss": -27.157352447509766, "global_step": 491967, "epoch": 5927} {"train_loss": -27.187152862548828, "global_step": 491968, "epoch": 5927} {"train_loss": -27.1284122467041, "global_step": 491969, "epoch": 5927} {"train_loss": -27.41163444519043, "global_step": 491970, "epoch": 5927} {"train_loss": -27.253482818603516, "global_step": 491971, "epoch": 5927} {"train_loss": -27.51576805114746, "global_step": 491972, "epoch": 5927} {"train_loss": -27.14727783203125, "global_step": 491973, "epoch": 5927} {"train_loss": -27.299951553344727, "global_step": 491974, "epoch": 5927} {"train_loss": -27.525039672851562, "global_step": 491975, "epoch": 5927} {"train_loss": -27.2982120513916, "global_step": 491976, "epoch": 5927} {"train_loss": -27.408597946166992, "global_step": 491977, "epoch": 5927} {"train_loss": -27.220884323120117, "global_step": 491978, "epoch": 5927} {"train_loss": -27.865589141845703, "global_step": 491979, "epoch": 5927} {"train_loss": -27.32611656188965, "global_step": 491980, "epoch": 5927} {"train_loss": -27.389745712280273, "global_step": 491981, "epoch": 5927} {"train_loss": -27.64861488342285, "global_step": 491982, "epoch": 5927} {"train_loss": -27.546056747436523, "global_step": 491983, "epoch": 5927} {"train_loss": -27.187143325805664, "global_step": 491984, "epoch": 5927} {"train_loss": -27.2447566986084, "global_step": 491985, "epoch": 5927} {"train_loss": -27.676782608032227, "global_step": 491986, "epoch": 5927} {"train_loss": -27.366437911987305, "global_step": 491987, "epoch": 5927} {"train_loss": -27.337278366088867, "global_step": 491988, "epoch": 5927} {"train_loss": -27.295495986938477, "global_step": 491989, "epoch": 5927} {"train_loss": -27.462804794311523, "global_step": 491990, "epoch": 5927} {"train_loss": -27.518564224243164, "global_step": 491991, "epoch": 5927} {"train_loss": -27.517194747924805, "global_step": 491992, "epoch": 5927} {"train_loss": -27.37982749938965, "global_step": 491993, "epoch": 5927} {"train_loss": -27.530517578125, "global_step": 491994, "epoch": 5927} {"train_loss": -27.168563842773438, "global_step": 491995, "epoch": 5927} {"train_loss": -27.289642333984375, "global_step": 491996, "epoch": 5927} {"train_loss": -27.106201171875, "global_step": 491997, "epoch": 5927} {"train_loss": -27.595325469970703, "global_step": 491998, "epoch": 5927} {"train_loss": -27.36115074157715, "global_step": 491999, "epoch": 5927} {"train_loss": -27.21341323852539, "global_step": 492000, "epoch": 5927} {"train_loss": -27.175512313842773, "global_step": 492001, "epoch": 5927} {"train_loss": -27.759180068969727, "global_step": 492002, "epoch": 5927} {"train_loss": -26.985761642456055, "global_step": 492003, "epoch": 5927} {"train_loss": -27.463211059570312, "global_step": 492004, "epoch": 5927} {"train_loss": -27.48346519470215, "global_step": 492005, "epoch": 5927} {"train_loss": -27.267175674438477, "global_step": 492006, "epoch": 5927} {"train_loss": -27.571277618408203, "global_step": 492007, "epoch": 5927} {"train_loss": -26.958831787109375, "global_step": 492008, "epoch": 5927} {"train_loss": -27.030485153198242, "global_step": 492009, "epoch": 5927} {"train_loss": -27.0373592376709, "global_step": 492010, "epoch": 5927} {"train_loss": -27.25001335144043, "global_step": 492011, "epoch": 5927} {"train_loss": -27.373931884765625, "global_step": 492012, "epoch": 5927} {"train_loss": -27.443695068359375, "global_step": 492013, "epoch": 5927} {"train_loss": -27.2103214263916, "global_step": 492014, "epoch": 5927} {"train_loss": -27.01311683654785, "global_step": 492015, "epoch": 5927} {"train_loss": -27.548858642578125, "global_step": 492016, "epoch": 5927} {"train_loss": -27.352191925048828, "global_step": 492017, "epoch": 5927} {"train_loss": -27.180307388305664, "global_step": 492018, "epoch": 5927} {"train_loss": -27.342126846313477, "global_step": 492019, "epoch": 5927} {"train_loss": -27.4329833984375, "global_step": 492020, "epoch": 5927} {"train_loss": -27.47015380859375, "global_step": 492021, "epoch": 5927} {"train_loss": -27.27876853942871, "global_step": 492022, "epoch": 5927} {"train_loss": -27.18619029493217, "global_step": 492023, "epoch": 5927, "val_loss": 6620322.0} {"train_loss": -26.474706649780273, "global_step": 492024, "epoch": 5928} {"train_loss": -26.4051513671875, "global_step": 492025, "epoch": 5928} {"train_loss": -26.6363525390625, "global_step": 492026, "epoch": 5928} {"train_loss": -26.652297973632812, "global_step": 492027, "epoch": 5928} {"train_loss": -26.357105255126953, "global_step": 492028, "epoch": 5928} {"train_loss": -26.374176025390625, "global_step": 492029, "epoch": 5928} {"train_loss": -27.35023307800293, "global_step": 492030, "epoch": 5928} {"train_loss": -26.78944206237793, "global_step": 492031, "epoch": 5928} {"train_loss": -26.5235595703125, "global_step": 492032, "epoch": 5928} {"train_loss": -26.809904098510742, "global_step": 492033, "epoch": 5928} {"train_loss": -26.951513290405273, "global_step": 492034, "epoch": 5928} {"train_loss": -26.80784034729004, "global_step": 492035, "epoch": 5928} {"train_loss": -26.95352554321289, "global_step": 492036, "epoch": 5928} {"train_loss": -27.028339385986328, "global_step": 492037, "epoch": 5928} {"train_loss": -27.068653106689453, "global_step": 492038, "epoch": 5928} {"train_loss": -26.921655654907227, "global_step": 492039, "epoch": 5928} {"train_loss": -27.17902946472168, "global_step": 492040, "epoch": 5928} {"train_loss": -27.073144912719727, "global_step": 492041, "epoch": 5928} {"train_loss": -27.02490234375, "global_step": 492042, "epoch": 5928} {"train_loss": -27.418338775634766, "global_step": 492043, "epoch": 5928} {"train_loss": -27.13370704650879, "global_step": 492044, "epoch": 5928} {"train_loss": -26.715240478515625, "global_step": 492045, "epoch": 5928} {"train_loss": -27.17982292175293, "global_step": 492046, "epoch": 5928} {"train_loss": -27.66584587097168, "global_step": 492047, "epoch": 5928} {"train_loss": -27.07465934753418, "global_step": 492048, "epoch": 5928} {"train_loss": -27.5667781829834, "global_step": 492049, "epoch": 5928} {"train_loss": -27.35247802734375, "global_step": 492050, "epoch": 5928} {"train_loss": -27.192276000976562, "global_step": 492051, "epoch": 5928} {"train_loss": -27.387054443359375, "global_step": 492052, "epoch": 5928} {"train_loss": -27.388330459594727, "global_step": 492053, "epoch": 5928} {"train_loss": -27.3309326171875, "global_step": 492054, "epoch": 5928} {"train_loss": -27.744421005249023, "global_step": 492055, "epoch": 5928} {"train_loss": -26.919504165649414, "global_step": 492056, "epoch": 5928} {"train_loss": -27.327932357788086, "global_step": 492057, "epoch": 5928} {"train_loss": -27.336627960205078, "global_step": 492058, "epoch": 5928} {"train_loss": -27.705738067626953, "global_step": 492059, "epoch": 5928} {"train_loss": -27.274961471557617, "global_step": 492060, "epoch": 5928} {"train_loss": -27.464359283447266, "global_step": 492061, "epoch": 5928} {"train_loss": -27.398923873901367, "global_step": 492062, "epoch": 5928} {"train_loss": -27.27152442932129, "global_step": 492063, "epoch": 5928} {"train_loss": -27.702096939086914, "global_step": 492064, "epoch": 5928} {"train_loss": -27.672595977783203, "global_step": 492065, "epoch": 5928} {"train_loss": -27.539045333862305, "global_step": 492066, "epoch": 5928} {"train_loss": -27.374998092651367, "global_step": 492067, "epoch": 5928} {"train_loss": -27.607568740844727, "global_step": 492068, "epoch": 5928} {"train_loss": -27.994077682495117, "global_step": 492069, "epoch": 5928} {"train_loss": -27.483057022094727, "global_step": 492070, "epoch": 5928} {"train_loss": -27.186315536499023, "global_step": 492071, "epoch": 5928} {"train_loss": -27.051198959350586, "global_step": 492072, "epoch": 5928} {"train_loss": -26.92530632019043, "global_step": 492073, "epoch": 5928} {"train_loss": -26.446247100830078, "global_step": 492074, "epoch": 5928} {"train_loss": -27.257810592651367, "global_step": 492075, "epoch": 5928} {"train_loss": -27.966018676757812, "global_step": 492076, "epoch": 5928} {"train_loss": -26.981176376342773, "global_step": 492077, "epoch": 5928} {"train_loss": -27.4058780670166, "global_step": 492078, "epoch": 5928} {"train_loss": -27.154394149780273, "global_step": 492079, "epoch": 5928} {"train_loss": -26.977048873901367, "global_step": 492080, "epoch": 5928} {"train_loss": -27.432641983032227, "global_step": 492081, "epoch": 5928} {"train_loss": -27.248355865478516, "global_step": 492082, "epoch": 5928} {"train_loss": -27.202741622924805, "global_step": 492083, "epoch": 5928} {"train_loss": -27.222293853759766, "global_step": 492084, "epoch": 5928} {"train_loss": -27.15714454650879, "global_step": 492085, "epoch": 5928} {"train_loss": -27.40447998046875, "global_step": 492086, "epoch": 5928} {"train_loss": -27.501331329345703, "global_step": 492087, "epoch": 5928} {"train_loss": -27.474599838256836, "global_step": 492088, "epoch": 5928} {"train_loss": -27.511478424072266, "global_step": 492089, "epoch": 5928} {"train_loss": -27.02876853942871, "global_step": 492090, "epoch": 5928} {"train_loss": -27.24457359313965, "global_step": 492091, "epoch": 5928} {"train_loss": -26.833160400390625, "global_step": 492092, "epoch": 5928} {"train_loss": -27.33967399597168, "global_step": 492093, "epoch": 5928} {"train_loss": -27.38400650024414, "global_step": 492094, "epoch": 5928} {"train_loss": -27.429956436157227, "global_step": 492095, "epoch": 5928} {"train_loss": -26.961166381835938, "global_step": 492096, "epoch": 5928} {"train_loss": -27.492273330688477, "global_step": 492097, "epoch": 5928} {"train_loss": -27.5281925201416, "global_step": 492098, "epoch": 5928} {"train_loss": -27.247573852539062, "global_step": 492099, "epoch": 5928} {"train_loss": -27.03704261779785, "global_step": 492100, "epoch": 5928} {"train_loss": -27.3140926361084, "global_step": 492101, "epoch": 5928} {"train_loss": -27.2175350189209, "global_step": 492102, "epoch": 5928} {"train_loss": -27.4522647857666, "global_step": 492103, "epoch": 5928} {"train_loss": -27.168521881103516, "global_step": 492104, "epoch": 5928} {"train_loss": -27.214237213134766, "global_step": 492105, "epoch": 5928} {"train_loss": -27.195811329117742, "global_step": 492106, "epoch": 5928, "val_loss": 6543149.0} {"train_loss": -27.118270874023438, "global_step": 492107, "epoch": 5929} {"train_loss": -26.56683921813965, "global_step": 492108, "epoch": 5929} {"train_loss": -27.010400772094727, "global_step": 492109, "epoch": 5929} {"train_loss": -27.269643783569336, "global_step": 492110, "epoch": 5929} {"train_loss": -27.28523826599121, "global_step": 492111, "epoch": 5929} {"train_loss": -26.804035186767578, "global_step": 492112, "epoch": 5929} {"train_loss": -27.184467315673828, "global_step": 492113, "epoch": 5929} {"train_loss": -27.090351104736328, "global_step": 492114, "epoch": 5929} {"train_loss": -27.32606315612793, "global_step": 492115, "epoch": 5929} {"train_loss": -27.351125717163086, "global_step": 492116, "epoch": 5929} {"train_loss": -27.062580108642578, "global_step": 492117, "epoch": 5929} {"train_loss": -27.2012882232666, "global_step": 492118, "epoch": 5929} {"train_loss": -26.89800453186035, "global_step": 492119, "epoch": 5929} {"train_loss": -27.369543075561523, "global_step": 492120, "epoch": 5929} {"train_loss": -27.22694206237793, "global_step": 492121, "epoch": 5929} {"train_loss": -27.327619552612305, "global_step": 492122, "epoch": 5929} {"train_loss": -27.317493438720703, "global_step": 492123, "epoch": 5929} {"train_loss": -27.12911033630371, "global_step": 492124, "epoch": 5929} {"train_loss": -27.676254272460938, "global_step": 492125, "epoch": 5929} {"train_loss": -27.13612937927246, "global_step": 492126, "epoch": 5929} {"train_loss": -26.38246726989746, "global_step": 492127, "epoch": 5929} {"train_loss": -26.80777359008789, "global_step": 492128, "epoch": 5929} {"train_loss": -27.275775909423828, "global_step": 492129, "epoch": 5929} {"train_loss": -27.441511154174805, "global_step": 492130, "epoch": 5929} {"train_loss": -27.19537353515625, "global_step": 492131, "epoch": 5929} {"train_loss": -27.05246353149414, "global_step": 492132, "epoch": 5929} {"train_loss": -27.36683464050293, "global_step": 492133, "epoch": 5929} {"train_loss": -27.156280517578125, "global_step": 492134, "epoch": 5929} {"train_loss": -27.0692138671875, "global_step": 492135, "epoch": 5929} {"train_loss": -27.018463134765625, "global_step": 492136, "epoch": 5929} {"train_loss": -27.4395694732666, "global_step": 492137, "epoch": 5929} {"train_loss": -26.990524291992188, "global_step": 492138, "epoch": 5929} {"train_loss": -27.146154403686523, "global_step": 492139, "epoch": 5929} {"train_loss": -27.26210594177246, "global_step": 492140, "epoch": 5929} {"train_loss": -27.31621742248535, "global_step": 492141, "epoch": 5929} {"train_loss": -27.546478271484375, "global_step": 492142, "epoch": 5929} {"train_loss": -27.058923721313477, "global_step": 492143, "epoch": 5929} {"train_loss": -27.314579010009766, "global_step": 492144, "epoch": 5929} {"train_loss": -27.3515625, "global_step": 492145, "epoch": 5929} {"train_loss": -27.60906410217285, "global_step": 492146, "epoch": 5929} {"train_loss": -27.163679122924805, "global_step": 492147, "epoch": 5929} {"train_loss": -27.273611068725586, "global_step": 492148, "epoch": 5929} {"train_loss": -27.771717071533203, "global_step": 492149, "epoch": 5929} {"train_loss": -27.356748580932617, "global_step": 492150, "epoch": 5929} {"train_loss": -27.294208526611328, "global_step": 492151, "epoch": 5929} {"train_loss": -27.61041259765625, "global_step": 492152, "epoch": 5929} {"train_loss": -27.449462890625, "global_step": 492153, "epoch": 5929} {"train_loss": -27.08418846130371, "global_step": 492154, "epoch": 5929} {"train_loss": -27.661184310913086, "global_step": 492155, "epoch": 5929} {"train_loss": -27.459741592407227, "global_step": 492156, "epoch": 5929} {"train_loss": -27.58607292175293, "global_step": 492157, "epoch": 5929} {"train_loss": -27.544570922851562, "global_step": 492158, "epoch": 5929} {"train_loss": -27.59278678894043, "global_step": 492159, "epoch": 5929} {"train_loss": -27.427642822265625, "global_step": 492160, "epoch": 5929} {"train_loss": -27.41522216796875, "global_step": 492161, "epoch": 5929} {"train_loss": -27.39455223083496, "global_step": 492162, "epoch": 5929} {"train_loss": -26.890735626220703, "global_step": 492163, "epoch": 5929} {"train_loss": -26.766992568969727, "global_step": 492164, "epoch": 5929} {"train_loss": -27.207691192626953, "global_step": 492165, "epoch": 5929} {"train_loss": -27.181049346923828, "global_step": 492166, "epoch": 5929} {"train_loss": -26.751047134399414, "global_step": 492167, "epoch": 5929} {"train_loss": -26.88226890563965, "global_step": 492168, "epoch": 5929} {"train_loss": -26.871784210205078, "global_step": 492169, "epoch": 5929} {"train_loss": -26.940542221069336, "global_step": 492170, "epoch": 5929} {"train_loss": -27.05620765686035, "global_step": 492171, "epoch": 5929} {"train_loss": -27.240768432617188, "global_step": 492172, "epoch": 5929} {"train_loss": -27.098173141479492, "global_step": 492173, "epoch": 5929} {"train_loss": -27.2273006439209, "global_step": 492174, "epoch": 5929} {"train_loss": -27.0157413482666, "global_step": 492175, "epoch": 5929} {"train_loss": -27.019086837768555, "global_step": 492176, "epoch": 5929} {"train_loss": -27.200321197509766, "global_step": 492177, "epoch": 5929} {"train_loss": -26.89655876159668, "global_step": 492178, "epoch": 5929} {"train_loss": -27.41998291015625, "global_step": 492179, "epoch": 5929} {"train_loss": -26.8792781829834, "global_step": 492180, "epoch": 5929} {"train_loss": -27.38563346862793, "global_step": 492181, "epoch": 5929} {"train_loss": -27.264978408813477, "global_step": 492182, "epoch": 5929} {"train_loss": -27.187223434448242, "global_step": 492183, "epoch": 5929} {"train_loss": -27.006122589111328, "global_step": 492184, "epoch": 5929} {"train_loss": -27.52054214477539, "global_step": 492185, "epoch": 5929} {"train_loss": -27.065332412719727, "global_step": 492186, "epoch": 5929} {"train_loss": -27.362045288085938, "global_step": 492187, "epoch": 5929} {"train_loss": -27.420520782470703, "global_step": 492188, "epoch": 5929} {"train_loss": -27.20213570652238, "global_step": 492189, "epoch": 5929, "val_loss": 6603610.0} {"train_loss": -26.982620239257812, "global_step": 492190, "epoch": 5930} {"train_loss": -27.06143569946289, "global_step": 492191, "epoch": 5930} {"train_loss": -27.627893447875977, "global_step": 492192, "epoch": 5930} {"train_loss": -27.38791847229004, "global_step": 492193, "epoch": 5930} {"train_loss": -26.855518341064453, "global_step": 492194, "epoch": 5930} {"train_loss": -27.42085838317871, "global_step": 492195, "epoch": 5930} {"train_loss": -27.41773796081543, "global_step": 492196, "epoch": 5930} {"train_loss": -27.104536056518555, "global_step": 492197, "epoch": 5930} {"train_loss": -27.153715133666992, "global_step": 492198, "epoch": 5930} {"train_loss": -27.67642593383789, "global_step": 492199, "epoch": 5930} {"train_loss": -27.11768913269043, "global_step": 492200, "epoch": 5930} {"train_loss": -27.060827255249023, "global_step": 492201, "epoch": 5930} {"train_loss": -27.158905029296875, "global_step": 492202, "epoch": 5930} {"train_loss": -27.265323638916016, "global_step": 492203, "epoch": 5930} {"train_loss": -27.084074020385742, "global_step": 492204, "epoch": 5930} {"train_loss": -26.98650550842285, "global_step": 492205, "epoch": 5930} {"train_loss": -27.036701202392578, "global_step": 492206, "epoch": 5930} {"train_loss": -27.15260124206543, "global_step": 492207, "epoch": 5930} {"train_loss": -27.275787353515625, "global_step": 492208, "epoch": 5930} {"train_loss": -27.0253849029541, "global_step": 492209, "epoch": 5930} {"train_loss": -27.45218849182129, "global_step": 492210, "epoch": 5930} {"train_loss": -27.147510528564453, "global_step": 492211, "epoch": 5930} {"train_loss": -27.288681030273438, "global_step": 492212, "epoch": 5930} {"train_loss": -27.583730697631836, "global_step": 492213, "epoch": 5930} {"train_loss": -27.649763107299805, "global_step": 492214, "epoch": 5930} {"train_loss": -27.24238395690918, "global_step": 492215, "epoch": 5930} {"train_loss": -27.23435401916504, "global_step": 492216, "epoch": 5930} {"train_loss": -27.499237060546875, "global_step": 492217, "epoch": 5930} {"train_loss": -27.531641006469727, "global_step": 492218, "epoch": 5930} {"train_loss": -27.7385311126709, "global_step": 492219, "epoch": 5930} {"train_loss": -27.765823364257812, "global_step": 492220, "epoch": 5930} {"train_loss": -27.998350143432617, "global_step": 492221, "epoch": 5930} {"train_loss": -27.579330444335938, "global_step": 492222, "epoch": 5930} {"train_loss": -27.5128173828125, "global_step": 492223, "epoch": 5930} {"train_loss": -27.67059326171875, "global_step": 492224, "epoch": 5930} {"train_loss": -27.893543243408203, "global_step": 492225, "epoch": 5930} {"train_loss": -27.316919326782227, "global_step": 492226, "epoch": 5930} {"train_loss": -27.721851348876953, "global_step": 492227, "epoch": 5930} {"train_loss": -27.27798843383789, "global_step": 492228, "epoch": 5930} {"train_loss": -27.649200439453125, "global_step": 492229, "epoch": 5930} {"train_loss": -27.5389404296875, "global_step": 492230, "epoch": 5930} {"train_loss": -27.82208824157715, "global_step": 492231, "epoch": 5930} {"train_loss": -27.36582374572754, "global_step": 492232, "epoch": 5930} {"train_loss": -27.416696548461914, "global_step": 492233, "epoch": 5930} {"train_loss": -27.567535400390625, "global_step": 492234, "epoch": 5930} {"train_loss": -27.353900909423828, "global_step": 492235, "epoch": 5930} {"train_loss": -27.760526657104492, "global_step": 492236, "epoch": 5930} {"train_loss": -27.6875, "global_step": 492237, "epoch": 5930} {"train_loss": -27.531957626342773, "global_step": 492238, "epoch": 5930} {"train_loss": -27.2188720703125, "global_step": 492239, "epoch": 5930} {"train_loss": -27.60113525390625, "global_step": 492240, "epoch": 5930} {"train_loss": -27.5143985748291, "global_step": 492241, "epoch": 5930} {"train_loss": -27.250120162963867, "global_step": 492242, "epoch": 5930} {"train_loss": -27.53309440612793, "global_step": 492243, "epoch": 5930} {"train_loss": -27.754175186157227, "global_step": 492244, "epoch": 5930} {"train_loss": -27.21759605407715, "global_step": 492245, "epoch": 5930} {"train_loss": -26.97491455078125, "global_step": 492246, "epoch": 5930} {"train_loss": -26.5068302154541, "global_step": 492247, "epoch": 5930} {"train_loss": -26.017805099487305, "global_step": 492248, "epoch": 5930} {"train_loss": -26.14202308654785, "global_step": 492249, "epoch": 5930} {"train_loss": -25.991653442382812, "global_step": 492250, "epoch": 5930} {"train_loss": -26.682403564453125, "global_step": 492251, "epoch": 5930} {"train_loss": -26.760665893554688, "global_step": 492252, "epoch": 5930} {"train_loss": -26.26777458190918, "global_step": 492253, "epoch": 5930} {"train_loss": -26.58548927307129, "global_step": 492254, "epoch": 5930} {"train_loss": -26.896411895751953, "global_step": 492255, "epoch": 5930} {"train_loss": -26.67130470275879, "global_step": 492256, "epoch": 5930} {"train_loss": -26.9636173248291, "global_step": 492257, "epoch": 5930} {"train_loss": -26.969161987304688, "global_step": 492258, "epoch": 5930} {"train_loss": -26.866992950439453, "global_step": 492259, "epoch": 5930} {"train_loss": -27.14747428894043, "global_step": 492260, "epoch": 5930} {"train_loss": -27.1169490814209, "global_step": 492261, "epoch": 5930} {"train_loss": -26.89190101623535, "global_step": 492262, "epoch": 5930} {"train_loss": -27.06450843811035, "global_step": 492263, "epoch": 5930} {"train_loss": -26.784814834594727, "global_step": 492264, "epoch": 5930} {"train_loss": -27.340505599975586, "global_step": 492265, "epoch": 5930} {"train_loss": -26.81208610534668, "global_step": 492266, "epoch": 5930} {"train_loss": -27.004886627197266, "global_step": 492267, "epoch": 5930} {"train_loss": -27.10576820373535, "global_step": 492268, "epoch": 5930} {"train_loss": -27.420774459838867, "global_step": 492269, "epoch": 5930} {"train_loss": -27.224760055541992, "global_step": 492270, "epoch": 5930} {"train_loss": -27.1073055267334, "global_step": 492271, "epoch": 5930} {"train_loss": -27.22245285309941, "global_step": 492272, "epoch": 5930, "val_loss": 6541308.0} {"train_loss": -27.172348022460938, "global_step": 492273, "epoch": 5931} {"train_loss": -26.913293838500977, "global_step": 492274, "epoch": 5931} {"train_loss": -27.034162521362305, "global_step": 492275, "epoch": 5931} {"train_loss": -26.80991554260254, "global_step": 492276, "epoch": 5931} {"train_loss": -26.662824630737305, "global_step": 492277, "epoch": 5931} {"train_loss": -27.161396026611328, "global_step": 492278, "epoch": 5931} {"train_loss": -27.212574005126953, "global_step": 492279, "epoch": 5931} {"train_loss": -27.20416259765625, "global_step": 492280, "epoch": 5931} {"train_loss": -27.03973388671875, "global_step": 492281, "epoch": 5931} {"train_loss": -27.130828857421875, "global_step": 492282, "epoch": 5931} {"train_loss": -27.015100479125977, "global_step": 492283, "epoch": 5931} {"train_loss": -27.192825317382812, "global_step": 492284, "epoch": 5931} {"train_loss": -27.503143310546875, "global_step": 492285, "epoch": 5931} {"train_loss": -27.157501220703125, "global_step": 492286, "epoch": 5931} {"train_loss": -27.369525909423828, "global_step": 492287, "epoch": 5931} {"train_loss": -27.00165367126465, "global_step": 492288, "epoch": 5931} {"train_loss": -27.454126358032227, "global_step": 492289, "epoch": 5931} {"train_loss": -27.3773136138916, "global_step": 492290, "epoch": 5931} {"train_loss": -27.455774307250977, "global_step": 492291, "epoch": 5931} {"train_loss": -27.25553321838379, "global_step": 492292, "epoch": 5931} {"train_loss": -27.16314697265625, "global_step": 492293, "epoch": 5931} {"train_loss": -27.362646102905273, "global_step": 492294, "epoch": 5931} {"train_loss": -27.7832088470459, "global_step": 492295, "epoch": 5931} {"train_loss": -27.36846923828125, "global_step": 492296, "epoch": 5931} {"train_loss": -27.45417594909668, "global_step": 492297, "epoch": 5931} {"train_loss": -27.321210861206055, "global_step": 492298, "epoch": 5931} {"train_loss": -27.516437530517578, "global_step": 492299, "epoch": 5931} {"train_loss": -27.21405029296875, "global_step": 492300, "epoch": 5931} {"train_loss": -27.455472946166992, "global_step": 492301, "epoch": 5931} {"train_loss": -27.418933868408203, "global_step": 492302, "epoch": 5931} {"train_loss": -27.27217674255371, "global_step": 492303, "epoch": 5931} {"train_loss": -27.633514404296875, "global_step": 492304, "epoch": 5931} {"train_loss": -27.478687286376953, "global_step": 492305, "epoch": 5931} {"train_loss": -27.1566104888916, "global_step": 492306, "epoch": 5931} {"train_loss": -27.17426872253418, "global_step": 492307, "epoch": 5931} {"train_loss": -27.415180206298828, "global_step": 492308, "epoch": 5931} {"train_loss": -27.457365036010742, "global_step": 492309, "epoch": 5931} {"train_loss": -27.244842529296875, "global_step": 492310, "epoch": 5931} {"train_loss": -27.53577995300293, "global_step": 492311, "epoch": 5931} {"train_loss": -27.518192291259766, "global_step": 492312, "epoch": 5931} {"train_loss": -27.404815673828125, "global_step": 492313, "epoch": 5931} {"train_loss": -27.529870986938477, "global_step": 492314, "epoch": 5931} {"train_loss": -27.48151969909668, "global_step": 492315, "epoch": 5931} {"train_loss": -27.635971069335938, "global_step": 492316, "epoch": 5931} {"train_loss": -27.418455123901367, "global_step": 492317, "epoch": 5931} {"train_loss": -27.52642822265625, "global_step": 492318, "epoch": 5931} {"train_loss": -27.591217041015625, "global_step": 492319, "epoch": 5931} {"train_loss": -27.435537338256836, "global_step": 492320, "epoch": 5931} {"train_loss": -27.481374740600586, "global_step": 492321, "epoch": 5931} {"train_loss": -27.575902938842773, "global_step": 492322, "epoch": 5931} {"train_loss": -27.4661865234375, "global_step": 492323, "epoch": 5931} {"train_loss": -27.396026611328125, "global_step": 492324, "epoch": 5931} {"train_loss": -27.48017692565918, "global_step": 492325, "epoch": 5931} {"train_loss": -27.312976837158203, "global_step": 492326, "epoch": 5931} {"train_loss": -27.246610641479492, "global_step": 492327, "epoch": 5931} {"train_loss": -26.802108764648438, "global_step": 492328, "epoch": 5931} {"train_loss": -27.51057243347168, "global_step": 492329, "epoch": 5931} {"train_loss": -27.688879013061523, "global_step": 492330, "epoch": 5931} {"train_loss": -27.2315616607666, "global_step": 492331, "epoch": 5931} {"train_loss": -27.172760009765625, "global_step": 492332, "epoch": 5931} {"train_loss": -27.127506256103516, "global_step": 492333, "epoch": 5931} {"train_loss": -27.200653076171875, "global_step": 492334, "epoch": 5931} {"train_loss": -27.395166397094727, "global_step": 492335, "epoch": 5931} {"train_loss": -26.81878089904785, "global_step": 492336, "epoch": 5931} {"train_loss": -27.201541900634766, "global_step": 492337, "epoch": 5931} {"train_loss": -27.7337589263916, "global_step": 492338, "epoch": 5931} {"train_loss": -27.653060913085938, "global_step": 492339, "epoch": 5931} {"train_loss": -27.02534294128418, "global_step": 492340, "epoch": 5931} {"train_loss": -27.49580192565918, "global_step": 492341, "epoch": 5931} {"train_loss": -27.20916748046875, "global_step": 492342, "epoch": 5931} {"train_loss": -27.114410400390625, "global_step": 492343, "epoch": 5931} {"train_loss": -27.214826583862305, "global_step": 492344, "epoch": 5931} {"train_loss": -27.417404174804688, "global_step": 492345, "epoch": 5931} {"train_loss": -26.91592788696289, "global_step": 492346, "epoch": 5931} {"train_loss": -27.581146240234375, "global_step": 492347, "epoch": 5931} {"train_loss": -27.353906631469727, "global_step": 492348, "epoch": 5931} {"train_loss": -27.537302017211914, "global_step": 492349, "epoch": 5931} {"train_loss": -27.312469482421875, "global_step": 492350, "epoch": 5931} {"train_loss": -27.183624267578125, "global_step": 492351, "epoch": 5931} {"train_loss": -26.909276962280273, "global_step": 492352, "epoch": 5931} {"train_loss": -27.064786911010742, "global_step": 492353, "epoch": 5931} {"train_loss": -27.6595458984375, "global_step": 492354, "epoch": 5931} {"train_loss": -27.31488793154797, "global_step": 492355, "epoch": 5931, "val_loss": 6560110.0} {"train_loss": -26.754119873046875, "global_step": 492356, "epoch": 5932} {"train_loss": -26.9869384765625, "global_step": 492357, "epoch": 5932} {"train_loss": -27.26126480102539, "global_step": 492358, "epoch": 5932} {"train_loss": -27.002058029174805, "global_step": 492359, "epoch": 5932} {"train_loss": -27.070199966430664, "global_step": 492360, "epoch": 5932} {"train_loss": -27.0050048828125, "global_step": 492361, "epoch": 5932} {"train_loss": -27.079587936401367, "global_step": 492362, "epoch": 5932} {"train_loss": -26.867877960205078, "global_step": 492363, "epoch": 5932} {"train_loss": -26.862075805664062, "global_step": 492364, "epoch": 5932} {"train_loss": -27.349594116210938, "global_step": 492365, "epoch": 5932} {"train_loss": -26.742273330688477, "global_step": 492366, "epoch": 5932} {"train_loss": -26.87774085998535, "global_step": 492367, "epoch": 5932} {"train_loss": -27.261615753173828, "global_step": 492368, "epoch": 5932} {"train_loss": -26.90961265563965, "global_step": 492369, "epoch": 5932} {"train_loss": -27.10454750061035, "global_step": 492370, "epoch": 5932} {"train_loss": -27.256921768188477, "global_step": 492371, "epoch": 5932} {"train_loss": -27.161123275756836, "global_step": 492372, "epoch": 5932} {"train_loss": -27.222553253173828, "global_step": 492373, "epoch": 5932} {"train_loss": -26.946455001831055, "global_step": 492374, "epoch": 5932} {"train_loss": -27.683053970336914, "global_step": 492375, "epoch": 5932} {"train_loss": -26.9993839263916, "global_step": 492376, "epoch": 5932} {"train_loss": -27.530597686767578, "global_step": 492377, "epoch": 5932} {"train_loss": -27.242612838745117, "global_step": 492378, "epoch": 5932} {"train_loss": -27.771764755249023, "global_step": 492379, "epoch": 5932} {"train_loss": -27.36915397644043, "global_step": 492380, "epoch": 5932} {"train_loss": -27.466211318969727, "global_step": 492381, "epoch": 5932} {"train_loss": -26.889474868774414, "global_step": 492382, "epoch": 5932} {"train_loss": -27.655807495117188, "global_step": 492383, "epoch": 5932} {"train_loss": -27.5335636138916, "global_step": 492384, "epoch": 5932} {"train_loss": -27.331945419311523, "global_step": 492385, "epoch": 5932} {"train_loss": -27.625701904296875, "global_step": 492386, "epoch": 5932} {"train_loss": -27.199100494384766, "global_step": 492387, "epoch": 5932} {"train_loss": -27.434858322143555, "global_step": 492388, "epoch": 5932} {"train_loss": -27.355478286743164, "global_step": 492389, "epoch": 5932} {"train_loss": -27.612598419189453, "global_step": 492390, "epoch": 5932} {"train_loss": -27.04319190979004, "global_step": 492391, "epoch": 5932} {"train_loss": -27.24456214904785, "global_step": 492392, "epoch": 5932} {"train_loss": -27.170124053955078, "global_step": 492393, "epoch": 5932} {"train_loss": -27.113758087158203, "global_step": 492394, "epoch": 5932} {"train_loss": -27.137237548828125, "global_step": 492395, "epoch": 5932} {"train_loss": -27.663333892822266, "global_step": 492396, "epoch": 5932} {"train_loss": -27.4145450592041, "global_step": 492397, "epoch": 5932} {"train_loss": -27.319501876831055, "global_step": 492398, "epoch": 5932} {"train_loss": -27.157011032104492, "global_step": 492399, "epoch": 5932} {"train_loss": -27.57868003845215, "global_step": 492400, "epoch": 5932} {"train_loss": -27.35370445251465, "global_step": 492401, "epoch": 5932} {"train_loss": -27.12994956970215, "global_step": 492402, "epoch": 5932} {"train_loss": -27.44170570373535, "global_step": 492403, "epoch": 5932} {"train_loss": -27.520832061767578, "global_step": 492404, "epoch": 5932} {"train_loss": -27.115591049194336, "global_step": 492405, "epoch": 5932} {"train_loss": -27.660566329956055, "global_step": 492406, "epoch": 5932} {"train_loss": -27.593469619750977, "global_step": 492407, "epoch": 5932} {"train_loss": -27.50489616394043, "global_step": 492408, "epoch": 5932} {"train_loss": -27.747907638549805, "global_step": 492409, "epoch": 5932} {"train_loss": -27.163549423217773, "global_step": 492410, "epoch": 5932} {"train_loss": -27.743362426757812, "global_step": 492411, "epoch": 5932} {"train_loss": -27.374469757080078, "global_step": 492412, "epoch": 5932} {"train_loss": -27.398025512695312, "global_step": 492413, "epoch": 5932} {"train_loss": -27.39826774597168, "global_step": 492414, "epoch": 5932} {"train_loss": -27.45062255859375, "global_step": 492415, "epoch": 5932} {"train_loss": -27.448993682861328, "global_step": 492416, "epoch": 5932} {"train_loss": -27.72258949279785, "global_step": 492417, "epoch": 5932} {"train_loss": -27.407068252563477, "global_step": 492418, "epoch": 5932} {"train_loss": -27.608869552612305, "global_step": 492419, "epoch": 5932} {"train_loss": -27.497272491455078, "global_step": 492420, "epoch": 5932} {"train_loss": -27.545141220092773, "global_step": 492421, "epoch": 5932} {"train_loss": -27.232553482055664, "global_step": 492422, "epoch": 5932} {"train_loss": -27.5117244720459, "global_step": 492423, "epoch": 5932} {"train_loss": -27.392047882080078, "global_step": 492424, "epoch": 5932} {"train_loss": -27.205408096313477, "global_step": 492425, "epoch": 5932} {"train_loss": -27.594053268432617, "global_step": 492426, "epoch": 5932} {"train_loss": -27.627166748046875, "global_step": 492427, "epoch": 5932} {"train_loss": -27.35573387145996, "global_step": 492428, "epoch": 5932} {"train_loss": -27.379987716674805, "global_step": 492429, "epoch": 5932} {"train_loss": -27.345413208007812, "global_step": 492430, "epoch": 5932} {"train_loss": -27.661489486694336, "global_step": 492431, "epoch": 5932} {"train_loss": -27.78496742248535, "global_step": 492432, "epoch": 5932} {"train_loss": -27.36775779724121, "global_step": 492433, "epoch": 5932} {"train_loss": -27.659454345703125, "global_step": 492434, "epoch": 5932} {"train_loss": -27.029043197631836, "global_step": 492435, "epoch": 5932} {"train_loss": -27.707284927368164, "global_step": 492436, "epoch": 5932} {"train_loss": -27.4345645904541, "global_step": 492437, "epoch": 5932} {"train_loss": -27.3319074561797, "global_step": 492438, "epoch": 5932, "val_loss": 6670682.0} {"train_loss": -27.314010620117188, "global_step": 492439, "epoch": 5933} {"train_loss": -27.357664108276367, "global_step": 492440, "epoch": 5933} {"train_loss": -26.488866806030273, "global_step": 492441, "epoch": 5933} {"train_loss": -26.82028579711914, "global_step": 492442, "epoch": 5933} {"train_loss": -27.18829917907715, "global_step": 492443, "epoch": 5933} {"train_loss": -26.98211097717285, "global_step": 492444, "epoch": 5933} {"train_loss": -26.710773468017578, "global_step": 492445, "epoch": 5933} {"train_loss": -26.53716468811035, "global_step": 492446, "epoch": 5933} {"train_loss": -27.006641387939453, "global_step": 492447, "epoch": 5933} {"train_loss": -27.307565689086914, "global_step": 492448, "epoch": 5933} {"train_loss": -26.47344970703125, "global_step": 492449, "epoch": 5933} {"train_loss": -26.895709991455078, "global_step": 492450, "epoch": 5933} {"train_loss": -27.064340591430664, "global_step": 492451, "epoch": 5933} {"train_loss": -27.005950927734375, "global_step": 492452, "epoch": 5933} {"train_loss": -27.20711326599121, "global_step": 492453, "epoch": 5933} {"train_loss": -27.126129150390625, "global_step": 492454, "epoch": 5933} {"train_loss": -27.327972412109375, "global_step": 492455, "epoch": 5933} {"train_loss": -27.009475708007812, "global_step": 492456, "epoch": 5933} {"train_loss": -27.10529899597168, "global_step": 492457, "epoch": 5933} {"train_loss": -27.42416763305664, "global_step": 492458, "epoch": 5933} {"train_loss": -26.686330795288086, "global_step": 492459, "epoch": 5933} {"train_loss": -27.509185791015625, "global_step": 492460, "epoch": 5933} {"train_loss": -26.72751808166504, "global_step": 492461, "epoch": 5933} {"train_loss": -27.027088165283203, "global_step": 492462, "epoch": 5933} {"train_loss": -27.282958984375, "global_step": 492463, "epoch": 5933} {"train_loss": -27.31597328186035, "global_step": 492464, "epoch": 5933} {"train_loss": -26.937543869018555, "global_step": 492465, "epoch": 5933} {"train_loss": -27.199995040893555, "global_step": 492466, "epoch": 5933} {"train_loss": -26.929662704467773, "global_step": 492467, "epoch": 5933} {"train_loss": -27.445959091186523, "global_step": 492468, "epoch": 5933} {"train_loss": -26.80279541015625, "global_step": 492469, "epoch": 5933} {"train_loss": -27.467004776000977, "global_step": 492470, "epoch": 5933} {"train_loss": -26.839298248291016, "global_step": 492471, "epoch": 5933} {"train_loss": -27.464282989501953, "global_step": 492472, "epoch": 5933} {"train_loss": -27.319263458251953, "global_step": 492473, "epoch": 5933} {"train_loss": -27.224063873291016, "global_step": 492474, "epoch": 5933} {"train_loss": -27.37556266784668, "global_step": 492475, "epoch": 5933} {"train_loss": -27.13800048828125, "global_step": 492476, "epoch": 5933} {"train_loss": -27.69512939453125, "global_step": 492477, "epoch": 5933} {"train_loss": -27.308317184448242, "global_step": 492478, "epoch": 5933} {"train_loss": -27.220361709594727, "global_step": 492479, "epoch": 5933} {"train_loss": -27.494047164916992, "global_step": 492480, "epoch": 5933} {"train_loss": -27.419218063354492, "global_step": 492481, "epoch": 5933} {"train_loss": -27.255380630493164, "global_step": 492482, "epoch": 5933} {"train_loss": -27.2983341217041, "global_step": 492483, "epoch": 5933} {"train_loss": -27.211963653564453, "global_step": 492484, "epoch": 5933} {"train_loss": -27.112110137939453, "global_step": 492485, "epoch": 5933} {"train_loss": -27.218969345092773, "global_step": 492486, "epoch": 5933} {"train_loss": -26.93719482421875, "global_step": 492487, "epoch": 5933} {"train_loss": -27.394775390625, "global_step": 492488, "epoch": 5933} {"train_loss": -27.33255958557129, "global_step": 492489, "epoch": 5933} {"train_loss": -27.28508949279785, "global_step": 492490, "epoch": 5933} {"train_loss": -27.467426300048828, "global_step": 492491, "epoch": 5933} {"train_loss": -27.49908447265625, "global_step": 492492, "epoch": 5933} {"train_loss": -27.766687393188477, "global_step": 492493, "epoch": 5933} {"train_loss": -27.377655029296875, "global_step": 492494, "epoch": 5933} {"train_loss": -27.441801071166992, "global_step": 492495, "epoch": 5933} {"train_loss": -27.426671981811523, "global_step": 492496, "epoch": 5933} {"train_loss": -27.4332275390625, "global_step": 492497, "epoch": 5933} {"train_loss": -27.526926040649414, "global_step": 492498, "epoch": 5933} {"train_loss": -27.726484298706055, "global_step": 492499, "epoch": 5933} {"train_loss": -27.04071044921875, "global_step": 492500, "epoch": 5933} {"train_loss": -27.268665313720703, "global_step": 492501, "epoch": 5933} {"train_loss": -27.61411476135254, "global_step": 492502, "epoch": 5933} {"train_loss": -27.2768497467041, "global_step": 492503, "epoch": 5933} {"train_loss": -27.415250778198242, "global_step": 492504, "epoch": 5933} {"train_loss": -27.465314865112305, "global_step": 492505, "epoch": 5933} {"train_loss": -27.091100692749023, "global_step": 492506, "epoch": 5933} {"train_loss": -27.663434982299805, "global_step": 492507, "epoch": 5933} {"train_loss": -27.5211181640625, "global_step": 492508, "epoch": 5933} {"train_loss": -27.41314125061035, "global_step": 492509, "epoch": 5933} {"train_loss": -27.197107315063477, "global_step": 492510, "epoch": 5933} {"train_loss": -27.718130111694336, "global_step": 492511, "epoch": 5933} {"train_loss": -27.48276138305664, "global_step": 492512, "epoch": 5933} {"train_loss": -27.40595054626465, "global_step": 492513, "epoch": 5933} {"train_loss": -27.374988555908203, "global_step": 492514, "epoch": 5933} {"train_loss": -27.44339370727539, "global_step": 492515, "epoch": 5933} {"train_loss": -27.333942413330078, "global_step": 492516, "epoch": 5933} {"train_loss": -27.422119140625, "global_step": 492517, "epoch": 5933} {"train_loss": -27.28766441345215, "global_step": 492518, "epoch": 5933} {"train_loss": -27.553913116455078, "global_step": 492519, "epoch": 5933} {"train_loss": -27.749271392822266, "global_step": 492520, "epoch": 5933} {"train_loss": -27.234481903443854, "global_step": 492521, "epoch": 5933, "val_loss": 6532178.0} {"train_loss": -22.96837615966797, "global_step": 492522, "epoch": 5934} {"train_loss": -23.62801170349121, "global_step": 492523, "epoch": 5934} {"train_loss": -25.9914493560791, "global_step": 492524, "epoch": 5934} {"train_loss": -24.79726219177246, "global_step": 492525, "epoch": 5934} {"train_loss": -25.197813034057617, "global_step": 492526, "epoch": 5934} {"train_loss": -25.589744567871094, "global_step": 492527, "epoch": 5934} {"train_loss": -25.71435546875, "global_step": 492528, "epoch": 5934} {"train_loss": -25.37275505065918, "global_step": 492529, "epoch": 5934} {"train_loss": -25.301237106323242, "global_step": 492530, "epoch": 5934} {"train_loss": -26.04412269592285, "global_step": 492531, "epoch": 5934} {"train_loss": -25.4121150970459, "global_step": 492532, "epoch": 5934} {"train_loss": -26.012405395507812, "global_step": 492533, "epoch": 5934} {"train_loss": -25.9623966217041, "global_step": 492534, "epoch": 5934} {"train_loss": -26.025543212890625, "global_step": 492535, "epoch": 5934} {"train_loss": -26.504587173461914, "global_step": 492536, "epoch": 5934} {"train_loss": -26.1694278717041, "global_step": 492537, "epoch": 5934} {"train_loss": -26.03887939453125, "global_step": 492538, "epoch": 5934} {"train_loss": -25.9976806640625, "global_step": 492539, "epoch": 5934} {"train_loss": -25.964834213256836, "global_step": 492540, "epoch": 5934} {"train_loss": -26.660627365112305, "global_step": 492541, "epoch": 5934} {"train_loss": -25.999114990234375, "global_step": 492542, "epoch": 5934} {"train_loss": -26.072284698486328, "global_step": 492543, "epoch": 5934} {"train_loss": -26.60542106628418, "global_step": 492544, "epoch": 5934} {"train_loss": -26.65679359436035, "global_step": 492545, "epoch": 5934} {"train_loss": -26.46430015563965, "global_step": 492546, "epoch": 5934} {"train_loss": -26.43466567993164, "global_step": 492547, "epoch": 5934} {"train_loss": -26.39426612854004, "global_step": 492548, "epoch": 5934} {"train_loss": -26.788663864135742, "global_step": 492549, "epoch": 5934} {"train_loss": -26.6156005859375, "global_step": 492550, "epoch": 5934} {"train_loss": -27.006668090820312, "global_step": 492551, "epoch": 5934} {"train_loss": -27.181493759155273, "global_step": 492552, "epoch": 5934} {"train_loss": -26.9013671875, "global_step": 492553, "epoch": 5934} {"train_loss": -26.628997802734375, "global_step": 492554, "epoch": 5934} {"train_loss": -26.86200523376465, "global_step": 492555, "epoch": 5934} {"train_loss": -26.995813369750977, "global_step": 492556, "epoch": 5934} {"train_loss": -27.152692794799805, "global_step": 492557, "epoch": 5934} {"train_loss": -26.97489356994629, "global_step": 492558, "epoch": 5934} {"train_loss": -26.908552169799805, "global_step": 492559, "epoch": 5934} {"train_loss": -27.37103843688965, "global_step": 492560, "epoch": 5934} {"train_loss": -26.67597007751465, "global_step": 492561, "epoch": 5934} {"train_loss": -27.044967651367188, "global_step": 492562, "epoch": 5934} {"train_loss": -27.133581161499023, "global_step": 492563, "epoch": 5934} {"train_loss": -26.918493270874023, "global_step": 492564, "epoch": 5934} {"train_loss": -27.147504806518555, "global_step": 492565, "epoch": 5934} {"train_loss": -27.204919815063477, "global_step": 492566, "epoch": 5934} {"train_loss": -27.245630264282227, "global_step": 492567, "epoch": 5934} {"train_loss": -27.362567901611328, "global_step": 492568, "epoch": 5934} {"train_loss": -27.084325790405273, "global_step": 492569, "epoch": 5934} {"train_loss": -27.39118003845215, "global_step": 492570, "epoch": 5934} {"train_loss": -27.371505737304688, "global_step": 492571, "epoch": 5934} {"train_loss": -27.317611694335938, "global_step": 492572, "epoch": 5934} {"train_loss": -27.316919326782227, "global_step": 492573, "epoch": 5934} {"train_loss": -27.017370223999023, "global_step": 492574, "epoch": 5934} {"train_loss": -27.48151969909668, "global_step": 492575, "epoch": 5934} {"train_loss": -27.29461097717285, "global_step": 492576, "epoch": 5934} {"train_loss": -27.170063018798828, "global_step": 492577, "epoch": 5934} {"train_loss": -27.360843658447266, "global_step": 492578, "epoch": 5934} {"train_loss": -27.43149185180664, "global_step": 492579, "epoch": 5934} {"train_loss": -27.12470054626465, "global_step": 492580, "epoch": 5934} {"train_loss": -27.293548583984375, "global_step": 492581, "epoch": 5934} {"train_loss": -27.324743270874023, "global_step": 492582, "epoch": 5934} {"train_loss": -27.76942253112793, "global_step": 492583, "epoch": 5934} {"train_loss": -27.45309829711914, "global_step": 492584, "epoch": 5934} {"train_loss": -27.373891830444336, "global_step": 492585, "epoch": 5934} {"train_loss": -27.432907104492188, "global_step": 492586, "epoch": 5934} {"train_loss": -27.1306095123291, "global_step": 492587, "epoch": 5934} {"train_loss": -27.288055419921875, "global_step": 492588, "epoch": 5934} {"train_loss": -27.460439682006836, "global_step": 492589, "epoch": 5934} {"train_loss": -27.41194725036621, "global_step": 492590, "epoch": 5934} {"train_loss": -27.076507568359375, "global_step": 492591, "epoch": 5934} {"train_loss": -27.410465240478516, "global_step": 492592, "epoch": 5934} {"train_loss": -26.916248321533203, "global_step": 492593, "epoch": 5934} {"train_loss": -27.444128036499023, "global_step": 492594, "epoch": 5934} {"train_loss": -27.670928955078125, "global_step": 492595, "epoch": 5934} {"train_loss": -27.922800064086914, "global_step": 492596, "epoch": 5934} {"train_loss": -27.594043731689453, "global_step": 492597, "epoch": 5934} {"train_loss": -27.47748374938965, "global_step": 492598, "epoch": 5934} {"train_loss": -27.216577529907227, "global_step": 492599, "epoch": 5934} {"train_loss": -27.524311065673828, "global_step": 492600, "epoch": 5934} {"train_loss": -27.75172996520996, "global_step": 492601, "epoch": 5934} {"train_loss": -27.227087020874023, "global_step": 492602, "epoch": 5934} {"train_loss": -27.629108428955078, "global_step": 492603, "epoch": 5934} {"train_loss": -26.775867829839868, "global_step": 492604, "epoch": 5934, "val_loss": 6592002.0} {"train_loss": -26.84541130065918, "global_step": 492605, "epoch": 5935} {"train_loss": -26.328693389892578, "global_step": 492606, "epoch": 5935} {"train_loss": -26.28645133972168, "global_step": 492607, "epoch": 5935} {"train_loss": -26.56267738342285, "global_step": 492608, "epoch": 5935} {"train_loss": -26.310867309570312, "global_step": 492609, "epoch": 5935} {"train_loss": -26.770465850830078, "global_step": 492610, "epoch": 5935} {"train_loss": -26.635297775268555, "global_step": 492611, "epoch": 5935} {"train_loss": -26.7075252532959, "global_step": 492612, "epoch": 5935} {"train_loss": -26.84968376159668, "global_step": 492613, "epoch": 5935} {"train_loss": -26.900238037109375, "global_step": 492614, "epoch": 5935} {"train_loss": -26.522113800048828, "global_step": 492615, "epoch": 5935} {"train_loss": -26.83631706237793, "global_step": 492616, "epoch": 5935} {"train_loss": -26.995166778564453, "global_step": 492617, "epoch": 5935} {"train_loss": -26.712081909179688, "global_step": 492618, "epoch": 5935} {"train_loss": -26.750207901000977, "global_step": 492619, "epoch": 5935} {"train_loss": -26.999893188476562, "global_step": 492620, "epoch": 5935} {"train_loss": -26.718236923217773, "global_step": 492621, "epoch": 5935} {"train_loss": -26.77471351623535, "global_step": 492622, "epoch": 5935} {"train_loss": -27.375741958618164, "global_step": 492623, "epoch": 5935} {"train_loss": -26.980581283569336, "global_step": 492624, "epoch": 5935} {"train_loss": -27.23701286315918, "global_step": 492625, "epoch": 5935} {"train_loss": -26.939496994018555, "global_step": 492626, "epoch": 5935} {"train_loss": -27.13590431213379, "global_step": 492627, "epoch": 5935} {"train_loss": -27.087095260620117, "global_step": 492628, "epoch": 5935} {"train_loss": -26.941247940063477, "global_step": 492629, "epoch": 5935} {"train_loss": -27.455127716064453, "global_step": 492630, "epoch": 5935} {"train_loss": -27.02045249938965, "global_step": 492631, "epoch": 5935} {"train_loss": -27.277069091796875, "global_step": 492632, "epoch": 5935} {"train_loss": -26.816736221313477, "global_step": 492633, "epoch": 5935} {"train_loss": -27.358524322509766, "global_step": 492634, "epoch": 5935} {"train_loss": -27.257986068725586, "global_step": 492635, "epoch": 5935} {"train_loss": -27.123432159423828, "global_step": 492636, "epoch": 5935} {"train_loss": -27.167423248291016, "global_step": 492637, "epoch": 5935} {"train_loss": -27.325727462768555, "global_step": 492638, "epoch": 5935} {"train_loss": -27.258161544799805, "global_step": 492639, "epoch": 5935} {"train_loss": -27.450183868408203, "global_step": 492640, "epoch": 5935} {"train_loss": -27.452564239501953, "global_step": 492641, "epoch": 5935} {"train_loss": -26.998510360717773, "global_step": 492642, "epoch": 5935} {"train_loss": -27.594806671142578, "global_step": 492643, "epoch": 5935} {"train_loss": -27.867238998413086, "global_step": 492644, "epoch": 5935} {"train_loss": -27.505374908447266, "global_step": 492645, "epoch": 5935} {"train_loss": -27.448043823242188, "global_step": 492646, "epoch": 5935} {"train_loss": -27.60369300842285, "global_step": 492647, "epoch": 5935} {"train_loss": -27.629810333251953, "global_step": 492648, "epoch": 5935} {"train_loss": -27.817956924438477, "global_step": 492649, "epoch": 5935} {"train_loss": -27.53424644470215, "global_step": 492650, "epoch": 5935} {"train_loss": -27.45525550842285, "global_step": 492651, "epoch": 5935} {"train_loss": -27.328596115112305, "global_step": 492652, "epoch": 5935} {"train_loss": -27.61366081237793, "global_step": 492653, "epoch": 5935} {"train_loss": -27.652484893798828, "global_step": 492654, "epoch": 5935} {"train_loss": -27.219823837280273, "global_step": 492655, "epoch": 5935} {"train_loss": -27.597503662109375, "global_step": 492656, "epoch": 5935} {"train_loss": -27.42608070373535, "global_step": 492657, "epoch": 5935} {"train_loss": -27.698434829711914, "global_step": 492658, "epoch": 5935} {"train_loss": -27.8928279876709, "global_step": 492659, "epoch": 5935} {"train_loss": -27.545398712158203, "global_step": 492660, "epoch": 5935} {"train_loss": -27.590330123901367, "global_step": 492661, "epoch": 5935} {"train_loss": -27.1033935546875, "global_step": 492662, "epoch": 5935} {"train_loss": -27.36537742614746, "global_step": 492663, "epoch": 5935} {"train_loss": -27.129520416259766, "global_step": 492664, "epoch": 5935} {"train_loss": -27.31465721130371, "global_step": 492665, "epoch": 5935} {"train_loss": -27.2364444732666, "global_step": 492666, "epoch": 5935} {"train_loss": -27.556583404541016, "global_step": 492667, "epoch": 5935} {"train_loss": -26.82059669494629, "global_step": 492668, "epoch": 5935} {"train_loss": -26.757415771484375, "global_step": 492669, "epoch": 5935} {"train_loss": -25.862396240234375, "global_step": 492670, "epoch": 5935} {"train_loss": -26.5172061920166, "global_step": 492671, "epoch": 5935} {"train_loss": -27.511505126953125, "global_step": 492672, "epoch": 5935} {"train_loss": -26.904937744140625, "global_step": 492673, "epoch": 5935} {"train_loss": -27.2037296295166, "global_step": 492674, "epoch": 5935} {"train_loss": -27.177976608276367, "global_step": 492675, "epoch": 5935} {"train_loss": -26.803756713867188, "global_step": 492676, "epoch": 5935} {"train_loss": -27.165945053100586, "global_step": 492677, "epoch": 5935} {"train_loss": -27.168228149414062, "global_step": 492678, "epoch": 5935} {"train_loss": -27.164411544799805, "global_step": 492679, "epoch": 5935} {"train_loss": -26.991552352905273, "global_step": 492680, "epoch": 5935} {"train_loss": -27.01199722290039, "global_step": 492681, "epoch": 5935} {"train_loss": -27.312332153320312, "global_step": 492682, "epoch": 5935} {"train_loss": -27.22321128845215, "global_step": 492683, "epoch": 5935} {"train_loss": -27.29737663269043, "global_step": 492684, "epoch": 5935} {"train_loss": -27.134490966796875, "global_step": 492685, "epoch": 5935} {"train_loss": -27.066776275634766, "global_step": 492686, "epoch": 5935} {"train_loss": -27.136592819030028, "global_step": 492687, "epoch": 5935, "val_loss": 6499748.0} {"train_loss": -26.86244010925293, "global_step": 492688, "epoch": 5936} {"train_loss": -26.72951316833496, "global_step": 492689, "epoch": 5936} {"train_loss": -26.267547607421875, "global_step": 492690, "epoch": 5936} {"train_loss": -26.080411911010742, "global_step": 492691, "epoch": 5936} {"train_loss": -25.799896240234375, "global_step": 492692, "epoch": 5936} {"train_loss": -26.075963973999023, "global_step": 492693, "epoch": 5936} {"train_loss": -26.8975830078125, "global_step": 492694, "epoch": 5936} {"train_loss": -26.462427139282227, "global_step": 492695, "epoch": 5936} {"train_loss": -26.619007110595703, "global_step": 492696, "epoch": 5936} {"train_loss": -26.857196807861328, "global_step": 492697, "epoch": 5936} {"train_loss": -26.531885147094727, "global_step": 492698, "epoch": 5936} {"train_loss": -26.9635009765625, "global_step": 492699, "epoch": 5936} {"train_loss": -26.5692138671875, "global_step": 492700, "epoch": 5936} {"train_loss": -26.770465850830078, "global_step": 492701, "epoch": 5936} {"train_loss": -26.888402938842773, "global_step": 492702, "epoch": 5936} {"train_loss": -26.084497451782227, "global_step": 492703, "epoch": 5936} {"train_loss": -26.9951229095459, "global_step": 492704, "epoch": 5936} {"train_loss": -27.006383895874023, "global_step": 492705, "epoch": 5936} {"train_loss": -26.905908584594727, "global_step": 492706, "epoch": 5936} {"train_loss": -26.88656997680664, "global_step": 492707, "epoch": 5936} {"train_loss": -27.088918685913086, "global_step": 492708, "epoch": 5936} {"train_loss": -27.04006004333496, "global_step": 492709, "epoch": 5936} {"train_loss": -26.901748657226562, "global_step": 492710, "epoch": 5936} {"train_loss": -27.217960357666016, "global_step": 492711, "epoch": 5936} {"train_loss": -27.368804931640625, "global_step": 492712, "epoch": 5936} {"train_loss": -27.331039428710938, "global_step": 492713, "epoch": 5936} {"train_loss": -27.38846206665039, "global_step": 492714, "epoch": 5936} {"train_loss": -27.64348793029785, "global_step": 492715, "epoch": 5936} {"train_loss": -26.98076820373535, "global_step": 492716, "epoch": 5936} {"train_loss": -27.071706771850586, "global_step": 492717, "epoch": 5936} {"train_loss": -27.198841094970703, "global_step": 492718, "epoch": 5936} {"train_loss": -27.19439125061035, "global_step": 492719, "epoch": 5936} {"train_loss": -27.44364356994629, "global_step": 492720, "epoch": 5936} {"train_loss": -27.2276668548584, "global_step": 492721, "epoch": 5936} {"train_loss": -27.619754791259766, "global_step": 492722, "epoch": 5936} {"train_loss": -27.26165771484375, "global_step": 492723, "epoch": 5936} {"train_loss": -27.5695743560791, "global_step": 492724, "epoch": 5936} {"train_loss": -27.27554702758789, "global_step": 492725, "epoch": 5936} {"train_loss": -27.316015243530273, "global_step": 492726, "epoch": 5936} {"train_loss": -27.514942169189453, "global_step": 492727, "epoch": 5936} {"train_loss": -27.139928817749023, "global_step": 492728, "epoch": 5936} {"train_loss": -27.110116958618164, "global_step": 492729, "epoch": 5936} {"train_loss": -27.74853515625, "global_step": 492730, "epoch": 5936} {"train_loss": -27.514739990234375, "global_step": 492731, "epoch": 5936} {"train_loss": -27.474645614624023, "global_step": 492732, "epoch": 5936} {"train_loss": -27.577131271362305, "global_step": 492733, "epoch": 5936} {"train_loss": -27.684803009033203, "global_step": 492734, "epoch": 5936} {"train_loss": -27.402667999267578, "global_step": 492735, "epoch": 5936} {"train_loss": -27.48846435546875, "global_step": 492736, "epoch": 5936} {"train_loss": -27.28251075744629, "global_step": 492737, "epoch": 5936} {"train_loss": -27.609180450439453, "global_step": 492738, "epoch": 5936} {"train_loss": -27.8402042388916, "global_step": 492739, "epoch": 5936} {"train_loss": -27.499347686767578, "global_step": 492740, "epoch": 5936} {"train_loss": -27.494953155517578, "global_step": 492741, "epoch": 5936} {"train_loss": -27.796188354492188, "global_step": 492742, "epoch": 5936} {"train_loss": -27.442596435546875, "global_step": 492743, "epoch": 5936} {"train_loss": -27.641727447509766, "global_step": 492744, "epoch": 5936} {"train_loss": -27.724014282226562, "global_step": 492745, "epoch": 5936} {"train_loss": -27.353260040283203, "global_step": 492746, "epoch": 5936} {"train_loss": -27.39398193359375, "global_step": 492747, "epoch": 5936} {"train_loss": -27.287189483642578, "global_step": 492748, "epoch": 5936} {"train_loss": -27.876331329345703, "global_step": 492749, "epoch": 5936} {"train_loss": -27.912841796875, "global_step": 492750, "epoch": 5936} {"train_loss": -27.47406005859375, "global_step": 492751, "epoch": 5936} {"train_loss": -27.59576416015625, "global_step": 492752, "epoch": 5936} {"train_loss": -27.471567153930664, "global_step": 492753, "epoch": 5936} {"train_loss": -27.454145431518555, "global_step": 492754, "epoch": 5936} {"train_loss": -27.41938591003418, "global_step": 492755, "epoch": 5936} {"train_loss": -27.55145835876465, "global_step": 492756, "epoch": 5936} {"train_loss": -27.794437408447266, "global_step": 492757, "epoch": 5936} {"train_loss": -27.4619140625, "global_step": 492758, "epoch": 5936} {"train_loss": -27.69998550415039, "global_step": 492759, "epoch": 5936} {"train_loss": -27.53724479675293, "global_step": 492760, "epoch": 5936} {"train_loss": -27.212865829467773, "global_step": 492761, "epoch": 5936} {"train_loss": -27.688613891601562, "global_step": 492762, "epoch": 5936} {"train_loss": -27.67789649963379, "global_step": 492763, "epoch": 5936} {"train_loss": -27.621185302734375, "global_step": 492764, "epoch": 5936} {"train_loss": -27.583026885986328, "global_step": 492765, "epoch": 5936} {"train_loss": -27.494007110595703, "global_step": 492766, "epoch": 5936} {"train_loss": -27.08302116394043, "global_step": 492767, "epoch": 5936} {"train_loss": -27.429677963256836, "global_step": 492768, "epoch": 5936} {"train_loss": -27.098798751831055, "global_step": 492769, "epoch": 5936} {"train_loss": -27.235235995556934, "global_step": 492770, "epoch": 5936, "val_loss": 6552778.0} {"train_loss": -26.679468154907227, "global_step": 492771, "epoch": 5937} {"train_loss": -26.01215171813965, "global_step": 492772, "epoch": 5937} {"train_loss": -25.511362075805664, "global_step": 492773, "epoch": 5937} {"train_loss": -26.57282066345215, "global_step": 492774, "epoch": 5937} {"train_loss": -26.803638458251953, "global_step": 492775, "epoch": 5937} {"train_loss": -26.312952041625977, "global_step": 492776, "epoch": 5937} {"train_loss": -26.57464027404785, "global_step": 492777, "epoch": 5937} {"train_loss": -26.47638511657715, "global_step": 492778, "epoch": 5937} {"train_loss": -26.752246856689453, "global_step": 492779, "epoch": 5937} {"train_loss": -27.119165420532227, "global_step": 492780, "epoch": 5937} {"train_loss": -27.083837509155273, "global_step": 492781, "epoch": 5937} {"train_loss": -26.901599884033203, "global_step": 492782, "epoch": 5937} {"train_loss": -27.074735641479492, "global_step": 492783, "epoch": 5937} {"train_loss": -27.026060104370117, "global_step": 492784, "epoch": 5937} {"train_loss": -27.149658203125, "global_step": 492785, "epoch": 5937} {"train_loss": -27.0045108795166, "global_step": 492786, "epoch": 5937} {"train_loss": -27.261825561523438, "global_step": 492787, "epoch": 5937} {"train_loss": -27.162443161010742, "global_step": 492788, "epoch": 5937} {"train_loss": -26.848526000976562, "global_step": 492789, "epoch": 5937} {"train_loss": -27.1651611328125, "global_step": 492790, "epoch": 5937} {"train_loss": -27.262928009033203, "global_step": 492791, "epoch": 5937} {"train_loss": -26.989953994750977, "global_step": 492792, "epoch": 5937} {"train_loss": -27.256940841674805, "global_step": 492793, "epoch": 5937} {"train_loss": -27.09517478942871, "global_step": 492794, "epoch": 5937} {"train_loss": -27.051542282104492, "global_step": 492795, "epoch": 5937} {"train_loss": -27.720800399780273, "global_step": 492796, "epoch": 5937} {"train_loss": -27.582265853881836, "global_step": 492797, "epoch": 5937} {"train_loss": -27.35888671875, "global_step": 492798, "epoch": 5937} {"train_loss": -27.344327926635742, "global_step": 492799, "epoch": 5937} {"train_loss": -27.292404174804688, "global_step": 492800, "epoch": 5937} {"train_loss": -27.464597702026367, "global_step": 492801, "epoch": 5937} {"train_loss": -27.35759925842285, "global_step": 492802, "epoch": 5937} {"train_loss": -27.629642486572266, "global_step": 492803, "epoch": 5937} {"train_loss": -27.483585357666016, "global_step": 492804, "epoch": 5937} {"train_loss": -27.44814109802246, "global_step": 492805, "epoch": 5937} {"train_loss": -27.272043228149414, "global_step": 492806, "epoch": 5937} {"train_loss": -27.591384887695312, "global_step": 492807, "epoch": 5937} {"train_loss": -27.386219024658203, "global_step": 492808, "epoch": 5937} {"train_loss": -27.79166030883789, "global_step": 492809, "epoch": 5937} {"train_loss": -27.385915756225586, "global_step": 492810, "epoch": 5937} {"train_loss": -27.67339515686035, "global_step": 492811, "epoch": 5937} {"train_loss": -27.865371704101562, "global_step": 492812, "epoch": 5937} {"train_loss": -27.394834518432617, "global_step": 492813, "epoch": 5937} {"train_loss": -27.2482967376709, "global_step": 492814, "epoch": 5937} {"train_loss": -27.17534828186035, "global_step": 492815, "epoch": 5937} {"train_loss": -27.125436782836914, "global_step": 492816, "epoch": 5937} {"train_loss": -27.465967178344727, "global_step": 492817, "epoch": 5937} {"train_loss": -27.324167251586914, "global_step": 492818, "epoch": 5937} {"train_loss": -27.410985946655273, "global_step": 492819, "epoch": 5937} {"train_loss": -27.596363067626953, "global_step": 492820, "epoch": 5937} {"train_loss": -27.85407066345215, "global_step": 492821, "epoch": 5937} {"train_loss": -27.337759017944336, "global_step": 492822, "epoch": 5937} {"train_loss": -27.538488388061523, "global_step": 492823, "epoch": 5937} {"train_loss": -27.826770782470703, "global_step": 492824, "epoch": 5937} {"train_loss": -27.709308624267578, "global_step": 492825, "epoch": 5937} {"train_loss": -27.39219093322754, "global_step": 492826, "epoch": 5937} {"train_loss": -26.9620304107666, "global_step": 492827, "epoch": 5937} {"train_loss": -27.107351303100586, "global_step": 492828, "epoch": 5937} {"train_loss": -27.400012969970703, "global_step": 492829, "epoch": 5937} {"train_loss": -27.56962013244629, "global_step": 492830, "epoch": 5937} {"train_loss": -27.351348876953125, "global_step": 492831, "epoch": 5937} {"train_loss": -27.483203887939453, "global_step": 492832, "epoch": 5937} {"train_loss": -27.30738639831543, "global_step": 492833, "epoch": 5937} {"train_loss": -26.975860595703125, "global_step": 492834, "epoch": 5937} {"train_loss": -26.981311798095703, "global_step": 492835, "epoch": 5937} {"train_loss": -27.04605484008789, "global_step": 492836, "epoch": 5937} {"train_loss": -27.12225341796875, "global_step": 492837, "epoch": 5937} {"train_loss": -27.431867599487305, "global_step": 492838, "epoch": 5937} {"train_loss": -27.49063491821289, "global_step": 492839, "epoch": 5937} {"train_loss": -27.312469482421875, "global_step": 492840, "epoch": 5937} {"train_loss": -27.41889762878418, "global_step": 492841, "epoch": 5937} {"train_loss": -27.474592208862305, "global_step": 492842, "epoch": 5937} {"train_loss": -27.32425308227539, "global_step": 492843, "epoch": 5937} {"train_loss": -27.202075958251953, "global_step": 492844, "epoch": 5937} {"train_loss": -27.58234214782715, "global_step": 492845, "epoch": 5937} {"train_loss": -27.72051429748535, "global_step": 492846, "epoch": 5937} {"train_loss": -27.191007614135742, "global_step": 492847, "epoch": 5937} {"train_loss": -27.130273818969727, "global_step": 492848, "epoch": 5937} {"train_loss": -27.4875545501709, "global_step": 492849, "epoch": 5937} {"train_loss": -27.24713706970215, "global_step": 492850, "epoch": 5937} {"train_loss": -27.628997802734375, "global_step": 492851, "epoch": 5937} {"train_loss": -27.243961334228516, "global_step": 492852, "epoch": 5937} {"train_loss": -27.2378520046372, "global_step": 492853, "epoch": 5937, "val_loss": 6558816.0} {"train_loss": -26.797582626342773, "global_step": 492854, "epoch": 5938} {"train_loss": -26.131900787353516, "global_step": 492855, "epoch": 5938} {"train_loss": -26.23208999633789, "global_step": 492856, "epoch": 5938} {"train_loss": -25.629169464111328, "global_step": 492857, "epoch": 5938} {"train_loss": -25.8726749420166, "global_step": 492858, "epoch": 5938} {"train_loss": -26.04383659362793, "global_step": 492859, "epoch": 5938} {"train_loss": -26.462940216064453, "global_step": 492860, "epoch": 5938} {"train_loss": -26.615381240844727, "global_step": 492861, "epoch": 5938} {"train_loss": -25.97273826599121, "global_step": 492862, "epoch": 5938} {"train_loss": -26.877363204956055, "global_step": 492863, "epoch": 5938} {"train_loss": -26.533273696899414, "global_step": 492864, "epoch": 5938} {"train_loss": -26.770593643188477, "global_step": 492865, "epoch": 5938} {"train_loss": -26.876373291015625, "global_step": 492866, "epoch": 5938} {"train_loss": -27.024005889892578, "global_step": 492867, "epoch": 5938} {"train_loss": -26.803686141967773, "global_step": 492868, "epoch": 5938} {"train_loss": -26.676218032836914, "global_step": 492869, "epoch": 5938} {"train_loss": -26.670379638671875, "global_step": 492870, "epoch": 5938} {"train_loss": -27.058673858642578, "global_step": 492871, "epoch": 5938} {"train_loss": -26.796585083007812, "global_step": 492872, "epoch": 5938} {"train_loss": -27.135608673095703, "global_step": 492873, "epoch": 5938} {"train_loss": -26.893726348876953, "global_step": 492874, "epoch": 5938} {"train_loss": -26.960159301757812, "global_step": 492875, "epoch": 5938} {"train_loss": -27.017108917236328, "global_step": 492876, "epoch": 5938} {"train_loss": -26.994680404663086, "global_step": 492877, "epoch": 5938} {"train_loss": -26.89552116394043, "global_step": 492878, "epoch": 5938} {"train_loss": -27.13671875, "global_step": 492879, "epoch": 5938} {"train_loss": -27.3436279296875, "global_step": 492880, "epoch": 5938} {"train_loss": -26.89902687072754, "global_step": 492881, "epoch": 5938} {"train_loss": -27.475229263305664, "global_step": 492882, "epoch": 5938} {"train_loss": -27.009815216064453, "global_step": 492883, "epoch": 5938} {"train_loss": -27.354736328125, "global_step": 492884, "epoch": 5938} {"train_loss": -27.33906364440918, "global_step": 492885, "epoch": 5938} {"train_loss": -27.4658260345459, "global_step": 492886, "epoch": 5938} {"train_loss": -26.93572998046875, "global_step": 492887, "epoch": 5938} {"train_loss": -27.558639526367188, "global_step": 492888, "epoch": 5938} {"train_loss": -27.57192039489746, "global_step": 492889, "epoch": 5938} {"train_loss": -27.092193603515625, "global_step": 492890, "epoch": 5938} {"train_loss": -27.381025314331055, "global_step": 492891, "epoch": 5938} {"train_loss": -27.54817008972168, "global_step": 492892, "epoch": 5938} {"train_loss": -27.483686447143555, "global_step": 492893, "epoch": 5938} {"train_loss": -27.48418617248535, "global_step": 492894, "epoch": 5938} {"train_loss": -27.0977725982666, "global_step": 492895, "epoch": 5938} {"train_loss": -27.632963180541992, "global_step": 492896, "epoch": 5938} {"train_loss": -27.48198890686035, "global_step": 492897, "epoch": 5938} {"train_loss": -27.368854522705078, "global_step": 492898, "epoch": 5938} {"train_loss": -27.394262313842773, "global_step": 492899, "epoch": 5938} {"train_loss": -27.42921257019043, "global_step": 492900, "epoch": 5938} {"train_loss": -27.706146240234375, "global_step": 492901, "epoch": 5938} {"train_loss": -27.466663360595703, "global_step": 492902, "epoch": 5938} {"train_loss": -27.59345817565918, "global_step": 492903, "epoch": 5938} {"train_loss": -27.192914962768555, "global_step": 492904, "epoch": 5938} {"train_loss": -27.675683975219727, "global_step": 492905, "epoch": 5938} {"train_loss": -27.565038681030273, "global_step": 492906, "epoch": 5938} {"train_loss": -27.566761016845703, "global_step": 492907, "epoch": 5938} {"train_loss": -27.51960563659668, "global_step": 492908, "epoch": 5938} {"train_loss": -27.466781616210938, "global_step": 492909, "epoch": 5938} {"train_loss": -27.474645614624023, "global_step": 492910, "epoch": 5938} {"train_loss": -27.699369430541992, "global_step": 492911, "epoch": 5938} {"train_loss": -27.411558151245117, "global_step": 492912, "epoch": 5938} {"train_loss": -27.511310577392578, "global_step": 492913, "epoch": 5938} {"train_loss": -27.349973678588867, "global_step": 492914, "epoch": 5938} {"train_loss": -27.354171752929688, "global_step": 492915, "epoch": 5938} {"train_loss": -27.37611198425293, "global_step": 492916, "epoch": 5938} {"train_loss": -27.652353286743164, "global_step": 492917, "epoch": 5938} {"train_loss": -27.579599380493164, "global_step": 492918, "epoch": 5938} {"train_loss": -27.2007999420166, "global_step": 492919, "epoch": 5938} {"train_loss": -27.516956329345703, "global_step": 492920, "epoch": 5938} {"train_loss": -27.578046798706055, "global_step": 492921, "epoch": 5938} {"train_loss": -27.1651668548584, "global_step": 492922, "epoch": 5938} {"train_loss": -27.118383407592773, "global_step": 492923, "epoch": 5938} {"train_loss": -26.816741943359375, "global_step": 492924, "epoch": 5938} {"train_loss": -26.875091552734375, "global_step": 492925, "epoch": 5938} {"train_loss": -27.013473510742188, "global_step": 492926, "epoch": 5938} {"train_loss": -27.234277725219727, "global_step": 492927, "epoch": 5938} {"train_loss": -26.837799072265625, "global_step": 492928, "epoch": 5938} {"train_loss": -27.049291610717773, "global_step": 492929, "epoch": 5938} {"train_loss": -27.160144805908203, "global_step": 492930, "epoch": 5938} {"train_loss": -26.939916610717773, "global_step": 492931, "epoch": 5938} {"train_loss": -27.28895378112793, "global_step": 492932, "epoch": 5938} {"train_loss": -27.31572914123535, "global_step": 492933, "epoch": 5938} {"train_loss": -27.525501251220703, "global_step": 492934, "epoch": 5938} {"train_loss": -27.2982234954834, "global_step": 492935, "epoch": 5938} {"train_loss": -27.125518569027086, "global_step": 492936, "epoch": 5938, "val_loss": 6600563.0} {"train_loss": -26.90321159362793, "global_step": 492937, "epoch": 5939} {"train_loss": -26.893585205078125, "global_step": 492938, "epoch": 5939} {"train_loss": -26.809539794921875, "global_step": 492939, "epoch": 5939} {"train_loss": -26.50397300720215, "global_step": 492940, "epoch": 5939} {"train_loss": -27.120574951171875, "global_step": 492941, "epoch": 5939} {"train_loss": -26.76323890686035, "global_step": 492942, "epoch": 5939} {"train_loss": -26.661096572875977, "global_step": 492943, "epoch": 5939} {"train_loss": -26.22816276550293, "global_step": 492944, "epoch": 5939} {"train_loss": -27.181798934936523, "global_step": 492945, "epoch": 5939} {"train_loss": -26.73076820373535, "global_step": 492946, "epoch": 5939} {"train_loss": -26.87424659729004, "global_step": 492947, "epoch": 5939} {"train_loss": -26.928619384765625, "global_step": 492948, "epoch": 5939} {"train_loss": -27.02790641784668, "global_step": 492949, "epoch": 5939} {"train_loss": -26.854284286499023, "global_step": 492950, "epoch": 5939} {"train_loss": -27.080942153930664, "global_step": 492951, "epoch": 5939} {"train_loss": -26.989521026611328, "global_step": 492952, "epoch": 5939} {"train_loss": -27.0125675201416, "global_step": 492953, "epoch": 5939} {"train_loss": -26.855121612548828, "global_step": 492954, "epoch": 5939} {"train_loss": -27.008535385131836, "global_step": 492955, "epoch": 5939} {"train_loss": -26.962646484375, "global_step": 492956, "epoch": 5939} {"train_loss": -27.384811401367188, "global_step": 492957, "epoch": 5939} {"train_loss": -27.110300064086914, "global_step": 492958, "epoch": 5939} {"train_loss": -27.123865127563477, "global_step": 492959, "epoch": 5939} {"train_loss": -27.173120498657227, "global_step": 492960, "epoch": 5939} {"train_loss": -26.953369140625, "global_step": 492961, "epoch": 5939} {"train_loss": -27.17964744567871, "global_step": 492962, "epoch": 5939} {"train_loss": -27.326257705688477, "global_step": 492963, "epoch": 5939} {"train_loss": -27.136526107788086, "global_step": 492964, "epoch": 5939} {"train_loss": -27.044626235961914, "global_step": 492965, "epoch": 5939} {"train_loss": -27.1748104095459, "global_step": 492966, "epoch": 5939} {"train_loss": -27.08802604675293, "global_step": 492967, "epoch": 5939} {"train_loss": -27.040292739868164, "global_step": 492968, "epoch": 5939} {"train_loss": -27.2073917388916, "global_step": 492969, "epoch": 5939} {"train_loss": -27.642648696899414, "global_step": 492970, "epoch": 5939} {"train_loss": -27.220373153686523, "global_step": 492971, "epoch": 5939} {"train_loss": -27.519256591796875, "global_step": 492972, "epoch": 5939} {"train_loss": -27.21380615234375, "global_step": 492973, "epoch": 5939} {"train_loss": -27.468854904174805, "global_step": 492974, "epoch": 5939} {"train_loss": -27.26715660095215, "global_step": 492975, "epoch": 5939} {"train_loss": -27.591665267944336, "global_step": 492976, "epoch": 5939} {"train_loss": -27.436416625976562, "global_step": 492977, "epoch": 5939} {"train_loss": -27.627487182617188, "global_step": 492978, "epoch": 5939} {"train_loss": -27.485021591186523, "global_step": 492979, "epoch": 5939} {"train_loss": -27.43950843811035, "global_step": 492980, "epoch": 5939} {"train_loss": -27.300048828125, "global_step": 492981, "epoch": 5939} {"train_loss": -27.297346115112305, "global_step": 492982, "epoch": 5939} {"train_loss": -27.591358184814453, "global_step": 492983, "epoch": 5939} {"train_loss": -27.606550216674805, "global_step": 492984, "epoch": 5939} {"train_loss": -27.591306686401367, "global_step": 492985, "epoch": 5939} {"train_loss": -27.334985733032227, "global_step": 492986, "epoch": 5939} {"train_loss": -27.2958927154541, "global_step": 492987, "epoch": 5939} {"train_loss": -27.558252334594727, "global_step": 492988, "epoch": 5939} {"train_loss": -27.378870010375977, "global_step": 492989, "epoch": 5939} {"train_loss": -27.45496940612793, "global_step": 492990, "epoch": 5939} {"train_loss": -26.656970977783203, "global_step": 492991, "epoch": 5939} {"train_loss": -27.37062644958496, "global_step": 492992, "epoch": 5939} {"train_loss": -27.2595157623291, "global_step": 492993, "epoch": 5939} {"train_loss": -27.098114013671875, "global_step": 492994, "epoch": 5939} {"train_loss": -27.134790420532227, "global_step": 492995, "epoch": 5939} {"train_loss": -27.1212215423584, "global_step": 492996, "epoch": 5939} {"train_loss": -27.16877555847168, "global_step": 492997, "epoch": 5939} {"train_loss": -27.077289581298828, "global_step": 492998, "epoch": 5939} {"train_loss": -27.517065048217773, "global_step": 492999, "epoch": 5939} {"train_loss": -26.990997314453125, "global_step": 493000, "epoch": 5939} {"train_loss": -26.906164169311523, "global_step": 493001, "epoch": 5939} {"train_loss": -26.82732582092285, "global_step": 493002, "epoch": 5939} {"train_loss": -27.272445678710938, "global_step": 493003, "epoch": 5939} {"train_loss": -27.276758193969727, "global_step": 493004, "epoch": 5939} {"train_loss": -27.064945220947266, "global_step": 493005, "epoch": 5939} {"train_loss": -26.8203182220459, "global_step": 493006, "epoch": 5939} {"train_loss": -26.7182674407959, "global_step": 493007, "epoch": 5939} {"train_loss": -27.167585372924805, "global_step": 493008, "epoch": 5939} {"train_loss": -27.156982421875, "global_step": 493009, "epoch": 5939} {"train_loss": -27.13739013671875, "global_step": 493010, "epoch": 5939} {"train_loss": -27.216827392578125, "global_step": 493011, "epoch": 5939} {"train_loss": -27.41876792907715, "global_step": 493012, "epoch": 5939} {"train_loss": -27.2358341217041, "global_step": 493013, "epoch": 5939} {"train_loss": -27.490182876586914, "global_step": 493014, "epoch": 5939} {"train_loss": -27.341821670532227, "global_step": 493015, "epoch": 5939} {"train_loss": -27.57034683227539, "global_step": 493016, "epoch": 5939} {"train_loss": -27.233564376831055, "global_step": 493017, "epoch": 5939} {"train_loss": -27.485754013061523, "global_step": 493018, "epoch": 5939} {"train_loss": -27.162259963621576, "global_step": 493019, "epoch": 5939, "val_loss": 6541174.0} {"train_loss": -26.781036376953125, "global_step": 493020, "epoch": 5940} {"train_loss": -26.577960968017578, "global_step": 493021, "epoch": 5940} {"train_loss": -26.749242782592773, "global_step": 493022, "epoch": 5940} {"train_loss": -26.638660430908203, "global_step": 493023, "epoch": 5940} {"train_loss": -26.5480899810791, "global_step": 493024, "epoch": 5940} {"train_loss": -26.999902725219727, "global_step": 493025, "epoch": 5940} {"train_loss": -26.64072608947754, "global_step": 493026, "epoch": 5940} {"train_loss": -26.80415153503418, "global_step": 493027, "epoch": 5940} {"train_loss": -26.885589599609375, "global_step": 493028, "epoch": 5940} {"train_loss": -27.53567886352539, "global_step": 493029, "epoch": 5940} {"train_loss": -27.38758659362793, "global_step": 493030, "epoch": 5940} {"train_loss": -27.218534469604492, "global_step": 493031, "epoch": 5940} {"train_loss": -27.14217185974121, "global_step": 493032, "epoch": 5940} {"train_loss": -26.949966430664062, "global_step": 493033, "epoch": 5940} {"train_loss": -26.725971221923828, "global_step": 493034, "epoch": 5940} {"train_loss": -27.2591609954834, "global_step": 493035, "epoch": 5940} {"train_loss": -27.13164710998535, "global_step": 493036, "epoch": 5940} {"train_loss": -27.0659122467041, "global_step": 493037, "epoch": 5940} {"train_loss": -26.9056453704834, "global_step": 493038, "epoch": 5940} {"train_loss": -27.066797256469727, "global_step": 493039, "epoch": 5940} {"train_loss": -26.938858032226562, "global_step": 493040, "epoch": 5940} {"train_loss": -27.08843421936035, "global_step": 493041, "epoch": 5940} {"train_loss": -27.088306427001953, "global_step": 493042, "epoch": 5940} {"train_loss": -27.155054092407227, "global_step": 493043, "epoch": 5940} {"train_loss": -26.952545166015625, "global_step": 493044, "epoch": 5940} {"train_loss": -27.239980697631836, "global_step": 493045, "epoch": 5940} {"train_loss": -27.129470825195312, "global_step": 493046, "epoch": 5940} {"train_loss": -27.48769187927246, "global_step": 493047, "epoch": 5940} {"train_loss": -27.585651397705078, "global_step": 493048, "epoch": 5940} {"train_loss": -27.20052146911621, "global_step": 493049, "epoch": 5940} {"train_loss": -27.545291900634766, "global_step": 493050, "epoch": 5940} {"train_loss": -27.382394790649414, "global_step": 493051, "epoch": 5940} {"train_loss": -27.368345260620117, "global_step": 493052, "epoch": 5940} {"train_loss": -27.3903865814209, "global_step": 493053, "epoch": 5940} {"train_loss": -27.58780860900879, "global_step": 493054, "epoch": 5940} {"train_loss": -27.391950607299805, "global_step": 493055, "epoch": 5940} {"train_loss": -27.402511596679688, "global_step": 493056, "epoch": 5940} {"train_loss": -27.347524642944336, "global_step": 493057, "epoch": 5940} {"train_loss": -27.45855712890625, "global_step": 493058, "epoch": 5940} {"train_loss": -27.413379669189453, "global_step": 493059, "epoch": 5940} {"train_loss": -27.193933486938477, "global_step": 493060, "epoch": 5940} {"train_loss": -27.538358688354492, "global_step": 493061, "epoch": 5940} {"train_loss": -27.2271671295166, "global_step": 493062, "epoch": 5940} {"train_loss": -27.658811569213867, "global_step": 493063, "epoch": 5940} {"train_loss": -27.656232833862305, "global_step": 493064, "epoch": 5940} {"train_loss": -27.55202293395996, "global_step": 493065, "epoch": 5940} {"train_loss": -27.336339950561523, "global_step": 493066, "epoch": 5940} {"train_loss": -27.72037124633789, "global_step": 493067, "epoch": 5940} {"train_loss": -27.769916534423828, "global_step": 493068, "epoch": 5940} {"train_loss": -27.756223678588867, "global_step": 493069, "epoch": 5940} {"train_loss": -27.3463077545166, "global_step": 493070, "epoch": 5940} {"train_loss": -27.360685348510742, "global_step": 493071, "epoch": 5940} {"train_loss": -27.59125328063965, "global_step": 493072, "epoch": 5940} {"train_loss": -27.69108009338379, "global_step": 493073, "epoch": 5940} {"train_loss": -27.313617706298828, "global_step": 493074, "epoch": 5940} {"train_loss": -27.407983779907227, "global_step": 493075, "epoch": 5940} {"train_loss": -27.40787124633789, "global_step": 493076, "epoch": 5940} {"train_loss": -26.714115142822266, "global_step": 493077, "epoch": 5940} {"train_loss": -26.911914825439453, "global_step": 493078, "epoch": 5940} {"train_loss": -27.200424194335938, "global_step": 493079, "epoch": 5940} {"train_loss": -27.255903244018555, "global_step": 493080, "epoch": 5940} {"train_loss": -26.984155654907227, "global_step": 493081, "epoch": 5940} {"train_loss": -27.246337890625, "global_step": 493082, "epoch": 5940} {"train_loss": -27.317296981811523, "global_step": 493083, "epoch": 5940} {"train_loss": -27.238439559936523, "global_step": 493084, "epoch": 5940} {"train_loss": -26.952396392822266, "global_step": 493085, "epoch": 5940} {"train_loss": -27.15186882019043, "global_step": 493086, "epoch": 5940} {"train_loss": -27.01051139831543, "global_step": 493087, "epoch": 5940} {"train_loss": -27.226816177368164, "global_step": 493088, "epoch": 5940} {"train_loss": -27.042661666870117, "global_step": 493089, "epoch": 5940} {"train_loss": -27.24299430847168, "global_step": 493090, "epoch": 5940} {"train_loss": -27.105093002319336, "global_step": 493091, "epoch": 5940} {"train_loss": -27.553403854370117, "global_step": 493092, "epoch": 5940} {"train_loss": -27.3937931060791, "global_step": 493093, "epoch": 5940} {"train_loss": -27.315876007080078, "global_step": 493094, "epoch": 5940} {"train_loss": -27.489309310913086, "global_step": 493095, "epoch": 5940} {"train_loss": -27.61549186706543, "global_step": 493096, "epoch": 5940} {"train_loss": -27.139352798461914, "global_step": 493097, "epoch": 5940} {"train_loss": -27.119043350219727, "global_step": 493098, "epoch": 5940} {"train_loss": -27.151838302612305, "global_step": 493099, "epoch": 5940} {"train_loss": -27.4808349609375, "global_step": 493100, "epoch": 5940} {"train_loss": -27.64047622680664, "global_step": 493101, "epoch": 5940} {"train_loss": -27.254418062876507, "global_step": 493102, "epoch": 5940, "val_loss": 6611989.5} {"train_loss": -27.02315330505371, "global_step": 493103, "epoch": 5941} {"train_loss": -25.493783950805664, "global_step": 493104, "epoch": 5941} {"train_loss": -26.46077537536621, "global_step": 493105, "epoch": 5941} {"train_loss": -26.69175148010254, "global_step": 493106, "epoch": 5941} {"train_loss": -25.971694946289062, "global_step": 493107, "epoch": 5941} {"train_loss": -26.937580108642578, "global_step": 493108, "epoch": 5941} {"train_loss": -26.84783935546875, "global_step": 493109, "epoch": 5941} {"train_loss": -26.33082389831543, "global_step": 493110, "epoch": 5941} {"train_loss": -27.091785430908203, "global_step": 493111, "epoch": 5941} {"train_loss": -26.154687881469727, "global_step": 493112, "epoch": 5941} {"train_loss": -26.941070556640625, "global_step": 493113, "epoch": 5941} {"train_loss": -26.952478408813477, "global_step": 493114, "epoch": 5941} {"train_loss": -26.7977352142334, "global_step": 493115, "epoch": 5941} {"train_loss": -26.69349479675293, "global_step": 493116, "epoch": 5941} {"train_loss": -27.392837524414062, "global_step": 493117, "epoch": 5941} {"train_loss": -27.02937126159668, "global_step": 493118, "epoch": 5941} {"train_loss": -27.331647872924805, "global_step": 493119, "epoch": 5941} {"train_loss": -27.082727432250977, "global_step": 493120, "epoch": 5941} {"train_loss": -27.022296905517578, "global_step": 493121, "epoch": 5941} {"train_loss": -27.36115837097168, "global_step": 493122, "epoch": 5941} {"train_loss": -27.146387100219727, "global_step": 493123, "epoch": 5941} {"train_loss": -27.190631866455078, "global_step": 493124, "epoch": 5941} {"train_loss": -27.134870529174805, "global_step": 493125, "epoch": 5941} {"train_loss": -27.45502281188965, "global_step": 493126, "epoch": 5941} {"train_loss": -27.337095260620117, "global_step": 493127, "epoch": 5941} {"train_loss": -27.1475830078125, "global_step": 493128, "epoch": 5941} {"train_loss": -27.2602481842041, "global_step": 493129, "epoch": 5941} {"train_loss": -27.425628662109375, "global_step": 493130, "epoch": 5941} {"train_loss": -27.485883712768555, "global_step": 493131, "epoch": 5941} {"train_loss": -27.251928329467773, "global_step": 493132, "epoch": 5941} {"train_loss": -27.08746910095215, "global_step": 493133, "epoch": 5941} {"train_loss": -27.361738204956055, "global_step": 493134, "epoch": 5941} {"train_loss": -27.251007080078125, "global_step": 493135, "epoch": 5941} {"train_loss": -27.556610107421875, "global_step": 493136, "epoch": 5941} {"train_loss": -27.45435905456543, "global_step": 493137, "epoch": 5941} {"train_loss": -27.188764572143555, "global_step": 493138, "epoch": 5941} {"train_loss": -27.462066650390625, "global_step": 493139, "epoch": 5941} {"train_loss": -27.41949462890625, "global_step": 493140, "epoch": 5941} {"train_loss": -27.507375717163086, "global_step": 493141, "epoch": 5941} {"train_loss": -27.446313858032227, "global_step": 493142, "epoch": 5941} {"train_loss": -27.279748916625977, "global_step": 493143, "epoch": 5941} {"train_loss": -27.423246383666992, "global_step": 493144, "epoch": 5941} {"train_loss": -27.53228187561035, "global_step": 493145, "epoch": 5941} {"train_loss": -27.808191299438477, "global_step": 493146, "epoch": 5941} {"train_loss": -27.728078842163086, "global_step": 493147, "epoch": 5941} {"train_loss": -27.57854652404785, "global_step": 493148, "epoch": 5941} {"train_loss": -27.559406280517578, "global_step": 493149, "epoch": 5941} {"train_loss": -27.86041831970215, "global_step": 493150, "epoch": 5941} {"train_loss": -27.78419303894043, "global_step": 493151, "epoch": 5941} {"train_loss": -27.611616134643555, "global_step": 493152, "epoch": 5941} {"train_loss": -27.65530776977539, "global_step": 493153, "epoch": 5941} {"train_loss": -27.413421630859375, "global_step": 493154, "epoch": 5941} {"train_loss": -27.288562774658203, "global_step": 493155, "epoch": 5941} {"train_loss": -27.767078399658203, "global_step": 493156, "epoch": 5941} {"train_loss": -27.578800201416016, "global_step": 493157, "epoch": 5941} {"train_loss": -27.441089630126953, "global_step": 493158, "epoch": 5941} {"train_loss": -27.863052368164062, "global_step": 493159, "epoch": 5941} {"train_loss": -27.32196617126465, "global_step": 493160, "epoch": 5941} {"train_loss": -27.477705001831055, "global_step": 493161, "epoch": 5941} {"train_loss": -27.632959365844727, "global_step": 493162, "epoch": 5941} {"train_loss": -27.92018699645996, "global_step": 493163, "epoch": 5941} {"train_loss": -27.223249435424805, "global_step": 493164, "epoch": 5941} {"train_loss": -27.2137393951416, "global_step": 493165, "epoch": 5941} {"train_loss": -27.656824111938477, "global_step": 493166, "epoch": 5941} {"train_loss": -27.293994903564453, "global_step": 493167, "epoch": 5941} {"train_loss": -27.097593307495117, "global_step": 493168, "epoch": 5941} {"train_loss": -27.2692928314209, "global_step": 493169, "epoch": 5941} {"train_loss": -27.01328468322754, "global_step": 493170, "epoch": 5941} {"train_loss": -27.79359245300293, "global_step": 493171, "epoch": 5941} {"train_loss": -27.365447998046875, "global_step": 493172, "epoch": 5941} {"train_loss": -26.93499183654785, "global_step": 493173, "epoch": 5941} {"train_loss": -27.204181671142578, "global_step": 493174, "epoch": 5941} {"train_loss": -26.964435577392578, "global_step": 493175, "epoch": 5941} {"train_loss": -27.2512149810791, "global_step": 493176, "epoch": 5941} {"train_loss": -27.002918243408203, "global_step": 493177, "epoch": 5941} {"train_loss": -27.576629638671875, "global_step": 493178, "epoch": 5941} {"train_loss": -27.185565948486328, "global_step": 493179, "epoch": 5941} {"train_loss": -27.366836547851562, "global_step": 493180, "epoch": 5941} {"train_loss": -27.59303092956543, "global_step": 493181, "epoch": 5941} {"train_loss": -27.31629753112793, "global_step": 493182, "epoch": 5941} {"train_loss": -27.434341430664062, "global_step": 493183, "epoch": 5941} {"train_loss": -27.1800537109375, "global_step": 493184, "epoch": 5941} {"train_loss": -27.268548919493895, "global_step": 493185, "epoch": 5941, "val_loss": 6597563.0} {"train_loss": -26.177011489868164, "global_step": 493186, "epoch": 5942} {"train_loss": -25.629308700561523, "global_step": 493187, "epoch": 5942} {"train_loss": -26.770841598510742, "global_step": 493188, "epoch": 5942} {"train_loss": -27.115222930908203, "global_step": 493189, "epoch": 5942} {"train_loss": -26.561370849609375, "global_step": 493190, "epoch": 5942} {"train_loss": -27.4206600189209, "global_step": 493191, "epoch": 5942} {"train_loss": -26.93522071838379, "global_step": 493192, "epoch": 5942} {"train_loss": -27.584333419799805, "global_step": 493193, "epoch": 5942} {"train_loss": -26.735151290893555, "global_step": 493194, "epoch": 5942} {"train_loss": -27.437103271484375, "global_step": 493195, "epoch": 5942} {"train_loss": -27.00030517578125, "global_step": 493196, "epoch": 5942} {"train_loss": -27.254438400268555, "global_step": 493197, "epoch": 5942} {"train_loss": -27.433813095092773, "global_step": 493198, "epoch": 5942} {"train_loss": -27.144149780273438, "global_step": 493199, "epoch": 5942} {"train_loss": -27.44634437561035, "global_step": 493200, "epoch": 5942} {"train_loss": -26.850194931030273, "global_step": 493201, "epoch": 5942} {"train_loss": -27.56626319885254, "global_step": 493202, "epoch": 5942} {"train_loss": -27.376468658447266, "global_step": 493203, "epoch": 5942} {"train_loss": -27.22779655456543, "global_step": 493204, "epoch": 5942} {"train_loss": -27.23126792907715, "global_step": 493205, "epoch": 5942} {"train_loss": -27.1884765625, "global_step": 493206, "epoch": 5942} {"train_loss": -27.12788200378418, "global_step": 493207, "epoch": 5942} {"train_loss": -27.2847957611084, "global_step": 493208, "epoch": 5942} {"train_loss": -27.186481475830078, "global_step": 493209, "epoch": 5942} {"train_loss": -27.657184600830078, "global_step": 493210, "epoch": 5942} {"train_loss": -27.584054946899414, "global_step": 493211, "epoch": 5942} {"train_loss": -27.08595085144043, "global_step": 493212, "epoch": 5942} {"train_loss": -27.330957412719727, "global_step": 493213, "epoch": 5942} {"train_loss": -27.146686553955078, "global_step": 493214, "epoch": 5942} {"train_loss": -27.0860652923584, "global_step": 493215, "epoch": 5942} {"train_loss": -27.111413955688477, "global_step": 493216, "epoch": 5942} {"train_loss": -27.1748046875, "global_step": 493217, "epoch": 5942} {"train_loss": -27.45904541015625, "global_step": 493218, "epoch": 5942} {"train_loss": -27.536996841430664, "global_step": 493219, "epoch": 5942} {"train_loss": -27.102895736694336, "global_step": 493220, "epoch": 5942} {"train_loss": -27.29469108581543, "global_step": 493221, "epoch": 5942} {"train_loss": -27.158065795898438, "global_step": 493222, "epoch": 5942} {"train_loss": -27.02754020690918, "global_step": 493223, "epoch": 5942} {"train_loss": -27.254186630249023, "global_step": 493224, "epoch": 5942} {"train_loss": -27.632354736328125, "global_step": 493225, "epoch": 5942} {"train_loss": -27.218402862548828, "global_step": 493226, "epoch": 5942} {"train_loss": -27.671661376953125, "global_step": 493227, "epoch": 5942} {"train_loss": -27.511693954467773, "global_step": 493228, "epoch": 5942} {"train_loss": -27.429962158203125, "global_step": 493229, "epoch": 5942} {"train_loss": -27.281930923461914, "global_step": 493230, "epoch": 5942} {"train_loss": -27.168548583984375, "global_step": 493231, "epoch": 5942} {"train_loss": -27.72893714904785, "global_step": 493232, "epoch": 5942} {"train_loss": -27.415430068969727, "global_step": 493233, "epoch": 5942} {"train_loss": -27.469404220581055, "global_step": 493234, "epoch": 5942} {"train_loss": -27.410436630249023, "global_step": 493235, "epoch": 5942} {"train_loss": -27.1763858795166, "global_step": 493236, "epoch": 5942} {"train_loss": -27.411148071289062, "global_step": 493237, "epoch": 5942} {"train_loss": -27.36699867248535, "global_step": 493238, "epoch": 5942} {"train_loss": -27.402923583984375, "global_step": 493239, "epoch": 5942} {"train_loss": -27.374032974243164, "global_step": 493240, "epoch": 5942} {"train_loss": -27.02228355407715, "global_step": 493241, "epoch": 5942} {"train_loss": -27.477508544921875, "global_step": 493242, "epoch": 5942} {"train_loss": -27.616003036499023, "global_step": 493243, "epoch": 5942} {"train_loss": -27.1041259765625, "global_step": 493244, "epoch": 5942} {"train_loss": -27.579198837280273, "global_step": 493245, "epoch": 5942} {"train_loss": -27.243513107299805, "global_step": 493246, "epoch": 5942} {"train_loss": -27.250431060791016, "global_step": 493247, "epoch": 5942} {"train_loss": -27.528112411499023, "global_step": 493248, "epoch": 5942} {"train_loss": -27.16094970703125, "global_step": 493249, "epoch": 5942} {"train_loss": -27.06952476501465, "global_step": 493250, "epoch": 5942} {"train_loss": -27.082828521728516, "global_step": 493251, "epoch": 5942} {"train_loss": -27.297582626342773, "global_step": 493252, "epoch": 5942} {"train_loss": -26.69138526916504, "global_step": 493253, "epoch": 5942} {"train_loss": -27.8054256439209, "global_step": 493254, "epoch": 5942} {"train_loss": -27.2141056060791, "global_step": 493255, "epoch": 5942} {"train_loss": -26.777963638305664, "global_step": 493256, "epoch": 5942} {"train_loss": -26.768661499023438, "global_step": 493257, "epoch": 5942} {"train_loss": -26.881149291992188, "global_step": 493258, "epoch": 5942} {"train_loss": -27.21156120300293, "global_step": 493259, "epoch": 5942} {"train_loss": -27.38111686706543, "global_step": 493260, "epoch": 5942} {"train_loss": -27.27589225769043, "global_step": 493261, "epoch": 5942} {"train_loss": -27.316919326782227, "global_step": 493262, "epoch": 5942} {"train_loss": -27.672916412353516, "global_step": 493263, "epoch": 5942} {"train_loss": -27.32476234436035, "global_step": 493264, "epoch": 5942} {"train_loss": -27.033100128173828, "global_step": 493265, "epoch": 5942} {"train_loss": -27.22150230407715, "global_step": 493266, "epoch": 5942} {"train_loss": -27.1025390625, "global_step": 493267, "epoch": 5942} {"train_loss": -27.220071195119836, "global_step": 493268, "epoch": 5942, "val_loss": 6540750.0} {"train_loss": -26.902099609375, "global_step": 493269, "epoch": 5943} {"train_loss": -27.082422256469727, "global_step": 493270, "epoch": 5943} {"train_loss": -26.98492431640625, "global_step": 493271, "epoch": 5943} {"train_loss": -26.99751853942871, "global_step": 493272, "epoch": 5943} {"train_loss": -26.592182159423828, "global_step": 493273, "epoch": 5943} {"train_loss": -27.270416259765625, "global_step": 493274, "epoch": 5943} {"train_loss": -26.97328758239746, "global_step": 493275, "epoch": 5943} {"train_loss": -27.210424423217773, "global_step": 493276, "epoch": 5943} {"train_loss": -27.09535026550293, "global_step": 493277, "epoch": 5943} {"train_loss": -27.1893367767334, "global_step": 493278, "epoch": 5943} {"train_loss": -27.157291412353516, "global_step": 493279, "epoch": 5943} {"train_loss": -27.027395248413086, "global_step": 493280, "epoch": 5943} {"train_loss": -27.221281051635742, "global_step": 493281, "epoch": 5943} {"train_loss": -27.234479904174805, "global_step": 493282, "epoch": 5943} {"train_loss": -27.075231552124023, "global_step": 493283, "epoch": 5943} {"train_loss": -27.5333194732666, "global_step": 493284, "epoch": 5943} {"train_loss": -27.43436050415039, "global_step": 493285, "epoch": 5943} {"train_loss": -27.200973510742188, "global_step": 493286, "epoch": 5943} {"train_loss": -27.397998809814453, "global_step": 493287, "epoch": 5943} {"train_loss": -27.1436710357666, "global_step": 493288, "epoch": 5943} {"train_loss": -27.4315185546875, "global_step": 493289, "epoch": 5943} {"train_loss": -27.173925399780273, "global_step": 493290, "epoch": 5943} {"train_loss": -27.510900497436523, "global_step": 493291, "epoch": 5943} {"train_loss": -27.719970703125, "global_step": 493292, "epoch": 5943} {"train_loss": -27.021421432495117, "global_step": 493293, "epoch": 5943} {"train_loss": -27.549585342407227, "global_step": 493294, "epoch": 5943} {"train_loss": -27.34866714477539, "global_step": 493295, "epoch": 5943} {"train_loss": -27.5576229095459, "global_step": 493296, "epoch": 5943} {"train_loss": -27.4736385345459, "global_step": 493297, "epoch": 5943} {"train_loss": -27.275741577148438, "global_step": 493298, "epoch": 5943} {"train_loss": -27.334644317626953, "global_step": 493299, "epoch": 5943} {"train_loss": -27.747711181640625, "global_step": 493300, "epoch": 5943} {"train_loss": -27.376737594604492, "global_step": 493301, "epoch": 5943} {"train_loss": -27.42947769165039, "global_step": 493302, "epoch": 5943} {"train_loss": -27.45831298828125, "global_step": 493303, "epoch": 5943} {"train_loss": -27.483922958374023, "global_step": 493304, "epoch": 5943} {"train_loss": -27.374174118041992, "global_step": 493305, "epoch": 5943} {"train_loss": -27.34635353088379, "global_step": 493306, "epoch": 5943} {"train_loss": -27.541227340698242, "global_step": 493307, "epoch": 5943} {"train_loss": -27.251850128173828, "global_step": 493308, "epoch": 5943} {"train_loss": -27.243783950805664, "global_step": 493309, "epoch": 5943} {"train_loss": -27.65874671936035, "global_step": 493310, "epoch": 5943} {"train_loss": -27.076950073242188, "global_step": 493311, "epoch": 5943} {"train_loss": -27.47596549987793, "global_step": 493312, "epoch": 5943} {"train_loss": -27.109619140625, "global_step": 493313, "epoch": 5943} {"train_loss": -27.19325065612793, "global_step": 493314, "epoch": 5943} {"train_loss": -27.125375747680664, "global_step": 493315, "epoch": 5943} {"train_loss": -27.695083618164062, "global_step": 493316, "epoch": 5943} {"train_loss": -27.246557235717773, "global_step": 493317, "epoch": 5943} {"train_loss": -27.12452507019043, "global_step": 493318, "epoch": 5943} {"train_loss": -27.451313018798828, "global_step": 493319, "epoch": 5943} {"train_loss": -27.271224975585938, "global_step": 493320, "epoch": 5943} {"train_loss": -27.587377548217773, "global_step": 493321, "epoch": 5943} {"train_loss": -27.12579345703125, "global_step": 493322, "epoch": 5943} {"train_loss": -27.377790451049805, "global_step": 493323, "epoch": 5943} {"train_loss": -27.34173583984375, "global_step": 493324, "epoch": 5943} {"train_loss": -27.647480010986328, "global_step": 493325, "epoch": 5943} {"train_loss": -27.527942657470703, "global_step": 493326, "epoch": 5943} {"train_loss": -26.79833984375, "global_step": 493327, "epoch": 5943} {"train_loss": -27.30970573425293, "global_step": 493328, "epoch": 5943} {"train_loss": -27.081775665283203, "global_step": 493329, "epoch": 5943} {"train_loss": -27.088153839111328, "global_step": 493330, "epoch": 5943} {"train_loss": -27.288251876831055, "global_step": 493331, "epoch": 5943} {"train_loss": -27.297800064086914, "global_step": 493332, "epoch": 5943} {"train_loss": -27.320371627807617, "global_step": 493333, "epoch": 5943} {"train_loss": -27.666913986206055, "global_step": 493334, "epoch": 5943} {"train_loss": -27.189483642578125, "global_step": 493335, "epoch": 5943} {"train_loss": -27.481306076049805, "global_step": 493336, "epoch": 5943} {"train_loss": -27.276172637939453, "global_step": 493337, "epoch": 5943} {"train_loss": -27.517942428588867, "global_step": 493338, "epoch": 5943} {"train_loss": -27.765518188476562, "global_step": 493339, "epoch": 5943} {"train_loss": -27.213104248046875, "global_step": 493340, "epoch": 5943} {"train_loss": -27.800750732421875, "global_step": 493341, "epoch": 5943} {"train_loss": -26.98641014099121, "global_step": 493342, "epoch": 5943} {"train_loss": -27.580291748046875, "global_step": 493343, "epoch": 5943} {"train_loss": -27.199575424194336, "global_step": 493344, "epoch": 5943} {"train_loss": -26.961450576782227, "global_step": 493345, "epoch": 5943} {"train_loss": -27.272119522094727, "global_step": 493346, "epoch": 5943} {"train_loss": -27.325916290283203, "global_step": 493347, "epoch": 5943} {"train_loss": -27.483346939086914, "global_step": 493348, "epoch": 5943} {"train_loss": -27.49708366394043, "global_step": 493349, "epoch": 5943} {"train_loss": -27.440122604370117, "global_step": 493350, "epoch": 5943} {"train_loss": -27.293314577585242, "global_step": 493351, "epoch": 5943, "val_loss": 6641566.0} {"train_loss": -27.151351928710938, "global_step": 493352, "epoch": 5944} {"train_loss": -26.061298370361328, "global_step": 493353, "epoch": 5944} {"train_loss": -26.638477325439453, "global_step": 493354, "epoch": 5944} {"train_loss": -26.435773849487305, "global_step": 493355, "epoch": 5944} {"train_loss": -25.9617919921875, "global_step": 493356, "epoch": 5944} {"train_loss": -26.967741012573242, "global_step": 493357, "epoch": 5944} {"train_loss": -26.498157501220703, "global_step": 493358, "epoch": 5944} {"train_loss": -26.8291072845459, "global_step": 493359, "epoch": 5944} {"train_loss": -26.482141494750977, "global_step": 493360, "epoch": 5944} {"train_loss": -27.1254825592041, "global_step": 493361, "epoch": 5944} {"train_loss": -26.783639907836914, "global_step": 493362, "epoch": 5944} {"train_loss": -27.099740982055664, "global_step": 493363, "epoch": 5944} {"train_loss": -27.044910430908203, "global_step": 493364, "epoch": 5944} {"train_loss": -27.173803329467773, "global_step": 493365, "epoch": 5944} {"train_loss": -26.78769302368164, "global_step": 493366, "epoch": 5944} {"train_loss": -27.1226863861084, "global_step": 493367, "epoch": 5944} {"train_loss": -26.775665283203125, "global_step": 493368, "epoch": 5944} {"train_loss": -27.026336669921875, "global_step": 493369, "epoch": 5944} {"train_loss": -27.144912719726562, "global_step": 493370, "epoch": 5944} {"train_loss": -27.017797470092773, "global_step": 493371, "epoch": 5944} {"train_loss": -26.940876007080078, "global_step": 493372, "epoch": 5944} {"train_loss": -27.158477783203125, "global_step": 493373, "epoch": 5944} {"train_loss": -27.417322158813477, "global_step": 493374, "epoch": 5944} {"train_loss": -27.18779945373535, "global_step": 493375, "epoch": 5944} {"train_loss": -27.22609519958496, "global_step": 493376, "epoch": 5944} {"train_loss": -27.0616397857666, "global_step": 493377, "epoch": 5944} {"train_loss": -27.476545333862305, "global_step": 493378, "epoch": 5944} {"train_loss": -27.312238693237305, "global_step": 493379, "epoch": 5944} {"train_loss": -27.285070419311523, "global_step": 493380, "epoch": 5944} {"train_loss": -27.3968505859375, "global_step": 493381, "epoch": 5944} {"train_loss": -27.527265548706055, "global_step": 493382, "epoch": 5944} {"train_loss": -27.74613380432129, "global_step": 493383, "epoch": 5944} {"train_loss": -27.5336856842041, "global_step": 493384, "epoch": 5944} {"train_loss": -26.94156265258789, "global_step": 493385, "epoch": 5944} {"train_loss": -27.373498916625977, "global_step": 493386, "epoch": 5944} {"train_loss": -27.491857528686523, "global_step": 493387, "epoch": 5944} {"train_loss": -27.532535552978516, "global_step": 493388, "epoch": 5944} {"train_loss": -27.263092041015625, "global_step": 493389, "epoch": 5944} {"train_loss": -27.09848976135254, "global_step": 493390, "epoch": 5944} {"train_loss": -26.951215744018555, "global_step": 493391, "epoch": 5944} {"train_loss": -26.7512264251709, "global_step": 493392, "epoch": 5944} {"train_loss": -26.90508460998535, "global_step": 493393, "epoch": 5944} {"train_loss": -27.17469596862793, "global_step": 493394, "epoch": 5944} {"train_loss": -27.462507247924805, "global_step": 493395, "epoch": 5944} {"train_loss": -27.414777755737305, "global_step": 493396, "epoch": 5944} {"train_loss": -27.470746994018555, "global_step": 493397, "epoch": 5944} {"train_loss": -27.360248565673828, "global_step": 493398, "epoch": 5944} {"train_loss": -27.670984268188477, "global_step": 493399, "epoch": 5944} {"train_loss": -27.196796417236328, "global_step": 493400, "epoch": 5944} {"train_loss": -27.371051788330078, "global_step": 493401, "epoch": 5944} {"train_loss": -27.255634307861328, "global_step": 493402, "epoch": 5944} {"train_loss": -27.364133834838867, "global_step": 493403, "epoch": 5944} {"train_loss": -27.482023239135742, "global_step": 493404, "epoch": 5944} {"train_loss": -27.454975128173828, "global_step": 493405, "epoch": 5944} {"train_loss": -27.58009910583496, "global_step": 493406, "epoch": 5944} {"train_loss": -27.605371475219727, "global_step": 493407, "epoch": 5944} {"train_loss": -27.415851593017578, "global_step": 493408, "epoch": 5944} {"train_loss": -27.188779830932617, "global_step": 493409, "epoch": 5944} {"train_loss": -27.766468048095703, "global_step": 493410, "epoch": 5944} {"train_loss": -27.796630859375, "global_step": 493411, "epoch": 5944} {"train_loss": -27.32229995727539, "global_step": 493412, "epoch": 5944} {"train_loss": -27.0784969329834, "global_step": 493413, "epoch": 5944} {"train_loss": -27.59246253967285, "global_step": 493414, "epoch": 5944} {"train_loss": -27.17431640625, "global_step": 493415, "epoch": 5944} {"train_loss": -27.482147216796875, "global_step": 493416, "epoch": 5944} {"train_loss": -27.199857711791992, "global_step": 493417, "epoch": 5944} {"train_loss": -27.226797103881836, "global_step": 493418, "epoch": 5944} {"train_loss": -26.818252563476562, "global_step": 493419, "epoch": 5944} {"train_loss": -27.470067977905273, "global_step": 493420, "epoch": 5944} {"train_loss": -27.800628662109375, "global_step": 493421, "epoch": 5944} {"train_loss": -27.576923370361328, "global_step": 493422, "epoch": 5944} {"train_loss": -27.02508544921875, "global_step": 493423, "epoch": 5944} {"train_loss": -27.777814865112305, "global_step": 493424, "epoch": 5944} {"train_loss": -27.285184860229492, "global_step": 493425, "epoch": 5944} {"train_loss": -27.49932861328125, "global_step": 493426, "epoch": 5944} {"train_loss": -27.016813278198242, "global_step": 493427, "epoch": 5944} {"train_loss": -27.495481491088867, "global_step": 493428, "epoch": 5944} {"train_loss": -27.1259708404541, "global_step": 493429, "epoch": 5944} {"train_loss": -27.236974716186523, "global_step": 493430, "epoch": 5944} {"train_loss": -27.5631160736084, "global_step": 493431, "epoch": 5944} {"train_loss": -27.253570556640625, "global_step": 493432, "epoch": 5944} {"train_loss": -26.686124801635742, "global_step": 493433, "epoch": 5944} {"train_loss": -27.180619044476245, "global_step": 493434, "epoch": 5944, "val_loss": 6557331.0} {"train_loss": -25.9852237701416, "global_step": 493435, "epoch": 5945} {"train_loss": -25.8515567779541, "global_step": 493436, "epoch": 5945} {"train_loss": -27.0624942779541, "global_step": 493437, "epoch": 5945} {"train_loss": -26.47454261779785, "global_step": 493438, "epoch": 5945} {"train_loss": -26.250690460205078, "global_step": 493439, "epoch": 5945} {"train_loss": -26.94618034362793, "global_step": 493440, "epoch": 5945} {"train_loss": -26.14423179626465, "global_step": 493441, "epoch": 5945} {"train_loss": -26.714553833007812, "global_step": 493442, "epoch": 5945} {"train_loss": -26.535003662109375, "global_step": 493443, "epoch": 5945} {"train_loss": -26.50681495666504, "global_step": 493444, "epoch": 5945} {"train_loss": -26.32508659362793, "global_step": 493445, "epoch": 5945} {"train_loss": -26.878253936767578, "global_step": 493446, "epoch": 5945} {"train_loss": -27.0111083984375, "global_step": 493447, "epoch": 5945} {"train_loss": -27.118488311767578, "global_step": 493448, "epoch": 5945} {"train_loss": -26.644617080688477, "global_step": 493449, "epoch": 5945} {"train_loss": -27.148681640625, "global_step": 493450, "epoch": 5945} {"train_loss": -27.08734130859375, "global_step": 493451, "epoch": 5945} {"train_loss": -26.78004264831543, "global_step": 493452, "epoch": 5945} {"train_loss": -27.016233444213867, "global_step": 493453, "epoch": 5945} {"train_loss": -27.06467628479004, "global_step": 493454, "epoch": 5945} {"train_loss": -26.936798095703125, "global_step": 493455, "epoch": 5945} {"train_loss": -26.978361129760742, "global_step": 493456, "epoch": 5945} {"train_loss": -27.04876708984375, "global_step": 493457, "epoch": 5945} {"train_loss": -27.043073654174805, "global_step": 493458, "epoch": 5945} {"train_loss": -27.342493057250977, "global_step": 493459, "epoch": 5945} {"train_loss": -27.33465003967285, "global_step": 493460, "epoch": 5945} {"train_loss": -27.149744033813477, "global_step": 493461, "epoch": 5945} {"train_loss": -27.4427547454834, "global_step": 493462, "epoch": 5945} {"train_loss": -27.083206176757812, "global_step": 493463, "epoch": 5945} {"train_loss": -26.970386505126953, "global_step": 493464, "epoch": 5945} {"train_loss": -27.22023582458496, "global_step": 493465, "epoch": 5945} {"train_loss": -27.172351837158203, "global_step": 493466, "epoch": 5945} {"train_loss": -27.341938018798828, "global_step": 493467, "epoch": 5945} {"train_loss": -27.329450607299805, "global_step": 493468, "epoch": 5945} {"train_loss": -27.365427017211914, "global_step": 493469, "epoch": 5945} {"train_loss": -27.374876022338867, "global_step": 493470, "epoch": 5945} {"train_loss": -27.313690185546875, "global_step": 493471, "epoch": 5945} {"train_loss": -27.437397003173828, "global_step": 493472, "epoch": 5945} {"train_loss": -27.311460494995117, "global_step": 493473, "epoch": 5945} {"train_loss": -27.38168716430664, "global_step": 493474, "epoch": 5945} {"train_loss": -27.38892936706543, "global_step": 493475, "epoch": 5945} {"train_loss": -27.5445613861084, "global_step": 493476, "epoch": 5945} {"train_loss": -27.380218505859375, "global_step": 493477, "epoch": 5945} {"train_loss": -27.367145538330078, "global_step": 493478, "epoch": 5945} {"train_loss": -27.146087646484375, "global_step": 493479, "epoch": 5945} {"train_loss": -27.419097900390625, "global_step": 493480, "epoch": 5945} {"train_loss": -27.734989166259766, "global_step": 493481, "epoch": 5945} {"train_loss": -27.443647384643555, "global_step": 493482, "epoch": 5945} {"train_loss": -27.5057373046875, "global_step": 493483, "epoch": 5945} {"train_loss": -27.116300582885742, "global_step": 493484, "epoch": 5945} {"train_loss": -27.439844131469727, "global_step": 493485, "epoch": 5945} {"train_loss": -27.025815963745117, "global_step": 493486, "epoch": 5945} {"train_loss": -27.749399185180664, "global_step": 493487, "epoch": 5945} {"train_loss": -27.268354415893555, "global_step": 493488, "epoch": 5945} {"train_loss": -27.47310447692871, "global_step": 493489, "epoch": 5945} {"train_loss": -27.092859268188477, "global_step": 493490, "epoch": 5945} {"train_loss": -27.23133659362793, "global_step": 493491, "epoch": 5945} {"train_loss": -27.430395126342773, "global_step": 493492, "epoch": 5945} {"train_loss": -27.56324577331543, "global_step": 493493, "epoch": 5945} {"train_loss": -27.27314567565918, "global_step": 493494, "epoch": 5945} {"train_loss": -27.356237411499023, "global_step": 493495, "epoch": 5945} {"train_loss": -27.60993766784668, "global_step": 493496, "epoch": 5945} {"train_loss": -27.503870010375977, "global_step": 493497, "epoch": 5945} {"train_loss": -27.647165298461914, "global_step": 493498, "epoch": 5945} {"train_loss": -27.221952438354492, "global_step": 493499, "epoch": 5945} {"train_loss": -27.32889175415039, "global_step": 493500, "epoch": 5945} {"train_loss": -27.28203773498535, "global_step": 493501, "epoch": 5945} {"train_loss": -27.294544219970703, "global_step": 493502, "epoch": 5945} {"train_loss": -27.422637939453125, "global_step": 493503, "epoch": 5945} {"train_loss": -26.998310089111328, "global_step": 493504, "epoch": 5945} {"train_loss": -26.8419246673584, "global_step": 493505, "epoch": 5945} {"train_loss": -27.1544246673584, "global_step": 493506, "epoch": 5945} {"train_loss": -27.177717208862305, "global_step": 493507, "epoch": 5945} {"train_loss": -27.057886123657227, "global_step": 493508, "epoch": 5945} {"train_loss": -27.471115112304688, "global_step": 493509, "epoch": 5945} {"train_loss": -27.740766525268555, "global_step": 493510, "epoch": 5945} {"train_loss": -27.51264762878418, "global_step": 493511, "epoch": 5945} {"train_loss": -27.369104385375977, "global_step": 493512, "epoch": 5945} {"train_loss": -27.682153701782227, "global_step": 493513, "epoch": 5945} {"train_loss": -27.608905792236328, "global_step": 493514, "epoch": 5945} {"train_loss": -27.259235382080078, "global_step": 493515, "epoch": 5945} {"train_loss": -27.590423583984375, "global_step": 493516, "epoch": 5945} {"train_loss": -27.166725503392968, "global_step": 493517, "epoch": 5945, "val_loss": 6682488.0} {"train_loss": -27.059650421142578, "global_step": 493518, "epoch": 5946} {"train_loss": -27.0728816986084, "global_step": 493519, "epoch": 5946} {"train_loss": -27.486433029174805, "global_step": 493520, "epoch": 5946} {"train_loss": -27.022186279296875, "global_step": 493521, "epoch": 5946} {"train_loss": -27.065170288085938, "global_step": 493522, "epoch": 5946} {"train_loss": -26.98520851135254, "global_step": 493523, "epoch": 5946} {"train_loss": -27.019750595092773, "global_step": 493524, "epoch": 5946} {"train_loss": -27.31879997253418, "global_step": 493525, "epoch": 5946} {"train_loss": -27.050317764282227, "global_step": 493526, "epoch": 5946} {"train_loss": -27.198871612548828, "global_step": 493527, "epoch": 5946} {"train_loss": -27.344709396362305, "global_step": 493528, "epoch": 5946} {"train_loss": -27.083189010620117, "global_step": 493529, "epoch": 5946} {"train_loss": -27.189626693725586, "global_step": 493530, "epoch": 5946} {"train_loss": -27.643054962158203, "global_step": 493531, "epoch": 5946} {"train_loss": -26.942707061767578, "global_step": 493532, "epoch": 5946} {"train_loss": -27.2418212890625, "global_step": 493533, "epoch": 5946} {"train_loss": -27.291635513305664, "global_step": 493534, "epoch": 5946} {"train_loss": -27.404052734375, "global_step": 493535, "epoch": 5946} {"train_loss": -26.9990234375, "global_step": 493536, "epoch": 5946} {"train_loss": -27.000654220581055, "global_step": 493537, "epoch": 5946} {"train_loss": -27.396350860595703, "global_step": 493538, "epoch": 5946} {"train_loss": -27.448593139648438, "global_step": 493539, "epoch": 5946} {"train_loss": -27.632781982421875, "global_step": 493540, "epoch": 5946} {"train_loss": -27.5308780670166, "global_step": 493541, "epoch": 5946} {"train_loss": -27.513751983642578, "global_step": 493542, "epoch": 5946} {"train_loss": -27.226673126220703, "global_step": 493543, "epoch": 5946} {"train_loss": -27.318639755249023, "global_step": 493544, "epoch": 5946} {"train_loss": -27.473159790039062, "global_step": 493545, "epoch": 5946} {"train_loss": -27.17598533630371, "global_step": 493546, "epoch": 5946} {"train_loss": -27.156091690063477, "global_step": 493547, "epoch": 5946} {"train_loss": -27.586200714111328, "global_step": 493548, "epoch": 5946} {"train_loss": -27.530780792236328, "global_step": 493549, "epoch": 5946} {"train_loss": -27.5791072845459, "global_step": 493550, "epoch": 5946} {"train_loss": -27.53426170349121, "global_step": 493551, "epoch": 5946} {"train_loss": -27.454492568969727, "global_step": 493552, "epoch": 5946} {"train_loss": -27.50086784362793, "global_step": 493553, "epoch": 5946} {"train_loss": -27.40633201599121, "global_step": 493554, "epoch": 5946} {"train_loss": -27.455541610717773, "global_step": 493555, "epoch": 5946} {"train_loss": -27.380447387695312, "global_step": 493556, "epoch": 5946} {"train_loss": -27.461685180664062, "global_step": 493557, "epoch": 5946} {"train_loss": -27.35029411315918, "global_step": 493558, "epoch": 5946} {"train_loss": -27.560565948486328, "global_step": 493559, "epoch": 5946} {"train_loss": -27.652372360229492, "global_step": 493560, "epoch": 5946} {"train_loss": -27.369699478149414, "global_step": 493561, "epoch": 5946} {"train_loss": -27.361539840698242, "global_step": 493562, "epoch": 5946} {"train_loss": -27.307296752929688, "global_step": 493563, "epoch": 5946} {"train_loss": -27.218860626220703, "global_step": 493564, "epoch": 5946} {"train_loss": -27.123632431030273, "global_step": 493565, "epoch": 5946} {"train_loss": -27.578710556030273, "global_step": 493566, "epoch": 5946} {"train_loss": -27.31985855102539, "global_step": 493567, "epoch": 5946} {"train_loss": -27.320348739624023, "global_step": 493568, "epoch": 5946} {"train_loss": -26.784971237182617, "global_step": 493569, "epoch": 5946} {"train_loss": -27.123807907104492, "global_step": 493570, "epoch": 5946} {"train_loss": -27.120962142944336, "global_step": 493571, "epoch": 5946} {"train_loss": -27.054540634155273, "global_step": 493572, "epoch": 5946} {"train_loss": -26.70656394958496, "global_step": 493573, "epoch": 5946} {"train_loss": -27.36844825744629, "global_step": 493574, "epoch": 5946} {"train_loss": -27.051685333251953, "global_step": 493575, "epoch": 5946} {"train_loss": -27.136877059936523, "global_step": 493576, "epoch": 5946} {"train_loss": -27.075519561767578, "global_step": 493577, "epoch": 5946} {"train_loss": -27.438430786132812, "global_step": 493578, "epoch": 5946} {"train_loss": -27.185333251953125, "global_step": 493579, "epoch": 5946} {"train_loss": -27.18401527404785, "global_step": 493580, "epoch": 5946} {"train_loss": -27.071699142456055, "global_step": 493581, "epoch": 5946} {"train_loss": -27.00383949279785, "global_step": 493582, "epoch": 5946} {"train_loss": -27.055822372436523, "global_step": 493583, "epoch": 5946} {"train_loss": -27.224781036376953, "global_step": 493584, "epoch": 5946} {"train_loss": -27.379316329956055, "global_step": 493585, "epoch": 5946} {"train_loss": -27.12982177734375, "global_step": 493586, "epoch": 5946} {"train_loss": -27.215576171875, "global_step": 493587, "epoch": 5946} {"train_loss": -27.4329891204834, "global_step": 493588, "epoch": 5946} {"train_loss": -27.436603546142578, "global_step": 493589, "epoch": 5946} {"train_loss": -26.8740177154541, "global_step": 493590, "epoch": 5946} {"train_loss": -27.368024826049805, "global_step": 493591, "epoch": 5946} {"train_loss": -27.020429611206055, "global_step": 493592, "epoch": 5946} {"train_loss": -27.069839477539062, "global_step": 493593, "epoch": 5946} {"train_loss": -27.432540893554688, "global_step": 493594, "epoch": 5946} {"train_loss": -27.23286247253418, "global_step": 493595, "epoch": 5946} {"train_loss": -27.263931274414062, "global_step": 493596, "epoch": 5946} {"train_loss": -27.596349716186523, "global_step": 493597, "epoch": 5946} {"train_loss": -27.2112979888916, "global_step": 493598, "epoch": 5946} {"train_loss": -27.15704917907715, "global_step": 493599, "epoch": 5946} {"train_loss": -27.27067499275667, "global_step": 493600, "epoch": 5946, "val_loss": 6624350.0} {"train_loss": -26.866790771484375, "global_step": 493601, "epoch": 5947} {"train_loss": -26.833179473876953, "global_step": 493602, "epoch": 5947} {"train_loss": -27.000396728515625, "global_step": 493603, "epoch": 5947} {"train_loss": -26.56867790222168, "global_step": 493604, "epoch": 5947} {"train_loss": -26.868284225463867, "global_step": 493605, "epoch": 5947} {"train_loss": -26.618906021118164, "global_step": 493606, "epoch": 5947} {"train_loss": -27.121967315673828, "global_step": 493607, "epoch": 5947} {"train_loss": -26.943220138549805, "global_step": 493608, "epoch": 5947} {"train_loss": -26.505115509033203, "global_step": 493609, "epoch": 5947} {"train_loss": -26.928058624267578, "global_step": 493610, "epoch": 5947} {"train_loss": -26.980670928955078, "global_step": 493611, "epoch": 5947} {"train_loss": -26.865076065063477, "global_step": 493612, "epoch": 5947} {"train_loss": -27.01239013671875, "global_step": 493613, "epoch": 5947} {"train_loss": -26.858489990234375, "global_step": 493614, "epoch": 5947} {"train_loss": -26.974029541015625, "global_step": 493615, "epoch": 5947} {"train_loss": -26.948888778686523, "global_step": 493616, "epoch": 5947} {"train_loss": -27.378355026245117, "global_step": 493617, "epoch": 5947} {"train_loss": -27.009485244750977, "global_step": 493618, "epoch": 5947} {"train_loss": -27.121353149414062, "global_step": 493619, "epoch": 5947} {"train_loss": -27.358083724975586, "global_step": 493620, "epoch": 5947} {"train_loss": -27.02606773376465, "global_step": 493621, "epoch": 5947} {"train_loss": -26.9605655670166, "global_step": 493622, "epoch": 5947} {"train_loss": -27.48529624938965, "global_step": 493623, "epoch": 5947} {"train_loss": -26.888351440429688, "global_step": 493624, "epoch": 5947} {"train_loss": -26.98533058166504, "global_step": 493625, "epoch": 5947} {"train_loss": -26.526403427124023, "global_step": 493626, "epoch": 5947} {"train_loss": -27.33087730407715, "global_step": 493627, "epoch": 5947} {"train_loss": -27.435346603393555, "global_step": 493628, "epoch": 5947} {"train_loss": -27.2496280670166, "global_step": 493629, "epoch": 5947} {"train_loss": -27.2333927154541, "global_step": 493630, "epoch": 5947} {"train_loss": -27.255054473876953, "global_step": 493631, "epoch": 5947} {"train_loss": -27.2476863861084, "global_step": 493632, "epoch": 5947} {"train_loss": -27.12151527404785, "global_step": 493633, "epoch": 5947} {"train_loss": -27.220006942749023, "global_step": 493634, "epoch": 5947} {"train_loss": -27.417409896850586, "global_step": 493635, "epoch": 5947} {"train_loss": -27.346790313720703, "global_step": 493636, "epoch": 5947} {"train_loss": -27.531171798706055, "global_step": 493637, "epoch": 5947} {"train_loss": -27.31393814086914, "global_step": 493638, "epoch": 5947} {"train_loss": -27.18241310119629, "global_step": 493639, "epoch": 5947} {"train_loss": -27.14473533630371, "global_step": 493640, "epoch": 5947} {"train_loss": -27.43655776977539, "global_step": 493641, "epoch": 5947} {"train_loss": -27.33579444885254, "global_step": 493642, "epoch": 5947} {"train_loss": -27.429189682006836, "global_step": 493643, "epoch": 5947} {"train_loss": -27.00341796875, "global_step": 493644, "epoch": 5947} {"train_loss": -27.1845703125, "global_step": 493645, "epoch": 5947} {"train_loss": -27.340290069580078, "global_step": 493646, "epoch": 5947} {"train_loss": -27.416675567626953, "global_step": 493647, "epoch": 5947} {"train_loss": -27.25581932067871, "global_step": 493648, "epoch": 5947} {"train_loss": -27.16471290588379, "global_step": 493649, "epoch": 5947} {"train_loss": -27.27716636657715, "global_step": 493650, "epoch": 5947} {"train_loss": -27.126510620117188, "global_step": 493651, "epoch": 5947} {"train_loss": -27.798675537109375, "global_step": 493652, "epoch": 5947} {"train_loss": -27.7292537689209, "global_step": 493653, "epoch": 5947} {"train_loss": -27.417621612548828, "global_step": 493654, "epoch": 5947} {"train_loss": -27.53596305847168, "global_step": 493655, "epoch": 5947} {"train_loss": -27.292829513549805, "global_step": 493656, "epoch": 5947} {"train_loss": -27.888065338134766, "global_step": 493657, "epoch": 5947} {"train_loss": -27.175168991088867, "global_step": 493658, "epoch": 5947} {"train_loss": -27.46366310119629, "global_step": 493659, "epoch": 5947} {"train_loss": -27.790699005126953, "global_step": 493660, "epoch": 5947} {"train_loss": -27.60906982421875, "global_step": 493661, "epoch": 5947} {"train_loss": -27.545515060424805, "global_step": 493662, "epoch": 5947} {"train_loss": -27.396671295166016, "global_step": 493663, "epoch": 5947} {"train_loss": -27.665863037109375, "global_step": 493664, "epoch": 5947} {"train_loss": -27.508899688720703, "global_step": 493665, "epoch": 5947} {"train_loss": -27.05292320251465, "global_step": 493666, "epoch": 5947} {"train_loss": -27.34989356994629, "global_step": 493667, "epoch": 5947} {"train_loss": -27.40337562561035, "global_step": 493668, "epoch": 5947} {"train_loss": -27.196075439453125, "global_step": 493669, "epoch": 5947} {"train_loss": -27.204578399658203, "global_step": 493670, "epoch": 5947} {"train_loss": -27.28753662109375, "global_step": 493671, "epoch": 5947} {"train_loss": -27.05194664001465, "global_step": 493672, "epoch": 5947} {"train_loss": -27.193517684936523, "global_step": 493673, "epoch": 5947} {"train_loss": -27.079294204711914, "global_step": 493674, "epoch": 5947} {"train_loss": -26.825153350830078, "global_step": 493675, "epoch": 5947} {"train_loss": -27.467477798461914, "global_step": 493676, "epoch": 5947} {"train_loss": -27.18165397644043, "global_step": 493677, "epoch": 5947} {"train_loss": -27.440275192260742, "global_step": 493678, "epoch": 5947} {"train_loss": -26.704870223999023, "global_step": 493679, "epoch": 5947} {"train_loss": -26.815540313720703, "global_step": 493680, "epoch": 5947} {"train_loss": -27.03358268737793, "global_step": 493681, "epoch": 5947} {"train_loss": -27.515928268432617, "global_step": 493682, "epoch": 5947} {"train_loss": -27.183420319155037, "global_step": 493683, "epoch": 5947, "val_loss": 6575182.0} {"train_loss": -26.923376083374023, "global_step": 493684, "epoch": 5948} {"train_loss": -27.299762725830078, "global_step": 493685, "epoch": 5948} {"train_loss": -26.839406967163086, "global_step": 493686, "epoch": 5948} {"train_loss": -27.169864654541016, "global_step": 493687, "epoch": 5948} {"train_loss": -27.157520294189453, "global_step": 493688, "epoch": 5948} {"train_loss": -26.971221923828125, "global_step": 493689, "epoch": 5948} {"train_loss": -26.982641220092773, "global_step": 493690, "epoch": 5948} {"train_loss": -27.140974044799805, "global_step": 493691, "epoch": 5948} {"train_loss": -26.886280059814453, "global_step": 493692, "epoch": 5948} {"train_loss": -27.25868797302246, "global_step": 493693, "epoch": 5948} {"train_loss": -27.191694259643555, "global_step": 493694, "epoch": 5948} {"train_loss": -26.828107833862305, "global_step": 493695, "epoch": 5948} {"train_loss": -27.266462326049805, "global_step": 493696, "epoch": 5948} {"train_loss": -26.837665557861328, "global_step": 493697, "epoch": 5948} {"train_loss": -27.159887313842773, "global_step": 493698, "epoch": 5948} {"train_loss": -27.223546981811523, "global_step": 493699, "epoch": 5948} {"train_loss": -27.38714599609375, "global_step": 493700, "epoch": 5948} {"train_loss": -26.838449478149414, "global_step": 493701, "epoch": 5948} {"train_loss": -26.9979190826416, "global_step": 493702, "epoch": 5948} {"train_loss": -27.051034927368164, "global_step": 493703, "epoch": 5948} {"train_loss": -27.51837158203125, "global_step": 493704, "epoch": 5948} {"train_loss": -27.21831703186035, "global_step": 493705, "epoch": 5948} {"train_loss": -26.798059463500977, "global_step": 493706, "epoch": 5948} {"train_loss": -26.879119873046875, "global_step": 493707, "epoch": 5948} {"train_loss": -27.207311630249023, "global_step": 493708, "epoch": 5948} {"train_loss": -27.547208786010742, "global_step": 493709, "epoch": 5948} {"train_loss": -27.013540267944336, "global_step": 493710, "epoch": 5948} {"train_loss": -27.17915916442871, "global_step": 493711, "epoch": 5948} {"train_loss": -27.320758819580078, "global_step": 493712, "epoch": 5948} {"train_loss": -27.308765411376953, "global_step": 493713, "epoch": 5948} {"train_loss": -27.5087833404541, "global_step": 493714, "epoch": 5948} {"train_loss": -27.567121505737305, "global_step": 493715, "epoch": 5948} {"train_loss": -27.006223678588867, "global_step": 493716, "epoch": 5948} {"train_loss": -27.432233810424805, "global_step": 493717, "epoch": 5948} {"train_loss": -27.370594024658203, "global_step": 493718, "epoch": 5948} {"train_loss": -27.30242347717285, "global_step": 493719, "epoch": 5948} {"train_loss": -27.42856216430664, "global_step": 493720, "epoch": 5948} {"train_loss": -27.2574405670166, "global_step": 493721, "epoch": 5948} {"train_loss": -27.590131759643555, "global_step": 493722, "epoch": 5948} {"train_loss": -27.564666748046875, "global_step": 493723, "epoch": 5948} {"train_loss": -27.398218154907227, "global_step": 493724, "epoch": 5948} {"train_loss": -27.35127067565918, "global_step": 493725, "epoch": 5948} {"train_loss": -27.442296981811523, "global_step": 493726, "epoch": 5948} {"train_loss": -27.669397354125977, "global_step": 493727, "epoch": 5948} {"train_loss": -27.532114028930664, "global_step": 493728, "epoch": 5948} {"train_loss": -27.2889404296875, "global_step": 493729, "epoch": 5948} {"train_loss": -27.37220573425293, "global_step": 493730, "epoch": 5948} {"train_loss": -27.422086715698242, "global_step": 493731, "epoch": 5948} {"train_loss": -27.386167526245117, "global_step": 493732, "epoch": 5948} {"train_loss": -27.845380783081055, "global_step": 493733, "epoch": 5948} {"train_loss": -27.462804794311523, "global_step": 493734, "epoch": 5948} {"train_loss": -27.443256378173828, "global_step": 493735, "epoch": 5948} {"train_loss": -27.499784469604492, "global_step": 493736, "epoch": 5948} {"train_loss": -27.628376007080078, "global_step": 493737, "epoch": 5948} {"train_loss": -27.45448112487793, "global_step": 493738, "epoch": 5948} {"train_loss": -27.60764503479004, "global_step": 493739, "epoch": 5948} {"train_loss": -27.555572509765625, "global_step": 493740, "epoch": 5948} {"train_loss": -27.52948570251465, "global_step": 493741, "epoch": 5948} {"train_loss": -27.3209228515625, "global_step": 493742, "epoch": 5948} {"train_loss": -27.3709659576416, "global_step": 493743, "epoch": 5948} {"train_loss": -27.546552658081055, "global_step": 493744, "epoch": 5948} {"train_loss": -27.5247859954834, "global_step": 493745, "epoch": 5948} {"train_loss": -27.192556381225586, "global_step": 493746, "epoch": 5948} {"train_loss": -26.912885665893555, "global_step": 493747, "epoch": 5948} {"train_loss": -26.502256393432617, "global_step": 493748, "epoch": 5948} {"train_loss": -26.731897354125977, "global_step": 493749, "epoch": 5948} {"train_loss": -27.052793502807617, "global_step": 493750, "epoch": 5948} {"train_loss": -26.871810913085938, "global_step": 493751, "epoch": 5948} {"train_loss": -27.28407096862793, "global_step": 493752, "epoch": 5948} {"train_loss": -27.572189331054688, "global_step": 493753, "epoch": 5948} {"train_loss": -27.104772567749023, "global_step": 493754, "epoch": 5948} {"train_loss": -27.590179443359375, "global_step": 493755, "epoch": 5948} {"train_loss": -27.4107723236084, "global_step": 493756, "epoch": 5948} {"train_loss": -27.500961303710938, "global_step": 493757, "epoch": 5948} {"train_loss": -27.389484405517578, "global_step": 493758, "epoch": 5948} {"train_loss": -27.07411003112793, "global_step": 493759, "epoch": 5948} {"train_loss": -27.20480728149414, "global_step": 493760, "epoch": 5948} {"train_loss": -27.5977840423584, "global_step": 493761, "epoch": 5948} {"train_loss": -27.395963668823242, "global_step": 493762, "epoch": 5948} {"train_loss": -27.09673500061035, "global_step": 493763, "epoch": 5948} {"train_loss": -27.320022583007812, "global_step": 493764, "epoch": 5948} {"train_loss": -27.37774085998535, "global_step": 493765, "epoch": 5948} {"train_loss": -27.275423739329877, "global_step": 493766, "epoch": 5948, "val_loss": 6635173.0} {"train_loss": -26.948225021362305, "global_step": 493767, "epoch": 5949} {"train_loss": -26.18181800842285, "global_step": 493768, "epoch": 5949} {"train_loss": -26.747547149658203, "global_step": 493769, "epoch": 5949} {"train_loss": -26.816259384155273, "global_step": 493770, "epoch": 5949} {"train_loss": -26.3656005859375, "global_step": 493771, "epoch": 5949} {"train_loss": -26.81646156311035, "global_step": 493772, "epoch": 5949} {"train_loss": -26.776718139648438, "global_step": 493773, "epoch": 5949} {"train_loss": -26.241230010986328, "global_step": 493774, "epoch": 5949} {"train_loss": -26.990055084228516, "global_step": 493775, "epoch": 5949} {"train_loss": -26.443195343017578, "global_step": 493776, "epoch": 5949} {"train_loss": -26.937244415283203, "global_step": 493777, "epoch": 5949} {"train_loss": -26.60239028930664, "global_step": 493778, "epoch": 5949} {"train_loss": -27.060596466064453, "global_step": 493779, "epoch": 5949} {"train_loss": -27.528867721557617, "global_step": 493780, "epoch": 5949} {"train_loss": -26.983545303344727, "global_step": 493781, "epoch": 5949} {"train_loss": -26.958662033081055, "global_step": 493782, "epoch": 5949} {"train_loss": -26.833871841430664, "global_step": 493783, "epoch": 5949} {"train_loss": -26.94338035583496, "global_step": 493784, "epoch": 5949} {"train_loss": -26.972997665405273, "global_step": 493785, "epoch": 5949} {"train_loss": -27.077661514282227, "global_step": 493786, "epoch": 5949} {"train_loss": -26.90533447265625, "global_step": 493787, "epoch": 5949} {"train_loss": -27.005163192749023, "global_step": 493788, "epoch": 5949} {"train_loss": -26.96356773376465, "global_step": 493789, "epoch": 5949} {"train_loss": -27.262760162353516, "global_step": 493790, "epoch": 5949} {"train_loss": -26.96278190612793, "global_step": 493791, "epoch": 5949} {"train_loss": -27.060705184936523, "global_step": 493792, "epoch": 5949} {"train_loss": -27.073749542236328, "global_step": 493793, "epoch": 5949} {"train_loss": -27.190692901611328, "global_step": 493794, "epoch": 5949} {"train_loss": -27.05964469909668, "global_step": 493795, "epoch": 5949} {"train_loss": -27.062335968017578, "global_step": 493796, "epoch": 5949} {"train_loss": -27.121383666992188, "global_step": 493797, "epoch": 5949} {"train_loss": -27.7396297454834, "global_step": 493798, "epoch": 5949} {"train_loss": -27.13689613342285, "global_step": 493799, "epoch": 5949} {"train_loss": -27.0651798248291, "global_step": 493800, "epoch": 5949} {"train_loss": -27.141061782836914, "global_step": 493801, "epoch": 5949} {"train_loss": -27.06510353088379, "global_step": 493802, "epoch": 5949} {"train_loss": -27.29360008239746, "global_step": 493803, "epoch": 5949} {"train_loss": -27.320154190063477, "global_step": 493804, "epoch": 5949} {"train_loss": -27.406421661376953, "global_step": 493805, "epoch": 5949} {"train_loss": -27.54896354675293, "global_step": 493806, "epoch": 5949} {"train_loss": -27.3164119720459, "global_step": 493807, "epoch": 5949} {"train_loss": -27.087127685546875, "global_step": 493808, "epoch": 5949} {"train_loss": -27.367084503173828, "global_step": 493809, "epoch": 5949} {"train_loss": -27.200611114501953, "global_step": 493810, "epoch": 5949} {"train_loss": -27.314971923828125, "global_step": 493811, "epoch": 5949} {"train_loss": -27.50275230407715, "global_step": 493812, "epoch": 5949} {"train_loss": -27.64507484436035, "global_step": 493813, "epoch": 5949} {"train_loss": -27.179840087890625, "global_step": 493814, "epoch": 5949} {"train_loss": -27.191598892211914, "global_step": 493815, "epoch": 5949} {"train_loss": -27.344518661499023, "global_step": 493816, "epoch": 5949} {"train_loss": -27.574811935424805, "global_step": 493817, "epoch": 5949} {"train_loss": -27.4256649017334, "global_step": 493818, "epoch": 5949} {"train_loss": -27.781774520874023, "global_step": 493819, "epoch": 5949} {"train_loss": -27.477481842041016, "global_step": 493820, "epoch": 5949} {"train_loss": -27.181360244750977, "global_step": 493821, "epoch": 5949} {"train_loss": -26.462921142578125, "global_step": 493822, "epoch": 5949} {"train_loss": -27.011947631835938, "global_step": 493823, "epoch": 5949} {"train_loss": -27.32465171813965, "global_step": 493824, "epoch": 5949} {"train_loss": -27.57062339782715, "global_step": 493825, "epoch": 5949} {"train_loss": -27.15791893005371, "global_step": 493826, "epoch": 5949} {"train_loss": -27.232080459594727, "global_step": 493827, "epoch": 5949} {"train_loss": -27.512725830078125, "global_step": 493828, "epoch": 5949} {"train_loss": -27.37200355529785, "global_step": 493829, "epoch": 5949} {"train_loss": -26.87434196472168, "global_step": 493830, "epoch": 5949} {"train_loss": -26.821548461914062, "global_step": 493831, "epoch": 5949} {"train_loss": -26.820138931274414, "global_step": 493832, "epoch": 5949} {"train_loss": -27.087177276611328, "global_step": 493833, "epoch": 5949} {"train_loss": -27.16219139099121, "global_step": 493834, "epoch": 5949} {"train_loss": -26.616912841796875, "global_step": 493835, "epoch": 5949} {"train_loss": -27.370086669921875, "global_step": 493836, "epoch": 5949} {"train_loss": -27.2805233001709, "global_step": 493837, "epoch": 5949} {"train_loss": -26.69317626953125, "global_step": 493838, "epoch": 5949} {"train_loss": -27.4775447845459, "global_step": 493839, "epoch": 5949} {"train_loss": -26.944690704345703, "global_step": 493840, "epoch": 5949} {"train_loss": -26.991886138916016, "global_step": 493841, "epoch": 5949} {"train_loss": -26.953006744384766, "global_step": 493842, "epoch": 5949} {"train_loss": -27.269256591796875, "global_step": 493843, "epoch": 5949} {"train_loss": -27.23910903930664, "global_step": 493844, "epoch": 5949} {"train_loss": -26.933120727539062, "global_step": 493845, "epoch": 5949} {"train_loss": -26.762540817260742, "global_step": 493846, "epoch": 5949} {"train_loss": -27.061664581298828, "global_step": 493847, "epoch": 5949} {"train_loss": -27.108280181884766, "global_step": 493848, "epoch": 5949} {"train_loss": -27.089101308799652, "global_step": 493849, "epoch": 5949, "val_loss": 6591611.0} {"train_loss": -26.38100242614746, "global_step": 493850, "epoch": 5950} {"train_loss": -26.2917537689209, "global_step": 493851, "epoch": 5950} {"train_loss": -26.725189208984375, "global_step": 493852, "epoch": 5950} {"train_loss": -26.573781967163086, "global_step": 493853, "epoch": 5950} {"train_loss": -26.673175811767578, "global_step": 493854, "epoch": 5950} {"train_loss": -26.58638572692871, "global_step": 493855, "epoch": 5950} {"train_loss": -26.267139434814453, "global_step": 493856, "epoch": 5950} {"train_loss": -26.721860885620117, "global_step": 493857, "epoch": 5950} {"train_loss": -26.720611572265625, "global_step": 493858, "epoch": 5950} {"train_loss": -26.897388458251953, "global_step": 493859, "epoch": 5950} {"train_loss": -27.07865333557129, "global_step": 493860, "epoch": 5950} {"train_loss": -26.692569732666016, "global_step": 493861, "epoch": 5950} {"train_loss": -27.396963119506836, "global_step": 493862, "epoch": 5950} {"train_loss": -26.7669734954834, "global_step": 493863, "epoch": 5950} {"train_loss": -27.0467472076416, "global_step": 493864, "epoch": 5950} {"train_loss": -27.215240478515625, "global_step": 493865, "epoch": 5950} {"train_loss": -27.103906631469727, "global_step": 493866, "epoch": 5950} {"train_loss": -27.06756019592285, "global_step": 493867, "epoch": 5950} {"train_loss": -27.229345321655273, "global_step": 493868, "epoch": 5950} {"train_loss": -27.258291244506836, "global_step": 493869, "epoch": 5950} {"train_loss": -27.464923858642578, "global_step": 493870, "epoch": 5950} {"train_loss": -26.951629638671875, "global_step": 493871, "epoch": 5950} {"train_loss": -27.458642959594727, "global_step": 493872, "epoch": 5950} {"train_loss": -27.337926864624023, "global_step": 493873, "epoch": 5950} {"train_loss": -26.975080490112305, "global_step": 493874, "epoch": 5950} {"train_loss": -27.397415161132812, "global_step": 493875, "epoch": 5950} {"train_loss": -27.389083862304688, "global_step": 493876, "epoch": 5950} {"train_loss": -27.21343994140625, "global_step": 493877, "epoch": 5950} {"train_loss": -27.186498641967773, "global_step": 493878, "epoch": 5950} {"train_loss": -27.60633659362793, "global_step": 493879, "epoch": 5950} {"train_loss": -27.39896583557129, "global_step": 493880, "epoch": 5950} {"train_loss": -27.42959976196289, "global_step": 493881, "epoch": 5950} {"train_loss": -27.27796745300293, "global_step": 493882, "epoch": 5950} {"train_loss": -27.043561935424805, "global_step": 493883, "epoch": 5950} {"train_loss": -27.392913818359375, "global_step": 493884, "epoch": 5950} {"train_loss": -27.598554611206055, "global_step": 493885, "epoch": 5950} {"train_loss": -27.360523223876953, "global_step": 493886, "epoch": 5950} {"train_loss": -27.000934600830078, "global_step": 493887, "epoch": 5950} {"train_loss": -27.416919708251953, "global_step": 493888, "epoch": 5950} {"train_loss": -27.266759872436523, "global_step": 493889, "epoch": 5950} {"train_loss": -27.235504150390625, "global_step": 493890, "epoch": 5950} {"train_loss": -27.26365089416504, "global_step": 493891, "epoch": 5950} {"train_loss": -27.435977935791016, "global_step": 493892, "epoch": 5950} {"train_loss": -27.304243087768555, "global_step": 493893, "epoch": 5950} {"train_loss": -27.299962997436523, "global_step": 493894, "epoch": 5950} {"train_loss": -27.234851837158203, "global_step": 493895, "epoch": 5950} {"train_loss": -27.321319580078125, "global_step": 493896, "epoch": 5950} {"train_loss": -27.655805587768555, "global_step": 493897, "epoch": 5950} {"train_loss": -27.332563400268555, "global_step": 493898, "epoch": 5950} {"train_loss": -27.652191162109375, "global_step": 493899, "epoch": 5950} {"train_loss": -27.318744659423828, "global_step": 493900, "epoch": 5950} {"train_loss": -27.5278263092041, "global_step": 493901, "epoch": 5950} {"train_loss": -27.070409774780273, "global_step": 493902, "epoch": 5950} {"train_loss": -26.948776245117188, "global_step": 493903, "epoch": 5950} {"train_loss": -27.318883895874023, "global_step": 493904, "epoch": 5950} {"train_loss": -27.612075805664062, "global_step": 493905, "epoch": 5950} {"train_loss": -26.895282745361328, "global_step": 493906, "epoch": 5950} {"train_loss": -26.536161422729492, "global_step": 493907, "epoch": 5950} {"train_loss": -26.9716854095459, "global_step": 493908, "epoch": 5950} {"train_loss": -27.255878448486328, "global_step": 493909, "epoch": 5950} {"train_loss": -27.096210479736328, "global_step": 493910, "epoch": 5950} {"train_loss": -27.525959014892578, "global_step": 493911, "epoch": 5950} {"train_loss": -26.7720947265625, "global_step": 493912, "epoch": 5950} {"train_loss": -27.422821044921875, "global_step": 493913, "epoch": 5950} {"train_loss": -27.170515060424805, "global_step": 493914, "epoch": 5950} {"train_loss": -27.403234481811523, "global_step": 493915, "epoch": 5950} {"train_loss": -26.95771598815918, "global_step": 493916, "epoch": 5950} {"train_loss": -27.650318145751953, "global_step": 493917, "epoch": 5950} {"train_loss": -27.18678855895996, "global_step": 493918, "epoch": 5950} {"train_loss": -26.9351806640625, "global_step": 493919, "epoch": 5950} {"train_loss": -27.27606773376465, "global_step": 493920, "epoch": 5950} {"train_loss": -27.091039657592773, "global_step": 493921, "epoch": 5950} {"train_loss": -26.412750244140625, "global_step": 493922, "epoch": 5950} {"train_loss": -26.637720108032227, "global_step": 493923, "epoch": 5950} {"train_loss": -27.102338790893555, "global_step": 493924, "epoch": 5950} {"train_loss": -26.32459831237793, "global_step": 493925, "epoch": 5950} {"train_loss": -26.899694442749023, "global_step": 493926, "epoch": 5950} {"train_loss": -27.321035385131836, "global_step": 493927, "epoch": 5950} {"train_loss": -26.9144344329834, "global_step": 493928, "epoch": 5950} {"train_loss": -27.045408248901367, "global_step": 493929, "epoch": 5950} {"train_loss": -26.997589111328125, "global_step": 493930, "epoch": 5950} {"train_loss": -27.296279907226562, "global_step": 493931, "epoch": 5950} {"train_loss": -27.11168831515025, "global_step": 493932, "epoch": 5950, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6664158.5} {"train_loss": -26.278623580932617, "global_step": 493933, "epoch": 5951} {"train_loss": -26.222482681274414, "global_step": 493934, "epoch": 5951} {"train_loss": -26.5052547454834, "global_step": 493935, "epoch": 5951} {"train_loss": -26.053882598876953, "global_step": 493936, "epoch": 5951} {"train_loss": -26.521909713745117, "global_step": 493937, "epoch": 5951} {"train_loss": -26.33077049255371, "global_step": 493938, "epoch": 5951} {"train_loss": -26.497236251831055, "global_step": 493939, "epoch": 5951} {"train_loss": -26.683155059814453, "global_step": 493940, "epoch": 5951} {"train_loss": -26.71368980407715, "global_step": 493941, "epoch": 5951} {"train_loss": -26.678640365600586, "global_step": 493942, "epoch": 5951} {"train_loss": -26.95222282409668, "global_step": 493943, "epoch": 5951} {"train_loss": -26.865570068359375, "global_step": 493944, "epoch": 5951} {"train_loss": -27.048725128173828, "global_step": 493945, "epoch": 5951} {"train_loss": -26.886167526245117, "global_step": 493946, "epoch": 5951} {"train_loss": -27.242101669311523, "global_step": 493947, "epoch": 5951} {"train_loss": -27.03179931640625, "global_step": 493948, "epoch": 5951} {"train_loss": -27.22772789001465, "global_step": 493949, "epoch": 5951} {"train_loss": -27.137374877929688, "global_step": 493950, "epoch": 5951} {"train_loss": -27.016942977905273, "global_step": 493951, "epoch": 5951} {"train_loss": -27.38982582092285, "global_step": 493952, "epoch": 5951} {"train_loss": -27.009443283081055, "global_step": 493953, "epoch": 5951} {"train_loss": -26.917041778564453, "global_step": 493954, "epoch": 5951} {"train_loss": -27.168994903564453, "global_step": 493955, "epoch": 5951} {"train_loss": -27.221466064453125, "global_step": 493956, "epoch": 5951} {"train_loss": -27.3129825592041, "global_step": 493957, "epoch": 5951} {"train_loss": -27.15985679626465, "global_step": 493958, "epoch": 5951} {"train_loss": -27.48406982421875, "global_step": 493959, "epoch": 5951} {"train_loss": -27.205001831054688, "global_step": 493960, "epoch": 5951} {"train_loss": -27.44390869140625, "global_step": 493961, "epoch": 5951} {"train_loss": -27.179906845092773, "global_step": 493962, "epoch": 5951} {"train_loss": -27.494749069213867, "global_step": 493963, "epoch": 5951} {"train_loss": -27.086938858032227, "global_step": 493964, "epoch": 5951} {"train_loss": -27.40756607055664, "global_step": 493965, "epoch": 5951} {"train_loss": -27.353063583374023, "global_step": 493966, "epoch": 5951} {"train_loss": -27.314990997314453, "global_step": 493967, "epoch": 5951} {"train_loss": -27.211505889892578, "global_step": 493968, "epoch": 5951} {"train_loss": -27.399866104125977, "global_step": 493969, "epoch": 5951} {"train_loss": -27.103784561157227, "global_step": 493970, "epoch": 5951} {"train_loss": -27.677078247070312, "global_step": 493971, "epoch": 5951} {"train_loss": -27.54012107849121, "global_step": 493972, "epoch": 5951} {"train_loss": -27.337121963500977, "global_step": 493973, "epoch": 5951} {"train_loss": -27.219131469726562, "global_step": 493974, "epoch": 5951} {"train_loss": -27.237186431884766, "global_step": 493975, "epoch": 5951} {"train_loss": -27.673583984375, "global_step": 493976, "epoch": 5951} {"train_loss": -27.5214900970459, "global_step": 493977, "epoch": 5951} {"train_loss": -27.389892578125, "global_step": 493978, "epoch": 5951} {"train_loss": -27.325719833374023, "global_step": 493979, "epoch": 5951} {"train_loss": -27.70045280456543, "global_step": 493980, "epoch": 5951} {"train_loss": -27.399621963500977, "global_step": 493981, "epoch": 5951} {"train_loss": -27.064687728881836, "global_step": 493982, "epoch": 5951} {"train_loss": -27.065107345581055, "global_step": 493983, "epoch": 5951} {"train_loss": -27.676435470581055, "global_step": 493984, "epoch": 5951} {"train_loss": -27.5956974029541, "global_step": 493985, "epoch": 5951} {"train_loss": -27.290851593017578, "global_step": 493986, "epoch": 5951} {"train_loss": -27.142683029174805, "global_step": 493987, "epoch": 5951} {"train_loss": -27.598230361938477, "global_step": 493988, "epoch": 5951} {"train_loss": -27.395797729492188, "global_step": 493989, "epoch": 5951} {"train_loss": -27.51025390625, "global_step": 493990, "epoch": 5951} {"train_loss": -27.639328002929688, "global_step": 493991, "epoch": 5951} {"train_loss": -27.509756088256836, "global_step": 493992, "epoch": 5951} {"train_loss": -27.39912223815918, "global_step": 493993, "epoch": 5951} {"train_loss": -27.586645126342773, "global_step": 493994, "epoch": 5951} {"train_loss": -27.499792098999023, "global_step": 493995, "epoch": 5951} {"train_loss": -27.34283447265625, "global_step": 493996, "epoch": 5951} {"train_loss": -26.94600486755371, "global_step": 493997, "epoch": 5951} {"train_loss": -27.215167999267578, "global_step": 493998, "epoch": 5951} {"train_loss": -27.432947158813477, "global_step": 493999, "epoch": 5951} {"train_loss": -27.65376091003418, "global_step": 494000, "epoch": 5951} {"train_loss": -27.3564510345459, "global_step": 494001, "epoch": 5951} {"train_loss": -27.61342430114746, "global_step": 494002, "epoch": 5951} {"train_loss": -27.26533317565918, "global_step": 494003, "epoch": 5951} {"train_loss": -27.191940307617188, "global_step": 494004, "epoch": 5951} {"train_loss": -27.840503692626953, "global_step": 494005, "epoch": 5951} {"train_loss": -27.299081802368164, "global_step": 494006, "epoch": 5951} {"train_loss": -27.25054359436035, "global_step": 494007, "epoch": 5951} {"train_loss": -27.283721923828125, "global_step": 494008, "epoch": 5951} {"train_loss": -27.55048942565918, "global_step": 494009, "epoch": 5951} {"train_loss": -27.116491317749023, "global_step": 494010, "epoch": 5951} {"train_loss": -27.385635375976562, "global_step": 494011, "epoch": 5951} {"train_loss": -27.614105224609375, "global_step": 494012, "epoch": 5951} {"train_loss": -26.939428329467773, "global_step": 494013, "epoch": 5951} {"train_loss": -26.939550399780273, "global_step": 494014, "epoch": 5951} {"train_loss": -27.201844020062182, "global_step": 494015, "epoch": 5951, "val_loss": 6653033.5} {"train_loss": -26.74250602722168, "global_step": 494016, "epoch": 5952} {"train_loss": -26.536117553710938, "global_step": 494017, "epoch": 5952} {"train_loss": -25.887786865234375, "global_step": 494018, "epoch": 5952} {"train_loss": -26.50031089782715, "global_step": 494019, "epoch": 5952} {"train_loss": -26.4237117767334, "global_step": 494020, "epoch": 5952} {"train_loss": -26.6469783782959, "global_step": 494021, "epoch": 5952} {"train_loss": -26.24639892578125, "global_step": 494022, "epoch": 5952} {"train_loss": -26.950571060180664, "global_step": 494023, "epoch": 5952} {"train_loss": -26.87318229675293, "global_step": 494024, "epoch": 5952} {"train_loss": -26.9409236907959, "global_step": 494025, "epoch": 5952} {"train_loss": -27.07565689086914, "global_step": 494026, "epoch": 5952} {"train_loss": -27.201826095581055, "global_step": 494027, "epoch": 5952} {"train_loss": -26.580759048461914, "global_step": 494028, "epoch": 5952} {"train_loss": -26.86933708190918, "global_step": 494029, "epoch": 5952} {"train_loss": -27.226490020751953, "global_step": 494030, "epoch": 5952} {"train_loss": -27.010242462158203, "global_step": 494031, "epoch": 5952} {"train_loss": -27.267364501953125, "global_step": 494032, "epoch": 5952} {"train_loss": -27.079702377319336, "global_step": 494033, "epoch": 5952} {"train_loss": -27.033315658569336, "global_step": 494034, "epoch": 5952} {"train_loss": -27.25690269470215, "global_step": 494035, "epoch": 5952} {"train_loss": -27.14094352722168, "global_step": 494036, "epoch": 5952} {"train_loss": -27.493085861206055, "global_step": 494037, "epoch": 5952} {"train_loss": -27.224552154541016, "global_step": 494038, "epoch": 5952} {"train_loss": -27.29768943786621, "global_step": 494039, "epoch": 5952} {"train_loss": -27.35235595703125, "global_step": 494040, "epoch": 5952} {"train_loss": -27.574506759643555, "global_step": 494041, "epoch": 5952} {"train_loss": -27.250593185424805, "global_step": 494042, "epoch": 5952} {"train_loss": -27.143198013305664, "global_step": 494043, "epoch": 5952} {"train_loss": -27.354944229125977, "global_step": 494044, "epoch": 5952} {"train_loss": -27.4749755859375, "global_step": 494045, "epoch": 5952} {"train_loss": -27.3612060546875, "global_step": 494046, "epoch": 5952} {"train_loss": -27.5301570892334, "global_step": 494047, "epoch": 5952} {"train_loss": -27.313953399658203, "global_step": 494048, "epoch": 5952} {"train_loss": -27.43934440612793, "global_step": 494049, "epoch": 5952} {"train_loss": -27.754150390625, "global_step": 494050, "epoch": 5952} {"train_loss": -26.954938888549805, "global_step": 494051, "epoch": 5952} {"train_loss": -27.516653060913086, "global_step": 494052, "epoch": 5952} {"train_loss": -27.2783203125, "global_step": 494053, "epoch": 5952} {"train_loss": -26.98935317993164, "global_step": 494054, "epoch": 5952} {"train_loss": -26.29117202758789, "global_step": 494055, "epoch": 5952} {"train_loss": -27.1873836517334, "global_step": 494056, "epoch": 5952} {"train_loss": -27.28590202331543, "global_step": 494057, "epoch": 5952} {"train_loss": -27.53374671936035, "global_step": 494058, "epoch": 5952} {"train_loss": -27.187427520751953, "global_step": 494059, "epoch": 5952} {"train_loss": -26.9411563873291, "global_step": 494060, "epoch": 5952} {"train_loss": -26.838842391967773, "global_step": 494061, "epoch": 5952} {"train_loss": -27.402673721313477, "global_step": 494062, "epoch": 5952} {"train_loss": -26.829132080078125, "global_step": 494063, "epoch": 5952} {"train_loss": -27.23468589782715, "global_step": 494064, "epoch": 5952} {"train_loss": -27.019147872924805, "global_step": 494065, "epoch": 5952} {"train_loss": -27.145965576171875, "global_step": 494066, "epoch": 5952} {"train_loss": -27.165014266967773, "global_step": 494067, "epoch": 5952} {"train_loss": -27.76824378967285, "global_step": 494068, "epoch": 5952} {"train_loss": -27.377185821533203, "global_step": 494069, "epoch": 5952} {"train_loss": -27.462278366088867, "global_step": 494070, "epoch": 5952} {"train_loss": -27.90235710144043, "global_step": 494071, "epoch": 5952} {"train_loss": -27.43699073791504, "global_step": 494072, "epoch": 5952} {"train_loss": -27.480077743530273, "global_step": 494073, "epoch": 5952} {"train_loss": -27.575286865234375, "global_step": 494074, "epoch": 5952} {"train_loss": -27.718048095703125, "global_step": 494075, "epoch": 5952} {"train_loss": -27.411121368408203, "global_step": 494076, "epoch": 5952} {"train_loss": -27.118982315063477, "global_step": 494077, "epoch": 5952} {"train_loss": -27.315027236938477, "global_step": 494078, "epoch": 5952} {"train_loss": -27.457721710205078, "global_step": 494079, "epoch": 5952} {"train_loss": -27.473535537719727, "global_step": 494080, "epoch": 5952} {"train_loss": -27.189252853393555, "global_step": 494081, "epoch": 5952} {"train_loss": -27.546554565429688, "global_step": 494082, "epoch": 5952} {"train_loss": -26.76006507873535, "global_step": 494083, "epoch": 5952} {"train_loss": -27.361867904663086, "global_step": 494084, "epoch": 5952} {"train_loss": -26.98006248474121, "global_step": 494085, "epoch": 5952} {"train_loss": -27.067310333251953, "global_step": 494086, "epoch": 5952} {"train_loss": -27.185483932495117, "global_step": 494087, "epoch": 5952} {"train_loss": -27.387317657470703, "global_step": 494088, "epoch": 5952} {"train_loss": -27.06397819519043, "global_step": 494089, "epoch": 5952} {"train_loss": -27.29767417907715, "global_step": 494090, "epoch": 5952} {"train_loss": -26.97075843811035, "global_step": 494091, "epoch": 5952} {"train_loss": -27.23362159729004, "global_step": 494092, "epoch": 5952} {"train_loss": -27.3133544921875, "global_step": 494093, "epoch": 5952} {"train_loss": -27.315526962280273, "global_step": 494094, "epoch": 5952} {"train_loss": -27.404333114624023, "global_step": 494095, "epoch": 5952} {"train_loss": -27.45306396484375, "global_step": 494096, "epoch": 5952} {"train_loss": -27.527191162109375, "global_step": 494097, "epoch": 5952} {"train_loss": -27.184958722217974, "global_step": 494098, "epoch": 5952, "val_loss": 6639563.0} {"train_loss": -27.48658561706543, "global_step": 494099, "epoch": 5953} {"train_loss": -26.932825088500977, "global_step": 494100, "epoch": 5953} {"train_loss": -26.53262710571289, "global_step": 494101, "epoch": 5953} {"train_loss": -27.03093910217285, "global_step": 494102, "epoch": 5953} {"train_loss": -26.684553146362305, "global_step": 494103, "epoch": 5953} {"train_loss": -27.05377769470215, "global_step": 494104, "epoch": 5953} {"train_loss": -27.095251083374023, "global_step": 494105, "epoch": 5953} {"train_loss": -27.426050186157227, "global_step": 494106, "epoch": 5953} {"train_loss": -27.300128936767578, "global_step": 494107, "epoch": 5953} {"train_loss": -27.05278968811035, "global_step": 494108, "epoch": 5953} {"train_loss": -27.084720611572266, "global_step": 494109, "epoch": 5953} {"train_loss": -27.276660919189453, "global_step": 494110, "epoch": 5953} {"train_loss": -27.372150421142578, "global_step": 494111, "epoch": 5953} {"train_loss": -27.1378173828125, "global_step": 494112, "epoch": 5953} {"train_loss": -27.782800674438477, "global_step": 494113, "epoch": 5953} {"train_loss": -27.39362907409668, "global_step": 494114, "epoch": 5953} {"train_loss": -26.406896591186523, "global_step": 494115, "epoch": 5953} {"train_loss": -26.84512710571289, "global_step": 494116, "epoch": 5953} {"train_loss": -27.092721939086914, "global_step": 494117, "epoch": 5953} {"train_loss": -27.279407501220703, "global_step": 494118, "epoch": 5953} {"train_loss": -27.513019561767578, "global_step": 494119, "epoch": 5953} {"train_loss": -27.170074462890625, "global_step": 494120, "epoch": 5953} {"train_loss": -27.26679039001465, "global_step": 494121, "epoch": 5953} {"train_loss": -26.85727882385254, "global_step": 494122, "epoch": 5953} {"train_loss": -27.318836212158203, "global_step": 494123, "epoch": 5953} {"train_loss": -27.326812744140625, "global_step": 494124, "epoch": 5953} {"train_loss": -27.5738468170166, "global_step": 494125, "epoch": 5953} {"train_loss": -27.45393180847168, "global_step": 494126, "epoch": 5953} {"train_loss": -27.236310958862305, "global_step": 494127, "epoch": 5953} {"train_loss": -27.197589874267578, "global_step": 494128, "epoch": 5953} {"train_loss": -27.34469985961914, "global_step": 494129, "epoch": 5953} {"train_loss": -27.402517318725586, "global_step": 494130, "epoch": 5953} {"train_loss": -27.376068115234375, "global_step": 494131, "epoch": 5953} {"train_loss": -27.444644927978516, "global_step": 494132, "epoch": 5953} {"train_loss": -27.38465690612793, "global_step": 494133, "epoch": 5953} {"train_loss": -27.226057052612305, "global_step": 494134, "epoch": 5953} {"train_loss": -27.32452392578125, "global_step": 494135, "epoch": 5953} {"train_loss": -27.193572998046875, "global_step": 494136, "epoch": 5953} {"train_loss": -27.506967544555664, "global_step": 494137, "epoch": 5953} {"train_loss": -27.52337074279785, "global_step": 494138, "epoch": 5953} {"train_loss": -27.456327438354492, "global_step": 494139, "epoch": 5953} {"train_loss": -27.513751983642578, "global_step": 494140, "epoch": 5953} {"train_loss": -27.734716415405273, "global_step": 494141, "epoch": 5953} {"train_loss": -27.377124786376953, "global_step": 494142, "epoch": 5953} {"train_loss": -27.26473045349121, "global_step": 494143, "epoch": 5953} {"train_loss": -27.34397315979004, "global_step": 494144, "epoch": 5953} {"train_loss": -27.024560928344727, "global_step": 494145, "epoch": 5953} {"train_loss": -27.402875900268555, "global_step": 494146, "epoch": 5953} {"train_loss": -27.664037704467773, "global_step": 494147, "epoch": 5953} {"train_loss": -27.24078369140625, "global_step": 494148, "epoch": 5953} {"train_loss": -27.57863426208496, "global_step": 494149, "epoch": 5953} {"train_loss": -27.56304931640625, "global_step": 494150, "epoch": 5953} {"train_loss": -27.699417114257812, "global_step": 494151, "epoch": 5953} {"train_loss": -27.4095516204834, "global_step": 494152, "epoch": 5953} {"train_loss": -27.715402603149414, "global_step": 494153, "epoch": 5953} {"train_loss": -27.96327018737793, "global_step": 494154, "epoch": 5953} {"train_loss": -27.660608291625977, "global_step": 494155, "epoch": 5953} {"train_loss": -27.206146240234375, "global_step": 494156, "epoch": 5953} {"train_loss": -27.52919578552246, "global_step": 494157, "epoch": 5953} {"train_loss": -27.3415470123291, "global_step": 494158, "epoch": 5953} {"train_loss": -27.415903091430664, "global_step": 494159, "epoch": 5953} {"train_loss": -27.557783126831055, "global_step": 494160, "epoch": 5953} {"train_loss": -27.43180274963379, "global_step": 494161, "epoch": 5953} {"train_loss": -27.391271591186523, "global_step": 494162, "epoch": 5953} {"train_loss": -27.373449325561523, "global_step": 494163, "epoch": 5953} {"train_loss": -27.544157028198242, "global_step": 494164, "epoch": 5953} {"train_loss": -27.36639976501465, "global_step": 494165, "epoch": 5953} {"train_loss": -26.964126586914062, "global_step": 494166, "epoch": 5953} {"train_loss": -27.042951583862305, "global_step": 494167, "epoch": 5953} {"train_loss": -27.133609771728516, "global_step": 494168, "epoch": 5953} {"train_loss": -26.822162628173828, "global_step": 494169, "epoch": 5953} {"train_loss": -26.70924186706543, "global_step": 494170, "epoch": 5953} {"train_loss": -26.609472274780273, "global_step": 494171, "epoch": 5953} {"train_loss": -27.191755294799805, "global_step": 494172, "epoch": 5953} {"train_loss": -27.25244140625, "global_step": 494173, "epoch": 5953} {"train_loss": -27.23468589782715, "global_step": 494174, "epoch": 5953} {"train_loss": -26.963180541992188, "global_step": 494175, "epoch": 5953} {"train_loss": -26.892133712768555, "global_step": 494176, "epoch": 5953} {"train_loss": -26.74256706237793, "global_step": 494177, "epoch": 5953} {"train_loss": -26.768268585205078, "global_step": 494178, "epoch": 5953} {"train_loss": -27.587692260742188, "global_step": 494179, "epoch": 5953} {"train_loss": -27.0538387298584, "global_step": 494180, "epoch": 5953} {"train_loss": -27.245146257331573, "global_step": 494181, "epoch": 5953, "val_loss": 6638908.0} {"train_loss": -25.70203971862793, "global_step": 494182, "epoch": 5954} {"train_loss": -25.202383041381836, "global_step": 494183, "epoch": 5954} {"train_loss": -26.58038902282715, "global_step": 494184, "epoch": 5954} {"train_loss": -26.081724166870117, "global_step": 494185, "epoch": 5954} {"train_loss": -26.48782730102539, "global_step": 494186, "epoch": 5954} {"train_loss": -26.815673828125, "global_step": 494187, "epoch": 5954} {"train_loss": -26.30673599243164, "global_step": 494188, "epoch": 5954} {"train_loss": -26.43967056274414, "global_step": 494189, "epoch": 5954} {"train_loss": -26.79229164123535, "global_step": 494190, "epoch": 5954} {"train_loss": -26.602060317993164, "global_step": 494191, "epoch": 5954} {"train_loss": -26.957172393798828, "global_step": 494192, "epoch": 5954} {"train_loss": -26.69428062438965, "global_step": 494193, "epoch": 5954} {"train_loss": -26.51056480407715, "global_step": 494194, "epoch": 5954} {"train_loss": -26.948348999023438, "global_step": 494195, "epoch": 5954} {"train_loss": -26.70184898376465, "global_step": 494196, "epoch": 5954} {"train_loss": -26.80063819885254, "global_step": 494197, "epoch": 5954} {"train_loss": -26.812744140625, "global_step": 494198, "epoch": 5954} {"train_loss": -26.604602813720703, "global_step": 494199, "epoch": 5954} {"train_loss": -26.804738998413086, "global_step": 494200, "epoch": 5954} {"train_loss": -27.582935333251953, "global_step": 494201, "epoch": 5954} {"train_loss": -27.301847457885742, "global_step": 494202, "epoch": 5954} {"train_loss": -27.120880126953125, "global_step": 494203, "epoch": 5954} {"train_loss": -26.934228897094727, "global_step": 494204, "epoch": 5954} {"train_loss": -26.935205459594727, "global_step": 494205, "epoch": 5954} {"train_loss": -26.9960994720459, "global_step": 494206, "epoch": 5954} {"train_loss": -26.991125106811523, "global_step": 494207, "epoch": 5954} {"train_loss": -26.994281768798828, "global_step": 494208, "epoch": 5954} {"train_loss": -27.418874740600586, "global_step": 494209, "epoch": 5954} {"train_loss": -27.274307250976562, "global_step": 494210, "epoch": 5954} {"train_loss": -27.256738662719727, "global_step": 494211, "epoch": 5954} {"train_loss": -27.37849998474121, "global_step": 494212, "epoch": 5954} {"train_loss": -27.43073844909668, "global_step": 494213, "epoch": 5954} {"train_loss": -27.338958740234375, "global_step": 494214, "epoch": 5954} {"train_loss": -27.7401180267334, "global_step": 494215, "epoch": 5954} {"train_loss": -27.368200302124023, "global_step": 494216, "epoch": 5954} {"train_loss": -27.2083683013916, "global_step": 494217, "epoch": 5954} {"train_loss": -27.193281173706055, "global_step": 494218, "epoch": 5954} {"train_loss": -27.517499923706055, "global_step": 494219, "epoch": 5954} {"train_loss": -27.1320858001709, "global_step": 494220, "epoch": 5954} {"train_loss": -27.249479293823242, "global_step": 494221, "epoch": 5954} {"train_loss": -27.534753799438477, "global_step": 494222, "epoch": 5954} {"train_loss": -27.239362716674805, "global_step": 494223, "epoch": 5954} {"train_loss": -27.546497344970703, "global_step": 494224, "epoch": 5954} {"train_loss": -27.44233512878418, "global_step": 494225, "epoch": 5954} {"train_loss": -27.257247924804688, "global_step": 494226, "epoch": 5954} {"train_loss": -27.058713912963867, "global_step": 494227, "epoch": 5954} {"train_loss": -27.567218780517578, "global_step": 494228, "epoch": 5954} {"train_loss": -27.669513702392578, "global_step": 494229, "epoch": 5954} {"train_loss": -27.696237564086914, "global_step": 494230, "epoch": 5954} {"train_loss": -27.659748077392578, "global_step": 494231, "epoch": 5954} {"train_loss": -27.360614776611328, "global_step": 494232, "epoch": 5954} {"train_loss": -27.65854835510254, "global_step": 494233, "epoch": 5954} {"train_loss": -27.30885124206543, "global_step": 494234, "epoch": 5954} {"train_loss": -27.4530029296875, "global_step": 494235, "epoch": 5954} {"train_loss": -27.440753936767578, "global_step": 494236, "epoch": 5954} {"train_loss": -27.496313095092773, "global_step": 494237, "epoch": 5954} {"train_loss": -27.23206901550293, "global_step": 494238, "epoch": 5954} {"train_loss": -27.435338973999023, "global_step": 494239, "epoch": 5954} {"train_loss": -27.6007137298584, "global_step": 494240, "epoch": 5954} {"train_loss": -27.320600509643555, "global_step": 494241, "epoch": 5954} {"train_loss": -27.205615997314453, "global_step": 494242, "epoch": 5954} {"train_loss": -27.10420036315918, "global_step": 494243, "epoch": 5954} {"train_loss": -27.26410484313965, "global_step": 494244, "epoch": 5954} {"train_loss": -27.310895919799805, "global_step": 494245, "epoch": 5954} {"train_loss": -27.2589111328125, "global_step": 494246, "epoch": 5954} {"train_loss": -27.314361572265625, "global_step": 494247, "epoch": 5954} {"train_loss": -27.17255210876465, "global_step": 494248, "epoch": 5954} {"train_loss": -27.462488174438477, "global_step": 494249, "epoch": 5954} {"train_loss": -27.127960205078125, "global_step": 494250, "epoch": 5954} {"train_loss": -27.663496017456055, "global_step": 494251, "epoch": 5954} {"train_loss": -26.982091903686523, "global_step": 494252, "epoch": 5954} {"train_loss": -27.627033233642578, "global_step": 494253, "epoch": 5954} {"train_loss": -27.354267120361328, "global_step": 494254, "epoch": 5954} {"train_loss": -27.54005241394043, "global_step": 494255, "epoch": 5954} {"train_loss": -27.573999404907227, "global_step": 494256, "epoch": 5954} {"train_loss": -27.2747745513916, "global_step": 494257, "epoch": 5954} {"train_loss": -27.938058853149414, "global_step": 494258, "epoch": 5954} {"train_loss": -27.725082397460938, "global_step": 494259, "epoch": 5954} {"train_loss": -27.483692169189453, "global_step": 494260, "epoch": 5954} {"train_loss": -27.39832878112793, "global_step": 494261, "epoch": 5954} {"train_loss": -27.388538360595703, "global_step": 494262, "epoch": 5954} {"train_loss": -27.508832931518555, "global_step": 494263, "epoch": 5954} {"train_loss": -27.176517348691643, "global_step": 494264, "epoch": 5954, "val_loss": 6675435.0} {"train_loss": -27.492691040039062, "global_step": 494265, "epoch": 5955} {"train_loss": -27.395238876342773, "global_step": 494266, "epoch": 5955} {"train_loss": -26.938623428344727, "global_step": 494267, "epoch": 5955} {"train_loss": -27.27997398376465, "global_step": 494268, "epoch": 5955} {"train_loss": -26.725549697875977, "global_step": 494269, "epoch": 5955} {"train_loss": -26.7030086517334, "global_step": 494270, "epoch": 5955} {"train_loss": -26.749267578125, "global_step": 494271, "epoch": 5955} {"train_loss": -27.604108810424805, "global_step": 494272, "epoch": 5955} {"train_loss": -27.314695358276367, "global_step": 494273, "epoch": 5955} {"train_loss": -27.30658531188965, "global_step": 494274, "epoch": 5955} {"train_loss": -26.6727237701416, "global_step": 494275, "epoch": 5955} {"train_loss": -27.233753204345703, "global_step": 494276, "epoch": 5955} {"train_loss": -27.28474235534668, "global_step": 494277, "epoch": 5955} {"train_loss": -27.432632446289062, "global_step": 494278, "epoch": 5955} {"train_loss": -27.108692169189453, "global_step": 494279, "epoch": 5955} {"train_loss": -26.677900314331055, "global_step": 494280, "epoch": 5955} {"train_loss": -27.255084991455078, "global_step": 494281, "epoch": 5955} {"train_loss": -26.901050567626953, "global_step": 494282, "epoch": 5955} {"train_loss": -27.35029411315918, "global_step": 494283, "epoch": 5955} {"train_loss": -27.2300968170166, "global_step": 494284, "epoch": 5955} {"train_loss": -27.5159969329834, "global_step": 494285, "epoch": 5955} {"train_loss": -27.228687286376953, "global_step": 494286, "epoch": 5955} {"train_loss": -27.076587677001953, "global_step": 494287, "epoch": 5955} {"train_loss": -27.414966583251953, "global_step": 494288, "epoch": 5955} {"train_loss": -27.46036148071289, "global_step": 494289, "epoch": 5955} {"train_loss": -27.354572296142578, "global_step": 494290, "epoch": 5955} {"train_loss": -27.670568466186523, "global_step": 494291, "epoch": 5955} {"train_loss": -27.1297550201416, "global_step": 494292, "epoch": 5955} {"train_loss": -27.573896408081055, "global_step": 494293, "epoch": 5955} {"train_loss": -27.368234634399414, "global_step": 494294, "epoch": 5955} {"train_loss": -27.54322624206543, "global_step": 494295, "epoch": 5955} {"train_loss": -27.225439071655273, "global_step": 494296, "epoch": 5955} {"train_loss": -27.635583877563477, "global_step": 494297, "epoch": 5955} {"train_loss": -27.503225326538086, "global_step": 494298, "epoch": 5955} {"train_loss": -27.34708023071289, "global_step": 494299, "epoch": 5955} {"train_loss": -27.479562759399414, "global_step": 494300, "epoch": 5955} {"train_loss": -27.132492065429688, "global_step": 494301, "epoch": 5955} {"train_loss": -27.20026969909668, "global_step": 494302, "epoch": 5955} {"train_loss": -27.81715202331543, "global_step": 494303, "epoch": 5955} {"train_loss": -27.610919952392578, "global_step": 494304, "epoch": 5955} {"train_loss": -27.55021095275879, "global_step": 494305, "epoch": 5955} {"train_loss": -27.568653106689453, "global_step": 494306, "epoch": 5955} {"train_loss": -27.1315860748291, "global_step": 494307, "epoch": 5955} {"train_loss": -27.080646514892578, "global_step": 494308, "epoch": 5955} {"train_loss": -27.86981773376465, "global_step": 494309, "epoch": 5955} {"train_loss": -27.496801376342773, "global_step": 494310, "epoch": 5955} {"train_loss": -27.56570816040039, "global_step": 494311, "epoch": 5955} {"train_loss": -27.52496337890625, "global_step": 494312, "epoch": 5955} {"train_loss": -27.1770076751709, "global_step": 494313, "epoch": 5955} {"train_loss": -27.276166915893555, "global_step": 494314, "epoch": 5955} {"train_loss": -27.530410766601562, "global_step": 494315, "epoch": 5955} {"train_loss": -27.495498657226562, "global_step": 494316, "epoch": 5955} {"train_loss": -27.287134170532227, "global_step": 494317, "epoch": 5955} {"train_loss": -27.73441505432129, "global_step": 494318, "epoch": 5955} {"train_loss": -27.60383415222168, "global_step": 494319, "epoch": 5955} {"train_loss": -27.33900260925293, "global_step": 494320, "epoch": 5955} {"train_loss": -27.505475997924805, "global_step": 494321, "epoch": 5955} {"train_loss": -27.453977584838867, "global_step": 494322, "epoch": 5955} {"train_loss": -27.45102882385254, "global_step": 494323, "epoch": 5955} {"train_loss": -27.81361961364746, "global_step": 494324, "epoch": 5955} {"train_loss": -27.189462661743164, "global_step": 494325, "epoch": 5955} {"train_loss": -27.39936637878418, "global_step": 494326, "epoch": 5955} {"train_loss": -27.273080825805664, "global_step": 494327, "epoch": 5955} {"train_loss": -27.373682022094727, "global_step": 494328, "epoch": 5955} {"train_loss": -27.468618392944336, "global_step": 494329, "epoch": 5955} {"train_loss": -27.8195743560791, "global_step": 494330, "epoch": 5955} {"train_loss": -27.682065963745117, "global_step": 494331, "epoch": 5955} {"train_loss": -27.454076766967773, "global_step": 494332, "epoch": 5955} {"train_loss": -27.332006454467773, "global_step": 494333, "epoch": 5955} {"train_loss": -27.704181671142578, "global_step": 494334, "epoch": 5955} {"train_loss": -27.347970962524414, "global_step": 494335, "epoch": 5955} {"train_loss": -27.399641036987305, "global_step": 494336, "epoch": 5955} {"train_loss": -27.61439323425293, "global_step": 494337, "epoch": 5955} {"train_loss": -27.579572677612305, "global_step": 494338, "epoch": 5955} {"train_loss": -27.808958053588867, "global_step": 494339, "epoch": 5955} {"train_loss": -27.511890411376953, "global_step": 494340, "epoch": 5955} {"train_loss": -27.26209831237793, "global_step": 494341, "epoch": 5955} {"train_loss": -27.095062255859375, "global_step": 494342, "epoch": 5955} {"train_loss": -27.282455444335938, "global_step": 494343, "epoch": 5955} {"train_loss": -26.93692398071289, "global_step": 494344, "epoch": 5955} {"train_loss": -27.4289608001709, "global_step": 494345, "epoch": 5955} {"train_loss": -27.3082275390625, "global_step": 494346, "epoch": 5955} {"train_loss": -27.36216692177646, "global_step": 494347, "epoch": 5955, "val_loss": 6840735.0} {"train_loss": -24.095794677734375, "global_step": 494348, "epoch": 5956} {"train_loss": -23.622678756713867, "global_step": 494349, "epoch": 5956} {"train_loss": -24.899837493896484, "global_step": 494350, "epoch": 5956} {"train_loss": -25.28804588317871, "global_step": 494351, "epoch": 5956} {"train_loss": -25.292070388793945, "global_step": 494352, "epoch": 5956} {"train_loss": -25.96567726135254, "global_step": 494353, "epoch": 5956} {"train_loss": -26.25872802734375, "global_step": 494354, "epoch": 5956} {"train_loss": -25.839385986328125, "global_step": 494355, "epoch": 5956} {"train_loss": -26.11012077331543, "global_step": 494356, "epoch": 5956} {"train_loss": -25.92828369140625, "global_step": 494357, "epoch": 5956} {"train_loss": -25.854612350463867, "global_step": 494358, "epoch": 5956} {"train_loss": -26.944162368774414, "global_step": 494359, "epoch": 5956} {"train_loss": -25.895526885986328, "global_step": 494360, "epoch": 5956} {"train_loss": -26.4570255279541, "global_step": 494361, "epoch": 5956} {"train_loss": -26.549707412719727, "global_step": 494362, "epoch": 5956} {"train_loss": -26.08699607849121, "global_step": 494363, "epoch": 5956} {"train_loss": -26.1224365234375, "global_step": 494364, "epoch": 5956} {"train_loss": -26.123746871948242, "global_step": 494365, "epoch": 5956} {"train_loss": -26.49041748046875, "global_step": 494366, "epoch": 5956} {"train_loss": -26.07940101623535, "global_step": 494367, "epoch": 5956} {"train_loss": -26.704181671142578, "global_step": 494368, "epoch": 5956} {"train_loss": -26.484668731689453, "global_step": 494369, "epoch": 5956} {"train_loss": -26.460142135620117, "global_step": 494370, "epoch": 5956} {"train_loss": -26.773183822631836, "global_step": 494371, "epoch": 5956} {"train_loss": -26.694120407104492, "global_step": 494372, "epoch": 5956} {"train_loss": -26.697498321533203, "global_step": 494373, "epoch": 5956} {"train_loss": -26.626617431640625, "global_step": 494374, "epoch": 5956} {"train_loss": -26.37624168395996, "global_step": 494375, "epoch": 5956} {"train_loss": -27.007904052734375, "global_step": 494376, "epoch": 5956} {"train_loss": -26.747400283813477, "global_step": 494377, "epoch": 5956} {"train_loss": -26.74420738220215, "global_step": 494378, "epoch": 5956} {"train_loss": -27.0709171295166, "global_step": 494379, "epoch": 5956} {"train_loss": -26.75333595275879, "global_step": 494380, "epoch": 5956} {"train_loss": -27.15436363220215, "global_step": 494381, "epoch": 5956} {"train_loss": -26.7314395904541, "global_step": 494382, "epoch": 5956} {"train_loss": -27.345325469970703, "global_step": 494383, "epoch": 5956} {"train_loss": -26.723453521728516, "global_step": 494384, "epoch": 5956} {"train_loss": -27.026874542236328, "global_step": 494385, "epoch": 5956} {"train_loss": -26.997791290283203, "global_step": 494386, "epoch": 5956} {"train_loss": -26.883270263671875, "global_step": 494387, "epoch": 5956} {"train_loss": -27.145788192749023, "global_step": 494388, "epoch": 5956} {"train_loss": -27.285669326782227, "global_step": 494389, "epoch": 5956} {"train_loss": -27.451513290405273, "global_step": 494390, "epoch": 5956} {"train_loss": -27.108579635620117, "global_step": 494391, "epoch": 5956} {"train_loss": -27.02857780456543, "global_step": 494392, "epoch": 5956} {"train_loss": -27.182722091674805, "global_step": 494393, "epoch": 5956} {"train_loss": -27.13382911682129, "global_step": 494394, "epoch": 5956} {"train_loss": -27.445241928100586, "global_step": 494395, "epoch": 5956} {"train_loss": -27.347394943237305, "global_step": 494396, "epoch": 5956} {"train_loss": -27.476886749267578, "global_step": 494397, "epoch": 5956} {"train_loss": -27.272491455078125, "global_step": 494398, "epoch": 5956} {"train_loss": -27.61049461364746, "global_step": 494399, "epoch": 5956} {"train_loss": -27.3414363861084, "global_step": 494400, "epoch": 5956} {"train_loss": -27.129316329956055, "global_step": 494401, "epoch": 5956} {"train_loss": -27.187347412109375, "global_step": 494402, "epoch": 5956} {"train_loss": -27.330463409423828, "global_step": 494403, "epoch": 5956} {"train_loss": -27.47433853149414, "global_step": 494404, "epoch": 5956} {"train_loss": -27.408477783203125, "global_step": 494405, "epoch": 5956} {"train_loss": -27.26007080078125, "global_step": 494406, "epoch": 5956} {"train_loss": -27.2323055267334, "global_step": 494407, "epoch": 5956} {"train_loss": -27.247922897338867, "global_step": 494408, "epoch": 5956} {"train_loss": -27.55141258239746, "global_step": 494409, "epoch": 5956} {"train_loss": -27.178632736206055, "global_step": 494410, "epoch": 5956} {"train_loss": -27.472579956054688, "global_step": 494411, "epoch": 5956} {"train_loss": -27.86209487915039, "global_step": 494412, "epoch": 5956} {"train_loss": -27.439422607421875, "global_step": 494413, "epoch": 5956} {"train_loss": -27.004968643188477, "global_step": 494414, "epoch": 5956} {"train_loss": -27.34909439086914, "global_step": 494415, "epoch": 5956} {"train_loss": -27.38271141052246, "global_step": 494416, "epoch": 5956} {"train_loss": -27.356586456298828, "global_step": 494417, "epoch": 5956} {"train_loss": -27.48577880859375, "global_step": 494418, "epoch": 5956} {"train_loss": -27.426090240478516, "global_step": 494419, "epoch": 5956} {"train_loss": -27.541671752929688, "global_step": 494420, "epoch": 5956} {"train_loss": -27.496091842651367, "global_step": 494421, "epoch": 5956} {"train_loss": -27.736703872680664, "global_step": 494422, "epoch": 5956} {"train_loss": -27.694669723510742, "global_step": 494423, "epoch": 5956} {"train_loss": -27.594635009765625, "global_step": 494424, "epoch": 5956} {"train_loss": -27.760141372680664, "global_step": 494425, "epoch": 5956} {"train_loss": -27.62117576599121, "global_step": 494426, "epoch": 5956} {"train_loss": -27.648733139038086, "global_step": 494427, "epoch": 5956} {"train_loss": -27.615371704101562, "global_step": 494428, "epoch": 5956} {"train_loss": -27.495624542236328, "global_step": 494429, "epoch": 5956} {"train_loss": -26.859227008130176, "global_step": 494430, "epoch": 5956, "val_loss": 6504965.0} {"train_loss": -24.957359313964844, "global_step": 494431, "epoch": 5957} {"train_loss": -23.21272087097168, "global_step": 494432, "epoch": 5957} {"train_loss": -24.051294326782227, "global_step": 494433, "epoch": 5957} {"train_loss": -25.53230857849121, "global_step": 494434, "epoch": 5957} {"train_loss": -25.570173263549805, "global_step": 494435, "epoch": 5957} {"train_loss": -25.7504825592041, "global_step": 494436, "epoch": 5957} {"train_loss": -25.283018112182617, "global_step": 494437, "epoch": 5957} {"train_loss": -26.35639762878418, "global_step": 494438, "epoch": 5957} {"train_loss": -26.320276260375977, "global_step": 494439, "epoch": 5957} {"train_loss": -25.854267120361328, "global_step": 494440, "epoch": 5957} {"train_loss": -26.55116844177246, "global_step": 494441, "epoch": 5957} {"train_loss": -26.646575927734375, "global_step": 494442, "epoch": 5957} {"train_loss": -26.736494064331055, "global_step": 494443, "epoch": 5957} {"train_loss": -26.544111251831055, "global_step": 494444, "epoch": 5957} {"train_loss": -26.391651153564453, "global_step": 494445, "epoch": 5957} {"train_loss": -26.98371696472168, "global_step": 494446, "epoch": 5957} {"train_loss": -26.706892013549805, "global_step": 494447, "epoch": 5957} {"train_loss": -26.479572296142578, "global_step": 494448, "epoch": 5957} {"train_loss": -26.705081939697266, "global_step": 494449, "epoch": 5957} {"train_loss": -26.633100509643555, "global_step": 494450, "epoch": 5957} {"train_loss": -26.718902587890625, "global_step": 494451, "epoch": 5957} {"train_loss": -26.629730224609375, "global_step": 494452, "epoch": 5957} {"train_loss": -26.962696075439453, "global_step": 494453, "epoch": 5957} {"train_loss": -26.72471046447754, "global_step": 494454, "epoch": 5957} {"train_loss": -26.654499053955078, "global_step": 494455, "epoch": 5957} {"train_loss": -26.913959503173828, "global_step": 494456, "epoch": 5957} {"train_loss": -26.945098876953125, "global_step": 494457, "epoch": 5957} {"train_loss": -27.210418701171875, "global_step": 494458, "epoch": 5957} {"train_loss": -27.065521240234375, "global_step": 494459, "epoch": 5957} {"train_loss": -27.066761016845703, "global_step": 494460, "epoch": 5957} {"train_loss": -27.014245986938477, "global_step": 494461, "epoch": 5957} {"train_loss": -27.02967643737793, "global_step": 494462, "epoch": 5957} {"train_loss": -26.980697631835938, "global_step": 494463, "epoch": 5957} {"train_loss": -27.247222900390625, "global_step": 494464, "epoch": 5957} {"train_loss": -26.946369171142578, "global_step": 494465, "epoch": 5957} {"train_loss": -27.207691192626953, "global_step": 494466, "epoch": 5957} {"train_loss": -27.140310287475586, "global_step": 494467, "epoch": 5957} {"train_loss": -27.28226661682129, "global_step": 494468, "epoch": 5957} {"train_loss": -27.2717227935791, "global_step": 494469, "epoch": 5957} {"train_loss": -27.312646865844727, "global_step": 494470, "epoch": 5957} {"train_loss": -27.070470809936523, "global_step": 494471, "epoch": 5957} {"train_loss": -27.410846710205078, "global_step": 494472, "epoch": 5957} {"train_loss": -27.413726806640625, "global_step": 494473, "epoch": 5957} {"train_loss": -27.36890983581543, "global_step": 494474, "epoch": 5957} {"train_loss": -27.215198516845703, "global_step": 494475, "epoch": 5957} {"train_loss": -27.445865631103516, "global_step": 494476, "epoch": 5957} {"train_loss": -27.2373046875, "global_step": 494477, "epoch": 5957} {"train_loss": -27.53667640686035, "global_step": 494478, "epoch": 5957} {"train_loss": -27.415908813476562, "global_step": 494479, "epoch": 5957} {"train_loss": -27.599401473999023, "global_step": 494480, "epoch": 5957} {"train_loss": -27.737049102783203, "global_step": 494481, "epoch": 5957} {"train_loss": -27.504796981811523, "global_step": 494482, "epoch": 5957} {"train_loss": -27.785146713256836, "global_step": 494483, "epoch": 5957} {"train_loss": -27.56924819946289, "global_step": 494484, "epoch": 5957} {"train_loss": -27.65557289123535, "global_step": 494485, "epoch": 5957} {"train_loss": -27.728635787963867, "global_step": 494486, "epoch": 5957} {"train_loss": -27.463109970092773, "global_step": 494487, "epoch": 5957} {"train_loss": -27.538232803344727, "global_step": 494488, "epoch": 5957} {"train_loss": -27.740650177001953, "global_step": 494489, "epoch": 5957} {"train_loss": -27.96759605407715, "global_step": 494490, "epoch": 5957} {"train_loss": -27.519582748413086, "global_step": 494491, "epoch": 5957} {"train_loss": -27.506513595581055, "global_step": 494492, "epoch": 5957} {"train_loss": -27.4813175201416, "global_step": 494493, "epoch": 5957} {"train_loss": -27.891162872314453, "global_step": 494494, "epoch": 5957} {"train_loss": -27.43654441833496, "global_step": 494495, "epoch": 5957} {"train_loss": -27.652639389038086, "global_step": 494496, "epoch": 5957} {"train_loss": -27.302764892578125, "global_step": 494497, "epoch": 5957} {"train_loss": -27.080488204956055, "global_step": 494498, "epoch": 5957} {"train_loss": -27.218347549438477, "global_step": 494499, "epoch": 5957} {"train_loss": -27.562719345092773, "global_step": 494500, "epoch": 5957} {"train_loss": -26.93070411682129, "global_step": 494501, "epoch": 5957} {"train_loss": -26.977140426635742, "global_step": 494502, "epoch": 5957} {"train_loss": -27.124164581298828, "global_step": 494503, "epoch": 5957} {"train_loss": -26.9017333984375, "global_step": 494504, "epoch": 5957} {"train_loss": -27.508405685424805, "global_step": 494505, "epoch": 5957} {"train_loss": -27.367938995361328, "global_step": 494506, "epoch": 5957} {"train_loss": -26.91877555847168, "global_step": 494507, "epoch": 5957} {"train_loss": -27.338027954101562, "global_step": 494508, "epoch": 5957} {"train_loss": -27.301969528198242, "global_step": 494509, "epoch": 5957} {"train_loss": -27.259979248046875, "global_step": 494510, "epoch": 5957} {"train_loss": -26.81797218322754, "global_step": 494511, "epoch": 5957} {"train_loss": -27.336181640625, "global_step": 494512, "epoch": 5957} {"train_loss": -26.975675077323455, "global_step": 494513, "epoch": 5957, "val_loss": 6475790.0} {"train_loss": -26.689172744750977, "global_step": 494514, "epoch": 5958} {"train_loss": -26.71405029296875, "global_step": 494515, "epoch": 5958} {"train_loss": -26.56217384338379, "global_step": 494516, "epoch": 5958} {"train_loss": -26.76227378845215, "global_step": 494517, "epoch": 5958} {"train_loss": -26.780424118041992, "global_step": 494518, "epoch": 5958} {"train_loss": -27.141454696655273, "global_step": 494519, "epoch": 5958} {"train_loss": -26.664270401000977, "global_step": 494520, "epoch": 5958} {"train_loss": -27.3429012298584, "global_step": 494521, "epoch": 5958} {"train_loss": -27.08595085144043, "global_step": 494522, "epoch": 5958} {"train_loss": -26.448383331298828, "global_step": 494523, "epoch": 5958} {"train_loss": -26.982019424438477, "global_step": 494524, "epoch": 5958} {"train_loss": -26.98969841003418, "global_step": 494525, "epoch": 5958} {"train_loss": -27.38416862487793, "global_step": 494526, "epoch": 5958} {"train_loss": -27.489038467407227, "global_step": 494527, "epoch": 5958} {"train_loss": -27.199872970581055, "global_step": 494528, "epoch": 5958} {"train_loss": -27.311853408813477, "global_step": 494529, "epoch": 5958} {"train_loss": -27.29631996154785, "global_step": 494530, "epoch": 5958} {"train_loss": -27.06609535217285, "global_step": 494531, "epoch": 5958} {"train_loss": -27.162992477416992, "global_step": 494532, "epoch": 5958} {"train_loss": -27.012537002563477, "global_step": 494533, "epoch": 5958} {"train_loss": -27.296506881713867, "global_step": 494534, "epoch": 5958} {"train_loss": -27.38898277282715, "global_step": 494535, "epoch": 5958} {"train_loss": -27.151376724243164, "global_step": 494536, "epoch": 5958} {"train_loss": -27.563886642456055, "global_step": 494537, "epoch": 5958} {"train_loss": -27.50105094909668, "global_step": 494538, "epoch": 5958} {"train_loss": -27.245691299438477, "global_step": 494539, "epoch": 5958} {"train_loss": -27.42966651916504, "global_step": 494540, "epoch": 5958} {"train_loss": -27.162677764892578, "global_step": 494541, "epoch": 5958} {"train_loss": -27.479581832885742, "global_step": 494542, "epoch": 5958} {"train_loss": -27.551115036010742, "global_step": 494543, "epoch": 5958} {"train_loss": -27.171985626220703, "global_step": 494544, "epoch": 5958} {"train_loss": -27.249670028686523, "global_step": 494545, "epoch": 5958} {"train_loss": -27.413480758666992, "global_step": 494546, "epoch": 5958} {"train_loss": -27.45045280456543, "global_step": 494547, "epoch": 5958} {"train_loss": -27.540884017944336, "global_step": 494548, "epoch": 5958} {"train_loss": -27.30694007873535, "global_step": 494549, "epoch": 5958} {"train_loss": -27.5299015045166, "global_step": 494550, "epoch": 5958} {"train_loss": -27.343338012695312, "global_step": 494551, "epoch": 5958} {"train_loss": -27.589563369750977, "global_step": 494552, "epoch": 5958} {"train_loss": -27.677534103393555, "global_step": 494553, "epoch": 5958} {"train_loss": -27.676319122314453, "global_step": 494554, "epoch": 5958} {"train_loss": -27.444324493408203, "global_step": 494555, "epoch": 5958} {"train_loss": -27.417118072509766, "global_step": 494556, "epoch": 5958} {"train_loss": -27.430097579956055, "global_step": 494557, "epoch": 5958} {"train_loss": -27.115087509155273, "global_step": 494558, "epoch": 5958} {"train_loss": -27.68153953552246, "global_step": 494559, "epoch": 5958} {"train_loss": -27.38217544555664, "global_step": 494560, "epoch": 5958} {"train_loss": -27.408084869384766, "global_step": 494561, "epoch": 5958} {"train_loss": -27.38702392578125, "global_step": 494562, "epoch": 5958} {"train_loss": -27.552902221679688, "global_step": 494563, "epoch": 5958} {"train_loss": -27.423547744750977, "global_step": 494564, "epoch": 5958} {"train_loss": -27.327667236328125, "global_step": 494565, "epoch": 5958} {"train_loss": -26.986936569213867, "global_step": 494566, "epoch": 5958} {"train_loss": -27.19468116760254, "global_step": 494567, "epoch": 5958} {"train_loss": -27.359487533569336, "global_step": 494568, "epoch": 5958} {"train_loss": -27.584197998046875, "global_step": 494569, "epoch": 5958} {"train_loss": -27.538043975830078, "global_step": 494570, "epoch": 5958} {"train_loss": -27.237060546875, "global_step": 494571, "epoch": 5958} {"train_loss": -27.1450252532959, "global_step": 494572, "epoch": 5958} {"train_loss": -27.415149688720703, "global_step": 494573, "epoch": 5958} {"train_loss": -27.158395767211914, "global_step": 494574, "epoch": 5958} {"train_loss": -27.506134033203125, "global_step": 494575, "epoch": 5958} {"train_loss": -27.34933853149414, "global_step": 494576, "epoch": 5958} {"train_loss": -27.760852813720703, "global_step": 494577, "epoch": 5958} {"train_loss": -27.306928634643555, "global_step": 494578, "epoch": 5958} {"train_loss": -27.20448112487793, "global_step": 494579, "epoch": 5958} {"train_loss": -27.1000919342041, "global_step": 494580, "epoch": 5958} {"train_loss": -27.24445152282715, "global_step": 494581, "epoch": 5958} {"train_loss": -27.260135650634766, "global_step": 494582, "epoch": 5958} {"train_loss": -26.902435302734375, "global_step": 494583, "epoch": 5958} {"train_loss": -27.663244247436523, "global_step": 494584, "epoch": 5958} {"train_loss": -27.22356605529785, "global_step": 494585, "epoch": 5958} {"train_loss": -27.248647689819336, "global_step": 494586, "epoch": 5958} {"train_loss": -27.33746337890625, "global_step": 494587, "epoch": 5958} {"train_loss": -27.480615615844727, "global_step": 494588, "epoch": 5958} {"train_loss": -27.51844596862793, "global_step": 494589, "epoch": 5958} {"train_loss": -27.535125732421875, "global_step": 494590, "epoch": 5958} {"train_loss": -27.16609001159668, "global_step": 494591, "epoch": 5958} {"train_loss": -27.032995223999023, "global_step": 494592, "epoch": 5958} {"train_loss": -27.42890739440918, "global_step": 494593, "epoch": 5958} {"train_loss": -27.772367477416992, "global_step": 494594, "epoch": 5958} {"train_loss": -27.600788116455078, "global_step": 494595, "epoch": 5958} {"train_loss": -27.294007060039473, "global_step": 494596, "epoch": 5958, "val_loss": 6488796.0} {"train_loss": -26.530120849609375, "global_step": 494597, "epoch": 5959} {"train_loss": -26.1958065032959, "global_step": 494598, "epoch": 5959} {"train_loss": -26.593536376953125, "global_step": 494599, "epoch": 5959} {"train_loss": -26.834592819213867, "global_step": 494600, "epoch": 5959} {"train_loss": -26.626001358032227, "global_step": 494601, "epoch": 5959} {"train_loss": -26.776647567749023, "global_step": 494602, "epoch": 5959} {"train_loss": -26.954349517822266, "global_step": 494603, "epoch": 5959} {"train_loss": -27.000350952148438, "global_step": 494604, "epoch": 5959} {"train_loss": -26.879352569580078, "global_step": 494605, "epoch": 5959} {"train_loss": -26.801849365234375, "global_step": 494606, "epoch": 5959} {"train_loss": -27.168140411376953, "global_step": 494607, "epoch": 5959} {"train_loss": -26.754444122314453, "global_step": 494608, "epoch": 5959} {"train_loss": -27.171903610229492, "global_step": 494609, "epoch": 5959} {"train_loss": -26.937902450561523, "global_step": 494610, "epoch": 5959} {"train_loss": -27.18953514099121, "global_step": 494611, "epoch": 5959} {"train_loss": -26.38239860534668, "global_step": 494612, "epoch": 5959} {"train_loss": -26.827966690063477, "global_step": 494613, "epoch": 5959} {"train_loss": -27.027847290039062, "global_step": 494614, "epoch": 5959} {"train_loss": -26.893091201782227, "global_step": 494615, "epoch": 5959} {"train_loss": -26.97981834411621, "global_step": 494616, "epoch": 5959} {"train_loss": -27.512250900268555, "global_step": 494617, "epoch": 5959} {"train_loss": -27.402151107788086, "global_step": 494618, "epoch": 5959} {"train_loss": -26.870275497436523, "global_step": 494619, "epoch": 5959} {"train_loss": -27.007055282592773, "global_step": 494620, "epoch": 5959} {"train_loss": -27.15582275390625, "global_step": 494621, "epoch": 5959} {"train_loss": -26.894559860229492, "global_step": 494622, "epoch": 5959} {"train_loss": -27.212507247924805, "global_step": 494623, "epoch": 5959} {"train_loss": -27.550067901611328, "global_step": 494624, "epoch": 5959} {"train_loss": -26.97784423828125, "global_step": 494625, "epoch": 5959} {"train_loss": -27.328205108642578, "global_step": 494626, "epoch": 5959} {"train_loss": -27.260400772094727, "global_step": 494627, "epoch": 5959} {"train_loss": -27.302404403686523, "global_step": 494628, "epoch": 5959} {"train_loss": -27.701709747314453, "global_step": 494629, "epoch": 5959} {"train_loss": -27.23736000061035, "global_step": 494630, "epoch": 5959} {"train_loss": -27.41554069519043, "global_step": 494631, "epoch": 5959} {"train_loss": -27.6243839263916, "global_step": 494632, "epoch": 5959} {"train_loss": -27.481088638305664, "global_step": 494633, "epoch": 5959} {"train_loss": -27.541122436523438, "global_step": 494634, "epoch": 5959} {"train_loss": -27.490589141845703, "global_step": 494635, "epoch": 5959} {"train_loss": -27.341419219970703, "global_step": 494636, "epoch": 5959} {"train_loss": -27.75787925720215, "global_step": 494637, "epoch": 5959} {"train_loss": -27.49928855895996, "global_step": 494638, "epoch": 5959} {"train_loss": -27.309722900390625, "global_step": 494639, "epoch": 5959} {"train_loss": -27.41714859008789, "global_step": 494640, "epoch": 5959} {"train_loss": -27.617706298828125, "global_step": 494641, "epoch": 5959} {"train_loss": -27.65378189086914, "global_step": 494642, "epoch": 5959} {"train_loss": -27.5233211517334, "global_step": 494643, "epoch": 5959} {"train_loss": -27.450239181518555, "global_step": 494644, "epoch": 5959} {"train_loss": -27.305164337158203, "global_step": 494645, "epoch": 5959} {"train_loss": -27.507062911987305, "global_step": 494646, "epoch": 5959} {"train_loss": -27.480453491210938, "global_step": 494647, "epoch": 5959} {"train_loss": -27.332782745361328, "global_step": 494648, "epoch": 5959} {"train_loss": -27.08487319946289, "global_step": 494649, "epoch": 5959} {"train_loss": -27.010007858276367, "global_step": 494650, "epoch": 5959} {"train_loss": -26.869464874267578, "global_step": 494651, "epoch": 5959} {"train_loss": -27.59765625, "global_step": 494652, "epoch": 5959} {"train_loss": -27.517988204956055, "global_step": 494653, "epoch": 5959} {"train_loss": -27.337793350219727, "global_step": 494654, "epoch": 5959} {"train_loss": -27.133655548095703, "global_step": 494655, "epoch": 5959} {"train_loss": -27.567432403564453, "global_step": 494656, "epoch": 5959} {"train_loss": -27.33851432800293, "global_step": 494657, "epoch": 5959} {"train_loss": -27.722700119018555, "global_step": 494658, "epoch": 5959} {"train_loss": -27.342437744140625, "global_step": 494659, "epoch": 5959} {"train_loss": -27.573291778564453, "global_step": 494660, "epoch": 5959} {"train_loss": -27.5355281829834, "global_step": 494661, "epoch": 5959} {"train_loss": -27.95686912536621, "global_step": 494662, "epoch": 5959} {"train_loss": -27.091459274291992, "global_step": 494663, "epoch": 5959} {"train_loss": -27.22342872619629, "global_step": 494664, "epoch": 5959} {"train_loss": -27.16008949279785, "global_step": 494665, "epoch": 5959} {"train_loss": -27.28826332092285, "global_step": 494666, "epoch": 5959} {"train_loss": -27.351850509643555, "global_step": 494667, "epoch": 5959} {"train_loss": -27.521299362182617, "global_step": 494668, "epoch": 5959} {"train_loss": -27.753253936767578, "global_step": 494669, "epoch": 5959} {"train_loss": -27.743555068969727, "global_step": 494670, "epoch": 5959} {"train_loss": -27.60907554626465, "global_step": 494671, "epoch": 5959} {"train_loss": -27.316526412963867, "global_step": 494672, "epoch": 5959} {"train_loss": -27.4608211517334, "global_step": 494673, "epoch": 5959} {"train_loss": -27.27020263671875, "global_step": 494674, "epoch": 5959} {"train_loss": -27.304162979125977, "global_step": 494675, "epoch": 5959} {"train_loss": -27.751953125, "global_step": 494676, "epoch": 5959} {"train_loss": -27.32147789001465, "global_step": 494677, "epoch": 5959} {"train_loss": -27.412063598632812, "global_step": 494678, "epoch": 5959} {"train_loss": -27.252583676073925, "global_step": 494679, "epoch": 5959, "val_loss": 6523820.0} {"train_loss": -26.6143798828125, "global_step": 494680, "epoch": 5960} {"train_loss": -25.92340660095215, "global_step": 494681, "epoch": 5960} {"train_loss": -26.2663631439209, "global_step": 494682, "epoch": 5960} {"train_loss": -27.055479049682617, "global_step": 494683, "epoch": 5960} {"train_loss": -26.71083641052246, "global_step": 494684, "epoch": 5960} {"train_loss": -27.068653106689453, "global_step": 494685, "epoch": 5960} {"train_loss": -26.97413444519043, "global_step": 494686, "epoch": 5960} {"train_loss": -26.9869441986084, "global_step": 494687, "epoch": 5960} {"train_loss": -26.847747802734375, "global_step": 494688, "epoch": 5960} {"train_loss": -26.981184005737305, "global_step": 494689, "epoch": 5960} {"train_loss": -26.9882869720459, "global_step": 494690, "epoch": 5960} {"train_loss": -26.884695053100586, "global_step": 494691, "epoch": 5960} {"train_loss": -27.284177780151367, "global_step": 494692, "epoch": 5960} {"train_loss": -27.14180564880371, "global_step": 494693, "epoch": 5960} {"train_loss": -27.042755126953125, "global_step": 494694, "epoch": 5960} {"train_loss": -27.364282608032227, "global_step": 494695, "epoch": 5960} {"train_loss": -26.819049835205078, "global_step": 494696, "epoch": 5960} {"train_loss": -27.15162467956543, "global_step": 494697, "epoch": 5960} {"train_loss": -26.647214889526367, "global_step": 494698, "epoch": 5960} {"train_loss": -27.178823471069336, "global_step": 494699, "epoch": 5960} {"train_loss": -27.23003578186035, "global_step": 494700, "epoch": 5960} {"train_loss": -27.02392578125, "global_step": 494701, "epoch": 5960} {"train_loss": -27.27493667602539, "global_step": 494702, "epoch": 5960} {"train_loss": -27.071943283081055, "global_step": 494703, "epoch": 5960} {"train_loss": -27.520919799804688, "global_step": 494704, "epoch": 5960} {"train_loss": -27.02947998046875, "global_step": 494705, "epoch": 5960} {"train_loss": -27.241926193237305, "global_step": 494706, "epoch": 5960} {"train_loss": -27.1525936126709, "global_step": 494707, "epoch": 5960} {"train_loss": -26.78106689453125, "global_step": 494708, "epoch": 5960} {"train_loss": -27.184436798095703, "global_step": 494709, "epoch": 5960} {"train_loss": -27.310306549072266, "global_step": 494710, "epoch": 5960} {"train_loss": -27.2574520111084, "global_step": 494711, "epoch": 5960} {"train_loss": -27.356891632080078, "global_step": 494712, "epoch": 5960} {"train_loss": -27.218603134155273, "global_step": 494713, "epoch": 5960} {"train_loss": -27.291950225830078, "global_step": 494714, "epoch": 5960} {"train_loss": -27.498554229736328, "global_step": 494715, "epoch": 5960} {"train_loss": -27.274274826049805, "global_step": 494716, "epoch": 5960} {"train_loss": -27.343896865844727, "global_step": 494717, "epoch": 5960} {"train_loss": -27.49390983581543, "global_step": 494718, "epoch": 5960} {"train_loss": -27.65242576599121, "global_step": 494719, "epoch": 5960} {"train_loss": -26.773075103759766, "global_step": 494720, "epoch": 5960} {"train_loss": -26.937713623046875, "global_step": 494721, "epoch": 5960} {"train_loss": -27.442535400390625, "global_step": 494722, "epoch": 5960} {"train_loss": -27.17462730407715, "global_step": 494723, "epoch": 5960} {"train_loss": -27.32193374633789, "global_step": 494724, "epoch": 5960} {"train_loss": -27.455408096313477, "global_step": 494725, "epoch": 5960} {"train_loss": -27.582122802734375, "global_step": 494726, "epoch": 5960} {"train_loss": -27.5295352935791, "global_step": 494727, "epoch": 5960} {"train_loss": -27.24676513671875, "global_step": 494728, "epoch": 5960} {"train_loss": -27.55027198791504, "global_step": 494729, "epoch": 5960} {"train_loss": -27.562641143798828, "global_step": 494730, "epoch": 5960} {"train_loss": -27.524076461791992, "global_step": 494731, "epoch": 5960} {"train_loss": -27.717573165893555, "global_step": 494732, "epoch": 5960} {"train_loss": -27.364490509033203, "global_step": 494733, "epoch": 5960} {"train_loss": -27.654016494750977, "global_step": 494734, "epoch": 5960} {"train_loss": -27.28104591369629, "global_step": 494735, "epoch": 5960} {"train_loss": -27.42302894592285, "global_step": 494736, "epoch": 5960} {"train_loss": -27.397268295288086, "global_step": 494737, "epoch": 5960} {"train_loss": -27.233198165893555, "global_step": 494738, "epoch": 5960} {"train_loss": -27.570098876953125, "global_step": 494739, "epoch": 5960} {"train_loss": -27.46927833557129, "global_step": 494740, "epoch": 5960} {"train_loss": -27.4941463470459, "global_step": 494741, "epoch": 5960} {"train_loss": -27.794187545776367, "global_step": 494742, "epoch": 5960} {"train_loss": -27.68903923034668, "global_step": 494743, "epoch": 5960} {"train_loss": -27.205408096313477, "global_step": 494744, "epoch": 5960} {"train_loss": -27.130590438842773, "global_step": 494745, "epoch": 5960} {"train_loss": -26.229511260986328, "global_step": 494746, "epoch": 5960} {"train_loss": -25.407739639282227, "global_step": 494747, "epoch": 5960} {"train_loss": -26.167200088500977, "global_step": 494748, "epoch": 5960} {"train_loss": -27.02994728088379, "global_step": 494749, "epoch": 5960} {"train_loss": -26.491662979125977, "global_step": 494750, "epoch": 5960} {"train_loss": -27.33088493347168, "global_step": 494751, "epoch": 5960} {"train_loss": -26.652496337890625, "global_step": 494752, "epoch": 5960} {"train_loss": -27.1021785736084, "global_step": 494753, "epoch": 5960} {"train_loss": -26.94716453552246, "global_step": 494754, "epoch": 5960} {"train_loss": -27.26690673828125, "global_step": 494755, "epoch": 5960} {"train_loss": -27.142919540405273, "global_step": 494756, "epoch": 5960} {"train_loss": -26.898639678955078, "global_step": 494757, "epoch": 5960} {"train_loss": -27.7580623626709, "global_step": 494758, "epoch": 5960} {"train_loss": -26.644662857055664, "global_step": 494759, "epoch": 5960} {"train_loss": -27.21595573425293, "global_step": 494760, "epoch": 5960} {"train_loss": -27.553653717041016, "global_step": 494761, "epoch": 5960} {"train_loss": -27.138362792601068, "global_step": 494762, "epoch": 5960, "val_loss": 6478945.0} {"train_loss": -27.056867599487305, "global_step": 494763, "epoch": 5961} {"train_loss": -26.926855087280273, "global_step": 494764, "epoch": 5961} {"train_loss": -27.018085479736328, "global_step": 494765, "epoch": 5961} {"train_loss": -26.783349990844727, "global_step": 494766, "epoch": 5961} {"train_loss": -26.60761833190918, "global_step": 494767, "epoch": 5961} {"train_loss": -27.134565353393555, "global_step": 494768, "epoch": 5961} {"train_loss": -26.65070915222168, "global_step": 494769, "epoch": 5961} {"train_loss": -27.24741554260254, "global_step": 494770, "epoch": 5961} {"train_loss": -27.33698081970215, "global_step": 494771, "epoch": 5961} {"train_loss": -27.069623947143555, "global_step": 494772, "epoch": 5961} {"train_loss": -26.964282989501953, "global_step": 494773, "epoch": 5961} {"train_loss": -27.078283309936523, "global_step": 494774, "epoch": 5961} {"train_loss": -27.202051162719727, "global_step": 494775, "epoch": 5961} {"train_loss": -26.961673736572266, "global_step": 494776, "epoch": 5961} {"train_loss": -27.02859878540039, "global_step": 494777, "epoch": 5961} {"train_loss": -26.473169326782227, "global_step": 494778, "epoch": 5961} {"train_loss": -27.212438583374023, "global_step": 494779, "epoch": 5961} {"train_loss": -27.447845458984375, "global_step": 494780, "epoch": 5961} {"train_loss": -27.05438804626465, "global_step": 494781, "epoch": 5961} {"train_loss": -26.794103622436523, "global_step": 494782, "epoch": 5961} {"train_loss": -27.15673828125, "global_step": 494783, "epoch": 5961} {"train_loss": -26.953577041625977, "global_step": 494784, "epoch": 5961} {"train_loss": -26.78486442565918, "global_step": 494785, "epoch": 5961} {"train_loss": -27.38191032409668, "global_step": 494786, "epoch": 5961} {"train_loss": -27.576322555541992, "global_step": 494787, "epoch": 5961} {"train_loss": -27.20635986328125, "global_step": 494788, "epoch": 5961} {"train_loss": -27.676183700561523, "global_step": 494789, "epoch": 5961} {"train_loss": -27.252460479736328, "global_step": 494790, "epoch": 5961} {"train_loss": -27.380502700805664, "global_step": 494791, "epoch": 5961} {"train_loss": -27.54974365234375, "global_step": 494792, "epoch": 5961} {"train_loss": -27.622817993164062, "global_step": 494793, "epoch": 5961} {"train_loss": -27.65011978149414, "global_step": 494794, "epoch": 5961} {"train_loss": -27.524030685424805, "global_step": 494795, "epoch": 5961} {"train_loss": -27.574588775634766, "global_step": 494796, "epoch": 5961} {"train_loss": -27.599761962890625, "global_step": 494797, "epoch": 5961} {"train_loss": -27.37981605529785, "global_step": 494798, "epoch": 5961} {"train_loss": -27.597503662109375, "global_step": 494799, "epoch": 5961} {"train_loss": -27.32406997680664, "global_step": 494800, "epoch": 5961} {"train_loss": -27.396686553955078, "global_step": 494801, "epoch": 5961} {"train_loss": -27.336057662963867, "global_step": 494802, "epoch": 5961} {"train_loss": -27.33172607421875, "global_step": 494803, "epoch": 5961} {"train_loss": -27.75477409362793, "global_step": 494804, "epoch": 5961} {"train_loss": -27.685739517211914, "global_step": 494805, "epoch": 5961} {"train_loss": -27.68818473815918, "global_step": 494806, "epoch": 5961} {"train_loss": -27.450592041015625, "global_step": 494807, "epoch": 5961} {"train_loss": -27.989349365234375, "global_step": 494808, "epoch": 5961} {"train_loss": -27.593341827392578, "global_step": 494809, "epoch": 5961} {"train_loss": -27.352930068969727, "global_step": 494810, "epoch": 5961} {"train_loss": -27.350866317749023, "global_step": 494811, "epoch": 5961} {"train_loss": -26.77740478515625, "global_step": 494812, "epoch": 5961} {"train_loss": -27.540241241455078, "global_step": 494813, "epoch": 5961} {"train_loss": -27.08066749572754, "global_step": 494814, "epoch": 5961} {"train_loss": -27.2353515625, "global_step": 494815, "epoch": 5961} {"train_loss": -27.69060707092285, "global_step": 494816, "epoch": 5961} {"train_loss": -27.483428955078125, "global_step": 494817, "epoch": 5961} {"train_loss": -27.438276290893555, "global_step": 494818, "epoch": 5961} {"train_loss": -27.03435707092285, "global_step": 494819, "epoch": 5961} {"train_loss": -27.556058883666992, "global_step": 494820, "epoch": 5961} {"train_loss": -27.248600006103516, "global_step": 494821, "epoch": 5961} {"train_loss": -27.237958908081055, "global_step": 494822, "epoch": 5961} {"train_loss": -27.445642471313477, "global_step": 494823, "epoch": 5961} {"train_loss": -27.226852416992188, "global_step": 494824, "epoch": 5961} {"train_loss": -27.306333541870117, "global_step": 494825, "epoch": 5961} {"train_loss": -26.418909072875977, "global_step": 494826, "epoch": 5961} {"train_loss": -26.83509635925293, "global_step": 494827, "epoch": 5961} {"train_loss": -26.947345733642578, "global_step": 494828, "epoch": 5961} {"train_loss": -26.981725692749023, "global_step": 494829, "epoch": 5961} {"train_loss": -26.626935958862305, "global_step": 494830, "epoch": 5961} {"train_loss": -27.084674835205078, "global_step": 494831, "epoch": 5961} {"train_loss": -26.883575439453125, "global_step": 494832, "epoch": 5961} {"train_loss": -27.108875274658203, "global_step": 494833, "epoch": 5961} {"train_loss": -26.732702255249023, "global_step": 494834, "epoch": 5961} {"train_loss": -27.029022216796875, "global_step": 494835, "epoch": 5961} {"train_loss": -26.64259147644043, "global_step": 494836, "epoch": 5961} {"train_loss": -26.5723819732666, "global_step": 494837, "epoch": 5961} {"train_loss": -26.386749267578125, "global_step": 494838, "epoch": 5961} {"train_loss": -26.810138702392578, "global_step": 494839, "epoch": 5961} {"train_loss": -26.898178100585938, "global_step": 494840, "epoch": 5961} {"train_loss": -26.692005157470703, "global_step": 494841, "epoch": 5961} {"train_loss": -26.89374351501465, "global_step": 494842, "epoch": 5961} {"train_loss": -27.30963706970215, "global_step": 494843, "epoch": 5961} {"train_loss": -26.765806198120117, "global_step": 494844, "epoch": 5961} {"train_loss": -27.197235521063746, "global_step": 494845, "epoch": 5961, "val_loss": 6469882.5} {"train_loss": -26.246841430664062, "global_step": 494846, "epoch": 5962} {"train_loss": -27.087848663330078, "global_step": 494847, "epoch": 5962} {"train_loss": -26.64552879333496, "global_step": 494848, "epoch": 5962} {"train_loss": -26.65162467956543, "global_step": 494849, "epoch": 5962} {"train_loss": -26.484731674194336, "global_step": 494850, "epoch": 5962} {"train_loss": -26.528608322143555, "global_step": 494851, "epoch": 5962} {"train_loss": -26.655887603759766, "global_step": 494852, "epoch": 5962} {"train_loss": -26.926239013671875, "global_step": 494853, "epoch": 5962} {"train_loss": -26.64997673034668, "global_step": 494854, "epoch": 5962} {"train_loss": -26.556903839111328, "global_step": 494855, "epoch": 5962} {"train_loss": -27.366865158081055, "global_step": 494856, "epoch": 5962} {"train_loss": -26.581296920776367, "global_step": 494857, "epoch": 5962} {"train_loss": -26.8248291015625, "global_step": 494858, "epoch": 5962} {"train_loss": -27.268020629882812, "global_step": 494859, "epoch": 5962} {"train_loss": -27.126953125, "global_step": 494860, "epoch": 5962} {"train_loss": -27.192285537719727, "global_step": 494861, "epoch": 5962} {"train_loss": -26.810718536376953, "global_step": 494862, "epoch": 5962} {"train_loss": -27.147602081298828, "global_step": 494863, "epoch": 5962} {"train_loss": -27.397489547729492, "global_step": 494864, "epoch": 5962} {"train_loss": -27.0459041595459, "global_step": 494865, "epoch": 5962} {"train_loss": -26.95362663269043, "global_step": 494866, "epoch": 5962} {"train_loss": -27.310461044311523, "global_step": 494867, "epoch": 5962} {"train_loss": -27.333465576171875, "global_step": 494868, "epoch": 5962} {"train_loss": -27.145288467407227, "global_step": 494869, "epoch": 5962} {"train_loss": -27.055328369140625, "global_step": 494870, "epoch": 5962} {"train_loss": -26.925256729125977, "global_step": 494871, "epoch": 5962} {"train_loss": -27.378843307495117, "global_step": 494872, "epoch": 5962} {"train_loss": -27.163434982299805, "global_step": 494873, "epoch": 5962} {"train_loss": -27.657306671142578, "global_step": 494874, "epoch": 5962} {"train_loss": -27.305700302124023, "global_step": 494875, "epoch": 5962} {"train_loss": -26.761402130126953, "global_step": 494876, "epoch": 5962} {"train_loss": -27.194766998291016, "global_step": 494877, "epoch": 5962} {"train_loss": -27.238523483276367, "global_step": 494878, "epoch": 5962} {"train_loss": -27.452686309814453, "global_step": 494879, "epoch": 5962} {"train_loss": -27.442846298217773, "global_step": 494880, "epoch": 5962} {"train_loss": -27.31873893737793, "global_step": 494881, "epoch": 5962} {"train_loss": -27.425811767578125, "global_step": 494882, "epoch": 5962} {"train_loss": -27.24151611328125, "global_step": 494883, "epoch": 5962} {"train_loss": -27.349836349487305, "global_step": 494884, "epoch": 5962} {"train_loss": -27.385663986206055, "global_step": 494885, "epoch": 5962} {"train_loss": -27.043609619140625, "global_step": 494886, "epoch": 5962} {"train_loss": -27.474746704101562, "global_step": 494887, "epoch": 5962} {"train_loss": -27.36345863342285, "global_step": 494888, "epoch": 5962} {"train_loss": -27.581212997436523, "global_step": 494889, "epoch": 5962} {"train_loss": -27.554306030273438, "global_step": 494890, "epoch": 5962} {"train_loss": -27.256580352783203, "global_step": 494891, "epoch": 5962} {"train_loss": -27.646881103515625, "global_step": 494892, "epoch": 5962} {"train_loss": -27.577489852905273, "global_step": 494893, "epoch": 5962} {"train_loss": -27.302099227905273, "global_step": 494894, "epoch": 5962} {"train_loss": -27.333755493164062, "global_step": 494895, "epoch": 5962} {"train_loss": -27.322961807250977, "global_step": 494896, "epoch": 5962} {"train_loss": -27.450002670288086, "global_step": 494897, "epoch": 5962} {"train_loss": -27.4534854888916, "global_step": 494898, "epoch": 5962} {"train_loss": -27.580596923828125, "global_step": 494899, "epoch": 5962} {"train_loss": -27.430770874023438, "global_step": 494900, "epoch": 5962} {"train_loss": -27.57913589477539, "global_step": 494901, "epoch": 5962} {"train_loss": -27.306671142578125, "global_step": 494902, "epoch": 5962} {"train_loss": -27.74635887145996, "global_step": 494903, "epoch": 5962} {"train_loss": -27.654584884643555, "global_step": 494904, "epoch": 5962} {"train_loss": -27.249011993408203, "global_step": 494905, "epoch": 5962} {"train_loss": -27.346515655517578, "global_step": 494906, "epoch": 5962} {"train_loss": -26.997634887695312, "global_step": 494907, "epoch": 5962} {"train_loss": -27.326465606689453, "global_step": 494908, "epoch": 5962} {"train_loss": -27.289386749267578, "global_step": 494909, "epoch": 5962} {"train_loss": -27.58321189880371, "global_step": 494910, "epoch": 5962} {"train_loss": -27.03826332092285, "global_step": 494911, "epoch": 5962} {"train_loss": -27.236310958862305, "global_step": 494912, "epoch": 5962} {"train_loss": -27.54682731628418, "global_step": 494913, "epoch": 5962} {"train_loss": -27.427600860595703, "global_step": 494914, "epoch": 5962} {"train_loss": -27.326953887939453, "global_step": 494915, "epoch": 5962} {"train_loss": -27.417724609375, "global_step": 494916, "epoch": 5962} {"train_loss": -27.2703857421875, "global_step": 494917, "epoch": 5962} {"train_loss": -27.46625328063965, "global_step": 494918, "epoch": 5962} {"train_loss": -27.80975341796875, "global_step": 494919, "epoch": 5962} {"train_loss": -27.491352081298828, "global_step": 494920, "epoch": 5962} {"train_loss": -27.084665298461914, "global_step": 494921, "epoch": 5962} {"train_loss": -27.246824264526367, "global_step": 494922, "epoch": 5962} {"train_loss": -27.42795753479004, "global_step": 494923, "epoch": 5962} {"train_loss": -27.18417739868164, "global_step": 494924, "epoch": 5962} {"train_loss": -27.107023239135742, "global_step": 494925, "epoch": 5962} {"train_loss": -27.396808624267578, "global_step": 494926, "epoch": 5962} {"train_loss": -27.3171443939209, "global_step": 494927, "epoch": 5962} {"train_loss": -27.232224981468843, "global_step": 494928, "epoch": 5962, "val_loss": 6465258.0} {"train_loss": -26.605382919311523, "global_step": 494929, "epoch": 5963} {"train_loss": -26.283315658569336, "global_step": 494930, "epoch": 5963} {"train_loss": -26.243152618408203, "global_step": 494931, "epoch": 5963} {"train_loss": -26.481555938720703, "global_step": 494932, "epoch": 5963} {"train_loss": -26.746566772460938, "global_step": 494933, "epoch": 5963} {"train_loss": -26.46907615661621, "global_step": 494934, "epoch": 5963} {"train_loss": -26.416913986206055, "global_step": 494935, "epoch": 5963} {"train_loss": -26.734655380249023, "global_step": 494936, "epoch": 5963} {"train_loss": -26.659473419189453, "global_step": 494937, "epoch": 5963} {"train_loss": -26.633590698242188, "global_step": 494938, "epoch": 5963} {"train_loss": -26.955251693725586, "global_step": 494939, "epoch": 5963} {"train_loss": -26.91486930847168, "global_step": 494940, "epoch": 5963} {"train_loss": -26.755950927734375, "global_step": 494941, "epoch": 5963} {"train_loss": -26.958036422729492, "global_step": 494942, "epoch": 5963} {"train_loss": -26.627023696899414, "global_step": 494943, "epoch": 5963} {"train_loss": -27.103113174438477, "global_step": 494944, "epoch": 5963} {"train_loss": -26.53554344177246, "global_step": 494945, "epoch": 5963} {"train_loss": -26.707990646362305, "global_step": 494946, "epoch": 5963} {"train_loss": -27.262292861938477, "global_step": 494947, "epoch": 5963} {"train_loss": -27.207706451416016, "global_step": 494948, "epoch": 5963} {"train_loss": -26.86628532409668, "global_step": 494949, "epoch": 5963} {"train_loss": -27.425275802612305, "global_step": 494950, "epoch": 5963} {"train_loss": -27.080663681030273, "global_step": 494951, "epoch": 5963} {"train_loss": -27.297473907470703, "global_step": 494952, "epoch": 5963} {"train_loss": -27.22088050842285, "global_step": 494953, "epoch": 5963} {"train_loss": -27.0043888092041, "global_step": 494954, "epoch": 5963} {"train_loss": -27.539167404174805, "global_step": 494955, "epoch": 5963} {"train_loss": -27.47846794128418, "global_step": 494956, "epoch": 5963} {"train_loss": -27.218053817749023, "global_step": 494957, "epoch": 5963} {"train_loss": -27.367053985595703, "global_step": 494958, "epoch": 5963} {"train_loss": -26.85336685180664, "global_step": 494959, "epoch": 5963} {"train_loss": -27.49603843688965, "global_step": 494960, "epoch": 5963} {"train_loss": -27.3934268951416, "global_step": 494961, "epoch": 5963} {"train_loss": -27.42764663696289, "global_step": 494962, "epoch": 5963} {"train_loss": -27.216129302978516, "global_step": 494963, "epoch": 5963} {"train_loss": -27.352197647094727, "global_step": 494964, "epoch": 5963} {"train_loss": -27.567846298217773, "global_step": 494965, "epoch": 5963} {"train_loss": -27.387842178344727, "global_step": 494966, "epoch": 5963} {"train_loss": -27.308979034423828, "global_step": 494967, "epoch": 5963} {"train_loss": -27.89291763305664, "global_step": 494968, "epoch": 5963} {"train_loss": -27.35498046875, "global_step": 494969, "epoch": 5963} {"train_loss": -27.38599967956543, "global_step": 494970, "epoch": 5963} {"train_loss": -27.74629020690918, "global_step": 494971, "epoch": 5963} {"train_loss": -27.171798706054688, "global_step": 494972, "epoch": 5963} {"train_loss": -27.291946411132812, "global_step": 494973, "epoch": 5963} {"train_loss": -27.45490074157715, "global_step": 494974, "epoch": 5963} {"train_loss": -27.619110107421875, "global_step": 494975, "epoch": 5963} {"train_loss": -27.519683837890625, "global_step": 494976, "epoch": 5963} {"train_loss": -27.91413688659668, "global_step": 494977, "epoch": 5963} {"train_loss": -27.4639835357666, "global_step": 494978, "epoch": 5963} {"train_loss": -27.49190330505371, "global_step": 494979, "epoch": 5963} {"train_loss": -27.49277114868164, "global_step": 494980, "epoch": 5963} {"train_loss": -27.50018882751465, "global_step": 494981, "epoch": 5963} {"train_loss": -27.12973403930664, "global_step": 494982, "epoch": 5963} {"train_loss": -27.112442016601562, "global_step": 494983, "epoch": 5963} {"train_loss": -27.287378311157227, "global_step": 494984, "epoch": 5963} {"train_loss": -27.608367919921875, "global_step": 494985, "epoch": 5963} {"train_loss": -27.376117706298828, "global_step": 494986, "epoch": 5963} {"train_loss": -27.156208038330078, "global_step": 494987, "epoch": 5963} {"train_loss": -27.7269287109375, "global_step": 494988, "epoch": 5963} {"train_loss": -27.817968368530273, "global_step": 494989, "epoch": 5963} {"train_loss": -27.19312858581543, "global_step": 494990, "epoch": 5963} {"train_loss": -27.26788330078125, "global_step": 494991, "epoch": 5963} {"train_loss": -27.075864791870117, "global_step": 494992, "epoch": 5963} {"train_loss": -27.1637020111084, "global_step": 494993, "epoch": 5963} {"train_loss": -27.102691650390625, "global_step": 494994, "epoch": 5963} {"train_loss": -26.79975700378418, "global_step": 494995, "epoch": 5963} {"train_loss": -27.059911727905273, "global_step": 494996, "epoch": 5963} {"train_loss": -26.763904571533203, "global_step": 494997, "epoch": 5963} {"train_loss": -27.005346298217773, "global_step": 494998, "epoch": 5963} {"train_loss": -26.981393814086914, "global_step": 494999, "epoch": 5963} {"train_loss": -27.22669792175293, "global_step": 495000, "epoch": 5963} {"train_loss": -27.153234481811523, "global_step": 495001, "epoch": 5963} {"train_loss": -26.972700119018555, "global_step": 495002, "epoch": 5963} {"train_loss": -27.1934814453125, "global_step": 495003, "epoch": 5963} {"train_loss": -27.458829879760742, "global_step": 495004, "epoch": 5963} {"train_loss": -27.420286178588867, "global_step": 495005, "epoch": 5963} {"train_loss": -27.0524959564209, "global_step": 495006, "epoch": 5963} {"train_loss": -27.27651023864746, "global_step": 495007, "epoch": 5963} {"train_loss": -27.296201705932617, "global_step": 495008, "epoch": 5963} {"train_loss": -27.194868087768555, "global_step": 495009, "epoch": 5963} {"train_loss": -27.498441696166992, "global_step": 495010, "epoch": 5963} {"train_loss": -27.17261688967785, "global_step": 495011, "epoch": 5963, "val_loss": 6480036.5} {"train_loss": -26.872055053710938, "global_step": 495012, "epoch": 5964} {"train_loss": -26.842798233032227, "global_step": 495013, "epoch": 5964} {"train_loss": -26.570087432861328, "global_step": 495014, "epoch": 5964} {"train_loss": -27.039045333862305, "global_step": 495015, "epoch": 5964} {"train_loss": -26.758466720581055, "global_step": 495016, "epoch": 5964} {"train_loss": -26.727508544921875, "global_step": 495017, "epoch": 5964} {"train_loss": -26.990564346313477, "global_step": 495018, "epoch": 5964} {"train_loss": -26.566877365112305, "global_step": 495019, "epoch": 5964} {"train_loss": -26.533117294311523, "global_step": 495020, "epoch": 5964} {"train_loss": -27.035236358642578, "global_step": 495021, "epoch": 5964} {"train_loss": -26.686359405517578, "global_step": 495022, "epoch": 5964} {"train_loss": -27.000253677368164, "global_step": 495023, "epoch": 5964} {"train_loss": -26.795217514038086, "global_step": 495024, "epoch": 5964} {"train_loss": -26.70005226135254, "global_step": 495025, "epoch": 5964} {"train_loss": -27.1919002532959, "global_step": 495026, "epoch": 5964} {"train_loss": -27.001440048217773, "global_step": 495027, "epoch": 5964} {"train_loss": -26.84685707092285, "global_step": 495028, "epoch": 5964} {"train_loss": -27.092533111572266, "global_step": 495029, "epoch": 5964} {"train_loss": -27.02994728088379, "global_step": 495030, "epoch": 5964} {"train_loss": -27.2343807220459, "global_step": 495031, "epoch": 5964} {"train_loss": -27.417633056640625, "global_step": 495032, "epoch": 5964} {"train_loss": -27.2927303314209, "global_step": 495033, "epoch": 5964} {"train_loss": -27.180896759033203, "global_step": 495034, "epoch": 5964} {"train_loss": -27.351062774658203, "global_step": 495035, "epoch": 5964} {"train_loss": -27.33451271057129, "global_step": 495036, "epoch": 5964} {"train_loss": -27.242124557495117, "global_step": 495037, "epoch": 5964} {"train_loss": -27.495588302612305, "global_step": 495038, "epoch": 5964} {"train_loss": -27.33734703063965, "global_step": 495039, "epoch": 5964} {"train_loss": -26.96833610534668, "global_step": 495040, "epoch": 5964} {"train_loss": -27.345304489135742, "global_step": 495041, "epoch": 5964} {"train_loss": -27.441354751586914, "global_step": 495042, "epoch": 5964} {"train_loss": -27.426111221313477, "global_step": 495043, "epoch": 5964} {"train_loss": -27.21917152404785, "global_step": 495044, "epoch": 5964} {"train_loss": -27.154499053955078, "global_step": 495045, "epoch": 5964} {"train_loss": -26.77432632446289, "global_step": 495046, "epoch": 5964} {"train_loss": -27.296539306640625, "global_step": 495047, "epoch": 5964} {"train_loss": -27.23811149597168, "global_step": 495048, "epoch": 5964} {"train_loss": -27.1081485748291, "global_step": 495049, "epoch": 5964} {"train_loss": -26.97873306274414, "global_step": 495050, "epoch": 5964} {"train_loss": -27.395191192626953, "global_step": 495051, "epoch": 5964} {"train_loss": -27.229724884033203, "global_step": 495052, "epoch": 5964} {"train_loss": -27.31084632873535, "global_step": 495053, "epoch": 5964} {"train_loss": -27.195926666259766, "global_step": 495054, "epoch": 5964} {"train_loss": -27.37412452697754, "global_step": 495055, "epoch": 5964} {"train_loss": -26.996383666992188, "global_step": 495056, "epoch": 5964} {"train_loss": -27.233774185180664, "global_step": 495057, "epoch": 5964} {"train_loss": -27.338281631469727, "global_step": 495058, "epoch": 5964} {"train_loss": -27.22010612487793, "global_step": 495059, "epoch": 5964} {"train_loss": -27.32660484313965, "global_step": 495060, "epoch": 5964} {"train_loss": -27.469282150268555, "global_step": 495061, "epoch": 5964} {"train_loss": -27.641942977905273, "global_step": 495062, "epoch": 5964} {"train_loss": -27.272397994995117, "global_step": 495063, "epoch": 5964} {"train_loss": -27.269067764282227, "global_step": 495064, "epoch": 5964} {"train_loss": -27.453323364257812, "global_step": 495065, "epoch": 5964} {"train_loss": -27.280832290649414, "global_step": 495066, "epoch": 5964} {"train_loss": -27.43172264099121, "global_step": 495067, "epoch": 5964} {"train_loss": -27.205915451049805, "global_step": 495068, "epoch": 5964} {"train_loss": -27.6691837310791, "global_step": 495069, "epoch": 5964} {"train_loss": -27.670751571655273, "global_step": 495070, "epoch": 5964} {"train_loss": -27.33088493347168, "global_step": 495071, "epoch": 5964} {"train_loss": -27.82062339782715, "global_step": 495072, "epoch": 5964} {"train_loss": -27.457242965698242, "global_step": 495073, "epoch": 5964} {"train_loss": -27.48744010925293, "global_step": 495074, "epoch": 5964} {"train_loss": -27.55592155456543, "global_step": 495075, "epoch": 5964} {"train_loss": -27.8664493560791, "global_step": 495076, "epoch": 5964} {"train_loss": -27.752857208251953, "global_step": 495077, "epoch": 5964} {"train_loss": -27.612096786499023, "global_step": 495078, "epoch": 5964} {"train_loss": -28.02019691467285, "global_step": 495079, "epoch": 5964} {"train_loss": -27.462926864624023, "global_step": 495080, "epoch": 5964} {"train_loss": -27.211755752563477, "global_step": 495081, "epoch": 5964} {"train_loss": -27.62714195251465, "global_step": 495082, "epoch": 5964} {"train_loss": -27.251134872436523, "global_step": 495083, "epoch": 5964} {"train_loss": -27.77475929260254, "global_step": 495084, "epoch": 5964} {"train_loss": -27.64655113220215, "global_step": 495085, "epoch": 5964} {"train_loss": -27.579788208007812, "global_step": 495086, "epoch": 5964} {"train_loss": -27.45138931274414, "global_step": 495087, "epoch": 5964} {"train_loss": -27.860687255859375, "global_step": 495088, "epoch": 5964} {"train_loss": -27.73854637145996, "global_step": 495089, "epoch": 5964} {"train_loss": -27.601516723632812, "global_step": 495090, "epoch": 5964} {"train_loss": -27.24798583984375, "global_step": 495091, "epoch": 5964} {"train_loss": -27.660816192626953, "global_step": 495092, "epoch": 5964} {"train_loss": -27.630701065063477, "global_step": 495093, "epoch": 5964} {"train_loss": -27.27964309324701, "global_step": 495094, "epoch": 5964, "val_loss": 6566724.0} {"train_loss": -26.912946701049805, "global_step": 495095, "epoch": 5965} {"train_loss": -25.68169593811035, "global_step": 495096, "epoch": 5965} {"train_loss": -25.47872543334961, "global_step": 495097, "epoch": 5965} {"train_loss": -23.946029663085938, "global_step": 495098, "epoch": 5965} {"train_loss": -24.839746475219727, "global_step": 495099, "epoch": 5965} {"train_loss": -26.832876205444336, "global_step": 495100, "epoch": 5965} {"train_loss": -26.091001510620117, "global_step": 495101, "epoch": 5965} {"train_loss": -25.8657169342041, "global_step": 495102, "epoch": 5965} {"train_loss": -26.676305770874023, "global_step": 495103, "epoch": 5965} {"train_loss": -26.53388023376465, "global_step": 495104, "epoch": 5965} {"train_loss": -26.433761596679688, "global_step": 495105, "epoch": 5965} {"train_loss": -26.1275634765625, "global_step": 495106, "epoch": 5965} {"train_loss": -26.444067001342773, "global_step": 495107, "epoch": 5965} {"train_loss": -26.2340030670166, "global_step": 495108, "epoch": 5965} {"train_loss": -26.392675399780273, "global_step": 495109, "epoch": 5965} {"train_loss": -26.840625762939453, "global_step": 495110, "epoch": 5965} {"train_loss": -26.877038955688477, "global_step": 495111, "epoch": 5965} {"train_loss": -26.8369197845459, "global_step": 495112, "epoch": 5965} {"train_loss": -26.696441650390625, "global_step": 495113, "epoch": 5965} {"train_loss": -26.83778190612793, "global_step": 495114, "epoch": 5965} {"train_loss": -26.930082321166992, "global_step": 495115, "epoch": 5965} {"train_loss": -26.91290283203125, "global_step": 495116, "epoch": 5965} {"train_loss": -27.1546630859375, "global_step": 495117, "epoch": 5965} {"train_loss": -26.95474624633789, "global_step": 495118, "epoch": 5965} {"train_loss": -27.02813148498535, "global_step": 495119, "epoch": 5965} {"train_loss": -26.785032272338867, "global_step": 495120, "epoch": 5965} {"train_loss": -27.057653427124023, "global_step": 495121, "epoch": 5965} {"train_loss": -27.260650634765625, "global_step": 495122, "epoch": 5965} {"train_loss": -27.116230010986328, "global_step": 495123, "epoch": 5965} {"train_loss": -27.0117244720459, "global_step": 495124, "epoch": 5965} {"train_loss": -27.44073486328125, "global_step": 495125, "epoch": 5965} {"train_loss": -27.084075927734375, "global_step": 495126, "epoch": 5965} {"train_loss": -27.196063995361328, "global_step": 495127, "epoch": 5965} {"train_loss": -27.24542808532715, "global_step": 495128, "epoch": 5965} {"train_loss": -27.048120498657227, "global_step": 495129, "epoch": 5965} {"train_loss": -27.262699127197266, "global_step": 495130, "epoch": 5965} {"train_loss": -27.071088790893555, "global_step": 495131, "epoch": 5965} {"train_loss": -27.349933624267578, "global_step": 495132, "epoch": 5965} {"train_loss": -27.328763961791992, "global_step": 495133, "epoch": 5965} {"train_loss": -27.289447784423828, "global_step": 495134, "epoch": 5965} {"train_loss": -27.16794776916504, "global_step": 495135, "epoch": 5965} {"train_loss": -27.354816436767578, "global_step": 495136, "epoch": 5965} {"train_loss": -27.486572265625, "global_step": 495137, "epoch": 5965} {"train_loss": -27.246185302734375, "global_step": 495138, "epoch": 5965} {"train_loss": -27.587629318237305, "global_step": 495139, "epoch": 5965} {"train_loss": -27.300373077392578, "global_step": 495140, "epoch": 5965} {"train_loss": -27.7413330078125, "global_step": 495141, "epoch": 5965} {"train_loss": -27.068140029907227, "global_step": 495142, "epoch": 5965} {"train_loss": -27.583831787109375, "global_step": 495143, "epoch": 5965} {"train_loss": -27.34214210510254, "global_step": 495144, "epoch": 5965} {"train_loss": -27.123258590698242, "global_step": 495145, "epoch": 5965} {"train_loss": -27.18507194519043, "global_step": 495146, "epoch": 5965} {"train_loss": -27.17496681213379, "global_step": 495147, "epoch": 5965} {"train_loss": -27.36334800720215, "global_step": 495148, "epoch": 5965} {"train_loss": -27.26227378845215, "global_step": 495149, "epoch": 5965} {"train_loss": -27.42498207092285, "global_step": 495150, "epoch": 5965} {"train_loss": -27.27988624572754, "global_step": 495151, "epoch": 5965} {"train_loss": -27.53737449645996, "global_step": 495152, "epoch": 5965} {"train_loss": -27.4761962890625, "global_step": 495153, "epoch": 5965} {"train_loss": -27.686368942260742, "global_step": 495154, "epoch": 5965} {"train_loss": -27.53558921813965, "global_step": 495155, "epoch": 5965} {"train_loss": -27.362791061401367, "global_step": 495156, "epoch": 5965} {"train_loss": -27.38710594177246, "global_step": 495157, "epoch": 5965} {"train_loss": -27.169408798217773, "global_step": 495158, "epoch": 5965} {"train_loss": -27.384626388549805, "global_step": 495159, "epoch": 5965} {"train_loss": -27.58658790588379, "global_step": 495160, "epoch": 5965} {"train_loss": -27.513534545898438, "global_step": 495161, "epoch": 5965} {"train_loss": -27.723896026611328, "global_step": 495162, "epoch": 5965} {"train_loss": -27.72841453552246, "global_step": 495163, "epoch": 5965} {"train_loss": -27.314722061157227, "global_step": 495164, "epoch": 5965} {"train_loss": -27.633941650390625, "global_step": 495165, "epoch": 5965} {"train_loss": -27.772113800048828, "global_step": 495166, "epoch": 5965} {"train_loss": -27.49570083618164, "global_step": 495167, "epoch": 5965} {"train_loss": -27.942228317260742, "global_step": 495168, "epoch": 5965} {"train_loss": -27.440067291259766, "global_step": 495169, "epoch": 5965} {"train_loss": -27.557836532592773, "global_step": 495170, "epoch": 5965} {"train_loss": -27.7081298828125, "global_step": 495171, "epoch": 5965} {"train_loss": -27.79559326171875, "global_step": 495172, "epoch": 5965} {"train_loss": -27.69870376586914, "global_step": 495173, "epoch": 5965} {"train_loss": -27.82163429260254, "global_step": 495174, "epoch": 5965} {"train_loss": -27.244909286499023, "global_step": 495175, "epoch": 5965} {"train_loss": -27.523340225219727, "global_step": 495176, "epoch": 5965} {"train_loss": -27.070794691522437, "global_step": 495177, "epoch": 5965, "val_loss": 6456271.0} {"train_loss": -24.404356002807617, "global_step": 495178, "epoch": 5966} {"train_loss": -18.64509391784668, "global_step": 495179, "epoch": 5966} {"train_loss": -22.343786239624023, "global_step": 495180, "epoch": 5966} {"train_loss": -24.809980392456055, "global_step": 495181, "epoch": 5966} {"train_loss": -24.96286392211914, "global_step": 495182, "epoch": 5966} {"train_loss": -24.855560302734375, "global_step": 495183, "epoch": 5966} {"train_loss": -25.95961570739746, "global_step": 495184, "epoch": 5966} {"train_loss": -24.499706268310547, "global_step": 495185, "epoch": 5966} {"train_loss": -25.59856605529785, "global_step": 495186, "epoch": 5966} {"train_loss": -26.512781143188477, "global_step": 495187, "epoch": 5966} {"train_loss": -25.8886661529541, "global_step": 495188, "epoch": 5966} {"train_loss": -26.081201553344727, "global_step": 495189, "epoch": 5966} {"train_loss": -26.25679588317871, "global_step": 495190, "epoch": 5966} {"train_loss": -26.490293502807617, "global_step": 495191, "epoch": 5966} {"train_loss": -26.132551193237305, "global_step": 495192, "epoch": 5966} {"train_loss": -26.162342071533203, "global_step": 495193, "epoch": 5966} {"train_loss": -26.111042022705078, "global_step": 495194, "epoch": 5966} {"train_loss": -26.252737045288086, "global_step": 495195, "epoch": 5966} {"train_loss": -26.92927360534668, "global_step": 495196, "epoch": 5966} {"train_loss": -26.550039291381836, "global_step": 495197, "epoch": 5966} {"train_loss": -26.201818466186523, "global_step": 495198, "epoch": 5966} {"train_loss": -26.058332443237305, "global_step": 495199, "epoch": 5966} {"train_loss": -26.5203857421875, "global_step": 495200, "epoch": 5966} {"train_loss": -25.851499557495117, "global_step": 495201, "epoch": 5966} {"train_loss": -26.57732582092285, "global_step": 495202, "epoch": 5966} {"train_loss": -26.582477569580078, "global_step": 495203, "epoch": 5966} {"train_loss": -26.696462631225586, "global_step": 495204, "epoch": 5966} {"train_loss": -26.579914093017578, "global_step": 495205, "epoch": 5966} {"train_loss": -26.83314323425293, "global_step": 495206, "epoch": 5966} {"train_loss": -26.89849853515625, "global_step": 495207, "epoch": 5966} {"train_loss": -26.89045524597168, "global_step": 495208, "epoch": 5966} {"train_loss": -26.83406639099121, "global_step": 495209, "epoch": 5966} {"train_loss": -26.8917293548584, "global_step": 495210, "epoch": 5966} {"train_loss": -26.61600112915039, "global_step": 495211, "epoch": 5966} {"train_loss": -26.8857421875, "global_step": 495212, "epoch": 5966} {"train_loss": -27.242090225219727, "global_step": 495213, "epoch": 5966} {"train_loss": -26.5455379486084, "global_step": 495214, "epoch": 5966} {"train_loss": -26.993377685546875, "global_step": 495215, "epoch": 5966} {"train_loss": -26.919361114501953, "global_step": 495216, "epoch": 5966} {"train_loss": -27.066669464111328, "global_step": 495217, "epoch": 5966} {"train_loss": -27.267419815063477, "global_step": 495218, "epoch": 5966} {"train_loss": -26.968158721923828, "global_step": 495219, "epoch": 5966} {"train_loss": -27.074438095092773, "global_step": 495220, "epoch": 5966} {"train_loss": -26.967885971069336, "global_step": 495221, "epoch": 5966} {"train_loss": -27.372909545898438, "global_step": 495222, "epoch": 5966} {"train_loss": -27.140933990478516, "global_step": 495223, "epoch": 5966} {"train_loss": -27.18442726135254, "global_step": 495224, "epoch": 5966} {"train_loss": -27.102453231811523, "global_step": 495225, "epoch": 5966} {"train_loss": -27.283252716064453, "global_step": 495226, "epoch": 5966} {"train_loss": -27.168378829956055, "global_step": 495227, "epoch": 5966} {"train_loss": -26.778711318969727, "global_step": 495228, "epoch": 5966} {"train_loss": -26.9315185546875, "global_step": 495229, "epoch": 5966} {"train_loss": -27.33831214904785, "global_step": 495230, "epoch": 5966} {"train_loss": -26.890310287475586, "global_step": 495231, "epoch": 5966} {"train_loss": -27.20195960998535, "global_step": 495232, "epoch": 5966} {"train_loss": -27.42725944519043, "global_step": 495233, "epoch": 5966} {"train_loss": -27.374099731445312, "global_step": 495234, "epoch": 5966} {"train_loss": -27.046478271484375, "global_step": 495235, "epoch": 5966} {"train_loss": -27.27720069885254, "global_step": 495236, "epoch": 5966} {"train_loss": -27.386709213256836, "global_step": 495237, "epoch": 5966} {"train_loss": -27.134265899658203, "global_step": 495238, "epoch": 5966} {"train_loss": -27.291852951049805, "global_step": 495239, "epoch": 5966} {"train_loss": -27.388660430908203, "global_step": 495240, "epoch": 5966} {"train_loss": -27.42374038696289, "global_step": 495241, "epoch": 5966} {"train_loss": -27.338510513305664, "global_step": 495242, "epoch": 5966} {"train_loss": -27.48581886291504, "global_step": 495243, "epoch": 5966} {"train_loss": -27.391773223876953, "global_step": 495244, "epoch": 5966} {"train_loss": -27.03558921813965, "global_step": 495245, "epoch": 5966} {"train_loss": -27.12589454650879, "global_step": 495246, "epoch": 5966} {"train_loss": -27.161985397338867, "global_step": 495247, "epoch": 5966} {"train_loss": -27.370763778686523, "global_step": 495248, "epoch": 5966} {"train_loss": -27.05535316467285, "global_step": 495249, "epoch": 5966} {"train_loss": -27.613927841186523, "global_step": 495250, "epoch": 5966} {"train_loss": -27.225690841674805, "global_step": 495251, "epoch": 5966} {"train_loss": -27.34907341003418, "global_step": 495252, "epoch": 5966} {"train_loss": -27.170135498046875, "global_step": 495253, "epoch": 5966} {"train_loss": -27.4049015045166, "global_step": 495254, "epoch": 5966} {"train_loss": -27.310321807861328, "global_step": 495255, "epoch": 5966} {"train_loss": -26.991485595703125, "global_step": 495256, "epoch": 5966} {"train_loss": -26.728378295898438, "global_step": 495257, "epoch": 5966} {"train_loss": -26.637434005737305, "global_step": 495258, "epoch": 5966} {"train_loss": -27.214303970336914, "global_step": 495259, "epoch": 5966} {"train_loss": -26.61815535304058, "global_step": 495260, "epoch": 5966, "val_loss": 6476785.0} {"train_loss": -25.9414005279541, "global_step": 495261, "epoch": 5967} {"train_loss": -26.181732177734375, "global_step": 495262, "epoch": 5967} {"train_loss": -26.679767608642578, "global_step": 495263, "epoch": 5967} {"train_loss": -26.72934341430664, "global_step": 495264, "epoch": 5967} {"train_loss": -26.84807777404785, "global_step": 495265, "epoch": 5967} {"train_loss": -26.53982925415039, "global_step": 495266, "epoch": 5967} {"train_loss": -26.569610595703125, "global_step": 495267, "epoch": 5967} {"train_loss": -26.55585289001465, "global_step": 495268, "epoch": 5967} {"train_loss": -26.119144439697266, "global_step": 495269, "epoch": 5967} {"train_loss": -26.644933700561523, "global_step": 495270, "epoch": 5967} {"train_loss": -26.517126083374023, "global_step": 495271, "epoch": 5967} {"train_loss": -26.853504180908203, "global_step": 495272, "epoch": 5967} {"train_loss": -27.332563400268555, "global_step": 495273, "epoch": 5967} {"train_loss": -27.237539291381836, "global_step": 495274, "epoch": 5967} {"train_loss": -27.14838981628418, "global_step": 495275, "epoch": 5967} {"train_loss": -27.08233642578125, "global_step": 495276, "epoch": 5967} {"train_loss": -27.123748779296875, "global_step": 495277, "epoch": 5967} {"train_loss": -27.168317794799805, "global_step": 495278, "epoch": 5967} {"train_loss": -26.752355575561523, "global_step": 495279, "epoch": 5967} {"train_loss": -27.353429794311523, "global_step": 495280, "epoch": 5967} {"train_loss": -27.12105369567871, "global_step": 495281, "epoch": 5967} {"train_loss": -27.324995040893555, "global_step": 495282, "epoch": 5967} {"train_loss": -27.320484161376953, "global_step": 495283, "epoch": 5967} {"train_loss": -27.059412002563477, "global_step": 495284, "epoch": 5967} {"train_loss": -27.1195011138916, "global_step": 495285, "epoch": 5967} {"train_loss": -27.227121353149414, "global_step": 495286, "epoch": 5967} {"train_loss": -27.122220993041992, "global_step": 495287, "epoch": 5967} {"train_loss": -27.4580135345459, "global_step": 495288, "epoch": 5967} {"train_loss": -27.61121940612793, "global_step": 495289, "epoch": 5967} {"train_loss": -27.546527862548828, "global_step": 495290, "epoch": 5967} {"train_loss": -27.50836181640625, "global_step": 495291, "epoch": 5967} {"train_loss": -27.225698471069336, "global_step": 495292, "epoch": 5967} {"train_loss": -27.17179298400879, "global_step": 495293, "epoch": 5967} {"train_loss": -27.47590446472168, "global_step": 495294, "epoch": 5967} {"train_loss": -27.111373901367188, "global_step": 495295, "epoch": 5967} {"train_loss": -27.3955135345459, "global_step": 495296, "epoch": 5967} {"train_loss": -27.44386863708496, "global_step": 495297, "epoch": 5967} {"train_loss": -27.40296745300293, "global_step": 495298, "epoch": 5967} {"train_loss": -27.310546875, "global_step": 495299, "epoch": 5967} {"train_loss": -27.473865509033203, "global_step": 495300, "epoch": 5967} {"train_loss": -27.665283203125, "global_step": 495301, "epoch": 5967} {"train_loss": -27.4652156829834, "global_step": 495302, "epoch": 5967} {"train_loss": -27.73650550842285, "global_step": 495303, "epoch": 5967} {"train_loss": -27.28362464904785, "global_step": 495304, "epoch": 5967} {"train_loss": -27.281824111938477, "global_step": 495305, "epoch": 5967} {"train_loss": -27.386646270751953, "global_step": 495306, "epoch": 5967} {"train_loss": -27.511554718017578, "global_step": 495307, "epoch": 5967} {"train_loss": -27.877460479736328, "global_step": 495308, "epoch": 5967} {"train_loss": -27.478134155273438, "global_step": 495309, "epoch": 5967} {"train_loss": -27.955078125, "global_step": 495310, "epoch": 5967} {"train_loss": -27.377105712890625, "global_step": 495311, "epoch": 5967} {"train_loss": -27.47425651550293, "global_step": 495312, "epoch": 5967} {"train_loss": -27.976337432861328, "global_step": 495313, "epoch": 5967} {"train_loss": -27.38616371154785, "global_step": 495314, "epoch": 5967} {"train_loss": -27.514249801635742, "global_step": 495315, "epoch": 5967} {"train_loss": -27.41937828063965, "global_step": 495316, "epoch": 5967} {"train_loss": -27.499479293823242, "global_step": 495317, "epoch": 5967} {"train_loss": -27.3779296875, "global_step": 495318, "epoch": 5967} {"train_loss": -27.84407615661621, "global_step": 495319, "epoch": 5967} {"train_loss": -27.213184356689453, "global_step": 495320, "epoch": 5967} {"train_loss": -27.856964111328125, "global_step": 495321, "epoch": 5967} {"train_loss": -28.048303604125977, "global_step": 495322, "epoch": 5967} {"train_loss": -27.606739044189453, "global_step": 495323, "epoch": 5967} {"train_loss": -27.54414176940918, "global_step": 495324, "epoch": 5967} {"train_loss": -27.45209312438965, "global_step": 495325, "epoch": 5967} {"train_loss": -27.5767765045166, "global_step": 495326, "epoch": 5967} {"train_loss": -27.665185928344727, "global_step": 495327, "epoch": 5967} {"train_loss": -27.3712100982666, "global_step": 495328, "epoch": 5967} {"train_loss": -27.518054962158203, "global_step": 495329, "epoch": 5967} {"train_loss": -27.833349227905273, "global_step": 495330, "epoch": 5967} {"train_loss": -27.62202262878418, "global_step": 495331, "epoch": 5967} {"train_loss": -27.510208129882812, "global_step": 495332, "epoch": 5967} {"train_loss": -27.325551986694336, "global_step": 495333, "epoch": 5967} {"train_loss": -26.627084732055664, "global_step": 495334, "epoch": 5967} {"train_loss": -26.58184242248535, "global_step": 495335, "epoch": 5967} {"train_loss": -26.886316299438477, "global_step": 495336, "epoch": 5967} {"train_loss": -27.19929313659668, "global_step": 495337, "epoch": 5967} {"train_loss": -27.163497924804688, "global_step": 495338, "epoch": 5967} {"train_loss": -26.74867820739746, "global_step": 495339, "epoch": 5967} {"train_loss": -26.8028564453125, "global_step": 495340, "epoch": 5967} {"train_loss": -27.083240509033203, "global_step": 495341, "epoch": 5967} {"train_loss": -27.017675399780273, "global_step": 495342, "epoch": 5967} {"train_loss": -27.23103886340038, "global_step": 495343, "epoch": 5967, "val_loss": 6490039.0} {"train_loss": -26.958532333374023, "global_step": 495344, "epoch": 5968} {"train_loss": -26.751928329467773, "global_step": 495345, "epoch": 5968} {"train_loss": -27.337106704711914, "global_step": 495346, "epoch": 5968} {"train_loss": -27.192768096923828, "global_step": 495347, "epoch": 5968} {"train_loss": -27.096088409423828, "global_step": 495348, "epoch": 5968} {"train_loss": -27.532867431640625, "global_step": 495349, "epoch": 5968} {"train_loss": -27.103271484375, "global_step": 495350, "epoch": 5968} {"train_loss": -27.37841796875, "global_step": 495351, "epoch": 5968} {"train_loss": -27.06489372253418, "global_step": 495352, "epoch": 5968} {"train_loss": -27.25946617126465, "global_step": 495353, "epoch": 5968} {"train_loss": -27.64362144470215, "global_step": 495354, "epoch": 5968} {"train_loss": -27.411060333251953, "global_step": 495355, "epoch": 5968} {"train_loss": -27.25386619567871, "global_step": 495356, "epoch": 5968} {"train_loss": -27.511184692382812, "global_step": 495357, "epoch": 5968} {"train_loss": -27.49615478515625, "global_step": 495358, "epoch": 5968} {"train_loss": -27.151742935180664, "global_step": 495359, "epoch": 5968} {"train_loss": -27.426044464111328, "global_step": 495360, "epoch": 5968} {"train_loss": -27.107391357421875, "global_step": 495361, "epoch": 5968} {"train_loss": -27.168354034423828, "global_step": 495362, "epoch": 5968} {"train_loss": -27.1312255859375, "global_step": 495363, "epoch": 5968} {"train_loss": -27.231403350830078, "global_step": 495364, "epoch": 5968} {"train_loss": -27.52251625061035, "global_step": 495365, "epoch": 5968} {"train_loss": -26.82466697692871, "global_step": 495366, "epoch": 5968} {"train_loss": -27.0806941986084, "global_step": 495367, "epoch": 5968} {"train_loss": -27.546661376953125, "global_step": 495368, "epoch": 5968} {"train_loss": -27.383405685424805, "global_step": 495369, "epoch": 5968} {"train_loss": -27.312347412109375, "global_step": 495370, "epoch": 5968} {"train_loss": -27.4858341217041, "global_step": 495371, "epoch": 5968} {"train_loss": -27.515899658203125, "global_step": 495372, "epoch": 5968} {"train_loss": -27.181615829467773, "global_step": 495373, "epoch": 5968} {"train_loss": -27.43717384338379, "global_step": 495374, "epoch": 5968} {"train_loss": -27.274261474609375, "global_step": 495375, "epoch": 5968} {"train_loss": -27.78302001953125, "global_step": 495376, "epoch": 5968} {"train_loss": -27.4312744140625, "global_step": 495377, "epoch": 5968} {"train_loss": -27.670148849487305, "global_step": 495378, "epoch": 5968} {"train_loss": -27.294921875, "global_step": 495379, "epoch": 5968} {"train_loss": -27.045801162719727, "global_step": 495380, "epoch": 5968} {"train_loss": -27.520263671875, "global_step": 495381, "epoch": 5968} {"train_loss": -27.437210083007812, "global_step": 495382, "epoch": 5968} {"train_loss": -27.462568283081055, "global_step": 495383, "epoch": 5968} {"train_loss": -27.250009536743164, "global_step": 495384, "epoch": 5968} {"train_loss": -27.755224227905273, "global_step": 495385, "epoch": 5968} {"train_loss": -27.473331451416016, "global_step": 495386, "epoch": 5968} {"train_loss": -27.580488204956055, "global_step": 495387, "epoch": 5968} {"train_loss": -27.324176788330078, "global_step": 495388, "epoch": 5968} {"train_loss": -27.413043975830078, "global_step": 495389, "epoch": 5968} {"train_loss": -27.367090225219727, "global_step": 495390, "epoch": 5968} {"train_loss": -27.48276138305664, "global_step": 495391, "epoch": 5968} {"train_loss": -27.147687911987305, "global_step": 495392, "epoch": 5968} {"train_loss": -26.567930221557617, "global_step": 495393, "epoch": 5968} {"train_loss": -26.326440811157227, "global_step": 495394, "epoch": 5968} {"train_loss": -26.739215850830078, "global_step": 495395, "epoch": 5968} {"train_loss": -27.501026153564453, "global_step": 495396, "epoch": 5968} {"train_loss": -26.90018653869629, "global_step": 495397, "epoch": 5968} {"train_loss": -26.964099884033203, "global_step": 495398, "epoch": 5968} {"train_loss": -27.339818954467773, "global_step": 495399, "epoch": 5968} {"train_loss": -26.894474029541016, "global_step": 495400, "epoch": 5968} {"train_loss": -27.321680068969727, "global_step": 495401, "epoch": 5968} {"train_loss": -27.251859664916992, "global_step": 495402, "epoch": 5968} {"train_loss": -27.5803165435791, "global_step": 495403, "epoch": 5968} {"train_loss": -27.482330322265625, "global_step": 495404, "epoch": 5968} {"train_loss": -26.968280792236328, "global_step": 495405, "epoch": 5968} {"train_loss": -27.26601219177246, "global_step": 495406, "epoch": 5968} {"train_loss": -27.246429443359375, "global_step": 495407, "epoch": 5968} {"train_loss": -27.211200714111328, "global_step": 495408, "epoch": 5968} {"train_loss": -27.081851959228516, "global_step": 495409, "epoch": 5968} {"train_loss": -26.97255516052246, "global_step": 495410, "epoch": 5968} {"train_loss": -27.334806442260742, "global_step": 495411, "epoch": 5968} {"train_loss": -27.11773109436035, "global_step": 495412, "epoch": 5968} {"train_loss": -27.08102798461914, "global_step": 495413, "epoch": 5968} {"train_loss": -27.083398818969727, "global_step": 495414, "epoch": 5968} {"train_loss": -27.421606063842773, "global_step": 495415, "epoch": 5968} {"train_loss": -27.332178115844727, "global_step": 495416, "epoch": 5968} {"train_loss": -27.08745765686035, "global_step": 495417, "epoch": 5968} {"train_loss": -27.296863555908203, "global_step": 495418, "epoch": 5968} {"train_loss": -27.2242374420166, "global_step": 495419, "epoch": 5968} {"train_loss": -27.495208740234375, "global_step": 495420, "epoch": 5968} {"train_loss": -27.388629913330078, "global_step": 495421, "epoch": 5968} {"train_loss": -27.698450088500977, "global_step": 495422, "epoch": 5968} {"train_loss": -27.13474464416504, "global_step": 495423, "epoch": 5968} {"train_loss": -27.307819366455078, "global_step": 495424, "epoch": 5968} {"train_loss": -27.46892738342285, "global_step": 495425, "epoch": 5968} {"train_loss": -27.27513828047787, "global_step": 495426, "epoch": 5968, "val_loss": 6475005.0} {"train_loss": -26.16913414001465, "global_step": 495427, "epoch": 5969} {"train_loss": -26.141550064086914, "global_step": 495428, "epoch": 5969} {"train_loss": -26.702899932861328, "global_step": 495429, "epoch": 5969} {"train_loss": -26.558612823486328, "global_step": 495430, "epoch": 5969} {"train_loss": -26.73109245300293, "global_step": 495431, "epoch": 5969} {"train_loss": -26.397397994995117, "global_step": 495432, "epoch": 5969} {"train_loss": -27.15313148498535, "global_step": 495433, "epoch": 5969} {"train_loss": -26.768634796142578, "global_step": 495434, "epoch": 5969} {"train_loss": -26.85333251953125, "global_step": 495435, "epoch": 5969} {"train_loss": -26.719745635986328, "global_step": 495436, "epoch": 5969} {"train_loss": -27.07244300842285, "global_step": 495437, "epoch": 5969} {"train_loss": -27.15887451171875, "global_step": 495438, "epoch": 5969} {"train_loss": -27.169340133666992, "global_step": 495439, "epoch": 5969} {"train_loss": -26.886693954467773, "global_step": 495440, "epoch": 5969} {"train_loss": -27.257659912109375, "global_step": 495441, "epoch": 5969} {"train_loss": -27.23956871032715, "global_step": 495442, "epoch": 5969} {"train_loss": -27.56751823425293, "global_step": 495443, "epoch": 5969} {"train_loss": -27.525876998901367, "global_step": 495444, "epoch": 5969} {"train_loss": -27.2198429107666, "global_step": 495445, "epoch": 5969} {"train_loss": -27.051061630249023, "global_step": 495446, "epoch": 5969} {"train_loss": -27.47755241394043, "global_step": 495447, "epoch": 5969} {"train_loss": -27.10837745666504, "global_step": 495448, "epoch": 5969} {"train_loss": -27.183225631713867, "global_step": 495449, "epoch": 5969} {"train_loss": -27.309457778930664, "global_step": 495450, "epoch": 5969} {"train_loss": -27.236459732055664, "global_step": 495451, "epoch": 5969} {"train_loss": -27.3790340423584, "global_step": 495452, "epoch": 5969} {"train_loss": -27.206327438354492, "global_step": 495453, "epoch": 5969} {"train_loss": -27.340612411499023, "global_step": 495454, "epoch": 5969} {"train_loss": -27.077411651611328, "global_step": 495455, "epoch": 5969} {"train_loss": -27.39129638671875, "global_step": 495456, "epoch": 5969} {"train_loss": -27.4873104095459, "global_step": 495457, "epoch": 5969} {"train_loss": -27.353864669799805, "global_step": 495458, "epoch": 5969} {"train_loss": -27.332040786743164, "global_step": 495459, "epoch": 5969} {"train_loss": -27.168655395507812, "global_step": 495460, "epoch": 5969} {"train_loss": -27.472532272338867, "global_step": 495461, "epoch": 5969} {"train_loss": -27.31019401550293, "global_step": 495462, "epoch": 5969} {"train_loss": -27.6085262298584, "global_step": 495463, "epoch": 5969} {"train_loss": -27.369312286376953, "global_step": 495464, "epoch": 5969} {"train_loss": -27.323734283447266, "global_step": 495465, "epoch": 5969} {"train_loss": -27.231714248657227, "global_step": 495466, "epoch": 5969} {"train_loss": -27.843732833862305, "global_step": 495467, "epoch": 5969} {"train_loss": -27.311279296875, "global_step": 495468, "epoch": 5969} {"train_loss": -27.71686363220215, "global_step": 495469, "epoch": 5969} {"train_loss": -27.474130630493164, "global_step": 495470, "epoch": 5969} {"train_loss": -27.5963077545166, "global_step": 495471, "epoch": 5969} {"train_loss": -27.46903419494629, "global_step": 495472, "epoch": 5969} {"train_loss": -27.63567543029785, "global_step": 495473, "epoch": 5969} {"train_loss": -27.48850440979004, "global_step": 495474, "epoch": 5969} {"train_loss": -27.306182861328125, "global_step": 495475, "epoch": 5969} {"train_loss": -27.640735626220703, "global_step": 495476, "epoch": 5969} {"train_loss": -27.592824935913086, "global_step": 495477, "epoch": 5969} {"train_loss": -27.309858322143555, "global_step": 495478, "epoch": 5969} {"train_loss": -27.63336753845215, "global_step": 495479, "epoch": 5969} {"train_loss": -27.77497673034668, "global_step": 495480, "epoch": 5969} {"train_loss": -27.564733505249023, "global_step": 495481, "epoch": 5969} {"train_loss": -27.644323348999023, "global_step": 495482, "epoch": 5969} {"train_loss": -27.704862594604492, "global_step": 495483, "epoch": 5969} {"train_loss": -27.625146865844727, "global_step": 495484, "epoch": 5969} {"train_loss": -27.72687339782715, "global_step": 495485, "epoch": 5969} {"train_loss": -27.74176597595215, "global_step": 495486, "epoch": 5969} {"train_loss": -27.2833309173584, "global_step": 495487, "epoch": 5969} {"train_loss": -27.280048370361328, "global_step": 495488, "epoch": 5969} {"train_loss": -27.035968780517578, "global_step": 495489, "epoch": 5969} {"train_loss": -27.698841094970703, "global_step": 495490, "epoch": 5969} {"train_loss": -27.54974937438965, "global_step": 495491, "epoch": 5969} {"train_loss": -27.385908126831055, "global_step": 495492, "epoch": 5969} {"train_loss": -27.295825958251953, "global_step": 495493, "epoch": 5969} {"train_loss": -27.39176368713379, "global_step": 495494, "epoch": 5969} {"train_loss": -27.16229820251465, "global_step": 495495, "epoch": 5969} {"train_loss": -27.148895263671875, "global_step": 495496, "epoch": 5969} {"train_loss": -27.317962646484375, "global_step": 495497, "epoch": 5969} {"train_loss": -27.280242919921875, "global_step": 495498, "epoch": 5969} {"train_loss": -27.260334014892578, "global_step": 495499, "epoch": 5969} {"train_loss": -27.37454605102539, "global_step": 495500, "epoch": 5969} {"train_loss": -27.727319717407227, "global_step": 495501, "epoch": 5969} {"train_loss": -27.39307975769043, "global_step": 495502, "epoch": 5969} {"train_loss": -27.82159996032715, "global_step": 495503, "epoch": 5969} {"train_loss": -27.464279174804688, "global_step": 495504, "epoch": 5969} {"train_loss": -27.666364669799805, "global_step": 495505, "epoch": 5969} {"train_loss": -27.721546173095703, "global_step": 495506, "epoch": 5969} {"train_loss": -27.339096069335938, "global_step": 495507, "epoch": 5969} {"train_loss": -27.560382843017578, "global_step": 495508, "epoch": 5969} {"train_loss": -27.311784744262695, "global_step": 495509, "epoch": 5969, "val_loss": 6485510.0} {"train_loss": -27.139392852783203, "global_step": 495510, "epoch": 5970} {"train_loss": -27.158666610717773, "global_step": 495511, "epoch": 5970} {"train_loss": -27.151636123657227, "global_step": 495512, "epoch": 5970} {"train_loss": -27.277692794799805, "global_step": 495513, "epoch": 5970} {"train_loss": -26.780637741088867, "global_step": 495514, "epoch": 5970} {"train_loss": -27.076419830322266, "global_step": 495515, "epoch": 5970} {"train_loss": -27.245874404907227, "global_step": 495516, "epoch": 5970} {"train_loss": -26.226364135742188, "global_step": 495517, "epoch": 5970} {"train_loss": -27.495107650756836, "global_step": 495518, "epoch": 5970} {"train_loss": -26.594654083251953, "global_step": 495519, "epoch": 5970} {"train_loss": -26.761701583862305, "global_step": 495520, "epoch": 5970} {"train_loss": -27.01459312438965, "global_step": 495521, "epoch": 5970} {"train_loss": -26.6126651763916, "global_step": 495522, "epoch": 5970} {"train_loss": -27.59925651550293, "global_step": 495523, "epoch": 5970} {"train_loss": -26.695127487182617, "global_step": 495524, "epoch": 5970} {"train_loss": -27.08514976501465, "global_step": 495525, "epoch": 5970} {"train_loss": -27.047887802124023, "global_step": 495526, "epoch": 5970} {"train_loss": -26.99127197265625, "global_step": 495527, "epoch": 5970} {"train_loss": -26.798086166381836, "global_step": 495528, "epoch": 5970} {"train_loss": -27.258319854736328, "global_step": 495529, "epoch": 5970} {"train_loss": -27.290796279907227, "global_step": 495530, "epoch": 5970} {"train_loss": -27.099594116210938, "global_step": 495531, "epoch": 5970} {"train_loss": -27.042221069335938, "global_step": 495532, "epoch": 5970} {"train_loss": -26.80240249633789, "global_step": 495533, "epoch": 5970} {"train_loss": -27.517257690429688, "global_step": 495534, "epoch": 5970} {"train_loss": -26.99751853942871, "global_step": 495535, "epoch": 5970} {"train_loss": -27.027551651000977, "global_step": 495536, "epoch": 5970} {"train_loss": -27.178144454956055, "global_step": 495537, "epoch": 5970} {"train_loss": -27.21820068359375, "global_step": 495538, "epoch": 5970} {"train_loss": -26.748876571655273, "global_step": 495539, "epoch": 5970} {"train_loss": -27.17378807067871, "global_step": 495540, "epoch": 5970} {"train_loss": -27.494482040405273, "global_step": 495541, "epoch": 5970} {"train_loss": -27.146987915039062, "global_step": 495542, "epoch": 5970} {"train_loss": -27.685239791870117, "global_step": 495543, "epoch": 5970} {"train_loss": -27.000104904174805, "global_step": 495544, "epoch": 5970} {"train_loss": -27.353824615478516, "global_step": 495545, "epoch": 5970} {"train_loss": -27.16213035583496, "global_step": 495546, "epoch": 5970} {"train_loss": -27.3577880859375, "global_step": 495547, "epoch": 5970} {"train_loss": -27.273456573486328, "global_step": 495548, "epoch": 5970} {"train_loss": -27.155996322631836, "global_step": 495549, "epoch": 5970} {"train_loss": -27.381107330322266, "global_step": 495550, "epoch": 5970} {"train_loss": -27.472278594970703, "global_step": 495551, "epoch": 5970} {"train_loss": -27.224979400634766, "global_step": 495552, "epoch": 5970} {"train_loss": -27.189056396484375, "global_step": 495553, "epoch": 5970} {"train_loss": -27.2014102935791, "global_step": 495554, "epoch": 5970} {"train_loss": -27.260168075561523, "global_step": 495555, "epoch": 5970} {"train_loss": -27.54612159729004, "global_step": 495556, "epoch": 5970} {"train_loss": -27.33351707458496, "global_step": 495557, "epoch": 5970} {"train_loss": -27.34183692932129, "global_step": 495558, "epoch": 5970} {"train_loss": -27.388898849487305, "global_step": 495559, "epoch": 5970} {"train_loss": -27.49325942993164, "global_step": 495560, "epoch": 5970} {"train_loss": -27.429609298706055, "global_step": 495561, "epoch": 5970} {"train_loss": -27.546045303344727, "global_step": 495562, "epoch": 5970} {"train_loss": -27.711164474487305, "global_step": 495563, "epoch": 5970} {"train_loss": -27.15947914123535, "global_step": 495564, "epoch": 5970} {"train_loss": -27.43212890625, "global_step": 495565, "epoch": 5970} {"train_loss": -27.360605239868164, "global_step": 495566, "epoch": 5970} {"train_loss": -27.36150550842285, "global_step": 495567, "epoch": 5970} {"train_loss": -27.653127670288086, "global_step": 495568, "epoch": 5970} {"train_loss": -27.679113388061523, "global_step": 495569, "epoch": 5970} {"train_loss": -27.388263702392578, "global_step": 495570, "epoch": 5970} {"train_loss": -27.546903610229492, "global_step": 495571, "epoch": 5970} {"train_loss": -27.6345272064209, "global_step": 495572, "epoch": 5970} {"train_loss": -27.34101676940918, "global_step": 495573, "epoch": 5970} {"train_loss": -27.450702667236328, "global_step": 495574, "epoch": 5970} {"train_loss": -26.911972045898438, "global_step": 495575, "epoch": 5970} {"train_loss": -27.284276962280273, "global_step": 495576, "epoch": 5970} {"train_loss": -27.294631958007812, "global_step": 495577, "epoch": 5970} {"train_loss": -27.37619400024414, "global_step": 495578, "epoch": 5970} {"train_loss": -27.323644638061523, "global_step": 495579, "epoch": 5970} {"train_loss": -27.40192222595215, "global_step": 495580, "epoch": 5970} {"train_loss": -27.426422119140625, "global_step": 495581, "epoch": 5970} {"train_loss": -27.37323570251465, "global_step": 495582, "epoch": 5970} {"train_loss": -27.5538272857666, "global_step": 495583, "epoch": 5970} {"train_loss": -26.851795196533203, "global_step": 495584, "epoch": 5970} {"train_loss": -27.552581787109375, "global_step": 495585, "epoch": 5970} {"train_loss": -27.768163681030273, "global_step": 495586, "epoch": 5970} {"train_loss": -27.429712295532227, "global_step": 495587, "epoch": 5970} {"train_loss": -27.69990348815918, "global_step": 495588, "epoch": 5970} {"train_loss": -27.600116729736328, "global_step": 495589, "epoch": 5970} {"train_loss": -27.634008407592773, "global_step": 495590, "epoch": 5970} {"train_loss": -27.5948486328125, "global_step": 495591, "epoch": 5970} {"train_loss": -27.28396700663739, "global_step": 495592, "epoch": 5970, "val_loss": 6556351.0} {"train_loss": -27.14922523498535, "global_step": 495593, "epoch": 5971} {"train_loss": -26.893569946289062, "global_step": 495594, "epoch": 5971} {"train_loss": -27.12701416015625, "global_step": 495595, "epoch": 5971} {"train_loss": -27.1994571685791, "global_step": 495596, "epoch": 5971} {"train_loss": -27.547805786132812, "global_step": 495597, "epoch": 5971} {"train_loss": -27.167829513549805, "global_step": 495598, "epoch": 5971} {"train_loss": -27.208881378173828, "global_step": 495599, "epoch": 5971} {"train_loss": -27.35967445373535, "global_step": 495600, "epoch": 5971} {"train_loss": -26.783964157104492, "global_step": 495601, "epoch": 5971} {"train_loss": -26.902801513671875, "global_step": 495602, "epoch": 5971} {"train_loss": -27.123367309570312, "global_step": 495603, "epoch": 5971} {"train_loss": -27.3527774810791, "global_step": 495604, "epoch": 5971} {"train_loss": -27.297819137573242, "global_step": 495605, "epoch": 5971} {"train_loss": -27.131494522094727, "global_step": 495606, "epoch": 5971} {"train_loss": -27.41346549987793, "global_step": 495607, "epoch": 5971} {"train_loss": -27.025232315063477, "global_step": 495608, "epoch": 5971} {"train_loss": -27.119821548461914, "global_step": 495609, "epoch": 5971} {"train_loss": -27.204803466796875, "global_step": 495610, "epoch": 5971} {"train_loss": -27.256240844726562, "global_step": 495611, "epoch": 5971} {"train_loss": -26.966604232788086, "global_step": 495612, "epoch": 5971} {"train_loss": -27.181446075439453, "global_step": 495613, "epoch": 5971} {"train_loss": -27.475614547729492, "global_step": 495614, "epoch": 5971} {"train_loss": -27.031097412109375, "global_step": 495615, "epoch": 5971} {"train_loss": -27.427417755126953, "global_step": 495616, "epoch": 5971} {"train_loss": -27.57472038269043, "global_step": 495617, "epoch": 5971} {"train_loss": -27.42325210571289, "global_step": 495618, "epoch": 5971} {"train_loss": -27.167072296142578, "global_step": 495619, "epoch": 5971} {"train_loss": -27.38092041015625, "global_step": 495620, "epoch": 5971} {"train_loss": -27.190656661987305, "global_step": 495621, "epoch": 5971} {"train_loss": -27.27511978149414, "global_step": 495622, "epoch": 5971} {"train_loss": -27.17034339904785, "global_step": 495623, "epoch": 5971} {"train_loss": -27.315509796142578, "global_step": 495624, "epoch": 5971} {"train_loss": -27.153921127319336, "global_step": 495625, "epoch": 5971} {"train_loss": -27.67919921875, "global_step": 495626, "epoch": 5971} {"train_loss": -27.680891036987305, "global_step": 495627, "epoch": 5971} {"train_loss": -27.059972763061523, "global_step": 495628, "epoch": 5971} {"train_loss": -27.408451080322266, "global_step": 495629, "epoch": 5971} {"train_loss": -27.255634307861328, "global_step": 495630, "epoch": 5971} {"train_loss": -27.374664306640625, "global_step": 495631, "epoch": 5971} {"train_loss": -27.453388214111328, "global_step": 495632, "epoch": 5971} {"train_loss": -27.61725425720215, "global_step": 495633, "epoch": 5971} {"train_loss": -27.257543563842773, "global_step": 495634, "epoch": 5971} {"train_loss": -27.507516860961914, "global_step": 495635, "epoch": 5971} {"train_loss": -27.517065048217773, "global_step": 495636, "epoch": 5971} {"train_loss": -27.301660537719727, "global_step": 495637, "epoch": 5971} {"train_loss": -27.44343376159668, "global_step": 495638, "epoch": 5971} {"train_loss": -27.641427993774414, "global_step": 495639, "epoch": 5971} {"train_loss": -27.23115348815918, "global_step": 495640, "epoch": 5971} {"train_loss": -27.444238662719727, "global_step": 495641, "epoch": 5971} {"train_loss": -27.613433837890625, "global_step": 495642, "epoch": 5971} {"train_loss": -27.12485694885254, "global_step": 495643, "epoch": 5971} {"train_loss": -27.609848022460938, "global_step": 495644, "epoch": 5971} {"train_loss": -27.370880126953125, "global_step": 495645, "epoch": 5971} {"train_loss": -27.585784912109375, "global_step": 495646, "epoch": 5971} {"train_loss": -27.690088272094727, "global_step": 495647, "epoch": 5971} {"train_loss": -27.33072280883789, "global_step": 495648, "epoch": 5971} {"train_loss": -27.160858154296875, "global_step": 495649, "epoch": 5971} {"train_loss": -27.378503799438477, "global_step": 495650, "epoch": 5971} {"train_loss": -27.736682891845703, "global_step": 495651, "epoch": 5971} {"train_loss": -27.451522827148438, "global_step": 495652, "epoch": 5971} {"train_loss": -27.547775268554688, "global_step": 495653, "epoch": 5971} {"train_loss": -27.513858795166016, "global_step": 495654, "epoch": 5971} {"train_loss": -26.972951889038086, "global_step": 495655, "epoch": 5971} {"train_loss": -27.137205123901367, "global_step": 495656, "epoch": 5971} {"train_loss": -27.40283203125, "global_step": 495657, "epoch": 5971} {"train_loss": -27.53365135192871, "global_step": 495658, "epoch": 5971} {"train_loss": -27.32767105102539, "global_step": 495659, "epoch": 5971} {"train_loss": -27.272375106811523, "global_step": 495660, "epoch": 5971} {"train_loss": -27.4965877532959, "global_step": 495661, "epoch": 5971} {"train_loss": -27.321796417236328, "global_step": 495662, "epoch": 5971} {"train_loss": -27.207141876220703, "global_step": 495663, "epoch": 5971} {"train_loss": -27.676015853881836, "global_step": 495664, "epoch": 5971} {"train_loss": -27.361663818359375, "global_step": 495665, "epoch": 5971} {"train_loss": -27.42011833190918, "global_step": 495666, "epoch": 5971} {"train_loss": -27.377195358276367, "global_step": 495667, "epoch": 5971} {"train_loss": -27.533203125, "global_step": 495668, "epoch": 5971} {"train_loss": -27.54303550720215, "global_step": 495669, "epoch": 5971} {"train_loss": -27.168354034423828, "global_step": 495670, "epoch": 5971} {"train_loss": -26.333845138549805, "global_step": 495671, "epoch": 5971} {"train_loss": -26.130125045776367, "global_step": 495672, "epoch": 5971} {"train_loss": -26.7123966217041, "global_step": 495673, "epoch": 5971} {"train_loss": -27.024194717407227, "global_step": 495674, "epoch": 5971} {"train_loss": -27.28085501797228, "global_step": 495675, "epoch": 5971, "val_loss": 6507882.5} {"train_loss": -25.067066192626953, "global_step": 495676, "epoch": 5972} {"train_loss": -25.295137405395508, "global_step": 495677, "epoch": 5972} {"train_loss": -26.922285079956055, "global_step": 495678, "epoch": 5972} {"train_loss": -26.171741485595703, "global_step": 495679, "epoch": 5972} {"train_loss": -26.2210693359375, "global_step": 495680, "epoch": 5972} {"train_loss": -26.473773956298828, "global_step": 495681, "epoch": 5972} {"train_loss": -25.896453857421875, "global_step": 495682, "epoch": 5972} {"train_loss": -26.18007469177246, "global_step": 495683, "epoch": 5972} {"train_loss": -26.682504653930664, "global_step": 495684, "epoch": 5972} {"train_loss": -26.744665145874023, "global_step": 495685, "epoch": 5972} {"train_loss": -27.1494083404541, "global_step": 495686, "epoch": 5972} {"train_loss": -26.582672119140625, "global_step": 495687, "epoch": 5972} {"train_loss": -26.78497314453125, "global_step": 495688, "epoch": 5972} {"train_loss": -26.4666805267334, "global_step": 495689, "epoch": 5972} {"train_loss": -26.82688331604004, "global_step": 495690, "epoch": 5972} {"train_loss": -26.976287841796875, "global_step": 495691, "epoch": 5972} {"train_loss": -26.579681396484375, "global_step": 495692, "epoch": 5972} {"train_loss": -27.018659591674805, "global_step": 495693, "epoch": 5972} {"train_loss": -26.93597412109375, "global_step": 495694, "epoch": 5972} {"train_loss": -26.795337677001953, "global_step": 495695, "epoch": 5972} {"train_loss": -26.815418243408203, "global_step": 495696, "epoch": 5972} {"train_loss": -27.319929122924805, "global_step": 495697, "epoch": 5972} {"train_loss": -27.168994903564453, "global_step": 495698, "epoch": 5972} {"train_loss": -27.080432891845703, "global_step": 495699, "epoch": 5972} {"train_loss": -27.039716720581055, "global_step": 495700, "epoch": 5972} {"train_loss": -26.813474655151367, "global_step": 495701, "epoch": 5972} {"train_loss": -27.25778579711914, "global_step": 495702, "epoch": 5972} {"train_loss": -27.226224899291992, "global_step": 495703, "epoch": 5972} {"train_loss": -27.41169548034668, "global_step": 495704, "epoch": 5972} {"train_loss": -27.727588653564453, "global_step": 495705, "epoch": 5972} {"train_loss": -27.219079971313477, "global_step": 495706, "epoch": 5972} {"train_loss": -27.098270416259766, "global_step": 495707, "epoch": 5972} {"train_loss": -27.346410751342773, "global_step": 495708, "epoch": 5972} {"train_loss": -27.42828941345215, "global_step": 495709, "epoch": 5972} {"train_loss": -27.47294044494629, "global_step": 495710, "epoch": 5972} {"train_loss": -27.578235626220703, "global_step": 495711, "epoch": 5972} {"train_loss": -27.435224533081055, "global_step": 495712, "epoch": 5972} {"train_loss": -27.147886276245117, "global_step": 495713, "epoch": 5972} {"train_loss": -27.2330379486084, "global_step": 495714, "epoch": 5972} {"train_loss": -27.585330963134766, "global_step": 495715, "epoch": 5972} {"train_loss": -26.976367950439453, "global_step": 495716, "epoch": 5972} {"train_loss": -27.4915714263916, "global_step": 495717, "epoch": 5972} {"train_loss": -27.50177001953125, "global_step": 495718, "epoch": 5972} {"train_loss": -27.4200496673584, "global_step": 495719, "epoch": 5972} {"train_loss": -27.415815353393555, "global_step": 495720, "epoch": 5972} {"train_loss": -27.446725845336914, "global_step": 495721, "epoch": 5972} {"train_loss": -27.43745231628418, "global_step": 495722, "epoch": 5972} {"train_loss": -27.816864013671875, "global_step": 495723, "epoch": 5972} {"train_loss": -27.675079345703125, "global_step": 495724, "epoch": 5972} {"train_loss": -27.28516960144043, "global_step": 495725, "epoch": 5972} {"train_loss": -27.246423721313477, "global_step": 495726, "epoch": 5972} {"train_loss": -27.505420684814453, "global_step": 495727, "epoch": 5972} {"train_loss": -27.27838134765625, "global_step": 495728, "epoch": 5972} {"train_loss": -27.156919479370117, "global_step": 495729, "epoch": 5972} {"train_loss": -26.18511962890625, "global_step": 495730, "epoch": 5972} {"train_loss": -26.169784545898438, "global_step": 495731, "epoch": 5972} {"train_loss": -26.271284103393555, "global_step": 495732, "epoch": 5972} {"train_loss": -26.72043228149414, "global_step": 495733, "epoch": 5972} {"train_loss": -26.229787826538086, "global_step": 495734, "epoch": 5972} {"train_loss": -26.247053146362305, "global_step": 495735, "epoch": 5972} {"train_loss": -27.21795654296875, "global_step": 495736, "epoch": 5972} {"train_loss": -26.532819747924805, "global_step": 495737, "epoch": 5972} {"train_loss": -26.794485092163086, "global_step": 495738, "epoch": 5972} {"train_loss": -27.115869522094727, "global_step": 495739, "epoch": 5972} {"train_loss": -26.674163818359375, "global_step": 495740, "epoch": 5972} {"train_loss": -26.976764678955078, "global_step": 495741, "epoch": 5972} {"train_loss": -27.10389518737793, "global_step": 495742, "epoch": 5972} {"train_loss": -27.04288673400879, "global_step": 495743, "epoch": 5972} {"train_loss": -27.399051666259766, "global_step": 495744, "epoch": 5972} {"train_loss": -27.161413192749023, "global_step": 495745, "epoch": 5972} {"train_loss": -27.206079483032227, "global_step": 495746, "epoch": 5972} {"train_loss": -27.006879806518555, "global_step": 495747, "epoch": 5972} {"train_loss": -26.812850952148438, "global_step": 495748, "epoch": 5972} {"train_loss": -27.09391212463379, "global_step": 495749, "epoch": 5972} {"train_loss": -27.28120231628418, "global_step": 495750, "epoch": 5972} {"train_loss": -27.1706600189209, "global_step": 495751, "epoch": 5972} {"train_loss": -27.02231788635254, "global_step": 495752, "epoch": 5972} {"train_loss": -27.38569450378418, "global_step": 495753, "epoch": 5972} {"train_loss": -27.272497177124023, "global_step": 495754, "epoch": 5972} {"train_loss": -26.861392974853516, "global_step": 495755, "epoch": 5972} {"train_loss": -26.875329971313477, "global_step": 495756, "epoch": 5972} {"train_loss": -27.44925308227539, "global_step": 495757, "epoch": 5972} {"train_loss": -26.973242909075267, "global_step": 495758, "epoch": 5972, "val_loss": 6514559.0} {"train_loss": -25.360458374023438, "global_step": 495759, "epoch": 5973} {"train_loss": -24.722089767456055, "global_step": 495760, "epoch": 5973} {"train_loss": -26.530500411987305, "global_step": 495761, "epoch": 5973} {"train_loss": -26.5390625, "global_step": 495762, "epoch": 5973} {"train_loss": -26.338781356811523, "global_step": 495763, "epoch": 5973} {"train_loss": -26.30820083618164, "global_step": 495764, "epoch": 5973} {"train_loss": -26.250263214111328, "global_step": 495765, "epoch": 5973} {"train_loss": -26.9086971282959, "global_step": 495766, "epoch": 5973} {"train_loss": -26.20331382751465, "global_step": 495767, "epoch": 5973} {"train_loss": -27.001571655273438, "global_step": 495768, "epoch": 5973} {"train_loss": -26.436431884765625, "global_step": 495769, "epoch": 5973} {"train_loss": -26.471357345581055, "global_step": 495770, "epoch": 5973} {"train_loss": -26.561471939086914, "global_step": 495771, "epoch": 5973} {"train_loss": -26.874731063842773, "global_step": 495772, "epoch": 5973} {"train_loss": -26.605688095092773, "global_step": 495773, "epoch": 5973} {"train_loss": -26.830829620361328, "global_step": 495774, "epoch": 5973} {"train_loss": -26.820905685424805, "global_step": 495775, "epoch": 5973} {"train_loss": -27.169416427612305, "global_step": 495776, "epoch": 5973} {"train_loss": -27.143796920776367, "global_step": 495777, "epoch": 5973} {"train_loss": -27.092309951782227, "global_step": 495778, "epoch": 5973} {"train_loss": -26.887781143188477, "global_step": 495779, "epoch": 5973} {"train_loss": -27.266494750976562, "global_step": 495780, "epoch": 5973} {"train_loss": -26.804861068725586, "global_step": 495781, "epoch": 5973} {"train_loss": -26.761865615844727, "global_step": 495782, "epoch": 5973} {"train_loss": -27.24350929260254, "global_step": 495783, "epoch": 5973} {"train_loss": -26.9660701751709, "global_step": 495784, "epoch": 5973} {"train_loss": -27.247724533081055, "global_step": 495785, "epoch": 5973} {"train_loss": -26.980947494506836, "global_step": 495786, "epoch": 5973} {"train_loss": -27.024534225463867, "global_step": 495787, "epoch": 5973} {"train_loss": -27.296066284179688, "global_step": 495788, "epoch": 5973} {"train_loss": -27.355976104736328, "global_step": 495789, "epoch": 5973} {"train_loss": -26.866230010986328, "global_step": 495790, "epoch": 5973} {"train_loss": -27.131744384765625, "global_step": 495791, "epoch": 5973} {"train_loss": -27.275537490844727, "global_step": 495792, "epoch": 5973} {"train_loss": -27.584949493408203, "global_step": 495793, "epoch": 5973} {"train_loss": -27.309186935424805, "global_step": 495794, "epoch": 5973} {"train_loss": -27.705759048461914, "global_step": 495795, "epoch": 5973} {"train_loss": -27.871118545532227, "global_step": 495796, "epoch": 5973} {"train_loss": -27.387298583984375, "global_step": 495797, "epoch": 5973} {"train_loss": -27.62031364440918, "global_step": 495798, "epoch": 5973} {"train_loss": -27.557342529296875, "global_step": 495799, "epoch": 5973} {"train_loss": -27.662168502807617, "global_step": 495800, "epoch": 5973} {"train_loss": -27.439443588256836, "global_step": 495801, "epoch": 5973} {"train_loss": -27.419775009155273, "global_step": 495802, "epoch": 5973} {"train_loss": -27.569992065429688, "global_step": 495803, "epoch": 5973} {"train_loss": -27.50986671447754, "global_step": 495804, "epoch": 5973} {"train_loss": -27.49732780456543, "global_step": 495805, "epoch": 5973} {"train_loss": -27.485570907592773, "global_step": 495806, "epoch": 5973} {"train_loss": -27.268884658813477, "global_step": 495807, "epoch": 5973} {"train_loss": -27.24006462097168, "global_step": 495808, "epoch": 5973} {"train_loss": -27.3353328704834, "global_step": 495809, "epoch": 5973} {"train_loss": -27.6377010345459, "global_step": 495810, "epoch": 5973} {"train_loss": -27.809497833251953, "global_step": 495811, "epoch": 5973} {"train_loss": -27.741281509399414, "global_step": 495812, "epoch": 5973} {"train_loss": -27.63750648498535, "global_step": 495813, "epoch": 5973} {"train_loss": -27.69854736328125, "global_step": 495814, "epoch": 5973} {"train_loss": -27.73150634765625, "global_step": 495815, "epoch": 5973} {"train_loss": -27.579914093017578, "global_step": 495816, "epoch": 5973} {"train_loss": -27.419538497924805, "global_step": 495817, "epoch": 5973} {"train_loss": -27.64047622680664, "global_step": 495818, "epoch": 5973} {"train_loss": -27.574542999267578, "global_step": 495819, "epoch": 5973} {"train_loss": -27.2484188079834, "global_step": 495820, "epoch": 5973} {"train_loss": -27.426956176757812, "global_step": 495821, "epoch": 5973} {"train_loss": -27.209716796875, "global_step": 495822, "epoch": 5973} {"train_loss": -26.6562442779541, "global_step": 495823, "epoch": 5973} {"train_loss": -26.073577880859375, "global_step": 495824, "epoch": 5973} {"train_loss": -26.640857696533203, "global_step": 495825, "epoch": 5973} {"train_loss": -27.376129150390625, "global_step": 495826, "epoch": 5973} {"train_loss": -26.70098304748535, "global_step": 495827, "epoch": 5973} {"train_loss": -27.12232780456543, "global_step": 495828, "epoch": 5973} {"train_loss": -27.006269454956055, "global_step": 495829, "epoch": 5973} {"train_loss": -27.24403190612793, "global_step": 495830, "epoch": 5973} {"train_loss": -27.339670181274414, "global_step": 495831, "epoch": 5973} {"train_loss": -27.2060489654541, "global_step": 495832, "epoch": 5973} {"train_loss": -27.018842697143555, "global_step": 495833, "epoch": 5973} {"train_loss": -26.994836807250977, "global_step": 495834, "epoch": 5973} {"train_loss": -27.32131004333496, "global_step": 495835, "epoch": 5973} {"train_loss": -27.493122100830078, "global_step": 495836, "epoch": 5973} {"train_loss": -27.36103630065918, "global_step": 495837, "epoch": 5973} {"train_loss": -27.391042709350586, "global_step": 495838, "epoch": 5973} {"train_loss": -27.473371505737305, "global_step": 495839, "epoch": 5973} {"train_loss": -27.43656349182129, "global_step": 495840, "epoch": 5973} {"train_loss": -27.12176168970315, "global_step": 495841, "epoch": 5973, "val_loss": 6584462.0} {"train_loss": -26.859582901000977, "global_step": 495842, "epoch": 5974} {"train_loss": -27.003833770751953, "global_step": 495843, "epoch": 5974} {"train_loss": -26.68499183654785, "global_step": 495844, "epoch": 5974} {"train_loss": -26.901514053344727, "global_step": 495845, "epoch": 5974} {"train_loss": -26.830097198486328, "global_step": 495846, "epoch": 5974} {"train_loss": -27.05775260925293, "global_step": 495847, "epoch": 5974} {"train_loss": -27.228580474853516, "global_step": 495848, "epoch": 5974} {"train_loss": -26.668231964111328, "global_step": 495849, "epoch": 5974} {"train_loss": -27.347341537475586, "global_step": 495850, "epoch": 5974} {"train_loss": -26.841888427734375, "global_step": 495851, "epoch": 5974} {"train_loss": -26.893644332885742, "global_step": 495852, "epoch": 5974} {"train_loss": -27.057727813720703, "global_step": 495853, "epoch": 5974} {"train_loss": -26.69435691833496, "global_step": 495854, "epoch": 5974} {"train_loss": -27.314619064331055, "global_step": 495855, "epoch": 5974} {"train_loss": -26.903188705444336, "global_step": 495856, "epoch": 5974} {"train_loss": -26.93902587890625, "global_step": 495857, "epoch": 5974} {"train_loss": -27.660070419311523, "global_step": 495858, "epoch": 5974} {"train_loss": -26.994611740112305, "global_step": 495859, "epoch": 5974} {"train_loss": -27.59498405456543, "global_step": 495860, "epoch": 5974} {"train_loss": -27.26678466796875, "global_step": 495861, "epoch": 5974} {"train_loss": -27.212100982666016, "global_step": 495862, "epoch": 5974} {"train_loss": -27.511219024658203, "global_step": 495863, "epoch": 5974} {"train_loss": -27.527795791625977, "global_step": 495864, "epoch": 5974} {"train_loss": -27.07008171081543, "global_step": 495865, "epoch": 5974} {"train_loss": -27.39084243774414, "global_step": 495866, "epoch": 5974} {"train_loss": -27.200925827026367, "global_step": 495867, "epoch": 5974} {"train_loss": -27.230712890625, "global_step": 495868, "epoch": 5974} {"train_loss": -26.50107765197754, "global_step": 495869, "epoch": 5974} {"train_loss": -27.13336753845215, "global_step": 495870, "epoch": 5974} {"train_loss": -27.5474853515625, "global_step": 495871, "epoch": 5974} {"train_loss": -27.098129272460938, "global_step": 495872, "epoch": 5974} {"train_loss": -27.47286033630371, "global_step": 495873, "epoch": 5974} {"train_loss": -27.649755477905273, "global_step": 495874, "epoch": 5974} {"train_loss": -27.449934005737305, "global_step": 495875, "epoch": 5974} {"train_loss": -27.1309871673584, "global_step": 495876, "epoch": 5974} {"train_loss": -27.332128524780273, "global_step": 495877, "epoch": 5974} {"train_loss": -27.457494735717773, "global_step": 495878, "epoch": 5974} {"train_loss": -27.47248649597168, "global_step": 495879, "epoch": 5974} {"train_loss": -27.649738311767578, "global_step": 495880, "epoch": 5974} {"train_loss": -27.563709259033203, "global_step": 495881, "epoch": 5974} {"train_loss": -27.352313995361328, "global_step": 495882, "epoch": 5974} {"train_loss": -27.59405517578125, "global_step": 495883, "epoch": 5974} {"train_loss": -27.598093032836914, "global_step": 495884, "epoch": 5974} {"train_loss": -27.117786407470703, "global_step": 495885, "epoch": 5974} {"train_loss": -27.867115020751953, "global_step": 495886, "epoch": 5974} {"train_loss": -27.50501823425293, "global_step": 495887, "epoch": 5974} {"train_loss": -27.46946144104004, "global_step": 495888, "epoch": 5974} {"train_loss": -27.293140411376953, "global_step": 495889, "epoch": 5974} {"train_loss": -27.581226348876953, "global_step": 495890, "epoch": 5974} {"train_loss": -27.4140567779541, "global_step": 495891, "epoch": 5974} {"train_loss": -27.13177490234375, "global_step": 495892, "epoch": 5974} {"train_loss": -27.32454490661621, "global_step": 495893, "epoch": 5974} {"train_loss": -27.499221801757812, "global_step": 495894, "epoch": 5974} {"train_loss": -27.77065086364746, "global_step": 495895, "epoch": 5974} {"train_loss": -27.553207397460938, "global_step": 495896, "epoch": 5974} {"train_loss": -27.53326416015625, "global_step": 495897, "epoch": 5974} {"train_loss": -27.313344955444336, "global_step": 495898, "epoch": 5974} {"train_loss": -27.397043228149414, "global_step": 495899, "epoch": 5974} {"train_loss": -27.8608341217041, "global_step": 495900, "epoch": 5974} {"train_loss": -27.5508975982666, "global_step": 495901, "epoch": 5974} {"train_loss": -27.4583740234375, "global_step": 495902, "epoch": 5974} {"train_loss": -27.529504776000977, "global_step": 495903, "epoch": 5974} {"train_loss": -27.522626876831055, "global_step": 495904, "epoch": 5974} {"train_loss": -27.80878257751465, "global_step": 495905, "epoch": 5974} {"train_loss": -27.529407501220703, "global_step": 495906, "epoch": 5974} {"train_loss": -27.518163681030273, "global_step": 495907, "epoch": 5974} {"train_loss": -27.366153717041016, "global_step": 495908, "epoch": 5974} {"train_loss": -27.55158805847168, "global_step": 495909, "epoch": 5974} {"train_loss": -27.069507598876953, "global_step": 495910, "epoch": 5974} {"train_loss": -27.4775390625, "global_step": 495911, "epoch": 5974} {"train_loss": -27.526418685913086, "global_step": 495912, "epoch": 5974} {"train_loss": -27.469348907470703, "global_step": 495913, "epoch": 5974} {"train_loss": -27.392425537109375, "global_step": 495914, "epoch": 5974} {"train_loss": -27.413503646850586, "global_step": 495915, "epoch": 5974} {"train_loss": -27.374805450439453, "global_step": 495916, "epoch": 5974} {"train_loss": -27.48381996154785, "global_step": 495917, "epoch": 5974} {"train_loss": -27.750268936157227, "global_step": 495918, "epoch": 5974} {"train_loss": -27.52009391784668, "global_step": 495919, "epoch": 5974} {"train_loss": -27.04304313659668, "global_step": 495920, "epoch": 5974} {"train_loss": -26.74244499206543, "global_step": 495921, "epoch": 5974} {"train_loss": -26.902326583862305, "global_step": 495922, "epoch": 5974} {"train_loss": -27.320743560791016, "global_step": 495923, "epoch": 5974} {"train_loss": -27.322487750685358, "global_step": 495924, "epoch": 5974, "val_loss": 6663196.0} {"train_loss": -27.050933837890625, "global_step": 495925, "epoch": 5975} {"train_loss": -26.89605712890625, "global_step": 495926, "epoch": 5975} {"train_loss": -26.806488037109375, "global_step": 495927, "epoch": 5975} {"train_loss": -27.05091667175293, "global_step": 495928, "epoch": 5975} {"train_loss": -26.754199981689453, "global_step": 495929, "epoch": 5975} {"train_loss": -27.257673263549805, "global_step": 495930, "epoch": 5975} {"train_loss": -26.8253116607666, "global_step": 495931, "epoch": 5975} {"train_loss": -26.902021408081055, "global_step": 495932, "epoch": 5975} {"train_loss": -26.797327041625977, "global_step": 495933, "epoch": 5975} {"train_loss": -26.839223861694336, "global_step": 495934, "epoch": 5975} {"train_loss": -26.74818229675293, "global_step": 495935, "epoch": 5975} {"train_loss": -26.969022750854492, "global_step": 495936, "epoch": 5975} {"train_loss": -26.605920791625977, "global_step": 495937, "epoch": 5975} {"train_loss": -26.9969539642334, "global_step": 495938, "epoch": 5975} {"train_loss": -27.207101821899414, "global_step": 495939, "epoch": 5975} {"train_loss": -27.3817138671875, "global_step": 495940, "epoch": 5975} {"train_loss": -27.1488094329834, "global_step": 495941, "epoch": 5975} {"train_loss": -27.625890731811523, "global_step": 495942, "epoch": 5975} {"train_loss": -27.171483993530273, "global_step": 495943, "epoch": 5975} {"train_loss": -27.4155330657959, "global_step": 495944, "epoch": 5975} {"train_loss": -27.289655685424805, "global_step": 495945, "epoch": 5975} {"train_loss": -27.567779541015625, "global_step": 495946, "epoch": 5975} {"train_loss": -27.4229679107666, "global_step": 495947, "epoch": 5975} {"train_loss": -27.32142448425293, "global_step": 495948, "epoch": 5975} {"train_loss": -27.105146408081055, "global_step": 495949, "epoch": 5975} {"train_loss": -27.07962989807129, "global_step": 495950, "epoch": 5975} {"train_loss": -27.231983184814453, "global_step": 495951, "epoch": 5975} {"train_loss": -27.272403717041016, "global_step": 495952, "epoch": 5975} {"train_loss": -27.472909927368164, "global_step": 495953, "epoch": 5975} {"train_loss": -27.486419677734375, "global_step": 495954, "epoch": 5975} {"train_loss": -27.37483024597168, "global_step": 495955, "epoch": 5975} {"train_loss": -27.787012100219727, "global_step": 495956, "epoch": 5975} {"train_loss": -27.53059196472168, "global_step": 495957, "epoch": 5975} {"train_loss": -27.695669174194336, "global_step": 495958, "epoch": 5975} {"train_loss": -27.640573501586914, "global_step": 495959, "epoch": 5975} {"train_loss": -27.898298263549805, "global_step": 495960, "epoch": 5975} {"train_loss": -27.22772216796875, "global_step": 495961, "epoch": 5975} {"train_loss": -27.48300552368164, "global_step": 495962, "epoch": 5975} {"train_loss": -27.535608291625977, "global_step": 495963, "epoch": 5975} {"train_loss": -27.542865753173828, "global_step": 495964, "epoch": 5975} {"train_loss": -27.859888076782227, "global_step": 495965, "epoch": 5975} {"train_loss": -27.617841720581055, "global_step": 495966, "epoch": 5975} {"train_loss": -27.573108673095703, "global_step": 495967, "epoch": 5975} {"train_loss": -27.458057403564453, "global_step": 495968, "epoch": 5975} {"train_loss": -27.356109619140625, "global_step": 495969, "epoch": 5975} {"train_loss": -27.406518936157227, "global_step": 495970, "epoch": 5975} {"train_loss": -27.33725357055664, "global_step": 495971, "epoch": 5975} {"train_loss": -27.377283096313477, "global_step": 495972, "epoch": 5975} {"train_loss": -27.366165161132812, "global_step": 495973, "epoch": 5975} {"train_loss": -27.745777130126953, "global_step": 495974, "epoch": 5975} {"train_loss": -27.043842315673828, "global_step": 495975, "epoch": 5975} {"train_loss": -27.10291862487793, "global_step": 495976, "epoch": 5975} {"train_loss": -27.56499671936035, "global_step": 495977, "epoch": 5975} {"train_loss": -27.13921546936035, "global_step": 495978, "epoch": 5975} {"train_loss": -27.079483032226562, "global_step": 495979, "epoch": 5975} {"train_loss": -27.22319984436035, "global_step": 495980, "epoch": 5975} {"train_loss": -26.710041046142578, "global_step": 495981, "epoch": 5975} {"train_loss": -27.330854415893555, "global_step": 495982, "epoch": 5975} {"train_loss": -27.12883949279785, "global_step": 495983, "epoch": 5975} {"train_loss": -26.877735137939453, "global_step": 495984, "epoch": 5975} {"train_loss": -26.80242919921875, "global_step": 495985, "epoch": 5975} {"train_loss": -27.283002853393555, "global_step": 495986, "epoch": 5975} {"train_loss": -26.999563217163086, "global_step": 495987, "epoch": 5975} {"train_loss": -26.99493980407715, "global_step": 495988, "epoch": 5975} {"train_loss": -26.9306640625, "global_step": 495989, "epoch": 5975} {"train_loss": -27.32931900024414, "global_step": 495990, "epoch": 5975} {"train_loss": -27.398962020874023, "global_step": 495991, "epoch": 5975} {"train_loss": -26.461450576782227, "global_step": 495992, "epoch": 5975} {"train_loss": -27.340620040893555, "global_step": 495993, "epoch": 5975} {"train_loss": -26.767194747924805, "global_step": 495994, "epoch": 5975} {"train_loss": -27.2559757232666, "global_step": 495995, "epoch": 5975} {"train_loss": -27.628332138061523, "global_step": 495996, "epoch": 5975} {"train_loss": -27.324670791625977, "global_step": 495997, "epoch": 5975} {"train_loss": -27.3538761138916, "global_step": 495998, "epoch": 5975} {"train_loss": -27.522613525390625, "global_step": 495999, "epoch": 5975} {"train_loss": -27.410552978515625, "global_step": 496000, "epoch": 5975} {"train_loss": -27.512420654296875, "global_step": 496001, "epoch": 5975} {"train_loss": -27.64434242248535, "global_step": 496002, "epoch": 5975} {"train_loss": -27.389862060546875, "global_step": 496003, "epoch": 5975} {"train_loss": -27.24177360534668, "global_step": 496004, "epoch": 5975} {"train_loss": -27.20698356628418, "global_step": 496005, "epoch": 5975} {"train_loss": -27.350500106811523, "global_step": 496006, "epoch": 5975} {"train_loss": -27.231832596192877, "global_step": 496007, "epoch": 5975, "val_loss": 6574158.0} {"train_loss": -26.828710556030273, "global_step": 496008, "epoch": 5976} {"train_loss": -27.023120880126953, "global_step": 496009, "epoch": 5976} {"train_loss": -27.418994903564453, "global_step": 496010, "epoch": 5976} {"train_loss": -26.35206413269043, "global_step": 496011, "epoch": 5976} {"train_loss": -27.114212036132812, "global_step": 496012, "epoch": 5976} {"train_loss": -26.926645278930664, "global_step": 496013, "epoch": 5976} {"train_loss": -27.131025314331055, "global_step": 496014, "epoch": 5976} {"train_loss": -26.7724666595459, "global_step": 496015, "epoch": 5976} {"train_loss": -26.495786666870117, "global_step": 496016, "epoch": 5976} {"train_loss": -26.894826889038086, "global_step": 496017, "epoch": 5976} {"train_loss": -26.87176513671875, "global_step": 496018, "epoch": 5976} {"train_loss": -26.98909568786621, "global_step": 496019, "epoch": 5976} {"train_loss": -26.900985717773438, "global_step": 496020, "epoch": 5976} {"train_loss": -27.61199378967285, "global_step": 496021, "epoch": 5976} {"train_loss": -26.945362091064453, "global_step": 496022, "epoch": 5976} {"train_loss": -26.903522491455078, "global_step": 496023, "epoch": 5976} {"train_loss": -27.091598510742188, "global_step": 496024, "epoch": 5976} {"train_loss": -27.224029541015625, "global_step": 496025, "epoch": 5976} {"train_loss": -26.68757438659668, "global_step": 496026, "epoch": 5976} {"train_loss": -27.3802433013916, "global_step": 496027, "epoch": 5976} {"train_loss": -27.156864166259766, "global_step": 496028, "epoch": 5976} {"train_loss": -27.267026901245117, "global_step": 496029, "epoch": 5976} {"train_loss": -27.011320114135742, "global_step": 496030, "epoch": 5976} {"train_loss": -27.530500411987305, "global_step": 496031, "epoch": 5976} {"train_loss": -27.552892684936523, "global_step": 496032, "epoch": 5976} {"train_loss": -26.83258056640625, "global_step": 496033, "epoch": 5976} {"train_loss": -27.15778923034668, "global_step": 496034, "epoch": 5976} {"train_loss": -26.961694717407227, "global_step": 496035, "epoch": 5976} {"train_loss": -27.223432540893555, "global_step": 496036, "epoch": 5976} {"train_loss": -27.433197021484375, "global_step": 496037, "epoch": 5976} {"train_loss": -27.074499130249023, "global_step": 496038, "epoch": 5976} {"train_loss": -27.34746742248535, "global_step": 496039, "epoch": 5976} {"train_loss": -27.31757164001465, "global_step": 496040, "epoch": 5976} {"train_loss": -27.468225479125977, "global_step": 496041, "epoch": 5976} {"train_loss": -27.569732666015625, "global_step": 496042, "epoch": 5976} {"train_loss": -27.39577293395996, "global_step": 496043, "epoch": 5976} {"train_loss": -27.557138442993164, "global_step": 496044, "epoch": 5976} {"train_loss": -27.664392471313477, "global_step": 496045, "epoch": 5976} {"train_loss": -27.279743194580078, "global_step": 496046, "epoch": 5976} {"train_loss": -27.406864166259766, "global_step": 496047, "epoch": 5976} {"train_loss": -27.584461212158203, "global_step": 496048, "epoch": 5976} {"train_loss": -27.555017471313477, "global_step": 496049, "epoch": 5976} {"train_loss": -27.635456085205078, "global_step": 496050, "epoch": 5976} {"train_loss": -27.269439697265625, "global_step": 496051, "epoch": 5976} {"train_loss": -27.2791805267334, "global_step": 496052, "epoch": 5976} {"train_loss": -27.38701820373535, "global_step": 496053, "epoch": 5976} {"train_loss": -27.299652099609375, "global_step": 496054, "epoch": 5976} {"train_loss": -27.772430419921875, "global_step": 496055, "epoch": 5976} {"train_loss": -27.456933975219727, "global_step": 496056, "epoch": 5976} {"train_loss": -27.549407958984375, "global_step": 496057, "epoch": 5976} {"train_loss": -27.189407348632812, "global_step": 496058, "epoch": 5976} {"train_loss": -27.28789710998535, "global_step": 496059, "epoch": 5976} {"train_loss": -27.644500732421875, "global_step": 496060, "epoch": 5976} {"train_loss": -27.06534767150879, "global_step": 496061, "epoch": 5976} {"train_loss": -27.41627311706543, "global_step": 496062, "epoch": 5976} {"train_loss": -27.43025779724121, "global_step": 496063, "epoch": 5976} {"train_loss": -27.778715133666992, "global_step": 496064, "epoch": 5976} {"train_loss": -27.081241607666016, "global_step": 496065, "epoch": 5976} {"train_loss": -27.912214279174805, "global_step": 496066, "epoch": 5976} {"train_loss": -28.043731689453125, "global_step": 496067, "epoch": 5976} {"train_loss": -27.772790908813477, "global_step": 496068, "epoch": 5976} {"train_loss": -27.782073974609375, "global_step": 496069, "epoch": 5976} {"train_loss": -27.489465713500977, "global_step": 496070, "epoch": 5976} {"train_loss": -27.33393669128418, "global_step": 496071, "epoch": 5976} {"train_loss": -27.35865592956543, "global_step": 496072, "epoch": 5976} {"train_loss": -27.24790382385254, "global_step": 496073, "epoch": 5976} {"train_loss": -27.37168312072754, "global_step": 496074, "epoch": 5976} {"train_loss": -27.791059494018555, "global_step": 496075, "epoch": 5976} {"train_loss": -27.665090560913086, "global_step": 496076, "epoch": 5976} {"train_loss": -27.798059463500977, "global_step": 496077, "epoch": 5976} {"train_loss": -27.457822799682617, "global_step": 496078, "epoch": 5976} {"train_loss": -27.213855743408203, "global_step": 496079, "epoch": 5976} {"train_loss": -27.413965225219727, "global_step": 496080, "epoch": 5976} {"train_loss": -27.428924560546875, "global_step": 496081, "epoch": 5976} {"train_loss": -27.22429847717285, "global_step": 496082, "epoch": 5976} {"train_loss": -28.0311279296875, "global_step": 496083, "epoch": 5976} {"train_loss": -27.515579223632812, "global_step": 496084, "epoch": 5976} {"train_loss": -27.495655059814453, "global_step": 496085, "epoch": 5976} {"train_loss": -27.57900047302246, "global_step": 496086, "epoch": 5976} {"train_loss": -27.31130027770996, "global_step": 496087, "epoch": 5976} {"train_loss": -27.399494171142578, "global_step": 496088, "epoch": 5976} {"train_loss": -27.2276668548584, "global_step": 496089, "epoch": 5976} {"train_loss": -27.323366693703527, "global_step": 496090, "epoch": 5976, "val_loss": 6614999.0} {"train_loss": -26.92339515686035, "global_step": 496091, "epoch": 5977} {"train_loss": -26.756427764892578, "global_step": 496092, "epoch": 5977} {"train_loss": -26.373523712158203, "global_step": 496093, "epoch": 5977} {"train_loss": -26.07942771911621, "global_step": 496094, "epoch": 5977} {"train_loss": -25.76987648010254, "global_step": 496095, "epoch": 5977} {"train_loss": -26.318510055541992, "global_step": 496096, "epoch": 5977} {"train_loss": -26.653644561767578, "global_step": 496097, "epoch": 5977} {"train_loss": -26.667285919189453, "global_step": 496098, "epoch": 5977} {"train_loss": -27.0360164642334, "global_step": 496099, "epoch": 5977} {"train_loss": -26.606470108032227, "global_step": 496100, "epoch": 5977} {"train_loss": -27.185083389282227, "global_step": 496101, "epoch": 5977} {"train_loss": -26.77121353149414, "global_step": 496102, "epoch": 5977} {"train_loss": -27.00006103515625, "global_step": 496103, "epoch": 5977} {"train_loss": -26.7285099029541, "global_step": 496104, "epoch": 5977} {"train_loss": -27.263381958007812, "global_step": 496105, "epoch": 5977} {"train_loss": -26.870309829711914, "global_step": 496106, "epoch": 5977} {"train_loss": -26.945026397705078, "global_step": 496107, "epoch": 5977} {"train_loss": -27.18267822265625, "global_step": 496108, "epoch": 5977} {"train_loss": -26.83363151550293, "global_step": 496109, "epoch": 5977} {"train_loss": -27.284427642822266, "global_step": 496110, "epoch": 5977} {"train_loss": -27.0572452545166, "global_step": 496111, "epoch": 5977} {"train_loss": -27.005212783813477, "global_step": 496112, "epoch": 5977} {"train_loss": -27.3432559967041, "global_step": 496113, "epoch": 5977} {"train_loss": -27.5054988861084, "global_step": 496114, "epoch": 5977} {"train_loss": -27.560171127319336, "global_step": 496115, "epoch": 5977} {"train_loss": -27.091705322265625, "global_step": 496116, "epoch": 5977} {"train_loss": -27.51203727722168, "global_step": 496117, "epoch": 5977} {"train_loss": -27.19813346862793, "global_step": 496118, "epoch": 5977} {"train_loss": -27.415388107299805, "global_step": 496119, "epoch": 5977} {"train_loss": -26.993793487548828, "global_step": 496120, "epoch": 5977} {"train_loss": -28.192672729492188, "global_step": 496121, "epoch": 5977} {"train_loss": -27.4646053314209, "global_step": 496122, "epoch": 5977} {"train_loss": -27.448572158813477, "global_step": 496123, "epoch": 5977} {"train_loss": -27.22088623046875, "global_step": 496124, "epoch": 5977} {"train_loss": -27.175369262695312, "global_step": 496125, "epoch": 5977} {"train_loss": -27.769916534423828, "global_step": 496126, "epoch": 5977} {"train_loss": -27.56768226623535, "global_step": 496127, "epoch": 5977} {"train_loss": -27.70122718811035, "global_step": 496128, "epoch": 5977} {"train_loss": -27.513761520385742, "global_step": 496129, "epoch": 5977} {"train_loss": -27.47406005859375, "global_step": 496130, "epoch": 5977} {"train_loss": -27.397525787353516, "global_step": 496131, "epoch": 5977} {"train_loss": -27.34562110900879, "global_step": 496132, "epoch": 5977} {"train_loss": -27.452306747436523, "global_step": 496133, "epoch": 5977} {"train_loss": -27.65803337097168, "global_step": 496134, "epoch": 5977} {"train_loss": -27.38089942932129, "global_step": 496135, "epoch": 5977} {"train_loss": -27.598377227783203, "global_step": 496136, "epoch": 5977} {"train_loss": -27.347461700439453, "global_step": 496137, "epoch": 5977} {"train_loss": -27.345304489135742, "global_step": 496138, "epoch": 5977} {"train_loss": -27.353601455688477, "global_step": 496139, "epoch": 5977} {"train_loss": -27.280120849609375, "global_step": 496140, "epoch": 5977} {"train_loss": -27.237146377563477, "global_step": 496141, "epoch": 5977} {"train_loss": -27.51092529296875, "global_step": 496142, "epoch": 5977} {"train_loss": -27.523365020751953, "global_step": 496143, "epoch": 5977} {"train_loss": -27.588729858398438, "global_step": 496144, "epoch": 5977} {"train_loss": -27.638355255126953, "global_step": 496145, "epoch": 5977} {"train_loss": -27.409467697143555, "global_step": 496146, "epoch": 5977} {"train_loss": -27.777057647705078, "global_step": 496147, "epoch": 5977} {"train_loss": -27.66742515563965, "global_step": 496148, "epoch": 5977} {"train_loss": -27.225112915039062, "global_step": 496149, "epoch": 5977} {"train_loss": -27.580102920532227, "global_step": 496150, "epoch": 5977} {"train_loss": -27.54481315612793, "global_step": 496151, "epoch": 5977} {"train_loss": -27.488874435424805, "global_step": 496152, "epoch": 5977} {"train_loss": -27.24007225036621, "global_step": 496153, "epoch": 5977} {"train_loss": -27.396961212158203, "global_step": 496154, "epoch": 5977} {"train_loss": -27.43482780456543, "global_step": 496155, "epoch": 5977} {"train_loss": -27.439697265625, "global_step": 496156, "epoch": 5977} {"train_loss": -27.295209884643555, "global_step": 496157, "epoch": 5977} {"train_loss": -27.088409423828125, "global_step": 496158, "epoch": 5977} {"train_loss": -27.323400497436523, "global_step": 496159, "epoch": 5977} {"train_loss": -27.49210548400879, "global_step": 496160, "epoch": 5977} {"train_loss": -27.174814224243164, "global_step": 496161, "epoch": 5977} {"train_loss": -27.47784423828125, "global_step": 496162, "epoch": 5977} {"train_loss": -27.50347328186035, "global_step": 496163, "epoch": 5977} {"train_loss": -27.351476669311523, "global_step": 496164, "epoch": 5977} {"train_loss": -27.216535568237305, "global_step": 496165, "epoch": 5977} {"train_loss": -27.597217559814453, "global_step": 496166, "epoch": 5977} {"train_loss": -27.054929733276367, "global_step": 496167, "epoch": 5977} {"train_loss": -27.3549747467041, "global_step": 496168, "epoch": 5977} {"train_loss": -27.53248405456543, "global_step": 496169, "epoch": 5977} {"train_loss": -27.537527084350586, "global_step": 496170, "epoch": 5977} {"train_loss": -27.173795700073242, "global_step": 496171, "epoch": 5977} {"train_loss": -27.529617309570312, "global_step": 496172, "epoch": 5977} {"train_loss": -27.26277891411839, "global_step": 496173, "epoch": 5977, "val_loss": 6614273.0} {"train_loss": -26.844879150390625, "global_step": 496174, "epoch": 5978} {"train_loss": -26.52984619140625, "global_step": 496175, "epoch": 5978} {"train_loss": -27.229129791259766, "global_step": 496176, "epoch": 5978} {"train_loss": -26.900854110717773, "global_step": 496177, "epoch": 5978} {"train_loss": -26.725610733032227, "global_step": 496178, "epoch": 5978} {"train_loss": -26.69597816467285, "global_step": 496179, "epoch": 5978} {"train_loss": -27.32423210144043, "global_step": 496180, "epoch": 5978} {"train_loss": -26.688323974609375, "global_step": 496181, "epoch": 5978} {"train_loss": -27.112567901611328, "global_step": 496182, "epoch": 5978} {"train_loss": -27.355512619018555, "global_step": 496183, "epoch": 5978} {"train_loss": -26.6521053314209, "global_step": 496184, "epoch": 5978} {"train_loss": -27.261138916015625, "global_step": 496185, "epoch": 5978} {"train_loss": -26.183069229125977, "global_step": 496186, "epoch": 5978} {"train_loss": -27.02593421936035, "global_step": 496187, "epoch": 5978} {"train_loss": -26.124210357666016, "global_step": 496188, "epoch": 5978} {"train_loss": -27.12916374206543, "global_step": 496189, "epoch": 5978} {"train_loss": -26.548995971679688, "global_step": 496190, "epoch": 5978} {"train_loss": -27.44808006286621, "global_step": 496191, "epoch": 5978} {"train_loss": -26.835845947265625, "global_step": 496192, "epoch": 5978} {"train_loss": -27.076618194580078, "global_step": 496193, "epoch": 5978} {"train_loss": -26.988412857055664, "global_step": 496194, "epoch": 5978} {"train_loss": -27.12808609008789, "global_step": 496195, "epoch": 5978} {"train_loss": -27.33026123046875, "global_step": 496196, "epoch": 5978} {"train_loss": -27.124677658081055, "global_step": 496197, "epoch": 5978} {"train_loss": -27.39176368713379, "global_step": 496198, "epoch": 5978} {"train_loss": -27.21123695373535, "global_step": 496199, "epoch": 5978} {"train_loss": -27.18903160095215, "global_step": 496200, "epoch": 5978} {"train_loss": -27.55442237854004, "global_step": 496201, "epoch": 5978} {"train_loss": -27.178604125976562, "global_step": 496202, "epoch": 5978} {"train_loss": -27.356306076049805, "global_step": 496203, "epoch": 5978} {"train_loss": -27.6778621673584, "global_step": 496204, "epoch": 5978} {"train_loss": -27.090518951416016, "global_step": 496205, "epoch": 5978} {"train_loss": -27.4027156829834, "global_step": 496206, "epoch": 5978} {"train_loss": -27.05621910095215, "global_step": 496207, "epoch": 5978} {"train_loss": -27.110883712768555, "global_step": 496208, "epoch": 5978} {"train_loss": -27.168676376342773, "global_step": 496209, "epoch": 5978} {"train_loss": -26.789051055908203, "global_step": 496210, "epoch": 5978} {"train_loss": -27.352466583251953, "global_step": 496211, "epoch": 5978} {"train_loss": -27.102066040039062, "global_step": 496212, "epoch": 5978} {"train_loss": -27.083026885986328, "global_step": 496213, "epoch": 5978} {"train_loss": -27.423450469970703, "global_step": 496214, "epoch": 5978} {"train_loss": -26.649927139282227, "global_step": 496215, "epoch": 5978} {"train_loss": -26.99409294128418, "global_step": 496216, "epoch": 5978} {"train_loss": -26.7200870513916, "global_step": 496217, "epoch": 5978} {"train_loss": -26.92317771911621, "global_step": 496218, "epoch": 5978} {"train_loss": -27.398977279663086, "global_step": 496219, "epoch": 5978} {"train_loss": -27.046728134155273, "global_step": 496220, "epoch": 5978} {"train_loss": -27.327198028564453, "global_step": 496221, "epoch": 5978} {"train_loss": -27.217681884765625, "global_step": 496222, "epoch": 5978} {"train_loss": -27.003278732299805, "global_step": 496223, "epoch": 5978} {"train_loss": -27.152307510375977, "global_step": 496224, "epoch": 5978} {"train_loss": -27.247220993041992, "global_step": 496225, "epoch": 5978} {"train_loss": -26.849185943603516, "global_step": 496226, "epoch": 5978} {"train_loss": -27.13671875, "global_step": 496227, "epoch": 5978} {"train_loss": -27.325836181640625, "global_step": 496228, "epoch": 5978} {"train_loss": -27.3460750579834, "global_step": 496229, "epoch": 5978} {"train_loss": -27.146337509155273, "global_step": 496230, "epoch": 5978} {"train_loss": -27.017562866210938, "global_step": 496231, "epoch": 5978} {"train_loss": -26.905057907104492, "global_step": 496232, "epoch": 5978} {"train_loss": -27.375181198120117, "global_step": 496233, "epoch": 5978} {"train_loss": -27.37152099609375, "global_step": 496234, "epoch": 5978} {"train_loss": -27.21015739440918, "global_step": 496235, "epoch": 5978} {"train_loss": -27.191892623901367, "global_step": 496236, "epoch": 5978} {"train_loss": -27.485004425048828, "global_step": 496237, "epoch": 5978} {"train_loss": -27.156408309936523, "global_step": 496238, "epoch": 5978} {"train_loss": -27.31353759765625, "global_step": 496239, "epoch": 5978} {"train_loss": -27.568750381469727, "global_step": 496240, "epoch": 5978} {"train_loss": -27.2569522857666, "global_step": 496241, "epoch": 5978} {"train_loss": -27.376821517944336, "global_step": 496242, "epoch": 5978} {"train_loss": -27.310108184814453, "global_step": 496243, "epoch": 5978} {"train_loss": -27.425764083862305, "global_step": 496244, "epoch": 5978} {"train_loss": -27.387475967407227, "global_step": 496245, "epoch": 5978} {"train_loss": -27.667943954467773, "global_step": 496246, "epoch": 5978} {"train_loss": -27.650644302368164, "global_step": 496247, "epoch": 5978} {"train_loss": -27.743810653686523, "global_step": 496248, "epoch": 5978} {"train_loss": -27.913482666015625, "global_step": 496249, "epoch": 5978} {"train_loss": -27.6750431060791, "global_step": 496250, "epoch": 5978} {"train_loss": -27.24615478515625, "global_step": 496251, "epoch": 5978} {"train_loss": -27.275074005126953, "global_step": 496252, "epoch": 5978} {"train_loss": -27.28264808654785, "global_step": 496253, "epoch": 5978} {"train_loss": -27.476415634155273, "global_step": 496254, "epoch": 5978} {"train_loss": -26.99652099609375, "global_step": 496255, "epoch": 5978} {"train_loss": -27.156126642801677, "global_step": 496256, "epoch": 5978, "val_loss": 6531954.5} {"train_loss": -23.878923416137695, "global_step": 496257, "epoch": 5979} {"train_loss": -23.780864715576172, "global_step": 496258, "epoch": 5979} {"train_loss": -26.65256118774414, "global_step": 496259, "epoch": 5979} {"train_loss": -23.299936294555664, "global_step": 496260, "epoch": 5979} {"train_loss": -26.07952880859375, "global_step": 496261, "epoch": 5979} {"train_loss": -25.381202697753906, "global_step": 496262, "epoch": 5979} {"train_loss": -26.330488204956055, "global_step": 496263, "epoch": 5979} {"train_loss": -25.62330436706543, "global_step": 496264, "epoch": 5979} {"train_loss": -26.586816787719727, "global_step": 496265, "epoch": 5979} {"train_loss": -26.600086212158203, "global_step": 496266, "epoch": 5979} {"train_loss": -26.395170211791992, "global_step": 496267, "epoch": 5979} {"train_loss": -26.110090255737305, "global_step": 496268, "epoch": 5979} {"train_loss": -26.764535903930664, "global_step": 496269, "epoch": 5979} {"train_loss": -26.529111862182617, "global_step": 496270, "epoch": 5979} {"train_loss": -26.629377365112305, "global_step": 496271, "epoch": 5979} {"train_loss": -26.558612823486328, "global_step": 496272, "epoch": 5979} {"train_loss": -26.473804473876953, "global_step": 496273, "epoch": 5979} {"train_loss": -26.946996688842773, "global_step": 496274, "epoch": 5979} {"train_loss": -26.589452743530273, "global_step": 496275, "epoch": 5979} {"train_loss": -26.64351463317871, "global_step": 496276, "epoch": 5979} {"train_loss": -26.784061431884766, "global_step": 496277, "epoch": 5979} {"train_loss": -26.741498947143555, "global_step": 496278, "epoch": 5979} {"train_loss": -26.6322078704834, "global_step": 496279, "epoch": 5979} {"train_loss": -26.716217041015625, "global_step": 496280, "epoch": 5979} {"train_loss": -26.638891220092773, "global_step": 496281, "epoch": 5979} {"train_loss": -26.925312042236328, "global_step": 496282, "epoch": 5979} {"train_loss": -26.467519760131836, "global_step": 496283, "epoch": 5979} {"train_loss": -26.756643295288086, "global_step": 496284, "epoch": 5979} {"train_loss": -27.33180046081543, "global_step": 496285, "epoch": 5979} {"train_loss": -26.88313865661621, "global_step": 496286, "epoch": 5979} {"train_loss": -27.159454345703125, "global_step": 496287, "epoch": 5979} {"train_loss": -26.994577407836914, "global_step": 496288, "epoch": 5979} {"train_loss": -27.19657325744629, "global_step": 496289, "epoch": 5979} {"train_loss": -27.309192657470703, "global_step": 496290, "epoch": 5979} {"train_loss": -27.392866134643555, "global_step": 496291, "epoch": 5979} {"train_loss": -27.384353637695312, "global_step": 496292, "epoch": 5979} {"train_loss": -27.172399520874023, "global_step": 496293, "epoch": 5979} {"train_loss": -27.011066436767578, "global_step": 496294, "epoch": 5979} {"train_loss": -27.003021240234375, "global_step": 496295, "epoch": 5979} {"train_loss": -26.770612716674805, "global_step": 496296, "epoch": 5979} {"train_loss": -27.048349380493164, "global_step": 496297, "epoch": 5979} {"train_loss": -27.351293563842773, "global_step": 496298, "epoch": 5979} {"train_loss": -27.448545455932617, "global_step": 496299, "epoch": 5979} {"train_loss": -27.27199363708496, "global_step": 496300, "epoch": 5979} {"train_loss": -27.493406295776367, "global_step": 496301, "epoch": 5979} {"train_loss": -27.09527587890625, "global_step": 496302, "epoch": 5979} {"train_loss": -27.11199951171875, "global_step": 496303, "epoch": 5979} {"train_loss": -27.479694366455078, "global_step": 496304, "epoch": 5979} {"train_loss": -27.45179557800293, "global_step": 496305, "epoch": 5979} {"train_loss": -27.2254695892334, "global_step": 496306, "epoch": 5979} {"train_loss": -27.287687301635742, "global_step": 496307, "epoch": 5979} {"train_loss": -27.357152938842773, "global_step": 496308, "epoch": 5979} {"train_loss": -27.286457061767578, "global_step": 496309, "epoch": 5979} {"train_loss": -27.267139434814453, "global_step": 496310, "epoch": 5979} {"train_loss": -27.122543334960938, "global_step": 496311, "epoch": 5979} {"train_loss": -27.3831729888916, "global_step": 496312, "epoch": 5979} {"train_loss": -27.34186363220215, "global_step": 496313, "epoch": 5979} {"train_loss": -27.56098747253418, "global_step": 496314, "epoch": 5979} {"train_loss": -27.096960067749023, "global_step": 496315, "epoch": 5979} {"train_loss": -26.8659725189209, "global_step": 496316, "epoch": 5979} {"train_loss": -27.290332794189453, "global_step": 496317, "epoch": 5979} {"train_loss": -27.457258224487305, "global_step": 496318, "epoch": 5979} {"train_loss": -27.469694137573242, "global_step": 496319, "epoch": 5979} {"train_loss": -27.27290916442871, "global_step": 496320, "epoch": 5979} {"train_loss": -27.4144344329834, "global_step": 496321, "epoch": 5979} {"train_loss": -27.492557525634766, "global_step": 496322, "epoch": 5979} {"train_loss": -27.20001792907715, "global_step": 496323, "epoch": 5979} {"train_loss": -27.300857543945312, "global_step": 496324, "epoch": 5979} {"train_loss": -27.24848747253418, "global_step": 496325, "epoch": 5979} {"train_loss": -27.317956924438477, "global_step": 496326, "epoch": 5979} {"train_loss": -27.20166015625, "global_step": 496327, "epoch": 5979} {"train_loss": -26.827878952026367, "global_step": 496328, "epoch": 5979} {"train_loss": -27.39947509765625, "global_step": 496329, "epoch": 5979} {"train_loss": -27.051599502563477, "global_step": 496330, "epoch": 5979} {"train_loss": -27.14496421813965, "global_step": 496331, "epoch": 5979} {"train_loss": -27.550647735595703, "global_step": 496332, "epoch": 5979} {"train_loss": -27.512237548828125, "global_step": 496333, "epoch": 5979} {"train_loss": -27.30767822265625, "global_step": 496334, "epoch": 5979} {"train_loss": -26.89227867126465, "global_step": 496335, "epoch": 5979} {"train_loss": -27.25840187072754, "global_step": 496336, "epoch": 5979} {"train_loss": -27.3615665435791, "global_step": 496337, "epoch": 5979} {"train_loss": -27.13006019592285, "global_step": 496338, "epoch": 5979} {"train_loss": -26.894633442522533, "global_step": 496339, "epoch": 5979, "val_loss": 6625467.5} {"train_loss": -27.052845001220703, "global_step": 496340, "epoch": 5980} {"train_loss": -27.13467788696289, "global_step": 496341, "epoch": 5980} {"train_loss": -27.269678115844727, "global_step": 496342, "epoch": 5980} {"train_loss": -27.519901275634766, "global_step": 496343, "epoch": 5980} {"train_loss": -27.11630630493164, "global_step": 496344, "epoch": 5980} {"train_loss": -27.378131866455078, "global_step": 496345, "epoch": 5980} {"train_loss": -27.341733932495117, "global_step": 496346, "epoch": 5980} {"train_loss": -27.490331649780273, "global_step": 496347, "epoch": 5980} {"train_loss": -27.63138771057129, "global_step": 496348, "epoch": 5980} {"train_loss": -27.165637969970703, "global_step": 496349, "epoch": 5980} {"train_loss": -27.72001075744629, "global_step": 496350, "epoch": 5980} {"train_loss": -26.993879318237305, "global_step": 496351, "epoch": 5980} {"train_loss": -27.79286003112793, "global_step": 496352, "epoch": 5980} {"train_loss": -26.981382369995117, "global_step": 496353, "epoch": 5980} {"train_loss": -27.801654815673828, "global_step": 496354, "epoch": 5980} {"train_loss": -27.132373809814453, "global_step": 496355, "epoch": 5980} {"train_loss": -27.3272705078125, "global_step": 496356, "epoch": 5980} {"train_loss": -27.340402603149414, "global_step": 496357, "epoch": 5980} {"train_loss": -27.12237548828125, "global_step": 496358, "epoch": 5980} {"train_loss": -27.434452056884766, "global_step": 496359, "epoch": 5980} {"train_loss": -27.46124839782715, "global_step": 496360, "epoch": 5980} {"train_loss": -27.07610511779785, "global_step": 496361, "epoch": 5980} {"train_loss": -27.447843551635742, "global_step": 496362, "epoch": 5980} {"train_loss": -27.468006134033203, "global_step": 496363, "epoch": 5980} {"train_loss": -27.299848556518555, "global_step": 496364, "epoch": 5980} {"train_loss": -27.600204467773438, "global_step": 496365, "epoch": 5980} {"train_loss": -27.208520889282227, "global_step": 496366, "epoch": 5980} {"train_loss": -27.3930721282959, "global_step": 496367, "epoch": 5980} {"train_loss": -27.65885353088379, "global_step": 496368, "epoch": 5980} {"train_loss": -27.54583740234375, "global_step": 496369, "epoch": 5980} {"train_loss": -27.346786499023438, "global_step": 496370, "epoch": 5980} {"train_loss": -27.587621688842773, "global_step": 496371, "epoch": 5980} {"train_loss": -27.68037223815918, "global_step": 496372, "epoch": 5980} {"train_loss": -27.25176429748535, "global_step": 496373, "epoch": 5980} {"train_loss": -27.45326042175293, "global_step": 496374, "epoch": 5980} {"train_loss": -27.40833854675293, "global_step": 496375, "epoch": 5980} {"train_loss": -27.26922035217285, "global_step": 496376, "epoch": 5980} {"train_loss": -27.272382736206055, "global_step": 496377, "epoch": 5980} {"train_loss": -27.378828048706055, "global_step": 496378, "epoch": 5980} {"train_loss": -27.617948532104492, "global_step": 496379, "epoch": 5980} {"train_loss": -27.393674850463867, "global_step": 496380, "epoch": 5980} {"train_loss": -27.279027938842773, "global_step": 496381, "epoch": 5980} {"train_loss": -27.328144073486328, "global_step": 496382, "epoch": 5980} {"train_loss": -27.32779884338379, "global_step": 496383, "epoch": 5980} {"train_loss": -27.57618522644043, "global_step": 496384, "epoch": 5980} {"train_loss": -26.78191566467285, "global_step": 496385, "epoch": 5980} {"train_loss": -27.129730224609375, "global_step": 496386, "epoch": 5980} {"train_loss": -27.392484664916992, "global_step": 496387, "epoch": 5980} {"train_loss": -26.943023681640625, "global_step": 496388, "epoch": 5980} {"train_loss": -26.68958854675293, "global_step": 496389, "epoch": 5980} {"train_loss": -26.894805908203125, "global_step": 496390, "epoch": 5980} {"train_loss": -26.8952693939209, "global_step": 496391, "epoch": 5980} {"train_loss": -26.95015525817871, "global_step": 496392, "epoch": 5980} {"train_loss": -26.97541618347168, "global_step": 496393, "epoch": 5980} {"train_loss": -27.294036865234375, "global_step": 496394, "epoch": 5980} {"train_loss": -27.34539222717285, "global_step": 496395, "epoch": 5980} {"train_loss": -27.394506454467773, "global_step": 496396, "epoch": 5980} {"train_loss": -26.697559356689453, "global_step": 496397, "epoch": 5980} {"train_loss": -26.917724609375, "global_step": 496398, "epoch": 5980} {"train_loss": -26.58448600769043, "global_step": 496399, "epoch": 5980} {"train_loss": -26.56597900390625, "global_step": 496400, "epoch": 5980} {"train_loss": -27.18291664123535, "global_step": 496401, "epoch": 5980} {"train_loss": -27.656391143798828, "global_step": 496402, "epoch": 5980} {"train_loss": -27.297744750976562, "global_step": 496403, "epoch": 5980} {"train_loss": -27.36842918395996, "global_step": 496404, "epoch": 5980} {"train_loss": -27.335922241210938, "global_step": 496405, "epoch": 5980} {"train_loss": -27.471118927001953, "global_step": 496406, "epoch": 5980} {"train_loss": -27.54376792907715, "global_step": 496407, "epoch": 5980} {"train_loss": -27.309167861938477, "global_step": 496408, "epoch": 5980} {"train_loss": -27.409833908081055, "global_step": 496409, "epoch": 5980} {"train_loss": -27.253320693969727, "global_step": 496410, "epoch": 5980} {"train_loss": -27.58827018737793, "global_step": 496411, "epoch": 5980} {"train_loss": -27.710437774658203, "global_step": 496412, "epoch": 5980} {"train_loss": -27.350605010986328, "global_step": 496413, "epoch": 5980} {"train_loss": -27.33099937438965, "global_step": 496414, "epoch": 5980} {"train_loss": -27.305389404296875, "global_step": 496415, "epoch": 5980} {"train_loss": -27.44272232055664, "global_step": 496416, "epoch": 5980} {"train_loss": -27.725366592407227, "global_step": 496417, "epoch": 5980} {"train_loss": -27.42218017578125, "global_step": 496418, "epoch": 5980} {"train_loss": -27.477991104125977, "global_step": 496419, "epoch": 5980} {"train_loss": -27.06696891784668, "global_step": 496420, "epoch": 5980} {"train_loss": -27.4560604095459, "global_step": 496421, "epoch": 5980} {"train_loss": -27.324382046619093, "global_step": 496422, "epoch": 5980, "val_loss": 6640755.0} {"train_loss": -27.064130783081055, "global_step": 496423, "epoch": 5981} {"train_loss": -26.93183708190918, "global_step": 496424, "epoch": 5981} {"train_loss": -27.054655075073242, "global_step": 496425, "epoch": 5981} {"train_loss": -27.32940101623535, "global_step": 496426, "epoch": 5981} {"train_loss": -26.729482650756836, "global_step": 496427, "epoch": 5981} {"train_loss": -26.196420669555664, "global_step": 496428, "epoch": 5981} {"train_loss": -27.001379013061523, "global_step": 496429, "epoch": 5981} {"train_loss": -26.6471004486084, "global_step": 496430, "epoch": 5981} {"train_loss": -26.916431427001953, "global_step": 496431, "epoch": 5981} {"train_loss": -27.077863693237305, "global_step": 496432, "epoch": 5981} {"train_loss": -26.931753158569336, "global_step": 496433, "epoch": 5981} {"train_loss": -27.4774227142334, "global_step": 496434, "epoch": 5981} {"train_loss": -27.151464462280273, "global_step": 496435, "epoch": 5981} {"train_loss": -27.192218780517578, "global_step": 496436, "epoch": 5981} {"train_loss": -27.173391342163086, "global_step": 496437, "epoch": 5981} {"train_loss": -27.451623916625977, "global_step": 496438, "epoch": 5981} {"train_loss": -27.360380172729492, "global_step": 496439, "epoch": 5981} {"train_loss": -27.5172176361084, "global_step": 496440, "epoch": 5981} {"train_loss": -27.283910751342773, "global_step": 496441, "epoch": 5981} {"train_loss": -27.461441040039062, "global_step": 496442, "epoch": 5981} {"train_loss": -27.117938995361328, "global_step": 496443, "epoch": 5981} {"train_loss": -27.57343101501465, "global_step": 496444, "epoch": 5981} {"train_loss": -26.9619197845459, "global_step": 496445, "epoch": 5981} {"train_loss": -27.691516876220703, "global_step": 496446, "epoch": 5981} {"train_loss": -27.376754760742188, "global_step": 496447, "epoch": 5981} {"train_loss": -27.171743392944336, "global_step": 496448, "epoch": 5981} {"train_loss": -27.218839645385742, "global_step": 496449, "epoch": 5981} {"train_loss": -27.002771377563477, "global_step": 496450, "epoch": 5981} {"train_loss": -27.268951416015625, "global_step": 496451, "epoch": 5981} {"train_loss": -27.139890670776367, "global_step": 496452, "epoch": 5981} {"train_loss": -27.743772506713867, "global_step": 496453, "epoch": 5981} {"train_loss": -27.359243392944336, "global_step": 496454, "epoch": 5981} {"train_loss": -27.642837524414062, "global_step": 496455, "epoch": 5981} {"train_loss": -27.205657958984375, "global_step": 496456, "epoch": 5981} {"train_loss": -27.68549919128418, "global_step": 496457, "epoch": 5981} {"train_loss": -27.449926376342773, "global_step": 496458, "epoch": 5981} {"train_loss": -27.28098487854004, "global_step": 496459, "epoch": 5981} {"train_loss": -26.889692306518555, "global_step": 496460, "epoch": 5981} {"train_loss": -27.007537841796875, "global_step": 496461, "epoch": 5981} {"train_loss": -27.081775665283203, "global_step": 496462, "epoch": 5981} {"train_loss": -26.723392486572266, "global_step": 496463, "epoch": 5981} {"train_loss": -27.046361923217773, "global_step": 496464, "epoch": 5981} {"train_loss": -27.2951717376709, "global_step": 496465, "epoch": 5981} {"train_loss": -27.4073429107666, "global_step": 496466, "epoch": 5981} {"train_loss": -27.513330459594727, "global_step": 496467, "epoch": 5981} {"train_loss": -27.213302612304688, "global_step": 496468, "epoch": 5981} {"train_loss": -27.4060115814209, "global_step": 496469, "epoch": 5981} {"train_loss": -27.400360107421875, "global_step": 496470, "epoch": 5981} {"train_loss": -27.283124923706055, "global_step": 496471, "epoch": 5981} {"train_loss": -27.25343132019043, "global_step": 496472, "epoch": 5981} {"train_loss": -27.064300537109375, "global_step": 496473, "epoch": 5981} {"train_loss": -26.996646881103516, "global_step": 496474, "epoch": 5981} {"train_loss": -27.521337509155273, "global_step": 496475, "epoch": 5981} {"train_loss": -27.574417114257812, "global_step": 496476, "epoch": 5981} {"train_loss": -27.5911808013916, "global_step": 496477, "epoch": 5981} {"train_loss": -27.4378604888916, "global_step": 496478, "epoch": 5981} {"train_loss": -27.541763305664062, "global_step": 496479, "epoch": 5981} {"train_loss": -27.516996383666992, "global_step": 496480, "epoch": 5981} {"train_loss": -27.44677734375, "global_step": 496481, "epoch": 5981} {"train_loss": -27.20135498046875, "global_step": 496482, "epoch": 5981} {"train_loss": -27.2988338470459, "global_step": 496483, "epoch": 5981} {"train_loss": -27.296667098999023, "global_step": 496484, "epoch": 5981} {"train_loss": -27.78940773010254, "global_step": 496485, "epoch": 5981} {"train_loss": -27.658483505249023, "global_step": 496486, "epoch": 5981} {"train_loss": -27.526819229125977, "global_step": 496487, "epoch": 5981} {"train_loss": -27.575668334960938, "global_step": 496488, "epoch": 5981} {"train_loss": -27.836349487304688, "global_step": 496489, "epoch": 5981} {"train_loss": -27.149566650390625, "global_step": 496490, "epoch": 5981} {"train_loss": -27.43950843811035, "global_step": 496491, "epoch": 5981} {"train_loss": -27.313785552978516, "global_step": 496492, "epoch": 5981} {"train_loss": -27.336917877197266, "global_step": 496493, "epoch": 5981} {"train_loss": -27.36740493774414, "global_step": 496494, "epoch": 5981} {"train_loss": -27.729480743408203, "global_step": 496495, "epoch": 5981} {"train_loss": -27.4941463470459, "global_step": 496496, "epoch": 5981} {"train_loss": -27.285236358642578, "global_step": 496497, "epoch": 5981} {"train_loss": -27.98455238342285, "global_step": 496498, "epoch": 5981} {"train_loss": -27.541767120361328, "global_step": 496499, "epoch": 5981} {"train_loss": -27.466821670532227, "global_step": 496500, "epoch": 5981} {"train_loss": -27.697834014892578, "global_step": 496501, "epoch": 5981} {"train_loss": -27.181655883789062, "global_step": 496502, "epoch": 5981} {"train_loss": -27.49561882019043, "global_step": 496503, "epoch": 5981} {"train_loss": -27.513355255126953, "global_step": 496504, "epoch": 5981} {"train_loss": -27.30624771118164, "global_step": 496505, "epoch": 5981, "val_loss": 6566676.0} {"train_loss": -26.44805908203125, "global_step": 496506, "epoch": 5982} {"train_loss": -25.913467407226562, "global_step": 496507, "epoch": 5982} {"train_loss": -26.09151268005371, "global_step": 496508, "epoch": 5982} {"train_loss": -26.32611083984375, "global_step": 496509, "epoch": 5982} {"train_loss": -26.955432891845703, "global_step": 496510, "epoch": 5982} {"train_loss": -26.141748428344727, "global_step": 496511, "epoch": 5982} {"train_loss": -26.629316329956055, "global_step": 496512, "epoch": 5982} {"train_loss": -26.470739364624023, "global_step": 496513, "epoch": 5982} {"train_loss": -27.076831817626953, "global_step": 496514, "epoch": 5982} {"train_loss": -26.939550399780273, "global_step": 496515, "epoch": 5982} {"train_loss": -26.743865966796875, "global_step": 496516, "epoch": 5982} {"train_loss": -27.0206298828125, "global_step": 496517, "epoch": 5982} {"train_loss": -26.849828720092773, "global_step": 496518, "epoch": 5982} {"train_loss": -27.132627487182617, "global_step": 496519, "epoch": 5982} {"train_loss": -26.820959091186523, "global_step": 496520, "epoch": 5982} {"train_loss": -27.236846923828125, "global_step": 496521, "epoch": 5982} {"train_loss": -27.39430046081543, "global_step": 496522, "epoch": 5982} {"train_loss": -27.040836334228516, "global_step": 496523, "epoch": 5982} {"train_loss": -27.08289909362793, "global_step": 496524, "epoch": 5982} {"train_loss": -27.281585693359375, "global_step": 496525, "epoch": 5982} {"train_loss": -26.7718563079834, "global_step": 496526, "epoch": 5982} {"train_loss": -27.018518447875977, "global_step": 496527, "epoch": 5982} {"train_loss": -27.61516761779785, "global_step": 496528, "epoch": 5982} {"train_loss": -27.341169357299805, "global_step": 496529, "epoch": 5982} {"train_loss": -27.413442611694336, "global_step": 496530, "epoch": 5982} {"train_loss": -27.022216796875, "global_step": 496531, "epoch": 5982} {"train_loss": -27.227441787719727, "global_step": 496532, "epoch": 5982} {"train_loss": -27.342432022094727, "global_step": 496533, "epoch": 5982} {"train_loss": -27.203454971313477, "global_step": 496534, "epoch": 5982} {"train_loss": -26.877578735351562, "global_step": 496535, "epoch": 5982} {"train_loss": -26.971052169799805, "global_step": 496536, "epoch": 5982} {"train_loss": -27.4066219329834, "global_step": 496537, "epoch": 5982} {"train_loss": -27.130813598632812, "global_step": 496538, "epoch": 5982} {"train_loss": -27.0268611907959, "global_step": 496539, "epoch": 5982} {"train_loss": -27.091779708862305, "global_step": 496540, "epoch": 5982} {"train_loss": -27.10590934753418, "global_step": 496541, "epoch": 5982} {"train_loss": -27.454822540283203, "global_step": 496542, "epoch": 5982} {"train_loss": -27.084436416625977, "global_step": 496543, "epoch": 5982} {"train_loss": -26.97896385192871, "global_step": 496544, "epoch": 5982} {"train_loss": -27.33473777770996, "global_step": 496545, "epoch": 5982} {"train_loss": -27.34113121032715, "global_step": 496546, "epoch": 5982} {"train_loss": -27.77153968811035, "global_step": 496547, "epoch": 5982} {"train_loss": -27.284637451171875, "global_step": 496548, "epoch": 5982} {"train_loss": -27.612720489501953, "global_step": 496549, "epoch": 5982} {"train_loss": -27.508411407470703, "global_step": 496550, "epoch": 5982} {"train_loss": -27.31048583984375, "global_step": 496551, "epoch": 5982} {"train_loss": -27.368284225463867, "global_step": 496552, "epoch": 5982} {"train_loss": -27.266082763671875, "global_step": 496553, "epoch": 5982} {"train_loss": -27.753992080688477, "global_step": 496554, "epoch": 5982} {"train_loss": -27.3002872467041, "global_step": 496555, "epoch": 5982} {"train_loss": -27.638324737548828, "global_step": 496556, "epoch": 5982} {"train_loss": -27.756616592407227, "global_step": 496557, "epoch": 5982} {"train_loss": -27.520910263061523, "global_step": 496558, "epoch": 5982} {"train_loss": -27.50702476501465, "global_step": 496559, "epoch": 5982} {"train_loss": -27.35309410095215, "global_step": 496560, "epoch": 5982} {"train_loss": -27.5843505859375, "global_step": 496561, "epoch": 5982} {"train_loss": -27.883895874023438, "global_step": 496562, "epoch": 5982} {"train_loss": -27.54192543029785, "global_step": 496563, "epoch": 5982} {"train_loss": -27.427091598510742, "global_step": 496564, "epoch": 5982} {"train_loss": -27.46082878112793, "global_step": 496565, "epoch": 5982} {"train_loss": -27.22236442565918, "global_step": 496566, "epoch": 5982} {"train_loss": -27.25678062438965, "global_step": 496567, "epoch": 5982} {"train_loss": -27.353010177612305, "global_step": 496568, "epoch": 5982} {"train_loss": -27.34309196472168, "global_step": 496569, "epoch": 5982} {"train_loss": -26.979297637939453, "global_step": 496570, "epoch": 5982} {"train_loss": -27.43880271911621, "global_step": 496571, "epoch": 5982} {"train_loss": -27.3570613861084, "global_step": 496572, "epoch": 5982} {"train_loss": -27.464344024658203, "global_step": 496573, "epoch": 5982} {"train_loss": -27.588064193725586, "global_step": 496574, "epoch": 5982} {"train_loss": -27.02980613708496, "global_step": 496575, "epoch": 5982} {"train_loss": -27.088281631469727, "global_step": 496576, "epoch": 5982} {"train_loss": -27.102970123291016, "global_step": 496577, "epoch": 5982} {"train_loss": -27.43816566467285, "global_step": 496578, "epoch": 5982} {"train_loss": -26.780349731445312, "global_step": 496579, "epoch": 5982} {"train_loss": -26.531421661376953, "global_step": 496580, "epoch": 5982} {"train_loss": -27.08015251159668, "global_step": 496581, "epoch": 5982} {"train_loss": -27.301782608032227, "global_step": 496582, "epoch": 5982} {"train_loss": -26.807580947875977, "global_step": 496583, "epoch": 5982} {"train_loss": -27.47308349609375, "global_step": 496584, "epoch": 5982} {"train_loss": -27.394678115844727, "global_step": 496585, "epoch": 5982} {"train_loss": -27.304157257080078, "global_step": 496586, "epoch": 5982} {"train_loss": -27.375049591064453, "global_step": 496587, "epoch": 5982} {"train_loss": -27.148092522678606, "global_step": 496588, "epoch": 5982, "val_loss": 6619563.0} {"train_loss": -27.121967315673828, "global_step": 496589, "epoch": 5983} {"train_loss": -26.90268325805664, "global_step": 496590, "epoch": 5983} {"train_loss": -26.9432315826416, "global_step": 496591, "epoch": 5983} {"train_loss": -27.152868270874023, "global_step": 496592, "epoch": 5983} {"train_loss": -26.96177101135254, "global_step": 496593, "epoch": 5983} {"train_loss": -26.715173721313477, "global_step": 496594, "epoch": 5983} {"train_loss": -26.77294921875, "global_step": 496595, "epoch": 5983} {"train_loss": -26.818822860717773, "global_step": 496596, "epoch": 5983} {"train_loss": -27.121667861938477, "global_step": 496597, "epoch": 5983} {"train_loss": -27.018268585205078, "global_step": 496598, "epoch": 5983} {"train_loss": -27.031726837158203, "global_step": 496599, "epoch": 5983} {"train_loss": -27.2009334564209, "global_step": 496600, "epoch": 5983} {"train_loss": -26.82081413269043, "global_step": 496601, "epoch": 5983} {"train_loss": -27.152795791625977, "global_step": 496602, "epoch": 5983} {"train_loss": -27.298803329467773, "global_step": 496603, "epoch": 5983} {"train_loss": -27.223596572875977, "global_step": 496604, "epoch": 5983} {"train_loss": -27.084394454956055, "global_step": 496605, "epoch": 5983} {"train_loss": -27.073856353759766, "global_step": 496606, "epoch": 5983} {"train_loss": -26.922117233276367, "global_step": 496607, "epoch": 5983} {"train_loss": -27.231311798095703, "global_step": 496608, "epoch": 5983} {"train_loss": -27.175500869750977, "global_step": 496609, "epoch": 5983} {"train_loss": -27.487768173217773, "global_step": 496610, "epoch": 5983} {"train_loss": -27.5218448638916, "global_step": 496611, "epoch": 5983} {"train_loss": -27.58984375, "global_step": 496612, "epoch": 5983} {"train_loss": -27.55047607421875, "global_step": 496613, "epoch": 5983} {"train_loss": -27.180240631103516, "global_step": 496614, "epoch": 5983} {"train_loss": -27.579389572143555, "global_step": 496615, "epoch": 5983} {"train_loss": -27.704633712768555, "global_step": 496616, "epoch": 5983} {"train_loss": -27.27577781677246, "global_step": 496617, "epoch": 5983} {"train_loss": -27.0987606048584, "global_step": 496618, "epoch": 5983} {"train_loss": -27.408666610717773, "global_step": 496619, "epoch": 5983} {"train_loss": -27.351587295532227, "global_step": 496620, "epoch": 5983} {"train_loss": -27.46721839904785, "global_step": 496621, "epoch": 5983} {"train_loss": -27.430133819580078, "global_step": 496622, "epoch": 5983} {"train_loss": -27.58974266052246, "global_step": 496623, "epoch": 5983} {"train_loss": -27.73685646057129, "global_step": 496624, "epoch": 5983} {"train_loss": -27.3710880279541, "global_step": 496625, "epoch": 5983} {"train_loss": -27.157011032104492, "global_step": 496626, "epoch": 5983} {"train_loss": -27.539703369140625, "global_step": 496627, "epoch": 5983} {"train_loss": -27.279266357421875, "global_step": 496628, "epoch": 5983} {"train_loss": -27.55486488342285, "global_step": 496629, "epoch": 5983} {"train_loss": -27.563720703125, "global_step": 496630, "epoch": 5983} {"train_loss": -27.44915199279785, "global_step": 496631, "epoch": 5983} {"train_loss": -27.568140029907227, "global_step": 496632, "epoch": 5983} {"train_loss": -28.10759925842285, "global_step": 496633, "epoch": 5983} {"train_loss": -27.630390167236328, "global_step": 496634, "epoch": 5983} {"train_loss": -27.722517013549805, "global_step": 496635, "epoch": 5983} {"train_loss": -27.124841690063477, "global_step": 496636, "epoch": 5983} {"train_loss": -27.505584716796875, "global_step": 496637, "epoch": 5983} {"train_loss": -27.205778121948242, "global_step": 496638, "epoch": 5983} {"train_loss": -27.6253662109375, "global_step": 496639, "epoch": 5983} {"train_loss": -27.532577514648438, "global_step": 496640, "epoch": 5983} {"train_loss": -27.292804718017578, "global_step": 496641, "epoch": 5983} {"train_loss": -27.37586784362793, "global_step": 496642, "epoch": 5983} {"train_loss": -27.292407989501953, "global_step": 496643, "epoch": 5983} {"train_loss": -27.134353637695312, "global_step": 496644, "epoch": 5983} {"train_loss": -27.619953155517578, "global_step": 496645, "epoch": 5983} {"train_loss": -27.51985740661621, "global_step": 496646, "epoch": 5983} {"train_loss": -27.151830673217773, "global_step": 496647, "epoch": 5983} {"train_loss": -27.780231475830078, "global_step": 496648, "epoch": 5983} {"train_loss": -27.203338623046875, "global_step": 496649, "epoch": 5983} {"train_loss": -27.405847549438477, "global_step": 496650, "epoch": 5983} {"train_loss": -27.207799911499023, "global_step": 496651, "epoch": 5983} {"train_loss": -27.16839599609375, "global_step": 496652, "epoch": 5983} {"train_loss": -27.498151779174805, "global_step": 496653, "epoch": 5983} {"train_loss": -27.587308883666992, "global_step": 496654, "epoch": 5983} {"train_loss": -27.133203506469727, "global_step": 496655, "epoch": 5983} {"train_loss": -26.876249313354492, "global_step": 496656, "epoch": 5983} {"train_loss": -26.5353946685791, "global_step": 496657, "epoch": 5983} {"train_loss": -26.892471313476562, "global_step": 496658, "epoch": 5983} {"train_loss": -27.557886123657227, "global_step": 496659, "epoch": 5983} {"train_loss": -27.818302154541016, "global_step": 496660, "epoch": 5983} {"train_loss": -27.335092544555664, "global_step": 496661, "epoch": 5983} {"train_loss": -27.23615074157715, "global_step": 496662, "epoch": 5983} {"train_loss": -27.29102897644043, "global_step": 496663, "epoch": 5983} {"train_loss": -27.329833984375, "global_step": 496664, "epoch": 5983} {"train_loss": -27.413049697875977, "global_step": 496665, "epoch": 5983} {"train_loss": -27.340991973876953, "global_step": 496666, "epoch": 5983} {"train_loss": -26.8004093170166, "global_step": 496667, "epoch": 5983} {"train_loss": -26.810300827026367, "global_step": 496668, "epoch": 5983} {"train_loss": -27.43592643737793, "global_step": 496669, "epoch": 5983} {"train_loss": -27.46317481994629, "global_step": 496670, "epoch": 5983} {"train_loss": -27.294431801301887, "global_step": 496671, "epoch": 5983, "val_loss": 6564478.0} {"train_loss": -26.205564498901367, "global_step": 496672, "epoch": 5984} {"train_loss": -26.09686279296875, "global_step": 496673, "epoch": 5984} {"train_loss": -27.019819259643555, "global_step": 496674, "epoch": 5984} {"train_loss": -26.22540283203125, "global_step": 496675, "epoch": 5984} {"train_loss": -27.129669189453125, "global_step": 496676, "epoch": 5984} {"train_loss": -26.29941177368164, "global_step": 496677, "epoch": 5984} {"train_loss": -26.205896377563477, "global_step": 496678, "epoch": 5984} {"train_loss": -26.29155921936035, "global_step": 496679, "epoch": 5984} {"train_loss": -27.046483993530273, "global_step": 496680, "epoch": 5984} {"train_loss": -26.538503646850586, "global_step": 496681, "epoch": 5984} {"train_loss": -26.64934730529785, "global_step": 496682, "epoch": 5984} {"train_loss": -26.694793701171875, "global_step": 496683, "epoch": 5984} {"train_loss": -26.875263214111328, "global_step": 496684, "epoch": 5984} {"train_loss": -26.81141471862793, "global_step": 496685, "epoch": 5984} {"train_loss": -27.047882080078125, "global_step": 496686, "epoch": 5984} {"train_loss": -26.758502960205078, "global_step": 496687, "epoch": 5984} {"train_loss": -26.581836700439453, "global_step": 496688, "epoch": 5984} {"train_loss": -26.9619140625, "global_step": 496689, "epoch": 5984} {"train_loss": -26.99305534362793, "global_step": 496690, "epoch": 5984} {"train_loss": -26.96931266784668, "global_step": 496691, "epoch": 5984} {"train_loss": -27.322467803955078, "global_step": 496692, "epoch": 5984} {"train_loss": -27.052881240844727, "global_step": 496693, "epoch": 5984} {"train_loss": -26.477996826171875, "global_step": 496694, "epoch": 5984} {"train_loss": -27.015735626220703, "global_step": 496695, "epoch": 5984} {"train_loss": -27.173795700073242, "global_step": 496696, "epoch": 5984} {"train_loss": -27.341907501220703, "global_step": 496697, "epoch": 5984} {"train_loss": -27.40313148498535, "global_step": 496698, "epoch": 5984} {"train_loss": -26.744098663330078, "global_step": 496699, "epoch": 5984} {"train_loss": -27.274219512939453, "global_step": 496700, "epoch": 5984} {"train_loss": -27.259552001953125, "global_step": 496701, "epoch": 5984} {"train_loss": -27.14288330078125, "global_step": 496702, "epoch": 5984} {"train_loss": -27.233509063720703, "global_step": 496703, "epoch": 5984} {"train_loss": -27.298160552978516, "global_step": 496704, "epoch": 5984} {"train_loss": -27.52410316467285, "global_step": 496705, "epoch": 5984} {"train_loss": -26.89985466003418, "global_step": 496706, "epoch": 5984} {"train_loss": -27.703344345092773, "global_step": 496707, "epoch": 5984} {"train_loss": -27.07472801208496, "global_step": 496708, "epoch": 5984} {"train_loss": -27.434179306030273, "global_step": 496709, "epoch": 5984} {"train_loss": -27.881946563720703, "global_step": 496710, "epoch": 5984} {"train_loss": -27.049396514892578, "global_step": 496711, "epoch": 5984} {"train_loss": -27.310773849487305, "global_step": 496712, "epoch": 5984} {"train_loss": -27.454320907592773, "global_step": 496713, "epoch": 5984} {"train_loss": -27.606306076049805, "global_step": 496714, "epoch": 5984} {"train_loss": -27.53571128845215, "global_step": 496715, "epoch": 5984} {"train_loss": -27.4755859375, "global_step": 496716, "epoch": 5984} {"train_loss": -27.646595001220703, "global_step": 496717, "epoch": 5984} {"train_loss": -27.45944595336914, "global_step": 496718, "epoch": 5984} {"train_loss": -27.5244140625, "global_step": 496719, "epoch": 5984} {"train_loss": -27.318567276000977, "global_step": 496720, "epoch": 5984} {"train_loss": -27.544286727905273, "global_step": 496721, "epoch": 5984} {"train_loss": -27.43180274963379, "global_step": 496722, "epoch": 5984} {"train_loss": -27.6728515625, "global_step": 496723, "epoch": 5984} {"train_loss": -27.656970977783203, "global_step": 496724, "epoch": 5984} {"train_loss": -27.751117706298828, "global_step": 496725, "epoch": 5984} {"train_loss": -27.862701416015625, "global_step": 496726, "epoch": 5984} {"train_loss": -27.462690353393555, "global_step": 496727, "epoch": 5984} {"train_loss": -27.316558837890625, "global_step": 496728, "epoch": 5984} {"train_loss": -27.696989059448242, "global_step": 496729, "epoch": 5984} {"train_loss": -27.632909774780273, "global_step": 496730, "epoch": 5984} {"train_loss": -27.429040908813477, "global_step": 496731, "epoch": 5984} {"train_loss": -27.199186325073242, "global_step": 496732, "epoch": 5984} {"train_loss": -27.41800880432129, "global_step": 496733, "epoch": 5984} {"train_loss": -27.769681930541992, "global_step": 496734, "epoch": 5984} {"train_loss": -27.838611602783203, "global_step": 496735, "epoch": 5984} {"train_loss": -27.959644317626953, "global_step": 496736, "epoch": 5984} {"train_loss": -27.482315063476562, "global_step": 496737, "epoch": 5984} {"train_loss": -27.546594619750977, "global_step": 496738, "epoch": 5984} {"train_loss": -27.70172119140625, "global_step": 496739, "epoch": 5984} {"train_loss": -27.37006187438965, "global_step": 496740, "epoch": 5984} {"train_loss": -27.542373657226562, "global_step": 496741, "epoch": 5984} {"train_loss": -27.47577476501465, "global_step": 496742, "epoch": 5984} {"train_loss": -27.448795318603516, "global_step": 496743, "epoch": 5984} {"train_loss": -27.361618041992188, "global_step": 496744, "epoch": 5984} {"train_loss": -27.463592529296875, "global_step": 496745, "epoch": 5984} {"train_loss": -27.166547775268555, "global_step": 496746, "epoch": 5984} {"train_loss": -27.065662384033203, "global_step": 496747, "epoch": 5984} {"train_loss": -27.341434478759766, "global_step": 496748, "epoch": 5984} {"train_loss": -26.917688369750977, "global_step": 496749, "epoch": 5984} {"train_loss": -26.914209365844727, "global_step": 496750, "epoch": 5984} {"train_loss": -27.228515625, "global_step": 496751, "epoch": 5984} {"train_loss": -26.4826602935791, "global_step": 496752, "epoch": 5984} {"train_loss": -26.023914337158203, "global_step": 496753, "epoch": 5984} {"train_loss": -27.178292837487646, "global_step": 496754, "epoch": 5984, "val_loss": 6695908.0} {"train_loss": -26.480390548706055, "global_step": 496755, "epoch": 5985} {"train_loss": -27.13409423828125, "global_step": 496756, "epoch": 5985} {"train_loss": -26.725448608398438, "global_step": 496757, "epoch": 5985} {"train_loss": -26.74220085144043, "global_step": 496758, "epoch": 5985} {"train_loss": -26.805280685424805, "global_step": 496759, "epoch": 5985} {"train_loss": -27.04168701171875, "global_step": 496760, "epoch": 5985} {"train_loss": -26.212696075439453, "global_step": 496761, "epoch": 5985} {"train_loss": -26.350683212280273, "global_step": 496762, "epoch": 5985} {"train_loss": -26.303070068359375, "global_step": 496763, "epoch": 5985} {"train_loss": -26.791364669799805, "global_step": 496764, "epoch": 5985} {"train_loss": -26.419692993164062, "global_step": 496765, "epoch": 5985} {"train_loss": -26.7890682220459, "global_step": 496766, "epoch": 5985} {"train_loss": -26.67347526550293, "global_step": 496767, "epoch": 5985} {"train_loss": -26.776763916015625, "global_step": 496768, "epoch": 5985} {"train_loss": -26.685739517211914, "global_step": 496769, "epoch": 5985} {"train_loss": -26.8486270904541, "global_step": 496770, "epoch": 5985} {"train_loss": -27.014219284057617, "global_step": 496771, "epoch": 5985} {"train_loss": -26.92579460144043, "global_step": 496772, "epoch": 5985} {"train_loss": -27.167016983032227, "global_step": 496773, "epoch": 5985} {"train_loss": -26.906827926635742, "global_step": 496774, "epoch": 5985} {"train_loss": -26.838659286499023, "global_step": 496775, "epoch": 5985} {"train_loss": -26.829971313476562, "global_step": 496776, "epoch": 5985} {"train_loss": -27.133563995361328, "global_step": 496777, "epoch": 5985} {"train_loss": -27.131732940673828, "global_step": 496778, "epoch": 5985} {"train_loss": -27.176328659057617, "global_step": 496779, "epoch": 5985} {"train_loss": -26.86219596862793, "global_step": 496780, "epoch": 5985} {"train_loss": -27.072736740112305, "global_step": 496781, "epoch": 5985} {"train_loss": -26.997394561767578, "global_step": 496782, "epoch": 5985} {"train_loss": -27.375274658203125, "global_step": 496783, "epoch": 5985} {"train_loss": -27.724140167236328, "global_step": 496784, "epoch": 5985} {"train_loss": -27.7605037689209, "global_step": 496785, "epoch": 5985} {"train_loss": -27.192657470703125, "global_step": 496786, "epoch": 5985} {"train_loss": -27.357664108276367, "global_step": 496787, "epoch": 5985} {"train_loss": -27.4481201171875, "global_step": 496788, "epoch": 5985} {"train_loss": -27.23419189453125, "global_step": 496789, "epoch": 5985} {"train_loss": -27.311115264892578, "global_step": 496790, "epoch": 5985} {"train_loss": -27.352575302124023, "global_step": 496791, "epoch": 5985} {"train_loss": -27.29071617126465, "global_step": 496792, "epoch": 5985} {"train_loss": -27.395343780517578, "global_step": 496793, "epoch": 5985} {"train_loss": -27.3310546875, "global_step": 496794, "epoch": 5985} {"train_loss": -27.51325798034668, "global_step": 496795, "epoch": 5985} {"train_loss": -27.355737686157227, "global_step": 496796, "epoch": 5985} {"train_loss": -26.865293502807617, "global_step": 496797, "epoch": 5985} {"train_loss": -27.462793350219727, "global_step": 496798, "epoch": 5985} {"train_loss": -27.230131149291992, "global_step": 496799, "epoch": 5985} {"train_loss": -27.65597915649414, "global_step": 496800, "epoch": 5985} {"train_loss": -27.49794578552246, "global_step": 496801, "epoch": 5985} {"train_loss": -27.28095054626465, "global_step": 496802, "epoch": 5985} {"train_loss": -27.635385513305664, "global_step": 496803, "epoch": 5985} {"train_loss": -27.10249137878418, "global_step": 496804, "epoch": 5985} {"train_loss": -27.53883171081543, "global_step": 496805, "epoch": 5985} {"train_loss": -27.2606201171875, "global_step": 496806, "epoch": 5985} {"train_loss": -27.022754669189453, "global_step": 496807, "epoch": 5985} {"train_loss": -27.460193634033203, "global_step": 496808, "epoch": 5985} {"train_loss": -27.383527755737305, "global_step": 496809, "epoch": 5985} {"train_loss": -27.361896514892578, "global_step": 496810, "epoch": 5985} {"train_loss": -27.410709381103516, "global_step": 496811, "epoch": 5985} {"train_loss": -27.581064224243164, "global_step": 496812, "epoch": 5985} {"train_loss": -27.43767738342285, "global_step": 496813, "epoch": 5985} {"train_loss": -27.5216007232666, "global_step": 496814, "epoch": 5985} {"train_loss": -27.233579635620117, "global_step": 496815, "epoch": 5985} {"train_loss": -27.228302001953125, "global_step": 496816, "epoch": 5985} {"train_loss": -27.476367950439453, "global_step": 496817, "epoch": 5985} {"train_loss": -27.471479415893555, "global_step": 496818, "epoch": 5985} {"train_loss": -27.39173698425293, "global_step": 496819, "epoch": 5985} {"train_loss": -27.58905601501465, "global_step": 496820, "epoch": 5985} {"train_loss": -26.883106231689453, "global_step": 496821, "epoch": 5985} {"train_loss": -27.463205337524414, "global_step": 496822, "epoch": 5985} {"train_loss": -27.470233917236328, "global_step": 496823, "epoch": 5985} {"train_loss": -27.212167739868164, "global_step": 496824, "epoch": 5985} {"train_loss": -27.057218551635742, "global_step": 496825, "epoch": 5985} {"train_loss": -27.2967529296875, "global_step": 496826, "epoch": 5985} {"train_loss": -27.065475463867188, "global_step": 496827, "epoch": 5985} {"train_loss": -26.819257736206055, "global_step": 496828, "epoch": 5985} {"train_loss": -26.92563247680664, "global_step": 496829, "epoch": 5985} {"train_loss": -27.18996238708496, "global_step": 496830, "epoch": 5985} {"train_loss": -27.336872100830078, "global_step": 496831, "epoch": 5985} {"train_loss": -27.407394409179688, "global_step": 496832, "epoch": 5985} {"train_loss": -27.275175094604492, "global_step": 496833, "epoch": 5985} {"train_loss": -27.501264572143555, "global_step": 496834, "epoch": 5985} {"train_loss": -27.5546932220459, "global_step": 496835, "epoch": 5985} {"train_loss": -27.376358032226562, "global_step": 496836, "epoch": 5985} {"train_loss": -27.167693241533026, "global_step": 496837, "epoch": 5985, "val_loss": 6599595.5} {"train_loss": -26.77897071838379, "global_step": 496838, "epoch": 5986} {"train_loss": -27.16943359375, "global_step": 496839, "epoch": 5986} {"train_loss": -27.06416893005371, "global_step": 496840, "epoch": 5986} {"train_loss": -27.138593673706055, "global_step": 496841, "epoch": 5986} {"train_loss": -27.22614097595215, "global_step": 496842, "epoch": 5986} {"train_loss": -27.05906105041504, "global_step": 496843, "epoch": 5986} {"train_loss": -27.30584144592285, "global_step": 496844, "epoch": 5986} {"train_loss": -27.226165771484375, "global_step": 496845, "epoch": 5986} {"train_loss": -27.6225643157959, "global_step": 496846, "epoch": 5986} {"train_loss": -27.154577255249023, "global_step": 496847, "epoch": 5986} {"train_loss": -27.1788330078125, "global_step": 496848, "epoch": 5986} {"train_loss": -27.53908348083496, "global_step": 496849, "epoch": 5986} {"train_loss": -26.979787826538086, "global_step": 496850, "epoch": 5986} {"train_loss": -27.302734375, "global_step": 496851, "epoch": 5986} {"train_loss": -27.20425796508789, "global_step": 496852, "epoch": 5986} {"train_loss": -27.166610717773438, "global_step": 496853, "epoch": 5986} {"train_loss": -27.263525009155273, "global_step": 496854, "epoch": 5986} {"train_loss": -27.397424697875977, "global_step": 496855, "epoch": 5986} {"train_loss": -27.753223419189453, "global_step": 496856, "epoch": 5986} {"train_loss": -27.29559326171875, "global_step": 496857, "epoch": 5986} {"train_loss": -27.1881160736084, "global_step": 496858, "epoch": 5986} {"train_loss": -27.57343864440918, "global_step": 496859, "epoch": 5986} {"train_loss": -27.889007568359375, "global_step": 496860, "epoch": 5986} {"train_loss": -27.65143394470215, "global_step": 496861, "epoch": 5986} {"train_loss": -27.46343994140625, "global_step": 496862, "epoch": 5986} {"train_loss": -27.521909713745117, "global_step": 496863, "epoch": 5986} {"train_loss": -27.383813858032227, "global_step": 496864, "epoch": 5986} {"train_loss": -27.769861221313477, "global_step": 496865, "epoch": 5986} {"train_loss": -27.413700103759766, "global_step": 496866, "epoch": 5986} {"train_loss": -27.809680938720703, "global_step": 496867, "epoch": 5986} {"train_loss": -27.665836334228516, "global_step": 496868, "epoch": 5986} {"train_loss": -27.769201278686523, "global_step": 496869, "epoch": 5986} {"train_loss": -27.815296173095703, "global_step": 496870, "epoch": 5986} {"train_loss": -27.81488609313965, "global_step": 496871, "epoch": 5986} {"train_loss": -27.605422973632812, "global_step": 496872, "epoch": 5986} {"train_loss": -27.816638946533203, "global_step": 496873, "epoch": 5986} {"train_loss": -27.53399085998535, "global_step": 496874, "epoch": 5986} {"train_loss": -27.788476943969727, "global_step": 496875, "epoch": 5986} {"train_loss": -27.403491973876953, "global_step": 496876, "epoch": 5986} {"train_loss": -27.18067741394043, "global_step": 496877, "epoch": 5986} {"train_loss": -27.526172637939453, "global_step": 496878, "epoch": 5986} {"train_loss": -27.645471572875977, "global_step": 496879, "epoch": 5986} {"train_loss": -27.390323638916016, "global_step": 496880, "epoch": 5986} {"train_loss": -27.43572998046875, "global_step": 496881, "epoch": 5986} {"train_loss": -27.009672164916992, "global_step": 496882, "epoch": 5986} {"train_loss": -26.46783447265625, "global_step": 496883, "epoch": 5986} {"train_loss": -26.8599910736084, "global_step": 496884, "epoch": 5986} {"train_loss": -26.131757736206055, "global_step": 496885, "epoch": 5986} {"train_loss": -26.267927169799805, "global_step": 496886, "epoch": 5986} {"train_loss": -26.82413673400879, "global_step": 496887, "epoch": 5986} {"train_loss": -26.816162109375, "global_step": 496888, "epoch": 5986} {"train_loss": -26.941436767578125, "global_step": 496889, "epoch": 5986} {"train_loss": -27.006378173828125, "global_step": 496890, "epoch": 5986} {"train_loss": -27.12228775024414, "global_step": 496891, "epoch": 5986} {"train_loss": -27.153051376342773, "global_step": 496892, "epoch": 5986} {"train_loss": -27.284448623657227, "global_step": 496893, "epoch": 5986} {"train_loss": -27.22784423828125, "global_step": 496894, "epoch": 5986} {"train_loss": -27.29404067993164, "global_step": 496895, "epoch": 5986} {"train_loss": -26.8079891204834, "global_step": 496896, "epoch": 5986} {"train_loss": -27.249792098999023, "global_step": 496897, "epoch": 5986} {"train_loss": -27.0787410736084, "global_step": 496898, "epoch": 5986} {"train_loss": -27.397109985351562, "global_step": 496899, "epoch": 5986} {"train_loss": -27.33355712890625, "global_step": 496900, "epoch": 5986} {"train_loss": -27.37628173828125, "global_step": 496901, "epoch": 5986} {"train_loss": -27.078659057617188, "global_step": 496902, "epoch": 5986} {"train_loss": -27.274198532104492, "global_step": 496903, "epoch": 5986} {"train_loss": -27.6307430267334, "global_step": 496904, "epoch": 5986} {"train_loss": -27.377614974975586, "global_step": 496905, "epoch": 5986} {"train_loss": -27.340986251831055, "global_step": 496906, "epoch": 5986} {"train_loss": -27.771682739257812, "global_step": 496907, "epoch": 5986} {"train_loss": -27.691247940063477, "global_step": 496908, "epoch": 5986} {"train_loss": -27.201141357421875, "global_step": 496909, "epoch": 5986} {"train_loss": -27.322507858276367, "global_step": 496910, "epoch": 5986} {"train_loss": -27.3250789642334, "global_step": 496911, "epoch": 5986} {"train_loss": -27.626434326171875, "global_step": 496912, "epoch": 5986} {"train_loss": -27.486164093017578, "global_step": 496913, "epoch": 5986} {"train_loss": -27.46950340270996, "global_step": 496914, "epoch": 5986} {"train_loss": -27.532901763916016, "global_step": 496915, "epoch": 5986} {"train_loss": -27.54071617126465, "global_step": 496916, "epoch": 5986} {"train_loss": -27.583158493041992, "global_step": 496917, "epoch": 5986} {"train_loss": -27.70068359375, "global_step": 496918, "epoch": 5986} {"train_loss": -27.710590362548828, "global_step": 496919, "epoch": 5986} {"train_loss": -27.32887192232063, "global_step": 496920, "epoch": 5986, "val_loss": 6656783.0} {"train_loss": -27.272247314453125, "global_step": 496921, "epoch": 5987} {"train_loss": -27.056493759155273, "global_step": 496922, "epoch": 5987} {"train_loss": -27.021909713745117, "global_step": 496923, "epoch": 5987} {"train_loss": -27.0301456451416, "global_step": 496924, "epoch": 5987} {"train_loss": -26.81638526916504, "global_step": 496925, "epoch": 5987} {"train_loss": -26.999908447265625, "global_step": 496926, "epoch": 5987} {"train_loss": -27.14932632446289, "global_step": 496927, "epoch": 5987} {"train_loss": -27.09088706970215, "global_step": 496928, "epoch": 5987} {"train_loss": -27.163782119750977, "global_step": 496929, "epoch": 5987} {"train_loss": -26.892868041992188, "global_step": 496930, "epoch": 5987} {"train_loss": -27.116413116455078, "global_step": 496931, "epoch": 5987} {"train_loss": -27.1063175201416, "global_step": 496932, "epoch": 5987} {"train_loss": -26.594074249267578, "global_step": 496933, "epoch": 5987} {"train_loss": -26.91139793395996, "global_step": 496934, "epoch": 5987} {"train_loss": -27.387176513671875, "global_step": 496935, "epoch": 5987} {"train_loss": -26.535375595092773, "global_step": 496936, "epoch": 5987} {"train_loss": -26.508886337280273, "global_step": 496937, "epoch": 5987} {"train_loss": -27.207548141479492, "global_step": 496938, "epoch": 5987} {"train_loss": -26.690969467163086, "global_step": 496939, "epoch": 5987} {"train_loss": -27.2440128326416, "global_step": 496940, "epoch": 5987} {"train_loss": -26.694242477416992, "global_step": 496941, "epoch": 5987} {"train_loss": -27.56073570251465, "global_step": 496942, "epoch": 5987} {"train_loss": -27.313282012939453, "global_step": 496943, "epoch": 5987} {"train_loss": -27.099445343017578, "global_step": 496944, "epoch": 5987} {"train_loss": -27.143096923828125, "global_step": 496945, "epoch": 5987} {"train_loss": -27.2753963470459, "global_step": 496946, "epoch": 5987} {"train_loss": -26.999052047729492, "global_step": 496947, "epoch": 5987} {"train_loss": -27.2891788482666, "global_step": 496948, "epoch": 5987} {"train_loss": -26.98542594909668, "global_step": 496949, "epoch": 5987} {"train_loss": -27.468870162963867, "global_step": 496950, "epoch": 5987} {"train_loss": -26.924728393554688, "global_step": 496951, "epoch": 5987} {"train_loss": -27.383039474487305, "global_step": 496952, "epoch": 5987} {"train_loss": -27.309904098510742, "global_step": 496953, "epoch": 5987} {"train_loss": -27.5487117767334, "global_step": 496954, "epoch": 5987} {"train_loss": -27.5618896484375, "global_step": 496955, "epoch": 5987} {"train_loss": -27.837295532226562, "global_step": 496956, "epoch": 5987} {"train_loss": -27.209745407104492, "global_step": 496957, "epoch": 5987} {"train_loss": -27.750350952148438, "global_step": 496958, "epoch": 5987} {"train_loss": -27.342512130737305, "global_step": 496959, "epoch": 5987} {"train_loss": -27.61238670349121, "global_step": 496960, "epoch": 5987} {"train_loss": -27.849023818969727, "global_step": 496961, "epoch": 5987} {"train_loss": -27.484418869018555, "global_step": 496962, "epoch": 5987} {"train_loss": -27.762012481689453, "global_step": 496963, "epoch": 5987} {"train_loss": -27.3548526763916, "global_step": 496964, "epoch": 5987} {"train_loss": -27.513593673706055, "global_step": 496965, "epoch": 5987} {"train_loss": -27.360523223876953, "global_step": 496966, "epoch": 5987} {"train_loss": -27.433984756469727, "global_step": 496967, "epoch": 5987} {"train_loss": -27.322956085205078, "global_step": 496968, "epoch": 5987} {"train_loss": -27.86379051208496, "global_step": 496969, "epoch": 5987} {"train_loss": -27.655445098876953, "global_step": 496970, "epoch": 5987} {"train_loss": -27.42206382751465, "global_step": 496971, "epoch": 5987} {"train_loss": -27.53912925720215, "global_step": 496972, "epoch": 5987} {"train_loss": -27.606372833251953, "global_step": 496973, "epoch": 5987} {"train_loss": -27.391515731811523, "global_step": 496974, "epoch": 5987} {"train_loss": -27.498571395874023, "global_step": 496975, "epoch": 5987} {"train_loss": -27.464435577392578, "global_step": 496976, "epoch": 5987} {"train_loss": -27.68084144592285, "global_step": 496977, "epoch": 5987} {"train_loss": -27.451086044311523, "global_step": 496978, "epoch": 5987} {"train_loss": -27.345056533813477, "global_step": 496979, "epoch": 5987} {"train_loss": -27.17714500427246, "global_step": 496980, "epoch": 5987} {"train_loss": -27.527557373046875, "global_step": 496981, "epoch": 5987} {"train_loss": -27.753173828125, "global_step": 496982, "epoch": 5987} {"train_loss": -27.428991317749023, "global_step": 496983, "epoch": 5987} {"train_loss": -27.391332626342773, "global_step": 496984, "epoch": 5987} {"train_loss": -27.686010360717773, "global_step": 496985, "epoch": 5987} {"train_loss": -27.411304473876953, "global_step": 496986, "epoch": 5987} {"train_loss": -27.376142501831055, "global_step": 496987, "epoch": 5987} {"train_loss": -27.57490348815918, "global_step": 496988, "epoch": 5987} {"train_loss": -27.538679122924805, "global_step": 496989, "epoch": 5987} {"train_loss": -27.121109008789062, "global_step": 496990, "epoch": 5987} {"train_loss": -27.1106014251709, "global_step": 496991, "epoch": 5987} {"train_loss": -27.348953247070312, "global_step": 496992, "epoch": 5987} {"train_loss": -27.485843658447266, "global_step": 496993, "epoch": 5987} {"train_loss": -27.41874122619629, "global_step": 496994, "epoch": 5987} {"train_loss": -27.247289657592773, "global_step": 496995, "epoch": 5987} {"train_loss": -27.302820205688477, "global_step": 496996, "epoch": 5987} {"train_loss": -27.420392990112305, "global_step": 496997, "epoch": 5987} {"train_loss": -27.207778930664062, "global_step": 496998, "epoch": 5987} {"train_loss": -27.26642417907715, "global_step": 496999, "epoch": 5987} {"train_loss": -27.09615135192871, "global_step": 497000, "epoch": 5987} {"train_loss": -27.35682487487793, "global_step": 497001, "epoch": 5987} {"train_loss": -26.99420738220215, "global_step": 497002, "epoch": 5987} {"train_loss": -27.28575966157109, "global_step": 497003, "epoch": 5987, "val_loss": 6698186.0} {"train_loss": -26.907114028930664, "global_step": 497004, "epoch": 5988} {"train_loss": -25.983509063720703, "global_step": 497005, "epoch": 5988} {"train_loss": -26.318374633789062, "global_step": 497006, "epoch": 5988} {"train_loss": -27.0053653717041, "global_step": 497007, "epoch": 5988} {"train_loss": -26.661584854125977, "global_step": 497008, "epoch": 5988} {"train_loss": -26.677499771118164, "global_step": 497009, "epoch": 5988} {"train_loss": -27.286529541015625, "global_step": 497010, "epoch": 5988} {"train_loss": -26.776412963867188, "global_step": 497011, "epoch": 5988} {"train_loss": -27.1756534576416, "global_step": 497012, "epoch": 5988} {"train_loss": -26.482873916625977, "global_step": 497013, "epoch": 5988} {"train_loss": -26.5314884185791, "global_step": 497014, "epoch": 5988} {"train_loss": -26.872339248657227, "global_step": 497015, "epoch": 5988} {"train_loss": -26.57862663269043, "global_step": 497016, "epoch": 5988} {"train_loss": -26.814279556274414, "global_step": 497017, "epoch": 5988} {"train_loss": -27.072141647338867, "global_step": 497018, "epoch": 5988} {"train_loss": -27.1895809173584, "global_step": 497019, "epoch": 5988} {"train_loss": -26.962772369384766, "global_step": 497020, "epoch": 5988} {"train_loss": -27.406614303588867, "global_step": 497021, "epoch": 5988} {"train_loss": -27.020002365112305, "global_step": 497022, "epoch": 5988} {"train_loss": -27.270166397094727, "global_step": 497023, "epoch": 5988} {"train_loss": -26.947616577148438, "global_step": 497024, "epoch": 5988} {"train_loss": -27.111846923828125, "global_step": 497025, "epoch": 5988} {"train_loss": -27.50495719909668, "global_step": 497026, "epoch": 5988} {"train_loss": -26.991357803344727, "global_step": 497027, "epoch": 5988} {"train_loss": -27.19000244140625, "global_step": 497028, "epoch": 5988} {"train_loss": -27.669193267822266, "global_step": 497029, "epoch": 5988} {"train_loss": -27.358875274658203, "global_step": 497030, "epoch": 5988} {"train_loss": -27.364521026611328, "global_step": 497031, "epoch": 5988} {"train_loss": -27.570398330688477, "global_step": 497032, "epoch": 5988} {"train_loss": -27.570541381835938, "global_step": 497033, "epoch": 5988} {"train_loss": -27.359846115112305, "global_step": 497034, "epoch": 5988} {"train_loss": -27.589176177978516, "global_step": 497035, "epoch": 5988} {"train_loss": -27.364713668823242, "global_step": 497036, "epoch": 5988} {"train_loss": -27.525604248046875, "global_step": 497037, "epoch": 5988} {"train_loss": -27.6090145111084, "global_step": 497038, "epoch": 5988} {"train_loss": -27.40213394165039, "global_step": 497039, "epoch": 5988} {"train_loss": -27.62701416015625, "global_step": 497040, "epoch": 5988} {"train_loss": -27.211166381835938, "global_step": 497041, "epoch": 5988} {"train_loss": -27.44794273376465, "global_step": 497042, "epoch": 5988} {"train_loss": -27.65546226501465, "global_step": 497043, "epoch": 5988} {"train_loss": -27.225858688354492, "global_step": 497044, "epoch": 5988} {"train_loss": -27.617856979370117, "global_step": 497045, "epoch": 5988} {"train_loss": -27.58650779724121, "global_step": 497046, "epoch": 5988} {"train_loss": -27.90925407409668, "global_step": 497047, "epoch": 5988} {"train_loss": -27.329498291015625, "global_step": 497048, "epoch": 5988} {"train_loss": -27.308094024658203, "global_step": 497049, "epoch": 5988} {"train_loss": -27.041793823242188, "global_step": 497050, "epoch": 5988} {"train_loss": -26.92596435546875, "global_step": 497051, "epoch": 5988} {"train_loss": -26.50787353515625, "global_step": 497052, "epoch": 5988} {"train_loss": -26.541913986206055, "global_step": 497053, "epoch": 5988} {"train_loss": -27.218896865844727, "global_step": 497054, "epoch": 5988} {"train_loss": -27.689910888671875, "global_step": 497055, "epoch": 5988} {"train_loss": -27.28842544555664, "global_step": 497056, "epoch": 5988} {"train_loss": -26.92822265625, "global_step": 497057, "epoch": 5988} {"train_loss": -27.394804000854492, "global_step": 497058, "epoch": 5988} {"train_loss": -26.89443016052246, "global_step": 497059, "epoch": 5988} {"train_loss": -27.375329971313477, "global_step": 497060, "epoch": 5988} {"train_loss": -27.47028923034668, "global_step": 497061, "epoch": 5988} {"train_loss": -27.354206085205078, "global_step": 497062, "epoch": 5988} {"train_loss": -27.185047149658203, "global_step": 497063, "epoch": 5988} {"train_loss": -27.427474975585938, "global_step": 497064, "epoch": 5988} {"train_loss": -27.27524185180664, "global_step": 497065, "epoch": 5988} {"train_loss": -27.2266788482666, "global_step": 497066, "epoch": 5988} {"train_loss": -27.466760635375977, "global_step": 497067, "epoch": 5988} {"train_loss": -27.67469596862793, "global_step": 497068, "epoch": 5988} {"train_loss": -27.578710556030273, "global_step": 497069, "epoch": 5988} {"train_loss": -27.971954345703125, "global_step": 497070, "epoch": 5988} {"train_loss": -27.464080810546875, "global_step": 497071, "epoch": 5988} {"train_loss": -27.5629940032959, "global_step": 497072, "epoch": 5988} {"train_loss": -27.878570556640625, "global_step": 497073, "epoch": 5988} {"train_loss": -27.368810653686523, "global_step": 497074, "epoch": 5988} {"train_loss": -27.41872215270996, "global_step": 497075, "epoch": 5988} {"train_loss": -26.946081161499023, "global_step": 497076, "epoch": 5988} {"train_loss": -27.03141212463379, "global_step": 497077, "epoch": 5988} {"train_loss": -27.099512100219727, "global_step": 497078, "epoch": 5988} {"train_loss": -26.739938735961914, "global_step": 497079, "epoch": 5988} {"train_loss": -27.085859298706055, "global_step": 497080, "epoch": 5988} {"train_loss": -26.4032039642334, "global_step": 497081, "epoch": 5988} {"train_loss": -26.718679428100586, "global_step": 497082, "epoch": 5988} {"train_loss": -27.136526107788086, "global_step": 497083, "epoch": 5988} {"train_loss": -27.557727813720703, "global_step": 497084, "epoch": 5988} {"train_loss": -26.767047882080078, "global_step": 497085, "epoch": 5988} {"train_loss": -27.188041043568806, "global_step": 497086, "epoch": 5988, "val_loss": 6609516.0} {"train_loss": -25.569869995117188, "global_step": 497087, "epoch": 5989} {"train_loss": -24.978271484375, "global_step": 497088, "epoch": 5989} {"train_loss": -26.474777221679688, "global_step": 497089, "epoch": 5989} {"train_loss": -25.87104606628418, "global_step": 497090, "epoch": 5989} {"train_loss": -26.71708106994629, "global_step": 497091, "epoch": 5989} {"train_loss": -26.11812400817871, "global_step": 497092, "epoch": 5989} {"train_loss": -26.18206787109375, "global_step": 497093, "epoch": 5989} {"train_loss": -26.6937313079834, "global_step": 497094, "epoch": 5989} {"train_loss": -26.39644432067871, "global_step": 497095, "epoch": 5989} {"train_loss": -27.035612106323242, "global_step": 497096, "epoch": 5989} {"train_loss": -26.67377281188965, "global_step": 497097, "epoch": 5989} {"train_loss": -26.817773818969727, "global_step": 497098, "epoch": 5989} {"train_loss": -26.439544677734375, "global_step": 497099, "epoch": 5989} {"train_loss": -26.657445907592773, "global_step": 497100, "epoch": 5989} {"train_loss": -26.9787654876709, "global_step": 497101, "epoch": 5989} {"train_loss": -26.83261489868164, "global_step": 497102, "epoch": 5989} {"train_loss": -26.637414932250977, "global_step": 497103, "epoch": 5989} {"train_loss": -27.007156372070312, "global_step": 497104, "epoch": 5989} {"train_loss": -26.84159278869629, "global_step": 497105, "epoch": 5989} {"train_loss": -27.110824584960938, "global_step": 497106, "epoch": 5989} {"train_loss": -26.821399688720703, "global_step": 497107, "epoch": 5989} {"train_loss": -26.77033042907715, "global_step": 497108, "epoch": 5989} {"train_loss": -27.02461051940918, "global_step": 497109, "epoch": 5989} {"train_loss": -27.131484985351562, "global_step": 497110, "epoch": 5989} {"train_loss": -27.144662857055664, "global_step": 497111, "epoch": 5989} {"train_loss": -26.931873321533203, "global_step": 497112, "epoch": 5989} {"train_loss": -27.279346466064453, "global_step": 497113, "epoch": 5989} {"train_loss": -27.052520751953125, "global_step": 497114, "epoch": 5989} {"train_loss": -27.147565841674805, "global_step": 497115, "epoch": 5989} {"train_loss": -27.360498428344727, "global_step": 497116, "epoch": 5989} {"train_loss": -27.526098251342773, "global_step": 497117, "epoch": 5989} {"train_loss": -27.01629638671875, "global_step": 497118, "epoch": 5989} {"train_loss": -27.26947593688965, "global_step": 497119, "epoch": 5989} {"train_loss": -27.70521354675293, "global_step": 497120, "epoch": 5989} {"train_loss": -27.426864624023438, "global_step": 497121, "epoch": 5989} {"train_loss": -27.29249382019043, "global_step": 497122, "epoch": 5989} {"train_loss": -27.168304443359375, "global_step": 497123, "epoch": 5989} {"train_loss": -27.567880630493164, "global_step": 497124, "epoch": 5989} {"train_loss": -27.5802059173584, "global_step": 497125, "epoch": 5989} {"train_loss": -27.50398063659668, "global_step": 497126, "epoch": 5989} {"train_loss": -27.529129028320312, "global_step": 497127, "epoch": 5989} {"train_loss": -27.629743576049805, "global_step": 497128, "epoch": 5989} {"train_loss": -27.68082046508789, "global_step": 497129, "epoch": 5989} {"train_loss": -27.438217163085938, "global_step": 497130, "epoch": 5989} {"train_loss": -27.668079376220703, "global_step": 497131, "epoch": 5989} {"train_loss": -27.681396484375, "global_step": 497132, "epoch": 5989} {"train_loss": -27.41182518005371, "global_step": 497133, "epoch": 5989} {"train_loss": -27.568267822265625, "global_step": 497134, "epoch": 5989} {"train_loss": -27.645612716674805, "global_step": 497135, "epoch": 5989} {"train_loss": -27.575895309448242, "global_step": 497136, "epoch": 5989} {"train_loss": -27.730457305908203, "global_step": 497137, "epoch": 5989} {"train_loss": -27.559057235717773, "global_step": 497138, "epoch": 5989} {"train_loss": -27.210538864135742, "global_step": 497139, "epoch": 5989} {"train_loss": -27.498291015625, "global_step": 497140, "epoch": 5989} {"train_loss": -27.444156646728516, "global_step": 497141, "epoch": 5989} {"train_loss": -27.608917236328125, "global_step": 497142, "epoch": 5989} {"train_loss": -27.39580726623535, "global_step": 497143, "epoch": 5989} {"train_loss": -27.21046257019043, "global_step": 497144, "epoch": 5989} {"train_loss": -26.44171142578125, "global_step": 497145, "epoch": 5989} {"train_loss": -26.418893814086914, "global_step": 497146, "epoch": 5989} {"train_loss": -26.6076602935791, "global_step": 497147, "epoch": 5989} {"train_loss": -27.109323501586914, "global_step": 497148, "epoch": 5989} {"train_loss": -27.69637107849121, "global_step": 497149, "epoch": 5989} {"train_loss": -27.1959228515625, "global_step": 497150, "epoch": 5989} {"train_loss": -27.276220321655273, "global_step": 497151, "epoch": 5989} {"train_loss": -27.309040069580078, "global_step": 497152, "epoch": 5989} {"train_loss": -27.168394088745117, "global_step": 497153, "epoch": 5989} {"train_loss": -27.01065444946289, "global_step": 497154, "epoch": 5989} {"train_loss": -27.27064323425293, "global_step": 497155, "epoch": 5989} {"train_loss": -27.009885787963867, "global_step": 497156, "epoch": 5989} {"train_loss": -27.433340072631836, "global_step": 497157, "epoch": 5989} {"train_loss": -27.16292381286621, "global_step": 497158, "epoch": 5989} {"train_loss": -27.152616500854492, "global_step": 497159, "epoch": 5989} {"train_loss": -27.528135299682617, "global_step": 497160, "epoch": 5989} {"train_loss": -27.265485763549805, "global_step": 497161, "epoch": 5989} {"train_loss": -27.47035026550293, "global_step": 497162, "epoch": 5989} {"train_loss": -27.498517990112305, "global_step": 497163, "epoch": 5989} {"train_loss": -27.12017822265625, "global_step": 497164, "epoch": 5989} {"train_loss": -27.08164405822754, "global_step": 497165, "epoch": 5989} {"train_loss": -26.917556762695312, "global_step": 497166, "epoch": 5989} {"train_loss": -27.650482177734375, "global_step": 497167, "epoch": 5989} {"train_loss": -27.246448516845703, "global_step": 497168, "epoch": 5989} {"train_loss": -27.09101635576731, "global_step": 497169, "epoch": 5989, "val_loss": 6590166.0} {"train_loss": -24.05011749267578, "global_step": 497170, "epoch": 5990} {"train_loss": -25.21078872680664, "global_step": 497171, "epoch": 5990} {"train_loss": -26.394880294799805, "global_step": 497172, "epoch": 5990} {"train_loss": -26.198110580444336, "global_step": 497173, "epoch": 5990} {"train_loss": -26.021764755249023, "global_step": 497174, "epoch": 5990} {"train_loss": -26.569625854492188, "global_step": 497175, "epoch": 5990} {"train_loss": -26.40333366394043, "global_step": 497176, "epoch": 5990} {"train_loss": -26.60597038269043, "global_step": 497177, "epoch": 5990} {"train_loss": -26.579254150390625, "global_step": 497178, "epoch": 5990} {"train_loss": -27.07611656188965, "global_step": 497179, "epoch": 5990} {"train_loss": -26.659650802612305, "global_step": 497180, "epoch": 5990} {"train_loss": -26.72182273864746, "global_step": 497181, "epoch": 5990} {"train_loss": -26.57248306274414, "global_step": 497182, "epoch": 5990} {"train_loss": -26.617151260375977, "global_step": 497183, "epoch": 5990} {"train_loss": -27.095510482788086, "global_step": 497184, "epoch": 5990} {"train_loss": -26.760852813720703, "global_step": 497185, "epoch": 5990} {"train_loss": -26.805561065673828, "global_step": 497186, "epoch": 5990} {"train_loss": -27.311140060424805, "global_step": 497187, "epoch": 5990} {"train_loss": -26.987775802612305, "global_step": 497188, "epoch": 5990} {"train_loss": -26.90851402282715, "global_step": 497189, "epoch": 5990} {"train_loss": -27.122695922851562, "global_step": 497190, "epoch": 5990} {"train_loss": -27.2429256439209, "global_step": 497191, "epoch": 5990} {"train_loss": -26.842748641967773, "global_step": 497192, "epoch": 5990} {"train_loss": -26.84174156188965, "global_step": 497193, "epoch": 5990} {"train_loss": -26.921798706054688, "global_step": 497194, "epoch": 5990} {"train_loss": -26.896472930908203, "global_step": 497195, "epoch": 5990} {"train_loss": -26.99848747253418, "global_step": 497196, "epoch": 5990} {"train_loss": -26.950483322143555, "global_step": 497197, "epoch": 5990} {"train_loss": -27.08624839782715, "global_step": 497198, "epoch": 5990} {"train_loss": -27.185333251953125, "global_step": 497199, "epoch": 5990} {"train_loss": -26.997961044311523, "global_step": 497200, "epoch": 5990} {"train_loss": -27.401708602905273, "global_step": 497201, "epoch": 5990} {"train_loss": -27.355457305908203, "global_step": 497202, "epoch": 5990} {"train_loss": -27.431528091430664, "global_step": 497203, "epoch": 5990} {"train_loss": -27.375869750976562, "global_step": 497204, "epoch": 5990} {"train_loss": -27.434982299804688, "global_step": 497205, "epoch": 5990} {"train_loss": -27.02865982055664, "global_step": 497206, "epoch": 5990} {"train_loss": -27.335342407226562, "global_step": 497207, "epoch": 5990} {"train_loss": -27.180038452148438, "global_step": 497208, "epoch": 5990} {"train_loss": -27.658212661743164, "global_step": 497209, "epoch": 5990} {"train_loss": -27.31855583190918, "global_step": 497210, "epoch": 5990} {"train_loss": -27.347681045532227, "global_step": 497211, "epoch": 5990} {"train_loss": -27.157596588134766, "global_step": 497212, "epoch": 5990} {"train_loss": -27.446271896362305, "global_step": 497213, "epoch": 5990} {"train_loss": -27.812490463256836, "global_step": 497214, "epoch": 5990} {"train_loss": -27.56965446472168, "global_step": 497215, "epoch": 5990} {"train_loss": -27.5803279876709, "global_step": 497216, "epoch": 5990} {"train_loss": -27.462980270385742, "global_step": 497217, "epoch": 5990} {"train_loss": -27.3078670501709, "global_step": 497218, "epoch": 5990} {"train_loss": -27.30633544921875, "global_step": 497219, "epoch": 5990} {"train_loss": -27.467426300048828, "global_step": 497220, "epoch": 5990} {"train_loss": -27.395828247070312, "global_step": 497221, "epoch": 5990} {"train_loss": -27.6706600189209, "global_step": 497222, "epoch": 5990} {"train_loss": -27.728870391845703, "global_step": 497223, "epoch": 5990} {"train_loss": -27.609821319580078, "global_step": 497224, "epoch": 5990} {"train_loss": -27.846677780151367, "global_step": 497225, "epoch": 5990} {"train_loss": -27.68831443786621, "global_step": 497226, "epoch": 5990} {"train_loss": -27.06367301940918, "global_step": 497227, "epoch": 5990} {"train_loss": -27.386449813842773, "global_step": 497228, "epoch": 5990} {"train_loss": -27.139280319213867, "global_step": 497229, "epoch": 5990} {"train_loss": -27.558813095092773, "global_step": 497230, "epoch": 5990} {"train_loss": -27.80217933654785, "global_step": 497231, "epoch": 5990} {"train_loss": -27.504247665405273, "global_step": 497232, "epoch": 5990} {"train_loss": -27.3388614654541, "global_step": 497233, "epoch": 5990} {"train_loss": -27.67781639099121, "global_step": 497234, "epoch": 5990} {"train_loss": -27.536304473876953, "global_step": 497235, "epoch": 5990} {"train_loss": -27.331018447875977, "global_step": 497236, "epoch": 5990} {"train_loss": -27.888324737548828, "global_step": 497237, "epoch": 5990} {"train_loss": -27.230504989624023, "global_step": 497238, "epoch": 5990} {"train_loss": -27.388593673706055, "global_step": 497239, "epoch": 5990} {"train_loss": -27.74969482421875, "global_step": 497240, "epoch": 5990} {"train_loss": -27.375015258789062, "global_step": 497241, "epoch": 5990} {"train_loss": -27.285785675048828, "global_step": 497242, "epoch": 5990} {"train_loss": -27.471393585205078, "global_step": 497243, "epoch": 5990} {"train_loss": -27.3494873046875, "global_step": 497244, "epoch": 5990} {"train_loss": -27.78323745727539, "global_step": 497245, "epoch": 5990} {"train_loss": -27.680404663085938, "global_step": 497246, "epoch": 5990} {"train_loss": -27.42578125, "global_step": 497247, "epoch": 5990} {"train_loss": -27.332361221313477, "global_step": 497248, "epoch": 5990} {"train_loss": -27.562768936157227, "global_step": 497249, "epoch": 5990} {"train_loss": -27.289398193359375, "global_step": 497250, "epoch": 5990} {"train_loss": -27.22458839416504, "global_step": 497251, "epoch": 5990} {"train_loss": -27.167218863245953, "global_step": 497252, "epoch": 5990, "val_loss": 6605777.0} {"train_loss": -26.884674072265625, "global_step": 497253, "epoch": 5991} {"train_loss": -26.80817985534668, "global_step": 497254, "epoch": 5991} {"train_loss": -26.874969482421875, "global_step": 497255, "epoch": 5991} {"train_loss": -26.99880027770996, "global_step": 497256, "epoch": 5991} {"train_loss": -27.00798988342285, "global_step": 497257, "epoch": 5991} {"train_loss": -26.322484970092773, "global_step": 497258, "epoch": 5991} {"train_loss": -27.131845474243164, "global_step": 497259, "epoch": 5991} {"train_loss": -27.09140968322754, "global_step": 497260, "epoch": 5991} {"train_loss": -26.990863800048828, "global_step": 497261, "epoch": 5991} {"train_loss": -27.26746940612793, "global_step": 497262, "epoch": 5991} {"train_loss": -27.098073959350586, "global_step": 497263, "epoch": 5991} {"train_loss": -26.96497917175293, "global_step": 497264, "epoch": 5991} {"train_loss": -27.115636825561523, "global_step": 497265, "epoch": 5991} {"train_loss": -27.1539363861084, "global_step": 497266, "epoch": 5991} {"train_loss": -27.258331298828125, "global_step": 497267, "epoch": 5991} {"train_loss": -26.964941024780273, "global_step": 497268, "epoch": 5991} {"train_loss": -27.1143741607666, "global_step": 497269, "epoch": 5991} {"train_loss": -27.17449378967285, "global_step": 497270, "epoch": 5991} {"train_loss": -27.538299560546875, "global_step": 497271, "epoch": 5991} {"train_loss": -27.577917098999023, "global_step": 497272, "epoch": 5991} {"train_loss": -27.561279296875, "global_step": 497273, "epoch": 5991} {"train_loss": -27.444091796875, "global_step": 497274, "epoch": 5991} {"train_loss": -27.4908447265625, "global_step": 497275, "epoch": 5991} {"train_loss": -27.100055694580078, "global_step": 497276, "epoch": 5991} {"train_loss": -27.546295166015625, "global_step": 497277, "epoch": 5991} {"train_loss": -27.099760055541992, "global_step": 497278, "epoch": 5991} {"train_loss": -27.58756446838379, "global_step": 497279, "epoch": 5991} {"train_loss": -27.48267936706543, "global_step": 497280, "epoch": 5991} {"train_loss": -27.265104293823242, "global_step": 497281, "epoch": 5991} {"train_loss": -27.37635612487793, "global_step": 497282, "epoch": 5991} {"train_loss": -27.593664169311523, "global_step": 497283, "epoch": 5991} {"train_loss": -27.671173095703125, "global_step": 497284, "epoch": 5991} {"train_loss": -27.433368682861328, "global_step": 497285, "epoch": 5991} {"train_loss": -27.439191818237305, "global_step": 497286, "epoch": 5991} {"train_loss": -27.474817276000977, "global_step": 497287, "epoch": 5991} {"train_loss": -27.33393669128418, "global_step": 497288, "epoch": 5991} {"train_loss": -27.29599380493164, "global_step": 497289, "epoch": 5991} {"train_loss": -27.3651180267334, "global_step": 497290, "epoch": 5991} {"train_loss": -27.557397842407227, "global_step": 497291, "epoch": 5991} {"train_loss": -27.657514572143555, "global_step": 497292, "epoch": 5991} {"train_loss": -27.334814071655273, "global_step": 497293, "epoch": 5991} {"train_loss": -27.56757926940918, "global_step": 497294, "epoch": 5991} {"train_loss": -27.686920166015625, "global_step": 497295, "epoch": 5991} {"train_loss": -27.8654727935791, "global_step": 497296, "epoch": 5991} {"train_loss": -27.284229278564453, "global_step": 497297, "epoch": 5991} {"train_loss": -27.31902503967285, "global_step": 497298, "epoch": 5991} {"train_loss": -27.148151397705078, "global_step": 497299, "epoch": 5991} {"train_loss": -27.704803466796875, "global_step": 497300, "epoch": 5991} {"train_loss": -27.47385597229004, "global_step": 497301, "epoch": 5991} {"train_loss": -26.8145694732666, "global_step": 497302, "epoch": 5991} {"train_loss": -27.04292869567871, "global_step": 497303, "epoch": 5991} {"train_loss": -27.19659423828125, "global_step": 497304, "epoch": 5991} {"train_loss": -27.132038116455078, "global_step": 497305, "epoch": 5991} {"train_loss": -27.176198959350586, "global_step": 497306, "epoch": 5991} {"train_loss": -27.3978328704834, "global_step": 497307, "epoch": 5991} {"train_loss": -27.19122314453125, "global_step": 497308, "epoch": 5991} {"train_loss": -26.866987228393555, "global_step": 497309, "epoch": 5991} {"train_loss": -27.258075714111328, "global_step": 497310, "epoch": 5991} {"train_loss": -27.4986515045166, "global_step": 497311, "epoch": 5991} {"train_loss": -27.24602699279785, "global_step": 497312, "epoch": 5991} {"train_loss": -27.322668075561523, "global_step": 497313, "epoch": 5991} {"train_loss": -27.149816513061523, "global_step": 497314, "epoch": 5991} {"train_loss": -27.2301082611084, "global_step": 497315, "epoch": 5991} {"train_loss": -27.313215255737305, "global_step": 497316, "epoch": 5991} {"train_loss": -27.245803833007812, "global_step": 497317, "epoch": 5991} {"train_loss": -27.295392990112305, "global_step": 497318, "epoch": 5991} {"train_loss": -27.56222915649414, "global_step": 497319, "epoch": 5991} {"train_loss": -27.1964168548584, "global_step": 497320, "epoch": 5991} {"train_loss": -27.74161720275879, "global_step": 497321, "epoch": 5991} {"train_loss": -27.241409301757812, "global_step": 497322, "epoch": 5991} {"train_loss": -27.218671798706055, "global_step": 497323, "epoch": 5991} {"train_loss": -27.382837295532227, "global_step": 497324, "epoch": 5991} {"train_loss": -27.17574119567871, "global_step": 497325, "epoch": 5991} {"train_loss": -26.917810440063477, "global_step": 497326, "epoch": 5991} {"train_loss": -27.064056396484375, "global_step": 497327, "epoch": 5991} {"train_loss": -27.506866455078125, "global_step": 497328, "epoch": 5991} {"train_loss": -27.589344024658203, "global_step": 497329, "epoch": 5991} {"train_loss": -27.196470260620117, "global_step": 497330, "epoch": 5991} {"train_loss": -27.587158203125, "global_step": 497331, "epoch": 5991} {"train_loss": -27.20770263671875, "global_step": 497332, "epoch": 5991} {"train_loss": -27.1168212890625, "global_step": 497333, "epoch": 5991} {"train_loss": -27.431493759155273, "global_step": 497334, "epoch": 5991} {"train_loss": -27.2760107201266, "global_step": 497335, "epoch": 5991, "val_loss": 6639766.5} {"train_loss": -27.4571475982666, "global_step": 497336, "epoch": 5992} {"train_loss": -27.020307540893555, "global_step": 497337, "epoch": 5992} {"train_loss": -27.282194137573242, "global_step": 497338, "epoch": 5992} {"train_loss": -26.84193992614746, "global_step": 497339, "epoch": 5992} {"train_loss": -26.517414093017578, "global_step": 497340, "epoch": 5992} {"train_loss": -27.125513076782227, "global_step": 497341, "epoch": 5992} {"train_loss": -27.068714141845703, "global_step": 497342, "epoch": 5992} {"train_loss": -27.178613662719727, "global_step": 497343, "epoch": 5992} {"train_loss": -27.09964942932129, "global_step": 497344, "epoch": 5992} {"train_loss": -27.19807243347168, "global_step": 497345, "epoch": 5992} {"train_loss": -26.64642906188965, "global_step": 497346, "epoch": 5992} {"train_loss": -27.07539176940918, "global_step": 497347, "epoch": 5992} {"train_loss": -26.72410011291504, "global_step": 497348, "epoch": 5992} {"train_loss": -26.83294677734375, "global_step": 497349, "epoch": 5992} {"train_loss": -27.570209503173828, "global_step": 497350, "epoch": 5992} {"train_loss": -27.442296981811523, "global_step": 497351, "epoch": 5992} {"train_loss": -27.40630531311035, "global_step": 497352, "epoch": 5992} {"train_loss": -27.349531173706055, "global_step": 497353, "epoch": 5992} {"train_loss": -27.44598960876465, "global_step": 497354, "epoch": 5992} {"train_loss": -27.412683486938477, "global_step": 497355, "epoch": 5992} {"train_loss": -27.2713623046875, "global_step": 497356, "epoch": 5992} {"train_loss": -27.292516708374023, "global_step": 497357, "epoch": 5992} {"train_loss": -27.14896011352539, "global_step": 497358, "epoch": 5992} {"train_loss": -27.145587921142578, "global_step": 497359, "epoch": 5992} {"train_loss": -27.601032257080078, "global_step": 497360, "epoch": 5992} {"train_loss": -27.283246994018555, "global_step": 497361, "epoch": 5992} {"train_loss": -27.435943603515625, "global_step": 497362, "epoch": 5992} {"train_loss": -27.363056182861328, "global_step": 497363, "epoch": 5992} {"train_loss": -27.818470001220703, "global_step": 497364, "epoch": 5992} {"train_loss": -27.61004066467285, "global_step": 497365, "epoch": 5992} {"train_loss": -27.753904342651367, "global_step": 497366, "epoch": 5992} {"train_loss": -27.45242691040039, "global_step": 497367, "epoch": 5992} {"train_loss": -28.1766357421875, "global_step": 497368, "epoch": 5992} {"train_loss": -27.718341827392578, "global_step": 497369, "epoch": 5992} {"train_loss": -27.630390167236328, "global_step": 497370, "epoch": 5992} {"train_loss": -26.90369987487793, "global_step": 497371, "epoch": 5992} {"train_loss": -27.354480743408203, "global_step": 497372, "epoch": 5992} {"train_loss": -27.22711753845215, "global_step": 497373, "epoch": 5992} {"train_loss": -27.433935165405273, "global_step": 497374, "epoch": 5992} {"train_loss": -27.5947265625, "global_step": 497375, "epoch": 5992} {"train_loss": -27.495771408081055, "global_step": 497376, "epoch": 5992} {"train_loss": -27.480932235717773, "global_step": 497377, "epoch": 5992} {"train_loss": -27.12131118774414, "global_step": 497378, "epoch": 5992} {"train_loss": -27.238203048706055, "global_step": 497379, "epoch": 5992} {"train_loss": -27.589298248291016, "global_step": 497380, "epoch": 5992} {"train_loss": -27.50931739807129, "global_step": 497381, "epoch": 5992} {"train_loss": -27.48702049255371, "global_step": 497382, "epoch": 5992} {"train_loss": -27.354673385620117, "global_step": 497383, "epoch": 5992} {"train_loss": -27.712675094604492, "global_step": 497384, "epoch": 5992} {"train_loss": -26.811756134033203, "global_step": 497385, "epoch": 5992} {"train_loss": -27.10870933532715, "global_step": 497386, "epoch": 5992} {"train_loss": -27.54831886291504, "global_step": 497387, "epoch": 5992} {"train_loss": -27.02445411682129, "global_step": 497388, "epoch": 5992} {"train_loss": -27.58881187438965, "global_step": 497389, "epoch": 5992} {"train_loss": -26.90447425842285, "global_step": 497390, "epoch": 5992} {"train_loss": -27.860157012939453, "global_step": 497391, "epoch": 5992} {"train_loss": -27.189435958862305, "global_step": 497392, "epoch": 5992} {"train_loss": -27.239089965820312, "global_step": 497393, "epoch": 5992} {"train_loss": -27.727588653564453, "global_step": 497394, "epoch": 5992} {"train_loss": -27.08087730407715, "global_step": 497395, "epoch": 5992} {"train_loss": -27.281635284423828, "global_step": 497396, "epoch": 5992} {"train_loss": -26.943227767944336, "global_step": 497397, "epoch": 5992} {"train_loss": -27.2154598236084, "global_step": 497398, "epoch": 5992} {"train_loss": -27.2020206451416, "global_step": 497399, "epoch": 5992} {"train_loss": -27.371078491210938, "global_step": 497400, "epoch": 5992} {"train_loss": -27.012317657470703, "global_step": 497401, "epoch": 5992} {"train_loss": -27.302093505859375, "global_step": 497402, "epoch": 5992} {"train_loss": -27.409048080444336, "global_step": 497403, "epoch": 5992} {"train_loss": -26.835721969604492, "global_step": 497404, "epoch": 5992} {"train_loss": -27.213428497314453, "global_step": 497405, "epoch": 5992} {"train_loss": -27.171436309814453, "global_step": 497406, "epoch": 5992} {"train_loss": -27.460189819335938, "global_step": 497407, "epoch": 5992} {"train_loss": -27.46470069885254, "global_step": 497408, "epoch": 5992} {"train_loss": -27.411222457885742, "global_step": 497409, "epoch": 5992} {"train_loss": -27.122589111328125, "global_step": 497410, "epoch": 5992} {"train_loss": -27.18475341796875, "global_step": 497411, "epoch": 5992} {"train_loss": -27.298147201538086, "global_step": 497412, "epoch": 5992} {"train_loss": -26.99700927734375, "global_step": 497413, "epoch": 5992} {"train_loss": -27.51820182800293, "global_step": 497414, "epoch": 5992} {"train_loss": -27.155813217163086, "global_step": 497415, "epoch": 5992} {"train_loss": -27.187788009643555, "global_step": 497416, "epoch": 5992} {"train_loss": -27.48227310180664, "global_step": 497417, "epoch": 5992} {"train_loss": -27.313423041837762, "global_step": 497418, "epoch": 5992, "val_loss": 6577603.5} {"train_loss": -26.86981201171875, "global_step": 497419, "epoch": 5993} {"train_loss": -25.951465606689453, "global_step": 497420, "epoch": 5993} {"train_loss": -26.29139518737793, "global_step": 497421, "epoch": 5993} {"train_loss": -27.22615623474121, "global_step": 497422, "epoch": 5993} {"train_loss": -26.825010299682617, "global_step": 497423, "epoch": 5993} {"train_loss": -27.01837730407715, "global_step": 497424, "epoch": 5993} {"train_loss": -26.765399932861328, "global_step": 497425, "epoch": 5993} {"train_loss": -27.209247589111328, "global_step": 497426, "epoch": 5993} {"train_loss": -27.443761825561523, "global_step": 497427, "epoch": 5993} {"train_loss": -26.905004501342773, "global_step": 497428, "epoch": 5993} {"train_loss": -27.419708251953125, "global_step": 497429, "epoch": 5993} {"train_loss": -26.902551651000977, "global_step": 497430, "epoch": 5993} {"train_loss": -27.133209228515625, "global_step": 497431, "epoch": 5993} {"train_loss": -27.104528427124023, "global_step": 497432, "epoch": 5993} {"train_loss": -27.376846313476562, "global_step": 497433, "epoch": 5993} {"train_loss": -27.1557674407959, "global_step": 497434, "epoch": 5993} {"train_loss": -27.42622947692871, "global_step": 497435, "epoch": 5993} {"train_loss": -27.404516220092773, "global_step": 497436, "epoch": 5993} {"train_loss": -27.2059268951416, "global_step": 497437, "epoch": 5993} {"train_loss": -27.25896644592285, "global_step": 497438, "epoch": 5993} {"train_loss": -27.64896583557129, "global_step": 497439, "epoch": 5993} {"train_loss": -27.36991310119629, "global_step": 497440, "epoch": 5993} {"train_loss": -27.324918746948242, "global_step": 497441, "epoch": 5993} {"train_loss": -27.578296661376953, "global_step": 497442, "epoch": 5993} {"train_loss": -27.253076553344727, "global_step": 497443, "epoch": 5993} {"train_loss": -27.363815307617188, "global_step": 497444, "epoch": 5993} {"train_loss": -27.46148681640625, "global_step": 497445, "epoch": 5993} {"train_loss": -27.378173828125, "global_step": 497446, "epoch": 5993} {"train_loss": -27.594573974609375, "global_step": 497447, "epoch": 5993} {"train_loss": -27.317462921142578, "global_step": 497448, "epoch": 5993} {"train_loss": -27.511438369750977, "global_step": 497449, "epoch": 5993} {"train_loss": -27.587589263916016, "global_step": 497450, "epoch": 5993} {"train_loss": -27.60292625427246, "global_step": 497451, "epoch": 5993} {"train_loss": -27.691354751586914, "global_step": 497452, "epoch": 5993} {"train_loss": -27.172607421875, "global_step": 497453, "epoch": 5993} {"train_loss": -27.515310287475586, "global_step": 497454, "epoch": 5993} {"train_loss": -27.951135635375977, "global_step": 497455, "epoch": 5993} {"train_loss": -27.736469268798828, "global_step": 497456, "epoch": 5993} {"train_loss": -27.29497718811035, "global_step": 497457, "epoch": 5993} {"train_loss": -27.453948974609375, "global_step": 497458, "epoch": 5993} {"train_loss": -27.1879825592041, "global_step": 497459, "epoch": 5993} {"train_loss": -27.588369369506836, "global_step": 497460, "epoch": 5993} {"train_loss": -27.36985206604004, "global_step": 497461, "epoch": 5993} {"train_loss": -27.573083877563477, "global_step": 497462, "epoch": 5993} {"train_loss": -26.941442489624023, "global_step": 497463, "epoch": 5993} {"train_loss": -27.000232696533203, "global_step": 497464, "epoch": 5993} {"train_loss": -26.990331649780273, "global_step": 497465, "epoch": 5993} {"train_loss": -27.350666046142578, "global_step": 497466, "epoch": 5993} {"train_loss": -26.903501510620117, "global_step": 497467, "epoch": 5993} {"train_loss": -26.662656784057617, "global_step": 497468, "epoch": 5993} {"train_loss": -26.464197158813477, "global_step": 497469, "epoch": 5993} {"train_loss": -26.295881271362305, "global_step": 497470, "epoch": 5993} {"train_loss": -26.72705078125, "global_step": 497471, "epoch": 5993} {"train_loss": -27.243356704711914, "global_step": 497472, "epoch": 5993} {"train_loss": -26.960132598876953, "global_step": 497473, "epoch": 5993} {"train_loss": -27.277057647705078, "global_step": 497474, "epoch": 5993} {"train_loss": -27.113080978393555, "global_step": 497475, "epoch": 5993} {"train_loss": -26.94068717956543, "global_step": 497476, "epoch": 5993} {"train_loss": -27.256576538085938, "global_step": 497477, "epoch": 5993} {"train_loss": -26.92645263671875, "global_step": 497478, "epoch": 5993} {"train_loss": -26.86151123046875, "global_step": 497479, "epoch": 5993} {"train_loss": -27.216466903686523, "global_step": 497480, "epoch": 5993} {"train_loss": -27.29135513305664, "global_step": 497481, "epoch": 5993} {"train_loss": -26.93520164489746, "global_step": 497482, "epoch": 5993} {"train_loss": -27.0338191986084, "global_step": 497483, "epoch": 5993} {"train_loss": -27.659957885742188, "global_step": 497484, "epoch": 5993} {"train_loss": -27.375244140625, "global_step": 497485, "epoch": 5993} {"train_loss": -27.143224716186523, "global_step": 497486, "epoch": 5993} {"train_loss": -27.030866622924805, "global_step": 497487, "epoch": 5993} {"train_loss": -26.982648849487305, "global_step": 497488, "epoch": 5993} {"train_loss": -27.305419921875, "global_step": 497489, "epoch": 5993} {"train_loss": -27.11820411682129, "global_step": 497490, "epoch": 5993} {"train_loss": -26.952728271484375, "global_step": 497491, "epoch": 5993} {"train_loss": -27.119653701782227, "global_step": 497492, "epoch": 5993} {"train_loss": -27.209257125854492, "global_step": 497493, "epoch": 5993} {"train_loss": -27.38052749633789, "global_step": 497494, "epoch": 5993} {"train_loss": -27.313800811767578, "global_step": 497495, "epoch": 5993} {"train_loss": -27.523279190063477, "global_step": 497496, "epoch": 5993} {"train_loss": -27.287860870361328, "global_step": 497497, "epoch": 5993} {"train_loss": -27.720457077026367, "global_step": 497498, "epoch": 5993} {"train_loss": -26.98118019104004, "global_step": 497499, "epoch": 5993} {"train_loss": -27.437091827392578, "global_step": 497500, "epoch": 5993} {"train_loss": -27.21852913822036, "global_step": 497501, "epoch": 5993, "val_loss": 6587736.0} {"train_loss": -26.65183448791504, "global_step": 497502, "epoch": 5994} {"train_loss": -26.79634666442871, "global_step": 497503, "epoch": 5994} {"train_loss": -27.316186904907227, "global_step": 497504, "epoch": 5994} {"train_loss": -26.85000991821289, "global_step": 497505, "epoch": 5994} {"train_loss": -26.76535415649414, "global_step": 497506, "epoch": 5994} {"train_loss": -27.022418975830078, "global_step": 497507, "epoch": 5994} {"train_loss": -27.104597091674805, "global_step": 497508, "epoch": 5994} {"train_loss": -27.088525772094727, "global_step": 497509, "epoch": 5994} {"train_loss": -26.905029296875, "global_step": 497510, "epoch": 5994} {"train_loss": -27.262845993041992, "global_step": 497511, "epoch": 5994} {"train_loss": -26.991132736206055, "global_step": 497512, "epoch": 5994} {"train_loss": -27.1379337310791, "global_step": 497513, "epoch": 5994} {"train_loss": -27.0772705078125, "global_step": 497514, "epoch": 5994} {"train_loss": -27.598621368408203, "global_step": 497515, "epoch": 5994} {"train_loss": -27.30374526977539, "global_step": 497516, "epoch": 5994} {"train_loss": -26.79007911682129, "global_step": 497517, "epoch": 5994} {"train_loss": -27.18732261657715, "global_step": 497518, "epoch": 5994} {"train_loss": -27.275964736938477, "global_step": 497519, "epoch": 5994} {"train_loss": -26.925928115844727, "global_step": 497520, "epoch": 5994} {"train_loss": -27.04848289489746, "global_step": 497521, "epoch": 5994} {"train_loss": -27.793264389038086, "global_step": 497522, "epoch": 5994} {"train_loss": -26.852582931518555, "global_step": 497523, "epoch": 5994} {"train_loss": -27.10050392150879, "global_step": 497524, "epoch": 5994} {"train_loss": -26.69172477722168, "global_step": 497525, "epoch": 5994} {"train_loss": -27.034744262695312, "global_step": 497526, "epoch": 5994} {"train_loss": -27.531021118164062, "global_step": 497527, "epoch": 5994} {"train_loss": -27.004194259643555, "global_step": 497528, "epoch": 5994} {"train_loss": -27.310577392578125, "global_step": 497529, "epoch": 5994} {"train_loss": -27.166656494140625, "global_step": 497530, "epoch": 5994} {"train_loss": -27.34415626525879, "global_step": 497531, "epoch": 5994} {"train_loss": -27.010135650634766, "global_step": 497532, "epoch": 5994} {"train_loss": -27.380765914916992, "global_step": 497533, "epoch": 5994} {"train_loss": -27.253400802612305, "global_step": 497534, "epoch": 5994} {"train_loss": -27.63319969177246, "global_step": 497535, "epoch": 5994} {"train_loss": -26.956409454345703, "global_step": 497536, "epoch": 5994} {"train_loss": -27.58111000061035, "global_step": 497537, "epoch": 5994} {"train_loss": -27.064634323120117, "global_step": 497538, "epoch": 5994} {"train_loss": -27.326135635375977, "global_step": 497539, "epoch": 5994} {"train_loss": -26.70843505859375, "global_step": 497540, "epoch": 5994} {"train_loss": -27.49454116821289, "global_step": 497541, "epoch": 5994} {"train_loss": -27.368677139282227, "global_step": 497542, "epoch": 5994} {"train_loss": -27.206085205078125, "global_step": 497543, "epoch": 5994} {"train_loss": -27.257596969604492, "global_step": 497544, "epoch": 5994} {"train_loss": -27.14447021484375, "global_step": 497545, "epoch": 5994} {"train_loss": -27.23822021484375, "global_step": 497546, "epoch": 5994} {"train_loss": -27.63028335571289, "global_step": 497547, "epoch": 5994} {"train_loss": -27.599721908569336, "global_step": 497548, "epoch": 5994} {"train_loss": -27.43212890625, "global_step": 497549, "epoch": 5994} {"train_loss": -27.034183502197266, "global_step": 497550, "epoch": 5994} {"train_loss": -27.23270606994629, "global_step": 497551, "epoch": 5994} {"train_loss": -27.4820499420166, "global_step": 497552, "epoch": 5994} {"train_loss": -27.07215690612793, "global_step": 497553, "epoch": 5994} {"train_loss": -27.1549072265625, "global_step": 497554, "epoch": 5994} {"train_loss": -27.616849899291992, "global_step": 497555, "epoch": 5994} {"train_loss": -27.681522369384766, "global_step": 497556, "epoch": 5994} {"train_loss": -27.159290313720703, "global_step": 497557, "epoch": 5994} {"train_loss": -27.7231502532959, "global_step": 497558, "epoch": 5994} {"train_loss": -27.296161651611328, "global_step": 497559, "epoch": 5994} {"train_loss": -27.319080352783203, "global_step": 497560, "epoch": 5994} {"train_loss": -26.863306045532227, "global_step": 497561, "epoch": 5994} {"train_loss": -27.535999298095703, "global_step": 497562, "epoch": 5994} {"train_loss": -27.66596031188965, "global_step": 497563, "epoch": 5994} {"train_loss": -27.051450729370117, "global_step": 497564, "epoch": 5994} {"train_loss": -27.598175048828125, "global_step": 497565, "epoch": 5994} {"train_loss": -27.459644317626953, "global_step": 497566, "epoch": 5994} {"train_loss": -27.257537841796875, "global_step": 497567, "epoch": 5994} {"train_loss": -27.44993019104004, "global_step": 497568, "epoch": 5994} {"train_loss": -27.558435440063477, "global_step": 497569, "epoch": 5994} {"train_loss": -27.380172729492188, "global_step": 497570, "epoch": 5994} {"train_loss": -27.46491050720215, "global_step": 497571, "epoch": 5994} {"train_loss": -27.014667510986328, "global_step": 497572, "epoch": 5994} {"train_loss": -27.55083656311035, "global_step": 497573, "epoch": 5994} {"train_loss": -27.129560470581055, "global_step": 497574, "epoch": 5994} {"train_loss": -27.430099487304688, "global_step": 497575, "epoch": 5994} {"train_loss": -27.580642700195312, "global_step": 497576, "epoch": 5994} {"train_loss": -27.397205352783203, "global_step": 497577, "epoch": 5994} {"train_loss": -27.50858497619629, "global_step": 497578, "epoch": 5994} {"train_loss": -27.6190185546875, "global_step": 497579, "epoch": 5994} {"train_loss": -27.6291561126709, "global_step": 497580, "epoch": 5994} {"train_loss": -27.820722579956055, "global_step": 497581, "epoch": 5994} {"train_loss": -27.504974365234375, "global_step": 497582, "epoch": 5994} {"train_loss": -27.400848388671875, "global_step": 497583, "epoch": 5994} {"train_loss": -27.261610697550946, "global_step": 497584, "epoch": 5994, "val_loss": 6607457.0} {"train_loss": -26.763065338134766, "global_step": 497585, "epoch": 5995} {"train_loss": -26.695764541625977, "global_step": 497586, "epoch": 5995} {"train_loss": -26.823379516601562, "global_step": 497587, "epoch": 5995} {"train_loss": -27.176427841186523, "global_step": 497588, "epoch": 5995} {"train_loss": -27.027942657470703, "global_step": 497589, "epoch": 5995} {"train_loss": -27.474288940429688, "global_step": 497590, "epoch": 5995} {"train_loss": -27.364151000976562, "global_step": 497591, "epoch": 5995} {"train_loss": -26.948535919189453, "global_step": 497592, "epoch": 5995} {"train_loss": -27.410995483398438, "global_step": 497593, "epoch": 5995} {"train_loss": -27.792505264282227, "global_step": 497594, "epoch": 5995} {"train_loss": -27.609167098999023, "global_step": 497595, "epoch": 5995} {"train_loss": -26.805280685424805, "global_step": 497596, "epoch": 5995} {"train_loss": -27.021453857421875, "global_step": 497597, "epoch": 5995} {"train_loss": -27.06626319885254, "global_step": 497598, "epoch": 5995} {"train_loss": -26.992273330688477, "global_step": 497599, "epoch": 5995} {"train_loss": -26.949506759643555, "global_step": 497600, "epoch": 5995} {"train_loss": -27.54281997680664, "global_step": 497601, "epoch": 5995} {"train_loss": -27.58363914489746, "global_step": 497602, "epoch": 5995} {"train_loss": -27.08108901977539, "global_step": 497603, "epoch": 5995} {"train_loss": -27.863651275634766, "global_step": 497604, "epoch": 5995} {"train_loss": -27.26108741760254, "global_step": 497605, "epoch": 5995} {"train_loss": -27.38633155822754, "global_step": 497606, "epoch": 5995} {"train_loss": -27.4031982421875, "global_step": 497607, "epoch": 5995} {"train_loss": -26.978992462158203, "global_step": 497608, "epoch": 5995} {"train_loss": -27.205066680908203, "global_step": 497609, "epoch": 5995} {"train_loss": -27.2404842376709, "global_step": 497610, "epoch": 5995} {"train_loss": -27.509275436401367, "global_step": 497611, "epoch": 5995} {"train_loss": -27.339651107788086, "global_step": 497612, "epoch": 5995} {"train_loss": -27.196096420288086, "global_step": 497613, "epoch": 5995} {"train_loss": -27.4658145904541, "global_step": 497614, "epoch": 5995} {"train_loss": -27.228025436401367, "global_step": 497615, "epoch": 5995} {"train_loss": -27.631256103515625, "global_step": 497616, "epoch": 5995} {"train_loss": -27.402204513549805, "global_step": 497617, "epoch": 5995} {"train_loss": -27.823474884033203, "global_step": 497618, "epoch": 5995} {"train_loss": -27.4357967376709, "global_step": 497619, "epoch": 5995} {"train_loss": -27.660978317260742, "global_step": 497620, "epoch": 5995} {"train_loss": -27.382246017456055, "global_step": 497621, "epoch": 5995} {"train_loss": -27.429296493530273, "global_step": 497622, "epoch": 5995} {"train_loss": -27.5555419921875, "global_step": 497623, "epoch": 5995} {"train_loss": -27.3519287109375, "global_step": 497624, "epoch": 5995} {"train_loss": -27.7940673828125, "global_step": 497625, "epoch": 5995} {"train_loss": -27.84564781188965, "global_step": 497626, "epoch": 5995} {"train_loss": -27.167652130126953, "global_step": 497627, "epoch": 5995} {"train_loss": -27.58839225769043, "global_step": 497628, "epoch": 5995} {"train_loss": -27.535898208618164, "global_step": 497629, "epoch": 5995} {"train_loss": -28.047094345092773, "global_step": 497630, "epoch": 5995} {"train_loss": -27.725980758666992, "global_step": 497631, "epoch": 5995} {"train_loss": -27.86496353149414, "global_step": 497632, "epoch": 5995} {"train_loss": -27.80727195739746, "global_step": 497633, "epoch": 5995} {"train_loss": -27.696226119995117, "global_step": 497634, "epoch": 5995} {"train_loss": -27.541187286376953, "global_step": 497635, "epoch": 5995} {"train_loss": -27.6679744720459, "global_step": 497636, "epoch": 5995} {"train_loss": -27.4669189453125, "global_step": 497637, "epoch": 5995} {"train_loss": -27.656042098999023, "global_step": 497638, "epoch": 5995} {"train_loss": -27.79859733581543, "global_step": 497639, "epoch": 5995} {"train_loss": -27.350509643554688, "global_step": 497640, "epoch": 5995} {"train_loss": -27.517541885375977, "global_step": 497641, "epoch": 5995} {"train_loss": -27.9697208404541, "global_step": 497642, "epoch": 5995} {"train_loss": -27.50444984436035, "global_step": 497643, "epoch": 5995} {"train_loss": -27.51666831970215, "global_step": 497644, "epoch": 5995} {"train_loss": -27.54768180847168, "global_step": 497645, "epoch": 5995} {"train_loss": -27.556196212768555, "global_step": 497646, "epoch": 5995} {"train_loss": -27.17096519470215, "global_step": 497647, "epoch": 5995} {"train_loss": -27.210046768188477, "global_step": 497648, "epoch": 5995} {"train_loss": -27.320281982421875, "global_step": 497649, "epoch": 5995} {"train_loss": -27.745807647705078, "global_step": 497650, "epoch": 5995} {"train_loss": -27.349594116210938, "global_step": 497651, "epoch": 5995} {"train_loss": -27.454608917236328, "global_step": 497652, "epoch": 5995} {"train_loss": -27.484235763549805, "global_step": 497653, "epoch": 5995} {"train_loss": -27.14815330505371, "global_step": 497654, "epoch": 5995} {"train_loss": -27.54243278503418, "global_step": 497655, "epoch": 5995} {"train_loss": -27.177825927734375, "global_step": 497656, "epoch": 5995} {"train_loss": -27.028583526611328, "global_step": 497657, "epoch": 5995} {"train_loss": -27.015548706054688, "global_step": 497658, "epoch": 5995} {"train_loss": -27.262664794921875, "global_step": 497659, "epoch": 5995} {"train_loss": -27.161142349243164, "global_step": 497660, "epoch": 5995} {"train_loss": -26.90433692932129, "global_step": 497661, "epoch": 5995} {"train_loss": -27.388473510742188, "global_step": 497662, "epoch": 5995} {"train_loss": -27.197797775268555, "global_step": 497663, "epoch": 5995} {"train_loss": -27.550312042236328, "global_step": 497664, "epoch": 5995} {"train_loss": -27.28618812561035, "global_step": 497665, "epoch": 5995} {"train_loss": -27.35749626159668, "global_step": 497666, "epoch": 5995} {"train_loss": -27.395328866430077, "global_step": 497667, "epoch": 5995, "val_loss": 6648692.5} {"train_loss": -26.510116577148438, "global_step": 497668, "epoch": 5996} {"train_loss": -26.63942527770996, "global_step": 497669, "epoch": 5996} {"train_loss": -26.296995162963867, "global_step": 497670, "epoch": 5996} {"train_loss": -26.553464889526367, "global_step": 497671, "epoch": 5996} {"train_loss": -26.931964874267578, "global_step": 497672, "epoch": 5996} {"train_loss": -26.660079956054688, "global_step": 497673, "epoch": 5996} {"train_loss": -26.570728302001953, "global_step": 497674, "epoch": 5996} {"train_loss": -26.842731475830078, "global_step": 497675, "epoch": 5996} {"train_loss": -26.948347091674805, "global_step": 497676, "epoch": 5996} {"train_loss": -26.96588134765625, "global_step": 497677, "epoch": 5996} {"train_loss": -26.61054801940918, "global_step": 497678, "epoch": 5996} {"train_loss": -27.160327911376953, "global_step": 497679, "epoch": 5996} {"train_loss": -27.025772094726562, "global_step": 497680, "epoch": 5996} {"train_loss": -27.106815338134766, "global_step": 497681, "epoch": 5996} {"train_loss": -26.567731857299805, "global_step": 497682, "epoch": 5996} {"train_loss": -27.108423233032227, "global_step": 497683, "epoch": 5996} {"train_loss": -26.760223388671875, "global_step": 497684, "epoch": 5996} {"train_loss": -27.273832321166992, "global_step": 497685, "epoch": 5996} {"train_loss": -26.908512115478516, "global_step": 497686, "epoch": 5996} {"train_loss": -26.750534057617188, "global_step": 497687, "epoch": 5996} {"train_loss": -27.15691566467285, "global_step": 497688, "epoch": 5996} {"train_loss": -26.6025447845459, "global_step": 497689, "epoch": 5996} {"train_loss": -27.29014015197754, "global_step": 497690, "epoch": 5996} {"train_loss": -26.999082565307617, "global_step": 497691, "epoch": 5996} {"train_loss": -27.192453384399414, "global_step": 497692, "epoch": 5996} {"train_loss": -26.993972778320312, "global_step": 497693, "epoch": 5996} {"train_loss": -27.2620849609375, "global_step": 497694, "epoch": 5996} {"train_loss": -27.030553817749023, "global_step": 497695, "epoch": 5996} {"train_loss": -27.7860164642334, "global_step": 497696, "epoch": 5996} {"train_loss": -27.226648330688477, "global_step": 497697, "epoch": 5996} {"train_loss": -27.408924102783203, "global_step": 497698, "epoch": 5996} {"train_loss": -27.436445236206055, "global_step": 497699, "epoch": 5996} {"train_loss": -27.443525314331055, "global_step": 497700, "epoch": 5996} {"train_loss": -27.011816024780273, "global_step": 497701, "epoch": 5996} {"train_loss": -27.49326515197754, "global_step": 497702, "epoch": 5996} {"train_loss": -27.290241241455078, "global_step": 497703, "epoch": 5996} {"train_loss": -27.264026641845703, "global_step": 497704, "epoch": 5996} {"train_loss": -27.419193267822266, "global_step": 497705, "epoch": 5996} {"train_loss": -27.39666175842285, "global_step": 497706, "epoch": 5996} {"train_loss": -27.68766212463379, "global_step": 497707, "epoch": 5996} {"train_loss": -27.158344268798828, "global_step": 497708, "epoch": 5996} {"train_loss": -27.665769577026367, "global_step": 497709, "epoch": 5996} {"train_loss": -27.45221519470215, "global_step": 497710, "epoch": 5996} {"train_loss": -27.6198787689209, "global_step": 497711, "epoch": 5996} {"train_loss": -27.651212692260742, "global_step": 497712, "epoch": 5996} {"train_loss": -27.73848533630371, "global_step": 497713, "epoch": 5996} {"train_loss": -27.390966415405273, "global_step": 497714, "epoch": 5996} {"train_loss": -27.140491485595703, "global_step": 497715, "epoch": 5996} {"train_loss": -27.30299186706543, "global_step": 497716, "epoch": 5996} {"train_loss": -27.430444717407227, "global_step": 497717, "epoch": 5996} {"train_loss": -27.354761123657227, "global_step": 497718, "epoch": 5996} {"train_loss": -27.54878807067871, "global_step": 497719, "epoch": 5996} {"train_loss": -27.676618576049805, "global_step": 497720, "epoch": 5996} {"train_loss": -27.595495223999023, "global_step": 497721, "epoch": 5996} {"train_loss": -27.4201717376709, "global_step": 497722, "epoch": 5996} {"train_loss": -27.434528350830078, "global_step": 497723, "epoch": 5996} {"train_loss": -27.44110679626465, "global_step": 497724, "epoch": 5996} {"train_loss": -27.452259063720703, "global_step": 497725, "epoch": 5996} {"train_loss": -27.24881935119629, "global_step": 497726, "epoch": 5996} {"train_loss": -27.575393676757812, "global_step": 497727, "epoch": 5996} {"train_loss": -27.663843154907227, "global_step": 497728, "epoch": 5996} {"train_loss": -27.177352905273438, "global_step": 497729, "epoch": 5996} {"train_loss": -27.566394805908203, "global_step": 497730, "epoch": 5996} {"train_loss": -27.347070693969727, "global_step": 497731, "epoch": 5996} {"train_loss": -27.092844009399414, "global_step": 497732, "epoch": 5996} {"train_loss": -27.556909561157227, "global_step": 497733, "epoch": 5996} {"train_loss": -27.27203369140625, "global_step": 497734, "epoch": 5996} {"train_loss": -27.13361930847168, "global_step": 497735, "epoch": 5996} {"train_loss": -27.650165557861328, "global_step": 497736, "epoch": 5996} {"train_loss": -27.5272159576416, "global_step": 497737, "epoch": 5996} {"train_loss": -27.365314483642578, "global_step": 497738, "epoch": 5996} {"train_loss": -27.23078727722168, "global_step": 497739, "epoch": 5996} {"train_loss": -27.072036743164062, "global_step": 497740, "epoch": 5996} {"train_loss": -26.93023681640625, "global_step": 497741, "epoch": 5996} {"train_loss": -27.23849868774414, "global_step": 497742, "epoch": 5996} {"train_loss": -27.632429122924805, "global_step": 497743, "epoch": 5996} {"train_loss": -27.229562759399414, "global_step": 497744, "epoch": 5996} {"train_loss": -27.157072067260742, "global_step": 497745, "epoch": 5996} {"train_loss": -26.957868576049805, "global_step": 497746, "epoch": 5996} {"train_loss": -27.455663681030273, "global_step": 497747, "epoch": 5996} {"train_loss": -27.03556251525879, "global_step": 497748, "epoch": 5996} {"train_loss": -27.255781173706055, "global_step": 497749, "epoch": 5996} {"train_loss": -27.21531334842544, "global_step": 497750, "epoch": 5996, "val_loss": 6493624.0} {"train_loss": -26.924081802368164, "global_step": 497751, "epoch": 5997} {"train_loss": -26.367177963256836, "global_step": 497752, "epoch": 5997} {"train_loss": -27.261703491210938, "global_step": 497753, "epoch": 5997} {"train_loss": -26.83272361755371, "global_step": 497754, "epoch": 5997} {"train_loss": -26.28080177307129, "global_step": 497755, "epoch": 5997} {"train_loss": -27.258609771728516, "global_step": 497756, "epoch": 5997} {"train_loss": -26.7430362701416, "global_step": 497757, "epoch": 5997} {"train_loss": -26.779529571533203, "global_step": 497758, "epoch": 5997} {"train_loss": -27.216413497924805, "global_step": 497759, "epoch": 5997} {"train_loss": -26.8116512298584, "global_step": 497760, "epoch": 5997} {"train_loss": -26.817731857299805, "global_step": 497761, "epoch": 5997} {"train_loss": -27.29483413696289, "global_step": 497762, "epoch": 5997} {"train_loss": -27.216760635375977, "global_step": 497763, "epoch": 5997} {"train_loss": -27.033597946166992, "global_step": 497764, "epoch": 5997} {"train_loss": -27.048206329345703, "global_step": 497765, "epoch": 5997} {"train_loss": -27.082977294921875, "global_step": 497766, "epoch": 5997} {"train_loss": -27.4624080657959, "global_step": 497767, "epoch": 5997} {"train_loss": -26.950641632080078, "global_step": 497768, "epoch": 5997} {"train_loss": -27.149993896484375, "global_step": 497769, "epoch": 5997} {"train_loss": -27.342090606689453, "global_step": 497770, "epoch": 5997} {"train_loss": -27.293664932250977, "global_step": 497771, "epoch": 5997} {"train_loss": -27.370513916015625, "global_step": 497772, "epoch": 5997} {"train_loss": -27.365163803100586, "global_step": 497773, "epoch": 5997} {"train_loss": -27.07452392578125, "global_step": 497774, "epoch": 5997} {"train_loss": -27.357145309448242, "global_step": 497775, "epoch": 5997} {"train_loss": -27.101699829101562, "global_step": 497776, "epoch": 5997} {"train_loss": -27.097761154174805, "global_step": 497777, "epoch": 5997} {"train_loss": -27.083255767822266, "global_step": 497778, "epoch": 5997} {"train_loss": -27.270599365234375, "global_step": 497779, "epoch": 5997} {"train_loss": -27.075428009033203, "global_step": 497780, "epoch": 5997} {"train_loss": -27.100086212158203, "global_step": 497781, "epoch": 5997} {"train_loss": -27.78230094909668, "global_step": 497782, "epoch": 5997} {"train_loss": -27.726831436157227, "global_step": 497783, "epoch": 5997} {"train_loss": -27.381427764892578, "global_step": 497784, "epoch": 5997} {"train_loss": -27.544052124023438, "global_step": 497785, "epoch": 5997} {"train_loss": -27.50786781311035, "global_step": 497786, "epoch": 5997} {"train_loss": -27.23495864868164, "global_step": 497787, "epoch": 5997} {"train_loss": -27.311437606811523, "global_step": 497788, "epoch": 5997} {"train_loss": -27.411813735961914, "global_step": 497789, "epoch": 5997} {"train_loss": -27.593826293945312, "global_step": 497790, "epoch": 5997} {"train_loss": -27.54339027404785, "global_step": 497791, "epoch": 5997} {"train_loss": -27.614511489868164, "global_step": 497792, "epoch": 5997} {"train_loss": -27.557523727416992, "global_step": 497793, "epoch": 5997} {"train_loss": -27.571386337280273, "global_step": 497794, "epoch": 5997} {"train_loss": -27.425397872924805, "global_step": 497795, "epoch": 5997} {"train_loss": -27.231908798217773, "global_step": 497796, "epoch": 5997} {"train_loss": -27.67435646057129, "global_step": 497797, "epoch": 5997} {"train_loss": -27.430469512939453, "global_step": 497798, "epoch": 5997} {"train_loss": -27.415430068969727, "global_step": 497799, "epoch": 5997} {"train_loss": -27.53335952758789, "global_step": 497800, "epoch": 5997} {"train_loss": -27.42127799987793, "global_step": 497801, "epoch": 5997} {"train_loss": -27.27225685119629, "global_step": 497802, "epoch": 5997} {"train_loss": -27.743505477905273, "global_step": 497803, "epoch": 5997} {"train_loss": -27.544950485229492, "global_step": 497804, "epoch": 5997} {"train_loss": -27.4190731048584, "global_step": 497805, "epoch": 5997} {"train_loss": -26.9163875579834, "global_step": 497806, "epoch": 5997} {"train_loss": -26.919721603393555, "global_step": 497807, "epoch": 5997} {"train_loss": -26.814374923706055, "global_step": 497808, "epoch": 5997} {"train_loss": -27.529678344726562, "global_step": 497809, "epoch": 5997} {"train_loss": -26.821073532104492, "global_step": 497810, "epoch": 5997} {"train_loss": -27.122238159179688, "global_step": 497811, "epoch": 5997} {"train_loss": -27.165136337280273, "global_step": 497812, "epoch": 5997} {"train_loss": -26.912830352783203, "global_step": 497813, "epoch": 5997} {"train_loss": -27.373144149780273, "global_step": 497814, "epoch": 5997} {"train_loss": -27.430755615234375, "global_step": 497815, "epoch": 5997} {"train_loss": -27.405670166015625, "global_step": 497816, "epoch": 5997} {"train_loss": -27.105154037475586, "global_step": 497817, "epoch": 5997} {"train_loss": -27.7254695892334, "global_step": 497818, "epoch": 5997} {"train_loss": -26.92168617248535, "global_step": 497819, "epoch": 5997} {"train_loss": -27.45223045349121, "global_step": 497820, "epoch": 5997} {"train_loss": -27.46662712097168, "global_step": 497821, "epoch": 5997} {"train_loss": -27.789255142211914, "global_step": 497822, "epoch": 5997} {"train_loss": -27.599533081054688, "global_step": 497823, "epoch": 5997} {"train_loss": -27.35283851623535, "global_step": 497824, "epoch": 5997} {"train_loss": -27.41840934753418, "global_step": 497825, "epoch": 5997} {"train_loss": -27.400959014892578, "global_step": 497826, "epoch": 5997} {"train_loss": -27.37554359436035, "global_step": 497827, "epoch": 5997} {"train_loss": -27.360090255737305, "global_step": 497828, "epoch": 5997} {"train_loss": -27.626508712768555, "global_step": 497829, "epoch": 5997} {"train_loss": -27.29363441467285, "global_step": 497830, "epoch": 5997} {"train_loss": -27.233366012573242, "global_step": 497831, "epoch": 5997} {"train_loss": -27.35761070251465, "global_step": 497832, "epoch": 5997} {"train_loss": -27.261256574148156, "global_step": 497833, "epoch": 5997, "val_loss": 6557807.5} {"train_loss": -26.77265739440918, "global_step": 497834, "epoch": 5998} {"train_loss": -26.476194381713867, "global_step": 497835, "epoch": 5998} {"train_loss": -27.279977798461914, "global_step": 497836, "epoch": 5998} {"train_loss": -26.749231338500977, "global_step": 497837, "epoch": 5998} {"train_loss": -26.55696678161621, "global_step": 497838, "epoch": 5998} {"train_loss": -26.820404052734375, "global_step": 497839, "epoch": 5998} {"train_loss": -26.935293197631836, "global_step": 497840, "epoch": 5998} {"train_loss": -26.9041748046875, "global_step": 497841, "epoch": 5998} {"train_loss": -26.89859962463379, "global_step": 497842, "epoch": 5998} {"train_loss": -27.103260040283203, "global_step": 497843, "epoch": 5998} {"train_loss": -26.9123592376709, "global_step": 497844, "epoch": 5998} {"train_loss": -27.05327796936035, "global_step": 497845, "epoch": 5998} {"train_loss": -27.34480094909668, "global_step": 497846, "epoch": 5998} {"train_loss": -27.02467155456543, "global_step": 497847, "epoch": 5998} {"train_loss": -27.154199600219727, "global_step": 497848, "epoch": 5998} {"train_loss": -27.158863067626953, "global_step": 497849, "epoch": 5998} {"train_loss": -27.515762329101562, "global_step": 497850, "epoch": 5998} {"train_loss": -27.278701782226562, "global_step": 497851, "epoch": 5998} {"train_loss": -27.198688507080078, "global_step": 497852, "epoch": 5998} {"train_loss": -27.23377799987793, "global_step": 497853, "epoch": 5998} {"train_loss": -27.286468505859375, "global_step": 497854, "epoch": 5998} {"train_loss": -27.249998092651367, "global_step": 497855, "epoch": 5998} {"train_loss": -26.89303970336914, "global_step": 497856, "epoch": 5998} {"train_loss": -27.408002853393555, "global_step": 497857, "epoch": 5998} {"train_loss": -27.440509796142578, "global_step": 497858, "epoch": 5998} {"train_loss": -27.185422897338867, "global_step": 497859, "epoch": 5998} {"train_loss": -27.148334503173828, "global_step": 497860, "epoch": 5998} {"train_loss": -27.13783073425293, "global_step": 497861, "epoch": 5998} {"train_loss": -27.33890151977539, "global_step": 497862, "epoch": 5998} {"train_loss": -26.983718872070312, "global_step": 497863, "epoch": 5998} {"train_loss": -27.33380699157715, "global_step": 497864, "epoch": 5998} {"train_loss": -27.187299728393555, "global_step": 497865, "epoch": 5998} {"train_loss": -27.397674560546875, "global_step": 497866, "epoch": 5998} {"train_loss": -27.237689971923828, "global_step": 497867, "epoch": 5998} {"train_loss": -27.161956787109375, "global_step": 497868, "epoch": 5998} {"train_loss": -27.098907470703125, "global_step": 497869, "epoch": 5998} {"train_loss": -27.493518829345703, "global_step": 497870, "epoch": 5998} {"train_loss": -26.955921173095703, "global_step": 497871, "epoch": 5998} {"train_loss": -27.15168571472168, "global_step": 497872, "epoch": 5998} {"train_loss": -27.19952964782715, "global_step": 497873, "epoch": 5998} {"train_loss": -27.333560943603516, "global_step": 497874, "epoch": 5998} {"train_loss": -27.07740592956543, "global_step": 497875, "epoch": 5998} {"train_loss": -27.475421905517578, "global_step": 497876, "epoch": 5998} {"train_loss": -27.158069610595703, "global_step": 497877, "epoch": 5998} {"train_loss": -27.191038131713867, "global_step": 497878, "epoch": 5998} {"train_loss": -27.47541618347168, "global_step": 497879, "epoch": 5998} {"train_loss": -27.105575561523438, "global_step": 497880, "epoch": 5998} {"train_loss": -27.639728546142578, "global_step": 497881, "epoch": 5998} {"train_loss": -27.575895309448242, "global_step": 497882, "epoch": 5998} {"train_loss": -27.4296932220459, "global_step": 497883, "epoch": 5998} {"train_loss": -27.488656997680664, "global_step": 497884, "epoch": 5998} {"train_loss": -27.520755767822266, "global_step": 497885, "epoch": 5998} {"train_loss": -27.24977684020996, "global_step": 497886, "epoch": 5998} {"train_loss": -27.249267578125, "global_step": 497887, "epoch": 5998} {"train_loss": -27.20987892150879, "global_step": 497888, "epoch": 5998} {"train_loss": -27.779233932495117, "global_step": 497889, "epoch": 5998} {"train_loss": -27.181964874267578, "global_step": 497890, "epoch": 5998} {"train_loss": -27.550464630126953, "global_step": 497891, "epoch": 5998} {"train_loss": -27.651418685913086, "global_step": 497892, "epoch": 5998} {"train_loss": -27.437314987182617, "global_step": 497893, "epoch": 5998} {"train_loss": -27.5350284576416, "global_step": 497894, "epoch": 5998} {"train_loss": -27.65069007873535, "global_step": 497895, "epoch": 5998} {"train_loss": -27.270706176757812, "global_step": 497896, "epoch": 5998} {"train_loss": -27.57988929748535, "global_step": 497897, "epoch": 5998} {"train_loss": -27.480274200439453, "global_step": 497898, "epoch": 5998} {"train_loss": -27.249624252319336, "global_step": 497899, "epoch": 5998} {"train_loss": -27.638303756713867, "global_step": 497900, "epoch": 5998} {"train_loss": -27.412673950195312, "global_step": 497901, "epoch": 5998} {"train_loss": -27.449756622314453, "global_step": 497902, "epoch": 5998} {"train_loss": -27.55478286743164, "global_step": 497903, "epoch": 5998} {"train_loss": -27.87869644165039, "global_step": 497904, "epoch": 5998} {"train_loss": -27.620710372924805, "global_step": 497905, "epoch": 5998} {"train_loss": -27.523517608642578, "global_step": 497906, "epoch": 5998} {"train_loss": -27.5828857421875, "global_step": 497907, "epoch": 5998} {"train_loss": -27.6146240234375, "global_step": 497908, "epoch": 5998} {"train_loss": -27.68564796447754, "global_step": 497909, "epoch": 5998} {"train_loss": -27.5218505859375, "global_step": 497910, "epoch": 5998} {"train_loss": -27.72037696838379, "global_step": 497911, "epoch": 5998} {"train_loss": -27.243793487548828, "global_step": 497912, "epoch": 5998} {"train_loss": -27.571582794189453, "global_step": 497913, "epoch": 5998} {"train_loss": -27.5235652923584, "global_step": 497914, "epoch": 5998} {"train_loss": -27.704898834228516, "global_step": 497915, "epoch": 5998} {"train_loss": -27.30067597814353, "global_step": 497916, "epoch": 5998, "val_loss": 6623393.0} {"train_loss": -26.822036743164062, "global_step": 497917, "epoch": 5999} {"train_loss": -26.3712158203125, "global_step": 497918, "epoch": 5999} {"train_loss": -25.09769058227539, "global_step": 497919, "epoch": 5999} {"train_loss": -24.735092163085938, "global_step": 497920, "epoch": 5999} {"train_loss": -25.06962013244629, "global_step": 497921, "epoch": 5999} {"train_loss": -25.1671142578125, "global_step": 497922, "epoch": 5999} {"train_loss": -25.307716369628906, "global_step": 497923, "epoch": 5999} {"train_loss": -26.49466896057129, "global_step": 497924, "epoch": 5999} {"train_loss": -25.593015670776367, "global_step": 497925, "epoch": 5999} {"train_loss": -26.86417007446289, "global_step": 497926, "epoch": 5999} {"train_loss": -25.904743194580078, "global_step": 497927, "epoch": 5999} {"train_loss": -26.484699249267578, "global_step": 497928, "epoch": 5999} {"train_loss": -26.40581703186035, "global_step": 497929, "epoch": 5999} {"train_loss": -26.649667739868164, "global_step": 497930, "epoch": 5999} {"train_loss": -26.366186141967773, "global_step": 497931, "epoch": 5999} {"train_loss": -26.669050216674805, "global_step": 497932, "epoch": 5999} {"train_loss": -27.025100708007812, "global_step": 497933, "epoch": 5999} {"train_loss": -26.672147750854492, "global_step": 497934, "epoch": 5999} {"train_loss": -26.635953903198242, "global_step": 497935, "epoch": 5999} {"train_loss": -26.918701171875, "global_step": 497936, "epoch": 5999} {"train_loss": -27.06846046447754, "global_step": 497937, "epoch": 5999} {"train_loss": -27.18292808532715, "global_step": 497938, "epoch": 5999} {"train_loss": -27.114151000976562, "global_step": 497939, "epoch": 5999} {"train_loss": -26.764463424682617, "global_step": 497940, "epoch": 5999} {"train_loss": -27.0566463470459, "global_step": 497941, "epoch": 5999} {"train_loss": -26.694562911987305, "global_step": 497942, "epoch": 5999} {"train_loss": -26.929859161376953, "global_step": 497943, "epoch": 5999} {"train_loss": -26.979333877563477, "global_step": 497944, "epoch": 5999} {"train_loss": -27.028076171875, "global_step": 497945, "epoch": 5999} {"train_loss": -27.169279098510742, "global_step": 497946, "epoch": 5999} {"train_loss": -26.9652099609375, "global_step": 497947, "epoch": 5999} {"train_loss": -27.277612686157227, "global_step": 497948, "epoch": 5999} {"train_loss": -27.010089874267578, "global_step": 497949, "epoch": 5999} {"train_loss": -27.3572940826416, "global_step": 497950, "epoch": 5999} {"train_loss": -26.839292526245117, "global_step": 497951, "epoch": 5999} {"train_loss": -27.053037643432617, "global_step": 497952, "epoch": 5999} {"train_loss": -27.194692611694336, "global_step": 497953, "epoch": 5999} {"train_loss": -27.251768112182617, "global_step": 497954, "epoch": 5999} {"train_loss": -27.257465362548828, "global_step": 497955, "epoch": 5999} {"train_loss": -27.298734664916992, "global_step": 497956, "epoch": 5999} {"train_loss": -27.463621139526367, "global_step": 497957, "epoch": 5999} {"train_loss": -27.31715202331543, "global_step": 497958, "epoch": 5999} {"train_loss": -27.402942657470703, "global_step": 497959, "epoch": 5999} {"train_loss": -27.445249557495117, "global_step": 497960, "epoch": 5999} {"train_loss": -27.272186279296875, "global_step": 497961, "epoch": 5999} {"train_loss": -27.375518798828125, "global_step": 497962, "epoch": 5999} {"train_loss": -27.456775665283203, "global_step": 497963, "epoch": 5999} {"train_loss": -27.76078224182129, "global_step": 497964, "epoch": 5999} {"train_loss": -27.62672233581543, "global_step": 497965, "epoch": 5999} {"train_loss": -27.388891220092773, "global_step": 497966, "epoch": 5999} {"train_loss": -27.459558486938477, "global_step": 497967, "epoch": 5999} {"train_loss": -27.532867431640625, "global_step": 497968, "epoch": 5999} {"train_loss": -27.54682731628418, "global_step": 497969, "epoch": 5999} {"train_loss": -27.80204200744629, "global_step": 497970, "epoch": 5999} {"train_loss": -27.393665313720703, "global_step": 497971, "epoch": 5999} {"train_loss": -27.388303756713867, "global_step": 497972, "epoch": 5999} {"train_loss": -27.678564071655273, "global_step": 497973, "epoch": 5999} {"train_loss": -27.2860107421875, "global_step": 497974, "epoch": 5999} {"train_loss": -27.48712158203125, "global_step": 497975, "epoch": 5999} {"train_loss": -27.673919677734375, "global_step": 497976, "epoch": 5999} {"train_loss": -27.968671798706055, "global_step": 497977, "epoch": 5999} {"train_loss": -27.58611488342285, "global_step": 497978, "epoch": 5999} {"train_loss": -27.46746826171875, "global_step": 497979, "epoch": 5999} {"train_loss": -27.448394775390625, "global_step": 497980, "epoch": 5999} {"train_loss": -27.448810577392578, "global_step": 497981, "epoch": 5999} {"train_loss": -27.345937728881836, "global_step": 497982, "epoch": 5999} {"train_loss": -27.23164176940918, "global_step": 497983, "epoch": 5999} {"train_loss": -27.819793701171875, "global_step": 497984, "epoch": 5999} {"train_loss": -27.387128829956055, "global_step": 497985, "epoch": 5999} {"train_loss": -27.93283462524414, "global_step": 497986, "epoch": 5999} {"train_loss": -27.208837509155273, "global_step": 497987, "epoch": 5999} {"train_loss": -27.940149307250977, "global_step": 497988, "epoch": 5999} {"train_loss": -27.555875778198242, "global_step": 497989, "epoch": 5999} {"train_loss": -27.80243492126465, "global_step": 497990, "epoch": 5999} {"train_loss": -27.607177734375, "global_step": 497991, "epoch": 5999} {"train_loss": -27.749128341674805, "global_step": 497992, "epoch": 5999} {"train_loss": -27.256437301635742, "global_step": 497993, "epoch": 5999} {"train_loss": -27.91143226623535, "global_step": 497994, "epoch": 5999} {"train_loss": -27.8824405670166, "global_step": 497995, "epoch": 5999} {"train_loss": -27.596485137939453, "global_step": 497996, "epoch": 5999} {"train_loss": -27.102689743041992, "global_step": 497997, "epoch": 5999} {"train_loss": -26.968341827392578, "global_step": 497998, "epoch": 5999} {"train_loss": -27.079127897699195, "global_step": 497999, "epoch": 5999, "val_loss": 6599180.0} {"train_loss": -22.244321823120117, "global_step": 498000, "epoch": 6000} {"train_loss": -20.897464752197266, "global_step": 498001, "epoch": 6000} {"train_loss": -24.52427101135254, "global_step": 498002, "epoch": 6000} {"train_loss": -23.98602294921875, "global_step": 498003, "epoch": 6000} {"train_loss": -24.331533432006836, "global_step": 498004, "epoch": 6000} {"train_loss": -24.912172317504883, "global_step": 498005, "epoch": 6000} {"train_loss": -25.38629722595215, "global_step": 498006, "epoch": 6000} {"train_loss": -24.89838218688965, "global_step": 498007, "epoch": 6000} {"train_loss": -25.50884437561035, "global_step": 498008, "epoch": 6000} {"train_loss": -25.45124626159668, "global_step": 498009, "epoch": 6000} {"train_loss": -25.161684036254883, "global_step": 498010, "epoch": 6000} {"train_loss": -25.423477172851562, "global_step": 498011, "epoch": 6000} {"train_loss": -25.59476089477539, "global_step": 498012, "epoch": 6000} {"train_loss": -25.928884506225586, "global_step": 498013, "epoch": 6000} {"train_loss": -26.05214500427246, "global_step": 498014, "epoch": 6000} {"train_loss": -25.263866424560547, "global_step": 498015, "epoch": 6000} {"train_loss": -25.73695945739746, "global_step": 498016, "epoch": 6000} {"train_loss": -25.8297119140625, "global_step": 498017, "epoch": 6000} {"train_loss": -26.41450309753418, "global_step": 498018, "epoch": 6000} {"train_loss": -25.868803024291992, "global_step": 498019, "epoch": 6000} {"train_loss": -26.269811630249023, "global_step": 498020, "epoch": 6000} {"train_loss": -26.057861328125, "global_step": 498021, "epoch": 6000} {"train_loss": -26.109601974487305, "global_step": 498022, "epoch": 6000} {"train_loss": -26.068592071533203, "global_step": 498023, "epoch": 6000} {"train_loss": -26.51045036315918, "global_step": 498024, "epoch": 6000} {"train_loss": -26.34932518005371, "global_step": 498025, "epoch": 6000} {"train_loss": -26.52121925354004, "global_step": 498026, "epoch": 6000} {"train_loss": -26.4561710357666, "global_step": 498027, "epoch": 6000} {"train_loss": -26.471668243408203, "global_step": 498028, "epoch": 6000} {"train_loss": -26.540502548217773, "global_step": 498029, "epoch": 6000} {"train_loss": -26.36871910095215, "global_step": 498030, "epoch": 6000} {"train_loss": -26.724609375, "global_step": 498031, "epoch": 6000} {"train_loss": -26.478322982788086, "global_step": 498032, "epoch": 6000} {"train_loss": -26.64943504333496, "global_step": 498033, "epoch": 6000} {"train_loss": -26.885700225830078, "global_step": 498034, "epoch": 6000} {"train_loss": -26.839929580688477, "global_step": 498035, "epoch": 6000} {"train_loss": -26.64820671081543, "global_step": 498036, "epoch": 6000} {"train_loss": -27.004758834838867, "global_step": 498037, "epoch": 6000} {"train_loss": -27.128372192382812, "global_step": 498038, "epoch": 6000} {"train_loss": -26.824155807495117, "global_step": 498039, "epoch": 6000} {"train_loss": -26.907123565673828, "global_step": 498040, "epoch": 6000} {"train_loss": -27.060956954956055, "global_step": 498041, "epoch": 6000} {"train_loss": -27.187284469604492, "global_step": 498042, "epoch": 6000} {"train_loss": -27.334003448486328, "global_step": 498043, "epoch": 6000} {"train_loss": -27.1604061126709, "global_step": 498044, "epoch": 6000} {"train_loss": -27.190963745117188, "global_step": 498045, "epoch": 6000} {"train_loss": -27.344837188720703, "global_step": 498046, "epoch": 6000} {"train_loss": -27.376630783081055, "global_step": 498047, "epoch": 6000} {"train_loss": -27.17122459411621, "global_step": 498048, "epoch": 6000} {"train_loss": -26.95356559753418, "global_step": 498049, "epoch": 6000} {"train_loss": -27.00105094909668, "global_step": 498050, "epoch": 6000} {"train_loss": -27.251203536987305, "global_step": 498051, "epoch": 6000} {"train_loss": -27.198810577392578, "global_step": 498052, "epoch": 6000} {"train_loss": -27.204315185546875, "global_step": 498053, "epoch": 6000} {"train_loss": -27.30280113220215, "global_step": 498054, "epoch": 6000} {"train_loss": -26.98850440979004, "global_step": 498055, "epoch": 6000} {"train_loss": -27.34808921813965, "global_step": 498056, "epoch": 6000} {"train_loss": -27.139545440673828, "global_step": 498057, "epoch": 6000} {"train_loss": -27.485937118530273, "global_step": 498058, "epoch": 6000} {"train_loss": -27.42635154724121, "global_step": 498059, "epoch": 6000} {"train_loss": -27.61366081237793, "global_step": 498060, "epoch": 6000} {"train_loss": -27.50819206237793, "global_step": 498061, "epoch": 6000} {"train_loss": -27.315881729125977, "global_step": 498062, "epoch": 6000} {"train_loss": -27.501880645751953, "global_step": 498063, "epoch": 6000} {"train_loss": -27.265277862548828, "global_step": 498064, "epoch": 6000} {"train_loss": -27.28944206237793, "global_step": 498065, "epoch": 6000} {"train_loss": -27.176916122436523, "global_step": 498066, "epoch": 6000} {"train_loss": -27.80838966369629, "global_step": 498067, "epoch": 6000} {"train_loss": -27.02631187438965, "global_step": 498068, "epoch": 6000} {"train_loss": -27.459867477416992, "global_step": 498069, "epoch": 6000} {"train_loss": -27.257205963134766, "global_step": 498070, "epoch": 6000} {"train_loss": -27.418079376220703, "global_step": 498071, "epoch": 6000} {"train_loss": -27.291845321655273, "global_step": 498072, "epoch": 6000} {"train_loss": -27.636295318603516, "global_step": 498073, "epoch": 6000} {"train_loss": -27.438024520874023, "global_step": 498074, "epoch": 6000} {"train_loss": -26.989179611206055, "global_step": 498075, "epoch": 6000} {"train_loss": -27.18031120300293, "global_step": 498076, "epoch": 6000} {"train_loss": -27.572589874267578, "global_step": 498077, "epoch": 6000} {"train_loss": -27.144180297851562, "global_step": 498078, "epoch": 6000} {"train_loss": -27.448312759399414, "global_step": 498079, "epoch": 6000} {"train_loss": -27.251379013061523, "global_step": 498080, "epoch": 6000} {"train_loss": -27.495868682861328, "global_step": 498081, "epoch": 6000} {"train_loss": -26.53816781561059, "global_step": 498082, "epoch": 6000, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.8636363636363636, "val_loss": 6526465.0} {"train_loss": -25.40052604675293, "global_step": 498083, "epoch": 6001} {"train_loss": -25.04506492614746, "global_step": 498084, "epoch": 6001} {"train_loss": -26.34158706665039, "global_step": 498085, "epoch": 6001} {"train_loss": -24.91163444519043, "global_step": 498086, "epoch": 6001} {"train_loss": -25.986684799194336, "global_step": 498087, "epoch": 6001} {"train_loss": -26.14434814453125, "global_step": 498088, "epoch": 6001} {"train_loss": -26.235708236694336, "global_step": 498089, "epoch": 6001} {"train_loss": -25.596771240234375, "global_step": 498090, "epoch": 6001} {"train_loss": -25.894742965698242, "global_step": 498091, "epoch": 6001} {"train_loss": -26.9105167388916, "global_step": 498092, "epoch": 6001} {"train_loss": -26.4088134765625, "global_step": 498093, "epoch": 6001} {"train_loss": -26.396100997924805, "global_step": 498094, "epoch": 6001} {"train_loss": -26.58062744140625, "global_step": 498095, "epoch": 6001} {"train_loss": -26.598913192749023, "global_step": 498096, "epoch": 6001} {"train_loss": -26.516815185546875, "global_step": 498097, "epoch": 6001} {"train_loss": -26.75775718688965, "global_step": 498098, "epoch": 6001} {"train_loss": -26.644439697265625, "global_step": 498099, "epoch": 6001} {"train_loss": -26.79229164123535, "global_step": 498100, "epoch": 6001} {"train_loss": -26.8782958984375, "global_step": 498101, "epoch": 6001} {"train_loss": -26.258319854736328, "global_step": 498102, "epoch": 6001} {"train_loss": -26.823240280151367, "global_step": 498103, "epoch": 6001} {"train_loss": -26.938688278198242, "global_step": 498104, "epoch": 6001} {"train_loss": -26.90955924987793, "global_step": 498105, "epoch": 6001} {"train_loss": -27.080585479736328, "global_step": 498106, "epoch": 6001} {"train_loss": -27.24842643737793, "global_step": 498107, "epoch": 6001} {"train_loss": -26.91065788269043, "global_step": 498108, "epoch": 6001} {"train_loss": -26.859039306640625, "global_step": 498109, "epoch": 6001} {"train_loss": -26.847009658813477, "global_step": 498110, "epoch": 6001} {"train_loss": -26.979034423828125, "global_step": 498111, "epoch": 6001} {"train_loss": -26.96173667907715, "global_step": 498112, "epoch": 6001} {"train_loss": -26.999267578125, "global_step": 498113, "epoch": 6001} {"train_loss": -27.60500144958496, "global_step": 498114, "epoch": 6001} {"train_loss": -27.433557510375977, "global_step": 498115, "epoch": 6001} {"train_loss": -27.17127799987793, "global_step": 498116, "epoch": 6001} {"train_loss": -27.276554107666016, "global_step": 498117, "epoch": 6001} {"train_loss": -27.092071533203125, "global_step": 498118, "epoch": 6001} {"train_loss": -27.355224609375, "global_step": 498119, "epoch": 6001} {"train_loss": -27.51360511779785, "global_step": 498120, "epoch": 6001} {"train_loss": -27.365102767944336, "global_step": 498121, "epoch": 6001} {"train_loss": -27.44549560546875, "global_step": 498122, "epoch": 6001} {"train_loss": -27.447458267211914, "global_step": 498123, "epoch": 6001} {"train_loss": -27.28095817565918, "global_step": 498124, "epoch": 6001} {"train_loss": -27.18720817565918, "global_step": 498125, "epoch": 6001} {"train_loss": -27.704883575439453, "global_step": 498126, "epoch": 6001} {"train_loss": -27.4300594329834, "global_step": 498127, "epoch": 6001} {"train_loss": -27.50937843322754, "global_step": 498128, "epoch": 6001} {"train_loss": -27.599058151245117, "global_step": 498129, "epoch": 6001} {"train_loss": -27.511953353881836, "global_step": 498130, "epoch": 6001} {"train_loss": -27.439619064331055, "global_step": 498131, "epoch": 6001} {"train_loss": -27.520660400390625, "global_step": 498132, "epoch": 6001} {"train_loss": -27.6927433013916, "global_step": 498133, "epoch": 6001} {"train_loss": -27.664997100830078, "global_step": 498134, "epoch": 6001} {"train_loss": -27.52158546447754, "global_step": 498135, "epoch": 6001} {"train_loss": -27.86824607849121, "global_step": 498136, "epoch": 6001} {"train_loss": -27.642410278320312, "global_step": 498137, "epoch": 6001} {"train_loss": -27.648040771484375, "global_step": 498138, "epoch": 6001} {"train_loss": -27.29267692565918, "global_step": 498139, "epoch": 6001} {"train_loss": -27.2976016998291, "global_step": 498140, "epoch": 6001} {"train_loss": -27.82318687438965, "global_step": 498141, "epoch": 6001} {"train_loss": -27.649229049682617, "global_step": 498142, "epoch": 6001} {"train_loss": -27.7608642578125, "global_step": 498143, "epoch": 6001} {"train_loss": -27.620946884155273, "global_step": 498144, "epoch": 6001} {"train_loss": -27.51141929626465, "global_step": 498145, "epoch": 6001} {"train_loss": -27.58746910095215, "global_step": 498146, "epoch": 6001} {"train_loss": -27.71258544921875, "global_step": 498147, "epoch": 6001} {"train_loss": -27.654199600219727, "global_step": 498148, "epoch": 6001} {"train_loss": -27.344440460205078, "global_step": 498149, "epoch": 6001} {"train_loss": -27.410314559936523, "global_step": 498150, "epoch": 6001} {"train_loss": -27.25910758972168, "global_step": 498151, "epoch": 6001} {"train_loss": -27.198225021362305, "global_step": 498152, "epoch": 6001} {"train_loss": -27.8525390625, "global_step": 498153, "epoch": 6001} {"train_loss": -27.442907333374023, "global_step": 498154, "epoch": 6001} {"train_loss": -27.622547149658203, "global_step": 498155, "epoch": 6001} {"train_loss": -27.40189552307129, "global_step": 498156, "epoch": 6001} {"train_loss": -27.636463165283203, "global_step": 498157, "epoch": 6001} {"train_loss": -27.68931007385254, "global_step": 498158, "epoch": 6001} {"train_loss": -27.872699737548828, "global_step": 498159, "epoch": 6001} {"train_loss": -27.56304359436035, "global_step": 498160, "epoch": 6001} {"train_loss": -27.423215866088867, "global_step": 498161, "epoch": 6001} {"train_loss": -27.435577392578125, "global_step": 498162, "epoch": 6001} {"train_loss": -27.66512107849121, "global_step": 498163, "epoch": 6001} {"train_loss": -27.416736602783203, "global_step": 498164, "epoch": 6001} {"train_loss": -27.113880640052887, "global_step": 498165, "epoch": 6001, "val_loss": 6536730.0} {"train_loss": -26.94631004333496, "global_step": 498166, "epoch": 6002} {"train_loss": -26.795215606689453, "global_step": 498167, "epoch": 6002} {"train_loss": -26.956558227539062, "global_step": 498168, "epoch": 6002} {"train_loss": -26.759357452392578, "global_step": 498169, "epoch": 6002} {"train_loss": -26.44173240661621, "global_step": 498170, "epoch": 6002} {"train_loss": -26.28322410583496, "global_step": 498171, "epoch": 6002} {"train_loss": -27.000751495361328, "global_step": 498172, "epoch": 6002} {"train_loss": -27.0982666015625, "global_step": 498173, "epoch": 6002} {"train_loss": -26.803579330444336, "global_step": 498174, "epoch": 6002} {"train_loss": -26.615554809570312, "global_step": 498175, "epoch": 6002} {"train_loss": -26.974597930908203, "global_step": 498176, "epoch": 6002} {"train_loss": -27.008655548095703, "global_step": 498177, "epoch": 6002} {"train_loss": -26.9658203125, "global_step": 498178, "epoch": 6002} {"train_loss": -27.081928253173828, "global_step": 498179, "epoch": 6002} {"train_loss": -26.653884887695312, "global_step": 498180, "epoch": 6002} {"train_loss": -26.942792892456055, "global_step": 498181, "epoch": 6002} {"train_loss": -27.09929847717285, "global_step": 498182, "epoch": 6002} {"train_loss": -27.208948135375977, "global_step": 498183, "epoch": 6002} {"train_loss": -27.124326705932617, "global_step": 498184, "epoch": 6002} {"train_loss": -26.992374420166016, "global_step": 498185, "epoch": 6002} {"train_loss": -27.030624389648438, "global_step": 498186, "epoch": 6002} {"train_loss": -27.228445053100586, "global_step": 498187, "epoch": 6002} {"train_loss": -27.04612159729004, "global_step": 498188, "epoch": 6002} {"train_loss": -27.24464225769043, "global_step": 498189, "epoch": 6002} {"train_loss": -27.01166343688965, "global_step": 498190, "epoch": 6002} {"train_loss": -27.294036865234375, "global_step": 498191, "epoch": 6002} {"train_loss": -27.5980224609375, "global_step": 498192, "epoch": 6002} {"train_loss": -27.557083129882812, "global_step": 498193, "epoch": 6002} {"train_loss": -27.064428329467773, "global_step": 498194, "epoch": 6002} {"train_loss": -26.944732666015625, "global_step": 498195, "epoch": 6002} {"train_loss": -27.528512954711914, "global_step": 498196, "epoch": 6002} {"train_loss": -27.295318603515625, "global_step": 498197, "epoch": 6002} {"train_loss": -27.161718368530273, "global_step": 498198, "epoch": 6002} {"train_loss": -26.537403106689453, "global_step": 498199, "epoch": 6002} {"train_loss": -26.855321884155273, "global_step": 498200, "epoch": 6002} {"train_loss": -27.34119987487793, "global_step": 498201, "epoch": 6002} {"train_loss": -27.081409454345703, "global_step": 498202, "epoch": 6002} {"train_loss": -27.27338981628418, "global_step": 498203, "epoch": 6002} {"train_loss": -27.116403579711914, "global_step": 498204, "epoch": 6002} {"train_loss": -27.0379581451416, "global_step": 498205, "epoch": 6002} {"train_loss": -27.287967681884766, "global_step": 498206, "epoch": 6002} {"train_loss": -27.3646183013916, "global_step": 498207, "epoch": 6002} {"train_loss": -27.3592529296875, "global_step": 498208, "epoch": 6002} {"train_loss": -27.656869888305664, "global_step": 498209, "epoch": 6002} {"train_loss": -26.902790069580078, "global_step": 498210, "epoch": 6002} {"train_loss": -27.424118041992188, "global_step": 498211, "epoch": 6002} {"train_loss": -27.297704696655273, "global_step": 498212, "epoch": 6002} {"train_loss": -27.142688751220703, "global_step": 498213, "epoch": 6002} {"train_loss": -27.492334365844727, "global_step": 498214, "epoch": 6002} {"train_loss": -27.347015380859375, "global_step": 498215, "epoch": 6002} {"train_loss": -27.514371871948242, "global_step": 498216, "epoch": 6002} {"train_loss": -27.582101821899414, "global_step": 498217, "epoch": 6002} {"train_loss": -27.448041915893555, "global_step": 498218, "epoch": 6002} {"train_loss": -27.737014770507812, "global_step": 498219, "epoch": 6002} {"train_loss": -27.346027374267578, "global_step": 498220, "epoch": 6002} {"train_loss": -27.258056640625, "global_step": 498221, "epoch": 6002} {"train_loss": -27.1181583404541, "global_step": 498222, "epoch": 6002} {"train_loss": -27.541357040405273, "global_step": 498223, "epoch": 6002} {"train_loss": -27.50689697265625, "global_step": 498224, "epoch": 6002} {"train_loss": -27.4503173828125, "global_step": 498225, "epoch": 6002} {"train_loss": -27.409595489501953, "global_step": 498226, "epoch": 6002} {"train_loss": -27.3978328704834, "global_step": 498227, "epoch": 6002} {"train_loss": -27.443628311157227, "global_step": 498228, "epoch": 6002} {"train_loss": -27.46490478515625, "global_step": 498229, "epoch": 6002} {"train_loss": -27.888708114624023, "global_step": 498230, "epoch": 6002} {"train_loss": -27.701187133789062, "global_step": 498231, "epoch": 6002} {"train_loss": -27.19581413269043, "global_step": 498232, "epoch": 6002} {"train_loss": -27.70240592956543, "global_step": 498233, "epoch": 6002} {"train_loss": -27.277801513671875, "global_step": 498234, "epoch": 6002} {"train_loss": -27.648303985595703, "global_step": 498235, "epoch": 6002} {"train_loss": -27.2017879486084, "global_step": 498236, "epoch": 6002} {"train_loss": -27.447265625, "global_step": 498237, "epoch": 6002} {"train_loss": -27.408660888671875, "global_step": 498238, "epoch": 6002} {"train_loss": -27.42354393005371, "global_step": 498239, "epoch": 6002} {"train_loss": -27.477319717407227, "global_step": 498240, "epoch": 6002} {"train_loss": -27.6435604095459, "global_step": 498241, "epoch": 6002} {"train_loss": -27.6821346282959, "global_step": 498242, "epoch": 6002} {"train_loss": -27.96763038635254, "global_step": 498243, "epoch": 6002} {"train_loss": -27.6511287689209, "global_step": 498244, "epoch": 6002} {"train_loss": -27.639312744140625, "global_step": 498245, "epoch": 6002} {"train_loss": -27.700790405273438, "global_step": 498246, "epoch": 6002} {"train_loss": -27.488574981689453, "global_step": 498247, "epoch": 6002} {"train_loss": -27.258097866931593, "global_step": 498248, "epoch": 6002, "val_loss": 6511951.0} {"train_loss": -27.343103408813477, "global_step": 498249, "epoch": 6003} {"train_loss": -26.87369728088379, "global_step": 498250, "epoch": 6003} {"train_loss": -26.435705184936523, "global_step": 498251, "epoch": 6003} {"train_loss": -26.437292098999023, "global_step": 498252, "epoch": 6003} {"train_loss": -26.464019775390625, "global_step": 498253, "epoch": 6003} {"train_loss": -26.130163192749023, "global_step": 498254, "epoch": 6003} {"train_loss": -26.723480224609375, "global_step": 498255, "epoch": 6003} {"train_loss": -27.14306640625, "global_step": 498256, "epoch": 6003} {"train_loss": -27.36964225769043, "global_step": 498257, "epoch": 6003} {"train_loss": -26.695453643798828, "global_step": 498258, "epoch": 6003} {"train_loss": -27.240894317626953, "global_step": 498259, "epoch": 6003} {"train_loss": -27.340972900390625, "global_step": 498260, "epoch": 6003} {"train_loss": -27.070287704467773, "global_step": 498261, "epoch": 6003} {"train_loss": -27.392475128173828, "global_step": 498262, "epoch": 6003} {"train_loss": -27.232501983642578, "global_step": 498263, "epoch": 6003} {"train_loss": -27.242664337158203, "global_step": 498264, "epoch": 6003} {"train_loss": -27.023054122924805, "global_step": 498265, "epoch": 6003} {"train_loss": -27.19403648376465, "global_step": 498266, "epoch": 6003} {"train_loss": -27.25819206237793, "global_step": 498267, "epoch": 6003} {"train_loss": -27.128711700439453, "global_step": 498268, "epoch": 6003} {"train_loss": -27.297718048095703, "global_step": 498269, "epoch": 6003} {"train_loss": -27.537078857421875, "global_step": 498270, "epoch": 6003} {"train_loss": -26.907154083251953, "global_step": 498271, "epoch": 6003} {"train_loss": -27.536136627197266, "global_step": 498272, "epoch": 6003} {"train_loss": -27.43836784362793, "global_step": 498273, "epoch": 6003} {"train_loss": -27.446456909179688, "global_step": 498274, "epoch": 6003} {"train_loss": -27.121234893798828, "global_step": 498275, "epoch": 6003} {"train_loss": -27.535755157470703, "global_step": 498276, "epoch": 6003} {"train_loss": -27.010629653930664, "global_step": 498277, "epoch": 6003} {"train_loss": -27.570871353149414, "global_step": 498278, "epoch": 6003} {"train_loss": -27.281787872314453, "global_step": 498279, "epoch": 6003} {"train_loss": -27.314407348632812, "global_step": 498280, "epoch": 6003} {"train_loss": -27.333417892456055, "global_step": 498281, "epoch": 6003} {"train_loss": -27.42732048034668, "global_step": 498282, "epoch": 6003} {"train_loss": -27.327795028686523, "global_step": 498283, "epoch": 6003} {"train_loss": -26.99860954284668, "global_step": 498284, "epoch": 6003} {"train_loss": -27.228551864624023, "global_step": 498285, "epoch": 6003} {"train_loss": -27.315332412719727, "global_step": 498286, "epoch": 6003} {"train_loss": -27.219568252563477, "global_step": 498287, "epoch": 6003} {"train_loss": -27.3947811126709, "global_step": 498288, "epoch": 6003} {"train_loss": -27.0693416595459, "global_step": 498289, "epoch": 6003} {"train_loss": -27.430953979492188, "global_step": 498290, "epoch": 6003} {"train_loss": -27.27615737915039, "global_step": 498291, "epoch": 6003} {"train_loss": -27.788171768188477, "global_step": 498292, "epoch": 6003} {"train_loss": -27.088098526000977, "global_step": 498293, "epoch": 6003} {"train_loss": -27.989049911499023, "global_step": 498294, "epoch": 6003} {"train_loss": -27.534460067749023, "global_step": 498295, "epoch": 6003} {"train_loss": -27.20448875427246, "global_step": 498296, "epoch": 6003} {"train_loss": -27.02606773376465, "global_step": 498297, "epoch": 6003} {"train_loss": -27.492483139038086, "global_step": 498298, "epoch": 6003} {"train_loss": -27.677457809448242, "global_step": 498299, "epoch": 6003} {"train_loss": -27.2878360748291, "global_step": 498300, "epoch": 6003} {"train_loss": -27.457656860351562, "global_step": 498301, "epoch": 6003} {"train_loss": -27.478307723999023, "global_step": 498302, "epoch": 6003} {"train_loss": -27.603973388671875, "global_step": 498303, "epoch": 6003} {"train_loss": -27.470783233642578, "global_step": 498304, "epoch": 6003} {"train_loss": -27.575422286987305, "global_step": 498305, "epoch": 6003} {"train_loss": -27.037921905517578, "global_step": 498306, "epoch": 6003} {"train_loss": -26.94778823852539, "global_step": 498307, "epoch": 6003} {"train_loss": -27.3729248046875, "global_step": 498308, "epoch": 6003} {"train_loss": -27.2244815826416, "global_step": 498309, "epoch": 6003} {"train_loss": -26.816211700439453, "global_step": 498310, "epoch": 6003} {"train_loss": -27.340497970581055, "global_step": 498311, "epoch": 6003} {"train_loss": -27.6603946685791, "global_step": 498312, "epoch": 6003} {"train_loss": -27.33639907836914, "global_step": 498313, "epoch": 6003} {"train_loss": -27.3705997467041, "global_step": 498314, "epoch": 6003} {"train_loss": -27.577672958374023, "global_step": 498315, "epoch": 6003} {"train_loss": -27.601430892944336, "global_step": 498316, "epoch": 6003} {"train_loss": -27.6129093170166, "global_step": 498317, "epoch": 6003} {"train_loss": -27.299579620361328, "global_step": 498318, "epoch": 6003} {"train_loss": -27.429248809814453, "global_step": 498319, "epoch": 6003} {"train_loss": -27.672168731689453, "global_step": 498320, "epoch": 6003} {"train_loss": -27.600732803344727, "global_step": 498321, "epoch": 6003} {"train_loss": -27.595108032226562, "global_step": 498322, "epoch": 6003} {"train_loss": -27.35182762145996, "global_step": 498323, "epoch": 6003} {"train_loss": -27.59286880493164, "global_step": 498324, "epoch": 6003} {"train_loss": -27.38677978515625, "global_step": 498325, "epoch": 6003} {"train_loss": -27.50274658203125, "global_step": 498326, "epoch": 6003} {"train_loss": -27.534351348876953, "global_step": 498327, "epoch": 6003} {"train_loss": -27.390396118164062, "global_step": 498328, "epoch": 6003} {"train_loss": -27.6647891998291, "global_step": 498329, "epoch": 6003} {"train_loss": -27.327716827392578, "global_step": 498330, "epoch": 6003} {"train_loss": -27.30132672872888, "global_step": 498331, "epoch": 6003, "val_loss": 6491721.0} {"train_loss": -27.02168083190918, "global_step": 498332, "epoch": 6004} {"train_loss": -26.791120529174805, "global_step": 498333, "epoch": 6004} {"train_loss": -26.394866943359375, "global_step": 498334, "epoch": 6004} {"train_loss": -27.104761123657227, "global_step": 498335, "epoch": 6004} {"train_loss": -26.81442642211914, "global_step": 498336, "epoch": 6004} {"train_loss": -26.958295822143555, "global_step": 498337, "epoch": 6004} {"train_loss": -26.53080177307129, "global_step": 498338, "epoch": 6004} {"train_loss": -26.859243392944336, "global_step": 498339, "epoch": 6004} {"train_loss": -26.724822998046875, "global_step": 498340, "epoch": 6004} {"train_loss": -27.30750846862793, "global_step": 498341, "epoch": 6004} {"train_loss": -26.778553009033203, "global_step": 498342, "epoch": 6004} {"train_loss": -26.942096710205078, "global_step": 498343, "epoch": 6004} {"train_loss": -27.120203018188477, "global_step": 498344, "epoch": 6004} {"train_loss": -26.930744171142578, "global_step": 498345, "epoch": 6004} {"train_loss": -26.842573165893555, "global_step": 498346, "epoch": 6004} {"train_loss": -27.219507217407227, "global_step": 498347, "epoch": 6004} {"train_loss": -27.07046890258789, "global_step": 498348, "epoch": 6004} {"train_loss": -26.989044189453125, "global_step": 498349, "epoch": 6004} {"train_loss": -27.093902587890625, "global_step": 498350, "epoch": 6004} {"train_loss": -27.170459747314453, "global_step": 498351, "epoch": 6004} {"train_loss": -26.973407745361328, "global_step": 498352, "epoch": 6004} {"train_loss": -27.226001739501953, "global_step": 498353, "epoch": 6004} {"train_loss": -27.125003814697266, "global_step": 498354, "epoch": 6004} {"train_loss": -27.0847225189209, "global_step": 498355, "epoch": 6004} {"train_loss": -27.1165714263916, "global_step": 498356, "epoch": 6004} {"train_loss": -27.18109703063965, "global_step": 498357, "epoch": 6004} {"train_loss": -27.268701553344727, "global_step": 498358, "epoch": 6004} {"train_loss": -27.50826072692871, "global_step": 498359, "epoch": 6004} {"train_loss": -27.034948348999023, "global_step": 498360, "epoch": 6004} {"train_loss": -27.137067794799805, "global_step": 498361, "epoch": 6004} {"train_loss": -27.12000846862793, "global_step": 498362, "epoch": 6004} {"train_loss": -27.2294921875, "global_step": 498363, "epoch": 6004} {"train_loss": -27.269193649291992, "global_step": 498364, "epoch": 6004} {"train_loss": -27.262250900268555, "global_step": 498365, "epoch": 6004} {"train_loss": -26.913888931274414, "global_step": 498366, "epoch": 6004} {"train_loss": -27.405920028686523, "global_step": 498367, "epoch": 6004} {"train_loss": -27.021371841430664, "global_step": 498368, "epoch": 6004} {"train_loss": -27.225955963134766, "global_step": 498369, "epoch": 6004} {"train_loss": -27.56601333618164, "global_step": 498370, "epoch": 6004} {"train_loss": -27.348541259765625, "global_step": 498371, "epoch": 6004} {"train_loss": -27.006010055541992, "global_step": 498372, "epoch": 6004} {"train_loss": -27.173017501831055, "global_step": 498373, "epoch": 6004} {"train_loss": -27.24812126159668, "global_step": 498374, "epoch": 6004} {"train_loss": -27.61280632019043, "global_step": 498375, "epoch": 6004} {"train_loss": -27.574371337890625, "global_step": 498376, "epoch": 6004} {"train_loss": -26.90192222595215, "global_step": 498377, "epoch": 6004} {"train_loss": -27.271759033203125, "global_step": 498378, "epoch": 6004} {"train_loss": -27.50934410095215, "global_step": 498379, "epoch": 6004} {"train_loss": -27.3176326751709, "global_step": 498380, "epoch": 6004} {"train_loss": -27.772602081298828, "global_step": 498381, "epoch": 6004} {"train_loss": -27.426252365112305, "global_step": 498382, "epoch": 6004} {"train_loss": -27.412704467773438, "global_step": 498383, "epoch": 6004} {"train_loss": -27.452611923217773, "global_step": 498384, "epoch": 6004} {"train_loss": -27.448776245117188, "global_step": 498385, "epoch": 6004} {"train_loss": -27.498220443725586, "global_step": 498386, "epoch": 6004} {"train_loss": -27.5295467376709, "global_step": 498387, "epoch": 6004} {"train_loss": -27.176137924194336, "global_step": 498388, "epoch": 6004} {"train_loss": -27.0790958404541, "global_step": 498389, "epoch": 6004} {"train_loss": -26.96912956237793, "global_step": 498390, "epoch": 6004} {"train_loss": -27.449060440063477, "global_step": 498391, "epoch": 6004} {"train_loss": -27.18231773376465, "global_step": 498392, "epoch": 6004} {"train_loss": -27.50933265686035, "global_step": 498393, "epoch": 6004} {"train_loss": -27.22037124633789, "global_step": 498394, "epoch": 6004} {"train_loss": -27.65192222595215, "global_step": 498395, "epoch": 6004} {"train_loss": -27.555749893188477, "global_step": 498396, "epoch": 6004} {"train_loss": -27.53594398498535, "global_step": 498397, "epoch": 6004} {"train_loss": -27.8217830657959, "global_step": 498398, "epoch": 6004} {"train_loss": -27.3519344329834, "global_step": 498399, "epoch": 6004} {"train_loss": -27.377256393432617, "global_step": 498400, "epoch": 6004} {"train_loss": -27.284067153930664, "global_step": 498401, "epoch": 6004} {"train_loss": -27.776914596557617, "global_step": 498402, "epoch": 6004} {"train_loss": -27.26584815979004, "global_step": 498403, "epoch": 6004} {"train_loss": -27.738306045532227, "global_step": 498404, "epoch": 6004} {"train_loss": -27.339111328125, "global_step": 498405, "epoch": 6004} {"train_loss": -28.030805587768555, "global_step": 498406, "epoch": 6004} {"train_loss": -27.471593856811523, "global_step": 498407, "epoch": 6004} {"train_loss": -27.87841796875, "global_step": 498408, "epoch": 6004} {"train_loss": -27.858993530273438, "global_step": 498409, "epoch": 6004} {"train_loss": -27.557119369506836, "global_step": 498410, "epoch": 6004} {"train_loss": -27.405736923217773, "global_step": 498411, "epoch": 6004} {"train_loss": -27.496021270751953, "global_step": 498412, "epoch": 6004} {"train_loss": -27.412153244018555, "global_step": 498413, "epoch": 6004} {"train_loss": -27.26997701805758, "global_step": 498414, "epoch": 6004, "val_loss": 6545292.5} {"train_loss": -27.20639991760254, "global_step": 498415, "epoch": 6005} {"train_loss": -27.002283096313477, "global_step": 498416, "epoch": 6005} {"train_loss": -26.85621452331543, "global_step": 498417, "epoch": 6005} {"train_loss": -26.403303146362305, "global_step": 498418, "epoch": 6005} {"train_loss": -26.886138916015625, "global_step": 498419, "epoch": 6005} {"train_loss": -27.012723922729492, "global_step": 498420, "epoch": 6005} {"train_loss": -26.993093490600586, "global_step": 498421, "epoch": 6005} {"train_loss": -27.5308837890625, "global_step": 498422, "epoch": 6005} {"train_loss": -27.469594955444336, "global_step": 498423, "epoch": 6005} {"train_loss": -27.273807525634766, "global_step": 498424, "epoch": 6005} {"train_loss": -27.09783363342285, "global_step": 498425, "epoch": 6005} {"train_loss": -27.333759307861328, "global_step": 498426, "epoch": 6005} {"train_loss": -27.2216854095459, "global_step": 498427, "epoch": 6005} {"train_loss": -27.128889083862305, "global_step": 498428, "epoch": 6005} {"train_loss": -27.45733070373535, "global_step": 498429, "epoch": 6005} {"train_loss": -26.8338680267334, "global_step": 498430, "epoch": 6005} {"train_loss": -27.548688888549805, "global_step": 498431, "epoch": 6005} {"train_loss": -27.242151260375977, "global_step": 498432, "epoch": 6005} {"train_loss": -27.196125030517578, "global_step": 498433, "epoch": 6005} {"train_loss": -27.389392852783203, "global_step": 498434, "epoch": 6005} {"train_loss": -27.39594841003418, "global_step": 498435, "epoch": 6005} {"train_loss": -27.15283203125, "global_step": 498436, "epoch": 6005} {"train_loss": -27.076566696166992, "global_step": 498437, "epoch": 6005} {"train_loss": -27.497180938720703, "global_step": 498438, "epoch": 6005} {"train_loss": -27.3763427734375, "global_step": 498439, "epoch": 6005} {"train_loss": -27.268238067626953, "global_step": 498440, "epoch": 6005} {"train_loss": -27.66522789001465, "global_step": 498441, "epoch": 6005} {"train_loss": -27.742361068725586, "global_step": 498442, "epoch": 6005} {"train_loss": -27.535022735595703, "global_step": 498443, "epoch": 6005} {"train_loss": -27.574848175048828, "global_step": 498444, "epoch": 6005} {"train_loss": -27.800397872924805, "global_step": 498445, "epoch": 6005} {"train_loss": -27.9049072265625, "global_step": 498446, "epoch": 6005} {"train_loss": -27.376462936401367, "global_step": 498447, "epoch": 6005} {"train_loss": -27.59639549255371, "global_step": 498448, "epoch": 6005} {"train_loss": -27.624176025390625, "global_step": 498449, "epoch": 6005} {"train_loss": -27.25068473815918, "global_step": 498450, "epoch": 6005} {"train_loss": -27.2761287689209, "global_step": 498451, "epoch": 6005} {"train_loss": -27.383222579956055, "global_step": 498452, "epoch": 6005} {"train_loss": -27.19451332092285, "global_step": 498453, "epoch": 6005} {"train_loss": -27.581140518188477, "global_step": 498454, "epoch": 6005} {"train_loss": -27.097370147705078, "global_step": 498455, "epoch": 6005} {"train_loss": -26.745813369750977, "global_step": 498456, "epoch": 6005} {"train_loss": -26.749536514282227, "global_step": 498457, "epoch": 6005} {"train_loss": -27.02602195739746, "global_step": 498458, "epoch": 6005} {"train_loss": -27.14466667175293, "global_step": 498459, "epoch": 6005} {"train_loss": -26.821735382080078, "global_step": 498460, "epoch": 6005} {"train_loss": -26.076892852783203, "global_step": 498461, "epoch": 6005} {"train_loss": -27.16334342956543, "global_step": 498462, "epoch": 6005} {"train_loss": -27.21073341369629, "global_step": 498463, "epoch": 6005} {"train_loss": -26.729511260986328, "global_step": 498464, "epoch": 6005} {"train_loss": -26.61530113220215, "global_step": 498465, "epoch": 6005} {"train_loss": -27.32329750061035, "global_step": 498466, "epoch": 6005} {"train_loss": -26.91645622253418, "global_step": 498467, "epoch": 6005} {"train_loss": -26.84228515625, "global_step": 498468, "epoch": 6005} {"train_loss": -26.7368106842041, "global_step": 498469, "epoch": 6005} {"train_loss": -27.45123291015625, "global_step": 498470, "epoch": 6005} {"train_loss": -27.097440719604492, "global_step": 498471, "epoch": 6005} {"train_loss": -26.885025024414062, "global_step": 498472, "epoch": 6005} {"train_loss": -27.252954483032227, "global_step": 498473, "epoch": 6005} {"train_loss": -27.229888916015625, "global_step": 498474, "epoch": 6005} {"train_loss": -27.42243003845215, "global_step": 498475, "epoch": 6005} {"train_loss": -27.49787712097168, "global_step": 498476, "epoch": 6005} {"train_loss": -27.26371192932129, "global_step": 498477, "epoch": 6005} {"train_loss": -27.475141525268555, "global_step": 498478, "epoch": 6005} {"train_loss": -27.438562393188477, "global_step": 498479, "epoch": 6005} {"train_loss": -27.591516494750977, "global_step": 498480, "epoch": 6005} {"train_loss": -27.427600860595703, "global_step": 498481, "epoch": 6005} {"train_loss": -27.517993927001953, "global_step": 498482, "epoch": 6005} {"train_loss": -26.956470489501953, "global_step": 498483, "epoch": 6005} {"train_loss": -27.418115615844727, "global_step": 498484, "epoch": 6005} {"train_loss": -27.391199111938477, "global_step": 498485, "epoch": 6005} {"train_loss": -27.4456787109375, "global_step": 498486, "epoch": 6005} {"train_loss": -28.036300659179688, "global_step": 498487, "epoch": 6005} {"train_loss": -27.689111709594727, "global_step": 498488, "epoch": 6005} {"train_loss": -27.572620391845703, "global_step": 498489, "epoch": 6005} {"train_loss": -27.66623306274414, "global_step": 498490, "epoch": 6005} {"train_loss": -27.311752319335938, "global_step": 498491, "epoch": 6005} {"train_loss": -27.4478759765625, "global_step": 498492, "epoch": 6005} {"train_loss": -27.891523361206055, "global_step": 498493, "epoch": 6005} {"train_loss": -27.375751495361328, "global_step": 498494, "epoch": 6005} {"train_loss": -27.533002853393555, "global_step": 498495, "epoch": 6005} {"train_loss": -27.205921173095703, "global_step": 498496, "epoch": 6005} {"train_loss": -27.27298711294151, "global_step": 498497, "epoch": 6005, "val_loss": 6540240.5} {"train_loss": -26.5478572845459, "global_step": 498498, "epoch": 6006} {"train_loss": -26.958036422729492, "global_step": 498499, "epoch": 6006} {"train_loss": -26.752939224243164, "global_step": 498500, "epoch": 6006} {"train_loss": -26.638280868530273, "global_step": 498501, "epoch": 6006} {"train_loss": -26.648969650268555, "global_step": 498502, "epoch": 6006} {"train_loss": -26.146270751953125, "global_step": 498503, "epoch": 6006} {"train_loss": -26.227659225463867, "global_step": 498504, "epoch": 6006} {"train_loss": -26.874963760375977, "global_step": 498505, "epoch": 6006} {"train_loss": -26.512714385986328, "global_step": 498506, "epoch": 6006} {"train_loss": -26.507827758789062, "global_step": 498507, "epoch": 6006} {"train_loss": -26.925222396850586, "global_step": 498508, "epoch": 6006} {"train_loss": -26.507604598999023, "global_step": 498509, "epoch": 6006} {"train_loss": -26.853235244750977, "global_step": 498510, "epoch": 6006} {"train_loss": -27.076129913330078, "global_step": 498511, "epoch": 6006} {"train_loss": -27.014575958251953, "global_step": 498512, "epoch": 6006} {"train_loss": -26.773426055908203, "global_step": 498513, "epoch": 6006} {"train_loss": -27.196182250976562, "global_step": 498514, "epoch": 6006} {"train_loss": -27.081201553344727, "global_step": 498515, "epoch": 6006} {"train_loss": -27.079376220703125, "global_step": 498516, "epoch": 6006} {"train_loss": -27.0271053314209, "global_step": 498517, "epoch": 6006} {"train_loss": -27.055139541625977, "global_step": 498518, "epoch": 6006} {"train_loss": -27.399450302124023, "global_step": 498519, "epoch": 6006} {"train_loss": -27.450464248657227, "global_step": 498520, "epoch": 6006} {"train_loss": -27.333791732788086, "global_step": 498521, "epoch": 6006} {"train_loss": -27.267059326171875, "global_step": 498522, "epoch": 6006} {"train_loss": -27.352930068969727, "global_step": 498523, "epoch": 6006} {"train_loss": -27.23838233947754, "global_step": 498524, "epoch": 6006} {"train_loss": -27.178604125976562, "global_step": 498525, "epoch": 6006} {"train_loss": -27.269428253173828, "global_step": 498526, "epoch": 6006} {"train_loss": -27.255252838134766, "global_step": 498527, "epoch": 6006} {"train_loss": -27.58379554748535, "global_step": 498528, "epoch": 6006} {"train_loss": -27.50345802307129, "global_step": 498529, "epoch": 6006} {"train_loss": -27.302536010742188, "global_step": 498530, "epoch": 6006} {"train_loss": -27.347919464111328, "global_step": 498531, "epoch": 6006} {"train_loss": -27.152860641479492, "global_step": 498532, "epoch": 6006} {"train_loss": -27.910400390625, "global_step": 498533, "epoch": 6006} {"train_loss": -27.773273468017578, "global_step": 498534, "epoch": 6006} {"train_loss": -27.378997802734375, "global_step": 498535, "epoch": 6006} {"train_loss": -27.26197624206543, "global_step": 498536, "epoch": 6006} {"train_loss": -27.29608726501465, "global_step": 498537, "epoch": 6006} {"train_loss": -27.490951538085938, "global_step": 498538, "epoch": 6006} {"train_loss": -27.31560707092285, "global_step": 498539, "epoch": 6006} {"train_loss": -27.4997501373291, "global_step": 498540, "epoch": 6006} {"train_loss": -27.62578773498535, "global_step": 498541, "epoch": 6006} {"train_loss": -27.83042335510254, "global_step": 498542, "epoch": 6006} {"train_loss": -27.50823402404785, "global_step": 498543, "epoch": 6006} {"train_loss": -27.326990127563477, "global_step": 498544, "epoch": 6006} {"train_loss": -27.638702392578125, "global_step": 498545, "epoch": 6006} {"train_loss": -27.942800521850586, "global_step": 498546, "epoch": 6006} {"train_loss": -27.2861328125, "global_step": 498547, "epoch": 6006} {"train_loss": -27.722822189331055, "global_step": 498548, "epoch": 6006} {"train_loss": -27.73487663269043, "global_step": 498549, "epoch": 6006} {"train_loss": -27.76969337463379, "global_step": 498550, "epoch": 6006} {"train_loss": -27.294992446899414, "global_step": 498551, "epoch": 6006} {"train_loss": -27.50783348083496, "global_step": 498552, "epoch": 6006} {"train_loss": -27.340505599975586, "global_step": 498553, "epoch": 6006} {"train_loss": -27.6669864654541, "global_step": 498554, "epoch": 6006} {"train_loss": -27.635913848876953, "global_step": 498555, "epoch": 6006} {"train_loss": -27.56995964050293, "global_step": 498556, "epoch": 6006} {"train_loss": -27.7996826171875, "global_step": 498557, "epoch": 6006} {"train_loss": -27.327667236328125, "global_step": 498558, "epoch": 6006} {"train_loss": -27.329242706298828, "global_step": 498559, "epoch": 6006} {"train_loss": -27.316343307495117, "global_step": 498560, "epoch": 6006} {"train_loss": -27.26666259765625, "global_step": 498561, "epoch": 6006} {"train_loss": -27.452896118164062, "global_step": 498562, "epoch": 6006} {"train_loss": -27.1294002532959, "global_step": 498563, "epoch": 6006} {"train_loss": -27.227527618408203, "global_step": 498564, "epoch": 6006} {"train_loss": -27.4963321685791, "global_step": 498565, "epoch": 6006} {"train_loss": -26.972562789916992, "global_step": 498566, "epoch": 6006} {"train_loss": -26.732030868530273, "global_step": 498567, "epoch": 6006} {"train_loss": -26.673070907592773, "global_step": 498568, "epoch": 6006} {"train_loss": -27.032669067382812, "global_step": 498569, "epoch": 6006} {"train_loss": -27.650379180908203, "global_step": 498570, "epoch": 6006} {"train_loss": -27.403491973876953, "global_step": 498571, "epoch": 6006} {"train_loss": -27.3419189453125, "global_step": 498572, "epoch": 6006} {"train_loss": -27.877628326416016, "global_step": 498573, "epoch": 6006} {"train_loss": -27.227460861206055, "global_step": 498574, "epoch": 6006} {"train_loss": -27.289716720581055, "global_step": 498575, "epoch": 6006} {"train_loss": -27.2518367767334, "global_step": 498576, "epoch": 6006} {"train_loss": -27.67438316345215, "global_step": 498577, "epoch": 6006} {"train_loss": -27.21670913696289, "global_step": 498578, "epoch": 6006} {"train_loss": -27.583648681640625, "global_step": 498579, "epoch": 6006} {"train_loss": -27.247040185583643, "global_step": 498580, "epoch": 6006, "val_loss": 6717000.0} {"train_loss": -26.21790885925293, "global_step": 498581, "epoch": 6007} {"train_loss": -27.116506576538086, "global_step": 498582, "epoch": 6007} {"train_loss": -26.980422973632812, "global_step": 498583, "epoch": 6007} {"train_loss": -26.6372013092041, "global_step": 498584, "epoch": 6007} {"train_loss": -27.006208419799805, "global_step": 498585, "epoch": 6007} {"train_loss": -26.818801879882812, "global_step": 498586, "epoch": 6007} {"train_loss": -26.4902400970459, "global_step": 498587, "epoch": 6007} {"train_loss": -26.790075302124023, "global_step": 498588, "epoch": 6007} {"train_loss": -26.988584518432617, "global_step": 498589, "epoch": 6007} {"train_loss": -27.012624740600586, "global_step": 498590, "epoch": 6007} {"train_loss": -27.176288604736328, "global_step": 498591, "epoch": 6007} {"train_loss": -27.2205867767334, "global_step": 498592, "epoch": 6007} {"train_loss": -27.133319854736328, "global_step": 498593, "epoch": 6007} {"train_loss": -27.061330795288086, "global_step": 498594, "epoch": 6007} {"train_loss": -27.34078025817871, "global_step": 498595, "epoch": 6007} {"train_loss": -27.060022354125977, "global_step": 498596, "epoch": 6007} {"train_loss": -27.111499786376953, "global_step": 498597, "epoch": 6007} {"train_loss": -27.5033016204834, "global_step": 498598, "epoch": 6007} {"train_loss": -27.17463493347168, "global_step": 498599, "epoch": 6007} {"train_loss": -27.392566680908203, "global_step": 498600, "epoch": 6007} {"train_loss": -27.1297607421875, "global_step": 498601, "epoch": 6007} {"train_loss": -27.22119140625, "global_step": 498602, "epoch": 6007} {"train_loss": -27.298572540283203, "global_step": 498603, "epoch": 6007} {"train_loss": -27.758981704711914, "global_step": 498604, "epoch": 6007} {"train_loss": -27.399093627929688, "global_step": 498605, "epoch": 6007} {"train_loss": -27.48905372619629, "global_step": 498606, "epoch": 6007} {"train_loss": -27.455774307250977, "global_step": 498607, "epoch": 6007} {"train_loss": -27.1722354888916, "global_step": 498608, "epoch": 6007} {"train_loss": -27.280553817749023, "global_step": 498609, "epoch": 6007} {"train_loss": -27.59145164489746, "global_step": 498610, "epoch": 6007} {"train_loss": -27.47186851501465, "global_step": 498611, "epoch": 6007} {"train_loss": -27.489377975463867, "global_step": 498612, "epoch": 6007} {"train_loss": -27.72475242614746, "global_step": 498613, "epoch": 6007} {"train_loss": -27.486600875854492, "global_step": 498614, "epoch": 6007} {"train_loss": -27.51953125, "global_step": 498615, "epoch": 6007} {"train_loss": -27.499433517456055, "global_step": 498616, "epoch": 6007} {"train_loss": -27.73433494567871, "global_step": 498617, "epoch": 6007} {"train_loss": -27.204303741455078, "global_step": 498618, "epoch": 6007} {"train_loss": -27.680572509765625, "global_step": 498619, "epoch": 6007} {"train_loss": -27.911911010742188, "global_step": 498620, "epoch": 6007} {"train_loss": -28.098134994506836, "global_step": 498621, "epoch": 6007} {"train_loss": -27.31586265563965, "global_step": 498622, "epoch": 6007} {"train_loss": -27.460906982421875, "global_step": 498623, "epoch": 6007} {"train_loss": -27.567533493041992, "global_step": 498624, "epoch": 6007} {"train_loss": -27.276479721069336, "global_step": 498625, "epoch": 6007} {"train_loss": -27.559656143188477, "global_step": 498626, "epoch": 6007} {"train_loss": -27.668182373046875, "global_step": 498627, "epoch": 6007} {"train_loss": -27.597394943237305, "global_step": 498628, "epoch": 6007} {"train_loss": -27.424604415893555, "global_step": 498629, "epoch": 6007} {"train_loss": -27.7687931060791, "global_step": 498630, "epoch": 6007} {"train_loss": -27.610198974609375, "global_step": 498631, "epoch": 6007} {"train_loss": -27.160430908203125, "global_step": 498632, "epoch": 6007} {"train_loss": -27.9409122467041, "global_step": 498633, "epoch": 6007} {"train_loss": -27.42624855041504, "global_step": 498634, "epoch": 6007} {"train_loss": -27.367238998413086, "global_step": 498635, "epoch": 6007} {"train_loss": -27.994409561157227, "global_step": 498636, "epoch": 6007} {"train_loss": -27.448266983032227, "global_step": 498637, "epoch": 6007} {"train_loss": -27.404062271118164, "global_step": 498638, "epoch": 6007} {"train_loss": -27.43636131286621, "global_step": 498639, "epoch": 6007} {"train_loss": -27.395862579345703, "global_step": 498640, "epoch": 6007} {"train_loss": -27.27545166015625, "global_step": 498641, "epoch": 6007} {"train_loss": -27.084096908569336, "global_step": 498642, "epoch": 6007} {"train_loss": -27.02192497253418, "global_step": 498643, "epoch": 6007} {"train_loss": -26.49751853942871, "global_step": 498644, "epoch": 6007} {"train_loss": -26.58280372619629, "global_step": 498645, "epoch": 6007} {"train_loss": -26.824554443359375, "global_step": 498646, "epoch": 6007} {"train_loss": -26.95393943786621, "global_step": 498647, "epoch": 6007} {"train_loss": -27.425634384155273, "global_step": 498648, "epoch": 6007} {"train_loss": -26.92578125, "global_step": 498649, "epoch": 6007} {"train_loss": -26.911413192749023, "global_step": 498650, "epoch": 6007} {"train_loss": -26.86927604675293, "global_step": 498651, "epoch": 6007} {"train_loss": -27.284835815429688, "global_step": 498652, "epoch": 6007} {"train_loss": -27.105792999267578, "global_step": 498653, "epoch": 6007} {"train_loss": -27.286222457885742, "global_step": 498654, "epoch": 6007} {"train_loss": -27.48274040222168, "global_step": 498655, "epoch": 6007} {"train_loss": -27.362451553344727, "global_step": 498656, "epoch": 6007} {"train_loss": -27.489654541015625, "global_step": 498657, "epoch": 6007} {"train_loss": -27.156829833984375, "global_step": 498658, "epoch": 6007} {"train_loss": -27.64931297302246, "global_step": 498659, "epoch": 6007} {"train_loss": -27.69085121154785, "global_step": 498660, "epoch": 6007} {"train_loss": -27.274738311767578, "global_step": 498661, "epoch": 6007} {"train_loss": -27.68729591369629, "global_step": 498662, "epoch": 6007} {"train_loss": -27.300185192062195, "global_step": 498663, "epoch": 6007, "val_loss": 6628779.0} {"train_loss": -26.30057144165039, "global_step": 498664, "epoch": 6008} {"train_loss": -26.843780517578125, "global_step": 498665, "epoch": 6008} {"train_loss": -26.378860473632812, "global_step": 498666, "epoch": 6008} {"train_loss": -26.974157333374023, "global_step": 498667, "epoch": 6008} {"train_loss": -26.298526763916016, "global_step": 498668, "epoch": 6008} {"train_loss": -26.965967178344727, "global_step": 498669, "epoch": 6008} {"train_loss": -26.744770050048828, "global_step": 498670, "epoch": 6008} {"train_loss": -26.766782760620117, "global_step": 498671, "epoch": 6008} {"train_loss": -27.13815689086914, "global_step": 498672, "epoch": 6008} {"train_loss": -26.644872665405273, "global_step": 498673, "epoch": 6008} {"train_loss": -26.862043380737305, "global_step": 498674, "epoch": 6008} {"train_loss": -26.962553024291992, "global_step": 498675, "epoch": 6008} {"train_loss": -27.10733985900879, "global_step": 498676, "epoch": 6008} {"train_loss": -27.292469024658203, "global_step": 498677, "epoch": 6008} {"train_loss": -26.786828994750977, "global_step": 498678, "epoch": 6008} {"train_loss": -27.012388229370117, "global_step": 498679, "epoch": 6008} {"train_loss": -27.24482536315918, "global_step": 498680, "epoch": 6008} {"train_loss": -26.896366119384766, "global_step": 498681, "epoch": 6008} {"train_loss": -26.95965576171875, "global_step": 498682, "epoch": 6008} {"train_loss": -27.08005714416504, "global_step": 498683, "epoch": 6008} {"train_loss": -26.8613338470459, "global_step": 498684, "epoch": 6008} {"train_loss": -27.087453842163086, "global_step": 498685, "epoch": 6008} {"train_loss": -27.218921661376953, "global_step": 498686, "epoch": 6008} {"train_loss": -27.30843162536621, "global_step": 498687, "epoch": 6008} {"train_loss": -27.494037628173828, "global_step": 498688, "epoch": 6008} {"train_loss": -27.164758682250977, "global_step": 498689, "epoch": 6008} {"train_loss": -27.239002227783203, "global_step": 498690, "epoch": 6008} {"train_loss": -27.47939109802246, "global_step": 498691, "epoch": 6008} {"train_loss": -27.488706588745117, "global_step": 498692, "epoch": 6008} {"train_loss": -27.460865020751953, "global_step": 498693, "epoch": 6008} {"train_loss": -27.353357315063477, "global_step": 498694, "epoch": 6008} {"train_loss": -27.443456649780273, "global_step": 498695, "epoch": 6008} {"train_loss": -27.034616470336914, "global_step": 498696, "epoch": 6008} {"train_loss": -27.0892276763916, "global_step": 498697, "epoch": 6008} {"train_loss": -27.563858032226562, "global_step": 498698, "epoch": 6008} {"train_loss": -27.5538387298584, "global_step": 498699, "epoch": 6008} {"train_loss": -27.342126846313477, "global_step": 498700, "epoch": 6008} {"train_loss": -27.244434356689453, "global_step": 498701, "epoch": 6008} {"train_loss": -27.716522216796875, "global_step": 498702, "epoch": 6008} {"train_loss": -27.908706665039062, "global_step": 498703, "epoch": 6008} {"train_loss": -27.301908493041992, "global_step": 498704, "epoch": 6008} {"train_loss": -27.7670841217041, "global_step": 498705, "epoch": 6008} {"train_loss": -27.72395133972168, "global_step": 498706, "epoch": 6008} {"train_loss": -27.55024528503418, "global_step": 498707, "epoch": 6008} {"train_loss": -27.427337646484375, "global_step": 498708, "epoch": 6008} {"train_loss": -27.661230087280273, "global_step": 498709, "epoch": 6008} {"train_loss": -27.489831924438477, "global_step": 498710, "epoch": 6008} {"train_loss": -27.409748077392578, "global_step": 498711, "epoch": 6008} {"train_loss": -27.74903678894043, "global_step": 498712, "epoch": 6008} {"train_loss": -27.458505630493164, "global_step": 498713, "epoch": 6008} {"train_loss": -27.458234786987305, "global_step": 498714, "epoch": 6008} {"train_loss": -27.6685848236084, "global_step": 498715, "epoch": 6008} {"train_loss": -27.783557891845703, "global_step": 498716, "epoch": 6008} {"train_loss": -27.659305572509766, "global_step": 498717, "epoch": 6008} {"train_loss": -27.888919830322266, "global_step": 498718, "epoch": 6008} {"train_loss": -27.772886276245117, "global_step": 498719, "epoch": 6008} {"train_loss": -27.320911407470703, "global_step": 498720, "epoch": 6008} {"train_loss": -27.43115234375, "global_step": 498721, "epoch": 6008} {"train_loss": -27.1297550201416, "global_step": 498722, "epoch": 6008} {"train_loss": -27.71888542175293, "global_step": 498723, "epoch": 6008} {"train_loss": -27.169031143188477, "global_step": 498724, "epoch": 6008} {"train_loss": -27.385894775390625, "global_step": 498725, "epoch": 6008} {"train_loss": -27.1689395904541, "global_step": 498726, "epoch": 6008} {"train_loss": -27.353748321533203, "global_step": 498727, "epoch": 6008} {"train_loss": -27.344375610351562, "global_step": 498728, "epoch": 6008} {"train_loss": -27.038013458251953, "global_step": 498729, "epoch": 6008} {"train_loss": -27.244924545288086, "global_step": 498730, "epoch": 6008} {"train_loss": -26.8292236328125, "global_step": 498731, "epoch": 6008} {"train_loss": -26.729602813720703, "global_step": 498732, "epoch": 6008} {"train_loss": -27.115514755249023, "global_step": 498733, "epoch": 6008} {"train_loss": -27.211700439453125, "global_step": 498734, "epoch": 6008} {"train_loss": -27.212491989135742, "global_step": 498735, "epoch": 6008} {"train_loss": -26.72116470336914, "global_step": 498736, "epoch": 6008} {"train_loss": -27.096826553344727, "global_step": 498737, "epoch": 6008} {"train_loss": -27.39908218383789, "global_step": 498738, "epoch": 6008} {"train_loss": -27.3671817779541, "global_step": 498739, "epoch": 6008} {"train_loss": -26.765966415405273, "global_step": 498740, "epoch": 6008} {"train_loss": -27.270788192749023, "global_step": 498741, "epoch": 6008} {"train_loss": -27.263671875, "global_step": 498742, "epoch": 6008} {"train_loss": -27.4757022857666, "global_step": 498743, "epoch": 6008} {"train_loss": -27.5092830657959, "global_step": 498744, "epoch": 6008} {"train_loss": -27.69524574279785, "global_step": 498745, "epoch": 6008} {"train_loss": -27.24163232366723, "global_step": 498746, "epoch": 6008, "val_loss": 6605005.0} {"train_loss": -27.08111000061035, "global_step": 498747, "epoch": 6009} {"train_loss": -26.757349014282227, "global_step": 498748, "epoch": 6009} {"train_loss": -27.002466201782227, "global_step": 498749, "epoch": 6009} {"train_loss": -26.67144203186035, "global_step": 498750, "epoch": 6009} {"train_loss": -26.860387802124023, "global_step": 498751, "epoch": 6009} {"train_loss": -26.829986572265625, "global_step": 498752, "epoch": 6009} {"train_loss": -26.644962310791016, "global_step": 498753, "epoch": 6009} {"train_loss": -27.159460067749023, "global_step": 498754, "epoch": 6009} {"train_loss": -26.714874267578125, "global_step": 498755, "epoch": 6009} {"train_loss": -27.143115997314453, "global_step": 498756, "epoch": 6009} {"train_loss": -26.758153915405273, "global_step": 498757, "epoch": 6009} {"train_loss": -27.382923126220703, "global_step": 498758, "epoch": 6009} {"train_loss": -26.977460861206055, "global_step": 498759, "epoch": 6009} {"train_loss": -27.380695343017578, "global_step": 498760, "epoch": 6009} {"train_loss": -26.83113670349121, "global_step": 498761, "epoch": 6009} {"train_loss": -27.489953994750977, "global_step": 498762, "epoch": 6009} {"train_loss": -27.226200103759766, "global_step": 498763, "epoch": 6009} {"train_loss": -27.2141056060791, "global_step": 498764, "epoch": 6009} {"train_loss": -27.073455810546875, "global_step": 498765, "epoch": 6009} {"train_loss": -26.784082412719727, "global_step": 498766, "epoch": 6009} {"train_loss": -26.895883560180664, "global_step": 498767, "epoch": 6009} {"train_loss": -26.871129989624023, "global_step": 498768, "epoch": 6009} {"train_loss": -27.04164695739746, "global_step": 498769, "epoch": 6009} {"train_loss": -27.4074764251709, "global_step": 498770, "epoch": 6009} {"train_loss": -27.148523330688477, "global_step": 498771, "epoch": 6009} {"train_loss": -27.594846725463867, "global_step": 498772, "epoch": 6009} {"train_loss": -27.35318946838379, "global_step": 498773, "epoch": 6009} {"train_loss": -27.15351676940918, "global_step": 498774, "epoch": 6009} {"train_loss": -27.175769805908203, "global_step": 498775, "epoch": 6009} {"train_loss": -27.30427360534668, "global_step": 498776, "epoch": 6009} {"train_loss": -27.586780548095703, "global_step": 498777, "epoch": 6009} {"train_loss": -27.303512573242188, "global_step": 498778, "epoch": 6009} {"train_loss": -27.781354904174805, "global_step": 498779, "epoch": 6009} {"train_loss": -27.3121280670166, "global_step": 498780, "epoch": 6009} {"train_loss": -27.591638565063477, "global_step": 498781, "epoch": 6009} {"train_loss": -27.8061580657959, "global_step": 498782, "epoch": 6009} {"train_loss": -27.393817901611328, "global_step": 498783, "epoch": 6009} {"train_loss": -27.733570098876953, "global_step": 498784, "epoch": 6009} {"train_loss": -27.34711265563965, "global_step": 498785, "epoch": 6009} {"train_loss": -27.989578247070312, "global_step": 498786, "epoch": 6009} {"train_loss": -27.576126098632812, "global_step": 498787, "epoch": 6009} {"train_loss": -27.45918083190918, "global_step": 498788, "epoch": 6009} {"train_loss": -27.52863121032715, "global_step": 498789, "epoch": 6009} {"train_loss": -27.584365844726562, "global_step": 498790, "epoch": 6009} {"train_loss": -27.36686134338379, "global_step": 498791, "epoch": 6009} {"train_loss": -27.587202072143555, "global_step": 498792, "epoch": 6009} {"train_loss": -27.5141658782959, "global_step": 498793, "epoch": 6009} {"train_loss": -27.566205978393555, "global_step": 498794, "epoch": 6009} {"train_loss": -27.54852867126465, "global_step": 498795, "epoch": 6009} {"train_loss": -27.74671745300293, "global_step": 498796, "epoch": 6009} {"train_loss": -27.806543350219727, "global_step": 498797, "epoch": 6009} {"train_loss": -27.426868438720703, "global_step": 498798, "epoch": 6009} {"train_loss": -27.578989028930664, "global_step": 498799, "epoch": 6009} {"train_loss": -27.560224533081055, "global_step": 498800, "epoch": 6009} {"train_loss": -27.63947105407715, "global_step": 498801, "epoch": 6009} {"train_loss": -27.576818466186523, "global_step": 498802, "epoch": 6009} {"train_loss": -27.461841583251953, "global_step": 498803, "epoch": 6009} {"train_loss": -27.751550674438477, "global_step": 498804, "epoch": 6009} {"train_loss": -27.702682495117188, "global_step": 498805, "epoch": 6009} {"train_loss": -27.300329208374023, "global_step": 498806, "epoch": 6009} {"train_loss": -26.930627822875977, "global_step": 498807, "epoch": 6009} {"train_loss": -26.970935821533203, "global_step": 498808, "epoch": 6009} {"train_loss": -26.5206298828125, "global_step": 498809, "epoch": 6009} {"train_loss": -26.09061050415039, "global_step": 498810, "epoch": 6009} {"train_loss": -25.80097007751465, "global_step": 498811, "epoch": 6009} {"train_loss": -26.45538902282715, "global_step": 498812, "epoch": 6009} {"train_loss": -27.351303100585938, "global_step": 498813, "epoch": 6009} {"train_loss": -26.802881240844727, "global_step": 498814, "epoch": 6009} {"train_loss": -27.192304611206055, "global_step": 498815, "epoch": 6009} {"train_loss": -27.395599365234375, "global_step": 498816, "epoch": 6009} {"train_loss": -27.19025993347168, "global_step": 498817, "epoch": 6009} {"train_loss": -27.1658992767334, "global_step": 498818, "epoch": 6009} {"train_loss": -27.07316017150879, "global_step": 498819, "epoch": 6009} {"train_loss": -26.966205596923828, "global_step": 498820, "epoch": 6009} {"train_loss": -27.15407371520996, "global_step": 498821, "epoch": 6009} {"train_loss": -27.2313289642334, "global_step": 498822, "epoch": 6009} {"train_loss": -27.3945255279541, "global_step": 498823, "epoch": 6009} {"train_loss": -27.277069091796875, "global_step": 498824, "epoch": 6009} {"train_loss": -27.44482421875, "global_step": 498825, "epoch": 6009} {"train_loss": -27.408172607421875, "global_step": 498826, "epoch": 6009} {"train_loss": -27.081806182861328, "global_step": 498827, "epoch": 6009} {"train_loss": -27.568466186523438, "global_step": 498828, "epoch": 6009} {"train_loss": -27.240053291780402, "global_step": 498829, "epoch": 6009, "val_loss": 6647233.5} {"train_loss": -26.887922286987305, "global_step": 498830, "epoch": 6010} {"train_loss": -27.42889976501465, "global_step": 498831, "epoch": 6010} {"train_loss": -27.095739364624023, "global_step": 498832, "epoch": 6010} {"train_loss": -27.300939559936523, "global_step": 498833, "epoch": 6010} {"train_loss": -27.1943359375, "global_step": 498834, "epoch": 6010} {"train_loss": -27.01434898376465, "global_step": 498835, "epoch": 6010} {"train_loss": -26.97065544128418, "global_step": 498836, "epoch": 6010} {"train_loss": -27.13213539123535, "global_step": 498837, "epoch": 6010} {"train_loss": -27.19434928894043, "global_step": 498838, "epoch": 6010} {"train_loss": -27.404434204101562, "global_step": 498839, "epoch": 6010} {"train_loss": -26.98200035095215, "global_step": 498840, "epoch": 6010} {"train_loss": -27.621610641479492, "global_step": 498841, "epoch": 6010} {"train_loss": -27.366071701049805, "global_step": 498842, "epoch": 6010} {"train_loss": -27.170795440673828, "global_step": 498843, "epoch": 6010} {"train_loss": -27.680404663085938, "global_step": 498844, "epoch": 6010} {"train_loss": -27.178482055664062, "global_step": 498845, "epoch": 6010} {"train_loss": -27.02486228942871, "global_step": 498846, "epoch": 6010} {"train_loss": -27.057788848876953, "global_step": 498847, "epoch": 6010} {"train_loss": -27.05293083190918, "global_step": 498848, "epoch": 6010} {"train_loss": -27.12045669555664, "global_step": 498849, "epoch": 6010} {"train_loss": -27.507831573486328, "global_step": 498850, "epoch": 6010} {"train_loss": -27.627979278564453, "global_step": 498851, "epoch": 6010} {"train_loss": -27.253026962280273, "global_step": 498852, "epoch": 6010} {"train_loss": -27.350086212158203, "global_step": 498853, "epoch": 6010} {"train_loss": -27.24989891052246, "global_step": 498854, "epoch": 6010} {"train_loss": -27.3479061126709, "global_step": 498855, "epoch": 6010} {"train_loss": -27.495285034179688, "global_step": 498856, "epoch": 6010} {"train_loss": -27.0312442779541, "global_step": 498857, "epoch": 6010} {"train_loss": -27.722274780273438, "global_step": 498858, "epoch": 6010} {"train_loss": -27.068103790283203, "global_step": 498859, "epoch": 6010} {"train_loss": -27.128711700439453, "global_step": 498860, "epoch": 6010} {"train_loss": -27.376266479492188, "global_step": 498861, "epoch": 6010} {"train_loss": -27.259674072265625, "global_step": 498862, "epoch": 6010} {"train_loss": -27.29389762878418, "global_step": 498863, "epoch": 6010} {"train_loss": -27.55584144592285, "global_step": 498864, "epoch": 6010} {"train_loss": -27.237720489501953, "global_step": 498865, "epoch": 6010} {"train_loss": -27.231698989868164, "global_step": 498866, "epoch": 6010} {"train_loss": -27.464313507080078, "global_step": 498867, "epoch": 6010} {"train_loss": -27.536279678344727, "global_step": 498868, "epoch": 6010} {"train_loss": -27.532190322875977, "global_step": 498869, "epoch": 6010} {"train_loss": -27.807287216186523, "global_step": 498870, "epoch": 6010} {"train_loss": -27.594186782836914, "global_step": 498871, "epoch": 6010} {"train_loss": -27.654754638671875, "global_step": 498872, "epoch": 6010} {"train_loss": -27.37666130065918, "global_step": 498873, "epoch": 6010} {"train_loss": -27.822498321533203, "global_step": 498874, "epoch": 6010} {"train_loss": -27.426679611206055, "global_step": 498875, "epoch": 6010} {"train_loss": -27.547683715820312, "global_step": 498876, "epoch": 6010} {"train_loss": -27.48992347717285, "global_step": 498877, "epoch": 6010} {"train_loss": -26.86800193786621, "global_step": 498878, "epoch": 6010} {"train_loss": -27.504621505737305, "global_step": 498879, "epoch": 6010} {"train_loss": -27.5183162689209, "global_step": 498880, "epoch": 6010} {"train_loss": -27.5555362701416, "global_step": 498881, "epoch": 6010} {"train_loss": -27.66162109375, "global_step": 498882, "epoch": 6010} {"train_loss": -27.86164665222168, "global_step": 498883, "epoch": 6010} {"train_loss": -27.471099853515625, "global_step": 498884, "epoch": 6010} {"train_loss": -27.16318702697754, "global_step": 498885, "epoch": 6010} {"train_loss": -26.512802124023438, "global_step": 498886, "epoch": 6010} {"train_loss": -27.083776473999023, "global_step": 498887, "epoch": 6010} {"train_loss": -27.484790802001953, "global_step": 498888, "epoch": 6010} {"train_loss": -27.226171493530273, "global_step": 498889, "epoch": 6010} {"train_loss": -26.825910568237305, "global_step": 498890, "epoch": 6010} {"train_loss": -27.235492706298828, "global_step": 498891, "epoch": 6010} {"train_loss": -27.286218643188477, "global_step": 498892, "epoch": 6010} {"train_loss": -27.665027618408203, "global_step": 498893, "epoch": 6010} {"train_loss": -27.19866943359375, "global_step": 498894, "epoch": 6010} {"train_loss": -26.97010612487793, "global_step": 498895, "epoch": 6010} {"train_loss": -27.251562118530273, "global_step": 498896, "epoch": 6010} {"train_loss": -27.311384201049805, "global_step": 498897, "epoch": 6010} {"train_loss": -27.223556518554688, "global_step": 498898, "epoch": 6010} {"train_loss": -27.23079490661621, "global_step": 498899, "epoch": 6010} {"train_loss": -27.14859390258789, "global_step": 498900, "epoch": 6010} {"train_loss": -27.321157455444336, "global_step": 498901, "epoch": 6010} {"train_loss": -27.09205436706543, "global_step": 498902, "epoch": 6010} {"train_loss": -27.2060546875, "global_step": 498903, "epoch": 6010} {"train_loss": -27.27438735961914, "global_step": 498904, "epoch": 6010} {"train_loss": -27.4637451171875, "global_step": 498905, "epoch": 6010} {"train_loss": -27.351781845092773, "global_step": 498906, "epoch": 6010} {"train_loss": -27.14237403869629, "global_step": 498907, "epoch": 6010} {"train_loss": -27.44864845275879, "global_step": 498908, "epoch": 6010} {"train_loss": -27.611692428588867, "global_step": 498909, "epoch": 6010} {"train_loss": -27.034687042236328, "global_step": 498910, "epoch": 6010} {"train_loss": -26.942310333251953, "global_step": 498911, "epoch": 6010} {"train_loss": -27.300101337662664, "global_step": 498912, "epoch": 6010, "val_loss": 6674861.0} {"train_loss": -26.770221710205078, "global_step": 498913, "epoch": 6011} {"train_loss": -26.763141632080078, "global_step": 498914, "epoch": 6011} {"train_loss": -26.823896408081055, "global_step": 498915, "epoch": 6011} {"train_loss": -26.59756851196289, "global_step": 498916, "epoch": 6011} {"train_loss": -26.759246826171875, "global_step": 498917, "epoch": 6011} {"train_loss": -27.031003952026367, "global_step": 498918, "epoch": 6011} {"train_loss": -27.596601486206055, "global_step": 498919, "epoch": 6011} {"train_loss": -27.096088409423828, "global_step": 498920, "epoch": 6011} {"train_loss": -26.2777042388916, "global_step": 498921, "epoch": 6011} {"train_loss": -26.67264175415039, "global_step": 498922, "epoch": 6011} {"train_loss": -27.067285537719727, "global_step": 498923, "epoch": 6011} {"train_loss": -26.81581687927246, "global_step": 498924, "epoch": 6011} {"train_loss": -27.110761642456055, "global_step": 498925, "epoch": 6011} {"train_loss": -26.90703773498535, "global_step": 498926, "epoch": 6011} {"train_loss": -26.97025489807129, "global_step": 498927, "epoch": 6011} {"train_loss": -27.243682861328125, "global_step": 498928, "epoch": 6011} {"train_loss": -27.3129825592041, "global_step": 498929, "epoch": 6011} {"train_loss": -26.996591567993164, "global_step": 498930, "epoch": 6011} {"train_loss": -27.615102767944336, "global_step": 498931, "epoch": 6011} {"train_loss": -27.193578720092773, "global_step": 498932, "epoch": 6011} {"train_loss": -27.1694278717041, "global_step": 498933, "epoch": 6011} {"train_loss": -27.158935546875, "global_step": 498934, "epoch": 6011} {"train_loss": -26.826398849487305, "global_step": 498935, "epoch": 6011} {"train_loss": -27.237232208251953, "global_step": 498936, "epoch": 6011} {"train_loss": -27.554279327392578, "global_step": 498937, "epoch": 6011} {"train_loss": -27.446155548095703, "global_step": 498938, "epoch": 6011} {"train_loss": -27.577716827392578, "global_step": 498939, "epoch": 6011} {"train_loss": -27.143888473510742, "global_step": 498940, "epoch": 6011} {"train_loss": -27.212976455688477, "global_step": 498941, "epoch": 6011} {"train_loss": -27.4562931060791, "global_step": 498942, "epoch": 6011} {"train_loss": -27.306533813476562, "global_step": 498943, "epoch": 6011} {"train_loss": -27.853744506835938, "global_step": 498944, "epoch": 6011} {"train_loss": -27.660999298095703, "global_step": 498945, "epoch": 6011} {"train_loss": -27.45490074157715, "global_step": 498946, "epoch": 6011} {"train_loss": -27.447845458984375, "global_step": 498947, "epoch": 6011} {"train_loss": -27.562091827392578, "global_step": 498948, "epoch": 6011} {"train_loss": -27.48493003845215, "global_step": 498949, "epoch": 6011} {"train_loss": -27.5031681060791, "global_step": 498950, "epoch": 6011} {"train_loss": -27.086872100830078, "global_step": 498951, "epoch": 6011} {"train_loss": -27.74087905883789, "global_step": 498952, "epoch": 6011} {"train_loss": -27.58649253845215, "global_step": 498953, "epoch": 6011} {"train_loss": -27.17767906188965, "global_step": 498954, "epoch": 6011} {"train_loss": -27.30572509765625, "global_step": 498955, "epoch": 6011} {"train_loss": -27.159570693969727, "global_step": 498956, "epoch": 6011} {"train_loss": -27.529630661010742, "global_step": 498957, "epoch": 6011} {"train_loss": -27.248624801635742, "global_step": 498958, "epoch": 6011} {"train_loss": -27.4066219329834, "global_step": 498959, "epoch": 6011} {"train_loss": -27.31768226623535, "global_step": 498960, "epoch": 6011} {"train_loss": -27.376047134399414, "global_step": 498961, "epoch": 6011} {"train_loss": -27.375165939331055, "global_step": 498962, "epoch": 6011} {"train_loss": -27.48856544494629, "global_step": 498963, "epoch": 6011} {"train_loss": -26.907428741455078, "global_step": 498964, "epoch": 6011} {"train_loss": -27.383529663085938, "global_step": 498965, "epoch": 6011} {"train_loss": -27.323230743408203, "global_step": 498966, "epoch": 6011} {"train_loss": -27.056610107421875, "global_step": 498967, "epoch": 6011} {"train_loss": -27.771020889282227, "global_step": 498968, "epoch": 6011} {"train_loss": -27.62981605529785, "global_step": 498969, "epoch": 6011} {"train_loss": -27.478063583374023, "global_step": 498970, "epoch": 6011} {"train_loss": -27.542327880859375, "global_step": 498971, "epoch": 6011} {"train_loss": -27.3438720703125, "global_step": 498972, "epoch": 6011} {"train_loss": -27.18433952331543, "global_step": 498973, "epoch": 6011} {"train_loss": -27.32547378540039, "global_step": 498974, "epoch": 6011} {"train_loss": -27.042856216430664, "global_step": 498975, "epoch": 6011} {"train_loss": -26.96613883972168, "global_step": 498976, "epoch": 6011} {"train_loss": -27.2544002532959, "global_step": 498977, "epoch": 6011} {"train_loss": -27.6304931640625, "global_step": 498978, "epoch": 6011} {"train_loss": -27.26691246032715, "global_step": 498979, "epoch": 6011} {"train_loss": -27.39483642578125, "global_step": 498980, "epoch": 6011} {"train_loss": -27.601163864135742, "global_step": 498981, "epoch": 6011} {"train_loss": -27.321796417236328, "global_step": 498982, "epoch": 6011} {"train_loss": -27.179458618164062, "global_step": 498983, "epoch": 6011} {"train_loss": -27.597705841064453, "global_step": 498984, "epoch": 6011} {"train_loss": -27.796070098876953, "global_step": 498985, "epoch": 6011} {"train_loss": -27.298877716064453, "global_step": 498986, "epoch": 6011} {"train_loss": -27.326740264892578, "global_step": 498987, "epoch": 6011} {"train_loss": -27.318531036376953, "global_step": 498988, "epoch": 6011} {"train_loss": -27.197885513305664, "global_step": 498989, "epoch": 6011} {"train_loss": -27.332895278930664, "global_step": 498990, "epoch": 6011} {"train_loss": -27.384180068969727, "global_step": 498991, "epoch": 6011} {"train_loss": -27.577682495117188, "global_step": 498992, "epoch": 6011} {"train_loss": -27.665616989135742, "global_step": 498993, "epoch": 6011} {"train_loss": -27.226825714111328, "global_step": 498994, "epoch": 6011} {"train_loss": -27.29109901979745, "global_step": 498995, "epoch": 6011, "val_loss": 6606391.5} {"train_loss": -27.534503936767578, "global_step": 498996, "epoch": 6012} {"train_loss": -27.37114906311035, "global_step": 498997, "epoch": 6012} {"train_loss": -26.93668556213379, "global_step": 498998, "epoch": 6012} {"train_loss": -27.398847579956055, "global_step": 498999, "epoch": 6012} {"train_loss": -27.089139938354492, "global_step": 499000, "epoch": 6012} {"train_loss": -27.339984893798828, "global_step": 499001, "epoch": 6012} {"train_loss": -27.31012535095215, "global_step": 499002, "epoch": 6012} {"train_loss": -27.382558822631836, "global_step": 499003, "epoch": 6012} {"train_loss": -27.13323402404785, "global_step": 499004, "epoch": 6012} {"train_loss": -26.91225242614746, "global_step": 499005, "epoch": 6012} {"train_loss": -27.200468063354492, "global_step": 499006, "epoch": 6012} {"train_loss": -27.4820499420166, "global_step": 499007, "epoch": 6012} {"train_loss": -27.180099487304688, "global_step": 499008, "epoch": 6012} {"train_loss": -26.763656616210938, "global_step": 499009, "epoch": 6012} {"train_loss": -27.104450225830078, "global_step": 499010, "epoch": 6012} {"train_loss": -27.623977661132812, "global_step": 499011, "epoch": 6012} {"train_loss": -27.856124877929688, "global_step": 499012, "epoch": 6012} {"train_loss": -27.23726463317871, "global_step": 499013, "epoch": 6012} {"train_loss": -27.23237419128418, "global_step": 499014, "epoch": 6012} {"train_loss": -27.19814109802246, "global_step": 499015, "epoch": 6012} {"train_loss": -27.19547462463379, "global_step": 499016, "epoch": 6012} {"train_loss": -27.1553955078125, "global_step": 499017, "epoch": 6012} {"train_loss": -26.989255905151367, "global_step": 499018, "epoch": 6012} {"train_loss": -27.009374618530273, "global_step": 499019, "epoch": 6012} {"train_loss": -27.177600860595703, "global_step": 499020, "epoch": 6012} {"train_loss": -27.686975479125977, "global_step": 499021, "epoch": 6012} {"train_loss": -27.14995765686035, "global_step": 499022, "epoch": 6012} {"train_loss": -26.772754669189453, "global_step": 499023, "epoch": 6012} {"train_loss": -27.12152671813965, "global_step": 499024, "epoch": 6012} {"train_loss": -26.934736251831055, "global_step": 499025, "epoch": 6012} {"train_loss": -27.306982040405273, "global_step": 499026, "epoch": 6012} {"train_loss": -27.07313346862793, "global_step": 499027, "epoch": 6012} {"train_loss": -27.16518211364746, "global_step": 499028, "epoch": 6012} {"train_loss": -27.615697860717773, "global_step": 499029, "epoch": 6012} {"train_loss": -27.34864616394043, "global_step": 499030, "epoch": 6012} {"train_loss": -27.334360122680664, "global_step": 499031, "epoch": 6012} {"train_loss": -27.54334831237793, "global_step": 499032, "epoch": 6012} {"train_loss": -27.591358184814453, "global_step": 499033, "epoch": 6012} {"train_loss": -27.266698837280273, "global_step": 499034, "epoch": 6012} {"train_loss": -27.35316276550293, "global_step": 499035, "epoch": 6012} {"train_loss": -27.435333251953125, "global_step": 499036, "epoch": 6012} {"train_loss": -27.463031768798828, "global_step": 499037, "epoch": 6012} {"train_loss": -27.43361473083496, "global_step": 499038, "epoch": 6012} {"train_loss": -27.390018463134766, "global_step": 499039, "epoch": 6012} {"train_loss": -27.27829933166504, "global_step": 499040, "epoch": 6012} {"train_loss": -27.14020347595215, "global_step": 499041, "epoch": 6012} {"train_loss": -27.35883903503418, "global_step": 499042, "epoch": 6012} {"train_loss": -27.56479263305664, "global_step": 499043, "epoch": 6012} {"train_loss": -27.216217041015625, "global_step": 499044, "epoch": 6012} {"train_loss": -27.52039909362793, "global_step": 499045, "epoch": 6012} {"train_loss": -27.64576530456543, "global_step": 499046, "epoch": 6012} {"train_loss": -27.330469131469727, "global_step": 499047, "epoch": 6012} {"train_loss": -27.613245010375977, "global_step": 499048, "epoch": 6012} {"train_loss": -27.278106689453125, "global_step": 499049, "epoch": 6012} {"train_loss": -27.706995010375977, "global_step": 499050, "epoch": 6012} {"train_loss": -27.24460220336914, "global_step": 499051, "epoch": 6012} {"train_loss": -27.381927490234375, "global_step": 499052, "epoch": 6012} {"train_loss": -27.163105010986328, "global_step": 499053, "epoch": 6012} {"train_loss": -28.0085391998291, "global_step": 499054, "epoch": 6012} {"train_loss": -27.194543838500977, "global_step": 499055, "epoch": 6012} {"train_loss": -27.678543090820312, "global_step": 499056, "epoch": 6012} {"train_loss": -27.235727310180664, "global_step": 499057, "epoch": 6012} {"train_loss": -26.48602867126465, "global_step": 499058, "epoch": 6012} {"train_loss": -26.45256996154785, "global_step": 499059, "epoch": 6012} {"train_loss": -26.635395050048828, "global_step": 499060, "epoch": 6012} {"train_loss": -27.357009887695312, "global_step": 499061, "epoch": 6012} {"train_loss": -27.254779815673828, "global_step": 499062, "epoch": 6012} {"train_loss": -26.2386474609375, "global_step": 499063, "epoch": 6012} {"train_loss": -27.201440811157227, "global_step": 499064, "epoch": 6012} {"train_loss": -26.8330078125, "global_step": 499065, "epoch": 6012} {"train_loss": -27.301191329956055, "global_step": 499066, "epoch": 6012} {"train_loss": -26.757986068725586, "global_step": 499067, "epoch": 6012} {"train_loss": -26.701284408569336, "global_step": 499068, "epoch": 6012} {"train_loss": -27.01449966430664, "global_step": 499069, "epoch": 6012} {"train_loss": -27.246728897094727, "global_step": 499070, "epoch": 6012} {"train_loss": -26.91058349609375, "global_step": 499071, "epoch": 6012} {"train_loss": -27.083417892456055, "global_step": 499072, "epoch": 6012} {"train_loss": -27.150787353515625, "global_step": 499073, "epoch": 6012} {"train_loss": -27.3514347076416, "global_step": 499074, "epoch": 6012} {"train_loss": -27.114669799804688, "global_step": 499075, "epoch": 6012} {"train_loss": -26.889501571655273, "global_step": 499076, "epoch": 6012} {"train_loss": -26.655593872070312, "global_step": 499077, "epoch": 6012} {"train_loss": -27.226570956678277, "global_step": 499078, "epoch": 6012, "val_loss": 6646992.0} {"train_loss": -26.89093589782715, "global_step": 499079, "epoch": 6013} {"train_loss": -26.860151290893555, "global_step": 499080, "epoch": 6013} {"train_loss": -26.656408309936523, "global_step": 499081, "epoch": 6013} {"train_loss": -26.626571655273438, "global_step": 499082, "epoch": 6013} {"train_loss": -26.744882583618164, "global_step": 499083, "epoch": 6013} {"train_loss": -26.8975772857666, "global_step": 499084, "epoch": 6013} {"train_loss": -26.964380264282227, "global_step": 499085, "epoch": 6013} {"train_loss": -26.45485496520996, "global_step": 499086, "epoch": 6013} {"train_loss": -27.2117919921875, "global_step": 499087, "epoch": 6013} {"train_loss": -26.58503532409668, "global_step": 499088, "epoch": 6013} {"train_loss": -26.893964767456055, "global_step": 499089, "epoch": 6013} {"train_loss": -27.223913192749023, "global_step": 499090, "epoch": 6013} {"train_loss": -27.27239990234375, "global_step": 499091, "epoch": 6013} {"train_loss": -26.865833282470703, "global_step": 499092, "epoch": 6013} {"train_loss": -26.82171630859375, "global_step": 499093, "epoch": 6013} {"train_loss": -27.076292037963867, "global_step": 499094, "epoch": 6013} {"train_loss": -27.38117790222168, "global_step": 499095, "epoch": 6013} {"train_loss": -26.99720573425293, "global_step": 499096, "epoch": 6013} {"train_loss": -27.032541275024414, "global_step": 499097, "epoch": 6013} {"train_loss": -27.141666412353516, "global_step": 499098, "epoch": 6013} {"train_loss": -27.346343994140625, "global_step": 499099, "epoch": 6013} {"train_loss": -27.180944442749023, "global_step": 499100, "epoch": 6013} {"train_loss": -26.85626220703125, "global_step": 499101, "epoch": 6013} {"train_loss": -27.416528701782227, "global_step": 499102, "epoch": 6013} {"train_loss": -27.13404655456543, "global_step": 499103, "epoch": 6013} {"train_loss": -27.4171199798584, "global_step": 499104, "epoch": 6013} {"train_loss": -27.28543472290039, "global_step": 499105, "epoch": 6013} {"train_loss": -27.609394073486328, "global_step": 499106, "epoch": 6013} {"train_loss": -27.2096004486084, "global_step": 499107, "epoch": 6013} {"train_loss": -27.154882431030273, "global_step": 499108, "epoch": 6013} {"train_loss": -27.43072509765625, "global_step": 499109, "epoch": 6013} {"train_loss": -27.52561378479004, "global_step": 499110, "epoch": 6013} {"train_loss": -27.7344970703125, "global_step": 499111, "epoch": 6013} {"train_loss": -27.311609268188477, "global_step": 499112, "epoch": 6013} {"train_loss": -27.65769386291504, "global_step": 499113, "epoch": 6013} {"train_loss": -27.67275047302246, "global_step": 499114, "epoch": 6013} {"train_loss": -27.412368774414062, "global_step": 499115, "epoch": 6013} {"train_loss": -27.295751571655273, "global_step": 499116, "epoch": 6013} {"train_loss": -27.6508846282959, "global_step": 499117, "epoch": 6013} {"train_loss": -27.796228408813477, "global_step": 499118, "epoch": 6013} {"train_loss": -28.0366153717041, "global_step": 499119, "epoch": 6013} {"train_loss": -27.771230697631836, "global_step": 499120, "epoch": 6013} {"train_loss": -27.330286026000977, "global_step": 499121, "epoch": 6013} {"train_loss": -27.642414093017578, "global_step": 499122, "epoch": 6013} {"train_loss": -27.518634796142578, "global_step": 499123, "epoch": 6013} {"train_loss": -27.768789291381836, "global_step": 499124, "epoch": 6013} {"train_loss": -27.521970748901367, "global_step": 499125, "epoch": 6013} {"train_loss": -28.10906410217285, "global_step": 499126, "epoch": 6013} {"train_loss": -27.395124435424805, "global_step": 499127, "epoch": 6013} {"train_loss": -27.29572105407715, "global_step": 499128, "epoch": 6013} {"train_loss": -27.32270622253418, "global_step": 499129, "epoch": 6013} {"train_loss": -26.822036743164062, "global_step": 499130, "epoch": 6013} {"train_loss": -26.2519588470459, "global_step": 499131, "epoch": 6013} {"train_loss": -26.23154067993164, "global_step": 499132, "epoch": 6013} {"train_loss": -26.797754287719727, "global_step": 499133, "epoch": 6013} {"train_loss": -27.044692993164062, "global_step": 499134, "epoch": 6013} {"train_loss": -27.0186767578125, "global_step": 499135, "epoch": 6013} {"train_loss": -27.38869285583496, "global_step": 499136, "epoch": 6013} {"train_loss": -27.003070831298828, "global_step": 499137, "epoch": 6013} {"train_loss": -27.972461700439453, "global_step": 499138, "epoch": 6013} {"train_loss": -27.128265380859375, "global_step": 499139, "epoch": 6013} {"train_loss": -27.752609252929688, "global_step": 499140, "epoch": 6013} {"train_loss": -27.368976593017578, "global_step": 499141, "epoch": 6013} {"train_loss": -27.1657657623291, "global_step": 499142, "epoch": 6013} {"train_loss": -27.58087158203125, "global_step": 499143, "epoch": 6013} {"train_loss": -26.982458114624023, "global_step": 499144, "epoch": 6013} {"train_loss": -27.046445846557617, "global_step": 499145, "epoch": 6013} {"train_loss": -27.603839874267578, "global_step": 499146, "epoch": 6013} {"train_loss": -27.488666534423828, "global_step": 499147, "epoch": 6013} {"train_loss": -27.301122665405273, "global_step": 499148, "epoch": 6013} {"train_loss": -26.834760665893555, "global_step": 499149, "epoch": 6013} {"train_loss": -27.203222274780273, "global_step": 499150, "epoch": 6013} {"train_loss": -27.040847778320312, "global_step": 499151, "epoch": 6013} {"train_loss": -27.41525650024414, "global_step": 499152, "epoch": 6013} {"train_loss": -27.399328231811523, "global_step": 499153, "epoch": 6013} {"train_loss": -27.13422966003418, "global_step": 499154, "epoch": 6013} {"train_loss": -27.5145263671875, "global_step": 499155, "epoch": 6013} {"train_loss": -27.339086532592773, "global_step": 499156, "epoch": 6013} {"train_loss": -27.53464126586914, "global_step": 499157, "epoch": 6013} {"train_loss": -27.60492515563965, "global_step": 499158, "epoch": 6013} {"train_loss": -27.232894897460938, "global_step": 499159, "epoch": 6013} {"train_loss": -27.3217830657959, "global_step": 499160, "epoch": 6013} {"train_loss": -27.24216943763825, "global_step": 499161, "epoch": 6013, "val_loss": 6675864.5} {"train_loss": -27.067962646484375, "global_step": 499162, "epoch": 6014} {"train_loss": -27.072067260742188, "global_step": 499163, "epoch": 6014} {"train_loss": -26.935094833374023, "global_step": 499164, "epoch": 6014} {"train_loss": -27.170623779296875, "global_step": 499165, "epoch": 6014} {"train_loss": -26.957416534423828, "global_step": 499166, "epoch": 6014} {"train_loss": -26.7723445892334, "global_step": 499167, "epoch": 6014} {"train_loss": -27.442676544189453, "global_step": 499168, "epoch": 6014} {"train_loss": -26.9845027923584, "global_step": 499169, "epoch": 6014} {"train_loss": -26.96240234375, "global_step": 499170, "epoch": 6014} {"train_loss": -27.22292137145996, "global_step": 499171, "epoch": 6014} {"train_loss": -27.1572208404541, "global_step": 499172, "epoch": 6014} {"train_loss": -27.550512313842773, "global_step": 499173, "epoch": 6014} {"train_loss": -27.237030029296875, "global_step": 499174, "epoch": 6014} {"train_loss": -27.059906005859375, "global_step": 499175, "epoch": 6014} {"train_loss": -27.195886611938477, "global_step": 499176, "epoch": 6014} {"train_loss": -27.598602294921875, "global_step": 499177, "epoch": 6014} {"train_loss": -27.32535743713379, "global_step": 499178, "epoch": 6014} {"train_loss": -26.949462890625, "global_step": 499179, "epoch": 6014} {"train_loss": -27.17474365234375, "global_step": 499180, "epoch": 6014} {"train_loss": -27.199935913085938, "global_step": 499181, "epoch": 6014} {"train_loss": -27.731714248657227, "global_step": 499182, "epoch": 6014} {"train_loss": -27.192245483398438, "global_step": 499183, "epoch": 6014} {"train_loss": -27.78578758239746, "global_step": 499184, "epoch": 6014} {"train_loss": -27.482666015625, "global_step": 499185, "epoch": 6014} {"train_loss": -27.698110580444336, "global_step": 499186, "epoch": 6014} {"train_loss": -27.417821884155273, "global_step": 499187, "epoch": 6014} {"train_loss": -27.501108169555664, "global_step": 499188, "epoch": 6014} {"train_loss": -27.440229415893555, "global_step": 499189, "epoch": 6014} {"train_loss": -27.350936889648438, "global_step": 499190, "epoch": 6014} {"train_loss": -27.6568546295166, "global_step": 499191, "epoch": 6014} {"train_loss": -27.536596298217773, "global_step": 499192, "epoch": 6014} {"train_loss": -27.644739151000977, "global_step": 499193, "epoch": 6014} {"train_loss": -27.75725746154785, "global_step": 499194, "epoch": 6014} {"train_loss": -27.735198974609375, "global_step": 499195, "epoch": 6014} {"train_loss": -27.69563865661621, "global_step": 499196, "epoch": 6014} {"train_loss": -27.584064483642578, "global_step": 499197, "epoch": 6014} {"train_loss": -27.35560417175293, "global_step": 499198, "epoch": 6014} {"train_loss": -27.123361587524414, "global_step": 499199, "epoch": 6014} {"train_loss": -27.733747482299805, "global_step": 499200, "epoch": 6014} {"train_loss": -27.458219528198242, "global_step": 499201, "epoch": 6014} {"train_loss": -27.61520767211914, "global_step": 499202, "epoch": 6014} {"train_loss": -27.460412979125977, "global_step": 499203, "epoch": 6014} {"train_loss": -27.507516860961914, "global_step": 499204, "epoch": 6014} {"train_loss": -27.39515495300293, "global_step": 499205, "epoch": 6014} {"train_loss": -27.194000244140625, "global_step": 499206, "epoch": 6014} {"train_loss": -27.354084014892578, "global_step": 499207, "epoch": 6014} {"train_loss": -27.4036865234375, "global_step": 499208, "epoch": 6014} {"train_loss": -27.418228149414062, "global_step": 499209, "epoch": 6014} {"train_loss": -27.11417007446289, "global_step": 499210, "epoch": 6014} {"train_loss": -27.3176212310791, "global_step": 499211, "epoch": 6014} {"train_loss": -27.27203941345215, "global_step": 499212, "epoch": 6014} {"train_loss": -26.7978515625, "global_step": 499213, "epoch": 6014} {"train_loss": -27.291336059570312, "global_step": 499214, "epoch": 6014} {"train_loss": -27.412267684936523, "global_step": 499215, "epoch": 6014} {"train_loss": -27.37823486328125, "global_step": 499216, "epoch": 6014} {"train_loss": -27.276763916015625, "global_step": 499217, "epoch": 6014} {"train_loss": -27.6820011138916, "global_step": 499218, "epoch": 6014} {"train_loss": -27.322528839111328, "global_step": 499219, "epoch": 6014} {"train_loss": -27.360748291015625, "global_step": 499220, "epoch": 6014} {"train_loss": -27.225133895874023, "global_step": 499221, "epoch": 6014} {"train_loss": -27.367048263549805, "global_step": 499222, "epoch": 6014} {"train_loss": -27.373620986938477, "global_step": 499223, "epoch": 6014} {"train_loss": -27.610275268554688, "global_step": 499224, "epoch": 6014} {"train_loss": -27.289880752563477, "global_step": 499225, "epoch": 6014} {"train_loss": -27.14410972595215, "global_step": 499226, "epoch": 6014} {"train_loss": -27.27675437927246, "global_step": 499227, "epoch": 6014} {"train_loss": -27.617401123046875, "global_step": 499228, "epoch": 6014} {"train_loss": -27.444473266601562, "global_step": 499229, "epoch": 6014} {"train_loss": -27.478668212890625, "global_step": 499230, "epoch": 6014} {"train_loss": -27.407245635986328, "global_step": 499231, "epoch": 6014} {"train_loss": -27.304492950439453, "global_step": 499232, "epoch": 6014} {"train_loss": -27.661579132080078, "global_step": 499233, "epoch": 6014} {"train_loss": -27.20513916015625, "global_step": 499234, "epoch": 6014} {"train_loss": -27.302978515625, "global_step": 499235, "epoch": 6014} {"train_loss": -27.304203033447266, "global_step": 499236, "epoch": 6014} {"train_loss": -27.695789337158203, "global_step": 499237, "epoch": 6014} {"train_loss": -27.821735382080078, "global_step": 499238, "epoch": 6014} {"train_loss": -27.435901641845703, "global_step": 499239, "epoch": 6014} {"train_loss": -27.648527145385742, "global_step": 499240, "epoch": 6014} {"train_loss": -27.56570816040039, "global_step": 499241, "epoch": 6014} {"train_loss": -27.523334503173828, "global_step": 499242, "epoch": 6014} {"train_loss": -27.471969604492188, "global_step": 499243, "epoch": 6014} {"train_loss": -27.380748404077735, "global_step": 499244, "epoch": 6014, "val_loss": 6688118.0} {"train_loss": -26.320737838745117, "global_step": 499245, "epoch": 6015} {"train_loss": -25.40546226501465, "global_step": 499246, "epoch": 6015} {"train_loss": -25.394622802734375, "global_step": 499247, "epoch": 6015} {"train_loss": -26.524011611938477, "global_step": 499248, "epoch": 6015} {"train_loss": -26.482990264892578, "global_step": 499249, "epoch": 6015} {"train_loss": -26.186140060424805, "global_step": 499250, "epoch": 6015} {"train_loss": -27.10346794128418, "global_step": 499251, "epoch": 6015} {"train_loss": -26.45734977722168, "global_step": 499252, "epoch": 6015} {"train_loss": -26.916187286376953, "global_step": 499253, "epoch": 6015} {"train_loss": -26.478124618530273, "global_step": 499254, "epoch": 6015} {"train_loss": -26.628040313720703, "global_step": 499255, "epoch": 6015} {"train_loss": -26.6621150970459, "global_step": 499256, "epoch": 6015} {"train_loss": -26.68729019165039, "global_step": 499257, "epoch": 6015} {"train_loss": -26.662275314331055, "global_step": 499258, "epoch": 6015} {"train_loss": -26.8021240234375, "global_step": 499259, "epoch": 6015} {"train_loss": -26.877248764038086, "global_step": 499260, "epoch": 6015} {"train_loss": -27.1274356842041, "global_step": 499261, "epoch": 6015} {"train_loss": -27.395328521728516, "global_step": 499262, "epoch": 6015} {"train_loss": -26.976409912109375, "global_step": 499263, "epoch": 6015} {"train_loss": -27.02886962890625, "global_step": 499264, "epoch": 6015} {"train_loss": -27.1331787109375, "global_step": 499265, "epoch": 6015} {"train_loss": -27.291479110717773, "global_step": 499266, "epoch": 6015} {"train_loss": -26.82480812072754, "global_step": 499267, "epoch": 6015} {"train_loss": -27.00016212463379, "global_step": 499268, "epoch": 6015} {"train_loss": -27.195409774780273, "global_step": 499269, "epoch": 6015} {"train_loss": -26.93743324279785, "global_step": 499270, "epoch": 6015} {"train_loss": -27.092649459838867, "global_step": 499271, "epoch": 6015} {"train_loss": -27.123266220092773, "global_step": 499272, "epoch": 6015} {"train_loss": -27.388946533203125, "global_step": 499273, "epoch": 6015} {"train_loss": -27.26896095275879, "global_step": 499274, "epoch": 6015} {"train_loss": -26.971694946289062, "global_step": 499275, "epoch": 6015} {"train_loss": -27.173095703125, "global_step": 499276, "epoch": 6015} {"train_loss": -27.345605850219727, "global_step": 499277, "epoch": 6015} {"train_loss": -27.143787384033203, "global_step": 499278, "epoch": 6015} {"train_loss": -27.43922996520996, "global_step": 499279, "epoch": 6015} {"train_loss": -27.04837417602539, "global_step": 499280, "epoch": 6015} {"train_loss": -27.0813045501709, "global_step": 499281, "epoch": 6015} {"train_loss": -27.176258087158203, "global_step": 499282, "epoch": 6015} {"train_loss": -27.28596305847168, "global_step": 499283, "epoch": 6015} {"train_loss": -26.98822021484375, "global_step": 499284, "epoch": 6015} {"train_loss": -26.96099281311035, "global_step": 499285, "epoch": 6015} {"train_loss": -27.1019344329834, "global_step": 499286, "epoch": 6015} {"train_loss": -27.57355308532715, "global_step": 499287, "epoch": 6015} {"train_loss": -27.15033531188965, "global_step": 499288, "epoch": 6015} {"train_loss": -27.432144165039062, "global_step": 499289, "epoch": 6015} {"train_loss": -27.185321807861328, "global_step": 499290, "epoch": 6015} {"train_loss": -27.644412994384766, "global_step": 499291, "epoch": 6015} {"train_loss": -27.35190773010254, "global_step": 499292, "epoch": 6015} {"train_loss": -27.680578231811523, "global_step": 499293, "epoch": 6015} {"train_loss": -27.3262882232666, "global_step": 499294, "epoch": 6015} {"train_loss": -27.28888511657715, "global_step": 499295, "epoch": 6015} {"train_loss": -27.4132022857666, "global_step": 499296, "epoch": 6015} {"train_loss": -27.256696701049805, "global_step": 499297, "epoch": 6015} {"train_loss": -27.6173038482666, "global_step": 499298, "epoch": 6015} {"train_loss": -27.528661727905273, "global_step": 499299, "epoch": 6015} {"train_loss": -27.151769638061523, "global_step": 499300, "epoch": 6015} {"train_loss": -27.292333602905273, "global_step": 499301, "epoch": 6015} {"train_loss": -27.24897575378418, "global_step": 499302, "epoch": 6015} {"train_loss": -27.782407760620117, "global_step": 499303, "epoch": 6015} {"train_loss": -27.770893096923828, "global_step": 499304, "epoch": 6015} {"train_loss": -27.540185928344727, "global_step": 499305, "epoch": 6015} {"train_loss": -27.426233291625977, "global_step": 499306, "epoch": 6015} {"train_loss": -27.4565372467041, "global_step": 499307, "epoch": 6015} {"train_loss": -27.324493408203125, "global_step": 499308, "epoch": 6015} {"train_loss": -27.115161895751953, "global_step": 499309, "epoch": 6015} {"train_loss": -27.63313102722168, "global_step": 499310, "epoch": 6015} {"train_loss": -27.36931800842285, "global_step": 499311, "epoch": 6015} {"train_loss": -27.616199493408203, "global_step": 499312, "epoch": 6015} {"train_loss": -27.132410049438477, "global_step": 499313, "epoch": 6015} {"train_loss": -27.30478858947754, "global_step": 499314, "epoch": 6015} {"train_loss": -27.48121452331543, "global_step": 499315, "epoch": 6015} {"train_loss": -27.477741241455078, "global_step": 499316, "epoch": 6015} {"train_loss": -27.46137046813965, "global_step": 499317, "epoch": 6015} {"train_loss": -26.614948272705078, "global_step": 499318, "epoch": 6015} {"train_loss": -26.86952018737793, "global_step": 499319, "epoch": 6015} {"train_loss": -27.430072784423828, "global_step": 499320, "epoch": 6015} {"train_loss": -27.54833984375, "global_step": 499321, "epoch": 6015} {"train_loss": -27.387113571166992, "global_step": 499322, "epoch": 6015} {"train_loss": -27.892919540405273, "global_step": 499323, "epoch": 6015} {"train_loss": -27.233753204345703, "global_step": 499324, "epoch": 6015} {"train_loss": -27.5717716217041, "global_step": 499325, "epoch": 6015} {"train_loss": -27.473302841186523, "global_step": 499326, "epoch": 6015} {"train_loss": -27.132434270468103, "global_step": 499327, "epoch": 6015, "val_loss": 6711914.0} {"train_loss": -27.24171257019043, "global_step": 499328, "epoch": 6016} {"train_loss": -26.441287994384766, "global_step": 499329, "epoch": 6016} {"train_loss": -27.359365463256836, "global_step": 499330, "epoch": 6016} {"train_loss": -26.64698600769043, "global_step": 499331, "epoch": 6016} {"train_loss": -26.934919357299805, "global_step": 499332, "epoch": 6016} {"train_loss": -26.425739288330078, "global_step": 499333, "epoch": 6016} {"train_loss": -26.710386276245117, "global_step": 499334, "epoch": 6016} {"train_loss": -26.88945960998535, "global_step": 499335, "epoch": 6016} {"train_loss": -26.740009307861328, "global_step": 499336, "epoch": 6016} {"train_loss": -26.964460372924805, "global_step": 499337, "epoch": 6016} {"train_loss": -26.3572940826416, "global_step": 499338, "epoch": 6016} {"train_loss": -27.216278076171875, "global_step": 499339, "epoch": 6016} {"train_loss": -27.29603385925293, "global_step": 499340, "epoch": 6016} {"train_loss": -27.23468017578125, "global_step": 499341, "epoch": 6016} {"train_loss": -27.08194351196289, "global_step": 499342, "epoch": 6016} {"train_loss": -26.865060806274414, "global_step": 499343, "epoch": 6016} {"train_loss": -27.13236427307129, "global_step": 499344, "epoch": 6016} {"train_loss": -27.269575119018555, "global_step": 499345, "epoch": 6016} {"train_loss": -26.77484130859375, "global_step": 499346, "epoch": 6016} {"train_loss": -27.35434341430664, "global_step": 499347, "epoch": 6016} {"train_loss": -27.520578384399414, "global_step": 499348, "epoch": 6016} {"train_loss": -27.632925033569336, "global_step": 499349, "epoch": 6016} {"train_loss": -27.131250381469727, "global_step": 499350, "epoch": 6016} {"train_loss": -27.181432723999023, "global_step": 499351, "epoch": 6016} {"train_loss": -27.517465591430664, "global_step": 499352, "epoch": 6016} {"train_loss": -27.48187255859375, "global_step": 499353, "epoch": 6016} {"train_loss": -27.52685546875, "global_step": 499354, "epoch": 6016} {"train_loss": -27.648263931274414, "global_step": 499355, "epoch": 6016} {"train_loss": -27.493152618408203, "global_step": 499356, "epoch": 6016} {"train_loss": -27.481359481811523, "global_step": 499357, "epoch": 6016} {"train_loss": -27.3355655670166, "global_step": 499358, "epoch": 6016} {"train_loss": -27.464277267456055, "global_step": 499359, "epoch": 6016} {"train_loss": -27.274351119995117, "global_step": 499360, "epoch": 6016} {"train_loss": -27.57196617126465, "global_step": 499361, "epoch": 6016} {"train_loss": -27.47477149963379, "global_step": 499362, "epoch": 6016} {"train_loss": -27.49904441833496, "global_step": 499363, "epoch": 6016} {"train_loss": -27.37946891784668, "global_step": 499364, "epoch": 6016} {"train_loss": -27.327077865600586, "global_step": 499365, "epoch": 6016} {"train_loss": -27.295820236206055, "global_step": 499366, "epoch": 6016} {"train_loss": -27.60361099243164, "global_step": 499367, "epoch": 6016} {"train_loss": -27.626758575439453, "global_step": 499368, "epoch": 6016} {"train_loss": -27.718420028686523, "global_step": 499369, "epoch": 6016} {"train_loss": -27.343957901000977, "global_step": 499370, "epoch": 6016} {"train_loss": -27.157779693603516, "global_step": 499371, "epoch": 6016} {"train_loss": -27.665760040283203, "global_step": 499372, "epoch": 6016} {"train_loss": -27.680999755859375, "global_step": 499373, "epoch": 6016} {"train_loss": -27.29243278503418, "global_step": 499374, "epoch": 6016} {"train_loss": -26.662769317626953, "global_step": 499375, "epoch": 6016} {"train_loss": -27.543466567993164, "global_step": 499376, "epoch": 6016} {"train_loss": -27.682132720947266, "global_step": 499377, "epoch": 6016} {"train_loss": -27.432477951049805, "global_step": 499378, "epoch": 6016} {"train_loss": -27.38479995727539, "global_step": 499379, "epoch": 6016} {"train_loss": -27.34291648864746, "global_step": 499380, "epoch": 6016} {"train_loss": -27.535123825073242, "global_step": 499381, "epoch": 6016} {"train_loss": -27.18800163269043, "global_step": 499382, "epoch": 6016} {"train_loss": -27.53999137878418, "global_step": 499383, "epoch": 6016} {"train_loss": -27.42022132873535, "global_step": 499384, "epoch": 6016} {"train_loss": -27.635009765625, "global_step": 499385, "epoch": 6016} {"train_loss": -27.127399444580078, "global_step": 499386, "epoch": 6016} {"train_loss": -27.5391845703125, "global_step": 499387, "epoch": 6016} {"train_loss": -27.592748641967773, "global_step": 499388, "epoch": 6016} {"train_loss": -27.257482528686523, "global_step": 499389, "epoch": 6016} {"train_loss": -27.590856552124023, "global_step": 499390, "epoch": 6016} {"train_loss": -27.26995849609375, "global_step": 499391, "epoch": 6016} {"train_loss": -27.24627685546875, "global_step": 499392, "epoch": 6016} {"train_loss": -27.276519775390625, "global_step": 499393, "epoch": 6016} {"train_loss": -26.761194229125977, "global_step": 499394, "epoch": 6016} {"train_loss": -27.5443172454834, "global_step": 499395, "epoch": 6016} {"train_loss": -27.6855411529541, "global_step": 499396, "epoch": 6016} {"train_loss": -27.319019317626953, "global_step": 499397, "epoch": 6016} {"train_loss": -27.097753524780273, "global_step": 499398, "epoch": 6016} {"train_loss": -27.439062118530273, "global_step": 499399, "epoch": 6016} {"train_loss": -27.696191787719727, "global_step": 499400, "epoch": 6016} {"train_loss": -27.344839096069336, "global_step": 499401, "epoch": 6016} {"train_loss": -27.36211585998535, "global_step": 499402, "epoch": 6016} {"train_loss": -27.330047607421875, "global_step": 499403, "epoch": 6016} {"train_loss": -27.46002769470215, "global_step": 499404, "epoch": 6016} {"train_loss": -27.247217178344727, "global_step": 499405, "epoch": 6016} {"train_loss": -27.623498916625977, "global_step": 499406, "epoch": 6016} {"train_loss": -27.68214225769043, "global_step": 499407, "epoch": 6016} {"train_loss": -27.48097038269043, "global_step": 499408, "epoch": 6016} {"train_loss": -27.77512550354004, "global_step": 499409, "epoch": 6016} {"train_loss": -27.333328453891248, "global_step": 499410, "epoch": 6016, "val_loss": 6653851.0} {"train_loss": -27.114124298095703, "global_step": 499411, "epoch": 6017} {"train_loss": -26.958600997924805, "global_step": 499412, "epoch": 6017} {"train_loss": -25.86408805847168, "global_step": 499413, "epoch": 6017} {"train_loss": -23.97492027282715, "global_step": 499414, "epoch": 6017} {"train_loss": -23.998273849487305, "global_step": 499415, "epoch": 6017} {"train_loss": -26.201871871948242, "global_step": 499416, "epoch": 6017} {"train_loss": -26.169660568237305, "global_step": 499417, "epoch": 6017} {"train_loss": -26.311670303344727, "global_step": 499418, "epoch": 6017} {"train_loss": -26.102888107299805, "global_step": 499419, "epoch": 6017} {"train_loss": -26.912765502929688, "global_step": 499420, "epoch": 6017} {"train_loss": -26.21170425415039, "global_step": 499421, "epoch": 6017} {"train_loss": -26.598758697509766, "global_step": 499422, "epoch": 6017} {"train_loss": -27.122461318969727, "global_step": 499423, "epoch": 6017} {"train_loss": -26.375158309936523, "global_step": 499424, "epoch": 6017} {"train_loss": -26.6575870513916, "global_step": 499425, "epoch": 6017} {"train_loss": -26.873380661010742, "global_step": 499426, "epoch": 6017} {"train_loss": -26.525739669799805, "global_step": 499427, "epoch": 6017} {"train_loss": -27.175739288330078, "global_step": 499428, "epoch": 6017} {"train_loss": -26.782846450805664, "global_step": 499429, "epoch": 6017} {"train_loss": -26.751373291015625, "global_step": 499430, "epoch": 6017} {"train_loss": -26.82086753845215, "global_step": 499431, "epoch": 6017} {"train_loss": -27.09077262878418, "global_step": 499432, "epoch": 6017} {"train_loss": -27.114221572875977, "global_step": 499433, "epoch": 6017} {"train_loss": -26.860565185546875, "global_step": 499434, "epoch": 6017} {"train_loss": -26.980817794799805, "global_step": 499435, "epoch": 6017} {"train_loss": -26.809064865112305, "global_step": 499436, "epoch": 6017} {"train_loss": -27.21986961364746, "global_step": 499437, "epoch": 6017} {"train_loss": -27.023107528686523, "global_step": 499438, "epoch": 6017} {"train_loss": -27.282995223999023, "global_step": 499439, "epoch": 6017} {"train_loss": -27.552841186523438, "global_step": 499440, "epoch": 6017} {"train_loss": -26.85466957092285, "global_step": 499441, "epoch": 6017} {"train_loss": -27.324979782104492, "global_step": 499442, "epoch": 6017} {"train_loss": -26.971418380737305, "global_step": 499443, "epoch": 6017} {"train_loss": -27.273900985717773, "global_step": 499444, "epoch": 6017} {"train_loss": -26.808317184448242, "global_step": 499445, "epoch": 6017} {"train_loss": -27.3544864654541, "global_step": 499446, "epoch": 6017} {"train_loss": -26.946304321289062, "global_step": 499447, "epoch": 6017} {"train_loss": -27.160491943359375, "global_step": 499448, "epoch": 6017} {"train_loss": -27.258962631225586, "global_step": 499449, "epoch": 6017} {"train_loss": -27.159748077392578, "global_step": 499450, "epoch": 6017} {"train_loss": -27.111066818237305, "global_step": 499451, "epoch": 6017} {"train_loss": -27.395221710205078, "global_step": 499452, "epoch": 6017} {"train_loss": -27.031463623046875, "global_step": 499453, "epoch": 6017} {"train_loss": -27.377660751342773, "global_step": 499454, "epoch": 6017} {"train_loss": -27.422727584838867, "global_step": 499455, "epoch": 6017} {"train_loss": -27.63300132751465, "global_step": 499456, "epoch": 6017} {"train_loss": -27.147668838500977, "global_step": 499457, "epoch": 6017} {"train_loss": -27.49802589416504, "global_step": 499458, "epoch": 6017} {"train_loss": -27.73921012878418, "global_step": 499459, "epoch": 6017} {"train_loss": -27.415380477905273, "global_step": 499460, "epoch": 6017} {"train_loss": -27.073667526245117, "global_step": 499461, "epoch": 6017} {"train_loss": -27.18402099609375, "global_step": 499462, "epoch": 6017} {"train_loss": -27.50115394592285, "global_step": 499463, "epoch": 6017} {"train_loss": -27.08416748046875, "global_step": 499464, "epoch": 6017} {"train_loss": -27.404813766479492, "global_step": 499465, "epoch": 6017} {"train_loss": -27.440656661987305, "global_step": 499466, "epoch": 6017} {"train_loss": -27.800613403320312, "global_step": 499467, "epoch": 6017} {"train_loss": -27.450485229492188, "global_step": 499468, "epoch": 6017} {"train_loss": -27.500919342041016, "global_step": 499469, "epoch": 6017} {"train_loss": -27.034936904907227, "global_step": 499470, "epoch": 6017} {"train_loss": -27.519811630249023, "global_step": 499471, "epoch": 6017} {"train_loss": -27.376296997070312, "global_step": 499472, "epoch": 6017} {"train_loss": -27.848352432250977, "global_step": 499473, "epoch": 6017} {"train_loss": -27.504608154296875, "global_step": 499474, "epoch": 6017} {"train_loss": -27.354833602905273, "global_step": 499475, "epoch": 6017} {"train_loss": -27.753698348999023, "global_step": 499476, "epoch": 6017} {"train_loss": -27.16180419921875, "global_step": 499477, "epoch": 6017} {"train_loss": -27.721521377563477, "global_step": 499478, "epoch": 6017} {"train_loss": -27.302167892456055, "global_step": 499479, "epoch": 6017} {"train_loss": -27.74662208557129, "global_step": 499480, "epoch": 6017} {"train_loss": -27.32557487487793, "global_step": 499481, "epoch": 6017} {"train_loss": -27.5233211517334, "global_step": 499482, "epoch": 6017} {"train_loss": -27.682458877563477, "global_step": 499483, "epoch": 6017} {"train_loss": -27.646015167236328, "global_step": 499484, "epoch": 6017} {"train_loss": -27.692663192749023, "global_step": 499485, "epoch": 6017} {"train_loss": -27.3245849609375, "global_step": 499486, "epoch": 6017} {"train_loss": -27.343250274658203, "global_step": 499487, "epoch": 6017} {"train_loss": -27.710554122924805, "global_step": 499488, "epoch": 6017} {"train_loss": -27.355560302734375, "global_step": 499489, "epoch": 6017} {"train_loss": -27.803466796875, "global_step": 499490, "epoch": 6017} {"train_loss": -27.790292739868164, "global_step": 499491, "epoch": 6017} {"train_loss": -27.61824607849121, "global_step": 499492, "epoch": 6017} {"train_loss": -27.091417404542486, "global_step": 499493, "epoch": 6017, "val_loss": 6734933.0} {"train_loss": -26.469152450561523, "global_step": 499494, "epoch": 6018} {"train_loss": -26.024972915649414, "global_step": 499495, "epoch": 6018} {"train_loss": -26.33807373046875, "global_step": 499496, "epoch": 6018} {"train_loss": -27.212121963500977, "global_step": 499497, "epoch": 6018} {"train_loss": -26.711721420288086, "global_step": 499498, "epoch": 6018} {"train_loss": -26.413543701171875, "global_step": 499499, "epoch": 6018} {"train_loss": -27.206350326538086, "global_step": 499500, "epoch": 6018} {"train_loss": -27.06618309020996, "global_step": 499501, "epoch": 6018} {"train_loss": -27.19233512878418, "global_step": 499502, "epoch": 6018} {"train_loss": -26.79792594909668, "global_step": 499503, "epoch": 6018} {"train_loss": -27.45047378540039, "global_step": 499504, "epoch": 6018} {"train_loss": -26.61993980407715, "global_step": 499505, "epoch": 6018} {"train_loss": -27.15069580078125, "global_step": 499506, "epoch": 6018} {"train_loss": -27.04743766784668, "global_step": 499507, "epoch": 6018} {"train_loss": -26.930145263671875, "global_step": 499508, "epoch": 6018} {"train_loss": -26.937423706054688, "global_step": 499509, "epoch": 6018} {"train_loss": -27.2716007232666, "global_step": 499510, "epoch": 6018} {"train_loss": -27.150699615478516, "global_step": 499511, "epoch": 6018} {"train_loss": -27.146167755126953, "global_step": 499512, "epoch": 6018} {"train_loss": -26.859760284423828, "global_step": 499513, "epoch": 6018} {"train_loss": -27.0582332611084, "global_step": 499514, "epoch": 6018} {"train_loss": -27.14339256286621, "global_step": 499515, "epoch": 6018} {"train_loss": -27.101104736328125, "global_step": 499516, "epoch": 6018} {"train_loss": -27.31092643737793, "global_step": 499517, "epoch": 6018} {"train_loss": -26.93011474609375, "global_step": 499518, "epoch": 6018} {"train_loss": -27.12387466430664, "global_step": 499519, "epoch": 6018} {"train_loss": -27.5505428314209, "global_step": 499520, "epoch": 6018} {"train_loss": -27.409727096557617, "global_step": 499521, "epoch": 6018} {"train_loss": -27.411136627197266, "global_step": 499522, "epoch": 6018} {"train_loss": -27.49102210998535, "global_step": 499523, "epoch": 6018} {"train_loss": -27.201948165893555, "global_step": 499524, "epoch": 6018} {"train_loss": -27.496002197265625, "global_step": 499525, "epoch": 6018} {"train_loss": -27.084741592407227, "global_step": 499526, "epoch": 6018} {"train_loss": -27.378372192382812, "global_step": 499527, "epoch": 6018} {"train_loss": -27.186254501342773, "global_step": 499528, "epoch": 6018} {"train_loss": -27.366865158081055, "global_step": 499529, "epoch": 6018} {"train_loss": -27.3405818939209, "global_step": 499530, "epoch": 6018} {"train_loss": -27.117578506469727, "global_step": 499531, "epoch": 6018} {"train_loss": -27.306289672851562, "global_step": 499532, "epoch": 6018} {"train_loss": -27.72389030456543, "global_step": 499533, "epoch": 6018} {"train_loss": -27.41912269592285, "global_step": 499534, "epoch": 6018} {"train_loss": -27.49042320251465, "global_step": 499535, "epoch": 6018} {"train_loss": -27.644765853881836, "global_step": 499536, "epoch": 6018} {"train_loss": -27.289066314697266, "global_step": 499537, "epoch": 6018} {"train_loss": -27.648761749267578, "global_step": 499538, "epoch": 6018} {"train_loss": -27.650617599487305, "global_step": 499539, "epoch": 6018} {"train_loss": -27.346479415893555, "global_step": 499540, "epoch": 6018} {"train_loss": -27.696165084838867, "global_step": 499541, "epoch": 6018} {"train_loss": -27.486175537109375, "global_step": 499542, "epoch": 6018} {"train_loss": -27.186628341674805, "global_step": 499543, "epoch": 6018} {"train_loss": -27.8698673248291, "global_step": 499544, "epoch": 6018} {"train_loss": -27.156591415405273, "global_step": 499545, "epoch": 6018} {"train_loss": -27.8084716796875, "global_step": 499546, "epoch": 6018} {"train_loss": -27.893415451049805, "global_step": 499547, "epoch": 6018} {"train_loss": -27.907215118408203, "global_step": 499548, "epoch": 6018} {"train_loss": -27.570667266845703, "global_step": 499549, "epoch": 6018} {"train_loss": -27.172178268432617, "global_step": 499550, "epoch": 6018} {"train_loss": -27.210025787353516, "global_step": 499551, "epoch": 6018} {"train_loss": -27.506732940673828, "global_step": 499552, "epoch": 6018} {"train_loss": -27.390954971313477, "global_step": 499553, "epoch": 6018} {"train_loss": -27.54758071899414, "global_step": 499554, "epoch": 6018} {"train_loss": -27.42545509338379, "global_step": 499555, "epoch": 6018} {"train_loss": -27.26791763305664, "global_step": 499556, "epoch": 6018} {"train_loss": -27.377197265625, "global_step": 499557, "epoch": 6018} {"train_loss": -27.609704971313477, "global_step": 499558, "epoch": 6018} {"train_loss": -27.7220458984375, "global_step": 499559, "epoch": 6018} {"train_loss": -27.386987686157227, "global_step": 499560, "epoch": 6018} {"train_loss": -27.462858200073242, "global_step": 499561, "epoch": 6018} {"train_loss": -27.397506713867188, "global_step": 499562, "epoch": 6018} {"train_loss": -27.331830978393555, "global_step": 499563, "epoch": 6018} {"train_loss": -26.97428321838379, "global_step": 499564, "epoch": 6018} {"train_loss": -27.07367515563965, "global_step": 499565, "epoch": 6018} {"train_loss": -27.270389556884766, "global_step": 499566, "epoch": 6018} {"train_loss": -27.530004501342773, "global_step": 499567, "epoch": 6018} {"train_loss": -27.430585861206055, "global_step": 499568, "epoch": 6018} {"train_loss": -27.04970359802246, "global_step": 499569, "epoch": 6018} {"train_loss": -27.582334518432617, "global_step": 499570, "epoch": 6018} {"train_loss": -27.436176300048828, "global_step": 499571, "epoch": 6018} {"train_loss": -27.509836196899414, "global_step": 499572, "epoch": 6018} {"train_loss": -27.17424964904785, "global_step": 499573, "epoch": 6018} {"train_loss": -27.609420776367188, "global_step": 499574, "epoch": 6018} {"train_loss": -27.448047637939453, "global_step": 499575, "epoch": 6018} {"train_loss": -27.290185170001294, "global_step": 499576, "epoch": 6018, "val_loss": 6711994.5} {"train_loss": -26.1492977142334, "global_step": 499577, "epoch": 6019} {"train_loss": -25.343402862548828, "global_step": 499578, "epoch": 6019} {"train_loss": -26.286575317382812, "global_step": 499579, "epoch": 6019} {"train_loss": -27.043249130249023, "global_step": 499580, "epoch": 6019} {"train_loss": -26.489126205444336, "global_step": 499581, "epoch": 6019} {"train_loss": -26.795719146728516, "global_step": 499582, "epoch": 6019} {"train_loss": -27.02488136291504, "global_step": 499583, "epoch": 6019} {"train_loss": -26.510339736938477, "global_step": 499584, "epoch": 6019} {"train_loss": -27.018613815307617, "global_step": 499585, "epoch": 6019} {"train_loss": -26.951501846313477, "global_step": 499586, "epoch": 6019} {"train_loss": -27.0675048828125, "global_step": 499587, "epoch": 6019} {"train_loss": -27.027692794799805, "global_step": 499588, "epoch": 6019} {"train_loss": -27.118371963500977, "global_step": 499589, "epoch": 6019} {"train_loss": -26.374256134033203, "global_step": 499590, "epoch": 6019} {"train_loss": -26.708541870117188, "global_step": 499591, "epoch": 6019} {"train_loss": -27.065582275390625, "global_step": 499592, "epoch": 6019} {"train_loss": -26.86187744140625, "global_step": 499593, "epoch": 6019} {"train_loss": -26.967880249023438, "global_step": 499594, "epoch": 6019} {"train_loss": -26.939239501953125, "global_step": 499595, "epoch": 6019} {"train_loss": -26.691099166870117, "global_step": 499596, "epoch": 6019} {"train_loss": -27.203784942626953, "global_step": 499597, "epoch": 6019} {"train_loss": -26.843570709228516, "global_step": 499598, "epoch": 6019} {"train_loss": -27.245697021484375, "global_step": 499599, "epoch": 6019} {"train_loss": -27.19563102722168, "global_step": 499600, "epoch": 6019} {"train_loss": -27.33308219909668, "global_step": 499601, "epoch": 6019} {"train_loss": -26.903112411499023, "global_step": 499602, "epoch": 6019} {"train_loss": -26.57855796813965, "global_step": 499603, "epoch": 6019} {"train_loss": -27.0357723236084, "global_step": 499604, "epoch": 6019} {"train_loss": -26.907459259033203, "global_step": 499605, "epoch": 6019} {"train_loss": -27.103525161743164, "global_step": 499606, "epoch": 6019} {"train_loss": -27.34576988220215, "global_step": 499607, "epoch": 6019} {"train_loss": -27.088653564453125, "global_step": 499608, "epoch": 6019} {"train_loss": -27.015501022338867, "global_step": 499609, "epoch": 6019} {"train_loss": -27.3837947845459, "global_step": 499610, "epoch": 6019} {"train_loss": -27.225433349609375, "global_step": 499611, "epoch": 6019} {"train_loss": -27.63632583618164, "global_step": 499612, "epoch": 6019} {"train_loss": -27.34384536743164, "global_step": 499613, "epoch": 6019} {"train_loss": -27.345340728759766, "global_step": 499614, "epoch": 6019} {"train_loss": -27.201391220092773, "global_step": 499615, "epoch": 6019} {"train_loss": -27.56977653503418, "global_step": 499616, "epoch": 6019} {"train_loss": -27.264204025268555, "global_step": 499617, "epoch": 6019} {"train_loss": -27.415557861328125, "global_step": 499618, "epoch": 6019} {"train_loss": -27.5463809967041, "global_step": 499619, "epoch": 6019} {"train_loss": -27.279296875, "global_step": 499620, "epoch": 6019} {"train_loss": -27.12479591369629, "global_step": 499621, "epoch": 6019} {"train_loss": -27.270450592041016, "global_step": 499622, "epoch": 6019} {"train_loss": -27.1514949798584, "global_step": 499623, "epoch": 6019} {"train_loss": -27.151174545288086, "global_step": 499624, "epoch": 6019} {"train_loss": -27.587299346923828, "global_step": 499625, "epoch": 6019} {"train_loss": -27.39580726623535, "global_step": 499626, "epoch": 6019} {"train_loss": -27.2988224029541, "global_step": 499627, "epoch": 6019} {"train_loss": -27.389368057250977, "global_step": 499628, "epoch": 6019} {"train_loss": -27.72173500061035, "global_step": 499629, "epoch": 6019} {"train_loss": -27.6361141204834, "global_step": 499630, "epoch": 6019} {"train_loss": -27.37015724182129, "global_step": 499631, "epoch": 6019} {"train_loss": -27.435577392578125, "global_step": 499632, "epoch": 6019} {"train_loss": -27.19482421875, "global_step": 499633, "epoch": 6019} {"train_loss": -27.761621475219727, "global_step": 499634, "epoch": 6019} {"train_loss": -27.251373291015625, "global_step": 499635, "epoch": 6019} {"train_loss": -27.29410171508789, "global_step": 499636, "epoch": 6019} {"train_loss": -27.61362075805664, "global_step": 499637, "epoch": 6019} {"train_loss": -27.277145385742188, "global_step": 499638, "epoch": 6019} {"train_loss": -27.216588973999023, "global_step": 499639, "epoch": 6019} {"train_loss": -27.24369239807129, "global_step": 499640, "epoch": 6019} {"train_loss": -27.6380672454834, "global_step": 499641, "epoch": 6019} {"train_loss": -27.163623809814453, "global_step": 499642, "epoch": 6019} {"train_loss": -27.3338565826416, "global_step": 499643, "epoch": 6019} {"train_loss": -27.18958854675293, "global_step": 499644, "epoch": 6019} {"train_loss": -27.2563533782959, "global_step": 499645, "epoch": 6019} {"train_loss": -27.274255752563477, "global_step": 499646, "epoch": 6019} {"train_loss": -27.22889518737793, "global_step": 499647, "epoch": 6019} {"train_loss": -27.62930679321289, "global_step": 499648, "epoch": 6019} {"train_loss": -27.642337799072266, "global_step": 499649, "epoch": 6019} {"train_loss": -27.19205665588379, "global_step": 499650, "epoch": 6019} {"train_loss": -27.747314453125, "global_step": 499651, "epoch": 6019} {"train_loss": -27.3332462310791, "global_step": 499652, "epoch": 6019} {"train_loss": -27.099807739257812, "global_step": 499653, "epoch": 6019} {"train_loss": -27.4426212310791, "global_step": 499654, "epoch": 6019} {"train_loss": -27.40065574645996, "global_step": 499655, "epoch": 6019} {"train_loss": -27.446889877319336, "global_step": 499656, "epoch": 6019} {"train_loss": -27.54877281188965, "global_step": 499657, "epoch": 6019} {"train_loss": -27.354206085205078, "global_step": 499658, "epoch": 6019} {"train_loss": -27.174807330211962, "global_step": 499659, "epoch": 6019, "val_loss": 6723321.5} {"train_loss": -27.14151954650879, "global_step": 499660, "epoch": 6020} {"train_loss": -27.234594345092773, "global_step": 499661, "epoch": 6020} {"train_loss": -27.243032455444336, "global_step": 499662, "epoch": 6020} {"train_loss": -26.86232566833496, "global_step": 499663, "epoch": 6020} {"train_loss": -27.36371421813965, "global_step": 499664, "epoch": 6020} {"train_loss": -27.186420440673828, "global_step": 499665, "epoch": 6020} {"train_loss": -27.195661544799805, "global_step": 499666, "epoch": 6020} {"train_loss": -27.362049102783203, "global_step": 499667, "epoch": 6020} {"train_loss": -26.9487247467041, "global_step": 499668, "epoch": 6020} {"train_loss": -27.3129825592041, "global_step": 499669, "epoch": 6020} {"train_loss": -27.16016960144043, "global_step": 499670, "epoch": 6020} {"train_loss": -27.196319580078125, "global_step": 499671, "epoch": 6020} {"train_loss": -26.997222900390625, "global_step": 499672, "epoch": 6020} {"train_loss": -27.23606300354004, "global_step": 499673, "epoch": 6020} {"train_loss": -27.160980224609375, "global_step": 499674, "epoch": 6020} {"train_loss": -27.2178897857666, "global_step": 499675, "epoch": 6020} {"train_loss": -27.40574073791504, "global_step": 499676, "epoch": 6020} {"train_loss": -27.061569213867188, "global_step": 499677, "epoch": 6020} {"train_loss": -27.322559356689453, "global_step": 499678, "epoch": 6020} {"train_loss": -27.321704864501953, "global_step": 499679, "epoch": 6020} {"train_loss": -27.029727935791016, "global_step": 499680, "epoch": 6020} {"train_loss": -27.137165069580078, "global_step": 499681, "epoch": 6020} {"train_loss": -27.21341323852539, "global_step": 499682, "epoch": 6020} {"train_loss": -27.18132972717285, "global_step": 499683, "epoch": 6020} {"train_loss": -27.285314559936523, "global_step": 499684, "epoch": 6020} {"train_loss": -27.211217880249023, "global_step": 499685, "epoch": 6020} {"train_loss": -26.96709632873535, "global_step": 499686, "epoch": 6020} {"train_loss": -27.30999755859375, "global_step": 499687, "epoch": 6020} {"train_loss": -27.231515884399414, "global_step": 499688, "epoch": 6020} {"train_loss": -27.048437118530273, "global_step": 499689, "epoch": 6020} {"train_loss": -27.64411735534668, "global_step": 499690, "epoch": 6020} {"train_loss": -26.93726921081543, "global_step": 499691, "epoch": 6020} {"train_loss": -27.172119140625, "global_step": 499692, "epoch": 6020} {"train_loss": -27.500751495361328, "global_step": 499693, "epoch": 6020} {"train_loss": -27.20291519165039, "global_step": 499694, "epoch": 6020} {"train_loss": -27.419519424438477, "global_step": 499695, "epoch": 6020} {"train_loss": -27.53348159790039, "global_step": 499696, "epoch": 6020} {"train_loss": -27.5129337310791, "global_step": 499697, "epoch": 6020} {"train_loss": -27.474628448486328, "global_step": 499698, "epoch": 6020} {"train_loss": -27.400196075439453, "global_step": 499699, "epoch": 6020} {"train_loss": -27.7270565032959, "global_step": 499700, "epoch": 6020} {"train_loss": -27.346057891845703, "global_step": 499701, "epoch": 6020} {"train_loss": -27.6613826751709, "global_step": 499702, "epoch": 6020} {"train_loss": -27.376859664916992, "global_step": 499703, "epoch": 6020} {"train_loss": -27.268537521362305, "global_step": 499704, "epoch": 6020} {"train_loss": -27.375730514526367, "global_step": 499705, "epoch": 6020} {"train_loss": -27.399688720703125, "global_step": 499706, "epoch": 6020} {"train_loss": -27.49187660217285, "global_step": 499707, "epoch": 6020} {"train_loss": -27.270483016967773, "global_step": 499708, "epoch": 6020} {"train_loss": -27.46963882446289, "global_step": 499709, "epoch": 6020} {"train_loss": -27.471776962280273, "global_step": 499710, "epoch": 6020} {"train_loss": -27.64814567565918, "global_step": 499711, "epoch": 6020} {"train_loss": -27.30020523071289, "global_step": 499712, "epoch": 6020} {"train_loss": -27.521686553955078, "global_step": 499713, "epoch": 6020} {"train_loss": -27.48941993713379, "global_step": 499714, "epoch": 6020} {"train_loss": -27.091527938842773, "global_step": 499715, "epoch": 6020} {"train_loss": -27.473657608032227, "global_step": 499716, "epoch": 6020} {"train_loss": -27.3284854888916, "global_step": 499717, "epoch": 6020} {"train_loss": -27.26629638671875, "global_step": 499718, "epoch": 6020} {"train_loss": -27.79395866394043, "global_step": 499719, "epoch": 6020} {"train_loss": -27.07794189453125, "global_step": 499720, "epoch": 6020} {"train_loss": -27.975391387939453, "global_step": 499721, "epoch": 6020} {"train_loss": -27.50050163269043, "global_step": 499722, "epoch": 6020} {"train_loss": -27.217626571655273, "global_step": 499723, "epoch": 6020} {"train_loss": -27.466825485229492, "global_step": 499724, "epoch": 6020} {"train_loss": -27.313201904296875, "global_step": 499725, "epoch": 6020} {"train_loss": -27.746246337890625, "global_step": 499726, "epoch": 6020} {"train_loss": -27.465652465820312, "global_step": 499727, "epoch": 6020} {"train_loss": -27.5596923828125, "global_step": 499728, "epoch": 6020} {"train_loss": -27.64764976501465, "global_step": 499729, "epoch": 6020} {"train_loss": -27.447040557861328, "global_step": 499730, "epoch": 6020} {"train_loss": -27.59952163696289, "global_step": 499731, "epoch": 6020} {"train_loss": -27.225255966186523, "global_step": 499732, "epoch": 6020} {"train_loss": -27.88826560974121, "global_step": 499733, "epoch": 6020} {"train_loss": -26.91926383972168, "global_step": 499734, "epoch": 6020} {"train_loss": -27.468542098999023, "global_step": 499735, "epoch": 6020} {"train_loss": -27.175128936767578, "global_step": 499736, "epoch": 6020} {"train_loss": -27.596891403198242, "global_step": 499737, "epoch": 6020} {"train_loss": -27.679838180541992, "global_step": 499738, "epoch": 6020} {"train_loss": -27.588180541992188, "global_step": 499739, "epoch": 6020} {"train_loss": -27.42487144470215, "global_step": 499740, "epoch": 6020} {"train_loss": -27.17628288269043, "global_step": 499741, "epoch": 6020} {"train_loss": -27.34467400700213, "global_step": 499742, "epoch": 6020, "val_loss": 6758219.5} {"train_loss": -26.79889488220215, "global_step": 499743, "epoch": 6021} {"train_loss": -26.47345542907715, "global_step": 499744, "epoch": 6021} {"train_loss": -26.7652530670166, "global_step": 499745, "epoch": 6021} {"train_loss": -26.643056869506836, "global_step": 499746, "epoch": 6021} {"train_loss": -26.4965877532959, "global_step": 499747, "epoch": 6021} {"train_loss": -26.369855880737305, "global_step": 499748, "epoch": 6021} {"train_loss": -26.722808837890625, "global_step": 499749, "epoch": 6021} {"train_loss": -26.9183349609375, "global_step": 499750, "epoch": 6021} {"train_loss": -27.342426300048828, "global_step": 499751, "epoch": 6021} {"train_loss": -27.409198760986328, "global_step": 499752, "epoch": 6021} {"train_loss": -26.6464786529541, "global_step": 499753, "epoch": 6021} {"train_loss": -27.119226455688477, "global_step": 499754, "epoch": 6021} {"train_loss": -27.12164306640625, "global_step": 499755, "epoch": 6021} {"train_loss": -27.068334579467773, "global_step": 499756, "epoch": 6021} {"train_loss": -27.147855758666992, "global_step": 499757, "epoch": 6021} {"train_loss": -27.218536376953125, "global_step": 499758, "epoch": 6021} {"train_loss": -27.539813995361328, "global_step": 499759, "epoch": 6021} {"train_loss": -27.730213165283203, "global_step": 499760, "epoch": 6021} {"train_loss": -27.2633056640625, "global_step": 499761, "epoch": 6021} {"train_loss": -27.152069091796875, "global_step": 499762, "epoch": 6021} {"train_loss": -27.397876739501953, "global_step": 499763, "epoch": 6021} {"train_loss": -27.1469783782959, "global_step": 499764, "epoch": 6021} {"train_loss": -27.339111328125, "global_step": 499765, "epoch": 6021} {"train_loss": -27.27532958984375, "global_step": 499766, "epoch": 6021} {"train_loss": -27.51641845703125, "global_step": 499767, "epoch": 6021} {"train_loss": -26.874250411987305, "global_step": 499768, "epoch": 6021} {"train_loss": -27.365711212158203, "global_step": 499769, "epoch": 6021} {"train_loss": -27.52780532836914, "global_step": 499770, "epoch": 6021} {"train_loss": -27.23286247253418, "global_step": 499771, "epoch": 6021} {"train_loss": -27.452863693237305, "global_step": 499772, "epoch": 6021} {"train_loss": -27.59381103515625, "global_step": 499773, "epoch": 6021} {"train_loss": -27.524906158447266, "global_step": 499774, "epoch": 6021} {"train_loss": -27.277881622314453, "global_step": 499775, "epoch": 6021} {"train_loss": -27.56927490234375, "global_step": 499776, "epoch": 6021} {"train_loss": -27.3720703125, "global_step": 499777, "epoch": 6021} {"train_loss": -27.628097534179688, "global_step": 499778, "epoch": 6021} {"train_loss": -27.490976333618164, "global_step": 499779, "epoch": 6021} {"train_loss": -27.56328773498535, "global_step": 499780, "epoch": 6021} {"train_loss": -27.3170223236084, "global_step": 499781, "epoch": 6021} {"train_loss": -27.550180435180664, "global_step": 499782, "epoch": 6021} {"train_loss": -27.509140014648438, "global_step": 499783, "epoch": 6021} {"train_loss": -26.79949951171875, "global_step": 499784, "epoch": 6021} {"train_loss": -27.399734497070312, "global_step": 499785, "epoch": 6021} {"train_loss": -27.155628204345703, "global_step": 499786, "epoch": 6021} {"train_loss": -27.607572555541992, "global_step": 499787, "epoch": 6021} {"train_loss": -27.476871490478516, "global_step": 499788, "epoch": 6021} {"train_loss": -27.638891220092773, "global_step": 499789, "epoch": 6021} {"train_loss": -27.660465240478516, "global_step": 499790, "epoch": 6021} {"train_loss": -27.3429012298584, "global_step": 499791, "epoch": 6021} {"train_loss": -27.348087310791016, "global_step": 499792, "epoch": 6021} {"train_loss": -27.943038940429688, "global_step": 499793, "epoch": 6021} {"train_loss": -27.37298583984375, "global_step": 499794, "epoch": 6021} {"train_loss": -27.465686798095703, "global_step": 499795, "epoch": 6021} {"train_loss": -27.462060928344727, "global_step": 499796, "epoch": 6021} {"train_loss": -27.35470962524414, "global_step": 499797, "epoch": 6021} {"train_loss": -27.446674346923828, "global_step": 499798, "epoch": 6021} {"train_loss": -27.880416870117188, "global_step": 499799, "epoch": 6021} {"train_loss": -27.627477645874023, "global_step": 499800, "epoch": 6021} {"train_loss": -27.418760299682617, "global_step": 499801, "epoch": 6021} {"train_loss": -27.768543243408203, "global_step": 499802, "epoch": 6021} {"train_loss": -27.32722282409668, "global_step": 499803, "epoch": 6021} {"train_loss": -27.633453369140625, "global_step": 499804, "epoch": 6021} {"train_loss": -27.511194229125977, "global_step": 499805, "epoch": 6021} {"train_loss": -27.502410888671875, "global_step": 499806, "epoch": 6021} {"train_loss": -27.48672866821289, "global_step": 499807, "epoch": 6021} {"train_loss": -27.472509384155273, "global_step": 499808, "epoch": 6021} {"train_loss": -27.49641227722168, "global_step": 499809, "epoch": 6021} {"train_loss": -27.686023712158203, "global_step": 499810, "epoch": 6021} {"train_loss": -27.43149757385254, "global_step": 499811, "epoch": 6021} {"train_loss": -27.539661407470703, "global_step": 499812, "epoch": 6021} {"train_loss": -27.658918380737305, "global_step": 499813, "epoch": 6021} {"train_loss": -27.877294540405273, "global_step": 499814, "epoch": 6021} {"train_loss": -27.6990909576416, "global_step": 499815, "epoch": 6021} {"train_loss": -27.111608505249023, "global_step": 499816, "epoch": 6021} {"train_loss": -27.14100456237793, "global_step": 499817, "epoch": 6021} {"train_loss": -27.333328247070312, "global_step": 499818, "epoch": 6021} {"train_loss": -27.439794540405273, "global_step": 499819, "epoch": 6021} {"train_loss": -27.790185928344727, "global_step": 499820, "epoch": 6021} {"train_loss": -27.50425148010254, "global_step": 499821, "epoch": 6021} {"train_loss": -27.443572998046875, "global_step": 499822, "epoch": 6021} {"train_loss": -27.143033981323242, "global_step": 499823, "epoch": 6021} {"train_loss": -27.516874313354492, "global_step": 499824, "epoch": 6021} {"train_loss": -27.34956307009042, "global_step": 499825, "epoch": 6021, "val_loss": 6643666.0} {"train_loss": -27.104694366455078, "global_step": 499826, "epoch": 6022} {"train_loss": -26.806013107299805, "global_step": 499827, "epoch": 6022} {"train_loss": -26.685388565063477, "global_step": 499828, "epoch": 6022} {"train_loss": -27.132307052612305, "global_step": 499829, "epoch": 6022} {"train_loss": -26.76263999938965, "global_step": 499830, "epoch": 6022} {"train_loss": -27.069711685180664, "global_step": 499831, "epoch": 6022} {"train_loss": -27.14749526977539, "global_step": 499832, "epoch": 6022} {"train_loss": -26.68194580078125, "global_step": 499833, "epoch": 6022} {"train_loss": -27.102100372314453, "global_step": 499834, "epoch": 6022} {"train_loss": -27.228803634643555, "global_step": 499835, "epoch": 6022} {"train_loss": -27.39271354675293, "global_step": 499836, "epoch": 6022} {"train_loss": -27.006479263305664, "global_step": 499837, "epoch": 6022} {"train_loss": -27.37050437927246, "global_step": 499838, "epoch": 6022} {"train_loss": -27.410974502563477, "global_step": 499839, "epoch": 6022} {"train_loss": -27.188451766967773, "global_step": 499840, "epoch": 6022} {"train_loss": -27.157697677612305, "global_step": 499841, "epoch": 6022} {"train_loss": -27.4357852935791, "global_step": 499842, "epoch": 6022} {"train_loss": -27.003454208374023, "global_step": 499843, "epoch": 6022} {"train_loss": -27.4061336517334, "global_step": 499844, "epoch": 6022} {"train_loss": -27.03590202331543, "global_step": 499845, "epoch": 6022} {"train_loss": -27.340469360351562, "global_step": 499846, "epoch": 6022} {"train_loss": -27.138660430908203, "global_step": 499847, "epoch": 6022} {"train_loss": -27.50246238708496, "global_step": 499848, "epoch": 6022} {"train_loss": -27.182947158813477, "global_step": 499849, "epoch": 6022} {"train_loss": -27.486387252807617, "global_step": 499850, "epoch": 6022} {"train_loss": -27.412994384765625, "global_step": 499851, "epoch": 6022} {"train_loss": -27.49830436706543, "global_step": 499852, "epoch": 6022} {"train_loss": -27.207855224609375, "global_step": 499853, "epoch": 6022} {"train_loss": -27.220264434814453, "global_step": 499854, "epoch": 6022} {"train_loss": -27.51319694519043, "global_step": 499855, "epoch": 6022} {"train_loss": -27.560760498046875, "global_step": 499856, "epoch": 6022} {"train_loss": -27.5664005279541, "global_step": 499857, "epoch": 6022} {"train_loss": -27.464216232299805, "global_step": 499858, "epoch": 6022} {"train_loss": -27.383087158203125, "global_step": 499859, "epoch": 6022} {"train_loss": -27.4527530670166, "global_step": 499860, "epoch": 6022} {"train_loss": -27.175825119018555, "global_step": 499861, "epoch": 6022} {"train_loss": -27.12262535095215, "global_step": 499862, "epoch": 6022} {"train_loss": -26.463346481323242, "global_step": 499863, "epoch": 6022} {"train_loss": -26.6658878326416, "global_step": 499864, "epoch": 6022} {"train_loss": -26.725204467773438, "global_step": 499865, "epoch": 6022} {"train_loss": -27.652761459350586, "global_step": 499866, "epoch": 6022} {"train_loss": -27.173126220703125, "global_step": 499867, "epoch": 6022} {"train_loss": -26.718542098999023, "global_step": 499868, "epoch": 6022} {"train_loss": -27.234643936157227, "global_step": 499869, "epoch": 6022} {"train_loss": -26.865976333618164, "global_step": 499870, "epoch": 6022} {"train_loss": -27.270130157470703, "global_step": 499871, "epoch": 6022} {"train_loss": -27.554975509643555, "global_step": 499872, "epoch": 6022} {"train_loss": -27.3582706451416, "global_step": 499873, "epoch": 6022} {"train_loss": -27.09004020690918, "global_step": 499874, "epoch": 6022} {"train_loss": -27.943750381469727, "global_step": 499875, "epoch": 6022} {"train_loss": -27.128332138061523, "global_step": 499876, "epoch": 6022} {"train_loss": -27.653186798095703, "global_step": 499877, "epoch": 6022} {"train_loss": -27.11871910095215, "global_step": 499878, "epoch": 6022} {"train_loss": -27.432470321655273, "global_step": 499879, "epoch": 6022} {"train_loss": -27.28851890563965, "global_step": 499880, "epoch": 6022} {"train_loss": -27.2379207611084, "global_step": 499881, "epoch": 6022} {"train_loss": -27.527713775634766, "global_step": 499882, "epoch": 6022} {"train_loss": -27.052764892578125, "global_step": 499883, "epoch": 6022} {"train_loss": -27.252248764038086, "global_step": 499884, "epoch": 6022} {"train_loss": -27.325225830078125, "global_step": 499885, "epoch": 6022} {"train_loss": -26.973615646362305, "global_step": 499886, "epoch": 6022} {"train_loss": -27.08414649963379, "global_step": 499887, "epoch": 6022} {"train_loss": -27.4664306640625, "global_step": 499888, "epoch": 6022} {"train_loss": -27.49420738220215, "global_step": 499889, "epoch": 6022} {"train_loss": -27.260894775390625, "global_step": 499890, "epoch": 6022} {"train_loss": -27.318220138549805, "global_step": 499891, "epoch": 6022} {"train_loss": -27.479650497436523, "global_step": 499892, "epoch": 6022} {"train_loss": -27.45509147644043, "global_step": 499893, "epoch": 6022} {"train_loss": -27.772565841674805, "global_step": 499894, "epoch": 6022} {"train_loss": -27.25653648376465, "global_step": 499895, "epoch": 6022} {"train_loss": -27.022878646850586, "global_step": 499896, "epoch": 6022} {"train_loss": -27.35127067565918, "global_step": 499897, "epoch": 6022} {"train_loss": -26.986892700195312, "global_step": 499898, "epoch": 6022} {"train_loss": -27.26432228088379, "global_step": 499899, "epoch": 6022} {"train_loss": -26.925504684448242, "global_step": 499900, "epoch": 6022} {"train_loss": -27.014036178588867, "global_step": 499901, "epoch": 6022} {"train_loss": -27.285688400268555, "global_step": 499902, "epoch": 6022} {"train_loss": -27.832366943359375, "global_step": 499903, "epoch": 6022} {"train_loss": -26.665546417236328, "global_step": 499904, "epoch": 6022} {"train_loss": -26.284719467163086, "global_step": 499905, "epoch": 6022} {"train_loss": -26.10699462890625, "global_step": 499906, "epoch": 6022} {"train_loss": -26.899444580078125, "global_step": 499907, "epoch": 6022} {"train_loss": -27.199904660144483, "global_step": 499908, "epoch": 6022, "val_loss": 6688146.5} {"train_loss": -25.06011390686035, "global_step": 499909, "epoch": 6023} {"train_loss": -25.903034210205078, "global_step": 499910, "epoch": 6023} {"train_loss": -26.51543617248535, "global_step": 499911, "epoch": 6023} {"train_loss": -26.0113525390625, "global_step": 499912, "epoch": 6023} {"train_loss": -26.056842803955078, "global_step": 499913, "epoch": 6023} {"train_loss": -26.241907119750977, "global_step": 499914, "epoch": 6023} {"train_loss": -25.986997604370117, "global_step": 499915, "epoch": 6023} {"train_loss": -26.068166732788086, "global_step": 499916, "epoch": 6023} {"train_loss": -26.35536003112793, "global_step": 499917, "epoch": 6023} {"train_loss": -26.073734283447266, "global_step": 499918, "epoch": 6023} {"train_loss": -26.337066650390625, "global_step": 499919, "epoch": 6023} {"train_loss": -26.58821678161621, "global_step": 499920, "epoch": 6023} {"train_loss": -26.42901611328125, "global_step": 499921, "epoch": 6023} {"train_loss": -26.784040451049805, "global_step": 499922, "epoch": 6023} {"train_loss": -26.63593864440918, "global_step": 499923, "epoch": 6023} {"train_loss": -26.693603515625, "global_step": 499924, "epoch": 6023} {"train_loss": -26.631061553955078, "global_step": 499925, "epoch": 6023} {"train_loss": -26.865503311157227, "global_step": 499926, "epoch": 6023} {"train_loss": -26.757415771484375, "global_step": 499927, "epoch": 6023} {"train_loss": -26.732498168945312, "global_step": 499928, "epoch": 6023} {"train_loss": -27.21698570251465, "global_step": 499929, "epoch": 6023} {"train_loss": -26.83516502380371, "global_step": 499930, "epoch": 6023} {"train_loss": -27.019865036010742, "global_step": 499931, "epoch": 6023} {"train_loss": -27.028762817382812, "global_step": 499932, "epoch": 6023} {"train_loss": -26.94658851623535, "global_step": 499933, "epoch": 6023} {"train_loss": -26.853376388549805, "global_step": 499934, "epoch": 6023} {"train_loss": -26.827899932861328, "global_step": 499935, "epoch": 6023} {"train_loss": -27.418689727783203, "global_step": 499936, "epoch": 6023} {"train_loss": -27.029972076416016, "global_step": 499937, "epoch": 6023} {"train_loss": -26.83478355407715, "global_step": 499938, "epoch": 6023} {"train_loss": -27.298307418823242, "global_step": 499939, "epoch": 6023} {"train_loss": -26.880529403686523, "global_step": 499940, "epoch": 6023} {"train_loss": -27.445093154907227, "global_step": 499941, "epoch": 6023} {"train_loss": -27.497024536132812, "global_step": 499942, "epoch": 6023} {"train_loss": -27.057861328125, "global_step": 499943, "epoch": 6023} {"train_loss": -27.460485458374023, "global_step": 499944, "epoch": 6023} {"train_loss": -27.421289443969727, "global_step": 499945, "epoch": 6023} {"train_loss": -27.493207931518555, "global_step": 499946, "epoch": 6023} {"train_loss": -27.14861488342285, "global_step": 499947, "epoch": 6023} {"train_loss": -27.095678329467773, "global_step": 499948, "epoch": 6023} {"train_loss": -27.2169189453125, "global_step": 499949, "epoch": 6023} {"train_loss": -27.23641014099121, "global_step": 499950, "epoch": 6023} {"train_loss": -27.21736717224121, "global_step": 499951, "epoch": 6023} {"train_loss": -27.378110885620117, "global_step": 499952, "epoch": 6023} {"train_loss": -27.207273483276367, "global_step": 499953, "epoch": 6023} {"train_loss": -27.83966064453125, "global_step": 499954, "epoch": 6023} {"train_loss": -27.290998458862305, "global_step": 499955, "epoch": 6023} {"train_loss": -27.63410758972168, "global_step": 499956, "epoch": 6023} {"train_loss": -27.707914352416992, "global_step": 499957, "epoch": 6023} {"train_loss": -27.04884147644043, "global_step": 499958, "epoch": 6023} {"train_loss": -27.80567741394043, "global_step": 499959, "epoch": 6023} {"train_loss": -27.290220260620117, "global_step": 499960, "epoch": 6023} {"train_loss": -27.66511344909668, "global_step": 499961, "epoch": 6023} {"train_loss": -27.363513946533203, "global_step": 499962, "epoch": 6023} {"train_loss": -27.564300537109375, "global_step": 499963, "epoch": 6023} {"train_loss": -27.570154190063477, "global_step": 499964, "epoch": 6023} {"train_loss": -27.518707275390625, "global_step": 499965, "epoch": 6023} {"train_loss": -27.49041175842285, "global_step": 499966, "epoch": 6023} {"train_loss": -27.53653907775879, "global_step": 499967, "epoch": 6023} {"train_loss": -27.322187423706055, "global_step": 499968, "epoch": 6023} {"train_loss": -26.794281005859375, "global_step": 499969, "epoch": 6023} {"train_loss": -25.911544799804688, "global_step": 499970, "epoch": 6023} {"train_loss": -24.491479873657227, "global_step": 499971, "epoch": 6023} {"train_loss": -25.79937744140625, "global_step": 499972, "epoch": 6023} {"train_loss": -27.3155574798584, "global_step": 499973, "epoch": 6023} {"train_loss": -26.705331802368164, "global_step": 499974, "epoch": 6023} {"train_loss": -27.562530517578125, "global_step": 499975, "epoch": 6023} {"train_loss": -26.687170028686523, "global_step": 499976, "epoch": 6023} {"train_loss": -27.272497177124023, "global_step": 499977, "epoch": 6023} {"train_loss": -26.841537475585938, "global_step": 499978, "epoch": 6023} {"train_loss": -27.0117130279541, "global_step": 499979, "epoch": 6023} {"train_loss": -26.983917236328125, "global_step": 499980, "epoch": 6023} {"train_loss": -26.92035484313965, "global_step": 499981, "epoch": 6023} {"train_loss": -27.262741088867188, "global_step": 499982, "epoch": 6023} {"train_loss": -27.037153244018555, "global_step": 499983, "epoch": 6023} {"train_loss": -27.603168487548828, "global_step": 499984, "epoch": 6023} {"train_loss": -27.320302963256836, "global_step": 499985, "epoch": 6023} {"train_loss": -27.684228897094727, "global_step": 499986, "epoch": 6023} {"train_loss": -26.7596492767334, "global_step": 499987, "epoch": 6023} {"train_loss": -27.17984390258789, "global_step": 499988, "epoch": 6023} {"train_loss": -27.278589248657227, "global_step": 499989, "epoch": 6023} {"train_loss": -27.473342895507812, "global_step": 499990, "epoch": 6023} {"train_loss": -26.9405024654894, "global_step": 499991, "epoch": 6023, "val_loss": 6767414.0} {"train_loss": -26.445974349975586, "global_step": 499992, "epoch": 6024} {"train_loss": -25.750402450561523, "global_step": 499993, "epoch": 6024} {"train_loss": -26.704389572143555, "global_step": 499994, "epoch": 6024} {"train_loss": -27.277433395385742, "global_step": 499995, "epoch": 6024} {"train_loss": -26.539936065673828, "global_step": 499996, "epoch": 6024} {"train_loss": -26.955738067626953, "global_step": 499997, "epoch": 6024} {"train_loss": -26.888593673706055, "global_step": 499998, "epoch": 6024} {"train_loss": -26.991214752197266, "global_step": 499999, "epoch": 6024} {"train_loss": -26.887060165405273, "global_step": 500000, "epoch": 6024} {"train_loss": -26.758453369140625, "global_step": 500001, "epoch": 6024} {"train_loss": -26.694381713867188, "global_step": 500002, "epoch": 6024} {"train_loss": -26.743330001831055, "global_step": 500003, "epoch": 6024} {"train_loss": -26.864994049072266, "global_step": 500004, "epoch": 6024} {"train_loss": -27.10076904296875, "global_step": 500005, "epoch": 6024} {"train_loss": -27.26690101623535, "global_step": 500006, "epoch": 6024} {"train_loss": -26.971521377563477, "global_step": 500007, "epoch": 6024} {"train_loss": -26.9698543548584, "global_step": 500008, "epoch": 6024} {"train_loss": -27.453723907470703, "global_step": 500009, "epoch": 6024} {"train_loss": -27.02693748474121, "global_step": 500010, "epoch": 6024} {"train_loss": -26.911712646484375, "global_step": 500011, "epoch": 6024} {"train_loss": -27.63154411315918, "global_step": 500012, "epoch": 6024} {"train_loss": -27.389266967773438, "global_step": 500013, "epoch": 6024} {"train_loss": -27.39583396911621, "global_step": 500014, "epoch": 6024} {"train_loss": -27.55881690979004, "global_step": 500015, "epoch": 6024} {"train_loss": -27.53485679626465, "global_step": 500016, "epoch": 6024} {"train_loss": -27.163007736206055, "global_step": 500017, "epoch": 6024} {"train_loss": -27.326587677001953, "global_step": 500018, "epoch": 6024} {"train_loss": -27.682144165039062, "global_step": 500019, "epoch": 6024} {"train_loss": -27.399328231811523, "global_step": 500020, "epoch": 6024} {"train_loss": -27.778371810913086, "global_step": 500021, "epoch": 6024} {"train_loss": -27.342926025390625, "global_step": 500022, "epoch": 6024} {"train_loss": -27.470117568969727, "global_step": 500023, "epoch": 6024} {"train_loss": -27.541967391967773, "global_step": 500024, "epoch": 6024} {"train_loss": -27.838464736938477, "global_step": 500025, "epoch": 6024} {"train_loss": -27.28458023071289, "global_step": 500026, "epoch": 6024} {"train_loss": -27.60389518737793, "global_step": 500027, "epoch": 6024} {"train_loss": -27.27943229675293, "global_step": 500028, "epoch": 6024} {"train_loss": -27.32337760925293, "global_step": 500029, "epoch": 6024} {"train_loss": -27.66985511779785, "global_step": 500030, "epoch": 6024} {"train_loss": -27.32278823852539, "global_step": 500031, "epoch": 6024} {"train_loss": -27.119094848632812, "global_step": 500032, "epoch": 6024} {"train_loss": -27.309438705444336, "global_step": 500033, "epoch": 6024} {"train_loss": -27.51482582092285, "global_step": 500034, "epoch": 6024} {"train_loss": -27.662424087524414, "global_step": 500035, "epoch": 6024} {"train_loss": -27.443506240844727, "global_step": 500036, "epoch": 6024} {"train_loss": -27.583911895751953, "global_step": 500037, "epoch": 6024} {"train_loss": -27.632617950439453, "global_step": 500038, "epoch": 6024} {"train_loss": -27.440397262573242, "global_step": 500039, "epoch": 6024} {"train_loss": -27.53902244567871, "global_step": 500040, "epoch": 6024} {"train_loss": -27.384199142456055, "global_step": 500041, "epoch": 6024} {"train_loss": -27.678619384765625, "global_step": 500042, "epoch": 6024} {"train_loss": -27.477161407470703, "global_step": 500043, "epoch": 6024} {"train_loss": -27.777761459350586, "global_step": 500044, "epoch": 6024} {"train_loss": -27.3787899017334, "global_step": 500045, "epoch": 6024} {"train_loss": -27.512287139892578, "global_step": 500046, "epoch": 6024} {"train_loss": -27.69159507751465, "global_step": 500047, "epoch": 6024} {"train_loss": -27.7048282623291, "global_step": 500048, "epoch": 6024} {"train_loss": -27.56207275390625, "global_step": 500049, "epoch": 6024} {"train_loss": -27.089399337768555, "global_step": 500050, "epoch": 6024} {"train_loss": -27.409616470336914, "global_step": 500051, "epoch": 6024} {"train_loss": -27.08049964904785, "global_step": 500052, "epoch": 6024} {"train_loss": -27.47806167602539, "global_step": 500053, "epoch": 6024} {"train_loss": -27.208972930908203, "global_step": 500054, "epoch": 6024} {"train_loss": -27.286346435546875, "global_step": 500055, "epoch": 6024} {"train_loss": -27.76374626159668, "global_step": 500056, "epoch": 6024} {"train_loss": -27.409658432006836, "global_step": 500057, "epoch": 6024} {"train_loss": -26.97489356994629, "global_step": 500058, "epoch": 6024} {"train_loss": -27.021411895751953, "global_step": 500059, "epoch": 6024} {"train_loss": -27.264310836791992, "global_step": 500060, "epoch": 6024} {"train_loss": -27.138904571533203, "global_step": 500061, "epoch": 6024} {"train_loss": -27.263914108276367, "global_step": 500062, "epoch": 6024} {"train_loss": -27.438718795776367, "global_step": 500063, "epoch": 6024} {"train_loss": -26.724716186523438, "global_step": 500064, "epoch": 6024} {"train_loss": -27.232336044311523, "global_step": 500065, "epoch": 6024} {"train_loss": -27.331464767456055, "global_step": 500066, "epoch": 6024} {"train_loss": -27.322650909423828, "global_step": 500067, "epoch": 6024} {"train_loss": -27.0351619720459, "global_step": 500068, "epoch": 6024} {"train_loss": -27.222700119018555, "global_step": 500069, "epoch": 6024} {"train_loss": -27.242218017578125, "global_step": 500070, "epoch": 6024} {"train_loss": -27.396514892578125, "global_step": 500071, "epoch": 6024} {"train_loss": -27.419681549072266, "global_step": 500072, "epoch": 6024} {"train_loss": -27.169708251953125, "global_step": 500073, "epoch": 6024} {"train_loss": -27.269859199064324, "global_step": 500074, "epoch": 6024, "val_loss": 6666233.0} {"train_loss": -26.564716339111328, "global_step": 500075, "epoch": 6025} {"train_loss": -27.00738525390625, "global_step": 500076, "epoch": 6025} {"train_loss": -26.87183952331543, "global_step": 500077, "epoch": 6025} {"train_loss": -26.52070426940918, "global_step": 500078, "epoch": 6025} {"train_loss": -27.09541130065918, "global_step": 500079, "epoch": 6025} {"train_loss": -26.568805694580078, "global_step": 500080, "epoch": 6025} {"train_loss": -26.84022331237793, "global_step": 500081, "epoch": 6025} {"train_loss": -26.574018478393555, "global_step": 500082, "epoch": 6025} {"train_loss": -26.73103141784668, "global_step": 500083, "epoch": 6025} {"train_loss": -27.02618408203125, "global_step": 500084, "epoch": 6025} {"train_loss": -27.033445358276367, "global_step": 500085, "epoch": 6025} {"train_loss": -27.052799224853516, "global_step": 500086, "epoch": 6025} {"train_loss": -26.9166316986084, "global_step": 500087, "epoch": 6025} {"train_loss": -27.389175415039062, "global_step": 500088, "epoch": 6025} {"train_loss": -27.616193771362305, "global_step": 500089, "epoch": 6025} {"train_loss": -27.028228759765625, "global_step": 500090, "epoch": 6025} {"train_loss": -26.99848747253418, "global_step": 500091, "epoch": 6025} {"train_loss": -27.240478515625, "global_step": 500092, "epoch": 6025} {"train_loss": -27.245746612548828, "global_step": 500093, "epoch": 6025} {"train_loss": -27.243627548217773, "global_step": 500094, "epoch": 6025} {"train_loss": -27.419677734375, "global_step": 500095, "epoch": 6025} {"train_loss": -27.6385498046875, "global_step": 500096, "epoch": 6025} {"train_loss": -27.573705673217773, "global_step": 500097, "epoch": 6025} {"train_loss": -27.32191276550293, "global_step": 500098, "epoch": 6025} {"train_loss": -27.675458908081055, "global_step": 500099, "epoch": 6025} {"train_loss": -27.394018173217773, "global_step": 500100, "epoch": 6025} {"train_loss": -27.39117431640625, "global_step": 500101, "epoch": 6025} {"train_loss": -27.493865966796875, "global_step": 500102, "epoch": 6025} {"train_loss": -27.447675704956055, "global_step": 500103, "epoch": 6025} {"train_loss": -27.535425186157227, "global_step": 500104, "epoch": 6025} {"train_loss": -27.789764404296875, "global_step": 500105, "epoch": 6025} {"train_loss": -27.28383445739746, "global_step": 500106, "epoch": 6025} {"train_loss": -27.825834274291992, "global_step": 500107, "epoch": 6025} {"train_loss": -27.230756759643555, "global_step": 500108, "epoch": 6025} {"train_loss": -27.883438110351562, "global_step": 500109, "epoch": 6025} {"train_loss": -27.69845962524414, "global_step": 500110, "epoch": 6025} {"train_loss": -27.460712432861328, "global_step": 500111, "epoch": 6025} {"train_loss": -27.454782485961914, "global_step": 500112, "epoch": 6025} {"train_loss": -27.499792098999023, "global_step": 500113, "epoch": 6025} {"train_loss": -27.516056060791016, "global_step": 500114, "epoch": 6025} {"train_loss": -27.672454833984375, "global_step": 500115, "epoch": 6025} {"train_loss": -27.781946182250977, "global_step": 500116, "epoch": 6025} {"train_loss": -27.831762313842773, "global_step": 500117, "epoch": 6025} {"train_loss": -27.7562198638916, "global_step": 500118, "epoch": 6025} {"train_loss": -27.626876831054688, "global_step": 500119, "epoch": 6025} {"train_loss": -27.336151123046875, "global_step": 500120, "epoch": 6025} {"train_loss": -27.67508316040039, "global_step": 500121, "epoch": 6025} {"train_loss": -27.651641845703125, "global_step": 500122, "epoch": 6025} {"train_loss": -27.8702335357666, "global_step": 500123, "epoch": 6025} {"train_loss": -27.69032096862793, "global_step": 500124, "epoch": 6025} {"train_loss": -27.8500919342041, "global_step": 500125, "epoch": 6025} {"train_loss": -27.492895126342773, "global_step": 500126, "epoch": 6025} {"train_loss": -26.967838287353516, "global_step": 500127, "epoch": 6025} {"train_loss": -26.93112564086914, "global_step": 500128, "epoch": 6025} {"train_loss": -26.613143920898438, "global_step": 500129, "epoch": 6025} {"train_loss": -27.31634521484375, "global_step": 500130, "epoch": 6025} {"train_loss": -27.482929229736328, "global_step": 500131, "epoch": 6025} {"train_loss": -27.635162353515625, "global_step": 500132, "epoch": 6025} {"train_loss": -27.650724411010742, "global_step": 500133, "epoch": 6025} {"train_loss": -27.784259796142578, "global_step": 500134, "epoch": 6025} {"train_loss": -27.47296142578125, "global_step": 500135, "epoch": 6025} {"train_loss": -27.022296905517578, "global_step": 500136, "epoch": 6025} {"train_loss": -27.2187557220459, "global_step": 500137, "epoch": 6025} {"train_loss": -27.082813262939453, "global_step": 500138, "epoch": 6025} {"train_loss": -27.361312866210938, "global_step": 500139, "epoch": 6025} {"train_loss": -27.51026725769043, "global_step": 500140, "epoch": 6025} {"train_loss": -27.43477439880371, "global_step": 500141, "epoch": 6025} {"train_loss": -27.3599796295166, "global_step": 500142, "epoch": 6025} {"train_loss": -27.53725242614746, "global_step": 500143, "epoch": 6025} {"train_loss": -27.487287521362305, "global_step": 500144, "epoch": 6025} {"train_loss": -27.48664665222168, "global_step": 500145, "epoch": 6025} {"train_loss": -27.455472946166992, "global_step": 500146, "epoch": 6025} {"train_loss": -27.200525283813477, "global_step": 500147, "epoch": 6025} {"train_loss": -27.215789794921875, "global_step": 500148, "epoch": 6025} {"train_loss": -27.115131378173828, "global_step": 500149, "epoch": 6025} {"train_loss": -27.6385440826416, "global_step": 500150, "epoch": 6025} {"train_loss": -27.249174118041992, "global_step": 500151, "epoch": 6025} {"train_loss": -27.102039337158203, "global_step": 500152, "epoch": 6025} {"train_loss": -27.46648597717285, "global_step": 500153, "epoch": 6025} {"train_loss": -27.3597354888916, "global_step": 500154, "epoch": 6025} {"train_loss": -27.369733810424805, "global_step": 500155, "epoch": 6025} {"train_loss": -27.559656143188477, "global_step": 500156, "epoch": 6025} {"train_loss": -27.354651600481517, "global_step": 500157, "epoch": 6025, "val_loss": 6690316.0} {"train_loss": -26.720142364501953, "global_step": 500158, "epoch": 6026} {"train_loss": -26.946287155151367, "global_step": 500159, "epoch": 6026} {"train_loss": -27.051862716674805, "global_step": 500160, "epoch": 6026} {"train_loss": -26.665618896484375, "global_step": 500161, "epoch": 6026} {"train_loss": -26.749114990234375, "global_step": 500162, "epoch": 6026} {"train_loss": -27.062549591064453, "global_step": 500163, "epoch": 6026} {"train_loss": -27.29250144958496, "global_step": 500164, "epoch": 6026} {"train_loss": -26.83304214477539, "global_step": 500165, "epoch": 6026} {"train_loss": -26.843610763549805, "global_step": 500166, "epoch": 6026} {"train_loss": -27.040319442749023, "global_step": 500167, "epoch": 6026} {"train_loss": -27.301589965820312, "global_step": 500168, "epoch": 6026} {"train_loss": -27.354232788085938, "global_step": 500169, "epoch": 6026} {"train_loss": -26.960859298706055, "global_step": 500170, "epoch": 6026} {"train_loss": -27.10133171081543, "global_step": 500171, "epoch": 6026} {"train_loss": -27.450408935546875, "global_step": 500172, "epoch": 6026} {"train_loss": -27.565357208251953, "global_step": 500173, "epoch": 6026} {"train_loss": -27.170591354370117, "global_step": 500174, "epoch": 6026} {"train_loss": -27.648120880126953, "global_step": 500175, "epoch": 6026} {"train_loss": -27.238544464111328, "global_step": 500176, "epoch": 6026} {"train_loss": -27.222431182861328, "global_step": 500177, "epoch": 6026} {"train_loss": -27.490774154663086, "global_step": 500178, "epoch": 6026} {"train_loss": -27.51215934753418, "global_step": 500179, "epoch": 6026} {"train_loss": -27.456409454345703, "global_step": 500180, "epoch": 6026} {"train_loss": -27.0533447265625, "global_step": 500181, "epoch": 6026} {"train_loss": -27.18733787536621, "global_step": 500182, "epoch": 6026} {"train_loss": -27.505990982055664, "global_step": 500183, "epoch": 6026} {"train_loss": -27.276229858398438, "global_step": 500184, "epoch": 6026} {"train_loss": -27.481977462768555, "global_step": 500185, "epoch": 6026} {"train_loss": -27.466272354125977, "global_step": 500186, "epoch": 6026} {"train_loss": -27.57594108581543, "global_step": 500187, "epoch": 6026} {"train_loss": -27.57118034362793, "global_step": 500188, "epoch": 6026} {"train_loss": -27.729385375976562, "global_step": 500189, "epoch": 6026} {"train_loss": -27.534215927124023, "global_step": 500190, "epoch": 6026} {"train_loss": -27.578054428100586, "global_step": 500191, "epoch": 6026} {"train_loss": -27.891010284423828, "global_step": 500192, "epoch": 6026} {"train_loss": -27.440011978149414, "global_step": 500193, "epoch": 6026} {"train_loss": -27.112783432006836, "global_step": 500194, "epoch": 6026} {"train_loss": -27.6852970123291, "global_step": 500195, "epoch": 6026} {"train_loss": -27.721464157104492, "global_step": 500196, "epoch": 6026} {"train_loss": -27.473676681518555, "global_step": 500197, "epoch": 6026} {"train_loss": -26.858259201049805, "global_step": 500198, "epoch": 6026} {"train_loss": -27.060911178588867, "global_step": 500199, "epoch": 6026} {"train_loss": -27.67757225036621, "global_step": 500200, "epoch": 6026} {"train_loss": -27.2315616607666, "global_step": 500201, "epoch": 6026} {"train_loss": -27.100391387939453, "global_step": 500202, "epoch": 6026} {"train_loss": -27.0349178314209, "global_step": 500203, "epoch": 6026} {"train_loss": -26.633106231689453, "global_step": 500204, "epoch": 6026} {"train_loss": -26.914045333862305, "global_step": 500205, "epoch": 6026} {"train_loss": -27.474889755249023, "global_step": 500206, "epoch": 6026} {"train_loss": -27.463794708251953, "global_step": 500207, "epoch": 6026} {"train_loss": -27.338943481445312, "global_step": 500208, "epoch": 6026} {"train_loss": -27.498687744140625, "global_step": 500209, "epoch": 6026} {"train_loss": -27.602935791015625, "global_step": 500210, "epoch": 6026} {"train_loss": -27.01822280883789, "global_step": 500211, "epoch": 6026} {"train_loss": -27.514535903930664, "global_step": 500212, "epoch": 6026} {"train_loss": -27.711545944213867, "global_step": 500213, "epoch": 6026} {"train_loss": -27.223196029663086, "global_step": 500214, "epoch": 6026} {"train_loss": -27.42938804626465, "global_step": 500215, "epoch": 6026} {"train_loss": -27.550745010375977, "global_step": 500216, "epoch": 6026} {"train_loss": -26.9500789642334, "global_step": 500217, "epoch": 6026} {"train_loss": -27.66634178161621, "global_step": 500218, "epoch": 6026} {"train_loss": -27.543670654296875, "global_step": 500219, "epoch": 6026} {"train_loss": -27.721261978149414, "global_step": 500220, "epoch": 6026} {"train_loss": -27.916650772094727, "global_step": 500221, "epoch": 6026} {"train_loss": -27.317096710205078, "global_step": 500222, "epoch": 6026} {"train_loss": -27.44268226623535, "global_step": 500223, "epoch": 6026} {"train_loss": -27.2821102142334, "global_step": 500224, "epoch": 6026} {"train_loss": -27.41815757751465, "global_step": 500225, "epoch": 6026} {"train_loss": -27.356443405151367, "global_step": 500226, "epoch": 6026} {"train_loss": -27.733169555664062, "global_step": 500227, "epoch": 6026} {"train_loss": -27.337621688842773, "global_step": 500228, "epoch": 6026} {"train_loss": -27.47723388671875, "global_step": 500229, "epoch": 6026} {"train_loss": -27.536468505859375, "global_step": 500230, "epoch": 6026} {"train_loss": -27.844945907592773, "global_step": 500231, "epoch": 6026} {"train_loss": -27.26218032836914, "global_step": 500232, "epoch": 6026} {"train_loss": -27.554996490478516, "global_step": 500233, "epoch": 6026} {"train_loss": -27.18995475769043, "global_step": 500234, "epoch": 6026} {"train_loss": -27.728469848632812, "global_step": 500235, "epoch": 6026} {"train_loss": -27.33612060546875, "global_step": 500236, "epoch": 6026} {"train_loss": -27.308088302612305, "global_step": 500237, "epoch": 6026} {"train_loss": -27.691452026367188, "global_step": 500238, "epoch": 6026} {"train_loss": -27.598608016967773, "global_step": 500239, "epoch": 6026} {"train_loss": -27.337294681962714, "global_step": 500240, "epoch": 6026, "val_loss": 6678798.0} {"train_loss": -27.254980087280273, "global_step": 500241, "epoch": 6027} {"train_loss": -26.92063331604004, "global_step": 500242, "epoch": 6027} {"train_loss": -27.241928100585938, "global_step": 500243, "epoch": 6027} {"train_loss": -26.892301559448242, "global_step": 500244, "epoch": 6027} {"train_loss": -26.510578155517578, "global_step": 500245, "epoch": 6027} {"train_loss": -26.68073844909668, "global_step": 500246, "epoch": 6027} {"train_loss": -27.174360275268555, "global_step": 500247, "epoch": 6027} {"train_loss": -27.416624069213867, "global_step": 500248, "epoch": 6027} {"train_loss": -27.312606811523438, "global_step": 500249, "epoch": 6027} {"train_loss": -26.879669189453125, "global_step": 500250, "epoch": 6027} {"train_loss": -27.25638771057129, "global_step": 500251, "epoch": 6027} {"train_loss": -26.865283966064453, "global_step": 500252, "epoch": 6027} {"train_loss": -27.107446670532227, "global_step": 500253, "epoch": 6027} {"train_loss": -27.109832763671875, "global_step": 500254, "epoch": 6027} {"train_loss": -26.819543838500977, "global_step": 500255, "epoch": 6027} {"train_loss": -27.441492080688477, "global_step": 500256, "epoch": 6027} {"train_loss": -27.216772079467773, "global_step": 500257, "epoch": 6027} {"train_loss": -26.731794357299805, "global_step": 500258, "epoch": 6027} {"train_loss": -27.217432022094727, "global_step": 500259, "epoch": 6027} {"train_loss": -26.9974365234375, "global_step": 500260, "epoch": 6027} {"train_loss": -27.202619552612305, "global_step": 500261, "epoch": 6027} {"train_loss": -27.128515243530273, "global_step": 500262, "epoch": 6027} {"train_loss": -27.260894775390625, "global_step": 500263, "epoch": 6027} {"train_loss": -27.21209144592285, "global_step": 500264, "epoch": 6027} {"train_loss": -27.089828491210938, "global_step": 500265, "epoch": 6027} {"train_loss": -27.3103084564209, "global_step": 500266, "epoch": 6027} {"train_loss": -27.199132919311523, "global_step": 500267, "epoch": 6027} {"train_loss": -27.307592391967773, "global_step": 500268, "epoch": 6027} {"train_loss": -27.638458251953125, "global_step": 500269, "epoch": 6027} {"train_loss": -27.369306564331055, "global_step": 500270, "epoch": 6027} {"train_loss": -27.31622314453125, "global_step": 500271, "epoch": 6027} {"train_loss": -27.642507553100586, "global_step": 500272, "epoch": 6027} {"train_loss": -27.487384796142578, "global_step": 500273, "epoch": 6027} {"train_loss": -27.51397132873535, "global_step": 500274, "epoch": 6027} {"train_loss": -27.402755737304688, "global_step": 500275, "epoch": 6027} {"train_loss": -27.836393356323242, "global_step": 500276, "epoch": 6027} {"train_loss": -27.17242431640625, "global_step": 500277, "epoch": 6027} {"train_loss": -27.25748634338379, "global_step": 500278, "epoch": 6027} {"train_loss": -27.226423263549805, "global_step": 500279, "epoch": 6027} {"train_loss": -27.404409408569336, "global_step": 500280, "epoch": 6027} {"train_loss": -27.4710636138916, "global_step": 500281, "epoch": 6027} {"train_loss": -27.64615821838379, "global_step": 500282, "epoch": 6027} {"train_loss": -27.733814239501953, "global_step": 500283, "epoch": 6027} {"train_loss": -27.82883071899414, "global_step": 500284, "epoch": 6027} {"train_loss": -27.555734634399414, "global_step": 500285, "epoch": 6027} {"train_loss": -27.462072372436523, "global_step": 500286, "epoch": 6027} {"train_loss": -27.3193302154541, "global_step": 500287, "epoch": 6027} {"train_loss": -27.713336944580078, "global_step": 500288, "epoch": 6027} {"train_loss": -27.314733505249023, "global_step": 500289, "epoch": 6027} {"train_loss": -27.782812118530273, "global_step": 500290, "epoch": 6027} {"train_loss": -27.535730361938477, "global_step": 500291, "epoch": 6027} {"train_loss": -27.66407585144043, "global_step": 500292, "epoch": 6027} {"train_loss": -27.767669677734375, "global_step": 500293, "epoch": 6027} {"train_loss": -27.478452682495117, "global_step": 500294, "epoch": 6027} {"train_loss": -27.67069435119629, "global_step": 500295, "epoch": 6027} {"train_loss": -27.606107711791992, "global_step": 500296, "epoch": 6027} {"train_loss": -27.283334732055664, "global_step": 500297, "epoch": 6027} {"train_loss": -26.926361083984375, "global_step": 500298, "epoch": 6027} {"train_loss": -27.14520835876465, "global_step": 500299, "epoch": 6027} {"train_loss": -27.334033966064453, "global_step": 500300, "epoch": 6027} {"train_loss": -27.536436080932617, "global_step": 500301, "epoch": 6027} {"train_loss": -27.316394805908203, "global_step": 500302, "epoch": 6027} {"train_loss": -27.40858268737793, "global_step": 500303, "epoch": 6027} {"train_loss": -27.698089599609375, "global_step": 500304, "epoch": 6027} {"train_loss": -27.715442657470703, "global_step": 500305, "epoch": 6027} {"train_loss": -27.344955444335938, "global_step": 500306, "epoch": 6027} {"train_loss": -27.047901153564453, "global_step": 500307, "epoch": 6027} {"train_loss": -27.372894287109375, "global_step": 500308, "epoch": 6027} {"train_loss": -27.264585494995117, "global_step": 500309, "epoch": 6027} {"train_loss": -27.487272262573242, "global_step": 500310, "epoch": 6027} {"train_loss": -27.788190841674805, "global_step": 500311, "epoch": 6027} {"train_loss": -27.223220825195312, "global_step": 500312, "epoch": 6027} {"train_loss": -27.26730728149414, "global_step": 500313, "epoch": 6027} {"train_loss": -27.63614845275879, "global_step": 500314, "epoch": 6027} {"train_loss": -27.448974609375, "global_step": 500315, "epoch": 6027} {"train_loss": -26.7554988861084, "global_step": 500316, "epoch": 6027} {"train_loss": -27.01381492614746, "global_step": 500317, "epoch": 6027} {"train_loss": -27.637802124023438, "global_step": 500318, "epoch": 6027} {"train_loss": -27.065587997436523, "global_step": 500319, "epoch": 6027} {"train_loss": -26.87202262878418, "global_step": 500320, "epoch": 6027} {"train_loss": -27.2564754486084, "global_step": 500321, "epoch": 6027} {"train_loss": -27.211240768432617, "global_step": 500322, "epoch": 6027} {"train_loss": -27.317876930696418, "global_step": 500323, "epoch": 6027, "val_loss": 6622676.0} {"train_loss": -27.172760009765625, "global_step": 500324, "epoch": 6028} {"train_loss": -26.239904403686523, "global_step": 500325, "epoch": 6028} {"train_loss": -26.728519439697266, "global_step": 500326, "epoch": 6028} {"train_loss": -25.90561866760254, "global_step": 500327, "epoch": 6028} {"train_loss": -26.793994903564453, "global_step": 500328, "epoch": 6028} {"train_loss": -26.198963165283203, "global_step": 500329, "epoch": 6028} {"train_loss": -26.7450008392334, "global_step": 500330, "epoch": 6028} {"train_loss": -26.369863510131836, "global_step": 500331, "epoch": 6028} {"train_loss": -26.979862213134766, "global_step": 500332, "epoch": 6028} {"train_loss": -26.940155029296875, "global_step": 500333, "epoch": 6028} {"train_loss": -26.880582809448242, "global_step": 500334, "epoch": 6028} {"train_loss": -26.691511154174805, "global_step": 500335, "epoch": 6028} {"train_loss": -26.74433708190918, "global_step": 500336, "epoch": 6028} {"train_loss": -26.9758358001709, "global_step": 500337, "epoch": 6028} {"train_loss": -26.752859115600586, "global_step": 500338, "epoch": 6028} {"train_loss": -26.638349533081055, "global_step": 500339, "epoch": 6028} {"train_loss": -26.956769943237305, "global_step": 500340, "epoch": 6028} {"train_loss": -26.8334903717041, "global_step": 500341, "epoch": 6028} {"train_loss": -27.380704879760742, "global_step": 500342, "epoch": 6028} {"train_loss": -27.058408737182617, "global_step": 500343, "epoch": 6028} {"train_loss": -27.385908126831055, "global_step": 500344, "epoch": 6028} {"train_loss": -27.06060218811035, "global_step": 500345, "epoch": 6028} {"train_loss": -27.00699234008789, "global_step": 500346, "epoch": 6028} {"train_loss": -27.265201568603516, "global_step": 500347, "epoch": 6028} {"train_loss": -27.38652992248535, "global_step": 500348, "epoch": 6028} {"train_loss": -27.299182891845703, "global_step": 500349, "epoch": 6028} {"train_loss": -27.424530029296875, "global_step": 500350, "epoch": 6028} {"train_loss": -27.027257919311523, "global_step": 500351, "epoch": 6028} {"train_loss": -27.202056884765625, "global_step": 500352, "epoch": 6028} {"train_loss": -27.657760620117188, "global_step": 500353, "epoch": 6028} {"train_loss": -27.272207260131836, "global_step": 500354, "epoch": 6028} {"train_loss": -27.36933708190918, "global_step": 500355, "epoch": 6028} {"train_loss": -27.612354278564453, "global_step": 500356, "epoch": 6028} {"train_loss": -27.530725479125977, "global_step": 500357, "epoch": 6028} {"train_loss": -27.363327026367188, "global_step": 500358, "epoch": 6028} {"train_loss": -27.566186904907227, "global_step": 500359, "epoch": 6028} {"train_loss": -27.522184371948242, "global_step": 500360, "epoch": 6028} {"train_loss": -27.587697982788086, "global_step": 500361, "epoch": 6028} {"train_loss": -27.7531795501709, "global_step": 500362, "epoch": 6028} {"train_loss": -27.448461532592773, "global_step": 500363, "epoch": 6028} {"train_loss": -27.338027954101562, "global_step": 500364, "epoch": 6028} {"train_loss": -27.261022567749023, "global_step": 500365, "epoch": 6028} {"train_loss": -27.615528106689453, "global_step": 500366, "epoch": 6028} {"train_loss": -27.20798110961914, "global_step": 500367, "epoch": 6028} {"train_loss": -27.59113121032715, "global_step": 500368, "epoch": 6028} {"train_loss": -27.58426856994629, "global_step": 500369, "epoch": 6028} {"train_loss": -27.62775230407715, "global_step": 500370, "epoch": 6028} {"train_loss": -27.536169052124023, "global_step": 500371, "epoch": 6028} {"train_loss": -27.433425903320312, "global_step": 500372, "epoch": 6028} {"train_loss": -27.2961483001709, "global_step": 500373, "epoch": 6028} {"train_loss": -27.882843017578125, "global_step": 500374, "epoch": 6028} {"train_loss": -27.603225708007812, "global_step": 500375, "epoch": 6028} {"train_loss": -27.73481559753418, "global_step": 500376, "epoch": 6028} {"train_loss": -27.6243953704834, "global_step": 500377, "epoch": 6028} {"train_loss": -27.24616813659668, "global_step": 500378, "epoch": 6028} {"train_loss": -27.394458770751953, "global_step": 500379, "epoch": 6028} {"train_loss": -27.099897384643555, "global_step": 500380, "epoch": 6028} {"train_loss": -27.472431182861328, "global_step": 500381, "epoch": 6028} {"train_loss": -27.593494415283203, "global_step": 500382, "epoch": 6028} {"train_loss": -27.65715980529785, "global_step": 500383, "epoch": 6028} {"train_loss": -27.416425704956055, "global_step": 500384, "epoch": 6028} {"train_loss": -27.517454147338867, "global_step": 500385, "epoch": 6028} {"train_loss": -27.41855239868164, "global_step": 500386, "epoch": 6028} {"train_loss": -27.390106201171875, "global_step": 500387, "epoch": 6028} {"train_loss": -27.41259765625, "global_step": 500388, "epoch": 6028} {"train_loss": -27.27284049987793, "global_step": 500389, "epoch": 6028} {"train_loss": -27.21050453186035, "global_step": 500390, "epoch": 6028} {"train_loss": -27.26711082458496, "global_step": 500391, "epoch": 6028} {"train_loss": -27.273542404174805, "global_step": 500392, "epoch": 6028} {"train_loss": -26.873449325561523, "global_step": 500393, "epoch": 6028} {"train_loss": -27.971115112304688, "global_step": 500394, "epoch": 6028} {"train_loss": -26.865842819213867, "global_step": 500395, "epoch": 6028} {"train_loss": -26.52656364440918, "global_step": 500396, "epoch": 6028} {"train_loss": -27.0473575592041, "global_step": 500397, "epoch": 6028} {"train_loss": -26.914520263671875, "global_step": 500398, "epoch": 6028} {"train_loss": -27.315357208251953, "global_step": 500399, "epoch": 6028} {"train_loss": -27.01445960998535, "global_step": 500400, "epoch": 6028} {"train_loss": -26.47865104675293, "global_step": 500401, "epoch": 6028} {"train_loss": -27.08121681213379, "global_step": 500402, "epoch": 6028} {"train_loss": -26.848072052001953, "global_step": 500403, "epoch": 6028} {"train_loss": -26.656177520751953, "global_step": 500404, "epoch": 6028} {"train_loss": -26.89202308654785, "global_step": 500405, "epoch": 6028} {"train_loss": -27.172215381300592, "global_step": 500406, "epoch": 6028, "val_loss": 6818465.0} {"train_loss": -26.80963706970215, "global_step": 500407, "epoch": 6029} {"train_loss": -26.699542999267578, "global_step": 500408, "epoch": 6029} {"train_loss": -27.43226432800293, "global_step": 500409, "epoch": 6029} {"train_loss": -26.569433212280273, "global_step": 500410, "epoch": 6029} {"train_loss": -26.89023780822754, "global_step": 500411, "epoch": 6029} {"train_loss": -27.689382553100586, "global_step": 500412, "epoch": 6029} {"train_loss": -26.5870304107666, "global_step": 500413, "epoch": 6029} {"train_loss": -27.102630615234375, "global_step": 500414, "epoch": 6029} {"train_loss": -27.158735275268555, "global_step": 500415, "epoch": 6029} {"train_loss": -27.06263542175293, "global_step": 500416, "epoch": 6029} {"train_loss": -27.540685653686523, "global_step": 500417, "epoch": 6029} {"train_loss": -27.214340209960938, "global_step": 500418, "epoch": 6029} {"train_loss": -26.88837242126465, "global_step": 500419, "epoch": 6029} {"train_loss": -27.18650245666504, "global_step": 500420, "epoch": 6029} {"train_loss": -27.561248779296875, "global_step": 500421, "epoch": 6029} {"train_loss": -26.964324951171875, "global_step": 500422, "epoch": 6029} {"train_loss": -27.037567138671875, "global_step": 500423, "epoch": 6029} {"train_loss": -27.404285430908203, "global_step": 500424, "epoch": 6029} {"train_loss": -27.371984481811523, "global_step": 500425, "epoch": 6029} {"train_loss": -27.11065673828125, "global_step": 500426, "epoch": 6029} {"train_loss": -27.2928409576416, "global_step": 500427, "epoch": 6029} {"train_loss": -27.306304931640625, "global_step": 500428, "epoch": 6029} {"train_loss": -27.2152042388916, "global_step": 500429, "epoch": 6029} {"train_loss": -27.24287223815918, "global_step": 500430, "epoch": 6029} {"train_loss": -27.3939266204834, "global_step": 500431, "epoch": 6029} {"train_loss": -27.19745445251465, "global_step": 500432, "epoch": 6029} {"train_loss": -27.420703887939453, "global_step": 500433, "epoch": 6029} {"train_loss": -27.595930099487305, "global_step": 500434, "epoch": 6029} {"train_loss": -27.27213478088379, "global_step": 500435, "epoch": 6029} {"train_loss": -27.52705192565918, "global_step": 500436, "epoch": 6029} {"train_loss": -27.503341674804688, "global_step": 500437, "epoch": 6029} {"train_loss": -27.790130615234375, "global_step": 500438, "epoch": 6029} {"train_loss": -27.44631004333496, "global_step": 500439, "epoch": 6029} {"train_loss": -27.574207305908203, "global_step": 500440, "epoch": 6029} {"train_loss": -27.343835830688477, "global_step": 500441, "epoch": 6029} {"train_loss": -27.713001251220703, "global_step": 500442, "epoch": 6029} {"train_loss": -27.933212280273438, "global_step": 500443, "epoch": 6029} {"train_loss": -27.710437774658203, "global_step": 500444, "epoch": 6029} {"train_loss": -27.823455810546875, "global_step": 500445, "epoch": 6029} {"train_loss": -27.63343620300293, "global_step": 500446, "epoch": 6029} {"train_loss": -27.396757125854492, "global_step": 500447, "epoch": 6029} {"train_loss": -27.443878173828125, "global_step": 500448, "epoch": 6029} {"train_loss": -27.285236358642578, "global_step": 500449, "epoch": 6029} {"train_loss": -27.68381690979004, "global_step": 500450, "epoch": 6029} {"train_loss": -27.708454132080078, "global_step": 500451, "epoch": 6029} {"train_loss": -27.944446563720703, "global_step": 500452, "epoch": 6029} {"train_loss": -27.577665328979492, "global_step": 500453, "epoch": 6029} {"train_loss": -27.6859073638916, "global_step": 500454, "epoch": 6029} {"train_loss": -27.204191207885742, "global_step": 500455, "epoch": 6029} {"train_loss": -27.105365753173828, "global_step": 500456, "epoch": 6029} {"train_loss": -26.64349365234375, "global_step": 500457, "epoch": 6029} {"train_loss": -26.37830924987793, "global_step": 500458, "epoch": 6029} {"train_loss": -26.762054443359375, "global_step": 500459, "epoch": 6029} {"train_loss": -26.998533248901367, "global_step": 500460, "epoch": 6029} {"train_loss": -26.71826171875, "global_step": 500461, "epoch": 6029} {"train_loss": -26.533935546875, "global_step": 500462, "epoch": 6029} {"train_loss": -26.810901641845703, "global_step": 500463, "epoch": 6029} {"train_loss": -26.899261474609375, "global_step": 500464, "epoch": 6029} {"train_loss": -27.368820190429688, "global_step": 500465, "epoch": 6029} {"train_loss": -27.399097442626953, "global_step": 500466, "epoch": 6029} {"train_loss": -27.172531127929688, "global_step": 500467, "epoch": 6029} {"train_loss": -27.623510360717773, "global_step": 500468, "epoch": 6029} {"train_loss": -27.286039352416992, "global_step": 500469, "epoch": 6029} {"train_loss": -27.60450553894043, "global_step": 500470, "epoch": 6029} {"train_loss": -27.394535064697266, "global_step": 500471, "epoch": 6029} {"train_loss": -27.59405517578125, "global_step": 500472, "epoch": 6029} {"train_loss": -27.492902755737305, "global_step": 500473, "epoch": 6029} {"train_loss": -27.22296714782715, "global_step": 500474, "epoch": 6029} {"train_loss": -26.794391632080078, "global_step": 500475, "epoch": 6029} {"train_loss": -27.365339279174805, "global_step": 500476, "epoch": 6029} {"train_loss": -27.2216854095459, "global_step": 500477, "epoch": 6029} {"train_loss": -27.013193130493164, "global_step": 500478, "epoch": 6029} {"train_loss": -27.481830596923828, "global_step": 500479, "epoch": 6029} {"train_loss": -27.014429092407227, "global_step": 500480, "epoch": 6029} {"train_loss": -27.218259811401367, "global_step": 500481, "epoch": 6029} {"train_loss": -27.280942916870117, "global_step": 500482, "epoch": 6029} {"train_loss": -27.210424423217773, "global_step": 500483, "epoch": 6029} {"train_loss": -27.472675323486328, "global_step": 500484, "epoch": 6029} {"train_loss": -27.507654190063477, "global_step": 500485, "epoch": 6029} {"train_loss": -27.541757583618164, "global_step": 500486, "epoch": 6029} {"train_loss": -27.54273796081543, "global_step": 500487, "epoch": 6029} {"train_loss": -27.382474899291992, "global_step": 500488, "epoch": 6029} {"train_loss": -27.281657621084925, "global_step": 500489, "epoch": 6029, "val_loss": 6659127.0} {"train_loss": -27.58758544921875, "global_step": 500490, "epoch": 6030} {"train_loss": -27.5176944732666, "global_step": 500491, "epoch": 6030} {"train_loss": -27.64109230041504, "global_step": 500492, "epoch": 6030} {"train_loss": -27.5953426361084, "global_step": 500493, "epoch": 6030} {"train_loss": -27.34305763244629, "global_step": 500494, "epoch": 6030} {"train_loss": -27.423154830932617, "global_step": 500495, "epoch": 6030} {"train_loss": -27.643884658813477, "global_step": 500496, "epoch": 6030} {"train_loss": -27.147384643554688, "global_step": 500497, "epoch": 6030} {"train_loss": -27.4647216796875, "global_step": 500498, "epoch": 6030} {"train_loss": -27.33595085144043, "global_step": 500499, "epoch": 6030} {"train_loss": -27.43629264831543, "global_step": 500500, "epoch": 6030} {"train_loss": -27.057647705078125, "global_step": 500501, "epoch": 6030} {"train_loss": -27.629486083984375, "global_step": 500502, "epoch": 6030} {"train_loss": -27.277023315429688, "global_step": 500503, "epoch": 6030} {"train_loss": -27.243518829345703, "global_step": 500504, "epoch": 6030} {"train_loss": -27.03272819519043, "global_step": 500505, "epoch": 6030} {"train_loss": -26.51833152770996, "global_step": 500506, "epoch": 6030} {"train_loss": -26.924840927124023, "global_step": 500507, "epoch": 6030} {"train_loss": -27.2014217376709, "global_step": 500508, "epoch": 6030} {"train_loss": -27.279102325439453, "global_step": 500509, "epoch": 6030} {"train_loss": -27.356061935424805, "global_step": 500510, "epoch": 6030} {"train_loss": -26.950891494750977, "global_step": 500511, "epoch": 6030} {"train_loss": -26.742431640625, "global_step": 500512, "epoch": 6030} {"train_loss": -27.514495849609375, "global_step": 500513, "epoch": 6030} {"train_loss": -27.351428985595703, "global_step": 500514, "epoch": 6030} {"train_loss": -26.912433624267578, "global_step": 500515, "epoch": 6030} {"train_loss": -26.895709991455078, "global_step": 500516, "epoch": 6030} {"train_loss": -27.478504180908203, "global_step": 500517, "epoch": 6030} {"train_loss": -27.059295654296875, "global_step": 500518, "epoch": 6030} {"train_loss": -27.086462020874023, "global_step": 500519, "epoch": 6030} {"train_loss": -27.64985466003418, "global_step": 500520, "epoch": 6030} {"train_loss": -27.067707061767578, "global_step": 500521, "epoch": 6030} {"train_loss": -27.182968139648438, "global_step": 500522, "epoch": 6030} {"train_loss": -27.5629940032959, "global_step": 500523, "epoch": 6030} {"train_loss": -27.383319854736328, "global_step": 500524, "epoch": 6030} {"train_loss": -27.51344108581543, "global_step": 500525, "epoch": 6030} {"train_loss": -27.17091941833496, "global_step": 500526, "epoch": 6030} {"train_loss": -27.568933486938477, "global_step": 500527, "epoch": 6030} {"train_loss": -26.73261833190918, "global_step": 500528, "epoch": 6030} {"train_loss": -27.583215713500977, "global_step": 500529, "epoch": 6030} {"train_loss": -27.031192779541016, "global_step": 500530, "epoch": 6030} {"train_loss": -27.434423446655273, "global_step": 500531, "epoch": 6030} {"train_loss": -27.2708740234375, "global_step": 500532, "epoch": 6030} {"train_loss": -26.941015243530273, "global_step": 500533, "epoch": 6030} {"train_loss": -27.226842880249023, "global_step": 500534, "epoch": 6030} {"train_loss": -27.330963134765625, "global_step": 500535, "epoch": 6030} {"train_loss": -27.343982696533203, "global_step": 500536, "epoch": 6030} {"train_loss": -27.3512020111084, "global_step": 500537, "epoch": 6030} {"train_loss": -27.251495361328125, "global_step": 500538, "epoch": 6030} {"train_loss": -27.290119171142578, "global_step": 500539, "epoch": 6030} {"train_loss": -27.819507598876953, "global_step": 500540, "epoch": 6030} {"train_loss": -27.34552001953125, "global_step": 500541, "epoch": 6030} {"train_loss": -27.601816177368164, "global_step": 500542, "epoch": 6030} {"train_loss": -27.515644073486328, "global_step": 500543, "epoch": 6030} {"train_loss": -27.413986206054688, "global_step": 500544, "epoch": 6030} {"train_loss": -27.850040435791016, "global_step": 500545, "epoch": 6030} {"train_loss": -27.453458786010742, "global_step": 500546, "epoch": 6030} {"train_loss": -27.5712890625, "global_step": 500547, "epoch": 6030} {"train_loss": -27.570951461791992, "global_step": 500548, "epoch": 6030} {"train_loss": -27.63924217224121, "global_step": 500549, "epoch": 6030} {"train_loss": -27.588266372680664, "global_step": 500550, "epoch": 6030} {"train_loss": -27.549463272094727, "global_step": 500551, "epoch": 6030} {"train_loss": -27.164480209350586, "global_step": 500552, "epoch": 6030} {"train_loss": -27.6085147857666, "global_step": 500553, "epoch": 6030} {"train_loss": -27.39983558654785, "global_step": 500554, "epoch": 6030} {"train_loss": -27.449182510375977, "global_step": 500555, "epoch": 6030} {"train_loss": -27.414901733398438, "global_step": 500556, "epoch": 6030} {"train_loss": -27.480566024780273, "global_step": 500557, "epoch": 6030} {"train_loss": -27.421558380126953, "global_step": 500558, "epoch": 6030} {"train_loss": -27.45501708984375, "global_step": 500559, "epoch": 6030} {"train_loss": -27.63511085510254, "global_step": 500560, "epoch": 6030} {"train_loss": -27.514007568359375, "global_step": 500561, "epoch": 6030} {"train_loss": -27.632678985595703, "global_step": 500562, "epoch": 6030} {"train_loss": -27.346057891845703, "global_step": 500563, "epoch": 6030} {"train_loss": -27.87094497680664, "global_step": 500564, "epoch": 6030} {"train_loss": -27.414464950561523, "global_step": 500565, "epoch": 6030} {"train_loss": -27.81081199645996, "global_step": 500566, "epoch": 6030} {"train_loss": -27.458267211914062, "global_step": 500567, "epoch": 6030} {"train_loss": -27.433704376220703, "global_step": 500568, "epoch": 6030} {"train_loss": -27.57887077331543, "global_step": 500569, "epoch": 6030} {"train_loss": -27.39240074157715, "global_step": 500570, "epoch": 6030} {"train_loss": -27.451404571533203, "global_step": 500571, "epoch": 6030} {"train_loss": -27.37517961249294, "global_step": 500572, "epoch": 6030, "val_loss": 6629426.0} {"train_loss": -26.740985870361328, "global_step": 500573, "epoch": 6031} {"train_loss": -26.8096866607666, "global_step": 500574, "epoch": 6031} {"train_loss": -26.38773536682129, "global_step": 500575, "epoch": 6031} {"train_loss": -27.00201416015625, "global_step": 500576, "epoch": 6031} {"train_loss": -27.07362174987793, "global_step": 500577, "epoch": 6031} {"train_loss": -27.304981231689453, "global_step": 500578, "epoch": 6031} {"train_loss": -27.072763442993164, "global_step": 500579, "epoch": 6031} {"train_loss": -27.102237701416016, "global_step": 500580, "epoch": 6031} {"train_loss": -26.78223991394043, "global_step": 500581, "epoch": 6031} {"train_loss": -26.91214942932129, "global_step": 500582, "epoch": 6031} {"train_loss": -27.1422176361084, "global_step": 500583, "epoch": 6031} {"train_loss": -27.420425415039062, "global_step": 500584, "epoch": 6031} {"train_loss": -27.340301513671875, "global_step": 500585, "epoch": 6031} {"train_loss": -26.844785690307617, "global_step": 500586, "epoch": 6031} {"train_loss": -27.41212272644043, "global_step": 500587, "epoch": 6031} {"train_loss": -26.898019790649414, "global_step": 500588, "epoch": 6031} {"train_loss": -27.516660690307617, "global_step": 500589, "epoch": 6031} {"train_loss": -27.102827072143555, "global_step": 500590, "epoch": 6031} {"train_loss": -27.029071807861328, "global_step": 500591, "epoch": 6031} {"train_loss": -27.191869735717773, "global_step": 500592, "epoch": 6031} {"train_loss": -26.850116729736328, "global_step": 500593, "epoch": 6031} {"train_loss": -27.280902862548828, "global_step": 500594, "epoch": 6031} {"train_loss": -27.121078491210938, "global_step": 500595, "epoch": 6031} {"train_loss": -27.194494247436523, "global_step": 500596, "epoch": 6031} {"train_loss": -27.305662155151367, "global_step": 500597, "epoch": 6031} {"train_loss": -27.412397384643555, "global_step": 500598, "epoch": 6031} {"train_loss": -27.368295669555664, "global_step": 500599, "epoch": 6031} {"train_loss": -27.284582138061523, "global_step": 500600, "epoch": 6031} {"train_loss": -27.289426803588867, "global_step": 500601, "epoch": 6031} {"train_loss": -27.413040161132812, "global_step": 500602, "epoch": 6031} {"train_loss": -27.463422775268555, "global_step": 500603, "epoch": 6031} {"train_loss": -27.29694175720215, "global_step": 500604, "epoch": 6031} {"train_loss": -27.219762802124023, "global_step": 500605, "epoch": 6031} {"train_loss": -27.17144775390625, "global_step": 500606, "epoch": 6031} {"train_loss": -27.26630973815918, "global_step": 500607, "epoch": 6031} {"train_loss": -27.623197555541992, "global_step": 500608, "epoch": 6031} {"train_loss": -27.48065185546875, "global_step": 500609, "epoch": 6031} {"train_loss": -27.38178062438965, "global_step": 500610, "epoch": 6031} {"train_loss": -27.7866153717041, "global_step": 500611, "epoch": 6031} {"train_loss": -27.336414337158203, "global_step": 500612, "epoch": 6031} {"train_loss": -27.538007736206055, "global_step": 500613, "epoch": 6031} {"train_loss": -27.88775634765625, "global_step": 500614, "epoch": 6031} {"train_loss": -27.53339958190918, "global_step": 500615, "epoch": 6031} {"train_loss": -27.55706787109375, "global_step": 500616, "epoch": 6031} {"train_loss": -27.53133201599121, "global_step": 500617, "epoch": 6031} {"train_loss": -27.0573673248291, "global_step": 500618, "epoch": 6031} {"train_loss": -27.45112419128418, "global_step": 500619, "epoch": 6031} {"train_loss": -27.34273338317871, "global_step": 500620, "epoch": 6031} {"train_loss": -27.536392211914062, "global_step": 500621, "epoch": 6031} {"train_loss": -27.56324577331543, "global_step": 500622, "epoch": 6031} {"train_loss": -27.561689376831055, "global_step": 500623, "epoch": 6031} {"train_loss": -27.894290924072266, "global_step": 500624, "epoch": 6031} {"train_loss": -27.67964744567871, "global_step": 500625, "epoch": 6031} {"train_loss": -27.605396270751953, "global_step": 500626, "epoch": 6031} {"train_loss": -27.493244171142578, "global_step": 500627, "epoch": 6031} {"train_loss": -27.45513343811035, "global_step": 500628, "epoch": 6031} {"train_loss": -27.477069854736328, "global_step": 500629, "epoch": 6031} {"train_loss": -27.3847599029541, "global_step": 500630, "epoch": 6031} {"train_loss": -27.460355758666992, "global_step": 500631, "epoch": 6031} {"train_loss": -27.72041130065918, "global_step": 500632, "epoch": 6031} {"train_loss": -27.292652130126953, "global_step": 500633, "epoch": 6031} {"train_loss": -27.8809757232666, "global_step": 500634, "epoch": 6031} {"train_loss": -27.260488510131836, "global_step": 500635, "epoch": 6031} {"train_loss": -27.137784957885742, "global_step": 500636, "epoch": 6031} {"train_loss": -27.719751358032227, "global_step": 500637, "epoch": 6031} {"train_loss": -27.724912643432617, "global_step": 500638, "epoch": 6031} {"train_loss": -27.298364639282227, "global_step": 500639, "epoch": 6031} {"train_loss": -27.522241592407227, "global_step": 500640, "epoch": 6031} {"train_loss": -27.8856201171875, "global_step": 500641, "epoch": 6031} {"train_loss": -27.5611629486084, "global_step": 500642, "epoch": 6031} {"train_loss": -27.5277099609375, "global_step": 500643, "epoch": 6031} {"train_loss": -27.285358428955078, "global_step": 500644, "epoch": 6031} {"train_loss": -27.36842918395996, "global_step": 500645, "epoch": 6031} {"train_loss": -27.08003807067871, "global_step": 500646, "epoch": 6031} {"train_loss": -26.934783935546875, "global_step": 500647, "epoch": 6031} {"train_loss": -26.750415802001953, "global_step": 500648, "epoch": 6031} {"train_loss": -26.98762321472168, "global_step": 500649, "epoch": 6031} {"train_loss": -27.30109214782715, "global_step": 500650, "epoch": 6031} {"train_loss": -26.691085815429688, "global_step": 500651, "epoch": 6031} {"train_loss": -26.852319717407227, "global_step": 500652, "epoch": 6031} {"train_loss": -27.05234718322754, "global_step": 500653, "epoch": 6031} {"train_loss": -26.966588973999023, "global_step": 500654, "epoch": 6031} {"train_loss": -27.304607023675757, "global_step": 500655, "epoch": 6031, "val_loss": 6652062.5} {"train_loss": -26.306486129760742, "global_step": 500656, "epoch": 6032} {"train_loss": -26.237979888916016, "global_step": 500657, "epoch": 6032} {"train_loss": -26.9852352142334, "global_step": 500658, "epoch": 6032} {"train_loss": -26.806676864624023, "global_step": 500659, "epoch": 6032} {"train_loss": -26.22393798828125, "global_step": 500660, "epoch": 6032} {"train_loss": -26.90308952331543, "global_step": 500661, "epoch": 6032} {"train_loss": -26.715774536132812, "global_step": 500662, "epoch": 6032} {"train_loss": -26.747940063476562, "global_step": 500663, "epoch": 6032} {"train_loss": -26.8304500579834, "global_step": 500664, "epoch": 6032} {"train_loss": -26.61651039123535, "global_step": 500665, "epoch": 6032} {"train_loss": -27.003503799438477, "global_step": 500666, "epoch": 6032} {"train_loss": -26.8388729095459, "global_step": 500667, "epoch": 6032} {"train_loss": -27.163557052612305, "global_step": 500668, "epoch": 6032} {"train_loss": -26.941003799438477, "global_step": 500669, "epoch": 6032} {"train_loss": -27.180282592773438, "global_step": 500670, "epoch": 6032} {"train_loss": -26.781824111938477, "global_step": 500671, "epoch": 6032} {"train_loss": -26.913543701171875, "global_step": 500672, "epoch": 6032} {"train_loss": -27.130401611328125, "global_step": 500673, "epoch": 6032} {"train_loss": -27.326812744140625, "global_step": 500674, "epoch": 6032} {"train_loss": -27.295801162719727, "global_step": 500675, "epoch": 6032} {"train_loss": -27.302722930908203, "global_step": 500676, "epoch": 6032} {"train_loss": -27.001230239868164, "global_step": 500677, "epoch": 6032} {"train_loss": -27.04913330078125, "global_step": 500678, "epoch": 6032} {"train_loss": -27.508819580078125, "global_step": 500679, "epoch": 6032} {"train_loss": -26.904199600219727, "global_step": 500680, "epoch": 6032} {"train_loss": -27.278654098510742, "global_step": 500681, "epoch": 6032} {"train_loss": -27.072479248046875, "global_step": 500682, "epoch": 6032} {"train_loss": -27.431232452392578, "global_step": 500683, "epoch": 6032} {"train_loss": -27.461593627929688, "global_step": 500684, "epoch": 6032} {"train_loss": -27.392541885375977, "global_step": 500685, "epoch": 6032} {"train_loss": -27.41097068786621, "global_step": 500686, "epoch": 6032} {"train_loss": -27.255645751953125, "global_step": 500687, "epoch": 6032} {"train_loss": -27.192712783813477, "global_step": 500688, "epoch": 6032} {"train_loss": -27.477008819580078, "global_step": 500689, "epoch": 6032} {"train_loss": -27.95184326171875, "global_step": 500690, "epoch": 6032} {"train_loss": -27.521045684814453, "global_step": 500691, "epoch": 6032} {"train_loss": -27.022802352905273, "global_step": 500692, "epoch": 6032} {"train_loss": -27.666471481323242, "global_step": 500693, "epoch": 6032} {"train_loss": -27.257572174072266, "global_step": 500694, "epoch": 6032} {"train_loss": -27.62338638305664, "global_step": 500695, "epoch": 6032} {"train_loss": -27.231287002563477, "global_step": 500696, "epoch": 6032} {"train_loss": -27.5677433013916, "global_step": 500697, "epoch": 6032} {"train_loss": -27.370941162109375, "global_step": 500698, "epoch": 6032} {"train_loss": -27.424030303955078, "global_step": 500699, "epoch": 6032} {"train_loss": -27.41250991821289, "global_step": 500700, "epoch": 6032} {"train_loss": -27.394439697265625, "global_step": 500701, "epoch": 6032} {"train_loss": -27.394006729125977, "global_step": 500702, "epoch": 6032} {"train_loss": -27.197412490844727, "global_step": 500703, "epoch": 6032} {"train_loss": -27.23624610900879, "global_step": 500704, "epoch": 6032} {"train_loss": -27.670557022094727, "global_step": 500705, "epoch": 6032} {"train_loss": -27.597126007080078, "global_step": 500706, "epoch": 6032} {"train_loss": -27.867918014526367, "global_step": 500707, "epoch": 6032} {"train_loss": -27.362823486328125, "global_step": 500708, "epoch": 6032} {"train_loss": -27.329294204711914, "global_step": 500709, "epoch": 6032} {"train_loss": -27.600830078125, "global_step": 500710, "epoch": 6032} {"train_loss": -27.406818389892578, "global_step": 500711, "epoch": 6032} {"train_loss": -27.388702392578125, "global_step": 500712, "epoch": 6032} {"train_loss": -27.372180938720703, "global_step": 500713, "epoch": 6032} {"train_loss": -27.731769561767578, "global_step": 500714, "epoch": 6032} {"train_loss": -27.8249454498291, "global_step": 500715, "epoch": 6032} {"train_loss": -27.548816680908203, "global_step": 500716, "epoch": 6032} {"train_loss": -27.763843536376953, "global_step": 500717, "epoch": 6032} {"train_loss": -27.492008209228516, "global_step": 500718, "epoch": 6032} {"train_loss": -27.378767013549805, "global_step": 500719, "epoch": 6032} {"train_loss": -27.452695846557617, "global_step": 500720, "epoch": 6032} {"train_loss": -27.60590171813965, "global_step": 500721, "epoch": 6032} {"train_loss": -27.434595108032227, "global_step": 500722, "epoch": 6032} {"train_loss": -27.589950561523438, "global_step": 500723, "epoch": 6032} {"train_loss": -27.6783447265625, "global_step": 500724, "epoch": 6032} {"train_loss": -27.54937171936035, "global_step": 500725, "epoch": 6032} {"train_loss": -27.633100509643555, "global_step": 500726, "epoch": 6032} {"train_loss": -26.788434982299805, "global_step": 500727, "epoch": 6032} {"train_loss": -27.10782814025879, "global_step": 500728, "epoch": 6032} {"train_loss": -27.46770668029785, "global_step": 500729, "epoch": 6032} {"train_loss": -27.20267677307129, "global_step": 500730, "epoch": 6032} {"train_loss": -26.751012802124023, "global_step": 500731, "epoch": 6032} {"train_loss": -26.670557022094727, "global_step": 500732, "epoch": 6032} {"train_loss": -27.1879825592041, "global_step": 500733, "epoch": 6032} {"train_loss": -27.333847045898438, "global_step": 500734, "epoch": 6032} {"train_loss": -27.479846954345703, "global_step": 500735, "epoch": 6032} {"train_loss": -26.506366729736328, "global_step": 500736, "epoch": 6032} {"train_loss": -27.301593780517578, "global_step": 500737, "epoch": 6032} {"train_loss": -27.25487506820495, "global_step": 500738, "epoch": 6032, "val_loss": 6654804.0} {"train_loss": -26.95269203186035, "global_step": 500739, "epoch": 6033} {"train_loss": -26.16033363342285, "global_step": 500740, "epoch": 6033} {"train_loss": -26.762537002563477, "global_step": 500741, "epoch": 6033} {"train_loss": -26.631332397460938, "global_step": 500742, "epoch": 6033} {"train_loss": -26.832300186157227, "global_step": 500743, "epoch": 6033} {"train_loss": -27.0932674407959, "global_step": 500744, "epoch": 6033} {"train_loss": -26.69805908203125, "global_step": 500745, "epoch": 6033} {"train_loss": -27.108875274658203, "global_step": 500746, "epoch": 6033} {"train_loss": -26.939023971557617, "global_step": 500747, "epoch": 6033} {"train_loss": -26.880380630493164, "global_step": 500748, "epoch": 6033} {"train_loss": -26.948217391967773, "global_step": 500749, "epoch": 6033} {"train_loss": -26.94831657409668, "global_step": 500750, "epoch": 6033} {"train_loss": -26.741037368774414, "global_step": 500751, "epoch": 6033} {"train_loss": -27.160572052001953, "global_step": 500752, "epoch": 6033} {"train_loss": -27.106687545776367, "global_step": 500753, "epoch": 6033} {"train_loss": -26.97285270690918, "global_step": 500754, "epoch": 6033} {"train_loss": -27.102130889892578, "global_step": 500755, "epoch": 6033} {"train_loss": -27.122211456298828, "global_step": 500756, "epoch": 6033} {"train_loss": -27.41940689086914, "global_step": 500757, "epoch": 6033} {"train_loss": -27.10145378112793, "global_step": 500758, "epoch": 6033} {"train_loss": -27.028467178344727, "global_step": 500759, "epoch": 6033} {"train_loss": -27.37483024597168, "global_step": 500760, "epoch": 6033} {"train_loss": -27.412946701049805, "global_step": 500761, "epoch": 6033} {"train_loss": -27.172866821289062, "global_step": 500762, "epoch": 6033} {"train_loss": -27.248462677001953, "global_step": 500763, "epoch": 6033} {"train_loss": -27.377893447875977, "global_step": 500764, "epoch": 6033} {"train_loss": -27.75396728515625, "global_step": 500765, "epoch": 6033} {"train_loss": -27.596323013305664, "global_step": 500766, "epoch": 6033} {"train_loss": -27.554065704345703, "global_step": 500767, "epoch": 6033} {"train_loss": -27.6748104095459, "global_step": 500768, "epoch": 6033} {"train_loss": -27.48065757751465, "global_step": 500769, "epoch": 6033} {"train_loss": -27.2309513092041, "global_step": 500770, "epoch": 6033} {"train_loss": -27.566669464111328, "global_step": 500771, "epoch": 6033} {"train_loss": -27.622833251953125, "global_step": 500772, "epoch": 6033} {"train_loss": -27.381805419921875, "global_step": 500773, "epoch": 6033} {"train_loss": -27.561847686767578, "global_step": 500774, "epoch": 6033} {"train_loss": -27.525238037109375, "global_step": 500775, "epoch": 6033} {"train_loss": -27.721881866455078, "global_step": 500776, "epoch": 6033} {"train_loss": -27.059906005859375, "global_step": 500777, "epoch": 6033} {"train_loss": -27.6734561920166, "global_step": 500778, "epoch": 6033} {"train_loss": -27.477014541625977, "global_step": 500779, "epoch": 6033} {"train_loss": -27.545568466186523, "global_step": 500780, "epoch": 6033} {"train_loss": -27.68646812438965, "global_step": 500781, "epoch": 6033} {"train_loss": -27.665851593017578, "global_step": 500782, "epoch": 6033} {"train_loss": -27.586627960205078, "global_step": 500783, "epoch": 6033} {"train_loss": -27.67885398864746, "global_step": 500784, "epoch": 6033} {"train_loss": -27.3084659576416, "global_step": 500785, "epoch": 6033} {"train_loss": -28.01862144470215, "global_step": 500786, "epoch": 6033} {"train_loss": -27.57281494140625, "global_step": 500787, "epoch": 6033} {"train_loss": -27.600128173828125, "global_step": 500788, "epoch": 6033} {"train_loss": -27.33835220336914, "global_step": 500789, "epoch": 6033} {"train_loss": -27.451313018798828, "global_step": 500790, "epoch": 6033} {"train_loss": -27.5070743560791, "global_step": 500791, "epoch": 6033} {"train_loss": -27.589496612548828, "global_step": 500792, "epoch": 6033} {"train_loss": -26.578393936157227, "global_step": 500793, "epoch": 6033} {"train_loss": -26.60102653503418, "global_step": 500794, "epoch": 6033} {"train_loss": -27.378767013549805, "global_step": 500795, "epoch": 6033} {"train_loss": -27.12555503845215, "global_step": 500796, "epoch": 6033} {"train_loss": -27.425983428955078, "global_step": 500797, "epoch": 6033} {"train_loss": -27.14935302734375, "global_step": 500798, "epoch": 6033} {"train_loss": -27.201202392578125, "global_step": 500799, "epoch": 6033} {"train_loss": -27.25221061706543, "global_step": 500800, "epoch": 6033} {"train_loss": -27.247568130493164, "global_step": 500801, "epoch": 6033} {"train_loss": -27.208127975463867, "global_step": 500802, "epoch": 6033} {"train_loss": -26.968046188354492, "global_step": 500803, "epoch": 6033} {"train_loss": -27.572168350219727, "global_step": 500804, "epoch": 6033} {"train_loss": -27.258947372436523, "global_step": 500805, "epoch": 6033} {"train_loss": -27.309558868408203, "global_step": 500806, "epoch": 6033} {"train_loss": -27.140729904174805, "global_step": 500807, "epoch": 6033} {"train_loss": -27.3629150390625, "global_step": 500808, "epoch": 6033} {"train_loss": -27.59815788269043, "global_step": 500809, "epoch": 6033} {"train_loss": -27.353342056274414, "global_step": 500810, "epoch": 6033} {"train_loss": -27.257858276367188, "global_step": 500811, "epoch": 6033} {"train_loss": -27.3861026763916, "global_step": 500812, "epoch": 6033} {"train_loss": -26.990610122680664, "global_step": 500813, "epoch": 6033} {"train_loss": -27.280166625976562, "global_step": 500814, "epoch": 6033} {"train_loss": -27.318775177001953, "global_step": 500815, "epoch": 6033} {"train_loss": -27.486438751220703, "global_step": 500816, "epoch": 6033} {"train_loss": -27.18366050720215, "global_step": 500817, "epoch": 6033} {"train_loss": -27.215417861938477, "global_step": 500818, "epoch": 6033} {"train_loss": -27.535919189453125, "global_step": 500819, "epoch": 6033} {"train_loss": -27.557592391967773, "global_step": 500820, "epoch": 6033} {"train_loss": -27.28000041088426, "global_step": 500821, "epoch": 6033, "val_loss": 6653855.0} {"train_loss": -26.7675838470459, "global_step": 500822, "epoch": 6034} {"train_loss": -26.7216854095459, "global_step": 500823, "epoch": 6034} {"train_loss": -26.408523559570312, "global_step": 500824, "epoch": 6034} {"train_loss": -27.20228385925293, "global_step": 500825, "epoch": 6034} {"train_loss": -26.608356475830078, "global_step": 500826, "epoch": 6034} {"train_loss": -26.86130714416504, "global_step": 500827, "epoch": 6034} {"train_loss": -27.442686080932617, "global_step": 500828, "epoch": 6034} {"train_loss": -27.1885986328125, "global_step": 500829, "epoch": 6034} {"train_loss": -26.9570255279541, "global_step": 500830, "epoch": 6034} {"train_loss": -27.257062911987305, "global_step": 500831, "epoch": 6034} {"train_loss": -27.125207901000977, "global_step": 500832, "epoch": 6034} {"train_loss": -26.83979606628418, "global_step": 500833, "epoch": 6034} {"train_loss": -27.23613929748535, "global_step": 500834, "epoch": 6034} {"train_loss": -26.86463737487793, "global_step": 500835, "epoch": 6034} {"train_loss": -26.876922607421875, "global_step": 500836, "epoch": 6034} {"train_loss": -27.368366241455078, "global_step": 500837, "epoch": 6034} {"train_loss": -26.895658493041992, "global_step": 500838, "epoch": 6034} {"train_loss": -26.731367111206055, "global_step": 500839, "epoch": 6034} {"train_loss": -27.03657341003418, "global_step": 500840, "epoch": 6034} {"train_loss": -27.481510162353516, "global_step": 500841, "epoch": 6034} {"train_loss": -26.869958877563477, "global_step": 500842, "epoch": 6034} {"train_loss": -27.56025505065918, "global_step": 500843, "epoch": 6034} {"train_loss": -27.28425407409668, "global_step": 500844, "epoch": 6034} {"train_loss": -27.097869873046875, "global_step": 500845, "epoch": 6034} {"train_loss": -27.61223793029785, "global_step": 500846, "epoch": 6034} {"train_loss": -27.032751083374023, "global_step": 500847, "epoch": 6034} {"train_loss": -27.134021759033203, "global_step": 500848, "epoch": 6034} {"train_loss": -27.2632999420166, "global_step": 500849, "epoch": 6034} {"train_loss": -27.387449264526367, "global_step": 500850, "epoch": 6034} {"train_loss": -26.755414962768555, "global_step": 500851, "epoch": 6034} {"train_loss": -27.78204345703125, "global_step": 500852, "epoch": 6034} {"train_loss": -27.50261878967285, "global_step": 500853, "epoch": 6034} {"train_loss": -27.25848960876465, "global_step": 500854, "epoch": 6034} {"train_loss": -27.43181800842285, "global_step": 500855, "epoch": 6034} {"train_loss": -27.245746612548828, "global_step": 500856, "epoch": 6034} {"train_loss": -27.432331085205078, "global_step": 500857, "epoch": 6034} {"train_loss": -27.46356773376465, "global_step": 500858, "epoch": 6034} {"train_loss": -27.626514434814453, "global_step": 500859, "epoch": 6034} {"train_loss": -27.406240463256836, "global_step": 500860, "epoch": 6034} {"train_loss": -27.77032470703125, "global_step": 500861, "epoch": 6034} {"train_loss": -27.026403427124023, "global_step": 500862, "epoch": 6034} {"train_loss": -27.468908309936523, "global_step": 500863, "epoch": 6034} {"train_loss": -27.557830810546875, "global_step": 500864, "epoch": 6034} {"train_loss": -27.036376953125, "global_step": 500865, "epoch": 6034} {"train_loss": -27.47022819519043, "global_step": 500866, "epoch": 6034} {"train_loss": -27.507226943969727, "global_step": 500867, "epoch": 6034} {"train_loss": -27.035566329956055, "global_step": 500868, "epoch": 6034} {"train_loss": -27.642993927001953, "global_step": 500869, "epoch": 6034} {"train_loss": -27.547128677368164, "global_step": 500870, "epoch": 6034} {"train_loss": -27.141199111938477, "global_step": 500871, "epoch": 6034} {"train_loss": -27.736923217773438, "global_step": 500872, "epoch": 6034} {"train_loss": -27.30341911315918, "global_step": 500873, "epoch": 6034} {"train_loss": -27.887109756469727, "global_step": 500874, "epoch": 6034} {"train_loss": -27.265228271484375, "global_step": 500875, "epoch": 6034} {"train_loss": -27.34799575805664, "global_step": 500876, "epoch": 6034} {"train_loss": -27.45713233947754, "global_step": 500877, "epoch": 6034} {"train_loss": -27.408613204956055, "global_step": 500878, "epoch": 6034} {"train_loss": -27.128416061401367, "global_step": 500879, "epoch": 6034} {"train_loss": -27.430740356445312, "global_step": 500880, "epoch": 6034} {"train_loss": -27.360105514526367, "global_step": 500881, "epoch": 6034} {"train_loss": -27.372968673706055, "global_step": 500882, "epoch": 6034} {"train_loss": -27.4064998626709, "global_step": 500883, "epoch": 6034} {"train_loss": -26.82242202758789, "global_step": 500884, "epoch": 6034} {"train_loss": -27.2089786529541, "global_step": 500885, "epoch": 6034} {"train_loss": -27.637304306030273, "global_step": 500886, "epoch": 6034} {"train_loss": -27.24897575378418, "global_step": 500887, "epoch": 6034} {"train_loss": -27.503173828125, "global_step": 500888, "epoch": 6034} {"train_loss": -27.23874282836914, "global_step": 500889, "epoch": 6034} {"train_loss": -27.39851188659668, "global_step": 500890, "epoch": 6034} {"train_loss": -27.37896728515625, "global_step": 500891, "epoch": 6034} {"train_loss": -27.36089515686035, "global_step": 500892, "epoch": 6034} {"train_loss": -27.55872917175293, "global_step": 500893, "epoch": 6034} {"train_loss": -27.393396377563477, "global_step": 500894, "epoch": 6034} {"train_loss": -27.603864669799805, "global_step": 500895, "epoch": 6034} {"train_loss": -27.604379653930664, "global_step": 500896, "epoch": 6034} {"train_loss": -27.699390411376953, "global_step": 500897, "epoch": 6034} {"train_loss": -27.843353271484375, "global_step": 500898, "epoch": 6034} {"train_loss": -27.828083038330078, "global_step": 500899, "epoch": 6034} {"train_loss": -27.436004638671875, "global_step": 500900, "epoch": 6034} {"train_loss": -27.081846237182617, "global_step": 500901, "epoch": 6034} {"train_loss": -27.24532127380371, "global_step": 500902, "epoch": 6034} {"train_loss": -27.512914657592773, "global_step": 500903, "epoch": 6034} {"train_loss": -27.303830939603138, "global_step": 500904, "epoch": 6034, "val_loss": 6644827.0} {"train_loss": -26.220245361328125, "global_step": 500905, "epoch": 6035} {"train_loss": -26.4638614654541, "global_step": 500906, "epoch": 6035} {"train_loss": -26.09771156311035, "global_step": 500907, "epoch": 6035} {"train_loss": -26.61812400817871, "global_step": 500908, "epoch": 6035} {"train_loss": -27.044910430908203, "global_step": 500909, "epoch": 6035} {"train_loss": -26.979597091674805, "global_step": 500910, "epoch": 6035} {"train_loss": -26.60637855529785, "global_step": 500911, "epoch": 6035} {"train_loss": -26.76454734802246, "global_step": 500912, "epoch": 6035} {"train_loss": -26.911218643188477, "global_step": 500913, "epoch": 6035} {"train_loss": -27.21359634399414, "global_step": 500914, "epoch": 6035} {"train_loss": -26.871051788330078, "global_step": 500915, "epoch": 6035} {"train_loss": -26.949005126953125, "global_step": 500916, "epoch": 6035} {"train_loss": -27.004562377929688, "global_step": 500917, "epoch": 6035} {"train_loss": -26.963626861572266, "global_step": 500918, "epoch": 6035} {"train_loss": -27.3348388671875, "global_step": 500919, "epoch": 6035} {"train_loss": -26.972196578979492, "global_step": 500920, "epoch": 6035} {"train_loss": -26.977075576782227, "global_step": 500921, "epoch": 6035} {"train_loss": -27.444116592407227, "global_step": 500922, "epoch": 6035} {"train_loss": -27.145288467407227, "global_step": 500923, "epoch": 6035} {"train_loss": -27.249048233032227, "global_step": 500924, "epoch": 6035} {"train_loss": -26.89942741394043, "global_step": 500925, "epoch": 6035} {"train_loss": -27.505979537963867, "global_step": 500926, "epoch": 6035} {"train_loss": -27.227399826049805, "global_step": 500927, "epoch": 6035} {"train_loss": -27.474775314331055, "global_step": 500928, "epoch": 6035} {"train_loss": -27.049026489257812, "global_step": 500929, "epoch": 6035} {"train_loss": -27.2970027923584, "global_step": 500930, "epoch": 6035} {"train_loss": -27.31048011779785, "global_step": 500931, "epoch": 6035} {"train_loss": -27.577564239501953, "global_step": 500932, "epoch": 6035} {"train_loss": -27.443464279174805, "global_step": 500933, "epoch": 6035} {"train_loss": -27.28779411315918, "global_step": 500934, "epoch": 6035} {"train_loss": -27.3455753326416, "global_step": 500935, "epoch": 6035} {"train_loss": -27.567258834838867, "global_step": 500936, "epoch": 6035} {"train_loss": -27.53558921813965, "global_step": 500937, "epoch": 6035} {"train_loss": -27.578800201416016, "global_step": 500938, "epoch": 6035} {"train_loss": -27.525007247924805, "global_step": 500939, "epoch": 6035} {"train_loss": -27.342782974243164, "global_step": 500940, "epoch": 6035} {"train_loss": -27.413116455078125, "global_step": 500941, "epoch": 6035} {"train_loss": -27.498828887939453, "global_step": 500942, "epoch": 6035} {"train_loss": -27.394210815429688, "global_step": 500943, "epoch": 6035} {"train_loss": -27.526105880737305, "global_step": 500944, "epoch": 6035} {"train_loss": -27.784109115600586, "global_step": 500945, "epoch": 6035} {"train_loss": -27.63722038269043, "global_step": 500946, "epoch": 6035} {"train_loss": -27.159149169921875, "global_step": 500947, "epoch": 6035} {"train_loss": -27.7397403717041, "global_step": 500948, "epoch": 6035} {"train_loss": -27.219480514526367, "global_step": 500949, "epoch": 6035} {"train_loss": -27.526630401611328, "global_step": 500950, "epoch": 6035} {"train_loss": -27.567188262939453, "global_step": 500951, "epoch": 6035} {"train_loss": -27.50310707092285, "global_step": 500952, "epoch": 6035} {"train_loss": -27.517486572265625, "global_step": 500953, "epoch": 6035} {"train_loss": -27.233551025390625, "global_step": 500954, "epoch": 6035} {"train_loss": -27.470001220703125, "global_step": 500955, "epoch": 6035} {"train_loss": -27.50465202331543, "global_step": 500956, "epoch": 6035} {"train_loss": -27.595502853393555, "global_step": 500957, "epoch": 6035} {"train_loss": -27.386829376220703, "global_step": 500958, "epoch": 6035} {"train_loss": -27.037912368774414, "global_step": 500959, "epoch": 6035} {"train_loss": -27.520751953125, "global_step": 500960, "epoch": 6035} {"train_loss": -27.731781005859375, "global_step": 500961, "epoch": 6035} {"train_loss": -27.126142501831055, "global_step": 500962, "epoch": 6035} {"train_loss": -26.858274459838867, "global_step": 500963, "epoch": 6035} {"train_loss": -27.482131958007812, "global_step": 500964, "epoch": 6035} {"train_loss": -27.1824951171875, "global_step": 500965, "epoch": 6035} {"train_loss": -27.681238174438477, "global_step": 500966, "epoch": 6035} {"train_loss": -27.454004287719727, "global_step": 500967, "epoch": 6035} {"train_loss": -27.666427612304688, "global_step": 500968, "epoch": 6035} {"train_loss": -27.785120010375977, "global_step": 500969, "epoch": 6035} {"train_loss": -27.335813522338867, "global_step": 500970, "epoch": 6035} {"train_loss": -26.73504638671875, "global_step": 500971, "epoch": 6035} {"train_loss": -27.709308624267578, "global_step": 500972, "epoch": 6035} {"train_loss": -27.162412643432617, "global_step": 500973, "epoch": 6035} {"train_loss": -27.401092529296875, "global_step": 500974, "epoch": 6035} {"train_loss": -27.152618408203125, "global_step": 500975, "epoch": 6035} {"train_loss": -27.54669189453125, "global_step": 500976, "epoch": 6035} {"train_loss": -27.700347900390625, "global_step": 500977, "epoch": 6035} {"train_loss": -27.3297176361084, "global_step": 500978, "epoch": 6035} {"train_loss": -27.196481704711914, "global_step": 500979, "epoch": 6035} {"train_loss": -27.472110748291016, "global_step": 500980, "epoch": 6035} {"train_loss": -27.13298988342285, "global_step": 500981, "epoch": 6035} {"train_loss": -27.116657257080078, "global_step": 500982, "epoch": 6035} {"train_loss": -26.839757919311523, "global_step": 500983, "epoch": 6035} {"train_loss": -27.475675582885742, "global_step": 500984, "epoch": 6035} {"train_loss": -27.338321685791016, "global_step": 500985, "epoch": 6035} {"train_loss": -27.2003231048584, "global_step": 500986, "epoch": 6035} {"train_loss": -27.25771272038839, "global_step": 500987, "epoch": 6035, "val_loss": 6598725.0} {"train_loss": -26.58770751953125, "global_step": 500988, "epoch": 6036} {"train_loss": -27.041278839111328, "global_step": 500989, "epoch": 6036} {"train_loss": -27.096487045288086, "global_step": 500990, "epoch": 6036} {"train_loss": -26.938467025756836, "global_step": 500991, "epoch": 6036} {"train_loss": -26.878925323486328, "global_step": 500992, "epoch": 6036} {"train_loss": -26.80610466003418, "global_step": 500993, "epoch": 6036} {"train_loss": -26.880542755126953, "global_step": 500994, "epoch": 6036} {"train_loss": -27.0032958984375, "global_step": 500995, "epoch": 6036} {"train_loss": -27.18548011779785, "global_step": 500996, "epoch": 6036} {"train_loss": -26.71708106994629, "global_step": 500997, "epoch": 6036} {"train_loss": -27.068384170532227, "global_step": 500998, "epoch": 6036} {"train_loss": -27.0288143157959, "global_step": 500999, "epoch": 6036} {"train_loss": -27.148681640625, "global_step": 501000, "epoch": 6036} {"train_loss": -27.427566528320312, "global_step": 501001, "epoch": 6036} {"train_loss": -26.984821319580078, "global_step": 501002, "epoch": 6036} {"train_loss": -27.28748893737793, "global_step": 501003, "epoch": 6036} {"train_loss": -27.29233169555664, "global_step": 501004, "epoch": 6036} {"train_loss": -27.225605010986328, "global_step": 501005, "epoch": 6036} {"train_loss": -27.347944259643555, "global_step": 501006, "epoch": 6036} {"train_loss": -27.081867218017578, "global_step": 501007, "epoch": 6036} {"train_loss": -27.233545303344727, "global_step": 501008, "epoch": 6036} {"train_loss": -27.54375648498535, "global_step": 501009, "epoch": 6036} {"train_loss": -27.444934844970703, "global_step": 501010, "epoch": 6036} {"train_loss": -27.26179313659668, "global_step": 501011, "epoch": 6036} {"train_loss": -27.45490074157715, "global_step": 501012, "epoch": 6036} {"train_loss": -27.380170822143555, "global_step": 501013, "epoch": 6036} {"train_loss": -27.458616256713867, "global_step": 501014, "epoch": 6036} {"train_loss": -27.231109619140625, "global_step": 501015, "epoch": 6036} {"train_loss": -27.111536026000977, "global_step": 501016, "epoch": 6036} {"train_loss": -27.383020401000977, "global_step": 501017, "epoch": 6036} {"train_loss": -27.429534912109375, "global_step": 501018, "epoch": 6036} {"train_loss": -27.543014526367188, "global_step": 501019, "epoch": 6036} {"train_loss": -27.64076042175293, "global_step": 501020, "epoch": 6036} {"train_loss": -27.3093204498291, "global_step": 501021, "epoch": 6036} {"train_loss": -26.963037490844727, "global_step": 501022, "epoch": 6036} {"train_loss": -27.454242706298828, "global_step": 501023, "epoch": 6036} {"train_loss": -27.36976432800293, "global_step": 501024, "epoch": 6036} {"train_loss": -27.769681930541992, "global_step": 501025, "epoch": 6036} {"train_loss": -27.58846092224121, "global_step": 501026, "epoch": 6036} {"train_loss": -27.29412269592285, "global_step": 501027, "epoch": 6036} {"train_loss": -27.279199600219727, "global_step": 501028, "epoch": 6036} {"train_loss": -27.5457763671875, "global_step": 501029, "epoch": 6036} {"train_loss": -27.419586181640625, "global_step": 501030, "epoch": 6036} {"train_loss": -27.315723419189453, "global_step": 501031, "epoch": 6036} {"train_loss": -27.631872177124023, "global_step": 501032, "epoch": 6036} {"train_loss": -27.70488929748535, "global_step": 501033, "epoch": 6036} {"train_loss": -27.58538818359375, "global_step": 501034, "epoch": 6036} {"train_loss": -27.382673263549805, "global_step": 501035, "epoch": 6036} {"train_loss": -27.55670738220215, "global_step": 501036, "epoch": 6036} {"train_loss": -27.487415313720703, "global_step": 501037, "epoch": 6036} {"train_loss": -27.51676368713379, "global_step": 501038, "epoch": 6036} {"train_loss": -27.333282470703125, "global_step": 501039, "epoch": 6036} {"train_loss": -27.30897331237793, "global_step": 501040, "epoch": 6036} {"train_loss": -27.189977645874023, "global_step": 501041, "epoch": 6036} {"train_loss": -27.40032958984375, "global_step": 501042, "epoch": 6036} {"train_loss": -27.517704010009766, "global_step": 501043, "epoch": 6036} {"train_loss": -27.607824325561523, "global_step": 501044, "epoch": 6036} {"train_loss": -27.627063751220703, "global_step": 501045, "epoch": 6036} {"train_loss": -27.25324821472168, "global_step": 501046, "epoch": 6036} {"train_loss": -27.4766788482666, "global_step": 501047, "epoch": 6036} {"train_loss": -27.82352066040039, "global_step": 501048, "epoch": 6036} {"train_loss": -27.556608200073242, "global_step": 501049, "epoch": 6036} {"train_loss": -27.35835075378418, "global_step": 501050, "epoch": 6036} {"train_loss": -26.917234420776367, "global_step": 501051, "epoch": 6036} {"train_loss": -26.860076904296875, "global_step": 501052, "epoch": 6036} {"train_loss": -27.735326766967773, "global_step": 501053, "epoch": 6036} {"train_loss": -27.774362564086914, "global_step": 501054, "epoch": 6036} {"train_loss": -27.04998779296875, "global_step": 501055, "epoch": 6036} {"train_loss": -27.1652774810791, "global_step": 501056, "epoch": 6036} {"train_loss": -27.367401123046875, "global_step": 501057, "epoch": 6036} {"train_loss": -27.6159725189209, "global_step": 501058, "epoch": 6036} {"train_loss": -27.568445205688477, "global_step": 501059, "epoch": 6036} {"train_loss": -27.534326553344727, "global_step": 501060, "epoch": 6036} {"train_loss": -27.4189395904541, "global_step": 501061, "epoch": 6036} {"train_loss": -27.605838775634766, "global_step": 501062, "epoch": 6036} {"train_loss": -27.186735153198242, "global_step": 501063, "epoch": 6036} {"train_loss": -27.415632247924805, "global_step": 501064, "epoch": 6036} {"train_loss": -27.5163516998291, "global_step": 501065, "epoch": 6036} {"train_loss": -27.398527145385742, "global_step": 501066, "epoch": 6036} {"train_loss": -27.527944564819336, "global_step": 501067, "epoch": 6036} {"train_loss": -27.532855987548828, "global_step": 501068, "epoch": 6036} {"train_loss": -27.308094024658203, "global_step": 501069, "epoch": 6036} {"train_loss": -27.310884222926862, "global_step": 501070, "epoch": 6036, "val_loss": 6675437.0} {"train_loss": -27.35505485534668, "global_step": 501071, "epoch": 6037} {"train_loss": -26.639440536499023, "global_step": 501072, "epoch": 6037} {"train_loss": -26.389251708984375, "global_step": 501073, "epoch": 6037} {"train_loss": -26.71197509765625, "global_step": 501074, "epoch": 6037} {"train_loss": -27.131153106689453, "global_step": 501075, "epoch": 6037} {"train_loss": -27.30158805847168, "global_step": 501076, "epoch": 6037} {"train_loss": -27.10443115234375, "global_step": 501077, "epoch": 6037} {"train_loss": -26.97639274597168, "global_step": 501078, "epoch": 6037} {"train_loss": -27.395034790039062, "global_step": 501079, "epoch": 6037} {"train_loss": -27.451398849487305, "global_step": 501080, "epoch": 6037} {"train_loss": -27.0560359954834, "global_step": 501081, "epoch": 6037} {"train_loss": -26.91297721862793, "global_step": 501082, "epoch": 6037} {"train_loss": -27.17938232421875, "global_step": 501083, "epoch": 6037} {"train_loss": -26.918989181518555, "global_step": 501084, "epoch": 6037} {"train_loss": -26.61908531188965, "global_step": 501085, "epoch": 6037} {"train_loss": -27.596267700195312, "global_step": 501086, "epoch": 6037} {"train_loss": -27.50397300720215, "global_step": 501087, "epoch": 6037} {"train_loss": -27.088720321655273, "global_step": 501088, "epoch": 6037} {"train_loss": -27.450611114501953, "global_step": 501089, "epoch": 6037} {"train_loss": -27.049606323242188, "global_step": 501090, "epoch": 6037} {"train_loss": -27.1398983001709, "global_step": 501091, "epoch": 6037} {"train_loss": -27.265289306640625, "global_step": 501092, "epoch": 6037} {"train_loss": -27.27487564086914, "global_step": 501093, "epoch": 6037} {"train_loss": -27.506711959838867, "global_step": 501094, "epoch": 6037} {"train_loss": -26.98982048034668, "global_step": 501095, "epoch": 6037} {"train_loss": -27.626840591430664, "global_step": 501096, "epoch": 6037} {"train_loss": -27.391321182250977, "global_step": 501097, "epoch": 6037} {"train_loss": -27.52491569519043, "global_step": 501098, "epoch": 6037} {"train_loss": -27.155187606811523, "global_step": 501099, "epoch": 6037} {"train_loss": -27.6743221282959, "global_step": 501100, "epoch": 6037} {"train_loss": -27.3095645904541, "global_step": 501101, "epoch": 6037} {"train_loss": -27.451129913330078, "global_step": 501102, "epoch": 6037} {"train_loss": -27.386646270751953, "global_step": 501103, "epoch": 6037} {"train_loss": -26.9659481048584, "global_step": 501104, "epoch": 6037} {"train_loss": -27.289220809936523, "global_step": 501105, "epoch": 6037} {"train_loss": -27.376026153564453, "global_step": 501106, "epoch": 6037} {"train_loss": -27.165746688842773, "global_step": 501107, "epoch": 6037} {"train_loss": -27.4123477935791, "global_step": 501108, "epoch": 6037} {"train_loss": -27.56640625, "global_step": 501109, "epoch": 6037} {"train_loss": -27.76551628112793, "global_step": 501110, "epoch": 6037} {"train_loss": -27.13166618347168, "global_step": 501111, "epoch": 6037} {"train_loss": -27.610177993774414, "global_step": 501112, "epoch": 6037} {"train_loss": -27.335668563842773, "global_step": 501113, "epoch": 6037} {"train_loss": -27.63983726501465, "global_step": 501114, "epoch": 6037} {"train_loss": -27.299203872680664, "global_step": 501115, "epoch": 6037} {"train_loss": -27.774066925048828, "global_step": 501116, "epoch": 6037} {"train_loss": -27.0609073638916, "global_step": 501117, "epoch": 6037} {"train_loss": -27.706090927124023, "global_step": 501118, "epoch": 6037} {"train_loss": -27.62872886657715, "global_step": 501119, "epoch": 6037} {"train_loss": -27.39577293395996, "global_step": 501120, "epoch": 6037} {"train_loss": -27.44632339477539, "global_step": 501121, "epoch": 6037} {"train_loss": -27.17689323425293, "global_step": 501122, "epoch": 6037} {"train_loss": -27.320531845092773, "global_step": 501123, "epoch": 6037} {"train_loss": -27.327451705932617, "global_step": 501124, "epoch": 6037} {"train_loss": -27.373594284057617, "global_step": 501125, "epoch": 6037} {"train_loss": -27.30702018737793, "global_step": 501126, "epoch": 6037} {"train_loss": -27.483625411987305, "global_step": 501127, "epoch": 6037} {"train_loss": -27.35402488708496, "global_step": 501128, "epoch": 6037} {"train_loss": -27.576459884643555, "global_step": 501129, "epoch": 6037} {"train_loss": -27.576705932617188, "global_step": 501130, "epoch": 6037} {"train_loss": -27.26004981994629, "global_step": 501131, "epoch": 6037} {"train_loss": -27.49018669128418, "global_step": 501132, "epoch": 6037} {"train_loss": -27.455968856811523, "global_step": 501133, "epoch": 6037} {"train_loss": -27.109268188476562, "global_step": 501134, "epoch": 6037} {"train_loss": -26.845335006713867, "global_step": 501135, "epoch": 6037} {"train_loss": -26.775182723999023, "global_step": 501136, "epoch": 6037} {"train_loss": -27.193891525268555, "global_step": 501137, "epoch": 6037} {"train_loss": -26.9187068939209, "global_step": 501138, "epoch": 6037} {"train_loss": -27.127033233642578, "global_step": 501139, "epoch": 6037} {"train_loss": -27.24533462524414, "global_step": 501140, "epoch": 6037} {"train_loss": -26.681732177734375, "global_step": 501141, "epoch": 6037} {"train_loss": -26.493152618408203, "global_step": 501142, "epoch": 6037} {"train_loss": -26.928510665893555, "global_step": 501143, "epoch": 6037} {"train_loss": -27.053619384765625, "global_step": 501144, "epoch": 6037} {"train_loss": -27.533796310424805, "global_step": 501145, "epoch": 6037} {"train_loss": -27.005239486694336, "global_step": 501146, "epoch": 6037} {"train_loss": -27.31049156188965, "global_step": 501147, "epoch": 6037} {"train_loss": -27.2761173248291, "global_step": 501148, "epoch": 6037} {"train_loss": -27.214618682861328, "global_step": 501149, "epoch": 6037} {"train_loss": -27.337909698486328, "global_step": 501150, "epoch": 6037} {"train_loss": -27.442626953125, "global_step": 501151, "epoch": 6037} {"train_loss": -27.158843994140625, "global_step": 501152, "epoch": 6037} {"train_loss": -27.234457728374434, "global_step": 501153, "epoch": 6037, "val_loss": 6572949.0} {"train_loss": -26.5134334564209, "global_step": 501154, "epoch": 6038} {"train_loss": -26.705230712890625, "global_step": 501155, "epoch": 6038} {"train_loss": -26.593570709228516, "global_step": 501156, "epoch": 6038} {"train_loss": -26.552480697631836, "global_step": 501157, "epoch": 6038} {"train_loss": -26.927703857421875, "global_step": 501158, "epoch": 6038} {"train_loss": -26.626089096069336, "global_step": 501159, "epoch": 6038} {"train_loss": -27.17815589904785, "global_step": 501160, "epoch": 6038} {"train_loss": -26.83609390258789, "global_step": 501161, "epoch": 6038} {"train_loss": -26.490558624267578, "global_step": 501162, "epoch": 6038} {"train_loss": -27.0426025390625, "global_step": 501163, "epoch": 6038} {"train_loss": -26.916906356811523, "global_step": 501164, "epoch": 6038} {"train_loss": -26.87225341796875, "global_step": 501165, "epoch": 6038} {"train_loss": -27.3045654296875, "global_step": 501166, "epoch": 6038} {"train_loss": -26.862791061401367, "global_step": 501167, "epoch": 6038} {"train_loss": -27.0345516204834, "global_step": 501168, "epoch": 6038} {"train_loss": -27.10212516784668, "global_step": 501169, "epoch": 6038} {"train_loss": -27.25030517578125, "global_step": 501170, "epoch": 6038} {"train_loss": -27.32472038269043, "global_step": 501171, "epoch": 6038} {"train_loss": -27.380231857299805, "global_step": 501172, "epoch": 6038} {"train_loss": -27.281396865844727, "global_step": 501173, "epoch": 6038} {"train_loss": -27.517377853393555, "global_step": 501174, "epoch": 6038} {"train_loss": -27.426313400268555, "global_step": 501175, "epoch": 6038} {"train_loss": -27.307132720947266, "global_step": 501176, "epoch": 6038} {"train_loss": -26.92087745666504, "global_step": 501177, "epoch": 6038} {"train_loss": -27.61441993713379, "global_step": 501178, "epoch": 6038} {"train_loss": -27.774005889892578, "global_step": 501179, "epoch": 6038} {"train_loss": -27.547290802001953, "global_step": 501180, "epoch": 6038} {"train_loss": -27.107105255126953, "global_step": 501181, "epoch": 6038} {"train_loss": -27.224863052368164, "global_step": 501182, "epoch": 6038} {"train_loss": -27.4974308013916, "global_step": 501183, "epoch": 6038} {"train_loss": -27.184720993041992, "global_step": 501184, "epoch": 6038} {"train_loss": -27.398120880126953, "global_step": 501185, "epoch": 6038} {"train_loss": -27.8023738861084, "global_step": 501186, "epoch": 6038} {"train_loss": -27.420042037963867, "global_step": 501187, "epoch": 6038} {"train_loss": -27.466938018798828, "global_step": 501188, "epoch": 6038} {"train_loss": -27.4284610748291, "global_step": 501189, "epoch": 6038} {"train_loss": -27.56106948852539, "global_step": 501190, "epoch": 6038} {"train_loss": -27.269683837890625, "global_step": 501191, "epoch": 6038} {"train_loss": -27.507221221923828, "global_step": 501192, "epoch": 6038} {"train_loss": -27.5037899017334, "global_step": 501193, "epoch": 6038} {"train_loss": -27.32436180114746, "global_step": 501194, "epoch": 6038} {"train_loss": -27.264591217041016, "global_step": 501195, "epoch": 6038} {"train_loss": -27.349454879760742, "global_step": 501196, "epoch": 6038} {"train_loss": -27.365070343017578, "global_step": 501197, "epoch": 6038} {"train_loss": -27.7042293548584, "global_step": 501198, "epoch": 6038} {"train_loss": -27.5924072265625, "global_step": 501199, "epoch": 6038} {"train_loss": -27.630023956298828, "global_step": 501200, "epoch": 6038} {"train_loss": -27.56219482421875, "global_step": 501201, "epoch": 6038} {"train_loss": -27.630722045898438, "global_step": 501202, "epoch": 6038} {"train_loss": -27.881086349487305, "global_step": 501203, "epoch": 6038} {"train_loss": -27.29783058166504, "global_step": 501204, "epoch": 6038} {"train_loss": -27.470325469970703, "global_step": 501205, "epoch": 6038} {"train_loss": -27.336334228515625, "global_step": 501206, "epoch": 6038} {"train_loss": -27.080402374267578, "global_step": 501207, "epoch": 6038} {"train_loss": -27.12662696838379, "global_step": 501208, "epoch": 6038} {"train_loss": -27.61635398864746, "global_step": 501209, "epoch": 6038} {"train_loss": -27.909637451171875, "global_step": 501210, "epoch": 6038} {"train_loss": -27.932165145874023, "global_step": 501211, "epoch": 6038} {"train_loss": -27.20920753479004, "global_step": 501212, "epoch": 6038} {"train_loss": -27.3384952545166, "global_step": 501213, "epoch": 6038} {"train_loss": -27.4117488861084, "global_step": 501214, "epoch": 6038} {"train_loss": -27.32085609436035, "global_step": 501215, "epoch": 6038} {"train_loss": -27.466772079467773, "global_step": 501216, "epoch": 6038} {"train_loss": -27.661365509033203, "global_step": 501217, "epoch": 6038} {"train_loss": -27.551624298095703, "global_step": 501218, "epoch": 6038} {"train_loss": -27.471601486206055, "global_step": 501219, "epoch": 6038} {"train_loss": -27.74648094177246, "global_step": 501220, "epoch": 6038} {"train_loss": -27.6401424407959, "global_step": 501221, "epoch": 6038} {"train_loss": -27.361358642578125, "global_step": 501222, "epoch": 6038} {"train_loss": -27.273664474487305, "global_step": 501223, "epoch": 6038} {"train_loss": -27.35624122619629, "global_step": 501224, "epoch": 6038} {"train_loss": -27.576147079467773, "global_step": 501225, "epoch": 6038} {"train_loss": -27.22829246520996, "global_step": 501226, "epoch": 6038} {"train_loss": -27.25717544555664, "global_step": 501227, "epoch": 6038} {"train_loss": -27.22540283203125, "global_step": 501228, "epoch": 6038} {"train_loss": -27.107772827148438, "global_step": 501229, "epoch": 6038} {"train_loss": -27.213647842407227, "global_step": 501230, "epoch": 6038} {"train_loss": -27.308441162109375, "global_step": 501231, "epoch": 6038} {"train_loss": -27.30141258239746, "global_step": 501232, "epoch": 6038} {"train_loss": -27.17460060119629, "global_step": 501233, "epoch": 6038} {"train_loss": -27.735776901245117, "global_step": 501234, "epoch": 6038} {"train_loss": -27.11102294921875, "global_step": 501235, "epoch": 6038} {"train_loss": -27.30583262156291, "global_step": 501236, "epoch": 6038, "val_loss": 6659524.0} {"train_loss": -26.4243221282959, "global_step": 501237, "epoch": 6039} {"train_loss": -24.991365432739258, "global_step": 501238, "epoch": 6039} {"train_loss": -24.936569213867188, "global_step": 501239, "epoch": 6039} {"train_loss": -26.361225128173828, "global_step": 501240, "epoch": 6039} {"train_loss": -25.25452423095703, "global_step": 501241, "epoch": 6039} {"train_loss": -25.90201187133789, "global_step": 501242, "epoch": 6039} {"train_loss": -25.73073387145996, "global_step": 501243, "epoch": 6039} {"train_loss": -25.7530517578125, "global_step": 501244, "epoch": 6039} {"train_loss": -26.262659072875977, "global_step": 501245, "epoch": 6039} {"train_loss": -25.95338249206543, "global_step": 501246, "epoch": 6039} {"train_loss": -26.322290420532227, "global_step": 501247, "epoch": 6039} {"train_loss": -26.43488883972168, "global_step": 501248, "epoch": 6039} {"train_loss": -26.535703659057617, "global_step": 501249, "epoch": 6039} {"train_loss": -25.71400260925293, "global_step": 501250, "epoch": 6039} {"train_loss": -27.15052604675293, "global_step": 501251, "epoch": 6039} {"train_loss": -26.152185440063477, "global_step": 501252, "epoch": 6039} {"train_loss": -26.816137313842773, "global_step": 501253, "epoch": 6039} {"train_loss": -26.707275390625, "global_step": 501254, "epoch": 6039} {"train_loss": -26.71097755432129, "global_step": 501255, "epoch": 6039} {"train_loss": -26.832197189331055, "global_step": 501256, "epoch": 6039} {"train_loss": -26.86016845703125, "global_step": 501257, "epoch": 6039} {"train_loss": -26.71066665649414, "global_step": 501258, "epoch": 6039} {"train_loss": -26.806961059570312, "global_step": 501259, "epoch": 6039} {"train_loss": -26.95157814025879, "global_step": 501260, "epoch": 6039} {"train_loss": -26.650390625, "global_step": 501261, "epoch": 6039} {"train_loss": -27.141111373901367, "global_step": 501262, "epoch": 6039} {"train_loss": -26.676984786987305, "global_step": 501263, "epoch": 6039} {"train_loss": -26.794086456298828, "global_step": 501264, "epoch": 6039} {"train_loss": -27.392898559570312, "global_step": 501265, "epoch": 6039} {"train_loss": -27.223241806030273, "global_step": 501266, "epoch": 6039} {"train_loss": -26.903650283813477, "global_step": 501267, "epoch": 6039} {"train_loss": -27.01468276977539, "global_step": 501268, "epoch": 6039} {"train_loss": -27.336828231811523, "global_step": 501269, "epoch": 6039} {"train_loss": -27.16482925415039, "global_step": 501270, "epoch": 6039} {"train_loss": -27.338642120361328, "global_step": 501271, "epoch": 6039} {"train_loss": -27.366886138916016, "global_step": 501272, "epoch": 6039} {"train_loss": -27.08896827697754, "global_step": 501273, "epoch": 6039} {"train_loss": -27.030141830444336, "global_step": 501274, "epoch": 6039} {"train_loss": -27.300256729125977, "global_step": 501275, "epoch": 6039} {"train_loss": -27.357309341430664, "global_step": 501276, "epoch": 6039} {"train_loss": -27.325719833374023, "global_step": 501277, "epoch": 6039} {"train_loss": -27.711902618408203, "global_step": 501278, "epoch": 6039} {"train_loss": -27.421401977539062, "global_step": 501279, "epoch": 6039} {"train_loss": -27.392053604125977, "global_step": 501280, "epoch": 6039} {"train_loss": -27.824878692626953, "global_step": 501281, "epoch": 6039} {"train_loss": -27.61008071899414, "global_step": 501282, "epoch": 6039} {"train_loss": -27.608972549438477, "global_step": 501283, "epoch": 6039} {"train_loss": -27.51812171936035, "global_step": 501284, "epoch": 6039} {"train_loss": -27.341440200805664, "global_step": 501285, "epoch": 6039} {"train_loss": -28.07838249206543, "global_step": 501286, "epoch": 6039} {"train_loss": -27.550275802612305, "global_step": 501287, "epoch": 6039} {"train_loss": -27.51896095275879, "global_step": 501288, "epoch": 6039} {"train_loss": -27.399871826171875, "global_step": 501289, "epoch": 6039} {"train_loss": -27.460712432861328, "global_step": 501290, "epoch": 6039} {"train_loss": -27.3978271484375, "global_step": 501291, "epoch": 6039} {"train_loss": -27.423690795898438, "global_step": 501292, "epoch": 6039} {"train_loss": -27.152734756469727, "global_step": 501293, "epoch": 6039} {"train_loss": -27.254302978515625, "global_step": 501294, "epoch": 6039} {"train_loss": -27.357421875, "global_step": 501295, "epoch": 6039} {"train_loss": -27.869338989257812, "global_step": 501296, "epoch": 6039} {"train_loss": -27.25238609313965, "global_step": 501297, "epoch": 6039} {"train_loss": -27.966068267822266, "global_step": 501298, "epoch": 6039} {"train_loss": -27.466955184936523, "global_step": 501299, "epoch": 6039} {"train_loss": -27.6272029876709, "global_step": 501300, "epoch": 6039} {"train_loss": -28.01641273498535, "global_step": 501301, "epoch": 6039} {"train_loss": -27.716293334960938, "global_step": 501302, "epoch": 6039} {"train_loss": -27.4124813079834, "global_step": 501303, "epoch": 6039} {"train_loss": -28.045690536499023, "global_step": 501304, "epoch": 6039} {"train_loss": -27.6328125, "global_step": 501305, "epoch": 6039} {"train_loss": -27.437585830688477, "global_step": 501306, "epoch": 6039} {"train_loss": -27.63435173034668, "global_step": 501307, "epoch": 6039} {"train_loss": -27.68036460876465, "global_step": 501308, "epoch": 6039} {"train_loss": -27.405893325805664, "global_step": 501309, "epoch": 6039} {"train_loss": -28.03193473815918, "global_step": 501310, "epoch": 6039} {"train_loss": -27.508499145507812, "global_step": 501311, "epoch": 6039} {"train_loss": -27.221942901611328, "global_step": 501312, "epoch": 6039} {"train_loss": -27.5671329498291, "global_step": 501313, "epoch": 6039} {"train_loss": -27.167011260986328, "global_step": 501314, "epoch": 6039} {"train_loss": -27.275659561157227, "global_step": 501315, "epoch": 6039} {"train_loss": -27.297616958618164, "global_step": 501316, "epoch": 6039} {"train_loss": -26.73579216003418, "global_step": 501317, "epoch": 6039} {"train_loss": -26.39857292175293, "global_step": 501318, "epoch": 6039} {"train_loss": -27.074166677084314, "global_step": 501319, "epoch": 6039, "val_loss": 6694011.0} {"train_loss": -26.70759391784668, "global_step": 501320, "epoch": 6040} {"train_loss": -26.794605255126953, "global_step": 501321, "epoch": 6040} {"train_loss": -26.97226905822754, "global_step": 501322, "epoch": 6040} {"train_loss": -26.192419052124023, "global_step": 501323, "epoch": 6040} {"train_loss": -26.918994903564453, "global_step": 501324, "epoch": 6040} {"train_loss": -26.4993953704834, "global_step": 501325, "epoch": 6040} {"train_loss": -26.710357666015625, "global_step": 501326, "epoch": 6040} {"train_loss": -26.969379425048828, "global_step": 501327, "epoch": 6040} {"train_loss": -25.69730567932129, "global_step": 501328, "epoch": 6040} {"train_loss": -26.407489776611328, "global_step": 501329, "epoch": 6040} {"train_loss": -26.5885066986084, "global_step": 501330, "epoch": 6040} {"train_loss": -26.868122100830078, "global_step": 501331, "epoch": 6040} {"train_loss": -26.76553726196289, "global_step": 501332, "epoch": 6040} {"train_loss": -26.935754776000977, "global_step": 501333, "epoch": 6040} {"train_loss": -26.90363883972168, "global_step": 501334, "epoch": 6040} {"train_loss": -26.879308700561523, "global_step": 501335, "epoch": 6040} {"train_loss": -26.925024032592773, "global_step": 501336, "epoch": 6040} {"train_loss": -26.87456703186035, "global_step": 501337, "epoch": 6040} {"train_loss": -26.862640380859375, "global_step": 501338, "epoch": 6040} {"train_loss": -26.803598403930664, "global_step": 501339, "epoch": 6040} {"train_loss": -27.224639892578125, "global_step": 501340, "epoch": 6040} {"train_loss": -27.238855361938477, "global_step": 501341, "epoch": 6040} {"train_loss": -27.03192138671875, "global_step": 501342, "epoch": 6040} {"train_loss": -27.07044792175293, "global_step": 501343, "epoch": 6040} {"train_loss": -27.24692726135254, "global_step": 501344, "epoch": 6040} {"train_loss": -27.32451820373535, "global_step": 501345, "epoch": 6040} {"train_loss": -27.035694122314453, "global_step": 501346, "epoch": 6040} {"train_loss": -27.091150283813477, "global_step": 501347, "epoch": 6040} {"train_loss": -27.069616317749023, "global_step": 501348, "epoch": 6040} {"train_loss": -27.125951766967773, "global_step": 501349, "epoch": 6040} {"train_loss": -27.322660446166992, "global_step": 501350, "epoch": 6040} {"train_loss": -27.2611026763916, "global_step": 501351, "epoch": 6040} {"train_loss": -27.26209831237793, "global_step": 501352, "epoch": 6040} {"train_loss": -27.3984317779541, "global_step": 501353, "epoch": 6040} {"train_loss": -27.184803009033203, "global_step": 501354, "epoch": 6040} {"train_loss": -27.61240577697754, "global_step": 501355, "epoch": 6040} {"train_loss": -27.55853271484375, "global_step": 501356, "epoch": 6040} {"train_loss": -27.061172485351562, "global_step": 501357, "epoch": 6040} {"train_loss": -27.156387329101562, "global_step": 501358, "epoch": 6040} {"train_loss": -27.10993003845215, "global_step": 501359, "epoch": 6040} {"train_loss": -27.5339298248291, "global_step": 501360, "epoch": 6040} {"train_loss": -27.517719268798828, "global_step": 501361, "epoch": 6040} {"train_loss": -27.49671745300293, "global_step": 501362, "epoch": 6040} {"train_loss": -27.27918815612793, "global_step": 501363, "epoch": 6040} {"train_loss": -27.725549697875977, "global_step": 501364, "epoch": 6040} {"train_loss": -27.531360626220703, "global_step": 501365, "epoch": 6040} {"train_loss": -27.418020248413086, "global_step": 501366, "epoch": 6040} {"train_loss": -27.460128784179688, "global_step": 501367, "epoch": 6040} {"train_loss": -27.69207191467285, "global_step": 501368, "epoch": 6040} {"train_loss": -27.475141525268555, "global_step": 501369, "epoch": 6040} {"train_loss": -27.8742733001709, "global_step": 501370, "epoch": 6040} {"train_loss": -27.578449249267578, "global_step": 501371, "epoch": 6040} {"train_loss": -28.0838565826416, "global_step": 501372, "epoch": 6040} {"train_loss": -27.611312866210938, "global_step": 501373, "epoch": 6040} {"train_loss": -27.873762130737305, "global_step": 501374, "epoch": 6040} {"train_loss": -27.544010162353516, "global_step": 501375, "epoch": 6040} {"train_loss": -27.65633201599121, "global_step": 501376, "epoch": 6040} {"train_loss": -27.259750366210938, "global_step": 501377, "epoch": 6040} {"train_loss": -27.57862663269043, "global_step": 501378, "epoch": 6040} {"train_loss": -27.50641441345215, "global_step": 501379, "epoch": 6040} {"train_loss": -27.371774673461914, "global_step": 501380, "epoch": 6040} {"train_loss": -27.414398193359375, "global_step": 501381, "epoch": 6040} {"train_loss": -27.711523056030273, "global_step": 501382, "epoch": 6040} {"train_loss": -27.57806968688965, "global_step": 501383, "epoch": 6040} {"train_loss": -27.766925811767578, "global_step": 501384, "epoch": 6040} {"train_loss": -27.587600708007812, "global_step": 501385, "epoch": 6040} {"train_loss": -27.61590576171875, "global_step": 501386, "epoch": 6040} {"train_loss": -27.560550689697266, "global_step": 501387, "epoch": 6040} {"train_loss": -27.144498825073242, "global_step": 501388, "epoch": 6040} {"train_loss": -26.368310928344727, "global_step": 501389, "epoch": 6040} {"train_loss": -25.89552879333496, "global_step": 501390, "epoch": 6040} {"train_loss": -26.24798011779785, "global_step": 501391, "epoch": 6040} {"train_loss": -27.28911781311035, "global_step": 501392, "epoch": 6040} {"train_loss": -27.1033935546875, "global_step": 501393, "epoch": 6040} {"train_loss": -26.637964248657227, "global_step": 501394, "epoch": 6040} {"train_loss": -26.74312400817871, "global_step": 501395, "epoch": 6040} {"train_loss": -27.047040939331055, "global_step": 501396, "epoch": 6040} {"train_loss": -26.455692291259766, "global_step": 501397, "epoch": 6040} {"train_loss": -27.519062042236328, "global_step": 501398, "epoch": 6040} {"train_loss": -26.73548698425293, "global_step": 501399, "epoch": 6040} {"train_loss": -27.197967529296875, "global_step": 501400, "epoch": 6040} {"train_loss": -26.89469337463379, "global_step": 501401, "epoch": 6040} {"train_loss": -27.157733089952583, "global_step": 501402, "epoch": 6040, "val_loss": 6726813.0} {"train_loss": -26.2216796875, "global_step": 501403, "epoch": 6041} {"train_loss": -26.21259117126465, "global_step": 501404, "epoch": 6041} {"train_loss": -25.81270408630371, "global_step": 501405, "epoch": 6041} {"train_loss": -26.567829132080078, "global_step": 501406, "epoch": 6041} {"train_loss": -26.332321166992188, "global_step": 501407, "epoch": 6041} {"train_loss": -26.66522789001465, "global_step": 501408, "epoch": 6041} {"train_loss": -26.49436378479004, "global_step": 501409, "epoch": 6041} {"train_loss": -26.985361099243164, "global_step": 501410, "epoch": 6041} {"train_loss": -27.068119049072266, "global_step": 501411, "epoch": 6041} {"train_loss": -26.660688400268555, "global_step": 501412, "epoch": 6041} {"train_loss": -26.85749626159668, "global_step": 501413, "epoch": 6041} {"train_loss": -26.875036239624023, "global_step": 501414, "epoch": 6041} {"train_loss": -26.97210121154785, "global_step": 501415, "epoch": 6041} {"train_loss": -26.86665153503418, "global_step": 501416, "epoch": 6041} {"train_loss": -26.998844146728516, "global_step": 501417, "epoch": 6041} {"train_loss": -27.053943634033203, "global_step": 501418, "epoch": 6041} {"train_loss": -27.144062042236328, "global_step": 501419, "epoch": 6041} {"train_loss": -27.136762619018555, "global_step": 501420, "epoch": 6041} {"train_loss": -27.074604034423828, "global_step": 501421, "epoch": 6041} {"train_loss": -26.8896427154541, "global_step": 501422, "epoch": 6041} {"train_loss": -27.130529403686523, "global_step": 501423, "epoch": 6041} {"train_loss": -27.078214645385742, "global_step": 501424, "epoch": 6041} {"train_loss": -27.34970474243164, "global_step": 501425, "epoch": 6041} {"train_loss": -27.196012496948242, "global_step": 501426, "epoch": 6041} {"train_loss": -27.184484481811523, "global_step": 501427, "epoch": 6041} {"train_loss": -26.89642906188965, "global_step": 501428, "epoch": 6041} {"train_loss": -27.020872116088867, "global_step": 501429, "epoch": 6041} {"train_loss": -27.353525161743164, "global_step": 501430, "epoch": 6041} {"train_loss": -27.510700225830078, "global_step": 501431, "epoch": 6041} {"train_loss": -26.720014572143555, "global_step": 501432, "epoch": 6041} {"train_loss": -27.123279571533203, "global_step": 501433, "epoch": 6041} {"train_loss": -27.623233795166016, "global_step": 501434, "epoch": 6041} {"train_loss": -27.3341121673584, "global_step": 501435, "epoch": 6041} {"train_loss": -27.192651748657227, "global_step": 501436, "epoch": 6041} {"train_loss": -27.3675594329834, "global_step": 501437, "epoch": 6041} {"train_loss": -27.050947189331055, "global_step": 501438, "epoch": 6041} {"train_loss": -27.3207950592041, "global_step": 501439, "epoch": 6041} {"train_loss": -27.197202682495117, "global_step": 501440, "epoch": 6041} {"train_loss": -27.3216495513916, "global_step": 501441, "epoch": 6041} {"train_loss": -27.06049919128418, "global_step": 501442, "epoch": 6041} {"train_loss": -27.37595558166504, "global_step": 501443, "epoch": 6041} {"train_loss": -27.497013092041016, "global_step": 501444, "epoch": 6041} {"train_loss": -27.2891845703125, "global_step": 501445, "epoch": 6041} {"train_loss": -27.461109161376953, "global_step": 501446, "epoch": 6041} {"train_loss": -27.322797775268555, "global_step": 501447, "epoch": 6041} {"train_loss": -27.232547760009766, "global_step": 501448, "epoch": 6041} {"train_loss": -27.464075088500977, "global_step": 501449, "epoch": 6041} {"train_loss": -27.4321346282959, "global_step": 501450, "epoch": 6041} {"train_loss": -27.5931453704834, "global_step": 501451, "epoch": 6041} {"train_loss": -27.177932739257812, "global_step": 501452, "epoch": 6041} {"train_loss": -27.695880889892578, "global_step": 501453, "epoch": 6041} {"train_loss": -27.416410446166992, "global_step": 501454, "epoch": 6041} {"train_loss": -27.303577423095703, "global_step": 501455, "epoch": 6041} {"train_loss": -27.446531295776367, "global_step": 501456, "epoch": 6041} {"train_loss": -27.451513290405273, "global_step": 501457, "epoch": 6041} {"train_loss": -27.6250057220459, "global_step": 501458, "epoch": 6041} {"train_loss": -27.497114181518555, "global_step": 501459, "epoch": 6041} {"train_loss": -27.565515518188477, "global_step": 501460, "epoch": 6041} {"train_loss": -27.568384170532227, "global_step": 501461, "epoch": 6041} {"train_loss": -27.47345542907715, "global_step": 501462, "epoch": 6041} {"train_loss": -27.4501953125, "global_step": 501463, "epoch": 6041} {"train_loss": -27.308990478515625, "global_step": 501464, "epoch": 6041} {"train_loss": -27.767927169799805, "global_step": 501465, "epoch": 6041} {"train_loss": -27.364776611328125, "global_step": 501466, "epoch": 6041} {"train_loss": -27.82745933532715, "global_step": 501467, "epoch": 6041} {"train_loss": -27.44679069519043, "global_step": 501468, "epoch": 6041} {"train_loss": -27.16438102722168, "global_step": 501469, "epoch": 6041} {"train_loss": -27.68708610534668, "global_step": 501470, "epoch": 6041} {"train_loss": -27.46552085876465, "global_step": 501471, "epoch": 6041} {"train_loss": -27.498579025268555, "global_step": 501472, "epoch": 6041} {"train_loss": -27.56141471862793, "global_step": 501473, "epoch": 6041} {"train_loss": -27.523578643798828, "global_step": 501474, "epoch": 6041} {"train_loss": -26.926599502563477, "global_step": 501475, "epoch": 6041} {"train_loss": -27.282434463500977, "global_step": 501476, "epoch": 6041} {"train_loss": -27.342578887939453, "global_step": 501477, "epoch": 6041} {"train_loss": -27.383283615112305, "global_step": 501478, "epoch": 6041} {"train_loss": -27.2890625, "global_step": 501479, "epoch": 6041} {"train_loss": -27.2375545501709, "global_step": 501480, "epoch": 6041} {"train_loss": -27.276914596557617, "global_step": 501481, "epoch": 6041} {"train_loss": -27.786029815673828, "global_step": 501482, "epoch": 6041} {"train_loss": -27.435827255249023, "global_step": 501483, "epoch": 6041} {"train_loss": -27.220733642578125, "global_step": 501484, "epoch": 6041} {"train_loss": -27.21141695689006, "global_step": 501485, "epoch": 6041, "val_loss": 6601338.0} {"train_loss": -26.844335556030273, "global_step": 501486, "epoch": 6042} {"train_loss": -26.76028823852539, "global_step": 501487, "epoch": 6042} {"train_loss": -27.116302490234375, "global_step": 501488, "epoch": 6042} {"train_loss": -27.1142578125, "global_step": 501489, "epoch": 6042} {"train_loss": -26.867263793945312, "global_step": 501490, "epoch": 6042} {"train_loss": -26.673688888549805, "global_step": 501491, "epoch": 6042} {"train_loss": -27.2499942779541, "global_step": 501492, "epoch": 6042} {"train_loss": -27.039274215698242, "global_step": 501493, "epoch": 6042} {"train_loss": -27.04437828063965, "global_step": 501494, "epoch": 6042} {"train_loss": -26.82452964782715, "global_step": 501495, "epoch": 6042} {"train_loss": -26.96713638305664, "global_step": 501496, "epoch": 6042} {"train_loss": -26.70957374572754, "global_step": 501497, "epoch": 6042} {"train_loss": -27.310810089111328, "global_step": 501498, "epoch": 6042} {"train_loss": -27.05794334411621, "global_step": 501499, "epoch": 6042} {"train_loss": -27.242462158203125, "global_step": 501500, "epoch": 6042} {"train_loss": -26.90472412109375, "global_step": 501501, "epoch": 6042} {"train_loss": -27.1497745513916, "global_step": 501502, "epoch": 6042} {"train_loss": -27.032245635986328, "global_step": 501503, "epoch": 6042} {"train_loss": -27.568531036376953, "global_step": 501504, "epoch": 6042} {"train_loss": -26.867725372314453, "global_step": 501505, "epoch": 6042} {"train_loss": -27.258264541625977, "global_step": 501506, "epoch": 6042} {"train_loss": -27.3289737701416, "global_step": 501507, "epoch": 6042} {"train_loss": -27.379850387573242, "global_step": 501508, "epoch": 6042} {"train_loss": -27.566547393798828, "global_step": 501509, "epoch": 6042} {"train_loss": -26.935094833374023, "global_step": 501510, "epoch": 6042} {"train_loss": -27.367090225219727, "global_step": 501511, "epoch": 6042} {"train_loss": -27.310205459594727, "global_step": 501512, "epoch": 6042} {"train_loss": -27.249364852905273, "global_step": 501513, "epoch": 6042} {"train_loss": -26.86030387878418, "global_step": 501514, "epoch": 6042} {"train_loss": -27.101911544799805, "global_step": 501515, "epoch": 6042} {"train_loss": -27.539752960205078, "global_step": 501516, "epoch": 6042} {"train_loss": -27.49091911315918, "global_step": 501517, "epoch": 6042} {"train_loss": -27.408483505249023, "global_step": 501518, "epoch": 6042} {"train_loss": -27.84244728088379, "global_step": 501519, "epoch": 6042} {"train_loss": -27.647958755493164, "global_step": 501520, "epoch": 6042} {"train_loss": -27.6514949798584, "global_step": 501521, "epoch": 6042} {"train_loss": -27.42792320251465, "global_step": 501522, "epoch": 6042} {"train_loss": -27.435474395751953, "global_step": 501523, "epoch": 6042} {"train_loss": -27.31427574157715, "global_step": 501524, "epoch": 6042} {"train_loss": -27.165618896484375, "global_step": 501525, "epoch": 6042} {"train_loss": -27.543872833251953, "global_step": 501526, "epoch": 6042} {"train_loss": -27.608814239501953, "global_step": 501527, "epoch": 6042} {"train_loss": -27.3354549407959, "global_step": 501528, "epoch": 6042} {"train_loss": -27.200056076049805, "global_step": 501529, "epoch": 6042} {"train_loss": -27.416955947875977, "global_step": 501530, "epoch": 6042} {"train_loss": -27.02028465270996, "global_step": 501531, "epoch": 6042} {"train_loss": -27.391986846923828, "global_step": 501532, "epoch": 6042} {"train_loss": -27.416675567626953, "global_step": 501533, "epoch": 6042} {"train_loss": -27.40375328063965, "global_step": 501534, "epoch": 6042} {"train_loss": -27.899648666381836, "global_step": 501535, "epoch": 6042} {"train_loss": -27.722293853759766, "global_step": 501536, "epoch": 6042} {"train_loss": -27.647192001342773, "global_step": 501537, "epoch": 6042} {"train_loss": -27.370975494384766, "global_step": 501538, "epoch": 6042} {"train_loss": -27.728992462158203, "global_step": 501539, "epoch": 6042} {"train_loss": -27.071643829345703, "global_step": 501540, "epoch": 6042} {"train_loss": -27.517980575561523, "global_step": 501541, "epoch": 6042} {"train_loss": -27.39923095703125, "global_step": 501542, "epoch": 6042} {"train_loss": -27.197925567626953, "global_step": 501543, "epoch": 6042} {"train_loss": -27.410364151000977, "global_step": 501544, "epoch": 6042} {"train_loss": -27.114179611206055, "global_step": 501545, "epoch": 6042} {"train_loss": -27.772796630859375, "global_step": 501546, "epoch": 6042} {"train_loss": -27.558868408203125, "global_step": 501547, "epoch": 6042} {"train_loss": -27.831851959228516, "global_step": 501548, "epoch": 6042} {"train_loss": -27.488224029541016, "global_step": 501549, "epoch": 6042} {"train_loss": -27.638071060180664, "global_step": 501550, "epoch": 6042} {"train_loss": -27.675931930541992, "global_step": 501551, "epoch": 6042} {"train_loss": -27.661413192749023, "global_step": 501552, "epoch": 6042} {"train_loss": -27.515094757080078, "global_step": 501553, "epoch": 6042} {"train_loss": -27.159442901611328, "global_step": 501554, "epoch": 6042} {"train_loss": -27.614683151245117, "global_step": 501555, "epoch": 6042} {"train_loss": -27.178369522094727, "global_step": 501556, "epoch": 6042} {"train_loss": -26.803510665893555, "global_step": 501557, "epoch": 6042} {"train_loss": -27.037771224975586, "global_step": 501558, "epoch": 6042} {"train_loss": -27.534015655517578, "global_step": 501559, "epoch": 6042} {"train_loss": -27.034393310546875, "global_step": 501560, "epoch": 6042} {"train_loss": -27.172317504882812, "global_step": 501561, "epoch": 6042} {"train_loss": -27.07773208618164, "global_step": 501562, "epoch": 6042} {"train_loss": -26.86505126953125, "global_step": 501563, "epoch": 6042} {"train_loss": -27.5546932220459, "global_step": 501564, "epoch": 6042} {"train_loss": -27.6168155670166, "global_step": 501565, "epoch": 6042} {"train_loss": -27.206928253173828, "global_step": 501566, "epoch": 6042} {"train_loss": -27.437469482421875, "global_step": 501567, "epoch": 6042} {"train_loss": -27.308840717177794, "global_step": 501568, "epoch": 6042, "val_loss": 6674252.0} {"train_loss": -26.56174087524414, "global_step": 501569, "epoch": 6043} {"train_loss": -27.137939453125, "global_step": 501570, "epoch": 6043} {"train_loss": -27.00689125061035, "global_step": 501571, "epoch": 6043} {"train_loss": -26.871753692626953, "global_step": 501572, "epoch": 6043} {"train_loss": -26.89362144470215, "global_step": 501573, "epoch": 6043} {"train_loss": -26.798547744750977, "global_step": 501574, "epoch": 6043} {"train_loss": -27.21333122253418, "global_step": 501575, "epoch": 6043} {"train_loss": -26.733112335205078, "global_step": 501576, "epoch": 6043} {"train_loss": -27.345991134643555, "global_step": 501577, "epoch": 6043} {"train_loss": -26.929014205932617, "global_step": 501578, "epoch": 6043} {"train_loss": -27.3747501373291, "global_step": 501579, "epoch": 6043} {"train_loss": -26.813385009765625, "global_step": 501580, "epoch": 6043} {"train_loss": -27.370935440063477, "global_step": 501581, "epoch": 6043} {"train_loss": -27.310583114624023, "global_step": 501582, "epoch": 6043} {"train_loss": -27.0664119720459, "global_step": 501583, "epoch": 6043} {"train_loss": -27.087387084960938, "global_step": 501584, "epoch": 6043} {"train_loss": -27.118438720703125, "global_step": 501585, "epoch": 6043} {"train_loss": -26.993030548095703, "global_step": 501586, "epoch": 6043} {"train_loss": -27.29740333557129, "global_step": 501587, "epoch": 6043} {"train_loss": -27.2228946685791, "global_step": 501588, "epoch": 6043} {"train_loss": -27.47723960876465, "global_step": 501589, "epoch": 6043} {"train_loss": -26.960468292236328, "global_step": 501590, "epoch": 6043} {"train_loss": -27.339529037475586, "global_step": 501591, "epoch": 6043} {"train_loss": -27.197092056274414, "global_step": 501592, "epoch": 6043} {"train_loss": -27.44134521484375, "global_step": 501593, "epoch": 6043} {"train_loss": -26.89484977722168, "global_step": 501594, "epoch": 6043} {"train_loss": -27.066247940063477, "global_step": 501595, "epoch": 6043} {"train_loss": -27.26358985900879, "global_step": 501596, "epoch": 6043} {"train_loss": -27.079166412353516, "global_step": 501597, "epoch": 6043} {"train_loss": -27.140869140625, "global_step": 501598, "epoch": 6043} {"train_loss": -27.075031280517578, "global_step": 501599, "epoch": 6043} {"train_loss": -27.669647216796875, "global_step": 501600, "epoch": 6043} {"train_loss": -27.21663475036621, "global_step": 501601, "epoch": 6043} {"train_loss": -27.1794490814209, "global_step": 501602, "epoch": 6043} {"train_loss": -27.410337448120117, "global_step": 501603, "epoch": 6043} {"train_loss": -27.196378707885742, "global_step": 501604, "epoch": 6043} {"train_loss": -27.23828125, "global_step": 501605, "epoch": 6043} {"train_loss": -27.227313995361328, "global_step": 501606, "epoch": 6043} {"train_loss": -27.280927658081055, "global_step": 501607, "epoch": 6043} {"train_loss": -27.931161880493164, "global_step": 501608, "epoch": 6043} {"train_loss": -27.616180419921875, "global_step": 501609, "epoch": 6043} {"train_loss": -27.470510482788086, "global_step": 501610, "epoch": 6043} {"train_loss": -27.594995498657227, "global_step": 501611, "epoch": 6043} {"train_loss": -27.099475860595703, "global_step": 501612, "epoch": 6043} {"train_loss": -27.298248291015625, "global_step": 501613, "epoch": 6043} {"train_loss": -27.4329776763916, "global_step": 501614, "epoch": 6043} {"train_loss": -27.7297420501709, "global_step": 501615, "epoch": 6043} {"train_loss": -27.49045181274414, "global_step": 501616, "epoch": 6043} {"train_loss": -27.409442901611328, "global_step": 501617, "epoch": 6043} {"train_loss": -27.342041015625, "global_step": 501618, "epoch": 6043} {"train_loss": -27.33057975769043, "global_step": 501619, "epoch": 6043} {"train_loss": -27.570295333862305, "global_step": 501620, "epoch": 6043} {"train_loss": -26.97114372253418, "global_step": 501621, "epoch": 6043} {"train_loss": -27.501279830932617, "global_step": 501622, "epoch": 6043} {"train_loss": -27.34099769592285, "global_step": 501623, "epoch": 6043} {"train_loss": -27.398462295532227, "global_step": 501624, "epoch": 6043} {"train_loss": -27.614545822143555, "global_step": 501625, "epoch": 6043} {"train_loss": -27.488611221313477, "global_step": 501626, "epoch": 6043} {"train_loss": -27.790403366088867, "global_step": 501627, "epoch": 6043} {"train_loss": -27.122516632080078, "global_step": 501628, "epoch": 6043} {"train_loss": -27.212751388549805, "global_step": 501629, "epoch": 6043} {"train_loss": -27.028324127197266, "global_step": 501630, "epoch": 6043} {"train_loss": -27.337926864624023, "global_step": 501631, "epoch": 6043} {"train_loss": -27.634082794189453, "global_step": 501632, "epoch": 6043} {"train_loss": -27.14884376525879, "global_step": 501633, "epoch": 6043} {"train_loss": -27.877399444580078, "global_step": 501634, "epoch": 6043} {"train_loss": -27.5242862701416, "global_step": 501635, "epoch": 6043} {"train_loss": -27.53004264831543, "global_step": 501636, "epoch": 6043} {"train_loss": -27.598825454711914, "global_step": 501637, "epoch": 6043} {"train_loss": -27.393213272094727, "global_step": 501638, "epoch": 6043} {"train_loss": -27.285837173461914, "global_step": 501639, "epoch": 6043} {"train_loss": -27.676807403564453, "global_step": 501640, "epoch": 6043} {"train_loss": -27.489572525024414, "global_step": 501641, "epoch": 6043} {"train_loss": -27.426589965820312, "global_step": 501642, "epoch": 6043} {"train_loss": -27.921985626220703, "global_step": 501643, "epoch": 6043} {"train_loss": -27.43157958984375, "global_step": 501644, "epoch": 6043} {"train_loss": -27.577539443969727, "global_step": 501645, "epoch": 6043} {"train_loss": -27.24932289123535, "global_step": 501646, "epoch": 6043} {"train_loss": -27.7128963470459, "global_step": 501647, "epoch": 6043} {"train_loss": -27.235319137573242, "global_step": 501648, "epoch": 6043} {"train_loss": -27.251813888549805, "global_step": 501649, "epoch": 6043} {"train_loss": -27.934545516967773, "global_step": 501650, "epoch": 6043} {"train_loss": -27.308505644281226, "global_step": 501651, "epoch": 6043, "val_loss": 6569853.0} {"train_loss": -25.974781036376953, "global_step": 501652, "epoch": 6044} {"train_loss": -26.188678741455078, "global_step": 501653, "epoch": 6044} {"train_loss": -26.973011016845703, "global_step": 501654, "epoch": 6044} {"train_loss": -26.630847930908203, "global_step": 501655, "epoch": 6044} {"train_loss": -26.704206466674805, "global_step": 501656, "epoch": 6044} {"train_loss": -27.21941566467285, "global_step": 501657, "epoch": 6044} {"train_loss": -27.087305068969727, "global_step": 501658, "epoch": 6044} {"train_loss": -26.196134567260742, "global_step": 501659, "epoch": 6044} {"train_loss": -26.5896053314209, "global_step": 501660, "epoch": 6044} {"train_loss": -26.636682510375977, "global_step": 501661, "epoch": 6044} {"train_loss": -27.295957565307617, "global_step": 501662, "epoch": 6044} {"train_loss": -26.65351676940918, "global_step": 501663, "epoch": 6044} {"train_loss": -26.48524284362793, "global_step": 501664, "epoch": 6044} {"train_loss": -27.339630126953125, "global_step": 501665, "epoch": 6044} {"train_loss": -26.6143741607666, "global_step": 501666, "epoch": 6044} {"train_loss": -27.369232177734375, "global_step": 501667, "epoch": 6044} {"train_loss": -27.213483810424805, "global_step": 501668, "epoch": 6044} {"train_loss": -26.973562240600586, "global_step": 501669, "epoch": 6044} {"train_loss": -26.928302764892578, "global_step": 501670, "epoch": 6044} {"train_loss": -27.014312744140625, "global_step": 501671, "epoch": 6044} {"train_loss": -27.626386642456055, "global_step": 501672, "epoch": 6044} {"train_loss": -26.71986961364746, "global_step": 501673, "epoch": 6044} {"train_loss": -26.934158325195312, "global_step": 501674, "epoch": 6044} {"train_loss": -27.54296875, "global_step": 501675, "epoch": 6044} {"train_loss": -26.897733688354492, "global_step": 501676, "epoch": 6044} {"train_loss": -27.330123901367188, "global_step": 501677, "epoch": 6044} {"train_loss": -26.831388473510742, "global_step": 501678, "epoch": 6044} {"train_loss": -27.211078643798828, "global_step": 501679, "epoch": 6044} {"train_loss": -26.794836044311523, "global_step": 501680, "epoch": 6044} {"train_loss": -27.18999671936035, "global_step": 501681, "epoch": 6044} {"train_loss": -26.976104736328125, "global_step": 501682, "epoch": 6044} {"train_loss": -27.305707931518555, "global_step": 501683, "epoch": 6044} {"train_loss": -27.287464141845703, "global_step": 501684, "epoch": 6044} {"train_loss": -27.239444732666016, "global_step": 501685, "epoch": 6044} {"train_loss": -27.084857940673828, "global_step": 501686, "epoch": 6044} {"train_loss": -27.18147850036621, "global_step": 501687, "epoch": 6044} {"train_loss": -26.900476455688477, "global_step": 501688, "epoch": 6044} {"train_loss": -27.23720359802246, "global_step": 501689, "epoch": 6044} {"train_loss": -27.227502822875977, "global_step": 501690, "epoch": 6044} {"train_loss": -27.478544235229492, "global_step": 501691, "epoch": 6044} {"train_loss": -27.234821319580078, "global_step": 501692, "epoch": 6044} {"train_loss": -27.09356117248535, "global_step": 501693, "epoch": 6044} {"train_loss": -27.601028442382812, "global_step": 501694, "epoch": 6044} {"train_loss": -26.924793243408203, "global_step": 501695, "epoch": 6044} {"train_loss": -27.333831787109375, "global_step": 501696, "epoch": 6044} {"train_loss": -27.518529891967773, "global_step": 501697, "epoch": 6044} {"train_loss": -27.0631103515625, "global_step": 501698, "epoch": 6044} {"train_loss": -27.377450942993164, "global_step": 501699, "epoch": 6044} {"train_loss": -27.27544593811035, "global_step": 501700, "epoch": 6044} {"train_loss": -27.428436279296875, "global_step": 501701, "epoch": 6044} {"train_loss": -27.40205192565918, "global_step": 501702, "epoch": 6044} {"train_loss": -27.288557052612305, "global_step": 501703, "epoch": 6044} {"train_loss": -26.994831085205078, "global_step": 501704, "epoch": 6044} {"train_loss": -27.316303253173828, "global_step": 501705, "epoch": 6044} {"train_loss": -27.244476318359375, "global_step": 501706, "epoch": 6044} {"train_loss": -27.002344131469727, "global_step": 501707, "epoch": 6044} {"train_loss": -27.453704833984375, "global_step": 501708, "epoch": 6044} {"train_loss": -27.2766056060791, "global_step": 501709, "epoch": 6044} {"train_loss": -27.922576904296875, "global_step": 501710, "epoch": 6044} {"train_loss": -27.577316284179688, "global_step": 501711, "epoch": 6044} {"train_loss": -27.490402221679688, "global_step": 501712, "epoch": 6044} {"train_loss": -27.444562911987305, "global_step": 501713, "epoch": 6044} {"train_loss": -27.669031143188477, "global_step": 501714, "epoch": 6044} {"train_loss": -27.744558334350586, "global_step": 501715, "epoch": 6044} {"train_loss": -27.275495529174805, "global_step": 501716, "epoch": 6044} {"train_loss": -27.56330680847168, "global_step": 501717, "epoch": 6044} {"train_loss": -27.227069854736328, "global_step": 501718, "epoch": 6044} {"train_loss": -27.6835994720459, "global_step": 501719, "epoch": 6044} {"train_loss": -27.7386417388916, "global_step": 501720, "epoch": 6044} {"train_loss": -27.538684844970703, "global_step": 501721, "epoch": 6044} {"train_loss": -27.5596866607666, "global_step": 501722, "epoch": 6044} {"train_loss": -27.56043815612793, "global_step": 501723, "epoch": 6044} {"train_loss": -27.507720947265625, "global_step": 501724, "epoch": 6044} {"train_loss": -27.494647979736328, "global_step": 501725, "epoch": 6044} {"train_loss": -27.49595069885254, "global_step": 501726, "epoch": 6044} {"train_loss": -27.79498863220215, "global_step": 501727, "epoch": 6044} {"train_loss": -27.542203903198242, "global_step": 501728, "epoch": 6044} {"train_loss": -26.886205673217773, "global_step": 501729, "epoch": 6044} {"train_loss": -26.971515655517578, "global_step": 501730, "epoch": 6044} {"train_loss": -26.605484008789062, "global_step": 501731, "epoch": 6044} {"train_loss": -26.65374755859375, "global_step": 501732, "epoch": 6044} {"train_loss": -27.526208877563477, "global_step": 501733, "epoch": 6044} {"train_loss": -27.15905446891325, "global_step": 501734, "epoch": 6044, "val_loss": 6492655.0} {"train_loss": -25.30584144592285, "global_step": 501735, "epoch": 6045} {"train_loss": -25.89630126953125, "global_step": 501736, "epoch": 6045} {"train_loss": -25.793867111206055, "global_step": 501737, "epoch": 6045} {"train_loss": -26.26801872253418, "global_step": 501738, "epoch": 6045} {"train_loss": -26.377044677734375, "global_step": 501739, "epoch": 6045} {"train_loss": -26.609350204467773, "global_step": 501740, "epoch": 6045} {"train_loss": -26.45965576171875, "global_step": 501741, "epoch": 6045} {"train_loss": -26.908313751220703, "global_step": 501742, "epoch": 6045} {"train_loss": -26.55643653869629, "global_step": 501743, "epoch": 6045} {"train_loss": -26.786191940307617, "global_step": 501744, "epoch": 6045} {"train_loss": -26.67991065979004, "global_step": 501745, "epoch": 6045} {"train_loss": -26.680099487304688, "global_step": 501746, "epoch": 6045} {"train_loss": -26.30144691467285, "global_step": 501747, "epoch": 6045} {"train_loss": -26.45330810546875, "global_step": 501748, "epoch": 6045} {"train_loss": -27.070789337158203, "global_step": 501749, "epoch": 6045} {"train_loss": -27.13232421875, "global_step": 501750, "epoch": 6045} {"train_loss": -26.939289093017578, "global_step": 501751, "epoch": 6045} {"train_loss": -26.61574363708496, "global_step": 501752, "epoch": 6045} {"train_loss": -26.6787166595459, "global_step": 501753, "epoch": 6045} {"train_loss": -27.04800796508789, "global_step": 501754, "epoch": 6045} {"train_loss": -26.758136749267578, "global_step": 501755, "epoch": 6045} {"train_loss": -27.319562911987305, "global_step": 501756, "epoch": 6045} {"train_loss": -26.904163360595703, "global_step": 501757, "epoch": 6045} {"train_loss": -27.322179794311523, "global_step": 501758, "epoch": 6045} {"train_loss": -26.711942672729492, "global_step": 501759, "epoch": 6045} {"train_loss": -27.48444175720215, "global_step": 501760, "epoch": 6045} {"train_loss": -26.876691818237305, "global_step": 501761, "epoch": 6045} {"train_loss": -26.991107940673828, "global_step": 501762, "epoch": 6045} {"train_loss": -27.344343185424805, "global_step": 501763, "epoch": 6045} {"train_loss": -27.160934448242188, "global_step": 501764, "epoch": 6045} {"train_loss": -27.03046989440918, "global_step": 501765, "epoch": 6045} {"train_loss": -27.018823623657227, "global_step": 501766, "epoch": 6045} {"train_loss": -27.061506271362305, "global_step": 501767, "epoch": 6045} {"train_loss": -26.968856811523438, "global_step": 501768, "epoch": 6045} {"train_loss": -27.561695098876953, "global_step": 501769, "epoch": 6045} {"train_loss": -27.5047607421875, "global_step": 501770, "epoch": 6045} {"train_loss": -27.302127838134766, "global_step": 501771, "epoch": 6045} {"train_loss": -26.9771728515625, "global_step": 501772, "epoch": 6045} {"train_loss": -27.440282821655273, "global_step": 501773, "epoch": 6045} {"train_loss": -27.718891143798828, "global_step": 501774, "epoch": 6045} {"train_loss": -27.34976577758789, "global_step": 501775, "epoch": 6045} {"train_loss": -27.382375717163086, "global_step": 501776, "epoch": 6045} {"train_loss": -27.503864288330078, "global_step": 501777, "epoch": 6045} {"train_loss": -27.71852684020996, "global_step": 501778, "epoch": 6045} {"train_loss": -27.476760864257812, "global_step": 501779, "epoch": 6045} {"train_loss": -27.567951202392578, "global_step": 501780, "epoch": 6045} {"train_loss": -27.813749313354492, "global_step": 501781, "epoch": 6045} {"train_loss": -27.72515296936035, "global_step": 501782, "epoch": 6045} {"train_loss": -27.453638076782227, "global_step": 501783, "epoch": 6045} {"train_loss": -27.916156768798828, "global_step": 501784, "epoch": 6045} {"train_loss": -27.699567794799805, "global_step": 501785, "epoch": 6045} {"train_loss": -27.96441650390625, "global_step": 501786, "epoch": 6045} {"train_loss": -27.8328800201416, "global_step": 501787, "epoch": 6045} {"train_loss": -27.653076171875, "global_step": 501788, "epoch": 6045} {"train_loss": -27.518753051757812, "global_step": 501789, "epoch": 6045} {"train_loss": -27.548227310180664, "global_step": 501790, "epoch": 6045} {"train_loss": -27.60431480407715, "global_step": 501791, "epoch": 6045} {"train_loss": -27.432706832885742, "global_step": 501792, "epoch": 6045} {"train_loss": -27.97625732421875, "global_step": 501793, "epoch": 6045} {"train_loss": -27.356515884399414, "global_step": 501794, "epoch": 6045} {"train_loss": -27.801916122436523, "global_step": 501795, "epoch": 6045} {"train_loss": -27.742843627929688, "global_step": 501796, "epoch": 6045} {"train_loss": -28.016895294189453, "global_step": 501797, "epoch": 6045} {"train_loss": -27.231298446655273, "global_step": 501798, "epoch": 6045} {"train_loss": -27.306262969970703, "global_step": 501799, "epoch": 6045} {"train_loss": -27.4471378326416, "global_step": 501800, "epoch": 6045} {"train_loss": -27.309064865112305, "global_step": 501801, "epoch": 6045} {"train_loss": -27.372425079345703, "global_step": 501802, "epoch": 6045} {"train_loss": -27.28352165222168, "global_step": 501803, "epoch": 6045} {"train_loss": -26.80609703063965, "global_step": 501804, "epoch": 6045} {"train_loss": -26.459096908569336, "global_step": 501805, "epoch": 6045} {"train_loss": -26.18351173400879, "global_step": 501806, "epoch": 6045} {"train_loss": -26.31241226196289, "global_step": 501807, "epoch": 6045} {"train_loss": -26.65459632873535, "global_step": 501808, "epoch": 6045} {"train_loss": -27.695356369018555, "global_step": 501809, "epoch": 6045} {"train_loss": -27.1596736907959, "global_step": 501810, "epoch": 6045} {"train_loss": -26.865921020507812, "global_step": 501811, "epoch": 6045} {"train_loss": -27.09640884399414, "global_step": 501812, "epoch": 6045} {"train_loss": -26.9044246673584, "global_step": 501813, "epoch": 6045} {"train_loss": -27.006500244140625, "global_step": 501814, "epoch": 6045} {"train_loss": -27.33698844909668, "global_step": 501815, "epoch": 6045} {"train_loss": -27.214441299438477, "global_step": 501816, "epoch": 6045} {"train_loss": -27.131844279277754, "global_step": 501817, "epoch": 6045, "val_loss": 6467213.0} {"train_loss": -26.88054847717285, "global_step": 501818, "epoch": 6046} {"train_loss": -27.272069931030273, "global_step": 501819, "epoch": 6046} {"train_loss": -26.663976669311523, "global_step": 501820, "epoch": 6046} {"train_loss": -27.04192543029785, "global_step": 501821, "epoch": 6046} {"train_loss": -26.409128189086914, "global_step": 501822, "epoch": 6046} {"train_loss": -27.17138671875, "global_step": 501823, "epoch": 6046} {"train_loss": -27.35184669494629, "global_step": 501824, "epoch": 6046} {"train_loss": -27.1157283782959, "global_step": 501825, "epoch": 6046} {"train_loss": -27.2785587310791, "global_step": 501826, "epoch": 6046} {"train_loss": -27.0953311920166, "global_step": 501827, "epoch": 6046} {"train_loss": -27.191272735595703, "global_step": 501828, "epoch": 6046} {"train_loss": -27.2927303314209, "global_step": 501829, "epoch": 6046} {"train_loss": -27.29949951171875, "global_step": 501830, "epoch": 6046} {"train_loss": -27.240467071533203, "global_step": 501831, "epoch": 6046} {"train_loss": -27.061887741088867, "global_step": 501832, "epoch": 6046} {"train_loss": -27.417346954345703, "global_step": 501833, "epoch": 6046} {"train_loss": -27.437475204467773, "global_step": 501834, "epoch": 6046} {"train_loss": -27.108606338500977, "global_step": 501835, "epoch": 6046} {"train_loss": -27.400938034057617, "global_step": 501836, "epoch": 6046} {"train_loss": -27.577594757080078, "global_step": 501837, "epoch": 6046} {"train_loss": -27.42498779296875, "global_step": 501838, "epoch": 6046} {"train_loss": -27.638824462890625, "global_step": 501839, "epoch": 6046} {"train_loss": -27.182464599609375, "global_step": 501840, "epoch": 6046} {"train_loss": -26.85431480407715, "global_step": 501841, "epoch": 6046} {"train_loss": -27.561573028564453, "global_step": 501842, "epoch": 6046} {"train_loss": -27.717041015625, "global_step": 501843, "epoch": 6046} {"train_loss": -27.543045043945312, "global_step": 501844, "epoch": 6046} {"train_loss": -27.747556686401367, "global_step": 501845, "epoch": 6046} {"train_loss": -27.25539207458496, "global_step": 501846, "epoch": 6046} {"train_loss": -27.810476303100586, "global_step": 501847, "epoch": 6046} {"train_loss": -27.64692497253418, "global_step": 501848, "epoch": 6046} {"train_loss": -27.760324478149414, "global_step": 501849, "epoch": 6046} {"train_loss": -27.267669677734375, "global_step": 501850, "epoch": 6046} {"train_loss": -27.606138229370117, "global_step": 501851, "epoch": 6046} {"train_loss": -27.336889266967773, "global_step": 501852, "epoch": 6046} {"train_loss": -27.557397842407227, "global_step": 501853, "epoch": 6046} {"train_loss": -27.259021759033203, "global_step": 501854, "epoch": 6046} {"train_loss": -27.166996002197266, "global_step": 501855, "epoch": 6046} {"train_loss": -27.57876968383789, "global_step": 501856, "epoch": 6046} {"train_loss": -27.369592666625977, "global_step": 501857, "epoch": 6046} {"train_loss": -27.502811431884766, "global_step": 501858, "epoch": 6046} {"train_loss": -27.404088973999023, "global_step": 501859, "epoch": 6046} {"train_loss": -27.190149307250977, "global_step": 501860, "epoch": 6046} {"train_loss": -27.43562126159668, "global_step": 501861, "epoch": 6046} {"train_loss": -27.17336082458496, "global_step": 501862, "epoch": 6046} {"train_loss": -27.27764892578125, "global_step": 501863, "epoch": 6046} {"train_loss": -27.364194869995117, "global_step": 501864, "epoch": 6046} {"train_loss": -27.80250358581543, "global_step": 501865, "epoch": 6046} {"train_loss": -27.04143714904785, "global_step": 501866, "epoch": 6046} {"train_loss": -27.3026065826416, "global_step": 501867, "epoch": 6046} {"train_loss": -27.146350860595703, "global_step": 501868, "epoch": 6046} {"train_loss": -27.511117935180664, "global_step": 501869, "epoch": 6046} {"train_loss": -27.36553955078125, "global_step": 501870, "epoch": 6046} {"train_loss": -27.472339630126953, "global_step": 501871, "epoch": 6046} {"train_loss": -27.036054611206055, "global_step": 501872, "epoch": 6046} {"train_loss": -26.976110458374023, "global_step": 501873, "epoch": 6046} {"train_loss": -27.338003158569336, "global_step": 501874, "epoch": 6046} {"train_loss": -27.238920211791992, "global_step": 501875, "epoch": 6046} {"train_loss": -27.34577751159668, "global_step": 501876, "epoch": 6046} {"train_loss": -27.688634872436523, "global_step": 501877, "epoch": 6046} {"train_loss": -26.777551651000977, "global_step": 501878, "epoch": 6046} {"train_loss": -26.879194259643555, "global_step": 501879, "epoch": 6046} {"train_loss": -27.70355224609375, "global_step": 501880, "epoch": 6046} {"train_loss": -27.52033042907715, "global_step": 501881, "epoch": 6046} {"train_loss": -27.197290420532227, "global_step": 501882, "epoch": 6046} {"train_loss": -27.650848388671875, "global_step": 501883, "epoch": 6046} {"train_loss": -27.2370662689209, "global_step": 501884, "epoch": 6046} {"train_loss": -26.88238525390625, "global_step": 501885, "epoch": 6046} {"train_loss": -27.40008544921875, "global_step": 501886, "epoch": 6046} {"train_loss": -27.152435302734375, "global_step": 501887, "epoch": 6046} {"train_loss": -27.066450119018555, "global_step": 501888, "epoch": 6046} {"train_loss": -27.508193969726562, "global_step": 501889, "epoch": 6046} {"train_loss": -27.228918075561523, "global_step": 501890, "epoch": 6046} {"train_loss": -27.323999404907227, "global_step": 501891, "epoch": 6046} {"train_loss": -27.839475631713867, "global_step": 501892, "epoch": 6046} {"train_loss": -27.382238388061523, "global_step": 501893, "epoch": 6046} {"train_loss": -26.9726505279541, "global_step": 501894, "epoch": 6046} {"train_loss": -27.377277374267578, "global_step": 501895, "epoch": 6046} {"train_loss": -27.188709259033203, "global_step": 501896, "epoch": 6046} {"train_loss": -27.474533081054688, "global_step": 501897, "epoch": 6046} {"train_loss": -26.945972442626953, "global_step": 501898, "epoch": 6046} {"train_loss": -27.359487533569336, "global_step": 501899, "epoch": 6046} {"train_loss": -27.29653882405844, "global_step": 501900, "epoch": 6046, "val_loss": 6487995.5} {"train_loss": -25.613983154296875, "global_step": 501901, "epoch": 6047} {"train_loss": -24.293256759643555, "global_step": 501902, "epoch": 6047} {"train_loss": -26.22202491760254, "global_step": 501903, "epoch": 6047} {"train_loss": -25.990774154663086, "global_step": 501904, "epoch": 6047} {"train_loss": -25.2137508392334, "global_step": 501905, "epoch": 6047} {"train_loss": -26.876983642578125, "global_step": 501906, "epoch": 6047} {"train_loss": -26.171552658081055, "global_step": 501907, "epoch": 6047} {"train_loss": -26.32977294921875, "global_step": 501908, "epoch": 6047} {"train_loss": -25.55348014831543, "global_step": 501909, "epoch": 6047} {"train_loss": -25.93500328063965, "global_step": 501910, "epoch": 6047} {"train_loss": -26.508848190307617, "global_step": 501911, "epoch": 6047} {"train_loss": -25.9487361907959, "global_step": 501912, "epoch": 6047} {"train_loss": -26.5782413482666, "global_step": 501913, "epoch": 6047} {"train_loss": -26.652191162109375, "global_step": 501914, "epoch": 6047} {"train_loss": -26.177371978759766, "global_step": 501915, "epoch": 6047} {"train_loss": -26.8372745513916, "global_step": 501916, "epoch": 6047} {"train_loss": -26.68596839904785, "global_step": 501917, "epoch": 6047} {"train_loss": -26.735157012939453, "global_step": 501918, "epoch": 6047} {"train_loss": -26.692899703979492, "global_step": 501919, "epoch": 6047} {"train_loss": -26.47649574279785, "global_step": 501920, "epoch": 6047} {"train_loss": -26.822509765625, "global_step": 501921, "epoch": 6047} {"train_loss": -26.842914581298828, "global_step": 501922, "epoch": 6047} {"train_loss": -26.9970645904541, "global_step": 501923, "epoch": 6047} {"train_loss": -26.5777645111084, "global_step": 501924, "epoch": 6047} {"train_loss": -26.602447509765625, "global_step": 501925, "epoch": 6047} {"train_loss": -26.6456356048584, "global_step": 501926, "epoch": 6047} {"train_loss": -26.869699478149414, "global_step": 501927, "epoch": 6047} {"train_loss": -27.07435417175293, "global_step": 501928, "epoch": 6047} {"train_loss": -27.1961669921875, "global_step": 501929, "epoch": 6047} {"train_loss": -27.06941795349121, "global_step": 501930, "epoch": 6047} {"train_loss": -27.049787521362305, "global_step": 501931, "epoch": 6047} {"train_loss": -27.239938735961914, "global_step": 501932, "epoch": 6047} {"train_loss": -27.177709579467773, "global_step": 501933, "epoch": 6047} {"train_loss": -27.311904907226562, "global_step": 501934, "epoch": 6047} {"train_loss": -27.431970596313477, "global_step": 501935, "epoch": 6047} {"train_loss": -27.365997314453125, "global_step": 501936, "epoch": 6047} {"train_loss": -27.209936141967773, "global_step": 501937, "epoch": 6047} {"train_loss": -27.197315216064453, "global_step": 501938, "epoch": 6047} {"train_loss": -27.23602867126465, "global_step": 501939, "epoch": 6047} {"train_loss": -27.30572509765625, "global_step": 501940, "epoch": 6047} {"train_loss": -27.3002872467041, "global_step": 501941, "epoch": 6047} {"train_loss": -27.658100128173828, "global_step": 501942, "epoch": 6047} {"train_loss": -27.614795684814453, "global_step": 501943, "epoch": 6047} {"train_loss": -27.607202529907227, "global_step": 501944, "epoch": 6047} {"train_loss": -27.135278701782227, "global_step": 501945, "epoch": 6047} {"train_loss": -27.524585723876953, "global_step": 501946, "epoch": 6047} {"train_loss": -27.43593406677246, "global_step": 501947, "epoch": 6047} {"train_loss": -27.3443546295166, "global_step": 501948, "epoch": 6047} {"train_loss": -27.407367706298828, "global_step": 501949, "epoch": 6047} {"train_loss": -27.854650497436523, "global_step": 501950, "epoch": 6047} {"train_loss": -27.5320987701416, "global_step": 501951, "epoch": 6047} {"train_loss": -27.30291748046875, "global_step": 501952, "epoch": 6047} {"train_loss": -27.534381866455078, "global_step": 501953, "epoch": 6047} {"train_loss": -27.363035202026367, "global_step": 501954, "epoch": 6047} {"train_loss": -27.602048873901367, "global_step": 501955, "epoch": 6047} {"train_loss": -27.513198852539062, "global_step": 501956, "epoch": 6047} {"train_loss": -27.617883682250977, "global_step": 501957, "epoch": 6047} {"train_loss": -27.786163330078125, "global_step": 501958, "epoch": 6047} {"train_loss": -27.431427001953125, "global_step": 501959, "epoch": 6047} {"train_loss": -27.365629196166992, "global_step": 501960, "epoch": 6047} {"train_loss": -27.510778427124023, "global_step": 501961, "epoch": 6047} {"train_loss": -27.2319278717041, "global_step": 501962, "epoch": 6047} {"train_loss": -27.51972007751465, "global_step": 501963, "epoch": 6047} {"train_loss": -27.145750045776367, "global_step": 501964, "epoch": 6047} {"train_loss": -27.304624557495117, "global_step": 501965, "epoch": 6047} {"train_loss": -27.638486862182617, "global_step": 501966, "epoch": 6047} {"train_loss": -27.270299911499023, "global_step": 501967, "epoch": 6047} {"train_loss": -27.684431076049805, "global_step": 501968, "epoch": 6047} {"train_loss": -27.871484756469727, "global_step": 501969, "epoch": 6047} {"train_loss": -27.704792022705078, "global_step": 501970, "epoch": 6047} {"train_loss": -27.0423583984375, "global_step": 501971, "epoch": 6047} {"train_loss": -27.153064727783203, "global_step": 501972, "epoch": 6047} {"train_loss": -27.56476402282715, "global_step": 501973, "epoch": 6047} {"train_loss": -27.14600944519043, "global_step": 501974, "epoch": 6047} {"train_loss": -27.307111740112305, "global_step": 501975, "epoch": 6047} {"train_loss": -27.05238151550293, "global_step": 501976, "epoch": 6047} {"train_loss": -26.663726806640625, "global_step": 501977, "epoch": 6047} {"train_loss": -26.9277400970459, "global_step": 501978, "epoch": 6047} {"train_loss": -27.192392349243164, "global_step": 501979, "epoch": 6047} {"train_loss": -27.614852905273438, "global_step": 501980, "epoch": 6047} {"train_loss": -27.455127716064453, "global_step": 501981, "epoch": 6047} {"train_loss": -27.0604190826416, "global_step": 501982, "epoch": 6047} {"train_loss": -27.017839615603528, "global_step": 501983, "epoch": 6047, "val_loss": 6500874.5} {"train_loss": -26.16205406188965, "global_step": 501984, "epoch": 6048} {"train_loss": -26.3470401763916, "global_step": 501985, "epoch": 6048} {"train_loss": -26.919504165649414, "global_step": 501986, "epoch": 6048} {"train_loss": -26.913755416870117, "global_step": 501987, "epoch": 6048} {"train_loss": -26.4427490234375, "global_step": 501988, "epoch": 6048} {"train_loss": -27.2437686920166, "global_step": 501989, "epoch": 6048} {"train_loss": -26.65903663635254, "global_step": 501990, "epoch": 6048} {"train_loss": -27.072004318237305, "global_step": 501991, "epoch": 6048} {"train_loss": -26.90754508972168, "global_step": 501992, "epoch": 6048} {"train_loss": -26.950769424438477, "global_step": 501993, "epoch": 6048} {"train_loss": -26.832834243774414, "global_step": 501994, "epoch": 6048} {"train_loss": -26.90165138244629, "global_step": 501995, "epoch": 6048} {"train_loss": -26.86272621154785, "global_step": 501996, "epoch": 6048} {"train_loss": -27.214435577392578, "global_step": 501997, "epoch": 6048} {"train_loss": -26.91153335571289, "global_step": 501998, "epoch": 6048} {"train_loss": -27.04811668395996, "global_step": 501999, "epoch": 6048} {"train_loss": -26.94605827331543, "global_step": 502000, "epoch": 6048} {"train_loss": -26.9857120513916, "global_step": 502001, "epoch": 6048} {"train_loss": -27.055240631103516, "global_step": 502002, "epoch": 6048} {"train_loss": -26.97286033630371, "global_step": 502003, "epoch": 6048} {"train_loss": -26.921680450439453, "global_step": 502004, "epoch": 6048} {"train_loss": -26.991809844970703, "global_step": 502005, "epoch": 6048} {"train_loss": -27.08049964904785, "global_step": 502006, "epoch": 6048} {"train_loss": -26.982328414916992, "global_step": 502007, "epoch": 6048} {"train_loss": -27.213781356811523, "global_step": 502008, "epoch": 6048} {"train_loss": -27.22943687438965, "global_step": 502009, "epoch": 6048} {"train_loss": -27.303442001342773, "global_step": 502010, "epoch": 6048} {"train_loss": -26.829877853393555, "global_step": 502011, "epoch": 6048} {"train_loss": -27.296308517456055, "global_step": 502012, "epoch": 6048} {"train_loss": -27.44597816467285, "global_step": 502013, "epoch": 6048} {"train_loss": -27.129987716674805, "global_step": 502014, "epoch": 6048} {"train_loss": -27.51553726196289, "global_step": 502015, "epoch": 6048} {"train_loss": -27.0004825592041, "global_step": 502016, "epoch": 6048} {"train_loss": -27.62628746032715, "global_step": 502017, "epoch": 6048} {"train_loss": -27.430383682250977, "global_step": 502018, "epoch": 6048} {"train_loss": -27.24268913269043, "global_step": 502019, "epoch": 6048} {"train_loss": -27.083953857421875, "global_step": 502020, "epoch": 6048} {"train_loss": -27.58856201171875, "global_step": 502021, "epoch": 6048} {"train_loss": -27.256986618041992, "global_step": 502022, "epoch": 6048} {"train_loss": -27.48238182067871, "global_step": 502023, "epoch": 6048} {"train_loss": -27.291461944580078, "global_step": 502024, "epoch": 6048} {"train_loss": -27.476476669311523, "global_step": 502025, "epoch": 6048} {"train_loss": -27.267480850219727, "global_step": 502026, "epoch": 6048} {"train_loss": -27.410114288330078, "global_step": 502027, "epoch": 6048} {"train_loss": -27.560285568237305, "global_step": 502028, "epoch": 6048} {"train_loss": -27.6912899017334, "global_step": 502029, "epoch": 6048} {"train_loss": -27.387359619140625, "global_step": 502030, "epoch": 6048} {"train_loss": -27.52007484436035, "global_step": 502031, "epoch": 6048} {"train_loss": -27.586069107055664, "global_step": 502032, "epoch": 6048} {"train_loss": -27.641199111938477, "global_step": 502033, "epoch": 6048} {"train_loss": -27.432233810424805, "global_step": 502034, "epoch": 6048} {"train_loss": -27.488983154296875, "global_step": 502035, "epoch": 6048} {"train_loss": -27.53980827331543, "global_step": 502036, "epoch": 6048} {"train_loss": -27.564401626586914, "global_step": 502037, "epoch": 6048} {"train_loss": -27.50092124938965, "global_step": 502038, "epoch": 6048} {"train_loss": -27.483930587768555, "global_step": 502039, "epoch": 6048} {"train_loss": -27.397724151611328, "global_step": 502040, "epoch": 6048} {"train_loss": -27.499343872070312, "global_step": 502041, "epoch": 6048} {"train_loss": -27.569141387939453, "global_step": 502042, "epoch": 6048} {"train_loss": -27.617660522460938, "global_step": 502043, "epoch": 6048} {"train_loss": -27.387659072875977, "global_step": 502044, "epoch": 6048} {"train_loss": -26.991058349609375, "global_step": 502045, "epoch": 6048} {"train_loss": -27.30031394958496, "global_step": 502046, "epoch": 6048} {"train_loss": -27.0541934967041, "global_step": 502047, "epoch": 6048} {"train_loss": -26.762296676635742, "global_step": 502048, "epoch": 6048} {"train_loss": -26.82996940612793, "global_step": 502049, "epoch": 6048} {"train_loss": -26.206562042236328, "global_step": 502050, "epoch": 6048} {"train_loss": -26.255292892456055, "global_step": 502051, "epoch": 6048} {"train_loss": -27.18115234375, "global_step": 502052, "epoch": 6048} {"train_loss": -26.872791290283203, "global_step": 502053, "epoch": 6048} {"train_loss": -27.46034812927246, "global_step": 502054, "epoch": 6048} {"train_loss": -26.933622360229492, "global_step": 502055, "epoch": 6048} {"train_loss": -27.354761123657227, "global_step": 502056, "epoch": 6048} {"train_loss": -27.201658248901367, "global_step": 502057, "epoch": 6048} {"train_loss": -27.568439483642578, "global_step": 502058, "epoch": 6048} {"train_loss": -27.166528701782227, "global_step": 502059, "epoch": 6048} {"train_loss": -27.57752799987793, "global_step": 502060, "epoch": 6048} {"train_loss": -27.40781593322754, "global_step": 502061, "epoch": 6048} {"train_loss": -27.504358291625977, "global_step": 502062, "epoch": 6048} {"train_loss": -27.522979736328125, "global_step": 502063, "epoch": 6048} {"train_loss": -27.372329711914062, "global_step": 502064, "epoch": 6048} {"train_loss": -27.3215389251709, "global_step": 502065, "epoch": 6048} {"train_loss": -27.19285011291504, "global_step": 502066, "epoch": 6048, "val_loss": 6532902.0} {"train_loss": -27.086694717407227, "global_step": 502067, "epoch": 6049} {"train_loss": -27.219640731811523, "global_step": 502068, "epoch": 6049} {"train_loss": -27.10739517211914, "global_step": 502069, "epoch": 6049} {"train_loss": -27.570331573486328, "global_step": 502070, "epoch": 6049} {"train_loss": -26.832212448120117, "global_step": 502071, "epoch": 6049} {"train_loss": -27.49323844909668, "global_step": 502072, "epoch": 6049} {"train_loss": -26.9534854888916, "global_step": 502073, "epoch": 6049} {"train_loss": -27.160247802734375, "global_step": 502074, "epoch": 6049} {"train_loss": -26.959247589111328, "global_step": 502075, "epoch": 6049} {"train_loss": -26.865253448486328, "global_step": 502076, "epoch": 6049} {"train_loss": -26.81011962890625, "global_step": 502077, "epoch": 6049} {"train_loss": -26.6490421295166, "global_step": 502078, "epoch": 6049} {"train_loss": -26.899656295776367, "global_step": 502079, "epoch": 6049} {"train_loss": -26.53451919555664, "global_step": 502080, "epoch": 6049} {"train_loss": -26.5152530670166, "global_step": 502081, "epoch": 6049} {"train_loss": -27.35675621032715, "global_step": 502082, "epoch": 6049} {"train_loss": -26.936279296875, "global_step": 502083, "epoch": 6049} {"train_loss": -27.171985626220703, "global_step": 502084, "epoch": 6049} {"train_loss": -26.984994888305664, "global_step": 502085, "epoch": 6049} {"train_loss": -26.88003921508789, "global_step": 502086, "epoch": 6049} {"train_loss": -27.13031578063965, "global_step": 502087, "epoch": 6049} {"train_loss": -27.315902709960938, "global_step": 502088, "epoch": 6049} {"train_loss": -27.193500518798828, "global_step": 502089, "epoch": 6049} {"train_loss": -27.28955078125, "global_step": 502090, "epoch": 6049} {"train_loss": -27.161527633666992, "global_step": 502091, "epoch": 6049} {"train_loss": -27.19105339050293, "global_step": 502092, "epoch": 6049} {"train_loss": -27.540634155273438, "global_step": 502093, "epoch": 6049} {"train_loss": -27.079120635986328, "global_step": 502094, "epoch": 6049} {"train_loss": -27.5483341217041, "global_step": 502095, "epoch": 6049} {"train_loss": -27.441640853881836, "global_step": 502096, "epoch": 6049} {"train_loss": -27.6429500579834, "global_step": 502097, "epoch": 6049} {"train_loss": -27.652685165405273, "global_step": 502098, "epoch": 6049} {"train_loss": -27.613195419311523, "global_step": 502099, "epoch": 6049} {"train_loss": -27.170034408569336, "global_step": 502100, "epoch": 6049} {"train_loss": -27.634048461914062, "global_step": 502101, "epoch": 6049} {"train_loss": -27.610214233398438, "global_step": 502102, "epoch": 6049} {"train_loss": -27.556528091430664, "global_step": 502103, "epoch": 6049} {"train_loss": -27.502954483032227, "global_step": 502104, "epoch": 6049} {"train_loss": -27.305988311767578, "global_step": 502105, "epoch": 6049} {"train_loss": -27.73102378845215, "global_step": 502106, "epoch": 6049} {"train_loss": -27.69917106628418, "global_step": 502107, "epoch": 6049} {"train_loss": -27.3214054107666, "global_step": 502108, "epoch": 6049} {"train_loss": -27.497467041015625, "global_step": 502109, "epoch": 6049} {"train_loss": -28.00800895690918, "global_step": 502110, "epoch": 6049} {"train_loss": -27.354419708251953, "global_step": 502111, "epoch": 6049} {"train_loss": -27.570688247680664, "global_step": 502112, "epoch": 6049} {"train_loss": -27.371389389038086, "global_step": 502113, "epoch": 6049} {"train_loss": -27.547550201416016, "global_step": 502114, "epoch": 6049} {"train_loss": -27.665231704711914, "global_step": 502115, "epoch": 6049} {"train_loss": -27.628271102905273, "global_step": 502116, "epoch": 6049} {"train_loss": -27.70423698425293, "global_step": 502117, "epoch": 6049} {"train_loss": -27.813650131225586, "global_step": 502118, "epoch": 6049} {"train_loss": -27.547895431518555, "global_step": 502119, "epoch": 6049} {"train_loss": -27.445648193359375, "global_step": 502120, "epoch": 6049} {"train_loss": -27.87617301940918, "global_step": 502121, "epoch": 6049} {"train_loss": -27.504776000976562, "global_step": 502122, "epoch": 6049} {"train_loss": -27.752485275268555, "global_step": 502123, "epoch": 6049} {"train_loss": -27.600385665893555, "global_step": 502124, "epoch": 6049} {"train_loss": -27.27524185180664, "global_step": 502125, "epoch": 6049} {"train_loss": -27.338504791259766, "global_step": 502126, "epoch": 6049} {"train_loss": -27.06393814086914, "global_step": 502127, "epoch": 6049} {"train_loss": -27.378305435180664, "global_step": 502128, "epoch": 6049} {"train_loss": -27.473051071166992, "global_step": 502129, "epoch": 6049} {"train_loss": -27.125492095947266, "global_step": 502130, "epoch": 6049} {"train_loss": -27.49228858947754, "global_step": 502131, "epoch": 6049} {"train_loss": -27.645063400268555, "global_step": 502132, "epoch": 6049} {"train_loss": -27.433584213256836, "global_step": 502133, "epoch": 6049} {"train_loss": -27.299545288085938, "global_step": 502134, "epoch": 6049} {"train_loss": -27.203460693359375, "global_step": 502135, "epoch": 6049} {"train_loss": -27.335311889648438, "global_step": 502136, "epoch": 6049} {"train_loss": -27.24967384338379, "global_step": 502137, "epoch": 6049} {"train_loss": -27.34381675720215, "global_step": 502138, "epoch": 6049} {"train_loss": -27.59002685546875, "global_step": 502139, "epoch": 6049} {"train_loss": -27.430810928344727, "global_step": 502140, "epoch": 6049} {"train_loss": -27.442773818969727, "global_step": 502141, "epoch": 6049} {"train_loss": -27.5515193939209, "global_step": 502142, "epoch": 6049} {"train_loss": -27.58200454711914, "global_step": 502143, "epoch": 6049} {"train_loss": -27.5402774810791, "global_step": 502144, "epoch": 6049} {"train_loss": -27.56353759765625, "global_step": 502145, "epoch": 6049} {"train_loss": -27.654254913330078, "global_step": 502146, "epoch": 6049} {"train_loss": -27.407873153686523, "global_step": 502147, "epoch": 6049} {"train_loss": -27.26594352722168, "global_step": 502148, "epoch": 6049} {"train_loss": -27.353429219808923, "global_step": 502149, "epoch": 6049, "val_loss": 6507693.0} {"train_loss": -26.69573974609375, "global_step": 502150, "epoch": 6050} {"train_loss": -26.599145889282227, "global_step": 502151, "epoch": 6050} {"train_loss": -26.558897018432617, "global_step": 502152, "epoch": 6050} {"train_loss": -26.827011108398438, "global_step": 502153, "epoch": 6050} {"train_loss": -26.652429580688477, "global_step": 502154, "epoch": 6050} {"train_loss": -26.68122673034668, "global_step": 502155, "epoch": 6050} {"train_loss": -26.62164878845215, "global_step": 502156, "epoch": 6050} {"train_loss": -26.806982040405273, "global_step": 502157, "epoch": 6050} {"train_loss": -26.81072425842285, "global_step": 502158, "epoch": 6050} {"train_loss": -26.671142578125, "global_step": 502159, "epoch": 6050} {"train_loss": -27.044025421142578, "global_step": 502160, "epoch": 6050} {"train_loss": -27.250219345092773, "global_step": 502161, "epoch": 6050} {"train_loss": -26.47303581237793, "global_step": 502162, "epoch": 6050} {"train_loss": -26.634265899658203, "global_step": 502163, "epoch": 6050} {"train_loss": -27.0655460357666, "global_step": 502164, "epoch": 6050} {"train_loss": -26.92115592956543, "global_step": 502165, "epoch": 6050} {"train_loss": -26.863962173461914, "global_step": 502166, "epoch": 6050} {"train_loss": -26.805377960205078, "global_step": 502167, "epoch": 6050} {"train_loss": -27.19495964050293, "global_step": 502168, "epoch": 6050} {"train_loss": -27.1968936920166, "global_step": 502169, "epoch": 6050} {"train_loss": -27.078125, "global_step": 502170, "epoch": 6050} {"train_loss": -27.35527992248535, "global_step": 502171, "epoch": 6050} {"train_loss": -27.082807540893555, "global_step": 502172, "epoch": 6050} {"train_loss": -27.09779930114746, "global_step": 502173, "epoch": 6050} {"train_loss": -27.065359115600586, "global_step": 502174, "epoch": 6050} {"train_loss": -27.1339168548584, "global_step": 502175, "epoch": 6050} {"train_loss": -27.488574981689453, "global_step": 502176, "epoch": 6050} {"train_loss": -27.28008460998535, "global_step": 502177, "epoch": 6050} {"train_loss": -27.477949142456055, "global_step": 502178, "epoch": 6050} {"train_loss": -27.175979614257812, "global_step": 502179, "epoch": 6050} {"train_loss": -27.327722549438477, "global_step": 502180, "epoch": 6050} {"train_loss": -27.265302658081055, "global_step": 502181, "epoch": 6050} {"train_loss": -26.89794921875, "global_step": 502182, "epoch": 6050} {"train_loss": -27.599328994750977, "global_step": 502183, "epoch": 6050} {"train_loss": -27.225183486938477, "global_step": 502184, "epoch": 6050} {"train_loss": -27.432912826538086, "global_step": 502185, "epoch": 6050} {"train_loss": -27.609851837158203, "global_step": 502186, "epoch": 6050} {"train_loss": -26.969507217407227, "global_step": 502187, "epoch": 6050} {"train_loss": -27.45074462890625, "global_step": 502188, "epoch": 6050} {"train_loss": -26.94724464416504, "global_step": 502189, "epoch": 6050} {"train_loss": -27.225278854370117, "global_step": 502190, "epoch": 6050} {"train_loss": -27.521142959594727, "global_step": 502191, "epoch": 6050} {"train_loss": -27.345779418945312, "global_step": 502192, "epoch": 6050} {"train_loss": -27.442861557006836, "global_step": 502193, "epoch": 6050} {"train_loss": -27.4411563873291, "global_step": 502194, "epoch": 6050} {"train_loss": -27.531219482421875, "global_step": 502195, "epoch": 6050} {"train_loss": -27.42462730407715, "global_step": 502196, "epoch": 6050} {"train_loss": -27.5624942779541, "global_step": 502197, "epoch": 6050} {"train_loss": -27.5767822265625, "global_step": 502198, "epoch": 6050} {"train_loss": -27.565265655517578, "global_step": 502199, "epoch": 6050} {"train_loss": -27.66851806640625, "global_step": 502200, "epoch": 6050} {"train_loss": -27.6851806640625, "global_step": 502201, "epoch": 6050} {"train_loss": -27.534534454345703, "global_step": 502202, "epoch": 6050} {"train_loss": -27.755279541015625, "global_step": 502203, "epoch": 6050} {"train_loss": -26.952707290649414, "global_step": 502204, "epoch": 6050} {"train_loss": -27.59636878967285, "global_step": 502205, "epoch": 6050} {"train_loss": -26.665884017944336, "global_step": 502206, "epoch": 6050} {"train_loss": -27.36882972717285, "global_step": 502207, "epoch": 6050} {"train_loss": -27.518558502197266, "global_step": 502208, "epoch": 6050} {"train_loss": -27.394495010375977, "global_step": 502209, "epoch": 6050} {"train_loss": -26.583280563354492, "global_step": 502210, "epoch": 6050} {"train_loss": -27.086212158203125, "global_step": 502211, "epoch": 6050} {"train_loss": -27.171283721923828, "global_step": 502212, "epoch": 6050} {"train_loss": -27.22553825378418, "global_step": 502213, "epoch": 6050} {"train_loss": -26.460351943969727, "global_step": 502214, "epoch": 6050} {"train_loss": -26.608551025390625, "global_step": 502215, "epoch": 6050} {"train_loss": -26.994495391845703, "global_step": 502216, "epoch": 6050} {"train_loss": -26.548486709594727, "global_step": 502217, "epoch": 6050} {"train_loss": -27.18075942993164, "global_step": 502218, "epoch": 6050} {"train_loss": -27.536457061767578, "global_step": 502219, "epoch": 6050} {"train_loss": -27.218677520751953, "global_step": 502220, "epoch": 6050} {"train_loss": -27.609222412109375, "global_step": 502221, "epoch": 6050} {"train_loss": -27.111791610717773, "global_step": 502222, "epoch": 6050} {"train_loss": -27.249616622924805, "global_step": 502223, "epoch": 6050} {"train_loss": -27.443439483642578, "global_step": 502224, "epoch": 6050} {"train_loss": -27.653980255126953, "global_step": 502225, "epoch": 6050} {"train_loss": -27.367523193359375, "global_step": 502226, "epoch": 6050} {"train_loss": -27.462039947509766, "global_step": 502227, "epoch": 6050} {"train_loss": -27.524534225463867, "global_step": 502228, "epoch": 6050} {"train_loss": -27.214706420898438, "global_step": 502229, "epoch": 6050} {"train_loss": -27.315702438354492, "global_step": 502230, "epoch": 6050} {"train_loss": -27.301898956298828, "global_step": 502231, "epoch": 6050} {"train_loss": -27.178560762520295, "global_step": 502232, "epoch": 6050, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6567432.5} {"train_loss": -27.554479598999023, "global_step": 502233, "epoch": 6051} {"train_loss": -27.225784301757812, "global_step": 502234, "epoch": 6051} {"train_loss": -27.19281005859375, "global_step": 502235, "epoch": 6051} {"train_loss": -26.970172882080078, "global_step": 502236, "epoch": 6051} {"train_loss": -27.128162384033203, "global_step": 502237, "epoch": 6051} {"train_loss": -26.97307777404785, "global_step": 502238, "epoch": 6051} {"train_loss": -27.22775650024414, "global_step": 502239, "epoch": 6051} {"train_loss": -27.210041046142578, "global_step": 502240, "epoch": 6051} {"train_loss": -27.4066219329834, "global_step": 502241, "epoch": 6051} {"train_loss": -27.2593994140625, "global_step": 502242, "epoch": 6051} {"train_loss": -27.20770835876465, "global_step": 502243, "epoch": 6051} {"train_loss": -27.006439208984375, "global_step": 502244, "epoch": 6051} {"train_loss": -27.068878173828125, "global_step": 502245, "epoch": 6051} {"train_loss": -27.057065963745117, "global_step": 502246, "epoch": 6051} {"train_loss": -27.167638778686523, "global_step": 502247, "epoch": 6051} {"train_loss": -27.540821075439453, "global_step": 502248, "epoch": 6051} {"train_loss": -27.09968376159668, "global_step": 502249, "epoch": 6051} {"train_loss": -27.01140785217285, "global_step": 502250, "epoch": 6051} {"train_loss": -26.93878746032715, "global_step": 502251, "epoch": 6051} {"train_loss": -27.057783126831055, "global_step": 502252, "epoch": 6051} {"train_loss": -27.338098526000977, "global_step": 502253, "epoch": 6051} {"train_loss": -26.9134578704834, "global_step": 502254, "epoch": 6051} {"train_loss": -27.379806518554688, "global_step": 502255, "epoch": 6051} {"train_loss": -27.626617431640625, "global_step": 502256, "epoch": 6051} {"train_loss": -27.19711685180664, "global_step": 502257, "epoch": 6051} {"train_loss": -27.13860511779785, "global_step": 502258, "epoch": 6051} {"train_loss": -27.488515853881836, "global_step": 502259, "epoch": 6051} {"train_loss": -27.58257484436035, "global_step": 502260, "epoch": 6051} {"train_loss": -27.34445571899414, "global_step": 502261, "epoch": 6051} {"train_loss": -27.71427345275879, "global_step": 502262, "epoch": 6051} {"train_loss": -27.424076080322266, "global_step": 502263, "epoch": 6051} {"train_loss": -27.18343162536621, "global_step": 502264, "epoch": 6051} {"train_loss": -27.467920303344727, "global_step": 502265, "epoch": 6051} {"train_loss": -26.95464515686035, "global_step": 502266, "epoch": 6051} {"train_loss": -27.403675079345703, "global_step": 502267, "epoch": 6051} {"train_loss": -27.596572875976562, "global_step": 502268, "epoch": 6051} {"train_loss": -27.6740665435791, "global_step": 502269, "epoch": 6051} {"train_loss": -27.319807052612305, "global_step": 502270, "epoch": 6051} {"train_loss": -27.638280868530273, "global_step": 502271, "epoch": 6051} {"train_loss": -27.4912166595459, "global_step": 502272, "epoch": 6051} {"train_loss": -27.47832679748535, "global_step": 502273, "epoch": 6051} {"train_loss": -27.46504020690918, "global_step": 502274, "epoch": 6051} {"train_loss": -27.253189086914062, "global_step": 502275, "epoch": 6051} {"train_loss": -27.401844024658203, "global_step": 502276, "epoch": 6051} {"train_loss": -27.50382423400879, "global_step": 502277, "epoch": 6051} {"train_loss": -27.557275772094727, "global_step": 502278, "epoch": 6051} {"train_loss": -27.6031436920166, "global_step": 502279, "epoch": 6051} {"train_loss": -27.238492965698242, "global_step": 502280, "epoch": 6051} {"train_loss": -26.91182518005371, "global_step": 502281, "epoch": 6051} {"train_loss": -27.168777465820312, "global_step": 502282, "epoch": 6051} {"train_loss": -27.383569717407227, "global_step": 502283, "epoch": 6051} {"train_loss": -27.918516159057617, "global_step": 502284, "epoch": 6051} {"train_loss": -27.1997127532959, "global_step": 502285, "epoch": 6051} {"train_loss": -27.750329971313477, "global_step": 502286, "epoch": 6051} {"train_loss": -27.504852294921875, "global_step": 502287, "epoch": 6051} {"train_loss": -27.611921310424805, "global_step": 502288, "epoch": 6051} {"train_loss": -27.48662757873535, "global_step": 502289, "epoch": 6051} {"train_loss": -27.5188045501709, "global_step": 502290, "epoch": 6051} {"train_loss": -27.385892868041992, "global_step": 502291, "epoch": 6051} {"train_loss": -27.0546817779541, "global_step": 502292, "epoch": 6051} {"train_loss": -27.483266830444336, "global_step": 502293, "epoch": 6051} {"train_loss": -27.677398681640625, "global_step": 502294, "epoch": 6051} {"train_loss": -27.21612548828125, "global_step": 502295, "epoch": 6051} {"train_loss": -27.366703033447266, "global_step": 502296, "epoch": 6051} {"train_loss": -27.619461059570312, "global_step": 502297, "epoch": 6051} {"train_loss": -27.803571701049805, "global_step": 502298, "epoch": 6051} {"train_loss": -27.436725616455078, "global_step": 502299, "epoch": 6051} {"train_loss": -27.142745971679688, "global_step": 502300, "epoch": 6051} {"train_loss": -27.377328872680664, "global_step": 502301, "epoch": 6051} {"train_loss": -27.287946701049805, "global_step": 502302, "epoch": 6051} {"train_loss": -27.19707679748535, "global_step": 502303, "epoch": 6051} {"train_loss": -27.576562881469727, "global_step": 502304, "epoch": 6051} {"train_loss": -27.353845596313477, "global_step": 502305, "epoch": 6051} {"train_loss": -27.372180938720703, "global_step": 502306, "epoch": 6051} {"train_loss": -27.048450469970703, "global_step": 502307, "epoch": 6051} {"train_loss": -27.5398006439209, "global_step": 502308, "epoch": 6051} {"train_loss": -27.584827423095703, "global_step": 502309, "epoch": 6051} {"train_loss": -27.268930435180664, "global_step": 502310, "epoch": 6051} {"train_loss": -27.333417892456055, "global_step": 502311, "epoch": 6051} {"train_loss": -27.28955078125, "global_step": 502312, "epoch": 6051} {"train_loss": -27.18829345703125, "global_step": 502313, "epoch": 6051} {"train_loss": -27.10865592956543, "global_step": 502314, "epoch": 6051} {"train_loss": -27.33575731300446, "global_step": 502315, "epoch": 6051, "val_loss": 6636161.0} {"train_loss": -26.085193634033203, "global_step": 502316, "epoch": 6052} {"train_loss": -26.506778717041016, "global_step": 502317, "epoch": 6052} {"train_loss": -26.603302001953125, "global_step": 502318, "epoch": 6052} {"train_loss": -26.58332633972168, "global_step": 502319, "epoch": 6052} {"train_loss": -26.442075729370117, "global_step": 502320, "epoch": 6052} {"train_loss": -26.658111572265625, "global_step": 502321, "epoch": 6052} {"train_loss": -26.922321319580078, "global_step": 502322, "epoch": 6052} {"train_loss": -26.19685173034668, "global_step": 502323, "epoch": 6052} {"train_loss": -27.02533531188965, "global_step": 502324, "epoch": 6052} {"train_loss": -26.809417724609375, "global_step": 502325, "epoch": 6052} {"train_loss": -27.131610870361328, "global_step": 502326, "epoch": 6052} {"train_loss": -27.01471519470215, "global_step": 502327, "epoch": 6052} {"train_loss": -26.753768920898438, "global_step": 502328, "epoch": 6052} {"train_loss": -26.96195411682129, "global_step": 502329, "epoch": 6052} {"train_loss": -26.920873641967773, "global_step": 502330, "epoch": 6052} {"train_loss": -27.011560440063477, "global_step": 502331, "epoch": 6052} {"train_loss": -26.980987548828125, "global_step": 502332, "epoch": 6052} {"train_loss": -26.879117965698242, "global_step": 502333, "epoch": 6052} {"train_loss": -26.959692001342773, "global_step": 502334, "epoch": 6052} {"train_loss": -27.00745964050293, "global_step": 502335, "epoch": 6052} {"train_loss": -27.278888702392578, "global_step": 502336, "epoch": 6052} {"train_loss": -27.494571685791016, "global_step": 502337, "epoch": 6052} {"train_loss": -27.047107696533203, "global_step": 502338, "epoch": 6052} {"train_loss": -27.196338653564453, "global_step": 502339, "epoch": 6052} {"train_loss": -27.23052406311035, "global_step": 502340, "epoch": 6052} {"train_loss": -27.025501251220703, "global_step": 502341, "epoch": 6052} {"train_loss": -27.148740768432617, "global_step": 502342, "epoch": 6052} {"train_loss": -27.322132110595703, "global_step": 502343, "epoch": 6052} {"train_loss": -27.40093994140625, "global_step": 502344, "epoch": 6052} {"train_loss": -27.3625431060791, "global_step": 502345, "epoch": 6052} {"train_loss": -27.46124267578125, "global_step": 502346, "epoch": 6052} {"train_loss": -27.095956802368164, "global_step": 502347, "epoch": 6052} {"train_loss": -27.156713485717773, "global_step": 502348, "epoch": 6052} {"train_loss": -27.25898551940918, "global_step": 502349, "epoch": 6052} {"train_loss": -27.53090476989746, "global_step": 502350, "epoch": 6052} {"train_loss": -27.419036865234375, "global_step": 502351, "epoch": 6052} {"train_loss": -27.635761260986328, "global_step": 502352, "epoch": 6052} {"train_loss": -27.39328384399414, "global_step": 502353, "epoch": 6052} {"train_loss": -27.131818771362305, "global_step": 502354, "epoch": 6052} {"train_loss": -27.826801300048828, "global_step": 502355, "epoch": 6052} {"train_loss": -27.47205924987793, "global_step": 502356, "epoch": 6052} {"train_loss": -26.754735946655273, "global_step": 502357, "epoch": 6052} {"train_loss": -27.42189598083496, "global_step": 502358, "epoch": 6052} {"train_loss": -27.503625869750977, "global_step": 502359, "epoch": 6052} {"train_loss": -27.129180908203125, "global_step": 502360, "epoch": 6052} {"train_loss": -27.003515243530273, "global_step": 502361, "epoch": 6052} {"train_loss": -26.806791305541992, "global_step": 502362, "epoch": 6052} {"train_loss": -27.364532470703125, "global_step": 502363, "epoch": 6052} {"train_loss": -27.429279327392578, "global_step": 502364, "epoch": 6052} {"train_loss": -27.529882431030273, "global_step": 502365, "epoch": 6052} {"train_loss": -27.589685440063477, "global_step": 502366, "epoch": 6052} {"train_loss": -27.356597900390625, "global_step": 502367, "epoch": 6052} {"train_loss": -26.95985984802246, "global_step": 502368, "epoch": 6052} {"train_loss": -27.64130973815918, "global_step": 502369, "epoch": 6052} {"train_loss": -27.418121337890625, "global_step": 502370, "epoch": 6052} {"train_loss": -27.652414321899414, "global_step": 502371, "epoch": 6052} {"train_loss": -26.691120147705078, "global_step": 502372, "epoch": 6052} {"train_loss": -26.550771713256836, "global_step": 502373, "epoch": 6052} {"train_loss": -26.695066452026367, "global_step": 502374, "epoch": 6052} {"train_loss": -26.8748722076416, "global_step": 502375, "epoch": 6052} {"train_loss": -27.42106056213379, "global_step": 502376, "epoch": 6052} {"train_loss": -27.17108154296875, "global_step": 502377, "epoch": 6052} {"train_loss": -27.428485870361328, "global_step": 502378, "epoch": 6052} {"train_loss": -26.708826065063477, "global_step": 502379, "epoch": 6052} {"train_loss": -26.800729751586914, "global_step": 502380, "epoch": 6052} {"train_loss": -27.406274795532227, "global_step": 502381, "epoch": 6052} {"train_loss": -27.395633697509766, "global_step": 502382, "epoch": 6052} {"train_loss": -27.034326553344727, "global_step": 502383, "epoch": 6052} {"train_loss": -26.911529541015625, "global_step": 502384, "epoch": 6052} {"train_loss": -27.260787963867188, "global_step": 502385, "epoch": 6052} {"train_loss": -27.616056442260742, "global_step": 502386, "epoch": 6052} {"train_loss": -27.135854721069336, "global_step": 502387, "epoch": 6052} {"train_loss": -27.262683868408203, "global_step": 502388, "epoch": 6052} {"train_loss": -27.28717041015625, "global_step": 502389, "epoch": 6052} {"train_loss": -27.014942169189453, "global_step": 502390, "epoch": 6052} {"train_loss": -27.12214469909668, "global_step": 502391, "epoch": 6052} {"train_loss": -27.252485275268555, "global_step": 502392, "epoch": 6052} {"train_loss": -27.621109008789062, "global_step": 502393, "epoch": 6052} {"train_loss": -27.57490348815918, "global_step": 502394, "epoch": 6052} {"train_loss": -27.5490665435791, "global_step": 502395, "epoch": 6052} {"train_loss": -27.524932861328125, "global_step": 502396, "epoch": 6052} {"train_loss": -27.576745986938477, "global_step": 502397, "epoch": 6052} {"train_loss": -27.148539485701594, "global_step": 502398, "epoch": 6052, "val_loss": 6536831.0} {"train_loss": -27.39204978942871, "global_step": 502399, "epoch": 6053} {"train_loss": -26.890609741210938, "global_step": 502400, "epoch": 6053} {"train_loss": -27.442428588867188, "global_step": 502401, "epoch": 6053} {"train_loss": -26.886743545532227, "global_step": 502402, "epoch": 6053} {"train_loss": -26.946670532226562, "global_step": 502403, "epoch": 6053} {"train_loss": -27.068140029907227, "global_step": 502404, "epoch": 6053} {"train_loss": -26.8905029296875, "global_step": 502405, "epoch": 6053} {"train_loss": -26.953855514526367, "global_step": 502406, "epoch": 6053} {"train_loss": -26.997879028320312, "global_step": 502407, "epoch": 6053} {"train_loss": -26.995046615600586, "global_step": 502408, "epoch": 6053} {"train_loss": -27.358020782470703, "global_step": 502409, "epoch": 6053} {"train_loss": -26.996200561523438, "global_step": 502410, "epoch": 6053} {"train_loss": -27.064289093017578, "global_step": 502411, "epoch": 6053} {"train_loss": -27.043720245361328, "global_step": 502412, "epoch": 6053} {"train_loss": -27.170822143554688, "global_step": 502413, "epoch": 6053} {"train_loss": -27.398725509643555, "global_step": 502414, "epoch": 6053} {"train_loss": -27.31117057800293, "global_step": 502415, "epoch": 6053} {"train_loss": -27.289825439453125, "global_step": 502416, "epoch": 6053} {"train_loss": -27.030704498291016, "global_step": 502417, "epoch": 6053} {"train_loss": -27.24432373046875, "global_step": 502418, "epoch": 6053} {"train_loss": -26.983869552612305, "global_step": 502419, "epoch": 6053} {"train_loss": -27.305191040039062, "global_step": 502420, "epoch": 6053} {"train_loss": -27.420917510986328, "global_step": 502421, "epoch": 6053} {"train_loss": -27.562835693359375, "global_step": 502422, "epoch": 6053} {"train_loss": -27.52935791015625, "global_step": 502423, "epoch": 6053} {"train_loss": -27.47852897644043, "global_step": 502424, "epoch": 6053} {"train_loss": -27.938867568969727, "global_step": 502425, "epoch": 6053} {"train_loss": -27.34417152404785, "global_step": 502426, "epoch": 6053} {"train_loss": -27.433141708374023, "global_step": 502427, "epoch": 6053} {"train_loss": -27.548725128173828, "global_step": 502428, "epoch": 6053} {"train_loss": -27.63160514831543, "global_step": 502429, "epoch": 6053} {"train_loss": -27.165267944335938, "global_step": 502430, "epoch": 6053} {"train_loss": -27.3093204498291, "global_step": 502431, "epoch": 6053} {"train_loss": -27.302030563354492, "global_step": 502432, "epoch": 6053} {"train_loss": -27.186767578125, "global_step": 502433, "epoch": 6053} {"train_loss": -27.623926162719727, "global_step": 502434, "epoch": 6053} {"train_loss": -27.91669273376465, "global_step": 502435, "epoch": 6053} {"train_loss": -27.52179527282715, "global_step": 502436, "epoch": 6053} {"train_loss": -27.192386627197266, "global_step": 502437, "epoch": 6053} {"train_loss": -27.395238876342773, "global_step": 502438, "epoch": 6053} {"train_loss": -27.861745834350586, "global_step": 502439, "epoch": 6053} {"train_loss": -27.56841468811035, "global_step": 502440, "epoch": 6053} {"train_loss": -27.65250015258789, "global_step": 502441, "epoch": 6053} {"train_loss": -27.30464744567871, "global_step": 502442, "epoch": 6053} {"train_loss": -27.419004440307617, "global_step": 502443, "epoch": 6053} {"train_loss": -27.774213790893555, "global_step": 502444, "epoch": 6053} {"train_loss": -27.36639976501465, "global_step": 502445, "epoch": 6053} {"train_loss": -27.3664608001709, "global_step": 502446, "epoch": 6053} {"train_loss": -27.431726455688477, "global_step": 502447, "epoch": 6053} {"train_loss": -27.644851684570312, "global_step": 502448, "epoch": 6053} {"train_loss": -27.014684677124023, "global_step": 502449, "epoch": 6053} {"train_loss": -27.407880783081055, "global_step": 502450, "epoch": 6053} {"train_loss": -27.15134048461914, "global_step": 502451, "epoch": 6053} {"train_loss": -26.0426025390625, "global_step": 502452, "epoch": 6053} {"train_loss": -26.557886123657227, "global_step": 502453, "epoch": 6053} {"train_loss": -26.961149215698242, "global_step": 502454, "epoch": 6053} {"train_loss": -26.930389404296875, "global_step": 502455, "epoch": 6053} {"train_loss": -27.391193389892578, "global_step": 502456, "epoch": 6053} {"train_loss": -27.206384658813477, "global_step": 502457, "epoch": 6053} {"train_loss": -27.187124252319336, "global_step": 502458, "epoch": 6053} {"train_loss": -27.114850997924805, "global_step": 502459, "epoch": 6053} {"train_loss": -27.32867431640625, "global_step": 502460, "epoch": 6053} {"train_loss": -27.54743766784668, "global_step": 502461, "epoch": 6053} {"train_loss": -27.880517959594727, "global_step": 502462, "epoch": 6053} {"train_loss": -27.335500717163086, "global_step": 502463, "epoch": 6053} {"train_loss": -27.608617782592773, "global_step": 502464, "epoch": 6053} {"train_loss": -27.302021026611328, "global_step": 502465, "epoch": 6053} {"train_loss": -27.4569091796875, "global_step": 502466, "epoch": 6053} {"train_loss": -27.181381225585938, "global_step": 502467, "epoch": 6053} {"train_loss": -27.47245216369629, "global_step": 502468, "epoch": 6053} {"train_loss": -27.314435958862305, "global_step": 502469, "epoch": 6053} {"train_loss": -27.389074325561523, "global_step": 502470, "epoch": 6053} {"train_loss": -27.76722526550293, "global_step": 502471, "epoch": 6053} {"train_loss": -27.334619522094727, "global_step": 502472, "epoch": 6053} {"train_loss": -27.73847007751465, "global_step": 502473, "epoch": 6053} {"train_loss": -27.360666275024414, "global_step": 502474, "epoch": 6053} {"train_loss": -27.650924682617188, "global_step": 502475, "epoch": 6053} {"train_loss": -27.409860610961914, "global_step": 502476, "epoch": 6053} {"train_loss": -27.57842445373535, "global_step": 502477, "epoch": 6053} {"train_loss": -27.715778350830078, "global_step": 502478, "epoch": 6053} {"train_loss": -27.55841636657715, "global_step": 502479, "epoch": 6053} {"train_loss": -27.205469131469727, "global_step": 502480, "epoch": 6053} {"train_loss": -27.32833166007536, "global_step": 502481, "epoch": 6053, "val_loss": 6537910.5} {"train_loss": -26.9289608001709, "global_step": 502482, "epoch": 6054} {"train_loss": -26.644575119018555, "global_step": 502483, "epoch": 6054} {"train_loss": -26.486881256103516, "global_step": 502484, "epoch": 6054} {"train_loss": -27.2115535736084, "global_step": 502485, "epoch": 6054} {"train_loss": -26.716840744018555, "global_step": 502486, "epoch": 6054} {"train_loss": -26.444616317749023, "global_step": 502487, "epoch": 6054} {"train_loss": -26.546401977539062, "global_step": 502488, "epoch": 6054} {"train_loss": -27.52012062072754, "global_step": 502489, "epoch": 6054} {"train_loss": -27.029516220092773, "global_step": 502490, "epoch": 6054} {"train_loss": -27.261798858642578, "global_step": 502491, "epoch": 6054} {"train_loss": -26.717493057250977, "global_step": 502492, "epoch": 6054} {"train_loss": -27.14246940612793, "global_step": 502493, "epoch": 6054} {"train_loss": -27.41867446899414, "global_step": 502494, "epoch": 6054} {"train_loss": -27.17937660217285, "global_step": 502495, "epoch": 6054} {"train_loss": -27.306686401367188, "global_step": 502496, "epoch": 6054} {"train_loss": -26.872739791870117, "global_step": 502497, "epoch": 6054} {"train_loss": -27.453994750976562, "global_step": 502498, "epoch": 6054} {"train_loss": -27.324003219604492, "global_step": 502499, "epoch": 6054} {"train_loss": -27.06636619567871, "global_step": 502500, "epoch": 6054} {"train_loss": -27.225244522094727, "global_step": 502501, "epoch": 6054} {"train_loss": -27.05230712890625, "global_step": 502502, "epoch": 6054} {"train_loss": -27.370223999023438, "global_step": 502503, "epoch": 6054} {"train_loss": -27.2635440826416, "global_step": 502504, "epoch": 6054} {"train_loss": -27.48184585571289, "global_step": 502505, "epoch": 6054} {"train_loss": -27.365619659423828, "global_step": 502506, "epoch": 6054} {"train_loss": -27.68024253845215, "global_step": 502507, "epoch": 6054} {"train_loss": -27.548059463500977, "global_step": 502508, "epoch": 6054} {"train_loss": -27.4249210357666, "global_step": 502509, "epoch": 6054} {"train_loss": -27.3190860748291, "global_step": 502510, "epoch": 6054} {"train_loss": -27.31490135192871, "global_step": 502511, "epoch": 6054} {"train_loss": -27.54096794128418, "global_step": 502512, "epoch": 6054} {"train_loss": -27.77638053894043, "global_step": 502513, "epoch": 6054} {"train_loss": -27.31214714050293, "global_step": 502514, "epoch": 6054} {"train_loss": -27.344892501831055, "global_step": 502515, "epoch": 6054} {"train_loss": -27.645471572875977, "global_step": 502516, "epoch": 6054} {"train_loss": -27.68833351135254, "global_step": 502517, "epoch": 6054} {"train_loss": -27.5255184173584, "global_step": 502518, "epoch": 6054} {"train_loss": -28.032093048095703, "global_step": 502519, "epoch": 6054} {"train_loss": -27.38685417175293, "global_step": 502520, "epoch": 6054} {"train_loss": -27.8489933013916, "global_step": 502521, "epoch": 6054} {"train_loss": -27.773223876953125, "global_step": 502522, "epoch": 6054} {"train_loss": -27.671964645385742, "global_step": 502523, "epoch": 6054} {"train_loss": -27.709857940673828, "global_step": 502524, "epoch": 6054} {"train_loss": -27.330076217651367, "global_step": 502525, "epoch": 6054} {"train_loss": -27.273651123046875, "global_step": 502526, "epoch": 6054} {"train_loss": -27.823591232299805, "global_step": 502527, "epoch": 6054} {"train_loss": -27.38970947265625, "global_step": 502528, "epoch": 6054} {"train_loss": -27.704389572143555, "global_step": 502529, "epoch": 6054} {"train_loss": -27.06776237487793, "global_step": 502530, "epoch": 6054} {"train_loss": -27.17453384399414, "global_step": 502531, "epoch": 6054} {"train_loss": -26.736371994018555, "global_step": 502532, "epoch": 6054} {"train_loss": -25.766620635986328, "global_step": 502533, "epoch": 6054} {"train_loss": -26.01837158203125, "global_step": 502534, "epoch": 6054} {"train_loss": -27.02935791015625, "global_step": 502535, "epoch": 6054} {"train_loss": -27.21010398864746, "global_step": 502536, "epoch": 6054} {"train_loss": -26.9894962310791, "global_step": 502537, "epoch": 6054} {"train_loss": -27.334882736206055, "global_step": 502538, "epoch": 6054} {"train_loss": -27.671533584594727, "global_step": 502539, "epoch": 6054} {"train_loss": -27.29034423828125, "global_step": 502540, "epoch": 6054} {"train_loss": -27.01902198791504, "global_step": 502541, "epoch": 6054} {"train_loss": -27.02768898010254, "global_step": 502542, "epoch": 6054} {"train_loss": -27.092060089111328, "global_step": 502543, "epoch": 6054} {"train_loss": -27.342145919799805, "global_step": 502544, "epoch": 6054} {"train_loss": -27.127227783203125, "global_step": 502545, "epoch": 6054} {"train_loss": -26.90024185180664, "global_step": 502546, "epoch": 6054} {"train_loss": -27.193130493164062, "global_step": 502547, "epoch": 6054} {"train_loss": -27.183115005493164, "global_step": 502548, "epoch": 6054} {"train_loss": -27.016759872436523, "global_step": 502549, "epoch": 6054} {"train_loss": -27.176151275634766, "global_step": 502550, "epoch": 6054} {"train_loss": -27.149890899658203, "global_step": 502551, "epoch": 6054} {"train_loss": -27.26544761657715, "global_step": 502552, "epoch": 6054} {"train_loss": -27.149169921875, "global_step": 502553, "epoch": 6054} {"train_loss": -27.371023178100586, "global_step": 502554, "epoch": 6054} {"train_loss": -27.150863647460938, "global_step": 502555, "epoch": 6054} {"train_loss": -27.066181182861328, "global_step": 502556, "epoch": 6054} {"train_loss": -27.297775268554688, "global_step": 502557, "epoch": 6054} {"train_loss": -27.129077911376953, "global_step": 502558, "epoch": 6054} {"train_loss": -27.46146011352539, "global_step": 502559, "epoch": 6054} {"train_loss": -27.060338973999023, "global_step": 502560, "epoch": 6054} {"train_loss": -27.4836368560791, "global_step": 502561, "epoch": 6054} {"train_loss": -27.199872970581055, "global_step": 502562, "epoch": 6054} {"train_loss": -26.96630859375, "global_step": 502563, "epoch": 6054} {"train_loss": -27.221242674862047, "global_step": 502564, "epoch": 6054, "val_loss": 6548940.5} {"train_loss": -27.09067153930664, "global_step": 502565, "epoch": 6055} {"train_loss": -27.250015258789062, "global_step": 502566, "epoch": 6055} {"train_loss": -26.994897842407227, "global_step": 502567, "epoch": 6055} {"train_loss": -27.061655044555664, "global_step": 502568, "epoch": 6055} {"train_loss": -27.197004318237305, "global_step": 502569, "epoch": 6055} {"train_loss": -27.010543823242188, "global_step": 502570, "epoch": 6055} {"train_loss": -27.208206176757812, "global_step": 502571, "epoch": 6055} {"train_loss": -27.04996109008789, "global_step": 502572, "epoch": 6055} {"train_loss": -27.28116798400879, "global_step": 502573, "epoch": 6055} {"train_loss": -27.289487838745117, "global_step": 502574, "epoch": 6055} {"train_loss": -27.266061782836914, "global_step": 502575, "epoch": 6055} {"train_loss": -27.431970596313477, "global_step": 502576, "epoch": 6055} {"train_loss": -27.404592514038086, "global_step": 502577, "epoch": 6055} {"train_loss": -27.567899703979492, "global_step": 502578, "epoch": 6055} {"train_loss": -27.482908248901367, "global_step": 502579, "epoch": 6055} {"train_loss": -27.123693466186523, "global_step": 502580, "epoch": 6055} {"train_loss": -27.474384307861328, "global_step": 502581, "epoch": 6055} {"train_loss": -27.354236602783203, "global_step": 502582, "epoch": 6055} {"train_loss": -27.559680938720703, "global_step": 502583, "epoch": 6055} {"train_loss": -27.474225997924805, "global_step": 502584, "epoch": 6055} {"train_loss": -27.229902267456055, "global_step": 502585, "epoch": 6055} {"train_loss": -27.41287612915039, "global_step": 502586, "epoch": 6055} {"train_loss": -27.51470947265625, "global_step": 502587, "epoch": 6055} {"train_loss": -27.581098556518555, "global_step": 502588, "epoch": 6055} {"train_loss": -27.5853328704834, "global_step": 502589, "epoch": 6055} {"train_loss": -27.680917739868164, "global_step": 502590, "epoch": 6055} {"train_loss": -27.392990112304688, "global_step": 502591, "epoch": 6055} {"train_loss": -27.66737174987793, "global_step": 502592, "epoch": 6055} {"train_loss": -27.668079376220703, "global_step": 502593, "epoch": 6055} {"train_loss": -27.3214111328125, "global_step": 502594, "epoch": 6055} {"train_loss": -27.535566329956055, "global_step": 502595, "epoch": 6055} {"train_loss": -27.452621459960938, "global_step": 502596, "epoch": 6055} {"train_loss": -27.52511978149414, "global_step": 502597, "epoch": 6055} {"train_loss": -27.51106071472168, "global_step": 502598, "epoch": 6055} {"train_loss": -27.426481246948242, "global_step": 502599, "epoch": 6055} {"train_loss": -27.60232925415039, "global_step": 502600, "epoch": 6055} {"train_loss": -27.49427604675293, "global_step": 502601, "epoch": 6055} {"train_loss": -27.47047233581543, "global_step": 502602, "epoch": 6055} {"train_loss": -27.468549728393555, "global_step": 502603, "epoch": 6055} {"train_loss": -27.204654693603516, "global_step": 502604, "epoch": 6055} {"train_loss": -27.33833122253418, "global_step": 502605, "epoch": 6055} {"train_loss": -27.621484756469727, "global_step": 502606, "epoch": 6055} {"train_loss": -27.67110252380371, "global_step": 502607, "epoch": 6055} {"train_loss": -27.618289947509766, "global_step": 502608, "epoch": 6055} {"train_loss": -27.594100952148438, "global_step": 502609, "epoch": 6055} {"train_loss": -27.752811431884766, "global_step": 502610, "epoch": 6055} {"train_loss": -27.433252334594727, "global_step": 502611, "epoch": 6055} {"train_loss": -27.561094284057617, "global_step": 502612, "epoch": 6055} {"train_loss": -27.638046264648438, "global_step": 502613, "epoch": 6055} {"train_loss": -27.86952018737793, "global_step": 502614, "epoch": 6055} {"train_loss": -27.292572021484375, "global_step": 502615, "epoch": 6055} {"train_loss": -27.691701889038086, "global_step": 502616, "epoch": 6055} {"train_loss": -27.893213272094727, "global_step": 502617, "epoch": 6055} {"train_loss": -27.433218002319336, "global_step": 502618, "epoch": 6055} {"train_loss": -27.060688018798828, "global_step": 502619, "epoch": 6055} {"train_loss": -27.4431209564209, "global_step": 502620, "epoch": 6055} {"train_loss": -27.663354873657227, "global_step": 502621, "epoch": 6055} {"train_loss": -27.49513053894043, "global_step": 502622, "epoch": 6055} {"train_loss": -27.4471378326416, "global_step": 502623, "epoch": 6055} {"train_loss": -27.528085708618164, "global_step": 502624, "epoch": 6055} {"train_loss": -27.3176212310791, "global_step": 502625, "epoch": 6055} {"train_loss": -27.456796646118164, "global_step": 502626, "epoch": 6055} {"train_loss": -26.98677635192871, "global_step": 502627, "epoch": 6055} {"train_loss": -26.51569938659668, "global_step": 502628, "epoch": 6055} {"train_loss": -26.273786544799805, "global_step": 502629, "epoch": 6055} {"train_loss": -26.67799186706543, "global_step": 502630, "epoch": 6055} {"train_loss": -26.762121200561523, "global_step": 502631, "epoch": 6055} {"train_loss": -27.610065460205078, "global_step": 502632, "epoch": 6055} {"train_loss": -27.176528930664062, "global_step": 502633, "epoch": 6055} {"train_loss": -27.066797256469727, "global_step": 502634, "epoch": 6055} {"train_loss": -27.489917755126953, "global_step": 502635, "epoch": 6055} {"train_loss": -27.36359214782715, "global_step": 502636, "epoch": 6055} {"train_loss": -26.901166915893555, "global_step": 502637, "epoch": 6055} {"train_loss": -27.171689987182617, "global_step": 502638, "epoch": 6055} {"train_loss": -27.042917251586914, "global_step": 502639, "epoch": 6055} {"train_loss": -27.2747859954834, "global_step": 502640, "epoch": 6055} {"train_loss": -27.400617599487305, "global_step": 502641, "epoch": 6055} {"train_loss": -27.261762619018555, "global_step": 502642, "epoch": 6055} {"train_loss": -26.9538516998291, "global_step": 502643, "epoch": 6055} {"train_loss": -27.2330265045166, "global_step": 502644, "epoch": 6055} {"train_loss": -27.11945152282715, "global_step": 502645, "epoch": 6055} {"train_loss": -27.38661766052246, "global_step": 502646, "epoch": 6055} {"train_loss": -27.341981520135718, "global_step": 502647, "epoch": 6055, "val_loss": 6635692.0} {"train_loss": -27.12771987915039, "global_step": 502648, "epoch": 6056} {"train_loss": -27.1528377532959, "global_step": 502649, "epoch": 6056} {"train_loss": -27.0316162109375, "global_step": 502650, "epoch": 6056} {"train_loss": -27.15000343322754, "global_step": 502651, "epoch": 6056} {"train_loss": -27.036325454711914, "global_step": 502652, "epoch": 6056} {"train_loss": -27.3617000579834, "global_step": 502653, "epoch": 6056} {"train_loss": -27.17952537536621, "global_step": 502654, "epoch": 6056} {"train_loss": -26.905563354492188, "global_step": 502655, "epoch": 6056} {"train_loss": -27.30183982849121, "global_step": 502656, "epoch": 6056} {"train_loss": -27.155517578125, "global_step": 502657, "epoch": 6056} {"train_loss": -27.33785057067871, "global_step": 502658, "epoch": 6056} {"train_loss": -27.526845932006836, "global_step": 502659, "epoch": 6056} {"train_loss": -27.464252471923828, "global_step": 502660, "epoch": 6056} {"train_loss": -26.908227920532227, "global_step": 502661, "epoch": 6056} {"train_loss": -27.107070922851562, "global_step": 502662, "epoch": 6056} {"train_loss": -27.374860763549805, "global_step": 502663, "epoch": 6056} {"train_loss": -27.61103630065918, "global_step": 502664, "epoch": 6056} {"train_loss": -27.351062774658203, "global_step": 502665, "epoch": 6056} {"train_loss": -27.569360733032227, "global_step": 502666, "epoch": 6056} {"train_loss": -27.58247184753418, "global_step": 502667, "epoch": 6056} {"train_loss": -27.718225479125977, "global_step": 502668, "epoch": 6056} {"train_loss": -27.713953018188477, "global_step": 502669, "epoch": 6056} {"train_loss": -27.372251510620117, "global_step": 502670, "epoch": 6056} {"train_loss": -27.445846557617188, "global_step": 502671, "epoch": 6056} {"train_loss": -27.47259521484375, "global_step": 502672, "epoch": 6056} {"train_loss": -27.441068649291992, "global_step": 502673, "epoch": 6056} {"train_loss": -27.73304557800293, "global_step": 502674, "epoch": 6056} {"train_loss": -27.620676040649414, "global_step": 502675, "epoch": 6056} {"train_loss": -27.616199493408203, "global_step": 502676, "epoch": 6056} {"train_loss": -27.46100425720215, "global_step": 502677, "epoch": 6056} {"train_loss": -26.959430694580078, "global_step": 502678, "epoch": 6056} {"train_loss": -27.340253829956055, "global_step": 502679, "epoch": 6056} {"train_loss": -27.257080078125, "global_step": 502680, "epoch": 6056} {"train_loss": -27.45271110534668, "global_step": 502681, "epoch": 6056} {"train_loss": -27.657623291015625, "global_step": 502682, "epoch": 6056} {"train_loss": -27.602521896362305, "global_step": 502683, "epoch": 6056} {"train_loss": -27.697509765625, "global_step": 502684, "epoch": 6056} {"train_loss": -27.635034561157227, "global_step": 502685, "epoch": 6056} {"train_loss": -27.7053279876709, "global_step": 502686, "epoch": 6056} {"train_loss": -27.050512313842773, "global_step": 502687, "epoch": 6056} {"train_loss": -27.543806076049805, "global_step": 502688, "epoch": 6056} {"train_loss": -27.16974449157715, "global_step": 502689, "epoch": 6056} {"train_loss": -27.614105224609375, "global_step": 502690, "epoch": 6056} {"train_loss": -27.3432674407959, "global_step": 502691, "epoch": 6056} {"train_loss": -27.43037223815918, "global_step": 502692, "epoch": 6056} {"train_loss": -27.560550689697266, "global_step": 502693, "epoch": 6056} {"train_loss": -27.353315353393555, "global_step": 502694, "epoch": 6056} {"train_loss": -27.2808780670166, "global_step": 502695, "epoch": 6056} {"train_loss": -27.34458351135254, "global_step": 502696, "epoch": 6056} {"train_loss": -27.177377700805664, "global_step": 502697, "epoch": 6056} {"train_loss": -27.23929786682129, "global_step": 502698, "epoch": 6056} {"train_loss": -27.047521591186523, "global_step": 502699, "epoch": 6056} {"train_loss": -27.5303897857666, "global_step": 502700, "epoch": 6056} {"train_loss": -27.17178726196289, "global_step": 502701, "epoch": 6056} {"train_loss": -27.1490478515625, "global_step": 502702, "epoch": 6056} {"train_loss": -27.522998809814453, "global_step": 502703, "epoch": 6056} {"train_loss": -27.536346435546875, "global_step": 502704, "epoch": 6056} {"train_loss": -27.394311904907227, "global_step": 502705, "epoch": 6056} {"train_loss": -27.26352310180664, "global_step": 502706, "epoch": 6056} {"train_loss": -27.550806045532227, "global_step": 502707, "epoch": 6056} {"train_loss": -27.467267990112305, "global_step": 502708, "epoch": 6056} {"train_loss": -27.62835693359375, "global_step": 502709, "epoch": 6056} {"train_loss": -27.659198760986328, "global_step": 502710, "epoch": 6056} {"train_loss": -27.50201988220215, "global_step": 502711, "epoch": 6056} {"train_loss": -27.447134017944336, "global_step": 502712, "epoch": 6056} {"train_loss": -27.334186553955078, "global_step": 502713, "epoch": 6056} {"train_loss": -27.642108917236328, "global_step": 502714, "epoch": 6056} {"train_loss": -27.2220401763916, "global_step": 502715, "epoch": 6056} {"train_loss": -27.50420570373535, "global_step": 502716, "epoch": 6056} {"train_loss": -27.528940200805664, "global_step": 502717, "epoch": 6056} {"train_loss": -27.1951904296875, "global_step": 502718, "epoch": 6056} {"train_loss": -26.964263916015625, "global_step": 502719, "epoch": 6056} {"train_loss": -26.017358779907227, "global_step": 502720, "epoch": 6056} {"train_loss": -25.75537109375, "global_step": 502721, "epoch": 6056} {"train_loss": -26.613489151000977, "global_step": 502722, "epoch": 6056} {"train_loss": -26.999481201171875, "global_step": 502723, "epoch": 6056} {"train_loss": -26.447927474975586, "global_step": 502724, "epoch": 6056} {"train_loss": -27.257232666015625, "global_step": 502725, "epoch": 6056} {"train_loss": -26.973697662353516, "global_step": 502726, "epoch": 6056} {"train_loss": -26.914249420166016, "global_step": 502727, "epoch": 6056} {"train_loss": -26.735876083374023, "global_step": 502728, "epoch": 6056} {"train_loss": -27.00025749206543, "global_step": 502729, "epoch": 6056} {"train_loss": -27.2863379788686, "global_step": 502730, "epoch": 6056, "val_loss": 6641762.0} {"train_loss": -26.80927848815918, "global_step": 502731, "epoch": 6057} {"train_loss": -26.498762130737305, "global_step": 502732, "epoch": 6057} {"train_loss": -26.869577407836914, "global_step": 502733, "epoch": 6057} {"train_loss": -26.37356948852539, "global_step": 502734, "epoch": 6057} {"train_loss": -26.328641891479492, "global_step": 502735, "epoch": 6057} {"train_loss": -27.01785659790039, "global_step": 502736, "epoch": 6057} {"train_loss": -26.441938400268555, "global_step": 502737, "epoch": 6057} {"train_loss": -26.71858024597168, "global_step": 502738, "epoch": 6057} {"train_loss": -26.268054962158203, "global_step": 502739, "epoch": 6057} {"train_loss": -26.834924697875977, "global_step": 502740, "epoch": 6057} {"train_loss": -26.810394287109375, "global_step": 502741, "epoch": 6057} {"train_loss": -27.30462074279785, "global_step": 502742, "epoch": 6057} {"train_loss": -26.159351348876953, "global_step": 502743, "epoch": 6057} {"train_loss": -27.176355361938477, "global_step": 502744, "epoch": 6057} {"train_loss": -26.62501335144043, "global_step": 502745, "epoch": 6057} {"train_loss": -27.119089126586914, "global_step": 502746, "epoch": 6057} {"train_loss": -26.75916862487793, "global_step": 502747, "epoch": 6057} {"train_loss": -26.800159454345703, "global_step": 502748, "epoch": 6057} {"train_loss": -26.868383407592773, "global_step": 502749, "epoch": 6057} {"train_loss": -26.888248443603516, "global_step": 502750, "epoch": 6057} {"train_loss": -27.16498374938965, "global_step": 502751, "epoch": 6057} {"train_loss": -27.160552978515625, "global_step": 502752, "epoch": 6057} {"train_loss": -26.73737907409668, "global_step": 502753, "epoch": 6057} {"train_loss": -27.328781127929688, "global_step": 502754, "epoch": 6057} {"train_loss": -27.08253288269043, "global_step": 502755, "epoch": 6057} {"train_loss": -27.289306640625, "global_step": 502756, "epoch": 6057} {"train_loss": -27.0828857421875, "global_step": 502757, "epoch": 6057} {"train_loss": -27.087106704711914, "global_step": 502758, "epoch": 6057} {"train_loss": -27.189849853515625, "global_step": 502759, "epoch": 6057} {"train_loss": -27.323902130126953, "global_step": 502760, "epoch": 6057} {"train_loss": -27.586414337158203, "global_step": 502761, "epoch": 6057} {"train_loss": -27.4721622467041, "global_step": 502762, "epoch": 6057} {"train_loss": -27.227018356323242, "global_step": 502763, "epoch": 6057} {"train_loss": -27.30695915222168, "global_step": 502764, "epoch": 6057} {"train_loss": -27.4547061920166, "global_step": 502765, "epoch": 6057} {"train_loss": -27.389509201049805, "global_step": 502766, "epoch": 6057} {"train_loss": -27.534650802612305, "global_step": 502767, "epoch": 6057} {"train_loss": -27.03104019165039, "global_step": 502768, "epoch": 6057} {"train_loss": -27.440887451171875, "global_step": 502769, "epoch": 6057} {"train_loss": -27.256208419799805, "global_step": 502770, "epoch": 6057} {"train_loss": -27.399656295776367, "global_step": 502771, "epoch": 6057} {"train_loss": -27.570938110351562, "global_step": 502772, "epoch": 6057} {"train_loss": -27.447895050048828, "global_step": 502773, "epoch": 6057} {"train_loss": -27.295881271362305, "global_step": 502774, "epoch": 6057} {"train_loss": -27.424543380737305, "global_step": 502775, "epoch": 6057} {"train_loss": -27.403913497924805, "global_step": 502776, "epoch": 6057} {"train_loss": -27.06024169921875, "global_step": 502777, "epoch": 6057} {"train_loss": -27.391077041625977, "global_step": 502778, "epoch": 6057} {"train_loss": -27.3727970123291, "global_step": 502779, "epoch": 6057} {"train_loss": -27.216176986694336, "global_step": 502780, "epoch": 6057} {"train_loss": -27.43546485900879, "global_step": 502781, "epoch": 6057} {"train_loss": -27.45859146118164, "global_step": 502782, "epoch": 6057} {"train_loss": -27.242446899414062, "global_step": 502783, "epoch": 6057} {"train_loss": -27.577136993408203, "global_step": 502784, "epoch": 6057} {"train_loss": -27.37782096862793, "global_step": 502785, "epoch": 6057} {"train_loss": -27.699390411376953, "global_step": 502786, "epoch": 6057} {"train_loss": -27.576818466186523, "global_step": 502787, "epoch": 6057} {"train_loss": -27.592853546142578, "global_step": 502788, "epoch": 6057} {"train_loss": -27.51959228515625, "global_step": 502789, "epoch": 6057} {"train_loss": -27.749414443969727, "global_step": 502790, "epoch": 6057} {"train_loss": -27.560504913330078, "global_step": 502791, "epoch": 6057} {"train_loss": -27.385181427001953, "global_step": 502792, "epoch": 6057} {"train_loss": -27.968524932861328, "global_step": 502793, "epoch": 6057} {"train_loss": -27.023544311523438, "global_step": 502794, "epoch": 6057} {"train_loss": -27.45249366760254, "global_step": 502795, "epoch": 6057} {"train_loss": -27.207916259765625, "global_step": 502796, "epoch": 6057} {"train_loss": -27.95246696472168, "global_step": 502797, "epoch": 6057} {"train_loss": -27.763320922851562, "global_step": 502798, "epoch": 6057} {"train_loss": -27.428939819335938, "global_step": 502799, "epoch": 6057} {"train_loss": -27.251556396484375, "global_step": 502800, "epoch": 6057} {"train_loss": -27.65984535217285, "global_step": 502801, "epoch": 6057} {"train_loss": -27.74765968322754, "global_step": 502802, "epoch": 6057} {"train_loss": -27.296314239501953, "global_step": 502803, "epoch": 6057} {"train_loss": -27.669910430908203, "global_step": 502804, "epoch": 6057} {"train_loss": -27.25420570373535, "global_step": 502805, "epoch": 6057} {"train_loss": -27.821237564086914, "global_step": 502806, "epoch": 6057} {"train_loss": -27.685626983642578, "global_step": 502807, "epoch": 6057} {"train_loss": -27.08819007873535, "global_step": 502808, "epoch": 6057} {"train_loss": -27.290878295898438, "global_step": 502809, "epoch": 6057} {"train_loss": -27.76800537109375, "global_step": 502810, "epoch": 6057} {"train_loss": -27.417123794555664, "global_step": 502811, "epoch": 6057} {"train_loss": -27.264923095703125, "global_step": 502812, "epoch": 6057} {"train_loss": -27.232674403362964, "global_step": 502813, "epoch": 6057, "val_loss": 6616991.0} {"train_loss": -22.667667388916016, "global_step": 502814, "epoch": 6058} {"train_loss": -25.35240936279297, "global_step": 502815, "epoch": 6058} {"train_loss": -25.018293380737305, "global_step": 502816, "epoch": 6058} {"train_loss": -25.30926513671875, "global_step": 502817, "epoch": 6058} {"train_loss": -25.38031005859375, "global_step": 502818, "epoch": 6058} {"train_loss": -25.304540634155273, "global_step": 502819, "epoch": 6058} {"train_loss": -25.6596622467041, "global_step": 502820, "epoch": 6058} {"train_loss": -25.814411163330078, "global_step": 502821, "epoch": 6058} {"train_loss": -25.82868766784668, "global_step": 502822, "epoch": 6058} {"train_loss": -25.677770614624023, "global_step": 502823, "epoch": 6058} {"train_loss": -25.79022789001465, "global_step": 502824, "epoch": 6058} {"train_loss": -26.27423095703125, "global_step": 502825, "epoch": 6058} {"train_loss": -26.375553131103516, "global_step": 502826, "epoch": 6058} {"train_loss": -26.257740020751953, "global_step": 502827, "epoch": 6058} {"train_loss": -26.67756462097168, "global_step": 502828, "epoch": 6058} {"train_loss": -26.230304718017578, "global_step": 502829, "epoch": 6058} {"train_loss": -26.59568214416504, "global_step": 502830, "epoch": 6058} {"train_loss": -26.255630493164062, "global_step": 502831, "epoch": 6058} {"train_loss": -26.346776962280273, "global_step": 502832, "epoch": 6058} {"train_loss": -26.100860595703125, "global_step": 502833, "epoch": 6058} {"train_loss": -26.420246124267578, "global_step": 502834, "epoch": 6058} {"train_loss": -26.409774780273438, "global_step": 502835, "epoch": 6058} {"train_loss": -26.656940460205078, "global_step": 502836, "epoch": 6058} {"train_loss": -26.484846115112305, "global_step": 502837, "epoch": 6058} {"train_loss": -26.56304931640625, "global_step": 502838, "epoch": 6058} {"train_loss": -26.83066177368164, "global_step": 502839, "epoch": 6058} {"train_loss": -26.63800621032715, "global_step": 502840, "epoch": 6058} {"train_loss": -26.66226577758789, "global_step": 502841, "epoch": 6058} {"train_loss": -26.454069137573242, "global_step": 502842, "epoch": 6058} {"train_loss": -27.078283309936523, "global_step": 502843, "epoch": 6058} {"train_loss": -27.20369529724121, "global_step": 502844, "epoch": 6058} {"train_loss": -26.913742065429688, "global_step": 502845, "epoch": 6058} {"train_loss": -27.011865615844727, "global_step": 502846, "epoch": 6058} {"train_loss": -26.79450798034668, "global_step": 502847, "epoch": 6058} {"train_loss": -26.9077091217041, "global_step": 502848, "epoch": 6058} {"train_loss": -27.00884437561035, "global_step": 502849, "epoch": 6058} {"train_loss": -26.897659301757812, "global_step": 502850, "epoch": 6058} {"train_loss": -26.958921432495117, "global_step": 502851, "epoch": 6058} {"train_loss": -26.8426456451416, "global_step": 502852, "epoch": 6058} {"train_loss": -27.06598472595215, "global_step": 502853, "epoch": 6058} {"train_loss": -27.1809139251709, "global_step": 502854, "epoch": 6058} {"train_loss": -26.95111083984375, "global_step": 502855, "epoch": 6058} {"train_loss": -26.87171745300293, "global_step": 502856, "epoch": 6058} {"train_loss": -27.231536865234375, "global_step": 502857, "epoch": 6058} {"train_loss": -27.1142520904541, "global_step": 502858, "epoch": 6058} {"train_loss": -27.55694580078125, "global_step": 502859, "epoch": 6058} {"train_loss": -27.4262752532959, "global_step": 502860, "epoch": 6058} {"train_loss": -27.350629806518555, "global_step": 502861, "epoch": 6058} {"train_loss": -27.06317710876465, "global_step": 502862, "epoch": 6058} {"train_loss": -27.17097282409668, "global_step": 502863, "epoch": 6058} {"train_loss": -27.64373779296875, "global_step": 502864, "epoch": 6058} {"train_loss": -27.360828399658203, "global_step": 502865, "epoch": 6058} {"train_loss": -27.29654884338379, "global_step": 502866, "epoch": 6058} {"train_loss": -27.041324615478516, "global_step": 502867, "epoch": 6058} {"train_loss": -27.36713981628418, "global_step": 502868, "epoch": 6058} {"train_loss": -27.292062759399414, "global_step": 502869, "epoch": 6058} {"train_loss": -27.452619552612305, "global_step": 502870, "epoch": 6058} {"train_loss": -27.12151527404785, "global_step": 502871, "epoch": 6058} {"train_loss": -27.4832706451416, "global_step": 502872, "epoch": 6058} {"train_loss": -27.452978134155273, "global_step": 502873, "epoch": 6058} {"train_loss": -27.776403427124023, "global_step": 502874, "epoch": 6058} {"train_loss": -27.411075592041016, "global_step": 502875, "epoch": 6058} {"train_loss": -27.51534080505371, "global_step": 502876, "epoch": 6058} {"train_loss": -27.049230575561523, "global_step": 502877, "epoch": 6058} {"train_loss": -27.813016891479492, "global_step": 502878, "epoch": 6058} {"train_loss": -27.444061279296875, "global_step": 502879, "epoch": 6058} {"train_loss": -27.506189346313477, "global_step": 502880, "epoch": 6058} {"train_loss": -27.321645736694336, "global_step": 502881, "epoch": 6058} {"train_loss": -27.33740234375, "global_step": 502882, "epoch": 6058} {"train_loss": -27.480722427368164, "global_step": 502883, "epoch": 6058} {"train_loss": -27.628442764282227, "global_step": 502884, "epoch": 6058} {"train_loss": -27.658344268798828, "global_step": 502885, "epoch": 6058} {"train_loss": -27.626728057861328, "global_step": 502886, "epoch": 6058} {"train_loss": -27.565570831298828, "global_step": 502887, "epoch": 6058} {"train_loss": -27.694501876831055, "global_step": 502888, "epoch": 6058} {"train_loss": -27.54950523376465, "global_step": 502889, "epoch": 6058} {"train_loss": -27.60909080505371, "global_step": 502890, "epoch": 6058} {"train_loss": -27.202199935913086, "global_step": 502891, "epoch": 6058} {"train_loss": -27.406463623046875, "global_step": 502892, "epoch": 6058} {"train_loss": -27.764575958251953, "global_step": 502893, "epoch": 6058} {"train_loss": -27.423547744750977, "global_step": 502894, "epoch": 6058} {"train_loss": -27.571735382080078, "global_step": 502895, "epoch": 6058} {"train_loss": -26.86128347465791, "global_step": 502896, "epoch": 6058, "val_loss": 6609056.0} {"train_loss": -26.108428955078125, "global_step": 502897, "epoch": 6059} {"train_loss": -24.848377227783203, "global_step": 502898, "epoch": 6059} {"train_loss": -26.132795333862305, "global_step": 502899, "epoch": 6059} {"train_loss": -26.818506240844727, "global_step": 502900, "epoch": 6059} {"train_loss": -26.141098022460938, "global_step": 502901, "epoch": 6059} {"train_loss": -26.904132843017578, "global_step": 502902, "epoch": 6059} {"train_loss": -26.17669105529785, "global_step": 502903, "epoch": 6059} {"train_loss": -26.39703941345215, "global_step": 502904, "epoch": 6059} {"train_loss": -26.193878173828125, "global_step": 502905, "epoch": 6059} {"train_loss": -27.28297233581543, "global_step": 502906, "epoch": 6059} {"train_loss": -26.564453125, "global_step": 502907, "epoch": 6059} {"train_loss": -26.65862464904785, "global_step": 502908, "epoch": 6059} {"train_loss": -26.906707763671875, "global_step": 502909, "epoch": 6059} {"train_loss": -26.44315528869629, "global_step": 502910, "epoch": 6059} {"train_loss": -26.811742782592773, "global_step": 502911, "epoch": 6059} {"train_loss": -26.88079261779785, "global_step": 502912, "epoch": 6059} {"train_loss": -26.892560958862305, "global_step": 502913, "epoch": 6059} {"train_loss": -27.137914657592773, "global_step": 502914, "epoch": 6059} {"train_loss": -27.02383804321289, "global_step": 502915, "epoch": 6059} {"train_loss": -27.605222702026367, "global_step": 502916, "epoch": 6059} {"train_loss": -27.00676918029785, "global_step": 502917, "epoch": 6059} {"train_loss": -27.13372802734375, "global_step": 502918, "epoch": 6059} {"train_loss": -26.88728141784668, "global_step": 502919, "epoch": 6059} {"train_loss": -27.036237716674805, "global_step": 502920, "epoch": 6059} {"train_loss": -27.047534942626953, "global_step": 502921, "epoch": 6059} {"train_loss": -27.07355308532715, "global_step": 502922, "epoch": 6059} {"train_loss": -27.3437557220459, "global_step": 502923, "epoch": 6059} {"train_loss": -26.892858505249023, "global_step": 502924, "epoch": 6059} {"train_loss": -27.476621627807617, "global_step": 502925, "epoch": 6059} {"train_loss": -27.258634567260742, "global_step": 502926, "epoch": 6059} {"train_loss": -27.602527618408203, "global_step": 502927, "epoch": 6059} {"train_loss": -27.57380485534668, "global_step": 502928, "epoch": 6059} {"train_loss": -27.33774757385254, "global_step": 502929, "epoch": 6059} {"train_loss": -27.2031192779541, "global_step": 502930, "epoch": 6059} {"train_loss": -27.357818603515625, "global_step": 502931, "epoch": 6059} {"train_loss": -27.527307510375977, "global_step": 502932, "epoch": 6059} {"train_loss": -27.51955223083496, "global_step": 502933, "epoch": 6059} {"train_loss": -27.5443058013916, "global_step": 502934, "epoch": 6059} {"train_loss": -27.502399444580078, "global_step": 502935, "epoch": 6059} {"train_loss": -27.47039794921875, "global_step": 502936, "epoch": 6059} {"train_loss": -27.607196807861328, "global_step": 502937, "epoch": 6059} {"train_loss": -27.589292526245117, "global_step": 502938, "epoch": 6059} {"train_loss": -27.31231117248535, "global_step": 502939, "epoch": 6059} {"train_loss": -27.486682891845703, "global_step": 502940, "epoch": 6059} {"train_loss": -27.4052791595459, "global_step": 502941, "epoch": 6059} {"train_loss": -27.624807357788086, "global_step": 502942, "epoch": 6059} {"train_loss": -27.914325714111328, "global_step": 502943, "epoch": 6059} {"train_loss": -27.243335723876953, "global_step": 502944, "epoch": 6059} {"train_loss": -27.205158233642578, "global_step": 502945, "epoch": 6059} {"train_loss": -27.608291625976562, "global_step": 502946, "epoch": 6059} {"train_loss": -27.858800888061523, "global_step": 502947, "epoch": 6059} {"train_loss": -27.275190353393555, "global_step": 502948, "epoch": 6059} {"train_loss": -27.235280990600586, "global_step": 502949, "epoch": 6059} {"train_loss": -27.33246421813965, "global_step": 502950, "epoch": 6059} {"train_loss": -27.506925582885742, "global_step": 502951, "epoch": 6059} {"train_loss": -27.396352767944336, "global_step": 502952, "epoch": 6059} {"train_loss": -27.811267852783203, "global_step": 502953, "epoch": 6059} {"train_loss": -27.663467407226562, "global_step": 502954, "epoch": 6059} {"train_loss": -27.586898803710938, "global_step": 502955, "epoch": 6059} {"train_loss": -27.299230575561523, "global_step": 502956, "epoch": 6059} {"train_loss": -27.579809188842773, "global_step": 502957, "epoch": 6059} {"train_loss": -27.52503776550293, "global_step": 502958, "epoch": 6059} {"train_loss": -27.279159545898438, "global_step": 502959, "epoch": 6059} {"train_loss": -27.27898597717285, "global_step": 502960, "epoch": 6059} {"train_loss": -27.49879264831543, "global_step": 502961, "epoch": 6059} {"train_loss": -27.7341251373291, "global_step": 502962, "epoch": 6059} {"train_loss": -27.44318199157715, "global_step": 502963, "epoch": 6059} {"train_loss": -27.35627555847168, "global_step": 502964, "epoch": 6059} {"train_loss": -27.317916870117188, "global_step": 502965, "epoch": 6059} {"train_loss": -26.120502471923828, "global_step": 502966, "epoch": 6059} {"train_loss": -26.19571876525879, "global_step": 502967, "epoch": 6059} {"train_loss": -26.5843448638916, "global_step": 502968, "epoch": 6059} {"train_loss": -27.12432861328125, "global_step": 502969, "epoch": 6059} {"train_loss": -26.664838790893555, "global_step": 502970, "epoch": 6059} {"train_loss": -26.865924835205078, "global_step": 502971, "epoch": 6059} {"train_loss": -26.491422653198242, "global_step": 502972, "epoch": 6059} {"train_loss": -26.447711944580078, "global_step": 502973, "epoch": 6059} {"train_loss": -26.776477813720703, "global_step": 502974, "epoch": 6059} {"train_loss": -26.87018394470215, "global_step": 502975, "epoch": 6059} {"train_loss": -26.202138900756836, "global_step": 502976, "epoch": 6059} {"train_loss": -27.0494384765625, "global_step": 502977, "epoch": 6059} {"train_loss": -27.0704402923584, "global_step": 502978, "epoch": 6059} {"train_loss": -27.085974199226104, "global_step": 502979, "epoch": 6059, "val_loss": 6617754.0} {"train_loss": -26.557043075561523, "global_step": 502980, "epoch": 6060} {"train_loss": -25.903644561767578, "global_step": 502981, "epoch": 6060} {"train_loss": -26.562042236328125, "global_step": 502982, "epoch": 6060} {"train_loss": -26.04302406311035, "global_step": 502983, "epoch": 6060} {"train_loss": -26.7060489654541, "global_step": 502984, "epoch": 6060} {"train_loss": -26.05671501159668, "global_step": 502985, "epoch": 6060} {"train_loss": -26.739044189453125, "global_step": 502986, "epoch": 6060} {"train_loss": -26.722274780273438, "global_step": 502987, "epoch": 6060} {"train_loss": -26.560148239135742, "global_step": 502988, "epoch": 6060} {"train_loss": -26.56597900390625, "global_step": 502989, "epoch": 6060} {"train_loss": -26.132970809936523, "global_step": 502990, "epoch": 6060} {"train_loss": -26.7574462890625, "global_step": 502991, "epoch": 6060} {"train_loss": -26.713184356689453, "global_step": 502992, "epoch": 6060} {"train_loss": -27.055936813354492, "global_step": 502993, "epoch": 6060} {"train_loss": -27.0841121673584, "global_step": 502994, "epoch": 6060} {"train_loss": -26.477344512939453, "global_step": 502995, "epoch": 6060} {"train_loss": -26.944990158081055, "global_step": 502996, "epoch": 6060} {"train_loss": -26.929351806640625, "global_step": 502997, "epoch": 6060} {"train_loss": -27.00203514099121, "global_step": 502998, "epoch": 6060} {"train_loss": -27.135284423828125, "global_step": 502999, "epoch": 6060} {"train_loss": -27.227584838867188, "global_step": 503000, "epoch": 6060} {"train_loss": -26.81326675415039, "global_step": 503001, "epoch": 6060} {"train_loss": -26.932241439819336, "global_step": 503002, "epoch": 6060} {"train_loss": -27.192306518554688, "global_step": 503003, "epoch": 6060} {"train_loss": -27.36329460144043, "global_step": 503004, "epoch": 6060} {"train_loss": -26.900848388671875, "global_step": 503005, "epoch": 6060} {"train_loss": -27.60898780822754, "global_step": 503006, "epoch": 6060} {"train_loss": -27.504016876220703, "global_step": 503007, "epoch": 6060} {"train_loss": -27.522916793823242, "global_step": 503008, "epoch": 6060} {"train_loss": -27.2236328125, "global_step": 503009, "epoch": 6060} {"train_loss": -27.30498695373535, "global_step": 503010, "epoch": 6060} {"train_loss": -27.33088493347168, "global_step": 503011, "epoch": 6060} {"train_loss": -27.624988555908203, "global_step": 503012, "epoch": 6060} {"train_loss": -27.445898056030273, "global_step": 503013, "epoch": 6060} {"train_loss": -27.130537033081055, "global_step": 503014, "epoch": 6060} {"train_loss": -27.4724178314209, "global_step": 503015, "epoch": 6060} {"train_loss": -27.21735191345215, "global_step": 503016, "epoch": 6060} {"train_loss": -27.81280517578125, "global_step": 503017, "epoch": 6060} {"train_loss": -27.499067306518555, "global_step": 503018, "epoch": 6060} {"train_loss": -27.3209171295166, "global_step": 503019, "epoch": 6060} {"train_loss": -27.400426864624023, "global_step": 503020, "epoch": 6060} {"train_loss": -27.26637840270996, "global_step": 503021, "epoch": 6060} {"train_loss": -27.363208770751953, "global_step": 503022, "epoch": 6060} {"train_loss": -27.509552001953125, "global_step": 503023, "epoch": 6060} {"train_loss": -27.60068130493164, "global_step": 503024, "epoch": 6060} {"train_loss": -27.721820831298828, "global_step": 503025, "epoch": 6060} {"train_loss": -27.405567169189453, "global_step": 503026, "epoch": 6060} {"train_loss": -27.642974853515625, "global_step": 503027, "epoch": 6060} {"train_loss": -27.300382614135742, "global_step": 503028, "epoch": 6060} {"train_loss": -27.486957550048828, "global_step": 503029, "epoch": 6060} {"train_loss": -27.6014461517334, "global_step": 503030, "epoch": 6060} {"train_loss": -27.677900314331055, "global_step": 503031, "epoch": 6060} {"train_loss": -27.639251708984375, "global_step": 503032, "epoch": 6060} {"train_loss": -27.4061336517334, "global_step": 503033, "epoch": 6060} {"train_loss": -27.238683700561523, "global_step": 503034, "epoch": 6060} {"train_loss": -26.66880226135254, "global_step": 503035, "epoch": 6060} {"train_loss": -27.191436767578125, "global_step": 503036, "epoch": 6060} {"train_loss": -27.575597763061523, "global_step": 503037, "epoch": 6060} {"train_loss": -27.323362350463867, "global_step": 503038, "epoch": 6060} {"train_loss": -27.26597023010254, "global_step": 503039, "epoch": 6060} {"train_loss": -27.520978927612305, "global_step": 503040, "epoch": 6060} {"train_loss": -27.012664794921875, "global_step": 503041, "epoch": 6060} {"train_loss": -27.39534568786621, "global_step": 503042, "epoch": 6060} {"train_loss": -27.359851837158203, "global_step": 503043, "epoch": 6060} {"train_loss": -27.58353042602539, "global_step": 503044, "epoch": 6060} {"train_loss": -27.620370864868164, "global_step": 503045, "epoch": 6060} {"train_loss": -27.178464889526367, "global_step": 503046, "epoch": 6060} {"train_loss": -27.5429630279541, "global_step": 503047, "epoch": 6060} {"train_loss": -27.541162490844727, "global_step": 503048, "epoch": 6060} {"train_loss": -27.591089248657227, "global_step": 503049, "epoch": 6060} {"train_loss": -27.6373348236084, "global_step": 503050, "epoch": 6060} {"train_loss": -27.372220993041992, "global_step": 503051, "epoch": 6060} {"train_loss": -27.511011123657227, "global_step": 503052, "epoch": 6060} {"train_loss": -27.453109741210938, "global_step": 503053, "epoch": 6060} {"train_loss": -27.408905029296875, "global_step": 503054, "epoch": 6060} {"train_loss": -27.167768478393555, "global_step": 503055, "epoch": 6060} {"train_loss": -27.190032958984375, "global_step": 503056, "epoch": 6060} {"train_loss": -27.543832778930664, "global_step": 503057, "epoch": 6060} {"train_loss": -27.314411163330078, "global_step": 503058, "epoch": 6060} {"train_loss": -27.528064727783203, "global_step": 503059, "epoch": 6060} {"train_loss": -27.31095314025879, "global_step": 503060, "epoch": 6060} {"train_loss": -27.525787353515625, "global_step": 503061, "epoch": 6060} {"train_loss": -27.206412786460785, "global_step": 503062, "epoch": 6060, "val_loss": 6565307.5} {"train_loss": -26.81882095336914, "global_step": 503063, "epoch": 6061} {"train_loss": -26.128698348999023, "global_step": 503064, "epoch": 6061} {"train_loss": -26.804737091064453, "global_step": 503065, "epoch": 6061} {"train_loss": -27.1842041015625, "global_step": 503066, "epoch": 6061} {"train_loss": -26.418298721313477, "global_step": 503067, "epoch": 6061} {"train_loss": -27.225555419921875, "global_step": 503068, "epoch": 6061} {"train_loss": -26.380552291870117, "global_step": 503069, "epoch": 6061} {"train_loss": -27.16388511657715, "global_step": 503070, "epoch": 6061} {"train_loss": -26.6932430267334, "global_step": 503071, "epoch": 6061} {"train_loss": -26.75174331665039, "global_step": 503072, "epoch": 6061} {"train_loss": -26.81560707092285, "global_step": 503073, "epoch": 6061} {"train_loss": -26.898761749267578, "global_step": 503074, "epoch": 6061} {"train_loss": -26.81510353088379, "global_step": 503075, "epoch": 6061} {"train_loss": -27.04389762878418, "global_step": 503076, "epoch": 6061} {"train_loss": -27.186853408813477, "global_step": 503077, "epoch": 6061} {"train_loss": -26.72249412536621, "global_step": 503078, "epoch": 6061} {"train_loss": -27.264204025268555, "global_step": 503079, "epoch": 6061} {"train_loss": -27.21065330505371, "global_step": 503080, "epoch": 6061} {"train_loss": -27.243383407592773, "global_step": 503081, "epoch": 6061} {"train_loss": -26.99248695373535, "global_step": 503082, "epoch": 6061} {"train_loss": -26.635244369506836, "global_step": 503083, "epoch": 6061} {"train_loss": -26.995986938476562, "global_step": 503084, "epoch": 6061} {"train_loss": -27.201324462890625, "global_step": 503085, "epoch": 6061} {"train_loss": -27.382959365844727, "global_step": 503086, "epoch": 6061} {"train_loss": -26.922712326049805, "global_step": 503087, "epoch": 6061} {"train_loss": -27.03814125061035, "global_step": 503088, "epoch": 6061} {"train_loss": -27.062488555908203, "global_step": 503089, "epoch": 6061} {"train_loss": -26.872243881225586, "global_step": 503090, "epoch": 6061} {"train_loss": -27.405149459838867, "global_step": 503091, "epoch": 6061} {"train_loss": -27.48187828063965, "global_step": 503092, "epoch": 6061} {"train_loss": -27.5419864654541, "global_step": 503093, "epoch": 6061} {"train_loss": -27.33943748474121, "global_step": 503094, "epoch": 6061} {"train_loss": -27.406667709350586, "global_step": 503095, "epoch": 6061} {"train_loss": -27.389326095581055, "global_step": 503096, "epoch": 6061} {"train_loss": -27.01129150390625, "global_step": 503097, "epoch": 6061} {"train_loss": -27.318220138549805, "global_step": 503098, "epoch": 6061} {"train_loss": -27.639326095581055, "global_step": 503099, "epoch": 6061} {"train_loss": -27.16275405883789, "global_step": 503100, "epoch": 6061} {"train_loss": -27.303375244140625, "global_step": 503101, "epoch": 6061} {"train_loss": -27.517431259155273, "global_step": 503102, "epoch": 6061} {"train_loss": -27.619293212890625, "global_step": 503103, "epoch": 6061} {"train_loss": -27.366317749023438, "global_step": 503104, "epoch": 6061} {"train_loss": -27.49256706237793, "global_step": 503105, "epoch": 6061} {"train_loss": -27.4454345703125, "global_step": 503106, "epoch": 6061} {"train_loss": -27.752851486206055, "global_step": 503107, "epoch": 6061} {"train_loss": -27.602624893188477, "global_step": 503108, "epoch": 6061} {"train_loss": -27.759485244750977, "global_step": 503109, "epoch": 6061} {"train_loss": -27.923725128173828, "global_step": 503110, "epoch": 6061} {"train_loss": -27.582162857055664, "global_step": 503111, "epoch": 6061} {"train_loss": -27.227872848510742, "global_step": 503112, "epoch": 6061} {"train_loss": -27.34674644470215, "global_step": 503113, "epoch": 6061} {"train_loss": -27.199298858642578, "global_step": 503114, "epoch": 6061} {"train_loss": -27.300678253173828, "global_step": 503115, "epoch": 6061} {"train_loss": -28.069305419921875, "global_step": 503116, "epoch": 6061} {"train_loss": -27.39069938659668, "global_step": 503117, "epoch": 6061} {"train_loss": -27.936710357666016, "global_step": 503118, "epoch": 6061} {"train_loss": -27.103490829467773, "global_step": 503119, "epoch": 6061} {"train_loss": -27.489530563354492, "global_step": 503120, "epoch": 6061} {"train_loss": -27.857852935791016, "global_step": 503121, "epoch": 6061} {"train_loss": -27.0396728515625, "global_step": 503122, "epoch": 6061} {"train_loss": -26.741498947143555, "global_step": 503123, "epoch": 6061} {"train_loss": -26.675525665283203, "global_step": 503124, "epoch": 6061} {"train_loss": -26.452804565429688, "global_step": 503125, "epoch": 6061} {"train_loss": -26.847843170166016, "global_step": 503126, "epoch": 6061} {"train_loss": -27.53470230102539, "global_step": 503127, "epoch": 6061} {"train_loss": -27.28850746154785, "global_step": 503128, "epoch": 6061} {"train_loss": -26.874042510986328, "global_step": 503129, "epoch": 6061} {"train_loss": -27.230520248413086, "global_step": 503130, "epoch": 6061} {"train_loss": -27.145456314086914, "global_step": 503131, "epoch": 6061} {"train_loss": -27.27446937561035, "global_step": 503132, "epoch": 6061} {"train_loss": -27.65420913696289, "global_step": 503133, "epoch": 6061} {"train_loss": -27.302204132080078, "global_step": 503134, "epoch": 6061} {"train_loss": -27.344358444213867, "global_step": 503135, "epoch": 6061} {"train_loss": -27.674924850463867, "global_step": 503136, "epoch": 6061} {"train_loss": -27.248859405517578, "global_step": 503137, "epoch": 6061} {"train_loss": -27.241260528564453, "global_step": 503138, "epoch": 6061} {"train_loss": -27.131723403930664, "global_step": 503139, "epoch": 6061} {"train_loss": -27.36260986328125, "global_step": 503140, "epoch": 6061} {"train_loss": -27.57489585876465, "global_step": 503141, "epoch": 6061} {"train_loss": -27.138357162475586, "global_step": 503142, "epoch": 6061} {"train_loss": -27.588611602783203, "global_step": 503143, "epoch": 6061} {"train_loss": -26.937808990478516, "global_step": 503144, "epoch": 6061} {"train_loss": -27.204559716833643, "global_step": 503145, "epoch": 6061, "val_loss": 6538849.0} {"train_loss": -26.5768985748291, "global_step": 503146, "epoch": 6062} {"train_loss": -26.52808952331543, "global_step": 503147, "epoch": 6062} {"train_loss": -26.85365104675293, "global_step": 503148, "epoch": 6062} {"train_loss": -26.732898712158203, "global_step": 503149, "epoch": 6062} {"train_loss": -26.732702255249023, "global_step": 503150, "epoch": 6062} {"train_loss": -26.71240234375, "global_step": 503151, "epoch": 6062} {"train_loss": -26.51173210144043, "global_step": 503152, "epoch": 6062} {"train_loss": -26.664941787719727, "global_step": 503153, "epoch": 6062} {"train_loss": -27.086252212524414, "global_step": 503154, "epoch": 6062} {"train_loss": -26.917936325073242, "global_step": 503155, "epoch": 6062} {"train_loss": -26.98333168029785, "global_step": 503156, "epoch": 6062} {"train_loss": -26.903034210205078, "global_step": 503157, "epoch": 6062} {"train_loss": -26.66937828063965, "global_step": 503158, "epoch": 6062} {"train_loss": -26.93310546875, "global_step": 503159, "epoch": 6062} {"train_loss": -26.85536766052246, "global_step": 503160, "epoch": 6062} {"train_loss": -27.046005249023438, "global_step": 503161, "epoch": 6062} {"train_loss": -26.90341567993164, "global_step": 503162, "epoch": 6062} {"train_loss": -27.03407096862793, "global_step": 503163, "epoch": 6062} {"train_loss": -26.746265411376953, "global_step": 503164, "epoch": 6062} {"train_loss": -27.494110107421875, "global_step": 503165, "epoch": 6062} {"train_loss": -26.84417152404785, "global_step": 503166, "epoch": 6062} {"train_loss": -27.40424919128418, "global_step": 503167, "epoch": 6062} {"train_loss": -26.944446563720703, "global_step": 503168, "epoch": 6062} {"train_loss": -27.164709091186523, "global_step": 503169, "epoch": 6062} {"train_loss": -27.3139591217041, "global_step": 503170, "epoch": 6062} {"train_loss": -27.330341339111328, "global_step": 503171, "epoch": 6062} {"train_loss": -27.509342193603516, "global_step": 503172, "epoch": 6062} {"train_loss": -27.446155548095703, "global_step": 503173, "epoch": 6062} {"train_loss": -27.5578670501709, "global_step": 503174, "epoch": 6062} {"train_loss": -27.260211944580078, "global_step": 503175, "epoch": 6062} {"train_loss": -27.163434982299805, "global_step": 503176, "epoch": 6062} {"train_loss": -27.215063095092773, "global_step": 503177, "epoch": 6062} {"train_loss": -27.41498374938965, "global_step": 503178, "epoch": 6062} {"train_loss": -27.525379180908203, "global_step": 503179, "epoch": 6062} {"train_loss": -27.563879013061523, "global_step": 503180, "epoch": 6062} {"train_loss": -27.08111572265625, "global_step": 503181, "epoch": 6062} {"train_loss": -27.4791259765625, "global_step": 503182, "epoch": 6062} {"train_loss": -27.44830322265625, "global_step": 503183, "epoch": 6062} {"train_loss": -27.366363525390625, "global_step": 503184, "epoch": 6062} {"train_loss": -27.149091720581055, "global_step": 503185, "epoch": 6062} {"train_loss": -27.090656280517578, "global_step": 503186, "epoch": 6062} {"train_loss": -27.631393432617188, "global_step": 503187, "epoch": 6062} {"train_loss": -27.176055908203125, "global_step": 503188, "epoch": 6062} {"train_loss": -27.544330596923828, "global_step": 503189, "epoch": 6062} {"train_loss": -27.7891788482666, "global_step": 503190, "epoch": 6062} {"train_loss": -27.26119041442871, "global_step": 503191, "epoch": 6062} {"train_loss": -27.2205867767334, "global_step": 503192, "epoch": 6062} {"train_loss": -27.80245018005371, "global_step": 503193, "epoch": 6062} {"train_loss": -27.864166259765625, "global_step": 503194, "epoch": 6062} {"train_loss": -27.7575740814209, "global_step": 503195, "epoch": 6062} {"train_loss": -27.714111328125, "global_step": 503196, "epoch": 6062} {"train_loss": -27.581653594970703, "global_step": 503197, "epoch": 6062} {"train_loss": -27.58538818359375, "global_step": 503198, "epoch": 6062} {"train_loss": -27.609649658203125, "global_step": 503199, "epoch": 6062} {"train_loss": -27.45478630065918, "global_step": 503200, "epoch": 6062} {"train_loss": -27.546045303344727, "global_step": 503201, "epoch": 6062} {"train_loss": -27.390302658081055, "global_step": 503202, "epoch": 6062} {"train_loss": -27.529321670532227, "global_step": 503203, "epoch": 6062} {"train_loss": -27.65576171875, "global_step": 503204, "epoch": 6062} {"train_loss": -27.876081466674805, "global_step": 503205, "epoch": 6062} {"train_loss": -27.38971519470215, "global_step": 503206, "epoch": 6062} {"train_loss": -27.585311889648438, "global_step": 503207, "epoch": 6062} {"train_loss": -27.606420516967773, "global_step": 503208, "epoch": 6062} {"train_loss": -27.782779693603516, "global_step": 503209, "epoch": 6062} {"train_loss": -27.7597713470459, "global_step": 503210, "epoch": 6062} {"train_loss": -27.544330596923828, "global_step": 503211, "epoch": 6062} {"train_loss": -27.463422775268555, "global_step": 503212, "epoch": 6062} {"train_loss": -27.693618774414062, "global_step": 503213, "epoch": 6062} {"train_loss": -27.618728637695312, "global_step": 503214, "epoch": 6062} {"train_loss": -27.4960994720459, "global_step": 503215, "epoch": 6062} {"train_loss": -27.704132080078125, "global_step": 503216, "epoch": 6062} {"train_loss": -27.235107421875, "global_step": 503217, "epoch": 6062} {"train_loss": -27.672937393188477, "global_step": 503218, "epoch": 6062} {"train_loss": -27.417245864868164, "global_step": 503219, "epoch": 6062} {"train_loss": -27.469823837280273, "global_step": 503220, "epoch": 6062} {"train_loss": -27.465795516967773, "global_step": 503221, "epoch": 6062} {"train_loss": -26.982511520385742, "global_step": 503222, "epoch": 6062} {"train_loss": -26.792835235595703, "global_step": 503223, "epoch": 6062} {"train_loss": -26.97999382019043, "global_step": 503224, "epoch": 6062} {"train_loss": -27.403217315673828, "global_step": 503225, "epoch": 6062} {"train_loss": -27.176502227783203, "global_step": 503226, "epoch": 6062} {"train_loss": -27.0659122467041, "global_step": 503227, "epoch": 6062} {"train_loss": -27.307298269616552, "global_step": 503228, "epoch": 6062, "val_loss": 6498895.0} {"train_loss": -27.123559951782227, "global_step": 503229, "epoch": 6063} {"train_loss": -26.95893669128418, "global_step": 503230, "epoch": 6063} {"train_loss": -27.154926300048828, "global_step": 503231, "epoch": 6063} {"train_loss": -26.715957641601562, "global_step": 503232, "epoch": 6063} {"train_loss": -26.635229110717773, "global_step": 503233, "epoch": 6063} {"train_loss": -26.788061141967773, "global_step": 503234, "epoch": 6063} {"train_loss": -26.876575469970703, "global_step": 503235, "epoch": 6063} {"train_loss": -27.432767868041992, "global_step": 503236, "epoch": 6063} {"train_loss": -26.57236671447754, "global_step": 503237, "epoch": 6063} {"train_loss": -26.926746368408203, "global_step": 503238, "epoch": 6063} {"train_loss": -26.53541374206543, "global_step": 503239, "epoch": 6063} {"train_loss": -27.064863204956055, "global_step": 503240, "epoch": 6063} {"train_loss": -26.86748695373535, "global_step": 503241, "epoch": 6063} {"train_loss": -27.059545516967773, "global_step": 503242, "epoch": 6063} {"train_loss": -27.4248104095459, "global_step": 503243, "epoch": 6063} {"train_loss": -27.118009567260742, "global_step": 503244, "epoch": 6063} {"train_loss": -26.636022567749023, "global_step": 503245, "epoch": 6063} {"train_loss": -27.355533599853516, "global_step": 503246, "epoch": 6063} {"train_loss": -27.16766357421875, "global_step": 503247, "epoch": 6063} {"train_loss": -27.13532066345215, "global_step": 503248, "epoch": 6063} {"train_loss": -27.058917999267578, "global_step": 503249, "epoch": 6063} {"train_loss": -27.42225456237793, "global_step": 503250, "epoch": 6063} {"train_loss": -27.150497436523438, "global_step": 503251, "epoch": 6063} {"train_loss": -27.34332847595215, "global_step": 503252, "epoch": 6063} {"train_loss": -27.537490844726562, "global_step": 503253, "epoch": 6063} {"train_loss": -27.416748046875, "global_step": 503254, "epoch": 6063} {"train_loss": -27.203046798706055, "global_step": 503255, "epoch": 6063} {"train_loss": -27.232336044311523, "global_step": 503256, "epoch": 6063} {"train_loss": -27.292621612548828, "global_step": 503257, "epoch": 6063} {"train_loss": -27.687108993530273, "global_step": 503258, "epoch": 6063} {"train_loss": -27.47153091430664, "global_step": 503259, "epoch": 6063} {"train_loss": -27.375879287719727, "global_step": 503260, "epoch": 6063} {"train_loss": -27.27564811706543, "global_step": 503261, "epoch": 6063} {"train_loss": -27.577716827392578, "global_step": 503262, "epoch": 6063} {"train_loss": -27.24488639831543, "global_step": 503263, "epoch": 6063} {"train_loss": -27.3411808013916, "global_step": 503264, "epoch": 6063} {"train_loss": -27.00263786315918, "global_step": 503265, "epoch": 6063} {"train_loss": -27.54847526550293, "global_step": 503266, "epoch": 6063} {"train_loss": -27.438385009765625, "global_step": 503267, "epoch": 6063} {"train_loss": -27.540372848510742, "global_step": 503268, "epoch": 6063} {"train_loss": -27.40618324279785, "global_step": 503269, "epoch": 6063} {"train_loss": -27.11920166015625, "global_step": 503270, "epoch": 6063} {"train_loss": -27.356159210205078, "global_step": 503271, "epoch": 6063} {"train_loss": -27.4114933013916, "global_step": 503272, "epoch": 6063} {"train_loss": -27.35111427307129, "global_step": 503273, "epoch": 6063} {"train_loss": -27.531341552734375, "global_step": 503274, "epoch": 6063} {"train_loss": -27.238428115844727, "global_step": 503275, "epoch": 6063} {"train_loss": -27.177692413330078, "global_step": 503276, "epoch": 6063} {"train_loss": -27.476606369018555, "global_step": 503277, "epoch": 6063} {"train_loss": -27.36551856994629, "global_step": 503278, "epoch": 6063} {"train_loss": -27.580764770507812, "global_step": 503279, "epoch": 6063} {"train_loss": -27.58062171936035, "global_step": 503280, "epoch": 6063} {"train_loss": -27.151294708251953, "global_step": 503281, "epoch": 6063} {"train_loss": -27.505451202392578, "global_step": 503282, "epoch": 6063} {"train_loss": -28.001636505126953, "global_step": 503283, "epoch": 6063} {"train_loss": -27.72007179260254, "global_step": 503284, "epoch": 6063} {"train_loss": -26.945859909057617, "global_step": 503285, "epoch": 6063} {"train_loss": -27.483877182006836, "global_step": 503286, "epoch": 6063} {"train_loss": -27.453414916992188, "global_step": 503287, "epoch": 6063} {"train_loss": -27.498868942260742, "global_step": 503288, "epoch": 6063} {"train_loss": -27.60340690612793, "global_step": 503289, "epoch": 6063} {"train_loss": -27.400846481323242, "global_step": 503290, "epoch": 6063} {"train_loss": -27.530298233032227, "global_step": 503291, "epoch": 6063} {"train_loss": -27.041357040405273, "global_step": 503292, "epoch": 6063} {"train_loss": -27.344379425048828, "global_step": 503293, "epoch": 6063} {"train_loss": -27.65541648864746, "global_step": 503294, "epoch": 6063} {"train_loss": -27.661685943603516, "global_step": 503295, "epoch": 6063} {"train_loss": -27.724170684814453, "global_step": 503296, "epoch": 6063} {"train_loss": -27.392370223999023, "global_step": 503297, "epoch": 6063} {"train_loss": -27.52521324157715, "global_step": 503298, "epoch": 6063} {"train_loss": -27.488525390625, "global_step": 503299, "epoch": 6063} {"train_loss": -27.23563575744629, "global_step": 503300, "epoch": 6063} {"train_loss": -27.71388816833496, "global_step": 503301, "epoch": 6063} {"train_loss": -27.58832359313965, "global_step": 503302, "epoch": 6063} {"train_loss": -27.673681259155273, "global_step": 503303, "epoch": 6063} {"train_loss": -27.93048667907715, "global_step": 503304, "epoch": 6063} {"train_loss": -27.579435348510742, "global_step": 503305, "epoch": 6063} {"train_loss": -27.64251708984375, "global_step": 503306, "epoch": 6063} {"train_loss": -28.031599044799805, "global_step": 503307, "epoch": 6063} {"train_loss": -27.458663940429688, "global_step": 503308, "epoch": 6063} {"train_loss": -27.56239128112793, "global_step": 503309, "epoch": 6063} {"train_loss": -27.394489288330078, "global_step": 503310, "epoch": 6063} {"train_loss": -27.353723503020873, "global_step": 503311, "epoch": 6063, "val_loss": 6511362.0} {"train_loss": -27.114057540893555, "global_step": 503312, "epoch": 6064} {"train_loss": -27.135868072509766, "global_step": 503313, "epoch": 6064} {"train_loss": -27.059894561767578, "global_step": 503314, "epoch": 6064} {"train_loss": -27.625226974487305, "global_step": 503315, "epoch": 6064} {"train_loss": -27.265832901000977, "global_step": 503316, "epoch": 6064} {"train_loss": -27.67108726501465, "global_step": 503317, "epoch": 6064} {"train_loss": -26.4989013671875, "global_step": 503318, "epoch": 6064} {"train_loss": -27.21895408630371, "global_step": 503319, "epoch": 6064} {"train_loss": -27.012948989868164, "global_step": 503320, "epoch": 6064} {"train_loss": -27.41950035095215, "global_step": 503321, "epoch": 6064} {"train_loss": -26.874561309814453, "global_step": 503322, "epoch": 6064} {"train_loss": -27.1705379486084, "global_step": 503323, "epoch": 6064} {"train_loss": -26.788299560546875, "global_step": 503324, "epoch": 6064} {"train_loss": -26.138105392456055, "global_step": 503325, "epoch": 6064} {"train_loss": -26.96405029296875, "global_step": 503326, "epoch": 6064} {"train_loss": -26.954931259155273, "global_step": 503327, "epoch": 6064} {"train_loss": -27.196048736572266, "global_step": 503328, "epoch": 6064} {"train_loss": -26.900836944580078, "global_step": 503329, "epoch": 6064} {"train_loss": -26.9417724609375, "global_step": 503330, "epoch": 6064} {"train_loss": -26.640506744384766, "global_step": 503331, "epoch": 6064} {"train_loss": -27.289474487304688, "global_step": 503332, "epoch": 6064} {"train_loss": -26.97712516784668, "global_step": 503333, "epoch": 6064} {"train_loss": -27.058069229125977, "global_step": 503334, "epoch": 6064} {"train_loss": -27.36457633972168, "global_step": 503335, "epoch": 6064} {"train_loss": -27.064197540283203, "global_step": 503336, "epoch": 6064} {"train_loss": -27.39459800720215, "global_step": 503337, "epoch": 6064} {"train_loss": -27.766265869140625, "global_step": 503338, "epoch": 6064} {"train_loss": -27.5164737701416, "global_step": 503339, "epoch": 6064} {"train_loss": -27.544824600219727, "global_step": 503340, "epoch": 6064} {"train_loss": -27.34796714782715, "global_step": 503341, "epoch": 6064} {"train_loss": -27.614215850830078, "global_step": 503342, "epoch": 6064} {"train_loss": -27.76141357421875, "global_step": 503343, "epoch": 6064} {"train_loss": -27.4986572265625, "global_step": 503344, "epoch": 6064} {"train_loss": -27.5643253326416, "global_step": 503345, "epoch": 6064} {"train_loss": -27.31760597229004, "global_step": 503346, "epoch": 6064} {"train_loss": -27.561826705932617, "global_step": 503347, "epoch": 6064} {"train_loss": -27.49713706970215, "global_step": 503348, "epoch": 6064} {"train_loss": -27.38872718811035, "global_step": 503349, "epoch": 6064} {"train_loss": -27.4294490814209, "global_step": 503350, "epoch": 6064} {"train_loss": -27.16419792175293, "global_step": 503351, "epoch": 6064} {"train_loss": -27.267698287963867, "global_step": 503352, "epoch": 6064} {"train_loss": -27.550947189331055, "global_step": 503353, "epoch": 6064} {"train_loss": -27.351337432861328, "global_step": 503354, "epoch": 6064} {"train_loss": -27.68763542175293, "global_step": 503355, "epoch": 6064} {"train_loss": -27.552509307861328, "global_step": 503356, "epoch": 6064} {"train_loss": -27.087568283081055, "global_step": 503357, "epoch": 6064} {"train_loss": -27.6506404876709, "global_step": 503358, "epoch": 6064} {"train_loss": -27.376773834228516, "global_step": 503359, "epoch": 6064} {"train_loss": -27.10597038269043, "global_step": 503360, "epoch": 6064} {"train_loss": -27.595300674438477, "global_step": 503361, "epoch": 6064} {"train_loss": -27.4951229095459, "global_step": 503362, "epoch": 6064} {"train_loss": -27.269245147705078, "global_step": 503363, "epoch": 6064} {"train_loss": -27.455121994018555, "global_step": 503364, "epoch": 6064} {"train_loss": -27.18488121032715, "global_step": 503365, "epoch": 6064} {"train_loss": -27.429967880249023, "global_step": 503366, "epoch": 6064} {"train_loss": -27.286670684814453, "global_step": 503367, "epoch": 6064} {"train_loss": -27.55104637145996, "global_step": 503368, "epoch": 6064} {"train_loss": -27.561506271362305, "global_step": 503369, "epoch": 6064} {"train_loss": -27.5172061920166, "global_step": 503370, "epoch": 6064} {"train_loss": -27.10672378540039, "global_step": 503371, "epoch": 6064} {"train_loss": -27.03852653503418, "global_step": 503372, "epoch": 6064} {"train_loss": -25.97442626953125, "global_step": 503373, "epoch": 6064} {"train_loss": -25.9337158203125, "global_step": 503374, "epoch": 6064} {"train_loss": -26.74409294128418, "global_step": 503375, "epoch": 6064} {"train_loss": -26.905988693237305, "global_step": 503376, "epoch": 6064} {"train_loss": -26.93255615234375, "global_step": 503377, "epoch": 6064} {"train_loss": -26.84004783630371, "global_step": 503378, "epoch": 6064} {"train_loss": -27.2587833404541, "global_step": 503379, "epoch": 6064} {"train_loss": -26.527021408081055, "global_step": 503380, "epoch": 6064} {"train_loss": -27.36026382446289, "global_step": 503381, "epoch": 6064} {"train_loss": -27.1739501953125, "global_step": 503382, "epoch": 6064} {"train_loss": -27.368635177612305, "global_step": 503383, "epoch": 6064} {"train_loss": -27.5527286529541, "global_step": 503384, "epoch": 6064} {"train_loss": -27.362720489501953, "global_step": 503385, "epoch": 6064} {"train_loss": -27.304105758666992, "global_step": 503386, "epoch": 6064} {"train_loss": -27.420698165893555, "global_step": 503387, "epoch": 6064} {"train_loss": -27.406091690063477, "global_step": 503388, "epoch": 6064} {"train_loss": -26.9985294342041, "global_step": 503389, "epoch": 6064} {"train_loss": -27.205297470092773, "global_step": 503390, "epoch": 6064} {"train_loss": -27.431812286376953, "global_step": 503391, "epoch": 6064} {"train_loss": -27.322620391845703, "global_step": 503392, "epoch": 6064} {"train_loss": -27.49615478515625, "global_step": 503393, "epoch": 6064} {"train_loss": -27.226239928280016, "global_step": 503394, "epoch": 6064, "val_loss": 6548886.0} {"train_loss": -26.82465934753418, "global_step": 503395, "epoch": 6065} {"train_loss": -27.336658477783203, "global_step": 503396, "epoch": 6065} {"train_loss": -27.465803146362305, "global_step": 503397, "epoch": 6065} {"train_loss": -27.202966690063477, "global_step": 503398, "epoch": 6065} {"train_loss": -27.058612823486328, "global_step": 503399, "epoch": 6065} {"train_loss": -27.815765380859375, "global_step": 503400, "epoch": 6065} {"train_loss": -26.9482421875, "global_step": 503401, "epoch": 6065} {"train_loss": -27.36683464050293, "global_step": 503402, "epoch": 6065} {"train_loss": -27.370458602905273, "global_step": 503403, "epoch": 6065} {"train_loss": -27.27815818786621, "global_step": 503404, "epoch": 6065} {"train_loss": -26.8720645904541, "global_step": 503405, "epoch": 6065} {"train_loss": -27.63922119140625, "global_step": 503406, "epoch": 6065} {"train_loss": -27.164386749267578, "global_step": 503407, "epoch": 6065} {"train_loss": -27.872486114501953, "global_step": 503408, "epoch": 6065} {"train_loss": -27.39801597595215, "global_step": 503409, "epoch": 6065} {"train_loss": -27.504287719726562, "global_step": 503410, "epoch": 6065} {"train_loss": -27.53106117248535, "global_step": 503411, "epoch": 6065} {"train_loss": -27.4730224609375, "global_step": 503412, "epoch": 6065} {"train_loss": -27.28901481628418, "global_step": 503413, "epoch": 6065} {"train_loss": -27.520246505737305, "global_step": 503414, "epoch": 6065} {"train_loss": -27.477222442626953, "global_step": 503415, "epoch": 6065} {"train_loss": -27.21563148498535, "global_step": 503416, "epoch": 6065} {"train_loss": -27.11932373046875, "global_step": 503417, "epoch": 6065} {"train_loss": -27.35101318359375, "global_step": 503418, "epoch": 6065} {"train_loss": -27.5447940826416, "global_step": 503419, "epoch": 6065} {"train_loss": -27.67396354675293, "global_step": 503420, "epoch": 6065} {"train_loss": -27.528980255126953, "global_step": 503421, "epoch": 6065} {"train_loss": -27.3859806060791, "global_step": 503422, "epoch": 6065} {"train_loss": -27.511920928955078, "global_step": 503423, "epoch": 6065} {"train_loss": -27.47064208984375, "global_step": 503424, "epoch": 6065} {"train_loss": -27.731725692749023, "global_step": 503425, "epoch": 6065} {"train_loss": -27.562475204467773, "global_step": 503426, "epoch": 6065} {"train_loss": -27.265140533447266, "global_step": 503427, "epoch": 6065} {"train_loss": -27.491453170776367, "global_step": 503428, "epoch": 6065} {"train_loss": -27.4144229888916, "global_step": 503429, "epoch": 6065} {"train_loss": -27.568695068359375, "global_step": 503430, "epoch": 6065} {"train_loss": -27.615232467651367, "global_step": 503431, "epoch": 6065} {"train_loss": -27.339176177978516, "global_step": 503432, "epoch": 6065} {"train_loss": -27.560888290405273, "global_step": 503433, "epoch": 6065} {"train_loss": -27.86118507385254, "global_step": 503434, "epoch": 6065} {"train_loss": -27.522689819335938, "global_step": 503435, "epoch": 6065} {"train_loss": -27.545705795288086, "global_step": 503436, "epoch": 6065} {"train_loss": -27.693744659423828, "global_step": 503437, "epoch": 6065} {"train_loss": -27.372995376586914, "global_step": 503438, "epoch": 6065} {"train_loss": -27.638629913330078, "global_step": 503439, "epoch": 6065} {"train_loss": -27.418188095092773, "global_step": 503440, "epoch": 6065} {"train_loss": -27.475189208984375, "global_step": 503441, "epoch": 6065} {"train_loss": -27.22479820251465, "global_step": 503442, "epoch": 6065} {"train_loss": -27.10379981994629, "global_step": 503443, "epoch": 6065} {"train_loss": -26.98567771911621, "global_step": 503444, "epoch": 6065} {"train_loss": -26.960926055908203, "global_step": 503445, "epoch": 6065} {"train_loss": -27.580963134765625, "global_step": 503446, "epoch": 6065} {"train_loss": -27.23236656188965, "global_step": 503447, "epoch": 6065} {"train_loss": -27.386245727539062, "global_step": 503448, "epoch": 6065} {"train_loss": -27.083112716674805, "global_step": 503449, "epoch": 6065} {"train_loss": -27.21261978149414, "global_step": 503450, "epoch": 6065} {"train_loss": -27.06294059753418, "global_step": 503451, "epoch": 6065} {"train_loss": -27.42014503479004, "global_step": 503452, "epoch": 6065} {"train_loss": -27.172271728515625, "global_step": 503453, "epoch": 6065} {"train_loss": -27.28571128845215, "global_step": 503454, "epoch": 6065} {"train_loss": -27.51356315612793, "global_step": 503455, "epoch": 6065} {"train_loss": -27.269296646118164, "global_step": 503456, "epoch": 6065} {"train_loss": -27.18692398071289, "global_step": 503457, "epoch": 6065} {"train_loss": -27.53082847595215, "global_step": 503458, "epoch": 6065} {"train_loss": -27.569395065307617, "global_step": 503459, "epoch": 6065} {"train_loss": -27.537214279174805, "global_step": 503460, "epoch": 6065} {"train_loss": -27.634384155273438, "global_step": 503461, "epoch": 6065} {"train_loss": -27.428442001342773, "global_step": 503462, "epoch": 6065} {"train_loss": -27.524173736572266, "global_step": 503463, "epoch": 6065} {"train_loss": -27.4169921875, "global_step": 503464, "epoch": 6065} {"train_loss": -27.3331241607666, "global_step": 503465, "epoch": 6065} {"train_loss": -27.367700576782227, "global_step": 503466, "epoch": 6065} {"train_loss": -27.4782657623291, "global_step": 503467, "epoch": 6065} {"train_loss": -27.508371353149414, "global_step": 503468, "epoch": 6065} {"train_loss": -27.483905792236328, "global_step": 503469, "epoch": 6065} {"train_loss": -27.578771591186523, "global_step": 503470, "epoch": 6065} {"train_loss": -27.2052059173584, "global_step": 503471, "epoch": 6065} {"train_loss": -27.373981475830078, "global_step": 503472, "epoch": 6065} {"train_loss": -27.489160537719727, "global_step": 503473, "epoch": 6065} {"train_loss": -27.285263061523438, "global_step": 503474, "epoch": 6065} {"train_loss": -27.5565128326416, "global_step": 503475, "epoch": 6065} {"train_loss": -27.581388473510742, "global_step": 503476, "epoch": 6065} {"train_loss": -27.405801520290144, "global_step": 503477, "epoch": 6065, "val_loss": 6517629.0} {"train_loss": -26.803674697875977, "global_step": 503478, "epoch": 6066} {"train_loss": -27.033506393432617, "global_step": 503479, "epoch": 6066} {"train_loss": -26.22175407409668, "global_step": 503480, "epoch": 6066} {"train_loss": -26.963987350463867, "global_step": 503481, "epoch": 6066} {"train_loss": -27.352157592773438, "global_step": 503482, "epoch": 6066} {"train_loss": -26.764469146728516, "global_step": 503483, "epoch": 6066} {"train_loss": -26.667327880859375, "global_step": 503484, "epoch": 6066} {"train_loss": -26.950071334838867, "global_step": 503485, "epoch": 6066} {"train_loss": -26.804401397705078, "global_step": 503486, "epoch": 6066} {"train_loss": -27.21845054626465, "global_step": 503487, "epoch": 6066} {"train_loss": -27.001737594604492, "global_step": 503488, "epoch": 6066} {"train_loss": -26.9974422454834, "global_step": 503489, "epoch": 6066} {"train_loss": -27.17618751525879, "global_step": 503490, "epoch": 6066} {"train_loss": -26.8009090423584, "global_step": 503491, "epoch": 6066} {"train_loss": -27.04685401916504, "global_step": 503492, "epoch": 6066} {"train_loss": -27.331220626831055, "global_step": 503493, "epoch": 6066} {"train_loss": -27.106189727783203, "global_step": 503494, "epoch": 6066} {"train_loss": -27.16348648071289, "global_step": 503495, "epoch": 6066} {"train_loss": -27.396032333374023, "global_step": 503496, "epoch": 6066} {"train_loss": -27.282623291015625, "global_step": 503497, "epoch": 6066} {"train_loss": -27.228824615478516, "global_step": 503498, "epoch": 6066} {"train_loss": -27.209991455078125, "global_step": 503499, "epoch": 6066} {"train_loss": -27.179046630859375, "global_step": 503500, "epoch": 6066} {"train_loss": -26.91876220703125, "global_step": 503501, "epoch": 6066} {"train_loss": -27.492002487182617, "global_step": 503502, "epoch": 6066} {"train_loss": -27.083972930908203, "global_step": 503503, "epoch": 6066} {"train_loss": -27.0491943359375, "global_step": 503504, "epoch": 6066} {"train_loss": -26.81818962097168, "global_step": 503505, "epoch": 6066} {"train_loss": -27.96392822265625, "global_step": 503506, "epoch": 6066} {"train_loss": -27.32159996032715, "global_step": 503507, "epoch": 6066} {"train_loss": -27.631942749023438, "global_step": 503508, "epoch": 6066} {"train_loss": -27.38811683654785, "global_step": 503509, "epoch": 6066} {"train_loss": -27.16636085510254, "global_step": 503510, "epoch": 6066} {"train_loss": -27.243432998657227, "global_step": 503511, "epoch": 6066} {"train_loss": -27.6774959564209, "global_step": 503512, "epoch": 6066} {"train_loss": -27.560754776000977, "global_step": 503513, "epoch": 6066} {"train_loss": -27.354970932006836, "global_step": 503514, "epoch": 6066} {"train_loss": -27.596698760986328, "global_step": 503515, "epoch": 6066} {"train_loss": -27.699859619140625, "global_step": 503516, "epoch": 6066} {"train_loss": -27.433734893798828, "global_step": 503517, "epoch": 6066} {"train_loss": -27.59260368347168, "global_step": 503518, "epoch": 6066} {"train_loss": -27.476781845092773, "global_step": 503519, "epoch": 6066} {"train_loss": -27.466272354125977, "global_step": 503520, "epoch": 6066} {"train_loss": -27.370044708251953, "global_step": 503521, "epoch": 6066} {"train_loss": -27.899972915649414, "global_step": 503522, "epoch": 6066} {"train_loss": -27.653024673461914, "global_step": 503523, "epoch": 6066} {"train_loss": -27.116886138916016, "global_step": 503524, "epoch": 6066} {"train_loss": -27.276891708374023, "global_step": 503525, "epoch": 6066} {"train_loss": -27.791364669799805, "global_step": 503526, "epoch": 6066} {"train_loss": -27.432937622070312, "global_step": 503527, "epoch": 6066} {"train_loss": -27.68854331970215, "global_step": 503528, "epoch": 6066} {"train_loss": -27.67463493347168, "global_step": 503529, "epoch": 6066} {"train_loss": -27.50641441345215, "global_step": 503530, "epoch": 6066} {"train_loss": -27.94244384765625, "global_step": 503531, "epoch": 6066} {"train_loss": -27.346576690673828, "global_step": 503532, "epoch": 6066} {"train_loss": -27.504261016845703, "global_step": 503533, "epoch": 6066} {"train_loss": -27.2910099029541, "global_step": 503534, "epoch": 6066} {"train_loss": -27.635284423828125, "global_step": 503535, "epoch": 6066} {"train_loss": -27.627017974853516, "global_step": 503536, "epoch": 6066} {"train_loss": -27.555994033813477, "global_step": 503537, "epoch": 6066} {"train_loss": -26.49676513671875, "global_step": 503538, "epoch": 6066} {"train_loss": -26.4337158203125, "global_step": 503539, "epoch": 6066} {"train_loss": -27.335920333862305, "global_step": 503540, "epoch": 6066} {"train_loss": -27.130300521850586, "global_step": 503541, "epoch": 6066} {"train_loss": -26.879377365112305, "global_step": 503542, "epoch": 6066} {"train_loss": -27.755712509155273, "global_step": 503543, "epoch": 6066} {"train_loss": -27.29634666442871, "global_step": 503544, "epoch": 6066} {"train_loss": -27.37495231628418, "global_step": 503545, "epoch": 6066} {"train_loss": -27.0584659576416, "global_step": 503546, "epoch": 6066} {"train_loss": -27.58693504333496, "global_step": 503547, "epoch": 6066} {"train_loss": -27.25685691833496, "global_step": 503548, "epoch": 6066} {"train_loss": -27.192840576171875, "global_step": 503549, "epoch": 6066} {"train_loss": -27.508392333984375, "global_step": 503550, "epoch": 6066} {"train_loss": -27.584943771362305, "global_step": 503551, "epoch": 6066} {"train_loss": -27.5709228515625, "global_step": 503552, "epoch": 6066} {"train_loss": -27.4807186126709, "global_step": 503553, "epoch": 6066} {"train_loss": -27.299596786499023, "global_step": 503554, "epoch": 6066} {"train_loss": -27.320783615112305, "global_step": 503555, "epoch": 6066} {"train_loss": -27.197019577026367, "global_step": 503556, "epoch": 6066} {"train_loss": -27.367822647094727, "global_step": 503557, "epoch": 6066} {"train_loss": -27.061649322509766, "global_step": 503558, "epoch": 6066} {"train_loss": -27.522266387939453, "global_step": 503559, "epoch": 6066} {"train_loss": -27.296512259058204, "global_step": 503560, "epoch": 6066, "val_loss": 6568255.0} {"train_loss": -26.834457397460938, "global_step": 503561, "epoch": 6067} {"train_loss": -26.6229248046875, "global_step": 503562, "epoch": 6067} {"train_loss": -26.477258682250977, "global_step": 503563, "epoch": 6067} {"train_loss": -27.21453285217285, "global_step": 503564, "epoch": 6067} {"train_loss": -26.186965942382812, "global_step": 503565, "epoch": 6067} {"train_loss": -27.018707275390625, "global_step": 503566, "epoch": 6067} {"train_loss": -26.713354110717773, "global_step": 503567, "epoch": 6067} {"train_loss": -27.203601837158203, "global_step": 503568, "epoch": 6067} {"train_loss": -26.629621505737305, "global_step": 503569, "epoch": 6067} {"train_loss": -26.008773803710938, "global_step": 503570, "epoch": 6067} {"train_loss": -26.505706787109375, "global_step": 503571, "epoch": 6067} {"train_loss": -27.03997802734375, "global_step": 503572, "epoch": 6067} {"train_loss": -26.191503524780273, "global_step": 503573, "epoch": 6067} {"train_loss": -26.902332305908203, "global_step": 503574, "epoch": 6067} {"train_loss": -27.178205490112305, "global_step": 503575, "epoch": 6067} {"train_loss": -26.5999698638916, "global_step": 503576, "epoch": 6067} {"train_loss": -26.79450035095215, "global_step": 503577, "epoch": 6067} {"train_loss": -26.923477172851562, "global_step": 503578, "epoch": 6067} {"train_loss": -27.10957145690918, "global_step": 503579, "epoch": 6067} {"train_loss": -26.868200302124023, "global_step": 503580, "epoch": 6067} {"train_loss": -27.18854331970215, "global_step": 503581, "epoch": 6067} {"train_loss": -27.295551300048828, "global_step": 503582, "epoch": 6067} {"train_loss": -27.133289337158203, "global_step": 503583, "epoch": 6067} {"train_loss": -27.509429931640625, "global_step": 503584, "epoch": 6067} {"train_loss": -27.22615623474121, "global_step": 503585, "epoch": 6067} {"train_loss": -27.175928115844727, "global_step": 503586, "epoch": 6067} {"train_loss": -27.091690063476562, "global_step": 503587, "epoch": 6067} {"train_loss": -27.355438232421875, "global_step": 503588, "epoch": 6067} {"train_loss": -26.9874324798584, "global_step": 503589, "epoch": 6067} {"train_loss": -27.11823081970215, "global_step": 503590, "epoch": 6067} {"train_loss": -27.132123947143555, "global_step": 503591, "epoch": 6067} {"train_loss": -27.4641056060791, "global_step": 503592, "epoch": 6067} {"train_loss": -27.190082550048828, "global_step": 503593, "epoch": 6067} {"train_loss": -27.049543380737305, "global_step": 503594, "epoch": 6067} {"train_loss": -27.352807998657227, "global_step": 503595, "epoch": 6067} {"train_loss": -27.242307662963867, "global_step": 503596, "epoch": 6067} {"train_loss": -26.84250259399414, "global_step": 503597, "epoch": 6067} {"train_loss": -27.582990646362305, "global_step": 503598, "epoch": 6067} {"train_loss": -27.027429580688477, "global_step": 503599, "epoch": 6067} {"train_loss": -27.397705078125, "global_step": 503600, "epoch": 6067} {"train_loss": -27.63360595703125, "global_step": 503601, "epoch": 6067} {"train_loss": -27.29255485534668, "global_step": 503602, "epoch": 6067} {"train_loss": -27.79620933532715, "global_step": 503603, "epoch": 6067} {"train_loss": -27.33247947692871, "global_step": 503604, "epoch": 6067} {"train_loss": -27.24329948425293, "global_step": 503605, "epoch": 6067} {"train_loss": -27.461807250976562, "global_step": 503606, "epoch": 6067} {"train_loss": -27.0849552154541, "global_step": 503607, "epoch": 6067} {"train_loss": -27.537160873413086, "global_step": 503608, "epoch": 6067} {"train_loss": -27.300586700439453, "global_step": 503609, "epoch": 6067} {"train_loss": -27.0871524810791, "global_step": 503610, "epoch": 6067} {"train_loss": -27.177549362182617, "global_step": 503611, "epoch": 6067} {"train_loss": -27.484146118164062, "global_step": 503612, "epoch": 6067} {"train_loss": -27.227182388305664, "global_step": 503613, "epoch": 6067} {"train_loss": -27.566253662109375, "global_step": 503614, "epoch": 6067} {"train_loss": -27.42042350769043, "global_step": 503615, "epoch": 6067} {"train_loss": -27.57269859313965, "global_step": 503616, "epoch": 6067} {"train_loss": -27.564260482788086, "global_step": 503617, "epoch": 6067} {"train_loss": -27.40839195251465, "global_step": 503618, "epoch": 6067} {"train_loss": -27.398218154907227, "global_step": 503619, "epoch": 6067} {"train_loss": -27.734848022460938, "global_step": 503620, "epoch": 6067} {"train_loss": -27.521026611328125, "global_step": 503621, "epoch": 6067} {"train_loss": -27.11165428161621, "global_step": 503622, "epoch": 6067} {"train_loss": -27.34228515625, "global_step": 503623, "epoch": 6067} {"train_loss": -27.231184005737305, "global_step": 503624, "epoch": 6067} {"train_loss": -27.417936325073242, "global_step": 503625, "epoch": 6067} {"train_loss": -27.431259155273438, "global_step": 503626, "epoch": 6067} {"train_loss": -27.502323150634766, "global_step": 503627, "epoch": 6067} {"train_loss": -27.655973434448242, "global_step": 503628, "epoch": 6067} {"train_loss": -27.097259521484375, "global_step": 503629, "epoch": 6067} {"train_loss": -27.102252960205078, "global_step": 503630, "epoch": 6067} {"train_loss": -27.053808212280273, "global_step": 503631, "epoch": 6067} {"train_loss": -27.745258331298828, "global_step": 503632, "epoch": 6067} {"train_loss": -27.6588191986084, "global_step": 503633, "epoch": 6067} {"train_loss": -27.435546875, "global_step": 503634, "epoch": 6067} {"train_loss": -27.025836944580078, "global_step": 503635, "epoch": 6067} {"train_loss": -27.44782829284668, "global_step": 503636, "epoch": 6067} {"train_loss": -27.83577537536621, "global_step": 503637, "epoch": 6067} {"train_loss": -27.708484649658203, "global_step": 503638, "epoch": 6067} {"train_loss": -27.611303329467773, "global_step": 503639, "epoch": 6067} {"train_loss": -27.557697296142578, "global_step": 503640, "epoch": 6067} {"train_loss": -27.62273597717285, "global_step": 503641, "epoch": 6067} {"train_loss": -27.448301315307617, "global_step": 503642, "epoch": 6067} {"train_loss": -27.223661675510638, "global_step": 503643, "epoch": 6067, "val_loss": 6486217.0} {"train_loss": -26.868432998657227, "global_step": 503644, "epoch": 6068} {"train_loss": -27.0192928314209, "global_step": 503645, "epoch": 6068} {"train_loss": -27.096158981323242, "global_step": 503646, "epoch": 6068} {"train_loss": -26.810932159423828, "global_step": 503647, "epoch": 6068} {"train_loss": -26.846891403198242, "global_step": 503648, "epoch": 6068} {"train_loss": -27.2630672454834, "global_step": 503649, "epoch": 6068} {"train_loss": -27.1175594329834, "global_step": 503650, "epoch": 6068} {"train_loss": -27.270526885986328, "global_step": 503651, "epoch": 6068} {"train_loss": -26.780431747436523, "global_step": 503652, "epoch": 6068} {"train_loss": -27.1652774810791, "global_step": 503653, "epoch": 6068} {"train_loss": -27.4013729095459, "global_step": 503654, "epoch": 6068} {"train_loss": -26.936420440673828, "global_step": 503655, "epoch": 6068} {"train_loss": -27.084508895874023, "global_step": 503656, "epoch": 6068} {"train_loss": -27.864917755126953, "global_step": 503657, "epoch": 6068} {"train_loss": -27.020185470581055, "global_step": 503658, "epoch": 6068} {"train_loss": -27.075681686401367, "global_step": 503659, "epoch": 6068} {"train_loss": -27.352615356445312, "global_step": 503660, "epoch": 6068} {"train_loss": -27.708051681518555, "global_step": 503661, "epoch": 6068} {"train_loss": -27.315963745117188, "global_step": 503662, "epoch": 6068} {"train_loss": -27.061689376831055, "global_step": 503663, "epoch": 6068} {"train_loss": -27.502933502197266, "global_step": 503664, "epoch": 6068} {"train_loss": -27.301361083984375, "global_step": 503665, "epoch": 6068} {"train_loss": -27.765104293823242, "global_step": 503666, "epoch": 6068} {"train_loss": -27.431894302368164, "global_step": 503667, "epoch": 6068} {"train_loss": -27.516637802124023, "global_step": 503668, "epoch": 6068} {"train_loss": -27.561832427978516, "global_step": 503669, "epoch": 6068} {"train_loss": -27.113428115844727, "global_step": 503670, "epoch": 6068} {"train_loss": -27.605457305908203, "global_step": 503671, "epoch": 6068} {"train_loss": -27.9295711517334, "global_step": 503672, "epoch": 6068} {"train_loss": -27.412418365478516, "global_step": 503673, "epoch": 6068} {"train_loss": -27.76534080505371, "global_step": 503674, "epoch": 6068} {"train_loss": -27.551008224487305, "global_step": 503675, "epoch": 6068} {"train_loss": -27.544763565063477, "global_step": 503676, "epoch": 6068} {"train_loss": -27.40164566040039, "global_step": 503677, "epoch": 6068} {"train_loss": -27.33307456970215, "global_step": 503678, "epoch": 6068} {"train_loss": -27.467212677001953, "global_step": 503679, "epoch": 6068} {"train_loss": -27.940393447875977, "global_step": 503680, "epoch": 6068} {"train_loss": -27.456390380859375, "global_step": 503681, "epoch": 6068} {"train_loss": -27.68898582458496, "global_step": 503682, "epoch": 6068} {"train_loss": -27.283117294311523, "global_step": 503683, "epoch": 6068} {"train_loss": -27.493452072143555, "global_step": 503684, "epoch": 6068} {"train_loss": -27.6636905670166, "global_step": 503685, "epoch": 6068} {"train_loss": -27.32032585144043, "global_step": 503686, "epoch": 6068} {"train_loss": -27.560382843017578, "global_step": 503687, "epoch": 6068} {"train_loss": -27.372175216674805, "global_step": 503688, "epoch": 6068} {"train_loss": -27.32196617126465, "global_step": 503689, "epoch": 6068} {"train_loss": -26.63538932800293, "global_step": 503690, "epoch": 6068} {"train_loss": -26.197025299072266, "global_step": 503691, "epoch": 6068} {"train_loss": -26.5488338470459, "global_step": 503692, "epoch": 6068} {"train_loss": -27.085500717163086, "global_step": 503693, "epoch": 6068} {"train_loss": -27.419147491455078, "global_step": 503694, "epoch": 6068} {"train_loss": -27.316986083984375, "global_step": 503695, "epoch": 6068} {"train_loss": -27.131744384765625, "global_step": 503696, "epoch": 6068} {"train_loss": -27.289026260375977, "global_step": 503697, "epoch": 6068} {"train_loss": -27.407766342163086, "global_step": 503698, "epoch": 6068} {"train_loss": -27.474563598632812, "global_step": 503699, "epoch": 6068} {"train_loss": -27.209442138671875, "global_step": 503700, "epoch": 6068} {"train_loss": -27.58344841003418, "global_step": 503701, "epoch": 6068} {"train_loss": -27.577136993408203, "global_step": 503702, "epoch": 6068} {"train_loss": -27.4462890625, "global_step": 503703, "epoch": 6068} {"train_loss": -27.557092666625977, "global_step": 503704, "epoch": 6068} {"train_loss": -27.43910026550293, "global_step": 503705, "epoch": 6068} {"train_loss": -27.604785919189453, "global_step": 503706, "epoch": 6068} {"train_loss": -27.454328536987305, "global_step": 503707, "epoch": 6068} {"train_loss": -27.397079467773438, "global_step": 503708, "epoch": 6068} {"train_loss": -27.764556884765625, "global_step": 503709, "epoch": 6068} {"train_loss": -27.63422966003418, "global_step": 503710, "epoch": 6068} {"train_loss": -27.469785690307617, "global_step": 503711, "epoch": 6068} {"train_loss": -27.61897850036621, "global_step": 503712, "epoch": 6068} {"train_loss": -27.471471786499023, "global_step": 503713, "epoch": 6068} {"train_loss": -27.664072036743164, "global_step": 503714, "epoch": 6068} {"train_loss": -27.775609970092773, "global_step": 503715, "epoch": 6068} {"train_loss": -27.60888671875, "global_step": 503716, "epoch": 6068} {"train_loss": -27.7376766204834, "global_step": 503717, "epoch": 6068} {"train_loss": -27.471179962158203, "global_step": 503718, "epoch": 6068} {"train_loss": -27.620737075805664, "global_step": 503719, "epoch": 6068} {"train_loss": -27.393278121948242, "global_step": 503720, "epoch": 6068} {"train_loss": -27.605497360229492, "global_step": 503721, "epoch": 6068} {"train_loss": -28.028308868408203, "global_step": 503722, "epoch": 6068} {"train_loss": -27.619461059570312, "global_step": 503723, "epoch": 6068} {"train_loss": -27.503570556640625, "global_step": 503724, "epoch": 6068} {"train_loss": -27.921934127807617, "global_step": 503725, "epoch": 6068} {"train_loss": -27.37777585868376, "global_step": 503726, "epoch": 6068, "val_loss": 6448145.0} {"train_loss": -25.579288482666016, "global_step": 503727, "epoch": 6069} {"train_loss": -22.389572143554688, "global_step": 503728, "epoch": 6069} {"train_loss": -21.833667755126953, "global_step": 503729, "epoch": 6069} {"train_loss": -25.84486961364746, "global_step": 503730, "epoch": 6069} {"train_loss": -23.451234817504883, "global_step": 503731, "epoch": 6069} {"train_loss": -25.803848266601562, "global_step": 503732, "epoch": 6069} {"train_loss": -25.422813415527344, "global_step": 503733, "epoch": 6069} {"train_loss": -25.746057510375977, "global_step": 503734, "epoch": 6069} {"train_loss": -25.951093673706055, "global_step": 503735, "epoch": 6069} {"train_loss": -26.06316566467285, "global_step": 503736, "epoch": 6069} {"train_loss": -26.2115421295166, "global_step": 503737, "epoch": 6069} {"train_loss": -26.476240158081055, "global_step": 503738, "epoch": 6069} {"train_loss": -26.21687889099121, "global_step": 503739, "epoch": 6069} {"train_loss": -26.368579864501953, "global_step": 503740, "epoch": 6069} {"train_loss": -26.748950958251953, "global_step": 503741, "epoch": 6069} {"train_loss": -26.49822998046875, "global_step": 503742, "epoch": 6069} {"train_loss": -26.597448348999023, "global_step": 503743, "epoch": 6069} {"train_loss": -26.541654586791992, "global_step": 503744, "epoch": 6069} {"train_loss": -26.739465713500977, "global_step": 503745, "epoch": 6069} {"train_loss": -26.606054306030273, "global_step": 503746, "epoch": 6069} {"train_loss": -26.33669090270996, "global_step": 503747, "epoch": 6069} {"train_loss": -26.362043380737305, "global_step": 503748, "epoch": 6069} {"train_loss": -26.9202880859375, "global_step": 503749, "epoch": 6069} {"train_loss": -26.780553817749023, "global_step": 503750, "epoch": 6069} {"train_loss": -26.757856369018555, "global_step": 503751, "epoch": 6069} {"train_loss": -27.278045654296875, "global_step": 503752, "epoch": 6069} {"train_loss": -26.588781356811523, "global_step": 503753, "epoch": 6069} {"train_loss": -26.950048446655273, "global_step": 503754, "epoch": 6069} {"train_loss": -27.271595001220703, "global_step": 503755, "epoch": 6069} {"train_loss": -27.03462028503418, "global_step": 503756, "epoch": 6069} {"train_loss": -26.854373931884766, "global_step": 503757, "epoch": 6069} {"train_loss": -27.089664459228516, "global_step": 503758, "epoch": 6069} {"train_loss": -27.134479522705078, "global_step": 503759, "epoch": 6069} {"train_loss": -27.10463523864746, "global_step": 503760, "epoch": 6069} {"train_loss": -27.144739151000977, "global_step": 503761, "epoch": 6069} {"train_loss": -27.18668556213379, "global_step": 503762, "epoch": 6069} {"train_loss": -27.038293838500977, "global_step": 503763, "epoch": 6069} {"train_loss": -27.630950927734375, "global_step": 503764, "epoch": 6069} {"train_loss": -27.568098068237305, "global_step": 503765, "epoch": 6069} {"train_loss": -27.023059844970703, "global_step": 503766, "epoch": 6069} {"train_loss": -27.20086097717285, "global_step": 503767, "epoch": 6069} {"train_loss": -27.40011978149414, "global_step": 503768, "epoch": 6069} {"train_loss": -27.449079513549805, "global_step": 503769, "epoch": 6069} {"train_loss": -27.372121810913086, "global_step": 503770, "epoch": 6069} {"train_loss": -27.508087158203125, "global_step": 503771, "epoch": 6069} {"train_loss": -27.508365631103516, "global_step": 503772, "epoch": 6069} {"train_loss": -27.051767349243164, "global_step": 503773, "epoch": 6069} {"train_loss": -27.599023818969727, "global_step": 503774, "epoch": 6069} {"train_loss": -27.399133682250977, "global_step": 503775, "epoch": 6069} {"train_loss": -27.460723876953125, "global_step": 503776, "epoch": 6069} {"train_loss": -27.67023277282715, "global_step": 503777, "epoch": 6069} {"train_loss": -27.425312042236328, "global_step": 503778, "epoch": 6069} {"train_loss": -27.183002471923828, "global_step": 503779, "epoch": 6069} {"train_loss": -27.642614364624023, "global_step": 503780, "epoch": 6069} {"train_loss": -27.407861709594727, "global_step": 503781, "epoch": 6069} {"train_loss": -27.083311080932617, "global_step": 503782, "epoch": 6069} {"train_loss": -27.003326416015625, "global_step": 503783, "epoch": 6069} {"train_loss": -27.16340446472168, "global_step": 503784, "epoch": 6069} {"train_loss": -27.275089263916016, "global_step": 503785, "epoch": 6069} {"train_loss": -27.443262100219727, "global_step": 503786, "epoch": 6069} {"train_loss": -27.424528121948242, "global_step": 503787, "epoch": 6069} {"train_loss": -27.30622673034668, "global_step": 503788, "epoch": 6069} {"train_loss": -27.387723922729492, "global_step": 503789, "epoch": 6069} {"train_loss": -27.037734985351562, "global_step": 503790, "epoch": 6069} {"train_loss": -27.634252548217773, "global_step": 503791, "epoch": 6069} {"train_loss": -27.081140518188477, "global_step": 503792, "epoch": 6069} {"train_loss": -27.386981964111328, "global_step": 503793, "epoch": 6069} {"train_loss": -27.424474716186523, "global_step": 503794, "epoch": 6069} {"train_loss": -27.440031051635742, "global_step": 503795, "epoch": 6069} {"train_loss": -27.313146591186523, "global_step": 503796, "epoch": 6069} {"train_loss": -27.4970760345459, "global_step": 503797, "epoch": 6069} {"train_loss": -27.38654899597168, "global_step": 503798, "epoch": 6069} {"train_loss": -27.733922958374023, "global_step": 503799, "epoch": 6069} {"train_loss": -27.63980484008789, "global_step": 503800, "epoch": 6069} {"train_loss": -27.611042022705078, "global_step": 503801, "epoch": 6069} {"train_loss": -27.3559513092041, "global_step": 503802, "epoch": 6069} {"train_loss": -27.699609756469727, "global_step": 503803, "epoch": 6069} {"train_loss": -27.53680419921875, "global_step": 503804, "epoch": 6069} {"train_loss": -27.36066246032715, "global_step": 503805, "epoch": 6069} {"train_loss": -27.861434936523438, "global_step": 503806, "epoch": 6069} {"train_loss": -27.579824447631836, "global_step": 503807, "epoch": 6069} {"train_loss": -27.911523818969727, "global_step": 503808, "epoch": 6069} {"train_loss": -26.912664964974645, "global_step": 503809, "epoch": 6069, "val_loss": 6553527.0} {"train_loss": -26.888452529907227, "global_step": 503810, "epoch": 6070} {"train_loss": -26.842756271362305, "global_step": 503811, "epoch": 6070} {"train_loss": -27.132104873657227, "global_step": 503812, "epoch": 6070} {"train_loss": -27.10687255859375, "global_step": 503813, "epoch": 6070} {"train_loss": -26.941761016845703, "global_step": 503814, "epoch": 6070} {"train_loss": -27.212011337280273, "global_step": 503815, "epoch": 6070} {"train_loss": -27.18250846862793, "global_step": 503816, "epoch": 6070} {"train_loss": -27.27579689025879, "global_step": 503817, "epoch": 6070} {"train_loss": -27.12320327758789, "global_step": 503818, "epoch": 6070} {"train_loss": -27.781696319580078, "global_step": 503819, "epoch": 6070} {"train_loss": -27.278400421142578, "global_step": 503820, "epoch": 6070} {"train_loss": -26.975732803344727, "global_step": 503821, "epoch": 6070} {"train_loss": -27.317245483398438, "global_step": 503822, "epoch": 6070} {"train_loss": -27.364633560180664, "global_step": 503823, "epoch": 6070} {"train_loss": -27.103530883789062, "global_step": 503824, "epoch": 6070} {"train_loss": -26.806049346923828, "global_step": 503825, "epoch": 6070} {"train_loss": -27.519775390625, "global_step": 503826, "epoch": 6070} {"train_loss": -27.309650421142578, "global_step": 503827, "epoch": 6070} {"train_loss": -27.267166137695312, "global_step": 503828, "epoch": 6070} {"train_loss": -27.458038330078125, "global_step": 503829, "epoch": 6070} {"train_loss": -27.361352920532227, "global_step": 503830, "epoch": 6070} {"train_loss": -27.44778823852539, "global_step": 503831, "epoch": 6070} {"train_loss": -27.593368530273438, "global_step": 503832, "epoch": 6070} {"train_loss": -27.41245460510254, "global_step": 503833, "epoch": 6070} {"train_loss": -27.849111557006836, "global_step": 503834, "epoch": 6070} {"train_loss": -27.589099884033203, "global_step": 503835, "epoch": 6070} {"train_loss": -27.646595001220703, "global_step": 503836, "epoch": 6070} {"train_loss": -27.35470962524414, "global_step": 503837, "epoch": 6070} {"train_loss": -27.75604820251465, "global_step": 503838, "epoch": 6070} {"train_loss": -27.56304931640625, "global_step": 503839, "epoch": 6070} {"train_loss": -27.339191436767578, "global_step": 503840, "epoch": 6070} {"train_loss": -27.591840744018555, "global_step": 503841, "epoch": 6070} {"train_loss": -27.356420516967773, "global_step": 503842, "epoch": 6070} {"train_loss": -27.538061141967773, "global_step": 503843, "epoch": 6070} {"train_loss": -27.34895896911621, "global_step": 503844, "epoch": 6070} {"train_loss": -27.456195831298828, "global_step": 503845, "epoch": 6070} {"train_loss": -27.62859535217285, "global_step": 503846, "epoch": 6070} {"train_loss": -27.75726890563965, "global_step": 503847, "epoch": 6070} {"train_loss": -27.301258087158203, "global_step": 503848, "epoch": 6070} {"train_loss": -27.043691635131836, "global_step": 503849, "epoch": 6070} {"train_loss": -27.639745712280273, "global_step": 503850, "epoch": 6070} {"train_loss": -27.60153579711914, "global_step": 503851, "epoch": 6070} {"train_loss": -27.34319496154785, "global_step": 503852, "epoch": 6070} {"train_loss": -27.71564292907715, "global_step": 503853, "epoch": 6070} {"train_loss": -27.63427734375, "global_step": 503854, "epoch": 6070} {"train_loss": -27.79315757751465, "global_step": 503855, "epoch": 6070} {"train_loss": -27.379953384399414, "global_step": 503856, "epoch": 6070} {"train_loss": -27.76456642150879, "global_step": 503857, "epoch": 6070} {"train_loss": -28.099515914916992, "global_step": 503858, "epoch": 6070} {"train_loss": -27.873580932617188, "global_step": 503859, "epoch": 6070} {"train_loss": -27.361713409423828, "global_step": 503860, "epoch": 6070} {"train_loss": -27.573196411132812, "global_step": 503861, "epoch": 6070} {"train_loss": -27.362401962280273, "global_step": 503862, "epoch": 6070} {"train_loss": -27.403339385986328, "global_step": 503863, "epoch": 6070} {"train_loss": -27.291290283203125, "global_step": 503864, "epoch": 6070} {"train_loss": -27.5163631439209, "global_step": 503865, "epoch": 6070} {"train_loss": -27.823942184448242, "global_step": 503866, "epoch": 6070} {"train_loss": -27.35101318359375, "global_step": 503867, "epoch": 6070} {"train_loss": -27.583906173706055, "global_step": 503868, "epoch": 6070} {"train_loss": -27.173786163330078, "global_step": 503869, "epoch": 6070} {"train_loss": -27.59039878845215, "global_step": 503870, "epoch": 6070} {"train_loss": -27.580154418945312, "global_step": 503871, "epoch": 6070} {"train_loss": -27.31805992126465, "global_step": 503872, "epoch": 6070} {"train_loss": -27.3775577545166, "global_step": 503873, "epoch": 6070} {"train_loss": -27.48609733581543, "global_step": 503874, "epoch": 6070} {"train_loss": -27.55573081970215, "global_step": 503875, "epoch": 6070} {"train_loss": -27.70208740234375, "global_step": 503876, "epoch": 6070} {"train_loss": -27.358362197875977, "global_step": 503877, "epoch": 6070} {"train_loss": -27.29290199279785, "global_step": 503878, "epoch": 6070} {"train_loss": -27.481287002563477, "global_step": 503879, "epoch": 6070} {"train_loss": -27.525671005249023, "global_step": 503880, "epoch": 6070} {"train_loss": -27.658002853393555, "global_step": 503881, "epoch": 6070} {"train_loss": -27.521970748901367, "global_step": 503882, "epoch": 6070} {"train_loss": -27.918380737304688, "global_step": 503883, "epoch": 6070} {"train_loss": -27.617603302001953, "global_step": 503884, "epoch": 6070} {"train_loss": -27.77528190612793, "global_step": 503885, "epoch": 6070} {"train_loss": -27.794036865234375, "global_step": 503886, "epoch": 6070} {"train_loss": -27.610578536987305, "global_step": 503887, "epoch": 6070} {"train_loss": -27.59748649597168, "global_step": 503888, "epoch": 6070} {"train_loss": -27.651599884033203, "global_step": 503889, "epoch": 6070} {"train_loss": -27.698827743530273, "global_step": 503890, "epoch": 6070} {"train_loss": -27.266834259033203, "global_step": 503891, "epoch": 6070} {"train_loss": -27.45048897524914, "global_step": 503892, "epoch": 6070, "val_loss": 6522419.0} {"train_loss": -27.389509201049805, "global_step": 503893, "epoch": 6071} {"train_loss": -27.055463790893555, "global_step": 503894, "epoch": 6071} {"train_loss": -26.8655948638916, "global_step": 503895, "epoch": 6071} {"train_loss": -27.000049591064453, "global_step": 503896, "epoch": 6071} {"train_loss": -26.990619659423828, "global_step": 503897, "epoch": 6071} {"train_loss": -27.611536026000977, "global_step": 503898, "epoch": 6071} {"train_loss": -27.493417739868164, "global_step": 503899, "epoch": 6071} {"train_loss": -27.694547653198242, "global_step": 503900, "epoch": 6071} {"train_loss": -27.113330841064453, "global_step": 503901, "epoch": 6071} {"train_loss": -27.31790542602539, "global_step": 503902, "epoch": 6071} {"train_loss": -27.473236083984375, "global_step": 503903, "epoch": 6071} {"train_loss": -27.2432918548584, "global_step": 503904, "epoch": 6071} {"train_loss": -26.99675941467285, "global_step": 503905, "epoch": 6071} {"train_loss": -27.187408447265625, "global_step": 503906, "epoch": 6071} {"train_loss": -27.066577911376953, "global_step": 503907, "epoch": 6071} {"train_loss": -27.7344970703125, "global_step": 503908, "epoch": 6071} {"train_loss": -27.202621459960938, "global_step": 503909, "epoch": 6071} {"train_loss": -27.164731979370117, "global_step": 503910, "epoch": 6071} {"train_loss": -27.695804595947266, "global_step": 503911, "epoch": 6071} {"train_loss": -27.30788230895996, "global_step": 503912, "epoch": 6071} {"train_loss": -27.01743507385254, "global_step": 503913, "epoch": 6071} {"train_loss": -27.16571044921875, "global_step": 503914, "epoch": 6071} {"train_loss": -27.34554100036621, "global_step": 503915, "epoch": 6071} {"train_loss": -27.43593406677246, "global_step": 503916, "epoch": 6071} {"train_loss": -27.527908325195312, "global_step": 503917, "epoch": 6071} {"train_loss": -27.18351173400879, "global_step": 503918, "epoch": 6071} {"train_loss": -27.49207878112793, "global_step": 503919, "epoch": 6071} {"train_loss": -27.44893455505371, "global_step": 503920, "epoch": 6071} {"train_loss": -27.124876022338867, "global_step": 503921, "epoch": 6071} {"train_loss": -27.754907608032227, "global_step": 503922, "epoch": 6071} {"train_loss": -27.417707443237305, "global_step": 503923, "epoch": 6071} {"train_loss": -27.122663497924805, "global_step": 503924, "epoch": 6071} {"train_loss": -27.4627628326416, "global_step": 503925, "epoch": 6071} {"train_loss": -27.407678604125977, "global_step": 503926, "epoch": 6071} {"train_loss": -27.548755645751953, "global_step": 503927, "epoch": 6071} {"train_loss": -27.13897705078125, "global_step": 503928, "epoch": 6071} {"train_loss": -27.487873077392578, "global_step": 503929, "epoch": 6071} {"train_loss": -27.711584091186523, "global_step": 503930, "epoch": 6071} {"train_loss": -27.648975372314453, "global_step": 503931, "epoch": 6071} {"train_loss": -28.062097549438477, "global_step": 503932, "epoch": 6071} {"train_loss": -27.595905303955078, "global_step": 503933, "epoch": 6071} {"train_loss": -27.521148681640625, "global_step": 503934, "epoch": 6071} {"train_loss": -27.355188369750977, "global_step": 503935, "epoch": 6071} {"train_loss": -27.566741943359375, "global_step": 503936, "epoch": 6071} {"train_loss": -27.335805892944336, "global_step": 503937, "epoch": 6071} {"train_loss": -27.46083641052246, "global_step": 503938, "epoch": 6071} {"train_loss": -27.462726593017578, "global_step": 503939, "epoch": 6071} {"train_loss": -27.3229923248291, "global_step": 503940, "epoch": 6071} {"train_loss": -27.635297775268555, "global_step": 503941, "epoch": 6071} {"train_loss": -27.428152084350586, "global_step": 503942, "epoch": 6071} {"train_loss": -27.30927848815918, "global_step": 503943, "epoch": 6071} {"train_loss": -27.528339385986328, "global_step": 503944, "epoch": 6071} {"train_loss": -27.503448486328125, "global_step": 503945, "epoch": 6071} {"train_loss": -27.741580963134766, "global_step": 503946, "epoch": 6071} {"train_loss": -27.874448776245117, "global_step": 503947, "epoch": 6071} {"train_loss": -27.670690536499023, "global_step": 503948, "epoch": 6071} {"train_loss": -27.521015167236328, "global_step": 503949, "epoch": 6071} {"train_loss": -27.496601104736328, "global_step": 503950, "epoch": 6071} {"train_loss": -27.754465103149414, "global_step": 503951, "epoch": 6071} {"train_loss": -27.540821075439453, "global_step": 503952, "epoch": 6071} {"train_loss": -27.619842529296875, "global_step": 503953, "epoch": 6071} {"train_loss": -27.496274948120117, "global_step": 503954, "epoch": 6071} {"train_loss": -27.4205322265625, "global_step": 503955, "epoch": 6071} {"train_loss": -27.149707794189453, "global_step": 503956, "epoch": 6071} {"train_loss": -28.059467315673828, "global_step": 503957, "epoch": 6071} {"train_loss": -27.458337783813477, "global_step": 503958, "epoch": 6071} {"train_loss": -27.406457901000977, "global_step": 503959, "epoch": 6071} {"train_loss": -27.44441032409668, "global_step": 503960, "epoch": 6071} {"train_loss": -27.836597442626953, "global_step": 503961, "epoch": 6071} {"train_loss": -27.3817138671875, "global_step": 503962, "epoch": 6071} {"train_loss": -27.242467880249023, "global_step": 503963, "epoch": 6071} {"train_loss": -26.9185848236084, "global_step": 503964, "epoch": 6071} {"train_loss": -26.920276641845703, "global_step": 503965, "epoch": 6071} {"train_loss": -26.989105224609375, "global_step": 503966, "epoch": 6071} {"train_loss": -27.030553817749023, "global_step": 503967, "epoch": 6071} {"train_loss": -27.27374839782715, "global_step": 503968, "epoch": 6071} {"train_loss": -27.590927124023438, "global_step": 503969, "epoch": 6071} {"train_loss": -27.304346084594727, "global_step": 503970, "epoch": 6071} {"train_loss": -27.225494384765625, "global_step": 503971, "epoch": 6071} {"train_loss": -27.558828353881836, "global_step": 503972, "epoch": 6071} {"train_loss": -27.421234130859375, "global_step": 503973, "epoch": 6071} {"train_loss": -27.380460739135742, "global_step": 503974, "epoch": 6071} {"train_loss": -27.409499501607502, "global_step": 503975, "epoch": 6071, "val_loss": 6556610.5} {"train_loss": -26.849334716796875, "global_step": 503976, "epoch": 6072} {"train_loss": -26.73394203186035, "global_step": 503977, "epoch": 6072} {"train_loss": -26.833683013916016, "global_step": 503978, "epoch": 6072} {"train_loss": -27.07574462890625, "global_step": 503979, "epoch": 6072} {"train_loss": -27.1072998046875, "global_step": 503980, "epoch": 6072} {"train_loss": -26.659610748291016, "global_step": 503981, "epoch": 6072} {"train_loss": -26.89145278930664, "global_step": 503982, "epoch": 6072} {"train_loss": -26.869375228881836, "global_step": 503983, "epoch": 6072} {"train_loss": -26.933658599853516, "global_step": 503984, "epoch": 6072} {"train_loss": -26.94056510925293, "global_step": 503985, "epoch": 6072} {"train_loss": -26.77076530456543, "global_step": 503986, "epoch": 6072} {"train_loss": -26.939008712768555, "global_step": 503987, "epoch": 6072} {"train_loss": -27.183629989624023, "global_step": 503988, "epoch": 6072} {"train_loss": -27.125553131103516, "global_step": 503989, "epoch": 6072} {"train_loss": -26.712249755859375, "global_step": 503990, "epoch": 6072} {"train_loss": -27.72312355041504, "global_step": 503991, "epoch": 6072} {"train_loss": -27.056806564331055, "global_step": 503992, "epoch": 6072} {"train_loss": -27.621540069580078, "global_step": 503993, "epoch": 6072} {"train_loss": -27.253576278686523, "global_step": 503994, "epoch": 6072} {"train_loss": -27.52828025817871, "global_step": 503995, "epoch": 6072} {"train_loss": -27.171096801757812, "global_step": 503996, "epoch": 6072} {"train_loss": -27.1299991607666, "global_step": 503997, "epoch": 6072} {"train_loss": -27.16584587097168, "global_step": 503998, "epoch": 6072} {"train_loss": -27.160247802734375, "global_step": 503999, "epoch": 6072} {"train_loss": -27.1627254486084, "global_step": 504000, "epoch": 6072} {"train_loss": -27.425256729125977, "global_step": 504001, "epoch": 6072} {"train_loss": -27.427656173706055, "global_step": 504002, "epoch": 6072} {"train_loss": -27.0385684967041, "global_step": 504003, "epoch": 6072} {"train_loss": -27.330984115600586, "global_step": 504004, "epoch": 6072} {"train_loss": -27.351913452148438, "global_step": 504005, "epoch": 6072} {"train_loss": -27.46686363220215, "global_step": 504006, "epoch": 6072} {"train_loss": -27.031024932861328, "global_step": 504007, "epoch": 6072} {"train_loss": -27.678735733032227, "global_step": 504008, "epoch": 6072} {"train_loss": -27.472888946533203, "global_step": 504009, "epoch": 6072} {"train_loss": -27.611425399780273, "global_step": 504010, "epoch": 6072} {"train_loss": -26.983341217041016, "global_step": 504011, "epoch": 6072} {"train_loss": -27.42852783203125, "global_step": 504012, "epoch": 6072} {"train_loss": -27.190448760986328, "global_step": 504013, "epoch": 6072} {"train_loss": -27.657590866088867, "global_step": 504014, "epoch": 6072} {"train_loss": -27.090009689331055, "global_step": 504015, "epoch": 6072} {"train_loss": -27.48738670349121, "global_step": 504016, "epoch": 6072} {"train_loss": -27.478656768798828, "global_step": 504017, "epoch": 6072} {"train_loss": -27.337949752807617, "global_step": 504018, "epoch": 6072} {"train_loss": -27.29025650024414, "global_step": 504019, "epoch": 6072} {"train_loss": -27.440811157226562, "global_step": 504020, "epoch": 6072} {"train_loss": -27.170225143432617, "global_step": 504021, "epoch": 6072} {"train_loss": -27.498655319213867, "global_step": 504022, "epoch": 6072} {"train_loss": -26.973678588867188, "global_step": 504023, "epoch": 6072} {"train_loss": -27.371692657470703, "global_step": 504024, "epoch": 6072} {"train_loss": -27.501943588256836, "global_step": 504025, "epoch": 6072} {"train_loss": -27.84575843811035, "global_step": 504026, "epoch": 6072} {"train_loss": -27.390613555908203, "global_step": 504027, "epoch": 6072} {"train_loss": -27.362533569335938, "global_step": 504028, "epoch": 6072} {"train_loss": -27.633512496948242, "global_step": 504029, "epoch": 6072} {"train_loss": -27.697330474853516, "global_step": 504030, "epoch": 6072} {"train_loss": -27.577381134033203, "global_step": 504031, "epoch": 6072} {"train_loss": -27.42864418029785, "global_step": 504032, "epoch": 6072} {"train_loss": -27.442874908447266, "global_step": 504033, "epoch": 6072} {"train_loss": -27.227035522460938, "global_step": 504034, "epoch": 6072} {"train_loss": -27.18665885925293, "global_step": 504035, "epoch": 6072} {"train_loss": -26.736495971679688, "global_step": 504036, "epoch": 6072} {"train_loss": -26.578699111938477, "global_step": 504037, "epoch": 6072} {"train_loss": -26.19671630859375, "global_step": 504038, "epoch": 6072} {"train_loss": -26.820043563842773, "global_step": 504039, "epoch": 6072} {"train_loss": -27.532337188720703, "global_step": 504040, "epoch": 6072} {"train_loss": -27.00419044494629, "global_step": 504041, "epoch": 6072} {"train_loss": -27.440927505493164, "global_step": 504042, "epoch": 6072} {"train_loss": -27.133026123046875, "global_step": 504043, "epoch": 6072} {"train_loss": -27.4423828125, "global_step": 504044, "epoch": 6072} {"train_loss": -27.324750900268555, "global_step": 504045, "epoch": 6072} {"train_loss": -27.204641342163086, "global_step": 504046, "epoch": 6072} {"train_loss": -27.215635299682617, "global_step": 504047, "epoch": 6072} {"train_loss": -27.844806671142578, "global_step": 504048, "epoch": 6072} {"train_loss": -27.3320369720459, "global_step": 504049, "epoch": 6072} {"train_loss": -27.1064510345459, "global_step": 504050, "epoch": 6072} {"train_loss": -27.666784286499023, "global_step": 504051, "epoch": 6072} {"train_loss": -27.392404556274414, "global_step": 504052, "epoch": 6072} {"train_loss": -27.508773803710938, "global_step": 504053, "epoch": 6072} {"train_loss": -27.567493438720703, "global_step": 504054, "epoch": 6072} {"train_loss": -27.21815299987793, "global_step": 504055, "epoch": 6072} {"train_loss": -27.347448348999023, "global_step": 504056, "epoch": 6072} {"train_loss": -27.236326217651367, "global_step": 504057, "epoch": 6072} {"train_loss": -27.25527227930276, "global_step": 504058, "epoch": 6072, "val_loss": 6652467.0} {"train_loss": -26.59564208984375, "global_step": 504059, "epoch": 6073} {"train_loss": -24.819307327270508, "global_step": 504060, "epoch": 6073} {"train_loss": -26.19086265563965, "global_step": 504061, "epoch": 6073} {"train_loss": -26.774999618530273, "global_step": 504062, "epoch": 6073} {"train_loss": -25.17303466796875, "global_step": 504063, "epoch": 6073} {"train_loss": -26.66110610961914, "global_step": 504064, "epoch": 6073} {"train_loss": -26.17938804626465, "global_step": 504065, "epoch": 6073} {"train_loss": -26.65694236755371, "global_step": 504066, "epoch": 6073} {"train_loss": -26.612110137939453, "global_step": 504067, "epoch": 6073} {"train_loss": -26.051074981689453, "global_step": 504068, "epoch": 6073} {"train_loss": -26.396127700805664, "global_step": 504069, "epoch": 6073} {"train_loss": -26.17844581604004, "global_step": 504070, "epoch": 6073} {"train_loss": -27.259580612182617, "global_step": 504071, "epoch": 6073} {"train_loss": -26.576520919799805, "global_step": 504072, "epoch": 6073} {"train_loss": -26.862112045288086, "global_step": 504073, "epoch": 6073} {"train_loss": -26.679065704345703, "global_step": 504074, "epoch": 6073} {"train_loss": -26.518835067749023, "global_step": 504075, "epoch": 6073} {"train_loss": -26.5119571685791, "global_step": 504076, "epoch": 6073} {"train_loss": -27.052570343017578, "global_step": 504077, "epoch": 6073} {"train_loss": -26.959976196289062, "global_step": 504078, "epoch": 6073} {"train_loss": -27.32830238342285, "global_step": 504079, "epoch": 6073} {"train_loss": -27.65834617614746, "global_step": 504080, "epoch": 6073} {"train_loss": -27.176929473876953, "global_step": 504081, "epoch": 6073} {"train_loss": -26.866119384765625, "global_step": 504082, "epoch": 6073} {"train_loss": -26.88387107849121, "global_step": 504083, "epoch": 6073} {"train_loss": -27.2065486907959, "global_step": 504084, "epoch": 6073} {"train_loss": -27.142377853393555, "global_step": 504085, "epoch": 6073} {"train_loss": -27.347681045532227, "global_step": 504086, "epoch": 6073} {"train_loss": -27.150060653686523, "global_step": 504087, "epoch": 6073} {"train_loss": -26.700407028198242, "global_step": 504088, "epoch": 6073} {"train_loss": -27.25286865234375, "global_step": 504089, "epoch": 6073} {"train_loss": -27.028493881225586, "global_step": 504090, "epoch": 6073} {"train_loss": -27.163965225219727, "global_step": 504091, "epoch": 6073} {"train_loss": -27.12433433532715, "global_step": 504092, "epoch": 6073} {"train_loss": -27.208532333374023, "global_step": 504093, "epoch": 6073} {"train_loss": -27.28907585144043, "global_step": 504094, "epoch": 6073} {"train_loss": -27.41059684753418, "global_step": 504095, "epoch": 6073} {"train_loss": -27.500232696533203, "global_step": 504096, "epoch": 6073} {"train_loss": -27.139814376831055, "global_step": 504097, "epoch": 6073} {"train_loss": -27.235029220581055, "global_step": 504098, "epoch": 6073} {"train_loss": -27.387969970703125, "global_step": 504099, "epoch": 6073} {"train_loss": -27.120929718017578, "global_step": 504100, "epoch": 6073} {"train_loss": -27.301721572875977, "global_step": 504101, "epoch": 6073} {"train_loss": -27.58277702331543, "global_step": 504102, "epoch": 6073} {"train_loss": -27.54975700378418, "global_step": 504103, "epoch": 6073} {"train_loss": -27.58310890197754, "global_step": 504104, "epoch": 6073} {"train_loss": -27.35989761352539, "global_step": 504105, "epoch": 6073} {"train_loss": -27.141876220703125, "global_step": 504106, "epoch": 6073} {"train_loss": -27.585941314697266, "global_step": 504107, "epoch": 6073} {"train_loss": -27.335712432861328, "global_step": 504108, "epoch": 6073} {"train_loss": -27.72823143005371, "global_step": 504109, "epoch": 6073} {"train_loss": -27.520475387573242, "global_step": 504110, "epoch": 6073} {"train_loss": -27.443145751953125, "global_step": 504111, "epoch": 6073} {"train_loss": -27.829273223876953, "global_step": 504112, "epoch": 6073} {"train_loss": -27.441259384155273, "global_step": 504113, "epoch": 6073} {"train_loss": -27.423643112182617, "global_step": 504114, "epoch": 6073} {"train_loss": -27.2127685546875, "global_step": 504115, "epoch": 6073} {"train_loss": -26.40302085876465, "global_step": 504116, "epoch": 6073} {"train_loss": -26.820911407470703, "global_step": 504117, "epoch": 6073} {"train_loss": -27.029483795166016, "global_step": 504118, "epoch": 6073} {"train_loss": -27.49147605895996, "global_step": 504119, "epoch": 6073} {"train_loss": -27.358850479125977, "global_step": 504120, "epoch": 6073} {"train_loss": -26.92603874206543, "global_step": 504121, "epoch": 6073} {"train_loss": -26.582427978515625, "global_step": 504122, "epoch": 6073} {"train_loss": -26.90361976623535, "global_step": 504123, "epoch": 6073} {"train_loss": -25.666040420532227, "global_step": 504124, "epoch": 6073} {"train_loss": -26.057371139526367, "global_step": 504125, "epoch": 6073} {"train_loss": -26.78215980529785, "global_step": 504126, "epoch": 6073} {"train_loss": -27.255664825439453, "global_step": 504127, "epoch": 6073} {"train_loss": -27.194507598876953, "global_step": 504128, "epoch": 6073} {"train_loss": -26.9999942779541, "global_step": 504129, "epoch": 6073} {"train_loss": -27.326751708984375, "global_step": 504130, "epoch": 6073} {"train_loss": -27.104894638061523, "global_step": 504131, "epoch": 6073} {"train_loss": -26.64926528930664, "global_step": 504132, "epoch": 6073} {"train_loss": -27.211095809936523, "global_step": 504133, "epoch": 6073} {"train_loss": -26.974828720092773, "global_step": 504134, "epoch": 6073} {"train_loss": -27.194477081298828, "global_step": 504135, "epoch": 6073} {"train_loss": -27.173908233642578, "global_step": 504136, "epoch": 6073} {"train_loss": -27.16238784790039, "global_step": 504137, "epoch": 6073} {"train_loss": -27.325855255126953, "global_step": 504138, "epoch": 6073} {"train_loss": -27.343236923217773, "global_step": 504139, "epoch": 6073} {"train_loss": -27.491683959960938, "global_step": 504140, "epoch": 6073} {"train_loss": -26.997342948453973, "global_step": 504141, "epoch": 6073, "val_loss": 6685725.0} {"train_loss": -25.97467041015625, "global_step": 504142, "epoch": 6074} {"train_loss": -26.793323516845703, "global_step": 504143, "epoch": 6074} {"train_loss": -26.605371475219727, "global_step": 504144, "epoch": 6074} {"train_loss": -25.845794677734375, "global_step": 504145, "epoch": 6074} {"train_loss": -26.846160888671875, "global_step": 504146, "epoch": 6074} {"train_loss": -26.52326011657715, "global_step": 504147, "epoch": 6074} {"train_loss": -26.494718551635742, "global_step": 504148, "epoch": 6074} {"train_loss": -26.5036678314209, "global_step": 504149, "epoch": 6074} {"train_loss": -26.865659713745117, "global_step": 504150, "epoch": 6074} {"train_loss": -27.385278701782227, "global_step": 504151, "epoch": 6074} {"train_loss": -26.876422882080078, "global_step": 504152, "epoch": 6074} {"train_loss": -26.747922897338867, "global_step": 504153, "epoch": 6074} {"train_loss": -26.888538360595703, "global_step": 504154, "epoch": 6074} {"train_loss": -27.102630615234375, "global_step": 504155, "epoch": 6074} {"train_loss": -27.119953155517578, "global_step": 504156, "epoch": 6074} {"train_loss": -26.9298038482666, "global_step": 504157, "epoch": 6074} {"train_loss": -27.135602951049805, "global_step": 504158, "epoch": 6074} {"train_loss": -26.842981338500977, "global_step": 504159, "epoch": 6074} {"train_loss": -27.33265495300293, "global_step": 504160, "epoch": 6074} {"train_loss": -27.350006103515625, "global_step": 504161, "epoch": 6074} {"train_loss": -27.209949493408203, "global_step": 504162, "epoch": 6074} {"train_loss": -27.355121612548828, "global_step": 504163, "epoch": 6074} {"train_loss": -27.500341415405273, "global_step": 504164, "epoch": 6074} {"train_loss": -27.198923110961914, "global_step": 504165, "epoch": 6074} {"train_loss": -27.2338924407959, "global_step": 504166, "epoch": 6074} {"train_loss": -27.43332290649414, "global_step": 504167, "epoch": 6074} {"train_loss": -27.28596305847168, "global_step": 504168, "epoch": 6074} {"train_loss": -27.352697372436523, "global_step": 504169, "epoch": 6074} {"train_loss": -27.438806533813477, "global_step": 504170, "epoch": 6074} {"train_loss": -27.200672149658203, "global_step": 504171, "epoch": 6074} {"train_loss": -27.194456100463867, "global_step": 504172, "epoch": 6074} {"train_loss": -27.547998428344727, "global_step": 504173, "epoch": 6074} {"train_loss": -27.308273315429688, "global_step": 504174, "epoch": 6074} {"train_loss": -27.122892379760742, "global_step": 504175, "epoch": 6074} {"train_loss": -27.687732696533203, "global_step": 504176, "epoch": 6074} {"train_loss": -27.498891830444336, "global_step": 504177, "epoch": 6074} {"train_loss": -27.718738555908203, "global_step": 504178, "epoch": 6074} {"train_loss": -27.680200576782227, "global_step": 504179, "epoch": 6074} {"train_loss": -27.678424835205078, "global_step": 504180, "epoch": 6074} {"train_loss": -27.07293701171875, "global_step": 504181, "epoch": 6074} {"train_loss": -27.392074584960938, "global_step": 504182, "epoch": 6074} {"train_loss": -27.61146354675293, "global_step": 504183, "epoch": 6074} {"train_loss": -27.35398292541504, "global_step": 504184, "epoch": 6074} {"train_loss": -27.790283203125, "global_step": 504185, "epoch": 6074} {"train_loss": -27.75315284729004, "global_step": 504186, "epoch": 6074} {"train_loss": -27.67414665222168, "global_step": 504187, "epoch": 6074} {"train_loss": -27.22450828552246, "global_step": 504188, "epoch": 6074} {"train_loss": -27.430435180664062, "global_step": 504189, "epoch": 6074} {"train_loss": -27.610700607299805, "global_step": 504190, "epoch": 6074} {"train_loss": -27.407629013061523, "global_step": 504191, "epoch": 6074} {"train_loss": -28.058568954467773, "global_step": 504192, "epoch": 6074} {"train_loss": -27.387481689453125, "global_step": 504193, "epoch": 6074} {"train_loss": -27.248132705688477, "global_step": 504194, "epoch": 6074} {"train_loss": -27.66609764099121, "global_step": 504195, "epoch": 6074} {"train_loss": -27.383161544799805, "global_step": 504196, "epoch": 6074} {"train_loss": -27.02301597595215, "global_step": 504197, "epoch": 6074} {"train_loss": -26.67679214477539, "global_step": 504198, "epoch": 6074} {"train_loss": -26.672826766967773, "global_step": 504199, "epoch": 6074} {"train_loss": -26.00008201599121, "global_step": 504200, "epoch": 6074} {"train_loss": -26.72707176208496, "global_step": 504201, "epoch": 6074} {"train_loss": -26.923492431640625, "global_step": 504202, "epoch": 6074} {"train_loss": -26.494192123413086, "global_step": 504203, "epoch": 6074} {"train_loss": -27.062116622924805, "global_step": 504204, "epoch": 6074} {"train_loss": -27.052215576171875, "global_step": 504205, "epoch": 6074} {"train_loss": -26.885900497436523, "global_step": 504206, "epoch": 6074} {"train_loss": -27.313024520874023, "global_step": 504207, "epoch": 6074} {"train_loss": -27.0615291595459, "global_step": 504208, "epoch": 6074} {"train_loss": -26.9655704498291, "global_step": 504209, "epoch": 6074} {"train_loss": -27.038888931274414, "global_step": 504210, "epoch": 6074} {"train_loss": -26.804471969604492, "global_step": 504211, "epoch": 6074} {"train_loss": -27.08953857421875, "global_step": 504212, "epoch": 6074} {"train_loss": -26.9495906829834, "global_step": 504213, "epoch": 6074} {"train_loss": -27.321496963500977, "global_step": 504214, "epoch": 6074} {"train_loss": -27.515966415405273, "global_step": 504215, "epoch": 6074} {"train_loss": -27.51442527770996, "global_step": 504216, "epoch": 6074} {"train_loss": -27.330108642578125, "global_step": 504217, "epoch": 6074} {"train_loss": -27.070331573486328, "global_step": 504218, "epoch": 6074} {"train_loss": -27.619718551635742, "global_step": 504219, "epoch": 6074} {"train_loss": -27.141571044921875, "global_step": 504220, "epoch": 6074} {"train_loss": -27.660741806030273, "global_step": 504221, "epoch": 6074} {"train_loss": -27.229028701782227, "global_step": 504222, "epoch": 6074} {"train_loss": -27.274423599243164, "global_step": 504223, "epoch": 6074} {"train_loss": -27.16298758265484, "global_step": 504224, "epoch": 6074, "val_loss": 6473349.0} {"train_loss": -27.49969482421875, "global_step": 504225, "epoch": 6075} {"train_loss": -26.835346221923828, "global_step": 504226, "epoch": 6075} {"train_loss": -27.17585563659668, "global_step": 504227, "epoch": 6075} {"train_loss": -26.82423973083496, "global_step": 504228, "epoch": 6075} {"train_loss": -27.683837890625, "global_step": 504229, "epoch": 6075} {"train_loss": -27.3577938079834, "global_step": 504230, "epoch": 6075} {"train_loss": -27.302814483642578, "global_step": 504231, "epoch": 6075} {"train_loss": -27.442291259765625, "global_step": 504232, "epoch": 6075} {"train_loss": -26.970800399780273, "global_step": 504233, "epoch": 6075} {"train_loss": -27.007678985595703, "global_step": 504234, "epoch": 6075} {"train_loss": -27.23056411743164, "global_step": 504235, "epoch": 6075} {"train_loss": -27.191532135009766, "global_step": 504236, "epoch": 6075} {"train_loss": -27.27093505859375, "global_step": 504237, "epoch": 6075} {"train_loss": -26.98648452758789, "global_step": 504238, "epoch": 6075} {"train_loss": -27.414960861206055, "global_step": 504239, "epoch": 6075} {"train_loss": -27.212671279907227, "global_step": 504240, "epoch": 6075} {"train_loss": -27.39520263671875, "global_step": 504241, "epoch": 6075} {"train_loss": -27.426916122436523, "global_step": 504242, "epoch": 6075} {"train_loss": -27.12607765197754, "global_step": 504243, "epoch": 6075} {"train_loss": -27.756052017211914, "global_step": 504244, "epoch": 6075} {"train_loss": -27.725996017456055, "global_step": 504245, "epoch": 6075} {"train_loss": -27.625818252563477, "global_step": 504246, "epoch": 6075} {"train_loss": -27.644092559814453, "global_step": 504247, "epoch": 6075} {"train_loss": -27.512014389038086, "global_step": 504248, "epoch": 6075} {"train_loss": -27.66571617126465, "global_step": 504249, "epoch": 6075} {"train_loss": -27.27277946472168, "global_step": 504250, "epoch": 6075} {"train_loss": -27.56987953186035, "global_step": 504251, "epoch": 6075} {"train_loss": -27.49188232421875, "global_step": 504252, "epoch": 6075} {"train_loss": -27.54449462890625, "global_step": 504253, "epoch": 6075} {"train_loss": -27.278966903686523, "global_step": 504254, "epoch": 6075} {"train_loss": -27.390893936157227, "global_step": 504255, "epoch": 6075} {"train_loss": -27.381229400634766, "global_step": 504256, "epoch": 6075} {"train_loss": -27.496118545532227, "global_step": 504257, "epoch": 6075} {"train_loss": -28.014495849609375, "global_step": 504258, "epoch": 6075} {"train_loss": -27.650358200073242, "global_step": 504259, "epoch": 6075} {"train_loss": -27.595748901367188, "global_step": 504260, "epoch": 6075} {"train_loss": -27.613128662109375, "global_step": 504261, "epoch": 6075} {"train_loss": -27.61573600769043, "global_step": 504262, "epoch": 6075} {"train_loss": -27.777292251586914, "global_step": 504263, "epoch": 6075} {"train_loss": -27.265796661376953, "global_step": 504264, "epoch": 6075} {"train_loss": -27.485721588134766, "global_step": 504265, "epoch": 6075} {"train_loss": -27.255136489868164, "global_step": 504266, "epoch": 6075} {"train_loss": -27.8046875, "global_step": 504267, "epoch": 6075} {"train_loss": -27.67608642578125, "global_step": 504268, "epoch": 6075} {"train_loss": -27.419042587280273, "global_step": 504269, "epoch": 6075} {"train_loss": -27.260379791259766, "global_step": 504270, "epoch": 6075} {"train_loss": -27.42461585998535, "global_step": 504271, "epoch": 6075} {"train_loss": -27.55609130859375, "global_step": 504272, "epoch": 6075} {"train_loss": -27.13911247253418, "global_step": 504273, "epoch": 6075} {"train_loss": -27.837158203125, "global_step": 504274, "epoch": 6075} {"train_loss": -27.369537353515625, "global_step": 504275, "epoch": 6075} {"train_loss": -27.429407119750977, "global_step": 504276, "epoch": 6075} {"train_loss": -27.130359649658203, "global_step": 504277, "epoch": 6075} {"train_loss": -27.467151641845703, "global_step": 504278, "epoch": 6075} {"train_loss": -27.41585350036621, "global_step": 504279, "epoch": 6075} {"train_loss": -27.540023803710938, "global_step": 504280, "epoch": 6075} {"train_loss": -27.47125244140625, "global_step": 504281, "epoch": 6075} {"train_loss": -27.353500366210938, "global_step": 504282, "epoch": 6075} {"train_loss": -27.434223175048828, "global_step": 504283, "epoch": 6075} {"train_loss": -27.223920822143555, "global_step": 504284, "epoch": 6075} {"train_loss": -27.728479385375977, "global_step": 504285, "epoch": 6075} {"train_loss": -27.336191177368164, "global_step": 504286, "epoch": 6075} {"train_loss": -27.22321891784668, "global_step": 504287, "epoch": 6075} {"train_loss": -27.23723793029785, "global_step": 504288, "epoch": 6075} {"train_loss": -27.437793731689453, "global_step": 504289, "epoch": 6075} {"train_loss": -27.337787628173828, "global_step": 504290, "epoch": 6075} {"train_loss": -27.320051193237305, "global_step": 504291, "epoch": 6075} {"train_loss": -27.567785263061523, "global_step": 504292, "epoch": 6075} {"train_loss": -27.599157333374023, "global_step": 504293, "epoch": 6075} {"train_loss": -27.535202026367188, "global_step": 504294, "epoch": 6075} {"train_loss": -27.672134399414062, "global_step": 504295, "epoch": 6075} {"train_loss": -27.268817901611328, "global_step": 504296, "epoch": 6075} {"train_loss": -27.738248825073242, "global_step": 504297, "epoch": 6075} {"train_loss": -27.432373046875, "global_step": 504298, "epoch": 6075} {"train_loss": -27.213550567626953, "global_step": 504299, "epoch": 6075} {"train_loss": -27.42317008972168, "global_step": 504300, "epoch": 6075} {"train_loss": -27.655776977539062, "global_step": 504301, "epoch": 6075} {"train_loss": -27.349227905273438, "global_step": 504302, "epoch": 6075} {"train_loss": -27.416906356811523, "global_step": 504303, "epoch": 6075} {"train_loss": -27.34966468811035, "global_step": 504304, "epoch": 6075} {"train_loss": -27.306554794311523, "global_step": 504305, "epoch": 6075} {"train_loss": -27.984973907470703, "global_step": 504306, "epoch": 6075} {"train_loss": -27.444896950779192, "global_step": 504307, "epoch": 6075, "val_loss": 6444070.0} {"train_loss": -26.984521865844727, "global_step": 504308, "epoch": 6076} {"train_loss": -27.149276733398438, "global_step": 504309, "epoch": 6076} {"train_loss": -27.1230525970459, "global_step": 504310, "epoch": 6076} {"train_loss": -26.9879207611084, "global_step": 504311, "epoch": 6076} {"train_loss": -27.24072265625, "global_step": 504312, "epoch": 6076} {"train_loss": -26.914661407470703, "global_step": 504313, "epoch": 6076} {"train_loss": -26.827167510986328, "global_step": 504314, "epoch": 6076} {"train_loss": -27.084257125854492, "global_step": 504315, "epoch": 6076} {"train_loss": -27.2906494140625, "global_step": 504316, "epoch": 6076} {"train_loss": -27.37114906311035, "global_step": 504317, "epoch": 6076} {"train_loss": -27.061758041381836, "global_step": 504318, "epoch": 6076} {"train_loss": -27.435211181640625, "global_step": 504319, "epoch": 6076} {"train_loss": -27.267576217651367, "global_step": 504320, "epoch": 6076} {"train_loss": -27.21600914001465, "global_step": 504321, "epoch": 6076} {"train_loss": -26.9122371673584, "global_step": 504322, "epoch": 6076} {"train_loss": -27.029211044311523, "global_step": 504323, "epoch": 6076} {"train_loss": -27.161611557006836, "global_step": 504324, "epoch": 6076} {"train_loss": -27.25266456604004, "global_step": 504325, "epoch": 6076} {"train_loss": -27.43537712097168, "global_step": 504326, "epoch": 6076} {"train_loss": -27.156513214111328, "global_step": 504327, "epoch": 6076} {"train_loss": -27.289142608642578, "global_step": 504328, "epoch": 6076} {"train_loss": -27.22503089904785, "global_step": 504329, "epoch": 6076} {"train_loss": -27.226470947265625, "global_step": 504330, "epoch": 6076} {"train_loss": -27.319501876831055, "global_step": 504331, "epoch": 6076} {"train_loss": -27.464008331298828, "global_step": 504332, "epoch": 6076} {"train_loss": -27.707916259765625, "global_step": 504333, "epoch": 6076} {"train_loss": -27.265287399291992, "global_step": 504334, "epoch": 6076} {"train_loss": -27.3787899017334, "global_step": 504335, "epoch": 6076} {"train_loss": -27.541135787963867, "global_step": 504336, "epoch": 6076} {"train_loss": -27.596097946166992, "global_step": 504337, "epoch": 6076} {"train_loss": -27.493860244750977, "global_step": 504338, "epoch": 6076} {"train_loss": -27.685834884643555, "global_step": 504339, "epoch": 6076} {"train_loss": -27.800506591796875, "global_step": 504340, "epoch": 6076} {"train_loss": -27.77324867248535, "global_step": 504341, "epoch": 6076} {"train_loss": -27.365034103393555, "global_step": 504342, "epoch": 6076} {"train_loss": -28.06606101989746, "global_step": 504343, "epoch": 6076} {"train_loss": -27.371143341064453, "global_step": 504344, "epoch": 6076} {"train_loss": -27.59583854675293, "global_step": 504345, "epoch": 6076} {"train_loss": -27.142532348632812, "global_step": 504346, "epoch": 6076} {"train_loss": -27.43336296081543, "global_step": 504347, "epoch": 6076} {"train_loss": -27.22370719909668, "global_step": 504348, "epoch": 6076} {"train_loss": -27.013120651245117, "global_step": 504349, "epoch": 6076} {"train_loss": -27.447439193725586, "global_step": 504350, "epoch": 6076} {"train_loss": -27.620208740234375, "global_step": 504351, "epoch": 6076} {"train_loss": -27.77028465270996, "global_step": 504352, "epoch": 6076} {"train_loss": -27.6367130279541, "global_step": 504353, "epoch": 6076} {"train_loss": -27.569412231445312, "global_step": 504354, "epoch": 6076} {"train_loss": -27.61659049987793, "global_step": 504355, "epoch": 6076} {"train_loss": -27.49421501159668, "global_step": 504356, "epoch": 6076} {"train_loss": -27.31935691833496, "global_step": 504357, "epoch": 6076} {"train_loss": -27.697900772094727, "global_step": 504358, "epoch": 6076} {"train_loss": -27.566862106323242, "global_step": 504359, "epoch": 6076} {"train_loss": -27.523822784423828, "global_step": 504360, "epoch": 6076} {"train_loss": -28.045820236206055, "global_step": 504361, "epoch": 6076} {"train_loss": -27.482187271118164, "global_step": 504362, "epoch": 6076} {"train_loss": -27.515216827392578, "global_step": 504363, "epoch": 6076} {"train_loss": -27.29804801940918, "global_step": 504364, "epoch": 6076} {"train_loss": -26.997949600219727, "global_step": 504365, "epoch": 6076} {"train_loss": -27.162450790405273, "global_step": 504366, "epoch": 6076} {"train_loss": -27.419971466064453, "global_step": 504367, "epoch": 6076} {"train_loss": -27.410436630249023, "global_step": 504368, "epoch": 6076} {"train_loss": -27.644018173217773, "global_step": 504369, "epoch": 6076} {"train_loss": -27.0122013092041, "global_step": 504370, "epoch": 6076} {"train_loss": -27.396728515625, "global_step": 504371, "epoch": 6076} {"train_loss": -27.54157066345215, "global_step": 504372, "epoch": 6076} {"train_loss": -27.62058448791504, "global_step": 504373, "epoch": 6076} {"train_loss": -27.882795333862305, "global_step": 504374, "epoch": 6076} {"train_loss": -27.404455184936523, "global_step": 504375, "epoch": 6076} {"train_loss": -27.33731460571289, "global_step": 504376, "epoch": 6076} {"train_loss": -27.620361328125, "global_step": 504377, "epoch": 6076} {"train_loss": -27.493017196655273, "global_step": 504378, "epoch": 6076} {"train_loss": -27.845407485961914, "global_step": 504379, "epoch": 6076} {"train_loss": -27.707416534423828, "global_step": 504380, "epoch": 6076} {"train_loss": -27.182897567749023, "global_step": 504381, "epoch": 6076} {"train_loss": -27.69648551940918, "global_step": 504382, "epoch": 6076} {"train_loss": -27.490747451782227, "global_step": 504383, "epoch": 6076} {"train_loss": -27.144123077392578, "global_step": 504384, "epoch": 6076} {"train_loss": -27.635343551635742, "global_step": 504385, "epoch": 6076} {"train_loss": -27.316877365112305, "global_step": 504386, "epoch": 6076} {"train_loss": -27.754764556884766, "global_step": 504387, "epoch": 6076} {"train_loss": -27.5417423248291, "global_step": 504388, "epoch": 6076} {"train_loss": -27.3974609375, "global_step": 504389, "epoch": 6076} {"train_loss": -27.40803440507636, "global_step": 504390, "epoch": 6076, "val_loss": 6487891.0} {"train_loss": -26.270465850830078, "global_step": 504391, "epoch": 6077} {"train_loss": -25.84870719909668, "global_step": 504392, "epoch": 6077} {"train_loss": -26.830503463745117, "global_step": 504393, "epoch": 6077} {"train_loss": -26.95135498046875, "global_step": 504394, "epoch": 6077} {"train_loss": -27.016050338745117, "global_step": 504395, "epoch": 6077} {"train_loss": -26.460437774658203, "global_step": 504396, "epoch": 6077} {"train_loss": -26.526264190673828, "global_step": 504397, "epoch": 6077} {"train_loss": -26.894872665405273, "global_step": 504398, "epoch": 6077} {"train_loss": -26.51703453063965, "global_step": 504399, "epoch": 6077} {"train_loss": -26.811132431030273, "global_step": 504400, "epoch": 6077} {"train_loss": -26.81159782409668, "global_step": 504401, "epoch": 6077} {"train_loss": -26.381317138671875, "global_step": 504402, "epoch": 6077} {"train_loss": -26.994495391845703, "global_step": 504403, "epoch": 6077} {"train_loss": -26.831867218017578, "global_step": 504404, "epoch": 6077} {"train_loss": -27.2490291595459, "global_step": 504405, "epoch": 6077} {"train_loss": -26.71485710144043, "global_step": 504406, "epoch": 6077} {"train_loss": -27.09089469909668, "global_step": 504407, "epoch": 6077} {"train_loss": -26.85398292541504, "global_step": 504408, "epoch": 6077} {"train_loss": -26.861408233642578, "global_step": 504409, "epoch": 6077} {"train_loss": -26.8804988861084, "global_step": 504410, "epoch": 6077} {"train_loss": -27.04163932800293, "global_step": 504411, "epoch": 6077} {"train_loss": -27.27085304260254, "global_step": 504412, "epoch": 6077} {"train_loss": -27.118377685546875, "global_step": 504413, "epoch": 6077} {"train_loss": -27.299955368041992, "global_step": 504414, "epoch": 6077} {"train_loss": -27.028827667236328, "global_step": 504415, "epoch": 6077} {"train_loss": -26.908557891845703, "global_step": 504416, "epoch": 6077} {"train_loss": -27.049137115478516, "global_step": 504417, "epoch": 6077} {"train_loss": -27.067874908447266, "global_step": 504418, "epoch": 6077} {"train_loss": -27.137741088867188, "global_step": 504419, "epoch": 6077} {"train_loss": -27.21382713317871, "global_step": 504420, "epoch": 6077} {"train_loss": -26.611913681030273, "global_step": 504421, "epoch": 6077} {"train_loss": -27.83888053894043, "global_step": 504422, "epoch": 6077} {"train_loss": -27.47149085998535, "global_step": 504423, "epoch": 6077} {"train_loss": -27.412826538085938, "global_step": 504424, "epoch": 6077} {"train_loss": -27.544981002807617, "global_step": 504425, "epoch": 6077} {"train_loss": -27.476043701171875, "global_step": 504426, "epoch": 6077} {"train_loss": -27.2370662689209, "global_step": 504427, "epoch": 6077} {"train_loss": -27.803022384643555, "global_step": 504428, "epoch": 6077} {"train_loss": -27.26836585998535, "global_step": 504429, "epoch": 6077} {"train_loss": -27.53582763671875, "global_step": 504430, "epoch": 6077} {"train_loss": -27.34639549255371, "global_step": 504431, "epoch": 6077} {"train_loss": -27.057416915893555, "global_step": 504432, "epoch": 6077} {"train_loss": -27.70069694519043, "global_step": 504433, "epoch": 6077} {"train_loss": -27.585660934448242, "global_step": 504434, "epoch": 6077} {"train_loss": -27.469221115112305, "global_step": 504435, "epoch": 6077} {"train_loss": -27.312255859375, "global_step": 504436, "epoch": 6077} {"train_loss": -27.78445816040039, "global_step": 504437, "epoch": 6077} {"train_loss": -27.91633415222168, "global_step": 504438, "epoch": 6077} {"train_loss": -27.799047470092773, "global_step": 504439, "epoch": 6077} {"train_loss": -27.344654083251953, "global_step": 504440, "epoch": 6077} {"train_loss": -27.576568603515625, "global_step": 504441, "epoch": 6077} {"train_loss": -27.67074966430664, "global_step": 504442, "epoch": 6077} {"train_loss": -27.962772369384766, "global_step": 504443, "epoch": 6077} {"train_loss": -27.554187774658203, "global_step": 504444, "epoch": 6077} {"train_loss": -27.765012741088867, "global_step": 504445, "epoch": 6077} {"train_loss": -27.846893310546875, "global_step": 504446, "epoch": 6077} {"train_loss": -27.793277740478516, "global_step": 504447, "epoch": 6077} {"train_loss": -27.576292037963867, "global_step": 504448, "epoch": 6077} {"train_loss": -27.449283599853516, "global_step": 504449, "epoch": 6077} {"train_loss": -27.80817222595215, "global_step": 504450, "epoch": 6077} {"train_loss": -27.96710205078125, "global_step": 504451, "epoch": 6077} {"train_loss": -27.760725021362305, "global_step": 504452, "epoch": 6077} {"train_loss": -27.883533477783203, "global_step": 504453, "epoch": 6077} {"train_loss": -27.40167808532715, "global_step": 504454, "epoch": 6077} {"train_loss": -27.803730010986328, "global_step": 504455, "epoch": 6077} {"train_loss": -27.897912979125977, "global_step": 504456, "epoch": 6077} {"train_loss": -27.51412010192871, "global_step": 504457, "epoch": 6077} {"train_loss": -27.574386596679688, "global_step": 504458, "epoch": 6077} {"train_loss": -27.457136154174805, "global_step": 504459, "epoch": 6077} {"train_loss": -27.633508682250977, "global_step": 504460, "epoch": 6077} {"train_loss": -27.7721004486084, "global_step": 504461, "epoch": 6077} {"train_loss": -27.395795822143555, "global_step": 504462, "epoch": 6077} {"train_loss": -27.337162017822266, "global_step": 504463, "epoch": 6077} {"train_loss": -27.503753662109375, "global_step": 504464, "epoch": 6077} {"train_loss": -27.8953914642334, "global_step": 504465, "epoch": 6077} {"train_loss": -27.27473258972168, "global_step": 504466, "epoch": 6077} {"train_loss": -27.644025802612305, "global_step": 504467, "epoch": 6077} {"train_loss": -27.04009437561035, "global_step": 504468, "epoch": 6077} {"train_loss": -26.66639518737793, "global_step": 504469, "epoch": 6077} {"train_loss": -25.725133895874023, "global_step": 504470, "epoch": 6077} {"train_loss": -26.451269149780273, "global_step": 504471, "epoch": 6077} {"train_loss": -27.24213981628418, "global_step": 504472, "epoch": 6077} {"train_loss": -27.268490458109294, "global_step": 504473, "epoch": 6077, "val_loss": 6483476.0} {"train_loss": -26.177444458007812, "global_step": 504474, "epoch": 6078} {"train_loss": -25.837270736694336, "global_step": 504475, "epoch": 6078} {"train_loss": -26.137882232666016, "global_step": 504476, "epoch": 6078} {"train_loss": -26.375812530517578, "global_step": 504477, "epoch": 6078} {"train_loss": -25.830551147460938, "global_step": 504478, "epoch": 6078} {"train_loss": -26.798583984375, "global_step": 504479, "epoch": 6078} {"train_loss": -25.902311325073242, "global_step": 504480, "epoch": 6078} {"train_loss": -26.752887725830078, "global_step": 504481, "epoch": 6078} {"train_loss": -26.374582290649414, "global_step": 504482, "epoch": 6078} {"train_loss": -26.474506378173828, "global_step": 504483, "epoch": 6078} {"train_loss": -26.489246368408203, "global_step": 504484, "epoch": 6078} {"train_loss": -26.494144439697266, "global_step": 504485, "epoch": 6078} {"train_loss": -26.67466163635254, "global_step": 504486, "epoch": 6078} {"train_loss": -27.003009796142578, "global_step": 504487, "epoch": 6078} {"train_loss": -26.97171401977539, "global_step": 504488, "epoch": 6078} {"train_loss": -26.42450523376465, "global_step": 504489, "epoch": 6078} {"train_loss": -27.007923126220703, "global_step": 504490, "epoch": 6078} {"train_loss": -26.9941463470459, "global_step": 504491, "epoch": 6078} {"train_loss": -26.95490074157715, "global_step": 504492, "epoch": 6078} {"train_loss": -26.978931427001953, "global_step": 504493, "epoch": 6078} {"train_loss": -26.768808364868164, "global_step": 504494, "epoch": 6078} {"train_loss": -27.11542320251465, "global_step": 504495, "epoch": 6078} {"train_loss": -26.905790328979492, "global_step": 504496, "epoch": 6078} {"train_loss": -27.129383087158203, "global_step": 504497, "epoch": 6078} {"train_loss": -27.239831924438477, "global_step": 504498, "epoch": 6078} {"train_loss": -26.902938842773438, "global_step": 504499, "epoch": 6078} {"train_loss": -27.30966567993164, "global_step": 504500, "epoch": 6078} {"train_loss": -27.270910263061523, "global_step": 504501, "epoch": 6078} {"train_loss": -26.966093063354492, "global_step": 504502, "epoch": 6078} {"train_loss": -27.17563819885254, "global_step": 504503, "epoch": 6078} {"train_loss": -27.37025260925293, "global_step": 504504, "epoch": 6078} {"train_loss": -27.239852905273438, "global_step": 504505, "epoch": 6078} {"train_loss": -27.061065673828125, "global_step": 504506, "epoch": 6078} {"train_loss": -27.161584854125977, "global_step": 504507, "epoch": 6078} {"train_loss": -27.525299072265625, "global_step": 504508, "epoch": 6078} {"train_loss": -27.40130615234375, "global_step": 504509, "epoch": 6078} {"train_loss": -27.237852096557617, "global_step": 504510, "epoch": 6078} {"train_loss": -27.577484130859375, "global_step": 504511, "epoch": 6078} {"train_loss": -27.787830352783203, "global_step": 504512, "epoch": 6078} {"train_loss": -27.461164474487305, "global_step": 504513, "epoch": 6078} {"train_loss": -27.58544921875, "global_step": 504514, "epoch": 6078} {"train_loss": -27.08527946472168, "global_step": 504515, "epoch": 6078} {"train_loss": -27.714069366455078, "global_step": 504516, "epoch": 6078} {"train_loss": -27.793561935424805, "global_step": 504517, "epoch": 6078} {"train_loss": -27.7511043548584, "global_step": 504518, "epoch": 6078} {"train_loss": -27.674753189086914, "global_step": 504519, "epoch": 6078} {"train_loss": -27.390771865844727, "global_step": 504520, "epoch": 6078} {"train_loss": -27.41560173034668, "global_step": 504521, "epoch": 6078} {"train_loss": -27.831146240234375, "global_step": 504522, "epoch": 6078} {"train_loss": -27.653656005859375, "global_step": 504523, "epoch": 6078} {"train_loss": -27.059585571289062, "global_step": 504524, "epoch": 6078} {"train_loss": -27.466094970703125, "global_step": 504525, "epoch": 6078} {"train_loss": -27.449289321899414, "global_step": 504526, "epoch": 6078} {"train_loss": -27.69916343688965, "global_step": 504527, "epoch": 6078} {"train_loss": -27.551013946533203, "global_step": 504528, "epoch": 6078} {"train_loss": -27.36907386779785, "global_step": 504529, "epoch": 6078} {"train_loss": -27.38606071472168, "global_step": 504530, "epoch": 6078} {"train_loss": -27.34598731994629, "global_step": 504531, "epoch": 6078} {"train_loss": -27.67474365234375, "global_step": 504532, "epoch": 6078} {"train_loss": -27.7336368560791, "global_step": 504533, "epoch": 6078} {"train_loss": -27.711339950561523, "global_step": 504534, "epoch": 6078} {"train_loss": -27.71942710876465, "global_step": 504535, "epoch": 6078} {"train_loss": -27.584882736206055, "global_step": 504536, "epoch": 6078} {"train_loss": -27.544668197631836, "global_step": 504537, "epoch": 6078} {"train_loss": -27.723987579345703, "global_step": 504538, "epoch": 6078} {"train_loss": -27.686695098876953, "global_step": 504539, "epoch": 6078} {"train_loss": -27.76849937438965, "global_step": 504540, "epoch": 6078} {"train_loss": -27.838855743408203, "global_step": 504541, "epoch": 6078} {"train_loss": -27.969593048095703, "global_step": 504542, "epoch": 6078} {"train_loss": -27.70777702331543, "global_step": 504543, "epoch": 6078} {"train_loss": -27.410253524780273, "global_step": 504544, "epoch": 6078} {"train_loss": -27.754114151000977, "global_step": 504545, "epoch": 6078} {"train_loss": -27.834903717041016, "global_step": 504546, "epoch": 6078} {"train_loss": -27.590112686157227, "global_step": 504547, "epoch": 6078} {"train_loss": -27.784626007080078, "global_step": 504548, "epoch": 6078} {"train_loss": -27.76218605041504, "global_step": 504549, "epoch": 6078} {"train_loss": -27.3031063079834, "global_step": 504550, "epoch": 6078} {"train_loss": -27.9482421875, "global_step": 504551, "epoch": 6078} {"train_loss": -27.788654327392578, "global_step": 504552, "epoch": 6078} {"train_loss": -27.43802261352539, "global_step": 504553, "epoch": 6078} {"train_loss": -27.382022857666016, "global_step": 504554, "epoch": 6078} {"train_loss": -27.276147842407227, "global_step": 504555, "epoch": 6078} {"train_loss": -27.22711082826178, "global_step": 504556, "epoch": 6078, "val_loss": 6463585.5} {"train_loss": -23.935056686401367, "global_step": 504557, "epoch": 6079} {"train_loss": -23.558935165405273, "global_step": 504558, "epoch": 6079} {"train_loss": -25.155317306518555, "global_step": 504559, "epoch": 6079} {"train_loss": -24.43379020690918, "global_step": 504560, "epoch": 6079} {"train_loss": -25.07111930847168, "global_step": 504561, "epoch": 6079} {"train_loss": -24.87244987487793, "global_step": 504562, "epoch": 6079} {"train_loss": -25.518524169921875, "global_step": 504563, "epoch": 6079} {"train_loss": -26.1696720123291, "global_step": 504564, "epoch": 6079} {"train_loss": -26.29668617248535, "global_step": 504565, "epoch": 6079} {"train_loss": -26.377185821533203, "global_step": 504566, "epoch": 6079} {"train_loss": -26.1654109954834, "global_step": 504567, "epoch": 6079} {"train_loss": -26.533950805664062, "global_step": 504568, "epoch": 6079} {"train_loss": -25.994617462158203, "global_step": 504569, "epoch": 6079} {"train_loss": -26.27788734436035, "global_step": 504570, "epoch": 6079} {"train_loss": -26.16741371154785, "global_step": 504571, "epoch": 6079} {"train_loss": -26.423694610595703, "global_step": 504572, "epoch": 6079} {"train_loss": -26.347625732421875, "global_step": 504573, "epoch": 6079} {"train_loss": -26.31390953063965, "global_step": 504574, "epoch": 6079} {"train_loss": -26.3078670501709, "global_step": 504575, "epoch": 6079} {"train_loss": -26.725147247314453, "global_step": 504576, "epoch": 6079} {"train_loss": -26.68391990661621, "global_step": 504577, "epoch": 6079} {"train_loss": -26.41277503967285, "global_step": 504578, "epoch": 6079} {"train_loss": -26.933841705322266, "global_step": 504579, "epoch": 6079} {"train_loss": -26.71953773498535, "global_step": 504580, "epoch": 6079} {"train_loss": -26.5856876373291, "global_step": 504581, "epoch": 6079} {"train_loss": -26.433765411376953, "global_step": 504582, "epoch": 6079} {"train_loss": -26.805753707885742, "global_step": 504583, "epoch": 6079} {"train_loss": -26.79132080078125, "global_step": 504584, "epoch": 6079} {"train_loss": -26.84761619567871, "global_step": 504585, "epoch": 6079} {"train_loss": -26.972305297851562, "global_step": 504586, "epoch": 6079} {"train_loss": -26.718219757080078, "global_step": 504587, "epoch": 6079} {"train_loss": -27.099979400634766, "global_step": 504588, "epoch": 6079} {"train_loss": -26.9386043548584, "global_step": 504589, "epoch": 6079} {"train_loss": -26.917236328125, "global_step": 504590, "epoch": 6079} {"train_loss": -27.13270378112793, "global_step": 504591, "epoch": 6079} {"train_loss": -27.241132736206055, "global_step": 504592, "epoch": 6079} {"train_loss": -26.954452514648438, "global_step": 504593, "epoch": 6079} {"train_loss": -27.059782028198242, "global_step": 504594, "epoch": 6079} {"train_loss": -27.398029327392578, "global_step": 504595, "epoch": 6079} {"train_loss": -27.418750762939453, "global_step": 504596, "epoch": 6079} {"train_loss": -27.246122360229492, "global_step": 504597, "epoch": 6079} {"train_loss": -27.230436325073242, "global_step": 504598, "epoch": 6079} {"train_loss": -27.511098861694336, "global_step": 504599, "epoch": 6079} {"train_loss": -27.58843421936035, "global_step": 504600, "epoch": 6079} {"train_loss": -27.39727783203125, "global_step": 504601, "epoch": 6079} {"train_loss": -27.4210205078125, "global_step": 504602, "epoch": 6079} {"train_loss": -27.478254318237305, "global_step": 504603, "epoch": 6079} {"train_loss": -27.36919593811035, "global_step": 504604, "epoch": 6079} {"train_loss": -27.190221786499023, "global_step": 504605, "epoch": 6079} {"train_loss": -27.35271644592285, "global_step": 504606, "epoch": 6079} {"train_loss": -27.396223068237305, "global_step": 504607, "epoch": 6079} {"train_loss": -27.497732162475586, "global_step": 504608, "epoch": 6079} {"train_loss": -27.2897891998291, "global_step": 504609, "epoch": 6079} {"train_loss": -27.311853408813477, "global_step": 504610, "epoch": 6079} {"train_loss": -27.183271408081055, "global_step": 504611, "epoch": 6079} {"train_loss": -27.652454376220703, "global_step": 504612, "epoch": 6079} {"train_loss": -27.439111709594727, "global_step": 504613, "epoch": 6079} {"train_loss": -27.664575576782227, "global_step": 504614, "epoch": 6079} {"train_loss": -27.663665771484375, "global_step": 504615, "epoch": 6079} {"train_loss": -27.496301651000977, "global_step": 504616, "epoch": 6079} {"train_loss": -27.188390731811523, "global_step": 504617, "epoch": 6079} {"train_loss": -27.644765853881836, "global_step": 504618, "epoch": 6079} {"train_loss": -27.542743682861328, "global_step": 504619, "epoch": 6079} {"train_loss": -27.56743812561035, "global_step": 504620, "epoch": 6079} {"train_loss": -27.698408126831055, "global_step": 504621, "epoch": 6079} {"train_loss": -27.30586051940918, "global_step": 504622, "epoch": 6079} {"train_loss": -27.4316463470459, "global_step": 504623, "epoch": 6079} {"train_loss": -27.4261531829834, "global_step": 504624, "epoch": 6079} {"train_loss": -27.618555068969727, "global_step": 504625, "epoch": 6079} {"train_loss": -27.30824089050293, "global_step": 504626, "epoch": 6079} {"train_loss": -27.53980827331543, "global_step": 504627, "epoch": 6079} {"train_loss": -27.839813232421875, "global_step": 504628, "epoch": 6079} {"train_loss": -27.73406410217285, "global_step": 504629, "epoch": 6079} {"train_loss": -27.620899200439453, "global_step": 504630, "epoch": 6079} {"train_loss": -27.498693466186523, "global_step": 504631, "epoch": 6079} {"train_loss": -27.862634658813477, "global_step": 504632, "epoch": 6079} {"train_loss": -27.679275512695312, "global_step": 504633, "epoch": 6079} {"train_loss": -27.821741104125977, "global_step": 504634, "epoch": 6079} {"train_loss": -27.995086669921875, "global_step": 504635, "epoch": 6079} {"train_loss": -27.640783309936523, "global_step": 504636, "epoch": 6079} {"train_loss": -27.761444091796875, "global_step": 504637, "epoch": 6079} {"train_loss": -28.016132354736328, "global_step": 504638, "epoch": 6079} {"train_loss": -26.947056161351952, "global_step": 504639, "epoch": 6079, "val_loss": 6482127.5} {"train_loss": -27.0513973236084, "global_step": 504640, "epoch": 6080} {"train_loss": -26.630834579467773, "global_step": 504641, "epoch": 6080} {"train_loss": -26.71038818359375, "global_step": 504642, "epoch": 6080} {"train_loss": -26.415266036987305, "global_step": 504643, "epoch": 6080} {"train_loss": -26.97637939453125, "global_step": 504644, "epoch": 6080} {"train_loss": -26.869892120361328, "global_step": 504645, "epoch": 6080} {"train_loss": -27.00412368774414, "global_step": 504646, "epoch": 6080} {"train_loss": -26.456451416015625, "global_step": 504647, "epoch": 6080} {"train_loss": -27.101160049438477, "global_step": 504648, "epoch": 6080} {"train_loss": -26.842803955078125, "global_step": 504649, "epoch": 6080} {"train_loss": -26.6491756439209, "global_step": 504650, "epoch": 6080} {"train_loss": -27.492834091186523, "global_step": 504651, "epoch": 6080} {"train_loss": -26.91371726989746, "global_step": 504652, "epoch": 6080} {"train_loss": -27.483312606811523, "global_step": 504653, "epoch": 6080} {"train_loss": -26.928146362304688, "global_step": 504654, "epoch": 6080} {"train_loss": -27.053791046142578, "global_step": 504655, "epoch": 6080} {"train_loss": -26.928213119506836, "global_step": 504656, "epoch": 6080} {"train_loss": -27.308027267456055, "global_step": 504657, "epoch": 6080} {"train_loss": -27.299396514892578, "global_step": 504658, "epoch": 6080} {"train_loss": -27.125579833984375, "global_step": 504659, "epoch": 6080} {"train_loss": -27.164051055908203, "global_step": 504660, "epoch": 6080} {"train_loss": -27.115034103393555, "global_step": 504661, "epoch": 6080} {"train_loss": -27.3924560546875, "global_step": 504662, "epoch": 6080} {"train_loss": -27.412967681884766, "global_step": 504663, "epoch": 6080} {"train_loss": -27.423063278198242, "global_step": 504664, "epoch": 6080} {"train_loss": -27.41578483581543, "global_step": 504665, "epoch": 6080} {"train_loss": -27.1754150390625, "global_step": 504666, "epoch": 6080} {"train_loss": -27.490278244018555, "global_step": 504667, "epoch": 6080} {"train_loss": -27.692655563354492, "global_step": 504668, "epoch": 6080} {"train_loss": -27.63966178894043, "global_step": 504669, "epoch": 6080} {"train_loss": -27.16206932067871, "global_step": 504670, "epoch": 6080} {"train_loss": -27.287378311157227, "global_step": 504671, "epoch": 6080} {"train_loss": -27.531660079956055, "global_step": 504672, "epoch": 6080} {"train_loss": -27.356128692626953, "global_step": 504673, "epoch": 6080} {"train_loss": -27.733678817749023, "global_step": 504674, "epoch": 6080} {"train_loss": -27.557519912719727, "global_step": 504675, "epoch": 6080} {"train_loss": -27.917722702026367, "global_step": 504676, "epoch": 6080} {"train_loss": -27.38578224182129, "global_step": 504677, "epoch": 6080} {"train_loss": -27.584991455078125, "global_step": 504678, "epoch": 6080} {"train_loss": -27.487104415893555, "global_step": 504679, "epoch": 6080} {"train_loss": -27.84808349609375, "global_step": 504680, "epoch": 6080} {"train_loss": -27.599958419799805, "global_step": 504681, "epoch": 6080} {"train_loss": -27.74078941345215, "global_step": 504682, "epoch": 6080} {"train_loss": -27.54207420349121, "global_step": 504683, "epoch": 6080} {"train_loss": -27.4176025390625, "global_step": 504684, "epoch": 6080} {"train_loss": -27.6393985748291, "global_step": 504685, "epoch": 6080} {"train_loss": -27.968276977539062, "global_step": 504686, "epoch": 6080} {"train_loss": -27.817153930664062, "global_step": 504687, "epoch": 6080} {"train_loss": -27.74346351623535, "global_step": 504688, "epoch": 6080} {"train_loss": -27.200021743774414, "global_step": 504689, "epoch": 6080} {"train_loss": -27.152734756469727, "global_step": 504690, "epoch": 6080} {"train_loss": -27.49226188659668, "global_step": 504691, "epoch": 6080} {"train_loss": -27.5349063873291, "global_step": 504692, "epoch": 6080} {"train_loss": -27.78095054626465, "global_step": 504693, "epoch": 6080} {"train_loss": -27.71392250061035, "global_step": 504694, "epoch": 6080} {"train_loss": -27.479658126831055, "global_step": 504695, "epoch": 6080} {"train_loss": -27.527297973632812, "global_step": 504696, "epoch": 6080} {"train_loss": -27.620304107666016, "global_step": 504697, "epoch": 6080} {"train_loss": -27.5849552154541, "global_step": 504698, "epoch": 6080} {"train_loss": -27.60662841796875, "global_step": 504699, "epoch": 6080} {"train_loss": -27.392288208007812, "global_step": 504700, "epoch": 6080} {"train_loss": -27.608686447143555, "global_step": 504701, "epoch": 6080} {"train_loss": -27.788623809814453, "global_step": 504702, "epoch": 6080} {"train_loss": -27.532201766967773, "global_step": 504703, "epoch": 6080} {"train_loss": -27.239599227905273, "global_step": 504704, "epoch": 6080} {"train_loss": -27.5860595703125, "global_step": 504705, "epoch": 6080} {"train_loss": -27.571292877197266, "global_step": 504706, "epoch": 6080} {"train_loss": -27.3830623626709, "global_step": 504707, "epoch": 6080} {"train_loss": -27.274988174438477, "global_step": 504708, "epoch": 6080} {"train_loss": -26.747024536132812, "global_step": 504709, "epoch": 6080} {"train_loss": -26.49378776550293, "global_step": 504710, "epoch": 6080} {"train_loss": -27.036558151245117, "global_step": 504711, "epoch": 6080} {"train_loss": -27.264404296875, "global_step": 504712, "epoch": 6080} {"train_loss": -27.611379623413086, "global_step": 504713, "epoch": 6080} {"train_loss": -27.077024459838867, "global_step": 504714, "epoch": 6080} {"train_loss": -27.76740837097168, "global_step": 504715, "epoch": 6080} {"train_loss": -27.2269287109375, "global_step": 504716, "epoch": 6080} {"train_loss": -27.145343780517578, "global_step": 504717, "epoch": 6080} {"train_loss": -27.377477645874023, "global_step": 504718, "epoch": 6080} {"train_loss": -26.699853897094727, "global_step": 504719, "epoch": 6080} {"train_loss": -26.772565841674805, "global_step": 504720, "epoch": 6080} {"train_loss": -26.6856632232666, "global_step": 504721, "epoch": 6080} {"train_loss": -27.30516213106822, "global_step": 504722, "epoch": 6080, "val_loss": 6459172.5} {"train_loss": -24.219884872436523, "global_step": 504723, "epoch": 6081} {"train_loss": -24.888906478881836, "global_step": 504724, "epoch": 6081} {"train_loss": -25.836029052734375, "global_step": 504725, "epoch": 6081} {"train_loss": -24.943531036376953, "global_step": 504726, "epoch": 6081} {"train_loss": -24.976043701171875, "global_step": 504727, "epoch": 6081} {"train_loss": -25.28901481628418, "global_step": 504728, "epoch": 6081} {"train_loss": -25.938892364501953, "global_step": 504729, "epoch": 6081} {"train_loss": -25.662811279296875, "global_step": 504730, "epoch": 6081} {"train_loss": -26.125659942626953, "global_step": 504731, "epoch": 6081} {"train_loss": -25.760251998901367, "global_step": 504732, "epoch": 6081} {"train_loss": -25.907743453979492, "global_step": 504733, "epoch": 6081} {"train_loss": -26.497465133666992, "global_step": 504734, "epoch": 6081} {"train_loss": -25.478317260742188, "global_step": 504735, "epoch": 6081} {"train_loss": -26.56199073791504, "global_step": 504736, "epoch": 6081} {"train_loss": -26.256683349609375, "global_step": 504737, "epoch": 6081} {"train_loss": -26.27937126159668, "global_step": 504738, "epoch": 6081} {"train_loss": -26.383527755737305, "global_step": 504739, "epoch": 6081} {"train_loss": -26.585248947143555, "global_step": 504740, "epoch": 6081} {"train_loss": -26.271259307861328, "global_step": 504741, "epoch": 6081} {"train_loss": -26.5349063873291, "global_step": 504742, "epoch": 6081} {"train_loss": -26.496912002563477, "global_step": 504743, "epoch": 6081} {"train_loss": -26.42937660217285, "global_step": 504744, "epoch": 6081} {"train_loss": -26.836362838745117, "global_step": 504745, "epoch": 6081} {"train_loss": -26.677661895751953, "global_step": 504746, "epoch": 6081} {"train_loss": -26.60202407836914, "global_step": 504747, "epoch": 6081} {"train_loss": -26.805206298828125, "global_step": 504748, "epoch": 6081} {"train_loss": -27.257278442382812, "global_step": 504749, "epoch": 6081} {"train_loss": -26.78264808654785, "global_step": 504750, "epoch": 6081} {"train_loss": -27.075763702392578, "global_step": 504751, "epoch": 6081} {"train_loss": -26.947179794311523, "global_step": 504752, "epoch": 6081} {"train_loss": -27.037139892578125, "global_step": 504753, "epoch": 6081} {"train_loss": -27.067590713500977, "global_step": 504754, "epoch": 6081} {"train_loss": -26.957889556884766, "global_step": 504755, "epoch": 6081} {"train_loss": -26.83407974243164, "global_step": 504756, "epoch": 6081} {"train_loss": -27.090225219726562, "global_step": 504757, "epoch": 6081} {"train_loss": -27.139575958251953, "global_step": 504758, "epoch": 6081} {"train_loss": -27.125036239624023, "global_step": 504759, "epoch": 6081} {"train_loss": -27.237979888916016, "global_step": 504760, "epoch": 6081} {"train_loss": -27.291555404663086, "global_step": 504761, "epoch": 6081} {"train_loss": -27.26661491394043, "global_step": 504762, "epoch": 6081} {"train_loss": -27.447519302368164, "global_step": 504763, "epoch": 6081} {"train_loss": -26.88250160217285, "global_step": 504764, "epoch": 6081} {"train_loss": -27.3248233795166, "global_step": 504765, "epoch": 6081} {"train_loss": -27.312728881835938, "global_step": 504766, "epoch": 6081} {"train_loss": -27.435571670532227, "global_step": 504767, "epoch": 6081} {"train_loss": -27.375080108642578, "global_step": 504768, "epoch": 6081} {"train_loss": -27.218358993530273, "global_step": 504769, "epoch": 6081} {"train_loss": -27.178665161132812, "global_step": 504770, "epoch": 6081} {"train_loss": -27.143400192260742, "global_step": 504771, "epoch": 6081} {"train_loss": -27.218305587768555, "global_step": 504772, "epoch": 6081} {"train_loss": -27.5717716217041, "global_step": 504773, "epoch": 6081} {"train_loss": -27.517663955688477, "global_step": 504774, "epoch": 6081} {"train_loss": -27.261096954345703, "global_step": 504775, "epoch": 6081} {"train_loss": -27.6195125579834, "global_step": 504776, "epoch": 6081} {"train_loss": -27.528472900390625, "global_step": 504777, "epoch": 6081} {"train_loss": -27.6189022064209, "global_step": 504778, "epoch": 6081} {"train_loss": -27.7810115814209, "global_step": 504779, "epoch": 6081} {"train_loss": -27.564306259155273, "global_step": 504780, "epoch": 6081} {"train_loss": -27.242475509643555, "global_step": 504781, "epoch": 6081} {"train_loss": -27.49505615234375, "global_step": 504782, "epoch": 6081} {"train_loss": -27.4906005859375, "global_step": 504783, "epoch": 6081} {"train_loss": -27.329425811767578, "global_step": 504784, "epoch": 6081} {"train_loss": -27.761505126953125, "global_step": 504785, "epoch": 6081} {"train_loss": -27.598281860351562, "global_step": 504786, "epoch": 6081} {"train_loss": -27.24342155456543, "global_step": 504787, "epoch": 6081} {"train_loss": -27.437366485595703, "global_step": 504788, "epoch": 6081} {"train_loss": -27.7154541015625, "global_step": 504789, "epoch": 6081} {"train_loss": -27.580657958984375, "global_step": 504790, "epoch": 6081} {"train_loss": -27.64578628540039, "global_step": 504791, "epoch": 6081} {"train_loss": -28.14776039123535, "global_step": 504792, "epoch": 6081} {"train_loss": -27.71246337890625, "global_step": 504793, "epoch": 6081} {"train_loss": -26.990222930908203, "global_step": 504794, "epoch": 6081} {"train_loss": -26.920286178588867, "global_step": 504795, "epoch": 6081} {"train_loss": -27.010480880737305, "global_step": 504796, "epoch": 6081} {"train_loss": -27.116376876831055, "global_step": 504797, "epoch": 6081} {"train_loss": -27.024311065673828, "global_step": 504798, "epoch": 6081} {"train_loss": -27.3834228515625, "global_step": 504799, "epoch": 6081} {"train_loss": -26.87883949279785, "global_step": 504800, "epoch": 6081} {"train_loss": -27.334136962890625, "global_step": 504801, "epoch": 6081} {"train_loss": -27.39166259765625, "global_step": 504802, "epoch": 6081} {"train_loss": -27.229766845703125, "global_step": 504803, "epoch": 6081} {"train_loss": -27.160633087158203, "global_step": 504804, "epoch": 6081} {"train_loss": -26.88163775708302, "global_step": 504805, "epoch": 6081, "val_loss": 6534168.0} {"train_loss": -26.14857292175293, "global_step": 504806, "epoch": 6082} {"train_loss": -25.9976749420166, "global_step": 504807, "epoch": 6082} {"train_loss": -26.738752365112305, "global_step": 504808, "epoch": 6082} {"train_loss": -26.193241119384766, "global_step": 504809, "epoch": 6082} {"train_loss": -26.819488525390625, "global_step": 504810, "epoch": 6082} {"train_loss": -25.99627685546875, "global_step": 504811, "epoch": 6082} {"train_loss": -26.38675880432129, "global_step": 504812, "epoch": 6082} {"train_loss": -26.748382568359375, "global_step": 504813, "epoch": 6082} {"train_loss": -26.4731502532959, "global_step": 504814, "epoch": 6082} {"train_loss": -26.937143325805664, "global_step": 504815, "epoch": 6082} {"train_loss": -26.819318771362305, "global_step": 504816, "epoch": 6082} {"train_loss": -27.0159854888916, "global_step": 504817, "epoch": 6082} {"train_loss": -26.966876983642578, "global_step": 504818, "epoch": 6082} {"train_loss": -26.919391632080078, "global_step": 504819, "epoch": 6082} {"train_loss": -27.354394912719727, "global_step": 504820, "epoch": 6082} {"train_loss": -27.150745391845703, "global_step": 504821, "epoch": 6082} {"train_loss": -26.618497848510742, "global_step": 504822, "epoch": 6082} {"train_loss": -27.57221794128418, "global_step": 504823, "epoch": 6082} {"train_loss": -27.211002349853516, "global_step": 504824, "epoch": 6082} {"train_loss": -27.0136661529541, "global_step": 504825, "epoch": 6082} {"train_loss": -27.0533447265625, "global_step": 504826, "epoch": 6082} {"train_loss": -27.131620407104492, "global_step": 504827, "epoch": 6082} {"train_loss": -27.252241134643555, "global_step": 504828, "epoch": 6082} {"train_loss": -27.437788009643555, "global_step": 504829, "epoch": 6082} {"train_loss": -27.119855880737305, "global_step": 504830, "epoch": 6082} {"train_loss": -27.411239624023438, "global_step": 504831, "epoch": 6082} {"train_loss": -27.250701904296875, "global_step": 504832, "epoch": 6082} {"train_loss": -27.446081161499023, "global_step": 504833, "epoch": 6082} {"train_loss": -27.066852569580078, "global_step": 504834, "epoch": 6082} {"train_loss": -27.5466365814209, "global_step": 504835, "epoch": 6082} {"train_loss": -27.596464157104492, "global_step": 504836, "epoch": 6082} {"train_loss": -27.592687606811523, "global_step": 504837, "epoch": 6082} {"train_loss": -27.405094146728516, "global_step": 504838, "epoch": 6082} {"train_loss": -27.60813331604004, "global_step": 504839, "epoch": 6082} {"train_loss": -27.312204360961914, "global_step": 504840, "epoch": 6082} {"train_loss": -27.34978675842285, "global_step": 504841, "epoch": 6082} {"train_loss": -27.54768180847168, "global_step": 504842, "epoch": 6082} {"train_loss": -27.535675048828125, "global_step": 504843, "epoch": 6082} {"train_loss": -27.687244415283203, "global_step": 504844, "epoch": 6082} {"train_loss": -27.753189086914062, "global_step": 504845, "epoch": 6082} {"train_loss": -27.5944881439209, "global_step": 504846, "epoch": 6082} {"train_loss": -27.27357292175293, "global_step": 504847, "epoch": 6082} {"train_loss": -27.29792594909668, "global_step": 504848, "epoch": 6082} {"train_loss": -27.72064208984375, "global_step": 504849, "epoch": 6082} {"train_loss": -27.618743896484375, "global_step": 504850, "epoch": 6082} {"train_loss": -27.53553581237793, "global_step": 504851, "epoch": 6082} {"train_loss": -27.589460372924805, "global_step": 504852, "epoch": 6082} {"train_loss": -27.243942260742188, "global_step": 504853, "epoch": 6082} {"train_loss": -27.817739486694336, "global_step": 504854, "epoch": 6082} {"train_loss": -27.40122413635254, "global_step": 504855, "epoch": 6082} {"train_loss": -27.51163101196289, "global_step": 504856, "epoch": 6082} {"train_loss": -27.695276260375977, "global_step": 504857, "epoch": 6082} {"train_loss": -27.880615234375, "global_step": 504858, "epoch": 6082} {"train_loss": -27.59174156188965, "global_step": 504859, "epoch": 6082} {"train_loss": -27.608083724975586, "global_step": 504860, "epoch": 6082} {"train_loss": -27.467731475830078, "global_step": 504861, "epoch": 6082} {"train_loss": -26.983047485351562, "global_step": 504862, "epoch": 6082} {"train_loss": -26.46320152282715, "global_step": 504863, "epoch": 6082} {"train_loss": -26.31537437438965, "global_step": 504864, "epoch": 6082} {"train_loss": -27.14167594909668, "global_step": 504865, "epoch": 6082} {"train_loss": -27.407413482666016, "global_step": 504866, "epoch": 6082} {"train_loss": -27.609058380126953, "global_step": 504867, "epoch": 6082} {"train_loss": -27.406925201416016, "global_step": 504868, "epoch": 6082} {"train_loss": -27.321386337280273, "global_step": 504869, "epoch": 6082} {"train_loss": -27.15168571472168, "global_step": 504870, "epoch": 6082} {"train_loss": -27.074878692626953, "global_step": 504871, "epoch": 6082} {"train_loss": -27.578094482421875, "global_step": 504872, "epoch": 6082} {"train_loss": -27.478321075439453, "global_step": 504873, "epoch": 6082} {"train_loss": -26.931737899780273, "global_step": 504874, "epoch": 6082} {"train_loss": -27.112598419189453, "global_step": 504875, "epoch": 6082} {"train_loss": -27.37060546875, "global_step": 504876, "epoch": 6082} {"train_loss": -27.447219848632812, "global_step": 504877, "epoch": 6082} {"train_loss": -27.229536056518555, "global_step": 504878, "epoch": 6082} {"train_loss": -27.298063278198242, "global_step": 504879, "epoch": 6082} {"train_loss": -27.216049194335938, "global_step": 504880, "epoch": 6082} {"train_loss": -27.60104751586914, "global_step": 504881, "epoch": 6082} {"train_loss": -27.397802352905273, "global_step": 504882, "epoch": 6082} {"train_loss": -27.331979751586914, "global_step": 504883, "epoch": 6082} {"train_loss": -27.564809799194336, "global_step": 504884, "epoch": 6082} {"train_loss": -27.330366134643555, "global_step": 504885, "epoch": 6082} {"train_loss": -27.6499080657959, "global_step": 504886, "epoch": 6082} {"train_loss": -27.231521606445312, "global_step": 504887, "epoch": 6082} {"train_loss": -27.226120684520307, "global_step": 504888, "epoch": 6082, "val_loss": 6663036.0} {"train_loss": -27.378646850585938, "global_step": 504889, "epoch": 6083} {"train_loss": -26.9790096282959, "global_step": 504890, "epoch": 6083} {"train_loss": -26.959339141845703, "global_step": 504891, "epoch": 6083} {"train_loss": -27.1749267578125, "global_step": 504892, "epoch": 6083} {"train_loss": -27.220184326171875, "global_step": 504893, "epoch": 6083} {"train_loss": -27.058704376220703, "global_step": 504894, "epoch": 6083} {"train_loss": -27.19745445251465, "global_step": 504895, "epoch": 6083} {"train_loss": -27.404890060424805, "global_step": 504896, "epoch": 6083} {"train_loss": -27.321271896362305, "global_step": 504897, "epoch": 6083} {"train_loss": -27.096302032470703, "global_step": 504898, "epoch": 6083} {"train_loss": -27.23744010925293, "global_step": 504899, "epoch": 6083} {"train_loss": -27.193876266479492, "global_step": 504900, "epoch": 6083} {"train_loss": -27.11604118347168, "global_step": 504901, "epoch": 6083} {"train_loss": -27.11345863342285, "global_step": 504902, "epoch": 6083} {"train_loss": -27.343170166015625, "global_step": 504903, "epoch": 6083} {"train_loss": -27.183298110961914, "global_step": 504904, "epoch": 6083} {"train_loss": -27.468902587890625, "global_step": 504905, "epoch": 6083} {"train_loss": -27.39117431640625, "global_step": 504906, "epoch": 6083} {"train_loss": -27.310199737548828, "global_step": 504907, "epoch": 6083} {"train_loss": -27.581207275390625, "global_step": 504908, "epoch": 6083} {"train_loss": -27.434890747070312, "global_step": 504909, "epoch": 6083} {"train_loss": -27.553674697875977, "global_step": 504910, "epoch": 6083} {"train_loss": -27.622655868530273, "global_step": 504911, "epoch": 6083} {"train_loss": -27.194787979125977, "global_step": 504912, "epoch": 6083} {"train_loss": -27.70819664001465, "global_step": 504913, "epoch": 6083} {"train_loss": -27.603879928588867, "global_step": 504914, "epoch": 6083} {"train_loss": -27.449209213256836, "global_step": 504915, "epoch": 6083} {"train_loss": -27.372329711914062, "global_step": 504916, "epoch": 6083} {"train_loss": -27.163251876831055, "global_step": 504917, "epoch": 6083} {"train_loss": -28.064762115478516, "global_step": 504918, "epoch": 6083} {"train_loss": -27.40248680114746, "global_step": 504919, "epoch": 6083} {"train_loss": -27.50274085998535, "global_step": 504920, "epoch": 6083} {"train_loss": -27.633581161499023, "global_step": 504921, "epoch": 6083} {"train_loss": -27.34200096130371, "global_step": 504922, "epoch": 6083} {"train_loss": -27.31438636779785, "global_step": 504923, "epoch": 6083} {"train_loss": -27.940561294555664, "global_step": 504924, "epoch": 6083} {"train_loss": -27.402414321899414, "global_step": 504925, "epoch": 6083} {"train_loss": -27.882373809814453, "global_step": 504926, "epoch": 6083} {"train_loss": -27.593061447143555, "global_step": 504927, "epoch": 6083} {"train_loss": -27.711362838745117, "global_step": 504928, "epoch": 6083} {"train_loss": -27.4432373046875, "global_step": 504929, "epoch": 6083} {"train_loss": -27.561527252197266, "global_step": 504930, "epoch": 6083} {"train_loss": -27.809751510620117, "global_step": 504931, "epoch": 6083} {"train_loss": -27.771352767944336, "global_step": 504932, "epoch": 6083} {"train_loss": -27.80824851989746, "global_step": 504933, "epoch": 6083} {"train_loss": -27.654203414916992, "global_step": 504934, "epoch": 6083} {"train_loss": -27.5700626373291, "global_step": 504935, "epoch": 6083} {"train_loss": -27.51422119140625, "global_step": 504936, "epoch": 6083} {"train_loss": -27.381988525390625, "global_step": 504937, "epoch": 6083} {"train_loss": -27.23906898498535, "global_step": 504938, "epoch": 6083} {"train_loss": -27.312271118164062, "global_step": 504939, "epoch": 6083} {"train_loss": -27.248519897460938, "global_step": 504940, "epoch": 6083} {"train_loss": -27.34320640563965, "global_step": 504941, "epoch": 6083} {"train_loss": -27.09745216369629, "global_step": 504942, "epoch": 6083} {"train_loss": -27.032245635986328, "global_step": 504943, "epoch": 6083} {"train_loss": -26.199106216430664, "global_step": 504944, "epoch": 6083} {"train_loss": -26.106937408447266, "global_step": 504945, "epoch": 6083} {"train_loss": -27.00272560119629, "global_step": 504946, "epoch": 6083} {"train_loss": -26.9759521484375, "global_step": 504947, "epoch": 6083} {"train_loss": -26.513330459594727, "global_step": 504948, "epoch": 6083} {"train_loss": -25.65839958190918, "global_step": 504949, "epoch": 6083} {"train_loss": -26.804489135742188, "global_step": 504950, "epoch": 6083} {"train_loss": -27.003671646118164, "global_step": 504951, "epoch": 6083} {"train_loss": -26.105518341064453, "global_step": 504952, "epoch": 6083} {"train_loss": -26.81031608581543, "global_step": 504953, "epoch": 6083} {"train_loss": -27.19844627380371, "global_step": 504954, "epoch": 6083} {"train_loss": -27.613325119018555, "global_step": 504955, "epoch": 6083} {"train_loss": -27.00849723815918, "global_step": 504956, "epoch": 6083} {"train_loss": -27.10663414001465, "global_step": 504957, "epoch": 6083} {"train_loss": -27.21728515625, "global_step": 504958, "epoch": 6083} {"train_loss": -26.624181747436523, "global_step": 504959, "epoch": 6083} {"train_loss": -26.959247589111328, "global_step": 504960, "epoch": 6083} {"train_loss": -27.21915626525879, "global_step": 504961, "epoch": 6083} {"train_loss": -27.425048828125, "global_step": 504962, "epoch": 6083} {"train_loss": -27.181854248046875, "global_step": 504963, "epoch": 6083} {"train_loss": -27.054296493530273, "global_step": 504964, "epoch": 6083} {"train_loss": -27.258222579956055, "global_step": 504965, "epoch": 6083} {"train_loss": -27.138751983642578, "global_step": 504966, "epoch": 6083} {"train_loss": -27.207727432250977, "global_step": 504967, "epoch": 6083} {"train_loss": -27.2307186126709, "global_step": 504968, "epoch": 6083} {"train_loss": -27.675216674804688, "global_step": 504969, "epoch": 6083} {"train_loss": -27.172338485717773, "global_step": 504970, "epoch": 6083} {"train_loss": -27.246128220156013, "global_step": 504971, "epoch": 6083, "val_loss": 6549234.0} {"train_loss": -26.32789421081543, "global_step": 504972, "epoch": 6084} {"train_loss": -26.665857315063477, "global_step": 504973, "epoch": 6084} {"train_loss": -26.714923858642578, "global_step": 504974, "epoch": 6084} {"train_loss": -26.703954696655273, "global_step": 504975, "epoch": 6084} {"train_loss": -26.594009399414062, "global_step": 504976, "epoch": 6084} {"train_loss": -26.940229415893555, "global_step": 504977, "epoch": 6084} {"train_loss": -26.548688888549805, "global_step": 504978, "epoch": 6084} {"train_loss": -26.704126358032227, "global_step": 504979, "epoch": 6084} {"train_loss": -26.576858520507812, "global_step": 504980, "epoch": 6084} {"train_loss": -26.592395782470703, "global_step": 504981, "epoch": 6084} {"train_loss": -27.0970516204834, "global_step": 504982, "epoch": 6084} {"train_loss": -26.751392364501953, "global_step": 504983, "epoch": 6084} {"train_loss": -27.29522705078125, "global_step": 504984, "epoch": 6084} {"train_loss": -27.444059371948242, "global_step": 504985, "epoch": 6084} {"train_loss": -26.813800811767578, "global_step": 504986, "epoch": 6084} {"train_loss": -27.45529556274414, "global_step": 504987, "epoch": 6084} {"train_loss": -27.145334243774414, "global_step": 504988, "epoch": 6084} {"train_loss": -27.09198570251465, "global_step": 504989, "epoch": 6084} {"train_loss": -27.35371971130371, "global_step": 504990, "epoch": 6084} {"train_loss": -27.265151977539062, "global_step": 504991, "epoch": 6084} {"train_loss": -27.522876739501953, "global_step": 504992, "epoch": 6084} {"train_loss": -27.2055606842041, "global_step": 504993, "epoch": 6084} {"train_loss": -27.2540225982666, "global_step": 504994, "epoch": 6084} {"train_loss": -27.337350845336914, "global_step": 504995, "epoch": 6084} {"train_loss": -27.54860496520996, "global_step": 504996, "epoch": 6084} {"train_loss": -27.235931396484375, "global_step": 504997, "epoch": 6084} {"train_loss": -27.610462188720703, "global_step": 504998, "epoch": 6084} {"train_loss": -27.347288131713867, "global_step": 504999, "epoch": 6084} {"train_loss": -27.41788101196289, "global_step": 505000, "epoch": 6084} {"train_loss": -27.765043258666992, "global_step": 505001, "epoch": 6084} {"train_loss": -27.5318603515625, "global_step": 505002, "epoch": 6084} {"train_loss": -27.368906021118164, "global_step": 505003, "epoch": 6084} {"train_loss": -27.484037399291992, "global_step": 505004, "epoch": 6084} {"train_loss": -27.484390258789062, "global_step": 505005, "epoch": 6084} {"train_loss": -27.802026748657227, "global_step": 505006, "epoch": 6084} {"train_loss": -27.72275161743164, "global_step": 505007, "epoch": 6084} {"train_loss": -27.84564208984375, "global_step": 505008, "epoch": 6084} {"train_loss": -27.513248443603516, "global_step": 505009, "epoch": 6084} {"train_loss": -27.514358520507812, "global_step": 505010, "epoch": 6084} {"train_loss": -27.683765411376953, "global_step": 505011, "epoch": 6084} {"train_loss": -27.516748428344727, "global_step": 505012, "epoch": 6084} {"train_loss": -27.257965087890625, "global_step": 505013, "epoch": 6084} {"train_loss": -27.54844093322754, "global_step": 505014, "epoch": 6084} {"train_loss": -27.603439331054688, "global_step": 505015, "epoch": 6084} {"train_loss": -27.658248901367188, "global_step": 505016, "epoch": 6084} {"train_loss": -27.796497344970703, "global_step": 505017, "epoch": 6084} {"train_loss": -27.221582412719727, "global_step": 505018, "epoch": 6084} {"train_loss": -27.451025009155273, "global_step": 505019, "epoch": 6084} {"train_loss": -27.15447998046875, "global_step": 505020, "epoch": 6084} {"train_loss": -27.54691505432129, "global_step": 505021, "epoch": 6084} {"train_loss": -27.617094039916992, "global_step": 505022, "epoch": 6084} {"train_loss": -27.5179386138916, "global_step": 505023, "epoch": 6084} {"train_loss": -27.46016502380371, "global_step": 505024, "epoch": 6084} {"train_loss": -27.553503036499023, "global_step": 505025, "epoch": 6084} {"train_loss": -27.488554000854492, "global_step": 505026, "epoch": 6084} {"train_loss": -27.537443161010742, "global_step": 505027, "epoch": 6084} {"train_loss": -27.173297882080078, "global_step": 505028, "epoch": 6084} {"train_loss": -27.334674835205078, "global_step": 505029, "epoch": 6084} {"train_loss": -27.132211685180664, "global_step": 505030, "epoch": 6084} {"train_loss": -27.292871475219727, "global_step": 505031, "epoch": 6084} {"train_loss": -27.525068283081055, "global_step": 505032, "epoch": 6084} {"train_loss": -27.767044067382812, "global_step": 505033, "epoch": 6084} {"train_loss": -27.363256454467773, "global_step": 505034, "epoch": 6084} {"train_loss": -27.066186904907227, "global_step": 505035, "epoch": 6084} {"train_loss": -27.031152725219727, "global_step": 505036, "epoch": 6084} {"train_loss": -27.557992935180664, "global_step": 505037, "epoch": 6084} {"train_loss": -27.03437614440918, "global_step": 505038, "epoch": 6084} {"train_loss": -26.775955200195312, "global_step": 505039, "epoch": 6084} {"train_loss": -26.963077545166016, "global_step": 505040, "epoch": 6084} {"train_loss": -27.531339645385742, "global_step": 505041, "epoch": 6084} {"train_loss": -27.474584579467773, "global_step": 505042, "epoch": 6084} {"train_loss": -27.495283126831055, "global_step": 505043, "epoch": 6084} {"train_loss": -27.0618896484375, "global_step": 505044, "epoch": 6084} {"train_loss": -27.5638370513916, "global_step": 505045, "epoch": 6084} {"train_loss": -26.733789443969727, "global_step": 505046, "epoch": 6084} {"train_loss": -27.105924606323242, "global_step": 505047, "epoch": 6084} {"train_loss": -27.241865158081055, "global_step": 505048, "epoch": 6084} {"train_loss": -27.52044105529785, "global_step": 505049, "epoch": 6084} {"train_loss": -27.405643463134766, "global_step": 505050, "epoch": 6084} {"train_loss": -27.43440818786621, "global_step": 505051, "epoch": 6084} {"train_loss": -27.026187896728516, "global_step": 505052, "epoch": 6084} {"train_loss": -27.088476181030273, "global_step": 505053, "epoch": 6084} {"train_loss": -27.27790411983628, "global_step": 505054, "epoch": 6084, "val_loss": 6545927.0} {"train_loss": -26.88014793395996, "global_step": 505055, "epoch": 6085} {"train_loss": -27.405033111572266, "global_step": 505056, "epoch": 6085} {"train_loss": -26.759647369384766, "global_step": 505057, "epoch": 6085} {"train_loss": -27.301443099975586, "global_step": 505058, "epoch": 6085} {"train_loss": -27.02286148071289, "global_step": 505059, "epoch": 6085} {"train_loss": -27.253149032592773, "global_step": 505060, "epoch": 6085} {"train_loss": -26.99519157409668, "global_step": 505061, "epoch": 6085} {"train_loss": -27.46771240234375, "global_step": 505062, "epoch": 6085} {"train_loss": -27.180768966674805, "global_step": 505063, "epoch": 6085} {"train_loss": -27.43927001953125, "global_step": 505064, "epoch": 6085} {"train_loss": -27.254413604736328, "global_step": 505065, "epoch": 6085} {"train_loss": -27.301593780517578, "global_step": 505066, "epoch": 6085} {"train_loss": -27.36042594909668, "global_step": 505067, "epoch": 6085} {"train_loss": -27.38042640686035, "global_step": 505068, "epoch": 6085} {"train_loss": -27.309370040893555, "global_step": 505069, "epoch": 6085} {"train_loss": -27.29389762878418, "global_step": 505070, "epoch": 6085} {"train_loss": -27.187850952148438, "global_step": 505071, "epoch": 6085} {"train_loss": -27.16938591003418, "global_step": 505072, "epoch": 6085} {"train_loss": -27.575910568237305, "global_step": 505073, "epoch": 6085} {"train_loss": -27.155614852905273, "global_step": 505074, "epoch": 6085} {"train_loss": -27.192285537719727, "global_step": 505075, "epoch": 6085} {"train_loss": -27.720834732055664, "global_step": 505076, "epoch": 6085} {"train_loss": -27.834035873413086, "global_step": 505077, "epoch": 6085} {"train_loss": -27.832782745361328, "global_step": 505078, "epoch": 6085} {"train_loss": -27.544836044311523, "global_step": 505079, "epoch": 6085} {"train_loss": -27.68793296813965, "global_step": 505080, "epoch": 6085} {"train_loss": -27.627805709838867, "global_step": 505081, "epoch": 6085} {"train_loss": -26.99458122253418, "global_step": 505082, "epoch": 6085} {"train_loss": -27.2130184173584, "global_step": 505083, "epoch": 6085} {"train_loss": -27.52335548400879, "global_step": 505084, "epoch": 6085} {"train_loss": -27.410200119018555, "global_step": 505085, "epoch": 6085} {"train_loss": -27.359180450439453, "global_step": 505086, "epoch": 6085} {"train_loss": -27.625396728515625, "global_step": 505087, "epoch": 6085} {"train_loss": -27.750757217407227, "global_step": 505088, "epoch": 6085} {"train_loss": -27.392562866210938, "global_step": 505089, "epoch": 6085} {"train_loss": -27.493305206298828, "global_step": 505090, "epoch": 6085} {"train_loss": -27.43914794921875, "global_step": 505091, "epoch": 6085} {"train_loss": -27.073017120361328, "global_step": 505092, "epoch": 6085} {"train_loss": -27.43366813659668, "global_step": 505093, "epoch": 6085} {"train_loss": -27.117517471313477, "global_step": 505094, "epoch": 6085} {"train_loss": -27.247522354125977, "global_step": 505095, "epoch": 6085} {"train_loss": -27.56591796875, "global_step": 505096, "epoch": 6085} {"train_loss": -27.292455673217773, "global_step": 505097, "epoch": 6085} {"train_loss": -27.618680953979492, "global_step": 505098, "epoch": 6085} {"train_loss": -27.590429306030273, "global_step": 505099, "epoch": 6085} {"train_loss": -27.789398193359375, "global_step": 505100, "epoch": 6085} {"train_loss": -27.389877319335938, "global_step": 505101, "epoch": 6085} {"train_loss": -27.464111328125, "global_step": 505102, "epoch": 6085} {"train_loss": -27.452442169189453, "global_step": 505103, "epoch": 6085} {"train_loss": -27.349950790405273, "global_step": 505104, "epoch": 6085} {"train_loss": -27.506473541259766, "global_step": 505105, "epoch": 6085} {"train_loss": -27.578556060791016, "global_step": 505106, "epoch": 6085} {"train_loss": -27.344831466674805, "global_step": 505107, "epoch": 6085} {"train_loss": -27.54498291015625, "global_step": 505108, "epoch": 6085} {"train_loss": -27.315759658813477, "global_step": 505109, "epoch": 6085} {"train_loss": -27.421186447143555, "global_step": 505110, "epoch": 6085} {"train_loss": -27.680587768554688, "global_step": 505111, "epoch": 6085} {"train_loss": -28.004901885986328, "global_step": 505112, "epoch": 6085} {"train_loss": -27.713468551635742, "global_step": 505113, "epoch": 6085} {"train_loss": -27.84185218811035, "global_step": 505114, "epoch": 6085} {"train_loss": -27.93650245666504, "global_step": 505115, "epoch": 6085} {"train_loss": -27.37074089050293, "global_step": 505116, "epoch": 6085} {"train_loss": -27.790515899658203, "global_step": 505117, "epoch": 6085} {"train_loss": -27.88245964050293, "global_step": 505118, "epoch": 6085} {"train_loss": -27.6446590423584, "global_step": 505119, "epoch": 6085} {"train_loss": -27.77345848083496, "global_step": 505120, "epoch": 6085} {"train_loss": -27.686599731445312, "global_step": 505121, "epoch": 6085} {"train_loss": -27.680999755859375, "global_step": 505122, "epoch": 6085} {"train_loss": -27.379718780517578, "global_step": 505123, "epoch": 6085} {"train_loss": -27.464984893798828, "global_step": 505124, "epoch": 6085} {"train_loss": -27.17337417602539, "global_step": 505125, "epoch": 6085} {"train_loss": -27.581567764282227, "global_step": 505126, "epoch": 6085} {"train_loss": -27.350269317626953, "global_step": 505127, "epoch": 6085} {"train_loss": -27.602136611938477, "global_step": 505128, "epoch": 6085} {"train_loss": -27.395538330078125, "global_step": 505129, "epoch": 6085} {"train_loss": -27.756092071533203, "global_step": 505130, "epoch": 6085} {"train_loss": -27.4925537109375, "global_step": 505131, "epoch": 6085} {"train_loss": -27.66463279724121, "global_step": 505132, "epoch": 6085} {"train_loss": -27.587182998657227, "global_step": 505133, "epoch": 6085} {"train_loss": -27.482080459594727, "global_step": 505134, "epoch": 6085} {"train_loss": -27.239362716674805, "global_step": 505135, "epoch": 6085} {"train_loss": -27.357568740844727, "global_step": 505136, "epoch": 6085} {"train_loss": -27.453070652054016, "global_step": 505137, "epoch": 6085, "val_loss": 6503154.0} {"train_loss": -26.168424606323242, "global_step": 505138, "epoch": 6086} {"train_loss": -26.689977645874023, "global_step": 505139, "epoch": 6086} {"train_loss": -26.917875289916992, "global_step": 505140, "epoch": 6086} {"train_loss": -26.016372680664062, "global_step": 505141, "epoch": 6086} {"train_loss": -26.7277774810791, "global_step": 505142, "epoch": 6086} {"train_loss": -26.92716407775879, "global_step": 505143, "epoch": 6086} {"train_loss": -26.412677764892578, "global_step": 505144, "epoch": 6086} {"train_loss": -27.0238037109375, "global_step": 505145, "epoch": 6086} {"train_loss": -26.67120361328125, "global_step": 505146, "epoch": 6086} {"train_loss": -27.05490493774414, "global_step": 505147, "epoch": 6086} {"train_loss": -26.76287269592285, "global_step": 505148, "epoch": 6086} {"train_loss": -27.12411880493164, "global_step": 505149, "epoch": 6086} {"train_loss": -27.274662017822266, "global_step": 505150, "epoch": 6086} {"train_loss": -27.362577438354492, "global_step": 505151, "epoch": 6086} {"train_loss": -27.093219757080078, "global_step": 505152, "epoch": 6086} {"train_loss": -27.215848922729492, "global_step": 505153, "epoch": 6086} {"train_loss": -26.914749145507812, "global_step": 505154, "epoch": 6086} {"train_loss": -27.098621368408203, "global_step": 505155, "epoch": 6086} {"train_loss": -27.3005428314209, "global_step": 505156, "epoch": 6086} {"train_loss": -27.63043785095215, "global_step": 505157, "epoch": 6086} {"train_loss": -27.53675651550293, "global_step": 505158, "epoch": 6086} {"train_loss": -27.270557403564453, "global_step": 505159, "epoch": 6086} {"train_loss": -27.108015060424805, "global_step": 505160, "epoch": 6086} {"train_loss": -27.433013916015625, "global_step": 505161, "epoch": 6086} {"train_loss": -27.523839950561523, "global_step": 505162, "epoch": 6086} {"train_loss": -26.952802658081055, "global_step": 505163, "epoch": 6086} {"train_loss": -27.21868896484375, "global_step": 505164, "epoch": 6086} {"train_loss": -27.414554595947266, "global_step": 505165, "epoch": 6086} {"train_loss": -27.157978057861328, "global_step": 505166, "epoch": 6086} {"train_loss": -27.307050704956055, "global_step": 505167, "epoch": 6086} {"train_loss": -27.24103355407715, "global_step": 505168, "epoch": 6086} {"train_loss": -27.29420280456543, "global_step": 505169, "epoch": 6086} {"train_loss": -27.094709396362305, "global_step": 505170, "epoch": 6086} {"train_loss": -27.161518096923828, "global_step": 505171, "epoch": 6086} {"train_loss": -27.483728408813477, "global_step": 505172, "epoch": 6086} {"train_loss": -27.367252349853516, "global_step": 505173, "epoch": 6086} {"train_loss": -27.832294464111328, "global_step": 505174, "epoch": 6086} {"train_loss": -27.49409294128418, "global_step": 505175, "epoch": 6086} {"train_loss": -27.766508102416992, "global_step": 505176, "epoch": 6086} {"train_loss": -27.72652244567871, "global_step": 505177, "epoch": 6086} {"train_loss": -27.488834381103516, "global_step": 505178, "epoch": 6086} {"train_loss": -27.652734756469727, "global_step": 505179, "epoch": 6086} {"train_loss": -27.61414909362793, "global_step": 505180, "epoch": 6086} {"train_loss": -27.933923721313477, "global_step": 505181, "epoch": 6086} {"train_loss": -27.2381649017334, "global_step": 505182, "epoch": 6086} {"train_loss": -27.329370498657227, "global_step": 505183, "epoch": 6086} {"train_loss": -26.945255279541016, "global_step": 505184, "epoch": 6086} {"train_loss": -27.12690544128418, "global_step": 505185, "epoch": 6086} {"train_loss": -27.35515785217285, "global_step": 505186, "epoch": 6086} {"train_loss": -27.742258071899414, "global_step": 505187, "epoch": 6086} {"train_loss": -27.415197372436523, "global_step": 505188, "epoch": 6086} {"train_loss": -27.27997398376465, "global_step": 505189, "epoch": 6086} {"train_loss": -27.79743003845215, "global_step": 505190, "epoch": 6086} {"train_loss": -27.263776779174805, "global_step": 505191, "epoch": 6086} {"train_loss": -27.2409610748291, "global_step": 505192, "epoch": 6086} {"train_loss": -27.498132705688477, "global_step": 505193, "epoch": 6086} {"train_loss": -27.082422256469727, "global_step": 505194, "epoch": 6086} {"train_loss": -26.941303253173828, "global_step": 505195, "epoch": 6086} {"train_loss": -27.381399154663086, "global_step": 505196, "epoch": 6086} {"train_loss": -26.962263107299805, "global_step": 505197, "epoch": 6086} {"train_loss": -26.786252975463867, "global_step": 505198, "epoch": 6086} {"train_loss": -27.352996826171875, "global_step": 505199, "epoch": 6086} {"train_loss": -27.38345718383789, "global_step": 505200, "epoch": 6086} {"train_loss": -27.5401668548584, "global_step": 505201, "epoch": 6086} {"train_loss": -27.33762550354004, "global_step": 505202, "epoch": 6086} {"train_loss": -27.55401611328125, "global_step": 505203, "epoch": 6086} {"train_loss": -26.8441104888916, "global_step": 505204, "epoch": 6086} {"train_loss": -27.238189697265625, "global_step": 505205, "epoch": 6086} {"train_loss": -27.28717613220215, "global_step": 505206, "epoch": 6086} {"train_loss": -27.717634201049805, "global_step": 505207, "epoch": 6086} {"train_loss": -27.414810180664062, "global_step": 505208, "epoch": 6086} {"train_loss": -27.520177841186523, "global_step": 505209, "epoch": 6086} {"train_loss": -27.25712013244629, "global_step": 505210, "epoch": 6086} {"train_loss": -27.74934196472168, "global_step": 505211, "epoch": 6086} {"train_loss": -27.713794708251953, "global_step": 505212, "epoch": 6086} {"train_loss": -27.294851303100586, "global_step": 505213, "epoch": 6086} {"train_loss": -27.297208786010742, "global_step": 505214, "epoch": 6086} {"train_loss": -27.699344635009766, "global_step": 505215, "epoch": 6086} {"train_loss": -27.572601318359375, "global_step": 505216, "epoch": 6086} {"train_loss": -27.586145401000977, "global_step": 505217, "epoch": 6086} {"train_loss": -27.363126754760742, "global_step": 505218, "epoch": 6086} {"train_loss": -27.514087677001953, "global_step": 505219, "epoch": 6086} {"train_loss": -27.25407777349633, "global_step": 505220, "epoch": 6086, "val_loss": 6507967.0} {"train_loss": -27.012414932250977, "global_step": 505221, "epoch": 6087} {"train_loss": -27.241657257080078, "global_step": 505222, "epoch": 6087} {"train_loss": -27.167272567749023, "global_step": 505223, "epoch": 6087} {"train_loss": -27.422916412353516, "global_step": 505224, "epoch": 6087} {"train_loss": -27.228498458862305, "global_step": 505225, "epoch": 6087} {"train_loss": -27.095754623413086, "global_step": 505226, "epoch": 6087} {"train_loss": -27.265857696533203, "global_step": 505227, "epoch": 6087} {"train_loss": -27.501758575439453, "global_step": 505228, "epoch": 6087} {"train_loss": -27.42585563659668, "global_step": 505229, "epoch": 6087} {"train_loss": -27.246826171875, "global_step": 505230, "epoch": 6087} {"train_loss": -27.976484298706055, "global_step": 505231, "epoch": 6087} {"train_loss": -27.197498321533203, "global_step": 505232, "epoch": 6087} {"train_loss": -27.31743812561035, "global_step": 505233, "epoch": 6087} {"train_loss": -27.06136131286621, "global_step": 505234, "epoch": 6087} {"train_loss": -27.912992477416992, "global_step": 505235, "epoch": 6087} {"train_loss": -27.430356979370117, "global_step": 505236, "epoch": 6087} {"train_loss": -27.764541625976562, "global_step": 505237, "epoch": 6087} {"train_loss": -27.051895141601562, "global_step": 505238, "epoch": 6087} {"train_loss": -27.65801429748535, "global_step": 505239, "epoch": 6087} {"train_loss": -27.382598876953125, "global_step": 505240, "epoch": 6087} {"train_loss": -27.92901611328125, "global_step": 505241, "epoch": 6087} {"train_loss": -27.356830596923828, "global_step": 505242, "epoch": 6087} {"train_loss": -27.739667892456055, "global_step": 505243, "epoch": 6087} {"train_loss": -27.287092208862305, "global_step": 505244, "epoch": 6087} {"train_loss": -27.382028579711914, "global_step": 505245, "epoch": 6087} {"train_loss": -27.467487335205078, "global_step": 505246, "epoch": 6087} {"train_loss": -27.29023551940918, "global_step": 505247, "epoch": 6087} {"train_loss": -27.5850887298584, "global_step": 505248, "epoch": 6087} {"train_loss": -27.3627986907959, "global_step": 505249, "epoch": 6087} {"train_loss": -27.422460556030273, "global_step": 505250, "epoch": 6087} {"train_loss": -27.223119735717773, "global_step": 505251, "epoch": 6087} {"train_loss": -27.50361442565918, "global_step": 505252, "epoch": 6087} {"train_loss": -27.578901290893555, "global_step": 505253, "epoch": 6087} {"train_loss": -27.410985946655273, "global_step": 505254, "epoch": 6087} {"train_loss": -27.70273780822754, "global_step": 505255, "epoch": 6087} {"train_loss": -27.504241943359375, "global_step": 505256, "epoch": 6087} {"train_loss": -27.295866012573242, "global_step": 505257, "epoch": 6087} {"train_loss": -27.358407974243164, "global_step": 505258, "epoch": 6087} {"train_loss": -27.334192276000977, "global_step": 505259, "epoch": 6087} {"train_loss": -27.56707763671875, "global_step": 505260, "epoch": 6087} {"train_loss": -27.41937255859375, "global_step": 505261, "epoch": 6087} {"train_loss": -27.22016716003418, "global_step": 505262, "epoch": 6087} {"train_loss": -27.26740074157715, "global_step": 505263, "epoch": 6087} {"train_loss": -27.27935218811035, "global_step": 505264, "epoch": 6087} {"train_loss": -27.421051025390625, "global_step": 505265, "epoch": 6087} {"train_loss": -27.543304443359375, "global_step": 505266, "epoch": 6087} {"train_loss": -27.489233016967773, "global_step": 505267, "epoch": 6087} {"train_loss": -27.413114547729492, "global_step": 505268, "epoch": 6087} {"train_loss": -27.47372817993164, "global_step": 505269, "epoch": 6087} {"train_loss": -27.633161544799805, "global_step": 505270, "epoch": 6087} {"train_loss": -27.49567985534668, "global_step": 505271, "epoch": 6087} {"train_loss": -27.567289352416992, "global_step": 505272, "epoch": 6087} {"train_loss": -27.574426651000977, "global_step": 505273, "epoch": 6087} {"train_loss": -27.827550888061523, "global_step": 505274, "epoch": 6087} {"train_loss": -27.260839462280273, "global_step": 505275, "epoch": 6087} {"train_loss": -27.713851928710938, "global_step": 505276, "epoch": 6087} {"train_loss": -27.469579696655273, "global_step": 505277, "epoch": 6087} {"train_loss": -27.65018653869629, "global_step": 505278, "epoch": 6087} {"train_loss": -27.26584815979004, "global_step": 505279, "epoch": 6087} {"train_loss": -27.6761474609375, "global_step": 505280, "epoch": 6087} {"train_loss": -27.531400680541992, "global_step": 505281, "epoch": 6087} {"train_loss": -27.416690826416016, "global_step": 505282, "epoch": 6087} {"train_loss": -27.564563751220703, "global_step": 505283, "epoch": 6087} {"train_loss": -27.509511947631836, "global_step": 505284, "epoch": 6087} {"train_loss": -27.481931686401367, "global_step": 505285, "epoch": 6087} {"train_loss": -27.65447425842285, "global_step": 505286, "epoch": 6087} {"train_loss": -27.271642684936523, "global_step": 505287, "epoch": 6087} {"train_loss": -27.089282989501953, "global_step": 505288, "epoch": 6087} {"train_loss": -27.639789581298828, "global_step": 505289, "epoch": 6087} {"train_loss": -27.684192657470703, "global_step": 505290, "epoch": 6087} {"train_loss": -27.330533981323242, "global_step": 505291, "epoch": 6087} {"train_loss": -27.314334869384766, "global_step": 505292, "epoch": 6087} {"train_loss": -26.995929718017578, "global_step": 505293, "epoch": 6087} {"train_loss": -27.212982177734375, "global_step": 505294, "epoch": 6087} {"train_loss": -27.032949447631836, "global_step": 505295, "epoch": 6087} {"train_loss": -26.643268585205078, "global_step": 505296, "epoch": 6087} {"train_loss": -27.168256759643555, "global_step": 505297, "epoch": 6087} {"train_loss": -27.492401123046875, "global_step": 505298, "epoch": 6087} {"train_loss": -26.5599422454834, "global_step": 505299, "epoch": 6087} {"train_loss": -26.986337661743164, "global_step": 505300, "epoch": 6087} {"train_loss": -26.55061149597168, "global_step": 505301, "epoch": 6087} {"train_loss": -27.63238525390625, "global_step": 505302, "epoch": 6087} {"train_loss": -27.394768289772863, "global_step": 505303, "epoch": 6087, "val_loss": 6489865.5} {"train_loss": -26.74660301208496, "global_step": 505304, "epoch": 6088} {"train_loss": -26.69477653503418, "global_step": 505305, "epoch": 6088} {"train_loss": -26.331134796142578, "global_step": 505306, "epoch": 6088} {"train_loss": -26.250946044921875, "global_step": 505307, "epoch": 6088} {"train_loss": -26.4540958404541, "global_step": 505308, "epoch": 6088} {"train_loss": -26.523168563842773, "global_step": 505309, "epoch": 6088} {"train_loss": -26.582136154174805, "global_step": 505310, "epoch": 6088} {"train_loss": -27.333032608032227, "global_step": 505311, "epoch": 6088} {"train_loss": -26.512699127197266, "global_step": 505312, "epoch": 6088} {"train_loss": -26.918792724609375, "global_step": 505313, "epoch": 6088} {"train_loss": -26.79654884338379, "global_step": 505314, "epoch": 6088} {"train_loss": -27.062000274658203, "global_step": 505315, "epoch": 6088} {"train_loss": -26.261327743530273, "global_step": 505316, "epoch": 6088} {"train_loss": -26.896936416625977, "global_step": 505317, "epoch": 6088} {"train_loss": -27.084741592407227, "global_step": 505318, "epoch": 6088} {"train_loss": -26.96938133239746, "global_step": 505319, "epoch": 6088} {"train_loss": -27.153125762939453, "global_step": 505320, "epoch": 6088} {"train_loss": -27.357385635375977, "global_step": 505321, "epoch": 6088} {"train_loss": -27.159215927124023, "global_step": 505322, "epoch": 6088} {"train_loss": -26.943384170532227, "global_step": 505323, "epoch": 6088} {"train_loss": -27.466413497924805, "global_step": 505324, "epoch": 6088} {"train_loss": -27.346515655517578, "global_step": 505325, "epoch": 6088} {"train_loss": -27.120588302612305, "global_step": 505326, "epoch": 6088} {"train_loss": -27.205907821655273, "global_step": 505327, "epoch": 6088} {"train_loss": -27.143787384033203, "global_step": 505328, "epoch": 6088} {"train_loss": -27.533971786499023, "global_step": 505329, "epoch": 6088} {"train_loss": -27.49716567993164, "global_step": 505330, "epoch": 6088} {"train_loss": -27.448749542236328, "global_step": 505331, "epoch": 6088} {"train_loss": -27.383380889892578, "global_step": 505332, "epoch": 6088} {"train_loss": -27.4079532623291, "global_step": 505333, "epoch": 6088} {"train_loss": -27.43625259399414, "global_step": 505334, "epoch": 6088} {"train_loss": -27.731109619140625, "global_step": 505335, "epoch": 6088} {"train_loss": -27.39820671081543, "global_step": 505336, "epoch": 6088} {"train_loss": -27.317419052124023, "global_step": 505337, "epoch": 6088} {"train_loss": -27.32244300842285, "global_step": 505338, "epoch": 6088} {"train_loss": -27.44439125061035, "global_step": 505339, "epoch": 6088} {"train_loss": -27.699384689331055, "global_step": 505340, "epoch": 6088} {"train_loss": -27.487995147705078, "global_step": 505341, "epoch": 6088} {"train_loss": -27.50733757019043, "global_step": 505342, "epoch": 6088} {"train_loss": -27.96237564086914, "global_step": 505343, "epoch": 6088} {"train_loss": -27.289081573486328, "global_step": 505344, "epoch": 6088} {"train_loss": -27.145551681518555, "global_step": 505345, "epoch": 6088} {"train_loss": -27.279422760009766, "global_step": 505346, "epoch": 6088} {"train_loss": -27.289209365844727, "global_step": 505347, "epoch": 6088} {"train_loss": -27.132299423217773, "global_step": 505348, "epoch": 6088} {"train_loss": -27.22535514831543, "global_step": 505349, "epoch": 6088} {"train_loss": -26.919803619384766, "global_step": 505350, "epoch": 6088} {"train_loss": -27.220783233642578, "global_step": 505351, "epoch": 6088} {"train_loss": -27.956390380859375, "global_step": 505352, "epoch": 6088} {"train_loss": -27.48443603515625, "global_step": 505353, "epoch": 6088} {"train_loss": -27.372522354125977, "global_step": 505354, "epoch": 6088} {"train_loss": -27.23530387878418, "global_step": 505355, "epoch": 6088} {"train_loss": -27.558862686157227, "global_step": 505356, "epoch": 6088} {"train_loss": -27.406949996948242, "global_step": 505357, "epoch": 6088} {"train_loss": -27.471776962280273, "global_step": 505358, "epoch": 6088} {"train_loss": -27.28837013244629, "global_step": 505359, "epoch": 6088} {"train_loss": -27.156173706054688, "global_step": 505360, "epoch": 6088} {"train_loss": -27.4963436126709, "global_step": 505361, "epoch": 6088} {"train_loss": -26.802200317382812, "global_step": 505362, "epoch": 6088} {"train_loss": -27.504138946533203, "global_step": 505363, "epoch": 6088} {"train_loss": -27.171667098999023, "global_step": 505364, "epoch": 6088} {"train_loss": -27.570648193359375, "global_step": 505365, "epoch": 6088} {"train_loss": -27.21332359313965, "global_step": 505366, "epoch": 6088} {"train_loss": -27.430185317993164, "global_step": 505367, "epoch": 6088} {"train_loss": -27.13075065612793, "global_step": 505368, "epoch": 6088} {"train_loss": -27.2221736907959, "global_step": 505369, "epoch": 6088} {"train_loss": -27.31914710998535, "global_step": 505370, "epoch": 6088} {"train_loss": -27.284332275390625, "global_step": 505371, "epoch": 6088} {"train_loss": -27.34893798828125, "global_step": 505372, "epoch": 6088} {"train_loss": -27.447223663330078, "global_step": 505373, "epoch": 6088} {"train_loss": -26.8680419921875, "global_step": 505374, "epoch": 6088} {"train_loss": -27.29802894592285, "global_step": 505375, "epoch": 6088} {"train_loss": -27.274137496948242, "global_step": 505376, "epoch": 6088} {"train_loss": -27.303482055664062, "global_step": 505377, "epoch": 6088} {"train_loss": -27.506330490112305, "global_step": 505378, "epoch": 6088} {"train_loss": -27.160459518432617, "global_step": 505379, "epoch": 6088} {"train_loss": -27.11091423034668, "global_step": 505380, "epoch": 6088} {"train_loss": -27.320749282836914, "global_step": 505381, "epoch": 6088} {"train_loss": -27.429784774780273, "global_step": 505382, "epoch": 6088} {"train_loss": -27.655935287475586, "global_step": 505383, "epoch": 6088} {"train_loss": -27.201684951782227, "global_step": 505384, "epoch": 6088} {"train_loss": -27.182178497314453, "global_step": 505385, "epoch": 6088} {"train_loss": -27.223809115857964, "global_step": 505386, "epoch": 6088, "val_loss": 6435135.0} {"train_loss": -26.663068771362305, "global_step": 505387, "epoch": 6089} {"train_loss": -26.502233505249023, "global_step": 505388, "epoch": 6089} {"train_loss": -26.701581954956055, "global_step": 505389, "epoch": 6089} {"train_loss": -26.820043563842773, "global_step": 505390, "epoch": 6089} {"train_loss": -26.09221839904785, "global_step": 505391, "epoch": 6089} {"train_loss": -26.972198486328125, "global_step": 505392, "epoch": 6089} {"train_loss": -27.249530792236328, "global_step": 505393, "epoch": 6089} {"train_loss": -26.58588218688965, "global_step": 505394, "epoch": 6089} {"train_loss": -26.944761276245117, "global_step": 505395, "epoch": 6089} {"train_loss": -27.116907119750977, "global_step": 505396, "epoch": 6089} {"train_loss": -26.912885665893555, "global_step": 505397, "epoch": 6089} {"train_loss": -27.132177352905273, "global_step": 505398, "epoch": 6089} {"train_loss": -26.93329429626465, "global_step": 505399, "epoch": 6089} {"train_loss": -27.22918128967285, "global_step": 505400, "epoch": 6089} {"train_loss": -27.441686630249023, "global_step": 505401, "epoch": 6089} {"train_loss": -27.098791122436523, "global_step": 505402, "epoch": 6089} {"train_loss": -27.212915420532227, "global_step": 505403, "epoch": 6089} {"train_loss": -27.494007110595703, "global_step": 505404, "epoch": 6089} {"train_loss": -27.32381248474121, "global_step": 505405, "epoch": 6089} {"train_loss": -27.2849178314209, "global_step": 505406, "epoch": 6089} {"train_loss": -27.05792236328125, "global_step": 505407, "epoch": 6089} {"train_loss": -27.324512481689453, "global_step": 505408, "epoch": 6089} {"train_loss": -27.59309196472168, "global_step": 505409, "epoch": 6089} {"train_loss": -27.65030860900879, "global_step": 505410, "epoch": 6089} {"train_loss": -27.51239013671875, "global_step": 505411, "epoch": 6089} {"train_loss": -27.248815536499023, "global_step": 505412, "epoch": 6089} {"train_loss": -27.3547306060791, "global_step": 505413, "epoch": 6089} {"train_loss": -27.492767333984375, "global_step": 505414, "epoch": 6089} {"train_loss": -27.763647079467773, "global_step": 505415, "epoch": 6089} {"train_loss": -27.742292404174805, "global_step": 505416, "epoch": 6089} {"train_loss": -27.3509521484375, "global_step": 505417, "epoch": 6089} {"train_loss": -27.263044357299805, "global_step": 505418, "epoch": 6089} {"train_loss": -27.169824600219727, "global_step": 505419, "epoch": 6089} {"train_loss": -27.616323471069336, "global_step": 505420, "epoch": 6089} {"train_loss": -27.211267471313477, "global_step": 505421, "epoch": 6089} {"train_loss": -27.52141761779785, "global_step": 505422, "epoch": 6089} {"train_loss": -27.723363876342773, "global_step": 505423, "epoch": 6089} {"train_loss": -27.39649772644043, "global_step": 505424, "epoch": 6089} {"train_loss": -27.720661163330078, "global_step": 505425, "epoch": 6089} {"train_loss": -27.384374618530273, "global_step": 505426, "epoch": 6089} {"train_loss": -27.781774520874023, "global_step": 505427, "epoch": 6089} {"train_loss": -27.71173667907715, "global_step": 505428, "epoch": 6089} {"train_loss": -27.28029441833496, "global_step": 505429, "epoch": 6089} {"train_loss": -27.47999382019043, "global_step": 505430, "epoch": 6089} {"train_loss": -27.50439453125, "global_step": 505431, "epoch": 6089} {"train_loss": -27.026330947875977, "global_step": 505432, "epoch": 6089} {"train_loss": -27.864049911499023, "global_step": 505433, "epoch": 6089} {"train_loss": -27.468463897705078, "global_step": 505434, "epoch": 6089} {"train_loss": -27.591588973999023, "global_step": 505435, "epoch": 6089} {"train_loss": -27.620361328125, "global_step": 505436, "epoch": 6089} {"train_loss": -27.673460006713867, "global_step": 505437, "epoch": 6089} {"train_loss": -27.815082550048828, "global_step": 505438, "epoch": 6089} {"train_loss": -27.783344268798828, "global_step": 505439, "epoch": 6089} {"train_loss": -27.650190353393555, "global_step": 505440, "epoch": 6089} {"train_loss": -27.363794326782227, "global_step": 505441, "epoch": 6089} {"train_loss": -27.5488338470459, "global_step": 505442, "epoch": 6089} {"train_loss": -27.50336265563965, "global_step": 505443, "epoch": 6089} {"train_loss": -27.490644454956055, "global_step": 505444, "epoch": 6089} {"train_loss": -27.694284439086914, "global_step": 505445, "epoch": 6089} {"train_loss": -27.0474796295166, "global_step": 505446, "epoch": 6089} {"train_loss": -27.537290573120117, "global_step": 505447, "epoch": 6089} {"train_loss": -27.293598175048828, "global_step": 505448, "epoch": 6089} {"train_loss": -27.112890243530273, "global_step": 505449, "epoch": 6089} {"train_loss": -26.592926025390625, "global_step": 505450, "epoch": 6089} {"train_loss": -26.69072914123535, "global_step": 505451, "epoch": 6089} {"train_loss": -26.96626853942871, "global_step": 505452, "epoch": 6089} {"train_loss": -27.516653060913086, "global_step": 505453, "epoch": 6089} {"train_loss": -27.89002799987793, "global_step": 505454, "epoch": 6089} {"train_loss": -27.476049423217773, "global_step": 505455, "epoch": 6089} {"train_loss": -27.356714248657227, "global_step": 505456, "epoch": 6089} {"train_loss": -27.817157745361328, "global_step": 505457, "epoch": 6089} {"train_loss": -27.455402374267578, "global_step": 505458, "epoch": 6089} {"train_loss": -27.5476131439209, "global_step": 505459, "epoch": 6089} {"train_loss": -27.494680404663086, "global_step": 505460, "epoch": 6089} {"train_loss": -27.71357536315918, "global_step": 505461, "epoch": 6089} {"train_loss": -27.529041290283203, "global_step": 505462, "epoch": 6089} {"train_loss": -27.5960636138916, "global_step": 505463, "epoch": 6089} {"train_loss": -27.494543075561523, "global_step": 505464, "epoch": 6089} {"train_loss": -27.407861709594727, "global_step": 505465, "epoch": 6089} {"train_loss": -27.48927116394043, "global_step": 505466, "epoch": 6089} {"train_loss": -27.52528953552246, "global_step": 505467, "epoch": 6089} {"train_loss": -27.591588973999023, "global_step": 505468, "epoch": 6089} {"train_loss": -27.35012700184282, "global_step": 505469, "epoch": 6089, "val_loss": 6556946.0} {"train_loss": -27.185657501220703, "global_step": 505470, "epoch": 6090} {"train_loss": -27.180932998657227, "global_step": 505471, "epoch": 6090} {"train_loss": -27.377344131469727, "global_step": 505472, "epoch": 6090} {"train_loss": -27.424036026000977, "global_step": 505473, "epoch": 6090} {"train_loss": -27.18135643005371, "global_step": 505474, "epoch": 6090} {"train_loss": -26.973541259765625, "global_step": 505475, "epoch": 6090} {"train_loss": -26.784957885742188, "global_step": 505476, "epoch": 6090} {"train_loss": -27.280933380126953, "global_step": 505477, "epoch": 6090} {"train_loss": -27.449506759643555, "global_step": 505478, "epoch": 6090} {"train_loss": -27.21136474609375, "global_step": 505479, "epoch": 6090} {"train_loss": -27.713727951049805, "global_step": 505480, "epoch": 6090} {"train_loss": -27.345067977905273, "global_step": 505481, "epoch": 6090} {"train_loss": -27.50390625, "global_step": 505482, "epoch": 6090} {"train_loss": -27.300643920898438, "global_step": 505483, "epoch": 6090} {"train_loss": -27.738285064697266, "global_step": 505484, "epoch": 6090} {"train_loss": -27.268964767456055, "global_step": 505485, "epoch": 6090} {"train_loss": -27.289737701416016, "global_step": 505486, "epoch": 6090} {"train_loss": -27.102710723876953, "global_step": 505487, "epoch": 6090} {"train_loss": -27.323963165283203, "global_step": 505488, "epoch": 6090} {"train_loss": -27.374597549438477, "global_step": 505489, "epoch": 6090} {"train_loss": -27.362018585205078, "global_step": 505490, "epoch": 6090} {"train_loss": -27.510244369506836, "global_step": 505491, "epoch": 6090} {"train_loss": -27.457340240478516, "global_step": 505492, "epoch": 6090} {"train_loss": -27.508365631103516, "global_step": 505493, "epoch": 6090} {"train_loss": -27.513212203979492, "global_step": 505494, "epoch": 6090} {"train_loss": -27.71491050720215, "global_step": 505495, "epoch": 6090} {"train_loss": -27.570449829101562, "global_step": 505496, "epoch": 6090} {"train_loss": -27.438770294189453, "global_step": 505497, "epoch": 6090} {"train_loss": -27.43195915222168, "global_step": 505498, "epoch": 6090} {"train_loss": -27.644407272338867, "global_step": 505499, "epoch": 6090} {"train_loss": -27.46351432800293, "global_step": 505500, "epoch": 6090} {"train_loss": -27.444799423217773, "global_step": 505501, "epoch": 6090} {"train_loss": -27.643423080444336, "global_step": 505502, "epoch": 6090} {"train_loss": -27.449298858642578, "global_step": 505503, "epoch": 6090} {"train_loss": -27.577808380126953, "global_step": 505504, "epoch": 6090} {"train_loss": -27.548995971679688, "global_step": 505505, "epoch": 6090} {"train_loss": -28.065521240234375, "global_step": 505506, "epoch": 6090} {"train_loss": -27.505483627319336, "global_step": 505507, "epoch": 6090} {"train_loss": -27.231903076171875, "global_step": 505508, "epoch": 6090} {"train_loss": -27.44075584411621, "global_step": 505509, "epoch": 6090} {"train_loss": -27.732141494750977, "global_step": 505510, "epoch": 6090} {"train_loss": -27.54743003845215, "global_step": 505511, "epoch": 6090} {"train_loss": -27.557086944580078, "global_step": 505512, "epoch": 6090} {"train_loss": -27.241846084594727, "global_step": 505513, "epoch": 6090} {"train_loss": -27.0319881439209, "global_step": 505514, "epoch": 6090} {"train_loss": -27.39838981628418, "global_step": 505515, "epoch": 6090} {"train_loss": -27.5017147064209, "global_step": 505516, "epoch": 6090} {"train_loss": -27.294458389282227, "global_step": 505517, "epoch": 6090} {"train_loss": -27.366474151611328, "global_step": 505518, "epoch": 6090} {"train_loss": -27.04816246032715, "global_step": 505519, "epoch": 6090} {"train_loss": -26.328149795532227, "global_step": 505520, "epoch": 6090} {"train_loss": -26.938800811767578, "global_step": 505521, "epoch": 6090} {"train_loss": -26.8348331451416, "global_step": 505522, "epoch": 6090} {"train_loss": -26.887304306030273, "global_step": 505523, "epoch": 6090} {"train_loss": -27.209436416625977, "global_step": 505524, "epoch": 6090} {"train_loss": -26.961801528930664, "global_step": 505525, "epoch": 6090} {"train_loss": -27.198993682861328, "global_step": 505526, "epoch": 6090} {"train_loss": -27.184524536132812, "global_step": 505527, "epoch": 6090} {"train_loss": -26.87346839904785, "global_step": 505528, "epoch": 6090} {"train_loss": -27.09049415588379, "global_step": 505529, "epoch": 6090} {"train_loss": -27.447362899780273, "global_step": 505530, "epoch": 6090} {"train_loss": -26.9154052734375, "global_step": 505531, "epoch": 6090} {"train_loss": -27.494998931884766, "global_step": 505532, "epoch": 6090} {"train_loss": -27.261510848999023, "global_step": 505533, "epoch": 6090} {"train_loss": -27.61056900024414, "global_step": 505534, "epoch": 6090} {"train_loss": -27.11410903930664, "global_step": 505535, "epoch": 6090} {"train_loss": -27.290769577026367, "global_step": 505536, "epoch": 6090} {"train_loss": -27.3930721282959, "global_step": 505537, "epoch": 6090} {"train_loss": -27.228443145751953, "global_step": 505538, "epoch": 6090} {"train_loss": -27.860910415649414, "global_step": 505539, "epoch": 6090} {"train_loss": -27.411273956298828, "global_step": 505540, "epoch": 6090} {"train_loss": -27.0644588470459, "global_step": 505541, "epoch": 6090} {"train_loss": -27.59404945373535, "global_step": 505542, "epoch": 6090} {"train_loss": -27.429889678955078, "global_step": 505543, "epoch": 6090} {"train_loss": -27.530683517456055, "global_step": 505544, "epoch": 6090} {"train_loss": -27.384321212768555, "global_step": 505545, "epoch": 6090} {"train_loss": -27.699024200439453, "global_step": 505546, "epoch": 6090} {"train_loss": -27.373310089111328, "global_step": 505547, "epoch": 6090} {"train_loss": -27.6803035736084, "global_step": 505548, "epoch": 6090} {"train_loss": -27.48943519592285, "global_step": 505549, "epoch": 6090} {"train_loss": -27.173856735229492, "global_step": 505550, "epoch": 6090} {"train_loss": -27.540424346923828, "global_step": 505551, "epoch": 6090} {"train_loss": -27.340912324836456, "global_step": 505552, "epoch": 6090, "val_loss": 6578454.0} {"train_loss": -27.13348960876465, "global_step": 505553, "epoch": 6091} {"train_loss": -27.077661514282227, "global_step": 505554, "epoch": 6091} {"train_loss": -27.080564498901367, "global_step": 505555, "epoch": 6091} {"train_loss": -27.38442039489746, "global_step": 505556, "epoch": 6091} {"train_loss": -26.914642333984375, "global_step": 505557, "epoch": 6091} {"train_loss": -27.1944637298584, "global_step": 505558, "epoch": 6091} {"train_loss": -27.438093185424805, "global_step": 505559, "epoch": 6091} {"train_loss": -27.188312530517578, "global_step": 505560, "epoch": 6091} {"train_loss": -27.259628295898438, "global_step": 505561, "epoch": 6091} {"train_loss": -27.53887939453125, "global_step": 505562, "epoch": 6091} {"train_loss": -27.24527359008789, "global_step": 505563, "epoch": 6091} {"train_loss": -27.18963623046875, "global_step": 505564, "epoch": 6091} {"train_loss": -27.47141456604004, "global_step": 505565, "epoch": 6091} {"train_loss": -27.08563232421875, "global_step": 505566, "epoch": 6091} {"train_loss": -27.385671615600586, "global_step": 505567, "epoch": 6091} {"train_loss": -27.733423233032227, "global_step": 505568, "epoch": 6091} {"train_loss": -27.18166160583496, "global_step": 505569, "epoch": 6091} {"train_loss": -27.401105880737305, "global_step": 505570, "epoch": 6091} {"train_loss": -27.19805335998535, "global_step": 505571, "epoch": 6091} {"train_loss": -27.436725616455078, "global_step": 505572, "epoch": 6091} {"train_loss": -27.30646324157715, "global_step": 505573, "epoch": 6091} {"train_loss": -27.39900016784668, "global_step": 505574, "epoch": 6091} {"train_loss": -27.449865341186523, "global_step": 505575, "epoch": 6091} {"train_loss": -27.677722930908203, "global_step": 505576, "epoch": 6091} {"train_loss": -27.03896141052246, "global_step": 505577, "epoch": 6091} {"train_loss": -27.38494300842285, "global_step": 505578, "epoch": 6091} {"train_loss": -27.217910766601562, "global_step": 505579, "epoch": 6091} {"train_loss": -27.649747848510742, "global_step": 505580, "epoch": 6091} {"train_loss": -27.5528564453125, "global_step": 505581, "epoch": 6091} {"train_loss": -26.968107223510742, "global_step": 505582, "epoch": 6091} {"train_loss": -27.472009658813477, "global_step": 505583, "epoch": 6091} {"train_loss": -27.574193954467773, "global_step": 505584, "epoch": 6091} {"train_loss": -27.277530670166016, "global_step": 505585, "epoch": 6091} {"train_loss": -27.440418243408203, "global_step": 505586, "epoch": 6091} {"train_loss": -27.369062423706055, "global_step": 505587, "epoch": 6091} {"train_loss": -27.527185440063477, "global_step": 505588, "epoch": 6091} {"train_loss": -27.713653564453125, "global_step": 505589, "epoch": 6091} {"train_loss": -27.44746208190918, "global_step": 505590, "epoch": 6091} {"train_loss": -27.940128326416016, "global_step": 505591, "epoch": 6091} {"train_loss": -27.641204833984375, "global_step": 505592, "epoch": 6091} {"train_loss": -26.9461727142334, "global_step": 505593, "epoch": 6091} {"train_loss": -27.501880645751953, "global_step": 505594, "epoch": 6091} {"train_loss": -28.063932418823242, "global_step": 505595, "epoch": 6091} {"train_loss": -27.70977210998535, "global_step": 505596, "epoch": 6091} {"train_loss": -27.888288497924805, "global_step": 505597, "epoch": 6091} {"train_loss": -27.640039443969727, "global_step": 505598, "epoch": 6091} {"train_loss": -27.464344024658203, "global_step": 505599, "epoch": 6091} {"train_loss": -27.9338436126709, "global_step": 505600, "epoch": 6091} {"train_loss": -27.863855361938477, "global_step": 505601, "epoch": 6091} {"train_loss": -27.553186416625977, "global_step": 505602, "epoch": 6091} {"train_loss": -27.578205108642578, "global_step": 505603, "epoch": 6091} {"train_loss": -27.910064697265625, "global_step": 505604, "epoch": 6091} {"train_loss": -27.606863021850586, "global_step": 505605, "epoch": 6091} {"train_loss": -27.225055694580078, "global_step": 505606, "epoch": 6091} {"train_loss": -27.244348526000977, "global_step": 505607, "epoch": 6091} {"train_loss": -27.453948974609375, "global_step": 505608, "epoch": 6091} {"train_loss": -27.538156509399414, "global_step": 505609, "epoch": 6091} {"train_loss": -27.64436149597168, "global_step": 505610, "epoch": 6091} {"train_loss": -27.472217559814453, "global_step": 505611, "epoch": 6091} {"train_loss": -27.379779815673828, "global_step": 505612, "epoch": 6091} {"train_loss": -27.364730834960938, "global_step": 505613, "epoch": 6091} {"train_loss": -27.448013305664062, "global_step": 505614, "epoch": 6091} {"train_loss": -27.129230499267578, "global_step": 505615, "epoch": 6091} {"train_loss": -26.866836547851562, "global_step": 505616, "epoch": 6091} {"train_loss": -27.112964630126953, "global_step": 505617, "epoch": 6091} {"train_loss": -26.89474868774414, "global_step": 505618, "epoch": 6091} {"train_loss": -27.370824813842773, "global_step": 505619, "epoch": 6091} {"train_loss": -27.161767959594727, "global_step": 505620, "epoch": 6091} {"train_loss": -27.350879669189453, "global_step": 505621, "epoch": 6091} {"train_loss": -27.386962890625, "global_step": 505622, "epoch": 6091} {"train_loss": -27.16712760925293, "global_step": 505623, "epoch": 6091} {"train_loss": -27.262054443359375, "global_step": 505624, "epoch": 6091} {"train_loss": -27.490188598632812, "global_step": 505625, "epoch": 6091} {"train_loss": -27.301633834838867, "global_step": 505626, "epoch": 6091} {"train_loss": -27.35365104675293, "global_step": 505627, "epoch": 6091} {"train_loss": -27.20863151550293, "global_step": 505628, "epoch": 6091} {"train_loss": -27.534255981445312, "global_step": 505629, "epoch": 6091} {"train_loss": -27.016071319580078, "global_step": 505630, "epoch": 6091} {"train_loss": -27.08344078063965, "global_step": 505631, "epoch": 6091} {"train_loss": -27.306415557861328, "global_step": 505632, "epoch": 6091} {"train_loss": -27.63294792175293, "global_step": 505633, "epoch": 6091} {"train_loss": -27.049728393554688, "global_step": 505634, "epoch": 6091} {"train_loss": -27.383475085338915, "global_step": 505635, "epoch": 6091, "val_loss": 6610258.0} {"train_loss": -26.039966583251953, "global_step": 505636, "epoch": 6092} {"train_loss": -26.60636329650879, "global_step": 505637, "epoch": 6092} {"train_loss": -26.792449951171875, "global_step": 505638, "epoch": 6092} {"train_loss": -26.7619686126709, "global_step": 505639, "epoch": 6092} {"train_loss": -26.64524269104004, "global_step": 505640, "epoch": 6092} {"train_loss": -26.723188400268555, "global_step": 505641, "epoch": 6092} {"train_loss": -25.853540420532227, "global_step": 505642, "epoch": 6092} {"train_loss": -26.690155029296875, "global_step": 505643, "epoch": 6092} {"train_loss": -26.499664306640625, "global_step": 505644, "epoch": 6092} {"train_loss": -26.756372451782227, "global_step": 505645, "epoch": 6092} {"train_loss": -26.950366973876953, "global_step": 505646, "epoch": 6092} {"train_loss": -26.51679039001465, "global_step": 505647, "epoch": 6092} {"train_loss": -26.829492568969727, "global_step": 505648, "epoch": 6092} {"train_loss": -26.73438835144043, "global_step": 505649, "epoch": 6092} {"train_loss": -26.799823760986328, "global_step": 505650, "epoch": 6092} {"train_loss": -26.509292602539062, "global_step": 505651, "epoch": 6092} {"train_loss": -26.975601196289062, "global_step": 505652, "epoch": 6092} {"train_loss": -27.28934669494629, "global_step": 505653, "epoch": 6092} {"train_loss": -26.791763305664062, "global_step": 505654, "epoch": 6092} {"train_loss": -26.829980850219727, "global_step": 505655, "epoch": 6092} {"train_loss": -27.287817001342773, "global_step": 505656, "epoch": 6092} {"train_loss": -27.199249267578125, "global_step": 505657, "epoch": 6092} {"train_loss": -26.879501342773438, "global_step": 505658, "epoch": 6092} {"train_loss": -27.397085189819336, "global_step": 505659, "epoch": 6092} {"train_loss": -27.119327545166016, "global_step": 505660, "epoch": 6092} {"train_loss": -27.019702911376953, "global_step": 505661, "epoch": 6092} {"train_loss": -27.301389694213867, "global_step": 505662, "epoch": 6092} {"train_loss": -27.691680908203125, "global_step": 505663, "epoch": 6092} {"train_loss": -27.28521156311035, "global_step": 505664, "epoch": 6092} {"train_loss": -26.98876953125, "global_step": 505665, "epoch": 6092} {"train_loss": -27.311737060546875, "global_step": 505666, "epoch": 6092} {"train_loss": -27.483600616455078, "global_step": 505667, "epoch": 6092} {"train_loss": -27.37636375427246, "global_step": 505668, "epoch": 6092} {"train_loss": -27.290729522705078, "global_step": 505669, "epoch": 6092} {"train_loss": -27.45254898071289, "global_step": 505670, "epoch": 6092} {"train_loss": -27.3172550201416, "global_step": 505671, "epoch": 6092} {"train_loss": -26.970172882080078, "global_step": 505672, "epoch": 6092} {"train_loss": -27.216123580932617, "global_step": 505673, "epoch": 6092} {"train_loss": -27.211612701416016, "global_step": 505674, "epoch": 6092} {"train_loss": -27.456329345703125, "global_step": 505675, "epoch": 6092} {"train_loss": -27.319244384765625, "global_step": 505676, "epoch": 6092} {"train_loss": -27.227466583251953, "global_step": 505677, "epoch": 6092} {"train_loss": -27.44141960144043, "global_step": 505678, "epoch": 6092} {"train_loss": -27.805814743041992, "global_step": 505679, "epoch": 6092} {"train_loss": -27.427921295166016, "global_step": 505680, "epoch": 6092} {"train_loss": -27.356311798095703, "global_step": 505681, "epoch": 6092} {"train_loss": -27.412158966064453, "global_step": 505682, "epoch": 6092} {"train_loss": -27.270465850830078, "global_step": 505683, "epoch": 6092} {"train_loss": -27.3220272064209, "global_step": 505684, "epoch": 6092} {"train_loss": -27.75687599182129, "global_step": 505685, "epoch": 6092} {"train_loss": -27.512434005737305, "global_step": 505686, "epoch": 6092} {"train_loss": -27.75479507446289, "global_step": 505687, "epoch": 6092} {"train_loss": -27.50146484375, "global_step": 505688, "epoch": 6092} {"train_loss": -27.44487953186035, "global_step": 505689, "epoch": 6092} {"train_loss": -27.543167114257812, "global_step": 505690, "epoch": 6092} {"train_loss": -27.590417861938477, "global_step": 505691, "epoch": 6092} {"train_loss": -27.59320068359375, "global_step": 505692, "epoch": 6092} {"train_loss": -27.65414810180664, "global_step": 505693, "epoch": 6092} {"train_loss": -27.685705184936523, "global_step": 505694, "epoch": 6092} {"train_loss": -27.550235748291016, "global_step": 505695, "epoch": 6092} {"train_loss": -27.768049240112305, "global_step": 505696, "epoch": 6092} {"train_loss": -27.93045425415039, "global_step": 505697, "epoch": 6092} {"train_loss": -27.757062911987305, "global_step": 505698, "epoch": 6092} {"train_loss": -27.631254196166992, "global_step": 505699, "epoch": 6092} {"train_loss": -27.345630645751953, "global_step": 505700, "epoch": 6092} {"train_loss": -27.44998550415039, "global_step": 505701, "epoch": 6092} {"train_loss": -26.960784912109375, "global_step": 505702, "epoch": 6092} {"train_loss": -26.9888858795166, "global_step": 505703, "epoch": 6092} {"train_loss": -26.513025283813477, "global_step": 505704, "epoch": 6092} {"train_loss": -27.61895179748535, "global_step": 505705, "epoch": 6092} {"train_loss": -27.443653106689453, "global_step": 505706, "epoch": 6092} {"train_loss": -27.454076766967773, "global_step": 505707, "epoch": 6092} {"train_loss": -27.31619644165039, "global_step": 505708, "epoch": 6092} {"train_loss": -26.907896041870117, "global_step": 505709, "epoch": 6092} {"train_loss": -27.20450210571289, "global_step": 505710, "epoch": 6092} {"train_loss": -26.760236740112305, "global_step": 505711, "epoch": 6092} {"train_loss": -26.665679931640625, "global_step": 505712, "epoch": 6092} {"train_loss": -26.784696578979492, "global_step": 505713, "epoch": 6092} {"train_loss": -26.983448028564453, "global_step": 505714, "epoch": 6092} {"train_loss": -27.170522689819336, "global_step": 505715, "epoch": 6092} {"train_loss": -27.032562255859375, "global_step": 505716, "epoch": 6092} {"train_loss": -27.19388198852539, "global_step": 505717, "epoch": 6092} {"train_loss": -27.178530038121234, "global_step": 505718, "epoch": 6092, "val_loss": 6580547.5} {"train_loss": -25.67951774597168, "global_step": 505719, "epoch": 6093} {"train_loss": -25.230802536010742, "global_step": 505720, "epoch": 6093} {"train_loss": -26.540699005126953, "global_step": 505721, "epoch": 6093} {"train_loss": -26.118188858032227, "global_step": 505722, "epoch": 6093} {"train_loss": -26.61907386779785, "global_step": 505723, "epoch": 6093} {"train_loss": -25.922332763671875, "global_step": 505724, "epoch": 6093} {"train_loss": -26.08388328552246, "global_step": 505725, "epoch": 6093} {"train_loss": -26.665002822875977, "global_step": 505726, "epoch": 6093} {"train_loss": -26.660852432250977, "global_step": 505727, "epoch": 6093} {"train_loss": -26.23040771484375, "global_step": 505728, "epoch": 6093} {"train_loss": -26.46095085144043, "global_step": 505729, "epoch": 6093} {"train_loss": -26.72222328186035, "global_step": 505730, "epoch": 6093} {"train_loss": -26.470548629760742, "global_step": 505731, "epoch": 6093} {"train_loss": -26.852645874023438, "global_step": 505732, "epoch": 6093} {"train_loss": -26.5284481048584, "global_step": 505733, "epoch": 6093} {"train_loss": -26.96796989440918, "global_step": 505734, "epoch": 6093} {"train_loss": -26.477069854736328, "global_step": 505735, "epoch": 6093} {"train_loss": -26.986148834228516, "global_step": 505736, "epoch": 6093} {"train_loss": -26.92013931274414, "global_step": 505737, "epoch": 6093} {"train_loss": -26.636001586914062, "global_step": 505738, "epoch": 6093} {"train_loss": -26.903226852416992, "global_step": 505739, "epoch": 6093} {"train_loss": -27.00687026977539, "global_step": 505740, "epoch": 6093} {"train_loss": -26.78778648376465, "global_step": 505741, "epoch": 6093} {"train_loss": -26.929174423217773, "global_step": 505742, "epoch": 6093} {"train_loss": -27.226465225219727, "global_step": 505743, "epoch": 6093} {"train_loss": -27.040836334228516, "global_step": 505744, "epoch": 6093} {"train_loss": -27.305410385131836, "global_step": 505745, "epoch": 6093} {"train_loss": -27.0826473236084, "global_step": 505746, "epoch": 6093} {"train_loss": -27.257604598999023, "global_step": 505747, "epoch": 6093} {"train_loss": -27.451581954956055, "global_step": 505748, "epoch": 6093} {"train_loss": -27.309507369995117, "global_step": 505749, "epoch": 6093} {"train_loss": -27.0401611328125, "global_step": 505750, "epoch": 6093} {"train_loss": -27.382003784179688, "global_step": 505751, "epoch": 6093} {"train_loss": -27.398290634155273, "global_step": 505752, "epoch": 6093} {"train_loss": -27.226490020751953, "global_step": 505753, "epoch": 6093} {"train_loss": -27.429584503173828, "global_step": 505754, "epoch": 6093} {"train_loss": -27.429244995117188, "global_step": 505755, "epoch": 6093} {"train_loss": -27.541391372680664, "global_step": 505756, "epoch": 6093} {"train_loss": -27.8332462310791, "global_step": 505757, "epoch": 6093} {"train_loss": -27.335819244384766, "global_step": 505758, "epoch": 6093} {"train_loss": -27.52294921875, "global_step": 505759, "epoch": 6093} {"train_loss": -26.96209716796875, "global_step": 505760, "epoch": 6093} {"train_loss": -27.241552352905273, "global_step": 505761, "epoch": 6093} {"train_loss": -27.527908325195312, "global_step": 505762, "epoch": 6093} {"train_loss": -27.515371322631836, "global_step": 505763, "epoch": 6093} {"train_loss": -27.585676193237305, "global_step": 505764, "epoch": 6093} {"train_loss": -27.52776527404785, "global_step": 505765, "epoch": 6093} {"train_loss": -27.645566940307617, "global_step": 505766, "epoch": 6093} {"train_loss": -27.474512100219727, "global_step": 505767, "epoch": 6093} {"train_loss": -27.255908966064453, "global_step": 505768, "epoch": 6093} {"train_loss": -27.628149032592773, "global_step": 505769, "epoch": 6093} {"train_loss": -27.354663848876953, "global_step": 505770, "epoch": 6093} {"train_loss": -27.688873291015625, "global_step": 505771, "epoch": 6093} {"train_loss": -27.783405303955078, "global_step": 505772, "epoch": 6093} {"train_loss": -27.42755126953125, "global_step": 505773, "epoch": 6093} {"train_loss": -27.40069580078125, "global_step": 505774, "epoch": 6093} {"train_loss": -27.5642147064209, "global_step": 505775, "epoch": 6093} {"train_loss": -27.756696701049805, "global_step": 505776, "epoch": 6093} {"train_loss": -27.463178634643555, "global_step": 505777, "epoch": 6093} {"train_loss": -27.6416072845459, "global_step": 505778, "epoch": 6093} {"train_loss": -27.38587760925293, "global_step": 505779, "epoch": 6093} {"train_loss": -27.452930450439453, "global_step": 505780, "epoch": 6093} {"train_loss": -27.249555587768555, "global_step": 505781, "epoch": 6093} {"train_loss": -27.396387100219727, "global_step": 505782, "epoch": 6093} {"train_loss": -27.743101119995117, "global_step": 505783, "epoch": 6093} {"train_loss": -27.140167236328125, "global_step": 505784, "epoch": 6093} {"train_loss": -27.002660751342773, "global_step": 505785, "epoch": 6093} {"train_loss": -26.655776977539062, "global_step": 505786, "epoch": 6093} {"train_loss": -27.4155330657959, "global_step": 505787, "epoch": 6093} {"train_loss": -26.955371856689453, "global_step": 505788, "epoch": 6093} {"train_loss": -27.18299674987793, "global_step": 505789, "epoch": 6093} {"train_loss": -26.916919708251953, "global_step": 505790, "epoch": 6093} {"train_loss": -27.089618682861328, "global_step": 505791, "epoch": 6093} {"train_loss": -27.144498825073242, "global_step": 505792, "epoch": 6093} {"train_loss": -26.850784301757812, "global_step": 505793, "epoch": 6093} {"train_loss": -26.95806884765625, "global_step": 505794, "epoch": 6093} {"train_loss": -27.31636619567871, "global_step": 505795, "epoch": 6093} {"train_loss": -27.209035873413086, "global_step": 505796, "epoch": 6093} {"train_loss": -27.23984718322754, "global_step": 505797, "epoch": 6093} {"train_loss": -27.399200439453125, "global_step": 505798, "epoch": 6093} {"train_loss": -26.92701530456543, "global_step": 505799, "epoch": 6093} {"train_loss": -27.275012969970703, "global_step": 505800, "epoch": 6093} {"train_loss": -27.100438244371528, "global_step": 505801, "epoch": 6093, "val_loss": 6544375.0} {"train_loss": -27.01376724243164, "global_step": 505802, "epoch": 6094} {"train_loss": -26.987396240234375, "global_step": 505803, "epoch": 6094} {"train_loss": -27.197818756103516, "global_step": 505804, "epoch": 6094} {"train_loss": -27.055871963500977, "global_step": 505805, "epoch": 6094} {"train_loss": -26.739660263061523, "global_step": 505806, "epoch": 6094} {"train_loss": -26.465438842773438, "global_step": 505807, "epoch": 6094} {"train_loss": -27.314380645751953, "global_step": 505808, "epoch": 6094} {"train_loss": -27.285924911499023, "global_step": 505809, "epoch": 6094} {"train_loss": -26.693756103515625, "global_step": 505810, "epoch": 6094} {"train_loss": -26.934162139892578, "global_step": 505811, "epoch": 6094} {"train_loss": -26.82526969909668, "global_step": 505812, "epoch": 6094} {"train_loss": -27.05667495727539, "global_step": 505813, "epoch": 6094} {"train_loss": -27.0656795501709, "global_step": 505814, "epoch": 6094} {"train_loss": -27.266637802124023, "global_step": 505815, "epoch": 6094} {"train_loss": -26.924713134765625, "global_step": 505816, "epoch": 6094} {"train_loss": -27.657501220703125, "global_step": 505817, "epoch": 6094} {"train_loss": -27.24016761779785, "global_step": 505818, "epoch": 6094} {"train_loss": -27.208227157592773, "global_step": 505819, "epoch": 6094} {"train_loss": -27.181354522705078, "global_step": 505820, "epoch": 6094} {"train_loss": -27.32515525817871, "global_step": 505821, "epoch": 6094} {"train_loss": -27.360692977905273, "global_step": 505822, "epoch": 6094} {"train_loss": -27.22260093688965, "global_step": 505823, "epoch": 6094} {"train_loss": -27.4711856842041, "global_step": 505824, "epoch": 6094} {"train_loss": -27.0557861328125, "global_step": 505825, "epoch": 6094} {"train_loss": -27.423877716064453, "global_step": 505826, "epoch": 6094} {"train_loss": -27.144031524658203, "global_step": 505827, "epoch": 6094} {"train_loss": -27.4420108795166, "global_step": 505828, "epoch": 6094} {"train_loss": -27.70208740234375, "global_step": 505829, "epoch": 6094} {"train_loss": -27.363494873046875, "global_step": 505830, "epoch": 6094} {"train_loss": -27.533044815063477, "global_step": 505831, "epoch": 6094} {"train_loss": -27.199676513671875, "global_step": 505832, "epoch": 6094} {"train_loss": -27.03546714782715, "global_step": 505833, "epoch": 6094} {"train_loss": -27.69797134399414, "global_step": 505834, "epoch": 6094} {"train_loss": -27.421045303344727, "global_step": 505835, "epoch": 6094} {"train_loss": -27.196523666381836, "global_step": 505836, "epoch": 6094} {"train_loss": -27.75335121154785, "global_step": 505837, "epoch": 6094} {"train_loss": -27.371383666992188, "global_step": 505838, "epoch": 6094} {"train_loss": -27.806913375854492, "global_step": 505839, "epoch": 6094} {"train_loss": -27.3941707611084, "global_step": 505840, "epoch": 6094} {"train_loss": -27.751434326171875, "global_step": 505841, "epoch": 6094} {"train_loss": -27.5782413482666, "global_step": 505842, "epoch": 6094} {"train_loss": -27.570409774780273, "global_step": 505843, "epoch": 6094} {"train_loss": -27.238250732421875, "global_step": 505844, "epoch": 6094} {"train_loss": -28.080869674682617, "global_step": 505845, "epoch": 6094} {"train_loss": -27.667951583862305, "global_step": 505846, "epoch": 6094} {"train_loss": -27.59423828125, "global_step": 505847, "epoch": 6094} {"train_loss": -27.461206436157227, "global_step": 505848, "epoch": 6094} {"train_loss": -27.612686157226562, "global_step": 505849, "epoch": 6094} {"train_loss": -27.547510147094727, "global_step": 505850, "epoch": 6094} {"train_loss": -27.987628936767578, "global_step": 505851, "epoch": 6094} {"train_loss": -27.74493980407715, "global_step": 505852, "epoch": 6094} {"train_loss": -27.77949333190918, "global_step": 505853, "epoch": 6094} {"train_loss": -27.10687255859375, "global_step": 505854, "epoch": 6094} {"train_loss": -27.482044219970703, "global_step": 505855, "epoch": 6094} {"train_loss": -27.531797409057617, "global_step": 505856, "epoch": 6094} {"train_loss": -27.35645866394043, "global_step": 505857, "epoch": 6094} {"train_loss": -27.138504028320312, "global_step": 505858, "epoch": 6094} {"train_loss": -27.335996627807617, "global_step": 505859, "epoch": 6094} {"train_loss": -27.01775550842285, "global_step": 505860, "epoch": 6094} {"train_loss": -26.958332061767578, "global_step": 505861, "epoch": 6094} {"train_loss": -27.199417114257812, "global_step": 505862, "epoch": 6094} {"train_loss": -26.874515533447266, "global_step": 505863, "epoch": 6094} {"train_loss": -27.470319747924805, "global_step": 505864, "epoch": 6094} {"train_loss": -27.13531494140625, "global_step": 505865, "epoch": 6094} {"train_loss": -26.839319229125977, "global_step": 505866, "epoch": 6094} {"train_loss": -26.800413131713867, "global_step": 505867, "epoch": 6094} {"train_loss": -26.86376953125, "global_step": 505868, "epoch": 6094} {"train_loss": -26.9137020111084, "global_step": 505869, "epoch": 6094} {"train_loss": -27.069791793823242, "global_step": 505870, "epoch": 6094} {"train_loss": -27.253936767578125, "global_step": 505871, "epoch": 6094} {"train_loss": -27.27520751953125, "global_step": 505872, "epoch": 6094} {"train_loss": -27.251117706298828, "global_step": 505873, "epoch": 6094} {"train_loss": -27.13720703125, "global_step": 505874, "epoch": 6094} {"train_loss": -26.952579498291016, "global_step": 505875, "epoch": 6094} {"train_loss": -27.382360458374023, "global_step": 505876, "epoch": 6094} {"train_loss": -27.180883407592773, "global_step": 505877, "epoch": 6094} {"train_loss": -26.941625595092773, "global_step": 505878, "epoch": 6094} {"train_loss": -26.965734481811523, "global_step": 505879, "epoch": 6094} {"train_loss": -27.176538467407227, "global_step": 505880, "epoch": 6094} {"train_loss": -27.42291259765625, "global_step": 505881, "epoch": 6094} {"train_loss": -27.597211837768555, "global_step": 505882, "epoch": 6094} {"train_loss": -27.49075698852539, "global_step": 505883, "epoch": 6094} {"train_loss": -27.263433042779027, "global_step": 505884, "epoch": 6094, "val_loss": 6505968.5} {"train_loss": -27.1120662689209, "global_step": 505885, "epoch": 6095} {"train_loss": -26.94504737854004, "global_step": 505886, "epoch": 6095} {"train_loss": -27.130163192749023, "global_step": 505887, "epoch": 6095} {"train_loss": -26.980255126953125, "global_step": 505888, "epoch": 6095} {"train_loss": -26.99603843688965, "global_step": 505889, "epoch": 6095} {"train_loss": -27.362939834594727, "global_step": 505890, "epoch": 6095} {"train_loss": -27.228483200073242, "global_step": 505891, "epoch": 6095} {"train_loss": -27.00494384765625, "global_step": 505892, "epoch": 6095} {"train_loss": -27.626562118530273, "global_step": 505893, "epoch": 6095} {"train_loss": -27.302682876586914, "global_step": 505894, "epoch": 6095} {"train_loss": -26.96809196472168, "global_step": 505895, "epoch": 6095} {"train_loss": -27.529767990112305, "global_step": 505896, "epoch": 6095} {"train_loss": -27.030969619750977, "global_step": 505897, "epoch": 6095} {"train_loss": -26.94228172302246, "global_step": 505898, "epoch": 6095} {"train_loss": -27.58096694946289, "global_step": 505899, "epoch": 6095} {"train_loss": -27.366003036499023, "global_step": 505900, "epoch": 6095} {"train_loss": -27.6623592376709, "global_step": 505901, "epoch": 6095} {"train_loss": -27.819183349609375, "global_step": 505902, "epoch": 6095} {"train_loss": -27.083784103393555, "global_step": 505903, "epoch": 6095} {"train_loss": -27.282550811767578, "global_step": 505904, "epoch": 6095} {"train_loss": -27.55898094177246, "global_step": 505905, "epoch": 6095} {"train_loss": -27.300827026367188, "global_step": 505906, "epoch": 6095} {"train_loss": -27.36979103088379, "global_step": 505907, "epoch": 6095} {"train_loss": -27.699987411499023, "global_step": 505908, "epoch": 6095} {"train_loss": -27.676191329956055, "global_step": 505909, "epoch": 6095} {"train_loss": -27.600309371948242, "global_step": 505910, "epoch": 6095} {"train_loss": -27.24818229675293, "global_step": 505911, "epoch": 6095} {"train_loss": -27.97224998474121, "global_step": 505912, "epoch": 6095} {"train_loss": -27.66739273071289, "global_step": 505913, "epoch": 6095} {"train_loss": -27.582265853881836, "global_step": 505914, "epoch": 6095} {"train_loss": -27.634937286376953, "global_step": 505915, "epoch": 6095} {"train_loss": -27.93940544128418, "global_step": 505916, "epoch": 6095} {"train_loss": -28.04188346862793, "global_step": 505917, "epoch": 6095} {"train_loss": -27.681171417236328, "global_step": 505918, "epoch": 6095} {"train_loss": -27.5135440826416, "global_step": 505919, "epoch": 6095} {"train_loss": -27.580408096313477, "global_step": 505920, "epoch": 6095} {"train_loss": -27.314453125, "global_step": 505921, "epoch": 6095} {"train_loss": -27.575794219970703, "global_step": 505922, "epoch": 6095} {"train_loss": -27.42889404296875, "global_step": 505923, "epoch": 6095} {"train_loss": -27.967697143554688, "global_step": 505924, "epoch": 6095} {"train_loss": -27.467798233032227, "global_step": 505925, "epoch": 6095} {"train_loss": -27.507230758666992, "global_step": 505926, "epoch": 6095} {"train_loss": -27.649829864501953, "global_step": 505927, "epoch": 6095} {"train_loss": -27.511459350585938, "global_step": 505928, "epoch": 6095} {"train_loss": -27.159509658813477, "global_step": 505929, "epoch": 6095} {"train_loss": -27.2572078704834, "global_step": 505930, "epoch": 6095} {"train_loss": -26.960906982421875, "global_step": 505931, "epoch": 6095} {"train_loss": -27.625324249267578, "global_step": 505932, "epoch": 6095} {"train_loss": -27.651111602783203, "global_step": 505933, "epoch": 6095} {"train_loss": -27.448652267456055, "global_step": 505934, "epoch": 6095} {"train_loss": -27.793302536010742, "global_step": 505935, "epoch": 6095} {"train_loss": -27.372156143188477, "global_step": 505936, "epoch": 6095} {"train_loss": -27.567035675048828, "global_step": 505937, "epoch": 6095} {"train_loss": -27.69080924987793, "global_step": 505938, "epoch": 6095} {"train_loss": -27.19768714904785, "global_step": 505939, "epoch": 6095} {"train_loss": -27.332250595092773, "global_step": 505940, "epoch": 6095} {"train_loss": -27.2435302734375, "global_step": 505941, "epoch": 6095} {"train_loss": -27.33492088317871, "global_step": 505942, "epoch": 6095} {"train_loss": -27.53378677368164, "global_step": 505943, "epoch": 6095} {"train_loss": -27.382429122924805, "global_step": 505944, "epoch": 6095} {"train_loss": -27.43887710571289, "global_step": 505945, "epoch": 6095} {"train_loss": -27.35377311706543, "global_step": 505946, "epoch": 6095} {"train_loss": -27.677749633789062, "global_step": 505947, "epoch": 6095} {"train_loss": -27.373205184936523, "global_step": 505948, "epoch": 6095} {"train_loss": -27.3983097076416, "global_step": 505949, "epoch": 6095} {"train_loss": -27.651647567749023, "global_step": 505950, "epoch": 6095} {"train_loss": -27.61634635925293, "global_step": 505951, "epoch": 6095} {"train_loss": -27.42664909362793, "global_step": 505952, "epoch": 6095} {"train_loss": -26.93268394470215, "global_step": 505953, "epoch": 6095} {"train_loss": -26.948352813720703, "global_step": 505954, "epoch": 6095} {"train_loss": -27.3402099609375, "global_step": 505955, "epoch": 6095} {"train_loss": -26.848480224609375, "global_step": 505956, "epoch": 6095} {"train_loss": -27.291854858398438, "global_step": 505957, "epoch": 6095} {"train_loss": -27.490827560424805, "global_step": 505958, "epoch": 6095} {"train_loss": -26.95452308654785, "global_step": 505959, "epoch": 6095} {"train_loss": -27.242374420166016, "global_step": 505960, "epoch": 6095} {"train_loss": -26.95206069946289, "global_step": 505961, "epoch": 6095} {"train_loss": -27.015201568603516, "global_step": 505962, "epoch": 6095} {"train_loss": -27.554529190063477, "global_step": 505963, "epoch": 6095} {"train_loss": -27.301782608032227, "global_step": 505964, "epoch": 6095} {"train_loss": -27.5754337310791, "global_step": 505965, "epoch": 6095} {"train_loss": -27.532623291015625, "global_step": 505966, "epoch": 6095} {"train_loss": -27.39305689248694, "global_step": 505967, "epoch": 6095, "val_loss": 6450122.0} {"train_loss": -27.2059383392334, "global_step": 505968, "epoch": 6096} {"train_loss": -27.239410400390625, "global_step": 505969, "epoch": 6096} {"train_loss": -27.3503360748291, "global_step": 505970, "epoch": 6096} {"train_loss": -27.365747451782227, "global_step": 505971, "epoch": 6096} {"train_loss": -26.857105255126953, "global_step": 505972, "epoch": 6096} {"train_loss": -27.19833755493164, "global_step": 505973, "epoch": 6096} {"train_loss": -26.8512020111084, "global_step": 505974, "epoch": 6096} {"train_loss": -27.225011825561523, "global_step": 505975, "epoch": 6096} {"train_loss": -26.984237670898438, "global_step": 505976, "epoch": 6096} {"train_loss": -27.618412017822266, "global_step": 505977, "epoch": 6096} {"train_loss": -27.08747673034668, "global_step": 505978, "epoch": 6096} {"train_loss": -26.96063804626465, "global_step": 505979, "epoch": 6096} {"train_loss": -27.51630210876465, "global_step": 505980, "epoch": 6096} {"train_loss": -27.115854263305664, "global_step": 505981, "epoch": 6096} {"train_loss": -27.35736083984375, "global_step": 505982, "epoch": 6096} {"train_loss": -27.152124404907227, "global_step": 505983, "epoch": 6096} {"train_loss": -27.08608055114746, "global_step": 505984, "epoch": 6096} {"train_loss": -27.460371017456055, "global_step": 505985, "epoch": 6096} {"train_loss": -27.27533531188965, "global_step": 505986, "epoch": 6096} {"train_loss": -27.365402221679688, "global_step": 505987, "epoch": 6096} {"train_loss": -27.372785568237305, "global_step": 505988, "epoch": 6096} {"train_loss": -27.675968170166016, "global_step": 505989, "epoch": 6096} {"train_loss": -27.59002113342285, "global_step": 505990, "epoch": 6096} {"train_loss": -27.413000106811523, "global_step": 505991, "epoch": 6096} {"train_loss": -27.65400505065918, "global_step": 505992, "epoch": 6096} {"train_loss": -27.31966209411621, "global_step": 505993, "epoch": 6096} {"train_loss": -27.329008102416992, "global_step": 505994, "epoch": 6096} {"train_loss": -27.462499618530273, "global_step": 505995, "epoch": 6096} {"train_loss": -27.75764274597168, "global_step": 505996, "epoch": 6096} {"train_loss": -27.83246421813965, "global_step": 505997, "epoch": 6096} {"train_loss": -27.255170822143555, "global_step": 505998, "epoch": 6096} {"train_loss": -27.529022216796875, "global_step": 505999, "epoch": 6096} {"train_loss": -27.662830352783203, "global_step": 506000, "epoch": 6096} {"train_loss": -27.549535751342773, "global_step": 506001, "epoch": 6096} {"train_loss": -27.348058700561523, "global_step": 506002, "epoch": 6096} {"train_loss": -27.96717643737793, "global_step": 506003, "epoch": 6096} {"train_loss": -27.444660186767578, "global_step": 506004, "epoch": 6096} {"train_loss": -27.7182559967041, "global_step": 506005, "epoch": 6096} {"train_loss": -27.3083553314209, "global_step": 506006, "epoch": 6096} {"train_loss": -27.929224014282227, "global_step": 506007, "epoch": 6096} {"train_loss": -27.55254554748535, "global_step": 506008, "epoch": 6096} {"train_loss": -27.405771255493164, "global_step": 506009, "epoch": 6096} {"train_loss": -27.488784790039062, "global_step": 506010, "epoch": 6096} {"train_loss": -27.274084091186523, "global_step": 506011, "epoch": 6096} {"train_loss": -27.800756454467773, "global_step": 506012, "epoch": 6096} {"train_loss": -27.638782501220703, "global_step": 506013, "epoch": 6096} {"train_loss": -27.57538414001465, "global_step": 506014, "epoch": 6096} {"train_loss": -27.197912216186523, "global_step": 506015, "epoch": 6096} {"train_loss": -26.97597312927246, "global_step": 506016, "epoch": 6096} {"train_loss": -27.597583770751953, "global_step": 506017, "epoch": 6096} {"train_loss": -27.33710289001465, "global_step": 506018, "epoch": 6096} {"train_loss": -27.51690673828125, "global_step": 506019, "epoch": 6096} {"train_loss": -27.620344161987305, "global_step": 506020, "epoch": 6096} {"train_loss": -27.625629425048828, "global_step": 506021, "epoch": 6096} {"train_loss": -27.4774227142334, "global_step": 506022, "epoch": 6096} {"train_loss": -27.31376075744629, "global_step": 506023, "epoch": 6096} {"train_loss": -27.58426856994629, "global_step": 506024, "epoch": 6096} {"train_loss": -27.262313842773438, "global_step": 506025, "epoch": 6096} {"train_loss": -27.7010498046875, "global_step": 506026, "epoch": 6096} {"train_loss": -27.659589767456055, "global_step": 506027, "epoch": 6096} {"train_loss": -27.426939010620117, "global_step": 506028, "epoch": 6096} {"train_loss": -27.30720329284668, "global_step": 506029, "epoch": 6096} {"train_loss": -27.420673370361328, "global_step": 506030, "epoch": 6096} {"train_loss": -27.474475860595703, "global_step": 506031, "epoch": 6096} {"train_loss": -27.23894691467285, "global_step": 506032, "epoch": 6096} {"train_loss": -27.598417282104492, "global_step": 506033, "epoch": 6096} {"train_loss": -27.22177505493164, "global_step": 506034, "epoch": 6096} {"train_loss": -27.16922950744629, "global_step": 506035, "epoch": 6096} {"train_loss": -27.578800201416016, "global_step": 506036, "epoch": 6096} {"train_loss": -27.353368759155273, "global_step": 506037, "epoch": 6096} {"train_loss": -27.21869468688965, "global_step": 506038, "epoch": 6096} {"train_loss": -27.404541015625, "global_step": 506039, "epoch": 6096} {"train_loss": -27.18827247619629, "global_step": 506040, "epoch": 6096} {"train_loss": -27.45252799987793, "global_step": 506041, "epoch": 6096} {"train_loss": -27.55694580078125, "global_step": 506042, "epoch": 6096} {"train_loss": -27.285720825195312, "global_step": 506043, "epoch": 6096} {"train_loss": -27.2169246673584, "global_step": 506044, "epoch": 6096} {"train_loss": -27.68012046813965, "global_step": 506045, "epoch": 6096} {"train_loss": -27.971115112304688, "global_step": 506046, "epoch": 6096} {"train_loss": -27.365583419799805, "global_step": 506047, "epoch": 6096} {"train_loss": -27.63134765625, "global_step": 506048, "epoch": 6096} {"train_loss": -27.173871994018555, "global_step": 506049, "epoch": 6096} {"train_loss": -27.415235197687725, "global_step": 506050, "epoch": 6096, "val_loss": 6580863.0} {"train_loss": -26.256635665893555, "global_step": 506051, "epoch": 6097} {"train_loss": -25.98602867126465, "global_step": 506052, "epoch": 6097} {"train_loss": -26.68324089050293, "global_step": 506053, "epoch": 6097} {"train_loss": -26.600122451782227, "global_step": 506054, "epoch": 6097} {"train_loss": -26.883167266845703, "global_step": 506055, "epoch": 6097} {"train_loss": -26.601078033447266, "global_step": 506056, "epoch": 6097} {"train_loss": -26.818334579467773, "global_step": 506057, "epoch": 6097} {"train_loss": -26.8829402923584, "global_step": 506058, "epoch": 6097} {"train_loss": -26.69944190979004, "global_step": 506059, "epoch": 6097} {"train_loss": -26.926300048828125, "global_step": 506060, "epoch": 6097} {"train_loss": -26.74198341369629, "global_step": 506061, "epoch": 6097} {"train_loss": -27.147247314453125, "global_step": 506062, "epoch": 6097} {"train_loss": -27.162057876586914, "global_step": 506063, "epoch": 6097} {"train_loss": -27.08045768737793, "global_step": 506064, "epoch": 6097} {"train_loss": -27.163227081298828, "global_step": 506065, "epoch": 6097} {"train_loss": -27.0678768157959, "global_step": 506066, "epoch": 6097} {"train_loss": -27.160009384155273, "global_step": 506067, "epoch": 6097} {"train_loss": -27.483179092407227, "global_step": 506068, "epoch": 6097} {"train_loss": -27.48072624206543, "global_step": 506069, "epoch": 6097} {"train_loss": -27.290363311767578, "global_step": 506070, "epoch": 6097} {"train_loss": -27.2935791015625, "global_step": 506071, "epoch": 6097} {"train_loss": -27.42498779296875, "global_step": 506072, "epoch": 6097} {"train_loss": -27.52021598815918, "global_step": 506073, "epoch": 6097} {"train_loss": -27.503049850463867, "global_step": 506074, "epoch": 6097} {"train_loss": -27.26478385925293, "global_step": 506075, "epoch": 6097} {"train_loss": -27.5402774810791, "global_step": 506076, "epoch": 6097} {"train_loss": -27.36285972595215, "global_step": 506077, "epoch": 6097} {"train_loss": -27.428442001342773, "global_step": 506078, "epoch": 6097} {"train_loss": -27.24751091003418, "global_step": 506079, "epoch": 6097} {"train_loss": -27.198535919189453, "global_step": 506080, "epoch": 6097} {"train_loss": -27.38248062133789, "global_step": 506081, "epoch": 6097} {"train_loss": -27.321802139282227, "global_step": 506082, "epoch": 6097} {"train_loss": -27.28254508972168, "global_step": 506083, "epoch": 6097} {"train_loss": -27.746816635131836, "global_step": 506084, "epoch": 6097} {"train_loss": -27.5584774017334, "global_step": 506085, "epoch": 6097} {"train_loss": -27.449466705322266, "global_step": 506086, "epoch": 6097} {"train_loss": -27.564422607421875, "global_step": 506087, "epoch": 6097} {"train_loss": -27.732934951782227, "global_step": 506088, "epoch": 6097} {"train_loss": -27.326696395874023, "global_step": 506089, "epoch": 6097} {"train_loss": -27.619443893432617, "global_step": 506090, "epoch": 6097} {"train_loss": -27.43879508972168, "global_step": 506091, "epoch": 6097} {"train_loss": -27.22136878967285, "global_step": 506092, "epoch": 6097} {"train_loss": -27.599271774291992, "global_step": 506093, "epoch": 6097} {"train_loss": -27.480772018432617, "global_step": 506094, "epoch": 6097} {"train_loss": -27.313928604125977, "global_step": 506095, "epoch": 6097} {"train_loss": -27.196557998657227, "global_step": 506096, "epoch": 6097} {"train_loss": -27.352880477905273, "global_step": 506097, "epoch": 6097} {"train_loss": -27.307910919189453, "global_step": 506098, "epoch": 6097} {"train_loss": -27.35849952697754, "global_step": 506099, "epoch": 6097} {"train_loss": -27.23349380493164, "global_step": 506100, "epoch": 6097} {"train_loss": -27.313827514648438, "global_step": 506101, "epoch": 6097} {"train_loss": -27.463891983032227, "global_step": 506102, "epoch": 6097} {"train_loss": -27.511844635009766, "global_step": 506103, "epoch": 6097} {"train_loss": -27.4580135345459, "global_step": 506104, "epoch": 6097} {"train_loss": -27.28577995300293, "global_step": 506105, "epoch": 6097} {"train_loss": -27.83355140686035, "global_step": 506106, "epoch": 6097} {"train_loss": -26.887298583984375, "global_step": 506107, "epoch": 6097} {"train_loss": -27.53315544128418, "global_step": 506108, "epoch": 6097} {"train_loss": -27.433393478393555, "global_step": 506109, "epoch": 6097} {"train_loss": -27.09857177734375, "global_step": 506110, "epoch": 6097} {"train_loss": -27.490604400634766, "global_step": 506111, "epoch": 6097} {"train_loss": -27.42954444885254, "global_step": 506112, "epoch": 6097} {"train_loss": -27.3262996673584, "global_step": 506113, "epoch": 6097} {"train_loss": -27.2960147857666, "global_step": 506114, "epoch": 6097} {"train_loss": -27.510351181030273, "global_step": 506115, "epoch": 6097} {"train_loss": -27.27303123474121, "global_step": 506116, "epoch": 6097} {"train_loss": -27.268096923828125, "global_step": 506117, "epoch": 6097} {"train_loss": -27.72684669494629, "global_step": 506118, "epoch": 6097} {"train_loss": -27.297521591186523, "global_step": 506119, "epoch": 6097} {"train_loss": -27.289020538330078, "global_step": 506120, "epoch": 6097} {"train_loss": -27.06528091430664, "global_step": 506121, "epoch": 6097} {"train_loss": -27.416091918945312, "global_step": 506122, "epoch": 6097} {"train_loss": -27.541431427001953, "global_step": 506123, "epoch": 6097} {"train_loss": -27.551130294799805, "global_step": 506124, "epoch": 6097} {"train_loss": -27.514301300048828, "global_step": 506125, "epoch": 6097} {"train_loss": -27.761337280273438, "global_step": 506126, "epoch": 6097} {"train_loss": -27.424726486206055, "global_step": 506127, "epoch": 6097} {"train_loss": -27.58551597595215, "global_step": 506128, "epoch": 6097} {"train_loss": -27.522825241088867, "global_step": 506129, "epoch": 6097} {"train_loss": -27.4906005859375, "global_step": 506130, "epoch": 6097} {"train_loss": -27.663318634033203, "global_step": 506131, "epoch": 6097} {"train_loss": -27.305822372436523, "global_step": 506132, "epoch": 6097} {"train_loss": -27.30486957136407, "global_step": 506133, "epoch": 6097, "val_loss": 6555888.0} {"train_loss": -26.941625595092773, "global_step": 506134, "epoch": 6098} {"train_loss": -26.9638614654541, "global_step": 506135, "epoch": 6098} {"train_loss": -26.935338973999023, "global_step": 506136, "epoch": 6098} {"train_loss": -26.627588272094727, "global_step": 506137, "epoch": 6098} {"train_loss": -27.026514053344727, "global_step": 506138, "epoch": 6098} {"train_loss": -27.466333389282227, "global_step": 506139, "epoch": 6098} {"train_loss": -27.136856079101562, "global_step": 506140, "epoch": 6098} {"train_loss": -27.05708122253418, "global_step": 506141, "epoch": 6098} {"train_loss": -27.06939125061035, "global_step": 506142, "epoch": 6098} {"train_loss": -27.422809600830078, "global_step": 506143, "epoch": 6098} {"train_loss": -27.33770179748535, "global_step": 506144, "epoch": 6098} {"train_loss": -27.256994247436523, "global_step": 506145, "epoch": 6098} {"train_loss": -27.32093620300293, "global_step": 506146, "epoch": 6098} {"train_loss": -27.0689754486084, "global_step": 506147, "epoch": 6098} {"train_loss": -27.286819458007812, "global_step": 506148, "epoch": 6098} {"train_loss": -27.229116439819336, "global_step": 506149, "epoch": 6098} {"train_loss": -27.36117935180664, "global_step": 506150, "epoch": 6098} {"train_loss": -27.733539581298828, "global_step": 506151, "epoch": 6098} {"train_loss": -26.983856201171875, "global_step": 506152, "epoch": 6098} {"train_loss": -27.247894287109375, "global_step": 506153, "epoch": 6098} {"train_loss": -26.987756729125977, "global_step": 506154, "epoch": 6098} {"train_loss": -27.1842098236084, "global_step": 506155, "epoch": 6098} {"train_loss": -27.509485244750977, "global_step": 506156, "epoch": 6098} {"train_loss": -27.23166275024414, "global_step": 506157, "epoch": 6098} {"train_loss": -26.93657875061035, "global_step": 506158, "epoch": 6098} {"train_loss": -27.1428279876709, "global_step": 506159, "epoch": 6098} {"train_loss": -27.32016372680664, "global_step": 506160, "epoch": 6098} {"train_loss": -27.33785057067871, "global_step": 506161, "epoch": 6098} {"train_loss": -27.54389762878418, "global_step": 506162, "epoch": 6098} {"train_loss": -27.510831832885742, "global_step": 506163, "epoch": 6098} {"train_loss": -27.562177658081055, "global_step": 506164, "epoch": 6098} {"train_loss": -27.2738094329834, "global_step": 506165, "epoch": 6098} {"train_loss": -27.33698081970215, "global_step": 506166, "epoch": 6098} {"train_loss": -27.49295425415039, "global_step": 506167, "epoch": 6098} {"train_loss": -27.386144638061523, "global_step": 506168, "epoch": 6098} {"train_loss": -27.354455947875977, "global_step": 506169, "epoch": 6098} {"train_loss": -27.385099411010742, "global_step": 506170, "epoch": 6098} {"train_loss": -27.204730987548828, "global_step": 506171, "epoch": 6098} {"train_loss": -27.23846435546875, "global_step": 506172, "epoch": 6098} {"train_loss": -26.94287109375, "global_step": 506173, "epoch": 6098} {"train_loss": -27.801721572875977, "global_step": 506174, "epoch": 6098} {"train_loss": -27.444738388061523, "global_step": 506175, "epoch": 6098} {"train_loss": -27.3640079498291, "global_step": 506176, "epoch": 6098} {"train_loss": -27.554046630859375, "global_step": 506177, "epoch": 6098} {"train_loss": -27.626739501953125, "global_step": 506178, "epoch": 6098} {"train_loss": -27.210006713867188, "global_step": 506179, "epoch": 6098} {"train_loss": -27.19950294494629, "global_step": 506180, "epoch": 6098} {"train_loss": -27.44415855407715, "global_step": 506181, "epoch": 6098} {"train_loss": -27.408823013305664, "global_step": 506182, "epoch": 6098} {"train_loss": -27.525257110595703, "global_step": 506183, "epoch": 6098} {"train_loss": -27.803876876831055, "global_step": 506184, "epoch": 6098} {"train_loss": -27.755197525024414, "global_step": 506185, "epoch": 6098} {"train_loss": -27.392553329467773, "global_step": 506186, "epoch": 6098} {"train_loss": -27.418304443359375, "global_step": 506187, "epoch": 6098} {"train_loss": -27.366342544555664, "global_step": 506188, "epoch": 6098} {"train_loss": -27.518850326538086, "global_step": 506189, "epoch": 6098} {"train_loss": -27.82400894165039, "global_step": 506190, "epoch": 6098} {"train_loss": -27.6821346282959, "global_step": 506191, "epoch": 6098} {"train_loss": -27.26295280456543, "global_step": 506192, "epoch": 6098} {"train_loss": -26.976993560791016, "global_step": 506193, "epoch": 6098} {"train_loss": -27.424650192260742, "global_step": 506194, "epoch": 6098} {"train_loss": -27.31048011779785, "global_step": 506195, "epoch": 6098} {"train_loss": -27.561767578125, "global_step": 506196, "epoch": 6098} {"train_loss": -27.51938819885254, "global_step": 506197, "epoch": 6098} {"train_loss": -27.193140029907227, "global_step": 506198, "epoch": 6098} {"train_loss": -26.97018814086914, "global_step": 506199, "epoch": 6098} {"train_loss": -27.267927169799805, "global_step": 506200, "epoch": 6098} {"train_loss": -27.54559326171875, "global_step": 506201, "epoch": 6098} {"train_loss": -27.7054443359375, "global_step": 506202, "epoch": 6098} {"train_loss": -27.41334342956543, "global_step": 506203, "epoch": 6098} {"train_loss": -26.78011131286621, "global_step": 506204, "epoch": 6098} {"train_loss": -26.589658737182617, "global_step": 506205, "epoch": 6098} {"train_loss": -27.475814819335938, "global_step": 506206, "epoch": 6098} {"train_loss": -27.31978416442871, "global_step": 506207, "epoch": 6098} {"train_loss": -27.122913360595703, "global_step": 506208, "epoch": 6098} {"train_loss": -27.167987823486328, "global_step": 506209, "epoch": 6098} {"train_loss": -27.55232048034668, "global_step": 506210, "epoch": 6098} {"train_loss": -27.310850143432617, "global_step": 506211, "epoch": 6098} {"train_loss": -27.231964111328125, "global_step": 506212, "epoch": 6098} {"train_loss": -27.173452377319336, "global_step": 506213, "epoch": 6098} {"train_loss": -27.545745849609375, "global_step": 506214, "epoch": 6098} {"train_loss": -27.317686080932617, "global_step": 506215, "epoch": 6098} {"train_loss": -27.306044681962714, "global_step": 506216, "epoch": 6098, "val_loss": 6523763.5} {"train_loss": -27.2998046875, "global_step": 506217, "epoch": 6099} {"train_loss": -27.17363929748535, "global_step": 506218, "epoch": 6099} {"train_loss": -26.77294921875, "global_step": 506219, "epoch": 6099} {"train_loss": -26.814502716064453, "global_step": 506220, "epoch": 6099} {"train_loss": -27.194000244140625, "global_step": 506221, "epoch": 6099} {"train_loss": -27.127262115478516, "global_step": 506222, "epoch": 6099} {"train_loss": -27.075902938842773, "global_step": 506223, "epoch": 6099} {"train_loss": -27.056884765625, "global_step": 506224, "epoch": 6099} {"train_loss": -27.541370391845703, "global_step": 506225, "epoch": 6099} {"train_loss": -27.326461791992188, "global_step": 506226, "epoch": 6099} {"train_loss": -27.260868072509766, "global_step": 506227, "epoch": 6099} {"train_loss": -27.287458419799805, "global_step": 506228, "epoch": 6099} {"train_loss": -26.998615264892578, "global_step": 506229, "epoch": 6099} {"train_loss": -27.358346939086914, "global_step": 506230, "epoch": 6099} {"train_loss": -27.30238151550293, "global_step": 506231, "epoch": 6099} {"train_loss": -27.61065101623535, "global_step": 506232, "epoch": 6099} {"train_loss": -27.45108413696289, "global_step": 506233, "epoch": 6099} {"train_loss": -27.551746368408203, "global_step": 506234, "epoch": 6099} {"train_loss": -27.29706382751465, "global_step": 506235, "epoch": 6099} {"train_loss": -27.408985137939453, "global_step": 506236, "epoch": 6099} {"train_loss": -27.454771041870117, "global_step": 506237, "epoch": 6099} {"train_loss": -27.405202865600586, "global_step": 506238, "epoch": 6099} {"train_loss": -26.97590446472168, "global_step": 506239, "epoch": 6099} {"train_loss": -26.983694076538086, "global_step": 506240, "epoch": 6099} {"train_loss": -27.427839279174805, "global_step": 506241, "epoch": 6099} {"train_loss": -27.84767723083496, "global_step": 506242, "epoch": 6099} {"train_loss": -27.646392822265625, "global_step": 506243, "epoch": 6099} {"train_loss": -27.728437423706055, "global_step": 506244, "epoch": 6099} {"train_loss": -27.61834716796875, "global_step": 506245, "epoch": 6099} {"train_loss": -27.523717880249023, "global_step": 506246, "epoch": 6099} {"train_loss": -27.553913116455078, "global_step": 506247, "epoch": 6099} {"train_loss": -27.31964111328125, "global_step": 506248, "epoch": 6099} {"train_loss": -27.310510635375977, "global_step": 506249, "epoch": 6099} {"train_loss": -27.494604110717773, "global_step": 506250, "epoch": 6099} {"train_loss": -27.528491973876953, "global_step": 506251, "epoch": 6099} {"train_loss": -27.283796310424805, "global_step": 506252, "epoch": 6099} {"train_loss": -27.6751766204834, "global_step": 506253, "epoch": 6099} {"train_loss": -27.22547721862793, "global_step": 506254, "epoch": 6099} {"train_loss": -27.73811149597168, "global_step": 506255, "epoch": 6099} {"train_loss": -27.614246368408203, "global_step": 506256, "epoch": 6099} {"train_loss": -27.860675811767578, "global_step": 506257, "epoch": 6099} {"train_loss": -27.36795997619629, "global_step": 506258, "epoch": 6099} {"train_loss": -27.900983810424805, "global_step": 506259, "epoch": 6099} {"train_loss": -27.31959342956543, "global_step": 506260, "epoch": 6099} {"train_loss": -27.14600944519043, "global_step": 506261, "epoch": 6099} {"train_loss": -27.213544845581055, "global_step": 506262, "epoch": 6099} {"train_loss": -27.554370880126953, "global_step": 506263, "epoch": 6099} {"train_loss": -27.812108993530273, "global_step": 506264, "epoch": 6099} {"train_loss": -27.33280372619629, "global_step": 506265, "epoch": 6099} {"train_loss": -27.088830947875977, "global_step": 506266, "epoch": 6099} {"train_loss": -27.010400772094727, "global_step": 506267, "epoch": 6099} {"train_loss": -26.882678985595703, "global_step": 506268, "epoch": 6099} {"train_loss": -26.69915199279785, "global_step": 506269, "epoch": 6099} {"train_loss": -27.378931045532227, "global_step": 506270, "epoch": 6099} {"train_loss": -27.685684204101562, "global_step": 506271, "epoch": 6099} {"train_loss": -27.2709903717041, "global_step": 506272, "epoch": 6099} {"train_loss": -27.438684463500977, "global_step": 506273, "epoch": 6099} {"train_loss": -27.415393829345703, "global_step": 506274, "epoch": 6099} {"train_loss": -27.66355323791504, "global_step": 506275, "epoch": 6099} {"train_loss": -27.22920036315918, "global_step": 506276, "epoch": 6099} {"train_loss": -27.351165771484375, "global_step": 506277, "epoch": 6099} {"train_loss": -27.3953914642334, "global_step": 506278, "epoch": 6099} {"train_loss": -27.23701286315918, "global_step": 506279, "epoch": 6099} {"train_loss": -27.857877731323242, "global_step": 506280, "epoch": 6099} {"train_loss": -27.435409545898438, "global_step": 506281, "epoch": 6099} {"train_loss": -27.612451553344727, "global_step": 506282, "epoch": 6099} {"train_loss": -27.43341636657715, "global_step": 506283, "epoch": 6099} {"train_loss": -27.623647689819336, "global_step": 506284, "epoch": 6099} {"train_loss": -27.308990478515625, "global_step": 506285, "epoch": 6099} {"train_loss": -27.635461807250977, "global_step": 506286, "epoch": 6099} {"train_loss": -27.567733764648438, "global_step": 506287, "epoch": 6099} {"train_loss": -27.451135635375977, "global_step": 506288, "epoch": 6099} {"train_loss": -27.536706924438477, "global_step": 506289, "epoch": 6099} {"train_loss": -27.41840934753418, "global_step": 506290, "epoch": 6099} {"train_loss": -27.5132999420166, "global_step": 506291, "epoch": 6099} {"train_loss": -27.32562255859375, "global_step": 506292, "epoch": 6099} {"train_loss": -27.397119522094727, "global_step": 506293, "epoch": 6099} {"train_loss": -27.078760147094727, "global_step": 506294, "epoch": 6099} {"train_loss": -27.547565460205078, "global_step": 506295, "epoch": 6099} {"train_loss": -27.25506591796875, "global_step": 506296, "epoch": 6099} {"train_loss": -27.177722930908203, "global_step": 506297, "epoch": 6099} {"train_loss": -27.416318893432617, "global_step": 506298, "epoch": 6099} {"train_loss": -27.379685987909156, "global_step": 506299, "epoch": 6099, "val_loss": 6554127.0} {"train_loss": -26.824542999267578, "global_step": 506300, "epoch": 6100} {"train_loss": -26.171600341796875, "global_step": 506301, "epoch": 6100} {"train_loss": -27.019866943359375, "global_step": 506302, "epoch": 6100} {"train_loss": -26.810901641845703, "global_step": 506303, "epoch": 6100} {"train_loss": -26.364896774291992, "global_step": 506304, "epoch": 6100} {"train_loss": -26.932889938354492, "global_step": 506305, "epoch": 6100} {"train_loss": -26.92254066467285, "global_step": 506306, "epoch": 6100} {"train_loss": -26.974319458007812, "global_step": 506307, "epoch": 6100} {"train_loss": -26.91803550720215, "global_step": 506308, "epoch": 6100} {"train_loss": -27.06781578063965, "global_step": 506309, "epoch": 6100} {"train_loss": -26.999853134155273, "global_step": 506310, "epoch": 6100} {"train_loss": -26.84323501586914, "global_step": 506311, "epoch": 6100} {"train_loss": -26.760953903198242, "global_step": 506312, "epoch": 6100} {"train_loss": -26.4254093170166, "global_step": 506313, "epoch": 6100} {"train_loss": -27.1684627532959, "global_step": 506314, "epoch": 6100} {"train_loss": -26.92603874206543, "global_step": 506315, "epoch": 6100} {"train_loss": -26.99983024597168, "global_step": 506316, "epoch": 6100} {"train_loss": -26.97236442565918, "global_step": 506317, "epoch": 6100} {"train_loss": -26.648000717163086, "global_step": 506318, "epoch": 6100} {"train_loss": -26.819061279296875, "global_step": 506319, "epoch": 6100} {"train_loss": -26.94426918029785, "global_step": 506320, "epoch": 6100} {"train_loss": -27.439407348632812, "global_step": 506321, "epoch": 6100} {"train_loss": -27.195026397705078, "global_step": 506322, "epoch": 6100} {"train_loss": -27.161828994750977, "global_step": 506323, "epoch": 6100} {"train_loss": -27.099365234375, "global_step": 506324, "epoch": 6100} {"train_loss": -27.092086791992188, "global_step": 506325, "epoch": 6100} {"train_loss": -27.230310440063477, "global_step": 506326, "epoch": 6100} {"train_loss": -27.10841178894043, "global_step": 506327, "epoch": 6100} {"train_loss": -27.36568260192871, "global_step": 506328, "epoch": 6100} {"train_loss": -27.30194091796875, "global_step": 506329, "epoch": 6100} {"train_loss": -27.600976943969727, "global_step": 506330, "epoch": 6100} {"train_loss": -27.5166072845459, "global_step": 506331, "epoch": 6100} {"train_loss": -27.396032333374023, "global_step": 506332, "epoch": 6100} {"train_loss": -27.4482421875, "global_step": 506333, "epoch": 6100} {"train_loss": -27.274030685424805, "global_step": 506334, "epoch": 6100} {"train_loss": -27.456655502319336, "global_step": 506335, "epoch": 6100} {"train_loss": -27.5590877532959, "global_step": 506336, "epoch": 6100} {"train_loss": -27.44167137145996, "global_step": 506337, "epoch": 6100} {"train_loss": -27.557180404663086, "global_step": 506338, "epoch": 6100} {"train_loss": -27.518768310546875, "global_step": 506339, "epoch": 6100} {"train_loss": -27.696115493774414, "global_step": 506340, "epoch": 6100} {"train_loss": -27.513044357299805, "global_step": 506341, "epoch": 6100} {"train_loss": -27.36997413635254, "global_step": 506342, "epoch": 6100} {"train_loss": -27.68853187561035, "global_step": 506343, "epoch": 6100} {"train_loss": -27.42571449279785, "global_step": 506344, "epoch": 6100} {"train_loss": -27.350433349609375, "global_step": 506345, "epoch": 6100} {"train_loss": -27.609113693237305, "global_step": 506346, "epoch": 6100} {"train_loss": -27.584125518798828, "global_step": 506347, "epoch": 6100} {"train_loss": -27.735031127929688, "global_step": 506348, "epoch": 6100} {"train_loss": -27.685184478759766, "global_step": 506349, "epoch": 6100} {"train_loss": -27.729902267456055, "global_step": 506350, "epoch": 6100} {"train_loss": -27.503711700439453, "global_step": 506351, "epoch": 6100} {"train_loss": -27.747541427612305, "global_step": 506352, "epoch": 6100} {"train_loss": -27.41969871520996, "global_step": 506353, "epoch": 6100} {"train_loss": -27.39712905883789, "global_step": 506354, "epoch": 6100} {"train_loss": -27.898685455322266, "global_step": 506355, "epoch": 6100} {"train_loss": -27.330347061157227, "global_step": 506356, "epoch": 6100} {"train_loss": -27.24526023864746, "global_step": 506357, "epoch": 6100} {"train_loss": -26.7514591217041, "global_step": 506358, "epoch": 6100} {"train_loss": -26.788009643554688, "global_step": 506359, "epoch": 6100} {"train_loss": -27.109975814819336, "global_step": 506360, "epoch": 6100} {"train_loss": -27.313587188720703, "global_step": 506361, "epoch": 6100} {"train_loss": -27.389617919921875, "global_step": 506362, "epoch": 6100} {"train_loss": -27.267505645751953, "global_step": 506363, "epoch": 6100} {"train_loss": -27.241657257080078, "global_step": 506364, "epoch": 6100} {"train_loss": -27.272932052612305, "global_step": 506365, "epoch": 6100} {"train_loss": -27.927453994750977, "global_step": 506366, "epoch": 6100} {"train_loss": -27.45071792602539, "global_step": 506367, "epoch": 6100} {"train_loss": -27.40949821472168, "global_step": 506368, "epoch": 6100} {"train_loss": -26.767248153686523, "global_step": 506369, "epoch": 6100} {"train_loss": -26.990636825561523, "global_step": 506370, "epoch": 6100} {"train_loss": -27.41912841796875, "global_step": 506371, "epoch": 6100} {"train_loss": -27.092126846313477, "global_step": 506372, "epoch": 6100} {"train_loss": -26.752546310424805, "global_step": 506373, "epoch": 6100} {"train_loss": -26.959150314331055, "global_step": 506374, "epoch": 6100} {"train_loss": -27.01637077331543, "global_step": 506375, "epoch": 6100} {"train_loss": -27.796247482299805, "global_step": 506376, "epoch": 6100} {"train_loss": -27.1683349609375, "global_step": 506377, "epoch": 6100} {"train_loss": -26.899158477783203, "global_step": 506378, "epoch": 6100} {"train_loss": -26.857593536376953, "global_step": 506379, "epoch": 6100} {"train_loss": -27.35504722595215, "global_step": 506380, "epoch": 6100} {"train_loss": -27.318668365478516, "global_step": 506381, "epoch": 6100} {"train_loss": -27.222778642033955, "global_step": 506382, "epoch": 6100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6551024.0} {"train_loss": -26.962787628173828, "global_step": 506383, "epoch": 6101} {"train_loss": -26.647275924682617, "global_step": 506384, "epoch": 6101} {"train_loss": -26.979022979736328, "global_step": 506385, "epoch": 6101} {"train_loss": -27.152664184570312, "global_step": 506386, "epoch": 6101} {"train_loss": -26.967803955078125, "global_step": 506387, "epoch": 6101} {"train_loss": -27.22834587097168, "global_step": 506388, "epoch": 6101} {"train_loss": -26.611913681030273, "global_step": 506389, "epoch": 6101} {"train_loss": -27.112058639526367, "global_step": 506390, "epoch": 6101} {"train_loss": -27.090805053710938, "global_step": 506391, "epoch": 6101} {"train_loss": -26.95122718811035, "global_step": 506392, "epoch": 6101} {"train_loss": -27.455493927001953, "global_step": 506393, "epoch": 6101} {"train_loss": -26.934667587280273, "global_step": 506394, "epoch": 6101} {"train_loss": -27.303918838500977, "global_step": 506395, "epoch": 6101} {"train_loss": -27.114988327026367, "global_step": 506396, "epoch": 6101} {"train_loss": -27.208715438842773, "global_step": 506397, "epoch": 6101} {"train_loss": -27.01935386657715, "global_step": 506398, "epoch": 6101} {"train_loss": -27.4759464263916, "global_step": 506399, "epoch": 6101} {"train_loss": -27.692663192749023, "global_step": 506400, "epoch": 6101} {"train_loss": -27.389230728149414, "global_step": 506401, "epoch": 6101} {"train_loss": -27.164587020874023, "global_step": 506402, "epoch": 6101} {"train_loss": -27.426315307617188, "global_step": 506403, "epoch": 6101} {"train_loss": -27.559925079345703, "global_step": 506404, "epoch": 6101} {"train_loss": -27.465967178344727, "global_step": 506405, "epoch": 6101} {"train_loss": -27.54608154296875, "global_step": 506406, "epoch": 6101} {"train_loss": -27.302770614624023, "global_step": 506407, "epoch": 6101} {"train_loss": -27.534330368041992, "global_step": 506408, "epoch": 6101} {"train_loss": -27.612640380859375, "global_step": 506409, "epoch": 6101} {"train_loss": -27.753040313720703, "global_step": 506410, "epoch": 6101} {"train_loss": -27.526437759399414, "global_step": 506411, "epoch": 6101} {"train_loss": -27.09181785583496, "global_step": 506412, "epoch": 6101} {"train_loss": -27.59331703186035, "global_step": 506413, "epoch": 6101} {"train_loss": -27.611997604370117, "global_step": 506414, "epoch": 6101} {"train_loss": -27.382028579711914, "global_step": 506415, "epoch": 6101} {"train_loss": -27.44562339782715, "global_step": 506416, "epoch": 6101} {"train_loss": -27.3327693939209, "global_step": 506417, "epoch": 6101} {"train_loss": -27.481647491455078, "global_step": 506418, "epoch": 6101} {"train_loss": -27.9960994720459, "global_step": 506419, "epoch": 6101} {"train_loss": -27.356489181518555, "global_step": 506420, "epoch": 6101} {"train_loss": -27.639404296875, "global_step": 506421, "epoch": 6101} {"train_loss": -27.682077407836914, "global_step": 506422, "epoch": 6101} {"train_loss": -28.06513023376465, "global_step": 506423, "epoch": 6101} {"train_loss": -27.505258560180664, "global_step": 506424, "epoch": 6101} {"train_loss": -27.90756607055664, "global_step": 506425, "epoch": 6101} {"train_loss": -27.758214950561523, "global_step": 506426, "epoch": 6101} {"train_loss": -27.358688354492188, "global_step": 506427, "epoch": 6101} {"train_loss": -27.7352237701416, "global_step": 506428, "epoch": 6101} {"train_loss": -27.43562126159668, "global_step": 506429, "epoch": 6101} {"train_loss": -27.366363525390625, "global_step": 506430, "epoch": 6101} {"train_loss": -26.99106788635254, "global_step": 506431, "epoch": 6101} {"train_loss": -27.478656768798828, "global_step": 506432, "epoch": 6101} {"train_loss": -27.603796005249023, "global_step": 506433, "epoch": 6101} {"train_loss": -27.994375228881836, "global_step": 506434, "epoch": 6101} {"train_loss": -27.681970596313477, "global_step": 506435, "epoch": 6101} {"train_loss": -27.2180118560791, "global_step": 506436, "epoch": 6101} {"train_loss": -27.53651237487793, "global_step": 506437, "epoch": 6101} {"train_loss": -27.252201080322266, "global_step": 506438, "epoch": 6101} {"train_loss": -27.25760841369629, "global_step": 506439, "epoch": 6101} {"train_loss": -27.607839584350586, "global_step": 506440, "epoch": 6101} {"train_loss": -27.553564071655273, "global_step": 506441, "epoch": 6101} {"train_loss": -27.343664169311523, "global_step": 506442, "epoch": 6101} {"train_loss": -27.650999069213867, "global_step": 506443, "epoch": 6101} {"train_loss": -26.923654556274414, "global_step": 506444, "epoch": 6101} {"train_loss": -27.201658248901367, "global_step": 506445, "epoch": 6101} {"train_loss": -27.371871948242188, "global_step": 506446, "epoch": 6101} {"train_loss": -27.026342391967773, "global_step": 506447, "epoch": 6101} {"train_loss": -27.60028648376465, "global_step": 506448, "epoch": 6101} {"train_loss": -27.32781982421875, "global_step": 506449, "epoch": 6101} {"train_loss": -26.94097328186035, "global_step": 506450, "epoch": 6101} {"train_loss": -27.265857696533203, "global_step": 506451, "epoch": 6101} {"train_loss": -27.392486572265625, "global_step": 506452, "epoch": 6101} {"train_loss": -27.8306884765625, "global_step": 506453, "epoch": 6101} {"train_loss": -27.3509464263916, "global_step": 506454, "epoch": 6101} {"train_loss": -27.117828369140625, "global_step": 506455, "epoch": 6101} {"train_loss": -27.2568359375, "global_step": 506456, "epoch": 6101} {"train_loss": -27.298858642578125, "global_step": 506457, "epoch": 6101} {"train_loss": -27.300460815429688, "global_step": 506458, "epoch": 6101} {"train_loss": -27.53057289123535, "global_step": 506459, "epoch": 6101} {"train_loss": -27.274377822875977, "global_step": 506460, "epoch": 6101} {"train_loss": -27.476171493530273, "global_step": 506461, "epoch": 6101} {"train_loss": -27.502716064453125, "global_step": 506462, "epoch": 6101} {"train_loss": -27.590103149414062, "global_step": 506463, "epoch": 6101} {"train_loss": -27.294281005859375, "global_step": 506464, "epoch": 6101} {"train_loss": -27.360203088047992, "global_step": 506465, "epoch": 6101, "val_loss": 6517577.5} {"train_loss": -26.787649154663086, "global_step": 506466, "epoch": 6102} {"train_loss": -26.52739906311035, "global_step": 506467, "epoch": 6102} {"train_loss": -26.684707641601562, "global_step": 506468, "epoch": 6102} {"train_loss": -27.106664657592773, "global_step": 506469, "epoch": 6102} {"train_loss": -27.1898136138916, "global_step": 506470, "epoch": 6102} {"train_loss": -26.954059600830078, "global_step": 506471, "epoch": 6102} {"train_loss": -26.929309844970703, "global_step": 506472, "epoch": 6102} {"train_loss": -26.850080490112305, "global_step": 506473, "epoch": 6102} {"train_loss": -27.221698760986328, "global_step": 506474, "epoch": 6102} {"train_loss": -26.9442138671875, "global_step": 506475, "epoch": 6102} {"train_loss": -26.925683975219727, "global_step": 506476, "epoch": 6102} {"train_loss": -27.271686553955078, "global_step": 506477, "epoch": 6102} {"train_loss": -26.97913932800293, "global_step": 506478, "epoch": 6102} {"train_loss": -27.364755630493164, "global_step": 506479, "epoch": 6102} {"train_loss": -27.355112075805664, "global_step": 506480, "epoch": 6102} {"train_loss": -27.02705192565918, "global_step": 506481, "epoch": 6102} {"train_loss": -27.443359375, "global_step": 506482, "epoch": 6102} {"train_loss": -27.334232330322266, "global_step": 506483, "epoch": 6102} {"train_loss": -27.312376022338867, "global_step": 506484, "epoch": 6102} {"train_loss": -27.557514190673828, "global_step": 506485, "epoch": 6102} {"train_loss": -27.328344345092773, "global_step": 506486, "epoch": 6102} {"train_loss": -27.68988037109375, "global_step": 506487, "epoch": 6102} {"train_loss": -27.280548095703125, "global_step": 506488, "epoch": 6102} {"train_loss": -27.500244140625, "global_step": 506489, "epoch": 6102} {"train_loss": -27.7112979888916, "global_step": 506490, "epoch": 6102} {"train_loss": -27.080902099609375, "global_step": 506491, "epoch": 6102} {"train_loss": -27.475122451782227, "global_step": 506492, "epoch": 6102} {"train_loss": -27.352636337280273, "global_step": 506493, "epoch": 6102} {"train_loss": -27.4532470703125, "global_step": 506494, "epoch": 6102} {"train_loss": -27.4073486328125, "global_step": 506495, "epoch": 6102} {"train_loss": -27.29532241821289, "global_step": 506496, "epoch": 6102} {"train_loss": -27.493301391601562, "global_step": 506497, "epoch": 6102} {"train_loss": -27.109695434570312, "global_step": 506498, "epoch": 6102} {"train_loss": -27.455259323120117, "global_step": 506499, "epoch": 6102} {"train_loss": -27.0264949798584, "global_step": 506500, "epoch": 6102} {"train_loss": -27.287841796875, "global_step": 506501, "epoch": 6102} {"train_loss": -27.388479232788086, "global_step": 506502, "epoch": 6102} {"train_loss": -27.530750274658203, "global_step": 506503, "epoch": 6102} {"train_loss": -27.45125389099121, "global_step": 506504, "epoch": 6102} {"train_loss": -27.602949142456055, "global_step": 506505, "epoch": 6102} {"train_loss": -27.854543685913086, "global_step": 506506, "epoch": 6102} {"train_loss": -27.5030517578125, "global_step": 506507, "epoch": 6102} {"train_loss": -27.4515323638916, "global_step": 506508, "epoch": 6102} {"train_loss": -27.0966796875, "global_step": 506509, "epoch": 6102} {"train_loss": -27.523664474487305, "global_step": 506510, "epoch": 6102} {"train_loss": -27.404071807861328, "global_step": 506511, "epoch": 6102} {"train_loss": -27.45099449157715, "global_step": 506512, "epoch": 6102} {"train_loss": -27.00410270690918, "global_step": 506513, "epoch": 6102} {"train_loss": -27.14052391052246, "global_step": 506514, "epoch": 6102} {"train_loss": -27.338281631469727, "global_step": 506515, "epoch": 6102} {"train_loss": -27.44040298461914, "global_step": 506516, "epoch": 6102} {"train_loss": -27.508405685424805, "global_step": 506517, "epoch": 6102} {"train_loss": -27.03619956970215, "global_step": 506518, "epoch": 6102} {"train_loss": -27.71673583984375, "global_step": 506519, "epoch": 6102} {"train_loss": -27.73956871032715, "global_step": 506520, "epoch": 6102} {"train_loss": -27.54825782775879, "global_step": 506521, "epoch": 6102} {"train_loss": -27.27988624572754, "global_step": 506522, "epoch": 6102} {"train_loss": -27.835189819335938, "global_step": 506523, "epoch": 6102} {"train_loss": -27.535306930541992, "global_step": 506524, "epoch": 6102} {"train_loss": -27.625329971313477, "global_step": 506525, "epoch": 6102} {"train_loss": -27.35528564453125, "global_step": 506526, "epoch": 6102} {"train_loss": -27.360462188720703, "global_step": 506527, "epoch": 6102} {"train_loss": -27.697683334350586, "global_step": 506528, "epoch": 6102} {"train_loss": -27.6666316986084, "global_step": 506529, "epoch": 6102} {"train_loss": -28.021728515625, "global_step": 506530, "epoch": 6102} {"train_loss": -27.55293083190918, "global_step": 506531, "epoch": 6102} {"train_loss": -27.108322143554688, "global_step": 506532, "epoch": 6102} {"train_loss": -27.332578659057617, "global_step": 506533, "epoch": 6102} {"train_loss": -27.332305908203125, "global_step": 506534, "epoch": 6102} {"train_loss": -27.21100425720215, "global_step": 506535, "epoch": 6102} {"train_loss": -27.394001007080078, "global_step": 506536, "epoch": 6102} {"train_loss": -27.261350631713867, "global_step": 506537, "epoch": 6102} {"train_loss": -27.440465927124023, "global_step": 506538, "epoch": 6102} {"train_loss": -27.007165908813477, "global_step": 506539, "epoch": 6102} {"train_loss": -27.227949142456055, "global_step": 506540, "epoch": 6102} {"train_loss": -26.884967803955078, "global_step": 506541, "epoch": 6102} {"train_loss": -27.009618759155273, "global_step": 506542, "epoch": 6102} {"train_loss": -26.665332794189453, "global_step": 506543, "epoch": 6102} {"train_loss": -26.850341796875, "global_step": 506544, "epoch": 6102} {"train_loss": -27.450857162475586, "global_step": 506545, "epoch": 6102} {"train_loss": -27.25092887878418, "global_step": 506546, "epoch": 6102} {"train_loss": -27.231931686401367, "global_step": 506547, "epoch": 6102} {"train_loss": -27.304386828319135, "global_step": 506548, "epoch": 6102, "val_loss": 6562567.0} {"train_loss": -26.7447509765625, "global_step": 506549, "epoch": 6103} {"train_loss": -26.57752799987793, "global_step": 506550, "epoch": 6103} {"train_loss": -27.05641746520996, "global_step": 506551, "epoch": 6103} {"train_loss": -26.919219970703125, "global_step": 506552, "epoch": 6103} {"train_loss": -26.919851303100586, "global_step": 506553, "epoch": 6103} {"train_loss": -27.01310157775879, "global_step": 506554, "epoch": 6103} {"train_loss": -26.9124813079834, "global_step": 506555, "epoch": 6103} {"train_loss": -26.804868698120117, "global_step": 506556, "epoch": 6103} {"train_loss": -27.259862899780273, "global_step": 506557, "epoch": 6103} {"train_loss": -26.616601943969727, "global_step": 506558, "epoch": 6103} {"train_loss": -26.98529624938965, "global_step": 506559, "epoch": 6103} {"train_loss": -26.909259796142578, "global_step": 506560, "epoch": 6103} {"train_loss": -27.06792640686035, "global_step": 506561, "epoch": 6103} {"train_loss": -26.83966636657715, "global_step": 506562, "epoch": 6103} {"train_loss": -27.284351348876953, "global_step": 506563, "epoch": 6103} {"train_loss": -27.278568267822266, "global_step": 506564, "epoch": 6103} {"train_loss": -26.515356063842773, "global_step": 506565, "epoch": 6103} {"train_loss": -26.84528923034668, "global_step": 506566, "epoch": 6103} {"train_loss": -27.098529815673828, "global_step": 506567, "epoch": 6103} {"train_loss": -27.20729637145996, "global_step": 506568, "epoch": 6103} {"train_loss": -26.787353515625, "global_step": 506569, "epoch": 6103} {"train_loss": -27.074390411376953, "global_step": 506570, "epoch": 6103} {"train_loss": -27.394601821899414, "global_step": 506571, "epoch": 6103} {"train_loss": -27.3258056640625, "global_step": 506572, "epoch": 6103} {"train_loss": -27.125598907470703, "global_step": 506573, "epoch": 6103} {"train_loss": -27.427845001220703, "global_step": 506574, "epoch": 6103} {"train_loss": -27.109806060791016, "global_step": 506575, "epoch": 6103} {"train_loss": -27.233442306518555, "global_step": 506576, "epoch": 6103} {"train_loss": -27.379480361938477, "global_step": 506577, "epoch": 6103} {"train_loss": -27.19718360900879, "global_step": 506578, "epoch": 6103} {"train_loss": -27.106000900268555, "global_step": 506579, "epoch": 6103} {"train_loss": -27.133214950561523, "global_step": 506580, "epoch": 6103} {"train_loss": -27.36881446838379, "global_step": 506581, "epoch": 6103} {"train_loss": -27.252241134643555, "global_step": 506582, "epoch": 6103} {"train_loss": -27.39710807800293, "global_step": 506583, "epoch": 6103} {"train_loss": -27.294599533081055, "global_step": 506584, "epoch": 6103} {"train_loss": -27.4528751373291, "global_step": 506585, "epoch": 6103} {"train_loss": -27.284460067749023, "global_step": 506586, "epoch": 6103} {"train_loss": -27.5011043548584, "global_step": 506587, "epoch": 6103} {"train_loss": -27.429462432861328, "global_step": 506588, "epoch": 6103} {"train_loss": -27.645832061767578, "global_step": 506589, "epoch": 6103} {"train_loss": -27.50199317932129, "global_step": 506590, "epoch": 6103} {"train_loss": -27.50422477722168, "global_step": 506591, "epoch": 6103} {"train_loss": -27.40152359008789, "global_step": 506592, "epoch": 6103} {"train_loss": -27.757226943969727, "global_step": 506593, "epoch": 6103} {"train_loss": -27.82441520690918, "global_step": 506594, "epoch": 6103} {"train_loss": -27.4537296295166, "global_step": 506595, "epoch": 6103} {"train_loss": -27.653608322143555, "global_step": 506596, "epoch": 6103} {"train_loss": -27.3892879486084, "global_step": 506597, "epoch": 6103} {"train_loss": -27.34552574157715, "global_step": 506598, "epoch": 6103} {"train_loss": -27.266889572143555, "global_step": 506599, "epoch": 6103} {"train_loss": -27.104917526245117, "global_step": 506600, "epoch": 6103} {"train_loss": -27.48113441467285, "global_step": 506601, "epoch": 6103} {"train_loss": -27.415313720703125, "global_step": 506602, "epoch": 6103} {"train_loss": -27.524518966674805, "global_step": 506603, "epoch": 6103} {"train_loss": -27.294118881225586, "global_step": 506604, "epoch": 6103} {"train_loss": -27.388492584228516, "global_step": 506605, "epoch": 6103} {"train_loss": -27.677753448486328, "global_step": 506606, "epoch": 6103} {"train_loss": -27.728076934814453, "global_step": 506607, "epoch": 6103} {"train_loss": -27.3714542388916, "global_step": 506608, "epoch": 6103} {"train_loss": -27.3089542388916, "global_step": 506609, "epoch": 6103} {"train_loss": -27.55792236328125, "global_step": 506610, "epoch": 6103} {"train_loss": -27.385156631469727, "global_step": 506611, "epoch": 6103} {"train_loss": -27.6567440032959, "global_step": 506612, "epoch": 6103} {"train_loss": -27.369985580444336, "global_step": 506613, "epoch": 6103} {"train_loss": -27.60939598083496, "global_step": 506614, "epoch": 6103} {"train_loss": -27.498544692993164, "global_step": 506615, "epoch": 6103} {"train_loss": -27.55792808532715, "global_step": 506616, "epoch": 6103} {"train_loss": -27.36408805847168, "global_step": 506617, "epoch": 6103} {"train_loss": -27.586923599243164, "global_step": 506618, "epoch": 6103} {"train_loss": -27.542692184448242, "global_step": 506619, "epoch": 6103} {"train_loss": -27.708036422729492, "global_step": 506620, "epoch": 6103} {"train_loss": -27.647062301635742, "global_step": 506621, "epoch": 6103} {"train_loss": -27.366779327392578, "global_step": 506622, "epoch": 6103} {"train_loss": -27.5725040435791, "global_step": 506623, "epoch": 6103} {"train_loss": -27.746917724609375, "global_step": 506624, "epoch": 6103} {"train_loss": -27.646520614624023, "global_step": 506625, "epoch": 6103} {"train_loss": -27.465362548828125, "global_step": 506626, "epoch": 6103} {"train_loss": -27.61748695373535, "global_step": 506627, "epoch": 6103} {"train_loss": -27.609235763549805, "global_step": 506628, "epoch": 6103} {"train_loss": -27.170759201049805, "global_step": 506629, "epoch": 6103} {"train_loss": -27.40204429626465, "global_step": 506630, "epoch": 6103} {"train_loss": -27.310645988188593, "global_step": 506631, "epoch": 6103, "val_loss": 6583431.0} {"train_loss": -27.150049209594727, "global_step": 506632, "epoch": 6104} {"train_loss": -27.08168601989746, "global_step": 506633, "epoch": 6104} {"train_loss": -27.398569107055664, "global_step": 506634, "epoch": 6104} {"train_loss": -27.0971622467041, "global_step": 506635, "epoch": 6104} {"train_loss": -27.238439559936523, "global_step": 506636, "epoch": 6104} {"train_loss": -27.53363609313965, "global_step": 506637, "epoch": 6104} {"train_loss": -27.10236930847168, "global_step": 506638, "epoch": 6104} {"train_loss": -26.8336181640625, "global_step": 506639, "epoch": 6104} {"train_loss": -27.532129287719727, "global_step": 506640, "epoch": 6104} {"train_loss": -27.2813720703125, "global_step": 506641, "epoch": 6104} {"train_loss": -27.302968978881836, "global_step": 506642, "epoch": 6104} {"train_loss": -26.8529052734375, "global_step": 506643, "epoch": 6104} {"train_loss": -26.481433868408203, "global_step": 506644, "epoch": 6104} {"train_loss": -26.515003204345703, "global_step": 506645, "epoch": 6104} {"train_loss": -26.77174186706543, "global_step": 506646, "epoch": 6104} {"train_loss": -27.380720138549805, "global_step": 506647, "epoch": 6104} {"train_loss": -27.001981735229492, "global_step": 506648, "epoch": 6104} {"train_loss": -26.843280792236328, "global_step": 506649, "epoch": 6104} {"train_loss": -27.27671241760254, "global_step": 506650, "epoch": 6104} {"train_loss": -26.534109115600586, "global_step": 506651, "epoch": 6104} {"train_loss": -26.843265533447266, "global_step": 506652, "epoch": 6104} {"train_loss": -26.786413192749023, "global_step": 506653, "epoch": 6104} {"train_loss": -26.783063888549805, "global_step": 506654, "epoch": 6104} {"train_loss": -27.116254806518555, "global_step": 506655, "epoch": 6104} {"train_loss": -27.25843620300293, "global_step": 506656, "epoch": 6104} {"train_loss": -26.954700469970703, "global_step": 506657, "epoch": 6104} {"train_loss": -27.70393180847168, "global_step": 506658, "epoch": 6104} {"train_loss": -27.103580474853516, "global_step": 506659, "epoch": 6104} {"train_loss": -27.44904136657715, "global_step": 506660, "epoch": 6104} {"train_loss": -27.330739974975586, "global_step": 506661, "epoch": 6104} {"train_loss": -27.334827423095703, "global_step": 506662, "epoch": 6104} {"train_loss": -27.178054809570312, "global_step": 506663, "epoch": 6104} {"train_loss": -27.02186393737793, "global_step": 506664, "epoch": 6104} {"train_loss": -27.31784439086914, "global_step": 506665, "epoch": 6104} {"train_loss": -27.6040096282959, "global_step": 506666, "epoch": 6104} {"train_loss": -27.641260147094727, "global_step": 506667, "epoch": 6104} {"train_loss": -27.3201847076416, "global_step": 506668, "epoch": 6104} {"train_loss": -27.505102157592773, "global_step": 506669, "epoch": 6104} {"train_loss": -27.516691207885742, "global_step": 506670, "epoch": 6104} {"train_loss": -27.32297134399414, "global_step": 506671, "epoch": 6104} {"train_loss": -27.731882095336914, "global_step": 506672, "epoch": 6104} {"train_loss": -27.412405014038086, "global_step": 506673, "epoch": 6104} {"train_loss": -27.584491729736328, "global_step": 506674, "epoch": 6104} {"train_loss": -27.155929565429688, "global_step": 506675, "epoch": 6104} {"train_loss": -27.556161880493164, "global_step": 506676, "epoch": 6104} {"train_loss": -27.29937744140625, "global_step": 506677, "epoch": 6104} {"train_loss": -27.4642276763916, "global_step": 506678, "epoch": 6104} {"train_loss": -27.73895263671875, "global_step": 506679, "epoch": 6104} {"train_loss": -27.51862144470215, "global_step": 506680, "epoch": 6104} {"train_loss": -27.779422760009766, "global_step": 506681, "epoch": 6104} {"train_loss": -27.753149032592773, "global_step": 506682, "epoch": 6104} {"train_loss": -27.658090591430664, "global_step": 506683, "epoch": 6104} {"train_loss": -27.5816707611084, "global_step": 506684, "epoch": 6104} {"train_loss": -27.56861686706543, "global_step": 506685, "epoch": 6104} {"train_loss": -27.328826904296875, "global_step": 506686, "epoch": 6104} {"train_loss": -27.467443466186523, "global_step": 506687, "epoch": 6104} {"train_loss": -27.5701961517334, "global_step": 506688, "epoch": 6104} {"train_loss": -27.843957901000977, "global_step": 506689, "epoch": 6104} {"train_loss": -27.113122940063477, "global_step": 506690, "epoch": 6104} {"train_loss": -27.399518966674805, "global_step": 506691, "epoch": 6104} {"train_loss": -27.218185424804688, "global_step": 506692, "epoch": 6104} {"train_loss": -27.343786239624023, "global_step": 506693, "epoch": 6104} {"train_loss": -27.494836807250977, "global_step": 506694, "epoch": 6104} {"train_loss": -27.46466636657715, "global_step": 506695, "epoch": 6104} {"train_loss": -27.43560218811035, "global_step": 506696, "epoch": 6104} {"train_loss": -27.30352783203125, "global_step": 506697, "epoch": 6104} {"train_loss": -27.4013614654541, "global_step": 506698, "epoch": 6104} {"train_loss": -27.43427848815918, "global_step": 506699, "epoch": 6104} {"train_loss": -27.633056640625, "global_step": 506700, "epoch": 6104} {"train_loss": -27.59136390686035, "global_step": 506701, "epoch": 6104} {"train_loss": -26.88313865661621, "global_step": 506702, "epoch": 6104} {"train_loss": -27.283842086791992, "global_step": 506703, "epoch": 6104} {"train_loss": -27.16379737854004, "global_step": 506704, "epoch": 6104} {"train_loss": -27.453649520874023, "global_step": 506705, "epoch": 6104} {"train_loss": -27.00661277770996, "global_step": 506706, "epoch": 6104} {"train_loss": -27.253808975219727, "global_step": 506707, "epoch": 6104} {"train_loss": -27.249921798706055, "global_step": 506708, "epoch": 6104} {"train_loss": -26.517560958862305, "global_step": 506709, "epoch": 6104} {"train_loss": -27.854248046875, "global_step": 506710, "epoch": 6104} {"train_loss": -26.94437599182129, "global_step": 506711, "epoch": 6104} {"train_loss": -27.455829620361328, "global_step": 506712, "epoch": 6104} {"train_loss": -27.5638427734375, "global_step": 506713, "epoch": 6104} {"train_loss": -27.27435314224427, "global_step": 506714, "epoch": 6104, "val_loss": 6521307.5} {"train_loss": -26.335315704345703, "global_step": 506715, "epoch": 6105} {"train_loss": -25.825300216674805, "global_step": 506716, "epoch": 6105} {"train_loss": -25.66982078552246, "global_step": 506717, "epoch": 6105} {"train_loss": -26.719587326049805, "global_step": 506718, "epoch": 6105} {"train_loss": -26.847503662109375, "global_step": 506719, "epoch": 6105} {"train_loss": -26.459033966064453, "global_step": 506720, "epoch": 6105} {"train_loss": -26.13848304748535, "global_step": 506721, "epoch": 6105} {"train_loss": -26.5876407623291, "global_step": 506722, "epoch": 6105} {"train_loss": -26.175052642822266, "global_step": 506723, "epoch": 6105} {"train_loss": -26.80011558532715, "global_step": 506724, "epoch": 6105} {"train_loss": -26.534372329711914, "global_step": 506725, "epoch": 6105} {"train_loss": -26.753692626953125, "global_step": 506726, "epoch": 6105} {"train_loss": -26.848302841186523, "global_step": 506727, "epoch": 6105} {"train_loss": -26.870777130126953, "global_step": 506728, "epoch": 6105} {"train_loss": -27.03936767578125, "global_step": 506729, "epoch": 6105} {"train_loss": -26.6124267578125, "global_step": 506730, "epoch": 6105} {"train_loss": -26.653549194335938, "global_step": 506731, "epoch": 6105} {"train_loss": -26.671483993530273, "global_step": 506732, "epoch": 6105} {"train_loss": -26.857086181640625, "global_step": 506733, "epoch": 6105} {"train_loss": -27.137083053588867, "global_step": 506734, "epoch": 6105} {"train_loss": -26.498960494995117, "global_step": 506735, "epoch": 6105} {"train_loss": -26.937646865844727, "global_step": 506736, "epoch": 6105} {"train_loss": -27.18994140625, "global_step": 506737, "epoch": 6105} {"train_loss": -26.61414909362793, "global_step": 506738, "epoch": 6105} {"train_loss": -26.985193252563477, "global_step": 506739, "epoch": 6105} {"train_loss": -26.738767623901367, "global_step": 506740, "epoch": 6105} {"train_loss": -26.895593643188477, "global_step": 506741, "epoch": 6105} {"train_loss": -27.2197322845459, "global_step": 506742, "epoch": 6105} {"train_loss": -26.73042106628418, "global_step": 506743, "epoch": 6105} {"train_loss": -26.88004493713379, "global_step": 506744, "epoch": 6105} {"train_loss": -27.307153701782227, "global_step": 506745, "epoch": 6105} {"train_loss": -27.449865341186523, "global_step": 506746, "epoch": 6105} {"train_loss": -27.3233585357666, "global_step": 506747, "epoch": 6105} {"train_loss": -27.012863159179688, "global_step": 506748, "epoch": 6105} {"train_loss": -27.096506118774414, "global_step": 506749, "epoch": 6105} {"train_loss": -27.638898849487305, "global_step": 506750, "epoch": 6105} {"train_loss": -27.445173263549805, "global_step": 506751, "epoch": 6105} {"train_loss": -27.499820709228516, "global_step": 506752, "epoch": 6105} {"train_loss": -27.67445945739746, "global_step": 506753, "epoch": 6105} {"train_loss": -27.67270278930664, "global_step": 506754, "epoch": 6105} {"train_loss": -27.804800033569336, "global_step": 506755, "epoch": 6105} {"train_loss": -27.47410011291504, "global_step": 506756, "epoch": 6105} {"train_loss": -27.316709518432617, "global_step": 506757, "epoch": 6105} {"train_loss": -27.312042236328125, "global_step": 506758, "epoch": 6105} {"train_loss": -27.676008224487305, "global_step": 506759, "epoch": 6105} {"train_loss": -27.517908096313477, "global_step": 506760, "epoch": 6105} {"train_loss": -27.657312393188477, "global_step": 506761, "epoch": 6105} {"train_loss": -27.8091983795166, "global_step": 506762, "epoch": 6105} {"train_loss": -27.380615234375, "global_step": 506763, "epoch": 6105} {"train_loss": -27.288467407226562, "global_step": 506764, "epoch": 6105} {"train_loss": -27.738828659057617, "global_step": 506765, "epoch": 6105} {"train_loss": -27.43003273010254, "global_step": 506766, "epoch": 6105} {"train_loss": -27.4110164642334, "global_step": 506767, "epoch": 6105} {"train_loss": -27.494464874267578, "global_step": 506768, "epoch": 6105} {"train_loss": -26.777929306030273, "global_step": 506769, "epoch": 6105} {"train_loss": -26.484067916870117, "global_step": 506770, "epoch": 6105} {"train_loss": -27.01981544494629, "global_step": 506771, "epoch": 6105} {"train_loss": -27.687108993530273, "global_step": 506772, "epoch": 6105} {"train_loss": -27.662036895751953, "global_step": 506773, "epoch": 6105} {"train_loss": -27.45659828186035, "global_step": 506774, "epoch": 6105} {"train_loss": -27.495513916015625, "global_step": 506775, "epoch": 6105} {"train_loss": -27.7568302154541, "global_step": 506776, "epoch": 6105} {"train_loss": -27.67316246032715, "global_step": 506777, "epoch": 6105} {"train_loss": -27.310409545898438, "global_step": 506778, "epoch": 6105} {"train_loss": -27.7855281829834, "global_step": 506779, "epoch": 6105} {"train_loss": -26.742528915405273, "global_step": 506780, "epoch": 6105} {"train_loss": -27.53857421875, "global_step": 506781, "epoch": 6105} {"train_loss": -27.184080123901367, "global_step": 506782, "epoch": 6105} {"train_loss": -26.85829734802246, "global_step": 506783, "epoch": 6105} {"train_loss": -26.51434326171875, "global_step": 506784, "epoch": 6105} {"train_loss": -25.853498458862305, "global_step": 506785, "epoch": 6105} {"train_loss": -26.81723976135254, "global_step": 506786, "epoch": 6105} {"train_loss": -27.0920467376709, "global_step": 506787, "epoch": 6105} {"train_loss": -26.6496639251709, "global_step": 506788, "epoch": 6105} {"train_loss": -26.89605712890625, "global_step": 506789, "epoch": 6105} {"train_loss": -27.671497344970703, "global_step": 506790, "epoch": 6105} {"train_loss": -26.910110473632812, "global_step": 506791, "epoch": 6105} {"train_loss": -27.864032745361328, "global_step": 506792, "epoch": 6105} {"train_loss": -27.26468849182129, "global_step": 506793, "epoch": 6105} {"train_loss": -28.041357040405273, "global_step": 506794, "epoch": 6105} {"train_loss": -27.13433265686035, "global_step": 506795, "epoch": 6105} {"train_loss": -27.401798248291016, "global_step": 506796, "epoch": 6105} {"train_loss": -27.08649860519961, "global_step": 506797, "epoch": 6105, "val_loss": 6572331.5} {"train_loss": -27.375059127807617, "global_step": 506798, "epoch": 6106} {"train_loss": -27.0378360748291, "global_step": 506799, "epoch": 6106} {"train_loss": -27.03864097595215, "global_step": 506800, "epoch": 6106} {"train_loss": -26.481201171875, "global_step": 506801, "epoch": 6106} {"train_loss": -27.141233444213867, "global_step": 506802, "epoch": 6106} {"train_loss": -27.481311798095703, "global_step": 506803, "epoch": 6106} {"train_loss": -27.246341705322266, "global_step": 506804, "epoch": 6106} {"train_loss": -27.3063907623291, "global_step": 506805, "epoch": 6106} {"train_loss": -26.92323112487793, "global_step": 506806, "epoch": 6106} {"train_loss": -27.200790405273438, "global_step": 506807, "epoch": 6106} {"train_loss": -26.95950698852539, "global_step": 506808, "epoch": 6106} {"train_loss": -27.56894302368164, "global_step": 506809, "epoch": 6106} {"train_loss": -27.39166259765625, "global_step": 506810, "epoch": 6106} {"train_loss": -26.777557373046875, "global_step": 506811, "epoch": 6106} {"train_loss": -26.696264266967773, "global_step": 506812, "epoch": 6106} {"train_loss": -27.6142520904541, "global_step": 506813, "epoch": 6106} {"train_loss": -27.15398597717285, "global_step": 506814, "epoch": 6106} {"train_loss": -27.313552856445312, "global_step": 506815, "epoch": 6106} {"train_loss": -27.11728858947754, "global_step": 506816, "epoch": 6106} {"train_loss": -27.141565322875977, "global_step": 506817, "epoch": 6106} {"train_loss": -27.208356857299805, "global_step": 506818, "epoch": 6106} {"train_loss": -27.270038604736328, "global_step": 506819, "epoch": 6106} {"train_loss": -27.569814682006836, "global_step": 506820, "epoch": 6106} {"train_loss": -27.034698486328125, "global_step": 506821, "epoch": 6106} {"train_loss": -27.41278076171875, "global_step": 506822, "epoch": 6106} {"train_loss": -27.512399673461914, "global_step": 506823, "epoch": 6106} {"train_loss": -27.529386520385742, "global_step": 506824, "epoch": 6106} {"train_loss": -27.556066513061523, "global_step": 506825, "epoch": 6106} {"train_loss": -27.35883903503418, "global_step": 506826, "epoch": 6106} {"train_loss": -27.154687881469727, "global_step": 506827, "epoch": 6106} {"train_loss": -27.54231071472168, "global_step": 506828, "epoch": 6106} {"train_loss": -27.250146865844727, "global_step": 506829, "epoch": 6106} {"train_loss": -27.480253219604492, "global_step": 506830, "epoch": 6106} {"train_loss": -27.43754005432129, "global_step": 506831, "epoch": 6106} {"train_loss": -27.834699630737305, "global_step": 506832, "epoch": 6106} {"train_loss": -27.646085739135742, "global_step": 506833, "epoch": 6106} {"train_loss": -27.42304801940918, "global_step": 506834, "epoch": 6106} {"train_loss": -27.671674728393555, "global_step": 506835, "epoch": 6106} {"train_loss": -27.31000328063965, "global_step": 506836, "epoch": 6106} {"train_loss": -27.489896774291992, "global_step": 506837, "epoch": 6106} {"train_loss": -27.703693389892578, "global_step": 506838, "epoch": 6106} {"train_loss": -27.43988037109375, "global_step": 506839, "epoch": 6106} {"train_loss": -27.490478515625, "global_step": 506840, "epoch": 6106} {"train_loss": -27.62527847290039, "global_step": 506841, "epoch": 6106} {"train_loss": -27.673917770385742, "global_step": 506842, "epoch": 6106} {"train_loss": -27.298383712768555, "global_step": 506843, "epoch": 6106} {"train_loss": -27.530902862548828, "global_step": 506844, "epoch": 6106} {"train_loss": -27.795026779174805, "global_step": 506845, "epoch": 6106} {"train_loss": -27.54668617248535, "global_step": 506846, "epoch": 6106} {"train_loss": -27.638639450073242, "global_step": 506847, "epoch": 6106} {"train_loss": -27.2375545501709, "global_step": 506848, "epoch": 6106} {"train_loss": -27.186376571655273, "global_step": 506849, "epoch": 6106} {"train_loss": -26.95684242248535, "global_step": 506850, "epoch": 6106} {"train_loss": -27.260009765625, "global_step": 506851, "epoch": 6106} {"train_loss": -27.030261993408203, "global_step": 506852, "epoch": 6106} {"train_loss": -27.889806747436523, "global_step": 506853, "epoch": 6106} {"train_loss": -27.701017379760742, "global_step": 506854, "epoch": 6106} {"train_loss": -27.506500244140625, "global_step": 506855, "epoch": 6106} {"train_loss": -27.414779663085938, "global_step": 506856, "epoch": 6106} {"train_loss": -27.667282104492188, "global_step": 506857, "epoch": 6106} {"train_loss": -27.503585815429688, "global_step": 506858, "epoch": 6106} {"train_loss": -27.887659072875977, "global_step": 506859, "epoch": 6106} {"train_loss": -27.379667282104492, "global_step": 506860, "epoch": 6106} {"train_loss": -27.479507446289062, "global_step": 506861, "epoch": 6106} {"train_loss": -27.514657974243164, "global_step": 506862, "epoch": 6106} {"train_loss": -27.536779403686523, "global_step": 506863, "epoch": 6106} {"train_loss": -27.490121841430664, "global_step": 506864, "epoch": 6106} {"train_loss": -27.416101455688477, "global_step": 506865, "epoch": 6106} {"train_loss": -27.684309005737305, "global_step": 506866, "epoch": 6106} {"train_loss": -27.39949607849121, "global_step": 506867, "epoch": 6106} {"train_loss": -27.60340690612793, "global_step": 506868, "epoch": 6106} {"train_loss": -27.445362091064453, "global_step": 506869, "epoch": 6106} {"train_loss": -27.127958297729492, "global_step": 506870, "epoch": 6106} {"train_loss": -27.504846572875977, "global_step": 506871, "epoch": 6106} {"train_loss": -27.40516471862793, "global_step": 506872, "epoch": 6106} {"train_loss": -27.44581413269043, "global_step": 506873, "epoch": 6106} {"train_loss": -26.975360870361328, "global_step": 506874, "epoch": 6106} {"train_loss": -27.96539306640625, "global_step": 506875, "epoch": 6106} {"train_loss": -27.686187744140625, "global_step": 506876, "epoch": 6106} {"train_loss": -27.332895278930664, "global_step": 506877, "epoch": 6106} {"train_loss": -27.425485610961914, "global_step": 506878, "epoch": 6106} {"train_loss": -27.316431045532227, "global_step": 506879, "epoch": 6106} {"train_loss": -27.37488790305264, "global_step": 506880, "epoch": 6106, "val_loss": 6589988.0} {"train_loss": -26.8757381439209, "global_step": 506881, "epoch": 6107} {"train_loss": -26.440933227539062, "global_step": 506882, "epoch": 6107} {"train_loss": -27.063446044921875, "global_step": 506883, "epoch": 6107} {"train_loss": -27.311237335205078, "global_step": 506884, "epoch": 6107} {"train_loss": -26.8066463470459, "global_step": 506885, "epoch": 6107} {"train_loss": -27.148529052734375, "global_step": 506886, "epoch": 6107} {"train_loss": -27.078115463256836, "global_step": 506887, "epoch": 6107} {"train_loss": -27.433210372924805, "global_step": 506888, "epoch": 6107} {"train_loss": -27.55224609375, "global_step": 506889, "epoch": 6107} {"train_loss": -26.745832443237305, "global_step": 506890, "epoch": 6107} {"train_loss": -27.37213706970215, "global_step": 506891, "epoch": 6107} {"train_loss": -27.59360122680664, "global_step": 506892, "epoch": 6107} {"train_loss": -27.552881240844727, "global_step": 506893, "epoch": 6107} {"train_loss": -26.58209228515625, "global_step": 506894, "epoch": 6107} {"train_loss": -27.151596069335938, "global_step": 506895, "epoch": 6107} {"train_loss": -27.104660034179688, "global_step": 506896, "epoch": 6107} {"train_loss": -27.313642501831055, "global_step": 506897, "epoch": 6107} {"train_loss": -27.18304443359375, "global_step": 506898, "epoch": 6107} {"train_loss": -27.39771842956543, "global_step": 506899, "epoch": 6107} {"train_loss": -27.585050582885742, "global_step": 506900, "epoch": 6107} {"train_loss": -27.431177139282227, "global_step": 506901, "epoch": 6107} {"train_loss": -27.47587013244629, "global_step": 506902, "epoch": 6107} {"train_loss": -27.357763290405273, "global_step": 506903, "epoch": 6107} {"train_loss": -27.39505386352539, "global_step": 506904, "epoch": 6107} {"train_loss": -27.145376205444336, "global_step": 506905, "epoch": 6107} {"train_loss": -27.596487045288086, "global_step": 506906, "epoch": 6107} {"train_loss": -27.066726684570312, "global_step": 506907, "epoch": 6107} {"train_loss": -27.546899795532227, "global_step": 506908, "epoch": 6107} {"train_loss": -27.663543701171875, "global_step": 506909, "epoch": 6107} {"train_loss": -27.28897476196289, "global_step": 506910, "epoch": 6107} {"train_loss": -27.469629287719727, "global_step": 506911, "epoch": 6107} {"train_loss": -27.486312866210938, "global_step": 506912, "epoch": 6107} {"train_loss": -27.59791374206543, "global_step": 506913, "epoch": 6107} {"train_loss": -27.71992301940918, "global_step": 506914, "epoch": 6107} {"train_loss": -27.304845809936523, "global_step": 506915, "epoch": 6107} {"train_loss": -27.451557159423828, "global_step": 506916, "epoch": 6107} {"train_loss": -27.5186824798584, "global_step": 506917, "epoch": 6107} {"train_loss": -27.617816925048828, "global_step": 506918, "epoch": 6107} {"train_loss": -27.649051666259766, "global_step": 506919, "epoch": 6107} {"train_loss": -27.262487411499023, "global_step": 506920, "epoch": 6107} {"train_loss": -27.65869140625, "global_step": 506921, "epoch": 6107} {"train_loss": -28.02658462524414, "global_step": 506922, "epoch": 6107} {"train_loss": -27.762601852416992, "global_step": 506923, "epoch": 6107} {"train_loss": -27.7561092376709, "global_step": 506924, "epoch": 6107} {"train_loss": -27.267316818237305, "global_step": 506925, "epoch": 6107} {"train_loss": -27.738840103149414, "global_step": 506926, "epoch": 6107} {"train_loss": -27.69496726989746, "global_step": 506927, "epoch": 6107} {"train_loss": -27.578887939453125, "global_step": 506928, "epoch": 6107} {"train_loss": -27.41423988342285, "global_step": 506929, "epoch": 6107} {"train_loss": -27.58662223815918, "global_step": 506930, "epoch": 6107} {"train_loss": -27.484222412109375, "global_step": 506931, "epoch": 6107} {"train_loss": -27.745594024658203, "global_step": 506932, "epoch": 6107} {"train_loss": -27.232038497924805, "global_step": 506933, "epoch": 6107} {"train_loss": -27.424829483032227, "global_step": 506934, "epoch": 6107} {"train_loss": -27.19428825378418, "global_step": 506935, "epoch": 6107} {"train_loss": -26.686370849609375, "global_step": 506936, "epoch": 6107} {"train_loss": -27.53729820251465, "global_step": 506937, "epoch": 6107} {"train_loss": -27.23243522644043, "global_step": 506938, "epoch": 6107} {"train_loss": -27.665973663330078, "global_step": 506939, "epoch": 6107} {"train_loss": -27.167484283447266, "global_step": 506940, "epoch": 6107} {"train_loss": -27.307043075561523, "global_step": 506941, "epoch": 6107} {"train_loss": -27.19696617126465, "global_step": 506942, "epoch": 6107} {"train_loss": -27.021350860595703, "global_step": 506943, "epoch": 6107} {"train_loss": -27.134140014648438, "global_step": 506944, "epoch": 6107} {"train_loss": -27.482892990112305, "global_step": 506945, "epoch": 6107} {"train_loss": -27.570642471313477, "global_step": 506946, "epoch": 6107} {"train_loss": -27.431013107299805, "global_step": 506947, "epoch": 6107} {"train_loss": -27.54676628112793, "global_step": 506948, "epoch": 6107} {"train_loss": -27.711179733276367, "global_step": 506949, "epoch": 6107} {"train_loss": -27.312976837158203, "global_step": 506950, "epoch": 6107} {"train_loss": -27.450897216796875, "global_step": 506951, "epoch": 6107} {"train_loss": -27.345518112182617, "global_step": 506952, "epoch": 6107} {"train_loss": -27.683908462524414, "global_step": 506953, "epoch": 6107} {"train_loss": -27.49005699157715, "global_step": 506954, "epoch": 6107} {"train_loss": -27.436437606811523, "global_step": 506955, "epoch": 6107} {"train_loss": -27.278278350830078, "global_step": 506956, "epoch": 6107} {"train_loss": -27.273853302001953, "global_step": 506957, "epoch": 6107} {"train_loss": -27.295337677001953, "global_step": 506958, "epoch": 6107} {"train_loss": -27.5076961517334, "global_step": 506959, "epoch": 6107} {"train_loss": -27.637418746948242, "global_step": 506960, "epoch": 6107} {"train_loss": -27.720016479492188, "global_step": 506961, "epoch": 6107} {"train_loss": -27.207611083984375, "global_step": 506962, "epoch": 6107} {"train_loss": -27.382060453116175, "global_step": 506963, "epoch": 6107, "val_loss": 6568323.0} {"train_loss": -26.948022842407227, "global_step": 506964, "epoch": 6108} {"train_loss": -27.142541885375977, "global_step": 506965, "epoch": 6108} {"train_loss": -27.218896865844727, "global_step": 506966, "epoch": 6108} {"train_loss": -27.20969009399414, "global_step": 506967, "epoch": 6108} {"train_loss": -27.703937530517578, "global_step": 506968, "epoch": 6108} {"train_loss": -26.961658477783203, "global_step": 506969, "epoch": 6108} {"train_loss": -26.979108810424805, "global_step": 506970, "epoch": 6108} {"train_loss": -27.124631881713867, "global_step": 506971, "epoch": 6108} {"train_loss": -27.949665069580078, "global_step": 506972, "epoch": 6108} {"train_loss": -26.9908390045166, "global_step": 506973, "epoch": 6108} {"train_loss": -27.49627113342285, "global_step": 506974, "epoch": 6108} {"train_loss": -27.11031150817871, "global_step": 506975, "epoch": 6108} {"train_loss": -27.43696403503418, "global_step": 506976, "epoch": 6108} {"train_loss": -27.32227897644043, "global_step": 506977, "epoch": 6108} {"train_loss": -27.50533103942871, "global_step": 506978, "epoch": 6108} {"train_loss": -27.1502742767334, "global_step": 506979, "epoch": 6108} {"train_loss": -27.547103881835938, "global_step": 506980, "epoch": 6108} {"train_loss": -26.976367950439453, "global_step": 506981, "epoch": 6108} {"train_loss": -27.60405921936035, "global_step": 506982, "epoch": 6108} {"train_loss": -27.535781860351562, "global_step": 506983, "epoch": 6108} {"train_loss": -27.688688278198242, "global_step": 506984, "epoch": 6108} {"train_loss": -27.274826049804688, "global_step": 506985, "epoch": 6108} {"train_loss": -27.42563247680664, "global_step": 506986, "epoch": 6108} {"train_loss": -27.5457706451416, "global_step": 506987, "epoch": 6108} {"train_loss": -27.215946197509766, "global_step": 506988, "epoch": 6108} {"train_loss": -27.488195419311523, "global_step": 506989, "epoch": 6108} {"train_loss": -27.46198081970215, "global_step": 506990, "epoch": 6108} {"train_loss": -27.603368759155273, "global_step": 506991, "epoch": 6108} {"train_loss": -27.50880241394043, "global_step": 506992, "epoch": 6108} {"train_loss": -27.60809898376465, "global_step": 506993, "epoch": 6108} {"train_loss": -27.8850040435791, "global_step": 506994, "epoch": 6108} {"train_loss": -27.443628311157227, "global_step": 506995, "epoch": 6108} {"train_loss": -27.40066909790039, "global_step": 506996, "epoch": 6108} {"train_loss": -27.517728805541992, "global_step": 506997, "epoch": 6108} {"train_loss": -27.723859786987305, "global_step": 506998, "epoch": 6108} {"train_loss": -27.551105499267578, "global_step": 506999, "epoch": 6108} {"train_loss": -27.210973739624023, "global_step": 507000, "epoch": 6108} {"train_loss": -27.20118522644043, "global_step": 507001, "epoch": 6108} {"train_loss": -27.409107208251953, "global_step": 507002, "epoch": 6108} {"train_loss": -27.755298614501953, "global_step": 507003, "epoch": 6108} {"train_loss": -27.950780868530273, "global_step": 507004, "epoch": 6108} {"train_loss": -27.714033126831055, "global_step": 507005, "epoch": 6108} {"train_loss": -27.545673370361328, "global_step": 507006, "epoch": 6108} {"train_loss": -27.352384567260742, "global_step": 507007, "epoch": 6108} {"train_loss": -27.745786666870117, "global_step": 507008, "epoch": 6108} {"train_loss": -27.578125, "global_step": 507009, "epoch": 6108} {"train_loss": -27.813018798828125, "global_step": 507010, "epoch": 6108} {"train_loss": -27.41444206237793, "global_step": 507011, "epoch": 6108} {"train_loss": -27.949148178100586, "global_step": 507012, "epoch": 6108} {"train_loss": -27.42673683166504, "global_step": 507013, "epoch": 6108} {"train_loss": -27.83296775817871, "global_step": 507014, "epoch": 6108} {"train_loss": -27.57122230529785, "global_step": 507015, "epoch": 6108} {"train_loss": -27.477481842041016, "global_step": 507016, "epoch": 6108} {"train_loss": -27.20440673828125, "global_step": 507017, "epoch": 6108} {"train_loss": -27.09431266784668, "global_step": 507018, "epoch": 6108} {"train_loss": -27.4948673248291, "global_step": 507019, "epoch": 6108} {"train_loss": -27.3703556060791, "global_step": 507020, "epoch": 6108} {"train_loss": -27.655500411987305, "global_step": 507021, "epoch": 6108} {"train_loss": -28.000152587890625, "global_step": 507022, "epoch": 6108} {"train_loss": -27.425994873046875, "global_step": 507023, "epoch": 6108} {"train_loss": -27.338836669921875, "global_step": 507024, "epoch": 6108} {"train_loss": -27.808761596679688, "global_step": 507025, "epoch": 6108} {"train_loss": -27.936853408813477, "global_step": 507026, "epoch": 6108} {"train_loss": -27.581369400024414, "global_step": 507027, "epoch": 6108} {"train_loss": -27.6610107421875, "global_step": 507028, "epoch": 6108} {"train_loss": -27.461822509765625, "global_step": 507029, "epoch": 6108} {"train_loss": -27.573017120361328, "global_step": 507030, "epoch": 6108} {"train_loss": -27.62109375, "global_step": 507031, "epoch": 6108} {"train_loss": -27.298086166381836, "global_step": 507032, "epoch": 6108} {"train_loss": -27.313154220581055, "global_step": 507033, "epoch": 6108} {"train_loss": -27.199935913085938, "global_step": 507034, "epoch": 6108} {"train_loss": -27.381250381469727, "global_step": 507035, "epoch": 6108} {"train_loss": -27.791955947875977, "global_step": 507036, "epoch": 6108} {"train_loss": -27.438505172729492, "global_step": 507037, "epoch": 6108} {"train_loss": -27.508655548095703, "global_step": 507038, "epoch": 6108} {"train_loss": -27.549726486206055, "global_step": 507039, "epoch": 6108} {"train_loss": -27.57440757751465, "global_step": 507040, "epoch": 6108} {"train_loss": -27.682336807250977, "global_step": 507041, "epoch": 6108} {"train_loss": -27.736234664916992, "global_step": 507042, "epoch": 6108} {"train_loss": -27.283050537109375, "global_step": 507043, "epoch": 6108} {"train_loss": -27.313003540039062, "global_step": 507044, "epoch": 6108} {"train_loss": -27.118427276611328, "global_step": 507045, "epoch": 6108} {"train_loss": -27.44534448830478, "global_step": 507046, "epoch": 6108, "val_loss": 6648339.0} {"train_loss": -25.08149528503418, "global_step": 507047, "epoch": 6109} {"train_loss": -22.60928726196289, "global_step": 507048, "epoch": 6109} {"train_loss": -22.982913970947266, "global_step": 507049, "epoch": 6109} {"train_loss": -26.32673454284668, "global_step": 507050, "epoch": 6109} {"train_loss": -24.457412719726562, "global_step": 507051, "epoch": 6109} {"train_loss": -26.267927169799805, "global_step": 507052, "epoch": 6109} {"train_loss": -24.788196563720703, "global_step": 507053, "epoch": 6109} {"train_loss": -26.126605987548828, "global_step": 507054, "epoch": 6109} {"train_loss": -26.02498435974121, "global_step": 507055, "epoch": 6109} {"train_loss": -25.912763595581055, "global_step": 507056, "epoch": 6109} {"train_loss": -26.468128204345703, "global_step": 507057, "epoch": 6109} {"train_loss": -26.5631103515625, "global_step": 507058, "epoch": 6109} {"train_loss": -26.44580078125, "global_step": 507059, "epoch": 6109} {"train_loss": -26.81800651550293, "global_step": 507060, "epoch": 6109} {"train_loss": -26.561391830444336, "global_step": 507061, "epoch": 6109} {"train_loss": -26.61040687561035, "global_step": 507062, "epoch": 6109} {"train_loss": -26.3321590423584, "global_step": 507063, "epoch": 6109} {"train_loss": -26.605270385742188, "global_step": 507064, "epoch": 6109} {"train_loss": -26.555511474609375, "global_step": 507065, "epoch": 6109} {"train_loss": -26.48560905456543, "global_step": 507066, "epoch": 6109} {"train_loss": -26.942365646362305, "global_step": 507067, "epoch": 6109} {"train_loss": -26.78729248046875, "global_step": 507068, "epoch": 6109} {"train_loss": -27.078750610351562, "global_step": 507069, "epoch": 6109} {"train_loss": -26.492963790893555, "global_step": 507070, "epoch": 6109} {"train_loss": -26.881641387939453, "global_step": 507071, "epoch": 6109} {"train_loss": -27.038562774658203, "global_step": 507072, "epoch": 6109} {"train_loss": -27.075647354125977, "global_step": 507073, "epoch": 6109} {"train_loss": -26.951446533203125, "global_step": 507074, "epoch": 6109} {"train_loss": -26.87837028503418, "global_step": 507075, "epoch": 6109} {"train_loss": -26.717376708984375, "global_step": 507076, "epoch": 6109} {"train_loss": -27.122119903564453, "global_step": 507077, "epoch": 6109} {"train_loss": -26.936166763305664, "global_step": 507078, "epoch": 6109} {"train_loss": -27.1286563873291, "global_step": 507079, "epoch": 6109} {"train_loss": -27.16082763671875, "global_step": 507080, "epoch": 6109} {"train_loss": -26.9234619140625, "global_step": 507081, "epoch": 6109} {"train_loss": -27.170394897460938, "global_step": 507082, "epoch": 6109} {"train_loss": -27.231592178344727, "global_step": 507083, "epoch": 6109} {"train_loss": -27.1868953704834, "global_step": 507084, "epoch": 6109} {"train_loss": -27.31548500061035, "global_step": 507085, "epoch": 6109} {"train_loss": -27.033905029296875, "global_step": 507086, "epoch": 6109} {"train_loss": -27.236852645874023, "global_step": 507087, "epoch": 6109} {"train_loss": -27.21632957458496, "global_step": 507088, "epoch": 6109} {"train_loss": -27.306461334228516, "global_step": 507089, "epoch": 6109} {"train_loss": -27.996305465698242, "global_step": 507090, "epoch": 6109} {"train_loss": -27.40260124206543, "global_step": 507091, "epoch": 6109} {"train_loss": -27.41240882873535, "global_step": 507092, "epoch": 6109} {"train_loss": -27.426166534423828, "global_step": 507093, "epoch": 6109} {"train_loss": -27.574758529663086, "global_step": 507094, "epoch": 6109} {"train_loss": -27.47902488708496, "global_step": 507095, "epoch": 6109} {"train_loss": -27.43524742126465, "global_step": 507096, "epoch": 6109} {"train_loss": -27.524511337280273, "global_step": 507097, "epoch": 6109} {"train_loss": -27.26666259765625, "global_step": 507098, "epoch": 6109} {"train_loss": -27.371173858642578, "global_step": 507099, "epoch": 6109} {"train_loss": -27.026321411132812, "global_step": 507100, "epoch": 6109} {"train_loss": -26.96760368347168, "global_step": 507101, "epoch": 6109} {"train_loss": -26.713565826416016, "global_step": 507102, "epoch": 6109} {"train_loss": -26.502105712890625, "global_step": 507103, "epoch": 6109} {"train_loss": -26.976806640625, "global_step": 507104, "epoch": 6109} {"train_loss": -27.269855499267578, "global_step": 507105, "epoch": 6109} {"train_loss": -26.862340927124023, "global_step": 507106, "epoch": 6109} {"train_loss": -27.251089096069336, "global_step": 507107, "epoch": 6109} {"train_loss": -27.55769157409668, "global_step": 507108, "epoch": 6109} {"train_loss": -27.5524959564209, "global_step": 507109, "epoch": 6109} {"train_loss": -27.155380249023438, "global_step": 507110, "epoch": 6109} {"train_loss": -27.53388023376465, "global_step": 507111, "epoch": 6109} {"train_loss": -27.487974166870117, "global_step": 507112, "epoch": 6109} {"train_loss": -27.490478515625, "global_step": 507113, "epoch": 6109} {"train_loss": -27.377490997314453, "global_step": 507114, "epoch": 6109} {"train_loss": -27.341039657592773, "global_step": 507115, "epoch": 6109} {"train_loss": -27.8010311126709, "global_step": 507116, "epoch": 6109} {"train_loss": -27.513647079467773, "global_step": 507117, "epoch": 6109} {"train_loss": -27.136810302734375, "global_step": 507118, "epoch": 6109} {"train_loss": -27.24468994140625, "global_step": 507119, "epoch": 6109} {"train_loss": -27.366247177124023, "global_step": 507120, "epoch": 6109} {"train_loss": -27.275537490844727, "global_step": 507121, "epoch": 6109} {"train_loss": -27.761978149414062, "global_step": 507122, "epoch": 6109} {"train_loss": -27.585187911987305, "global_step": 507123, "epoch": 6109} {"train_loss": -27.496906280517578, "global_step": 507124, "epoch": 6109} {"train_loss": -27.327661514282227, "global_step": 507125, "epoch": 6109} {"train_loss": -27.506277084350586, "global_step": 507126, "epoch": 6109} {"train_loss": -27.925146102905273, "global_step": 507127, "epoch": 6109} {"train_loss": -27.622812271118164, "global_step": 507128, "epoch": 6109} {"train_loss": -26.89520762340132, "global_step": 507129, "epoch": 6109, "val_loss": 6542440.0} {"train_loss": -26.802404403686523, "global_step": 507130, "epoch": 6110} {"train_loss": -27.00593376159668, "global_step": 507131, "epoch": 6110} {"train_loss": -26.731948852539062, "global_step": 507132, "epoch": 6110} {"train_loss": -26.8328857421875, "global_step": 507133, "epoch": 6110} {"train_loss": -26.6796932220459, "global_step": 507134, "epoch": 6110} {"train_loss": -26.7935848236084, "global_step": 507135, "epoch": 6110} {"train_loss": -26.912139892578125, "global_step": 507136, "epoch": 6110} {"train_loss": -26.84242057800293, "global_step": 507137, "epoch": 6110} {"train_loss": -26.919580459594727, "global_step": 507138, "epoch": 6110} {"train_loss": -27.21917724609375, "global_step": 507139, "epoch": 6110} {"train_loss": -26.62353515625, "global_step": 507140, "epoch": 6110} {"train_loss": -26.660125732421875, "global_step": 507141, "epoch": 6110} {"train_loss": -27.084716796875, "global_step": 507142, "epoch": 6110} {"train_loss": -27.251142501831055, "global_step": 507143, "epoch": 6110} {"train_loss": -27.22260093688965, "global_step": 507144, "epoch": 6110} {"train_loss": -27.22675132751465, "global_step": 507145, "epoch": 6110} {"train_loss": -27.077733993530273, "global_step": 507146, "epoch": 6110} {"train_loss": -26.81532859802246, "global_step": 507147, "epoch": 6110} {"train_loss": -27.16104507446289, "global_step": 507148, "epoch": 6110} {"train_loss": -27.187881469726562, "global_step": 507149, "epoch": 6110} {"train_loss": -26.814105987548828, "global_step": 507150, "epoch": 6110} {"train_loss": -27.046142578125, "global_step": 507151, "epoch": 6110} {"train_loss": -27.222747802734375, "global_step": 507152, "epoch": 6110} {"train_loss": -27.162799835205078, "global_step": 507153, "epoch": 6110} {"train_loss": -27.40087890625, "global_step": 507154, "epoch": 6110} {"train_loss": -27.373281478881836, "global_step": 507155, "epoch": 6110} {"train_loss": -27.39735221862793, "global_step": 507156, "epoch": 6110} {"train_loss": -26.879804611206055, "global_step": 507157, "epoch": 6110} {"train_loss": -27.10725212097168, "global_step": 507158, "epoch": 6110} {"train_loss": -27.20485496520996, "global_step": 507159, "epoch": 6110} {"train_loss": -27.913740158081055, "global_step": 507160, "epoch": 6110} {"train_loss": -27.273807525634766, "global_step": 507161, "epoch": 6110} {"train_loss": -27.288373947143555, "global_step": 507162, "epoch": 6110} {"train_loss": -27.6333065032959, "global_step": 507163, "epoch": 6110} {"train_loss": -27.652135848999023, "global_step": 507164, "epoch": 6110} {"train_loss": -27.408496856689453, "global_step": 507165, "epoch": 6110} {"train_loss": -27.986846923828125, "global_step": 507166, "epoch": 6110} {"train_loss": -27.558874130249023, "global_step": 507167, "epoch": 6110} {"train_loss": -27.68754005432129, "global_step": 507168, "epoch": 6110} {"train_loss": -27.407751083374023, "global_step": 507169, "epoch": 6110} {"train_loss": -27.39288902282715, "global_step": 507170, "epoch": 6110} {"train_loss": -27.509130477905273, "global_step": 507171, "epoch": 6110} {"train_loss": -27.6292724609375, "global_step": 507172, "epoch": 6110} {"train_loss": -27.77349853515625, "global_step": 507173, "epoch": 6110} {"train_loss": -27.590238571166992, "global_step": 507174, "epoch": 6110} {"train_loss": -27.193464279174805, "global_step": 507175, "epoch": 6110} {"train_loss": -27.656982421875, "global_step": 507176, "epoch": 6110} {"train_loss": -27.66330909729004, "global_step": 507177, "epoch": 6110} {"train_loss": -27.3964786529541, "global_step": 507178, "epoch": 6110} {"train_loss": -27.062925338745117, "global_step": 507179, "epoch": 6110} {"train_loss": -27.1117000579834, "global_step": 507180, "epoch": 6110} {"train_loss": -27.53226661682129, "global_step": 507181, "epoch": 6110} {"train_loss": -27.74530029296875, "global_step": 507182, "epoch": 6110} {"train_loss": -27.4057674407959, "global_step": 507183, "epoch": 6110} {"train_loss": -27.235889434814453, "global_step": 507184, "epoch": 6110} {"train_loss": -27.10589599609375, "global_step": 507185, "epoch": 6110} {"train_loss": -27.329565048217773, "global_step": 507186, "epoch": 6110} {"train_loss": -27.14814567565918, "global_step": 507187, "epoch": 6110} {"train_loss": -27.5954532623291, "global_step": 507188, "epoch": 6110} {"train_loss": -27.4778995513916, "global_step": 507189, "epoch": 6110} {"train_loss": -27.327655792236328, "global_step": 507190, "epoch": 6110} {"train_loss": -27.523624420166016, "global_step": 507191, "epoch": 6110} {"train_loss": -27.72687339782715, "global_step": 507192, "epoch": 6110} {"train_loss": -27.652929306030273, "global_step": 507193, "epoch": 6110} {"train_loss": -27.9309024810791, "global_step": 507194, "epoch": 6110} {"train_loss": -27.781482696533203, "global_step": 507195, "epoch": 6110} {"train_loss": -27.775609970092773, "global_step": 507196, "epoch": 6110} {"train_loss": -27.634729385375977, "global_step": 507197, "epoch": 6110} {"train_loss": -27.451873779296875, "global_step": 507198, "epoch": 6110} {"train_loss": -27.682373046875, "global_step": 507199, "epoch": 6110} {"train_loss": -27.789310455322266, "global_step": 507200, "epoch": 6110} {"train_loss": -27.527902603149414, "global_step": 507201, "epoch": 6110} {"train_loss": -27.475194931030273, "global_step": 507202, "epoch": 6110} {"train_loss": -27.616531372070312, "global_step": 507203, "epoch": 6110} {"train_loss": -27.677885055541992, "global_step": 507204, "epoch": 6110} {"train_loss": -27.553958892822266, "global_step": 507205, "epoch": 6110} {"train_loss": -27.242624282836914, "global_step": 507206, "epoch": 6110} {"train_loss": -27.412893295288086, "global_step": 507207, "epoch": 6110} {"train_loss": -27.51607322692871, "global_step": 507208, "epoch": 6110} {"train_loss": -26.99934959411621, "global_step": 507209, "epoch": 6110} {"train_loss": -27.388036727905273, "global_step": 507210, "epoch": 6110} {"train_loss": -27.51959228515625, "global_step": 507211, "epoch": 6110} {"train_loss": -27.336727601936065, "global_step": 507212, "epoch": 6110, "val_loss": 6644282.0} {"train_loss": -27.216949462890625, "global_step": 507213, "epoch": 6111} {"train_loss": -27.309738159179688, "global_step": 507214, "epoch": 6111} {"train_loss": -26.226123809814453, "global_step": 507215, "epoch": 6111} {"train_loss": -25.86170768737793, "global_step": 507216, "epoch": 6111} {"train_loss": -26.597684860229492, "global_step": 507217, "epoch": 6111} {"train_loss": -26.697101593017578, "global_step": 507218, "epoch": 6111} {"train_loss": -26.495222091674805, "global_step": 507219, "epoch": 6111} {"train_loss": -26.517181396484375, "global_step": 507220, "epoch": 6111} {"train_loss": -26.981231689453125, "global_step": 507221, "epoch": 6111} {"train_loss": -26.53891372680664, "global_step": 507222, "epoch": 6111} {"train_loss": -26.504919052124023, "global_step": 507223, "epoch": 6111} {"train_loss": -27.205915451049805, "global_step": 507224, "epoch": 6111} {"train_loss": -26.712238311767578, "global_step": 507225, "epoch": 6111} {"train_loss": -26.748205184936523, "global_step": 507226, "epoch": 6111} {"train_loss": -27.056360244750977, "global_step": 507227, "epoch": 6111} {"train_loss": -27.12334632873535, "global_step": 507228, "epoch": 6111} {"train_loss": -26.649518966674805, "global_step": 507229, "epoch": 6111} {"train_loss": -26.901395797729492, "global_step": 507230, "epoch": 6111} {"train_loss": -26.868621826171875, "global_step": 507231, "epoch": 6111} {"train_loss": -27.133468627929688, "global_step": 507232, "epoch": 6111} {"train_loss": -26.873132705688477, "global_step": 507233, "epoch": 6111} {"train_loss": -27.41143226623535, "global_step": 507234, "epoch": 6111} {"train_loss": -26.8424129486084, "global_step": 507235, "epoch": 6111} {"train_loss": -26.92024040222168, "global_step": 507236, "epoch": 6111} {"train_loss": -27.305021286010742, "global_step": 507237, "epoch": 6111} {"train_loss": -27.07110595703125, "global_step": 507238, "epoch": 6111} {"train_loss": -27.525135040283203, "global_step": 507239, "epoch": 6111} {"train_loss": -27.33274269104004, "global_step": 507240, "epoch": 6111} {"train_loss": -27.654691696166992, "global_step": 507241, "epoch": 6111} {"train_loss": -27.572580337524414, "global_step": 507242, "epoch": 6111} {"train_loss": -27.462173461914062, "global_step": 507243, "epoch": 6111} {"train_loss": -27.386926651000977, "global_step": 507244, "epoch": 6111} {"train_loss": -27.136554718017578, "global_step": 507245, "epoch": 6111} {"train_loss": -27.315576553344727, "global_step": 507246, "epoch": 6111} {"train_loss": -27.845569610595703, "global_step": 507247, "epoch": 6111} {"train_loss": -27.50126075744629, "global_step": 507248, "epoch": 6111} {"train_loss": -27.678558349609375, "global_step": 507249, "epoch": 6111} {"train_loss": -27.293521881103516, "global_step": 507250, "epoch": 6111} {"train_loss": -27.24366569519043, "global_step": 507251, "epoch": 6111} {"train_loss": -27.590778350830078, "global_step": 507252, "epoch": 6111} {"train_loss": -27.31770896911621, "global_step": 507253, "epoch": 6111} {"train_loss": -27.341495513916016, "global_step": 507254, "epoch": 6111} {"train_loss": -27.412372589111328, "global_step": 507255, "epoch": 6111} {"train_loss": -27.683385848999023, "global_step": 507256, "epoch": 6111} {"train_loss": -27.634906768798828, "global_step": 507257, "epoch": 6111} {"train_loss": -27.661401748657227, "global_step": 507258, "epoch": 6111} {"train_loss": -27.443899154663086, "global_step": 507259, "epoch": 6111} {"train_loss": -27.415637969970703, "global_step": 507260, "epoch": 6111} {"train_loss": -27.426904678344727, "global_step": 507261, "epoch": 6111} {"train_loss": -27.480304718017578, "global_step": 507262, "epoch": 6111} {"train_loss": -27.287214279174805, "global_step": 507263, "epoch": 6111} {"train_loss": -27.605798721313477, "global_step": 507264, "epoch": 6111} {"train_loss": -27.787357330322266, "global_step": 507265, "epoch": 6111} {"train_loss": -27.605731964111328, "global_step": 507266, "epoch": 6111} {"train_loss": -27.75543212890625, "global_step": 507267, "epoch": 6111} {"train_loss": -27.58745765686035, "global_step": 507268, "epoch": 6111} {"train_loss": -27.411855697631836, "global_step": 507269, "epoch": 6111} {"train_loss": -27.300704956054688, "global_step": 507270, "epoch": 6111} {"train_loss": -27.582441329956055, "global_step": 507271, "epoch": 6111} {"train_loss": -26.797399520874023, "global_step": 507272, "epoch": 6111} {"train_loss": -25.490690231323242, "global_step": 507273, "epoch": 6111} {"train_loss": -25.67388916015625, "global_step": 507274, "epoch": 6111} {"train_loss": -27.067365646362305, "global_step": 507275, "epoch": 6111} {"train_loss": -27.002225875854492, "global_step": 507276, "epoch": 6111} {"train_loss": -27.198627471923828, "global_step": 507277, "epoch": 6111} {"train_loss": -27.050260543823242, "global_step": 507278, "epoch": 6111} {"train_loss": -27.000690460205078, "global_step": 507279, "epoch": 6111} {"train_loss": -27.415607452392578, "global_step": 507280, "epoch": 6111} {"train_loss": -26.944799423217773, "global_step": 507281, "epoch": 6111} {"train_loss": -27.170246124267578, "global_step": 507282, "epoch": 6111} {"train_loss": -27.2291202545166, "global_step": 507283, "epoch": 6111} {"train_loss": -27.423892974853516, "global_step": 507284, "epoch": 6111} {"train_loss": -27.337051391601562, "global_step": 507285, "epoch": 6111} {"train_loss": -27.2136287689209, "global_step": 507286, "epoch": 6111} {"train_loss": -27.32917594909668, "global_step": 507287, "epoch": 6111} {"train_loss": -27.2888126373291, "global_step": 507288, "epoch": 6111} {"train_loss": -27.410985946655273, "global_step": 507289, "epoch": 6111} {"train_loss": -27.286285400390625, "global_step": 507290, "epoch": 6111} {"train_loss": -27.423389434814453, "global_step": 507291, "epoch": 6111} {"train_loss": -27.221073150634766, "global_step": 507292, "epoch": 6111} {"train_loss": -27.44904899597168, "global_step": 507293, "epoch": 6111} {"train_loss": -27.51429557800293, "global_step": 507294, "epoch": 6111} {"train_loss": -27.182543352425817, "global_step": 507295, "epoch": 6111, "val_loss": 6658632.0} {"train_loss": -26.587289810180664, "global_step": 507296, "epoch": 6112} {"train_loss": -26.832874298095703, "global_step": 507297, "epoch": 6112} {"train_loss": -26.851606369018555, "global_step": 507298, "epoch": 6112} {"train_loss": -26.7276611328125, "global_step": 507299, "epoch": 6112} {"train_loss": -27.17860984802246, "global_step": 507300, "epoch": 6112} {"train_loss": -26.98560905456543, "global_step": 507301, "epoch": 6112} {"train_loss": -26.5920467376709, "global_step": 507302, "epoch": 6112} {"train_loss": -27.36417579650879, "global_step": 507303, "epoch": 6112} {"train_loss": -26.729700088500977, "global_step": 507304, "epoch": 6112} {"train_loss": -27.251935958862305, "global_step": 507305, "epoch": 6112} {"train_loss": -27.029829025268555, "global_step": 507306, "epoch": 6112} {"train_loss": -27.024667739868164, "global_step": 507307, "epoch": 6112} {"train_loss": -27.162351608276367, "global_step": 507308, "epoch": 6112} {"train_loss": -27.223377227783203, "global_step": 507309, "epoch": 6112} {"train_loss": -27.393476486206055, "global_step": 507310, "epoch": 6112} {"train_loss": -27.627933502197266, "global_step": 507311, "epoch": 6112} {"train_loss": -27.471683502197266, "global_step": 507312, "epoch": 6112} {"train_loss": -27.23322868347168, "global_step": 507313, "epoch": 6112} {"train_loss": -27.355112075805664, "global_step": 507314, "epoch": 6112} {"train_loss": -27.40875816345215, "global_step": 507315, "epoch": 6112} {"train_loss": -27.423887252807617, "global_step": 507316, "epoch": 6112} {"train_loss": -27.0494441986084, "global_step": 507317, "epoch": 6112} {"train_loss": -27.44148063659668, "global_step": 507318, "epoch": 6112} {"train_loss": -26.951963424682617, "global_step": 507319, "epoch": 6112} {"train_loss": -27.32198143005371, "global_step": 507320, "epoch": 6112} {"train_loss": -27.5565242767334, "global_step": 507321, "epoch": 6112} {"train_loss": -27.167455673217773, "global_step": 507322, "epoch": 6112} {"train_loss": -27.85774040222168, "global_step": 507323, "epoch": 6112} {"train_loss": -27.570636749267578, "global_step": 507324, "epoch": 6112} {"train_loss": -27.679426193237305, "global_step": 507325, "epoch": 6112} {"train_loss": -27.522485733032227, "global_step": 507326, "epoch": 6112} {"train_loss": -27.37676429748535, "global_step": 507327, "epoch": 6112} {"train_loss": -27.388092041015625, "global_step": 507328, "epoch": 6112} {"train_loss": -27.423383712768555, "global_step": 507329, "epoch": 6112} {"train_loss": -27.714385986328125, "global_step": 507330, "epoch": 6112} {"train_loss": -27.61199378967285, "global_step": 507331, "epoch": 6112} {"train_loss": -27.596424102783203, "global_step": 507332, "epoch": 6112} {"train_loss": -27.553058624267578, "global_step": 507333, "epoch": 6112} {"train_loss": -27.51795768737793, "global_step": 507334, "epoch": 6112} {"train_loss": -27.4306583404541, "global_step": 507335, "epoch": 6112} {"train_loss": -27.719266891479492, "global_step": 507336, "epoch": 6112} {"train_loss": -27.26068115234375, "global_step": 507337, "epoch": 6112} {"train_loss": -27.63836669921875, "global_step": 507338, "epoch": 6112} {"train_loss": -27.57887077331543, "global_step": 507339, "epoch": 6112} {"train_loss": -27.281265258789062, "global_step": 507340, "epoch": 6112} {"train_loss": -27.13909912109375, "global_step": 507341, "epoch": 6112} {"train_loss": -27.38547706604004, "global_step": 507342, "epoch": 6112} {"train_loss": -27.157506942749023, "global_step": 507343, "epoch": 6112} {"train_loss": -27.482955932617188, "global_step": 507344, "epoch": 6112} {"train_loss": -27.309555053710938, "global_step": 507345, "epoch": 6112} {"train_loss": -27.32742691040039, "global_step": 507346, "epoch": 6112} {"train_loss": -27.625579833984375, "global_step": 507347, "epoch": 6112} {"train_loss": -27.171585083007812, "global_step": 507348, "epoch": 6112} {"train_loss": -27.316883087158203, "global_step": 507349, "epoch": 6112} {"train_loss": -27.341115951538086, "global_step": 507350, "epoch": 6112} {"train_loss": -27.412282943725586, "global_step": 507351, "epoch": 6112} {"train_loss": -27.366506576538086, "global_step": 507352, "epoch": 6112} {"train_loss": -27.03277015686035, "global_step": 507353, "epoch": 6112} {"train_loss": -27.639501571655273, "global_step": 507354, "epoch": 6112} {"train_loss": -27.58502769470215, "global_step": 507355, "epoch": 6112} {"train_loss": -27.5593204498291, "global_step": 507356, "epoch": 6112} {"train_loss": -27.696985244750977, "global_step": 507357, "epoch": 6112} {"train_loss": -27.153594970703125, "global_step": 507358, "epoch": 6112} {"train_loss": -27.883935928344727, "global_step": 507359, "epoch": 6112} {"train_loss": -27.092741012573242, "global_step": 507360, "epoch": 6112} {"train_loss": -27.204870223999023, "global_step": 507361, "epoch": 6112} {"train_loss": -27.300384521484375, "global_step": 507362, "epoch": 6112} {"train_loss": -27.415847778320312, "global_step": 507363, "epoch": 6112} {"train_loss": -27.31873893737793, "global_step": 507364, "epoch": 6112} {"train_loss": -27.363004684448242, "global_step": 507365, "epoch": 6112} {"train_loss": -27.3707218170166, "global_step": 507366, "epoch": 6112} {"train_loss": -27.112958908081055, "global_step": 507367, "epoch": 6112} {"train_loss": -27.22157096862793, "global_step": 507368, "epoch": 6112} {"train_loss": -27.187299728393555, "global_step": 507369, "epoch": 6112} {"train_loss": -27.455062866210938, "global_step": 507370, "epoch": 6112} {"train_loss": -27.493671417236328, "global_step": 507371, "epoch": 6112} {"train_loss": -27.002017974853516, "global_step": 507372, "epoch": 6112} {"train_loss": -27.321332931518555, "global_step": 507373, "epoch": 6112} {"train_loss": -27.460159301757812, "global_step": 507374, "epoch": 6112} {"train_loss": -27.29075050354004, "global_step": 507375, "epoch": 6112} {"train_loss": -27.5922794342041, "global_step": 507376, "epoch": 6112} {"train_loss": -27.325393676757812, "global_step": 507377, "epoch": 6112} {"train_loss": -27.331044116652155, "global_step": 507378, "epoch": 6112, "val_loss": 6696590.0} {"train_loss": -27.55145835876465, "global_step": 507379, "epoch": 6113} {"train_loss": -27.145965576171875, "global_step": 507380, "epoch": 6113} {"train_loss": -27.52985954284668, "global_step": 507381, "epoch": 6113} {"train_loss": -26.90424156188965, "global_step": 507382, "epoch": 6113} {"train_loss": -26.898792266845703, "global_step": 507383, "epoch": 6113} {"train_loss": -27.207387924194336, "global_step": 507384, "epoch": 6113} {"train_loss": -27.350080490112305, "global_step": 507385, "epoch": 6113} {"train_loss": -27.564178466796875, "global_step": 507386, "epoch": 6113} {"train_loss": -26.908004760742188, "global_step": 507387, "epoch": 6113} {"train_loss": -26.70648193359375, "global_step": 507388, "epoch": 6113} {"train_loss": -27.006452560424805, "global_step": 507389, "epoch": 6113} {"train_loss": -27.7924861907959, "global_step": 507390, "epoch": 6113} {"train_loss": -26.934167861938477, "global_step": 507391, "epoch": 6113} {"train_loss": -27.21661376953125, "global_step": 507392, "epoch": 6113} {"train_loss": -27.311325073242188, "global_step": 507393, "epoch": 6113} {"train_loss": -27.225814819335938, "global_step": 507394, "epoch": 6113} {"train_loss": -27.504907608032227, "global_step": 507395, "epoch": 6113} {"train_loss": -27.09502601623535, "global_step": 507396, "epoch": 6113} {"train_loss": -27.756444931030273, "global_step": 507397, "epoch": 6113} {"train_loss": -27.054712295532227, "global_step": 507398, "epoch": 6113} {"train_loss": -27.152036666870117, "global_step": 507399, "epoch": 6113} {"train_loss": -27.263824462890625, "global_step": 507400, "epoch": 6113} {"train_loss": -27.446386337280273, "global_step": 507401, "epoch": 6113} {"train_loss": -27.21649742126465, "global_step": 507402, "epoch": 6113} {"train_loss": -27.322528839111328, "global_step": 507403, "epoch": 6113} {"train_loss": -27.3790225982666, "global_step": 507404, "epoch": 6113} {"train_loss": -27.24493980407715, "global_step": 507405, "epoch": 6113} {"train_loss": -27.299713134765625, "global_step": 507406, "epoch": 6113} {"train_loss": -27.235015869140625, "global_step": 507407, "epoch": 6113} {"train_loss": -27.325952529907227, "global_step": 507408, "epoch": 6113} {"train_loss": -27.114795684814453, "global_step": 507409, "epoch": 6113} {"train_loss": -27.277917861938477, "global_step": 507410, "epoch": 6113} {"train_loss": -27.298986434936523, "global_step": 507411, "epoch": 6113} {"train_loss": -27.066991806030273, "global_step": 507412, "epoch": 6113} {"train_loss": -27.243650436401367, "global_step": 507413, "epoch": 6113} {"train_loss": -27.43304443359375, "global_step": 507414, "epoch": 6113} {"train_loss": -27.667646408081055, "global_step": 507415, "epoch": 6113} {"train_loss": -27.541061401367188, "global_step": 507416, "epoch": 6113} {"train_loss": -27.015607833862305, "global_step": 507417, "epoch": 6113} {"train_loss": -27.642099380493164, "global_step": 507418, "epoch": 6113} {"train_loss": -27.451440811157227, "global_step": 507419, "epoch": 6113} {"train_loss": -27.106536865234375, "global_step": 507420, "epoch": 6113} {"train_loss": -27.239789962768555, "global_step": 507421, "epoch": 6113} {"train_loss": -27.20600700378418, "global_step": 507422, "epoch": 6113} {"train_loss": -27.439151763916016, "global_step": 507423, "epoch": 6113} {"train_loss": -27.190256118774414, "global_step": 507424, "epoch": 6113} {"train_loss": -27.543243408203125, "global_step": 507425, "epoch": 6113} {"train_loss": -27.475296020507812, "global_step": 507426, "epoch": 6113} {"train_loss": -27.406530380249023, "global_step": 507427, "epoch": 6113} {"train_loss": -27.863866806030273, "global_step": 507428, "epoch": 6113} {"train_loss": -27.48777198791504, "global_step": 507429, "epoch": 6113} {"train_loss": -27.759876251220703, "global_step": 507430, "epoch": 6113} {"train_loss": -27.676513671875, "global_step": 507431, "epoch": 6113} {"train_loss": -27.52388572692871, "global_step": 507432, "epoch": 6113} {"train_loss": -27.625640869140625, "global_step": 507433, "epoch": 6113} {"train_loss": -27.672338485717773, "global_step": 507434, "epoch": 6113} {"train_loss": -27.421558380126953, "global_step": 507435, "epoch": 6113} {"train_loss": -27.465442657470703, "global_step": 507436, "epoch": 6113} {"train_loss": -27.452890396118164, "global_step": 507437, "epoch": 6113} {"train_loss": -27.83437156677246, "global_step": 507438, "epoch": 6113} {"train_loss": -27.53315544128418, "global_step": 507439, "epoch": 6113} {"train_loss": -27.399572372436523, "global_step": 507440, "epoch": 6113} {"train_loss": -27.38458251953125, "global_step": 507441, "epoch": 6113} {"train_loss": -27.670825958251953, "global_step": 507442, "epoch": 6113} {"train_loss": -27.588178634643555, "global_step": 507443, "epoch": 6113} {"train_loss": -27.523324966430664, "global_step": 507444, "epoch": 6113} {"train_loss": -27.817920684814453, "global_step": 507445, "epoch": 6113} {"train_loss": -27.332075119018555, "global_step": 507446, "epoch": 6113} {"train_loss": -27.471487045288086, "global_step": 507447, "epoch": 6113} {"train_loss": -27.450159072875977, "global_step": 507448, "epoch": 6113} {"train_loss": -27.68739128112793, "global_step": 507449, "epoch": 6113} {"train_loss": -27.7650203704834, "global_step": 507450, "epoch": 6113} {"train_loss": -27.679046630859375, "global_step": 507451, "epoch": 6113} {"train_loss": -27.694074630737305, "global_step": 507452, "epoch": 6113} {"train_loss": -27.471878051757812, "global_step": 507453, "epoch": 6113} {"train_loss": -27.780029296875, "global_step": 507454, "epoch": 6113} {"train_loss": -27.089502334594727, "global_step": 507455, "epoch": 6113} {"train_loss": -27.7691593170166, "global_step": 507456, "epoch": 6113} {"train_loss": -27.4578914642334, "global_step": 507457, "epoch": 6113} {"train_loss": -27.847314834594727, "global_step": 507458, "epoch": 6113} {"train_loss": -27.568130493164062, "global_step": 507459, "epoch": 6113} {"train_loss": -28.04119873046875, "global_step": 507460, "epoch": 6113} {"train_loss": -27.422389317707843, "global_step": 507461, "epoch": 6113, "val_loss": 6679465.0} {"train_loss": -27.044553756713867, "global_step": 507462, "epoch": 6114} {"train_loss": -26.341266632080078, "global_step": 507463, "epoch": 6114} {"train_loss": -25.866186141967773, "global_step": 507464, "epoch": 6114} {"train_loss": -25.851221084594727, "global_step": 507465, "epoch": 6114} {"train_loss": -25.861663818359375, "global_step": 507466, "epoch": 6114} {"train_loss": -26.877063751220703, "global_step": 507467, "epoch": 6114} {"train_loss": -26.7423095703125, "global_step": 507468, "epoch": 6114} {"train_loss": -25.73322868347168, "global_step": 507469, "epoch": 6114} {"train_loss": -27.187219619750977, "global_step": 507470, "epoch": 6114} {"train_loss": -26.353473663330078, "global_step": 507471, "epoch": 6114} {"train_loss": -26.995954513549805, "global_step": 507472, "epoch": 6114} {"train_loss": -26.710346221923828, "global_step": 507473, "epoch": 6114} {"train_loss": -26.527801513671875, "global_step": 507474, "epoch": 6114} {"train_loss": -26.51319694519043, "global_step": 507475, "epoch": 6114} {"train_loss": -26.89503288269043, "global_step": 507476, "epoch": 6114} {"train_loss": -26.775869369506836, "global_step": 507477, "epoch": 6114} {"train_loss": -27.04852294921875, "global_step": 507478, "epoch": 6114} {"train_loss": -27.1541690826416, "global_step": 507479, "epoch": 6114} {"train_loss": -26.889057159423828, "global_step": 507480, "epoch": 6114} {"train_loss": -26.803314208984375, "global_step": 507481, "epoch": 6114} {"train_loss": -27.077787399291992, "global_step": 507482, "epoch": 6114} {"train_loss": -27.66507339477539, "global_step": 507483, "epoch": 6114} {"train_loss": -27.21404457092285, "global_step": 507484, "epoch": 6114} {"train_loss": -27.365453720092773, "global_step": 507485, "epoch": 6114} {"train_loss": -27.584379196166992, "global_step": 507486, "epoch": 6114} {"train_loss": -27.13544273376465, "global_step": 507487, "epoch": 6114} {"train_loss": -27.33119773864746, "global_step": 507488, "epoch": 6114} {"train_loss": -27.3930606842041, "global_step": 507489, "epoch": 6114} {"train_loss": -27.17310905456543, "global_step": 507490, "epoch": 6114} {"train_loss": -27.546009063720703, "global_step": 507491, "epoch": 6114} {"train_loss": -27.178131103515625, "global_step": 507492, "epoch": 6114} {"train_loss": -27.607666015625, "global_step": 507493, "epoch": 6114} {"train_loss": -27.50238037109375, "global_step": 507494, "epoch": 6114} {"train_loss": -27.76751708984375, "global_step": 507495, "epoch": 6114} {"train_loss": -27.48590660095215, "global_step": 507496, "epoch": 6114} {"train_loss": -27.56206703186035, "global_step": 507497, "epoch": 6114} {"train_loss": -27.852161407470703, "global_step": 507498, "epoch": 6114} {"train_loss": -27.573495864868164, "global_step": 507499, "epoch": 6114} {"train_loss": -27.662494659423828, "global_step": 507500, "epoch": 6114} {"train_loss": -27.779926300048828, "global_step": 507501, "epoch": 6114} {"train_loss": -27.766550064086914, "global_step": 507502, "epoch": 6114} {"train_loss": -27.782751083374023, "global_step": 507503, "epoch": 6114} {"train_loss": -27.685739517211914, "global_step": 507504, "epoch": 6114} {"train_loss": -27.62603759765625, "global_step": 507505, "epoch": 6114} {"train_loss": -27.60917091369629, "global_step": 507506, "epoch": 6114} {"train_loss": -27.623083114624023, "global_step": 507507, "epoch": 6114} {"train_loss": -27.80419921875, "global_step": 507508, "epoch": 6114} {"train_loss": -27.598831176757812, "global_step": 507509, "epoch": 6114} {"train_loss": -27.798736572265625, "global_step": 507510, "epoch": 6114} {"train_loss": -27.47016716003418, "global_step": 507511, "epoch": 6114} {"train_loss": -27.426843643188477, "global_step": 507512, "epoch": 6114} {"train_loss": -27.62067222595215, "global_step": 507513, "epoch": 6114} {"train_loss": -27.67206382751465, "global_step": 507514, "epoch": 6114} {"train_loss": -27.605792999267578, "global_step": 507515, "epoch": 6114} {"train_loss": -27.802978515625, "global_step": 507516, "epoch": 6114} {"train_loss": -27.92024040222168, "global_step": 507517, "epoch": 6114} {"train_loss": -27.556873321533203, "global_step": 507518, "epoch": 6114} {"train_loss": -26.859867095947266, "global_step": 507519, "epoch": 6114} {"train_loss": -27.321805953979492, "global_step": 507520, "epoch": 6114} {"train_loss": -27.392654418945312, "global_step": 507521, "epoch": 6114} {"train_loss": -27.204376220703125, "global_step": 507522, "epoch": 6114} {"train_loss": -27.756412506103516, "global_step": 507523, "epoch": 6114} {"train_loss": -27.212085723876953, "global_step": 507524, "epoch": 6114} {"train_loss": -27.000669479370117, "global_step": 507525, "epoch": 6114} {"train_loss": -27.085580825805664, "global_step": 507526, "epoch": 6114} {"train_loss": -26.8999080657959, "global_step": 507527, "epoch": 6114} {"train_loss": -26.97102165222168, "global_step": 507528, "epoch": 6114} {"train_loss": -26.914642333984375, "global_step": 507529, "epoch": 6114} {"train_loss": -27.080474853515625, "global_step": 507530, "epoch": 6114} {"train_loss": -27.253400802612305, "global_step": 507531, "epoch": 6114} {"train_loss": -26.477643966674805, "global_step": 507532, "epoch": 6114} {"train_loss": -27.210844039916992, "global_step": 507533, "epoch": 6114} {"train_loss": -26.9084415435791, "global_step": 507534, "epoch": 6114} {"train_loss": -27.004392623901367, "global_step": 507535, "epoch": 6114} {"train_loss": -27.165576934814453, "global_step": 507536, "epoch": 6114} {"train_loss": -27.150405883789062, "global_step": 507537, "epoch": 6114} {"train_loss": -27.114761352539062, "global_step": 507538, "epoch": 6114} {"train_loss": -27.54302406311035, "global_step": 507539, "epoch": 6114} {"train_loss": -27.226354598999023, "global_step": 507540, "epoch": 6114} {"train_loss": -27.334827423095703, "global_step": 507541, "epoch": 6114} {"train_loss": -27.33296012878418, "global_step": 507542, "epoch": 6114} {"train_loss": -27.912267684936523, "global_step": 507543, "epoch": 6114} {"train_loss": -27.210556696696454, "global_step": 507544, "epoch": 6114, "val_loss": 6630188.0} {"train_loss": -26.845829010009766, "global_step": 507545, "epoch": 6115} {"train_loss": -26.739837646484375, "global_step": 507546, "epoch": 6115} {"train_loss": -26.853124618530273, "global_step": 507547, "epoch": 6115} {"train_loss": -27.425016403198242, "global_step": 507548, "epoch": 6115} {"train_loss": -27.30742835998535, "global_step": 507549, "epoch": 6115} {"train_loss": -27.439489364624023, "global_step": 507550, "epoch": 6115} {"train_loss": -26.86628532409668, "global_step": 507551, "epoch": 6115} {"train_loss": -27.082624435424805, "global_step": 507552, "epoch": 6115} {"train_loss": -27.381383895874023, "global_step": 507553, "epoch": 6115} {"train_loss": -27.67361831665039, "global_step": 507554, "epoch": 6115} {"train_loss": -27.239377975463867, "global_step": 507555, "epoch": 6115} {"train_loss": -27.261520385742188, "global_step": 507556, "epoch": 6115} {"train_loss": -26.921667098999023, "global_step": 507557, "epoch": 6115} {"train_loss": -27.44428062438965, "global_step": 507558, "epoch": 6115} {"train_loss": -27.427780151367188, "global_step": 507559, "epoch": 6115} {"train_loss": -27.273183822631836, "global_step": 507560, "epoch": 6115} {"train_loss": -27.24680519104004, "global_step": 507561, "epoch": 6115} {"train_loss": -27.47443962097168, "global_step": 507562, "epoch": 6115} {"train_loss": -27.4046630859375, "global_step": 507563, "epoch": 6115} {"train_loss": -27.24755859375, "global_step": 507564, "epoch": 6115} {"train_loss": -27.59441566467285, "global_step": 507565, "epoch": 6115} {"train_loss": -27.386188507080078, "global_step": 507566, "epoch": 6115} {"train_loss": -27.29542350769043, "global_step": 507567, "epoch": 6115} {"train_loss": -27.23430824279785, "global_step": 507568, "epoch": 6115} {"train_loss": -27.543909072875977, "global_step": 507569, "epoch": 6115} {"train_loss": -27.33697509765625, "global_step": 507570, "epoch": 6115} {"train_loss": -27.697132110595703, "global_step": 507571, "epoch": 6115} {"train_loss": -27.572895050048828, "global_step": 507572, "epoch": 6115} {"train_loss": -27.318883895874023, "global_step": 507573, "epoch": 6115} {"train_loss": -27.10027503967285, "global_step": 507574, "epoch": 6115} {"train_loss": -27.55845069885254, "global_step": 507575, "epoch": 6115} {"train_loss": -27.66936683654785, "global_step": 507576, "epoch": 6115} {"train_loss": -27.785297393798828, "global_step": 507577, "epoch": 6115} {"train_loss": -27.61338233947754, "global_step": 507578, "epoch": 6115} {"train_loss": -27.3743896484375, "global_step": 507579, "epoch": 6115} {"train_loss": -27.434188842773438, "global_step": 507580, "epoch": 6115} {"train_loss": -27.605575561523438, "global_step": 507581, "epoch": 6115} {"train_loss": -27.707015991210938, "global_step": 507582, "epoch": 6115} {"train_loss": -27.81864356994629, "global_step": 507583, "epoch": 6115} {"train_loss": -27.61335563659668, "global_step": 507584, "epoch": 6115} {"train_loss": -27.5268611907959, "global_step": 507585, "epoch": 6115} {"train_loss": -27.651838302612305, "global_step": 507586, "epoch": 6115} {"train_loss": -27.490020751953125, "global_step": 507587, "epoch": 6115} {"train_loss": -27.806745529174805, "global_step": 507588, "epoch": 6115} {"train_loss": -27.54534912109375, "global_step": 507589, "epoch": 6115} {"train_loss": -27.83660316467285, "global_step": 507590, "epoch": 6115} {"train_loss": -27.511884689331055, "global_step": 507591, "epoch": 6115} {"train_loss": -27.644514083862305, "global_step": 507592, "epoch": 6115} {"train_loss": -27.654865264892578, "global_step": 507593, "epoch": 6115} {"train_loss": -27.415857315063477, "global_step": 507594, "epoch": 6115} {"train_loss": -27.682058334350586, "global_step": 507595, "epoch": 6115} {"train_loss": -27.7022647857666, "global_step": 507596, "epoch": 6115} {"train_loss": -27.268360137939453, "global_step": 507597, "epoch": 6115} {"train_loss": -26.926959991455078, "global_step": 507598, "epoch": 6115} {"train_loss": -26.835874557495117, "global_step": 507599, "epoch": 6115} {"train_loss": -26.594831466674805, "global_step": 507600, "epoch": 6115} {"train_loss": -26.74989128112793, "global_step": 507601, "epoch": 6115} {"train_loss": -27.279428482055664, "global_step": 507602, "epoch": 6115} {"train_loss": -27.232351303100586, "global_step": 507603, "epoch": 6115} {"train_loss": -27.311264038085938, "global_step": 507604, "epoch": 6115} {"train_loss": -27.08111572265625, "global_step": 507605, "epoch": 6115} {"train_loss": -27.237594604492188, "global_step": 507606, "epoch": 6115} {"train_loss": -27.36944580078125, "global_step": 507607, "epoch": 6115} {"train_loss": -27.247100830078125, "global_step": 507608, "epoch": 6115} {"train_loss": -27.23988151550293, "global_step": 507609, "epoch": 6115} {"train_loss": -27.505481719970703, "global_step": 507610, "epoch": 6115} {"train_loss": -27.581451416015625, "global_step": 507611, "epoch": 6115} {"train_loss": -27.44589614868164, "global_step": 507612, "epoch": 6115} {"train_loss": -27.03094482421875, "global_step": 507613, "epoch": 6115} {"train_loss": -27.347976684570312, "global_step": 507614, "epoch": 6115} {"train_loss": -27.3698787689209, "global_step": 507615, "epoch": 6115} {"train_loss": -26.89190673828125, "global_step": 507616, "epoch": 6115} {"train_loss": -27.244871139526367, "global_step": 507617, "epoch": 6115} {"train_loss": -27.3342227935791, "global_step": 507618, "epoch": 6115} {"train_loss": -27.54705238342285, "global_step": 507619, "epoch": 6115} {"train_loss": -27.615827560424805, "global_step": 507620, "epoch": 6115} {"train_loss": -27.146020889282227, "global_step": 507621, "epoch": 6115} {"train_loss": -27.405384063720703, "global_step": 507622, "epoch": 6115} {"train_loss": -27.291471481323242, "global_step": 507623, "epoch": 6115} {"train_loss": -27.801544189453125, "global_step": 507624, "epoch": 6115} {"train_loss": -27.417585372924805, "global_step": 507625, "epoch": 6115} {"train_loss": -27.63348960876465, "global_step": 507626, "epoch": 6115} {"train_loss": -27.361450149352294, "global_step": 507627, "epoch": 6115, "val_loss": 6561271.0} {"train_loss": -26.799213409423828, "global_step": 507628, "epoch": 6116} {"train_loss": -25.15499496459961, "global_step": 507629, "epoch": 6116} {"train_loss": -26.40976905822754, "global_step": 507630, "epoch": 6116} {"train_loss": -26.555105209350586, "global_step": 507631, "epoch": 6116} {"train_loss": -25.854230880737305, "global_step": 507632, "epoch": 6116} {"train_loss": -26.821075439453125, "global_step": 507633, "epoch": 6116} {"train_loss": -26.616437911987305, "global_step": 507634, "epoch": 6116} {"train_loss": -26.90972900390625, "global_step": 507635, "epoch": 6116} {"train_loss": -26.916357040405273, "global_step": 507636, "epoch": 6116} {"train_loss": -26.77589225769043, "global_step": 507637, "epoch": 6116} {"train_loss": -26.921340942382812, "global_step": 507638, "epoch": 6116} {"train_loss": -26.675546646118164, "global_step": 507639, "epoch": 6116} {"train_loss": -26.99567222595215, "global_step": 507640, "epoch": 6116} {"train_loss": -26.9339656829834, "global_step": 507641, "epoch": 6116} {"train_loss": -27.201440811157227, "global_step": 507642, "epoch": 6116} {"train_loss": -26.55340003967285, "global_step": 507643, "epoch": 6116} {"train_loss": -26.871061325073242, "global_step": 507644, "epoch": 6116} {"train_loss": -26.900592803955078, "global_step": 507645, "epoch": 6116} {"train_loss": -26.8571834564209, "global_step": 507646, "epoch": 6116} {"train_loss": -27.344806671142578, "global_step": 507647, "epoch": 6116} {"train_loss": -26.951765060424805, "global_step": 507648, "epoch": 6116} {"train_loss": -27.2548770904541, "global_step": 507649, "epoch": 6116} {"train_loss": -26.945371627807617, "global_step": 507650, "epoch": 6116} {"train_loss": -27.469629287719727, "global_step": 507651, "epoch": 6116} {"train_loss": -27.39015769958496, "global_step": 507652, "epoch": 6116} {"train_loss": -27.587772369384766, "global_step": 507653, "epoch": 6116} {"train_loss": -27.270889282226562, "global_step": 507654, "epoch": 6116} {"train_loss": -27.237213134765625, "global_step": 507655, "epoch": 6116} {"train_loss": -27.4576473236084, "global_step": 507656, "epoch": 6116} {"train_loss": -27.5658016204834, "global_step": 507657, "epoch": 6116} {"train_loss": -27.408987045288086, "global_step": 507658, "epoch": 6116} {"train_loss": -27.592945098876953, "global_step": 507659, "epoch": 6116} {"train_loss": -27.44061279296875, "global_step": 507660, "epoch": 6116} {"train_loss": -27.392688751220703, "global_step": 507661, "epoch": 6116} {"train_loss": -27.414276123046875, "global_step": 507662, "epoch": 6116} {"train_loss": -27.56537437438965, "global_step": 507663, "epoch": 6116} {"train_loss": -27.716169357299805, "global_step": 507664, "epoch": 6116} {"train_loss": -27.120359420776367, "global_step": 507665, "epoch": 6116} {"train_loss": -27.86610221862793, "global_step": 507666, "epoch": 6116} {"train_loss": -27.381315231323242, "global_step": 507667, "epoch": 6116} {"train_loss": -27.844770431518555, "global_step": 507668, "epoch": 6116} {"train_loss": -27.56037712097168, "global_step": 507669, "epoch": 6116} {"train_loss": -27.986743927001953, "global_step": 507670, "epoch": 6116} {"train_loss": -27.8035831451416, "global_step": 507671, "epoch": 6116} {"train_loss": -27.79098892211914, "global_step": 507672, "epoch": 6116} {"train_loss": -27.010269165039062, "global_step": 507673, "epoch": 6116} {"train_loss": -27.574792861938477, "global_step": 507674, "epoch": 6116} {"train_loss": -27.406118392944336, "global_step": 507675, "epoch": 6116} {"train_loss": -27.74384880065918, "global_step": 507676, "epoch": 6116} {"train_loss": -27.8914852142334, "global_step": 507677, "epoch": 6116} {"train_loss": -27.586837768554688, "global_step": 507678, "epoch": 6116} {"train_loss": -26.76006507873535, "global_step": 507679, "epoch": 6116} {"train_loss": -27.07306480407715, "global_step": 507680, "epoch": 6116} {"train_loss": -27.532241821289062, "global_step": 507681, "epoch": 6116} {"train_loss": -27.45108985900879, "global_step": 507682, "epoch": 6116} {"train_loss": -27.167266845703125, "global_step": 507683, "epoch": 6116} {"train_loss": -27.24432373046875, "global_step": 507684, "epoch": 6116} {"train_loss": -27.7380313873291, "global_step": 507685, "epoch": 6116} {"train_loss": -27.534046173095703, "global_step": 507686, "epoch": 6116} {"train_loss": -27.3813533782959, "global_step": 507687, "epoch": 6116} {"train_loss": -27.427322387695312, "global_step": 507688, "epoch": 6116} {"train_loss": -27.465900421142578, "global_step": 507689, "epoch": 6116} {"train_loss": -27.269678115844727, "global_step": 507690, "epoch": 6116} {"train_loss": -27.033227920532227, "global_step": 507691, "epoch": 6116} {"train_loss": -27.375110626220703, "global_step": 507692, "epoch": 6116} {"train_loss": -27.190824508666992, "global_step": 507693, "epoch": 6116} {"train_loss": -27.318761825561523, "global_step": 507694, "epoch": 6116} {"train_loss": -27.49526023864746, "global_step": 507695, "epoch": 6116} {"train_loss": -27.635419845581055, "global_step": 507696, "epoch": 6116} {"train_loss": -27.684614181518555, "global_step": 507697, "epoch": 6116} {"train_loss": -26.864728927612305, "global_step": 507698, "epoch": 6116} {"train_loss": -26.94283103942871, "global_step": 507699, "epoch": 6116} {"train_loss": -26.95777702331543, "global_step": 507700, "epoch": 6116} {"train_loss": -27.33049964904785, "global_step": 507701, "epoch": 6116} {"train_loss": -27.449249267578125, "global_step": 507702, "epoch": 6116} {"train_loss": -27.243112564086914, "global_step": 507703, "epoch": 6116} {"train_loss": -27.213796615600586, "global_step": 507704, "epoch": 6116} {"train_loss": -26.775726318359375, "global_step": 507705, "epoch": 6116} {"train_loss": -27.298202514648438, "global_step": 507706, "epoch": 6116} {"train_loss": -27.118350982666016, "global_step": 507707, "epoch": 6116} {"train_loss": -27.1547794342041, "global_step": 507708, "epoch": 6116} {"train_loss": -27.172433853149414, "global_step": 507709, "epoch": 6116} {"train_loss": -27.202986751694276, "global_step": 507710, "epoch": 6116, "val_loss": 6702850.0} {"train_loss": -24.668729782104492, "global_step": 507711, "epoch": 6117} {"train_loss": -24.361448287963867, "global_step": 507712, "epoch": 6117} {"train_loss": -24.658775329589844, "global_step": 507713, "epoch": 6117} {"train_loss": -24.94304084777832, "global_step": 507714, "epoch": 6117} {"train_loss": -24.333505630493164, "global_step": 507715, "epoch": 6117} {"train_loss": -25.43896484375, "global_step": 507716, "epoch": 6117} {"train_loss": -26.05401039123535, "global_step": 507717, "epoch": 6117} {"train_loss": -26.034286499023438, "global_step": 507718, "epoch": 6117} {"train_loss": -25.919790267944336, "global_step": 507719, "epoch": 6117} {"train_loss": -26.376224517822266, "global_step": 507720, "epoch": 6117} {"train_loss": -26.501794815063477, "global_step": 507721, "epoch": 6117} {"train_loss": -26.3115291595459, "global_step": 507722, "epoch": 6117} {"train_loss": -26.611480712890625, "global_step": 507723, "epoch": 6117} {"train_loss": -26.354772567749023, "global_step": 507724, "epoch": 6117} {"train_loss": -26.6092472076416, "global_step": 507725, "epoch": 6117} {"train_loss": -26.58003807067871, "global_step": 507726, "epoch": 6117} {"train_loss": -26.751474380493164, "global_step": 507727, "epoch": 6117} {"train_loss": -26.786054611206055, "global_step": 507728, "epoch": 6117} {"train_loss": -26.691959381103516, "global_step": 507729, "epoch": 6117} {"train_loss": -26.812103271484375, "global_step": 507730, "epoch": 6117} {"train_loss": -26.926259994506836, "global_step": 507731, "epoch": 6117} {"train_loss": -26.44429588317871, "global_step": 507732, "epoch": 6117} {"train_loss": -27.248615264892578, "global_step": 507733, "epoch": 6117} {"train_loss": -27.119033813476562, "global_step": 507734, "epoch": 6117} {"train_loss": -26.691577911376953, "global_step": 507735, "epoch": 6117} {"train_loss": -27.15117835998535, "global_step": 507736, "epoch": 6117} {"train_loss": -26.78351402282715, "global_step": 507737, "epoch": 6117} {"train_loss": -26.99525260925293, "global_step": 507738, "epoch": 6117} {"train_loss": -26.9518985748291, "global_step": 507739, "epoch": 6117} {"train_loss": -27.06040382385254, "global_step": 507740, "epoch": 6117} {"train_loss": -27.492170333862305, "global_step": 507741, "epoch": 6117} {"train_loss": -27.193511962890625, "global_step": 507742, "epoch": 6117} {"train_loss": -27.23797607421875, "global_step": 507743, "epoch": 6117} {"train_loss": -27.07448387145996, "global_step": 507744, "epoch": 6117} {"train_loss": -27.607746124267578, "global_step": 507745, "epoch": 6117} {"train_loss": -27.040790557861328, "global_step": 507746, "epoch": 6117} {"train_loss": -27.551666259765625, "global_step": 507747, "epoch": 6117} {"train_loss": -27.243188858032227, "global_step": 507748, "epoch": 6117} {"train_loss": -27.28519630432129, "global_step": 507749, "epoch": 6117} {"train_loss": -27.388599395751953, "global_step": 507750, "epoch": 6117} {"train_loss": -27.4425048828125, "global_step": 507751, "epoch": 6117} {"train_loss": -27.21949577331543, "global_step": 507752, "epoch": 6117} {"train_loss": -27.37103843688965, "global_step": 507753, "epoch": 6117} {"train_loss": -27.291217803955078, "global_step": 507754, "epoch": 6117} {"train_loss": -27.032026290893555, "global_step": 507755, "epoch": 6117} {"train_loss": -27.77798843383789, "global_step": 507756, "epoch": 6117} {"train_loss": -27.435720443725586, "global_step": 507757, "epoch": 6117} {"train_loss": -27.603988647460938, "global_step": 507758, "epoch": 6117} {"train_loss": -27.818384170532227, "global_step": 507759, "epoch": 6117} {"train_loss": -27.58674430847168, "global_step": 507760, "epoch": 6117} {"train_loss": -27.707517623901367, "global_step": 507761, "epoch": 6117} {"train_loss": -27.35602378845215, "global_step": 507762, "epoch": 6117} {"train_loss": -27.20631217956543, "global_step": 507763, "epoch": 6117} {"train_loss": -27.30377197265625, "global_step": 507764, "epoch": 6117} {"train_loss": -27.76032066345215, "global_step": 507765, "epoch": 6117} {"train_loss": -27.5770206451416, "global_step": 507766, "epoch": 6117} {"train_loss": -27.935211181640625, "global_step": 507767, "epoch": 6117} {"train_loss": -27.281787872314453, "global_step": 507768, "epoch": 6117} {"train_loss": -27.464374542236328, "global_step": 507769, "epoch": 6117} {"train_loss": -27.470075607299805, "global_step": 507770, "epoch": 6117} {"train_loss": -27.541187286376953, "global_step": 507771, "epoch": 6117} {"train_loss": -27.28741455078125, "global_step": 507772, "epoch": 6117} {"train_loss": -27.546823501586914, "global_step": 507773, "epoch": 6117} {"train_loss": -27.16989517211914, "global_step": 507774, "epoch": 6117} {"train_loss": -27.268274307250977, "global_step": 507775, "epoch": 6117} {"train_loss": -27.55609130859375, "global_step": 507776, "epoch": 6117} {"train_loss": -27.694766998291016, "global_step": 507777, "epoch": 6117} {"train_loss": -27.477008819580078, "global_step": 507778, "epoch": 6117} {"train_loss": -27.456527709960938, "global_step": 507779, "epoch": 6117} {"train_loss": -27.463592529296875, "global_step": 507780, "epoch": 6117} {"train_loss": -27.226404190063477, "global_step": 507781, "epoch": 6117} {"train_loss": -27.35593032836914, "global_step": 507782, "epoch": 6117} {"train_loss": -26.681272506713867, "global_step": 507783, "epoch": 6117} {"train_loss": -27.499225616455078, "global_step": 507784, "epoch": 6117} {"train_loss": -27.595609664916992, "global_step": 507785, "epoch": 6117} {"train_loss": -27.1439151763916, "global_step": 507786, "epoch": 6117} {"train_loss": -27.414844512939453, "global_step": 507787, "epoch": 6117} {"train_loss": -27.373157501220703, "global_step": 507788, "epoch": 6117} {"train_loss": -27.58182716369629, "global_step": 507789, "epoch": 6117} {"train_loss": -27.28736686706543, "global_step": 507790, "epoch": 6117} {"train_loss": -27.374195098876953, "global_step": 507791, "epoch": 6117} {"train_loss": -27.23714256286621, "global_step": 507792, "epoch": 6117} {"train_loss": -26.99024692213679, "global_step": 507793, "epoch": 6117, "val_loss": 6594024.0} {"train_loss": -25.41425323486328, "global_step": 507794, "epoch": 6118} {"train_loss": -26.241104125976562, "global_step": 507795, "epoch": 6118} {"train_loss": -26.77420997619629, "global_step": 507796, "epoch": 6118} {"train_loss": -26.3271427154541, "global_step": 507797, "epoch": 6118} {"train_loss": -26.843311309814453, "global_step": 507798, "epoch": 6118} {"train_loss": -26.049219131469727, "global_step": 507799, "epoch": 6118} {"train_loss": -27.35413932800293, "global_step": 507800, "epoch": 6118} {"train_loss": -26.771656036376953, "global_step": 507801, "epoch": 6118} {"train_loss": -27.310110092163086, "global_step": 507802, "epoch": 6118} {"train_loss": -26.288480758666992, "global_step": 507803, "epoch": 6118} {"train_loss": -27.330869674682617, "global_step": 507804, "epoch": 6118} {"train_loss": -26.621747970581055, "global_step": 507805, "epoch": 6118} {"train_loss": -27.349597930908203, "global_step": 507806, "epoch": 6118} {"train_loss": -26.697528839111328, "global_step": 507807, "epoch": 6118} {"train_loss": -26.944976806640625, "global_step": 507808, "epoch": 6118} {"train_loss": -27.312482833862305, "global_step": 507809, "epoch": 6118} {"train_loss": -27.096704483032227, "global_step": 507810, "epoch": 6118} {"train_loss": -26.977466583251953, "global_step": 507811, "epoch": 6118} {"train_loss": -26.928434371948242, "global_step": 507812, "epoch": 6118} {"train_loss": -27.52312660217285, "global_step": 507813, "epoch": 6118} {"train_loss": -27.240203857421875, "global_step": 507814, "epoch": 6118} {"train_loss": -27.266834259033203, "global_step": 507815, "epoch": 6118} {"train_loss": -27.58616065979004, "global_step": 507816, "epoch": 6118} {"train_loss": -27.561038970947266, "global_step": 507817, "epoch": 6118} {"train_loss": -27.340993881225586, "global_step": 507818, "epoch": 6118} {"train_loss": -27.08670425415039, "global_step": 507819, "epoch": 6118} {"train_loss": -27.363489151000977, "global_step": 507820, "epoch": 6118} {"train_loss": -27.3470401763916, "global_step": 507821, "epoch": 6118} {"train_loss": -27.611547470092773, "global_step": 507822, "epoch": 6118} {"train_loss": -27.672382354736328, "global_step": 507823, "epoch": 6118} {"train_loss": -27.67180824279785, "global_step": 507824, "epoch": 6118} {"train_loss": -27.51276206970215, "global_step": 507825, "epoch": 6118} {"train_loss": -27.645994186401367, "global_step": 507826, "epoch": 6118} {"train_loss": -27.48404312133789, "global_step": 507827, "epoch": 6118} {"train_loss": -27.509923934936523, "global_step": 507828, "epoch": 6118} {"train_loss": -27.235422134399414, "global_step": 507829, "epoch": 6118} {"train_loss": -27.966413497924805, "global_step": 507830, "epoch": 6118} {"train_loss": -27.4775333404541, "global_step": 507831, "epoch": 6118} {"train_loss": -27.37192153930664, "global_step": 507832, "epoch": 6118} {"train_loss": -27.599088668823242, "global_step": 507833, "epoch": 6118} {"train_loss": -27.69928550720215, "global_step": 507834, "epoch": 6118} {"train_loss": -27.76104164123535, "global_step": 507835, "epoch": 6118} {"train_loss": -27.433563232421875, "global_step": 507836, "epoch": 6118} {"train_loss": -27.287763595581055, "global_step": 507837, "epoch": 6118} {"train_loss": -27.38714027404785, "global_step": 507838, "epoch": 6118} {"train_loss": -27.45246696472168, "global_step": 507839, "epoch": 6118} {"train_loss": -27.611661911010742, "global_step": 507840, "epoch": 6118} {"train_loss": -27.52535057067871, "global_step": 507841, "epoch": 6118} {"train_loss": -27.391523361206055, "global_step": 507842, "epoch": 6118} {"train_loss": -27.239795684814453, "global_step": 507843, "epoch": 6118} {"train_loss": -27.452245712280273, "global_step": 507844, "epoch": 6118} {"train_loss": -27.436756134033203, "global_step": 507845, "epoch": 6118} {"train_loss": -27.34376335144043, "global_step": 507846, "epoch": 6118} {"train_loss": -28.02351188659668, "global_step": 507847, "epoch": 6118} {"train_loss": -27.406442642211914, "global_step": 507848, "epoch": 6118} {"train_loss": -28.06153678894043, "global_step": 507849, "epoch": 6118} {"train_loss": -27.692691802978516, "global_step": 507850, "epoch": 6118} {"train_loss": -27.725629806518555, "global_step": 507851, "epoch": 6118} {"train_loss": -27.78466796875, "global_step": 507852, "epoch": 6118} {"train_loss": -27.59283447265625, "global_step": 507853, "epoch": 6118} {"train_loss": -27.491687774658203, "global_step": 507854, "epoch": 6118} {"train_loss": -27.582706451416016, "global_step": 507855, "epoch": 6118} {"train_loss": -27.594440460205078, "global_step": 507856, "epoch": 6118} {"train_loss": -27.30029296875, "global_step": 507857, "epoch": 6118} {"train_loss": -27.18132972717285, "global_step": 507858, "epoch": 6118} {"train_loss": -27.253158569335938, "global_step": 507859, "epoch": 6118} {"train_loss": -27.8708553314209, "global_step": 507860, "epoch": 6118} {"train_loss": -27.534931182861328, "global_step": 507861, "epoch": 6118} {"train_loss": -27.72330093383789, "global_step": 507862, "epoch": 6118} {"train_loss": -27.5775146484375, "global_step": 507863, "epoch": 6118} {"train_loss": -27.599639892578125, "global_step": 507864, "epoch": 6118} {"train_loss": -27.490201950073242, "global_step": 507865, "epoch": 6118} {"train_loss": -27.363391876220703, "global_step": 507866, "epoch": 6118} {"train_loss": -26.9744873046875, "global_step": 507867, "epoch": 6118} {"train_loss": -26.86054039001465, "global_step": 507868, "epoch": 6118} {"train_loss": -27.351221084594727, "global_step": 507869, "epoch": 6118} {"train_loss": -27.6495304107666, "global_step": 507870, "epoch": 6118} {"train_loss": -27.408069610595703, "global_step": 507871, "epoch": 6118} {"train_loss": -27.04031753540039, "global_step": 507872, "epoch": 6118} {"train_loss": -27.49263572692871, "global_step": 507873, "epoch": 6118} {"train_loss": -27.389404296875, "global_step": 507874, "epoch": 6118} {"train_loss": -27.64899253845215, "global_step": 507875, "epoch": 6118} {"train_loss": -27.333408263792474, "global_step": 507876, "epoch": 6118, "val_loss": 6533778.0} {"train_loss": -26.60210609436035, "global_step": 507877, "epoch": 6119} {"train_loss": -26.21453857421875, "global_step": 507878, "epoch": 6119} {"train_loss": -26.469511032104492, "global_step": 507879, "epoch": 6119} {"train_loss": -26.109790802001953, "global_step": 507880, "epoch": 6119} {"train_loss": -26.60467529296875, "global_step": 507881, "epoch": 6119} {"train_loss": -26.722198486328125, "global_step": 507882, "epoch": 6119} {"train_loss": -26.338285446166992, "global_step": 507883, "epoch": 6119} {"train_loss": -26.727121353149414, "global_step": 507884, "epoch": 6119} {"train_loss": -26.709095001220703, "global_step": 507885, "epoch": 6119} {"train_loss": -26.884479522705078, "global_step": 507886, "epoch": 6119} {"train_loss": -26.884326934814453, "global_step": 507887, "epoch": 6119} {"train_loss": -26.840478897094727, "global_step": 507888, "epoch": 6119} {"train_loss": -26.717788696289062, "global_step": 507889, "epoch": 6119} {"train_loss": -27.332752227783203, "global_step": 507890, "epoch": 6119} {"train_loss": -27.064374923706055, "global_step": 507891, "epoch": 6119} {"train_loss": -27.20557975769043, "global_step": 507892, "epoch": 6119} {"train_loss": -27.175378799438477, "global_step": 507893, "epoch": 6119} {"train_loss": -26.845382690429688, "global_step": 507894, "epoch": 6119} {"train_loss": -27.321319580078125, "global_step": 507895, "epoch": 6119} {"train_loss": -27.189620971679688, "global_step": 507896, "epoch": 6119} {"train_loss": -27.38567543029785, "global_step": 507897, "epoch": 6119} {"train_loss": -27.2137451171875, "global_step": 507898, "epoch": 6119} {"train_loss": -27.271930694580078, "global_step": 507899, "epoch": 6119} {"train_loss": -27.3129940032959, "global_step": 507900, "epoch": 6119} {"train_loss": -27.18827247619629, "global_step": 507901, "epoch": 6119} {"train_loss": -27.24252700805664, "global_step": 507902, "epoch": 6119} {"train_loss": -27.464399337768555, "global_step": 507903, "epoch": 6119} {"train_loss": -27.3137264251709, "global_step": 507904, "epoch": 6119} {"train_loss": -27.581195831298828, "global_step": 507905, "epoch": 6119} {"train_loss": -27.566457748413086, "global_step": 507906, "epoch": 6119} {"train_loss": -27.4208927154541, "global_step": 507907, "epoch": 6119} {"train_loss": -27.394025802612305, "global_step": 507908, "epoch": 6119} {"train_loss": -27.43239402770996, "global_step": 507909, "epoch": 6119} {"train_loss": -27.598337173461914, "global_step": 507910, "epoch": 6119} {"train_loss": -27.70464515686035, "global_step": 507911, "epoch": 6119} {"train_loss": -27.381723403930664, "global_step": 507912, "epoch": 6119} {"train_loss": -27.12735366821289, "global_step": 507913, "epoch": 6119} {"train_loss": -27.0885066986084, "global_step": 507914, "epoch": 6119} {"train_loss": -27.611896514892578, "global_step": 507915, "epoch": 6119} {"train_loss": -27.68804931640625, "global_step": 507916, "epoch": 6119} {"train_loss": -27.583026885986328, "global_step": 507917, "epoch": 6119} {"train_loss": -27.94866943359375, "global_step": 507918, "epoch": 6119} {"train_loss": -27.52545166015625, "global_step": 507919, "epoch": 6119} {"train_loss": -27.747882843017578, "global_step": 507920, "epoch": 6119} {"train_loss": -27.412805557250977, "global_step": 507921, "epoch": 6119} {"train_loss": -27.393238067626953, "global_step": 507922, "epoch": 6119} {"train_loss": -27.625762939453125, "global_step": 507923, "epoch": 6119} {"train_loss": -27.47307777404785, "global_step": 507924, "epoch": 6119} {"train_loss": -27.493072509765625, "global_step": 507925, "epoch": 6119} {"train_loss": -27.511999130249023, "global_step": 507926, "epoch": 6119} {"train_loss": -27.548858642578125, "global_step": 507927, "epoch": 6119} {"train_loss": -27.263166427612305, "global_step": 507928, "epoch": 6119} {"train_loss": -27.49968910217285, "global_step": 507929, "epoch": 6119} {"train_loss": -27.608327865600586, "global_step": 507930, "epoch": 6119} {"train_loss": -27.60678482055664, "global_step": 507931, "epoch": 6119} {"train_loss": -27.624414443969727, "global_step": 507932, "epoch": 6119} {"train_loss": -27.682416915893555, "global_step": 507933, "epoch": 6119} {"train_loss": -27.440515518188477, "global_step": 507934, "epoch": 6119} {"train_loss": -27.702911376953125, "global_step": 507935, "epoch": 6119} {"train_loss": -27.941741943359375, "global_step": 507936, "epoch": 6119} {"train_loss": -27.900577545166016, "global_step": 507937, "epoch": 6119} {"train_loss": -27.555240631103516, "global_step": 507938, "epoch": 6119} {"train_loss": -27.616952896118164, "global_step": 507939, "epoch": 6119} {"train_loss": -27.723663330078125, "global_step": 507940, "epoch": 6119} {"train_loss": -27.259933471679688, "global_step": 507941, "epoch": 6119} {"train_loss": -27.449487686157227, "global_step": 507942, "epoch": 6119} {"train_loss": -27.571577072143555, "global_step": 507943, "epoch": 6119} {"train_loss": -27.686960220336914, "global_step": 507944, "epoch": 6119} {"train_loss": -27.7015323638916, "global_step": 507945, "epoch": 6119} {"train_loss": -27.655792236328125, "global_step": 507946, "epoch": 6119} {"train_loss": -27.582014083862305, "global_step": 507947, "epoch": 6119} {"train_loss": -27.09858512878418, "global_step": 507948, "epoch": 6119} {"train_loss": -27.427322387695312, "global_step": 507949, "epoch": 6119} {"train_loss": -26.80084228515625, "global_step": 507950, "epoch": 6119} {"train_loss": -27.837793350219727, "global_step": 507951, "epoch": 6119} {"train_loss": -27.52912712097168, "global_step": 507952, "epoch": 6119} {"train_loss": -27.4659423828125, "global_step": 507953, "epoch": 6119} {"train_loss": -27.17987632751465, "global_step": 507954, "epoch": 6119} {"train_loss": -27.2240047454834, "global_step": 507955, "epoch": 6119} {"train_loss": -27.185836791992188, "global_step": 507956, "epoch": 6119} {"train_loss": -27.21050453186035, "global_step": 507957, "epoch": 6119} {"train_loss": -27.356678009033203, "global_step": 507958, "epoch": 6119} {"train_loss": -27.31389245642237, "global_step": 507959, "epoch": 6119, "val_loss": 6549288.5} {"train_loss": -26.18622398376465, "global_step": 507960, "epoch": 6120} {"train_loss": -25.918737411499023, "global_step": 507961, "epoch": 6120} {"train_loss": -26.4832706451416, "global_step": 507962, "epoch": 6120} {"train_loss": -25.783727645874023, "global_step": 507963, "epoch": 6120} {"train_loss": -26.98805046081543, "global_step": 507964, "epoch": 6120} {"train_loss": -26.389318466186523, "global_step": 507965, "epoch": 6120} {"train_loss": -26.552854537963867, "global_step": 507966, "epoch": 6120} {"train_loss": -26.091907501220703, "global_step": 507967, "epoch": 6120} {"train_loss": -26.616195678710938, "global_step": 507968, "epoch": 6120} {"train_loss": -26.75497817993164, "global_step": 507969, "epoch": 6120} {"train_loss": -27.086938858032227, "global_step": 507970, "epoch": 6120} {"train_loss": -26.6094970703125, "global_step": 507971, "epoch": 6120} {"train_loss": -27.12880516052246, "global_step": 507972, "epoch": 6120} {"train_loss": -26.723188400268555, "global_step": 507973, "epoch": 6120} {"train_loss": -27.042346954345703, "global_step": 507974, "epoch": 6120} {"train_loss": -27.168048858642578, "global_step": 507975, "epoch": 6120} {"train_loss": -26.732152938842773, "global_step": 507976, "epoch": 6120} {"train_loss": -26.609302520751953, "global_step": 507977, "epoch": 6120} {"train_loss": -27.35693359375, "global_step": 507978, "epoch": 6120} {"train_loss": -27.107025146484375, "global_step": 507979, "epoch": 6120} {"train_loss": -26.94757080078125, "global_step": 507980, "epoch": 6120} {"train_loss": -26.73233413696289, "global_step": 507981, "epoch": 6120} {"train_loss": -27.158985137939453, "global_step": 507982, "epoch": 6120} {"train_loss": -27.441564559936523, "global_step": 507983, "epoch": 6120} {"train_loss": -27.17583656311035, "global_step": 507984, "epoch": 6120} {"train_loss": -27.41176414489746, "global_step": 507985, "epoch": 6120} {"train_loss": -27.440900802612305, "global_step": 507986, "epoch": 6120} {"train_loss": -27.3092098236084, "global_step": 507987, "epoch": 6120} {"train_loss": -27.22364616394043, "global_step": 507988, "epoch": 6120} {"train_loss": -27.62996482849121, "global_step": 507989, "epoch": 6120} {"train_loss": -27.62886619567871, "global_step": 507990, "epoch": 6120} {"train_loss": -27.02655601501465, "global_step": 507991, "epoch": 6120} {"train_loss": -27.109365463256836, "global_step": 507992, "epoch": 6120} {"train_loss": -27.48919105529785, "global_step": 507993, "epoch": 6120} {"train_loss": -27.629241943359375, "global_step": 507994, "epoch": 6120} {"train_loss": -27.16541862487793, "global_step": 507995, "epoch": 6120} {"train_loss": -27.24513816833496, "global_step": 507996, "epoch": 6120} {"train_loss": -27.21962547302246, "global_step": 507997, "epoch": 6120} {"train_loss": -27.42646598815918, "global_step": 507998, "epoch": 6120} {"train_loss": -27.231847763061523, "global_step": 507999, "epoch": 6120} {"train_loss": -27.496753692626953, "global_step": 508000, "epoch": 6120} {"train_loss": -27.55816650390625, "global_step": 508001, "epoch": 6120} {"train_loss": -27.6350040435791, "global_step": 508002, "epoch": 6120} {"train_loss": -27.71659278869629, "global_step": 508003, "epoch": 6120} {"train_loss": -27.661422729492188, "global_step": 508004, "epoch": 6120} {"train_loss": -27.330469131469727, "global_step": 508005, "epoch": 6120} {"train_loss": -27.640859603881836, "global_step": 508006, "epoch": 6120} {"train_loss": -27.510324478149414, "global_step": 508007, "epoch": 6120} {"train_loss": -27.16511344909668, "global_step": 508008, "epoch": 6120} {"train_loss": -27.585189819335938, "global_step": 508009, "epoch": 6120} {"train_loss": -27.58070182800293, "global_step": 508010, "epoch": 6120} {"train_loss": -27.566654205322266, "global_step": 508011, "epoch": 6120} {"train_loss": -27.690937042236328, "global_step": 508012, "epoch": 6120} {"train_loss": -27.77461814880371, "global_step": 508013, "epoch": 6120} {"train_loss": -27.623336791992188, "global_step": 508014, "epoch": 6120} {"train_loss": -27.23197364807129, "global_step": 508015, "epoch": 6120} {"train_loss": -26.833393096923828, "global_step": 508016, "epoch": 6120} {"train_loss": -26.953481674194336, "global_step": 508017, "epoch": 6120} {"train_loss": -27.159870147705078, "global_step": 508018, "epoch": 6120} {"train_loss": -27.36930274963379, "global_step": 508019, "epoch": 6120} {"train_loss": -27.61358070373535, "global_step": 508020, "epoch": 6120} {"train_loss": -27.55781364440918, "global_step": 508021, "epoch": 6120} {"train_loss": -27.6230525970459, "global_step": 508022, "epoch": 6120} {"train_loss": -27.4422664642334, "global_step": 508023, "epoch": 6120} {"train_loss": -27.57085609436035, "global_step": 508024, "epoch": 6120} {"train_loss": -27.802982330322266, "global_step": 508025, "epoch": 6120} {"train_loss": -27.31720542907715, "global_step": 508026, "epoch": 6120} {"train_loss": -27.762928009033203, "global_step": 508027, "epoch": 6120} {"train_loss": -27.182336807250977, "global_step": 508028, "epoch": 6120} {"train_loss": -27.322341918945312, "global_step": 508029, "epoch": 6120} {"train_loss": -27.79375648498535, "global_step": 508030, "epoch": 6120} {"train_loss": -27.47574806213379, "global_step": 508031, "epoch": 6120} {"train_loss": -27.340530395507812, "global_step": 508032, "epoch": 6120} {"train_loss": -27.57590103149414, "global_step": 508033, "epoch": 6120} {"train_loss": -27.641651153564453, "global_step": 508034, "epoch": 6120} {"train_loss": -27.483264923095703, "global_step": 508035, "epoch": 6120} {"train_loss": -27.438695907592773, "global_step": 508036, "epoch": 6120} {"train_loss": -27.578832626342773, "global_step": 508037, "epoch": 6120} {"train_loss": -27.5941104888916, "global_step": 508038, "epoch": 6120} {"train_loss": -27.87605094909668, "global_step": 508039, "epoch": 6120} {"train_loss": -27.342676162719727, "global_step": 508040, "epoch": 6120} {"train_loss": -27.564924240112305, "global_step": 508041, "epoch": 6120} {"train_loss": -27.2471941063203, "global_step": 508042, "epoch": 6120, "val_loss": 6475627.0} {"train_loss": -26.631351470947266, "global_step": 508043, "epoch": 6121} {"train_loss": -26.53766441345215, "global_step": 508044, "epoch": 6121} {"train_loss": -26.876876831054688, "global_step": 508045, "epoch": 6121} {"train_loss": -26.860769271850586, "global_step": 508046, "epoch": 6121} {"train_loss": -26.696685791015625, "global_step": 508047, "epoch": 6121} {"train_loss": -26.651569366455078, "global_step": 508048, "epoch": 6121} {"train_loss": -26.68813133239746, "global_step": 508049, "epoch": 6121} {"train_loss": -27.27142906188965, "global_step": 508050, "epoch": 6121} {"train_loss": -26.360244750976562, "global_step": 508051, "epoch": 6121} {"train_loss": -26.021316528320312, "global_step": 508052, "epoch": 6121} {"train_loss": -27.067325592041016, "global_step": 508053, "epoch": 6121} {"train_loss": -26.451135635375977, "global_step": 508054, "epoch": 6121} {"train_loss": -26.785083770751953, "global_step": 508055, "epoch": 6121} {"train_loss": -26.58685302734375, "global_step": 508056, "epoch": 6121} {"train_loss": -27.271289825439453, "global_step": 508057, "epoch": 6121} {"train_loss": -27.179380416870117, "global_step": 508058, "epoch": 6121} {"train_loss": -26.88130760192871, "global_step": 508059, "epoch": 6121} {"train_loss": -27.4510440826416, "global_step": 508060, "epoch": 6121} {"train_loss": -27.298099517822266, "global_step": 508061, "epoch": 6121} {"train_loss": -27.08026123046875, "global_step": 508062, "epoch": 6121} {"train_loss": -27.408294677734375, "global_step": 508063, "epoch": 6121} {"train_loss": -27.165395736694336, "global_step": 508064, "epoch": 6121} {"train_loss": -27.14377212524414, "global_step": 508065, "epoch": 6121} {"train_loss": -27.066869735717773, "global_step": 508066, "epoch": 6121} {"train_loss": -26.888593673706055, "global_step": 508067, "epoch": 6121} {"train_loss": -27.188695907592773, "global_step": 508068, "epoch": 6121} {"train_loss": -27.392780303955078, "global_step": 508069, "epoch": 6121} {"train_loss": -27.350812911987305, "global_step": 508070, "epoch": 6121} {"train_loss": -27.198078155517578, "global_step": 508071, "epoch": 6121} {"train_loss": -27.342334747314453, "global_step": 508072, "epoch": 6121} {"train_loss": -27.460376739501953, "global_step": 508073, "epoch": 6121} {"train_loss": -27.630023956298828, "global_step": 508074, "epoch": 6121} {"train_loss": -27.5045223236084, "global_step": 508075, "epoch": 6121} {"train_loss": -27.538040161132812, "global_step": 508076, "epoch": 6121} {"train_loss": -27.113508224487305, "global_step": 508077, "epoch": 6121} {"train_loss": -27.49188804626465, "global_step": 508078, "epoch": 6121} {"train_loss": -27.674100875854492, "global_step": 508079, "epoch": 6121} {"train_loss": -27.320831298828125, "global_step": 508080, "epoch": 6121} {"train_loss": -27.545013427734375, "global_step": 508081, "epoch": 6121} {"train_loss": -27.51004981994629, "global_step": 508082, "epoch": 6121} {"train_loss": -27.6804256439209, "global_step": 508083, "epoch": 6121} {"train_loss": -27.29343605041504, "global_step": 508084, "epoch": 6121} {"train_loss": -27.669034957885742, "global_step": 508085, "epoch": 6121} {"train_loss": -28.009668350219727, "global_step": 508086, "epoch": 6121} {"train_loss": -27.857873916625977, "global_step": 508087, "epoch": 6121} {"train_loss": -27.62067985534668, "global_step": 508088, "epoch": 6121} {"train_loss": -27.964696884155273, "global_step": 508089, "epoch": 6121} {"train_loss": -27.655179977416992, "global_step": 508090, "epoch": 6121} {"train_loss": -27.790863037109375, "global_step": 508091, "epoch": 6121} {"train_loss": -27.546194076538086, "global_step": 508092, "epoch": 6121} {"train_loss": -27.82037353515625, "global_step": 508093, "epoch": 6121} {"train_loss": -27.714162826538086, "global_step": 508094, "epoch": 6121} {"train_loss": -27.962121963500977, "global_step": 508095, "epoch": 6121} {"train_loss": -27.627588272094727, "global_step": 508096, "epoch": 6121} {"train_loss": -27.371490478515625, "global_step": 508097, "epoch": 6121} {"train_loss": -27.77859878540039, "global_step": 508098, "epoch": 6121} {"train_loss": -27.89924430847168, "global_step": 508099, "epoch": 6121} {"train_loss": -27.600400924682617, "global_step": 508100, "epoch": 6121} {"train_loss": -27.74700355529785, "global_step": 508101, "epoch": 6121} {"train_loss": -27.745208740234375, "global_step": 508102, "epoch": 6121} {"train_loss": -27.515607833862305, "global_step": 508103, "epoch": 6121} {"train_loss": -28.039203643798828, "global_step": 508104, "epoch": 6121} {"train_loss": -27.396442413330078, "global_step": 508105, "epoch": 6121} {"train_loss": -27.232297897338867, "global_step": 508106, "epoch": 6121} {"train_loss": -26.867605209350586, "global_step": 508107, "epoch": 6121} {"train_loss": -26.072168350219727, "global_step": 508108, "epoch": 6121} {"train_loss": -25.741107940673828, "global_step": 508109, "epoch": 6121} {"train_loss": -26.72054100036621, "global_step": 508110, "epoch": 6121} {"train_loss": -27.8956356048584, "global_step": 508111, "epoch": 6121} {"train_loss": -26.981037139892578, "global_step": 508112, "epoch": 6121} {"train_loss": -27.188379287719727, "global_step": 508113, "epoch": 6121} {"train_loss": -27.329771041870117, "global_step": 508114, "epoch": 6121} {"train_loss": -27.3306884765625, "global_step": 508115, "epoch": 6121} {"train_loss": -27.569684982299805, "global_step": 508116, "epoch": 6121} {"train_loss": -27.489364624023438, "global_step": 508117, "epoch": 6121} {"train_loss": -27.43182373046875, "global_step": 508118, "epoch": 6121} {"train_loss": -27.347274780273438, "global_step": 508119, "epoch": 6121} {"train_loss": -27.37613296508789, "global_step": 508120, "epoch": 6121} {"train_loss": -27.293325424194336, "global_step": 508121, "epoch": 6121} {"train_loss": -27.260610580444336, "global_step": 508122, "epoch": 6121} {"train_loss": -27.695510864257812, "global_step": 508123, "epoch": 6121} {"train_loss": -27.432886123657227, "global_step": 508124, "epoch": 6121} {"train_loss": -27.277433395385742, "global_step": 508125, "epoch": 6121, "val_loss": 6619356.0} {"train_loss": -26.9164981842041, "global_step": 508126, "epoch": 6122} {"train_loss": -27.02663230895996, "global_step": 508127, "epoch": 6122} {"train_loss": -26.6429500579834, "global_step": 508128, "epoch": 6122} {"train_loss": -26.42396354675293, "global_step": 508129, "epoch": 6122} {"train_loss": -27.080270767211914, "global_step": 508130, "epoch": 6122} {"train_loss": -26.513608932495117, "global_step": 508131, "epoch": 6122} {"train_loss": -27.009733200073242, "global_step": 508132, "epoch": 6122} {"train_loss": -26.96917724609375, "global_step": 508133, "epoch": 6122} {"train_loss": -27.150726318359375, "global_step": 508134, "epoch": 6122} {"train_loss": -27.23976707458496, "global_step": 508135, "epoch": 6122} {"train_loss": -27.507171630859375, "global_step": 508136, "epoch": 6122} {"train_loss": -27.43250846862793, "global_step": 508137, "epoch": 6122} {"train_loss": -27.3895206451416, "global_step": 508138, "epoch": 6122} {"train_loss": -26.845840454101562, "global_step": 508139, "epoch": 6122} {"train_loss": -27.066389083862305, "global_step": 508140, "epoch": 6122} {"train_loss": -27.422439575195312, "global_step": 508141, "epoch": 6122} {"train_loss": -27.511865615844727, "global_step": 508142, "epoch": 6122} {"train_loss": -27.214441299438477, "global_step": 508143, "epoch": 6122} {"train_loss": -27.218769073486328, "global_step": 508144, "epoch": 6122} {"train_loss": -27.084095001220703, "global_step": 508145, "epoch": 6122} {"train_loss": -27.378889083862305, "global_step": 508146, "epoch": 6122} {"train_loss": -27.815351486206055, "global_step": 508147, "epoch": 6122} {"train_loss": -27.211414337158203, "global_step": 508148, "epoch": 6122} {"train_loss": -27.0157527923584, "global_step": 508149, "epoch": 6122} {"train_loss": -27.18499183654785, "global_step": 508150, "epoch": 6122} {"train_loss": -27.12188148498535, "global_step": 508151, "epoch": 6122} {"train_loss": -27.356719970703125, "global_step": 508152, "epoch": 6122} {"train_loss": -27.374820709228516, "global_step": 508153, "epoch": 6122} {"train_loss": -27.6651554107666, "global_step": 508154, "epoch": 6122} {"train_loss": -27.235187530517578, "global_step": 508155, "epoch": 6122} {"train_loss": -27.518930435180664, "global_step": 508156, "epoch": 6122} {"train_loss": -27.51087760925293, "global_step": 508157, "epoch": 6122} {"train_loss": -27.731861114501953, "global_step": 508158, "epoch": 6122} {"train_loss": -27.549123764038086, "global_step": 508159, "epoch": 6122} {"train_loss": -27.646011352539062, "global_step": 508160, "epoch": 6122} {"train_loss": -27.400304794311523, "global_step": 508161, "epoch": 6122} {"train_loss": -27.753576278686523, "global_step": 508162, "epoch": 6122} {"train_loss": -27.671728134155273, "global_step": 508163, "epoch": 6122} {"train_loss": -27.811050415039062, "global_step": 508164, "epoch": 6122} {"train_loss": -27.6505126953125, "global_step": 508165, "epoch": 6122} {"train_loss": -27.729719161987305, "global_step": 508166, "epoch": 6122} {"train_loss": -27.4703311920166, "global_step": 508167, "epoch": 6122} {"train_loss": -27.626373291015625, "global_step": 508168, "epoch": 6122} {"train_loss": -27.73395347595215, "global_step": 508169, "epoch": 6122} {"train_loss": -27.1837100982666, "global_step": 508170, "epoch": 6122} {"train_loss": -27.690692901611328, "global_step": 508171, "epoch": 6122} {"train_loss": -27.428836822509766, "global_step": 508172, "epoch": 6122} {"train_loss": -27.251575469970703, "global_step": 508173, "epoch": 6122} {"train_loss": -27.334802627563477, "global_step": 508174, "epoch": 6122} {"train_loss": -26.973474502563477, "global_step": 508175, "epoch": 6122} {"train_loss": -27.082189559936523, "global_step": 508176, "epoch": 6122} {"train_loss": -27.040149688720703, "global_step": 508177, "epoch": 6122} {"train_loss": -27.047760009765625, "global_step": 508178, "epoch": 6122} {"train_loss": -27.417245864868164, "global_step": 508179, "epoch": 6122} {"train_loss": -27.146936416625977, "global_step": 508180, "epoch": 6122} {"train_loss": -27.531055450439453, "global_step": 508181, "epoch": 6122} {"train_loss": -27.34383201599121, "global_step": 508182, "epoch": 6122} {"train_loss": -26.826618194580078, "global_step": 508183, "epoch": 6122} {"train_loss": -27.68143081665039, "global_step": 508184, "epoch": 6122} {"train_loss": -26.96122169494629, "global_step": 508185, "epoch": 6122} {"train_loss": -26.797515869140625, "global_step": 508186, "epoch": 6122} {"train_loss": -27.1574649810791, "global_step": 508187, "epoch": 6122} {"train_loss": -27.34122085571289, "global_step": 508188, "epoch": 6122} {"train_loss": -26.61699867248535, "global_step": 508189, "epoch": 6122} {"train_loss": -27.5609130859375, "global_step": 508190, "epoch": 6122} {"train_loss": -27.35285758972168, "global_step": 508191, "epoch": 6122} {"train_loss": -27.02666664123535, "global_step": 508192, "epoch": 6122} {"train_loss": -27.069604873657227, "global_step": 508193, "epoch": 6122} {"train_loss": -27.21980094909668, "global_step": 508194, "epoch": 6122} {"train_loss": -26.947370529174805, "global_step": 508195, "epoch": 6122} {"train_loss": -27.144119262695312, "global_step": 508196, "epoch": 6122} {"train_loss": -27.3093204498291, "global_step": 508197, "epoch": 6122} {"train_loss": -27.259033203125, "global_step": 508198, "epoch": 6122} {"train_loss": -27.48565673828125, "global_step": 508199, "epoch": 6122} {"train_loss": -27.444168090820312, "global_step": 508200, "epoch": 6122} {"train_loss": -27.678760528564453, "global_step": 508201, "epoch": 6122} {"train_loss": -27.02166748046875, "global_step": 508202, "epoch": 6122} {"train_loss": -27.146509170532227, "global_step": 508203, "epoch": 6122} {"train_loss": -27.524580001831055, "global_step": 508204, "epoch": 6122} {"train_loss": -27.1498966217041, "global_step": 508205, "epoch": 6122} {"train_loss": -27.319416046142578, "global_step": 508206, "epoch": 6122} {"train_loss": -27.32306480407715, "global_step": 508207, "epoch": 6122} {"train_loss": -27.279240642685487, "global_step": 508208, "epoch": 6122, "val_loss": 6633539.0} {"train_loss": -27.352888107299805, "global_step": 508209, "epoch": 6123} {"train_loss": -27.396575927734375, "global_step": 508210, "epoch": 6123} {"train_loss": -27.15650749206543, "global_step": 508211, "epoch": 6123} {"train_loss": -27.31146240234375, "global_step": 508212, "epoch": 6123} {"train_loss": -27.40950584411621, "global_step": 508213, "epoch": 6123} {"train_loss": -27.0463924407959, "global_step": 508214, "epoch": 6123} {"train_loss": -27.445371627807617, "global_step": 508215, "epoch": 6123} {"train_loss": -27.35164451599121, "global_step": 508216, "epoch": 6123} {"train_loss": -27.112390518188477, "global_step": 508217, "epoch": 6123} {"train_loss": -27.509862899780273, "global_step": 508218, "epoch": 6123} {"train_loss": -27.40361976623535, "global_step": 508219, "epoch": 6123} {"train_loss": -27.45000648498535, "global_step": 508220, "epoch": 6123} {"train_loss": -27.478622436523438, "global_step": 508221, "epoch": 6123} {"train_loss": -27.53021812438965, "global_step": 508222, "epoch": 6123} {"train_loss": -27.687763214111328, "global_step": 508223, "epoch": 6123} {"train_loss": -27.68763542175293, "global_step": 508224, "epoch": 6123} {"train_loss": -27.56941032409668, "global_step": 508225, "epoch": 6123} {"train_loss": -27.53253173828125, "global_step": 508226, "epoch": 6123} {"train_loss": -27.525060653686523, "global_step": 508227, "epoch": 6123} {"train_loss": -27.655256271362305, "global_step": 508228, "epoch": 6123} {"train_loss": -27.383682250976562, "global_step": 508229, "epoch": 6123} {"train_loss": -27.381244659423828, "global_step": 508230, "epoch": 6123} {"train_loss": -27.598154067993164, "global_step": 508231, "epoch": 6123} {"train_loss": -27.417490005493164, "global_step": 508232, "epoch": 6123} {"train_loss": -27.284204483032227, "global_step": 508233, "epoch": 6123} {"train_loss": -27.712554931640625, "global_step": 508234, "epoch": 6123} {"train_loss": -27.517690658569336, "global_step": 508235, "epoch": 6123} {"train_loss": -27.642053604125977, "global_step": 508236, "epoch": 6123} {"train_loss": -26.976659774780273, "global_step": 508237, "epoch": 6123} {"train_loss": -26.83530044555664, "global_step": 508238, "epoch": 6123} {"train_loss": -27.132415771484375, "global_step": 508239, "epoch": 6123} {"train_loss": -26.942157745361328, "global_step": 508240, "epoch": 6123} {"train_loss": -27.289112091064453, "global_step": 508241, "epoch": 6123} {"train_loss": -26.9507999420166, "global_step": 508242, "epoch": 6123} {"train_loss": -26.65936279296875, "global_step": 508243, "epoch": 6123} {"train_loss": -26.742645263671875, "global_step": 508244, "epoch": 6123} {"train_loss": -27.87026023864746, "global_step": 508245, "epoch": 6123} {"train_loss": -27.330503463745117, "global_step": 508246, "epoch": 6123} {"train_loss": -27.22590446472168, "global_step": 508247, "epoch": 6123} {"train_loss": -27.373327255249023, "global_step": 508248, "epoch": 6123} {"train_loss": -27.67783546447754, "global_step": 508249, "epoch": 6123} {"train_loss": -27.14655876159668, "global_step": 508250, "epoch": 6123} {"train_loss": -27.08747673034668, "global_step": 508251, "epoch": 6123} {"train_loss": -27.151391983032227, "global_step": 508252, "epoch": 6123} {"train_loss": -27.6340274810791, "global_step": 508253, "epoch": 6123} {"train_loss": -27.643911361694336, "global_step": 508254, "epoch": 6123} {"train_loss": -27.798995971679688, "global_step": 508255, "epoch": 6123} {"train_loss": -27.7344970703125, "global_step": 508256, "epoch": 6123} {"train_loss": -27.453201293945312, "global_step": 508257, "epoch": 6123} {"train_loss": -27.45771598815918, "global_step": 508258, "epoch": 6123} {"train_loss": -27.60492515563965, "global_step": 508259, "epoch": 6123} {"train_loss": -27.14762306213379, "global_step": 508260, "epoch": 6123} {"train_loss": -27.314044952392578, "global_step": 508261, "epoch": 6123} {"train_loss": -27.201831817626953, "global_step": 508262, "epoch": 6123} {"train_loss": -27.533716201782227, "global_step": 508263, "epoch": 6123} {"train_loss": -27.7564640045166, "global_step": 508264, "epoch": 6123} {"train_loss": -27.6058406829834, "global_step": 508265, "epoch": 6123} {"train_loss": -27.467756271362305, "global_step": 508266, "epoch": 6123} {"train_loss": -27.508447647094727, "global_step": 508267, "epoch": 6123} {"train_loss": -27.417638778686523, "global_step": 508268, "epoch": 6123} {"train_loss": -27.4451961517334, "global_step": 508269, "epoch": 6123} {"train_loss": -27.381378173828125, "global_step": 508270, "epoch": 6123} {"train_loss": -27.52130699157715, "global_step": 508271, "epoch": 6123} {"train_loss": -27.6313419342041, "global_step": 508272, "epoch": 6123} {"train_loss": -27.4860782623291, "global_step": 508273, "epoch": 6123} {"train_loss": -27.200353622436523, "global_step": 508274, "epoch": 6123} {"train_loss": -27.55579948425293, "global_step": 508275, "epoch": 6123} {"train_loss": -27.619909286499023, "global_step": 508276, "epoch": 6123} {"train_loss": -27.463272094726562, "global_step": 508277, "epoch": 6123} {"train_loss": -27.78687858581543, "global_step": 508278, "epoch": 6123} {"train_loss": -27.968780517578125, "global_step": 508279, "epoch": 6123} {"train_loss": -27.592899322509766, "global_step": 508280, "epoch": 6123} {"train_loss": -27.249343872070312, "global_step": 508281, "epoch": 6123} {"train_loss": -27.43665885925293, "global_step": 508282, "epoch": 6123} {"train_loss": -28.001081466674805, "global_step": 508283, "epoch": 6123} {"train_loss": -27.789236068725586, "global_step": 508284, "epoch": 6123} {"train_loss": -27.419904708862305, "global_step": 508285, "epoch": 6123} {"train_loss": -27.946508407592773, "global_step": 508286, "epoch": 6123} {"train_loss": -27.66753578186035, "global_step": 508287, "epoch": 6123} {"train_loss": -27.199247360229492, "global_step": 508288, "epoch": 6123} {"train_loss": -27.435718536376953, "global_step": 508289, "epoch": 6123} {"train_loss": -27.217151641845703, "global_step": 508290, "epoch": 6123} {"train_loss": -27.444208788584515, "global_step": 508291, "epoch": 6123, "val_loss": 6540981.0} {"train_loss": -26.91475486755371, "global_step": 508292, "epoch": 6124} {"train_loss": -26.101377487182617, "global_step": 508293, "epoch": 6124} {"train_loss": -26.538930892944336, "global_step": 508294, "epoch": 6124} {"train_loss": -26.783294677734375, "global_step": 508295, "epoch": 6124} {"train_loss": -26.25909996032715, "global_step": 508296, "epoch": 6124} {"train_loss": -27.367645263671875, "global_step": 508297, "epoch": 6124} {"train_loss": -27.017683029174805, "global_step": 508298, "epoch": 6124} {"train_loss": -26.8847599029541, "global_step": 508299, "epoch": 6124} {"train_loss": -26.289514541625977, "global_step": 508300, "epoch": 6124} {"train_loss": -27.019086837768555, "global_step": 508301, "epoch": 6124} {"train_loss": -26.607290267944336, "global_step": 508302, "epoch": 6124} {"train_loss": -27.061811447143555, "global_step": 508303, "epoch": 6124} {"train_loss": -26.89420509338379, "global_step": 508304, "epoch": 6124} {"train_loss": -27.025617599487305, "global_step": 508305, "epoch": 6124} {"train_loss": -27.232358932495117, "global_step": 508306, "epoch": 6124} {"train_loss": -26.8177433013916, "global_step": 508307, "epoch": 6124} {"train_loss": -27.01609230041504, "global_step": 508308, "epoch": 6124} {"train_loss": -27.167102813720703, "global_step": 508309, "epoch": 6124} {"train_loss": -27.023900985717773, "global_step": 508310, "epoch": 6124} {"train_loss": -26.993335723876953, "global_step": 508311, "epoch": 6124} {"train_loss": -26.78382682800293, "global_step": 508312, "epoch": 6124} {"train_loss": -26.846410751342773, "global_step": 508313, "epoch": 6124} {"train_loss": -27.107511520385742, "global_step": 508314, "epoch": 6124} {"train_loss": -27.00251579284668, "global_step": 508315, "epoch": 6124} {"train_loss": -27.268341064453125, "global_step": 508316, "epoch": 6124} {"train_loss": -27.452381134033203, "global_step": 508317, "epoch": 6124} {"train_loss": -27.015798568725586, "global_step": 508318, "epoch": 6124} {"train_loss": -27.188703536987305, "global_step": 508319, "epoch": 6124} {"train_loss": -26.887948989868164, "global_step": 508320, "epoch": 6124} {"train_loss": -27.184112548828125, "global_step": 508321, "epoch": 6124} {"train_loss": -27.491880416870117, "global_step": 508322, "epoch": 6124} {"train_loss": -27.3698673248291, "global_step": 508323, "epoch": 6124} {"train_loss": -27.206457138061523, "global_step": 508324, "epoch": 6124} {"train_loss": -27.19867515563965, "global_step": 508325, "epoch": 6124} {"train_loss": -27.444351196289062, "global_step": 508326, "epoch": 6124} {"train_loss": -27.36737060546875, "global_step": 508327, "epoch": 6124} {"train_loss": -27.41913414001465, "global_step": 508328, "epoch": 6124} {"train_loss": -27.745275497436523, "global_step": 508329, "epoch": 6124} {"train_loss": -27.589567184448242, "global_step": 508330, "epoch": 6124} {"train_loss": -27.43096351623535, "global_step": 508331, "epoch": 6124} {"train_loss": -27.473440170288086, "global_step": 508332, "epoch": 6124} {"train_loss": -27.56298828125, "global_step": 508333, "epoch": 6124} {"train_loss": -27.25042724609375, "global_step": 508334, "epoch": 6124} {"train_loss": -27.012033462524414, "global_step": 508335, "epoch": 6124} {"train_loss": -27.243946075439453, "global_step": 508336, "epoch": 6124} {"train_loss": -28.05405616760254, "global_step": 508337, "epoch": 6124} {"train_loss": -27.847631454467773, "global_step": 508338, "epoch": 6124} {"train_loss": -27.43096351623535, "global_step": 508339, "epoch": 6124} {"train_loss": -27.6960391998291, "global_step": 508340, "epoch": 6124} {"train_loss": -27.562711715698242, "global_step": 508341, "epoch": 6124} {"train_loss": -27.508081436157227, "global_step": 508342, "epoch": 6124} {"train_loss": -27.77775001525879, "global_step": 508343, "epoch": 6124} {"train_loss": -27.796777725219727, "global_step": 508344, "epoch": 6124} {"train_loss": -27.491016387939453, "global_step": 508345, "epoch": 6124} {"train_loss": -27.538745880126953, "global_step": 508346, "epoch": 6124} {"train_loss": -27.399702072143555, "global_step": 508347, "epoch": 6124} {"train_loss": -27.818456649780273, "global_step": 508348, "epoch": 6124} {"train_loss": -27.742572784423828, "global_step": 508349, "epoch": 6124} {"train_loss": -27.78594398498535, "global_step": 508350, "epoch": 6124} {"train_loss": -27.866453170776367, "global_step": 508351, "epoch": 6124} {"train_loss": -27.706342697143555, "global_step": 508352, "epoch": 6124} {"train_loss": -27.305700302124023, "global_step": 508353, "epoch": 6124} {"train_loss": -27.106372833251953, "global_step": 508354, "epoch": 6124} {"train_loss": -27.06633949279785, "global_step": 508355, "epoch": 6124} {"train_loss": -27.41102409362793, "global_step": 508356, "epoch": 6124} {"train_loss": -27.667028427124023, "global_step": 508357, "epoch": 6124} {"train_loss": -27.2044734954834, "global_step": 508358, "epoch": 6124} {"train_loss": -27.170547485351562, "global_step": 508359, "epoch": 6124} {"train_loss": -27.24224281311035, "global_step": 508360, "epoch": 6124} {"train_loss": -27.33111000061035, "global_step": 508361, "epoch": 6124} {"train_loss": -27.37353515625, "global_step": 508362, "epoch": 6124} {"train_loss": -27.388227462768555, "global_step": 508363, "epoch": 6124} {"train_loss": -27.160776138305664, "global_step": 508364, "epoch": 6124} {"train_loss": -27.742658615112305, "global_step": 508365, "epoch": 6124} {"train_loss": -27.410181045532227, "global_step": 508366, "epoch": 6124} {"train_loss": -27.489669799804688, "global_step": 508367, "epoch": 6124} {"train_loss": -27.5908260345459, "global_step": 508368, "epoch": 6124} {"train_loss": -27.306554794311523, "global_step": 508369, "epoch": 6124} {"train_loss": -27.325056076049805, "global_step": 508370, "epoch": 6124} {"train_loss": -27.154706954956055, "global_step": 508371, "epoch": 6124} {"train_loss": -26.881818771362305, "global_step": 508372, "epoch": 6124} {"train_loss": -26.438440322875977, "global_step": 508373, "epoch": 6124} {"train_loss": -27.243378811571972, "global_step": 508374, "epoch": 6124, "val_loss": 6628898.0} {"train_loss": -26.640869140625, "global_step": 508375, "epoch": 6125} {"train_loss": -26.545133590698242, "global_step": 508376, "epoch": 6125} {"train_loss": -25.985876083374023, "global_step": 508377, "epoch": 6125} {"train_loss": -26.43281364440918, "global_step": 508378, "epoch": 6125} {"train_loss": -26.449308395385742, "global_step": 508379, "epoch": 6125} {"train_loss": -27.039264678955078, "global_step": 508380, "epoch": 6125} {"train_loss": -26.549306869506836, "global_step": 508381, "epoch": 6125} {"train_loss": -26.873502731323242, "global_step": 508382, "epoch": 6125} {"train_loss": -26.671667098999023, "global_step": 508383, "epoch": 6125} {"train_loss": -26.592981338500977, "global_step": 508384, "epoch": 6125} {"train_loss": -26.61918067932129, "global_step": 508385, "epoch": 6125} {"train_loss": -26.68195915222168, "global_step": 508386, "epoch": 6125} {"train_loss": -26.907140731811523, "global_step": 508387, "epoch": 6125} {"train_loss": -26.849882125854492, "global_step": 508388, "epoch": 6125} {"train_loss": -26.8091983795166, "global_step": 508389, "epoch": 6125} {"train_loss": -26.6662654876709, "global_step": 508390, "epoch": 6125} {"train_loss": -27.153120040893555, "global_step": 508391, "epoch": 6125} {"train_loss": -26.949371337890625, "global_step": 508392, "epoch": 6125} {"train_loss": -27.073331832885742, "global_step": 508393, "epoch": 6125} {"train_loss": -27.261999130249023, "global_step": 508394, "epoch": 6125} {"train_loss": -27.0740966796875, "global_step": 508395, "epoch": 6125} {"train_loss": -27.389404296875, "global_step": 508396, "epoch": 6125} {"train_loss": -27.358062744140625, "global_step": 508397, "epoch": 6125} {"train_loss": -26.851804733276367, "global_step": 508398, "epoch": 6125} {"train_loss": -27.42486000061035, "global_step": 508399, "epoch": 6125} {"train_loss": -27.129962921142578, "global_step": 508400, "epoch": 6125} {"train_loss": -27.15717887878418, "global_step": 508401, "epoch": 6125} {"train_loss": -27.22677993774414, "global_step": 508402, "epoch": 6125} {"train_loss": -26.987646102905273, "global_step": 508403, "epoch": 6125} {"train_loss": -27.379180908203125, "global_step": 508404, "epoch": 6125} {"train_loss": -27.414648056030273, "global_step": 508405, "epoch": 6125} {"train_loss": -27.421161651611328, "global_step": 508406, "epoch": 6125} {"train_loss": -27.69215965270996, "global_step": 508407, "epoch": 6125} {"train_loss": -27.84039878845215, "global_step": 508408, "epoch": 6125} {"train_loss": -27.24647331237793, "global_step": 508409, "epoch": 6125} {"train_loss": -27.43766212463379, "global_step": 508410, "epoch": 6125} {"train_loss": -27.631439208984375, "global_step": 508411, "epoch": 6125} {"train_loss": -27.33439064025879, "global_step": 508412, "epoch": 6125} {"train_loss": -27.32415199279785, "global_step": 508413, "epoch": 6125} {"train_loss": -27.57159423828125, "global_step": 508414, "epoch": 6125} {"train_loss": -27.301645278930664, "global_step": 508415, "epoch": 6125} {"train_loss": -27.520370483398438, "global_step": 508416, "epoch": 6125} {"train_loss": -27.6871395111084, "global_step": 508417, "epoch": 6125} {"train_loss": -27.42792320251465, "global_step": 508418, "epoch": 6125} {"train_loss": -27.5683536529541, "global_step": 508419, "epoch": 6125} {"train_loss": -27.7362117767334, "global_step": 508420, "epoch": 6125} {"train_loss": -27.6318416595459, "global_step": 508421, "epoch": 6125} {"train_loss": -27.642475128173828, "global_step": 508422, "epoch": 6125} {"train_loss": -27.676624298095703, "global_step": 508423, "epoch": 6125} {"train_loss": -27.552270889282227, "global_step": 508424, "epoch": 6125} {"train_loss": -27.361743927001953, "global_step": 508425, "epoch": 6125} {"train_loss": -27.2514705657959, "global_step": 508426, "epoch": 6125} {"train_loss": -27.558134078979492, "global_step": 508427, "epoch": 6125} {"train_loss": -27.110172271728516, "global_step": 508428, "epoch": 6125} {"train_loss": -27.575347900390625, "global_step": 508429, "epoch": 6125} {"train_loss": -27.756458282470703, "global_step": 508430, "epoch": 6125} {"train_loss": -27.3740291595459, "global_step": 508431, "epoch": 6125} {"train_loss": -27.242605209350586, "global_step": 508432, "epoch": 6125} {"train_loss": -27.445358276367188, "global_step": 508433, "epoch": 6125} {"train_loss": -27.3612003326416, "global_step": 508434, "epoch": 6125} {"train_loss": -27.615848541259766, "global_step": 508435, "epoch": 6125} {"train_loss": -27.297290802001953, "global_step": 508436, "epoch": 6125} {"train_loss": -27.3312931060791, "global_step": 508437, "epoch": 6125} {"train_loss": -27.769886016845703, "global_step": 508438, "epoch": 6125} {"train_loss": -27.633819580078125, "global_step": 508439, "epoch": 6125} {"train_loss": -27.422077178955078, "global_step": 508440, "epoch": 6125} {"train_loss": -27.48480224609375, "global_step": 508441, "epoch": 6125} {"train_loss": -27.41639518737793, "global_step": 508442, "epoch": 6125} {"train_loss": -27.702829360961914, "global_step": 508443, "epoch": 6125} {"train_loss": -27.548437118530273, "global_step": 508444, "epoch": 6125} {"train_loss": -27.389907836914062, "global_step": 508445, "epoch": 6125} {"train_loss": -27.73370933532715, "global_step": 508446, "epoch": 6125} {"train_loss": -27.8618106842041, "global_step": 508447, "epoch": 6125} {"train_loss": -27.741281509399414, "global_step": 508448, "epoch": 6125} {"train_loss": -27.95466423034668, "global_step": 508449, "epoch": 6125} {"train_loss": -27.500507354736328, "global_step": 508450, "epoch": 6125} {"train_loss": -27.668537139892578, "global_step": 508451, "epoch": 6125} {"train_loss": -27.621679306030273, "global_step": 508452, "epoch": 6125} {"train_loss": -27.61836051940918, "global_step": 508453, "epoch": 6125} {"train_loss": -27.637434005737305, "global_step": 508454, "epoch": 6125} {"train_loss": -27.54188346862793, "global_step": 508455, "epoch": 6125} {"train_loss": -27.809534072875977, "global_step": 508456, "epoch": 6125} {"train_loss": -27.32317409745182, "global_step": 508457, "epoch": 6125, "val_loss": 6596063.5} {"train_loss": -26.819488525390625, "global_step": 508458, "epoch": 6126} {"train_loss": -26.656600952148438, "global_step": 508459, "epoch": 6126} {"train_loss": -26.69590187072754, "global_step": 508460, "epoch": 6126} {"train_loss": -26.58200454711914, "global_step": 508461, "epoch": 6126} {"train_loss": -26.394433975219727, "global_step": 508462, "epoch": 6126} {"train_loss": -27.244848251342773, "global_step": 508463, "epoch": 6126} {"train_loss": -27.059986114501953, "global_step": 508464, "epoch": 6126} {"train_loss": -27.00494956970215, "global_step": 508465, "epoch": 6126} {"train_loss": -26.572351455688477, "global_step": 508466, "epoch": 6126} {"train_loss": -27.09710693359375, "global_step": 508467, "epoch": 6126} {"train_loss": -26.95192527770996, "global_step": 508468, "epoch": 6126} {"train_loss": -26.973752975463867, "global_step": 508469, "epoch": 6126} {"train_loss": -26.597875595092773, "global_step": 508470, "epoch": 6126} {"train_loss": -27.074628829956055, "global_step": 508471, "epoch": 6126} {"train_loss": -27.374128341674805, "global_step": 508472, "epoch": 6126} {"train_loss": -26.948883056640625, "global_step": 508473, "epoch": 6126} {"train_loss": -27.00412940979004, "global_step": 508474, "epoch": 6126} {"train_loss": -27.146747589111328, "global_step": 508475, "epoch": 6126} {"train_loss": -27.260969161987305, "global_step": 508476, "epoch": 6126} {"train_loss": -27.151411056518555, "global_step": 508477, "epoch": 6126} {"train_loss": -27.281890869140625, "global_step": 508478, "epoch": 6126} {"train_loss": -27.88779067993164, "global_step": 508479, "epoch": 6126} {"train_loss": -27.307226181030273, "global_step": 508480, "epoch": 6126} {"train_loss": -27.20746421813965, "global_step": 508481, "epoch": 6126} {"train_loss": -27.016162872314453, "global_step": 508482, "epoch": 6126} {"train_loss": -27.267292022705078, "global_step": 508483, "epoch": 6126} {"train_loss": -27.46587562561035, "global_step": 508484, "epoch": 6126} {"train_loss": -27.700796127319336, "global_step": 508485, "epoch": 6126} {"train_loss": -27.623889923095703, "global_step": 508486, "epoch": 6126} {"train_loss": -27.462940216064453, "global_step": 508487, "epoch": 6126} {"train_loss": -27.35758399963379, "global_step": 508488, "epoch": 6126} {"train_loss": -27.160415649414062, "global_step": 508489, "epoch": 6126} {"train_loss": -27.496606826782227, "global_step": 508490, "epoch": 6126} {"train_loss": -27.6074161529541, "global_step": 508491, "epoch": 6126} {"train_loss": -27.76032066345215, "global_step": 508492, "epoch": 6126} {"train_loss": -27.517709732055664, "global_step": 508493, "epoch": 6126} {"train_loss": -27.555057525634766, "global_step": 508494, "epoch": 6126} {"train_loss": -27.593597412109375, "global_step": 508495, "epoch": 6126} {"train_loss": -27.683103561401367, "global_step": 508496, "epoch": 6126} {"train_loss": -27.65534782409668, "global_step": 508497, "epoch": 6126} {"train_loss": -27.765634536743164, "global_step": 508498, "epoch": 6126} {"train_loss": -27.368335723876953, "global_step": 508499, "epoch": 6126} {"train_loss": -28.03241539001465, "global_step": 508500, "epoch": 6126} {"train_loss": -27.655029296875, "global_step": 508501, "epoch": 6126} {"train_loss": -27.695154190063477, "global_step": 508502, "epoch": 6126} {"train_loss": -27.782995223999023, "global_step": 508503, "epoch": 6126} {"train_loss": -27.281675338745117, "global_step": 508504, "epoch": 6126} {"train_loss": -27.55853843688965, "global_step": 508505, "epoch": 6126} {"train_loss": -27.819412231445312, "global_step": 508506, "epoch": 6126} {"train_loss": -27.604602813720703, "global_step": 508507, "epoch": 6126} {"train_loss": -27.751047134399414, "global_step": 508508, "epoch": 6126} {"train_loss": -27.63850212097168, "global_step": 508509, "epoch": 6126} {"train_loss": -27.495086669921875, "global_step": 508510, "epoch": 6126} {"train_loss": -27.368316650390625, "global_step": 508511, "epoch": 6126} {"train_loss": -27.6917781829834, "global_step": 508512, "epoch": 6126} {"train_loss": -27.565099716186523, "global_step": 508513, "epoch": 6126} {"train_loss": -26.943708419799805, "global_step": 508514, "epoch": 6126} {"train_loss": -27.252933502197266, "global_step": 508515, "epoch": 6126} {"train_loss": -26.949951171875, "global_step": 508516, "epoch": 6126} {"train_loss": -26.505823135375977, "global_step": 508517, "epoch": 6126} {"train_loss": -26.76027488708496, "global_step": 508518, "epoch": 6126} {"train_loss": -26.97315788269043, "global_step": 508519, "epoch": 6126} {"train_loss": -27.354358673095703, "global_step": 508520, "epoch": 6126} {"train_loss": -27.18594741821289, "global_step": 508521, "epoch": 6126} {"train_loss": -27.430688858032227, "global_step": 508522, "epoch": 6126} {"train_loss": -26.889362335205078, "global_step": 508523, "epoch": 6126} {"train_loss": -27.15961265563965, "global_step": 508524, "epoch": 6126} {"train_loss": -27.179895401000977, "global_step": 508525, "epoch": 6126} {"train_loss": -27.411945343017578, "global_step": 508526, "epoch": 6126} {"train_loss": -27.420654296875, "global_step": 508527, "epoch": 6126} {"train_loss": -27.229644775390625, "global_step": 508528, "epoch": 6126} {"train_loss": -27.611865997314453, "global_step": 508529, "epoch": 6126} {"train_loss": -27.534027099609375, "global_step": 508530, "epoch": 6126} {"train_loss": -27.295856475830078, "global_step": 508531, "epoch": 6126} {"train_loss": -27.436370849609375, "global_step": 508532, "epoch": 6126} {"train_loss": -27.26117515563965, "global_step": 508533, "epoch": 6126} {"train_loss": -27.6719913482666, "global_step": 508534, "epoch": 6126} {"train_loss": -27.231063842773438, "global_step": 508535, "epoch": 6126} {"train_loss": -27.471038818359375, "global_step": 508536, "epoch": 6126} {"train_loss": -27.68971824645996, "global_step": 508537, "epoch": 6126} {"train_loss": -27.455097198486328, "global_step": 508538, "epoch": 6126} {"train_loss": -27.74604606628418, "global_step": 508539, "epoch": 6126} {"train_loss": -27.310205298733997, "global_step": 508540, "epoch": 6126, "val_loss": 6553741.0} {"train_loss": -26.604883193969727, "global_step": 508541, "epoch": 6127} {"train_loss": -26.519025802612305, "global_step": 508542, "epoch": 6127} {"train_loss": -26.929990768432617, "global_step": 508543, "epoch": 6127} {"train_loss": -26.80414390563965, "global_step": 508544, "epoch": 6127} {"train_loss": -26.920114517211914, "global_step": 508545, "epoch": 6127} {"train_loss": -26.4512882232666, "global_step": 508546, "epoch": 6127} {"train_loss": -26.78553581237793, "global_step": 508547, "epoch": 6127} {"train_loss": -27.00007438659668, "global_step": 508548, "epoch": 6127} {"train_loss": -26.734323501586914, "global_step": 508549, "epoch": 6127} {"train_loss": -27.017440795898438, "global_step": 508550, "epoch": 6127} {"train_loss": -26.94217300415039, "global_step": 508551, "epoch": 6127} {"train_loss": -27.08743667602539, "global_step": 508552, "epoch": 6127} {"train_loss": -27.257598876953125, "global_step": 508553, "epoch": 6127} {"train_loss": -27.358869552612305, "global_step": 508554, "epoch": 6127} {"train_loss": -26.830453872680664, "global_step": 508555, "epoch": 6127} {"train_loss": -27.247812271118164, "global_step": 508556, "epoch": 6127} {"train_loss": -27.015823364257812, "global_step": 508557, "epoch": 6127} {"train_loss": -27.033161163330078, "global_step": 508558, "epoch": 6127} {"train_loss": -27.14130973815918, "global_step": 508559, "epoch": 6127} {"train_loss": -27.058401107788086, "global_step": 508560, "epoch": 6127} {"train_loss": -27.486770629882812, "global_step": 508561, "epoch": 6127} {"train_loss": -27.228967666625977, "global_step": 508562, "epoch": 6127} {"train_loss": -27.397756576538086, "global_step": 508563, "epoch": 6127} {"train_loss": -27.507404327392578, "global_step": 508564, "epoch": 6127} {"train_loss": -27.31426429748535, "global_step": 508565, "epoch": 6127} {"train_loss": -27.207443237304688, "global_step": 508566, "epoch": 6127} {"train_loss": -27.698999404907227, "global_step": 508567, "epoch": 6127} {"train_loss": -27.816242218017578, "global_step": 508568, "epoch": 6127} {"train_loss": -27.24159049987793, "global_step": 508569, "epoch": 6127} {"train_loss": -27.911453247070312, "global_step": 508570, "epoch": 6127} {"train_loss": -27.648706436157227, "global_step": 508571, "epoch": 6127} {"train_loss": -27.501829147338867, "global_step": 508572, "epoch": 6127} {"train_loss": -27.13803482055664, "global_step": 508573, "epoch": 6127} {"train_loss": -27.8543701171875, "global_step": 508574, "epoch": 6127} {"train_loss": -27.526203155517578, "global_step": 508575, "epoch": 6127} {"train_loss": -27.61585807800293, "global_step": 508576, "epoch": 6127} {"train_loss": -27.199234008789062, "global_step": 508577, "epoch": 6127} {"train_loss": -27.608463287353516, "global_step": 508578, "epoch": 6127} {"train_loss": -27.697370529174805, "global_step": 508579, "epoch": 6127} {"train_loss": -27.7747802734375, "global_step": 508580, "epoch": 6127} {"train_loss": -27.44928550720215, "global_step": 508581, "epoch": 6127} {"train_loss": -27.403711318969727, "global_step": 508582, "epoch": 6127} {"train_loss": -27.57144546508789, "global_step": 508583, "epoch": 6127} {"train_loss": -27.86859703063965, "global_step": 508584, "epoch": 6127} {"train_loss": -27.301624298095703, "global_step": 508585, "epoch": 6127} {"train_loss": -27.266942977905273, "global_step": 508586, "epoch": 6127} {"train_loss": -27.346820831298828, "global_step": 508587, "epoch": 6127} {"train_loss": -27.016956329345703, "global_step": 508588, "epoch": 6127} {"train_loss": -27.354639053344727, "global_step": 508589, "epoch": 6127} {"train_loss": -27.354736328125, "global_step": 508590, "epoch": 6127} {"train_loss": -27.886091232299805, "global_step": 508591, "epoch": 6127} {"train_loss": -26.98419189453125, "global_step": 508592, "epoch": 6127} {"train_loss": -27.10288429260254, "global_step": 508593, "epoch": 6127} {"train_loss": -26.449499130249023, "global_step": 508594, "epoch": 6127} {"train_loss": -25.830060958862305, "global_step": 508595, "epoch": 6127} {"train_loss": -26.255603790283203, "global_step": 508596, "epoch": 6127} {"train_loss": -26.851856231689453, "global_step": 508597, "epoch": 6127} {"train_loss": -27.07657814025879, "global_step": 508598, "epoch": 6127} {"train_loss": -26.189191818237305, "global_step": 508599, "epoch": 6127} {"train_loss": -26.109949111938477, "global_step": 508600, "epoch": 6127} {"train_loss": -26.268299102783203, "global_step": 508601, "epoch": 6127} {"train_loss": -26.421100616455078, "global_step": 508602, "epoch": 6127} {"train_loss": -26.05647087097168, "global_step": 508603, "epoch": 6127} {"train_loss": -26.004796981811523, "global_step": 508604, "epoch": 6127} {"train_loss": -26.863798141479492, "global_step": 508605, "epoch": 6127} {"train_loss": -26.5865421295166, "global_step": 508606, "epoch": 6127} {"train_loss": -27.04971694946289, "global_step": 508607, "epoch": 6127} {"train_loss": -26.94573974609375, "global_step": 508608, "epoch": 6127} {"train_loss": -26.5670108795166, "global_step": 508609, "epoch": 6127} {"train_loss": -26.876020431518555, "global_step": 508610, "epoch": 6127} {"train_loss": -26.80401039123535, "global_step": 508611, "epoch": 6127} {"train_loss": -26.802988052368164, "global_step": 508612, "epoch": 6127} {"train_loss": -26.757963180541992, "global_step": 508613, "epoch": 6127} {"train_loss": -26.9034423828125, "global_step": 508614, "epoch": 6127} {"train_loss": -26.923812866210938, "global_step": 508615, "epoch": 6127} {"train_loss": -26.94659423828125, "global_step": 508616, "epoch": 6127} {"train_loss": -27.216543197631836, "global_step": 508617, "epoch": 6127} {"train_loss": -26.884565353393555, "global_step": 508618, "epoch": 6127} {"train_loss": -27.04575538635254, "global_step": 508619, "epoch": 6127} {"train_loss": -26.944501876831055, "global_step": 508620, "epoch": 6127} {"train_loss": -27.07425880432129, "global_step": 508621, "epoch": 6127} {"train_loss": -27.147979736328125, "global_step": 508622, "epoch": 6127} {"train_loss": -27.05845184785774, "global_step": 508623, "epoch": 6127, "val_loss": 6534247.0} {"train_loss": -26.763324737548828, "global_step": 508624, "epoch": 6128} {"train_loss": -26.795698165893555, "global_step": 508625, "epoch": 6128} {"train_loss": -26.24252700805664, "global_step": 508626, "epoch": 6128} {"train_loss": -26.6336727142334, "global_step": 508627, "epoch": 6128} {"train_loss": -27.064558029174805, "global_step": 508628, "epoch": 6128} {"train_loss": -26.45905113220215, "global_step": 508629, "epoch": 6128} {"train_loss": -26.81753921508789, "global_step": 508630, "epoch": 6128} {"train_loss": -26.713342666625977, "global_step": 508631, "epoch": 6128} {"train_loss": -26.928558349609375, "global_step": 508632, "epoch": 6128} {"train_loss": -26.836807250976562, "global_step": 508633, "epoch": 6128} {"train_loss": -27.124439239501953, "global_step": 508634, "epoch": 6128} {"train_loss": -27.22013282775879, "global_step": 508635, "epoch": 6128} {"train_loss": -27.51190185546875, "global_step": 508636, "epoch": 6128} {"train_loss": -27.250202178955078, "global_step": 508637, "epoch": 6128} {"train_loss": -27.062408447265625, "global_step": 508638, "epoch": 6128} {"train_loss": -27.119043350219727, "global_step": 508639, "epoch": 6128} {"train_loss": -27.299650192260742, "global_step": 508640, "epoch": 6128} {"train_loss": -27.294757843017578, "global_step": 508641, "epoch": 6128} {"train_loss": -27.210851669311523, "global_step": 508642, "epoch": 6128} {"train_loss": -27.438919067382812, "global_step": 508643, "epoch": 6128} {"train_loss": -27.177978515625, "global_step": 508644, "epoch": 6128} {"train_loss": -27.554824829101562, "global_step": 508645, "epoch": 6128} {"train_loss": -27.303314208984375, "global_step": 508646, "epoch": 6128} {"train_loss": -27.39504051208496, "global_step": 508647, "epoch": 6128} {"train_loss": -27.621341705322266, "global_step": 508648, "epoch": 6128} {"train_loss": -27.5916690826416, "global_step": 508649, "epoch": 6128} {"train_loss": -27.52448081970215, "global_step": 508650, "epoch": 6128} {"train_loss": -27.324506759643555, "global_step": 508651, "epoch": 6128} {"train_loss": -27.435327529907227, "global_step": 508652, "epoch": 6128} {"train_loss": -27.25764274597168, "global_step": 508653, "epoch": 6128} {"train_loss": -27.660383224487305, "global_step": 508654, "epoch": 6128} {"train_loss": -27.619958877563477, "global_step": 508655, "epoch": 6128} {"train_loss": -27.811338424682617, "global_step": 508656, "epoch": 6128} {"train_loss": -27.61802101135254, "global_step": 508657, "epoch": 6128} {"train_loss": -27.169355392456055, "global_step": 508658, "epoch": 6128} {"train_loss": -27.754941940307617, "global_step": 508659, "epoch": 6128} {"train_loss": -27.676664352416992, "global_step": 508660, "epoch": 6128} {"train_loss": -27.80750846862793, "global_step": 508661, "epoch": 6128} {"train_loss": -27.437429428100586, "global_step": 508662, "epoch": 6128} {"train_loss": -27.659442901611328, "global_step": 508663, "epoch": 6128} {"train_loss": -27.266529083251953, "global_step": 508664, "epoch": 6128} {"train_loss": -27.141620635986328, "global_step": 508665, "epoch": 6128} {"train_loss": -26.75359535217285, "global_step": 508666, "epoch": 6128} {"train_loss": -25.99362564086914, "global_step": 508667, "epoch": 6128} {"train_loss": -26.80635643005371, "global_step": 508668, "epoch": 6128} {"train_loss": -27.466110229492188, "global_step": 508669, "epoch": 6128} {"train_loss": -27.422277450561523, "global_step": 508670, "epoch": 6128} {"train_loss": -27.28993034362793, "global_step": 508671, "epoch": 6128} {"train_loss": -27.448932647705078, "global_step": 508672, "epoch": 6128} {"train_loss": -27.465290069580078, "global_step": 508673, "epoch": 6128} {"train_loss": -27.086820602416992, "global_step": 508674, "epoch": 6128} {"train_loss": -26.8361759185791, "global_step": 508675, "epoch": 6128} {"train_loss": -27.83660888671875, "global_step": 508676, "epoch": 6128} {"train_loss": -27.734405517578125, "global_step": 508677, "epoch": 6128} {"train_loss": -27.518430709838867, "global_step": 508678, "epoch": 6128} {"train_loss": -27.5047550201416, "global_step": 508679, "epoch": 6128} {"train_loss": -26.8074951171875, "global_step": 508680, "epoch": 6128} {"train_loss": -27.11115837097168, "global_step": 508681, "epoch": 6128} {"train_loss": -27.306821823120117, "global_step": 508682, "epoch": 6128} {"train_loss": -26.899869918823242, "global_step": 508683, "epoch": 6128} {"train_loss": -27.226306915283203, "global_step": 508684, "epoch": 6128} {"train_loss": -27.1545352935791, "global_step": 508685, "epoch": 6128} {"train_loss": -27.498029708862305, "global_step": 508686, "epoch": 6128} {"train_loss": -27.2601261138916, "global_step": 508687, "epoch": 6128} {"train_loss": -27.527271270751953, "global_step": 508688, "epoch": 6128} {"train_loss": -27.245595932006836, "global_step": 508689, "epoch": 6128} {"train_loss": -27.5542049407959, "global_step": 508690, "epoch": 6128} {"train_loss": -27.299787521362305, "global_step": 508691, "epoch": 6128} {"train_loss": -27.213367462158203, "global_step": 508692, "epoch": 6128} {"train_loss": -27.43121910095215, "global_step": 508693, "epoch": 6128} {"train_loss": -27.1700382232666, "global_step": 508694, "epoch": 6128} {"train_loss": -27.203800201416016, "global_step": 508695, "epoch": 6128} {"train_loss": -27.522968292236328, "global_step": 508696, "epoch": 6128} {"train_loss": -27.249948501586914, "global_step": 508697, "epoch": 6128} {"train_loss": -27.859893798828125, "global_step": 508698, "epoch": 6128} {"train_loss": -27.880329132080078, "global_step": 508699, "epoch": 6128} {"train_loss": -27.64763832092285, "global_step": 508700, "epoch": 6128} {"train_loss": -27.713354110717773, "global_step": 508701, "epoch": 6128} {"train_loss": -27.59004783630371, "global_step": 508702, "epoch": 6128} {"train_loss": -27.2039852142334, "global_step": 508703, "epoch": 6128} {"train_loss": -27.789281845092773, "global_step": 508704, "epoch": 6128} {"train_loss": -27.824981689453125, "global_step": 508705, "epoch": 6128} {"train_loss": -27.291699995477515, "global_step": 508706, "epoch": 6128, "val_loss": 6569106.0} {"train_loss": -26.20411491394043, "global_step": 508707, "epoch": 6129} {"train_loss": -26.804412841796875, "global_step": 508708, "epoch": 6129} {"train_loss": -27.339990615844727, "global_step": 508709, "epoch": 6129} {"train_loss": -26.632543563842773, "global_step": 508710, "epoch": 6129} {"train_loss": -27.018970489501953, "global_step": 508711, "epoch": 6129} {"train_loss": -27.2210693359375, "global_step": 508712, "epoch": 6129} {"train_loss": -26.675235748291016, "global_step": 508713, "epoch": 6129} {"train_loss": -27.199600219726562, "global_step": 508714, "epoch": 6129} {"train_loss": -26.8619384765625, "global_step": 508715, "epoch": 6129} {"train_loss": -27.46882438659668, "global_step": 508716, "epoch": 6129} {"train_loss": -26.91634178161621, "global_step": 508717, "epoch": 6129} {"train_loss": -27.141416549682617, "global_step": 508718, "epoch": 6129} {"train_loss": -27.113636016845703, "global_step": 508719, "epoch": 6129} {"train_loss": -27.05769157409668, "global_step": 508720, "epoch": 6129} {"train_loss": -27.126577377319336, "global_step": 508721, "epoch": 6129} {"train_loss": -27.008956909179688, "global_step": 508722, "epoch": 6129} {"train_loss": -27.057546615600586, "global_step": 508723, "epoch": 6129} {"train_loss": -26.878061294555664, "global_step": 508724, "epoch": 6129} {"train_loss": -27.566938400268555, "global_step": 508725, "epoch": 6129} {"train_loss": -27.123926162719727, "global_step": 508726, "epoch": 6129} {"train_loss": -27.20745277404785, "global_step": 508727, "epoch": 6129} {"train_loss": -27.043333053588867, "global_step": 508728, "epoch": 6129} {"train_loss": -27.196014404296875, "global_step": 508729, "epoch": 6129} {"train_loss": -27.253131866455078, "global_step": 508730, "epoch": 6129} {"train_loss": -27.47796630859375, "global_step": 508731, "epoch": 6129} {"train_loss": -27.34248161315918, "global_step": 508732, "epoch": 6129} {"train_loss": -27.458545684814453, "global_step": 508733, "epoch": 6129} {"train_loss": -27.269412994384766, "global_step": 508734, "epoch": 6129} {"train_loss": -26.98188591003418, "global_step": 508735, "epoch": 6129} {"train_loss": -27.417699813842773, "global_step": 508736, "epoch": 6129} {"train_loss": -27.71430778503418, "global_step": 508737, "epoch": 6129} {"train_loss": -27.579700469970703, "global_step": 508738, "epoch": 6129} {"train_loss": -27.82415771484375, "global_step": 508739, "epoch": 6129} {"train_loss": -27.37152671813965, "global_step": 508740, "epoch": 6129} {"train_loss": -27.4995059967041, "global_step": 508741, "epoch": 6129} {"train_loss": -27.01885414123535, "global_step": 508742, "epoch": 6129} {"train_loss": -27.5532283782959, "global_step": 508743, "epoch": 6129} {"train_loss": -27.81418800354004, "global_step": 508744, "epoch": 6129} {"train_loss": -27.134735107421875, "global_step": 508745, "epoch": 6129} {"train_loss": -27.4792537689209, "global_step": 508746, "epoch": 6129} {"train_loss": -27.357837677001953, "global_step": 508747, "epoch": 6129} {"train_loss": -28.09140968322754, "global_step": 508748, "epoch": 6129} {"train_loss": -27.4637451171875, "global_step": 508749, "epoch": 6129} {"train_loss": -27.692529678344727, "global_step": 508750, "epoch": 6129} {"train_loss": -27.741077423095703, "global_step": 508751, "epoch": 6129} {"train_loss": -27.884906768798828, "global_step": 508752, "epoch": 6129} {"train_loss": -27.602222442626953, "global_step": 508753, "epoch": 6129} {"train_loss": -27.4697322845459, "global_step": 508754, "epoch": 6129} {"train_loss": -27.263614654541016, "global_step": 508755, "epoch": 6129} {"train_loss": -27.614429473876953, "global_step": 508756, "epoch": 6129} {"train_loss": -27.601789474487305, "global_step": 508757, "epoch": 6129} {"train_loss": -27.860095977783203, "global_step": 508758, "epoch": 6129} {"train_loss": -27.490751266479492, "global_step": 508759, "epoch": 6129} {"train_loss": -27.63722801208496, "global_step": 508760, "epoch": 6129} {"train_loss": -27.50067138671875, "global_step": 508761, "epoch": 6129} {"train_loss": -27.725576400756836, "global_step": 508762, "epoch": 6129} {"train_loss": -27.161062240600586, "global_step": 508763, "epoch": 6129} {"train_loss": -27.240039825439453, "global_step": 508764, "epoch": 6129} {"train_loss": -27.757461547851562, "global_step": 508765, "epoch": 6129} {"train_loss": -27.29900550842285, "global_step": 508766, "epoch": 6129} {"train_loss": -27.2857723236084, "global_step": 508767, "epoch": 6129} {"train_loss": -27.357763290405273, "global_step": 508768, "epoch": 6129} {"train_loss": -27.383316040039062, "global_step": 508769, "epoch": 6129} {"train_loss": -27.738439559936523, "global_step": 508770, "epoch": 6129} {"train_loss": -27.46354103088379, "global_step": 508771, "epoch": 6129} {"train_loss": -27.6134090423584, "global_step": 508772, "epoch": 6129} {"train_loss": -27.389892578125, "global_step": 508773, "epoch": 6129} {"train_loss": -27.681732177734375, "global_step": 508774, "epoch": 6129} {"train_loss": -27.58704948425293, "global_step": 508775, "epoch": 6129} {"train_loss": -27.748449325561523, "global_step": 508776, "epoch": 6129} {"train_loss": -26.92705726623535, "global_step": 508777, "epoch": 6129} {"train_loss": -27.4793643951416, "global_step": 508778, "epoch": 6129} {"train_loss": -27.659976959228516, "global_step": 508779, "epoch": 6129} {"train_loss": -27.39374351501465, "global_step": 508780, "epoch": 6129} {"train_loss": -27.48105239868164, "global_step": 508781, "epoch": 6129} {"train_loss": -27.40370750427246, "global_step": 508782, "epoch": 6129} {"train_loss": -27.431034088134766, "global_step": 508783, "epoch": 6129} {"train_loss": -27.560068130493164, "global_step": 508784, "epoch": 6129} {"train_loss": -27.496679306030273, "global_step": 508785, "epoch": 6129} {"train_loss": -27.283283233642578, "global_step": 508786, "epoch": 6129} {"train_loss": -27.153894424438477, "global_step": 508787, "epoch": 6129} {"train_loss": -27.596899032592773, "global_step": 508788, "epoch": 6129} {"train_loss": -27.379812125700067, "global_step": 508789, "epoch": 6129, "val_loss": 6573070.0} {"train_loss": -26.76199722290039, "global_step": 508790, "epoch": 6130} {"train_loss": -26.6241455078125, "global_step": 508791, "epoch": 6130} {"train_loss": -26.824756622314453, "global_step": 508792, "epoch": 6130} {"train_loss": -26.69587516784668, "global_step": 508793, "epoch": 6130} {"train_loss": -27.55414390563965, "global_step": 508794, "epoch": 6130} {"train_loss": -26.904590606689453, "global_step": 508795, "epoch": 6130} {"train_loss": -27.353540420532227, "global_step": 508796, "epoch": 6130} {"train_loss": -27.312768936157227, "global_step": 508797, "epoch": 6130} {"train_loss": -27.523822784423828, "global_step": 508798, "epoch": 6130} {"train_loss": -27.357019424438477, "global_step": 508799, "epoch": 6130} {"train_loss": -27.008581161499023, "global_step": 508800, "epoch": 6130} {"train_loss": -27.491912841796875, "global_step": 508801, "epoch": 6130} {"train_loss": -27.476865768432617, "global_step": 508802, "epoch": 6130} {"train_loss": -27.448034286499023, "global_step": 508803, "epoch": 6130} {"train_loss": -27.151376724243164, "global_step": 508804, "epoch": 6130} {"train_loss": -27.365646362304688, "global_step": 508805, "epoch": 6130} {"train_loss": -27.609891891479492, "global_step": 508806, "epoch": 6130} {"train_loss": -27.205896377563477, "global_step": 508807, "epoch": 6130} {"train_loss": -27.166357040405273, "global_step": 508808, "epoch": 6130} {"train_loss": -27.354841232299805, "global_step": 508809, "epoch": 6130} {"train_loss": -27.2596435546875, "global_step": 508810, "epoch": 6130} {"train_loss": -27.427488327026367, "global_step": 508811, "epoch": 6130} {"train_loss": -27.298288345336914, "global_step": 508812, "epoch": 6130} {"train_loss": -27.0521183013916, "global_step": 508813, "epoch": 6130} {"train_loss": -27.185928344726562, "global_step": 508814, "epoch": 6130} {"train_loss": -27.555700302124023, "global_step": 508815, "epoch": 6130} {"train_loss": -27.708799362182617, "global_step": 508816, "epoch": 6130} {"train_loss": -27.1224365234375, "global_step": 508817, "epoch": 6130} {"train_loss": -27.1050968170166, "global_step": 508818, "epoch": 6130} {"train_loss": -27.440046310424805, "global_step": 508819, "epoch": 6130} {"train_loss": -27.168777465820312, "global_step": 508820, "epoch": 6130} {"train_loss": -27.382287979125977, "global_step": 508821, "epoch": 6130} {"train_loss": -27.650623321533203, "global_step": 508822, "epoch": 6130} {"train_loss": -27.3077392578125, "global_step": 508823, "epoch": 6130} {"train_loss": -27.301502227783203, "global_step": 508824, "epoch": 6130} {"train_loss": -27.390859603881836, "global_step": 508825, "epoch": 6130} {"train_loss": -27.213470458984375, "global_step": 508826, "epoch": 6130} {"train_loss": -26.785058975219727, "global_step": 508827, "epoch": 6130} {"train_loss": -27.438003540039062, "global_step": 508828, "epoch": 6130} {"train_loss": -27.459360122680664, "global_step": 508829, "epoch": 6130} {"train_loss": -27.344308853149414, "global_step": 508830, "epoch": 6130} {"train_loss": -27.429853439331055, "global_step": 508831, "epoch": 6130} {"train_loss": -27.83563232421875, "global_step": 508832, "epoch": 6130} {"train_loss": -27.303298950195312, "global_step": 508833, "epoch": 6130} {"train_loss": -27.73737144470215, "global_step": 508834, "epoch": 6130} {"train_loss": -27.462560653686523, "global_step": 508835, "epoch": 6130} {"train_loss": -27.180505752563477, "global_step": 508836, "epoch": 6130} {"train_loss": -27.6292724609375, "global_step": 508837, "epoch": 6130} {"train_loss": -27.520238876342773, "global_step": 508838, "epoch": 6130} {"train_loss": -27.27705192565918, "global_step": 508839, "epoch": 6130} {"train_loss": -27.602624893188477, "global_step": 508840, "epoch": 6130} {"train_loss": -27.51352310180664, "global_step": 508841, "epoch": 6130} {"train_loss": -27.159778594970703, "global_step": 508842, "epoch": 6130} {"train_loss": -27.65907096862793, "global_step": 508843, "epoch": 6130} {"train_loss": -27.373071670532227, "global_step": 508844, "epoch": 6130} {"train_loss": -27.580982208251953, "global_step": 508845, "epoch": 6130} {"train_loss": -27.4146728515625, "global_step": 508846, "epoch": 6130} {"train_loss": -27.764196395874023, "global_step": 508847, "epoch": 6130} {"train_loss": -27.2081298828125, "global_step": 508848, "epoch": 6130} {"train_loss": -27.481901168823242, "global_step": 508849, "epoch": 6130} {"train_loss": -27.257232666015625, "global_step": 508850, "epoch": 6130} {"train_loss": -27.3028621673584, "global_step": 508851, "epoch": 6130} {"train_loss": -27.074033737182617, "global_step": 508852, "epoch": 6130} {"train_loss": -27.2945613861084, "global_step": 508853, "epoch": 6130} {"train_loss": -27.507009506225586, "global_step": 508854, "epoch": 6130} {"train_loss": -27.61872673034668, "global_step": 508855, "epoch": 6130} {"train_loss": -27.34151268005371, "global_step": 508856, "epoch": 6130} {"train_loss": -27.417470932006836, "global_step": 508857, "epoch": 6130} {"train_loss": -27.518402099609375, "global_step": 508858, "epoch": 6130} {"train_loss": -27.693099975585938, "global_step": 508859, "epoch": 6130} {"train_loss": -27.917865753173828, "global_step": 508860, "epoch": 6130} {"train_loss": -27.2864933013916, "global_step": 508861, "epoch": 6130} {"train_loss": -27.51235008239746, "global_step": 508862, "epoch": 6130} {"train_loss": -27.527740478515625, "global_step": 508863, "epoch": 6130} {"train_loss": -27.602746963500977, "global_step": 508864, "epoch": 6130} {"train_loss": -27.459375381469727, "global_step": 508865, "epoch": 6130} {"train_loss": -27.7249813079834, "global_step": 508866, "epoch": 6130} {"train_loss": -27.56854248046875, "global_step": 508867, "epoch": 6130} {"train_loss": -27.697708129882812, "global_step": 508868, "epoch": 6130} {"train_loss": -27.563434600830078, "global_step": 508869, "epoch": 6130} {"train_loss": -27.2292537689209, "global_step": 508870, "epoch": 6130} {"train_loss": -27.54095458984375, "global_step": 508871, "epoch": 6130} {"train_loss": -27.358406434576196, "global_step": 508872, "epoch": 6130, "val_loss": 6618440.5} {"train_loss": -27.333852767944336, "global_step": 508873, "epoch": 6131} {"train_loss": -27.50770378112793, "global_step": 508874, "epoch": 6131} {"train_loss": -27.290685653686523, "global_step": 508875, "epoch": 6131} {"train_loss": -27.036914825439453, "global_step": 508876, "epoch": 6131} {"train_loss": -26.923490524291992, "global_step": 508877, "epoch": 6131} {"train_loss": -26.83217430114746, "global_step": 508878, "epoch": 6131} {"train_loss": -27.56165885925293, "global_step": 508879, "epoch": 6131} {"train_loss": -26.934616088867188, "global_step": 508880, "epoch": 6131} {"train_loss": -27.122608184814453, "global_step": 508881, "epoch": 6131} {"train_loss": -26.778364181518555, "global_step": 508882, "epoch": 6131} {"train_loss": -27.015674591064453, "global_step": 508883, "epoch": 6131} {"train_loss": -27.407424926757812, "global_step": 508884, "epoch": 6131} {"train_loss": -27.177587509155273, "global_step": 508885, "epoch": 6131} {"train_loss": -27.614013671875, "global_step": 508886, "epoch": 6131} {"train_loss": -27.46723747253418, "global_step": 508887, "epoch": 6131} {"train_loss": -27.097204208374023, "global_step": 508888, "epoch": 6131} {"train_loss": -27.15643882751465, "global_step": 508889, "epoch": 6131} {"train_loss": -27.30313491821289, "global_step": 508890, "epoch": 6131} {"train_loss": -27.141408920288086, "global_step": 508891, "epoch": 6131} {"train_loss": -27.091068267822266, "global_step": 508892, "epoch": 6131} {"train_loss": -27.351343154907227, "global_step": 508893, "epoch": 6131} {"train_loss": -27.55811882019043, "global_step": 508894, "epoch": 6131} {"train_loss": -27.616418838500977, "global_step": 508895, "epoch": 6131} {"train_loss": -27.22926139831543, "global_step": 508896, "epoch": 6131} {"train_loss": -26.98712730407715, "global_step": 508897, "epoch": 6131} {"train_loss": -27.154882431030273, "global_step": 508898, "epoch": 6131} {"train_loss": -27.272397994995117, "global_step": 508899, "epoch": 6131} {"train_loss": -27.555500030517578, "global_step": 508900, "epoch": 6131} {"train_loss": -27.49335289001465, "global_step": 508901, "epoch": 6131} {"train_loss": -26.9324951171875, "global_step": 508902, "epoch": 6131} {"train_loss": -27.118671417236328, "global_step": 508903, "epoch": 6131} {"train_loss": -27.5418758392334, "global_step": 508904, "epoch": 6131} {"train_loss": -26.987323760986328, "global_step": 508905, "epoch": 6131} {"train_loss": -26.991683959960938, "global_step": 508906, "epoch": 6131} {"train_loss": -27.443185806274414, "global_step": 508907, "epoch": 6131} {"train_loss": -27.758686065673828, "global_step": 508908, "epoch": 6131} {"train_loss": -27.269681930541992, "global_step": 508909, "epoch": 6131} {"train_loss": -27.6466121673584, "global_step": 508910, "epoch": 6131} {"train_loss": -27.4388484954834, "global_step": 508911, "epoch": 6131} {"train_loss": -27.57147789001465, "global_step": 508912, "epoch": 6131} {"train_loss": -27.39698600769043, "global_step": 508913, "epoch": 6131} {"train_loss": -27.71878433227539, "global_step": 508914, "epoch": 6131} {"train_loss": -27.659454345703125, "global_step": 508915, "epoch": 6131} {"train_loss": -27.423608779907227, "global_step": 508916, "epoch": 6131} {"train_loss": -27.577478408813477, "global_step": 508917, "epoch": 6131} {"train_loss": -27.584613800048828, "global_step": 508918, "epoch": 6131} {"train_loss": -27.449979782104492, "global_step": 508919, "epoch": 6131} {"train_loss": -27.750823974609375, "global_step": 508920, "epoch": 6131} {"train_loss": -27.690671920776367, "global_step": 508921, "epoch": 6131} {"train_loss": -27.78481101989746, "global_step": 508922, "epoch": 6131} {"train_loss": -26.941177368164062, "global_step": 508923, "epoch": 6131} {"train_loss": -27.437402725219727, "global_step": 508924, "epoch": 6131} {"train_loss": -27.59286880493164, "global_step": 508925, "epoch": 6131} {"train_loss": -27.288122177124023, "global_step": 508926, "epoch": 6131} {"train_loss": -27.59779167175293, "global_step": 508927, "epoch": 6131} {"train_loss": -27.653396606445312, "global_step": 508928, "epoch": 6131} {"train_loss": -27.40143394470215, "global_step": 508929, "epoch": 6131} {"train_loss": -27.66400718688965, "global_step": 508930, "epoch": 6131} {"train_loss": -27.862457275390625, "global_step": 508931, "epoch": 6131} {"train_loss": -27.418075561523438, "global_step": 508932, "epoch": 6131} {"train_loss": -27.7377872467041, "global_step": 508933, "epoch": 6131} {"train_loss": -27.7442684173584, "global_step": 508934, "epoch": 6131} {"train_loss": -27.621435165405273, "global_step": 508935, "epoch": 6131} {"train_loss": -27.18291664123535, "global_step": 508936, "epoch": 6131} {"train_loss": -27.530866622924805, "global_step": 508937, "epoch": 6131} {"train_loss": -27.6228084564209, "global_step": 508938, "epoch": 6131} {"train_loss": -27.508214950561523, "global_step": 508939, "epoch": 6131} {"train_loss": -27.600849151611328, "global_step": 508940, "epoch": 6131} {"train_loss": -26.913808822631836, "global_step": 508941, "epoch": 6131} {"train_loss": -27.4540958404541, "global_step": 508942, "epoch": 6131} {"train_loss": -27.200674057006836, "global_step": 508943, "epoch": 6131} {"train_loss": -27.585412979125977, "global_step": 508944, "epoch": 6131} {"train_loss": -27.42206382751465, "global_step": 508945, "epoch": 6131} {"train_loss": -27.2150936126709, "global_step": 508946, "epoch": 6131} {"train_loss": -27.37591552734375, "global_step": 508947, "epoch": 6131} {"train_loss": -27.15314292907715, "global_step": 508948, "epoch": 6131} {"train_loss": -27.408279418945312, "global_step": 508949, "epoch": 6131} {"train_loss": -27.475515365600586, "global_step": 508950, "epoch": 6131} {"train_loss": -27.621007919311523, "global_step": 508951, "epoch": 6131} {"train_loss": -27.162006378173828, "global_step": 508952, "epoch": 6131} {"train_loss": -27.743616104125977, "global_step": 508953, "epoch": 6131} {"train_loss": -26.977643966674805, "global_step": 508954, "epoch": 6131} {"train_loss": -27.363458426601916, "global_step": 508955, "epoch": 6131, "val_loss": 6535087.5} {"train_loss": -25.286619186401367, "global_step": 508956, "epoch": 6132} {"train_loss": -24.806015014648438, "global_step": 508957, "epoch": 6132} {"train_loss": -23.78175926208496, "global_step": 508958, "epoch": 6132} {"train_loss": -24.52541160583496, "global_step": 508959, "epoch": 6132} {"train_loss": -25.921838760375977, "global_step": 508960, "epoch": 6132} {"train_loss": -26.185001373291016, "global_step": 508961, "epoch": 6132} {"train_loss": -26.21699333190918, "global_step": 508962, "epoch": 6132} {"train_loss": -26.077096939086914, "global_step": 508963, "epoch": 6132} {"train_loss": -26.63348960876465, "global_step": 508964, "epoch": 6132} {"train_loss": -26.562952041625977, "global_step": 508965, "epoch": 6132} {"train_loss": -26.09698486328125, "global_step": 508966, "epoch": 6132} {"train_loss": -26.720468521118164, "global_step": 508967, "epoch": 6132} {"train_loss": -26.274755477905273, "global_step": 508968, "epoch": 6132} {"train_loss": -26.607696533203125, "global_step": 508969, "epoch": 6132} {"train_loss": -26.555723190307617, "global_step": 508970, "epoch": 6132} {"train_loss": -27.029815673828125, "global_step": 508971, "epoch": 6132} {"train_loss": -26.782745361328125, "global_step": 508972, "epoch": 6132} {"train_loss": -26.71974754333496, "global_step": 508973, "epoch": 6132} {"train_loss": -26.842512130737305, "global_step": 508974, "epoch": 6132} {"train_loss": -26.935394287109375, "global_step": 508975, "epoch": 6132} {"train_loss": -26.918964385986328, "global_step": 508976, "epoch": 6132} {"train_loss": -26.969125747680664, "global_step": 508977, "epoch": 6132} {"train_loss": -26.926916122436523, "global_step": 508978, "epoch": 6132} {"train_loss": -27.353601455688477, "global_step": 508979, "epoch": 6132} {"train_loss": -27.115222930908203, "global_step": 508980, "epoch": 6132} {"train_loss": -27.276336669921875, "global_step": 508981, "epoch": 6132} {"train_loss": -27.184799194335938, "global_step": 508982, "epoch": 6132} {"train_loss": -27.31894874572754, "global_step": 508983, "epoch": 6132} {"train_loss": -27.20769691467285, "global_step": 508984, "epoch": 6132} {"train_loss": -26.921558380126953, "global_step": 508985, "epoch": 6132} {"train_loss": -26.930368423461914, "global_step": 508986, "epoch": 6132} {"train_loss": -27.150766372680664, "global_step": 508987, "epoch": 6132} {"train_loss": -27.342737197875977, "global_step": 508988, "epoch": 6132} {"train_loss": -27.557966232299805, "global_step": 508989, "epoch": 6132} {"train_loss": -27.601232528686523, "global_step": 508990, "epoch": 6132} {"train_loss": -27.379255294799805, "global_step": 508991, "epoch": 6132} {"train_loss": -27.336181640625, "global_step": 508992, "epoch": 6132} {"train_loss": -27.4870548248291, "global_step": 508993, "epoch": 6132} {"train_loss": -27.41552734375, "global_step": 508994, "epoch": 6132} {"train_loss": -27.16581153869629, "global_step": 508995, "epoch": 6132} {"train_loss": -27.282367706298828, "global_step": 508996, "epoch": 6132} {"train_loss": -27.61317253112793, "global_step": 508997, "epoch": 6132} {"train_loss": -27.611194610595703, "global_step": 508998, "epoch": 6132} {"train_loss": -27.89080238342285, "global_step": 508999, "epoch": 6132} {"train_loss": -27.718063354492188, "global_step": 509000, "epoch": 6132} {"train_loss": -27.79059410095215, "global_step": 509001, "epoch": 6132} {"train_loss": -27.565982818603516, "global_step": 509002, "epoch": 6132} {"train_loss": -27.96010398864746, "global_step": 509003, "epoch": 6132} {"train_loss": -28.03799819946289, "global_step": 509004, "epoch": 6132} {"train_loss": -27.727697372436523, "global_step": 509005, "epoch": 6132} {"train_loss": -27.45220375061035, "global_step": 509006, "epoch": 6132} {"train_loss": -27.833358764648438, "global_step": 509007, "epoch": 6132} {"train_loss": -27.50457763671875, "global_step": 509008, "epoch": 6132} {"train_loss": -27.561933517456055, "global_step": 509009, "epoch": 6132} {"train_loss": -27.588672637939453, "global_step": 509010, "epoch": 6132} {"train_loss": -27.48701286315918, "global_step": 509011, "epoch": 6132} {"train_loss": -27.547094345092773, "global_step": 509012, "epoch": 6132} {"train_loss": -27.731525421142578, "global_step": 509013, "epoch": 6132} {"train_loss": -27.6147518157959, "global_step": 509014, "epoch": 6132} {"train_loss": -27.550872802734375, "global_step": 509015, "epoch": 6132} {"train_loss": -27.888513565063477, "global_step": 509016, "epoch": 6132} {"train_loss": -27.61932945251465, "global_step": 509017, "epoch": 6132} {"train_loss": -27.493183135986328, "global_step": 509018, "epoch": 6132} {"train_loss": -27.398107528686523, "global_step": 509019, "epoch": 6132} {"train_loss": -27.197235107421875, "global_step": 509020, "epoch": 6132} {"train_loss": -27.09102439880371, "global_step": 509021, "epoch": 6132} {"train_loss": -27.065855026245117, "global_step": 509022, "epoch": 6132} {"train_loss": -26.56708335876465, "global_step": 509023, "epoch": 6132} {"train_loss": -26.58247184753418, "global_step": 509024, "epoch": 6132} {"train_loss": -26.928089141845703, "global_step": 509025, "epoch": 6132} {"train_loss": -27.43671989440918, "global_step": 509026, "epoch": 6132} {"train_loss": -27.33761978149414, "global_step": 509027, "epoch": 6132} {"train_loss": -26.977420806884766, "global_step": 509028, "epoch": 6132} {"train_loss": -26.76308250427246, "global_step": 509029, "epoch": 6132} {"train_loss": -27.164743423461914, "global_step": 509030, "epoch": 6132} {"train_loss": -27.476537704467773, "global_step": 509031, "epoch": 6132} {"train_loss": -26.7063045501709, "global_step": 509032, "epoch": 6132} {"train_loss": -27.231876373291016, "global_step": 509033, "epoch": 6132} {"train_loss": -27.12078285217285, "global_step": 509034, "epoch": 6132} {"train_loss": -27.364990234375, "global_step": 509035, "epoch": 6132} {"train_loss": -27.20309829711914, "global_step": 509036, "epoch": 6132} {"train_loss": -27.260351181030273, "global_step": 509037, "epoch": 6132} {"train_loss": -27.045914799334057, "global_step": 509038, "epoch": 6132, "val_loss": 6580077.5} {"train_loss": -26.664087295532227, "global_step": 509039, "epoch": 6133} {"train_loss": -26.903156280517578, "global_step": 509040, "epoch": 6133} {"train_loss": -26.079944610595703, "global_step": 509041, "epoch": 6133} {"train_loss": -26.53378677368164, "global_step": 509042, "epoch": 6133} {"train_loss": -26.315160751342773, "global_step": 509043, "epoch": 6133} {"train_loss": -26.531400680541992, "global_step": 509044, "epoch": 6133} {"train_loss": -26.70794105529785, "global_step": 509045, "epoch": 6133} {"train_loss": -26.753528594970703, "global_step": 509046, "epoch": 6133} {"train_loss": -26.544580459594727, "global_step": 509047, "epoch": 6133} {"train_loss": -26.81068229675293, "global_step": 509048, "epoch": 6133} {"train_loss": -26.998327255249023, "global_step": 509049, "epoch": 6133} {"train_loss": -26.848386764526367, "global_step": 509050, "epoch": 6133} {"train_loss": -27.256383895874023, "global_step": 509051, "epoch": 6133} {"train_loss": -26.921972274780273, "global_step": 509052, "epoch": 6133} {"train_loss": -26.904712677001953, "global_step": 509053, "epoch": 6133} {"train_loss": -27.36586570739746, "global_step": 509054, "epoch": 6133} {"train_loss": -27.184478759765625, "global_step": 509055, "epoch": 6133} {"train_loss": -26.804630279541016, "global_step": 509056, "epoch": 6133} {"train_loss": -27.32160758972168, "global_step": 509057, "epoch": 6133} {"train_loss": -27.4632625579834, "global_step": 509058, "epoch": 6133} {"train_loss": -27.023700714111328, "global_step": 509059, "epoch": 6133} {"train_loss": -27.437000274658203, "global_step": 509060, "epoch": 6133} {"train_loss": -27.08989906311035, "global_step": 509061, "epoch": 6133} {"train_loss": -27.423791885375977, "global_step": 509062, "epoch": 6133} {"train_loss": -27.39381217956543, "global_step": 509063, "epoch": 6133} {"train_loss": -27.5645751953125, "global_step": 509064, "epoch": 6133} {"train_loss": -27.511215209960938, "global_step": 509065, "epoch": 6133} {"train_loss": -27.439960479736328, "global_step": 509066, "epoch": 6133} {"train_loss": -27.30584716796875, "global_step": 509067, "epoch": 6133} {"train_loss": -27.322223663330078, "global_step": 509068, "epoch": 6133} {"train_loss": -27.591094970703125, "global_step": 509069, "epoch": 6133} {"train_loss": -27.553762435913086, "global_step": 509070, "epoch": 6133} {"train_loss": -27.38971519470215, "global_step": 509071, "epoch": 6133} {"train_loss": -28.009246826171875, "global_step": 509072, "epoch": 6133} {"train_loss": -27.68023681640625, "global_step": 509073, "epoch": 6133} {"train_loss": -27.172510147094727, "global_step": 509074, "epoch": 6133} {"train_loss": -28.011825561523438, "global_step": 509075, "epoch": 6133} {"train_loss": -27.301359176635742, "global_step": 509076, "epoch": 6133} {"train_loss": -27.7938175201416, "global_step": 509077, "epoch": 6133} {"train_loss": -27.701221466064453, "global_step": 509078, "epoch": 6133} {"train_loss": -27.720691680908203, "global_step": 509079, "epoch": 6133} {"train_loss": -27.483068466186523, "global_step": 509080, "epoch": 6133} {"train_loss": -27.360645294189453, "global_step": 509081, "epoch": 6133} {"train_loss": -27.76690673828125, "global_step": 509082, "epoch": 6133} {"train_loss": -27.517507553100586, "global_step": 509083, "epoch": 6133} {"train_loss": -27.65296745300293, "global_step": 509084, "epoch": 6133} {"train_loss": -27.659870147705078, "global_step": 509085, "epoch": 6133} {"train_loss": -27.704404830932617, "global_step": 509086, "epoch": 6133} {"train_loss": -27.492446899414062, "global_step": 509087, "epoch": 6133} {"train_loss": -27.614242553710938, "global_step": 509088, "epoch": 6133} {"train_loss": -27.8184814453125, "global_step": 509089, "epoch": 6133} {"train_loss": -27.2436580657959, "global_step": 509090, "epoch": 6133} {"train_loss": -27.293720245361328, "global_step": 509091, "epoch": 6133} {"train_loss": -27.554889678955078, "global_step": 509092, "epoch": 6133} {"train_loss": -27.68169593811035, "global_step": 509093, "epoch": 6133} {"train_loss": -27.360015869140625, "global_step": 509094, "epoch": 6133} {"train_loss": -27.3751277923584, "global_step": 509095, "epoch": 6133} {"train_loss": -27.50806999206543, "global_step": 509096, "epoch": 6133} {"train_loss": -27.23456382751465, "global_step": 509097, "epoch": 6133} {"train_loss": -27.20403480529785, "global_step": 509098, "epoch": 6133} {"train_loss": -27.217191696166992, "global_step": 509099, "epoch": 6133} {"train_loss": -27.339263916015625, "global_step": 509100, "epoch": 6133} {"train_loss": -27.32728385925293, "global_step": 509101, "epoch": 6133} {"train_loss": -27.307147979736328, "global_step": 509102, "epoch": 6133} {"train_loss": -27.63262367248535, "global_step": 509103, "epoch": 6133} {"train_loss": -27.709197998046875, "global_step": 509104, "epoch": 6133} {"train_loss": -27.487262725830078, "global_step": 509105, "epoch": 6133} {"train_loss": -27.5858097076416, "global_step": 509106, "epoch": 6133} {"train_loss": -27.643756866455078, "global_step": 509107, "epoch": 6133} {"train_loss": -27.958642959594727, "global_step": 509108, "epoch": 6133} {"train_loss": -27.437366485595703, "global_step": 509109, "epoch": 6133} {"train_loss": -27.100217819213867, "global_step": 509110, "epoch": 6133} {"train_loss": -27.244384765625, "global_step": 509111, "epoch": 6133} {"train_loss": -27.58278465270996, "global_step": 509112, "epoch": 6133} {"train_loss": -27.654052734375, "global_step": 509113, "epoch": 6133} {"train_loss": -27.395523071289062, "global_step": 509114, "epoch": 6133} {"train_loss": -27.207448959350586, "global_step": 509115, "epoch": 6133} {"train_loss": -27.661523818969727, "global_step": 509116, "epoch": 6133} {"train_loss": -27.918054580688477, "global_step": 509117, "epoch": 6133} {"train_loss": -27.2037410736084, "global_step": 509118, "epoch": 6133} {"train_loss": -27.01340103149414, "global_step": 509119, "epoch": 6133} {"train_loss": -26.96067237854004, "global_step": 509120, "epoch": 6133} {"train_loss": -27.314459076846937, "global_step": 509121, "epoch": 6133, "val_loss": 6490129.0} {"train_loss": -26.165273666381836, "global_step": 509122, "epoch": 6134} {"train_loss": -25.653249740600586, "global_step": 509123, "epoch": 6134} {"train_loss": -26.132986068725586, "global_step": 509124, "epoch": 6134} {"train_loss": -26.641483306884766, "global_step": 509125, "epoch": 6134} {"train_loss": -26.6168155670166, "global_step": 509126, "epoch": 6134} {"train_loss": -26.692895889282227, "global_step": 509127, "epoch": 6134} {"train_loss": -26.730621337890625, "global_step": 509128, "epoch": 6134} {"train_loss": -26.794179916381836, "global_step": 509129, "epoch": 6134} {"train_loss": -26.865833282470703, "global_step": 509130, "epoch": 6134} {"train_loss": -26.965438842773438, "global_step": 509131, "epoch": 6134} {"train_loss": -26.89165687561035, "global_step": 509132, "epoch": 6134} {"train_loss": -26.782018661499023, "global_step": 509133, "epoch": 6134} {"train_loss": -27.361631393432617, "global_step": 509134, "epoch": 6134} {"train_loss": -26.9646053314209, "global_step": 509135, "epoch": 6134} {"train_loss": -27.205106735229492, "global_step": 509136, "epoch": 6134} {"train_loss": -27.3253116607666, "global_step": 509137, "epoch": 6134} {"train_loss": -27.345529556274414, "global_step": 509138, "epoch": 6134} {"train_loss": -27.070470809936523, "global_step": 509139, "epoch": 6134} {"train_loss": -27.22576332092285, "global_step": 509140, "epoch": 6134} {"train_loss": -27.117582321166992, "global_step": 509141, "epoch": 6134} {"train_loss": -27.461389541625977, "global_step": 509142, "epoch": 6134} {"train_loss": -27.23910903930664, "global_step": 509143, "epoch": 6134} {"train_loss": -27.321664810180664, "global_step": 509144, "epoch": 6134} {"train_loss": -27.190185546875, "global_step": 509145, "epoch": 6134} {"train_loss": -27.422056198120117, "global_step": 509146, "epoch": 6134} {"train_loss": -27.4718017578125, "global_step": 509147, "epoch": 6134} {"train_loss": -27.57599449157715, "global_step": 509148, "epoch": 6134} {"train_loss": -27.734710693359375, "global_step": 509149, "epoch": 6134} {"train_loss": -27.2934627532959, "global_step": 509150, "epoch": 6134} {"train_loss": -27.0272159576416, "global_step": 509151, "epoch": 6134} {"train_loss": -27.440725326538086, "global_step": 509152, "epoch": 6134} {"train_loss": -27.65390968322754, "global_step": 509153, "epoch": 6134} {"train_loss": -27.385156631469727, "global_step": 509154, "epoch": 6134} {"train_loss": -27.43987464904785, "global_step": 509155, "epoch": 6134} {"train_loss": -27.653162002563477, "global_step": 509156, "epoch": 6134} {"train_loss": -27.458087921142578, "global_step": 509157, "epoch": 6134} {"train_loss": -27.407119750976562, "global_step": 509158, "epoch": 6134} {"train_loss": -27.19618034362793, "global_step": 509159, "epoch": 6134} {"train_loss": -27.632007598876953, "global_step": 509160, "epoch": 6134} {"train_loss": -27.277637481689453, "global_step": 509161, "epoch": 6134} {"train_loss": -27.43512535095215, "global_step": 509162, "epoch": 6134} {"train_loss": -27.53101921081543, "global_step": 509163, "epoch": 6134} {"train_loss": -27.79631996154785, "global_step": 509164, "epoch": 6134} {"train_loss": -27.705493927001953, "global_step": 509165, "epoch": 6134} {"train_loss": -27.7066593170166, "global_step": 509166, "epoch": 6134} {"train_loss": -27.657672882080078, "global_step": 509167, "epoch": 6134} {"train_loss": -27.705976486206055, "global_step": 509168, "epoch": 6134} {"train_loss": -27.801441192626953, "global_step": 509169, "epoch": 6134} {"train_loss": -27.532318115234375, "global_step": 509170, "epoch": 6134} {"train_loss": -27.960153579711914, "global_step": 509171, "epoch": 6134} {"train_loss": -27.474472045898438, "global_step": 509172, "epoch": 6134} {"train_loss": -27.977218627929688, "global_step": 509173, "epoch": 6134} {"train_loss": -27.49371337890625, "global_step": 509174, "epoch": 6134} {"train_loss": -27.588285446166992, "global_step": 509175, "epoch": 6134} {"train_loss": -27.619918823242188, "global_step": 509176, "epoch": 6134} {"train_loss": -27.2103214263916, "global_step": 509177, "epoch": 6134} {"train_loss": -26.87461280822754, "global_step": 509178, "epoch": 6134} {"train_loss": -27.479917526245117, "global_step": 509179, "epoch": 6134} {"train_loss": -26.8944034576416, "global_step": 509180, "epoch": 6134} {"train_loss": -27.294422149658203, "global_step": 509181, "epoch": 6134} {"train_loss": -27.46885108947754, "global_step": 509182, "epoch": 6134} {"train_loss": -27.735275268554688, "global_step": 509183, "epoch": 6134} {"train_loss": -27.755239486694336, "global_step": 509184, "epoch": 6134} {"train_loss": -27.405149459838867, "global_step": 509185, "epoch": 6134} {"train_loss": -27.35574722290039, "global_step": 509186, "epoch": 6134} {"train_loss": -27.569555282592773, "global_step": 509187, "epoch": 6134} {"train_loss": -27.359556198120117, "global_step": 509188, "epoch": 6134} {"train_loss": -27.022586822509766, "global_step": 509189, "epoch": 6134} {"train_loss": -26.760725021362305, "global_step": 509190, "epoch": 6134} {"train_loss": -26.129261016845703, "global_step": 509191, "epoch": 6134} {"train_loss": -26.342981338500977, "global_step": 509192, "epoch": 6134} {"train_loss": -27.107568740844727, "global_step": 509193, "epoch": 6134} {"train_loss": -27.568408966064453, "global_step": 509194, "epoch": 6134} {"train_loss": -26.60481834411621, "global_step": 509195, "epoch": 6134} {"train_loss": -27.214574813842773, "global_step": 509196, "epoch": 6134} {"train_loss": -27.400196075439453, "global_step": 509197, "epoch": 6134} {"train_loss": -27.016510009765625, "global_step": 509198, "epoch": 6134} {"train_loss": -27.738439559936523, "global_step": 509199, "epoch": 6134} {"train_loss": -27.28631591796875, "global_step": 509200, "epoch": 6134} {"train_loss": -27.238264083862305, "global_step": 509201, "epoch": 6134} {"train_loss": -27.56129264831543, "global_step": 509202, "epoch": 6134} {"train_loss": -27.345483779907227, "global_step": 509203, "epoch": 6134} {"train_loss": -27.266467220811958, "global_step": 509204, "epoch": 6134, "val_loss": 6556151.0} {"train_loss": -26.699798583984375, "global_step": 509205, "epoch": 6135} {"train_loss": -27.28937339782715, "global_step": 509206, "epoch": 6135} {"train_loss": -26.451099395751953, "global_step": 509207, "epoch": 6135} {"train_loss": -26.52088737487793, "global_step": 509208, "epoch": 6135} {"train_loss": -26.50616455078125, "global_step": 509209, "epoch": 6135} {"train_loss": -27.451416015625, "global_step": 509210, "epoch": 6135} {"train_loss": -26.4060001373291, "global_step": 509211, "epoch": 6135} {"train_loss": -26.75845718383789, "global_step": 509212, "epoch": 6135} {"train_loss": -27.022876739501953, "global_step": 509213, "epoch": 6135} {"train_loss": -26.744840621948242, "global_step": 509214, "epoch": 6135} {"train_loss": -26.820226669311523, "global_step": 509215, "epoch": 6135} {"train_loss": -27.065778732299805, "global_step": 509216, "epoch": 6135} {"train_loss": -26.890777587890625, "global_step": 509217, "epoch": 6135} {"train_loss": -27.1342830657959, "global_step": 509218, "epoch": 6135} {"train_loss": -27.124303817749023, "global_step": 509219, "epoch": 6135} {"train_loss": -27.4366455078125, "global_step": 509220, "epoch": 6135} {"train_loss": -27.162921905517578, "global_step": 509221, "epoch": 6135} {"train_loss": -27.552114486694336, "global_step": 509222, "epoch": 6135} {"train_loss": -27.57758140563965, "global_step": 509223, "epoch": 6135} {"train_loss": -27.256546020507812, "global_step": 509224, "epoch": 6135} {"train_loss": -27.453649520874023, "global_step": 509225, "epoch": 6135} {"train_loss": -27.49700927734375, "global_step": 509226, "epoch": 6135} {"train_loss": -27.4534854888916, "global_step": 509227, "epoch": 6135} {"train_loss": -27.333776473999023, "global_step": 509228, "epoch": 6135} {"train_loss": -27.431610107421875, "global_step": 509229, "epoch": 6135} {"train_loss": -27.233362197875977, "global_step": 509230, "epoch": 6135} {"train_loss": -26.9121150970459, "global_step": 509231, "epoch": 6135} {"train_loss": -27.478168487548828, "global_step": 509232, "epoch": 6135} {"train_loss": -27.54559326171875, "global_step": 509233, "epoch": 6135} {"train_loss": -27.515527725219727, "global_step": 509234, "epoch": 6135} {"train_loss": -27.496442794799805, "global_step": 509235, "epoch": 6135} {"train_loss": -27.821557998657227, "global_step": 509236, "epoch": 6135} {"train_loss": -27.875558853149414, "global_step": 509237, "epoch": 6135} {"train_loss": -27.29974937438965, "global_step": 509238, "epoch": 6135} {"train_loss": -27.732614517211914, "global_step": 509239, "epoch": 6135} {"train_loss": -27.746753692626953, "global_step": 509240, "epoch": 6135} {"train_loss": -27.439977645874023, "global_step": 509241, "epoch": 6135} {"train_loss": -27.38006591796875, "global_step": 509242, "epoch": 6135} {"train_loss": -27.781299591064453, "global_step": 509243, "epoch": 6135} {"train_loss": -27.636457443237305, "global_step": 509244, "epoch": 6135} {"train_loss": -27.551298141479492, "global_step": 509245, "epoch": 6135} {"train_loss": -27.46381187438965, "global_step": 509246, "epoch": 6135} {"train_loss": -27.604955673217773, "global_step": 509247, "epoch": 6135} {"train_loss": -27.5929012298584, "global_step": 509248, "epoch": 6135} {"train_loss": -27.75970458984375, "global_step": 509249, "epoch": 6135} {"train_loss": -27.660064697265625, "global_step": 509250, "epoch": 6135} {"train_loss": -27.900156021118164, "global_step": 509251, "epoch": 6135} {"train_loss": -27.656036376953125, "global_step": 509252, "epoch": 6135} {"train_loss": -27.909912109375, "global_step": 509253, "epoch": 6135} {"train_loss": -28.01129150390625, "global_step": 509254, "epoch": 6135} {"train_loss": -27.777973175048828, "global_step": 509255, "epoch": 6135} {"train_loss": -27.703210830688477, "global_step": 509256, "epoch": 6135} {"train_loss": -27.32838249206543, "global_step": 509257, "epoch": 6135} {"train_loss": -27.102689743041992, "global_step": 509258, "epoch": 6135} {"train_loss": -26.427099227905273, "global_step": 509259, "epoch": 6135} {"train_loss": -25.501951217651367, "global_step": 509260, "epoch": 6135} {"train_loss": -24.196584701538086, "global_step": 509261, "epoch": 6135} {"train_loss": -25.448535919189453, "global_step": 509262, "epoch": 6135} {"train_loss": -27.07081413269043, "global_step": 509263, "epoch": 6135} {"train_loss": -26.05523681640625, "global_step": 509264, "epoch": 6135} {"train_loss": -27.04486656188965, "global_step": 509265, "epoch": 6135} {"train_loss": -26.30708122253418, "global_step": 509266, "epoch": 6135} {"train_loss": -27.303579330444336, "global_step": 509267, "epoch": 6135} {"train_loss": -27.028345108032227, "global_step": 509268, "epoch": 6135} {"train_loss": -26.8970890045166, "global_step": 509269, "epoch": 6135} {"train_loss": -26.739810943603516, "global_step": 509270, "epoch": 6135} {"train_loss": -27.2703800201416, "global_step": 509271, "epoch": 6135} {"train_loss": -27.501834869384766, "global_step": 509272, "epoch": 6135} {"train_loss": -27.26822280883789, "global_step": 509273, "epoch": 6135} {"train_loss": -27.074209213256836, "global_step": 509274, "epoch": 6135} {"train_loss": -27.184667587280273, "global_step": 509275, "epoch": 6135} {"train_loss": -27.234786987304688, "global_step": 509276, "epoch": 6135} {"train_loss": -27.5194034576416, "global_step": 509277, "epoch": 6135} {"train_loss": -26.94268226623535, "global_step": 509278, "epoch": 6135} {"train_loss": -27.592432022094727, "global_step": 509279, "epoch": 6135} {"train_loss": -27.30043601989746, "global_step": 509280, "epoch": 6135} {"train_loss": -27.20361328125, "global_step": 509281, "epoch": 6135} {"train_loss": -27.746549606323242, "global_step": 509282, "epoch": 6135} {"train_loss": -27.1453800201416, "global_step": 509283, "epoch": 6135} {"train_loss": -27.98297691345215, "global_step": 509284, "epoch": 6135} {"train_loss": -27.359350204467773, "global_step": 509285, "epoch": 6135} {"train_loss": -27.276809692382812, "global_step": 509286, "epoch": 6135} {"train_loss": -27.192953891064747, "global_step": 509287, "epoch": 6135, "val_loss": 6584065.0} {"train_loss": -27.242218017578125, "global_step": 509288, "epoch": 6136} {"train_loss": -27.5136775970459, "global_step": 509289, "epoch": 6136} {"train_loss": -27.3022518157959, "global_step": 509290, "epoch": 6136} {"train_loss": -27.387372970581055, "global_step": 509291, "epoch": 6136} {"train_loss": -27.100194931030273, "global_step": 509292, "epoch": 6136} {"train_loss": -27.272052764892578, "global_step": 509293, "epoch": 6136} {"train_loss": -27.11692237854004, "global_step": 509294, "epoch": 6136} {"train_loss": -27.47626304626465, "global_step": 509295, "epoch": 6136} {"train_loss": -27.199966430664062, "global_step": 509296, "epoch": 6136} {"train_loss": -26.887786865234375, "global_step": 509297, "epoch": 6136} {"train_loss": -27.59583854675293, "global_step": 509298, "epoch": 6136} {"train_loss": -27.191959381103516, "global_step": 509299, "epoch": 6136} {"train_loss": -26.88616943359375, "global_step": 509300, "epoch": 6136} {"train_loss": -27.288227081298828, "global_step": 509301, "epoch": 6136} {"train_loss": -27.194293975830078, "global_step": 509302, "epoch": 6136} {"train_loss": -27.43259620666504, "global_step": 509303, "epoch": 6136} {"train_loss": -27.681766510009766, "global_step": 509304, "epoch": 6136} {"train_loss": -27.555883407592773, "global_step": 509305, "epoch": 6136} {"train_loss": -27.31963539123535, "global_step": 509306, "epoch": 6136} {"train_loss": -27.599634170532227, "global_step": 509307, "epoch": 6136} {"train_loss": -27.47136878967285, "global_step": 509308, "epoch": 6136} {"train_loss": -27.501422882080078, "global_step": 509309, "epoch": 6136} {"train_loss": -27.617895126342773, "global_step": 509310, "epoch": 6136} {"train_loss": -27.581586837768555, "global_step": 509311, "epoch": 6136} {"train_loss": -27.62115478515625, "global_step": 509312, "epoch": 6136} {"train_loss": -27.79803466796875, "global_step": 509313, "epoch": 6136} {"train_loss": -27.816858291625977, "global_step": 509314, "epoch": 6136} {"train_loss": -27.167463302612305, "global_step": 509315, "epoch": 6136} {"train_loss": -27.59992790222168, "global_step": 509316, "epoch": 6136} {"train_loss": -27.6297607421875, "global_step": 509317, "epoch": 6136} {"train_loss": -27.416494369506836, "global_step": 509318, "epoch": 6136} {"train_loss": -27.48829460144043, "global_step": 509319, "epoch": 6136} {"train_loss": -27.40949058532715, "global_step": 509320, "epoch": 6136} {"train_loss": -27.663043975830078, "global_step": 509321, "epoch": 6136} {"train_loss": -27.734827041625977, "global_step": 509322, "epoch": 6136} {"train_loss": -27.55409812927246, "global_step": 509323, "epoch": 6136} {"train_loss": -27.495492935180664, "global_step": 509324, "epoch": 6136} {"train_loss": -27.550146102905273, "global_step": 509325, "epoch": 6136} {"train_loss": -27.284271240234375, "global_step": 509326, "epoch": 6136} {"train_loss": -27.858535766601562, "global_step": 509327, "epoch": 6136} {"train_loss": -27.64235496520996, "global_step": 509328, "epoch": 6136} {"train_loss": -27.494842529296875, "global_step": 509329, "epoch": 6136} {"train_loss": -27.686065673828125, "global_step": 509330, "epoch": 6136} {"train_loss": -27.741796493530273, "global_step": 509331, "epoch": 6136} {"train_loss": -27.4024715423584, "global_step": 509332, "epoch": 6136} {"train_loss": -27.481115341186523, "global_step": 509333, "epoch": 6136} {"train_loss": -27.644620895385742, "global_step": 509334, "epoch": 6136} {"train_loss": -27.373016357421875, "global_step": 509335, "epoch": 6136} {"train_loss": -27.520751953125, "global_step": 509336, "epoch": 6136} {"train_loss": -28.022165298461914, "global_step": 509337, "epoch": 6136} {"train_loss": -27.684659957885742, "global_step": 509338, "epoch": 6136} {"train_loss": -27.6013126373291, "global_step": 509339, "epoch": 6136} {"train_loss": -27.818511962890625, "global_step": 509340, "epoch": 6136} {"train_loss": -27.779434204101562, "global_step": 509341, "epoch": 6136} {"train_loss": -27.74061393737793, "global_step": 509342, "epoch": 6136} {"train_loss": -27.724262237548828, "global_step": 509343, "epoch": 6136} {"train_loss": -27.68472671508789, "global_step": 509344, "epoch": 6136} {"train_loss": -27.516998291015625, "global_step": 509345, "epoch": 6136} {"train_loss": -27.598041534423828, "global_step": 509346, "epoch": 6136} {"train_loss": -27.464162826538086, "global_step": 509347, "epoch": 6136} {"train_loss": -26.842243194580078, "global_step": 509348, "epoch": 6136} {"train_loss": -27.305194854736328, "global_step": 509349, "epoch": 6136} {"train_loss": -27.589990615844727, "global_step": 509350, "epoch": 6136} {"train_loss": -27.351194381713867, "global_step": 509351, "epoch": 6136} {"train_loss": -27.531347274780273, "global_step": 509352, "epoch": 6136} {"train_loss": -27.344165802001953, "global_step": 509353, "epoch": 6136} {"train_loss": -27.907184600830078, "global_step": 509354, "epoch": 6136} {"train_loss": -28.19107437133789, "global_step": 509355, "epoch": 6136} {"train_loss": -27.792022705078125, "global_step": 509356, "epoch": 6136} {"train_loss": -27.56373405456543, "global_step": 509357, "epoch": 6136} {"train_loss": -27.605432510375977, "global_step": 509358, "epoch": 6136} {"train_loss": -27.430479049682617, "global_step": 509359, "epoch": 6136} {"train_loss": -27.277374267578125, "global_step": 509360, "epoch": 6136} {"train_loss": -27.404224395751953, "global_step": 509361, "epoch": 6136} {"train_loss": -27.32978630065918, "global_step": 509362, "epoch": 6136} {"train_loss": -27.617359161376953, "global_step": 509363, "epoch": 6136} {"train_loss": -27.5961971282959, "global_step": 509364, "epoch": 6136} {"train_loss": -27.36139488220215, "global_step": 509365, "epoch": 6136} {"train_loss": -27.932376861572266, "global_step": 509366, "epoch": 6136} {"train_loss": -27.734731674194336, "global_step": 509367, "epoch": 6136} {"train_loss": -27.817636489868164, "global_step": 509368, "epoch": 6136} {"train_loss": -27.480039596557617, "global_step": 509369, "epoch": 6136} {"train_loss": -27.504328693252013, "global_step": 509370, "epoch": 6136, "val_loss": 6586130.0} {"train_loss": -26.060163497924805, "global_step": 509371, "epoch": 6137} {"train_loss": -25.522459030151367, "global_step": 509372, "epoch": 6137} {"train_loss": -26.811710357666016, "global_step": 509373, "epoch": 6137} {"train_loss": -26.744001388549805, "global_step": 509374, "epoch": 6137} {"train_loss": -26.343677520751953, "global_step": 509375, "epoch": 6137} {"train_loss": -26.787799835205078, "global_step": 509376, "epoch": 6137} {"train_loss": -26.533008575439453, "global_step": 509377, "epoch": 6137} {"train_loss": -26.63068962097168, "global_step": 509378, "epoch": 6137} {"train_loss": -26.708667755126953, "global_step": 509379, "epoch": 6137} {"train_loss": -26.95403480529785, "global_step": 509380, "epoch": 6137} {"train_loss": -27.098398208618164, "global_step": 509381, "epoch": 6137} {"train_loss": -26.356061935424805, "global_step": 509382, "epoch": 6137} {"train_loss": -27.123199462890625, "global_step": 509383, "epoch": 6137} {"train_loss": -26.767927169799805, "global_step": 509384, "epoch": 6137} {"train_loss": -27.11086082458496, "global_step": 509385, "epoch": 6137} {"train_loss": -26.39058494567871, "global_step": 509386, "epoch": 6137} {"train_loss": -27.457340240478516, "global_step": 509387, "epoch": 6137} {"train_loss": -26.99175453186035, "global_step": 509388, "epoch": 6137} {"train_loss": -26.703815460205078, "global_step": 509389, "epoch": 6137} {"train_loss": -27.10914421081543, "global_step": 509390, "epoch": 6137} {"train_loss": -27.127180099487305, "global_step": 509391, "epoch": 6137} {"train_loss": -27.245121002197266, "global_step": 509392, "epoch": 6137} {"train_loss": -27.1333065032959, "global_step": 509393, "epoch": 6137} {"train_loss": -27.226703643798828, "global_step": 509394, "epoch": 6137} {"train_loss": -27.141098022460938, "global_step": 509395, "epoch": 6137} {"train_loss": -27.31790542602539, "global_step": 509396, "epoch": 6137} {"train_loss": -27.332433700561523, "global_step": 509397, "epoch": 6137} {"train_loss": -27.422943115234375, "global_step": 509398, "epoch": 6137} {"train_loss": -27.581390380859375, "global_step": 509399, "epoch": 6137} {"train_loss": -27.444915771484375, "global_step": 509400, "epoch": 6137} {"train_loss": -27.5083065032959, "global_step": 509401, "epoch": 6137} {"train_loss": -27.442102432250977, "global_step": 509402, "epoch": 6137} {"train_loss": -27.442441940307617, "global_step": 509403, "epoch": 6137} {"train_loss": -27.32281494140625, "global_step": 509404, "epoch": 6137} {"train_loss": -27.54062271118164, "global_step": 509405, "epoch": 6137} {"train_loss": -27.47102165222168, "global_step": 509406, "epoch": 6137} {"train_loss": -27.665103912353516, "global_step": 509407, "epoch": 6137} {"train_loss": -27.877490997314453, "global_step": 509408, "epoch": 6137} {"train_loss": -27.846149444580078, "global_step": 509409, "epoch": 6137} {"train_loss": -27.692724227905273, "global_step": 509410, "epoch": 6137} {"train_loss": -27.67462730407715, "global_step": 509411, "epoch": 6137} {"train_loss": -27.88848876953125, "global_step": 509412, "epoch": 6137} {"train_loss": -27.4410457611084, "global_step": 509413, "epoch": 6137} {"train_loss": -28.0537052154541, "global_step": 509414, "epoch": 6137} {"train_loss": -27.71429443359375, "global_step": 509415, "epoch": 6137} {"train_loss": -27.600818634033203, "global_step": 509416, "epoch": 6137} {"train_loss": -27.322263717651367, "global_step": 509417, "epoch": 6137} {"train_loss": -27.622690200805664, "global_step": 509418, "epoch": 6137} {"train_loss": -27.701160430908203, "global_step": 509419, "epoch": 6137} {"train_loss": -27.977542877197266, "global_step": 509420, "epoch": 6137} {"train_loss": -27.90594482421875, "global_step": 509421, "epoch": 6137} {"train_loss": -27.4862060546875, "global_step": 509422, "epoch": 6137} {"train_loss": -27.7801513671875, "global_step": 509423, "epoch": 6137} {"train_loss": -27.43446159362793, "global_step": 509424, "epoch": 6137} {"train_loss": -27.80726432800293, "global_step": 509425, "epoch": 6137} {"train_loss": -27.661848068237305, "global_step": 509426, "epoch": 6137} {"train_loss": -27.794401168823242, "global_step": 509427, "epoch": 6137} {"train_loss": -28.023725509643555, "global_step": 509428, "epoch": 6137} {"train_loss": -27.74464225769043, "global_step": 509429, "epoch": 6137} {"train_loss": -27.427936553955078, "global_step": 509430, "epoch": 6137} {"train_loss": -28.099035263061523, "global_step": 509431, "epoch": 6137} {"train_loss": -27.0631160736084, "global_step": 509432, "epoch": 6137} {"train_loss": -27.1939697265625, "global_step": 509433, "epoch": 6137} {"train_loss": -26.773895263671875, "global_step": 509434, "epoch": 6137} {"train_loss": -26.134958267211914, "global_step": 509435, "epoch": 6137} {"train_loss": -25.6068115234375, "global_step": 509436, "epoch": 6137} {"train_loss": -26.513898849487305, "global_step": 509437, "epoch": 6137} {"train_loss": -27.463781356811523, "global_step": 509438, "epoch": 6137} {"train_loss": -27.40398597717285, "global_step": 509439, "epoch": 6137} {"train_loss": -27.0119686126709, "global_step": 509440, "epoch": 6137} {"train_loss": -26.580951690673828, "global_step": 509441, "epoch": 6137} {"train_loss": -27.231189727783203, "global_step": 509442, "epoch": 6137} {"train_loss": -27.227094650268555, "global_step": 509443, "epoch": 6137} {"train_loss": -26.794269561767578, "global_step": 509444, "epoch": 6137} {"train_loss": -27.534244537353516, "global_step": 509445, "epoch": 6137} {"train_loss": -27.011987686157227, "global_step": 509446, "epoch": 6137} {"train_loss": -27.009363174438477, "global_step": 509447, "epoch": 6137} {"train_loss": -26.723371505737305, "global_step": 509448, "epoch": 6137} {"train_loss": -27.045068740844727, "global_step": 509449, "epoch": 6137} {"train_loss": -27.384923934936523, "global_step": 509450, "epoch": 6137} {"train_loss": -26.9093017578125, "global_step": 509451, "epoch": 6137} {"train_loss": -27.415441513061523, "global_step": 509452, "epoch": 6137} {"train_loss": -27.20101101427193, "global_step": 509453, "epoch": 6137, "val_loss": 6502866.5} {"train_loss": -26.60902214050293, "global_step": 509454, "epoch": 6138} {"train_loss": -27.347471237182617, "global_step": 509455, "epoch": 6138} {"train_loss": -27.09034538269043, "global_step": 509456, "epoch": 6138} {"train_loss": -27.24053955078125, "global_step": 509457, "epoch": 6138} {"train_loss": -26.7889461517334, "global_step": 509458, "epoch": 6138} {"train_loss": -27.1097412109375, "global_step": 509459, "epoch": 6138} {"train_loss": -27.12969398498535, "global_step": 509460, "epoch": 6138} {"train_loss": -27.248905181884766, "global_step": 509461, "epoch": 6138} {"train_loss": -26.752416610717773, "global_step": 509462, "epoch": 6138} {"train_loss": -27.13934898376465, "global_step": 509463, "epoch": 6138} {"train_loss": -26.980487823486328, "global_step": 509464, "epoch": 6138} {"train_loss": -26.606176376342773, "global_step": 509465, "epoch": 6138} {"train_loss": -26.943836212158203, "global_step": 509466, "epoch": 6138} {"train_loss": -27.251550674438477, "global_step": 509467, "epoch": 6138} {"train_loss": -27.431020736694336, "global_step": 509468, "epoch": 6138} {"train_loss": -27.08953285217285, "global_step": 509469, "epoch": 6138} {"train_loss": -27.043394088745117, "global_step": 509470, "epoch": 6138} {"train_loss": -27.43461036682129, "global_step": 509471, "epoch": 6138} {"train_loss": -27.554590225219727, "global_step": 509472, "epoch": 6138} {"train_loss": -27.709863662719727, "global_step": 509473, "epoch": 6138} {"train_loss": -27.40308952331543, "global_step": 509474, "epoch": 6138} {"train_loss": -27.54901695251465, "global_step": 509475, "epoch": 6138} {"train_loss": -27.18208122253418, "global_step": 509476, "epoch": 6138} {"train_loss": -27.10848045349121, "global_step": 509477, "epoch": 6138} {"train_loss": -27.410375595092773, "global_step": 509478, "epoch": 6138} {"train_loss": -27.65680503845215, "global_step": 509479, "epoch": 6138} {"train_loss": -27.15464210510254, "global_step": 509480, "epoch": 6138} {"train_loss": -26.92133903503418, "global_step": 509481, "epoch": 6138} {"train_loss": -27.32839012145996, "global_step": 509482, "epoch": 6138} {"train_loss": -27.50339698791504, "global_step": 509483, "epoch": 6138} {"train_loss": -27.338891983032227, "global_step": 509484, "epoch": 6138} {"train_loss": -27.258092880249023, "global_step": 509485, "epoch": 6138} {"train_loss": -27.32269287109375, "global_step": 509486, "epoch": 6138} {"train_loss": -27.710453033447266, "global_step": 509487, "epoch": 6138} {"train_loss": -27.445154190063477, "global_step": 509488, "epoch": 6138} {"train_loss": -27.817047119140625, "global_step": 509489, "epoch": 6138} {"train_loss": -27.714984893798828, "global_step": 509490, "epoch": 6138} {"train_loss": -27.370466232299805, "global_step": 509491, "epoch": 6138} {"train_loss": -27.4331111907959, "global_step": 509492, "epoch": 6138} {"train_loss": -27.558862686157227, "global_step": 509493, "epoch": 6138} {"train_loss": -27.43984031677246, "global_step": 509494, "epoch": 6138} {"train_loss": -27.638202667236328, "global_step": 509495, "epoch": 6138} {"train_loss": -27.694732666015625, "global_step": 509496, "epoch": 6138} {"train_loss": -27.785627365112305, "global_step": 509497, "epoch": 6138} {"train_loss": -27.647485733032227, "global_step": 509498, "epoch": 6138} {"train_loss": -27.582977294921875, "global_step": 509499, "epoch": 6138} {"train_loss": -27.434040069580078, "global_step": 509500, "epoch": 6138} {"train_loss": -27.033828735351562, "global_step": 509501, "epoch": 6138} {"train_loss": -27.806961059570312, "global_step": 509502, "epoch": 6138} {"train_loss": -27.402389526367188, "global_step": 509503, "epoch": 6138} {"train_loss": -27.7014102935791, "global_step": 509504, "epoch": 6138} {"train_loss": -27.45631980895996, "global_step": 509505, "epoch": 6138} {"train_loss": -27.655197143554688, "global_step": 509506, "epoch": 6138} {"train_loss": -27.69585609436035, "global_step": 509507, "epoch": 6138} {"train_loss": -27.35807228088379, "global_step": 509508, "epoch": 6138} {"train_loss": -27.13348388671875, "global_step": 509509, "epoch": 6138} {"train_loss": -27.48432731628418, "global_step": 509510, "epoch": 6138} {"train_loss": -27.401159286499023, "global_step": 509511, "epoch": 6138} {"train_loss": -27.383392333984375, "global_step": 509512, "epoch": 6138} {"train_loss": -27.109100341796875, "global_step": 509513, "epoch": 6138} {"train_loss": -27.8062686920166, "global_step": 509514, "epoch": 6138} {"train_loss": -27.812183380126953, "global_step": 509515, "epoch": 6138} {"train_loss": -27.699188232421875, "global_step": 509516, "epoch": 6138} {"train_loss": -27.157434463500977, "global_step": 509517, "epoch": 6138} {"train_loss": -27.54422378540039, "global_step": 509518, "epoch": 6138} {"train_loss": -27.241302490234375, "global_step": 509519, "epoch": 6138} {"train_loss": -27.325763702392578, "global_step": 509520, "epoch": 6138} {"train_loss": -27.6237735748291, "global_step": 509521, "epoch": 6138} {"train_loss": -27.226520538330078, "global_step": 509522, "epoch": 6138} {"train_loss": -27.415088653564453, "global_step": 509523, "epoch": 6138} {"train_loss": -27.189117431640625, "global_step": 509524, "epoch": 6138} {"train_loss": -27.316314697265625, "global_step": 509525, "epoch": 6138} {"train_loss": -27.246320724487305, "global_step": 509526, "epoch": 6138} {"train_loss": -27.29974365234375, "global_step": 509527, "epoch": 6138} {"train_loss": -27.551252365112305, "global_step": 509528, "epoch": 6138} {"train_loss": -27.30319595336914, "global_step": 509529, "epoch": 6138} {"train_loss": -26.736181259155273, "global_step": 509530, "epoch": 6138} {"train_loss": -27.23453140258789, "global_step": 509531, "epoch": 6138} {"train_loss": -27.2130184173584, "global_step": 509532, "epoch": 6138} {"train_loss": -26.620502471923828, "global_step": 509533, "epoch": 6138} {"train_loss": -27.550073623657227, "global_step": 509534, "epoch": 6138} {"train_loss": -26.996051788330078, "global_step": 509535, "epoch": 6138} {"train_loss": -27.34055532892066, "global_step": 509536, "epoch": 6138, "val_loss": 6677662.0} {"train_loss": -24.985692977905273, "global_step": 509537, "epoch": 6139} {"train_loss": -25.8815975189209, "global_step": 509538, "epoch": 6139} {"train_loss": -26.511123657226562, "global_step": 509539, "epoch": 6139} {"train_loss": -26.29547119140625, "global_step": 509540, "epoch": 6139} {"train_loss": -26.47052001953125, "global_step": 509541, "epoch": 6139} {"train_loss": -26.221435546875, "global_step": 509542, "epoch": 6139} {"train_loss": -26.626129150390625, "global_step": 509543, "epoch": 6139} {"train_loss": -26.777318954467773, "global_step": 509544, "epoch": 6139} {"train_loss": -26.91522789001465, "global_step": 509545, "epoch": 6139} {"train_loss": -26.832807540893555, "global_step": 509546, "epoch": 6139} {"train_loss": -26.80072021484375, "global_step": 509547, "epoch": 6139} {"train_loss": -27.014678955078125, "global_step": 509548, "epoch": 6139} {"train_loss": -26.7023983001709, "global_step": 509549, "epoch": 6139} {"train_loss": -26.512048721313477, "global_step": 509550, "epoch": 6139} {"train_loss": -26.9350643157959, "global_step": 509551, "epoch": 6139} {"train_loss": -26.8872127532959, "global_step": 509552, "epoch": 6139} {"train_loss": -27.21955680847168, "global_step": 509553, "epoch": 6139} {"train_loss": -27.127756118774414, "global_step": 509554, "epoch": 6139} {"train_loss": -27.178516387939453, "global_step": 509555, "epoch": 6139} {"train_loss": -27.066192626953125, "global_step": 509556, "epoch": 6139} {"train_loss": -27.334814071655273, "global_step": 509557, "epoch": 6139} {"train_loss": -27.40363121032715, "global_step": 509558, "epoch": 6139} {"train_loss": -27.232446670532227, "global_step": 509559, "epoch": 6139} {"train_loss": -27.228849411010742, "global_step": 509560, "epoch": 6139} {"train_loss": -27.186569213867188, "global_step": 509561, "epoch": 6139} {"train_loss": -27.27022361755371, "global_step": 509562, "epoch": 6139} {"train_loss": -27.195280075073242, "global_step": 509563, "epoch": 6139} {"train_loss": -27.281497955322266, "global_step": 509564, "epoch": 6139} {"train_loss": -26.915637969970703, "global_step": 509565, "epoch": 6139} {"train_loss": -27.209936141967773, "global_step": 509566, "epoch": 6139} {"train_loss": -27.391931533813477, "global_step": 509567, "epoch": 6139} {"train_loss": -27.501972198486328, "global_step": 509568, "epoch": 6139} {"train_loss": -27.389448165893555, "global_step": 509569, "epoch": 6139} {"train_loss": -27.606201171875, "global_step": 509570, "epoch": 6139} {"train_loss": -27.176435470581055, "global_step": 509571, "epoch": 6139} {"train_loss": -27.092182159423828, "global_step": 509572, "epoch": 6139} {"train_loss": -27.47513198852539, "global_step": 509573, "epoch": 6139} {"train_loss": -27.461660385131836, "global_step": 509574, "epoch": 6139} {"train_loss": -27.392047882080078, "global_step": 509575, "epoch": 6139} {"train_loss": -27.602832794189453, "global_step": 509576, "epoch": 6139} {"train_loss": -27.671253204345703, "global_step": 509577, "epoch": 6139} {"train_loss": -27.518651962280273, "global_step": 509578, "epoch": 6139} {"train_loss": -27.360645294189453, "global_step": 509579, "epoch": 6139} {"train_loss": -27.613000869750977, "global_step": 509580, "epoch": 6139} {"train_loss": -27.484039306640625, "global_step": 509581, "epoch": 6139} {"train_loss": -27.80426597595215, "global_step": 509582, "epoch": 6139} {"train_loss": -27.4730167388916, "global_step": 509583, "epoch": 6139} {"train_loss": -27.162805557250977, "global_step": 509584, "epoch": 6139} {"train_loss": -27.71541404724121, "global_step": 509585, "epoch": 6139} {"train_loss": -27.6190185546875, "global_step": 509586, "epoch": 6139} {"train_loss": -27.392852783203125, "global_step": 509587, "epoch": 6139} {"train_loss": -27.526880264282227, "global_step": 509588, "epoch": 6139} {"train_loss": -27.351293563842773, "global_step": 509589, "epoch": 6139} {"train_loss": -27.855798721313477, "global_step": 509590, "epoch": 6139} {"train_loss": -27.49167823791504, "global_step": 509591, "epoch": 6139} {"train_loss": -27.475290298461914, "global_step": 509592, "epoch": 6139} {"train_loss": -27.319311141967773, "global_step": 509593, "epoch": 6139} {"train_loss": -26.18299674987793, "global_step": 509594, "epoch": 6139} {"train_loss": -25.54812240600586, "global_step": 509595, "epoch": 6139} {"train_loss": -24.951107025146484, "global_step": 509596, "epoch": 6139} {"train_loss": -26.429855346679688, "global_step": 509597, "epoch": 6139} {"train_loss": -26.847183227539062, "global_step": 509598, "epoch": 6139} {"train_loss": -26.91884422302246, "global_step": 509599, "epoch": 6139} {"train_loss": -26.929168701171875, "global_step": 509600, "epoch": 6139} {"train_loss": -26.335126876831055, "global_step": 509601, "epoch": 6139} {"train_loss": -27.10772132873535, "global_step": 509602, "epoch": 6139} {"train_loss": -26.45953941345215, "global_step": 509603, "epoch": 6139} {"train_loss": -26.996992111206055, "global_step": 509604, "epoch": 6139} {"train_loss": -27.22747802734375, "global_step": 509605, "epoch": 6139} {"train_loss": -27.058349609375, "global_step": 509606, "epoch": 6139} {"train_loss": -27.44757652282715, "global_step": 509607, "epoch": 6139} {"train_loss": -27.324140548706055, "global_step": 509608, "epoch": 6139} {"train_loss": -27.35297203063965, "global_step": 509609, "epoch": 6139} {"train_loss": -27.20711326599121, "global_step": 509610, "epoch": 6139} {"train_loss": -27.39166259765625, "global_step": 509611, "epoch": 6139} {"train_loss": -27.278305053710938, "global_step": 509612, "epoch": 6139} {"train_loss": -27.01338005065918, "global_step": 509613, "epoch": 6139} {"train_loss": -27.474889755249023, "global_step": 509614, "epoch": 6139} {"train_loss": -27.452728271484375, "global_step": 509615, "epoch": 6139} {"train_loss": -27.4570369720459, "global_step": 509616, "epoch": 6139} {"train_loss": -27.499494552612305, "global_step": 509617, "epoch": 6139} {"train_loss": -27.2769832611084, "global_step": 509618, "epoch": 6139} {"train_loss": -27.078748197440643, "global_step": 509619, "epoch": 6139, "val_loss": 6558700.0} {"train_loss": -26.997594833374023, "global_step": 509620, "epoch": 6140} {"train_loss": -27.49686622619629, "global_step": 509621, "epoch": 6140} {"train_loss": -27.32695960998535, "global_step": 509622, "epoch": 6140} {"train_loss": -27.2890682220459, "global_step": 509623, "epoch": 6140} {"train_loss": -27.040815353393555, "global_step": 509624, "epoch": 6140} {"train_loss": -27.221973419189453, "global_step": 509625, "epoch": 6140} {"train_loss": -27.15814781188965, "global_step": 509626, "epoch": 6140} {"train_loss": -27.267230987548828, "global_step": 509627, "epoch": 6140} {"train_loss": -27.36223793029785, "global_step": 509628, "epoch": 6140} {"train_loss": -26.91274070739746, "global_step": 509629, "epoch": 6140} {"train_loss": -27.405447006225586, "global_step": 509630, "epoch": 6140} {"train_loss": -27.758819580078125, "global_step": 509631, "epoch": 6140} {"train_loss": -27.4528865814209, "global_step": 509632, "epoch": 6140} {"train_loss": -27.25239372253418, "global_step": 509633, "epoch": 6140} {"train_loss": -27.673871994018555, "global_step": 509634, "epoch": 6140} {"train_loss": -27.2908992767334, "global_step": 509635, "epoch": 6140} {"train_loss": -27.255170822143555, "global_step": 509636, "epoch": 6140} {"train_loss": -27.462127685546875, "global_step": 509637, "epoch": 6140} {"train_loss": -27.64642906188965, "global_step": 509638, "epoch": 6140} {"train_loss": -27.396677017211914, "global_step": 509639, "epoch": 6140} {"train_loss": -27.584272384643555, "global_step": 509640, "epoch": 6140} {"train_loss": -27.50542640686035, "global_step": 509641, "epoch": 6140} {"train_loss": -27.61335563659668, "global_step": 509642, "epoch": 6140} {"train_loss": -27.649158477783203, "global_step": 509643, "epoch": 6140} {"train_loss": -27.525409698486328, "global_step": 509644, "epoch": 6140} {"train_loss": -26.785398483276367, "global_step": 509645, "epoch": 6140} {"train_loss": -27.533645629882812, "global_step": 509646, "epoch": 6140} {"train_loss": -27.469806671142578, "global_step": 509647, "epoch": 6140} {"train_loss": -27.622182846069336, "global_step": 509648, "epoch": 6140} {"train_loss": -27.230804443359375, "global_step": 509649, "epoch": 6140} {"train_loss": -27.81022071838379, "global_step": 509650, "epoch": 6140} {"train_loss": -27.429275512695312, "global_step": 509651, "epoch": 6140} {"train_loss": -27.76604652404785, "global_step": 509652, "epoch": 6140} {"train_loss": -27.370014190673828, "global_step": 509653, "epoch": 6140} {"train_loss": -27.384143829345703, "global_step": 509654, "epoch": 6140} {"train_loss": -27.82941246032715, "global_step": 509655, "epoch": 6140} {"train_loss": -27.6143741607666, "global_step": 509656, "epoch": 6140} {"train_loss": -27.598175048828125, "global_step": 509657, "epoch": 6140} {"train_loss": -27.25437355041504, "global_step": 509658, "epoch": 6140} {"train_loss": -28.000158309936523, "global_step": 509659, "epoch": 6140} {"train_loss": -27.783227920532227, "global_step": 509660, "epoch": 6140} {"train_loss": -27.62017822265625, "global_step": 509661, "epoch": 6140} {"train_loss": -27.660064697265625, "global_step": 509662, "epoch": 6140} {"train_loss": -27.576873779296875, "global_step": 509663, "epoch": 6140} {"train_loss": -27.866785049438477, "global_step": 509664, "epoch": 6140} {"train_loss": -27.445409774780273, "global_step": 509665, "epoch": 6140} {"train_loss": -27.851364135742188, "global_step": 509666, "epoch": 6140} {"train_loss": -27.532697677612305, "global_step": 509667, "epoch": 6140} {"train_loss": -27.807270050048828, "global_step": 509668, "epoch": 6140} {"train_loss": -27.365524291992188, "global_step": 509669, "epoch": 6140} {"train_loss": -27.735965728759766, "global_step": 509670, "epoch": 6140} {"train_loss": -27.1682186126709, "global_step": 509671, "epoch": 6140} {"train_loss": -27.353300094604492, "global_step": 509672, "epoch": 6140} {"train_loss": -27.3132266998291, "global_step": 509673, "epoch": 6140} {"train_loss": -27.477262496948242, "global_step": 509674, "epoch": 6140} {"train_loss": -27.301334381103516, "global_step": 509675, "epoch": 6140} {"train_loss": -27.645349502563477, "global_step": 509676, "epoch": 6140} {"train_loss": -27.340356826782227, "global_step": 509677, "epoch": 6140} {"train_loss": -27.858694076538086, "global_step": 509678, "epoch": 6140} {"train_loss": -27.68924903869629, "global_step": 509679, "epoch": 6140} {"train_loss": -27.640583038330078, "global_step": 509680, "epoch": 6140} {"train_loss": -27.431516647338867, "global_step": 509681, "epoch": 6140} {"train_loss": -27.742176055908203, "global_step": 509682, "epoch": 6140} {"train_loss": -27.49383544921875, "global_step": 509683, "epoch": 6140} {"train_loss": -28.0014591217041, "global_step": 509684, "epoch": 6140} {"train_loss": -27.382192611694336, "global_step": 509685, "epoch": 6140} {"train_loss": -27.871381759643555, "global_step": 509686, "epoch": 6140} {"train_loss": -28.014623641967773, "global_step": 509687, "epoch": 6140} {"train_loss": -27.4948673248291, "global_step": 509688, "epoch": 6140} {"train_loss": -27.515167236328125, "global_step": 509689, "epoch": 6140} {"train_loss": -27.748077392578125, "global_step": 509690, "epoch": 6140} {"train_loss": -27.422224044799805, "global_step": 509691, "epoch": 6140} {"train_loss": -27.6396427154541, "global_step": 509692, "epoch": 6140} {"train_loss": -27.48603630065918, "global_step": 509693, "epoch": 6140} {"train_loss": -27.10304832458496, "global_step": 509694, "epoch": 6140} {"train_loss": -27.2066593170166, "global_step": 509695, "epoch": 6140} {"train_loss": -27.867719650268555, "global_step": 509696, "epoch": 6140} {"train_loss": -27.719013214111328, "global_step": 509697, "epoch": 6140} {"train_loss": -27.882984161376953, "global_step": 509698, "epoch": 6140} {"train_loss": -27.11151695251465, "global_step": 509699, "epoch": 6140} {"train_loss": -26.298871994018555, "global_step": 509700, "epoch": 6140} {"train_loss": -26.119770050048828, "global_step": 509701, "epoch": 6140} {"train_loss": -27.449237180043415, "global_step": 509702, "epoch": 6140, "val_loss": 6612834.0} {"train_loss": -26.181415557861328, "global_step": 509703, "epoch": 6141} {"train_loss": -25.45349884033203, "global_step": 509704, "epoch": 6141} {"train_loss": -25.951847076416016, "global_step": 509705, "epoch": 6141} {"train_loss": -26.446813583374023, "global_step": 509706, "epoch": 6141} {"train_loss": -25.466562271118164, "global_step": 509707, "epoch": 6141} {"train_loss": -25.977069854736328, "global_step": 509708, "epoch": 6141} {"train_loss": -26.109617233276367, "global_step": 509709, "epoch": 6141} {"train_loss": -26.134998321533203, "global_step": 509710, "epoch": 6141} {"train_loss": -26.507781982421875, "global_step": 509711, "epoch": 6141} {"train_loss": -26.231281280517578, "global_step": 509712, "epoch": 6141} {"train_loss": -26.47873306274414, "global_step": 509713, "epoch": 6141} {"train_loss": -26.15164566040039, "global_step": 509714, "epoch": 6141} {"train_loss": -26.675046920776367, "global_step": 509715, "epoch": 6141} {"train_loss": -26.51498794555664, "global_step": 509716, "epoch": 6141} {"train_loss": -26.4011173248291, "global_step": 509717, "epoch": 6141} {"train_loss": -26.520404815673828, "global_step": 509718, "epoch": 6141} {"train_loss": -26.940160751342773, "global_step": 509719, "epoch": 6141} {"train_loss": -26.84881019592285, "global_step": 509720, "epoch": 6141} {"train_loss": -26.78955078125, "global_step": 509721, "epoch": 6141} {"train_loss": -26.337797164916992, "global_step": 509722, "epoch": 6141} {"train_loss": -26.771512985229492, "global_step": 509723, "epoch": 6141} {"train_loss": -27.0189266204834, "global_step": 509724, "epoch": 6141} {"train_loss": -26.324481964111328, "global_step": 509725, "epoch": 6141} {"train_loss": -26.853687286376953, "global_step": 509726, "epoch": 6141} {"train_loss": -26.763845443725586, "global_step": 509727, "epoch": 6141} {"train_loss": -26.9957332611084, "global_step": 509728, "epoch": 6141} {"train_loss": -26.989887237548828, "global_step": 509729, "epoch": 6141} {"train_loss": -27.604124069213867, "global_step": 509730, "epoch": 6141} {"train_loss": -27.129377365112305, "global_step": 509731, "epoch": 6141} {"train_loss": -27.37494468688965, "global_step": 509732, "epoch": 6141} {"train_loss": -27.25416374206543, "global_step": 509733, "epoch": 6141} {"train_loss": -27.32288932800293, "global_step": 509734, "epoch": 6141} {"train_loss": -27.251752853393555, "global_step": 509735, "epoch": 6141} {"train_loss": -26.940542221069336, "global_step": 509736, "epoch": 6141} {"train_loss": -27.183761596679688, "global_step": 509737, "epoch": 6141} {"train_loss": -26.859960556030273, "global_step": 509738, "epoch": 6141} {"train_loss": -27.19003677368164, "global_step": 509739, "epoch": 6141} {"train_loss": -27.503955841064453, "global_step": 509740, "epoch": 6141} {"train_loss": -27.539960861206055, "global_step": 509741, "epoch": 6141} {"train_loss": -27.43621253967285, "global_step": 509742, "epoch": 6141} {"train_loss": -27.57557487487793, "global_step": 509743, "epoch": 6141} {"train_loss": -27.586410522460938, "global_step": 509744, "epoch": 6141} {"train_loss": -27.38568115234375, "global_step": 509745, "epoch": 6141} {"train_loss": -27.59701919555664, "global_step": 509746, "epoch": 6141} {"train_loss": -27.46958351135254, "global_step": 509747, "epoch": 6141} {"train_loss": -27.372251510620117, "global_step": 509748, "epoch": 6141} {"train_loss": -27.665552139282227, "global_step": 509749, "epoch": 6141} {"train_loss": -27.929462432861328, "global_step": 509750, "epoch": 6141} {"train_loss": -27.584379196166992, "global_step": 509751, "epoch": 6141} {"train_loss": -27.844573974609375, "global_step": 509752, "epoch": 6141} {"train_loss": -27.800683975219727, "global_step": 509753, "epoch": 6141} {"train_loss": -27.6000919342041, "global_step": 509754, "epoch": 6141} {"train_loss": -27.64729881286621, "global_step": 509755, "epoch": 6141} {"train_loss": -27.57852554321289, "global_step": 509756, "epoch": 6141} {"train_loss": -27.387969970703125, "global_step": 509757, "epoch": 6141} {"train_loss": -27.602140426635742, "global_step": 509758, "epoch": 6141} {"train_loss": -27.625165939331055, "global_step": 509759, "epoch": 6141} {"train_loss": -27.610748291015625, "global_step": 509760, "epoch": 6141} {"train_loss": -27.426939010620117, "global_step": 509761, "epoch": 6141} {"train_loss": -27.69289207458496, "global_step": 509762, "epoch": 6141} {"train_loss": -27.609952926635742, "global_step": 509763, "epoch": 6141} {"train_loss": -27.720022201538086, "global_step": 509764, "epoch": 6141} {"train_loss": -27.656482696533203, "global_step": 509765, "epoch": 6141} {"train_loss": -27.582809448242188, "global_step": 509766, "epoch": 6141} {"train_loss": -27.8173885345459, "global_step": 509767, "epoch": 6141} {"train_loss": -27.604053497314453, "global_step": 509768, "epoch": 6141} {"train_loss": -27.528470993041992, "global_step": 509769, "epoch": 6141} {"train_loss": -27.709360122680664, "global_step": 509770, "epoch": 6141} {"train_loss": -27.543472290039062, "global_step": 509771, "epoch": 6141} {"train_loss": -27.484542846679688, "global_step": 509772, "epoch": 6141} {"train_loss": -27.798053741455078, "global_step": 509773, "epoch": 6141} {"train_loss": -27.64923667907715, "global_step": 509774, "epoch": 6141} {"train_loss": -27.8442440032959, "global_step": 509775, "epoch": 6141} {"train_loss": -27.3741455078125, "global_step": 509776, "epoch": 6141} {"train_loss": -27.302534103393555, "global_step": 509777, "epoch": 6141} {"train_loss": -27.427839279174805, "global_step": 509778, "epoch": 6141} {"train_loss": -27.430349349975586, "global_step": 509779, "epoch": 6141} {"train_loss": -27.186853408813477, "global_step": 509780, "epoch": 6141} {"train_loss": -26.946121215820312, "global_step": 509781, "epoch": 6141} {"train_loss": -27.551115036010742, "global_step": 509782, "epoch": 6141} {"train_loss": -26.894824981689453, "global_step": 509783, "epoch": 6141} {"train_loss": -27.648040771484375, "global_step": 509784, "epoch": 6141} {"train_loss": -27.170559733746998, "global_step": 509785, "epoch": 6141, "val_loss": 6460163.0} {"train_loss": -26.098005294799805, "global_step": 509786, "epoch": 6142} {"train_loss": -26.826547622680664, "global_step": 509787, "epoch": 6142} {"train_loss": -26.264514923095703, "global_step": 509788, "epoch": 6142} {"train_loss": -25.94830322265625, "global_step": 509789, "epoch": 6142} {"train_loss": -25.8640193939209, "global_step": 509790, "epoch": 6142} {"train_loss": -27.117177963256836, "global_step": 509791, "epoch": 6142} {"train_loss": -25.81390953063965, "global_step": 509792, "epoch": 6142} {"train_loss": -26.427282333374023, "global_step": 509793, "epoch": 6142} {"train_loss": -26.774463653564453, "global_step": 509794, "epoch": 6142} {"train_loss": -26.652738571166992, "global_step": 509795, "epoch": 6142} {"train_loss": -26.461334228515625, "global_step": 509796, "epoch": 6142} {"train_loss": -26.65180778503418, "global_step": 509797, "epoch": 6142} {"train_loss": -26.70635414123535, "global_step": 509798, "epoch": 6142} {"train_loss": -26.193689346313477, "global_step": 509799, "epoch": 6142} {"train_loss": -27.045150756835938, "global_step": 509800, "epoch": 6142} {"train_loss": -26.71355628967285, "global_step": 509801, "epoch": 6142} {"train_loss": -26.777936935424805, "global_step": 509802, "epoch": 6142} {"train_loss": -26.980451583862305, "global_step": 509803, "epoch": 6142} {"train_loss": -26.975341796875, "global_step": 509804, "epoch": 6142} {"train_loss": -26.81277847290039, "global_step": 509805, "epoch": 6142} {"train_loss": -27.097314834594727, "global_step": 509806, "epoch": 6142} {"train_loss": -27.153640747070312, "global_step": 509807, "epoch": 6142} {"train_loss": -27.09747886657715, "global_step": 509808, "epoch": 6142} {"train_loss": -27.4460506439209, "global_step": 509809, "epoch": 6142} {"train_loss": -27.227094650268555, "global_step": 509810, "epoch": 6142} {"train_loss": -27.16796875, "global_step": 509811, "epoch": 6142} {"train_loss": -26.698827743530273, "global_step": 509812, "epoch": 6142} {"train_loss": -27.4055118560791, "global_step": 509813, "epoch": 6142} {"train_loss": -26.961536407470703, "global_step": 509814, "epoch": 6142} {"train_loss": -26.849658966064453, "global_step": 509815, "epoch": 6142} {"train_loss": -26.544565200805664, "global_step": 509816, "epoch": 6142} {"train_loss": -27.043262481689453, "global_step": 509817, "epoch": 6142} {"train_loss": -27.05991554260254, "global_step": 509818, "epoch": 6142} {"train_loss": -27.194562911987305, "global_step": 509819, "epoch": 6142} {"train_loss": -27.358915328979492, "global_step": 509820, "epoch": 6142} {"train_loss": -27.354248046875, "global_step": 509821, "epoch": 6142} {"train_loss": -27.313953399658203, "global_step": 509822, "epoch": 6142} {"train_loss": -27.52247428894043, "global_step": 509823, "epoch": 6142} {"train_loss": -27.035390853881836, "global_step": 509824, "epoch": 6142} {"train_loss": -27.455137252807617, "global_step": 509825, "epoch": 6142} {"train_loss": -27.7468204498291, "global_step": 509826, "epoch": 6142} {"train_loss": -27.35028076171875, "global_step": 509827, "epoch": 6142} {"train_loss": -27.221790313720703, "global_step": 509828, "epoch": 6142} {"train_loss": -27.175146102905273, "global_step": 509829, "epoch": 6142} {"train_loss": -27.360212326049805, "global_step": 509830, "epoch": 6142} {"train_loss": -27.549423217773438, "global_step": 509831, "epoch": 6142} {"train_loss": -27.82868766784668, "global_step": 509832, "epoch": 6142} {"train_loss": -27.533554077148438, "global_step": 509833, "epoch": 6142} {"train_loss": -27.482196807861328, "global_step": 509834, "epoch": 6142} {"train_loss": -27.454320907592773, "global_step": 509835, "epoch": 6142} {"train_loss": -27.924264907836914, "global_step": 509836, "epoch": 6142} {"train_loss": -27.64045524597168, "global_step": 509837, "epoch": 6142} {"train_loss": -27.62811851501465, "global_step": 509838, "epoch": 6142} {"train_loss": -27.777923583984375, "global_step": 509839, "epoch": 6142} {"train_loss": -27.62150001525879, "global_step": 509840, "epoch": 6142} {"train_loss": -27.137958526611328, "global_step": 509841, "epoch": 6142} {"train_loss": -27.68255043029785, "global_step": 509842, "epoch": 6142} {"train_loss": -27.48301124572754, "global_step": 509843, "epoch": 6142} {"train_loss": -27.505781173706055, "global_step": 509844, "epoch": 6142} {"train_loss": -27.805150985717773, "global_step": 509845, "epoch": 6142} {"train_loss": -27.353559494018555, "global_step": 509846, "epoch": 6142} {"train_loss": -27.4178524017334, "global_step": 509847, "epoch": 6142} {"train_loss": -27.699277877807617, "global_step": 509848, "epoch": 6142} {"train_loss": -27.393238067626953, "global_step": 509849, "epoch": 6142} {"train_loss": -27.665771484375, "global_step": 509850, "epoch": 6142} {"train_loss": -27.448877334594727, "global_step": 509851, "epoch": 6142} {"train_loss": -27.199079513549805, "global_step": 509852, "epoch": 6142} {"train_loss": -27.55208396911621, "global_step": 509853, "epoch": 6142} {"train_loss": -26.820301055908203, "global_step": 509854, "epoch": 6142} {"train_loss": -27.476455688476562, "global_step": 509855, "epoch": 6142} {"train_loss": -27.420827865600586, "global_step": 509856, "epoch": 6142} {"train_loss": -27.2634220123291, "global_step": 509857, "epoch": 6142} {"train_loss": -27.295866012573242, "global_step": 509858, "epoch": 6142} {"train_loss": -27.7832088470459, "global_step": 509859, "epoch": 6142} {"train_loss": -27.574140548706055, "global_step": 509860, "epoch": 6142} {"train_loss": -27.444013595581055, "global_step": 509861, "epoch": 6142} {"train_loss": -27.271869659423828, "global_step": 509862, "epoch": 6142} {"train_loss": -27.277545928955078, "global_step": 509863, "epoch": 6142} {"train_loss": -27.51999855041504, "global_step": 509864, "epoch": 6142} {"train_loss": -27.50787925720215, "global_step": 509865, "epoch": 6142} {"train_loss": -27.437423706054688, "global_step": 509866, "epoch": 6142} {"train_loss": -27.698110580444336, "global_step": 509867, "epoch": 6142} {"train_loss": -27.192692216620387, "global_step": 509868, "epoch": 6142, "val_loss": 6552272.5} {"train_loss": -27.36494255065918, "global_step": 509869, "epoch": 6143} {"train_loss": -27.414047241210938, "global_step": 509870, "epoch": 6143} {"train_loss": -27.047321319580078, "global_step": 509871, "epoch": 6143} {"train_loss": -26.772714614868164, "global_step": 509872, "epoch": 6143} {"train_loss": -26.95142936706543, "global_step": 509873, "epoch": 6143} {"train_loss": -26.749469757080078, "global_step": 509874, "epoch": 6143} {"train_loss": -27.191877365112305, "global_step": 509875, "epoch": 6143} {"train_loss": -27.243825912475586, "global_step": 509876, "epoch": 6143} {"train_loss": -27.176233291625977, "global_step": 509877, "epoch": 6143} {"train_loss": -27.01691246032715, "global_step": 509878, "epoch": 6143} {"train_loss": -26.84433364868164, "global_step": 509879, "epoch": 6143} {"train_loss": -27.037006378173828, "global_step": 509880, "epoch": 6143} {"train_loss": -26.96949577331543, "global_step": 509881, "epoch": 6143} {"train_loss": -27.123151779174805, "global_step": 509882, "epoch": 6143} {"train_loss": -26.937225341796875, "global_step": 509883, "epoch": 6143} {"train_loss": -27.22681999206543, "global_step": 509884, "epoch": 6143} {"train_loss": -27.049884796142578, "global_step": 509885, "epoch": 6143} {"train_loss": -27.277334213256836, "global_step": 509886, "epoch": 6143} {"train_loss": -27.270719528198242, "global_step": 509887, "epoch": 6143} {"train_loss": -27.1931209564209, "global_step": 509888, "epoch": 6143} {"train_loss": -27.169208526611328, "global_step": 509889, "epoch": 6143} {"train_loss": -27.271930694580078, "global_step": 509890, "epoch": 6143} {"train_loss": -27.160358428955078, "global_step": 509891, "epoch": 6143} {"train_loss": -27.317737579345703, "global_step": 509892, "epoch": 6143} {"train_loss": -27.476715087890625, "global_step": 509893, "epoch": 6143} {"train_loss": -27.4631404876709, "global_step": 509894, "epoch": 6143} {"train_loss": -27.545690536499023, "global_step": 509895, "epoch": 6143} {"train_loss": -26.98750114440918, "global_step": 509896, "epoch": 6143} {"train_loss": -27.46375846862793, "global_step": 509897, "epoch": 6143} {"train_loss": -27.10127830505371, "global_step": 509898, "epoch": 6143} {"train_loss": -27.442188262939453, "global_step": 509899, "epoch": 6143} {"train_loss": -27.306812286376953, "global_step": 509900, "epoch": 6143} {"train_loss": -27.577173233032227, "global_step": 509901, "epoch": 6143} {"train_loss": -27.566253662109375, "global_step": 509902, "epoch": 6143} {"train_loss": -27.555952072143555, "global_step": 509903, "epoch": 6143} {"train_loss": -27.543928146362305, "global_step": 509904, "epoch": 6143} {"train_loss": -27.552764892578125, "global_step": 509905, "epoch": 6143} {"train_loss": -27.647153854370117, "global_step": 509906, "epoch": 6143} {"train_loss": -27.367795944213867, "global_step": 509907, "epoch": 6143} {"train_loss": -27.346160888671875, "global_step": 509908, "epoch": 6143} {"train_loss": -27.737781524658203, "global_step": 509909, "epoch": 6143} {"train_loss": -27.71771240234375, "global_step": 509910, "epoch": 6143} {"train_loss": -27.762210845947266, "global_step": 509911, "epoch": 6143} {"train_loss": -27.641632080078125, "global_step": 509912, "epoch": 6143} {"train_loss": -27.765399932861328, "global_step": 509913, "epoch": 6143} {"train_loss": -27.735532760620117, "global_step": 509914, "epoch": 6143} {"train_loss": -27.8029727935791, "global_step": 509915, "epoch": 6143} {"train_loss": -27.639392852783203, "global_step": 509916, "epoch": 6143} {"train_loss": -27.561752319335938, "global_step": 509917, "epoch": 6143} {"train_loss": -27.592214584350586, "global_step": 509918, "epoch": 6143} {"train_loss": -27.411523818969727, "global_step": 509919, "epoch": 6143} {"train_loss": -27.74500846862793, "global_step": 509920, "epoch": 6143} {"train_loss": -27.537734985351562, "global_step": 509921, "epoch": 6143} {"train_loss": -27.530170440673828, "global_step": 509922, "epoch": 6143} {"train_loss": -28.05497169494629, "global_step": 509923, "epoch": 6143} {"train_loss": -27.600269317626953, "global_step": 509924, "epoch": 6143} {"train_loss": -27.786701202392578, "global_step": 509925, "epoch": 6143} {"train_loss": -27.48431968688965, "global_step": 509926, "epoch": 6143} {"train_loss": -27.750822067260742, "global_step": 509927, "epoch": 6143} {"train_loss": -27.227102279663086, "global_step": 509928, "epoch": 6143} {"train_loss": -27.41139030456543, "global_step": 509929, "epoch": 6143} {"train_loss": -27.4755802154541, "global_step": 509930, "epoch": 6143} {"train_loss": -27.973590850830078, "global_step": 509931, "epoch": 6143} {"train_loss": -27.71539878845215, "global_step": 509932, "epoch": 6143} {"train_loss": -28.112085342407227, "global_step": 509933, "epoch": 6143} {"train_loss": -27.393798828125, "global_step": 509934, "epoch": 6143} {"train_loss": -27.933935165405273, "global_step": 509935, "epoch": 6143} {"train_loss": -27.535476684570312, "global_step": 509936, "epoch": 6143} {"train_loss": -27.666528701782227, "global_step": 509937, "epoch": 6143} {"train_loss": -28.201507568359375, "global_step": 509938, "epoch": 6143} {"train_loss": -27.93047523498535, "global_step": 509939, "epoch": 6143} {"train_loss": -27.8592529296875, "global_step": 509940, "epoch": 6143} {"train_loss": -27.301843643188477, "global_step": 509941, "epoch": 6143} {"train_loss": -26.874425888061523, "global_step": 509942, "epoch": 6143} {"train_loss": -26.03132438659668, "global_step": 509943, "epoch": 6143} {"train_loss": -26.09779167175293, "global_step": 509944, "epoch": 6143} {"train_loss": -26.818695068359375, "global_step": 509945, "epoch": 6143} {"train_loss": -27.31268310546875, "global_step": 509946, "epoch": 6143} {"train_loss": -27.018756866455078, "global_step": 509947, "epoch": 6143} {"train_loss": -27.013315200805664, "global_step": 509948, "epoch": 6143} {"train_loss": -27.816381454467773, "global_step": 509949, "epoch": 6143} {"train_loss": -27.205846786499023, "global_step": 509950, "epoch": 6143} {"train_loss": -27.38438994625965, "global_step": 509951, "epoch": 6143, "val_loss": 6599067.0} {"train_loss": -26.586048126220703, "global_step": 509952, "epoch": 6144} {"train_loss": -26.90042495727539, "global_step": 509953, "epoch": 6144} {"train_loss": -26.641422271728516, "global_step": 509954, "epoch": 6144} {"train_loss": -26.92120361328125, "global_step": 509955, "epoch": 6144} {"train_loss": -26.414688110351562, "global_step": 509956, "epoch": 6144} {"train_loss": -26.859821319580078, "global_step": 509957, "epoch": 6144} {"train_loss": -26.62407875061035, "global_step": 509958, "epoch": 6144} {"train_loss": -26.840290069580078, "global_step": 509959, "epoch": 6144} {"train_loss": -26.612897872924805, "global_step": 509960, "epoch": 6144} {"train_loss": -27.098234176635742, "global_step": 509961, "epoch": 6144} {"train_loss": -26.850309371948242, "global_step": 509962, "epoch": 6144} {"train_loss": -27.037372589111328, "global_step": 509963, "epoch": 6144} {"train_loss": -26.924545288085938, "global_step": 509964, "epoch": 6144} {"train_loss": -26.900318145751953, "global_step": 509965, "epoch": 6144} {"train_loss": -27.152074813842773, "global_step": 509966, "epoch": 6144} {"train_loss": -27.2613468170166, "global_step": 509967, "epoch": 6144} {"train_loss": -26.76123046875, "global_step": 509968, "epoch": 6144} {"train_loss": -26.720569610595703, "global_step": 509969, "epoch": 6144} {"train_loss": -27.622222900390625, "global_step": 509970, "epoch": 6144} {"train_loss": -27.440155029296875, "global_step": 509971, "epoch": 6144} {"train_loss": -27.355417251586914, "global_step": 509972, "epoch": 6144} {"train_loss": -27.344593048095703, "global_step": 509973, "epoch": 6144} {"train_loss": -27.615554809570312, "global_step": 509974, "epoch": 6144} {"train_loss": -27.13703727722168, "global_step": 509975, "epoch": 6144} {"train_loss": -27.32489585876465, "global_step": 509976, "epoch": 6144} {"train_loss": -27.11911392211914, "global_step": 509977, "epoch": 6144} {"train_loss": -27.214862823486328, "global_step": 509978, "epoch": 6144} {"train_loss": -27.34912109375, "global_step": 509979, "epoch": 6144} {"train_loss": -27.031524658203125, "global_step": 509980, "epoch": 6144} {"train_loss": -27.24561882019043, "global_step": 509981, "epoch": 6144} {"train_loss": -27.299589157104492, "global_step": 509982, "epoch": 6144} {"train_loss": -27.47080421447754, "global_step": 509983, "epoch": 6144} {"train_loss": -27.2255859375, "global_step": 509984, "epoch": 6144} {"train_loss": -27.5513973236084, "global_step": 509985, "epoch": 6144} {"train_loss": -26.90622901916504, "global_step": 509986, "epoch": 6144} {"train_loss": -27.407712936401367, "global_step": 509987, "epoch": 6144} {"train_loss": -27.410459518432617, "global_step": 509988, "epoch": 6144} {"train_loss": -27.239704132080078, "global_step": 509989, "epoch": 6144} {"train_loss": -27.235843658447266, "global_step": 509990, "epoch": 6144} {"train_loss": -27.554224014282227, "global_step": 509991, "epoch": 6144} {"train_loss": -27.177988052368164, "global_step": 509992, "epoch": 6144} {"train_loss": -27.552001953125, "global_step": 509993, "epoch": 6144} {"train_loss": -27.23056411743164, "global_step": 509994, "epoch": 6144} {"train_loss": -27.37508201599121, "global_step": 509995, "epoch": 6144} {"train_loss": -27.665115356445312, "global_step": 509996, "epoch": 6144} {"train_loss": -27.395721435546875, "global_step": 509997, "epoch": 6144} {"train_loss": -27.49287986755371, "global_step": 509998, "epoch": 6144} {"train_loss": -27.889301300048828, "global_step": 509999, "epoch": 6144} {"train_loss": -27.745410919189453, "global_step": 510000, "epoch": 6144} {"train_loss": -27.147809982299805, "global_step": 510001, "epoch": 6144} {"train_loss": -27.714929580688477, "global_step": 510002, "epoch": 6144} {"train_loss": -27.694034576416016, "global_step": 510003, "epoch": 6144} {"train_loss": -27.566089630126953, "global_step": 510004, "epoch": 6144} {"train_loss": -27.682682037353516, "global_step": 510005, "epoch": 6144} {"train_loss": -27.741260528564453, "global_step": 510006, "epoch": 6144} {"train_loss": -27.588520050048828, "global_step": 510007, "epoch": 6144} {"train_loss": -27.72698402404785, "global_step": 510008, "epoch": 6144} {"train_loss": -27.704038619995117, "global_step": 510009, "epoch": 6144} {"train_loss": -27.568395614624023, "global_step": 510010, "epoch": 6144} {"train_loss": -27.716333389282227, "global_step": 510011, "epoch": 6144} {"train_loss": -27.451318740844727, "global_step": 510012, "epoch": 6144} {"train_loss": -27.618558883666992, "global_step": 510013, "epoch": 6144} {"train_loss": -27.484546661376953, "global_step": 510014, "epoch": 6144} {"train_loss": -27.292724609375, "global_step": 510015, "epoch": 6144} {"train_loss": -27.63288688659668, "global_step": 510016, "epoch": 6144} {"train_loss": -27.56849479675293, "global_step": 510017, "epoch": 6144} {"train_loss": -27.246936798095703, "global_step": 510018, "epoch": 6144} {"train_loss": -27.15513038635254, "global_step": 510019, "epoch": 6144} {"train_loss": -27.443683624267578, "global_step": 510020, "epoch": 6144} {"train_loss": -27.620450973510742, "global_step": 510021, "epoch": 6144} {"train_loss": -28.050628662109375, "global_step": 510022, "epoch": 6144} {"train_loss": -27.337743759155273, "global_step": 510023, "epoch": 6144} {"train_loss": -27.25542640686035, "global_step": 510024, "epoch": 6144} {"train_loss": -27.5046443939209, "global_step": 510025, "epoch": 6144} {"train_loss": -27.070953369140625, "global_step": 510026, "epoch": 6144} {"train_loss": -27.321063995361328, "global_step": 510027, "epoch": 6144} {"train_loss": -27.539844512939453, "global_step": 510028, "epoch": 6144} {"train_loss": -27.511157989501953, "global_step": 510029, "epoch": 6144} {"train_loss": -26.869110107421875, "global_step": 510030, "epoch": 6144} {"train_loss": -26.5864200592041, "global_step": 510031, "epoch": 6144} {"train_loss": -27.186756134033203, "global_step": 510032, "epoch": 6144} {"train_loss": -27.374053955078125, "global_step": 510033, "epoch": 6144} {"train_loss": -27.296307621232, "global_step": 510034, "epoch": 6144, "val_loss": 6608160.5} {"train_loss": -27.137983322143555, "global_step": 510035, "epoch": 6145} {"train_loss": -26.371923446655273, "global_step": 510036, "epoch": 6145} {"train_loss": -26.979536056518555, "global_step": 510037, "epoch": 6145} {"train_loss": -27.215314865112305, "global_step": 510038, "epoch": 6145} {"train_loss": -26.750614166259766, "global_step": 510039, "epoch": 6145} {"train_loss": -27.25750732421875, "global_step": 510040, "epoch": 6145} {"train_loss": -27.00739860534668, "global_step": 510041, "epoch": 6145} {"train_loss": -26.978229522705078, "global_step": 510042, "epoch": 6145} {"train_loss": -27.072040557861328, "global_step": 510043, "epoch": 6145} {"train_loss": -27.220722198486328, "global_step": 510044, "epoch": 6145} {"train_loss": -26.953052520751953, "global_step": 510045, "epoch": 6145} {"train_loss": -26.720630645751953, "global_step": 510046, "epoch": 6145} {"train_loss": -27.265851974487305, "global_step": 510047, "epoch": 6145} {"train_loss": -27.155431747436523, "global_step": 510048, "epoch": 6145} {"train_loss": -27.3245906829834, "global_step": 510049, "epoch": 6145} {"train_loss": -27.017379760742188, "global_step": 510050, "epoch": 6145} {"train_loss": -27.283222198486328, "global_step": 510051, "epoch": 6145} {"train_loss": -27.26166343688965, "global_step": 510052, "epoch": 6145} {"train_loss": -27.178543090820312, "global_step": 510053, "epoch": 6145} {"train_loss": -27.19471549987793, "global_step": 510054, "epoch": 6145} {"train_loss": -27.17046546936035, "global_step": 510055, "epoch": 6145} {"train_loss": -27.086252212524414, "global_step": 510056, "epoch": 6145} {"train_loss": -28.0118465423584, "global_step": 510057, "epoch": 6145} {"train_loss": -26.909210205078125, "global_step": 510058, "epoch": 6145} {"train_loss": -27.466108322143555, "global_step": 510059, "epoch": 6145} {"train_loss": -27.28802490234375, "global_step": 510060, "epoch": 6145} {"train_loss": -27.412649154663086, "global_step": 510061, "epoch": 6145} {"train_loss": -27.36678123474121, "global_step": 510062, "epoch": 6145} {"train_loss": -27.481460571289062, "global_step": 510063, "epoch": 6145} {"train_loss": -27.437244415283203, "global_step": 510064, "epoch": 6145} {"train_loss": -27.3018798828125, "global_step": 510065, "epoch": 6145} {"train_loss": -27.026147842407227, "global_step": 510066, "epoch": 6145} {"train_loss": -27.605972290039062, "global_step": 510067, "epoch": 6145} {"train_loss": -27.38062858581543, "global_step": 510068, "epoch": 6145} {"train_loss": -27.550573348999023, "global_step": 510069, "epoch": 6145} {"train_loss": -27.514612197875977, "global_step": 510070, "epoch": 6145} {"train_loss": -27.27277183532715, "global_step": 510071, "epoch": 6145} {"train_loss": -27.493967056274414, "global_step": 510072, "epoch": 6145} {"train_loss": -27.65931510925293, "global_step": 510073, "epoch": 6145} {"train_loss": -27.668598175048828, "global_step": 510074, "epoch": 6145} {"train_loss": -27.632246017456055, "global_step": 510075, "epoch": 6145} {"train_loss": -27.723907470703125, "global_step": 510076, "epoch": 6145} {"train_loss": -27.72298240661621, "global_step": 510077, "epoch": 6145} {"train_loss": -27.72953224182129, "global_step": 510078, "epoch": 6145} {"train_loss": -27.335468292236328, "global_step": 510079, "epoch": 6145} {"train_loss": -27.82600212097168, "global_step": 510080, "epoch": 6145} {"train_loss": -27.083911895751953, "global_step": 510081, "epoch": 6145} {"train_loss": -27.805866241455078, "global_step": 510082, "epoch": 6145} {"train_loss": -27.66971206665039, "global_step": 510083, "epoch": 6145} {"train_loss": -27.43731689453125, "global_step": 510084, "epoch": 6145} {"train_loss": -27.633075714111328, "global_step": 510085, "epoch": 6145} {"train_loss": -27.636438369750977, "global_step": 510086, "epoch": 6145} {"train_loss": -27.598800659179688, "global_step": 510087, "epoch": 6145} {"train_loss": -27.760107040405273, "global_step": 510088, "epoch": 6145} {"train_loss": -27.689716339111328, "global_step": 510089, "epoch": 6145} {"train_loss": -27.890186309814453, "global_step": 510090, "epoch": 6145} {"train_loss": -27.890073776245117, "global_step": 510091, "epoch": 6145} {"train_loss": -27.973651885986328, "global_step": 510092, "epoch": 6145} {"train_loss": -27.772052764892578, "global_step": 510093, "epoch": 6145} {"train_loss": -27.4178524017334, "global_step": 510094, "epoch": 6145} {"train_loss": -27.681488037109375, "global_step": 510095, "epoch": 6145} {"train_loss": -27.084491729736328, "global_step": 510096, "epoch": 6145} {"train_loss": -27.285703659057617, "global_step": 510097, "epoch": 6145} {"train_loss": -27.51202964782715, "global_step": 510098, "epoch": 6145} {"train_loss": -27.740631103515625, "global_step": 510099, "epoch": 6145} {"train_loss": -27.458118438720703, "global_step": 510100, "epoch": 6145} {"train_loss": -27.033918380737305, "global_step": 510101, "epoch": 6145} {"train_loss": -27.041519165039062, "global_step": 510102, "epoch": 6145} {"train_loss": -27.1868839263916, "global_step": 510103, "epoch": 6145} {"train_loss": -27.262434005737305, "global_step": 510104, "epoch": 6145} {"train_loss": -27.600976943969727, "global_step": 510105, "epoch": 6145} {"train_loss": -27.34199333190918, "global_step": 510106, "epoch": 6145} {"train_loss": -27.2965145111084, "global_step": 510107, "epoch": 6145} {"train_loss": -27.557538986206055, "global_step": 510108, "epoch": 6145} {"train_loss": -27.41145896911621, "global_step": 510109, "epoch": 6145} {"train_loss": -27.625579833984375, "global_step": 510110, "epoch": 6145} {"train_loss": -27.32740592956543, "global_step": 510111, "epoch": 6145} {"train_loss": -27.94691276550293, "global_step": 510112, "epoch": 6145} {"train_loss": -27.222803115844727, "global_step": 510113, "epoch": 6145} {"train_loss": -27.60755729675293, "global_step": 510114, "epoch": 6145} {"train_loss": -27.216400146484375, "global_step": 510115, "epoch": 6145} {"train_loss": -27.39011001586914, "global_step": 510116, "epoch": 6145} {"train_loss": -27.39368110105216, "global_step": 510117, "epoch": 6145, "val_loss": 6540330.5} {"train_loss": -26.30073356628418, "global_step": 510118, "epoch": 6146} {"train_loss": -27.26447105407715, "global_step": 510119, "epoch": 6146} {"train_loss": -26.65748405456543, "global_step": 510120, "epoch": 6146} {"train_loss": -26.834033966064453, "global_step": 510121, "epoch": 6146} {"train_loss": -26.98402214050293, "global_step": 510122, "epoch": 6146} {"train_loss": -26.059396743774414, "global_step": 510123, "epoch": 6146} {"train_loss": -26.963613510131836, "global_step": 510124, "epoch": 6146} {"train_loss": -26.588315963745117, "global_step": 510125, "epoch": 6146} {"train_loss": -26.98956871032715, "global_step": 510126, "epoch": 6146} {"train_loss": -26.525787353515625, "global_step": 510127, "epoch": 6146} {"train_loss": -26.870197296142578, "global_step": 510128, "epoch": 6146} {"train_loss": -26.6556339263916, "global_step": 510129, "epoch": 6146} {"train_loss": -27.399885177612305, "global_step": 510130, "epoch": 6146} {"train_loss": -27.052265167236328, "global_step": 510131, "epoch": 6146} {"train_loss": -27.099668502807617, "global_step": 510132, "epoch": 6146} {"train_loss": -27.037195205688477, "global_step": 510133, "epoch": 6146} {"train_loss": -26.927814483642578, "global_step": 510134, "epoch": 6146} {"train_loss": -27.297504425048828, "global_step": 510135, "epoch": 6146} {"train_loss": -27.281055450439453, "global_step": 510136, "epoch": 6146} {"train_loss": -27.44585609436035, "global_step": 510137, "epoch": 6146} {"train_loss": -27.464155197143555, "global_step": 510138, "epoch": 6146} {"train_loss": -27.31415367126465, "global_step": 510139, "epoch": 6146} {"train_loss": -27.370725631713867, "global_step": 510140, "epoch": 6146} {"train_loss": -27.07378578186035, "global_step": 510141, "epoch": 6146} {"train_loss": -27.204626083374023, "global_step": 510142, "epoch": 6146} {"train_loss": -27.643659591674805, "global_step": 510143, "epoch": 6146} {"train_loss": -26.852096557617188, "global_step": 510144, "epoch": 6146} {"train_loss": -27.243127822875977, "global_step": 510145, "epoch": 6146} {"train_loss": -27.507349014282227, "global_step": 510146, "epoch": 6146} {"train_loss": -27.13753318786621, "global_step": 510147, "epoch": 6146} {"train_loss": -27.1395263671875, "global_step": 510148, "epoch": 6146} {"train_loss": -27.281925201416016, "global_step": 510149, "epoch": 6146} {"train_loss": -27.059213638305664, "global_step": 510150, "epoch": 6146} {"train_loss": -26.972036361694336, "global_step": 510151, "epoch": 6146} {"train_loss": -27.46649169921875, "global_step": 510152, "epoch": 6146} {"train_loss": -27.426870346069336, "global_step": 510153, "epoch": 6146} {"train_loss": -27.234821319580078, "global_step": 510154, "epoch": 6146} {"train_loss": -27.299640655517578, "global_step": 510155, "epoch": 6146} {"train_loss": -27.314960479736328, "global_step": 510156, "epoch": 6146} {"train_loss": -27.430395126342773, "global_step": 510157, "epoch": 6146} {"train_loss": -27.530288696289062, "global_step": 510158, "epoch": 6146} {"train_loss": -27.054357528686523, "global_step": 510159, "epoch": 6146} {"train_loss": -27.136072158813477, "global_step": 510160, "epoch": 6146} {"train_loss": -27.053735733032227, "global_step": 510161, "epoch": 6146} {"train_loss": -27.514429092407227, "global_step": 510162, "epoch": 6146} {"train_loss": -27.24006462097168, "global_step": 510163, "epoch": 6146} {"train_loss": -27.8216495513916, "global_step": 510164, "epoch": 6146} {"train_loss": -27.597440719604492, "global_step": 510165, "epoch": 6146} {"train_loss": -27.857263565063477, "global_step": 510166, "epoch": 6146} {"train_loss": -27.309467315673828, "global_step": 510167, "epoch": 6146} {"train_loss": -27.29657554626465, "global_step": 510168, "epoch": 6146} {"train_loss": -27.2097110748291, "global_step": 510169, "epoch": 6146} {"train_loss": -27.37749671936035, "global_step": 510170, "epoch": 6146} {"train_loss": -27.522232055664062, "global_step": 510171, "epoch": 6146} {"train_loss": -27.1949520111084, "global_step": 510172, "epoch": 6146} {"train_loss": -27.882043838500977, "global_step": 510173, "epoch": 6146} {"train_loss": -27.68813133239746, "global_step": 510174, "epoch": 6146} {"train_loss": -27.810205459594727, "global_step": 510175, "epoch": 6146} {"train_loss": -27.39922523498535, "global_step": 510176, "epoch": 6146} {"train_loss": -27.509719848632812, "global_step": 510177, "epoch": 6146} {"train_loss": -27.293746948242188, "global_step": 510178, "epoch": 6146} {"train_loss": -27.270111083984375, "global_step": 510179, "epoch": 6146} {"train_loss": -27.645374298095703, "global_step": 510180, "epoch": 6146} {"train_loss": -27.450504302978516, "global_step": 510181, "epoch": 6146} {"train_loss": -27.21051025390625, "global_step": 510182, "epoch": 6146} {"train_loss": -27.568679809570312, "global_step": 510183, "epoch": 6146} {"train_loss": -27.3831844329834, "global_step": 510184, "epoch": 6146} {"train_loss": -27.491317749023438, "global_step": 510185, "epoch": 6146} {"train_loss": -27.5296630859375, "global_step": 510186, "epoch": 6146} {"train_loss": -27.5377254486084, "global_step": 510187, "epoch": 6146} {"train_loss": -27.837177276611328, "global_step": 510188, "epoch": 6146} {"train_loss": -27.404264450073242, "global_step": 510189, "epoch": 6146} {"train_loss": -27.97408103942871, "global_step": 510190, "epoch": 6146} {"train_loss": -27.63189125061035, "global_step": 510191, "epoch": 6146} {"train_loss": -27.28382682800293, "global_step": 510192, "epoch": 6146} {"train_loss": -27.403451919555664, "global_step": 510193, "epoch": 6146} {"train_loss": -27.594770431518555, "global_step": 510194, "epoch": 6146} {"train_loss": -27.790250778198242, "global_step": 510195, "epoch": 6146} {"train_loss": -27.597278594970703, "global_step": 510196, "epoch": 6146} {"train_loss": -27.686948776245117, "global_step": 510197, "epoch": 6146} {"train_loss": -27.59626579284668, "global_step": 510198, "epoch": 6146} {"train_loss": -27.41377067565918, "global_step": 510199, "epoch": 6146} {"train_loss": -27.297593059309992, "global_step": 510200, "epoch": 6146, "val_loss": 6551665.0} {"train_loss": -27.164752960205078, "global_step": 510201, "epoch": 6147} {"train_loss": -26.534133911132812, "global_step": 510202, "epoch": 6147} {"train_loss": -26.799884796142578, "global_step": 510203, "epoch": 6147} {"train_loss": -26.890600204467773, "global_step": 510204, "epoch": 6147} {"train_loss": -26.55494499206543, "global_step": 510205, "epoch": 6147} {"train_loss": -27.224857330322266, "global_step": 510206, "epoch": 6147} {"train_loss": -27.268896102905273, "global_step": 510207, "epoch": 6147} {"train_loss": -26.815271377563477, "global_step": 510208, "epoch": 6147} {"train_loss": -27.282623291015625, "global_step": 510209, "epoch": 6147} {"train_loss": -27.03547477722168, "global_step": 510210, "epoch": 6147} {"train_loss": -27.18656349182129, "global_step": 510211, "epoch": 6147} {"train_loss": -27.083511352539062, "global_step": 510212, "epoch": 6147} {"train_loss": -27.308029174804688, "global_step": 510213, "epoch": 6147} {"train_loss": -27.304458618164062, "global_step": 510214, "epoch": 6147} {"train_loss": -27.43466567993164, "global_step": 510215, "epoch": 6147} {"train_loss": -27.469135284423828, "global_step": 510216, "epoch": 6147} {"train_loss": -27.06524658203125, "global_step": 510217, "epoch": 6147} {"train_loss": -27.81751823425293, "global_step": 510218, "epoch": 6147} {"train_loss": -27.434228897094727, "global_step": 510219, "epoch": 6147} {"train_loss": -27.346220016479492, "global_step": 510220, "epoch": 6147} {"train_loss": -27.26009178161621, "global_step": 510221, "epoch": 6147} {"train_loss": -27.449371337890625, "global_step": 510222, "epoch": 6147} {"train_loss": -27.205148696899414, "global_step": 510223, "epoch": 6147} {"train_loss": -27.578571319580078, "global_step": 510224, "epoch": 6147} {"train_loss": -27.389453887939453, "global_step": 510225, "epoch": 6147} {"train_loss": -27.260900497436523, "global_step": 510226, "epoch": 6147} {"train_loss": -27.590017318725586, "global_step": 510227, "epoch": 6147} {"train_loss": -27.608572006225586, "global_step": 510228, "epoch": 6147} {"train_loss": -27.477447509765625, "global_step": 510229, "epoch": 6147} {"train_loss": -27.6429500579834, "global_step": 510230, "epoch": 6147} {"train_loss": -27.88639259338379, "global_step": 510231, "epoch": 6147} {"train_loss": -27.713321685791016, "global_step": 510232, "epoch": 6147} {"train_loss": -27.50359535217285, "global_step": 510233, "epoch": 6147} {"train_loss": -27.104400634765625, "global_step": 510234, "epoch": 6147} {"train_loss": -27.20774269104004, "global_step": 510235, "epoch": 6147} {"train_loss": -27.01954460144043, "global_step": 510236, "epoch": 6147} {"train_loss": -27.386789321899414, "global_step": 510237, "epoch": 6147} {"train_loss": -27.10502052307129, "global_step": 510238, "epoch": 6147} {"train_loss": -27.427087783813477, "global_step": 510239, "epoch": 6147} {"train_loss": -27.543121337890625, "global_step": 510240, "epoch": 6147} {"train_loss": -27.541128158569336, "global_step": 510241, "epoch": 6147} {"train_loss": -27.049039840698242, "global_step": 510242, "epoch": 6147} {"train_loss": -27.152023315429688, "global_step": 510243, "epoch": 6147} {"train_loss": -27.47254753112793, "global_step": 510244, "epoch": 6147} {"train_loss": -27.763168334960938, "global_step": 510245, "epoch": 6147} {"train_loss": -26.92888832092285, "global_step": 510246, "epoch": 6147} {"train_loss": -27.088409423828125, "global_step": 510247, "epoch": 6147} {"train_loss": -27.30061149597168, "global_step": 510248, "epoch": 6147} {"train_loss": -26.93916130065918, "global_step": 510249, "epoch": 6147} {"train_loss": -27.296289443969727, "global_step": 510250, "epoch": 6147} {"train_loss": -27.094247817993164, "global_step": 510251, "epoch": 6147} {"train_loss": -26.986846923828125, "global_step": 510252, "epoch": 6147} {"train_loss": -27.721485137939453, "global_step": 510253, "epoch": 6147} {"train_loss": -27.63128089904785, "global_step": 510254, "epoch": 6147} {"train_loss": -27.513294219970703, "global_step": 510255, "epoch": 6147} {"train_loss": -27.617023468017578, "global_step": 510256, "epoch": 6147} {"train_loss": -27.11869239807129, "global_step": 510257, "epoch": 6147} {"train_loss": -27.503177642822266, "global_step": 510258, "epoch": 6147} {"train_loss": -27.719257354736328, "global_step": 510259, "epoch": 6147} {"train_loss": -27.80940818786621, "global_step": 510260, "epoch": 6147} {"train_loss": -27.216711044311523, "global_step": 510261, "epoch": 6147} {"train_loss": -27.15569496154785, "global_step": 510262, "epoch": 6147} {"train_loss": -27.227243423461914, "global_step": 510263, "epoch": 6147} {"train_loss": -26.822813034057617, "global_step": 510264, "epoch": 6147} {"train_loss": -27.451007843017578, "global_step": 510265, "epoch": 6147} {"train_loss": -27.367048263549805, "global_step": 510266, "epoch": 6147} {"train_loss": -27.494770050048828, "global_step": 510267, "epoch": 6147} {"train_loss": -27.185941696166992, "global_step": 510268, "epoch": 6147} {"train_loss": -27.68295669555664, "global_step": 510269, "epoch": 6147} {"train_loss": -27.28775405883789, "global_step": 510270, "epoch": 6147} {"train_loss": -27.7503662109375, "global_step": 510271, "epoch": 6147} {"train_loss": -27.643802642822266, "global_step": 510272, "epoch": 6147} {"train_loss": -27.425886154174805, "global_step": 510273, "epoch": 6147} {"train_loss": -27.485082626342773, "global_step": 510274, "epoch": 6147} {"train_loss": -27.582834243774414, "global_step": 510275, "epoch": 6147} {"train_loss": -27.421234130859375, "global_step": 510276, "epoch": 6147} {"train_loss": -27.540719985961914, "global_step": 510277, "epoch": 6147} {"train_loss": -27.62635612487793, "global_step": 510278, "epoch": 6147} {"train_loss": -27.781330108642578, "global_step": 510279, "epoch": 6147} {"train_loss": -27.107080459594727, "global_step": 510280, "epoch": 6147} {"train_loss": -27.513031005859375, "global_step": 510281, "epoch": 6147} {"train_loss": -27.678607940673828, "global_step": 510282, "epoch": 6147} {"train_loss": -27.35520576568971, "global_step": 510283, "epoch": 6147, "val_loss": 6610222.0} {"train_loss": -25.7945613861084, "global_step": 510284, "epoch": 6148} {"train_loss": -23.591400146484375, "global_step": 510285, "epoch": 6148} {"train_loss": -22.926151275634766, "global_step": 510286, "epoch": 6148} {"train_loss": -26.370492935180664, "global_step": 510287, "epoch": 6148} {"train_loss": -25.165267944335938, "global_step": 510288, "epoch": 6148} {"train_loss": -23.781702041625977, "global_step": 510289, "epoch": 6148} {"train_loss": -26.201019287109375, "global_step": 510290, "epoch": 6148} {"train_loss": -24.293716430664062, "global_step": 510291, "epoch": 6148} {"train_loss": -25.490482330322266, "global_step": 510292, "epoch": 6148} {"train_loss": -25.597349166870117, "global_step": 510293, "epoch": 6148} {"train_loss": -25.577190399169922, "global_step": 510294, "epoch": 6148} {"train_loss": -26.346267700195312, "global_step": 510295, "epoch": 6148} {"train_loss": -26.002796173095703, "global_step": 510296, "epoch": 6148} {"train_loss": -25.8687686920166, "global_step": 510297, "epoch": 6148} {"train_loss": -26.382322311401367, "global_step": 510298, "epoch": 6148} {"train_loss": -25.8583984375, "global_step": 510299, "epoch": 6148} {"train_loss": -26.688140869140625, "global_step": 510300, "epoch": 6148} {"train_loss": -26.05539321899414, "global_step": 510301, "epoch": 6148} {"train_loss": -26.69010353088379, "global_step": 510302, "epoch": 6148} {"train_loss": -26.241729736328125, "global_step": 510303, "epoch": 6148} {"train_loss": -26.493865966796875, "global_step": 510304, "epoch": 6148} {"train_loss": -26.40304946899414, "global_step": 510305, "epoch": 6148} {"train_loss": -26.792236328125, "global_step": 510306, "epoch": 6148} {"train_loss": -26.467975616455078, "global_step": 510307, "epoch": 6148} {"train_loss": -26.637115478515625, "global_step": 510308, "epoch": 6148} {"train_loss": -26.610403060913086, "global_step": 510309, "epoch": 6148} {"train_loss": -26.49848747253418, "global_step": 510310, "epoch": 6148} {"train_loss": -26.592493057250977, "global_step": 510311, "epoch": 6148} {"train_loss": -26.72600746154785, "global_step": 510312, "epoch": 6148} {"train_loss": -26.939716339111328, "global_step": 510313, "epoch": 6148} {"train_loss": -26.610525131225586, "global_step": 510314, "epoch": 6148} {"train_loss": -26.327991485595703, "global_step": 510315, "epoch": 6148} {"train_loss": -26.6170597076416, "global_step": 510316, "epoch": 6148} {"train_loss": -26.753467559814453, "global_step": 510317, "epoch": 6148} {"train_loss": -26.762502670288086, "global_step": 510318, "epoch": 6148} {"train_loss": -26.805530548095703, "global_step": 510319, "epoch": 6148} {"train_loss": -27.08990478515625, "global_step": 510320, "epoch": 6148} {"train_loss": -26.959203720092773, "global_step": 510321, "epoch": 6148} {"train_loss": -26.932327270507812, "global_step": 510322, "epoch": 6148} {"train_loss": -26.759357452392578, "global_step": 510323, "epoch": 6148} {"train_loss": -26.894134521484375, "global_step": 510324, "epoch": 6148} {"train_loss": -26.9459171295166, "global_step": 510325, "epoch": 6148} {"train_loss": -27.018085479736328, "global_step": 510326, "epoch": 6148} {"train_loss": -27.31591796875, "global_step": 510327, "epoch": 6148} {"train_loss": -27.129779815673828, "global_step": 510328, "epoch": 6148} {"train_loss": -27.51717185974121, "global_step": 510329, "epoch": 6148} {"train_loss": -27.250059127807617, "global_step": 510330, "epoch": 6148} {"train_loss": -27.491703033447266, "global_step": 510331, "epoch": 6148} {"train_loss": -27.563703536987305, "global_step": 510332, "epoch": 6148} {"train_loss": -27.149112701416016, "global_step": 510333, "epoch": 6148} {"train_loss": -27.125146865844727, "global_step": 510334, "epoch": 6148} {"train_loss": -27.195852279663086, "global_step": 510335, "epoch": 6148} {"train_loss": -27.427106857299805, "global_step": 510336, "epoch": 6148} {"train_loss": -27.4000186920166, "global_step": 510337, "epoch": 6148} {"train_loss": -27.441877365112305, "global_step": 510338, "epoch": 6148} {"train_loss": -27.380401611328125, "global_step": 510339, "epoch": 6148} {"train_loss": -27.781457901000977, "global_step": 510340, "epoch": 6148} {"train_loss": -27.446134567260742, "global_step": 510341, "epoch": 6148} {"train_loss": -27.724212646484375, "global_step": 510342, "epoch": 6148} {"train_loss": -27.52723503112793, "global_step": 510343, "epoch": 6148} {"train_loss": -27.585973739624023, "global_step": 510344, "epoch": 6148} {"train_loss": -27.279966354370117, "global_step": 510345, "epoch": 6148} {"train_loss": -27.5098819732666, "global_step": 510346, "epoch": 6148} {"train_loss": -27.663970947265625, "global_step": 510347, "epoch": 6148} {"train_loss": -27.439001083374023, "global_step": 510348, "epoch": 6148} {"train_loss": -27.684223175048828, "global_step": 510349, "epoch": 6148} {"train_loss": -27.924667358398438, "global_step": 510350, "epoch": 6148} {"train_loss": -27.567657470703125, "global_step": 510351, "epoch": 6148} {"train_loss": -27.86136817932129, "global_step": 510352, "epoch": 6148} {"train_loss": -27.367431640625, "global_step": 510353, "epoch": 6148} {"train_loss": -27.683263778686523, "global_step": 510354, "epoch": 6148} {"train_loss": -26.9854793548584, "global_step": 510355, "epoch": 6148} {"train_loss": -27.25825309753418, "global_step": 510356, "epoch": 6148} {"train_loss": -27.969282150268555, "global_step": 510357, "epoch": 6148} {"train_loss": -27.58717155456543, "global_step": 510358, "epoch": 6148} {"train_loss": -27.263233184814453, "global_step": 510359, "epoch": 6148} {"train_loss": -26.884057998657227, "global_step": 510360, "epoch": 6148} {"train_loss": -27.94779396057129, "global_step": 510361, "epoch": 6148} {"train_loss": -27.56024742126465, "global_step": 510362, "epoch": 6148} {"train_loss": -27.461088180541992, "global_step": 510363, "epoch": 6148} {"train_loss": -28.024932861328125, "global_step": 510364, "epoch": 6148} {"train_loss": -27.87506675720215, "global_step": 510365, "epoch": 6148} {"train_loss": -26.811714654945465, "global_step": 510366, "epoch": 6148, "val_loss": 6670475.0} {"train_loss": -27.58754539489746, "global_step": 510367, "epoch": 6149} {"train_loss": -27.22993278503418, "global_step": 510368, "epoch": 6149} {"train_loss": -27.2200927734375, "global_step": 510369, "epoch": 6149} {"train_loss": -27.22258949279785, "global_step": 510370, "epoch": 6149} {"train_loss": -27.23420524597168, "global_step": 510371, "epoch": 6149} {"train_loss": -27.34425163269043, "global_step": 510372, "epoch": 6149} {"train_loss": -27.364755630493164, "global_step": 510373, "epoch": 6149} {"train_loss": -26.96657371520996, "global_step": 510374, "epoch": 6149} {"train_loss": -27.138198852539062, "global_step": 510375, "epoch": 6149} {"train_loss": -26.787506103515625, "global_step": 510376, "epoch": 6149} {"train_loss": -27.587051391601562, "global_step": 510377, "epoch": 6149} {"train_loss": -26.794782638549805, "global_step": 510378, "epoch": 6149} {"train_loss": -27.18519401550293, "global_step": 510379, "epoch": 6149} {"train_loss": -27.74534034729004, "global_step": 510380, "epoch": 6149} {"train_loss": -27.24517822265625, "global_step": 510381, "epoch": 6149} {"train_loss": -27.588809967041016, "global_step": 510382, "epoch": 6149} {"train_loss": -27.208393096923828, "global_step": 510383, "epoch": 6149} {"train_loss": -27.485279083251953, "global_step": 510384, "epoch": 6149} {"train_loss": -27.486352920532227, "global_step": 510385, "epoch": 6149} {"train_loss": -27.27546501159668, "global_step": 510386, "epoch": 6149} {"train_loss": -27.230859756469727, "global_step": 510387, "epoch": 6149} {"train_loss": -27.713415145874023, "global_step": 510388, "epoch": 6149} {"train_loss": -27.212635040283203, "global_step": 510389, "epoch": 6149} {"train_loss": -27.172311782836914, "global_step": 510390, "epoch": 6149} {"train_loss": -27.256982803344727, "global_step": 510391, "epoch": 6149} {"train_loss": -27.4642391204834, "global_step": 510392, "epoch": 6149} {"train_loss": -27.42266273498535, "global_step": 510393, "epoch": 6149} {"train_loss": -27.681135177612305, "global_step": 510394, "epoch": 6149} {"train_loss": -27.063077926635742, "global_step": 510395, "epoch": 6149} {"train_loss": -27.547876358032227, "global_step": 510396, "epoch": 6149} {"train_loss": -27.64813232421875, "global_step": 510397, "epoch": 6149} {"train_loss": -27.69487953186035, "global_step": 510398, "epoch": 6149} {"train_loss": -27.3562068939209, "global_step": 510399, "epoch": 6149} {"train_loss": -27.41315269470215, "global_step": 510400, "epoch": 6149} {"train_loss": -27.37748146057129, "global_step": 510401, "epoch": 6149} {"train_loss": -27.612207412719727, "global_step": 510402, "epoch": 6149} {"train_loss": -27.361188888549805, "global_step": 510403, "epoch": 6149} {"train_loss": -27.422388076782227, "global_step": 510404, "epoch": 6149} {"train_loss": -27.601287841796875, "global_step": 510405, "epoch": 6149} {"train_loss": -27.728918075561523, "global_step": 510406, "epoch": 6149} {"train_loss": -27.566247940063477, "global_step": 510407, "epoch": 6149} {"train_loss": -27.605634689331055, "global_step": 510408, "epoch": 6149} {"train_loss": -27.226110458374023, "global_step": 510409, "epoch": 6149} {"train_loss": -27.21728515625, "global_step": 510410, "epoch": 6149} {"train_loss": -27.394672393798828, "global_step": 510411, "epoch": 6149} {"train_loss": -27.509632110595703, "global_step": 510412, "epoch": 6149} {"train_loss": -26.847412109375, "global_step": 510413, "epoch": 6149} {"train_loss": -27.37579345703125, "global_step": 510414, "epoch": 6149} {"train_loss": -27.29253578186035, "global_step": 510415, "epoch": 6149} {"train_loss": -27.334110260009766, "global_step": 510416, "epoch": 6149} {"train_loss": -27.748594284057617, "global_step": 510417, "epoch": 6149} {"train_loss": -27.4084529876709, "global_step": 510418, "epoch": 6149} {"train_loss": -27.62925148010254, "global_step": 510419, "epoch": 6149} {"train_loss": -27.632043838500977, "global_step": 510420, "epoch": 6149} {"train_loss": -27.42976951599121, "global_step": 510421, "epoch": 6149} {"train_loss": -27.321502685546875, "global_step": 510422, "epoch": 6149} {"train_loss": -27.313146591186523, "global_step": 510423, "epoch": 6149} {"train_loss": -27.559064865112305, "global_step": 510424, "epoch": 6149} {"train_loss": -27.6558895111084, "global_step": 510425, "epoch": 6149} {"train_loss": -27.438337326049805, "global_step": 510426, "epoch": 6149} {"train_loss": -27.318029403686523, "global_step": 510427, "epoch": 6149} {"train_loss": -27.424787521362305, "global_step": 510428, "epoch": 6149} {"train_loss": -27.3674373626709, "global_step": 510429, "epoch": 6149} {"train_loss": -27.571802139282227, "global_step": 510430, "epoch": 6149} {"train_loss": -27.44679069519043, "global_step": 510431, "epoch": 6149} {"train_loss": -27.905811309814453, "global_step": 510432, "epoch": 6149} {"train_loss": -27.3004093170166, "global_step": 510433, "epoch": 6149} {"train_loss": -27.78180503845215, "global_step": 510434, "epoch": 6149} {"train_loss": -27.837234497070312, "global_step": 510435, "epoch": 6149} {"train_loss": -27.663854598999023, "global_step": 510436, "epoch": 6149} {"train_loss": -27.52838134765625, "global_step": 510437, "epoch": 6149} {"train_loss": -27.604028701782227, "global_step": 510438, "epoch": 6149} {"train_loss": -27.306013107299805, "global_step": 510439, "epoch": 6149} {"train_loss": -27.668848037719727, "global_step": 510440, "epoch": 6149} {"train_loss": -27.70570182800293, "global_step": 510441, "epoch": 6149} {"train_loss": -27.775989532470703, "global_step": 510442, "epoch": 6149} {"train_loss": -27.53778648376465, "global_step": 510443, "epoch": 6149} {"train_loss": -27.603933334350586, "global_step": 510444, "epoch": 6149} {"train_loss": -27.7335262298584, "global_step": 510445, "epoch": 6149} {"train_loss": -27.76791763305664, "global_step": 510446, "epoch": 6149} {"train_loss": -27.511632919311523, "global_step": 510447, "epoch": 6149} {"train_loss": -27.5721378326416, "global_step": 510448, "epoch": 6149} {"train_loss": -27.447878412453527, "global_step": 510449, "epoch": 6149, "val_loss": 6629759.0} {"train_loss": -25.700153350830078, "global_step": 510450, "epoch": 6150} {"train_loss": -25.417692184448242, "global_step": 510451, "epoch": 6150} {"train_loss": -25.670001983642578, "global_step": 510452, "epoch": 6150} {"train_loss": -25.35944938659668, "global_step": 510453, "epoch": 6150} {"train_loss": -25.9881591796875, "global_step": 510454, "epoch": 6150} {"train_loss": -24.894437789916992, "global_step": 510455, "epoch": 6150} {"train_loss": -26.858407974243164, "global_step": 510456, "epoch": 6150} {"train_loss": -25.793588638305664, "global_step": 510457, "epoch": 6150} {"train_loss": -26.009634017944336, "global_step": 510458, "epoch": 6150} {"train_loss": -26.74334716796875, "global_step": 510459, "epoch": 6150} {"train_loss": -26.289846420288086, "global_step": 510460, "epoch": 6150} {"train_loss": -26.346052169799805, "global_step": 510461, "epoch": 6150} {"train_loss": -26.20160484313965, "global_step": 510462, "epoch": 6150} {"train_loss": -26.738479614257812, "global_step": 510463, "epoch": 6150} {"train_loss": -26.5905818939209, "global_step": 510464, "epoch": 6150} {"train_loss": -26.76025390625, "global_step": 510465, "epoch": 6150} {"train_loss": -26.363916397094727, "global_step": 510466, "epoch": 6150} {"train_loss": -26.498920440673828, "global_step": 510467, "epoch": 6150} {"train_loss": -26.69083023071289, "global_step": 510468, "epoch": 6150} {"train_loss": -26.433515548706055, "global_step": 510469, "epoch": 6150} {"train_loss": -26.585920333862305, "global_step": 510470, "epoch": 6150} {"train_loss": -26.742136001586914, "global_step": 510471, "epoch": 6150} {"train_loss": -26.68402671813965, "global_step": 510472, "epoch": 6150} {"train_loss": -26.734378814697266, "global_step": 510473, "epoch": 6150} {"train_loss": -27.07423210144043, "global_step": 510474, "epoch": 6150} {"train_loss": -26.947843551635742, "global_step": 510475, "epoch": 6150} {"train_loss": -26.95058250427246, "global_step": 510476, "epoch": 6150} {"train_loss": -26.78975486755371, "global_step": 510477, "epoch": 6150} {"train_loss": -26.817916870117188, "global_step": 510478, "epoch": 6150} {"train_loss": -27.129531860351562, "global_step": 510479, "epoch": 6150} {"train_loss": -26.979034423828125, "global_step": 510480, "epoch": 6150} {"train_loss": -27.32257652282715, "global_step": 510481, "epoch": 6150} {"train_loss": -27.246826171875, "global_step": 510482, "epoch": 6150} {"train_loss": -27.056806564331055, "global_step": 510483, "epoch": 6150} {"train_loss": -26.7805118560791, "global_step": 510484, "epoch": 6150} {"train_loss": -27.178802490234375, "global_step": 510485, "epoch": 6150} {"train_loss": -27.51837730407715, "global_step": 510486, "epoch": 6150} {"train_loss": -27.362049102783203, "global_step": 510487, "epoch": 6150} {"train_loss": -27.155200958251953, "global_step": 510488, "epoch": 6150} {"train_loss": -27.33440589904785, "global_step": 510489, "epoch": 6150} {"train_loss": -27.405282974243164, "global_step": 510490, "epoch": 6150} {"train_loss": -27.482196807861328, "global_step": 510491, "epoch": 6150} {"train_loss": -27.468652725219727, "global_step": 510492, "epoch": 6150} {"train_loss": -27.2308292388916, "global_step": 510493, "epoch": 6150} {"train_loss": -27.473617553710938, "global_step": 510494, "epoch": 6150} {"train_loss": -27.72650718688965, "global_step": 510495, "epoch": 6150} {"train_loss": -27.352460861206055, "global_step": 510496, "epoch": 6150} {"train_loss": -27.222654342651367, "global_step": 510497, "epoch": 6150} {"train_loss": -27.538679122924805, "global_step": 510498, "epoch": 6150} {"train_loss": -27.66371726989746, "global_step": 510499, "epoch": 6150} {"train_loss": -27.339994430541992, "global_step": 510500, "epoch": 6150} {"train_loss": -27.407201766967773, "global_step": 510501, "epoch": 6150} {"train_loss": -27.879789352416992, "global_step": 510502, "epoch": 6150} {"train_loss": -27.453027725219727, "global_step": 510503, "epoch": 6150} {"train_loss": -27.679519653320312, "global_step": 510504, "epoch": 6150} {"train_loss": -27.578048706054688, "global_step": 510505, "epoch": 6150} {"train_loss": -27.48142433166504, "global_step": 510506, "epoch": 6150} {"train_loss": -27.597583770751953, "global_step": 510507, "epoch": 6150} {"train_loss": -27.554365158081055, "global_step": 510508, "epoch": 6150} {"train_loss": -27.421072006225586, "global_step": 510509, "epoch": 6150} {"train_loss": -27.572452545166016, "global_step": 510510, "epoch": 6150} {"train_loss": -27.884260177612305, "global_step": 510511, "epoch": 6150} {"train_loss": -27.572500228881836, "global_step": 510512, "epoch": 6150} {"train_loss": -27.595951080322266, "global_step": 510513, "epoch": 6150} {"train_loss": -27.383787155151367, "global_step": 510514, "epoch": 6150} {"train_loss": -27.42592430114746, "global_step": 510515, "epoch": 6150} {"train_loss": -27.887866973876953, "global_step": 510516, "epoch": 6150} {"train_loss": -27.835407257080078, "global_step": 510517, "epoch": 6150} {"train_loss": -27.1412296295166, "global_step": 510518, "epoch": 6150} {"train_loss": -27.614866256713867, "global_step": 510519, "epoch": 6150} {"train_loss": -27.368701934814453, "global_step": 510520, "epoch": 6150} {"train_loss": -27.519113540649414, "global_step": 510521, "epoch": 6150} {"train_loss": -27.732114791870117, "global_step": 510522, "epoch": 6150} {"train_loss": -27.980432510375977, "global_step": 510523, "epoch": 6150} {"train_loss": -27.760114669799805, "global_step": 510524, "epoch": 6150} {"train_loss": -27.503507614135742, "global_step": 510525, "epoch": 6150} {"train_loss": -27.810840606689453, "global_step": 510526, "epoch": 6150} {"train_loss": -27.573577880859375, "global_step": 510527, "epoch": 6150} {"train_loss": -27.27426528930664, "global_step": 510528, "epoch": 6150} {"train_loss": -27.712726593017578, "global_step": 510529, "epoch": 6150} {"train_loss": -27.714324951171875, "global_step": 510530, "epoch": 6150} {"train_loss": -27.636930465698242, "global_step": 510531, "epoch": 6150} {"train_loss": -27.083336336066925, "global_step": 510532, "epoch": 6150, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.8181818181818182, "val_loss": 6602755.5} {"train_loss": -27.04136085510254, "global_step": 510533, "epoch": 6151} {"train_loss": -26.834104537963867, "global_step": 510534, "epoch": 6151} {"train_loss": -27.1635684967041, "global_step": 510535, "epoch": 6151} {"train_loss": -26.83673667907715, "global_step": 510536, "epoch": 6151} {"train_loss": -27.216039657592773, "global_step": 510537, "epoch": 6151} {"train_loss": -27.173480987548828, "global_step": 510538, "epoch": 6151} {"train_loss": -26.68133544921875, "global_step": 510539, "epoch": 6151} {"train_loss": -26.96036720275879, "global_step": 510540, "epoch": 6151} {"train_loss": -26.637510299682617, "global_step": 510541, "epoch": 6151} {"train_loss": -27.161808013916016, "global_step": 510542, "epoch": 6151} {"train_loss": -26.55555534362793, "global_step": 510543, "epoch": 6151} {"train_loss": -26.6632080078125, "global_step": 510544, "epoch": 6151} {"train_loss": -26.708526611328125, "global_step": 510545, "epoch": 6151} {"train_loss": -26.71149253845215, "global_step": 510546, "epoch": 6151} {"train_loss": -27.139530181884766, "global_step": 510547, "epoch": 6151} {"train_loss": -27.18171501159668, "global_step": 510548, "epoch": 6151} {"train_loss": -26.93442153930664, "global_step": 510549, "epoch": 6151} {"train_loss": -26.8284912109375, "global_step": 510550, "epoch": 6151} {"train_loss": -26.823148727416992, "global_step": 510551, "epoch": 6151} {"train_loss": -27.31015968322754, "global_step": 510552, "epoch": 6151} {"train_loss": -27.176645278930664, "global_step": 510553, "epoch": 6151} {"train_loss": -27.431806564331055, "global_step": 510554, "epoch": 6151} {"train_loss": -27.125097274780273, "global_step": 510555, "epoch": 6151} {"train_loss": -27.031965255737305, "global_step": 510556, "epoch": 6151} {"train_loss": -27.120080947875977, "global_step": 510557, "epoch": 6151} {"train_loss": -27.226837158203125, "global_step": 510558, "epoch": 6151} {"train_loss": -27.287473678588867, "global_step": 510559, "epoch": 6151} {"train_loss": -27.322843551635742, "global_step": 510560, "epoch": 6151} {"train_loss": -27.280303955078125, "global_step": 510561, "epoch": 6151} {"train_loss": -27.430822372436523, "global_step": 510562, "epoch": 6151} {"train_loss": -27.214935302734375, "global_step": 510563, "epoch": 6151} {"train_loss": -27.43802833557129, "global_step": 510564, "epoch": 6151} {"train_loss": -27.32477378845215, "global_step": 510565, "epoch": 6151} {"train_loss": -27.47919273376465, "global_step": 510566, "epoch": 6151} {"train_loss": -27.410755157470703, "global_step": 510567, "epoch": 6151} {"train_loss": -27.5296688079834, "global_step": 510568, "epoch": 6151} {"train_loss": -27.422033309936523, "global_step": 510569, "epoch": 6151} {"train_loss": -27.714588165283203, "global_step": 510570, "epoch": 6151} {"train_loss": -27.43312644958496, "global_step": 510571, "epoch": 6151} {"train_loss": -27.330535888671875, "global_step": 510572, "epoch": 6151} {"train_loss": -27.598346710205078, "global_step": 510573, "epoch": 6151} {"train_loss": -27.367919921875, "global_step": 510574, "epoch": 6151} {"train_loss": -27.72553062438965, "global_step": 510575, "epoch": 6151} {"train_loss": -27.385862350463867, "global_step": 510576, "epoch": 6151} {"train_loss": -27.713537216186523, "global_step": 510577, "epoch": 6151} {"train_loss": -27.827611923217773, "global_step": 510578, "epoch": 6151} {"train_loss": -27.581995010375977, "global_step": 510579, "epoch": 6151} {"train_loss": -27.646991729736328, "global_step": 510580, "epoch": 6151} {"train_loss": -27.572351455688477, "global_step": 510581, "epoch": 6151} {"train_loss": -27.607084274291992, "global_step": 510582, "epoch": 6151} {"train_loss": -27.568525314331055, "global_step": 510583, "epoch": 6151} {"train_loss": -27.791013717651367, "global_step": 510584, "epoch": 6151} {"train_loss": -27.416767120361328, "global_step": 510585, "epoch": 6151} {"train_loss": -27.721311569213867, "global_step": 510586, "epoch": 6151} {"train_loss": -27.25105094909668, "global_step": 510587, "epoch": 6151} {"train_loss": -27.3734073638916, "global_step": 510588, "epoch": 6151} {"train_loss": -27.37420654296875, "global_step": 510589, "epoch": 6151} {"train_loss": -27.483957290649414, "global_step": 510590, "epoch": 6151} {"train_loss": -27.462472915649414, "global_step": 510591, "epoch": 6151} {"train_loss": -27.4970645904541, "global_step": 510592, "epoch": 6151} {"train_loss": -27.461780548095703, "global_step": 510593, "epoch": 6151} {"train_loss": -27.430551528930664, "global_step": 510594, "epoch": 6151} {"train_loss": -27.2650203704834, "global_step": 510595, "epoch": 6151} {"train_loss": -27.33942222595215, "global_step": 510596, "epoch": 6151} {"train_loss": -27.369848251342773, "global_step": 510597, "epoch": 6151} {"train_loss": -27.330236434936523, "global_step": 510598, "epoch": 6151} {"train_loss": -27.078475952148438, "global_step": 510599, "epoch": 6151} {"train_loss": -27.540082931518555, "global_step": 510600, "epoch": 6151} {"train_loss": -27.03712272644043, "global_step": 510601, "epoch": 6151} {"train_loss": -27.26276206970215, "global_step": 510602, "epoch": 6151} {"train_loss": -27.721771240234375, "global_step": 510603, "epoch": 6151} {"train_loss": -27.378087997436523, "global_step": 510604, "epoch": 6151} {"train_loss": -27.3519287109375, "global_step": 510605, "epoch": 6151} {"train_loss": -27.24005699157715, "global_step": 510606, "epoch": 6151} {"train_loss": -27.589405059814453, "global_step": 510607, "epoch": 6151} {"train_loss": -27.163654327392578, "global_step": 510608, "epoch": 6151} {"train_loss": -27.2633056640625, "global_step": 510609, "epoch": 6151} {"train_loss": -27.552886962890625, "global_step": 510610, "epoch": 6151} {"train_loss": -27.76582145690918, "global_step": 510611, "epoch": 6151} {"train_loss": -27.3261661529541, "global_step": 510612, "epoch": 6151} {"train_loss": -27.3900146484375, "global_step": 510613, "epoch": 6151} {"train_loss": -27.470319747924805, "global_step": 510614, "epoch": 6151} {"train_loss": -27.311690502856152, "global_step": 510615, "epoch": 6151, "val_loss": 6491792.5} {"train_loss": -26.822479248046875, "global_step": 510616, "epoch": 6152} {"train_loss": -27.121997833251953, "global_step": 510617, "epoch": 6152} {"train_loss": -27.142826080322266, "global_step": 510618, "epoch": 6152} {"train_loss": -27.095197677612305, "global_step": 510619, "epoch": 6152} {"train_loss": -27.081907272338867, "global_step": 510620, "epoch": 6152} {"train_loss": -27.053205490112305, "global_step": 510621, "epoch": 6152} {"train_loss": -27.062137603759766, "global_step": 510622, "epoch": 6152} {"train_loss": -27.214197158813477, "global_step": 510623, "epoch": 6152} {"train_loss": -26.80476951599121, "global_step": 510624, "epoch": 6152} {"train_loss": -27.0112247467041, "global_step": 510625, "epoch": 6152} {"train_loss": -26.7273006439209, "global_step": 510626, "epoch": 6152} {"train_loss": -26.82810401916504, "global_step": 510627, "epoch": 6152} {"train_loss": -27.554590225219727, "global_step": 510628, "epoch": 6152} {"train_loss": -26.90467643737793, "global_step": 510629, "epoch": 6152} {"train_loss": -26.974628448486328, "global_step": 510630, "epoch": 6152} {"train_loss": -26.87839126586914, "global_step": 510631, "epoch": 6152} {"train_loss": -27.243255615234375, "global_step": 510632, "epoch": 6152} {"train_loss": -27.47222328186035, "global_step": 510633, "epoch": 6152} {"train_loss": -27.05617332458496, "global_step": 510634, "epoch": 6152} {"train_loss": -27.286304473876953, "global_step": 510635, "epoch": 6152} {"train_loss": -27.3909912109375, "global_step": 510636, "epoch": 6152} {"train_loss": -26.690643310546875, "global_step": 510637, "epoch": 6152} {"train_loss": -27.83563804626465, "global_step": 510638, "epoch": 6152} {"train_loss": -27.3801326751709, "global_step": 510639, "epoch": 6152} {"train_loss": -27.31159019470215, "global_step": 510640, "epoch": 6152} {"train_loss": -27.537158966064453, "global_step": 510641, "epoch": 6152} {"train_loss": -27.243005752563477, "global_step": 510642, "epoch": 6152} {"train_loss": -27.399093627929688, "global_step": 510643, "epoch": 6152} {"train_loss": -27.317487716674805, "global_step": 510644, "epoch": 6152} {"train_loss": -27.382043838500977, "global_step": 510645, "epoch": 6152} {"train_loss": -27.100452423095703, "global_step": 510646, "epoch": 6152} {"train_loss": -27.345144271850586, "global_step": 510647, "epoch": 6152} {"train_loss": -27.729084014892578, "global_step": 510648, "epoch": 6152} {"train_loss": -27.465408325195312, "global_step": 510649, "epoch": 6152} {"train_loss": -27.321420669555664, "global_step": 510650, "epoch": 6152} {"train_loss": -27.77650260925293, "global_step": 510651, "epoch": 6152} {"train_loss": -27.426401138305664, "global_step": 510652, "epoch": 6152} {"train_loss": -27.5335636138916, "global_step": 510653, "epoch": 6152} {"train_loss": -27.590381622314453, "global_step": 510654, "epoch": 6152} {"train_loss": -27.514509201049805, "global_step": 510655, "epoch": 6152} {"train_loss": -27.70461082458496, "global_step": 510656, "epoch": 6152} {"train_loss": -27.65056800842285, "global_step": 510657, "epoch": 6152} {"train_loss": -27.51384925842285, "global_step": 510658, "epoch": 6152} {"train_loss": -27.644062042236328, "global_step": 510659, "epoch": 6152} {"train_loss": -27.557031631469727, "global_step": 510660, "epoch": 6152} {"train_loss": -27.5878849029541, "global_step": 510661, "epoch": 6152} {"train_loss": -27.535221099853516, "global_step": 510662, "epoch": 6152} {"train_loss": -27.722888946533203, "global_step": 510663, "epoch": 6152} {"train_loss": -27.34248161315918, "global_step": 510664, "epoch": 6152} {"train_loss": -27.456573486328125, "global_step": 510665, "epoch": 6152} {"train_loss": -27.61273765563965, "global_step": 510666, "epoch": 6152} {"train_loss": -27.62525749206543, "global_step": 510667, "epoch": 6152} {"train_loss": -27.571409225463867, "global_step": 510668, "epoch": 6152} {"train_loss": -27.367706298828125, "global_step": 510669, "epoch": 6152} {"train_loss": -27.25629997253418, "global_step": 510670, "epoch": 6152} {"train_loss": -27.671064376831055, "global_step": 510671, "epoch": 6152} {"train_loss": -27.698644638061523, "global_step": 510672, "epoch": 6152} {"train_loss": -27.302576065063477, "global_step": 510673, "epoch": 6152} {"train_loss": -26.504480361938477, "global_step": 510674, "epoch": 6152} {"train_loss": -26.813400268554688, "global_step": 510675, "epoch": 6152} {"train_loss": -26.9066104888916, "global_step": 510676, "epoch": 6152} {"train_loss": -27.39871597290039, "global_step": 510677, "epoch": 6152} {"train_loss": -27.2917537689209, "global_step": 510678, "epoch": 6152} {"train_loss": -27.02589988708496, "global_step": 510679, "epoch": 6152} {"train_loss": -27.508398056030273, "global_step": 510680, "epoch": 6152} {"train_loss": -27.368085861206055, "global_step": 510681, "epoch": 6152} {"train_loss": -27.344085693359375, "global_step": 510682, "epoch": 6152} {"train_loss": -27.335325241088867, "global_step": 510683, "epoch": 6152} {"train_loss": -27.644901275634766, "global_step": 510684, "epoch": 6152} {"train_loss": -27.2559871673584, "global_step": 510685, "epoch": 6152} {"train_loss": -27.55694007873535, "global_step": 510686, "epoch": 6152} {"train_loss": -27.6680850982666, "global_step": 510687, "epoch": 6152} {"train_loss": -27.573017120361328, "global_step": 510688, "epoch": 6152} {"train_loss": -27.597644805908203, "global_step": 510689, "epoch": 6152} {"train_loss": -27.66765785217285, "global_step": 510690, "epoch": 6152} {"train_loss": -27.747045516967773, "global_step": 510691, "epoch": 6152} {"train_loss": -27.526081085205078, "global_step": 510692, "epoch": 6152} {"train_loss": -27.124526977539062, "global_step": 510693, "epoch": 6152} {"train_loss": -27.518238067626953, "global_step": 510694, "epoch": 6152} {"train_loss": -27.744794845581055, "global_step": 510695, "epoch": 6152} {"train_loss": -27.422901153564453, "global_step": 510696, "epoch": 6152} {"train_loss": -27.58930778503418, "global_step": 510697, "epoch": 6152} {"train_loss": -27.33776621071689, "global_step": 510698, "epoch": 6152, "val_loss": 6643924.5} {"train_loss": -25.931676864624023, "global_step": 510699, "epoch": 6153} {"train_loss": -25.487680435180664, "global_step": 510700, "epoch": 6153} {"train_loss": -26.652082443237305, "global_step": 510701, "epoch": 6153} {"train_loss": -27.077911376953125, "global_step": 510702, "epoch": 6153} {"train_loss": -26.301305770874023, "global_step": 510703, "epoch": 6153} {"train_loss": -26.851364135742188, "global_step": 510704, "epoch": 6153} {"train_loss": -27.212594985961914, "global_step": 510705, "epoch": 6153} {"train_loss": -27.2947940826416, "global_step": 510706, "epoch": 6153} {"train_loss": -27.12066650390625, "global_step": 510707, "epoch": 6153} {"train_loss": -27.151962280273438, "global_step": 510708, "epoch": 6153} {"train_loss": -27.263458251953125, "global_step": 510709, "epoch": 6153} {"train_loss": -27.2586727142334, "global_step": 510710, "epoch": 6153} {"train_loss": -27.1049861907959, "global_step": 510711, "epoch": 6153} {"train_loss": -27.138763427734375, "global_step": 510712, "epoch": 6153} {"train_loss": -27.2995548248291, "global_step": 510713, "epoch": 6153} {"train_loss": -27.1122989654541, "global_step": 510714, "epoch": 6153} {"train_loss": -27.646881103515625, "global_step": 510715, "epoch": 6153} {"train_loss": -27.258609771728516, "global_step": 510716, "epoch": 6153} {"train_loss": -27.245214462280273, "global_step": 510717, "epoch": 6153} {"train_loss": -27.54778480529785, "global_step": 510718, "epoch": 6153} {"train_loss": -26.8563289642334, "global_step": 510719, "epoch": 6153} {"train_loss": -27.319726943969727, "global_step": 510720, "epoch": 6153} {"train_loss": -27.2565975189209, "global_step": 510721, "epoch": 6153} {"train_loss": -27.012439727783203, "global_step": 510722, "epoch": 6153} {"train_loss": -27.294157028198242, "global_step": 510723, "epoch": 6153} {"train_loss": -27.05535888671875, "global_step": 510724, "epoch": 6153} {"train_loss": -26.937345504760742, "global_step": 510725, "epoch": 6153} {"train_loss": -27.646142959594727, "global_step": 510726, "epoch": 6153} {"train_loss": -27.63007926940918, "global_step": 510727, "epoch": 6153} {"train_loss": -27.165380477905273, "global_step": 510728, "epoch": 6153} {"train_loss": -27.486337661743164, "global_step": 510729, "epoch": 6153} {"train_loss": -27.660400390625, "global_step": 510730, "epoch": 6153} {"train_loss": -27.483667373657227, "global_step": 510731, "epoch": 6153} {"train_loss": -27.795095443725586, "global_step": 510732, "epoch": 6153} {"train_loss": -27.630781173706055, "global_step": 510733, "epoch": 6153} {"train_loss": -27.499103546142578, "global_step": 510734, "epoch": 6153} {"train_loss": -27.106847763061523, "global_step": 510735, "epoch": 6153} {"train_loss": -27.657751083374023, "global_step": 510736, "epoch": 6153} {"train_loss": -27.79766273498535, "global_step": 510737, "epoch": 6153} {"train_loss": -27.470224380493164, "global_step": 510738, "epoch": 6153} {"train_loss": -27.432239532470703, "global_step": 510739, "epoch": 6153} {"train_loss": -27.255582809448242, "global_step": 510740, "epoch": 6153} {"train_loss": -27.285581588745117, "global_step": 510741, "epoch": 6153} {"train_loss": -27.351318359375, "global_step": 510742, "epoch": 6153} {"train_loss": -27.504226684570312, "global_step": 510743, "epoch": 6153} {"train_loss": -27.474140167236328, "global_step": 510744, "epoch": 6153} {"train_loss": -27.324567794799805, "global_step": 510745, "epoch": 6153} {"train_loss": -27.6492977142334, "global_step": 510746, "epoch": 6153} {"train_loss": -27.395437240600586, "global_step": 510747, "epoch": 6153} {"train_loss": -27.158777236938477, "global_step": 510748, "epoch": 6153} {"train_loss": -27.936431884765625, "global_step": 510749, "epoch": 6153} {"train_loss": -27.243635177612305, "global_step": 510750, "epoch": 6153} {"train_loss": -27.46619987487793, "global_step": 510751, "epoch": 6153} {"train_loss": -27.399158477783203, "global_step": 510752, "epoch": 6153} {"train_loss": -27.232711791992188, "global_step": 510753, "epoch": 6153} {"train_loss": -27.125757217407227, "global_step": 510754, "epoch": 6153} {"train_loss": -27.198415756225586, "global_step": 510755, "epoch": 6153} {"train_loss": -27.24860191345215, "global_step": 510756, "epoch": 6153} {"train_loss": -27.643310546875, "global_step": 510757, "epoch": 6153} {"train_loss": -27.70844841003418, "global_step": 510758, "epoch": 6153} {"train_loss": -27.181867599487305, "global_step": 510759, "epoch": 6153} {"train_loss": -27.225879669189453, "global_step": 510760, "epoch": 6153} {"train_loss": -27.53216552734375, "global_step": 510761, "epoch": 6153} {"train_loss": -27.534067153930664, "global_step": 510762, "epoch": 6153} {"train_loss": -27.516645431518555, "global_step": 510763, "epoch": 6153} {"train_loss": -27.708032608032227, "global_step": 510764, "epoch": 6153} {"train_loss": -27.59246253967285, "global_step": 510765, "epoch": 6153} {"train_loss": -27.8333683013916, "global_step": 510766, "epoch": 6153} {"train_loss": -27.586654663085938, "global_step": 510767, "epoch": 6153} {"train_loss": -27.288238525390625, "global_step": 510768, "epoch": 6153} {"train_loss": -27.525165557861328, "global_step": 510769, "epoch": 6153} {"train_loss": -27.5913028717041, "global_step": 510770, "epoch": 6153} {"train_loss": -27.7758731842041, "global_step": 510771, "epoch": 6153} {"train_loss": -27.65204429626465, "global_step": 510772, "epoch": 6153} {"train_loss": -27.62176513671875, "global_step": 510773, "epoch": 6153} {"train_loss": -27.268329620361328, "global_step": 510774, "epoch": 6153} {"train_loss": -27.680566787719727, "global_step": 510775, "epoch": 6153} {"train_loss": -27.612207412719727, "global_step": 510776, "epoch": 6153} {"train_loss": -27.51629066467285, "global_step": 510777, "epoch": 6153} {"train_loss": -27.609338760375977, "global_step": 510778, "epoch": 6153} {"train_loss": -27.660879135131836, "global_step": 510779, "epoch": 6153} {"train_loss": -27.655908584594727, "global_step": 510780, "epoch": 6153} {"train_loss": -27.32954661817436, "global_step": 510781, "epoch": 6153, "val_loss": 6587662.0} {"train_loss": -27.099170684814453, "global_step": 510782, "epoch": 6154} {"train_loss": -26.513341903686523, "global_step": 510783, "epoch": 6154} {"train_loss": -27.232059478759766, "global_step": 510784, "epoch": 6154} {"train_loss": -27.51206398010254, "global_step": 510785, "epoch": 6154} {"train_loss": -26.777109146118164, "global_step": 510786, "epoch": 6154} {"train_loss": -27.096960067749023, "global_step": 510787, "epoch": 6154} {"train_loss": -27.1702880859375, "global_step": 510788, "epoch": 6154} {"train_loss": -27.163854598999023, "global_step": 510789, "epoch": 6154} {"train_loss": -26.794702529907227, "global_step": 510790, "epoch": 6154} {"train_loss": -27.33673667907715, "global_step": 510791, "epoch": 6154} {"train_loss": -27.26348304748535, "global_step": 510792, "epoch": 6154} {"train_loss": -26.770587921142578, "global_step": 510793, "epoch": 6154} {"train_loss": -27.242231369018555, "global_step": 510794, "epoch": 6154} {"train_loss": -27.026779174804688, "global_step": 510795, "epoch": 6154} {"train_loss": -27.28028678894043, "global_step": 510796, "epoch": 6154} {"train_loss": -27.227224349975586, "global_step": 510797, "epoch": 6154} {"train_loss": -27.24629020690918, "global_step": 510798, "epoch": 6154} {"train_loss": -27.090967178344727, "global_step": 510799, "epoch": 6154} {"train_loss": -27.31049156188965, "global_step": 510800, "epoch": 6154} {"train_loss": -27.12407875061035, "global_step": 510801, "epoch": 6154} {"train_loss": -27.66153907775879, "global_step": 510802, "epoch": 6154} {"train_loss": -27.559965133666992, "global_step": 510803, "epoch": 6154} {"train_loss": -27.569738388061523, "global_step": 510804, "epoch": 6154} {"train_loss": -27.35904312133789, "global_step": 510805, "epoch": 6154} {"train_loss": -27.35822105407715, "global_step": 510806, "epoch": 6154} {"train_loss": -27.486902236938477, "global_step": 510807, "epoch": 6154} {"train_loss": -27.388513565063477, "global_step": 510808, "epoch": 6154} {"train_loss": -27.560277938842773, "global_step": 510809, "epoch": 6154} {"train_loss": -27.756397247314453, "global_step": 510810, "epoch": 6154} {"train_loss": -27.3804874420166, "global_step": 510811, "epoch": 6154} {"train_loss": -27.478363037109375, "global_step": 510812, "epoch": 6154} {"train_loss": -27.50616455078125, "global_step": 510813, "epoch": 6154} {"train_loss": -27.372528076171875, "global_step": 510814, "epoch": 6154} {"train_loss": -27.4439697265625, "global_step": 510815, "epoch": 6154} {"train_loss": -27.705204010009766, "global_step": 510816, "epoch": 6154} {"train_loss": -27.280988693237305, "global_step": 510817, "epoch": 6154} {"train_loss": -27.45557975769043, "global_step": 510818, "epoch": 6154} {"train_loss": -27.560651779174805, "global_step": 510819, "epoch": 6154} {"train_loss": -27.497114181518555, "global_step": 510820, "epoch": 6154} {"train_loss": -27.37275505065918, "global_step": 510821, "epoch": 6154} {"train_loss": -27.72248649597168, "global_step": 510822, "epoch": 6154} {"train_loss": -27.577606201171875, "global_step": 510823, "epoch": 6154} {"train_loss": -27.538043975830078, "global_step": 510824, "epoch": 6154} {"train_loss": -27.740711212158203, "global_step": 510825, "epoch": 6154} {"train_loss": -27.816761016845703, "global_step": 510826, "epoch": 6154} {"train_loss": -27.627349853515625, "global_step": 510827, "epoch": 6154} {"train_loss": -27.488513946533203, "global_step": 510828, "epoch": 6154} {"train_loss": -27.788000106811523, "global_step": 510829, "epoch": 6154} {"train_loss": -27.804706573486328, "global_step": 510830, "epoch": 6154} {"train_loss": -27.767614364624023, "global_step": 510831, "epoch": 6154} {"train_loss": -27.601226806640625, "global_step": 510832, "epoch": 6154} {"train_loss": -28.074323654174805, "global_step": 510833, "epoch": 6154} {"train_loss": -27.73847007751465, "global_step": 510834, "epoch": 6154} {"train_loss": -27.09814453125, "global_step": 510835, "epoch": 6154} {"train_loss": -27.8405818939209, "global_step": 510836, "epoch": 6154} {"train_loss": -27.89478874206543, "global_step": 510837, "epoch": 6154} {"train_loss": -27.646621704101562, "global_step": 510838, "epoch": 6154} {"train_loss": -27.62118911743164, "global_step": 510839, "epoch": 6154} {"train_loss": -26.9693660736084, "global_step": 510840, "epoch": 6154} {"train_loss": -26.321258544921875, "global_step": 510841, "epoch": 6154} {"train_loss": -26.62961196899414, "global_step": 510842, "epoch": 6154} {"train_loss": -25.827756881713867, "global_step": 510843, "epoch": 6154} {"train_loss": -25.57746696472168, "global_step": 510844, "epoch": 6154} {"train_loss": -27.119794845581055, "global_step": 510845, "epoch": 6154} {"train_loss": -26.40645408630371, "global_step": 510846, "epoch": 6154} {"train_loss": -25.64266014099121, "global_step": 510847, "epoch": 6154} {"train_loss": -27.33844566345215, "global_step": 510848, "epoch": 6154} {"train_loss": -26.921966552734375, "global_step": 510849, "epoch": 6154} {"train_loss": -27.16375160217285, "global_step": 510850, "epoch": 6154} {"train_loss": -26.454137802124023, "global_step": 510851, "epoch": 6154} {"train_loss": -26.612646102905273, "global_step": 510852, "epoch": 6154} {"train_loss": -26.835590362548828, "global_step": 510853, "epoch": 6154} {"train_loss": -26.851165771484375, "global_step": 510854, "epoch": 6154} {"train_loss": -26.5926513671875, "global_step": 510855, "epoch": 6154} {"train_loss": -26.740137100219727, "global_step": 510856, "epoch": 6154} {"train_loss": -26.90138053894043, "global_step": 510857, "epoch": 6154} {"train_loss": -26.749258041381836, "global_step": 510858, "epoch": 6154} {"train_loss": -27.161951065063477, "global_step": 510859, "epoch": 6154} {"train_loss": -27.192291259765625, "global_step": 510860, "epoch": 6154} {"train_loss": -27.16096305847168, "global_step": 510861, "epoch": 6154} {"train_loss": -26.687713623046875, "global_step": 510862, "epoch": 6154} {"train_loss": -27.411746978759766, "global_step": 510863, "epoch": 6154} {"train_loss": -27.21508812042604, "global_step": 510864, "epoch": 6154, "val_loss": 6593779.0} {"train_loss": -26.453031539916992, "global_step": 510865, "epoch": 6155} {"train_loss": -27.105060577392578, "global_step": 510866, "epoch": 6155} {"train_loss": -26.228607177734375, "global_step": 510867, "epoch": 6155} {"train_loss": -26.940855026245117, "global_step": 510868, "epoch": 6155} {"train_loss": -26.83652114868164, "global_step": 510869, "epoch": 6155} {"train_loss": -27.22902488708496, "global_step": 510870, "epoch": 6155} {"train_loss": -26.520709991455078, "global_step": 510871, "epoch": 6155} {"train_loss": -27.0218505859375, "global_step": 510872, "epoch": 6155} {"train_loss": -26.68642234802246, "global_step": 510873, "epoch": 6155} {"train_loss": -27.106159210205078, "global_step": 510874, "epoch": 6155} {"train_loss": -27.146764755249023, "global_step": 510875, "epoch": 6155} {"train_loss": -26.998945236206055, "global_step": 510876, "epoch": 6155} {"train_loss": -27.110767364501953, "global_step": 510877, "epoch": 6155} {"train_loss": -27.41910171508789, "global_step": 510878, "epoch": 6155} {"train_loss": -26.880908966064453, "global_step": 510879, "epoch": 6155} {"train_loss": -27.48995018005371, "global_step": 510880, "epoch": 6155} {"train_loss": -27.126419067382812, "global_step": 510881, "epoch": 6155} {"train_loss": -26.952167510986328, "global_step": 510882, "epoch": 6155} {"train_loss": -27.283063888549805, "global_step": 510883, "epoch": 6155} {"train_loss": -27.182798385620117, "global_step": 510884, "epoch": 6155} {"train_loss": -27.409460067749023, "global_step": 510885, "epoch": 6155} {"train_loss": -27.3071231842041, "global_step": 510886, "epoch": 6155} {"train_loss": -27.280292510986328, "global_step": 510887, "epoch": 6155} {"train_loss": -27.199609756469727, "global_step": 510888, "epoch": 6155} {"train_loss": -27.677249908447266, "global_step": 510889, "epoch": 6155} {"train_loss": -27.012104034423828, "global_step": 510890, "epoch": 6155} {"train_loss": -27.401777267456055, "global_step": 510891, "epoch": 6155} {"train_loss": -27.8947811126709, "global_step": 510892, "epoch": 6155} {"train_loss": -27.919879913330078, "global_step": 510893, "epoch": 6155} {"train_loss": -27.44854164123535, "global_step": 510894, "epoch": 6155} {"train_loss": -27.75830078125, "global_step": 510895, "epoch": 6155} {"train_loss": -27.29984474182129, "global_step": 510896, "epoch": 6155} {"train_loss": -27.353515625, "global_step": 510897, "epoch": 6155} {"train_loss": -27.656301498413086, "global_step": 510898, "epoch": 6155} {"train_loss": -27.603656768798828, "global_step": 510899, "epoch": 6155} {"train_loss": -27.838598251342773, "global_step": 510900, "epoch": 6155} {"train_loss": -27.6013240814209, "global_step": 510901, "epoch": 6155} {"train_loss": -27.70414161682129, "global_step": 510902, "epoch": 6155} {"train_loss": -27.424482345581055, "global_step": 510903, "epoch": 6155} {"train_loss": -27.556859970092773, "global_step": 510904, "epoch": 6155} {"train_loss": -27.89912223815918, "global_step": 510905, "epoch": 6155} {"train_loss": -27.64845848083496, "global_step": 510906, "epoch": 6155} {"train_loss": -27.795324325561523, "global_step": 510907, "epoch": 6155} {"train_loss": -27.916080474853516, "global_step": 510908, "epoch": 6155} {"train_loss": -27.665822982788086, "global_step": 510909, "epoch": 6155} {"train_loss": -28.14626121520996, "global_step": 510910, "epoch": 6155} {"train_loss": -27.941593170166016, "global_step": 510911, "epoch": 6155} {"train_loss": -27.9967041015625, "global_step": 510912, "epoch": 6155} {"train_loss": -27.60135269165039, "global_step": 510913, "epoch": 6155} {"train_loss": -27.675390243530273, "global_step": 510914, "epoch": 6155} {"train_loss": -28.061681747436523, "global_step": 510915, "epoch": 6155} {"train_loss": -27.355621337890625, "global_step": 510916, "epoch": 6155} {"train_loss": -27.603857040405273, "global_step": 510917, "epoch": 6155} {"train_loss": -27.302839279174805, "global_step": 510918, "epoch": 6155} {"train_loss": -27.163196563720703, "global_step": 510919, "epoch": 6155} {"train_loss": -26.810571670532227, "global_step": 510920, "epoch": 6155} {"train_loss": -26.75446128845215, "global_step": 510921, "epoch": 6155} {"train_loss": -26.47800636291504, "global_step": 510922, "epoch": 6155} {"train_loss": -27.181705474853516, "global_step": 510923, "epoch": 6155} {"train_loss": -27.7280330657959, "global_step": 510924, "epoch": 6155} {"train_loss": -27.104528427124023, "global_step": 510925, "epoch": 6155} {"train_loss": -27.270475387573242, "global_step": 510926, "epoch": 6155} {"train_loss": -27.132654190063477, "global_step": 510927, "epoch": 6155} {"train_loss": -27.532827377319336, "global_step": 510928, "epoch": 6155} {"train_loss": -26.969924926757812, "global_step": 510929, "epoch": 6155} {"train_loss": -27.1651554107666, "global_step": 510930, "epoch": 6155} {"train_loss": -26.766141891479492, "global_step": 510931, "epoch": 6155} {"train_loss": -27.498291015625, "global_step": 510932, "epoch": 6155} {"train_loss": -27.0689697265625, "global_step": 510933, "epoch": 6155} {"train_loss": -27.38019371032715, "global_step": 510934, "epoch": 6155} {"train_loss": -27.237951278686523, "global_step": 510935, "epoch": 6155} {"train_loss": -27.594404220581055, "global_step": 510936, "epoch": 6155} {"train_loss": -27.288101196289062, "global_step": 510937, "epoch": 6155} {"train_loss": -27.285940170288086, "global_step": 510938, "epoch": 6155} {"train_loss": -27.232086181640625, "global_step": 510939, "epoch": 6155} {"train_loss": -26.9893856048584, "global_step": 510940, "epoch": 6155} {"train_loss": -27.2453556060791, "global_step": 510941, "epoch": 6155} {"train_loss": -27.41530418395996, "global_step": 510942, "epoch": 6155} {"train_loss": -27.411779403686523, "global_step": 510943, "epoch": 6155} {"train_loss": -27.745351791381836, "global_step": 510944, "epoch": 6155} {"train_loss": -27.222105026245117, "global_step": 510945, "epoch": 6155} {"train_loss": -27.570241928100586, "global_step": 510946, "epoch": 6155} {"train_loss": -27.34721942120288, "global_step": 510947, "epoch": 6155, "val_loss": 6541643.0} {"train_loss": -27.3214168548584, "global_step": 510948, "epoch": 6156} {"train_loss": -26.420995712280273, "global_step": 510949, "epoch": 6156} {"train_loss": -26.785242080688477, "global_step": 510950, "epoch": 6156} {"train_loss": -27.028018951416016, "global_step": 510951, "epoch": 6156} {"train_loss": -26.642242431640625, "global_step": 510952, "epoch": 6156} {"train_loss": -26.6767520904541, "global_step": 510953, "epoch": 6156} {"train_loss": -27.257736206054688, "global_step": 510954, "epoch": 6156} {"train_loss": -26.87906265258789, "global_step": 510955, "epoch": 6156} {"train_loss": -26.710779190063477, "global_step": 510956, "epoch": 6156} {"train_loss": -27.3033447265625, "global_step": 510957, "epoch": 6156} {"train_loss": -26.888996124267578, "global_step": 510958, "epoch": 6156} {"train_loss": -26.689050674438477, "global_step": 510959, "epoch": 6156} {"train_loss": -27.391870498657227, "global_step": 510960, "epoch": 6156} {"train_loss": -26.826156616210938, "global_step": 510961, "epoch": 6156} {"train_loss": -27.239770889282227, "global_step": 510962, "epoch": 6156} {"train_loss": -27.126211166381836, "global_step": 510963, "epoch": 6156} {"train_loss": -27.091894149780273, "global_step": 510964, "epoch": 6156} {"train_loss": -27.175222396850586, "global_step": 510965, "epoch": 6156} {"train_loss": -27.311115264892578, "global_step": 510966, "epoch": 6156} {"train_loss": -27.022485733032227, "global_step": 510967, "epoch": 6156} {"train_loss": -27.780282974243164, "global_step": 510968, "epoch": 6156} {"train_loss": -27.454071044921875, "global_step": 510969, "epoch": 6156} {"train_loss": -27.440656661987305, "global_step": 510970, "epoch": 6156} {"train_loss": -27.555591583251953, "global_step": 510971, "epoch": 6156} {"train_loss": -27.383264541625977, "global_step": 510972, "epoch": 6156} {"train_loss": -27.495325088500977, "global_step": 510973, "epoch": 6156} {"train_loss": -27.391910552978516, "global_step": 510974, "epoch": 6156} {"train_loss": -27.268218994140625, "global_step": 510975, "epoch": 6156} {"train_loss": -27.3935546875, "global_step": 510976, "epoch": 6156} {"train_loss": -27.667266845703125, "global_step": 510977, "epoch": 6156} {"train_loss": -27.140501022338867, "global_step": 510978, "epoch": 6156} {"train_loss": -27.625385284423828, "global_step": 510979, "epoch": 6156} {"train_loss": -27.622650146484375, "global_step": 510980, "epoch": 6156} {"train_loss": -28.042739868164062, "global_step": 510981, "epoch": 6156} {"train_loss": -27.286590576171875, "global_step": 510982, "epoch": 6156} {"train_loss": -27.620166778564453, "global_step": 510983, "epoch": 6156} {"train_loss": -27.25803565979004, "global_step": 510984, "epoch": 6156} {"train_loss": -27.774188995361328, "global_step": 510985, "epoch": 6156} {"train_loss": -26.957489013671875, "global_step": 510986, "epoch": 6156} {"train_loss": -27.316022872924805, "global_step": 510987, "epoch": 6156} {"train_loss": -27.524322509765625, "global_step": 510988, "epoch": 6156} {"train_loss": -27.53841209411621, "global_step": 510989, "epoch": 6156} {"train_loss": -27.358938217163086, "global_step": 510990, "epoch": 6156} {"train_loss": -27.57082176208496, "global_step": 510991, "epoch": 6156} {"train_loss": -27.671262741088867, "global_step": 510992, "epoch": 6156} {"train_loss": -27.542844772338867, "global_step": 510993, "epoch": 6156} {"train_loss": -26.77848243713379, "global_step": 510994, "epoch": 6156} {"train_loss": -27.4403018951416, "global_step": 510995, "epoch": 6156} {"train_loss": -27.1982479095459, "global_step": 510996, "epoch": 6156} {"train_loss": -27.404321670532227, "global_step": 510997, "epoch": 6156} {"train_loss": -27.79756736755371, "global_step": 510998, "epoch": 6156} {"train_loss": -27.67681312561035, "global_step": 510999, "epoch": 6156} {"train_loss": -27.74416160583496, "global_step": 511000, "epoch": 6156} {"train_loss": -27.579313278198242, "global_step": 511001, "epoch": 6156} {"train_loss": -27.615026473999023, "global_step": 511002, "epoch": 6156} {"train_loss": -27.6966609954834, "global_step": 511003, "epoch": 6156} {"train_loss": -27.547407150268555, "global_step": 511004, "epoch": 6156} {"train_loss": -27.46600341796875, "global_step": 511005, "epoch": 6156} {"train_loss": -27.76569938659668, "global_step": 511006, "epoch": 6156} {"train_loss": -27.90128517150879, "global_step": 511007, "epoch": 6156} {"train_loss": -28.095062255859375, "global_step": 511008, "epoch": 6156} {"train_loss": -27.811691284179688, "global_step": 511009, "epoch": 6156} {"train_loss": -27.494653701782227, "global_step": 511010, "epoch": 6156} {"train_loss": -27.439254760742188, "global_step": 511011, "epoch": 6156} {"train_loss": -27.794696807861328, "global_step": 511012, "epoch": 6156} {"train_loss": -27.804401397705078, "global_step": 511013, "epoch": 6156} {"train_loss": -27.835474014282227, "global_step": 511014, "epoch": 6156} {"train_loss": -27.310871124267578, "global_step": 511015, "epoch": 6156} {"train_loss": -27.303491592407227, "global_step": 511016, "epoch": 6156} {"train_loss": -27.660236358642578, "global_step": 511017, "epoch": 6156} {"train_loss": -27.50448989868164, "global_step": 511018, "epoch": 6156} {"train_loss": -27.661060333251953, "global_step": 511019, "epoch": 6156} {"train_loss": -27.664880752563477, "global_step": 511020, "epoch": 6156} {"train_loss": -27.862741470336914, "global_step": 511021, "epoch": 6156} {"train_loss": -27.574975967407227, "global_step": 511022, "epoch": 6156} {"train_loss": -26.950468063354492, "global_step": 511023, "epoch": 6156} {"train_loss": -26.838306427001953, "global_step": 511024, "epoch": 6156} {"train_loss": -26.505456924438477, "global_step": 511025, "epoch": 6156} {"train_loss": -27.881017684936523, "global_step": 511026, "epoch": 6156} {"train_loss": -27.440261840820312, "global_step": 511027, "epoch": 6156} {"train_loss": -26.517606735229492, "global_step": 511028, "epoch": 6156} {"train_loss": -27.328536987304688, "global_step": 511029, "epoch": 6156} {"train_loss": -27.364607592663134, "global_step": 511030, "epoch": 6156, "val_loss": 6600222.0} {"train_loss": -25.3785457611084, "global_step": 511031, "epoch": 6157} {"train_loss": -25.927453994750977, "global_step": 511032, "epoch": 6157} {"train_loss": -26.96929931640625, "global_step": 511033, "epoch": 6157} {"train_loss": -26.214223861694336, "global_step": 511034, "epoch": 6157} {"train_loss": -26.6507511138916, "global_step": 511035, "epoch": 6157} {"train_loss": -26.369857788085938, "global_step": 511036, "epoch": 6157} {"train_loss": -27.020862579345703, "global_step": 511037, "epoch": 6157} {"train_loss": -26.47859764099121, "global_step": 511038, "epoch": 6157} {"train_loss": -27.11603355407715, "global_step": 511039, "epoch": 6157} {"train_loss": -26.676532745361328, "global_step": 511040, "epoch": 6157} {"train_loss": -27.028156280517578, "global_step": 511041, "epoch": 6157} {"train_loss": -26.905445098876953, "global_step": 511042, "epoch": 6157} {"train_loss": -27.105337142944336, "global_step": 511043, "epoch": 6157} {"train_loss": -26.726415634155273, "global_step": 511044, "epoch": 6157} {"train_loss": -26.777908325195312, "global_step": 511045, "epoch": 6157} {"train_loss": -26.899005889892578, "global_step": 511046, "epoch": 6157} {"train_loss": -26.9395694732666, "global_step": 511047, "epoch": 6157} {"train_loss": -27.31955909729004, "global_step": 511048, "epoch": 6157} {"train_loss": -27.067575454711914, "global_step": 511049, "epoch": 6157} {"train_loss": -27.04768180847168, "global_step": 511050, "epoch": 6157} {"train_loss": -27.190372467041016, "global_step": 511051, "epoch": 6157} {"train_loss": -27.11964225769043, "global_step": 511052, "epoch": 6157} {"train_loss": -27.405609130859375, "global_step": 511053, "epoch": 6157} {"train_loss": -27.46026039123535, "global_step": 511054, "epoch": 6157} {"train_loss": -26.79450035095215, "global_step": 511055, "epoch": 6157} {"train_loss": -27.15509033203125, "global_step": 511056, "epoch": 6157} {"train_loss": -27.622251510620117, "global_step": 511057, "epoch": 6157} {"train_loss": -27.06562614440918, "global_step": 511058, "epoch": 6157} {"train_loss": -27.267202377319336, "global_step": 511059, "epoch": 6157} {"train_loss": -27.1602783203125, "global_step": 511060, "epoch": 6157} {"train_loss": -27.30548667907715, "global_step": 511061, "epoch": 6157} {"train_loss": -27.2119197845459, "global_step": 511062, "epoch": 6157} {"train_loss": -27.5706729888916, "global_step": 511063, "epoch": 6157} {"train_loss": -27.742572784423828, "global_step": 511064, "epoch": 6157} {"train_loss": -27.62044334411621, "global_step": 511065, "epoch": 6157} {"train_loss": -27.349170684814453, "global_step": 511066, "epoch": 6157} {"train_loss": -27.823989868164062, "global_step": 511067, "epoch": 6157} {"train_loss": -27.290441513061523, "global_step": 511068, "epoch": 6157} {"train_loss": -27.530065536499023, "global_step": 511069, "epoch": 6157} {"train_loss": -27.60715103149414, "global_step": 511070, "epoch": 6157} {"train_loss": -27.484704971313477, "global_step": 511071, "epoch": 6157} {"train_loss": -27.45012855529785, "global_step": 511072, "epoch": 6157} {"train_loss": -27.504535675048828, "global_step": 511073, "epoch": 6157} {"train_loss": -27.319425582885742, "global_step": 511074, "epoch": 6157} {"train_loss": -27.587177276611328, "global_step": 511075, "epoch": 6157} {"train_loss": -27.404178619384766, "global_step": 511076, "epoch": 6157} {"train_loss": -27.378498077392578, "global_step": 511077, "epoch": 6157} {"train_loss": -27.168920516967773, "global_step": 511078, "epoch": 6157} {"train_loss": -27.39515495300293, "global_step": 511079, "epoch": 6157} {"train_loss": -27.84992790222168, "global_step": 511080, "epoch": 6157} {"train_loss": -27.68218994140625, "global_step": 511081, "epoch": 6157} {"train_loss": -27.197280883789062, "global_step": 511082, "epoch": 6157} {"train_loss": -27.754199981689453, "global_step": 511083, "epoch": 6157} {"train_loss": -27.561315536499023, "global_step": 511084, "epoch": 6157} {"train_loss": -27.653888702392578, "global_step": 511085, "epoch": 6157} {"train_loss": -27.807600021362305, "global_step": 511086, "epoch": 6157} {"train_loss": -27.47210693359375, "global_step": 511087, "epoch": 6157} {"train_loss": -27.47942543029785, "global_step": 511088, "epoch": 6157} {"train_loss": -27.59065818786621, "global_step": 511089, "epoch": 6157} {"train_loss": -27.33021354675293, "global_step": 511090, "epoch": 6157} {"train_loss": -28.099292755126953, "global_step": 511091, "epoch": 6157} {"train_loss": -27.3564510345459, "global_step": 511092, "epoch": 6157} {"train_loss": -27.051849365234375, "global_step": 511093, "epoch": 6157} {"train_loss": -26.984634399414062, "global_step": 511094, "epoch": 6157} {"train_loss": -27.477981567382812, "global_step": 511095, "epoch": 6157} {"train_loss": -27.675445556640625, "global_step": 511096, "epoch": 6157} {"train_loss": -27.309375762939453, "global_step": 511097, "epoch": 6157} {"train_loss": -27.2321834564209, "global_step": 511098, "epoch": 6157} {"train_loss": -27.52825355529785, "global_step": 511099, "epoch": 6157} {"train_loss": -27.441761016845703, "global_step": 511100, "epoch": 6157} {"train_loss": -27.57488441467285, "global_step": 511101, "epoch": 6157} {"train_loss": -27.651416778564453, "global_step": 511102, "epoch": 6157} {"train_loss": -27.44740867614746, "global_step": 511103, "epoch": 6157} {"train_loss": -27.901153564453125, "global_step": 511104, "epoch": 6157} {"train_loss": -27.876388549804688, "global_step": 511105, "epoch": 6157} {"train_loss": -27.06241226196289, "global_step": 511106, "epoch": 6157} {"train_loss": -28.038848876953125, "global_step": 511107, "epoch": 6157} {"train_loss": -27.6903018951416, "global_step": 511108, "epoch": 6157} {"train_loss": -27.925073623657227, "global_step": 511109, "epoch": 6157} {"train_loss": -27.91169548034668, "global_step": 511110, "epoch": 6157} {"train_loss": -27.6641902923584, "global_step": 511111, "epoch": 6157} {"train_loss": -27.83363151550293, "global_step": 511112, "epoch": 6157} {"train_loss": -27.32006675076772, "global_step": 511113, "epoch": 6157, "val_loss": 6551958.0} {"train_loss": -26.2640323638916, "global_step": 511114, "epoch": 6158} {"train_loss": -26.24063491821289, "global_step": 511115, "epoch": 6158} {"train_loss": -26.485990524291992, "global_step": 511116, "epoch": 6158} {"train_loss": -26.18317222595215, "global_step": 511117, "epoch": 6158} {"train_loss": -26.455862045288086, "global_step": 511118, "epoch": 6158} {"train_loss": -26.477142333984375, "global_step": 511119, "epoch": 6158} {"train_loss": -26.38990592956543, "global_step": 511120, "epoch": 6158} {"train_loss": -26.850860595703125, "global_step": 511121, "epoch": 6158} {"train_loss": -26.56625747680664, "global_step": 511122, "epoch": 6158} {"train_loss": -26.985980987548828, "global_step": 511123, "epoch": 6158} {"train_loss": -26.890233993530273, "global_step": 511124, "epoch": 6158} {"train_loss": -27.06183433532715, "global_step": 511125, "epoch": 6158} {"train_loss": -27.01068687438965, "global_step": 511126, "epoch": 6158} {"train_loss": -27.312732696533203, "global_step": 511127, "epoch": 6158} {"train_loss": -27.047208786010742, "global_step": 511128, "epoch": 6158} {"train_loss": -27.145355224609375, "global_step": 511129, "epoch": 6158} {"train_loss": -27.24993896484375, "global_step": 511130, "epoch": 6158} {"train_loss": -27.209259033203125, "global_step": 511131, "epoch": 6158} {"train_loss": -27.534591674804688, "global_step": 511132, "epoch": 6158} {"train_loss": -27.25263786315918, "global_step": 511133, "epoch": 6158} {"train_loss": -27.250141143798828, "global_step": 511134, "epoch": 6158} {"train_loss": -26.979721069335938, "global_step": 511135, "epoch": 6158} {"train_loss": -27.259809494018555, "global_step": 511136, "epoch": 6158} {"train_loss": -27.103723526000977, "global_step": 511137, "epoch": 6158} {"train_loss": -27.7091064453125, "global_step": 511138, "epoch": 6158} {"train_loss": -27.33794593811035, "global_step": 511139, "epoch": 6158} {"train_loss": -27.412036895751953, "global_step": 511140, "epoch": 6158} {"train_loss": -27.172805786132812, "global_step": 511141, "epoch": 6158} {"train_loss": -27.27752685546875, "global_step": 511142, "epoch": 6158} {"train_loss": -27.429426193237305, "global_step": 511143, "epoch": 6158} {"train_loss": -27.03191566467285, "global_step": 511144, "epoch": 6158} {"train_loss": -27.611806869506836, "global_step": 511145, "epoch": 6158} {"train_loss": -27.598861694335938, "global_step": 511146, "epoch": 6158} {"train_loss": -27.327930450439453, "global_step": 511147, "epoch": 6158} {"train_loss": -27.62017822265625, "global_step": 511148, "epoch": 6158} {"train_loss": -27.80744743347168, "global_step": 511149, "epoch": 6158} {"train_loss": -27.288455963134766, "global_step": 511150, "epoch": 6158} {"train_loss": -27.660917282104492, "global_step": 511151, "epoch": 6158} {"train_loss": -27.457544326782227, "global_step": 511152, "epoch": 6158} {"train_loss": -27.618906021118164, "global_step": 511153, "epoch": 6158} {"train_loss": -26.91010856628418, "global_step": 511154, "epoch": 6158} {"train_loss": -27.603717803955078, "global_step": 511155, "epoch": 6158} {"train_loss": -27.387067794799805, "global_step": 511156, "epoch": 6158} {"train_loss": -27.57879066467285, "global_step": 511157, "epoch": 6158} {"train_loss": -27.92830467224121, "global_step": 511158, "epoch": 6158} {"train_loss": -27.68133544921875, "global_step": 511159, "epoch": 6158} {"train_loss": -27.38209342956543, "global_step": 511160, "epoch": 6158} {"train_loss": -27.60450553894043, "global_step": 511161, "epoch": 6158} {"train_loss": -27.477575302124023, "global_step": 511162, "epoch": 6158} {"train_loss": -27.68537712097168, "global_step": 511163, "epoch": 6158} {"train_loss": -27.38118553161621, "global_step": 511164, "epoch": 6158} {"train_loss": -27.1687068939209, "global_step": 511165, "epoch": 6158} {"train_loss": -27.495386123657227, "global_step": 511166, "epoch": 6158} {"train_loss": -27.45061683654785, "global_step": 511167, "epoch": 6158} {"train_loss": -27.850683212280273, "global_step": 511168, "epoch": 6158} {"train_loss": -27.62566566467285, "global_step": 511169, "epoch": 6158} {"train_loss": -27.400634765625, "global_step": 511170, "epoch": 6158} {"train_loss": -27.35984230041504, "global_step": 511171, "epoch": 6158} {"train_loss": -27.154081344604492, "global_step": 511172, "epoch": 6158} {"train_loss": -27.22979736328125, "global_step": 511173, "epoch": 6158} {"train_loss": -27.349292755126953, "global_step": 511174, "epoch": 6158} {"train_loss": -27.110010147094727, "global_step": 511175, "epoch": 6158} {"train_loss": -27.191192626953125, "global_step": 511176, "epoch": 6158} {"train_loss": -27.580631256103516, "global_step": 511177, "epoch": 6158} {"train_loss": -27.586408615112305, "global_step": 511178, "epoch": 6158} {"train_loss": -27.62098503112793, "global_step": 511179, "epoch": 6158} {"train_loss": -27.078872680664062, "global_step": 511180, "epoch": 6158} {"train_loss": -27.898639678955078, "global_step": 511181, "epoch": 6158} {"train_loss": -27.482650756835938, "global_step": 511182, "epoch": 6158} {"train_loss": -27.4376277923584, "global_step": 511183, "epoch": 6158} {"train_loss": -27.409595489501953, "global_step": 511184, "epoch": 6158} {"train_loss": -28.178686141967773, "global_step": 511185, "epoch": 6158} {"train_loss": -27.421253204345703, "global_step": 511186, "epoch": 6158} {"train_loss": -27.53205680847168, "global_step": 511187, "epoch": 6158} {"train_loss": -27.30877685546875, "global_step": 511188, "epoch": 6158} {"train_loss": -27.56081199645996, "global_step": 511189, "epoch": 6158} {"train_loss": -27.283233642578125, "global_step": 511190, "epoch": 6158} {"train_loss": -27.3448429107666, "global_step": 511191, "epoch": 6158} {"train_loss": -27.513776779174805, "global_step": 511192, "epoch": 6158} {"train_loss": -27.613712310791016, "global_step": 511193, "epoch": 6158} {"train_loss": -27.350284576416016, "global_step": 511194, "epoch": 6158} {"train_loss": -27.150440216064453, "global_step": 511195, "epoch": 6158} {"train_loss": -27.292730607182147, "global_step": 511196, "epoch": 6158, "val_loss": 6559459.0} {"train_loss": -26.828039169311523, "global_step": 511197, "epoch": 6159} {"train_loss": -27.048786163330078, "global_step": 511198, "epoch": 6159} {"train_loss": -26.85450553894043, "global_step": 511199, "epoch": 6159} {"train_loss": -27.3225040435791, "global_step": 511200, "epoch": 6159} {"train_loss": -26.9157772064209, "global_step": 511201, "epoch": 6159} {"train_loss": -27.248340606689453, "global_step": 511202, "epoch": 6159} {"train_loss": -26.658767700195312, "global_step": 511203, "epoch": 6159} {"train_loss": -27.49875831604004, "global_step": 511204, "epoch": 6159} {"train_loss": -27.486738204956055, "global_step": 511205, "epoch": 6159} {"train_loss": -27.023218154907227, "global_step": 511206, "epoch": 6159} {"train_loss": -27.249990463256836, "global_step": 511207, "epoch": 6159} {"train_loss": -27.245697021484375, "global_step": 511208, "epoch": 6159} {"train_loss": -27.210285186767578, "global_step": 511209, "epoch": 6159} {"train_loss": -26.91914176940918, "global_step": 511210, "epoch": 6159} {"train_loss": -27.09624671936035, "global_step": 511211, "epoch": 6159} {"train_loss": -27.30873680114746, "global_step": 511212, "epoch": 6159} {"train_loss": -27.011274337768555, "global_step": 511213, "epoch": 6159} {"train_loss": -27.244125366210938, "global_step": 511214, "epoch": 6159} {"train_loss": -27.160303115844727, "global_step": 511215, "epoch": 6159} {"train_loss": -27.088836669921875, "global_step": 511216, "epoch": 6159} {"train_loss": -27.048330307006836, "global_step": 511217, "epoch": 6159} {"train_loss": -27.514501571655273, "global_step": 511218, "epoch": 6159} {"train_loss": -27.287389755249023, "global_step": 511219, "epoch": 6159} {"train_loss": -27.59746742248535, "global_step": 511220, "epoch": 6159} {"train_loss": -27.593002319335938, "global_step": 511221, "epoch": 6159} {"train_loss": -27.60076904296875, "global_step": 511222, "epoch": 6159} {"train_loss": -27.4100284576416, "global_step": 511223, "epoch": 6159} {"train_loss": -27.012638092041016, "global_step": 511224, "epoch": 6159} {"train_loss": -27.378820419311523, "global_step": 511225, "epoch": 6159} {"train_loss": -27.101215362548828, "global_step": 511226, "epoch": 6159} {"train_loss": -27.529394149780273, "global_step": 511227, "epoch": 6159} {"train_loss": -27.0668888092041, "global_step": 511228, "epoch": 6159} {"train_loss": -27.383563995361328, "global_step": 511229, "epoch": 6159} {"train_loss": -27.16913414001465, "global_step": 511230, "epoch": 6159} {"train_loss": -27.287109375, "global_step": 511231, "epoch": 6159} {"train_loss": -27.566421508789062, "global_step": 511232, "epoch": 6159} {"train_loss": -27.291242599487305, "global_step": 511233, "epoch": 6159} {"train_loss": -27.287662506103516, "global_step": 511234, "epoch": 6159} {"train_loss": -27.64973258972168, "global_step": 511235, "epoch": 6159} {"train_loss": -27.756887435913086, "global_step": 511236, "epoch": 6159} {"train_loss": -27.1087703704834, "global_step": 511237, "epoch": 6159} {"train_loss": -27.877973556518555, "global_step": 511238, "epoch": 6159} {"train_loss": -27.360578536987305, "global_step": 511239, "epoch": 6159} {"train_loss": -27.185449600219727, "global_step": 511240, "epoch": 6159} {"train_loss": -27.57427978515625, "global_step": 511241, "epoch": 6159} {"train_loss": -27.48801040649414, "global_step": 511242, "epoch": 6159} {"train_loss": -27.254602432250977, "global_step": 511243, "epoch": 6159} {"train_loss": -26.87330436706543, "global_step": 511244, "epoch": 6159} {"train_loss": -27.49285888671875, "global_step": 511245, "epoch": 6159} {"train_loss": -27.693008422851562, "global_step": 511246, "epoch": 6159} {"train_loss": -27.77618980407715, "global_step": 511247, "epoch": 6159} {"train_loss": -27.569198608398438, "global_step": 511248, "epoch": 6159} {"train_loss": -27.80543327331543, "global_step": 511249, "epoch": 6159} {"train_loss": -27.665790557861328, "global_step": 511250, "epoch": 6159} {"train_loss": -27.6868839263916, "global_step": 511251, "epoch": 6159} {"train_loss": -27.855548858642578, "global_step": 511252, "epoch": 6159} {"train_loss": -27.57901954650879, "global_step": 511253, "epoch": 6159} {"train_loss": -27.665542602539062, "global_step": 511254, "epoch": 6159} {"train_loss": -27.716772079467773, "global_step": 511255, "epoch": 6159} {"train_loss": -27.5701847076416, "global_step": 511256, "epoch": 6159} {"train_loss": -27.681537628173828, "global_step": 511257, "epoch": 6159} {"train_loss": -27.723600387573242, "global_step": 511258, "epoch": 6159} {"train_loss": -27.769445419311523, "global_step": 511259, "epoch": 6159} {"train_loss": -27.43024253845215, "global_step": 511260, "epoch": 6159} {"train_loss": -28.042768478393555, "global_step": 511261, "epoch": 6159} {"train_loss": -27.599699020385742, "global_step": 511262, "epoch": 6159} {"train_loss": -27.577350616455078, "global_step": 511263, "epoch": 6159} {"train_loss": -27.8629093170166, "global_step": 511264, "epoch": 6159} {"train_loss": -26.935327529907227, "global_step": 511265, "epoch": 6159} {"train_loss": -26.55423927307129, "global_step": 511266, "epoch": 6159} {"train_loss": -26.9945068359375, "global_step": 511267, "epoch": 6159} {"train_loss": -27.143095016479492, "global_step": 511268, "epoch": 6159} {"train_loss": -27.125503540039062, "global_step": 511269, "epoch": 6159} {"train_loss": -27.395498275756836, "global_step": 511270, "epoch": 6159} {"train_loss": -27.539587020874023, "global_step": 511271, "epoch": 6159} {"train_loss": -27.706892013549805, "global_step": 511272, "epoch": 6159} {"train_loss": -27.460193634033203, "global_step": 511273, "epoch": 6159} {"train_loss": -27.418943405151367, "global_step": 511274, "epoch": 6159} {"train_loss": -27.92095947265625, "global_step": 511275, "epoch": 6159} {"train_loss": -27.189664840698242, "global_step": 511276, "epoch": 6159} {"train_loss": -27.447315216064453, "global_step": 511277, "epoch": 6159} {"train_loss": -27.39442253112793, "global_step": 511278, "epoch": 6159} {"train_loss": -27.361616019743035, "global_step": 511279, "epoch": 6159, "val_loss": 6574537.0} {"train_loss": -26.447980880737305, "global_step": 511280, "epoch": 6160} {"train_loss": -26.190967559814453, "global_step": 511281, "epoch": 6160} {"train_loss": -27.223047256469727, "global_step": 511282, "epoch": 6160} {"train_loss": -26.967334747314453, "global_step": 511283, "epoch": 6160} {"train_loss": -27.035465240478516, "global_step": 511284, "epoch": 6160} {"train_loss": -27.213459014892578, "global_step": 511285, "epoch": 6160} {"train_loss": -26.779699325561523, "global_step": 511286, "epoch": 6160} {"train_loss": -27.022428512573242, "global_step": 511287, "epoch": 6160} {"train_loss": -27.5275821685791, "global_step": 511288, "epoch": 6160} {"train_loss": -26.904417037963867, "global_step": 511289, "epoch": 6160} {"train_loss": -27.329919815063477, "global_step": 511290, "epoch": 6160} {"train_loss": -27.10617446899414, "global_step": 511291, "epoch": 6160} {"train_loss": -27.235187530517578, "global_step": 511292, "epoch": 6160} {"train_loss": -27.54669189453125, "global_step": 511293, "epoch": 6160} {"train_loss": -27.482772827148438, "global_step": 511294, "epoch": 6160} {"train_loss": -27.475555419921875, "global_step": 511295, "epoch": 6160} {"train_loss": -27.48847770690918, "global_step": 511296, "epoch": 6160} {"train_loss": -27.417627334594727, "global_step": 511297, "epoch": 6160} {"train_loss": -27.717870712280273, "global_step": 511298, "epoch": 6160} {"train_loss": -27.239049911499023, "global_step": 511299, "epoch": 6160} {"train_loss": -27.56537437438965, "global_step": 511300, "epoch": 6160} {"train_loss": -27.1173095703125, "global_step": 511301, "epoch": 6160} {"train_loss": -27.326725006103516, "global_step": 511302, "epoch": 6160} {"train_loss": -27.169876098632812, "global_step": 511303, "epoch": 6160} {"train_loss": -27.147113800048828, "global_step": 511304, "epoch": 6160} {"train_loss": -27.41582679748535, "global_step": 511305, "epoch": 6160} {"train_loss": -27.1604061126709, "global_step": 511306, "epoch": 6160} {"train_loss": -27.073627471923828, "global_step": 511307, "epoch": 6160} {"train_loss": -26.974185943603516, "global_step": 511308, "epoch": 6160} {"train_loss": -27.084043502807617, "global_step": 511309, "epoch": 6160} {"train_loss": -27.30518913269043, "global_step": 511310, "epoch": 6160} {"train_loss": -27.372406005859375, "global_step": 511311, "epoch": 6160} {"train_loss": -27.028955459594727, "global_step": 511312, "epoch": 6160} {"train_loss": -26.89580726623535, "global_step": 511313, "epoch": 6160} {"train_loss": -27.241565704345703, "global_step": 511314, "epoch": 6160} {"train_loss": -27.06317138671875, "global_step": 511315, "epoch": 6160} {"train_loss": -27.541418075561523, "global_step": 511316, "epoch": 6160} {"train_loss": -27.43780517578125, "global_step": 511317, "epoch": 6160} {"train_loss": -27.51911735534668, "global_step": 511318, "epoch": 6160} {"train_loss": -27.406835556030273, "global_step": 511319, "epoch": 6160} {"train_loss": -27.476560592651367, "global_step": 511320, "epoch": 6160} {"train_loss": -27.274967193603516, "global_step": 511321, "epoch": 6160} {"train_loss": -27.50478172302246, "global_step": 511322, "epoch": 6160} {"train_loss": -27.554523468017578, "global_step": 511323, "epoch": 6160} {"train_loss": -27.591049194335938, "global_step": 511324, "epoch": 6160} {"train_loss": -27.435972213745117, "global_step": 511325, "epoch": 6160} {"train_loss": -27.33367919921875, "global_step": 511326, "epoch": 6160} {"train_loss": -27.94125747680664, "global_step": 511327, "epoch": 6160} {"train_loss": -27.382251739501953, "global_step": 511328, "epoch": 6160} {"train_loss": -27.463098526000977, "global_step": 511329, "epoch": 6160} {"train_loss": -27.39801025390625, "global_step": 511330, "epoch": 6160} {"train_loss": -27.31622314453125, "global_step": 511331, "epoch": 6160} {"train_loss": -27.355484008789062, "global_step": 511332, "epoch": 6160} {"train_loss": -27.50348472595215, "global_step": 511333, "epoch": 6160} {"train_loss": -27.77667236328125, "global_step": 511334, "epoch": 6160} {"train_loss": -27.2570743560791, "global_step": 511335, "epoch": 6160} {"train_loss": -27.136869430541992, "global_step": 511336, "epoch": 6160} {"train_loss": -27.35560417175293, "global_step": 511337, "epoch": 6160} {"train_loss": -27.519071578979492, "global_step": 511338, "epoch": 6160} {"train_loss": -27.571866989135742, "global_step": 511339, "epoch": 6160} {"train_loss": -27.549457550048828, "global_step": 511340, "epoch": 6160} {"train_loss": -27.417844772338867, "global_step": 511341, "epoch": 6160} {"train_loss": -27.31060218811035, "global_step": 511342, "epoch": 6160} {"train_loss": -27.602033615112305, "global_step": 511343, "epoch": 6160} {"train_loss": -27.683624267578125, "global_step": 511344, "epoch": 6160} {"train_loss": -27.486026763916016, "global_step": 511345, "epoch": 6160} {"train_loss": -28.01734733581543, "global_step": 511346, "epoch": 6160} {"train_loss": -27.886123657226562, "global_step": 511347, "epoch": 6160} {"train_loss": -27.5577335357666, "global_step": 511348, "epoch": 6160} {"train_loss": -27.251331329345703, "global_step": 511349, "epoch": 6160} {"train_loss": -27.516138076782227, "global_step": 511350, "epoch": 6160} {"train_loss": -27.467370986938477, "global_step": 511351, "epoch": 6160} {"train_loss": -27.4912109375, "global_step": 511352, "epoch": 6160} {"train_loss": -27.6295108795166, "global_step": 511353, "epoch": 6160} {"train_loss": -27.411544799804688, "global_step": 511354, "epoch": 6160} {"train_loss": -27.878406524658203, "global_step": 511355, "epoch": 6160} {"train_loss": -27.78017234802246, "global_step": 511356, "epoch": 6160} {"train_loss": -27.71265983581543, "global_step": 511357, "epoch": 6160} {"train_loss": -27.7462158203125, "global_step": 511358, "epoch": 6160} {"train_loss": -27.888410568237305, "global_step": 511359, "epoch": 6160} {"train_loss": -27.80695915222168, "global_step": 511360, "epoch": 6160} {"train_loss": -27.636892318725586, "global_step": 511361, "epoch": 6160} {"train_loss": -27.379771703697113, "global_step": 511362, "epoch": 6160, "val_loss": 6620059.0} {"train_loss": -26.914020538330078, "global_step": 511363, "epoch": 6161} {"train_loss": -27.032384872436523, "global_step": 511364, "epoch": 6161} {"train_loss": -27.00343132019043, "global_step": 511365, "epoch": 6161} {"train_loss": -26.835041046142578, "global_step": 511366, "epoch": 6161} {"train_loss": -26.876331329345703, "global_step": 511367, "epoch": 6161} {"train_loss": -26.3565673828125, "global_step": 511368, "epoch": 6161} {"train_loss": -27.182401657104492, "global_step": 511369, "epoch": 6161} {"train_loss": -26.484521865844727, "global_step": 511370, "epoch": 6161} {"train_loss": -26.900259017944336, "global_step": 511371, "epoch": 6161} {"train_loss": -26.5854434967041, "global_step": 511372, "epoch": 6161} {"train_loss": -27.46815299987793, "global_step": 511373, "epoch": 6161} {"train_loss": -26.977466583251953, "global_step": 511374, "epoch": 6161} {"train_loss": -26.94341468811035, "global_step": 511375, "epoch": 6161} {"train_loss": -27.177412033081055, "global_step": 511376, "epoch": 6161} {"train_loss": -27.240949630737305, "global_step": 511377, "epoch": 6161} {"train_loss": -27.144174575805664, "global_step": 511378, "epoch": 6161} {"train_loss": -27.292993545532227, "global_step": 511379, "epoch": 6161} {"train_loss": -27.0624942779541, "global_step": 511380, "epoch": 6161} {"train_loss": -27.21512794494629, "global_step": 511381, "epoch": 6161} {"train_loss": -27.26141929626465, "global_step": 511382, "epoch": 6161} {"train_loss": -27.405426025390625, "global_step": 511383, "epoch": 6161} {"train_loss": -27.295133590698242, "global_step": 511384, "epoch": 6161} {"train_loss": -27.126989364624023, "global_step": 511385, "epoch": 6161} {"train_loss": -27.279752731323242, "global_step": 511386, "epoch": 6161} {"train_loss": -27.41094970703125, "global_step": 511387, "epoch": 6161} {"train_loss": -27.805465698242188, "global_step": 511388, "epoch": 6161} {"train_loss": -27.412952423095703, "global_step": 511389, "epoch": 6161} {"train_loss": -27.610605239868164, "global_step": 511390, "epoch": 6161} {"train_loss": -27.48282241821289, "global_step": 511391, "epoch": 6161} {"train_loss": -27.320148468017578, "global_step": 511392, "epoch": 6161} {"train_loss": -26.8078670501709, "global_step": 511393, "epoch": 6161} {"train_loss": -26.846784591674805, "global_step": 511394, "epoch": 6161} {"train_loss": -26.768888473510742, "global_step": 511395, "epoch": 6161} {"train_loss": -27.340417861938477, "global_step": 511396, "epoch": 6161} {"train_loss": -26.636098861694336, "global_step": 511397, "epoch": 6161} {"train_loss": -26.537235260009766, "global_step": 511398, "epoch": 6161} {"train_loss": -27.455968856811523, "global_step": 511399, "epoch": 6161} {"train_loss": -26.540756225585938, "global_step": 511400, "epoch": 6161} {"train_loss": -27.253976821899414, "global_step": 511401, "epoch": 6161} {"train_loss": -27.32451820373535, "global_step": 511402, "epoch": 6161} {"train_loss": -26.852783203125, "global_step": 511403, "epoch": 6161} {"train_loss": -27.365453720092773, "global_step": 511404, "epoch": 6161} {"train_loss": -26.99665641784668, "global_step": 511405, "epoch": 6161} {"train_loss": -27.456995010375977, "global_step": 511406, "epoch": 6161} {"train_loss": -27.119726181030273, "global_step": 511407, "epoch": 6161} {"train_loss": -27.494604110717773, "global_step": 511408, "epoch": 6161} {"train_loss": -27.078006744384766, "global_step": 511409, "epoch": 6161} {"train_loss": -27.3055477142334, "global_step": 511410, "epoch": 6161} {"train_loss": -27.25949478149414, "global_step": 511411, "epoch": 6161} {"train_loss": -27.227079391479492, "global_step": 511412, "epoch": 6161} {"train_loss": -27.264265060424805, "global_step": 511413, "epoch": 6161} {"train_loss": -27.2576847076416, "global_step": 511414, "epoch": 6161} {"train_loss": -27.16462516784668, "global_step": 511415, "epoch": 6161} {"train_loss": -27.183679580688477, "global_step": 511416, "epoch": 6161} {"train_loss": -27.507619857788086, "global_step": 511417, "epoch": 6161} {"train_loss": -27.500720977783203, "global_step": 511418, "epoch": 6161} {"train_loss": -27.64906120300293, "global_step": 511419, "epoch": 6161} {"train_loss": -27.371423721313477, "global_step": 511420, "epoch": 6161} {"train_loss": -27.34051513671875, "global_step": 511421, "epoch": 6161} {"train_loss": -27.52559471130371, "global_step": 511422, "epoch": 6161} {"train_loss": -27.521255493164062, "global_step": 511423, "epoch": 6161} {"train_loss": -27.504138946533203, "global_step": 511424, "epoch": 6161} {"train_loss": -27.227792739868164, "global_step": 511425, "epoch": 6161} {"train_loss": -27.7694149017334, "global_step": 511426, "epoch": 6161} {"train_loss": -27.530414581298828, "global_step": 511427, "epoch": 6161} {"train_loss": -27.673812866210938, "global_step": 511428, "epoch": 6161} {"train_loss": -27.754369735717773, "global_step": 511429, "epoch": 6161} {"train_loss": -27.670385360717773, "global_step": 511430, "epoch": 6161} {"train_loss": -27.360647201538086, "global_step": 511431, "epoch": 6161} {"train_loss": -27.721494674682617, "global_step": 511432, "epoch": 6161} {"train_loss": -27.860776901245117, "global_step": 511433, "epoch": 6161} {"train_loss": -27.47562599182129, "global_step": 511434, "epoch": 6161} {"train_loss": -27.736927032470703, "global_step": 511435, "epoch": 6161} {"train_loss": -27.618513107299805, "global_step": 511436, "epoch": 6161} {"train_loss": -27.5239315032959, "global_step": 511437, "epoch": 6161} {"train_loss": -27.748950958251953, "global_step": 511438, "epoch": 6161} {"train_loss": -27.605915069580078, "global_step": 511439, "epoch": 6161} {"train_loss": -27.683338165283203, "global_step": 511440, "epoch": 6161} {"train_loss": -27.331518173217773, "global_step": 511441, "epoch": 6161} {"train_loss": -27.583362579345703, "global_step": 511442, "epoch": 6161} {"train_loss": -27.89655113220215, "global_step": 511443, "epoch": 6161} {"train_loss": -27.98597526550293, "global_step": 511444, "epoch": 6161} {"train_loss": -27.28241952643337, "global_step": 511445, "epoch": 6161, "val_loss": 6541858.0} {"train_loss": -27.213748931884766, "global_step": 511446, "epoch": 6162} {"train_loss": -27.128055572509766, "global_step": 511447, "epoch": 6162} {"train_loss": -26.90113639831543, "global_step": 511448, "epoch": 6162} {"train_loss": -26.804311752319336, "global_step": 511449, "epoch": 6162} {"train_loss": -26.6512393951416, "global_step": 511450, "epoch": 6162} {"train_loss": -26.718358993530273, "global_step": 511451, "epoch": 6162} {"train_loss": -26.953048706054688, "global_step": 511452, "epoch": 6162} {"train_loss": -27.1107234954834, "global_step": 511453, "epoch": 6162} {"train_loss": -27.1165828704834, "global_step": 511454, "epoch": 6162} {"train_loss": -27.05224609375, "global_step": 511455, "epoch": 6162} {"train_loss": -26.86280632019043, "global_step": 511456, "epoch": 6162} {"train_loss": -27.567007064819336, "global_step": 511457, "epoch": 6162} {"train_loss": -27.091108322143555, "global_step": 511458, "epoch": 6162} {"train_loss": -26.977567672729492, "global_step": 511459, "epoch": 6162} {"train_loss": -27.330480575561523, "global_step": 511460, "epoch": 6162} {"train_loss": -27.04630470275879, "global_step": 511461, "epoch": 6162} {"train_loss": -27.122211456298828, "global_step": 511462, "epoch": 6162} {"train_loss": -27.49271583557129, "global_step": 511463, "epoch": 6162} {"train_loss": -27.242528915405273, "global_step": 511464, "epoch": 6162} {"train_loss": -26.931976318359375, "global_step": 511465, "epoch": 6162} {"train_loss": -27.082937240600586, "global_step": 511466, "epoch": 6162} {"train_loss": -26.9808406829834, "global_step": 511467, "epoch": 6162} {"train_loss": -27.248214721679688, "global_step": 511468, "epoch": 6162} {"train_loss": -27.775482177734375, "global_step": 511469, "epoch": 6162} {"train_loss": -27.302127838134766, "global_step": 511470, "epoch": 6162} {"train_loss": -26.90705680847168, "global_step": 511471, "epoch": 6162} {"train_loss": -27.1679630279541, "global_step": 511472, "epoch": 6162} {"train_loss": -27.10540199279785, "global_step": 511473, "epoch": 6162} {"train_loss": -27.4638729095459, "global_step": 511474, "epoch": 6162} {"train_loss": -27.34779930114746, "global_step": 511475, "epoch": 6162} {"train_loss": -27.373762130737305, "global_step": 511476, "epoch": 6162} {"train_loss": -27.522729873657227, "global_step": 511477, "epoch": 6162} {"train_loss": -27.100202560424805, "global_step": 511478, "epoch": 6162} {"train_loss": -27.114002227783203, "global_step": 511479, "epoch": 6162} {"train_loss": -27.380298614501953, "global_step": 511480, "epoch": 6162} {"train_loss": -27.374866485595703, "global_step": 511481, "epoch": 6162} {"train_loss": -27.41397476196289, "global_step": 511482, "epoch": 6162} {"train_loss": -27.151050567626953, "global_step": 511483, "epoch": 6162} {"train_loss": -27.377344131469727, "global_step": 511484, "epoch": 6162} {"train_loss": -27.424026489257812, "global_step": 511485, "epoch": 6162} {"train_loss": -27.681177139282227, "global_step": 511486, "epoch": 6162} {"train_loss": -27.55914306640625, "global_step": 511487, "epoch": 6162} {"train_loss": -27.510211944580078, "global_step": 511488, "epoch": 6162} {"train_loss": -27.543195724487305, "global_step": 511489, "epoch": 6162} {"train_loss": -27.21882438659668, "global_step": 511490, "epoch": 6162} {"train_loss": -27.45208168029785, "global_step": 511491, "epoch": 6162} {"train_loss": -27.390899658203125, "global_step": 511492, "epoch": 6162} {"train_loss": -27.606351852416992, "global_step": 511493, "epoch": 6162} {"train_loss": -27.370283126831055, "global_step": 511494, "epoch": 6162} {"train_loss": -27.581327438354492, "global_step": 511495, "epoch": 6162} {"train_loss": -27.270795822143555, "global_step": 511496, "epoch": 6162} {"train_loss": -27.561914443969727, "global_step": 511497, "epoch": 6162} {"train_loss": -27.15234375, "global_step": 511498, "epoch": 6162} {"train_loss": -27.406232833862305, "global_step": 511499, "epoch": 6162} {"train_loss": -27.889163970947266, "global_step": 511500, "epoch": 6162} {"train_loss": -27.435606002807617, "global_step": 511501, "epoch": 6162} {"train_loss": -27.72416114807129, "global_step": 511502, "epoch": 6162} {"train_loss": -27.52423095703125, "global_step": 511503, "epoch": 6162} {"train_loss": -27.591266632080078, "global_step": 511504, "epoch": 6162} {"train_loss": -27.33465576171875, "global_step": 511505, "epoch": 6162} {"train_loss": -27.578521728515625, "global_step": 511506, "epoch": 6162} {"train_loss": -27.92426872253418, "global_step": 511507, "epoch": 6162} {"train_loss": -27.72028923034668, "global_step": 511508, "epoch": 6162} {"train_loss": -27.1621150970459, "global_step": 511509, "epoch": 6162} {"train_loss": -27.209964752197266, "global_step": 511510, "epoch": 6162} {"train_loss": -27.78485679626465, "global_step": 511511, "epoch": 6162} {"train_loss": -27.66187858581543, "global_step": 511512, "epoch": 6162} {"train_loss": -27.39850425720215, "global_step": 511513, "epoch": 6162} {"train_loss": -27.692584991455078, "global_step": 511514, "epoch": 6162} {"train_loss": -26.96071434020996, "global_step": 511515, "epoch": 6162} {"train_loss": -27.354455947875977, "global_step": 511516, "epoch": 6162} {"train_loss": -27.44099235534668, "global_step": 511517, "epoch": 6162} {"train_loss": -27.441715240478516, "global_step": 511518, "epoch": 6162} {"train_loss": -27.1202449798584, "global_step": 511519, "epoch": 6162} {"train_loss": -27.261117935180664, "global_step": 511520, "epoch": 6162} {"train_loss": -27.3863582611084, "global_step": 511521, "epoch": 6162} {"train_loss": -27.661640167236328, "global_step": 511522, "epoch": 6162} {"train_loss": -27.423095703125, "global_step": 511523, "epoch": 6162} {"train_loss": -27.8875675201416, "global_step": 511524, "epoch": 6162} {"train_loss": -27.734582901000977, "global_step": 511525, "epoch": 6162} {"train_loss": -27.556201934814453, "global_step": 511526, "epoch": 6162} {"train_loss": -27.723058700561523, "global_step": 511527, "epoch": 6162} {"train_loss": -27.33136002414198, "global_step": 511528, "epoch": 6162, "val_loss": 6587076.0} {"train_loss": -26.775836944580078, "global_step": 511529, "epoch": 6163} {"train_loss": -26.898168563842773, "global_step": 511530, "epoch": 6163} {"train_loss": -26.926721572875977, "global_step": 511531, "epoch": 6163} {"train_loss": -27.083744049072266, "global_step": 511532, "epoch": 6163} {"train_loss": -27.176095962524414, "global_step": 511533, "epoch": 6163} {"train_loss": -27.118885040283203, "global_step": 511534, "epoch": 6163} {"train_loss": -26.660043716430664, "global_step": 511535, "epoch": 6163} {"train_loss": -27.035245895385742, "global_step": 511536, "epoch": 6163} {"train_loss": -27.003253936767578, "global_step": 511537, "epoch": 6163} {"train_loss": -26.796253204345703, "global_step": 511538, "epoch": 6163} {"train_loss": -27.016895294189453, "global_step": 511539, "epoch": 6163} {"train_loss": -26.680856704711914, "global_step": 511540, "epoch": 6163} {"train_loss": -26.83487892150879, "global_step": 511541, "epoch": 6163} {"train_loss": -26.4310302734375, "global_step": 511542, "epoch": 6163} {"train_loss": -27.367324829101562, "global_step": 511543, "epoch": 6163} {"train_loss": -26.851526260375977, "global_step": 511544, "epoch": 6163} {"train_loss": -26.917144775390625, "global_step": 511545, "epoch": 6163} {"train_loss": -27.07502555847168, "global_step": 511546, "epoch": 6163} {"train_loss": -26.802534103393555, "global_step": 511547, "epoch": 6163} {"train_loss": -27.27686882019043, "global_step": 511548, "epoch": 6163} {"train_loss": -26.962793350219727, "global_step": 511549, "epoch": 6163} {"train_loss": -27.11091423034668, "global_step": 511550, "epoch": 6163} {"train_loss": -27.001840591430664, "global_step": 511551, "epoch": 6163} {"train_loss": -26.958524703979492, "global_step": 511552, "epoch": 6163} {"train_loss": -27.08270263671875, "global_step": 511553, "epoch": 6163} {"train_loss": -27.03311538696289, "global_step": 511554, "epoch": 6163} {"train_loss": -27.260833740234375, "global_step": 511555, "epoch": 6163} {"train_loss": -27.2971248626709, "global_step": 511556, "epoch": 6163} {"train_loss": -27.27544593811035, "global_step": 511557, "epoch": 6163} {"train_loss": -27.284072875976562, "global_step": 511558, "epoch": 6163} {"train_loss": -27.539106369018555, "global_step": 511559, "epoch": 6163} {"train_loss": -27.248891830444336, "global_step": 511560, "epoch": 6163} {"train_loss": -27.35914421081543, "global_step": 511561, "epoch": 6163} {"train_loss": -27.282636642456055, "global_step": 511562, "epoch": 6163} {"train_loss": -27.55072021484375, "global_step": 511563, "epoch": 6163} {"train_loss": -27.285043716430664, "global_step": 511564, "epoch": 6163} {"train_loss": -26.60481071472168, "global_step": 511565, "epoch": 6163} {"train_loss": -27.04054832458496, "global_step": 511566, "epoch": 6163} {"train_loss": -27.586820602416992, "global_step": 511567, "epoch": 6163} {"train_loss": -27.195484161376953, "global_step": 511568, "epoch": 6163} {"train_loss": -27.542083740234375, "global_step": 511569, "epoch": 6163} {"train_loss": -27.252832412719727, "global_step": 511570, "epoch": 6163} {"train_loss": -27.10736656188965, "global_step": 511571, "epoch": 6163} {"train_loss": -27.24311637878418, "global_step": 511572, "epoch": 6163} {"train_loss": -27.336801528930664, "global_step": 511573, "epoch": 6163} {"train_loss": -27.366926193237305, "global_step": 511574, "epoch": 6163} {"train_loss": -27.005475997924805, "global_step": 511575, "epoch": 6163} {"train_loss": -27.486682891845703, "global_step": 511576, "epoch": 6163} {"train_loss": -27.54052734375, "global_step": 511577, "epoch": 6163} {"train_loss": -27.38638687133789, "global_step": 511578, "epoch": 6163} {"train_loss": -27.491132736206055, "global_step": 511579, "epoch": 6163} {"train_loss": -27.6556339263916, "global_step": 511580, "epoch": 6163} {"train_loss": -27.850378036499023, "global_step": 511581, "epoch": 6163} {"train_loss": -27.59649085998535, "global_step": 511582, "epoch": 6163} {"train_loss": -27.506744384765625, "global_step": 511583, "epoch": 6163} {"train_loss": -27.591781616210938, "global_step": 511584, "epoch": 6163} {"train_loss": -27.6693058013916, "global_step": 511585, "epoch": 6163} {"train_loss": -27.298215866088867, "global_step": 511586, "epoch": 6163} {"train_loss": -27.60455322265625, "global_step": 511587, "epoch": 6163} {"train_loss": -27.660797119140625, "global_step": 511588, "epoch": 6163} {"train_loss": -27.383987426757812, "global_step": 511589, "epoch": 6163} {"train_loss": -27.466400146484375, "global_step": 511590, "epoch": 6163} {"train_loss": -27.509790420532227, "global_step": 511591, "epoch": 6163} {"train_loss": -27.990386962890625, "global_step": 511592, "epoch": 6163} {"train_loss": -27.32000732421875, "global_step": 511593, "epoch": 6163} {"train_loss": -27.27886390686035, "global_step": 511594, "epoch": 6163} {"train_loss": -27.536603927612305, "global_step": 511595, "epoch": 6163} {"train_loss": -27.42835807800293, "global_step": 511596, "epoch": 6163} {"train_loss": -28.25554847717285, "global_step": 511597, "epoch": 6163} {"train_loss": -27.493459701538086, "global_step": 511598, "epoch": 6163} {"train_loss": -27.643970489501953, "global_step": 511599, "epoch": 6163} {"train_loss": -27.373029708862305, "global_step": 511600, "epoch": 6163} {"train_loss": -27.35968589782715, "global_step": 511601, "epoch": 6163} {"train_loss": -27.223875045776367, "global_step": 511602, "epoch": 6163} {"train_loss": -26.754972457885742, "global_step": 511603, "epoch": 6163} {"train_loss": -26.001693725585938, "global_step": 511604, "epoch": 6163} {"train_loss": -27.204883575439453, "global_step": 511605, "epoch": 6163} {"train_loss": -27.529556274414062, "global_step": 511606, "epoch": 6163} {"train_loss": -26.82271385192871, "global_step": 511607, "epoch": 6163} {"train_loss": -27.31245231628418, "global_step": 511608, "epoch": 6163} {"train_loss": -27.13983154296875, "global_step": 511609, "epoch": 6163} {"train_loss": -27.034772872924805, "global_step": 511610, "epoch": 6163} {"train_loss": -27.227664671748517, "global_step": 511611, "epoch": 6163, "val_loss": 6576245.0} {"train_loss": -27.402912139892578, "global_step": 511612, "epoch": 6164} {"train_loss": -27.059310913085938, "global_step": 511613, "epoch": 6164} {"train_loss": -27.069265365600586, "global_step": 511614, "epoch": 6164} {"train_loss": -27.566999435424805, "global_step": 511615, "epoch": 6164} {"train_loss": -27.083560943603516, "global_step": 511616, "epoch": 6164} {"train_loss": -26.80971336364746, "global_step": 511617, "epoch": 6164} {"train_loss": -27.15824317932129, "global_step": 511618, "epoch": 6164} {"train_loss": -27.24696159362793, "global_step": 511619, "epoch": 6164} {"train_loss": -27.591354370117188, "global_step": 511620, "epoch": 6164} {"train_loss": -27.457120895385742, "global_step": 511621, "epoch": 6164} {"train_loss": -27.390893936157227, "global_step": 511622, "epoch": 6164} {"train_loss": -27.50605583190918, "global_step": 511623, "epoch": 6164} {"train_loss": -27.179174423217773, "global_step": 511624, "epoch": 6164} {"train_loss": -27.45206642150879, "global_step": 511625, "epoch": 6164} {"train_loss": -27.441877365112305, "global_step": 511626, "epoch": 6164} {"train_loss": -27.346609115600586, "global_step": 511627, "epoch": 6164} {"train_loss": -27.38689613342285, "global_step": 511628, "epoch": 6164} {"train_loss": -27.679174423217773, "global_step": 511629, "epoch": 6164} {"train_loss": -27.841333389282227, "global_step": 511630, "epoch": 6164} {"train_loss": -27.5476016998291, "global_step": 511631, "epoch": 6164} {"train_loss": -27.737340927124023, "global_step": 511632, "epoch": 6164} {"train_loss": -27.498289108276367, "global_step": 511633, "epoch": 6164} {"train_loss": -27.5308837890625, "global_step": 511634, "epoch": 6164} {"train_loss": -27.40177345275879, "global_step": 511635, "epoch": 6164} {"train_loss": -27.790800094604492, "global_step": 511636, "epoch": 6164} {"train_loss": -27.685827255249023, "global_step": 511637, "epoch": 6164} {"train_loss": -27.622594833374023, "global_step": 511638, "epoch": 6164} {"train_loss": -27.593503952026367, "global_step": 511639, "epoch": 6164} {"train_loss": -27.445514678955078, "global_step": 511640, "epoch": 6164} {"train_loss": -27.997608184814453, "global_step": 511641, "epoch": 6164} {"train_loss": -27.546125411987305, "global_step": 511642, "epoch": 6164} {"train_loss": -27.424835205078125, "global_step": 511643, "epoch": 6164} {"train_loss": -27.58497428894043, "global_step": 511644, "epoch": 6164} {"train_loss": -27.613529205322266, "global_step": 511645, "epoch": 6164} {"train_loss": -27.52197265625, "global_step": 511646, "epoch": 6164} {"train_loss": -27.662494659423828, "global_step": 511647, "epoch": 6164} {"train_loss": -27.493406295776367, "global_step": 511648, "epoch": 6164} {"train_loss": -27.39759635925293, "global_step": 511649, "epoch": 6164} {"train_loss": -27.20731544494629, "global_step": 511650, "epoch": 6164} {"train_loss": -27.39312744140625, "global_step": 511651, "epoch": 6164} {"train_loss": -27.79304313659668, "global_step": 511652, "epoch": 6164} {"train_loss": -27.536890029907227, "global_step": 511653, "epoch": 6164} {"train_loss": -27.527698516845703, "global_step": 511654, "epoch": 6164} {"train_loss": -27.56829833984375, "global_step": 511655, "epoch": 6164} {"train_loss": -27.440587997436523, "global_step": 511656, "epoch": 6164} {"train_loss": -27.666641235351562, "global_step": 511657, "epoch": 6164} {"train_loss": -27.94264030456543, "global_step": 511658, "epoch": 6164} {"train_loss": -27.648151397705078, "global_step": 511659, "epoch": 6164} {"train_loss": -27.398584365844727, "global_step": 511660, "epoch": 6164} {"train_loss": -27.695234298706055, "global_step": 511661, "epoch": 6164} {"train_loss": -28.025381088256836, "global_step": 511662, "epoch": 6164} {"train_loss": -28.199188232421875, "global_step": 511663, "epoch": 6164} {"train_loss": -27.186695098876953, "global_step": 511664, "epoch": 6164} {"train_loss": -27.7919921875, "global_step": 511665, "epoch": 6164} {"train_loss": -27.688100814819336, "global_step": 511666, "epoch": 6164} {"train_loss": -27.871286392211914, "global_step": 511667, "epoch": 6164} {"train_loss": -27.653854370117188, "global_step": 511668, "epoch": 6164} {"train_loss": -27.46122169494629, "global_step": 511669, "epoch": 6164} {"train_loss": -27.515329360961914, "global_step": 511670, "epoch": 6164} {"train_loss": -27.584802627563477, "global_step": 511671, "epoch": 6164} {"train_loss": -27.641599655151367, "global_step": 511672, "epoch": 6164} {"train_loss": -27.561126708984375, "global_step": 511673, "epoch": 6164} {"train_loss": -26.91334342956543, "global_step": 511674, "epoch": 6164} {"train_loss": -27.280359268188477, "global_step": 511675, "epoch": 6164} {"train_loss": -27.690311431884766, "global_step": 511676, "epoch": 6164} {"train_loss": -27.347314834594727, "global_step": 511677, "epoch": 6164} {"train_loss": -27.82220458984375, "global_step": 511678, "epoch": 6164} {"train_loss": -27.79575538635254, "global_step": 511679, "epoch": 6164} {"train_loss": -27.680261611938477, "global_step": 511680, "epoch": 6164} {"train_loss": -27.642892837524414, "global_step": 511681, "epoch": 6164} {"train_loss": -27.663663864135742, "global_step": 511682, "epoch": 6164} {"train_loss": -27.508193969726562, "global_step": 511683, "epoch": 6164} {"train_loss": -27.430225372314453, "global_step": 511684, "epoch": 6164} {"train_loss": -27.6019229888916, "global_step": 511685, "epoch": 6164} {"train_loss": -27.465673446655273, "global_step": 511686, "epoch": 6164} {"train_loss": -27.95562744140625, "global_step": 511687, "epoch": 6164} {"train_loss": -27.115304946899414, "global_step": 511688, "epoch": 6164} {"train_loss": -27.695486068725586, "global_step": 511689, "epoch": 6164} {"train_loss": -27.293615341186523, "global_step": 511690, "epoch": 6164} {"train_loss": -27.36121940612793, "global_step": 511691, "epoch": 6164} {"train_loss": -27.206506729125977, "global_step": 511692, "epoch": 6164} {"train_loss": -26.94772720336914, "global_step": 511693, "epoch": 6164} {"train_loss": -27.51106374809541, "global_step": 511694, "epoch": 6164, "val_loss": 6647651.0} {"train_loss": -26.943342208862305, "global_step": 511695, "epoch": 6165} {"train_loss": -26.658935546875, "global_step": 511696, "epoch": 6165} {"train_loss": -26.597553253173828, "global_step": 511697, "epoch": 6165} {"train_loss": -26.635786056518555, "global_step": 511698, "epoch": 6165} {"train_loss": -26.12757682800293, "global_step": 511699, "epoch": 6165} {"train_loss": -26.23127555847168, "global_step": 511700, "epoch": 6165} {"train_loss": -26.692676544189453, "global_step": 511701, "epoch": 6165} {"train_loss": -26.47974967956543, "global_step": 511702, "epoch": 6165} {"train_loss": -26.46302604675293, "global_step": 511703, "epoch": 6165} {"train_loss": -26.504362106323242, "global_step": 511704, "epoch": 6165} {"train_loss": -26.184619903564453, "global_step": 511705, "epoch": 6165} {"train_loss": -26.5512752532959, "global_step": 511706, "epoch": 6165} {"train_loss": -27.2347412109375, "global_step": 511707, "epoch": 6165} {"train_loss": -26.68623161315918, "global_step": 511708, "epoch": 6165} {"train_loss": -26.825428009033203, "global_step": 511709, "epoch": 6165} {"train_loss": -26.883996963500977, "global_step": 511710, "epoch": 6165} {"train_loss": -27.104084014892578, "global_step": 511711, "epoch": 6165} {"train_loss": -26.794586181640625, "global_step": 511712, "epoch": 6165} {"train_loss": -27.359949111938477, "global_step": 511713, "epoch": 6165} {"train_loss": -27.033178329467773, "global_step": 511714, "epoch": 6165} {"train_loss": -27.288053512573242, "global_step": 511715, "epoch": 6165} {"train_loss": -27.246479034423828, "global_step": 511716, "epoch": 6165} {"train_loss": -27.332895278930664, "global_step": 511717, "epoch": 6165} {"train_loss": -27.07730484008789, "global_step": 511718, "epoch": 6165} {"train_loss": -27.120941162109375, "global_step": 511719, "epoch": 6165} {"train_loss": -27.253437042236328, "global_step": 511720, "epoch": 6165} {"train_loss": -27.256284713745117, "global_step": 511721, "epoch": 6165} {"train_loss": -27.36270523071289, "global_step": 511722, "epoch": 6165} {"train_loss": -27.15460205078125, "global_step": 511723, "epoch": 6165} {"train_loss": -27.578439712524414, "global_step": 511724, "epoch": 6165} {"train_loss": -26.8619327545166, "global_step": 511725, "epoch": 6165} {"train_loss": -27.1093807220459, "global_step": 511726, "epoch": 6165} {"train_loss": -26.970182418823242, "global_step": 511727, "epoch": 6165} {"train_loss": -27.503223419189453, "global_step": 511728, "epoch": 6165} {"train_loss": -27.501184463500977, "global_step": 511729, "epoch": 6165} {"train_loss": -26.894433975219727, "global_step": 511730, "epoch": 6165} {"train_loss": -27.512317657470703, "global_step": 511731, "epoch": 6165} {"train_loss": -27.768192291259766, "global_step": 511732, "epoch": 6165} {"train_loss": -26.960235595703125, "global_step": 511733, "epoch": 6165} {"train_loss": -27.561649322509766, "global_step": 511734, "epoch": 6165} {"train_loss": -27.254043579101562, "global_step": 511735, "epoch": 6165} {"train_loss": -27.581924438476562, "global_step": 511736, "epoch": 6165} {"train_loss": -27.606908798217773, "global_step": 511737, "epoch": 6165} {"train_loss": -27.58637809753418, "global_step": 511738, "epoch": 6165} {"train_loss": -27.419477462768555, "global_step": 511739, "epoch": 6165} {"train_loss": -27.297826766967773, "global_step": 511740, "epoch": 6165} {"train_loss": -27.449060440063477, "global_step": 511741, "epoch": 6165} {"train_loss": -27.522418975830078, "global_step": 511742, "epoch": 6165} {"train_loss": -27.712621688842773, "global_step": 511743, "epoch": 6165} {"train_loss": -27.47075843811035, "global_step": 511744, "epoch": 6165} {"train_loss": -27.503711700439453, "global_step": 511745, "epoch": 6165} {"train_loss": -27.375913619995117, "global_step": 511746, "epoch": 6165} {"train_loss": -27.273447036743164, "global_step": 511747, "epoch": 6165} {"train_loss": -27.49078941345215, "global_step": 511748, "epoch": 6165} {"train_loss": -27.8986873626709, "global_step": 511749, "epoch": 6165} {"train_loss": -27.5092830657959, "global_step": 511750, "epoch": 6165} {"train_loss": -27.659948348999023, "global_step": 511751, "epoch": 6165} {"train_loss": -27.779224395751953, "global_step": 511752, "epoch": 6165} {"train_loss": -27.821842193603516, "global_step": 511753, "epoch": 6165} {"train_loss": -27.55083656311035, "global_step": 511754, "epoch": 6165} {"train_loss": -27.3404598236084, "global_step": 511755, "epoch": 6165} {"train_loss": -27.585363388061523, "global_step": 511756, "epoch": 6165} {"train_loss": -27.852338790893555, "global_step": 511757, "epoch": 6165} {"train_loss": -27.51059341430664, "global_step": 511758, "epoch": 6165} {"train_loss": -27.52695083618164, "global_step": 511759, "epoch": 6165} {"train_loss": -27.40089988708496, "global_step": 511760, "epoch": 6165} {"train_loss": -27.5899715423584, "global_step": 511761, "epoch": 6165} {"train_loss": -27.87942886352539, "global_step": 511762, "epoch": 6165} {"train_loss": -27.334463119506836, "global_step": 511763, "epoch": 6165} {"train_loss": -27.1863956451416, "global_step": 511764, "epoch": 6165} {"train_loss": -27.364805221557617, "global_step": 511765, "epoch": 6165} {"train_loss": -27.964548110961914, "global_step": 511766, "epoch": 6165} {"train_loss": -27.732934951782227, "global_step": 511767, "epoch": 6165} {"train_loss": -27.5174560546875, "global_step": 511768, "epoch": 6165} {"train_loss": -27.682920455932617, "global_step": 511769, "epoch": 6165} {"train_loss": -27.297210693359375, "global_step": 511770, "epoch": 6165} {"train_loss": -27.398731231689453, "global_step": 511771, "epoch": 6165} {"train_loss": -27.835128784179688, "global_step": 511772, "epoch": 6165} {"train_loss": -27.811115264892578, "global_step": 511773, "epoch": 6165} {"train_loss": -27.679367065429688, "global_step": 511774, "epoch": 6165} {"train_loss": -27.459714889526367, "global_step": 511775, "epoch": 6165} {"train_loss": -27.445281982421875, "global_step": 511776, "epoch": 6165} {"train_loss": -27.279033545988153, "global_step": 511777, "epoch": 6165, "val_loss": 6598199.5} {"train_loss": -26.66253662109375, "global_step": 511778, "epoch": 6166} {"train_loss": -25.10482406616211, "global_step": 511779, "epoch": 6166} {"train_loss": -23.890119552612305, "global_step": 511780, "epoch": 6166} {"train_loss": -26.416513442993164, "global_step": 511781, "epoch": 6166} {"train_loss": -26.020587921142578, "global_step": 511782, "epoch": 6166} {"train_loss": -26.009170532226562, "global_step": 511783, "epoch": 6166} {"train_loss": -25.683053970336914, "global_step": 511784, "epoch": 6166} {"train_loss": -26.4879150390625, "global_step": 511785, "epoch": 6166} {"train_loss": -26.043649673461914, "global_step": 511786, "epoch": 6166} {"train_loss": -26.066884994506836, "global_step": 511787, "epoch": 6166} {"train_loss": -26.348270416259766, "global_step": 511788, "epoch": 6166} {"train_loss": -26.4675350189209, "global_step": 511789, "epoch": 6166} {"train_loss": -26.22450065612793, "global_step": 511790, "epoch": 6166} {"train_loss": -27.256763458251953, "global_step": 511791, "epoch": 6166} {"train_loss": -26.827869415283203, "global_step": 511792, "epoch": 6166} {"train_loss": -26.21590232849121, "global_step": 511793, "epoch": 6166} {"train_loss": -27.033323287963867, "global_step": 511794, "epoch": 6166} {"train_loss": -26.861801147460938, "global_step": 511795, "epoch": 6166} {"train_loss": -26.844131469726562, "global_step": 511796, "epoch": 6166} {"train_loss": -27.0004825592041, "global_step": 511797, "epoch": 6166} {"train_loss": -26.5574893951416, "global_step": 511798, "epoch": 6166} {"train_loss": -26.920398712158203, "global_step": 511799, "epoch": 6166} {"train_loss": -27.150537490844727, "global_step": 511800, "epoch": 6166} {"train_loss": -26.986982345581055, "global_step": 511801, "epoch": 6166} {"train_loss": -27.082983016967773, "global_step": 511802, "epoch": 6166} {"train_loss": -27.206043243408203, "global_step": 511803, "epoch": 6166} {"train_loss": -27.296131134033203, "global_step": 511804, "epoch": 6166} {"train_loss": -27.445035934448242, "global_step": 511805, "epoch": 6166} {"train_loss": -26.960798263549805, "global_step": 511806, "epoch": 6166} {"train_loss": -27.002182006835938, "global_step": 511807, "epoch": 6166} {"train_loss": -27.533361434936523, "global_step": 511808, "epoch": 6166} {"train_loss": -27.094696044921875, "global_step": 511809, "epoch": 6166} {"train_loss": -27.235519409179688, "global_step": 511810, "epoch": 6166} {"train_loss": -27.279895782470703, "global_step": 511811, "epoch": 6166} {"train_loss": -27.09015464782715, "global_step": 511812, "epoch": 6166} {"train_loss": -27.20590591430664, "global_step": 511813, "epoch": 6166} {"train_loss": -27.558347702026367, "global_step": 511814, "epoch": 6166} {"train_loss": -27.41951560974121, "global_step": 511815, "epoch": 6166} {"train_loss": -27.367603302001953, "global_step": 511816, "epoch": 6166} {"train_loss": -27.076765060424805, "global_step": 511817, "epoch": 6166} {"train_loss": -27.3988094329834, "global_step": 511818, "epoch": 6166} {"train_loss": -27.729780197143555, "global_step": 511819, "epoch": 6166} {"train_loss": -27.89776611328125, "global_step": 511820, "epoch": 6166} {"train_loss": -27.514636993408203, "global_step": 511821, "epoch": 6166} {"train_loss": -27.673547744750977, "global_step": 511822, "epoch": 6166} {"train_loss": -27.56659507751465, "global_step": 511823, "epoch": 6166} {"train_loss": -27.378198623657227, "global_step": 511824, "epoch": 6166} {"train_loss": -27.340295791625977, "global_step": 511825, "epoch": 6166} {"train_loss": -27.521520614624023, "global_step": 511826, "epoch": 6166} {"train_loss": -27.894550323486328, "global_step": 511827, "epoch": 6166} {"train_loss": -27.799518585205078, "global_step": 511828, "epoch": 6166} {"train_loss": -27.683155059814453, "global_step": 511829, "epoch": 6166} {"train_loss": -27.899444580078125, "global_step": 511830, "epoch": 6166} {"train_loss": -27.56355857849121, "global_step": 511831, "epoch": 6166} {"train_loss": -27.779027938842773, "global_step": 511832, "epoch": 6166} {"train_loss": -27.737279891967773, "global_step": 511833, "epoch": 6166} {"train_loss": -27.754165649414062, "global_step": 511834, "epoch": 6166} {"train_loss": -27.58296012878418, "global_step": 511835, "epoch": 6166} {"train_loss": -27.797128677368164, "global_step": 511836, "epoch": 6166} {"train_loss": -27.44312858581543, "global_step": 511837, "epoch": 6166} {"train_loss": -27.864765167236328, "global_step": 511838, "epoch": 6166} {"train_loss": -27.525671005249023, "global_step": 511839, "epoch": 6166} {"train_loss": -27.47223472595215, "global_step": 511840, "epoch": 6166} {"train_loss": -28.085041046142578, "global_step": 511841, "epoch": 6166} {"train_loss": -27.48162841796875, "global_step": 511842, "epoch": 6166} {"train_loss": -27.565311431884766, "global_step": 511843, "epoch": 6166} {"train_loss": -27.43269157409668, "global_step": 511844, "epoch": 6166} {"train_loss": -27.689167022705078, "global_step": 511845, "epoch": 6166} {"train_loss": -27.407855987548828, "global_step": 511846, "epoch": 6166} {"train_loss": -27.602018356323242, "global_step": 511847, "epoch": 6166} {"train_loss": -27.60358238220215, "global_step": 511848, "epoch": 6166} {"train_loss": -27.966205596923828, "global_step": 511849, "epoch": 6166} {"train_loss": -27.785221099853516, "global_step": 511850, "epoch": 6166} {"train_loss": -27.570539474487305, "global_step": 511851, "epoch": 6166} {"train_loss": -27.8648624420166, "global_step": 511852, "epoch": 6166} {"train_loss": -27.927148818969727, "global_step": 511853, "epoch": 6166} {"train_loss": -27.682348251342773, "global_step": 511854, "epoch": 6166} {"train_loss": -27.757598876953125, "global_step": 511855, "epoch": 6166} {"train_loss": -27.50933837890625, "global_step": 511856, "epoch": 6166} {"train_loss": -27.1762638092041, "global_step": 511857, "epoch": 6166} {"train_loss": -27.534753799438477, "global_step": 511858, "epoch": 6166} {"train_loss": -27.658798217773438, "global_step": 511859, "epoch": 6166} {"train_loss": -27.183201732405696, "global_step": 511860, "epoch": 6166, "val_loss": 6683594.0} {"train_loss": -26.338272094726562, "global_step": 511861, "epoch": 6167} {"train_loss": -26.52374839782715, "global_step": 511862, "epoch": 6167} {"train_loss": -26.854141235351562, "global_step": 511863, "epoch": 6167} {"train_loss": -26.690473556518555, "global_step": 511864, "epoch": 6167} {"train_loss": -26.059555053710938, "global_step": 511865, "epoch": 6167} {"train_loss": -26.661102294921875, "global_step": 511866, "epoch": 6167} {"train_loss": -26.848663330078125, "global_step": 511867, "epoch": 6167} {"train_loss": -26.822589874267578, "global_step": 511868, "epoch": 6167} {"train_loss": -26.42535400390625, "global_step": 511869, "epoch": 6167} {"train_loss": -26.3765869140625, "global_step": 511870, "epoch": 6167} {"train_loss": -26.610971450805664, "global_step": 511871, "epoch": 6167} {"train_loss": -26.30628776550293, "global_step": 511872, "epoch": 6167} {"train_loss": -26.89896583557129, "global_step": 511873, "epoch": 6167} {"train_loss": -27.1173152923584, "global_step": 511874, "epoch": 6167} {"train_loss": -26.810956954956055, "global_step": 511875, "epoch": 6167} {"train_loss": -26.855199813842773, "global_step": 511876, "epoch": 6167} {"train_loss": -26.75071144104004, "global_step": 511877, "epoch": 6167} {"train_loss": -26.86505699157715, "global_step": 511878, "epoch": 6167} {"train_loss": -26.796955108642578, "global_step": 511879, "epoch": 6167} {"train_loss": -27.138105392456055, "global_step": 511880, "epoch": 6167} {"train_loss": -26.995710372924805, "global_step": 511881, "epoch": 6167} {"train_loss": -26.81245231628418, "global_step": 511882, "epoch": 6167} {"train_loss": -26.86725425720215, "global_step": 511883, "epoch": 6167} {"train_loss": -27.336212158203125, "global_step": 511884, "epoch": 6167} {"train_loss": -27.07550621032715, "global_step": 511885, "epoch": 6167} {"train_loss": -27.460407257080078, "global_step": 511886, "epoch": 6167} {"train_loss": -26.78607749938965, "global_step": 511887, "epoch": 6167} {"train_loss": -27.233015060424805, "global_step": 511888, "epoch": 6167} {"train_loss": -27.210479736328125, "global_step": 511889, "epoch": 6167} {"train_loss": -27.373388290405273, "global_step": 511890, "epoch": 6167} {"train_loss": -27.56570816040039, "global_step": 511891, "epoch": 6167} {"train_loss": -27.33846092224121, "global_step": 511892, "epoch": 6167} {"train_loss": -27.512298583984375, "global_step": 511893, "epoch": 6167} {"train_loss": -27.415109634399414, "global_step": 511894, "epoch": 6167} {"train_loss": -27.683725357055664, "global_step": 511895, "epoch": 6167} {"train_loss": -27.005970001220703, "global_step": 511896, "epoch": 6167} {"train_loss": -27.31926918029785, "global_step": 511897, "epoch": 6167} {"train_loss": -27.444747924804688, "global_step": 511898, "epoch": 6167} {"train_loss": -27.713773727416992, "global_step": 511899, "epoch": 6167} {"train_loss": -27.600263595581055, "global_step": 511900, "epoch": 6167} {"train_loss": -27.553241729736328, "global_step": 511901, "epoch": 6167} {"train_loss": -27.73418617248535, "global_step": 511902, "epoch": 6167} {"train_loss": -27.32977867126465, "global_step": 511903, "epoch": 6167} {"train_loss": -27.189289093017578, "global_step": 511904, "epoch": 6167} {"train_loss": -27.52850914001465, "global_step": 511905, "epoch": 6167} {"train_loss": -27.651525497436523, "global_step": 511906, "epoch": 6167} {"train_loss": -27.640207290649414, "global_step": 511907, "epoch": 6167} {"train_loss": -27.669208526611328, "global_step": 511908, "epoch": 6167} {"train_loss": -27.488927841186523, "global_step": 511909, "epoch": 6167} {"train_loss": -27.646331787109375, "global_step": 511910, "epoch": 6167} {"train_loss": -27.634496688842773, "global_step": 511911, "epoch": 6167} {"train_loss": -27.285741806030273, "global_step": 511912, "epoch": 6167} {"train_loss": -27.591222763061523, "global_step": 511913, "epoch": 6167} {"train_loss": -27.582489013671875, "global_step": 511914, "epoch": 6167} {"train_loss": -27.304677963256836, "global_step": 511915, "epoch": 6167} {"train_loss": -27.2530460357666, "global_step": 511916, "epoch": 6167} {"train_loss": -27.660558700561523, "global_step": 511917, "epoch": 6167} {"train_loss": -27.50737953186035, "global_step": 511918, "epoch": 6167} {"train_loss": -27.155790328979492, "global_step": 511919, "epoch": 6167} {"train_loss": -27.21294593811035, "global_step": 511920, "epoch": 6167} {"train_loss": -27.231658935546875, "global_step": 511921, "epoch": 6167} {"train_loss": -27.554548263549805, "global_step": 511922, "epoch": 6167} {"train_loss": -27.286436080932617, "global_step": 511923, "epoch": 6167} {"train_loss": -27.437345504760742, "global_step": 511924, "epoch": 6167} {"train_loss": -27.60330581665039, "global_step": 511925, "epoch": 6167} {"train_loss": -27.4893856048584, "global_step": 511926, "epoch": 6167} {"train_loss": -27.6276798248291, "global_step": 511927, "epoch": 6167} {"train_loss": -27.64447593688965, "global_step": 511928, "epoch": 6167} {"train_loss": -27.262449264526367, "global_step": 511929, "epoch": 6167} {"train_loss": -27.83308982849121, "global_step": 511930, "epoch": 6167} {"train_loss": -27.591796875, "global_step": 511931, "epoch": 6167} {"train_loss": -27.601144790649414, "global_step": 511932, "epoch": 6167} {"train_loss": -27.640161514282227, "global_step": 511933, "epoch": 6167} {"train_loss": -27.661527633666992, "global_step": 511934, "epoch": 6167} {"train_loss": -27.31318473815918, "global_step": 511935, "epoch": 6167} {"train_loss": -27.90121841430664, "global_step": 511936, "epoch": 6167} {"train_loss": -27.318756103515625, "global_step": 511937, "epoch": 6167} {"train_loss": -26.47047233581543, "global_step": 511938, "epoch": 6167} {"train_loss": -25.240705490112305, "global_step": 511939, "epoch": 6167} {"train_loss": -23.123950958251953, "global_step": 511940, "epoch": 6167} {"train_loss": -24.69338035583496, "global_step": 511941, "epoch": 6167} {"train_loss": -26.419235229492188, "global_step": 511942, "epoch": 6167} {"train_loss": -27.127190739275463, "global_step": 511943, "epoch": 6167, "val_loss": 6692986.0} {"train_loss": -22.96393585205078, "global_step": 511944, "epoch": 6168} {"train_loss": -26.452350616455078, "global_step": 511945, "epoch": 6168} {"train_loss": -23.922292709350586, "global_step": 511946, "epoch": 6168} {"train_loss": -25.666812896728516, "global_step": 511947, "epoch": 6168} {"train_loss": -25.648944854736328, "global_step": 511948, "epoch": 6168} {"train_loss": -25.180953979492188, "global_step": 511949, "epoch": 6168} {"train_loss": -26.524993896484375, "global_step": 511950, "epoch": 6168} {"train_loss": -25.232318878173828, "global_step": 511951, "epoch": 6168} {"train_loss": -25.98382568359375, "global_step": 511952, "epoch": 6168} {"train_loss": -26.317169189453125, "global_step": 511953, "epoch": 6168} {"train_loss": -26.097888946533203, "global_step": 511954, "epoch": 6168} {"train_loss": -25.72842788696289, "global_step": 511955, "epoch": 6168} {"train_loss": -25.98642921447754, "global_step": 511956, "epoch": 6168} {"train_loss": -26.13726234436035, "global_step": 511957, "epoch": 6168} {"train_loss": -26.101613998413086, "global_step": 511958, "epoch": 6168} {"train_loss": -25.691232681274414, "global_step": 511959, "epoch": 6168} {"train_loss": -26.282886505126953, "global_step": 511960, "epoch": 6168} {"train_loss": -26.20830726623535, "global_step": 511961, "epoch": 6168} {"train_loss": -25.877954483032227, "global_step": 511962, "epoch": 6168} {"train_loss": -26.404531478881836, "global_step": 511963, "epoch": 6168} {"train_loss": -26.382532119750977, "global_step": 511964, "epoch": 6168} {"train_loss": -26.441314697265625, "global_step": 511965, "epoch": 6168} {"train_loss": -26.39029312133789, "global_step": 511966, "epoch": 6168} {"train_loss": -26.54230308532715, "global_step": 511967, "epoch": 6168} {"train_loss": -26.117883682250977, "global_step": 511968, "epoch": 6168} {"train_loss": -26.325653076171875, "global_step": 511969, "epoch": 6168} {"train_loss": -26.41156005859375, "global_step": 511970, "epoch": 6168} {"train_loss": -26.75238037109375, "global_step": 511971, "epoch": 6168} {"train_loss": -26.5960750579834, "global_step": 511972, "epoch": 6168} {"train_loss": -26.903034210205078, "global_step": 511973, "epoch": 6168} {"train_loss": -27.405349731445312, "global_step": 511974, "epoch": 6168} {"train_loss": -27.186695098876953, "global_step": 511975, "epoch": 6168} {"train_loss": -26.87039566040039, "global_step": 511976, "epoch": 6168} {"train_loss": -26.969038009643555, "global_step": 511977, "epoch": 6168} {"train_loss": -26.76576042175293, "global_step": 511978, "epoch": 6168} {"train_loss": -26.653797149658203, "global_step": 511979, "epoch": 6168} {"train_loss": -26.867765426635742, "global_step": 511980, "epoch": 6168} {"train_loss": -27.156721115112305, "global_step": 511981, "epoch": 6168} {"train_loss": -27.15223503112793, "global_step": 511982, "epoch": 6168} {"train_loss": -27.014013290405273, "global_step": 511983, "epoch": 6168} {"train_loss": -27.034931182861328, "global_step": 511984, "epoch": 6168} {"train_loss": -27.19051170349121, "global_step": 511985, "epoch": 6168} {"train_loss": -27.341217041015625, "global_step": 511986, "epoch": 6168} {"train_loss": -26.729516983032227, "global_step": 511987, "epoch": 6168} {"train_loss": -27.2185001373291, "global_step": 511988, "epoch": 6168} {"train_loss": -27.23066520690918, "global_step": 511989, "epoch": 6168} {"train_loss": -27.2011775970459, "global_step": 511990, "epoch": 6168} {"train_loss": -27.310260772705078, "global_step": 511991, "epoch": 6168} {"train_loss": -27.557966232299805, "global_step": 511992, "epoch": 6168} {"train_loss": -27.537342071533203, "global_step": 511993, "epoch": 6168} {"train_loss": -27.27605628967285, "global_step": 511994, "epoch": 6168} {"train_loss": -27.84771728515625, "global_step": 511995, "epoch": 6168} {"train_loss": -27.53834342956543, "global_step": 511996, "epoch": 6168} {"train_loss": -27.551177978515625, "global_step": 511997, "epoch": 6168} {"train_loss": -27.780960083007812, "global_step": 511998, "epoch": 6168} {"train_loss": -27.42218017578125, "global_step": 511999, "epoch": 6168} {"train_loss": -27.512191772460938, "global_step": 512000, "epoch": 6168} {"train_loss": -27.555761337280273, "global_step": 512001, "epoch": 6168} {"train_loss": -27.72258949279785, "global_step": 512002, "epoch": 6168} {"train_loss": -27.47928810119629, "global_step": 512003, "epoch": 6168} {"train_loss": -27.697906494140625, "global_step": 512004, "epoch": 6168} {"train_loss": -27.53643798828125, "global_step": 512005, "epoch": 6168} {"train_loss": -27.659833908081055, "global_step": 512006, "epoch": 6168} {"train_loss": -27.4575252532959, "global_step": 512007, "epoch": 6168} {"train_loss": -27.296600341796875, "global_step": 512008, "epoch": 6168} {"train_loss": -27.698688507080078, "global_step": 512009, "epoch": 6168} {"train_loss": -27.53384780883789, "global_step": 512010, "epoch": 6168} {"train_loss": -28.040878295898438, "global_step": 512011, "epoch": 6168} {"train_loss": -27.279010772705078, "global_step": 512012, "epoch": 6168} {"train_loss": -27.648290634155273, "global_step": 512013, "epoch": 6168} {"train_loss": -27.727497100830078, "global_step": 512014, "epoch": 6168} {"train_loss": -27.646839141845703, "global_step": 512015, "epoch": 6168} {"train_loss": -27.393529891967773, "global_step": 512016, "epoch": 6168} {"train_loss": -27.22565269470215, "global_step": 512017, "epoch": 6168} {"train_loss": -27.384998321533203, "global_step": 512018, "epoch": 6168} {"train_loss": -27.70489501953125, "global_step": 512019, "epoch": 6168} {"train_loss": -27.539499282836914, "global_step": 512020, "epoch": 6168} {"train_loss": -27.53853416442871, "global_step": 512021, "epoch": 6168} {"train_loss": -27.588134765625, "global_step": 512022, "epoch": 6168} {"train_loss": -27.7761173248291, "global_step": 512023, "epoch": 6168} {"train_loss": -27.417739868164062, "global_step": 512024, "epoch": 6168} {"train_loss": -27.79498291015625, "global_step": 512025, "epoch": 6168} {"train_loss": -26.886745360960443, "global_step": 512026, "epoch": 6168, "val_loss": 6478747.0} {"train_loss": -27.057199478149414, "global_step": 512027, "epoch": 6169} {"train_loss": -26.078998565673828, "global_step": 512028, "epoch": 6169} {"train_loss": -26.6737117767334, "global_step": 512029, "epoch": 6169} {"train_loss": -26.655942916870117, "global_step": 512030, "epoch": 6169} {"train_loss": -26.30189323425293, "global_step": 512031, "epoch": 6169} {"train_loss": -27.08622169494629, "global_step": 512032, "epoch": 6169} {"train_loss": -26.24173927307129, "global_step": 512033, "epoch": 6169} {"train_loss": -26.751739501953125, "global_step": 512034, "epoch": 6169} {"train_loss": -26.5967960357666, "global_step": 512035, "epoch": 6169} {"train_loss": -27.34089469909668, "global_step": 512036, "epoch": 6169} {"train_loss": -26.634592056274414, "global_step": 512037, "epoch": 6169} {"train_loss": -27.111066818237305, "global_step": 512038, "epoch": 6169} {"train_loss": -27.18291664123535, "global_step": 512039, "epoch": 6169} {"train_loss": -26.63602638244629, "global_step": 512040, "epoch": 6169} {"train_loss": -26.89533042907715, "global_step": 512041, "epoch": 6169} {"train_loss": -26.974180221557617, "global_step": 512042, "epoch": 6169} {"train_loss": -27.121862411499023, "global_step": 512043, "epoch": 6169} {"train_loss": -26.909116744995117, "global_step": 512044, "epoch": 6169} {"train_loss": -27.334440231323242, "global_step": 512045, "epoch": 6169} {"train_loss": -27.13429069519043, "global_step": 512046, "epoch": 6169} {"train_loss": -26.99281120300293, "global_step": 512047, "epoch": 6169} {"train_loss": -27.405750274658203, "global_step": 512048, "epoch": 6169} {"train_loss": -27.61713981628418, "global_step": 512049, "epoch": 6169} {"train_loss": -27.499242782592773, "global_step": 512050, "epoch": 6169} {"train_loss": -27.416101455688477, "global_step": 512051, "epoch": 6169} {"train_loss": -27.473554611206055, "global_step": 512052, "epoch": 6169} {"train_loss": -27.708234786987305, "global_step": 512053, "epoch": 6169} {"train_loss": -27.766752243041992, "global_step": 512054, "epoch": 6169} {"train_loss": -27.35986328125, "global_step": 512055, "epoch": 6169} {"train_loss": -27.582141876220703, "global_step": 512056, "epoch": 6169} {"train_loss": -27.798490524291992, "global_step": 512057, "epoch": 6169} {"train_loss": -27.507944107055664, "global_step": 512058, "epoch": 6169} {"train_loss": -27.38779067993164, "global_step": 512059, "epoch": 6169} {"train_loss": -27.3162899017334, "global_step": 512060, "epoch": 6169} {"train_loss": -27.584339141845703, "global_step": 512061, "epoch": 6169} {"train_loss": -28.07087516784668, "global_step": 512062, "epoch": 6169} {"train_loss": -27.662616729736328, "global_step": 512063, "epoch": 6169} {"train_loss": -27.877613067626953, "global_step": 512064, "epoch": 6169} {"train_loss": -27.616199493408203, "global_step": 512065, "epoch": 6169} {"train_loss": -27.90460777282715, "global_step": 512066, "epoch": 6169} {"train_loss": -27.2708683013916, "global_step": 512067, "epoch": 6169} {"train_loss": -27.7362060546875, "global_step": 512068, "epoch": 6169} {"train_loss": -27.42396354675293, "global_step": 512069, "epoch": 6169} {"train_loss": -27.728595733642578, "global_step": 512070, "epoch": 6169} {"train_loss": -27.304920196533203, "global_step": 512071, "epoch": 6169} {"train_loss": -27.66871452331543, "global_step": 512072, "epoch": 6169} {"train_loss": -27.569120407104492, "global_step": 512073, "epoch": 6169} {"train_loss": -27.887907028198242, "global_step": 512074, "epoch": 6169} {"train_loss": -27.50410270690918, "global_step": 512075, "epoch": 6169} {"train_loss": -27.779932022094727, "global_step": 512076, "epoch": 6169} {"train_loss": -27.76611328125, "global_step": 512077, "epoch": 6169} {"train_loss": -27.885284423828125, "global_step": 512078, "epoch": 6169} {"train_loss": -27.4661808013916, "global_step": 512079, "epoch": 6169} {"train_loss": -27.728546142578125, "global_step": 512080, "epoch": 6169} {"train_loss": -27.81365966796875, "global_step": 512081, "epoch": 6169} {"train_loss": -27.9786434173584, "global_step": 512082, "epoch": 6169} {"train_loss": -27.32539176940918, "global_step": 512083, "epoch": 6169} {"train_loss": -27.879608154296875, "global_step": 512084, "epoch": 6169} {"train_loss": -27.562597274780273, "global_step": 512085, "epoch": 6169} {"train_loss": -27.782257080078125, "global_step": 512086, "epoch": 6169} {"train_loss": -27.37519645690918, "global_step": 512087, "epoch": 6169} {"train_loss": -27.514942169189453, "global_step": 512088, "epoch": 6169} {"train_loss": -27.175729751586914, "global_step": 512089, "epoch": 6169} {"train_loss": -27.002119064331055, "global_step": 512090, "epoch": 6169} {"train_loss": -27.88007164001465, "global_step": 512091, "epoch": 6169} {"train_loss": -27.205753326416016, "global_step": 512092, "epoch": 6169} {"train_loss": -27.332006454467773, "global_step": 512093, "epoch": 6169} {"train_loss": -27.243789672851562, "global_step": 512094, "epoch": 6169} {"train_loss": -27.76466178894043, "global_step": 512095, "epoch": 6169} {"train_loss": -27.226465225219727, "global_step": 512096, "epoch": 6169} {"train_loss": -27.097909927368164, "global_step": 512097, "epoch": 6169} {"train_loss": -27.496057510375977, "global_step": 512098, "epoch": 6169} {"train_loss": -27.278539657592773, "global_step": 512099, "epoch": 6169} {"train_loss": -27.314746856689453, "global_step": 512100, "epoch": 6169} {"train_loss": -27.741846084594727, "global_step": 512101, "epoch": 6169} {"train_loss": -27.50007438659668, "global_step": 512102, "epoch": 6169} {"train_loss": -27.089008331298828, "global_step": 512103, "epoch": 6169} {"train_loss": -27.380903244018555, "global_step": 512104, "epoch": 6169} {"train_loss": -27.634946823120117, "global_step": 512105, "epoch": 6169} {"train_loss": -27.562824249267578, "global_step": 512106, "epoch": 6169} {"train_loss": -27.36842918395996, "global_step": 512107, "epoch": 6169} {"train_loss": -27.345413208007812, "global_step": 512108, "epoch": 6169} {"train_loss": -27.37570916600974, "global_step": 512109, "epoch": 6169, "val_loss": 6607903.0} {"train_loss": -27.004343032836914, "global_step": 512110, "epoch": 6170} {"train_loss": -27.058984756469727, "global_step": 512111, "epoch": 6170} {"train_loss": -26.774097442626953, "global_step": 512112, "epoch": 6170} {"train_loss": -27.19306755065918, "global_step": 512113, "epoch": 6170} {"train_loss": -27.212696075439453, "global_step": 512114, "epoch": 6170} {"train_loss": -26.64661979675293, "global_step": 512115, "epoch": 6170} {"train_loss": -27.00398826599121, "global_step": 512116, "epoch": 6170} {"train_loss": -27.3461856842041, "global_step": 512117, "epoch": 6170} {"train_loss": -26.9388370513916, "global_step": 512118, "epoch": 6170} {"train_loss": -27.640045166015625, "global_step": 512119, "epoch": 6170} {"train_loss": -27.365955352783203, "global_step": 512120, "epoch": 6170} {"train_loss": -27.372425079345703, "global_step": 512121, "epoch": 6170} {"train_loss": -27.367162704467773, "global_step": 512122, "epoch": 6170} {"train_loss": -27.323383331298828, "global_step": 512123, "epoch": 6170} {"train_loss": -27.527606964111328, "global_step": 512124, "epoch": 6170} {"train_loss": -27.64495277404785, "global_step": 512125, "epoch": 6170} {"train_loss": -27.38691520690918, "global_step": 512126, "epoch": 6170} {"train_loss": -27.677011489868164, "global_step": 512127, "epoch": 6170} {"train_loss": -27.33249855041504, "global_step": 512128, "epoch": 6170} {"train_loss": -27.685094833374023, "global_step": 512129, "epoch": 6170} {"train_loss": -27.77252769470215, "global_step": 512130, "epoch": 6170} {"train_loss": -27.686614990234375, "global_step": 512131, "epoch": 6170} {"train_loss": -27.476171493530273, "global_step": 512132, "epoch": 6170} {"train_loss": -27.35770034790039, "global_step": 512133, "epoch": 6170} {"train_loss": -27.40436363220215, "global_step": 512134, "epoch": 6170} {"train_loss": -27.1976318359375, "global_step": 512135, "epoch": 6170} {"train_loss": -27.469287872314453, "global_step": 512136, "epoch": 6170} {"train_loss": -27.6016788482666, "global_step": 512137, "epoch": 6170} {"train_loss": -27.46917152404785, "global_step": 512138, "epoch": 6170} {"train_loss": -27.347436904907227, "global_step": 512139, "epoch": 6170} {"train_loss": -27.713285446166992, "global_step": 512140, "epoch": 6170} {"train_loss": -27.39991569519043, "global_step": 512141, "epoch": 6170} {"train_loss": -27.705642700195312, "global_step": 512142, "epoch": 6170} {"train_loss": -27.604597091674805, "global_step": 512143, "epoch": 6170} {"train_loss": -27.47124671936035, "global_step": 512144, "epoch": 6170} {"train_loss": -27.600549697875977, "global_step": 512145, "epoch": 6170} {"train_loss": -27.559864044189453, "global_step": 512146, "epoch": 6170} {"train_loss": -27.339385986328125, "global_step": 512147, "epoch": 6170} {"train_loss": -27.56201171875, "global_step": 512148, "epoch": 6170} {"train_loss": -27.302581787109375, "global_step": 512149, "epoch": 6170} {"train_loss": -26.9577579498291, "global_step": 512150, "epoch": 6170} {"train_loss": -27.42124366760254, "global_step": 512151, "epoch": 6170} {"train_loss": -27.65192985534668, "global_step": 512152, "epoch": 6170} {"train_loss": -27.312915802001953, "global_step": 512153, "epoch": 6170} {"train_loss": -27.735599517822266, "global_step": 512154, "epoch": 6170} {"train_loss": -27.258960723876953, "global_step": 512155, "epoch": 6170} {"train_loss": -27.102869033813477, "global_step": 512156, "epoch": 6170} {"train_loss": -27.839811325073242, "global_step": 512157, "epoch": 6170} {"train_loss": -27.666034698486328, "global_step": 512158, "epoch": 6170} {"train_loss": -27.456405639648438, "global_step": 512159, "epoch": 6170} {"train_loss": -27.284387588500977, "global_step": 512160, "epoch": 6170} {"train_loss": -27.892786026000977, "global_step": 512161, "epoch": 6170} {"train_loss": -27.804758071899414, "global_step": 512162, "epoch": 6170} {"train_loss": -27.604581832885742, "global_step": 512163, "epoch": 6170} {"train_loss": -27.81357765197754, "global_step": 512164, "epoch": 6170} {"train_loss": -27.892736434936523, "global_step": 512165, "epoch": 6170} {"train_loss": -27.492218017578125, "global_step": 512166, "epoch": 6170} {"train_loss": -27.48579216003418, "global_step": 512167, "epoch": 6170} {"train_loss": -27.59718894958496, "global_step": 512168, "epoch": 6170} {"train_loss": -27.720579147338867, "global_step": 512169, "epoch": 6170} {"train_loss": -27.8090763092041, "global_step": 512170, "epoch": 6170} {"train_loss": -27.710840225219727, "global_step": 512171, "epoch": 6170} {"train_loss": -27.621814727783203, "global_step": 512172, "epoch": 6170} {"train_loss": -27.792959213256836, "global_step": 512173, "epoch": 6170} {"train_loss": -28.157129287719727, "global_step": 512174, "epoch": 6170} {"train_loss": -27.6572208404541, "global_step": 512175, "epoch": 6170} {"train_loss": -27.687543869018555, "global_step": 512176, "epoch": 6170} {"train_loss": -27.749601364135742, "global_step": 512177, "epoch": 6170} {"train_loss": -27.607995986938477, "global_step": 512178, "epoch": 6170} {"train_loss": -27.73286247253418, "global_step": 512179, "epoch": 6170} {"train_loss": -27.344633102416992, "global_step": 512180, "epoch": 6170} {"train_loss": -27.662378311157227, "global_step": 512181, "epoch": 6170} {"train_loss": -27.4210262298584, "global_step": 512182, "epoch": 6170} {"train_loss": -27.72772789001465, "global_step": 512183, "epoch": 6170} {"train_loss": -27.5123348236084, "global_step": 512184, "epoch": 6170} {"train_loss": -27.74776268005371, "global_step": 512185, "epoch": 6170} {"train_loss": -27.616260528564453, "global_step": 512186, "epoch": 6170} {"train_loss": -27.545873641967773, "global_step": 512187, "epoch": 6170} {"train_loss": -27.5747013092041, "global_step": 512188, "epoch": 6170} {"train_loss": -27.73554801940918, "global_step": 512189, "epoch": 6170} {"train_loss": -27.53742790222168, "global_step": 512190, "epoch": 6170} {"train_loss": -27.486764907836914, "global_step": 512191, "epoch": 6170} {"train_loss": -27.486384770956384, "global_step": 512192, "epoch": 6170, "val_loss": 6617257.0} {"train_loss": -22.486713409423828, "global_step": 512193, "epoch": 6171} {"train_loss": -21.955066680908203, "global_step": 512194, "epoch": 6171} {"train_loss": -25.718481063842773, "global_step": 512195, "epoch": 6171} {"train_loss": -24.9162654876709, "global_step": 512196, "epoch": 6171} {"train_loss": -23.879581451416016, "global_step": 512197, "epoch": 6171} {"train_loss": -24.658973693847656, "global_step": 512198, "epoch": 6171} {"train_loss": -24.639678955078125, "global_step": 512199, "epoch": 6171} {"train_loss": -25.16629409790039, "global_step": 512200, "epoch": 6171} {"train_loss": -25.435144424438477, "global_step": 512201, "epoch": 6171} {"train_loss": -24.847469329833984, "global_step": 512202, "epoch": 6171} {"train_loss": -25.70367431640625, "global_step": 512203, "epoch": 6171} {"train_loss": -25.414396286010742, "global_step": 512204, "epoch": 6171} {"train_loss": -25.776525497436523, "global_step": 512205, "epoch": 6171} {"train_loss": -25.619367599487305, "global_step": 512206, "epoch": 6171} {"train_loss": -25.757156372070312, "global_step": 512207, "epoch": 6171} {"train_loss": -25.727127075195312, "global_step": 512208, "epoch": 6171} {"train_loss": -25.8853759765625, "global_step": 512209, "epoch": 6171} {"train_loss": -25.65754508972168, "global_step": 512210, "epoch": 6171} {"train_loss": -26.240339279174805, "global_step": 512211, "epoch": 6171} {"train_loss": -25.912525177001953, "global_step": 512212, "epoch": 6171} {"train_loss": -26.381067276000977, "global_step": 512213, "epoch": 6171} {"train_loss": -26.018869400024414, "global_step": 512214, "epoch": 6171} {"train_loss": -26.499652862548828, "global_step": 512215, "epoch": 6171} {"train_loss": -26.277118682861328, "global_step": 512216, "epoch": 6171} {"train_loss": -26.21333122253418, "global_step": 512217, "epoch": 6171} {"train_loss": -26.538053512573242, "global_step": 512218, "epoch": 6171} {"train_loss": -26.502307891845703, "global_step": 512219, "epoch": 6171} {"train_loss": -26.66754150390625, "global_step": 512220, "epoch": 6171} {"train_loss": -26.50510597229004, "global_step": 512221, "epoch": 6171} {"train_loss": -26.82490348815918, "global_step": 512222, "epoch": 6171} {"train_loss": -26.84706687927246, "global_step": 512223, "epoch": 6171} {"train_loss": -26.61309814453125, "global_step": 512224, "epoch": 6171} {"train_loss": -26.7850341796875, "global_step": 512225, "epoch": 6171} {"train_loss": -26.471832275390625, "global_step": 512226, "epoch": 6171} {"train_loss": -26.7236385345459, "global_step": 512227, "epoch": 6171} {"train_loss": -26.575214385986328, "global_step": 512228, "epoch": 6171} {"train_loss": -27.116138458251953, "global_step": 512229, "epoch": 6171} {"train_loss": -27.17621421813965, "global_step": 512230, "epoch": 6171} {"train_loss": -27.067703247070312, "global_step": 512231, "epoch": 6171} {"train_loss": -27.008275985717773, "global_step": 512232, "epoch": 6171} {"train_loss": -26.797760009765625, "global_step": 512233, "epoch": 6171} {"train_loss": -27.50371742248535, "global_step": 512234, "epoch": 6171} {"train_loss": -27.32405662536621, "global_step": 512235, "epoch": 6171} {"train_loss": -27.275543212890625, "global_step": 512236, "epoch": 6171} {"train_loss": -27.489044189453125, "global_step": 512237, "epoch": 6171} {"train_loss": -27.355764389038086, "global_step": 512238, "epoch": 6171} {"train_loss": -27.21283531188965, "global_step": 512239, "epoch": 6171} {"train_loss": -26.81989860534668, "global_step": 512240, "epoch": 6171} {"train_loss": -27.35972023010254, "global_step": 512241, "epoch": 6171} {"train_loss": -27.52935218811035, "global_step": 512242, "epoch": 6171} {"train_loss": -27.3599796295166, "global_step": 512243, "epoch": 6171} {"train_loss": -27.772886276245117, "global_step": 512244, "epoch": 6171} {"train_loss": -27.030920028686523, "global_step": 512245, "epoch": 6171} {"train_loss": -27.6831111907959, "global_step": 512246, "epoch": 6171} {"train_loss": -27.06912612915039, "global_step": 512247, "epoch": 6171} {"train_loss": -27.26624870300293, "global_step": 512248, "epoch": 6171} {"train_loss": -27.2508487701416, "global_step": 512249, "epoch": 6171} {"train_loss": -27.529321670532227, "global_step": 512250, "epoch": 6171} {"train_loss": -27.790945053100586, "global_step": 512251, "epoch": 6171} {"train_loss": -27.523046493530273, "global_step": 512252, "epoch": 6171} {"train_loss": -27.516260147094727, "global_step": 512253, "epoch": 6171} {"train_loss": -27.45918083190918, "global_step": 512254, "epoch": 6171} {"train_loss": -27.635709762573242, "global_step": 512255, "epoch": 6171} {"train_loss": -27.394872665405273, "global_step": 512256, "epoch": 6171} {"train_loss": -27.275625228881836, "global_step": 512257, "epoch": 6171} {"train_loss": -27.626012802124023, "global_step": 512258, "epoch": 6171} {"train_loss": -27.995758056640625, "global_step": 512259, "epoch": 6171} {"train_loss": -27.579166412353516, "global_step": 512260, "epoch": 6171} {"train_loss": -27.442346572875977, "global_step": 512261, "epoch": 6171} {"train_loss": -27.449676513671875, "global_step": 512262, "epoch": 6171} {"train_loss": -27.552453994750977, "global_step": 512263, "epoch": 6171} {"train_loss": -28.001554489135742, "global_step": 512264, "epoch": 6171} {"train_loss": -27.1928653717041, "global_step": 512265, "epoch": 6171} {"train_loss": -27.511077880859375, "global_step": 512266, "epoch": 6171} {"train_loss": -27.5983943939209, "global_step": 512267, "epoch": 6171} {"train_loss": -27.020002365112305, "global_step": 512268, "epoch": 6171} {"train_loss": -27.424482345581055, "global_step": 512269, "epoch": 6171} {"train_loss": -27.69398307800293, "global_step": 512270, "epoch": 6171} {"train_loss": -27.50779151916504, "global_step": 512271, "epoch": 6171} {"train_loss": -27.772077560424805, "global_step": 512272, "epoch": 6171} {"train_loss": -27.660175323486328, "global_step": 512273, "epoch": 6171} {"train_loss": -27.71912956237793, "global_step": 512274, "epoch": 6171} {"train_loss": -26.68475070631648, "global_step": 512275, "epoch": 6171, "val_loss": 6738093.0} {"train_loss": -27.272489547729492, "global_step": 512276, "epoch": 6172} {"train_loss": -27.524473190307617, "global_step": 512277, "epoch": 6172} {"train_loss": -27.20706558227539, "global_step": 512278, "epoch": 6172} {"train_loss": -27.089330673217773, "global_step": 512279, "epoch": 6172} {"train_loss": -26.853540420532227, "global_step": 512280, "epoch": 6172} {"train_loss": -26.952268600463867, "global_step": 512281, "epoch": 6172} {"train_loss": -27.280527114868164, "global_step": 512282, "epoch": 6172} {"train_loss": -27.257186889648438, "global_step": 512283, "epoch": 6172} {"train_loss": -26.39141845703125, "global_step": 512284, "epoch": 6172} {"train_loss": -27.059850692749023, "global_step": 512285, "epoch": 6172} {"train_loss": -27.021337509155273, "global_step": 512286, "epoch": 6172} {"train_loss": -27.11117935180664, "global_step": 512287, "epoch": 6172} {"train_loss": -27.271039962768555, "global_step": 512288, "epoch": 6172} {"train_loss": -27.135095596313477, "global_step": 512289, "epoch": 6172} {"train_loss": -27.0565185546875, "global_step": 512290, "epoch": 6172} {"train_loss": -27.37213134765625, "global_step": 512291, "epoch": 6172} {"train_loss": -27.3599853515625, "global_step": 512292, "epoch": 6172} {"train_loss": -27.127120971679688, "global_step": 512293, "epoch": 6172} {"train_loss": -27.344572067260742, "global_step": 512294, "epoch": 6172} {"train_loss": -27.48040199279785, "global_step": 512295, "epoch": 6172} {"train_loss": -27.556730270385742, "global_step": 512296, "epoch": 6172} {"train_loss": -27.19460105895996, "global_step": 512297, "epoch": 6172} {"train_loss": -27.738758087158203, "global_step": 512298, "epoch": 6172} {"train_loss": -27.394027709960938, "global_step": 512299, "epoch": 6172} {"train_loss": -27.26482582092285, "global_step": 512300, "epoch": 6172} {"train_loss": -27.340421676635742, "global_step": 512301, "epoch": 6172} {"train_loss": -27.605066299438477, "global_step": 512302, "epoch": 6172} {"train_loss": -27.66103172302246, "global_step": 512303, "epoch": 6172} {"train_loss": -27.548419952392578, "global_step": 512304, "epoch": 6172} {"train_loss": -27.369726181030273, "global_step": 512305, "epoch": 6172} {"train_loss": -27.181533813476562, "global_step": 512306, "epoch": 6172} {"train_loss": -27.543842315673828, "global_step": 512307, "epoch": 6172} {"train_loss": -27.15216636657715, "global_step": 512308, "epoch": 6172} {"train_loss": -27.87030029296875, "global_step": 512309, "epoch": 6172} {"train_loss": -27.731115341186523, "global_step": 512310, "epoch": 6172} {"train_loss": -27.641721725463867, "global_step": 512311, "epoch": 6172} {"train_loss": -27.532255172729492, "global_step": 512312, "epoch": 6172} {"train_loss": -27.893774032592773, "global_step": 512313, "epoch": 6172} {"train_loss": -27.55405616760254, "global_step": 512314, "epoch": 6172} {"train_loss": -27.64239501953125, "global_step": 512315, "epoch": 6172} {"train_loss": -27.78326988220215, "global_step": 512316, "epoch": 6172} {"train_loss": -27.78626823425293, "global_step": 512317, "epoch": 6172} {"train_loss": -27.513015747070312, "global_step": 512318, "epoch": 6172} {"train_loss": -27.553457260131836, "global_step": 512319, "epoch": 6172} {"train_loss": -27.262561798095703, "global_step": 512320, "epoch": 6172} {"train_loss": -27.47321128845215, "global_step": 512321, "epoch": 6172} {"train_loss": -27.358076095581055, "global_step": 512322, "epoch": 6172} {"train_loss": -27.892698287963867, "global_step": 512323, "epoch": 6172} {"train_loss": -27.821836471557617, "global_step": 512324, "epoch": 6172} {"train_loss": -27.877180099487305, "global_step": 512325, "epoch": 6172} {"train_loss": -27.732990264892578, "global_step": 512326, "epoch": 6172} {"train_loss": -27.492528915405273, "global_step": 512327, "epoch": 6172} {"train_loss": -27.6317081451416, "global_step": 512328, "epoch": 6172} {"train_loss": -27.510435104370117, "global_step": 512329, "epoch": 6172} {"train_loss": -27.979602813720703, "global_step": 512330, "epoch": 6172} {"train_loss": -27.714401245117188, "global_step": 512331, "epoch": 6172} {"train_loss": -27.569580078125, "global_step": 512332, "epoch": 6172} {"train_loss": -27.386981964111328, "global_step": 512333, "epoch": 6172} {"train_loss": -27.442447662353516, "global_step": 512334, "epoch": 6172} {"train_loss": -27.28130531311035, "global_step": 512335, "epoch": 6172} {"train_loss": -26.788969039916992, "global_step": 512336, "epoch": 6172} {"train_loss": -27.179279327392578, "global_step": 512337, "epoch": 6172} {"train_loss": -27.61171531677246, "global_step": 512338, "epoch": 6172} {"train_loss": -27.334436416625977, "global_step": 512339, "epoch": 6172} {"train_loss": -26.93389320373535, "global_step": 512340, "epoch": 6172} {"train_loss": -27.124420166015625, "global_step": 512341, "epoch": 6172} {"train_loss": -27.365619659423828, "global_step": 512342, "epoch": 6172} {"train_loss": -27.43359375, "global_step": 512343, "epoch": 6172} {"train_loss": -27.228544235229492, "global_step": 512344, "epoch": 6172} {"train_loss": -27.616010665893555, "global_step": 512345, "epoch": 6172} {"train_loss": -27.23386001586914, "global_step": 512346, "epoch": 6172} {"train_loss": -27.222797393798828, "global_step": 512347, "epoch": 6172} {"train_loss": -27.725629806518555, "global_step": 512348, "epoch": 6172} {"train_loss": -27.371246337890625, "global_step": 512349, "epoch": 6172} {"train_loss": -27.67628288269043, "global_step": 512350, "epoch": 6172} {"train_loss": -27.29917335510254, "global_step": 512351, "epoch": 6172} {"train_loss": -27.126928329467773, "global_step": 512352, "epoch": 6172} {"train_loss": -26.950963973999023, "global_step": 512353, "epoch": 6172} {"train_loss": -27.131301879882812, "global_step": 512354, "epoch": 6172} {"train_loss": -27.608762741088867, "global_step": 512355, "epoch": 6172} {"train_loss": -27.751806259155273, "global_step": 512356, "epoch": 6172} {"train_loss": -27.073450088500977, "global_step": 512357, "epoch": 6172} {"train_loss": -27.41278662164527, "global_step": 512358, "epoch": 6172, "val_loss": 6741571.0} {"train_loss": -25.82820701599121, "global_step": 512359, "epoch": 6173} {"train_loss": -23.231510162353516, "global_step": 512360, "epoch": 6173} {"train_loss": -23.62422752380371, "global_step": 512361, "epoch": 6173} {"train_loss": -26.3301944732666, "global_step": 512362, "epoch": 6173} {"train_loss": -26.122968673706055, "global_step": 512363, "epoch": 6173} {"train_loss": -25.577224731445312, "global_step": 512364, "epoch": 6173} {"train_loss": -26.068195343017578, "global_step": 512365, "epoch": 6173} {"train_loss": -25.816513061523438, "global_step": 512366, "epoch": 6173} {"train_loss": -26.288471221923828, "global_step": 512367, "epoch": 6173} {"train_loss": -26.347198486328125, "global_step": 512368, "epoch": 6173} {"train_loss": -26.868270874023438, "global_step": 512369, "epoch": 6173} {"train_loss": -26.813068389892578, "global_step": 512370, "epoch": 6173} {"train_loss": -26.869937896728516, "global_step": 512371, "epoch": 6173} {"train_loss": -26.464282989501953, "global_step": 512372, "epoch": 6173} {"train_loss": -26.742238998413086, "global_step": 512373, "epoch": 6173} {"train_loss": -26.363239288330078, "global_step": 512374, "epoch": 6173} {"train_loss": -26.8144588470459, "global_step": 512375, "epoch": 6173} {"train_loss": -27.049951553344727, "global_step": 512376, "epoch": 6173} {"train_loss": -26.994482040405273, "global_step": 512377, "epoch": 6173} {"train_loss": -26.674665451049805, "global_step": 512378, "epoch": 6173} {"train_loss": -27.017526626586914, "global_step": 512379, "epoch": 6173} {"train_loss": -27.087909698486328, "global_step": 512380, "epoch": 6173} {"train_loss": -26.836902618408203, "global_step": 512381, "epoch": 6173} {"train_loss": -27.218597412109375, "global_step": 512382, "epoch": 6173} {"train_loss": -27.015960693359375, "global_step": 512383, "epoch": 6173} {"train_loss": -27.424030303955078, "global_step": 512384, "epoch": 6173} {"train_loss": -27.239648818969727, "global_step": 512385, "epoch": 6173} {"train_loss": -27.20216178894043, "global_step": 512386, "epoch": 6173} {"train_loss": -27.051244735717773, "global_step": 512387, "epoch": 6173} {"train_loss": -26.820825576782227, "global_step": 512388, "epoch": 6173} {"train_loss": -27.58094596862793, "global_step": 512389, "epoch": 6173} {"train_loss": -27.038421630859375, "global_step": 512390, "epoch": 6173} {"train_loss": -27.12770652770996, "global_step": 512391, "epoch": 6173} {"train_loss": -27.078428268432617, "global_step": 512392, "epoch": 6173} {"train_loss": -27.35662841796875, "global_step": 512393, "epoch": 6173} {"train_loss": -27.513280868530273, "global_step": 512394, "epoch": 6173} {"train_loss": -27.18136978149414, "global_step": 512395, "epoch": 6173} {"train_loss": -27.284818649291992, "global_step": 512396, "epoch": 6173} {"train_loss": -27.489704132080078, "global_step": 512397, "epoch": 6173} {"train_loss": -27.596181869506836, "global_step": 512398, "epoch": 6173} {"train_loss": -27.54511070251465, "global_step": 512399, "epoch": 6173} {"train_loss": -27.72216796875, "global_step": 512400, "epoch": 6173} {"train_loss": -27.395727157592773, "global_step": 512401, "epoch": 6173} {"train_loss": -27.171161651611328, "global_step": 512402, "epoch": 6173} {"train_loss": -27.416370391845703, "global_step": 512403, "epoch": 6173} {"train_loss": -27.596729278564453, "global_step": 512404, "epoch": 6173} {"train_loss": -27.50662612915039, "global_step": 512405, "epoch": 6173} {"train_loss": -27.781116485595703, "global_step": 512406, "epoch": 6173} {"train_loss": -27.353057861328125, "global_step": 512407, "epoch": 6173} {"train_loss": -27.461042404174805, "global_step": 512408, "epoch": 6173} {"train_loss": -27.600141525268555, "global_step": 512409, "epoch": 6173} {"train_loss": -27.79252052307129, "global_step": 512410, "epoch": 6173} {"train_loss": -27.908185958862305, "global_step": 512411, "epoch": 6173} {"train_loss": -27.54291343688965, "global_step": 512412, "epoch": 6173} {"train_loss": -27.740209579467773, "global_step": 512413, "epoch": 6173} {"train_loss": -27.660871505737305, "global_step": 512414, "epoch": 6173} {"train_loss": -27.94384765625, "global_step": 512415, "epoch": 6173} {"train_loss": -27.72198486328125, "global_step": 512416, "epoch": 6173} {"train_loss": -27.48017692565918, "global_step": 512417, "epoch": 6173} {"train_loss": -27.741443634033203, "global_step": 512418, "epoch": 6173} {"train_loss": -27.769927978515625, "global_step": 512419, "epoch": 6173} {"train_loss": -27.694738388061523, "global_step": 512420, "epoch": 6173} {"train_loss": -27.754724502563477, "global_step": 512421, "epoch": 6173} {"train_loss": -27.6723575592041, "global_step": 512422, "epoch": 6173} {"train_loss": -27.911035537719727, "global_step": 512423, "epoch": 6173} {"train_loss": -27.86503028869629, "global_step": 512424, "epoch": 6173} {"train_loss": -27.862308502197266, "global_step": 512425, "epoch": 6173} {"train_loss": -27.746923446655273, "global_step": 512426, "epoch": 6173} {"train_loss": -27.67469596862793, "global_step": 512427, "epoch": 6173} {"train_loss": -27.773040771484375, "global_step": 512428, "epoch": 6173} {"train_loss": -27.617956161499023, "global_step": 512429, "epoch": 6173} {"train_loss": -28.003070831298828, "global_step": 512430, "epoch": 6173} {"train_loss": -27.531579971313477, "global_step": 512431, "epoch": 6173} {"train_loss": -27.381391525268555, "global_step": 512432, "epoch": 6173} {"train_loss": -27.525379180908203, "global_step": 512433, "epoch": 6173} {"train_loss": -27.846006393432617, "global_step": 512434, "epoch": 6173} {"train_loss": -27.617145538330078, "global_step": 512435, "epoch": 6173} {"train_loss": -27.901342391967773, "global_step": 512436, "epoch": 6173} {"train_loss": -28.234699249267578, "global_step": 512437, "epoch": 6173} {"train_loss": -27.531356811523438, "global_step": 512438, "epoch": 6173} {"train_loss": -27.695226669311523, "global_step": 512439, "epoch": 6173} {"train_loss": -27.6834716796875, "global_step": 512440, "epoch": 6173} {"train_loss": -27.19855974955731, "global_step": 512441, "epoch": 6173, "val_loss": 6666870.0} {"train_loss": -26.662158966064453, "global_step": 512442, "epoch": 6174} {"train_loss": -25.474506378173828, "global_step": 512443, "epoch": 6174} {"train_loss": -25.020477294921875, "global_step": 512444, "epoch": 6174} {"train_loss": -26.514816284179688, "global_step": 512445, "epoch": 6174} {"train_loss": -26.158105850219727, "global_step": 512446, "epoch": 6174} {"train_loss": -26.47743797302246, "global_step": 512447, "epoch": 6174} {"train_loss": -26.78693199157715, "global_step": 512448, "epoch": 6174} {"train_loss": -26.304981231689453, "global_step": 512449, "epoch": 6174} {"train_loss": -26.413877487182617, "global_step": 512450, "epoch": 6174} {"train_loss": -26.836017608642578, "global_step": 512451, "epoch": 6174} {"train_loss": -27.436222076416016, "global_step": 512452, "epoch": 6174} {"train_loss": -26.65302085876465, "global_step": 512453, "epoch": 6174} {"train_loss": -26.265329360961914, "global_step": 512454, "epoch": 6174} {"train_loss": -27.06150245666504, "global_step": 512455, "epoch": 6174} {"train_loss": -27.109548568725586, "global_step": 512456, "epoch": 6174} {"train_loss": -27.16163444519043, "global_step": 512457, "epoch": 6174} {"train_loss": -26.36427116394043, "global_step": 512458, "epoch": 6174} {"train_loss": -27.009641647338867, "global_step": 512459, "epoch": 6174} {"train_loss": -26.886777877807617, "global_step": 512460, "epoch": 6174} {"train_loss": -27.129602432250977, "global_step": 512461, "epoch": 6174} {"train_loss": -27.050708770751953, "global_step": 512462, "epoch": 6174} {"train_loss": -27.119068145751953, "global_step": 512463, "epoch": 6174} {"train_loss": -26.957717895507812, "global_step": 512464, "epoch": 6174} {"train_loss": -27.1193790435791, "global_step": 512465, "epoch": 6174} {"train_loss": -27.20001220703125, "global_step": 512466, "epoch": 6174} {"train_loss": -27.287267684936523, "global_step": 512467, "epoch": 6174} {"train_loss": -27.537586212158203, "global_step": 512468, "epoch": 6174} {"train_loss": -27.04447364807129, "global_step": 512469, "epoch": 6174} {"train_loss": -27.144216537475586, "global_step": 512470, "epoch": 6174} {"train_loss": -27.6916446685791, "global_step": 512471, "epoch": 6174} {"train_loss": -27.402502059936523, "global_step": 512472, "epoch": 6174} {"train_loss": -27.66376304626465, "global_step": 512473, "epoch": 6174} {"train_loss": -27.532007217407227, "global_step": 512474, "epoch": 6174} {"train_loss": -27.5905818939209, "global_step": 512475, "epoch": 6174} {"train_loss": -27.277912139892578, "global_step": 512476, "epoch": 6174} {"train_loss": -27.19044303894043, "global_step": 512477, "epoch": 6174} {"train_loss": -27.427099227905273, "global_step": 512478, "epoch": 6174} {"train_loss": -27.870121002197266, "global_step": 512479, "epoch": 6174} {"train_loss": -27.24788475036621, "global_step": 512480, "epoch": 6174} {"train_loss": -27.423994064331055, "global_step": 512481, "epoch": 6174} {"train_loss": -27.59894371032715, "global_step": 512482, "epoch": 6174} {"train_loss": -27.164438247680664, "global_step": 512483, "epoch": 6174} {"train_loss": -27.674148559570312, "global_step": 512484, "epoch": 6174} {"train_loss": -27.474695205688477, "global_step": 512485, "epoch": 6174} {"train_loss": -27.21112060546875, "global_step": 512486, "epoch": 6174} {"train_loss": -27.271677017211914, "global_step": 512487, "epoch": 6174} {"train_loss": -27.746417999267578, "global_step": 512488, "epoch": 6174} {"train_loss": -27.637842178344727, "global_step": 512489, "epoch": 6174} {"train_loss": -27.4123592376709, "global_step": 512490, "epoch": 6174} {"train_loss": -27.588123321533203, "global_step": 512491, "epoch": 6174} {"train_loss": -27.180347442626953, "global_step": 512492, "epoch": 6174} {"train_loss": -27.564558029174805, "global_step": 512493, "epoch": 6174} {"train_loss": -27.14973258972168, "global_step": 512494, "epoch": 6174} {"train_loss": -27.681137084960938, "global_step": 512495, "epoch": 6174} {"train_loss": -27.636260986328125, "global_step": 512496, "epoch": 6174} {"train_loss": -27.77680015563965, "global_step": 512497, "epoch": 6174} {"train_loss": -27.4310245513916, "global_step": 512498, "epoch": 6174} {"train_loss": -27.67767333984375, "global_step": 512499, "epoch": 6174} {"train_loss": -27.64322853088379, "global_step": 512500, "epoch": 6174} {"train_loss": -27.45454216003418, "global_step": 512501, "epoch": 6174} {"train_loss": -27.240310668945312, "global_step": 512502, "epoch": 6174} {"train_loss": -27.68353271484375, "global_step": 512503, "epoch": 6174} {"train_loss": -27.687763214111328, "global_step": 512504, "epoch": 6174} {"train_loss": -27.44815444946289, "global_step": 512505, "epoch": 6174} {"train_loss": -27.500879287719727, "global_step": 512506, "epoch": 6174} {"train_loss": -27.84977149963379, "global_step": 512507, "epoch": 6174} {"train_loss": -27.50778579711914, "global_step": 512508, "epoch": 6174} {"train_loss": -27.5640869140625, "global_step": 512509, "epoch": 6174} {"train_loss": -27.981369018554688, "global_step": 512510, "epoch": 6174} {"train_loss": -27.275928497314453, "global_step": 512511, "epoch": 6174} {"train_loss": -27.2731876373291, "global_step": 512512, "epoch": 6174} {"train_loss": -27.776899337768555, "global_step": 512513, "epoch": 6174} {"train_loss": -27.451574325561523, "global_step": 512514, "epoch": 6174} {"train_loss": -27.7789306640625, "global_step": 512515, "epoch": 6174} {"train_loss": -27.441740036010742, "global_step": 512516, "epoch": 6174} {"train_loss": -27.560171127319336, "global_step": 512517, "epoch": 6174} {"train_loss": -27.723785400390625, "global_step": 512518, "epoch": 6174} {"train_loss": -27.374359130859375, "global_step": 512519, "epoch": 6174} {"train_loss": -27.316604614257812, "global_step": 512520, "epoch": 6174} {"train_loss": -27.26350975036621, "global_step": 512521, "epoch": 6174} {"train_loss": -27.978628158569336, "global_step": 512522, "epoch": 6174} {"train_loss": -27.34291648864746, "global_step": 512523, "epoch": 6174} {"train_loss": -27.25482791303152, "global_step": 512524, "epoch": 6174, "val_loss": 6631336.0} {"train_loss": -26.860273361206055, "global_step": 512525, "epoch": 6175} {"train_loss": -26.933670043945312, "global_step": 512526, "epoch": 6175} {"train_loss": -26.798419952392578, "global_step": 512527, "epoch": 6175} {"train_loss": -27.069721221923828, "global_step": 512528, "epoch": 6175} {"train_loss": -27.108678817749023, "global_step": 512529, "epoch": 6175} {"train_loss": -26.958866119384766, "global_step": 512530, "epoch": 6175} {"train_loss": -27.511016845703125, "global_step": 512531, "epoch": 6175} {"train_loss": -26.796911239624023, "global_step": 512532, "epoch": 6175} {"train_loss": -26.828092575073242, "global_step": 512533, "epoch": 6175} {"train_loss": -26.9764461517334, "global_step": 512534, "epoch": 6175} {"train_loss": -26.847700119018555, "global_step": 512535, "epoch": 6175} {"train_loss": -26.91627311706543, "global_step": 512536, "epoch": 6175} {"train_loss": -27.07696533203125, "global_step": 512537, "epoch": 6175} {"train_loss": -27.158926010131836, "global_step": 512538, "epoch": 6175} {"train_loss": -27.252307891845703, "global_step": 512539, "epoch": 6175} {"train_loss": -27.303125381469727, "global_step": 512540, "epoch": 6175} {"train_loss": -27.356475830078125, "global_step": 512541, "epoch": 6175} {"train_loss": -27.59417724609375, "global_step": 512542, "epoch": 6175} {"train_loss": -26.835546493530273, "global_step": 512543, "epoch": 6175} {"train_loss": -27.378955841064453, "global_step": 512544, "epoch": 6175} {"train_loss": -27.34186363220215, "global_step": 512545, "epoch": 6175} {"train_loss": -27.2115478515625, "global_step": 512546, "epoch": 6175} {"train_loss": -27.317108154296875, "global_step": 512547, "epoch": 6175} {"train_loss": -27.16499137878418, "global_step": 512548, "epoch": 6175} {"train_loss": -27.217397689819336, "global_step": 512549, "epoch": 6175} {"train_loss": -27.223438262939453, "global_step": 512550, "epoch": 6175} {"train_loss": -27.083826065063477, "global_step": 512551, "epoch": 6175} {"train_loss": -27.522846221923828, "global_step": 512552, "epoch": 6175} {"train_loss": -27.647741317749023, "global_step": 512553, "epoch": 6175} {"train_loss": -27.355199813842773, "global_step": 512554, "epoch": 6175} {"train_loss": -27.501005172729492, "global_step": 512555, "epoch": 6175} {"train_loss": -27.29322624206543, "global_step": 512556, "epoch": 6175} {"train_loss": -27.557331085205078, "global_step": 512557, "epoch": 6175} {"train_loss": -27.43926429748535, "global_step": 512558, "epoch": 6175} {"train_loss": -27.59763526916504, "global_step": 512559, "epoch": 6175} {"train_loss": -27.578603744506836, "global_step": 512560, "epoch": 6175} {"train_loss": -27.71958351135254, "global_step": 512561, "epoch": 6175} {"train_loss": -27.302778244018555, "global_step": 512562, "epoch": 6175} {"train_loss": -27.834400177001953, "global_step": 512563, "epoch": 6175} {"train_loss": -27.4909725189209, "global_step": 512564, "epoch": 6175} {"train_loss": -27.457040786743164, "global_step": 512565, "epoch": 6175} {"train_loss": -27.73002052307129, "global_step": 512566, "epoch": 6175} {"train_loss": -27.554901123046875, "global_step": 512567, "epoch": 6175} {"train_loss": -28.050872802734375, "global_step": 512568, "epoch": 6175} {"train_loss": -27.773517608642578, "global_step": 512569, "epoch": 6175} {"train_loss": -27.564102172851562, "global_step": 512570, "epoch": 6175} {"train_loss": -27.3835391998291, "global_step": 512571, "epoch": 6175} {"train_loss": -27.58631706237793, "global_step": 512572, "epoch": 6175} {"train_loss": -27.263959884643555, "global_step": 512573, "epoch": 6175} {"train_loss": -27.806379318237305, "global_step": 512574, "epoch": 6175} {"train_loss": -27.508344650268555, "global_step": 512575, "epoch": 6175} {"train_loss": -27.682279586791992, "global_step": 512576, "epoch": 6175} {"train_loss": -27.610828399658203, "global_step": 512577, "epoch": 6175} {"train_loss": -27.60552978515625, "global_step": 512578, "epoch": 6175} {"train_loss": -27.203702926635742, "global_step": 512579, "epoch": 6175} {"train_loss": -27.586877822875977, "global_step": 512580, "epoch": 6175} {"train_loss": -27.733123779296875, "global_step": 512581, "epoch": 6175} {"train_loss": -27.336339950561523, "global_step": 512582, "epoch": 6175} {"train_loss": -27.495771408081055, "global_step": 512583, "epoch": 6175} {"train_loss": -27.333484649658203, "global_step": 512584, "epoch": 6175} {"train_loss": -27.2622127532959, "global_step": 512585, "epoch": 6175} {"train_loss": -27.404285430908203, "global_step": 512586, "epoch": 6175} {"train_loss": -27.919452667236328, "global_step": 512587, "epoch": 6175} {"train_loss": -27.582853317260742, "global_step": 512588, "epoch": 6175} {"train_loss": -27.414838790893555, "global_step": 512589, "epoch": 6175} {"train_loss": -27.474035263061523, "global_step": 512590, "epoch": 6175} {"train_loss": -27.61707878112793, "global_step": 512591, "epoch": 6175} {"train_loss": -27.536197662353516, "global_step": 512592, "epoch": 6175} {"train_loss": -27.392053604125977, "global_step": 512593, "epoch": 6175} {"train_loss": -27.386432647705078, "global_step": 512594, "epoch": 6175} {"train_loss": -27.417510986328125, "global_step": 512595, "epoch": 6175} {"train_loss": -27.3009090423584, "global_step": 512596, "epoch": 6175} {"train_loss": -27.41961669921875, "global_step": 512597, "epoch": 6175} {"train_loss": -27.70142936706543, "global_step": 512598, "epoch": 6175} {"train_loss": -27.940139770507812, "global_step": 512599, "epoch": 6175} {"train_loss": -27.653961181640625, "global_step": 512600, "epoch": 6175} {"train_loss": -27.539026260375977, "global_step": 512601, "epoch": 6175} {"train_loss": -27.83553123474121, "global_step": 512602, "epoch": 6175} {"train_loss": -27.493091583251953, "global_step": 512603, "epoch": 6175} {"train_loss": -27.663803100585938, "global_step": 512604, "epoch": 6175} {"train_loss": -27.839832305908203, "global_step": 512605, "epoch": 6175} {"train_loss": -27.543378829956055, "global_step": 512606, "epoch": 6175} {"train_loss": -27.429510783000165, "global_step": 512607, "epoch": 6175, "val_loss": 6604137.0} {"train_loss": -27.526935577392578, "global_step": 512608, "epoch": 6176} {"train_loss": -26.353933334350586, "global_step": 512609, "epoch": 6176} {"train_loss": -26.570606231689453, "global_step": 512610, "epoch": 6176} {"train_loss": -26.972248077392578, "global_step": 512611, "epoch": 6176} {"train_loss": -26.616662979125977, "global_step": 512612, "epoch": 6176} {"train_loss": -27.05426025390625, "global_step": 512613, "epoch": 6176} {"train_loss": -26.73406982421875, "global_step": 512614, "epoch": 6176} {"train_loss": -27.101367950439453, "global_step": 512615, "epoch": 6176} {"train_loss": -27.035480499267578, "global_step": 512616, "epoch": 6176} {"train_loss": -27.0833797454834, "global_step": 512617, "epoch": 6176} {"train_loss": -26.771352767944336, "global_step": 512618, "epoch": 6176} {"train_loss": -27.033802032470703, "global_step": 512619, "epoch": 6176} {"train_loss": -27.4184627532959, "global_step": 512620, "epoch": 6176} {"train_loss": -27.43050193786621, "global_step": 512621, "epoch": 6176} {"train_loss": -26.990615844726562, "global_step": 512622, "epoch": 6176} {"train_loss": -27.244306564331055, "global_step": 512623, "epoch": 6176} {"train_loss": -27.185285568237305, "global_step": 512624, "epoch": 6176} {"train_loss": -27.53077507019043, "global_step": 512625, "epoch": 6176} {"train_loss": -27.100879669189453, "global_step": 512626, "epoch": 6176} {"train_loss": -27.614765167236328, "global_step": 512627, "epoch": 6176} {"train_loss": -27.586658477783203, "global_step": 512628, "epoch": 6176} {"train_loss": -27.2412166595459, "global_step": 512629, "epoch": 6176} {"train_loss": -27.54254722595215, "global_step": 512630, "epoch": 6176} {"train_loss": -27.234283447265625, "global_step": 512631, "epoch": 6176} {"train_loss": -27.083057403564453, "global_step": 512632, "epoch": 6176} {"train_loss": -27.02094078063965, "global_step": 512633, "epoch": 6176} {"train_loss": -27.467985153198242, "global_step": 512634, "epoch": 6176} {"train_loss": -27.106536865234375, "global_step": 512635, "epoch": 6176} {"train_loss": -27.464466094970703, "global_step": 512636, "epoch": 6176} {"train_loss": -27.54695701599121, "global_step": 512637, "epoch": 6176} {"train_loss": -27.694822311401367, "global_step": 512638, "epoch": 6176} {"train_loss": -27.809284210205078, "global_step": 512639, "epoch": 6176} {"train_loss": -27.565542221069336, "global_step": 512640, "epoch": 6176} {"train_loss": -27.223386764526367, "global_step": 512641, "epoch": 6176} {"train_loss": -27.49751091003418, "global_step": 512642, "epoch": 6176} {"train_loss": -27.090595245361328, "global_step": 512643, "epoch": 6176} {"train_loss": -27.317487716674805, "global_step": 512644, "epoch": 6176} {"train_loss": -27.405858993530273, "global_step": 512645, "epoch": 6176} {"train_loss": -27.4305419921875, "global_step": 512646, "epoch": 6176} {"train_loss": -27.37336540222168, "global_step": 512647, "epoch": 6176} {"train_loss": -27.5938777923584, "global_step": 512648, "epoch": 6176} {"train_loss": -27.888113021850586, "global_step": 512649, "epoch": 6176} {"train_loss": -27.8143310546875, "global_step": 512650, "epoch": 6176} {"train_loss": -27.83002281188965, "global_step": 512651, "epoch": 6176} {"train_loss": -27.936676025390625, "global_step": 512652, "epoch": 6176} {"train_loss": -27.656585693359375, "global_step": 512653, "epoch": 6176} {"train_loss": -27.775983810424805, "global_step": 512654, "epoch": 6176} {"train_loss": -27.33868408203125, "global_step": 512655, "epoch": 6176} {"train_loss": -27.715871810913086, "global_step": 512656, "epoch": 6176} {"train_loss": -27.599695205688477, "global_step": 512657, "epoch": 6176} {"train_loss": -27.51625633239746, "global_step": 512658, "epoch": 6176} {"train_loss": -27.396047592163086, "global_step": 512659, "epoch": 6176} {"train_loss": -27.654905319213867, "global_step": 512660, "epoch": 6176} {"train_loss": -28.003742218017578, "global_step": 512661, "epoch": 6176} {"train_loss": -27.48822021484375, "global_step": 512662, "epoch": 6176} {"train_loss": -27.6619930267334, "global_step": 512663, "epoch": 6176} {"train_loss": -27.1885986328125, "global_step": 512664, "epoch": 6176} {"train_loss": -27.68390464782715, "global_step": 512665, "epoch": 6176} {"train_loss": -27.139631271362305, "global_step": 512666, "epoch": 6176} {"train_loss": -27.38765525817871, "global_step": 512667, "epoch": 6176} {"train_loss": -27.704822540283203, "global_step": 512668, "epoch": 6176} {"train_loss": -27.834455490112305, "global_step": 512669, "epoch": 6176} {"train_loss": -26.88276481628418, "global_step": 512670, "epoch": 6176} {"train_loss": -27.75821876525879, "global_step": 512671, "epoch": 6176} {"train_loss": -27.52386474609375, "global_step": 512672, "epoch": 6176} {"train_loss": -27.368024826049805, "global_step": 512673, "epoch": 6176} {"train_loss": -27.27296257019043, "global_step": 512674, "epoch": 6176} {"train_loss": -27.424890518188477, "global_step": 512675, "epoch": 6176} {"train_loss": -27.549091339111328, "global_step": 512676, "epoch": 6176} {"train_loss": -27.651548385620117, "global_step": 512677, "epoch": 6176} {"train_loss": -27.65204429626465, "global_step": 512678, "epoch": 6176} {"train_loss": -27.272125244140625, "global_step": 512679, "epoch": 6176} {"train_loss": -27.789777755737305, "global_step": 512680, "epoch": 6176} {"train_loss": -27.964101791381836, "global_step": 512681, "epoch": 6176} {"train_loss": -27.84592628479004, "global_step": 512682, "epoch": 6176} {"train_loss": -27.512826919555664, "global_step": 512683, "epoch": 6176} {"train_loss": -27.402830123901367, "global_step": 512684, "epoch": 6176} {"train_loss": -27.380908966064453, "global_step": 512685, "epoch": 6176} {"train_loss": -27.781543731689453, "global_step": 512686, "epoch": 6176} {"train_loss": -27.755706787109375, "global_step": 512687, "epoch": 6176} {"train_loss": -27.877044677734375, "global_step": 512688, "epoch": 6176} {"train_loss": -27.568103790283203, "global_step": 512689, "epoch": 6176} {"train_loss": -27.4007127141378, "global_step": 512690, "epoch": 6176, "val_loss": 6598477.0} {"train_loss": -27.269662857055664, "global_step": 512691, "epoch": 6177} {"train_loss": -26.798810958862305, "global_step": 512692, "epoch": 6177} {"train_loss": -26.853759765625, "global_step": 512693, "epoch": 6177} {"train_loss": -26.9532413482666, "global_step": 512694, "epoch": 6177} {"train_loss": -27.171430587768555, "global_step": 512695, "epoch": 6177} {"train_loss": -27.01166343688965, "global_step": 512696, "epoch": 6177} {"train_loss": -26.85346031188965, "global_step": 512697, "epoch": 6177} {"train_loss": -27.076099395751953, "global_step": 512698, "epoch": 6177} {"train_loss": -26.49534034729004, "global_step": 512699, "epoch": 6177} {"train_loss": -26.88298988342285, "global_step": 512700, "epoch": 6177} {"train_loss": -27.07517433166504, "global_step": 512701, "epoch": 6177} {"train_loss": -26.677305221557617, "global_step": 512702, "epoch": 6177} {"train_loss": -27.375152587890625, "global_step": 512703, "epoch": 6177} {"train_loss": -27.042388916015625, "global_step": 512704, "epoch": 6177} {"train_loss": -27.282764434814453, "global_step": 512705, "epoch": 6177} {"train_loss": -27.233551025390625, "global_step": 512706, "epoch": 6177} {"train_loss": -27.517004013061523, "global_step": 512707, "epoch": 6177} {"train_loss": -27.295150756835938, "global_step": 512708, "epoch": 6177} {"train_loss": -27.391550064086914, "global_step": 512709, "epoch": 6177} {"train_loss": -27.292438507080078, "global_step": 512710, "epoch": 6177} {"train_loss": -27.783117294311523, "global_step": 512711, "epoch": 6177} {"train_loss": -27.149871826171875, "global_step": 512712, "epoch": 6177} {"train_loss": -27.487226486206055, "global_step": 512713, "epoch": 6177} {"train_loss": -27.270893096923828, "global_step": 512714, "epoch": 6177} {"train_loss": -26.98078727722168, "global_step": 512715, "epoch": 6177} {"train_loss": -27.441564559936523, "global_step": 512716, "epoch": 6177} {"train_loss": -27.494281768798828, "global_step": 512717, "epoch": 6177} {"train_loss": -27.482696533203125, "global_step": 512718, "epoch": 6177} {"train_loss": -27.5891170501709, "global_step": 512719, "epoch": 6177} {"train_loss": -27.723072052001953, "global_step": 512720, "epoch": 6177} {"train_loss": -27.437353134155273, "global_step": 512721, "epoch": 6177} {"train_loss": -27.40778160095215, "global_step": 512722, "epoch": 6177} {"train_loss": -27.304462432861328, "global_step": 512723, "epoch": 6177} {"train_loss": -27.34589958190918, "global_step": 512724, "epoch": 6177} {"train_loss": -27.222156524658203, "global_step": 512725, "epoch": 6177} {"train_loss": -27.568679809570312, "global_step": 512726, "epoch": 6177} {"train_loss": -27.108137130737305, "global_step": 512727, "epoch": 6177} {"train_loss": -27.325284957885742, "global_step": 512728, "epoch": 6177} {"train_loss": -27.52351188659668, "global_step": 512729, "epoch": 6177} {"train_loss": -27.677045822143555, "global_step": 512730, "epoch": 6177} {"train_loss": -27.413349151611328, "global_step": 512731, "epoch": 6177} {"train_loss": -27.6744384765625, "global_step": 512732, "epoch": 6177} {"train_loss": -27.545888900756836, "global_step": 512733, "epoch": 6177} {"train_loss": -27.5747013092041, "global_step": 512734, "epoch": 6177} {"train_loss": -27.690673828125, "global_step": 512735, "epoch": 6177} {"train_loss": -27.732770919799805, "global_step": 512736, "epoch": 6177} {"train_loss": -27.743383407592773, "global_step": 512737, "epoch": 6177} {"train_loss": -27.409650802612305, "global_step": 512738, "epoch": 6177} {"train_loss": -27.549423217773438, "global_step": 512739, "epoch": 6177} {"train_loss": -27.2592716217041, "global_step": 512740, "epoch": 6177} {"train_loss": -27.54971694946289, "global_step": 512741, "epoch": 6177} {"train_loss": -27.176959991455078, "global_step": 512742, "epoch": 6177} {"train_loss": -27.08998680114746, "global_step": 512743, "epoch": 6177} {"train_loss": -27.478296279907227, "global_step": 512744, "epoch": 6177} {"train_loss": -27.56624412536621, "global_step": 512745, "epoch": 6177} {"train_loss": -27.26930046081543, "global_step": 512746, "epoch": 6177} {"train_loss": -27.26654624938965, "global_step": 512747, "epoch": 6177} {"train_loss": -27.311426162719727, "global_step": 512748, "epoch": 6177} {"train_loss": -27.347692489624023, "global_step": 512749, "epoch": 6177} {"train_loss": -27.120407104492188, "global_step": 512750, "epoch": 6177} {"train_loss": -27.43104362487793, "global_step": 512751, "epoch": 6177} {"train_loss": -27.77362632751465, "global_step": 512752, "epoch": 6177} {"train_loss": -27.300830841064453, "global_step": 512753, "epoch": 6177} {"train_loss": -27.42976188659668, "global_step": 512754, "epoch": 6177} {"train_loss": -27.49323081970215, "global_step": 512755, "epoch": 6177} {"train_loss": -27.536901473999023, "global_step": 512756, "epoch": 6177} {"train_loss": -27.774587631225586, "global_step": 512757, "epoch": 6177} {"train_loss": -27.58064079284668, "global_step": 512758, "epoch": 6177} {"train_loss": -27.507299423217773, "global_step": 512759, "epoch": 6177} {"train_loss": -27.600147247314453, "global_step": 512760, "epoch": 6177} {"train_loss": -27.513107299804688, "global_step": 512761, "epoch": 6177} {"train_loss": -27.33991813659668, "global_step": 512762, "epoch": 6177} {"train_loss": -27.46319580078125, "global_step": 512763, "epoch": 6177} {"train_loss": -27.248823165893555, "global_step": 512764, "epoch": 6177} {"train_loss": -27.023502349853516, "global_step": 512765, "epoch": 6177} {"train_loss": -27.696741104125977, "global_step": 512766, "epoch": 6177} {"train_loss": -27.104969024658203, "global_step": 512767, "epoch": 6177} {"train_loss": -27.088520050048828, "global_step": 512768, "epoch": 6177} {"train_loss": -27.15581703186035, "global_step": 512769, "epoch": 6177} {"train_loss": -27.453662872314453, "global_step": 512770, "epoch": 6177} {"train_loss": -27.182174682617188, "global_step": 512771, "epoch": 6177} {"train_loss": -27.494958877563477, "global_step": 512772, "epoch": 6177} {"train_loss": -27.341708930141955, "global_step": 512773, "epoch": 6177, "val_loss": 6456412.5} {"train_loss": -25.420604705810547, "global_step": 512774, "epoch": 6178} {"train_loss": -24.53617286682129, "global_step": 512775, "epoch": 6178} {"train_loss": -25.510831832885742, "global_step": 512776, "epoch": 6178} {"train_loss": -25.5367431640625, "global_step": 512777, "epoch": 6178} {"train_loss": -25.2406005859375, "global_step": 512778, "epoch": 6178} {"train_loss": -26.4189510345459, "global_step": 512779, "epoch": 6178} {"train_loss": -26.175168991088867, "global_step": 512780, "epoch": 6178} {"train_loss": -26.52509117126465, "global_step": 512781, "epoch": 6178} {"train_loss": -26.175546646118164, "global_step": 512782, "epoch": 6178} {"train_loss": -26.633655548095703, "global_step": 512783, "epoch": 6178} {"train_loss": -26.971561431884766, "global_step": 512784, "epoch": 6178} {"train_loss": -26.61519432067871, "global_step": 512785, "epoch": 6178} {"train_loss": -26.3232364654541, "global_step": 512786, "epoch": 6178} {"train_loss": -26.624155044555664, "global_step": 512787, "epoch": 6178} {"train_loss": -26.90900230407715, "global_step": 512788, "epoch": 6178} {"train_loss": -26.6149845123291, "global_step": 512789, "epoch": 6178} {"train_loss": -26.544239044189453, "global_step": 512790, "epoch": 6178} {"train_loss": -26.65642738342285, "global_step": 512791, "epoch": 6178} {"train_loss": -26.635019302368164, "global_step": 512792, "epoch": 6178} {"train_loss": -26.75058937072754, "global_step": 512793, "epoch": 6178} {"train_loss": -26.625965118408203, "global_step": 512794, "epoch": 6178} {"train_loss": -26.945178985595703, "global_step": 512795, "epoch": 6178} {"train_loss": -26.9697322845459, "global_step": 512796, "epoch": 6178} {"train_loss": -27.34454345703125, "global_step": 512797, "epoch": 6178} {"train_loss": -26.90696144104004, "global_step": 512798, "epoch": 6178} {"train_loss": -27.26523780822754, "global_step": 512799, "epoch": 6178} {"train_loss": -27.06159782409668, "global_step": 512800, "epoch": 6178} {"train_loss": -27.09726905822754, "global_step": 512801, "epoch": 6178} {"train_loss": -27.25825309753418, "global_step": 512802, "epoch": 6178} {"train_loss": -27.180084228515625, "global_step": 512803, "epoch": 6178} {"train_loss": -27.095733642578125, "global_step": 512804, "epoch": 6178} {"train_loss": -26.94990348815918, "global_step": 512805, "epoch": 6178} {"train_loss": -27.090564727783203, "global_step": 512806, "epoch": 6178} {"train_loss": -27.545984268188477, "global_step": 512807, "epoch": 6178} {"train_loss": -27.405088424682617, "global_step": 512808, "epoch": 6178} {"train_loss": -27.664403915405273, "global_step": 512809, "epoch": 6178} {"train_loss": -27.607091903686523, "global_step": 512810, "epoch": 6178} {"train_loss": -27.50897216796875, "global_step": 512811, "epoch": 6178} {"train_loss": -27.25665283203125, "global_step": 512812, "epoch": 6178} {"train_loss": -27.59229850769043, "global_step": 512813, "epoch": 6178} {"train_loss": -27.837146759033203, "global_step": 512814, "epoch": 6178} {"train_loss": -27.42024803161621, "global_step": 512815, "epoch": 6178} {"train_loss": -27.350025177001953, "global_step": 512816, "epoch": 6178} {"train_loss": -27.469482421875, "global_step": 512817, "epoch": 6178} {"train_loss": -27.30130958557129, "global_step": 512818, "epoch": 6178} {"train_loss": -27.394506454467773, "global_step": 512819, "epoch": 6178} {"train_loss": -27.280710220336914, "global_step": 512820, "epoch": 6178} {"train_loss": -27.629974365234375, "global_step": 512821, "epoch": 6178} {"train_loss": -27.465518951416016, "global_step": 512822, "epoch": 6178} {"train_loss": -27.694690704345703, "global_step": 512823, "epoch": 6178} {"train_loss": -28.017715454101562, "global_step": 512824, "epoch": 6178} {"train_loss": -27.649845123291016, "global_step": 512825, "epoch": 6178} {"train_loss": -27.6497745513916, "global_step": 512826, "epoch": 6178} {"train_loss": -27.66058349609375, "global_step": 512827, "epoch": 6178} {"train_loss": -27.588491439819336, "global_step": 512828, "epoch": 6178} {"train_loss": -27.42484474182129, "global_step": 512829, "epoch": 6178} {"train_loss": -27.63189697265625, "global_step": 512830, "epoch": 6178} {"train_loss": -27.569284439086914, "global_step": 512831, "epoch": 6178} {"train_loss": -27.825916290283203, "global_step": 512832, "epoch": 6178} {"train_loss": -27.52167320251465, "global_step": 512833, "epoch": 6178} {"train_loss": -27.574731826782227, "global_step": 512834, "epoch": 6178} {"train_loss": -27.587743759155273, "global_step": 512835, "epoch": 6178} {"train_loss": -27.891361236572266, "global_step": 512836, "epoch": 6178} {"train_loss": -28.00813102722168, "global_step": 512837, "epoch": 6178} {"train_loss": -27.650671005249023, "global_step": 512838, "epoch": 6178} {"train_loss": -27.82559585571289, "global_step": 512839, "epoch": 6178} {"train_loss": -27.698484420776367, "global_step": 512840, "epoch": 6178} {"train_loss": -27.556732177734375, "global_step": 512841, "epoch": 6178} {"train_loss": -27.593677520751953, "global_step": 512842, "epoch": 6178} {"train_loss": -27.833288192749023, "global_step": 512843, "epoch": 6178} {"train_loss": -27.707569122314453, "global_step": 512844, "epoch": 6178} {"train_loss": -27.422040939331055, "global_step": 512845, "epoch": 6178} {"train_loss": -27.76315689086914, "global_step": 512846, "epoch": 6178} {"train_loss": -27.567264556884766, "global_step": 512847, "epoch": 6178} {"train_loss": -27.408390045166016, "global_step": 512848, "epoch": 6178} {"train_loss": -27.7109317779541, "global_step": 512849, "epoch": 6178} {"train_loss": -27.289709091186523, "global_step": 512850, "epoch": 6178} {"train_loss": -27.502643585205078, "global_step": 512851, "epoch": 6178} {"train_loss": -27.340246200561523, "global_step": 512852, "epoch": 6178} {"train_loss": -27.272754669189453, "global_step": 512853, "epoch": 6178} {"train_loss": -27.565250396728516, "global_step": 512854, "epoch": 6178} {"train_loss": -27.094003677368164, "global_step": 512855, "epoch": 6178} {"train_loss": -27.16406679727945, "global_step": 512856, "epoch": 6178, "val_loss": 6607582.0} {"train_loss": -26.07461929321289, "global_step": 512857, "epoch": 6179} {"train_loss": -24.786291122436523, "global_step": 512858, "epoch": 6179} {"train_loss": -25.7576904296875, "global_step": 512859, "epoch": 6179} {"train_loss": -25.5770206451416, "global_step": 512860, "epoch": 6179} {"train_loss": -26.528295516967773, "global_step": 512861, "epoch": 6179} {"train_loss": -26.33627700805664, "global_step": 512862, "epoch": 6179} {"train_loss": -26.719167709350586, "global_step": 512863, "epoch": 6179} {"train_loss": -26.448272705078125, "global_step": 512864, "epoch": 6179} {"train_loss": -26.99285316467285, "global_step": 512865, "epoch": 6179} {"train_loss": -26.929183959960938, "global_step": 512866, "epoch": 6179} {"train_loss": -26.6032772064209, "global_step": 512867, "epoch": 6179} {"train_loss": -26.818470001220703, "global_step": 512868, "epoch": 6179} {"train_loss": -26.867542266845703, "global_step": 512869, "epoch": 6179} {"train_loss": -27.34537696838379, "global_step": 512870, "epoch": 6179} {"train_loss": -27.050703048706055, "global_step": 512871, "epoch": 6179} {"train_loss": -26.730457305908203, "global_step": 512872, "epoch": 6179} {"train_loss": -27.113351821899414, "global_step": 512873, "epoch": 6179} {"train_loss": -27.124937057495117, "global_step": 512874, "epoch": 6179} {"train_loss": -27.169843673706055, "global_step": 512875, "epoch": 6179} {"train_loss": -27.21527671813965, "global_step": 512876, "epoch": 6179} {"train_loss": -26.90934181213379, "global_step": 512877, "epoch": 6179} {"train_loss": -27.1506404876709, "global_step": 512878, "epoch": 6179} {"train_loss": -27.051572799682617, "global_step": 512879, "epoch": 6179} {"train_loss": -27.2778377532959, "global_step": 512880, "epoch": 6179} {"train_loss": -27.2890625, "global_step": 512881, "epoch": 6179} {"train_loss": -26.834569931030273, "global_step": 512882, "epoch": 6179} {"train_loss": -27.10186195373535, "global_step": 512883, "epoch": 6179} {"train_loss": -27.24139404296875, "global_step": 512884, "epoch": 6179} {"train_loss": -27.238977432250977, "global_step": 512885, "epoch": 6179} {"train_loss": -27.774805068969727, "global_step": 512886, "epoch": 6179} {"train_loss": -27.313007354736328, "global_step": 512887, "epoch": 6179} {"train_loss": -27.43303871154785, "global_step": 512888, "epoch": 6179} {"train_loss": -27.204334259033203, "global_step": 512889, "epoch": 6179} {"train_loss": -26.865360260009766, "global_step": 512890, "epoch": 6179} {"train_loss": -27.422672271728516, "global_step": 512891, "epoch": 6179} {"train_loss": -27.52411460876465, "global_step": 512892, "epoch": 6179} {"train_loss": -27.197265625, "global_step": 512893, "epoch": 6179} {"train_loss": -27.588104248046875, "global_step": 512894, "epoch": 6179} {"train_loss": -27.13618278503418, "global_step": 512895, "epoch": 6179} {"train_loss": -27.133249282836914, "global_step": 512896, "epoch": 6179} {"train_loss": -27.42129898071289, "global_step": 512897, "epoch": 6179} {"train_loss": -27.62281608581543, "global_step": 512898, "epoch": 6179} {"train_loss": -27.263879776000977, "global_step": 512899, "epoch": 6179} {"train_loss": -27.548480987548828, "global_step": 512900, "epoch": 6179} {"train_loss": -27.697650909423828, "global_step": 512901, "epoch": 6179} {"train_loss": -27.59967613220215, "global_step": 512902, "epoch": 6179} {"train_loss": -27.683073043823242, "global_step": 512903, "epoch": 6179} {"train_loss": -27.544605255126953, "global_step": 512904, "epoch": 6179} {"train_loss": -27.84006118774414, "global_step": 512905, "epoch": 6179} {"train_loss": -27.958683013916016, "global_step": 512906, "epoch": 6179} {"train_loss": -27.22467041015625, "global_step": 512907, "epoch": 6179} {"train_loss": -27.854032516479492, "global_step": 512908, "epoch": 6179} {"train_loss": -27.566190719604492, "global_step": 512909, "epoch": 6179} {"train_loss": -27.815404891967773, "global_step": 512910, "epoch": 6179} {"train_loss": -28.023868560791016, "global_step": 512911, "epoch": 6179} {"train_loss": -27.887540817260742, "global_step": 512912, "epoch": 6179} {"train_loss": -27.571197509765625, "global_step": 512913, "epoch": 6179} {"train_loss": -27.494953155517578, "global_step": 512914, "epoch": 6179} {"train_loss": -27.80853843688965, "global_step": 512915, "epoch": 6179} {"train_loss": -27.59604835510254, "global_step": 512916, "epoch": 6179} {"train_loss": -27.693449020385742, "global_step": 512917, "epoch": 6179} {"train_loss": -27.842132568359375, "global_step": 512918, "epoch": 6179} {"train_loss": -27.428537368774414, "global_step": 512919, "epoch": 6179} {"train_loss": -27.678741455078125, "global_step": 512920, "epoch": 6179} {"train_loss": -27.442779541015625, "global_step": 512921, "epoch": 6179} {"train_loss": -27.432764053344727, "global_step": 512922, "epoch": 6179} {"train_loss": -27.28826904296875, "global_step": 512923, "epoch": 6179} {"train_loss": -27.476211547851562, "global_step": 512924, "epoch": 6179} {"train_loss": -27.488956451416016, "global_step": 512925, "epoch": 6179} {"train_loss": -27.473926544189453, "global_step": 512926, "epoch": 6179} {"train_loss": -27.358722686767578, "global_step": 512927, "epoch": 6179} {"train_loss": -27.45488929748535, "global_step": 512928, "epoch": 6179} {"train_loss": -27.550281524658203, "global_step": 512929, "epoch": 6179} {"train_loss": -27.85589599609375, "global_step": 512930, "epoch": 6179} {"train_loss": -27.57447624206543, "global_step": 512931, "epoch": 6179} {"train_loss": -27.561498641967773, "global_step": 512932, "epoch": 6179} {"train_loss": -27.170679092407227, "global_step": 512933, "epoch": 6179} {"train_loss": -26.995527267456055, "global_step": 512934, "epoch": 6179} {"train_loss": -26.491363525390625, "global_step": 512935, "epoch": 6179} {"train_loss": -27.642499923706055, "global_step": 512936, "epoch": 6179} {"train_loss": -26.819860458374023, "global_step": 512937, "epoch": 6179} {"train_loss": -26.45343589782715, "global_step": 512938, "epoch": 6179} {"train_loss": -27.20310958035021, "global_step": 512939, "epoch": 6179, "val_loss": 6541047.0} {"train_loss": -23.24355125427246, "global_step": 512940, "epoch": 6180} {"train_loss": -23.1276912689209, "global_step": 512941, "epoch": 6180} {"train_loss": -26.124486923217773, "global_step": 512942, "epoch": 6180} {"train_loss": -23.86903953552246, "global_step": 512943, "epoch": 6180} {"train_loss": -24.768783569335938, "global_step": 512944, "epoch": 6180} {"train_loss": -24.80326271057129, "global_step": 512945, "epoch": 6180} {"train_loss": -24.922765731811523, "global_step": 512946, "epoch": 6180} {"train_loss": -24.70101547241211, "global_step": 512947, "epoch": 6180} {"train_loss": -25.499248504638672, "global_step": 512948, "epoch": 6180} {"train_loss": -25.533889770507812, "global_step": 512949, "epoch": 6180} {"train_loss": -25.149017333984375, "global_step": 512950, "epoch": 6180} {"train_loss": -25.80975914001465, "global_step": 512951, "epoch": 6180} {"train_loss": -25.627460479736328, "global_step": 512952, "epoch": 6180} {"train_loss": -25.992746353149414, "global_step": 512953, "epoch": 6180} {"train_loss": -26.4848690032959, "global_step": 512954, "epoch": 6180} {"train_loss": -25.711536407470703, "global_step": 512955, "epoch": 6180} {"train_loss": -26.091018676757812, "global_step": 512956, "epoch": 6180} {"train_loss": -26.350812911987305, "global_step": 512957, "epoch": 6180} {"train_loss": -25.930566787719727, "global_step": 512958, "epoch": 6180} {"train_loss": -26.221588134765625, "global_step": 512959, "epoch": 6180} {"train_loss": -26.259672164916992, "global_step": 512960, "epoch": 6180} {"train_loss": -25.7573299407959, "global_step": 512961, "epoch": 6180} {"train_loss": -26.180694580078125, "global_step": 512962, "epoch": 6180} {"train_loss": -26.323835372924805, "global_step": 512963, "epoch": 6180} {"train_loss": -26.58115005493164, "global_step": 512964, "epoch": 6180} {"train_loss": -26.44178581237793, "global_step": 512965, "epoch": 6180} {"train_loss": -26.420093536376953, "global_step": 512966, "epoch": 6180} {"train_loss": -26.39656639099121, "global_step": 512967, "epoch": 6180} {"train_loss": -26.4998779296875, "global_step": 512968, "epoch": 6180} {"train_loss": -26.5953426361084, "global_step": 512969, "epoch": 6180} {"train_loss": -26.64715576171875, "global_step": 512970, "epoch": 6180} {"train_loss": -26.783695220947266, "global_step": 512971, "epoch": 6180} {"train_loss": -26.99622917175293, "global_step": 512972, "epoch": 6180} {"train_loss": -26.771947860717773, "global_step": 512973, "epoch": 6180} {"train_loss": -27.085357666015625, "global_step": 512974, "epoch": 6180} {"train_loss": -26.613147735595703, "global_step": 512975, "epoch": 6180} {"train_loss": -27.18494987487793, "global_step": 512976, "epoch": 6180} {"train_loss": -26.91132926940918, "global_step": 512977, "epoch": 6180} {"train_loss": -26.966527938842773, "global_step": 512978, "epoch": 6180} {"train_loss": -27.051227569580078, "global_step": 512979, "epoch": 6180} {"train_loss": -26.887128829956055, "global_step": 512980, "epoch": 6180} {"train_loss": -27.399188995361328, "global_step": 512981, "epoch": 6180} {"train_loss": -26.76521110534668, "global_step": 512982, "epoch": 6180} {"train_loss": -27.170978546142578, "global_step": 512983, "epoch": 6180} {"train_loss": -27.319522857666016, "global_step": 512984, "epoch": 6180} {"train_loss": -27.275665283203125, "global_step": 512985, "epoch": 6180} {"train_loss": -27.367694854736328, "global_step": 512986, "epoch": 6180} {"train_loss": -27.686634063720703, "global_step": 512987, "epoch": 6180} {"train_loss": -27.328893661499023, "global_step": 512988, "epoch": 6180} {"train_loss": -27.46514892578125, "global_step": 512989, "epoch": 6180} {"train_loss": -27.57925796508789, "global_step": 512990, "epoch": 6180} {"train_loss": -27.540393829345703, "global_step": 512991, "epoch": 6180} {"train_loss": -27.596668243408203, "global_step": 512992, "epoch": 6180} {"train_loss": -27.70423698425293, "global_step": 512993, "epoch": 6180} {"train_loss": -27.36067008972168, "global_step": 512994, "epoch": 6180} {"train_loss": -27.049060821533203, "global_step": 512995, "epoch": 6180} {"train_loss": -27.235132217407227, "global_step": 512996, "epoch": 6180} {"train_loss": -27.551258087158203, "global_step": 512997, "epoch": 6180} {"train_loss": -27.445602416992188, "global_step": 512998, "epoch": 6180} {"train_loss": -27.5694580078125, "global_step": 512999, "epoch": 6180} {"train_loss": -27.46821403503418, "global_step": 513000, "epoch": 6180} {"train_loss": -27.755435943603516, "global_step": 513001, "epoch": 6180} {"train_loss": -27.66974449157715, "global_step": 513002, "epoch": 6180} {"train_loss": -27.86060905456543, "global_step": 513003, "epoch": 6180} {"train_loss": -27.666595458984375, "global_step": 513004, "epoch": 6180} {"train_loss": -27.6614933013916, "global_step": 513005, "epoch": 6180} {"train_loss": -27.776752471923828, "global_step": 513006, "epoch": 6180} {"train_loss": -27.416746139526367, "global_step": 513007, "epoch": 6180} {"train_loss": -27.410348892211914, "global_step": 513008, "epoch": 6180} {"train_loss": -27.46347427368164, "global_step": 513009, "epoch": 6180} {"train_loss": -27.488407135009766, "global_step": 513010, "epoch": 6180} {"train_loss": -27.527099609375, "global_step": 513011, "epoch": 6180} {"train_loss": -27.29701042175293, "global_step": 513012, "epoch": 6180} {"train_loss": -26.71819496154785, "global_step": 513013, "epoch": 6180} {"train_loss": -27.12698745727539, "global_step": 513014, "epoch": 6180} {"train_loss": -27.18372917175293, "global_step": 513015, "epoch": 6180} {"train_loss": -27.628747940063477, "global_step": 513016, "epoch": 6180} {"train_loss": -27.862791061401367, "global_step": 513017, "epoch": 6180} {"train_loss": -26.962360382080078, "global_step": 513018, "epoch": 6180} {"train_loss": -27.57406997680664, "global_step": 513019, "epoch": 6180} {"train_loss": -27.29117774963379, "global_step": 513020, "epoch": 6180} {"train_loss": -27.763885498046875, "global_step": 513021, "epoch": 6180} {"train_loss": -26.72449612904744, "global_step": 513022, "epoch": 6180, "val_loss": 6448827.5} {"train_loss": -26.199874877929688, "global_step": 513023, "epoch": 6181} {"train_loss": -25.470815658569336, "global_step": 513024, "epoch": 6181} {"train_loss": -27.001815795898438, "global_step": 513025, "epoch": 6181} {"train_loss": -26.2781925201416, "global_step": 513026, "epoch": 6181} {"train_loss": -25.303861618041992, "global_step": 513027, "epoch": 6181} {"train_loss": -26.186487197875977, "global_step": 513028, "epoch": 6181} {"train_loss": -25.972278594970703, "global_step": 513029, "epoch": 6181} {"train_loss": -25.994705200195312, "global_step": 513030, "epoch": 6181} {"train_loss": -26.28058433532715, "global_step": 513031, "epoch": 6181} {"train_loss": -26.10532569885254, "global_step": 513032, "epoch": 6181} {"train_loss": -26.08522605895996, "global_step": 513033, "epoch": 6181} {"train_loss": -26.24778175354004, "global_step": 513034, "epoch": 6181} {"train_loss": -26.298269271850586, "global_step": 513035, "epoch": 6181} {"train_loss": -26.72135353088379, "global_step": 513036, "epoch": 6181} {"train_loss": -26.83721923828125, "global_step": 513037, "epoch": 6181} {"train_loss": -26.28553581237793, "global_step": 513038, "epoch": 6181} {"train_loss": -26.559865951538086, "global_step": 513039, "epoch": 6181} {"train_loss": -26.840051651000977, "global_step": 513040, "epoch": 6181} {"train_loss": -26.417699813842773, "global_step": 513041, "epoch": 6181} {"train_loss": -26.571008682250977, "global_step": 513042, "epoch": 6181} {"train_loss": -26.80929946899414, "global_step": 513043, "epoch": 6181} {"train_loss": -26.54560661315918, "global_step": 513044, "epoch": 6181} {"train_loss": -27.081872940063477, "global_step": 513045, "epoch": 6181} {"train_loss": -27.0969295501709, "global_step": 513046, "epoch": 6181} {"train_loss": -26.94959831237793, "global_step": 513047, "epoch": 6181} {"train_loss": -26.979894638061523, "global_step": 513048, "epoch": 6181} {"train_loss": -27.08249855041504, "global_step": 513049, "epoch": 6181} {"train_loss": -27.10797119140625, "global_step": 513050, "epoch": 6181} {"train_loss": -27.2244815826416, "global_step": 513051, "epoch": 6181} {"train_loss": -27.0528564453125, "global_step": 513052, "epoch": 6181} {"train_loss": -27.12384033203125, "global_step": 513053, "epoch": 6181} {"train_loss": -27.19317626953125, "global_step": 513054, "epoch": 6181} {"train_loss": -26.816791534423828, "global_step": 513055, "epoch": 6181} {"train_loss": -27.214990615844727, "global_step": 513056, "epoch": 6181} {"train_loss": -27.540380477905273, "global_step": 513057, "epoch": 6181} {"train_loss": -27.19306755065918, "global_step": 513058, "epoch": 6181} {"train_loss": -27.659021377563477, "global_step": 513059, "epoch": 6181} {"train_loss": -26.905603408813477, "global_step": 513060, "epoch": 6181} {"train_loss": -27.431238174438477, "global_step": 513061, "epoch": 6181} {"train_loss": -27.265735626220703, "global_step": 513062, "epoch": 6181} {"train_loss": -27.535446166992188, "global_step": 513063, "epoch": 6181} {"train_loss": -27.995624542236328, "global_step": 513064, "epoch": 6181} {"train_loss": -27.57057762145996, "global_step": 513065, "epoch": 6181} {"train_loss": -27.28561782836914, "global_step": 513066, "epoch": 6181} {"train_loss": -27.809371948242188, "global_step": 513067, "epoch": 6181} {"train_loss": -27.6568546295166, "global_step": 513068, "epoch": 6181} {"train_loss": -27.530258178710938, "global_step": 513069, "epoch": 6181} {"train_loss": -27.79546546936035, "global_step": 513070, "epoch": 6181} {"train_loss": -27.67755699157715, "global_step": 513071, "epoch": 6181} {"train_loss": -27.48211097717285, "global_step": 513072, "epoch": 6181} {"train_loss": -27.610055923461914, "global_step": 513073, "epoch": 6181} {"train_loss": -27.86127281188965, "global_step": 513074, "epoch": 6181} {"train_loss": -27.32985496520996, "global_step": 513075, "epoch": 6181} {"train_loss": -27.51704216003418, "global_step": 513076, "epoch": 6181} {"train_loss": -27.633359909057617, "global_step": 513077, "epoch": 6181} {"train_loss": -27.425695419311523, "global_step": 513078, "epoch": 6181} {"train_loss": -27.676471710205078, "global_step": 513079, "epoch": 6181} {"train_loss": -27.633563995361328, "global_step": 513080, "epoch": 6181} {"train_loss": -27.490863800048828, "global_step": 513081, "epoch": 6181} {"train_loss": -27.379653930664062, "global_step": 513082, "epoch": 6181} {"train_loss": -27.763059616088867, "global_step": 513083, "epoch": 6181} {"train_loss": -27.530542373657227, "global_step": 513084, "epoch": 6181} {"train_loss": -27.271459579467773, "global_step": 513085, "epoch": 6181} {"train_loss": -27.45124626159668, "global_step": 513086, "epoch": 6181} {"train_loss": -27.573862075805664, "global_step": 513087, "epoch": 6181} {"train_loss": -27.45448112487793, "global_step": 513088, "epoch": 6181} {"train_loss": -27.758365631103516, "global_step": 513089, "epoch": 6181} {"train_loss": -27.25104331970215, "global_step": 513090, "epoch": 6181} {"train_loss": -27.130996704101562, "global_step": 513091, "epoch": 6181} {"train_loss": -27.12646484375, "global_step": 513092, "epoch": 6181} {"train_loss": -27.166324615478516, "global_step": 513093, "epoch": 6181} {"train_loss": -27.68232536315918, "global_step": 513094, "epoch": 6181} {"train_loss": -27.02984619140625, "global_step": 513095, "epoch": 6181} {"train_loss": -26.973133087158203, "global_step": 513096, "epoch": 6181} {"train_loss": -27.4949951171875, "global_step": 513097, "epoch": 6181} {"train_loss": -27.29823875427246, "global_step": 513098, "epoch": 6181} {"train_loss": -27.3868408203125, "global_step": 513099, "epoch": 6181} {"train_loss": -27.282012939453125, "global_step": 513100, "epoch": 6181} {"train_loss": -26.82712173461914, "global_step": 513101, "epoch": 6181} {"train_loss": -27.512588500976562, "global_step": 513102, "epoch": 6181} {"train_loss": -27.40126609802246, "global_step": 513103, "epoch": 6181} {"train_loss": -27.44414710998535, "global_step": 513104, "epoch": 6181} {"train_loss": -27.100077112037017, "global_step": 513105, "epoch": 6181, "val_loss": 6712369.0} {"train_loss": -27.51570701599121, "global_step": 513106, "epoch": 6182} {"train_loss": -27.443952560424805, "global_step": 513107, "epoch": 6182} {"train_loss": -27.148435592651367, "global_step": 513108, "epoch": 6182} {"train_loss": -27.168684005737305, "global_step": 513109, "epoch": 6182} {"train_loss": -27.285795211791992, "global_step": 513110, "epoch": 6182} {"train_loss": -27.06146812438965, "global_step": 513111, "epoch": 6182} {"train_loss": -27.376174926757812, "global_step": 513112, "epoch": 6182} {"train_loss": -27.151071548461914, "global_step": 513113, "epoch": 6182} {"train_loss": -27.107030868530273, "global_step": 513114, "epoch": 6182} {"train_loss": -27.44024658203125, "global_step": 513115, "epoch": 6182} {"train_loss": -27.352781295776367, "global_step": 513116, "epoch": 6182} {"train_loss": -27.64899253845215, "global_step": 513117, "epoch": 6182} {"train_loss": -27.4425048828125, "global_step": 513118, "epoch": 6182} {"train_loss": -27.629419326782227, "global_step": 513119, "epoch": 6182} {"train_loss": -27.48026466369629, "global_step": 513120, "epoch": 6182} {"train_loss": -27.20167350769043, "global_step": 513121, "epoch": 6182} {"train_loss": -27.535999298095703, "global_step": 513122, "epoch": 6182} {"train_loss": -27.39111328125, "global_step": 513123, "epoch": 6182} {"train_loss": -27.776342391967773, "global_step": 513124, "epoch": 6182} {"train_loss": -27.305206298828125, "global_step": 513125, "epoch": 6182} {"train_loss": -27.495126724243164, "global_step": 513126, "epoch": 6182} {"train_loss": -27.26307487487793, "global_step": 513127, "epoch": 6182} {"train_loss": -27.4465389251709, "global_step": 513128, "epoch": 6182} {"train_loss": -27.343564987182617, "global_step": 513129, "epoch": 6182} {"train_loss": -27.35308837890625, "global_step": 513130, "epoch": 6182} {"train_loss": -27.577396392822266, "global_step": 513131, "epoch": 6182} {"train_loss": -27.856470108032227, "global_step": 513132, "epoch": 6182} {"train_loss": -27.21708106994629, "global_step": 513133, "epoch": 6182} {"train_loss": -26.94304847717285, "global_step": 513134, "epoch": 6182} {"train_loss": -27.2445068359375, "global_step": 513135, "epoch": 6182} {"train_loss": -27.719654083251953, "global_step": 513136, "epoch": 6182} {"train_loss": -27.734689712524414, "global_step": 513137, "epoch": 6182} {"train_loss": -27.299047470092773, "global_step": 513138, "epoch": 6182} {"train_loss": -27.74595069885254, "global_step": 513139, "epoch": 6182} {"train_loss": -27.355966567993164, "global_step": 513140, "epoch": 6182} {"train_loss": -27.482542037963867, "global_step": 513141, "epoch": 6182} {"train_loss": -27.406030654907227, "global_step": 513142, "epoch": 6182} {"train_loss": -27.348651885986328, "global_step": 513143, "epoch": 6182} {"train_loss": -27.828369140625, "global_step": 513144, "epoch": 6182} {"train_loss": -27.69879722595215, "global_step": 513145, "epoch": 6182} {"train_loss": -27.413471221923828, "global_step": 513146, "epoch": 6182} {"train_loss": -27.6519718170166, "global_step": 513147, "epoch": 6182} {"train_loss": -27.77642250061035, "global_step": 513148, "epoch": 6182} {"train_loss": -27.633453369140625, "global_step": 513149, "epoch": 6182} {"train_loss": -27.397348403930664, "global_step": 513150, "epoch": 6182} {"train_loss": -27.300806045532227, "global_step": 513151, "epoch": 6182} {"train_loss": -27.33489418029785, "global_step": 513152, "epoch": 6182} {"train_loss": -27.611276626586914, "global_step": 513153, "epoch": 6182} {"train_loss": -27.811431884765625, "global_step": 513154, "epoch": 6182} {"train_loss": -27.179880142211914, "global_step": 513155, "epoch": 6182} {"train_loss": -28.28775978088379, "global_step": 513156, "epoch": 6182} {"train_loss": -27.52130126953125, "global_step": 513157, "epoch": 6182} {"train_loss": -27.641260147094727, "global_step": 513158, "epoch": 6182} {"train_loss": -27.492162704467773, "global_step": 513159, "epoch": 6182} {"train_loss": -27.7783145904541, "global_step": 513160, "epoch": 6182} {"train_loss": -27.62969970703125, "global_step": 513161, "epoch": 6182} {"train_loss": -27.671585083007812, "global_step": 513162, "epoch": 6182} {"train_loss": -27.49452018737793, "global_step": 513163, "epoch": 6182} {"train_loss": -27.41468620300293, "global_step": 513164, "epoch": 6182} {"train_loss": -27.7385311126709, "global_step": 513165, "epoch": 6182} {"train_loss": -27.518964767456055, "global_step": 513166, "epoch": 6182} {"train_loss": -27.73512077331543, "global_step": 513167, "epoch": 6182} {"train_loss": -27.695220947265625, "global_step": 513168, "epoch": 6182} {"train_loss": -27.656415939331055, "global_step": 513169, "epoch": 6182} {"train_loss": -27.725021362304688, "global_step": 513170, "epoch": 6182} {"train_loss": -27.40283203125, "global_step": 513171, "epoch": 6182} {"train_loss": -27.702672958374023, "global_step": 513172, "epoch": 6182} {"train_loss": -27.739938735961914, "global_step": 513173, "epoch": 6182} {"train_loss": -27.82672691345215, "global_step": 513174, "epoch": 6182} {"train_loss": -27.450178146362305, "global_step": 513175, "epoch": 6182} {"train_loss": -27.534513473510742, "global_step": 513176, "epoch": 6182} {"train_loss": -27.512802124023438, "global_step": 513177, "epoch": 6182} {"train_loss": -27.389545440673828, "global_step": 513178, "epoch": 6182} {"train_loss": -27.657855987548828, "global_step": 513179, "epoch": 6182} {"train_loss": -27.52353858947754, "global_step": 513180, "epoch": 6182} {"train_loss": -27.077600479125977, "global_step": 513181, "epoch": 6182} {"train_loss": -27.37574577331543, "global_step": 513182, "epoch": 6182} {"train_loss": -27.04568862915039, "global_step": 513183, "epoch": 6182} {"train_loss": -27.576513290405273, "global_step": 513184, "epoch": 6182} {"train_loss": -27.318103790283203, "global_step": 513185, "epoch": 6182} {"train_loss": -27.64325523376465, "global_step": 513186, "epoch": 6182} {"train_loss": -27.0438175201416, "global_step": 513187, "epoch": 6182} {"train_loss": -27.460880900003826, "global_step": 513188, "epoch": 6182, "val_loss": 6725387.0} {"train_loss": -26.657028198242188, "global_step": 513189, "epoch": 6183} {"train_loss": -25.034963607788086, "global_step": 513190, "epoch": 6183} {"train_loss": -25.142520904541016, "global_step": 513191, "epoch": 6183} {"train_loss": -25.667783737182617, "global_step": 513192, "epoch": 6183} {"train_loss": -25.774686813354492, "global_step": 513193, "epoch": 6183} {"train_loss": -26.988550186157227, "global_step": 513194, "epoch": 6183} {"train_loss": -26.038013458251953, "global_step": 513195, "epoch": 6183} {"train_loss": -27.2903995513916, "global_step": 513196, "epoch": 6183} {"train_loss": -26.533004760742188, "global_step": 513197, "epoch": 6183} {"train_loss": -26.570159912109375, "global_step": 513198, "epoch": 6183} {"train_loss": -26.832061767578125, "global_step": 513199, "epoch": 6183} {"train_loss": -27.2456111907959, "global_step": 513200, "epoch": 6183} {"train_loss": -26.992450714111328, "global_step": 513201, "epoch": 6183} {"train_loss": -26.962671279907227, "global_step": 513202, "epoch": 6183} {"train_loss": -26.980609893798828, "global_step": 513203, "epoch": 6183} {"train_loss": -26.999067306518555, "global_step": 513204, "epoch": 6183} {"train_loss": -26.702178955078125, "global_step": 513205, "epoch": 6183} {"train_loss": -26.959264755249023, "global_step": 513206, "epoch": 6183} {"train_loss": -26.860382080078125, "global_step": 513207, "epoch": 6183} {"train_loss": -27.27907371520996, "global_step": 513208, "epoch": 6183} {"train_loss": -27.24921226501465, "global_step": 513209, "epoch": 6183} {"train_loss": -26.988245010375977, "global_step": 513210, "epoch": 6183} {"train_loss": -27.3801326751709, "global_step": 513211, "epoch": 6183} {"train_loss": -27.191572189331055, "global_step": 513212, "epoch": 6183} {"train_loss": -27.2189884185791, "global_step": 513213, "epoch": 6183} {"train_loss": -27.31732177734375, "global_step": 513214, "epoch": 6183} {"train_loss": -27.253509521484375, "global_step": 513215, "epoch": 6183} {"train_loss": -27.625402450561523, "global_step": 513216, "epoch": 6183} {"train_loss": -27.34539794921875, "global_step": 513217, "epoch": 6183} {"train_loss": -27.435083389282227, "global_step": 513218, "epoch": 6183} {"train_loss": -27.436542510986328, "global_step": 513219, "epoch": 6183} {"train_loss": -27.40988540649414, "global_step": 513220, "epoch": 6183} {"train_loss": -27.4053897857666, "global_step": 513221, "epoch": 6183} {"train_loss": -27.512182235717773, "global_step": 513222, "epoch": 6183} {"train_loss": -27.37342643737793, "global_step": 513223, "epoch": 6183} {"train_loss": -27.767414093017578, "global_step": 513224, "epoch": 6183} {"train_loss": -27.448583602905273, "global_step": 513225, "epoch": 6183} {"train_loss": -27.5703182220459, "global_step": 513226, "epoch": 6183} {"train_loss": -27.643781661987305, "global_step": 513227, "epoch": 6183} {"train_loss": -27.983081817626953, "global_step": 513228, "epoch": 6183} {"train_loss": -27.388593673706055, "global_step": 513229, "epoch": 6183} {"train_loss": -27.461475372314453, "global_step": 513230, "epoch": 6183} {"train_loss": -27.522809982299805, "global_step": 513231, "epoch": 6183} {"train_loss": -27.63103675842285, "global_step": 513232, "epoch": 6183} {"train_loss": -27.68682289123535, "global_step": 513233, "epoch": 6183} {"train_loss": -27.78957176208496, "global_step": 513234, "epoch": 6183} {"train_loss": -27.589208602905273, "global_step": 513235, "epoch": 6183} {"train_loss": -27.257099151611328, "global_step": 513236, "epoch": 6183} {"train_loss": -27.278717041015625, "global_step": 513237, "epoch": 6183} {"train_loss": -27.67536735534668, "global_step": 513238, "epoch": 6183} {"train_loss": -27.553314208984375, "global_step": 513239, "epoch": 6183} {"train_loss": -27.86529541015625, "global_step": 513240, "epoch": 6183} {"train_loss": -27.469655990600586, "global_step": 513241, "epoch": 6183} {"train_loss": -27.40496826171875, "global_step": 513242, "epoch": 6183} {"train_loss": -27.78400230407715, "global_step": 513243, "epoch": 6183} {"train_loss": -27.68084144592285, "global_step": 513244, "epoch": 6183} {"train_loss": -27.859771728515625, "global_step": 513245, "epoch": 6183} {"train_loss": -27.80305290222168, "global_step": 513246, "epoch": 6183} {"train_loss": -27.205270767211914, "global_step": 513247, "epoch": 6183} {"train_loss": -26.976520538330078, "global_step": 513248, "epoch": 6183} {"train_loss": -26.850927352905273, "global_step": 513249, "epoch": 6183} {"train_loss": -26.342117309570312, "global_step": 513250, "epoch": 6183} {"train_loss": -27.40729331970215, "global_step": 513251, "epoch": 6183} {"train_loss": -27.3359432220459, "global_step": 513252, "epoch": 6183} {"train_loss": -27.509862899780273, "global_step": 513253, "epoch": 6183} {"train_loss": -27.565998077392578, "global_step": 513254, "epoch": 6183} {"train_loss": -27.15692710876465, "global_step": 513255, "epoch": 6183} {"train_loss": -27.883670806884766, "global_step": 513256, "epoch": 6183} {"train_loss": -27.35112953186035, "global_step": 513257, "epoch": 6183} {"train_loss": -27.421716690063477, "global_step": 513258, "epoch": 6183} {"train_loss": -27.22637939453125, "global_step": 513259, "epoch": 6183} {"train_loss": -27.2921085357666, "global_step": 513260, "epoch": 6183} {"train_loss": -27.48555564880371, "global_step": 513261, "epoch": 6183} {"train_loss": -27.166366577148438, "global_step": 513262, "epoch": 6183} {"train_loss": -27.26448631286621, "global_step": 513263, "epoch": 6183} {"train_loss": -26.773162841796875, "global_step": 513264, "epoch": 6183} {"train_loss": -27.19935417175293, "global_step": 513265, "epoch": 6183} {"train_loss": -27.118555068969727, "global_step": 513266, "epoch": 6183} {"train_loss": -26.987470626831055, "global_step": 513267, "epoch": 6183} {"train_loss": -26.879514694213867, "global_step": 513268, "epoch": 6183} {"train_loss": -27.237890243530273, "global_step": 513269, "epoch": 6183} {"train_loss": -26.936735153198242, "global_step": 513270, "epoch": 6183} {"train_loss": -27.192555852683192, "global_step": 513271, "epoch": 6183, "val_loss": 6625816.0} {"train_loss": -26.402484893798828, "global_step": 513272, "epoch": 6184} {"train_loss": -26.581787109375, "global_step": 513273, "epoch": 6184} {"train_loss": -26.191797256469727, "global_step": 513274, "epoch": 6184} {"train_loss": -26.55866050720215, "global_step": 513275, "epoch": 6184} {"train_loss": -26.843597412109375, "global_step": 513276, "epoch": 6184} {"train_loss": -26.472986221313477, "global_step": 513277, "epoch": 6184} {"train_loss": -26.784143447875977, "global_step": 513278, "epoch": 6184} {"train_loss": -26.72515869140625, "global_step": 513279, "epoch": 6184} {"train_loss": -26.503448486328125, "global_step": 513280, "epoch": 6184} {"train_loss": -26.754011154174805, "global_step": 513281, "epoch": 6184} {"train_loss": -26.948028564453125, "global_step": 513282, "epoch": 6184} {"train_loss": -26.706689834594727, "global_step": 513283, "epoch": 6184} {"train_loss": -26.71638298034668, "global_step": 513284, "epoch": 6184} {"train_loss": -27.262863159179688, "global_step": 513285, "epoch": 6184} {"train_loss": -26.664081573486328, "global_step": 513286, "epoch": 6184} {"train_loss": -27.15850257873535, "global_step": 513287, "epoch": 6184} {"train_loss": -26.974658966064453, "global_step": 513288, "epoch": 6184} {"train_loss": -27.088037490844727, "global_step": 513289, "epoch": 6184} {"train_loss": -27.323095321655273, "global_step": 513290, "epoch": 6184} {"train_loss": -26.84161949157715, "global_step": 513291, "epoch": 6184} {"train_loss": -27.374326705932617, "global_step": 513292, "epoch": 6184} {"train_loss": -27.096405029296875, "global_step": 513293, "epoch": 6184} {"train_loss": -27.399662017822266, "global_step": 513294, "epoch": 6184} {"train_loss": -27.52008056640625, "global_step": 513295, "epoch": 6184} {"train_loss": -27.475574493408203, "global_step": 513296, "epoch": 6184} {"train_loss": -27.252592086791992, "global_step": 513297, "epoch": 6184} {"train_loss": -27.441864013671875, "global_step": 513298, "epoch": 6184} {"train_loss": -27.70054054260254, "global_step": 513299, "epoch": 6184} {"train_loss": -27.187124252319336, "global_step": 513300, "epoch": 6184} {"train_loss": -27.4627628326416, "global_step": 513301, "epoch": 6184} {"train_loss": -27.238401412963867, "global_step": 513302, "epoch": 6184} {"train_loss": -27.477142333984375, "global_step": 513303, "epoch": 6184} {"train_loss": -27.607397079467773, "global_step": 513304, "epoch": 6184} {"train_loss": -27.605426788330078, "global_step": 513305, "epoch": 6184} {"train_loss": -27.643056869506836, "global_step": 513306, "epoch": 6184} {"train_loss": -27.40992546081543, "global_step": 513307, "epoch": 6184} {"train_loss": -27.778762817382812, "global_step": 513308, "epoch": 6184} {"train_loss": -27.076627731323242, "global_step": 513309, "epoch": 6184} {"train_loss": -27.55414390563965, "global_step": 513310, "epoch": 6184} {"train_loss": -27.671127319335938, "global_step": 513311, "epoch": 6184} {"train_loss": -28.060855865478516, "global_step": 513312, "epoch": 6184} {"train_loss": -27.73358154296875, "global_step": 513313, "epoch": 6184} {"train_loss": -28.081693649291992, "global_step": 513314, "epoch": 6184} {"train_loss": -27.611875534057617, "global_step": 513315, "epoch": 6184} {"train_loss": -27.63178062438965, "global_step": 513316, "epoch": 6184} {"train_loss": -27.56373405456543, "global_step": 513317, "epoch": 6184} {"train_loss": -27.64291763305664, "global_step": 513318, "epoch": 6184} {"train_loss": -27.268152236938477, "global_step": 513319, "epoch": 6184} {"train_loss": -27.749399185180664, "global_step": 513320, "epoch": 6184} {"train_loss": -27.67828941345215, "global_step": 513321, "epoch": 6184} {"train_loss": -27.67327308654785, "global_step": 513322, "epoch": 6184} {"train_loss": -27.414352416992188, "global_step": 513323, "epoch": 6184} {"train_loss": -27.53928565979004, "global_step": 513324, "epoch": 6184} {"train_loss": -27.45989990234375, "global_step": 513325, "epoch": 6184} {"train_loss": -27.848758697509766, "global_step": 513326, "epoch": 6184} {"train_loss": -27.77189064025879, "global_step": 513327, "epoch": 6184} {"train_loss": -27.664718627929688, "global_step": 513328, "epoch": 6184} {"train_loss": -27.6889705657959, "global_step": 513329, "epoch": 6184} {"train_loss": -27.714773178100586, "global_step": 513330, "epoch": 6184} {"train_loss": -28.08074378967285, "global_step": 513331, "epoch": 6184} {"train_loss": -27.935606002807617, "global_step": 513332, "epoch": 6184} {"train_loss": -27.66628074645996, "global_step": 513333, "epoch": 6184} {"train_loss": -27.610498428344727, "global_step": 513334, "epoch": 6184} {"train_loss": -27.71209144592285, "global_step": 513335, "epoch": 6184} {"train_loss": -27.67595863342285, "global_step": 513336, "epoch": 6184} {"train_loss": -27.95465087890625, "global_step": 513337, "epoch": 6184} {"train_loss": -27.70686912536621, "global_step": 513338, "epoch": 6184} {"train_loss": -27.78708839416504, "global_step": 513339, "epoch": 6184} {"train_loss": -27.864240646362305, "global_step": 513340, "epoch": 6184} {"train_loss": -27.424152374267578, "global_step": 513341, "epoch": 6184} {"train_loss": -27.787555694580078, "global_step": 513342, "epoch": 6184} {"train_loss": -27.355884552001953, "global_step": 513343, "epoch": 6184} {"train_loss": -27.421493530273438, "global_step": 513344, "epoch": 6184} {"train_loss": -27.4942626953125, "global_step": 513345, "epoch": 6184} {"train_loss": -27.751026153564453, "global_step": 513346, "epoch": 6184} {"train_loss": -27.73963737487793, "global_step": 513347, "epoch": 6184} {"train_loss": -27.436920166015625, "global_step": 513348, "epoch": 6184} {"train_loss": -27.518096923828125, "global_step": 513349, "epoch": 6184} {"train_loss": -27.69244384765625, "global_step": 513350, "epoch": 6184} {"train_loss": -27.84366226196289, "global_step": 513351, "epoch": 6184} {"train_loss": -27.578144073486328, "global_step": 513352, "epoch": 6184} {"train_loss": -27.5107479095459, "global_step": 513353, "epoch": 6184} {"train_loss": -27.414264908756117, "global_step": 513354, "epoch": 6184, "val_loss": 6578336.0} {"train_loss": -26.667341232299805, "global_step": 513355, "epoch": 6185} {"train_loss": -25.147069931030273, "global_step": 513356, "epoch": 6185} {"train_loss": -24.28470802307129, "global_step": 513357, "epoch": 6185} {"train_loss": -25.740503311157227, "global_step": 513358, "epoch": 6185} {"train_loss": -26.552106857299805, "global_step": 513359, "epoch": 6185} {"train_loss": -25.793970108032227, "global_step": 513360, "epoch": 6185} {"train_loss": -26.488849639892578, "global_step": 513361, "epoch": 6185} {"train_loss": -26.336515426635742, "global_step": 513362, "epoch": 6185} {"train_loss": -26.558746337890625, "global_step": 513363, "epoch": 6185} {"train_loss": -26.598615646362305, "global_step": 513364, "epoch": 6185} {"train_loss": -27.058603286743164, "global_step": 513365, "epoch": 6185} {"train_loss": -26.5178279876709, "global_step": 513366, "epoch": 6185} {"train_loss": -27.067663192749023, "global_step": 513367, "epoch": 6185} {"train_loss": -26.592334747314453, "global_step": 513368, "epoch": 6185} {"train_loss": -26.833593368530273, "global_step": 513369, "epoch": 6185} {"train_loss": -27.116363525390625, "global_step": 513370, "epoch": 6185} {"train_loss": -26.545806884765625, "global_step": 513371, "epoch": 6185} {"train_loss": -26.897165298461914, "global_step": 513372, "epoch": 6185} {"train_loss": -27.213438034057617, "global_step": 513373, "epoch": 6185} {"train_loss": -26.742841720581055, "global_step": 513374, "epoch": 6185} {"train_loss": -26.805410385131836, "global_step": 513375, "epoch": 6185} {"train_loss": -26.72303581237793, "global_step": 513376, "epoch": 6185} {"train_loss": -26.969751358032227, "global_step": 513377, "epoch": 6185} {"train_loss": -27.290220260620117, "global_step": 513378, "epoch": 6185} {"train_loss": -27.087339401245117, "global_step": 513379, "epoch": 6185} {"train_loss": -27.433349609375, "global_step": 513380, "epoch": 6185} {"train_loss": -26.847003936767578, "global_step": 513381, "epoch": 6185} {"train_loss": -27.197208404541016, "global_step": 513382, "epoch": 6185} {"train_loss": -27.185016632080078, "global_step": 513383, "epoch": 6185} {"train_loss": -27.29459571838379, "global_step": 513384, "epoch": 6185} {"train_loss": -26.996816635131836, "global_step": 513385, "epoch": 6185} {"train_loss": -27.04779624938965, "global_step": 513386, "epoch": 6185} {"train_loss": -27.7015380859375, "global_step": 513387, "epoch": 6185} {"train_loss": -27.034290313720703, "global_step": 513388, "epoch": 6185} {"train_loss": -27.30665397644043, "global_step": 513389, "epoch": 6185} {"train_loss": -27.363813400268555, "global_step": 513390, "epoch": 6185} {"train_loss": -27.53329849243164, "global_step": 513391, "epoch": 6185} {"train_loss": -27.380084991455078, "global_step": 513392, "epoch": 6185} {"train_loss": -27.25739860534668, "global_step": 513393, "epoch": 6185} {"train_loss": -27.399938583374023, "global_step": 513394, "epoch": 6185} {"train_loss": -27.47178077697754, "global_step": 513395, "epoch": 6185} {"train_loss": -27.156896591186523, "global_step": 513396, "epoch": 6185} {"train_loss": -27.36866569519043, "global_step": 513397, "epoch": 6185} {"train_loss": -27.53485679626465, "global_step": 513398, "epoch": 6185} {"train_loss": -27.456769943237305, "global_step": 513399, "epoch": 6185} {"train_loss": -27.62453269958496, "global_step": 513400, "epoch": 6185} {"train_loss": -27.667572021484375, "global_step": 513401, "epoch": 6185} {"train_loss": -27.23040771484375, "global_step": 513402, "epoch": 6185} {"train_loss": -27.620044708251953, "global_step": 513403, "epoch": 6185} {"train_loss": -27.610015869140625, "global_step": 513404, "epoch": 6185} {"train_loss": -27.432403564453125, "global_step": 513405, "epoch": 6185} {"train_loss": -27.716459274291992, "global_step": 513406, "epoch": 6185} {"train_loss": -27.424283981323242, "global_step": 513407, "epoch": 6185} {"train_loss": -27.379880905151367, "global_step": 513408, "epoch": 6185} {"train_loss": -27.401508331298828, "global_step": 513409, "epoch": 6185} {"train_loss": -27.7554931640625, "global_step": 513410, "epoch": 6185} {"train_loss": -27.425573348999023, "global_step": 513411, "epoch": 6185} {"train_loss": -27.62282371520996, "global_step": 513412, "epoch": 6185} {"train_loss": -27.281164169311523, "global_step": 513413, "epoch": 6185} {"train_loss": -27.867721557617188, "global_step": 513414, "epoch": 6185} {"train_loss": -27.269933700561523, "global_step": 513415, "epoch": 6185} {"train_loss": -27.48919677734375, "global_step": 513416, "epoch": 6185} {"train_loss": -27.384784698486328, "global_step": 513417, "epoch": 6185} {"train_loss": -27.4384822845459, "global_step": 513418, "epoch": 6185} {"train_loss": -27.488916397094727, "global_step": 513419, "epoch": 6185} {"train_loss": -27.5550537109375, "global_step": 513420, "epoch": 6185} {"train_loss": -27.440109252929688, "global_step": 513421, "epoch": 6185} {"train_loss": -27.538223266601562, "global_step": 513422, "epoch": 6185} {"train_loss": -27.0223331451416, "global_step": 513423, "epoch": 6185} {"train_loss": -27.265832901000977, "global_step": 513424, "epoch": 6185} {"train_loss": -26.737146377563477, "global_step": 513425, "epoch": 6185} {"train_loss": -27.296905517578125, "global_step": 513426, "epoch": 6185} {"train_loss": -27.581037521362305, "global_step": 513427, "epoch": 6185} {"train_loss": -27.281652450561523, "global_step": 513428, "epoch": 6185} {"train_loss": -27.965234756469727, "global_step": 513429, "epoch": 6185} {"train_loss": -27.45751953125, "global_step": 513430, "epoch": 6185} {"train_loss": -27.64594078063965, "global_step": 513431, "epoch": 6185} {"train_loss": -27.562170028686523, "global_step": 513432, "epoch": 6185} {"train_loss": -27.290796279907227, "global_step": 513433, "epoch": 6185} {"train_loss": -27.59470558166504, "global_step": 513434, "epoch": 6185} {"train_loss": -27.621734619140625, "global_step": 513435, "epoch": 6185} {"train_loss": -27.553747177124023, "global_step": 513436, "epoch": 6185} {"train_loss": -27.13954762378371, "global_step": 513437, "epoch": 6185, "val_loss": 6720742.0} {"train_loss": -25.997146606445312, "global_step": 513438, "epoch": 6186} {"train_loss": -24.530988693237305, "global_step": 513439, "epoch": 6186} {"train_loss": -25.53878402709961, "global_step": 513440, "epoch": 6186} {"train_loss": -26.76300621032715, "global_step": 513441, "epoch": 6186} {"train_loss": -25.545412063598633, "global_step": 513442, "epoch": 6186} {"train_loss": -27.149555206298828, "global_step": 513443, "epoch": 6186} {"train_loss": -26.36309814453125, "global_step": 513444, "epoch": 6186} {"train_loss": -27.292694091796875, "global_step": 513445, "epoch": 6186} {"train_loss": -26.771154403686523, "global_step": 513446, "epoch": 6186} {"train_loss": -26.860944747924805, "global_step": 513447, "epoch": 6186} {"train_loss": -26.953638076782227, "global_step": 513448, "epoch": 6186} {"train_loss": -26.72308349609375, "global_step": 513449, "epoch": 6186} {"train_loss": -27.08649253845215, "global_step": 513450, "epoch": 6186} {"train_loss": -27.28008460998535, "global_step": 513451, "epoch": 6186} {"train_loss": -26.910980224609375, "global_step": 513452, "epoch": 6186} {"train_loss": -27.112417221069336, "global_step": 513453, "epoch": 6186} {"train_loss": -26.9569091796875, "global_step": 513454, "epoch": 6186} {"train_loss": -26.97085952758789, "global_step": 513455, "epoch": 6186} {"train_loss": -27.38335609436035, "global_step": 513456, "epoch": 6186} {"train_loss": -26.881513595581055, "global_step": 513457, "epoch": 6186} {"train_loss": -27.265644073486328, "global_step": 513458, "epoch": 6186} {"train_loss": -26.5980281829834, "global_step": 513459, "epoch": 6186} {"train_loss": -27.501972198486328, "global_step": 513460, "epoch": 6186} {"train_loss": -26.85711097717285, "global_step": 513461, "epoch": 6186} {"train_loss": -27.183273315429688, "global_step": 513462, "epoch": 6186} {"train_loss": -27.157846450805664, "global_step": 513463, "epoch": 6186} {"train_loss": -27.389013290405273, "global_step": 513464, "epoch": 6186} {"train_loss": -27.924421310424805, "global_step": 513465, "epoch": 6186} {"train_loss": -27.174484252929688, "global_step": 513466, "epoch": 6186} {"train_loss": -27.441120147705078, "global_step": 513467, "epoch": 6186} {"train_loss": -27.087369918823242, "global_step": 513468, "epoch": 6186} {"train_loss": -27.217004776000977, "global_step": 513469, "epoch": 6186} {"train_loss": -27.431066513061523, "global_step": 513470, "epoch": 6186} {"train_loss": -27.407840728759766, "global_step": 513471, "epoch": 6186} {"train_loss": -27.0028076171875, "global_step": 513472, "epoch": 6186} {"train_loss": -27.2420654296875, "global_step": 513473, "epoch": 6186} {"train_loss": -27.40899085998535, "global_step": 513474, "epoch": 6186} {"train_loss": -27.321552276611328, "global_step": 513475, "epoch": 6186} {"train_loss": -27.250192642211914, "global_step": 513476, "epoch": 6186} {"train_loss": -27.473722457885742, "global_step": 513477, "epoch": 6186} {"train_loss": -27.63812255859375, "global_step": 513478, "epoch": 6186} {"train_loss": -27.307348251342773, "global_step": 513479, "epoch": 6186} {"train_loss": -27.39617347717285, "global_step": 513480, "epoch": 6186} {"train_loss": -27.2705078125, "global_step": 513481, "epoch": 6186} {"train_loss": -27.26271629333496, "global_step": 513482, "epoch": 6186} {"train_loss": -27.520673751831055, "global_step": 513483, "epoch": 6186} {"train_loss": -27.450483322143555, "global_step": 513484, "epoch": 6186} {"train_loss": -27.242116928100586, "global_step": 513485, "epoch": 6186} {"train_loss": -27.247034072875977, "global_step": 513486, "epoch": 6186} {"train_loss": -27.48074722290039, "global_step": 513487, "epoch": 6186} {"train_loss": -27.626440048217773, "global_step": 513488, "epoch": 6186} {"train_loss": -27.2518253326416, "global_step": 513489, "epoch": 6186} {"train_loss": -27.12652015686035, "global_step": 513490, "epoch": 6186} {"train_loss": -27.31926918029785, "global_step": 513491, "epoch": 6186} {"train_loss": -27.142181396484375, "global_step": 513492, "epoch": 6186} {"train_loss": -27.82858657836914, "global_step": 513493, "epoch": 6186} {"train_loss": -27.404577255249023, "global_step": 513494, "epoch": 6186} {"train_loss": -27.299161911010742, "global_step": 513495, "epoch": 6186} {"train_loss": -27.499420166015625, "global_step": 513496, "epoch": 6186} {"train_loss": -27.569494247436523, "global_step": 513497, "epoch": 6186} {"train_loss": -27.420825958251953, "global_step": 513498, "epoch": 6186} {"train_loss": -27.268598556518555, "global_step": 513499, "epoch": 6186} {"train_loss": -27.452611923217773, "global_step": 513500, "epoch": 6186} {"train_loss": -27.51299476623535, "global_step": 513501, "epoch": 6186} {"train_loss": -26.880353927612305, "global_step": 513502, "epoch": 6186} {"train_loss": -27.208593368530273, "global_step": 513503, "epoch": 6186} {"train_loss": -27.15388298034668, "global_step": 513504, "epoch": 6186} {"train_loss": -27.509382247924805, "global_step": 513505, "epoch": 6186} {"train_loss": -27.54828453063965, "global_step": 513506, "epoch": 6186} {"train_loss": -27.47205924987793, "global_step": 513507, "epoch": 6186} {"train_loss": -27.415632247924805, "global_step": 513508, "epoch": 6186} {"train_loss": -27.636993408203125, "global_step": 513509, "epoch": 6186} {"train_loss": -27.410139083862305, "global_step": 513510, "epoch": 6186} {"train_loss": -27.564504623413086, "global_step": 513511, "epoch": 6186} {"train_loss": -27.58039665222168, "global_step": 513512, "epoch": 6186} {"train_loss": -27.345251083374023, "global_step": 513513, "epoch": 6186} {"train_loss": -27.339231491088867, "global_step": 513514, "epoch": 6186} {"train_loss": -27.54326820373535, "global_step": 513515, "epoch": 6186} {"train_loss": -27.241952896118164, "global_step": 513516, "epoch": 6186} {"train_loss": -27.677967071533203, "global_step": 513517, "epoch": 6186} {"train_loss": -27.311120986938477, "global_step": 513518, "epoch": 6186} {"train_loss": -27.289884567260742, "global_step": 513519, "epoch": 6186} {"train_loss": -27.219130734363233, "global_step": 513520, "epoch": 6186, "val_loss": 6674787.0} {"train_loss": -23.131912231445312, "global_step": 513521, "epoch": 6187} {"train_loss": -26.572866439819336, "global_step": 513522, "epoch": 6187} {"train_loss": -24.220983505249023, "global_step": 513523, "epoch": 6187} {"train_loss": -25.6722354888916, "global_step": 513524, "epoch": 6187} {"train_loss": -26.134191513061523, "global_step": 513525, "epoch": 6187} {"train_loss": -25.864181518554688, "global_step": 513526, "epoch": 6187} {"train_loss": -26.592920303344727, "global_step": 513527, "epoch": 6187} {"train_loss": -26.395456314086914, "global_step": 513528, "epoch": 6187} {"train_loss": -25.82516860961914, "global_step": 513529, "epoch": 6187} {"train_loss": -26.068729400634766, "global_step": 513530, "epoch": 6187} {"train_loss": -26.31707191467285, "global_step": 513531, "epoch": 6187} {"train_loss": -26.041364669799805, "global_step": 513532, "epoch": 6187} {"train_loss": -26.505462646484375, "global_step": 513533, "epoch": 6187} {"train_loss": -26.517492294311523, "global_step": 513534, "epoch": 6187} {"train_loss": -26.31333351135254, "global_step": 513535, "epoch": 6187} {"train_loss": -26.394479751586914, "global_step": 513536, "epoch": 6187} {"train_loss": -26.442169189453125, "global_step": 513537, "epoch": 6187} {"train_loss": -26.5496826171875, "global_step": 513538, "epoch": 6187} {"train_loss": -26.250308990478516, "global_step": 513539, "epoch": 6187} {"train_loss": -26.37141990661621, "global_step": 513540, "epoch": 6187} {"train_loss": -26.318449020385742, "global_step": 513541, "epoch": 6187} {"train_loss": -26.73805809020996, "global_step": 513542, "epoch": 6187} {"train_loss": -26.528797149658203, "global_step": 513543, "epoch": 6187} {"train_loss": -26.492298126220703, "global_step": 513544, "epoch": 6187} {"train_loss": -26.884546279907227, "global_step": 513545, "epoch": 6187} {"train_loss": -26.78192138671875, "global_step": 513546, "epoch": 6187} {"train_loss": -27.261947631835938, "global_step": 513547, "epoch": 6187} {"train_loss": -26.68994140625, "global_step": 513548, "epoch": 6187} {"train_loss": -26.918140411376953, "global_step": 513549, "epoch": 6187} {"train_loss": -26.806066513061523, "global_step": 513550, "epoch": 6187} {"train_loss": -26.886037826538086, "global_step": 513551, "epoch": 6187} {"train_loss": -26.821298599243164, "global_step": 513552, "epoch": 6187} {"train_loss": -26.7558536529541, "global_step": 513553, "epoch": 6187} {"train_loss": -26.8017578125, "global_step": 513554, "epoch": 6187} {"train_loss": -26.970062255859375, "global_step": 513555, "epoch": 6187} {"train_loss": -27.063928604125977, "global_step": 513556, "epoch": 6187} {"train_loss": -27.242700576782227, "global_step": 513557, "epoch": 6187} {"train_loss": -27.00197410583496, "global_step": 513558, "epoch": 6187} {"train_loss": -27.176015853881836, "global_step": 513559, "epoch": 6187} {"train_loss": -27.152572631835938, "global_step": 513560, "epoch": 6187} {"train_loss": -27.189472198486328, "global_step": 513561, "epoch": 6187} {"train_loss": -27.06011390686035, "global_step": 513562, "epoch": 6187} {"train_loss": -27.291034698486328, "global_step": 513563, "epoch": 6187} {"train_loss": -27.219970703125, "global_step": 513564, "epoch": 6187} {"train_loss": -26.87617301940918, "global_step": 513565, "epoch": 6187} {"train_loss": -27.48732566833496, "global_step": 513566, "epoch": 6187} {"train_loss": -27.190723419189453, "global_step": 513567, "epoch": 6187} {"train_loss": -27.303089141845703, "global_step": 513568, "epoch": 6187} {"train_loss": -27.769927978515625, "global_step": 513569, "epoch": 6187} {"train_loss": -27.19496726989746, "global_step": 513570, "epoch": 6187} {"train_loss": -27.448781967163086, "global_step": 513571, "epoch": 6187} {"train_loss": -27.204076766967773, "global_step": 513572, "epoch": 6187} {"train_loss": -27.4708194732666, "global_step": 513573, "epoch": 6187} {"train_loss": -27.646085739135742, "global_step": 513574, "epoch": 6187} {"train_loss": -27.467321395874023, "global_step": 513575, "epoch": 6187} {"train_loss": -27.489416122436523, "global_step": 513576, "epoch": 6187} {"train_loss": -27.831912994384766, "global_step": 513577, "epoch": 6187} {"train_loss": -27.576171875, "global_step": 513578, "epoch": 6187} {"train_loss": -27.30975914001465, "global_step": 513579, "epoch": 6187} {"train_loss": -27.630598068237305, "global_step": 513580, "epoch": 6187} {"train_loss": -27.61842155456543, "global_step": 513581, "epoch": 6187} {"train_loss": -27.48853874206543, "global_step": 513582, "epoch": 6187} {"train_loss": -27.7052059173584, "global_step": 513583, "epoch": 6187} {"train_loss": -27.7222843170166, "global_step": 513584, "epoch": 6187} {"train_loss": -27.784149169921875, "global_step": 513585, "epoch": 6187} {"train_loss": -27.659561157226562, "global_step": 513586, "epoch": 6187} {"train_loss": -27.361570358276367, "global_step": 513587, "epoch": 6187} {"train_loss": -27.237085342407227, "global_step": 513588, "epoch": 6187} {"train_loss": -27.18952751159668, "global_step": 513589, "epoch": 6187} {"train_loss": -27.893125534057617, "global_step": 513590, "epoch": 6187} {"train_loss": -27.4500675201416, "global_step": 513591, "epoch": 6187} {"train_loss": -27.430837631225586, "global_step": 513592, "epoch": 6187} {"train_loss": -27.62948989868164, "global_step": 513593, "epoch": 6187} {"train_loss": -27.27028465270996, "global_step": 513594, "epoch": 6187} {"train_loss": -27.531024932861328, "global_step": 513595, "epoch": 6187} {"train_loss": -27.513782501220703, "global_step": 513596, "epoch": 6187} {"train_loss": -27.222919464111328, "global_step": 513597, "epoch": 6187} {"train_loss": -27.390995025634766, "global_step": 513598, "epoch": 6187} {"train_loss": -27.181732177734375, "global_step": 513599, "epoch": 6187} {"train_loss": -27.448774337768555, "global_step": 513600, "epoch": 6187} {"train_loss": -27.3856201171875, "global_step": 513601, "epoch": 6187} {"train_loss": -27.840051651000977, "global_step": 513602, "epoch": 6187} {"train_loss": -26.96090934937259, "global_step": 513603, "epoch": 6187, "val_loss": 6654558.0} {"train_loss": -24.040985107421875, "global_step": 513604, "epoch": 6188} {"train_loss": -25.720703125, "global_step": 513605, "epoch": 6188} {"train_loss": -26.357892990112305, "global_step": 513606, "epoch": 6188} {"train_loss": -24.991519927978516, "global_step": 513607, "epoch": 6188} {"train_loss": -26.31111717224121, "global_step": 513608, "epoch": 6188} {"train_loss": -25.750030517578125, "global_step": 513609, "epoch": 6188} {"train_loss": -26.617462158203125, "global_step": 513610, "epoch": 6188} {"train_loss": -25.851064682006836, "global_step": 513611, "epoch": 6188} {"train_loss": -26.528390884399414, "global_step": 513612, "epoch": 6188} {"train_loss": -26.33839225769043, "global_step": 513613, "epoch": 6188} {"train_loss": -27.159818649291992, "global_step": 513614, "epoch": 6188} {"train_loss": -26.383270263671875, "global_step": 513615, "epoch": 6188} {"train_loss": -26.926977157592773, "global_step": 513616, "epoch": 6188} {"train_loss": -26.647815704345703, "global_step": 513617, "epoch": 6188} {"train_loss": -27.037555694580078, "global_step": 513618, "epoch": 6188} {"train_loss": -26.743417739868164, "global_step": 513619, "epoch": 6188} {"train_loss": -26.76519203186035, "global_step": 513620, "epoch": 6188} {"train_loss": -27.241321563720703, "global_step": 513621, "epoch": 6188} {"train_loss": -26.660398483276367, "global_step": 513622, "epoch": 6188} {"train_loss": -27.722858428955078, "global_step": 513623, "epoch": 6188} {"train_loss": -27.1373291015625, "global_step": 513624, "epoch": 6188} {"train_loss": -27.203012466430664, "global_step": 513625, "epoch": 6188} {"train_loss": -26.867462158203125, "global_step": 513626, "epoch": 6188} {"train_loss": -26.89361572265625, "global_step": 513627, "epoch": 6188} {"train_loss": -27.216358184814453, "global_step": 513628, "epoch": 6188} {"train_loss": -27.786924362182617, "global_step": 513629, "epoch": 6188} {"train_loss": -27.24983024597168, "global_step": 513630, "epoch": 6188} {"train_loss": -27.5776424407959, "global_step": 513631, "epoch": 6188} {"train_loss": -27.503082275390625, "global_step": 513632, "epoch": 6188} {"train_loss": -27.472501754760742, "global_step": 513633, "epoch": 6188} {"train_loss": -27.360889434814453, "global_step": 513634, "epoch": 6188} {"train_loss": -27.28066062927246, "global_step": 513635, "epoch": 6188} {"train_loss": -27.159406661987305, "global_step": 513636, "epoch": 6188} {"train_loss": -27.040985107421875, "global_step": 513637, "epoch": 6188} {"train_loss": -27.664173126220703, "global_step": 513638, "epoch": 6188} {"train_loss": -27.58216667175293, "global_step": 513639, "epoch": 6188} {"train_loss": -27.299055099487305, "global_step": 513640, "epoch": 6188} {"train_loss": -27.217391967773438, "global_step": 513641, "epoch": 6188} {"train_loss": -27.052478790283203, "global_step": 513642, "epoch": 6188} {"train_loss": -26.973388671875, "global_step": 513643, "epoch": 6188} {"train_loss": -27.513458251953125, "global_step": 513644, "epoch": 6188} {"train_loss": -27.515552520751953, "global_step": 513645, "epoch": 6188} {"train_loss": -27.32147789001465, "global_step": 513646, "epoch": 6188} {"train_loss": -27.567174911499023, "global_step": 513647, "epoch": 6188} {"train_loss": -27.247007369995117, "global_step": 513648, "epoch": 6188} {"train_loss": -27.57048988342285, "global_step": 513649, "epoch": 6188} {"train_loss": -27.48310661315918, "global_step": 513650, "epoch": 6188} {"train_loss": -27.512418746948242, "global_step": 513651, "epoch": 6188} {"train_loss": -27.61456298828125, "global_step": 513652, "epoch": 6188} {"train_loss": -27.688642501831055, "global_step": 513653, "epoch": 6188} {"train_loss": -27.494037628173828, "global_step": 513654, "epoch": 6188} {"train_loss": -27.484024047851562, "global_step": 513655, "epoch": 6188} {"train_loss": -27.59661865234375, "global_step": 513656, "epoch": 6188} {"train_loss": -27.317798614501953, "global_step": 513657, "epoch": 6188} {"train_loss": -27.427967071533203, "global_step": 513658, "epoch": 6188} {"train_loss": -27.519989013671875, "global_step": 513659, "epoch": 6188} {"train_loss": -27.88507080078125, "global_step": 513660, "epoch": 6188} {"train_loss": -27.54166030883789, "global_step": 513661, "epoch": 6188} {"train_loss": -27.384815216064453, "global_step": 513662, "epoch": 6188} {"train_loss": -27.543237686157227, "global_step": 513663, "epoch": 6188} {"train_loss": -27.393451690673828, "global_step": 513664, "epoch": 6188} {"train_loss": -27.675525665283203, "global_step": 513665, "epoch": 6188} {"train_loss": -27.6068115234375, "global_step": 513666, "epoch": 6188} {"train_loss": -27.58867835998535, "global_step": 513667, "epoch": 6188} {"train_loss": -27.75244140625, "global_step": 513668, "epoch": 6188} {"train_loss": -27.96476173400879, "global_step": 513669, "epoch": 6188} {"train_loss": -27.864978790283203, "global_step": 513670, "epoch": 6188} {"train_loss": -27.572711944580078, "global_step": 513671, "epoch": 6188} {"train_loss": -27.58369255065918, "global_step": 513672, "epoch": 6188} {"train_loss": -27.184370040893555, "global_step": 513673, "epoch": 6188} {"train_loss": -27.365707397460938, "global_step": 513674, "epoch": 6188} {"train_loss": -27.838882446289062, "global_step": 513675, "epoch": 6188} {"train_loss": -27.868316650390625, "global_step": 513676, "epoch": 6188} {"train_loss": -27.775293350219727, "global_step": 513677, "epoch": 6188} {"train_loss": -27.405038833618164, "global_step": 513678, "epoch": 6188} {"train_loss": -27.716083526611328, "global_step": 513679, "epoch": 6188} {"train_loss": -27.842681884765625, "global_step": 513680, "epoch": 6188} {"train_loss": -27.5443172454834, "global_step": 513681, "epoch": 6188} {"train_loss": -27.175756454467773, "global_step": 513682, "epoch": 6188} {"train_loss": -27.740070343017578, "global_step": 513683, "epoch": 6188} {"train_loss": -27.578516006469727, "global_step": 513684, "epoch": 6188} {"train_loss": -27.749048233032227, "global_step": 513685, "epoch": 6188} {"train_loss": -27.207166487912097, "global_step": 513686, "epoch": 6188, "val_loss": 6698392.0} {"train_loss": -27.42677116394043, "global_step": 513687, "epoch": 6189} {"train_loss": -27.264495849609375, "global_step": 513688, "epoch": 6189} {"train_loss": -27.52760124206543, "global_step": 513689, "epoch": 6189} {"train_loss": -27.32099723815918, "global_step": 513690, "epoch": 6189} {"train_loss": -27.002765655517578, "global_step": 513691, "epoch": 6189} {"train_loss": -27.371448516845703, "global_step": 513692, "epoch": 6189} {"train_loss": -27.02656364440918, "global_step": 513693, "epoch": 6189} {"train_loss": -27.090543746948242, "global_step": 513694, "epoch": 6189} {"train_loss": -27.500120162963867, "global_step": 513695, "epoch": 6189} {"train_loss": -27.120548248291016, "global_step": 513696, "epoch": 6189} {"train_loss": -27.187158584594727, "global_step": 513697, "epoch": 6189} {"train_loss": -27.229232788085938, "global_step": 513698, "epoch": 6189} {"train_loss": -27.506582260131836, "global_step": 513699, "epoch": 6189} {"train_loss": -27.40642738342285, "global_step": 513700, "epoch": 6189} {"train_loss": -27.312198638916016, "global_step": 513701, "epoch": 6189} {"train_loss": -27.467578887939453, "global_step": 513702, "epoch": 6189} {"train_loss": -27.192289352416992, "global_step": 513703, "epoch": 6189} {"train_loss": -27.6025333404541, "global_step": 513704, "epoch": 6189} {"train_loss": -27.37043571472168, "global_step": 513705, "epoch": 6189} {"train_loss": -27.50489616394043, "global_step": 513706, "epoch": 6189} {"train_loss": -27.502710342407227, "global_step": 513707, "epoch": 6189} {"train_loss": -27.947940826416016, "global_step": 513708, "epoch": 6189} {"train_loss": -27.397109985351562, "global_step": 513709, "epoch": 6189} {"train_loss": -27.720844268798828, "global_step": 513710, "epoch": 6189} {"train_loss": -27.721561431884766, "global_step": 513711, "epoch": 6189} {"train_loss": -27.713876724243164, "global_step": 513712, "epoch": 6189} {"train_loss": -27.35857582092285, "global_step": 513713, "epoch": 6189} {"train_loss": -27.301328659057617, "global_step": 513714, "epoch": 6189} {"train_loss": -27.720922470092773, "global_step": 513715, "epoch": 6189} {"train_loss": -27.713287353515625, "global_step": 513716, "epoch": 6189} {"train_loss": -27.44231605529785, "global_step": 513717, "epoch": 6189} {"train_loss": -27.41525650024414, "global_step": 513718, "epoch": 6189} {"train_loss": -27.530420303344727, "global_step": 513719, "epoch": 6189} {"train_loss": -27.39773941040039, "global_step": 513720, "epoch": 6189} {"train_loss": -27.288549423217773, "global_step": 513721, "epoch": 6189} {"train_loss": -27.708593368530273, "global_step": 513722, "epoch": 6189} {"train_loss": -27.67190933227539, "global_step": 513723, "epoch": 6189} {"train_loss": -27.7077579498291, "global_step": 513724, "epoch": 6189} {"train_loss": -27.6163387298584, "global_step": 513725, "epoch": 6189} {"train_loss": -27.753833770751953, "global_step": 513726, "epoch": 6189} {"train_loss": -27.673608779907227, "global_step": 513727, "epoch": 6189} {"train_loss": -27.722028732299805, "global_step": 513728, "epoch": 6189} {"train_loss": -27.833356857299805, "global_step": 513729, "epoch": 6189} {"train_loss": -27.61748695373535, "global_step": 513730, "epoch": 6189} {"train_loss": -27.602375030517578, "global_step": 513731, "epoch": 6189} {"train_loss": -27.605955123901367, "global_step": 513732, "epoch": 6189} {"train_loss": -27.688535690307617, "global_step": 513733, "epoch": 6189} {"train_loss": -27.380517959594727, "global_step": 513734, "epoch": 6189} {"train_loss": -27.8712215423584, "global_step": 513735, "epoch": 6189} {"train_loss": -27.806787490844727, "global_step": 513736, "epoch": 6189} {"train_loss": -27.65753746032715, "global_step": 513737, "epoch": 6189} {"train_loss": -27.676050186157227, "global_step": 513738, "epoch": 6189} {"train_loss": -27.82435417175293, "global_step": 513739, "epoch": 6189} {"train_loss": -27.627466201782227, "global_step": 513740, "epoch": 6189} {"train_loss": -27.779294967651367, "global_step": 513741, "epoch": 6189} {"train_loss": -27.529083251953125, "global_step": 513742, "epoch": 6189} {"train_loss": -27.621458053588867, "global_step": 513743, "epoch": 6189} {"train_loss": -27.694623947143555, "global_step": 513744, "epoch": 6189} {"train_loss": -27.78364372253418, "global_step": 513745, "epoch": 6189} {"train_loss": -27.414297103881836, "global_step": 513746, "epoch": 6189} {"train_loss": -27.61427879333496, "global_step": 513747, "epoch": 6189} {"train_loss": -27.60236167907715, "global_step": 513748, "epoch": 6189} {"train_loss": -27.54844093322754, "global_step": 513749, "epoch": 6189} {"train_loss": -27.458826065063477, "global_step": 513750, "epoch": 6189} {"train_loss": -27.291568756103516, "global_step": 513751, "epoch": 6189} {"train_loss": -27.131183624267578, "global_step": 513752, "epoch": 6189} {"train_loss": -27.497411727905273, "global_step": 513753, "epoch": 6189} {"train_loss": -27.361059188842773, "global_step": 513754, "epoch": 6189} {"train_loss": -27.7898006439209, "global_step": 513755, "epoch": 6189} {"train_loss": -27.62177085876465, "global_step": 513756, "epoch": 6189} {"train_loss": -27.974151611328125, "global_step": 513757, "epoch": 6189} {"train_loss": -27.37742042541504, "global_step": 513758, "epoch": 6189} {"train_loss": -27.85133171081543, "global_step": 513759, "epoch": 6189} {"train_loss": -27.949079513549805, "global_step": 513760, "epoch": 6189} {"train_loss": -27.417316436767578, "global_step": 513761, "epoch": 6189} {"train_loss": -27.543872833251953, "global_step": 513762, "epoch": 6189} {"train_loss": -27.687936782836914, "global_step": 513763, "epoch": 6189} {"train_loss": -27.535858154296875, "global_step": 513764, "epoch": 6189} {"train_loss": -27.752737045288086, "global_step": 513765, "epoch": 6189} {"train_loss": -27.7150821685791, "global_step": 513766, "epoch": 6189} {"train_loss": -27.54310417175293, "global_step": 513767, "epoch": 6189} {"train_loss": -27.976648330688477, "global_step": 513768, "epoch": 6189} {"train_loss": -27.55162151750312, "global_step": 513769, "epoch": 6189, "val_loss": 6671280.0} {"train_loss": -26.1982421875, "global_step": 513770, "epoch": 6190} {"train_loss": -25.690576553344727, "global_step": 513771, "epoch": 6190} {"train_loss": -26.778162002563477, "global_step": 513772, "epoch": 6190} {"train_loss": -26.391498565673828, "global_step": 513773, "epoch": 6190} {"train_loss": -25.552433013916016, "global_step": 513774, "epoch": 6190} {"train_loss": -25.6453800201416, "global_step": 513775, "epoch": 6190} {"train_loss": -26.83778953552246, "global_step": 513776, "epoch": 6190} {"train_loss": -26.826047897338867, "global_step": 513777, "epoch": 6190} {"train_loss": -26.657026290893555, "global_step": 513778, "epoch": 6190} {"train_loss": -26.8847599029541, "global_step": 513779, "epoch": 6190} {"train_loss": -26.80805778503418, "global_step": 513780, "epoch": 6190} {"train_loss": -26.55069351196289, "global_step": 513781, "epoch": 6190} {"train_loss": -26.68622398376465, "global_step": 513782, "epoch": 6190} {"train_loss": -27.03177833557129, "global_step": 513783, "epoch": 6190} {"train_loss": -26.883398056030273, "global_step": 513784, "epoch": 6190} {"train_loss": -26.874399185180664, "global_step": 513785, "epoch": 6190} {"train_loss": -26.67005729675293, "global_step": 513786, "epoch": 6190} {"train_loss": -26.815372467041016, "global_step": 513787, "epoch": 6190} {"train_loss": -27.407928466796875, "global_step": 513788, "epoch": 6190} {"train_loss": -27.152801513671875, "global_step": 513789, "epoch": 6190} {"train_loss": -26.762197494506836, "global_step": 513790, "epoch": 6190} {"train_loss": -27.176095962524414, "global_step": 513791, "epoch": 6190} {"train_loss": -27.560211181640625, "global_step": 513792, "epoch": 6190} {"train_loss": -26.98514747619629, "global_step": 513793, "epoch": 6190} {"train_loss": -27.426538467407227, "global_step": 513794, "epoch": 6190} {"train_loss": -27.10700798034668, "global_step": 513795, "epoch": 6190} {"train_loss": -27.46161460876465, "global_step": 513796, "epoch": 6190} {"train_loss": -26.905426025390625, "global_step": 513797, "epoch": 6190} {"train_loss": -27.415021896362305, "global_step": 513798, "epoch": 6190} {"train_loss": -26.972135543823242, "global_step": 513799, "epoch": 6190} {"train_loss": -27.406660079956055, "global_step": 513800, "epoch": 6190} {"train_loss": -27.092981338500977, "global_step": 513801, "epoch": 6190} {"train_loss": -27.32990837097168, "global_step": 513802, "epoch": 6190} {"train_loss": -27.64569664001465, "global_step": 513803, "epoch": 6190} {"train_loss": -27.652694702148438, "global_step": 513804, "epoch": 6190} {"train_loss": -27.38313102722168, "global_step": 513805, "epoch": 6190} {"train_loss": -27.53960609436035, "global_step": 513806, "epoch": 6190} {"train_loss": -27.38416862487793, "global_step": 513807, "epoch": 6190} {"train_loss": -27.574268341064453, "global_step": 513808, "epoch": 6190} {"train_loss": -27.4989013671875, "global_step": 513809, "epoch": 6190} {"train_loss": -27.521554946899414, "global_step": 513810, "epoch": 6190} {"train_loss": -27.624738693237305, "global_step": 513811, "epoch": 6190} {"train_loss": -27.295658111572266, "global_step": 513812, "epoch": 6190} {"train_loss": -27.658689498901367, "global_step": 513813, "epoch": 6190} {"train_loss": -27.775232315063477, "global_step": 513814, "epoch": 6190} {"train_loss": -27.598297119140625, "global_step": 513815, "epoch": 6190} {"train_loss": -27.920591354370117, "global_step": 513816, "epoch": 6190} {"train_loss": -27.82619285583496, "global_step": 513817, "epoch": 6190} {"train_loss": -27.7923641204834, "global_step": 513818, "epoch": 6190} {"train_loss": -27.7410888671875, "global_step": 513819, "epoch": 6190} {"train_loss": -27.871246337890625, "global_step": 513820, "epoch": 6190} {"train_loss": -27.906721115112305, "global_step": 513821, "epoch": 6190} {"train_loss": -27.8856201171875, "global_step": 513822, "epoch": 6190} {"train_loss": -27.411352157592773, "global_step": 513823, "epoch": 6190} {"train_loss": -27.46290397644043, "global_step": 513824, "epoch": 6190} {"train_loss": -27.792469024658203, "global_step": 513825, "epoch": 6190} {"train_loss": -27.510135650634766, "global_step": 513826, "epoch": 6190} {"train_loss": -27.744338989257812, "global_step": 513827, "epoch": 6190} {"train_loss": -27.369619369506836, "global_step": 513828, "epoch": 6190} {"train_loss": -27.530750274658203, "global_step": 513829, "epoch": 6190} {"train_loss": -27.932035446166992, "global_step": 513830, "epoch": 6190} {"train_loss": -27.66876220703125, "global_step": 513831, "epoch": 6190} {"train_loss": -27.57337760925293, "global_step": 513832, "epoch": 6190} {"train_loss": -27.727624893188477, "global_step": 513833, "epoch": 6190} {"train_loss": -27.642547607421875, "global_step": 513834, "epoch": 6190} {"train_loss": -27.076984405517578, "global_step": 513835, "epoch": 6190} {"train_loss": -27.57268714904785, "global_step": 513836, "epoch": 6190} {"train_loss": -27.448606491088867, "global_step": 513837, "epoch": 6190} {"train_loss": -27.543476104736328, "global_step": 513838, "epoch": 6190} {"train_loss": -27.910633087158203, "global_step": 513839, "epoch": 6190} {"train_loss": -27.890411376953125, "global_step": 513840, "epoch": 6190} {"train_loss": -27.71478843688965, "global_step": 513841, "epoch": 6190} {"train_loss": -27.55171012878418, "global_step": 513842, "epoch": 6190} {"train_loss": -27.379541397094727, "global_step": 513843, "epoch": 6190} {"train_loss": -27.52240562438965, "global_step": 513844, "epoch": 6190} {"train_loss": -27.72504234313965, "global_step": 513845, "epoch": 6190} {"train_loss": -27.84369468688965, "global_step": 513846, "epoch": 6190} {"train_loss": -27.643890380859375, "global_step": 513847, "epoch": 6190} {"train_loss": -27.471683502197266, "global_step": 513848, "epoch": 6190} {"train_loss": -27.639724731445312, "global_step": 513849, "epoch": 6190} {"train_loss": -28.112951278686523, "global_step": 513850, "epoch": 6190} {"train_loss": -27.48365592956543, "global_step": 513851, "epoch": 6190} {"train_loss": -27.307798753301782, "global_step": 513852, "epoch": 6190, "val_loss": 6627626.0} {"train_loss": -23.414880752563477, "global_step": 513853, "epoch": 6191} {"train_loss": -21.8348331451416, "global_step": 513854, "epoch": 6191} {"train_loss": -24.25667381286621, "global_step": 513855, "epoch": 6191} {"train_loss": -25.2970027923584, "global_step": 513856, "epoch": 6191} {"train_loss": -24.83490753173828, "global_step": 513857, "epoch": 6191} {"train_loss": -25.4652156829834, "global_step": 513858, "epoch": 6191} {"train_loss": -25.53504753112793, "global_step": 513859, "epoch": 6191} {"train_loss": -25.721420288085938, "global_step": 513860, "epoch": 6191} {"train_loss": -25.819543838500977, "global_step": 513861, "epoch": 6191} {"train_loss": -25.954803466796875, "global_step": 513862, "epoch": 6191} {"train_loss": -26.076574325561523, "global_step": 513863, "epoch": 6191} {"train_loss": -25.891265869140625, "global_step": 513864, "epoch": 6191} {"train_loss": -26.340585708618164, "global_step": 513865, "epoch": 6191} {"train_loss": -26.099985122680664, "global_step": 513866, "epoch": 6191} {"train_loss": -26.076887130737305, "global_step": 513867, "epoch": 6191} {"train_loss": -26.609907150268555, "global_step": 513868, "epoch": 6191} {"train_loss": -26.414783477783203, "global_step": 513869, "epoch": 6191} {"train_loss": -26.669530868530273, "global_step": 513870, "epoch": 6191} {"train_loss": -26.45051383972168, "global_step": 513871, "epoch": 6191} {"train_loss": -26.64092445373535, "global_step": 513872, "epoch": 6191} {"train_loss": -26.424850463867188, "global_step": 513873, "epoch": 6191} {"train_loss": -27.01543617248535, "global_step": 513874, "epoch": 6191} {"train_loss": -26.289142608642578, "global_step": 513875, "epoch": 6191} {"train_loss": -27.06198501586914, "global_step": 513876, "epoch": 6191} {"train_loss": -26.72532081604004, "global_step": 513877, "epoch": 6191} {"train_loss": -26.936939239501953, "global_step": 513878, "epoch": 6191} {"train_loss": -26.69880485534668, "global_step": 513879, "epoch": 6191} {"train_loss": -26.98318862915039, "global_step": 513880, "epoch": 6191} {"train_loss": -26.87623405456543, "global_step": 513881, "epoch": 6191} {"train_loss": -26.966522216796875, "global_step": 513882, "epoch": 6191} {"train_loss": -27.231250762939453, "global_step": 513883, "epoch": 6191} {"train_loss": -26.70440673828125, "global_step": 513884, "epoch": 6191} {"train_loss": -27.14338493347168, "global_step": 513885, "epoch": 6191} {"train_loss": -27.078399658203125, "global_step": 513886, "epoch": 6191} {"train_loss": -27.171064376831055, "global_step": 513887, "epoch": 6191} {"train_loss": -26.65247917175293, "global_step": 513888, "epoch": 6191} {"train_loss": -27.379114151000977, "global_step": 513889, "epoch": 6191} {"train_loss": -27.2752742767334, "global_step": 513890, "epoch": 6191} {"train_loss": -27.26312255859375, "global_step": 513891, "epoch": 6191} {"train_loss": -26.88974952697754, "global_step": 513892, "epoch": 6191} {"train_loss": -27.4097843170166, "global_step": 513893, "epoch": 6191} {"train_loss": -27.0285701751709, "global_step": 513894, "epoch": 6191} {"train_loss": -27.34379005432129, "global_step": 513895, "epoch": 6191} {"train_loss": -27.556623458862305, "global_step": 513896, "epoch": 6191} {"train_loss": -27.6961612701416, "global_step": 513897, "epoch": 6191} {"train_loss": -27.367263793945312, "global_step": 513898, "epoch": 6191} {"train_loss": -27.633085250854492, "global_step": 513899, "epoch": 6191} {"train_loss": -27.3508358001709, "global_step": 513900, "epoch": 6191} {"train_loss": -27.21435546875, "global_step": 513901, "epoch": 6191} {"train_loss": -27.548892974853516, "global_step": 513902, "epoch": 6191} {"train_loss": -27.72662353515625, "global_step": 513903, "epoch": 6191} {"train_loss": -27.63043212890625, "global_step": 513904, "epoch": 6191} {"train_loss": -27.68348503112793, "global_step": 513905, "epoch": 6191} {"train_loss": -27.621931076049805, "global_step": 513906, "epoch": 6191} {"train_loss": -27.522998809814453, "global_step": 513907, "epoch": 6191} {"train_loss": -27.48301124572754, "global_step": 513908, "epoch": 6191} {"train_loss": -27.64023208618164, "global_step": 513909, "epoch": 6191} {"train_loss": -27.687414169311523, "global_step": 513910, "epoch": 6191} {"train_loss": -28.010009765625, "global_step": 513911, "epoch": 6191} {"train_loss": -27.558990478515625, "global_step": 513912, "epoch": 6191} {"train_loss": -27.72226333618164, "global_step": 513913, "epoch": 6191} {"train_loss": -27.572525024414062, "global_step": 513914, "epoch": 6191} {"train_loss": -27.74928092956543, "global_step": 513915, "epoch": 6191} {"train_loss": -27.56463623046875, "global_step": 513916, "epoch": 6191} {"train_loss": -27.60809326171875, "global_step": 513917, "epoch": 6191} {"train_loss": -27.7614803314209, "global_step": 513918, "epoch": 6191} {"train_loss": -27.529052734375, "global_step": 513919, "epoch": 6191} {"train_loss": -27.659778594970703, "global_step": 513920, "epoch": 6191} {"train_loss": -27.464466094970703, "global_step": 513921, "epoch": 6191} {"train_loss": -27.53759765625, "global_step": 513922, "epoch": 6191} {"train_loss": -27.362539291381836, "global_step": 513923, "epoch": 6191} {"train_loss": -27.423755645751953, "global_step": 513924, "epoch": 6191} {"train_loss": -27.25127601623535, "global_step": 513925, "epoch": 6191} {"train_loss": -27.484088897705078, "global_step": 513926, "epoch": 6191} {"train_loss": -27.79090690612793, "global_step": 513927, "epoch": 6191} {"train_loss": -27.700366973876953, "global_step": 513928, "epoch": 6191} {"train_loss": -27.530487060546875, "global_step": 513929, "epoch": 6191} {"train_loss": -27.840524673461914, "global_step": 513930, "epoch": 6191} {"train_loss": -27.398019790649414, "global_step": 513931, "epoch": 6191} {"train_loss": -27.495100021362305, "global_step": 513932, "epoch": 6191} {"train_loss": -27.53876304626465, "global_step": 513933, "epoch": 6191} {"train_loss": -27.549047470092773, "global_step": 513934, "epoch": 6191} {"train_loss": -26.92737108253571, "global_step": 513935, "epoch": 6191, "val_loss": 6652461.5} {"train_loss": -27.65594482421875, "global_step": 513936, "epoch": 6192} {"train_loss": -27.73101234436035, "global_step": 513937, "epoch": 6192} {"train_loss": -27.643753051757812, "global_step": 513938, "epoch": 6192} {"train_loss": -27.63425064086914, "global_step": 513939, "epoch": 6192} {"train_loss": -26.96953773498535, "global_step": 513940, "epoch": 6192} {"train_loss": -27.549091339111328, "global_step": 513941, "epoch": 6192} {"train_loss": -27.741607666015625, "global_step": 513942, "epoch": 6192} {"train_loss": -27.20957374572754, "global_step": 513943, "epoch": 6192} {"train_loss": -27.307788848876953, "global_step": 513944, "epoch": 6192} {"train_loss": -27.3126277923584, "global_step": 513945, "epoch": 6192} {"train_loss": -27.32390785217285, "global_step": 513946, "epoch": 6192} {"train_loss": -27.540576934814453, "global_step": 513947, "epoch": 6192} {"train_loss": -27.131671905517578, "global_step": 513948, "epoch": 6192} {"train_loss": -27.3709774017334, "global_step": 513949, "epoch": 6192} {"train_loss": -27.070215225219727, "global_step": 513950, "epoch": 6192} {"train_loss": -27.488916397094727, "global_step": 513951, "epoch": 6192} {"train_loss": -27.534940719604492, "global_step": 513952, "epoch": 6192} {"train_loss": -27.3380069732666, "global_step": 513953, "epoch": 6192} {"train_loss": -27.574853897094727, "global_step": 513954, "epoch": 6192} {"train_loss": -27.53816795349121, "global_step": 513955, "epoch": 6192} {"train_loss": -27.508533477783203, "global_step": 513956, "epoch": 6192} {"train_loss": -27.519001007080078, "global_step": 513957, "epoch": 6192} {"train_loss": -27.5, "global_step": 513958, "epoch": 6192} {"train_loss": -27.610593795776367, "global_step": 513959, "epoch": 6192} {"train_loss": -27.60650062561035, "global_step": 513960, "epoch": 6192} {"train_loss": -27.529651641845703, "global_step": 513961, "epoch": 6192} {"train_loss": -27.602466583251953, "global_step": 513962, "epoch": 6192} {"train_loss": -27.81036949157715, "global_step": 513963, "epoch": 6192} {"train_loss": -27.792089462280273, "global_step": 513964, "epoch": 6192} {"train_loss": -27.82283592224121, "global_step": 513965, "epoch": 6192} {"train_loss": -27.428247451782227, "global_step": 513966, "epoch": 6192} {"train_loss": -27.474775314331055, "global_step": 513967, "epoch": 6192} {"train_loss": -27.726415634155273, "global_step": 513968, "epoch": 6192} {"train_loss": -27.64043617248535, "global_step": 513969, "epoch": 6192} {"train_loss": -27.90791893005371, "global_step": 513970, "epoch": 6192} {"train_loss": -27.658533096313477, "global_step": 513971, "epoch": 6192} {"train_loss": -27.32985496520996, "global_step": 513972, "epoch": 6192} {"train_loss": -27.531721115112305, "global_step": 513973, "epoch": 6192} {"train_loss": -27.846267700195312, "global_step": 513974, "epoch": 6192} {"train_loss": -27.35820960998535, "global_step": 513975, "epoch": 6192} {"train_loss": -27.593137741088867, "global_step": 513976, "epoch": 6192} {"train_loss": -27.863950729370117, "global_step": 513977, "epoch": 6192} {"train_loss": -27.92803955078125, "global_step": 513978, "epoch": 6192} {"train_loss": -27.7150821685791, "global_step": 513979, "epoch": 6192} {"train_loss": -27.45537757873535, "global_step": 513980, "epoch": 6192} {"train_loss": -27.530481338500977, "global_step": 513981, "epoch": 6192} {"train_loss": -27.55353355407715, "global_step": 513982, "epoch": 6192} {"train_loss": -27.497034072875977, "global_step": 513983, "epoch": 6192} {"train_loss": -28.061765670776367, "global_step": 513984, "epoch": 6192} {"train_loss": -27.73029136657715, "global_step": 513985, "epoch": 6192} {"train_loss": -27.558639526367188, "global_step": 513986, "epoch": 6192} {"train_loss": -27.28955078125, "global_step": 513987, "epoch": 6192} {"train_loss": -27.894302368164062, "global_step": 513988, "epoch": 6192} {"train_loss": -27.806976318359375, "global_step": 513989, "epoch": 6192} {"train_loss": -27.488489151000977, "global_step": 513990, "epoch": 6192} {"train_loss": -27.83917236328125, "global_step": 513991, "epoch": 6192} {"train_loss": -27.422576904296875, "global_step": 513992, "epoch": 6192} {"train_loss": -27.135847091674805, "global_step": 513993, "epoch": 6192} {"train_loss": -27.5610294342041, "global_step": 513994, "epoch": 6192} {"train_loss": -27.4853515625, "global_step": 513995, "epoch": 6192} {"train_loss": -27.45576286315918, "global_step": 513996, "epoch": 6192} {"train_loss": -27.603275299072266, "global_step": 513997, "epoch": 6192} {"train_loss": -27.669631958007812, "global_step": 513998, "epoch": 6192} {"train_loss": -27.052587509155273, "global_step": 513999, "epoch": 6192} {"train_loss": -26.907733917236328, "global_step": 514000, "epoch": 6192} {"train_loss": -27.207538604736328, "global_step": 514001, "epoch": 6192} {"train_loss": -27.389936447143555, "global_step": 514002, "epoch": 6192} {"train_loss": -27.158857345581055, "global_step": 514003, "epoch": 6192} {"train_loss": -27.56622886657715, "global_step": 514004, "epoch": 6192} {"train_loss": -27.3103084564209, "global_step": 514005, "epoch": 6192} {"train_loss": -27.635761260986328, "global_step": 514006, "epoch": 6192} {"train_loss": -27.520034790039062, "global_step": 514007, "epoch": 6192} {"train_loss": -27.355161666870117, "global_step": 514008, "epoch": 6192} {"train_loss": -27.432519912719727, "global_step": 514009, "epoch": 6192} {"train_loss": -27.326812744140625, "global_step": 514010, "epoch": 6192} {"train_loss": -27.467121124267578, "global_step": 514011, "epoch": 6192} {"train_loss": -27.600622177124023, "global_step": 514012, "epoch": 6192} {"train_loss": -27.670379638671875, "global_step": 514013, "epoch": 6192} {"train_loss": -27.55097007751465, "global_step": 514014, "epoch": 6192} {"train_loss": -27.074819564819336, "global_step": 514015, "epoch": 6192} {"train_loss": -27.332141876220703, "global_step": 514016, "epoch": 6192} {"train_loss": -27.511066436767578, "global_step": 514017, "epoch": 6192} {"train_loss": -27.50831987771643, "global_step": 514018, "epoch": 6192, "val_loss": 6728907.0} {"train_loss": -27.221149444580078, "global_step": 514019, "epoch": 6193} {"train_loss": -26.342138290405273, "global_step": 514020, "epoch": 6193} {"train_loss": -26.45063591003418, "global_step": 514021, "epoch": 6193} {"train_loss": -27.080951690673828, "global_step": 514022, "epoch": 6193} {"train_loss": -27.086095809936523, "global_step": 514023, "epoch": 6193} {"train_loss": -26.780670166015625, "global_step": 514024, "epoch": 6193} {"train_loss": -27.22478675842285, "global_step": 514025, "epoch": 6193} {"train_loss": -26.622678756713867, "global_step": 514026, "epoch": 6193} {"train_loss": -26.828617095947266, "global_step": 514027, "epoch": 6193} {"train_loss": -26.839218139648438, "global_step": 514028, "epoch": 6193} {"train_loss": -26.75054931640625, "global_step": 514029, "epoch": 6193} {"train_loss": -26.623807907104492, "global_step": 514030, "epoch": 6193} {"train_loss": -26.91792106628418, "global_step": 514031, "epoch": 6193} {"train_loss": -27.040800094604492, "global_step": 514032, "epoch": 6193} {"train_loss": -27.027454376220703, "global_step": 514033, "epoch": 6193} {"train_loss": -26.705602645874023, "global_step": 514034, "epoch": 6193} {"train_loss": -27.015851974487305, "global_step": 514035, "epoch": 6193} {"train_loss": -27.203948974609375, "global_step": 514036, "epoch": 6193} {"train_loss": -27.3344783782959, "global_step": 514037, "epoch": 6193} {"train_loss": -27.5970401763916, "global_step": 514038, "epoch": 6193} {"train_loss": -27.209394454956055, "global_step": 514039, "epoch": 6193} {"train_loss": -27.37018394470215, "global_step": 514040, "epoch": 6193} {"train_loss": -27.05731773376465, "global_step": 514041, "epoch": 6193} {"train_loss": -27.422290802001953, "global_step": 514042, "epoch": 6193} {"train_loss": -27.3292293548584, "global_step": 514043, "epoch": 6193} {"train_loss": -26.738056182861328, "global_step": 514044, "epoch": 6193} {"train_loss": -27.134408950805664, "global_step": 514045, "epoch": 6193} {"train_loss": -27.667133331298828, "global_step": 514046, "epoch": 6193} {"train_loss": -27.54011344909668, "global_step": 514047, "epoch": 6193} {"train_loss": -26.972570419311523, "global_step": 514048, "epoch": 6193} {"train_loss": -27.599029541015625, "global_step": 514049, "epoch": 6193} {"train_loss": -27.3057861328125, "global_step": 514050, "epoch": 6193} {"train_loss": -27.341949462890625, "global_step": 514051, "epoch": 6193} {"train_loss": -27.7515926361084, "global_step": 514052, "epoch": 6193} {"train_loss": -27.49964714050293, "global_step": 514053, "epoch": 6193} {"train_loss": -27.473596572875977, "global_step": 514054, "epoch": 6193} {"train_loss": -27.3521671295166, "global_step": 514055, "epoch": 6193} {"train_loss": -27.126678466796875, "global_step": 514056, "epoch": 6193} {"train_loss": -27.61606216430664, "global_step": 514057, "epoch": 6193} {"train_loss": -27.673248291015625, "global_step": 514058, "epoch": 6193} {"train_loss": -27.60038185119629, "global_step": 514059, "epoch": 6193} {"train_loss": -27.607046127319336, "global_step": 514060, "epoch": 6193} {"train_loss": -27.5996150970459, "global_step": 514061, "epoch": 6193} {"train_loss": -27.927963256835938, "global_step": 514062, "epoch": 6193} {"train_loss": -27.87611198425293, "global_step": 514063, "epoch": 6193} {"train_loss": -27.93474769592285, "global_step": 514064, "epoch": 6193} {"train_loss": -27.819311141967773, "global_step": 514065, "epoch": 6193} {"train_loss": -27.86762809753418, "global_step": 514066, "epoch": 6193} {"train_loss": -27.777759552001953, "global_step": 514067, "epoch": 6193} {"train_loss": -27.692663192749023, "global_step": 514068, "epoch": 6193} {"train_loss": -27.67171287536621, "global_step": 514069, "epoch": 6193} {"train_loss": -27.516199111938477, "global_step": 514070, "epoch": 6193} {"train_loss": -27.69940185546875, "global_step": 514071, "epoch": 6193} {"train_loss": -27.816553115844727, "global_step": 514072, "epoch": 6193} {"train_loss": -27.795515060424805, "global_step": 514073, "epoch": 6193} {"train_loss": -27.631759643554688, "global_step": 514074, "epoch": 6193} {"train_loss": -28.0725154876709, "global_step": 514075, "epoch": 6193} {"train_loss": -27.510746002197266, "global_step": 514076, "epoch": 6193} {"train_loss": -27.696807861328125, "global_step": 514077, "epoch": 6193} {"train_loss": -27.653039932250977, "global_step": 514078, "epoch": 6193} {"train_loss": -27.751819610595703, "global_step": 514079, "epoch": 6193} {"train_loss": -27.910062789916992, "global_step": 514080, "epoch": 6193} {"train_loss": -28.043548583984375, "global_step": 514081, "epoch": 6193} {"train_loss": -27.421802520751953, "global_step": 514082, "epoch": 6193} {"train_loss": -27.219404220581055, "global_step": 514083, "epoch": 6193} {"train_loss": -27.327566146850586, "global_step": 514084, "epoch": 6193} {"train_loss": -27.260360717773438, "global_step": 514085, "epoch": 6193} {"train_loss": -26.8021183013916, "global_step": 514086, "epoch": 6193} {"train_loss": -27.360675811767578, "global_step": 514087, "epoch": 6193} {"train_loss": -28.004261016845703, "global_step": 514088, "epoch": 6193} {"train_loss": -27.53302001953125, "global_step": 514089, "epoch": 6193} {"train_loss": -27.143301010131836, "global_step": 514090, "epoch": 6193} {"train_loss": -27.366987228393555, "global_step": 514091, "epoch": 6193} {"train_loss": -27.9049015045166, "global_step": 514092, "epoch": 6193} {"train_loss": -27.265918731689453, "global_step": 514093, "epoch": 6193} {"train_loss": -27.351886749267578, "global_step": 514094, "epoch": 6193} {"train_loss": -27.682424545288086, "global_step": 514095, "epoch": 6193} {"train_loss": -27.18073844909668, "global_step": 514096, "epoch": 6193} {"train_loss": -27.4032039642334, "global_step": 514097, "epoch": 6193} {"train_loss": -27.30575942993164, "global_step": 514098, "epoch": 6193} {"train_loss": -27.69366455078125, "global_step": 514099, "epoch": 6193} {"train_loss": -28.128250122070312, "global_step": 514100, "epoch": 6193} {"train_loss": -27.39333593988993, "global_step": 514101, "epoch": 6193, "val_loss": 6597903.0} {"train_loss": -26.938312530517578, "global_step": 514102, "epoch": 6194} {"train_loss": -26.893720626831055, "global_step": 514103, "epoch": 6194} {"train_loss": -27.358240127563477, "global_step": 514104, "epoch": 6194} {"train_loss": -27.5931396484375, "global_step": 514105, "epoch": 6194} {"train_loss": -27.004240036010742, "global_step": 514106, "epoch": 6194} {"train_loss": -27.30632972717285, "global_step": 514107, "epoch": 6194} {"train_loss": -26.786611557006836, "global_step": 514108, "epoch": 6194} {"train_loss": -26.937055587768555, "global_step": 514109, "epoch": 6194} {"train_loss": -27.5738525390625, "global_step": 514110, "epoch": 6194} {"train_loss": -27.203845977783203, "global_step": 514111, "epoch": 6194} {"train_loss": -26.6259708404541, "global_step": 514112, "epoch": 6194} {"train_loss": -27.499927520751953, "global_step": 514113, "epoch": 6194} {"train_loss": -27.101186752319336, "global_step": 514114, "epoch": 6194} {"train_loss": -27.151931762695312, "global_step": 514115, "epoch": 6194} {"train_loss": -26.882917404174805, "global_step": 514116, "epoch": 6194} {"train_loss": -26.792022705078125, "global_step": 514117, "epoch": 6194} {"train_loss": -26.803054809570312, "global_step": 514118, "epoch": 6194} {"train_loss": -26.97796058654785, "global_step": 514119, "epoch": 6194} {"train_loss": -27.485279083251953, "global_step": 514120, "epoch": 6194} {"train_loss": -27.920673370361328, "global_step": 514121, "epoch": 6194} {"train_loss": -26.83547019958496, "global_step": 514122, "epoch": 6194} {"train_loss": -27.140607833862305, "global_step": 514123, "epoch": 6194} {"train_loss": -27.570981979370117, "global_step": 514124, "epoch": 6194} {"train_loss": -27.029590606689453, "global_step": 514125, "epoch": 6194} {"train_loss": -27.201156616210938, "global_step": 514126, "epoch": 6194} {"train_loss": -27.721601486206055, "global_step": 514127, "epoch": 6194} {"train_loss": -27.2628231048584, "global_step": 514128, "epoch": 6194} {"train_loss": -27.806671142578125, "global_step": 514129, "epoch": 6194} {"train_loss": -27.36848258972168, "global_step": 514130, "epoch": 6194} {"train_loss": -27.31062126159668, "global_step": 514131, "epoch": 6194} {"train_loss": -27.721786499023438, "global_step": 514132, "epoch": 6194} {"train_loss": -27.49696159362793, "global_step": 514133, "epoch": 6194} {"train_loss": -27.513776779174805, "global_step": 514134, "epoch": 6194} {"train_loss": -27.670185089111328, "global_step": 514135, "epoch": 6194} {"train_loss": -27.50400161743164, "global_step": 514136, "epoch": 6194} {"train_loss": -27.554533004760742, "global_step": 514137, "epoch": 6194} {"train_loss": -27.586090087890625, "global_step": 514138, "epoch": 6194} {"train_loss": -27.59653091430664, "global_step": 514139, "epoch": 6194} {"train_loss": -27.178821563720703, "global_step": 514140, "epoch": 6194} {"train_loss": -27.703857421875, "global_step": 514141, "epoch": 6194} {"train_loss": -27.651870727539062, "global_step": 514142, "epoch": 6194} {"train_loss": -27.534605026245117, "global_step": 514143, "epoch": 6194} {"train_loss": -27.623212814331055, "global_step": 514144, "epoch": 6194} {"train_loss": -27.15266227722168, "global_step": 514145, "epoch": 6194} {"train_loss": -27.937942504882812, "global_step": 514146, "epoch": 6194} {"train_loss": -27.304899215698242, "global_step": 514147, "epoch": 6194} {"train_loss": -27.258264541625977, "global_step": 514148, "epoch": 6194} {"train_loss": -27.517724990844727, "global_step": 514149, "epoch": 6194} {"train_loss": -27.558141708374023, "global_step": 514150, "epoch": 6194} {"train_loss": -27.297504425048828, "global_step": 514151, "epoch": 6194} {"train_loss": -27.376615524291992, "global_step": 514152, "epoch": 6194} {"train_loss": -27.269773483276367, "global_step": 514153, "epoch": 6194} {"train_loss": -27.247114181518555, "global_step": 514154, "epoch": 6194} {"train_loss": -27.6943359375, "global_step": 514155, "epoch": 6194} {"train_loss": -27.806604385375977, "global_step": 514156, "epoch": 6194} {"train_loss": -27.797901153564453, "global_step": 514157, "epoch": 6194} {"train_loss": -27.5692195892334, "global_step": 514158, "epoch": 6194} {"train_loss": -27.632450103759766, "global_step": 514159, "epoch": 6194} {"train_loss": -27.495031356811523, "global_step": 514160, "epoch": 6194} {"train_loss": -28.17352294921875, "global_step": 514161, "epoch": 6194} {"train_loss": -27.705860137939453, "global_step": 514162, "epoch": 6194} {"train_loss": -27.663700103759766, "global_step": 514163, "epoch": 6194} {"train_loss": -27.724145889282227, "global_step": 514164, "epoch": 6194} {"train_loss": -27.674930572509766, "global_step": 514165, "epoch": 6194} {"train_loss": -27.622699737548828, "global_step": 514166, "epoch": 6194} {"train_loss": -27.584070205688477, "global_step": 514167, "epoch": 6194} {"train_loss": -27.60328483581543, "global_step": 514168, "epoch": 6194} {"train_loss": -27.569849014282227, "global_step": 514169, "epoch": 6194} {"train_loss": -27.443490982055664, "global_step": 514170, "epoch": 6194} {"train_loss": -27.901350021362305, "global_step": 514171, "epoch": 6194} {"train_loss": -27.259754180908203, "global_step": 514172, "epoch": 6194} {"train_loss": -27.834430694580078, "global_step": 514173, "epoch": 6194} {"train_loss": -27.597793579101562, "global_step": 514174, "epoch": 6194} {"train_loss": -27.5603084564209, "global_step": 514175, "epoch": 6194} {"train_loss": -27.31610679626465, "global_step": 514176, "epoch": 6194} {"train_loss": -27.55712890625, "global_step": 514177, "epoch": 6194} {"train_loss": -27.13355827331543, "global_step": 514178, "epoch": 6194} {"train_loss": -26.074243545532227, "global_step": 514179, "epoch": 6194} {"train_loss": -26.291494369506836, "global_step": 514180, "epoch": 6194} {"train_loss": -26.127485275268555, "global_step": 514181, "epoch": 6194} {"train_loss": -26.9020938873291, "global_step": 514182, "epoch": 6194} {"train_loss": -27.3914794921875, "global_step": 514183, "epoch": 6194} {"train_loss": -27.356746696564088, "global_step": 514184, "epoch": 6194, "val_loss": 6689344.5} {"train_loss": -24.90839958190918, "global_step": 514185, "epoch": 6195} {"train_loss": -26.263036727905273, "global_step": 514186, "epoch": 6195} {"train_loss": -26.216815948486328, "global_step": 514187, "epoch": 6195} {"train_loss": -26.017044067382812, "global_step": 514188, "epoch": 6195} {"train_loss": -26.25444984436035, "global_step": 514189, "epoch": 6195} {"train_loss": -26.38567543029785, "global_step": 514190, "epoch": 6195} {"train_loss": -26.050968170166016, "global_step": 514191, "epoch": 6195} {"train_loss": -26.570402145385742, "global_step": 514192, "epoch": 6195} {"train_loss": -26.296823501586914, "global_step": 514193, "epoch": 6195} {"train_loss": -26.6433162689209, "global_step": 514194, "epoch": 6195} {"train_loss": -26.5988826751709, "global_step": 514195, "epoch": 6195} {"train_loss": -26.57478141784668, "global_step": 514196, "epoch": 6195} {"train_loss": -26.12891960144043, "global_step": 514197, "epoch": 6195} {"train_loss": -26.613239288330078, "global_step": 514198, "epoch": 6195} {"train_loss": -26.234167098999023, "global_step": 514199, "epoch": 6195} {"train_loss": -26.56977653503418, "global_step": 514200, "epoch": 6195} {"train_loss": -26.732257843017578, "global_step": 514201, "epoch": 6195} {"train_loss": -27.04627799987793, "global_step": 514202, "epoch": 6195} {"train_loss": -27.12617301940918, "global_step": 514203, "epoch": 6195} {"train_loss": -26.5705509185791, "global_step": 514204, "epoch": 6195} {"train_loss": -27.168176651000977, "global_step": 514205, "epoch": 6195} {"train_loss": -26.876819610595703, "global_step": 514206, "epoch": 6195} {"train_loss": -26.975133895874023, "global_step": 514207, "epoch": 6195} {"train_loss": -27.0023136138916, "global_step": 514208, "epoch": 6195} {"train_loss": -26.8687744140625, "global_step": 514209, "epoch": 6195} {"train_loss": -26.76836585998535, "global_step": 514210, "epoch": 6195} {"train_loss": -26.953237533569336, "global_step": 514211, "epoch": 6195} {"train_loss": -26.919010162353516, "global_step": 514212, "epoch": 6195} {"train_loss": -27.40541648864746, "global_step": 514213, "epoch": 6195} {"train_loss": -27.21949577331543, "global_step": 514214, "epoch": 6195} {"train_loss": -27.243005752563477, "global_step": 514215, "epoch": 6195} {"train_loss": -27.249502182006836, "global_step": 514216, "epoch": 6195} {"train_loss": -27.047754287719727, "global_step": 514217, "epoch": 6195} {"train_loss": -27.356592178344727, "global_step": 514218, "epoch": 6195} {"train_loss": -27.687421798706055, "global_step": 514219, "epoch": 6195} {"train_loss": -27.344558715820312, "global_step": 514220, "epoch": 6195} {"train_loss": -27.22456169128418, "global_step": 514221, "epoch": 6195} {"train_loss": -27.376996994018555, "global_step": 514222, "epoch": 6195} {"train_loss": -27.577512741088867, "global_step": 514223, "epoch": 6195} {"train_loss": -27.36747169494629, "global_step": 514224, "epoch": 6195} {"train_loss": -27.62412452697754, "global_step": 514225, "epoch": 6195} {"train_loss": -27.161212921142578, "global_step": 514226, "epoch": 6195} {"train_loss": -27.382537841796875, "global_step": 514227, "epoch": 6195} {"train_loss": -27.625690460205078, "global_step": 514228, "epoch": 6195} {"train_loss": -27.791906356811523, "global_step": 514229, "epoch": 6195} {"train_loss": -28.15018081665039, "global_step": 514230, "epoch": 6195} {"train_loss": -27.590978622436523, "global_step": 514231, "epoch": 6195} {"train_loss": -27.291522979736328, "global_step": 514232, "epoch": 6195} {"train_loss": -27.646137237548828, "global_step": 514233, "epoch": 6195} {"train_loss": -27.515777587890625, "global_step": 514234, "epoch": 6195} {"train_loss": -27.67084312438965, "global_step": 514235, "epoch": 6195} {"train_loss": -27.70770263671875, "global_step": 514236, "epoch": 6195} {"train_loss": -27.740375518798828, "global_step": 514237, "epoch": 6195} {"train_loss": -27.443578720092773, "global_step": 514238, "epoch": 6195} {"train_loss": -27.53289794921875, "global_step": 514239, "epoch": 6195} {"train_loss": -27.394256591796875, "global_step": 514240, "epoch": 6195} {"train_loss": -27.801239013671875, "global_step": 514241, "epoch": 6195} {"train_loss": -27.19879150390625, "global_step": 514242, "epoch": 6195} {"train_loss": -27.76700782775879, "global_step": 514243, "epoch": 6195} {"train_loss": -27.726490020751953, "global_step": 514244, "epoch": 6195} {"train_loss": -27.766590118408203, "global_step": 514245, "epoch": 6195} {"train_loss": -27.683801651000977, "global_step": 514246, "epoch": 6195} {"train_loss": -27.9305362701416, "global_step": 514247, "epoch": 6195} {"train_loss": -27.7596435546875, "global_step": 514248, "epoch": 6195} {"train_loss": -27.666601181030273, "global_step": 514249, "epoch": 6195} {"train_loss": -27.436288833618164, "global_step": 514250, "epoch": 6195} {"train_loss": -27.994138717651367, "global_step": 514251, "epoch": 6195} {"train_loss": -27.842493057250977, "global_step": 514252, "epoch": 6195} {"train_loss": -27.75444984436035, "global_step": 514253, "epoch": 6195} {"train_loss": -27.720258712768555, "global_step": 514254, "epoch": 6195} {"train_loss": -27.644092559814453, "global_step": 514255, "epoch": 6195} {"train_loss": -27.96278190612793, "global_step": 514256, "epoch": 6195} {"train_loss": -27.583454132080078, "global_step": 514257, "epoch": 6195} {"train_loss": -27.620031356811523, "global_step": 514258, "epoch": 6195} {"train_loss": -27.547372817993164, "global_step": 514259, "epoch": 6195} {"train_loss": -27.967065811157227, "global_step": 514260, "epoch": 6195} {"train_loss": -27.591482162475586, "global_step": 514261, "epoch": 6195} {"train_loss": -27.8705997467041, "global_step": 514262, "epoch": 6195} {"train_loss": -27.625930786132812, "global_step": 514263, "epoch": 6195} {"train_loss": -27.169431686401367, "global_step": 514264, "epoch": 6195} {"train_loss": -27.393598556518555, "global_step": 514265, "epoch": 6195} {"train_loss": -26.96481704711914, "global_step": 514266, "epoch": 6195} {"train_loss": -27.216729612235564, "global_step": 514267, "epoch": 6195, "val_loss": 6655343.0} {"train_loss": -26.87235450744629, "global_step": 514268, "epoch": 6196} {"train_loss": -26.325531005859375, "global_step": 514269, "epoch": 6196} {"train_loss": -26.506927490234375, "global_step": 514270, "epoch": 6196} {"train_loss": -26.43729019165039, "global_step": 514271, "epoch": 6196} {"train_loss": -27.030935287475586, "global_step": 514272, "epoch": 6196} {"train_loss": -26.89141273498535, "global_step": 514273, "epoch": 6196} {"train_loss": -27.20771598815918, "global_step": 514274, "epoch": 6196} {"train_loss": -27.228200912475586, "global_step": 514275, "epoch": 6196} {"train_loss": -27.11640739440918, "global_step": 514276, "epoch": 6196} {"train_loss": -27.06812858581543, "global_step": 514277, "epoch": 6196} {"train_loss": -27.285505294799805, "global_step": 514278, "epoch": 6196} {"train_loss": -26.787158966064453, "global_step": 514279, "epoch": 6196} {"train_loss": -27.03419303894043, "global_step": 514280, "epoch": 6196} {"train_loss": -26.940521240234375, "global_step": 514281, "epoch": 6196} {"train_loss": -27.34185218811035, "global_step": 514282, "epoch": 6196} {"train_loss": -27.631982803344727, "global_step": 514283, "epoch": 6196} {"train_loss": -27.317014694213867, "global_step": 514284, "epoch": 6196} {"train_loss": -27.538232803344727, "global_step": 514285, "epoch": 6196} {"train_loss": -27.128271102905273, "global_step": 514286, "epoch": 6196} {"train_loss": -27.63477897644043, "global_step": 514287, "epoch": 6196} {"train_loss": -27.23259925842285, "global_step": 514288, "epoch": 6196} {"train_loss": -27.415807723999023, "global_step": 514289, "epoch": 6196} {"train_loss": -27.240966796875, "global_step": 514290, "epoch": 6196} {"train_loss": -27.101215362548828, "global_step": 514291, "epoch": 6196} {"train_loss": -27.544281005859375, "global_step": 514292, "epoch": 6196} {"train_loss": -27.427656173706055, "global_step": 514293, "epoch": 6196} {"train_loss": -27.546960830688477, "global_step": 514294, "epoch": 6196} {"train_loss": -27.457677841186523, "global_step": 514295, "epoch": 6196} {"train_loss": -27.443927764892578, "global_step": 514296, "epoch": 6196} {"train_loss": -27.534162521362305, "global_step": 514297, "epoch": 6196} {"train_loss": -27.503538131713867, "global_step": 514298, "epoch": 6196} {"train_loss": -27.512754440307617, "global_step": 514299, "epoch": 6196} {"train_loss": -27.725299835205078, "global_step": 514300, "epoch": 6196} {"train_loss": -27.712671279907227, "global_step": 514301, "epoch": 6196} {"train_loss": -27.54377555847168, "global_step": 514302, "epoch": 6196} {"train_loss": -27.68763542175293, "global_step": 514303, "epoch": 6196} {"train_loss": -27.564355850219727, "global_step": 514304, "epoch": 6196} {"train_loss": -27.750244140625, "global_step": 514305, "epoch": 6196} {"train_loss": -27.581151962280273, "global_step": 514306, "epoch": 6196} {"train_loss": -27.745471954345703, "global_step": 514307, "epoch": 6196} {"train_loss": -27.821313858032227, "global_step": 514308, "epoch": 6196} {"train_loss": -27.435758590698242, "global_step": 514309, "epoch": 6196} {"train_loss": -27.66233253479004, "global_step": 514310, "epoch": 6196} {"train_loss": -27.365446090698242, "global_step": 514311, "epoch": 6196} {"train_loss": -27.866540908813477, "global_step": 514312, "epoch": 6196} {"train_loss": -27.6082820892334, "global_step": 514313, "epoch": 6196} {"train_loss": -27.459692001342773, "global_step": 514314, "epoch": 6196} {"train_loss": -27.67949867248535, "global_step": 514315, "epoch": 6196} {"train_loss": -27.40134620666504, "global_step": 514316, "epoch": 6196} {"train_loss": -27.47064208984375, "global_step": 514317, "epoch": 6196} {"train_loss": -27.529455184936523, "global_step": 514318, "epoch": 6196} {"train_loss": -27.39398193359375, "global_step": 514319, "epoch": 6196} {"train_loss": -27.370849609375, "global_step": 514320, "epoch": 6196} {"train_loss": -27.562543869018555, "global_step": 514321, "epoch": 6196} {"train_loss": -27.60487174987793, "global_step": 514322, "epoch": 6196} {"train_loss": -27.461597442626953, "global_step": 514323, "epoch": 6196} {"train_loss": -27.414398193359375, "global_step": 514324, "epoch": 6196} {"train_loss": -27.41973304748535, "global_step": 514325, "epoch": 6196} {"train_loss": -27.783674240112305, "global_step": 514326, "epoch": 6196} {"train_loss": -27.739776611328125, "global_step": 514327, "epoch": 6196} {"train_loss": -27.489490509033203, "global_step": 514328, "epoch": 6196} {"train_loss": -28.02094078063965, "global_step": 514329, "epoch": 6196} {"train_loss": -27.95339012145996, "global_step": 514330, "epoch": 6196} {"train_loss": -27.315031051635742, "global_step": 514331, "epoch": 6196} {"train_loss": -27.539335250854492, "global_step": 514332, "epoch": 6196} {"train_loss": -27.012964248657227, "global_step": 514333, "epoch": 6196} {"train_loss": -27.53566551208496, "global_step": 514334, "epoch": 6196} {"train_loss": -27.066207885742188, "global_step": 514335, "epoch": 6196} {"train_loss": -26.902755737304688, "global_step": 514336, "epoch": 6196} {"train_loss": -27.441904067993164, "global_step": 514337, "epoch": 6196} {"train_loss": -27.555524826049805, "global_step": 514338, "epoch": 6196} {"train_loss": -27.4388427734375, "global_step": 514339, "epoch": 6196} {"train_loss": -27.1966495513916, "global_step": 514340, "epoch": 6196} {"train_loss": -27.36884117126465, "global_step": 514341, "epoch": 6196} {"train_loss": -27.780012130737305, "global_step": 514342, "epoch": 6196} {"train_loss": -27.691831588745117, "global_step": 514343, "epoch": 6196} {"train_loss": -27.482349395751953, "global_step": 514344, "epoch": 6196} {"train_loss": -27.71797752380371, "global_step": 514345, "epoch": 6196} {"train_loss": -27.65688133239746, "global_step": 514346, "epoch": 6196} {"train_loss": -27.81671142578125, "global_step": 514347, "epoch": 6196} {"train_loss": -27.512821197509766, "global_step": 514348, "epoch": 6196} {"train_loss": -27.102933883666992, "global_step": 514349, "epoch": 6196} {"train_loss": -27.40204489374735, "global_step": 514350, "epoch": 6196, "val_loss": 6554793.0} {"train_loss": -26.5645751953125, "global_step": 514351, "epoch": 6197} {"train_loss": -27.313129425048828, "global_step": 514352, "epoch": 6197} {"train_loss": -27.100027084350586, "global_step": 514353, "epoch": 6197} {"train_loss": -27.052906036376953, "global_step": 514354, "epoch": 6197} {"train_loss": -27.48578453063965, "global_step": 514355, "epoch": 6197} {"train_loss": -26.710988998413086, "global_step": 514356, "epoch": 6197} {"train_loss": -26.825525283813477, "global_step": 514357, "epoch": 6197} {"train_loss": -27.214385986328125, "global_step": 514358, "epoch": 6197} {"train_loss": -27.140594482421875, "global_step": 514359, "epoch": 6197} {"train_loss": -27.004316329956055, "global_step": 514360, "epoch": 6197} {"train_loss": -26.954639434814453, "global_step": 514361, "epoch": 6197} {"train_loss": -27.4785099029541, "global_step": 514362, "epoch": 6197} {"train_loss": -27.430023193359375, "global_step": 514363, "epoch": 6197} {"train_loss": -27.5400390625, "global_step": 514364, "epoch": 6197} {"train_loss": -27.449949264526367, "global_step": 514365, "epoch": 6197} {"train_loss": -27.081785202026367, "global_step": 514366, "epoch": 6197} {"train_loss": -27.416461944580078, "global_step": 514367, "epoch": 6197} {"train_loss": -27.40290641784668, "global_step": 514368, "epoch": 6197} {"train_loss": -27.2384090423584, "global_step": 514369, "epoch": 6197} {"train_loss": -27.364337921142578, "global_step": 514370, "epoch": 6197} {"train_loss": -27.30780029296875, "global_step": 514371, "epoch": 6197} {"train_loss": -27.89401626586914, "global_step": 514372, "epoch": 6197} {"train_loss": -27.196109771728516, "global_step": 514373, "epoch": 6197} {"train_loss": -27.33575439453125, "global_step": 514374, "epoch": 6197} {"train_loss": -27.051483154296875, "global_step": 514375, "epoch": 6197} {"train_loss": -27.430179595947266, "global_step": 514376, "epoch": 6197} {"train_loss": -27.46028709411621, "global_step": 514377, "epoch": 6197} {"train_loss": -27.153919219970703, "global_step": 514378, "epoch": 6197} {"train_loss": -27.056732177734375, "global_step": 514379, "epoch": 6197} {"train_loss": -27.386205673217773, "global_step": 514380, "epoch": 6197} {"train_loss": -27.293798446655273, "global_step": 514381, "epoch": 6197} {"train_loss": -27.298105239868164, "global_step": 514382, "epoch": 6197} {"train_loss": -27.076129913330078, "global_step": 514383, "epoch": 6197} {"train_loss": -27.273202896118164, "global_step": 514384, "epoch": 6197} {"train_loss": -27.396503448486328, "global_step": 514385, "epoch": 6197} {"train_loss": -27.228748321533203, "global_step": 514386, "epoch": 6197} {"train_loss": -27.077041625976562, "global_step": 514387, "epoch": 6197} {"train_loss": -27.827423095703125, "global_step": 514388, "epoch": 6197} {"train_loss": -26.89509391784668, "global_step": 514389, "epoch": 6197} {"train_loss": -27.112384796142578, "global_step": 514390, "epoch": 6197} {"train_loss": -27.47067642211914, "global_step": 514391, "epoch": 6197} {"train_loss": -26.966388702392578, "global_step": 514392, "epoch": 6197} {"train_loss": -27.028827667236328, "global_step": 514393, "epoch": 6197} {"train_loss": -27.516870498657227, "global_step": 514394, "epoch": 6197} {"train_loss": -27.31336784362793, "global_step": 514395, "epoch": 6197} {"train_loss": -26.81817626953125, "global_step": 514396, "epoch": 6197} {"train_loss": -27.12308692932129, "global_step": 514397, "epoch": 6197} {"train_loss": -27.137622833251953, "global_step": 514398, "epoch": 6197} {"train_loss": -27.330982208251953, "global_step": 514399, "epoch": 6197} {"train_loss": -27.2349796295166, "global_step": 514400, "epoch": 6197} {"train_loss": -27.043243408203125, "global_step": 514401, "epoch": 6197} {"train_loss": -27.384571075439453, "global_step": 514402, "epoch": 6197} {"train_loss": -27.220840454101562, "global_step": 514403, "epoch": 6197} {"train_loss": -27.3522891998291, "global_step": 514404, "epoch": 6197} {"train_loss": -27.2525577545166, "global_step": 514405, "epoch": 6197} {"train_loss": -26.39774513244629, "global_step": 514406, "epoch": 6197} {"train_loss": -26.73451042175293, "global_step": 514407, "epoch": 6197} {"train_loss": -27.2996768951416, "global_step": 514408, "epoch": 6197} {"train_loss": -27.115039825439453, "global_step": 514409, "epoch": 6197} {"train_loss": -27.037504196166992, "global_step": 514410, "epoch": 6197} {"train_loss": -26.537555694580078, "global_step": 514411, "epoch": 6197} {"train_loss": -27.192800521850586, "global_step": 514412, "epoch": 6197} {"train_loss": -27.484689712524414, "global_step": 514413, "epoch": 6197} {"train_loss": -27.4509220123291, "global_step": 514414, "epoch": 6197} {"train_loss": -27.062580108642578, "global_step": 514415, "epoch": 6197} {"train_loss": -28.12923240661621, "global_step": 514416, "epoch": 6197} {"train_loss": -27.6554012298584, "global_step": 514417, "epoch": 6197} {"train_loss": -27.40742301940918, "global_step": 514418, "epoch": 6197} {"train_loss": -27.368173599243164, "global_step": 514419, "epoch": 6197} {"train_loss": -27.71919059753418, "global_step": 514420, "epoch": 6197} {"train_loss": -27.734851837158203, "global_step": 514421, "epoch": 6197} {"train_loss": -27.65789222717285, "global_step": 514422, "epoch": 6197} {"train_loss": -27.1749210357666, "global_step": 514423, "epoch": 6197} {"train_loss": -27.489919662475586, "global_step": 514424, "epoch": 6197} {"train_loss": -27.792255401611328, "global_step": 514425, "epoch": 6197} {"train_loss": -27.495574951171875, "global_step": 514426, "epoch": 6197} {"train_loss": -27.256103515625, "global_step": 514427, "epoch": 6197} {"train_loss": -27.719778060913086, "global_step": 514428, "epoch": 6197} {"train_loss": -27.654876708984375, "global_step": 514429, "epoch": 6197} {"train_loss": -27.515222549438477, "global_step": 514430, "epoch": 6197} {"train_loss": -27.711042404174805, "global_step": 514431, "epoch": 6197} {"train_loss": -27.678354263305664, "global_step": 514432, "epoch": 6197} {"train_loss": -27.27229256227792, "global_step": 514433, "epoch": 6197, "val_loss": 6673148.0} {"train_loss": -26.825958251953125, "global_step": 514434, "epoch": 6198} {"train_loss": -27.158645629882812, "global_step": 514435, "epoch": 6198} {"train_loss": -26.972761154174805, "global_step": 514436, "epoch": 6198} {"train_loss": -27.156982421875, "global_step": 514437, "epoch": 6198} {"train_loss": -26.782562255859375, "global_step": 514438, "epoch": 6198} {"train_loss": -26.921728134155273, "global_step": 514439, "epoch": 6198} {"train_loss": -27.028833389282227, "global_step": 514440, "epoch": 6198} {"train_loss": -27.25687599182129, "global_step": 514441, "epoch": 6198} {"train_loss": -26.989933013916016, "global_step": 514442, "epoch": 6198} {"train_loss": -27.66716957092285, "global_step": 514443, "epoch": 6198} {"train_loss": -27.6320743560791, "global_step": 514444, "epoch": 6198} {"train_loss": -27.39849281311035, "global_step": 514445, "epoch": 6198} {"train_loss": -27.723388671875, "global_step": 514446, "epoch": 6198} {"train_loss": -27.441755294799805, "global_step": 514447, "epoch": 6198} {"train_loss": -27.5705509185791, "global_step": 514448, "epoch": 6198} {"train_loss": -27.260046005249023, "global_step": 514449, "epoch": 6198} {"train_loss": -27.614038467407227, "global_step": 514450, "epoch": 6198} {"train_loss": -27.535367965698242, "global_step": 514451, "epoch": 6198} {"train_loss": -27.562253952026367, "global_step": 514452, "epoch": 6198} {"train_loss": -27.168699264526367, "global_step": 514453, "epoch": 6198} {"train_loss": -27.000934600830078, "global_step": 514454, "epoch": 6198} {"train_loss": -27.66224479675293, "global_step": 514455, "epoch": 6198} {"train_loss": -27.41180992126465, "global_step": 514456, "epoch": 6198} {"train_loss": -27.636962890625, "global_step": 514457, "epoch": 6198} {"train_loss": -27.422962188720703, "global_step": 514458, "epoch": 6198} {"train_loss": -27.73322868347168, "global_step": 514459, "epoch": 6198} {"train_loss": -27.508909225463867, "global_step": 514460, "epoch": 6198} {"train_loss": -27.175983428955078, "global_step": 514461, "epoch": 6198} {"train_loss": -27.27044677734375, "global_step": 514462, "epoch": 6198} {"train_loss": -27.680585861206055, "global_step": 514463, "epoch": 6198} {"train_loss": -26.8656005859375, "global_step": 514464, "epoch": 6198} {"train_loss": -27.379674911499023, "global_step": 514465, "epoch": 6198} {"train_loss": -27.592329025268555, "global_step": 514466, "epoch": 6198} {"train_loss": -27.5434627532959, "global_step": 514467, "epoch": 6198} {"train_loss": -27.606107711791992, "global_step": 514468, "epoch": 6198} {"train_loss": -27.55624771118164, "global_step": 514469, "epoch": 6198} {"train_loss": -27.50314712524414, "global_step": 514470, "epoch": 6198} {"train_loss": -27.668283462524414, "global_step": 514471, "epoch": 6198} {"train_loss": -27.637060165405273, "global_step": 514472, "epoch": 6198} {"train_loss": -27.487241744995117, "global_step": 514473, "epoch": 6198} {"train_loss": -27.448577880859375, "global_step": 514474, "epoch": 6198} {"train_loss": -27.375198364257812, "global_step": 514475, "epoch": 6198} {"train_loss": -27.44221305847168, "global_step": 514476, "epoch": 6198} {"train_loss": -27.4858455657959, "global_step": 514477, "epoch": 6198} {"train_loss": -27.6550235748291, "global_step": 514478, "epoch": 6198} {"train_loss": -27.103519439697266, "global_step": 514479, "epoch": 6198} {"train_loss": -27.359670639038086, "global_step": 514480, "epoch": 6198} {"train_loss": -28.08332633972168, "global_step": 514481, "epoch": 6198} {"train_loss": -27.579864501953125, "global_step": 514482, "epoch": 6198} {"train_loss": -27.955230712890625, "global_step": 514483, "epoch": 6198} {"train_loss": -27.91542625427246, "global_step": 514484, "epoch": 6198} {"train_loss": -27.735509872436523, "global_step": 514485, "epoch": 6198} {"train_loss": -27.539234161376953, "global_step": 514486, "epoch": 6198} {"train_loss": -27.322589874267578, "global_step": 514487, "epoch": 6198} {"train_loss": -27.655210494995117, "global_step": 514488, "epoch": 6198} {"train_loss": -27.875885009765625, "global_step": 514489, "epoch": 6198} {"train_loss": -27.588102340698242, "global_step": 514490, "epoch": 6198} {"train_loss": -27.750879287719727, "global_step": 514491, "epoch": 6198} {"train_loss": -27.50493812561035, "global_step": 514492, "epoch": 6198} {"train_loss": -27.5972957611084, "global_step": 514493, "epoch": 6198} {"train_loss": -27.529890060424805, "global_step": 514494, "epoch": 6198} {"train_loss": -27.637378692626953, "global_step": 514495, "epoch": 6198} {"train_loss": -27.812780380249023, "global_step": 514496, "epoch": 6198} {"train_loss": -27.373212814331055, "global_step": 514497, "epoch": 6198} {"train_loss": -27.398395538330078, "global_step": 514498, "epoch": 6198} {"train_loss": -27.689542770385742, "global_step": 514499, "epoch": 6198} {"train_loss": -27.700927734375, "global_step": 514500, "epoch": 6198} {"train_loss": -27.828693389892578, "global_step": 514501, "epoch": 6198} {"train_loss": -27.727264404296875, "global_step": 514502, "epoch": 6198} {"train_loss": -27.522083282470703, "global_step": 514503, "epoch": 6198} {"train_loss": -26.990585327148438, "global_step": 514504, "epoch": 6198} {"train_loss": -27.380395889282227, "global_step": 514505, "epoch": 6198} {"train_loss": -26.956302642822266, "global_step": 514506, "epoch": 6198} {"train_loss": -26.632904052734375, "global_step": 514507, "epoch": 6198} {"train_loss": -27.177814483642578, "global_step": 514508, "epoch": 6198} {"train_loss": -27.66228675842285, "global_step": 514509, "epoch": 6198} {"train_loss": -27.067520141601562, "global_step": 514510, "epoch": 6198} {"train_loss": -27.055273056030273, "global_step": 514511, "epoch": 6198} {"train_loss": -27.563241958618164, "global_step": 514512, "epoch": 6198} {"train_loss": -27.6309814453125, "global_step": 514513, "epoch": 6198} {"train_loss": -27.26240348815918, "global_step": 514514, "epoch": 6198} {"train_loss": -27.4005184173584, "global_step": 514515, "epoch": 6198} {"train_loss": -27.457368322165614, "global_step": 514516, "epoch": 6198, "val_loss": 6697000.5} {"train_loss": -25.475542068481445, "global_step": 514517, "epoch": 6199} {"train_loss": -25.919418334960938, "global_step": 514518, "epoch": 6199} {"train_loss": -25.258955001831055, "global_step": 514519, "epoch": 6199} {"train_loss": -25.908771514892578, "global_step": 514520, "epoch": 6199} {"train_loss": -26.232440948486328, "global_step": 514521, "epoch": 6199} {"train_loss": -25.717609405517578, "global_step": 514522, "epoch": 6199} {"train_loss": -26.074142456054688, "global_step": 514523, "epoch": 6199} {"train_loss": -26.022314071655273, "global_step": 514524, "epoch": 6199} {"train_loss": -26.574934005737305, "global_step": 514525, "epoch": 6199} {"train_loss": -26.5388240814209, "global_step": 514526, "epoch": 6199} {"train_loss": -26.905426025390625, "global_step": 514527, "epoch": 6199} {"train_loss": -26.227720260620117, "global_step": 514528, "epoch": 6199} {"train_loss": -26.479299545288086, "global_step": 514529, "epoch": 6199} {"train_loss": -26.620258331298828, "global_step": 514530, "epoch": 6199} {"train_loss": -26.58991050720215, "global_step": 514531, "epoch": 6199} {"train_loss": -26.90646743774414, "global_step": 514532, "epoch": 6199} {"train_loss": -26.866918563842773, "global_step": 514533, "epoch": 6199} {"train_loss": -26.7360782623291, "global_step": 514534, "epoch": 6199} {"train_loss": -26.745275497436523, "global_step": 514535, "epoch": 6199} {"train_loss": -26.88172721862793, "global_step": 514536, "epoch": 6199} {"train_loss": -26.878345489501953, "global_step": 514537, "epoch": 6199} {"train_loss": -26.72391700744629, "global_step": 514538, "epoch": 6199} {"train_loss": -27.323759078979492, "global_step": 514539, "epoch": 6199} {"train_loss": -27.032215118408203, "global_step": 514540, "epoch": 6199} {"train_loss": -27.05360221862793, "global_step": 514541, "epoch": 6199} {"train_loss": -26.97810173034668, "global_step": 514542, "epoch": 6199} {"train_loss": -27.18206787109375, "global_step": 514543, "epoch": 6199} {"train_loss": -27.183561325073242, "global_step": 514544, "epoch": 6199} {"train_loss": -27.10451316833496, "global_step": 514545, "epoch": 6199} {"train_loss": -27.1079044342041, "global_step": 514546, "epoch": 6199} {"train_loss": -27.047983169555664, "global_step": 514547, "epoch": 6199} {"train_loss": -27.10418128967285, "global_step": 514548, "epoch": 6199} {"train_loss": -27.52137565612793, "global_step": 514549, "epoch": 6199} {"train_loss": -27.374698638916016, "global_step": 514550, "epoch": 6199} {"train_loss": -27.078882217407227, "global_step": 514551, "epoch": 6199} {"train_loss": -27.362905502319336, "global_step": 514552, "epoch": 6199} {"train_loss": -27.420011520385742, "global_step": 514553, "epoch": 6199} {"train_loss": -27.440082550048828, "global_step": 514554, "epoch": 6199} {"train_loss": -27.43153953552246, "global_step": 514555, "epoch": 6199} {"train_loss": -27.52191162109375, "global_step": 514556, "epoch": 6199} {"train_loss": -27.625837326049805, "global_step": 514557, "epoch": 6199} {"train_loss": -27.39766502380371, "global_step": 514558, "epoch": 6199} {"train_loss": -27.59299087524414, "global_step": 514559, "epoch": 6199} {"train_loss": -27.49726676940918, "global_step": 514560, "epoch": 6199} {"train_loss": -27.488866806030273, "global_step": 514561, "epoch": 6199} {"train_loss": -27.424726486206055, "global_step": 514562, "epoch": 6199} {"train_loss": -27.397327423095703, "global_step": 514563, "epoch": 6199} {"train_loss": -27.58953285217285, "global_step": 514564, "epoch": 6199} {"train_loss": -27.40751075744629, "global_step": 514565, "epoch": 6199} {"train_loss": -27.331989288330078, "global_step": 514566, "epoch": 6199} {"train_loss": -27.601776123046875, "global_step": 514567, "epoch": 6199} {"train_loss": -27.57940673828125, "global_step": 514568, "epoch": 6199} {"train_loss": -27.371137619018555, "global_step": 514569, "epoch": 6199} {"train_loss": -27.5494327545166, "global_step": 514570, "epoch": 6199} {"train_loss": -27.613142013549805, "global_step": 514571, "epoch": 6199} {"train_loss": -27.667539596557617, "global_step": 514572, "epoch": 6199} {"train_loss": -27.68964195251465, "global_step": 514573, "epoch": 6199} {"train_loss": -27.465961456298828, "global_step": 514574, "epoch": 6199} {"train_loss": -27.454681396484375, "global_step": 514575, "epoch": 6199} {"train_loss": -27.76344108581543, "global_step": 514576, "epoch": 6199} {"train_loss": -27.651214599609375, "global_step": 514577, "epoch": 6199} {"train_loss": -27.686811447143555, "global_step": 514578, "epoch": 6199} {"train_loss": -27.654743194580078, "global_step": 514579, "epoch": 6199} {"train_loss": -27.025653839111328, "global_step": 514580, "epoch": 6199} {"train_loss": -27.33254051208496, "global_step": 514581, "epoch": 6199} {"train_loss": -27.295495986938477, "global_step": 514582, "epoch": 6199} {"train_loss": -27.589262008666992, "global_step": 514583, "epoch": 6199} {"train_loss": -27.447906494140625, "global_step": 514584, "epoch": 6199} {"train_loss": -27.292694091796875, "global_step": 514585, "epoch": 6199} {"train_loss": -27.49207878112793, "global_step": 514586, "epoch": 6199} {"train_loss": -27.16546058654785, "global_step": 514587, "epoch": 6199} {"train_loss": -26.949369430541992, "global_step": 514588, "epoch": 6199} {"train_loss": -26.69936180114746, "global_step": 514589, "epoch": 6199} {"train_loss": -27.08222770690918, "global_step": 514590, "epoch": 6199} {"train_loss": -27.052947998046875, "global_step": 514591, "epoch": 6199} {"train_loss": -27.506790161132812, "global_step": 514592, "epoch": 6199} {"train_loss": -27.328277587890625, "global_step": 514593, "epoch": 6199} {"train_loss": -27.55179214477539, "global_step": 514594, "epoch": 6199} {"train_loss": -27.358722686767578, "global_step": 514595, "epoch": 6199} {"train_loss": -26.99020767211914, "global_step": 514596, "epoch": 6199} {"train_loss": -27.586103439331055, "global_step": 514597, "epoch": 6199} {"train_loss": -27.34735107421875, "global_step": 514598, "epoch": 6199} {"train_loss": -27.115489316273884, "global_step": 514599, "epoch": 6199, "val_loss": 6650982.0} {"train_loss": -27.210302352905273, "global_step": 514600, "epoch": 6200} {"train_loss": -26.63418960571289, "global_step": 514601, "epoch": 6200} {"train_loss": -27.208044052124023, "global_step": 514602, "epoch": 6200} {"train_loss": -26.82782554626465, "global_step": 514603, "epoch": 6200} {"train_loss": -26.85369873046875, "global_step": 514604, "epoch": 6200} {"train_loss": -26.4285888671875, "global_step": 514605, "epoch": 6200} {"train_loss": -26.219039916992188, "global_step": 514606, "epoch": 6200} {"train_loss": -27.029455184936523, "global_step": 514607, "epoch": 6200} {"train_loss": -27.13205337524414, "global_step": 514608, "epoch": 6200} {"train_loss": -26.928298950195312, "global_step": 514609, "epoch": 6200} {"train_loss": -26.59613609313965, "global_step": 514610, "epoch": 6200} {"train_loss": -26.93097496032715, "global_step": 514611, "epoch": 6200} {"train_loss": -27.0887393951416, "global_step": 514612, "epoch": 6200} {"train_loss": -27.383581161499023, "global_step": 514613, "epoch": 6200} {"train_loss": -26.854049682617188, "global_step": 514614, "epoch": 6200} {"train_loss": -27.2399959564209, "global_step": 514615, "epoch": 6200} {"train_loss": -27.350967407226562, "global_step": 514616, "epoch": 6200} {"train_loss": -27.584857940673828, "global_step": 514617, "epoch": 6200} {"train_loss": -27.05588150024414, "global_step": 514618, "epoch": 6200} {"train_loss": -27.26287269592285, "global_step": 514619, "epoch": 6200} {"train_loss": -27.33234977722168, "global_step": 514620, "epoch": 6200} {"train_loss": -27.33744239807129, "global_step": 514621, "epoch": 6200} {"train_loss": -27.24995231628418, "global_step": 514622, "epoch": 6200} {"train_loss": -27.630903244018555, "global_step": 514623, "epoch": 6200} {"train_loss": -27.508136749267578, "global_step": 514624, "epoch": 6200} {"train_loss": -27.69025993347168, "global_step": 514625, "epoch": 6200} {"train_loss": -27.32136344909668, "global_step": 514626, "epoch": 6200} {"train_loss": -27.226804733276367, "global_step": 514627, "epoch": 6200} {"train_loss": -27.577844619750977, "global_step": 514628, "epoch": 6200} {"train_loss": -27.456750869750977, "global_step": 514629, "epoch": 6200} {"train_loss": -27.733667373657227, "global_step": 514630, "epoch": 6200} {"train_loss": -27.524045944213867, "global_step": 514631, "epoch": 6200} {"train_loss": -27.610721588134766, "global_step": 514632, "epoch": 6200} {"train_loss": -27.297195434570312, "global_step": 514633, "epoch": 6200} {"train_loss": -27.249292373657227, "global_step": 514634, "epoch": 6200} {"train_loss": -27.6608829498291, "global_step": 514635, "epoch": 6200} {"train_loss": -27.436880111694336, "global_step": 514636, "epoch": 6200} {"train_loss": -27.773944854736328, "global_step": 514637, "epoch": 6200} {"train_loss": -27.546239852905273, "global_step": 514638, "epoch": 6200} {"train_loss": -27.439401626586914, "global_step": 514639, "epoch": 6200} {"train_loss": -27.425561904907227, "global_step": 514640, "epoch": 6200} {"train_loss": -27.760400772094727, "global_step": 514641, "epoch": 6200} {"train_loss": -27.799346923828125, "global_step": 514642, "epoch": 6200} {"train_loss": -27.690216064453125, "global_step": 514643, "epoch": 6200} {"train_loss": -26.811689376831055, "global_step": 514644, "epoch": 6200} {"train_loss": -27.019519805908203, "global_step": 514645, "epoch": 6200} {"train_loss": -27.31829833984375, "global_step": 514646, "epoch": 6200} {"train_loss": -27.518522262573242, "global_step": 514647, "epoch": 6200} {"train_loss": -27.312545776367188, "global_step": 514648, "epoch": 6200} {"train_loss": -27.511499404907227, "global_step": 514649, "epoch": 6200} {"train_loss": -27.129409790039062, "global_step": 514650, "epoch": 6200} {"train_loss": -27.262008666992188, "global_step": 514651, "epoch": 6200} {"train_loss": -26.887304306030273, "global_step": 514652, "epoch": 6200} {"train_loss": -27.380691528320312, "global_step": 514653, "epoch": 6200} {"train_loss": -27.373193740844727, "global_step": 514654, "epoch": 6200} {"train_loss": -27.660511016845703, "global_step": 514655, "epoch": 6200} {"train_loss": -27.8586483001709, "global_step": 514656, "epoch": 6200} {"train_loss": -27.051849365234375, "global_step": 514657, "epoch": 6200} {"train_loss": -27.6744384765625, "global_step": 514658, "epoch": 6200} {"train_loss": -27.158588409423828, "global_step": 514659, "epoch": 6200} {"train_loss": -27.150487899780273, "global_step": 514660, "epoch": 6200} {"train_loss": -27.580341339111328, "global_step": 514661, "epoch": 6200} {"train_loss": -27.26509666442871, "global_step": 514662, "epoch": 6200} {"train_loss": -27.34393310546875, "global_step": 514663, "epoch": 6200} {"train_loss": -27.069971084594727, "global_step": 514664, "epoch": 6200} {"train_loss": -27.6325740814209, "global_step": 514665, "epoch": 6200} {"train_loss": -27.490406036376953, "global_step": 514666, "epoch": 6200} {"train_loss": -27.307647705078125, "global_step": 514667, "epoch": 6200} {"train_loss": -27.483505249023438, "global_step": 514668, "epoch": 6200} {"train_loss": -27.832345962524414, "global_step": 514669, "epoch": 6200} {"train_loss": -27.37883949279785, "global_step": 514670, "epoch": 6200} {"train_loss": -27.46085548400879, "global_step": 514671, "epoch": 6200} {"train_loss": -27.610126495361328, "global_step": 514672, "epoch": 6200} {"train_loss": -27.2462100982666, "global_step": 514673, "epoch": 6200} {"train_loss": -27.5524845123291, "global_step": 514674, "epoch": 6200} {"train_loss": -27.530963897705078, "global_step": 514675, "epoch": 6200} {"train_loss": -27.44276237487793, "global_step": 514676, "epoch": 6200} {"train_loss": -27.1842098236084, "global_step": 514677, "epoch": 6200} {"train_loss": -27.091527938842773, "global_step": 514678, "epoch": 6200} {"train_loss": -27.576202392578125, "global_step": 514679, "epoch": 6200} {"train_loss": -27.55805778503418, "global_step": 514680, "epoch": 6200} {"train_loss": -27.443273544311523, "global_step": 514681, "epoch": 6200} {"train_loss": -27.32168170055711, "global_step": 514682, "epoch": 6200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.7727272727272727, "val_loss": 6758921.0} {"train_loss": -25.8730525970459, "global_step": 514683, "epoch": 6201} {"train_loss": -25.84113883972168, "global_step": 514684, "epoch": 6201} {"train_loss": -26.059803009033203, "global_step": 514685, "epoch": 6201} {"train_loss": -26.626636505126953, "global_step": 514686, "epoch": 6201} {"train_loss": -26.302265167236328, "global_step": 514687, "epoch": 6201} {"train_loss": -25.965784072875977, "global_step": 514688, "epoch": 6201} {"train_loss": -26.429859161376953, "global_step": 514689, "epoch": 6201} {"train_loss": -26.253149032592773, "global_step": 514690, "epoch": 6201} {"train_loss": -26.755033493041992, "global_step": 514691, "epoch": 6201} {"train_loss": -26.351154327392578, "global_step": 514692, "epoch": 6201} {"train_loss": -26.7194881439209, "global_step": 514693, "epoch": 6201} {"train_loss": -26.69227409362793, "global_step": 514694, "epoch": 6201} {"train_loss": -26.333356857299805, "global_step": 514695, "epoch": 6201} {"train_loss": -26.823694229125977, "global_step": 514696, "epoch": 6201} {"train_loss": -26.5841064453125, "global_step": 514697, "epoch": 6201} {"train_loss": -27.273147583007812, "global_step": 514698, "epoch": 6201} {"train_loss": -26.809553146362305, "global_step": 514699, "epoch": 6201} {"train_loss": -26.569686889648438, "global_step": 514700, "epoch": 6201} {"train_loss": -26.67207145690918, "global_step": 514701, "epoch": 6201} {"train_loss": -26.912057876586914, "global_step": 514702, "epoch": 6201} {"train_loss": -26.709747314453125, "global_step": 514703, "epoch": 6201} {"train_loss": -26.747486114501953, "global_step": 514704, "epoch": 6201} {"train_loss": -27.235387802124023, "global_step": 514705, "epoch": 6201} {"train_loss": -26.86344337463379, "global_step": 514706, "epoch": 6201} {"train_loss": -27.22528648376465, "global_step": 514707, "epoch": 6201} {"train_loss": -26.93230628967285, "global_step": 514708, "epoch": 6201} {"train_loss": -27.01466178894043, "global_step": 514709, "epoch": 6201} {"train_loss": -27.277820587158203, "global_step": 514710, "epoch": 6201} {"train_loss": -27.122913360595703, "global_step": 514711, "epoch": 6201} {"train_loss": -27.282657623291016, "global_step": 514712, "epoch": 6201} {"train_loss": -27.321985244750977, "global_step": 514713, "epoch": 6201} {"train_loss": -27.30109977722168, "global_step": 514714, "epoch": 6201} {"train_loss": -27.37860679626465, "global_step": 514715, "epoch": 6201} {"train_loss": -27.30897331237793, "global_step": 514716, "epoch": 6201} {"train_loss": -27.42803955078125, "global_step": 514717, "epoch": 6201} {"train_loss": -27.35328483581543, "global_step": 514718, "epoch": 6201} {"train_loss": -27.444915771484375, "global_step": 514719, "epoch": 6201} {"train_loss": -27.305164337158203, "global_step": 514720, "epoch": 6201} {"train_loss": -27.5291690826416, "global_step": 514721, "epoch": 6201} {"train_loss": -27.580020904541016, "global_step": 514722, "epoch": 6201} {"train_loss": -27.332250595092773, "global_step": 514723, "epoch": 6201} {"train_loss": -28.147327423095703, "global_step": 514724, "epoch": 6201} {"train_loss": -27.807693481445312, "global_step": 514725, "epoch": 6201} {"train_loss": -27.55484390258789, "global_step": 514726, "epoch": 6201} {"train_loss": -27.73859977722168, "global_step": 514727, "epoch": 6201} {"train_loss": -27.281957626342773, "global_step": 514728, "epoch": 6201} {"train_loss": -27.598541259765625, "global_step": 514729, "epoch": 6201} {"train_loss": -27.739395141601562, "global_step": 514730, "epoch": 6201} {"train_loss": -27.647445678710938, "global_step": 514731, "epoch": 6201} {"train_loss": -27.873870849609375, "global_step": 514732, "epoch": 6201} {"train_loss": -27.729612350463867, "global_step": 514733, "epoch": 6201} {"train_loss": -27.244617462158203, "global_step": 514734, "epoch": 6201} {"train_loss": -27.8769474029541, "global_step": 514735, "epoch": 6201} {"train_loss": -27.894407272338867, "global_step": 514736, "epoch": 6201} {"train_loss": -27.30475425720215, "global_step": 514737, "epoch": 6201} {"train_loss": -27.63344383239746, "global_step": 514738, "epoch": 6201} {"train_loss": -27.82380485534668, "global_step": 514739, "epoch": 6201} {"train_loss": -28.232507705688477, "global_step": 514740, "epoch": 6201} {"train_loss": -27.630483627319336, "global_step": 514741, "epoch": 6201} {"train_loss": -27.900232315063477, "global_step": 514742, "epoch": 6201} {"train_loss": -27.83289909362793, "global_step": 514743, "epoch": 6201} {"train_loss": -27.603900909423828, "global_step": 514744, "epoch": 6201} {"train_loss": -27.8244571685791, "global_step": 514745, "epoch": 6201} {"train_loss": -27.5889949798584, "global_step": 514746, "epoch": 6201} {"train_loss": -27.587621688842773, "global_step": 514747, "epoch": 6201} {"train_loss": -27.252384185791016, "global_step": 514748, "epoch": 6201} {"train_loss": -27.874841690063477, "global_step": 514749, "epoch": 6201} {"train_loss": -27.488285064697266, "global_step": 514750, "epoch": 6201} {"train_loss": -27.713537216186523, "global_step": 514751, "epoch": 6201} {"train_loss": -27.783849716186523, "global_step": 514752, "epoch": 6201} {"train_loss": -27.504636764526367, "global_step": 514753, "epoch": 6201} {"train_loss": -27.96123695373535, "global_step": 514754, "epoch": 6201} {"train_loss": -27.76691246032715, "global_step": 514755, "epoch": 6201} {"train_loss": -27.88190269470215, "global_step": 514756, "epoch": 6201} {"train_loss": -27.63486099243164, "global_step": 514757, "epoch": 6201} {"train_loss": -26.682647705078125, "global_step": 514758, "epoch": 6201} {"train_loss": -26.902292251586914, "global_step": 514759, "epoch": 6201} {"train_loss": -27.79751968383789, "global_step": 514760, "epoch": 6201} {"train_loss": -27.312469482421875, "global_step": 514761, "epoch": 6201} {"train_loss": -27.74480628967285, "global_step": 514762, "epoch": 6201} {"train_loss": -27.566953659057617, "global_step": 514763, "epoch": 6201} {"train_loss": -27.521860122680664, "global_step": 514764, "epoch": 6201} {"train_loss": -27.252576115619707, "global_step": 514765, "epoch": 6201, "val_loss": 6632318.0} {"train_loss": -27.07633399963379, "global_step": 514766, "epoch": 6202} {"train_loss": -26.178266525268555, "global_step": 514767, "epoch": 6202} {"train_loss": -26.247831344604492, "global_step": 514768, "epoch": 6202} {"train_loss": -26.70881462097168, "global_step": 514769, "epoch": 6202} {"train_loss": -27.281848907470703, "global_step": 514770, "epoch": 6202} {"train_loss": -26.690555572509766, "global_step": 514771, "epoch": 6202} {"train_loss": -27.051218032836914, "global_step": 514772, "epoch": 6202} {"train_loss": -26.8911075592041, "global_step": 514773, "epoch": 6202} {"train_loss": -26.531606674194336, "global_step": 514774, "epoch": 6202} {"train_loss": -27.562620162963867, "global_step": 514775, "epoch": 6202} {"train_loss": -26.84931755065918, "global_step": 514776, "epoch": 6202} {"train_loss": -27.35235023498535, "global_step": 514777, "epoch": 6202} {"train_loss": -27.01979637145996, "global_step": 514778, "epoch": 6202} {"train_loss": -26.63422966003418, "global_step": 514779, "epoch": 6202} {"train_loss": -27.53862953186035, "global_step": 514780, "epoch": 6202} {"train_loss": -26.851659774780273, "global_step": 514781, "epoch": 6202} {"train_loss": -26.899442672729492, "global_step": 514782, "epoch": 6202} {"train_loss": -26.718582153320312, "global_step": 514783, "epoch": 6202} {"train_loss": -27.053449630737305, "global_step": 514784, "epoch": 6202} {"train_loss": -27.073944091796875, "global_step": 514785, "epoch": 6202} {"train_loss": -27.036828994750977, "global_step": 514786, "epoch": 6202} {"train_loss": -26.96840476989746, "global_step": 514787, "epoch": 6202} {"train_loss": -26.82337760925293, "global_step": 514788, "epoch": 6202} {"train_loss": -27.2271671295166, "global_step": 514789, "epoch": 6202} {"train_loss": -27.201223373413086, "global_step": 514790, "epoch": 6202} {"train_loss": -27.146326065063477, "global_step": 514791, "epoch": 6202} {"train_loss": -27.425634384155273, "global_step": 514792, "epoch": 6202} {"train_loss": -27.002552032470703, "global_step": 514793, "epoch": 6202} {"train_loss": -27.611923217773438, "global_step": 514794, "epoch": 6202} {"train_loss": -27.18177604675293, "global_step": 514795, "epoch": 6202} {"train_loss": -27.4238224029541, "global_step": 514796, "epoch": 6202} {"train_loss": -27.58477783203125, "global_step": 514797, "epoch": 6202} {"train_loss": -27.538217544555664, "global_step": 514798, "epoch": 6202} {"train_loss": -27.604812622070312, "global_step": 514799, "epoch": 6202} {"train_loss": -27.375232696533203, "global_step": 514800, "epoch": 6202} {"train_loss": -27.612146377563477, "global_step": 514801, "epoch": 6202} {"train_loss": -27.81402587890625, "global_step": 514802, "epoch": 6202} {"train_loss": -27.654205322265625, "global_step": 514803, "epoch": 6202} {"train_loss": -27.476226806640625, "global_step": 514804, "epoch": 6202} {"train_loss": -27.582239151000977, "global_step": 514805, "epoch": 6202} {"train_loss": -27.954069137573242, "global_step": 514806, "epoch": 6202} {"train_loss": -27.759241104125977, "global_step": 514807, "epoch": 6202} {"train_loss": -27.983673095703125, "global_step": 514808, "epoch": 6202} {"train_loss": -27.424917221069336, "global_step": 514809, "epoch": 6202} {"train_loss": -27.614160537719727, "global_step": 514810, "epoch": 6202} {"train_loss": -28.06168556213379, "global_step": 514811, "epoch": 6202} {"train_loss": -27.503087997436523, "global_step": 514812, "epoch": 6202} {"train_loss": -27.72609519958496, "global_step": 514813, "epoch": 6202} {"train_loss": -27.6755428314209, "global_step": 514814, "epoch": 6202} {"train_loss": -27.754852294921875, "global_step": 514815, "epoch": 6202} {"train_loss": -27.72894859313965, "global_step": 514816, "epoch": 6202} {"train_loss": -27.686304092407227, "global_step": 514817, "epoch": 6202} {"train_loss": -27.77320671081543, "global_step": 514818, "epoch": 6202} {"train_loss": -27.652536392211914, "global_step": 514819, "epoch": 6202} {"train_loss": -27.57931900024414, "global_step": 514820, "epoch": 6202} {"train_loss": -27.49822425842285, "global_step": 514821, "epoch": 6202} {"train_loss": -27.455408096313477, "global_step": 514822, "epoch": 6202} {"train_loss": -27.925922393798828, "global_step": 514823, "epoch": 6202} {"train_loss": -27.285846710205078, "global_step": 514824, "epoch": 6202} {"train_loss": -27.40467643737793, "global_step": 514825, "epoch": 6202} {"train_loss": -27.49492835998535, "global_step": 514826, "epoch": 6202} {"train_loss": -27.43061637878418, "global_step": 514827, "epoch": 6202} {"train_loss": -27.827295303344727, "global_step": 514828, "epoch": 6202} {"train_loss": -27.4575138092041, "global_step": 514829, "epoch": 6202} {"train_loss": -27.057355880737305, "global_step": 514830, "epoch": 6202} {"train_loss": -27.73463249206543, "global_step": 514831, "epoch": 6202} {"train_loss": -27.199176788330078, "global_step": 514832, "epoch": 6202} {"train_loss": -27.621906280517578, "global_step": 514833, "epoch": 6202} {"train_loss": -27.505578994750977, "global_step": 514834, "epoch": 6202} {"train_loss": -27.4477596282959, "global_step": 514835, "epoch": 6202} {"train_loss": -27.47895622253418, "global_step": 514836, "epoch": 6202} {"train_loss": -27.0185604095459, "global_step": 514837, "epoch": 6202} {"train_loss": -27.09799575805664, "global_step": 514838, "epoch": 6202} {"train_loss": -26.89777183532715, "global_step": 514839, "epoch": 6202} {"train_loss": -27.26287841796875, "global_step": 514840, "epoch": 6202} {"train_loss": -27.303598403930664, "global_step": 514841, "epoch": 6202} {"train_loss": -27.475345611572266, "global_step": 514842, "epoch": 6202} {"train_loss": -27.348114013671875, "global_step": 514843, "epoch": 6202} {"train_loss": -27.30289649963379, "global_step": 514844, "epoch": 6202} {"train_loss": -27.40829849243164, "global_step": 514845, "epoch": 6202} {"train_loss": -27.6937198638916, "global_step": 514846, "epoch": 6202} {"train_loss": -27.193832397460938, "global_step": 514847, "epoch": 6202} {"train_loss": -27.345577423831067, "global_step": 514848, "epoch": 6202, "val_loss": 6611264.0} {"train_loss": -26.85321617126465, "global_step": 514849, "epoch": 6203} {"train_loss": -26.658796310424805, "global_step": 514850, "epoch": 6203} {"train_loss": -26.85377311706543, "global_step": 514851, "epoch": 6203} {"train_loss": -26.804080963134766, "global_step": 514852, "epoch": 6203} {"train_loss": -27.007726669311523, "global_step": 514853, "epoch": 6203} {"train_loss": -26.76983070373535, "global_step": 514854, "epoch": 6203} {"train_loss": -27.239049911499023, "global_step": 514855, "epoch": 6203} {"train_loss": -27.071401596069336, "global_step": 514856, "epoch": 6203} {"train_loss": -27.199209213256836, "global_step": 514857, "epoch": 6203} {"train_loss": -27.136693954467773, "global_step": 514858, "epoch": 6203} {"train_loss": -27.378202438354492, "global_step": 514859, "epoch": 6203} {"train_loss": -26.8900146484375, "global_step": 514860, "epoch": 6203} {"train_loss": -27.060749053955078, "global_step": 514861, "epoch": 6203} {"train_loss": -26.571731567382812, "global_step": 514862, "epoch": 6203} {"train_loss": -27.071002960205078, "global_step": 514863, "epoch": 6203} {"train_loss": -27.02264404296875, "global_step": 514864, "epoch": 6203} {"train_loss": -27.42376708984375, "global_step": 514865, "epoch": 6203} {"train_loss": -27.327869415283203, "global_step": 514866, "epoch": 6203} {"train_loss": -27.23748779296875, "global_step": 514867, "epoch": 6203} {"train_loss": -27.5548095703125, "global_step": 514868, "epoch": 6203} {"train_loss": -26.996000289916992, "global_step": 514869, "epoch": 6203} {"train_loss": -27.114490509033203, "global_step": 514870, "epoch": 6203} {"train_loss": -26.804492950439453, "global_step": 514871, "epoch": 6203} {"train_loss": -27.158191680908203, "global_step": 514872, "epoch": 6203} {"train_loss": -27.535062789916992, "global_step": 514873, "epoch": 6203} {"train_loss": -27.154953002929688, "global_step": 514874, "epoch": 6203} {"train_loss": -27.04791831970215, "global_step": 514875, "epoch": 6203} {"train_loss": -27.042316436767578, "global_step": 514876, "epoch": 6203} {"train_loss": -27.129871368408203, "global_step": 514877, "epoch": 6203} {"train_loss": -27.311420440673828, "global_step": 514878, "epoch": 6203} {"train_loss": -27.314285278320312, "global_step": 514879, "epoch": 6203} {"train_loss": -27.374256134033203, "global_step": 514880, "epoch": 6203} {"train_loss": -27.6939697265625, "global_step": 514881, "epoch": 6203} {"train_loss": -27.51145362854004, "global_step": 514882, "epoch": 6203} {"train_loss": -27.470014572143555, "global_step": 514883, "epoch": 6203} {"train_loss": -27.422607421875, "global_step": 514884, "epoch": 6203} {"train_loss": -27.612537384033203, "global_step": 514885, "epoch": 6203} {"train_loss": -27.380786895751953, "global_step": 514886, "epoch": 6203} {"train_loss": -27.982563018798828, "global_step": 514887, "epoch": 6203} {"train_loss": -27.332136154174805, "global_step": 514888, "epoch": 6203} {"train_loss": -27.602970123291016, "global_step": 514889, "epoch": 6203} {"train_loss": -26.88400650024414, "global_step": 514890, "epoch": 6203} {"train_loss": -27.004621505737305, "global_step": 514891, "epoch": 6203} {"train_loss": -27.288806915283203, "global_step": 514892, "epoch": 6203} {"train_loss": -27.74684715270996, "global_step": 514893, "epoch": 6203} {"train_loss": -27.406845092773438, "global_step": 514894, "epoch": 6203} {"train_loss": -27.506338119506836, "global_step": 514895, "epoch": 6203} {"train_loss": -27.708215713500977, "global_step": 514896, "epoch": 6203} {"train_loss": -27.858457565307617, "global_step": 514897, "epoch": 6203} {"train_loss": -27.722553253173828, "global_step": 514898, "epoch": 6203} {"train_loss": -27.6965389251709, "global_step": 514899, "epoch": 6203} {"train_loss": -27.6805362701416, "global_step": 514900, "epoch": 6203} {"train_loss": -27.38673210144043, "global_step": 514901, "epoch": 6203} {"train_loss": -27.413293838500977, "global_step": 514902, "epoch": 6203} {"train_loss": -27.71803855895996, "global_step": 514903, "epoch": 6203} {"train_loss": -27.558008193969727, "global_step": 514904, "epoch": 6203} {"train_loss": -27.8763484954834, "global_step": 514905, "epoch": 6203} {"train_loss": -27.57545280456543, "global_step": 514906, "epoch": 6203} {"train_loss": -27.936614990234375, "global_step": 514907, "epoch": 6203} {"train_loss": -27.96053123474121, "global_step": 514908, "epoch": 6203} {"train_loss": -27.6639404296875, "global_step": 514909, "epoch": 6203} {"train_loss": -27.71429443359375, "global_step": 514910, "epoch": 6203} {"train_loss": -27.872068405151367, "global_step": 514911, "epoch": 6203} {"train_loss": -27.656152725219727, "global_step": 514912, "epoch": 6203} {"train_loss": -27.68503189086914, "global_step": 514913, "epoch": 6203} {"train_loss": -27.625341415405273, "global_step": 514914, "epoch": 6203} {"train_loss": -27.903919219970703, "global_step": 514915, "epoch": 6203} {"train_loss": -27.726598739624023, "global_step": 514916, "epoch": 6203} {"train_loss": -27.788101196289062, "global_step": 514917, "epoch": 6203} {"train_loss": -28.048559188842773, "global_step": 514918, "epoch": 6203} {"train_loss": -27.899091720581055, "global_step": 514919, "epoch": 6203} {"train_loss": -27.47202491760254, "global_step": 514920, "epoch": 6203} {"train_loss": -27.606306076049805, "global_step": 514921, "epoch": 6203} {"train_loss": -27.539655685424805, "global_step": 514922, "epoch": 6203} {"train_loss": -27.524290084838867, "global_step": 514923, "epoch": 6203} {"train_loss": -27.32508659362793, "global_step": 514924, "epoch": 6203} {"train_loss": -27.355703353881836, "global_step": 514925, "epoch": 6203} {"train_loss": -27.25897789001465, "global_step": 514926, "epoch": 6203} {"train_loss": -26.577539443969727, "global_step": 514927, "epoch": 6203} {"train_loss": -26.376235961914062, "global_step": 514928, "epoch": 6203} {"train_loss": -26.925588607788086, "global_step": 514929, "epoch": 6203} {"train_loss": -27.745641708374023, "global_step": 514930, "epoch": 6203} {"train_loss": -27.37982333999082, "global_step": 514931, "epoch": 6203, "val_loss": 6629894.5} {"train_loss": -26.104263305664062, "global_step": 514932, "epoch": 6204} {"train_loss": -25.914234161376953, "global_step": 514933, "epoch": 6204} {"train_loss": -26.454736709594727, "global_step": 514934, "epoch": 6204} {"train_loss": -26.078824996948242, "global_step": 514935, "epoch": 6204} {"train_loss": -26.45212173461914, "global_step": 514936, "epoch": 6204} {"train_loss": -26.436853408813477, "global_step": 514937, "epoch": 6204} {"train_loss": -26.6851863861084, "global_step": 514938, "epoch": 6204} {"train_loss": -26.809711456298828, "global_step": 514939, "epoch": 6204} {"train_loss": -26.798019409179688, "global_step": 514940, "epoch": 6204} {"train_loss": -26.55145835876465, "global_step": 514941, "epoch": 6204} {"train_loss": -26.763229370117188, "global_step": 514942, "epoch": 6204} {"train_loss": -27.106571197509766, "global_step": 514943, "epoch": 6204} {"train_loss": -26.986974716186523, "global_step": 514944, "epoch": 6204} {"train_loss": -26.969924926757812, "global_step": 514945, "epoch": 6204} {"train_loss": -26.862167358398438, "global_step": 514946, "epoch": 6204} {"train_loss": -27.08408546447754, "global_step": 514947, "epoch": 6204} {"train_loss": -27.309131622314453, "global_step": 514948, "epoch": 6204} {"train_loss": -27.0069580078125, "global_step": 514949, "epoch": 6204} {"train_loss": -27.13852310180664, "global_step": 514950, "epoch": 6204} {"train_loss": -26.880796432495117, "global_step": 514951, "epoch": 6204} {"train_loss": -26.918182373046875, "global_step": 514952, "epoch": 6204} {"train_loss": -26.897785186767578, "global_step": 514953, "epoch": 6204} {"train_loss": -27.561050415039062, "global_step": 514954, "epoch": 6204} {"train_loss": -26.960342407226562, "global_step": 514955, "epoch": 6204} {"train_loss": -27.280841827392578, "global_step": 514956, "epoch": 6204} {"train_loss": -27.47764015197754, "global_step": 514957, "epoch": 6204} {"train_loss": -27.60154151916504, "global_step": 514958, "epoch": 6204} {"train_loss": -27.54121208190918, "global_step": 514959, "epoch": 6204} {"train_loss": -27.443140029907227, "global_step": 514960, "epoch": 6204} {"train_loss": -27.32014274597168, "global_step": 514961, "epoch": 6204} {"train_loss": -27.263233184814453, "global_step": 514962, "epoch": 6204} {"train_loss": -27.565082550048828, "global_step": 514963, "epoch": 6204} {"train_loss": -27.45289421081543, "global_step": 514964, "epoch": 6204} {"train_loss": -27.487884521484375, "global_step": 514965, "epoch": 6204} {"train_loss": -27.524667739868164, "global_step": 514966, "epoch": 6204} {"train_loss": -27.575122833251953, "global_step": 514967, "epoch": 6204} {"train_loss": -27.601404190063477, "global_step": 514968, "epoch": 6204} {"train_loss": -27.932111740112305, "global_step": 514969, "epoch": 6204} {"train_loss": -27.454452514648438, "global_step": 514970, "epoch": 6204} {"train_loss": -27.473480224609375, "global_step": 514971, "epoch": 6204} {"train_loss": -27.368457794189453, "global_step": 514972, "epoch": 6204} {"train_loss": -27.712385177612305, "global_step": 514973, "epoch": 6204} {"train_loss": -27.646469116210938, "global_step": 514974, "epoch": 6204} {"train_loss": -27.484792709350586, "global_step": 514975, "epoch": 6204} {"train_loss": -27.31802749633789, "global_step": 514976, "epoch": 6204} {"train_loss": -27.433515548706055, "global_step": 514977, "epoch": 6204} {"train_loss": -27.82150650024414, "global_step": 514978, "epoch": 6204} {"train_loss": -27.428165435791016, "global_step": 514979, "epoch": 6204} {"train_loss": -27.78597068786621, "global_step": 514980, "epoch": 6204} {"train_loss": -27.541101455688477, "global_step": 514981, "epoch": 6204} {"train_loss": -27.61591911315918, "global_step": 514982, "epoch": 6204} {"train_loss": -27.856603622436523, "global_step": 514983, "epoch": 6204} {"train_loss": -27.623767852783203, "global_step": 514984, "epoch": 6204} {"train_loss": -27.683917999267578, "global_step": 514985, "epoch": 6204} {"train_loss": -27.58888816833496, "global_step": 514986, "epoch": 6204} {"train_loss": -27.400842666625977, "global_step": 514987, "epoch": 6204} {"train_loss": -27.439685821533203, "global_step": 514988, "epoch": 6204} {"train_loss": -27.80352783203125, "global_step": 514989, "epoch": 6204} {"train_loss": -27.887853622436523, "global_step": 514990, "epoch": 6204} {"train_loss": -27.43106460571289, "global_step": 514991, "epoch": 6204} {"train_loss": -27.455841064453125, "global_step": 514992, "epoch": 6204} {"train_loss": -27.297088623046875, "global_step": 514993, "epoch": 6204} {"train_loss": -27.5425968170166, "global_step": 514994, "epoch": 6204} {"train_loss": -27.569040298461914, "global_step": 514995, "epoch": 6204} {"train_loss": -28.21223258972168, "global_step": 514996, "epoch": 6204} {"train_loss": -27.700769424438477, "global_step": 514997, "epoch": 6204} {"train_loss": -27.40217399597168, "global_step": 514998, "epoch": 6204} {"train_loss": -27.041217803955078, "global_step": 514999, "epoch": 6204} {"train_loss": -26.962284088134766, "global_step": 515000, "epoch": 6204} {"train_loss": -26.9864501953125, "global_step": 515001, "epoch": 6204} {"train_loss": -27.313032150268555, "global_step": 515002, "epoch": 6204} {"train_loss": -27.41310691833496, "global_step": 515003, "epoch": 6204} {"train_loss": -27.34381675720215, "global_step": 515004, "epoch": 6204} {"train_loss": -27.40907096862793, "global_step": 515005, "epoch": 6204} {"train_loss": -27.134241104125977, "global_step": 515006, "epoch": 6204} {"train_loss": -27.45255470275879, "global_step": 515007, "epoch": 6204} {"train_loss": -27.614561080932617, "global_step": 515008, "epoch": 6204} {"train_loss": -27.633697509765625, "global_step": 515009, "epoch": 6204} {"train_loss": -27.40473747253418, "global_step": 515010, "epoch": 6204} {"train_loss": -27.404132843017578, "global_step": 515011, "epoch": 6204} {"train_loss": -27.444128036499023, "global_step": 515012, "epoch": 6204} {"train_loss": -27.087921142578125, "global_step": 515013, "epoch": 6204} {"train_loss": -27.28688019442271, "global_step": 515014, "epoch": 6204, "val_loss": 6639837.0} {"train_loss": -27.11374855041504, "global_step": 515015, "epoch": 6205} {"train_loss": -27.0165958404541, "global_step": 515016, "epoch": 6205} {"train_loss": -27.53547477722168, "global_step": 515017, "epoch": 6205} {"train_loss": -27.278106689453125, "global_step": 515018, "epoch": 6205} {"train_loss": -27.0821590423584, "global_step": 515019, "epoch": 6205} {"train_loss": -27.160444259643555, "global_step": 515020, "epoch": 6205} {"train_loss": -27.179563522338867, "global_step": 515021, "epoch": 6205} {"train_loss": -27.276763916015625, "global_step": 515022, "epoch": 6205} {"train_loss": -27.236988067626953, "global_step": 515023, "epoch": 6205} {"train_loss": -27.11680030822754, "global_step": 515024, "epoch": 6205} {"train_loss": -27.642730712890625, "global_step": 515025, "epoch": 6205} {"train_loss": -27.49794578552246, "global_step": 515026, "epoch": 6205} {"train_loss": -27.5093994140625, "global_step": 515027, "epoch": 6205} {"train_loss": -27.27276039123535, "global_step": 515028, "epoch": 6205} {"train_loss": -27.740497589111328, "global_step": 515029, "epoch": 6205} {"train_loss": -27.36640739440918, "global_step": 515030, "epoch": 6205} {"train_loss": -27.32076072692871, "global_step": 515031, "epoch": 6205} {"train_loss": -27.47772216796875, "global_step": 515032, "epoch": 6205} {"train_loss": -27.47126579284668, "global_step": 515033, "epoch": 6205} {"train_loss": -27.225513458251953, "global_step": 515034, "epoch": 6205} {"train_loss": -27.67339515686035, "global_step": 515035, "epoch": 6205} {"train_loss": -27.193456649780273, "global_step": 515036, "epoch": 6205} {"train_loss": -27.759496688842773, "global_step": 515037, "epoch": 6205} {"train_loss": -27.446447372436523, "global_step": 515038, "epoch": 6205} {"train_loss": -27.25664710998535, "global_step": 515039, "epoch": 6205} {"train_loss": -27.491500854492188, "global_step": 515040, "epoch": 6205} {"train_loss": -27.26318359375, "global_step": 515041, "epoch": 6205} {"train_loss": -27.361616134643555, "global_step": 515042, "epoch": 6205} {"train_loss": -27.50874137878418, "global_step": 515043, "epoch": 6205} {"train_loss": -27.517200469970703, "global_step": 515044, "epoch": 6205} {"train_loss": -27.357995986938477, "global_step": 515045, "epoch": 6205} {"train_loss": -27.463281631469727, "global_step": 515046, "epoch": 6205} {"train_loss": -27.24761390686035, "global_step": 515047, "epoch": 6205} {"train_loss": -27.754770278930664, "global_step": 515048, "epoch": 6205} {"train_loss": -27.204010009765625, "global_step": 515049, "epoch": 6205} {"train_loss": -27.512113571166992, "global_step": 515050, "epoch": 6205} {"train_loss": -27.612699508666992, "global_step": 515051, "epoch": 6205} {"train_loss": -27.21241569519043, "global_step": 515052, "epoch": 6205} {"train_loss": -27.479358673095703, "global_step": 515053, "epoch": 6205} {"train_loss": -28.072843551635742, "global_step": 515054, "epoch": 6205} {"train_loss": -27.387327194213867, "global_step": 515055, "epoch": 6205} {"train_loss": -27.778539657592773, "global_step": 515056, "epoch": 6205} {"train_loss": -27.425683975219727, "global_step": 515057, "epoch": 6205} {"train_loss": -27.791223526000977, "global_step": 515058, "epoch": 6205} {"train_loss": -27.435199737548828, "global_step": 515059, "epoch": 6205} {"train_loss": -27.40401268005371, "global_step": 515060, "epoch": 6205} {"train_loss": -27.57826805114746, "global_step": 515061, "epoch": 6205} {"train_loss": -27.99827003479004, "global_step": 515062, "epoch": 6205} {"train_loss": -27.306665420532227, "global_step": 515063, "epoch": 6205} {"train_loss": -27.482852935791016, "global_step": 515064, "epoch": 6205} {"train_loss": -26.756668090820312, "global_step": 515065, "epoch": 6205} {"train_loss": -27.819110870361328, "global_step": 515066, "epoch": 6205} {"train_loss": -27.26582908630371, "global_step": 515067, "epoch": 6205} {"train_loss": -27.71552848815918, "global_step": 515068, "epoch": 6205} {"train_loss": -27.068124771118164, "global_step": 515069, "epoch": 6205} {"train_loss": -27.529592514038086, "global_step": 515070, "epoch": 6205} {"train_loss": -27.233856201171875, "global_step": 515071, "epoch": 6205} {"train_loss": -27.782276153564453, "global_step": 515072, "epoch": 6205} {"train_loss": -27.635526657104492, "global_step": 515073, "epoch": 6205} {"train_loss": -27.511676788330078, "global_step": 515074, "epoch": 6205} {"train_loss": -27.669422149658203, "global_step": 515075, "epoch": 6205} {"train_loss": -27.30510902404785, "global_step": 515076, "epoch": 6205} {"train_loss": -27.558080673217773, "global_step": 515077, "epoch": 6205} {"train_loss": -27.730987548828125, "global_step": 515078, "epoch": 6205} {"train_loss": -27.844226837158203, "global_step": 515079, "epoch": 6205} {"train_loss": -27.676685333251953, "global_step": 515080, "epoch": 6205} {"train_loss": -27.870086669921875, "global_step": 515081, "epoch": 6205} {"train_loss": -27.72905921936035, "global_step": 515082, "epoch": 6205} {"train_loss": -27.712797164916992, "global_step": 515083, "epoch": 6205} {"train_loss": -27.602224349975586, "global_step": 515084, "epoch": 6205} {"train_loss": -27.728118896484375, "global_step": 515085, "epoch": 6205} {"train_loss": -27.413190841674805, "global_step": 515086, "epoch": 6205} {"train_loss": -27.40766716003418, "global_step": 515087, "epoch": 6205} {"train_loss": -27.569793701171875, "global_step": 515088, "epoch": 6205} {"train_loss": -27.515121459960938, "global_step": 515089, "epoch": 6205} {"train_loss": -27.757654190063477, "global_step": 515090, "epoch": 6205} {"train_loss": -27.461902618408203, "global_step": 515091, "epoch": 6205} {"train_loss": -27.326618194580078, "global_step": 515092, "epoch": 6205} {"train_loss": -27.613473892211914, "global_step": 515093, "epoch": 6205} {"train_loss": -27.204456329345703, "global_step": 515094, "epoch": 6205} {"train_loss": -27.57801628112793, "global_step": 515095, "epoch": 6205} {"train_loss": -27.413618087768555, "global_step": 515096, "epoch": 6205} {"train_loss": -27.46765658367111, "global_step": 515097, "epoch": 6205, "val_loss": 6643346.5} {"train_loss": -26.56488037109375, "global_step": 515098, "epoch": 6206} {"train_loss": -26.0770206451416, "global_step": 515099, "epoch": 6206} {"train_loss": -26.42571449279785, "global_step": 515100, "epoch": 6206} {"train_loss": -26.54176902770996, "global_step": 515101, "epoch": 6206} {"train_loss": -26.775390625, "global_step": 515102, "epoch": 6206} {"train_loss": -25.76978874206543, "global_step": 515103, "epoch": 6206} {"train_loss": -26.47565269470215, "global_step": 515104, "epoch": 6206} {"train_loss": -27.135669708251953, "global_step": 515105, "epoch": 6206} {"train_loss": -26.431299209594727, "global_step": 515106, "epoch": 6206} {"train_loss": -26.959583282470703, "global_step": 515107, "epoch": 6206} {"train_loss": -26.525449752807617, "global_step": 515108, "epoch": 6206} {"train_loss": -26.46107292175293, "global_step": 515109, "epoch": 6206} {"train_loss": -27.246295928955078, "global_step": 515110, "epoch": 6206} {"train_loss": -27.159393310546875, "global_step": 515111, "epoch": 6206} {"train_loss": -26.940643310546875, "global_step": 515112, "epoch": 6206} {"train_loss": -26.738492965698242, "global_step": 515113, "epoch": 6206} {"train_loss": -27.223407745361328, "global_step": 515114, "epoch": 6206} {"train_loss": -27.60752296447754, "global_step": 515115, "epoch": 6206} {"train_loss": -27.32684326171875, "global_step": 515116, "epoch": 6206} {"train_loss": -27.184667587280273, "global_step": 515117, "epoch": 6206} {"train_loss": -27.433149337768555, "global_step": 515118, "epoch": 6206} {"train_loss": -26.700529098510742, "global_step": 515119, "epoch": 6206} {"train_loss": -27.132375717163086, "global_step": 515120, "epoch": 6206} {"train_loss": -27.554540634155273, "global_step": 515121, "epoch": 6206} {"train_loss": -27.112396240234375, "global_step": 515122, "epoch": 6206} {"train_loss": -26.880725860595703, "global_step": 515123, "epoch": 6206} {"train_loss": -27.309707641601562, "global_step": 515124, "epoch": 6206} {"train_loss": -27.28440284729004, "global_step": 515125, "epoch": 6206} {"train_loss": -27.165241241455078, "global_step": 515126, "epoch": 6206} {"train_loss": -27.742889404296875, "global_step": 515127, "epoch": 6206} {"train_loss": -27.27256202697754, "global_step": 515128, "epoch": 6206} {"train_loss": -27.184391021728516, "global_step": 515129, "epoch": 6206} {"train_loss": -27.529218673706055, "global_step": 515130, "epoch": 6206} {"train_loss": -27.389257431030273, "global_step": 515131, "epoch": 6206} {"train_loss": -27.313440322875977, "global_step": 515132, "epoch": 6206} {"train_loss": -27.072635650634766, "global_step": 515133, "epoch": 6206} {"train_loss": -27.645048141479492, "global_step": 515134, "epoch": 6206} {"train_loss": -27.02685546875, "global_step": 515135, "epoch": 6206} {"train_loss": -27.206985473632812, "global_step": 515136, "epoch": 6206} {"train_loss": -27.569793701171875, "global_step": 515137, "epoch": 6206} {"train_loss": -27.647199630737305, "global_step": 515138, "epoch": 6206} {"train_loss": -27.453216552734375, "global_step": 515139, "epoch": 6206} {"train_loss": -27.36348533630371, "global_step": 515140, "epoch": 6206} {"train_loss": -27.398162841796875, "global_step": 515141, "epoch": 6206} {"train_loss": -27.29523277282715, "global_step": 515142, "epoch": 6206} {"train_loss": -27.6154842376709, "global_step": 515143, "epoch": 6206} {"train_loss": -27.375242233276367, "global_step": 515144, "epoch": 6206} {"train_loss": -27.123083114624023, "global_step": 515145, "epoch": 6206} {"train_loss": -27.5759334564209, "global_step": 515146, "epoch": 6206} {"train_loss": -27.722501754760742, "global_step": 515147, "epoch": 6206} {"train_loss": -27.44635581970215, "global_step": 515148, "epoch": 6206} {"train_loss": -27.51541519165039, "global_step": 515149, "epoch": 6206} {"train_loss": -27.94447135925293, "global_step": 515150, "epoch": 6206} {"train_loss": -27.63160514831543, "global_step": 515151, "epoch": 6206} {"train_loss": -27.06233024597168, "global_step": 515152, "epoch": 6206} {"train_loss": -26.99567222595215, "global_step": 515153, "epoch": 6206} {"train_loss": -26.93476676940918, "global_step": 515154, "epoch": 6206} {"train_loss": -27.668075561523438, "global_step": 515155, "epoch": 6206} {"train_loss": -26.5712890625, "global_step": 515156, "epoch": 6206} {"train_loss": -25.482318878173828, "global_step": 515157, "epoch": 6206} {"train_loss": -24.75641632080078, "global_step": 515158, "epoch": 6206} {"train_loss": -26.828662872314453, "global_step": 515159, "epoch": 6206} {"train_loss": -27.026330947875977, "global_step": 515160, "epoch": 6206} {"train_loss": -26.92791748046875, "global_step": 515161, "epoch": 6206} {"train_loss": -27.21567153930664, "global_step": 515162, "epoch": 6206} {"train_loss": -26.976978302001953, "global_step": 515163, "epoch": 6206} {"train_loss": -26.946313858032227, "global_step": 515164, "epoch": 6206} {"train_loss": -27.004932403564453, "global_step": 515165, "epoch": 6206} {"train_loss": -27.036535263061523, "global_step": 515166, "epoch": 6206} {"train_loss": -27.06551170349121, "global_step": 515167, "epoch": 6206} {"train_loss": -27.168045043945312, "global_step": 515168, "epoch": 6206} {"train_loss": -26.985837936401367, "global_step": 515169, "epoch": 6206} {"train_loss": -27.242919921875, "global_step": 515170, "epoch": 6206} {"train_loss": -27.61210060119629, "global_step": 515171, "epoch": 6206} {"train_loss": -26.9345645904541, "global_step": 515172, "epoch": 6206} {"train_loss": -26.965625762939453, "global_step": 515173, "epoch": 6206} {"train_loss": -27.463836669921875, "global_step": 515174, "epoch": 6206} {"train_loss": -27.20636558532715, "global_step": 515175, "epoch": 6206} {"train_loss": -27.13545036315918, "global_step": 515176, "epoch": 6206} {"train_loss": -27.503692626953125, "global_step": 515177, "epoch": 6206} {"train_loss": -27.0341739654541, "global_step": 515178, "epoch": 6206} {"train_loss": -27.19508934020996, "global_step": 515179, "epoch": 6206} {"train_loss": -27.09171876562647, "global_step": 515180, "epoch": 6206, "val_loss": 6561000.5} {"train_loss": -27.1212215423584, "global_step": 515181, "epoch": 6207} {"train_loss": -26.49004554748535, "global_step": 515182, "epoch": 6207} {"train_loss": -26.93473243713379, "global_step": 515183, "epoch": 6207} {"train_loss": -26.882246017456055, "global_step": 515184, "epoch": 6207} {"train_loss": -27.086301803588867, "global_step": 515185, "epoch": 6207} {"train_loss": -27.118915557861328, "global_step": 515186, "epoch": 6207} {"train_loss": -27.450164794921875, "global_step": 515187, "epoch": 6207} {"train_loss": -26.925912857055664, "global_step": 515188, "epoch": 6207} {"train_loss": -26.643966674804688, "global_step": 515189, "epoch": 6207} {"train_loss": -27.452911376953125, "global_step": 515190, "epoch": 6207} {"train_loss": -27.0039005279541, "global_step": 515191, "epoch": 6207} {"train_loss": -27.26787757873535, "global_step": 515192, "epoch": 6207} {"train_loss": -27.449743270874023, "global_step": 515193, "epoch": 6207} {"train_loss": -27.13503074645996, "global_step": 515194, "epoch": 6207} {"train_loss": -27.547163009643555, "global_step": 515195, "epoch": 6207} {"train_loss": -27.363922119140625, "global_step": 515196, "epoch": 6207} {"train_loss": -26.925846099853516, "global_step": 515197, "epoch": 6207} {"train_loss": -27.294504165649414, "global_step": 515198, "epoch": 6207} {"train_loss": -27.459156036376953, "global_step": 515199, "epoch": 6207} {"train_loss": -27.649194717407227, "global_step": 515200, "epoch": 6207} {"train_loss": -27.34810447692871, "global_step": 515201, "epoch": 6207} {"train_loss": -27.057941436767578, "global_step": 515202, "epoch": 6207} {"train_loss": -27.457386016845703, "global_step": 515203, "epoch": 6207} {"train_loss": -27.389179229736328, "global_step": 515204, "epoch": 6207} {"train_loss": -27.48624610900879, "global_step": 515205, "epoch": 6207} {"train_loss": -27.349151611328125, "global_step": 515206, "epoch": 6207} {"train_loss": -27.651355743408203, "global_step": 515207, "epoch": 6207} {"train_loss": -27.45600700378418, "global_step": 515208, "epoch": 6207} {"train_loss": -27.4144287109375, "global_step": 515209, "epoch": 6207} {"train_loss": -27.558624267578125, "global_step": 515210, "epoch": 6207} {"train_loss": -27.840545654296875, "global_step": 515211, "epoch": 6207} {"train_loss": -27.5670166015625, "global_step": 515212, "epoch": 6207} {"train_loss": -27.65736961364746, "global_step": 515213, "epoch": 6207} {"train_loss": -27.495101928710938, "global_step": 515214, "epoch": 6207} {"train_loss": -27.617502212524414, "global_step": 515215, "epoch": 6207} {"train_loss": -27.4427547454834, "global_step": 515216, "epoch": 6207} {"train_loss": -27.571271896362305, "global_step": 515217, "epoch": 6207} {"train_loss": -27.853208541870117, "global_step": 515218, "epoch": 6207} {"train_loss": -27.4321231842041, "global_step": 515219, "epoch": 6207} {"train_loss": -27.40955924987793, "global_step": 515220, "epoch": 6207} {"train_loss": -27.30171012878418, "global_step": 515221, "epoch": 6207} {"train_loss": -27.320667266845703, "global_step": 515222, "epoch": 6207} {"train_loss": -27.279699325561523, "global_step": 515223, "epoch": 6207} {"train_loss": -27.351886749267578, "global_step": 515224, "epoch": 6207} {"train_loss": -27.581125259399414, "global_step": 515225, "epoch": 6207} {"train_loss": -27.614093780517578, "global_step": 515226, "epoch": 6207} {"train_loss": -27.587848663330078, "global_step": 515227, "epoch": 6207} {"train_loss": -27.600452423095703, "global_step": 515228, "epoch": 6207} {"train_loss": -27.507522583007812, "global_step": 515229, "epoch": 6207} {"train_loss": -27.538223266601562, "global_step": 515230, "epoch": 6207} {"train_loss": -27.631885528564453, "global_step": 515231, "epoch": 6207} {"train_loss": -27.26434898376465, "global_step": 515232, "epoch": 6207} {"train_loss": -27.46133804321289, "global_step": 515233, "epoch": 6207} {"train_loss": -27.46854019165039, "global_step": 515234, "epoch": 6207} {"train_loss": -27.641265869140625, "global_step": 515235, "epoch": 6207} {"train_loss": -27.582077026367188, "global_step": 515236, "epoch": 6207} {"train_loss": -27.141342163085938, "global_step": 515237, "epoch": 6207} {"train_loss": -27.021926879882812, "global_step": 515238, "epoch": 6207} {"train_loss": -27.7340145111084, "global_step": 515239, "epoch": 6207} {"train_loss": -27.025915145874023, "global_step": 515240, "epoch": 6207} {"train_loss": -27.452838897705078, "global_step": 515241, "epoch": 6207} {"train_loss": -27.210163116455078, "global_step": 515242, "epoch": 6207} {"train_loss": -27.173847198486328, "global_step": 515243, "epoch": 6207} {"train_loss": -27.789941787719727, "global_step": 515244, "epoch": 6207} {"train_loss": -27.18134117126465, "global_step": 515245, "epoch": 6207} {"train_loss": -27.545026779174805, "global_step": 515246, "epoch": 6207} {"train_loss": -27.1461238861084, "global_step": 515247, "epoch": 6207} {"train_loss": -27.130578994750977, "global_step": 515248, "epoch": 6207} {"train_loss": -27.646268844604492, "global_step": 515249, "epoch": 6207} {"train_loss": -27.145483016967773, "global_step": 515250, "epoch": 6207} {"train_loss": -27.622678756713867, "global_step": 515251, "epoch": 6207} {"train_loss": -27.076642990112305, "global_step": 515252, "epoch": 6207} {"train_loss": -27.278295516967773, "global_step": 515253, "epoch": 6207} {"train_loss": -27.22369956970215, "global_step": 515254, "epoch": 6207} {"train_loss": -27.121540069580078, "global_step": 515255, "epoch": 6207} {"train_loss": -27.541650772094727, "global_step": 515256, "epoch": 6207} {"train_loss": -27.453907012939453, "global_step": 515257, "epoch": 6207} {"train_loss": -27.612531661987305, "global_step": 515258, "epoch": 6207} {"train_loss": -27.49749183654785, "global_step": 515259, "epoch": 6207} {"train_loss": -26.955276489257812, "global_step": 515260, "epoch": 6207} {"train_loss": -27.556320190429688, "global_step": 515261, "epoch": 6207} {"train_loss": -27.487165451049805, "global_step": 515262, "epoch": 6207} {"train_loss": -27.351536923144238, "global_step": 515263, "epoch": 6207, "val_loss": 6515688.0} {"train_loss": -24.79034423828125, "global_step": 515264, "epoch": 6208} {"train_loss": -23.06332778930664, "global_step": 515265, "epoch": 6208} {"train_loss": -26.0086612701416, "global_step": 515266, "epoch": 6208} {"train_loss": -26.204639434814453, "global_step": 515267, "epoch": 6208} {"train_loss": -25.26173210144043, "global_step": 515268, "epoch": 6208} {"train_loss": -26.708282470703125, "global_step": 515269, "epoch": 6208} {"train_loss": -26.159208297729492, "global_step": 515270, "epoch": 6208} {"train_loss": -26.1401309967041, "global_step": 515271, "epoch": 6208} {"train_loss": -26.6536808013916, "global_step": 515272, "epoch": 6208} {"train_loss": -25.72421646118164, "global_step": 515273, "epoch": 6208} {"train_loss": -26.90718650817871, "global_step": 515274, "epoch": 6208} {"train_loss": -26.264774322509766, "global_step": 515275, "epoch": 6208} {"train_loss": -26.775390625, "global_step": 515276, "epoch": 6208} {"train_loss": -26.264429092407227, "global_step": 515277, "epoch": 6208} {"train_loss": -27.279647827148438, "global_step": 515278, "epoch": 6208} {"train_loss": -26.845727920532227, "global_step": 515279, "epoch": 6208} {"train_loss": -26.817676544189453, "global_step": 515280, "epoch": 6208} {"train_loss": -26.692712783813477, "global_step": 515281, "epoch": 6208} {"train_loss": -26.821365356445312, "global_step": 515282, "epoch": 6208} {"train_loss": -26.74445152282715, "global_step": 515283, "epoch": 6208} {"train_loss": -27.2327823638916, "global_step": 515284, "epoch": 6208} {"train_loss": -27.01559829711914, "global_step": 515285, "epoch": 6208} {"train_loss": -26.86713218688965, "global_step": 515286, "epoch": 6208} {"train_loss": -27.01456069946289, "global_step": 515287, "epoch": 6208} {"train_loss": -27.21245765686035, "global_step": 515288, "epoch": 6208} {"train_loss": -27.139307022094727, "global_step": 515289, "epoch": 6208} {"train_loss": -27.06208610534668, "global_step": 515290, "epoch": 6208} {"train_loss": -27.697317123413086, "global_step": 515291, "epoch": 6208} {"train_loss": -27.17744255065918, "global_step": 515292, "epoch": 6208} {"train_loss": -27.246984481811523, "global_step": 515293, "epoch": 6208} {"train_loss": -27.22735595703125, "global_step": 515294, "epoch": 6208} {"train_loss": -27.44647789001465, "global_step": 515295, "epoch": 6208} {"train_loss": -26.98554039001465, "global_step": 515296, "epoch": 6208} {"train_loss": -27.316267013549805, "global_step": 515297, "epoch": 6208} {"train_loss": -26.972091674804688, "global_step": 515298, "epoch": 6208} {"train_loss": -27.455907821655273, "global_step": 515299, "epoch": 6208} {"train_loss": -27.39887046813965, "global_step": 515300, "epoch": 6208} {"train_loss": -27.456457138061523, "global_step": 515301, "epoch": 6208} {"train_loss": -27.505695343017578, "global_step": 515302, "epoch": 6208} {"train_loss": -27.315326690673828, "global_step": 515303, "epoch": 6208} {"train_loss": -27.385786056518555, "global_step": 515304, "epoch": 6208} {"train_loss": -27.62137794494629, "global_step": 515305, "epoch": 6208} {"train_loss": -27.709552764892578, "global_step": 515306, "epoch": 6208} {"train_loss": -27.170141220092773, "global_step": 515307, "epoch": 6208} {"train_loss": -28.032978057861328, "global_step": 515308, "epoch": 6208} {"train_loss": -27.179880142211914, "global_step": 515309, "epoch": 6208} {"train_loss": -27.495380401611328, "global_step": 515310, "epoch": 6208} {"train_loss": -27.737470626831055, "global_step": 515311, "epoch": 6208} {"train_loss": -27.606107711791992, "global_step": 515312, "epoch": 6208} {"train_loss": -27.56974220275879, "global_step": 515313, "epoch": 6208} {"train_loss": -27.658544540405273, "global_step": 515314, "epoch": 6208} {"train_loss": -27.24753189086914, "global_step": 515315, "epoch": 6208} {"train_loss": -27.779951095581055, "global_step": 515316, "epoch": 6208} {"train_loss": -27.40040397644043, "global_step": 515317, "epoch": 6208} {"train_loss": -27.9352970123291, "global_step": 515318, "epoch": 6208} {"train_loss": -27.28004264831543, "global_step": 515319, "epoch": 6208} {"train_loss": -27.885074615478516, "global_step": 515320, "epoch": 6208} {"train_loss": -27.576370239257812, "global_step": 515321, "epoch": 6208} {"train_loss": -27.947317123413086, "global_step": 515322, "epoch": 6208} {"train_loss": -27.43613052368164, "global_step": 515323, "epoch": 6208} {"train_loss": -27.793792724609375, "global_step": 515324, "epoch": 6208} {"train_loss": -27.72883415222168, "global_step": 515325, "epoch": 6208} {"train_loss": -27.939258575439453, "global_step": 515326, "epoch": 6208} {"train_loss": -27.720722198486328, "global_step": 515327, "epoch": 6208} {"train_loss": -28.142602920532227, "global_step": 515328, "epoch": 6208} {"train_loss": -27.651819229125977, "global_step": 515329, "epoch": 6208} {"train_loss": -27.64796257019043, "global_step": 515330, "epoch": 6208} {"train_loss": -28.003406524658203, "global_step": 515331, "epoch": 6208} {"train_loss": -27.5711669921875, "global_step": 515332, "epoch": 6208} {"train_loss": -27.44287109375, "global_step": 515333, "epoch": 6208} {"train_loss": -27.724393844604492, "global_step": 515334, "epoch": 6208} {"train_loss": -26.9665584564209, "global_step": 515335, "epoch": 6208} {"train_loss": -27.429433822631836, "global_step": 515336, "epoch": 6208} {"train_loss": -27.274398803710938, "global_step": 515337, "epoch": 6208} {"train_loss": -26.340539932250977, "global_step": 515338, "epoch": 6208} {"train_loss": -26.529016494750977, "global_step": 515339, "epoch": 6208} {"train_loss": -26.591278076171875, "global_step": 515340, "epoch": 6208} {"train_loss": -26.815954208374023, "global_step": 515341, "epoch": 6208} {"train_loss": -27.630615234375, "global_step": 515342, "epoch": 6208} {"train_loss": -27.04749870300293, "global_step": 515343, "epoch": 6208} {"train_loss": -27.514862060546875, "global_step": 515344, "epoch": 6208} {"train_loss": -27.070907592773438, "global_step": 515345, "epoch": 6208} {"train_loss": -27.105593141303004, "global_step": 515346, "epoch": 6208, "val_loss": 6539246.0} {"train_loss": -25.972095489501953, "global_step": 515347, "epoch": 6209} {"train_loss": -26.05169105529785, "global_step": 515348, "epoch": 6209} {"train_loss": -26.27370262145996, "global_step": 515349, "epoch": 6209} {"train_loss": -26.4879150390625, "global_step": 515350, "epoch": 6209} {"train_loss": -26.2606201171875, "global_step": 515351, "epoch": 6209} {"train_loss": -26.774433135986328, "global_step": 515352, "epoch": 6209} {"train_loss": -25.992414474487305, "global_step": 515353, "epoch": 6209} {"train_loss": -27.05719566345215, "global_step": 515354, "epoch": 6209} {"train_loss": -26.604406356811523, "global_step": 515355, "epoch": 6209} {"train_loss": -26.480560302734375, "global_step": 515356, "epoch": 6209} {"train_loss": -26.972064971923828, "global_step": 515357, "epoch": 6209} {"train_loss": -26.936237335205078, "global_step": 515358, "epoch": 6209} {"train_loss": -26.7476806640625, "global_step": 515359, "epoch": 6209} {"train_loss": -26.962406158447266, "global_step": 515360, "epoch": 6209} {"train_loss": -27.0308780670166, "global_step": 515361, "epoch": 6209} {"train_loss": -26.988698959350586, "global_step": 515362, "epoch": 6209} {"train_loss": -26.89410972595215, "global_step": 515363, "epoch": 6209} {"train_loss": -26.85409927368164, "global_step": 515364, "epoch": 6209} {"train_loss": -27.45936393737793, "global_step": 515365, "epoch": 6209} {"train_loss": -27.050397872924805, "global_step": 515366, "epoch": 6209} {"train_loss": -26.810638427734375, "global_step": 515367, "epoch": 6209} {"train_loss": -27.24396324157715, "global_step": 515368, "epoch": 6209} {"train_loss": -27.437286376953125, "global_step": 515369, "epoch": 6209} {"train_loss": -27.145313262939453, "global_step": 515370, "epoch": 6209} {"train_loss": -27.402982711791992, "global_step": 515371, "epoch": 6209} {"train_loss": -27.83123207092285, "global_step": 515372, "epoch": 6209} {"train_loss": -27.12933349609375, "global_step": 515373, "epoch": 6209} {"train_loss": -27.8111515045166, "global_step": 515374, "epoch": 6209} {"train_loss": -27.254785537719727, "global_step": 515375, "epoch": 6209} {"train_loss": -27.638641357421875, "global_step": 515376, "epoch": 6209} {"train_loss": -27.747671127319336, "global_step": 515377, "epoch": 6209} {"train_loss": -27.7551212310791, "global_step": 515378, "epoch": 6209} {"train_loss": -27.942411422729492, "global_step": 515379, "epoch": 6209} {"train_loss": -27.24041748046875, "global_step": 515380, "epoch": 6209} {"train_loss": -27.54962158203125, "global_step": 515381, "epoch": 6209} {"train_loss": -27.411710739135742, "global_step": 515382, "epoch": 6209} {"train_loss": -27.79318618774414, "global_step": 515383, "epoch": 6209} {"train_loss": -27.765058517456055, "global_step": 515384, "epoch": 6209} {"train_loss": -27.468000411987305, "global_step": 515385, "epoch": 6209} {"train_loss": -27.44940185546875, "global_step": 515386, "epoch": 6209} {"train_loss": -27.409061431884766, "global_step": 515387, "epoch": 6209} {"train_loss": -27.706579208374023, "global_step": 515388, "epoch": 6209} {"train_loss": -27.6937313079834, "global_step": 515389, "epoch": 6209} {"train_loss": -27.67457389831543, "global_step": 515390, "epoch": 6209} {"train_loss": -27.61432456970215, "global_step": 515391, "epoch": 6209} {"train_loss": -27.79483413696289, "global_step": 515392, "epoch": 6209} {"train_loss": -27.868743896484375, "global_step": 515393, "epoch": 6209} {"train_loss": -27.97083854675293, "global_step": 515394, "epoch": 6209} {"train_loss": -27.800878524780273, "global_step": 515395, "epoch": 6209} {"train_loss": -27.655282974243164, "global_step": 515396, "epoch": 6209} {"train_loss": -27.7730655670166, "global_step": 515397, "epoch": 6209} {"train_loss": -27.600133895874023, "global_step": 515398, "epoch": 6209} {"train_loss": -27.671894073486328, "global_step": 515399, "epoch": 6209} {"train_loss": -27.52874183654785, "global_step": 515400, "epoch": 6209} {"train_loss": -27.71626091003418, "global_step": 515401, "epoch": 6209} {"train_loss": -28.03021812438965, "global_step": 515402, "epoch": 6209} {"train_loss": -27.889469146728516, "global_step": 515403, "epoch": 6209} {"train_loss": -27.835617065429688, "global_step": 515404, "epoch": 6209} {"train_loss": -27.528125762939453, "global_step": 515405, "epoch": 6209} {"train_loss": -27.56757926940918, "global_step": 515406, "epoch": 6209} {"train_loss": -27.73638916015625, "global_step": 515407, "epoch": 6209} {"train_loss": -27.726226806640625, "global_step": 515408, "epoch": 6209} {"train_loss": -27.3637638092041, "global_step": 515409, "epoch": 6209} {"train_loss": -27.281635284423828, "global_step": 515410, "epoch": 6209} {"train_loss": -26.42108726501465, "global_step": 515411, "epoch": 6209} {"train_loss": -26.87444496154785, "global_step": 515412, "epoch": 6209} {"train_loss": -27.3365535736084, "global_step": 515413, "epoch": 6209} {"train_loss": -27.01798439025879, "global_step": 515414, "epoch": 6209} {"train_loss": -27.19559669494629, "global_step": 515415, "epoch": 6209} {"train_loss": -26.947357177734375, "global_step": 515416, "epoch": 6209} {"train_loss": -27.331958770751953, "global_step": 515417, "epoch": 6209} {"train_loss": -27.749713897705078, "global_step": 515418, "epoch": 6209} {"train_loss": -27.65142250061035, "global_step": 515419, "epoch": 6209} {"train_loss": -27.078245162963867, "global_step": 515420, "epoch": 6209} {"train_loss": -27.54387855529785, "global_step": 515421, "epoch": 6209} {"train_loss": -27.35699462890625, "global_step": 515422, "epoch": 6209} {"train_loss": -27.3227481842041, "global_step": 515423, "epoch": 6209} {"train_loss": -26.959705352783203, "global_step": 515424, "epoch": 6209} {"train_loss": -27.577009201049805, "global_step": 515425, "epoch": 6209} {"train_loss": -27.184179306030273, "global_step": 515426, "epoch": 6209} {"train_loss": -27.256567001342773, "global_step": 515427, "epoch": 6209} {"train_loss": -27.737451553344727, "global_step": 515428, "epoch": 6209} {"train_loss": -27.294921553278545, "global_step": 515429, "epoch": 6209, "val_loss": 6612378.0} {"train_loss": -25.80100440979004, "global_step": 515430, "epoch": 6210} {"train_loss": -26.13911247253418, "global_step": 515431, "epoch": 6210} {"train_loss": -26.0196475982666, "global_step": 515432, "epoch": 6210} {"train_loss": -26.415424346923828, "global_step": 515433, "epoch": 6210} {"train_loss": -26.588245391845703, "global_step": 515434, "epoch": 6210} {"train_loss": -26.245908737182617, "global_step": 515435, "epoch": 6210} {"train_loss": -26.762741088867188, "global_step": 515436, "epoch": 6210} {"train_loss": -26.56336784362793, "global_step": 515437, "epoch": 6210} {"train_loss": -27.026172637939453, "global_step": 515438, "epoch": 6210} {"train_loss": -26.819555282592773, "global_step": 515439, "epoch": 6210} {"train_loss": -26.76431655883789, "global_step": 515440, "epoch": 6210} {"train_loss": -26.479230880737305, "global_step": 515441, "epoch": 6210} {"train_loss": -26.611408233642578, "global_step": 515442, "epoch": 6210} {"train_loss": -26.9793701171875, "global_step": 515443, "epoch": 6210} {"train_loss": -26.575891494750977, "global_step": 515444, "epoch": 6210} {"train_loss": -26.909992218017578, "global_step": 515445, "epoch": 6210} {"train_loss": -26.73878288269043, "global_step": 515446, "epoch": 6210} {"train_loss": -26.76211929321289, "global_step": 515447, "epoch": 6210} {"train_loss": -26.9960994720459, "global_step": 515448, "epoch": 6210} {"train_loss": -26.823942184448242, "global_step": 515449, "epoch": 6210} {"train_loss": -26.818227767944336, "global_step": 515450, "epoch": 6210} {"train_loss": -27.30426597595215, "global_step": 515451, "epoch": 6210} {"train_loss": -27.092700958251953, "global_step": 515452, "epoch": 6210} {"train_loss": -27.3138484954834, "global_step": 515453, "epoch": 6210} {"train_loss": -27.26405143737793, "global_step": 515454, "epoch": 6210} {"train_loss": -27.074420928955078, "global_step": 515455, "epoch": 6210} {"train_loss": -27.316390991210938, "global_step": 515456, "epoch": 6210} {"train_loss": -27.064855575561523, "global_step": 515457, "epoch": 6210} {"train_loss": -27.588605880737305, "global_step": 515458, "epoch": 6210} {"train_loss": -27.327136993408203, "global_step": 515459, "epoch": 6210} {"train_loss": -27.34608268737793, "global_step": 515460, "epoch": 6210} {"train_loss": -27.420032501220703, "global_step": 515461, "epoch": 6210} {"train_loss": -27.302738189697266, "global_step": 515462, "epoch": 6210} {"train_loss": -27.461196899414062, "global_step": 515463, "epoch": 6210} {"train_loss": -27.519189834594727, "global_step": 515464, "epoch": 6210} {"train_loss": -27.41973304748535, "global_step": 515465, "epoch": 6210} {"train_loss": -27.6520938873291, "global_step": 515466, "epoch": 6210} {"train_loss": -27.9920711517334, "global_step": 515467, "epoch": 6210} {"train_loss": -27.244873046875, "global_step": 515468, "epoch": 6210} {"train_loss": -27.525312423706055, "global_step": 515469, "epoch": 6210} {"train_loss": -27.38726806640625, "global_step": 515470, "epoch": 6210} {"train_loss": -27.469867706298828, "global_step": 515471, "epoch": 6210} {"train_loss": -27.581287384033203, "global_step": 515472, "epoch": 6210} {"train_loss": -27.45232582092285, "global_step": 515473, "epoch": 6210} {"train_loss": -27.536041259765625, "global_step": 515474, "epoch": 6210} {"train_loss": -27.7014217376709, "global_step": 515475, "epoch": 6210} {"train_loss": -27.763715744018555, "global_step": 515476, "epoch": 6210} {"train_loss": -27.7409725189209, "global_step": 515477, "epoch": 6210} {"train_loss": -27.783435821533203, "global_step": 515478, "epoch": 6210} {"train_loss": -27.891590118408203, "global_step": 515479, "epoch": 6210} {"train_loss": -28.0445613861084, "global_step": 515480, "epoch": 6210} {"train_loss": -27.530908584594727, "global_step": 515481, "epoch": 6210} {"train_loss": -27.75129508972168, "global_step": 515482, "epoch": 6210} {"train_loss": -27.3890438079834, "global_step": 515483, "epoch": 6210} {"train_loss": -27.648679733276367, "global_step": 515484, "epoch": 6210} {"train_loss": -27.18256950378418, "global_step": 515485, "epoch": 6210} {"train_loss": -27.51045799255371, "global_step": 515486, "epoch": 6210} {"train_loss": -27.46698570251465, "global_step": 515487, "epoch": 6210} {"train_loss": -27.759016036987305, "global_step": 515488, "epoch": 6210} {"train_loss": -27.55974769592285, "global_step": 515489, "epoch": 6210} {"train_loss": -27.48089599609375, "global_step": 515490, "epoch": 6210} {"train_loss": -27.698583602905273, "global_step": 515491, "epoch": 6210} {"train_loss": -27.661108016967773, "global_step": 515492, "epoch": 6210} {"train_loss": -27.73072624206543, "global_step": 515493, "epoch": 6210} {"train_loss": -27.717771530151367, "global_step": 515494, "epoch": 6210} {"train_loss": -27.32510757446289, "global_step": 515495, "epoch": 6210} {"train_loss": -27.879159927368164, "global_step": 515496, "epoch": 6210} {"train_loss": -27.406208038330078, "global_step": 515497, "epoch": 6210} {"train_loss": -27.483932495117188, "global_step": 515498, "epoch": 6210} {"train_loss": -27.0390682220459, "global_step": 515499, "epoch": 6210} {"train_loss": -27.409473419189453, "global_step": 515500, "epoch": 6210} {"train_loss": -27.453805923461914, "global_step": 515501, "epoch": 6210} {"train_loss": -27.576154708862305, "global_step": 515502, "epoch": 6210} {"train_loss": -27.34457778930664, "global_step": 515503, "epoch": 6210} {"train_loss": -27.3638916015625, "global_step": 515504, "epoch": 6210} {"train_loss": -27.257633209228516, "global_step": 515505, "epoch": 6210} {"train_loss": -27.336084365844727, "global_step": 515506, "epoch": 6210} {"train_loss": -27.306869506835938, "global_step": 515507, "epoch": 6210} {"train_loss": -27.6030216217041, "global_step": 515508, "epoch": 6210} {"train_loss": -27.205169677734375, "global_step": 515509, "epoch": 6210} {"train_loss": -27.53619384765625, "global_step": 515510, "epoch": 6210} {"train_loss": -27.430770874023438, "global_step": 515511, "epoch": 6210} {"train_loss": -27.265070559030555, "global_step": 515512, "epoch": 6210, "val_loss": 6532367.0} {"train_loss": -26.9708194732666, "global_step": 515513, "epoch": 6211} {"train_loss": -26.482898712158203, "global_step": 515514, "epoch": 6211} {"train_loss": -26.8282413482666, "global_step": 515515, "epoch": 6211} {"train_loss": -27.100605010986328, "global_step": 515516, "epoch": 6211} {"train_loss": -26.13656997680664, "global_step": 515517, "epoch": 6211} {"train_loss": -26.27166175842285, "global_step": 515518, "epoch": 6211} {"train_loss": -26.469058990478516, "global_step": 515519, "epoch": 6211} {"train_loss": -27.474994659423828, "global_step": 515520, "epoch": 6211} {"train_loss": -26.492298126220703, "global_step": 515521, "epoch": 6211} {"train_loss": -27.066314697265625, "global_step": 515522, "epoch": 6211} {"train_loss": -26.670246124267578, "global_step": 515523, "epoch": 6211} {"train_loss": -27.14652442932129, "global_step": 515524, "epoch": 6211} {"train_loss": -26.958093643188477, "global_step": 515525, "epoch": 6211} {"train_loss": -26.859619140625, "global_step": 515526, "epoch": 6211} {"train_loss": -27.259674072265625, "global_step": 515527, "epoch": 6211} {"train_loss": -27.154584884643555, "global_step": 515528, "epoch": 6211} {"train_loss": -27.009525299072266, "global_step": 515529, "epoch": 6211} {"train_loss": -27.298444747924805, "global_step": 515530, "epoch": 6211} {"train_loss": -27.0388240814209, "global_step": 515531, "epoch": 6211} {"train_loss": -27.213727951049805, "global_step": 515532, "epoch": 6211} {"train_loss": -27.143014907836914, "global_step": 515533, "epoch": 6211} {"train_loss": -27.544652938842773, "global_step": 515534, "epoch": 6211} {"train_loss": -27.002309799194336, "global_step": 515535, "epoch": 6211} {"train_loss": -27.144723892211914, "global_step": 515536, "epoch": 6211} {"train_loss": -27.137983322143555, "global_step": 515537, "epoch": 6211} {"train_loss": -27.53719139099121, "global_step": 515538, "epoch": 6211} {"train_loss": -27.465280532836914, "global_step": 515539, "epoch": 6211} {"train_loss": -27.731618881225586, "global_step": 515540, "epoch": 6211} {"train_loss": -27.428253173828125, "global_step": 515541, "epoch": 6211} {"train_loss": -27.713891983032227, "global_step": 515542, "epoch": 6211} {"train_loss": -27.58223533630371, "global_step": 515543, "epoch": 6211} {"train_loss": -27.357885360717773, "global_step": 515544, "epoch": 6211} {"train_loss": -27.693771362304688, "global_step": 515545, "epoch": 6211} {"train_loss": -27.550296783447266, "global_step": 515546, "epoch": 6211} {"train_loss": -27.25819969177246, "global_step": 515547, "epoch": 6211} {"train_loss": -27.3651065826416, "global_step": 515548, "epoch": 6211} {"train_loss": -27.2408390045166, "global_step": 515549, "epoch": 6211} {"train_loss": -27.44684410095215, "global_step": 515550, "epoch": 6211} {"train_loss": -27.7441463470459, "global_step": 515551, "epoch": 6211} {"train_loss": -27.42238426208496, "global_step": 515552, "epoch": 6211} {"train_loss": -27.523889541625977, "global_step": 515553, "epoch": 6211} {"train_loss": -27.871322631835938, "global_step": 515554, "epoch": 6211} {"train_loss": -27.328527450561523, "global_step": 515555, "epoch": 6211} {"train_loss": -26.975011825561523, "global_step": 515556, "epoch": 6211} {"train_loss": -26.658048629760742, "global_step": 515557, "epoch": 6211} {"train_loss": -26.749496459960938, "global_step": 515558, "epoch": 6211} {"train_loss": -27.463642120361328, "global_step": 515559, "epoch": 6211} {"train_loss": -27.4692440032959, "global_step": 515560, "epoch": 6211} {"train_loss": -27.121658325195312, "global_step": 515561, "epoch": 6211} {"train_loss": -27.74879264831543, "global_step": 515562, "epoch": 6211} {"train_loss": -27.800329208374023, "global_step": 515563, "epoch": 6211} {"train_loss": -27.150808334350586, "global_step": 515564, "epoch": 6211} {"train_loss": -27.406848907470703, "global_step": 515565, "epoch": 6211} {"train_loss": -27.5059757232666, "global_step": 515566, "epoch": 6211} {"train_loss": -27.739826202392578, "global_step": 515567, "epoch": 6211} {"train_loss": -27.63238525390625, "global_step": 515568, "epoch": 6211} {"train_loss": -27.50711441040039, "global_step": 515569, "epoch": 6211} {"train_loss": -27.576786041259766, "global_step": 515570, "epoch": 6211} {"train_loss": -27.212499618530273, "global_step": 515571, "epoch": 6211} {"train_loss": -27.778562545776367, "global_step": 515572, "epoch": 6211} {"train_loss": -27.475086212158203, "global_step": 515573, "epoch": 6211} {"train_loss": -27.51003074645996, "global_step": 515574, "epoch": 6211} {"train_loss": -27.249622344970703, "global_step": 515575, "epoch": 6211} {"train_loss": -27.035802841186523, "global_step": 515576, "epoch": 6211} {"train_loss": -27.65944480895996, "global_step": 515577, "epoch": 6211} {"train_loss": -27.659936904907227, "global_step": 515578, "epoch": 6211} {"train_loss": -27.573352813720703, "global_step": 515579, "epoch": 6211} {"train_loss": -27.44883155822754, "global_step": 515580, "epoch": 6211} {"train_loss": -27.620193481445312, "global_step": 515581, "epoch": 6211} {"train_loss": -27.837890625, "global_step": 515582, "epoch": 6211} {"train_loss": -27.288259506225586, "global_step": 515583, "epoch": 6211} {"train_loss": -27.4739933013916, "global_step": 515584, "epoch": 6211} {"train_loss": -27.40008544921875, "global_step": 515585, "epoch": 6211} {"train_loss": -27.694965362548828, "global_step": 515586, "epoch": 6211} {"train_loss": -27.389556884765625, "global_step": 515587, "epoch": 6211} {"train_loss": -27.508636474609375, "global_step": 515588, "epoch": 6211} {"train_loss": -27.658340454101562, "global_step": 515589, "epoch": 6211} {"train_loss": -27.92896842956543, "global_step": 515590, "epoch": 6211} {"train_loss": -28.232666015625, "global_step": 515591, "epoch": 6211} {"train_loss": -27.548673629760742, "global_step": 515592, "epoch": 6211} {"train_loss": -27.490915298461914, "global_step": 515593, "epoch": 6211} {"train_loss": -27.352041244506836, "global_step": 515594, "epoch": 6211} {"train_loss": -27.321683217243976, "global_step": 515595, "epoch": 6211, "val_loss": 6521065.0} {"train_loss": -26.79986000061035, "global_step": 515596, "epoch": 6212} {"train_loss": -26.62689781188965, "global_step": 515597, "epoch": 6212} {"train_loss": -27.011022567749023, "global_step": 515598, "epoch": 6212} {"train_loss": -26.591894149780273, "global_step": 515599, "epoch": 6212} {"train_loss": -27.237274169921875, "global_step": 515600, "epoch": 6212} {"train_loss": -27.11697769165039, "global_step": 515601, "epoch": 6212} {"train_loss": -27.40345573425293, "global_step": 515602, "epoch": 6212} {"train_loss": -26.702558517456055, "global_step": 515603, "epoch": 6212} {"train_loss": -26.927534103393555, "global_step": 515604, "epoch": 6212} {"train_loss": -27.320852279663086, "global_step": 515605, "epoch": 6212} {"train_loss": -27.129053115844727, "global_step": 515606, "epoch": 6212} {"train_loss": -27.14798355102539, "global_step": 515607, "epoch": 6212} {"train_loss": -26.97919273376465, "global_step": 515608, "epoch": 6212} {"train_loss": -26.89459800720215, "global_step": 515609, "epoch": 6212} {"train_loss": -27.092437744140625, "global_step": 515610, "epoch": 6212} {"train_loss": -27.23685646057129, "global_step": 515611, "epoch": 6212} {"train_loss": -27.14449119567871, "global_step": 515612, "epoch": 6212} {"train_loss": -26.830175399780273, "global_step": 515613, "epoch": 6212} {"train_loss": -27.188053131103516, "global_step": 515614, "epoch": 6212} {"train_loss": -27.38286781311035, "global_step": 515615, "epoch": 6212} {"train_loss": -27.272069931030273, "global_step": 515616, "epoch": 6212} {"train_loss": -27.21455192565918, "global_step": 515617, "epoch": 6212} {"train_loss": -27.214096069335938, "global_step": 515618, "epoch": 6212} {"train_loss": -27.3475399017334, "global_step": 515619, "epoch": 6212} {"train_loss": -27.098012924194336, "global_step": 515620, "epoch": 6212} {"train_loss": -27.47748374938965, "global_step": 515621, "epoch": 6212} {"train_loss": -27.555341720581055, "global_step": 515622, "epoch": 6212} {"train_loss": -27.151655197143555, "global_step": 515623, "epoch": 6212} {"train_loss": -27.35297203063965, "global_step": 515624, "epoch": 6212} {"train_loss": -27.342914581298828, "global_step": 515625, "epoch": 6212} {"train_loss": -27.398025512695312, "global_step": 515626, "epoch": 6212} {"train_loss": -27.030750274658203, "global_step": 515627, "epoch": 6212} {"train_loss": -27.632755279541016, "global_step": 515628, "epoch": 6212} {"train_loss": -27.389326095581055, "global_step": 515629, "epoch": 6212} {"train_loss": -27.381628036499023, "global_step": 515630, "epoch": 6212} {"train_loss": -27.139301300048828, "global_step": 515631, "epoch": 6212} {"train_loss": -27.45965003967285, "global_step": 515632, "epoch": 6212} {"train_loss": -27.307477951049805, "global_step": 515633, "epoch": 6212} {"train_loss": -27.746809005737305, "global_step": 515634, "epoch": 6212} {"train_loss": -27.464887619018555, "global_step": 515635, "epoch": 6212} {"train_loss": -27.677953720092773, "global_step": 515636, "epoch": 6212} {"train_loss": -27.512250900268555, "global_step": 515637, "epoch": 6212} {"train_loss": -27.653366088867188, "global_step": 515638, "epoch": 6212} {"train_loss": -27.56766700744629, "global_step": 515639, "epoch": 6212} {"train_loss": -27.41705322265625, "global_step": 515640, "epoch": 6212} {"train_loss": -27.781787872314453, "global_step": 515641, "epoch": 6212} {"train_loss": -27.31081199645996, "global_step": 515642, "epoch": 6212} {"train_loss": -27.66729164123535, "global_step": 515643, "epoch": 6212} {"train_loss": -27.768835067749023, "global_step": 515644, "epoch": 6212} {"train_loss": -27.782379150390625, "global_step": 515645, "epoch": 6212} {"train_loss": -27.70576286315918, "global_step": 515646, "epoch": 6212} {"train_loss": -27.54458999633789, "global_step": 515647, "epoch": 6212} {"train_loss": -27.657567977905273, "global_step": 515648, "epoch": 6212} {"train_loss": -27.553747177124023, "global_step": 515649, "epoch": 6212} {"train_loss": -27.424779891967773, "global_step": 515650, "epoch": 6212} {"train_loss": -27.524179458618164, "global_step": 515651, "epoch": 6212} {"train_loss": -27.630908966064453, "global_step": 515652, "epoch": 6212} {"train_loss": -27.560291290283203, "global_step": 515653, "epoch": 6212} {"train_loss": -27.524337768554688, "global_step": 515654, "epoch": 6212} {"train_loss": -28.1861515045166, "global_step": 515655, "epoch": 6212} {"train_loss": -27.595006942749023, "global_step": 515656, "epoch": 6212} {"train_loss": -27.7951717376709, "global_step": 515657, "epoch": 6212} {"train_loss": -27.528165817260742, "global_step": 515658, "epoch": 6212} {"train_loss": -27.78132438659668, "global_step": 515659, "epoch": 6212} {"train_loss": -27.8410701751709, "global_step": 515660, "epoch": 6212} {"train_loss": -28.04169273376465, "global_step": 515661, "epoch": 6212} {"train_loss": -28.058658599853516, "global_step": 515662, "epoch": 6212} {"train_loss": -27.29166030883789, "global_step": 515663, "epoch": 6212} {"train_loss": -27.350452423095703, "global_step": 515664, "epoch": 6212} {"train_loss": -27.59689712524414, "global_step": 515665, "epoch": 6212} {"train_loss": -27.884769439697266, "global_step": 515666, "epoch": 6212} {"train_loss": -28.020099639892578, "global_step": 515667, "epoch": 6212} {"train_loss": -27.711566925048828, "global_step": 515668, "epoch": 6212} {"train_loss": -27.928186416625977, "global_step": 515669, "epoch": 6212} {"train_loss": -27.506437301635742, "global_step": 515670, "epoch": 6212} {"train_loss": -27.686914443969727, "global_step": 515671, "epoch": 6212} {"train_loss": -27.374792098999023, "global_step": 515672, "epoch": 6212} {"train_loss": -27.385578155517578, "global_step": 515673, "epoch": 6212} {"train_loss": -27.944665908813477, "global_step": 515674, "epoch": 6212} {"train_loss": -27.672651290893555, "global_step": 515675, "epoch": 6212} {"train_loss": -27.28098487854004, "global_step": 515676, "epoch": 6212} {"train_loss": -27.705224990844727, "global_step": 515677, "epoch": 6212} {"train_loss": -27.42355167434876, "global_step": 515678, "epoch": 6212, "val_loss": 6544564.5} {"train_loss": -27.0030517578125, "global_step": 515679, "epoch": 6213} {"train_loss": -26.341466903686523, "global_step": 515680, "epoch": 6213} {"train_loss": -27.24091911315918, "global_step": 515681, "epoch": 6213} {"train_loss": -27.430662155151367, "global_step": 515682, "epoch": 6213} {"train_loss": -27.007558822631836, "global_step": 515683, "epoch": 6213} {"train_loss": -26.653213500976562, "global_step": 515684, "epoch": 6213} {"train_loss": -26.528079986572266, "global_step": 515685, "epoch": 6213} {"train_loss": -26.687047958374023, "global_step": 515686, "epoch": 6213} {"train_loss": -26.968748092651367, "global_step": 515687, "epoch": 6213} {"train_loss": -26.87848472595215, "global_step": 515688, "epoch": 6213} {"train_loss": -26.6381893157959, "global_step": 515689, "epoch": 6213} {"train_loss": -26.908063888549805, "global_step": 515690, "epoch": 6213} {"train_loss": -27.40937614440918, "global_step": 515691, "epoch": 6213} {"train_loss": -26.71919822692871, "global_step": 515692, "epoch": 6213} {"train_loss": -27.325841903686523, "global_step": 515693, "epoch": 6213} {"train_loss": -27.089807510375977, "global_step": 515694, "epoch": 6213} {"train_loss": -27.175201416015625, "global_step": 515695, "epoch": 6213} {"train_loss": -27.4429874420166, "global_step": 515696, "epoch": 6213} {"train_loss": -27.3090877532959, "global_step": 515697, "epoch": 6213} {"train_loss": -27.10310935974121, "global_step": 515698, "epoch": 6213} {"train_loss": -27.310169219970703, "global_step": 515699, "epoch": 6213} {"train_loss": -27.44647789001465, "global_step": 515700, "epoch": 6213} {"train_loss": -27.295629501342773, "global_step": 515701, "epoch": 6213} {"train_loss": -27.408185958862305, "global_step": 515702, "epoch": 6213} {"train_loss": -27.73480796813965, "global_step": 515703, "epoch": 6213} {"train_loss": -27.453754425048828, "global_step": 515704, "epoch": 6213} {"train_loss": -27.591196060180664, "global_step": 515705, "epoch": 6213} {"train_loss": -27.708845138549805, "global_step": 515706, "epoch": 6213} {"train_loss": -27.27176284790039, "global_step": 515707, "epoch": 6213} {"train_loss": -27.515277862548828, "global_step": 515708, "epoch": 6213} {"train_loss": -27.470991134643555, "global_step": 515709, "epoch": 6213} {"train_loss": -27.095855712890625, "global_step": 515710, "epoch": 6213} {"train_loss": -27.583349227905273, "global_step": 515711, "epoch": 6213} {"train_loss": -27.10637855529785, "global_step": 515712, "epoch": 6213} {"train_loss": -27.865812301635742, "global_step": 515713, "epoch": 6213} {"train_loss": -27.6215877532959, "global_step": 515714, "epoch": 6213} {"train_loss": -27.551382064819336, "global_step": 515715, "epoch": 6213} {"train_loss": -27.098295211791992, "global_step": 515716, "epoch": 6213} {"train_loss": -27.2076416015625, "global_step": 515717, "epoch": 6213} {"train_loss": -27.45608901977539, "global_step": 515718, "epoch": 6213} {"train_loss": -27.49126625061035, "global_step": 515719, "epoch": 6213} {"train_loss": -27.5308780670166, "global_step": 515720, "epoch": 6213} {"train_loss": -27.404184341430664, "global_step": 515721, "epoch": 6213} {"train_loss": -27.5556697845459, "global_step": 515722, "epoch": 6213} {"train_loss": -27.83234977722168, "global_step": 515723, "epoch": 6213} {"train_loss": -27.655481338500977, "global_step": 515724, "epoch": 6213} {"train_loss": -27.7427978515625, "global_step": 515725, "epoch": 6213} {"train_loss": -27.421772003173828, "global_step": 515726, "epoch": 6213} {"train_loss": -27.405729293823242, "global_step": 515727, "epoch": 6213} {"train_loss": -27.55768394470215, "global_step": 515728, "epoch": 6213} {"train_loss": -27.895751953125, "global_step": 515729, "epoch": 6213} {"train_loss": -27.625537872314453, "global_step": 515730, "epoch": 6213} {"train_loss": -27.90353775024414, "global_step": 515731, "epoch": 6213} {"train_loss": -27.552032470703125, "global_step": 515732, "epoch": 6213} {"train_loss": -27.69923210144043, "global_step": 515733, "epoch": 6213} {"train_loss": -27.37409782409668, "global_step": 515734, "epoch": 6213} {"train_loss": -27.008527755737305, "global_step": 515735, "epoch": 6213} {"train_loss": -27.602102279663086, "global_step": 515736, "epoch": 6213} {"train_loss": -27.637022018432617, "global_step": 515737, "epoch": 6213} {"train_loss": -27.86687660217285, "global_step": 515738, "epoch": 6213} {"train_loss": -27.838031768798828, "global_step": 515739, "epoch": 6213} {"train_loss": -27.61737632751465, "global_step": 515740, "epoch": 6213} {"train_loss": -27.775714874267578, "global_step": 515741, "epoch": 6213} {"train_loss": -27.386417388916016, "global_step": 515742, "epoch": 6213} {"train_loss": -27.15288734436035, "global_step": 515743, "epoch": 6213} {"train_loss": -27.882970809936523, "global_step": 515744, "epoch": 6213} {"train_loss": -27.779260635375977, "global_step": 515745, "epoch": 6213} {"train_loss": -27.594053268432617, "global_step": 515746, "epoch": 6213} {"train_loss": -27.5949764251709, "global_step": 515747, "epoch": 6213} {"train_loss": -27.481046676635742, "global_step": 515748, "epoch": 6213} {"train_loss": -27.411930084228516, "global_step": 515749, "epoch": 6213} {"train_loss": -27.6697940826416, "global_step": 515750, "epoch": 6213} {"train_loss": -27.983112335205078, "global_step": 515751, "epoch": 6213} {"train_loss": -27.2426815032959, "global_step": 515752, "epoch": 6213} {"train_loss": -27.546072006225586, "global_step": 515753, "epoch": 6213} {"train_loss": -27.633325576782227, "global_step": 515754, "epoch": 6213} {"train_loss": -27.479684829711914, "global_step": 515755, "epoch": 6213} {"train_loss": -27.677610397338867, "global_step": 515756, "epoch": 6213} {"train_loss": -27.566308975219727, "global_step": 515757, "epoch": 6213} {"train_loss": -27.363611221313477, "global_step": 515758, "epoch": 6213} {"train_loss": -27.591175079345703, "global_step": 515759, "epoch": 6213} {"train_loss": -27.071277618408203, "global_step": 515760, "epoch": 6213} {"train_loss": -27.38259834841073, "global_step": 515761, "epoch": 6213, "val_loss": 6661375.0} {"train_loss": -26.083959579467773, "global_step": 515762, "epoch": 6214} {"train_loss": -27.00649070739746, "global_step": 515763, "epoch": 6214} {"train_loss": -26.010467529296875, "global_step": 515764, "epoch": 6214} {"train_loss": -26.245702743530273, "global_step": 515765, "epoch": 6214} {"train_loss": -26.35782814025879, "global_step": 515766, "epoch": 6214} {"train_loss": -26.652326583862305, "global_step": 515767, "epoch": 6214} {"train_loss": -27.032316207885742, "global_step": 515768, "epoch": 6214} {"train_loss": -26.64349365234375, "global_step": 515769, "epoch": 6214} {"train_loss": -26.73974609375, "global_step": 515770, "epoch": 6214} {"train_loss": -26.70599365234375, "global_step": 515771, "epoch": 6214} {"train_loss": -27.24199867248535, "global_step": 515772, "epoch": 6214} {"train_loss": -26.406360626220703, "global_step": 515773, "epoch": 6214} {"train_loss": -27.239309310913086, "global_step": 515774, "epoch": 6214} {"train_loss": -26.826629638671875, "global_step": 515775, "epoch": 6214} {"train_loss": -27.04085350036621, "global_step": 515776, "epoch": 6214} {"train_loss": -26.938764572143555, "global_step": 515777, "epoch": 6214} {"train_loss": -26.47212028503418, "global_step": 515778, "epoch": 6214} {"train_loss": -27.11036491394043, "global_step": 515779, "epoch": 6214} {"train_loss": -26.965930938720703, "global_step": 515780, "epoch": 6214} {"train_loss": -26.900177001953125, "global_step": 515781, "epoch": 6214} {"train_loss": -27.183698654174805, "global_step": 515782, "epoch": 6214} {"train_loss": -26.865264892578125, "global_step": 515783, "epoch": 6214} {"train_loss": -26.89780044555664, "global_step": 515784, "epoch": 6214} {"train_loss": -27.336027145385742, "global_step": 515785, "epoch": 6214} {"train_loss": -27.0860538482666, "global_step": 515786, "epoch": 6214} {"train_loss": -27.22027015686035, "global_step": 515787, "epoch": 6214} {"train_loss": -27.489770889282227, "global_step": 515788, "epoch": 6214} {"train_loss": -27.462814331054688, "global_step": 515789, "epoch": 6214} {"train_loss": -27.509017944335938, "global_step": 515790, "epoch": 6214} {"train_loss": -27.31340980529785, "global_step": 515791, "epoch": 6214} {"train_loss": -27.014087677001953, "global_step": 515792, "epoch": 6214} {"train_loss": -27.290802001953125, "global_step": 515793, "epoch": 6214} {"train_loss": -27.246389389038086, "global_step": 515794, "epoch": 6214} {"train_loss": -27.604162216186523, "global_step": 515795, "epoch": 6214} {"train_loss": -27.35308265686035, "global_step": 515796, "epoch": 6214} {"train_loss": -27.581562042236328, "global_step": 515797, "epoch": 6214} {"train_loss": -27.740224838256836, "global_step": 515798, "epoch": 6214} {"train_loss": -27.56902503967285, "global_step": 515799, "epoch": 6214} {"train_loss": -27.26161003112793, "global_step": 515800, "epoch": 6214} {"train_loss": -27.492467880249023, "global_step": 515801, "epoch": 6214} {"train_loss": -27.6710147857666, "global_step": 515802, "epoch": 6214} {"train_loss": -27.615894317626953, "global_step": 515803, "epoch": 6214} {"train_loss": -27.896240234375, "global_step": 515804, "epoch": 6214} {"train_loss": -27.732446670532227, "global_step": 515805, "epoch": 6214} {"train_loss": -27.77581214904785, "global_step": 515806, "epoch": 6214} {"train_loss": -27.924081802368164, "global_step": 515807, "epoch": 6214} {"train_loss": -27.527143478393555, "global_step": 515808, "epoch": 6214} {"train_loss": -27.809064865112305, "global_step": 515809, "epoch": 6214} {"train_loss": -27.69415855407715, "global_step": 515810, "epoch": 6214} {"train_loss": -27.539403915405273, "global_step": 515811, "epoch": 6214} {"train_loss": -27.336889266967773, "global_step": 515812, "epoch": 6214} {"train_loss": -27.650959014892578, "global_step": 515813, "epoch": 6214} {"train_loss": -27.394689559936523, "global_step": 515814, "epoch": 6214} {"train_loss": -27.904138565063477, "global_step": 515815, "epoch": 6214} {"train_loss": -27.76446533203125, "global_step": 515816, "epoch": 6214} {"train_loss": -27.67726707458496, "global_step": 515817, "epoch": 6214} {"train_loss": -27.490697860717773, "global_step": 515818, "epoch": 6214} {"train_loss": -27.154020309448242, "global_step": 515819, "epoch": 6214} {"train_loss": -27.25569725036621, "global_step": 515820, "epoch": 6214} {"train_loss": -27.182397842407227, "global_step": 515821, "epoch": 6214} {"train_loss": -27.351043701171875, "global_step": 515822, "epoch": 6214} {"train_loss": -27.38214683532715, "global_step": 515823, "epoch": 6214} {"train_loss": -28.050764083862305, "global_step": 515824, "epoch": 6214} {"train_loss": -27.134979248046875, "global_step": 515825, "epoch": 6214} {"train_loss": -27.591047286987305, "global_step": 515826, "epoch": 6214} {"train_loss": -27.425153732299805, "global_step": 515827, "epoch": 6214} {"train_loss": -27.362445831298828, "global_step": 515828, "epoch": 6214} {"train_loss": -27.420120239257812, "global_step": 515829, "epoch": 6214} {"train_loss": -27.600666046142578, "global_step": 515830, "epoch": 6214} {"train_loss": -27.3317928314209, "global_step": 515831, "epoch": 6214} {"train_loss": -27.706130981445312, "global_step": 515832, "epoch": 6214} {"train_loss": -27.48731803894043, "global_step": 515833, "epoch": 6214} {"train_loss": -27.239789962768555, "global_step": 515834, "epoch": 6214} {"train_loss": -27.213306427001953, "global_step": 515835, "epoch": 6214} {"train_loss": -27.76240348815918, "global_step": 515836, "epoch": 6214} {"train_loss": -27.658695220947266, "global_step": 515837, "epoch": 6214} {"train_loss": -27.751636505126953, "global_step": 515838, "epoch": 6214} {"train_loss": -27.491992950439453, "global_step": 515839, "epoch": 6214} {"train_loss": -27.695133209228516, "global_step": 515840, "epoch": 6214} {"train_loss": -27.4256591796875, "global_step": 515841, "epoch": 6214} {"train_loss": -27.946537017822266, "global_step": 515842, "epoch": 6214} {"train_loss": -27.72468376159668, "global_step": 515843, "epoch": 6214} {"train_loss": -27.309724807739258, "global_step": 515844, "epoch": 6214, "val_loss": 6528096.0} {"train_loss": -27.25079917907715, "global_step": 515845, "epoch": 6215} {"train_loss": -27.290149688720703, "global_step": 515846, "epoch": 6215} {"train_loss": -27.22870445251465, "global_step": 515847, "epoch": 6215} {"train_loss": -26.982440948486328, "global_step": 515848, "epoch": 6215} {"train_loss": -27.035327911376953, "global_step": 515849, "epoch": 6215} {"train_loss": -27.033649444580078, "global_step": 515850, "epoch": 6215} {"train_loss": -27.012598037719727, "global_step": 515851, "epoch": 6215} {"train_loss": -27.494232177734375, "global_step": 515852, "epoch": 6215} {"train_loss": -26.902820587158203, "global_step": 515853, "epoch": 6215} {"train_loss": -26.717741012573242, "global_step": 515854, "epoch": 6215} {"train_loss": -27.416112899780273, "global_step": 515855, "epoch": 6215} {"train_loss": -27.239538192749023, "global_step": 515856, "epoch": 6215} {"train_loss": -26.887481689453125, "global_step": 515857, "epoch": 6215} {"train_loss": -26.970579147338867, "global_step": 515858, "epoch": 6215} {"train_loss": -27.249618530273438, "global_step": 515859, "epoch": 6215} {"train_loss": -27.180892944335938, "global_step": 515860, "epoch": 6215} {"train_loss": -27.3342342376709, "global_step": 515861, "epoch": 6215} {"train_loss": -27.354406356811523, "global_step": 515862, "epoch": 6215} {"train_loss": -27.378992080688477, "global_step": 515863, "epoch": 6215} {"train_loss": -27.530258178710938, "global_step": 515864, "epoch": 6215} {"train_loss": -27.39957046508789, "global_step": 515865, "epoch": 6215} {"train_loss": -27.19365882873535, "global_step": 515866, "epoch": 6215} {"train_loss": -27.32370376586914, "global_step": 515867, "epoch": 6215} {"train_loss": -27.494293212890625, "global_step": 515868, "epoch": 6215} {"train_loss": -27.562280654907227, "global_step": 515869, "epoch": 6215} {"train_loss": -27.486236572265625, "global_step": 515870, "epoch": 6215} {"train_loss": -27.840234756469727, "global_step": 515871, "epoch": 6215} {"train_loss": -27.253280639648438, "global_step": 515872, "epoch": 6215} {"train_loss": -27.45485496520996, "global_step": 515873, "epoch": 6215} {"train_loss": -27.56207275390625, "global_step": 515874, "epoch": 6215} {"train_loss": -27.357715606689453, "global_step": 515875, "epoch": 6215} {"train_loss": -27.3712158203125, "global_step": 515876, "epoch": 6215} {"train_loss": -27.537084579467773, "global_step": 515877, "epoch": 6215} {"train_loss": -27.601842880249023, "global_step": 515878, "epoch": 6215} {"train_loss": -27.22478675842285, "global_step": 515879, "epoch": 6215} {"train_loss": -27.229068756103516, "global_step": 515880, "epoch": 6215} {"train_loss": -27.1434383392334, "global_step": 515881, "epoch": 6215} {"train_loss": -27.3060359954834, "global_step": 515882, "epoch": 6215} {"train_loss": -27.859933853149414, "global_step": 515883, "epoch": 6215} {"train_loss": -27.713525772094727, "global_step": 515884, "epoch": 6215} {"train_loss": -27.561059951782227, "global_step": 515885, "epoch": 6215} {"train_loss": -27.482107162475586, "global_step": 515886, "epoch": 6215} {"train_loss": -27.576322555541992, "global_step": 515887, "epoch": 6215} {"train_loss": -27.512372970581055, "global_step": 515888, "epoch": 6215} {"train_loss": -27.569448471069336, "global_step": 515889, "epoch": 6215} {"train_loss": -27.000158309936523, "global_step": 515890, "epoch": 6215} {"train_loss": -27.485671997070312, "global_step": 515891, "epoch": 6215} {"train_loss": -27.52900505065918, "global_step": 515892, "epoch": 6215} {"train_loss": -27.35578727722168, "global_step": 515893, "epoch": 6215} {"train_loss": -27.595151901245117, "global_step": 515894, "epoch": 6215} {"train_loss": -27.488874435424805, "global_step": 515895, "epoch": 6215} {"train_loss": -26.95905876159668, "global_step": 515896, "epoch": 6215} {"train_loss": -27.8563175201416, "global_step": 515897, "epoch": 6215} {"train_loss": -27.38909912109375, "global_step": 515898, "epoch": 6215} {"train_loss": -27.40852165222168, "global_step": 515899, "epoch": 6215} {"train_loss": -27.6879940032959, "global_step": 515900, "epoch": 6215} {"train_loss": -27.424774169921875, "global_step": 515901, "epoch": 6215} {"train_loss": -27.4458065032959, "global_step": 515902, "epoch": 6215} {"train_loss": -27.66074562072754, "global_step": 515903, "epoch": 6215} {"train_loss": -27.341800689697266, "global_step": 515904, "epoch": 6215} {"train_loss": -27.383228302001953, "global_step": 515905, "epoch": 6215} {"train_loss": -27.160785675048828, "global_step": 515906, "epoch": 6215} {"train_loss": -27.40464210510254, "global_step": 515907, "epoch": 6215} {"train_loss": -27.265094757080078, "global_step": 515908, "epoch": 6215} {"train_loss": -27.537343978881836, "global_step": 515909, "epoch": 6215} {"train_loss": -27.263111114501953, "global_step": 515910, "epoch": 6215} {"train_loss": -27.572187423706055, "global_step": 515911, "epoch": 6215} {"train_loss": -27.2794189453125, "global_step": 515912, "epoch": 6215} {"train_loss": -27.786895751953125, "global_step": 515913, "epoch": 6215} {"train_loss": -27.1911563873291, "global_step": 515914, "epoch": 6215} {"train_loss": -27.44569206237793, "global_step": 515915, "epoch": 6215} {"train_loss": -27.440387725830078, "global_step": 515916, "epoch": 6215} {"train_loss": -27.17506217956543, "global_step": 515917, "epoch": 6215} {"train_loss": -27.1949462890625, "global_step": 515918, "epoch": 6215} {"train_loss": -27.40390396118164, "global_step": 515919, "epoch": 6215} {"train_loss": -27.084793090820312, "global_step": 515920, "epoch": 6215} {"train_loss": -27.144201278686523, "global_step": 515921, "epoch": 6215} {"train_loss": -27.848386764526367, "global_step": 515922, "epoch": 6215} {"train_loss": -27.556188583374023, "global_step": 515923, "epoch": 6215} {"train_loss": -27.351293563842773, "global_step": 515924, "epoch": 6215} {"train_loss": -27.124052047729492, "global_step": 515925, "epoch": 6215} {"train_loss": -27.342071533203125, "global_step": 515926, "epoch": 6215} {"train_loss": -27.374329256724163, "global_step": 515927, "epoch": 6215, "val_loss": 6533379.0} {"train_loss": -26.231107711791992, "global_step": 515928, "epoch": 6216} {"train_loss": -26.406309127807617, "global_step": 515929, "epoch": 6216} {"train_loss": -26.9285945892334, "global_step": 515930, "epoch": 6216} {"train_loss": -26.290678024291992, "global_step": 515931, "epoch": 6216} {"train_loss": -26.661008834838867, "global_step": 515932, "epoch": 6216} {"train_loss": -26.611623764038086, "global_step": 515933, "epoch": 6216} {"train_loss": -26.94172477722168, "global_step": 515934, "epoch": 6216} {"train_loss": -26.63816261291504, "global_step": 515935, "epoch": 6216} {"train_loss": -26.922637939453125, "global_step": 515936, "epoch": 6216} {"train_loss": -26.931808471679688, "global_step": 515937, "epoch": 6216} {"train_loss": -26.59320068359375, "global_step": 515938, "epoch": 6216} {"train_loss": -26.888336181640625, "global_step": 515939, "epoch": 6216} {"train_loss": -26.651535034179688, "global_step": 515940, "epoch": 6216} {"train_loss": -26.934194564819336, "global_step": 515941, "epoch": 6216} {"train_loss": -26.6014347076416, "global_step": 515942, "epoch": 6216} {"train_loss": -26.92035484313965, "global_step": 515943, "epoch": 6216} {"train_loss": -26.957752227783203, "global_step": 515944, "epoch": 6216} {"train_loss": -26.839374542236328, "global_step": 515945, "epoch": 6216} {"train_loss": -27.438629150390625, "global_step": 515946, "epoch": 6216} {"train_loss": -27.026752471923828, "global_step": 515947, "epoch": 6216} {"train_loss": -27.368183135986328, "global_step": 515948, "epoch": 6216} {"train_loss": -27.01910972595215, "global_step": 515949, "epoch": 6216} {"train_loss": -26.908283233642578, "global_step": 515950, "epoch": 6216} {"train_loss": -27.240921020507812, "global_step": 515951, "epoch": 6216} {"train_loss": -27.1755428314209, "global_step": 515952, "epoch": 6216} {"train_loss": -27.25654411315918, "global_step": 515953, "epoch": 6216} {"train_loss": -27.010217666625977, "global_step": 515954, "epoch": 6216} {"train_loss": -27.656309127807617, "global_step": 515955, "epoch": 6216} {"train_loss": -27.320571899414062, "global_step": 515956, "epoch": 6216} {"train_loss": -27.232019424438477, "global_step": 515957, "epoch": 6216} {"train_loss": -27.350833892822266, "global_step": 515958, "epoch": 6216} {"train_loss": -27.1901912689209, "global_step": 515959, "epoch": 6216} {"train_loss": -27.057132720947266, "global_step": 515960, "epoch": 6216} {"train_loss": -27.2919921875, "global_step": 515961, "epoch": 6216} {"train_loss": -27.590198516845703, "global_step": 515962, "epoch": 6216} {"train_loss": -27.366392135620117, "global_step": 515963, "epoch": 6216} {"train_loss": -27.49073600769043, "global_step": 515964, "epoch": 6216} {"train_loss": -27.477066040039062, "global_step": 515965, "epoch": 6216} {"train_loss": -27.242483139038086, "global_step": 515966, "epoch": 6216} {"train_loss": -27.714019775390625, "global_step": 515967, "epoch": 6216} {"train_loss": -27.28529167175293, "global_step": 515968, "epoch": 6216} {"train_loss": -27.208532333374023, "global_step": 515969, "epoch": 6216} {"train_loss": -27.6586856842041, "global_step": 515970, "epoch": 6216} {"train_loss": -27.30043601989746, "global_step": 515971, "epoch": 6216} {"train_loss": -27.376312255859375, "global_step": 515972, "epoch": 6216} {"train_loss": -27.475757598876953, "global_step": 515973, "epoch": 6216} {"train_loss": -27.685794830322266, "global_step": 515974, "epoch": 6216} {"train_loss": -27.783462524414062, "global_step": 515975, "epoch": 6216} {"train_loss": -27.58148765563965, "global_step": 515976, "epoch": 6216} {"train_loss": -27.578882217407227, "global_step": 515977, "epoch": 6216} {"train_loss": -27.52610206604004, "global_step": 515978, "epoch": 6216} {"train_loss": -27.383161544799805, "global_step": 515979, "epoch": 6216} {"train_loss": -27.380910873413086, "global_step": 515980, "epoch": 6216} {"train_loss": -27.820449829101562, "global_step": 515981, "epoch": 6216} {"train_loss": -27.669652938842773, "global_step": 515982, "epoch": 6216} {"train_loss": -27.658191680908203, "global_step": 515983, "epoch": 6216} {"train_loss": -27.591882705688477, "global_step": 515984, "epoch": 6216} {"train_loss": -27.66437339782715, "global_step": 515985, "epoch": 6216} {"train_loss": -27.58416175842285, "global_step": 515986, "epoch": 6216} {"train_loss": -27.3283634185791, "global_step": 515987, "epoch": 6216} {"train_loss": -27.5587215423584, "global_step": 515988, "epoch": 6216} {"train_loss": -27.870880126953125, "global_step": 515989, "epoch": 6216} {"train_loss": -28.096450805664062, "global_step": 515990, "epoch": 6216} {"train_loss": -27.395673751831055, "global_step": 515991, "epoch": 6216} {"train_loss": -27.490406036376953, "global_step": 515992, "epoch": 6216} {"train_loss": -27.78291130065918, "global_step": 515993, "epoch": 6216} {"train_loss": -27.63042640686035, "global_step": 515994, "epoch": 6216} {"train_loss": -28.116037368774414, "global_step": 515995, "epoch": 6216} {"train_loss": -27.837263107299805, "global_step": 515996, "epoch": 6216} {"train_loss": -27.688451766967773, "global_step": 515997, "epoch": 6216} {"train_loss": -27.728473663330078, "global_step": 515998, "epoch": 6216} {"train_loss": -27.758264541625977, "global_step": 515999, "epoch": 6216} {"train_loss": -27.647001266479492, "global_step": 516000, "epoch": 6216} {"train_loss": -27.467660903930664, "global_step": 516001, "epoch": 6216} {"train_loss": -27.420141220092773, "global_step": 516002, "epoch": 6216} {"train_loss": -27.8851261138916, "global_step": 516003, "epoch": 6216} {"train_loss": -27.913257598876953, "global_step": 516004, "epoch": 6216} {"train_loss": -27.383466720581055, "global_step": 516005, "epoch": 6216} {"train_loss": -26.794706344604492, "global_step": 516006, "epoch": 6216} {"train_loss": -26.502853393554688, "global_step": 516007, "epoch": 6216} {"train_loss": -26.190229415893555, "global_step": 516008, "epoch": 6216} {"train_loss": -25.82940673828125, "global_step": 516009, "epoch": 6216} {"train_loss": -27.278460284313525, "global_step": 516010, "epoch": 6216, "val_loss": 6637252.0} {"train_loss": -25.407184600830078, "global_step": 516011, "epoch": 6217} {"train_loss": -23.404754638671875, "global_step": 516012, "epoch": 6217} {"train_loss": -24.894155502319336, "global_step": 516013, "epoch": 6217} {"train_loss": -25.712787628173828, "global_step": 516014, "epoch": 6217} {"train_loss": -24.864126205444336, "global_step": 516015, "epoch": 6217} {"train_loss": -25.721332550048828, "global_step": 516016, "epoch": 6217} {"train_loss": -25.76041030883789, "global_step": 516017, "epoch": 6217} {"train_loss": -25.420169830322266, "global_step": 516018, "epoch": 6217} {"train_loss": -25.42575454711914, "global_step": 516019, "epoch": 6217} {"train_loss": -26.431594848632812, "global_step": 516020, "epoch": 6217} {"train_loss": -25.679895401000977, "global_step": 516021, "epoch": 6217} {"train_loss": -26.492877960205078, "global_step": 516022, "epoch": 6217} {"train_loss": -26.338953018188477, "global_step": 516023, "epoch": 6217} {"train_loss": -25.77044105529785, "global_step": 516024, "epoch": 6217} {"train_loss": -25.933523178100586, "global_step": 516025, "epoch": 6217} {"train_loss": -26.37898063659668, "global_step": 516026, "epoch": 6217} {"train_loss": -26.057300567626953, "global_step": 516027, "epoch": 6217} {"train_loss": -26.360559463500977, "global_step": 516028, "epoch": 6217} {"train_loss": -26.21656608581543, "global_step": 516029, "epoch": 6217} {"train_loss": -26.547571182250977, "global_step": 516030, "epoch": 6217} {"train_loss": -26.6415958404541, "global_step": 516031, "epoch": 6217} {"train_loss": -26.738367080688477, "global_step": 516032, "epoch": 6217} {"train_loss": -26.469867706298828, "global_step": 516033, "epoch": 6217} {"train_loss": -26.729089736938477, "global_step": 516034, "epoch": 6217} {"train_loss": -26.74321937561035, "global_step": 516035, "epoch": 6217} {"train_loss": -26.813573837280273, "global_step": 516036, "epoch": 6217} {"train_loss": -26.59517478942871, "global_step": 516037, "epoch": 6217} {"train_loss": -26.929975509643555, "global_step": 516038, "epoch": 6217} {"train_loss": -27.339710235595703, "global_step": 516039, "epoch": 6217} {"train_loss": -26.59006690979004, "global_step": 516040, "epoch": 6217} {"train_loss": -26.885889053344727, "global_step": 516041, "epoch": 6217} {"train_loss": -26.98956871032715, "global_step": 516042, "epoch": 6217} {"train_loss": -26.92640495300293, "global_step": 516043, "epoch": 6217} {"train_loss": -27.145252227783203, "global_step": 516044, "epoch": 6217} {"train_loss": -26.940967559814453, "global_step": 516045, "epoch": 6217} {"train_loss": -27.036914825439453, "global_step": 516046, "epoch": 6217} {"train_loss": -27.115524291992188, "global_step": 516047, "epoch": 6217} {"train_loss": -27.282190322875977, "global_step": 516048, "epoch": 6217} {"train_loss": -27.269824981689453, "global_step": 516049, "epoch": 6217} {"train_loss": -27.47139549255371, "global_step": 516050, "epoch": 6217} {"train_loss": -27.48992919921875, "global_step": 516051, "epoch": 6217} {"train_loss": -27.3706111907959, "global_step": 516052, "epoch": 6217} {"train_loss": -27.42014503479004, "global_step": 516053, "epoch": 6217} {"train_loss": -27.343891143798828, "global_step": 516054, "epoch": 6217} {"train_loss": -27.34235191345215, "global_step": 516055, "epoch": 6217} {"train_loss": -27.598358154296875, "global_step": 516056, "epoch": 6217} {"train_loss": -27.57807731628418, "global_step": 516057, "epoch": 6217} {"train_loss": -27.443195343017578, "global_step": 516058, "epoch": 6217} {"train_loss": -27.50140953063965, "global_step": 516059, "epoch": 6217} {"train_loss": -27.3416748046875, "global_step": 516060, "epoch": 6217} {"train_loss": -27.791248321533203, "global_step": 516061, "epoch": 6217} {"train_loss": -27.475473403930664, "global_step": 516062, "epoch": 6217} {"train_loss": -27.827747344970703, "global_step": 516063, "epoch": 6217} {"train_loss": -27.89118766784668, "global_step": 516064, "epoch": 6217} {"train_loss": -27.57575798034668, "global_step": 516065, "epoch": 6217} {"train_loss": -27.656742095947266, "global_step": 516066, "epoch": 6217} {"train_loss": -27.603107452392578, "global_step": 516067, "epoch": 6217} {"train_loss": -27.757535934448242, "global_step": 516068, "epoch": 6217} {"train_loss": -27.630294799804688, "global_step": 516069, "epoch": 6217} {"train_loss": -27.72894859313965, "global_step": 516070, "epoch": 6217} {"train_loss": -27.61338233947754, "global_step": 516071, "epoch": 6217} {"train_loss": -27.802509307861328, "global_step": 516072, "epoch": 6217} {"train_loss": -27.837268829345703, "global_step": 516073, "epoch": 6217} {"train_loss": -27.8460636138916, "global_step": 516074, "epoch": 6217} {"train_loss": -27.82013511657715, "global_step": 516075, "epoch": 6217} {"train_loss": -27.583444595336914, "global_step": 516076, "epoch": 6217} {"train_loss": -27.589841842651367, "global_step": 516077, "epoch": 6217} {"train_loss": -27.843297958374023, "global_step": 516078, "epoch": 6217} {"train_loss": -27.919721603393555, "global_step": 516079, "epoch": 6217} {"train_loss": -27.45423698425293, "global_step": 516080, "epoch": 6217} {"train_loss": -27.639942169189453, "global_step": 516081, "epoch": 6217} {"train_loss": -28.025711059570312, "global_step": 516082, "epoch": 6217} {"train_loss": -27.656875610351562, "global_step": 516083, "epoch": 6217} {"train_loss": -27.85654640197754, "global_step": 516084, "epoch": 6217} {"train_loss": -27.42987632751465, "global_step": 516085, "epoch": 6217} {"train_loss": -27.880512237548828, "global_step": 516086, "epoch": 6217} {"train_loss": -27.57940673828125, "global_step": 516087, "epoch": 6217} {"train_loss": -27.469385147094727, "global_step": 516088, "epoch": 6217} {"train_loss": -27.8005428314209, "global_step": 516089, "epoch": 6217} {"train_loss": -27.7702693939209, "global_step": 516090, "epoch": 6217} {"train_loss": -27.71844482421875, "global_step": 516091, "epoch": 6217} {"train_loss": -27.670602798461914, "global_step": 516092, "epoch": 6217} {"train_loss": -27.011034448462798, "global_step": 516093, "epoch": 6217, "val_loss": 6531448.0} {"train_loss": -27.30048179626465, "global_step": 516094, "epoch": 6218} {"train_loss": -26.646047592163086, "global_step": 516095, "epoch": 6218} {"train_loss": -24.360565185546875, "global_step": 516096, "epoch": 6218} {"train_loss": -23.939163208007812, "global_step": 516097, "epoch": 6218} {"train_loss": -25.27381706237793, "global_step": 516098, "epoch": 6218} {"train_loss": -26.882226943969727, "global_step": 516099, "epoch": 6218} {"train_loss": -25.92914390563965, "global_step": 516100, "epoch": 6218} {"train_loss": -26.675668716430664, "global_step": 516101, "epoch": 6218} {"train_loss": -27.143070220947266, "global_step": 516102, "epoch": 6218} {"train_loss": -26.233306884765625, "global_step": 516103, "epoch": 6218} {"train_loss": -26.52997398376465, "global_step": 516104, "epoch": 6218} {"train_loss": -26.737592697143555, "global_step": 516105, "epoch": 6218} {"train_loss": -26.63336181640625, "global_step": 516106, "epoch": 6218} {"train_loss": -27.131330490112305, "global_step": 516107, "epoch": 6218} {"train_loss": -26.964954376220703, "global_step": 516108, "epoch": 6218} {"train_loss": -26.551441192626953, "global_step": 516109, "epoch": 6218} {"train_loss": -27.004369735717773, "global_step": 516110, "epoch": 6218} {"train_loss": -26.55419921875, "global_step": 516111, "epoch": 6218} {"train_loss": -26.8804988861084, "global_step": 516112, "epoch": 6218} {"train_loss": -27.151813507080078, "global_step": 516113, "epoch": 6218} {"train_loss": -26.927581787109375, "global_step": 516114, "epoch": 6218} {"train_loss": -26.933576583862305, "global_step": 516115, "epoch": 6218} {"train_loss": -26.962982177734375, "global_step": 516116, "epoch": 6218} {"train_loss": -26.854772567749023, "global_step": 516117, "epoch": 6218} {"train_loss": -27.274383544921875, "global_step": 516118, "epoch": 6218} {"train_loss": -27.117191314697266, "global_step": 516119, "epoch": 6218} {"train_loss": -27.240259170532227, "global_step": 516120, "epoch": 6218} {"train_loss": -27.2890567779541, "global_step": 516121, "epoch": 6218} {"train_loss": -27.020404815673828, "global_step": 516122, "epoch": 6218} {"train_loss": -27.021432876586914, "global_step": 516123, "epoch": 6218} {"train_loss": -27.34547233581543, "global_step": 516124, "epoch": 6218} {"train_loss": -27.158262252807617, "global_step": 516125, "epoch": 6218} {"train_loss": -27.681766510009766, "global_step": 516126, "epoch": 6218} {"train_loss": -27.56459617614746, "global_step": 516127, "epoch": 6218} {"train_loss": -27.5389404296875, "global_step": 516128, "epoch": 6218} {"train_loss": -27.272724151611328, "global_step": 516129, "epoch": 6218} {"train_loss": -27.105947494506836, "global_step": 516130, "epoch": 6218} {"train_loss": -27.370336532592773, "global_step": 516131, "epoch": 6218} {"train_loss": -27.254369735717773, "global_step": 516132, "epoch": 6218} {"train_loss": -27.402265548706055, "global_step": 516133, "epoch": 6218} {"train_loss": -27.437671661376953, "global_step": 516134, "epoch": 6218} {"train_loss": -27.88762855529785, "global_step": 516135, "epoch": 6218} {"train_loss": -27.760419845581055, "global_step": 516136, "epoch": 6218} {"train_loss": -27.434051513671875, "global_step": 516137, "epoch": 6218} {"train_loss": -27.483951568603516, "global_step": 516138, "epoch": 6218} {"train_loss": -27.643659591674805, "global_step": 516139, "epoch": 6218} {"train_loss": -27.70062828063965, "global_step": 516140, "epoch": 6218} {"train_loss": -27.236358642578125, "global_step": 516141, "epoch": 6218} {"train_loss": -27.377038955688477, "global_step": 516142, "epoch": 6218} {"train_loss": -27.949649810791016, "global_step": 516143, "epoch": 6218} {"train_loss": -27.660186767578125, "global_step": 516144, "epoch": 6218} {"train_loss": -27.787260055541992, "global_step": 516145, "epoch": 6218} {"train_loss": -27.380451202392578, "global_step": 516146, "epoch": 6218} {"train_loss": -27.9313907623291, "global_step": 516147, "epoch": 6218} {"train_loss": -27.77459144592285, "global_step": 516148, "epoch": 6218} {"train_loss": -27.455169677734375, "global_step": 516149, "epoch": 6218} {"train_loss": -27.696638107299805, "global_step": 516150, "epoch": 6218} {"train_loss": -27.492399215698242, "global_step": 516151, "epoch": 6218} {"train_loss": -27.6938419342041, "global_step": 516152, "epoch": 6218} {"train_loss": -27.673843383789062, "global_step": 516153, "epoch": 6218} {"train_loss": -27.60833740234375, "global_step": 516154, "epoch": 6218} {"train_loss": -27.825855255126953, "global_step": 516155, "epoch": 6218} {"train_loss": -27.742969512939453, "global_step": 516156, "epoch": 6218} {"train_loss": -27.571563720703125, "global_step": 516157, "epoch": 6218} {"train_loss": -27.499433517456055, "global_step": 516158, "epoch": 6218} {"train_loss": -27.792367935180664, "global_step": 516159, "epoch": 6218} {"train_loss": -27.78120231628418, "global_step": 516160, "epoch": 6218} {"train_loss": -28.033435821533203, "global_step": 516161, "epoch": 6218} {"train_loss": -27.490314483642578, "global_step": 516162, "epoch": 6218} {"train_loss": -27.905847549438477, "global_step": 516163, "epoch": 6218} {"train_loss": -27.471866607666016, "global_step": 516164, "epoch": 6218} {"train_loss": -27.8194522857666, "global_step": 516165, "epoch": 6218} {"train_loss": -27.649463653564453, "global_step": 516166, "epoch": 6218} {"train_loss": -27.70075035095215, "global_step": 516167, "epoch": 6218} {"train_loss": -27.721099853515625, "global_step": 516168, "epoch": 6218} {"train_loss": -27.226871490478516, "global_step": 516169, "epoch": 6218} {"train_loss": -27.9520263671875, "global_step": 516170, "epoch": 6218} {"train_loss": -27.34685707092285, "global_step": 516171, "epoch": 6218} {"train_loss": -27.6274471282959, "global_step": 516172, "epoch": 6218} {"train_loss": -27.877222061157227, "global_step": 516173, "epoch": 6218} {"train_loss": -27.777917861938477, "global_step": 516174, "epoch": 6218} {"train_loss": -27.62746238708496, "global_step": 516175, "epoch": 6218} {"train_loss": -27.256684314773743, "global_step": 516176, "epoch": 6218, "val_loss": 6530868.5} {"train_loss": -26.906147003173828, "global_step": 516177, "epoch": 6219} {"train_loss": -26.598859786987305, "global_step": 516178, "epoch": 6219} {"train_loss": -26.3144474029541, "global_step": 516179, "epoch": 6219} {"train_loss": -26.0207462310791, "global_step": 516180, "epoch": 6219} {"train_loss": -26.16520118713379, "global_step": 516181, "epoch": 6219} {"train_loss": -26.8585262298584, "global_step": 516182, "epoch": 6219} {"train_loss": -25.791471481323242, "global_step": 516183, "epoch": 6219} {"train_loss": -27.051599502563477, "global_step": 516184, "epoch": 6219} {"train_loss": -26.86869239807129, "global_step": 516185, "epoch": 6219} {"train_loss": -26.471044540405273, "global_step": 516186, "epoch": 6219} {"train_loss": -27.06821632385254, "global_step": 516187, "epoch": 6219} {"train_loss": -26.559097290039062, "global_step": 516188, "epoch": 6219} {"train_loss": -26.444625854492188, "global_step": 516189, "epoch": 6219} {"train_loss": -26.88401222229004, "global_step": 516190, "epoch": 6219} {"train_loss": -26.243005752563477, "global_step": 516191, "epoch": 6219} {"train_loss": -27.166833877563477, "global_step": 516192, "epoch": 6219} {"train_loss": -26.712188720703125, "global_step": 516193, "epoch": 6219} {"train_loss": -27.11545753479004, "global_step": 516194, "epoch": 6219} {"train_loss": -26.866628646850586, "global_step": 516195, "epoch": 6219} {"train_loss": -27.348907470703125, "global_step": 516196, "epoch": 6219} {"train_loss": -27.269500732421875, "global_step": 516197, "epoch": 6219} {"train_loss": -27.119665145874023, "global_step": 516198, "epoch": 6219} {"train_loss": -26.8582706451416, "global_step": 516199, "epoch": 6219} {"train_loss": -27.34425163269043, "global_step": 516200, "epoch": 6219} {"train_loss": -27.224964141845703, "global_step": 516201, "epoch": 6219} {"train_loss": -27.303380966186523, "global_step": 516202, "epoch": 6219} {"train_loss": -27.59735107421875, "global_step": 516203, "epoch": 6219} {"train_loss": -27.373044967651367, "global_step": 516204, "epoch": 6219} {"train_loss": -27.29453468322754, "global_step": 516205, "epoch": 6219} {"train_loss": -27.195783615112305, "global_step": 516206, "epoch": 6219} {"train_loss": -27.416553497314453, "global_step": 516207, "epoch": 6219} {"train_loss": -27.870325088500977, "global_step": 516208, "epoch": 6219} {"train_loss": -27.529855728149414, "global_step": 516209, "epoch": 6219} {"train_loss": -27.248632431030273, "global_step": 516210, "epoch": 6219} {"train_loss": -27.73248291015625, "global_step": 516211, "epoch": 6219} {"train_loss": -27.477087020874023, "global_step": 516212, "epoch": 6219} {"train_loss": -27.45453453063965, "global_step": 516213, "epoch": 6219} {"train_loss": -27.590848922729492, "global_step": 516214, "epoch": 6219} {"train_loss": -27.618682861328125, "global_step": 516215, "epoch": 6219} {"train_loss": -27.455224990844727, "global_step": 516216, "epoch": 6219} {"train_loss": -27.656845092773438, "global_step": 516217, "epoch": 6219} {"train_loss": -27.500152587890625, "global_step": 516218, "epoch": 6219} {"train_loss": -27.71087646484375, "global_step": 516219, "epoch": 6219} {"train_loss": -27.88758659362793, "global_step": 516220, "epoch": 6219} {"train_loss": -27.563953399658203, "global_step": 516221, "epoch": 6219} {"train_loss": -27.63287353515625, "global_step": 516222, "epoch": 6219} {"train_loss": -27.6832218170166, "global_step": 516223, "epoch": 6219} {"train_loss": -27.35645866394043, "global_step": 516224, "epoch": 6219} {"train_loss": -27.915700912475586, "global_step": 516225, "epoch": 6219} {"train_loss": -27.183277130126953, "global_step": 516226, "epoch": 6219} {"train_loss": -27.561847686767578, "global_step": 516227, "epoch": 6219} {"train_loss": -27.740631103515625, "global_step": 516228, "epoch": 6219} {"train_loss": -27.663253784179688, "global_step": 516229, "epoch": 6219} {"train_loss": -27.65077781677246, "global_step": 516230, "epoch": 6219} {"train_loss": -27.686782836914062, "global_step": 516231, "epoch": 6219} {"train_loss": -27.746570587158203, "global_step": 516232, "epoch": 6219} {"train_loss": -27.911468505859375, "global_step": 516233, "epoch": 6219} {"train_loss": -27.983016967773438, "global_step": 516234, "epoch": 6219} {"train_loss": -27.849475860595703, "global_step": 516235, "epoch": 6219} {"train_loss": -27.947729110717773, "global_step": 516236, "epoch": 6219} {"train_loss": -27.789518356323242, "global_step": 516237, "epoch": 6219} {"train_loss": -27.776477813720703, "global_step": 516238, "epoch": 6219} {"train_loss": -27.620569229125977, "global_step": 516239, "epoch": 6219} {"train_loss": -27.97132682800293, "global_step": 516240, "epoch": 6219} {"train_loss": -27.939619064331055, "global_step": 516241, "epoch": 6219} {"train_loss": -27.495105743408203, "global_step": 516242, "epoch": 6219} {"train_loss": -27.80531120300293, "global_step": 516243, "epoch": 6219} {"train_loss": -27.722015380859375, "global_step": 516244, "epoch": 6219} {"train_loss": -27.51234245300293, "global_step": 516245, "epoch": 6219} {"train_loss": -27.6026668548584, "global_step": 516246, "epoch": 6219} {"train_loss": -27.41678810119629, "global_step": 516247, "epoch": 6219} {"train_loss": -27.49762535095215, "global_step": 516248, "epoch": 6219} {"train_loss": -27.01112174987793, "global_step": 516249, "epoch": 6219} {"train_loss": -26.377058029174805, "global_step": 516250, "epoch": 6219} {"train_loss": -26.1754150390625, "global_step": 516251, "epoch": 6219} {"train_loss": -26.946741104125977, "global_step": 516252, "epoch": 6219} {"train_loss": -26.2811222076416, "global_step": 516253, "epoch": 6219} {"train_loss": -26.968603134155273, "global_step": 516254, "epoch": 6219} {"train_loss": -26.63245964050293, "global_step": 516255, "epoch": 6219} {"train_loss": -26.478193283081055, "global_step": 516256, "epoch": 6219} {"train_loss": -27.141159057617188, "global_step": 516257, "epoch": 6219} {"train_loss": -26.64434242248535, "global_step": 516258, "epoch": 6219} {"train_loss": -27.253572004387177, "global_step": 516259, "epoch": 6219, "val_loss": 6626979.0} {"train_loss": -25.9274845123291, "global_step": 516260, "epoch": 6220} {"train_loss": -25.87873649597168, "global_step": 516261, "epoch": 6220} {"train_loss": -25.73518180847168, "global_step": 516262, "epoch": 6220} {"train_loss": -26.28995704650879, "global_step": 516263, "epoch": 6220} {"train_loss": -26.57076072692871, "global_step": 516264, "epoch": 6220} {"train_loss": -26.593952178955078, "global_step": 516265, "epoch": 6220} {"train_loss": -26.07659339904785, "global_step": 516266, "epoch": 6220} {"train_loss": -26.435962677001953, "global_step": 516267, "epoch": 6220} {"train_loss": -27.0517578125, "global_step": 516268, "epoch": 6220} {"train_loss": -26.819717407226562, "global_step": 516269, "epoch": 6220} {"train_loss": -26.92914390563965, "global_step": 516270, "epoch": 6220} {"train_loss": -26.677221298217773, "global_step": 516271, "epoch": 6220} {"train_loss": -27.01372718811035, "global_step": 516272, "epoch": 6220} {"train_loss": -27.135618209838867, "global_step": 516273, "epoch": 6220} {"train_loss": -26.796558380126953, "global_step": 516274, "epoch": 6220} {"train_loss": -27.083057403564453, "global_step": 516275, "epoch": 6220} {"train_loss": -26.76090431213379, "global_step": 516276, "epoch": 6220} {"train_loss": -26.755390167236328, "global_step": 516277, "epoch": 6220} {"train_loss": -26.732065200805664, "global_step": 516278, "epoch": 6220} {"train_loss": -27.1088809967041, "global_step": 516279, "epoch": 6220} {"train_loss": -27.062549591064453, "global_step": 516280, "epoch": 6220} {"train_loss": -27.235570907592773, "global_step": 516281, "epoch": 6220} {"train_loss": -27.000751495361328, "global_step": 516282, "epoch": 6220} {"train_loss": -27.065717697143555, "global_step": 516283, "epoch": 6220} {"train_loss": -27.013208389282227, "global_step": 516284, "epoch": 6220} {"train_loss": -27.106534957885742, "global_step": 516285, "epoch": 6220} {"train_loss": -27.139307022094727, "global_step": 516286, "epoch": 6220} {"train_loss": -27.429601669311523, "global_step": 516287, "epoch": 6220} {"train_loss": -27.602293014526367, "global_step": 516288, "epoch": 6220} {"train_loss": -27.576251983642578, "global_step": 516289, "epoch": 6220} {"train_loss": -27.499740600585938, "global_step": 516290, "epoch": 6220} {"train_loss": -27.474140167236328, "global_step": 516291, "epoch": 6220} {"train_loss": -27.413122177124023, "global_step": 516292, "epoch": 6220} {"train_loss": -27.619619369506836, "global_step": 516293, "epoch": 6220} {"train_loss": -27.50111198425293, "global_step": 516294, "epoch": 6220} {"train_loss": -27.72559928894043, "global_step": 516295, "epoch": 6220} {"train_loss": -27.601133346557617, "global_step": 516296, "epoch": 6220} {"train_loss": -27.660078048706055, "global_step": 516297, "epoch": 6220} {"train_loss": -27.62070083618164, "global_step": 516298, "epoch": 6220} {"train_loss": -27.766876220703125, "global_step": 516299, "epoch": 6220} {"train_loss": -27.6225643157959, "global_step": 516300, "epoch": 6220} {"train_loss": -27.806936264038086, "global_step": 516301, "epoch": 6220} {"train_loss": -27.67402458190918, "global_step": 516302, "epoch": 6220} {"train_loss": -27.483922958374023, "global_step": 516303, "epoch": 6220} {"train_loss": -27.728376388549805, "global_step": 516304, "epoch": 6220} {"train_loss": -27.7596492767334, "global_step": 516305, "epoch": 6220} {"train_loss": -27.535619735717773, "global_step": 516306, "epoch": 6220} {"train_loss": -27.64556884765625, "global_step": 516307, "epoch": 6220} {"train_loss": -27.688390731811523, "global_step": 516308, "epoch": 6220} {"train_loss": -27.66672706604004, "global_step": 516309, "epoch": 6220} {"train_loss": -27.464017868041992, "global_step": 516310, "epoch": 6220} {"train_loss": -27.403329849243164, "global_step": 516311, "epoch": 6220} {"train_loss": -27.691150665283203, "global_step": 516312, "epoch": 6220} {"train_loss": -27.769794464111328, "global_step": 516313, "epoch": 6220} {"train_loss": -27.629735946655273, "global_step": 516314, "epoch": 6220} {"train_loss": -27.8992919921875, "global_step": 516315, "epoch": 6220} {"train_loss": -27.892438888549805, "global_step": 516316, "epoch": 6220} {"train_loss": -27.54474449157715, "global_step": 516317, "epoch": 6220} {"train_loss": -27.48457145690918, "global_step": 516318, "epoch": 6220} {"train_loss": -27.791213989257812, "global_step": 516319, "epoch": 6220} {"train_loss": -27.480016708374023, "global_step": 516320, "epoch": 6220} {"train_loss": -27.765043258666992, "global_step": 516321, "epoch": 6220} {"train_loss": -27.4180908203125, "global_step": 516322, "epoch": 6220} {"train_loss": -27.512042999267578, "global_step": 516323, "epoch": 6220} {"train_loss": -27.93646240234375, "global_step": 516324, "epoch": 6220} {"train_loss": -27.70355224609375, "global_step": 516325, "epoch": 6220} {"train_loss": -27.655029296875, "global_step": 516326, "epoch": 6220} {"train_loss": -27.834598541259766, "global_step": 516327, "epoch": 6220} {"train_loss": -27.83608055114746, "global_step": 516328, "epoch": 6220} {"train_loss": -27.78278923034668, "global_step": 516329, "epoch": 6220} {"train_loss": -27.97466468811035, "global_step": 516330, "epoch": 6220} {"train_loss": -27.816314697265625, "global_step": 516331, "epoch": 6220} {"train_loss": -27.895374298095703, "global_step": 516332, "epoch": 6220} {"train_loss": -27.696598052978516, "global_step": 516333, "epoch": 6220} {"train_loss": -27.585290908813477, "global_step": 516334, "epoch": 6220} {"train_loss": -27.621261596679688, "global_step": 516335, "epoch": 6220} {"train_loss": -27.531986236572266, "global_step": 516336, "epoch": 6220} {"train_loss": -27.74127197265625, "global_step": 516337, "epoch": 6220} {"train_loss": -27.046283721923828, "global_step": 516338, "epoch": 6220} {"train_loss": -27.50119400024414, "global_step": 516339, "epoch": 6220} {"train_loss": -27.439035415649414, "global_step": 516340, "epoch": 6220} {"train_loss": -27.485370635986328, "global_step": 516341, "epoch": 6220} {"train_loss": -27.340989560966033, "global_step": 516342, "epoch": 6220, "val_loss": 6574258.0} {"train_loss": -26.683624267578125, "global_step": 516343, "epoch": 6221} {"train_loss": -26.517658233642578, "global_step": 516344, "epoch": 6221} {"train_loss": -25.886249542236328, "global_step": 516345, "epoch": 6221} {"train_loss": -26.29617691040039, "global_step": 516346, "epoch": 6221} {"train_loss": -26.051132202148438, "global_step": 516347, "epoch": 6221} {"train_loss": -26.4924373626709, "global_step": 516348, "epoch": 6221} {"train_loss": -27.0257568359375, "global_step": 516349, "epoch": 6221} {"train_loss": -26.696308135986328, "global_step": 516350, "epoch": 6221} {"train_loss": -27.079334259033203, "global_step": 516351, "epoch": 6221} {"train_loss": -27.32051658630371, "global_step": 516352, "epoch": 6221} {"train_loss": -26.799325942993164, "global_step": 516353, "epoch": 6221} {"train_loss": -27.134408950805664, "global_step": 516354, "epoch": 6221} {"train_loss": -27.201797485351562, "global_step": 516355, "epoch": 6221} {"train_loss": -26.86038589477539, "global_step": 516356, "epoch": 6221} {"train_loss": -27.076501846313477, "global_step": 516357, "epoch": 6221} {"train_loss": -26.689197540283203, "global_step": 516358, "epoch": 6221} {"train_loss": -26.584125518798828, "global_step": 516359, "epoch": 6221} {"train_loss": -27.099246978759766, "global_step": 516360, "epoch": 6221} {"train_loss": -26.799835205078125, "global_step": 516361, "epoch": 6221} {"train_loss": -27.073957443237305, "global_step": 516362, "epoch": 6221} {"train_loss": -27.066638946533203, "global_step": 516363, "epoch": 6221} {"train_loss": -27.1300106048584, "global_step": 516364, "epoch": 6221} {"train_loss": -27.076608657836914, "global_step": 516365, "epoch": 6221} {"train_loss": -27.47541618347168, "global_step": 516366, "epoch": 6221} {"train_loss": -27.299951553344727, "global_step": 516367, "epoch": 6221} {"train_loss": -26.924697875976562, "global_step": 516368, "epoch": 6221} {"train_loss": -27.2774600982666, "global_step": 516369, "epoch": 6221} {"train_loss": -27.1916446685791, "global_step": 516370, "epoch": 6221} {"train_loss": -26.739660263061523, "global_step": 516371, "epoch": 6221} {"train_loss": -27.084522247314453, "global_step": 516372, "epoch": 6221} {"train_loss": -27.1613826751709, "global_step": 516373, "epoch": 6221} {"train_loss": -27.192398071289062, "global_step": 516374, "epoch": 6221} {"train_loss": -27.25189781188965, "global_step": 516375, "epoch": 6221} {"train_loss": -27.121570587158203, "global_step": 516376, "epoch": 6221} {"train_loss": -27.170730590820312, "global_step": 516377, "epoch": 6221} {"train_loss": -27.283161163330078, "global_step": 516378, "epoch": 6221} {"train_loss": -27.217756271362305, "global_step": 516379, "epoch": 6221} {"train_loss": -27.361682891845703, "global_step": 516380, "epoch": 6221} {"train_loss": -27.69399070739746, "global_step": 516381, "epoch": 6221} {"train_loss": -27.005517959594727, "global_step": 516382, "epoch": 6221} {"train_loss": -27.524442672729492, "global_step": 516383, "epoch": 6221} {"train_loss": -27.185659408569336, "global_step": 516384, "epoch": 6221} {"train_loss": -27.19576072692871, "global_step": 516385, "epoch": 6221} {"train_loss": -27.367618560791016, "global_step": 516386, "epoch": 6221} {"train_loss": -27.416629791259766, "global_step": 516387, "epoch": 6221} {"train_loss": -27.443662643432617, "global_step": 516388, "epoch": 6221} {"train_loss": -27.573400497436523, "global_step": 516389, "epoch": 6221} {"train_loss": -27.75123405456543, "global_step": 516390, "epoch": 6221} {"train_loss": -27.857746124267578, "global_step": 516391, "epoch": 6221} {"train_loss": -27.452062606811523, "global_step": 516392, "epoch": 6221} {"train_loss": -27.823429107666016, "global_step": 516393, "epoch": 6221} {"train_loss": -27.814966201782227, "global_step": 516394, "epoch": 6221} {"train_loss": -27.859699249267578, "global_step": 516395, "epoch": 6221} {"train_loss": -28.011930465698242, "global_step": 516396, "epoch": 6221} {"train_loss": -27.546649932861328, "global_step": 516397, "epoch": 6221} {"train_loss": -27.735767364501953, "global_step": 516398, "epoch": 6221} {"train_loss": -28.022186279296875, "global_step": 516399, "epoch": 6221} {"train_loss": -27.60181999206543, "global_step": 516400, "epoch": 6221} {"train_loss": -27.33992576599121, "global_step": 516401, "epoch": 6221} {"train_loss": -27.179590225219727, "global_step": 516402, "epoch": 6221} {"train_loss": -27.408872604370117, "global_step": 516403, "epoch": 6221} {"train_loss": -27.692066192626953, "global_step": 516404, "epoch": 6221} {"train_loss": -27.67144203186035, "global_step": 516405, "epoch": 6221} {"train_loss": -27.582183837890625, "global_step": 516406, "epoch": 6221} {"train_loss": -27.126575469970703, "global_step": 516407, "epoch": 6221} {"train_loss": -27.140180587768555, "global_step": 516408, "epoch": 6221} {"train_loss": -27.048736572265625, "global_step": 516409, "epoch": 6221} {"train_loss": -27.060928344726562, "global_step": 516410, "epoch": 6221} {"train_loss": -27.727783203125, "global_step": 516411, "epoch": 6221} {"train_loss": -27.260574340820312, "global_step": 516412, "epoch": 6221} {"train_loss": -27.780670166015625, "global_step": 516413, "epoch": 6221} {"train_loss": -27.30255126953125, "global_step": 516414, "epoch": 6221} {"train_loss": -27.245925903320312, "global_step": 516415, "epoch": 6221} {"train_loss": -27.838834762573242, "global_step": 516416, "epoch": 6221} {"train_loss": -27.277877807617188, "global_step": 516417, "epoch": 6221} {"train_loss": -27.73270606994629, "global_step": 516418, "epoch": 6221} {"train_loss": -27.935842514038086, "global_step": 516419, "epoch": 6221} {"train_loss": -27.368640899658203, "global_step": 516420, "epoch": 6221} {"train_loss": -27.301069259643555, "global_step": 516421, "epoch": 6221} {"train_loss": -27.769575119018555, "global_step": 516422, "epoch": 6221} {"train_loss": -27.373849868774414, "global_step": 516423, "epoch": 6221} {"train_loss": -27.564929962158203, "global_step": 516424, "epoch": 6221} {"train_loss": -27.273314947105316, "global_step": 516425, "epoch": 6221, "val_loss": 6542531.0} {"train_loss": -26.892187118530273, "global_step": 516426, "epoch": 6222} {"train_loss": -27.072874069213867, "global_step": 516427, "epoch": 6222} {"train_loss": -27.93646812438965, "global_step": 516428, "epoch": 6222} {"train_loss": -27.344831466674805, "global_step": 516429, "epoch": 6222} {"train_loss": -27.046598434448242, "global_step": 516430, "epoch": 6222} {"train_loss": -27.1705379486084, "global_step": 516431, "epoch": 6222} {"train_loss": -27.27851676940918, "global_step": 516432, "epoch": 6222} {"train_loss": -27.178823471069336, "global_step": 516433, "epoch": 6222} {"train_loss": -27.131147384643555, "global_step": 516434, "epoch": 6222} {"train_loss": -27.177261352539062, "global_step": 516435, "epoch": 6222} {"train_loss": -27.24268913269043, "global_step": 516436, "epoch": 6222} {"train_loss": -27.387115478515625, "global_step": 516437, "epoch": 6222} {"train_loss": -27.3387393951416, "global_step": 516438, "epoch": 6222} {"train_loss": -27.416845321655273, "global_step": 516439, "epoch": 6222} {"train_loss": -27.2498722076416, "global_step": 516440, "epoch": 6222} {"train_loss": -27.327436447143555, "global_step": 516441, "epoch": 6222} {"train_loss": -27.468870162963867, "global_step": 516442, "epoch": 6222} {"train_loss": -26.9127140045166, "global_step": 516443, "epoch": 6222} {"train_loss": -27.161945343017578, "global_step": 516444, "epoch": 6222} {"train_loss": -27.869110107421875, "global_step": 516445, "epoch": 6222} {"train_loss": -27.27729606628418, "global_step": 516446, "epoch": 6222} {"train_loss": -27.293842315673828, "global_step": 516447, "epoch": 6222} {"train_loss": -27.46367835998535, "global_step": 516448, "epoch": 6222} {"train_loss": -27.45882225036621, "global_step": 516449, "epoch": 6222} {"train_loss": -27.195993423461914, "global_step": 516450, "epoch": 6222} {"train_loss": -27.17351722717285, "global_step": 516451, "epoch": 6222} {"train_loss": -27.831357955932617, "global_step": 516452, "epoch": 6222} {"train_loss": -27.67573356628418, "global_step": 516453, "epoch": 6222} {"train_loss": -27.4814453125, "global_step": 516454, "epoch": 6222} {"train_loss": -27.2161922454834, "global_step": 516455, "epoch": 6222} {"train_loss": -27.276779174804688, "global_step": 516456, "epoch": 6222} {"train_loss": -27.449560165405273, "global_step": 516457, "epoch": 6222} {"train_loss": -27.470029830932617, "global_step": 516458, "epoch": 6222} {"train_loss": -27.309228897094727, "global_step": 516459, "epoch": 6222} {"train_loss": -27.611907958984375, "global_step": 516460, "epoch": 6222} {"train_loss": -27.881561279296875, "global_step": 516461, "epoch": 6222} {"train_loss": -27.90201759338379, "global_step": 516462, "epoch": 6222} {"train_loss": -27.5384521484375, "global_step": 516463, "epoch": 6222} {"train_loss": -27.50861930847168, "global_step": 516464, "epoch": 6222} {"train_loss": -27.815643310546875, "global_step": 516465, "epoch": 6222} {"train_loss": -27.31751823425293, "global_step": 516466, "epoch": 6222} {"train_loss": -27.85062599182129, "global_step": 516467, "epoch": 6222} {"train_loss": -27.80999183654785, "global_step": 516468, "epoch": 6222} {"train_loss": -27.48713493347168, "global_step": 516469, "epoch": 6222} {"train_loss": -27.5404109954834, "global_step": 516470, "epoch": 6222} {"train_loss": -27.637006759643555, "global_step": 516471, "epoch": 6222} {"train_loss": -28.00530433654785, "global_step": 516472, "epoch": 6222} {"train_loss": -27.81715202331543, "global_step": 516473, "epoch": 6222} {"train_loss": -27.24152183532715, "global_step": 516474, "epoch": 6222} {"train_loss": -27.659332275390625, "global_step": 516475, "epoch": 6222} {"train_loss": -27.73551368713379, "global_step": 516476, "epoch": 6222} {"train_loss": -27.639270782470703, "global_step": 516477, "epoch": 6222} {"train_loss": -27.08377456665039, "global_step": 516478, "epoch": 6222} {"train_loss": -27.45429801940918, "global_step": 516479, "epoch": 6222} {"train_loss": -27.611371994018555, "global_step": 516480, "epoch": 6222} {"train_loss": -27.60395622253418, "global_step": 516481, "epoch": 6222} {"train_loss": -27.393335342407227, "global_step": 516482, "epoch": 6222} {"train_loss": -27.34193992614746, "global_step": 516483, "epoch": 6222} {"train_loss": -27.66145133972168, "global_step": 516484, "epoch": 6222} {"train_loss": -27.553730010986328, "global_step": 516485, "epoch": 6222} {"train_loss": -27.4290771484375, "global_step": 516486, "epoch": 6222} {"train_loss": -27.510839462280273, "global_step": 516487, "epoch": 6222} {"train_loss": -27.437543869018555, "global_step": 516488, "epoch": 6222} {"train_loss": -27.2650146484375, "global_step": 516489, "epoch": 6222} {"train_loss": -27.274351119995117, "global_step": 516490, "epoch": 6222} {"train_loss": -27.505537033081055, "global_step": 516491, "epoch": 6222} {"train_loss": -27.31928062438965, "global_step": 516492, "epoch": 6222} {"train_loss": -27.422346115112305, "global_step": 516493, "epoch": 6222} {"train_loss": -27.757612228393555, "global_step": 516494, "epoch": 6222} {"train_loss": -27.331634521484375, "global_step": 516495, "epoch": 6222} {"train_loss": -28.062305450439453, "global_step": 516496, "epoch": 6222} {"train_loss": -27.373336791992188, "global_step": 516497, "epoch": 6222} {"train_loss": -27.6286563873291, "global_step": 516498, "epoch": 6222} {"train_loss": -27.444644927978516, "global_step": 516499, "epoch": 6222} {"train_loss": -27.576263427734375, "global_step": 516500, "epoch": 6222} {"train_loss": -27.3604793548584, "global_step": 516501, "epoch": 6222} {"train_loss": -27.691455841064453, "global_step": 516502, "epoch": 6222} {"train_loss": -27.325387954711914, "global_step": 516503, "epoch": 6222} {"train_loss": -27.943805694580078, "global_step": 516504, "epoch": 6222} {"train_loss": -27.675504684448242, "global_step": 516505, "epoch": 6222} {"train_loss": -27.845504760742188, "global_step": 516506, "epoch": 6222} {"train_loss": -27.296606063842773, "global_step": 516507, "epoch": 6222} {"train_loss": -27.4904928552099, "global_step": 516508, "epoch": 6222, "val_loss": 6576146.0} {"train_loss": -26.971481323242188, "global_step": 516509, "epoch": 6223} {"train_loss": -26.814245223999023, "global_step": 516510, "epoch": 6223} {"train_loss": -27.52081871032715, "global_step": 516511, "epoch": 6223} {"train_loss": -26.927637100219727, "global_step": 516512, "epoch": 6223} {"train_loss": -27.374317169189453, "global_step": 516513, "epoch": 6223} {"train_loss": -26.74517250061035, "global_step": 516514, "epoch": 6223} {"train_loss": -27.54719352722168, "global_step": 516515, "epoch": 6223} {"train_loss": -27.19801139831543, "global_step": 516516, "epoch": 6223} {"train_loss": -27.30470085144043, "global_step": 516517, "epoch": 6223} {"train_loss": -26.876956939697266, "global_step": 516518, "epoch": 6223} {"train_loss": -26.757551193237305, "global_step": 516519, "epoch": 6223} {"train_loss": -26.492822647094727, "global_step": 516520, "epoch": 6223} {"train_loss": -26.652624130249023, "global_step": 516521, "epoch": 6223} {"train_loss": -27.357696533203125, "global_step": 516522, "epoch": 6223} {"train_loss": -26.55232048034668, "global_step": 516523, "epoch": 6223} {"train_loss": -27.332433700561523, "global_step": 516524, "epoch": 6223} {"train_loss": -27.079797744750977, "global_step": 516525, "epoch": 6223} {"train_loss": -26.81623649597168, "global_step": 516526, "epoch": 6223} {"train_loss": -27.5614013671875, "global_step": 516527, "epoch": 6223} {"train_loss": -26.838266372680664, "global_step": 516528, "epoch": 6223} {"train_loss": -27.20682716369629, "global_step": 516529, "epoch": 6223} {"train_loss": -27.170063018798828, "global_step": 516530, "epoch": 6223} {"train_loss": -27.286651611328125, "global_step": 516531, "epoch": 6223} {"train_loss": -27.37709617614746, "global_step": 516532, "epoch": 6223} {"train_loss": -27.598596572875977, "global_step": 516533, "epoch": 6223} {"train_loss": -27.17999267578125, "global_step": 516534, "epoch": 6223} {"train_loss": -27.506839752197266, "global_step": 516535, "epoch": 6223} {"train_loss": -27.6497802734375, "global_step": 516536, "epoch": 6223} {"train_loss": -27.560510635375977, "global_step": 516537, "epoch": 6223} {"train_loss": -27.85420036315918, "global_step": 516538, "epoch": 6223} {"train_loss": -27.191333770751953, "global_step": 516539, "epoch": 6223} {"train_loss": -27.766748428344727, "global_step": 516540, "epoch": 6223} {"train_loss": -27.28289794921875, "global_step": 516541, "epoch": 6223} {"train_loss": -27.528127670288086, "global_step": 516542, "epoch": 6223} {"train_loss": -27.040802001953125, "global_step": 516543, "epoch": 6223} {"train_loss": -27.656885147094727, "global_step": 516544, "epoch": 6223} {"train_loss": -27.6956729888916, "global_step": 516545, "epoch": 6223} {"train_loss": -27.7932071685791, "global_step": 516546, "epoch": 6223} {"train_loss": -27.541961669921875, "global_step": 516547, "epoch": 6223} {"train_loss": -27.5014705657959, "global_step": 516548, "epoch": 6223} {"train_loss": -27.509429931640625, "global_step": 516549, "epoch": 6223} {"train_loss": -27.731964111328125, "global_step": 516550, "epoch": 6223} {"train_loss": -27.364715576171875, "global_step": 516551, "epoch": 6223} {"train_loss": -27.456510543823242, "global_step": 516552, "epoch": 6223} {"train_loss": -27.1568546295166, "global_step": 516553, "epoch": 6223} {"train_loss": -27.55093765258789, "global_step": 516554, "epoch": 6223} {"train_loss": -27.547082901000977, "global_step": 516555, "epoch": 6223} {"train_loss": -27.509479522705078, "global_step": 516556, "epoch": 6223} {"train_loss": -27.89034080505371, "global_step": 516557, "epoch": 6223} {"train_loss": -27.588953018188477, "global_step": 516558, "epoch": 6223} {"train_loss": -27.457672119140625, "global_step": 516559, "epoch": 6223} {"train_loss": -27.517663955688477, "global_step": 516560, "epoch": 6223} {"train_loss": -27.71005630493164, "global_step": 516561, "epoch": 6223} {"train_loss": -27.37664794921875, "global_step": 516562, "epoch": 6223} {"train_loss": -27.23175621032715, "global_step": 516563, "epoch": 6223} {"train_loss": -27.519872665405273, "global_step": 516564, "epoch": 6223} {"train_loss": -27.74946403503418, "global_step": 516565, "epoch": 6223} {"train_loss": -27.440038681030273, "global_step": 516566, "epoch": 6223} {"train_loss": -27.75680923461914, "global_step": 516567, "epoch": 6223} {"train_loss": -27.80389404296875, "global_step": 516568, "epoch": 6223} {"train_loss": -27.73202896118164, "global_step": 516569, "epoch": 6223} {"train_loss": -27.63056755065918, "global_step": 516570, "epoch": 6223} {"train_loss": -27.958255767822266, "global_step": 516571, "epoch": 6223} {"train_loss": -27.5826416015625, "global_step": 516572, "epoch": 6223} {"train_loss": -27.64169692993164, "global_step": 516573, "epoch": 6223} {"train_loss": -27.678735733032227, "global_step": 516574, "epoch": 6223} {"train_loss": -27.43055534362793, "global_step": 516575, "epoch": 6223} {"train_loss": -27.485427856445312, "global_step": 516576, "epoch": 6223} {"train_loss": -27.621912002563477, "global_step": 516577, "epoch": 6223} {"train_loss": -27.00306510925293, "global_step": 516578, "epoch": 6223} {"train_loss": -27.22144889831543, "global_step": 516579, "epoch": 6223} {"train_loss": -27.324811935424805, "global_step": 516580, "epoch": 6223} {"train_loss": -27.2695255279541, "global_step": 516581, "epoch": 6223} {"train_loss": -27.209686279296875, "global_step": 516582, "epoch": 6223} {"train_loss": -27.4538631439209, "global_step": 516583, "epoch": 6223} {"train_loss": -27.406545639038086, "global_step": 516584, "epoch": 6223} {"train_loss": -27.550235748291016, "global_step": 516585, "epoch": 6223} {"train_loss": -27.646820068359375, "global_step": 516586, "epoch": 6223} {"train_loss": -27.823516845703125, "global_step": 516587, "epoch": 6223} {"train_loss": -27.111291885375977, "global_step": 516588, "epoch": 6223} {"train_loss": -27.29666519165039, "global_step": 516589, "epoch": 6223} {"train_loss": -27.21478271484375, "global_step": 516590, "epoch": 6223} {"train_loss": -27.376923067023956, "global_step": 516591, "epoch": 6223, "val_loss": 6589697.0} {"train_loss": -26.609643936157227, "global_step": 516592, "epoch": 6224} {"train_loss": -27.262939453125, "global_step": 516593, "epoch": 6224} {"train_loss": -26.7691593170166, "global_step": 516594, "epoch": 6224} {"train_loss": -27.02327537536621, "global_step": 516595, "epoch": 6224} {"train_loss": -27.1923828125, "global_step": 516596, "epoch": 6224} {"train_loss": -26.974201202392578, "global_step": 516597, "epoch": 6224} {"train_loss": -26.963552474975586, "global_step": 516598, "epoch": 6224} {"train_loss": -26.854848861694336, "global_step": 516599, "epoch": 6224} {"train_loss": -26.82049560546875, "global_step": 516600, "epoch": 6224} {"train_loss": -27.583953857421875, "global_step": 516601, "epoch": 6224} {"train_loss": -26.8872127532959, "global_step": 516602, "epoch": 6224} {"train_loss": -27.46607780456543, "global_step": 516603, "epoch": 6224} {"train_loss": -27.200597763061523, "global_step": 516604, "epoch": 6224} {"train_loss": -27.373157501220703, "global_step": 516605, "epoch": 6224} {"train_loss": -27.14215660095215, "global_step": 516606, "epoch": 6224} {"train_loss": -27.285043716430664, "global_step": 516607, "epoch": 6224} {"train_loss": -27.457229614257812, "global_step": 516608, "epoch": 6224} {"train_loss": -27.366058349609375, "global_step": 516609, "epoch": 6224} {"train_loss": -27.387144088745117, "global_step": 516610, "epoch": 6224} {"train_loss": -27.7542724609375, "global_step": 516611, "epoch": 6224} {"train_loss": -27.13943862915039, "global_step": 516612, "epoch": 6224} {"train_loss": -27.94538688659668, "global_step": 516613, "epoch": 6224} {"train_loss": -27.48223304748535, "global_step": 516614, "epoch": 6224} {"train_loss": -27.664783477783203, "global_step": 516615, "epoch": 6224} {"train_loss": -27.36219596862793, "global_step": 516616, "epoch": 6224} {"train_loss": -27.52497673034668, "global_step": 516617, "epoch": 6224} {"train_loss": -27.309118270874023, "global_step": 516618, "epoch": 6224} {"train_loss": -27.47216796875, "global_step": 516619, "epoch": 6224} {"train_loss": -27.68716812133789, "global_step": 516620, "epoch": 6224} {"train_loss": -27.889480590820312, "global_step": 516621, "epoch": 6224} {"train_loss": -27.099645614624023, "global_step": 516622, "epoch": 6224} {"train_loss": -27.802520751953125, "global_step": 516623, "epoch": 6224} {"train_loss": -27.469959259033203, "global_step": 516624, "epoch": 6224} {"train_loss": -27.64467430114746, "global_step": 516625, "epoch": 6224} {"train_loss": -27.54924964904785, "global_step": 516626, "epoch": 6224} {"train_loss": -27.642749786376953, "global_step": 516627, "epoch": 6224} {"train_loss": -27.428091049194336, "global_step": 516628, "epoch": 6224} {"train_loss": -27.492841720581055, "global_step": 516629, "epoch": 6224} {"train_loss": -27.2490291595459, "global_step": 516630, "epoch": 6224} {"train_loss": -27.410123825073242, "global_step": 516631, "epoch": 6224} {"train_loss": -27.818500518798828, "global_step": 516632, "epoch": 6224} {"train_loss": -27.71991539001465, "global_step": 516633, "epoch": 6224} {"train_loss": -27.621509552001953, "global_step": 516634, "epoch": 6224} {"train_loss": -27.725988388061523, "global_step": 516635, "epoch": 6224} {"train_loss": -27.542367935180664, "global_step": 516636, "epoch": 6224} {"train_loss": -27.573392868041992, "global_step": 516637, "epoch": 6224} {"train_loss": -27.340473175048828, "global_step": 516638, "epoch": 6224} {"train_loss": -27.819091796875, "global_step": 516639, "epoch": 6224} {"train_loss": -27.56911277770996, "global_step": 516640, "epoch": 6224} {"train_loss": -28.023120880126953, "global_step": 516641, "epoch": 6224} {"train_loss": -27.8291072845459, "global_step": 516642, "epoch": 6224} {"train_loss": -27.836416244506836, "global_step": 516643, "epoch": 6224} {"train_loss": -27.681684494018555, "global_step": 516644, "epoch": 6224} {"train_loss": -27.92401695251465, "global_step": 516645, "epoch": 6224} {"train_loss": -27.979578018188477, "global_step": 516646, "epoch": 6224} {"train_loss": -27.704015731811523, "global_step": 516647, "epoch": 6224} {"train_loss": -27.502704620361328, "global_step": 516648, "epoch": 6224} {"train_loss": -27.494415283203125, "global_step": 516649, "epoch": 6224} {"train_loss": -27.420074462890625, "global_step": 516650, "epoch": 6224} {"train_loss": -27.653945922851562, "global_step": 516651, "epoch": 6224} {"train_loss": -27.756855010986328, "global_step": 516652, "epoch": 6224} {"train_loss": -27.520782470703125, "global_step": 516653, "epoch": 6224} {"train_loss": -27.313739776611328, "global_step": 516654, "epoch": 6224} {"train_loss": -27.838459014892578, "global_step": 516655, "epoch": 6224} {"train_loss": -27.395980834960938, "global_step": 516656, "epoch": 6224} {"train_loss": -27.81431007385254, "global_step": 516657, "epoch": 6224} {"train_loss": -27.26917839050293, "global_step": 516658, "epoch": 6224} {"train_loss": -27.288084030151367, "global_step": 516659, "epoch": 6224} {"train_loss": -27.158918380737305, "global_step": 516660, "epoch": 6224} {"train_loss": -27.001819610595703, "global_step": 516661, "epoch": 6224} {"train_loss": -27.09492301940918, "global_step": 516662, "epoch": 6224} {"train_loss": -27.32696533203125, "global_step": 516663, "epoch": 6224} {"train_loss": -27.232873916625977, "global_step": 516664, "epoch": 6224} {"train_loss": -27.35150146484375, "global_step": 516665, "epoch": 6224} {"train_loss": -27.40467643737793, "global_step": 516666, "epoch": 6224} {"train_loss": -27.203449249267578, "global_step": 516667, "epoch": 6224} {"train_loss": -27.415576934814453, "global_step": 516668, "epoch": 6224} {"train_loss": -27.553485870361328, "global_step": 516669, "epoch": 6224} {"train_loss": -27.492919921875, "global_step": 516670, "epoch": 6224} {"train_loss": -27.334278106689453, "global_step": 516671, "epoch": 6224} {"train_loss": -27.68460464477539, "global_step": 516672, "epoch": 6224} {"train_loss": -27.117813110351562, "global_step": 516673, "epoch": 6224} {"train_loss": -27.45728141141225, "global_step": 516674, "epoch": 6224, "val_loss": 6664878.5} {"train_loss": -27.313800811767578, "global_step": 516675, "epoch": 6225} {"train_loss": -26.70387077331543, "global_step": 516676, "epoch": 6225} {"train_loss": -27.193134307861328, "global_step": 516677, "epoch": 6225} {"train_loss": -27.040502548217773, "global_step": 516678, "epoch": 6225} {"train_loss": -27.2570858001709, "global_step": 516679, "epoch": 6225} {"train_loss": -27.4888858795166, "global_step": 516680, "epoch": 6225} {"train_loss": -26.889678955078125, "global_step": 516681, "epoch": 6225} {"train_loss": -27.26321792602539, "global_step": 516682, "epoch": 6225} {"train_loss": -27.487152099609375, "global_step": 516683, "epoch": 6225} {"train_loss": -27.160058975219727, "global_step": 516684, "epoch": 6225} {"train_loss": -27.248565673828125, "global_step": 516685, "epoch": 6225} {"train_loss": -27.461034774780273, "global_step": 516686, "epoch": 6225} {"train_loss": -27.256933212280273, "global_step": 516687, "epoch": 6225} {"train_loss": -27.608051300048828, "global_step": 516688, "epoch": 6225} {"train_loss": -27.341449737548828, "global_step": 516689, "epoch": 6225} {"train_loss": -27.472742080688477, "global_step": 516690, "epoch": 6225} {"train_loss": -27.769184112548828, "global_step": 516691, "epoch": 6225} {"train_loss": -27.354074478149414, "global_step": 516692, "epoch": 6225} {"train_loss": -27.470529556274414, "global_step": 516693, "epoch": 6225} {"train_loss": -27.708566665649414, "global_step": 516694, "epoch": 6225} {"train_loss": -27.952314376831055, "global_step": 516695, "epoch": 6225} {"train_loss": -27.38637351989746, "global_step": 516696, "epoch": 6225} {"train_loss": -27.220434188842773, "global_step": 516697, "epoch": 6225} {"train_loss": -27.520633697509766, "global_step": 516698, "epoch": 6225} {"train_loss": -27.390295028686523, "global_step": 516699, "epoch": 6225} {"train_loss": -27.691747665405273, "global_step": 516700, "epoch": 6225} {"train_loss": -27.575952529907227, "global_step": 516701, "epoch": 6225} {"train_loss": -27.6798095703125, "global_step": 516702, "epoch": 6225} {"train_loss": -27.523618698120117, "global_step": 516703, "epoch": 6225} {"train_loss": -27.1599063873291, "global_step": 516704, "epoch": 6225} {"train_loss": -27.1798095703125, "global_step": 516705, "epoch": 6225} {"train_loss": -27.571582794189453, "global_step": 516706, "epoch": 6225} {"train_loss": -27.246469497680664, "global_step": 516707, "epoch": 6225} {"train_loss": -27.956750869750977, "global_step": 516708, "epoch": 6225} {"train_loss": -27.845417022705078, "global_step": 516709, "epoch": 6225} {"train_loss": -27.657901763916016, "global_step": 516710, "epoch": 6225} {"train_loss": -27.624982833862305, "global_step": 516711, "epoch": 6225} {"train_loss": -27.23029136657715, "global_step": 516712, "epoch": 6225} {"train_loss": -27.47489356994629, "global_step": 516713, "epoch": 6225} {"train_loss": -28.028152465820312, "global_step": 516714, "epoch": 6225} {"train_loss": -27.653051376342773, "global_step": 516715, "epoch": 6225} {"train_loss": -27.68424415588379, "global_step": 516716, "epoch": 6225} {"train_loss": -27.878171920776367, "global_step": 516717, "epoch": 6225} {"train_loss": -27.4274959564209, "global_step": 516718, "epoch": 6225} {"train_loss": -27.56268882751465, "global_step": 516719, "epoch": 6225} {"train_loss": -27.91632652282715, "global_step": 516720, "epoch": 6225} {"train_loss": -28.125736236572266, "global_step": 516721, "epoch": 6225} {"train_loss": -27.551977157592773, "global_step": 516722, "epoch": 6225} {"train_loss": -27.61004638671875, "global_step": 516723, "epoch": 6225} {"train_loss": -27.26096534729004, "global_step": 516724, "epoch": 6225} {"train_loss": -27.541669845581055, "global_step": 516725, "epoch": 6225} {"train_loss": -27.817304611206055, "global_step": 516726, "epoch": 6225} {"train_loss": -27.714969635009766, "global_step": 516727, "epoch": 6225} {"train_loss": -28.07815933227539, "global_step": 516728, "epoch": 6225} {"train_loss": -27.461181640625, "global_step": 516729, "epoch": 6225} {"train_loss": -27.455495834350586, "global_step": 516730, "epoch": 6225} {"train_loss": -27.66925048828125, "global_step": 516731, "epoch": 6225} {"train_loss": -27.467029571533203, "global_step": 516732, "epoch": 6225} {"train_loss": -27.72572135925293, "global_step": 516733, "epoch": 6225} {"train_loss": -27.604047775268555, "global_step": 516734, "epoch": 6225} {"train_loss": -27.62076759338379, "global_step": 516735, "epoch": 6225} {"train_loss": -27.424652099609375, "global_step": 516736, "epoch": 6225} {"train_loss": -27.32568359375, "global_step": 516737, "epoch": 6225} {"train_loss": -27.21648597717285, "global_step": 516738, "epoch": 6225} {"train_loss": -26.95008659362793, "global_step": 516739, "epoch": 6225} {"train_loss": -27.828662872314453, "global_step": 516740, "epoch": 6225} {"train_loss": -27.08783531188965, "global_step": 516741, "epoch": 6225} {"train_loss": -26.33677101135254, "global_step": 516742, "epoch": 6225} {"train_loss": -26.97110366821289, "global_step": 516743, "epoch": 6225} {"train_loss": -27.56696128845215, "global_step": 516744, "epoch": 6225} {"train_loss": -27.093366622924805, "global_step": 516745, "epoch": 6225} {"train_loss": -27.35797691345215, "global_step": 516746, "epoch": 6225} {"train_loss": -27.062732696533203, "global_step": 516747, "epoch": 6225} {"train_loss": -27.38233757019043, "global_step": 516748, "epoch": 6225} {"train_loss": -27.313146591186523, "global_step": 516749, "epoch": 6225} {"train_loss": -27.3335018157959, "global_step": 516750, "epoch": 6225} {"train_loss": -27.513824462890625, "global_step": 516751, "epoch": 6225} {"train_loss": -27.69024085998535, "global_step": 516752, "epoch": 6225} {"train_loss": -27.52371597290039, "global_step": 516753, "epoch": 6225} {"train_loss": -27.678110122680664, "global_step": 516754, "epoch": 6225} {"train_loss": -27.241262435913086, "global_step": 516755, "epoch": 6225} {"train_loss": -27.644824981689453, "global_step": 516756, "epoch": 6225} {"train_loss": -27.446863473179828, "global_step": 516757, "epoch": 6225, "val_loss": 6662179.5} {"train_loss": -27.4290771484375, "global_step": 516758, "epoch": 6226} {"train_loss": -26.827136993408203, "global_step": 516759, "epoch": 6226} {"train_loss": -26.469228744506836, "global_step": 516760, "epoch": 6226} {"train_loss": -26.39396095275879, "global_step": 516761, "epoch": 6226} {"train_loss": -26.79913330078125, "global_step": 516762, "epoch": 6226} {"train_loss": -27.6430721282959, "global_step": 516763, "epoch": 6226} {"train_loss": -27.085861206054688, "global_step": 516764, "epoch": 6226} {"train_loss": -27.11002540588379, "global_step": 516765, "epoch": 6226} {"train_loss": -27.150293350219727, "global_step": 516766, "epoch": 6226} {"train_loss": -27.2878475189209, "global_step": 516767, "epoch": 6226} {"train_loss": -27.181364059448242, "global_step": 516768, "epoch": 6226} {"train_loss": -26.89863395690918, "global_step": 516769, "epoch": 6226} {"train_loss": -27.467931747436523, "global_step": 516770, "epoch": 6226} {"train_loss": -27.55475425720215, "global_step": 516771, "epoch": 6226} {"train_loss": -27.21931266784668, "global_step": 516772, "epoch": 6226} {"train_loss": -27.701496124267578, "global_step": 516773, "epoch": 6226} {"train_loss": -27.23921012878418, "global_step": 516774, "epoch": 6226} {"train_loss": -27.600940704345703, "global_step": 516775, "epoch": 6226} {"train_loss": -27.271371841430664, "global_step": 516776, "epoch": 6226} {"train_loss": -27.236997604370117, "global_step": 516777, "epoch": 6226} {"train_loss": -27.368896484375, "global_step": 516778, "epoch": 6226} {"train_loss": -27.647130966186523, "global_step": 516779, "epoch": 6226} {"train_loss": -27.670175552368164, "global_step": 516780, "epoch": 6226} {"train_loss": -27.475494384765625, "global_step": 516781, "epoch": 6226} {"train_loss": -27.381744384765625, "global_step": 516782, "epoch": 6226} {"train_loss": -27.41205406188965, "global_step": 516783, "epoch": 6226} {"train_loss": -27.54668617248535, "global_step": 516784, "epoch": 6226} {"train_loss": -27.7081241607666, "global_step": 516785, "epoch": 6226} {"train_loss": -27.406448364257812, "global_step": 516786, "epoch": 6226} {"train_loss": -27.507970809936523, "global_step": 516787, "epoch": 6226} {"train_loss": -27.592727661132812, "global_step": 516788, "epoch": 6226} {"train_loss": -27.517541885375977, "global_step": 516789, "epoch": 6226} {"train_loss": -27.554824829101562, "global_step": 516790, "epoch": 6226} {"train_loss": -27.588088989257812, "global_step": 516791, "epoch": 6226} {"train_loss": -27.654468536376953, "global_step": 516792, "epoch": 6226} {"train_loss": -27.92693519592285, "global_step": 516793, "epoch": 6226} {"train_loss": -27.8743839263916, "global_step": 516794, "epoch": 6226} {"train_loss": -27.5477352142334, "global_step": 516795, "epoch": 6226} {"train_loss": -27.618497848510742, "global_step": 516796, "epoch": 6226} {"train_loss": -27.67109489440918, "global_step": 516797, "epoch": 6226} {"train_loss": -27.4726619720459, "global_step": 516798, "epoch": 6226} {"train_loss": -27.506580352783203, "global_step": 516799, "epoch": 6226} {"train_loss": -27.64558219909668, "global_step": 516800, "epoch": 6226} {"train_loss": -27.8726806640625, "global_step": 516801, "epoch": 6226} {"train_loss": -27.07053565979004, "global_step": 516802, "epoch": 6226} {"train_loss": -26.82610511779785, "global_step": 516803, "epoch": 6226} {"train_loss": -27.532995223999023, "global_step": 516804, "epoch": 6226} {"train_loss": -27.365081787109375, "global_step": 516805, "epoch": 6226} {"train_loss": -26.968549728393555, "global_step": 516806, "epoch": 6226} {"train_loss": -27.10602378845215, "global_step": 516807, "epoch": 6226} {"train_loss": -27.141443252563477, "global_step": 516808, "epoch": 6226} {"train_loss": -27.049884796142578, "global_step": 516809, "epoch": 6226} {"train_loss": -26.930866241455078, "global_step": 516810, "epoch": 6226} {"train_loss": -27.226947784423828, "global_step": 516811, "epoch": 6226} {"train_loss": -27.718652725219727, "global_step": 516812, "epoch": 6226} {"train_loss": -27.33444595336914, "global_step": 516813, "epoch": 6226} {"train_loss": -27.368947982788086, "global_step": 516814, "epoch": 6226} {"train_loss": -26.81304359436035, "global_step": 516815, "epoch": 6226} {"train_loss": -26.95718765258789, "global_step": 516816, "epoch": 6226} {"train_loss": -27.273303985595703, "global_step": 516817, "epoch": 6226} {"train_loss": -27.287433624267578, "global_step": 516818, "epoch": 6226} {"train_loss": -27.335895538330078, "global_step": 516819, "epoch": 6226} {"train_loss": -27.377960205078125, "global_step": 516820, "epoch": 6226} {"train_loss": -26.466339111328125, "global_step": 516821, "epoch": 6226} {"train_loss": -26.819433212280273, "global_step": 516822, "epoch": 6226} {"train_loss": -27.111072540283203, "global_step": 516823, "epoch": 6226} {"train_loss": -27.088659286499023, "global_step": 516824, "epoch": 6226} {"train_loss": -27.127857208251953, "global_step": 516825, "epoch": 6226} {"train_loss": -27.232105255126953, "global_step": 516826, "epoch": 6226} {"train_loss": -27.178436279296875, "global_step": 516827, "epoch": 6226} {"train_loss": -27.422576904296875, "global_step": 516828, "epoch": 6226} {"train_loss": -27.353382110595703, "global_step": 516829, "epoch": 6226} {"train_loss": -27.2075252532959, "global_step": 516830, "epoch": 6226} {"train_loss": -27.591089248657227, "global_step": 516831, "epoch": 6226} {"train_loss": -27.413787841796875, "global_step": 516832, "epoch": 6226} {"train_loss": -27.24717140197754, "global_step": 516833, "epoch": 6226} {"train_loss": -27.862598419189453, "global_step": 516834, "epoch": 6226} {"train_loss": -27.703516006469727, "global_step": 516835, "epoch": 6226} {"train_loss": -27.82305335998535, "global_step": 516836, "epoch": 6226} {"train_loss": -27.661142349243164, "global_step": 516837, "epoch": 6226} {"train_loss": -28.127111434936523, "global_step": 516838, "epoch": 6226} {"train_loss": -27.625213623046875, "global_step": 516839, "epoch": 6226} {"train_loss": -27.35310979636319, "global_step": 516840, "epoch": 6226, "val_loss": 6562362.5} {"train_loss": -27.41180419921875, "global_step": 516841, "epoch": 6227} {"train_loss": -27.5776309967041, "global_step": 516842, "epoch": 6227} {"train_loss": -27.1593074798584, "global_step": 516843, "epoch": 6227} {"train_loss": -27.41680908203125, "global_step": 516844, "epoch": 6227} {"train_loss": -27.276874542236328, "global_step": 516845, "epoch": 6227} {"train_loss": -27.270984649658203, "global_step": 516846, "epoch": 6227} {"train_loss": -27.26372718811035, "global_step": 516847, "epoch": 6227} {"train_loss": -27.2030029296875, "global_step": 516848, "epoch": 6227} {"train_loss": -27.594934463500977, "global_step": 516849, "epoch": 6227} {"train_loss": -27.2154483795166, "global_step": 516850, "epoch": 6227} {"train_loss": -27.242284774780273, "global_step": 516851, "epoch": 6227} {"train_loss": -27.940637588500977, "global_step": 516852, "epoch": 6227} {"train_loss": -27.484670639038086, "global_step": 516853, "epoch": 6227} {"train_loss": -27.281147003173828, "global_step": 516854, "epoch": 6227} {"train_loss": -27.388797760009766, "global_step": 516855, "epoch": 6227} {"train_loss": -27.42713737487793, "global_step": 516856, "epoch": 6227} {"train_loss": -28.020084381103516, "global_step": 516857, "epoch": 6227} {"train_loss": -27.374343872070312, "global_step": 516858, "epoch": 6227} {"train_loss": -27.446365356445312, "global_step": 516859, "epoch": 6227} {"train_loss": -27.627302169799805, "global_step": 516860, "epoch": 6227} {"train_loss": -27.344785690307617, "global_step": 516861, "epoch": 6227} {"train_loss": -27.473163604736328, "global_step": 516862, "epoch": 6227} {"train_loss": -27.495330810546875, "global_step": 516863, "epoch": 6227} {"train_loss": -27.722822189331055, "global_step": 516864, "epoch": 6227} {"train_loss": -27.655492782592773, "global_step": 516865, "epoch": 6227} {"train_loss": -27.59699058532715, "global_step": 516866, "epoch": 6227} {"train_loss": -27.311704635620117, "global_step": 516867, "epoch": 6227} {"train_loss": -27.243576049804688, "global_step": 516868, "epoch": 6227} {"train_loss": -27.575286865234375, "global_step": 516869, "epoch": 6227} {"train_loss": -27.521778106689453, "global_step": 516870, "epoch": 6227} {"train_loss": -27.19069480895996, "global_step": 516871, "epoch": 6227} {"train_loss": -27.475751876831055, "global_step": 516872, "epoch": 6227} {"train_loss": -27.727609634399414, "global_step": 516873, "epoch": 6227} {"train_loss": -27.558185577392578, "global_step": 516874, "epoch": 6227} {"train_loss": -27.764795303344727, "global_step": 516875, "epoch": 6227} {"train_loss": -27.63465690612793, "global_step": 516876, "epoch": 6227} {"train_loss": -27.303869247436523, "global_step": 516877, "epoch": 6227} {"train_loss": -27.804676055908203, "global_step": 516878, "epoch": 6227} {"train_loss": -27.393362045288086, "global_step": 516879, "epoch": 6227} {"train_loss": -27.322336196899414, "global_step": 516880, "epoch": 6227} {"train_loss": -27.713714599609375, "global_step": 516881, "epoch": 6227} {"train_loss": -27.75160026550293, "global_step": 516882, "epoch": 6227} {"train_loss": -27.286914825439453, "global_step": 516883, "epoch": 6227} {"train_loss": -27.3859806060791, "global_step": 516884, "epoch": 6227} {"train_loss": -27.448261260986328, "global_step": 516885, "epoch": 6227} {"train_loss": -28.218671798706055, "global_step": 516886, "epoch": 6227} {"train_loss": -27.645612716674805, "global_step": 516887, "epoch": 6227} {"train_loss": -27.28663444519043, "global_step": 516888, "epoch": 6227} {"train_loss": -27.62599754333496, "global_step": 516889, "epoch": 6227} {"train_loss": -27.603931427001953, "global_step": 516890, "epoch": 6227} {"train_loss": -27.369342803955078, "global_step": 516891, "epoch": 6227} {"train_loss": -27.5520076751709, "global_step": 516892, "epoch": 6227} {"train_loss": -27.44475746154785, "global_step": 516893, "epoch": 6227} {"train_loss": -27.777578353881836, "global_step": 516894, "epoch": 6227} {"train_loss": -27.1492919921875, "global_step": 516895, "epoch": 6227} {"train_loss": -27.27435302734375, "global_step": 516896, "epoch": 6227} {"train_loss": -27.71872901916504, "global_step": 516897, "epoch": 6227} {"train_loss": -28.060346603393555, "global_step": 516898, "epoch": 6227} {"train_loss": -27.539648056030273, "global_step": 516899, "epoch": 6227} {"train_loss": -27.57720375061035, "global_step": 516900, "epoch": 6227} {"train_loss": -27.92072105407715, "global_step": 516901, "epoch": 6227} {"train_loss": -26.989953994750977, "global_step": 516902, "epoch": 6227} {"train_loss": -27.554075241088867, "global_step": 516903, "epoch": 6227} {"train_loss": -27.367761611938477, "global_step": 516904, "epoch": 6227} {"train_loss": -27.402490615844727, "global_step": 516905, "epoch": 6227} {"train_loss": -27.41990089416504, "global_step": 516906, "epoch": 6227} {"train_loss": -27.57000160217285, "global_step": 516907, "epoch": 6227} {"train_loss": -27.64348793029785, "global_step": 516908, "epoch": 6227} {"train_loss": -27.682706832885742, "global_step": 516909, "epoch": 6227} {"train_loss": -27.68353271484375, "global_step": 516910, "epoch": 6227} {"train_loss": -27.832386016845703, "global_step": 516911, "epoch": 6227} {"train_loss": -27.782703399658203, "global_step": 516912, "epoch": 6227} {"train_loss": -27.686084747314453, "global_step": 516913, "epoch": 6227} {"train_loss": -28.250335693359375, "global_step": 516914, "epoch": 6227} {"train_loss": -27.714643478393555, "global_step": 516915, "epoch": 6227} {"train_loss": -27.371124267578125, "global_step": 516916, "epoch": 6227} {"train_loss": -27.386011123657227, "global_step": 516917, "epoch": 6227} {"train_loss": -27.420225143432617, "global_step": 516918, "epoch": 6227} {"train_loss": -27.372589111328125, "global_step": 516919, "epoch": 6227} {"train_loss": -27.16956901550293, "global_step": 516920, "epoch": 6227} {"train_loss": -27.032678604125977, "global_step": 516921, "epoch": 6227} {"train_loss": -27.119781494140625, "global_step": 516922, "epoch": 6227} {"train_loss": -27.49129008097821, "global_step": 516923, "epoch": 6227, "val_loss": 6573864.0} {"train_loss": -26.14027214050293, "global_step": 516924, "epoch": 6228} {"train_loss": -25.677127838134766, "global_step": 516925, "epoch": 6228} {"train_loss": -26.41998863220215, "global_step": 516926, "epoch": 6228} {"train_loss": -26.711856842041016, "global_step": 516927, "epoch": 6228} {"train_loss": -26.80164909362793, "global_step": 516928, "epoch": 6228} {"train_loss": -26.942523956298828, "global_step": 516929, "epoch": 6228} {"train_loss": -26.88623046875, "global_step": 516930, "epoch": 6228} {"train_loss": -26.430723190307617, "global_step": 516931, "epoch": 6228} {"train_loss": -26.7922420501709, "global_step": 516932, "epoch": 6228} {"train_loss": -26.7877254486084, "global_step": 516933, "epoch": 6228} {"train_loss": -27.047895431518555, "global_step": 516934, "epoch": 6228} {"train_loss": -26.706647872924805, "global_step": 516935, "epoch": 6228} {"train_loss": -26.74566650390625, "global_step": 516936, "epoch": 6228} {"train_loss": -27.326887130737305, "global_step": 516937, "epoch": 6228} {"train_loss": -27.227161407470703, "global_step": 516938, "epoch": 6228} {"train_loss": -27.240243911743164, "global_step": 516939, "epoch": 6228} {"train_loss": -27.243896484375, "global_step": 516940, "epoch": 6228} {"train_loss": -27.196767807006836, "global_step": 516941, "epoch": 6228} {"train_loss": -26.878149032592773, "global_step": 516942, "epoch": 6228} {"train_loss": -27.174245834350586, "global_step": 516943, "epoch": 6228} {"train_loss": -27.33683204650879, "global_step": 516944, "epoch": 6228} {"train_loss": -27.3697452545166, "global_step": 516945, "epoch": 6228} {"train_loss": -27.57598304748535, "global_step": 516946, "epoch": 6228} {"train_loss": -27.169458389282227, "global_step": 516947, "epoch": 6228} {"train_loss": -27.243576049804688, "global_step": 516948, "epoch": 6228} {"train_loss": -27.150955200195312, "global_step": 516949, "epoch": 6228} {"train_loss": -27.44891357421875, "global_step": 516950, "epoch": 6228} {"train_loss": -27.225210189819336, "global_step": 516951, "epoch": 6228} {"train_loss": -27.645288467407227, "global_step": 516952, "epoch": 6228} {"train_loss": -27.729711532592773, "global_step": 516953, "epoch": 6228} {"train_loss": -27.35679054260254, "global_step": 516954, "epoch": 6228} {"train_loss": -27.220794677734375, "global_step": 516955, "epoch": 6228} {"train_loss": -27.465198516845703, "global_step": 516956, "epoch": 6228} {"train_loss": -27.40812110900879, "global_step": 516957, "epoch": 6228} {"train_loss": -27.476831436157227, "global_step": 516958, "epoch": 6228} {"train_loss": -27.538101196289062, "global_step": 516959, "epoch": 6228} {"train_loss": -27.365915298461914, "global_step": 516960, "epoch": 6228} {"train_loss": -27.602338790893555, "global_step": 516961, "epoch": 6228} {"train_loss": -27.454633712768555, "global_step": 516962, "epoch": 6228} {"train_loss": -27.403411865234375, "global_step": 516963, "epoch": 6228} {"train_loss": -27.4625186920166, "global_step": 516964, "epoch": 6228} {"train_loss": -27.97913932800293, "global_step": 516965, "epoch": 6228} {"train_loss": -27.390661239624023, "global_step": 516966, "epoch": 6228} {"train_loss": -27.77720069885254, "global_step": 516967, "epoch": 6228} {"train_loss": -27.766515731811523, "global_step": 516968, "epoch": 6228} {"train_loss": -27.765546798706055, "global_step": 516969, "epoch": 6228} {"train_loss": -27.701385498046875, "global_step": 516970, "epoch": 6228} {"train_loss": -27.814863204956055, "global_step": 516971, "epoch": 6228} {"train_loss": -27.386484146118164, "global_step": 516972, "epoch": 6228} {"train_loss": -27.570087432861328, "global_step": 516973, "epoch": 6228} {"train_loss": -27.587621688842773, "global_step": 516974, "epoch": 6228} {"train_loss": -27.824066162109375, "global_step": 516975, "epoch": 6228} {"train_loss": -27.780521392822266, "global_step": 516976, "epoch": 6228} {"train_loss": -27.463333129882812, "global_step": 516977, "epoch": 6228} {"train_loss": -27.594091415405273, "global_step": 516978, "epoch": 6228} {"train_loss": -27.767438888549805, "global_step": 516979, "epoch": 6228} {"train_loss": -27.594396591186523, "global_step": 516980, "epoch": 6228} {"train_loss": -27.90851402282715, "global_step": 516981, "epoch": 6228} {"train_loss": -27.903676986694336, "global_step": 516982, "epoch": 6228} {"train_loss": -27.677200317382812, "global_step": 516983, "epoch": 6228} {"train_loss": -27.135162353515625, "global_step": 516984, "epoch": 6228} {"train_loss": -27.4228572845459, "global_step": 516985, "epoch": 6228} {"train_loss": -27.051624298095703, "global_step": 516986, "epoch": 6228} {"train_loss": -26.650678634643555, "global_step": 516987, "epoch": 6228} {"train_loss": -26.511215209960938, "global_step": 516988, "epoch": 6228} {"train_loss": -26.78497314453125, "global_step": 516989, "epoch": 6228} {"train_loss": -27.57184410095215, "global_step": 516990, "epoch": 6228} {"train_loss": -27.0831298828125, "global_step": 516991, "epoch": 6228} {"train_loss": -27.426498413085938, "global_step": 516992, "epoch": 6228} {"train_loss": -27.419477462768555, "global_step": 516993, "epoch": 6228} {"train_loss": -27.328418731689453, "global_step": 516994, "epoch": 6228} {"train_loss": -27.326807022094727, "global_step": 516995, "epoch": 6228} {"train_loss": -27.32401466369629, "global_step": 516996, "epoch": 6228} {"train_loss": -27.343351364135742, "global_step": 516997, "epoch": 6228} {"train_loss": -27.3738956451416, "global_step": 516998, "epoch": 6228} {"train_loss": -26.83465003967285, "global_step": 516999, "epoch": 6228} {"train_loss": -27.580102920532227, "global_step": 517000, "epoch": 6228} {"train_loss": -27.457616806030273, "global_step": 517001, "epoch": 6228} {"train_loss": -27.439512252807617, "global_step": 517002, "epoch": 6228} {"train_loss": -27.6749267578125, "global_step": 517003, "epoch": 6228} {"train_loss": -27.09974479675293, "global_step": 517004, "epoch": 6228} {"train_loss": -27.239898681640625, "global_step": 517005, "epoch": 6228} {"train_loss": -27.285225695874317, "global_step": 517006, "epoch": 6228, "val_loss": 6605663.0} {"train_loss": -26.203977584838867, "global_step": 517007, "epoch": 6229} {"train_loss": -25.917016983032227, "global_step": 517008, "epoch": 6229} {"train_loss": -26.349817276000977, "global_step": 517009, "epoch": 6229} {"train_loss": -26.2998104095459, "global_step": 517010, "epoch": 6229} {"train_loss": -26.3529052734375, "global_step": 517011, "epoch": 6229} {"train_loss": -26.46811866760254, "global_step": 517012, "epoch": 6229} {"train_loss": -26.88715171813965, "global_step": 517013, "epoch": 6229} {"train_loss": -26.42994499206543, "global_step": 517014, "epoch": 6229} {"train_loss": -26.429990768432617, "global_step": 517015, "epoch": 6229} {"train_loss": -26.86420249938965, "global_step": 517016, "epoch": 6229} {"train_loss": -27.270370483398438, "global_step": 517017, "epoch": 6229} {"train_loss": -26.604022979736328, "global_step": 517018, "epoch": 6229} {"train_loss": -26.803552627563477, "global_step": 517019, "epoch": 6229} {"train_loss": -27.1523380279541, "global_step": 517020, "epoch": 6229} {"train_loss": -26.886642456054688, "global_step": 517021, "epoch": 6229} {"train_loss": -27.005146026611328, "global_step": 517022, "epoch": 6229} {"train_loss": -27.076446533203125, "global_step": 517023, "epoch": 6229} {"train_loss": -27.174245834350586, "global_step": 517024, "epoch": 6229} {"train_loss": -27.144800186157227, "global_step": 517025, "epoch": 6229} {"train_loss": -27.071393966674805, "global_step": 517026, "epoch": 6229} {"train_loss": -26.908971786499023, "global_step": 517027, "epoch": 6229} {"train_loss": -27.013635635375977, "global_step": 517028, "epoch": 6229} {"train_loss": -27.4152889251709, "global_step": 517029, "epoch": 6229} {"train_loss": -26.80023765563965, "global_step": 517030, "epoch": 6229} {"train_loss": -27.059783935546875, "global_step": 517031, "epoch": 6229} {"train_loss": -27.181201934814453, "global_step": 517032, "epoch": 6229} {"train_loss": -27.292905807495117, "global_step": 517033, "epoch": 6229} {"train_loss": -27.13626480102539, "global_step": 517034, "epoch": 6229} {"train_loss": -27.731496810913086, "global_step": 517035, "epoch": 6229} {"train_loss": -27.107263565063477, "global_step": 517036, "epoch": 6229} {"train_loss": -27.454370498657227, "global_step": 517037, "epoch": 6229} {"train_loss": -27.695837020874023, "global_step": 517038, "epoch": 6229} {"train_loss": -27.5411319732666, "global_step": 517039, "epoch": 6229} {"train_loss": -27.787647247314453, "global_step": 517040, "epoch": 6229} {"train_loss": -27.55950355529785, "global_step": 517041, "epoch": 6229} {"train_loss": -27.422794342041016, "global_step": 517042, "epoch": 6229} {"train_loss": -27.5738582611084, "global_step": 517043, "epoch": 6229} {"train_loss": -27.354022979736328, "global_step": 517044, "epoch": 6229} {"train_loss": -27.556385040283203, "global_step": 517045, "epoch": 6229} {"train_loss": -27.580671310424805, "global_step": 517046, "epoch": 6229} {"train_loss": -27.828886032104492, "global_step": 517047, "epoch": 6229} {"train_loss": -27.578617095947266, "global_step": 517048, "epoch": 6229} {"train_loss": -27.7232666015625, "global_step": 517049, "epoch": 6229} {"train_loss": -27.32699966430664, "global_step": 517050, "epoch": 6229} {"train_loss": -27.55306053161621, "global_step": 517051, "epoch": 6229} {"train_loss": -27.833316802978516, "global_step": 517052, "epoch": 6229} {"train_loss": -27.537891387939453, "global_step": 517053, "epoch": 6229} {"train_loss": -27.524749755859375, "global_step": 517054, "epoch": 6229} {"train_loss": -27.34699821472168, "global_step": 517055, "epoch": 6229} {"train_loss": -27.40033531188965, "global_step": 517056, "epoch": 6229} {"train_loss": -27.680448532104492, "global_step": 517057, "epoch": 6229} {"train_loss": -27.349889755249023, "global_step": 517058, "epoch": 6229} {"train_loss": -27.392377853393555, "global_step": 517059, "epoch": 6229} {"train_loss": -27.269079208374023, "global_step": 517060, "epoch": 6229} {"train_loss": -27.65471839904785, "global_step": 517061, "epoch": 6229} {"train_loss": -27.702177047729492, "global_step": 517062, "epoch": 6229} {"train_loss": -27.67506217956543, "global_step": 517063, "epoch": 6229} {"train_loss": -27.48573112487793, "global_step": 517064, "epoch": 6229} {"train_loss": -27.75995445251465, "global_step": 517065, "epoch": 6229} {"train_loss": -27.404438018798828, "global_step": 517066, "epoch": 6229} {"train_loss": -27.524215698242188, "global_step": 517067, "epoch": 6229} {"train_loss": -27.757827758789062, "global_step": 517068, "epoch": 6229} {"train_loss": -27.282758712768555, "global_step": 517069, "epoch": 6229} {"train_loss": -27.444705963134766, "global_step": 517070, "epoch": 6229} {"train_loss": -27.2106876373291, "global_step": 517071, "epoch": 6229} {"train_loss": -27.627639770507812, "global_step": 517072, "epoch": 6229} {"train_loss": -27.34366226196289, "global_step": 517073, "epoch": 6229} {"train_loss": -27.659595489501953, "global_step": 517074, "epoch": 6229} {"train_loss": -27.45440101623535, "global_step": 517075, "epoch": 6229} {"train_loss": -27.384130477905273, "global_step": 517076, "epoch": 6229} {"train_loss": -27.319555282592773, "global_step": 517077, "epoch": 6229} {"train_loss": -27.693296432495117, "global_step": 517078, "epoch": 6229} {"train_loss": -27.13994789123535, "global_step": 517079, "epoch": 6229} {"train_loss": -27.545881271362305, "global_step": 517080, "epoch": 6229} {"train_loss": -27.308862686157227, "global_step": 517081, "epoch": 6229} {"train_loss": -27.36798095703125, "global_step": 517082, "epoch": 6229} {"train_loss": -27.838510513305664, "global_step": 517083, "epoch": 6229} {"train_loss": -27.789031982421875, "global_step": 517084, "epoch": 6229} {"train_loss": -27.678287506103516, "global_step": 517085, "epoch": 6229} {"train_loss": -27.48654556274414, "global_step": 517086, "epoch": 6229} {"train_loss": -27.457321166992188, "global_step": 517087, "epoch": 6229} {"train_loss": -27.752286911010742, "global_step": 517088, "epoch": 6229} {"train_loss": -27.28209270339414, "global_step": 517089, "epoch": 6229, "val_loss": 6553836.0} {"train_loss": -27.154142379760742, "global_step": 517090, "epoch": 6230} {"train_loss": -27.35561180114746, "global_step": 517091, "epoch": 6230} {"train_loss": -27.0376033782959, "global_step": 517092, "epoch": 6230} {"train_loss": -27.316802978515625, "global_step": 517093, "epoch": 6230} {"train_loss": -27.223997116088867, "global_step": 517094, "epoch": 6230} {"train_loss": -27.01389503479004, "global_step": 517095, "epoch": 6230} {"train_loss": -26.977502822875977, "global_step": 517096, "epoch": 6230} {"train_loss": -27.803943634033203, "global_step": 517097, "epoch": 6230} {"train_loss": -27.479467391967773, "global_step": 517098, "epoch": 6230} {"train_loss": -27.05987548828125, "global_step": 517099, "epoch": 6230} {"train_loss": -27.318042755126953, "global_step": 517100, "epoch": 6230} {"train_loss": -27.43820571899414, "global_step": 517101, "epoch": 6230} {"train_loss": -27.65218162536621, "global_step": 517102, "epoch": 6230} {"train_loss": -27.275455474853516, "global_step": 517103, "epoch": 6230} {"train_loss": -27.349319458007812, "global_step": 517104, "epoch": 6230} {"train_loss": -27.58501625061035, "global_step": 517105, "epoch": 6230} {"train_loss": -27.7088623046875, "global_step": 517106, "epoch": 6230} {"train_loss": -27.502817153930664, "global_step": 517107, "epoch": 6230} {"train_loss": -27.339208602905273, "global_step": 517108, "epoch": 6230} {"train_loss": -27.91900634765625, "global_step": 517109, "epoch": 6230} {"train_loss": -27.408679962158203, "global_step": 517110, "epoch": 6230} {"train_loss": -27.396121978759766, "global_step": 517111, "epoch": 6230} {"train_loss": -27.35007667541504, "global_step": 517112, "epoch": 6230} {"train_loss": -27.53303337097168, "global_step": 517113, "epoch": 6230} {"train_loss": -27.54103660583496, "global_step": 517114, "epoch": 6230} {"train_loss": -27.519189834594727, "global_step": 517115, "epoch": 6230} {"train_loss": -27.693750381469727, "global_step": 517116, "epoch": 6230} {"train_loss": -27.6721134185791, "global_step": 517117, "epoch": 6230} {"train_loss": -27.76666259765625, "global_step": 517118, "epoch": 6230} {"train_loss": -27.20814323425293, "global_step": 517119, "epoch": 6230} {"train_loss": -27.387805938720703, "global_step": 517120, "epoch": 6230} {"train_loss": -27.17946434020996, "global_step": 517121, "epoch": 6230} {"train_loss": -27.805150985717773, "global_step": 517122, "epoch": 6230} {"train_loss": -27.523603439331055, "global_step": 517123, "epoch": 6230} {"train_loss": -27.185693740844727, "global_step": 517124, "epoch": 6230} {"train_loss": -27.66700553894043, "global_step": 517125, "epoch": 6230} {"train_loss": -27.757497787475586, "global_step": 517126, "epoch": 6230} {"train_loss": -27.548276901245117, "global_step": 517127, "epoch": 6230} {"train_loss": -27.88245964050293, "global_step": 517128, "epoch": 6230} {"train_loss": -27.5444393157959, "global_step": 517129, "epoch": 6230} {"train_loss": -27.515119552612305, "global_step": 517130, "epoch": 6230} {"train_loss": -27.886920928955078, "global_step": 517131, "epoch": 6230} {"train_loss": -27.558507919311523, "global_step": 517132, "epoch": 6230} {"train_loss": -27.154590606689453, "global_step": 517133, "epoch": 6230} {"train_loss": -27.4656925201416, "global_step": 517134, "epoch": 6230} {"train_loss": -27.7777099609375, "global_step": 517135, "epoch": 6230} {"train_loss": -27.1522274017334, "global_step": 517136, "epoch": 6230} {"train_loss": -27.554372787475586, "global_step": 517137, "epoch": 6230} {"train_loss": -27.54204750061035, "global_step": 517138, "epoch": 6230} {"train_loss": -27.492765426635742, "global_step": 517139, "epoch": 6230} {"train_loss": -27.1809024810791, "global_step": 517140, "epoch": 6230} {"train_loss": -27.452768325805664, "global_step": 517141, "epoch": 6230} {"train_loss": -27.247406005859375, "global_step": 517142, "epoch": 6230} {"train_loss": -27.574975967407227, "global_step": 517143, "epoch": 6230} {"train_loss": -27.64470863342285, "global_step": 517144, "epoch": 6230} {"train_loss": -27.16570472717285, "global_step": 517145, "epoch": 6230} {"train_loss": -27.786060333251953, "global_step": 517146, "epoch": 6230} {"train_loss": -27.419891357421875, "global_step": 517147, "epoch": 6230} {"train_loss": -27.715778350830078, "global_step": 517148, "epoch": 6230} {"train_loss": -27.68662452697754, "global_step": 517149, "epoch": 6230} {"train_loss": -27.759002685546875, "global_step": 517150, "epoch": 6230} {"train_loss": -27.626358032226562, "global_step": 517151, "epoch": 6230} {"train_loss": -27.39936637878418, "global_step": 517152, "epoch": 6230} {"train_loss": -27.225610733032227, "global_step": 517153, "epoch": 6230} {"train_loss": -26.87156105041504, "global_step": 517154, "epoch": 6230} {"train_loss": -26.884946823120117, "global_step": 517155, "epoch": 6230} {"train_loss": -27.415937423706055, "global_step": 517156, "epoch": 6230} {"train_loss": -27.353515625, "global_step": 517157, "epoch": 6230} {"train_loss": -26.906452178955078, "global_step": 517158, "epoch": 6230} {"train_loss": -27.627796173095703, "global_step": 517159, "epoch": 6230} {"train_loss": -27.784101486206055, "global_step": 517160, "epoch": 6230} {"train_loss": -27.14703369140625, "global_step": 517161, "epoch": 6230} {"train_loss": -27.72507095336914, "global_step": 517162, "epoch": 6230} {"train_loss": -27.302032470703125, "global_step": 517163, "epoch": 6230} {"train_loss": -27.815359115600586, "global_step": 517164, "epoch": 6230} {"train_loss": -27.18793296813965, "global_step": 517165, "epoch": 6230} {"train_loss": -27.337011337280273, "global_step": 517166, "epoch": 6230} {"train_loss": -27.357969284057617, "global_step": 517167, "epoch": 6230} {"train_loss": -27.58782386779785, "global_step": 517168, "epoch": 6230} {"train_loss": -27.6400203704834, "global_step": 517169, "epoch": 6230} {"train_loss": -27.532201766967773, "global_step": 517170, "epoch": 6230} {"train_loss": -27.49762535095215, "global_step": 517171, "epoch": 6230} {"train_loss": -27.46601948106145, "global_step": 517172, "epoch": 6230, "val_loss": 6542552.0} {"train_loss": -26.74439811706543, "global_step": 517173, "epoch": 6231} {"train_loss": -26.977619171142578, "global_step": 517174, "epoch": 6231} {"train_loss": -27.3384952545166, "global_step": 517175, "epoch": 6231} {"train_loss": -26.924406051635742, "global_step": 517176, "epoch": 6231} {"train_loss": -26.878986358642578, "global_step": 517177, "epoch": 6231} {"train_loss": -27.103748321533203, "global_step": 517178, "epoch": 6231} {"train_loss": -27.412378311157227, "global_step": 517179, "epoch": 6231} {"train_loss": -27.368061065673828, "global_step": 517180, "epoch": 6231} {"train_loss": -27.244958877563477, "global_step": 517181, "epoch": 6231} {"train_loss": -27.3076171875, "global_step": 517182, "epoch": 6231} {"train_loss": -26.976964950561523, "global_step": 517183, "epoch": 6231} {"train_loss": -27.354211807250977, "global_step": 517184, "epoch": 6231} {"train_loss": -26.924177169799805, "global_step": 517185, "epoch": 6231} {"train_loss": -27.4641170501709, "global_step": 517186, "epoch": 6231} {"train_loss": -27.324905395507812, "global_step": 517187, "epoch": 6231} {"train_loss": -27.380807876586914, "global_step": 517188, "epoch": 6231} {"train_loss": -27.28900146484375, "global_step": 517189, "epoch": 6231} {"train_loss": -27.261322021484375, "global_step": 517190, "epoch": 6231} {"train_loss": -27.54129981994629, "global_step": 517191, "epoch": 6231} {"train_loss": -27.21967887878418, "global_step": 517192, "epoch": 6231} {"train_loss": -27.457242965698242, "global_step": 517193, "epoch": 6231} {"train_loss": -27.040658950805664, "global_step": 517194, "epoch": 6231} {"train_loss": -27.90900993347168, "global_step": 517195, "epoch": 6231} {"train_loss": -27.491186141967773, "global_step": 517196, "epoch": 6231} {"train_loss": -27.293859481811523, "global_step": 517197, "epoch": 6231} {"train_loss": -27.3765926361084, "global_step": 517198, "epoch": 6231} {"train_loss": -27.567472457885742, "global_step": 517199, "epoch": 6231} {"train_loss": -27.44721031188965, "global_step": 517200, "epoch": 6231} {"train_loss": -27.420515060424805, "global_step": 517201, "epoch": 6231} {"train_loss": -27.401824951171875, "global_step": 517202, "epoch": 6231} {"train_loss": -27.711172103881836, "global_step": 517203, "epoch": 6231} {"train_loss": -27.6796875, "global_step": 517204, "epoch": 6231} {"train_loss": -27.559127807617188, "global_step": 517205, "epoch": 6231} {"train_loss": -27.63446617126465, "global_step": 517206, "epoch": 6231} {"train_loss": -27.960248947143555, "global_step": 517207, "epoch": 6231} {"train_loss": -27.81825065612793, "global_step": 517208, "epoch": 6231} {"train_loss": -27.514881134033203, "global_step": 517209, "epoch": 6231} {"train_loss": -27.631067276000977, "global_step": 517210, "epoch": 6231} {"train_loss": -27.30291175842285, "global_step": 517211, "epoch": 6231} {"train_loss": -27.5186824798584, "global_step": 517212, "epoch": 6231} {"train_loss": -27.6283016204834, "global_step": 517213, "epoch": 6231} {"train_loss": -27.495040893554688, "global_step": 517214, "epoch": 6231} {"train_loss": -27.616785049438477, "global_step": 517215, "epoch": 6231} {"train_loss": -27.833723068237305, "global_step": 517216, "epoch": 6231} {"train_loss": -27.52982521057129, "global_step": 517217, "epoch": 6231} {"train_loss": -27.694080352783203, "global_step": 517218, "epoch": 6231} {"train_loss": -27.751256942749023, "global_step": 517219, "epoch": 6231} {"train_loss": -27.479034423828125, "global_step": 517220, "epoch": 6231} {"train_loss": -27.895898818969727, "global_step": 517221, "epoch": 6231} {"train_loss": -27.60867691040039, "global_step": 517222, "epoch": 6231} {"train_loss": -27.31576919555664, "global_step": 517223, "epoch": 6231} {"train_loss": -27.313690185546875, "global_step": 517224, "epoch": 6231} {"train_loss": -27.280105590820312, "global_step": 517225, "epoch": 6231} {"train_loss": -27.151782989501953, "global_step": 517226, "epoch": 6231} {"train_loss": -27.37298011779785, "global_step": 517227, "epoch": 6231} {"train_loss": -27.79740333557129, "global_step": 517228, "epoch": 6231} {"train_loss": -27.707059860229492, "global_step": 517229, "epoch": 6231} {"train_loss": -27.096227645874023, "global_step": 517230, "epoch": 6231} {"train_loss": -27.563922882080078, "global_step": 517231, "epoch": 6231} {"train_loss": -27.569204330444336, "global_step": 517232, "epoch": 6231} {"train_loss": -27.117603302001953, "global_step": 517233, "epoch": 6231} {"train_loss": -27.268115997314453, "global_step": 517234, "epoch": 6231} {"train_loss": -27.40972328186035, "global_step": 517235, "epoch": 6231} {"train_loss": -27.59187126159668, "global_step": 517236, "epoch": 6231} {"train_loss": -27.48592185974121, "global_step": 517237, "epoch": 6231} {"train_loss": -27.54901123046875, "global_step": 517238, "epoch": 6231} {"train_loss": -27.061288833618164, "global_step": 517239, "epoch": 6231} {"train_loss": -27.04068946838379, "global_step": 517240, "epoch": 6231} {"train_loss": -27.2630558013916, "global_step": 517241, "epoch": 6231} {"train_loss": -27.636417388916016, "global_step": 517242, "epoch": 6231} {"train_loss": -27.486547470092773, "global_step": 517243, "epoch": 6231} {"train_loss": -27.23785972595215, "global_step": 517244, "epoch": 6231} {"train_loss": -27.191213607788086, "global_step": 517245, "epoch": 6231} {"train_loss": -27.68116569519043, "global_step": 517246, "epoch": 6231} {"train_loss": -27.36148452758789, "global_step": 517247, "epoch": 6231} {"train_loss": -27.305795669555664, "global_step": 517248, "epoch": 6231} {"train_loss": -27.33709144592285, "global_step": 517249, "epoch": 6231} {"train_loss": -27.667816162109375, "global_step": 517250, "epoch": 6231} {"train_loss": -27.900806427001953, "global_step": 517251, "epoch": 6231} {"train_loss": -27.041000366210938, "global_step": 517252, "epoch": 6231} {"train_loss": -27.694873809814453, "global_step": 517253, "epoch": 6231} {"train_loss": -27.353225708007812, "global_step": 517254, "epoch": 6231} {"train_loss": -27.416493082621013, "global_step": 517255, "epoch": 6231, "val_loss": 6624013.0} {"train_loss": -26.722991943359375, "global_step": 517256, "epoch": 6232} {"train_loss": -26.21489906311035, "global_step": 517257, "epoch": 6232} {"train_loss": -26.39351463317871, "global_step": 517258, "epoch": 6232} {"train_loss": -25.829853057861328, "global_step": 517259, "epoch": 6232} {"train_loss": -26.78041648864746, "global_step": 517260, "epoch": 6232} {"train_loss": -26.91218376159668, "global_step": 517261, "epoch": 6232} {"train_loss": -26.9362735748291, "global_step": 517262, "epoch": 6232} {"train_loss": -26.82192039489746, "global_step": 517263, "epoch": 6232} {"train_loss": -27.310428619384766, "global_step": 517264, "epoch": 6232} {"train_loss": -26.437253952026367, "global_step": 517265, "epoch": 6232} {"train_loss": -26.603662490844727, "global_step": 517266, "epoch": 6232} {"train_loss": -26.9788875579834, "global_step": 517267, "epoch": 6232} {"train_loss": -26.84297752380371, "global_step": 517268, "epoch": 6232} {"train_loss": -27.457651138305664, "global_step": 517269, "epoch": 6232} {"train_loss": -27.09392738342285, "global_step": 517270, "epoch": 6232} {"train_loss": -27.032901763916016, "global_step": 517271, "epoch": 6232} {"train_loss": -27.45484733581543, "global_step": 517272, "epoch": 6232} {"train_loss": -27.1793270111084, "global_step": 517273, "epoch": 6232} {"train_loss": -27.1517276763916, "global_step": 517274, "epoch": 6232} {"train_loss": -27.274499893188477, "global_step": 517275, "epoch": 6232} {"train_loss": -27.034162521362305, "global_step": 517276, "epoch": 6232} {"train_loss": -27.518512725830078, "global_step": 517277, "epoch": 6232} {"train_loss": -27.3236141204834, "global_step": 517278, "epoch": 6232} {"train_loss": -27.239797592163086, "global_step": 517279, "epoch": 6232} {"train_loss": -27.715362548828125, "global_step": 517280, "epoch": 6232} {"train_loss": -27.315673828125, "global_step": 517281, "epoch": 6232} {"train_loss": -27.314756393432617, "global_step": 517282, "epoch": 6232} {"train_loss": -27.292470932006836, "global_step": 517283, "epoch": 6232} {"train_loss": -27.481409072875977, "global_step": 517284, "epoch": 6232} {"train_loss": -27.42426109313965, "global_step": 517285, "epoch": 6232} {"train_loss": -27.37624168395996, "global_step": 517286, "epoch": 6232} {"train_loss": -27.7095947265625, "global_step": 517287, "epoch": 6232} {"train_loss": -27.58203125, "global_step": 517288, "epoch": 6232} {"train_loss": -27.406726837158203, "global_step": 517289, "epoch": 6232} {"train_loss": -27.26479148864746, "global_step": 517290, "epoch": 6232} {"train_loss": -27.2025203704834, "global_step": 517291, "epoch": 6232} {"train_loss": -27.461042404174805, "global_step": 517292, "epoch": 6232} {"train_loss": -27.725540161132812, "global_step": 517293, "epoch": 6232} {"train_loss": -27.306777954101562, "global_step": 517294, "epoch": 6232} {"train_loss": -27.560728073120117, "global_step": 517295, "epoch": 6232} {"train_loss": -27.640213012695312, "global_step": 517296, "epoch": 6232} {"train_loss": -27.88575553894043, "global_step": 517297, "epoch": 6232} {"train_loss": -27.368732452392578, "global_step": 517298, "epoch": 6232} {"train_loss": -27.556921005249023, "global_step": 517299, "epoch": 6232} {"train_loss": -27.494436264038086, "global_step": 517300, "epoch": 6232} {"train_loss": -27.4212703704834, "global_step": 517301, "epoch": 6232} {"train_loss": -27.6070613861084, "global_step": 517302, "epoch": 6232} {"train_loss": -27.539936065673828, "global_step": 517303, "epoch": 6232} {"train_loss": -27.59454917907715, "global_step": 517304, "epoch": 6232} {"train_loss": -27.55792808532715, "global_step": 517305, "epoch": 6232} {"train_loss": -27.700885772705078, "global_step": 517306, "epoch": 6232} {"train_loss": -27.620267868041992, "global_step": 517307, "epoch": 6232} {"train_loss": -27.494094848632812, "global_step": 517308, "epoch": 6232} {"train_loss": -27.544645309448242, "global_step": 517309, "epoch": 6232} {"train_loss": -27.891992568969727, "global_step": 517310, "epoch": 6232} {"train_loss": -27.622312545776367, "global_step": 517311, "epoch": 6232} {"train_loss": -27.477643966674805, "global_step": 517312, "epoch": 6232} {"train_loss": -27.31621742248535, "global_step": 517313, "epoch": 6232} {"train_loss": -27.15180015563965, "global_step": 517314, "epoch": 6232} {"train_loss": -27.082660675048828, "global_step": 517315, "epoch": 6232} {"train_loss": -27.667633056640625, "global_step": 517316, "epoch": 6232} {"train_loss": -27.744964599609375, "global_step": 517317, "epoch": 6232} {"train_loss": -27.689306259155273, "global_step": 517318, "epoch": 6232} {"train_loss": -27.62912368774414, "global_step": 517319, "epoch": 6232} {"train_loss": -27.43619728088379, "global_step": 517320, "epoch": 6232} {"train_loss": -27.49884033203125, "global_step": 517321, "epoch": 6232} {"train_loss": -27.55514907836914, "global_step": 517322, "epoch": 6232} {"train_loss": -27.90593910217285, "global_step": 517323, "epoch": 6232} {"train_loss": -27.813663482666016, "global_step": 517324, "epoch": 6232} {"train_loss": -27.855688095092773, "global_step": 517325, "epoch": 6232} {"train_loss": -27.513025283813477, "global_step": 517326, "epoch": 6232} {"train_loss": -27.87880516052246, "global_step": 517327, "epoch": 6232} {"train_loss": -27.729833602905273, "global_step": 517328, "epoch": 6232} {"train_loss": -27.555639266967773, "global_step": 517329, "epoch": 6232} {"train_loss": -27.63738441467285, "global_step": 517330, "epoch": 6232} {"train_loss": -27.580707550048828, "global_step": 517331, "epoch": 6232} {"train_loss": -27.540170669555664, "global_step": 517332, "epoch": 6232} {"train_loss": -27.741962432861328, "global_step": 517333, "epoch": 6232} {"train_loss": -27.471759796142578, "global_step": 517334, "epoch": 6232} {"train_loss": -27.296253204345703, "global_step": 517335, "epoch": 6232} {"train_loss": -26.949756622314453, "global_step": 517336, "epoch": 6232} {"train_loss": -27.700788497924805, "global_step": 517337, "epoch": 6232} {"train_loss": -27.362370962119964, "global_step": 517338, "epoch": 6232, "val_loss": 6534848.5} {"train_loss": -25.431884765625, "global_step": 517339, "epoch": 6233} {"train_loss": -24.422101974487305, "global_step": 517340, "epoch": 6233} {"train_loss": -26.49692153930664, "global_step": 517341, "epoch": 6233} {"train_loss": -25.491634368896484, "global_step": 517342, "epoch": 6233} {"train_loss": -26.52666664123535, "global_step": 517343, "epoch": 6233} {"train_loss": -26.246179580688477, "global_step": 517344, "epoch": 6233} {"train_loss": -26.206811904907227, "global_step": 517345, "epoch": 6233} {"train_loss": -26.109619140625, "global_step": 517346, "epoch": 6233} {"train_loss": -26.4925537109375, "global_step": 517347, "epoch": 6233} {"train_loss": -26.438739776611328, "global_step": 517348, "epoch": 6233} {"train_loss": -26.829832077026367, "global_step": 517349, "epoch": 6233} {"train_loss": -26.563695907592773, "global_step": 517350, "epoch": 6233} {"train_loss": -27.16338539123535, "global_step": 517351, "epoch": 6233} {"train_loss": -26.6082763671875, "global_step": 517352, "epoch": 6233} {"train_loss": -26.689258575439453, "global_step": 517353, "epoch": 6233} {"train_loss": -26.8028507232666, "global_step": 517354, "epoch": 6233} {"train_loss": -26.920286178588867, "global_step": 517355, "epoch": 6233} {"train_loss": -26.755300521850586, "global_step": 517356, "epoch": 6233} {"train_loss": -27.35322380065918, "global_step": 517357, "epoch": 6233} {"train_loss": -27.185876846313477, "global_step": 517358, "epoch": 6233} {"train_loss": -26.964147567749023, "global_step": 517359, "epoch": 6233} {"train_loss": -26.913578033447266, "global_step": 517360, "epoch": 6233} {"train_loss": -26.896894454956055, "global_step": 517361, "epoch": 6233} {"train_loss": -26.94550132751465, "global_step": 517362, "epoch": 6233} {"train_loss": -27.239572525024414, "global_step": 517363, "epoch": 6233} {"train_loss": -26.89820671081543, "global_step": 517364, "epoch": 6233} {"train_loss": -27.018829345703125, "global_step": 517365, "epoch": 6233} {"train_loss": -27.0703182220459, "global_step": 517366, "epoch": 6233} {"train_loss": -27.328054428100586, "global_step": 517367, "epoch": 6233} {"train_loss": -27.34442710876465, "global_step": 517368, "epoch": 6233} {"train_loss": -26.9898681640625, "global_step": 517369, "epoch": 6233} {"train_loss": -27.70294189453125, "global_step": 517370, "epoch": 6233} {"train_loss": -27.790990829467773, "global_step": 517371, "epoch": 6233} {"train_loss": -27.486677169799805, "global_step": 517372, "epoch": 6233} {"train_loss": -27.378986358642578, "global_step": 517373, "epoch": 6233} {"train_loss": -27.57352066040039, "global_step": 517374, "epoch": 6233} {"train_loss": -26.981245040893555, "global_step": 517375, "epoch": 6233} {"train_loss": -27.5567684173584, "global_step": 517376, "epoch": 6233} {"train_loss": -27.45904541015625, "global_step": 517377, "epoch": 6233} {"train_loss": -27.542856216430664, "global_step": 517378, "epoch": 6233} {"train_loss": -27.7254695892334, "global_step": 517379, "epoch": 6233} {"train_loss": -27.1176700592041, "global_step": 517380, "epoch": 6233} {"train_loss": -26.962451934814453, "global_step": 517381, "epoch": 6233} {"train_loss": -27.100208282470703, "global_step": 517382, "epoch": 6233} {"train_loss": -27.471542358398438, "global_step": 517383, "epoch": 6233} {"train_loss": -27.896392822265625, "global_step": 517384, "epoch": 6233} {"train_loss": -27.69095802307129, "global_step": 517385, "epoch": 6233} {"train_loss": -27.241235733032227, "global_step": 517386, "epoch": 6233} {"train_loss": -27.370716094970703, "global_step": 517387, "epoch": 6233} {"train_loss": -27.508371353149414, "global_step": 517388, "epoch": 6233} {"train_loss": -27.244821548461914, "global_step": 517389, "epoch": 6233} {"train_loss": -27.681720733642578, "global_step": 517390, "epoch": 6233} {"train_loss": -27.469709396362305, "global_step": 517391, "epoch": 6233} {"train_loss": -27.64808464050293, "global_step": 517392, "epoch": 6233} {"train_loss": -27.711444854736328, "global_step": 517393, "epoch": 6233} {"train_loss": -27.54227066040039, "global_step": 517394, "epoch": 6233} {"train_loss": -27.355972290039062, "global_step": 517395, "epoch": 6233} {"train_loss": -27.7903995513916, "global_step": 517396, "epoch": 6233} {"train_loss": -27.605756759643555, "global_step": 517397, "epoch": 6233} {"train_loss": -27.4903621673584, "global_step": 517398, "epoch": 6233} {"train_loss": -27.348241806030273, "global_step": 517399, "epoch": 6233} {"train_loss": -27.480188369750977, "global_step": 517400, "epoch": 6233} {"train_loss": -27.471349716186523, "global_step": 517401, "epoch": 6233} {"train_loss": -27.616363525390625, "global_step": 517402, "epoch": 6233} {"train_loss": -27.478668212890625, "global_step": 517403, "epoch": 6233} {"train_loss": -27.60796546936035, "global_step": 517404, "epoch": 6233} {"train_loss": -27.831151962280273, "global_step": 517405, "epoch": 6233} {"train_loss": -27.6301212310791, "global_step": 517406, "epoch": 6233} {"train_loss": -27.488935470581055, "global_step": 517407, "epoch": 6233} {"train_loss": -27.397092819213867, "global_step": 517408, "epoch": 6233} {"train_loss": -27.6798095703125, "global_step": 517409, "epoch": 6233} {"train_loss": -27.48589515686035, "global_step": 517410, "epoch": 6233} {"train_loss": -27.41029167175293, "global_step": 517411, "epoch": 6233} {"train_loss": -27.517215728759766, "global_step": 517412, "epoch": 6233} {"train_loss": -27.466833114624023, "global_step": 517413, "epoch": 6233} {"train_loss": -27.584707260131836, "global_step": 517414, "epoch": 6233} {"train_loss": -27.6209774017334, "global_step": 517415, "epoch": 6233} {"train_loss": -27.716632843017578, "global_step": 517416, "epoch": 6233} {"train_loss": -27.4907283782959, "global_step": 517417, "epoch": 6233} {"train_loss": -27.35624122619629, "global_step": 517418, "epoch": 6233} {"train_loss": -27.4700984954834, "global_step": 517419, "epoch": 6233} {"train_loss": -27.63722801208496, "global_step": 517420, "epoch": 6233} {"train_loss": -27.180296679577197, "global_step": 517421, "epoch": 6233, "val_loss": 6583684.0} {"train_loss": -26.728315353393555, "global_step": 517422, "epoch": 6234} {"train_loss": -25.45870018005371, "global_step": 517423, "epoch": 6234} {"train_loss": -25.903234481811523, "global_step": 517424, "epoch": 6234} {"train_loss": -26.637420654296875, "global_step": 517425, "epoch": 6234} {"train_loss": -26.33003044128418, "global_step": 517426, "epoch": 6234} {"train_loss": -26.605863571166992, "global_step": 517427, "epoch": 6234} {"train_loss": -26.301733016967773, "global_step": 517428, "epoch": 6234} {"train_loss": -27.039234161376953, "global_step": 517429, "epoch": 6234} {"train_loss": -26.766254425048828, "global_step": 517430, "epoch": 6234} {"train_loss": -27.014432907104492, "global_step": 517431, "epoch": 6234} {"train_loss": -27.203516006469727, "global_step": 517432, "epoch": 6234} {"train_loss": -27.228296279907227, "global_step": 517433, "epoch": 6234} {"train_loss": -26.706735610961914, "global_step": 517434, "epoch": 6234} {"train_loss": -27.217390060424805, "global_step": 517435, "epoch": 6234} {"train_loss": -27.155561447143555, "global_step": 517436, "epoch": 6234} {"train_loss": -27.371280670166016, "global_step": 517437, "epoch": 6234} {"train_loss": -27.300464630126953, "global_step": 517438, "epoch": 6234} {"train_loss": -27.508472442626953, "global_step": 517439, "epoch": 6234} {"train_loss": -26.6757869720459, "global_step": 517440, "epoch": 6234} {"train_loss": -27.4781551361084, "global_step": 517441, "epoch": 6234} {"train_loss": -27.420255661010742, "global_step": 517442, "epoch": 6234} {"train_loss": -27.103662490844727, "global_step": 517443, "epoch": 6234} {"train_loss": -26.94675064086914, "global_step": 517444, "epoch": 6234} {"train_loss": -27.34625816345215, "global_step": 517445, "epoch": 6234} {"train_loss": -27.155853271484375, "global_step": 517446, "epoch": 6234} {"train_loss": -27.415494918823242, "global_step": 517447, "epoch": 6234} {"train_loss": -27.21588134765625, "global_step": 517448, "epoch": 6234} {"train_loss": -27.245380401611328, "global_step": 517449, "epoch": 6234} {"train_loss": -27.521631240844727, "global_step": 517450, "epoch": 6234} {"train_loss": -27.3494930267334, "global_step": 517451, "epoch": 6234} {"train_loss": -27.661731719970703, "global_step": 517452, "epoch": 6234} {"train_loss": -27.474592208862305, "global_step": 517453, "epoch": 6234} {"train_loss": -27.55074119567871, "global_step": 517454, "epoch": 6234} {"train_loss": -27.42130470275879, "global_step": 517455, "epoch": 6234} {"train_loss": -27.414291381835938, "global_step": 517456, "epoch": 6234} {"train_loss": -27.221216201782227, "global_step": 517457, "epoch": 6234} {"train_loss": -27.674299240112305, "global_step": 517458, "epoch": 6234} {"train_loss": -27.747800827026367, "global_step": 517459, "epoch": 6234} {"train_loss": -27.996427536010742, "global_step": 517460, "epoch": 6234} {"train_loss": -27.4382381439209, "global_step": 517461, "epoch": 6234} {"train_loss": -27.405881881713867, "global_step": 517462, "epoch": 6234} {"train_loss": -27.343231201171875, "global_step": 517463, "epoch": 6234} {"train_loss": -27.4097957611084, "global_step": 517464, "epoch": 6234} {"train_loss": -27.413923263549805, "global_step": 517465, "epoch": 6234} {"train_loss": -27.146442413330078, "global_step": 517466, "epoch": 6234} {"train_loss": -27.440343856811523, "global_step": 517467, "epoch": 6234} {"train_loss": -27.92572593688965, "global_step": 517468, "epoch": 6234} {"train_loss": -27.403430938720703, "global_step": 517469, "epoch": 6234} {"train_loss": -28.125720977783203, "global_step": 517470, "epoch": 6234} {"train_loss": -27.443143844604492, "global_step": 517471, "epoch": 6234} {"train_loss": -27.6484432220459, "global_step": 517472, "epoch": 6234} {"train_loss": -27.773115158081055, "global_step": 517473, "epoch": 6234} {"train_loss": -27.769987106323242, "global_step": 517474, "epoch": 6234} {"train_loss": -27.189319610595703, "global_step": 517475, "epoch": 6234} {"train_loss": -27.746551513671875, "global_step": 517476, "epoch": 6234} {"train_loss": -27.863391876220703, "global_step": 517477, "epoch": 6234} {"train_loss": -27.345197677612305, "global_step": 517478, "epoch": 6234} {"train_loss": -27.64676284790039, "global_step": 517479, "epoch": 6234} {"train_loss": -27.52707862854004, "global_step": 517480, "epoch": 6234} {"train_loss": -27.198801040649414, "global_step": 517481, "epoch": 6234} {"train_loss": -27.33066749572754, "global_step": 517482, "epoch": 6234} {"train_loss": -27.092512130737305, "global_step": 517483, "epoch": 6234} {"train_loss": -27.370695114135742, "global_step": 517484, "epoch": 6234} {"train_loss": -27.1009521484375, "global_step": 517485, "epoch": 6234} {"train_loss": -27.293323516845703, "global_step": 517486, "epoch": 6234} {"train_loss": -27.327001571655273, "global_step": 517487, "epoch": 6234} {"train_loss": -27.402585983276367, "global_step": 517488, "epoch": 6234} {"train_loss": -27.468191146850586, "global_step": 517489, "epoch": 6234} {"train_loss": -27.4246768951416, "global_step": 517490, "epoch": 6234} {"train_loss": -27.75847816467285, "global_step": 517491, "epoch": 6234} {"train_loss": -27.41240882873535, "global_step": 517492, "epoch": 6234} {"train_loss": -27.65839958190918, "global_step": 517493, "epoch": 6234} {"train_loss": -27.405195236206055, "global_step": 517494, "epoch": 6234} {"train_loss": -27.574344635009766, "global_step": 517495, "epoch": 6234} {"train_loss": -27.410181045532227, "global_step": 517496, "epoch": 6234} {"train_loss": -27.472381591796875, "global_step": 517497, "epoch": 6234} {"train_loss": -27.313634872436523, "global_step": 517498, "epoch": 6234} {"train_loss": -27.171173095703125, "global_step": 517499, "epoch": 6234} {"train_loss": -27.48194694519043, "global_step": 517500, "epoch": 6234} {"train_loss": -27.338916778564453, "global_step": 517501, "epoch": 6234} {"train_loss": -27.654590606689453, "global_step": 517502, "epoch": 6234} {"train_loss": -27.47273063659668, "global_step": 517503, "epoch": 6234} {"train_loss": -27.30708843828684, "global_step": 517504, "epoch": 6234, "val_loss": 6613868.5} {"train_loss": -26.945056915283203, "global_step": 517505, "epoch": 6235} {"train_loss": -26.9686336517334, "global_step": 517506, "epoch": 6235} {"train_loss": -27.200809478759766, "global_step": 517507, "epoch": 6235} {"train_loss": -27.36138916015625, "global_step": 517508, "epoch": 6235} {"train_loss": -27.1916561126709, "global_step": 517509, "epoch": 6235} {"train_loss": -27.495569229125977, "global_step": 517510, "epoch": 6235} {"train_loss": -27.35996437072754, "global_step": 517511, "epoch": 6235} {"train_loss": -27.34564781188965, "global_step": 517512, "epoch": 6235} {"train_loss": -27.29512596130371, "global_step": 517513, "epoch": 6235} {"train_loss": -27.412811279296875, "global_step": 517514, "epoch": 6235} {"train_loss": -27.51071548461914, "global_step": 517515, "epoch": 6235} {"train_loss": -27.269636154174805, "global_step": 517516, "epoch": 6235} {"train_loss": -26.794036865234375, "global_step": 517517, "epoch": 6235} {"train_loss": -26.72369384765625, "global_step": 517518, "epoch": 6235} {"train_loss": -26.87554359436035, "global_step": 517519, "epoch": 6235} {"train_loss": -27.26814079284668, "global_step": 517520, "epoch": 6235} {"train_loss": -27.194814682006836, "global_step": 517521, "epoch": 6235} {"train_loss": -27.081464767456055, "global_step": 517522, "epoch": 6235} {"train_loss": -27.216272354125977, "global_step": 517523, "epoch": 6235} {"train_loss": -27.675317764282227, "global_step": 517524, "epoch": 6235} {"train_loss": -27.236112594604492, "global_step": 517525, "epoch": 6235} {"train_loss": -27.343738555908203, "global_step": 517526, "epoch": 6235} {"train_loss": -27.58467674255371, "global_step": 517527, "epoch": 6235} {"train_loss": -27.586572647094727, "global_step": 517528, "epoch": 6235} {"train_loss": -27.043882369995117, "global_step": 517529, "epoch": 6235} {"train_loss": -27.339391708374023, "global_step": 517530, "epoch": 6235} {"train_loss": -27.482885360717773, "global_step": 517531, "epoch": 6235} {"train_loss": -27.78863525390625, "global_step": 517532, "epoch": 6235} {"train_loss": -27.3792724609375, "global_step": 517533, "epoch": 6235} {"train_loss": -27.588422775268555, "global_step": 517534, "epoch": 6235} {"train_loss": -27.472761154174805, "global_step": 517535, "epoch": 6235} {"train_loss": -27.796375274658203, "global_step": 517536, "epoch": 6235} {"train_loss": -27.54376220703125, "global_step": 517537, "epoch": 6235} {"train_loss": -27.472461700439453, "global_step": 517538, "epoch": 6235} {"train_loss": -27.645544052124023, "global_step": 517539, "epoch": 6235} {"train_loss": -27.391427993774414, "global_step": 517540, "epoch": 6235} {"train_loss": -27.766324996948242, "global_step": 517541, "epoch": 6235} {"train_loss": -27.876972198486328, "global_step": 517542, "epoch": 6235} {"train_loss": -27.645206451416016, "global_step": 517543, "epoch": 6235} {"train_loss": -27.4074764251709, "global_step": 517544, "epoch": 6235} {"train_loss": -27.51690673828125, "global_step": 517545, "epoch": 6235} {"train_loss": -27.69905662536621, "global_step": 517546, "epoch": 6235} {"train_loss": -27.5876522064209, "global_step": 517547, "epoch": 6235} {"train_loss": -27.315717697143555, "global_step": 517548, "epoch": 6235} {"train_loss": -27.43035888671875, "global_step": 517549, "epoch": 6235} {"train_loss": -27.307159423828125, "global_step": 517550, "epoch": 6235} {"train_loss": -27.250341415405273, "global_step": 517551, "epoch": 6235} {"train_loss": -27.93764305114746, "global_step": 517552, "epoch": 6235} {"train_loss": -27.7767276763916, "global_step": 517553, "epoch": 6235} {"train_loss": -27.27510643005371, "global_step": 517554, "epoch": 6235} {"train_loss": -27.426624298095703, "global_step": 517555, "epoch": 6235} {"train_loss": -26.861286163330078, "global_step": 517556, "epoch": 6235} {"train_loss": -27.720666885375977, "global_step": 517557, "epoch": 6235} {"train_loss": -27.338953018188477, "global_step": 517558, "epoch": 6235} {"train_loss": -27.17304039001465, "global_step": 517559, "epoch": 6235} {"train_loss": -27.590824127197266, "global_step": 517560, "epoch": 6235} {"train_loss": -27.373340606689453, "global_step": 517561, "epoch": 6235} {"train_loss": -26.97918128967285, "global_step": 517562, "epoch": 6235} {"train_loss": -27.46923828125, "global_step": 517563, "epoch": 6235} {"train_loss": -27.692279815673828, "global_step": 517564, "epoch": 6235} {"train_loss": -27.584915161132812, "global_step": 517565, "epoch": 6235} {"train_loss": -27.65713882446289, "global_step": 517566, "epoch": 6235} {"train_loss": -28.061756134033203, "global_step": 517567, "epoch": 6235} {"train_loss": -27.507688522338867, "global_step": 517568, "epoch": 6235} {"train_loss": -27.61862564086914, "global_step": 517569, "epoch": 6235} {"train_loss": -27.46100425720215, "global_step": 517570, "epoch": 6235} {"train_loss": -27.568387985229492, "global_step": 517571, "epoch": 6235} {"train_loss": -27.89948844909668, "global_step": 517572, "epoch": 6235} {"train_loss": -27.52092933654785, "global_step": 517573, "epoch": 6235} {"train_loss": -27.32222557067871, "global_step": 517574, "epoch": 6235} {"train_loss": -27.385034561157227, "global_step": 517575, "epoch": 6235} {"train_loss": -27.498620986938477, "global_step": 517576, "epoch": 6235} {"train_loss": -27.64715003967285, "global_step": 517577, "epoch": 6235} {"train_loss": -27.620807647705078, "global_step": 517578, "epoch": 6235} {"train_loss": -27.413801193237305, "global_step": 517579, "epoch": 6235} {"train_loss": -27.4988956451416, "global_step": 517580, "epoch": 6235} {"train_loss": -27.58979606628418, "global_step": 517581, "epoch": 6235} {"train_loss": -27.378524780273438, "global_step": 517582, "epoch": 6235} {"train_loss": -27.03968620300293, "global_step": 517583, "epoch": 6235} {"train_loss": -27.52020835876465, "global_step": 517584, "epoch": 6235} {"train_loss": -27.4739933013916, "global_step": 517585, "epoch": 6235} {"train_loss": -27.897489547729492, "global_step": 517586, "epoch": 6235} {"train_loss": -27.433801582060664, "global_step": 517587, "epoch": 6235, "val_loss": 6522594.0} {"train_loss": -24.682706832885742, "global_step": 517588, "epoch": 6236} {"train_loss": -22.352392196655273, "global_step": 517589, "epoch": 6236} {"train_loss": -25.31360626220703, "global_step": 517590, "epoch": 6236} {"train_loss": -26.217853546142578, "global_step": 517591, "epoch": 6236} {"train_loss": -25.578001022338867, "global_step": 517592, "epoch": 6236} {"train_loss": -26.531076431274414, "global_step": 517593, "epoch": 6236} {"train_loss": -26.644758224487305, "global_step": 517594, "epoch": 6236} {"train_loss": -26.43085289001465, "global_step": 517595, "epoch": 6236} {"train_loss": -26.501745223999023, "global_step": 517596, "epoch": 6236} {"train_loss": -26.404376983642578, "global_step": 517597, "epoch": 6236} {"train_loss": -26.240896224975586, "global_step": 517598, "epoch": 6236} {"train_loss": -26.901548385620117, "global_step": 517599, "epoch": 6236} {"train_loss": -26.429763793945312, "global_step": 517600, "epoch": 6236} {"train_loss": -26.961084365844727, "global_step": 517601, "epoch": 6236} {"train_loss": -26.5698299407959, "global_step": 517602, "epoch": 6236} {"train_loss": -27.175933837890625, "global_step": 517603, "epoch": 6236} {"train_loss": -26.932876586914062, "global_step": 517604, "epoch": 6236} {"train_loss": -26.91959571838379, "global_step": 517605, "epoch": 6236} {"train_loss": -26.7695255279541, "global_step": 517606, "epoch": 6236} {"train_loss": -26.900043487548828, "global_step": 517607, "epoch": 6236} {"train_loss": -27.45081901550293, "global_step": 517608, "epoch": 6236} {"train_loss": -26.691654205322266, "global_step": 517609, "epoch": 6236} {"train_loss": -27.284088134765625, "global_step": 517610, "epoch": 6236} {"train_loss": -26.645246505737305, "global_step": 517611, "epoch": 6236} {"train_loss": -27.2058048248291, "global_step": 517612, "epoch": 6236} {"train_loss": -27.43121910095215, "global_step": 517613, "epoch": 6236} {"train_loss": -27.579376220703125, "global_step": 517614, "epoch": 6236} {"train_loss": -26.9604434967041, "global_step": 517615, "epoch": 6236} {"train_loss": -26.970808029174805, "global_step": 517616, "epoch": 6236} {"train_loss": -27.30536460876465, "global_step": 517617, "epoch": 6236} {"train_loss": -27.55291748046875, "global_step": 517618, "epoch": 6236} {"train_loss": -26.961872100830078, "global_step": 517619, "epoch": 6236} {"train_loss": -27.185483932495117, "global_step": 517620, "epoch": 6236} {"train_loss": -27.271015167236328, "global_step": 517621, "epoch": 6236} {"train_loss": -27.259418487548828, "global_step": 517622, "epoch": 6236} {"train_loss": -26.89179801940918, "global_step": 517623, "epoch": 6236} {"train_loss": -27.150115966796875, "global_step": 517624, "epoch": 6236} {"train_loss": -27.224231719970703, "global_step": 517625, "epoch": 6236} {"train_loss": -27.298954010009766, "global_step": 517626, "epoch": 6236} {"train_loss": -26.84120750427246, "global_step": 517627, "epoch": 6236} {"train_loss": -27.496923446655273, "global_step": 517628, "epoch": 6236} {"train_loss": -27.67793083190918, "global_step": 517629, "epoch": 6236} {"train_loss": -27.069379806518555, "global_step": 517630, "epoch": 6236} {"train_loss": -27.337018966674805, "global_step": 517631, "epoch": 6236} {"train_loss": -27.101102828979492, "global_step": 517632, "epoch": 6236} {"train_loss": -27.39371109008789, "global_step": 517633, "epoch": 6236} {"train_loss": -27.344579696655273, "global_step": 517634, "epoch": 6236} {"train_loss": -26.97849464416504, "global_step": 517635, "epoch": 6236} {"train_loss": -27.0716495513916, "global_step": 517636, "epoch": 6236} {"train_loss": -27.99715232849121, "global_step": 517637, "epoch": 6236} {"train_loss": -27.505720138549805, "global_step": 517638, "epoch": 6236} {"train_loss": -27.308429718017578, "global_step": 517639, "epoch": 6236} {"train_loss": -27.395618438720703, "global_step": 517640, "epoch": 6236} {"train_loss": -27.512155532836914, "global_step": 517641, "epoch": 6236} {"train_loss": -27.608509063720703, "global_step": 517642, "epoch": 6236} {"train_loss": -27.482227325439453, "global_step": 517643, "epoch": 6236} {"train_loss": -27.874013900756836, "global_step": 517644, "epoch": 6236} {"train_loss": -27.520404815673828, "global_step": 517645, "epoch": 6236} {"train_loss": -27.18863868713379, "global_step": 517646, "epoch": 6236} {"train_loss": -27.402990341186523, "global_step": 517647, "epoch": 6236} {"train_loss": -27.635040283203125, "global_step": 517648, "epoch": 6236} {"train_loss": -27.371591567993164, "global_step": 517649, "epoch": 6236} {"train_loss": -27.359167098999023, "global_step": 517650, "epoch": 6236} {"train_loss": -27.336042404174805, "global_step": 517651, "epoch": 6236} {"train_loss": -26.931455612182617, "global_step": 517652, "epoch": 6236} {"train_loss": -27.248138427734375, "global_step": 517653, "epoch": 6236} {"train_loss": -27.172534942626953, "global_step": 517654, "epoch": 6236} {"train_loss": -27.66444969177246, "global_step": 517655, "epoch": 6236} {"train_loss": -27.394311904907227, "global_step": 517656, "epoch": 6236} {"train_loss": -27.23383903503418, "global_step": 517657, "epoch": 6236} {"train_loss": -27.134347915649414, "global_step": 517658, "epoch": 6236} {"train_loss": -27.233829498291016, "global_step": 517659, "epoch": 6236} {"train_loss": -27.90436363220215, "global_step": 517660, "epoch": 6236} {"train_loss": -27.527454376220703, "global_step": 517661, "epoch": 6236} {"train_loss": -27.391571044921875, "global_step": 517662, "epoch": 6236} {"train_loss": -27.38612937927246, "global_step": 517663, "epoch": 6236} {"train_loss": -27.865543365478516, "global_step": 517664, "epoch": 6236} {"train_loss": -27.437026977539062, "global_step": 517665, "epoch": 6236} {"train_loss": -27.372833251953125, "global_step": 517666, "epoch": 6236} {"train_loss": -27.6146183013916, "global_step": 517667, "epoch": 6236} {"train_loss": -27.431188583374023, "global_step": 517668, "epoch": 6236} {"train_loss": -27.263296127319336, "global_step": 517669, "epoch": 6236} {"train_loss": -27.06845593739705, "global_step": 517670, "epoch": 6236, "val_loss": 6615018.0} {"train_loss": -26.660367965698242, "global_step": 517671, "epoch": 6237} {"train_loss": -27.3507022857666, "global_step": 517672, "epoch": 6237} {"train_loss": -26.741287231445312, "global_step": 517673, "epoch": 6237} {"train_loss": -26.78506851196289, "global_step": 517674, "epoch": 6237} {"train_loss": -26.69723892211914, "global_step": 517675, "epoch": 6237} {"train_loss": -27.28241539001465, "global_step": 517676, "epoch": 6237} {"train_loss": -26.7557430267334, "global_step": 517677, "epoch": 6237} {"train_loss": -27.359912872314453, "global_step": 517678, "epoch": 6237} {"train_loss": -27.161191940307617, "global_step": 517679, "epoch": 6237} {"train_loss": -27.240310668945312, "global_step": 517680, "epoch": 6237} {"train_loss": -27.087738037109375, "global_step": 517681, "epoch": 6237} {"train_loss": -27.665922164916992, "global_step": 517682, "epoch": 6237} {"train_loss": -27.220678329467773, "global_step": 517683, "epoch": 6237} {"train_loss": -26.759479522705078, "global_step": 517684, "epoch": 6237} {"train_loss": -27.337820053100586, "global_step": 517685, "epoch": 6237} {"train_loss": -27.711750030517578, "global_step": 517686, "epoch": 6237} {"train_loss": -27.449359893798828, "global_step": 517687, "epoch": 6237} {"train_loss": -27.090478897094727, "global_step": 517688, "epoch": 6237} {"train_loss": -27.343408584594727, "global_step": 517689, "epoch": 6237} {"train_loss": -27.4285831451416, "global_step": 517690, "epoch": 6237} {"train_loss": -27.2738037109375, "global_step": 517691, "epoch": 6237} {"train_loss": -27.696928024291992, "global_step": 517692, "epoch": 6237} {"train_loss": -27.362323760986328, "global_step": 517693, "epoch": 6237} {"train_loss": -27.326623916625977, "global_step": 517694, "epoch": 6237} {"train_loss": -27.483631134033203, "global_step": 517695, "epoch": 6237} {"train_loss": -27.265344619750977, "global_step": 517696, "epoch": 6237} {"train_loss": -27.4359130859375, "global_step": 517697, "epoch": 6237} {"train_loss": -27.442554473876953, "global_step": 517698, "epoch": 6237} {"train_loss": -27.222076416015625, "global_step": 517699, "epoch": 6237} {"train_loss": -27.61366081237793, "global_step": 517700, "epoch": 6237} {"train_loss": -27.194910049438477, "global_step": 517701, "epoch": 6237} {"train_loss": -27.560230255126953, "global_step": 517702, "epoch": 6237} {"train_loss": -27.687519073486328, "global_step": 517703, "epoch": 6237} {"train_loss": -27.46087074279785, "global_step": 517704, "epoch": 6237} {"train_loss": -27.662206649780273, "global_step": 517705, "epoch": 6237} {"train_loss": -27.34641456604004, "global_step": 517706, "epoch": 6237} {"train_loss": -27.67947769165039, "global_step": 517707, "epoch": 6237} {"train_loss": -27.80010986328125, "global_step": 517708, "epoch": 6237} {"train_loss": -27.7459659576416, "global_step": 517709, "epoch": 6237} {"train_loss": -27.725345611572266, "global_step": 517710, "epoch": 6237} {"train_loss": -27.35088539123535, "global_step": 517711, "epoch": 6237} {"train_loss": -27.420934677124023, "global_step": 517712, "epoch": 6237} {"train_loss": -27.50577163696289, "global_step": 517713, "epoch": 6237} {"train_loss": -27.805761337280273, "global_step": 517714, "epoch": 6237} {"train_loss": -27.4585018157959, "global_step": 517715, "epoch": 6237} {"train_loss": -27.89617919921875, "global_step": 517716, "epoch": 6237} {"train_loss": -27.788732528686523, "global_step": 517717, "epoch": 6237} {"train_loss": -27.487363815307617, "global_step": 517718, "epoch": 6237} {"train_loss": -27.394611358642578, "global_step": 517719, "epoch": 6237} {"train_loss": -27.75162124633789, "global_step": 517720, "epoch": 6237} {"train_loss": -27.833423614501953, "global_step": 517721, "epoch": 6237} {"train_loss": -27.477697372436523, "global_step": 517722, "epoch": 6237} {"train_loss": -27.579442977905273, "global_step": 517723, "epoch": 6237} {"train_loss": -27.07046890258789, "global_step": 517724, "epoch": 6237} {"train_loss": -27.41962242126465, "global_step": 517725, "epoch": 6237} {"train_loss": -27.602087020874023, "global_step": 517726, "epoch": 6237} {"train_loss": -28.12420082092285, "global_step": 517727, "epoch": 6237} {"train_loss": -27.1752872467041, "global_step": 517728, "epoch": 6237} {"train_loss": -27.2592716217041, "global_step": 517729, "epoch": 6237} {"train_loss": -27.56024742126465, "global_step": 517730, "epoch": 6237} {"train_loss": -27.081518173217773, "global_step": 517731, "epoch": 6237} {"train_loss": -26.791738510131836, "global_step": 517732, "epoch": 6237} {"train_loss": -26.816619873046875, "global_step": 517733, "epoch": 6237} {"train_loss": -26.90888023376465, "global_step": 517734, "epoch": 6237} {"train_loss": -27.4847412109375, "global_step": 517735, "epoch": 6237} {"train_loss": -26.954038619995117, "global_step": 517736, "epoch": 6237} {"train_loss": -26.961139678955078, "global_step": 517737, "epoch": 6237} {"train_loss": -27.008893966674805, "global_step": 517738, "epoch": 6237} {"train_loss": -27.46819496154785, "global_step": 517739, "epoch": 6237} {"train_loss": -27.186309814453125, "global_step": 517740, "epoch": 6237} {"train_loss": -27.427616119384766, "global_step": 517741, "epoch": 6237} {"train_loss": -27.379552841186523, "global_step": 517742, "epoch": 6237} {"train_loss": -27.596359252929688, "global_step": 517743, "epoch": 6237} {"train_loss": -27.62873649597168, "global_step": 517744, "epoch": 6237} {"train_loss": -27.0498104095459, "global_step": 517745, "epoch": 6237} {"train_loss": -27.745147705078125, "global_step": 517746, "epoch": 6237} {"train_loss": -26.970901489257812, "global_step": 517747, "epoch": 6237} {"train_loss": -27.560937881469727, "global_step": 517748, "epoch": 6237} {"train_loss": -27.49053955078125, "global_step": 517749, "epoch": 6237} {"train_loss": -27.63368034362793, "global_step": 517750, "epoch": 6237} {"train_loss": -27.235736846923828, "global_step": 517751, "epoch": 6237} {"train_loss": -27.46156120300293, "global_step": 517752, "epoch": 6237} {"train_loss": -27.374776748289545, "global_step": 517753, "epoch": 6237, "val_loss": 6614597.0} {"train_loss": -27.1660213470459, "global_step": 517754, "epoch": 6238} {"train_loss": -27.127111434936523, "global_step": 517755, "epoch": 6238} {"train_loss": -27.44803237915039, "global_step": 517756, "epoch": 6238} {"train_loss": -27.19611930847168, "global_step": 517757, "epoch": 6238} {"train_loss": -27.4453125, "global_step": 517758, "epoch": 6238} {"train_loss": -26.94516372680664, "global_step": 517759, "epoch": 6238} {"train_loss": -27.46225357055664, "global_step": 517760, "epoch": 6238} {"train_loss": -27.36713218688965, "global_step": 517761, "epoch": 6238} {"train_loss": -27.218942642211914, "global_step": 517762, "epoch": 6238} {"train_loss": -27.16267967224121, "global_step": 517763, "epoch": 6238} {"train_loss": -27.55518913269043, "global_step": 517764, "epoch": 6238} {"train_loss": -27.21624183654785, "global_step": 517765, "epoch": 6238} {"train_loss": -27.356977462768555, "global_step": 517766, "epoch": 6238} {"train_loss": -27.62701416015625, "global_step": 517767, "epoch": 6238} {"train_loss": -27.591461181640625, "global_step": 517768, "epoch": 6238} {"train_loss": -27.777481079101562, "global_step": 517769, "epoch": 6238} {"train_loss": -27.743371963500977, "global_step": 517770, "epoch": 6238} {"train_loss": -27.408313751220703, "global_step": 517771, "epoch": 6238} {"train_loss": -27.216583251953125, "global_step": 517772, "epoch": 6238} {"train_loss": -27.85406494140625, "global_step": 517773, "epoch": 6238} {"train_loss": -27.278676986694336, "global_step": 517774, "epoch": 6238} {"train_loss": -27.707778930664062, "global_step": 517775, "epoch": 6238} {"train_loss": -27.758197784423828, "global_step": 517776, "epoch": 6238} {"train_loss": -27.701404571533203, "global_step": 517777, "epoch": 6238} {"train_loss": -27.8702335357666, "global_step": 517778, "epoch": 6238} {"train_loss": -27.79107666015625, "global_step": 517779, "epoch": 6238} {"train_loss": -27.741073608398438, "global_step": 517780, "epoch": 6238} {"train_loss": -27.94520378112793, "global_step": 517781, "epoch": 6238} {"train_loss": -27.699249267578125, "global_step": 517782, "epoch": 6238} {"train_loss": -27.650482177734375, "global_step": 517783, "epoch": 6238} {"train_loss": -27.734317779541016, "global_step": 517784, "epoch": 6238} {"train_loss": -27.397043228149414, "global_step": 517785, "epoch": 6238} {"train_loss": -27.70704460144043, "global_step": 517786, "epoch": 6238} {"train_loss": -27.735788345336914, "global_step": 517787, "epoch": 6238} {"train_loss": -27.290985107421875, "global_step": 517788, "epoch": 6238} {"train_loss": -27.067960739135742, "global_step": 517789, "epoch": 6238} {"train_loss": -27.047910690307617, "global_step": 517790, "epoch": 6238} {"train_loss": -26.708524703979492, "global_step": 517791, "epoch": 6238} {"train_loss": -27.042463302612305, "global_step": 517792, "epoch": 6238} {"train_loss": -26.82962417602539, "global_step": 517793, "epoch": 6238} {"train_loss": -27.01148796081543, "global_step": 517794, "epoch": 6238} {"train_loss": -26.827051162719727, "global_step": 517795, "epoch": 6238} {"train_loss": -26.956811904907227, "global_step": 517796, "epoch": 6238} {"train_loss": -27.3696231842041, "global_step": 517797, "epoch": 6238} {"train_loss": -27.80328941345215, "global_step": 517798, "epoch": 6238} {"train_loss": -26.78818130493164, "global_step": 517799, "epoch": 6238} {"train_loss": -27.631641387939453, "global_step": 517800, "epoch": 6238} {"train_loss": -27.47065544128418, "global_step": 517801, "epoch": 6238} {"train_loss": -27.025251388549805, "global_step": 517802, "epoch": 6238} {"train_loss": -27.1191349029541, "global_step": 517803, "epoch": 6238} {"train_loss": -27.28396987915039, "global_step": 517804, "epoch": 6238} {"train_loss": -27.1740665435791, "global_step": 517805, "epoch": 6238} {"train_loss": -27.091022491455078, "global_step": 517806, "epoch": 6238} {"train_loss": -27.28741455078125, "global_step": 517807, "epoch": 6238} {"train_loss": -27.362995147705078, "global_step": 517808, "epoch": 6238} {"train_loss": -27.551349639892578, "global_step": 517809, "epoch": 6238} {"train_loss": -27.53739356994629, "global_step": 517810, "epoch": 6238} {"train_loss": -27.427148818969727, "global_step": 517811, "epoch": 6238} {"train_loss": -27.31879997253418, "global_step": 517812, "epoch": 6238} {"train_loss": -27.846527099609375, "global_step": 517813, "epoch": 6238} {"train_loss": -27.584630966186523, "global_step": 517814, "epoch": 6238} {"train_loss": -27.519681930541992, "global_step": 517815, "epoch": 6238} {"train_loss": -27.520444869995117, "global_step": 517816, "epoch": 6238} {"train_loss": -27.624256134033203, "global_step": 517817, "epoch": 6238} {"train_loss": -27.73785972595215, "global_step": 517818, "epoch": 6238} {"train_loss": -27.64295768737793, "global_step": 517819, "epoch": 6238} {"train_loss": -27.20281982421875, "global_step": 517820, "epoch": 6238} {"train_loss": -27.641162872314453, "global_step": 517821, "epoch": 6238} {"train_loss": -27.82172966003418, "global_step": 517822, "epoch": 6238} {"train_loss": -27.31473731994629, "global_step": 517823, "epoch": 6238} {"train_loss": -27.52597427368164, "global_step": 517824, "epoch": 6238} {"train_loss": -27.425275802612305, "global_step": 517825, "epoch": 6238} {"train_loss": -27.479787826538086, "global_step": 517826, "epoch": 6238} {"train_loss": -27.791440963745117, "global_step": 517827, "epoch": 6238} {"train_loss": -27.700546264648438, "global_step": 517828, "epoch": 6238} {"train_loss": -27.686120986938477, "global_step": 517829, "epoch": 6238} {"train_loss": -27.618215560913086, "global_step": 517830, "epoch": 6238} {"train_loss": -27.48223876953125, "global_step": 517831, "epoch": 6238} {"train_loss": -27.535444259643555, "global_step": 517832, "epoch": 6238} {"train_loss": -27.581562042236328, "global_step": 517833, "epoch": 6238} {"train_loss": -27.787342071533203, "global_step": 517834, "epoch": 6238} {"train_loss": -27.34821891784668, "global_step": 517835, "epoch": 6238} {"train_loss": -27.442951891795698, "global_step": 517836, "epoch": 6238, "val_loss": 6600158.0} {"train_loss": -27.541711807250977, "global_step": 517837, "epoch": 6239} {"train_loss": -26.751697540283203, "global_step": 517838, "epoch": 6239} {"train_loss": -26.338300704956055, "global_step": 517839, "epoch": 6239} {"train_loss": -26.015594482421875, "global_step": 517840, "epoch": 6239} {"train_loss": -24.946603775024414, "global_step": 517841, "epoch": 6239} {"train_loss": -24.395795822143555, "global_step": 517842, "epoch": 6239} {"train_loss": -27.479333877563477, "global_step": 517843, "epoch": 6239} {"train_loss": -25.213180541992188, "global_step": 517844, "epoch": 6239} {"train_loss": -26.732648849487305, "global_step": 517845, "epoch": 6239} {"train_loss": -25.1112003326416, "global_step": 517846, "epoch": 6239} {"train_loss": -26.468658447265625, "global_step": 517847, "epoch": 6239} {"train_loss": -25.47597312927246, "global_step": 517848, "epoch": 6239} {"train_loss": -26.519948959350586, "global_step": 517849, "epoch": 6239} {"train_loss": -26.823652267456055, "global_step": 517850, "epoch": 6239} {"train_loss": -25.57474136352539, "global_step": 517851, "epoch": 6239} {"train_loss": -26.991790771484375, "global_step": 517852, "epoch": 6239} {"train_loss": -26.478139877319336, "global_step": 517853, "epoch": 6239} {"train_loss": -26.5892391204834, "global_step": 517854, "epoch": 6239} {"train_loss": -26.520130157470703, "global_step": 517855, "epoch": 6239} {"train_loss": -26.7825870513916, "global_step": 517856, "epoch": 6239} {"train_loss": -26.845243453979492, "global_step": 517857, "epoch": 6239} {"train_loss": -27.26629638671875, "global_step": 517858, "epoch": 6239} {"train_loss": -27.13335609436035, "global_step": 517859, "epoch": 6239} {"train_loss": -27.28460693359375, "global_step": 517860, "epoch": 6239} {"train_loss": -27.139474868774414, "global_step": 517861, "epoch": 6239} {"train_loss": -27.267847061157227, "global_step": 517862, "epoch": 6239} {"train_loss": -26.962345123291016, "global_step": 517863, "epoch": 6239} {"train_loss": -27.295923233032227, "global_step": 517864, "epoch": 6239} {"train_loss": -27.08998680114746, "global_step": 517865, "epoch": 6239} {"train_loss": -26.982629776000977, "global_step": 517866, "epoch": 6239} {"train_loss": -26.95529556274414, "global_step": 517867, "epoch": 6239} {"train_loss": -27.30033302307129, "global_step": 517868, "epoch": 6239} {"train_loss": -26.995283126831055, "global_step": 517869, "epoch": 6239} {"train_loss": -27.22269630432129, "global_step": 517870, "epoch": 6239} {"train_loss": -27.18414878845215, "global_step": 517871, "epoch": 6239} {"train_loss": -27.01651382446289, "global_step": 517872, "epoch": 6239} {"train_loss": -27.45545768737793, "global_step": 517873, "epoch": 6239} {"train_loss": -27.217443466186523, "global_step": 517874, "epoch": 6239} {"train_loss": -27.417898178100586, "global_step": 517875, "epoch": 6239} {"train_loss": -27.2117919921875, "global_step": 517876, "epoch": 6239} {"train_loss": -27.373626708984375, "global_step": 517877, "epoch": 6239} {"train_loss": -27.07118034362793, "global_step": 517878, "epoch": 6239} {"train_loss": -27.473051071166992, "global_step": 517879, "epoch": 6239} {"train_loss": -27.387311935424805, "global_step": 517880, "epoch": 6239} {"train_loss": -27.256336212158203, "global_step": 517881, "epoch": 6239} {"train_loss": -27.630781173706055, "global_step": 517882, "epoch": 6239} {"train_loss": -27.680866241455078, "global_step": 517883, "epoch": 6239} {"train_loss": -27.749216079711914, "global_step": 517884, "epoch": 6239} {"train_loss": -27.73975944519043, "global_step": 517885, "epoch": 6239} {"train_loss": -27.660552978515625, "global_step": 517886, "epoch": 6239} {"train_loss": -27.412311553955078, "global_step": 517887, "epoch": 6239} {"train_loss": -27.863479614257812, "global_step": 517888, "epoch": 6239} {"train_loss": -27.27484703063965, "global_step": 517889, "epoch": 6239} {"train_loss": -27.865625381469727, "global_step": 517890, "epoch": 6239} {"train_loss": -27.48138999938965, "global_step": 517891, "epoch": 6239} {"train_loss": -27.773191452026367, "global_step": 517892, "epoch": 6239} {"train_loss": -27.580276489257812, "global_step": 517893, "epoch": 6239} {"train_loss": -26.775161743164062, "global_step": 517894, "epoch": 6239} {"train_loss": -26.946990966796875, "global_step": 517895, "epoch": 6239} {"train_loss": -27.58167839050293, "global_step": 517896, "epoch": 6239} {"train_loss": -26.967090606689453, "global_step": 517897, "epoch": 6239} {"train_loss": -26.927337646484375, "global_step": 517898, "epoch": 6239} {"train_loss": -27.56757926940918, "global_step": 517899, "epoch": 6239} {"train_loss": -27.30226707458496, "global_step": 517900, "epoch": 6239} {"train_loss": -27.047082901000977, "global_step": 517901, "epoch": 6239} {"train_loss": -27.310998916625977, "global_step": 517902, "epoch": 6239} {"train_loss": -26.775785446166992, "global_step": 517903, "epoch": 6239} {"train_loss": -27.514875411987305, "global_step": 517904, "epoch": 6239} {"train_loss": -27.345966339111328, "global_step": 517905, "epoch": 6239} {"train_loss": -26.554214477539062, "global_step": 517906, "epoch": 6239} {"train_loss": -27.0629825592041, "global_step": 517907, "epoch": 6239} {"train_loss": -27.318334579467773, "global_step": 517908, "epoch": 6239} {"train_loss": -27.511581420898438, "global_step": 517909, "epoch": 6239} {"train_loss": -26.97538185119629, "global_step": 517910, "epoch": 6239} {"train_loss": -27.50913429260254, "global_step": 517911, "epoch": 6239} {"train_loss": -27.402761459350586, "global_step": 517912, "epoch": 6239} {"train_loss": -27.92926597595215, "global_step": 517913, "epoch": 6239} {"train_loss": -27.526716232299805, "global_step": 517914, "epoch": 6239} {"train_loss": -27.291440963745117, "global_step": 517915, "epoch": 6239} {"train_loss": -27.185773849487305, "global_step": 517916, "epoch": 6239} {"train_loss": -27.352895736694336, "global_step": 517917, "epoch": 6239} {"train_loss": -26.83235740661621, "global_step": 517918, "epoch": 6239} {"train_loss": -27.052221987620893, "global_step": 517919, "epoch": 6239, "val_loss": 6562842.0} {"train_loss": -26.5462646484375, "global_step": 517920, "epoch": 6240} {"train_loss": -26.887155532836914, "global_step": 517921, "epoch": 6240} {"train_loss": -26.575231552124023, "global_step": 517922, "epoch": 6240} {"train_loss": -26.822193145751953, "global_step": 517923, "epoch": 6240} {"train_loss": -26.823408126831055, "global_step": 517924, "epoch": 6240} {"train_loss": -27.058643341064453, "global_step": 517925, "epoch": 6240} {"train_loss": -27.046926498413086, "global_step": 517926, "epoch": 6240} {"train_loss": -27.04191017150879, "global_step": 517927, "epoch": 6240} {"train_loss": -27.06685447692871, "global_step": 517928, "epoch": 6240} {"train_loss": -27.341999053955078, "global_step": 517929, "epoch": 6240} {"train_loss": -26.839542388916016, "global_step": 517930, "epoch": 6240} {"train_loss": -26.97791862487793, "global_step": 517931, "epoch": 6240} {"train_loss": -27.128461837768555, "global_step": 517932, "epoch": 6240} {"train_loss": -27.07708740234375, "global_step": 517933, "epoch": 6240} {"train_loss": -27.13886070251465, "global_step": 517934, "epoch": 6240} {"train_loss": -27.343496322631836, "global_step": 517935, "epoch": 6240} {"train_loss": -27.085546493530273, "global_step": 517936, "epoch": 6240} {"train_loss": -27.7607364654541, "global_step": 517937, "epoch": 6240} {"train_loss": -27.443368911743164, "global_step": 517938, "epoch": 6240} {"train_loss": -27.29315185546875, "global_step": 517939, "epoch": 6240} {"train_loss": -27.354736328125, "global_step": 517940, "epoch": 6240} {"train_loss": -27.332670211791992, "global_step": 517941, "epoch": 6240} {"train_loss": -27.1885929107666, "global_step": 517942, "epoch": 6240} {"train_loss": -27.39495277404785, "global_step": 517943, "epoch": 6240} {"train_loss": -27.764972686767578, "global_step": 517944, "epoch": 6240} {"train_loss": -27.645200729370117, "global_step": 517945, "epoch": 6240} {"train_loss": -27.248401641845703, "global_step": 517946, "epoch": 6240} {"train_loss": -27.41314125061035, "global_step": 517947, "epoch": 6240} {"train_loss": -27.709211349487305, "global_step": 517948, "epoch": 6240} {"train_loss": -27.6804141998291, "global_step": 517949, "epoch": 6240} {"train_loss": -27.69919776916504, "global_step": 517950, "epoch": 6240} {"train_loss": -27.4778995513916, "global_step": 517951, "epoch": 6240} {"train_loss": -27.749155044555664, "global_step": 517952, "epoch": 6240} {"train_loss": -27.591379165649414, "global_step": 517953, "epoch": 6240} {"train_loss": -27.503021240234375, "global_step": 517954, "epoch": 6240} {"train_loss": -27.70545768737793, "global_step": 517955, "epoch": 6240} {"train_loss": -27.68918228149414, "global_step": 517956, "epoch": 6240} {"train_loss": -27.843027114868164, "global_step": 517957, "epoch": 6240} {"train_loss": -27.12678337097168, "global_step": 517958, "epoch": 6240} {"train_loss": -27.660873413085938, "global_step": 517959, "epoch": 6240} {"train_loss": -27.50827407836914, "global_step": 517960, "epoch": 6240} {"train_loss": -27.6228084564209, "global_step": 517961, "epoch": 6240} {"train_loss": -27.747190475463867, "global_step": 517962, "epoch": 6240} {"train_loss": -27.60105323791504, "global_step": 517963, "epoch": 6240} {"train_loss": -27.605960845947266, "global_step": 517964, "epoch": 6240} {"train_loss": -27.840993881225586, "global_step": 517965, "epoch": 6240} {"train_loss": -27.6035099029541, "global_step": 517966, "epoch": 6240} {"train_loss": -28.0118350982666, "global_step": 517967, "epoch": 6240} {"train_loss": -27.66431999206543, "global_step": 517968, "epoch": 6240} {"train_loss": -27.31402015686035, "global_step": 517969, "epoch": 6240} {"train_loss": -27.753692626953125, "global_step": 517970, "epoch": 6240} {"train_loss": -28.147357940673828, "global_step": 517971, "epoch": 6240} {"train_loss": -27.6577091217041, "global_step": 517972, "epoch": 6240} {"train_loss": -27.480972290039062, "global_step": 517973, "epoch": 6240} {"train_loss": -26.989465713500977, "global_step": 517974, "epoch": 6240} {"train_loss": -27.52204704284668, "global_step": 517975, "epoch": 6240} {"train_loss": -27.64446449279785, "global_step": 517976, "epoch": 6240} {"train_loss": -27.455820083618164, "global_step": 517977, "epoch": 6240} {"train_loss": -27.59673500061035, "global_step": 517978, "epoch": 6240} {"train_loss": -27.569116592407227, "global_step": 517979, "epoch": 6240} {"train_loss": -27.673450469970703, "global_step": 517980, "epoch": 6240} {"train_loss": -27.59469985961914, "global_step": 517981, "epoch": 6240} {"train_loss": -27.560728073120117, "global_step": 517982, "epoch": 6240} {"train_loss": -27.888025283813477, "global_step": 517983, "epoch": 6240} {"train_loss": -27.54006004333496, "global_step": 517984, "epoch": 6240} {"train_loss": -27.839704513549805, "global_step": 517985, "epoch": 6240} {"train_loss": -27.509998321533203, "global_step": 517986, "epoch": 6240} {"train_loss": -27.508207321166992, "global_step": 517987, "epoch": 6240} {"train_loss": -27.666227340698242, "global_step": 517988, "epoch": 6240} {"train_loss": -27.883840560913086, "global_step": 517989, "epoch": 6240} {"train_loss": -27.165435791015625, "global_step": 517990, "epoch": 6240} {"train_loss": -27.288198471069336, "global_step": 517991, "epoch": 6240} {"train_loss": -26.983301162719727, "global_step": 517992, "epoch": 6240} {"train_loss": -27.0283145904541, "global_step": 517993, "epoch": 6240} {"train_loss": -27.368045806884766, "global_step": 517994, "epoch": 6240} {"train_loss": -27.65553092956543, "global_step": 517995, "epoch": 6240} {"train_loss": -27.17807388305664, "global_step": 517996, "epoch": 6240} {"train_loss": -27.498077392578125, "global_step": 517997, "epoch": 6240} {"train_loss": -27.342710494995117, "global_step": 517998, "epoch": 6240} {"train_loss": -27.237913131713867, "global_step": 517999, "epoch": 6240} {"train_loss": -27.584980010986328, "global_step": 518000, "epoch": 6240} {"train_loss": -27.628870010375977, "global_step": 518001, "epoch": 6240} {"train_loss": -27.424835365938854, "global_step": 518002, "epoch": 6240, "val_loss": 6554855.0} {"train_loss": -26.44758415222168, "global_step": 518003, "epoch": 6241} {"train_loss": -26.49454116821289, "global_step": 518004, "epoch": 6241} {"train_loss": -26.817996978759766, "global_step": 518005, "epoch": 6241} {"train_loss": -26.58540153503418, "global_step": 518006, "epoch": 6241} {"train_loss": -27.094970703125, "global_step": 518007, "epoch": 6241} {"train_loss": -26.89519691467285, "global_step": 518008, "epoch": 6241} {"train_loss": -26.910552978515625, "global_step": 518009, "epoch": 6241} {"train_loss": -27.24749755859375, "global_step": 518010, "epoch": 6241} {"train_loss": -26.310693740844727, "global_step": 518011, "epoch": 6241} {"train_loss": -26.891738891601562, "global_step": 518012, "epoch": 6241} {"train_loss": -27.54043960571289, "global_step": 518013, "epoch": 6241} {"train_loss": -26.968664169311523, "global_step": 518014, "epoch": 6241} {"train_loss": -27.092151641845703, "global_step": 518015, "epoch": 6241} {"train_loss": -26.686445236206055, "global_step": 518016, "epoch": 6241} {"train_loss": -26.937368392944336, "global_step": 518017, "epoch": 6241} {"train_loss": -27.314722061157227, "global_step": 518018, "epoch": 6241} {"train_loss": -27.113250732421875, "global_step": 518019, "epoch": 6241} {"train_loss": -27.2115478515625, "global_step": 518020, "epoch": 6241} {"train_loss": -27.0360164642334, "global_step": 518021, "epoch": 6241} {"train_loss": -27.395273208618164, "global_step": 518022, "epoch": 6241} {"train_loss": -27.344635009765625, "global_step": 518023, "epoch": 6241} {"train_loss": -27.25421714782715, "global_step": 518024, "epoch": 6241} {"train_loss": -27.59695816040039, "global_step": 518025, "epoch": 6241} {"train_loss": -27.644636154174805, "global_step": 518026, "epoch": 6241} {"train_loss": -27.41509437561035, "global_step": 518027, "epoch": 6241} {"train_loss": -27.59406852722168, "global_step": 518028, "epoch": 6241} {"train_loss": -26.95222282409668, "global_step": 518029, "epoch": 6241} {"train_loss": -27.570331573486328, "global_step": 518030, "epoch": 6241} {"train_loss": -27.29499626159668, "global_step": 518031, "epoch": 6241} {"train_loss": -27.403207778930664, "global_step": 518032, "epoch": 6241} {"train_loss": -27.217121124267578, "global_step": 518033, "epoch": 6241} {"train_loss": -27.695276260375977, "global_step": 518034, "epoch": 6241} {"train_loss": -27.450881958007812, "global_step": 518035, "epoch": 6241} {"train_loss": -27.4998779296875, "global_step": 518036, "epoch": 6241} {"train_loss": -27.3765811920166, "global_step": 518037, "epoch": 6241} {"train_loss": -27.75868797302246, "global_step": 518038, "epoch": 6241} {"train_loss": -27.662353515625, "global_step": 518039, "epoch": 6241} {"train_loss": -27.7357177734375, "global_step": 518040, "epoch": 6241} {"train_loss": -27.37888526916504, "global_step": 518041, "epoch": 6241} {"train_loss": -27.759185791015625, "global_step": 518042, "epoch": 6241} {"train_loss": -27.47357749938965, "global_step": 518043, "epoch": 6241} {"train_loss": -27.47503089904785, "global_step": 518044, "epoch": 6241} {"train_loss": -27.815046310424805, "global_step": 518045, "epoch": 6241} {"train_loss": -27.576932907104492, "global_step": 518046, "epoch": 6241} {"train_loss": -27.93170738220215, "global_step": 518047, "epoch": 6241} {"train_loss": -27.705480575561523, "global_step": 518048, "epoch": 6241} {"train_loss": -27.834508895874023, "global_step": 518049, "epoch": 6241} {"train_loss": -27.7325496673584, "global_step": 518050, "epoch": 6241} {"train_loss": -27.691190719604492, "global_step": 518051, "epoch": 6241} {"train_loss": -27.61005973815918, "global_step": 518052, "epoch": 6241} {"train_loss": -27.665075302124023, "global_step": 518053, "epoch": 6241} {"train_loss": -27.12310218811035, "global_step": 518054, "epoch": 6241} {"train_loss": -27.75813102722168, "global_step": 518055, "epoch": 6241} {"train_loss": -27.88210105895996, "global_step": 518056, "epoch": 6241} {"train_loss": -27.7303466796875, "global_step": 518057, "epoch": 6241} {"train_loss": -27.8367862701416, "global_step": 518058, "epoch": 6241} {"train_loss": -27.491809844970703, "global_step": 518059, "epoch": 6241} {"train_loss": -27.42677879333496, "global_step": 518060, "epoch": 6241} {"train_loss": -27.475263595581055, "global_step": 518061, "epoch": 6241} {"train_loss": -27.787214279174805, "global_step": 518062, "epoch": 6241} {"train_loss": -27.84381103515625, "global_step": 518063, "epoch": 6241} {"train_loss": -27.85257339477539, "global_step": 518064, "epoch": 6241} {"train_loss": -27.426055908203125, "global_step": 518065, "epoch": 6241} {"train_loss": -27.601165771484375, "global_step": 518066, "epoch": 6241} {"train_loss": -27.635679244995117, "global_step": 518067, "epoch": 6241} {"train_loss": -28.01515007019043, "global_step": 518068, "epoch": 6241} {"train_loss": -27.31744384765625, "global_step": 518069, "epoch": 6241} {"train_loss": -27.874027252197266, "global_step": 518070, "epoch": 6241} {"train_loss": -27.74070167541504, "global_step": 518071, "epoch": 6241} {"train_loss": -27.287939071655273, "global_step": 518072, "epoch": 6241} {"train_loss": -27.57415771484375, "global_step": 518073, "epoch": 6241} {"train_loss": -26.9273624420166, "global_step": 518074, "epoch": 6241} {"train_loss": -26.96803092956543, "global_step": 518075, "epoch": 6241} {"train_loss": -27.03742027282715, "global_step": 518076, "epoch": 6241} {"train_loss": -27.47076416015625, "global_step": 518077, "epoch": 6241} {"train_loss": -27.400741577148438, "global_step": 518078, "epoch": 6241} {"train_loss": -27.2828369140625, "global_step": 518079, "epoch": 6241} {"train_loss": -27.029769897460938, "global_step": 518080, "epoch": 6241} {"train_loss": -27.48015785217285, "global_step": 518081, "epoch": 6241} {"train_loss": -27.455961227416992, "global_step": 518082, "epoch": 6241} {"train_loss": -26.8854923248291, "global_step": 518083, "epoch": 6241} {"train_loss": -26.940038681030273, "global_step": 518084, "epoch": 6241} {"train_loss": -27.370597241872765, "global_step": 518085, "epoch": 6241, "val_loss": 6578674.0} {"train_loss": -26.595312118530273, "global_step": 518086, "epoch": 6242} {"train_loss": -25.590402603149414, "global_step": 518087, "epoch": 6242} {"train_loss": -26.1577205657959, "global_step": 518088, "epoch": 6242} {"train_loss": -26.879810333251953, "global_step": 518089, "epoch": 6242} {"train_loss": -26.14405632019043, "global_step": 518090, "epoch": 6242} {"train_loss": -26.5313777923584, "global_step": 518091, "epoch": 6242} {"train_loss": -26.89676856994629, "global_step": 518092, "epoch": 6242} {"train_loss": -27.078039169311523, "global_step": 518093, "epoch": 6242} {"train_loss": -26.71784019470215, "global_step": 518094, "epoch": 6242} {"train_loss": -27.259679794311523, "global_step": 518095, "epoch": 6242} {"train_loss": -26.744068145751953, "global_step": 518096, "epoch": 6242} {"train_loss": -27.2474308013916, "global_step": 518097, "epoch": 6242} {"train_loss": -26.882970809936523, "global_step": 518098, "epoch": 6242} {"train_loss": -26.948537826538086, "global_step": 518099, "epoch": 6242} {"train_loss": -26.712255477905273, "global_step": 518100, "epoch": 6242} {"train_loss": -27.2576904296875, "global_step": 518101, "epoch": 6242} {"train_loss": -27.0986328125, "global_step": 518102, "epoch": 6242} {"train_loss": -26.903539657592773, "global_step": 518103, "epoch": 6242} {"train_loss": -27.050647735595703, "global_step": 518104, "epoch": 6242} {"train_loss": -27.393421173095703, "global_step": 518105, "epoch": 6242} {"train_loss": -27.296142578125, "global_step": 518106, "epoch": 6242} {"train_loss": -27.354511260986328, "global_step": 518107, "epoch": 6242} {"train_loss": -27.090961456298828, "global_step": 518108, "epoch": 6242} {"train_loss": -27.21538734436035, "global_step": 518109, "epoch": 6242} {"train_loss": -27.730085372924805, "global_step": 518110, "epoch": 6242} {"train_loss": -27.676538467407227, "global_step": 518111, "epoch": 6242} {"train_loss": -27.040067672729492, "global_step": 518112, "epoch": 6242} {"train_loss": -27.383102416992188, "global_step": 518113, "epoch": 6242} {"train_loss": -27.62855339050293, "global_step": 518114, "epoch": 6242} {"train_loss": -27.562192916870117, "global_step": 518115, "epoch": 6242} {"train_loss": -27.490631103515625, "global_step": 518116, "epoch": 6242} {"train_loss": -27.665205001831055, "global_step": 518117, "epoch": 6242} {"train_loss": -27.790735244750977, "global_step": 518118, "epoch": 6242} {"train_loss": -27.446578979492188, "global_step": 518119, "epoch": 6242} {"train_loss": -27.839950561523438, "global_step": 518120, "epoch": 6242} {"train_loss": -27.600290298461914, "global_step": 518121, "epoch": 6242} {"train_loss": -27.1596736907959, "global_step": 518122, "epoch": 6242} {"train_loss": -27.97450065612793, "global_step": 518123, "epoch": 6242} {"train_loss": -27.231475830078125, "global_step": 518124, "epoch": 6242} {"train_loss": -27.169586181640625, "global_step": 518125, "epoch": 6242} {"train_loss": -27.722497940063477, "global_step": 518126, "epoch": 6242} {"train_loss": -27.87188720703125, "global_step": 518127, "epoch": 6242} {"train_loss": -27.68606948852539, "global_step": 518128, "epoch": 6242} {"train_loss": -27.724105834960938, "global_step": 518129, "epoch": 6242} {"train_loss": -27.44635009765625, "global_step": 518130, "epoch": 6242} {"train_loss": -27.795129776000977, "global_step": 518131, "epoch": 6242} {"train_loss": -27.80805778503418, "global_step": 518132, "epoch": 6242} {"train_loss": -27.599903106689453, "global_step": 518133, "epoch": 6242} {"train_loss": -27.814956665039062, "global_step": 518134, "epoch": 6242} {"train_loss": -27.53679847717285, "global_step": 518135, "epoch": 6242} {"train_loss": -27.64112663269043, "global_step": 518136, "epoch": 6242} {"train_loss": -27.817718505859375, "global_step": 518137, "epoch": 6242} {"train_loss": -27.52402687072754, "global_step": 518138, "epoch": 6242} {"train_loss": -28.23992347717285, "global_step": 518139, "epoch": 6242} {"train_loss": -28.274585723876953, "global_step": 518140, "epoch": 6242} {"train_loss": -27.33211326599121, "global_step": 518141, "epoch": 6242} {"train_loss": -27.573516845703125, "global_step": 518142, "epoch": 6242} {"train_loss": -27.466022491455078, "global_step": 518143, "epoch": 6242} {"train_loss": -27.53053092956543, "global_step": 518144, "epoch": 6242} {"train_loss": -27.546628952026367, "global_step": 518145, "epoch": 6242} {"train_loss": -27.733768463134766, "global_step": 518146, "epoch": 6242} {"train_loss": -27.269012451171875, "global_step": 518147, "epoch": 6242} {"train_loss": -27.40690040588379, "global_step": 518148, "epoch": 6242} {"train_loss": -27.485998153686523, "global_step": 518149, "epoch": 6242} {"train_loss": -27.731109619140625, "global_step": 518150, "epoch": 6242} {"train_loss": -27.22885513305664, "global_step": 518151, "epoch": 6242} {"train_loss": -27.495132446289062, "global_step": 518152, "epoch": 6242} {"train_loss": -26.991369247436523, "global_step": 518153, "epoch": 6242} {"train_loss": -26.844934463500977, "global_step": 518154, "epoch": 6242} {"train_loss": -26.684720993041992, "global_step": 518155, "epoch": 6242} {"train_loss": -27.396167755126953, "global_step": 518156, "epoch": 6242} {"train_loss": -27.85004997253418, "global_step": 518157, "epoch": 6242} {"train_loss": -27.067981719970703, "global_step": 518158, "epoch": 6242} {"train_loss": -27.295948028564453, "global_step": 518159, "epoch": 6242} {"train_loss": -27.6872501373291, "global_step": 518160, "epoch": 6242} {"train_loss": -27.4831600189209, "global_step": 518161, "epoch": 6242} {"train_loss": -27.595462799072266, "global_step": 518162, "epoch": 6242} {"train_loss": -27.455554962158203, "global_step": 518163, "epoch": 6242} {"train_loss": -27.48223876953125, "global_step": 518164, "epoch": 6242} {"train_loss": -27.52850341796875, "global_step": 518165, "epoch": 6242} {"train_loss": -27.80706787109375, "global_step": 518166, "epoch": 6242} {"train_loss": -27.271102905273438, "global_step": 518167, "epoch": 6242} {"train_loss": -27.343296809368823, "global_step": 518168, "epoch": 6242, "val_loss": 6526503.0} {"train_loss": -26.83426284790039, "global_step": 518169, "epoch": 6243} {"train_loss": -26.395389556884766, "global_step": 518170, "epoch": 6243} {"train_loss": -26.23508644104004, "global_step": 518171, "epoch": 6243} {"train_loss": -26.55024528503418, "global_step": 518172, "epoch": 6243} {"train_loss": -26.52667808532715, "global_step": 518173, "epoch": 6243} {"train_loss": -26.52117347717285, "global_step": 518174, "epoch": 6243} {"train_loss": -26.93367576599121, "global_step": 518175, "epoch": 6243} {"train_loss": -27.05085563659668, "global_step": 518176, "epoch": 6243} {"train_loss": -27.013320922851562, "global_step": 518177, "epoch": 6243} {"train_loss": -26.815204620361328, "global_step": 518178, "epoch": 6243} {"train_loss": -27.005834579467773, "global_step": 518179, "epoch": 6243} {"train_loss": -27.145755767822266, "global_step": 518180, "epoch": 6243} {"train_loss": -27.341211318969727, "global_step": 518181, "epoch": 6243} {"train_loss": -27.120527267456055, "global_step": 518182, "epoch": 6243} {"train_loss": -27.082014083862305, "global_step": 518183, "epoch": 6243} {"train_loss": -27.219457626342773, "global_step": 518184, "epoch": 6243} {"train_loss": -27.542621612548828, "global_step": 518185, "epoch": 6243} {"train_loss": -27.109100341796875, "global_step": 518186, "epoch": 6243} {"train_loss": -27.404394149780273, "global_step": 518187, "epoch": 6243} {"train_loss": -27.45002555847168, "global_step": 518188, "epoch": 6243} {"train_loss": -27.530487060546875, "global_step": 518189, "epoch": 6243} {"train_loss": -27.727462768554688, "global_step": 518190, "epoch": 6243} {"train_loss": -27.4188232421875, "global_step": 518191, "epoch": 6243} {"train_loss": -27.320880889892578, "global_step": 518192, "epoch": 6243} {"train_loss": -27.154287338256836, "global_step": 518193, "epoch": 6243} {"train_loss": -27.76495361328125, "global_step": 518194, "epoch": 6243} {"train_loss": -27.29325294494629, "global_step": 518195, "epoch": 6243} {"train_loss": -27.416996002197266, "global_step": 518196, "epoch": 6243} {"train_loss": -27.459421157836914, "global_step": 518197, "epoch": 6243} {"train_loss": -27.5997371673584, "global_step": 518198, "epoch": 6243} {"train_loss": -27.342626571655273, "global_step": 518199, "epoch": 6243} {"train_loss": -27.7847900390625, "global_step": 518200, "epoch": 6243} {"train_loss": -27.381860733032227, "global_step": 518201, "epoch": 6243} {"train_loss": -27.623350143432617, "global_step": 518202, "epoch": 6243} {"train_loss": -27.72348403930664, "global_step": 518203, "epoch": 6243} {"train_loss": -27.729217529296875, "global_step": 518204, "epoch": 6243} {"train_loss": -27.439300537109375, "global_step": 518205, "epoch": 6243} {"train_loss": -27.489273071289062, "global_step": 518206, "epoch": 6243} {"train_loss": -27.288610458374023, "global_step": 518207, "epoch": 6243} {"train_loss": -27.738935470581055, "global_step": 518208, "epoch": 6243} {"train_loss": -27.236265182495117, "global_step": 518209, "epoch": 6243} {"train_loss": -27.241596221923828, "global_step": 518210, "epoch": 6243} {"train_loss": -26.464765548706055, "global_step": 518211, "epoch": 6243} {"train_loss": -26.335729598999023, "global_step": 518212, "epoch": 6243} {"train_loss": -26.8806209564209, "global_step": 518213, "epoch": 6243} {"train_loss": -27.6580753326416, "global_step": 518214, "epoch": 6243} {"train_loss": -25.265933990478516, "global_step": 518215, "epoch": 6243} {"train_loss": -26.528766632080078, "global_step": 518216, "epoch": 6243} {"train_loss": -26.879934310913086, "global_step": 518217, "epoch": 6243} {"train_loss": -26.5104923248291, "global_step": 518218, "epoch": 6243} {"train_loss": -26.7928524017334, "global_step": 518219, "epoch": 6243} {"train_loss": -27.0758056640625, "global_step": 518220, "epoch": 6243} {"train_loss": -26.689899444580078, "global_step": 518221, "epoch": 6243} {"train_loss": -26.846662521362305, "global_step": 518222, "epoch": 6243} {"train_loss": -26.860021591186523, "global_step": 518223, "epoch": 6243} {"train_loss": -26.974271774291992, "global_step": 518224, "epoch": 6243} {"train_loss": -27.14137077331543, "global_step": 518225, "epoch": 6243} {"train_loss": -27.091888427734375, "global_step": 518226, "epoch": 6243} {"train_loss": -27.27089500427246, "global_step": 518227, "epoch": 6243} {"train_loss": -27.135547637939453, "global_step": 518228, "epoch": 6243} {"train_loss": -27.184797286987305, "global_step": 518229, "epoch": 6243} {"train_loss": -27.445993423461914, "global_step": 518230, "epoch": 6243} {"train_loss": -27.40435791015625, "global_step": 518231, "epoch": 6243} {"train_loss": -27.144073486328125, "global_step": 518232, "epoch": 6243} {"train_loss": -27.23810386657715, "global_step": 518233, "epoch": 6243} {"train_loss": -27.121337890625, "global_step": 518234, "epoch": 6243} {"train_loss": -27.06550407409668, "global_step": 518235, "epoch": 6243} {"train_loss": -27.205942153930664, "global_step": 518236, "epoch": 6243} {"train_loss": -27.23691749572754, "global_step": 518237, "epoch": 6243} {"train_loss": -27.064916610717773, "global_step": 518238, "epoch": 6243} {"train_loss": -27.659116744995117, "global_step": 518239, "epoch": 6243} {"train_loss": -27.529443740844727, "global_step": 518240, "epoch": 6243} {"train_loss": -27.614877700805664, "global_step": 518241, "epoch": 6243} {"train_loss": -27.277509689331055, "global_step": 518242, "epoch": 6243} {"train_loss": -27.38665771484375, "global_step": 518243, "epoch": 6243} {"train_loss": -27.521474838256836, "global_step": 518244, "epoch": 6243} {"train_loss": -27.238361358642578, "global_step": 518245, "epoch": 6243} {"train_loss": -27.469884872436523, "global_step": 518246, "epoch": 6243} {"train_loss": -27.350116729736328, "global_step": 518247, "epoch": 6243} {"train_loss": -27.742212295532227, "global_step": 518248, "epoch": 6243} {"train_loss": -27.05191993713379, "global_step": 518249, "epoch": 6243} {"train_loss": -27.668481826782227, "global_step": 518250, "epoch": 6243} {"train_loss": -27.196178551179816, "global_step": 518251, "epoch": 6243, "val_loss": 6521399.5} {"train_loss": -26.4638729095459, "global_step": 518252, "epoch": 6244} {"train_loss": -26.82537841796875, "global_step": 518253, "epoch": 6244} {"train_loss": -26.666580200195312, "global_step": 518254, "epoch": 6244} {"train_loss": -26.928632736206055, "global_step": 518255, "epoch": 6244} {"train_loss": -26.916147232055664, "global_step": 518256, "epoch": 6244} {"train_loss": -26.7252140045166, "global_step": 518257, "epoch": 6244} {"train_loss": -26.8922176361084, "global_step": 518258, "epoch": 6244} {"train_loss": -27.12483024597168, "global_step": 518259, "epoch": 6244} {"train_loss": -27.1405029296875, "global_step": 518260, "epoch": 6244} {"train_loss": -27.14088249206543, "global_step": 518261, "epoch": 6244} {"train_loss": -26.764602661132812, "global_step": 518262, "epoch": 6244} {"train_loss": -27.240264892578125, "global_step": 518263, "epoch": 6244} {"train_loss": -26.744672775268555, "global_step": 518264, "epoch": 6244} {"train_loss": -27.311328887939453, "global_step": 518265, "epoch": 6244} {"train_loss": -27.295995712280273, "global_step": 518266, "epoch": 6244} {"train_loss": -27.425373077392578, "global_step": 518267, "epoch": 6244} {"train_loss": -27.390287399291992, "global_step": 518268, "epoch": 6244} {"train_loss": -27.24970817565918, "global_step": 518269, "epoch": 6244} {"train_loss": -27.26228141784668, "global_step": 518270, "epoch": 6244} {"train_loss": -27.423084259033203, "global_step": 518271, "epoch": 6244} {"train_loss": -27.482954025268555, "global_step": 518272, "epoch": 6244} {"train_loss": -26.680072784423828, "global_step": 518273, "epoch": 6244} {"train_loss": -27.30133628845215, "global_step": 518274, "epoch": 6244} {"train_loss": -27.564411163330078, "global_step": 518275, "epoch": 6244} {"train_loss": -27.099838256835938, "global_step": 518276, "epoch": 6244} {"train_loss": -27.219945907592773, "global_step": 518277, "epoch": 6244} {"train_loss": -27.062652587890625, "global_step": 518278, "epoch": 6244} {"train_loss": -27.33258056640625, "global_step": 518279, "epoch": 6244} {"train_loss": -27.273969650268555, "global_step": 518280, "epoch": 6244} {"train_loss": -27.11459732055664, "global_step": 518281, "epoch": 6244} {"train_loss": -27.119449615478516, "global_step": 518282, "epoch": 6244} {"train_loss": -27.319746017456055, "global_step": 518283, "epoch": 6244} {"train_loss": -27.094995498657227, "global_step": 518284, "epoch": 6244} {"train_loss": -27.172170639038086, "global_step": 518285, "epoch": 6244} {"train_loss": -27.286645889282227, "global_step": 518286, "epoch": 6244} {"train_loss": -27.293542861938477, "global_step": 518287, "epoch": 6244} {"train_loss": -27.593225479125977, "global_step": 518288, "epoch": 6244} {"train_loss": -27.771987915039062, "global_step": 518289, "epoch": 6244} {"train_loss": -27.441986083984375, "global_step": 518290, "epoch": 6244} {"train_loss": -27.53993034362793, "global_step": 518291, "epoch": 6244} {"train_loss": -27.525495529174805, "global_step": 518292, "epoch": 6244} {"train_loss": -27.537662506103516, "global_step": 518293, "epoch": 6244} {"train_loss": -27.32193946838379, "global_step": 518294, "epoch": 6244} {"train_loss": -27.70844841003418, "global_step": 518295, "epoch": 6244} {"train_loss": -27.051502227783203, "global_step": 518296, "epoch": 6244} {"train_loss": -27.832815170288086, "global_step": 518297, "epoch": 6244} {"train_loss": -27.381860733032227, "global_step": 518298, "epoch": 6244} {"train_loss": -27.389551162719727, "global_step": 518299, "epoch": 6244} {"train_loss": -27.559619903564453, "global_step": 518300, "epoch": 6244} {"train_loss": -27.856430053710938, "global_step": 518301, "epoch": 6244} {"train_loss": -27.72540283203125, "global_step": 518302, "epoch": 6244} {"train_loss": -27.628881454467773, "global_step": 518303, "epoch": 6244} {"train_loss": -27.16179847717285, "global_step": 518304, "epoch": 6244} {"train_loss": -27.471094131469727, "global_step": 518305, "epoch": 6244} {"train_loss": -27.45100212097168, "global_step": 518306, "epoch": 6244} {"train_loss": -27.65272331237793, "global_step": 518307, "epoch": 6244} {"train_loss": -27.873687744140625, "global_step": 518308, "epoch": 6244} {"train_loss": -27.485212326049805, "global_step": 518309, "epoch": 6244} {"train_loss": -27.8079891204834, "global_step": 518310, "epoch": 6244} {"train_loss": -27.62080192565918, "global_step": 518311, "epoch": 6244} {"train_loss": -27.682373046875, "global_step": 518312, "epoch": 6244} {"train_loss": -27.841352462768555, "global_step": 518313, "epoch": 6244} {"train_loss": -27.73040771484375, "global_step": 518314, "epoch": 6244} {"train_loss": -27.874658584594727, "global_step": 518315, "epoch": 6244} {"train_loss": -28.07498550415039, "global_step": 518316, "epoch": 6244} {"train_loss": -27.2294864654541, "global_step": 518317, "epoch": 6244} {"train_loss": -27.914047241210938, "global_step": 518318, "epoch": 6244} {"train_loss": -27.868576049804688, "global_step": 518319, "epoch": 6244} {"train_loss": -27.277027130126953, "global_step": 518320, "epoch": 6244} {"train_loss": -27.409006118774414, "global_step": 518321, "epoch": 6244} {"train_loss": -27.595590591430664, "global_step": 518322, "epoch": 6244} {"train_loss": -27.511585235595703, "global_step": 518323, "epoch": 6244} {"train_loss": -27.60824966430664, "global_step": 518324, "epoch": 6244} {"train_loss": -27.36813735961914, "global_step": 518325, "epoch": 6244} {"train_loss": -27.39691734313965, "global_step": 518326, "epoch": 6244} {"train_loss": -27.11020851135254, "global_step": 518327, "epoch": 6244} {"train_loss": -27.61878776550293, "global_step": 518328, "epoch": 6244} {"train_loss": -27.473133087158203, "global_step": 518329, "epoch": 6244} {"train_loss": -26.99595069885254, "global_step": 518330, "epoch": 6244} {"train_loss": -26.426420211791992, "global_step": 518331, "epoch": 6244} {"train_loss": -25.951379776000977, "global_step": 518332, "epoch": 6244} {"train_loss": -26.890817642211914, "global_step": 518333, "epoch": 6244} {"train_loss": -27.30562874208014, "global_step": 518334, "epoch": 6244, "val_loss": 6527750.0} {"train_loss": -25.970508575439453, "global_step": 518335, "epoch": 6245} {"train_loss": -25.81317138671875, "global_step": 518336, "epoch": 6245} {"train_loss": -26.37594985961914, "global_step": 518337, "epoch": 6245} {"train_loss": -25.67083168029785, "global_step": 518338, "epoch": 6245} {"train_loss": -26.836950302124023, "global_step": 518339, "epoch": 6245} {"train_loss": -25.975561141967773, "global_step": 518340, "epoch": 6245} {"train_loss": -26.654376983642578, "global_step": 518341, "epoch": 6245} {"train_loss": -26.61444664001465, "global_step": 518342, "epoch": 6245} {"train_loss": -26.714345932006836, "global_step": 518343, "epoch": 6245} {"train_loss": -26.34901237487793, "global_step": 518344, "epoch": 6245} {"train_loss": -26.852521896362305, "global_step": 518345, "epoch": 6245} {"train_loss": -26.90274429321289, "global_step": 518346, "epoch": 6245} {"train_loss": -26.63209342956543, "global_step": 518347, "epoch": 6245} {"train_loss": -26.912845611572266, "global_step": 518348, "epoch": 6245} {"train_loss": -27.056299209594727, "global_step": 518349, "epoch": 6245} {"train_loss": -26.51838493347168, "global_step": 518350, "epoch": 6245} {"train_loss": -27.010562896728516, "global_step": 518351, "epoch": 6245} {"train_loss": -27.246265411376953, "global_step": 518352, "epoch": 6245} {"train_loss": -27.306188583374023, "global_step": 518353, "epoch": 6245} {"train_loss": -27.375410079956055, "global_step": 518354, "epoch": 6245} {"train_loss": -27.053970336914062, "global_step": 518355, "epoch": 6245} {"train_loss": -27.360898971557617, "global_step": 518356, "epoch": 6245} {"train_loss": -27.419214248657227, "global_step": 518357, "epoch": 6245} {"train_loss": -26.74500846862793, "global_step": 518358, "epoch": 6245} {"train_loss": -27.5770320892334, "global_step": 518359, "epoch": 6245} {"train_loss": -27.33599853515625, "global_step": 518360, "epoch": 6245} {"train_loss": -27.210290908813477, "global_step": 518361, "epoch": 6245} {"train_loss": -27.444412231445312, "global_step": 518362, "epoch": 6245} {"train_loss": -27.9310245513916, "global_step": 518363, "epoch": 6245} {"train_loss": -27.46661376953125, "global_step": 518364, "epoch": 6245} {"train_loss": -27.048742294311523, "global_step": 518365, "epoch": 6245} {"train_loss": -27.306690216064453, "global_step": 518366, "epoch": 6245} {"train_loss": -27.688047409057617, "global_step": 518367, "epoch": 6245} {"train_loss": -27.112873077392578, "global_step": 518368, "epoch": 6245} {"train_loss": -27.426435470581055, "global_step": 518369, "epoch": 6245} {"train_loss": -26.94687843322754, "global_step": 518370, "epoch": 6245} {"train_loss": -27.610706329345703, "global_step": 518371, "epoch": 6245} {"train_loss": -27.583948135375977, "global_step": 518372, "epoch": 6245} {"train_loss": -27.41586685180664, "global_step": 518373, "epoch": 6245} {"train_loss": -27.679670333862305, "global_step": 518374, "epoch": 6245} {"train_loss": -27.502796173095703, "global_step": 518375, "epoch": 6245} {"train_loss": -27.5085391998291, "global_step": 518376, "epoch": 6245} {"train_loss": -27.788511276245117, "global_step": 518377, "epoch": 6245} {"train_loss": -27.604328155517578, "global_step": 518378, "epoch": 6245} {"train_loss": -27.764392852783203, "global_step": 518379, "epoch": 6245} {"train_loss": -27.625574111938477, "global_step": 518380, "epoch": 6245} {"train_loss": -27.71114158630371, "global_step": 518381, "epoch": 6245} {"train_loss": -27.903303146362305, "global_step": 518382, "epoch": 6245} {"train_loss": -27.526227951049805, "global_step": 518383, "epoch": 6245} {"train_loss": -27.83115005493164, "global_step": 518384, "epoch": 6245} {"train_loss": -27.545270919799805, "global_step": 518385, "epoch": 6245} {"train_loss": -27.45891761779785, "global_step": 518386, "epoch": 6245} {"train_loss": -27.883630752563477, "global_step": 518387, "epoch": 6245} {"train_loss": -27.466028213500977, "global_step": 518388, "epoch": 6245} {"train_loss": -27.70263671875, "global_step": 518389, "epoch": 6245} {"train_loss": -27.635290145874023, "global_step": 518390, "epoch": 6245} {"train_loss": -27.724271774291992, "global_step": 518391, "epoch": 6245} {"train_loss": -27.959793090820312, "global_step": 518392, "epoch": 6245} {"train_loss": -27.557275772094727, "global_step": 518393, "epoch": 6245} {"train_loss": -28.00690269470215, "global_step": 518394, "epoch": 6245} {"train_loss": -27.36737632751465, "global_step": 518395, "epoch": 6245} {"train_loss": -28.09113883972168, "global_step": 518396, "epoch": 6245} {"train_loss": -27.504735946655273, "global_step": 518397, "epoch": 6245} {"train_loss": -27.497577667236328, "global_step": 518398, "epoch": 6245} {"train_loss": -27.8223876953125, "global_step": 518399, "epoch": 6245} {"train_loss": -27.5967960357666, "global_step": 518400, "epoch": 6245} {"train_loss": -27.711023330688477, "global_step": 518401, "epoch": 6245} {"train_loss": -27.823904037475586, "global_step": 518402, "epoch": 6245} {"train_loss": -27.776159286499023, "global_step": 518403, "epoch": 6245} {"train_loss": -27.59882164001465, "global_step": 518404, "epoch": 6245} {"train_loss": -27.84335708618164, "global_step": 518405, "epoch": 6245} {"train_loss": -27.53497886657715, "global_step": 518406, "epoch": 6245} {"train_loss": -27.75068473815918, "global_step": 518407, "epoch": 6245} {"train_loss": -27.72492027282715, "global_step": 518408, "epoch": 6245} {"train_loss": -27.66580581665039, "global_step": 518409, "epoch": 6245} {"train_loss": -27.479537963867188, "global_step": 518410, "epoch": 6245} {"train_loss": -27.4879207611084, "global_step": 518411, "epoch": 6245} {"train_loss": -27.106369018554688, "global_step": 518412, "epoch": 6245} {"train_loss": -27.286291122436523, "global_step": 518413, "epoch": 6245} {"train_loss": -27.266382217407227, "global_step": 518414, "epoch": 6245} {"train_loss": -27.72108268737793, "global_step": 518415, "epoch": 6245} {"train_loss": -27.67885398864746, "global_step": 518416, "epoch": 6245} {"train_loss": -27.333223779517485, "global_step": 518417, "epoch": 6245, "val_loss": 6505683.0} {"train_loss": -27.281726837158203, "global_step": 518418, "epoch": 6246} {"train_loss": -27.04473876953125, "global_step": 518419, "epoch": 6246} {"train_loss": -27.04145622253418, "global_step": 518420, "epoch": 6246} {"train_loss": -26.80352783203125, "global_step": 518421, "epoch": 6246} {"train_loss": -26.3740291595459, "global_step": 518422, "epoch": 6246} {"train_loss": -27.22323989868164, "global_step": 518423, "epoch": 6246} {"train_loss": -26.880706787109375, "global_step": 518424, "epoch": 6246} {"train_loss": -26.6317081451416, "global_step": 518425, "epoch": 6246} {"train_loss": -26.704730987548828, "global_step": 518426, "epoch": 6246} {"train_loss": -26.780668258666992, "global_step": 518427, "epoch": 6246} {"train_loss": -27.04451560974121, "global_step": 518428, "epoch": 6246} {"train_loss": -26.832050323486328, "global_step": 518429, "epoch": 6246} {"train_loss": -27.107715606689453, "global_step": 518430, "epoch": 6246} {"train_loss": -27.168323516845703, "global_step": 518431, "epoch": 6246} {"train_loss": -26.661462783813477, "global_step": 518432, "epoch": 6246} {"train_loss": -27.391462326049805, "global_step": 518433, "epoch": 6246} {"train_loss": -27.137836456298828, "global_step": 518434, "epoch": 6246} {"train_loss": -27.349258422851562, "global_step": 518435, "epoch": 6246} {"train_loss": -27.25606346130371, "global_step": 518436, "epoch": 6246} {"train_loss": -27.305908203125, "global_step": 518437, "epoch": 6246} {"train_loss": -27.48530387878418, "global_step": 518438, "epoch": 6246} {"train_loss": -27.396209716796875, "global_step": 518439, "epoch": 6246} {"train_loss": -27.133657455444336, "global_step": 518440, "epoch": 6246} {"train_loss": -27.441085815429688, "global_step": 518441, "epoch": 6246} {"train_loss": -27.401716232299805, "global_step": 518442, "epoch": 6246} {"train_loss": -27.592477798461914, "global_step": 518443, "epoch": 6246} {"train_loss": -27.092605590820312, "global_step": 518444, "epoch": 6246} {"train_loss": -27.50105094909668, "global_step": 518445, "epoch": 6246} {"train_loss": -27.247289657592773, "global_step": 518446, "epoch": 6246} {"train_loss": -27.20081901550293, "global_step": 518447, "epoch": 6246} {"train_loss": -27.223129272460938, "global_step": 518448, "epoch": 6246} {"train_loss": -27.49940299987793, "global_step": 518449, "epoch": 6246} {"train_loss": -27.83587646484375, "global_step": 518450, "epoch": 6246} {"train_loss": -27.480716705322266, "global_step": 518451, "epoch": 6246} {"train_loss": -27.609922409057617, "global_step": 518452, "epoch": 6246} {"train_loss": -27.226089477539062, "global_step": 518453, "epoch": 6246} {"train_loss": -27.401086807250977, "global_step": 518454, "epoch": 6246} {"train_loss": -27.33782386779785, "global_step": 518455, "epoch": 6246} {"train_loss": -27.72246742248535, "global_step": 518456, "epoch": 6246} {"train_loss": -27.544599533081055, "global_step": 518457, "epoch": 6246} {"train_loss": -27.858503341674805, "global_step": 518458, "epoch": 6246} {"train_loss": -27.223052978515625, "global_step": 518459, "epoch": 6246} {"train_loss": -27.912256240844727, "global_step": 518460, "epoch": 6246} {"train_loss": -27.458515167236328, "global_step": 518461, "epoch": 6246} {"train_loss": -27.753097534179688, "global_step": 518462, "epoch": 6246} {"train_loss": -27.749601364135742, "global_step": 518463, "epoch": 6246} {"train_loss": -27.75249671936035, "global_step": 518464, "epoch": 6246} {"train_loss": -27.51995849609375, "global_step": 518465, "epoch": 6246} {"train_loss": -27.659164428710938, "global_step": 518466, "epoch": 6246} {"train_loss": -27.74891471862793, "global_step": 518467, "epoch": 6246} {"train_loss": -27.740192413330078, "global_step": 518468, "epoch": 6246} {"train_loss": -27.403778076171875, "global_step": 518469, "epoch": 6246} {"train_loss": -27.880844116210938, "global_step": 518470, "epoch": 6246} {"train_loss": -27.428964614868164, "global_step": 518471, "epoch": 6246} {"train_loss": -27.805316925048828, "global_step": 518472, "epoch": 6246} {"train_loss": -27.63291358947754, "global_step": 518473, "epoch": 6246} {"train_loss": -27.83648109436035, "global_step": 518474, "epoch": 6246} {"train_loss": -27.493865966796875, "global_step": 518475, "epoch": 6246} {"train_loss": -27.83028221130371, "global_step": 518476, "epoch": 6246} {"train_loss": -27.660486221313477, "global_step": 518477, "epoch": 6246} {"train_loss": -27.5814266204834, "global_step": 518478, "epoch": 6246} {"train_loss": -27.6210880279541, "global_step": 518479, "epoch": 6246} {"train_loss": -27.874176025390625, "global_step": 518480, "epoch": 6246} {"train_loss": -27.83648681640625, "global_step": 518481, "epoch": 6246} {"train_loss": -27.650482177734375, "global_step": 518482, "epoch": 6246} {"train_loss": -27.80194664001465, "global_step": 518483, "epoch": 6246} {"train_loss": -27.739099502563477, "global_step": 518484, "epoch": 6246} {"train_loss": -27.9927921295166, "global_step": 518485, "epoch": 6246} {"train_loss": -27.289472579956055, "global_step": 518486, "epoch": 6246} {"train_loss": -27.547571182250977, "global_step": 518487, "epoch": 6246} {"train_loss": -27.774816513061523, "global_step": 518488, "epoch": 6246} {"train_loss": -27.761432647705078, "global_step": 518489, "epoch": 6246} {"train_loss": -27.482624053955078, "global_step": 518490, "epoch": 6246} {"train_loss": -27.483556747436523, "global_step": 518491, "epoch": 6246} {"train_loss": -27.709674835205078, "global_step": 518492, "epoch": 6246} {"train_loss": -27.5860595703125, "global_step": 518493, "epoch": 6246} {"train_loss": -27.331892013549805, "global_step": 518494, "epoch": 6246} {"train_loss": -27.881067276000977, "global_step": 518495, "epoch": 6246} {"train_loss": -27.67804527282715, "global_step": 518496, "epoch": 6246} {"train_loss": -27.203664779663086, "global_step": 518497, "epoch": 6246} {"train_loss": -27.3935489654541, "global_step": 518498, "epoch": 6246} {"train_loss": -27.31770896911621, "global_step": 518499, "epoch": 6246} {"train_loss": -27.434581021228468, "global_step": 518500, "epoch": 6246, "val_loss": 6617797.5} {"train_loss": -26.676361083984375, "global_step": 518501, "epoch": 6247} {"train_loss": -26.373920440673828, "global_step": 518502, "epoch": 6247} {"train_loss": -26.880359649658203, "global_step": 518503, "epoch": 6247} {"train_loss": -26.35609245300293, "global_step": 518504, "epoch": 6247} {"train_loss": -26.873188018798828, "global_step": 518505, "epoch": 6247} {"train_loss": -26.893665313720703, "global_step": 518506, "epoch": 6247} {"train_loss": -26.6372013092041, "global_step": 518507, "epoch": 6247} {"train_loss": -26.614355087280273, "global_step": 518508, "epoch": 6247} {"train_loss": -26.400800704956055, "global_step": 518509, "epoch": 6247} {"train_loss": -27.214618682861328, "global_step": 518510, "epoch": 6247} {"train_loss": -26.745397567749023, "global_step": 518511, "epoch": 6247} {"train_loss": -26.52802848815918, "global_step": 518512, "epoch": 6247} {"train_loss": -26.60540199279785, "global_step": 518513, "epoch": 6247} {"train_loss": -26.9754581451416, "global_step": 518514, "epoch": 6247} {"train_loss": -26.567203521728516, "global_step": 518515, "epoch": 6247} {"train_loss": -27.029804229736328, "global_step": 518516, "epoch": 6247} {"train_loss": -26.866296768188477, "global_step": 518517, "epoch": 6247} {"train_loss": -27.079620361328125, "global_step": 518518, "epoch": 6247} {"train_loss": -27.1147403717041, "global_step": 518519, "epoch": 6247} {"train_loss": -26.95350456237793, "global_step": 518520, "epoch": 6247} {"train_loss": -27.207427978515625, "global_step": 518521, "epoch": 6247} {"train_loss": -27.07081413269043, "global_step": 518522, "epoch": 6247} {"train_loss": -27.034687042236328, "global_step": 518523, "epoch": 6247} {"train_loss": -27.065963745117188, "global_step": 518524, "epoch": 6247} {"train_loss": -27.12007713317871, "global_step": 518525, "epoch": 6247} {"train_loss": -26.93659019470215, "global_step": 518526, "epoch": 6247} {"train_loss": -27.496335983276367, "global_step": 518527, "epoch": 6247} {"train_loss": -27.286230087280273, "global_step": 518528, "epoch": 6247} {"train_loss": -27.1539249420166, "global_step": 518529, "epoch": 6247} {"train_loss": -27.139022827148438, "global_step": 518530, "epoch": 6247} {"train_loss": -27.0793399810791, "global_step": 518531, "epoch": 6247} {"train_loss": -27.501508712768555, "global_step": 518532, "epoch": 6247} {"train_loss": -27.492605209350586, "global_step": 518533, "epoch": 6247} {"train_loss": -27.29522132873535, "global_step": 518534, "epoch": 6247} {"train_loss": -27.67828941345215, "global_step": 518535, "epoch": 6247} {"train_loss": -27.50208854675293, "global_step": 518536, "epoch": 6247} {"train_loss": -27.285675048828125, "global_step": 518537, "epoch": 6247} {"train_loss": -27.644651412963867, "global_step": 518538, "epoch": 6247} {"train_loss": -27.413564682006836, "global_step": 518539, "epoch": 6247} {"train_loss": -27.35236930847168, "global_step": 518540, "epoch": 6247} {"train_loss": -27.254806518554688, "global_step": 518541, "epoch": 6247} {"train_loss": -27.673898696899414, "global_step": 518542, "epoch": 6247} {"train_loss": -27.592458724975586, "global_step": 518543, "epoch": 6247} {"train_loss": -27.428625106811523, "global_step": 518544, "epoch": 6247} {"train_loss": -27.6934814453125, "global_step": 518545, "epoch": 6247} {"train_loss": -27.557538986206055, "global_step": 518546, "epoch": 6247} {"train_loss": -27.679662704467773, "global_step": 518547, "epoch": 6247} {"train_loss": -27.670312881469727, "global_step": 518548, "epoch": 6247} {"train_loss": -27.602331161499023, "global_step": 518549, "epoch": 6247} {"train_loss": -27.751468658447266, "global_step": 518550, "epoch": 6247} {"train_loss": -27.739816665649414, "global_step": 518551, "epoch": 6247} {"train_loss": -27.623870849609375, "global_step": 518552, "epoch": 6247} {"train_loss": -27.245819091796875, "global_step": 518553, "epoch": 6247} {"train_loss": -27.552555084228516, "global_step": 518554, "epoch": 6247} {"train_loss": -27.48593521118164, "global_step": 518555, "epoch": 6247} {"train_loss": -27.313129425048828, "global_step": 518556, "epoch": 6247} {"train_loss": -27.4395809173584, "global_step": 518557, "epoch": 6247} {"train_loss": -27.692880630493164, "global_step": 518558, "epoch": 6247} {"train_loss": -27.57704734802246, "global_step": 518559, "epoch": 6247} {"train_loss": -27.389728546142578, "global_step": 518560, "epoch": 6247} {"train_loss": -27.550216674804688, "global_step": 518561, "epoch": 6247} {"train_loss": -27.72601318359375, "global_step": 518562, "epoch": 6247} {"train_loss": -27.261945724487305, "global_step": 518563, "epoch": 6247} {"train_loss": -27.34998893737793, "global_step": 518564, "epoch": 6247} {"train_loss": -27.5284481048584, "global_step": 518565, "epoch": 6247} {"train_loss": -27.62959098815918, "global_step": 518566, "epoch": 6247} {"train_loss": -27.230335235595703, "global_step": 518567, "epoch": 6247} {"train_loss": -27.40386962890625, "global_step": 518568, "epoch": 6247} {"train_loss": -27.347858428955078, "global_step": 518569, "epoch": 6247} {"train_loss": -27.210851669311523, "global_step": 518570, "epoch": 6247} {"train_loss": -27.50424575805664, "global_step": 518571, "epoch": 6247} {"train_loss": -27.8662166595459, "global_step": 518572, "epoch": 6247} {"train_loss": -26.92255973815918, "global_step": 518573, "epoch": 6247} {"train_loss": -27.58814811706543, "global_step": 518574, "epoch": 6247} {"train_loss": -27.5645751953125, "global_step": 518575, "epoch": 6247} {"train_loss": -27.65211296081543, "global_step": 518576, "epoch": 6247} {"train_loss": -27.505146026611328, "global_step": 518577, "epoch": 6247} {"train_loss": -27.168991088867188, "global_step": 518578, "epoch": 6247} {"train_loss": -27.607309341430664, "global_step": 518579, "epoch": 6247} {"train_loss": -27.7384090423584, "global_step": 518580, "epoch": 6247} {"train_loss": -27.4882755279541, "global_step": 518581, "epoch": 6247} {"train_loss": -27.57264518737793, "global_step": 518582, "epoch": 6247} {"train_loss": -27.29665940066418, "global_step": 518583, "epoch": 6247, "val_loss": 6525083.5} {"train_loss": -26.978397369384766, "global_step": 518584, "epoch": 6248} {"train_loss": -26.75128173828125, "global_step": 518585, "epoch": 6248} {"train_loss": -26.803974151611328, "global_step": 518586, "epoch": 6248} {"train_loss": -27.002063751220703, "global_step": 518587, "epoch": 6248} {"train_loss": -27.19923973083496, "global_step": 518588, "epoch": 6248} {"train_loss": -26.896259307861328, "global_step": 518589, "epoch": 6248} {"train_loss": -26.495237350463867, "global_step": 518590, "epoch": 6248} {"train_loss": -26.959463119506836, "global_step": 518591, "epoch": 6248} {"train_loss": -27.295942306518555, "global_step": 518592, "epoch": 6248} {"train_loss": -27.25543212890625, "global_step": 518593, "epoch": 6248} {"train_loss": -27.09366798400879, "global_step": 518594, "epoch": 6248} {"train_loss": -27.437368392944336, "global_step": 518595, "epoch": 6248} {"train_loss": -27.15988540649414, "global_step": 518596, "epoch": 6248} {"train_loss": -27.264245986938477, "global_step": 518597, "epoch": 6248} {"train_loss": -27.133153915405273, "global_step": 518598, "epoch": 6248} {"train_loss": -27.36262321472168, "global_step": 518599, "epoch": 6248} {"train_loss": -27.283971786499023, "global_step": 518600, "epoch": 6248} {"train_loss": -27.602781295776367, "global_step": 518601, "epoch": 6248} {"train_loss": -27.484619140625, "global_step": 518602, "epoch": 6248} {"train_loss": -27.493146896362305, "global_step": 518603, "epoch": 6248} {"train_loss": -27.448684692382812, "global_step": 518604, "epoch": 6248} {"train_loss": -27.3862361907959, "global_step": 518605, "epoch": 6248} {"train_loss": -27.08319091796875, "global_step": 518606, "epoch": 6248} {"train_loss": -27.652313232421875, "global_step": 518607, "epoch": 6248} {"train_loss": -27.4306697845459, "global_step": 518608, "epoch": 6248} {"train_loss": -27.532678604125977, "global_step": 518609, "epoch": 6248} {"train_loss": -27.506906509399414, "global_step": 518610, "epoch": 6248} {"train_loss": -27.462045669555664, "global_step": 518611, "epoch": 6248} {"train_loss": -27.41257095336914, "global_step": 518612, "epoch": 6248} {"train_loss": -27.797754287719727, "global_step": 518613, "epoch": 6248} {"train_loss": -27.290433883666992, "global_step": 518614, "epoch": 6248} {"train_loss": -27.63490867614746, "global_step": 518615, "epoch": 6248} {"train_loss": -27.72311782836914, "global_step": 518616, "epoch": 6248} {"train_loss": -27.623096466064453, "global_step": 518617, "epoch": 6248} {"train_loss": -27.518049240112305, "global_step": 518618, "epoch": 6248} {"train_loss": -27.517536163330078, "global_step": 518619, "epoch": 6248} {"train_loss": -27.821115493774414, "global_step": 518620, "epoch": 6248} {"train_loss": -27.4729061126709, "global_step": 518621, "epoch": 6248} {"train_loss": -27.550079345703125, "global_step": 518622, "epoch": 6248} {"train_loss": -27.668899536132812, "global_step": 518623, "epoch": 6248} {"train_loss": -27.51079750061035, "global_step": 518624, "epoch": 6248} {"train_loss": -27.66766357421875, "global_step": 518625, "epoch": 6248} {"train_loss": -27.439289093017578, "global_step": 518626, "epoch": 6248} {"train_loss": -28.085737228393555, "global_step": 518627, "epoch": 6248} {"train_loss": -27.885278701782227, "global_step": 518628, "epoch": 6248} {"train_loss": -27.998798370361328, "global_step": 518629, "epoch": 6248} {"train_loss": -27.801191329956055, "global_step": 518630, "epoch": 6248} {"train_loss": -27.443267822265625, "global_step": 518631, "epoch": 6248} {"train_loss": -27.782461166381836, "global_step": 518632, "epoch": 6248} {"train_loss": -27.887704849243164, "global_step": 518633, "epoch": 6248} {"train_loss": -27.310651779174805, "global_step": 518634, "epoch": 6248} {"train_loss": -27.639938354492188, "global_step": 518635, "epoch": 6248} {"train_loss": -27.619836807250977, "global_step": 518636, "epoch": 6248} {"train_loss": -27.65989112854004, "global_step": 518637, "epoch": 6248} {"train_loss": -27.590742111206055, "global_step": 518638, "epoch": 6248} {"train_loss": -27.762231826782227, "global_step": 518639, "epoch": 6248} {"train_loss": -27.6460018157959, "global_step": 518640, "epoch": 6248} {"train_loss": -27.717472076416016, "global_step": 518641, "epoch": 6248} {"train_loss": -27.91347312927246, "global_step": 518642, "epoch": 6248} {"train_loss": -27.459135055541992, "global_step": 518643, "epoch": 6248} {"train_loss": -27.710254669189453, "global_step": 518644, "epoch": 6248} {"train_loss": -27.818349838256836, "global_step": 518645, "epoch": 6248} {"train_loss": -27.685775756835938, "global_step": 518646, "epoch": 6248} {"train_loss": -27.421743392944336, "global_step": 518647, "epoch": 6248} {"train_loss": -27.424604415893555, "global_step": 518648, "epoch": 6248} {"train_loss": -27.7706298828125, "global_step": 518649, "epoch": 6248} {"train_loss": -27.743778228759766, "global_step": 518650, "epoch": 6248} {"train_loss": -27.67413330078125, "global_step": 518651, "epoch": 6248} {"train_loss": -27.7159481048584, "global_step": 518652, "epoch": 6248} {"train_loss": -28.129108428955078, "global_step": 518653, "epoch": 6248} {"train_loss": -27.854217529296875, "global_step": 518654, "epoch": 6248} {"train_loss": -27.36543083190918, "global_step": 518655, "epoch": 6248} {"train_loss": -28.106800079345703, "global_step": 518656, "epoch": 6248} {"train_loss": -27.952131271362305, "global_step": 518657, "epoch": 6248} {"train_loss": -27.3504695892334, "global_step": 518658, "epoch": 6248} {"train_loss": -27.475738525390625, "global_step": 518659, "epoch": 6248} {"train_loss": -27.4949951171875, "global_step": 518660, "epoch": 6248} {"train_loss": -27.776823043823242, "global_step": 518661, "epoch": 6248} {"train_loss": -27.4879093170166, "global_step": 518662, "epoch": 6248} {"train_loss": -27.4339542388916, "global_step": 518663, "epoch": 6248} {"train_loss": -27.45381736755371, "global_step": 518664, "epoch": 6248} {"train_loss": -27.594928741455078, "global_step": 518665, "epoch": 6248} {"train_loss": -27.49030519968056, "global_step": 518666, "epoch": 6248, "val_loss": 6578800.0} {"train_loss": -26.296003341674805, "global_step": 518667, "epoch": 6249} {"train_loss": -25.84601402282715, "global_step": 518668, "epoch": 6249} {"train_loss": -26.658451080322266, "global_step": 518669, "epoch": 6249} {"train_loss": -26.811094284057617, "global_step": 518670, "epoch": 6249} {"train_loss": -26.744943618774414, "global_step": 518671, "epoch": 6249} {"train_loss": -27.006261825561523, "global_step": 518672, "epoch": 6249} {"train_loss": -26.16973876953125, "global_step": 518673, "epoch": 6249} {"train_loss": -27.1492919921875, "global_step": 518674, "epoch": 6249} {"train_loss": -27.353742599487305, "global_step": 518675, "epoch": 6249} {"train_loss": -26.834033966064453, "global_step": 518676, "epoch": 6249} {"train_loss": -26.746784210205078, "global_step": 518677, "epoch": 6249} {"train_loss": -26.847976684570312, "global_step": 518678, "epoch": 6249} {"train_loss": -27.16205406188965, "global_step": 518679, "epoch": 6249} {"train_loss": -27.03461265563965, "global_step": 518680, "epoch": 6249} {"train_loss": -26.776187896728516, "global_step": 518681, "epoch": 6249} {"train_loss": -27.32451820373535, "global_step": 518682, "epoch": 6249} {"train_loss": -27.07462501525879, "global_step": 518683, "epoch": 6249} {"train_loss": -27.35175895690918, "global_step": 518684, "epoch": 6249} {"train_loss": -27.356664657592773, "global_step": 518685, "epoch": 6249} {"train_loss": -27.059402465820312, "global_step": 518686, "epoch": 6249} {"train_loss": -27.053085327148438, "global_step": 518687, "epoch": 6249} {"train_loss": -27.715625762939453, "global_step": 518688, "epoch": 6249} {"train_loss": -26.90506362915039, "global_step": 518689, "epoch": 6249} {"train_loss": -27.2574520111084, "global_step": 518690, "epoch": 6249} {"train_loss": -27.248586654663086, "global_step": 518691, "epoch": 6249} {"train_loss": -27.59943962097168, "global_step": 518692, "epoch": 6249} {"train_loss": -27.49517250061035, "global_step": 518693, "epoch": 6249} {"train_loss": -27.266706466674805, "global_step": 518694, "epoch": 6249} {"train_loss": -27.36890983581543, "global_step": 518695, "epoch": 6249} {"train_loss": -27.305578231811523, "global_step": 518696, "epoch": 6249} {"train_loss": -27.442907333374023, "global_step": 518697, "epoch": 6249} {"train_loss": -27.733734130859375, "global_step": 518698, "epoch": 6249} {"train_loss": -27.60784912109375, "global_step": 518699, "epoch": 6249} {"train_loss": -27.466114044189453, "global_step": 518700, "epoch": 6249} {"train_loss": -27.7556209564209, "global_step": 518701, "epoch": 6249} {"train_loss": -27.5958251953125, "global_step": 518702, "epoch": 6249} {"train_loss": -27.389663696289062, "global_step": 518703, "epoch": 6249} {"train_loss": -27.53534507751465, "global_step": 518704, "epoch": 6249} {"train_loss": -27.664920806884766, "global_step": 518705, "epoch": 6249} {"train_loss": -27.47833824157715, "global_step": 518706, "epoch": 6249} {"train_loss": -28.064069747924805, "global_step": 518707, "epoch": 6249} {"train_loss": -27.338632583618164, "global_step": 518708, "epoch": 6249} {"train_loss": -27.694507598876953, "global_step": 518709, "epoch": 6249} {"train_loss": -27.974592208862305, "global_step": 518710, "epoch": 6249} {"train_loss": -27.41849136352539, "global_step": 518711, "epoch": 6249} {"train_loss": -27.678165435791016, "global_step": 518712, "epoch": 6249} {"train_loss": -27.5820369720459, "global_step": 518713, "epoch": 6249} {"train_loss": -27.496112823486328, "global_step": 518714, "epoch": 6249} {"train_loss": -27.468420028686523, "global_step": 518715, "epoch": 6249} {"train_loss": -27.45612907409668, "global_step": 518716, "epoch": 6249} {"train_loss": -27.36185073852539, "global_step": 518717, "epoch": 6249} {"train_loss": -27.098840713500977, "global_step": 518718, "epoch": 6249} {"train_loss": -27.338672637939453, "global_step": 518719, "epoch": 6249} {"train_loss": -27.640478134155273, "global_step": 518720, "epoch": 6249} {"train_loss": -27.41205406188965, "global_step": 518721, "epoch": 6249} {"train_loss": -27.461944580078125, "global_step": 518722, "epoch": 6249} {"train_loss": -27.512348175048828, "global_step": 518723, "epoch": 6249} {"train_loss": -27.371368408203125, "global_step": 518724, "epoch": 6249} {"train_loss": -27.658353805541992, "global_step": 518725, "epoch": 6249} {"train_loss": -27.7507266998291, "global_step": 518726, "epoch": 6249} {"train_loss": -27.56060218811035, "global_step": 518727, "epoch": 6249} {"train_loss": -27.6922607421875, "global_step": 518728, "epoch": 6249} {"train_loss": -27.81113624572754, "global_step": 518729, "epoch": 6249} {"train_loss": -27.478784561157227, "global_step": 518730, "epoch": 6249} {"train_loss": -27.56209373474121, "global_step": 518731, "epoch": 6249} {"train_loss": -27.584680557250977, "global_step": 518732, "epoch": 6249} {"train_loss": -27.55571937561035, "global_step": 518733, "epoch": 6249} {"train_loss": -27.51832389831543, "global_step": 518734, "epoch": 6249} {"train_loss": -27.432697296142578, "global_step": 518735, "epoch": 6249} {"train_loss": -27.42203712463379, "global_step": 518736, "epoch": 6249} {"train_loss": -27.450048446655273, "global_step": 518737, "epoch": 6249} {"train_loss": -27.402875900268555, "global_step": 518738, "epoch": 6249} {"train_loss": -27.49888038635254, "global_step": 518739, "epoch": 6249} {"train_loss": -27.2189998626709, "global_step": 518740, "epoch": 6249} {"train_loss": -27.785694122314453, "global_step": 518741, "epoch": 6249} {"train_loss": -28.02569580078125, "global_step": 518742, "epoch": 6249} {"train_loss": -27.51898193359375, "global_step": 518743, "epoch": 6249} {"train_loss": -27.626663208007812, "global_step": 518744, "epoch": 6249} {"train_loss": -27.22173500061035, "global_step": 518745, "epoch": 6249} {"train_loss": -27.864948272705078, "global_step": 518746, "epoch": 6249} {"train_loss": -27.791807174682617, "global_step": 518747, "epoch": 6249} {"train_loss": -27.634138107299805, "global_step": 518748, "epoch": 6249} {"train_loss": -27.37342586287533, "global_step": 518749, "epoch": 6249, "val_loss": 6570100.5} {"train_loss": -27.431238174438477, "global_step": 518750, "epoch": 6250} {"train_loss": -27.417062759399414, "global_step": 518751, "epoch": 6250} {"train_loss": -27.0624942779541, "global_step": 518752, "epoch": 6250} {"train_loss": -27.116296768188477, "global_step": 518753, "epoch": 6250} {"train_loss": -27.118270874023438, "global_step": 518754, "epoch": 6250} {"train_loss": -27.451904296875, "global_step": 518755, "epoch": 6250} {"train_loss": -27.05910301208496, "global_step": 518756, "epoch": 6250} {"train_loss": -27.381555557250977, "global_step": 518757, "epoch": 6250} {"train_loss": -27.21245765686035, "global_step": 518758, "epoch": 6250} {"train_loss": -27.479040145874023, "global_step": 518759, "epoch": 6250} {"train_loss": -27.362279891967773, "global_step": 518760, "epoch": 6250} {"train_loss": -27.4908447265625, "global_step": 518761, "epoch": 6250} {"train_loss": -27.374073028564453, "global_step": 518762, "epoch": 6250} {"train_loss": -27.099836349487305, "global_step": 518763, "epoch": 6250} {"train_loss": -27.381580352783203, "global_step": 518764, "epoch": 6250} {"train_loss": -27.296796798706055, "global_step": 518765, "epoch": 6250} {"train_loss": -27.316787719726562, "global_step": 518766, "epoch": 6250} {"train_loss": -27.571720123291016, "global_step": 518767, "epoch": 6250} {"train_loss": -27.17258644104004, "global_step": 518768, "epoch": 6250} {"train_loss": -27.087942123413086, "global_step": 518769, "epoch": 6250} {"train_loss": -26.969709396362305, "global_step": 518770, "epoch": 6250} {"train_loss": -27.463735580444336, "global_step": 518771, "epoch": 6250} {"train_loss": -27.444242477416992, "global_step": 518772, "epoch": 6250} {"train_loss": -27.562917709350586, "global_step": 518773, "epoch": 6250} {"train_loss": -27.5943660736084, "global_step": 518774, "epoch": 6250} {"train_loss": -27.51228141784668, "global_step": 518775, "epoch": 6250} {"train_loss": -27.589935302734375, "global_step": 518776, "epoch": 6250} {"train_loss": -27.503808975219727, "global_step": 518777, "epoch": 6250} {"train_loss": -27.587133407592773, "global_step": 518778, "epoch": 6250} {"train_loss": -27.31622886657715, "global_step": 518779, "epoch": 6250} {"train_loss": -27.41326904296875, "global_step": 518780, "epoch": 6250} {"train_loss": -27.45598793029785, "global_step": 518781, "epoch": 6250} {"train_loss": -27.459272384643555, "global_step": 518782, "epoch": 6250} {"train_loss": -27.458555221557617, "global_step": 518783, "epoch": 6250} {"train_loss": -27.638629913330078, "global_step": 518784, "epoch": 6250} {"train_loss": -27.71673583984375, "global_step": 518785, "epoch": 6250} {"train_loss": -27.197797775268555, "global_step": 518786, "epoch": 6250} {"train_loss": -27.640869140625, "global_step": 518787, "epoch": 6250} {"train_loss": -27.772552490234375, "global_step": 518788, "epoch": 6250} {"train_loss": -27.41791343688965, "global_step": 518789, "epoch": 6250} {"train_loss": -27.707061767578125, "global_step": 518790, "epoch": 6250} {"train_loss": -27.749719619750977, "global_step": 518791, "epoch": 6250} {"train_loss": -27.42997169494629, "global_step": 518792, "epoch": 6250} {"train_loss": -27.266294479370117, "global_step": 518793, "epoch": 6250} {"train_loss": -27.292306900024414, "global_step": 518794, "epoch": 6250} {"train_loss": -27.93161392211914, "global_step": 518795, "epoch": 6250} {"train_loss": -27.50800895690918, "global_step": 518796, "epoch": 6250} {"train_loss": -27.555891036987305, "global_step": 518797, "epoch": 6250} {"train_loss": -27.39828872680664, "global_step": 518798, "epoch": 6250} {"train_loss": -27.545190811157227, "global_step": 518799, "epoch": 6250} {"train_loss": -27.63922691345215, "global_step": 518800, "epoch": 6250} {"train_loss": -27.78291893005371, "global_step": 518801, "epoch": 6250} {"train_loss": -27.742141723632812, "global_step": 518802, "epoch": 6250} {"train_loss": -27.426258087158203, "global_step": 518803, "epoch": 6250} {"train_loss": -27.878122329711914, "global_step": 518804, "epoch": 6250} {"train_loss": -27.76470947265625, "global_step": 518805, "epoch": 6250} {"train_loss": -27.945972442626953, "global_step": 518806, "epoch": 6250} {"train_loss": -27.593780517578125, "global_step": 518807, "epoch": 6250} {"train_loss": -27.46121597290039, "global_step": 518808, "epoch": 6250} {"train_loss": -27.968891143798828, "global_step": 518809, "epoch": 6250} {"train_loss": -27.240331649780273, "global_step": 518810, "epoch": 6250} {"train_loss": -27.538236618041992, "global_step": 518811, "epoch": 6250} {"train_loss": -27.1849422454834, "global_step": 518812, "epoch": 6250} {"train_loss": -26.797353744506836, "global_step": 518813, "epoch": 6250} {"train_loss": -27.3796443939209, "global_step": 518814, "epoch": 6250} {"train_loss": -27.36745262145996, "global_step": 518815, "epoch": 6250} {"train_loss": -27.366235733032227, "global_step": 518816, "epoch": 6250} {"train_loss": -27.117399215698242, "global_step": 518817, "epoch": 6250} {"train_loss": -27.111377716064453, "global_step": 518818, "epoch": 6250} {"train_loss": -27.51726722717285, "global_step": 518819, "epoch": 6250} {"train_loss": -26.923141479492188, "global_step": 518820, "epoch": 6250} {"train_loss": -27.02595329284668, "global_step": 518821, "epoch": 6250} {"train_loss": -26.94793701171875, "global_step": 518822, "epoch": 6250} {"train_loss": -28.04341697692871, "global_step": 518823, "epoch": 6250} {"train_loss": -27.239654541015625, "global_step": 518824, "epoch": 6250} {"train_loss": -27.14227867126465, "global_step": 518825, "epoch": 6250} {"train_loss": -27.41322898864746, "global_step": 518826, "epoch": 6250} {"train_loss": -26.958648681640625, "global_step": 518827, "epoch": 6250} {"train_loss": -27.41082191467285, "global_step": 518828, "epoch": 6250} {"train_loss": -27.012592315673828, "global_step": 518829, "epoch": 6250} {"train_loss": -27.495206832885742, "global_step": 518830, "epoch": 6250} {"train_loss": -27.403762817382812, "global_step": 518831, "epoch": 6250} {"train_loss": -27.414624731224702, "global_step": 518832, "epoch": 6250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8181818181818182, "val_loss": 6656319.0} {"train_loss": -27.265974044799805, "global_step": 518833, "epoch": 6251} {"train_loss": -26.867313385009766, "global_step": 518834, "epoch": 6251} {"train_loss": -27.3052978515625, "global_step": 518835, "epoch": 6251} {"train_loss": -27.39246940612793, "global_step": 518836, "epoch": 6251} {"train_loss": -27.71917724609375, "global_step": 518837, "epoch": 6251} {"train_loss": -27.005313873291016, "global_step": 518838, "epoch": 6251} {"train_loss": -27.490354537963867, "global_step": 518839, "epoch": 6251} {"train_loss": -26.956714630126953, "global_step": 518840, "epoch": 6251} {"train_loss": -27.602344512939453, "global_step": 518841, "epoch": 6251} {"train_loss": -26.952966690063477, "global_step": 518842, "epoch": 6251} {"train_loss": -27.46021842956543, "global_step": 518843, "epoch": 6251} {"train_loss": -27.395620346069336, "global_step": 518844, "epoch": 6251} {"train_loss": -27.479429244995117, "global_step": 518845, "epoch": 6251} {"train_loss": -27.085214614868164, "global_step": 518846, "epoch": 6251} {"train_loss": -27.689483642578125, "global_step": 518847, "epoch": 6251} {"train_loss": -27.687824249267578, "global_step": 518848, "epoch": 6251} {"train_loss": -27.33400535583496, "global_step": 518849, "epoch": 6251} {"train_loss": -27.37957191467285, "global_step": 518850, "epoch": 6251} {"train_loss": -27.560632705688477, "global_step": 518851, "epoch": 6251} {"train_loss": -27.771207809448242, "global_step": 518852, "epoch": 6251} {"train_loss": -27.463342666625977, "global_step": 518853, "epoch": 6251} {"train_loss": -27.5941219329834, "global_step": 518854, "epoch": 6251} {"train_loss": -27.687198638916016, "global_step": 518855, "epoch": 6251} {"train_loss": -27.442428588867188, "global_step": 518856, "epoch": 6251} {"train_loss": -27.369977951049805, "global_step": 518857, "epoch": 6251} {"train_loss": -27.202375411987305, "global_step": 518858, "epoch": 6251} {"train_loss": -27.611005783081055, "global_step": 518859, "epoch": 6251} {"train_loss": -27.75098991394043, "global_step": 518860, "epoch": 6251} {"train_loss": -27.785053253173828, "global_step": 518861, "epoch": 6251} {"train_loss": -27.353769302368164, "global_step": 518862, "epoch": 6251} {"train_loss": -27.380359649658203, "global_step": 518863, "epoch": 6251} {"train_loss": -27.634851455688477, "global_step": 518864, "epoch": 6251} {"train_loss": -27.3620662689209, "global_step": 518865, "epoch": 6251} {"train_loss": -27.80134391784668, "global_step": 518866, "epoch": 6251} {"train_loss": -27.77016258239746, "global_step": 518867, "epoch": 6251} {"train_loss": -27.795495986938477, "global_step": 518868, "epoch": 6251} {"train_loss": -27.74094581604004, "global_step": 518869, "epoch": 6251} {"train_loss": -27.814130783081055, "global_step": 518870, "epoch": 6251} {"train_loss": -27.294879913330078, "global_step": 518871, "epoch": 6251} {"train_loss": -27.744409561157227, "global_step": 518872, "epoch": 6251} {"train_loss": -27.752395629882812, "global_step": 518873, "epoch": 6251} {"train_loss": -27.619964599609375, "global_step": 518874, "epoch": 6251} {"train_loss": -27.715972900390625, "global_step": 518875, "epoch": 6251} {"train_loss": -27.476337432861328, "global_step": 518876, "epoch": 6251} {"train_loss": -26.922353744506836, "global_step": 518877, "epoch": 6251} {"train_loss": -27.478193283081055, "global_step": 518878, "epoch": 6251} {"train_loss": -27.251514434814453, "global_step": 518879, "epoch": 6251} {"train_loss": -27.328699111938477, "global_step": 518880, "epoch": 6251} {"train_loss": -27.510595321655273, "global_step": 518881, "epoch": 6251} {"train_loss": -27.53289794921875, "global_step": 518882, "epoch": 6251} {"train_loss": -27.870187759399414, "global_step": 518883, "epoch": 6251} {"train_loss": -27.613393783569336, "global_step": 518884, "epoch": 6251} {"train_loss": -27.478002548217773, "global_step": 518885, "epoch": 6251} {"train_loss": -27.686004638671875, "global_step": 518886, "epoch": 6251} {"train_loss": -27.667367935180664, "global_step": 518887, "epoch": 6251} {"train_loss": -27.814105987548828, "global_step": 518888, "epoch": 6251} {"train_loss": -27.550756454467773, "global_step": 518889, "epoch": 6251} {"train_loss": -27.828901290893555, "global_step": 518890, "epoch": 6251} {"train_loss": -27.71880531311035, "global_step": 518891, "epoch": 6251} {"train_loss": -27.37679100036621, "global_step": 518892, "epoch": 6251} {"train_loss": -27.661880493164062, "global_step": 518893, "epoch": 6251} {"train_loss": -27.71883201599121, "global_step": 518894, "epoch": 6251} {"train_loss": -27.852563858032227, "global_step": 518895, "epoch": 6251} {"train_loss": -27.865863800048828, "global_step": 518896, "epoch": 6251} {"train_loss": -27.380826950073242, "global_step": 518897, "epoch": 6251} {"train_loss": -27.847333908081055, "global_step": 518898, "epoch": 6251} {"train_loss": -27.70428466796875, "global_step": 518899, "epoch": 6251} {"train_loss": -27.6143856048584, "global_step": 518900, "epoch": 6251} {"train_loss": -27.8673152923584, "global_step": 518901, "epoch": 6251} {"train_loss": -27.459009170532227, "global_step": 518902, "epoch": 6251} {"train_loss": -27.629459381103516, "global_step": 518903, "epoch": 6251} {"train_loss": -27.704309463500977, "global_step": 518904, "epoch": 6251} {"train_loss": -27.696317672729492, "global_step": 518905, "epoch": 6251} {"train_loss": -27.60419273376465, "global_step": 518906, "epoch": 6251} {"train_loss": -27.1544246673584, "global_step": 518907, "epoch": 6251} {"train_loss": -27.374755859375, "global_step": 518908, "epoch": 6251} {"train_loss": -25.74489402770996, "global_step": 518909, "epoch": 6251} {"train_loss": -24.9909725189209, "global_step": 518910, "epoch": 6251} {"train_loss": -25.078588485717773, "global_step": 518911, "epoch": 6251} {"train_loss": -27.327924728393555, "global_step": 518912, "epoch": 6251} {"train_loss": -26.558338165283203, "global_step": 518913, "epoch": 6251} {"train_loss": -27.117694854736328, "global_step": 518914, "epoch": 6251} {"train_loss": -27.409013725188842, "global_step": 518915, "epoch": 6251, "val_loss": 6557607.0} {"train_loss": -26.376371383666992, "global_step": 518916, "epoch": 6252} {"train_loss": -26.045862197875977, "global_step": 518917, "epoch": 6252} {"train_loss": -26.2670841217041, "global_step": 518918, "epoch": 6252} {"train_loss": -26.448820114135742, "global_step": 518919, "epoch": 6252} {"train_loss": -26.277917861938477, "global_step": 518920, "epoch": 6252} {"train_loss": -25.9410343170166, "global_step": 518921, "epoch": 6252} {"train_loss": -26.3350830078125, "global_step": 518922, "epoch": 6252} {"train_loss": -25.912647247314453, "global_step": 518923, "epoch": 6252} {"train_loss": -26.590307235717773, "global_step": 518924, "epoch": 6252} {"train_loss": -26.433826446533203, "global_step": 518925, "epoch": 6252} {"train_loss": -26.506561279296875, "global_step": 518926, "epoch": 6252} {"train_loss": -26.400266647338867, "global_step": 518927, "epoch": 6252} {"train_loss": -26.467809677124023, "global_step": 518928, "epoch": 6252} {"train_loss": -26.6134033203125, "global_step": 518929, "epoch": 6252} {"train_loss": -26.97085952758789, "global_step": 518930, "epoch": 6252} {"train_loss": -26.291418075561523, "global_step": 518931, "epoch": 6252} {"train_loss": -26.710464477539062, "global_step": 518932, "epoch": 6252} {"train_loss": -26.562122344970703, "global_step": 518933, "epoch": 6252} {"train_loss": -26.596704483032227, "global_step": 518934, "epoch": 6252} {"train_loss": -26.823190689086914, "global_step": 518935, "epoch": 6252} {"train_loss": -26.77211570739746, "global_step": 518936, "epoch": 6252} {"train_loss": -26.992145538330078, "global_step": 518937, "epoch": 6252} {"train_loss": -26.8622989654541, "global_step": 518938, "epoch": 6252} {"train_loss": -27.336456298828125, "global_step": 518939, "epoch": 6252} {"train_loss": -26.88202476501465, "global_step": 518940, "epoch": 6252} {"train_loss": -27.16225242614746, "global_step": 518941, "epoch": 6252} {"train_loss": -26.882104873657227, "global_step": 518942, "epoch": 6252} {"train_loss": -26.955541610717773, "global_step": 518943, "epoch": 6252} {"train_loss": -27.410999298095703, "global_step": 518944, "epoch": 6252} {"train_loss": -26.929174423217773, "global_step": 518945, "epoch": 6252} {"train_loss": -27.1750545501709, "global_step": 518946, "epoch": 6252} {"train_loss": -27.439062118530273, "global_step": 518947, "epoch": 6252} {"train_loss": -27.455610275268555, "global_step": 518948, "epoch": 6252} {"train_loss": -27.227670669555664, "global_step": 518949, "epoch": 6252} {"train_loss": -27.23845863342285, "global_step": 518950, "epoch": 6252} {"train_loss": -27.17451286315918, "global_step": 518951, "epoch": 6252} {"train_loss": -27.54182243347168, "global_step": 518952, "epoch": 6252} {"train_loss": -27.328039169311523, "global_step": 518953, "epoch": 6252} {"train_loss": -26.933835983276367, "global_step": 518954, "epoch": 6252} {"train_loss": -27.054489135742188, "global_step": 518955, "epoch": 6252} {"train_loss": -27.31159782409668, "global_step": 518956, "epoch": 6252} {"train_loss": -27.226043701171875, "global_step": 518957, "epoch": 6252} {"train_loss": -27.5072078704834, "global_step": 518958, "epoch": 6252} {"train_loss": -27.659534454345703, "global_step": 518959, "epoch": 6252} {"train_loss": -26.90983009338379, "global_step": 518960, "epoch": 6252} {"train_loss": -27.90036392211914, "global_step": 518961, "epoch": 6252} {"train_loss": -27.190412521362305, "global_step": 518962, "epoch": 6252} {"train_loss": -27.645750045776367, "global_step": 518963, "epoch": 6252} {"train_loss": -27.152090072631836, "global_step": 518964, "epoch": 6252} {"train_loss": -27.521331787109375, "global_step": 518965, "epoch": 6252} {"train_loss": -27.32734489440918, "global_step": 518966, "epoch": 6252} {"train_loss": -27.124927520751953, "global_step": 518967, "epoch": 6252} {"train_loss": -27.435522079467773, "global_step": 518968, "epoch": 6252} {"train_loss": -27.417251586914062, "global_step": 518969, "epoch": 6252} {"train_loss": -27.08917808532715, "global_step": 518970, "epoch": 6252} {"train_loss": -26.700820922851562, "global_step": 518971, "epoch": 6252} {"train_loss": -26.691181182861328, "global_step": 518972, "epoch": 6252} {"train_loss": -27.2899112701416, "global_step": 518973, "epoch": 6252} {"train_loss": -27.170942306518555, "global_step": 518974, "epoch": 6252} {"train_loss": -26.795490264892578, "global_step": 518975, "epoch": 6252} {"train_loss": -27.390295028686523, "global_step": 518976, "epoch": 6252} {"train_loss": -27.21613883972168, "global_step": 518977, "epoch": 6252} {"train_loss": -27.346277236938477, "global_step": 518978, "epoch": 6252} {"train_loss": -27.520639419555664, "global_step": 518979, "epoch": 6252} {"train_loss": -27.084747314453125, "global_step": 518980, "epoch": 6252} {"train_loss": -27.069467544555664, "global_step": 518981, "epoch": 6252} {"train_loss": -27.07993507385254, "global_step": 518982, "epoch": 6252} {"train_loss": -27.43464469909668, "global_step": 518983, "epoch": 6252} {"train_loss": -27.507780075073242, "global_step": 518984, "epoch": 6252} {"train_loss": -27.35068702697754, "global_step": 518985, "epoch": 6252} {"train_loss": -27.3293514251709, "global_step": 518986, "epoch": 6252} {"train_loss": -27.844757080078125, "global_step": 518987, "epoch": 6252} {"train_loss": -27.676010131835938, "global_step": 518988, "epoch": 6252} {"train_loss": -27.706151962280273, "global_step": 518989, "epoch": 6252} {"train_loss": -27.75994300842285, "global_step": 518990, "epoch": 6252} {"train_loss": -27.49173355102539, "global_step": 518991, "epoch": 6252} {"train_loss": -27.673248291015625, "global_step": 518992, "epoch": 6252} {"train_loss": -27.41412353515625, "global_step": 518993, "epoch": 6252} {"train_loss": -27.5373477935791, "global_step": 518994, "epoch": 6252} {"train_loss": -27.750375747680664, "global_step": 518995, "epoch": 6252} {"train_loss": -27.65931510925293, "global_step": 518996, "epoch": 6252} {"train_loss": -27.76023292541504, "global_step": 518997, "epoch": 6252} {"train_loss": -27.075872283384026, "global_step": 518998, "epoch": 6252, "val_loss": 6529342.0} {"train_loss": -27.021265029907227, "global_step": 518999, "epoch": 6253} {"train_loss": -27.13471794128418, "global_step": 519000, "epoch": 6253} {"train_loss": -27.081384658813477, "global_step": 519001, "epoch": 6253} {"train_loss": -27.478601455688477, "global_step": 519002, "epoch": 6253} {"train_loss": -27.3239803314209, "global_step": 519003, "epoch": 6253} {"train_loss": -27.168588638305664, "global_step": 519004, "epoch": 6253} {"train_loss": -27.134084701538086, "global_step": 519005, "epoch": 6253} {"train_loss": -27.741287231445312, "global_step": 519006, "epoch": 6253} {"train_loss": -27.60023307800293, "global_step": 519007, "epoch": 6253} {"train_loss": -27.2332706451416, "global_step": 519008, "epoch": 6253} {"train_loss": -27.520177841186523, "global_step": 519009, "epoch": 6253} {"train_loss": -27.28302001953125, "global_step": 519010, "epoch": 6253} {"train_loss": -27.889135360717773, "global_step": 519011, "epoch": 6253} {"train_loss": -27.73833656311035, "global_step": 519012, "epoch": 6253} {"train_loss": -27.63254737854004, "global_step": 519013, "epoch": 6253} {"train_loss": -27.59783935546875, "global_step": 519014, "epoch": 6253} {"train_loss": -27.40460777282715, "global_step": 519015, "epoch": 6253} {"train_loss": -27.842132568359375, "global_step": 519016, "epoch": 6253} {"train_loss": -27.594486236572266, "global_step": 519017, "epoch": 6253} {"train_loss": -27.961811065673828, "global_step": 519018, "epoch": 6253} {"train_loss": -27.5978946685791, "global_step": 519019, "epoch": 6253} {"train_loss": -27.32797622680664, "global_step": 519020, "epoch": 6253} {"train_loss": -27.617822647094727, "global_step": 519021, "epoch": 6253} {"train_loss": -27.743345260620117, "global_step": 519022, "epoch": 6253} {"train_loss": -27.464187622070312, "global_step": 519023, "epoch": 6253} {"train_loss": -27.564899444580078, "global_step": 519024, "epoch": 6253} {"train_loss": -27.45212745666504, "global_step": 519025, "epoch": 6253} {"train_loss": -27.775922775268555, "global_step": 519026, "epoch": 6253} {"train_loss": -27.887048721313477, "global_step": 519027, "epoch": 6253} {"train_loss": -27.765827178955078, "global_step": 519028, "epoch": 6253} {"train_loss": -27.820032119750977, "global_step": 519029, "epoch": 6253} {"train_loss": -27.798303604125977, "global_step": 519030, "epoch": 6253} {"train_loss": -27.671003341674805, "global_step": 519031, "epoch": 6253} {"train_loss": -27.41131591796875, "global_step": 519032, "epoch": 6253} {"train_loss": -27.72940444946289, "global_step": 519033, "epoch": 6253} {"train_loss": -27.20050048828125, "global_step": 519034, "epoch": 6253} {"train_loss": -27.469884872436523, "global_step": 519035, "epoch": 6253} {"train_loss": -27.37290382385254, "global_step": 519036, "epoch": 6253} {"train_loss": -27.36673927307129, "global_step": 519037, "epoch": 6253} {"train_loss": -27.841779708862305, "global_step": 519038, "epoch": 6253} {"train_loss": -27.4913272857666, "global_step": 519039, "epoch": 6253} {"train_loss": -27.30254554748535, "global_step": 519040, "epoch": 6253} {"train_loss": -27.631885528564453, "global_step": 519041, "epoch": 6253} {"train_loss": -27.690872192382812, "global_step": 519042, "epoch": 6253} {"train_loss": -27.453998565673828, "global_step": 519043, "epoch": 6253} {"train_loss": -27.80974769592285, "global_step": 519044, "epoch": 6253} {"train_loss": -27.22468376159668, "global_step": 519045, "epoch": 6253} {"train_loss": -27.80777931213379, "global_step": 519046, "epoch": 6253} {"train_loss": -27.813791275024414, "global_step": 519047, "epoch": 6253} {"train_loss": -27.127548217773438, "global_step": 519048, "epoch": 6253} {"train_loss": -27.514083862304688, "global_step": 519049, "epoch": 6253} {"train_loss": -27.544462203979492, "global_step": 519050, "epoch": 6253} {"train_loss": -27.80978775024414, "global_step": 519051, "epoch": 6253} {"train_loss": -27.358108520507812, "global_step": 519052, "epoch": 6253} {"train_loss": -27.636091232299805, "global_step": 519053, "epoch": 6253} {"train_loss": -27.823659896850586, "global_step": 519054, "epoch": 6253} {"train_loss": -27.643667221069336, "global_step": 519055, "epoch": 6253} {"train_loss": -27.722888946533203, "global_step": 519056, "epoch": 6253} {"train_loss": -27.542081832885742, "global_step": 519057, "epoch": 6253} {"train_loss": -28.295774459838867, "global_step": 519058, "epoch": 6253} {"train_loss": -27.58201026916504, "global_step": 519059, "epoch": 6253} {"train_loss": -27.3877010345459, "global_step": 519060, "epoch": 6253} {"train_loss": -27.02118492126465, "global_step": 519061, "epoch": 6253} {"train_loss": -27.557546615600586, "global_step": 519062, "epoch": 6253} {"train_loss": -27.499713897705078, "global_step": 519063, "epoch": 6253} {"train_loss": -27.098621368408203, "global_step": 519064, "epoch": 6253} {"train_loss": -27.488859176635742, "global_step": 519065, "epoch": 6253} {"train_loss": -27.282459259033203, "global_step": 519066, "epoch": 6253} {"train_loss": -27.863245010375977, "global_step": 519067, "epoch": 6253} {"train_loss": -27.152368545532227, "global_step": 519068, "epoch": 6253} {"train_loss": -27.33340835571289, "global_step": 519069, "epoch": 6253} {"train_loss": -27.669158935546875, "global_step": 519070, "epoch": 6253} {"train_loss": -27.39759635925293, "global_step": 519071, "epoch": 6253} {"train_loss": -27.493017196655273, "global_step": 519072, "epoch": 6253} {"train_loss": -27.375686645507812, "global_step": 519073, "epoch": 6253} {"train_loss": -27.787841796875, "global_step": 519074, "epoch": 6253} {"train_loss": -27.80588722229004, "global_step": 519075, "epoch": 6253} {"train_loss": -27.564218521118164, "global_step": 519076, "epoch": 6253} {"train_loss": -27.623676300048828, "global_step": 519077, "epoch": 6253} {"train_loss": -27.736425399780273, "global_step": 519078, "epoch": 6253} {"train_loss": -27.413806915283203, "global_step": 519079, "epoch": 6253} {"train_loss": -27.348480224609375, "global_step": 519080, "epoch": 6253} {"train_loss": -27.538330744548016, "global_step": 519081, "epoch": 6253, "val_loss": 6543247.5} {"train_loss": -25.41766929626465, "global_step": 519082, "epoch": 6254} {"train_loss": -24.35927391052246, "global_step": 519083, "epoch": 6254} {"train_loss": -25.00634765625, "global_step": 519084, "epoch": 6254} {"train_loss": -25.837976455688477, "global_step": 519085, "epoch": 6254} {"train_loss": -26.129907608032227, "global_step": 519086, "epoch": 6254} {"train_loss": -26.501508712768555, "global_step": 519087, "epoch": 6254} {"train_loss": -25.91224479675293, "global_step": 519088, "epoch": 6254} {"train_loss": -26.073392868041992, "global_step": 519089, "epoch": 6254} {"train_loss": -26.553159713745117, "global_step": 519090, "epoch": 6254} {"train_loss": -26.232336044311523, "global_step": 519091, "epoch": 6254} {"train_loss": -26.652725219726562, "global_step": 519092, "epoch": 6254} {"train_loss": -26.348220825195312, "global_step": 519093, "epoch": 6254} {"train_loss": -26.641916275024414, "global_step": 519094, "epoch": 6254} {"train_loss": -26.58636474609375, "global_step": 519095, "epoch": 6254} {"train_loss": -26.327672958374023, "global_step": 519096, "epoch": 6254} {"train_loss": -26.37982177734375, "global_step": 519097, "epoch": 6254} {"train_loss": -27.030744552612305, "global_step": 519098, "epoch": 6254} {"train_loss": -26.466064453125, "global_step": 519099, "epoch": 6254} {"train_loss": -26.657978057861328, "global_step": 519100, "epoch": 6254} {"train_loss": -26.82474136352539, "global_step": 519101, "epoch": 6254} {"train_loss": -26.84722900390625, "global_step": 519102, "epoch": 6254} {"train_loss": -27.0819149017334, "global_step": 519103, "epoch": 6254} {"train_loss": -27.062625885009766, "global_step": 519104, "epoch": 6254} {"train_loss": -27.314624786376953, "global_step": 519105, "epoch": 6254} {"train_loss": -26.962757110595703, "global_step": 519106, "epoch": 6254} {"train_loss": -27.098346710205078, "global_step": 519107, "epoch": 6254} {"train_loss": -27.03759765625, "global_step": 519108, "epoch": 6254} {"train_loss": -27.007049560546875, "global_step": 519109, "epoch": 6254} {"train_loss": -26.869659423828125, "global_step": 519110, "epoch": 6254} {"train_loss": -27.0607967376709, "global_step": 519111, "epoch": 6254} {"train_loss": -27.203628540039062, "global_step": 519112, "epoch": 6254} {"train_loss": -27.228979110717773, "global_step": 519113, "epoch": 6254} {"train_loss": -27.31793212890625, "global_step": 519114, "epoch": 6254} {"train_loss": -27.388830184936523, "global_step": 519115, "epoch": 6254} {"train_loss": -27.25965690612793, "global_step": 519116, "epoch": 6254} {"train_loss": -27.308740615844727, "global_step": 519117, "epoch": 6254} {"train_loss": -27.613508224487305, "global_step": 519118, "epoch": 6254} {"train_loss": -27.256933212280273, "global_step": 519119, "epoch": 6254} {"train_loss": -27.628103256225586, "global_step": 519120, "epoch": 6254} {"train_loss": -27.524017333984375, "global_step": 519121, "epoch": 6254} {"train_loss": -27.602994918823242, "global_step": 519122, "epoch": 6254} {"train_loss": -27.060199737548828, "global_step": 519123, "epoch": 6254} {"train_loss": -27.68877601623535, "global_step": 519124, "epoch": 6254} {"train_loss": -27.221908569335938, "global_step": 519125, "epoch": 6254} {"train_loss": -27.739892959594727, "global_step": 519126, "epoch": 6254} {"train_loss": -27.621139526367188, "global_step": 519127, "epoch": 6254} {"train_loss": -27.64101219177246, "global_step": 519128, "epoch": 6254} {"train_loss": -27.813446044921875, "global_step": 519129, "epoch": 6254} {"train_loss": -27.676504135131836, "global_step": 519130, "epoch": 6254} {"train_loss": -27.528369903564453, "global_step": 519131, "epoch": 6254} {"train_loss": -27.925485610961914, "global_step": 519132, "epoch": 6254} {"train_loss": -27.93158531188965, "global_step": 519133, "epoch": 6254} {"train_loss": -27.5529727935791, "global_step": 519134, "epoch": 6254} {"train_loss": -27.90079116821289, "global_step": 519135, "epoch": 6254} {"train_loss": -27.426868438720703, "global_step": 519136, "epoch": 6254} {"train_loss": -27.913496017456055, "global_step": 519137, "epoch": 6254} {"train_loss": -27.852468490600586, "global_step": 519138, "epoch": 6254} {"train_loss": -27.4893741607666, "global_step": 519139, "epoch": 6254} {"train_loss": -27.574359893798828, "global_step": 519140, "epoch": 6254} {"train_loss": -27.426822662353516, "global_step": 519141, "epoch": 6254} {"train_loss": -27.44040870666504, "global_step": 519142, "epoch": 6254} {"train_loss": -27.311588287353516, "global_step": 519143, "epoch": 6254} {"train_loss": -27.20826530456543, "global_step": 519144, "epoch": 6254} {"train_loss": -26.562652587890625, "global_step": 519145, "epoch": 6254} {"train_loss": -27.19111442565918, "global_step": 519146, "epoch": 6254} {"train_loss": -27.36969566345215, "global_step": 519147, "epoch": 6254} {"train_loss": -27.47216796875, "global_step": 519148, "epoch": 6254} {"train_loss": -27.019201278686523, "global_step": 519149, "epoch": 6254} {"train_loss": -27.27176284790039, "global_step": 519150, "epoch": 6254} {"train_loss": -27.359155654907227, "global_step": 519151, "epoch": 6254} {"train_loss": -26.709211349487305, "global_step": 519152, "epoch": 6254} {"train_loss": -27.803831100463867, "global_step": 519153, "epoch": 6254} {"train_loss": -27.261693954467773, "global_step": 519154, "epoch": 6254} {"train_loss": -27.265365600585938, "global_step": 519155, "epoch": 6254} {"train_loss": -27.33888053894043, "global_step": 519156, "epoch": 6254} {"train_loss": -27.461042404174805, "global_step": 519157, "epoch": 6254} {"train_loss": -27.302717208862305, "global_step": 519158, "epoch": 6254} {"train_loss": -27.549854278564453, "global_step": 519159, "epoch": 6254} {"train_loss": -27.707609176635742, "global_step": 519160, "epoch": 6254} {"train_loss": -27.097030639648438, "global_step": 519161, "epoch": 6254} {"train_loss": -27.274396896362305, "global_step": 519162, "epoch": 6254} {"train_loss": -27.67462730407715, "global_step": 519163, "epoch": 6254} {"train_loss": -27.11555094891284, "global_step": 519164, "epoch": 6254, "val_loss": 6454560.0} {"train_loss": -26.970590591430664, "global_step": 519165, "epoch": 6255} {"train_loss": -26.773977279663086, "global_step": 519166, "epoch": 6255} {"train_loss": -27.28290367126465, "global_step": 519167, "epoch": 6255} {"train_loss": -27.02984046936035, "global_step": 519168, "epoch": 6255} {"train_loss": -27.2850341796875, "global_step": 519169, "epoch": 6255} {"train_loss": -27.077163696289062, "global_step": 519170, "epoch": 6255} {"train_loss": -27.30067253112793, "global_step": 519171, "epoch": 6255} {"train_loss": -27.312963485717773, "global_step": 519172, "epoch": 6255} {"train_loss": -27.397815704345703, "global_step": 519173, "epoch": 6255} {"train_loss": -27.26896095275879, "global_step": 519174, "epoch": 6255} {"train_loss": -27.638151168823242, "global_step": 519175, "epoch": 6255} {"train_loss": -27.406652450561523, "global_step": 519176, "epoch": 6255} {"train_loss": -27.17719078063965, "global_step": 519177, "epoch": 6255} {"train_loss": -27.364294052124023, "global_step": 519178, "epoch": 6255} {"train_loss": -27.512426376342773, "global_step": 519179, "epoch": 6255} {"train_loss": -27.232315063476562, "global_step": 519180, "epoch": 6255} {"train_loss": -27.74744987487793, "global_step": 519181, "epoch": 6255} {"train_loss": -27.355884552001953, "global_step": 519182, "epoch": 6255} {"train_loss": -27.15876579284668, "global_step": 519183, "epoch": 6255} {"train_loss": -27.407312393188477, "global_step": 519184, "epoch": 6255} {"train_loss": -27.607690811157227, "global_step": 519185, "epoch": 6255} {"train_loss": -26.951465606689453, "global_step": 519186, "epoch": 6255} {"train_loss": -27.34748649597168, "global_step": 519187, "epoch": 6255} {"train_loss": -27.73298454284668, "global_step": 519188, "epoch": 6255} {"train_loss": -27.47893714904785, "global_step": 519189, "epoch": 6255} {"train_loss": -27.446868896484375, "global_step": 519190, "epoch": 6255} {"train_loss": -27.373998641967773, "global_step": 519191, "epoch": 6255} {"train_loss": -27.825698852539062, "global_step": 519192, "epoch": 6255} {"train_loss": -27.418701171875, "global_step": 519193, "epoch": 6255} {"train_loss": -27.3375244140625, "global_step": 519194, "epoch": 6255} {"train_loss": -27.5585880279541, "global_step": 519195, "epoch": 6255} {"train_loss": -27.808429718017578, "global_step": 519196, "epoch": 6255} {"train_loss": -27.84810447692871, "global_step": 519197, "epoch": 6255} {"train_loss": -27.689289093017578, "global_step": 519198, "epoch": 6255} {"train_loss": -27.476892471313477, "global_step": 519199, "epoch": 6255} {"train_loss": -27.300413131713867, "global_step": 519200, "epoch": 6255} {"train_loss": -27.214725494384766, "global_step": 519201, "epoch": 6255} {"train_loss": -27.64056968688965, "global_step": 519202, "epoch": 6255} {"train_loss": -27.480182647705078, "global_step": 519203, "epoch": 6255} {"train_loss": -27.834228515625, "global_step": 519204, "epoch": 6255} {"train_loss": -27.548370361328125, "global_step": 519205, "epoch": 6255} {"train_loss": -27.159011840820312, "global_step": 519206, "epoch": 6255} {"train_loss": -27.386388778686523, "global_step": 519207, "epoch": 6255} {"train_loss": -27.38709831237793, "global_step": 519208, "epoch": 6255} {"train_loss": -27.623432159423828, "global_step": 519209, "epoch": 6255} {"train_loss": -27.200117111206055, "global_step": 519210, "epoch": 6255} {"train_loss": -27.396610260009766, "global_step": 519211, "epoch": 6255} {"train_loss": -27.03400993347168, "global_step": 519212, "epoch": 6255} {"train_loss": -27.783300399780273, "global_step": 519213, "epoch": 6255} {"train_loss": -27.476428985595703, "global_step": 519214, "epoch": 6255} {"train_loss": -27.491933822631836, "global_step": 519215, "epoch": 6255} {"train_loss": -27.2111873626709, "global_step": 519216, "epoch": 6255} {"train_loss": -27.454700469970703, "global_step": 519217, "epoch": 6255} {"train_loss": -27.782917022705078, "global_step": 519218, "epoch": 6255} {"train_loss": -27.77593421936035, "global_step": 519219, "epoch": 6255} {"train_loss": -27.63863182067871, "global_step": 519220, "epoch": 6255} {"train_loss": -27.516332626342773, "global_step": 519221, "epoch": 6255} {"train_loss": -27.582977294921875, "global_step": 519222, "epoch": 6255} {"train_loss": -27.446619033813477, "global_step": 519223, "epoch": 6255} {"train_loss": -27.39743423461914, "global_step": 519224, "epoch": 6255} {"train_loss": -27.23648452758789, "global_step": 519225, "epoch": 6255} {"train_loss": -27.75788688659668, "global_step": 519226, "epoch": 6255} {"train_loss": -27.58198356628418, "global_step": 519227, "epoch": 6255} {"train_loss": -27.450592041015625, "global_step": 519228, "epoch": 6255} {"train_loss": -27.5508975982666, "global_step": 519229, "epoch": 6255} {"train_loss": -27.280614852905273, "global_step": 519230, "epoch": 6255} {"train_loss": -27.15313148498535, "global_step": 519231, "epoch": 6255} {"train_loss": -27.591201782226562, "global_step": 519232, "epoch": 6255} {"train_loss": -27.635990142822266, "global_step": 519233, "epoch": 6255} {"train_loss": -27.141202926635742, "global_step": 519234, "epoch": 6255} {"train_loss": -27.56521987915039, "global_step": 519235, "epoch": 6255} {"train_loss": -27.544416427612305, "global_step": 519236, "epoch": 6255} {"train_loss": -27.50620460510254, "global_step": 519237, "epoch": 6255} {"train_loss": -27.60810661315918, "global_step": 519238, "epoch": 6255} {"train_loss": -27.97699546813965, "global_step": 519239, "epoch": 6255} {"train_loss": -27.528772354125977, "global_step": 519240, "epoch": 6255} {"train_loss": -27.403043746948242, "global_step": 519241, "epoch": 6255} {"train_loss": -27.3124942779541, "global_step": 519242, "epoch": 6255} {"train_loss": -27.65825843811035, "global_step": 519243, "epoch": 6255} {"train_loss": -27.828474044799805, "global_step": 519244, "epoch": 6255} {"train_loss": -27.217041015625, "global_step": 519245, "epoch": 6255} {"train_loss": -27.67476463317871, "global_step": 519246, "epoch": 6255} {"train_loss": -27.435235540550874, "global_step": 519247, "epoch": 6255, "val_loss": 6553491.0} {"train_loss": -27.048315048217773, "global_step": 519248, "epoch": 6256} {"train_loss": -26.770795822143555, "global_step": 519249, "epoch": 6256} {"train_loss": -26.75074577331543, "global_step": 519250, "epoch": 6256} {"train_loss": -27.193042755126953, "global_step": 519251, "epoch": 6256} {"train_loss": -27.2574405670166, "global_step": 519252, "epoch": 6256} {"train_loss": -26.794458389282227, "global_step": 519253, "epoch": 6256} {"train_loss": -27.29493522644043, "global_step": 519254, "epoch": 6256} {"train_loss": -26.831762313842773, "global_step": 519255, "epoch": 6256} {"train_loss": -26.89093589782715, "global_step": 519256, "epoch": 6256} {"train_loss": -27.324377059936523, "global_step": 519257, "epoch": 6256} {"train_loss": -26.9326171875, "global_step": 519258, "epoch": 6256} {"train_loss": -27.4118595123291, "global_step": 519259, "epoch": 6256} {"train_loss": -27.281042098999023, "global_step": 519260, "epoch": 6256} {"train_loss": -27.308670043945312, "global_step": 519261, "epoch": 6256} {"train_loss": -27.692413330078125, "global_step": 519262, "epoch": 6256} {"train_loss": -27.39969825744629, "global_step": 519263, "epoch": 6256} {"train_loss": -27.509607315063477, "global_step": 519264, "epoch": 6256} {"train_loss": -27.586877822875977, "global_step": 519265, "epoch": 6256} {"train_loss": -27.270328521728516, "global_step": 519266, "epoch": 6256} {"train_loss": -27.67471694946289, "global_step": 519267, "epoch": 6256} {"train_loss": -27.522653579711914, "global_step": 519268, "epoch": 6256} {"train_loss": -27.301990509033203, "global_step": 519269, "epoch": 6256} {"train_loss": -27.632795333862305, "global_step": 519270, "epoch": 6256} {"train_loss": -27.0975284576416, "global_step": 519271, "epoch": 6256} {"train_loss": -27.180028915405273, "global_step": 519272, "epoch": 6256} {"train_loss": -27.49994468688965, "global_step": 519273, "epoch": 6256} {"train_loss": -27.248123168945312, "global_step": 519274, "epoch": 6256} {"train_loss": -27.5057430267334, "global_step": 519275, "epoch": 6256} {"train_loss": -27.495450973510742, "global_step": 519276, "epoch": 6256} {"train_loss": -27.67036247253418, "global_step": 519277, "epoch": 6256} {"train_loss": -27.238525390625, "global_step": 519278, "epoch": 6256} {"train_loss": -27.275146484375, "global_step": 519279, "epoch": 6256} {"train_loss": -27.68696403503418, "global_step": 519280, "epoch": 6256} {"train_loss": -27.252307891845703, "global_step": 519281, "epoch": 6256} {"train_loss": -27.33745765686035, "global_step": 519282, "epoch": 6256} {"train_loss": -27.4771671295166, "global_step": 519283, "epoch": 6256} {"train_loss": -27.32655143737793, "global_step": 519284, "epoch": 6256} {"train_loss": -27.52630043029785, "global_step": 519285, "epoch": 6256} {"train_loss": -27.23472023010254, "global_step": 519286, "epoch": 6256} {"train_loss": -27.441513061523438, "global_step": 519287, "epoch": 6256} {"train_loss": -27.531869888305664, "global_step": 519288, "epoch": 6256} {"train_loss": -27.666288375854492, "global_step": 519289, "epoch": 6256} {"train_loss": -27.6854305267334, "global_step": 519290, "epoch": 6256} {"train_loss": -27.604883193969727, "global_step": 519291, "epoch": 6256} {"train_loss": -27.98493003845215, "global_step": 519292, "epoch": 6256} {"train_loss": -27.38193702697754, "global_step": 519293, "epoch": 6256} {"train_loss": -27.355798721313477, "global_step": 519294, "epoch": 6256} {"train_loss": -27.366077423095703, "global_step": 519295, "epoch": 6256} {"train_loss": -27.453540802001953, "global_step": 519296, "epoch": 6256} {"train_loss": -27.481521606445312, "global_step": 519297, "epoch": 6256} {"train_loss": -27.649322509765625, "global_step": 519298, "epoch": 6256} {"train_loss": -27.482030868530273, "global_step": 519299, "epoch": 6256} {"train_loss": -27.68230628967285, "global_step": 519300, "epoch": 6256} {"train_loss": -27.541065216064453, "global_step": 519301, "epoch": 6256} {"train_loss": -27.49163818359375, "global_step": 519302, "epoch": 6256} {"train_loss": -27.391077041625977, "global_step": 519303, "epoch": 6256} {"train_loss": -27.771732330322266, "global_step": 519304, "epoch": 6256} {"train_loss": -27.920270919799805, "global_step": 519305, "epoch": 6256} {"train_loss": -27.627490997314453, "global_step": 519306, "epoch": 6256} {"train_loss": -27.595849990844727, "global_step": 519307, "epoch": 6256} {"train_loss": -27.6435604095459, "global_step": 519308, "epoch": 6256} {"train_loss": -27.895465850830078, "global_step": 519309, "epoch": 6256} {"train_loss": -27.200855255126953, "global_step": 519310, "epoch": 6256} {"train_loss": -27.560440063476562, "global_step": 519311, "epoch": 6256} {"train_loss": -28.006561279296875, "global_step": 519312, "epoch": 6256} {"train_loss": -27.476058959960938, "global_step": 519313, "epoch": 6256} {"train_loss": -27.641637802124023, "global_step": 519314, "epoch": 6256} {"train_loss": -27.48431968688965, "global_step": 519315, "epoch": 6256} {"train_loss": -27.70513343811035, "global_step": 519316, "epoch": 6256} {"train_loss": -27.58133888244629, "global_step": 519317, "epoch": 6256} {"train_loss": -27.47385597229004, "global_step": 519318, "epoch": 6256} {"train_loss": -27.82838249206543, "global_step": 519319, "epoch": 6256} {"train_loss": -28.023645401000977, "global_step": 519320, "epoch": 6256} {"train_loss": -27.581640243530273, "global_step": 519321, "epoch": 6256} {"train_loss": -27.63215446472168, "global_step": 519322, "epoch": 6256} {"train_loss": -27.919818878173828, "global_step": 519323, "epoch": 6256} {"train_loss": -27.637847900390625, "global_step": 519324, "epoch": 6256} {"train_loss": -27.7156925201416, "global_step": 519325, "epoch": 6256} {"train_loss": -27.421960830688477, "global_step": 519326, "epoch": 6256} {"train_loss": -27.567224502563477, "global_step": 519327, "epoch": 6256} {"train_loss": -27.67548179626465, "global_step": 519328, "epoch": 6256} {"train_loss": -27.38887596130371, "global_step": 519329, "epoch": 6256} {"train_loss": -27.45632415219962, "global_step": 519330, "epoch": 6256, "val_loss": 6581659.0} {"train_loss": -25.718658447265625, "global_step": 519331, "epoch": 6257} {"train_loss": -20.868873596191406, "global_step": 519332, "epoch": 6257} {"train_loss": -18.937414169311523, "global_step": 519333, "epoch": 6257} {"train_loss": -25.731739044189453, "global_step": 519334, "epoch": 6257} {"train_loss": -23.479917526245117, "global_step": 519335, "epoch": 6257} {"train_loss": -26.001148223876953, "global_step": 519336, "epoch": 6257} {"train_loss": -24.39702796936035, "global_step": 519337, "epoch": 6257} {"train_loss": -25.620624542236328, "global_step": 519338, "epoch": 6257} {"train_loss": -25.644824981689453, "global_step": 519339, "epoch": 6257} {"train_loss": -25.82069206237793, "global_step": 519340, "epoch": 6257} {"train_loss": -25.805927276611328, "global_step": 519341, "epoch": 6257} {"train_loss": -26.185001373291016, "global_step": 519342, "epoch": 6257} {"train_loss": -26.208410263061523, "global_step": 519343, "epoch": 6257} {"train_loss": -26.062143325805664, "global_step": 519344, "epoch": 6257} {"train_loss": -25.9047908782959, "global_step": 519345, "epoch": 6257} {"train_loss": -26.20096206665039, "global_step": 519346, "epoch": 6257} {"train_loss": -26.55942153930664, "global_step": 519347, "epoch": 6257} {"train_loss": -26.5966854095459, "global_step": 519348, "epoch": 6257} {"train_loss": -26.295942306518555, "global_step": 519349, "epoch": 6257} {"train_loss": -26.234777450561523, "global_step": 519350, "epoch": 6257} {"train_loss": -26.529083251953125, "global_step": 519351, "epoch": 6257} {"train_loss": -26.331506729125977, "global_step": 519352, "epoch": 6257} {"train_loss": -26.409299850463867, "global_step": 519353, "epoch": 6257} {"train_loss": -26.530466079711914, "global_step": 519354, "epoch": 6257} {"train_loss": -26.744543075561523, "global_step": 519355, "epoch": 6257} {"train_loss": -26.98211097717285, "global_step": 519356, "epoch": 6257} {"train_loss": -27.18842124938965, "global_step": 519357, "epoch": 6257} {"train_loss": -26.72616958618164, "global_step": 519358, "epoch": 6257} {"train_loss": -26.611225128173828, "global_step": 519359, "epoch": 6257} {"train_loss": -27.034189224243164, "global_step": 519360, "epoch": 6257} {"train_loss": -26.402448654174805, "global_step": 519361, "epoch": 6257} {"train_loss": -26.8695068359375, "global_step": 519362, "epoch": 6257} {"train_loss": -27.052515029907227, "global_step": 519363, "epoch": 6257} {"train_loss": -26.893842697143555, "global_step": 519364, "epoch": 6257} {"train_loss": -26.6047306060791, "global_step": 519365, "epoch": 6257} {"train_loss": -26.885986328125, "global_step": 519366, "epoch": 6257} {"train_loss": -26.88421630859375, "global_step": 519367, "epoch": 6257} {"train_loss": -27.20347023010254, "global_step": 519368, "epoch": 6257} {"train_loss": -27.13494873046875, "global_step": 519369, "epoch": 6257} {"train_loss": -27.08099937438965, "global_step": 519370, "epoch": 6257} {"train_loss": -27.142242431640625, "global_step": 519371, "epoch": 6257} {"train_loss": -27.305200576782227, "global_step": 519372, "epoch": 6257} {"train_loss": -27.189252853393555, "global_step": 519373, "epoch": 6257} {"train_loss": -27.130491256713867, "global_step": 519374, "epoch": 6257} {"train_loss": -27.082630157470703, "global_step": 519375, "epoch": 6257} {"train_loss": -27.45277976989746, "global_step": 519376, "epoch": 6257} {"train_loss": -27.584228515625, "global_step": 519377, "epoch": 6257} {"train_loss": -27.42695426940918, "global_step": 519378, "epoch": 6257} {"train_loss": -27.309858322143555, "global_step": 519379, "epoch": 6257} {"train_loss": -27.53069496154785, "global_step": 519380, "epoch": 6257} {"train_loss": -27.350879669189453, "global_step": 519381, "epoch": 6257} {"train_loss": -27.257532119750977, "global_step": 519382, "epoch": 6257} {"train_loss": -27.62919044494629, "global_step": 519383, "epoch": 6257} {"train_loss": -27.455602645874023, "global_step": 519384, "epoch": 6257} {"train_loss": -27.474546432495117, "global_step": 519385, "epoch": 6257} {"train_loss": -27.15437889099121, "global_step": 519386, "epoch": 6257} {"train_loss": -27.557025909423828, "global_step": 519387, "epoch": 6257} {"train_loss": -27.620819091796875, "global_step": 519388, "epoch": 6257} {"train_loss": -27.630828857421875, "global_step": 519389, "epoch": 6257} {"train_loss": -27.18609619140625, "global_step": 519390, "epoch": 6257} {"train_loss": -27.68304443359375, "global_step": 519391, "epoch": 6257} {"train_loss": -27.413833618164062, "global_step": 519392, "epoch": 6257} {"train_loss": -27.620025634765625, "global_step": 519393, "epoch": 6257} {"train_loss": -27.3297176361084, "global_step": 519394, "epoch": 6257} {"train_loss": -27.49220085144043, "global_step": 519395, "epoch": 6257} {"train_loss": -27.88043785095215, "global_step": 519396, "epoch": 6257} {"train_loss": -27.507740020751953, "global_step": 519397, "epoch": 6257} {"train_loss": -27.183151245117188, "global_step": 519398, "epoch": 6257} {"train_loss": -27.547012329101562, "global_step": 519399, "epoch": 6257} {"train_loss": -27.389524459838867, "global_step": 519400, "epoch": 6257} {"train_loss": -27.174346923828125, "global_step": 519401, "epoch": 6257} {"train_loss": -27.833698272705078, "global_step": 519402, "epoch": 6257} {"train_loss": -27.14417839050293, "global_step": 519403, "epoch": 6257} {"train_loss": -27.711755752563477, "global_step": 519404, "epoch": 6257} {"train_loss": -27.116504669189453, "global_step": 519405, "epoch": 6257} {"train_loss": -27.949316024780273, "global_step": 519406, "epoch": 6257} {"train_loss": -27.461353302001953, "global_step": 519407, "epoch": 6257} {"train_loss": -27.613265991210938, "global_step": 519408, "epoch": 6257} {"train_loss": -27.57123374938965, "global_step": 519409, "epoch": 6257} {"train_loss": -27.54401969909668, "global_step": 519410, "epoch": 6257} {"train_loss": -27.255582809448242, "global_step": 519411, "epoch": 6257} {"train_loss": -27.420358657836914, "global_step": 519412, "epoch": 6257} {"train_loss": -26.73693974046822, "global_step": 519413, "epoch": 6257, "val_loss": 6544031.0} {"train_loss": -27.034772872924805, "global_step": 519414, "epoch": 6258} {"train_loss": -26.696731567382812, "global_step": 519415, "epoch": 6258} {"train_loss": -26.18802261352539, "global_step": 519416, "epoch": 6258} {"train_loss": -26.89919090270996, "global_step": 519417, "epoch": 6258} {"train_loss": -27.297637939453125, "global_step": 519418, "epoch": 6258} {"train_loss": -27.183734893798828, "global_step": 519419, "epoch": 6258} {"train_loss": -27.364221572875977, "global_step": 519420, "epoch": 6258} {"train_loss": -27.14979362487793, "global_step": 519421, "epoch": 6258} {"train_loss": -27.3558292388916, "global_step": 519422, "epoch": 6258} {"train_loss": -27.73699951171875, "global_step": 519423, "epoch": 6258} {"train_loss": -27.18372917175293, "global_step": 519424, "epoch": 6258} {"train_loss": -27.30951499938965, "global_step": 519425, "epoch": 6258} {"train_loss": -27.28312110900879, "global_step": 519426, "epoch": 6258} {"train_loss": -26.932172775268555, "global_step": 519427, "epoch": 6258} {"train_loss": -27.898700714111328, "global_step": 519428, "epoch": 6258} {"train_loss": -27.578237533569336, "global_step": 519429, "epoch": 6258} {"train_loss": -26.9824275970459, "global_step": 519430, "epoch": 6258} {"train_loss": -27.83515739440918, "global_step": 519431, "epoch": 6258} {"train_loss": -27.289020538330078, "global_step": 519432, "epoch": 6258} {"train_loss": -27.361053466796875, "global_step": 519433, "epoch": 6258} {"train_loss": -27.31305503845215, "global_step": 519434, "epoch": 6258} {"train_loss": -27.339008331298828, "global_step": 519435, "epoch": 6258} {"train_loss": -27.065465927124023, "global_step": 519436, "epoch": 6258} {"train_loss": -26.81477165222168, "global_step": 519437, "epoch": 6258} {"train_loss": -27.39314842224121, "global_step": 519438, "epoch": 6258} {"train_loss": -27.570707321166992, "global_step": 519439, "epoch": 6258} {"train_loss": -27.1463623046875, "global_step": 519440, "epoch": 6258} {"train_loss": -27.61556053161621, "global_step": 519441, "epoch": 6258} {"train_loss": -27.31561851501465, "global_step": 519442, "epoch": 6258} {"train_loss": -27.373401641845703, "global_step": 519443, "epoch": 6258} {"train_loss": -27.366857528686523, "global_step": 519444, "epoch": 6258} {"train_loss": -27.29509925842285, "global_step": 519445, "epoch": 6258} {"train_loss": -27.419513702392578, "global_step": 519446, "epoch": 6258} {"train_loss": -27.637914657592773, "global_step": 519447, "epoch": 6258} {"train_loss": -27.202545166015625, "global_step": 519448, "epoch": 6258} {"train_loss": -27.582763671875, "global_step": 519449, "epoch": 6258} {"train_loss": -27.665380477905273, "global_step": 519450, "epoch": 6258} {"train_loss": -27.683429718017578, "global_step": 519451, "epoch": 6258} {"train_loss": -27.549346923828125, "global_step": 519452, "epoch": 6258} {"train_loss": -27.485824584960938, "global_step": 519453, "epoch": 6258} {"train_loss": -27.4927921295166, "global_step": 519454, "epoch": 6258} {"train_loss": -27.534347534179688, "global_step": 519455, "epoch": 6258} {"train_loss": -27.36355972290039, "global_step": 519456, "epoch": 6258} {"train_loss": -27.41724967956543, "global_step": 519457, "epoch": 6258} {"train_loss": -27.81422233581543, "global_step": 519458, "epoch": 6258} {"train_loss": -27.428369522094727, "global_step": 519459, "epoch": 6258} {"train_loss": -27.8411865234375, "global_step": 519460, "epoch": 6258} {"train_loss": -27.42024040222168, "global_step": 519461, "epoch": 6258} {"train_loss": -27.886005401611328, "global_step": 519462, "epoch": 6258} {"train_loss": -27.6140193939209, "global_step": 519463, "epoch": 6258} {"train_loss": -27.660968780517578, "global_step": 519464, "epoch": 6258} {"train_loss": -27.374664306640625, "global_step": 519465, "epoch": 6258} {"train_loss": -27.730915069580078, "global_step": 519466, "epoch": 6258} {"train_loss": -27.706884384155273, "global_step": 519467, "epoch": 6258} {"train_loss": -27.466907501220703, "global_step": 519468, "epoch": 6258} {"train_loss": -27.6391544342041, "global_step": 519469, "epoch": 6258} {"train_loss": -27.492090225219727, "global_step": 519470, "epoch": 6258} {"train_loss": -27.088886260986328, "global_step": 519471, "epoch": 6258} {"train_loss": -27.710742950439453, "global_step": 519472, "epoch": 6258} {"train_loss": -27.411584854125977, "global_step": 519473, "epoch": 6258} {"train_loss": -27.821949005126953, "global_step": 519474, "epoch": 6258} {"train_loss": -27.438007354736328, "global_step": 519475, "epoch": 6258} {"train_loss": -27.722585678100586, "global_step": 519476, "epoch": 6258} {"train_loss": -27.705530166625977, "global_step": 519477, "epoch": 6258} {"train_loss": -27.693283081054688, "global_step": 519478, "epoch": 6258} {"train_loss": -27.760791778564453, "global_step": 519479, "epoch": 6258} {"train_loss": -27.48304557800293, "global_step": 519480, "epoch": 6258} {"train_loss": -27.9204158782959, "global_step": 519481, "epoch": 6258} {"train_loss": -27.452322006225586, "global_step": 519482, "epoch": 6258} {"train_loss": -27.470678329467773, "global_step": 519483, "epoch": 6258} {"train_loss": -27.258893966674805, "global_step": 519484, "epoch": 6258} {"train_loss": -27.199295043945312, "global_step": 519485, "epoch": 6258} {"train_loss": -27.543664932250977, "global_step": 519486, "epoch": 6258} {"train_loss": -27.432050704956055, "global_step": 519487, "epoch": 6258} {"train_loss": -27.387353897094727, "global_step": 519488, "epoch": 6258} {"train_loss": -27.478300094604492, "global_step": 519489, "epoch": 6258} {"train_loss": -27.495025634765625, "global_step": 519490, "epoch": 6258} {"train_loss": -27.3565731048584, "global_step": 519491, "epoch": 6258} {"train_loss": -27.797983169555664, "global_step": 519492, "epoch": 6258} {"train_loss": -27.657638549804688, "global_step": 519493, "epoch": 6258} {"train_loss": -27.83355140686035, "global_step": 519494, "epoch": 6258} {"train_loss": -27.62995719909668, "global_step": 519495, "epoch": 6258} {"train_loss": -27.461648872099726, "global_step": 519496, "epoch": 6258, "val_loss": 6424061.0} {"train_loss": -26.838903427124023, "global_step": 519497, "epoch": 6259} {"train_loss": -25.684263229370117, "global_step": 519498, "epoch": 6259} {"train_loss": -26.65907096862793, "global_step": 519499, "epoch": 6259} {"train_loss": -26.903860092163086, "global_step": 519500, "epoch": 6259} {"train_loss": -26.777868270874023, "global_step": 519501, "epoch": 6259} {"train_loss": -26.6176700592041, "global_step": 519502, "epoch": 6259} {"train_loss": -27.0244197845459, "global_step": 519503, "epoch": 6259} {"train_loss": -26.969879150390625, "global_step": 519504, "epoch": 6259} {"train_loss": -26.843923568725586, "global_step": 519505, "epoch": 6259} {"train_loss": -26.743371963500977, "global_step": 519506, "epoch": 6259} {"train_loss": -27.035505294799805, "global_step": 519507, "epoch": 6259} {"train_loss": -27.09518814086914, "global_step": 519508, "epoch": 6259} {"train_loss": -26.898557662963867, "global_step": 519509, "epoch": 6259} {"train_loss": -27.299591064453125, "global_step": 519510, "epoch": 6259} {"train_loss": -26.76235008239746, "global_step": 519511, "epoch": 6259} {"train_loss": -27.149341583251953, "global_step": 519512, "epoch": 6259} {"train_loss": -27.147855758666992, "global_step": 519513, "epoch": 6259} {"train_loss": -26.95794677734375, "global_step": 519514, "epoch": 6259} {"train_loss": -27.407373428344727, "global_step": 519515, "epoch": 6259} {"train_loss": -27.345870971679688, "global_step": 519516, "epoch": 6259} {"train_loss": -27.135766983032227, "global_step": 519517, "epoch": 6259} {"train_loss": -27.337188720703125, "global_step": 519518, "epoch": 6259} {"train_loss": -27.34466552734375, "global_step": 519519, "epoch": 6259} {"train_loss": -27.42994499206543, "global_step": 519520, "epoch": 6259} {"train_loss": -27.2730770111084, "global_step": 519521, "epoch": 6259} {"train_loss": -27.163227081298828, "global_step": 519522, "epoch": 6259} {"train_loss": -27.354963302612305, "global_step": 519523, "epoch": 6259} {"train_loss": -27.572614669799805, "global_step": 519524, "epoch": 6259} {"train_loss": -27.55109214782715, "global_step": 519525, "epoch": 6259} {"train_loss": -27.590438842773438, "global_step": 519526, "epoch": 6259} {"train_loss": -27.27365493774414, "global_step": 519527, "epoch": 6259} {"train_loss": -27.6612548828125, "global_step": 519528, "epoch": 6259} {"train_loss": -27.427289962768555, "global_step": 519529, "epoch": 6259} {"train_loss": -27.583362579345703, "global_step": 519530, "epoch": 6259} {"train_loss": -27.40985679626465, "global_step": 519531, "epoch": 6259} {"train_loss": -27.810565948486328, "global_step": 519532, "epoch": 6259} {"train_loss": -27.679479598999023, "global_step": 519533, "epoch": 6259} {"train_loss": -27.75247573852539, "global_step": 519534, "epoch": 6259} {"train_loss": -27.86688232421875, "global_step": 519535, "epoch": 6259} {"train_loss": -27.63429832458496, "global_step": 519536, "epoch": 6259} {"train_loss": -27.546981811523438, "global_step": 519537, "epoch": 6259} {"train_loss": -27.800445556640625, "global_step": 519538, "epoch": 6259} {"train_loss": -27.694486618041992, "global_step": 519539, "epoch": 6259} {"train_loss": -27.729511260986328, "global_step": 519540, "epoch": 6259} {"train_loss": -27.930150985717773, "global_step": 519541, "epoch": 6259} {"train_loss": -27.80633544921875, "global_step": 519542, "epoch": 6259} {"train_loss": -27.443683624267578, "global_step": 519543, "epoch": 6259} {"train_loss": -27.48560905456543, "global_step": 519544, "epoch": 6259} {"train_loss": -28.03553581237793, "global_step": 519545, "epoch": 6259} {"train_loss": -27.832611083984375, "global_step": 519546, "epoch": 6259} {"train_loss": -27.93424415588379, "global_step": 519547, "epoch": 6259} {"train_loss": -27.526159286499023, "global_step": 519548, "epoch": 6259} {"train_loss": -27.58490562438965, "global_step": 519549, "epoch": 6259} {"train_loss": -27.738208770751953, "global_step": 519550, "epoch": 6259} {"train_loss": -27.702463150024414, "global_step": 519551, "epoch": 6259} {"train_loss": -27.661258697509766, "global_step": 519552, "epoch": 6259} {"train_loss": -27.644428253173828, "global_step": 519553, "epoch": 6259} {"train_loss": -27.859527587890625, "global_step": 519554, "epoch": 6259} {"train_loss": -27.669803619384766, "global_step": 519555, "epoch": 6259} {"train_loss": -28.178955078125, "global_step": 519556, "epoch": 6259} {"train_loss": -27.514799118041992, "global_step": 519557, "epoch": 6259} {"train_loss": -27.912168502807617, "global_step": 519558, "epoch": 6259} {"train_loss": -27.770370483398438, "global_step": 519559, "epoch": 6259} {"train_loss": -27.4608154296875, "global_step": 519560, "epoch": 6259} {"train_loss": -27.01226806640625, "global_step": 519561, "epoch": 6259} {"train_loss": -26.740177154541016, "global_step": 519562, "epoch": 6259} {"train_loss": -26.64333152770996, "global_step": 519563, "epoch": 6259} {"train_loss": -26.986297607421875, "global_step": 519564, "epoch": 6259} {"train_loss": -27.798755645751953, "global_step": 519565, "epoch": 6259} {"train_loss": -27.212421417236328, "global_step": 519566, "epoch": 6259} {"train_loss": -27.304990768432617, "global_step": 519567, "epoch": 6259} {"train_loss": -27.345666885375977, "global_step": 519568, "epoch": 6259} {"train_loss": -27.205219268798828, "global_step": 519569, "epoch": 6259} {"train_loss": -27.64670753479004, "global_step": 519570, "epoch": 6259} {"train_loss": -27.621994018554688, "global_step": 519571, "epoch": 6259} {"train_loss": -27.32331657409668, "global_step": 519572, "epoch": 6259} {"train_loss": -27.419677734375, "global_step": 519573, "epoch": 6259} {"train_loss": -27.318017959594727, "global_step": 519574, "epoch": 6259} {"train_loss": -27.7064266204834, "global_step": 519575, "epoch": 6259} {"train_loss": -27.57221031188965, "global_step": 519576, "epoch": 6259} {"train_loss": -27.602624893188477, "global_step": 519577, "epoch": 6259} {"train_loss": -27.294513702392578, "global_step": 519578, "epoch": 6259} {"train_loss": -27.3795355141881, "global_step": 519579, "epoch": 6259, "val_loss": 6549969.0} {"train_loss": -27.544702529907227, "global_step": 519580, "epoch": 6260} {"train_loss": -26.734922409057617, "global_step": 519581, "epoch": 6260} {"train_loss": -27.062116622924805, "global_step": 519582, "epoch": 6260} {"train_loss": -27.335708618164062, "global_step": 519583, "epoch": 6260} {"train_loss": -26.72430419921875, "global_step": 519584, "epoch": 6260} {"train_loss": -26.863218307495117, "global_step": 519585, "epoch": 6260} {"train_loss": -27.022253036499023, "global_step": 519586, "epoch": 6260} {"train_loss": -27.301239013671875, "global_step": 519587, "epoch": 6260} {"train_loss": -26.540119171142578, "global_step": 519588, "epoch": 6260} {"train_loss": -26.466516494750977, "global_step": 519589, "epoch": 6260} {"train_loss": -27.10120964050293, "global_step": 519590, "epoch": 6260} {"train_loss": -27.308034896850586, "global_step": 519591, "epoch": 6260} {"train_loss": -26.97943687438965, "global_step": 519592, "epoch": 6260} {"train_loss": -27.23781394958496, "global_step": 519593, "epoch": 6260} {"train_loss": -26.882349014282227, "global_step": 519594, "epoch": 6260} {"train_loss": -27.162256240844727, "global_step": 519595, "epoch": 6260} {"train_loss": -27.19772720336914, "global_step": 519596, "epoch": 6260} {"train_loss": -27.337478637695312, "global_step": 519597, "epoch": 6260} {"train_loss": -27.17486572265625, "global_step": 519598, "epoch": 6260} {"train_loss": -27.525495529174805, "global_step": 519599, "epoch": 6260} {"train_loss": -26.960235595703125, "global_step": 519600, "epoch": 6260} {"train_loss": -27.399200439453125, "global_step": 519601, "epoch": 6260} {"train_loss": -27.218189239501953, "global_step": 519602, "epoch": 6260} {"train_loss": -26.85400390625, "global_step": 519603, "epoch": 6260} {"train_loss": -27.359088897705078, "global_step": 519604, "epoch": 6260} {"train_loss": -27.315338134765625, "global_step": 519605, "epoch": 6260} {"train_loss": -27.310766220092773, "global_step": 519606, "epoch": 6260} {"train_loss": -27.594568252563477, "global_step": 519607, "epoch": 6260} {"train_loss": -27.384063720703125, "global_step": 519608, "epoch": 6260} {"train_loss": -27.410125732421875, "global_step": 519609, "epoch": 6260} {"train_loss": -27.386829376220703, "global_step": 519610, "epoch": 6260} {"train_loss": -27.708723068237305, "global_step": 519611, "epoch": 6260} {"train_loss": -27.787967681884766, "global_step": 519612, "epoch": 6260} {"train_loss": -27.669357299804688, "global_step": 519613, "epoch": 6260} {"train_loss": -27.709325790405273, "global_step": 519614, "epoch": 6260} {"train_loss": -27.5947208404541, "global_step": 519615, "epoch": 6260} {"train_loss": -27.646650314331055, "global_step": 519616, "epoch": 6260} {"train_loss": -27.52040672302246, "global_step": 519617, "epoch": 6260} {"train_loss": -27.67930030822754, "global_step": 519618, "epoch": 6260} {"train_loss": -27.329004287719727, "global_step": 519619, "epoch": 6260} {"train_loss": -27.669418334960938, "global_step": 519620, "epoch": 6260} {"train_loss": -27.415725708007812, "global_step": 519621, "epoch": 6260} {"train_loss": -27.918127059936523, "global_step": 519622, "epoch": 6260} {"train_loss": -27.511341094970703, "global_step": 519623, "epoch": 6260} {"train_loss": -27.70488929748535, "global_step": 519624, "epoch": 6260} {"train_loss": -27.632740020751953, "global_step": 519625, "epoch": 6260} {"train_loss": -28.247486114501953, "global_step": 519626, "epoch": 6260} {"train_loss": -27.710927963256836, "global_step": 519627, "epoch": 6260} {"train_loss": -27.76751136779785, "global_step": 519628, "epoch": 6260} {"train_loss": -27.666738510131836, "global_step": 519629, "epoch": 6260} {"train_loss": -28.2037353515625, "global_step": 519630, "epoch": 6260} {"train_loss": -27.766559600830078, "global_step": 519631, "epoch": 6260} {"train_loss": -27.574819564819336, "global_step": 519632, "epoch": 6260} {"train_loss": -27.347909927368164, "global_step": 519633, "epoch": 6260} {"train_loss": -27.78521728515625, "global_step": 519634, "epoch": 6260} {"train_loss": -27.603076934814453, "global_step": 519635, "epoch": 6260} {"train_loss": -27.135089874267578, "global_step": 519636, "epoch": 6260} {"train_loss": -27.254791259765625, "global_step": 519637, "epoch": 6260} {"train_loss": -26.895898818969727, "global_step": 519638, "epoch": 6260} {"train_loss": -27.166278839111328, "global_step": 519639, "epoch": 6260} {"train_loss": -27.40705680847168, "global_step": 519640, "epoch": 6260} {"train_loss": -27.39170265197754, "global_step": 519641, "epoch": 6260} {"train_loss": -27.973953247070312, "global_step": 519642, "epoch": 6260} {"train_loss": -27.425373077392578, "global_step": 519643, "epoch": 6260} {"train_loss": -27.208398818969727, "global_step": 519644, "epoch": 6260} {"train_loss": -27.796466827392578, "global_step": 519645, "epoch": 6260} {"train_loss": -27.776025772094727, "global_step": 519646, "epoch": 6260} {"train_loss": -27.81690788269043, "global_step": 519647, "epoch": 6260} {"train_loss": -27.413192749023438, "global_step": 519648, "epoch": 6260} {"train_loss": -27.602554321289062, "global_step": 519649, "epoch": 6260} {"train_loss": -27.705347061157227, "global_step": 519650, "epoch": 6260} {"train_loss": -27.917194366455078, "global_step": 519651, "epoch": 6260} {"train_loss": -27.853479385375977, "global_step": 519652, "epoch": 6260} {"train_loss": -27.85731315612793, "global_step": 519653, "epoch": 6260} {"train_loss": -27.544071197509766, "global_step": 519654, "epoch": 6260} {"train_loss": -27.428312301635742, "global_step": 519655, "epoch": 6260} {"train_loss": -27.483060836791992, "global_step": 519656, "epoch": 6260} {"train_loss": -27.739736557006836, "global_step": 519657, "epoch": 6260} {"train_loss": -27.776487350463867, "global_step": 519658, "epoch": 6260} {"train_loss": -27.74774742126465, "global_step": 519659, "epoch": 6260} {"train_loss": -27.23687744140625, "global_step": 519660, "epoch": 6260} {"train_loss": -27.07325553894043, "global_step": 519661, "epoch": 6260} {"train_loss": -27.448128160223902, "global_step": 519662, "epoch": 6260, "val_loss": 6511343.5} {"train_loss": -26.843896865844727, "global_step": 519663, "epoch": 6261} {"train_loss": -26.62689781188965, "global_step": 519664, "epoch": 6261} {"train_loss": -26.230426788330078, "global_step": 519665, "epoch": 6261} {"train_loss": -27.438892364501953, "global_step": 519666, "epoch": 6261} {"train_loss": -26.970136642456055, "global_step": 519667, "epoch": 6261} {"train_loss": -27.26620864868164, "global_step": 519668, "epoch": 6261} {"train_loss": -26.706008911132812, "global_step": 519669, "epoch": 6261} {"train_loss": -26.702472686767578, "global_step": 519670, "epoch": 6261} {"train_loss": -27.12763786315918, "global_step": 519671, "epoch": 6261} {"train_loss": -27.020822525024414, "global_step": 519672, "epoch": 6261} {"train_loss": -27.182966232299805, "global_step": 519673, "epoch": 6261} {"train_loss": -27.094970703125, "global_step": 519674, "epoch": 6261} {"train_loss": -27.217910766601562, "global_step": 519675, "epoch": 6261} {"train_loss": -27.042837142944336, "global_step": 519676, "epoch": 6261} {"train_loss": -27.2984619140625, "global_step": 519677, "epoch": 6261} {"train_loss": -27.204425811767578, "global_step": 519678, "epoch": 6261} {"train_loss": -27.44529151916504, "global_step": 519679, "epoch": 6261} {"train_loss": -27.3574161529541, "global_step": 519680, "epoch": 6261} {"train_loss": -27.650745391845703, "global_step": 519681, "epoch": 6261} {"train_loss": -27.2941951751709, "global_step": 519682, "epoch": 6261} {"train_loss": -27.161916732788086, "global_step": 519683, "epoch": 6261} {"train_loss": -27.2007999420166, "global_step": 519684, "epoch": 6261} {"train_loss": -27.249374389648438, "global_step": 519685, "epoch": 6261} {"train_loss": -27.671350479125977, "global_step": 519686, "epoch": 6261} {"train_loss": -27.351490020751953, "global_step": 519687, "epoch": 6261} {"train_loss": -27.68132972717285, "global_step": 519688, "epoch": 6261} {"train_loss": -27.4846134185791, "global_step": 519689, "epoch": 6261} {"train_loss": -27.281784057617188, "global_step": 519690, "epoch": 6261} {"train_loss": -27.662540435791016, "global_step": 519691, "epoch": 6261} {"train_loss": -27.405630111694336, "global_step": 519692, "epoch": 6261} {"train_loss": -27.571401596069336, "global_step": 519693, "epoch": 6261} {"train_loss": -27.710681915283203, "global_step": 519694, "epoch": 6261} {"train_loss": -27.73651123046875, "global_step": 519695, "epoch": 6261} {"train_loss": -27.7379093170166, "global_step": 519696, "epoch": 6261} {"train_loss": -27.412694931030273, "global_step": 519697, "epoch": 6261} {"train_loss": -27.511804580688477, "global_step": 519698, "epoch": 6261} {"train_loss": -27.58513832092285, "global_step": 519699, "epoch": 6261} {"train_loss": -27.662403106689453, "global_step": 519700, "epoch": 6261} {"train_loss": -27.314722061157227, "global_step": 519701, "epoch": 6261} {"train_loss": -27.785680770874023, "global_step": 519702, "epoch": 6261} {"train_loss": -27.7822208404541, "global_step": 519703, "epoch": 6261} {"train_loss": -27.910125732421875, "global_step": 519704, "epoch": 6261} {"train_loss": -27.50738525390625, "global_step": 519705, "epoch": 6261} {"train_loss": -27.7137508392334, "global_step": 519706, "epoch": 6261} {"train_loss": -27.34600830078125, "global_step": 519707, "epoch": 6261} {"train_loss": -27.82539176940918, "global_step": 519708, "epoch": 6261} {"train_loss": -27.588199615478516, "global_step": 519709, "epoch": 6261} {"train_loss": -27.544931411743164, "global_step": 519710, "epoch": 6261} {"train_loss": -27.754135131835938, "global_step": 519711, "epoch": 6261} {"train_loss": -27.4964542388916, "global_step": 519712, "epoch": 6261} {"train_loss": -28.080183029174805, "global_step": 519713, "epoch": 6261} {"train_loss": -27.714704513549805, "global_step": 519714, "epoch": 6261} {"train_loss": -27.25672721862793, "global_step": 519715, "epoch": 6261} {"train_loss": -27.09919548034668, "global_step": 519716, "epoch": 6261} {"train_loss": -27.1099796295166, "global_step": 519717, "epoch": 6261} {"train_loss": -27.375741958618164, "global_step": 519718, "epoch": 6261} {"train_loss": -27.597370147705078, "global_step": 519719, "epoch": 6261} {"train_loss": -27.685049057006836, "global_step": 519720, "epoch": 6261} {"train_loss": -27.486713409423828, "global_step": 519721, "epoch": 6261} {"train_loss": -27.286046981811523, "global_step": 519722, "epoch": 6261} {"train_loss": -27.258718490600586, "global_step": 519723, "epoch": 6261} {"train_loss": -27.47242546081543, "global_step": 519724, "epoch": 6261} {"train_loss": -27.39631462097168, "global_step": 519725, "epoch": 6261} {"train_loss": -27.24605369567871, "global_step": 519726, "epoch": 6261} {"train_loss": -27.61614418029785, "global_step": 519727, "epoch": 6261} {"train_loss": -27.194568634033203, "global_step": 519728, "epoch": 6261} {"train_loss": -27.536901473999023, "global_step": 519729, "epoch": 6261} {"train_loss": -27.0826416015625, "global_step": 519730, "epoch": 6261} {"train_loss": -27.605178833007812, "global_step": 519731, "epoch": 6261} {"train_loss": -27.29154396057129, "global_step": 519732, "epoch": 6261} {"train_loss": -27.361066818237305, "global_step": 519733, "epoch": 6261} {"train_loss": -27.860502243041992, "global_step": 519734, "epoch": 6261} {"train_loss": -27.611902236938477, "global_step": 519735, "epoch": 6261} {"train_loss": -27.131887435913086, "global_step": 519736, "epoch": 6261} {"train_loss": -27.249963760375977, "global_step": 519737, "epoch": 6261} {"train_loss": -27.889892578125, "global_step": 519738, "epoch": 6261} {"train_loss": -27.39235496520996, "global_step": 519739, "epoch": 6261} {"train_loss": -27.737974166870117, "global_step": 519740, "epoch": 6261} {"train_loss": -27.94935417175293, "global_step": 519741, "epoch": 6261} {"train_loss": -27.779586791992188, "global_step": 519742, "epoch": 6261} {"train_loss": -27.649572372436523, "global_step": 519743, "epoch": 6261} {"train_loss": -27.824155807495117, "global_step": 519744, "epoch": 6261} {"train_loss": -27.40920599971909, "global_step": 519745, "epoch": 6261, "val_loss": 6530530.5} {"train_loss": -26.05328369140625, "global_step": 519746, "epoch": 6262} {"train_loss": -26.131072998046875, "global_step": 519747, "epoch": 6262} {"train_loss": -27.260229110717773, "global_step": 519748, "epoch": 6262} {"train_loss": -25.988813400268555, "global_step": 519749, "epoch": 6262} {"train_loss": -26.629629135131836, "global_step": 519750, "epoch": 6262} {"train_loss": -26.25410270690918, "global_step": 519751, "epoch": 6262} {"train_loss": -26.808725357055664, "global_step": 519752, "epoch": 6262} {"train_loss": -26.700910568237305, "global_step": 519753, "epoch": 6262} {"train_loss": -26.854352951049805, "global_step": 519754, "epoch": 6262} {"train_loss": -27.25660514831543, "global_step": 519755, "epoch": 6262} {"train_loss": -27.101242065429688, "global_step": 519756, "epoch": 6262} {"train_loss": -26.780317306518555, "global_step": 519757, "epoch": 6262} {"train_loss": -27.094465255737305, "global_step": 519758, "epoch": 6262} {"train_loss": -27.080137252807617, "global_step": 519759, "epoch": 6262} {"train_loss": -27.37632179260254, "global_step": 519760, "epoch": 6262} {"train_loss": -27.35440444946289, "global_step": 519761, "epoch": 6262} {"train_loss": -27.063467025756836, "global_step": 519762, "epoch": 6262} {"train_loss": -27.584020614624023, "global_step": 519763, "epoch": 6262} {"train_loss": -27.694198608398438, "global_step": 519764, "epoch": 6262} {"train_loss": -27.24725341796875, "global_step": 519765, "epoch": 6262} {"train_loss": -27.363706588745117, "global_step": 519766, "epoch": 6262} {"train_loss": -27.230070114135742, "global_step": 519767, "epoch": 6262} {"train_loss": -27.53533935546875, "global_step": 519768, "epoch": 6262} {"train_loss": -27.85894203186035, "global_step": 519769, "epoch": 6262} {"train_loss": -27.38575553894043, "global_step": 519770, "epoch": 6262} {"train_loss": -27.62592124938965, "global_step": 519771, "epoch": 6262} {"train_loss": -27.54546546936035, "global_step": 519772, "epoch": 6262} {"train_loss": -27.48415184020996, "global_step": 519773, "epoch": 6262} {"train_loss": -27.352096557617188, "global_step": 519774, "epoch": 6262} {"train_loss": -27.474456787109375, "global_step": 519775, "epoch": 6262} {"train_loss": -27.866180419921875, "global_step": 519776, "epoch": 6262} {"train_loss": -27.467639923095703, "global_step": 519777, "epoch": 6262} {"train_loss": -27.578527450561523, "global_step": 519778, "epoch": 6262} {"train_loss": -27.620304107666016, "global_step": 519779, "epoch": 6262} {"train_loss": -27.398603439331055, "global_step": 519780, "epoch": 6262} {"train_loss": -27.47281837463379, "global_step": 519781, "epoch": 6262} {"train_loss": -27.9716739654541, "global_step": 519782, "epoch": 6262} {"train_loss": -27.469633102416992, "global_step": 519783, "epoch": 6262} {"train_loss": -27.594165802001953, "global_step": 519784, "epoch": 6262} {"train_loss": -27.407438278198242, "global_step": 519785, "epoch": 6262} {"train_loss": -27.430761337280273, "global_step": 519786, "epoch": 6262} {"train_loss": -27.64548683166504, "global_step": 519787, "epoch": 6262} {"train_loss": -27.1984806060791, "global_step": 519788, "epoch": 6262} {"train_loss": -27.364822387695312, "global_step": 519789, "epoch": 6262} {"train_loss": -27.548933029174805, "global_step": 519790, "epoch": 6262} {"train_loss": -27.93385124206543, "global_step": 519791, "epoch": 6262} {"train_loss": -27.345539093017578, "global_step": 519792, "epoch": 6262} {"train_loss": -27.444456100463867, "global_step": 519793, "epoch": 6262} {"train_loss": -27.751489639282227, "global_step": 519794, "epoch": 6262} {"train_loss": -27.50542640686035, "global_step": 519795, "epoch": 6262} {"train_loss": -27.1720027923584, "global_step": 519796, "epoch": 6262} {"train_loss": -27.39131736755371, "global_step": 519797, "epoch": 6262} {"train_loss": -27.194183349609375, "global_step": 519798, "epoch": 6262} {"train_loss": -27.535266876220703, "global_step": 519799, "epoch": 6262} {"train_loss": -26.98512077331543, "global_step": 519800, "epoch": 6262} {"train_loss": -27.239233016967773, "global_step": 519801, "epoch": 6262} {"train_loss": -27.225194931030273, "global_step": 519802, "epoch": 6262} {"train_loss": -27.115537643432617, "global_step": 519803, "epoch": 6262} {"train_loss": -27.968017578125, "global_step": 519804, "epoch": 6262} {"train_loss": -27.527515411376953, "global_step": 519805, "epoch": 6262} {"train_loss": -27.516345977783203, "global_step": 519806, "epoch": 6262} {"train_loss": -27.279951095581055, "global_step": 519807, "epoch": 6262} {"train_loss": -27.911413192749023, "global_step": 519808, "epoch": 6262} {"train_loss": -27.52252769470215, "global_step": 519809, "epoch": 6262} {"train_loss": -27.249902725219727, "global_step": 519810, "epoch": 6262} {"train_loss": -27.494665145874023, "global_step": 519811, "epoch": 6262} {"train_loss": -27.46858024597168, "global_step": 519812, "epoch": 6262} {"train_loss": -27.63926124572754, "global_step": 519813, "epoch": 6262} {"train_loss": -27.978052139282227, "global_step": 519814, "epoch": 6262} {"train_loss": -27.31955337524414, "global_step": 519815, "epoch": 6262} {"train_loss": -27.0880126953125, "global_step": 519816, "epoch": 6262} {"train_loss": -27.52130126953125, "global_step": 519817, "epoch": 6262} {"train_loss": -27.594512939453125, "global_step": 519818, "epoch": 6262} {"train_loss": -27.50029945373535, "global_step": 519819, "epoch": 6262} {"train_loss": -27.38958740234375, "global_step": 519820, "epoch": 6262} {"train_loss": -27.61016845703125, "global_step": 519821, "epoch": 6262} {"train_loss": -27.8212890625, "global_step": 519822, "epoch": 6262} {"train_loss": -27.850433349609375, "global_step": 519823, "epoch": 6262} {"train_loss": -27.785314559936523, "global_step": 519824, "epoch": 6262} {"train_loss": -27.44769287109375, "global_step": 519825, "epoch": 6262} {"train_loss": -27.19111442565918, "global_step": 519826, "epoch": 6262} {"train_loss": -27.909900665283203, "global_step": 519827, "epoch": 6262} {"train_loss": -27.36056865554258, "global_step": 519828, "epoch": 6262, "val_loss": 6519387.0} {"train_loss": -24.133800506591797, "global_step": 519829, "epoch": 6263} {"train_loss": -24.22943687438965, "global_step": 519830, "epoch": 6263} {"train_loss": -25.00299072265625, "global_step": 519831, "epoch": 6263} {"train_loss": -25.48602867126465, "global_step": 519832, "epoch": 6263} {"train_loss": -24.25276756286621, "global_step": 519833, "epoch": 6263} {"train_loss": -25.66550064086914, "global_step": 519834, "epoch": 6263} {"train_loss": -25.654394149780273, "global_step": 519835, "epoch": 6263} {"train_loss": -26.030248641967773, "global_step": 519836, "epoch": 6263} {"train_loss": -25.401792526245117, "global_step": 519837, "epoch": 6263} {"train_loss": -26.42392349243164, "global_step": 519838, "epoch": 6263} {"train_loss": -25.881628036499023, "global_step": 519839, "epoch": 6263} {"train_loss": -26.476795196533203, "global_step": 519840, "epoch": 6263} {"train_loss": -25.692296981811523, "global_step": 519841, "epoch": 6263} {"train_loss": -26.637298583984375, "global_step": 519842, "epoch": 6263} {"train_loss": -25.986379623413086, "global_step": 519843, "epoch": 6263} {"train_loss": -26.45486831665039, "global_step": 519844, "epoch": 6263} {"train_loss": -26.410486221313477, "global_step": 519845, "epoch": 6263} {"train_loss": -26.454360961914062, "global_step": 519846, "epoch": 6263} {"train_loss": -26.592382431030273, "global_step": 519847, "epoch": 6263} {"train_loss": -26.696073532104492, "global_step": 519848, "epoch": 6263} {"train_loss": -27.13738441467285, "global_step": 519849, "epoch": 6263} {"train_loss": -26.795103073120117, "global_step": 519850, "epoch": 6263} {"train_loss": -27.131956100463867, "global_step": 519851, "epoch": 6263} {"train_loss": -27.1123104095459, "global_step": 519852, "epoch": 6263} {"train_loss": -26.540821075439453, "global_step": 519853, "epoch": 6263} {"train_loss": -26.54534912109375, "global_step": 519854, "epoch": 6263} {"train_loss": -26.57097816467285, "global_step": 519855, "epoch": 6263} {"train_loss": -26.77533531188965, "global_step": 519856, "epoch": 6263} {"train_loss": -26.90736961364746, "global_step": 519857, "epoch": 6263} {"train_loss": -27.297937393188477, "global_step": 519858, "epoch": 6263} {"train_loss": -26.871091842651367, "global_step": 519859, "epoch": 6263} {"train_loss": -27.10211181640625, "global_step": 519860, "epoch": 6263} {"train_loss": -27.07594108581543, "global_step": 519861, "epoch": 6263} {"train_loss": -27.13209342956543, "global_step": 519862, "epoch": 6263} {"train_loss": -27.117963790893555, "global_step": 519863, "epoch": 6263} {"train_loss": -27.427282333374023, "global_step": 519864, "epoch": 6263} {"train_loss": -27.569852828979492, "global_step": 519865, "epoch": 6263} {"train_loss": -27.1940975189209, "global_step": 519866, "epoch": 6263} {"train_loss": -27.127416610717773, "global_step": 519867, "epoch": 6263} {"train_loss": -27.193695068359375, "global_step": 519868, "epoch": 6263} {"train_loss": -27.10452651977539, "global_step": 519869, "epoch": 6263} {"train_loss": -27.50150489807129, "global_step": 519870, "epoch": 6263} {"train_loss": -27.42706298828125, "global_step": 519871, "epoch": 6263} {"train_loss": -27.68263053894043, "global_step": 519872, "epoch": 6263} {"train_loss": -27.13265037536621, "global_step": 519873, "epoch": 6263} {"train_loss": -27.590473175048828, "global_step": 519874, "epoch": 6263} {"train_loss": -27.4520206451416, "global_step": 519875, "epoch": 6263} {"train_loss": -27.635334014892578, "global_step": 519876, "epoch": 6263} {"train_loss": -27.79401969909668, "global_step": 519877, "epoch": 6263} {"train_loss": -27.444787979125977, "global_step": 519878, "epoch": 6263} {"train_loss": -27.852771759033203, "global_step": 519879, "epoch": 6263} {"train_loss": -27.191396713256836, "global_step": 519880, "epoch": 6263} {"train_loss": -27.449604034423828, "global_step": 519881, "epoch": 6263} {"train_loss": -27.477930068969727, "global_step": 519882, "epoch": 6263} {"train_loss": -27.492334365844727, "global_step": 519883, "epoch": 6263} {"train_loss": -27.680347442626953, "global_step": 519884, "epoch": 6263} {"train_loss": -27.4678955078125, "global_step": 519885, "epoch": 6263} {"train_loss": -27.84418296813965, "global_step": 519886, "epoch": 6263} {"train_loss": -27.912744522094727, "global_step": 519887, "epoch": 6263} {"train_loss": -27.591629028320312, "global_step": 519888, "epoch": 6263} {"train_loss": -27.546979904174805, "global_step": 519889, "epoch": 6263} {"train_loss": -28.09034538269043, "global_step": 519890, "epoch": 6263} {"train_loss": -27.593976974487305, "global_step": 519891, "epoch": 6263} {"train_loss": -27.6780948638916, "global_step": 519892, "epoch": 6263} {"train_loss": -27.66230583190918, "global_step": 519893, "epoch": 6263} {"train_loss": -27.53596305847168, "global_step": 519894, "epoch": 6263} {"train_loss": -27.51386833190918, "global_step": 519895, "epoch": 6263} {"train_loss": -27.965808868408203, "global_step": 519896, "epoch": 6263} {"train_loss": -27.834991455078125, "global_step": 519897, "epoch": 6263} {"train_loss": -27.41866111755371, "global_step": 519898, "epoch": 6263} {"train_loss": -27.665790557861328, "global_step": 519899, "epoch": 6263} {"train_loss": -27.708105087280273, "global_step": 519900, "epoch": 6263} {"train_loss": -27.571985244750977, "global_step": 519901, "epoch": 6263} {"train_loss": -27.400848388671875, "global_step": 519902, "epoch": 6263} {"train_loss": -27.65948486328125, "global_step": 519903, "epoch": 6263} {"train_loss": -27.1121883392334, "global_step": 519904, "epoch": 6263} {"train_loss": -27.98076820373535, "global_step": 519905, "epoch": 6263} {"train_loss": -27.913745880126953, "global_step": 519906, "epoch": 6263} {"train_loss": -27.803613662719727, "global_step": 519907, "epoch": 6263} {"train_loss": -27.14328956604004, "global_step": 519908, "epoch": 6263} {"train_loss": -27.462726593017578, "global_step": 519909, "epoch": 6263} {"train_loss": -27.686920166015625, "global_step": 519910, "epoch": 6263} {"train_loss": -27.006181487117907, "global_step": 519911, "epoch": 6263, "val_loss": 6507544.0} {"train_loss": -26.707990646362305, "global_step": 519912, "epoch": 6264} {"train_loss": -25.83391761779785, "global_step": 519913, "epoch": 6264} {"train_loss": -27.529190063476562, "global_step": 519914, "epoch": 6264} {"train_loss": -26.25910758972168, "global_step": 519915, "epoch": 6264} {"train_loss": -26.61964988708496, "global_step": 519916, "epoch": 6264} {"train_loss": -26.3414363861084, "global_step": 519917, "epoch": 6264} {"train_loss": -26.20134925842285, "global_step": 519918, "epoch": 6264} {"train_loss": -27.000415802001953, "global_step": 519919, "epoch": 6264} {"train_loss": -26.391071319580078, "global_step": 519920, "epoch": 6264} {"train_loss": -26.837621688842773, "global_step": 519921, "epoch": 6264} {"train_loss": -26.878681182861328, "global_step": 519922, "epoch": 6264} {"train_loss": -26.50885009765625, "global_step": 519923, "epoch": 6264} {"train_loss": -27.249242782592773, "global_step": 519924, "epoch": 6264} {"train_loss": -26.930591583251953, "global_step": 519925, "epoch": 6264} {"train_loss": -27.112369537353516, "global_step": 519926, "epoch": 6264} {"train_loss": -27.37158203125, "global_step": 519927, "epoch": 6264} {"train_loss": -26.69101333618164, "global_step": 519928, "epoch": 6264} {"train_loss": -27.26905632019043, "global_step": 519929, "epoch": 6264} {"train_loss": -27.116437911987305, "global_step": 519930, "epoch": 6264} {"train_loss": -27.456104278564453, "global_step": 519931, "epoch": 6264} {"train_loss": -26.928144454956055, "global_step": 519932, "epoch": 6264} {"train_loss": -27.464313507080078, "global_step": 519933, "epoch": 6264} {"train_loss": -26.829792022705078, "global_step": 519934, "epoch": 6264} {"train_loss": -27.550634384155273, "global_step": 519935, "epoch": 6264} {"train_loss": -26.84198570251465, "global_step": 519936, "epoch": 6264} {"train_loss": -27.324377059936523, "global_step": 519937, "epoch": 6264} {"train_loss": -27.25141716003418, "global_step": 519938, "epoch": 6264} {"train_loss": -27.520313262939453, "global_step": 519939, "epoch": 6264} {"train_loss": -27.324878692626953, "global_step": 519940, "epoch": 6264} {"train_loss": -27.512531280517578, "global_step": 519941, "epoch": 6264} {"train_loss": -27.179697036743164, "global_step": 519942, "epoch": 6264} {"train_loss": -27.451675415039062, "global_step": 519943, "epoch": 6264} {"train_loss": -27.28592300415039, "global_step": 519944, "epoch": 6264} {"train_loss": -27.42483901977539, "global_step": 519945, "epoch": 6264} {"train_loss": -27.426528930664062, "global_step": 519946, "epoch": 6264} {"train_loss": -27.859121322631836, "global_step": 519947, "epoch": 6264} {"train_loss": -27.57614517211914, "global_step": 519948, "epoch": 6264} {"train_loss": -27.58038902282715, "global_step": 519949, "epoch": 6264} {"train_loss": -27.664941787719727, "global_step": 519950, "epoch": 6264} {"train_loss": -27.463796615600586, "global_step": 519951, "epoch": 6264} {"train_loss": -27.697952270507812, "global_step": 519952, "epoch": 6264} {"train_loss": -27.490034103393555, "global_step": 519953, "epoch": 6264} {"train_loss": -27.482330322265625, "global_step": 519954, "epoch": 6264} {"train_loss": -27.43226432800293, "global_step": 519955, "epoch": 6264} {"train_loss": -27.742053985595703, "global_step": 519956, "epoch": 6264} {"train_loss": -27.756006240844727, "global_step": 519957, "epoch": 6264} {"train_loss": -27.942419052124023, "global_step": 519958, "epoch": 6264} {"train_loss": -27.604475021362305, "global_step": 519959, "epoch": 6264} {"train_loss": -27.695749282836914, "global_step": 519960, "epoch": 6264} {"train_loss": -27.709028244018555, "global_step": 519961, "epoch": 6264} {"train_loss": -27.865833282470703, "global_step": 519962, "epoch": 6264} {"train_loss": -28.18311882019043, "global_step": 519963, "epoch": 6264} {"train_loss": -27.589492797851562, "global_step": 519964, "epoch": 6264} {"train_loss": -27.555978775024414, "global_step": 519965, "epoch": 6264} {"train_loss": -27.58138084411621, "global_step": 519966, "epoch": 6264} {"train_loss": -27.768146514892578, "global_step": 519967, "epoch": 6264} {"train_loss": -27.459869384765625, "global_step": 519968, "epoch": 6264} {"train_loss": -27.56498146057129, "global_step": 519969, "epoch": 6264} {"train_loss": -27.815847396850586, "global_step": 519970, "epoch": 6264} {"train_loss": -27.821395874023438, "global_step": 519971, "epoch": 6264} {"train_loss": -27.834985733032227, "global_step": 519972, "epoch": 6264} {"train_loss": -27.777210235595703, "global_step": 519973, "epoch": 6264} {"train_loss": -27.60687828063965, "global_step": 519974, "epoch": 6264} {"train_loss": -27.971622467041016, "global_step": 519975, "epoch": 6264} {"train_loss": -28.016271591186523, "global_step": 519976, "epoch": 6264} {"train_loss": -27.93280029296875, "global_step": 519977, "epoch": 6264} {"train_loss": -27.78423500061035, "global_step": 519978, "epoch": 6264} {"train_loss": -27.673913955688477, "global_step": 519979, "epoch": 6264} {"train_loss": -27.748144149780273, "global_step": 519980, "epoch": 6264} {"train_loss": -27.42362403869629, "global_step": 519981, "epoch": 6264} {"train_loss": -27.876462936401367, "global_step": 519982, "epoch": 6264} {"train_loss": -28.037450790405273, "global_step": 519983, "epoch": 6264} {"train_loss": -27.813901901245117, "global_step": 519984, "epoch": 6264} {"train_loss": -27.77019691467285, "global_step": 519985, "epoch": 6264} {"train_loss": -27.898046493530273, "global_step": 519986, "epoch": 6264} {"train_loss": -27.36423110961914, "global_step": 519987, "epoch": 6264} {"train_loss": -27.57416343688965, "global_step": 519988, "epoch": 6264} {"train_loss": -27.713653564453125, "global_step": 519989, "epoch": 6264} {"train_loss": -27.8001651763916, "global_step": 519990, "epoch": 6264} {"train_loss": -27.7950496673584, "global_step": 519991, "epoch": 6264} {"train_loss": -27.716480255126953, "global_step": 519992, "epoch": 6264} {"train_loss": -27.805511474609375, "global_step": 519993, "epoch": 6264} {"train_loss": -27.41482952991164, "global_step": 519994, "epoch": 6264, "val_loss": 6568771.5} {"train_loss": -25.87737464904785, "global_step": 519995, "epoch": 6265} {"train_loss": -26.05128288269043, "global_step": 519996, "epoch": 6265} {"train_loss": -26.192651748657227, "global_step": 519997, "epoch": 6265} {"train_loss": -25.968976974487305, "global_step": 519998, "epoch": 6265} {"train_loss": -26.874561309814453, "global_step": 519999, "epoch": 6265} {"train_loss": -25.339757919311523, "global_step": 520000, "epoch": 6265} {"train_loss": -26.691513061523438, "global_step": 520001, "epoch": 6265} {"train_loss": -26.58167839050293, "global_step": 520002, "epoch": 6265} {"train_loss": -26.04034423828125, "global_step": 520003, "epoch": 6265} {"train_loss": -27.107633590698242, "global_step": 520004, "epoch": 6265} {"train_loss": -26.519994735717773, "global_step": 520005, "epoch": 6265} {"train_loss": -26.893354415893555, "global_step": 520006, "epoch": 6265} {"train_loss": -26.832599639892578, "global_step": 520007, "epoch": 6265} {"train_loss": -26.8339786529541, "global_step": 520008, "epoch": 6265} {"train_loss": -26.50571060180664, "global_step": 520009, "epoch": 6265} {"train_loss": -26.722747802734375, "global_step": 520010, "epoch": 6265} {"train_loss": -26.47443199157715, "global_step": 520011, "epoch": 6265} {"train_loss": -26.95429801940918, "global_step": 520012, "epoch": 6265} {"train_loss": -26.875898361206055, "global_step": 520013, "epoch": 6265} {"train_loss": -26.8588809967041, "global_step": 520014, "epoch": 6265} {"train_loss": -26.8581600189209, "global_step": 520015, "epoch": 6265} {"train_loss": -27.413572311401367, "global_step": 520016, "epoch": 6265} {"train_loss": -27.243505477905273, "global_step": 520017, "epoch": 6265} {"train_loss": -27.120361328125, "global_step": 520018, "epoch": 6265} {"train_loss": -27.309864044189453, "global_step": 520019, "epoch": 6265} {"train_loss": -27.293201446533203, "global_step": 520020, "epoch": 6265} {"train_loss": -27.16007423400879, "global_step": 520021, "epoch": 6265} {"train_loss": -27.48810386657715, "global_step": 520022, "epoch": 6265} {"train_loss": -27.38372230529785, "global_step": 520023, "epoch": 6265} {"train_loss": -26.757532119750977, "global_step": 520024, "epoch": 6265} {"train_loss": -27.1497745513916, "global_step": 520025, "epoch": 6265} {"train_loss": -27.449567794799805, "global_step": 520026, "epoch": 6265} {"train_loss": -27.6054630279541, "global_step": 520027, "epoch": 6265} {"train_loss": -27.2712345123291, "global_step": 520028, "epoch": 6265} {"train_loss": -27.544458389282227, "global_step": 520029, "epoch": 6265} {"train_loss": -27.633819580078125, "global_step": 520030, "epoch": 6265} {"train_loss": -27.394912719726562, "global_step": 520031, "epoch": 6265} {"train_loss": -27.5565242767334, "global_step": 520032, "epoch": 6265} {"train_loss": -27.592798233032227, "global_step": 520033, "epoch": 6265} {"train_loss": -27.530786514282227, "global_step": 520034, "epoch": 6265} {"train_loss": -27.349496841430664, "global_step": 520035, "epoch": 6265} {"train_loss": -27.594043731689453, "global_step": 520036, "epoch": 6265} {"train_loss": -27.493778228759766, "global_step": 520037, "epoch": 6265} {"train_loss": -27.320316314697266, "global_step": 520038, "epoch": 6265} {"train_loss": -27.84645652770996, "global_step": 520039, "epoch": 6265} {"train_loss": -27.705429077148438, "global_step": 520040, "epoch": 6265} {"train_loss": -27.675220489501953, "global_step": 520041, "epoch": 6265} {"train_loss": -27.613107681274414, "global_step": 520042, "epoch": 6265} {"train_loss": -27.408002853393555, "global_step": 520043, "epoch": 6265} {"train_loss": -27.812179565429688, "global_step": 520044, "epoch": 6265} {"train_loss": -27.5916805267334, "global_step": 520045, "epoch": 6265} {"train_loss": -27.95453453063965, "global_step": 520046, "epoch": 6265} {"train_loss": -27.917423248291016, "global_step": 520047, "epoch": 6265} {"train_loss": -27.383405685424805, "global_step": 520048, "epoch": 6265} {"train_loss": -27.455533981323242, "global_step": 520049, "epoch": 6265} {"train_loss": -27.652618408203125, "global_step": 520050, "epoch": 6265} {"train_loss": -27.92816162109375, "global_step": 520051, "epoch": 6265} {"train_loss": -27.584142684936523, "global_step": 520052, "epoch": 6265} {"train_loss": -27.6633358001709, "global_step": 520053, "epoch": 6265} {"train_loss": -28.01942253112793, "global_step": 520054, "epoch": 6265} {"train_loss": -27.670673370361328, "global_step": 520055, "epoch": 6265} {"train_loss": -27.588266372680664, "global_step": 520056, "epoch": 6265} {"train_loss": -27.6751708984375, "global_step": 520057, "epoch": 6265} {"train_loss": -28.054840087890625, "global_step": 520058, "epoch": 6265} {"train_loss": -27.43806266784668, "global_step": 520059, "epoch": 6265} {"train_loss": -27.5103702545166, "global_step": 520060, "epoch": 6265} {"train_loss": -27.5491886138916, "global_step": 520061, "epoch": 6265} {"train_loss": -27.383747100830078, "global_step": 520062, "epoch": 6265} {"train_loss": -27.123441696166992, "global_step": 520063, "epoch": 6265} {"train_loss": -27.75979995727539, "global_step": 520064, "epoch": 6265} {"train_loss": -27.59588623046875, "global_step": 520065, "epoch": 6265} {"train_loss": -27.7042236328125, "global_step": 520066, "epoch": 6265} {"train_loss": -27.80596351623535, "global_step": 520067, "epoch": 6265} {"train_loss": -27.450159072875977, "global_step": 520068, "epoch": 6265} {"train_loss": -27.89283561706543, "global_step": 520069, "epoch": 6265} {"train_loss": -27.410390853881836, "global_step": 520070, "epoch": 6265} {"train_loss": -27.762451171875, "global_step": 520071, "epoch": 6265} {"train_loss": -27.690231323242188, "global_step": 520072, "epoch": 6265} {"train_loss": -27.724767684936523, "global_step": 520073, "epoch": 6265} {"train_loss": -27.65185546875, "global_step": 520074, "epoch": 6265} {"train_loss": -27.16155433654785, "global_step": 520075, "epoch": 6265} {"train_loss": -27.513471603393555, "global_step": 520076, "epoch": 6265} {"train_loss": -27.260032998510155, "global_step": 520077, "epoch": 6265, "val_loss": 6512842.5} {"train_loss": -26.6758975982666, "global_step": 520078, "epoch": 6266} {"train_loss": -26.555219650268555, "global_step": 520079, "epoch": 6266} {"train_loss": -27.164281845092773, "global_step": 520080, "epoch": 6266} {"train_loss": -26.9901065826416, "global_step": 520081, "epoch": 6266} {"train_loss": -26.9589900970459, "global_step": 520082, "epoch": 6266} {"train_loss": -26.76031494140625, "global_step": 520083, "epoch": 6266} {"train_loss": -27.461835861206055, "global_step": 520084, "epoch": 6266} {"train_loss": -27.056690216064453, "global_step": 520085, "epoch": 6266} {"train_loss": -26.560400009155273, "global_step": 520086, "epoch": 6266} {"train_loss": -27.465497970581055, "global_step": 520087, "epoch": 6266} {"train_loss": -26.349241256713867, "global_step": 520088, "epoch": 6266} {"train_loss": -27.176488876342773, "global_step": 520089, "epoch": 6266} {"train_loss": -26.470624923706055, "global_step": 520090, "epoch": 6266} {"train_loss": -26.974475860595703, "global_step": 520091, "epoch": 6266} {"train_loss": -26.976276397705078, "global_step": 520092, "epoch": 6266} {"train_loss": -27.321455001831055, "global_step": 520093, "epoch": 6266} {"train_loss": -27.0175838470459, "global_step": 520094, "epoch": 6266} {"train_loss": -27.368335723876953, "global_step": 520095, "epoch": 6266} {"train_loss": -26.859760284423828, "global_step": 520096, "epoch": 6266} {"train_loss": -27.429121017456055, "global_step": 520097, "epoch": 6266} {"train_loss": -27.119354248046875, "global_step": 520098, "epoch": 6266} {"train_loss": -27.492345809936523, "global_step": 520099, "epoch": 6266} {"train_loss": -27.207273483276367, "global_step": 520100, "epoch": 6266} {"train_loss": -27.109577178955078, "global_step": 520101, "epoch": 6266} {"train_loss": -27.0537052154541, "global_step": 520102, "epoch": 6266} {"train_loss": -27.597980499267578, "global_step": 520103, "epoch": 6266} {"train_loss": -27.472822189331055, "global_step": 520104, "epoch": 6266} {"train_loss": -27.353307723999023, "global_step": 520105, "epoch": 6266} {"train_loss": -27.23663902282715, "global_step": 520106, "epoch": 6266} {"train_loss": -27.556447982788086, "global_step": 520107, "epoch": 6266} {"train_loss": -27.84439468383789, "global_step": 520108, "epoch": 6266} {"train_loss": -27.423492431640625, "global_step": 520109, "epoch": 6266} {"train_loss": -27.63616371154785, "global_step": 520110, "epoch": 6266} {"train_loss": -27.62409782409668, "global_step": 520111, "epoch": 6266} {"train_loss": -27.1351375579834, "global_step": 520112, "epoch": 6266} {"train_loss": -27.73054313659668, "global_step": 520113, "epoch": 6266} {"train_loss": -27.216894149780273, "global_step": 520114, "epoch": 6266} {"train_loss": -27.512298583984375, "global_step": 520115, "epoch": 6266} {"train_loss": -27.46490478515625, "global_step": 520116, "epoch": 6266} {"train_loss": -27.264978408813477, "global_step": 520117, "epoch": 6266} {"train_loss": -27.41407585144043, "global_step": 520118, "epoch": 6266} {"train_loss": -27.233488082885742, "global_step": 520119, "epoch": 6266} {"train_loss": -27.591882705688477, "global_step": 520120, "epoch": 6266} {"train_loss": -27.42413330078125, "global_step": 520121, "epoch": 6266} {"train_loss": -27.689960479736328, "global_step": 520122, "epoch": 6266} {"train_loss": -27.334365844726562, "global_step": 520123, "epoch": 6266} {"train_loss": -27.831745147705078, "global_step": 520124, "epoch": 6266} {"train_loss": -27.425268173217773, "global_step": 520125, "epoch": 6266} {"train_loss": -27.62415885925293, "global_step": 520126, "epoch": 6266} {"train_loss": -27.772491455078125, "global_step": 520127, "epoch": 6266} {"train_loss": -27.586069107055664, "global_step": 520128, "epoch": 6266} {"train_loss": -27.518890380859375, "global_step": 520129, "epoch": 6266} {"train_loss": -27.491500854492188, "global_step": 520130, "epoch": 6266} {"train_loss": -27.644338607788086, "global_step": 520131, "epoch": 6266} {"train_loss": -27.592695236206055, "global_step": 520132, "epoch": 6266} {"train_loss": -28.268869400024414, "global_step": 520133, "epoch": 6266} {"train_loss": -27.238422393798828, "global_step": 520134, "epoch": 6266} {"train_loss": -27.628713607788086, "global_step": 520135, "epoch": 6266} {"train_loss": -27.577838897705078, "global_step": 520136, "epoch": 6266} {"train_loss": -26.958459854125977, "global_step": 520137, "epoch": 6266} {"train_loss": -27.715229034423828, "global_step": 520138, "epoch": 6266} {"train_loss": -27.334293365478516, "global_step": 520139, "epoch": 6266} {"train_loss": -27.794294357299805, "global_step": 520140, "epoch": 6266} {"train_loss": -27.423664093017578, "global_step": 520141, "epoch": 6266} {"train_loss": -27.186355590820312, "global_step": 520142, "epoch": 6266} {"train_loss": -27.725309371948242, "global_step": 520143, "epoch": 6266} {"train_loss": -27.092456817626953, "global_step": 520144, "epoch": 6266} {"train_loss": -27.70943260192871, "global_step": 520145, "epoch": 6266} {"train_loss": -27.24659538269043, "global_step": 520146, "epoch": 6266} {"train_loss": -27.603113174438477, "global_step": 520147, "epoch": 6266} {"train_loss": -27.546649932861328, "global_step": 520148, "epoch": 6266} {"train_loss": -27.48927116394043, "global_step": 520149, "epoch": 6266} {"train_loss": -27.727996826171875, "global_step": 520150, "epoch": 6266} {"train_loss": -27.47358512878418, "global_step": 520151, "epoch": 6266} {"train_loss": -27.64821434020996, "global_step": 520152, "epoch": 6266} {"train_loss": -27.08817481994629, "global_step": 520153, "epoch": 6266} {"train_loss": -26.812183380126953, "global_step": 520154, "epoch": 6266} {"train_loss": -27.622669219970703, "global_step": 520155, "epoch": 6266} {"train_loss": -27.324079513549805, "global_step": 520156, "epoch": 6266} {"train_loss": -27.629751205444336, "global_step": 520157, "epoch": 6266} {"train_loss": -27.33340835571289, "global_step": 520158, "epoch": 6266} {"train_loss": -27.0523624420166, "global_step": 520159, "epoch": 6266} {"train_loss": -27.343652702239623, "global_step": 520160, "epoch": 6266, "val_loss": 6475067.5} {"train_loss": -26.045135498046875, "global_step": 520161, "epoch": 6267} {"train_loss": -25.973291397094727, "global_step": 520162, "epoch": 6267} {"train_loss": -26.411890029907227, "global_step": 520163, "epoch": 6267} {"train_loss": -26.528593063354492, "global_step": 520164, "epoch": 6267} {"train_loss": -26.846027374267578, "global_step": 520165, "epoch": 6267} {"train_loss": -26.041126251220703, "global_step": 520166, "epoch": 6267} {"train_loss": -26.515979766845703, "global_step": 520167, "epoch": 6267} {"train_loss": -26.806293487548828, "global_step": 520168, "epoch": 6267} {"train_loss": -26.812122344970703, "global_step": 520169, "epoch": 6267} {"train_loss": -27.01740837097168, "global_step": 520170, "epoch": 6267} {"train_loss": -27.1127872467041, "global_step": 520171, "epoch": 6267} {"train_loss": -26.89459228515625, "global_step": 520172, "epoch": 6267} {"train_loss": -27.215574264526367, "global_step": 520173, "epoch": 6267} {"train_loss": -27.351226806640625, "global_step": 520174, "epoch": 6267} {"train_loss": -27.08680534362793, "global_step": 520175, "epoch": 6267} {"train_loss": -27.445676803588867, "global_step": 520176, "epoch": 6267} {"train_loss": -27.347461700439453, "global_step": 520177, "epoch": 6267} {"train_loss": -27.3700008392334, "global_step": 520178, "epoch": 6267} {"train_loss": -27.54813003540039, "global_step": 520179, "epoch": 6267} {"train_loss": -27.622196197509766, "global_step": 520180, "epoch": 6267} {"train_loss": -27.497793197631836, "global_step": 520181, "epoch": 6267} {"train_loss": -27.580228805541992, "global_step": 520182, "epoch": 6267} {"train_loss": -27.35487174987793, "global_step": 520183, "epoch": 6267} {"train_loss": -27.117340087890625, "global_step": 520184, "epoch": 6267} {"train_loss": -27.589014053344727, "global_step": 520185, "epoch": 6267} {"train_loss": -27.415924072265625, "global_step": 520186, "epoch": 6267} {"train_loss": -27.321918487548828, "global_step": 520187, "epoch": 6267} {"train_loss": -27.453657150268555, "global_step": 520188, "epoch": 6267} {"train_loss": -27.5144100189209, "global_step": 520189, "epoch": 6267} {"train_loss": -27.790607452392578, "global_step": 520190, "epoch": 6267} {"train_loss": -27.363113403320312, "global_step": 520191, "epoch": 6267} {"train_loss": -27.558286666870117, "global_step": 520192, "epoch": 6267} {"train_loss": -27.71634292602539, "global_step": 520193, "epoch": 6267} {"train_loss": -27.81019401550293, "global_step": 520194, "epoch": 6267} {"train_loss": -27.903310775756836, "global_step": 520195, "epoch": 6267} {"train_loss": -27.781930923461914, "global_step": 520196, "epoch": 6267} {"train_loss": -27.66208839416504, "global_step": 520197, "epoch": 6267} {"train_loss": -27.653852462768555, "global_step": 520198, "epoch": 6267} {"train_loss": -27.995092391967773, "global_step": 520199, "epoch": 6267} {"train_loss": -27.7825927734375, "global_step": 520200, "epoch": 6267} {"train_loss": -28.109420776367188, "global_step": 520201, "epoch": 6267} {"train_loss": -27.72047996520996, "global_step": 520202, "epoch": 6267} {"train_loss": -27.794172286987305, "global_step": 520203, "epoch": 6267} {"train_loss": -27.6513729095459, "global_step": 520204, "epoch": 6267} {"train_loss": -27.849462509155273, "global_step": 520205, "epoch": 6267} {"train_loss": -27.366226196289062, "global_step": 520206, "epoch": 6267} {"train_loss": -27.597156524658203, "global_step": 520207, "epoch": 6267} {"train_loss": -27.677343368530273, "global_step": 520208, "epoch": 6267} {"train_loss": -27.780759811401367, "global_step": 520209, "epoch": 6267} {"train_loss": -27.83930015563965, "global_step": 520210, "epoch": 6267} {"train_loss": -28.065881729125977, "global_step": 520211, "epoch": 6267} {"train_loss": -27.66019630432129, "global_step": 520212, "epoch": 6267} {"train_loss": -27.60023307800293, "global_step": 520213, "epoch": 6267} {"train_loss": -27.835229873657227, "global_step": 520214, "epoch": 6267} {"train_loss": -27.31406593322754, "global_step": 520215, "epoch": 6267} {"train_loss": -27.668781280517578, "global_step": 520216, "epoch": 6267} {"train_loss": -27.547992706298828, "global_step": 520217, "epoch": 6267} {"train_loss": -27.765161514282227, "global_step": 520218, "epoch": 6267} {"train_loss": -27.76094627380371, "global_step": 520219, "epoch": 6267} {"train_loss": -27.3668155670166, "global_step": 520220, "epoch": 6267} {"train_loss": -27.670654296875, "global_step": 520221, "epoch": 6267} {"train_loss": -27.7585391998291, "global_step": 520222, "epoch": 6267} {"train_loss": -27.60581398010254, "global_step": 520223, "epoch": 6267} {"train_loss": -27.435056686401367, "global_step": 520224, "epoch": 6267} {"train_loss": -27.725690841674805, "global_step": 520225, "epoch": 6267} {"train_loss": -27.54117774963379, "global_step": 520226, "epoch": 6267} {"train_loss": -27.524066925048828, "global_step": 520227, "epoch": 6267} {"train_loss": -27.281635284423828, "global_step": 520228, "epoch": 6267} {"train_loss": -27.624805450439453, "global_step": 520229, "epoch": 6267} {"train_loss": -27.7960147857666, "global_step": 520230, "epoch": 6267} {"train_loss": -27.537769317626953, "global_step": 520231, "epoch": 6267} {"train_loss": -27.673419952392578, "global_step": 520232, "epoch": 6267} {"train_loss": -27.73370361328125, "global_step": 520233, "epoch": 6267} {"train_loss": -27.15675163269043, "global_step": 520234, "epoch": 6267} {"train_loss": -27.848676681518555, "global_step": 520235, "epoch": 6267} {"train_loss": -27.54892921447754, "global_step": 520236, "epoch": 6267} {"train_loss": -27.71832847595215, "global_step": 520237, "epoch": 6267} {"train_loss": -27.287921905517578, "global_step": 520238, "epoch": 6267} {"train_loss": -27.7576904296875, "global_step": 520239, "epoch": 6267} {"train_loss": -27.776397705078125, "global_step": 520240, "epoch": 6267} {"train_loss": -27.511646270751953, "global_step": 520241, "epoch": 6267} {"train_loss": -27.453643798828125, "global_step": 520242, "epoch": 6267} {"train_loss": -27.44643997284303, "global_step": 520243, "epoch": 6267, "val_loss": 6584882.0} {"train_loss": -26.755828857421875, "global_step": 520244, "epoch": 6268} {"train_loss": -25.862751007080078, "global_step": 520245, "epoch": 6268} {"train_loss": -26.169137954711914, "global_step": 520246, "epoch": 6268} {"train_loss": -26.920928955078125, "global_step": 520247, "epoch": 6268} {"train_loss": -26.48719596862793, "global_step": 520248, "epoch": 6268} {"train_loss": -26.47725486755371, "global_step": 520249, "epoch": 6268} {"train_loss": -25.519271850585938, "global_step": 520250, "epoch": 6268} {"train_loss": -25.695968627929688, "global_step": 520251, "epoch": 6268} {"train_loss": -27.08754539489746, "global_step": 520252, "epoch": 6268} {"train_loss": -26.240339279174805, "global_step": 520253, "epoch": 6268} {"train_loss": -26.05316734313965, "global_step": 520254, "epoch": 6268} {"train_loss": -26.8656005859375, "global_step": 520255, "epoch": 6268} {"train_loss": -26.4329776763916, "global_step": 520256, "epoch": 6268} {"train_loss": -26.746274948120117, "global_step": 520257, "epoch": 6268} {"train_loss": -26.147384643554688, "global_step": 520258, "epoch": 6268} {"train_loss": -26.977100372314453, "global_step": 520259, "epoch": 6268} {"train_loss": -26.8720645904541, "global_step": 520260, "epoch": 6268} {"train_loss": -27.185016632080078, "global_step": 520261, "epoch": 6268} {"train_loss": -27.084985733032227, "global_step": 520262, "epoch": 6268} {"train_loss": -27.158966064453125, "global_step": 520263, "epoch": 6268} {"train_loss": -27.454320907592773, "global_step": 520264, "epoch": 6268} {"train_loss": -27.46358299255371, "global_step": 520265, "epoch": 6268} {"train_loss": -26.97298240661621, "global_step": 520266, "epoch": 6268} {"train_loss": -27.38591957092285, "global_step": 520267, "epoch": 6268} {"train_loss": -27.3182373046875, "global_step": 520268, "epoch": 6268} {"train_loss": -27.28738784790039, "global_step": 520269, "epoch": 6268} {"train_loss": -26.95075035095215, "global_step": 520270, "epoch": 6268} {"train_loss": -27.635358810424805, "global_step": 520271, "epoch": 6268} {"train_loss": -27.147567749023438, "global_step": 520272, "epoch": 6268} {"train_loss": -27.789915084838867, "global_step": 520273, "epoch": 6268} {"train_loss": -27.19032096862793, "global_step": 520274, "epoch": 6268} {"train_loss": -27.349674224853516, "global_step": 520275, "epoch": 6268} {"train_loss": -27.38079833984375, "global_step": 520276, "epoch": 6268} {"train_loss": -27.277318954467773, "global_step": 520277, "epoch": 6268} {"train_loss": -27.153539657592773, "global_step": 520278, "epoch": 6268} {"train_loss": -27.478525161743164, "global_step": 520279, "epoch": 6268} {"train_loss": -27.247289657592773, "global_step": 520280, "epoch": 6268} {"train_loss": -27.466571807861328, "global_step": 520281, "epoch": 6268} {"train_loss": -27.325641632080078, "global_step": 520282, "epoch": 6268} {"train_loss": -27.471622467041016, "global_step": 520283, "epoch": 6268} {"train_loss": -27.571989059448242, "global_step": 520284, "epoch": 6268} {"train_loss": -27.608945846557617, "global_step": 520285, "epoch": 6268} {"train_loss": -27.4183292388916, "global_step": 520286, "epoch": 6268} {"train_loss": -27.65399169921875, "global_step": 520287, "epoch": 6268} {"train_loss": -27.177953720092773, "global_step": 520288, "epoch": 6268} {"train_loss": -27.689645767211914, "global_step": 520289, "epoch": 6268} {"train_loss": -27.605438232421875, "global_step": 520290, "epoch": 6268} {"train_loss": -27.550159454345703, "global_step": 520291, "epoch": 6268} {"train_loss": -27.470901489257812, "global_step": 520292, "epoch": 6268} {"train_loss": -27.9009952545166, "global_step": 520293, "epoch": 6268} {"train_loss": -27.522382736206055, "global_step": 520294, "epoch": 6268} {"train_loss": -27.57398796081543, "global_step": 520295, "epoch": 6268} {"train_loss": -27.60064697265625, "global_step": 520296, "epoch": 6268} {"train_loss": -27.491586685180664, "global_step": 520297, "epoch": 6268} {"train_loss": -27.719411849975586, "global_step": 520298, "epoch": 6268} {"train_loss": -27.770883560180664, "global_step": 520299, "epoch": 6268} {"train_loss": -27.34493064880371, "global_step": 520300, "epoch": 6268} {"train_loss": -27.735105514526367, "global_step": 520301, "epoch": 6268} {"train_loss": -27.56715202331543, "global_step": 520302, "epoch": 6268} {"train_loss": -27.950529098510742, "global_step": 520303, "epoch": 6268} {"train_loss": -27.87318229675293, "global_step": 520304, "epoch": 6268} {"train_loss": -27.48822593688965, "global_step": 520305, "epoch": 6268} {"train_loss": -27.542072296142578, "global_step": 520306, "epoch": 6268} {"train_loss": -27.707778930664062, "global_step": 520307, "epoch": 6268} {"train_loss": -27.243988037109375, "global_step": 520308, "epoch": 6268} {"train_loss": -26.917236328125, "global_step": 520309, "epoch": 6268} {"train_loss": -26.608938217163086, "global_step": 520310, "epoch": 6268} {"train_loss": -27.790014266967773, "global_step": 520311, "epoch": 6268} {"train_loss": -27.412036895751953, "global_step": 520312, "epoch": 6268} {"train_loss": -27.19024085998535, "global_step": 520313, "epoch": 6268} {"train_loss": -27.27656364440918, "global_step": 520314, "epoch": 6268} {"train_loss": -27.277667999267578, "global_step": 520315, "epoch": 6268} {"train_loss": -27.265172958374023, "global_step": 520316, "epoch": 6268} {"train_loss": -27.334442138671875, "global_step": 520317, "epoch": 6268} {"train_loss": -27.001922607421875, "global_step": 520318, "epoch": 6268} {"train_loss": -27.40512466430664, "global_step": 520319, "epoch": 6268} {"train_loss": -27.219079971313477, "global_step": 520320, "epoch": 6268} {"train_loss": -27.788843154907227, "global_step": 520321, "epoch": 6268} {"train_loss": -27.3540096282959, "global_step": 520322, "epoch": 6268} {"train_loss": -27.41786766052246, "global_step": 520323, "epoch": 6268} {"train_loss": -27.43195152282715, "global_step": 520324, "epoch": 6268} {"train_loss": -27.721271514892578, "global_step": 520325, "epoch": 6268} {"train_loss": -27.22712103142796, "global_step": 520326, "epoch": 6268, "val_loss": 6549360.0} {"train_loss": -27.099964141845703, "global_step": 520327, "epoch": 6269} {"train_loss": -26.77089500427246, "global_step": 520328, "epoch": 6269} {"train_loss": -26.504098892211914, "global_step": 520329, "epoch": 6269} {"train_loss": -26.953039169311523, "global_step": 520330, "epoch": 6269} {"train_loss": -27.463714599609375, "global_step": 520331, "epoch": 6269} {"train_loss": -27.048513412475586, "global_step": 520332, "epoch": 6269} {"train_loss": -27.556074142456055, "global_step": 520333, "epoch": 6269} {"train_loss": -27.29644775390625, "global_step": 520334, "epoch": 6269} {"train_loss": -27.2600040435791, "global_step": 520335, "epoch": 6269} {"train_loss": -27.272781372070312, "global_step": 520336, "epoch": 6269} {"train_loss": -26.988845825195312, "global_step": 520337, "epoch": 6269} {"train_loss": -27.4808292388916, "global_step": 520338, "epoch": 6269} {"train_loss": -27.22355079650879, "global_step": 520339, "epoch": 6269} {"train_loss": -27.355615615844727, "global_step": 520340, "epoch": 6269} {"train_loss": -27.34515953063965, "global_step": 520341, "epoch": 6269} {"train_loss": -27.668493270874023, "global_step": 520342, "epoch": 6269} {"train_loss": -27.265304565429688, "global_step": 520343, "epoch": 6269} {"train_loss": -27.543655395507812, "global_step": 520344, "epoch": 6269} {"train_loss": -27.284616470336914, "global_step": 520345, "epoch": 6269} {"train_loss": -27.005231857299805, "global_step": 520346, "epoch": 6269} {"train_loss": -27.444599151611328, "global_step": 520347, "epoch": 6269} {"train_loss": -27.5570011138916, "global_step": 520348, "epoch": 6269} {"train_loss": -27.581329345703125, "global_step": 520349, "epoch": 6269} {"train_loss": -27.6131649017334, "global_step": 520350, "epoch": 6269} {"train_loss": -27.696908950805664, "global_step": 520351, "epoch": 6269} {"train_loss": -27.875415802001953, "global_step": 520352, "epoch": 6269} {"train_loss": -27.548568725585938, "global_step": 520353, "epoch": 6269} {"train_loss": -27.621490478515625, "global_step": 520354, "epoch": 6269} {"train_loss": -27.4505615234375, "global_step": 520355, "epoch": 6269} {"train_loss": -27.631046295166016, "global_step": 520356, "epoch": 6269} {"train_loss": -27.65985107421875, "global_step": 520357, "epoch": 6269} {"train_loss": -27.78505516052246, "global_step": 520358, "epoch": 6269} {"train_loss": -27.386503219604492, "global_step": 520359, "epoch": 6269} {"train_loss": -27.85736083984375, "global_step": 520360, "epoch": 6269} {"train_loss": -27.413251876831055, "global_step": 520361, "epoch": 6269} {"train_loss": -27.968259811401367, "global_step": 520362, "epoch": 6269} {"train_loss": -27.922948837280273, "global_step": 520363, "epoch": 6269} {"train_loss": -27.68287467956543, "global_step": 520364, "epoch": 6269} {"train_loss": -27.587080001831055, "global_step": 520365, "epoch": 6269} {"train_loss": -27.478017807006836, "global_step": 520366, "epoch": 6269} {"train_loss": -27.386615753173828, "global_step": 520367, "epoch": 6269} {"train_loss": -27.83025550842285, "global_step": 520368, "epoch": 6269} {"train_loss": -27.73459243774414, "global_step": 520369, "epoch": 6269} {"train_loss": -28.173696517944336, "global_step": 520370, "epoch": 6269} {"train_loss": -27.78449058532715, "global_step": 520371, "epoch": 6269} {"train_loss": -27.56450843811035, "global_step": 520372, "epoch": 6269} {"train_loss": -27.53204345703125, "global_step": 520373, "epoch": 6269} {"train_loss": -27.762113571166992, "global_step": 520374, "epoch": 6269} {"train_loss": -27.247446060180664, "global_step": 520375, "epoch": 6269} {"train_loss": -27.96380615234375, "global_step": 520376, "epoch": 6269} {"train_loss": -27.851764678955078, "global_step": 520377, "epoch": 6269} {"train_loss": -27.793827056884766, "global_step": 520378, "epoch": 6269} {"train_loss": -27.070348739624023, "global_step": 520379, "epoch": 6269} {"train_loss": -27.50397300720215, "global_step": 520380, "epoch": 6269} {"train_loss": -27.532825469970703, "global_step": 520381, "epoch": 6269} {"train_loss": -27.47975730895996, "global_step": 520382, "epoch": 6269} {"train_loss": -27.6080265045166, "global_step": 520383, "epoch": 6269} {"train_loss": -27.524158477783203, "global_step": 520384, "epoch": 6269} {"train_loss": -27.462003707885742, "global_step": 520385, "epoch": 6269} {"train_loss": -27.532989501953125, "global_step": 520386, "epoch": 6269} {"train_loss": -27.559066772460938, "global_step": 520387, "epoch": 6269} {"train_loss": -27.552764892578125, "global_step": 520388, "epoch": 6269} {"train_loss": -27.295373916625977, "global_step": 520389, "epoch": 6269} {"train_loss": -26.471235275268555, "global_step": 520390, "epoch": 6269} {"train_loss": -26.990625381469727, "global_step": 520391, "epoch": 6269} {"train_loss": -27.256000518798828, "global_step": 520392, "epoch": 6269} {"train_loss": -27.588958740234375, "global_step": 520393, "epoch": 6269} {"train_loss": -27.309696197509766, "global_step": 520394, "epoch": 6269} {"train_loss": -27.28899574279785, "global_step": 520395, "epoch": 6269} {"train_loss": -27.324872970581055, "global_step": 520396, "epoch": 6269} {"train_loss": -27.436033248901367, "global_step": 520397, "epoch": 6269} {"train_loss": -27.203094482421875, "global_step": 520398, "epoch": 6269} {"train_loss": -27.2578125, "global_step": 520399, "epoch": 6269} {"train_loss": -26.864057540893555, "global_step": 520400, "epoch": 6269} {"train_loss": -27.67612648010254, "global_step": 520401, "epoch": 6269} {"train_loss": -27.321069717407227, "global_step": 520402, "epoch": 6269} {"train_loss": -27.55035400390625, "global_step": 520403, "epoch": 6269} {"train_loss": -27.491174697875977, "global_step": 520404, "epoch": 6269} {"train_loss": -27.260190963745117, "global_step": 520405, "epoch": 6269} {"train_loss": -27.24354362487793, "global_step": 520406, "epoch": 6269} {"train_loss": -27.311126708984375, "global_step": 520407, "epoch": 6269} {"train_loss": -27.33845329284668, "global_step": 520408, "epoch": 6269} {"train_loss": -27.448980997843915, "global_step": 520409, "epoch": 6269, "val_loss": 6632043.5} {"train_loss": -26.64747428894043, "global_step": 520410, "epoch": 6270} {"train_loss": -26.76511001586914, "global_step": 520411, "epoch": 6270} {"train_loss": -26.871000289916992, "global_step": 520412, "epoch": 6270} {"train_loss": -26.64825439453125, "global_step": 520413, "epoch": 6270} {"train_loss": -27.164173126220703, "global_step": 520414, "epoch": 6270} {"train_loss": -26.685026168823242, "global_step": 520415, "epoch": 6270} {"train_loss": -26.545429229736328, "global_step": 520416, "epoch": 6270} {"train_loss": -27.26392936706543, "global_step": 520417, "epoch": 6270} {"train_loss": -27.14666175842285, "global_step": 520418, "epoch": 6270} {"train_loss": -27.09030532836914, "global_step": 520419, "epoch": 6270} {"train_loss": -27.239105224609375, "global_step": 520420, "epoch": 6270} {"train_loss": -26.7286376953125, "global_step": 520421, "epoch": 6270} {"train_loss": -26.83794593811035, "global_step": 520422, "epoch": 6270} {"train_loss": -27.341299057006836, "global_step": 520423, "epoch": 6270} {"train_loss": -26.633447647094727, "global_step": 520424, "epoch": 6270} {"train_loss": -27.41180992126465, "global_step": 520425, "epoch": 6270} {"train_loss": -26.71150016784668, "global_step": 520426, "epoch": 6270} {"train_loss": -27.270734786987305, "global_step": 520427, "epoch": 6270} {"train_loss": -27.22794532775879, "global_step": 520428, "epoch": 6270} {"train_loss": -27.1556396484375, "global_step": 520429, "epoch": 6270} {"train_loss": -27.15608024597168, "global_step": 520430, "epoch": 6270} {"train_loss": -27.2061824798584, "global_step": 520431, "epoch": 6270} {"train_loss": -27.440298080444336, "global_step": 520432, "epoch": 6270} {"train_loss": -27.46238136291504, "global_step": 520433, "epoch": 6270} {"train_loss": -27.301603317260742, "global_step": 520434, "epoch": 6270} {"train_loss": -27.258649826049805, "global_step": 520435, "epoch": 6270} {"train_loss": -27.1635684967041, "global_step": 520436, "epoch": 6270} {"train_loss": -27.6269474029541, "global_step": 520437, "epoch": 6270} {"train_loss": -27.300262451171875, "global_step": 520438, "epoch": 6270} {"train_loss": -27.175100326538086, "global_step": 520439, "epoch": 6270} {"train_loss": -27.628925323486328, "global_step": 520440, "epoch": 6270} {"train_loss": -27.362781524658203, "global_step": 520441, "epoch": 6270} {"train_loss": -27.600019454956055, "global_step": 520442, "epoch": 6270} {"train_loss": -27.577041625976562, "global_step": 520443, "epoch": 6270} {"train_loss": -27.600065231323242, "global_step": 520444, "epoch": 6270} {"train_loss": -27.634246826171875, "global_step": 520445, "epoch": 6270} {"train_loss": -27.406158447265625, "global_step": 520446, "epoch": 6270} {"train_loss": -27.64386558532715, "global_step": 520447, "epoch": 6270} {"train_loss": -27.192365646362305, "global_step": 520448, "epoch": 6270} {"train_loss": -27.806577682495117, "global_step": 520449, "epoch": 6270} {"train_loss": -27.4299259185791, "global_step": 520450, "epoch": 6270} {"train_loss": -27.1594295501709, "global_step": 520451, "epoch": 6270} {"train_loss": -27.3541259765625, "global_step": 520452, "epoch": 6270} {"train_loss": -27.466842651367188, "global_step": 520453, "epoch": 6270} {"train_loss": -27.786285400390625, "global_step": 520454, "epoch": 6270} {"train_loss": -27.62958335876465, "global_step": 520455, "epoch": 6270} {"train_loss": -27.33747673034668, "global_step": 520456, "epoch": 6270} {"train_loss": -27.72954750061035, "global_step": 520457, "epoch": 6270} {"train_loss": -27.446949005126953, "global_step": 520458, "epoch": 6270} {"train_loss": -27.552509307861328, "global_step": 520459, "epoch": 6270} {"train_loss": -27.3919620513916, "global_step": 520460, "epoch": 6270} {"train_loss": -27.632923126220703, "global_step": 520461, "epoch": 6270} {"train_loss": -27.711706161499023, "global_step": 520462, "epoch": 6270} {"train_loss": -27.353113174438477, "global_step": 520463, "epoch": 6270} {"train_loss": -27.557880401611328, "global_step": 520464, "epoch": 6270} {"train_loss": -27.180679321289062, "global_step": 520465, "epoch": 6270} {"train_loss": -27.859088897705078, "global_step": 520466, "epoch": 6270} {"train_loss": -27.43487548828125, "global_step": 520467, "epoch": 6270} {"train_loss": -27.394012451171875, "global_step": 520468, "epoch": 6270} {"train_loss": -27.498022079467773, "global_step": 520469, "epoch": 6270} {"train_loss": -27.994611740112305, "global_step": 520470, "epoch": 6270} {"train_loss": -27.80231285095215, "global_step": 520471, "epoch": 6270} {"train_loss": -27.556842803955078, "global_step": 520472, "epoch": 6270} {"train_loss": -27.079792022705078, "global_step": 520473, "epoch": 6270} {"train_loss": -27.685367584228516, "global_step": 520474, "epoch": 6270} {"train_loss": -27.78704261779785, "global_step": 520475, "epoch": 6270} {"train_loss": -26.985889434814453, "global_step": 520476, "epoch": 6270} {"train_loss": -27.496442794799805, "global_step": 520477, "epoch": 6270} {"train_loss": -27.575164794921875, "global_step": 520478, "epoch": 6270} {"train_loss": -27.138757705688477, "global_step": 520479, "epoch": 6270} {"train_loss": -27.438528060913086, "global_step": 520480, "epoch": 6270} {"train_loss": -27.101734161376953, "global_step": 520481, "epoch": 6270} {"train_loss": -27.542388916015625, "global_step": 520482, "epoch": 6270} {"train_loss": -27.117307662963867, "global_step": 520483, "epoch": 6270} {"train_loss": -27.447568893432617, "global_step": 520484, "epoch": 6270} {"train_loss": -27.1694393157959, "global_step": 520485, "epoch": 6270} {"train_loss": -27.169836044311523, "global_step": 520486, "epoch": 6270} {"train_loss": -27.533405303955078, "global_step": 520487, "epoch": 6270} {"train_loss": -27.75885009765625, "global_step": 520488, "epoch": 6270} {"train_loss": -27.333343505859375, "global_step": 520489, "epoch": 6270} {"train_loss": -27.634540557861328, "global_step": 520490, "epoch": 6270} {"train_loss": -27.237375259399414, "global_step": 520491, "epoch": 6270} {"train_loss": -27.352409753454737, "global_step": 520492, "epoch": 6270, "val_loss": 6695291.0} {"train_loss": -26.462827682495117, "global_step": 520493, "epoch": 6271} {"train_loss": -26.587421417236328, "global_step": 520494, "epoch": 6271} {"train_loss": -27.237512588500977, "global_step": 520495, "epoch": 6271} {"train_loss": -26.413915634155273, "global_step": 520496, "epoch": 6271} {"train_loss": -27.0091495513916, "global_step": 520497, "epoch": 6271} {"train_loss": -26.79778480529785, "global_step": 520498, "epoch": 6271} {"train_loss": -27.089746475219727, "global_step": 520499, "epoch": 6271} {"train_loss": -27.329273223876953, "global_step": 520500, "epoch": 6271} {"train_loss": -27.195966720581055, "global_step": 520501, "epoch": 6271} {"train_loss": -27.45608901977539, "global_step": 520502, "epoch": 6271} {"train_loss": -27.29951286315918, "global_step": 520503, "epoch": 6271} {"train_loss": -27.501794815063477, "global_step": 520504, "epoch": 6271} {"train_loss": -27.903852462768555, "global_step": 520505, "epoch": 6271} {"train_loss": -27.375308990478516, "global_step": 520506, "epoch": 6271} {"train_loss": -27.2091007232666, "global_step": 520507, "epoch": 6271} {"train_loss": -27.398548126220703, "global_step": 520508, "epoch": 6271} {"train_loss": -27.415494918823242, "global_step": 520509, "epoch": 6271} {"train_loss": -27.141271591186523, "global_step": 520510, "epoch": 6271} {"train_loss": -27.42225456237793, "global_step": 520511, "epoch": 6271} {"train_loss": -27.379474639892578, "global_step": 520512, "epoch": 6271} {"train_loss": -27.295942306518555, "global_step": 520513, "epoch": 6271} {"train_loss": -27.4315185546875, "global_step": 520514, "epoch": 6271} {"train_loss": -27.488412857055664, "global_step": 520515, "epoch": 6271} {"train_loss": -27.329090118408203, "global_step": 520516, "epoch": 6271} {"train_loss": -27.409948348999023, "global_step": 520517, "epoch": 6271} {"train_loss": -27.726043701171875, "global_step": 520518, "epoch": 6271} {"train_loss": -27.343900680541992, "global_step": 520519, "epoch": 6271} {"train_loss": -27.97340202331543, "global_step": 520520, "epoch": 6271} {"train_loss": -27.596155166625977, "global_step": 520521, "epoch": 6271} {"train_loss": -27.836307525634766, "global_step": 520522, "epoch": 6271} {"train_loss": -27.341028213500977, "global_step": 520523, "epoch": 6271} {"train_loss": -27.702356338500977, "global_step": 520524, "epoch": 6271} {"train_loss": -27.737262725830078, "global_step": 520525, "epoch": 6271} {"train_loss": -27.72932243347168, "global_step": 520526, "epoch": 6271} {"train_loss": -27.641590118408203, "global_step": 520527, "epoch": 6271} {"train_loss": -28.065582275390625, "global_step": 520528, "epoch": 6271} {"train_loss": -27.34162712097168, "global_step": 520529, "epoch": 6271} {"train_loss": -27.66914176940918, "global_step": 520530, "epoch": 6271} {"train_loss": -27.20002555847168, "global_step": 520531, "epoch": 6271} {"train_loss": -27.64515495300293, "global_step": 520532, "epoch": 6271} {"train_loss": -27.55194664001465, "global_step": 520533, "epoch": 6271} {"train_loss": -28.124420166015625, "global_step": 520534, "epoch": 6271} {"train_loss": -27.66196632385254, "global_step": 520535, "epoch": 6271} {"train_loss": -27.722869873046875, "global_step": 520536, "epoch": 6271} {"train_loss": -27.821210861206055, "global_step": 520537, "epoch": 6271} {"train_loss": -28.03584098815918, "global_step": 520538, "epoch": 6271} {"train_loss": -27.91998291015625, "global_step": 520539, "epoch": 6271} {"train_loss": -27.549463272094727, "global_step": 520540, "epoch": 6271} {"train_loss": -27.83917808532715, "global_step": 520541, "epoch": 6271} {"train_loss": -28.059925079345703, "global_step": 520542, "epoch": 6271} {"train_loss": -27.467493057250977, "global_step": 520543, "epoch": 6271} {"train_loss": -27.523237228393555, "global_step": 520544, "epoch": 6271} {"train_loss": -27.81666374206543, "global_step": 520545, "epoch": 6271} {"train_loss": -27.9014892578125, "global_step": 520546, "epoch": 6271} {"train_loss": -27.634485244750977, "global_step": 520547, "epoch": 6271} {"train_loss": -27.70696449279785, "global_step": 520548, "epoch": 6271} {"train_loss": -27.566925048828125, "global_step": 520549, "epoch": 6271} {"train_loss": -27.438873291015625, "global_step": 520550, "epoch": 6271} {"train_loss": -27.212493896484375, "global_step": 520551, "epoch": 6271} {"train_loss": -26.912281036376953, "global_step": 520552, "epoch": 6271} {"train_loss": -27.062732696533203, "global_step": 520553, "epoch": 6271} {"train_loss": -27.314783096313477, "global_step": 520554, "epoch": 6271} {"train_loss": -27.818195343017578, "global_step": 520555, "epoch": 6271} {"train_loss": -27.46405029296875, "global_step": 520556, "epoch": 6271} {"train_loss": -27.255096435546875, "global_step": 520557, "epoch": 6271} {"train_loss": -27.078779220581055, "global_step": 520558, "epoch": 6271} {"train_loss": -27.112934112548828, "global_step": 520559, "epoch": 6271} {"train_loss": -27.167638778686523, "global_step": 520560, "epoch": 6271} {"train_loss": -27.660367965698242, "global_step": 520561, "epoch": 6271} {"train_loss": -27.48567008972168, "global_step": 520562, "epoch": 6271} {"train_loss": -27.441328048706055, "global_step": 520563, "epoch": 6271} {"train_loss": -27.62909507751465, "global_step": 520564, "epoch": 6271} {"train_loss": -27.578710556030273, "global_step": 520565, "epoch": 6271} {"train_loss": -27.453845977783203, "global_step": 520566, "epoch": 6271} {"train_loss": -27.7202205657959, "global_step": 520567, "epoch": 6271} {"train_loss": -27.43609046936035, "global_step": 520568, "epoch": 6271} {"train_loss": -27.307022094726562, "global_step": 520569, "epoch": 6271} {"train_loss": -28.027013778686523, "global_step": 520570, "epoch": 6271} {"train_loss": -27.531936645507812, "global_step": 520571, "epoch": 6271} {"train_loss": -27.459808349609375, "global_step": 520572, "epoch": 6271} {"train_loss": -27.678800582885742, "global_step": 520573, "epoch": 6271} {"train_loss": -27.449792861938477, "global_step": 520574, "epoch": 6271} {"train_loss": -27.465520192341632, "global_step": 520575, "epoch": 6271, "val_loss": 6692146.5} {"train_loss": -26.98760986328125, "global_step": 520576, "epoch": 6272} {"train_loss": -26.800703048706055, "global_step": 520577, "epoch": 6272} {"train_loss": -26.986297607421875, "global_step": 520578, "epoch": 6272} {"train_loss": -27.06898307800293, "global_step": 520579, "epoch": 6272} {"train_loss": -26.56110191345215, "global_step": 520580, "epoch": 6272} {"train_loss": -27.194189071655273, "global_step": 520581, "epoch": 6272} {"train_loss": -26.91132164001465, "global_step": 520582, "epoch": 6272} {"train_loss": -27.139123916625977, "global_step": 520583, "epoch": 6272} {"train_loss": -27.3306884765625, "global_step": 520584, "epoch": 6272} {"train_loss": -27.601959228515625, "global_step": 520585, "epoch": 6272} {"train_loss": -27.483591079711914, "global_step": 520586, "epoch": 6272} {"train_loss": -27.366348266601562, "global_step": 520587, "epoch": 6272} {"train_loss": -26.819427490234375, "global_step": 520588, "epoch": 6272} {"train_loss": -27.3221378326416, "global_step": 520589, "epoch": 6272} {"train_loss": -27.178518295288086, "global_step": 520590, "epoch": 6272} {"train_loss": -27.014129638671875, "global_step": 520591, "epoch": 6272} {"train_loss": -27.315641403198242, "global_step": 520592, "epoch": 6272} {"train_loss": -27.21613883972168, "global_step": 520593, "epoch": 6272} {"train_loss": -27.012842178344727, "global_step": 520594, "epoch": 6272} {"train_loss": -27.336530685424805, "global_step": 520595, "epoch": 6272} {"train_loss": -27.128564834594727, "global_step": 520596, "epoch": 6272} {"train_loss": -27.636987686157227, "global_step": 520597, "epoch": 6272} {"train_loss": -27.07486915588379, "global_step": 520598, "epoch": 6272} {"train_loss": -27.476303100585938, "global_step": 520599, "epoch": 6272} {"train_loss": -27.294437408447266, "global_step": 520600, "epoch": 6272} {"train_loss": -27.7191219329834, "global_step": 520601, "epoch": 6272} {"train_loss": -27.294591903686523, "global_step": 520602, "epoch": 6272} {"train_loss": -27.715368270874023, "global_step": 520603, "epoch": 6272} {"train_loss": -27.27387046813965, "global_step": 520604, "epoch": 6272} {"train_loss": -27.489704132080078, "global_step": 520605, "epoch": 6272} {"train_loss": -27.119897842407227, "global_step": 520606, "epoch": 6272} {"train_loss": -27.46711540222168, "global_step": 520607, "epoch": 6272} {"train_loss": -27.537586212158203, "global_step": 520608, "epoch": 6272} {"train_loss": -27.389209747314453, "global_step": 520609, "epoch": 6272} {"train_loss": -27.162067413330078, "global_step": 520610, "epoch": 6272} {"train_loss": -27.394372940063477, "global_step": 520611, "epoch": 6272} {"train_loss": -27.474164962768555, "global_step": 520612, "epoch": 6272} {"train_loss": -27.59812355041504, "global_step": 520613, "epoch": 6272} {"train_loss": -27.130680084228516, "global_step": 520614, "epoch": 6272} {"train_loss": -27.16656494140625, "global_step": 520615, "epoch": 6272} {"train_loss": -27.412384033203125, "global_step": 520616, "epoch": 6272} {"train_loss": -27.42789649963379, "global_step": 520617, "epoch": 6272} {"train_loss": -27.507734298706055, "global_step": 520618, "epoch": 6272} {"train_loss": -27.72369956970215, "global_step": 520619, "epoch": 6272} {"train_loss": -27.83076286315918, "global_step": 520620, "epoch": 6272} {"train_loss": -27.54693031311035, "global_step": 520621, "epoch": 6272} {"train_loss": -27.853757858276367, "global_step": 520622, "epoch": 6272} {"train_loss": -27.338415145874023, "global_step": 520623, "epoch": 6272} {"train_loss": -27.181228637695312, "global_step": 520624, "epoch": 6272} {"train_loss": -27.4083194732666, "global_step": 520625, "epoch": 6272} {"train_loss": -27.581323623657227, "global_step": 520626, "epoch": 6272} {"train_loss": -28.04380226135254, "global_step": 520627, "epoch": 6272} {"train_loss": -27.703641891479492, "global_step": 520628, "epoch": 6272} {"train_loss": -27.5629825592041, "global_step": 520629, "epoch": 6272} {"train_loss": -27.436017990112305, "global_step": 520630, "epoch": 6272} {"train_loss": -27.87513542175293, "global_step": 520631, "epoch": 6272} {"train_loss": -27.199874877929688, "global_step": 520632, "epoch": 6272} {"train_loss": -27.412525177001953, "global_step": 520633, "epoch": 6272} {"train_loss": -27.638402938842773, "global_step": 520634, "epoch": 6272} {"train_loss": -27.857410430908203, "global_step": 520635, "epoch": 6272} {"train_loss": -27.944660186767578, "global_step": 520636, "epoch": 6272} {"train_loss": -27.88295555114746, "global_step": 520637, "epoch": 6272} {"train_loss": -27.6237735748291, "global_step": 520638, "epoch": 6272} {"train_loss": -27.756103515625, "global_step": 520639, "epoch": 6272} {"train_loss": -27.4028377532959, "global_step": 520640, "epoch": 6272} {"train_loss": -27.637460708618164, "global_step": 520641, "epoch": 6272} {"train_loss": -27.6361083984375, "global_step": 520642, "epoch": 6272} {"train_loss": -27.546661376953125, "global_step": 520643, "epoch": 6272} {"train_loss": -27.26789665222168, "global_step": 520644, "epoch": 6272} {"train_loss": -27.34339714050293, "global_step": 520645, "epoch": 6272} {"train_loss": -27.63065528869629, "global_step": 520646, "epoch": 6272} {"train_loss": -27.80694580078125, "global_step": 520647, "epoch": 6272} {"train_loss": -27.839242935180664, "global_step": 520648, "epoch": 6272} {"train_loss": -27.914587020874023, "global_step": 520649, "epoch": 6272} {"train_loss": -27.85419273376465, "global_step": 520650, "epoch": 6272} {"train_loss": -27.602697372436523, "global_step": 520651, "epoch": 6272} {"train_loss": -27.776321411132812, "global_step": 520652, "epoch": 6272} {"train_loss": -27.679738998413086, "global_step": 520653, "epoch": 6272} {"train_loss": -27.65509605407715, "global_step": 520654, "epoch": 6272} {"train_loss": -28.0357666015625, "global_step": 520655, "epoch": 6272} {"train_loss": -27.792282104492188, "global_step": 520656, "epoch": 6272} {"train_loss": -27.014007568359375, "global_step": 520657, "epoch": 6272} {"train_loss": -27.4395259259695, "global_step": 520658, "epoch": 6272, "val_loss": 6623937.0} {"train_loss": -25.455121994018555, "global_step": 520659, "epoch": 6273} {"train_loss": -25.90297508239746, "global_step": 520660, "epoch": 6273} {"train_loss": -26.594709396362305, "global_step": 520661, "epoch": 6273} {"train_loss": -25.45618438720703, "global_step": 520662, "epoch": 6273} {"train_loss": -26.252044677734375, "global_step": 520663, "epoch": 6273} {"train_loss": -26.427865982055664, "global_step": 520664, "epoch": 6273} {"train_loss": -26.884540557861328, "global_step": 520665, "epoch": 6273} {"train_loss": -27.053647994995117, "global_step": 520666, "epoch": 6273} {"train_loss": -26.845947265625, "global_step": 520667, "epoch": 6273} {"train_loss": -26.97412109375, "global_step": 520668, "epoch": 6273} {"train_loss": -26.891767501831055, "global_step": 520669, "epoch": 6273} {"train_loss": -26.62284278869629, "global_step": 520670, "epoch": 6273} {"train_loss": -27.005361557006836, "global_step": 520671, "epoch": 6273} {"train_loss": -27.126489639282227, "global_step": 520672, "epoch": 6273} {"train_loss": -27.098651885986328, "global_step": 520673, "epoch": 6273} {"train_loss": -26.71078872680664, "global_step": 520674, "epoch": 6273} {"train_loss": -26.865447998046875, "global_step": 520675, "epoch": 6273} {"train_loss": -27.28818702697754, "global_step": 520676, "epoch": 6273} {"train_loss": -27.19959831237793, "global_step": 520677, "epoch": 6273} {"train_loss": -27.2349910736084, "global_step": 520678, "epoch": 6273} {"train_loss": -27.110944747924805, "global_step": 520679, "epoch": 6273} {"train_loss": -27.18790626525879, "global_step": 520680, "epoch": 6273} {"train_loss": -26.96908950805664, "global_step": 520681, "epoch": 6273} {"train_loss": -27.559751510620117, "global_step": 520682, "epoch": 6273} {"train_loss": -27.259963989257812, "global_step": 520683, "epoch": 6273} {"train_loss": -27.0694637298584, "global_step": 520684, "epoch": 6273} {"train_loss": -27.421972274780273, "global_step": 520685, "epoch": 6273} {"train_loss": -27.079666137695312, "global_step": 520686, "epoch": 6273} {"train_loss": -27.231653213500977, "global_step": 520687, "epoch": 6273} {"train_loss": -27.456335067749023, "global_step": 520688, "epoch": 6273} {"train_loss": -27.492755889892578, "global_step": 520689, "epoch": 6273} {"train_loss": -27.380054473876953, "global_step": 520690, "epoch": 6273} {"train_loss": -27.45179557800293, "global_step": 520691, "epoch": 6273} {"train_loss": -27.494287490844727, "global_step": 520692, "epoch": 6273} {"train_loss": -27.561010360717773, "global_step": 520693, "epoch": 6273} {"train_loss": -27.892200469970703, "global_step": 520694, "epoch": 6273} {"train_loss": -27.63642692565918, "global_step": 520695, "epoch": 6273} {"train_loss": -27.645750045776367, "global_step": 520696, "epoch": 6273} {"train_loss": -27.562376022338867, "global_step": 520697, "epoch": 6273} {"train_loss": -27.512073516845703, "global_step": 520698, "epoch": 6273} {"train_loss": -27.63703727722168, "global_step": 520699, "epoch": 6273} {"train_loss": -27.491125106811523, "global_step": 520700, "epoch": 6273} {"train_loss": -27.940814971923828, "global_step": 520701, "epoch": 6273} {"train_loss": -27.557722091674805, "global_step": 520702, "epoch": 6273} {"train_loss": -27.6798095703125, "global_step": 520703, "epoch": 6273} {"train_loss": -27.655195236206055, "global_step": 520704, "epoch": 6273} {"train_loss": -27.785741806030273, "global_step": 520705, "epoch": 6273} {"train_loss": -27.795841217041016, "global_step": 520706, "epoch": 6273} {"train_loss": -27.527984619140625, "global_step": 520707, "epoch": 6273} {"train_loss": -27.956527709960938, "global_step": 520708, "epoch": 6273} {"train_loss": -27.694578170776367, "global_step": 520709, "epoch": 6273} {"train_loss": -27.63770866394043, "global_step": 520710, "epoch": 6273} {"train_loss": -27.812442779541016, "global_step": 520711, "epoch": 6273} {"train_loss": -27.53553581237793, "global_step": 520712, "epoch": 6273} {"train_loss": -27.595869064331055, "global_step": 520713, "epoch": 6273} {"train_loss": -27.7204647064209, "global_step": 520714, "epoch": 6273} {"train_loss": -28.01569175720215, "global_step": 520715, "epoch": 6273} {"train_loss": -27.892059326171875, "global_step": 520716, "epoch": 6273} {"train_loss": -28.124588012695312, "global_step": 520717, "epoch": 6273} {"train_loss": -27.64348793029785, "global_step": 520718, "epoch": 6273} {"train_loss": -27.566015243530273, "global_step": 520719, "epoch": 6273} {"train_loss": -27.454816818237305, "global_step": 520720, "epoch": 6273} {"train_loss": -27.527257919311523, "global_step": 520721, "epoch": 6273} {"train_loss": -27.394330978393555, "global_step": 520722, "epoch": 6273} {"train_loss": -26.698774337768555, "global_step": 520723, "epoch": 6273} {"train_loss": -25.88006019592285, "global_step": 520724, "epoch": 6273} {"train_loss": -26.110034942626953, "global_step": 520725, "epoch": 6273} {"train_loss": -27.347570419311523, "global_step": 520726, "epoch": 6273} {"train_loss": -27.489545822143555, "global_step": 520727, "epoch": 6273} {"train_loss": -26.583337783813477, "global_step": 520728, "epoch": 6273} {"train_loss": -26.698347091674805, "global_step": 520729, "epoch": 6273} {"train_loss": -27.31426429748535, "global_step": 520730, "epoch": 6273} {"train_loss": -26.948965072631836, "global_step": 520731, "epoch": 6273} {"train_loss": -27.04645347595215, "global_step": 520732, "epoch": 6273} {"train_loss": -27.3712215423584, "global_step": 520733, "epoch": 6273} {"train_loss": -27.3824462890625, "global_step": 520734, "epoch": 6273} {"train_loss": -27.104522705078125, "global_step": 520735, "epoch": 6273} {"train_loss": -27.537755966186523, "global_step": 520736, "epoch": 6273} {"train_loss": -27.070119857788086, "global_step": 520737, "epoch": 6273} {"train_loss": -27.27567481994629, "global_step": 520738, "epoch": 6273} {"train_loss": -27.3818302154541, "global_step": 520739, "epoch": 6273} {"train_loss": -27.546411514282227, "global_step": 520740, "epoch": 6273} {"train_loss": -27.252414565488518, "global_step": 520741, "epoch": 6273, "val_loss": 6632068.5} {"train_loss": -26.901214599609375, "global_step": 520742, "epoch": 6274} {"train_loss": -26.74846839904785, "global_step": 520743, "epoch": 6274} {"train_loss": -26.508197784423828, "global_step": 520744, "epoch": 6274} {"train_loss": -26.6086483001709, "global_step": 520745, "epoch": 6274} {"train_loss": -26.45572280883789, "global_step": 520746, "epoch": 6274} {"train_loss": -26.978290557861328, "global_step": 520747, "epoch": 6274} {"train_loss": -26.980390548706055, "global_step": 520748, "epoch": 6274} {"train_loss": -26.7806396484375, "global_step": 520749, "epoch": 6274} {"train_loss": -27.059110641479492, "global_step": 520750, "epoch": 6274} {"train_loss": -27.62240982055664, "global_step": 520751, "epoch": 6274} {"train_loss": -26.758787155151367, "global_step": 520752, "epoch": 6274} {"train_loss": -27.235904693603516, "global_step": 520753, "epoch": 6274} {"train_loss": -26.99588966369629, "global_step": 520754, "epoch": 6274} {"train_loss": -26.80038833618164, "global_step": 520755, "epoch": 6274} {"train_loss": -27.37017250061035, "global_step": 520756, "epoch": 6274} {"train_loss": -27.67670249938965, "global_step": 520757, "epoch": 6274} {"train_loss": -27.505420684814453, "global_step": 520758, "epoch": 6274} {"train_loss": -27.252216339111328, "global_step": 520759, "epoch": 6274} {"train_loss": -27.343032836914062, "global_step": 520760, "epoch": 6274} {"train_loss": -27.48976707458496, "global_step": 520761, "epoch": 6274} {"train_loss": -27.454843521118164, "global_step": 520762, "epoch": 6274} {"train_loss": -27.72597312927246, "global_step": 520763, "epoch": 6274} {"train_loss": -27.483325958251953, "global_step": 520764, "epoch": 6274} {"train_loss": -27.6191463470459, "global_step": 520765, "epoch": 6274} {"train_loss": -27.947702407836914, "global_step": 520766, "epoch": 6274} {"train_loss": -27.47787857055664, "global_step": 520767, "epoch": 6274} {"train_loss": -27.667997360229492, "global_step": 520768, "epoch": 6274} {"train_loss": -27.3613338470459, "global_step": 520769, "epoch": 6274} {"train_loss": -27.6178035736084, "global_step": 520770, "epoch": 6274} {"train_loss": -27.417774200439453, "global_step": 520771, "epoch": 6274} {"train_loss": -27.792089462280273, "global_step": 520772, "epoch": 6274} {"train_loss": -27.652069091796875, "global_step": 520773, "epoch": 6274} {"train_loss": -28.05413818359375, "global_step": 520774, "epoch": 6274} {"train_loss": -27.755231857299805, "global_step": 520775, "epoch": 6274} {"train_loss": -27.50752067565918, "global_step": 520776, "epoch": 6274} {"train_loss": -27.871082305908203, "global_step": 520777, "epoch": 6274} {"train_loss": -27.651498794555664, "global_step": 520778, "epoch": 6274} {"train_loss": -27.589618682861328, "global_step": 520779, "epoch": 6274} {"train_loss": -27.623762130737305, "global_step": 520780, "epoch": 6274} {"train_loss": -27.874164581298828, "global_step": 520781, "epoch": 6274} {"train_loss": -27.607131958007812, "global_step": 520782, "epoch": 6274} {"train_loss": -27.69019889831543, "global_step": 520783, "epoch": 6274} {"train_loss": -27.697784423828125, "global_step": 520784, "epoch": 6274} {"train_loss": -27.338367462158203, "global_step": 520785, "epoch": 6274} {"train_loss": -27.76676368713379, "global_step": 520786, "epoch": 6274} {"train_loss": -27.625019073486328, "global_step": 520787, "epoch": 6274} {"train_loss": -27.959577560424805, "global_step": 520788, "epoch": 6274} {"train_loss": -27.543176651000977, "global_step": 520789, "epoch": 6274} {"train_loss": -27.601959228515625, "global_step": 520790, "epoch": 6274} {"train_loss": -27.64240837097168, "global_step": 520791, "epoch": 6274} {"train_loss": -27.441572189331055, "global_step": 520792, "epoch": 6274} {"train_loss": -28.049036026000977, "global_step": 520793, "epoch": 6274} {"train_loss": -27.738922119140625, "global_step": 520794, "epoch": 6274} {"train_loss": -27.637243270874023, "global_step": 520795, "epoch": 6274} {"train_loss": -27.729400634765625, "global_step": 520796, "epoch": 6274} {"train_loss": -27.221954345703125, "global_step": 520797, "epoch": 6274} {"train_loss": -27.444204330444336, "global_step": 520798, "epoch": 6274} {"train_loss": -26.946130752563477, "global_step": 520799, "epoch": 6274} {"train_loss": -26.44355583190918, "global_step": 520800, "epoch": 6274} {"train_loss": -27.495229721069336, "global_step": 520801, "epoch": 6274} {"train_loss": -27.66116714477539, "global_step": 520802, "epoch": 6274} {"train_loss": -26.66413688659668, "global_step": 520803, "epoch": 6274} {"train_loss": -27.752613067626953, "global_step": 520804, "epoch": 6274} {"train_loss": -27.2137393951416, "global_step": 520805, "epoch": 6274} {"train_loss": -27.342182159423828, "global_step": 520806, "epoch": 6274} {"train_loss": -27.81003761291504, "global_step": 520807, "epoch": 6274} {"train_loss": -27.5531063079834, "global_step": 520808, "epoch": 6274} {"train_loss": -27.612634658813477, "global_step": 520809, "epoch": 6274} {"train_loss": -27.215402603149414, "global_step": 520810, "epoch": 6274} {"train_loss": -27.07560157775879, "global_step": 520811, "epoch": 6274} {"train_loss": -26.712615966796875, "global_step": 520812, "epoch": 6274} {"train_loss": -26.86536979675293, "global_step": 520813, "epoch": 6274} {"train_loss": -27.007282257080078, "global_step": 520814, "epoch": 6274} {"train_loss": -27.32001304626465, "global_step": 520815, "epoch": 6274} {"train_loss": -27.14845085144043, "global_step": 520816, "epoch": 6274} {"train_loss": -27.071334838867188, "global_step": 520817, "epoch": 6274} {"train_loss": -27.233814239501953, "global_step": 520818, "epoch": 6274} {"train_loss": -27.224262237548828, "global_step": 520819, "epoch": 6274} {"train_loss": -27.105239868164062, "global_step": 520820, "epoch": 6274} {"train_loss": -27.013015747070312, "global_step": 520821, "epoch": 6274} {"train_loss": -27.105329513549805, "global_step": 520822, "epoch": 6274} {"train_loss": -27.515661239624023, "global_step": 520823, "epoch": 6274} {"train_loss": -27.35465047445642, "global_step": 520824, "epoch": 6274, "val_loss": 6460384.0} {"train_loss": -26.754281997680664, "global_step": 520825, "epoch": 6275} {"train_loss": -26.32867431640625, "global_step": 520826, "epoch": 6275} {"train_loss": -26.58167839050293, "global_step": 520827, "epoch": 6275} {"train_loss": -26.439422607421875, "global_step": 520828, "epoch": 6275} {"train_loss": -26.61380386352539, "global_step": 520829, "epoch": 6275} {"train_loss": -26.3704833984375, "global_step": 520830, "epoch": 6275} {"train_loss": -26.912687301635742, "global_step": 520831, "epoch": 6275} {"train_loss": -26.291015625, "global_step": 520832, "epoch": 6275} {"train_loss": -26.86386489868164, "global_step": 520833, "epoch": 6275} {"train_loss": -27.021154403686523, "global_step": 520834, "epoch": 6275} {"train_loss": -26.662450790405273, "global_step": 520835, "epoch": 6275} {"train_loss": -26.71906089782715, "global_step": 520836, "epoch": 6275} {"train_loss": -27.154184341430664, "global_step": 520837, "epoch": 6275} {"train_loss": -26.978910446166992, "global_step": 520838, "epoch": 6275} {"train_loss": -27.020856857299805, "global_step": 520839, "epoch": 6275} {"train_loss": -27.138334274291992, "global_step": 520840, "epoch": 6275} {"train_loss": -26.593896865844727, "global_step": 520841, "epoch": 6275} {"train_loss": -27.26957130432129, "global_step": 520842, "epoch": 6275} {"train_loss": -27.385129928588867, "global_step": 520843, "epoch": 6275} {"train_loss": -26.95513916015625, "global_step": 520844, "epoch": 6275} {"train_loss": -27.422378540039062, "global_step": 520845, "epoch": 6275} {"train_loss": -26.970754623413086, "global_step": 520846, "epoch": 6275} {"train_loss": -27.483579635620117, "global_step": 520847, "epoch": 6275} {"train_loss": -27.42213249206543, "global_step": 520848, "epoch": 6275} {"train_loss": -27.093549728393555, "global_step": 520849, "epoch": 6275} {"train_loss": -27.339309692382812, "global_step": 520850, "epoch": 6275} {"train_loss": -27.358997344970703, "global_step": 520851, "epoch": 6275} {"train_loss": -27.437719345092773, "global_step": 520852, "epoch": 6275} {"train_loss": -27.653173446655273, "global_step": 520853, "epoch": 6275} {"train_loss": -27.196191787719727, "global_step": 520854, "epoch": 6275} {"train_loss": -27.516204833984375, "global_step": 520855, "epoch": 6275} {"train_loss": -27.685821533203125, "global_step": 520856, "epoch": 6275} {"train_loss": -27.630456924438477, "global_step": 520857, "epoch": 6275} {"train_loss": -27.661890029907227, "global_step": 520858, "epoch": 6275} {"train_loss": -27.740880966186523, "global_step": 520859, "epoch": 6275} {"train_loss": -27.763517379760742, "global_step": 520860, "epoch": 6275} {"train_loss": -27.82081413269043, "global_step": 520861, "epoch": 6275} {"train_loss": -27.32523536682129, "global_step": 520862, "epoch": 6275} {"train_loss": -27.703033447265625, "global_step": 520863, "epoch": 6275} {"train_loss": -27.902990341186523, "global_step": 520864, "epoch": 6275} {"train_loss": -27.51409339904785, "global_step": 520865, "epoch": 6275} {"train_loss": -27.083566665649414, "global_step": 520866, "epoch": 6275} {"train_loss": -27.89690589904785, "global_step": 520867, "epoch": 6275} {"train_loss": -27.257654190063477, "global_step": 520868, "epoch": 6275} {"train_loss": -27.640933990478516, "global_step": 520869, "epoch": 6275} {"train_loss": -27.505552291870117, "global_step": 520870, "epoch": 6275} {"train_loss": -27.50233268737793, "global_step": 520871, "epoch": 6275} {"train_loss": -27.446664810180664, "global_step": 520872, "epoch": 6275} {"train_loss": -27.693639755249023, "global_step": 520873, "epoch": 6275} {"train_loss": -27.315692901611328, "global_step": 520874, "epoch": 6275} {"train_loss": -27.366443634033203, "global_step": 520875, "epoch": 6275} {"train_loss": -27.63313865661621, "global_step": 520876, "epoch": 6275} {"train_loss": -27.25372314453125, "global_step": 520877, "epoch": 6275} {"train_loss": -27.770099639892578, "global_step": 520878, "epoch": 6275} {"train_loss": -27.495939254760742, "global_step": 520879, "epoch": 6275} {"train_loss": -27.299774169921875, "global_step": 520880, "epoch": 6275} {"train_loss": -27.479217529296875, "global_step": 520881, "epoch": 6275} {"train_loss": -27.88972282409668, "global_step": 520882, "epoch": 6275} {"train_loss": -27.62265396118164, "global_step": 520883, "epoch": 6275} {"train_loss": -27.48819351196289, "global_step": 520884, "epoch": 6275} {"train_loss": -27.38349723815918, "global_step": 520885, "epoch": 6275} {"train_loss": -27.447607040405273, "global_step": 520886, "epoch": 6275} {"train_loss": -27.69775390625, "global_step": 520887, "epoch": 6275} {"train_loss": -27.21879005432129, "global_step": 520888, "epoch": 6275} {"train_loss": -27.750146865844727, "global_step": 520889, "epoch": 6275} {"train_loss": -27.81953239440918, "global_step": 520890, "epoch": 6275} {"train_loss": -27.700641632080078, "global_step": 520891, "epoch": 6275} {"train_loss": -27.657041549682617, "global_step": 520892, "epoch": 6275} {"train_loss": -27.901885986328125, "global_step": 520893, "epoch": 6275} {"train_loss": -27.816125869750977, "global_step": 520894, "epoch": 6275} {"train_loss": -27.57134437561035, "global_step": 520895, "epoch": 6275} {"train_loss": -27.351713180541992, "global_step": 520896, "epoch": 6275} {"train_loss": -27.502532958984375, "global_step": 520897, "epoch": 6275} {"train_loss": -26.9554500579834, "global_step": 520898, "epoch": 6275} {"train_loss": -27.406591415405273, "global_step": 520899, "epoch": 6275} {"train_loss": -26.748716354370117, "global_step": 520900, "epoch": 6275} {"train_loss": -27.338642120361328, "global_step": 520901, "epoch": 6275} {"train_loss": -27.708765029907227, "global_step": 520902, "epoch": 6275} {"train_loss": -27.42616844177246, "global_step": 520903, "epoch": 6275} {"train_loss": -27.564224243164062, "global_step": 520904, "epoch": 6275} {"train_loss": -27.50874137878418, "global_step": 520905, "epoch": 6275} {"train_loss": -27.598102569580078, "global_step": 520906, "epoch": 6275} {"train_loss": -27.34443055578025, "global_step": 520907, "epoch": 6275, "val_loss": 6645384.0} {"train_loss": -26.90413475036621, "global_step": 520908, "epoch": 6276} {"train_loss": -27.255407333374023, "global_step": 520909, "epoch": 6276} {"train_loss": -26.262958526611328, "global_step": 520910, "epoch": 6276} {"train_loss": -27.007247924804688, "global_step": 520911, "epoch": 6276} {"train_loss": -27.32392692565918, "global_step": 520912, "epoch": 6276} {"train_loss": -26.925046920776367, "global_step": 520913, "epoch": 6276} {"train_loss": -27.0506534576416, "global_step": 520914, "epoch": 6276} {"train_loss": -26.99358558654785, "global_step": 520915, "epoch": 6276} {"train_loss": -27.205036163330078, "global_step": 520916, "epoch": 6276} {"train_loss": -27.149246215820312, "global_step": 520917, "epoch": 6276} {"train_loss": -27.24574089050293, "global_step": 520918, "epoch": 6276} {"train_loss": -26.859235763549805, "global_step": 520919, "epoch": 6276} {"train_loss": -27.481719970703125, "global_step": 520920, "epoch": 6276} {"train_loss": -27.25824546813965, "global_step": 520921, "epoch": 6276} {"train_loss": -27.423437118530273, "global_step": 520922, "epoch": 6276} {"train_loss": -27.2332820892334, "global_step": 520923, "epoch": 6276} {"train_loss": -27.266788482666016, "global_step": 520924, "epoch": 6276} {"train_loss": -27.305606842041016, "global_step": 520925, "epoch": 6276} {"train_loss": -27.711933135986328, "global_step": 520926, "epoch": 6276} {"train_loss": -27.567068099975586, "global_step": 520927, "epoch": 6276} {"train_loss": -27.16834831237793, "global_step": 520928, "epoch": 6276} {"train_loss": -27.54450798034668, "global_step": 520929, "epoch": 6276} {"train_loss": -27.191864013671875, "global_step": 520930, "epoch": 6276} {"train_loss": -27.451269149780273, "global_step": 520931, "epoch": 6276} {"train_loss": -27.047382354736328, "global_step": 520932, "epoch": 6276} {"train_loss": -27.378564834594727, "global_step": 520933, "epoch": 6276} {"train_loss": -27.558874130249023, "global_step": 520934, "epoch": 6276} {"train_loss": -27.56793212890625, "global_step": 520935, "epoch": 6276} {"train_loss": -27.37493896484375, "global_step": 520936, "epoch": 6276} {"train_loss": -27.679763793945312, "global_step": 520937, "epoch": 6276} {"train_loss": -27.310834884643555, "global_step": 520938, "epoch": 6276} {"train_loss": -27.439395904541016, "global_step": 520939, "epoch": 6276} {"train_loss": -27.571775436401367, "global_step": 520940, "epoch": 6276} {"train_loss": -27.849018096923828, "global_step": 520941, "epoch": 6276} {"train_loss": -27.329559326171875, "global_step": 520942, "epoch": 6276} {"train_loss": -27.677326202392578, "global_step": 520943, "epoch": 6276} {"train_loss": -27.692968368530273, "global_step": 520944, "epoch": 6276} {"train_loss": -27.677448272705078, "global_step": 520945, "epoch": 6276} {"train_loss": -27.636890411376953, "global_step": 520946, "epoch": 6276} {"train_loss": -27.862836837768555, "global_step": 520947, "epoch": 6276} {"train_loss": -27.844528198242188, "global_step": 520948, "epoch": 6276} {"train_loss": -27.67281150817871, "global_step": 520949, "epoch": 6276} {"train_loss": -27.4875431060791, "global_step": 520950, "epoch": 6276} {"train_loss": -27.35683250427246, "global_step": 520951, "epoch": 6276} {"train_loss": -27.515369415283203, "global_step": 520952, "epoch": 6276} {"train_loss": -27.768268585205078, "global_step": 520953, "epoch": 6276} {"train_loss": -27.670007705688477, "global_step": 520954, "epoch": 6276} {"train_loss": -27.275684356689453, "global_step": 520955, "epoch": 6276} {"train_loss": -27.815963745117188, "global_step": 520956, "epoch": 6276} {"train_loss": -27.506763458251953, "global_step": 520957, "epoch": 6276} {"train_loss": -27.540693283081055, "global_step": 520958, "epoch": 6276} {"train_loss": -27.681976318359375, "global_step": 520959, "epoch": 6276} {"train_loss": -27.3875732421875, "global_step": 520960, "epoch": 6276} {"train_loss": -27.58316421508789, "global_step": 520961, "epoch": 6276} {"train_loss": -27.76710319519043, "global_step": 520962, "epoch": 6276} {"train_loss": -27.696096420288086, "global_step": 520963, "epoch": 6276} {"train_loss": -28.08112144470215, "global_step": 520964, "epoch": 6276} {"train_loss": -27.42415428161621, "global_step": 520965, "epoch": 6276} {"train_loss": -27.82826805114746, "global_step": 520966, "epoch": 6276} {"train_loss": -28.164304733276367, "global_step": 520967, "epoch": 6276} {"train_loss": -28.068689346313477, "global_step": 520968, "epoch": 6276} {"train_loss": -27.95427894592285, "global_step": 520969, "epoch": 6276} {"train_loss": -27.892255783081055, "global_step": 520970, "epoch": 6276} {"train_loss": -27.79559326171875, "global_step": 520971, "epoch": 6276} {"train_loss": -27.6621036529541, "global_step": 520972, "epoch": 6276} {"train_loss": -27.92811393737793, "global_step": 520973, "epoch": 6276} {"train_loss": -28.13941764831543, "global_step": 520974, "epoch": 6276} {"train_loss": -28.02609634399414, "global_step": 520975, "epoch": 6276} {"train_loss": -27.4899845123291, "global_step": 520976, "epoch": 6276} {"train_loss": -27.370025634765625, "global_step": 520977, "epoch": 6276} {"train_loss": -27.540908813476562, "global_step": 520978, "epoch": 6276} {"train_loss": -27.436878204345703, "global_step": 520979, "epoch": 6276} {"train_loss": -27.2849178314209, "global_step": 520980, "epoch": 6276} {"train_loss": -27.35386085510254, "global_step": 520981, "epoch": 6276} {"train_loss": -27.693836212158203, "global_step": 520982, "epoch": 6276} {"train_loss": -27.611982345581055, "global_step": 520983, "epoch": 6276} {"train_loss": -27.515180587768555, "global_step": 520984, "epoch": 6276} {"train_loss": -27.601272583007812, "global_step": 520985, "epoch": 6276} {"train_loss": -27.569562911987305, "global_step": 520986, "epoch": 6276} {"train_loss": -26.9212703704834, "global_step": 520987, "epoch": 6276} {"train_loss": -26.541730880737305, "global_step": 520988, "epoch": 6276} {"train_loss": -26.234907150268555, "global_step": 520989, "epoch": 6276} {"train_loss": -27.455422987420874, "global_step": 520990, "epoch": 6276, "val_loss": 6614876.5} {"train_loss": -24.119382858276367, "global_step": 520991, "epoch": 6277} {"train_loss": -22.39731788635254, "global_step": 520992, "epoch": 6277} {"train_loss": -23.776504516601562, "global_step": 520993, "epoch": 6277} {"train_loss": -23.992334365844727, "global_step": 520994, "epoch": 6277} {"train_loss": -25.05721092224121, "global_step": 520995, "epoch": 6277} {"train_loss": -25.118436813354492, "global_step": 520996, "epoch": 6277} {"train_loss": -25.190053939819336, "global_step": 520997, "epoch": 6277} {"train_loss": -25.920255661010742, "global_step": 520998, "epoch": 6277} {"train_loss": -25.111684799194336, "global_step": 520999, "epoch": 6277} {"train_loss": -25.719635009765625, "global_step": 521000, "epoch": 6277} {"train_loss": -25.59431266784668, "global_step": 521001, "epoch": 6277} {"train_loss": -25.555204391479492, "global_step": 521002, "epoch": 6277} {"train_loss": -25.766950607299805, "global_step": 521003, "epoch": 6277} {"train_loss": -25.823591232299805, "global_step": 521004, "epoch": 6277} {"train_loss": -25.930927276611328, "global_step": 521005, "epoch": 6277} {"train_loss": -25.67378807067871, "global_step": 521006, "epoch": 6277} {"train_loss": -26.107812881469727, "global_step": 521007, "epoch": 6277} {"train_loss": -26.08428382873535, "global_step": 521008, "epoch": 6277} {"train_loss": -25.782175064086914, "global_step": 521009, "epoch": 6277} {"train_loss": -26.33920669555664, "global_step": 521010, "epoch": 6277} {"train_loss": -26.101547241210938, "global_step": 521011, "epoch": 6277} {"train_loss": -26.197446823120117, "global_step": 521012, "epoch": 6277} {"train_loss": -26.423627853393555, "global_step": 521013, "epoch": 6277} {"train_loss": -26.64349937438965, "global_step": 521014, "epoch": 6277} {"train_loss": -26.52978515625, "global_step": 521015, "epoch": 6277} {"train_loss": -26.662931442260742, "global_step": 521016, "epoch": 6277} {"train_loss": -26.465600967407227, "global_step": 521017, "epoch": 6277} {"train_loss": -26.76429557800293, "global_step": 521018, "epoch": 6277} {"train_loss": -27.06912612915039, "global_step": 521019, "epoch": 6277} {"train_loss": -26.883493423461914, "global_step": 521020, "epoch": 6277} {"train_loss": -26.94264030456543, "global_step": 521021, "epoch": 6277} {"train_loss": -26.478307723999023, "global_step": 521022, "epoch": 6277} {"train_loss": -26.900588989257812, "global_step": 521023, "epoch": 6277} {"train_loss": -26.667022705078125, "global_step": 521024, "epoch": 6277} {"train_loss": -27.179590225219727, "global_step": 521025, "epoch": 6277} {"train_loss": -26.790470123291016, "global_step": 521026, "epoch": 6277} {"train_loss": -26.8685359954834, "global_step": 521027, "epoch": 6277} {"train_loss": -27.183996200561523, "global_step": 521028, "epoch": 6277} {"train_loss": -27.070331573486328, "global_step": 521029, "epoch": 6277} {"train_loss": -27.229909896850586, "global_step": 521030, "epoch": 6277} {"train_loss": -26.90081787109375, "global_step": 521031, "epoch": 6277} {"train_loss": -27.270221710205078, "global_step": 521032, "epoch": 6277} {"train_loss": -26.96367835998535, "global_step": 521033, "epoch": 6277} {"train_loss": -27.140485763549805, "global_step": 521034, "epoch": 6277} {"train_loss": -27.039777755737305, "global_step": 521035, "epoch": 6277} {"train_loss": -27.417978286743164, "global_step": 521036, "epoch": 6277} {"train_loss": -27.426044464111328, "global_step": 521037, "epoch": 6277} {"train_loss": -27.346145629882812, "global_step": 521038, "epoch": 6277} {"train_loss": -27.30270767211914, "global_step": 521039, "epoch": 6277} {"train_loss": -27.340240478515625, "global_step": 521040, "epoch": 6277} {"train_loss": -27.15604591369629, "global_step": 521041, "epoch": 6277} {"train_loss": -27.263879776000977, "global_step": 521042, "epoch": 6277} {"train_loss": -27.400588989257812, "global_step": 521043, "epoch": 6277} {"train_loss": -27.248682022094727, "global_step": 521044, "epoch": 6277} {"train_loss": -27.647695541381836, "global_step": 521045, "epoch": 6277} {"train_loss": -27.357467651367188, "global_step": 521046, "epoch": 6277} {"train_loss": -27.45147705078125, "global_step": 521047, "epoch": 6277} {"train_loss": -27.26875114440918, "global_step": 521048, "epoch": 6277} {"train_loss": -27.608423233032227, "global_step": 521049, "epoch": 6277} {"train_loss": -27.64902687072754, "global_step": 521050, "epoch": 6277} {"train_loss": -27.691299438476562, "global_step": 521051, "epoch": 6277} {"train_loss": -27.712793350219727, "global_step": 521052, "epoch": 6277} {"train_loss": -27.41338539123535, "global_step": 521053, "epoch": 6277} {"train_loss": -27.67685317993164, "global_step": 521054, "epoch": 6277} {"train_loss": -27.346433639526367, "global_step": 521055, "epoch": 6277} {"train_loss": -27.850980758666992, "global_step": 521056, "epoch": 6277} {"train_loss": -27.612899780273438, "global_step": 521057, "epoch": 6277} {"train_loss": -27.641016006469727, "global_step": 521058, "epoch": 6277} {"train_loss": -27.918689727783203, "global_step": 521059, "epoch": 6277} {"train_loss": -27.60784912109375, "global_step": 521060, "epoch": 6277} {"train_loss": -27.469623565673828, "global_step": 521061, "epoch": 6277} {"train_loss": -27.35979652404785, "global_step": 521062, "epoch": 6277} {"train_loss": -27.966535568237305, "global_step": 521063, "epoch": 6277} {"train_loss": -27.668310165405273, "global_step": 521064, "epoch": 6277} {"train_loss": -27.503021240234375, "global_step": 521065, "epoch": 6277} {"train_loss": -28.08680534362793, "global_step": 521066, "epoch": 6277} {"train_loss": -27.9270076751709, "global_step": 521067, "epoch": 6277} {"train_loss": -27.786359786987305, "global_step": 521068, "epoch": 6277} {"train_loss": -28.121313095092773, "global_step": 521069, "epoch": 6277} {"train_loss": -28.20794677734375, "global_step": 521070, "epoch": 6277} {"train_loss": -27.79823875427246, "global_step": 521071, "epoch": 6277} {"train_loss": -27.6923828125, "global_step": 521072, "epoch": 6277} {"train_loss": -26.800228923200123, "global_step": 521073, "epoch": 6277, "val_loss": 6636792.0} {"train_loss": -27.273975372314453, "global_step": 521074, "epoch": 6278} {"train_loss": -27.543292999267578, "global_step": 521075, "epoch": 6278} {"train_loss": -27.338109970092773, "global_step": 521076, "epoch": 6278} {"train_loss": -27.392990112304688, "global_step": 521077, "epoch": 6278} {"train_loss": -27.198379516601562, "global_step": 521078, "epoch": 6278} {"train_loss": -27.5831356048584, "global_step": 521079, "epoch": 6278} {"train_loss": -27.50404930114746, "global_step": 521080, "epoch": 6278} {"train_loss": -27.59873390197754, "global_step": 521081, "epoch": 6278} {"train_loss": -27.40186882019043, "global_step": 521082, "epoch": 6278} {"train_loss": -27.542545318603516, "global_step": 521083, "epoch": 6278} {"train_loss": -27.327848434448242, "global_step": 521084, "epoch": 6278} {"train_loss": -27.31436538696289, "global_step": 521085, "epoch": 6278} {"train_loss": -27.537084579467773, "global_step": 521086, "epoch": 6278} {"train_loss": -27.457468032836914, "global_step": 521087, "epoch": 6278} {"train_loss": -27.09268569946289, "global_step": 521088, "epoch": 6278} {"train_loss": -27.870361328125, "global_step": 521089, "epoch": 6278} {"train_loss": -27.239471435546875, "global_step": 521090, "epoch": 6278} {"train_loss": -27.418298721313477, "global_step": 521091, "epoch": 6278} {"train_loss": -27.374755859375, "global_step": 521092, "epoch": 6278} {"train_loss": -27.524826049804688, "global_step": 521093, "epoch": 6278} {"train_loss": -27.164331436157227, "global_step": 521094, "epoch": 6278} {"train_loss": -27.607938766479492, "global_step": 521095, "epoch": 6278} {"train_loss": -26.959400177001953, "global_step": 521096, "epoch": 6278} {"train_loss": -27.505950927734375, "global_step": 521097, "epoch": 6278} {"train_loss": -27.2709903717041, "global_step": 521098, "epoch": 6278} {"train_loss": -27.09308433532715, "global_step": 521099, "epoch": 6278} {"train_loss": -27.394336700439453, "global_step": 521100, "epoch": 6278} {"train_loss": -26.99757194519043, "global_step": 521101, "epoch": 6278} {"train_loss": -27.522302627563477, "global_step": 521102, "epoch": 6278} {"train_loss": -27.11224937438965, "global_step": 521103, "epoch": 6278} {"train_loss": -27.144256591796875, "global_step": 521104, "epoch": 6278} {"train_loss": -27.0213623046875, "global_step": 521105, "epoch": 6278} {"train_loss": -27.084314346313477, "global_step": 521106, "epoch": 6278} {"train_loss": -27.53944969177246, "global_step": 521107, "epoch": 6278} {"train_loss": -27.351118087768555, "global_step": 521108, "epoch": 6278} {"train_loss": -27.21343994140625, "global_step": 521109, "epoch": 6278} {"train_loss": -28.08979606628418, "global_step": 521110, "epoch": 6278} {"train_loss": -27.063379287719727, "global_step": 521111, "epoch": 6278} {"train_loss": -27.138776779174805, "global_step": 521112, "epoch": 6278} {"train_loss": -27.10212516784668, "global_step": 521113, "epoch": 6278} {"train_loss": -27.123754501342773, "global_step": 521114, "epoch": 6278} {"train_loss": -27.598737716674805, "global_step": 521115, "epoch": 6278} {"train_loss": -27.318008422851562, "global_step": 521116, "epoch": 6278} {"train_loss": -27.58026695251465, "global_step": 521117, "epoch": 6278} {"train_loss": -27.2304744720459, "global_step": 521118, "epoch": 6278} {"train_loss": -27.60981559753418, "global_step": 521119, "epoch": 6278} {"train_loss": -27.21021842956543, "global_step": 521120, "epoch": 6278} {"train_loss": -27.804412841796875, "global_step": 521121, "epoch": 6278} {"train_loss": -27.546483993530273, "global_step": 521122, "epoch": 6278} {"train_loss": -27.739307403564453, "global_step": 521123, "epoch": 6278} {"train_loss": -27.705860137939453, "global_step": 521124, "epoch": 6278} {"train_loss": -28.11958885192871, "global_step": 521125, "epoch": 6278} {"train_loss": -27.423425674438477, "global_step": 521126, "epoch": 6278} {"train_loss": -27.77353858947754, "global_step": 521127, "epoch": 6278} {"train_loss": -27.5565242767334, "global_step": 521128, "epoch": 6278} {"train_loss": -27.324039459228516, "global_step": 521129, "epoch": 6278} {"train_loss": -27.858388900756836, "global_step": 521130, "epoch": 6278} {"train_loss": -27.588354110717773, "global_step": 521131, "epoch": 6278} {"train_loss": -27.35829734802246, "global_step": 521132, "epoch": 6278} {"train_loss": -27.87763786315918, "global_step": 521133, "epoch": 6278} {"train_loss": -27.75551414489746, "global_step": 521134, "epoch": 6278} {"train_loss": -27.564929962158203, "global_step": 521135, "epoch": 6278} {"train_loss": -27.803852081298828, "global_step": 521136, "epoch": 6278} {"train_loss": -27.67822265625, "global_step": 521137, "epoch": 6278} {"train_loss": -27.980682373046875, "global_step": 521138, "epoch": 6278} {"train_loss": -27.63092041015625, "global_step": 521139, "epoch": 6278} {"train_loss": -27.74762535095215, "global_step": 521140, "epoch": 6278} {"train_loss": -27.409488677978516, "global_step": 521141, "epoch": 6278} {"train_loss": -27.738256454467773, "global_step": 521142, "epoch": 6278} {"train_loss": -27.42652702331543, "global_step": 521143, "epoch": 6278} {"train_loss": -27.901330947875977, "global_step": 521144, "epoch": 6278} {"train_loss": -27.4574031829834, "global_step": 521145, "epoch": 6278} {"train_loss": -27.719507217407227, "global_step": 521146, "epoch": 6278} {"train_loss": -27.96175193786621, "global_step": 521147, "epoch": 6278} {"train_loss": -27.928930282592773, "global_step": 521148, "epoch": 6278} {"train_loss": -28.128387451171875, "global_step": 521149, "epoch": 6278} {"train_loss": -27.59505271911621, "global_step": 521150, "epoch": 6278} {"train_loss": -27.878952026367188, "global_step": 521151, "epoch": 6278} {"train_loss": -27.403553009033203, "global_step": 521152, "epoch": 6278} {"train_loss": -27.397451400756836, "global_step": 521153, "epoch": 6278} {"train_loss": -27.4621524810791, "global_step": 521154, "epoch": 6278} {"train_loss": -27.825580596923828, "global_step": 521155, "epoch": 6278} {"train_loss": -27.495320101818407, "global_step": 521156, "epoch": 6278, "val_loss": 6551674.5} {"train_loss": -26.922616958618164, "global_step": 521157, "epoch": 6279} {"train_loss": -25.91358757019043, "global_step": 521158, "epoch": 6279} {"train_loss": -26.260517120361328, "global_step": 521159, "epoch": 6279} {"train_loss": -26.438100814819336, "global_step": 521160, "epoch": 6279} {"train_loss": -25.7791748046875, "global_step": 521161, "epoch": 6279} {"train_loss": -26.597919464111328, "global_step": 521162, "epoch": 6279} {"train_loss": -25.939233779907227, "global_step": 521163, "epoch": 6279} {"train_loss": -25.91615867614746, "global_step": 521164, "epoch": 6279} {"train_loss": -26.694171905517578, "global_step": 521165, "epoch": 6279} {"train_loss": -26.640771865844727, "global_step": 521166, "epoch": 6279} {"train_loss": -27.10280418395996, "global_step": 521167, "epoch": 6279} {"train_loss": -26.66877555847168, "global_step": 521168, "epoch": 6279} {"train_loss": -26.83192253112793, "global_step": 521169, "epoch": 6279} {"train_loss": -26.755741119384766, "global_step": 521170, "epoch": 6279} {"train_loss": -26.8560733795166, "global_step": 521171, "epoch": 6279} {"train_loss": -26.59638786315918, "global_step": 521172, "epoch": 6279} {"train_loss": -26.833759307861328, "global_step": 521173, "epoch": 6279} {"train_loss": -26.86470603942871, "global_step": 521174, "epoch": 6279} {"train_loss": -27.04581069946289, "global_step": 521175, "epoch": 6279} {"train_loss": -27.171894073486328, "global_step": 521176, "epoch": 6279} {"train_loss": -27.061315536499023, "global_step": 521177, "epoch": 6279} {"train_loss": -26.876022338867188, "global_step": 521178, "epoch": 6279} {"train_loss": -26.952802658081055, "global_step": 521179, "epoch": 6279} {"train_loss": -27.089406967163086, "global_step": 521180, "epoch": 6279} {"train_loss": -27.23042106628418, "global_step": 521181, "epoch": 6279} {"train_loss": -27.153100967407227, "global_step": 521182, "epoch": 6279} {"train_loss": -27.203840255737305, "global_step": 521183, "epoch": 6279} {"train_loss": -27.174802780151367, "global_step": 521184, "epoch": 6279} {"train_loss": -27.237939834594727, "global_step": 521185, "epoch": 6279} {"train_loss": -27.4608211517334, "global_step": 521186, "epoch": 6279} {"train_loss": -27.408649444580078, "global_step": 521187, "epoch": 6279} {"train_loss": -27.09016990661621, "global_step": 521188, "epoch": 6279} {"train_loss": -27.368576049804688, "global_step": 521189, "epoch": 6279} {"train_loss": -27.304157257080078, "global_step": 521190, "epoch": 6279} {"train_loss": -27.618408203125, "global_step": 521191, "epoch": 6279} {"train_loss": -27.111352920532227, "global_step": 521192, "epoch": 6279} {"train_loss": -27.8685359954834, "global_step": 521193, "epoch": 6279} {"train_loss": -27.475128173828125, "global_step": 521194, "epoch": 6279} {"train_loss": -27.30377197265625, "global_step": 521195, "epoch": 6279} {"train_loss": -27.249652862548828, "global_step": 521196, "epoch": 6279} {"train_loss": -27.251195907592773, "global_step": 521197, "epoch": 6279} {"train_loss": -27.26238441467285, "global_step": 521198, "epoch": 6279} {"train_loss": -27.584537506103516, "global_step": 521199, "epoch": 6279} {"train_loss": -27.6415958404541, "global_step": 521200, "epoch": 6279} {"train_loss": -27.516462326049805, "global_step": 521201, "epoch": 6279} {"train_loss": -27.39060401916504, "global_step": 521202, "epoch": 6279} {"train_loss": -27.661474227905273, "global_step": 521203, "epoch": 6279} {"train_loss": -27.28253746032715, "global_step": 521204, "epoch": 6279} {"train_loss": -27.55622673034668, "global_step": 521205, "epoch": 6279} {"train_loss": -27.99077796936035, "global_step": 521206, "epoch": 6279} {"train_loss": -27.73193359375, "global_step": 521207, "epoch": 6279} {"train_loss": -27.8627986907959, "global_step": 521208, "epoch": 6279} {"train_loss": -28.1704158782959, "global_step": 521209, "epoch": 6279} {"train_loss": -27.81330680847168, "global_step": 521210, "epoch": 6279} {"train_loss": -27.596094131469727, "global_step": 521211, "epoch": 6279} {"train_loss": -27.630985260009766, "global_step": 521212, "epoch": 6279} {"train_loss": -27.43548583984375, "global_step": 521213, "epoch": 6279} {"train_loss": -28.089635848999023, "global_step": 521214, "epoch": 6279} {"train_loss": -27.510971069335938, "global_step": 521215, "epoch": 6279} {"train_loss": -27.201826095581055, "global_step": 521216, "epoch": 6279} {"train_loss": -27.90985679626465, "global_step": 521217, "epoch": 6279} {"train_loss": -27.805545806884766, "global_step": 521218, "epoch": 6279} {"train_loss": -27.918426513671875, "global_step": 521219, "epoch": 6279} {"train_loss": -27.937280654907227, "global_step": 521220, "epoch": 6279} {"train_loss": -27.77113914489746, "global_step": 521221, "epoch": 6279} {"train_loss": -27.588550567626953, "global_step": 521222, "epoch": 6279} {"train_loss": -27.50001335144043, "global_step": 521223, "epoch": 6279} {"train_loss": -27.913217544555664, "global_step": 521224, "epoch": 6279} {"train_loss": -27.703598022460938, "global_step": 521225, "epoch": 6279} {"train_loss": -27.36530113220215, "global_step": 521226, "epoch": 6279} {"train_loss": -26.47975730895996, "global_step": 521227, "epoch": 6279} {"train_loss": -26.685850143432617, "global_step": 521228, "epoch": 6279} {"train_loss": -27.13970947265625, "global_step": 521229, "epoch": 6279} {"train_loss": -27.494144439697266, "global_step": 521230, "epoch": 6279} {"train_loss": -27.345050811767578, "global_step": 521231, "epoch": 6279} {"train_loss": -27.142736434936523, "global_step": 521232, "epoch": 6279} {"train_loss": -26.832117080688477, "global_step": 521233, "epoch": 6279} {"train_loss": -27.713926315307617, "global_step": 521234, "epoch": 6279} {"train_loss": -27.301727294921875, "global_step": 521235, "epoch": 6279} {"train_loss": -27.69105339050293, "global_step": 521236, "epoch": 6279} {"train_loss": -27.6452693939209, "global_step": 521237, "epoch": 6279} {"train_loss": -27.280866622924805, "global_step": 521238, "epoch": 6279} {"train_loss": -27.239325580826726, "global_step": 521239, "epoch": 6279, "val_loss": 6584905.0} {"train_loss": -26.339452743530273, "global_step": 521240, "epoch": 6280} {"train_loss": -26.18292808532715, "global_step": 521241, "epoch": 6280} {"train_loss": -25.84326171875, "global_step": 521242, "epoch": 6280} {"train_loss": -26.28934669494629, "global_step": 521243, "epoch": 6280} {"train_loss": -26.316532135009766, "global_step": 521244, "epoch": 6280} {"train_loss": -26.105310440063477, "global_step": 521245, "epoch": 6280} {"train_loss": -26.90582275390625, "global_step": 521246, "epoch": 6280} {"train_loss": -26.263233184814453, "global_step": 521247, "epoch": 6280} {"train_loss": -26.494308471679688, "global_step": 521248, "epoch": 6280} {"train_loss": -26.736190795898438, "global_step": 521249, "epoch": 6280} {"train_loss": -26.80685806274414, "global_step": 521250, "epoch": 6280} {"train_loss": -26.439334869384766, "global_step": 521251, "epoch": 6280} {"train_loss": -26.909337997436523, "global_step": 521252, "epoch": 6280} {"train_loss": -26.82718849182129, "global_step": 521253, "epoch": 6280} {"train_loss": -27.00507926940918, "global_step": 521254, "epoch": 6280} {"train_loss": -26.6264591217041, "global_step": 521255, "epoch": 6280} {"train_loss": -27.03961753845215, "global_step": 521256, "epoch": 6280} {"train_loss": -26.666284561157227, "global_step": 521257, "epoch": 6280} {"train_loss": -27.287099838256836, "global_step": 521258, "epoch": 6280} {"train_loss": -26.76974868774414, "global_step": 521259, "epoch": 6280} {"train_loss": -27.475492477416992, "global_step": 521260, "epoch": 6280} {"train_loss": -27.494062423706055, "global_step": 521261, "epoch": 6280} {"train_loss": -27.3939208984375, "global_step": 521262, "epoch": 6280} {"train_loss": -27.423017501831055, "global_step": 521263, "epoch": 6280} {"train_loss": -27.36687660217285, "global_step": 521264, "epoch": 6280} {"train_loss": -27.31659507751465, "global_step": 521265, "epoch": 6280} {"train_loss": -26.93263816833496, "global_step": 521266, "epoch": 6280} {"train_loss": -27.397619247436523, "global_step": 521267, "epoch": 6280} {"train_loss": -27.356122970581055, "global_step": 521268, "epoch": 6280} {"train_loss": -27.4321231842041, "global_step": 521269, "epoch": 6280} {"train_loss": -27.516077041625977, "global_step": 521270, "epoch": 6280} {"train_loss": -27.5084228515625, "global_step": 521271, "epoch": 6280} {"train_loss": -27.30402183532715, "global_step": 521272, "epoch": 6280} {"train_loss": -27.99021339416504, "global_step": 521273, "epoch": 6280} {"train_loss": -27.25599479675293, "global_step": 521274, "epoch": 6280} {"train_loss": -27.645734786987305, "global_step": 521275, "epoch": 6280} {"train_loss": -27.587427139282227, "global_step": 521276, "epoch": 6280} {"train_loss": -27.390888214111328, "global_step": 521277, "epoch": 6280} {"train_loss": -27.81953239440918, "global_step": 521278, "epoch": 6280} {"train_loss": -27.828567504882812, "global_step": 521279, "epoch": 6280} {"train_loss": -27.991384506225586, "global_step": 521280, "epoch": 6280} {"train_loss": -27.5311222076416, "global_step": 521281, "epoch": 6280} {"train_loss": -27.423669815063477, "global_step": 521282, "epoch": 6280} {"train_loss": -27.482046127319336, "global_step": 521283, "epoch": 6280} {"train_loss": -27.33148193359375, "global_step": 521284, "epoch": 6280} {"train_loss": -27.694807052612305, "global_step": 521285, "epoch": 6280} {"train_loss": -27.66045570373535, "global_step": 521286, "epoch": 6280} {"train_loss": -27.55547523498535, "global_step": 521287, "epoch": 6280} {"train_loss": -27.490507125854492, "global_step": 521288, "epoch": 6280} {"train_loss": -27.3112850189209, "global_step": 521289, "epoch": 6280} {"train_loss": -27.656396865844727, "global_step": 521290, "epoch": 6280} {"train_loss": -27.89056396484375, "global_step": 521291, "epoch": 6280} {"train_loss": -27.57227897644043, "global_step": 521292, "epoch": 6280} {"train_loss": -27.84163475036621, "global_step": 521293, "epoch": 6280} {"train_loss": -27.714508056640625, "global_step": 521294, "epoch": 6280} {"train_loss": -27.617507934570312, "global_step": 521295, "epoch": 6280} {"train_loss": -27.5562686920166, "global_step": 521296, "epoch": 6280} {"train_loss": -27.563648223876953, "global_step": 521297, "epoch": 6280} {"train_loss": -27.427444458007812, "global_step": 521298, "epoch": 6280} {"train_loss": -27.699798583984375, "global_step": 521299, "epoch": 6280} {"train_loss": -27.616819381713867, "global_step": 521300, "epoch": 6280} {"train_loss": -27.522674560546875, "global_step": 521301, "epoch": 6280} {"train_loss": -27.824451446533203, "global_step": 521302, "epoch": 6280} {"train_loss": -27.91094970703125, "global_step": 521303, "epoch": 6280} {"train_loss": -27.6866397857666, "global_step": 521304, "epoch": 6280} {"train_loss": -27.516202926635742, "global_step": 521305, "epoch": 6280} {"train_loss": -27.527557373046875, "global_step": 521306, "epoch": 6280} {"train_loss": -27.881723403930664, "global_step": 521307, "epoch": 6280} {"train_loss": -27.353973388671875, "global_step": 521308, "epoch": 6280} {"train_loss": -27.952444076538086, "global_step": 521309, "epoch": 6280} {"train_loss": -28.043378829956055, "global_step": 521310, "epoch": 6280} {"train_loss": -27.603534698486328, "global_step": 521311, "epoch": 6280} {"train_loss": -27.431365966796875, "global_step": 521312, "epoch": 6280} {"train_loss": -27.791839599609375, "global_step": 521313, "epoch": 6280} {"train_loss": -27.316577911376953, "global_step": 521314, "epoch": 6280} {"train_loss": -27.66916275024414, "global_step": 521315, "epoch": 6280} {"train_loss": -27.8405704498291, "global_step": 521316, "epoch": 6280} {"train_loss": -27.7215518951416, "global_step": 521317, "epoch": 6280} {"train_loss": -27.582992553710938, "global_step": 521318, "epoch": 6280} {"train_loss": -28.27392578125, "global_step": 521319, "epoch": 6280} {"train_loss": -27.48189353942871, "global_step": 521320, "epoch": 6280} {"train_loss": -27.881444931030273, "global_step": 521321, "epoch": 6280} {"train_loss": -27.356501383953784, "global_step": 521322, "epoch": 6280, "val_loss": 6697765.0} {"train_loss": -26.831817626953125, "global_step": 521323, "epoch": 6281} {"train_loss": -26.575931549072266, "global_step": 521324, "epoch": 6281} {"train_loss": -27.115253448486328, "global_step": 521325, "epoch": 6281} {"train_loss": -26.688947677612305, "global_step": 521326, "epoch": 6281} {"train_loss": -27.290807723999023, "global_step": 521327, "epoch": 6281} {"train_loss": -27.337003707885742, "global_step": 521328, "epoch": 6281} {"train_loss": -26.956161499023438, "global_step": 521329, "epoch": 6281} {"train_loss": -27.31494140625, "global_step": 521330, "epoch": 6281} {"train_loss": -27.17630958557129, "global_step": 521331, "epoch": 6281} {"train_loss": -27.244714736938477, "global_step": 521332, "epoch": 6281} {"train_loss": -27.345869064331055, "global_step": 521333, "epoch": 6281} {"train_loss": -27.499216079711914, "global_step": 521334, "epoch": 6281} {"train_loss": -27.40066909790039, "global_step": 521335, "epoch": 6281} {"train_loss": -27.370319366455078, "global_step": 521336, "epoch": 6281} {"train_loss": -26.961530685424805, "global_step": 521337, "epoch": 6281} {"train_loss": -27.334182739257812, "global_step": 521338, "epoch": 6281} {"train_loss": -27.28150749206543, "global_step": 521339, "epoch": 6281} {"train_loss": -27.56772232055664, "global_step": 521340, "epoch": 6281} {"train_loss": -27.232440948486328, "global_step": 521341, "epoch": 6281} {"train_loss": -27.31777000427246, "global_step": 521342, "epoch": 6281} {"train_loss": -27.578903198242188, "global_step": 521343, "epoch": 6281} {"train_loss": -27.068567276000977, "global_step": 521344, "epoch": 6281} {"train_loss": -26.112829208374023, "global_step": 521345, "epoch": 6281} {"train_loss": -26.73870277404785, "global_step": 521346, "epoch": 6281} {"train_loss": -27.124591827392578, "global_step": 521347, "epoch": 6281} {"train_loss": -27.28008460998535, "global_step": 521348, "epoch": 6281} {"train_loss": -27.10944938659668, "global_step": 521349, "epoch": 6281} {"train_loss": -27.11736488342285, "global_step": 521350, "epoch": 6281} {"train_loss": -27.090408325195312, "global_step": 521351, "epoch": 6281} {"train_loss": -27.144153594970703, "global_step": 521352, "epoch": 6281} {"train_loss": -27.00592613220215, "global_step": 521353, "epoch": 6281} {"train_loss": -27.000619888305664, "global_step": 521354, "epoch": 6281} {"train_loss": -27.057828903198242, "global_step": 521355, "epoch": 6281} {"train_loss": -27.098058700561523, "global_step": 521356, "epoch": 6281} {"train_loss": -27.533130645751953, "global_step": 521357, "epoch": 6281} {"train_loss": -27.03436851501465, "global_step": 521358, "epoch": 6281} {"train_loss": -27.28376579284668, "global_step": 521359, "epoch": 6281} {"train_loss": -27.366870880126953, "global_step": 521360, "epoch": 6281} {"train_loss": -26.965726852416992, "global_step": 521361, "epoch": 6281} {"train_loss": -27.172779083251953, "global_step": 521362, "epoch": 6281} {"train_loss": -27.604572296142578, "global_step": 521363, "epoch": 6281} {"train_loss": -27.08526039123535, "global_step": 521364, "epoch": 6281} {"train_loss": -27.413410186767578, "global_step": 521365, "epoch": 6281} {"train_loss": -27.261865615844727, "global_step": 521366, "epoch": 6281} {"train_loss": -27.29509925842285, "global_step": 521367, "epoch": 6281} {"train_loss": -27.298969268798828, "global_step": 521368, "epoch": 6281} {"train_loss": -27.29157829284668, "global_step": 521369, "epoch": 6281} {"train_loss": -27.4261531829834, "global_step": 521370, "epoch": 6281} {"train_loss": -26.998798370361328, "global_step": 521371, "epoch": 6281} {"train_loss": -26.840702056884766, "global_step": 521372, "epoch": 6281} {"train_loss": -27.8363037109375, "global_step": 521373, "epoch": 6281} {"train_loss": -27.44840431213379, "global_step": 521374, "epoch": 6281} {"train_loss": -27.689889907836914, "global_step": 521375, "epoch": 6281} {"train_loss": -27.620319366455078, "global_step": 521376, "epoch": 6281} {"train_loss": -27.782012939453125, "global_step": 521377, "epoch": 6281} {"train_loss": -27.672510147094727, "global_step": 521378, "epoch": 6281} {"train_loss": -27.35690689086914, "global_step": 521379, "epoch": 6281} {"train_loss": -27.418670654296875, "global_step": 521380, "epoch": 6281} {"train_loss": -27.834365844726562, "global_step": 521381, "epoch": 6281} {"train_loss": -27.993213653564453, "global_step": 521382, "epoch": 6281} {"train_loss": -27.65040397644043, "global_step": 521383, "epoch": 6281} {"train_loss": -27.636611938476562, "global_step": 521384, "epoch": 6281} {"train_loss": -27.947668075561523, "global_step": 521385, "epoch": 6281} {"train_loss": -27.855600357055664, "global_step": 521386, "epoch": 6281} {"train_loss": -27.516632080078125, "global_step": 521387, "epoch": 6281} {"train_loss": -27.66327476501465, "global_step": 521388, "epoch": 6281} {"train_loss": -27.642969131469727, "global_step": 521389, "epoch": 6281} {"train_loss": -27.563840866088867, "global_step": 521390, "epoch": 6281} {"train_loss": -28.109317779541016, "global_step": 521391, "epoch": 6281} {"train_loss": -27.7430362701416, "global_step": 521392, "epoch": 6281} {"train_loss": -27.796308517456055, "global_step": 521393, "epoch": 6281} {"train_loss": -27.66607666015625, "global_step": 521394, "epoch": 6281} {"train_loss": -27.684326171875, "global_step": 521395, "epoch": 6281} {"train_loss": -27.805164337158203, "global_step": 521396, "epoch": 6281} {"train_loss": -27.8913516998291, "global_step": 521397, "epoch": 6281} {"train_loss": -27.648040771484375, "global_step": 521398, "epoch": 6281} {"train_loss": -27.817163467407227, "global_step": 521399, "epoch": 6281} {"train_loss": -27.947742462158203, "global_step": 521400, "epoch": 6281} {"train_loss": -27.241470336914062, "global_step": 521401, "epoch": 6281} {"train_loss": -27.65717887878418, "global_step": 521402, "epoch": 6281} {"train_loss": -27.803390502929688, "global_step": 521403, "epoch": 6281} {"train_loss": -27.45975685119629, "global_step": 521404, "epoch": 6281} {"train_loss": -27.370361534945935, "global_step": 521405, "epoch": 6281, "val_loss": 6583936.0} {"train_loss": -27.351415634155273, "global_step": 521406, "epoch": 6282} {"train_loss": -26.742938995361328, "global_step": 521407, "epoch": 6282} {"train_loss": -26.19160270690918, "global_step": 521408, "epoch": 6282} {"train_loss": -26.988651275634766, "global_step": 521409, "epoch": 6282} {"train_loss": -26.74976921081543, "global_step": 521410, "epoch": 6282} {"train_loss": -26.633331298828125, "global_step": 521411, "epoch": 6282} {"train_loss": -27.524194717407227, "global_step": 521412, "epoch": 6282} {"train_loss": -26.720815658569336, "global_step": 521413, "epoch": 6282} {"train_loss": -27.125823974609375, "global_step": 521414, "epoch": 6282} {"train_loss": -27.0881404876709, "global_step": 521415, "epoch": 6282} {"train_loss": -27.30658531188965, "global_step": 521416, "epoch": 6282} {"train_loss": -27.2585391998291, "global_step": 521417, "epoch": 6282} {"train_loss": -27.164142608642578, "global_step": 521418, "epoch": 6282} {"train_loss": -27.12464714050293, "global_step": 521419, "epoch": 6282} {"train_loss": -27.405170440673828, "global_step": 521420, "epoch": 6282} {"train_loss": -27.1777400970459, "global_step": 521421, "epoch": 6282} {"train_loss": -27.21895408630371, "global_step": 521422, "epoch": 6282} {"train_loss": -27.049169540405273, "global_step": 521423, "epoch": 6282} {"train_loss": -26.710493087768555, "global_step": 521424, "epoch": 6282} {"train_loss": -27.2697696685791, "global_step": 521425, "epoch": 6282} {"train_loss": -27.224761962890625, "global_step": 521426, "epoch": 6282} {"train_loss": -27.140920639038086, "global_step": 521427, "epoch": 6282} {"train_loss": -27.141387939453125, "global_step": 521428, "epoch": 6282} {"train_loss": -27.054779052734375, "global_step": 521429, "epoch": 6282} {"train_loss": -27.357772827148438, "global_step": 521430, "epoch": 6282} {"train_loss": -27.023284912109375, "global_step": 521431, "epoch": 6282} {"train_loss": -27.38624382019043, "global_step": 521432, "epoch": 6282} {"train_loss": -27.371450424194336, "global_step": 521433, "epoch": 6282} {"train_loss": -27.268049240112305, "global_step": 521434, "epoch": 6282} {"train_loss": -27.347579956054688, "global_step": 521435, "epoch": 6282} {"train_loss": -27.416839599609375, "global_step": 521436, "epoch": 6282} {"train_loss": -27.300390243530273, "global_step": 521437, "epoch": 6282} {"train_loss": -27.74995231628418, "global_step": 521438, "epoch": 6282} {"train_loss": -27.205244064331055, "global_step": 521439, "epoch": 6282} {"train_loss": -27.551679611206055, "global_step": 521440, "epoch": 6282} {"train_loss": -27.676191329956055, "global_step": 521441, "epoch": 6282} {"train_loss": -27.757287979125977, "global_step": 521442, "epoch": 6282} {"train_loss": -27.687223434448242, "global_step": 521443, "epoch": 6282} {"train_loss": -27.702472686767578, "global_step": 521444, "epoch": 6282} {"train_loss": -27.520383834838867, "global_step": 521445, "epoch": 6282} {"train_loss": -27.891340255737305, "global_step": 521446, "epoch": 6282} {"train_loss": -28.092863082885742, "global_step": 521447, "epoch": 6282} {"train_loss": -27.445098876953125, "global_step": 521448, "epoch": 6282} {"train_loss": -27.50343894958496, "global_step": 521449, "epoch": 6282} {"train_loss": -27.593509674072266, "global_step": 521450, "epoch": 6282} {"train_loss": -27.69825553894043, "global_step": 521451, "epoch": 6282} {"train_loss": -27.768817901611328, "global_step": 521452, "epoch": 6282} {"train_loss": -28.152963638305664, "global_step": 521453, "epoch": 6282} {"train_loss": -27.611310958862305, "global_step": 521454, "epoch": 6282} {"train_loss": -27.627532958984375, "global_step": 521455, "epoch": 6282} {"train_loss": -27.803857803344727, "global_step": 521456, "epoch": 6282} {"train_loss": -27.98455238342285, "global_step": 521457, "epoch": 6282} {"train_loss": -27.666645050048828, "global_step": 521458, "epoch": 6282} {"train_loss": -27.735448837280273, "global_step": 521459, "epoch": 6282} {"train_loss": -27.774188995361328, "global_step": 521460, "epoch": 6282} {"train_loss": -27.895111083984375, "global_step": 521461, "epoch": 6282} {"train_loss": -27.722848892211914, "global_step": 521462, "epoch": 6282} {"train_loss": -27.739694595336914, "global_step": 521463, "epoch": 6282} {"train_loss": -27.407455444335938, "global_step": 521464, "epoch": 6282} {"train_loss": -27.933130264282227, "global_step": 521465, "epoch": 6282} {"train_loss": -27.5982666015625, "global_step": 521466, "epoch": 6282} {"train_loss": -27.327611923217773, "global_step": 521467, "epoch": 6282} {"train_loss": -27.061309814453125, "global_step": 521468, "epoch": 6282} {"train_loss": -26.439863204956055, "global_step": 521469, "epoch": 6282} {"train_loss": -27.174253463745117, "global_step": 521470, "epoch": 6282} {"train_loss": -27.593774795532227, "global_step": 521471, "epoch": 6282} {"train_loss": -26.96443748474121, "global_step": 521472, "epoch": 6282} {"train_loss": -26.685169219970703, "global_step": 521473, "epoch": 6282} {"train_loss": -27.68291664123535, "global_step": 521474, "epoch": 6282} {"train_loss": -27.606094360351562, "global_step": 521475, "epoch": 6282} {"train_loss": -27.198278427124023, "global_step": 521476, "epoch": 6282} {"train_loss": -27.456701278686523, "global_step": 521477, "epoch": 6282} {"train_loss": -27.35694694519043, "global_step": 521478, "epoch": 6282} {"train_loss": -27.61042594909668, "global_step": 521479, "epoch": 6282} {"train_loss": -27.101049423217773, "global_step": 521480, "epoch": 6282} {"train_loss": -27.56853675842285, "global_step": 521481, "epoch": 6282} {"train_loss": -27.372770309448242, "global_step": 521482, "epoch": 6282} {"train_loss": -27.631601333618164, "global_step": 521483, "epoch": 6282} {"train_loss": -27.481698989868164, "global_step": 521484, "epoch": 6282} {"train_loss": -27.441425323486328, "global_step": 521485, "epoch": 6282} {"train_loss": -27.23761558532715, "global_step": 521486, "epoch": 6282} {"train_loss": -27.136945724487305, "global_step": 521487, "epoch": 6282} {"train_loss": -27.35986792323101, "global_step": 521488, "epoch": 6282, "val_loss": 6629733.0} {"train_loss": -27.265228271484375, "global_step": 521489, "epoch": 6283} {"train_loss": -27.061975479125977, "global_step": 521490, "epoch": 6283} {"train_loss": -27.327001571655273, "global_step": 521491, "epoch": 6283} {"train_loss": -27.188831329345703, "global_step": 521492, "epoch": 6283} {"train_loss": -27.52549171447754, "global_step": 521493, "epoch": 6283} {"train_loss": -27.185758590698242, "global_step": 521494, "epoch": 6283} {"train_loss": -27.43682861328125, "global_step": 521495, "epoch": 6283} {"train_loss": -26.916656494140625, "global_step": 521496, "epoch": 6283} {"train_loss": -27.315439224243164, "global_step": 521497, "epoch": 6283} {"train_loss": -27.668094635009766, "global_step": 521498, "epoch": 6283} {"train_loss": -26.842987060546875, "global_step": 521499, "epoch": 6283} {"train_loss": -27.330244064331055, "global_step": 521500, "epoch": 6283} {"train_loss": -27.282093048095703, "global_step": 521501, "epoch": 6283} {"train_loss": -27.1994686126709, "global_step": 521502, "epoch": 6283} {"train_loss": -26.9676456451416, "global_step": 521503, "epoch": 6283} {"train_loss": -27.458393096923828, "global_step": 521504, "epoch": 6283} {"train_loss": -27.13190269470215, "global_step": 521505, "epoch": 6283} {"train_loss": -27.4385929107666, "global_step": 521506, "epoch": 6283} {"train_loss": -27.590301513671875, "global_step": 521507, "epoch": 6283} {"train_loss": -27.662067413330078, "global_step": 521508, "epoch": 6283} {"train_loss": -27.105329513549805, "global_step": 521509, "epoch": 6283} {"train_loss": -27.23917007446289, "global_step": 521510, "epoch": 6283} {"train_loss": -27.25526237487793, "global_step": 521511, "epoch": 6283} {"train_loss": -27.283557891845703, "global_step": 521512, "epoch": 6283} {"train_loss": -27.482709884643555, "global_step": 521513, "epoch": 6283} {"train_loss": -27.67816734313965, "global_step": 521514, "epoch": 6283} {"train_loss": -27.228845596313477, "global_step": 521515, "epoch": 6283} {"train_loss": -27.350570678710938, "global_step": 521516, "epoch": 6283} {"train_loss": -27.654285430908203, "global_step": 521517, "epoch": 6283} {"train_loss": -27.4693546295166, "global_step": 521518, "epoch": 6283} {"train_loss": -27.888071060180664, "global_step": 521519, "epoch": 6283} {"train_loss": -27.94148063659668, "global_step": 521520, "epoch": 6283} {"train_loss": -27.218738555908203, "global_step": 521521, "epoch": 6283} {"train_loss": -27.100366592407227, "global_step": 521522, "epoch": 6283} {"train_loss": -27.726011276245117, "global_step": 521523, "epoch": 6283} {"train_loss": -27.835376739501953, "global_step": 521524, "epoch": 6283} {"train_loss": -27.94244384765625, "global_step": 521525, "epoch": 6283} {"train_loss": -27.755355834960938, "global_step": 521526, "epoch": 6283} {"train_loss": -27.563827514648438, "global_step": 521527, "epoch": 6283} {"train_loss": -27.357275009155273, "global_step": 521528, "epoch": 6283} {"train_loss": -27.681537628173828, "global_step": 521529, "epoch": 6283} {"train_loss": -27.611225128173828, "global_step": 521530, "epoch": 6283} {"train_loss": -27.580121994018555, "global_step": 521531, "epoch": 6283} {"train_loss": -27.633230209350586, "global_step": 521532, "epoch": 6283} {"train_loss": -27.659849166870117, "global_step": 521533, "epoch": 6283} {"train_loss": -27.600482940673828, "global_step": 521534, "epoch": 6283} {"train_loss": -27.447223663330078, "global_step": 521535, "epoch": 6283} {"train_loss": -28.15596580505371, "global_step": 521536, "epoch": 6283} {"train_loss": -27.418066024780273, "global_step": 521537, "epoch": 6283} {"train_loss": -27.72663688659668, "global_step": 521538, "epoch": 6283} {"train_loss": -27.640539169311523, "global_step": 521539, "epoch": 6283} {"train_loss": -27.9593448638916, "global_step": 521540, "epoch": 6283} {"train_loss": -27.468891143798828, "global_step": 521541, "epoch": 6283} {"train_loss": -27.857892990112305, "global_step": 521542, "epoch": 6283} {"train_loss": -27.533893585205078, "global_step": 521543, "epoch": 6283} {"train_loss": -27.32063865661621, "global_step": 521544, "epoch": 6283} {"train_loss": -27.153959274291992, "global_step": 521545, "epoch": 6283} {"train_loss": -27.396329879760742, "global_step": 521546, "epoch": 6283} {"train_loss": -27.36319923400879, "global_step": 521547, "epoch": 6283} {"train_loss": -27.1671142578125, "global_step": 521548, "epoch": 6283} {"train_loss": -27.0145320892334, "global_step": 521549, "epoch": 6283} {"train_loss": -27.013879776000977, "global_step": 521550, "epoch": 6283} {"train_loss": -27.39692497253418, "global_step": 521551, "epoch": 6283} {"train_loss": -27.467121124267578, "global_step": 521552, "epoch": 6283} {"train_loss": -27.511219024658203, "global_step": 521553, "epoch": 6283} {"train_loss": -27.2586669921875, "global_step": 521554, "epoch": 6283} {"train_loss": -27.329147338867188, "global_step": 521555, "epoch": 6283} {"train_loss": -27.495542526245117, "global_step": 521556, "epoch": 6283} {"train_loss": -27.75296974182129, "global_step": 521557, "epoch": 6283} {"train_loss": -27.39041519165039, "global_step": 521558, "epoch": 6283} {"train_loss": -27.69349479675293, "global_step": 521559, "epoch": 6283} {"train_loss": -27.634475708007812, "global_step": 521560, "epoch": 6283} {"train_loss": -27.7484130859375, "global_step": 521561, "epoch": 6283} {"train_loss": -27.306350708007812, "global_step": 521562, "epoch": 6283} {"train_loss": -27.46747398376465, "global_step": 521563, "epoch": 6283} {"train_loss": -27.011932373046875, "global_step": 521564, "epoch": 6283} {"train_loss": -27.433670043945312, "global_step": 521565, "epoch": 6283} {"train_loss": -27.51814079284668, "global_step": 521566, "epoch": 6283} {"train_loss": -27.614276885986328, "global_step": 521567, "epoch": 6283} {"train_loss": -27.68720054626465, "global_step": 521568, "epoch": 6283} {"train_loss": -27.43079948425293, "global_step": 521569, "epoch": 6283} {"train_loss": -27.445911407470703, "global_step": 521570, "epoch": 6283} {"train_loss": -27.441104751035393, "global_step": 521571, "epoch": 6283, "val_loss": 6614243.0} {"train_loss": -27.269514083862305, "global_step": 521572, "epoch": 6284} {"train_loss": -26.632831573486328, "global_step": 521573, "epoch": 6284} {"train_loss": -26.9361515045166, "global_step": 521574, "epoch": 6284} {"train_loss": -27.710086822509766, "global_step": 521575, "epoch": 6284} {"train_loss": -27.23316764831543, "global_step": 521576, "epoch": 6284} {"train_loss": -27.308029174804688, "global_step": 521577, "epoch": 6284} {"train_loss": -27.50296401977539, "global_step": 521578, "epoch": 6284} {"train_loss": -27.16486167907715, "global_step": 521579, "epoch": 6284} {"train_loss": -27.317968368530273, "global_step": 521580, "epoch": 6284} {"train_loss": -27.488611221313477, "global_step": 521581, "epoch": 6284} {"train_loss": -27.620046615600586, "global_step": 521582, "epoch": 6284} {"train_loss": -27.31642723083496, "global_step": 521583, "epoch": 6284} {"train_loss": -27.61195945739746, "global_step": 521584, "epoch": 6284} {"train_loss": -27.822418212890625, "global_step": 521585, "epoch": 6284} {"train_loss": -27.35491943359375, "global_step": 521586, "epoch": 6284} {"train_loss": -27.315332412719727, "global_step": 521587, "epoch": 6284} {"train_loss": -27.134475708007812, "global_step": 521588, "epoch": 6284} {"train_loss": -27.921133041381836, "global_step": 521589, "epoch": 6284} {"train_loss": -27.674762725830078, "global_step": 521590, "epoch": 6284} {"train_loss": -27.976282119750977, "global_step": 521591, "epoch": 6284} {"train_loss": -27.3714542388916, "global_step": 521592, "epoch": 6284} {"train_loss": -27.69722557067871, "global_step": 521593, "epoch": 6284} {"train_loss": -27.423633575439453, "global_step": 521594, "epoch": 6284} {"train_loss": -27.313451766967773, "global_step": 521595, "epoch": 6284} {"train_loss": -27.91448974609375, "global_step": 521596, "epoch": 6284} {"train_loss": -27.863187789916992, "global_step": 521597, "epoch": 6284} {"train_loss": -27.56561279296875, "global_step": 521598, "epoch": 6284} {"train_loss": -27.538846969604492, "global_step": 521599, "epoch": 6284} {"train_loss": -27.5277099609375, "global_step": 521600, "epoch": 6284} {"train_loss": -27.365652084350586, "global_step": 521601, "epoch": 6284} {"train_loss": -27.536176681518555, "global_step": 521602, "epoch": 6284} {"train_loss": -27.861774444580078, "global_step": 521603, "epoch": 6284} {"train_loss": -27.51725196838379, "global_step": 521604, "epoch": 6284} {"train_loss": -27.373327255249023, "global_step": 521605, "epoch": 6284} {"train_loss": -27.51515769958496, "global_step": 521606, "epoch": 6284} {"train_loss": -27.31485366821289, "global_step": 521607, "epoch": 6284} {"train_loss": -27.6568603515625, "global_step": 521608, "epoch": 6284} {"train_loss": -27.4012393951416, "global_step": 521609, "epoch": 6284} {"train_loss": -27.892505645751953, "global_step": 521610, "epoch": 6284} {"train_loss": -27.722742080688477, "global_step": 521611, "epoch": 6284} {"train_loss": -27.480680465698242, "global_step": 521612, "epoch": 6284} {"train_loss": -27.60052490234375, "global_step": 521613, "epoch": 6284} {"train_loss": -27.634313583374023, "global_step": 521614, "epoch": 6284} {"train_loss": -27.782068252563477, "global_step": 521615, "epoch": 6284} {"train_loss": -27.412012100219727, "global_step": 521616, "epoch": 6284} {"train_loss": -27.630537033081055, "global_step": 521617, "epoch": 6284} {"train_loss": -27.534757614135742, "global_step": 521618, "epoch": 6284} {"train_loss": -27.65273094177246, "global_step": 521619, "epoch": 6284} {"train_loss": -27.594629287719727, "global_step": 521620, "epoch": 6284} {"train_loss": -28.011457443237305, "global_step": 521621, "epoch": 6284} {"train_loss": -27.570117950439453, "global_step": 521622, "epoch": 6284} {"train_loss": -27.75922966003418, "global_step": 521623, "epoch": 6284} {"train_loss": -27.696359634399414, "global_step": 521624, "epoch": 6284} {"train_loss": -27.622766494750977, "global_step": 521625, "epoch": 6284} {"train_loss": -27.393970489501953, "global_step": 521626, "epoch": 6284} {"train_loss": -27.916147232055664, "global_step": 521627, "epoch": 6284} {"train_loss": -27.752649307250977, "global_step": 521628, "epoch": 6284} {"train_loss": -27.48227310180664, "global_step": 521629, "epoch": 6284} {"train_loss": -27.544788360595703, "global_step": 521630, "epoch": 6284} {"train_loss": -27.704730987548828, "global_step": 521631, "epoch": 6284} {"train_loss": -27.374866485595703, "global_step": 521632, "epoch": 6284} {"train_loss": -27.6536922454834, "global_step": 521633, "epoch": 6284} {"train_loss": -27.521656036376953, "global_step": 521634, "epoch": 6284} {"train_loss": -27.745336532592773, "global_step": 521635, "epoch": 6284} {"train_loss": -27.818212509155273, "global_step": 521636, "epoch": 6284} {"train_loss": -27.751920700073242, "global_step": 521637, "epoch": 6284} {"train_loss": -27.87156105041504, "global_step": 521638, "epoch": 6284} {"train_loss": -27.530319213867188, "global_step": 521639, "epoch": 6284} {"train_loss": -27.76031494140625, "global_step": 521640, "epoch": 6284} {"train_loss": -27.465839385986328, "global_step": 521641, "epoch": 6284} {"train_loss": -27.744464874267578, "global_step": 521642, "epoch": 6284} {"train_loss": -27.302234649658203, "global_step": 521643, "epoch": 6284} {"train_loss": -27.7619571685791, "global_step": 521644, "epoch": 6284} {"train_loss": -27.783008575439453, "global_step": 521645, "epoch": 6284} {"train_loss": -27.510740280151367, "global_step": 521646, "epoch": 6284} {"train_loss": -27.29119300842285, "global_step": 521647, "epoch": 6284} {"train_loss": -27.2012882232666, "global_step": 521648, "epoch": 6284} {"train_loss": -28.0621395111084, "global_step": 521649, "epoch": 6284} {"train_loss": -27.394622802734375, "global_step": 521650, "epoch": 6284} {"train_loss": -27.77100944519043, "global_step": 521651, "epoch": 6284} {"train_loss": -27.406808853149414, "global_step": 521652, "epoch": 6284} {"train_loss": -27.78277587890625, "global_step": 521653, "epoch": 6284} {"train_loss": -27.561749952385224, "global_step": 521654, "epoch": 6284, "val_loss": 6657930.0} {"train_loss": -26.268722534179688, "global_step": 521655, "epoch": 6285} {"train_loss": -25.180334091186523, "global_step": 521656, "epoch": 6285} {"train_loss": -23.051536560058594, "global_step": 521657, "epoch": 6285} {"train_loss": -24.58434295654297, "global_step": 521658, "epoch": 6285} {"train_loss": -25.614273071289062, "global_step": 521659, "epoch": 6285} {"train_loss": -24.687118530273438, "global_step": 521660, "epoch": 6285} {"train_loss": -25.891157150268555, "global_step": 521661, "epoch": 6285} {"train_loss": -26.234323501586914, "global_step": 521662, "epoch": 6285} {"train_loss": -26.305784225463867, "global_step": 521663, "epoch": 6285} {"train_loss": -26.478620529174805, "global_step": 521664, "epoch": 6285} {"train_loss": -26.5238094329834, "global_step": 521665, "epoch": 6285} {"train_loss": -26.342008590698242, "global_step": 521666, "epoch": 6285} {"train_loss": -26.44818687438965, "global_step": 521667, "epoch": 6285} {"train_loss": -26.573627471923828, "global_step": 521668, "epoch": 6285} {"train_loss": -26.09537124633789, "global_step": 521669, "epoch": 6285} {"train_loss": -26.526996612548828, "global_step": 521670, "epoch": 6285} {"train_loss": -26.87583351135254, "global_step": 521671, "epoch": 6285} {"train_loss": -26.96034049987793, "global_step": 521672, "epoch": 6285} {"train_loss": -26.948917388916016, "global_step": 521673, "epoch": 6285} {"train_loss": -26.825536727905273, "global_step": 521674, "epoch": 6285} {"train_loss": -26.73866081237793, "global_step": 521675, "epoch": 6285} {"train_loss": -26.993972778320312, "global_step": 521676, "epoch": 6285} {"train_loss": -26.66275978088379, "global_step": 521677, "epoch": 6285} {"train_loss": -26.91948890686035, "global_step": 521678, "epoch": 6285} {"train_loss": -26.95903968811035, "global_step": 521679, "epoch": 6285} {"train_loss": -26.877965927124023, "global_step": 521680, "epoch": 6285} {"train_loss": -27.468036651611328, "global_step": 521681, "epoch": 6285} {"train_loss": -26.912857055664062, "global_step": 521682, "epoch": 6285} {"train_loss": -27.045989990234375, "global_step": 521683, "epoch": 6285} {"train_loss": -26.883874893188477, "global_step": 521684, "epoch": 6285} {"train_loss": -27.11795425415039, "global_step": 521685, "epoch": 6285} {"train_loss": -27.066974639892578, "global_step": 521686, "epoch": 6285} {"train_loss": -27.219099044799805, "global_step": 521687, "epoch": 6285} {"train_loss": -26.920507431030273, "global_step": 521688, "epoch": 6285} {"train_loss": -27.17093276977539, "global_step": 521689, "epoch": 6285} {"train_loss": -27.224531173706055, "global_step": 521690, "epoch": 6285} {"train_loss": -27.115982055664062, "global_step": 521691, "epoch": 6285} {"train_loss": -27.22269058227539, "global_step": 521692, "epoch": 6285} {"train_loss": -27.046039581298828, "global_step": 521693, "epoch": 6285} {"train_loss": -27.087568283081055, "global_step": 521694, "epoch": 6285} {"train_loss": -27.040359497070312, "global_step": 521695, "epoch": 6285} {"train_loss": -27.45875358581543, "global_step": 521696, "epoch": 6285} {"train_loss": -27.202070236206055, "global_step": 521697, "epoch": 6285} {"train_loss": -27.305490493774414, "global_step": 521698, "epoch": 6285} {"train_loss": -27.329198837280273, "global_step": 521699, "epoch": 6285} {"train_loss": -27.707944869995117, "global_step": 521700, "epoch": 6285} {"train_loss": -27.224689483642578, "global_step": 521701, "epoch": 6285} {"train_loss": -27.49820327758789, "global_step": 521702, "epoch": 6285} {"train_loss": -27.617740631103516, "global_step": 521703, "epoch": 6285} {"train_loss": -27.749998092651367, "global_step": 521704, "epoch": 6285} {"train_loss": -27.52191162109375, "global_step": 521705, "epoch": 6285} {"train_loss": -27.455036163330078, "global_step": 521706, "epoch": 6285} {"train_loss": -27.922895431518555, "global_step": 521707, "epoch": 6285} {"train_loss": -27.704294204711914, "global_step": 521708, "epoch": 6285} {"train_loss": -27.64458656311035, "global_step": 521709, "epoch": 6285} {"train_loss": -27.655561447143555, "global_step": 521710, "epoch": 6285} {"train_loss": -27.784215927124023, "global_step": 521711, "epoch": 6285} {"train_loss": -27.496387481689453, "global_step": 521712, "epoch": 6285} {"train_loss": -27.510839462280273, "global_step": 521713, "epoch": 6285} {"train_loss": -27.459625244140625, "global_step": 521714, "epoch": 6285} {"train_loss": -27.338171005249023, "global_step": 521715, "epoch": 6285} {"train_loss": -27.8013916015625, "global_step": 521716, "epoch": 6285} {"train_loss": -27.882680892944336, "global_step": 521717, "epoch": 6285} {"train_loss": -27.80890464782715, "global_step": 521718, "epoch": 6285} {"train_loss": -28.16212272644043, "global_step": 521719, "epoch": 6285} {"train_loss": -27.392105102539062, "global_step": 521720, "epoch": 6285} {"train_loss": -27.802099227905273, "global_step": 521721, "epoch": 6285} {"train_loss": -27.524368286132812, "global_step": 521722, "epoch": 6285} {"train_loss": -27.409414291381836, "global_step": 521723, "epoch": 6285} {"train_loss": -27.596424102783203, "global_step": 521724, "epoch": 6285} {"train_loss": -27.311695098876953, "global_step": 521725, "epoch": 6285} {"train_loss": -27.383834838867188, "global_step": 521726, "epoch": 6285} {"train_loss": -27.610754013061523, "global_step": 521727, "epoch": 6285} {"train_loss": -27.82892417907715, "global_step": 521728, "epoch": 6285} {"train_loss": -27.756635665893555, "global_step": 521729, "epoch": 6285} {"train_loss": -27.639301300048828, "global_step": 521730, "epoch": 6285} {"train_loss": -27.635467529296875, "global_step": 521731, "epoch": 6285} {"train_loss": -27.931055068969727, "global_step": 521732, "epoch": 6285} {"train_loss": -28.137516021728516, "global_step": 521733, "epoch": 6285} {"train_loss": -27.7706241607666, "global_step": 521734, "epoch": 6285} {"train_loss": -27.672870635986328, "global_step": 521735, "epoch": 6285} {"train_loss": -27.959552764892578, "global_step": 521736, "epoch": 6285} {"train_loss": -27.09022703515478, "global_step": 521737, "epoch": 6285, "val_loss": 6617343.0} {"train_loss": -26.785181045532227, "global_step": 521738, "epoch": 6286} {"train_loss": -25.515539169311523, "global_step": 521739, "epoch": 6286} {"train_loss": -25.934234619140625, "global_step": 521740, "epoch": 6286} {"train_loss": -26.8802490234375, "global_step": 521741, "epoch": 6286} {"train_loss": -26.4340877532959, "global_step": 521742, "epoch": 6286} {"train_loss": -26.934412002563477, "global_step": 521743, "epoch": 6286} {"train_loss": -26.953327178955078, "global_step": 521744, "epoch": 6286} {"train_loss": -26.535131454467773, "global_step": 521745, "epoch": 6286} {"train_loss": -26.940704345703125, "global_step": 521746, "epoch": 6286} {"train_loss": -27.19679832458496, "global_step": 521747, "epoch": 6286} {"train_loss": -26.910736083984375, "global_step": 521748, "epoch": 6286} {"train_loss": -27.381683349609375, "global_step": 521749, "epoch": 6286} {"train_loss": -27.138904571533203, "global_step": 521750, "epoch": 6286} {"train_loss": -27.095556259155273, "global_step": 521751, "epoch": 6286} {"train_loss": -27.259033203125, "global_step": 521752, "epoch": 6286} {"train_loss": -27.182897567749023, "global_step": 521753, "epoch": 6286} {"train_loss": -27.44329833984375, "global_step": 521754, "epoch": 6286} {"train_loss": -27.09925651550293, "global_step": 521755, "epoch": 6286} {"train_loss": -27.165815353393555, "global_step": 521756, "epoch": 6286} {"train_loss": -27.373960494995117, "global_step": 521757, "epoch": 6286} {"train_loss": -27.291107177734375, "global_step": 521758, "epoch": 6286} {"train_loss": -27.336597442626953, "global_step": 521759, "epoch": 6286} {"train_loss": -27.612905502319336, "global_step": 521760, "epoch": 6286} {"train_loss": -27.538604736328125, "global_step": 521761, "epoch": 6286} {"train_loss": -27.381378173828125, "global_step": 521762, "epoch": 6286} {"train_loss": -27.64253044128418, "global_step": 521763, "epoch": 6286} {"train_loss": -27.75070571899414, "global_step": 521764, "epoch": 6286} {"train_loss": -27.586999893188477, "global_step": 521765, "epoch": 6286} {"train_loss": -27.677936553955078, "global_step": 521766, "epoch": 6286} {"train_loss": -27.142566680908203, "global_step": 521767, "epoch": 6286} {"train_loss": -27.478580474853516, "global_step": 521768, "epoch": 6286} {"train_loss": -27.759632110595703, "global_step": 521769, "epoch": 6286} {"train_loss": -27.2630672454834, "global_step": 521770, "epoch": 6286} {"train_loss": -27.725147247314453, "global_step": 521771, "epoch": 6286} {"train_loss": -27.569625854492188, "global_step": 521772, "epoch": 6286} {"train_loss": -27.892047882080078, "global_step": 521773, "epoch": 6286} {"train_loss": -27.493078231811523, "global_step": 521774, "epoch": 6286} {"train_loss": -27.889541625976562, "global_step": 521775, "epoch": 6286} {"train_loss": -27.539819717407227, "global_step": 521776, "epoch": 6286} {"train_loss": -27.768951416015625, "global_step": 521777, "epoch": 6286} {"train_loss": -27.637313842773438, "global_step": 521778, "epoch": 6286} {"train_loss": -28.163105010986328, "global_step": 521779, "epoch": 6286} {"train_loss": -27.338031768798828, "global_step": 521780, "epoch": 6286} {"train_loss": -27.8159236907959, "global_step": 521781, "epoch": 6286} {"train_loss": -27.45770835876465, "global_step": 521782, "epoch": 6286} {"train_loss": -27.59352684020996, "global_step": 521783, "epoch": 6286} {"train_loss": -27.7062931060791, "global_step": 521784, "epoch": 6286} {"train_loss": -27.66792106628418, "global_step": 521785, "epoch": 6286} {"train_loss": -27.614294052124023, "global_step": 521786, "epoch": 6286} {"train_loss": -27.169137954711914, "global_step": 521787, "epoch": 6286} {"train_loss": -26.8919677734375, "global_step": 521788, "epoch": 6286} {"train_loss": -26.200153350830078, "global_step": 521789, "epoch": 6286} {"train_loss": -25.748462677001953, "global_step": 521790, "epoch": 6286} {"train_loss": -26.41810417175293, "global_step": 521791, "epoch": 6286} {"train_loss": -27.340988159179688, "global_step": 521792, "epoch": 6286} {"train_loss": -26.864683151245117, "global_step": 521793, "epoch": 6286} {"train_loss": -26.308536529541016, "global_step": 521794, "epoch": 6286} {"train_loss": -27.134174346923828, "global_step": 521795, "epoch": 6286} {"train_loss": -26.569860458374023, "global_step": 521796, "epoch": 6286} {"train_loss": -27.106916427612305, "global_step": 521797, "epoch": 6286} {"train_loss": -27.010526657104492, "global_step": 521798, "epoch": 6286} {"train_loss": -27.337133407592773, "global_step": 521799, "epoch": 6286} {"train_loss": -27.10402488708496, "global_step": 521800, "epoch": 6286} {"train_loss": -27.813323974609375, "global_step": 521801, "epoch": 6286} {"train_loss": -26.691638946533203, "global_step": 521802, "epoch": 6286} {"train_loss": -27.250518798828125, "global_step": 521803, "epoch": 6286} {"train_loss": -27.274381637573242, "global_step": 521804, "epoch": 6286} {"train_loss": -27.417016983032227, "global_step": 521805, "epoch": 6286} {"train_loss": -27.141586303710938, "global_step": 521806, "epoch": 6286} {"train_loss": -27.16676902770996, "global_step": 521807, "epoch": 6286} {"train_loss": -27.033477783203125, "global_step": 521808, "epoch": 6286} {"train_loss": -27.146991729736328, "global_step": 521809, "epoch": 6286} {"train_loss": -27.261493682861328, "global_step": 521810, "epoch": 6286} {"train_loss": -27.386281967163086, "global_step": 521811, "epoch": 6286} {"train_loss": -27.774621963500977, "global_step": 521812, "epoch": 6286} {"train_loss": -27.148473739624023, "global_step": 521813, "epoch": 6286} {"train_loss": -27.449005126953125, "global_step": 521814, "epoch": 6286} {"train_loss": -27.530820846557617, "global_step": 521815, "epoch": 6286} {"train_loss": -27.653745651245117, "global_step": 521816, "epoch": 6286} {"train_loss": -27.495197296142578, "global_step": 521817, "epoch": 6286} {"train_loss": -27.67852783203125, "global_step": 521818, "epoch": 6286} {"train_loss": -27.40402603149414, "global_step": 521819, "epoch": 6286} {"train_loss": -27.243440375270612, "global_step": 521820, "epoch": 6286, "val_loss": 6639121.5} {"train_loss": -27.403839111328125, "global_step": 521821, "epoch": 6287} {"train_loss": -27.469690322875977, "global_step": 521822, "epoch": 6287} {"train_loss": -27.5743350982666, "global_step": 521823, "epoch": 6287} {"train_loss": -27.332565307617188, "global_step": 521824, "epoch": 6287} {"train_loss": -27.171838760375977, "global_step": 521825, "epoch": 6287} {"train_loss": -27.442493438720703, "global_step": 521826, "epoch": 6287} {"train_loss": -27.269453048706055, "global_step": 521827, "epoch": 6287} {"train_loss": -27.52473258972168, "global_step": 521828, "epoch": 6287} {"train_loss": -27.349201202392578, "global_step": 521829, "epoch": 6287} {"train_loss": -27.853124618530273, "global_step": 521830, "epoch": 6287} {"train_loss": -27.5678768157959, "global_step": 521831, "epoch": 6287} {"train_loss": -27.483184814453125, "global_step": 521832, "epoch": 6287} {"train_loss": -27.56113624572754, "global_step": 521833, "epoch": 6287} {"train_loss": -27.788379669189453, "global_step": 521834, "epoch": 6287} {"train_loss": -27.534000396728516, "global_step": 521835, "epoch": 6287} {"train_loss": -27.324594497680664, "global_step": 521836, "epoch": 6287} {"train_loss": -27.425947189331055, "global_step": 521837, "epoch": 6287} {"train_loss": -27.601734161376953, "global_step": 521838, "epoch": 6287} {"train_loss": -27.995908737182617, "global_step": 521839, "epoch": 6287} {"train_loss": -27.717798233032227, "global_step": 521840, "epoch": 6287} {"train_loss": -27.814306259155273, "global_step": 521841, "epoch": 6287} {"train_loss": -27.803205490112305, "global_step": 521842, "epoch": 6287} {"train_loss": -27.305906295776367, "global_step": 521843, "epoch": 6287} {"train_loss": -27.570667266845703, "global_step": 521844, "epoch": 6287} {"train_loss": -27.7412109375, "global_step": 521845, "epoch": 6287} {"train_loss": -27.563583374023438, "global_step": 521846, "epoch": 6287} {"train_loss": -27.571563720703125, "global_step": 521847, "epoch": 6287} {"train_loss": -27.275909423828125, "global_step": 521848, "epoch": 6287} {"train_loss": -27.906982421875, "global_step": 521849, "epoch": 6287} {"train_loss": -27.633056640625, "global_step": 521850, "epoch": 6287} {"train_loss": -27.22731590270996, "global_step": 521851, "epoch": 6287} {"train_loss": -27.73024559020996, "global_step": 521852, "epoch": 6287} {"train_loss": -27.67841911315918, "global_step": 521853, "epoch": 6287} {"train_loss": -27.795385360717773, "global_step": 521854, "epoch": 6287} {"train_loss": -27.65547752380371, "global_step": 521855, "epoch": 6287} {"train_loss": -27.1518611907959, "global_step": 521856, "epoch": 6287} {"train_loss": -27.38128089904785, "global_step": 521857, "epoch": 6287} {"train_loss": -27.638593673706055, "global_step": 521858, "epoch": 6287} {"train_loss": -27.513044357299805, "global_step": 521859, "epoch": 6287} {"train_loss": -27.028594970703125, "global_step": 521860, "epoch": 6287} {"train_loss": -27.47205924987793, "global_step": 521861, "epoch": 6287} {"train_loss": -27.103946685791016, "global_step": 521862, "epoch": 6287} {"train_loss": -27.67828941345215, "global_step": 521863, "epoch": 6287} {"train_loss": -27.535810470581055, "global_step": 521864, "epoch": 6287} {"train_loss": -27.275854110717773, "global_step": 521865, "epoch": 6287} {"train_loss": -27.186689376831055, "global_step": 521866, "epoch": 6287} {"train_loss": -27.665624618530273, "global_step": 521867, "epoch": 6287} {"train_loss": -27.4831485748291, "global_step": 521868, "epoch": 6287} {"train_loss": -27.542551040649414, "global_step": 521869, "epoch": 6287} {"train_loss": -27.590106964111328, "global_step": 521870, "epoch": 6287} {"train_loss": -27.445722579956055, "global_step": 521871, "epoch": 6287} {"train_loss": -27.4398193359375, "global_step": 521872, "epoch": 6287} {"train_loss": -27.50775718688965, "global_step": 521873, "epoch": 6287} {"train_loss": -27.843297958374023, "global_step": 521874, "epoch": 6287} {"train_loss": -27.75709342956543, "global_step": 521875, "epoch": 6287} {"train_loss": -27.451635360717773, "global_step": 521876, "epoch": 6287} {"train_loss": -27.895557403564453, "global_step": 521877, "epoch": 6287} {"train_loss": -27.505483627319336, "global_step": 521878, "epoch": 6287} {"train_loss": -27.175098419189453, "global_step": 521879, "epoch": 6287} {"train_loss": -27.683013916015625, "global_step": 521880, "epoch": 6287} {"train_loss": -27.316808700561523, "global_step": 521881, "epoch": 6287} {"train_loss": -27.54713249206543, "global_step": 521882, "epoch": 6287} {"train_loss": -27.53737449645996, "global_step": 521883, "epoch": 6287} {"train_loss": -27.4888858795166, "global_step": 521884, "epoch": 6287} {"train_loss": -27.20625114440918, "global_step": 521885, "epoch": 6287} {"train_loss": -27.367542266845703, "global_step": 521886, "epoch": 6287} {"train_loss": -27.522022247314453, "global_step": 521887, "epoch": 6287} {"train_loss": -27.530370712280273, "global_step": 521888, "epoch": 6287} {"train_loss": -27.083654403686523, "global_step": 521889, "epoch": 6287} {"train_loss": -27.715402603149414, "global_step": 521890, "epoch": 6287} {"train_loss": -26.99298667907715, "global_step": 521891, "epoch": 6287} {"train_loss": -27.506179809570312, "global_step": 521892, "epoch": 6287} {"train_loss": -27.567041397094727, "global_step": 521893, "epoch": 6287} {"train_loss": -27.104841232299805, "global_step": 521894, "epoch": 6287} {"train_loss": -27.297903060913086, "global_step": 521895, "epoch": 6287} {"train_loss": -26.9533748626709, "global_step": 521896, "epoch": 6287} {"train_loss": -27.45197105407715, "global_step": 521897, "epoch": 6287} {"train_loss": -26.931821823120117, "global_step": 521898, "epoch": 6287} {"train_loss": -27.738037109375, "global_step": 521899, "epoch": 6287} {"train_loss": -27.55014991760254, "global_step": 521900, "epoch": 6287} {"train_loss": -27.506195068359375, "global_step": 521901, "epoch": 6287} {"train_loss": -27.2889404296875, "global_step": 521902, "epoch": 6287} {"train_loss": -27.475334190460572, "global_step": 521903, "epoch": 6287, "val_loss": 6615304.5} {"train_loss": -27.003564834594727, "global_step": 521904, "epoch": 6288} {"train_loss": -26.451589584350586, "global_step": 521905, "epoch": 6288} {"train_loss": -26.429418563842773, "global_step": 521906, "epoch": 6288} {"train_loss": -27.110107421875, "global_step": 521907, "epoch": 6288} {"train_loss": -26.9504451751709, "global_step": 521908, "epoch": 6288} {"train_loss": -26.747314453125, "global_step": 521909, "epoch": 6288} {"train_loss": -26.93899917602539, "global_step": 521910, "epoch": 6288} {"train_loss": -26.92970085144043, "global_step": 521911, "epoch": 6288} {"train_loss": -26.822900772094727, "global_step": 521912, "epoch": 6288} {"train_loss": -27.332677841186523, "global_step": 521913, "epoch": 6288} {"train_loss": -26.931583404541016, "global_step": 521914, "epoch": 6288} {"train_loss": -27.5123233795166, "global_step": 521915, "epoch": 6288} {"train_loss": -26.985687255859375, "global_step": 521916, "epoch": 6288} {"train_loss": -27.363056182861328, "global_step": 521917, "epoch": 6288} {"train_loss": -27.036590576171875, "global_step": 521918, "epoch": 6288} {"train_loss": -27.265350341796875, "global_step": 521919, "epoch": 6288} {"train_loss": -27.57069206237793, "global_step": 521920, "epoch": 6288} {"train_loss": -27.428815841674805, "global_step": 521921, "epoch": 6288} {"train_loss": -27.7246150970459, "global_step": 521922, "epoch": 6288} {"train_loss": -27.21710205078125, "global_step": 521923, "epoch": 6288} {"train_loss": -27.554767608642578, "global_step": 521924, "epoch": 6288} {"train_loss": -27.405689239501953, "global_step": 521925, "epoch": 6288} {"train_loss": -27.15863037109375, "global_step": 521926, "epoch": 6288} {"train_loss": -27.237548828125, "global_step": 521927, "epoch": 6288} {"train_loss": -27.21375846862793, "global_step": 521928, "epoch": 6288} {"train_loss": -27.374155044555664, "global_step": 521929, "epoch": 6288} {"train_loss": -27.973072052001953, "global_step": 521930, "epoch": 6288} {"train_loss": -27.402021408081055, "global_step": 521931, "epoch": 6288} {"train_loss": -27.219375610351562, "global_step": 521932, "epoch": 6288} {"train_loss": -27.987228393554688, "global_step": 521933, "epoch": 6288} {"train_loss": -27.69904899597168, "global_step": 521934, "epoch": 6288} {"train_loss": -27.55221939086914, "global_step": 521935, "epoch": 6288} {"train_loss": -27.518457412719727, "global_step": 521936, "epoch": 6288} {"train_loss": -27.400049209594727, "global_step": 521937, "epoch": 6288} {"train_loss": -28.089643478393555, "global_step": 521938, "epoch": 6288} {"train_loss": -27.47197914123535, "global_step": 521939, "epoch": 6288} {"train_loss": -27.6628475189209, "global_step": 521940, "epoch": 6288} {"train_loss": -27.868000030517578, "global_step": 521941, "epoch": 6288} {"train_loss": -27.832548141479492, "global_step": 521942, "epoch": 6288} {"train_loss": -27.53436851501465, "global_step": 521943, "epoch": 6288} {"train_loss": -27.462421417236328, "global_step": 521944, "epoch": 6288} {"train_loss": -27.623687744140625, "global_step": 521945, "epoch": 6288} {"train_loss": -27.42353630065918, "global_step": 521946, "epoch": 6288} {"train_loss": -27.355810165405273, "global_step": 521947, "epoch": 6288} {"train_loss": -27.634267807006836, "global_step": 521948, "epoch": 6288} {"train_loss": -27.860183715820312, "global_step": 521949, "epoch": 6288} {"train_loss": -27.214075088500977, "global_step": 521950, "epoch": 6288} {"train_loss": -27.5062313079834, "global_step": 521951, "epoch": 6288} {"train_loss": -27.2923583984375, "global_step": 521952, "epoch": 6288} {"train_loss": -27.535688400268555, "global_step": 521953, "epoch": 6288} {"train_loss": -27.658681869506836, "global_step": 521954, "epoch": 6288} {"train_loss": -27.157148361206055, "global_step": 521955, "epoch": 6288} {"train_loss": -27.602432250976562, "global_step": 521956, "epoch": 6288} {"train_loss": -27.518232345581055, "global_step": 521957, "epoch": 6288} {"train_loss": -27.5002384185791, "global_step": 521958, "epoch": 6288} {"train_loss": -27.801984786987305, "global_step": 521959, "epoch": 6288} {"train_loss": -27.455738067626953, "global_step": 521960, "epoch": 6288} {"train_loss": -27.751859664916992, "global_step": 521961, "epoch": 6288} {"train_loss": -27.53411865234375, "global_step": 521962, "epoch": 6288} {"train_loss": -27.295490264892578, "global_step": 521963, "epoch": 6288} {"train_loss": -27.546049118041992, "global_step": 521964, "epoch": 6288} {"train_loss": -27.7637939453125, "global_step": 521965, "epoch": 6288} {"train_loss": -27.788904190063477, "global_step": 521966, "epoch": 6288} {"train_loss": -28.06743812561035, "global_step": 521967, "epoch": 6288} {"train_loss": -27.701093673706055, "global_step": 521968, "epoch": 6288} {"train_loss": -28.087018966674805, "global_step": 521969, "epoch": 6288} {"train_loss": -27.768768310546875, "global_step": 521970, "epoch": 6288} {"train_loss": -27.678730010986328, "global_step": 521971, "epoch": 6288} {"train_loss": -27.57870864868164, "global_step": 521972, "epoch": 6288} {"train_loss": -27.463550567626953, "global_step": 521973, "epoch": 6288} {"train_loss": -28.038644790649414, "global_step": 521974, "epoch": 6288} {"train_loss": -27.72039794921875, "global_step": 521975, "epoch": 6288} {"train_loss": -27.482177734375, "global_step": 521976, "epoch": 6288} {"train_loss": -27.916608810424805, "global_step": 521977, "epoch": 6288} {"train_loss": -27.677541732788086, "global_step": 521978, "epoch": 6288} {"train_loss": -27.340158462524414, "global_step": 521979, "epoch": 6288} {"train_loss": -27.33173942565918, "global_step": 521980, "epoch": 6288} {"train_loss": -27.835386276245117, "global_step": 521981, "epoch": 6288} {"train_loss": -27.183889389038086, "global_step": 521982, "epoch": 6288} {"train_loss": -27.883508682250977, "global_step": 521983, "epoch": 6288} {"train_loss": -27.497589111328125, "global_step": 521984, "epoch": 6288} {"train_loss": -27.504486083984375, "global_step": 521985, "epoch": 6288} {"train_loss": -27.485652509942113, "global_step": 521986, "epoch": 6288, "val_loss": 6656322.0} {"train_loss": -23.571714401245117, "global_step": 521987, "epoch": 6289} {"train_loss": -20.779340744018555, "global_step": 521988, "epoch": 6289} {"train_loss": -25.665328979492188, "global_step": 521989, "epoch": 6289} {"train_loss": -23.994003295898438, "global_step": 521990, "epoch": 6289} {"train_loss": -25.0267391204834, "global_step": 521991, "epoch": 6289} {"train_loss": -25.887649536132812, "global_step": 521992, "epoch": 6289} {"train_loss": -24.655637741088867, "global_step": 521993, "epoch": 6289} {"train_loss": -26.110916137695312, "global_step": 521994, "epoch": 6289} {"train_loss": -26.036603927612305, "global_step": 521995, "epoch": 6289} {"train_loss": -24.939523696899414, "global_step": 521996, "epoch": 6289} {"train_loss": -25.601810455322266, "global_step": 521997, "epoch": 6289} {"train_loss": -25.679580688476562, "global_step": 521998, "epoch": 6289} {"train_loss": -26.113697052001953, "global_step": 521999, "epoch": 6289} {"train_loss": -25.903486251831055, "global_step": 522000, "epoch": 6289} {"train_loss": -26.134790420532227, "global_step": 522001, "epoch": 6289} {"train_loss": -26.08176612854004, "global_step": 522002, "epoch": 6289} {"train_loss": -26.129199981689453, "global_step": 522003, "epoch": 6289} {"train_loss": -26.561452865600586, "global_step": 522004, "epoch": 6289} {"train_loss": -26.418323516845703, "global_step": 522005, "epoch": 6289} {"train_loss": -26.621103286743164, "global_step": 522006, "epoch": 6289} {"train_loss": -26.286102294921875, "global_step": 522007, "epoch": 6289} {"train_loss": -26.572662353515625, "global_step": 522008, "epoch": 6289} {"train_loss": -26.68219566345215, "global_step": 522009, "epoch": 6289} {"train_loss": -26.41497230529785, "global_step": 522010, "epoch": 6289} {"train_loss": -26.556760787963867, "global_step": 522011, "epoch": 6289} {"train_loss": -26.5457820892334, "global_step": 522012, "epoch": 6289} {"train_loss": -26.9179744720459, "global_step": 522013, "epoch": 6289} {"train_loss": -26.813764572143555, "global_step": 522014, "epoch": 6289} {"train_loss": -26.923986434936523, "global_step": 522015, "epoch": 6289} {"train_loss": -26.771228790283203, "global_step": 522016, "epoch": 6289} {"train_loss": -26.561471939086914, "global_step": 522017, "epoch": 6289} {"train_loss": -26.7015323638916, "global_step": 522018, "epoch": 6289} {"train_loss": -26.94767189025879, "global_step": 522019, "epoch": 6289} {"train_loss": -26.724079132080078, "global_step": 522020, "epoch": 6289} {"train_loss": -27.054641723632812, "global_step": 522021, "epoch": 6289} {"train_loss": -27.186676025390625, "global_step": 522022, "epoch": 6289} {"train_loss": -27.018573760986328, "global_step": 522023, "epoch": 6289} {"train_loss": -27.040586471557617, "global_step": 522024, "epoch": 6289} {"train_loss": -27.175809860229492, "global_step": 522025, "epoch": 6289} {"train_loss": -27.10767936706543, "global_step": 522026, "epoch": 6289} {"train_loss": -27.22391128540039, "global_step": 522027, "epoch": 6289} {"train_loss": -27.428497314453125, "global_step": 522028, "epoch": 6289} {"train_loss": -27.14569091796875, "global_step": 522029, "epoch": 6289} {"train_loss": -27.002609252929688, "global_step": 522030, "epoch": 6289} {"train_loss": -27.196338653564453, "global_step": 522031, "epoch": 6289} {"train_loss": -26.990615844726562, "global_step": 522032, "epoch": 6289} {"train_loss": -27.129602432250977, "global_step": 522033, "epoch": 6289} {"train_loss": -27.28999137878418, "global_step": 522034, "epoch": 6289} {"train_loss": -27.19135093688965, "global_step": 522035, "epoch": 6289} {"train_loss": -27.237409591674805, "global_step": 522036, "epoch": 6289} {"train_loss": -27.16037940979004, "global_step": 522037, "epoch": 6289} {"train_loss": -27.050886154174805, "global_step": 522038, "epoch": 6289} {"train_loss": -27.297504425048828, "global_step": 522039, "epoch": 6289} {"train_loss": -27.4283390045166, "global_step": 522040, "epoch": 6289} {"train_loss": -27.248987197875977, "global_step": 522041, "epoch": 6289} {"train_loss": -27.289020538330078, "global_step": 522042, "epoch": 6289} {"train_loss": -27.359878540039062, "global_step": 522043, "epoch": 6289} {"train_loss": -27.565418243408203, "global_step": 522044, "epoch": 6289} {"train_loss": -27.82207679748535, "global_step": 522045, "epoch": 6289} {"train_loss": -27.598485946655273, "global_step": 522046, "epoch": 6289} {"train_loss": -27.5715274810791, "global_step": 522047, "epoch": 6289} {"train_loss": -27.24204444885254, "global_step": 522048, "epoch": 6289} {"train_loss": -27.462055206298828, "global_step": 522049, "epoch": 6289} {"train_loss": -27.251251220703125, "global_step": 522050, "epoch": 6289} {"train_loss": -27.431461334228516, "global_step": 522051, "epoch": 6289} {"train_loss": -27.374195098876953, "global_step": 522052, "epoch": 6289} {"train_loss": -27.007883071899414, "global_step": 522053, "epoch": 6289} {"train_loss": -27.0877742767334, "global_step": 522054, "epoch": 6289} {"train_loss": -27.210235595703125, "global_step": 522055, "epoch": 6289} {"train_loss": -27.414823532104492, "global_step": 522056, "epoch": 6289} {"train_loss": -27.49814224243164, "global_step": 522057, "epoch": 6289} {"train_loss": -27.176015853881836, "global_step": 522058, "epoch": 6289} {"train_loss": -27.023334503173828, "global_step": 522059, "epoch": 6289} {"train_loss": -27.638519287109375, "global_step": 522060, "epoch": 6289} {"train_loss": -26.961597442626953, "global_step": 522061, "epoch": 6289} {"train_loss": -27.04317283630371, "global_step": 522062, "epoch": 6289} {"train_loss": -27.192794799804688, "global_step": 522063, "epoch": 6289} {"train_loss": -27.153766632080078, "global_step": 522064, "epoch": 6289} {"train_loss": -27.17743492126465, "global_step": 522065, "epoch": 6289} {"train_loss": -27.355945587158203, "global_step": 522066, "epoch": 6289} {"train_loss": -27.128631591796875, "global_step": 522067, "epoch": 6289} {"train_loss": -27.29667091369629, "global_step": 522068, "epoch": 6289} {"train_loss": -26.713605719876576, "global_step": 522069, "epoch": 6289, "val_loss": 6728938.0} {"train_loss": -27.159549713134766, "global_step": 522070, "epoch": 6290} {"train_loss": -26.8633975982666, "global_step": 522071, "epoch": 6290} {"train_loss": -26.973987579345703, "global_step": 522072, "epoch": 6290} {"train_loss": -26.895063400268555, "global_step": 522073, "epoch": 6290} {"train_loss": -27.240026473999023, "global_step": 522074, "epoch": 6290} {"train_loss": -27.14627456665039, "global_step": 522075, "epoch": 6290} {"train_loss": -27.033761978149414, "global_step": 522076, "epoch": 6290} {"train_loss": -27.283918380737305, "global_step": 522077, "epoch": 6290} {"train_loss": -26.774188995361328, "global_step": 522078, "epoch": 6290} {"train_loss": -27.468219757080078, "global_step": 522079, "epoch": 6290} {"train_loss": -27.102991104125977, "global_step": 522080, "epoch": 6290} {"train_loss": -27.19679069519043, "global_step": 522081, "epoch": 6290} {"train_loss": -27.478784561157227, "global_step": 522082, "epoch": 6290} {"train_loss": -27.251813888549805, "global_step": 522083, "epoch": 6290} {"train_loss": -27.205799102783203, "global_step": 522084, "epoch": 6290} {"train_loss": -27.434940338134766, "global_step": 522085, "epoch": 6290} {"train_loss": -27.616300582885742, "global_step": 522086, "epoch": 6290} {"train_loss": -27.593891143798828, "global_step": 522087, "epoch": 6290} {"train_loss": -26.769123077392578, "global_step": 522088, "epoch": 6290} {"train_loss": -27.56717300415039, "global_step": 522089, "epoch": 6290} {"train_loss": -27.597381591796875, "global_step": 522090, "epoch": 6290} {"train_loss": -27.522079467773438, "global_step": 522091, "epoch": 6290} {"train_loss": -27.632720947265625, "global_step": 522092, "epoch": 6290} {"train_loss": -27.78721046447754, "global_step": 522093, "epoch": 6290} {"train_loss": -27.3175106048584, "global_step": 522094, "epoch": 6290} {"train_loss": -27.590656280517578, "global_step": 522095, "epoch": 6290} {"train_loss": -27.687152862548828, "global_step": 522096, "epoch": 6290} {"train_loss": -27.740121841430664, "global_step": 522097, "epoch": 6290} {"train_loss": -27.943830490112305, "global_step": 522098, "epoch": 6290} {"train_loss": -28.06935691833496, "global_step": 522099, "epoch": 6290} {"train_loss": -27.772109985351562, "global_step": 522100, "epoch": 6290} {"train_loss": -27.560592651367188, "global_step": 522101, "epoch": 6290} {"train_loss": -27.6994686126709, "global_step": 522102, "epoch": 6290} {"train_loss": -27.99795913696289, "global_step": 522103, "epoch": 6290} {"train_loss": -27.562238693237305, "global_step": 522104, "epoch": 6290} {"train_loss": -27.728118896484375, "global_step": 522105, "epoch": 6290} {"train_loss": -27.845998764038086, "global_step": 522106, "epoch": 6290} {"train_loss": -27.836669921875, "global_step": 522107, "epoch": 6290} {"train_loss": -27.693450927734375, "global_step": 522108, "epoch": 6290} {"train_loss": -27.887714385986328, "global_step": 522109, "epoch": 6290} {"train_loss": -27.635665893554688, "global_step": 522110, "epoch": 6290} {"train_loss": -27.79475212097168, "global_step": 522111, "epoch": 6290} {"train_loss": -27.950061798095703, "global_step": 522112, "epoch": 6290} {"train_loss": -27.60468864440918, "global_step": 522113, "epoch": 6290} {"train_loss": -27.218053817749023, "global_step": 522114, "epoch": 6290} {"train_loss": -26.304584503173828, "global_step": 522115, "epoch": 6290} {"train_loss": -25.396018981933594, "global_step": 522116, "epoch": 6290} {"train_loss": -25.684741973876953, "global_step": 522117, "epoch": 6290} {"train_loss": -27.280603408813477, "global_step": 522118, "epoch": 6290} {"train_loss": -26.99983787536621, "global_step": 522119, "epoch": 6290} {"train_loss": -26.270465850830078, "global_step": 522120, "epoch": 6290} {"train_loss": -27.198816299438477, "global_step": 522121, "epoch": 6290} {"train_loss": -26.70454978942871, "global_step": 522122, "epoch": 6290} {"train_loss": -26.985870361328125, "global_step": 522123, "epoch": 6290} {"train_loss": -26.47714614868164, "global_step": 522124, "epoch": 6290} {"train_loss": -27.297882080078125, "global_step": 522125, "epoch": 6290} {"train_loss": -26.86343765258789, "global_step": 522126, "epoch": 6290} {"train_loss": -26.9553279876709, "global_step": 522127, "epoch": 6290} {"train_loss": -27.074979782104492, "global_step": 522128, "epoch": 6290} {"train_loss": -27.218671798706055, "global_step": 522129, "epoch": 6290} {"train_loss": -27.110492706298828, "global_step": 522130, "epoch": 6290} {"train_loss": -26.8123722076416, "global_step": 522131, "epoch": 6290} {"train_loss": -27.134729385375977, "global_step": 522132, "epoch": 6290} {"train_loss": -27.366369247436523, "global_step": 522133, "epoch": 6290} {"train_loss": -27.3555965423584, "global_step": 522134, "epoch": 6290} {"train_loss": -27.08832359313965, "global_step": 522135, "epoch": 6290} {"train_loss": -27.26589012145996, "global_step": 522136, "epoch": 6290} {"train_loss": -27.013381958007812, "global_step": 522137, "epoch": 6290} {"train_loss": -27.309982299804688, "global_step": 522138, "epoch": 6290} {"train_loss": -27.40008544921875, "global_step": 522139, "epoch": 6290} {"train_loss": -27.28727149963379, "global_step": 522140, "epoch": 6290} {"train_loss": -27.720285415649414, "global_step": 522141, "epoch": 6290} {"train_loss": -27.484792709350586, "global_step": 522142, "epoch": 6290} {"train_loss": -27.795873641967773, "global_step": 522143, "epoch": 6290} {"train_loss": -27.966522216796875, "global_step": 522144, "epoch": 6290} {"train_loss": -27.399322509765625, "global_step": 522145, "epoch": 6290} {"train_loss": -27.563383102416992, "global_step": 522146, "epoch": 6290} {"train_loss": -27.550796508789062, "global_step": 522147, "epoch": 6290} {"train_loss": -27.340307235717773, "global_step": 522148, "epoch": 6290} {"train_loss": -27.177005767822266, "global_step": 522149, "epoch": 6290} {"train_loss": -27.5052490234375, "global_step": 522150, "epoch": 6290} {"train_loss": -27.300739288330078, "global_step": 522151, "epoch": 6290} {"train_loss": -27.306858775127363, "global_step": 522152, "epoch": 6290, "val_loss": 6637453.0} {"train_loss": -25.880645751953125, "global_step": 522153, "epoch": 6291} {"train_loss": -26.057592391967773, "global_step": 522154, "epoch": 6291} {"train_loss": -27.382349014282227, "global_step": 522155, "epoch": 6291} {"train_loss": -26.80315589904785, "global_step": 522156, "epoch": 6291} {"train_loss": -27.146656036376953, "global_step": 522157, "epoch": 6291} {"train_loss": -26.606338500976562, "global_step": 522158, "epoch": 6291} {"train_loss": -27.222761154174805, "global_step": 522159, "epoch": 6291} {"train_loss": -26.770727157592773, "global_step": 522160, "epoch": 6291} {"train_loss": -27.108694076538086, "global_step": 522161, "epoch": 6291} {"train_loss": -27.2495059967041, "global_step": 522162, "epoch": 6291} {"train_loss": -27.086755752563477, "global_step": 522163, "epoch": 6291} {"train_loss": -26.94025230407715, "global_step": 522164, "epoch": 6291} {"train_loss": -26.94534683227539, "global_step": 522165, "epoch": 6291} {"train_loss": -27.017480850219727, "global_step": 522166, "epoch": 6291} {"train_loss": -27.3814754486084, "global_step": 522167, "epoch": 6291} {"train_loss": -27.352630615234375, "global_step": 522168, "epoch": 6291} {"train_loss": -26.822498321533203, "global_step": 522169, "epoch": 6291} {"train_loss": -26.978839874267578, "global_step": 522170, "epoch": 6291} {"train_loss": -26.926502227783203, "global_step": 522171, "epoch": 6291} {"train_loss": -27.2476749420166, "global_step": 522172, "epoch": 6291} {"train_loss": -27.19599723815918, "global_step": 522173, "epoch": 6291} {"train_loss": -27.452478408813477, "global_step": 522174, "epoch": 6291} {"train_loss": -27.376453399658203, "global_step": 522175, "epoch": 6291} {"train_loss": -27.086706161499023, "global_step": 522176, "epoch": 6291} {"train_loss": -27.414859771728516, "global_step": 522177, "epoch": 6291} {"train_loss": -27.045923233032227, "global_step": 522178, "epoch": 6291} {"train_loss": -26.60318374633789, "global_step": 522179, "epoch": 6291} {"train_loss": -27.780609130859375, "global_step": 522180, "epoch": 6291} {"train_loss": -26.848560333251953, "global_step": 522181, "epoch": 6291} {"train_loss": -27.379480361938477, "global_step": 522182, "epoch": 6291} {"train_loss": -27.356672286987305, "global_step": 522183, "epoch": 6291} {"train_loss": -27.543115615844727, "global_step": 522184, "epoch": 6291} {"train_loss": -27.50311851501465, "global_step": 522185, "epoch": 6291} {"train_loss": -27.331954956054688, "global_step": 522186, "epoch": 6291} {"train_loss": -27.639911651611328, "global_step": 522187, "epoch": 6291} {"train_loss": -27.420392990112305, "global_step": 522188, "epoch": 6291} {"train_loss": -27.68408203125, "global_step": 522189, "epoch": 6291} {"train_loss": -27.527667999267578, "global_step": 522190, "epoch": 6291} {"train_loss": -27.627029418945312, "global_step": 522191, "epoch": 6291} {"train_loss": -27.426864624023438, "global_step": 522192, "epoch": 6291} {"train_loss": -27.597936630249023, "global_step": 522193, "epoch": 6291} {"train_loss": -27.542831420898438, "global_step": 522194, "epoch": 6291} {"train_loss": -27.615400314331055, "global_step": 522195, "epoch": 6291} {"train_loss": -27.533893585205078, "global_step": 522196, "epoch": 6291} {"train_loss": -27.70627212524414, "global_step": 522197, "epoch": 6291} {"train_loss": -27.582143783569336, "global_step": 522198, "epoch": 6291} {"train_loss": -27.6400089263916, "global_step": 522199, "epoch": 6291} {"train_loss": -27.706501007080078, "global_step": 522200, "epoch": 6291} {"train_loss": -27.810199737548828, "global_step": 522201, "epoch": 6291} {"train_loss": -27.638635635375977, "global_step": 522202, "epoch": 6291} {"train_loss": -27.528945922851562, "global_step": 522203, "epoch": 6291} {"train_loss": -27.92413330078125, "global_step": 522204, "epoch": 6291} {"train_loss": -27.89017105102539, "global_step": 522205, "epoch": 6291} {"train_loss": -27.392988204956055, "global_step": 522206, "epoch": 6291} {"train_loss": -27.75895118713379, "global_step": 522207, "epoch": 6291} {"train_loss": -27.898834228515625, "global_step": 522208, "epoch": 6291} {"train_loss": -27.896398544311523, "global_step": 522209, "epoch": 6291} {"train_loss": -27.465972900390625, "global_step": 522210, "epoch": 6291} {"train_loss": -27.77272605895996, "global_step": 522211, "epoch": 6291} {"train_loss": -27.663654327392578, "global_step": 522212, "epoch": 6291} {"train_loss": -27.78394889831543, "global_step": 522213, "epoch": 6291} {"train_loss": -27.641590118408203, "global_step": 522214, "epoch": 6291} {"train_loss": -27.82230567932129, "global_step": 522215, "epoch": 6291} {"train_loss": -27.348127365112305, "global_step": 522216, "epoch": 6291} {"train_loss": -27.785253524780273, "global_step": 522217, "epoch": 6291} {"train_loss": -27.509138107299805, "global_step": 522218, "epoch": 6291} {"train_loss": -27.579381942749023, "global_step": 522219, "epoch": 6291} {"train_loss": -27.327686309814453, "global_step": 522220, "epoch": 6291} {"train_loss": -27.417036056518555, "global_step": 522221, "epoch": 6291} {"train_loss": -27.386075973510742, "global_step": 522222, "epoch": 6291} {"train_loss": -27.381763458251953, "global_step": 522223, "epoch": 6291} {"train_loss": -27.547225952148438, "global_step": 522224, "epoch": 6291} {"train_loss": -27.81251335144043, "global_step": 522225, "epoch": 6291} {"train_loss": -27.79378318786621, "global_step": 522226, "epoch": 6291} {"train_loss": -27.729917526245117, "global_step": 522227, "epoch": 6291} {"train_loss": -27.282190322875977, "global_step": 522228, "epoch": 6291} {"train_loss": -27.51377296447754, "global_step": 522229, "epoch": 6291} {"train_loss": -27.398761749267578, "global_step": 522230, "epoch": 6291} {"train_loss": -27.911636352539062, "global_step": 522231, "epoch": 6291} {"train_loss": -27.752994537353516, "global_step": 522232, "epoch": 6291} {"train_loss": -27.51702880859375, "global_step": 522233, "epoch": 6291} {"train_loss": -27.504003524780273, "global_step": 522234, "epoch": 6291} {"train_loss": -27.39298641250794, "global_step": 522235, "epoch": 6291, "val_loss": 6676219.5} {"train_loss": -26.935754776000977, "global_step": 522236, "epoch": 6292} {"train_loss": -27.3787784576416, "global_step": 522237, "epoch": 6292} {"train_loss": -26.928373336791992, "global_step": 522238, "epoch": 6292} {"train_loss": -27.229642868041992, "global_step": 522239, "epoch": 6292} {"train_loss": -27.108963012695312, "global_step": 522240, "epoch": 6292} {"train_loss": -27.37440299987793, "global_step": 522241, "epoch": 6292} {"train_loss": -27.652130126953125, "global_step": 522242, "epoch": 6292} {"train_loss": -27.53712272644043, "global_step": 522243, "epoch": 6292} {"train_loss": -27.300785064697266, "global_step": 522244, "epoch": 6292} {"train_loss": -27.5782527923584, "global_step": 522245, "epoch": 6292} {"train_loss": -27.009977340698242, "global_step": 522246, "epoch": 6292} {"train_loss": -27.26594352722168, "global_step": 522247, "epoch": 6292} {"train_loss": -27.786710739135742, "global_step": 522248, "epoch": 6292} {"train_loss": -27.104780197143555, "global_step": 522249, "epoch": 6292} {"train_loss": -27.505964279174805, "global_step": 522250, "epoch": 6292} {"train_loss": -27.424768447875977, "global_step": 522251, "epoch": 6292} {"train_loss": -27.441633224487305, "global_step": 522252, "epoch": 6292} {"train_loss": -27.885339736938477, "global_step": 522253, "epoch": 6292} {"train_loss": -27.292551040649414, "global_step": 522254, "epoch": 6292} {"train_loss": -27.478107452392578, "global_step": 522255, "epoch": 6292} {"train_loss": -27.2672061920166, "global_step": 522256, "epoch": 6292} {"train_loss": -27.13490104675293, "global_step": 522257, "epoch": 6292} {"train_loss": -27.456470489501953, "global_step": 522258, "epoch": 6292} {"train_loss": -27.782535552978516, "global_step": 522259, "epoch": 6292} {"train_loss": -27.36761474609375, "global_step": 522260, "epoch": 6292} {"train_loss": -27.22981834411621, "global_step": 522261, "epoch": 6292} {"train_loss": -27.437482833862305, "global_step": 522262, "epoch": 6292} {"train_loss": -27.568750381469727, "global_step": 522263, "epoch": 6292} {"train_loss": -27.3742733001709, "global_step": 522264, "epoch": 6292} {"train_loss": -27.76887321472168, "global_step": 522265, "epoch": 6292} {"train_loss": -27.36932945251465, "global_step": 522266, "epoch": 6292} {"train_loss": -27.398645401000977, "global_step": 522267, "epoch": 6292} {"train_loss": -27.755151748657227, "global_step": 522268, "epoch": 6292} {"train_loss": -27.47161865234375, "global_step": 522269, "epoch": 6292} {"train_loss": -27.2861385345459, "global_step": 522270, "epoch": 6292} {"train_loss": -27.590351104736328, "global_step": 522271, "epoch": 6292} {"train_loss": -27.53167724609375, "global_step": 522272, "epoch": 6292} {"train_loss": -27.43653678894043, "global_step": 522273, "epoch": 6292} {"train_loss": -27.67267417907715, "global_step": 522274, "epoch": 6292} {"train_loss": -27.24302101135254, "global_step": 522275, "epoch": 6292} {"train_loss": -27.153207778930664, "global_step": 522276, "epoch": 6292} {"train_loss": -27.723474502563477, "global_step": 522277, "epoch": 6292} {"train_loss": -27.772397994995117, "global_step": 522278, "epoch": 6292} {"train_loss": -27.524398803710938, "global_step": 522279, "epoch": 6292} {"train_loss": -27.342267990112305, "global_step": 522280, "epoch": 6292} {"train_loss": -27.086729049682617, "global_step": 522281, "epoch": 6292} {"train_loss": -27.54701042175293, "global_step": 522282, "epoch": 6292} {"train_loss": -27.46272087097168, "global_step": 522283, "epoch": 6292} {"train_loss": -27.471881866455078, "global_step": 522284, "epoch": 6292} {"train_loss": -27.910730361938477, "global_step": 522285, "epoch": 6292} {"train_loss": -27.79084587097168, "global_step": 522286, "epoch": 6292} {"train_loss": -27.508825302124023, "global_step": 522287, "epoch": 6292} {"train_loss": -27.496305465698242, "global_step": 522288, "epoch": 6292} {"train_loss": -27.812992095947266, "global_step": 522289, "epoch": 6292} {"train_loss": -27.900970458984375, "global_step": 522290, "epoch": 6292} {"train_loss": -28.070316314697266, "global_step": 522291, "epoch": 6292} {"train_loss": -27.193082809448242, "global_step": 522292, "epoch": 6292} {"train_loss": -28.092548370361328, "global_step": 522293, "epoch": 6292} {"train_loss": -27.798629760742188, "global_step": 522294, "epoch": 6292} {"train_loss": -27.580154418945312, "global_step": 522295, "epoch": 6292} {"train_loss": -27.724939346313477, "global_step": 522296, "epoch": 6292} {"train_loss": -27.581527709960938, "global_step": 522297, "epoch": 6292} {"train_loss": -27.340566635131836, "global_step": 522298, "epoch": 6292} {"train_loss": -27.45654296875, "global_step": 522299, "epoch": 6292} {"train_loss": -27.635883331298828, "global_step": 522300, "epoch": 6292} {"train_loss": -27.68478775024414, "global_step": 522301, "epoch": 6292} {"train_loss": -27.436298370361328, "global_step": 522302, "epoch": 6292} {"train_loss": -27.361572265625, "global_step": 522303, "epoch": 6292} {"train_loss": -27.68768310546875, "global_step": 522304, "epoch": 6292} {"train_loss": -27.681547164916992, "global_step": 522305, "epoch": 6292} {"train_loss": -26.72352409362793, "global_step": 522306, "epoch": 6292} {"train_loss": -27.167890548706055, "global_step": 522307, "epoch": 6292} {"train_loss": -27.57008171081543, "global_step": 522308, "epoch": 6292} {"train_loss": -27.443662643432617, "global_step": 522309, "epoch": 6292} {"train_loss": -26.91129493713379, "global_step": 522310, "epoch": 6292} {"train_loss": -27.361724853515625, "global_step": 522311, "epoch": 6292} {"train_loss": -27.58169937133789, "global_step": 522312, "epoch": 6292} {"train_loss": -27.092374801635742, "global_step": 522313, "epoch": 6292} {"train_loss": -27.6408748626709, "global_step": 522314, "epoch": 6292} {"train_loss": -27.385751724243164, "global_step": 522315, "epoch": 6292} {"train_loss": -27.70172119140625, "global_step": 522316, "epoch": 6292} {"train_loss": -27.308929443359375, "global_step": 522317, "epoch": 6292} {"train_loss": -27.469110121209937, "global_step": 522318, "epoch": 6292, "val_loss": 6652194.0} {"train_loss": -26.912067413330078, "global_step": 522319, "epoch": 6293} {"train_loss": -26.924945831298828, "global_step": 522320, "epoch": 6293} {"train_loss": -26.77567481994629, "global_step": 522321, "epoch": 6293} {"train_loss": -26.577795028686523, "global_step": 522322, "epoch": 6293} {"train_loss": -27.09857749938965, "global_step": 522323, "epoch": 6293} {"train_loss": -27.367223739624023, "global_step": 522324, "epoch": 6293} {"train_loss": -27.01869010925293, "global_step": 522325, "epoch": 6293} {"train_loss": -26.64137077331543, "global_step": 522326, "epoch": 6293} {"train_loss": -26.98223304748535, "global_step": 522327, "epoch": 6293} {"train_loss": -27.48687744140625, "global_step": 522328, "epoch": 6293} {"train_loss": -26.860132217407227, "global_step": 522329, "epoch": 6293} {"train_loss": -27.3957462310791, "global_step": 522330, "epoch": 6293} {"train_loss": -27.211721420288086, "global_step": 522331, "epoch": 6293} {"train_loss": -27.440189361572266, "global_step": 522332, "epoch": 6293} {"train_loss": -27.03631019592285, "global_step": 522333, "epoch": 6293} {"train_loss": -27.1955623626709, "global_step": 522334, "epoch": 6293} {"train_loss": -27.668790817260742, "global_step": 522335, "epoch": 6293} {"train_loss": -27.4539852142334, "global_step": 522336, "epoch": 6293} {"train_loss": -27.18623924255371, "global_step": 522337, "epoch": 6293} {"train_loss": -27.51618003845215, "global_step": 522338, "epoch": 6293} {"train_loss": -27.4389591217041, "global_step": 522339, "epoch": 6293} {"train_loss": -27.24543571472168, "global_step": 522340, "epoch": 6293} {"train_loss": -27.238798141479492, "global_step": 522341, "epoch": 6293} {"train_loss": -27.5611629486084, "global_step": 522342, "epoch": 6293} {"train_loss": -27.715808868408203, "global_step": 522343, "epoch": 6293} {"train_loss": -27.717920303344727, "global_step": 522344, "epoch": 6293} {"train_loss": -27.52557373046875, "global_step": 522345, "epoch": 6293} {"train_loss": -27.501483917236328, "global_step": 522346, "epoch": 6293} {"train_loss": -27.477935791015625, "global_step": 522347, "epoch": 6293} {"train_loss": -27.411605834960938, "global_step": 522348, "epoch": 6293} {"train_loss": -27.544034957885742, "global_step": 522349, "epoch": 6293} {"train_loss": -27.541656494140625, "global_step": 522350, "epoch": 6293} {"train_loss": -27.57844352722168, "global_step": 522351, "epoch": 6293} {"train_loss": -27.703420639038086, "global_step": 522352, "epoch": 6293} {"train_loss": -27.711225509643555, "global_step": 522353, "epoch": 6293} {"train_loss": -27.3763484954834, "global_step": 522354, "epoch": 6293} {"train_loss": -27.818893432617188, "global_step": 522355, "epoch": 6293} {"train_loss": -27.91997718811035, "global_step": 522356, "epoch": 6293} {"train_loss": -27.176416397094727, "global_step": 522357, "epoch": 6293} {"train_loss": -27.444807052612305, "global_step": 522358, "epoch": 6293} {"train_loss": -27.88681411743164, "global_step": 522359, "epoch": 6293} {"train_loss": -27.623626708984375, "global_step": 522360, "epoch": 6293} {"train_loss": -27.6571102142334, "global_step": 522361, "epoch": 6293} {"train_loss": -27.65144157409668, "global_step": 522362, "epoch": 6293} {"train_loss": -27.78651237487793, "global_step": 522363, "epoch": 6293} {"train_loss": -27.762161254882812, "global_step": 522364, "epoch": 6293} {"train_loss": -27.55411148071289, "global_step": 522365, "epoch": 6293} {"train_loss": -27.9501895904541, "global_step": 522366, "epoch": 6293} {"train_loss": -27.84088706970215, "global_step": 522367, "epoch": 6293} {"train_loss": -27.4959774017334, "global_step": 522368, "epoch": 6293} {"train_loss": -27.553800582885742, "global_step": 522369, "epoch": 6293} {"train_loss": -27.731794357299805, "global_step": 522370, "epoch": 6293} {"train_loss": -27.787384033203125, "global_step": 522371, "epoch": 6293} {"train_loss": -27.704233169555664, "global_step": 522372, "epoch": 6293} {"train_loss": -27.691532135009766, "global_step": 522373, "epoch": 6293} {"train_loss": -27.599477767944336, "global_step": 522374, "epoch": 6293} {"train_loss": -27.615869522094727, "global_step": 522375, "epoch": 6293} {"train_loss": -27.713443756103516, "global_step": 522376, "epoch": 6293} {"train_loss": -27.412168502807617, "global_step": 522377, "epoch": 6293} {"train_loss": -27.65460777282715, "global_step": 522378, "epoch": 6293} {"train_loss": -27.387922286987305, "global_step": 522379, "epoch": 6293} {"train_loss": -27.491926193237305, "global_step": 522380, "epoch": 6293} {"train_loss": -27.565509796142578, "global_step": 522381, "epoch": 6293} {"train_loss": -27.720489501953125, "global_step": 522382, "epoch": 6293} {"train_loss": -27.54768180847168, "global_step": 522383, "epoch": 6293} {"train_loss": -28.115833282470703, "global_step": 522384, "epoch": 6293} {"train_loss": -27.575220108032227, "global_step": 522385, "epoch": 6293} {"train_loss": -27.41364860534668, "global_step": 522386, "epoch": 6293} {"train_loss": -27.170379638671875, "global_step": 522387, "epoch": 6293} {"train_loss": -26.829572677612305, "global_step": 522388, "epoch": 6293} {"train_loss": -27.88458251953125, "global_step": 522389, "epoch": 6293} {"train_loss": -27.11701774597168, "global_step": 522390, "epoch": 6293} {"train_loss": -27.139074325561523, "global_step": 522391, "epoch": 6293} {"train_loss": -27.049163818359375, "global_step": 522392, "epoch": 6293} {"train_loss": -27.526044845581055, "global_step": 522393, "epoch": 6293} {"train_loss": -27.3049259185791, "global_step": 522394, "epoch": 6293} {"train_loss": -27.624439239501953, "global_step": 522395, "epoch": 6293} {"train_loss": -27.402145385742188, "global_step": 522396, "epoch": 6293} {"train_loss": -27.830982208251953, "global_step": 522397, "epoch": 6293} {"train_loss": -27.755619049072266, "global_step": 522398, "epoch": 6293} {"train_loss": -26.927392959594727, "global_step": 522399, "epoch": 6293} {"train_loss": -27.391401290893555, "global_step": 522400, "epoch": 6293} {"train_loss": -27.453771200524756, "global_step": 522401, "epoch": 6293, "val_loss": 6655853.0} {"train_loss": -26.82624626159668, "global_step": 522402, "epoch": 6294} {"train_loss": -27.5433292388916, "global_step": 522403, "epoch": 6294} {"train_loss": -27.380126953125, "global_step": 522404, "epoch": 6294} {"train_loss": -27.28338623046875, "global_step": 522405, "epoch": 6294} {"train_loss": -27.392953872680664, "global_step": 522406, "epoch": 6294} {"train_loss": -27.084821701049805, "global_step": 522407, "epoch": 6294} {"train_loss": -26.9341983795166, "global_step": 522408, "epoch": 6294} {"train_loss": -27.145978927612305, "global_step": 522409, "epoch": 6294} {"train_loss": -27.924102783203125, "global_step": 522410, "epoch": 6294} {"train_loss": -27.249267578125, "global_step": 522411, "epoch": 6294} {"train_loss": -27.249216079711914, "global_step": 522412, "epoch": 6294} {"train_loss": -27.2989559173584, "global_step": 522413, "epoch": 6294} {"train_loss": -27.4448299407959, "global_step": 522414, "epoch": 6294} {"train_loss": -27.501684188842773, "global_step": 522415, "epoch": 6294} {"train_loss": -26.963037490844727, "global_step": 522416, "epoch": 6294} {"train_loss": -26.929595947265625, "global_step": 522417, "epoch": 6294} {"train_loss": -27.31252098083496, "global_step": 522418, "epoch": 6294} {"train_loss": -26.981550216674805, "global_step": 522419, "epoch": 6294} {"train_loss": -27.399444580078125, "global_step": 522420, "epoch": 6294} {"train_loss": -26.99994468688965, "global_step": 522421, "epoch": 6294} {"train_loss": -27.22515869140625, "global_step": 522422, "epoch": 6294} {"train_loss": -27.420124053955078, "global_step": 522423, "epoch": 6294} {"train_loss": -27.122587203979492, "global_step": 522424, "epoch": 6294} {"train_loss": -26.97333335876465, "global_step": 522425, "epoch": 6294} {"train_loss": -27.294092178344727, "global_step": 522426, "epoch": 6294} {"train_loss": -27.614990234375, "global_step": 522427, "epoch": 6294} {"train_loss": -27.605926513671875, "global_step": 522428, "epoch": 6294} {"train_loss": -28.01246452331543, "global_step": 522429, "epoch": 6294} {"train_loss": -27.435285568237305, "global_step": 522430, "epoch": 6294} {"train_loss": -27.358667373657227, "global_step": 522431, "epoch": 6294} {"train_loss": -27.678314208984375, "global_step": 522432, "epoch": 6294} {"train_loss": -27.615890502929688, "global_step": 522433, "epoch": 6294} {"train_loss": -27.822301864624023, "global_step": 522434, "epoch": 6294} {"train_loss": -27.762470245361328, "global_step": 522435, "epoch": 6294} {"train_loss": -27.719562530517578, "global_step": 522436, "epoch": 6294} {"train_loss": -27.58013343811035, "global_step": 522437, "epoch": 6294} {"train_loss": -27.617401123046875, "global_step": 522438, "epoch": 6294} {"train_loss": -27.64322853088379, "global_step": 522439, "epoch": 6294} {"train_loss": -27.659391403198242, "global_step": 522440, "epoch": 6294} {"train_loss": -27.429931640625, "global_step": 522441, "epoch": 6294} {"train_loss": -27.781991958618164, "global_step": 522442, "epoch": 6294} {"train_loss": -27.710529327392578, "global_step": 522443, "epoch": 6294} {"train_loss": -27.798603057861328, "global_step": 522444, "epoch": 6294} {"train_loss": -27.588214874267578, "global_step": 522445, "epoch": 6294} {"train_loss": -27.887805938720703, "global_step": 522446, "epoch": 6294} {"train_loss": -27.493879318237305, "global_step": 522447, "epoch": 6294} {"train_loss": -27.67535400390625, "global_step": 522448, "epoch": 6294} {"train_loss": -27.806787490844727, "global_step": 522449, "epoch": 6294} {"train_loss": -27.777942657470703, "global_step": 522450, "epoch": 6294} {"train_loss": -28.054616928100586, "global_step": 522451, "epoch": 6294} {"train_loss": -27.870849609375, "global_step": 522452, "epoch": 6294} {"train_loss": -27.589435577392578, "global_step": 522453, "epoch": 6294} {"train_loss": -27.800466537475586, "global_step": 522454, "epoch": 6294} {"train_loss": -27.9731502532959, "global_step": 522455, "epoch": 6294} {"train_loss": -27.8790283203125, "global_step": 522456, "epoch": 6294} {"train_loss": -27.54560661315918, "global_step": 522457, "epoch": 6294} {"train_loss": -27.774316787719727, "global_step": 522458, "epoch": 6294} {"train_loss": -27.381696701049805, "global_step": 522459, "epoch": 6294} {"train_loss": -27.648839950561523, "global_step": 522460, "epoch": 6294} {"train_loss": -27.74431800842285, "global_step": 522461, "epoch": 6294} {"train_loss": -27.2835636138916, "global_step": 522462, "epoch": 6294} {"train_loss": -27.558826446533203, "global_step": 522463, "epoch": 6294} {"train_loss": -27.788288116455078, "global_step": 522464, "epoch": 6294} {"train_loss": -27.78208351135254, "global_step": 522465, "epoch": 6294} {"train_loss": -27.767324447631836, "global_step": 522466, "epoch": 6294} {"train_loss": -27.588214874267578, "global_step": 522467, "epoch": 6294} {"train_loss": -28.009571075439453, "global_step": 522468, "epoch": 6294} {"train_loss": -27.80023193359375, "global_step": 522469, "epoch": 6294} {"train_loss": -27.9295711517334, "global_step": 522470, "epoch": 6294} {"train_loss": -27.729724884033203, "global_step": 522471, "epoch": 6294} {"train_loss": -27.50094985961914, "global_step": 522472, "epoch": 6294} {"train_loss": -27.620849609375, "global_step": 522473, "epoch": 6294} {"train_loss": -27.1762752532959, "global_step": 522474, "epoch": 6294} {"train_loss": -26.911956787109375, "global_step": 522475, "epoch": 6294} {"train_loss": -26.081037521362305, "global_step": 522476, "epoch": 6294} {"train_loss": -26.700611114501953, "global_step": 522477, "epoch": 6294} {"train_loss": -27.619674682617188, "global_step": 522478, "epoch": 6294} {"train_loss": -27.44012451171875, "global_step": 522479, "epoch": 6294} {"train_loss": -27.0028018951416, "global_step": 522480, "epoch": 6294} {"train_loss": -27.00555992126465, "global_step": 522481, "epoch": 6294} {"train_loss": -27.21649742126465, "global_step": 522482, "epoch": 6294} {"train_loss": -26.99053955078125, "global_step": 522483, "epoch": 6294} {"train_loss": -27.4798807580787, "global_step": 522484, "epoch": 6294, "val_loss": 6547049.0} {"train_loss": -25.698474884033203, "global_step": 522485, "epoch": 6295} {"train_loss": -25.61273193359375, "global_step": 522486, "epoch": 6295} {"train_loss": -25.7632999420166, "global_step": 522487, "epoch": 6295} {"train_loss": -26.3714599609375, "global_step": 522488, "epoch": 6295} {"train_loss": -25.805500030517578, "global_step": 522489, "epoch": 6295} {"train_loss": -25.52661895751953, "global_step": 522490, "epoch": 6295} {"train_loss": -26.670007705688477, "global_step": 522491, "epoch": 6295} {"train_loss": -25.88665199279785, "global_step": 522492, "epoch": 6295} {"train_loss": -26.8056697845459, "global_step": 522493, "epoch": 6295} {"train_loss": -26.45875358581543, "global_step": 522494, "epoch": 6295} {"train_loss": -27.04046058654785, "global_step": 522495, "epoch": 6295} {"train_loss": -26.655414581298828, "global_step": 522496, "epoch": 6295} {"train_loss": -26.89682388305664, "global_step": 522497, "epoch": 6295} {"train_loss": -26.452451705932617, "global_step": 522498, "epoch": 6295} {"train_loss": -26.769153594970703, "global_step": 522499, "epoch": 6295} {"train_loss": -26.941816329956055, "global_step": 522500, "epoch": 6295} {"train_loss": -26.959125518798828, "global_step": 522501, "epoch": 6295} {"train_loss": -27.124908447265625, "global_step": 522502, "epoch": 6295} {"train_loss": -27.295129776000977, "global_step": 522503, "epoch": 6295} {"train_loss": -27.155637741088867, "global_step": 522504, "epoch": 6295} {"train_loss": -26.8262939453125, "global_step": 522505, "epoch": 6295} {"train_loss": -27.094833374023438, "global_step": 522506, "epoch": 6295} {"train_loss": -27.389179229736328, "global_step": 522507, "epoch": 6295} {"train_loss": -27.342864990234375, "global_step": 522508, "epoch": 6295} {"train_loss": -27.099878311157227, "global_step": 522509, "epoch": 6295} {"train_loss": -27.18434715270996, "global_step": 522510, "epoch": 6295} {"train_loss": -27.14326286315918, "global_step": 522511, "epoch": 6295} {"train_loss": -27.34022331237793, "global_step": 522512, "epoch": 6295} {"train_loss": -27.23133659362793, "global_step": 522513, "epoch": 6295} {"train_loss": -27.38348960876465, "global_step": 522514, "epoch": 6295} {"train_loss": -27.3861083984375, "global_step": 522515, "epoch": 6295} {"train_loss": -27.449478149414062, "global_step": 522516, "epoch": 6295} {"train_loss": -27.578445434570312, "global_step": 522517, "epoch": 6295} {"train_loss": -27.38453483581543, "global_step": 522518, "epoch": 6295} {"train_loss": -27.356481552124023, "global_step": 522519, "epoch": 6295} {"train_loss": -27.48834800720215, "global_step": 522520, "epoch": 6295} {"train_loss": -27.06229019165039, "global_step": 522521, "epoch": 6295} {"train_loss": -27.593229293823242, "global_step": 522522, "epoch": 6295} {"train_loss": -27.205408096313477, "global_step": 522523, "epoch": 6295} {"train_loss": -27.44598960876465, "global_step": 522524, "epoch": 6295} {"train_loss": -27.370771408081055, "global_step": 522525, "epoch": 6295} {"train_loss": -27.56325340270996, "global_step": 522526, "epoch": 6295} {"train_loss": -27.45838737487793, "global_step": 522527, "epoch": 6295} {"train_loss": -27.836057662963867, "global_step": 522528, "epoch": 6295} {"train_loss": -27.874103546142578, "global_step": 522529, "epoch": 6295} {"train_loss": -27.466358184814453, "global_step": 522530, "epoch": 6295} {"train_loss": -27.558792114257812, "global_step": 522531, "epoch": 6295} {"train_loss": -27.740869522094727, "global_step": 522532, "epoch": 6295} {"train_loss": -27.587858200073242, "global_step": 522533, "epoch": 6295} {"train_loss": -27.655078887939453, "global_step": 522534, "epoch": 6295} {"train_loss": -27.97430419921875, "global_step": 522535, "epoch": 6295} {"train_loss": -27.48110008239746, "global_step": 522536, "epoch": 6295} {"train_loss": -27.745651245117188, "global_step": 522537, "epoch": 6295} {"train_loss": -27.250226974487305, "global_step": 522538, "epoch": 6295} {"train_loss": -27.308551788330078, "global_step": 522539, "epoch": 6295} {"train_loss": -28.135507583618164, "global_step": 522540, "epoch": 6295} {"train_loss": -27.814777374267578, "global_step": 522541, "epoch": 6295} {"train_loss": -27.90850830078125, "global_step": 522542, "epoch": 6295} {"train_loss": -27.613004684448242, "global_step": 522543, "epoch": 6295} {"train_loss": -27.168441772460938, "global_step": 522544, "epoch": 6295} {"train_loss": -27.450824737548828, "global_step": 522545, "epoch": 6295} {"train_loss": -27.26618003845215, "global_step": 522546, "epoch": 6295} {"train_loss": -27.338598251342773, "global_step": 522547, "epoch": 6295} {"train_loss": -27.9011173248291, "global_step": 522548, "epoch": 6295} {"train_loss": -27.705739974975586, "global_step": 522549, "epoch": 6295} {"train_loss": -27.47211265563965, "global_step": 522550, "epoch": 6295} {"train_loss": -27.978071212768555, "global_step": 522551, "epoch": 6295} {"train_loss": -27.79693603515625, "global_step": 522552, "epoch": 6295} {"train_loss": -27.725828170776367, "global_step": 522553, "epoch": 6295} {"train_loss": -28.169574737548828, "global_step": 522554, "epoch": 6295} {"train_loss": -27.7141170501709, "global_step": 522555, "epoch": 6295} {"train_loss": -27.644393920898438, "global_step": 522556, "epoch": 6295} {"train_loss": -27.612537384033203, "global_step": 522557, "epoch": 6295} {"train_loss": -27.906835556030273, "global_step": 522558, "epoch": 6295} {"train_loss": -27.478925704956055, "global_step": 522559, "epoch": 6295} {"train_loss": -27.324926376342773, "global_step": 522560, "epoch": 6295} {"train_loss": -27.149091720581055, "global_step": 522561, "epoch": 6295} {"train_loss": -27.5799503326416, "global_step": 522562, "epoch": 6295} {"train_loss": -27.49749755859375, "global_step": 522563, "epoch": 6295} {"train_loss": -27.782140731811523, "global_step": 522564, "epoch": 6295} {"train_loss": -27.607336044311523, "global_step": 522565, "epoch": 6295} {"train_loss": -27.582483291625977, "global_step": 522566, "epoch": 6295} {"train_loss": -27.26761245727539, "global_step": 522567, "epoch": 6295, "val_loss": 6596061.0} {"train_loss": -27.298084259033203, "global_step": 522568, "epoch": 6296} {"train_loss": -27.429819107055664, "global_step": 522569, "epoch": 6296} {"train_loss": -27.29401969909668, "global_step": 522570, "epoch": 6296} {"train_loss": -27.19398307800293, "global_step": 522571, "epoch": 6296} {"train_loss": -27.371740341186523, "global_step": 522572, "epoch": 6296} {"train_loss": -27.5875186920166, "global_step": 522573, "epoch": 6296} {"train_loss": -27.328922271728516, "global_step": 522574, "epoch": 6296} {"train_loss": -27.178974151611328, "global_step": 522575, "epoch": 6296} {"train_loss": -27.288272857666016, "global_step": 522576, "epoch": 6296} {"train_loss": -27.2048397064209, "global_step": 522577, "epoch": 6296} {"train_loss": -27.239837646484375, "global_step": 522578, "epoch": 6296} {"train_loss": -27.350561141967773, "global_step": 522579, "epoch": 6296} {"train_loss": -27.476215362548828, "global_step": 522580, "epoch": 6296} {"train_loss": -27.099884033203125, "global_step": 522581, "epoch": 6296} {"train_loss": -27.203805923461914, "global_step": 522582, "epoch": 6296} {"train_loss": -27.306798934936523, "global_step": 522583, "epoch": 6296} {"train_loss": -26.984716415405273, "global_step": 522584, "epoch": 6296} {"train_loss": -27.22125816345215, "global_step": 522585, "epoch": 6296} {"train_loss": -27.25873374938965, "global_step": 522586, "epoch": 6296} {"train_loss": -27.24887466430664, "global_step": 522587, "epoch": 6296} {"train_loss": -27.3128662109375, "global_step": 522588, "epoch": 6296} {"train_loss": -27.69060707092285, "global_step": 522589, "epoch": 6296} {"train_loss": -27.47161865234375, "global_step": 522590, "epoch": 6296} {"train_loss": -27.201374053955078, "global_step": 522591, "epoch": 6296} {"train_loss": -27.258676528930664, "global_step": 522592, "epoch": 6296} {"train_loss": -27.65478515625, "global_step": 522593, "epoch": 6296} {"train_loss": -26.88775062561035, "global_step": 522594, "epoch": 6296} {"train_loss": -27.321868896484375, "global_step": 522595, "epoch": 6296} {"train_loss": -27.543167114257812, "global_step": 522596, "epoch": 6296} {"train_loss": -27.628568649291992, "global_step": 522597, "epoch": 6296} {"train_loss": -27.37074089050293, "global_step": 522598, "epoch": 6296} {"train_loss": -27.26950454711914, "global_step": 522599, "epoch": 6296} {"train_loss": -27.7089786529541, "global_step": 522600, "epoch": 6296} {"train_loss": -27.494693756103516, "global_step": 522601, "epoch": 6296} {"train_loss": -27.826786041259766, "global_step": 522602, "epoch": 6296} {"train_loss": -27.369604110717773, "global_step": 522603, "epoch": 6296} {"train_loss": -27.551481246948242, "global_step": 522604, "epoch": 6296} {"train_loss": -27.767282485961914, "global_step": 522605, "epoch": 6296} {"train_loss": -27.381214141845703, "global_step": 522606, "epoch": 6296} {"train_loss": -27.72601318359375, "global_step": 522607, "epoch": 6296} {"train_loss": -27.535282135009766, "global_step": 522608, "epoch": 6296} {"train_loss": -28.127660751342773, "global_step": 522609, "epoch": 6296} {"train_loss": -28.03424644470215, "global_step": 522610, "epoch": 6296} {"train_loss": -27.55531120300293, "global_step": 522611, "epoch": 6296} {"train_loss": -27.689191818237305, "global_step": 522612, "epoch": 6296} {"train_loss": -27.44398307800293, "global_step": 522613, "epoch": 6296} {"train_loss": -27.793317794799805, "global_step": 522614, "epoch": 6296} {"train_loss": -27.95477294921875, "global_step": 522615, "epoch": 6296} {"train_loss": -27.74545669555664, "global_step": 522616, "epoch": 6296} {"train_loss": -27.537860870361328, "global_step": 522617, "epoch": 6296} {"train_loss": -27.41663932800293, "global_step": 522618, "epoch": 6296} {"train_loss": -28.015790939331055, "global_step": 522619, "epoch": 6296} {"train_loss": -27.490747451782227, "global_step": 522620, "epoch": 6296} {"train_loss": -27.6828556060791, "global_step": 522621, "epoch": 6296} {"train_loss": -26.75970458984375, "global_step": 522622, "epoch": 6296} {"train_loss": -26.65022087097168, "global_step": 522623, "epoch": 6296} {"train_loss": -27.0058536529541, "global_step": 522624, "epoch": 6296} {"train_loss": -27.25459098815918, "global_step": 522625, "epoch": 6296} {"train_loss": -26.966938018798828, "global_step": 522626, "epoch": 6296} {"train_loss": -27.566625595092773, "global_step": 522627, "epoch": 6296} {"train_loss": -27.307844161987305, "global_step": 522628, "epoch": 6296} {"train_loss": -27.712890625, "global_step": 522629, "epoch": 6296} {"train_loss": -27.531824111938477, "global_step": 522630, "epoch": 6296} {"train_loss": -27.374561309814453, "global_step": 522631, "epoch": 6296} {"train_loss": -27.50518798828125, "global_step": 522632, "epoch": 6296} {"train_loss": -27.395233154296875, "global_step": 522633, "epoch": 6296} {"train_loss": -27.919897079467773, "global_step": 522634, "epoch": 6296} {"train_loss": -27.58440589904785, "global_step": 522635, "epoch": 6296} {"train_loss": -27.65748405456543, "global_step": 522636, "epoch": 6296} {"train_loss": -27.453998565673828, "global_step": 522637, "epoch": 6296} {"train_loss": -27.748279571533203, "global_step": 522638, "epoch": 6296} {"train_loss": -28.0751895904541, "global_step": 522639, "epoch": 6296} {"train_loss": -27.394254684448242, "global_step": 522640, "epoch": 6296} {"train_loss": -27.9890079498291, "global_step": 522641, "epoch": 6296} {"train_loss": -28.006315231323242, "global_step": 522642, "epoch": 6296} {"train_loss": -27.587451934814453, "global_step": 522643, "epoch": 6296} {"train_loss": -27.723875045776367, "global_step": 522644, "epoch": 6296} {"train_loss": -27.85395622253418, "global_step": 522645, "epoch": 6296} {"train_loss": -27.67437744140625, "global_step": 522646, "epoch": 6296} {"train_loss": -27.66867446899414, "global_step": 522647, "epoch": 6296} {"train_loss": -27.7773494720459, "global_step": 522648, "epoch": 6296} {"train_loss": -27.902435302734375, "global_step": 522649, "epoch": 6296} {"train_loss": -27.470977553402086, "global_step": 522650, "epoch": 6296, "val_loss": 6671220.5} {"train_loss": -27.606550216674805, "global_step": 522651, "epoch": 6297} {"train_loss": -27.514816284179688, "global_step": 522652, "epoch": 6297} {"train_loss": -27.469308853149414, "global_step": 522653, "epoch": 6297} {"train_loss": -27.33173942565918, "global_step": 522654, "epoch": 6297} {"train_loss": -27.085391998291016, "global_step": 522655, "epoch": 6297} {"train_loss": -27.734134674072266, "global_step": 522656, "epoch": 6297} {"train_loss": -27.609724044799805, "global_step": 522657, "epoch": 6297} {"train_loss": -27.473560333251953, "global_step": 522658, "epoch": 6297} {"train_loss": -27.494903564453125, "global_step": 522659, "epoch": 6297} {"train_loss": -27.549304962158203, "global_step": 522660, "epoch": 6297} {"train_loss": -27.053556442260742, "global_step": 522661, "epoch": 6297} {"train_loss": -26.90996742248535, "global_step": 522662, "epoch": 6297} {"train_loss": -27.304813385009766, "global_step": 522663, "epoch": 6297} {"train_loss": -27.556568145751953, "global_step": 522664, "epoch": 6297} {"train_loss": -27.37883949279785, "global_step": 522665, "epoch": 6297} {"train_loss": -26.98725700378418, "global_step": 522666, "epoch": 6297} {"train_loss": -27.61116600036621, "global_step": 522667, "epoch": 6297} {"train_loss": -27.387943267822266, "global_step": 522668, "epoch": 6297} {"train_loss": -27.317840576171875, "global_step": 522669, "epoch": 6297} {"train_loss": -27.592914581298828, "global_step": 522670, "epoch": 6297} {"train_loss": -27.096683502197266, "global_step": 522671, "epoch": 6297} {"train_loss": -28.059661865234375, "global_step": 522672, "epoch": 6297} {"train_loss": -26.871122360229492, "global_step": 522673, "epoch": 6297} {"train_loss": -27.649484634399414, "global_step": 522674, "epoch": 6297} {"train_loss": -26.928491592407227, "global_step": 522675, "epoch": 6297} {"train_loss": -27.116119384765625, "global_step": 522676, "epoch": 6297} {"train_loss": -27.576679229736328, "global_step": 522677, "epoch": 6297} {"train_loss": -27.351776123046875, "global_step": 522678, "epoch": 6297} {"train_loss": -27.58039665222168, "global_step": 522679, "epoch": 6297} {"train_loss": -27.46192741394043, "global_step": 522680, "epoch": 6297} {"train_loss": -27.513427734375, "global_step": 522681, "epoch": 6297} {"train_loss": -27.563886642456055, "global_step": 522682, "epoch": 6297} {"train_loss": -27.692047119140625, "global_step": 522683, "epoch": 6297} {"train_loss": -27.438302993774414, "global_step": 522684, "epoch": 6297} {"train_loss": -27.579059600830078, "global_step": 522685, "epoch": 6297} {"train_loss": -27.826475143432617, "global_step": 522686, "epoch": 6297} {"train_loss": -27.51677894592285, "global_step": 522687, "epoch": 6297} {"train_loss": -27.265869140625, "global_step": 522688, "epoch": 6297} {"train_loss": -27.518360137939453, "global_step": 522689, "epoch": 6297} {"train_loss": -27.792129516601562, "global_step": 522690, "epoch": 6297} {"train_loss": -27.650842666625977, "global_step": 522691, "epoch": 6297} {"train_loss": -27.776952743530273, "global_step": 522692, "epoch": 6297} {"train_loss": -27.907272338867188, "global_step": 522693, "epoch": 6297} {"train_loss": -27.74763298034668, "global_step": 522694, "epoch": 6297} {"train_loss": -28.234806060791016, "global_step": 522695, "epoch": 6297} {"train_loss": -27.74846839904785, "global_step": 522696, "epoch": 6297} {"train_loss": -27.39346694946289, "global_step": 522697, "epoch": 6297} {"train_loss": -27.77902603149414, "global_step": 522698, "epoch": 6297} {"train_loss": -27.342422485351562, "global_step": 522699, "epoch": 6297} {"train_loss": -27.44019889831543, "global_step": 522700, "epoch": 6297} {"train_loss": -27.33387565612793, "global_step": 522701, "epoch": 6297} {"train_loss": -27.69413185119629, "global_step": 522702, "epoch": 6297} {"train_loss": -27.533788681030273, "global_step": 522703, "epoch": 6297} {"train_loss": -27.5345458984375, "global_step": 522704, "epoch": 6297} {"train_loss": -27.64641761779785, "global_step": 522705, "epoch": 6297} {"train_loss": -27.605478286743164, "global_step": 522706, "epoch": 6297} {"train_loss": -27.257307052612305, "global_step": 522707, "epoch": 6297} {"train_loss": -27.699981689453125, "global_step": 522708, "epoch": 6297} {"train_loss": -27.621158599853516, "global_step": 522709, "epoch": 6297} {"train_loss": -27.360092163085938, "global_step": 522710, "epoch": 6297} {"train_loss": -27.45977210998535, "global_step": 522711, "epoch": 6297} {"train_loss": -27.775604248046875, "global_step": 522712, "epoch": 6297} {"train_loss": -27.608112335205078, "global_step": 522713, "epoch": 6297} {"train_loss": -27.4636287689209, "global_step": 522714, "epoch": 6297} {"train_loss": -27.42132568359375, "global_step": 522715, "epoch": 6297} {"train_loss": -27.59523582458496, "global_step": 522716, "epoch": 6297} {"train_loss": -27.401580810546875, "global_step": 522717, "epoch": 6297} {"train_loss": -27.424360275268555, "global_step": 522718, "epoch": 6297} {"train_loss": -27.480356216430664, "global_step": 522719, "epoch": 6297} {"train_loss": -27.488988876342773, "global_step": 522720, "epoch": 6297} {"train_loss": -27.588361740112305, "global_step": 522721, "epoch": 6297} {"train_loss": -27.5687313079834, "global_step": 522722, "epoch": 6297} {"train_loss": -27.334653854370117, "global_step": 522723, "epoch": 6297} {"train_loss": -27.471044540405273, "global_step": 522724, "epoch": 6297} {"train_loss": -27.457494735717773, "global_step": 522725, "epoch": 6297} {"train_loss": -27.67852210998535, "global_step": 522726, "epoch": 6297} {"train_loss": -27.245920181274414, "global_step": 522727, "epoch": 6297} {"train_loss": -27.155969619750977, "global_step": 522728, "epoch": 6297} {"train_loss": -27.079578399658203, "global_step": 522729, "epoch": 6297} {"train_loss": -27.57709312438965, "global_step": 522730, "epoch": 6297} {"train_loss": -27.5629940032959, "global_step": 522731, "epoch": 6297} {"train_loss": -27.24471092224121, "global_step": 522732, "epoch": 6297} {"train_loss": -27.480874670557228, "global_step": 522733, "epoch": 6297, "val_loss": 6657458.5} {"train_loss": -26.704620361328125, "global_step": 522734, "epoch": 6298} {"train_loss": -27.115869522094727, "global_step": 522735, "epoch": 6298} {"train_loss": -27.19891929626465, "global_step": 522736, "epoch": 6298} {"train_loss": -26.43963050842285, "global_step": 522737, "epoch": 6298} {"train_loss": -26.812585830688477, "global_step": 522738, "epoch": 6298} {"train_loss": -26.82881736755371, "global_step": 522739, "epoch": 6298} {"train_loss": -26.749059677124023, "global_step": 522740, "epoch": 6298} {"train_loss": -27.024702072143555, "global_step": 522741, "epoch": 6298} {"train_loss": -27.02496910095215, "global_step": 522742, "epoch": 6298} {"train_loss": -27.006006240844727, "global_step": 522743, "epoch": 6298} {"train_loss": -26.87714195251465, "global_step": 522744, "epoch": 6298} {"train_loss": -27.362186431884766, "global_step": 522745, "epoch": 6298} {"train_loss": -27.085983276367188, "global_step": 522746, "epoch": 6298} {"train_loss": -27.159605026245117, "global_step": 522747, "epoch": 6298} {"train_loss": -26.989404678344727, "global_step": 522748, "epoch": 6298} {"train_loss": -27.575841903686523, "global_step": 522749, "epoch": 6298} {"train_loss": -27.28690528869629, "global_step": 522750, "epoch": 6298} {"train_loss": -27.159149169921875, "global_step": 522751, "epoch": 6298} {"train_loss": -27.08819007873535, "global_step": 522752, "epoch": 6298} {"train_loss": -27.57329750061035, "global_step": 522753, "epoch": 6298} {"train_loss": -27.124048233032227, "global_step": 522754, "epoch": 6298} {"train_loss": -27.65924072265625, "global_step": 522755, "epoch": 6298} {"train_loss": -27.379150390625, "global_step": 522756, "epoch": 6298} {"train_loss": -27.4644775390625, "global_step": 522757, "epoch": 6298} {"train_loss": -27.294864654541016, "global_step": 522758, "epoch": 6298} {"train_loss": -27.45818519592285, "global_step": 522759, "epoch": 6298} {"train_loss": -27.020429611206055, "global_step": 522760, "epoch": 6298} {"train_loss": -27.525287628173828, "global_step": 522761, "epoch": 6298} {"train_loss": -27.59796142578125, "global_step": 522762, "epoch": 6298} {"train_loss": -27.623117446899414, "global_step": 522763, "epoch": 6298} {"train_loss": -27.707656860351562, "global_step": 522764, "epoch": 6298} {"train_loss": -27.47743034362793, "global_step": 522765, "epoch": 6298} {"train_loss": -27.39715003967285, "global_step": 522766, "epoch": 6298} {"train_loss": -27.286645889282227, "global_step": 522767, "epoch": 6298} {"train_loss": -27.575998306274414, "global_step": 522768, "epoch": 6298} {"train_loss": -27.2752742767334, "global_step": 522769, "epoch": 6298} {"train_loss": -27.615680694580078, "global_step": 522770, "epoch": 6298} {"train_loss": -27.456113815307617, "global_step": 522771, "epoch": 6298} {"train_loss": -27.84417152404785, "global_step": 522772, "epoch": 6298} {"train_loss": -27.350881576538086, "global_step": 522773, "epoch": 6298} {"train_loss": -27.60917091369629, "global_step": 522774, "epoch": 6298} {"train_loss": -27.6449031829834, "global_step": 522775, "epoch": 6298} {"train_loss": -27.65388298034668, "global_step": 522776, "epoch": 6298} {"train_loss": -27.916662216186523, "global_step": 522777, "epoch": 6298} {"train_loss": -27.664899826049805, "global_step": 522778, "epoch": 6298} {"train_loss": -27.861957550048828, "global_step": 522779, "epoch": 6298} {"train_loss": -27.3233585357666, "global_step": 522780, "epoch": 6298} {"train_loss": -27.8279972076416, "global_step": 522781, "epoch": 6298} {"train_loss": -27.825592041015625, "global_step": 522782, "epoch": 6298} {"train_loss": -27.76214027404785, "global_step": 522783, "epoch": 6298} {"train_loss": -27.88433265686035, "global_step": 522784, "epoch": 6298} {"train_loss": -27.401874542236328, "global_step": 522785, "epoch": 6298} {"train_loss": -27.816308975219727, "global_step": 522786, "epoch": 6298} {"train_loss": -27.63623046875, "global_step": 522787, "epoch": 6298} {"train_loss": -27.234777450561523, "global_step": 522788, "epoch": 6298} {"train_loss": -27.830535888671875, "global_step": 522789, "epoch": 6298} {"train_loss": -28.152875900268555, "global_step": 522790, "epoch": 6298} {"train_loss": -27.737491607666016, "global_step": 522791, "epoch": 6298} {"train_loss": -27.780826568603516, "global_step": 522792, "epoch": 6298} {"train_loss": -27.863805770874023, "global_step": 522793, "epoch": 6298} {"train_loss": -27.473037719726562, "global_step": 522794, "epoch": 6298} {"train_loss": -28.14716148376465, "global_step": 522795, "epoch": 6298} {"train_loss": -27.864225387573242, "global_step": 522796, "epoch": 6298} {"train_loss": -27.614978790283203, "global_step": 522797, "epoch": 6298} {"train_loss": -27.53571128845215, "global_step": 522798, "epoch": 6298} {"train_loss": -27.413619995117188, "global_step": 522799, "epoch": 6298} {"train_loss": -27.77266502380371, "global_step": 522800, "epoch": 6298} {"train_loss": -27.278955459594727, "global_step": 522801, "epoch": 6298} {"train_loss": -27.928518295288086, "global_step": 522802, "epoch": 6298} {"train_loss": -27.484365463256836, "global_step": 522803, "epoch": 6298} {"train_loss": -27.56256675720215, "global_step": 522804, "epoch": 6298} {"train_loss": -27.303220748901367, "global_step": 522805, "epoch": 6298} {"train_loss": -26.999357223510742, "global_step": 522806, "epoch": 6298} {"train_loss": -27.346271514892578, "global_step": 522807, "epoch": 6298} {"train_loss": -27.061758041381836, "global_step": 522808, "epoch": 6298} {"train_loss": -27.719541549682617, "global_step": 522809, "epoch": 6298} {"train_loss": -26.890790939331055, "global_step": 522810, "epoch": 6298} {"train_loss": -26.016889572143555, "global_step": 522811, "epoch": 6298} {"train_loss": -26.278528213500977, "global_step": 522812, "epoch": 6298} {"train_loss": -27.320112228393555, "global_step": 522813, "epoch": 6298} {"train_loss": -27.438495635986328, "global_step": 522814, "epoch": 6298} {"train_loss": -26.762882232666016, "global_step": 522815, "epoch": 6298} {"train_loss": -27.409869228500916, "global_step": 522816, "epoch": 6298, "val_loss": 6626304.0} {"train_loss": -24.37211036682129, "global_step": 522817, "epoch": 6299} {"train_loss": -25.6009464263916, "global_step": 522818, "epoch": 6299} {"train_loss": -25.325366973876953, "global_step": 522819, "epoch": 6299} {"train_loss": -26.16591453552246, "global_step": 522820, "epoch": 6299} {"train_loss": -25.17675018310547, "global_step": 522821, "epoch": 6299} {"train_loss": -26.055667877197266, "global_step": 522822, "epoch": 6299} {"train_loss": -25.708044052124023, "global_step": 522823, "epoch": 6299} {"train_loss": -26.09340476989746, "global_step": 522824, "epoch": 6299} {"train_loss": -26.62872314453125, "global_step": 522825, "epoch": 6299} {"train_loss": -25.988744735717773, "global_step": 522826, "epoch": 6299} {"train_loss": -26.442615509033203, "global_step": 522827, "epoch": 6299} {"train_loss": -26.470874786376953, "global_step": 522828, "epoch": 6299} {"train_loss": -26.579853057861328, "global_step": 522829, "epoch": 6299} {"train_loss": -26.379846572875977, "global_step": 522830, "epoch": 6299} {"train_loss": -26.684158325195312, "global_step": 522831, "epoch": 6299} {"train_loss": -26.601972579956055, "global_step": 522832, "epoch": 6299} {"train_loss": -26.357389450073242, "global_step": 522833, "epoch": 6299} {"train_loss": -26.572998046875, "global_step": 522834, "epoch": 6299} {"train_loss": -26.76812744140625, "global_step": 522835, "epoch": 6299} {"train_loss": -26.850149154663086, "global_step": 522836, "epoch": 6299} {"train_loss": -26.74456787109375, "global_step": 522837, "epoch": 6299} {"train_loss": -27.07022476196289, "global_step": 522838, "epoch": 6299} {"train_loss": -26.716205596923828, "global_step": 522839, "epoch": 6299} {"train_loss": -26.87290382385254, "global_step": 522840, "epoch": 6299} {"train_loss": -27.3115291595459, "global_step": 522841, "epoch": 6299} {"train_loss": -26.592199325561523, "global_step": 522842, "epoch": 6299} {"train_loss": -26.96538734436035, "global_step": 522843, "epoch": 6299} {"train_loss": -27.154815673828125, "global_step": 522844, "epoch": 6299} {"train_loss": -27.3188419342041, "global_step": 522845, "epoch": 6299} {"train_loss": -27.56159782409668, "global_step": 522846, "epoch": 6299} {"train_loss": -26.652036666870117, "global_step": 522847, "epoch": 6299} {"train_loss": -27.224042892456055, "global_step": 522848, "epoch": 6299} {"train_loss": -27.46238136291504, "global_step": 522849, "epoch": 6299} {"train_loss": -27.22109031677246, "global_step": 522850, "epoch": 6299} {"train_loss": -27.371076583862305, "global_step": 522851, "epoch": 6299} {"train_loss": -27.500873565673828, "global_step": 522852, "epoch": 6299} {"train_loss": -27.40309715270996, "global_step": 522853, "epoch": 6299} {"train_loss": -27.273242950439453, "global_step": 522854, "epoch": 6299} {"train_loss": -27.650455474853516, "global_step": 522855, "epoch": 6299} {"train_loss": -27.22402000427246, "global_step": 522856, "epoch": 6299} {"train_loss": -27.38901710510254, "global_step": 522857, "epoch": 6299} {"train_loss": -27.885034561157227, "global_step": 522858, "epoch": 6299} {"train_loss": -27.524866104125977, "global_step": 522859, "epoch": 6299} {"train_loss": -27.78188133239746, "global_step": 522860, "epoch": 6299} {"train_loss": -27.528064727783203, "global_step": 522861, "epoch": 6299} {"train_loss": -27.746992111206055, "global_step": 522862, "epoch": 6299} {"train_loss": -27.451993942260742, "global_step": 522863, "epoch": 6299} {"train_loss": -27.813369750976562, "global_step": 522864, "epoch": 6299} {"train_loss": -27.558435440063477, "global_step": 522865, "epoch": 6299} {"train_loss": -27.652698516845703, "global_step": 522866, "epoch": 6299} {"train_loss": -27.133581161499023, "global_step": 522867, "epoch": 6299} {"train_loss": -27.66719627380371, "global_step": 522868, "epoch": 6299} {"train_loss": -27.740081787109375, "global_step": 522869, "epoch": 6299} {"train_loss": -27.474206924438477, "global_step": 522870, "epoch": 6299} {"train_loss": -27.784650802612305, "global_step": 522871, "epoch": 6299} {"train_loss": -27.901453018188477, "global_step": 522872, "epoch": 6299} {"train_loss": -27.5867977142334, "global_step": 522873, "epoch": 6299} {"train_loss": -27.55659294128418, "global_step": 522874, "epoch": 6299} {"train_loss": -27.963205337524414, "global_step": 522875, "epoch": 6299} {"train_loss": -27.856924057006836, "global_step": 522876, "epoch": 6299} {"train_loss": -27.640018463134766, "global_step": 522877, "epoch": 6299} {"train_loss": -27.524383544921875, "global_step": 522878, "epoch": 6299} {"train_loss": -27.51459312438965, "global_step": 522879, "epoch": 6299} {"train_loss": -27.936145782470703, "global_step": 522880, "epoch": 6299} {"train_loss": -27.737781524658203, "global_step": 522881, "epoch": 6299} {"train_loss": -27.976531982421875, "global_step": 522882, "epoch": 6299} {"train_loss": -27.640777587890625, "global_step": 522883, "epoch": 6299} {"train_loss": -27.580081939697266, "global_step": 522884, "epoch": 6299} {"train_loss": -27.81540870666504, "global_step": 522885, "epoch": 6299} {"train_loss": -27.97479248046875, "global_step": 522886, "epoch": 6299} {"train_loss": -27.735122680664062, "global_step": 522887, "epoch": 6299} {"train_loss": -27.592863082885742, "global_step": 522888, "epoch": 6299} {"train_loss": -27.59002685546875, "global_step": 522889, "epoch": 6299} {"train_loss": -27.498493194580078, "global_step": 522890, "epoch": 6299} {"train_loss": -27.726606369018555, "global_step": 522891, "epoch": 6299} {"train_loss": -27.7604923248291, "global_step": 522892, "epoch": 6299} {"train_loss": -27.95285987854004, "global_step": 522893, "epoch": 6299} {"train_loss": -27.4561824798584, "global_step": 522894, "epoch": 6299} {"train_loss": -27.868330001831055, "global_step": 522895, "epoch": 6299} {"train_loss": -27.79072380065918, "global_step": 522896, "epoch": 6299} {"train_loss": -27.512054443359375, "global_step": 522897, "epoch": 6299} {"train_loss": -27.696399688720703, "global_step": 522898, "epoch": 6299} {"train_loss": -27.183306728500916, "global_step": 522899, "epoch": 6299, "val_loss": 6672644.0} {"train_loss": -26.95926856994629, "global_step": 522900, "epoch": 6300} {"train_loss": -27.51416015625, "global_step": 522901, "epoch": 6300} {"train_loss": -26.89227294921875, "global_step": 522902, "epoch": 6300} {"train_loss": -27.270727157592773, "global_step": 522903, "epoch": 6300} {"train_loss": -27.339004516601562, "global_step": 522904, "epoch": 6300} {"train_loss": -27.736799240112305, "global_step": 522905, "epoch": 6300} {"train_loss": -27.63193702697754, "global_step": 522906, "epoch": 6300} {"train_loss": -27.69868278503418, "global_step": 522907, "epoch": 6300} {"train_loss": -27.345600128173828, "global_step": 522908, "epoch": 6300} {"train_loss": -27.0790958404541, "global_step": 522909, "epoch": 6300} {"train_loss": -27.4119930267334, "global_step": 522910, "epoch": 6300} {"train_loss": -27.06256675720215, "global_step": 522911, "epoch": 6300} {"train_loss": -27.655054092407227, "global_step": 522912, "epoch": 6300} {"train_loss": -27.36052894592285, "global_step": 522913, "epoch": 6300} {"train_loss": -27.585580825805664, "global_step": 522914, "epoch": 6300} {"train_loss": -27.337961196899414, "global_step": 522915, "epoch": 6300} {"train_loss": -27.6456241607666, "global_step": 522916, "epoch": 6300} {"train_loss": -27.74213218688965, "global_step": 522917, "epoch": 6300} {"train_loss": -27.496557235717773, "global_step": 522918, "epoch": 6300} {"train_loss": -27.523284912109375, "global_step": 522919, "epoch": 6300} {"train_loss": -27.519760131835938, "global_step": 522920, "epoch": 6300} {"train_loss": -27.5445556640625, "global_step": 522921, "epoch": 6300} {"train_loss": -27.490936279296875, "global_step": 522922, "epoch": 6300} {"train_loss": -27.400583267211914, "global_step": 522923, "epoch": 6300} {"train_loss": -27.520050048828125, "global_step": 522924, "epoch": 6300} {"train_loss": -27.799707412719727, "global_step": 522925, "epoch": 6300} {"train_loss": -27.594898223876953, "global_step": 522926, "epoch": 6300} {"train_loss": -27.582128524780273, "global_step": 522927, "epoch": 6300} {"train_loss": -27.525381088256836, "global_step": 522928, "epoch": 6300} {"train_loss": -27.394580841064453, "global_step": 522929, "epoch": 6300} {"train_loss": -27.640539169311523, "global_step": 522930, "epoch": 6300} {"train_loss": -27.824737548828125, "global_step": 522931, "epoch": 6300} {"train_loss": -27.328290939331055, "global_step": 522932, "epoch": 6300} {"train_loss": -27.692230224609375, "global_step": 522933, "epoch": 6300} {"train_loss": -27.713464736938477, "global_step": 522934, "epoch": 6300} {"train_loss": -27.91552734375, "global_step": 522935, "epoch": 6300} {"train_loss": -28.096057891845703, "global_step": 522936, "epoch": 6300} {"train_loss": -27.876190185546875, "global_step": 522937, "epoch": 6300} {"train_loss": -27.932950973510742, "global_step": 522938, "epoch": 6300} {"train_loss": -28.07708740234375, "global_step": 522939, "epoch": 6300} {"train_loss": -27.690099716186523, "global_step": 522940, "epoch": 6300} {"train_loss": -27.828824996948242, "global_step": 522941, "epoch": 6300} {"train_loss": -27.63216209411621, "global_step": 522942, "epoch": 6300} {"train_loss": -27.433807373046875, "global_step": 522943, "epoch": 6300} {"train_loss": -27.062671661376953, "global_step": 522944, "epoch": 6300} {"train_loss": -27.325641632080078, "global_step": 522945, "epoch": 6300} {"train_loss": -27.298526763916016, "global_step": 522946, "epoch": 6300} {"train_loss": -27.392669677734375, "global_step": 522947, "epoch": 6300} {"train_loss": -26.970417022705078, "global_step": 522948, "epoch": 6300} {"train_loss": -27.402799606323242, "global_step": 522949, "epoch": 6300} {"train_loss": -27.72306251525879, "global_step": 522950, "epoch": 6300} {"train_loss": -27.144811630249023, "global_step": 522951, "epoch": 6300} {"train_loss": -27.503482818603516, "global_step": 522952, "epoch": 6300} {"train_loss": -27.237234115600586, "global_step": 522953, "epoch": 6300} {"train_loss": -27.471298217773438, "global_step": 522954, "epoch": 6300} {"train_loss": -27.626529693603516, "global_step": 522955, "epoch": 6300} {"train_loss": -27.789335250854492, "global_step": 522956, "epoch": 6300} {"train_loss": -27.51738929748535, "global_step": 522957, "epoch": 6300} {"train_loss": -27.58937644958496, "global_step": 522958, "epoch": 6300} {"train_loss": -27.69331932067871, "global_step": 522959, "epoch": 6300} {"train_loss": -27.73682975769043, "global_step": 522960, "epoch": 6300} {"train_loss": -27.239709854125977, "global_step": 522961, "epoch": 6300} {"train_loss": -27.49090003967285, "global_step": 522962, "epoch": 6300} {"train_loss": -27.956663131713867, "global_step": 522963, "epoch": 6300} {"train_loss": -27.766489028930664, "global_step": 522964, "epoch": 6300} {"train_loss": -27.845605850219727, "global_step": 522965, "epoch": 6300} {"train_loss": -27.390777587890625, "global_step": 522966, "epoch": 6300} {"train_loss": -27.482501983642578, "global_step": 522967, "epoch": 6300} {"train_loss": -27.5985107421875, "global_step": 522968, "epoch": 6300} {"train_loss": -27.548521041870117, "global_step": 522969, "epoch": 6300} {"train_loss": -27.466703414916992, "global_step": 522970, "epoch": 6300} {"train_loss": -27.53888511657715, "global_step": 522971, "epoch": 6300} {"train_loss": -27.857961654663086, "global_step": 522972, "epoch": 6300} {"train_loss": -27.8364200592041, "global_step": 522973, "epoch": 6300} {"train_loss": -27.68075942993164, "global_step": 522974, "epoch": 6300} {"train_loss": -27.32373046875, "global_step": 522975, "epoch": 6300} {"train_loss": -27.656686782836914, "global_step": 522976, "epoch": 6300} {"train_loss": -27.45033836364746, "global_step": 522977, "epoch": 6300} {"train_loss": -28.039148330688477, "global_step": 522978, "epoch": 6300} {"train_loss": -27.825897216796875, "global_step": 522979, "epoch": 6300} {"train_loss": -27.937347412109375, "global_step": 522980, "epoch": 6300} {"train_loss": -27.677663803100586, "global_step": 522981, "epoch": 6300} {"train_loss": -27.55371597014278, "global_step": 522982, "epoch": 6300, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9090909090909091, "val_loss": 6610004.5} {"train_loss": -27.163055419921875, "global_step": 522983, "epoch": 6301} {"train_loss": -26.607275009155273, "global_step": 522984, "epoch": 6301} {"train_loss": -26.722061157226562, "global_step": 522985, "epoch": 6301} {"train_loss": -25.978052139282227, "global_step": 522986, "epoch": 6301} {"train_loss": -25.900293350219727, "global_step": 522987, "epoch": 6301} {"train_loss": -26.572986602783203, "global_step": 522988, "epoch": 6301} {"train_loss": -27.299726486206055, "global_step": 522989, "epoch": 6301} {"train_loss": -26.734119415283203, "global_step": 522990, "epoch": 6301} {"train_loss": -26.800617218017578, "global_step": 522991, "epoch": 6301} {"train_loss": -27.00851821899414, "global_step": 522992, "epoch": 6301} {"train_loss": -26.795074462890625, "global_step": 522993, "epoch": 6301} {"train_loss": -26.930749893188477, "global_step": 522994, "epoch": 6301} {"train_loss": -27.102270126342773, "global_step": 522995, "epoch": 6301} {"train_loss": -27.155075073242188, "global_step": 522996, "epoch": 6301} {"train_loss": -26.641681671142578, "global_step": 522997, "epoch": 6301} {"train_loss": -26.740478515625, "global_step": 522998, "epoch": 6301} {"train_loss": -27.225873947143555, "global_step": 522999, "epoch": 6301} {"train_loss": -27.202106475830078, "global_step": 523000, "epoch": 6301} {"train_loss": -27.419775009155273, "global_step": 523001, "epoch": 6301} {"train_loss": -26.608489990234375, "global_step": 523002, "epoch": 6301} {"train_loss": -27.38270378112793, "global_step": 523003, "epoch": 6301} {"train_loss": -27.22163200378418, "global_step": 523004, "epoch": 6301} {"train_loss": -27.184356689453125, "global_step": 523005, "epoch": 6301} {"train_loss": -27.324466705322266, "global_step": 523006, "epoch": 6301} {"train_loss": -27.495203018188477, "global_step": 523007, "epoch": 6301} {"train_loss": -27.64859962463379, "global_step": 523008, "epoch": 6301} {"train_loss": -27.2484188079834, "global_step": 523009, "epoch": 6301} {"train_loss": -27.710752487182617, "global_step": 523010, "epoch": 6301} {"train_loss": -27.558887481689453, "global_step": 523011, "epoch": 6301} {"train_loss": -27.577428817749023, "global_step": 523012, "epoch": 6301} {"train_loss": -27.520572662353516, "global_step": 523013, "epoch": 6301} {"train_loss": -27.4755916595459, "global_step": 523014, "epoch": 6301} {"train_loss": -27.821704864501953, "global_step": 523015, "epoch": 6301} {"train_loss": -27.468114852905273, "global_step": 523016, "epoch": 6301} {"train_loss": -27.818958282470703, "global_step": 523017, "epoch": 6301} {"train_loss": -27.5137996673584, "global_step": 523018, "epoch": 6301} {"train_loss": -27.589405059814453, "global_step": 523019, "epoch": 6301} {"train_loss": -27.29656410217285, "global_step": 523020, "epoch": 6301} {"train_loss": -27.426599502563477, "global_step": 523021, "epoch": 6301} {"train_loss": -27.537763595581055, "global_step": 523022, "epoch": 6301} {"train_loss": -27.806753158569336, "global_step": 523023, "epoch": 6301} {"train_loss": -27.299854278564453, "global_step": 523024, "epoch": 6301} {"train_loss": -27.472461700439453, "global_step": 523025, "epoch": 6301} {"train_loss": -27.7210636138916, "global_step": 523026, "epoch": 6301} {"train_loss": -27.171659469604492, "global_step": 523027, "epoch": 6301} {"train_loss": -27.447986602783203, "global_step": 523028, "epoch": 6301} {"train_loss": -27.427143096923828, "global_step": 523029, "epoch": 6301} {"train_loss": -28.1123104095459, "global_step": 523030, "epoch": 6301} {"train_loss": -27.801660537719727, "global_step": 523031, "epoch": 6301} {"train_loss": -27.67703628540039, "global_step": 523032, "epoch": 6301} {"train_loss": -27.774133682250977, "global_step": 523033, "epoch": 6301} {"train_loss": -27.943891525268555, "global_step": 523034, "epoch": 6301} {"train_loss": -27.3494815826416, "global_step": 523035, "epoch": 6301} {"train_loss": -28.071765899658203, "global_step": 523036, "epoch": 6301} {"train_loss": -27.954334259033203, "global_step": 523037, "epoch": 6301} {"train_loss": -27.44300651550293, "global_step": 523038, "epoch": 6301} {"train_loss": -27.707624435424805, "global_step": 523039, "epoch": 6301} {"train_loss": -27.8599853515625, "global_step": 523040, "epoch": 6301} {"train_loss": -27.621047973632812, "global_step": 523041, "epoch": 6301} {"train_loss": -27.875595092773438, "global_step": 523042, "epoch": 6301} {"train_loss": -27.90215492248535, "global_step": 523043, "epoch": 6301} {"train_loss": -27.750946044921875, "global_step": 523044, "epoch": 6301} {"train_loss": -27.5999813079834, "global_step": 523045, "epoch": 6301} {"train_loss": -27.866870880126953, "global_step": 523046, "epoch": 6301} {"train_loss": -27.858198165893555, "global_step": 523047, "epoch": 6301} {"train_loss": -27.47298240661621, "global_step": 523048, "epoch": 6301} {"train_loss": -27.79303550720215, "global_step": 523049, "epoch": 6301} {"train_loss": -27.099328994750977, "global_step": 523050, "epoch": 6301} {"train_loss": -27.216312408447266, "global_step": 523051, "epoch": 6301} {"train_loss": -27.637609481811523, "global_step": 523052, "epoch": 6301} {"train_loss": -27.478012084960938, "global_step": 523053, "epoch": 6301} {"train_loss": -27.44504737854004, "global_step": 523054, "epoch": 6301} {"train_loss": -27.375, "global_step": 523055, "epoch": 6301} {"train_loss": -27.619983673095703, "global_step": 523056, "epoch": 6301} {"train_loss": -27.813156127929688, "global_step": 523057, "epoch": 6301} {"train_loss": -27.506942749023438, "global_step": 523058, "epoch": 6301} {"train_loss": -27.328033447265625, "global_step": 523059, "epoch": 6301} {"train_loss": -26.8127384185791, "global_step": 523060, "epoch": 6301} {"train_loss": -27.433700561523438, "global_step": 523061, "epoch": 6301} {"train_loss": -27.842008590698242, "global_step": 523062, "epoch": 6301} {"train_loss": -27.409875869750977, "global_step": 523063, "epoch": 6301} {"train_loss": -27.464380264282227, "global_step": 523064, "epoch": 6301} {"train_loss": -27.383626616144756, "global_step": 523065, "epoch": 6301, "val_loss": 6646367.0} {"train_loss": -27.257795333862305, "global_step": 523066, "epoch": 6302} {"train_loss": -26.151403427124023, "global_step": 523067, "epoch": 6302} {"train_loss": -27.062057495117188, "global_step": 523068, "epoch": 6302} {"train_loss": -26.42230224609375, "global_step": 523069, "epoch": 6302} {"train_loss": -26.762617111206055, "global_step": 523070, "epoch": 6302} {"train_loss": -26.865009307861328, "global_step": 523071, "epoch": 6302} {"train_loss": -26.21193504333496, "global_step": 523072, "epoch": 6302} {"train_loss": -26.872241973876953, "global_step": 523073, "epoch": 6302} {"train_loss": -26.576696395874023, "global_step": 523074, "epoch": 6302} {"train_loss": -26.583112716674805, "global_step": 523075, "epoch": 6302} {"train_loss": -26.6173038482666, "global_step": 523076, "epoch": 6302} {"train_loss": -26.895959854125977, "global_step": 523077, "epoch": 6302} {"train_loss": -26.790685653686523, "global_step": 523078, "epoch": 6302} {"train_loss": -26.695600509643555, "global_step": 523079, "epoch": 6302} {"train_loss": -27.0384464263916, "global_step": 523080, "epoch": 6302} {"train_loss": -27.057764053344727, "global_step": 523081, "epoch": 6302} {"train_loss": -27.321725845336914, "global_step": 523082, "epoch": 6302} {"train_loss": -26.74139976501465, "global_step": 523083, "epoch": 6302} {"train_loss": -26.765888214111328, "global_step": 523084, "epoch": 6302} {"train_loss": -26.90803337097168, "global_step": 523085, "epoch": 6302} {"train_loss": -27.077314376831055, "global_step": 523086, "epoch": 6302} {"train_loss": -26.77248191833496, "global_step": 523087, "epoch": 6302} {"train_loss": -27.42496109008789, "global_step": 523088, "epoch": 6302} {"train_loss": -27.25335121154785, "global_step": 523089, "epoch": 6302} {"train_loss": -27.29401969909668, "global_step": 523090, "epoch": 6302} {"train_loss": -27.35941505432129, "global_step": 523091, "epoch": 6302} {"train_loss": -27.20309829711914, "global_step": 523092, "epoch": 6302} {"train_loss": -27.303293228149414, "global_step": 523093, "epoch": 6302} {"train_loss": -27.298818588256836, "global_step": 523094, "epoch": 6302} {"train_loss": -27.314260482788086, "global_step": 523095, "epoch": 6302} {"train_loss": -27.20819091796875, "global_step": 523096, "epoch": 6302} {"train_loss": -27.42438316345215, "global_step": 523097, "epoch": 6302} {"train_loss": -27.442975997924805, "global_step": 523098, "epoch": 6302} {"train_loss": -27.2143611907959, "global_step": 523099, "epoch": 6302} {"train_loss": -27.153167724609375, "global_step": 523100, "epoch": 6302} {"train_loss": -27.571592330932617, "global_step": 523101, "epoch": 6302} {"train_loss": -27.46526527404785, "global_step": 523102, "epoch": 6302} {"train_loss": -27.214401245117188, "global_step": 523103, "epoch": 6302} {"train_loss": -27.118194580078125, "global_step": 523104, "epoch": 6302} {"train_loss": -27.693866729736328, "global_step": 523105, "epoch": 6302} {"train_loss": -27.690988540649414, "global_step": 523106, "epoch": 6302} {"train_loss": -27.397565841674805, "global_step": 523107, "epoch": 6302} {"train_loss": -27.631574630737305, "global_step": 523108, "epoch": 6302} {"train_loss": -28.147918701171875, "global_step": 523109, "epoch": 6302} {"train_loss": -27.30828857421875, "global_step": 523110, "epoch": 6302} {"train_loss": -27.743284225463867, "global_step": 523111, "epoch": 6302} {"train_loss": -27.645360946655273, "global_step": 523112, "epoch": 6302} {"train_loss": -27.766937255859375, "global_step": 523113, "epoch": 6302} {"train_loss": -27.55340576171875, "global_step": 523114, "epoch": 6302} {"train_loss": -27.48746109008789, "global_step": 523115, "epoch": 6302} {"train_loss": -27.532812118530273, "global_step": 523116, "epoch": 6302} {"train_loss": -27.370594024658203, "global_step": 523117, "epoch": 6302} {"train_loss": -26.882062911987305, "global_step": 523118, "epoch": 6302} {"train_loss": -27.028701782226562, "global_step": 523119, "epoch": 6302} {"train_loss": -26.81296730041504, "global_step": 523120, "epoch": 6302} {"train_loss": -27.357940673828125, "global_step": 523121, "epoch": 6302} {"train_loss": -27.394611358642578, "global_step": 523122, "epoch": 6302} {"train_loss": -27.492956161499023, "global_step": 523123, "epoch": 6302} {"train_loss": -26.930511474609375, "global_step": 523124, "epoch": 6302} {"train_loss": -27.250598907470703, "global_step": 523125, "epoch": 6302} {"train_loss": -27.450342178344727, "global_step": 523126, "epoch": 6302} {"train_loss": -27.47002601623535, "global_step": 523127, "epoch": 6302} {"train_loss": -27.70839500427246, "global_step": 523128, "epoch": 6302} {"train_loss": -27.37491798400879, "global_step": 523129, "epoch": 6302} {"train_loss": -27.460058212280273, "global_step": 523130, "epoch": 6302} {"train_loss": -27.33805274963379, "global_step": 523131, "epoch": 6302} {"train_loss": -27.705432891845703, "global_step": 523132, "epoch": 6302} {"train_loss": -27.751468658447266, "global_step": 523133, "epoch": 6302} {"train_loss": -27.295705795288086, "global_step": 523134, "epoch": 6302} {"train_loss": -27.11895751953125, "global_step": 523135, "epoch": 6302} {"train_loss": -27.59238624572754, "global_step": 523136, "epoch": 6302} {"train_loss": -27.67530632019043, "global_step": 523137, "epoch": 6302} {"train_loss": -27.543115615844727, "global_step": 523138, "epoch": 6302} {"train_loss": -27.664600372314453, "global_step": 523139, "epoch": 6302} {"train_loss": -27.758346557617188, "global_step": 523140, "epoch": 6302} {"train_loss": -27.54026222229004, "global_step": 523141, "epoch": 6302} {"train_loss": -27.609088897705078, "global_step": 523142, "epoch": 6302} {"train_loss": -27.27826499938965, "global_step": 523143, "epoch": 6302} {"train_loss": -27.807580947875977, "global_step": 523144, "epoch": 6302} {"train_loss": -27.708581924438477, "global_step": 523145, "epoch": 6302} {"train_loss": -27.216928482055664, "global_step": 523146, "epoch": 6302} {"train_loss": -27.569488525390625, "global_step": 523147, "epoch": 6302} {"train_loss": -27.25363012107022, "global_step": 523148, "epoch": 6302, "val_loss": 6490863.5} {"train_loss": -26.968847274780273, "global_step": 523149, "epoch": 6303} {"train_loss": -26.8698787689209, "global_step": 523150, "epoch": 6303} {"train_loss": -26.798608779907227, "global_step": 523151, "epoch": 6303} {"train_loss": -27.250112533569336, "global_step": 523152, "epoch": 6303} {"train_loss": -26.98822021484375, "global_step": 523153, "epoch": 6303} {"train_loss": -27.305994033813477, "global_step": 523154, "epoch": 6303} {"train_loss": -27.153059005737305, "global_step": 523155, "epoch": 6303} {"train_loss": -27.469579696655273, "global_step": 523156, "epoch": 6303} {"train_loss": -27.484846115112305, "global_step": 523157, "epoch": 6303} {"train_loss": -27.19573974609375, "global_step": 523158, "epoch": 6303} {"train_loss": -27.500486373901367, "global_step": 523159, "epoch": 6303} {"train_loss": -27.304901123046875, "global_step": 523160, "epoch": 6303} {"train_loss": -27.479843139648438, "global_step": 523161, "epoch": 6303} {"train_loss": -27.508161544799805, "global_step": 523162, "epoch": 6303} {"train_loss": -26.944665908813477, "global_step": 523163, "epoch": 6303} {"train_loss": -27.201129913330078, "global_step": 523164, "epoch": 6303} {"train_loss": -27.54676628112793, "global_step": 523165, "epoch": 6303} {"train_loss": -27.491613388061523, "global_step": 523166, "epoch": 6303} {"train_loss": -27.090543746948242, "global_step": 523167, "epoch": 6303} {"train_loss": -27.464033126831055, "global_step": 523168, "epoch": 6303} {"train_loss": -27.494779586791992, "global_step": 523169, "epoch": 6303} {"train_loss": -27.57819175720215, "global_step": 523170, "epoch": 6303} {"train_loss": -27.60458755493164, "global_step": 523171, "epoch": 6303} {"train_loss": -27.288562774658203, "global_step": 523172, "epoch": 6303} {"train_loss": -27.437255859375, "global_step": 523173, "epoch": 6303} {"train_loss": -27.583005905151367, "global_step": 523174, "epoch": 6303} {"train_loss": -27.44434928894043, "global_step": 523175, "epoch": 6303} {"train_loss": -27.644495010375977, "global_step": 523176, "epoch": 6303} {"train_loss": -27.71856117248535, "global_step": 523177, "epoch": 6303} {"train_loss": -27.662891387939453, "global_step": 523178, "epoch": 6303} {"train_loss": -27.790536880493164, "global_step": 523179, "epoch": 6303} {"train_loss": -27.587228775024414, "global_step": 523180, "epoch": 6303} {"train_loss": -27.95551109313965, "global_step": 523181, "epoch": 6303} {"train_loss": -27.450712203979492, "global_step": 523182, "epoch": 6303} {"train_loss": -27.7302303314209, "global_step": 523183, "epoch": 6303} {"train_loss": -27.897672653198242, "global_step": 523184, "epoch": 6303} {"train_loss": -27.8568058013916, "global_step": 523185, "epoch": 6303} {"train_loss": -27.5799503326416, "global_step": 523186, "epoch": 6303} {"train_loss": -27.61530876159668, "global_step": 523187, "epoch": 6303} {"train_loss": -27.6397705078125, "global_step": 523188, "epoch": 6303} {"train_loss": -27.918121337890625, "global_step": 523189, "epoch": 6303} {"train_loss": -27.99727439880371, "global_step": 523190, "epoch": 6303} {"train_loss": -27.84598159790039, "global_step": 523191, "epoch": 6303} {"train_loss": -27.78602409362793, "global_step": 523192, "epoch": 6303} {"train_loss": -27.60554313659668, "global_step": 523193, "epoch": 6303} {"train_loss": -27.241897583007812, "global_step": 523194, "epoch": 6303} {"train_loss": -27.79121971130371, "global_step": 523195, "epoch": 6303} {"train_loss": -27.5820369720459, "global_step": 523196, "epoch": 6303} {"train_loss": -27.60394859313965, "global_step": 523197, "epoch": 6303} {"train_loss": -27.762836456298828, "global_step": 523198, "epoch": 6303} {"train_loss": -27.422353744506836, "global_step": 523199, "epoch": 6303} {"train_loss": -28.060392379760742, "global_step": 523200, "epoch": 6303} {"train_loss": -27.60841941833496, "global_step": 523201, "epoch": 6303} {"train_loss": -27.660369873046875, "global_step": 523202, "epoch": 6303} {"train_loss": -27.24226188659668, "global_step": 523203, "epoch": 6303} {"train_loss": -27.38873863220215, "global_step": 523204, "epoch": 6303} {"train_loss": -28.020889282226562, "global_step": 523205, "epoch": 6303} {"train_loss": -27.30364418029785, "global_step": 523206, "epoch": 6303} {"train_loss": -27.526350021362305, "global_step": 523207, "epoch": 6303} {"train_loss": -27.856115341186523, "global_step": 523208, "epoch": 6303} {"train_loss": -27.73414421081543, "global_step": 523209, "epoch": 6303} {"train_loss": -27.674270629882812, "global_step": 523210, "epoch": 6303} {"train_loss": -27.413908004760742, "global_step": 523211, "epoch": 6303} {"train_loss": -27.7093563079834, "global_step": 523212, "epoch": 6303} {"train_loss": -27.228595733642578, "global_step": 523213, "epoch": 6303} {"train_loss": -27.056814193725586, "global_step": 523214, "epoch": 6303} {"train_loss": -27.447301864624023, "global_step": 523215, "epoch": 6303} {"train_loss": -27.24698829650879, "global_step": 523216, "epoch": 6303} {"train_loss": -27.093496322631836, "global_step": 523217, "epoch": 6303} {"train_loss": -27.5875244140625, "global_step": 523218, "epoch": 6303} {"train_loss": -27.961530685424805, "global_step": 523219, "epoch": 6303} {"train_loss": -27.285053253173828, "global_step": 523220, "epoch": 6303} {"train_loss": -27.032733917236328, "global_step": 523221, "epoch": 6303} {"train_loss": -27.41192054748535, "global_step": 523222, "epoch": 6303} {"train_loss": -27.422712326049805, "global_step": 523223, "epoch": 6303} {"train_loss": -27.492450714111328, "global_step": 523224, "epoch": 6303} {"train_loss": -27.795032501220703, "global_step": 523225, "epoch": 6303} {"train_loss": -27.600357055664062, "global_step": 523226, "epoch": 6303} {"train_loss": -27.42585563659668, "global_step": 523227, "epoch": 6303} {"train_loss": -27.490331649780273, "global_step": 523228, "epoch": 6303} {"train_loss": -27.417255401611328, "global_step": 523229, "epoch": 6303} {"train_loss": -27.647573471069336, "global_step": 523230, "epoch": 6303} {"train_loss": -27.48113135831902, "global_step": 523231, "epoch": 6303, "val_loss": 6515277.0} {"train_loss": -26.993722915649414, "global_step": 523232, "epoch": 6304} {"train_loss": -26.831884384155273, "global_step": 523233, "epoch": 6304} {"train_loss": -27.64533805847168, "global_step": 523234, "epoch": 6304} {"train_loss": -27.014911651611328, "global_step": 523235, "epoch": 6304} {"train_loss": -27.93622398376465, "global_step": 523236, "epoch": 6304} {"train_loss": -27.21339225769043, "global_step": 523237, "epoch": 6304} {"train_loss": -27.182788848876953, "global_step": 523238, "epoch": 6304} {"train_loss": -27.328664779663086, "global_step": 523239, "epoch": 6304} {"train_loss": -26.967376708984375, "global_step": 523240, "epoch": 6304} {"train_loss": -27.636926651000977, "global_step": 523241, "epoch": 6304} {"train_loss": -27.29213523864746, "global_step": 523242, "epoch": 6304} {"train_loss": -27.070417404174805, "global_step": 523243, "epoch": 6304} {"train_loss": -26.955427169799805, "global_step": 523244, "epoch": 6304} {"train_loss": -27.477935791015625, "global_step": 523245, "epoch": 6304} {"train_loss": -27.19122886657715, "global_step": 523246, "epoch": 6304} {"train_loss": -27.451505661010742, "global_step": 523247, "epoch": 6304} {"train_loss": -27.460996627807617, "global_step": 523248, "epoch": 6304} {"train_loss": -27.311920166015625, "global_step": 523249, "epoch": 6304} {"train_loss": -26.974103927612305, "global_step": 523250, "epoch": 6304} {"train_loss": -27.21417808532715, "global_step": 523251, "epoch": 6304} {"train_loss": -27.63544273376465, "global_step": 523252, "epoch": 6304} {"train_loss": -27.39348793029785, "global_step": 523253, "epoch": 6304} {"train_loss": -27.224945068359375, "global_step": 523254, "epoch": 6304} {"train_loss": -27.896265029907227, "global_step": 523255, "epoch": 6304} {"train_loss": -27.168533325195312, "global_step": 523256, "epoch": 6304} {"train_loss": -27.199975967407227, "global_step": 523257, "epoch": 6304} {"train_loss": -27.140939712524414, "global_step": 523258, "epoch": 6304} {"train_loss": -27.106348037719727, "global_step": 523259, "epoch": 6304} {"train_loss": -27.1873722076416, "global_step": 523260, "epoch": 6304} {"train_loss": -26.939685821533203, "global_step": 523261, "epoch": 6304} {"train_loss": -27.48773765563965, "global_step": 523262, "epoch": 6304} {"train_loss": -27.53964614868164, "global_step": 523263, "epoch": 6304} {"train_loss": -27.05428123474121, "global_step": 523264, "epoch": 6304} {"train_loss": -27.486963272094727, "global_step": 523265, "epoch": 6304} {"train_loss": -27.539093017578125, "global_step": 523266, "epoch": 6304} {"train_loss": -27.230905532836914, "global_step": 523267, "epoch": 6304} {"train_loss": -27.74588966369629, "global_step": 523268, "epoch": 6304} {"train_loss": -27.612329483032227, "global_step": 523269, "epoch": 6304} {"train_loss": -27.36627197265625, "global_step": 523270, "epoch": 6304} {"train_loss": -27.328107833862305, "global_step": 523271, "epoch": 6304} {"train_loss": -27.190765380859375, "global_step": 523272, "epoch": 6304} {"train_loss": -27.577905654907227, "global_step": 523273, "epoch": 6304} {"train_loss": -27.7236270904541, "global_step": 523274, "epoch": 6304} {"train_loss": -27.385284423828125, "global_step": 523275, "epoch": 6304} {"train_loss": -27.39930534362793, "global_step": 523276, "epoch": 6304} {"train_loss": -27.7999267578125, "global_step": 523277, "epoch": 6304} {"train_loss": -27.44282341003418, "global_step": 523278, "epoch": 6304} {"train_loss": -27.20362663269043, "global_step": 523279, "epoch": 6304} {"train_loss": -27.70415687561035, "global_step": 523280, "epoch": 6304} {"train_loss": -27.381317138671875, "global_step": 523281, "epoch": 6304} {"train_loss": -27.626264572143555, "global_step": 523282, "epoch": 6304} {"train_loss": -27.859281539916992, "global_step": 523283, "epoch": 6304} {"train_loss": -27.350927352905273, "global_step": 523284, "epoch": 6304} {"train_loss": -27.784345626831055, "global_step": 523285, "epoch": 6304} {"train_loss": -27.41485595703125, "global_step": 523286, "epoch": 6304} {"train_loss": -27.841144561767578, "global_step": 523287, "epoch": 6304} {"train_loss": -28.09547233581543, "global_step": 523288, "epoch": 6304} {"train_loss": -27.45891761779785, "global_step": 523289, "epoch": 6304} {"train_loss": -27.50836181640625, "global_step": 523290, "epoch": 6304} {"train_loss": -27.52924156188965, "global_step": 523291, "epoch": 6304} {"train_loss": -27.576257705688477, "global_step": 523292, "epoch": 6304} {"train_loss": -27.43916130065918, "global_step": 523293, "epoch": 6304} {"train_loss": -27.197845458984375, "global_step": 523294, "epoch": 6304} {"train_loss": -26.35284423828125, "global_step": 523295, "epoch": 6304} {"train_loss": -25.729785919189453, "global_step": 523296, "epoch": 6304} {"train_loss": -25.593460083007812, "global_step": 523297, "epoch": 6304} {"train_loss": -27.452194213867188, "global_step": 523298, "epoch": 6304} {"train_loss": -27.09248924255371, "global_step": 523299, "epoch": 6304} {"train_loss": -27.352497100830078, "global_step": 523300, "epoch": 6304} {"train_loss": -27.518146514892578, "global_step": 523301, "epoch": 6304} {"train_loss": -27.411828994750977, "global_step": 523302, "epoch": 6304} {"train_loss": -27.274152755737305, "global_step": 523303, "epoch": 6304} {"train_loss": -27.122079849243164, "global_step": 523304, "epoch": 6304} {"train_loss": -27.640405654907227, "global_step": 523305, "epoch": 6304} {"train_loss": -27.2993106842041, "global_step": 523306, "epoch": 6304} {"train_loss": -27.29082679748535, "global_step": 523307, "epoch": 6304} {"train_loss": -27.27520751953125, "global_step": 523308, "epoch": 6304} {"train_loss": -27.6104793548584, "global_step": 523309, "epoch": 6304} {"train_loss": -27.49732780456543, "global_step": 523310, "epoch": 6304} {"train_loss": -27.689666748046875, "global_step": 523311, "epoch": 6304} {"train_loss": -27.776565551757812, "global_step": 523312, "epoch": 6304} {"train_loss": -27.418502807617188, "global_step": 523313, "epoch": 6304} {"train_loss": -27.338764305574347, "global_step": 523314, "epoch": 6304, "val_loss": 6605641.0} {"train_loss": -26.482812881469727, "global_step": 523315, "epoch": 6305} {"train_loss": -27.462451934814453, "global_step": 523316, "epoch": 6305} {"train_loss": -27.042652130126953, "global_step": 523317, "epoch": 6305} {"train_loss": -27.109418869018555, "global_step": 523318, "epoch": 6305} {"train_loss": -27.047544479370117, "global_step": 523319, "epoch": 6305} {"train_loss": -27.39851951599121, "global_step": 523320, "epoch": 6305} {"train_loss": -27.126249313354492, "global_step": 523321, "epoch": 6305} {"train_loss": -26.642019271850586, "global_step": 523322, "epoch": 6305} {"train_loss": -27.382436752319336, "global_step": 523323, "epoch": 6305} {"train_loss": -26.9186954498291, "global_step": 523324, "epoch": 6305} {"train_loss": -27.090625762939453, "global_step": 523325, "epoch": 6305} {"train_loss": -27.748310089111328, "global_step": 523326, "epoch": 6305} {"train_loss": -27.361648559570312, "global_step": 523327, "epoch": 6305} {"train_loss": -27.33843994140625, "global_step": 523328, "epoch": 6305} {"train_loss": -27.365890502929688, "global_step": 523329, "epoch": 6305} {"train_loss": -27.24847984313965, "global_step": 523330, "epoch": 6305} {"train_loss": -27.451343536376953, "global_step": 523331, "epoch": 6305} {"train_loss": -27.088781356811523, "global_step": 523332, "epoch": 6305} {"train_loss": -27.45037841796875, "global_step": 523333, "epoch": 6305} {"train_loss": -27.60146141052246, "global_step": 523334, "epoch": 6305} {"train_loss": -27.483779907226562, "global_step": 523335, "epoch": 6305} {"train_loss": -27.444244384765625, "global_step": 523336, "epoch": 6305} {"train_loss": -27.34053611755371, "global_step": 523337, "epoch": 6305} {"train_loss": -27.305179595947266, "global_step": 523338, "epoch": 6305} {"train_loss": -27.343183517456055, "global_step": 523339, "epoch": 6305} {"train_loss": -27.54323387145996, "global_step": 523340, "epoch": 6305} {"train_loss": -27.600788116455078, "global_step": 523341, "epoch": 6305} {"train_loss": -27.330291748046875, "global_step": 523342, "epoch": 6305} {"train_loss": -27.59869956970215, "global_step": 523343, "epoch": 6305} {"train_loss": -27.830352783203125, "global_step": 523344, "epoch": 6305} {"train_loss": -27.51460075378418, "global_step": 523345, "epoch": 6305} {"train_loss": -27.38888931274414, "global_step": 523346, "epoch": 6305} {"train_loss": -27.474573135375977, "global_step": 523347, "epoch": 6305} {"train_loss": -27.447568893432617, "global_step": 523348, "epoch": 6305} {"train_loss": -27.751739501953125, "global_step": 523349, "epoch": 6305} {"train_loss": -28.059967041015625, "global_step": 523350, "epoch": 6305} {"train_loss": -27.2841854095459, "global_step": 523351, "epoch": 6305} {"train_loss": -27.651538848876953, "global_step": 523352, "epoch": 6305} {"train_loss": -27.346790313720703, "global_step": 523353, "epoch": 6305} {"train_loss": -27.877363204956055, "global_step": 523354, "epoch": 6305} {"train_loss": -27.575183868408203, "global_step": 523355, "epoch": 6305} {"train_loss": -27.6258544921875, "global_step": 523356, "epoch": 6305} {"train_loss": -28.262720108032227, "global_step": 523357, "epoch": 6305} {"train_loss": -27.479450225830078, "global_step": 523358, "epoch": 6305} {"train_loss": -27.8389949798584, "global_step": 523359, "epoch": 6305} {"train_loss": -27.629104614257812, "global_step": 523360, "epoch": 6305} {"train_loss": -27.537118911743164, "global_step": 523361, "epoch": 6305} {"train_loss": -27.51484489440918, "global_step": 523362, "epoch": 6305} {"train_loss": -27.834354400634766, "global_step": 523363, "epoch": 6305} {"train_loss": -28.062482833862305, "global_step": 523364, "epoch": 6305} {"train_loss": -27.268096923828125, "global_step": 523365, "epoch": 6305} {"train_loss": -27.3348445892334, "global_step": 523366, "epoch": 6305} {"train_loss": -27.302576065063477, "global_step": 523367, "epoch": 6305} {"train_loss": -27.482206344604492, "global_step": 523368, "epoch": 6305} {"train_loss": -27.609357833862305, "global_step": 523369, "epoch": 6305} {"train_loss": -27.50715446472168, "global_step": 523370, "epoch": 6305} {"train_loss": -27.457120895385742, "global_step": 523371, "epoch": 6305} {"train_loss": -27.87839126586914, "global_step": 523372, "epoch": 6305} {"train_loss": -27.820606231689453, "global_step": 523373, "epoch": 6305} {"train_loss": -27.8251895904541, "global_step": 523374, "epoch": 6305} {"train_loss": -27.663843154907227, "global_step": 523375, "epoch": 6305} {"train_loss": -27.612659454345703, "global_step": 523376, "epoch": 6305} {"train_loss": -27.5358943939209, "global_step": 523377, "epoch": 6305} {"train_loss": -27.369184494018555, "global_step": 523378, "epoch": 6305} {"train_loss": -27.336034774780273, "global_step": 523379, "epoch": 6305} {"train_loss": -27.85080909729004, "global_step": 523380, "epoch": 6305} {"train_loss": -27.63370132446289, "global_step": 523381, "epoch": 6305} {"train_loss": -27.279499053955078, "global_step": 523382, "epoch": 6305} {"train_loss": -27.461456298828125, "global_step": 523383, "epoch": 6305} {"train_loss": -27.269742965698242, "global_step": 523384, "epoch": 6305} {"train_loss": -27.246673583984375, "global_step": 523385, "epoch": 6305} {"train_loss": -27.55571937561035, "global_step": 523386, "epoch": 6305} {"train_loss": -27.46613121032715, "global_step": 523387, "epoch": 6305} {"train_loss": -27.500701904296875, "global_step": 523388, "epoch": 6305} {"train_loss": -27.538013458251953, "global_step": 523389, "epoch": 6305} {"train_loss": -27.549036026000977, "global_step": 523390, "epoch": 6305} {"train_loss": -27.6022891998291, "global_step": 523391, "epoch": 6305} {"train_loss": -27.3250732421875, "global_step": 523392, "epoch": 6305} {"train_loss": -27.264175415039062, "global_step": 523393, "epoch": 6305} {"train_loss": -27.410602569580078, "global_step": 523394, "epoch": 6305} {"train_loss": -27.392026901245117, "global_step": 523395, "epoch": 6305} {"train_loss": -27.25794792175293, "global_step": 523396, "epoch": 6305} {"train_loss": -27.485860870545167, "global_step": 523397, "epoch": 6305, "val_loss": 6467258.0} {"train_loss": -26.453292846679688, "global_step": 523398, "epoch": 6306} {"train_loss": -26.58368492126465, "global_step": 523399, "epoch": 6306} {"train_loss": -27.03797721862793, "global_step": 523400, "epoch": 6306} {"train_loss": -26.0169677734375, "global_step": 523401, "epoch": 6306} {"train_loss": -26.710189819335938, "global_step": 523402, "epoch": 6306} {"train_loss": -26.601917266845703, "global_step": 523403, "epoch": 6306} {"train_loss": -26.710363388061523, "global_step": 523404, "epoch": 6306} {"train_loss": -27.131628036499023, "global_step": 523405, "epoch": 6306} {"train_loss": -26.700971603393555, "global_step": 523406, "epoch": 6306} {"train_loss": -27.349136352539062, "global_step": 523407, "epoch": 6306} {"train_loss": -26.820465087890625, "global_step": 523408, "epoch": 6306} {"train_loss": -26.955419540405273, "global_step": 523409, "epoch": 6306} {"train_loss": -26.65370750427246, "global_step": 523410, "epoch": 6306} {"train_loss": -27.122161865234375, "global_step": 523411, "epoch": 6306} {"train_loss": -26.696226119995117, "global_step": 523412, "epoch": 6306} {"train_loss": -27.151004791259766, "global_step": 523413, "epoch": 6306} {"train_loss": -27.292043685913086, "global_step": 523414, "epoch": 6306} {"train_loss": -26.9218692779541, "global_step": 523415, "epoch": 6306} {"train_loss": -27.06690788269043, "global_step": 523416, "epoch": 6306} {"train_loss": -26.924036026000977, "global_step": 523417, "epoch": 6306} {"train_loss": -27.3598575592041, "global_step": 523418, "epoch": 6306} {"train_loss": -27.11321449279785, "global_step": 523419, "epoch": 6306} {"train_loss": -27.337629318237305, "global_step": 523420, "epoch": 6306} {"train_loss": -27.201129913330078, "global_step": 523421, "epoch": 6306} {"train_loss": -27.35609245300293, "global_step": 523422, "epoch": 6306} {"train_loss": -27.078369140625, "global_step": 523423, "epoch": 6306} {"train_loss": -27.108423233032227, "global_step": 523424, "epoch": 6306} {"train_loss": -27.562824249267578, "global_step": 523425, "epoch": 6306} {"train_loss": -27.251882553100586, "global_step": 523426, "epoch": 6306} {"train_loss": -27.782190322875977, "global_step": 523427, "epoch": 6306} {"train_loss": -27.380155563354492, "global_step": 523428, "epoch": 6306} {"train_loss": -27.371631622314453, "global_step": 523429, "epoch": 6306} {"train_loss": -27.4254207611084, "global_step": 523430, "epoch": 6306} {"train_loss": -27.85205078125, "global_step": 523431, "epoch": 6306} {"train_loss": -27.112232208251953, "global_step": 523432, "epoch": 6306} {"train_loss": -27.192026138305664, "global_step": 523433, "epoch": 6306} {"train_loss": -27.770254135131836, "global_step": 523434, "epoch": 6306} {"train_loss": -27.331064224243164, "global_step": 523435, "epoch": 6306} {"train_loss": -27.938766479492188, "global_step": 523436, "epoch": 6306} {"train_loss": -27.197738647460938, "global_step": 523437, "epoch": 6306} {"train_loss": -27.4671573638916, "global_step": 523438, "epoch": 6306} {"train_loss": -27.08405113220215, "global_step": 523439, "epoch": 6306} {"train_loss": -27.404510498046875, "global_step": 523440, "epoch": 6306} {"train_loss": -27.028335571289062, "global_step": 523441, "epoch": 6306} {"train_loss": -26.499267578125, "global_step": 523442, "epoch": 6306} {"train_loss": -27.24905776977539, "global_step": 523443, "epoch": 6306} {"train_loss": -27.697540283203125, "global_step": 523444, "epoch": 6306} {"train_loss": -27.053380966186523, "global_step": 523445, "epoch": 6306} {"train_loss": -27.34088134765625, "global_step": 523446, "epoch": 6306} {"train_loss": -27.832971572875977, "global_step": 523447, "epoch": 6306} {"train_loss": -27.243209838867188, "global_step": 523448, "epoch": 6306} {"train_loss": -27.486841201782227, "global_step": 523449, "epoch": 6306} {"train_loss": -27.2646427154541, "global_step": 523450, "epoch": 6306} {"train_loss": -27.7562255859375, "global_step": 523451, "epoch": 6306} {"train_loss": -27.63693618774414, "global_step": 523452, "epoch": 6306} {"train_loss": -27.631391525268555, "global_step": 523453, "epoch": 6306} {"train_loss": -27.638717651367188, "global_step": 523454, "epoch": 6306} {"train_loss": -27.68001365661621, "global_step": 523455, "epoch": 6306} {"train_loss": -27.954395294189453, "global_step": 523456, "epoch": 6306} {"train_loss": -27.753311157226562, "global_step": 523457, "epoch": 6306} {"train_loss": -27.814544677734375, "global_step": 523458, "epoch": 6306} {"train_loss": -27.46564292907715, "global_step": 523459, "epoch": 6306} {"train_loss": -27.748361587524414, "global_step": 523460, "epoch": 6306} {"train_loss": -27.986791610717773, "global_step": 523461, "epoch": 6306} {"train_loss": -27.48079490661621, "global_step": 523462, "epoch": 6306} {"train_loss": -27.717269897460938, "global_step": 523463, "epoch": 6306} {"train_loss": -27.491165161132812, "global_step": 523464, "epoch": 6306} {"train_loss": -27.6185359954834, "global_step": 523465, "epoch": 6306} {"train_loss": -27.49796485900879, "global_step": 523466, "epoch": 6306} {"train_loss": -27.59541130065918, "global_step": 523467, "epoch": 6306} {"train_loss": -27.520893096923828, "global_step": 523468, "epoch": 6306} {"train_loss": -27.458271026611328, "global_step": 523469, "epoch": 6306} {"train_loss": -27.3607177734375, "global_step": 523470, "epoch": 6306} {"train_loss": -27.430646896362305, "global_step": 523471, "epoch": 6306} {"train_loss": -27.72491455078125, "global_step": 523472, "epoch": 6306} {"train_loss": -27.878080368041992, "global_step": 523473, "epoch": 6306} {"train_loss": -27.106042861938477, "global_step": 523474, "epoch": 6306} {"train_loss": -26.7047176361084, "global_step": 523475, "epoch": 6306} {"train_loss": -26.59889793395996, "global_step": 523476, "epoch": 6306} {"train_loss": -27.114215850830078, "global_step": 523477, "epoch": 6306} {"train_loss": -27.66167640686035, "global_step": 523478, "epoch": 6306} {"train_loss": -26.959476470947266, "global_step": 523479, "epoch": 6306} {"train_loss": -27.286264534456183, "global_step": 523480, "epoch": 6306, "val_loss": 6422842.0} {"train_loss": -26.019107818603516, "global_step": 523481, "epoch": 6307} {"train_loss": -26.496139526367188, "global_step": 523482, "epoch": 6307} {"train_loss": -26.017749786376953, "global_step": 523483, "epoch": 6307} {"train_loss": -26.24369239807129, "global_step": 523484, "epoch": 6307} {"train_loss": -26.135425567626953, "global_step": 523485, "epoch": 6307} {"train_loss": -26.577747344970703, "global_step": 523486, "epoch": 6307} {"train_loss": -26.538665771484375, "global_step": 523487, "epoch": 6307} {"train_loss": -26.5396671295166, "global_step": 523488, "epoch": 6307} {"train_loss": -26.6251220703125, "global_step": 523489, "epoch": 6307} {"train_loss": -26.59116554260254, "global_step": 523490, "epoch": 6307} {"train_loss": -26.72487449645996, "global_step": 523491, "epoch": 6307} {"train_loss": -26.66070556640625, "global_step": 523492, "epoch": 6307} {"train_loss": -26.599267959594727, "global_step": 523493, "epoch": 6307} {"train_loss": -27.122751235961914, "global_step": 523494, "epoch": 6307} {"train_loss": -26.875324249267578, "global_step": 523495, "epoch": 6307} {"train_loss": -26.50959587097168, "global_step": 523496, "epoch": 6307} {"train_loss": -26.8577938079834, "global_step": 523497, "epoch": 6307} {"train_loss": -26.982715606689453, "global_step": 523498, "epoch": 6307} {"train_loss": -26.584095001220703, "global_step": 523499, "epoch": 6307} {"train_loss": -27.106237411499023, "global_step": 523500, "epoch": 6307} {"train_loss": -26.81171989440918, "global_step": 523501, "epoch": 6307} {"train_loss": -27.257970809936523, "global_step": 523502, "epoch": 6307} {"train_loss": -27.098896026611328, "global_step": 523503, "epoch": 6307} {"train_loss": -27.253311157226562, "global_step": 523504, "epoch": 6307} {"train_loss": -27.037626266479492, "global_step": 523505, "epoch": 6307} {"train_loss": -26.811084747314453, "global_step": 523506, "epoch": 6307} {"train_loss": -27.337671279907227, "global_step": 523507, "epoch": 6307} {"train_loss": -27.008289337158203, "global_step": 523508, "epoch": 6307} {"train_loss": -27.130338668823242, "global_step": 523509, "epoch": 6307} {"train_loss": -27.32097816467285, "global_step": 523510, "epoch": 6307} {"train_loss": -27.545623779296875, "global_step": 523511, "epoch": 6307} {"train_loss": -26.99302101135254, "global_step": 523512, "epoch": 6307} {"train_loss": -27.21052360534668, "global_step": 523513, "epoch": 6307} {"train_loss": -27.243667602539062, "global_step": 523514, "epoch": 6307} {"train_loss": -27.21064567565918, "global_step": 523515, "epoch": 6307} {"train_loss": -27.5476016998291, "global_step": 523516, "epoch": 6307} {"train_loss": -27.515737533569336, "global_step": 523517, "epoch": 6307} {"train_loss": -27.391132354736328, "global_step": 523518, "epoch": 6307} {"train_loss": -27.349044799804688, "global_step": 523519, "epoch": 6307} {"train_loss": -27.21896743774414, "global_step": 523520, "epoch": 6307} {"train_loss": -27.512073516845703, "global_step": 523521, "epoch": 6307} {"train_loss": -27.74831199645996, "global_step": 523522, "epoch": 6307} {"train_loss": -27.4720516204834, "global_step": 523523, "epoch": 6307} {"train_loss": -27.52131462097168, "global_step": 523524, "epoch": 6307} {"train_loss": -27.8321475982666, "global_step": 523525, "epoch": 6307} {"train_loss": -27.9278507232666, "global_step": 523526, "epoch": 6307} {"train_loss": -27.7548885345459, "global_step": 523527, "epoch": 6307} {"train_loss": -27.7696533203125, "global_step": 523528, "epoch": 6307} {"train_loss": -27.54071044921875, "global_step": 523529, "epoch": 6307} {"train_loss": -28.08717155456543, "global_step": 523530, "epoch": 6307} {"train_loss": -27.674421310424805, "global_step": 523531, "epoch": 6307} {"train_loss": -27.581689834594727, "global_step": 523532, "epoch": 6307} {"train_loss": -27.650482177734375, "global_step": 523533, "epoch": 6307} {"train_loss": -27.705215454101562, "global_step": 523534, "epoch": 6307} {"train_loss": -27.916345596313477, "global_step": 523535, "epoch": 6307} {"train_loss": -27.866140365600586, "global_step": 523536, "epoch": 6307} {"train_loss": -27.787710189819336, "global_step": 523537, "epoch": 6307} {"train_loss": -27.677011489868164, "global_step": 523538, "epoch": 6307} {"train_loss": -27.715646743774414, "global_step": 523539, "epoch": 6307} {"train_loss": -27.81241798400879, "global_step": 523540, "epoch": 6307} {"train_loss": -28.158483505249023, "global_step": 523541, "epoch": 6307} {"train_loss": -27.97580909729004, "global_step": 523542, "epoch": 6307} {"train_loss": -27.768274307250977, "global_step": 523543, "epoch": 6307} {"train_loss": -27.83978271484375, "global_step": 523544, "epoch": 6307} {"train_loss": -27.496747970581055, "global_step": 523545, "epoch": 6307} {"train_loss": -27.60780143737793, "global_step": 523546, "epoch": 6307} {"train_loss": -27.015172958374023, "global_step": 523547, "epoch": 6307} {"train_loss": -25.604721069335938, "global_step": 523548, "epoch": 6307} {"train_loss": -24.477191925048828, "global_step": 523549, "epoch": 6307} {"train_loss": -26.645843505859375, "global_step": 523550, "epoch": 6307} {"train_loss": -27.129318237304688, "global_step": 523551, "epoch": 6307} {"train_loss": -26.87628173828125, "global_step": 523552, "epoch": 6307} {"train_loss": -26.995786666870117, "global_step": 523553, "epoch": 6307} {"train_loss": -26.696943283081055, "global_step": 523554, "epoch": 6307} {"train_loss": -27.013843536376953, "global_step": 523555, "epoch": 6307} {"train_loss": -27.239667892456055, "global_step": 523556, "epoch": 6307} {"train_loss": -27.24587059020996, "global_step": 523557, "epoch": 6307} {"train_loss": -27.391977310180664, "global_step": 523558, "epoch": 6307} {"train_loss": -27.22821044921875, "global_step": 523559, "epoch": 6307} {"train_loss": -27.392255783081055, "global_step": 523560, "epoch": 6307} {"train_loss": -27.18263053894043, "global_step": 523561, "epoch": 6307} {"train_loss": -27.23482322692871, "global_step": 523562, "epoch": 6307} {"train_loss": -27.175123421542615, "global_step": 523563, "epoch": 6307, "val_loss": 6655543.0} {"train_loss": -26.534687042236328, "global_step": 523564, "epoch": 6308} {"train_loss": -27.05860710144043, "global_step": 523565, "epoch": 6308} {"train_loss": -27.04059410095215, "global_step": 523566, "epoch": 6308} {"train_loss": -26.796649932861328, "global_step": 523567, "epoch": 6308} {"train_loss": -26.79254722595215, "global_step": 523568, "epoch": 6308} {"train_loss": -26.962738037109375, "global_step": 523569, "epoch": 6308} {"train_loss": -27.062591552734375, "global_step": 523570, "epoch": 6308} {"train_loss": -26.947479248046875, "global_step": 523571, "epoch": 6308} {"train_loss": -27.195178985595703, "global_step": 523572, "epoch": 6308} {"train_loss": -26.905527114868164, "global_step": 523573, "epoch": 6308} {"train_loss": -27.527557373046875, "global_step": 523574, "epoch": 6308} {"train_loss": -26.999475479125977, "global_step": 523575, "epoch": 6308} {"train_loss": -27.3073673248291, "global_step": 523576, "epoch": 6308} {"train_loss": -27.0387020111084, "global_step": 523577, "epoch": 6308} {"train_loss": -27.13620948791504, "global_step": 523578, "epoch": 6308} {"train_loss": -27.3118896484375, "global_step": 523579, "epoch": 6308} {"train_loss": -27.240148544311523, "global_step": 523580, "epoch": 6308} {"train_loss": -27.82232666015625, "global_step": 523581, "epoch": 6308} {"train_loss": -27.170873641967773, "global_step": 523582, "epoch": 6308} {"train_loss": -27.528766632080078, "global_step": 523583, "epoch": 6308} {"train_loss": -27.491870880126953, "global_step": 523584, "epoch": 6308} {"train_loss": -27.909238815307617, "global_step": 523585, "epoch": 6308} {"train_loss": -27.498401641845703, "global_step": 523586, "epoch": 6308} {"train_loss": -27.202966690063477, "global_step": 523587, "epoch": 6308} {"train_loss": -27.57611083984375, "global_step": 523588, "epoch": 6308} {"train_loss": -27.145709991455078, "global_step": 523589, "epoch": 6308} {"train_loss": -27.350311279296875, "global_step": 523590, "epoch": 6308} {"train_loss": -27.538196563720703, "global_step": 523591, "epoch": 6308} {"train_loss": -27.62892723083496, "global_step": 523592, "epoch": 6308} {"train_loss": -27.5356388092041, "global_step": 523593, "epoch": 6308} {"train_loss": -27.63498306274414, "global_step": 523594, "epoch": 6308} {"train_loss": -27.506195068359375, "global_step": 523595, "epoch": 6308} {"train_loss": -27.363332748413086, "global_step": 523596, "epoch": 6308} {"train_loss": -27.421533584594727, "global_step": 523597, "epoch": 6308} {"train_loss": -27.66912269592285, "global_step": 523598, "epoch": 6308} {"train_loss": -27.539098739624023, "global_step": 523599, "epoch": 6308} {"train_loss": -27.85284996032715, "global_step": 523600, "epoch": 6308} {"train_loss": -27.702234268188477, "global_step": 523601, "epoch": 6308} {"train_loss": -27.92987632751465, "global_step": 523602, "epoch": 6308} {"train_loss": -28.007171630859375, "global_step": 523603, "epoch": 6308} {"train_loss": -27.262344360351562, "global_step": 523604, "epoch": 6308} {"train_loss": -28.220102310180664, "global_step": 523605, "epoch": 6308} {"train_loss": -27.490808486938477, "global_step": 523606, "epoch": 6308} {"train_loss": -27.59187126159668, "global_step": 523607, "epoch": 6308} {"train_loss": -27.633703231811523, "global_step": 523608, "epoch": 6308} {"train_loss": -27.404682159423828, "global_step": 523609, "epoch": 6308} {"train_loss": -27.8038272857666, "global_step": 523610, "epoch": 6308} {"train_loss": -27.81473159790039, "global_step": 523611, "epoch": 6308} {"train_loss": -27.669208526611328, "global_step": 523612, "epoch": 6308} {"train_loss": -27.33087730407715, "global_step": 523613, "epoch": 6308} {"train_loss": -27.58281898498535, "global_step": 523614, "epoch": 6308} {"train_loss": -27.92620849609375, "global_step": 523615, "epoch": 6308} {"train_loss": -27.441755294799805, "global_step": 523616, "epoch": 6308} {"train_loss": -27.721973419189453, "global_step": 523617, "epoch": 6308} {"train_loss": -27.332056045532227, "global_step": 523618, "epoch": 6308} {"train_loss": -27.533361434936523, "global_step": 523619, "epoch": 6308} {"train_loss": -27.3325138092041, "global_step": 523620, "epoch": 6308} {"train_loss": -27.6999568939209, "global_step": 523621, "epoch": 6308} {"train_loss": -27.670984268188477, "global_step": 523622, "epoch": 6308} {"train_loss": -27.842687606811523, "global_step": 523623, "epoch": 6308} {"train_loss": -27.623743057250977, "global_step": 523624, "epoch": 6308} {"train_loss": -27.44770622253418, "global_step": 523625, "epoch": 6308} {"train_loss": -27.59669303894043, "global_step": 523626, "epoch": 6308} {"train_loss": -27.469263076782227, "global_step": 523627, "epoch": 6308} {"train_loss": -27.4558162689209, "global_step": 523628, "epoch": 6308} {"train_loss": -27.786422729492188, "global_step": 523629, "epoch": 6308} {"train_loss": -27.636438369750977, "global_step": 523630, "epoch": 6308} {"train_loss": -27.58221435546875, "global_step": 523631, "epoch": 6308} {"train_loss": -27.834379196166992, "global_step": 523632, "epoch": 6308} {"train_loss": -27.930633544921875, "global_step": 523633, "epoch": 6308} {"train_loss": -27.53974723815918, "global_step": 523634, "epoch": 6308} {"train_loss": -27.652063369750977, "global_step": 523635, "epoch": 6308} {"train_loss": -27.48768424987793, "global_step": 523636, "epoch": 6308} {"train_loss": -28.011581420898438, "global_step": 523637, "epoch": 6308} {"train_loss": -27.664236068725586, "global_step": 523638, "epoch": 6308} {"train_loss": -27.406827926635742, "global_step": 523639, "epoch": 6308} {"train_loss": -27.532678604125977, "global_step": 523640, "epoch": 6308} {"train_loss": -27.916488647460938, "global_step": 523641, "epoch": 6308} {"train_loss": -27.726980209350586, "global_step": 523642, "epoch": 6308} {"train_loss": -27.542800903320312, "global_step": 523643, "epoch": 6308} {"train_loss": -27.759296417236328, "global_step": 523644, "epoch": 6308} {"train_loss": -27.93575096130371, "global_step": 523645, "epoch": 6308} {"train_loss": -27.50028490732951, "global_step": 523646, "epoch": 6308, "val_loss": 6636171.0} {"train_loss": -26.195783615112305, "global_step": 523647, "epoch": 6309} {"train_loss": -25.71575927734375, "global_step": 523648, "epoch": 6309} {"train_loss": -26.235462188720703, "global_step": 523649, "epoch": 6309} {"train_loss": -26.22718620300293, "global_step": 523650, "epoch": 6309} {"train_loss": -26.288360595703125, "global_step": 523651, "epoch": 6309} {"train_loss": -26.24049949645996, "global_step": 523652, "epoch": 6309} {"train_loss": -25.349702835083008, "global_step": 523653, "epoch": 6309} {"train_loss": -26.152801513671875, "global_step": 523654, "epoch": 6309} {"train_loss": -26.538862228393555, "global_step": 523655, "epoch": 6309} {"train_loss": -26.443140029907227, "global_step": 523656, "epoch": 6309} {"train_loss": -26.26045036315918, "global_step": 523657, "epoch": 6309} {"train_loss": -26.811695098876953, "global_step": 523658, "epoch": 6309} {"train_loss": -26.576129913330078, "global_step": 523659, "epoch": 6309} {"train_loss": -26.68385124206543, "global_step": 523660, "epoch": 6309} {"train_loss": -26.59925651550293, "global_step": 523661, "epoch": 6309} {"train_loss": -26.22346305847168, "global_step": 523662, "epoch": 6309} {"train_loss": -27.05768394470215, "global_step": 523663, "epoch": 6309} {"train_loss": -26.36174964904785, "global_step": 523664, "epoch": 6309} {"train_loss": -27.065954208374023, "global_step": 523665, "epoch": 6309} {"train_loss": -26.98676109313965, "global_step": 523666, "epoch": 6309} {"train_loss": -26.290679931640625, "global_step": 523667, "epoch": 6309} {"train_loss": -27.288497924804688, "global_step": 523668, "epoch": 6309} {"train_loss": -26.614770889282227, "global_step": 523669, "epoch": 6309} {"train_loss": -27.240848541259766, "global_step": 523670, "epoch": 6309} {"train_loss": -26.59858512878418, "global_step": 523671, "epoch": 6309} {"train_loss": -27.370147705078125, "global_step": 523672, "epoch": 6309} {"train_loss": -27.082056045532227, "global_step": 523673, "epoch": 6309} {"train_loss": -26.923847198486328, "global_step": 523674, "epoch": 6309} {"train_loss": -27.061948776245117, "global_step": 523675, "epoch": 6309} {"train_loss": -26.874792098999023, "global_step": 523676, "epoch": 6309} {"train_loss": -27.244482040405273, "global_step": 523677, "epoch": 6309} {"train_loss": -27.1990966796875, "global_step": 523678, "epoch": 6309} {"train_loss": -27.372821807861328, "global_step": 523679, "epoch": 6309} {"train_loss": -26.959308624267578, "global_step": 523680, "epoch": 6309} {"train_loss": -27.094501495361328, "global_step": 523681, "epoch": 6309} {"train_loss": -27.3660888671875, "global_step": 523682, "epoch": 6309} {"train_loss": -27.169931411743164, "global_step": 523683, "epoch": 6309} {"train_loss": -27.67266273498535, "global_step": 523684, "epoch": 6309} {"train_loss": -27.34201431274414, "global_step": 523685, "epoch": 6309} {"train_loss": -27.1747989654541, "global_step": 523686, "epoch": 6309} {"train_loss": -27.015867233276367, "global_step": 523687, "epoch": 6309} {"train_loss": -27.563541412353516, "global_step": 523688, "epoch": 6309} {"train_loss": -27.872800827026367, "global_step": 523689, "epoch": 6309} {"train_loss": -27.26970863342285, "global_step": 523690, "epoch": 6309} {"train_loss": -27.379301071166992, "global_step": 523691, "epoch": 6309} {"train_loss": -27.361923217773438, "global_step": 523692, "epoch": 6309} {"train_loss": -27.7567195892334, "global_step": 523693, "epoch": 6309} {"train_loss": -27.39838218688965, "global_step": 523694, "epoch": 6309} {"train_loss": -27.633487701416016, "global_step": 523695, "epoch": 6309} {"train_loss": -27.13001823425293, "global_step": 523696, "epoch": 6309} {"train_loss": -27.404321670532227, "global_step": 523697, "epoch": 6309} {"train_loss": -27.636926651000977, "global_step": 523698, "epoch": 6309} {"train_loss": -27.622180938720703, "global_step": 523699, "epoch": 6309} {"train_loss": -27.523273468017578, "global_step": 523700, "epoch": 6309} {"train_loss": -27.447187423706055, "global_step": 523701, "epoch": 6309} {"train_loss": -27.877185821533203, "global_step": 523702, "epoch": 6309} {"train_loss": -27.902509689331055, "global_step": 523703, "epoch": 6309} {"train_loss": -27.627033233642578, "global_step": 523704, "epoch": 6309} {"train_loss": -27.307111740112305, "global_step": 523705, "epoch": 6309} {"train_loss": -27.62178611755371, "global_step": 523706, "epoch": 6309} {"train_loss": -27.820972442626953, "global_step": 523707, "epoch": 6309} {"train_loss": -27.550003051757812, "global_step": 523708, "epoch": 6309} {"train_loss": -27.516279220581055, "global_step": 523709, "epoch": 6309} {"train_loss": -27.577463150024414, "global_step": 523710, "epoch": 6309} {"train_loss": -28.04376220703125, "global_step": 523711, "epoch": 6309} {"train_loss": -27.631122589111328, "global_step": 523712, "epoch": 6309} {"train_loss": -27.36317253112793, "global_step": 523713, "epoch": 6309} {"train_loss": -27.4097843170166, "global_step": 523714, "epoch": 6309} {"train_loss": -27.689111709594727, "global_step": 523715, "epoch": 6309} {"train_loss": -27.627277374267578, "global_step": 523716, "epoch": 6309} {"train_loss": -27.779890060424805, "global_step": 523717, "epoch": 6309} {"train_loss": -27.729629516601562, "global_step": 523718, "epoch": 6309} {"train_loss": -27.543310165405273, "global_step": 523719, "epoch": 6309} {"train_loss": -27.879499435424805, "global_step": 523720, "epoch": 6309} {"train_loss": -27.58986473083496, "global_step": 523721, "epoch": 6309} {"train_loss": -27.644540786743164, "global_step": 523722, "epoch": 6309} {"train_loss": -27.949848175048828, "global_step": 523723, "epoch": 6309} {"train_loss": -27.439929962158203, "global_step": 523724, "epoch": 6309} {"train_loss": -27.966888427734375, "global_step": 523725, "epoch": 6309} {"train_loss": -27.468463897705078, "global_step": 523726, "epoch": 6309} {"train_loss": -27.8935489654541, "global_step": 523727, "epoch": 6309} {"train_loss": -27.378387451171875, "global_step": 523728, "epoch": 6309} {"train_loss": -27.165713666433312, "global_step": 523729, "epoch": 6309, "val_loss": 6630264.0} {"train_loss": -27.3051700592041, "global_step": 523730, "epoch": 6310} {"train_loss": -27.2829647064209, "global_step": 523731, "epoch": 6310} {"train_loss": -27.296369552612305, "global_step": 523732, "epoch": 6310} {"train_loss": -27.372961044311523, "global_step": 523733, "epoch": 6310} {"train_loss": -27.360309600830078, "global_step": 523734, "epoch": 6310} {"train_loss": -27.41171646118164, "global_step": 523735, "epoch": 6310} {"train_loss": -27.45292091369629, "global_step": 523736, "epoch": 6310} {"train_loss": -27.223560333251953, "global_step": 523737, "epoch": 6310} {"train_loss": -27.410314559936523, "global_step": 523738, "epoch": 6310} {"train_loss": -27.516605377197266, "global_step": 523739, "epoch": 6310} {"train_loss": -27.91102409362793, "global_step": 523740, "epoch": 6310} {"train_loss": -27.622150421142578, "global_step": 523741, "epoch": 6310} {"train_loss": -27.23489761352539, "global_step": 523742, "epoch": 6310} {"train_loss": -27.446069717407227, "global_step": 523743, "epoch": 6310} {"train_loss": -27.0648250579834, "global_step": 523744, "epoch": 6310} {"train_loss": -27.600727081298828, "global_step": 523745, "epoch": 6310} {"train_loss": -27.696664810180664, "global_step": 523746, "epoch": 6310} {"train_loss": -27.276981353759766, "global_step": 523747, "epoch": 6310} {"train_loss": -27.383447647094727, "global_step": 523748, "epoch": 6310} {"train_loss": -27.557767868041992, "global_step": 523749, "epoch": 6310} {"train_loss": -27.582721710205078, "global_step": 523750, "epoch": 6310} {"train_loss": -27.33436393737793, "global_step": 523751, "epoch": 6310} {"train_loss": -27.978261947631836, "global_step": 523752, "epoch": 6310} {"train_loss": -27.557540893554688, "global_step": 523753, "epoch": 6310} {"train_loss": -27.333328247070312, "global_step": 523754, "epoch": 6310} {"train_loss": -27.601276397705078, "global_step": 523755, "epoch": 6310} {"train_loss": -27.645557403564453, "global_step": 523756, "epoch": 6310} {"train_loss": -27.023771286010742, "global_step": 523757, "epoch": 6310} {"train_loss": -27.658905029296875, "global_step": 523758, "epoch": 6310} {"train_loss": -27.81207847595215, "global_step": 523759, "epoch": 6310} {"train_loss": -27.3756046295166, "global_step": 523760, "epoch": 6310} {"train_loss": -27.406463623046875, "global_step": 523761, "epoch": 6310} {"train_loss": -27.6811466217041, "global_step": 523762, "epoch": 6310} {"train_loss": -27.586353302001953, "global_step": 523763, "epoch": 6310} {"train_loss": -27.795642852783203, "global_step": 523764, "epoch": 6310} {"train_loss": -27.99114990234375, "global_step": 523765, "epoch": 6310} {"train_loss": -28.076963424682617, "global_step": 523766, "epoch": 6310} {"train_loss": -27.852096557617188, "global_step": 523767, "epoch": 6310} {"train_loss": -27.4676456451416, "global_step": 523768, "epoch": 6310} {"train_loss": -27.74104118347168, "global_step": 523769, "epoch": 6310} {"train_loss": -27.710159301757812, "global_step": 523770, "epoch": 6310} {"train_loss": -27.80634880065918, "global_step": 523771, "epoch": 6310} {"train_loss": -27.645532608032227, "global_step": 523772, "epoch": 6310} {"train_loss": -27.4184513092041, "global_step": 523773, "epoch": 6310} {"train_loss": -28.035459518432617, "global_step": 523774, "epoch": 6310} {"train_loss": -27.875473022460938, "global_step": 523775, "epoch": 6310} {"train_loss": -27.848840713500977, "global_step": 523776, "epoch": 6310} {"train_loss": -27.569177627563477, "global_step": 523777, "epoch": 6310} {"train_loss": -27.452245712280273, "global_step": 523778, "epoch": 6310} {"train_loss": -28.10249137878418, "global_step": 523779, "epoch": 6310} {"train_loss": -27.70660400390625, "global_step": 523780, "epoch": 6310} {"train_loss": -27.729236602783203, "global_step": 523781, "epoch": 6310} {"train_loss": -27.685413360595703, "global_step": 523782, "epoch": 6310} {"train_loss": -27.865264892578125, "global_step": 523783, "epoch": 6310} {"train_loss": -27.906585693359375, "global_step": 523784, "epoch": 6310} {"train_loss": -27.593664169311523, "global_step": 523785, "epoch": 6310} {"train_loss": -27.45962905883789, "global_step": 523786, "epoch": 6310} {"train_loss": -27.8942928314209, "global_step": 523787, "epoch": 6310} {"train_loss": -27.816144943237305, "global_step": 523788, "epoch": 6310} {"train_loss": -27.466638565063477, "global_step": 523789, "epoch": 6310} {"train_loss": -27.96990394592285, "global_step": 523790, "epoch": 6310} {"train_loss": -27.267349243164062, "global_step": 523791, "epoch": 6310} {"train_loss": -27.447134017944336, "global_step": 523792, "epoch": 6310} {"train_loss": -27.95051383972168, "global_step": 523793, "epoch": 6310} {"train_loss": -27.490766525268555, "global_step": 523794, "epoch": 6310} {"train_loss": -27.4495849609375, "global_step": 523795, "epoch": 6310} {"train_loss": -27.529050827026367, "global_step": 523796, "epoch": 6310} {"train_loss": -27.691547393798828, "global_step": 523797, "epoch": 6310} {"train_loss": -27.632314682006836, "global_step": 523798, "epoch": 6310} {"train_loss": -27.3469295501709, "global_step": 523799, "epoch": 6310} {"train_loss": -27.700607299804688, "global_step": 523800, "epoch": 6310} {"train_loss": -27.352203369140625, "global_step": 523801, "epoch": 6310} {"train_loss": -27.547033309936523, "global_step": 523802, "epoch": 6310} {"train_loss": -27.420866012573242, "global_step": 523803, "epoch": 6310} {"train_loss": -27.301843643188477, "global_step": 523804, "epoch": 6310} {"train_loss": -27.598438262939453, "global_step": 523805, "epoch": 6310} {"train_loss": -27.183258056640625, "global_step": 523806, "epoch": 6310} {"train_loss": -27.22840690612793, "global_step": 523807, "epoch": 6310} {"train_loss": -27.21738052368164, "global_step": 523808, "epoch": 6310} {"train_loss": -27.38962745666504, "global_step": 523809, "epoch": 6310} {"train_loss": -27.060880661010742, "global_step": 523810, "epoch": 6310} {"train_loss": -27.398908615112305, "global_step": 523811, "epoch": 6310} {"train_loss": -27.560352072658308, "global_step": 523812, "epoch": 6310, "val_loss": 6609810.0} {"train_loss": -26.2990665435791, "global_step": 523813, "epoch": 6311} {"train_loss": -24.443897247314453, "global_step": 523814, "epoch": 6311} {"train_loss": -24.34804916381836, "global_step": 523815, "epoch": 6311} {"train_loss": -26.794797897338867, "global_step": 523816, "epoch": 6311} {"train_loss": -26.18073844909668, "global_step": 523817, "epoch": 6311} {"train_loss": -24.763206481933594, "global_step": 523818, "epoch": 6311} {"train_loss": -27.046735763549805, "global_step": 523819, "epoch": 6311} {"train_loss": -26.023853302001953, "global_step": 523820, "epoch": 6311} {"train_loss": -26.23453140258789, "global_step": 523821, "epoch": 6311} {"train_loss": -26.13563346862793, "global_step": 523822, "epoch": 6311} {"train_loss": -26.951074600219727, "global_step": 523823, "epoch": 6311} {"train_loss": -26.11359977722168, "global_step": 523824, "epoch": 6311} {"train_loss": -26.833271026611328, "global_step": 523825, "epoch": 6311} {"train_loss": -26.730304718017578, "global_step": 523826, "epoch": 6311} {"train_loss": -26.642004013061523, "global_step": 523827, "epoch": 6311} {"train_loss": -26.769033432006836, "global_step": 523828, "epoch": 6311} {"train_loss": -26.396081924438477, "global_step": 523829, "epoch": 6311} {"train_loss": -27.008773803710938, "global_step": 523830, "epoch": 6311} {"train_loss": -26.80097007751465, "global_step": 523831, "epoch": 6311} {"train_loss": -27.008718490600586, "global_step": 523832, "epoch": 6311} {"train_loss": -26.823917388916016, "global_step": 523833, "epoch": 6311} {"train_loss": -27.17974853515625, "global_step": 523834, "epoch": 6311} {"train_loss": -27.303241729736328, "global_step": 523835, "epoch": 6311} {"train_loss": -27.20307731628418, "global_step": 523836, "epoch": 6311} {"train_loss": -27.03236198425293, "global_step": 523837, "epoch": 6311} {"train_loss": -27.461267471313477, "global_step": 523838, "epoch": 6311} {"train_loss": -26.964197158813477, "global_step": 523839, "epoch": 6311} {"train_loss": -27.2236270904541, "global_step": 523840, "epoch": 6311} {"train_loss": -26.839263916015625, "global_step": 523841, "epoch": 6311} {"train_loss": -27.273221969604492, "global_step": 523842, "epoch": 6311} {"train_loss": -27.015832901000977, "global_step": 523843, "epoch": 6311} {"train_loss": -27.434070587158203, "global_step": 523844, "epoch": 6311} {"train_loss": -27.50693702697754, "global_step": 523845, "epoch": 6311} {"train_loss": -27.182092666625977, "global_step": 523846, "epoch": 6311} {"train_loss": -27.309925079345703, "global_step": 523847, "epoch": 6311} {"train_loss": -27.42762565612793, "global_step": 523848, "epoch": 6311} {"train_loss": -27.352807998657227, "global_step": 523849, "epoch": 6311} {"train_loss": -27.435983657836914, "global_step": 523850, "epoch": 6311} {"train_loss": -27.2078800201416, "global_step": 523851, "epoch": 6311} {"train_loss": -27.24932289123535, "global_step": 523852, "epoch": 6311} {"train_loss": -27.350677490234375, "global_step": 523853, "epoch": 6311} {"train_loss": -27.52711296081543, "global_step": 523854, "epoch": 6311} {"train_loss": -27.553363800048828, "global_step": 523855, "epoch": 6311} {"train_loss": -27.5280818939209, "global_step": 523856, "epoch": 6311} {"train_loss": -27.402013778686523, "global_step": 523857, "epoch": 6311} {"train_loss": -27.76814079284668, "global_step": 523858, "epoch": 6311} {"train_loss": -27.51566505432129, "global_step": 523859, "epoch": 6311} {"train_loss": -27.906646728515625, "global_step": 523860, "epoch": 6311} {"train_loss": -27.512128829956055, "global_step": 523861, "epoch": 6311} {"train_loss": -27.030378341674805, "global_step": 523862, "epoch": 6311} {"train_loss": -27.140104293823242, "global_step": 523863, "epoch": 6311} {"train_loss": -27.607770919799805, "global_step": 523864, "epoch": 6311} {"train_loss": -27.5704402923584, "global_step": 523865, "epoch": 6311} {"train_loss": -27.346649169921875, "global_step": 523866, "epoch": 6311} {"train_loss": -27.154932022094727, "global_step": 523867, "epoch": 6311} {"train_loss": -27.579858779907227, "global_step": 523868, "epoch": 6311} {"train_loss": -27.5376033782959, "global_step": 523869, "epoch": 6311} {"train_loss": -27.596899032592773, "global_step": 523870, "epoch": 6311} {"train_loss": -27.977441787719727, "global_step": 523871, "epoch": 6311} {"train_loss": -27.80051612854004, "global_step": 523872, "epoch": 6311} {"train_loss": -27.513900756835938, "global_step": 523873, "epoch": 6311} {"train_loss": -27.573486328125, "global_step": 523874, "epoch": 6311} {"train_loss": -27.45026969909668, "global_step": 523875, "epoch": 6311} {"train_loss": -27.578832626342773, "global_step": 523876, "epoch": 6311} {"train_loss": -27.6601505279541, "global_step": 523877, "epoch": 6311} {"train_loss": -27.658063888549805, "global_step": 523878, "epoch": 6311} {"train_loss": -27.66309928894043, "global_step": 523879, "epoch": 6311} {"train_loss": -26.956287384033203, "global_step": 523880, "epoch": 6311} {"train_loss": -27.5693359375, "global_step": 523881, "epoch": 6311} {"train_loss": -28.048261642456055, "global_step": 523882, "epoch": 6311} {"train_loss": -27.24051856994629, "global_step": 523883, "epoch": 6311} {"train_loss": -27.466510772705078, "global_step": 523884, "epoch": 6311} {"train_loss": -27.509479522705078, "global_step": 523885, "epoch": 6311} {"train_loss": -27.339847564697266, "global_step": 523886, "epoch": 6311} {"train_loss": -27.718280792236328, "global_step": 523887, "epoch": 6311} {"train_loss": -27.761438369750977, "global_step": 523888, "epoch": 6311} {"train_loss": -27.456083297729492, "global_step": 523889, "epoch": 6311} {"train_loss": -27.782175064086914, "global_step": 523890, "epoch": 6311} {"train_loss": -27.816516876220703, "global_step": 523891, "epoch": 6311} {"train_loss": -27.845203399658203, "global_step": 523892, "epoch": 6311} {"train_loss": -27.485626220703125, "global_step": 523893, "epoch": 6311} {"train_loss": -28.16200065612793, "global_step": 523894, "epoch": 6311} {"train_loss": -27.170182308518743, "global_step": 523895, "epoch": 6311, "val_loss": 6589294.0} {"train_loss": -27.080785751342773, "global_step": 523896, "epoch": 6312} {"train_loss": -26.8565673828125, "global_step": 523897, "epoch": 6312} {"train_loss": -27.264881134033203, "global_step": 523898, "epoch": 6312} {"train_loss": -26.513813018798828, "global_step": 523899, "epoch": 6312} {"train_loss": -26.642780303955078, "global_step": 523900, "epoch": 6312} {"train_loss": -26.674091339111328, "global_step": 523901, "epoch": 6312} {"train_loss": -27.379974365234375, "global_step": 523902, "epoch": 6312} {"train_loss": -27.106470108032227, "global_step": 523903, "epoch": 6312} {"train_loss": -26.807464599609375, "global_step": 523904, "epoch": 6312} {"train_loss": -27.241422653198242, "global_step": 523905, "epoch": 6312} {"train_loss": -27.345178604125977, "global_step": 523906, "epoch": 6312} {"train_loss": -27.206790924072266, "global_step": 523907, "epoch": 6312} {"train_loss": -27.21498680114746, "global_step": 523908, "epoch": 6312} {"train_loss": -27.528076171875, "global_step": 523909, "epoch": 6312} {"train_loss": -27.1669979095459, "global_step": 523910, "epoch": 6312} {"train_loss": -27.77094078063965, "global_step": 523911, "epoch": 6312} {"train_loss": -26.97482681274414, "global_step": 523912, "epoch": 6312} {"train_loss": -26.96921730041504, "global_step": 523913, "epoch": 6312} {"train_loss": -27.3612060546875, "global_step": 523914, "epoch": 6312} {"train_loss": -27.610578536987305, "global_step": 523915, "epoch": 6312} {"train_loss": -27.7398738861084, "global_step": 523916, "epoch": 6312} {"train_loss": -27.414234161376953, "global_step": 523917, "epoch": 6312} {"train_loss": -27.370990753173828, "global_step": 523918, "epoch": 6312} {"train_loss": -27.295608520507812, "global_step": 523919, "epoch": 6312} {"train_loss": -27.619977951049805, "global_step": 523920, "epoch": 6312} {"train_loss": -27.119348526000977, "global_step": 523921, "epoch": 6312} {"train_loss": -27.477685928344727, "global_step": 523922, "epoch": 6312} {"train_loss": -27.5780086517334, "global_step": 523923, "epoch": 6312} {"train_loss": -27.176267623901367, "global_step": 523924, "epoch": 6312} {"train_loss": -27.463354110717773, "global_step": 523925, "epoch": 6312} {"train_loss": -27.185590744018555, "global_step": 523926, "epoch": 6312} {"train_loss": -27.736963272094727, "global_step": 523927, "epoch": 6312} {"train_loss": -27.7791805267334, "global_step": 523928, "epoch": 6312} {"train_loss": -27.366596221923828, "global_step": 523929, "epoch": 6312} {"train_loss": -27.445560455322266, "global_step": 523930, "epoch": 6312} {"train_loss": -27.54278564453125, "global_step": 523931, "epoch": 6312} {"train_loss": -27.818395614624023, "global_step": 523932, "epoch": 6312} {"train_loss": -27.2395076751709, "global_step": 523933, "epoch": 6312} {"train_loss": -27.659290313720703, "global_step": 523934, "epoch": 6312} {"train_loss": -27.621435165405273, "global_step": 523935, "epoch": 6312} {"train_loss": -27.749053955078125, "global_step": 523936, "epoch": 6312} {"train_loss": -27.736892700195312, "global_step": 523937, "epoch": 6312} {"train_loss": -27.733442306518555, "global_step": 523938, "epoch": 6312} {"train_loss": -27.401586532592773, "global_step": 523939, "epoch": 6312} {"train_loss": -27.80047035217285, "global_step": 523940, "epoch": 6312} {"train_loss": -27.972318649291992, "global_step": 523941, "epoch": 6312} {"train_loss": -27.718774795532227, "global_step": 523942, "epoch": 6312} {"train_loss": -27.615192413330078, "global_step": 523943, "epoch": 6312} {"train_loss": -27.55549430847168, "global_step": 523944, "epoch": 6312} {"train_loss": -27.70650291442871, "global_step": 523945, "epoch": 6312} {"train_loss": -27.87995719909668, "global_step": 523946, "epoch": 6312} {"train_loss": -27.83245849609375, "global_step": 523947, "epoch": 6312} {"train_loss": -27.9715633392334, "global_step": 523948, "epoch": 6312} {"train_loss": -27.641342163085938, "global_step": 523949, "epoch": 6312} {"train_loss": -27.401229858398438, "global_step": 523950, "epoch": 6312} {"train_loss": -27.677051544189453, "global_step": 523951, "epoch": 6312} {"train_loss": -27.91567039489746, "global_step": 523952, "epoch": 6312} {"train_loss": -27.827966690063477, "global_step": 523953, "epoch": 6312} {"train_loss": -27.639148712158203, "global_step": 523954, "epoch": 6312} {"train_loss": -27.83411979675293, "global_step": 523955, "epoch": 6312} {"train_loss": -27.62347412109375, "global_step": 523956, "epoch": 6312} {"train_loss": -27.75140953063965, "global_step": 523957, "epoch": 6312} {"train_loss": -27.260028839111328, "global_step": 523958, "epoch": 6312} {"train_loss": -27.243072509765625, "global_step": 523959, "epoch": 6312} {"train_loss": -27.1776123046875, "global_step": 523960, "epoch": 6312} {"train_loss": -26.12013053894043, "global_step": 523961, "epoch": 6312} {"train_loss": -25.751806259155273, "global_step": 523962, "epoch": 6312} {"train_loss": -26.612462997436523, "global_step": 523963, "epoch": 6312} {"train_loss": -27.453046798706055, "global_step": 523964, "epoch": 6312} {"train_loss": -27.15192985534668, "global_step": 523965, "epoch": 6312} {"train_loss": -27.089075088500977, "global_step": 523966, "epoch": 6312} {"train_loss": -27.053125381469727, "global_step": 523967, "epoch": 6312} {"train_loss": -27.77259635925293, "global_step": 523968, "epoch": 6312} {"train_loss": -27.59613609313965, "global_step": 523969, "epoch": 6312} {"train_loss": -27.364835739135742, "global_step": 523970, "epoch": 6312} {"train_loss": -27.530736923217773, "global_step": 523971, "epoch": 6312} {"train_loss": -27.15789222717285, "global_step": 523972, "epoch": 6312} {"train_loss": -27.75785255432129, "global_step": 523973, "epoch": 6312} {"train_loss": -27.468542098999023, "global_step": 523974, "epoch": 6312} {"train_loss": -27.72883415222168, "global_step": 523975, "epoch": 6312} {"train_loss": -27.52105712890625, "global_step": 523976, "epoch": 6312} {"train_loss": -27.578384399414062, "global_step": 523977, "epoch": 6312} {"train_loss": -27.39087585081537, "global_step": 523978, "epoch": 6312, "val_loss": 6659532.0} {"train_loss": -27.145185470581055, "global_step": 523979, "epoch": 6313} {"train_loss": -26.537763595581055, "global_step": 523980, "epoch": 6313} {"train_loss": -27.101469039916992, "global_step": 523981, "epoch": 6313} {"train_loss": -27.322193145751953, "global_step": 523982, "epoch": 6313} {"train_loss": -26.90743064880371, "global_step": 523983, "epoch": 6313} {"train_loss": -26.886709213256836, "global_step": 523984, "epoch": 6313} {"train_loss": -26.26869773864746, "global_step": 523985, "epoch": 6313} {"train_loss": -27.05805015563965, "global_step": 523986, "epoch": 6313} {"train_loss": -27.152570724487305, "global_step": 523987, "epoch": 6313} {"train_loss": -27.0184383392334, "global_step": 523988, "epoch": 6313} {"train_loss": -27.292724609375, "global_step": 523989, "epoch": 6313} {"train_loss": -27.272064208984375, "global_step": 523990, "epoch": 6313} {"train_loss": -27.054157257080078, "global_step": 523991, "epoch": 6313} {"train_loss": -26.9244327545166, "global_step": 523992, "epoch": 6313} {"train_loss": -27.118377685546875, "global_step": 523993, "epoch": 6313} {"train_loss": -27.037893295288086, "global_step": 523994, "epoch": 6313} {"train_loss": -27.284753799438477, "global_step": 523995, "epoch": 6313} {"train_loss": -27.208667755126953, "global_step": 523996, "epoch": 6313} {"train_loss": -27.53106117248535, "global_step": 523997, "epoch": 6313} {"train_loss": -27.4854736328125, "global_step": 523998, "epoch": 6313} {"train_loss": -27.115697860717773, "global_step": 523999, "epoch": 6313} {"train_loss": -27.779129028320312, "global_step": 524000, "epoch": 6313} {"train_loss": -27.19110107421875, "global_step": 524001, "epoch": 6313} {"train_loss": -27.45119285583496, "global_step": 524002, "epoch": 6313} {"train_loss": -27.08326530456543, "global_step": 524003, "epoch": 6313} {"train_loss": -27.771162033081055, "global_step": 524004, "epoch": 6313} {"train_loss": -27.4034366607666, "global_step": 524005, "epoch": 6313} {"train_loss": -27.511341094970703, "global_step": 524006, "epoch": 6313} {"train_loss": -27.626251220703125, "global_step": 524007, "epoch": 6313} {"train_loss": -27.35148048400879, "global_step": 524008, "epoch": 6313} {"train_loss": -27.923425674438477, "global_step": 524009, "epoch": 6313} {"train_loss": -27.22964859008789, "global_step": 524010, "epoch": 6313} {"train_loss": -27.657154083251953, "global_step": 524011, "epoch": 6313} {"train_loss": -27.818262100219727, "global_step": 524012, "epoch": 6313} {"train_loss": -28.039154052734375, "global_step": 524013, "epoch": 6313} {"train_loss": -27.6495418548584, "global_step": 524014, "epoch": 6313} {"train_loss": -27.787586212158203, "global_step": 524015, "epoch": 6313} {"train_loss": -27.50545310974121, "global_step": 524016, "epoch": 6313} {"train_loss": -27.972152709960938, "global_step": 524017, "epoch": 6313} {"train_loss": -27.65775489807129, "global_step": 524018, "epoch": 6313} {"train_loss": -27.42188835144043, "global_step": 524019, "epoch": 6313} {"train_loss": -27.928730010986328, "global_step": 524020, "epoch": 6313} {"train_loss": -27.611860275268555, "global_step": 524021, "epoch": 6313} {"train_loss": -27.541624069213867, "global_step": 524022, "epoch": 6313} {"train_loss": -27.680423736572266, "global_step": 524023, "epoch": 6313} {"train_loss": -27.967145919799805, "global_step": 524024, "epoch": 6313} {"train_loss": -27.602521896362305, "global_step": 524025, "epoch": 6313} {"train_loss": -27.804731369018555, "global_step": 524026, "epoch": 6313} {"train_loss": -27.739500045776367, "global_step": 524027, "epoch": 6313} {"train_loss": -27.68912696838379, "global_step": 524028, "epoch": 6313} {"train_loss": -28.08060073852539, "global_step": 524029, "epoch": 6313} {"train_loss": -27.510517120361328, "global_step": 524030, "epoch": 6313} {"train_loss": -27.494998931884766, "global_step": 524031, "epoch": 6313} {"train_loss": -27.435117721557617, "global_step": 524032, "epoch": 6313} {"train_loss": -27.468463897705078, "global_step": 524033, "epoch": 6313} {"train_loss": -27.906696319580078, "global_step": 524034, "epoch": 6313} {"train_loss": -27.751346588134766, "global_step": 524035, "epoch": 6313} {"train_loss": -27.85715675354004, "global_step": 524036, "epoch": 6313} {"train_loss": -27.681970596313477, "global_step": 524037, "epoch": 6313} {"train_loss": -27.254150390625, "global_step": 524038, "epoch": 6313} {"train_loss": -27.364439010620117, "global_step": 524039, "epoch": 6313} {"train_loss": -27.929962158203125, "global_step": 524040, "epoch": 6313} {"train_loss": -27.5263671875, "global_step": 524041, "epoch": 6313} {"train_loss": -27.411041259765625, "global_step": 524042, "epoch": 6313} {"train_loss": -27.827136993408203, "global_step": 524043, "epoch": 6313} {"train_loss": -27.764272689819336, "global_step": 524044, "epoch": 6313} {"train_loss": -27.506113052368164, "global_step": 524045, "epoch": 6313} {"train_loss": -27.54618263244629, "global_step": 524046, "epoch": 6313} {"train_loss": -27.68597984313965, "global_step": 524047, "epoch": 6313} {"train_loss": -27.38321876525879, "global_step": 524048, "epoch": 6313} {"train_loss": -27.19403648376465, "global_step": 524049, "epoch": 6313} {"train_loss": -27.749313354492188, "global_step": 524050, "epoch": 6313} {"train_loss": -27.13251304626465, "global_step": 524051, "epoch": 6313} {"train_loss": -27.245330810546875, "global_step": 524052, "epoch": 6313} {"train_loss": -27.6375732421875, "global_step": 524053, "epoch": 6313} {"train_loss": -27.974668502807617, "global_step": 524054, "epoch": 6313} {"train_loss": -27.67127799987793, "global_step": 524055, "epoch": 6313} {"train_loss": -27.829328536987305, "global_step": 524056, "epoch": 6313} {"train_loss": -27.692188262939453, "global_step": 524057, "epoch": 6313} {"train_loss": -27.58098793029785, "global_step": 524058, "epoch": 6313} {"train_loss": -27.47494888305664, "global_step": 524059, "epoch": 6313} {"train_loss": -27.41387367248535, "global_step": 524060, "epoch": 6313} {"train_loss": -27.473644141691278, "global_step": 524061, "epoch": 6313, "val_loss": 6616556.0} {"train_loss": -25.472774505615234, "global_step": 524062, "epoch": 6314} {"train_loss": -26.13298988342285, "global_step": 524063, "epoch": 6314} {"train_loss": -26.47889518737793, "global_step": 524064, "epoch": 6314} {"train_loss": -26.665714263916016, "global_step": 524065, "epoch": 6314} {"train_loss": -26.500385284423828, "global_step": 524066, "epoch": 6314} {"train_loss": -26.37531089782715, "global_step": 524067, "epoch": 6314} {"train_loss": -26.456571578979492, "global_step": 524068, "epoch": 6314} {"train_loss": -26.6550350189209, "global_step": 524069, "epoch": 6314} {"train_loss": -26.233768463134766, "global_step": 524070, "epoch": 6314} {"train_loss": -26.8984375, "global_step": 524071, "epoch": 6314} {"train_loss": -26.29132652282715, "global_step": 524072, "epoch": 6314} {"train_loss": -26.369062423706055, "global_step": 524073, "epoch": 6314} {"train_loss": -26.533679962158203, "global_step": 524074, "epoch": 6314} {"train_loss": -26.934202194213867, "global_step": 524075, "epoch": 6314} {"train_loss": -26.86256217956543, "global_step": 524076, "epoch": 6314} {"train_loss": -26.815631866455078, "global_step": 524077, "epoch": 6314} {"train_loss": -26.764074325561523, "global_step": 524078, "epoch": 6314} {"train_loss": -26.52045249938965, "global_step": 524079, "epoch": 6314} {"train_loss": -27.170862197875977, "global_step": 524080, "epoch": 6314} {"train_loss": -26.95493507385254, "global_step": 524081, "epoch": 6314} {"train_loss": -27.20917320251465, "global_step": 524082, "epoch": 6314} {"train_loss": -27.288787841796875, "global_step": 524083, "epoch": 6314} {"train_loss": -26.968969345092773, "global_step": 524084, "epoch": 6314} {"train_loss": -27.200851440429688, "global_step": 524085, "epoch": 6314} {"train_loss": -27.239404678344727, "global_step": 524086, "epoch": 6314} {"train_loss": -27.0450439453125, "global_step": 524087, "epoch": 6314} {"train_loss": -27.406137466430664, "global_step": 524088, "epoch": 6314} {"train_loss": -27.287403106689453, "global_step": 524089, "epoch": 6314} {"train_loss": -27.106719970703125, "global_step": 524090, "epoch": 6314} {"train_loss": -27.20761489868164, "global_step": 524091, "epoch": 6314} {"train_loss": -27.247312545776367, "global_step": 524092, "epoch": 6314} {"train_loss": -27.200986862182617, "global_step": 524093, "epoch": 6314} {"train_loss": -27.54657554626465, "global_step": 524094, "epoch": 6314} {"train_loss": -27.33269691467285, "global_step": 524095, "epoch": 6314} {"train_loss": -27.45853042602539, "global_step": 524096, "epoch": 6314} {"train_loss": -27.45526123046875, "global_step": 524097, "epoch": 6314} {"train_loss": -27.163360595703125, "global_step": 524098, "epoch": 6314} {"train_loss": -27.444555282592773, "global_step": 524099, "epoch": 6314} {"train_loss": -27.39911460876465, "global_step": 524100, "epoch": 6314} {"train_loss": -27.531335830688477, "global_step": 524101, "epoch": 6314} {"train_loss": -27.972272872924805, "global_step": 524102, "epoch": 6314} {"train_loss": -27.1932315826416, "global_step": 524103, "epoch": 6314} {"train_loss": -27.609785079956055, "global_step": 524104, "epoch": 6314} {"train_loss": -27.598663330078125, "global_step": 524105, "epoch": 6314} {"train_loss": -27.48095703125, "global_step": 524106, "epoch": 6314} {"train_loss": -27.575048446655273, "global_step": 524107, "epoch": 6314} {"train_loss": -27.483434677124023, "global_step": 524108, "epoch": 6314} {"train_loss": -27.330305099487305, "global_step": 524109, "epoch": 6314} {"train_loss": -27.464094161987305, "global_step": 524110, "epoch": 6314} {"train_loss": -27.6889705657959, "global_step": 524111, "epoch": 6314} {"train_loss": -27.73042106628418, "global_step": 524112, "epoch": 6314} {"train_loss": -27.611501693725586, "global_step": 524113, "epoch": 6314} {"train_loss": -27.794126510620117, "global_step": 524114, "epoch": 6314} {"train_loss": -27.820404052734375, "global_step": 524115, "epoch": 6314} {"train_loss": -27.62470817565918, "global_step": 524116, "epoch": 6314} {"train_loss": -27.786895751953125, "global_step": 524117, "epoch": 6314} {"train_loss": -27.696691513061523, "global_step": 524118, "epoch": 6314} {"train_loss": -27.238203048706055, "global_step": 524119, "epoch": 6314} {"train_loss": -27.327320098876953, "global_step": 524120, "epoch": 6314} {"train_loss": -27.354965209960938, "global_step": 524121, "epoch": 6314} {"train_loss": -27.579681396484375, "global_step": 524122, "epoch": 6314} {"train_loss": -27.67952537536621, "global_step": 524123, "epoch": 6314} {"train_loss": -27.525617599487305, "global_step": 524124, "epoch": 6314} {"train_loss": -27.577234268188477, "global_step": 524125, "epoch": 6314} {"train_loss": -27.6467342376709, "global_step": 524126, "epoch": 6314} {"train_loss": -27.53687858581543, "global_step": 524127, "epoch": 6314} {"train_loss": -27.570438385009766, "global_step": 524128, "epoch": 6314} {"train_loss": -27.37433433532715, "global_step": 524129, "epoch": 6314} {"train_loss": -27.628442764282227, "global_step": 524130, "epoch": 6314} {"train_loss": -27.572362899780273, "global_step": 524131, "epoch": 6314} {"train_loss": -27.70149803161621, "global_step": 524132, "epoch": 6314} {"train_loss": -28.11805534362793, "global_step": 524133, "epoch": 6314} {"train_loss": -27.678882598876953, "global_step": 524134, "epoch": 6314} {"train_loss": -27.66404151916504, "global_step": 524135, "epoch": 6314} {"train_loss": -27.619291305541992, "global_step": 524136, "epoch": 6314} {"train_loss": -27.73027992248535, "global_step": 524137, "epoch": 6314} {"train_loss": -27.80511474609375, "global_step": 524138, "epoch": 6314} {"train_loss": -27.502166748046875, "global_step": 524139, "epoch": 6314} {"train_loss": -27.27874755859375, "global_step": 524140, "epoch": 6314} {"train_loss": -27.605316162109375, "global_step": 524141, "epoch": 6314} {"train_loss": -27.787878036499023, "global_step": 524142, "epoch": 6314} {"train_loss": -27.192296981811523, "global_step": 524143, "epoch": 6314} {"train_loss": -27.26290254707796, "global_step": 524144, "epoch": 6314, "val_loss": 6639422.0} {"train_loss": -25.776090621948242, "global_step": 524145, "epoch": 6315} {"train_loss": -22.928937911987305, "global_step": 524146, "epoch": 6315} {"train_loss": -25.109106063842773, "global_step": 524147, "epoch": 6315} {"train_loss": -26.023883819580078, "global_step": 524148, "epoch": 6315} {"train_loss": -25.967008590698242, "global_step": 524149, "epoch": 6315} {"train_loss": -26.282907485961914, "global_step": 524150, "epoch": 6315} {"train_loss": -26.490888595581055, "global_step": 524151, "epoch": 6315} {"train_loss": -26.227100372314453, "global_step": 524152, "epoch": 6315} {"train_loss": -26.573827743530273, "global_step": 524153, "epoch": 6315} {"train_loss": -26.948444366455078, "global_step": 524154, "epoch": 6315} {"train_loss": -26.091033935546875, "global_step": 524155, "epoch": 6315} {"train_loss": -27.204059600830078, "global_step": 524156, "epoch": 6315} {"train_loss": -27.100879669189453, "global_step": 524157, "epoch": 6315} {"train_loss": -26.452136993408203, "global_step": 524158, "epoch": 6315} {"train_loss": -26.828840255737305, "global_step": 524159, "epoch": 6315} {"train_loss": -26.740345001220703, "global_step": 524160, "epoch": 6315} {"train_loss": -26.958295822143555, "global_step": 524161, "epoch": 6315} {"train_loss": -26.790525436401367, "global_step": 524162, "epoch": 6315} {"train_loss": -26.578826904296875, "global_step": 524163, "epoch": 6315} {"train_loss": -26.862707138061523, "global_step": 524164, "epoch": 6315} {"train_loss": -26.82838249206543, "global_step": 524165, "epoch": 6315} {"train_loss": -27.16094398498535, "global_step": 524166, "epoch": 6315} {"train_loss": -27.03492546081543, "global_step": 524167, "epoch": 6315} {"train_loss": -26.961536407470703, "global_step": 524168, "epoch": 6315} {"train_loss": -27.154632568359375, "global_step": 524169, "epoch": 6315} {"train_loss": -27.177997589111328, "global_step": 524170, "epoch": 6315} {"train_loss": -27.43059730529785, "global_step": 524171, "epoch": 6315} {"train_loss": -27.256378173828125, "global_step": 524172, "epoch": 6315} {"train_loss": -26.70338249206543, "global_step": 524173, "epoch": 6315} {"train_loss": -27.207178115844727, "global_step": 524174, "epoch": 6315} {"train_loss": -27.164337158203125, "global_step": 524175, "epoch": 6315} {"train_loss": -27.365192413330078, "global_step": 524176, "epoch": 6315} {"train_loss": -27.503087997436523, "global_step": 524177, "epoch": 6315} {"train_loss": -27.04131507873535, "global_step": 524178, "epoch": 6315} {"train_loss": -27.394601821899414, "global_step": 524179, "epoch": 6315} {"train_loss": -27.311248779296875, "global_step": 524180, "epoch": 6315} {"train_loss": -27.163593292236328, "global_step": 524181, "epoch": 6315} {"train_loss": -27.400800704956055, "global_step": 524182, "epoch": 6315} {"train_loss": -27.510944366455078, "global_step": 524183, "epoch": 6315} {"train_loss": -27.12322998046875, "global_step": 524184, "epoch": 6315} {"train_loss": -27.133604049682617, "global_step": 524185, "epoch": 6315} {"train_loss": -27.4243221282959, "global_step": 524186, "epoch": 6315} {"train_loss": -27.201141357421875, "global_step": 524187, "epoch": 6315} {"train_loss": -27.30061149597168, "global_step": 524188, "epoch": 6315} {"train_loss": -27.056623458862305, "global_step": 524189, "epoch": 6315} {"train_loss": -27.120990753173828, "global_step": 524190, "epoch": 6315} {"train_loss": -27.172460556030273, "global_step": 524191, "epoch": 6315} {"train_loss": -27.152420043945312, "global_step": 524192, "epoch": 6315} {"train_loss": -27.174667358398438, "global_step": 524193, "epoch": 6315} {"train_loss": -27.385395050048828, "global_step": 524194, "epoch": 6315} {"train_loss": -27.652639389038086, "global_step": 524195, "epoch": 6315} {"train_loss": -27.043272018432617, "global_step": 524196, "epoch": 6315} {"train_loss": -27.51679039001465, "global_step": 524197, "epoch": 6315} {"train_loss": -27.69976234436035, "global_step": 524198, "epoch": 6315} {"train_loss": -27.317672729492188, "global_step": 524199, "epoch": 6315} {"train_loss": -26.95892333984375, "global_step": 524200, "epoch": 6315} {"train_loss": -27.71600914001465, "global_step": 524201, "epoch": 6315} {"train_loss": -28.155517578125, "global_step": 524202, "epoch": 6315} {"train_loss": -27.549970626831055, "global_step": 524203, "epoch": 6315} {"train_loss": -27.239667892456055, "global_step": 524204, "epoch": 6315} {"train_loss": -27.2849178314209, "global_step": 524205, "epoch": 6315} {"train_loss": -27.73699951171875, "global_step": 524206, "epoch": 6315} {"train_loss": -27.458524703979492, "global_step": 524207, "epoch": 6315} {"train_loss": -27.169971466064453, "global_step": 524208, "epoch": 6315} {"train_loss": -27.961694717407227, "global_step": 524209, "epoch": 6315} {"train_loss": -27.751020431518555, "global_step": 524210, "epoch": 6315} {"train_loss": -27.465747833251953, "global_step": 524211, "epoch": 6315} {"train_loss": -27.68337059020996, "global_step": 524212, "epoch": 6315} {"train_loss": -27.627668380737305, "global_step": 524213, "epoch": 6315} {"train_loss": -27.734546661376953, "global_step": 524214, "epoch": 6315} {"train_loss": -27.272979736328125, "global_step": 524215, "epoch": 6315} {"train_loss": -27.739099502563477, "global_step": 524216, "epoch": 6315} {"train_loss": -27.900983810424805, "global_step": 524217, "epoch": 6315} {"train_loss": -27.547779083251953, "global_step": 524218, "epoch": 6315} {"train_loss": -27.576587677001953, "global_step": 524219, "epoch": 6315} {"train_loss": -27.657934188842773, "global_step": 524220, "epoch": 6315} {"train_loss": -27.291645050048828, "global_step": 524221, "epoch": 6315} {"train_loss": -27.54395866394043, "global_step": 524222, "epoch": 6315} {"train_loss": -27.681516647338867, "global_step": 524223, "epoch": 6315} {"train_loss": -27.452133178710938, "global_step": 524224, "epoch": 6315} {"train_loss": -27.59059715270996, "global_step": 524225, "epoch": 6315} {"train_loss": -27.691375732421875, "global_step": 524226, "epoch": 6315} {"train_loss": -27.128656846931182, "global_step": 524227, "epoch": 6315, "val_loss": 6652922.0} {"train_loss": -27.59895133972168, "global_step": 524228, "epoch": 6316} {"train_loss": -27.70136833190918, "global_step": 524229, "epoch": 6316} {"train_loss": -27.186792373657227, "global_step": 524230, "epoch": 6316} {"train_loss": -27.43792724609375, "global_step": 524231, "epoch": 6316} {"train_loss": -27.500701904296875, "global_step": 524232, "epoch": 6316} {"train_loss": -27.330835342407227, "global_step": 524233, "epoch": 6316} {"train_loss": -27.45545768737793, "global_step": 524234, "epoch": 6316} {"train_loss": -27.121997833251953, "global_step": 524235, "epoch": 6316} {"train_loss": -27.654449462890625, "global_step": 524236, "epoch": 6316} {"train_loss": -27.517475128173828, "global_step": 524237, "epoch": 6316} {"train_loss": -27.597375869750977, "global_step": 524238, "epoch": 6316} {"train_loss": -27.406522750854492, "global_step": 524239, "epoch": 6316} {"train_loss": -27.7347354888916, "global_step": 524240, "epoch": 6316} {"train_loss": -27.564411163330078, "global_step": 524241, "epoch": 6316} {"train_loss": -27.59933853149414, "global_step": 524242, "epoch": 6316} {"train_loss": -27.5305233001709, "global_step": 524243, "epoch": 6316} {"train_loss": -27.573251724243164, "global_step": 524244, "epoch": 6316} {"train_loss": -27.60113525390625, "global_step": 524245, "epoch": 6316} {"train_loss": -27.594018936157227, "global_step": 524246, "epoch": 6316} {"train_loss": -27.61793327331543, "global_step": 524247, "epoch": 6316} {"train_loss": -27.600574493408203, "global_step": 524248, "epoch": 6316} {"train_loss": -27.43842887878418, "global_step": 524249, "epoch": 6316} {"train_loss": -27.92940330505371, "global_step": 524250, "epoch": 6316} {"train_loss": -27.525251388549805, "global_step": 524251, "epoch": 6316} {"train_loss": -27.705646514892578, "global_step": 524252, "epoch": 6316} {"train_loss": -27.68623924255371, "global_step": 524253, "epoch": 6316} {"train_loss": -27.352216720581055, "global_step": 524254, "epoch": 6316} {"train_loss": -27.667402267456055, "global_step": 524255, "epoch": 6316} {"train_loss": -27.372589111328125, "global_step": 524256, "epoch": 6316} {"train_loss": -27.41033363342285, "global_step": 524257, "epoch": 6316} {"train_loss": -27.472522735595703, "global_step": 524258, "epoch": 6316} {"train_loss": -27.576324462890625, "global_step": 524259, "epoch": 6316} {"train_loss": -27.612751007080078, "global_step": 524260, "epoch": 6316} {"train_loss": -27.283782958984375, "global_step": 524261, "epoch": 6316} {"train_loss": -27.300832748413086, "global_step": 524262, "epoch": 6316} {"train_loss": -27.06629753112793, "global_step": 524263, "epoch": 6316} {"train_loss": -27.293014526367188, "global_step": 524264, "epoch": 6316} {"train_loss": -27.12550163269043, "global_step": 524265, "epoch": 6316} {"train_loss": -27.492843627929688, "global_step": 524266, "epoch": 6316} {"train_loss": -26.81430435180664, "global_step": 524267, "epoch": 6316} {"train_loss": -27.538419723510742, "global_step": 524268, "epoch": 6316} {"train_loss": -27.260894775390625, "global_step": 524269, "epoch": 6316} {"train_loss": -27.502777099609375, "global_step": 524270, "epoch": 6316} {"train_loss": -27.479368209838867, "global_step": 524271, "epoch": 6316} {"train_loss": -27.418363571166992, "global_step": 524272, "epoch": 6316} {"train_loss": -27.15496826171875, "global_step": 524273, "epoch": 6316} {"train_loss": -27.765613555908203, "global_step": 524274, "epoch": 6316} {"train_loss": -27.617944717407227, "global_step": 524275, "epoch": 6316} {"train_loss": -27.403852462768555, "global_step": 524276, "epoch": 6316} {"train_loss": -27.518720626831055, "global_step": 524277, "epoch": 6316} {"train_loss": -28.000946044921875, "global_step": 524278, "epoch": 6316} {"train_loss": -27.371572494506836, "global_step": 524279, "epoch": 6316} {"train_loss": -27.441608428955078, "global_step": 524280, "epoch": 6316} {"train_loss": -27.6843204498291, "global_step": 524281, "epoch": 6316} {"train_loss": -27.71905517578125, "global_step": 524282, "epoch": 6316} {"train_loss": -27.26270866394043, "global_step": 524283, "epoch": 6316} {"train_loss": -27.82801628112793, "global_step": 524284, "epoch": 6316} {"train_loss": -27.811981201171875, "global_step": 524285, "epoch": 6316} {"train_loss": -27.54075050354004, "global_step": 524286, "epoch": 6316} {"train_loss": -27.565805435180664, "global_step": 524287, "epoch": 6316} {"train_loss": -28.01548194885254, "global_step": 524288, "epoch": 6316} {"train_loss": -27.17431640625, "global_step": 524289, "epoch": 6316} {"train_loss": -27.743244171142578, "global_step": 524290, "epoch": 6316} {"train_loss": -27.635456085205078, "global_step": 524291, "epoch": 6316} {"train_loss": -28.022192001342773, "global_step": 524292, "epoch": 6316} {"train_loss": -27.422407150268555, "global_step": 524293, "epoch": 6316} {"train_loss": -27.4969425201416, "global_step": 524294, "epoch": 6316} {"train_loss": -27.35466957092285, "global_step": 524295, "epoch": 6316} {"train_loss": -27.62567710876465, "global_step": 524296, "epoch": 6316} {"train_loss": -28.03312110900879, "global_step": 524297, "epoch": 6316} {"train_loss": -27.176868438720703, "global_step": 524298, "epoch": 6316} {"train_loss": -27.548940658569336, "global_step": 524299, "epoch": 6316} {"train_loss": -27.75391960144043, "global_step": 524300, "epoch": 6316} {"train_loss": -27.334924697875977, "global_step": 524301, "epoch": 6316} {"train_loss": -27.67441177368164, "global_step": 524302, "epoch": 6316} {"train_loss": -27.682544708251953, "global_step": 524303, "epoch": 6316} {"train_loss": -27.69384765625, "global_step": 524304, "epoch": 6316} {"train_loss": -27.6843204498291, "global_step": 524305, "epoch": 6316} {"train_loss": -27.962299346923828, "global_step": 524306, "epoch": 6316} {"train_loss": -28.065155029296875, "global_step": 524307, "epoch": 6316} {"train_loss": -27.917455673217773, "global_step": 524308, "epoch": 6316} {"train_loss": -27.539350509643555, "global_step": 524309, "epoch": 6316} {"train_loss": -27.557777519685676, "global_step": 524310, "epoch": 6316, "val_loss": 6599896.5} {"train_loss": -27.020980834960938, "global_step": 524311, "epoch": 6317} {"train_loss": -26.11024284362793, "global_step": 524312, "epoch": 6317} {"train_loss": -26.863183975219727, "global_step": 524313, "epoch": 6317} {"train_loss": -27.251855850219727, "global_step": 524314, "epoch": 6317} {"train_loss": -26.861988067626953, "global_step": 524315, "epoch": 6317} {"train_loss": -26.24820327758789, "global_step": 524316, "epoch": 6317} {"train_loss": -26.76032829284668, "global_step": 524317, "epoch": 6317} {"train_loss": -26.91892433166504, "global_step": 524318, "epoch": 6317} {"train_loss": -26.886526107788086, "global_step": 524319, "epoch": 6317} {"train_loss": -26.4742374420166, "global_step": 524320, "epoch": 6317} {"train_loss": -27.208484649658203, "global_step": 524321, "epoch": 6317} {"train_loss": -26.755720138549805, "global_step": 524322, "epoch": 6317} {"train_loss": -27.41511344909668, "global_step": 524323, "epoch": 6317} {"train_loss": -26.91187858581543, "global_step": 524324, "epoch": 6317} {"train_loss": -26.87192726135254, "global_step": 524325, "epoch": 6317} {"train_loss": -26.722822189331055, "global_step": 524326, "epoch": 6317} {"train_loss": -27.329818725585938, "global_step": 524327, "epoch": 6317} {"train_loss": -26.972143173217773, "global_step": 524328, "epoch": 6317} {"train_loss": -26.952911376953125, "global_step": 524329, "epoch": 6317} {"train_loss": -27.2110538482666, "global_step": 524330, "epoch": 6317} {"train_loss": -27.46005630493164, "global_step": 524331, "epoch": 6317} {"train_loss": -27.23673439025879, "global_step": 524332, "epoch": 6317} {"train_loss": -27.106054306030273, "global_step": 524333, "epoch": 6317} {"train_loss": -27.32832145690918, "global_step": 524334, "epoch": 6317} {"train_loss": -27.302398681640625, "global_step": 524335, "epoch": 6317} {"train_loss": -27.67411231994629, "global_step": 524336, "epoch": 6317} {"train_loss": -27.293033599853516, "global_step": 524337, "epoch": 6317} {"train_loss": -27.056293487548828, "global_step": 524338, "epoch": 6317} {"train_loss": -27.395444869995117, "global_step": 524339, "epoch": 6317} {"train_loss": -27.249719619750977, "global_step": 524340, "epoch": 6317} {"train_loss": -27.390295028686523, "global_step": 524341, "epoch": 6317} {"train_loss": -27.51043128967285, "global_step": 524342, "epoch": 6317} {"train_loss": -27.36322021484375, "global_step": 524343, "epoch": 6317} {"train_loss": -27.504150390625, "global_step": 524344, "epoch": 6317} {"train_loss": -27.492517471313477, "global_step": 524345, "epoch": 6317} {"train_loss": -27.549657821655273, "global_step": 524346, "epoch": 6317} {"train_loss": -27.666357040405273, "global_step": 524347, "epoch": 6317} {"train_loss": -27.379077911376953, "global_step": 524348, "epoch": 6317} {"train_loss": -27.557275772094727, "global_step": 524349, "epoch": 6317} {"train_loss": -27.75410270690918, "global_step": 524350, "epoch": 6317} {"train_loss": -27.55402183532715, "global_step": 524351, "epoch": 6317} {"train_loss": -27.471542358398438, "global_step": 524352, "epoch": 6317} {"train_loss": -27.46821403503418, "global_step": 524353, "epoch": 6317} {"train_loss": -27.441003799438477, "global_step": 524354, "epoch": 6317} {"train_loss": -27.380273818969727, "global_step": 524355, "epoch": 6317} {"train_loss": -27.656843185424805, "global_step": 524356, "epoch": 6317} {"train_loss": -27.450849533081055, "global_step": 524357, "epoch": 6317} {"train_loss": -28.05158042907715, "global_step": 524358, "epoch": 6317} {"train_loss": -27.37387466430664, "global_step": 524359, "epoch": 6317} {"train_loss": -27.431991577148438, "global_step": 524360, "epoch": 6317} {"train_loss": -27.619897842407227, "global_step": 524361, "epoch": 6317} {"train_loss": -27.57343864440918, "global_step": 524362, "epoch": 6317} {"train_loss": -27.66187858581543, "global_step": 524363, "epoch": 6317} {"train_loss": -27.288785934448242, "global_step": 524364, "epoch": 6317} {"train_loss": -27.730138778686523, "global_step": 524365, "epoch": 6317} {"train_loss": -27.89194107055664, "global_step": 524366, "epoch": 6317} {"train_loss": -27.353910446166992, "global_step": 524367, "epoch": 6317} {"train_loss": -27.600759506225586, "global_step": 524368, "epoch": 6317} {"train_loss": -27.46071434020996, "global_step": 524369, "epoch": 6317} {"train_loss": -27.692584991455078, "global_step": 524370, "epoch": 6317} {"train_loss": -27.482563018798828, "global_step": 524371, "epoch": 6317} {"train_loss": -26.855676651000977, "global_step": 524372, "epoch": 6317} {"train_loss": -27.27113151550293, "global_step": 524373, "epoch": 6317} {"train_loss": -27.47517204284668, "global_step": 524374, "epoch": 6317} {"train_loss": -27.524702072143555, "global_step": 524375, "epoch": 6317} {"train_loss": -27.9685115814209, "global_step": 524376, "epoch": 6317} {"train_loss": -27.144079208374023, "global_step": 524377, "epoch": 6317} {"train_loss": -27.221973419189453, "global_step": 524378, "epoch": 6317} {"train_loss": -27.531147003173828, "global_step": 524379, "epoch": 6317} {"train_loss": -28.01593589782715, "global_step": 524380, "epoch": 6317} {"train_loss": -27.439727783203125, "global_step": 524381, "epoch": 6317} {"train_loss": -27.41852378845215, "global_step": 524382, "epoch": 6317} {"train_loss": -27.410200119018555, "global_step": 524383, "epoch": 6317} {"train_loss": -27.700525283813477, "global_step": 524384, "epoch": 6317} {"train_loss": -27.719318389892578, "global_step": 524385, "epoch": 6317} {"train_loss": -28.009353637695312, "global_step": 524386, "epoch": 6317} {"train_loss": -27.55474853515625, "global_step": 524387, "epoch": 6317} {"train_loss": -27.393049240112305, "global_step": 524388, "epoch": 6317} {"train_loss": -27.47871971130371, "global_step": 524389, "epoch": 6317} {"train_loss": -27.557470321655273, "global_step": 524390, "epoch": 6317} {"train_loss": -27.434412002563477, "global_step": 524391, "epoch": 6317} {"train_loss": -27.964635848999023, "global_step": 524392, "epoch": 6317} {"train_loss": -27.355970819312407, "global_step": 524393, "epoch": 6317, "val_loss": 6697438.5} {"train_loss": -26.772939682006836, "global_step": 524394, "epoch": 6318} {"train_loss": -24.906339645385742, "global_step": 524395, "epoch": 6318} {"train_loss": -26.676427841186523, "global_step": 524396, "epoch": 6318} {"train_loss": -26.57108497619629, "global_step": 524397, "epoch": 6318} {"train_loss": -25.66327476501465, "global_step": 524398, "epoch": 6318} {"train_loss": -26.567270278930664, "global_step": 524399, "epoch": 6318} {"train_loss": -25.759740829467773, "global_step": 524400, "epoch": 6318} {"train_loss": -26.879562377929688, "global_step": 524401, "epoch": 6318} {"train_loss": -26.76786231994629, "global_step": 524402, "epoch": 6318} {"train_loss": -26.276443481445312, "global_step": 524403, "epoch": 6318} {"train_loss": -26.948627471923828, "global_step": 524404, "epoch": 6318} {"train_loss": -27.072370529174805, "global_step": 524405, "epoch": 6318} {"train_loss": -27.35256004333496, "global_step": 524406, "epoch": 6318} {"train_loss": -27.00501823425293, "global_step": 524407, "epoch": 6318} {"train_loss": -27.30585289001465, "global_step": 524408, "epoch": 6318} {"train_loss": -27.633716583251953, "global_step": 524409, "epoch": 6318} {"train_loss": -27.042051315307617, "global_step": 524410, "epoch": 6318} {"train_loss": -27.248550415039062, "global_step": 524411, "epoch": 6318} {"train_loss": -26.818923950195312, "global_step": 524412, "epoch": 6318} {"train_loss": -27.411182403564453, "global_step": 524413, "epoch": 6318} {"train_loss": -27.377004623413086, "global_step": 524414, "epoch": 6318} {"train_loss": -27.366748809814453, "global_step": 524415, "epoch": 6318} {"train_loss": -27.002349853515625, "global_step": 524416, "epoch": 6318} {"train_loss": -27.2252140045166, "global_step": 524417, "epoch": 6318} {"train_loss": -27.13172721862793, "global_step": 524418, "epoch": 6318} {"train_loss": -27.087446212768555, "global_step": 524419, "epoch": 6318} {"train_loss": -27.089298248291016, "global_step": 524420, "epoch": 6318} {"train_loss": -27.427936553955078, "global_step": 524421, "epoch": 6318} {"train_loss": -27.195768356323242, "global_step": 524422, "epoch": 6318} {"train_loss": -27.345563888549805, "global_step": 524423, "epoch": 6318} {"train_loss": -27.54701042175293, "global_step": 524424, "epoch": 6318} {"train_loss": -27.30720329284668, "global_step": 524425, "epoch": 6318} {"train_loss": -27.23069190979004, "global_step": 524426, "epoch": 6318} {"train_loss": -27.32074546813965, "global_step": 524427, "epoch": 6318} {"train_loss": -27.408594131469727, "global_step": 524428, "epoch": 6318} {"train_loss": -27.284759521484375, "global_step": 524429, "epoch": 6318} {"train_loss": -27.66073989868164, "global_step": 524430, "epoch": 6318} {"train_loss": -27.351001739501953, "global_step": 524431, "epoch": 6318} {"train_loss": -27.663257598876953, "global_step": 524432, "epoch": 6318} {"train_loss": -27.893997192382812, "global_step": 524433, "epoch": 6318} {"train_loss": -27.552764892578125, "global_step": 524434, "epoch": 6318} {"train_loss": -27.683258056640625, "global_step": 524435, "epoch": 6318} {"train_loss": -27.56597900390625, "global_step": 524436, "epoch": 6318} {"train_loss": -27.394123077392578, "global_step": 524437, "epoch": 6318} {"train_loss": -27.696014404296875, "global_step": 524438, "epoch": 6318} {"train_loss": -27.43317985534668, "global_step": 524439, "epoch": 6318} {"train_loss": -27.897974014282227, "global_step": 524440, "epoch": 6318} {"train_loss": -27.54971694946289, "global_step": 524441, "epoch": 6318} {"train_loss": -27.958206176757812, "global_step": 524442, "epoch": 6318} {"train_loss": -27.64975357055664, "global_step": 524443, "epoch": 6318} {"train_loss": -27.704452514648438, "global_step": 524444, "epoch": 6318} {"train_loss": -27.73287010192871, "global_step": 524445, "epoch": 6318} {"train_loss": -27.274505615234375, "global_step": 524446, "epoch": 6318} {"train_loss": -26.686248779296875, "global_step": 524447, "epoch": 6318} {"train_loss": -26.770465850830078, "global_step": 524448, "epoch": 6318} {"train_loss": -27.230270385742188, "global_step": 524449, "epoch": 6318} {"train_loss": -27.572004318237305, "global_step": 524450, "epoch": 6318} {"train_loss": -27.36661720275879, "global_step": 524451, "epoch": 6318} {"train_loss": -27.1081485748291, "global_step": 524452, "epoch": 6318} {"train_loss": -27.246891021728516, "global_step": 524453, "epoch": 6318} {"train_loss": -27.37737464904785, "global_step": 524454, "epoch": 6318} {"train_loss": -27.159656524658203, "global_step": 524455, "epoch": 6318} {"train_loss": -27.00263023376465, "global_step": 524456, "epoch": 6318} {"train_loss": -27.1649112701416, "global_step": 524457, "epoch": 6318} {"train_loss": -27.409345626831055, "global_step": 524458, "epoch": 6318} {"train_loss": -27.33829689025879, "global_step": 524459, "epoch": 6318} {"train_loss": -27.281330108642578, "global_step": 524460, "epoch": 6318} {"train_loss": -27.29737663269043, "global_step": 524461, "epoch": 6318} {"train_loss": -26.960315704345703, "global_step": 524462, "epoch": 6318} {"train_loss": -27.18987464904785, "global_step": 524463, "epoch": 6318} {"train_loss": -27.5178165435791, "global_step": 524464, "epoch": 6318} {"train_loss": -27.694971084594727, "global_step": 524465, "epoch": 6318} {"train_loss": -27.436120986938477, "global_step": 524466, "epoch": 6318} {"train_loss": -27.176183700561523, "global_step": 524467, "epoch": 6318} {"train_loss": -26.975690841674805, "global_step": 524468, "epoch": 6318} {"train_loss": -27.508981704711914, "global_step": 524469, "epoch": 6318} {"train_loss": -27.495330810546875, "global_step": 524470, "epoch": 6318} {"train_loss": -27.127073287963867, "global_step": 524471, "epoch": 6318} {"train_loss": -27.836523056030273, "global_step": 524472, "epoch": 6318} {"train_loss": -27.213150024414062, "global_step": 524473, "epoch": 6318} {"train_loss": -27.43715476989746, "global_step": 524474, "epoch": 6318} {"train_loss": -27.644947052001953, "global_step": 524475, "epoch": 6318} {"train_loss": -27.241986607930745, "global_step": 524476, "epoch": 6318, "val_loss": 6668754.0} {"train_loss": -26.5872802734375, "global_step": 524477, "epoch": 6319} {"train_loss": -27.168272018432617, "global_step": 524478, "epoch": 6319} {"train_loss": -26.77566909790039, "global_step": 524479, "epoch": 6319} {"train_loss": -26.94015884399414, "global_step": 524480, "epoch": 6319} {"train_loss": -27.32801628112793, "global_step": 524481, "epoch": 6319} {"train_loss": -27.187183380126953, "global_step": 524482, "epoch": 6319} {"train_loss": -26.91724967956543, "global_step": 524483, "epoch": 6319} {"train_loss": -27.372760772705078, "global_step": 524484, "epoch": 6319} {"train_loss": -26.9058780670166, "global_step": 524485, "epoch": 6319} {"train_loss": -27.0881404876709, "global_step": 524486, "epoch": 6319} {"train_loss": -27.02129554748535, "global_step": 524487, "epoch": 6319} {"train_loss": -27.207721710205078, "global_step": 524488, "epoch": 6319} {"train_loss": -27.160486221313477, "global_step": 524489, "epoch": 6319} {"train_loss": -27.173980712890625, "global_step": 524490, "epoch": 6319} {"train_loss": -27.589582443237305, "global_step": 524491, "epoch": 6319} {"train_loss": -27.260364532470703, "global_step": 524492, "epoch": 6319} {"train_loss": -27.37806510925293, "global_step": 524493, "epoch": 6319} {"train_loss": -27.298995971679688, "global_step": 524494, "epoch": 6319} {"train_loss": -27.52259635925293, "global_step": 524495, "epoch": 6319} {"train_loss": -27.437885284423828, "global_step": 524496, "epoch": 6319} {"train_loss": -27.494848251342773, "global_step": 524497, "epoch": 6319} {"train_loss": -27.342390060424805, "global_step": 524498, "epoch": 6319} {"train_loss": -27.525197982788086, "global_step": 524499, "epoch": 6319} {"train_loss": -27.620222091674805, "global_step": 524500, "epoch": 6319} {"train_loss": -27.7232666015625, "global_step": 524501, "epoch": 6319} {"train_loss": -27.72898292541504, "global_step": 524502, "epoch": 6319} {"train_loss": -27.578832626342773, "global_step": 524503, "epoch": 6319} {"train_loss": -27.623212814331055, "global_step": 524504, "epoch": 6319} {"train_loss": -27.826831817626953, "global_step": 524505, "epoch": 6319} {"train_loss": -27.62409782409668, "global_step": 524506, "epoch": 6319} {"train_loss": -27.48908042907715, "global_step": 524507, "epoch": 6319} {"train_loss": -27.161840438842773, "global_step": 524508, "epoch": 6319} {"train_loss": -27.627838134765625, "global_step": 524509, "epoch": 6319} {"train_loss": -27.507526397705078, "global_step": 524510, "epoch": 6319} {"train_loss": -27.678272247314453, "global_step": 524511, "epoch": 6319} {"train_loss": -27.869068145751953, "global_step": 524512, "epoch": 6319} {"train_loss": -27.5659236907959, "global_step": 524513, "epoch": 6319} {"train_loss": -27.457733154296875, "global_step": 524514, "epoch": 6319} {"train_loss": -27.610809326171875, "global_step": 524515, "epoch": 6319} {"train_loss": -28.367151260375977, "global_step": 524516, "epoch": 6319} {"train_loss": -27.45914649963379, "global_step": 524517, "epoch": 6319} {"train_loss": -27.613889694213867, "global_step": 524518, "epoch": 6319} {"train_loss": -27.901655197143555, "global_step": 524519, "epoch": 6319} {"train_loss": -27.655231475830078, "global_step": 524520, "epoch": 6319} {"train_loss": -27.975738525390625, "global_step": 524521, "epoch": 6319} {"train_loss": -27.611608505249023, "global_step": 524522, "epoch": 6319} {"train_loss": -27.996280670166016, "global_step": 524523, "epoch": 6319} {"train_loss": -27.732593536376953, "global_step": 524524, "epoch": 6319} {"train_loss": -27.841617584228516, "global_step": 524525, "epoch": 6319} {"train_loss": -27.6653995513916, "global_step": 524526, "epoch": 6319} {"train_loss": -27.810705184936523, "global_step": 524527, "epoch": 6319} {"train_loss": -27.672290802001953, "global_step": 524528, "epoch": 6319} {"train_loss": -27.8837890625, "global_step": 524529, "epoch": 6319} {"train_loss": -27.996280670166016, "global_step": 524530, "epoch": 6319} {"train_loss": -27.690820693969727, "global_step": 524531, "epoch": 6319} {"train_loss": -27.245569229125977, "global_step": 524532, "epoch": 6319} {"train_loss": -27.66090202331543, "global_step": 524533, "epoch": 6319} {"train_loss": -27.45050048828125, "global_step": 524534, "epoch": 6319} {"train_loss": -27.86543083190918, "global_step": 524535, "epoch": 6319} {"train_loss": -27.596303939819336, "global_step": 524536, "epoch": 6319} {"train_loss": -27.421361923217773, "global_step": 524537, "epoch": 6319} {"train_loss": -27.554656982421875, "global_step": 524538, "epoch": 6319} {"train_loss": -27.259931564331055, "global_step": 524539, "epoch": 6319} {"train_loss": -27.37672996520996, "global_step": 524540, "epoch": 6319} {"train_loss": -27.413211822509766, "global_step": 524541, "epoch": 6319} {"train_loss": -27.854761123657227, "global_step": 524542, "epoch": 6319} {"train_loss": -27.70509147644043, "global_step": 524543, "epoch": 6319} {"train_loss": -27.720911026000977, "global_step": 524544, "epoch": 6319} {"train_loss": -27.470731735229492, "global_step": 524545, "epoch": 6319} {"train_loss": -27.4434814453125, "global_step": 524546, "epoch": 6319} {"train_loss": -27.66948890686035, "global_step": 524547, "epoch": 6319} {"train_loss": -27.70149040222168, "global_step": 524548, "epoch": 6319} {"train_loss": -27.653564453125, "global_step": 524549, "epoch": 6319} {"train_loss": -27.86409568786621, "global_step": 524550, "epoch": 6319} {"train_loss": -27.7706356048584, "global_step": 524551, "epoch": 6319} {"train_loss": -27.68060302734375, "global_step": 524552, "epoch": 6319} {"train_loss": -27.752954483032227, "global_step": 524553, "epoch": 6319} {"train_loss": -27.58597755432129, "global_step": 524554, "epoch": 6319} {"train_loss": -27.944290161132812, "global_step": 524555, "epoch": 6319} {"train_loss": -27.5841064453125, "global_step": 524556, "epoch": 6319} {"train_loss": -28.0336971282959, "global_step": 524557, "epoch": 6319} {"train_loss": -27.94916343688965, "global_step": 524558, "epoch": 6319} {"train_loss": -27.570201712918568, "global_step": 524559, "epoch": 6319, "val_loss": 6643191.0} {"train_loss": -27.28400230407715, "global_step": 524560, "epoch": 6320} {"train_loss": -26.706491470336914, "global_step": 524561, "epoch": 6320} {"train_loss": -27.04803466796875, "global_step": 524562, "epoch": 6320} {"train_loss": -27.243432998657227, "global_step": 524563, "epoch": 6320} {"train_loss": -27.3321475982666, "global_step": 524564, "epoch": 6320} {"train_loss": -26.894758224487305, "global_step": 524565, "epoch": 6320} {"train_loss": -26.950361251831055, "global_step": 524566, "epoch": 6320} {"train_loss": -27.174604415893555, "global_step": 524567, "epoch": 6320} {"train_loss": -27.27997398376465, "global_step": 524568, "epoch": 6320} {"train_loss": -26.98811149597168, "global_step": 524569, "epoch": 6320} {"train_loss": -27.06171226501465, "global_step": 524570, "epoch": 6320} {"train_loss": -27.055007934570312, "global_step": 524571, "epoch": 6320} {"train_loss": -27.158361434936523, "global_step": 524572, "epoch": 6320} {"train_loss": -26.989715576171875, "global_step": 524573, "epoch": 6320} {"train_loss": -27.019821166992188, "global_step": 524574, "epoch": 6320} {"train_loss": -27.28468132019043, "global_step": 524575, "epoch": 6320} {"train_loss": -27.652236938476562, "global_step": 524576, "epoch": 6320} {"train_loss": -27.407514572143555, "global_step": 524577, "epoch": 6320} {"train_loss": -27.30878257751465, "global_step": 524578, "epoch": 6320} {"train_loss": -27.2553653717041, "global_step": 524579, "epoch": 6320} {"train_loss": -27.661609649658203, "global_step": 524580, "epoch": 6320} {"train_loss": -27.42194938659668, "global_step": 524581, "epoch": 6320} {"train_loss": -27.09039306640625, "global_step": 524582, "epoch": 6320} {"train_loss": -27.371747970581055, "global_step": 524583, "epoch": 6320} {"train_loss": -27.553312301635742, "global_step": 524584, "epoch": 6320} {"train_loss": -27.455020904541016, "global_step": 524585, "epoch": 6320} {"train_loss": -27.17559814453125, "global_step": 524586, "epoch": 6320} {"train_loss": -27.677770614624023, "global_step": 524587, "epoch": 6320} {"train_loss": -27.262073516845703, "global_step": 524588, "epoch": 6320} {"train_loss": -27.0920467376709, "global_step": 524589, "epoch": 6320} {"train_loss": -27.872882843017578, "global_step": 524590, "epoch": 6320} {"train_loss": -27.45086669921875, "global_step": 524591, "epoch": 6320} {"train_loss": -27.504901885986328, "global_step": 524592, "epoch": 6320} {"train_loss": -27.23784828186035, "global_step": 524593, "epoch": 6320} {"train_loss": -27.72309684753418, "global_step": 524594, "epoch": 6320} {"train_loss": -27.875837326049805, "global_step": 524595, "epoch": 6320} {"train_loss": -27.69315528869629, "global_step": 524596, "epoch": 6320} {"train_loss": -27.5591983795166, "global_step": 524597, "epoch": 6320} {"train_loss": -27.861093521118164, "global_step": 524598, "epoch": 6320} {"train_loss": -27.740097045898438, "global_step": 524599, "epoch": 6320} {"train_loss": -27.954641342163086, "global_step": 524600, "epoch": 6320} {"train_loss": -27.61065101623535, "global_step": 524601, "epoch": 6320} {"train_loss": -27.912307739257812, "global_step": 524602, "epoch": 6320} {"train_loss": -27.6368465423584, "global_step": 524603, "epoch": 6320} {"train_loss": -27.394702911376953, "global_step": 524604, "epoch": 6320} {"train_loss": -27.418777465820312, "global_step": 524605, "epoch": 6320} {"train_loss": -28.048032760620117, "global_step": 524606, "epoch": 6320} {"train_loss": -28.22649574279785, "global_step": 524607, "epoch": 6320} {"train_loss": -27.680612564086914, "global_step": 524608, "epoch": 6320} {"train_loss": -27.729883193969727, "global_step": 524609, "epoch": 6320} {"train_loss": -27.86358642578125, "global_step": 524610, "epoch": 6320} {"train_loss": -27.945165634155273, "global_step": 524611, "epoch": 6320} {"train_loss": -27.462848663330078, "global_step": 524612, "epoch": 6320} {"train_loss": -27.85723876953125, "global_step": 524613, "epoch": 6320} {"train_loss": -27.775772094726562, "global_step": 524614, "epoch": 6320} {"train_loss": -28.046066284179688, "global_step": 524615, "epoch": 6320} {"train_loss": -27.95338249206543, "global_step": 524616, "epoch": 6320} {"train_loss": -27.49140739440918, "global_step": 524617, "epoch": 6320} {"train_loss": -27.73882484436035, "global_step": 524618, "epoch": 6320} {"train_loss": -27.968555450439453, "global_step": 524619, "epoch": 6320} {"train_loss": -28.15467643737793, "global_step": 524620, "epoch": 6320} {"train_loss": -27.91697120666504, "global_step": 524621, "epoch": 6320} {"train_loss": -28.131338119506836, "global_step": 524622, "epoch": 6320} {"train_loss": -27.360824584960938, "global_step": 524623, "epoch": 6320} {"train_loss": -27.789464950561523, "global_step": 524624, "epoch": 6320} {"train_loss": -27.6049861907959, "global_step": 524625, "epoch": 6320} {"train_loss": -27.921558380126953, "global_step": 524626, "epoch": 6320} {"train_loss": -27.888824462890625, "global_step": 524627, "epoch": 6320} {"train_loss": -27.224365234375, "global_step": 524628, "epoch": 6320} {"train_loss": -27.74683952331543, "global_step": 524629, "epoch": 6320} {"train_loss": -27.521787643432617, "global_step": 524630, "epoch": 6320} {"train_loss": -27.417102813720703, "global_step": 524631, "epoch": 6320} {"train_loss": -27.480310440063477, "global_step": 524632, "epoch": 6320} {"train_loss": -26.567594528198242, "global_step": 524633, "epoch": 6320} {"train_loss": -25.518672943115234, "global_step": 524634, "epoch": 6320} {"train_loss": -24.096481323242188, "global_step": 524635, "epoch": 6320} {"train_loss": -25.20930290222168, "global_step": 524636, "epoch": 6320} {"train_loss": -27.068252563476562, "global_step": 524637, "epoch": 6320} {"train_loss": -26.491994857788086, "global_step": 524638, "epoch": 6320} {"train_loss": -26.203718185424805, "global_step": 524639, "epoch": 6320} {"train_loss": -26.3830509185791, "global_step": 524640, "epoch": 6320} {"train_loss": -27.055755615234375, "global_step": 524641, "epoch": 6320} {"train_loss": -27.34963561827878, "global_step": 524642, "epoch": 6320, "val_loss": 6675087.0} {"train_loss": -26.00860023498535, "global_step": 524643, "epoch": 6321} {"train_loss": -26.40159034729004, "global_step": 524644, "epoch": 6321} {"train_loss": -26.399911880493164, "global_step": 524645, "epoch": 6321} {"train_loss": -26.087148666381836, "global_step": 524646, "epoch": 6321} {"train_loss": -26.36396598815918, "global_step": 524647, "epoch": 6321} {"train_loss": -26.11210060119629, "global_step": 524648, "epoch": 6321} {"train_loss": -26.4703311920166, "global_step": 524649, "epoch": 6321} {"train_loss": -26.340993881225586, "global_step": 524650, "epoch": 6321} {"train_loss": -26.401107788085938, "global_step": 524651, "epoch": 6321} {"train_loss": -26.547290802001953, "global_step": 524652, "epoch": 6321} {"train_loss": -26.64911460876465, "global_step": 524653, "epoch": 6321} {"train_loss": -26.758167266845703, "global_step": 524654, "epoch": 6321} {"train_loss": -26.926898956298828, "global_step": 524655, "epoch": 6321} {"train_loss": -26.6577205657959, "global_step": 524656, "epoch": 6321} {"train_loss": -26.924657821655273, "global_step": 524657, "epoch": 6321} {"train_loss": -26.659818649291992, "global_step": 524658, "epoch": 6321} {"train_loss": -26.75428581237793, "global_step": 524659, "epoch": 6321} {"train_loss": -27.13800048828125, "global_step": 524660, "epoch": 6321} {"train_loss": -27.1167049407959, "global_step": 524661, "epoch": 6321} {"train_loss": -27.00286293029785, "global_step": 524662, "epoch": 6321} {"train_loss": -27.15070152282715, "global_step": 524663, "epoch": 6321} {"train_loss": -26.668304443359375, "global_step": 524664, "epoch": 6321} {"train_loss": -26.861310958862305, "global_step": 524665, "epoch": 6321} {"train_loss": -27.011560440063477, "global_step": 524666, "epoch": 6321} {"train_loss": -27.233783721923828, "global_step": 524667, "epoch": 6321} {"train_loss": -27.34124183654785, "global_step": 524668, "epoch": 6321} {"train_loss": -27.222522735595703, "global_step": 524669, "epoch": 6321} {"train_loss": -27.09613609313965, "global_step": 524670, "epoch": 6321} {"train_loss": -27.108661651611328, "global_step": 524671, "epoch": 6321} {"train_loss": -27.431684494018555, "global_step": 524672, "epoch": 6321} {"train_loss": -27.53679847717285, "global_step": 524673, "epoch": 6321} {"train_loss": -27.60941505432129, "global_step": 524674, "epoch": 6321} {"train_loss": -27.453367233276367, "global_step": 524675, "epoch": 6321} {"train_loss": -27.4675350189209, "global_step": 524676, "epoch": 6321} {"train_loss": -27.452529907226562, "global_step": 524677, "epoch": 6321} {"train_loss": -27.614429473876953, "global_step": 524678, "epoch": 6321} {"train_loss": -27.80475425720215, "global_step": 524679, "epoch": 6321} {"train_loss": -27.120624542236328, "global_step": 524680, "epoch": 6321} {"train_loss": -27.457433700561523, "global_step": 524681, "epoch": 6321} {"train_loss": -27.5666446685791, "global_step": 524682, "epoch": 6321} {"train_loss": -27.597461700439453, "global_step": 524683, "epoch": 6321} {"train_loss": -27.52204704284668, "global_step": 524684, "epoch": 6321} {"train_loss": -27.532377243041992, "global_step": 524685, "epoch": 6321} {"train_loss": -27.439619064331055, "global_step": 524686, "epoch": 6321} {"train_loss": -27.421146392822266, "global_step": 524687, "epoch": 6321} {"train_loss": -27.540563583374023, "global_step": 524688, "epoch": 6321} {"train_loss": -27.517227172851562, "global_step": 524689, "epoch": 6321} {"train_loss": -27.519012451171875, "global_step": 524690, "epoch": 6321} {"train_loss": -27.524621963500977, "global_step": 524691, "epoch": 6321} {"train_loss": -28.010498046875, "global_step": 524692, "epoch": 6321} {"train_loss": -27.92044448852539, "global_step": 524693, "epoch": 6321} {"train_loss": -27.736433029174805, "global_step": 524694, "epoch": 6321} {"train_loss": -27.780920028686523, "global_step": 524695, "epoch": 6321} {"train_loss": -27.73360252380371, "global_step": 524696, "epoch": 6321} {"train_loss": -27.136938095092773, "global_step": 524697, "epoch": 6321} {"train_loss": -27.84503173828125, "global_step": 524698, "epoch": 6321} {"train_loss": -27.935504913330078, "global_step": 524699, "epoch": 6321} {"train_loss": -27.658615112304688, "global_step": 524700, "epoch": 6321} {"train_loss": -27.5346736907959, "global_step": 524701, "epoch": 6321} {"train_loss": -27.559814453125, "global_step": 524702, "epoch": 6321} {"train_loss": -27.572072982788086, "global_step": 524703, "epoch": 6321} {"train_loss": -27.538061141967773, "global_step": 524704, "epoch": 6321} {"train_loss": -27.580549240112305, "global_step": 524705, "epoch": 6321} {"train_loss": -27.787322998046875, "global_step": 524706, "epoch": 6321} {"train_loss": -27.57789421081543, "global_step": 524707, "epoch": 6321} {"train_loss": -27.315048217773438, "global_step": 524708, "epoch": 6321} {"train_loss": -27.419965744018555, "global_step": 524709, "epoch": 6321} {"train_loss": -27.650104522705078, "global_step": 524710, "epoch": 6321} {"train_loss": -27.380651473999023, "global_step": 524711, "epoch": 6321} {"train_loss": -27.283920288085938, "global_step": 524712, "epoch": 6321} {"train_loss": -27.71347999572754, "global_step": 524713, "epoch": 6321} {"train_loss": -27.766645431518555, "global_step": 524714, "epoch": 6321} {"train_loss": -27.425537109375, "global_step": 524715, "epoch": 6321} {"train_loss": -27.669347763061523, "global_step": 524716, "epoch": 6321} {"train_loss": -27.97211265563965, "global_step": 524717, "epoch": 6321} {"train_loss": -27.44364356994629, "global_step": 524718, "epoch": 6321} {"train_loss": -27.259923934936523, "global_step": 524719, "epoch": 6321} {"train_loss": -28.015247344970703, "global_step": 524720, "epoch": 6321} {"train_loss": -27.346372604370117, "global_step": 524721, "epoch": 6321} {"train_loss": -27.788522720336914, "global_step": 524722, "epoch": 6321} {"train_loss": -27.55335807800293, "global_step": 524723, "epoch": 6321} {"train_loss": -27.652124404907227, "global_step": 524724, "epoch": 6321} {"train_loss": -27.296298590051123, "global_step": 524725, "epoch": 6321, "val_loss": 6621864.0} {"train_loss": -26.759765625, "global_step": 524726, "epoch": 6322} {"train_loss": -27.510889053344727, "global_step": 524727, "epoch": 6322} {"train_loss": -27.36331558227539, "global_step": 524728, "epoch": 6322} {"train_loss": -27.030431747436523, "global_step": 524729, "epoch": 6322} {"train_loss": -27.631973266601562, "global_step": 524730, "epoch": 6322} {"train_loss": -27.0824031829834, "global_step": 524731, "epoch": 6322} {"train_loss": -26.54636573791504, "global_step": 524732, "epoch": 6322} {"train_loss": -26.927337646484375, "global_step": 524733, "epoch": 6322} {"train_loss": -27.3391056060791, "global_step": 524734, "epoch": 6322} {"train_loss": -27.358112335205078, "global_step": 524735, "epoch": 6322} {"train_loss": -27.442352294921875, "global_step": 524736, "epoch": 6322} {"train_loss": -27.458011627197266, "global_step": 524737, "epoch": 6322} {"train_loss": -27.197790145874023, "global_step": 524738, "epoch": 6322} {"train_loss": -27.416828155517578, "global_step": 524739, "epoch": 6322} {"train_loss": -27.2940616607666, "global_step": 524740, "epoch": 6322} {"train_loss": -27.06855583190918, "global_step": 524741, "epoch": 6322} {"train_loss": -27.332700729370117, "global_step": 524742, "epoch": 6322} {"train_loss": -27.515399932861328, "global_step": 524743, "epoch": 6322} {"train_loss": -27.561737060546875, "global_step": 524744, "epoch": 6322} {"train_loss": -27.513111114501953, "global_step": 524745, "epoch": 6322} {"train_loss": -27.05289649963379, "global_step": 524746, "epoch": 6322} {"train_loss": -27.374771118164062, "global_step": 524747, "epoch": 6322} {"train_loss": -27.580127716064453, "global_step": 524748, "epoch": 6322} {"train_loss": -27.89253044128418, "global_step": 524749, "epoch": 6322} {"train_loss": -27.28850746154785, "global_step": 524750, "epoch": 6322} {"train_loss": -27.703710556030273, "global_step": 524751, "epoch": 6322} {"train_loss": -27.680286407470703, "global_step": 524752, "epoch": 6322} {"train_loss": -27.760574340820312, "global_step": 524753, "epoch": 6322} {"train_loss": -27.6879940032959, "global_step": 524754, "epoch": 6322} {"train_loss": -27.204004287719727, "global_step": 524755, "epoch": 6322} {"train_loss": -27.46282958984375, "global_step": 524756, "epoch": 6322} {"train_loss": -27.287878036499023, "global_step": 524757, "epoch": 6322} {"train_loss": -27.676349639892578, "global_step": 524758, "epoch": 6322} {"train_loss": -27.60479164123535, "global_step": 524759, "epoch": 6322} {"train_loss": -27.682987213134766, "global_step": 524760, "epoch": 6322} {"train_loss": -27.7949161529541, "global_step": 524761, "epoch": 6322} {"train_loss": -27.45624351501465, "global_step": 524762, "epoch": 6322} {"train_loss": -28.43119239807129, "global_step": 524763, "epoch": 6322} {"train_loss": -27.9938907623291, "global_step": 524764, "epoch": 6322} {"train_loss": -27.453840255737305, "global_step": 524765, "epoch": 6322} {"train_loss": -27.523700714111328, "global_step": 524766, "epoch": 6322} {"train_loss": -27.292200088500977, "global_step": 524767, "epoch": 6322} {"train_loss": -27.383047103881836, "global_step": 524768, "epoch": 6322} {"train_loss": -27.501386642456055, "global_step": 524769, "epoch": 6322} {"train_loss": -27.741422653198242, "global_step": 524770, "epoch": 6322} {"train_loss": -27.536184310913086, "global_step": 524771, "epoch": 6322} {"train_loss": -27.22669792175293, "global_step": 524772, "epoch": 6322} {"train_loss": -27.59494400024414, "global_step": 524773, "epoch": 6322} {"train_loss": -27.57423210144043, "global_step": 524774, "epoch": 6322} {"train_loss": -27.540647506713867, "global_step": 524775, "epoch": 6322} {"train_loss": -27.92408561706543, "global_step": 524776, "epoch": 6322} {"train_loss": -27.925373077392578, "global_step": 524777, "epoch": 6322} {"train_loss": -27.500547409057617, "global_step": 524778, "epoch": 6322} {"train_loss": -27.698118209838867, "global_step": 524779, "epoch": 6322} {"train_loss": -27.883014678955078, "global_step": 524780, "epoch": 6322} {"train_loss": -27.759845733642578, "global_step": 524781, "epoch": 6322} {"train_loss": -28.062061309814453, "global_step": 524782, "epoch": 6322} {"train_loss": -28.02277946472168, "global_step": 524783, "epoch": 6322} {"train_loss": -27.688196182250977, "global_step": 524784, "epoch": 6322} {"train_loss": -28.033706665039062, "global_step": 524785, "epoch": 6322} {"train_loss": -27.856367111206055, "global_step": 524786, "epoch": 6322} {"train_loss": -27.63747215270996, "global_step": 524787, "epoch": 6322} {"train_loss": -27.424549102783203, "global_step": 524788, "epoch": 6322} {"train_loss": -27.392648696899414, "global_step": 524789, "epoch": 6322} {"train_loss": -27.639677047729492, "global_step": 524790, "epoch": 6322} {"train_loss": -27.6185245513916, "global_step": 524791, "epoch": 6322} {"train_loss": -27.31070327758789, "global_step": 524792, "epoch": 6322} {"train_loss": -27.883390426635742, "global_step": 524793, "epoch": 6322} {"train_loss": -27.7469425201416, "global_step": 524794, "epoch": 6322} {"train_loss": -27.17435646057129, "global_step": 524795, "epoch": 6322} {"train_loss": -27.268163681030273, "global_step": 524796, "epoch": 6322} {"train_loss": -26.949438095092773, "global_step": 524797, "epoch": 6322} {"train_loss": -26.471174240112305, "global_step": 524798, "epoch": 6322} {"train_loss": -27.214807510375977, "global_step": 524799, "epoch": 6322} {"train_loss": -27.521665573120117, "global_step": 524800, "epoch": 6322} {"train_loss": -26.65388298034668, "global_step": 524801, "epoch": 6322} {"train_loss": -26.7849178314209, "global_step": 524802, "epoch": 6322} {"train_loss": -27.38960075378418, "global_step": 524803, "epoch": 6322} {"train_loss": -27.04317283630371, "global_step": 524804, "epoch": 6322} {"train_loss": -27.025196075439453, "global_step": 524805, "epoch": 6322} {"train_loss": -27.154254913330078, "global_step": 524806, "epoch": 6322} {"train_loss": -27.327701568603516, "global_step": 524807, "epoch": 6322} {"train_loss": -27.45669737206884, "global_step": 524808, "epoch": 6322, "val_loss": 6616084.0} {"train_loss": -26.21107292175293, "global_step": 524809, "epoch": 6323} {"train_loss": -26.066373825073242, "global_step": 524810, "epoch": 6323} {"train_loss": -26.8083553314209, "global_step": 524811, "epoch": 6323} {"train_loss": -26.514724731445312, "global_step": 524812, "epoch": 6323} {"train_loss": -27.08013916015625, "global_step": 524813, "epoch": 6323} {"train_loss": -26.84458351135254, "global_step": 524814, "epoch": 6323} {"train_loss": -26.666288375854492, "global_step": 524815, "epoch": 6323} {"train_loss": -26.523681640625, "global_step": 524816, "epoch": 6323} {"train_loss": -27.0001277923584, "global_step": 524817, "epoch": 6323} {"train_loss": -26.96892738342285, "global_step": 524818, "epoch": 6323} {"train_loss": -27.02838134765625, "global_step": 524819, "epoch": 6323} {"train_loss": -27.138837814331055, "global_step": 524820, "epoch": 6323} {"train_loss": -27.202573776245117, "global_step": 524821, "epoch": 6323} {"train_loss": -27.02337074279785, "global_step": 524822, "epoch": 6323} {"train_loss": -27.008331298828125, "global_step": 524823, "epoch": 6323} {"train_loss": -27.07084083557129, "global_step": 524824, "epoch": 6323} {"train_loss": -27.33588981628418, "global_step": 524825, "epoch": 6323} {"train_loss": -27.027332305908203, "global_step": 524826, "epoch": 6323} {"train_loss": -27.15546989440918, "global_step": 524827, "epoch": 6323} {"train_loss": -27.158370971679688, "global_step": 524828, "epoch": 6323} {"train_loss": -27.31442642211914, "global_step": 524829, "epoch": 6323} {"train_loss": -27.319931030273438, "global_step": 524830, "epoch": 6323} {"train_loss": -27.198827743530273, "global_step": 524831, "epoch": 6323} {"train_loss": -27.297199249267578, "global_step": 524832, "epoch": 6323} {"train_loss": -27.278018951416016, "global_step": 524833, "epoch": 6323} {"train_loss": -27.150150299072266, "global_step": 524834, "epoch": 6323} {"train_loss": -27.478687286376953, "global_step": 524835, "epoch": 6323} {"train_loss": -27.388315200805664, "global_step": 524836, "epoch": 6323} {"train_loss": -27.4150333404541, "global_step": 524837, "epoch": 6323} {"train_loss": -27.426664352416992, "global_step": 524838, "epoch": 6323} {"train_loss": -27.80661964416504, "global_step": 524839, "epoch": 6323} {"train_loss": -27.774763107299805, "global_step": 524840, "epoch": 6323} {"train_loss": -27.683008193969727, "global_step": 524841, "epoch": 6323} {"train_loss": -27.317899703979492, "global_step": 524842, "epoch": 6323} {"train_loss": -27.67367935180664, "global_step": 524843, "epoch": 6323} {"train_loss": -27.60796546936035, "global_step": 524844, "epoch": 6323} {"train_loss": -27.83096694946289, "global_step": 524845, "epoch": 6323} {"train_loss": -27.570789337158203, "global_step": 524846, "epoch": 6323} {"train_loss": -27.401294708251953, "global_step": 524847, "epoch": 6323} {"train_loss": -27.592304229736328, "global_step": 524848, "epoch": 6323} {"train_loss": -27.442901611328125, "global_step": 524849, "epoch": 6323} {"train_loss": -27.155271530151367, "global_step": 524850, "epoch": 6323} {"train_loss": -27.65443992614746, "global_step": 524851, "epoch": 6323} {"train_loss": -27.547643661499023, "global_step": 524852, "epoch": 6323} {"train_loss": -27.669265747070312, "global_step": 524853, "epoch": 6323} {"train_loss": -27.73346519470215, "global_step": 524854, "epoch": 6323} {"train_loss": -27.971759796142578, "global_step": 524855, "epoch": 6323} {"train_loss": -27.611343383789062, "global_step": 524856, "epoch": 6323} {"train_loss": -27.6415958404541, "global_step": 524857, "epoch": 6323} {"train_loss": -27.37444496154785, "global_step": 524858, "epoch": 6323} {"train_loss": -27.58186149597168, "global_step": 524859, "epoch": 6323} {"train_loss": -27.83734130859375, "global_step": 524860, "epoch": 6323} {"train_loss": -27.829893112182617, "global_step": 524861, "epoch": 6323} {"train_loss": -27.812854766845703, "global_step": 524862, "epoch": 6323} {"train_loss": -27.60462760925293, "global_step": 524863, "epoch": 6323} {"train_loss": -28.0661678314209, "global_step": 524864, "epoch": 6323} {"train_loss": -27.664228439331055, "global_step": 524865, "epoch": 6323} {"train_loss": -27.98023796081543, "global_step": 524866, "epoch": 6323} {"train_loss": -27.674341201782227, "global_step": 524867, "epoch": 6323} {"train_loss": -28.102619171142578, "global_step": 524868, "epoch": 6323} {"train_loss": -27.67341423034668, "global_step": 524869, "epoch": 6323} {"train_loss": -27.946365356445312, "global_step": 524870, "epoch": 6323} {"train_loss": -27.58310890197754, "global_step": 524871, "epoch": 6323} {"train_loss": -27.530786514282227, "global_step": 524872, "epoch": 6323} {"train_loss": -27.279830932617188, "global_step": 524873, "epoch": 6323} {"train_loss": -27.474369049072266, "global_step": 524874, "epoch": 6323} {"train_loss": -26.940214157104492, "global_step": 524875, "epoch": 6323} {"train_loss": -26.343286514282227, "global_step": 524876, "epoch": 6323} {"train_loss": -26.355438232421875, "global_step": 524877, "epoch": 6323} {"train_loss": -26.19991111755371, "global_step": 524878, "epoch": 6323} {"train_loss": -25.792484283447266, "global_step": 524879, "epoch": 6323} {"train_loss": -26.386999130249023, "global_step": 524880, "epoch": 6323} {"train_loss": -27.367050170898438, "global_step": 524881, "epoch": 6323} {"train_loss": -27.219009399414062, "global_step": 524882, "epoch": 6323} {"train_loss": -27.09284782409668, "global_step": 524883, "epoch": 6323} {"train_loss": -27.17213249206543, "global_step": 524884, "epoch": 6323} {"train_loss": -27.18549919128418, "global_step": 524885, "epoch": 6323} {"train_loss": -27.007343292236328, "global_step": 524886, "epoch": 6323} {"train_loss": -27.27298927307129, "global_step": 524887, "epoch": 6323} {"train_loss": -26.851852416992188, "global_step": 524888, "epoch": 6323} {"train_loss": -27.49755859375, "global_step": 524889, "epoch": 6323} {"train_loss": -27.20863151550293, "global_step": 524890, "epoch": 6323} {"train_loss": -27.277098828051464, "global_step": 524891, "epoch": 6323, "val_loss": 6601850.0} {"train_loss": -27.19736671447754, "global_step": 524892, "epoch": 6324} {"train_loss": -26.790130615234375, "global_step": 524893, "epoch": 6324} {"train_loss": -26.86036491394043, "global_step": 524894, "epoch": 6324} {"train_loss": -27.469594955444336, "global_step": 524895, "epoch": 6324} {"train_loss": -27.079914093017578, "global_step": 524896, "epoch": 6324} {"train_loss": -26.8868465423584, "global_step": 524897, "epoch": 6324} {"train_loss": -27.01654052734375, "global_step": 524898, "epoch": 6324} {"train_loss": -27.4499454498291, "global_step": 524899, "epoch": 6324} {"train_loss": -27.310047149658203, "global_step": 524900, "epoch": 6324} {"train_loss": -27.411924362182617, "global_step": 524901, "epoch": 6324} {"train_loss": -27.271360397338867, "global_step": 524902, "epoch": 6324} {"train_loss": -27.47968101501465, "global_step": 524903, "epoch": 6324} {"train_loss": -26.9016170501709, "global_step": 524904, "epoch": 6324} {"train_loss": -27.01129722595215, "global_step": 524905, "epoch": 6324} {"train_loss": -27.43178367614746, "global_step": 524906, "epoch": 6324} {"train_loss": -27.647573471069336, "global_step": 524907, "epoch": 6324} {"train_loss": -26.963565826416016, "global_step": 524908, "epoch": 6324} {"train_loss": -27.170989990234375, "global_step": 524909, "epoch": 6324} {"train_loss": -27.395139694213867, "global_step": 524910, "epoch": 6324} {"train_loss": -27.390033721923828, "global_step": 524911, "epoch": 6324} {"train_loss": -27.561132431030273, "global_step": 524912, "epoch": 6324} {"train_loss": -27.28291130065918, "global_step": 524913, "epoch": 6324} {"train_loss": -27.392536163330078, "global_step": 524914, "epoch": 6324} {"train_loss": -27.681997299194336, "global_step": 524915, "epoch": 6324} {"train_loss": -27.503217697143555, "global_step": 524916, "epoch": 6324} {"train_loss": -27.69775390625, "global_step": 524917, "epoch": 6324} {"train_loss": -27.42921257019043, "global_step": 524918, "epoch": 6324} {"train_loss": -27.720911026000977, "global_step": 524919, "epoch": 6324} {"train_loss": -27.515722274780273, "global_step": 524920, "epoch": 6324} {"train_loss": -27.561487197875977, "global_step": 524921, "epoch": 6324} {"train_loss": -27.492517471313477, "global_step": 524922, "epoch": 6324} {"train_loss": -27.545642852783203, "global_step": 524923, "epoch": 6324} {"train_loss": -27.599578857421875, "global_step": 524924, "epoch": 6324} {"train_loss": -27.810728073120117, "global_step": 524925, "epoch": 6324} {"train_loss": -27.59394645690918, "global_step": 524926, "epoch": 6324} {"train_loss": -27.3546142578125, "global_step": 524927, "epoch": 6324} {"train_loss": -27.59393310546875, "global_step": 524928, "epoch": 6324} {"train_loss": -27.484128952026367, "global_step": 524929, "epoch": 6324} {"train_loss": -27.71087074279785, "global_step": 524930, "epoch": 6324} {"train_loss": -27.98711585998535, "global_step": 524931, "epoch": 6324} {"train_loss": -27.26773452758789, "global_step": 524932, "epoch": 6324} {"train_loss": -27.721908569335938, "global_step": 524933, "epoch": 6324} {"train_loss": -27.995288848876953, "global_step": 524934, "epoch": 6324} {"train_loss": -27.63551902770996, "global_step": 524935, "epoch": 6324} {"train_loss": -27.469125747680664, "global_step": 524936, "epoch": 6324} {"train_loss": -27.527013778686523, "global_step": 524937, "epoch": 6324} {"train_loss": -27.81340980529785, "global_step": 524938, "epoch": 6324} {"train_loss": -28.05552101135254, "global_step": 524939, "epoch": 6324} {"train_loss": -28.049177169799805, "global_step": 524940, "epoch": 6324} {"train_loss": -27.626672744750977, "global_step": 524941, "epoch": 6324} {"train_loss": -28.108549118041992, "global_step": 524942, "epoch": 6324} {"train_loss": -27.500732421875, "global_step": 524943, "epoch": 6324} {"train_loss": -27.557540893554688, "global_step": 524944, "epoch": 6324} {"train_loss": -27.704633712768555, "global_step": 524945, "epoch": 6324} {"train_loss": -27.8072509765625, "global_step": 524946, "epoch": 6324} {"train_loss": -27.67292594909668, "global_step": 524947, "epoch": 6324} {"train_loss": -27.8012752532959, "global_step": 524948, "epoch": 6324} {"train_loss": -27.72053337097168, "global_step": 524949, "epoch": 6324} {"train_loss": -28.20290184020996, "global_step": 524950, "epoch": 6324} {"train_loss": -27.533716201782227, "global_step": 524951, "epoch": 6324} {"train_loss": -27.856616973876953, "global_step": 524952, "epoch": 6324} {"train_loss": -27.793567657470703, "global_step": 524953, "epoch": 6324} {"train_loss": -27.81056785583496, "global_step": 524954, "epoch": 6324} {"train_loss": -27.756256103515625, "global_step": 524955, "epoch": 6324} {"train_loss": -27.71160316467285, "global_step": 524956, "epoch": 6324} {"train_loss": -27.47035026550293, "global_step": 524957, "epoch": 6324} {"train_loss": -27.4468936920166, "global_step": 524958, "epoch": 6324} {"train_loss": -27.81270408630371, "global_step": 524959, "epoch": 6324} {"train_loss": -27.978681564331055, "global_step": 524960, "epoch": 6324} {"train_loss": -27.6484375, "global_step": 524961, "epoch": 6324} {"train_loss": -27.495981216430664, "global_step": 524962, "epoch": 6324} {"train_loss": -27.686817169189453, "global_step": 524963, "epoch": 6324} {"train_loss": -27.78403663635254, "global_step": 524964, "epoch": 6324} {"train_loss": -27.722003936767578, "global_step": 524965, "epoch": 6324} {"train_loss": -27.03400993347168, "global_step": 524966, "epoch": 6324} {"train_loss": -26.570510864257812, "global_step": 524967, "epoch": 6324} {"train_loss": -26.87965202331543, "global_step": 524968, "epoch": 6324} {"train_loss": -27.054676055908203, "global_step": 524969, "epoch": 6324} {"train_loss": -27.19668960571289, "global_step": 524970, "epoch": 6324} {"train_loss": -27.599302291870117, "global_step": 524971, "epoch": 6324} {"train_loss": -27.523107528686523, "global_step": 524972, "epoch": 6324} {"train_loss": -27.141340255737305, "global_step": 524973, "epoch": 6324} {"train_loss": -27.49792779210102, "global_step": 524974, "epoch": 6324, "val_loss": 6627734.0} {"train_loss": -26.51702880859375, "global_step": 524975, "epoch": 6325} {"train_loss": -27.107725143432617, "global_step": 524976, "epoch": 6325} {"train_loss": -26.756195068359375, "global_step": 524977, "epoch": 6325} {"train_loss": -26.650253295898438, "global_step": 524978, "epoch": 6325} {"train_loss": -26.14694595336914, "global_step": 524979, "epoch": 6325} {"train_loss": -26.273542404174805, "global_step": 524980, "epoch": 6325} {"train_loss": -26.358556747436523, "global_step": 524981, "epoch": 6325} {"train_loss": -26.663818359375, "global_step": 524982, "epoch": 6325} {"train_loss": -26.790307998657227, "global_step": 524983, "epoch": 6325} {"train_loss": -27.004438400268555, "global_step": 524984, "epoch": 6325} {"train_loss": -27.54363441467285, "global_step": 524985, "epoch": 6325} {"train_loss": -27.176715850830078, "global_step": 524986, "epoch": 6325} {"train_loss": -27.10032081604004, "global_step": 524987, "epoch": 6325} {"train_loss": -27.168582916259766, "global_step": 524988, "epoch": 6325} {"train_loss": -26.931371688842773, "global_step": 524989, "epoch": 6325} {"train_loss": -27.260629653930664, "global_step": 524990, "epoch": 6325} {"train_loss": -27.10603141784668, "global_step": 524991, "epoch": 6325} {"train_loss": -27.388498306274414, "global_step": 524992, "epoch": 6325} {"train_loss": -26.98829460144043, "global_step": 524993, "epoch": 6325} {"train_loss": -27.337509155273438, "global_step": 524994, "epoch": 6325} {"train_loss": -26.866958618164062, "global_step": 524995, "epoch": 6325} {"train_loss": -27.166345596313477, "global_step": 524996, "epoch": 6325} {"train_loss": -27.36557388305664, "global_step": 524997, "epoch": 6325} {"train_loss": -27.1882266998291, "global_step": 524998, "epoch": 6325} {"train_loss": -27.19120216369629, "global_step": 524999, "epoch": 6325} {"train_loss": -27.366931915283203, "global_step": 525000, "epoch": 6325} {"train_loss": -27.46156120300293, "global_step": 525001, "epoch": 6325} {"train_loss": -27.347620010375977, "global_step": 525002, "epoch": 6325} {"train_loss": -27.700448989868164, "global_step": 525003, "epoch": 6325} {"train_loss": -27.183944702148438, "global_step": 525004, "epoch": 6325} {"train_loss": -27.327741622924805, "global_step": 525005, "epoch": 6325} {"train_loss": -27.09197425842285, "global_step": 525006, "epoch": 6325} {"train_loss": -27.892011642456055, "global_step": 525007, "epoch": 6325} {"train_loss": -27.854902267456055, "global_step": 525008, "epoch": 6325} {"train_loss": -27.42544937133789, "global_step": 525009, "epoch": 6325} {"train_loss": -27.61090087890625, "global_step": 525010, "epoch": 6325} {"train_loss": -27.38394546508789, "global_step": 525011, "epoch": 6325} {"train_loss": -27.30868911743164, "global_step": 525012, "epoch": 6325} {"train_loss": -27.4600830078125, "global_step": 525013, "epoch": 6325} {"train_loss": -27.691247940063477, "global_step": 525014, "epoch": 6325} {"train_loss": -27.485538482666016, "global_step": 525015, "epoch": 6325} {"train_loss": -27.554967880249023, "global_step": 525016, "epoch": 6325} {"train_loss": -27.29102897644043, "global_step": 525017, "epoch": 6325} {"train_loss": -27.5120792388916, "global_step": 525018, "epoch": 6325} {"train_loss": -27.672931671142578, "global_step": 525019, "epoch": 6325} {"train_loss": -27.987903594970703, "global_step": 525020, "epoch": 6325} {"train_loss": -27.465560913085938, "global_step": 525021, "epoch": 6325} {"train_loss": -27.97529411315918, "global_step": 525022, "epoch": 6325} {"train_loss": -27.546222686767578, "global_step": 525023, "epoch": 6325} {"train_loss": -27.763446807861328, "global_step": 525024, "epoch": 6325} {"train_loss": -27.745939254760742, "global_step": 525025, "epoch": 6325} {"train_loss": -27.73593521118164, "global_step": 525026, "epoch": 6325} {"train_loss": -27.44928550720215, "global_step": 525027, "epoch": 6325} {"train_loss": -27.714487075805664, "global_step": 525028, "epoch": 6325} {"train_loss": -27.719385147094727, "global_step": 525029, "epoch": 6325} {"train_loss": -27.578306198120117, "global_step": 525030, "epoch": 6325} {"train_loss": -27.942190170288086, "global_step": 525031, "epoch": 6325} {"train_loss": -27.7238712310791, "global_step": 525032, "epoch": 6325} {"train_loss": -27.609540939331055, "global_step": 525033, "epoch": 6325} {"train_loss": -27.5919246673584, "global_step": 525034, "epoch": 6325} {"train_loss": -27.44586753845215, "global_step": 525035, "epoch": 6325} {"train_loss": -27.604150772094727, "global_step": 525036, "epoch": 6325} {"train_loss": -27.318801879882812, "global_step": 525037, "epoch": 6325} {"train_loss": -27.440155029296875, "global_step": 525038, "epoch": 6325} {"train_loss": -27.5239315032959, "global_step": 525039, "epoch": 6325} {"train_loss": -27.322376251220703, "global_step": 525040, "epoch": 6325} {"train_loss": -27.483997344970703, "global_step": 525041, "epoch": 6325} {"train_loss": -27.448999404907227, "global_step": 525042, "epoch": 6325} {"train_loss": -27.752111434936523, "global_step": 525043, "epoch": 6325} {"train_loss": -27.3990478515625, "global_step": 525044, "epoch": 6325} {"train_loss": -27.61496353149414, "global_step": 525045, "epoch": 6325} {"train_loss": -27.3438777923584, "global_step": 525046, "epoch": 6325} {"train_loss": -27.257314682006836, "global_step": 525047, "epoch": 6325} {"train_loss": -27.28374671936035, "global_step": 525048, "epoch": 6325} {"train_loss": -27.469287872314453, "global_step": 525049, "epoch": 6325} {"train_loss": -27.026660919189453, "global_step": 525050, "epoch": 6325} {"train_loss": -27.5037841796875, "global_step": 525051, "epoch": 6325} {"train_loss": -27.491851806640625, "global_step": 525052, "epoch": 6325} {"train_loss": -27.200475692749023, "global_step": 525053, "epoch": 6325} {"train_loss": -27.332834243774414, "global_step": 525054, "epoch": 6325} {"train_loss": -27.64664077758789, "global_step": 525055, "epoch": 6325} {"train_loss": -26.399158477783203, "global_step": 525056, "epoch": 6325} {"train_loss": -27.32151670341032, "global_step": 525057, "epoch": 6325, "val_loss": 6590773.0} {"train_loss": -25.86441421508789, "global_step": 525058, "epoch": 6326} {"train_loss": -26.022878646850586, "global_step": 525059, "epoch": 6326} {"train_loss": -26.01399803161621, "global_step": 525060, "epoch": 6326} {"train_loss": -25.643640518188477, "global_step": 525061, "epoch": 6326} {"train_loss": -26.9637508392334, "global_step": 525062, "epoch": 6326} {"train_loss": -26.404254913330078, "global_step": 525063, "epoch": 6326} {"train_loss": -26.68824577331543, "global_step": 525064, "epoch": 6326} {"train_loss": -26.498010635375977, "global_step": 525065, "epoch": 6326} {"train_loss": -26.6707763671875, "global_step": 525066, "epoch": 6326} {"train_loss": -26.461669921875, "global_step": 525067, "epoch": 6326} {"train_loss": -26.757831573486328, "global_step": 525068, "epoch": 6326} {"train_loss": -26.6214542388916, "global_step": 525069, "epoch": 6326} {"train_loss": -26.830793380737305, "global_step": 525070, "epoch": 6326} {"train_loss": -27.165658950805664, "global_step": 525071, "epoch": 6326} {"train_loss": -26.962072372436523, "global_step": 525072, "epoch": 6326} {"train_loss": -26.586841583251953, "global_step": 525073, "epoch": 6326} {"train_loss": -26.646717071533203, "global_step": 525074, "epoch": 6326} {"train_loss": -26.673490524291992, "global_step": 525075, "epoch": 6326} {"train_loss": -27.02243423461914, "global_step": 525076, "epoch": 6326} {"train_loss": -26.894134521484375, "global_step": 525077, "epoch": 6326} {"train_loss": -27.175647735595703, "global_step": 525078, "epoch": 6326} {"train_loss": -27.126798629760742, "global_step": 525079, "epoch": 6326} {"train_loss": -26.85637855529785, "global_step": 525080, "epoch": 6326} {"train_loss": -27.412155151367188, "global_step": 525081, "epoch": 6326} {"train_loss": -27.201520919799805, "global_step": 525082, "epoch": 6326} {"train_loss": -27.15974998474121, "global_step": 525083, "epoch": 6326} {"train_loss": -27.281375885009766, "global_step": 525084, "epoch": 6326} {"train_loss": -27.43390464782715, "global_step": 525085, "epoch": 6326} {"train_loss": -27.363208770751953, "global_step": 525086, "epoch": 6326} {"train_loss": -27.222620010375977, "global_step": 525087, "epoch": 6326} {"train_loss": -27.31854248046875, "global_step": 525088, "epoch": 6326} {"train_loss": -27.305089950561523, "global_step": 525089, "epoch": 6326} {"train_loss": -27.499929428100586, "global_step": 525090, "epoch": 6326} {"train_loss": -27.64291763305664, "global_step": 525091, "epoch": 6326} {"train_loss": -27.57111930847168, "global_step": 525092, "epoch": 6326} {"train_loss": -27.507572174072266, "global_step": 525093, "epoch": 6326} {"train_loss": -27.44400405883789, "global_step": 525094, "epoch": 6326} {"train_loss": -27.46747398376465, "global_step": 525095, "epoch": 6326} {"train_loss": -27.322250366210938, "global_step": 525096, "epoch": 6326} {"train_loss": -27.9108943939209, "global_step": 525097, "epoch": 6326} {"train_loss": -27.754913330078125, "global_step": 525098, "epoch": 6326} {"train_loss": -27.7681941986084, "global_step": 525099, "epoch": 6326} {"train_loss": -27.646772384643555, "global_step": 525100, "epoch": 6326} {"train_loss": -27.4602108001709, "global_step": 525101, "epoch": 6326} {"train_loss": -27.51593589782715, "global_step": 525102, "epoch": 6326} {"train_loss": -27.571989059448242, "global_step": 525103, "epoch": 6326} {"train_loss": -27.61777114868164, "global_step": 525104, "epoch": 6326} {"train_loss": -27.327741622924805, "global_step": 525105, "epoch": 6326} {"train_loss": -27.16705322265625, "global_step": 525106, "epoch": 6326} {"train_loss": -27.902868270874023, "global_step": 525107, "epoch": 6326} {"train_loss": -27.775243759155273, "global_step": 525108, "epoch": 6326} {"train_loss": -27.36199951171875, "global_step": 525109, "epoch": 6326} {"train_loss": -27.17138671875, "global_step": 525110, "epoch": 6326} {"train_loss": -27.69120216369629, "global_step": 525111, "epoch": 6326} {"train_loss": -27.780698776245117, "global_step": 525112, "epoch": 6326} {"train_loss": -27.65272331237793, "global_step": 525113, "epoch": 6326} {"train_loss": -27.414030075073242, "global_step": 525114, "epoch": 6326} {"train_loss": -27.67643165588379, "global_step": 525115, "epoch": 6326} {"train_loss": -27.400903701782227, "global_step": 525116, "epoch": 6326} {"train_loss": -27.494735717773438, "global_step": 525117, "epoch": 6326} {"train_loss": -27.668272018432617, "global_step": 525118, "epoch": 6326} {"train_loss": -28.04070472717285, "global_step": 525119, "epoch": 6326} {"train_loss": -27.783161163330078, "global_step": 525120, "epoch": 6326} {"train_loss": -27.67108726501465, "global_step": 525121, "epoch": 6326} {"train_loss": -27.5804500579834, "global_step": 525122, "epoch": 6326} {"train_loss": -27.778594970703125, "global_step": 525123, "epoch": 6326} {"train_loss": -27.570199966430664, "global_step": 525124, "epoch": 6326} {"train_loss": -27.342878341674805, "global_step": 525125, "epoch": 6326} {"train_loss": -27.5402774810791, "global_step": 525126, "epoch": 6326} {"train_loss": -27.608224868774414, "global_step": 525127, "epoch": 6326} {"train_loss": -27.73121452331543, "global_step": 525128, "epoch": 6326} {"train_loss": -27.624988555908203, "global_step": 525129, "epoch": 6326} {"train_loss": -27.55771827697754, "global_step": 525130, "epoch": 6326} {"train_loss": -27.712732315063477, "global_step": 525131, "epoch": 6326} {"train_loss": -27.421493530273438, "global_step": 525132, "epoch": 6326} {"train_loss": -27.657276153564453, "global_step": 525133, "epoch": 6326} {"train_loss": -27.8010311126709, "global_step": 525134, "epoch": 6326} {"train_loss": -27.7850399017334, "global_step": 525135, "epoch": 6326} {"train_loss": -28.0047607421875, "global_step": 525136, "epoch": 6326} {"train_loss": -27.515539169311523, "global_step": 525137, "epoch": 6326} {"train_loss": -27.3682804107666, "global_step": 525138, "epoch": 6326} {"train_loss": -27.65143394470215, "global_step": 525139, "epoch": 6326} {"train_loss": -27.29454702354339, "global_step": 525140, "epoch": 6326, "val_loss": 6572203.0} {"train_loss": -27.696027755737305, "global_step": 525141, "epoch": 6327} {"train_loss": -27.29420280456543, "global_step": 525142, "epoch": 6327} {"train_loss": -27.32307243347168, "global_step": 525143, "epoch": 6327} {"train_loss": -27.553678512573242, "global_step": 525144, "epoch": 6327} {"train_loss": -27.2777156829834, "global_step": 525145, "epoch": 6327} {"train_loss": -27.815977096557617, "global_step": 525146, "epoch": 6327} {"train_loss": -27.330673217773438, "global_step": 525147, "epoch": 6327} {"train_loss": -26.973318099975586, "global_step": 525148, "epoch": 6327} {"train_loss": -27.530675888061523, "global_step": 525149, "epoch": 6327} {"train_loss": -27.521347045898438, "global_step": 525150, "epoch": 6327} {"train_loss": -27.27595329284668, "global_step": 525151, "epoch": 6327} {"train_loss": -27.59931755065918, "global_step": 525152, "epoch": 6327} {"train_loss": -27.521503448486328, "global_step": 525153, "epoch": 6327} {"train_loss": -27.15378189086914, "global_step": 525154, "epoch": 6327} {"train_loss": -27.41426658630371, "global_step": 525155, "epoch": 6327} {"train_loss": -27.623804092407227, "global_step": 525156, "epoch": 6327} {"train_loss": -27.30983543395996, "global_step": 525157, "epoch": 6327} {"train_loss": -27.239973068237305, "global_step": 525158, "epoch": 6327} {"train_loss": -26.9842529296875, "global_step": 525159, "epoch": 6327} {"train_loss": -27.017126083374023, "global_step": 525160, "epoch": 6327} {"train_loss": -27.341928482055664, "global_step": 525161, "epoch": 6327} {"train_loss": -27.680688858032227, "global_step": 525162, "epoch": 6327} {"train_loss": -27.296960830688477, "global_step": 525163, "epoch": 6327} {"train_loss": -27.313329696655273, "global_step": 525164, "epoch": 6327} {"train_loss": -27.37054443359375, "global_step": 525165, "epoch": 6327} {"train_loss": -27.33401870727539, "global_step": 525166, "epoch": 6327} {"train_loss": -27.297473907470703, "global_step": 525167, "epoch": 6327} {"train_loss": -27.655349731445312, "global_step": 525168, "epoch": 6327} {"train_loss": -27.688962936401367, "global_step": 525169, "epoch": 6327} {"train_loss": -27.621068954467773, "global_step": 525170, "epoch": 6327} {"train_loss": -27.79145622253418, "global_step": 525171, "epoch": 6327} {"train_loss": -27.880441665649414, "global_step": 525172, "epoch": 6327} {"train_loss": -27.80130958557129, "global_step": 525173, "epoch": 6327} {"train_loss": -27.85492515563965, "global_step": 525174, "epoch": 6327} {"train_loss": -27.638036727905273, "global_step": 525175, "epoch": 6327} {"train_loss": -27.445953369140625, "global_step": 525176, "epoch": 6327} {"train_loss": -27.837543487548828, "global_step": 525177, "epoch": 6327} {"train_loss": -27.544757843017578, "global_step": 525178, "epoch": 6327} {"train_loss": -28.2033748626709, "global_step": 525179, "epoch": 6327} {"train_loss": -27.469282150268555, "global_step": 525180, "epoch": 6327} {"train_loss": -27.776350021362305, "global_step": 525181, "epoch": 6327} {"train_loss": -27.89571189880371, "global_step": 525182, "epoch": 6327} {"train_loss": -27.642475128173828, "global_step": 525183, "epoch": 6327} {"train_loss": -27.81068229675293, "global_step": 525184, "epoch": 6327} {"train_loss": -27.668766021728516, "global_step": 525185, "epoch": 6327} {"train_loss": -27.702880859375, "global_step": 525186, "epoch": 6327} {"train_loss": -27.788694381713867, "global_step": 525187, "epoch": 6327} {"train_loss": -27.417871475219727, "global_step": 525188, "epoch": 6327} {"train_loss": -27.25446891784668, "global_step": 525189, "epoch": 6327} {"train_loss": -27.57221794128418, "global_step": 525190, "epoch": 6327} {"train_loss": -27.301355361938477, "global_step": 525191, "epoch": 6327} {"train_loss": -27.177988052368164, "global_step": 525192, "epoch": 6327} {"train_loss": -26.895843505859375, "global_step": 525193, "epoch": 6327} {"train_loss": -27.503421783447266, "global_step": 525194, "epoch": 6327} {"train_loss": -27.05128288269043, "global_step": 525195, "epoch": 6327} {"train_loss": -27.610797882080078, "global_step": 525196, "epoch": 6327} {"train_loss": -27.695907592773438, "global_step": 525197, "epoch": 6327} {"train_loss": -27.388891220092773, "global_step": 525198, "epoch": 6327} {"train_loss": -27.485502243041992, "global_step": 525199, "epoch": 6327} {"train_loss": -27.314916610717773, "global_step": 525200, "epoch": 6327} {"train_loss": -27.420297622680664, "global_step": 525201, "epoch": 6327} {"train_loss": -27.63783073425293, "global_step": 525202, "epoch": 6327} {"train_loss": -27.436758041381836, "global_step": 525203, "epoch": 6327} {"train_loss": -27.87128257751465, "global_step": 525204, "epoch": 6327} {"train_loss": -27.589496612548828, "global_step": 525205, "epoch": 6327} {"train_loss": -27.614505767822266, "global_step": 525206, "epoch": 6327} {"train_loss": -27.1214542388916, "global_step": 525207, "epoch": 6327} {"train_loss": -27.165149688720703, "global_step": 525208, "epoch": 6327} {"train_loss": -28.10590171813965, "global_step": 525209, "epoch": 6327} {"train_loss": -27.573928833007812, "global_step": 525210, "epoch": 6327} {"train_loss": -27.754114151000977, "global_step": 525211, "epoch": 6327} {"train_loss": -27.7054500579834, "global_step": 525212, "epoch": 6327} {"train_loss": -27.286096572875977, "global_step": 525213, "epoch": 6327} {"train_loss": -27.560205459594727, "global_step": 525214, "epoch": 6327} {"train_loss": -27.578210830688477, "global_step": 525215, "epoch": 6327} {"train_loss": -27.50569725036621, "global_step": 525216, "epoch": 6327} {"train_loss": -27.487503051757812, "global_step": 525217, "epoch": 6327} {"train_loss": -27.451147079467773, "global_step": 525218, "epoch": 6327} {"train_loss": -27.446670532226562, "global_step": 525219, "epoch": 6327} {"train_loss": -28.158716201782227, "global_step": 525220, "epoch": 6327} {"train_loss": -27.43145179748535, "global_step": 525221, "epoch": 6327} {"train_loss": -27.696521759033203, "global_step": 525222, "epoch": 6327} {"train_loss": -27.512659187776496, "global_step": 525223, "epoch": 6327, "val_loss": 6568067.0} {"train_loss": -26.902053833007812, "global_step": 525224, "epoch": 6328} {"train_loss": -26.64971351623535, "global_step": 525225, "epoch": 6328} {"train_loss": -26.711999893188477, "global_step": 525226, "epoch": 6328} {"train_loss": -26.822769165039062, "global_step": 525227, "epoch": 6328} {"train_loss": -27.39594841003418, "global_step": 525228, "epoch": 6328} {"train_loss": -27.861661911010742, "global_step": 525229, "epoch": 6328} {"train_loss": -26.759780883789062, "global_step": 525230, "epoch": 6328} {"train_loss": -27.36543846130371, "global_step": 525231, "epoch": 6328} {"train_loss": -27.16790199279785, "global_step": 525232, "epoch": 6328} {"train_loss": -27.18379020690918, "global_step": 525233, "epoch": 6328} {"train_loss": -26.945556640625, "global_step": 525234, "epoch": 6328} {"train_loss": -27.165164947509766, "global_step": 525235, "epoch": 6328} {"train_loss": -27.235815048217773, "global_step": 525236, "epoch": 6328} {"train_loss": -27.060123443603516, "global_step": 525237, "epoch": 6328} {"train_loss": -27.154327392578125, "global_step": 525238, "epoch": 6328} {"train_loss": -27.276321411132812, "global_step": 525239, "epoch": 6328} {"train_loss": -27.441669464111328, "global_step": 525240, "epoch": 6328} {"train_loss": -27.5892276763916, "global_step": 525241, "epoch": 6328} {"train_loss": -27.4365177154541, "global_step": 525242, "epoch": 6328} {"train_loss": -27.218000411987305, "global_step": 525243, "epoch": 6328} {"train_loss": -27.532379150390625, "global_step": 525244, "epoch": 6328} {"train_loss": -27.674896240234375, "global_step": 525245, "epoch": 6328} {"train_loss": -27.727584838867188, "global_step": 525246, "epoch": 6328} {"train_loss": -27.73480796813965, "global_step": 525247, "epoch": 6328} {"train_loss": -28.008649826049805, "global_step": 525248, "epoch": 6328} {"train_loss": -27.82161521911621, "global_step": 525249, "epoch": 6328} {"train_loss": -27.50193214416504, "global_step": 525250, "epoch": 6328} {"train_loss": -27.745914459228516, "global_step": 525251, "epoch": 6328} {"train_loss": -27.571287155151367, "global_step": 525252, "epoch": 6328} {"train_loss": -27.653268814086914, "global_step": 525253, "epoch": 6328} {"train_loss": -28.166929244995117, "global_step": 525254, "epoch": 6328} {"train_loss": -27.9525146484375, "global_step": 525255, "epoch": 6328} {"train_loss": -27.503355026245117, "global_step": 525256, "epoch": 6328} {"train_loss": -27.73667335510254, "global_step": 525257, "epoch": 6328} {"train_loss": -27.5935001373291, "global_step": 525258, "epoch": 6328} {"train_loss": -27.792724609375, "global_step": 525259, "epoch": 6328} {"train_loss": -27.95411491394043, "global_step": 525260, "epoch": 6328} {"train_loss": -28.035505294799805, "global_step": 525261, "epoch": 6328} {"train_loss": -27.183197021484375, "global_step": 525262, "epoch": 6328} {"train_loss": -27.7244873046875, "global_step": 525263, "epoch": 6328} {"train_loss": -27.503854751586914, "global_step": 525264, "epoch": 6328} {"train_loss": -27.722808837890625, "global_step": 525265, "epoch": 6328} {"train_loss": -27.54535484313965, "global_step": 525266, "epoch": 6328} {"train_loss": -27.674097061157227, "global_step": 525267, "epoch": 6328} {"train_loss": -27.443628311157227, "global_step": 525268, "epoch": 6328} {"train_loss": -27.528549194335938, "global_step": 525269, "epoch": 6328} {"train_loss": -27.3279972076416, "global_step": 525270, "epoch": 6328} {"train_loss": -27.35694694519043, "global_step": 525271, "epoch": 6328} {"train_loss": -27.492725372314453, "global_step": 525272, "epoch": 6328} {"train_loss": -27.632049560546875, "global_step": 525273, "epoch": 6328} {"train_loss": -27.352848052978516, "global_step": 525274, "epoch": 6328} {"train_loss": -27.727659225463867, "global_step": 525275, "epoch": 6328} {"train_loss": -27.26993179321289, "global_step": 525276, "epoch": 6328} {"train_loss": -27.27020263671875, "global_step": 525277, "epoch": 6328} {"train_loss": -27.438257217407227, "global_step": 525278, "epoch": 6328} {"train_loss": -27.620086669921875, "global_step": 525279, "epoch": 6328} {"train_loss": -27.729150772094727, "global_step": 525280, "epoch": 6328} {"train_loss": -27.60577392578125, "global_step": 525281, "epoch": 6328} {"train_loss": -27.576114654541016, "global_step": 525282, "epoch": 6328} {"train_loss": -27.387958526611328, "global_step": 525283, "epoch": 6328} {"train_loss": -27.830556869506836, "global_step": 525284, "epoch": 6328} {"train_loss": -27.475690841674805, "global_step": 525285, "epoch": 6328} {"train_loss": -27.611326217651367, "global_step": 525286, "epoch": 6328} {"train_loss": -27.34994888305664, "global_step": 525287, "epoch": 6328} {"train_loss": -27.720067977905273, "global_step": 525288, "epoch": 6328} {"train_loss": -27.487348556518555, "global_step": 525289, "epoch": 6328} {"train_loss": -27.49118995666504, "global_step": 525290, "epoch": 6328} {"train_loss": -28.133291244506836, "global_step": 525291, "epoch": 6328} {"train_loss": -27.539941787719727, "global_step": 525292, "epoch": 6328} {"train_loss": -27.511396408081055, "global_step": 525293, "epoch": 6328} {"train_loss": -27.782590866088867, "global_step": 525294, "epoch": 6328} {"train_loss": -27.344038009643555, "global_step": 525295, "epoch": 6328} {"train_loss": -27.7018985748291, "global_step": 525296, "epoch": 6328} {"train_loss": -27.50333023071289, "global_step": 525297, "epoch": 6328} {"train_loss": -27.862714767456055, "global_step": 525298, "epoch": 6328} {"train_loss": -27.639562606811523, "global_step": 525299, "epoch": 6328} {"train_loss": -27.25452995300293, "global_step": 525300, "epoch": 6328} {"train_loss": -27.8038330078125, "global_step": 525301, "epoch": 6328} {"train_loss": -27.699750900268555, "global_step": 525302, "epoch": 6328} {"train_loss": -27.450424194335938, "global_step": 525303, "epoch": 6328} {"train_loss": -27.894546508789062, "global_step": 525304, "epoch": 6328} {"train_loss": -27.403608322143555, "global_step": 525305, "epoch": 6328} {"train_loss": -27.52200910269496, "global_step": 525306, "epoch": 6328, "val_loss": 6577894.5} {"train_loss": -27.071420669555664, "global_step": 525307, "epoch": 6329} {"train_loss": -26.74135398864746, "global_step": 525308, "epoch": 6329} {"train_loss": -27.486759185791016, "global_step": 525309, "epoch": 6329} {"train_loss": -27.246931076049805, "global_step": 525310, "epoch": 6329} {"train_loss": -26.83660316467285, "global_step": 525311, "epoch": 6329} {"train_loss": -26.791364669799805, "global_step": 525312, "epoch": 6329} {"train_loss": -27.212575912475586, "global_step": 525313, "epoch": 6329} {"train_loss": -27.030309677124023, "global_step": 525314, "epoch": 6329} {"train_loss": -26.940750122070312, "global_step": 525315, "epoch": 6329} {"train_loss": -27.27614402770996, "global_step": 525316, "epoch": 6329} {"train_loss": -26.923688888549805, "global_step": 525317, "epoch": 6329} {"train_loss": -27.246068954467773, "global_step": 525318, "epoch": 6329} {"train_loss": -27.108488082885742, "global_step": 525319, "epoch": 6329} {"train_loss": -26.754627227783203, "global_step": 525320, "epoch": 6329} {"train_loss": -27.095067977905273, "global_step": 525321, "epoch": 6329} {"train_loss": -26.958560943603516, "global_step": 525322, "epoch": 6329} {"train_loss": -26.906320571899414, "global_step": 525323, "epoch": 6329} {"train_loss": -27.11775016784668, "global_step": 525324, "epoch": 6329} {"train_loss": -27.26690101623535, "global_step": 525325, "epoch": 6329} {"train_loss": -27.49549674987793, "global_step": 525326, "epoch": 6329} {"train_loss": -27.11431884765625, "global_step": 525327, "epoch": 6329} {"train_loss": -27.398141860961914, "global_step": 525328, "epoch": 6329} {"train_loss": -27.50899314880371, "global_step": 525329, "epoch": 6329} {"train_loss": -27.2622127532959, "global_step": 525330, "epoch": 6329} {"train_loss": -27.515844345092773, "global_step": 525331, "epoch": 6329} {"train_loss": -27.664953231811523, "global_step": 525332, "epoch": 6329} {"train_loss": -27.315261840820312, "global_step": 525333, "epoch": 6329} {"train_loss": -27.677642822265625, "global_step": 525334, "epoch": 6329} {"train_loss": -27.33051109313965, "global_step": 525335, "epoch": 6329} {"train_loss": -27.593175888061523, "global_step": 525336, "epoch": 6329} {"train_loss": -27.337631225585938, "global_step": 525337, "epoch": 6329} {"train_loss": -27.433496475219727, "global_step": 525338, "epoch": 6329} {"train_loss": -27.159326553344727, "global_step": 525339, "epoch": 6329} {"train_loss": -27.6519718170166, "global_step": 525340, "epoch": 6329} {"train_loss": -27.57288932800293, "global_step": 525341, "epoch": 6329} {"train_loss": -27.694311141967773, "global_step": 525342, "epoch": 6329} {"train_loss": -27.3388671875, "global_step": 525343, "epoch": 6329} {"train_loss": -27.315692901611328, "global_step": 525344, "epoch": 6329} {"train_loss": -27.455785751342773, "global_step": 525345, "epoch": 6329} {"train_loss": -27.367822647094727, "global_step": 525346, "epoch": 6329} {"train_loss": -27.364439010620117, "global_step": 525347, "epoch": 6329} {"train_loss": -27.733854293823242, "global_step": 525348, "epoch": 6329} {"train_loss": -27.438451766967773, "global_step": 525349, "epoch": 6329} {"train_loss": -27.240985870361328, "global_step": 525350, "epoch": 6329} {"train_loss": -27.65679359436035, "global_step": 525351, "epoch": 6329} {"train_loss": -27.888809204101562, "global_step": 525352, "epoch": 6329} {"train_loss": -27.663232803344727, "global_step": 525353, "epoch": 6329} {"train_loss": -27.97015380859375, "global_step": 525354, "epoch": 6329} {"train_loss": -27.736921310424805, "global_step": 525355, "epoch": 6329} {"train_loss": -27.711469650268555, "global_step": 525356, "epoch": 6329} {"train_loss": -27.786834716796875, "global_step": 525357, "epoch": 6329} {"train_loss": -27.8394832611084, "global_step": 525358, "epoch": 6329} {"train_loss": -27.642902374267578, "global_step": 525359, "epoch": 6329} {"train_loss": -27.560443878173828, "global_step": 525360, "epoch": 6329} {"train_loss": -27.434452056884766, "global_step": 525361, "epoch": 6329} {"train_loss": -28.01630973815918, "global_step": 525362, "epoch": 6329} {"train_loss": -28.001428604125977, "global_step": 525363, "epoch": 6329} {"train_loss": -27.660858154296875, "global_step": 525364, "epoch": 6329} {"train_loss": -27.83851432800293, "global_step": 525365, "epoch": 6329} {"train_loss": -27.890308380126953, "global_step": 525366, "epoch": 6329} {"train_loss": -27.777240753173828, "global_step": 525367, "epoch": 6329} {"train_loss": -27.855758666992188, "global_step": 525368, "epoch": 6329} {"train_loss": -27.82631492614746, "global_step": 525369, "epoch": 6329} {"train_loss": -27.3270206451416, "global_step": 525370, "epoch": 6329} {"train_loss": -27.608179092407227, "global_step": 525371, "epoch": 6329} {"train_loss": -27.719406127929688, "global_step": 525372, "epoch": 6329} {"train_loss": -27.9615478515625, "global_step": 525373, "epoch": 6329} {"train_loss": -27.747800827026367, "global_step": 525374, "epoch": 6329} {"train_loss": -27.426176071166992, "global_step": 525375, "epoch": 6329} {"train_loss": -27.935394287109375, "global_step": 525376, "epoch": 6329} {"train_loss": -27.468236923217773, "global_step": 525377, "epoch": 6329} {"train_loss": -27.513883590698242, "global_step": 525378, "epoch": 6329} {"train_loss": -27.505720138549805, "global_step": 525379, "epoch": 6329} {"train_loss": -26.9044246673584, "global_step": 525380, "epoch": 6329} {"train_loss": -26.212116241455078, "global_step": 525381, "epoch": 6329} {"train_loss": -24.57499122619629, "global_step": 525382, "epoch": 6329} {"train_loss": -25.743066787719727, "global_step": 525383, "epoch": 6329} {"train_loss": -26.653278350830078, "global_step": 525384, "epoch": 6329} {"train_loss": -26.604373931884766, "global_step": 525385, "epoch": 6329} {"train_loss": -27.217060089111328, "global_step": 525386, "epoch": 6329} {"train_loss": -26.836963653564453, "global_step": 525387, "epoch": 6329} {"train_loss": -27.089155197143555, "global_step": 525388, "epoch": 6329} {"train_loss": -27.34066087653838, "global_step": 525389, "epoch": 6329, "val_loss": 6596612.0} {"train_loss": -26.46754264831543, "global_step": 525390, "epoch": 6330} {"train_loss": -25.893091201782227, "global_step": 525391, "epoch": 6330} {"train_loss": -26.633136749267578, "global_step": 525392, "epoch": 6330} {"train_loss": -26.7802791595459, "global_step": 525393, "epoch": 6330} {"train_loss": -26.187829971313477, "global_step": 525394, "epoch": 6330} {"train_loss": -26.61992835998535, "global_step": 525395, "epoch": 6330} {"train_loss": -26.708667755126953, "global_step": 525396, "epoch": 6330} {"train_loss": -26.4368953704834, "global_step": 525397, "epoch": 6330} {"train_loss": -26.570148468017578, "global_step": 525398, "epoch": 6330} {"train_loss": -26.9663143157959, "global_step": 525399, "epoch": 6330} {"train_loss": -26.633731842041016, "global_step": 525400, "epoch": 6330} {"train_loss": -27.064716339111328, "global_step": 525401, "epoch": 6330} {"train_loss": -26.559057235717773, "global_step": 525402, "epoch": 6330} {"train_loss": -27.06136131286621, "global_step": 525403, "epoch": 6330} {"train_loss": -26.316635131835938, "global_step": 525404, "epoch": 6330} {"train_loss": -26.988550186157227, "global_step": 525405, "epoch": 6330} {"train_loss": -26.659393310546875, "global_step": 525406, "epoch": 6330} {"train_loss": -26.923553466796875, "global_step": 525407, "epoch": 6330} {"train_loss": -26.912036895751953, "global_step": 525408, "epoch": 6330} {"train_loss": -27.213647842407227, "global_step": 525409, "epoch": 6330} {"train_loss": -27.268600463867188, "global_step": 525410, "epoch": 6330} {"train_loss": -27.15549087524414, "global_step": 525411, "epoch": 6330} {"train_loss": -27.36785316467285, "global_step": 525412, "epoch": 6330} {"train_loss": -27.1691837310791, "global_step": 525413, "epoch": 6330} {"train_loss": -27.19137954711914, "global_step": 525414, "epoch": 6330} {"train_loss": -27.06410026550293, "global_step": 525415, "epoch": 6330} {"train_loss": -27.261072158813477, "global_step": 525416, "epoch": 6330} {"train_loss": -27.261463165283203, "global_step": 525417, "epoch": 6330} {"train_loss": -27.52071189880371, "global_step": 525418, "epoch": 6330} {"train_loss": -27.4920711517334, "global_step": 525419, "epoch": 6330} {"train_loss": -27.851165771484375, "global_step": 525420, "epoch": 6330} {"train_loss": -27.447965621948242, "global_step": 525421, "epoch": 6330} {"train_loss": -27.496923446655273, "global_step": 525422, "epoch": 6330} {"train_loss": -27.35757827758789, "global_step": 525423, "epoch": 6330} {"train_loss": -27.659391403198242, "global_step": 525424, "epoch": 6330} {"train_loss": -27.752685546875, "global_step": 525425, "epoch": 6330} {"train_loss": -27.309539794921875, "global_step": 525426, "epoch": 6330} {"train_loss": -27.859619140625, "global_step": 525427, "epoch": 6330} {"train_loss": -27.735015869140625, "global_step": 525428, "epoch": 6330} {"train_loss": -27.512258529663086, "global_step": 525429, "epoch": 6330} {"train_loss": -27.61482048034668, "global_step": 525430, "epoch": 6330} {"train_loss": -27.814722061157227, "global_step": 525431, "epoch": 6330} {"train_loss": -27.646387100219727, "global_step": 525432, "epoch": 6330} {"train_loss": -27.5354061126709, "global_step": 525433, "epoch": 6330} {"train_loss": -27.595449447631836, "global_step": 525434, "epoch": 6330} {"train_loss": -27.84636878967285, "global_step": 525435, "epoch": 6330} {"train_loss": -27.502670288085938, "global_step": 525436, "epoch": 6330} {"train_loss": -27.86764907836914, "global_step": 525437, "epoch": 6330} {"train_loss": -27.603246688842773, "global_step": 525438, "epoch": 6330} {"train_loss": -28.259296417236328, "global_step": 525439, "epoch": 6330} {"train_loss": -27.73578453063965, "global_step": 525440, "epoch": 6330} {"train_loss": -27.661396026611328, "global_step": 525441, "epoch": 6330} {"train_loss": -27.543231964111328, "global_step": 525442, "epoch": 6330} {"train_loss": -27.600601196289062, "global_step": 525443, "epoch": 6330} {"train_loss": -27.5257568359375, "global_step": 525444, "epoch": 6330} {"train_loss": -27.498151779174805, "global_step": 525445, "epoch": 6330} {"train_loss": -27.904834747314453, "global_step": 525446, "epoch": 6330} {"train_loss": -27.9882755279541, "global_step": 525447, "epoch": 6330} {"train_loss": -27.835058212280273, "global_step": 525448, "epoch": 6330} {"train_loss": -27.749067306518555, "global_step": 525449, "epoch": 6330} {"train_loss": -27.96845054626465, "global_step": 525450, "epoch": 6330} {"train_loss": -27.803247451782227, "global_step": 525451, "epoch": 6330} {"train_loss": -27.724328994750977, "global_step": 525452, "epoch": 6330} {"train_loss": -28.158716201782227, "global_step": 525453, "epoch": 6330} {"train_loss": -27.614953994750977, "global_step": 525454, "epoch": 6330} {"train_loss": -27.634870529174805, "global_step": 525455, "epoch": 6330} {"train_loss": -27.785924911499023, "global_step": 525456, "epoch": 6330} {"train_loss": -27.847436904907227, "global_step": 525457, "epoch": 6330} {"train_loss": -27.494787216186523, "global_step": 525458, "epoch": 6330} {"train_loss": -27.843963623046875, "global_step": 525459, "epoch": 6330} {"train_loss": -27.867849349975586, "global_step": 525460, "epoch": 6330} {"train_loss": -27.65667152404785, "global_step": 525461, "epoch": 6330} {"train_loss": -27.94121742248535, "global_step": 525462, "epoch": 6330} {"train_loss": -27.524450302124023, "global_step": 525463, "epoch": 6330} {"train_loss": -27.471454620361328, "global_step": 525464, "epoch": 6330} {"train_loss": -27.821393966674805, "global_step": 525465, "epoch": 6330} {"train_loss": -27.831104278564453, "global_step": 525466, "epoch": 6330} {"train_loss": -27.331268310546875, "global_step": 525467, "epoch": 6330} {"train_loss": -26.97079849243164, "global_step": 525468, "epoch": 6330} {"train_loss": -26.340810775756836, "global_step": 525469, "epoch": 6330} {"train_loss": -25.99637794494629, "global_step": 525470, "epoch": 6330} {"train_loss": -26.5109806060791, "global_step": 525471, "epoch": 6330} {"train_loss": -27.338502056627387, "global_step": 525472, "epoch": 6330, "val_loss": 6568879.0} {"train_loss": -26.8716983795166, "global_step": 525473, "epoch": 6331} {"train_loss": -26.964990615844727, "global_step": 525474, "epoch": 6331} {"train_loss": -27.040433883666992, "global_step": 525475, "epoch": 6331} {"train_loss": -26.84381103515625, "global_step": 525476, "epoch": 6331} {"train_loss": -26.802001953125, "global_step": 525477, "epoch": 6331} {"train_loss": -27.19898796081543, "global_step": 525478, "epoch": 6331} {"train_loss": -26.860883712768555, "global_step": 525479, "epoch": 6331} {"train_loss": -27.436002731323242, "global_step": 525480, "epoch": 6331} {"train_loss": -27.15872573852539, "global_step": 525481, "epoch": 6331} {"train_loss": -26.91205406188965, "global_step": 525482, "epoch": 6331} {"train_loss": -27.1099853515625, "global_step": 525483, "epoch": 6331} {"train_loss": -27.102869033813477, "global_step": 525484, "epoch": 6331} {"train_loss": -27.01156997680664, "global_step": 525485, "epoch": 6331} {"train_loss": -27.196741104125977, "global_step": 525486, "epoch": 6331} {"train_loss": -26.829809188842773, "global_step": 525487, "epoch": 6331} {"train_loss": -27.311609268188477, "global_step": 525488, "epoch": 6331} {"train_loss": -26.999469757080078, "global_step": 525489, "epoch": 6331} {"train_loss": -26.94659996032715, "global_step": 525490, "epoch": 6331} {"train_loss": -26.924840927124023, "global_step": 525491, "epoch": 6331} {"train_loss": -27.036529541015625, "global_step": 525492, "epoch": 6331} {"train_loss": -27.2193660736084, "global_step": 525493, "epoch": 6331} {"train_loss": -27.296045303344727, "global_step": 525494, "epoch": 6331} {"train_loss": -27.193918228149414, "global_step": 525495, "epoch": 6331} {"train_loss": -27.334762573242188, "global_step": 525496, "epoch": 6331} {"train_loss": -27.251956939697266, "global_step": 525497, "epoch": 6331} {"train_loss": -26.864704132080078, "global_step": 525498, "epoch": 6331} {"train_loss": -27.48512840270996, "global_step": 525499, "epoch": 6331} {"train_loss": -27.2022705078125, "global_step": 525500, "epoch": 6331} {"train_loss": -27.39544677734375, "global_step": 525501, "epoch": 6331} {"train_loss": -27.344858169555664, "global_step": 525502, "epoch": 6331} {"train_loss": -27.498676300048828, "global_step": 525503, "epoch": 6331} {"train_loss": -27.5283203125, "global_step": 525504, "epoch": 6331} {"train_loss": -27.336877822875977, "global_step": 525505, "epoch": 6331} {"train_loss": -27.513259887695312, "global_step": 525506, "epoch": 6331} {"train_loss": -27.55348014831543, "global_step": 525507, "epoch": 6331} {"train_loss": -27.220794677734375, "global_step": 525508, "epoch": 6331} {"train_loss": -27.4748477935791, "global_step": 525509, "epoch": 6331} {"train_loss": -27.54047203063965, "global_step": 525510, "epoch": 6331} {"train_loss": -27.954364776611328, "global_step": 525511, "epoch": 6331} {"train_loss": -27.58527183532715, "global_step": 525512, "epoch": 6331} {"train_loss": -27.593505859375, "global_step": 525513, "epoch": 6331} {"train_loss": -27.577600479125977, "global_step": 525514, "epoch": 6331} {"train_loss": -27.746723175048828, "global_step": 525515, "epoch": 6331} {"train_loss": -27.839385986328125, "global_step": 525516, "epoch": 6331} {"train_loss": -28.017562866210938, "global_step": 525517, "epoch": 6331} {"train_loss": -27.30976676940918, "global_step": 525518, "epoch": 6331} {"train_loss": -27.402963638305664, "global_step": 525519, "epoch": 6331} {"train_loss": -27.841840744018555, "global_step": 525520, "epoch": 6331} {"train_loss": -27.820173263549805, "global_step": 525521, "epoch": 6331} {"train_loss": -27.888824462890625, "global_step": 525522, "epoch": 6331} {"train_loss": -27.821115493774414, "global_step": 525523, "epoch": 6331} {"train_loss": -27.759939193725586, "global_step": 525524, "epoch": 6331} {"train_loss": -27.637434005737305, "global_step": 525525, "epoch": 6331} {"train_loss": -27.723188400268555, "global_step": 525526, "epoch": 6331} {"train_loss": -28.00048828125, "global_step": 525527, "epoch": 6331} {"train_loss": -27.612751007080078, "global_step": 525528, "epoch": 6331} {"train_loss": -27.826879501342773, "global_step": 525529, "epoch": 6331} {"train_loss": -27.83704948425293, "global_step": 525530, "epoch": 6331} {"train_loss": -27.8438777923584, "global_step": 525531, "epoch": 6331} {"train_loss": -27.8660831451416, "global_step": 525532, "epoch": 6331} {"train_loss": -27.625568389892578, "global_step": 525533, "epoch": 6331} {"train_loss": -28.2130069732666, "global_step": 525534, "epoch": 6331} {"train_loss": -27.733320236206055, "global_step": 525535, "epoch": 6331} {"train_loss": -27.72442626953125, "global_step": 525536, "epoch": 6331} {"train_loss": -27.532470703125, "global_step": 525537, "epoch": 6331} {"train_loss": -27.74323844909668, "global_step": 525538, "epoch": 6331} {"train_loss": -27.759479522705078, "global_step": 525539, "epoch": 6331} {"train_loss": -27.70013999938965, "global_step": 525540, "epoch": 6331} {"train_loss": -27.16554069519043, "global_step": 525541, "epoch": 6331} {"train_loss": -27.37906265258789, "global_step": 525542, "epoch": 6331} {"train_loss": -27.427536010742188, "global_step": 525543, "epoch": 6331} {"train_loss": -27.58538818359375, "global_step": 525544, "epoch": 6331} {"train_loss": -27.336795806884766, "global_step": 525545, "epoch": 6331} {"train_loss": -27.703588485717773, "global_step": 525546, "epoch": 6331} {"train_loss": -27.42392349243164, "global_step": 525547, "epoch": 6331} {"train_loss": -27.609777450561523, "global_step": 525548, "epoch": 6331} {"train_loss": -27.5821475982666, "global_step": 525549, "epoch": 6331} {"train_loss": -27.70785903930664, "global_step": 525550, "epoch": 6331} {"train_loss": -27.170896530151367, "global_step": 525551, "epoch": 6331} {"train_loss": -27.090967178344727, "global_step": 525552, "epoch": 6331} {"train_loss": -26.41071128845215, "global_step": 525553, "epoch": 6331} {"train_loss": -26.48565673828125, "global_step": 525554, "epoch": 6331} {"train_loss": -27.407854470861963, "global_step": 525555, "epoch": 6331, "val_loss": 6514658.0} {"train_loss": -25.624082565307617, "global_step": 525556, "epoch": 6332} {"train_loss": -25.918750762939453, "global_step": 525557, "epoch": 6332} {"train_loss": -26.435195922851562, "global_step": 525558, "epoch": 6332} {"train_loss": -26.111082077026367, "global_step": 525559, "epoch": 6332} {"train_loss": -26.58750343322754, "global_step": 525560, "epoch": 6332} {"train_loss": -26.39593505859375, "global_step": 525561, "epoch": 6332} {"train_loss": -26.560516357421875, "global_step": 525562, "epoch": 6332} {"train_loss": -26.406696319580078, "global_step": 525563, "epoch": 6332} {"train_loss": -26.368122100830078, "global_step": 525564, "epoch": 6332} {"train_loss": -26.645029067993164, "global_step": 525565, "epoch": 6332} {"train_loss": -26.702146530151367, "global_step": 525566, "epoch": 6332} {"train_loss": -26.491376876831055, "global_step": 525567, "epoch": 6332} {"train_loss": -26.79254150390625, "global_step": 525568, "epoch": 6332} {"train_loss": -26.812612533569336, "global_step": 525569, "epoch": 6332} {"train_loss": -26.53517723083496, "global_step": 525570, "epoch": 6332} {"train_loss": -26.5019474029541, "global_step": 525571, "epoch": 6332} {"train_loss": -26.762537002563477, "global_step": 525572, "epoch": 6332} {"train_loss": -26.703638076782227, "global_step": 525573, "epoch": 6332} {"train_loss": -26.741718292236328, "global_step": 525574, "epoch": 6332} {"train_loss": -27.082061767578125, "global_step": 525575, "epoch": 6332} {"train_loss": -26.6761474609375, "global_step": 525576, "epoch": 6332} {"train_loss": -27.281158447265625, "global_step": 525577, "epoch": 6332} {"train_loss": -26.84388542175293, "global_step": 525578, "epoch": 6332} {"train_loss": -26.760623931884766, "global_step": 525579, "epoch": 6332} {"train_loss": -27.42462158203125, "global_step": 525580, "epoch": 6332} {"train_loss": -27.0184326171875, "global_step": 525581, "epoch": 6332} {"train_loss": -27.145553588867188, "global_step": 525582, "epoch": 6332} {"train_loss": -27.215295791625977, "global_step": 525583, "epoch": 6332} {"train_loss": -27.317136764526367, "global_step": 525584, "epoch": 6332} {"train_loss": -27.553680419921875, "global_step": 525585, "epoch": 6332} {"train_loss": -27.544591903686523, "global_step": 525586, "epoch": 6332} {"train_loss": -27.633453369140625, "global_step": 525587, "epoch": 6332} {"train_loss": -27.682239532470703, "global_step": 525588, "epoch": 6332} {"train_loss": -27.32069206237793, "global_step": 525589, "epoch": 6332} {"train_loss": -27.358112335205078, "global_step": 525590, "epoch": 6332} {"train_loss": -27.711034774780273, "global_step": 525591, "epoch": 6332} {"train_loss": -27.176502227783203, "global_step": 525592, "epoch": 6332} {"train_loss": -27.5, "global_step": 525593, "epoch": 6332} {"train_loss": -27.62959098815918, "global_step": 525594, "epoch": 6332} {"train_loss": -27.645526885986328, "global_step": 525595, "epoch": 6332} {"train_loss": -27.5886287689209, "global_step": 525596, "epoch": 6332} {"train_loss": -27.389257431030273, "global_step": 525597, "epoch": 6332} {"train_loss": -27.516803741455078, "global_step": 525598, "epoch": 6332} {"train_loss": -27.570693969726562, "global_step": 525599, "epoch": 6332} {"train_loss": -27.940967559814453, "global_step": 525600, "epoch": 6332} {"train_loss": -27.525440216064453, "global_step": 525601, "epoch": 6332} {"train_loss": -27.68130874633789, "global_step": 525602, "epoch": 6332} {"train_loss": -27.892324447631836, "global_step": 525603, "epoch": 6332} {"train_loss": -27.63471794128418, "global_step": 525604, "epoch": 6332} {"train_loss": -27.949081420898438, "global_step": 525605, "epoch": 6332} {"train_loss": -27.613393783569336, "global_step": 525606, "epoch": 6332} {"train_loss": -27.602386474609375, "global_step": 525607, "epoch": 6332} {"train_loss": -27.930740356445312, "global_step": 525608, "epoch": 6332} {"train_loss": -27.65549659729004, "global_step": 525609, "epoch": 6332} {"train_loss": -28.116607666015625, "global_step": 525610, "epoch": 6332} {"train_loss": -27.718835830688477, "global_step": 525611, "epoch": 6332} {"train_loss": -28.404251098632812, "global_step": 525612, "epoch": 6332} {"train_loss": -27.868133544921875, "global_step": 525613, "epoch": 6332} {"train_loss": -28.004291534423828, "global_step": 525614, "epoch": 6332} {"train_loss": -27.794025421142578, "global_step": 525615, "epoch": 6332} {"train_loss": -27.953344345092773, "global_step": 525616, "epoch": 6332} {"train_loss": -27.495325088500977, "global_step": 525617, "epoch": 6332} {"train_loss": -27.305286407470703, "global_step": 525618, "epoch": 6332} {"train_loss": -27.781522750854492, "global_step": 525619, "epoch": 6332} {"train_loss": -27.93855094909668, "global_step": 525620, "epoch": 6332} {"train_loss": -27.268512725830078, "global_step": 525621, "epoch": 6332} {"train_loss": -27.563766479492188, "global_step": 525622, "epoch": 6332} {"train_loss": -27.42877197265625, "global_step": 525623, "epoch": 6332} {"train_loss": -27.697919845581055, "global_step": 525624, "epoch": 6332} {"train_loss": -27.90793800354004, "global_step": 525625, "epoch": 6332} {"train_loss": -27.4583740234375, "global_step": 525626, "epoch": 6332} {"train_loss": -27.646499633789062, "global_step": 525627, "epoch": 6332} {"train_loss": -27.407201766967773, "global_step": 525628, "epoch": 6332} {"train_loss": -27.6246337890625, "global_step": 525629, "epoch": 6332} {"train_loss": -27.324207305908203, "global_step": 525630, "epoch": 6332} {"train_loss": -27.20688819885254, "global_step": 525631, "epoch": 6332} {"train_loss": -27.65532875061035, "global_step": 525632, "epoch": 6332} {"train_loss": -27.460172653198242, "global_step": 525633, "epoch": 6332} {"train_loss": -27.314863204956055, "global_step": 525634, "epoch": 6332} {"train_loss": -26.558334350585938, "global_step": 525635, "epoch": 6332} {"train_loss": -26.407888412475586, "global_step": 525636, "epoch": 6332} {"train_loss": -26.762113571166992, "global_step": 525637, "epoch": 6332} {"train_loss": -27.285323728998023, "global_step": 525638, "epoch": 6332, "val_loss": 6560681.0} {"train_loss": -26.253721237182617, "global_step": 525639, "epoch": 6333} {"train_loss": -24.738357543945312, "global_step": 525640, "epoch": 6333} {"train_loss": -26.0979061126709, "global_step": 525641, "epoch": 6333} {"train_loss": -25.981189727783203, "global_step": 525642, "epoch": 6333} {"train_loss": -26.20011329650879, "global_step": 525643, "epoch": 6333} {"train_loss": -26.456745147705078, "global_step": 525644, "epoch": 6333} {"train_loss": -26.505029678344727, "global_step": 525645, "epoch": 6333} {"train_loss": -25.923847198486328, "global_step": 525646, "epoch": 6333} {"train_loss": -26.800552368164062, "global_step": 525647, "epoch": 6333} {"train_loss": -26.172306060791016, "global_step": 525648, "epoch": 6333} {"train_loss": -26.424341201782227, "global_step": 525649, "epoch": 6333} {"train_loss": -26.593168258666992, "global_step": 525650, "epoch": 6333} {"train_loss": -26.806732177734375, "global_step": 525651, "epoch": 6333} {"train_loss": -26.35188102722168, "global_step": 525652, "epoch": 6333} {"train_loss": -26.815481185913086, "global_step": 525653, "epoch": 6333} {"train_loss": -26.858530044555664, "global_step": 525654, "epoch": 6333} {"train_loss": -27.395099639892578, "global_step": 525655, "epoch": 6333} {"train_loss": -26.837528228759766, "global_step": 525656, "epoch": 6333} {"train_loss": -26.9619140625, "global_step": 525657, "epoch": 6333} {"train_loss": -26.805505752563477, "global_step": 525658, "epoch": 6333} {"train_loss": -26.65472984313965, "global_step": 525659, "epoch": 6333} {"train_loss": -27.21402359008789, "global_step": 525660, "epoch": 6333} {"train_loss": -27.24163246154785, "global_step": 525661, "epoch": 6333} {"train_loss": -27.009607315063477, "global_step": 525662, "epoch": 6333} {"train_loss": -27.1989803314209, "global_step": 525663, "epoch": 6333} {"train_loss": -27.103357315063477, "global_step": 525664, "epoch": 6333} {"train_loss": -27.357641220092773, "global_step": 525665, "epoch": 6333} {"train_loss": -26.962549209594727, "global_step": 525666, "epoch": 6333} {"train_loss": -27.42561149597168, "global_step": 525667, "epoch": 6333} {"train_loss": -27.188257217407227, "global_step": 525668, "epoch": 6333} {"train_loss": -27.054838180541992, "global_step": 525669, "epoch": 6333} {"train_loss": -26.76300048828125, "global_step": 525670, "epoch": 6333} {"train_loss": -27.432172775268555, "global_step": 525671, "epoch": 6333} {"train_loss": -26.976598739624023, "global_step": 525672, "epoch": 6333} {"train_loss": -27.66318130493164, "global_step": 525673, "epoch": 6333} {"train_loss": -27.041961669921875, "global_step": 525674, "epoch": 6333} {"train_loss": -26.796079635620117, "global_step": 525675, "epoch": 6333} {"train_loss": -27.4669189453125, "global_step": 525676, "epoch": 6333} {"train_loss": -27.25364112854004, "global_step": 525677, "epoch": 6333} {"train_loss": -27.324722290039062, "global_step": 525678, "epoch": 6333} {"train_loss": -27.094663619995117, "global_step": 525679, "epoch": 6333} {"train_loss": -27.386255264282227, "global_step": 525680, "epoch": 6333} {"train_loss": -27.19135856628418, "global_step": 525681, "epoch": 6333} {"train_loss": -27.07318687438965, "global_step": 525682, "epoch": 6333} {"train_loss": -27.307279586791992, "global_step": 525683, "epoch": 6333} {"train_loss": -27.311023712158203, "global_step": 525684, "epoch": 6333} {"train_loss": -27.440509796142578, "global_step": 525685, "epoch": 6333} {"train_loss": -27.44428062438965, "global_step": 525686, "epoch": 6333} {"train_loss": -27.681838989257812, "global_step": 525687, "epoch": 6333} {"train_loss": -27.36551856994629, "global_step": 525688, "epoch": 6333} {"train_loss": -27.060943603515625, "global_step": 525689, "epoch": 6333} {"train_loss": -27.508344650268555, "global_step": 525690, "epoch": 6333} {"train_loss": -27.409101486206055, "global_step": 525691, "epoch": 6333} {"train_loss": -27.188663482666016, "global_step": 525692, "epoch": 6333} {"train_loss": -27.350849151611328, "global_step": 525693, "epoch": 6333} {"train_loss": -27.648035049438477, "global_step": 525694, "epoch": 6333} {"train_loss": -27.5253849029541, "global_step": 525695, "epoch": 6333} {"train_loss": -27.1463565826416, "global_step": 525696, "epoch": 6333} {"train_loss": -27.362890243530273, "global_step": 525697, "epoch": 6333} {"train_loss": -27.586034774780273, "global_step": 525698, "epoch": 6333} {"train_loss": -27.17426109313965, "global_step": 525699, "epoch": 6333} {"train_loss": -27.494770050048828, "global_step": 525700, "epoch": 6333} {"train_loss": -27.633441925048828, "global_step": 525701, "epoch": 6333} {"train_loss": -27.45452308654785, "global_step": 525702, "epoch": 6333} {"train_loss": -27.623682022094727, "global_step": 525703, "epoch": 6333} {"train_loss": -27.758167266845703, "global_step": 525704, "epoch": 6333} {"train_loss": -27.563695907592773, "global_step": 525705, "epoch": 6333} {"train_loss": -27.791934967041016, "global_step": 525706, "epoch": 6333} {"train_loss": -27.683881759643555, "global_step": 525707, "epoch": 6333} {"train_loss": -27.562458038330078, "global_step": 525708, "epoch": 6333} {"train_loss": -27.676803588867188, "global_step": 525709, "epoch": 6333} {"train_loss": -27.543882369995117, "global_step": 525710, "epoch": 6333} {"train_loss": -27.231924057006836, "global_step": 525711, "epoch": 6333} {"train_loss": -27.491897583007812, "global_step": 525712, "epoch": 6333} {"train_loss": -27.763294219970703, "global_step": 525713, "epoch": 6333} {"train_loss": -27.39655876159668, "global_step": 525714, "epoch": 6333} {"train_loss": -27.3135986328125, "global_step": 525715, "epoch": 6333} {"train_loss": -27.915136337280273, "global_step": 525716, "epoch": 6333} {"train_loss": -27.744287490844727, "global_step": 525717, "epoch": 6333} {"train_loss": -27.44219398498535, "global_step": 525718, "epoch": 6333} {"train_loss": -27.308210372924805, "global_step": 525719, "epoch": 6333} {"train_loss": -27.501422882080078, "global_step": 525720, "epoch": 6333} {"train_loss": -27.152017179741918, "global_step": 525721, "epoch": 6333, "val_loss": 6577617.0} {"train_loss": -27.231054306030273, "global_step": 525722, "epoch": 6334} {"train_loss": -26.937437057495117, "global_step": 525723, "epoch": 6334} {"train_loss": -27.40542984008789, "global_step": 525724, "epoch": 6334} {"train_loss": -27.570880889892578, "global_step": 525725, "epoch": 6334} {"train_loss": -27.074066162109375, "global_step": 525726, "epoch": 6334} {"train_loss": -27.2075138092041, "global_step": 525727, "epoch": 6334} {"train_loss": -27.14166831970215, "global_step": 525728, "epoch": 6334} {"train_loss": -27.51059341430664, "global_step": 525729, "epoch": 6334} {"train_loss": -27.4620361328125, "global_step": 525730, "epoch": 6334} {"train_loss": -27.084287643432617, "global_step": 525731, "epoch": 6334} {"train_loss": -27.238122940063477, "global_step": 525732, "epoch": 6334} {"train_loss": -27.099313735961914, "global_step": 525733, "epoch": 6334} {"train_loss": -27.25016212463379, "global_step": 525734, "epoch": 6334} {"train_loss": -27.07721519470215, "global_step": 525735, "epoch": 6334} {"train_loss": -27.498910903930664, "global_step": 525736, "epoch": 6334} {"train_loss": -27.018142700195312, "global_step": 525737, "epoch": 6334} {"train_loss": -27.502395629882812, "global_step": 525738, "epoch": 6334} {"train_loss": -27.314279556274414, "global_step": 525739, "epoch": 6334} {"train_loss": -27.488798141479492, "global_step": 525740, "epoch": 6334} {"train_loss": -27.754587173461914, "global_step": 525741, "epoch": 6334} {"train_loss": -27.43047523498535, "global_step": 525742, "epoch": 6334} {"train_loss": -27.690780639648438, "global_step": 525743, "epoch": 6334} {"train_loss": -27.364770889282227, "global_step": 525744, "epoch": 6334} {"train_loss": -27.113698959350586, "global_step": 525745, "epoch": 6334} {"train_loss": -27.0180606842041, "global_step": 525746, "epoch": 6334} {"train_loss": -27.517841339111328, "global_step": 525747, "epoch": 6334} {"train_loss": -27.280109405517578, "global_step": 525748, "epoch": 6334} {"train_loss": -27.746246337890625, "global_step": 525749, "epoch": 6334} {"train_loss": -27.76458168029785, "global_step": 525750, "epoch": 6334} {"train_loss": -27.3537654876709, "global_step": 525751, "epoch": 6334} {"train_loss": -27.565933227539062, "global_step": 525752, "epoch": 6334} {"train_loss": -27.693695068359375, "global_step": 525753, "epoch": 6334} {"train_loss": -27.454288482666016, "global_step": 525754, "epoch": 6334} {"train_loss": -27.630102157592773, "global_step": 525755, "epoch": 6334} {"train_loss": -27.54762840270996, "global_step": 525756, "epoch": 6334} {"train_loss": -27.213703155517578, "global_step": 525757, "epoch": 6334} {"train_loss": -27.459613800048828, "global_step": 525758, "epoch": 6334} {"train_loss": -27.733747482299805, "global_step": 525759, "epoch": 6334} {"train_loss": -27.60135841369629, "global_step": 525760, "epoch": 6334} {"train_loss": -27.353458404541016, "global_step": 525761, "epoch": 6334} {"train_loss": -27.891218185424805, "global_step": 525762, "epoch": 6334} {"train_loss": -27.83974266052246, "global_step": 525763, "epoch": 6334} {"train_loss": -27.539169311523438, "global_step": 525764, "epoch": 6334} {"train_loss": -27.646076202392578, "global_step": 525765, "epoch": 6334} {"train_loss": -27.820514678955078, "global_step": 525766, "epoch": 6334} {"train_loss": -27.775720596313477, "global_step": 525767, "epoch": 6334} {"train_loss": -27.6346492767334, "global_step": 525768, "epoch": 6334} {"train_loss": -27.492704391479492, "global_step": 525769, "epoch": 6334} {"train_loss": -27.36052894592285, "global_step": 525770, "epoch": 6334} {"train_loss": -27.749465942382812, "global_step": 525771, "epoch": 6334} {"train_loss": -27.875455856323242, "global_step": 525772, "epoch": 6334} {"train_loss": -27.738962173461914, "global_step": 525773, "epoch": 6334} {"train_loss": -27.56561851501465, "global_step": 525774, "epoch": 6334} {"train_loss": -27.86518669128418, "global_step": 525775, "epoch": 6334} {"train_loss": -28.009735107421875, "global_step": 525776, "epoch": 6334} {"train_loss": -27.634199142456055, "global_step": 525777, "epoch": 6334} {"train_loss": -27.805438995361328, "global_step": 525778, "epoch": 6334} {"train_loss": -27.942794799804688, "global_step": 525779, "epoch": 6334} {"train_loss": -27.59794044494629, "global_step": 525780, "epoch": 6334} {"train_loss": -27.661352157592773, "global_step": 525781, "epoch": 6334} {"train_loss": -27.63263511657715, "global_step": 525782, "epoch": 6334} {"train_loss": -27.846099853515625, "global_step": 525783, "epoch": 6334} {"train_loss": -27.412084579467773, "global_step": 525784, "epoch": 6334} {"train_loss": -27.561365127563477, "global_step": 525785, "epoch": 6334} {"train_loss": -27.20537757873535, "global_step": 525786, "epoch": 6334} {"train_loss": -27.5550537109375, "global_step": 525787, "epoch": 6334} {"train_loss": -27.67926025390625, "global_step": 525788, "epoch": 6334} {"train_loss": -27.483259201049805, "global_step": 525789, "epoch": 6334} {"train_loss": -27.660322189331055, "global_step": 525790, "epoch": 6334} {"train_loss": -27.560382843017578, "global_step": 525791, "epoch": 6334} {"train_loss": -27.523700714111328, "global_step": 525792, "epoch": 6334} {"train_loss": -27.62457847595215, "global_step": 525793, "epoch": 6334} {"train_loss": -27.62809181213379, "global_step": 525794, "epoch": 6334} {"train_loss": -27.373153686523438, "global_step": 525795, "epoch": 6334} {"train_loss": -27.991596221923828, "global_step": 525796, "epoch": 6334} {"train_loss": -27.70951271057129, "global_step": 525797, "epoch": 6334} {"train_loss": -28.034732818603516, "global_step": 525798, "epoch": 6334} {"train_loss": -27.606733322143555, "global_step": 525799, "epoch": 6334} {"train_loss": -27.736480712890625, "global_step": 525800, "epoch": 6334} {"train_loss": -27.657852172851562, "global_step": 525801, "epoch": 6334} {"train_loss": -28.092405319213867, "global_step": 525802, "epoch": 6334} {"train_loss": -28.028793334960938, "global_step": 525803, "epoch": 6334} {"train_loss": -27.55037824791598, "global_step": 525804, "epoch": 6334, "val_loss": 6580901.0} {"train_loss": -27.59071922302246, "global_step": 525805, "epoch": 6335} {"train_loss": -27.448501586914062, "global_step": 525806, "epoch": 6335} {"train_loss": -27.745059967041016, "global_step": 525807, "epoch": 6335} {"train_loss": -27.18763542175293, "global_step": 525808, "epoch": 6335} {"train_loss": -27.535974502563477, "global_step": 525809, "epoch": 6335} {"train_loss": -27.180927276611328, "global_step": 525810, "epoch": 6335} {"train_loss": -27.395658493041992, "global_step": 525811, "epoch": 6335} {"train_loss": -27.020627975463867, "global_step": 525812, "epoch": 6335} {"train_loss": -27.450468063354492, "global_step": 525813, "epoch": 6335} {"train_loss": -27.53314781188965, "global_step": 525814, "epoch": 6335} {"train_loss": -27.564245223999023, "global_step": 525815, "epoch": 6335} {"train_loss": -27.31434440612793, "global_step": 525816, "epoch": 6335} {"train_loss": -27.49713134765625, "global_step": 525817, "epoch": 6335} {"train_loss": -27.32459831237793, "global_step": 525818, "epoch": 6335} {"train_loss": -27.545654296875, "global_step": 525819, "epoch": 6335} {"train_loss": -27.480207443237305, "global_step": 525820, "epoch": 6335} {"train_loss": -27.551166534423828, "global_step": 525821, "epoch": 6335} {"train_loss": -28.005859375, "global_step": 525822, "epoch": 6335} {"train_loss": -27.2860050201416, "global_step": 525823, "epoch": 6335} {"train_loss": -27.354101181030273, "global_step": 525824, "epoch": 6335} {"train_loss": -27.2475643157959, "global_step": 525825, "epoch": 6335} {"train_loss": -27.656835556030273, "global_step": 525826, "epoch": 6335} {"train_loss": -27.649511337280273, "global_step": 525827, "epoch": 6335} {"train_loss": -27.568586349487305, "global_step": 525828, "epoch": 6335} {"train_loss": -27.64422035217285, "global_step": 525829, "epoch": 6335} {"train_loss": -27.843769073486328, "global_step": 525830, "epoch": 6335} {"train_loss": -27.90777015686035, "global_step": 525831, "epoch": 6335} {"train_loss": -27.59248161315918, "global_step": 525832, "epoch": 6335} {"train_loss": -27.557453155517578, "global_step": 525833, "epoch": 6335} {"train_loss": -27.488088607788086, "global_step": 525834, "epoch": 6335} {"train_loss": -27.40289306640625, "global_step": 525835, "epoch": 6335} {"train_loss": -27.73406410217285, "global_step": 525836, "epoch": 6335} {"train_loss": -27.742450714111328, "global_step": 525837, "epoch": 6335} {"train_loss": -27.584020614624023, "global_step": 525838, "epoch": 6335} {"train_loss": -27.525964736938477, "global_step": 525839, "epoch": 6335} {"train_loss": -27.612455368041992, "global_step": 525840, "epoch": 6335} {"train_loss": -27.991254806518555, "global_step": 525841, "epoch": 6335} {"train_loss": -27.507831573486328, "global_step": 525842, "epoch": 6335} {"train_loss": -27.727863311767578, "global_step": 525843, "epoch": 6335} {"train_loss": -28.022241592407227, "global_step": 525844, "epoch": 6335} {"train_loss": -27.808210372924805, "global_step": 525845, "epoch": 6335} {"train_loss": -27.450063705444336, "global_step": 525846, "epoch": 6335} {"train_loss": -27.628204345703125, "global_step": 525847, "epoch": 6335} {"train_loss": -27.83320426940918, "global_step": 525848, "epoch": 6335} {"train_loss": -27.3585262298584, "global_step": 525849, "epoch": 6335} {"train_loss": -27.193037033081055, "global_step": 525850, "epoch": 6335} {"train_loss": -27.290973663330078, "global_step": 525851, "epoch": 6335} {"train_loss": -27.396345138549805, "global_step": 525852, "epoch": 6335} {"train_loss": -27.77117347717285, "global_step": 525853, "epoch": 6335} {"train_loss": -27.99545669555664, "global_step": 525854, "epoch": 6335} {"train_loss": -27.64609718322754, "global_step": 525855, "epoch": 6335} {"train_loss": -27.85576820373535, "global_step": 525856, "epoch": 6335} {"train_loss": -28.151458740234375, "global_step": 525857, "epoch": 6335} {"train_loss": -27.505887985229492, "global_step": 525858, "epoch": 6335} {"train_loss": -27.691131591796875, "global_step": 525859, "epoch": 6335} {"train_loss": -27.6773738861084, "global_step": 525860, "epoch": 6335} {"train_loss": -27.575061798095703, "global_step": 525861, "epoch": 6335} {"train_loss": -27.67437744140625, "global_step": 525862, "epoch": 6335} {"train_loss": -27.772235870361328, "global_step": 525863, "epoch": 6335} {"train_loss": -27.522388458251953, "global_step": 525864, "epoch": 6335} {"train_loss": -27.4732608795166, "global_step": 525865, "epoch": 6335} {"train_loss": -27.84250831604004, "global_step": 525866, "epoch": 6335} {"train_loss": -27.932729721069336, "global_step": 525867, "epoch": 6335} {"train_loss": -27.91655921936035, "global_step": 525868, "epoch": 6335} {"train_loss": -27.89413833618164, "global_step": 525869, "epoch": 6335} {"train_loss": -27.646207809448242, "global_step": 525870, "epoch": 6335} {"train_loss": -27.524267196655273, "global_step": 525871, "epoch": 6335} {"train_loss": -27.674036026000977, "global_step": 525872, "epoch": 6335} {"train_loss": -27.572751998901367, "global_step": 525873, "epoch": 6335} {"train_loss": -27.623327255249023, "global_step": 525874, "epoch": 6335} {"train_loss": -27.710935592651367, "global_step": 525875, "epoch": 6335} {"train_loss": -27.313398361206055, "global_step": 525876, "epoch": 6335} {"train_loss": -27.544336318969727, "global_step": 525877, "epoch": 6335} {"train_loss": -27.881067276000977, "global_step": 525878, "epoch": 6335} {"train_loss": -27.42693519592285, "global_step": 525879, "epoch": 6335} {"train_loss": -27.592252731323242, "global_step": 525880, "epoch": 6335} {"train_loss": -26.896392822265625, "global_step": 525881, "epoch": 6335} {"train_loss": -27.138629913330078, "global_step": 525882, "epoch": 6335} {"train_loss": -27.401611328125, "global_step": 525883, "epoch": 6335} {"train_loss": -27.567312240600586, "global_step": 525884, "epoch": 6335} {"train_loss": -27.63152503967285, "global_step": 525885, "epoch": 6335} {"train_loss": -27.608352661132812, "global_step": 525886, "epoch": 6335} {"train_loss": -27.586233184998292, "global_step": 525887, "epoch": 6335, "val_loss": 6595830.0} {"train_loss": -26.4658203125, "global_step": 525888, "epoch": 6336} {"train_loss": -26.86433219909668, "global_step": 525889, "epoch": 6336} {"train_loss": -26.856786727905273, "global_step": 525890, "epoch": 6336} {"train_loss": -26.5436954498291, "global_step": 525891, "epoch": 6336} {"train_loss": -26.354040145874023, "global_step": 525892, "epoch": 6336} {"train_loss": -26.683313369750977, "global_step": 525893, "epoch": 6336} {"train_loss": -26.73259925842285, "global_step": 525894, "epoch": 6336} {"train_loss": -26.067707061767578, "global_step": 525895, "epoch": 6336} {"train_loss": -27.103717803955078, "global_step": 525896, "epoch": 6336} {"train_loss": -26.915979385375977, "global_step": 525897, "epoch": 6336} {"train_loss": -26.78571128845215, "global_step": 525898, "epoch": 6336} {"train_loss": -26.749059677124023, "global_step": 525899, "epoch": 6336} {"train_loss": -26.695310592651367, "global_step": 525900, "epoch": 6336} {"train_loss": -27.14727210998535, "global_step": 525901, "epoch": 6336} {"train_loss": -27.5553035736084, "global_step": 525902, "epoch": 6336} {"train_loss": -26.66257667541504, "global_step": 525903, "epoch": 6336} {"train_loss": -27.286273956298828, "global_step": 525904, "epoch": 6336} {"train_loss": -27.422027587890625, "global_step": 525905, "epoch": 6336} {"train_loss": -26.99226951599121, "global_step": 525906, "epoch": 6336} {"train_loss": -27.19695472717285, "global_step": 525907, "epoch": 6336} {"train_loss": -27.345932006835938, "global_step": 525908, "epoch": 6336} {"train_loss": -27.334814071655273, "global_step": 525909, "epoch": 6336} {"train_loss": -27.474994659423828, "global_step": 525910, "epoch": 6336} {"train_loss": -27.50288200378418, "global_step": 525911, "epoch": 6336} {"train_loss": -27.27362060546875, "global_step": 525912, "epoch": 6336} {"train_loss": -27.213836669921875, "global_step": 525913, "epoch": 6336} {"train_loss": -27.169540405273438, "global_step": 525914, "epoch": 6336} {"train_loss": -27.586740493774414, "global_step": 525915, "epoch": 6336} {"train_loss": -27.744892120361328, "global_step": 525916, "epoch": 6336} {"train_loss": -27.03413200378418, "global_step": 525917, "epoch": 6336} {"train_loss": -27.578784942626953, "global_step": 525918, "epoch": 6336} {"train_loss": -27.4981632232666, "global_step": 525919, "epoch": 6336} {"train_loss": -27.305261611938477, "global_step": 525920, "epoch": 6336} {"train_loss": -27.8821964263916, "global_step": 525921, "epoch": 6336} {"train_loss": -27.69015884399414, "global_step": 525922, "epoch": 6336} {"train_loss": -27.414737701416016, "global_step": 525923, "epoch": 6336} {"train_loss": -27.598241806030273, "global_step": 525924, "epoch": 6336} {"train_loss": -27.20221519470215, "global_step": 525925, "epoch": 6336} {"train_loss": -27.450510025024414, "global_step": 525926, "epoch": 6336} {"train_loss": -27.514820098876953, "global_step": 525927, "epoch": 6336} {"train_loss": -27.336593627929688, "global_step": 525928, "epoch": 6336} {"train_loss": -27.31683349609375, "global_step": 525929, "epoch": 6336} {"train_loss": -27.482648849487305, "global_step": 525930, "epoch": 6336} {"train_loss": -27.415319442749023, "global_step": 525931, "epoch": 6336} {"train_loss": -27.13209342956543, "global_step": 525932, "epoch": 6336} {"train_loss": -27.375242233276367, "global_step": 525933, "epoch": 6336} {"train_loss": -27.6541805267334, "global_step": 525934, "epoch": 6336} {"train_loss": -27.870655059814453, "global_step": 525935, "epoch": 6336} {"train_loss": -27.662622451782227, "global_step": 525936, "epoch": 6336} {"train_loss": -27.41351318359375, "global_step": 525937, "epoch": 6336} {"train_loss": -27.894800186157227, "global_step": 525938, "epoch": 6336} {"train_loss": -27.73883056640625, "global_step": 525939, "epoch": 6336} {"train_loss": -27.3746337890625, "global_step": 525940, "epoch": 6336} {"train_loss": -27.78157615661621, "global_step": 525941, "epoch": 6336} {"train_loss": -27.58277702331543, "global_step": 525942, "epoch": 6336} {"train_loss": -27.7283992767334, "global_step": 525943, "epoch": 6336} {"train_loss": -27.299184799194336, "global_step": 525944, "epoch": 6336} {"train_loss": -27.81489372253418, "global_step": 525945, "epoch": 6336} {"train_loss": -28.030298233032227, "global_step": 525946, "epoch": 6336} {"train_loss": -27.74842643737793, "global_step": 525947, "epoch": 6336} {"train_loss": -27.634870529174805, "global_step": 525948, "epoch": 6336} {"train_loss": -27.3377628326416, "global_step": 525949, "epoch": 6336} {"train_loss": -27.25303077697754, "global_step": 525950, "epoch": 6336} {"train_loss": -27.504657745361328, "global_step": 525951, "epoch": 6336} {"train_loss": -28.09974479675293, "global_step": 525952, "epoch": 6336} {"train_loss": -27.457412719726562, "global_step": 525953, "epoch": 6336} {"train_loss": -27.883808135986328, "global_step": 525954, "epoch": 6336} {"train_loss": -27.68198585510254, "global_step": 525955, "epoch": 6336} {"train_loss": -27.90765953063965, "global_step": 525956, "epoch": 6336} {"train_loss": -27.41939353942871, "global_step": 525957, "epoch": 6336} {"train_loss": -27.4764347076416, "global_step": 525958, "epoch": 6336} {"train_loss": -27.336816787719727, "global_step": 525959, "epoch": 6336} {"train_loss": -27.633264541625977, "global_step": 525960, "epoch": 6336} {"train_loss": -27.59016227722168, "global_step": 525961, "epoch": 6336} {"train_loss": -27.576032638549805, "global_step": 525962, "epoch": 6336} {"train_loss": -27.985754013061523, "global_step": 525963, "epoch": 6336} {"train_loss": -27.590490341186523, "global_step": 525964, "epoch": 6336} {"train_loss": -27.728260040283203, "global_step": 525965, "epoch": 6336} {"train_loss": -27.75044822692871, "global_step": 525966, "epoch": 6336} {"train_loss": -27.69659423828125, "global_step": 525967, "epoch": 6336} {"train_loss": -27.584253311157227, "global_step": 525968, "epoch": 6336} {"train_loss": -27.6577205657959, "global_step": 525969, "epoch": 6336} {"train_loss": -27.39743710713214, "global_step": 525970, "epoch": 6336, "val_loss": 6619752.5} {"train_loss": -27.155548095703125, "global_step": 525971, "epoch": 6337} {"train_loss": -26.85747718811035, "global_step": 525972, "epoch": 6337} {"train_loss": -27.200592041015625, "global_step": 525973, "epoch": 6337} {"train_loss": -27.5023193359375, "global_step": 525974, "epoch": 6337} {"train_loss": -27.345874786376953, "global_step": 525975, "epoch": 6337} {"train_loss": -27.179889678955078, "global_step": 525976, "epoch": 6337} {"train_loss": -27.472858428955078, "global_step": 525977, "epoch": 6337} {"train_loss": -27.207788467407227, "global_step": 525978, "epoch": 6337} {"train_loss": -27.085840225219727, "global_step": 525979, "epoch": 6337} {"train_loss": -27.503881454467773, "global_step": 525980, "epoch": 6337} {"train_loss": -27.5497989654541, "global_step": 525981, "epoch": 6337} {"train_loss": -26.95346450805664, "global_step": 525982, "epoch": 6337} {"train_loss": -27.657684326171875, "global_step": 525983, "epoch": 6337} {"train_loss": -27.51373291015625, "global_step": 525984, "epoch": 6337} {"train_loss": -27.8458194732666, "global_step": 525985, "epoch": 6337} {"train_loss": -27.434967041015625, "global_step": 525986, "epoch": 6337} {"train_loss": -27.47309684753418, "global_step": 525987, "epoch": 6337} {"train_loss": -27.48325538635254, "global_step": 525988, "epoch": 6337} {"train_loss": -27.30946159362793, "global_step": 525989, "epoch": 6337} {"train_loss": -27.258441925048828, "global_step": 525990, "epoch": 6337} {"train_loss": -27.496671676635742, "global_step": 525991, "epoch": 6337} {"train_loss": -27.368356704711914, "global_step": 525992, "epoch": 6337} {"train_loss": -27.27030372619629, "global_step": 525993, "epoch": 6337} {"train_loss": -27.552743911743164, "global_step": 525994, "epoch": 6337} {"train_loss": -27.435529708862305, "global_step": 525995, "epoch": 6337} {"train_loss": -27.711645126342773, "global_step": 525996, "epoch": 6337} {"train_loss": -27.64082145690918, "global_step": 525997, "epoch": 6337} {"train_loss": -27.338781356811523, "global_step": 525998, "epoch": 6337} {"train_loss": -27.83563232421875, "global_step": 525999, "epoch": 6337} {"train_loss": -27.307098388671875, "global_step": 526000, "epoch": 6337} {"train_loss": -27.206884384155273, "global_step": 526001, "epoch": 6337} {"train_loss": -27.033498764038086, "global_step": 526002, "epoch": 6337} {"train_loss": -27.62923240661621, "global_step": 526003, "epoch": 6337} {"train_loss": -27.5241641998291, "global_step": 526004, "epoch": 6337} {"train_loss": -27.3411865234375, "global_step": 526005, "epoch": 6337} {"train_loss": -27.020898818969727, "global_step": 526006, "epoch": 6337} {"train_loss": -27.683685302734375, "global_step": 526007, "epoch": 6337} {"train_loss": -27.615720748901367, "global_step": 526008, "epoch": 6337} {"train_loss": -27.238813400268555, "global_step": 526009, "epoch": 6337} {"train_loss": -27.639678955078125, "global_step": 526010, "epoch": 6337} {"train_loss": -27.556875228881836, "global_step": 526011, "epoch": 6337} {"train_loss": -27.939741134643555, "global_step": 526012, "epoch": 6337} {"train_loss": -27.293954849243164, "global_step": 526013, "epoch": 6337} {"train_loss": -27.627593994140625, "global_step": 526014, "epoch": 6337} {"train_loss": -27.96042823791504, "global_step": 526015, "epoch": 6337} {"train_loss": -27.704858779907227, "global_step": 526016, "epoch": 6337} {"train_loss": -27.259042739868164, "global_step": 526017, "epoch": 6337} {"train_loss": -27.543060302734375, "global_step": 526018, "epoch": 6337} {"train_loss": -27.51081657409668, "global_step": 526019, "epoch": 6337} {"train_loss": -27.908971786499023, "global_step": 526020, "epoch": 6337} {"train_loss": -27.89276123046875, "global_step": 526021, "epoch": 6337} {"train_loss": -27.465051651000977, "global_step": 526022, "epoch": 6337} {"train_loss": -27.690351486206055, "global_step": 526023, "epoch": 6337} {"train_loss": -27.779315948486328, "global_step": 526024, "epoch": 6337} {"train_loss": -27.850488662719727, "global_step": 526025, "epoch": 6337} {"train_loss": -27.251483917236328, "global_step": 526026, "epoch": 6337} {"train_loss": -27.361753463745117, "global_step": 526027, "epoch": 6337} {"train_loss": -27.4262752532959, "global_step": 526028, "epoch": 6337} {"train_loss": -27.22025489807129, "global_step": 526029, "epoch": 6337} {"train_loss": -26.68588638305664, "global_step": 526030, "epoch": 6337} {"train_loss": -26.531982421875, "global_step": 526031, "epoch": 6337} {"train_loss": -27.1354923248291, "global_step": 526032, "epoch": 6337} {"train_loss": -27.5660400390625, "global_step": 526033, "epoch": 6337} {"train_loss": -27.390851974487305, "global_step": 526034, "epoch": 6337} {"train_loss": -27.267166137695312, "global_step": 526035, "epoch": 6337} {"train_loss": -27.568872451782227, "global_step": 526036, "epoch": 6337} {"train_loss": -27.616819381713867, "global_step": 526037, "epoch": 6337} {"train_loss": -27.64982032775879, "global_step": 526038, "epoch": 6337} {"train_loss": -27.706663131713867, "global_step": 526039, "epoch": 6337} {"train_loss": -27.423715591430664, "global_step": 526040, "epoch": 6337} {"train_loss": -27.628828048706055, "global_step": 526041, "epoch": 6337} {"train_loss": -27.45417594909668, "global_step": 526042, "epoch": 6337} {"train_loss": -27.33688735961914, "global_step": 526043, "epoch": 6337} {"train_loss": -27.6522216796875, "global_step": 526044, "epoch": 6337} {"train_loss": -27.664539337158203, "global_step": 526045, "epoch": 6337} {"train_loss": -27.705713272094727, "global_step": 526046, "epoch": 6337} {"train_loss": -27.63034439086914, "global_step": 526047, "epoch": 6337} {"train_loss": -27.766881942749023, "global_step": 526048, "epoch": 6337} {"train_loss": -27.776935577392578, "global_step": 526049, "epoch": 6337} {"train_loss": -28.080419540405273, "global_step": 526050, "epoch": 6337} {"train_loss": -27.92721939086914, "global_step": 526051, "epoch": 6337} {"train_loss": -27.403656005859375, "global_step": 526052, "epoch": 6337} {"train_loss": -27.44816906480904, "global_step": 526053, "epoch": 6337, "val_loss": 6580065.0} {"train_loss": -26.78217887878418, "global_step": 526054, "epoch": 6338} {"train_loss": -27.122913360595703, "global_step": 526055, "epoch": 6338} {"train_loss": -27.87208366394043, "global_step": 526056, "epoch": 6338} {"train_loss": -27.358112335205078, "global_step": 526057, "epoch": 6338} {"train_loss": -27.160947799682617, "global_step": 526058, "epoch": 6338} {"train_loss": -27.256818771362305, "global_step": 526059, "epoch": 6338} {"train_loss": -27.256366729736328, "global_step": 526060, "epoch": 6338} {"train_loss": -27.873579025268555, "global_step": 526061, "epoch": 6338} {"train_loss": -27.473257064819336, "global_step": 526062, "epoch": 6338} {"train_loss": -27.247772216796875, "global_step": 526063, "epoch": 6338} {"train_loss": -27.54530906677246, "global_step": 526064, "epoch": 6338} {"train_loss": -27.64084815979004, "global_step": 526065, "epoch": 6338} {"train_loss": -27.638647079467773, "global_step": 526066, "epoch": 6338} {"train_loss": -27.72420310974121, "global_step": 526067, "epoch": 6338} {"train_loss": -27.236474990844727, "global_step": 526068, "epoch": 6338} {"train_loss": -27.460168838500977, "global_step": 526069, "epoch": 6338} {"train_loss": -27.446699142456055, "global_step": 526070, "epoch": 6338} {"train_loss": -27.710514068603516, "global_step": 526071, "epoch": 6338} {"train_loss": -27.271215438842773, "global_step": 526072, "epoch": 6338} {"train_loss": -27.45244789123535, "global_step": 526073, "epoch": 6338} {"train_loss": -27.361387252807617, "global_step": 526074, "epoch": 6338} {"train_loss": -27.8543701171875, "global_step": 526075, "epoch": 6338} {"train_loss": -27.601428985595703, "global_step": 526076, "epoch": 6338} {"train_loss": -27.49639320373535, "global_step": 526077, "epoch": 6338} {"train_loss": -27.70619773864746, "global_step": 526078, "epoch": 6338} {"train_loss": -27.369199752807617, "global_step": 526079, "epoch": 6338} {"train_loss": -27.98187828063965, "global_step": 526080, "epoch": 6338} {"train_loss": -27.807104110717773, "global_step": 526081, "epoch": 6338} {"train_loss": -27.701995849609375, "global_step": 526082, "epoch": 6338} {"train_loss": -27.74769401550293, "global_step": 526083, "epoch": 6338} {"train_loss": -27.408971786499023, "global_step": 526084, "epoch": 6338} {"train_loss": -27.0439510345459, "global_step": 526085, "epoch": 6338} {"train_loss": -27.54795265197754, "global_step": 526086, "epoch": 6338} {"train_loss": -27.252960205078125, "global_step": 526087, "epoch": 6338} {"train_loss": -27.639196395874023, "global_step": 526088, "epoch": 6338} {"train_loss": -26.941730499267578, "global_step": 526089, "epoch": 6338} {"train_loss": -27.228540420532227, "global_step": 526090, "epoch": 6338} {"train_loss": -27.959369659423828, "global_step": 526091, "epoch": 6338} {"train_loss": -27.812665939331055, "global_step": 526092, "epoch": 6338} {"train_loss": -27.52374839782715, "global_step": 526093, "epoch": 6338} {"train_loss": -27.78767967224121, "global_step": 526094, "epoch": 6338} {"train_loss": -27.457138061523438, "global_step": 526095, "epoch": 6338} {"train_loss": -27.890899658203125, "global_step": 526096, "epoch": 6338} {"train_loss": -27.218341827392578, "global_step": 526097, "epoch": 6338} {"train_loss": -27.22344970703125, "global_step": 526098, "epoch": 6338} {"train_loss": -27.34147071838379, "global_step": 526099, "epoch": 6338} {"train_loss": -27.452054977416992, "global_step": 526100, "epoch": 6338} {"train_loss": -27.755096435546875, "global_step": 526101, "epoch": 6338} {"train_loss": -27.757932662963867, "global_step": 526102, "epoch": 6338} {"train_loss": -27.39002799987793, "global_step": 526103, "epoch": 6338} {"train_loss": -27.645902633666992, "global_step": 526104, "epoch": 6338} {"train_loss": -27.695362091064453, "global_step": 526105, "epoch": 6338} {"train_loss": -27.515445709228516, "global_step": 526106, "epoch": 6338} {"train_loss": -27.560047149658203, "global_step": 526107, "epoch": 6338} {"train_loss": -27.921695709228516, "global_step": 526108, "epoch": 6338} {"train_loss": -27.828948974609375, "global_step": 526109, "epoch": 6338} {"train_loss": -27.475122451782227, "global_step": 526110, "epoch": 6338} {"train_loss": -27.461278915405273, "global_step": 526111, "epoch": 6338} {"train_loss": -27.48347282409668, "global_step": 526112, "epoch": 6338} {"train_loss": -27.659292221069336, "global_step": 526113, "epoch": 6338} {"train_loss": -27.770971298217773, "global_step": 526114, "epoch": 6338} {"train_loss": -28.011859893798828, "global_step": 526115, "epoch": 6338} {"train_loss": -27.71552085876465, "global_step": 526116, "epoch": 6338} {"train_loss": -27.372594833374023, "global_step": 526117, "epoch": 6338} {"train_loss": -27.85115623474121, "global_step": 526118, "epoch": 6338} {"train_loss": -27.485828399658203, "global_step": 526119, "epoch": 6338} {"train_loss": -27.705198287963867, "global_step": 526120, "epoch": 6338} {"train_loss": -27.63103675842285, "global_step": 526121, "epoch": 6338} {"train_loss": -27.399267196655273, "global_step": 526122, "epoch": 6338} {"train_loss": -27.951406478881836, "global_step": 526123, "epoch": 6338} {"train_loss": -27.5400447845459, "global_step": 526124, "epoch": 6338} {"train_loss": -27.612060546875, "global_step": 526125, "epoch": 6338} {"train_loss": -27.980173110961914, "global_step": 526126, "epoch": 6338} {"train_loss": -27.94185447692871, "global_step": 526127, "epoch": 6338} {"train_loss": -27.6057186126709, "global_step": 526128, "epoch": 6338} {"train_loss": -28.08753776550293, "global_step": 526129, "epoch": 6338} {"train_loss": -27.365407943725586, "global_step": 526130, "epoch": 6338} {"train_loss": -27.6630916595459, "global_step": 526131, "epoch": 6338} {"train_loss": -27.724645614624023, "global_step": 526132, "epoch": 6338} {"train_loss": -27.7423038482666, "global_step": 526133, "epoch": 6338} {"train_loss": -27.677738189697266, "global_step": 526134, "epoch": 6338} {"train_loss": -27.599157333374023, "global_step": 526135, "epoch": 6338} {"train_loss": -27.563096678400616, "global_step": 526136, "epoch": 6338, "val_loss": 6563679.0} {"train_loss": -27.525177001953125, "global_step": 526137, "epoch": 6339} {"train_loss": -26.867151260375977, "global_step": 526138, "epoch": 6339} {"train_loss": -26.93979835510254, "global_step": 526139, "epoch": 6339} {"train_loss": -26.19532585144043, "global_step": 526140, "epoch": 6339} {"train_loss": -26.157312393188477, "global_step": 526141, "epoch": 6339} {"train_loss": -26.00336265563965, "global_step": 526142, "epoch": 6339} {"train_loss": -27.26711082458496, "global_step": 526143, "epoch": 6339} {"train_loss": -27.208784103393555, "global_step": 526144, "epoch": 6339} {"train_loss": -26.70735740661621, "global_step": 526145, "epoch": 6339} {"train_loss": -26.767578125, "global_step": 526146, "epoch": 6339} {"train_loss": -26.799591064453125, "global_step": 526147, "epoch": 6339} {"train_loss": -26.927066802978516, "global_step": 526148, "epoch": 6339} {"train_loss": -27.203125, "global_step": 526149, "epoch": 6339} {"train_loss": -26.656213760375977, "global_step": 526150, "epoch": 6339} {"train_loss": -27.28938102722168, "global_step": 526151, "epoch": 6339} {"train_loss": -26.91092300415039, "global_step": 526152, "epoch": 6339} {"train_loss": -27.110517501831055, "global_step": 526153, "epoch": 6339} {"train_loss": -27.52577018737793, "global_step": 526154, "epoch": 6339} {"train_loss": -27.125274658203125, "global_step": 526155, "epoch": 6339} {"train_loss": -26.97639274597168, "global_step": 526156, "epoch": 6339} {"train_loss": -27.64230728149414, "global_step": 526157, "epoch": 6339} {"train_loss": -26.19345474243164, "global_step": 526158, "epoch": 6339} {"train_loss": -27.316186904907227, "global_step": 526159, "epoch": 6339} {"train_loss": -26.947675704956055, "global_step": 526160, "epoch": 6339} {"train_loss": -27.060535430908203, "global_step": 526161, "epoch": 6339} {"train_loss": -27.062152862548828, "global_step": 526162, "epoch": 6339} {"train_loss": -27.344696044921875, "global_step": 526163, "epoch": 6339} {"train_loss": -27.261144638061523, "global_step": 526164, "epoch": 6339} {"train_loss": -27.40862464904785, "global_step": 526165, "epoch": 6339} {"train_loss": -27.49344825744629, "global_step": 526166, "epoch": 6339} {"train_loss": -27.43108558654785, "global_step": 526167, "epoch": 6339} {"train_loss": -27.373294830322266, "global_step": 526168, "epoch": 6339} {"train_loss": -27.407123565673828, "global_step": 526169, "epoch": 6339} {"train_loss": -27.451202392578125, "global_step": 526170, "epoch": 6339} {"train_loss": -27.931217193603516, "global_step": 526171, "epoch": 6339} {"train_loss": -27.32830810546875, "global_step": 526172, "epoch": 6339} {"train_loss": -27.573705673217773, "global_step": 526173, "epoch": 6339} {"train_loss": -27.81659507751465, "global_step": 526174, "epoch": 6339} {"train_loss": -27.753284454345703, "global_step": 526175, "epoch": 6339} {"train_loss": -27.82661247253418, "global_step": 526176, "epoch": 6339} {"train_loss": -27.68609619140625, "global_step": 526177, "epoch": 6339} {"train_loss": -27.883563995361328, "global_step": 526178, "epoch": 6339} {"train_loss": -27.674768447875977, "global_step": 526179, "epoch": 6339} {"train_loss": -27.348175048828125, "global_step": 526180, "epoch": 6339} {"train_loss": -27.736780166625977, "global_step": 526181, "epoch": 6339} {"train_loss": -27.333295822143555, "global_step": 526182, "epoch": 6339} {"train_loss": -27.830732345581055, "global_step": 526183, "epoch": 6339} {"train_loss": -27.819807052612305, "global_step": 526184, "epoch": 6339} {"train_loss": -27.493011474609375, "global_step": 526185, "epoch": 6339} {"train_loss": -27.883804321289062, "global_step": 526186, "epoch": 6339} {"train_loss": -27.776330947875977, "global_step": 526187, "epoch": 6339} {"train_loss": -27.891698837280273, "global_step": 526188, "epoch": 6339} {"train_loss": -27.702423095703125, "global_step": 526189, "epoch": 6339} {"train_loss": -27.859769821166992, "global_step": 526190, "epoch": 6339} {"train_loss": -27.961475372314453, "global_step": 526191, "epoch": 6339} {"train_loss": -27.917051315307617, "global_step": 526192, "epoch": 6339} {"train_loss": -27.793745040893555, "global_step": 526193, "epoch": 6339} {"train_loss": -27.541345596313477, "global_step": 526194, "epoch": 6339} {"train_loss": -27.666656494140625, "global_step": 526195, "epoch": 6339} {"train_loss": -27.91045570373535, "global_step": 526196, "epoch": 6339} {"train_loss": -27.58445167541504, "global_step": 526197, "epoch": 6339} {"train_loss": -27.8779296875, "global_step": 526198, "epoch": 6339} {"train_loss": -27.891016006469727, "global_step": 526199, "epoch": 6339} {"train_loss": -27.649173736572266, "global_step": 526200, "epoch": 6339} {"train_loss": -28.02996826171875, "global_step": 526201, "epoch": 6339} {"train_loss": -27.326623916625977, "global_step": 526202, "epoch": 6339} {"train_loss": -27.521060943603516, "global_step": 526203, "epoch": 6339} {"train_loss": -27.682758331298828, "global_step": 526204, "epoch": 6339} {"train_loss": -27.571542739868164, "global_step": 526205, "epoch": 6339} {"train_loss": -27.51798439025879, "global_step": 526206, "epoch": 6339} {"train_loss": -27.62299919128418, "global_step": 526207, "epoch": 6339} {"train_loss": -27.87928581237793, "global_step": 526208, "epoch": 6339} {"train_loss": -27.714895248413086, "global_step": 526209, "epoch": 6339} {"train_loss": -27.4858341217041, "global_step": 526210, "epoch": 6339} {"train_loss": -27.1396541595459, "global_step": 526211, "epoch": 6339} {"train_loss": -26.721410751342773, "global_step": 526212, "epoch": 6339} {"train_loss": -26.68963623046875, "global_step": 526213, "epoch": 6339} {"train_loss": -27.38246726989746, "global_step": 526214, "epoch": 6339} {"train_loss": -27.254154205322266, "global_step": 526215, "epoch": 6339} {"train_loss": -27.39954948425293, "global_step": 526216, "epoch": 6339} {"train_loss": -27.141218185424805, "global_step": 526217, "epoch": 6339} {"train_loss": -27.4921932220459, "global_step": 526218, "epoch": 6339} {"train_loss": -27.364685127534063, "global_step": 526219, "epoch": 6339, "val_loss": 6675418.0} {"train_loss": -26.910541534423828, "global_step": 526220, "epoch": 6340} {"train_loss": -25.861059188842773, "global_step": 526221, "epoch": 6340} {"train_loss": -27.54709243774414, "global_step": 526222, "epoch": 6340} {"train_loss": -26.472824096679688, "global_step": 526223, "epoch": 6340} {"train_loss": -26.805028915405273, "global_step": 526224, "epoch": 6340} {"train_loss": -26.758102416992188, "global_step": 526225, "epoch": 6340} {"train_loss": -26.987699508666992, "global_step": 526226, "epoch": 6340} {"train_loss": -26.3751220703125, "global_step": 526227, "epoch": 6340} {"train_loss": -27.068899154663086, "global_step": 526228, "epoch": 6340} {"train_loss": -27.072574615478516, "global_step": 526229, "epoch": 6340} {"train_loss": -26.907257080078125, "global_step": 526230, "epoch": 6340} {"train_loss": -26.816190719604492, "global_step": 526231, "epoch": 6340} {"train_loss": -27.1644344329834, "global_step": 526232, "epoch": 6340} {"train_loss": -26.894926071166992, "global_step": 526233, "epoch": 6340} {"train_loss": -26.87408447265625, "global_step": 526234, "epoch": 6340} {"train_loss": -27.4183349609375, "global_step": 526235, "epoch": 6340} {"train_loss": -27.028989791870117, "global_step": 526236, "epoch": 6340} {"train_loss": -27.41218376159668, "global_step": 526237, "epoch": 6340} {"train_loss": -27.101001739501953, "global_step": 526238, "epoch": 6340} {"train_loss": -26.944997787475586, "global_step": 526239, "epoch": 6340} {"train_loss": -27.449462890625, "global_step": 526240, "epoch": 6340} {"train_loss": -27.3175048828125, "global_step": 526241, "epoch": 6340} {"train_loss": -27.5079345703125, "global_step": 526242, "epoch": 6340} {"train_loss": -27.219562530517578, "global_step": 526243, "epoch": 6340} {"train_loss": -27.234542846679688, "global_step": 526244, "epoch": 6340} {"train_loss": -27.699426651000977, "global_step": 526245, "epoch": 6340} {"train_loss": -27.437936782836914, "global_step": 526246, "epoch": 6340} {"train_loss": -27.55437660217285, "global_step": 526247, "epoch": 6340} {"train_loss": -27.4135799407959, "global_step": 526248, "epoch": 6340} {"train_loss": -27.53608512878418, "global_step": 526249, "epoch": 6340} {"train_loss": -27.55377769470215, "global_step": 526250, "epoch": 6340} {"train_loss": -27.709918975830078, "global_step": 526251, "epoch": 6340} {"train_loss": -27.42095375061035, "global_step": 526252, "epoch": 6340} {"train_loss": -27.92616081237793, "global_step": 526253, "epoch": 6340} {"train_loss": -27.524744033813477, "global_step": 526254, "epoch": 6340} {"train_loss": -27.65801429748535, "global_step": 526255, "epoch": 6340} {"train_loss": -27.86371421813965, "global_step": 526256, "epoch": 6340} {"train_loss": -27.6473331451416, "global_step": 526257, "epoch": 6340} {"train_loss": -27.929168701171875, "global_step": 526258, "epoch": 6340} {"train_loss": -27.575580596923828, "global_step": 526259, "epoch": 6340} {"train_loss": -27.739530563354492, "global_step": 526260, "epoch": 6340} {"train_loss": -27.79517936706543, "global_step": 526261, "epoch": 6340} {"train_loss": -27.441701889038086, "global_step": 526262, "epoch": 6340} {"train_loss": -27.60393714904785, "global_step": 526263, "epoch": 6340} {"train_loss": -27.918121337890625, "global_step": 526264, "epoch": 6340} {"train_loss": -27.54754638671875, "global_step": 526265, "epoch": 6340} {"train_loss": -27.649866104125977, "global_step": 526266, "epoch": 6340} {"train_loss": -27.489301681518555, "global_step": 526267, "epoch": 6340} {"train_loss": -27.51630210876465, "global_step": 526268, "epoch": 6340} {"train_loss": -27.681665420532227, "global_step": 526269, "epoch": 6340} {"train_loss": -27.760644912719727, "global_step": 526270, "epoch": 6340} {"train_loss": -27.309097290039062, "global_step": 526271, "epoch": 6340} {"train_loss": -27.739593505859375, "global_step": 526272, "epoch": 6340} {"train_loss": -27.72698974609375, "global_step": 526273, "epoch": 6340} {"train_loss": -27.390106201171875, "global_step": 526274, "epoch": 6340} {"train_loss": -27.31483268737793, "global_step": 526275, "epoch": 6340} {"train_loss": -27.061548233032227, "global_step": 526276, "epoch": 6340} {"train_loss": -26.681537628173828, "global_step": 526277, "epoch": 6340} {"train_loss": -26.715717315673828, "global_step": 526278, "epoch": 6340} {"train_loss": -26.9117431640625, "global_step": 526279, "epoch": 6340} {"train_loss": -27.4307804107666, "global_step": 526280, "epoch": 6340} {"train_loss": -27.458297729492188, "global_step": 526281, "epoch": 6340} {"train_loss": -26.848241806030273, "global_step": 526282, "epoch": 6340} {"train_loss": -27.00043296813965, "global_step": 526283, "epoch": 6340} {"train_loss": -27.084814071655273, "global_step": 526284, "epoch": 6340} {"train_loss": -27.180713653564453, "global_step": 526285, "epoch": 6340} {"train_loss": -27.303647994995117, "global_step": 526286, "epoch": 6340} {"train_loss": -27.359731674194336, "global_step": 526287, "epoch": 6340} {"train_loss": -27.273834228515625, "global_step": 526288, "epoch": 6340} {"train_loss": -27.42117691040039, "global_step": 526289, "epoch": 6340} {"train_loss": -27.474628448486328, "global_step": 526290, "epoch": 6340} {"train_loss": -27.366397857666016, "global_step": 526291, "epoch": 6340} {"train_loss": -27.4704532623291, "global_step": 526292, "epoch": 6340} {"train_loss": -27.34847068786621, "global_step": 526293, "epoch": 6340} {"train_loss": -27.410430908203125, "global_step": 526294, "epoch": 6340} {"train_loss": -27.35988426208496, "global_step": 526295, "epoch": 6340} {"train_loss": -27.6052188873291, "global_step": 526296, "epoch": 6340} {"train_loss": -27.66594886779785, "global_step": 526297, "epoch": 6340} {"train_loss": -27.902297973632812, "global_step": 526298, "epoch": 6340} {"train_loss": -27.65421485900879, "global_step": 526299, "epoch": 6340} {"train_loss": -27.529144287109375, "global_step": 526300, "epoch": 6340} {"train_loss": -27.720251083374023, "global_step": 526301, "epoch": 6340} {"train_loss": -27.345830894378295, "global_step": 526302, "epoch": 6340, "val_loss": 6612246.0} {"train_loss": -27.134180068969727, "global_step": 526303, "epoch": 6341} {"train_loss": -27.480695724487305, "global_step": 526304, "epoch": 6341} {"train_loss": -27.552276611328125, "global_step": 526305, "epoch": 6341} {"train_loss": -27.2503719329834, "global_step": 526306, "epoch": 6341} {"train_loss": -27.68173599243164, "global_step": 526307, "epoch": 6341} {"train_loss": -27.597248077392578, "global_step": 526308, "epoch": 6341} {"train_loss": -28.0274658203125, "global_step": 526309, "epoch": 6341} {"train_loss": -27.81907081604004, "global_step": 526310, "epoch": 6341} {"train_loss": -27.2520751953125, "global_step": 526311, "epoch": 6341} {"train_loss": -27.819360733032227, "global_step": 526312, "epoch": 6341} {"train_loss": -27.64548683166504, "global_step": 526313, "epoch": 6341} {"train_loss": -27.62812614440918, "global_step": 526314, "epoch": 6341} {"train_loss": -27.689279556274414, "global_step": 526315, "epoch": 6341} {"train_loss": -27.6634578704834, "global_step": 526316, "epoch": 6341} {"train_loss": -27.063907623291016, "global_step": 526317, "epoch": 6341} {"train_loss": -27.707712173461914, "global_step": 526318, "epoch": 6341} {"train_loss": -27.61517333984375, "global_step": 526319, "epoch": 6341} {"train_loss": -27.284570693969727, "global_step": 526320, "epoch": 6341} {"train_loss": -27.4530029296875, "global_step": 526321, "epoch": 6341} {"train_loss": -27.485538482666016, "global_step": 526322, "epoch": 6341} {"train_loss": -27.99665641784668, "global_step": 526323, "epoch": 6341} {"train_loss": -27.3603572845459, "global_step": 526324, "epoch": 6341} {"train_loss": -27.595922470092773, "global_step": 526325, "epoch": 6341} {"train_loss": -27.669981002807617, "global_step": 526326, "epoch": 6341} {"train_loss": -27.655405044555664, "global_step": 526327, "epoch": 6341} {"train_loss": -27.92047691345215, "global_step": 526328, "epoch": 6341} {"train_loss": -27.586200714111328, "global_step": 526329, "epoch": 6341} {"train_loss": -27.879728317260742, "global_step": 526330, "epoch": 6341} {"train_loss": -27.579700469970703, "global_step": 526331, "epoch": 6341} {"train_loss": -27.538806915283203, "global_step": 526332, "epoch": 6341} {"train_loss": -27.5947208404541, "global_step": 526333, "epoch": 6341} {"train_loss": -27.91977310180664, "global_step": 526334, "epoch": 6341} {"train_loss": -27.687942504882812, "global_step": 526335, "epoch": 6341} {"train_loss": -27.31963539123535, "global_step": 526336, "epoch": 6341} {"train_loss": -27.263233184814453, "global_step": 526337, "epoch": 6341} {"train_loss": -26.50774574279785, "global_step": 526338, "epoch": 6341} {"train_loss": -24.550046920776367, "global_step": 526339, "epoch": 6341} {"train_loss": -24.282102584838867, "global_step": 526340, "epoch": 6341} {"train_loss": -26.68726921081543, "global_step": 526341, "epoch": 6341} {"train_loss": -27.03474235534668, "global_step": 526342, "epoch": 6341} {"train_loss": -27.36407470703125, "global_step": 526343, "epoch": 6341} {"train_loss": -27.28213882446289, "global_step": 526344, "epoch": 6341} {"train_loss": -27.02473258972168, "global_step": 526345, "epoch": 6341} {"train_loss": -27.404035568237305, "global_step": 526346, "epoch": 6341} {"train_loss": -27.24383544921875, "global_step": 526347, "epoch": 6341} {"train_loss": -27.388273239135742, "global_step": 526348, "epoch": 6341} {"train_loss": -27.10785484313965, "global_step": 526349, "epoch": 6341} {"train_loss": -27.479740142822266, "global_step": 526350, "epoch": 6341} {"train_loss": -26.993383407592773, "global_step": 526351, "epoch": 6341} {"train_loss": -27.271268844604492, "global_step": 526352, "epoch": 6341} {"train_loss": -27.600378036499023, "global_step": 526353, "epoch": 6341} {"train_loss": -26.91827964782715, "global_step": 526354, "epoch": 6341} {"train_loss": -27.253141403198242, "global_step": 526355, "epoch": 6341} {"train_loss": -27.470569610595703, "global_step": 526356, "epoch": 6341} {"train_loss": -27.812341690063477, "global_step": 526357, "epoch": 6341} {"train_loss": -27.289335250854492, "global_step": 526358, "epoch": 6341} {"train_loss": -27.48447036743164, "global_step": 526359, "epoch": 6341} {"train_loss": -27.38237953186035, "global_step": 526360, "epoch": 6341} {"train_loss": -27.5816650390625, "global_step": 526361, "epoch": 6341} {"train_loss": -27.458072662353516, "global_step": 526362, "epoch": 6341} {"train_loss": -27.344512939453125, "global_step": 526363, "epoch": 6341} {"train_loss": -27.49653434753418, "global_step": 526364, "epoch": 6341} {"train_loss": -27.631744384765625, "global_step": 526365, "epoch": 6341} {"train_loss": -27.48917007446289, "global_step": 526366, "epoch": 6341} {"train_loss": -27.566572189331055, "global_step": 526367, "epoch": 6341} {"train_loss": -27.385122299194336, "global_step": 526368, "epoch": 6341} {"train_loss": -27.32305908203125, "global_step": 526369, "epoch": 6341} {"train_loss": -26.93644142150879, "global_step": 526370, "epoch": 6341} {"train_loss": -27.415241241455078, "global_step": 526371, "epoch": 6341} {"train_loss": -27.069074630737305, "global_step": 526372, "epoch": 6341} {"train_loss": -27.468332290649414, "global_step": 526373, "epoch": 6341} {"train_loss": -27.741943359375, "global_step": 526374, "epoch": 6341} {"train_loss": -27.49663734436035, "global_step": 526375, "epoch": 6341} {"train_loss": -27.6036434173584, "global_step": 526376, "epoch": 6341} {"train_loss": -27.73419189453125, "global_step": 526377, "epoch": 6341} {"train_loss": -27.82954216003418, "global_step": 526378, "epoch": 6341} {"train_loss": -27.422138214111328, "global_step": 526379, "epoch": 6341} {"train_loss": -27.543109893798828, "global_step": 526380, "epoch": 6341} {"train_loss": -27.3104248046875, "global_step": 526381, "epoch": 6341} {"train_loss": -27.77311134338379, "global_step": 526382, "epoch": 6341} {"train_loss": -27.22638511657715, "global_step": 526383, "epoch": 6341} {"train_loss": -27.40182876586914, "global_step": 526384, "epoch": 6341} {"train_loss": -27.3736348669213, "global_step": 526385, "epoch": 6341, "val_loss": 6584364.0} {"train_loss": -27.111875534057617, "global_step": 526386, "epoch": 6342} {"train_loss": -26.26323890686035, "global_step": 526387, "epoch": 6342} {"train_loss": -26.154712677001953, "global_step": 526388, "epoch": 6342} {"train_loss": -26.905792236328125, "global_step": 526389, "epoch": 6342} {"train_loss": -27.14045524597168, "global_step": 526390, "epoch": 6342} {"train_loss": -26.739721298217773, "global_step": 526391, "epoch": 6342} {"train_loss": -27.0578556060791, "global_step": 526392, "epoch": 6342} {"train_loss": -26.631622314453125, "global_step": 526393, "epoch": 6342} {"train_loss": -26.7257080078125, "global_step": 526394, "epoch": 6342} {"train_loss": -26.8075008392334, "global_step": 526395, "epoch": 6342} {"train_loss": -27.28847312927246, "global_step": 526396, "epoch": 6342} {"train_loss": -27.400121688842773, "global_step": 526397, "epoch": 6342} {"train_loss": -27.42063331604004, "global_step": 526398, "epoch": 6342} {"train_loss": -26.980926513671875, "global_step": 526399, "epoch": 6342} {"train_loss": -27.26739501953125, "global_step": 526400, "epoch": 6342} {"train_loss": -27.2152042388916, "global_step": 526401, "epoch": 6342} {"train_loss": -27.43819236755371, "global_step": 526402, "epoch": 6342} {"train_loss": -27.751068115234375, "global_step": 526403, "epoch": 6342} {"train_loss": -27.225936889648438, "global_step": 526404, "epoch": 6342} {"train_loss": -27.37129020690918, "global_step": 526405, "epoch": 6342} {"train_loss": -27.5753116607666, "global_step": 526406, "epoch": 6342} {"train_loss": -27.403318405151367, "global_step": 526407, "epoch": 6342} {"train_loss": -27.28334617614746, "global_step": 526408, "epoch": 6342} {"train_loss": -27.814416885375977, "global_step": 526409, "epoch": 6342} {"train_loss": -27.272403717041016, "global_step": 526410, "epoch": 6342} {"train_loss": -27.32700538635254, "global_step": 526411, "epoch": 6342} {"train_loss": -27.368070602416992, "global_step": 526412, "epoch": 6342} {"train_loss": -27.840167999267578, "global_step": 526413, "epoch": 6342} {"train_loss": -27.4191837310791, "global_step": 526414, "epoch": 6342} {"train_loss": -27.274351119995117, "global_step": 526415, "epoch": 6342} {"train_loss": -27.40597915649414, "global_step": 526416, "epoch": 6342} {"train_loss": -27.373517990112305, "global_step": 526417, "epoch": 6342} {"train_loss": -27.572284698486328, "global_step": 526418, "epoch": 6342} {"train_loss": -27.862213134765625, "global_step": 526419, "epoch": 6342} {"train_loss": -27.704456329345703, "global_step": 526420, "epoch": 6342} {"train_loss": -27.312780380249023, "global_step": 526421, "epoch": 6342} {"train_loss": -27.44831657409668, "global_step": 526422, "epoch": 6342} {"train_loss": -27.579614639282227, "global_step": 526423, "epoch": 6342} {"train_loss": -27.85404396057129, "global_step": 526424, "epoch": 6342} {"train_loss": -27.520517349243164, "global_step": 526425, "epoch": 6342} {"train_loss": -27.5804386138916, "global_step": 526426, "epoch": 6342} {"train_loss": -27.3869686126709, "global_step": 526427, "epoch": 6342} {"train_loss": -27.893301010131836, "global_step": 526428, "epoch": 6342} {"train_loss": -27.408660888671875, "global_step": 526429, "epoch": 6342} {"train_loss": -27.880695343017578, "global_step": 526430, "epoch": 6342} {"train_loss": -27.7459659576416, "global_step": 526431, "epoch": 6342} {"train_loss": -27.750974655151367, "global_step": 526432, "epoch": 6342} {"train_loss": -27.780263900756836, "global_step": 526433, "epoch": 6342} {"train_loss": -27.67073631286621, "global_step": 526434, "epoch": 6342} {"train_loss": -27.591449737548828, "global_step": 526435, "epoch": 6342} {"train_loss": -27.52777099609375, "global_step": 526436, "epoch": 6342} {"train_loss": -27.365209579467773, "global_step": 526437, "epoch": 6342} {"train_loss": -28.240854263305664, "global_step": 526438, "epoch": 6342} {"train_loss": -27.798267364501953, "global_step": 526439, "epoch": 6342} {"train_loss": -27.65107536315918, "global_step": 526440, "epoch": 6342} {"train_loss": -27.54363441467285, "global_step": 526441, "epoch": 6342} {"train_loss": -28.032428741455078, "global_step": 526442, "epoch": 6342} {"train_loss": -27.37250328063965, "global_step": 526443, "epoch": 6342} {"train_loss": -27.937063217163086, "global_step": 526444, "epoch": 6342} {"train_loss": -27.33595085144043, "global_step": 526445, "epoch": 6342} {"train_loss": -27.580890655517578, "global_step": 526446, "epoch": 6342} {"train_loss": -27.266998291015625, "global_step": 526447, "epoch": 6342} {"train_loss": -27.737272262573242, "global_step": 526448, "epoch": 6342} {"train_loss": -27.673192977905273, "global_step": 526449, "epoch": 6342} {"train_loss": -27.21065330505371, "global_step": 526450, "epoch": 6342} {"train_loss": -27.47025489807129, "global_step": 526451, "epoch": 6342} {"train_loss": -27.21918296813965, "global_step": 526452, "epoch": 6342} {"train_loss": -27.529211044311523, "global_step": 526453, "epoch": 6342} {"train_loss": -27.46078872680664, "global_step": 526454, "epoch": 6342} {"train_loss": -27.148706436157227, "global_step": 526455, "epoch": 6342} {"train_loss": -27.810791015625, "global_step": 526456, "epoch": 6342} {"train_loss": -27.299945831298828, "global_step": 526457, "epoch": 6342} {"train_loss": -27.1994571685791, "global_step": 526458, "epoch": 6342} {"train_loss": -27.629684448242188, "global_step": 526459, "epoch": 6342} {"train_loss": -27.432764053344727, "global_step": 526460, "epoch": 6342} {"train_loss": -27.487548828125, "global_step": 526461, "epoch": 6342} {"train_loss": -27.580183029174805, "global_step": 526462, "epoch": 6342} {"train_loss": -27.433584213256836, "global_step": 526463, "epoch": 6342} {"train_loss": -27.42487907409668, "global_step": 526464, "epoch": 6342} {"train_loss": -27.112472534179688, "global_step": 526465, "epoch": 6342} {"train_loss": -27.622699737548828, "global_step": 526466, "epoch": 6342} {"train_loss": -27.76276969909668, "global_step": 526467, "epoch": 6342} {"train_loss": -27.41241427502, "global_step": 526468, "epoch": 6342, "val_loss": 6634109.0} {"train_loss": -26.236434936523438, "global_step": 526469, "epoch": 6343} {"train_loss": -26.853605270385742, "global_step": 526470, "epoch": 6343} {"train_loss": -27.15791893005371, "global_step": 526471, "epoch": 6343} {"train_loss": -26.646230697631836, "global_step": 526472, "epoch": 6343} {"train_loss": -26.890588760375977, "global_step": 526473, "epoch": 6343} {"train_loss": -26.94232749938965, "global_step": 526474, "epoch": 6343} {"train_loss": -27.34441566467285, "global_step": 526475, "epoch": 6343} {"train_loss": -26.869611740112305, "global_step": 526476, "epoch": 6343} {"train_loss": -26.946592330932617, "global_step": 526477, "epoch": 6343} {"train_loss": -27.299850463867188, "global_step": 526478, "epoch": 6343} {"train_loss": -27.2834529876709, "global_step": 526479, "epoch": 6343} {"train_loss": -27.35407066345215, "global_step": 526480, "epoch": 6343} {"train_loss": -27.19708824157715, "global_step": 526481, "epoch": 6343} {"train_loss": -27.555288314819336, "global_step": 526482, "epoch": 6343} {"train_loss": -27.359533309936523, "global_step": 526483, "epoch": 6343} {"train_loss": -27.45979118347168, "global_step": 526484, "epoch": 6343} {"train_loss": -27.89853286743164, "global_step": 526485, "epoch": 6343} {"train_loss": -27.30559730529785, "global_step": 526486, "epoch": 6343} {"train_loss": -27.389184951782227, "global_step": 526487, "epoch": 6343} {"train_loss": -27.620407104492188, "global_step": 526488, "epoch": 6343} {"train_loss": -27.37969970703125, "global_step": 526489, "epoch": 6343} {"train_loss": -27.346237182617188, "global_step": 526490, "epoch": 6343} {"train_loss": -27.135761260986328, "global_step": 526491, "epoch": 6343} {"train_loss": -27.485706329345703, "global_step": 526492, "epoch": 6343} {"train_loss": -27.960968017578125, "global_step": 526493, "epoch": 6343} {"train_loss": -27.445165634155273, "global_step": 526494, "epoch": 6343} {"train_loss": -27.456029891967773, "global_step": 526495, "epoch": 6343} {"train_loss": -27.167184829711914, "global_step": 526496, "epoch": 6343} {"train_loss": -27.099822998046875, "global_step": 526497, "epoch": 6343} {"train_loss": -27.457233428955078, "global_step": 526498, "epoch": 6343} {"train_loss": -27.359668731689453, "global_step": 526499, "epoch": 6343} {"train_loss": -27.348779678344727, "global_step": 526500, "epoch": 6343} {"train_loss": -27.84822654724121, "global_step": 526501, "epoch": 6343} {"train_loss": -27.41427993774414, "global_step": 526502, "epoch": 6343} {"train_loss": -27.55722999572754, "global_step": 526503, "epoch": 6343} {"train_loss": -27.613874435424805, "global_step": 526504, "epoch": 6343} {"train_loss": -27.757923126220703, "global_step": 526505, "epoch": 6343} {"train_loss": -27.693161010742188, "global_step": 526506, "epoch": 6343} {"train_loss": -27.91835594177246, "global_step": 526507, "epoch": 6343} {"train_loss": -27.410242080688477, "global_step": 526508, "epoch": 6343} {"train_loss": -27.521310806274414, "global_step": 526509, "epoch": 6343} {"train_loss": -27.360553741455078, "global_step": 526510, "epoch": 6343} {"train_loss": -27.84137535095215, "global_step": 526511, "epoch": 6343} {"train_loss": -28.011566162109375, "global_step": 526512, "epoch": 6343} {"train_loss": -27.602405548095703, "global_step": 526513, "epoch": 6343} {"train_loss": -27.431564331054688, "global_step": 526514, "epoch": 6343} {"train_loss": -27.433551788330078, "global_step": 526515, "epoch": 6343} {"train_loss": -27.574926376342773, "global_step": 526516, "epoch": 6343} {"train_loss": -27.78313636779785, "global_step": 526517, "epoch": 6343} {"train_loss": -27.416608810424805, "global_step": 526518, "epoch": 6343} {"train_loss": -27.8095760345459, "global_step": 526519, "epoch": 6343} {"train_loss": -27.870038986206055, "global_step": 526520, "epoch": 6343} {"train_loss": -27.556015014648438, "global_step": 526521, "epoch": 6343} {"train_loss": -27.226730346679688, "global_step": 526522, "epoch": 6343} {"train_loss": -27.594501495361328, "global_step": 526523, "epoch": 6343} {"train_loss": -27.824560165405273, "global_step": 526524, "epoch": 6343} {"train_loss": -27.998075485229492, "global_step": 526525, "epoch": 6343} {"train_loss": -27.4654598236084, "global_step": 526526, "epoch": 6343} {"train_loss": -27.70000648498535, "global_step": 526527, "epoch": 6343} {"train_loss": -27.577884674072266, "global_step": 526528, "epoch": 6343} {"train_loss": -27.944828033447266, "global_step": 526529, "epoch": 6343} {"train_loss": -27.298246383666992, "global_step": 526530, "epoch": 6343} {"train_loss": -27.640472412109375, "global_step": 526531, "epoch": 6343} {"train_loss": -27.488513946533203, "global_step": 526532, "epoch": 6343} {"train_loss": -27.755130767822266, "global_step": 526533, "epoch": 6343} {"train_loss": -27.549514770507812, "global_step": 526534, "epoch": 6343} {"train_loss": -27.720367431640625, "global_step": 526535, "epoch": 6343} {"train_loss": -27.704971313476562, "global_step": 526536, "epoch": 6343} {"train_loss": -27.932464599609375, "global_step": 526537, "epoch": 6343} {"train_loss": -28.132068634033203, "global_step": 526538, "epoch": 6343} {"train_loss": -27.73090934753418, "global_step": 526539, "epoch": 6343} {"train_loss": -27.809316635131836, "global_step": 526540, "epoch": 6343} {"train_loss": -27.75465202331543, "global_step": 526541, "epoch": 6343} {"train_loss": -28.17758560180664, "global_step": 526542, "epoch": 6343} {"train_loss": -27.759078979492188, "global_step": 526543, "epoch": 6343} {"train_loss": -27.321502685546875, "global_step": 526544, "epoch": 6343} {"train_loss": -27.465717315673828, "global_step": 526545, "epoch": 6343} {"train_loss": -27.606842041015625, "global_step": 526546, "epoch": 6343} {"train_loss": -27.79005241394043, "global_step": 526547, "epoch": 6343} {"train_loss": -27.701704025268555, "global_step": 526548, "epoch": 6343} {"train_loss": -27.41110610961914, "global_step": 526549, "epoch": 6343} {"train_loss": -27.6042537689209, "global_step": 526550, "epoch": 6343} {"train_loss": -27.523064027349633, "global_step": 526551, "epoch": 6343, "val_loss": 6636205.0} {"train_loss": -27.130910873413086, "global_step": 526552, "epoch": 6344} {"train_loss": -26.70381736755371, "global_step": 526553, "epoch": 6344} {"train_loss": -26.74623680114746, "global_step": 526554, "epoch": 6344} {"train_loss": -27.347570419311523, "global_step": 526555, "epoch": 6344} {"train_loss": -27.4930362701416, "global_step": 526556, "epoch": 6344} {"train_loss": -27.425827026367188, "global_step": 526557, "epoch": 6344} {"train_loss": -27.533618927001953, "global_step": 526558, "epoch": 6344} {"train_loss": -27.101654052734375, "global_step": 526559, "epoch": 6344} {"train_loss": -27.378259658813477, "global_step": 526560, "epoch": 6344} {"train_loss": -27.13837242126465, "global_step": 526561, "epoch": 6344} {"train_loss": -27.356781005859375, "global_step": 526562, "epoch": 6344} {"train_loss": -27.580280303955078, "global_step": 526563, "epoch": 6344} {"train_loss": -27.237707138061523, "global_step": 526564, "epoch": 6344} {"train_loss": -27.53005027770996, "global_step": 526565, "epoch": 6344} {"train_loss": -27.38747215270996, "global_step": 526566, "epoch": 6344} {"train_loss": -27.61237907409668, "global_step": 526567, "epoch": 6344} {"train_loss": -27.45844078063965, "global_step": 526568, "epoch": 6344} {"train_loss": -27.60517692565918, "global_step": 526569, "epoch": 6344} {"train_loss": -27.77988052368164, "global_step": 526570, "epoch": 6344} {"train_loss": -27.487945556640625, "global_step": 526571, "epoch": 6344} {"train_loss": -27.711872100830078, "global_step": 526572, "epoch": 6344} {"train_loss": -27.902612686157227, "global_step": 526573, "epoch": 6344} {"train_loss": -27.785932540893555, "global_step": 526574, "epoch": 6344} {"train_loss": -27.65643882751465, "global_step": 526575, "epoch": 6344} {"train_loss": -27.671634674072266, "global_step": 526576, "epoch": 6344} {"train_loss": -27.76534080505371, "global_step": 526577, "epoch": 6344} {"train_loss": -27.26283073425293, "global_step": 526578, "epoch": 6344} {"train_loss": -27.94443130493164, "global_step": 526579, "epoch": 6344} {"train_loss": -27.766592025756836, "global_step": 526580, "epoch": 6344} {"train_loss": -27.460067749023438, "global_step": 526581, "epoch": 6344} {"train_loss": -27.821029663085938, "global_step": 526582, "epoch": 6344} {"train_loss": -28.050800323486328, "global_step": 526583, "epoch": 6344} {"train_loss": -27.541400909423828, "global_step": 526584, "epoch": 6344} {"train_loss": -26.903217315673828, "global_step": 526585, "epoch": 6344} {"train_loss": -27.6143798828125, "global_step": 526586, "epoch": 6344} {"train_loss": -27.61431884765625, "global_step": 526587, "epoch": 6344} {"train_loss": -28.052831649780273, "global_step": 526588, "epoch": 6344} {"train_loss": -27.59412956237793, "global_step": 526589, "epoch": 6344} {"train_loss": -27.45131492614746, "global_step": 526590, "epoch": 6344} {"train_loss": -27.682373046875, "global_step": 526591, "epoch": 6344} {"train_loss": -27.409814834594727, "global_step": 526592, "epoch": 6344} {"train_loss": -28.023717880249023, "global_step": 526593, "epoch": 6344} {"train_loss": -27.938989639282227, "global_step": 526594, "epoch": 6344} {"train_loss": -27.69175148010254, "global_step": 526595, "epoch": 6344} {"train_loss": -27.478778839111328, "global_step": 526596, "epoch": 6344} {"train_loss": -27.816755294799805, "global_step": 526597, "epoch": 6344} {"train_loss": -27.61744499206543, "global_step": 526598, "epoch": 6344} {"train_loss": -27.82549476623535, "global_step": 526599, "epoch": 6344} {"train_loss": -27.733173370361328, "global_step": 526600, "epoch": 6344} {"train_loss": -27.5291748046875, "global_step": 526601, "epoch": 6344} {"train_loss": -27.834943771362305, "global_step": 526602, "epoch": 6344} {"train_loss": -27.596052169799805, "global_step": 526603, "epoch": 6344} {"train_loss": -27.7803897857666, "global_step": 526604, "epoch": 6344} {"train_loss": -27.74399757385254, "global_step": 526605, "epoch": 6344} {"train_loss": -26.41814613342285, "global_step": 526606, "epoch": 6344} {"train_loss": -24.17464828491211, "global_step": 526607, "epoch": 6344} {"train_loss": -20.409738540649414, "global_step": 526608, "epoch": 6344} {"train_loss": -24.482118606567383, "global_step": 526609, "epoch": 6344} {"train_loss": -26.858612060546875, "global_step": 526610, "epoch": 6344} {"train_loss": -25.468891143798828, "global_step": 526611, "epoch": 6344} {"train_loss": -25.66926383972168, "global_step": 526612, "epoch": 6344} {"train_loss": -25.734113693237305, "global_step": 526613, "epoch": 6344} {"train_loss": -26.234220504760742, "global_step": 526614, "epoch": 6344} {"train_loss": -25.985158920288086, "global_step": 526615, "epoch": 6344} {"train_loss": -26.738279342651367, "global_step": 526616, "epoch": 6344} {"train_loss": -26.624713897705078, "global_step": 526617, "epoch": 6344} {"train_loss": -26.711841583251953, "global_step": 526618, "epoch": 6344} {"train_loss": -26.379398345947266, "global_step": 526619, "epoch": 6344} {"train_loss": -26.329999923706055, "global_step": 526620, "epoch": 6344} {"train_loss": -26.786584854125977, "global_step": 526621, "epoch": 6344} {"train_loss": -26.679153442382812, "global_step": 526622, "epoch": 6344} {"train_loss": -27.07308006286621, "global_step": 526623, "epoch": 6344} {"train_loss": -26.837148666381836, "global_step": 526624, "epoch": 6344} {"train_loss": -26.90360450744629, "global_step": 526625, "epoch": 6344} {"train_loss": -27.01593017578125, "global_step": 526626, "epoch": 6344} {"train_loss": -27.1219482421875, "global_step": 526627, "epoch": 6344} {"train_loss": -27.062702178955078, "global_step": 526628, "epoch": 6344} {"train_loss": -26.721845626831055, "global_step": 526629, "epoch": 6344} {"train_loss": -27.059986114501953, "global_step": 526630, "epoch": 6344} {"train_loss": -27.269086837768555, "global_step": 526631, "epoch": 6344} {"train_loss": -26.84918785095215, "global_step": 526632, "epoch": 6344} {"train_loss": -27.232288360595703, "global_step": 526633, "epoch": 6344} {"train_loss": -27.100772742765496, "global_step": 526634, "epoch": 6344, "val_loss": 6571137.0} {"train_loss": -27.01999855041504, "global_step": 526635, "epoch": 6345} {"train_loss": -26.71282958984375, "global_step": 526636, "epoch": 6345} {"train_loss": -27.093738555908203, "global_step": 526637, "epoch": 6345} {"train_loss": -26.983814239501953, "global_step": 526638, "epoch": 6345} {"train_loss": -26.70263671875, "global_step": 526639, "epoch": 6345} {"train_loss": -26.708911895751953, "global_step": 526640, "epoch": 6345} {"train_loss": -26.83154296875, "global_step": 526641, "epoch": 6345} {"train_loss": -27.18606948852539, "global_step": 526642, "epoch": 6345} {"train_loss": -27.17291831970215, "global_step": 526643, "epoch": 6345} {"train_loss": -27.117334365844727, "global_step": 526644, "epoch": 6345} {"train_loss": -27.289718627929688, "global_step": 526645, "epoch": 6345} {"train_loss": -27.402664184570312, "global_step": 526646, "epoch": 6345} {"train_loss": -27.467514038085938, "global_step": 526647, "epoch": 6345} {"train_loss": -27.192096710205078, "global_step": 526648, "epoch": 6345} {"train_loss": -26.99397087097168, "global_step": 526649, "epoch": 6345} {"train_loss": -27.45808219909668, "global_step": 526650, "epoch": 6345} {"train_loss": -27.520004272460938, "global_step": 526651, "epoch": 6345} {"train_loss": -27.213485717773438, "global_step": 526652, "epoch": 6345} {"train_loss": -27.315998077392578, "global_step": 526653, "epoch": 6345} {"train_loss": -27.602832794189453, "global_step": 526654, "epoch": 6345} {"train_loss": -27.365558624267578, "global_step": 526655, "epoch": 6345} {"train_loss": -27.1178035736084, "global_step": 526656, "epoch": 6345} {"train_loss": -27.371173858642578, "global_step": 526657, "epoch": 6345} {"train_loss": -27.60133171081543, "global_step": 526658, "epoch": 6345} {"train_loss": -27.615036010742188, "global_step": 526659, "epoch": 6345} {"train_loss": -26.952972412109375, "global_step": 526660, "epoch": 6345} {"train_loss": -27.899023056030273, "global_step": 526661, "epoch": 6345} {"train_loss": -27.046125411987305, "global_step": 526662, "epoch": 6345} {"train_loss": -27.33820915222168, "global_step": 526663, "epoch": 6345} {"train_loss": -27.6853084564209, "global_step": 526664, "epoch": 6345} {"train_loss": -27.76368522644043, "global_step": 526665, "epoch": 6345} {"train_loss": -27.437108993530273, "global_step": 526666, "epoch": 6345} {"train_loss": -27.14765739440918, "global_step": 526667, "epoch": 6345} {"train_loss": -27.65622329711914, "global_step": 526668, "epoch": 6345} {"train_loss": -27.398014068603516, "global_step": 526669, "epoch": 6345} {"train_loss": -27.568561553955078, "global_step": 526670, "epoch": 6345} {"train_loss": -27.885639190673828, "global_step": 526671, "epoch": 6345} {"train_loss": -27.396625518798828, "global_step": 526672, "epoch": 6345} {"train_loss": -27.73028564453125, "global_step": 526673, "epoch": 6345} {"train_loss": -27.88471794128418, "global_step": 526674, "epoch": 6345} {"train_loss": -27.409467697143555, "global_step": 526675, "epoch": 6345} {"train_loss": -27.701740264892578, "global_step": 526676, "epoch": 6345} {"train_loss": -27.31315040588379, "global_step": 526677, "epoch": 6345} {"train_loss": -27.375898361206055, "global_step": 526678, "epoch": 6345} {"train_loss": -27.79799461364746, "global_step": 526679, "epoch": 6345} {"train_loss": -27.731958389282227, "global_step": 526680, "epoch": 6345} {"train_loss": -27.577428817749023, "global_step": 526681, "epoch": 6345} {"train_loss": -27.908710479736328, "global_step": 526682, "epoch": 6345} {"train_loss": -27.921112060546875, "global_step": 526683, "epoch": 6345} {"train_loss": -27.46819496154785, "global_step": 526684, "epoch": 6345} {"train_loss": -27.099151611328125, "global_step": 526685, "epoch": 6345} {"train_loss": -27.6192626953125, "global_step": 526686, "epoch": 6345} {"train_loss": -27.72145652770996, "global_step": 526687, "epoch": 6345} {"train_loss": -27.9399356842041, "global_step": 526688, "epoch": 6345} {"train_loss": -27.856292724609375, "global_step": 526689, "epoch": 6345} {"train_loss": -27.40363121032715, "global_step": 526690, "epoch": 6345} {"train_loss": -27.268381118774414, "global_step": 526691, "epoch": 6345} {"train_loss": -27.361326217651367, "global_step": 526692, "epoch": 6345} {"train_loss": -27.695148468017578, "global_step": 526693, "epoch": 6345} {"train_loss": -27.6430721282959, "global_step": 526694, "epoch": 6345} {"train_loss": -27.323633193969727, "global_step": 526695, "epoch": 6345} {"train_loss": -27.83558464050293, "global_step": 526696, "epoch": 6345} {"train_loss": -27.882089614868164, "global_step": 526697, "epoch": 6345} {"train_loss": -27.42176628112793, "global_step": 526698, "epoch": 6345} {"train_loss": -27.78834342956543, "global_step": 526699, "epoch": 6345} {"train_loss": -27.53791618347168, "global_step": 526700, "epoch": 6345} {"train_loss": -27.335485458374023, "global_step": 526701, "epoch": 6345} {"train_loss": -27.794116973876953, "global_step": 526702, "epoch": 6345} {"train_loss": -27.704853057861328, "global_step": 526703, "epoch": 6345} {"train_loss": -27.89594841003418, "global_step": 526704, "epoch": 6345} {"train_loss": -28.03687858581543, "global_step": 526705, "epoch": 6345} {"train_loss": -27.156896591186523, "global_step": 526706, "epoch": 6345} {"train_loss": -27.75762939453125, "global_step": 526707, "epoch": 6345} {"train_loss": -27.3719539642334, "global_step": 526708, "epoch": 6345} {"train_loss": -27.78828239440918, "global_step": 526709, "epoch": 6345} {"train_loss": -27.367467880249023, "global_step": 526710, "epoch": 6345} {"train_loss": -27.6522274017334, "global_step": 526711, "epoch": 6345} {"train_loss": -27.458051681518555, "global_step": 526712, "epoch": 6345} {"train_loss": -27.38423728942871, "global_step": 526713, "epoch": 6345} {"train_loss": -27.23431968688965, "global_step": 526714, "epoch": 6345} {"train_loss": -27.59043312072754, "global_step": 526715, "epoch": 6345} {"train_loss": -27.66360855102539, "global_step": 526716, "epoch": 6345} {"train_loss": -27.45103937172028, "global_step": 526717, "epoch": 6345, "val_loss": 6547772.0} {"train_loss": -26.120346069335938, "global_step": 526718, "epoch": 6346} {"train_loss": -25.64032554626465, "global_step": 526719, "epoch": 6346} {"train_loss": -26.582300186157227, "global_step": 526720, "epoch": 6346} {"train_loss": -26.261274337768555, "global_step": 526721, "epoch": 6346} {"train_loss": -26.573755264282227, "global_step": 526722, "epoch": 6346} {"train_loss": -26.615299224853516, "global_step": 526723, "epoch": 6346} {"train_loss": -26.185791015625, "global_step": 526724, "epoch": 6346} {"train_loss": -26.92669105529785, "global_step": 526725, "epoch": 6346} {"train_loss": -26.616424560546875, "global_step": 526726, "epoch": 6346} {"train_loss": -26.203144073486328, "global_step": 526727, "epoch": 6346} {"train_loss": -26.660459518432617, "global_step": 526728, "epoch": 6346} {"train_loss": -27.048181533813477, "global_step": 526729, "epoch": 6346} {"train_loss": -26.54961585998535, "global_step": 526730, "epoch": 6346} {"train_loss": -26.83601188659668, "global_step": 526731, "epoch": 6346} {"train_loss": -27.031808853149414, "global_step": 526732, "epoch": 6346} {"train_loss": -26.968347549438477, "global_step": 526733, "epoch": 6346} {"train_loss": -26.8796329498291, "global_step": 526734, "epoch": 6346} {"train_loss": -26.870574951171875, "global_step": 526735, "epoch": 6346} {"train_loss": -27.221887588500977, "global_step": 526736, "epoch": 6346} {"train_loss": -27.020063400268555, "global_step": 526737, "epoch": 6346} {"train_loss": -26.898893356323242, "global_step": 526738, "epoch": 6346} {"train_loss": -27.2720890045166, "global_step": 526739, "epoch": 6346} {"train_loss": -27.499073028564453, "global_step": 526740, "epoch": 6346} {"train_loss": -26.957754135131836, "global_step": 526741, "epoch": 6346} {"train_loss": -27.14617347717285, "global_step": 526742, "epoch": 6346} {"train_loss": -27.584278106689453, "global_step": 526743, "epoch": 6346} {"train_loss": -27.385726928710938, "global_step": 526744, "epoch": 6346} {"train_loss": -27.7969913482666, "global_step": 526745, "epoch": 6346} {"train_loss": -27.370935440063477, "global_step": 526746, "epoch": 6346} {"train_loss": -27.631031036376953, "global_step": 526747, "epoch": 6346} {"train_loss": -27.594030380249023, "global_step": 526748, "epoch": 6346} {"train_loss": -27.6220645904541, "global_step": 526749, "epoch": 6346} {"train_loss": -27.417877197265625, "global_step": 526750, "epoch": 6346} {"train_loss": -27.34151268005371, "global_step": 526751, "epoch": 6346} {"train_loss": -27.4045352935791, "global_step": 526752, "epoch": 6346} {"train_loss": -27.362369537353516, "global_step": 526753, "epoch": 6346} {"train_loss": -27.4787654876709, "global_step": 526754, "epoch": 6346} {"train_loss": -27.70159339904785, "global_step": 526755, "epoch": 6346} {"train_loss": -27.343420028686523, "global_step": 526756, "epoch": 6346} {"train_loss": -27.422170639038086, "global_step": 526757, "epoch": 6346} {"train_loss": -27.734647750854492, "global_step": 526758, "epoch": 6346} {"train_loss": -27.5580997467041, "global_step": 526759, "epoch": 6346} {"train_loss": -27.665912628173828, "global_step": 526760, "epoch": 6346} {"train_loss": -27.81772804260254, "global_step": 526761, "epoch": 6346} {"train_loss": -27.352941513061523, "global_step": 526762, "epoch": 6346} {"train_loss": -27.720483779907227, "global_step": 526763, "epoch": 6346} {"train_loss": -27.378265380859375, "global_step": 526764, "epoch": 6346} {"train_loss": -27.838476181030273, "global_step": 526765, "epoch": 6346} {"train_loss": -27.472333908081055, "global_step": 526766, "epoch": 6346} {"train_loss": -27.77764892578125, "global_step": 526767, "epoch": 6346} {"train_loss": -27.66608238220215, "global_step": 526768, "epoch": 6346} {"train_loss": -27.5821475982666, "global_step": 526769, "epoch": 6346} {"train_loss": -27.88189697265625, "global_step": 526770, "epoch": 6346} {"train_loss": -27.62314796447754, "global_step": 526771, "epoch": 6346} {"train_loss": -27.60591697692871, "global_step": 526772, "epoch": 6346} {"train_loss": -27.70865821838379, "global_step": 526773, "epoch": 6346} {"train_loss": -27.72134780883789, "global_step": 526774, "epoch": 6346} {"train_loss": -27.734487533569336, "global_step": 526775, "epoch": 6346} {"train_loss": -27.579504013061523, "global_step": 526776, "epoch": 6346} {"train_loss": -27.977598190307617, "global_step": 526777, "epoch": 6346} {"train_loss": -27.5291748046875, "global_step": 526778, "epoch": 6346} {"train_loss": -27.199115753173828, "global_step": 526779, "epoch": 6346} {"train_loss": -27.097326278686523, "global_step": 526780, "epoch": 6346} {"train_loss": -27.614572525024414, "global_step": 526781, "epoch": 6346} {"train_loss": -27.703290939331055, "global_step": 526782, "epoch": 6346} {"train_loss": -27.182382583618164, "global_step": 526783, "epoch": 6346} {"train_loss": -27.32709312438965, "global_step": 526784, "epoch": 6346} {"train_loss": -27.545080184936523, "global_step": 526785, "epoch": 6346} {"train_loss": -27.854114532470703, "global_step": 526786, "epoch": 6346} {"train_loss": -27.782129287719727, "global_step": 526787, "epoch": 6346} {"train_loss": -27.673192977905273, "global_step": 526788, "epoch": 6346} {"train_loss": -27.75595474243164, "global_step": 526789, "epoch": 6346} {"train_loss": -27.955093383789062, "global_step": 526790, "epoch": 6346} {"train_loss": -27.589391708374023, "global_step": 526791, "epoch": 6346} {"train_loss": -27.70672607421875, "global_step": 526792, "epoch": 6346} {"train_loss": -27.602771759033203, "global_step": 526793, "epoch": 6346} {"train_loss": -27.946643829345703, "global_step": 526794, "epoch": 6346} {"train_loss": -27.80010986328125, "global_step": 526795, "epoch": 6346} {"train_loss": -27.85500144958496, "global_step": 526796, "epoch": 6346} {"train_loss": -27.497278213500977, "global_step": 526797, "epoch": 6346} {"train_loss": -27.613996505737305, "global_step": 526798, "epoch": 6346} {"train_loss": -27.597761154174805, "global_step": 526799, "epoch": 6346} {"train_loss": -27.343003169599786, "global_step": 526800, "epoch": 6346, "val_loss": 6767896.0} {"train_loss": -27.178857803344727, "global_step": 526801, "epoch": 6347} {"train_loss": -27.037628173828125, "global_step": 526802, "epoch": 6347} {"train_loss": -26.662260055541992, "global_step": 526803, "epoch": 6347} {"train_loss": -27.035385131835938, "global_step": 526804, "epoch": 6347} {"train_loss": -26.7572078704834, "global_step": 526805, "epoch": 6347} {"train_loss": -27.533477783203125, "global_step": 526806, "epoch": 6347} {"train_loss": -27.364444732666016, "global_step": 526807, "epoch": 6347} {"train_loss": -27.245893478393555, "global_step": 526808, "epoch": 6347} {"train_loss": -27.260156631469727, "global_step": 526809, "epoch": 6347} {"train_loss": -27.231719970703125, "global_step": 526810, "epoch": 6347} {"train_loss": -27.378021240234375, "global_step": 526811, "epoch": 6347} {"train_loss": -27.592844009399414, "global_step": 526812, "epoch": 6347} {"train_loss": -27.373859405517578, "global_step": 526813, "epoch": 6347} {"train_loss": -27.166431427001953, "global_step": 526814, "epoch": 6347} {"train_loss": -27.597105026245117, "global_step": 526815, "epoch": 6347} {"train_loss": -27.42254066467285, "global_step": 526816, "epoch": 6347} {"train_loss": -27.44189453125, "global_step": 526817, "epoch": 6347} {"train_loss": -27.10259437561035, "global_step": 526818, "epoch": 6347} {"train_loss": -27.68414878845215, "global_step": 526819, "epoch": 6347} {"train_loss": -27.726972579956055, "global_step": 526820, "epoch": 6347} {"train_loss": -27.2574405670166, "global_step": 526821, "epoch": 6347} {"train_loss": -27.66745948791504, "global_step": 526822, "epoch": 6347} {"train_loss": -27.414657592773438, "global_step": 526823, "epoch": 6347} {"train_loss": -27.533700942993164, "global_step": 526824, "epoch": 6347} {"train_loss": -27.683542251586914, "global_step": 526825, "epoch": 6347} {"train_loss": -27.393396377563477, "global_step": 526826, "epoch": 6347} {"train_loss": -27.652667999267578, "global_step": 526827, "epoch": 6347} {"train_loss": -27.60511589050293, "global_step": 526828, "epoch": 6347} {"train_loss": -27.407636642456055, "global_step": 526829, "epoch": 6347} {"train_loss": -27.66815185546875, "global_step": 526830, "epoch": 6347} {"train_loss": -27.78533935546875, "global_step": 526831, "epoch": 6347} {"train_loss": -27.66289710998535, "global_step": 526832, "epoch": 6347} {"train_loss": -27.755268096923828, "global_step": 526833, "epoch": 6347} {"train_loss": -27.51649284362793, "global_step": 526834, "epoch": 6347} {"train_loss": -27.961057662963867, "global_step": 526835, "epoch": 6347} {"train_loss": -27.760940551757812, "global_step": 526836, "epoch": 6347} {"train_loss": -27.981977462768555, "global_step": 526837, "epoch": 6347} {"train_loss": -27.59901237487793, "global_step": 526838, "epoch": 6347} {"train_loss": -27.554035186767578, "global_step": 526839, "epoch": 6347} {"train_loss": -27.7509708404541, "global_step": 526840, "epoch": 6347} {"train_loss": -27.813140869140625, "global_step": 526841, "epoch": 6347} {"train_loss": -27.400522232055664, "global_step": 526842, "epoch": 6347} {"train_loss": -27.69282341003418, "global_step": 526843, "epoch": 6347} {"train_loss": -27.628936767578125, "global_step": 526844, "epoch": 6347} {"train_loss": -27.63837242126465, "global_step": 526845, "epoch": 6347} {"train_loss": -27.687917709350586, "global_step": 526846, "epoch": 6347} {"train_loss": -27.854833602905273, "global_step": 526847, "epoch": 6347} {"train_loss": -27.69156265258789, "global_step": 526848, "epoch": 6347} {"train_loss": -27.463281631469727, "global_step": 526849, "epoch": 6347} {"train_loss": -27.498830795288086, "global_step": 526850, "epoch": 6347} {"train_loss": -27.433897018432617, "global_step": 526851, "epoch": 6347} {"train_loss": -26.92523765563965, "global_step": 526852, "epoch": 6347} {"train_loss": -26.844995498657227, "global_step": 526853, "epoch": 6347} {"train_loss": -27.289752960205078, "global_step": 526854, "epoch": 6347} {"train_loss": -27.357742309570312, "global_step": 526855, "epoch": 6347} {"train_loss": -27.01902198791504, "global_step": 526856, "epoch": 6347} {"train_loss": -27.351490020751953, "global_step": 526857, "epoch": 6347} {"train_loss": -27.254810333251953, "global_step": 526858, "epoch": 6347} {"train_loss": -26.990482330322266, "global_step": 526859, "epoch": 6347} {"train_loss": -27.174802780151367, "global_step": 526860, "epoch": 6347} {"train_loss": -27.136533737182617, "global_step": 526861, "epoch": 6347} {"train_loss": -27.07659339904785, "global_step": 526862, "epoch": 6347} {"train_loss": -27.035110473632812, "global_step": 526863, "epoch": 6347} {"train_loss": -27.54779052734375, "global_step": 526864, "epoch": 6347} {"train_loss": -27.079877853393555, "global_step": 526865, "epoch": 6347} {"train_loss": -27.304304122924805, "global_step": 526866, "epoch": 6347} {"train_loss": -27.36067771911621, "global_step": 526867, "epoch": 6347} {"train_loss": -27.2858829498291, "global_step": 526868, "epoch": 6347} {"train_loss": -27.165678024291992, "global_step": 526869, "epoch": 6347} {"train_loss": -27.2783203125, "global_step": 526870, "epoch": 6347} {"train_loss": -27.362964630126953, "global_step": 526871, "epoch": 6347} {"train_loss": -27.11033058166504, "global_step": 526872, "epoch": 6347} {"train_loss": -27.398456573486328, "global_step": 526873, "epoch": 6347} {"train_loss": -27.336393356323242, "global_step": 526874, "epoch": 6347} {"train_loss": -27.4057674407959, "global_step": 526875, "epoch": 6347} {"train_loss": -27.600650787353516, "global_step": 526876, "epoch": 6347} {"train_loss": -27.454267501831055, "global_step": 526877, "epoch": 6347} {"train_loss": -27.8501033782959, "global_step": 526878, "epoch": 6347} {"train_loss": -27.101171493530273, "global_step": 526879, "epoch": 6347} {"train_loss": -27.834247589111328, "global_step": 526880, "epoch": 6347} {"train_loss": -27.52849769592285, "global_step": 526881, "epoch": 6347} {"train_loss": -27.76417350769043, "global_step": 526882, "epoch": 6347} {"train_loss": -27.430750697492115, "global_step": 526883, "epoch": 6347, "val_loss": 6679352.0} {"train_loss": -26.21320915222168, "global_step": 526884, "epoch": 6348} {"train_loss": -26.43472671508789, "global_step": 526885, "epoch": 6348} {"train_loss": -27.50252342224121, "global_step": 526886, "epoch": 6348} {"train_loss": -27.10794448852539, "global_step": 526887, "epoch": 6348} {"train_loss": -26.4713077545166, "global_step": 526888, "epoch": 6348} {"train_loss": -26.80560874938965, "global_step": 526889, "epoch": 6348} {"train_loss": -27.032007217407227, "global_step": 526890, "epoch": 6348} {"train_loss": -26.888975143432617, "global_step": 526891, "epoch": 6348} {"train_loss": -27.10249137878418, "global_step": 526892, "epoch": 6348} {"train_loss": -26.91924476623535, "global_step": 526893, "epoch": 6348} {"train_loss": -27.293689727783203, "global_step": 526894, "epoch": 6348} {"train_loss": -26.940662384033203, "global_step": 526895, "epoch": 6348} {"train_loss": -27.695728302001953, "global_step": 526896, "epoch": 6348} {"train_loss": -27.148115158081055, "global_step": 526897, "epoch": 6348} {"train_loss": -27.574865341186523, "global_step": 526898, "epoch": 6348} {"train_loss": -27.467756271362305, "global_step": 526899, "epoch": 6348} {"train_loss": -27.538476943969727, "global_step": 526900, "epoch": 6348} {"train_loss": -27.44108009338379, "global_step": 526901, "epoch": 6348} {"train_loss": -27.63569450378418, "global_step": 526902, "epoch": 6348} {"train_loss": -27.31898307800293, "global_step": 526903, "epoch": 6348} {"train_loss": -27.588796615600586, "global_step": 526904, "epoch": 6348} {"train_loss": -27.4299259185791, "global_step": 526905, "epoch": 6348} {"train_loss": -27.727502822875977, "global_step": 526906, "epoch": 6348} {"train_loss": -27.702316284179688, "global_step": 526907, "epoch": 6348} {"train_loss": -27.416168212890625, "global_step": 526908, "epoch": 6348} {"train_loss": -27.422901153564453, "global_step": 526909, "epoch": 6348} {"train_loss": -27.329980850219727, "global_step": 526910, "epoch": 6348} {"train_loss": -27.578887939453125, "global_step": 526911, "epoch": 6348} {"train_loss": -27.45965003967285, "global_step": 526912, "epoch": 6348} {"train_loss": -27.549102783203125, "global_step": 526913, "epoch": 6348} {"train_loss": -27.613311767578125, "global_step": 526914, "epoch": 6348} {"train_loss": -27.339643478393555, "global_step": 526915, "epoch": 6348} {"train_loss": -27.485448837280273, "global_step": 526916, "epoch": 6348} {"train_loss": -27.232290267944336, "global_step": 526917, "epoch": 6348} {"train_loss": -27.47389030456543, "global_step": 526918, "epoch": 6348} {"train_loss": -27.49894142150879, "global_step": 526919, "epoch": 6348} {"train_loss": -27.388870239257812, "global_step": 526920, "epoch": 6348} {"train_loss": -27.45782470703125, "global_step": 526921, "epoch": 6348} {"train_loss": -27.590505599975586, "global_step": 526922, "epoch": 6348} {"train_loss": -27.319995880126953, "global_step": 526923, "epoch": 6348} {"train_loss": -27.846769332885742, "global_step": 526924, "epoch": 6348} {"train_loss": -27.609394073486328, "global_step": 526925, "epoch": 6348} {"train_loss": -27.293720245361328, "global_step": 526926, "epoch": 6348} {"train_loss": -28.087018966674805, "global_step": 526927, "epoch": 6348} {"train_loss": -27.593128204345703, "global_step": 526928, "epoch": 6348} {"train_loss": -27.56943702697754, "global_step": 526929, "epoch": 6348} {"train_loss": -27.710739135742188, "global_step": 526930, "epoch": 6348} {"train_loss": -27.691253662109375, "global_step": 526931, "epoch": 6348} {"train_loss": -27.905981063842773, "global_step": 526932, "epoch": 6348} {"train_loss": -28.065237045288086, "global_step": 526933, "epoch": 6348} {"train_loss": -27.755329132080078, "global_step": 526934, "epoch": 6348} {"train_loss": -27.831018447875977, "global_step": 526935, "epoch": 6348} {"train_loss": -27.8613224029541, "global_step": 526936, "epoch": 6348} {"train_loss": -27.650434494018555, "global_step": 526937, "epoch": 6348} {"train_loss": -27.584699630737305, "global_step": 526938, "epoch": 6348} {"train_loss": -27.7087459564209, "global_step": 526939, "epoch": 6348} {"train_loss": -27.621429443359375, "global_step": 526940, "epoch": 6348} {"train_loss": -27.869583129882812, "global_step": 526941, "epoch": 6348} {"train_loss": -27.868642807006836, "global_step": 526942, "epoch": 6348} {"train_loss": -27.872350692749023, "global_step": 526943, "epoch": 6348} {"train_loss": -27.5970516204834, "global_step": 526944, "epoch": 6348} {"train_loss": -27.380817413330078, "global_step": 526945, "epoch": 6348} {"train_loss": -27.890954971313477, "global_step": 526946, "epoch": 6348} {"train_loss": -28.161853790283203, "global_step": 526947, "epoch": 6348} {"train_loss": -27.8261661529541, "global_step": 526948, "epoch": 6348} {"train_loss": -28.1497745513916, "global_step": 526949, "epoch": 6348} {"train_loss": -27.67131996154785, "global_step": 526950, "epoch": 6348} {"train_loss": -27.793289184570312, "global_step": 526951, "epoch": 6348} {"train_loss": -27.6669979095459, "global_step": 526952, "epoch": 6348} {"train_loss": -27.843891143798828, "global_step": 526953, "epoch": 6348} {"train_loss": -27.7448673248291, "global_step": 526954, "epoch": 6348} {"train_loss": -27.83888053894043, "global_step": 526955, "epoch": 6348} {"train_loss": -27.665430068969727, "global_step": 526956, "epoch": 6348} {"train_loss": -27.6988468170166, "global_step": 526957, "epoch": 6348} {"train_loss": -27.72017478942871, "global_step": 526958, "epoch": 6348} {"train_loss": -27.640756607055664, "global_step": 526959, "epoch": 6348} {"train_loss": -27.71904945373535, "global_step": 526960, "epoch": 6348} {"train_loss": -27.820941925048828, "global_step": 526961, "epoch": 6348} {"train_loss": -27.522790908813477, "global_step": 526962, "epoch": 6348} {"train_loss": -27.427967071533203, "global_step": 526963, "epoch": 6348} {"train_loss": -27.64661979675293, "global_step": 526964, "epoch": 6348} {"train_loss": -27.709762573242188, "global_step": 526965, "epoch": 6348} {"train_loss": -27.524495871670275, "global_step": 526966, "epoch": 6348, "val_loss": 6689085.0} {"train_loss": -26.87738037109375, "global_step": 526967, "epoch": 6349} {"train_loss": -26.00579261779785, "global_step": 526968, "epoch": 6349} {"train_loss": -26.597537994384766, "global_step": 526969, "epoch": 6349} {"train_loss": -27.298933029174805, "global_step": 526970, "epoch": 6349} {"train_loss": -26.621557235717773, "global_step": 526971, "epoch": 6349} {"train_loss": -26.339075088500977, "global_step": 526972, "epoch": 6349} {"train_loss": -26.932697296142578, "global_step": 526973, "epoch": 6349} {"train_loss": -26.461963653564453, "global_step": 526974, "epoch": 6349} {"train_loss": -26.946704864501953, "global_step": 526975, "epoch": 6349} {"train_loss": -26.68868064880371, "global_step": 526976, "epoch": 6349} {"train_loss": -26.60517692565918, "global_step": 526977, "epoch": 6349} {"train_loss": -26.95743751525879, "global_step": 526978, "epoch": 6349} {"train_loss": -26.4005184173584, "global_step": 526979, "epoch": 6349} {"train_loss": -26.978696823120117, "global_step": 526980, "epoch": 6349} {"train_loss": -26.6937255859375, "global_step": 526981, "epoch": 6349} {"train_loss": -27.053207397460938, "global_step": 526982, "epoch": 6349} {"train_loss": -27.2595157623291, "global_step": 526983, "epoch": 6349} {"train_loss": -27.199737548828125, "global_step": 526984, "epoch": 6349} {"train_loss": -27.419830322265625, "global_step": 526985, "epoch": 6349} {"train_loss": -27.458709716796875, "global_step": 526986, "epoch": 6349} {"train_loss": -27.512115478515625, "global_step": 526987, "epoch": 6349} {"train_loss": -26.9228458404541, "global_step": 526988, "epoch": 6349} {"train_loss": -27.29559898376465, "global_step": 526989, "epoch": 6349} {"train_loss": -26.88343620300293, "global_step": 526990, "epoch": 6349} {"train_loss": -27.258451461791992, "global_step": 526991, "epoch": 6349} {"train_loss": -27.157306671142578, "global_step": 526992, "epoch": 6349} {"train_loss": -27.20684814453125, "global_step": 526993, "epoch": 6349} {"train_loss": -27.379037857055664, "global_step": 526994, "epoch": 6349} {"train_loss": -26.999343872070312, "global_step": 526995, "epoch": 6349} {"train_loss": -27.69196891784668, "global_step": 526996, "epoch": 6349} {"train_loss": -27.290908813476562, "global_step": 526997, "epoch": 6349} {"train_loss": -27.550153732299805, "global_step": 526998, "epoch": 6349} {"train_loss": -27.237857818603516, "global_step": 526999, "epoch": 6349} {"train_loss": -27.75165367126465, "global_step": 527000, "epoch": 6349} {"train_loss": -27.3956298828125, "global_step": 527001, "epoch": 6349} {"train_loss": -27.144006729125977, "global_step": 527002, "epoch": 6349} {"train_loss": -27.686477661132812, "global_step": 527003, "epoch": 6349} {"train_loss": -27.377094268798828, "global_step": 527004, "epoch": 6349} {"train_loss": -27.405689239501953, "global_step": 527005, "epoch": 6349} {"train_loss": -27.695175170898438, "global_step": 527006, "epoch": 6349} {"train_loss": -27.57173728942871, "global_step": 527007, "epoch": 6349} {"train_loss": -27.562475204467773, "global_step": 527008, "epoch": 6349} {"train_loss": -28.015283584594727, "global_step": 527009, "epoch": 6349} {"train_loss": -27.853137969970703, "global_step": 527010, "epoch": 6349} {"train_loss": -27.727758407592773, "global_step": 527011, "epoch": 6349} {"train_loss": -27.33635902404785, "global_step": 527012, "epoch": 6349} {"train_loss": -27.34708595275879, "global_step": 527013, "epoch": 6349} {"train_loss": -27.4996337890625, "global_step": 527014, "epoch": 6349} {"train_loss": -27.804990768432617, "global_step": 527015, "epoch": 6349} {"train_loss": -27.66937255859375, "global_step": 527016, "epoch": 6349} {"train_loss": -27.6881103515625, "global_step": 527017, "epoch": 6349} {"train_loss": -27.37803077697754, "global_step": 527018, "epoch": 6349} {"train_loss": -27.410907745361328, "global_step": 527019, "epoch": 6349} {"train_loss": -27.499740600585938, "global_step": 527020, "epoch": 6349} {"train_loss": -27.583871841430664, "global_step": 527021, "epoch": 6349} {"train_loss": -28.056787490844727, "global_step": 527022, "epoch": 6349} {"train_loss": -28.11810874938965, "global_step": 527023, "epoch": 6349} {"train_loss": -27.746801376342773, "global_step": 527024, "epoch": 6349} {"train_loss": -27.833740234375, "global_step": 527025, "epoch": 6349} {"train_loss": -27.7568416595459, "global_step": 527026, "epoch": 6349} {"train_loss": -27.4891414642334, "global_step": 527027, "epoch": 6349} {"train_loss": -27.80476188659668, "global_step": 527028, "epoch": 6349} {"train_loss": -27.83399772644043, "global_step": 527029, "epoch": 6349} {"train_loss": -27.717863082885742, "global_step": 527030, "epoch": 6349} {"train_loss": -27.66619300842285, "global_step": 527031, "epoch": 6349} {"train_loss": -27.787189483642578, "global_step": 527032, "epoch": 6349} {"train_loss": -27.444242477416992, "global_step": 527033, "epoch": 6349} {"train_loss": -27.83527946472168, "global_step": 527034, "epoch": 6349} {"train_loss": -27.855804443359375, "global_step": 527035, "epoch": 6349} {"train_loss": -27.575063705444336, "global_step": 527036, "epoch": 6349} {"train_loss": -27.884061813354492, "global_step": 527037, "epoch": 6349} {"train_loss": -27.911548614501953, "global_step": 527038, "epoch": 6349} {"train_loss": -27.9089298248291, "global_step": 527039, "epoch": 6349} {"train_loss": -27.901403427124023, "global_step": 527040, "epoch": 6349} {"train_loss": -27.84943962097168, "global_step": 527041, "epoch": 6349} {"train_loss": -27.522357940673828, "global_step": 527042, "epoch": 6349} {"train_loss": -27.342121124267578, "global_step": 527043, "epoch": 6349} {"train_loss": -27.633676528930664, "global_step": 527044, "epoch": 6349} {"train_loss": -27.329004287719727, "global_step": 527045, "epoch": 6349} {"train_loss": -27.564523696899414, "global_step": 527046, "epoch": 6349} {"train_loss": -27.357336044311523, "global_step": 527047, "epoch": 6349} {"train_loss": -27.1581974029541, "global_step": 527048, "epoch": 6349} {"train_loss": -27.391588877482587, "global_step": 527049, "epoch": 6349, "val_loss": 6603377.0} {"train_loss": -26.239837646484375, "global_step": 527050, "epoch": 6350} {"train_loss": -24.916173934936523, "global_step": 527051, "epoch": 6350} {"train_loss": -23.500436782836914, "global_step": 527052, "epoch": 6350} {"train_loss": -26.253767013549805, "global_step": 527053, "epoch": 6350} {"train_loss": -26.980274200439453, "global_step": 527054, "epoch": 6350} {"train_loss": -25.53941535949707, "global_step": 527055, "epoch": 6350} {"train_loss": -26.709854125976562, "global_step": 527056, "epoch": 6350} {"train_loss": -26.51372718811035, "global_step": 527057, "epoch": 6350} {"train_loss": -26.601470947265625, "global_step": 527058, "epoch": 6350} {"train_loss": -26.47356605529785, "global_step": 527059, "epoch": 6350} {"train_loss": -26.130023956298828, "global_step": 527060, "epoch": 6350} {"train_loss": -26.546850204467773, "global_step": 527061, "epoch": 6350} {"train_loss": -26.7575740814209, "global_step": 527062, "epoch": 6350} {"train_loss": -27.143329620361328, "global_step": 527063, "epoch": 6350} {"train_loss": -26.77850341796875, "global_step": 527064, "epoch": 6350} {"train_loss": -27.04275894165039, "global_step": 527065, "epoch": 6350} {"train_loss": -27.052099227905273, "global_step": 527066, "epoch": 6350} {"train_loss": -26.87043571472168, "global_step": 527067, "epoch": 6350} {"train_loss": -27.02609634399414, "global_step": 527068, "epoch": 6350} {"train_loss": -26.717615127563477, "global_step": 527069, "epoch": 6350} {"train_loss": -27.185012817382812, "global_step": 527070, "epoch": 6350} {"train_loss": -26.969181060791016, "global_step": 527071, "epoch": 6350} {"train_loss": -27.101470947265625, "global_step": 527072, "epoch": 6350} {"train_loss": -27.2063045501709, "global_step": 527073, "epoch": 6350} {"train_loss": -27.338903427124023, "global_step": 527074, "epoch": 6350} {"train_loss": -27.458087921142578, "global_step": 527075, "epoch": 6350} {"train_loss": -27.20939064025879, "global_step": 527076, "epoch": 6350} {"train_loss": -27.532033920288086, "global_step": 527077, "epoch": 6350} {"train_loss": -27.7752742767334, "global_step": 527078, "epoch": 6350} {"train_loss": -27.418853759765625, "global_step": 527079, "epoch": 6350} {"train_loss": -27.448217391967773, "global_step": 527080, "epoch": 6350} {"train_loss": -27.526941299438477, "global_step": 527081, "epoch": 6350} {"train_loss": -27.46365737915039, "global_step": 527082, "epoch": 6350} {"train_loss": -27.540021896362305, "global_step": 527083, "epoch": 6350} {"train_loss": -27.5894832611084, "global_step": 527084, "epoch": 6350} {"train_loss": -27.6264705657959, "global_step": 527085, "epoch": 6350} {"train_loss": -27.781888961791992, "global_step": 527086, "epoch": 6350} {"train_loss": -27.331968307495117, "global_step": 527087, "epoch": 6350} {"train_loss": -27.75709342956543, "global_step": 527088, "epoch": 6350} {"train_loss": -28.045148849487305, "global_step": 527089, "epoch": 6350} {"train_loss": -27.792394638061523, "global_step": 527090, "epoch": 6350} {"train_loss": -27.364028930664062, "global_step": 527091, "epoch": 6350} {"train_loss": -27.663211822509766, "global_step": 527092, "epoch": 6350} {"train_loss": -27.106977462768555, "global_step": 527093, "epoch": 6350} {"train_loss": -27.74037742614746, "global_step": 527094, "epoch": 6350} {"train_loss": -27.47279930114746, "global_step": 527095, "epoch": 6350} {"train_loss": -27.5776424407959, "global_step": 527096, "epoch": 6350} {"train_loss": -27.363391876220703, "global_step": 527097, "epoch": 6350} {"train_loss": -27.48343849182129, "global_step": 527098, "epoch": 6350} {"train_loss": -27.88129234313965, "global_step": 527099, "epoch": 6350} {"train_loss": -27.609750747680664, "global_step": 527100, "epoch": 6350} {"train_loss": -27.854887008666992, "global_step": 527101, "epoch": 6350} {"train_loss": -27.681501388549805, "global_step": 527102, "epoch": 6350} {"train_loss": -27.54608154296875, "global_step": 527103, "epoch": 6350} {"train_loss": -28.17441749572754, "global_step": 527104, "epoch": 6350} {"train_loss": -27.5236873626709, "global_step": 527105, "epoch": 6350} {"train_loss": -27.221969604492188, "global_step": 527106, "epoch": 6350} {"train_loss": -27.275556564331055, "global_step": 527107, "epoch": 6350} {"train_loss": -27.958877563476562, "global_step": 527108, "epoch": 6350} {"train_loss": -27.52964210510254, "global_step": 527109, "epoch": 6350} {"train_loss": -27.309558868408203, "global_step": 527110, "epoch": 6350} {"train_loss": -27.36348533630371, "global_step": 527111, "epoch": 6350} {"train_loss": -27.77081298828125, "global_step": 527112, "epoch": 6350} {"train_loss": -27.075769424438477, "global_step": 527113, "epoch": 6350} {"train_loss": -27.332807540893555, "global_step": 527114, "epoch": 6350} {"train_loss": -27.425336837768555, "global_step": 527115, "epoch": 6350} {"train_loss": -27.811914443969727, "global_step": 527116, "epoch": 6350} {"train_loss": -27.60516357421875, "global_step": 527117, "epoch": 6350} {"train_loss": -27.538135528564453, "global_step": 527118, "epoch": 6350} {"train_loss": -27.7359619140625, "global_step": 527119, "epoch": 6350} {"train_loss": -27.2396240234375, "global_step": 527120, "epoch": 6350} {"train_loss": -27.494848251342773, "global_step": 527121, "epoch": 6350} {"train_loss": -27.2329158782959, "global_step": 527122, "epoch": 6350} {"train_loss": -27.634313583374023, "global_step": 527123, "epoch": 6350} {"train_loss": -27.531539916992188, "global_step": 527124, "epoch": 6350} {"train_loss": -27.37006950378418, "global_step": 527125, "epoch": 6350} {"train_loss": -27.524505615234375, "global_step": 527126, "epoch": 6350} {"train_loss": -27.571990966796875, "global_step": 527127, "epoch": 6350} {"train_loss": -27.561450958251953, "global_step": 527128, "epoch": 6350} {"train_loss": -27.751752853393555, "global_step": 527129, "epoch": 6350} {"train_loss": -27.706762313842773, "global_step": 527130, "epoch": 6350} {"train_loss": -27.275943756103516, "global_step": 527131, "epoch": 6350} {"train_loss": -27.243859256606505, "global_step": 527132, "epoch": 6350, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6822840.0} {"train_loss": -27.647974014282227, "global_step": 527133, "epoch": 6351} {"train_loss": -27.56416130065918, "global_step": 527134, "epoch": 6351} {"train_loss": -27.190601348876953, "global_step": 527135, "epoch": 6351} {"train_loss": -27.057897567749023, "global_step": 527136, "epoch": 6351} {"train_loss": -27.09566307067871, "global_step": 527137, "epoch": 6351} {"train_loss": -27.366296768188477, "global_step": 527138, "epoch": 6351} {"train_loss": -27.393753051757812, "global_step": 527139, "epoch": 6351} {"train_loss": -27.663488388061523, "global_step": 527140, "epoch": 6351} {"train_loss": -27.614181518554688, "global_step": 527141, "epoch": 6351} {"train_loss": -27.24983024597168, "global_step": 527142, "epoch": 6351} {"train_loss": -27.2053165435791, "global_step": 527143, "epoch": 6351} {"train_loss": -27.505292892456055, "global_step": 527144, "epoch": 6351} {"train_loss": -27.317489624023438, "global_step": 527145, "epoch": 6351} {"train_loss": -27.148895263671875, "global_step": 527146, "epoch": 6351} {"train_loss": -27.176252365112305, "global_step": 527147, "epoch": 6351} {"train_loss": -27.0720157623291, "global_step": 527148, "epoch": 6351} {"train_loss": -27.3930606842041, "global_step": 527149, "epoch": 6351} {"train_loss": -27.561182022094727, "global_step": 527150, "epoch": 6351} {"train_loss": -27.121850967407227, "global_step": 527151, "epoch": 6351} {"train_loss": -27.33099365234375, "global_step": 527152, "epoch": 6351} {"train_loss": -27.108434677124023, "global_step": 527153, "epoch": 6351} {"train_loss": -27.39792823791504, "global_step": 527154, "epoch": 6351} {"train_loss": -27.287708282470703, "global_step": 527155, "epoch": 6351} {"train_loss": -27.173969268798828, "global_step": 527156, "epoch": 6351} {"train_loss": -27.016523361206055, "global_step": 527157, "epoch": 6351} {"train_loss": -27.442890167236328, "global_step": 527158, "epoch": 6351} {"train_loss": -27.601303100585938, "global_step": 527159, "epoch": 6351} {"train_loss": -27.508092880249023, "global_step": 527160, "epoch": 6351} {"train_loss": -27.3065128326416, "global_step": 527161, "epoch": 6351} {"train_loss": -27.82407569885254, "global_step": 527162, "epoch": 6351} {"train_loss": -27.67336082458496, "global_step": 527163, "epoch": 6351} {"train_loss": -27.5856876373291, "global_step": 527164, "epoch": 6351} {"train_loss": -27.475248336791992, "global_step": 527165, "epoch": 6351} {"train_loss": -27.701990127563477, "global_step": 527166, "epoch": 6351} {"train_loss": -27.538501739501953, "global_step": 527167, "epoch": 6351} {"train_loss": -27.483325958251953, "global_step": 527168, "epoch": 6351} {"train_loss": -27.570871353149414, "global_step": 527169, "epoch": 6351} {"train_loss": -27.305028915405273, "global_step": 527170, "epoch": 6351} {"train_loss": -27.8886661529541, "global_step": 527171, "epoch": 6351} {"train_loss": -27.56168556213379, "global_step": 527172, "epoch": 6351} {"train_loss": -27.61879539489746, "global_step": 527173, "epoch": 6351} {"train_loss": -27.28022575378418, "global_step": 527174, "epoch": 6351} {"train_loss": -27.60377311706543, "global_step": 527175, "epoch": 6351} {"train_loss": -27.653244018554688, "global_step": 527176, "epoch": 6351} {"train_loss": -27.918827056884766, "global_step": 527177, "epoch": 6351} {"train_loss": -27.830541610717773, "global_step": 527178, "epoch": 6351} {"train_loss": -27.36518669128418, "global_step": 527179, "epoch": 6351} {"train_loss": -27.575424194335938, "global_step": 527180, "epoch": 6351} {"train_loss": -27.602869033813477, "global_step": 527181, "epoch": 6351} {"train_loss": -27.642980575561523, "global_step": 527182, "epoch": 6351} {"train_loss": -27.889944076538086, "global_step": 527183, "epoch": 6351} {"train_loss": -27.850778579711914, "global_step": 527184, "epoch": 6351} {"train_loss": -28.137521743774414, "global_step": 527185, "epoch": 6351} {"train_loss": -27.407764434814453, "global_step": 527186, "epoch": 6351} {"train_loss": -27.928363800048828, "global_step": 527187, "epoch": 6351} {"train_loss": -27.555633544921875, "global_step": 527188, "epoch": 6351} {"train_loss": -27.441329956054688, "global_step": 527189, "epoch": 6351} {"train_loss": -27.779211044311523, "global_step": 527190, "epoch": 6351} {"train_loss": -27.797931671142578, "global_step": 527191, "epoch": 6351} {"train_loss": -27.543914794921875, "global_step": 527192, "epoch": 6351} {"train_loss": -27.687763214111328, "global_step": 527193, "epoch": 6351} {"train_loss": -27.656055450439453, "global_step": 527194, "epoch": 6351} {"train_loss": -27.6549129486084, "global_step": 527195, "epoch": 6351} {"train_loss": -27.259002685546875, "global_step": 527196, "epoch": 6351} {"train_loss": -27.47797203063965, "global_step": 527197, "epoch": 6351} {"train_loss": -27.46668815612793, "global_step": 527198, "epoch": 6351} {"train_loss": -27.532739639282227, "global_step": 527199, "epoch": 6351} {"train_loss": -27.760604858398438, "global_step": 527200, "epoch": 6351} {"train_loss": -27.33368492126465, "global_step": 527201, "epoch": 6351} {"train_loss": -27.225540161132812, "global_step": 527202, "epoch": 6351} {"train_loss": -26.799240112304688, "global_step": 527203, "epoch": 6351} {"train_loss": -27.919702529907227, "global_step": 527204, "epoch": 6351} {"train_loss": -26.86370849609375, "global_step": 527205, "epoch": 6351} {"train_loss": -27.23822593688965, "global_step": 527206, "epoch": 6351} {"train_loss": -27.625293731689453, "global_step": 527207, "epoch": 6351} {"train_loss": -27.6848087310791, "global_step": 527208, "epoch": 6351} {"train_loss": -27.2685604095459, "global_step": 527209, "epoch": 6351} {"train_loss": -27.44954490661621, "global_step": 527210, "epoch": 6351} {"train_loss": -27.775938034057617, "global_step": 527211, "epoch": 6351} {"train_loss": -27.962934494018555, "global_step": 527212, "epoch": 6351} {"train_loss": -27.315759658813477, "global_step": 527213, "epoch": 6351} {"train_loss": -27.813739776611328, "global_step": 527214, "epoch": 6351} {"train_loss": -27.491395628595928, "global_step": 527215, "epoch": 6351, "val_loss": 6758854.0} {"train_loss": -27.510986328125, "global_step": 527216, "epoch": 6352} {"train_loss": -27.4505615234375, "global_step": 527217, "epoch": 6352} {"train_loss": -27.508594512939453, "global_step": 527218, "epoch": 6352} {"train_loss": -27.117258071899414, "global_step": 527219, "epoch": 6352} {"train_loss": -28.118932723999023, "global_step": 527220, "epoch": 6352} {"train_loss": -26.92457389831543, "global_step": 527221, "epoch": 6352} {"train_loss": -26.85227394104004, "global_step": 527222, "epoch": 6352} {"train_loss": -26.31354331970215, "global_step": 527223, "epoch": 6352} {"train_loss": -26.893293380737305, "global_step": 527224, "epoch": 6352} {"train_loss": -26.7695255279541, "global_step": 527225, "epoch": 6352} {"train_loss": -27.188879013061523, "global_step": 527226, "epoch": 6352} {"train_loss": -26.519948959350586, "global_step": 527227, "epoch": 6352} {"train_loss": -26.889678955078125, "global_step": 527228, "epoch": 6352} {"train_loss": -27.107044219970703, "global_step": 527229, "epoch": 6352} {"train_loss": -27.02802848815918, "global_step": 527230, "epoch": 6352} {"train_loss": -27.280447006225586, "global_step": 527231, "epoch": 6352} {"train_loss": -27.353260040283203, "global_step": 527232, "epoch": 6352} {"train_loss": -27.32459831237793, "global_step": 527233, "epoch": 6352} {"train_loss": -27.24954605102539, "global_step": 527234, "epoch": 6352} {"train_loss": -27.647756576538086, "global_step": 527235, "epoch": 6352} {"train_loss": -27.571491241455078, "global_step": 527236, "epoch": 6352} {"train_loss": -27.531850814819336, "global_step": 527237, "epoch": 6352} {"train_loss": -27.27618408203125, "global_step": 527238, "epoch": 6352} {"train_loss": -27.917728424072266, "global_step": 527239, "epoch": 6352} {"train_loss": -27.47043228149414, "global_step": 527240, "epoch": 6352} {"train_loss": -27.40943717956543, "global_step": 527241, "epoch": 6352} {"train_loss": -26.98853874206543, "global_step": 527242, "epoch": 6352} {"train_loss": -27.6895809173584, "global_step": 527243, "epoch": 6352} {"train_loss": -27.552661895751953, "global_step": 527244, "epoch": 6352} {"train_loss": -27.388153076171875, "global_step": 527245, "epoch": 6352} {"train_loss": -27.949254989624023, "global_step": 527246, "epoch": 6352} {"train_loss": -27.582677841186523, "global_step": 527247, "epoch": 6352} {"train_loss": -27.71504020690918, "global_step": 527248, "epoch": 6352} {"train_loss": -27.732955932617188, "global_step": 527249, "epoch": 6352} {"train_loss": -27.477619171142578, "global_step": 527250, "epoch": 6352} {"train_loss": -27.6381893157959, "global_step": 527251, "epoch": 6352} {"train_loss": -27.407773971557617, "global_step": 527252, "epoch": 6352} {"train_loss": -27.882734298706055, "global_step": 527253, "epoch": 6352} {"train_loss": -27.700178146362305, "global_step": 527254, "epoch": 6352} {"train_loss": -27.829553604125977, "global_step": 527255, "epoch": 6352} {"train_loss": -27.751178741455078, "global_step": 527256, "epoch": 6352} {"train_loss": -27.69822120666504, "global_step": 527257, "epoch": 6352} {"train_loss": -27.359628677368164, "global_step": 527258, "epoch": 6352} {"train_loss": -27.621484756469727, "global_step": 527259, "epoch": 6352} {"train_loss": -27.38190269470215, "global_step": 527260, "epoch": 6352} {"train_loss": -27.57598876953125, "global_step": 527261, "epoch": 6352} {"train_loss": -27.772857666015625, "global_step": 527262, "epoch": 6352} {"train_loss": -27.400177001953125, "global_step": 527263, "epoch": 6352} {"train_loss": -27.39772605895996, "global_step": 527264, "epoch": 6352} {"train_loss": -27.84055519104004, "global_step": 527265, "epoch": 6352} {"train_loss": -27.667072296142578, "global_step": 527266, "epoch": 6352} {"train_loss": -27.51104736328125, "global_step": 527267, "epoch": 6352} {"train_loss": -27.544214248657227, "global_step": 527268, "epoch": 6352} {"train_loss": -27.843799591064453, "global_step": 527269, "epoch": 6352} {"train_loss": -27.3814640045166, "global_step": 527270, "epoch": 6352} {"train_loss": -27.562671661376953, "global_step": 527271, "epoch": 6352} {"train_loss": -27.72590446472168, "global_step": 527272, "epoch": 6352} {"train_loss": -27.318195343017578, "global_step": 527273, "epoch": 6352} {"train_loss": -27.65216064453125, "global_step": 527274, "epoch": 6352} {"train_loss": -27.801870346069336, "global_step": 527275, "epoch": 6352} {"train_loss": -27.495431900024414, "global_step": 527276, "epoch": 6352} {"train_loss": -28.190824508666992, "global_step": 527277, "epoch": 6352} {"train_loss": -27.821882247924805, "global_step": 527278, "epoch": 6352} {"train_loss": -27.725605010986328, "global_step": 527279, "epoch": 6352} {"train_loss": -27.499906539916992, "global_step": 527280, "epoch": 6352} {"train_loss": -27.61578369140625, "global_step": 527281, "epoch": 6352} {"train_loss": -27.45977783203125, "global_step": 527282, "epoch": 6352} {"train_loss": -27.74063491821289, "global_step": 527283, "epoch": 6352} {"train_loss": -27.812637329101562, "global_step": 527284, "epoch": 6352} {"train_loss": -27.28098487854004, "global_step": 527285, "epoch": 6352} {"train_loss": -27.005590438842773, "global_step": 527286, "epoch": 6352} {"train_loss": -27.021326065063477, "global_step": 527287, "epoch": 6352} {"train_loss": -28.001239776611328, "global_step": 527288, "epoch": 6352} {"train_loss": -27.196792602539062, "global_step": 527289, "epoch": 6352} {"train_loss": -27.07069969177246, "global_step": 527290, "epoch": 6352} {"train_loss": -27.10540771484375, "global_step": 527291, "epoch": 6352} {"train_loss": -27.6574764251709, "global_step": 527292, "epoch": 6352} {"train_loss": -27.319120407104492, "global_step": 527293, "epoch": 6352} {"train_loss": -27.589757919311523, "global_step": 527294, "epoch": 6352} {"train_loss": -27.064130783081055, "global_step": 527295, "epoch": 6352} {"train_loss": -27.986804962158203, "global_step": 527296, "epoch": 6352} {"train_loss": -27.223499298095703, "global_step": 527297, "epoch": 6352} {"train_loss": -27.436005626816346, "global_step": 527298, "epoch": 6352, "val_loss": 6707864.0} {"train_loss": -27.592573165893555, "global_step": 527299, "epoch": 6353} {"train_loss": -27.100143432617188, "global_step": 527300, "epoch": 6353} {"train_loss": -26.879819869995117, "global_step": 527301, "epoch": 6353} {"train_loss": -27.0202579498291, "global_step": 527302, "epoch": 6353} {"train_loss": -27.21405029296875, "global_step": 527303, "epoch": 6353} {"train_loss": -27.13393211364746, "global_step": 527304, "epoch": 6353} {"train_loss": -27.275671005249023, "global_step": 527305, "epoch": 6353} {"train_loss": -26.983304977416992, "global_step": 527306, "epoch": 6353} {"train_loss": -26.879608154296875, "global_step": 527307, "epoch": 6353} {"train_loss": -27.460371017456055, "global_step": 527308, "epoch": 6353} {"train_loss": -26.427204132080078, "global_step": 527309, "epoch": 6353} {"train_loss": -26.648298263549805, "global_step": 527310, "epoch": 6353} {"train_loss": -27.327295303344727, "global_step": 527311, "epoch": 6353} {"train_loss": -27.132373809814453, "global_step": 527312, "epoch": 6353} {"train_loss": -27.29534339904785, "global_step": 527313, "epoch": 6353} {"train_loss": -27.1787166595459, "global_step": 527314, "epoch": 6353} {"train_loss": -27.388214111328125, "global_step": 527315, "epoch": 6353} {"train_loss": -27.4510555267334, "global_step": 527316, "epoch": 6353} {"train_loss": -27.620685577392578, "global_step": 527317, "epoch": 6353} {"train_loss": -27.581995010375977, "global_step": 527318, "epoch": 6353} {"train_loss": -27.218917846679688, "global_step": 527319, "epoch": 6353} {"train_loss": -27.174137115478516, "global_step": 527320, "epoch": 6353} {"train_loss": -27.650226593017578, "global_step": 527321, "epoch": 6353} {"train_loss": -27.02363395690918, "global_step": 527322, "epoch": 6353} {"train_loss": -27.522735595703125, "global_step": 527323, "epoch": 6353} {"train_loss": -27.623046875, "global_step": 527324, "epoch": 6353} {"train_loss": -27.676313400268555, "global_step": 527325, "epoch": 6353} {"train_loss": -27.431650161743164, "global_step": 527326, "epoch": 6353} {"train_loss": -27.114049911499023, "global_step": 527327, "epoch": 6353} {"train_loss": -27.65921401977539, "global_step": 527328, "epoch": 6353} {"train_loss": -27.32706069946289, "global_step": 527329, "epoch": 6353} {"train_loss": -27.680295944213867, "global_step": 527330, "epoch": 6353} {"train_loss": -27.715808868408203, "global_step": 527331, "epoch": 6353} {"train_loss": -27.508527755737305, "global_step": 527332, "epoch": 6353} {"train_loss": -27.496789932250977, "global_step": 527333, "epoch": 6353} {"train_loss": -27.310895919799805, "global_step": 527334, "epoch": 6353} {"train_loss": -27.73198890686035, "global_step": 527335, "epoch": 6353} {"train_loss": -27.430057525634766, "global_step": 527336, "epoch": 6353} {"train_loss": -27.54241943359375, "global_step": 527337, "epoch": 6353} {"train_loss": -27.33243751525879, "global_step": 527338, "epoch": 6353} {"train_loss": -27.721881866455078, "global_step": 527339, "epoch": 6353} {"train_loss": -27.55490493774414, "global_step": 527340, "epoch": 6353} {"train_loss": -27.500768661499023, "global_step": 527341, "epoch": 6353} {"train_loss": -27.525720596313477, "global_step": 527342, "epoch": 6353} {"train_loss": -27.43631362915039, "global_step": 527343, "epoch": 6353} {"train_loss": -27.41912841796875, "global_step": 527344, "epoch": 6353} {"train_loss": -27.622028350830078, "global_step": 527345, "epoch": 6353} {"train_loss": -27.537689208984375, "global_step": 527346, "epoch": 6353} {"train_loss": -27.517642974853516, "global_step": 527347, "epoch": 6353} {"train_loss": -27.75542640686035, "global_step": 527348, "epoch": 6353} {"train_loss": -27.31691551208496, "global_step": 527349, "epoch": 6353} {"train_loss": -27.782480239868164, "global_step": 527350, "epoch": 6353} {"train_loss": -27.643701553344727, "global_step": 527351, "epoch": 6353} {"train_loss": -27.626062393188477, "global_step": 527352, "epoch": 6353} {"train_loss": -28.069183349609375, "global_step": 527353, "epoch": 6353} {"train_loss": -28.007612228393555, "global_step": 527354, "epoch": 6353} {"train_loss": -27.89423179626465, "global_step": 527355, "epoch": 6353} {"train_loss": -27.283567428588867, "global_step": 527356, "epoch": 6353} {"train_loss": -27.549734115600586, "global_step": 527357, "epoch": 6353} {"train_loss": -27.441577911376953, "global_step": 527358, "epoch": 6353} {"train_loss": -27.67609977722168, "global_step": 527359, "epoch": 6353} {"train_loss": -27.838796615600586, "global_step": 527360, "epoch": 6353} {"train_loss": -27.635700225830078, "global_step": 527361, "epoch": 6353} {"train_loss": -27.552143096923828, "global_step": 527362, "epoch": 6353} {"train_loss": -27.906036376953125, "global_step": 527363, "epoch": 6353} {"train_loss": -27.62587547302246, "global_step": 527364, "epoch": 6353} {"train_loss": -27.996967315673828, "global_step": 527365, "epoch": 6353} {"train_loss": -27.750442504882812, "global_step": 527366, "epoch": 6353} {"train_loss": -28.222274780273438, "global_step": 527367, "epoch": 6353} {"train_loss": -27.76129722595215, "global_step": 527368, "epoch": 6353} {"train_loss": -27.9856014251709, "global_step": 527369, "epoch": 6353} {"train_loss": -27.75880241394043, "global_step": 527370, "epoch": 6353} {"train_loss": -27.69130516052246, "global_step": 527371, "epoch": 6353} {"train_loss": -27.621503829956055, "global_step": 527372, "epoch": 6353} {"train_loss": -27.588682174682617, "global_step": 527373, "epoch": 6353} {"train_loss": -27.9493465423584, "global_step": 527374, "epoch": 6353} {"train_loss": -27.356122970581055, "global_step": 527375, "epoch": 6353} {"train_loss": -26.896169662475586, "global_step": 527376, "epoch": 6353} {"train_loss": -26.917037963867188, "global_step": 527377, "epoch": 6353} {"train_loss": -26.869709014892578, "global_step": 527378, "epoch": 6353} {"train_loss": -27.2764892578125, "global_step": 527379, "epoch": 6353} {"train_loss": -26.884185791015625, "global_step": 527380, "epoch": 6353} {"train_loss": -27.449611709778566, "global_step": 527381, "epoch": 6353, "val_loss": 6694012.0} {"train_loss": -26.97322654724121, "global_step": 527382, "epoch": 6354} {"train_loss": -26.31499671936035, "global_step": 527383, "epoch": 6354} {"train_loss": -26.573455810546875, "global_step": 527384, "epoch": 6354} {"train_loss": -27.144285202026367, "global_step": 527385, "epoch": 6354} {"train_loss": -26.71246337890625, "global_step": 527386, "epoch": 6354} {"train_loss": -26.913694381713867, "global_step": 527387, "epoch": 6354} {"train_loss": -26.7999210357666, "global_step": 527388, "epoch": 6354} {"train_loss": -26.5904598236084, "global_step": 527389, "epoch": 6354} {"train_loss": -26.709136962890625, "global_step": 527390, "epoch": 6354} {"train_loss": -26.230497360229492, "global_step": 527391, "epoch": 6354} {"train_loss": -27.165372848510742, "global_step": 527392, "epoch": 6354} {"train_loss": -27.074508666992188, "global_step": 527393, "epoch": 6354} {"train_loss": -26.995346069335938, "global_step": 527394, "epoch": 6354} {"train_loss": -26.922327041625977, "global_step": 527395, "epoch": 6354} {"train_loss": -27.347097396850586, "global_step": 527396, "epoch": 6354} {"train_loss": -27.152240753173828, "global_step": 527397, "epoch": 6354} {"train_loss": -27.007917404174805, "global_step": 527398, "epoch": 6354} {"train_loss": -27.34205436706543, "global_step": 527399, "epoch": 6354} {"train_loss": -27.324405670166016, "global_step": 527400, "epoch": 6354} {"train_loss": -27.762887954711914, "global_step": 527401, "epoch": 6354} {"train_loss": -27.383167266845703, "global_step": 527402, "epoch": 6354} {"train_loss": -27.41534996032715, "global_step": 527403, "epoch": 6354} {"train_loss": -27.39742088317871, "global_step": 527404, "epoch": 6354} {"train_loss": -27.565460205078125, "global_step": 527405, "epoch": 6354} {"train_loss": -27.780990600585938, "global_step": 527406, "epoch": 6354} {"train_loss": -27.45381736755371, "global_step": 527407, "epoch": 6354} {"train_loss": -27.772022247314453, "global_step": 527408, "epoch": 6354} {"train_loss": -27.550153732299805, "global_step": 527409, "epoch": 6354} {"train_loss": -27.733280181884766, "global_step": 527410, "epoch": 6354} {"train_loss": -27.310903549194336, "global_step": 527411, "epoch": 6354} {"train_loss": -27.361337661743164, "global_step": 527412, "epoch": 6354} {"train_loss": -27.69618034362793, "global_step": 527413, "epoch": 6354} {"train_loss": -27.66309928894043, "global_step": 527414, "epoch": 6354} {"train_loss": -27.686450958251953, "global_step": 527415, "epoch": 6354} {"train_loss": -27.341598510742188, "global_step": 527416, "epoch": 6354} {"train_loss": -27.45412254333496, "global_step": 527417, "epoch": 6354} {"train_loss": -27.581838607788086, "global_step": 527418, "epoch": 6354} {"train_loss": -27.749713897705078, "global_step": 527419, "epoch": 6354} {"train_loss": -27.433094024658203, "global_step": 527420, "epoch": 6354} {"train_loss": -27.442914962768555, "global_step": 527421, "epoch": 6354} {"train_loss": -27.1840877532959, "global_step": 527422, "epoch": 6354} {"train_loss": -27.937299728393555, "global_step": 527423, "epoch": 6354} {"train_loss": -27.729211807250977, "global_step": 527424, "epoch": 6354} {"train_loss": -27.8093318939209, "global_step": 527425, "epoch": 6354} {"train_loss": -27.669492721557617, "global_step": 527426, "epoch": 6354} {"train_loss": -27.757558822631836, "global_step": 527427, "epoch": 6354} {"train_loss": -27.468923568725586, "global_step": 527428, "epoch": 6354} {"train_loss": -27.7105655670166, "global_step": 527429, "epoch": 6354} {"train_loss": -27.752365112304688, "global_step": 527430, "epoch": 6354} {"train_loss": -27.87404441833496, "global_step": 527431, "epoch": 6354} {"train_loss": -27.419042587280273, "global_step": 527432, "epoch": 6354} {"train_loss": -27.839319229125977, "global_step": 527433, "epoch": 6354} {"train_loss": -27.644596099853516, "global_step": 527434, "epoch": 6354} {"train_loss": -27.59612464904785, "global_step": 527435, "epoch": 6354} {"train_loss": -27.782428741455078, "global_step": 527436, "epoch": 6354} {"train_loss": -27.641925811767578, "global_step": 527437, "epoch": 6354} {"train_loss": -27.53191566467285, "global_step": 527438, "epoch": 6354} {"train_loss": -27.922927856445312, "global_step": 527439, "epoch": 6354} {"train_loss": -27.89436149597168, "global_step": 527440, "epoch": 6354} {"train_loss": -27.72592544555664, "global_step": 527441, "epoch": 6354} {"train_loss": -27.737272262573242, "global_step": 527442, "epoch": 6354} {"train_loss": -27.83622169494629, "global_step": 527443, "epoch": 6354} {"train_loss": -27.59052848815918, "global_step": 527444, "epoch": 6354} {"train_loss": -27.255151748657227, "global_step": 527445, "epoch": 6354} {"train_loss": -27.69703483581543, "global_step": 527446, "epoch": 6354} {"train_loss": -27.80472755432129, "global_step": 527447, "epoch": 6354} {"train_loss": -27.433399200439453, "global_step": 527448, "epoch": 6354} {"train_loss": -28.13508415222168, "global_step": 527449, "epoch": 6354} {"train_loss": -27.314075469970703, "global_step": 527450, "epoch": 6354} {"train_loss": -27.91482925415039, "global_step": 527451, "epoch": 6354} {"train_loss": -27.782312393188477, "global_step": 527452, "epoch": 6354} {"train_loss": -27.998090744018555, "global_step": 527453, "epoch": 6354} {"train_loss": -28.068017959594727, "global_step": 527454, "epoch": 6354} {"train_loss": -27.325489044189453, "global_step": 527455, "epoch": 6354} {"train_loss": -27.450170516967773, "global_step": 527456, "epoch": 6354} {"train_loss": -27.3075008392334, "global_step": 527457, "epoch": 6354} {"train_loss": -26.799530029296875, "global_step": 527458, "epoch": 6354} {"train_loss": -25.979053497314453, "global_step": 527459, "epoch": 6354} {"train_loss": -25.817554473876953, "global_step": 527460, "epoch": 6354} {"train_loss": -27.087066650390625, "global_step": 527461, "epoch": 6354} {"train_loss": -27.182809829711914, "global_step": 527462, "epoch": 6354} {"train_loss": -26.89552879333496, "global_step": 527463, "epoch": 6354} {"train_loss": -27.396674374499952, "global_step": 527464, "epoch": 6354, "val_loss": 6720444.0} {"train_loss": -26.956396102905273, "global_step": 527465, "epoch": 6355} {"train_loss": -27.49188804626465, "global_step": 527466, "epoch": 6355} {"train_loss": -27.03122901916504, "global_step": 527467, "epoch": 6355} {"train_loss": -26.917404174804688, "global_step": 527468, "epoch": 6355} {"train_loss": -26.799346923828125, "global_step": 527469, "epoch": 6355} {"train_loss": -26.485431671142578, "global_step": 527470, "epoch": 6355} {"train_loss": -26.822973251342773, "global_step": 527471, "epoch": 6355} {"train_loss": -26.822187423706055, "global_step": 527472, "epoch": 6355} {"train_loss": -27.079666137695312, "global_step": 527473, "epoch": 6355} {"train_loss": -27.14402198791504, "global_step": 527474, "epoch": 6355} {"train_loss": -26.923139572143555, "global_step": 527475, "epoch": 6355} {"train_loss": -26.96614646911621, "global_step": 527476, "epoch": 6355} {"train_loss": -27.218555450439453, "global_step": 527477, "epoch": 6355} {"train_loss": -27.35270118713379, "global_step": 527478, "epoch": 6355} {"train_loss": -26.823654174804688, "global_step": 527479, "epoch": 6355} {"train_loss": -27.27679443359375, "global_step": 527480, "epoch": 6355} {"train_loss": -27.188013076782227, "global_step": 527481, "epoch": 6355} {"train_loss": -27.141315460205078, "global_step": 527482, "epoch": 6355} {"train_loss": -27.241174697875977, "global_step": 527483, "epoch": 6355} {"train_loss": -27.581968307495117, "global_step": 527484, "epoch": 6355} {"train_loss": -27.217863082885742, "global_step": 527485, "epoch": 6355} {"train_loss": -27.52133560180664, "global_step": 527486, "epoch": 6355} {"train_loss": -27.540990829467773, "global_step": 527487, "epoch": 6355} {"train_loss": -27.382410049438477, "global_step": 527488, "epoch": 6355} {"train_loss": -27.268152236938477, "global_step": 527489, "epoch": 6355} {"train_loss": -27.003986358642578, "global_step": 527490, "epoch": 6355} {"train_loss": -27.664051055908203, "global_step": 527491, "epoch": 6355} {"train_loss": -27.383214950561523, "global_step": 527492, "epoch": 6355} {"train_loss": -27.379098892211914, "global_step": 527493, "epoch": 6355} {"train_loss": -27.718626022338867, "global_step": 527494, "epoch": 6355} {"train_loss": -27.29572105407715, "global_step": 527495, "epoch": 6355} {"train_loss": -27.387741088867188, "global_step": 527496, "epoch": 6355} {"train_loss": -27.669082641601562, "global_step": 527497, "epoch": 6355} {"train_loss": -27.859785079956055, "global_step": 527498, "epoch": 6355} {"train_loss": -27.628528594970703, "global_step": 527499, "epoch": 6355} {"train_loss": -27.6353759765625, "global_step": 527500, "epoch": 6355} {"train_loss": -27.3155460357666, "global_step": 527501, "epoch": 6355} {"train_loss": -27.530359268188477, "global_step": 527502, "epoch": 6355} {"train_loss": -27.531341552734375, "global_step": 527503, "epoch": 6355} {"train_loss": -27.467390060424805, "global_step": 527504, "epoch": 6355} {"train_loss": -27.386579513549805, "global_step": 527505, "epoch": 6355} {"train_loss": -28.104536056518555, "global_step": 527506, "epoch": 6355} {"train_loss": -27.24003028869629, "global_step": 527507, "epoch": 6355} {"train_loss": -27.579504013061523, "global_step": 527508, "epoch": 6355} {"train_loss": -27.6234073638916, "global_step": 527509, "epoch": 6355} {"train_loss": -27.847944259643555, "global_step": 527510, "epoch": 6355} {"train_loss": -27.54526710510254, "global_step": 527511, "epoch": 6355} {"train_loss": -27.99053382873535, "global_step": 527512, "epoch": 6355} {"train_loss": -27.525678634643555, "global_step": 527513, "epoch": 6355} {"train_loss": -27.5196590423584, "global_step": 527514, "epoch": 6355} {"train_loss": -27.7346134185791, "global_step": 527515, "epoch": 6355} {"train_loss": -27.73139762878418, "global_step": 527516, "epoch": 6355} {"train_loss": -28.156946182250977, "global_step": 527517, "epoch": 6355} {"train_loss": -27.711111068725586, "global_step": 527518, "epoch": 6355} {"train_loss": -27.75996208190918, "global_step": 527519, "epoch": 6355} {"train_loss": -27.89939308166504, "global_step": 527520, "epoch": 6355} {"train_loss": -27.80584716796875, "global_step": 527521, "epoch": 6355} {"train_loss": -27.550281524658203, "global_step": 527522, "epoch": 6355} {"train_loss": -27.758804321289062, "global_step": 527523, "epoch": 6355} {"train_loss": -27.620508193969727, "global_step": 527524, "epoch": 6355} {"train_loss": -27.27308464050293, "global_step": 527525, "epoch": 6355} {"train_loss": -26.955480575561523, "global_step": 527526, "epoch": 6355} {"train_loss": -26.49104881286621, "global_step": 527527, "epoch": 6355} {"train_loss": -26.72330665588379, "global_step": 527528, "epoch": 6355} {"train_loss": -27.5361385345459, "global_step": 527529, "epoch": 6355} {"train_loss": -26.98455238342285, "global_step": 527530, "epoch": 6355} {"train_loss": -27.439605712890625, "global_step": 527531, "epoch": 6355} {"train_loss": -27.366270065307617, "global_step": 527532, "epoch": 6355} {"train_loss": -27.61484146118164, "global_step": 527533, "epoch": 6355} {"train_loss": -27.4628963470459, "global_step": 527534, "epoch": 6355} {"train_loss": -27.465545654296875, "global_step": 527535, "epoch": 6355} {"train_loss": -27.212329864501953, "global_step": 527536, "epoch": 6355} {"train_loss": -27.604169845581055, "global_step": 527537, "epoch": 6355} {"train_loss": -27.4362735748291, "global_step": 527538, "epoch": 6355} {"train_loss": -27.781248092651367, "global_step": 527539, "epoch": 6355} {"train_loss": -27.615198135375977, "global_step": 527540, "epoch": 6355} {"train_loss": -27.73512077331543, "global_step": 527541, "epoch": 6355} {"train_loss": -27.481342315673828, "global_step": 527542, "epoch": 6355} {"train_loss": -27.893325805664062, "global_step": 527543, "epoch": 6355} {"train_loss": -27.64764976501465, "global_step": 527544, "epoch": 6355} {"train_loss": -27.262365341186523, "global_step": 527545, "epoch": 6355} {"train_loss": -27.74842643737793, "global_step": 527546, "epoch": 6355} {"train_loss": -27.41539019848927, "global_step": 527547, "epoch": 6355, "val_loss": 6743322.5} {"train_loss": -25.90117835998535, "global_step": 527548, "epoch": 6356} {"train_loss": -23.2529239654541, "global_step": 527549, "epoch": 6356} {"train_loss": -24.48956871032715, "global_step": 527550, "epoch": 6356} {"train_loss": -25.883453369140625, "global_step": 527551, "epoch": 6356} {"train_loss": -25.962125778198242, "global_step": 527552, "epoch": 6356} {"train_loss": -25.63368034362793, "global_step": 527553, "epoch": 6356} {"train_loss": -26.109472274780273, "global_step": 527554, "epoch": 6356} {"train_loss": -25.874006271362305, "global_step": 527555, "epoch": 6356} {"train_loss": -25.96848487854004, "global_step": 527556, "epoch": 6356} {"train_loss": -26.369733810424805, "global_step": 527557, "epoch": 6356} {"train_loss": -25.3912410736084, "global_step": 527558, "epoch": 6356} {"train_loss": -26.15703773498535, "global_step": 527559, "epoch": 6356} {"train_loss": -26.020185470581055, "global_step": 527560, "epoch": 6356} {"train_loss": -26.504179000854492, "global_step": 527561, "epoch": 6356} {"train_loss": -26.23748779296875, "global_step": 527562, "epoch": 6356} {"train_loss": -26.11216163635254, "global_step": 527563, "epoch": 6356} {"train_loss": -26.645191192626953, "global_step": 527564, "epoch": 6356} {"train_loss": -26.161062240600586, "global_step": 527565, "epoch": 6356} {"train_loss": -27.085693359375, "global_step": 527566, "epoch": 6356} {"train_loss": -26.328603744506836, "global_step": 527567, "epoch": 6356} {"train_loss": -27.02178955078125, "global_step": 527568, "epoch": 6356} {"train_loss": -26.803674697875977, "global_step": 527569, "epoch": 6356} {"train_loss": -26.71184730529785, "global_step": 527570, "epoch": 6356} {"train_loss": -27.167327880859375, "global_step": 527571, "epoch": 6356} {"train_loss": -26.830493927001953, "global_step": 527572, "epoch": 6356} {"train_loss": -26.95606803894043, "global_step": 527573, "epoch": 6356} {"train_loss": -27.025617599487305, "global_step": 527574, "epoch": 6356} {"train_loss": -26.878454208374023, "global_step": 527575, "epoch": 6356} {"train_loss": -27.0876407623291, "global_step": 527576, "epoch": 6356} {"train_loss": -27.007375717163086, "global_step": 527577, "epoch": 6356} {"train_loss": -27.38519859313965, "global_step": 527578, "epoch": 6356} {"train_loss": -26.95136070251465, "global_step": 527579, "epoch": 6356} {"train_loss": -27.24028968811035, "global_step": 527580, "epoch": 6356} {"train_loss": -27.317529678344727, "global_step": 527581, "epoch": 6356} {"train_loss": -27.308368682861328, "global_step": 527582, "epoch": 6356} {"train_loss": -27.21337890625, "global_step": 527583, "epoch": 6356} {"train_loss": -27.191370010375977, "global_step": 527584, "epoch": 6356} {"train_loss": -27.2683048248291, "global_step": 527585, "epoch": 6356} {"train_loss": -27.53663444519043, "global_step": 527586, "epoch": 6356} {"train_loss": -27.518903732299805, "global_step": 527587, "epoch": 6356} {"train_loss": -27.4204044342041, "global_step": 527588, "epoch": 6356} {"train_loss": -27.612762451171875, "global_step": 527589, "epoch": 6356} {"train_loss": -27.521411895751953, "global_step": 527590, "epoch": 6356} {"train_loss": -27.43130874633789, "global_step": 527591, "epoch": 6356} {"train_loss": -27.751264572143555, "global_step": 527592, "epoch": 6356} {"train_loss": -28.12701416015625, "global_step": 527593, "epoch": 6356} {"train_loss": -27.80657958984375, "global_step": 527594, "epoch": 6356} {"train_loss": -27.58359146118164, "global_step": 527595, "epoch": 6356} {"train_loss": -27.543338775634766, "global_step": 527596, "epoch": 6356} {"train_loss": -27.64230728149414, "global_step": 527597, "epoch": 6356} {"train_loss": -27.136930465698242, "global_step": 527598, "epoch": 6356} {"train_loss": -27.604034423828125, "global_step": 527599, "epoch": 6356} {"train_loss": -27.55816650390625, "global_step": 527600, "epoch": 6356} {"train_loss": -27.49381446838379, "global_step": 527601, "epoch": 6356} {"train_loss": -27.409515380859375, "global_step": 527602, "epoch": 6356} {"train_loss": -27.649396896362305, "global_step": 527603, "epoch": 6356} {"train_loss": -27.464649200439453, "global_step": 527604, "epoch": 6356} {"train_loss": -27.481998443603516, "global_step": 527605, "epoch": 6356} {"train_loss": -27.078378677368164, "global_step": 527606, "epoch": 6356} {"train_loss": -26.704837799072266, "global_step": 527607, "epoch": 6356} {"train_loss": -26.60955810546875, "global_step": 527608, "epoch": 6356} {"train_loss": -27.513370513916016, "global_step": 527609, "epoch": 6356} {"train_loss": -28.027231216430664, "global_step": 527610, "epoch": 6356} {"train_loss": -27.53553581237793, "global_step": 527611, "epoch": 6356} {"train_loss": -27.640607833862305, "global_step": 527612, "epoch": 6356} {"train_loss": -27.506988525390625, "global_step": 527613, "epoch": 6356} {"train_loss": -27.638586044311523, "global_step": 527614, "epoch": 6356} {"train_loss": -27.56540298461914, "global_step": 527615, "epoch": 6356} {"train_loss": -27.816619873046875, "global_step": 527616, "epoch": 6356} {"train_loss": -27.481897354125977, "global_step": 527617, "epoch": 6356} {"train_loss": -27.864486694335938, "global_step": 527618, "epoch": 6356} {"train_loss": -27.52707290649414, "global_step": 527619, "epoch": 6356} {"train_loss": -27.82927894592285, "global_step": 527620, "epoch": 6356} {"train_loss": -27.8185977935791, "global_step": 527621, "epoch": 6356} {"train_loss": -27.707250595092773, "global_step": 527622, "epoch": 6356} {"train_loss": -27.7435359954834, "global_step": 527623, "epoch": 6356} {"train_loss": -27.5848331451416, "global_step": 527624, "epoch": 6356} {"train_loss": -28.086278915405273, "global_step": 527625, "epoch": 6356} {"train_loss": -27.402524948120117, "global_step": 527626, "epoch": 6356} {"train_loss": -27.303735733032227, "global_step": 527627, "epoch": 6356} {"train_loss": -28.0684757232666, "global_step": 527628, "epoch": 6356} {"train_loss": -27.42457389831543, "global_step": 527629, "epoch": 6356} {"train_loss": -27.05694442197501, "global_step": 527630, "epoch": 6356, "val_loss": 6737081.5} {"train_loss": -26.470792770385742, "global_step": 527631, "epoch": 6357} {"train_loss": -25.39288902282715, "global_step": 527632, "epoch": 6357} {"train_loss": -26.56743812561035, "global_step": 527633, "epoch": 6357} {"train_loss": -26.74921226501465, "global_step": 527634, "epoch": 6357} {"train_loss": -26.63117027282715, "global_step": 527635, "epoch": 6357} {"train_loss": -27.004419326782227, "global_step": 527636, "epoch": 6357} {"train_loss": -26.952489852905273, "global_step": 527637, "epoch": 6357} {"train_loss": -27.274967193603516, "global_step": 527638, "epoch": 6357} {"train_loss": -26.5654296875, "global_step": 527639, "epoch": 6357} {"train_loss": -27.45686912536621, "global_step": 527640, "epoch": 6357} {"train_loss": -27.2477970123291, "global_step": 527641, "epoch": 6357} {"train_loss": -27.10011100769043, "global_step": 527642, "epoch": 6357} {"train_loss": -27.219797134399414, "global_step": 527643, "epoch": 6357} {"train_loss": -27.338001251220703, "global_step": 527644, "epoch": 6357} {"train_loss": -27.211170196533203, "global_step": 527645, "epoch": 6357} {"train_loss": -27.207529067993164, "global_step": 527646, "epoch": 6357} {"train_loss": -27.192859649658203, "global_step": 527647, "epoch": 6357} {"train_loss": -27.248004913330078, "global_step": 527648, "epoch": 6357} {"train_loss": -27.081268310546875, "global_step": 527649, "epoch": 6357} {"train_loss": -27.3687744140625, "global_step": 527650, "epoch": 6357} {"train_loss": -27.25446128845215, "global_step": 527651, "epoch": 6357} {"train_loss": -27.435028076171875, "global_step": 527652, "epoch": 6357} {"train_loss": -27.089038848876953, "global_step": 527653, "epoch": 6357} {"train_loss": -27.361480712890625, "global_step": 527654, "epoch": 6357} {"train_loss": -27.377765655517578, "global_step": 527655, "epoch": 6357} {"train_loss": -27.97210693359375, "global_step": 527656, "epoch": 6357} {"train_loss": -27.571897506713867, "global_step": 527657, "epoch": 6357} {"train_loss": -27.431909561157227, "global_step": 527658, "epoch": 6357} {"train_loss": -27.38809585571289, "global_step": 527659, "epoch": 6357} {"train_loss": -27.500104904174805, "global_step": 527660, "epoch": 6357} {"train_loss": -27.461759567260742, "global_step": 527661, "epoch": 6357} {"train_loss": -27.488855361938477, "global_step": 527662, "epoch": 6357} {"train_loss": -27.730426788330078, "global_step": 527663, "epoch": 6357} {"train_loss": -27.655658721923828, "global_step": 527664, "epoch": 6357} {"train_loss": -27.53016471862793, "global_step": 527665, "epoch": 6357} {"train_loss": -27.815887451171875, "global_step": 527666, "epoch": 6357} {"train_loss": -27.66301918029785, "global_step": 527667, "epoch": 6357} {"train_loss": -27.23919105529785, "global_step": 527668, "epoch": 6357} {"train_loss": -27.43009376525879, "global_step": 527669, "epoch": 6357} {"train_loss": -27.649991989135742, "global_step": 527670, "epoch": 6357} {"train_loss": -27.515613555908203, "global_step": 527671, "epoch": 6357} {"train_loss": -27.297016143798828, "global_step": 527672, "epoch": 6357} {"train_loss": -27.856115341186523, "global_step": 527673, "epoch": 6357} {"train_loss": -27.674774169921875, "global_step": 527674, "epoch": 6357} {"train_loss": -27.885120391845703, "global_step": 527675, "epoch": 6357} {"train_loss": -27.6015625, "global_step": 527676, "epoch": 6357} {"train_loss": -27.5878849029541, "global_step": 527677, "epoch": 6357} {"train_loss": -27.761152267456055, "global_step": 527678, "epoch": 6357} {"train_loss": -27.64838981628418, "global_step": 527679, "epoch": 6357} {"train_loss": -27.64971923828125, "global_step": 527680, "epoch": 6357} {"train_loss": -27.70697021484375, "global_step": 527681, "epoch": 6357} {"train_loss": -27.326370239257812, "global_step": 527682, "epoch": 6357} {"train_loss": -27.7270450592041, "global_step": 527683, "epoch": 6357} {"train_loss": -27.49599266052246, "global_step": 527684, "epoch": 6357} {"train_loss": -27.775232315063477, "global_step": 527685, "epoch": 6357} {"train_loss": -27.57716178894043, "global_step": 527686, "epoch": 6357} {"train_loss": -27.345739364624023, "global_step": 527687, "epoch": 6357} {"train_loss": -27.352447509765625, "global_step": 527688, "epoch": 6357} {"train_loss": -27.104721069335938, "global_step": 527689, "epoch": 6357} {"train_loss": -27.62554359436035, "global_step": 527690, "epoch": 6357} {"train_loss": -27.373077392578125, "global_step": 527691, "epoch": 6357} {"train_loss": -27.52406120300293, "global_step": 527692, "epoch": 6357} {"train_loss": -27.58450698852539, "global_step": 527693, "epoch": 6357} {"train_loss": -27.071088790893555, "global_step": 527694, "epoch": 6357} {"train_loss": -27.170886993408203, "global_step": 527695, "epoch": 6357} {"train_loss": -27.096923828125, "global_step": 527696, "epoch": 6357} {"train_loss": -27.842809677124023, "global_step": 527697, "epoch": 6357} {"train_loss": -27.279455184936523, "global_step": 527698, "epoch": 6357} {"train_loss": -27.08196449279785, "global_step": 527699, "epoch": 6357} {"train_loss": -27.670196533203125, "global_step": 527700, "epoch": 6357} {"train_loss": -26.906707763671875, "global_step": 527701, "epoch": 6357} {"train_loss": -27.13184928894043, "global_step": 527702, "epoch": 6357} {"train_loss": -27.595773696899414, "global_step": 527703, "epoch": 6357} {"train_loss": -27.47088623046875, "global_step": 527704, "epoch": 6357} {"train_loss": -27.400842666625977, "global_step": 527705, "epoch": 6357} {"train_loss": -27.358783721923828, "global_step": 527706, "epoch": 6357} {"train_loss": -27.495634078979492, "global_step": 527707, "epoch": 6357} {"train_loss": -27.373676300048828, "global_step": 527708, "epoch": 6357} {"train_loss": -27.817340850830078, "global_step": 527709, "epoch": 6357} {"train_loss": -27.678442001342773, "global_step": 527710, "epoch": 6357} {"train_loss": -27.30811882019043, "global_step": 527711, "epoch": 6357} {"train_loss": -27.5574893951416, "global_step": 527712, "epoch": 6357} {"train_loss": -27.35401684404856, "global_step": 527713, "epoch": 6357, "val_loss": 6636904.0} {"train_loss": -26.581867218017578, "global_step": 527714, "epoch": 6358} {"train_loss": -26.335477828979492, "global_step": 527715, "epoch": 6358} {"train_loss": -26.796125411987305, "global_step": 527716, "epoch": 6358} {"train_loss": -26.110736846923828, "global_step": 527717, "epoch": 6358} {"train_loss": -26.42717933654785, "global_step": 527718, "epoch": 6358} {"train_loss": -27.1240234375, "global_step": 527719, "epoch": 6358} {"train_loss": -26.587955474853516, "global_step": 527720, "epoch": 6358} {"train_loss": -26.940479278564453, "global_step": 527721, "epoch": 6358} {"train_loss": -26.95078468322754, "global_step": 527722, "epoch": 6358} {"train_loss": -27.35264015197754, "global_step": 527723, "epoch": 6358} {"train_loss": -27.324811935424805, "global_step": 527724, "epoch": 6358} {"train_loss": -27.164554595947266, "global_step": 527725, "epoch": 6358} {"train_loss": -27.180322647094727, "global_step": 527726, "epoch": 6358} {"train_loss": -26.702829360961914, "global_step": 527727, "epoch": 6358} {"train_loss": -27.715911865234375, "global_step": 527728, "epoch": 6358} {"train_loss": -27.096837997436523, "global_step": 527729, "epoch": 6358} {"train_loss": -27.182697296142578, "global_step": 527730, "epoch": 6358} {"train_loss": -27.358922958374023, "global_step": 527731, "epoch": 6358} {"train_loss": -27.309619903564453, "global_step": 527732, "epoch": 6358} {"train_loss": -27.3317928314209, "global_step": 527733, "epoch": 6358} {"train_loss": -27.553436279296875, "global_step": 527734, "epoch": 6358} {"train_loss": -27.354013442993164, "global_step": 527735, "epoch": 6358} {"train_loss": -27.2331485748291, "global_step": 527736, "epoch": 6358} {"train_loss": -27.316991806030273, "global_step": 527737, "epoch": 6358} {"train_loss": -27.3718318939209, "global_step": 527738, "epoch": 6358} {"train_loss": -27.59834861755371, "global_step": 527739, "epoch": 6358} {"train_loss": -27.674917221069336, "global_step": 527740, "epoch": 6358} {"train_loss": -27.311635971069336, "global_step": 527741, "epoch": 6358} {"train_loss": -27.592529296875, "global_step": 527742, "epoch": 6358} {"train_loss": -27.382648468017578, "global_step": 527743, "epoch": 6358} {"train_loss": -27.886560440063477, "global_step": 527744, "epoch": 6358} {"train_loss": -27.593137741088867, "global_step": 527745, "epoch": 6358} {"train_loss": -27.51434898376465, "global_step": 527746, "epoch": 6358} {"train_loss": -27.67583656311035, "global_step": 527747, "epoch": 6358} {"train_loss": -27.670495986938477, "global_step": 527748, "epoch": 6358} {"train_loss": -27.838153839111328, "global_step": 527749, "epoch": 6358} {"train_loss": -27.399429321289062, "global_step": 527750, "epoch": 6358} {"train_loss": -27.8955078125, "global_step": 527751, "epoch": 6358} {"train_loss": -27.450891494750977, "global_step": 527752, "epoch": 6358} {"train_loss": -27.822113037109375, "global_step": 527753, "epoch": 6358} {"train_loss": -27.78066062927246, "global_step": 527754, "epoch": 6358} {"train_loss": -28.030126571655273, "global_step": 527755, "epoch": 6358} {"train_loss": -27.784711837768555, "global_step": 527756, "epoch": 6358} {"train_loss": -27.843320846557617, "global_step": 527757, "epoch": 6358} {"train_loss": -27.798749923706055, "global_step": 527758, "epoch": 6358} {"train_loss": -27.7427921295166, "global_step": 527759, "epoch": 6358} {"train_loss": -27.69028663635254, "global_step": 527760, "epoch": 6358} {"train_loss": -27.573505401611328, "global_step": 527761, "epoch": 6358} {"train_loss": -27.767004013061523, "global_step": 527762, "epoch": 6358} {"train_loss": -27.750808715820312, "global_step": 527763, "epoch": 6358} {"train_loss": -27.408567428588867, "global_step": 527764, "epoch": 6358} {"train_loss": -27.549524307250977, "global_step": 527765, "epoch": 6358} {"train_loss": -28.069128036499023, "global_step": 527766, "epoch": 6358} {"train_loss": -27.675922393798828, "global_step": 527767, "epoch": 6358} {"train_loss": -27.6441650390625, "global_step": 527768, "epoch": 6358} {"train_loss": -28.13470458984375, "global_step": 527769, "epoch": 6358} {"train_loss": -27.794904708862305, "global_step": 527770, "epoch": 6358} {"train_loss": -28.07456398010254, "global_step": 527771, "epoch": 6358} {"train_loss": -28.05632972717285, "global_step": 527772, "epoch": 6358} {"train_loss": -27.839706420898438, "global_step": 527773, "epoch": 6358} {"train_loss": -27.5498104095459, "global_step": 527774, "epoch": 6358} {"train_loss": -27.65598487854004, "global_step": 527775, "epoch": 6358} {"train_loss": -27.5535831451416, "global_step": 527776, "epoch": 6358} {"train_loss": -27.966230392456055, "global_step": 527777, "epoch": 6358} {"train_loss": -27.776687622070312, "global_step": 527778, "epoch": 6358} {"train_loss": -28.140811920166016, "global_step": 527779, "epoch": 6358} {"train_loss": -27.867334365844727, "global_step": 527780, "epoch": 6358} {"train_loss": -27.95916748046875, "global_step": 527781, "epoch": 6358} {"train_loss": -27.94696044921875, "global_step": 527782, "epoch": 6358} {"train_loss": -27.860095977783203, "global_step": 527783, "epoch": 6358} {"train_loss": -27.6653995513916, "global_step": 527784, "epoch": 6358} {"train_loss": -27.5645694732666, "global_step": 527785, "epoch": 6358} {"train_loss": -27.397388458251953, "global_step": 527786, "epoch": 6358} {"train_loss": -27.21550941467285, "global_step": 527787, "epoch": 6358} {"train_loss": -27.25217628479004, "global_step": 527788, "epoch": 6358} {"train_loss": -27.76188087463379, "global_step": 527789, "epoch": 6358} {"train_loss": -27.678930282592773, "global_step": 527790, "epoch": 6358} {"train_loss": -27.5863037109375, "global_step": 527791, "epoch": 6358} {"train_loss": -27.67605972290039, "global_step": 527792, "epoch": 6358} {"train_loss": -27.75240135192871, "global_step": 527793, "epoch": 6358} {"train_loss": -27.41670799255371, "global_step": 527794, "epoch": 6358} {"train_loss": -27.829919815063477, "global_step": 527795, "epoch": 6358} {"train_loss": -27.508346235895733, "global_step": 527796, "epoch": 6358, "val_loss": 6774512.0} {"train_loss": -27.675765991210938, "global_step": 527797, "epoch": 6359} {"train_loss": -27.373701095581055, "global_step": 527798, "epoch": 6359} {"train_loss": -27.59950065612793, "global_step": 527799, "epoch": 6359} {"train_loss": -27.945819854736328, "global_step": 527800, "epoch": 6359} {"train_loss": -27.392282485961914, "global_step": 527801, "epoch": 6359} {"train_loss": -27.667993545532227, "global_step": 527802, "epoch": 6359} {"train_loss": -27.21533203125, "global_step": 527803, "epoch": 6359} {"train_loss": -27.1137638092041, "global_step": 527804, "epoch": 6359} {"train_loss": -27.561603546142578, "global_step": 527805, "epoch": 6359} {"train_loss": -27.64761734008789, "global_step": 527806, "epoch": 6359} {"train_loss": -27.6834659576416, "global_step": 527807, "epoch": 6359} {"train_loss": -27.210224151611328, "global_step": 527808, "epoch": 6359} {"train_loss": -27.097732543945312, "global_step": 527809, "epoch": 6359} {"train_loss": -27.441503524780273, "global_step": 527810, "epoch": 6359} {"train_loss": -27.27863883972168, "global_step": 527811, "epoch": 6359} {"train_loss": -27.52008056640625, "global_step": 527812, "epoch": 6359} {"train_loss": -27.08197593688965, "global_step": 527813, "epoch": 6359} {"train_loss": -27.41229820251465, "global_step": 527814, "epoch": 6359} {"train_loss": -27.580097198486328, "global_step": 527815, "epoch": 6359} {"train_loss": -27.774023056030273, "global_step": 527816, "epoch": 6359} {"train_loss": -27.172834396362305, "global_step": 527817, "epoch": 6359} {"train_loss": -27.677448272705078, "global_step": 527818, "epoch": 6359} {"train_loss": -27.109664916992188, "global_step": 527819, "epoch": 6359} {"train_loss": -27.461339950561523, "global_step": 527820, "epoch": 6359} {"train_loss": -27.315841674804688, "global_step": 527821, "epoch": 6359} {"train_loss": -27.448734283447266, "global_step": 527822, "epoch": 6359} {"train_loss": -27.76129150390625, "global_step": 527823, "epoch": 6359} {"train_loss": -27.501920700073242, "global_step": 527824, "epoch": 6359} {"train_loss": -27.605016708374023, "global_step": 527825, "epoch": 6359} {"train_loss": -27.669296264648438, "global_step": 527826, "epoch": 6359} {"train_loss": -27.499698638916016, "global_step": 527827, "epoch": 6359} {"train_loss": -27.533674240112305, "global_step": 527828, "epoch": 6359} {"train_loss": -27.636367797851562, "global_step": 527829, "epoch": 6359} {"train_loss": -27.5306339263916, "global_step": 527830, "epoch": 6359} {"train_loss": -27.66717529296875, "global_step": 527831, "epoch": 6359} {"train_loss": -27.462894439697266, "global_step": 527832, "epoch": 6359} {"train_loss": -27.948596954345703, "global_step": 527833, "epoch": 6359} {"train_loss": -27.620969772338867, "global_step": 527834, "epoch": 6359} {"train_loss": -27.526208877563477, "global_step": 527835, "epoch": 6359} {"train_loss": -27.936466217041016, "global_step": 527836, "epoch": 6359} {"train_loss": -27.699798583984375, "global_step": 527837, "epoch": 6359} {"train_loss": -28.09766960144043, "global_step": 527838, "epoch": 6359} {"train_loss": -27.764799118041992, "global_step": 527839, "epoch": 6359} {"train_loss": -27.792652130126953, "global_step": 527840, "epoch": 6359} {"train_loss": -27.845294952392578, "global_step": 527841, "epoch": 6359} {"train_loss": -27.79266357421875, "global_step": 527842, "epoch": 6359} {"train_loss": -28.040180206298828, "global_step": 527843, "epoch": 6359} {"train_loss": -27.61907386779785, "global_step": 527844, "epoch": 6359} {"train_loss": -27.610715866088867, "global_step": 527845, "epoch": 6359} {"train_loss": -27.11539649963379, "global_step": 527846, "epoch": 6359} {"train_loss": -26.347640991210938, "global_step": 527847, "epoch": 6359} {"train_loss": -26.907129287719727, "global_step": 527848, "epoch": 6359} {"train_loss": -27.87407875061035, "global_step": 527849, "epoch": 6359} {"train_loss": -27.16594886779785, "global_step": 527850, "epoch": 6359} {"train_loss": -27.499282836914062, "global_step": 527851, "epoch": 6359} {"train_loss": -27.118087768554688, "global_step": 527852, "epoch": 6359} {"train_loss": -27.434736251831055, "global_step": 527853, "epoch": 6359} {"train_loss": -27.35065269470215, "global_step": 527854, "epoch": 6359} {"train_loss": -27.4171085357666, "global_step": 527855, "epoch": 6359} {"train_loss": -27.899555206298828, "global_step": 527856, "epoch": 6359} {"train_loss": -27.505146026611328, "global_step": 527857, "epoch": 6359} {"train_loss": -27.507919311523438, "global_step": 527858, "epoch": 6359} {"train_loss": -27.383169174194336, "global_step": 527859, "epoch": 6359} {"train_loss": -27.55672264099121, "global_step": 527860, "epoch": 6359} {"train_loss": -27.37775230407715, "global_step": 527861, "epoch": 6359} {"train_loss": -27.488508224487305, "global_step": 527862, "epoch": 6359} {"train_loss": -27.659687042236328, "global_step": 527863, "epoch": 6359} {"train_loss": -27.293304443359375, "global_step": 527864, "epoch": 6359} {"train_loss": -27.5109920501709, "global_step": 527865, "epoch": 6359} {"train_loss": -27.628402709960938, "global_step": 527866, "epoch": 6359} {"train_loss": -27.760305404663086, "global_step": 527867, "epoch": 6359} {"train_loss": -27.513525009155273, "global_step": 527868, "epoch": 6359} {"train_loss": -27.140491485595703, "global_step": 527869, "epoch": 6359} {"train_loss": -27.38892936706543, "global_step": 527870, "epoch": 6359} {"train_loss": -26.878559112548828, "global_step": 527871, "epoch": 6359} {"train_loss": -26.920074462890625, "global_step": 527872, "epoch": 6359} {"train_loss": -26.951993942260742, "global_step": 527873, "epoch": 6359} {"train_loss": -27.7532958984375, "global_step": 527874, "epoch": 6359} {"train_loss": -27.409561157226562, "global_step": 527875, "epoch": 6359} {"train_loss": -26.99078941345215, "global_step": 527876, "epoch": 6359} {"train_loss": -27.50153923034668, "global_step": 527877, "epoch": 6359} {"train_loss": -27.372838973999023, "global_step": 527878, "epoch": 6359} {"train_loss": -27.48702244586255, "global_step": 527879, "epoch": 6359, "val_loss": 6612846.0} {"train_loss": -27.121023178100586, "global_step": 527880, "epoch": 6360} {"train_loss": -26.63516616821289, "global_step": 527881, "epoch": 6360} {"train_loss": -26.13815689086914, "global_step": 527882, "epoch": 6360} {"train_loss": -26.769529342651367, "global_step": 527883, "epoch": 6360} {"train_loss": -26.512256622314453, "global_step": 527884, "epoch": 6360} {"train_loss": -27.114761352539062, "global_step": 527885, "epoch": 6360} {"train_loss": -26.856922149658203, "global_step": 527886, "epoch": 6360} {"train_loss": -27.035552978515625, "global_step": 527887, "epoch": 6360} {"train_loss": -26.84187889099121, "global_step": 527888, "epoch": 6360} {"train_loss": -26.95281410217285, "global_step": 527889, "epoch": 6360} {"train_loss": -27.11873435974121, "global_step": 527890, "epoch": 6360} {"train_loss": -27.474531173706055, "global_step": 527891, "epoch": 6360} {"train_loss": -27.504972457885742, "global_step": 527892, "epoch": 6360} {"train_loss": -27.028966903686523, "global_step": 527893, "epoch": 6360} {"train_loss": -27.58782386779785, "global_step": 527894, "epoch": 6360} {"train_loss": -26.8282413482666, "global_step": 527895, "epoch": 6360} {"train_loss": -27.331787109375, "global_step": 527896, "epoch": 6360} {"train_loss": -27.18021011352539, "global_step": 527897, "epoch": 6360} {"train_loss": -27.6720027923584, "global_step": 527898, "epoch": 6360} {"train_loss": -27.512243270874023, "global_step": 527899, "epoch": 6360} {"train_loss": -27.534698486328125, "global_step": 527900, "epoch": 6360} {"train_loss": -27.635318756103516, "global_step": 527901, "epoch": 6360} {"train_loss": -27.297521591186523, "global_step": 527902, "epoch": 6360} {"train_loss": -27.817419052124023, "global_step": 527903, "epoch": 6360} {"train_loss": -27.32465171813965, "global_step": 527904, "epoch": 6360} {"train_loss": -27.690509796142578, "global_step": 527905, "epoch": 6360} {"train_loss": -27.7940616607666, "global_step": 527906, "epoch": 6360} {"train_loss": -27.53639030456543, "global_step": 527907, "epoch": 6360} {"train_loss": -27.1958065032959, "global_step": 527908, "epoch": 6360} {"train_loss": -27.649377822875977, "global_step": 527909, "epoch": 6360} {"train_loss": -27.463241577148438, "global_step": 527910, "epoch": 6360} {"train_loss": -27.644428253173828, "global_step": 527911, "epoch": 6360} {"train_loss": -27.72345542907715, "global_step": 527912, "epoch": 6360} {"train_loss": -27.491926193237305, "global_step": 527913, "epoch": 6360} {"train_loss": -27.54754066467285, "global_step": 527914, "epoch": 6360} {"train_loss": -27.634552001953125, "global_step": 527915, "epoch": 6360} {"train_loss": -27.107202529907227, "global_step": 527916, "epoch": 6360} {"train_loss": -27.48335075378418, "global_step": 527917, "epoch": 6360} {"train_loss": -27.573749542236328, "global_step": 527918, "epoch": 6360} {"train_loss": -27.71660804748535, "global_step": 527919, "epoch": 6360} {"train_loss": -27.800098419189453, "global_step": 527920, "epoch": 6360} {"train_loss": -28.111658096313477, "global_step": 527921, "epoch": 6360} {"train_loss": -27.957666397094727, "global_step": 527922, "epoch": 6360} {"train_loss": -27.692291259765625, "global_step": 527923, "epoch": 6360} {"train_loss": -27.65875244140625, "global_step": 527924, "epoch": 6360} {"train_loss": -27.85285758972168, "global_step": 527925, "epoch": 6360} {"train_loss": -27.713733673095703, "global_step": 527926, "epoch": 6360} {"train_loss": -27.632802963256836, "global_step": 527927, "epoch": 6360} {"train_loss": -27.638410568237305, "global_step": 527928, "epoch": 6360} {"train_loss": -27.94068717956543, "global_step": 527929, "epoch": 6360} {"train_loss": -28.073902130126953, "global_step": 527930, "epoch": 6360} {"train_loss": -27.2978515625, "global_step": 527931, "epoch": 6360} {"train_loss": -27.6356258392334, "global_step": 527932, "epoch": 6360} {"train_loss": -27.457685470581055, "global_step": 527933, "epoch": 6360} {"train_loss": -27.323339462280273, "global_step": 527934, "epoch": 6360} {"train_loss": -27.747251510620117, "global_step": 527935, "epoch": 6360} {"train_loss": -27.157052993774414, "global_step": 527936, "epoch": 6360} {"train_loss": -27.851654052734375, "global_step": 527937, "epoch": 6360} {"train_loss": -27.26216697692871, "global_step": 527938, "epoch": 6360} {"train_loss": -27.927030563354492, "global_step": 527939, "epoch": 6360} {"train_loss": -27.173078536987305, "global_step": 527940, "epoch": 6360} {"train_loss": -27.37981605529785, "global_step": 527941, "epoch": 6360} {"train_loss": -27.393949508666992, "global_step": 527942, "epoch": 6360} {"train_loss": -27.496992111206055, "global_step": 527943, "epoch": 6360} {"train_loss": -27.395721435546875, "global_step": 527944, "epoch": 6360} {"train_loss": -27.497989654541016, "global_step": 527945, "epoch": 6360} {"train_loss": -27.629947662353516, "global_step": 527946, "epoch": 6360} {"train_loss": -27.450891494750977, "global_step": 527947, "epoch": 6360} {"train_loss": -27.311384201049805, "global_step": 527948, "epoch": 6360} {"train_loss": -26.993600845336914, "global_step": 527949, "epoch": 6360} {"train_loss": -27.89226722717285, "global_step": 527950, "epoch": 6360} {"train_loss": -27.569860458374023, "global_step": 527951, "epoch": 6360} {"train_loss": -27.433210372924805, "global_step": 527952, "epoch": 6360} {"train_loss": -27.557214736938477, "global_step": 527953, "epoch": 6360} {"train_loss": -27.539636611938477, "global_step": 527954, "epoch": 6360} {"train_loss": -27.39688491821289, "global_step": 527955, "epoch": 6360} {"train_loss": -27.651081085205078, "global_step": 527956, "epoch": 6360} {"train_loss": -27.511316299438477, "global_step": 527957, "epoch": 6360} {"train_loss": -27.424402236938477, "global_step": 527958, "epoch": 6360} {"train_loss": -27.496389389038086, "global_step": 527959, "epoch": 6360} {"train_loss": -27.34632682800293, "global_step": 527960, "epoch": 6360} {"train_loss": -26.95011329650879, "global_step": 527961, "epoch": 6360} {"train_loss": -27.41627150845815, "global_step": 527962, "epoch": 6360, "val_loss": 6554941.0} {"train_loss": -27.0301570892334, "global_step": 527963, "epoch": 6361} {"train_loss": -26.655969619750977, "global_step": 527964, "epoch": 6361} {"train_loss": -27.46795654296875, "global_step": 527965, "epoch": 6361} {"train_loss": -27.2215633392334, "global_step": 527966, "epoch": 6361} {"train_loss": -27.122760772705078, "global_step": 527967, "epoch": 6361} {"train_loss": -26.99165153503418, "global_step": 527968, "epoch": 6361} {"train_loss": -26.82765769958496, "global_step": 527969, "epoch": 6361} {"train_loss": -27.0627498626709, "global_step": 527970, "epoch": 6361} {"train_loss": -27.333105087280273, "global_step": 527971, "epoch": 6361} {"train_loss": -27.25494956970215, "global_step": 527972, "epoch": 6361} {"train_loss": -27.174560546875, "global_step": 527973, "epoch": 6361} {"train_loss": -27.10959243774414, "global_step": 527974, "epoch": 6361} {"train_loss": -27.327051162719727, "global_step": 527975, "epoch": 6361} {"train_loss": -27.305877685546875, "global_step": 527976, "epoch": 6361} {"train_loss": -27.62904167175293, "global_step": 527977, "epoch": 6361} {"train_loss": -27.482568740844727, "global_step": 527978, "epoch": 6361} {"train_loss": -27.480493545532227, "global_step": 527979, "epoch": 6361} {"train_loss": -27.337072372436523, "global_step": 527980, "epoch": 6361} {"train_loss": -27.336883544921875, "global_step": 527981, "epoch": 6361} {"train_loss": -27.66546630859375, "global_step": 527982, "epoch": 6361} {"train_loss": -27.18413734436035, "global_step": 527983, "epoch": 6361} {"train_loss": -27.11109733581543, "global_step": 527984, "epoch": 6361} {"train_loss": -27.83135414123535, "global_step": 527985, "epoch": 6361} {"train_loss": -27.138891220092773, "global_step": 527986, "epoch": 6361} {"train_loss": -27.795026779174805, "global_step": 527987, "epoch": 6361} {"train_loss": -27.62532615661621, "global_step": 527988, "epoch": 6361} {"train_loss": -27.34052085876465, "global_step": 527989, "epoch": 6361} {"train_loss": -27.774585723876953, "global_step": 527990, "epoch": 6361} {"train_loss": -27.211261749267578, "global_step": 527991, "epoch": 6361} {"train_loss": -27.535364151000977, "global_step": 527992, "epoch": 6361} {"train_loss": -27.841236114501953, "global_step": 527993, "epoch": 6361} {"train_loss": -27.364303588867188, "global_step": 527994, "epoch": 6361} {"train_loss": -27.68629264831543, "global_step": 527995, "epoch": 6361} {"train_loss": -27.219934463500977, "global_step": 527996, "epoch": 6361} {"train_loss": -27.35748863220215, "global_step": 527997, "epoch": 6361} {"train_loss": -27.36920738220215, "global_step": 527998, "epoch": 6361} {"train_loss": -27.70440673828125, "global_step": 527999, "epoch": 6361} {"train_loss": -27.716154098510742, "global_step": 528000, "epoch": 6361} {"train_loss": -27.84354591369629, "global_step": 528001, "epoch": 6361} {"train_loss": -27.830917358398438, "global_step": 528002, "epoch": 6361} {"train_loss": -27.7877197265625, "global_step": 528003, "epoch": 6361} {"train_loss": -27.971582412719727, "global_step": 528004, "epoch": 6361} {"train_loss": -27.789020538330078, "global_step": 528005, "epoch": 6361} {"train_loss": -27.6968994140625, "global_step": 528006, "epoch": 6361} {"train_loss": -27.782880783081055, "global_step": 528007, "epoch": 6361} {"train_loss": -27.500335693359375, "global_step": 528008, "epoch": 6361} {"train_loss": -27.75239372253418, "global_step": 528009, "epoch": 6361} {"train_loss": -27.8386173248291, "global_step": 528010, "epoch": 6361} {"train_loss": -27.185544967651367, "global_step": 528011, "epoch": 6361} {"train_loss": -27.6533260345459, "global_step": 528012, "epoch": 6361} {"train_loss": -27.404529571533203, "global_step": 528013, "epoch": 6361} {"train_loss": -27.663415908813477, "global_step": 528014, "epoch": 6361} {"train_loss": -27.598453521728516, "global_step": 528015, "epoch": 6361} {"train_loss": -27.432266235351562, "global_step": 528016, "epoch": 6361} {"train_loss": -27.78907585144043, "global_step": 528017, "epoch": 6361} {"train_loss": -27.493066787719727, "global_step": 528018, "epoch": 6361} {"train_loss": -27.789865493774414, "global_step": 528019, "epoch": 6361} {"train_loss": -27.72468376159668, "global_step": 528020, "epoch": 6361} {"train_loss": -27.49930763244629, "global_step": 528021, "epoch": 6361} {"train_loss": -27.581212997436523, "global_step": 528022, "epoch": 6361} {"train_loss": -27.70529556274414, "global_step": 528023, "epoch": 6361} {"train_loss": -27.485675811767578, "global_step": 528024, "epoch": 6361} {"train_loss": -27.787988662719727, "global_step": 528025, "epoch": 6361} {"train_loss": -27.58902931213379, "global_step": 528026, "epoch": 6361} {"train_loss": -27.481903076171875, "global_step": 528027, "epoch": 6361} {"train_loss": -27.862451553344727, "global_step": 528028, "epoch": 6361} {"train_loss": -27.858234405517578, "global_step": 528029, "epoch": 6361} {"train_loss": -27.60776710510254, "global_step": 528030, "epoch": 6361} {"train_loss": -27.928525924682617, "global_step": 528031, "epoch": 6361} {"train_loss": -27.712268829345703, "global_step": 528032, "epoch": 6361} {"train_loss": -27.677228927612305, "global_step": 528033, "epoch": 6361} {"train_loss": -27.4488582611084, "global_step": 528034, "epoch": 6361} {"train_loss": -27.792627334594727, "global_step": 528035, "epoch": 6361} {"train_loss": -27.7289981842041, "global_step": 528036, "epoch": 6361} {"train_loss": -27.426538467407227, "global_step": 528037, "epoch": 6361} {"train_loss": -27.700056076049805, "global_step": 528038, "epoch": 6361} {"train_loss": -27.354352951049805, "global_step": 528039, "epoch": 6361} {"train_loss": -27.76559829711914, "global_step": 528040, "epoch": 6361} {"train_loss": -28.04966163635254, "global_step": 528041, "epoch": 6361} {"train_loss": -27.80596351623535, "global_step": 528042, "epoch": 6361} {"train_loss": -27.835840225219727, "global_step": 528043, "epoch": 6361} {"train_loss": -27.49134635925293, "global_step": 528044, "epoch": 6361} {"train_loss": -27.511100929903698, "global_step": 528045, "epoch": 6361, "val_loss": 6534037.0} {"train_loss": -24.62994384765625, "global_step": 528046, "epoch": 6362} {"train_loss": -24.996381759643555, "global_step": 528047, "epoch": 6362} {"train_loss": -26.9378719329834, "global_step": 528048, "epoch": 6362} {"train_loss": -25.705663681030273, "global_step": 528049, "epoch": 6362} {"train_loss": -26.57594108581543, "global_step": 528050, "epoch": 6362} {"train_loss": -26.128141403198242, "global_step": 528051, "epoch": 6362} {"train_loss": -26.384313583374023, "global_step": 528052, "epoch": 6362} {"train_loss": -26.60003089904785, "global_step": 528053, "epoch": 6362} {"train_loss": -26.667179107666016, "global_step": 528054, "epoch": 6362} {"train_loss": -26.69375991821289, "global_step": 528055, "epoch": 6362} {"train_loss": -26.878156661987305, "global_step": 528056, "epoch": 6362} {"train_loss": -26.732147216796875, "global_step": 528057, "epoch": 6362} {"train_loss": -26.914306640625, "global_step": 528058, "epoch": 6362} {"train_loss": -27.078245162963867, "global_step": 528059, "epoch": 6362} {"train_loss": -27.02874183654785, "global_step": 528060, "epoch": 6362} {"train_loss": -26.644773483276367, "global_step": 528061, "epoch": 6362} {"train_loss": -27.28577995300293, "global_step": 528062, "epoch": 6362} {"train_loss": -26.931060791015625, "global_step": 528063, "epoch": 6362} {"train_loss": -26.988245010375977, "global_step": 528064, "epoch": 6362} {"train_loss": -27.2501220703125, "global_step": 528065, "epoch": 6362} {"train_loss": -26.77242088317871, "global_step": 528066, "epoch": 6362} {"train_loss": -27.32500648498535, "global_step": 528067, "epoch": 6362} {"train_loss": -27.268451690673828, "global_step": 528068, "epoch": 6362} {"train_loss": -27.50990867614746, "global_step": 528069, "epoch": 6362} {"train_loss": -27.338834762573242, "global_step": 528070, "epoch": 6362} {"train_loss": -27.54047203063965, "global_step": 528071, "epoch": 6362} {"train_loss": -27.315570831298828, "global_step": 528072, "epoch": 6362} {"train_loss": -27.230457305908203, "global_step": 528073, "epoch": 6362} {"train_loss": -27.413715362548828, "global_step": 528074, "epoch": 6362} {"train_loss": -27.476469039916992, "global_step": 528075, "epoch": 6362} {"train_loss": -27.291181564331055, "global_step": 528076, "epoch": 6362} {"train_loss": -27.58021354675293, "global_step": 528077, "epoch": 6362} {"train_loss": -27.64841651916504, "global_step": 528078, "epoch": 6362} {"train_loss": -27.784299850463867, "global_step": 528079, "epoch": 6362} {"train_loss": -27.909320831298828, "global_step": 528080, "epoch": 6362} {"train_loss": -27.04204750061035, "global_step": 528081, "epoch": 6362} {"train_loss": -27.70151138305664, "global_step": 528082, "epoch": 6362} {"train_loss": -27.42286491394043, "global_step": 528083, "epoch": 6362} {"train_loss": -27.534765243530273, "global_step": 528084, "epoch": 6362} {"train_loss": -27.448644638061523, "global_step": 528085, "epoch": 6362} {"train_loss": -27.615407943725586, "global_step": 528086, "epoch": 6362} {"train_loss": -27.818578720092773, "global_step": 528087, "epoch": 6362} {"train_loss": -27.543060302734375, "global_step": 528088, "epoch": 6362} {"train_loss": -27.670896530151367, "global_step": 528089, "epoch": 6362} {"train_loss": -27.478158950805664, "global_step": 528090, "epoch": 6362} {"train_loss": -27.893341064453125, "global_step": 528091, "epoch": 6362} {"train_loss": -27.703094482421875, "global_step": 528092, "epoch": 6362} {"train_loss": -27.62677574157715, "global_step": 528093, "epoch": 6362} {"train_loss": -27.8138427734375, "global_step": 528094, "epoch": 6362} {"train_loss": -28.0269832611084, "global_step": 528095, "epoch": 6362} {"train_loss": -27.8183536529541, "global_step": 528096, "epoch": 6362} {"train_loss": -28.041685104370117, "global_step": 528097, "epoch": 6362} {"train_loss": -27.870512008666992, "global_step": 528098, "epoch": 6362} {"train_loss": -27.77215003967285, "global_step": 528099, "epoch": 6362} {"train_loss": -27.91162109375, "global_step": 528100, "epoch": 6362} {"train_loss": -27.945953369140625, "global_step": 528101, "epoch": 6362} {"train_loss": -27.573713302612305, "global_step": 528102, "epoch": 6362} {"train_loss": -27.943695068359375, "global_step": 528103, "epoch": 6362} {"train_loss": -27.447895050048828, "global_step": 528104, "epoch": 6362} {"train_loss": -27.211200714111328, "global_step": 528105, "epoch": 6362} {"train_loss": -27.99005126953125, "global_step": 528106, "epoch": 6362} {"train_loss": -27.300703048706055, "global_step": 528107, "epoch": 6362} {"train_loss": -27.538898468017578, "global_step": 528108, "epoch": 6362} {"train_loss": -27.65106201171875, "global_step": 528109, "epoch": 6362} {"train_loss": -27.320581436157227, "global_step": 528110, "epoch": 6362} {"train_loss": -27.72043800354004, "global_step": 528111, "epoch": 6362} {"train_loss": -27.09577751159668, "global_step": 528112, "epoch": 6362} {"train_loss": -27.433856964111328, "global_step": 528113, "epoch": 6362} {"train_loss": -27.791650772094727, "global_step": 528114, "epoch": 6362} {"train_loss": -27.44207763671875, "global_step": 528115, "epoch": 6362} {"train_loss": -27.363391876220703, "global_step": 528116, "epoch": 6362} {"train_loss": -27.235166549682617, "global_step": 528117, "epoch": 6362} {"train_loss": -27.577194213867188, "global_step": 528118, "epoch": 6362} {"train_loss": -27.2207088470459, "global_step": 528119, "epoch": 6362} {"train_loss": -27.563007354736328, "global_step": 528120, "epoch": 6362} {"train_loss": -27.45905876159668, "global_step": 528121, "epoch": 6362} {"train_loss": -27.98077964782715, "global_step": 528122, "epoch": 6362} {"train_loss": -27.696399688720703, "global_step": 528123, "epoch": 6362} {"train_loss": -27.4205265045166, "global_step": 528124, "epoch": 6362} {"train_loss": -27.907516479492188, "global_step": 528125, "epoch": 6362} {"train_loss": -27.600889205932617, "global_step": 528126, "epoch": 6362} {"train_loss": -27.658370971679688, "global_step": 528127, "epoch": 6362} {"train_loss": -27.328757780144013, "global_step": 528128, "epoch": 6362, "val_loss": 6489664.0} {"train_loss": -26.517841339111328, "global_step": 528129, "epoch": 6363} {"train_loss": -26.72199058532715, "global_step": 528130, "epoch": 6363} {"train_loss": -26.22043800354004, "global_step": 528131, "epoch": 6363} {"train_loss": -26.558698654174805, "global_step": 528132, "epoch": 6363} {"train_loss": -26.5297908782959, "global_step": 528133, "epoch": 6363} {"train_loss": -27.030731201171875, "global_step": 528134, "epoch": 6363} {"train_loss": -26.5749568939209, "global_step": 528135, "epoch": 6363} {"train_loss": -26.751951217651367, "global_step": 528136, "epoch": 6363} {"train_loss": -26.814258575439453, "global_step": 528137, "epoch": 6363} {"train_loss": -26.62864112854004, "global_step": 528138, "epoch": 6363} {"train_loss": -26.42317771911621, "global_step": 528139, "epoch": 6363} {"train_loss": -26.762720108032227, "global_step": 528140, "epoch": 6363} {"train_loss": -26.4426212310791, "global_step": 528141, "epoch": 6363} {"train_loss": -26.81036949157715, "global_step": 528142, "epoch": 6363} {"train_loss": -26.903844833374023, "global_step": 528143, "epoch": 6363} {"train_loss": -26.3814640045166, "global_step": 528144, "epoch": 6363} {"train_loss": -27.05263328552246, "global_step": 528145, "epoch": 6363} {"train_loss": -27.3105525970459, "global_step": 528146, "epoch": 6363} {"train_loss": -26.590818405151367, "global_step": 528147, "epoch": 6363} {"train_loss": -26.946857452392578, "global_step": 528148, "epoch": 6363} {"train_loss": -27.053363800048828, "global_step": 528149, "epoch": 6363} {"train_loss": -27.144784927368164, "global_step": 528150, "epoch": 6363} {"train_loss": -26.964513778686523, "global_step": 528151, "epoch": 6363} {"train_loss": -27.094263076782227, "global_step": 528152, "epoch": 6363} {"train_loss": -27.162113189697266, "global_step": 528153, "epoch": 6363} {"train_loss": -27.34733009338379, "global_step": 528154, "epoch": 6363} {"train_loss": -27.31226921081543, "global_step": 528155, "epoch": 6363} {"train_loss": -27.14023208618164, "global_step": 528156, "epoch": 6363} {"train_loss": -27.475067138671875, "global_step": 528157, "epoch": 6363} {"train_loss": -27.20637321472168, "global_step": 528158, "epoch": 6363} {"train_loss": -27.141632080078125, "global_step": 528159, "epoch": 6363} {"train_loss": -27.479597091674805, "global_step": 528160, "epoch": 6363} {"train_loss": -27.663928985595703, "global_step": 528161, "epoch": 6363} {"train_loss": -27.45347023010254, "global_step": 528162, "epoch": 6363} {"train_loss": -27.339004516601562, "global_step": 528163, "epoch": 6363} {"train_loss": -27.47608757019043, "global_step": 528164, "epoch": 6363} {"train_loss": -27.272241592407227, "global_step": 528165, "epoch": 6363} {"train_loss": -27.645483016967773, "global_step": 528166, "epoch": 6363} {"train_loss": -27.649890899658203, "global_step": 528167, "epoch": 6363} {"train_loss": -27.640417098999023, "global_step": 528168, "epoch": 6363} {"train_loss": -27.63579750061035, "global_step": 528169, "epoch": 6363} {"train_loss": -27.7674617767334, "global_step": 528170, "epoch": 6363} {"train_loss": -27.658411026000977, "global_step": 528171, "epoch": 6363} {"train_loss": -27.66119384765625, "global_step": 528172, "epoch": 6363} {"train_loss": -27.421613693237305, "global_step": 528173, "epoch": 6363} {"train_loss": -27.695449829101562, "global_step": 528174, "epoch": 6363} {"train_loss": -27.63494300842285, "global_step": 528175, "epoch": 6363} {"train_loss": -27.7291316986084, "global_step": 528176, "epoch": 6363} {"train_loss": -27.55704689025879, "global_step": 528177, "epoch": 6363} {"train_loss": -27.638324737548828, "global_step": 528178, "epoch": 6363} {"train_loss": -27.713104248046875, "global_step": 528179, "epoch": 6363} {"train_loss": -27.723623275756836, "global_step": 528180, "epoch": 6363} {"train_loss": -27.791112899780273, "global_step": 528181, "epoch": 6363} {"train_loss": -28.203290939331055, "global_step": 528182, "epoch": 6363} {"train_loss": -27.772531509399414, "global_step": 528183, "epoch": 6363} {"train_loss": -27.60098648071289, "global_step": 528184, "epoch": 6363} {"train_loss": -28.09501075744629, "global_step": 528185, "epoch": 6363} {"train_loss": -27.575002670288086, "global_step": 528186, "epoch": 6363} {"train_loss": -27.694921493530273, "global_step": 528187, "epoch": 6363} {"train_loss": -27.754240036010742, "global_step": 528188, "epoch": 6363} {"train_loss": -27.906845092773438, "global_step": 528189, "epoch": 6363} {"train_loss": -27.96726417541504, "global_step": 528190, "epoch": 6363} {"train_loss": -27.382837295532227, "global_step": 528191, "epoch": 6363} {"train_loss": -27.353734970092773, "global_step": 528192, "epoch": 6363} {"train_loss": -27.980823516845703, "global_step": 528193, "epoch": 6363} {"train_loss": -27.833908081054688, "global_step": 528194, "epoch": 6363} {"train_loss": -27.79793357849121, "global_step": 528195, "epoch": 6363} {"train_loss": -27.821426391601562, "global_step": 528196, "epoch": 6363} {"train_loss": -27.952850341796875, "global_step": 528197, "epoch": 6363} {"train_loss": -27.84815788269043, "global_step": 528198, "epoch": 6363} {"train_loss": -27.664976119995117, "global_step": 528199, "epoch": 6363} {"train_loss": -27.6207332611084, "global_step": 528200, "epoch": 6363} {"train_loss": -27.295454025268555, "global_step": 528201, "epoch": 6363} {"train_loss": -27.6674747467041, "global_step": 528202, "epoch": 6363} {"train_loss": -27.419452667236328, "global_step": 528203, "epoch": 6363} {"train_loss": -27.206470489501953, "global_step": 528204, "epoch": 6363} {"train_loss": -27.333576202392578, "global_step": 528205, "epoch": 6363} {"train_loss": -27.278461456298828, "global_step": 528206, "epoch": 6363} {"train_loss": -27.383214950561523, "global_step": 528207, "epoch": 6363} {"train_loss": -27.10187339782715, "global_step": 528208, "epoch": 6363} {"train_loss": -27.19856834411621, "global_step": 528209, "epoch": 6363} {"train_loss": -27.658124923706055, "global_step": 528210, "epoch": 6363} {"train_loss": -27.363566547991283, "global_step": 528211, "epoch": 6363, "val_loss": 6600117.0} {"train_loss": -27.01374626159668, "global_step": 528212, "epoch": 6364} {"train_loss": -26.53028678894043, "global_step": 528213, "epoch": 6364} {"train_loss": -26.7106990814209, "global_step": 528214, "epoch": 6364} {"train_loss": -26.66705894470215, "global_step": 528215, "epoch": 6364} {"train_loss": -26.297571182250977, "global_step": 528216, "epoch": 6364} {"train_loss": -26.22791862487793, "global_step": 528217, "epoch": 6364} {"train_loss": -26.89297866821289, "global_step": 528218, "epoch": 6364} {"train_loss": -27.1419620513916, "global_step": 528219, "epoch": 6364} {"train_loss": -26.483850479125977, "global_step": 528220, "epoch": 6364} {"train_loss": -27.0050048828125, "global_step": 528221, "epoch": 6364} {"train_loss": -27.09307289123535, "global_step": 528222, "epoch": 6364} {"train_loss": -27.3963680267334, "global_step": 528223, "epoch": 6364} {"train_loss": -26.916229248046875, "global_step": 528224, "epoch": 6364} {"train_loss": -27.085859298706055, "global_step": 528225, "epoch": 6364} {"train_loss": -27.626508712768555, "global_step": 528226, "epoch": 6364} {"train_loss": -27.095258712768555, "global_step": 528227, "epoch": 6364} {"train_loss": -27.1745662689209, "global_step": 528228, "epoch": 6364} {"train_loss": -27.4544620513916, "global_step": 528229, "epoch": 6364} {"train_loss": -27.061100006103516, "global_step": 528230, "epoch": 6364} {"train_loss": -27.609094619750977, "global_step": 528231, "epoch": 6364} {"train_loss": -27.477569580078125, "global_step": 528232, "epoch": 6364} {"train_loss": -27.540069580078125, "global_step": 528233, "epoch": 6364} {"train_loss": -27.324888229370117, "global_step": 528234, "epoch": 6364} {"train_loss": -27.951086044311523, "global_step": 528235, "epoch": 6364} {"train_loss": -27.606794357299805, "global_step": 528236, "epoch": 6364} {"train_loss": -27.585485458374023, "global_step": 528237, "epoch": 6364} {"train_loss": -27.37507438659668, "global_step": 528238, "epoch": 6364} {"train_loss": -27.506052017211914, "global_step": 528239, "epoch": 6364} {"train_loss": -27.364013671875, "global_step": 528240, "epoch": 6364} {"train_loss": -28.018274307250977, "global_step": 528241, "epoch": 6364} {"train_loss": -27.695255279541016, "global_step": 528242, "epoch": 6364} {"train_loss": -27.55653190612793, "global_step": 528243, "epoch": 6364} {"train_loss": -27.579504013061523, "global_step": 528244, "epoch": 6364} {"train_loss": -27.8442325592041, "global_step": 528245, "epoch": 6364} {"train_loss": -27.774795532226562, "global_step": 528246, "epoch": 6364} {"train_loss": -27.738693237304688, "global_step": 528247, "epoch": 6364} {"train_loss": -27.880151748657227, "global_step": 528248, "epoch": 6364} {"train_loss": -27.90156364440918, "global_step": 528249, "epoch": 6364} {"train_loss": -27.5891170501709, "global_step": 528250, "epoch": 6364} {"train_loss": -27.417707443237305, "global_step": 528251, "epoch": 6364} {"train_loss": -27.530248641967773, "global_step": 528252, "epoch": 6364} {"train_loss": -27.733755111694336, "global_step": 528253, "epoch": 6364} {"train_loss": -27.394006729125977, "global_step": 528254, "epoch": 6364} {"train_loss": -27.86756706237793, "global_step": 528255, "epoch": 6364} {"train_loss": -27.343488693237305, "global_step": 528256, "epoch": 6364} {"train_loss": -28.045455932617188, "global_step": 528257, "epoch": 6364} {"train_loss": -27.73760986328125, "global_step": 528258, "epoch": 6364} {"train_loss": -27.92972183227539, "global_step": 528259, "epoch": 6364} {"train_loss": -27.701202392578125, "global_step": 528260, "epoch": 6364} {"train_loss": -28.035634994506836, "global_step": 528261, "epoch": 6364} {"train_loss": -27.995458602905273, "global_step": 528262, "epoch": 6364} {"train_loss": -27.77699089050293, "global_step": 528263, "epoch": 6364} {"train_loss": -27.90606689453125, "global_step": 528264, "epoch": 6364} {"train_loss": -27.931747436523438, "global_step": 528265, "epoch": 6364} {"train_loss": -27.778675079345703, "global_step": 528266, "epoch": 6364} {"train_loss": -27.52565574645996, "global_step": 528267, "epoch": 6364} {"train_loss": -27.93780517578125, "global_step": 528268, "epoch": 6364} {"train_loss": -27.69809913635254, "global_step": 528269, "epoch": 6364} {"train_loss": -28.0305118560791, "global_step": 528270, "epoch": 6364} {"train_loss": -28.0296630859375, "global_step": 528271, "epoch": 6364} {"train_loss": -27.801971435546875, "global_step": 528272, "epoch": 6364} {"train_loss": -27.418542861938477, "global_step": 528273, "epoch": 6364} {"train_loss": -28.14215087890625, "global_step": 528274, "epoch": 6364} {"train_loss": -28.058469772338867, "global_step": 528275, "epoch": 6364} {"train_loss": -27.479116439819336, "global_step": 528276, "epoch": 6364} {"train_loss": -27.539297103881836, "global_step": 528277, "epoch": 6364} {"train_loss": -27.69679069519043, "global_step": 528278, "epoch": 6364} {"train_loss": -27.588104248046875, "global_step": 528279, "epoch": 6364} {"train_loss": -27.69227409362793, "global_step": 528280, "epoch": 6364} {"train_loss": -27.303937911987305, "global_step": 528281, "epoch": 6364} {"train_loss": -27.20912742614746, "global_step": 528282, "epoch": 6364} {"train_loss": -26.278223037719727, "global_step": 528283, "epoch": 6364} {"train_loss": -25.639511108398438, "global_step": 528284, "epoch": 6364} {"train_loss": -25.588327407836914, "global_step": 528285, "epoch": 6364} {"train_loss": -26.380945205688477, "global_step": 528286, "epoch": 6364} {"train_loss": -26.774890899658203, "global_step": 528287, "epoch": 6364} {"train_loss": -25.789356231689453, "global_step": 528288, "epoch": 6364} {"train_loss": -25.466724395751953, "global_step": 528289, "epoch": 6364} {"train_loss": -27.069107055664062, "global_step": 528290, "epoch": 6364} {"train_loss": -26.417776107788086, "global_step": 528291, "epoch": 6364} {"train_loss": -26.268762588500977, "global_step": 528292, "epoch": 6364} {"train_loss": -27.141016006469727, "global_step": 528293, "epoch": 6364} {"train_loss": -27.31338510168604, "global_step": 528294, "epoch": 6364, "val_loss": 6737884.5} {"train_loss": -26.273731231689453, "global_step": 528295, "epoch": 6365} {"train_loss": -26.50909423828125, "global_step": 528296, "epoch": 6365} {"train_loss": -26.0201416015625, "global_step": 528297, "epoch": 6365} {"train_loss": -26.423877716064453, "global_step": 528298, "epoch": 6365} {"train_loss": -26.25461196899414, "global_step": 528299, "epoch": 6365} {"train_loss": -26.395044326782227, "global_step": 528300, "epoch": 6365} {"train_loss": -26.34730339050293, "global_step": 528301, "epoch": 6365} {"train_loss": -26.60584831237793, "global_step": 528302, "epoch": 6365} {"train_loss": -26.69547462463379, "global_step": 528303, "epoch": 6365} {"train_loss": -26.545576095581055, "global_step": 528304, "epoch": 6365} {"train_loss": -26.773406982421875, "global_step": 528305, "epoch": 6365} {"train_loss": -26.3037166595459, "global_step": 528306, "epoch": 6365} {"train_loss": -26.767404556274414, "global_step": 528307, "epoch": 6365} {"train_loss": -26.818769454956055, "global_step": 528308, "epoch": 6365} {"train_loss": -26.901044845581055, "global_step": 528309, "epoch": 6365} {"train_loss": -26.817808151245117, "global_step": 528310, "epoch": 6365} {"train_loss": -26.96550941467285, "global_step": 528311, "epoch": 6365} {"train_loss": -26.727025985717773, "global_step": 528312, "epoch": 6365} {"train_loss": -27.16497802734375, "global_step": 528313, "epoch": 6365} {"train_loss": -27.138782501220703, "global_step": 528314, "epoch": 6365} {"train_loss": -26.956512451171875, "global_step": 528315, "epoch": 6365} {"train_loss": -27.17266273498535, "global_step": 528316, "epoch": 6365} {"train_loss": -26.729766845703125, "global_step": 528317, "epoch": 6365} {"train_loss": -27.44098472595215, "global_step": 528318, "epoch": 6365} {"train_loss": -27.17453384399414, "global_step": 528319, "epoch": 6365} {"train_loss": -27.058629989624023, "global_step": 528320, "epoch": 6365} {"train_loss": -27.274473190307617, "global_step": 528321, "epoch": 6365} {"train_loss": -27.41244888305664, "global_step": 528322, "epoch": 6365} {"train_loss": -27.049047470092773, "global_step": 528323, "epoch": 6365} {"train_loss": -27.281509399414062, "global_step": 528324, "epoch": 6365} {"train_loss": -27.380727767944336, "global_step": 528325, "epoch": 6365} {"train_loss": -27.604475021362305, "global_step": 528326, "epoch": 6365} {"train_loss": -27.017072677612305, "global_step": 528327, "epoch": 6365} {"train_loss": -27.27654457092285, "global_step": 528328, "epoch": 6365} {"train_loss": -27.5715389251709, "global_step": 528329, "epoch": 6365} {"train_loss": -27.43195152282715, "global_step": 528330, "epoch": 6365} {"train_loss": -27.20587158203125, "global_step": 528331, "epoch": 6365} {"train_loss": -27.685739517211914, "global_step": 528332, "epoch": 6365} {"train_loss": -27.70611000061035, "global_step": 528333, "epoch": 6365} {"train_loss": -27.75082778930664, "global_step": 528334, "epoch": 6365} {"train_loss": -27.50355339050293, "global_step": 528335, "epoch": 6365} {"train_loss": -27.57952880859375, "global_step": 528336, "epoch": 6365} {"train_loss": -27.428104400634766, "global_step": 528337, "epoch": 6365} {"train_loss": -27.811431884765625, "global_step": 528338, "epoch": 6365} {"train_loss": -27.201501846313477, "global_step": 528339, "epoch": 6365} {"train_loss": -27.806171417236328, "global_step": 528340, "epoch": 6365} {"train_loss": -27.52029800415039, "global_step": 528341, "epoch": 6365} {"train_loss": -27.750768661499023, "global_step": 528342, "epoch": 6365} {"train_loss": -27.740262985229492, "global_step": 528343, "epoch": 6365} {"train_loss": -27.897663116455078, "global_step": 528344, "epoch": 6365} {"train_loss": -27.6402587890625, "global_step": 528345, "epoch": 6365} {"train_loss": -27.834823608398438, "global_step": 528346, "epoch": 6365} {"train_loss": -27.772464752197266, "global_step": 528347, "epoch": 6365} {"train_loss": -27.824447631835938, "global_step": 528348, "epoch": 6365} {"train_loss": -27.929519653320312, "global_step": 528349, "epoch": 6365} {"train_loss": -27.822742462158203, "global_step": 528350, "epoch": 6365} {"train_loss": -27.791685104370117, "global_step": 528351, "epoch": 6365} {"train_loss": -27.8630313873291, "global_step": 528352, "epoch": 6365} {"train_loss": -27.6777400970459, "global_step": 528353, "epoch": 6365} {"train_loss": -27.38152503967285, "global_step": 528354, "epoch": 6365} {"train_loss": -27.814477920532227, "global_step": 528355, "epoch": 6365} {"train_loss": -27.734888076782227, "global_step": 528356, "epoch": 6365} {"train_loss": -27.802412033081055, "global_step": 528357, "epoch": 6365} {"train_loss": -27.5640869140625, "global_step": 528358, "epoch": 6365} {"train_loss": -27.770740509033203, "global_step": 528359, "epoch": 6365} {"train_loss": -27.724496841430664, "global_step": 528360, "epoch": 6365} {"train_loss": -27.385801315307617, "global_step": 528361, "epoch": 6365} {"train_loss": -27.698272705078125, "global_step": 528362, "epoch": 6365} {"train_loss": -27.74700355529785, "global_step": 528363, "epoch": 6365} {"train_loss": -27.885787963867188, "global_step": 528364, "epoch": 6365} {"train_loss": -26.890188217163086, "global_step": 528365, "epoch": 6365} {"train_loss": -27.217432022094727, "global_step": 528366, "epoch": 6365} {"train_loss": -27.105825424194336, "global_step": 528367, "epoch": 6365} {"train_loss": -26.624753952026367, "global_step": 528368, "epoch": 6365} {"train_loss": -26.655353546142578, "global_step": 528369, "epoch": 6365} {"train_loss": -26.729108810424805, "global_step": 528370, "epoch": 6365} {"train_loss": -26.976964950561523, "global_step": 528371, "epoch": 6365} {"train_loss": -27.23476219177246, "global_step": 528372, "epoch": 6365} {"train_loss": -26.97480583190918, "global_step": 528373, "epoch": 6365} {"train_loss": -27.269697189331055, "global_step": 528374, "epoch": 6365} {"train_loss": -27.31315040588379, "global_step": 528375, "epoch": 6365} {"train_loss": -27.449045181274414, "global_step": 528376, "epoch": 6365} {"train_loss": -27.249724905174897, "global_step": 528377, "epoch": 6365, "val_loss": 6587752.0} {"train_loss": -26.5089054107666, "global_step": 528378, "epoch": 6366} {"train_loss": -27.244474411010742, "global_step": 528379, "epoch": 6366} {"train_loss": -26.878149032592773, "global_step": 528380, "epoch": 6366} {"train_loss": -27.079381942749023, "global_step": 528381, "epoch": 6366} {"train_loss": -27.074193954467773, "global_step": 528382, "epoch": 6366} {"train_loss": -27.19219398498535, "global_step": 528383, "epoch": 6366} {"train_loss": -27.24793815612793, "global_step": 528384, "epoch": 6366} {"train_loss": -27.16396141052246, "global_step": 528385, "epoch": 6366} {"train_loss": -27.078388214111328, "global_step": 528386, "epoch": 6366} {"train_loss": -27.172910690307617, "global_step": 528387, "epoch": 6366} {"train_loss": -27.488462448120117, "global_step": 528388, "epoch": 6366} {"train_loss": -27.067493438720703, "global_step": 528389, "epoch": 6366} {"train_loss": -27.045440673828125, "global_step": 528390, "epoch": 6366} {"train_loss": -26.9786434173584, "global_step": 528391, "epoch": 6366} {"train_loss": -27.282743453979492, "global_step": 528392, "epoch": 6366} {"train_loss": -27.555694580078125, "global_step": 528393, "epoch": 6366} {"train_loss": -27.197187423706055, "global_step": 528394, "epoch": 6366} {"train_loss": -27.288293838500977, "global_step": 528395, "epoch": 6366} {"train_loss": -27.49457359313965, "global_step": 528396, "epoch": 6366} {"train_loss": -27.41712760925293, "global_step": 528397, "epoch": 6366} {"train_loss": -27.220184326171875, "global_step": 528398, "epoch": 6366} {"train_loss": -27.458276748657227, "global_step": 528399, "epoch": 6366} {"train_loss": -27.551162719726562, "global_step": 528400, "epoch": 6366} {"train_loss": -27.40987205505371, "global_step": 528401, "epoch": 6366} {"train_loss": -27.41908073425293, "global_step": 528402, "epoch": 6366} {"train_loss": -27.36664390563965, "global_step": 528403, "epoch": 6366} {"train_loss": -27.18842887878418, "global_step": 528404, "epoch": 6366} {"train_loss": -27.532001495361328, "global_step": 528405, "epoch": 6366} {"train_loss": -27.599660873413086, "global_step": 528406, "epoch": 6366} {"train_loss": -27.824207305908203, "global_step": 528407, "epoch": 6366} {"train_loss": -27.40497398376465, "global_step": 528408, "epoch": 6366} {"train_loss": -27.66786003112793, "global_step": 528409, "epoch": 6366} {"train_loss": -27.382184982299805, "global_step": 528410, "epoch": 6366} {"train_loss": -27.682233810424805, "global_step": 528411, "epoch": 6366} {"train_loss": -27.768091201782227, "global_step": 528412, "epoch": 6366} {"train_loss": -27.770111083984375, "global_step": 528413, "epoch": 6366} {"train_loss": -27.796894073486328, "global_step": 528414, "epoch": 6366} {"train_loss": -27.500701904296875, "global_step": 528415, "epoch": 6366} {"train_loss": -27.810815811157227, "global_step": 528416, "epoch": 6366} {"train_loss": -27.483295440673828, "global_step": 528417, "epoch": 6366} {"train_loss": -27.63275146484375, "global_step": 528418, "epoch": 6366} {"train_loss": -27.679834365844727, "global_step": 528419, "epoch": 6366} {"train_loss": -27.71796989440918, "global_step": 528420, "epoch": 6366} {"train_loss": -27.637048721313477, "global_step": 528421, "epoch": 6366} {"train_loss": -27.63862419128418, "global_step": 528422, "epoch": 6366} {"train_loss": -27.842365264892578, "global_step": 528423, "epoch": 6366} {"train_loss": -27.61798667907715, "global_step": 528424, "epoch": 6366} {"train_loss": -27.542383193969727, "global_step": 528425, "epoch": 6366} {"train_loss": -28.118762969970703, "global_step": 528426, "epoch": 6366} {"train_loss": -27.349607467651367, "global_step": 528427, "epoch": 6366} {"train_loss": -27.402631759643555, "global_step": 528428, "epoch": 6366} {"train_loss": -27.39533805847168, "global_step": 528429, "epoch": 6366} {"train_loss": -27.380878448486328, "global_step": 528430, "epoch": 6366} {"train_loss": -27.95087242126465, "global_step": 528431, "epoch": 6366} {"train_loss": -27.910974502563477, "global_step": 528432, "epoch": 6366} {"train_loss": -27.44803237915039, "global_step": 528433, "epoch": 6366} {"train_loss": -27.911319732666016, "global_step": 528434, "epoch": 6366} {"train_loss": -27.18099021911621, "global_step": 528435, "epoch": 6366} {"train_loss": -27.448627471923828, "global_step": 528436, "epoch": 6366} {"train_loss": -27.891860961914062, "global_step": 528437, "epoch": 6366} {"train_loss": -27.589359283447266, "global_step": 528438, "epoch": 6366} {"train_loss": -28.134246826171875, "global_step": 528439, "epoch": 6366} {"train_loss": -27.901830673217773, "global_step": 528440, "epoch": 6366} {"train_loss": -27.6490421295166, "global_step": 528441, "epoch": 6366} {"train_loss": -27.597631454467773, "global_step": 528442, "epoch": 6366} {"train_loss": -27.50965690612793, "global_step": 528443, "epoch": 6366} {"train_loss": -27.706052780151367, "global_step": 528444, "epoch": 6366} {"train_loss": -27.6044864654541, "global_step": 528445, "epoch": 6366} {"train_loss": -27.30503273010254, "global_step": 528446, "epoch": 6366} {"train_loss": -27.1262149810791, "global_step": 528447, "epoch": 6366} {"train_loss": -27.377735137939453, "global_step": 528448, "epoch": 6366} {"train_loss": -27.875768661499023, "global_step": 528449, "epoch": 6366} {"train_loss": -27.469161987304688, "global_step": 528450, "epoch": 6366} {"train_loss": -27.505523681640625, "global_step": 528451, "epoch": 6366} {"train_loss": -27.729602813720703, "global_step": 528452, "epoch": 6366} {"train_loss": -27.57935905456543, "global_step": 528453, "epoch": 6366} {"train_loss": -27.728281021118164, "global_step": 528454, "epoch": 6366} {"train_loss": -27.750478744506836, "global_step": 528455, "epoch": 6366} {"train_loss": -27.862272262573242, "global_step": 528456, "epoch": 6366} {"train_loss": -27.231103897094727, "global_step": 528457, "epoch": 6366} {"train_loss": -27.76460838317871, "global_step": 528458, "epoch": 6366} {"train_loss": -27.74696159362793, "global_step": 528459, "epoch": 6366} {"train_loss": -27.50954749785274, "global_step": 528460, "epoch": 6366, "val_loss": 6591399.0} {"train_loss": -27.54969596862793, "global_step": 528461, "epoch": 6367} {"train_loss": -27.1597957611084, "global_step": 528462, "epoch": 6367} {"train_loss": -27.368061065673828, "global_step": 528463, "epoch": 6367} {"train_loss": -27.055328369140625, "global_step": 528464, "epoch": 6367} {"train_loss": -27.306058883666992, "global_step": 528465, "epoch": 6367} {"train_loss": -27.2071533203125, "global_step": 528466, "epoch": 6367} {"train_loss": -27.066869735717773, "global_step": 528467, "epoch": 6367} {"train_loss": -27.061567306518555, "global_step": 528468, "epoch": 6367} {"train_loss": -27.323156356811523, "global_step": 528469, "epoch": 6367} {"train_loss": -27.353836059570312, "global_step": 528470, "epoch": 6367} {"train_loss": -27.580402374267578, "global_step": 528471, "epoch": 6367} {"train_loss": -27.394033432006836, "global_step": 528472, "epoch": 6367} {"train_loss": -27.457874298095703, "global_step": 528473, "epoch": 6367} {"train_loss": -27.328567504882812, "global_step": 528474, "epoch": 6367} {"train_loss": -27.574949264526367, "global_step": 528475, "epoch": 6367} {"train_loss": -27.637516021728516, "global_step": 528476, "epoch": 6367} {"train_loss": -27.3787841796875, "global_step": 528477, "epoch": 6367} {"train_loss": -27.77312660217285, "global_step": 528478, "epoch": 6367} {"train_loss": -27.49299430847168, "global_step": 528479, "epoch": 6367} {"train_loss": -27.537643432617188, "global_step": 528480, "epoch": 6367} {"train_loss": -27.141071319580078, "global_step": 528481, "epoch": 6367} {"train_loss": -27.57974624633789, "global_step": 528482, "epoch": 6367} {"train_loss": -27.970678329467773, "global_step": 528483, "epoch": 6367} {"train_loss": -27.421865463256836, "global_step": 528484, "epoch": 6367} {"train_loss": -27.69550132751465, "global_step": 528485, "epoch": 6367} {"train_loss": -27.59421157836914, "global_step": 528486, "epoch": 6367} {"train_loss": -27.354883193969727, "global_step": 528487, "epoch": 6367} {"train_loss": -27.4465389251709, "global_step": 528488, "epoch": 6367} {"train_loss": -27.59589958190918, "global_step": 528489, "epoch": 6367} {"train_loss": -27.907337188720703, "global_step": 528490, "epoch": 6367} {"train_loss": -27.69111442565918, "global_step": 528491, "epoch": 6367} {"train_loss": -27.8923397064209, "global_step": 528492, "epoch": 6367} {"train_loss": -27.8109188079834, "global_step": 528493, "epoch": 6367} {"train_loss": -27.77768325805664, "global_step": 528494, "epoch": 6367} {"train_loss": -28.05897331237793, "global_step": 528495, "epoch": 6367} {"train_loss": -27.859607696533203, "global_step": 528496, "epoch": 6367} {"train_loss": -27.45425796508789, "global_step": 528497, "epoch": 6367} {"train_loss": -28.038602828979492, "global_step": 528498, "epoch": 6367} {"train_loss": -27.886993408203125, "global_step": 528499, "epoch": 6367} {"train_loss": -27.77870750427246, "global_step": 528500, "epoch": 6367} {"train_loss": -28.212890625, "global_step": 528501, "epoch": 6367} {"train_loss": -27.991403579711914, "global_step": 528502, "epoch": 6367} {"train_loss": -27.639434814453125, "global_step": 528503, "epoch": 6367} {"train_loss": -27.831043243408203, "global_step": 528504, "epoch": 6367} {"train_loss": -27.708784103393555, "global_step": 528505, "epoch": 6367} {"train_loss": -27.693601608276367, "global_step": 528506, "epoch": 6367} {"train_loss": -27.41098976135254, "global_step": 528507, "epoch": 6367} {"train_loss": -27.867422103881836, "global_step": 528508, "epoch": 6367} {"train_loss": -27.899642944335938, "global_step": 528509, "epoch": 6367} {"train_loss": -28.107715606689453, "global_step": 528510, "epoch": 6367} {"train_loss": -27.5291748046875, "global_step": 528511, "epoch": 6367} {"train_loss": -27.75384521484375, "global_step": 528512, "epoch": 6367} {"train_loss": -28.096771240234375, "global_step": 528513, "epoch": 6367} {"train_loss": -27.609024047851562, "global_step": 528514, "epoch": 6367} {"train_loss": -27.601720809936523, "global_step": 528515, "epoch": 6367} {"train_loss": -27.446496963500977, "global_step": 528516, "epoch": 6367} {"train_loss": -27.568496704101562, "global_step": 528517, "epoch": 6367} {"train_loss": -27.295867919921875, "global_step": 528518, "epoch": 6367} {"train_loss": -27.236948013305664, "global_step": 528519, "epoch": 6367} {"train_loss": -26.375558853149414, "global_step": 528520, "epoch": 6367} {"train_loss": -28.163061141967773, "global_step": 528521, "epoch": 6367} {"train_loss": -26.819019317626953, "global_step": 528522, "epoch": 6367} {"train_loss": -27.41412353515625, "global_step": 528523, "epoch": 6367} {"train_loss": -27.275876998901367, "global_step": 528524, "epoch": 6367} {"train_loss": -27.287195205688477, "global_step": 528525, "epoch": 6367} {"train_loss": -27.0064754486084, "global_step": 528526, "epoch": 6367} {"train_loss": -27.573095321655273, "global_step": 528527, "epoch": 6367} {"train_loss": -27.67201805114746, "global_step": 528528, "epoch": 6367} {"train_loss": -27.34221839904785, "global_step": 528529, "epoch": 6367} {"train_loss": -27.42518424987793, "global_step": 528530, "epoch": 6367} {"train_loss": -27.137861251831055, "global_step": 528531, "epoch": 6367} {"train_loss": -27.181848526000977, "global_step": 528532, "epoch": 6367} {"train_loss": -27.8273868560791, "global_step": 528533, "epoch": 6367} {"train_loss": -27.53594970703125, "global_step": 528534, "epoch": 6367} {"train_loss": -27.239709854125977, "global_step": 528535, "epoch": 6367} {"train_loss": -27.177209854125977, "global_step": 528536, "epoch": 6367} {"train_loss": -27.612730026245117, "global_step": 528537, "epoch": 6367} {"train_loss": -27.638166427612305, "global_step": 528538, "epoch": 6367} {"train_loss": -26.9608097076416, "global_step": 528539, "epoch": 6367} {"train_loss": -27.280683517456055, "global_step": 528540, "epoch": 6367} {"train_loss": -27.66060447692871, "global_step": 528541, "epoch": 6367} {"train_loss": -27.31219482421875, "global_step": 528542, "epoch": 6367} {"train_loss": -27.530277803719763, "global_step": 528543, "epoch": 6367, "val_loss": 6571848.0} {"train_loss": -25.16594123840332, "global_step": 528544, "epoch": 6368} {"train_loss": -26.205472946166992, "global_step": 528545, "epoch": 6368} {"train_loss": -25.898975372314453, "global_step": 528546, "epoch": 6368} {"train_loss": -26.145456314086914, "global_step": 528547, "epoch": 6368} {"train_loss": -25.957645416259766, "global_step": 528548, "epoch": 6368} {"train_loss": -26.715978622436523, "global_step": 528549, "epoch": 6368} {"train_loss": -26.265155792236328, "global_step": 528550, "epoch": 6368} {"train_loss": -26.473819732666016, "global_step": 528551, "epoch": 6368} {"train_loss": -26.494598388671875, "global_step": 528552, "epoch": 6368} {"train_loss": -26.853179931640625, "global_step": 528553, "epoch": 6368} {"train_loss": -26.9123477935791, "global_step": 528554, "epoch": 6368} {"train_loss": -26.919601440429688, "global_step": 528555, "epoch": 6368} {"train_loss": -26.731369018554688, "global_step": 528556, "epoch": 6368} {"train_loss": -26.453367233276367, "global_step": 528557, "epoch": 6368} {"train_loss": -26.961408615112305, "global_step": 528558, "epoch": 6368} {"train_loss": -26.981603622436523, "global_step": 528559, "epoch": 6368} {"train_loss": -26.498401641845703, "global_step": 528560, "epoch": 6368} {"train_loss": -27.32514762878418, "global_step": 528561, "epoch": 6368} {"train_loss": -26.94016456604004, "global_step": 528562, "epoch": 6368} {"train_loss": -27.09659194946289, "global_step": 528563, "epoch": 6368} {"train_loss": -27.20517349243164, "global_step": 528564, "epoch": 6368} {"train_loss": -27.234699249267578, "global_step": 528565, "epoch": 6368} {"train_loss": -27.27448081970215, "global_step": 528566, "epoch": 6368} {"train_loss": -27.17911720275879, "global_step": 528567, "epoch": 6368} {"train_loss": -27.576017379760742, "global_step": 528568, "epoch": 6368} {"train_loss": -27.312549591064453, "global_step": 528569, "epoch": 6368} {"train_loss": -27.081119537353516, "global_step": 528570, "epoch": 6368} {"train_loss": -27.240039825439453, "global_step": 528571, "epoch": 6368} {"train_loss": -27.107397079467773, "global_step": 528572, "epoch": 6368} {"train_loss": -27.38055992126465, "global_step": 528573, "epoch": 6368} {"train_loss": -27.152128219604492, "global_step": 528574, "epoch": 6368} {"train_loss": -27.543432235717773, "global_step": 528575, "epoch": 6368} {"train_loss": -27.22578239440918, "global_step": 528576, "epoch": 6368} {"train_loss": -27.407262802124023, "global_step": 528577, "epoch": 6368} {"train_loss": -27.828266143798828, "global_step": 528578, "epoch": 6368} {"train_loss": -27.43585205078125, "global_step": 528579, "epoch": 6368} {"train_loss": -27.392868041992188, "global_step": 528580, "epoch": 6368} {"train_loss": -27.775121688842773, "global_step": 528581, "epoch": 6368} {"train_loss": -27.34384536743164, "global_step": 528582, "epoch": 6368} {"train_loss": -27.409503936767578, "global_step": 528583, "epoch": 6368} {"train_loss": -27.42164421081543, "global_step": 528584, "epoch": 6368} {"train_loss": -27.686939239501953, "global_step": 528585, "epoch": 6368} {"train_loss": -27.659887313842773, "global_step": 528586, "epoch": 6368} {"train_loss": -27.859296798706055, "global_step": 528587, "epoch": 6368} {"train_loss": -27.62167739868164, "global_step": 528588, "epoch": 6368} {"train_loss": -27.554370880126953, "global_step": 528589, "epoch": 6368} {"train_loss": -27.81342124938965, "global_step": 528590, "epoch": 6368} {"train_loss": -27.850971221923828, "global_step": 528591, "epoch": 6368} {"train_loss": -27.497533798217773, "global_step": 528592, "epoch": 6368} {"train_loss": -27.615753173828125, "global_step": 528593, "epoch": 6368} {"train_loss": -27.77325439453125, "global_step": 528594, "epoch": 6368} {"train_loss": -27.586694717407227, "global_step": 528595, "epoch": 6368} {"train_loss": -27.683279037475586, "global_step": 528596, "epoch": 6368} {"train_loss": -27.877573013305664, "global_step": 528597, "epoch": 6368} {"train_loss": -27.77345085144043, "global_step": 528598, "epoch": 6368} {"train_loss": -28.090696334838867, "global_step": 528599, "epoch": 6368} {"train_loss": -27.5770206451416, "global_step": 528600, "epoch": 6368} {"train_loss": -27.648853302001953, "global_step": 528601, "epoch": 6368} {"train_loss": -28.19684410095215, "global_step": 528602, "epoch": 6368} {"train_loss": -27.54730224609375, "global_step": 528603, "epoch": 6368} {"train_loss": -27.855371475219727, "global_step": 528604, "epoch": 6368} {"train_loss": -27.711278915405273, "global_step": 528605, "epoch": 6368} {"train_loss": -27.347646713256836, "global_step": 528606, "epoch": 6368} {"train_loss": -26.89776611328125, "global_step": 528607, "epoch": 6368} {"train_loss": -26.02418327331543, "global_step": 528608, "epoch": 6368} {"train_loss": -25.918310165405273, "global_step": 528609, "epoch": 6368} {"train_loss": -25.640216827392578, "global_step": 528610, "epoch": 6368} {"train_loss": -26.90399742126465, "global_step": 528611, "epoch": 6368} {"train_loss": -26.828140258789062, "global_step": 528612, "epoch": 6368} {"train_loss": -26.77251625061035, "global_step": 528613, "epoch": 6368} {"train_loss": -26.907384872436523, "global_step": 528614, "epoch": 6368} {"train_loss": -27.06795310974121, "global_step": 528615, "epoch": 6368} {"train_loss": -27.10206413269043, "global_step": 528616, "epoch": 6368} {"train_loss": -27.077228546142578, "global_step": 528617, "epoch": 6368} {"train_loss": -27.415943145751953, "global_step": 528618, "epoch": 6368} {"train_loss": -27.398176193237305, "global_step": 528619, "epoch": 6368} {"train_loss": -27.364093780517578, "global_step": 528620, "epoch": 6368} {"train_loss": -27.249176025390625, "global_step": 528621, "epoch": 6368} {"train_loss": -27.053266525268555, "global_step": 528622, "epoch": 6368} {"train_loss": -28.06595802307129, "global_step": 528623, "epoch": 6368} {"train_loss": -27.36359977722168, "global_step": 528624, "epoch": 6368} {"train_loss": -27.313581466674805, "global_step": 528625, "epoch": 6368} {"train_loss": -27.18303751658244, "global_step": 528626, "epoch": 6368, "val_loss": 6541613.0} {"train_loss": -26.88787841796875, "global_step": 528627, "epoch": 6369} {"train_loss": -27.135772705078125, "global_step": 528628, "epoch": 6369} {"train_loss": -27.102827072143555, "global_step": 528629, "epoch": 6369} {"train_loss": -27.412006378173828, "global_step": 528630, "epoch": 6369} {"train_loss": -27.278045654296875, "global_step": 528631, "epoch": 6369} {"train_loss": -27.608983993530273, "global_step": 528632, "epoch": 6369} {"train_loss": -27.007266998291016, "global_step": 528633, "epoch": 6369} {"train_loss": -27.519119262695312, "global_step": 528634, "epoch": 6369} {"train_loss": -27.564306259155273, "global_step": 528635, "epoch": 6369} {"train_loss": -27.228775024414062, "global_step": 528636, "epoch": 6369} {"train_loss": -27.02784538269043, "global_step": 528637, "epoch": 6369} {"train_loss": -27.01520347595215, "global_step": 528638, "epoch": 6369} {"train_loss": -27.020376205444336, "global_step": 528639, "epoch": 6369} {"train_loss": -27.263660430908203, "global_step": 528640, "epoch": 6369} {"train_loss": -27.153778076171875, "global_step": 528641, "epoch": 6369} {"train_loss": -27.426382064819336, "global_step": 528642, "epoch": 6369} {"train_loss": -27.212909698486328, "global_step": 528643, "epoch": 6369} {"train_loss": -27.592945098876953, "global_step": 528644, "epoch": 6369} {"train_loss": -27.6600341796875, "global_step": 528645, "epoch": 6369} {"train_loss": -26.922611236572266, "global_step": 528646, "epoch": 6369} {"train_loss": -27.55909538269043, "global_step": 528647, "epoch": 6369} {"train_loss": -27.800302505493164, "global_step": 528648, "epoch": 6369} {"train_loss": -27.43311882019043, "global_step": 528649, "epoch": 6369} {"train_loss": -27.42426109313965, "global_step": 528650, "epoch": 6369} {"train_loss": -27.57904624938965, "global_step": 528651, "epoch": 6369} {"train_loss": -27.971948623657227, "global_step": 528652, "epoch": 6369} {"train_loss": -27.75806999206543, "global_step": 528653, "epoch": 6369} {"train_loss": -27.644174575805664, "global_step": 528654, "epoch": 6369} {"train_loss": -27.699575424194336, "global_step": 528655, "epoch": 6369} {"train_loss": -27.27631950378418, "global_step": 528656, "epoch": 6369} {"train_loss": -27.632490158081055, "global_step": 528657, "epoch": 6369} {"train_loss": -28.018606185913086, "global_step": 528658, "epoch": 6369} {"train_loss": -27.861005783081055, "global_step": 528659, "epoch": 6369} {"train_loss": -27.654067993164062, "global_step": 528660, "epoch": 6369} {"train_loss": -27.754446029663086, "global_step": 528661, "epoch": 6369} {"train_loss": -27.530990600585938, "global_step": 528662, "epoch": 6369} {"train_loss": -28.0250301361084, "global_step": 528663, "epoch": 6369} {"train_loss": -27.697784423828125, "global_step": 528664, "epoch": 6369} {"train_loss": -27.904926300048828, "global_step": 528665, "epoch": 6369} {"train_loss": -27.957029342651367, "global_step": 528666, "epoch": 6369} {"train_loss": -27.650815963745117, "global_step": 528667, "epoch": 6369} {"train_loss": -27.775110244750977, "global_step": 528668, "epoch": 6369} {"train_loss": -27.46588134765625, "global_step": 528669, "epoch": 6369} {"train_loss": -27.618408203125, "global_step": 528670, "epoch": 6369} {"train_loss": -27.398849487304688, "global_step": 528671, "epoch": 6369} {"train_loss": -27.853246688842773, "global_step": 528672, "epoch": 6369} {"train_loss": -27.791982650756836, "global_step": 528673, "epoch": 6369} {"train_loss": -27.8485107421875, "global_step": 528674, "epoch": 6369} {"train_loss": -27.86753273010254, "global_step": 528675, "epoch": 6369} {"train_loss": -27.521894454956055, "global_step": 528676, "epoch": 6369} {"train_loss": -28.069456100463867, "global_step": 528677, "epoch": 6369} {"train_loss": -27.554426193237305, "global_step": 528678, "epoch": 6369} {"train_loss": -28.199798583984375, "global_step": 528679, "epoch": 6369} {"train_loss": -27.762500762939453, "global_step": 528680, "epoch": 6369} {"train_loss": -27.72772789001465, "global_step": 528681, "epoch": 6369} {"train_loss": -27.602155685424805, "global_step": 528682, "epoch": 6369} {"train_loss": -27.859882354736328, "global_step": 528683, "epoch": 6369} {"train_loss": -27.851001739501953, "global_step": 528684, "epoch": 6369} {"train_loss": -27.710229873657227, "global_step": 528685, "epoch": 6369} {"train_loss": -28.24407386779785, "global_step": 528686, "epoch": 6369} {"train_loss": -27.391584396362305, "global_step": 528687, "epoch": 6369} {"train_loss": -27.584997177124023, "global_step": 528688, "epoch": 6369} {"train_loss": -27.216596603393555, "global_step": 528689, "epoch": 6369} {"train_loss": -27.335834503173828, "global_step": 528690, "epoch": 6369} {"train_loss": -27.392654418945312, "global_step": 528691, "epoch": 6369} {"train_loss": -27.3675537109375, "global_step": 528692, "epoch": 6369} {"train_loss": -27.60957908630371, "global_step": 528693, "epoch": 6369} {"train_loss": -27.37384033203125, "global_step": 528694, "epoch": 6369} {"train_loss": -27.5906982421875, "global_step": 528695, "epoch": 6369} {"train_loss": -27.43440055847168, "global_step": 528696, "epoch": 6369} {"train_loss": -27.585866928100586, "global_step": 528697, "epoch": 6369} {"train_loss": -27.801483154296875, "global_step": 528698, "epoch": 6369} {"train_loss": -27.86268424987793, "global_step": 528699, "epoch": 6369} {"train_loss": -27.59174919128418, "global_step": 528700, "epoch": 6369} {"train_loss": -27.657474517822266, "global_step": 528701, "epoch": 6369} {"train_loss": -27.70686149597168, "global_step": 528702, "epoch": 6369} {"train_loss": -27.382892608642578, "global_step": 528703, "epoch": 6369} {"train_loss": -27.93548583984375, "global_step": 528704, "epoch": 6369} {"train_loss": -27.52727699279785, "global_step": 528705, "epoch": 6369} {"train_loss": -27.763538360595703, "global_step": 528706, "epoch": 6369} {"train_loss": -27.524839401245117, "global_step": 528707, "epoch": 6369} {"train_loss": -27.450504302978516, "global_step": 528708, "epoch": 6369} {"train_loss": -27.550451738288604, "global_step": 528709, "epoch": 6369, "val_loss": 6560626.5} {"train_loss": -26.5026912689209, "global_step": 528710, "epoch": 6370} {"train_loss": -25.921279907226562, "global_step": 528711, "epoch": 6370} {"train_loss": -25.71463394165039, "global_step": 528712, "epoch": 6370} {"train_loss": -25.159175872802734, "global_step": 528713, "epoch": 6370} {"train_loss": -25.923446655273438, "global_step": 528714, "epoch": 6370} {"train_loss": -26.498376846313477, "global_step": 528715, "epoch": 6370} {"train_loss": -25.554182052612305, "global_step": 528716, "epoch": 6370} {"train_loss": -26.226369857788086, "global_step": 528717, "epoch": 6370} {"train_loss": -26.76277732849121, "global_step": 528718, "epoch": 6370} {"train_loss": -26.765729904174805, "global_step": 528719, "epoch": 6370} {"train_loss": -27.11150550842285, "global_step": 528720, "epoch": 6370} {"train_loss": -26.6602725982666, "global_step": 528721, "epoch": 6370} {"train_loss": -27.159704208374023, "global_step": 528722, "epoch": 6370} {"train_loss": -26.973478317260742, "global_step": 528723, "epoch": 6370} {"train_loss": -26.81113052368164, "global_step": 528724, "epoch": 6370} {"train_loss": -26.95904541015625, "global_step": 528725, "epoch": 6370} {"train_loss": -26.36272621154785, "global_step": 528726, "epoch": 6370} {"train_loss": -27.58829116821289, "global_step": 528727, "epoch": 6370} {"train_loss": -26.635404586791992, "global_step": 528728, "epoch": 6370} {"train_loss": -26.63801383972168, "global_step": 528729, "epoch": 6370} {"train_loss": -27.033735275268555, "global_step": 528730, "epoch": 6370} {"train_loss": -27.016101837158203, "global_step": 528731, "epoch": 6370} {"train_loss": -26.738391876220703, "global_step": 528732, "epoch": 6370} {"train_loss": -27.0738582611084, "global_step": 528733, "epoch": 6370} {"train_loss": -26.963062286376953, "global_step": 528734, "epoch": 6370} {"train_loss": -27.00830078125, "global_step": 528735, "epoch": 6370} {"train_loss": -27.349750518798828, "global_step": 528736, "epoch": 6370} {"train_loss": -27.294660568237305, "global_step": 528737, "epoch": 6370} {"train_loss": -27.312108993530273, "global_step": 528738, "epoch": 6370} {"train_loss": -27.29499626159668, "global_step": 528739, "epoch": 6370} {"train_loss": -27.407012939453125, "global_step": 528740, "epoch": 6370} {"train_loss": -27.240848541259766, "global_step": 528741, "epoch": 6370} {"train_loss": -27.466049194335938, "global_step": 528742, "epoch": 6370} {"train_loss": -27.466354370117188, "global_step": 528743, "epoch": 6370} {"train_loss": -27.62245750427246, "global_step": 528744, "epoch": 6370} {"train_loss": -27.215612411499023, "global_step": 528745, "epoch": 6370} {"train_loss": -27.58308982849121, "global_step": 528746, "epoch": 6370} {"train_loss": -27.97437858581543, "global_step": 528747, "epoch": 6370} {"train_loss": -28.079254150390625, "global_step": 528748, "epoch": 6370} {"train_loss": -27.869108200073242, "global_step": 528749, "epoch": 6370} {"train_loss": -27.62579345703125, "global_step": 528750, "epoch": 6370} {"train_loss": -27.841064453125, "global_step": 528751, "epoch": 6370} {"train_loss": -27.61982536315918, "global_step": 528752, "epoch": 6370} {"train_loss": -27.978687286376953, "global_step": 528753, "epoch": 6370} {"train_loss": -28.124570846557617, "global_step": 528754, "epoch": 6370} {"train_loss": -27.718708038330078, "global_step": 528755, "epoch": 6370} {"train_loss": -27.802658081054688, "global_step": 528756, "epoch": 6370} {"train_loss": -27.460433959960938, "global_step": 528757, "epoch": 6370} {"train_loss": -27.308364868164062, "global_step": 528758, "epoch": 6370} {"train_loss": -27.231897354125977, "global_step": 528759, "epoch": 6370} {"train_loss": -27.715381622314453, "global_step": 528760, "epoch": 6370} {"train_loss": -27.836511611938477, "global_step": 528761, "epoch": 6370} {"train_loss": -27.96453285217285, "global_step": 528762, "epoch": 6370} {"train_loss": -27.765766143798828, "global_step": 528763, "epoch": 6370} {"train_loss": -27.927099227905273, "global_step": 528764, "epoch": 6370} {"train_loss": -27.667810440063477, "global_step": 528765, "epoch": 6370} {"train_loss": -27.8038387298584, "global_step": 528766, "epoch": 6370} {"train_loss": -27.661148071289062, "global_step": 528767, "epoch": 6370} {"train_loss": -27.81593132019043, "global_step": 528768, "epoch": 6370} {"train_loss": -27.492090225219727, "global_step": 528769, "epoch": 6370} {"train_loss": -28.17032814025879, "global_step": 528770, "epoch": 6370} {"train_loss": -27.7089786529541, "global_step": 528771, "epoch": 6370} {"train_loss": -27.718420028686523, "global_step": 528772, "epoch": 6370} {"train_loss": -27.851428985595703, "global_step": 528773, "epoch": 6370} {"train_loss": -27.66196060180664, "global_step": 528774, "epoch": 6370} {"train_loss": -27.786945343017578, "global_step": 528775, "epoch": 6370} {"train_loss": -27.751483917236328, "global_step": 528776, "epoch": 6370} {"train_loss": -27.64472770690918, "global_step": 528777, "epoch": 6370} {"train_loss": -27.813871383666992, "global_step": 528778, "epoch": 6370} {"train_loss": -27.968503952026367, "global_step": 528779, "epoch": 6370} {"train_loss": -27.714033126831055, "global_step": 528780, "epoch": 6370} {"train_loss": -27.837209701538086, "global_step": 528781, "epoch": 6370} {"train_loss": -27.8772029876709, "global_step": 528782, "epoch": 6370} {"train_loss": -27.695459365844727, "global_step": 528783, "epoch": 6370} {"train_loss": -27.455469131469727, "global_step": 528784, "epoch": 6370} {"train_loss": -27.565988540649414, "global_step": 528785, "epoch": 6370} {"train_loss": -28.09771156311035, "global_step": 528786, "epoch": 6370} {"train_loss": -27.757099151611328, "global_step": 528787, "epoch": 6370} {"train_loss": -27.783475875854492, "global_step": 528788, "epoch": 6370} {"train_loss": -27.64141273498535, "global_step": 528789, "epoch": 6370} {"train_loss": -27.849475860595703, "global_step": 528790, "epoch": 6370} {"train_loss": -27.680694580078125, "global_step": 528791, "epoch": 6370} {"train_loss": -27.356597440788544, "global_step": 528792, "epoch": 6370, "val_loss": 6605125.5} {"train_loss": -27.365249633789062, "global_step": 528793, "epoch": 6371} {"train_loss": -27.263446807861328, "global_step": 528794, "epoch": 6371} {"train_loss": -27.050146102905273, "global_step": 528795, "epoch": 6371} {"train_loss": -27.28472900390625, "global_step": 528796, "epoch": 6371} {"train_loss": -27.095129013061523, "global_step": 528797, "epoch": 6371} {"train_loss": -26.814661026000977, "global_step": 528798, "epoch": 6371} {"train_loss": -26.541156768798828, "global_step": 528799, "epoch": 6371} {"train_loss": -26.38443946838379, "global_step": 528800, "epoch": 6371} {"train_loss": -26.761371612548828, "global_step": 528801, "epoch": 6371} {"train_loss": -27.55157470703125, "global_step": 528802, "epoch": 6371} {"train_loss": -27.143640518188477, "global_step": 528803, "epoch": 6371} {"train_loss": -26.810626983642578, "global_step": 528804, "epoch": 6371} {"train_loss": -27.167776107788086, "global_step": 528805, "epoch": 6371} {"train_loss": -26.93794059753418, "global_step": 528806, "epoch": 6371} {"train_loss": -27.35580825805664, "global_step": 528807, "epoch": 6371} {"train_loss": -27.739133834838867, "global_step": 528808, "epoch": 6371} {"train_loss": -27.018590927124023, "global_step": 528809, "epoch": 6371} {"train_loss": -27.099470138549805, "global_step": 528810, "epoch": 6371} {"train_loss": -27.35009765625, "global_step": 528811, "epoch": 6371} {"train_loss": -27.230085372924805, "global_step": 528812, "epoch": 6371} {"train_loss": -27.380966186523438, "global_step": 528813, "epoch": 6371} {"train_loss": -27.107213973999023, "global_step": 528814, "epoch": 6371} {"train_loss": -27.353208541870117, "global_step": 528815, "epoch": 6371} {"train_loss": -27.674457550048828, "global_step": 528816, "epoch": 6371} {"train_loss": -27.4635009765625, "global_step": 528817, "epoch": 6371} {"train_loss": -27.149627685546875, "global_step": 528818, "epoch": 6371} {"train_loss": -27.66713523864746, "global_step": 528819, "epoch": 6371} {"train_loss": -26.874408721923828, "global_step": 528820, "epoch": 6371} {"train_loss": -27.37639808654785, "global_step": 528821, "epoch": 6371} {"train_loss": -27.604223251342773, "global_step": 528822, "epoch": 6371} {"train_loss": -27.61054039001465, "global_step": 528823, "epoch": 6371} {"train_loss": -27.00467300415039, "global_step": 528824, "epoch": 6371} {"train_loss": -27.187707901000977, "global_step": 528825, "epoch": 6371} {"train_loss": -27.48427391052246, "global_step": 528826, "epoch": 6371} {"train_loss": -27.36773681640625, "global_step": 528827, "epoch": 6371} {"train_loss": -27.37652587890625, "global_step": 528828, "epoch": 6371} {"train_loss": -27.650415420532227, "global_step": 528829, "epoch": 6371} {"train_loss": -27.491851806640625, "global_step": 528830, "epoch": 6371} {"train_loss": -27.675128936767578, "global_step": 528831, "epoch": 6371} {"train_loss": -27.326322555541992, "global_step": 528832, "epoch": 6371} {"train_loss": -27.76692008972168, "global_step": 528833, "epoch": 6371} {"train_loss": -27.56159782409668, "global_step": 528834, "epoch": 6371} {"train_loss": -27.624164581298828, "global_step": 528835, "epoch": 6371} {"train_loss": -27.569746017456055, "global_step": 528836, "epoch": 6371} {"train_loss": -27.796375274658203, "global_step": 528837, "epoch": 6371} {"train_loss": -27.516843795776367, "global_step": 528838, "epoch": 6371} {"train_loss": -27.959674835205078, "global_step": 528839, "epoch": 6371} {"train_loss": -27.615041732788086, "global_step": 528840, "epoch": 6371} {"train_loss": -27.629749298095703, "global_step": 528841, "epoch": 6371} {"train_loss": -27.911413192749023, "global_step": 528842, "epoch": 6371} {"train_loss": -27.573816299438477, "global_step": 528843, "epoch": 6371} {"train_loss": -28.064451217651367, "global_step": 528844, "epoch": 6371} {"train_loss": -27.661853790283203, "global_step": 528845, "epoch": 6371} {"train_loss": -27.666534423828125, "global_step": 528846, "epoch": 6371} {"train_loss": -27.854663848876953, "global_step": 528847, "epoch": 6371} {"train_loss": -27.658828735351562, "global_step": 528848, "epoch": 6371} {"train_loss": -27.884531021118164, "global_step": 528849, "epoch": 6371} {"train_loss": -27.7491455078125, "global_step": 528850, "epoch": 6371} {"train_loss": -27.723363876342773, "global_step": 528851, "epoch": 6371} {"train_loss": -28.092670440673828, "global_step": 528852, "epoch": 6371} {"train_loss": -27.98691749572754, "global_step": 528853, "epoch": 6371} {"train_loss": -27.980316162109375, "global_step": 528854, "epoch": 6371} {"train_loss": -27.728010177612305, "global_step": 528855, "epoch": 6371} {"train_loss": -27.91472816467285, "global_step": 528856, "epoch": 6371} {"train_loss": -28.332807540893555, "global_step": 528857, "epoch": 6371} {"train_loss": -27.705678939819336, "global_step": 528858, "epoch": 6371} {"train_loss": -27.62222671508789, "global_step": 528859, "epoch": 6371} {"train_loss": -27.905628204345703, "global_step": 528860, "epoch": 6371} {"train_loss": -27.66724967956543, "global_step": 528861, "epoch": 6371} {"train_loss": -27.4840030670166, "global_step": 528862, "epoch": 6371} {"train_loss": -27.87607765197754, "global_step": 528863, "epoch": 6371} {"train_loss": -27.603479385375977, "global_step": 528864, "epoch": 6371} {"train_loss": -28.155588150024414, "global_step": 528865, "epoch": 6371} {"train_loss": -28.024826049804688, "global_step": 528866, "epoch": 6371} {"train_loss": -27.74293327331543, "global_step": 528867, "epoch": 6371} {"train_loss": -27.824359893798828, "global_step": 528868, "epoch": 6371} {"train_loss": -27.66192626953125, "global_step": 528869, "epoch": 6371} {"train_loss": -27.4255428314209, "global_step": 528870, "epoch": 6371} {"train_loss": -27.055505752563477, "global_step": 528871, "epoch": 6371} {"train_loss": -27.304357528686523, "global_step": 528872, "epoch": 6371} {"train_loss": -27.56709098815918, "global_step": 528873, "epoch": 6371} {"train_loss": -28.014917373657227, "global_step": 528874, "epoch": 6371} {"train_loss": -27.496060061167523, "global_step": 528875, "epoch": 6371, "val_loss": 6627168.0} {"train_loss": -27.311920166015625, "global_step": 528876, "epoch": 6372} {"train_loss": -27.06122398376465, "global_step": 528877, "epoch": 6372} {"train_loss": -26.391958236694336, "global_step": 528878, "epoch": 6372} {"train_loss": -25.33282470703125, "global_step": 528879, "epoch": 6372} {"train_loss": -24.75041961669922, "global_step": 528880, "epoch": 6372} {"train_loss": -26.551382064819336, "global_step": 528881, "epoch": 6372} {"train_loss": -27.4550838470459, "global_step": 528882, "epoch": 6372} {"train_loss": -26.523834228515625, "global_step": 528883, "epoch": 6372} {"train_loss": -26.772626876831055, "global_step": 528884, "epoch": 6372} {"train_loss": -26.615442276000977, "global_step": 528885, "epoch": 6372} {"train_loss": -26.962141036987305, "global_step": 528886, "epoch": 6372} {"train_loss": -26.40521240234375, "global_step": 528887, "epoch": 6372} {"train_loss": -27.06351089477539, "global_step": 528888, "epoch": 6372} {"train_loss": -27.11728286743164, "global_step": 528889, "epoch": 6372} {"train_loss": -26.882278442382812, "global_step": 528890, "epoch": 6372} {"train_loss": -27.085357666015625, "global_step": 528891, "epoch": 6372} {"train_loss": -26.825239181518555, "global_step": 528892, "epoch": 6372} {"train_loss": -27.422475814819336, "global_step": 528893, "epoch": 6372} {"train_loss": -26.814472198486328, "global_step": 528894, "epoch": 6372} {"train_loss": -26.982603073120117, "global_step": 528895, "epoch": 6372} {"train_loss": -27.219701766967773, "global_step": 528896, "epoch": 6372} {"train_loss": -27.572580337524414, "global_step": 528897, "epoch": 6372} {"train_loss": -27.508508682250977, "global_step": 528898, "epoch": 6372} {"train_loss": -27.658435821533203, "global_step": 528899, "epoch": 6372} {"train_loss": -27.106098175048828, "global_step": 528900, "epoch": 6372} {"train_loss": -27.417877197265625, "global_step": 528901, "epoch": 6372} {"train_loss": -27.565397262573242, "global_step": 528902, "epoch": 6372} {"train_loss": -27.326236724853516, "global_step": 528903, "epoch": 6372} {"train_loss": -27.215784072875977, "global_step": 528904, "epoch": 6372} {"train_loss": -27.612592697143555, "global_step": 528905, "epoch": 6372} {"train_loss": -27.57134437561035, "global_step": 528906, "epoch": 6372} {"train_loss": -27.450597763061523, "global_step": 528907, "epoch": 6372} {"train_loss": -27.540969848632812, "global_step": 528908, "epoch": 6372} {"train_loss": -27.783361434936523, "global_step": 528909, "epoch": 6372} {"train_loss": -27.59091567993164, "global_step": 528910, "epoch": 6372} {"train_loss": -27.80686378479004, "global_step": 528911, "epoch": 6372} {"train_loss": -27.558454513549805, "global_step": 528912, "epoch": 6372} {"train_loss": -27.63172721862793, "global_step": 528913, "epoch": 6372} {"train_loss": -27.808429718017578, "global_step": 528914, "epoch": 6372} {"train_loss": -27.871313095092773, "global_step": 528915, "epoch": 6372} {"train_loss": -27.805450439453125, "global_step": 528916, "epoch": 6372} {"train_loss": -27.90109634399414, "global_step": 528917, "epoch": 6372} {"train_loss": -27.812536239624023, "global_step": 528918, "epoch": 6372} {"train_loss": -27.737302780151367, "global_step": 528919, "epoch": 6372} {"train_loss": -27.57370376586914, "global_step": 528920, "epoch": 6372} {"train_loss": -27.80153465270996, "global_step": 528921, "epoch": 6372} {"train_loss": -27.87470054626465, "global_step": 528922, "epoch": 6372} {"train_loss": -27.86775779724121, "global_step": 528923, "epoch": 6372} {"train_loss": -27.38690757751465, "global_step": 528924, "epoch": 6372} {"train_loss": -27.999662399291992, "global_step": 528925, "epoch": 6372} {"train_loss": -27.97800064086914, "global_step": 528926, "epoch": 6372} {"train_loss": -27.628803253173828, "global_step": 528927, "epoch": 6372} {"train_loss": -27.6768798828125, "global_step": 528928, "epoch": 6372} {"train_loss": -27.991464614868164, "global_step": 528929, "epoch": 6372} {"train_loss": -28.051237106323242, "global_step": 528930, "epoch": 6372} {"train_loss": -27.953510284423828, "global_step": 528931, "epoch": 6372} {"train_loss": -27.73467445373535, "global_step": 528932, "epoch": 6372} {"train_loss": -27.691822052001953, "global_step": 528933, "epoch": 6372} {"train_loss": -26.817529678344727, "global_step": 528934, "epoch": 6372} {"train_loss": -27.39396095275879, "global_step": 528935, "epoch": 6372} {"train_loss": -27.299148559570312, "global_step": 528936, "epoch": 6372} {"train_loss": -27.689899444580078, "global_step": 528937, "epoch": 6372} {"train_loss": -27.500226974487305, "global_step": 528938, "epoch": 6372} {"train_loss": -27.10186767578125, "global_step": 528939, "epoch": 6372} {"train_loss": -27.47235679626465, "global_step": 528940, "epoch": 6372} {"train_loss": -27.282516479492188, "global_step": 528941, "epoch": 6372} {"train_loss": -27.752893447875977, "global_step": 528942, "epoch": 6372} {"train_loss": -27.490436553955078, "global_step": 528943, "epoch": 6372} {"train_loss": -27.355466842651367, "global_step": 528944, "epoch": 6372} {"train_loss": -27.003156661987305, "global_step": 528945, "epoch": 6372} {"train_loss": -26.944549560546875, "global_step": 528946, "epoch": 6372} {"train_loss": -27.66326904296875, "global_step": 528947, "epoch": 6372} {"train_loss": -27.851343154907227, "global_step": 528948, "epoch": 6372} {"train_loss": -27.728851318359375, "global_step": 528949, "epoch": 6372} {"train_loss": -27.24172019958496, "global_step": 528950, "epoch": 6372} {"train_loss": -27.27203941345215, "global_step": 528951, "epoch": 6372} {"train_loss": -27.345428466796875, "global_step": 528952, "epoch": 6372} {"train_loss": -27.507205963134766, "global_step": 528953, "epoch": 6372} {"train_loss": -27.967111587524414, "global_step": 528954, "epoch": 6372} {"train_loss": -27.703521728515625, "global_step": 528955, "epoch": 6372} {"train_loss": -27.4717960357666, "global_step": 528956, "epoch": 6372} {"train_loss": -27.5797119140625, "global_step": 528957, "epoch": 6372} {"train_loss": -27.359914205160486, "global_step": 528958, "epoch": 6372, "val_loss": 6622283.5} {"train_loss": -27.096113204956055, "global_step": 528959, "epoch": 6373} {"train_loss": -25.140727996826172, "global_step": 528960, "epoch": 6373} {"train_loss": -27.36821937561035, "global_step": 528961, "epoch": 6373} {"train_loss": -26.569849014282227, "global_step": 528962, "epoch": 6373} {"train_loss": -26.925317764282227, "global_step": 528963, "epoch": 6373} {"train_loss": -26.701040267944336, "global_step": 528964, "epoch": 6373} {"train_loss": -26.59441566467285, "global_step": 528965, "epoch": 6373} {"train_loss": -26.304845809936523, "global_step": 528966, "epoch": 6373} {"train_loss": -26.687286376953125, "global_step": 528967, "epoch": 6373} {"train_loss": -27.388845443725586, "global_step": 528968, "epoch": 6373} {"train_loss": -27.033203125, "global_step": 528969, "epoch": 6373} {"train_loss": -27.2515811920166, "global_step": 528970, "epoch": 6373} {"train_loss": -27.162160873413086, "global_step": 528971, "epoch": 6373} {"train_loss": -26.95716667175293, "global_step": 528972, "epoch": 6373} {"train_loss": -27.359561920166016, "global_step": 528973, "epoch": 6373} {"train_loss": -27.152536392211914, "global_step": 528974, "epoch": 6373} {"train_loss": -27.26917839050293, "global_step": 528975, "epoch": 6373} {"train_loss": -27.692657470703125, "global_step": 528976, "epoch": 6373} {"train_loss": -27.480228424072266, "global_step": 528977, "epoch": 6373} {"train_loss": -27.44635581970215, "global_step": 528978, "epoch": 6373} {"train_loss": -27.360000610351562, "global_step": 528979, "epoch": 6373} {"train_loss": -27.555133819580078, "global_step": 528980, "epoch": 6373} {"train_loss": -27.164020538330078, "global_step": 528981, "epoch": 6373} {"train_loss": -27.63521385192871, "global_step": 528982, "epoch": 6373} {"train_loss": -27.430957794189453, "global_step": 528983, "epoch": 6373} {"train_loss": -27.279443740844727, "global_step": 528984, "epoch": 6373} {"train_loss": -27.131616592407227, "global_step": 528985, "epoch": 6373} {"train_loss": -27.0899715423584, "global_step": 528986, "epoch": 6373} {"train_loss": -27.454198837280273, "global_step": 528987, "epoch": 6373} {"train_loss": -27.3313045501709, "global_step": 528988, "epoch": 6373} {"train_loss": -27.62312126159668, "global_step": 528989, "epoch": 6373} {"train_loss": -27.6228084564209, "global_step": 528990, "epoch": 6373} {"train_loss": -27.428237915039062, "global_step": 528991, "epoch": 6373} {"train_loss": -27.5657958984375, "global_step": 528992, "epoch": 6373} {"train_loss": -27.7545166015625, "global_step": 528993, "epoch": 6373} {"train_loss": -27.617145538330078, "global_step": 528994, "epoch": 6373} {"train_loss": -27.45000648498535, "global_step": 528995, "epoch": 6373} {"train_loss": -27.9829044342041, "global_step": 528996, "epoch": 6373} {"train_loss": -27.6113338470459, "global_step": 528997, "epoch": 6373} {"train_loss": -27.709503173828125, "global_step": 528998, "epoch": 6373} {"train_loss": -27.845449447631836, "global_step": 528999, "epoch": 6373} {"train_loss": -27.707321166992188, "global_step": 529000, "epoch": 6373} {"train_loss": -27.547422409057617, "global_step": 529001, "epoch": 6373} {"train_loss": -27.080350875854492, "global_step": 529002, "epoch": 6373} {"train_loss": -27.56216812133789, "global_step": 529003, "epoch": 6373} {"train_loss": -27.46619987487793, "global_step": 529004, "epoch": 6373} {"train_loss": -27.402484893798828, "global_step": 529005, "epoch": 6373} {"train_loss": -27.640735626220703, "global_step": 529006, "epoch": 6373} {"train_loss": -27.518238067626953, "global_step": 529007, "epoch": 6373} {"train_loss": -27.442480087280273, "global_step": 529008, "epoch": 6373} {"train_loss": -27.241559982299805, "global_step": 529009, "epoch": 6373} {"train_loss": -27.807723999023438, "global_step": 529010, "epoch": 6373} {"train_loss": -27.478546142578125, "global_step": 529011, "epoch": 6373} {"train_loss": -27.7120361328125, "global_step": 529012, "epoch": 6373} {"train_loss": -27.875598907470703, "global_step": 529013, "epoch": 6373} {"train_loss": -27.29841423034668, "global_step": 529014, "epoch": 6373} {"train_loss": -27.593128204345703, "global_step": 529015, "epoch": 6373} {"train_loss": -27.961841583251953, "global_step": 529016, "epoch": 6373} {"train_loss": -27.756591796875, "global_step": 529017, "epoch": 6373} {"train_loss": -27.758962631225586, "global_step": 529018, "epoch": 6373} {"train_loss": -27.426488876342773, "global_step": 529019, "epoch": 6373} {"train_loss": -28.041528701782227, "global_step": 529020, "epoch": 6373} {"train_loss": -27.81678581237793, "global_step": 529021, "epoch": 6373} {"train_loss": -27.65610122680664, "global_step": 529022, "epoch": 6373} {"train_loss": -27.695331573486328, "global_step": 529023, "epoch": 6373} {"train_loss": -27.351415634155273, "global_step": 529024, "epoch": 6373} {"train_loss": -28.187753677368164, "global_step": 529025, "epoch": 6373} {"train_loss": -28.04864501953125, "global_step": 529026, "epoch": 6373} {"train_loss": -27.61233901977539, "global_step": 529027, "epoch": 6373} {"train_loss": -28.10102653503418, "global_step": 529028, "epoch": 6373} {"train_loss": -27.208852767944336, "global_step": 529029, "epoch": 6373} {"train_loss": -27.5555419921875, "global_step": 529030, "epoch": 6373} {"train_loss": -27.8234920501709, "global_step": 529031, "epoch": 6373} {"train_loss": -27.257055282592773, "global_step": 529032, "epoch": 6373} {"train_loss": -27.228290557861328, "global_step": 529033, "epoch": 6373} {"train_loss": -27.20000648498535, "global_step": 529034, "epoch": 6373} {"train_loss": -27.707305908203125, "global_step": 529035, "epoch": 6373} {"train_loss": -27.485004425048828, "global_step": 529036, "epoch": 6373} {"train_loss": -26.69815444946289, "global_step": 529037, "epoch": 6373} {"train_loss": -27.4823055267334, "global_step": 529038, "epoch": 6373} {"train_loss": -27.395902633666992, "global_step": 529039, "epoch": 6373} {"train_loss": -27.360212326049805, "global_step": 529040, "epoch": 6373} {"train_loss": -27.423168435154192, "global_step": 529041, "epoch": 6373, "val_loss": 6625434.5} {"train_loss": -26.88654899597168, "global_step": 529042, "epoch": 6374} {"train_loss": -26.825531005859375, "global_step": 529043, "epoch": 6374} {"train_loss": -27.097564697265625, "global_step": 529044, "epoch": 6374} {"train_loss": -27.08349609375, "global_step": 529045, "epoch": 6374} {"train_loss": -26.876611709594727, "global_step": 529046, "epoch": 6374} {"train_loss": -26.923986434936523, "global_step": 529047, "epoch": 6374} {"train_loss": -27.385900497436523, "global_step": 529048, "epoch": 6374} {"train_loss": -27.392866134643555, "global_step": 529049, "epoch": 6374} {"train_loss": -27.25823402404785, "global_step": 529050, "epoch": 6374} {"train_loss": -27.22141456604004, "global_step": 529051, "epoch": 6374} {"train_loss": -27.312824249267578, "global_step": 529052, "epoch": 6374} {"train_loss": -27.22882080078125, "global_step": 529053, "epoch": 6374} {"train_loss": -27.14801025390625, "global_step": 529054, "epoch": 6374} {"train_loss": -27.165008544921875, "global_step": 529055, "epoch": 6374} {"train_loss": -27.397979736328125, "global_step": 529056, "epoch": 6374} {"train_loss": -27.239614486694336, "global_step": 529057, "epoch": 6374} {"train_loss": -27.36250114440918, "global_step": 529058, "epoch": 6374} {"train_loss": -27.136096954345703, "global_step": 529059, "epoch": 6374} {"train_loss": -27.63995361328125, "global_step": 529060, "epoch": 6374} {"train_loss": -27.409692764282227, "global_step": 529061, "epoch": 6374} {"train_loss": -27.37200355529785, "global_step": 529062, "epoch": 6374} {"train_loss": -27.085432052612305, "global_step": 529063, "epoch": 6374} {"train_loss": -26.831064224243164, "global_step": 529064, "epoch": 6374} {"train_loss": -27.535898208618164, "global_step": 529065, "epoch": 6374} {"train_loss": -27.62092399597168, "global_step": 529066, "epoch": 6374} {"train_loss": -27.51851463317871, "global_step": 529067, "epoch": 6374} {"train_loss": -27.631885528564453, "global_step": 529068, "epoch": 6374} {"train_loss": -27.806568145751953, "global_step": 529069, "epoch": 6374} {"train_loss": -27.499866485595703, "global_step": 529070, "epoch": 6374} {"train_loss": -27.535261154174805, "global_step": 529071, "epoch": 6374} {"train_loss": -27.5865421295166, "global_step": 529072, "epoch": 6374} {"train_loss": -27.544843673706055, "global_step": 529073, "epoch": 6374} {"train_loss": -27.508630752563477, "global_step": 529074, "epoch": 6374} {"train_loss": -27.707019805908203, "global_step": 529075, "epoch": 6374} {"train_loss": -27.67738914489746, "global_step": 529076, "epoch": 6374} {"train_loss": -27.57733726501465, "global_step": 529077, "epoch": 6374} {"train_loss": -27.6152400970459, "global_step": 529078, "epoch": 6374} {"train_loss": -27.57362174987793, "global_step": 529079, "epoch": 6374} {"train_loss": -27.66653823852539, "global_step": 529080, "epoch": 6374} {"train_loss": -27.781625747680664, "global_step": 529081, "epoch": 6374} {"train_loss": -27.763748168945312, "global_step": 529082, "epoch": 6374} {"train_loss": -28.170623779296875, "global_step": 529083, "epoch": 6374} {"train_loss": -27.744037628173828, "global_step": 529084, "epoch": 6374} {"train_loss": -27.87604331970215, "global_step": 529085, "epoch": 6374} {"train_loss": -28.034595489501953, "global_step": 529086, "epoch": 6374} {"train_loss": -27.5521240234375, "global_step": 529087, "epoch": 6374} {"train_loss": -27.819345474243164, "global_step": 529088, "epoch": 6374} {"train_loss": -27.846532821655273, "global_step": 529089, "epoch": 6374} {"train_loss": -27.6901912689209, "global_step": 529090, "epoch": 6374} {"train_loss": -27.956281661987305, "global_step": 529091, "epoch": 6374} {"train_loss": -27.971881866455078, "global_step": 529092, "epoch": 6374} {"train_loss": -27.88714027404785, "global_step": 529093, "epoch": 6374} {"train_loss": -27.587987899780273, "global_step": 529094, "epoch": 6374} {"train_loss": -27.59943962097168, "global_step": 529095, "epoch": 6374} {"train_loss": -27.521411895751953, "global_step": 529096, "epoch": 6374} {"train_loss": -27.3780574798584, "global_step": 529097, "epoch": 6374} {"train_loss": -27.593610763549805, "global_step": 529098, "epoch": 6374} {"train_loss": -27.73988151550293, "global_step": 529099, "epoch": 6374} {"train_loss": -27.378772735595703, "global_step": 529100, "epoch": 6374} {"train_loss": -27.5721435546875, "global_step": 529101, "epoch": 6374} {"train_loss": -27.660938262939453, "global_step": 529102, "epoch": 6374} {"train_loss": -27.73963737487793, "global_step": 529103, "epoch": 6374} {"train_loss": -28.101476669311523, "global_step": 529104, "epoch": 6374} {"train_loss": -28.14754295349121, "global_step": 529105, "epoch": 6374} {"train_loss": -27.730005264282227, "global_step": 529106, "epoch": 6374} {"train_loss": -28.024845123291016, "global_step": 529107, "epoch": 6374} {"train_loss": -27.36689567565918, "global_step": 529108, "epoch": 6374} {"train_loss": -27.7096004486084, "global_step": 529109, "epoch": 6374} {"train_loss": -27.721487045288086, "global_step": 529110, "epoch": 6374} {"train_loss": -27.554914474487305, "global_step": 529111, "epoch": 6374} {"train_loss": -27.389501571655273, "global_step": 529112, "epoch": 6374} {"train_loss": -27.388254165649414, "global_step": 529113, "epoch": 6374} {"train_loss": -27.43470573425293, "global_step": 529114, "epoch": 6374} {"train_loss": -27.404312133789062, "global_step": 529115, "epoch": 6374} {"train_loss": -27.825353622436523, "global_step": 529116, "epoch": 6374} {"train_loss": -27.825607299804688, "global_step": 529117, "epoch": 6374} {"train_loss": -27.468826293945312, "global_step": 529118, "epoch": 6374} {"train_loss": -27.871902465820312, "global_step": 529119, "epoch": 6374} {"train_loss": -27.468555450439453, "global_step": 529120, "epoch": 6374} {"train_loss": -27.696439743041992, "global_step": 529121, "epoch": 6374} {"train_loss": -27.46087646484375, "global_step": 529122, "epoch": 6374} {"train_loss": -27.460126876831055, "global_step": 529123, "epoch": 6374} {"train_loss": -27.53177226882383, "global_step": 529124, "epoch": 6374, "val_loss": 6626823.0} {"train_loss": -27.33675193786621, "global_step": 529125, "epoch": 6375} {"train_loss": -25.687671661376953, "global_step": 529126, "epoch": 6375} {"train_loss": -25.444522857666016, "global_step": 529127, "epoch": 6375} {"train_loss": -26.787628173828125, "global_step": 529128, "epoch": 6375} {"train_loss": -26.939472198486328, "global_step": 529129, "epoch": 6375} {"train_loss": -26.179052352905273, "global_step": 529130, "epoch": 6375} {"train_loss": -26.935760498046875, "global_step": 529131, "epoch": 6375} {"train_loss": -26.917776107788086, "global_step": 529132, "epoch": 6375} {"train_loss": -26.979711532592773, "global_step": 529133, "epoch": 6375} {"train_loss": -26.789560317993164, "global_step": 529134, "epoch": 6375} {"train_loss": -27.006027221679688, "global_step": 529135, "epoch": 6375} {"train_loss": -26.903364181518555, "global_step": 529136, "epoch": 6375} {"train_loss": -27.137191772460938, "global_step": 529137, "epoch": 6375} {"train_loss": -27.057682037353516, "global_step": 529138, "epoch": 6375} {"train_loss": -26.561498641967773, "global_step": 529139, "epoch": 6375} {"train_loss": -27.040525436401367, "global_step": 529140, "epoch": 6375} {"train_loss": -27.458393096923828, "global_step": 529141, "epoch": 6375} {"train_loss": -27.09867286682129, "global_step": 529142, "epoch": 6375} {"train_loss": -27.21851921081543, "global_step": 529143, "epoch": 6375} {"train_loss": -27.4384708404541, "global_step": 529144, "epoch": 6375} {"train_loss": -27.58460807800293, "global_step": 529145, "epoch": 6375} {"train_loss": -27.216419219970703, "global_step": 529146, "epoch": 6375} {"train_loss": -27.314741134643555, "global_step": 529147, "epoch": 6375} {"train_loss": -27.339752197265625, "global_step": 529148, "epoch": 6375} {"train_loss": -27.211084365844727, "global_step": 529149, "epoch": 6375} {"train_loss": -27.391477584838867, "global_step": 529150, "epoch": 6375} {"train_loss": -27.59116554260254, "global_step": 529151, "epoch": 6375} {"train_loss": -27.427701950073242, "global_step": 529152, "epoch": 6375} {"train_loss": -27.56964111328125, "global_step": 529153, "epoch": 6375} {"train_loss": -27.626890182495117, "global_step": 529154, "epoch": 6375} {"train_loss": -27.517011642456055, "global_step": 529155, "epoch": 6375} {"train_loss": -27.454736709594727, "global_step": 529156, "epoch": 6375} {"train_loss": -27.698089599609375, "global_step": 529157, "epoch": 6375} {"train_loss": -27.825714111328125, "global_step": 529158, "epoch": 6375} {"train_loss": -27.52604103088379, "global_step": 529159, "epoch": 6375} {"train_loss": -27.568601608276367, "global_step": 529160, "epoch": 6375} {"train_loss": -27.674015045166016, "global_step": 529161, "epoch": 6375} {"train_loss": -27.75831413269043, "global_step": 529162, "epoch": 6375} {"train_loss": -27.6031494140625, "global_step": 529163, "epoch": 6375} {"train_loss": -27.07097816467285, "global_step": 529164, "epoch": 6375} {"train_loss": -27.65201759338379, "global_step": 529165, "epoch": 6375} {"train_loss": -27.312108993530273, "global_step": 529166, "epoch": 6375} {"train_loss": -27.87592124938965, "global_step": 529167, "epoch": 6375} {"train_loss": -27.48670768737793, "global_step": 529168, "epoch": 6375} {"train_loss": -27.607267379760742, "global_step": 529169, "epoch": 6375} {"train_loss": -27.686140060424805, "global_step": 529170, "epoch": 6375} {"train_loss": -27.844528198242188, "global_step": 529171, "epoch": 6375} {"train_loss": -27.54709815979004, "global_step": 529172, "epoch": 6375} {"train_loss": -27.539575576782227, "global_step": 529173, "epoch": 6375} {"train_loss": -27.681961059570312, "global_step": 529174, "epoch": 6375} {"train_loss": -27.63958740234375, "global_step": 529175, "epoch": 6375} {"train_loss": -27.481985092163086, "global_step": 529176, "epoch": 6375} {"train_loss": -27.49163818359375, "global_step": 529177, "epoch": 6375} {"train_loss": -27.60578727722168, "global_step": 529178, "epoch": 6375} {"train_loss": -27.752735137939453, "global_step": 529179, "epoch": 6375} {"train_loss": -27.448745727539062, "global_step": 529180, "epoch": 6375} {"train_loss": -27.539846420288086, "global_step": 529181, "epoch": 6375} {"train_loss": -27.892908096313477, "global_step": 529182, "epoch": 6375} {"train_loss": -28.162628173828125, "global_step": 529183, "epoch": 6375} {"train_loss": -27.61905288696289, "global_step": 529184, "epoch": 6375} {"train_loss": -27.531396865844727, "global_step": 529185, "epoch": 6375} {"train_loss": -28.088315963745117, "global_step": 529186, "epoch": 6375} {"train_loss": -27.117725372314453, "global_step": 529187, "epoch": 6375} {"train_loss": -27.466089248657227, "global_step": 529188, "epoch": 6375} {"train_loss": -27.279821395874023, "global_step": 529189, "epoch": 6375} {"train_loss": -27.667694091796875, "global_step": 529190, "epoch": 6375} {"train_loss": -27.6041259765625, "global_step": 529191, "epoch": 6375} {"train_loss": -27.686986923217773, "global_step": 529192, "epoch": 6375} {"train_loss": -27.559118270874023, "global_step": 529193, "epoch": 6375} {"train_loss": -27.460718154907227, "global_step": 529194, "epoch": 6375} {"train_loss": -27.75369644165039, "global_step": 529195, "epoch": 6375} {"train_loss": -27.59331703186035, "global_step": 529196, "epoch": 6375} {"train_loss": -27.87920570373535, "global_step": 529197, "epoch": 6375} {"train_loss": -27.83611488342285, "global_step": 529198, "epoch": 6375} {"train_loss": -27.3880615234375, "global_step": 529199, "epoch": 6375} {"train_loss": -27.733963012695312, "global_step": 529200, "epoch": 6375} {"train_loss": -27.659900665283203, "global_step": 529201, "epoch": 6375} {"train_loss": -27.485370635986328, "global_step": 529202, "epoch": 6375} {"train_loss": -27.546369552612305, "global_step": 529203, "epoch": 6375} {"train_loss": -27.713199615478516, "global_step": 529204, "epoch": 6375} {"train_loss": -27.378026962280273, "global_step": 529205, "epoch": 6375} {"train_loss": -27.722883224487305, "global_step": 529206, "epoch": 6375} {"train_loss": -27.397277303488856, "global_step": 529207, "epoch": 6375, "val_loss": 6532941.0} {"train_loss": -26.64032554626465, "global_step": 529208, "epoch": 6376} {"train_loss": -26.62287712097168, "global_step": 529209, "epoch": 6376} {"train_loss": -25.858169555664062, "global_step": 529210, "epoch": 6376} {"train_loss": -24.847658157348633, "global_step": 529211, "epoch": 6376} {"train_loss": -25.4599666595459, "global_step": 529212, "epoch": 6376} {"train_loss": -26.7325496673584, "global_step": 529213, "epoch": 6376} {"train_loss": -26.992284774780273, "global_step": 529214, "epoch": 6376} {"train_loss": -26.74127769470215, "global_step": 529215, "epoch": 6376} {"train_loss": -26.863616943359375, "global_step": 529216, "epoch": 6376} {"train_loss": -26.71860694885254, "global_step": 529217, "epoch": 6376} {"train_loss": -26.447111129760742, "global_step": 529218, "epoch": 6376} {"train_loss": -26.97627067565918, "global_step": 529219, "epoch": 6376} {"train_loss": -27.197031021118164, "global_step": 529220, "epoch": 6376} {"train_loss": -26.622528076171875, "global_step": 529221, "epoch": 6376} {"train_loss": -27.362396240234375, "global_step": 529222, "epoch": 6376} {"train_loss": -27.02471351623535, "global_step": 529223, "epoch": 6376} {"train_loss": -27.330163955688477, "global_step": 529224, "epoch": 6376} {"train_loss": -27.28900146484375, "global_step": 529225, "epoch": 6376} {"train_loss": -27.226842880249023, "global_step": 529226, "epoch": 6376} {"train_loss": -26.716217041015625, "global_step": 529227, "epoch": 6376} {"train_loss": -27.33682632446289, "global_step": 529228, "epoch": 6376} {"train_loss": -27.19695472717285, "global_step": 529229, "epoch": 6376} {"train_loss": -27.062942504882812, "global_step": 529230, "epoch": 6376} {"train_loss": -27.01685905456543, "global_step": 529231, "epoch": 6376} {"train_loss": -27.116809844970703, "global_step": 529232, "epoch": 6376} {"train_loss": -26.703475952148438, "global_step": 529233, "epoch": 6376} {"train_loss": -27.50847816467285, "global_step": 529234, "epoch": 6376} {"train_loss": -26.700040817260742, "global_step": 529235, "epoch": 6376} {"train_loss": -27.053083419799805, "global_step": 529236, "epoch": 6376} {"train_loss": -26.86183738708496, "global_step": 529237, "epoch": 6376} {"train_loss": -27.30254554748535, "global_step": 529238, "epoch": 6376} {"train_loss": -27.128259658813477, "global_step": 529239, "epoch": 6376} {"train_loss": -27.1772403717041, "global_step": 529240, "epoch": 6376} {"train_loss": -27.44219970703125, "global_step": 529241, "epoch": 6376} {"train_loss": -27.04621696472168, "global_step": 529242, "epoch": 6376} {"train_loss": -27.73746109008789, "global_step": 529243, "epoch": 6376} {"train_loss": -27.272703170776367, "global_step": 529244, "epoch": 6376} {"train_loss": -27.557373046875, "global_step": 529245, "epoch": 6376} {"train_loss": -27.394073486328125, "global_step": 529246, "epoch": 6376} {"train_loss": -27.390869140625, "global_step": 529247, "epoch": 6376} {"train_loss": -27.360702514648438, "global_step": 529248, "epoch": 6376} {"train_loss": -27.353124618530273, "global_step": 529249, "epoch": 6376} {"train_loss": -27.561614990234375, "global_step": 529250, "epoch": 6376} {"train_loss": -27.36207389831543, "global_step": 529251, "epoch": 6376} {"train_loss": -27.646100997924805, "global_step": 529252, "epoch": 6376} {"train_loss": -27.596343994140625, "global_step": 529253, "epoch": 6376} {"train_loss": -27.48328971862793, "global_step": 529254, "epoch": 6376} {"train_loss": -27.61090087890625, "global_step": 529255, "epoch": 6376} {"train_loss": -27.81133460998535, "global_step": 529256, "epoch": 6376} {"train_loss": -27.4121150970459, "global_step": 529257, "epoch": 6376} {"train_loss": -27.76898765563965, "global_step": 529258, "epoch": 6376} {"train_loss": -27.55177879333496, "global_step": 529259, "epoch": 6376} {"train_loss": -27.591846466064453, "global_step": 529260, "epoch": 6376} {"train_loss": -27.678543090820312, "global_step": 529261, "epoch": 6376} {"train_loss": -27.1001033782959, "global_step": 529262, "epoch": 6376} {"train_loss": -27.46244239807129, "global_step": 529263, "epoch": 6376} {"train_loss": -27.83758544921875, "global_step": 529264, "epoch": 6376} {"train_loss": -27.567874908447266, "global_step": 529265, "epoch": 6376} {"train_loss": -27.681509017944336, "global_step": 529266, "epoch": 6376} {"train_loss": -27.076467514038086, "global_step": 529267, "epoch": 6376} {"train_loss": -27.44630241394043, "global_step": 529268, "epoch": 6376} {"train_loss": -27.479248046875, "global_step": 529269, "epoch": 6376} {"train_loss": -27.4971981048584, "global_step": 529270, "epoch": 6376} {"train_loss": -27.692081451416016, "global_step": 529271, "epoch": 6376} {"train_loss": -27.157611846923828, "global_step": 529272, "epoch": 6376} {"train_loss": -27.741926193237305, "global_step": 529273, "epoch": 6376} {"train_loss": -27.42412757873535, "global_step": 529274, "epoch": 6376} {"train_loss": -27.765262603759766, "global_step": 529275, "epoch": 6376} {"train_loss": -27.270902633666992, "global_step": 529276, "epoch": 6376} {"train_loss": -27.687957763671875, "global_step": 529277, "epoch": 6376} {"train_loss": -27.452436447143555, "global_step": 529278, "epoch": 6376} {"train_loss": -27.46491813659668, "global_step": 529279, "epoch": 6376} {"train_loss": -27.639368057250977, "global_step": 529280, "epoch": 6376} {"train_loss": -27.663354873657227, "global_step": 529281, "epoch": 6376} {"train_loss": -27.771713256835938, "global_step": 529282, "epoch": 6376} {"train_loss": -27.64168357849121, "global_step": 529283, "epoch": 6376} {"train_loss": -27.4100341796875, "global_step": 529284, "epoch": 6376} {"train_loss": -27.68098258972168, "global_step": 529285, "epoch": 6376} {"train_loss": -27.548452377319336, "global_step": 529286, "epoch": 6376} {"train_loss": -27.84222412109375, "global_step": 529287, "epoch": 6376} {"train_loss": -27.750640869140625, "global_step": 529288, "epoch": 6376} {"train_loss": -27.870975494384766, "global_step": 529289, "epoch": 6376} {"train_loss": -27.280396404036555, "global_step": 529290, "epoch": 6376, "val_loss": 6535991.0} {"train_loss": -24.681936264038086, "global_step": 529291, "epoch": 6377} {"train_loss": -25.52202606201172, "global_step": 529292, "epoch": 6377} {"train_loss": -24.916748046875, "global_step": 529293, "epoch": 6377} {"train_loss": -25.49385643005371, "global_step": 529294, "epoch": 6377} {"train_loss": -25.642929077148438, "global_step": 529295, "epoch": 6377} {"train_loss": -26.793859481811523, "global_step": 529296, "epoch": 6377} {"train_loss": -26.294605255126953, "global_step": 529297, "epoch": 6377} {"train_loss": -26.194122314453125, "global_step": 529298, "epoch": 6377} {"train_loss": -27.069669723510742, "global_step": 529299, "epoch": 6377} {"train_loss": -26.349828720092773, "global_step": 529300, "epoch": 6377} {"train_loss": -25.831750869750977, "global_step": 529301, "epoch": 6377} {"train_loss": -26.582639694213867, "global_step": 529302, "epoch": 6377} {"train_loss": -26.485437393188477, "global_step": 529303, "epoch": 6377} {"train_loss": -26.86565589904785, "global_step": 529304, "epoch": 6377} {"train_loss": -26.347360610961914, "global_step": 529305, "epoch": 6377} {"train_loss": -26.382099151611328, "global_step": 529306, "epoch": 6377} {"train_loss": -26.960285186767578, "global_step": 529307, "epoch": 6377} {"train_loss": -26.996631622314453, "global_step": 529308, "epoch": 6377} {"train_loss": -26.51789665222168, "global_step": 529309, "epoch": 6377} {"train_loss": -27.112171173095703, "global_step": 529310, "epoch": 6377} {"train_loss": -26.980566024780273, "global_step": 529311, "epoch": 6377} {"train_loss": -27.444263458251953, "global_step": 529312, "epoch": 6377} {"train_loss": -26.975873947143555, "global_step": 529313, "epoch": 6377} {"train_loss": -27.001617431640625, "global_step": 529314, "epoch": 6377} {"train_loss": -27.143508911132812, "global_step": 529315, "epoch": 6377} {"train_loss": -27.229124069213867, "global_step": 529316, "epoch": 6377} {"train_loss": -27.316503524780273, "global_step": 529317, "epoch": 6377} {"train_loss": -27.10255241394043, "global_step": 529318, "epoch": 6377} {"train_loss": -27.24116325378418, "global_step": 529319, "epoch": 6377} {"train_loss": -27.150196075439453, "global_step": 529320, "epoch": 6377} {"train_loss": -27.240503311157227, "global_step": 529321, "epoch": 6377} {"train_loss": -26.986963272094727, "global_step": 529322, "epoch": 6377} {"train_loss": -27.5195369720459, "global_step": 529323, "epoch": 6377} {"train_loss": -27.18398094177246, "global_step": 529324, "epoch": 6377} {"train_loss": -27.50333023071289, "global_step": 529325, "epoch": 6377} {"train_loss": -27.4674015045166, "global_step": 529326, "epoch": 6377} {"train_loss": -27.24336051940918, "global_step": 529327, "epoch": 6377} {"train_loss": -27.296506881713867, "global_step": 529328, "epoch": 6377} {"train_loss": -27.35346031188965, "global_step": 529329, "epoch": 6377} {"train_loss": -27.47916030883789, "global_step": 529330, "epoch": 6377} {"train_loss": -27.3551025390625, "global_step": 529331, "epoch": 6377} {"train_loss": -27.537389755249023, "global_step": 529332, "epoch": 6377} {"train_loss": -27.64408302307129, "global_step": 529333, "epoch": 6377} {"train_loss": -27.618005752563477, "global_step": 529334, "epoch": 6377} {"train_loss": -27.701013565063477, "global_step": 529335, "epoch": 6377} {"train_loss": -27.283597946166992, "global_step": 529336, "epoch": 6377} {"train_loss": -27.91688346862793, "global_step": 529337, "epoch": 6377} {"train_loss": -27.6016845703125, "global_step": 529338, "epoch": 6377} {"train_loss": -27.586505889892578, "global_step": 529339, "epoch": 6377} {"train_loss": -27.594541549682617, "global_step": 529340, "epoch": 6377} {"train_loss": -27.806583404541016, "global_step": 529341, "epoch": 6377} {"train_loss": -28.13125991821289, "global_step": 529342, "epoch": 6377} {"train_loss": -27.64950942993164, "global_step": 529343, "epoch": 6377} {"train_loss": -27.754507064819336, "global_step": 529344, "epoch": 6377} {"train_loss": -27.528894424438477, "global_step": 529345, "epoch": 6377} {"train_loss": -27.60091209411621, "global_step": 529346, "epoch": 6377} {"train_loss": -27.741744995117188, "global_step": 529347, "epoch": 6377} {"train_loss": -27.718473434448242, "global_step": 529348, "epoch": 6377} {"train_loss": -27.85809898376465, "global_step": 529349, "epoch": 6377} {"train_loss": -27.68490982055664, "global_step": 529350, "epoch": 6377} {"train_loss": -27.871994018554688, "global_step": 529351, "epoch": 6377} {"train_loss": -28.01847267150879, "global_step": 529352, "epoch": 6377} {"train_loss": -28.220046997070312, "global_step": 529353, "epoch": 6377} {"train_loss": -27.673124313354492, "global_step": 529354, "epoch": 6377} {"train_loss": -27.8649845123291, "global_step": 529355, "epoch": 6377} {"train_loss": -27.5406436920166, "global_step": 529356, "epoch": 6377} {"train_loss": -27.55561637878418, "global_step": 529357, "epoch": 6377} {"train_loss": -27.86016273498535, "global_step": 529358, "epoch": 6377} {"train_loss": -27.96484375, "global_step": 529359, "epoch": 6377} {"train_loss": -27.625844955444336, "global_step": 529360, "epoch": 6377} {"train_loss": -27.364978790283203, "global_step": 529361, "epoch": 6377} {"train_loss": -27.378494262695312, "global_step": 529362, "epoch": 6377} {"train_loss": -28.2628116607666, "global_step": 529363, "epoch": 6377} {"train_loss": -27.84376335144043, "global_step": 529364, "epoch": 6377} {"train_loss": -27.465845108032227, "global_step": 529365, "epoch": 6377} {"train_loss": -27.299835205078125, "global_step": 529366, "epoch": 6377} {"train_loss": -27.611181259155273, "global_step": 529367, "epoch": 6377} {"train_loss": -27.440282821655273, "global_step": 529368, "epoch": 6377} {"train_loss": -27.43994140625, "global_step": 529369, "epoch": 6377} {"train_loss": -27.062732696533203, "global_step": 529370, "epoch": 6377} {"train_loss": -27.44996452331543, "global_step": 529371, "epoch": 6377} {"train_loss": -27.54566764831543, "global_step": 529372, "epoch": 6377} {"train_loss": -27.226825392389873, "global_step": 529373, "epoch": 6377, "val_loss": 6585308.0} {"train_loss": -26.1844482421875, "global_step": 529374, "epoch": 6378} {"train_loss": -26.275623321533203, "global_step": 529375, "epoch": 6378} {"train_loss": -25.6530704498291, "global_step": 529376, "epoch": 6378} {"train_loss": -26.619598388671875, "global_step": 529377, "epoch": 6378} {"train_loss": -26.422515869140625, "global_step": 529378, "epoch": 6378} {"train_loss": -26.10467529296875, "global_step": 529379, "epoch": 6378} {"train_loss": -26.663288116455078, "global_step": 529380, "epoch": 6378} {"train_loss": -26.616119384765625, "global_step": 529381, "epoch": 6378} {"train_loss": -25.783679962158203, "global_step": 529382, "epoch": 6378} {"train_loss": -27.097517013549805, "global_step": 529383, "epoch": 6378} {"train_loss": -26.239276885986328, "global_step": 529384, "epoch": 6378} {"train_loss": -27.0220890045166, "global_step": 529385, "epoch": 6378} {"train_loss": -26.544330596923828, "global_step": 529386, "epoch": 6378} {"train_loss": -27.252126693725586, "global_step": 529387, "epoch": 6378} {"train_loss": -26.818510055541992, "global_step": 529388, "epoch": 6378} {"train_loss": -26.794818878173828, "global_step": 529389, "epoch": 6378} {"train_loss": -26.86929702758789, "global_step": 529390, "epoch": 6378} {"train_loss": -26.976642608642578, "global_step": 529391, "epoch": 6378} {"train_loss": -27.23894691467285, "global_step": 529392, "epoch": 6378} {"train_loss": -27.027692794799805, "global_step": 529393, "epoch": 6378} {"train_loss": -26.84891700744629, "global_step": 529394, "epoch": 6378} {"train_loss": -26.994953155517578, "global_step": 529395, "epoch": 6378} {"train_loss": -27.11496925354004, "global_step": 529396, "epoch": 6378} {"train_loss": -27.586084365844727, "global_step": 529397, "epoch": 6378} {"train_loss": -27.295007705688477, "global_step": 529398, "epoch": 6378} {"train_loss": -27.350021362304688, "global_step": 529399, "epoch": 6378} {"train_loss": -27.48432731628418, "global_step": 529400, "epoch": 6378} {"train_loss": -27.580951690673828, "global_step": 529401, "epoch": 6378} {"train_loss": -27.657556533813477, "global_step": 529402, "epoch": 6378} {"train_loss": -27.300500869750977, "global_step": 529403, "epoch": 6378} {"train_loss": -27.305572509765625, "global_step": 529404, "epoch": 6378} {"train_loss": -27.47804069519043, "global_step": 529405, "epoch": 6378} {"train_loss": -27.5304012298584, "global_step": 529406, "epoch": 6378} {"train_loss": -27.669660568237305, "global_step": 529407, "epoch": 6378} {"train_loss": -27.607452392578125, "global_step": 529408, "epoch": 6378} {"train_loss": -28.07192039489746, "global_step": 529409, "epoch": 6378} {"train_loss": -27.23118019104004, "global_step": 529410, "epoch": 6378} {"train_loss": -27.66476821899414, "global_step": 529411, "epoch": 6378} {"train_loss": -27.1906681060791, "global_step": 529412, "epoch": 6378} {"train_loss": -27.375110626220703, "global_step": 529413, "epoch": 6378} {"train_loss": -27.80755043029785, "global_step": 529414, "epoch": 6378} {"train_loss": -27.175565719604492, "global_step": 529415, "epoch": 6378} {"train_loss": -27.478015899658203, "global_step": 529416, "epoch": 6378} {"train_loss": -27.838653564453125, "global_step": 529417, "epoch": 6378} {"train_loss": -27.60308265686035, "global_step": 529418, "epoch": 6378} {"train_loss": -27.86138343811035, "global_step": 529419, "epoch": 6378} {"train_loss": -27.638708114624023, "global_step": 529420, "epoch": 6378} {"train_loss": -28.114953994750977, "global_step": 529421, "epoch": 6378} {"train_loss": -28.048254013061523, "global_step": 529422, "epoch": 6378} {"train_loss": -28.00390625, "global_step": 529423, "epoch": 6378} {"train_loss": -28.1212158203125, "global_step": 529424, "epoch": 6378} {"train_loss": -27.93505859375, "global_step": 529425, "epoch": 6378} {"train_loss": -27.75311279296875, "global_step": 529426, "epoch": 6378} {"train_loss": -27.643320083618164, "global_step": 529427, "epoch": 6378} {"train_loss": -27.453327178955078, "global_step": 529428, "epoch": 6378} {"train_loss": -27.74538230895996, "global_step": 529429, "epoch": 6378} {"train_loss": -27.716754913330078, "global_step": 529430, "epoch": 6378} {"train_loss": -28.005691528320312, "global_step": 529431, "epoch": 6378} {"train_loss": -27.92549705505371, "global_step": 529432, "epoch": 6378} {"train_loss": -28.263593673706055, "global_step": 529433, "epoch": 6378} {"train_loss": -27.4410457611084, "global_step": 529434, "epoch": 6378} {"train_loss": -27.6104736328125, "global_step": 529435, "epoch": 6378} {"train_loss": -27.51857566833496, "global_step": 529436, "epoch": 6378} {"train_loss": -27.672693252563477, "global_step": 529437, "epoch": 6378} {"train_loss": -27.6108455657959, "global_step": 529438, "epoch": 6378} {"train_loss": -27.7559871673584, "global_step": 529439, "epoch": 6378} {"train_loss": -27.8149471282959, "global_step": 529440, "epoch": 6378} {"train_loss": -27.708438873291016, "global_step": 529441, "epoch": 6378} {"train_loss": -27.784626007080078, "global_step": 529442, "epoch": 6378} {"train_loss": -27.862668991088867, "global_step": 529443, "epoch": 6378} {"train_loss": -27.632038116455078, "global_step": 529444, "epoch": 6378} {"train_loss": -27.600759506225586, "global_step": 529445, "epoch": 6378} {"train_loss": -27.328556060791016, "global_step": 529446, "epoch": 6378} {"train_loss": -27.731510162353516, "global_step": 529447, "epoch": 6378} {"train_loss": -28.044174194335938, "global_step": 529448, "epoch": 6378} {"train_loss": -27.826690673828125, "global_step": 529449, "epoch": 6378} {"train_loss": -27.719858169555664, "global_step": 529450, "epoch": 6378} {"train_loss": -27.5853214263916, "global_step": 529451, "epoch": 6378} {"train_loss": -27.884326934814453, "global_step": 529452, "epoch": 6378} {"train_loss": -26.9811954498291, "global_step": 529453, "epoch": 6378} {"train_loss": -27.745344161987305, "global_step": 529454, "epoch": 6378} {"train_loss": -27.605985641479492, "global_step": 529455, "epoch": 6378} {"train_loss": -27.38935146561588, "global_step": 529456, "epoch": 6378, "val_loss": 6596864.0} {"train_loss": -26.1339168548584, "global_step": 529457, "epoch": 6379} {"train_loss": -25.402494430541992, "global_step": 529458, "epoch": 6379} {"train_loss": -25.914875030517578, "global_step": 529459, "epoch": 6379} {"train_loss": -26.1637020111084, "global_step": 529460, "epoch": 6379} {"train_loss": -26.7598876953125, "global_step": 529461, "epoch": 6379} {"train_loss": -27.352771759033203, "global_step": 529462, "epoch": 6379} {"train_loss": -26.40570068359375, "global_step": 529463, "epoch": 6379} {"train_loss": -26.992889404296875, "global_step": 529464, "epoch": 6379} {"train_loss": -26.94849967956543, "global_step": 529465, "epoch": 6379} {"train_loss": -26.599964141845703, "global_step": 529466, "epoch": 6379} {"train_loss": -26.964384078979492, "global_step": 529467, "epoch": 6379} {"train_loss": -26.899459838867188, "global_step": 529468, "epoch": 6379} {"train_loss": -27.35017967224121, "global_step": 529469, "epoch": 6379} {"train_loss": -26.997648239135742, "global_step": 529470, "epoch": 6379} {"train_loss": -27.166126251220703, "global_step": 529471, "epoch": 6379} {"train_loss": -27.095199584960938, "global_step": 529472, "epoch": 6379} {"train_loss": -27.349401473999023, "global_step": 529473, "epoch": 6379} {"train_loss": -27.457000732421875, "global_step": 529474, "epoch": 6379} {"train_loss": -27.46917152404785, "global_step": 529475, "epoch": 6379} {"train_loss": -27.696271896362305, "global_step": 529476, "epoch": 6379} {"train_loss": -26.834293365478516, "global_step": 529477, "epoch": 6379} {"train_loss": -27.54432487487793, "global_step": 529478, "epoch": 6379} {"train_loss": -27.116811752319336, "global_step": 529479, "epoch": 6379} {"train_loss": -27.26812744140625, "global_step": 529480, "epoch": 6379} {"train_loss": -27.38667869567871, "global_step": 529481, "epoch": 6379} {"train_loss": -27.83513832092285, "global_step": 529482, "epoch": 6379} {"train_loss": -28.093976974487305, "global_step": 529483, "epoch": 6379} {"train_loss": -27.267934799194336, "global_step": 529484, "epoch": 6379} {"train_loss": -27.680830001831055, "global_step": 529485, "epoch": 6379} {"train_loss": -27.447601318359375, "global_step": 529486, "epoch": 6379} {"train_loss": -27.3107967376709, "global_step": 529487, "epoch": 6379} {"train_loss": -27.51889991760254, "global_step": 529488, "epoch": 6379} {"train_loss": -28.0202693939209, "global_step": 529489, "epoch": 6379} {"train_loss": -27.37750244140625, "global_step": 529490, "epoch": 6379} {"train_loss": -27.27783203125, "global_step": 529491, "epoch": 6379} {"train_loss": -27.28989601135254, "global_step": 529492, "epoch": 6379} {"train_loss": -27.911529541015625, "global_step": 529493, "epoch": 6379} {"train_loss": -27.565998077392578, "global_step": 529494, "epoch": 6379} {"train_loss": -27.370817184448242, "global_step": 529495, "epoch": 6379} {"train_loss": -27.453094482421875, "global_step": 529496, "epoch": 6379} {"train_loss": -27.70068359375, "global_step": 529497, "epoch": 6379} {"train_loss": -27.7547664642334, "global_step": 529498, "epoch": 6379} {"train_loss": -27.658111572265625, "global_step": 529499, "epoch": 6379} {"train_loss": -27.311023712158203, "global_step": 529500, "epoch": 6379} {"train_loss": -27.6857852935791, "global_step": 529501, "epoch": 6379} {"train_loss": -27.9185848236084, "global_step": 529502, "epoch": 6379} {"train_loss": -27.768335342407227, "global_step": 529503, "epoch": 6379} {"train_loss": -27.22779655456543, "global_step": 529504, "epoch": 6379} {"train_loss": -27.667407989501953, "global_step": 529505, "epoch": 6379} {"train_loss": -28.076160430908203, "global_step": 529506, "epoch": 6379} {"train_loss": -27.90669822692871, "global_step": 529507, "epoch": 6379} {"train_loss": -27.688953399658203, "global_step": 529508, "epoch": 6379} {"train_loss": -27.892553329467773, "global_step": 529509, "epoch": 6379} {"train_loss": -27.691640853881836, "global_step": 529510, "epoch": 6379} {"train_loss": -27.781768798828125, "global_step": 529511, "epoch": 6379} {"train_loss": -28.097644805908203, "global_step": 529512, "epoch": 6379} {"train_loss": -27.699377059936523, "global_step": 529513, "epoch": 6379} {"train_loss": -27.55568504333496, "global_step": 529514, "epoch": 6379} {"train_loss": -27.388263702392578, "global_step": 529515, "epoch": 6379} {"train_loss": -26.914020538330078, "global_step": 529516, "epoch": 6379} {"train_loss": -27.6376953125, "global_step": 529517, "epoch": 6379} {"train_loss": -27.352588653564453, "global_step": 529518, "epoch": 6379} {"train_loss": -27.484304428100586, "global_step": 529519, "epoch": 6379} {"train_loss": -26.933385848999023, "global_step": 529520, "epoch": 6379} {"train_loss": -27.406177520751953, "global_step": 529521, "epoch": 6379} {"train_loss": -27.337247848510742, "global_step": 529522, "epoch": 6379} {"train_loss": -27.748138427734375, "global_step": 529523, "epoch": 6379} {"train_loss": -27.3260555267334, "global_step": 529524, "epoch": 6379} {"train_loss": -27.6071720123291, "global_step": 529525, "epoch": 6379} {"train_loss": -27.168973922729492, "global_step": 529526, "epoch": 6379} {"train_loss": -27.571653366088867, "global_step": 529527, "epoch": 6379} {"train_loss": -27.769622802734375, "global_step": 529528, "epoch": 6379} {"train_loss": -27.311664581298828, "global_step": 529529, "epoch": 6379} {"train_loss": -27.454452514648438, "global_step": 529530, "epoch": 6379} {"train_loss": -27.855255126953125, "global_step": 529531, "epoch": 6379} {"train_loss": -27.2762508392334, "global_step": 529532, "epoch": 6379} {"train_loss": -27.49641227722168, "global_step": 529533, "epoch": 6379} {"train_loss": -27.326032638549805, "global_step": 529534, "epoch": 6379} {"train_loss": -27.2370662689209, "global_step": 529535, "epoch": 6379} {"train_loss": -27.71891212463379, "global_step": 529536, "epoch": 6379} {"train_loss": -27.434040069580078, "global_step": 529537, "epoch": 6379} {"train_loss": -27.560331344604492, "global_step": 529538, "epoch": 6379} {"train_loss": -27.353884662490294, "global_step": 529539, "epoch": 6379, "val_loss": 6597545.0} {"train_loss": -26.755613327026367, "global_step": 529540, "epoch": 6380} {"train_loss": -26.83111000061035, "global_step": 529541, "epoch": 6380} {"train_loss": -25.773406982421875, "global_step": 529542, "epoch": 6380} {"train_loss": -26.506866455078125, "global_step": 529543, "epoch": 6380} {"train_loss": -27.37646484375, "global_step": 529544, "epoch": 6380} {"train_loss": -26.47186279296875, "global_step": 529545, "epoch": 6380} {"train_loss": -26.26798439025879, "global_step": 529546, "epoch": 6380} {"train_loss": -27.36615562438965, "global_step": 529547, "epoch": 6380} {"train_loss": -26.820966720581055, "global_step": 529548, "epoch": 6380} {"train_loss": -27.183759689331055, "global_step": 529549, "epoch": 6380} {"train_loss": -26.955652236938477, "global_step": 529550, "epoch": 6380} {"train_loss": -26.692068099975586, "global_step": 529551, "epoch": 6380} {"train_loss": -27.083831787109375, "global_step": 529552, "epoch": 6380} {"train_loss": -27.092151641845703, "global_step": 529553, "epoch": 6380} {"train_loss": -27.36104393005371, "global_step": 529554, "epoch": 6380} {"train_loss": -27.414306640625, "global_step": 529555, "epoch": 6380} {"train_loss": -27.20782470703125, "global_step": 529556, "epoch": 6380} {"train_loss": -27.25495719909668, "global_step": 529557, "epoch": 6380} {"train_loss": -27.541706085205078, "global_step": 529558, "epoch": 6380} {"train_loss": -27.011621475219727, "global_step": 529559, "epoch": 6380} {"train_loss": -27.002981185913086, "global_step": 529560, "epoch": 6380} {"train_loss": -27.30897331237793, "global_step": 529561, "epoch": 6380} {"train_loss": -27.293476104736328, "global_step": 529562, "epoch": 6380} {"train_loss": -27.516828536987305, "global_step": 529563, "epoch": 6380} {"train_loss": -27.642316818237305, "global_step": 529564, "epoch": 6380} {"train_loss": -27.44294548034668, "global_step": 529565, "epoch": 6380} {"train_loss": -27.078359603881836, "global_step": 529566, "epoch": 6380} {"train_loss": -27.409088134765625, "global_step": 529567, "epoch": 6380} {"train_loss": -27.207324981689453, "global_step": 529568, "epoch": 6380} {"train_loss": -27.357824325561523, "global_step": 529569, "epoch": 6380} {"train_loss": -27.61651611328125, "global_step": 529570, "epoch": 6380} {"train_loss": -27.737390518188477, "global_step": 529571, "epoch": 6380} {"train_loss": -27.523395538330078, "global_step": 529572, "epoch": 6380} {"train_loss": -27.59967041015625, "global_step": 529573, "epoch": 6380} {"train_loss": -27.51410484313965, "global_step": 529574, "epoch": 6380} {"train_loss": -27.6513729095459, "global_step": 529575, "epoch": 6380} {"train_loss": -27.743179321289062, "global_step": 529576, "epoch": 6380} {"train_loss": -27.777820587158203, "global_step": 529577, "epoch": 6380} {"train_loss": -27.602752685546875, "global_step": 529578, "epoch": 6380} {"train_loss": -27.675146102905273, "global_step": 529579, "epoch": 6380} {"train_loss": -27.96409034729004, "global_step": 529580, "epoch": 6380} {"train_loss": -27.612533569335938, "global_step": 529581, "epoch": 6380} {"train_loss": -27.929183959960938, "global_step": 529582, "epoch": 6380} {"train_loss": -27.867895126342773, "global_step": 529583, "epoch": 6380} {"train_loss": -27.800800323486328, "global_step": 529584, "epoch": 6380} {"train_loss": -27.273807525634766, "global_step": 529585, "epoch": 6380} {"train_loss": -27.578210830688477, "global_step": 529586, "epoch": 6380} {"train_loss": -27.77396583557129, "global_step": 529587, "epoch": 6380} {"train_loss": -27.975202560424805, "global_step": 529588, "epoch": 6380} {"train_loss": -27.944787979125977, "global_step": 529589, "epoch": 6380} {"train_loss": -27.696609497070312, "global_step": 529590, "epoch": 6380} {"train_loss": -27.749258041381836, "global_step": 529591, "epoch": 6380} {"train_loss": -28.00188636779785, "global_step": 529592, "epoch": 6380} {"train_loss": -27.76299476623535, "global_step": 529593, "epoch": 6380} {"train_loss": -27.644092559814453, "global_step": 529594, "epoch": 6380} {"train_loss": -27.80488395690918, "global_step": 529595, "epoch": 6380} {"train_loss": -28.111127853393555, "global_step": 529596, "epoch": 6380} {"train_loss": -27.509262084960938, "global_step": 529597, "epoch": 6380} {"train_loss": -27.864154815673828, "global_step": 529598, "epoch": 6380} {"train_loss": -27.753812789916992, "global_step": 529599, "epoch": 6380} {"train_loss": -27.881330490112305, "global_step": 529600, "epoch": 6380} {"train_loss": -28.121103286743164, "global_step": 529601, "epoch": 6380} {"train_loss": -27.709152221679688, "global_step": 529602, "epoch": 6380} {"train_loss": -27.546945571899414, "global_step": 529603, "epoch": 6380} {"train_loss": -27.923791885375977, "global_step": 529604, "epoch": 6380} {"train_loss": -27.521203994750977, "global_step": 529605, "epoch": 6380} {"train_loss": -27.83993911743164, "global_step": 529606, "epoch": 6380} {"train_loss": -27.570941925048828, "global_step": 529607, "epoch": 6380} {"train_loss": -27.8289794921875, "global_step": 529608, "epoch": 6380} {"train_loss": -27.89177894592285, "global_step": 529609, "epoch": 6380} {"train_loss": -27.568954467773438, "global_step": 529610, "epoch": 6380} {"train_loss": -27.52016258239746, "global_step": 529611, "epoch": 6380} {"train_loss": -27.895177841186523, "global_step": 529612, "epoch": 6380} {"train_loss": -27.78217124938965, "global_step": 529613, "epoch": 6380} {"train_loss": -27.55316734313965, "global_step": 529614, "epoch": 6380} {"train_loss": -27.182119369506836, "global_step": 529615, "epoch": 6380} {"train_loss": -27.71238136291504, "global_step": 529616, "epoch": 6380} {"train_loss": -27.719839096069336, "global_step": 529617, "epoch": 6380} {"train_loss": -27.5753173828125, "global_step": 529618, "epoch": 6380} {"train_loss": -27.630634307861328, "global_step": 529619, "epoch": 6380} {"train_loss": -27.387357711791992, "global_step": 529620, "epoch": 6380} {"train_loss": -27.3023738861084, "global_step": 529621, "epoch": 6380} {"train_loss": -27.491818508469915, "global_step": 529622, "epoch": 6380, "val_loss": 6622927.5} {"train_loss": -26.981369018554688, "global_step": 529623, "epoch": 6381} {"train_loss": -27.066015243530273, "global_step": 529624, "epoch": 6381} {"train_loss": -26.883136749267578, "global_step": 529625, "epoch": 6381} {"train_loss": -27.14389419555664, "global_step": 529626, "epoch": 6381} {"train_loss": -26.84760093688965, "global_step": 529627, "epoch": 6381} {"train_loss": -27.070465087890625, "global_step": 529628, "epoch": 6381} {"train_loss": -27.42041015625, "global_step": 529629, "epoch": 6381} {"train_loss": -27.17988395690918, "global_step": 529630, "epoch": 6381} {"train_loss": -27.42108726501465, "global_step": 529631, "epoch": 6381} {"train_loss": -26.575607299804688, "global_step": 529632, "epoch": 6381} {"train_loss": -27.342208862304688, "global_step": 529633, "epoch": 6381} {"train_loss": -27.052154541015625, "global_step": 529634, "epoch": 6381} {"train_loss": -27.3052921295166, "global_step": 529635, "epoch": 6381} {"train_loss": -27.773990631103516, "global_step": 529636, "epoch": 6381} {"train_loss": -27.281644821166992, "global_step": 529637, "epoch": 6381} {"train_loss": -27.20783042907715, "global_step": 529638, "epoch": 6381} {"train_loss": -27.410348892211914, "global_step": 529639, "epoch": 6381} {"train_loss": -27.578989028930664, "global_step": 529640, "epoch": 6381} {"train_loss": -27.391223907470703, "global_step": 529641, "epoch": 6381} {"train_loss": -27.055591583251953, "global_step": 529642, "epoch": 6381} {"train_loss": -27.46795654296875, "global_step": 529643, "epoch": 6381} {"train_loss": -27.696308135986328, "global_step": 529644, "epoch": 6381} {"train_loss": -27.644861221313477, "global_step": 529645, "epoch": 6381} {"train_loss": -27.651098251342773, "global_step": 529646, "epoch": 6381} {"train_loss": -27.565916061401367, "global_step": 529647, "epoch": 6381} {"train_loss": -27.6459903717041, "global_step": 529648, "epoch": 6381} {"train_loss": -27.5040283203125, "global_step": 529649, "epoch": 6381} {"train_loss": -27.40559959411621, "global_step": 529650, "epoch": 6381} {"train_loss": -27.54050064086914, "global_step": 529651, "epoch": 6381} {"train_loss": -27.554798126220703, "global_step": 529652, "epoch": 6381} {"train_loss": -27.403234481811523, "global_step": 529653, "epoch": 6381} {"train_loss": -27.26199722290039, "global_step": 529654, "epoch": 6381} {"train_loss": -27.780729293823242, "global_step": 529655, "epoch": 6381} {"train_loss": -27.808801651000977, "global_step": 529656, "epoch": 6381} {"train_loss": -27.607196807861328, "global_step": 529657, "epoch": 6381} {"train_loss": -27.846609115600586, "global_step": 529658, "epoch": 6381} {"train_loss": -27.85028648376465, "global_step": 529659, "epoch": 6381} {"train_loss": -28.112051010131836, "global_step": 529660, "epoch": 6381} {"train_loss": -27.59998893737793, "global_step": 529661, "epoch": 6381} {"train_loss": -27.532470703125, "global_step": 529662, "epoch": 6381} {"train_loss": -27.99947166442871, "global_step": 529663, "epoch": 6381} {"train_loss": -27.83997917175293, "global_step": 529664, "epoch": 6381} {"train_loss": -27.78680992126465, "global_step": 529665, "epoch": 6381} {"train_loss": -27.32126235961914, "global_step": 529666, "epoch": 6381} {"train_loss": -27.258325576782227, "global_step": 529667, "epoch": 6381} {"train_loss": -27.795629501342773, "global_step": 529668, "epoch": 6381} {"train_loss": -27.695632934570312, "global_step": 529669, "epoch": 6381} {"train_loss": -27.6726016998291, "global_step": 529670, "epoch": 6381} {"train_loss": -27.69514274597168, "global_step": 529671, "epoch": 6381} {"train_loss": -27.31369972229004, "global_step": 529672, "epoch": 6381} {"train_loss": -27.440677642822266, "global_step": 529673, "epoch": 6381} {"train_loss": -27.533615112304688, "global_step": 529674, "epoch": 6381} {"train_loss": -27.57512855529785, "global_step": 529675, "epoch": 6381} {"train_loss": -28.176010131835938, "global_step": 529676, "epoch": 6381} {"train_loss": -27.635498046875, "global_step": 529677, "epoch": 6381} {"train_loss": -28.163848876953125, "global_step": 529678, "epoch": 6381} {"train_loss": -27.502416610717773, "global_step": 529679, "epoch": 6381} {"train_loss": -27.991682052612305, "global_step": 529680, "epoch": 6381} {"train_loss": -28.123920440673828, "global_step": 529681, "epoch": 6381} {"train_loss": -27.55537986755371, "global_step": 529682, "epoch": 6381} {"train_loss": -27.5772647857666, "global_step": 529683, "epoch": 6381} {"train_loss": -27.947799682617188, "global_step": 529684, "epoch": 6381} {"train_loss": -27.238733291625977, "global_step": 529685, "epoch": 6381} {"train_loss": -27.723072052001953, "global_step": 529686, "epoch": 6381} {"train_loss": -27.7200984954834, "global_step": 529687, "epoch": 6381} {"train_loss": -27.63054847717285, "global_step": 529688, "epoch": 6381} {"train_loss": -27.861221313476562, "global_step": 529689, "epoch": 6381} {"train_loss": -27.756256103515625, "global_step": 529690, "epoch": 6381} {"train_loss": -27.481531143188477, "global_step": 529691, "epoch": 6381} {"train_loss": -27.9089298248291, "global_step": 529692, "epoch": 6381} {"train_loss": -27.5668888092041, "global_step": 529693, "epoch": 6381} {"train_loss": -27.484420776367188, "global_step": 529694, "epoch": 6381} {"train_loss": -27.654138565063477, "global_step": 529695, "epoch": 6381} {"train_loss": -27.711278915405273, "global_step": 529696, "epoch": 6381} {"train_loss": -27.7214412689209, "global_step": 529697, "epoch": 6381} {"train_loss": -27.796472549438477, "global_step": 529698, "epoch": 6381} {"train_loss": -27.921079635620117, "global_step": 529699, "epoch": 6381} {"train_loss": -27.19232749938965, "global_step": 529700, "epoch": 6381} {"train_loss": -26.640798568725586, "global_step": 529701, "epoch": 6381} {"train_loss": -26.747241973876953, "global_step": 529702, "epoch": 6381} {"train_loss": -27.627838134765625, "global_step": 529703, "epoch": 6381} {"train_loss": -27.583532333374023, "global_step": 529704, "epoch": 6381} {"train_loss": -27.520112692591656, "global_step": 529705, "epoch": 6381, "val_loss": 6620135.0} {"train_loss": -26.326894760131836, "global_step": 529706, "epoch": 6382} {"train_loss": -24.16596031188965, "global_step": 529707, "epoch": 6382} {"train_loss": -25.8760929107666, "global_step": 529708, "epoch": 6382} {"train_loss": -25.758840560913086, "global_step": 529709, "epoch": 6382} {"train_loss": -25.566650390625, "global_step": 529710, "epoch": 6382} {"train_loss": -26.33536148071289, "global_step": 529711, "epoch": 6382} {"train_loss": -26.199371337890625, "global_step": 529712, "epoch": 6382} {"train_loss": -25.654870986938477, "global_step": 529713, "epoch": 6382} {"train_loss": -26.749303817749023, "global_step": 529714, "epoch": 6382} {"train_loss": -26.13593101501465, "global_step": 529715, "epoch": 6382} {"train_loss": -26.702686309814453, "global_step": 529716, "epoch": 6382} {"train_loss": -26.615903854370117, "global_step": 529717, "epoch": 6382} {"train_loss": -26.376041412353516, "global_step": 529718, "epoch": 6382} {"train_loss": -26.50628662109375, "global_step": 529719, "epoch": 6382} {"train_loss": -26.692890167236328, "global_step": 529720, "epoch": 6382} {"train_loss": -26.755712509155273, "global_step": 529721, "epoch": 6382} {"train_loss": -26.84055519104004, "global_step": 529722, "epoch": 6382} {"train_loss": -26.705520629882812, "global_step": 529723, "epoch": 6382} {"train_loss": -27.33258056640625, "global_step": 529724, "epoch": 6382} {"train_loss": -27.204191207885742, "global_step": 529725, "epoch": 6382} {"train_loss": -26.870641708374023, "global_step": 529726, "epoch": 6382} {"train_loss": -26.870206832885742, "global_step": 529727, "epoch": 6382} {"train_loss": -27.438867568969727, "global_step": 529728, "epoch": 6382} {"train_loss": -27.429182052612305, "global_step": 529729, "epoch": 6382} {"train_loss": -26.936080932617188, "global_step": 529730, "epoch": 6382} {"train_loss": -27.254175186157227, "global_step": 529731, "epoch": 6382} {"train_loss": -27.626239776611328, "global_step": 529732, "epoch": 6382} {"train_loss": -26.678070068359375, "global_step": 529733, "epoch": 6382} {"train_loss": -27.2481632232666, "global_step": 529734, "epoch": 6382} {"train_loss": -27.29669761657715, "global_step": 529735, "epoch": 6382} {"train_loss": -27.6044921875, "global_step": 529736, "epoch": 6382} {"train_loss": -27.139768600463867, "global_step": 529737, "epoch": 6382} {"train_loss": -27.63336181640625, "global_step": 529738, "epoch": 6382} {"train_loss": -27.287494659423828, "global_step": 529739, "epoch": 6382} {"train_loss": -27.2164306640625, "global_step": 529740, "epoch": 6382} {"train_loss": -27.33724021911621, "global_step": 529741, "epoch": 6382} {"train_loss": -27.033172607421875, "global_step": 529742, "epoch": 6382} {"train_loss": -27.293914794921875, "global_step": 529743, "epoch": 6382} {"train_loss": -27.416217803955078, "global_step": 529744, "epoch": 6382} {"train_loss": -27.206256866455078, "global_step": 529745, "epoch": 6382} {"train_loss": -27.49045753479004, "global_step": 529746, "epoch": 6382} {"train_loss": -27.605976104736328, "global_step": 529747, "epoch": 6382} {"train_loss": -27.08229637145996, "global_step": 529748, "epoch": 6382} {"train_loss": -27.318952560424805, "global_step": 529749, "epoch": 6382} {"train_loss": -27.683853149414062, "global_step": 529750, "epoch": 6382} {"train_loss": -27.15485954284668, "global_step": 529751, "epoch": 6382} {"train_loss": -27.856494903564453, "global_step": 529752, "epoch": 6382} {"train_loss": -27.26386833190918, "global_step": 529753, "epoch": 6382} {"train_loss": -27.862075805664062, "global_step": 529754, "epoch": 6382} {"train_loss": -27.698383331298828, "global_step": 529755, "epoch": 6382} {"train_loss": -27.72747230529785, "global_step": 529756, "epoch": 6382} {"train_loss": -27.7912540435791, "global_step": 529757, "epoch": 6382} {"train_loss": -27.901569366455078, "global_step": 529758, "epoch": 6382} {"train_loss": -27.805469512939453, "global_step": 529759, "epoch": 6382} {"train_loss": -27.66347312927246, "global_step": 529760, "epoch": 6382} {"train_loss": -27.83551025390625, "global_step": 529761, "epoch": 6382} {"train_loss": -27.696088790893555, "global_step": 529762, "epoch": 6382} {"train_loss": -27.487722396850586, "global_step": 529763, "epoch": 6382} {"train_loss": -27.685047149658203, "global_step": 529764, "epoch": 6382} {"train_loss": -27.903018951416016, "global_step": 529765, "epoch": 6382} {"train_loss": -28.152027130126953, "global_step": 529766, "epoch": 6382} {"train_loss": -27.571516036987305, "global_step": 529767, "epoch": 6382} {"train_loss": -27.730304718017578, "global_step": 529768, "epoch": 6382} {"train_loss": -27.522626876831055, "global_step": 529769, "epoch": 6382} {"train_loss": -27.274768829345703, "global_step": 529770, "epoch": 6382} {"train_loss": -28.139089584350586, "global_step": 529771, "epoch": 6382} {"train_loss": -27.7834415435791, "global_step": 529772, "epoch": 6382} {"train_loss": -27.370227813720703, "global_step": 529773, "epoch": 6382} {"train_loss": -27.99360466003418, "global_step": 529774, "epoch": 6382} {"train_loss": -27.75838279724121, "global_step": 529775, "epoch": 6382} {"train_loss": -27.568700790405273, "global_step": 529776, "epoch": 6382} {"train_loss": -27.596338272094727, "global_step": 529777, "epoch": 6382} {"train_loss": -27.718671798706055, "global_step": 529778, "epoch": 6382} {"train_loss": -27.71390724182129, "global_step": 529779, "epoch": 6382} {"train_loss": -27.591007232666016, "global_step": 529780, "epoch": 6382} {"train_loss": -27.970809936523438, "global_step": 529781, "epoch": 6382} {"train_loss": -27.845306396484375, "global_step": 529782, "epoch": 6382} {"train_loss": -27.72354507446289, "global_step": 529783, "epoch": 6382} {"train_loss": -28.162710189819336, "global_step": 529784, "epoch": 6382} {"train_loss": -28.097021102905273, "global_step": 529785, "epoch": 6382} {"train_loss": -27.329696655273438, "global_step": 529786, "epoch": 6382} {"train_loss": -27.7813720703125, "global_step": 529787, "epoch": 6382} {"train_loss": -27.234281379056263, "global_step": 529788, "epoch": 6382, "val_loss": 6580851.0} {"train_loss": -26.807727813720703, "global_step": 529789, "epoch": 6383} {"train_loss": -26.877389907836914, "global_step": 529790, "epoch": 6383} {"train_loss": -26.263288497924805, "global_step": 529791, "epoch": 6383} {"train_loss": -25.551528930664062, "global_step": 529792, "epoch": 6383} {"train_loss": -25.837127685546875, "global_step": 529793, "epoch": 6383} {"train_loss": -27.10030174255371, "global_step": 529794, "epoch": 6383} {"train_loss": -26.6590576171875, "global_step": 529795, "epoch": 6383} {"train_loss": -27.51898765563965, "global_step": 529796, "epoch": 6383} {"train_loss": -27.43739891052246, "global_step": 529797, "epoch": 6383} {"train_loss": -26.98779296875, "global_step": 529798, "epoch": 6383} {"train_loss": -27.278181076049805, "global_step": 529799, "epoch": 6383} {"train_loss": -26.939838409423828, "global_step": 529800, "epoch": 6383} {"train_loss": -27.31817054748535, "global_step": 529801, "epoch": 6383} {"train_loss": -27.143299102783203, "global_step": 529802, "epoch": 6383} {"train_loss": -27.231473922729492, "global_step": 529803, "epoch": 6383} {"train_loss": -27.450109481811523, "global_step": 529804, "epoch": 6383} {"train_loss": -27.44630241394043, "global_step": 529805, "epoch": 6383} {"train_loss": -27.466781616210938, "global_step": 529806, "epoch": 6383} {"train_loss": -27.585285186767578, "global_step": 529807, "epoch": 6383} {"train_loss": -27.78700065612793, "global_step": 529808, "epoch": 6383} {"train_loss": -26.96563720703125, "global_step": 529809, "epoch": 6383} {"train_loss": -27.753625869750977, "global_step": 529810, "epoch": 6383} {"train_loss": -27.320816040039062, "global_step": 529811, "epoch": 6383} {"train_loss": -27.54959487915039, "global_step": 529812, "epoch": 6383} {"train_loss": -27.835174560546875, "global_step": 529813, "epoch": 6383} {"train_loss": -27.784183502197266, "global_step": 529814, "epoch": 6383} {"train_loss": -27.661115646362305, "global_step": 529815, "epoch": 6383} {"train_loss": -27.3220272064209, "global_step": 529816, "epoch": 6383} {"train_loss": -27.12546730041504, "global_step": 529817, "epoch": 6383} {"train_loss": -27.60561180114746, "global_step": 529818, "epoch": 6383} {"train_loss": -27.13306999206543, "global_step": 529819, "epoch": 6383} {"train_loss": -27.69783592224121, "global_step": 529820, "epoch": 6383} {"train_loss": -27.626413345336914, "global_step": 529821, "epoch": 6383} {"train_loss": -27.437795639038086, "global_step": 529822, "epoch": 6383} {"train_loss": -27.547555923461914, "global_step": 529823, "epoch": 6383} {"train_loss": -27.30735206604004, "global_step": 529824, "epoch": 6383} {"train_loss": -27.563074111938477, "global_step": 529825, "epoch": 6383} {"train_loss": -27.839609146118164, "global_step": 529826, "epoch": 6383} {"train_loss": -27.75249671936035, "global_step": 529827, "epoch": 6383} {"train_loss": -27.812973022460938, "global_step": 529828, "epoch": 6383} {"train_loss": -27.640790939331055, "global_step": 529829, "epoch": 6383} {"train_loss": -27.71030044555664, "global_step": 529830, "epoch": 6383} {"train_loss": -27.872528076171875, "global_step": 529831, "epoch": 6383} {"train_loss": -27.591064453125, "global_step": 529832, "epoch": 6383} {"train_loss": -27.895971298217773, "global_step": 529833, "epoch": 6383} {"train_loss": -27.47686767578125, "global_step": 529834, "epoch": 6383} {"train_loss": -27.60663414001465, "global_step": 529835, "epoch": 6383} {"train_loss": -27.4909725189209, "global_step": 529836, "epoch": 6383} {"train_loss": -27.440595626831055, "global_step": 529837, "epoch": 6383} {"train_loss": -27.178394317626953, "global_step": 529838, "epoch": 6383} {"train_loss": -27.792388916015625, "global_step": 529839, "epoch": 6383} {"train_loss": -27.540882110595703, "global_step": 529840, "epoch": 6383} {"train_loss": -27.560041427612305, "global_step": 529841, "epoch": 6383} {"train_loss": -27.828596115112305, "global_step": 529842, "epoch": 6383} {"train_loss": -27.309284210205078, "global_step": 529843, "epoch": 6383} {"train_loss": -27.903745651245117, "global_step": 529844, "epoch": 6383} {"train_loss": -27.619409561157227, "global_step": 529845, "epoch": 6383} {"train_loss": -27.711029052734375, "global_step": 529846, "epoch": 6383} {"train_loss": -27.918140411376953, "global_step": 529847, "epoch": 6383} {"train_loss": -27.642419815063477, "global_step": 529848, "epoch": 6383} {"train_loss": -27.115325927734375, "global_step": 529849, "epoch": 6383} {"train_loss": -27.5581111907959, "global_step": 529850, "epoch": 6383} {"train_loss": -27.96341896057129, "global_step": 529851, "epoch": 6383} {"train_loss": -27.71135902404785, "global_step": 529852, "epoch": 6383} {"train_loss": -27.522245407104492, "global_step": 529853, "epoch": 6383} {"train_loss": -27.26902198791504, "global_step": 529854, "epoch": 6383} {"train_loss": -27.128442764282227, "global_step": 529855, "epoch": 6383} {"train_loss": -27.56610107421875, "global_step": 529856, "epoch": 6383} {"train_loss": -27.6729736328125, "global_step": 529857, "epoch": 6383} {"train_loss": -26.83210563659668, "global_step": 529858, "epoch": 6383} {"train_loss": -27.016088485717773, "global_step": 529859, "epoch": 6383} {"train_loss": -27.741376876831055, "global_step": 529860, "epoch": 6383} {"train_loss": -27.34909439086914, "global_step": 529861, "epoch": 6383} {"train_loss": -27.30889320373535, "global_step": 529862, "epoch": 6383} {"train_loss": -27.409093856811523, "global_step": 529863, "epoch": 6383} {"train_loss": -27.374135971069336, "global_step": 529864, "epoch": 6383} {"train_loss": -26.92538833618164, "global_step": 529865, "epoch": 6383} {"train_loss": -27.746397018432617, "global_step": 529866, "epoch": 6383} {"train_loss": -26.908246994018555, "global_step": 529867, "epoch": 6383} {"train_loss": -27.183521270751953, "global_step": 529868, "epoch": 6383} {"train_loss": -27.334569931030273, "global_step": 529869, "epoch": 6383} {"train_loss": -27.880395889282227, "global_step": 529870, "epoch": 6383} {"train_loss": -27.382847085056536, "global_step": 529871, "epoch": 6383, "val_loss": 6613601.0} {"train_loss": -25.7751407623291, "global_step": 529872, "epoch": 6384} {"train_loss": -26.700103759765625, "global_step": 529873, "epoch": 6384} {"train_loss": -26.27740478515625, "global_step": 529874, "epoch": 6384} {"train_loss": -26.054052352905273, "global_step": 529875, "epoch": 6384} {"train_loss": -26.51177978515625, "global_step": 529876, "epoch": 6384} {"train_loss": -26.206775665283203, "global_step": 529877, "epoch": 6384} {"train_loss": -26.777875900268555, "global_step": 529878, "epoch": 6384} {"train_loss": -26.819997787475586, "global_step": 529879, "epoch": 6384} {"train_loss": -27.04465675354004, "global_step": 529880, "epoch": 6384} {"train_loss": -26.78584098815918, "global_step": 529881, "epoch": 6384} {"train_loss": -26.981122970581055, "global_step": 529882, "epoch": 6384} {"train_loss": -26.899267196655273, "global_step": 529883, "epoch": 6384} {"train_loss": -26.615631103515625, "global_step": 529884, "epoch": 6384} {"train_loss": -27.267475128173828, "global_step": 529885, "epoch": 6384} {"train_loss": -26.737640380859375, "global_step": 529886, "epoch": 6384} {"train_loss": -26.902002334594727, "global_step": 529887, "epoch": 6384} {"train_loss": -27.221221923828125, "global_step": 529888, "epoch": 6384} {"train_loss": -26.6348876953125, "global_step": 529889, "epoch": 6384} {"train_loss": -27.033533096313477, "global_step": 529890, "epoch": 6384} {"train_loss": -27.48675537109375, "global_step": 529891, "epoch": 6384} {"train_loss": -27.38943862915039, "global_step": 529892, "epoch": 6384} {"train_loss": -27.065893173217773, "global_step": 529893, "epoch": 6384} {"train_loss": -26.840192794799805, "global_step": 529894, "epoch": 6384} {"train_loss": -27.5900936126709, "global_step": 529895, "epoch": 6384} {"train_loss": -26.98923110961914, "global_step": 529896, "epoch": 6384} {"train_loss": -27.29628562927246, "global_step": 529897, "epoch": 6384} {"train_loss": -27.037160873413086, "global_step": 529898, "epoch": 6384} {"train_loss": -26.99382972717285, "global_step": 529899, "epoch": 6384} {"train_loss": -27.155078887939453, "global_step": 529900, "epoch": 6384} {"train_loss": -27.422260284423828, "global_step": 529901, "epoch": 6384} {"train_loss": -27.1213436126709, "global_step": 529902, "epoch": 6384} {"train_loss": -27.282718658447266, "global_step": 529903, "epoch": 6384} {"train_loss": -27.85902214050293, "global_step": 529904, "epoch": 6384} {"train_loss": -27.629743576049805, "global_step": 529905, "epoch": 6384} {"train_loss": -27.65223503112793, "global_step": 529906, "epoch": 6384} {"train_loss": -27.34033203125, "global_step": 529907, "epoch": 6384} {"train_loss": -27.898550033569336, "global_step": 529908, "epoch": 6384} {"train_loss": -27.388202667236328, "global_step": 529909, "epoch": 6384} {"train_loss": -27.5089054107666, "global_step": 529910, "epoch": 6384} {"train_loss": -27.3346004486084, "global_step": 529911, "epoch": 6384} {"train_loss": -27.43228530883789, "global_step": 529912, "epoch": 6384} {"train_loss": -27.655492782592773, "global_step": 529913, "epoch": 6384} {"train_loss": -27.535720825195312, "global_step": 529914, "epoch": 6384} {"train_loss": -27.4622859954834, "global_step": 529915, "epoch": 6384} {"train_loss": -27.7753963470459, "global_step": 529916, "epoch": 6384} {"train_loss": -27.497425079345703, "global_step": 529917, "epoch": 6384} {"train_loss": -27.384511947631836, "global_step": 529918, "epoch": 6384} {"train_loss": -27.524860382080078, "global_step": 529919, "epoch": 6384} {"train_loss": -27.40199851989746, "global_step": 529920, "epoch": 6384} {"train_loss": -27.3504581451416, "global_step": 529921, "epoch": 6384} {"train_loss": -27.415481567382812, "global_step": 529922, "epoch": 6384} {"train_loss": -27.868213653564453, "global_step": 529923, "epoch": 6384} {"train_loss": -27.52205467224121, "global_step": 529924, "epoch": 6384} {"train_loss": -27.47090721130371, "global_step": 529925, "epoch": 6384} {"train_loss": -27.736974716186523, "global_step": 529926, "epoch": 6384} {"train_loss": -27.901199340820312, "global_step": 529927, "epoch": 6384} {"train_loss": -27.813709259033203, "global_step": 529928, "epoch": 6384} {"train_loss": -27.692602157592773, "global_step": 529929, "epoch": 6384} {"train_loss": -27.590490341186523, "global_step": 529930, "epoch": 6384} {"train_loss": -27.524335861206055, "global_step": 529931, "epoch": 6384} {"train_loss": -27.80190086364746, "global_step": 529932, "epoch": 6384} {"train_loss": -27.571247100830078, "global_step": 529933, "epoch": 6384} {"train_loss": -27.687793731689453, "global_step": 529934, "epoch": 6384} {"train_loss": -27.213773727416992, "global_step": 529935, "epoch": 6384} {"train_loss": -27.656818389892578, "global_step": 529936, "epoch": 6384} {"train_loss": -27.858646392822266, "global_step": 529937, "epoch": 6384} {"train_loss": -27.891529083251953, "global_step": 529938, "epoch": 6384} {"train_loss": -27.86329460144043, "global_step": 529939, "epoch": 6384} {"train_loss": -27.887048721313477, "global_step": 529940, "epoch": 6384} {"train_loss": -27.7921142578125, "global_step": 529941, "epoch": 6384} {"train_loss": -27.6800594329834, "global_step": 529942, "epoch": 6384} {"train_loss": -27.622241973876953, "global_step": 529943, "epoch": 6384} {"train_loss": -27.684879302978516, "global_step": 529944, "epoch": 6384} {"train_loss": -27.804922103881836, "global_step": 529945, "epoch": 6384} {"train_loss": -27.535192489624023, "global_step": 529946, "epoch": 6384} {"train_loss": -27.635700225830078, "global_step": 529947, "epoch": 6384} {"train_loss": -27.7040958404541, "global_step": 529948, "epoch": 6384} {"train_loss": -27.62750244140625, "global_step": 529949, "epoch": 6384} {"train_loss": -27.63746452331543, "global_step": 529950, "epoch": 6384} {"train_loss": -27.3667049407959, "global_step": 529951, "epoch": 6384} {"train_loss": -27.464069366455078, "global_step": 529952, "epoch": 6384} {"train_loss": -27.629552841186523, "global_step": 529953, "epoch": 6384} {"train_loss": -27.333100790000824, "global_step": 529954, "epoch": 6384, "val_loss": 6547913.5} {"train_loss": -27.138818740844727, "global_step": 529955, "epoch": 6385} {"train_loss": -26.153532028198242, "global_step": 529956, "epoch": 6385} {"train_loss": -26.122451782226562, "global_step": 529957, "epoch": 6385} {"train_loss": -26.98590660095215, "global_step": 529958, "epoch": 6385} {"train_loss": -26.257287979125977, "global_step": 529959, "epoch": 6385} {"train_loss": -27.047956466674805, "global_step": 529960, "epoch": 6385} {"train_loss": -26.768991470336914, "global_step": 529961, "epoch": 6385} {"train_loss": -26.683515548706055, "global_step": 529962, "epoch": 6385} {"train_loss": -26.688932418823242, "global_step": 529963, "epoch": 6385} {"train_loss": -27.077924728393555, "global_step": 529964, "epoch": 6385} {"train_loss": -27.107465744018555, "global_step": 529965, "epoch": 6385} {"train_loss": -27.29194450378418, "global_step": 529966, "epoch": 6385} {"train_loss": -27.415271759033203, "global_step": 529967, "epoch": 6385} {"train_loss": -26.801267623901367, "global_step": 529968, "epoch": 6385} {"train_loss": -26.942108154296875, "global_step": 529969, "epoch": 6385} {"train_loss": -27.318628311157227, "global_step": 529970, "epoch": 6385} {"train_loss": -27.482473373413086, "global_step": 529971, "epoch": 6385} {"train_loss": -27.44716453552246, "global_step": 529972, "epoch": 6385} {"train_loss": -27.165563583374023, "global_step": 529973, "epoch": 6385} {"train_loss": -27.584070205688477, "global_step": 529974, "epoch": 6385} {"train_loss": -27.483922958374023, "global_step": 529975, "epoch": 6385} {"train_loss": -27.464862823486328, "global_step": 529976, "epoch": 6385} {"train_loss": -27.433496475219727, "global_step": 529977, "epoch": 6385} {"train_loss": -27.481225967407227, "global_step": 529978, "epoch": 6385} {"train_loss": -27.36356544494629, "global_step": 529979, "epoch": 6385} {"train_loss": -27.88652992248535, "global_step": 529980, "epoch": 6385} {"train_loss": -27.599750518798828, "global_step": 529981, "epoch": 6385} {"train_loss": -27.832494735717773, "global_step": 529982, "epoch": 6385} {"train_loss": -28.12890625, "global_step": 529983, "epoch": 6385} {"train_loss": -27.966815948486328, "global_step": 529984, "epoch": 6385} {"train_loss": -27.74567985534668, "global_step": 529985, "epoch": 6385} {"train_loss": -27.734189987182617, "global_step": 529986, "epoch": 6385} {"train_loss": -27.474878311157227, "global_step": 529987, "epoch": 6385} {"train_loss": -27.7282657623291, "global_step": 529988, "epoch": 6385} {"train_loss": -27.34431266784668, "global_step": 529989, "epoch": 6385} {"train_loss": -27.518198013305664, "global_step": 529990, "epoch": 6385} {"train_loss": -27.67603874206543, "global_step": 529991, "epoch": 6385} {"train_loss": -27.897424697875977, "global_step": 529992, "epoch": 6385} {"train_loss": -27.626205444335938, "global_step": 529993, "epoch": 6385} {"train_loss": -28.160938262939453, "global_step": 529994, "epoch": 6385} {"train_loss": -27.459741592407227, "global_step": 529995, "epoch": 6385} {"train_loss": -27.73647117614746, "global_step": 529996, "epoch": 6385} {"train_loss": -27.893508911132812, "global_step": 529997, "epoch": 6385} {"train_loss": -27.597970962524414, "global_step": 529998, "epoch": 6385} {"train_loss": -27.448205947875977, "global_step": 529999, "epoch": 6385} {"train_loss": -27.67384910583496, "global_step": 530000, "epoch": 6385} {"train_loss": -27.323566436767578, "global_step": 530001, "epoch": 6385} {"train_loss": -27.516611099243164, "global_step": 530002, "epoch": 6385} {"train_loss": -27.472440719604492, "global_step": 530003, "epoch": 6385} {"train_loss": -27.34638023376465, "global_step": 530004, "epoch": 6385} {"train_loss": -27.269636154174805, "global_step": 530005, "epoch": 6385} {"train_loss": -26.83390235900879, "global_step": 530006, "epoch": 6385} {"train_loss": -27.587247848510742, "global_step": 530007, "epoch": 6385} {"train_loss": -27.325159072875977, "global_step": 530008, "epoch": 6385} {"train_loss": -27.230941772460938, "global_step": 530009, "epoch": 6385} {"train_loss": -26.94825553894043, "global_step": 530010, "epoch": 6385} {"train_loss": -27.04010581970215, "global_step": 530011, "epoch": 6385} {"train_loss": -27.33070182800293, "global_step": 530012, "epoch": 6385} {"train_loss": -27.366384506225586, "global_step": 530013, "epoch": 6385} {"train_loss": -27.414794921875, "global_step": 530014, "epoch": 6385} {"train_loss": -26.975116729736328, "global_step": 530015, "epoch": 6385} {"train_loss": -26.97432518005371, "global_step": 530016, "epoch": 6385} {"train_loss": -26.823095321655273, "global_step": 530017, "epoch": 6385} {"train_loss": -26.931415557861328, "global_step": 530018, "epoch": 6385} {"train_loss": -26.928403854370117, "global_step": 530019, "epoch": 6385} {"train_loss": -27.348241806030273, "global_step": 530020, "epoch": 6385} {"train_loss": -26.78997802734375, "global_step": 530021, "epoch": 6385} {"train_loss": -27.11664390563965, "global_step": 530022, "epoch": 6385} {"train_loss": -27.450199127197266, "global_step": 530023, "epoch": 6385} {"train_loss": -27.20358657836914, "global_step": 530024, "epoch": 6385} {"train_loss": -27.65032386779785, "global_step": 530025, "epoch": 6385} {"train_loss": -27.445831298828125, "global_step": 530026, "epoch": 6385} {"train_loss": -27.422809600830078, "global_step": 530027, "epoch": 6385} {"train_loss": -27.435745239257812, "global_step": 530028, "epoch": 6385} {"train_loss": -27.1315860748291, "global_step": 530029, "epoch": 6385} {"train_loss": -27.12409019470215, "global_step": 530030, "epoch": 6385} {"train_loss": -27.187097549438477, "global_step": 530031, "epoch": 6385} {"train_loss": -27.71485710144043, "global_step": 530032, "epoch": 6385} {"train_loss": -27.43758201599121, "global_step": 530033, "epoch": 6385} {"train_loss": -27.648117065429688, "global_step": 530034, "epoch": 6385} {"train_loss": -27.624792098999023, "global_step": 530035, "epoch": 6385} {"train_loss": -27.50086784362793, "global_step": 530036, "epoch": 6385} {"train_loss": -27.327239346791462, "global_step": 530037, "epoch": 6385, "val_loss": 6588169.0} {"train_loss": -27.39161491394043, "global_step": 530038, "epoch": 6386} {"train_loss": -27.14081382751465, "global_step": 530039, "epoch": 6386} {"train_loss": -27.2669620513916, "global_step": 530040, "epoch": 6386} {"train_loss": -27.617284774780273, "global_step": 530041, "epoch": 6386} {"train_loss": -27.244125366210938, "global_step": 530042, "epoch": 6386} {"train_loss": -27.366138458251953, "global_step": 530043, "epoch": 6386} {"train_loss": -27.207569122314453, "global_step": 530044, "epoch": 6386} {"train_loss": -27.46721839904785, "global_step": 530045, "epoch": 6386} {"train_loss": -27.54775047302246, "global_step": 530046, "epoch": 6386} {"train_loss": -27.501834869384766, "global_step": 530047, "epoch": 6386} {"train_loss": -27.22637367248535, "global_step": 530048, "epoch": 6386} {"train_loss": -26.9034481048584, "global_step": 530049, "epoch": 6386} {"train_loss": -27.615127563476562, "global_step": 530050, "epoch": 6386} {"train_loss": -27.345661163330078, "global_step": 530051, "epoch": 6386} {"train_loss": -27.309335708618164, "global_step": 530052, "epoch": 6386} {"train_loss": -27.516223907470703, "global_step": 530053, "epoch": 6386} {"train_loss": -27.180444717407227, "global_step": 530054, "epoch": 6386} {"train_loss": -27.434326171875, "global_step": 530055, "epoch": 6386} {"train_loss": -27.38203239440918, "global_step": 530056, "epoch": 6386} {"train_loss": -27.3803653717041, "global_step": 530057, "epoch": 6386} {"train_loss": -27.47178077697754, "global_step": 530058, "epoch": 6386} {"train_loss": -27.09632682800293, "global_step": 530059, "epoch": 6386} {"train_loss": -27.96396827697754, "global_step": 530060, "epoch": 6386} {"train_loss": -27.152265548706055, "global_step": 530061, "epoch": 6386} {"train_loss": -27.714529037475586, "global_step": 530062, "epoch": 6386} {"train_loss": -27.155426025390625, "global_step": 530063, "epoch": 6386} {"train_loss": -27.472150802612305, "global_step": 530064, "epoch": 6386} {"train_loss": -27.620615005493164, "global_step": 530065, "epoch": 6386} {"train_loss": -27.59873390197754, "global_step": 530066, "epoch": 6386} {"train_loss": -27.614912033081055, "global_step": 530067, "epoch": 6386} {"train_loss": -27.39430046081543, "global_step": 530068, "epoch": 6386} {"train_loss": -27.590986251831055, "global_step": 530069, "epoch": 6386} {"train_loss": -27.328397750854492, "global_step": 530070, "epoch": 6386} {"train_loss": -27.489227294921875, "global_step": 530071, "epoch": 6386} {"train_loss": -27.898603439331055, "global_step": 530072, "epoch": 6386} {"train_loss": -27.7251033782959, "global_step": 530073, "epoch": 6386} {"train_loss": -27.899341583251953, "global_step": 530074, "epoch": 6386} {"train_loss": -27.637939453125, "global_step": 530075, "epoch": 6386} {"train_loss": -27.50676918029785, "global_step": 530076, "epoch": 6386} {"train_loss": -27.74029541015625, "global_step": 530077, "epoch": 6386} {"train_loss": -27.2420597076416, "global_step": 530078, "epoch": 6386} {"train_loss": -27.92131996154785, "global_step": 530079, "epoch": 6386} {"train_loss": -27.460535049438477, "global_step": 530080, "epoch": 6386} {"train_loss": -27.697158813476562, "global_step": 530081, "epoch": 6386} {"train_loss": -27.703128814697266, "global_step": 530082, "epoch": 6386} {"train_loss": -27.396848678588867, "global_step": 530083, "epoch": 6386} {"train_loss": -28.086170196533203, "global_step": 530084, "epoch": 6386} {"train_loss": -27.63813591003418, "global_step": 530085, "epoch": 6386} {"train_loss": -27.742053985595703, "global_step": 530086, "epoch": 6386} {"train_loss": -27.51250648498535, "global_step": 530087, "epoch": 6386} {"train_loss": -28.08782958984375, "global_step": 530088, "epoch": 6386} {"train_loss": -27.699499130249023, "global_step": 530089, "epoch": 6386} {"train_loss": -27.682836532592773, "global_step": 530090, "epoch": 6386} {"train_loss": -27.854047775268555, "global_step": 530091, "epoch": 6386} {"train_loss": -27.484272003173828, "global_step": 530092, "epoch": 6386} {"train_loss": -27.70985221862793, "global_step": 530093, "epoch": 6386} {"train_loss": -27.820743560791016, "global_step": 530094, "epoch": 6386} {"train_loss": -27.686939239501953, "global_step": 530095, "epoch": 6386} {"train_loss": -27.460987091064453, "global_step": 530096, "epoch": 6386} {"train_loss": -27.744482040405273, "global_step": 530097, "epoch": 6386} {"train_loss": -27.644245147705078, "global_step": 530098, "epoch": 6386} {"train_loss": -28.134387969970703, "global_step": 530099, "epoch": 6386} {"train_loss": -27.67005729675293, "global_step": 530100, "epoch": 6386} {"train_loss": -27.73907470703125, "global_step": 530101, "epoch": 6386} {"train_loss": -27.68857192993164, "global_step": 530102, "epoch": 6386} {"train_loss": -27.3197078704834, "global_step": 530103, "epoch": 6386} {"train_loss": -27.35957145690918, "global_step": 530104, "epoch": 6386} {"train_loss": -27.546979904174805, "global_step": 530105, "epoch": 6386} {"train_loss": -27.658843994140625, "global_step": 530106, "epoch": 6386} {"train_loss": -27.5809383392334, "global_step": 530107, "epoch": 6386} {"train_loss": -27.61460304260254, "global_step": 530108, "epoch": 6386} {"train_loss": -27.928064346313477, "global_step": 530109, "epoch": 6386} {"train_loss": -27.362409591674805, "global_step": 530110, "epoch": 6386} {"train_loss": -27.763946533203125, "global_step": 530111, "epoch": 6386} {"train_loss": -27.115772247314453, "global_step": 530112, "epoch": 6386} {"train_loss": -27.768695831298828, "global_step": 530113, "epoch": 6386} {"train_loss": -27.8011531829834, "global_step": 530114, "epoch": 6386} {"train_loss": -27.64373207092285, "global_step": 530115, "epoch": 6386} {"train_loss": -27.23353385925293, "global_step": 530116, "epoch": 6386} {"train_loss": -27.336872100830078, "global_step": 530117, "epoch": 6386} {"train_loss": -27.955846786499023, "global_step": 530118, "epoch": 6386} {"train_loss": -27.405553817749023, "global_step": 530119, "epoch": 6386} {"train_loss": -27.54006020419569, "global_step": 530120, "epoch": 6386, "val_loss": 6653160.5} {"train_loss": -25.886905670166016, "global_step": 530121, "epoch": 6387} {"train_loss": -25.405200958251953, "global_step": 530122, "epoch": 6387} {"train_loss": -25.673131942749023, "global_step": 530123, "epoch": 6387} {"train_loss": -25.9687442779541, "global_step": 530124, "epoch": 6387} {"train_loss": -26.0164737701416, "global_step": 530125, "epoch": 6387} {"train_loss": -25.648473739624023, "global_step": 530126, "epoch": 6387} {"train_loss": -26.56451988220215, "global_step": 530127, "epoch": 6387} {"train_loss": -25.854938507080078, "global_step": 530128, "epoch": 6387} {"train_loss": -26.17293357849121, "global_step": 530129, "epoch": 6387} {"train_loss": -26.674182891845703, "global_step": 530130, "epoch": 6387} {"train_loss": -26.32157325744629, "global_step": 530131, "epoch": 6387} {"train_loss": -26.578399658203125, "global_step": 530132, "epoch": 6387} {"train_loss": -26.5145320892334, "global_step": 530133, "epoch": 6387} {"train_loss": -26.084531784057617, "global_step": 530134, "epoch": 6387} {"train_loss": -26.666629791259766, "global_step": 530135, "epoch": 6387} {"train_loss": -26.60589027404785, "global_step": 530136, "epoch": 6387} {"train_loss": -26.409818649291992, "global_step": 530137, "epoch": 6387} {"train_loss": -26.960763931274414, "global_step": 530138, "epoch": 6387} {"train_loss": -27.039905548095703, "global_step": 530139, "epoch": 6387} {"train_loss": -26.912216186523438, "global_step": 530140, "epoch": 6387} {"train_loss": -26.99773597717285, "global_step": 530141, "epoch": 6387} {"train_loss": -27.237699508666992, "global_step": 530142, "epoch": 6387} {"train_loss": -26.9805908203125, "global_step": 530143, "epoch": 6387} {"train_loss": -26.948974609375, "global_step": 530144, "epoch": 6387} {"train_loss": -27.318899154663086, "global_step": 530145, "epoch": 6387} {"train_loss": -26.5721492767334, "global_step": 530146, "epoch": 6387} {"train_loss": -27.103269577026367, "global_step": 530147, "epoch": 6387} {"train_loss": -27.52915382385254, "global_step": 530148, "epoch": 6387} {"train_loss": -27.293176651000977, "global_step": 530149, "epoch": 6387} {"train_loss": -27.01108741760254, "global_step": 530150, "epoch": 6387} {"train_loss": -26.8820743560791, "global_step": 530151, "epoch": 6387} {"train_loss": -27.42450523376465, "global_step": 530152, "epoch": 6387} {"train_loss": -27.403614044189453, "global_step": 530153, "epoch": 6387} {"train_loss": -27.390050888061523, "global_step": 530154, "epoch": 6387} {"train_loss": -27.402942657470703, "global_step": 530155, "epoch": 6387} {"train_loss": -27.314605712890625, "global_step": 530156, "epoch": 6387} {"train_loss": -27.795856475830078, "global_step": 530157, "epoch": 6387} {"train_loss": -27.590045928955078, "global_step": 530158, "epoch": 6387} {"train_loss": -27.668676376342773, "global_step": 530159, "epoch": 6387} {"train_loss": -27.573469161987305, "global_step": 530160, "epoch": 6387} {"train_loss": -27.7305908203125, "global_step": 530161, "epoch": 6387} {"train_loss": -27.312759399414062, "global_step": 530162, "epoch": 6387} {"train_loss": -27.615955352783203, "global_step": 530163, "epoch": 6387} {"train_loss": -27.55633544921875, "global_step": 530164, "epoch": 6387} {"train_loss": -27.34051513671875, "global_step": 530165, "epoch": 6387} {"train_loss": -27.54072380065918, "global_step": 530166, "epoch": 6387} {"train_loss": -27.425643920898438, "global_step": 530167, "epoch": 6387} {"train_loss": -27.83013343811035, "global_step": 530168, "epoch": 6387} {"train_loss": -27.682586669921875, "global_step": 530169, "epoch": 6387} {"train_loss": -27.7023868560791, "global_step": 530170, "epoch": 6387} {"train_loss": -27.384748458862305, "global_step": 530171, "epoch": 6387} {"train_loss": -27.8256893157959, "global_step": 530172, "epoch": 6387} {"train_loss": -27.75086784362793, "global_step": 530173, "epoch": 6387} {"train_loss": -27.774429321289062, "global_step": 530174, "epoch": 6387} {"train_loss": -27.6481876373291, "global_step": 530175, "epoch": 6387} {"train_loss": -27.453969955444336, "global_step": 530176, "epoch": 6387} {"train_loss": -27.653379440307617, "global_step": 530177, "epoch": 6387} {"train_loss": -27.743371963500977, "global_step": 530178, "epoch": 6387} {"train_loss": -27.42336082458496, "global_step": 530179, "epoch": 6387} {"train_loss": -27.893421173095703, "global_step": 530180, "epoch": 6387} {"train_loss": -27.99289894104004, "global_step": 530181, "epoch": 6387} {"train_loss": -28.036117553710938, "global_step": 530182, "epoch": 6387} {"train_loss": -27.816465377807617, "global_step": 530183, "epoch": 6387} {"train_loss": -27.6756534576416, "global_step": 530184, "epoch": 6387} {"train_loss": -27.711639404296875, "global_step": 530185, "epoch": 6387} {"train_loss": -27.585058212280273, "global_step": 530186, "epoch": 6387} {"train_loss": -28.088623046875, "global_step": 530187, "epoch": 6387} {"train_loss": -27.402265548706055, "global_step": 530188, "epoch": 6387} {"train_loss": -27.490758895874023, "global_step": 530189, "epoch": 6387} {"train_loss": -27.67487907409668, "global_step": 530190, "epoch": 6387} {"train_loss": -27.597949981689453, "global_step": 530191, "epoch": 6387} {"train_loss": -27.737884521484375, "global_step": 530192, "epoch": 6387} {"train_loss": -27.300952911376953, "global_step": 530193, "epoch": 6387} {"train_loss": -27.766998291015625, "global_step": 530194, "epoch": 6387} {"train_loss": -27.63418960571289, "global_step": 530195, "epoch": 6387} {"train_loss": -27.79749870300293, "global_step": 530196, "epoch": 6387} {"train_loss": -27.470849990844727, "global_step": 530197, "epoch": 6387} {"train_loss": -28.32435417175293, "global_step": 530198, "epoch": 6387} {"train_loss": -27.716537475585938, "global_step": 530199, "epoch": 6387} {"train_loss": -27.641281127929688, "global_step": 530200, "epoch": 6387} {"train_loss": -27.5219669342041, "global_step": 530201, "epoch": 6387} {"train_loss": -27.567609786987305, "global_step": 530202, "epoch": 6387} {"train_loss": -27.24050338009754, "global_step": 530203, "epoch": 6387, "val_loss": 6549527.0} {"train_loss": -27.355712890625, "global_step": 530204, "epoch": 6388} {"train_loss": -26.66845703125, "global_step": 530205, "epoch": 6388} {"train_loss": -26.105966567993164, "global_step": 530206, "epoch": 6388} {"train_loss": -26.40158462524414, "global_step": 530207, "epoch": 6388} {"train_loss": -27.0908203125, "global_step": 530208, "epoch": 6388} {"train_loss": -26.471790313720703, "global_step": 530209, "epoch": 6388} {"train_loss": -26.93499755859375, "global_step": 530210, "epoch": 6388} {"train_loss": -27.1695556640625, "global_step": 530211, "epoch": 6388} {"train_loss": -27.084964752197266, "global_step": 530212, "epoch": 6388} {"train_loss": -27.37617301940918, "global_step": 530213, "epoch": 6388} {"train_loss": -27.240400314331055, "global_step": 530214, "epoch": 6388} {"train_loss": -27.50341796875, "global_step": 530215, "epoch": 6388} {"train_loss": -27.51068687438965, "global_step": 530216, "epoch": 6388} {"train_loss": -27.316492080688477, "global_step": 530217, "epoch": 6388} {"train_loss": -27.379199981689453, "global_step": 530218, "epoch": 6388} {"train_loss": -27.254079818725586, "global_step": 530219, "epoch": 6388} {"train_loss": -27.155454635620117, "global_step": 530220, "epoch": 6388} {"train_loss": -27.26824951171875, "global_step": 530221, "epoch": 6388} {"train_loss": -27.140100479125977, "global_step": 530222, "epoch": 6388} {"train_loss": -27.116418838500977, "global_step": 530223, "epoch": 6388} {"train_loss": -27.334793090820312, "global_step": 530224, "epoch": 6388} {"train_loss": -27.48402214050293, "global_step": 530225, "epoch": 6388} {"train_loss": -27.57958984375, "global_step": 530226, "epoch": 6388} {"train_loss": -27.71405029296875, "global_step": 530227, "epoch": 6388} {"train_loss": -27.836572647094727, "global_step": 530228, "epoch": 6388} {"train_loss": -27.489490509033203, "global_step": 530229, "epoch": 6388} {"train_loss": -27.644271850585938, "global_step": 530230, "epoch": 6388} {"train_loss": -27.61701011657715, "global_step": 530231, "epoch": 6388} {"train_loss": -27.340045928955078, "global_step": 530232, "epoch": 6388} {"train_loss": -27.679901123046875, "global_step": 530233, "epoch": 6388} {"train_loss": -27.34871482849121, "global_step": 530234, "epoch": 6388} {"train_loss": -27.433368682861328, "global_step": 530235, "epoch": 6388} {"train_loss": -27.83197021484375, "global_step": 530236, "epoch": 6388} {"train_loss": -27.732868194580078, "global_step": 530237, "epoch": 6388} {"train_loss": -27.531030654907227, "global_step": 530238, "epoch": 6388} {"train_loss": -27.603580474853516, "global_step": 530239, "epoch": 6388} {"train_loss": -27.676862716674805, "global_step": 530240, "epoch": 6388} {"train_loss": -27.48334312438965, "global_step": 530241, "epoch": 6388} {"train_loss": -27.53348731994629, "global_step": 530242, "epoch": 6388} {"train_loss": -27.652944564819336, "global_step": 530243, "epoch": 6388} {"train_loss": -27.5316104888916, "global_step": 530244, "epoch": 6388} {"train_loss": -27.86032485961914, "global_step": 530245, "epoch": 6388} {"train_loss": -27.49323081970215, "global_step": 530246, "epoch": 6388} {"train_loss": -27.631916046142578, "global_step": 530247, "epoch": 6388} {"train_loss": -27.7152042388916, "global_step": 530248, "epoch": 6388} {"train_loss": -27.880783081054688, "global_step": 530249, "epoch": 6388} {"train_loss": -27.8389949798584, "global_step": 530250, "epoch": 6388} {"train_loss": -27.82757568359375, "global_step": 530251, "epoch": 6388} {"train_loss": -27.629785537719727, "global_step": 530252, "epoch": 6388} {"train_loss": -27.7731990814209, "global_step": 530253, "epoch": 6388} {"train_loss": -28.229990005493164, "global_step": 530254, "epoch": 6388} {"train_loss": -27.819812774658203, "global_step": 530255, "epoch": 6388} {"train_loss": -27.714435577392578, "global_step": 530256, "epoch": 6388} {"train_loss": -27.764728546142578, "global_step": 530257, "epoch": 6388} {"train_loss": -27.624128341674805, "global_step": 530258, "epoch": 6388} {"train_loss": -27.304473876953125, "global_step": 530259, "epoch": 6388} {"train_loss": -27.562301635742188, "global_step": 530260, "epoch": 6388} {"train_loss": -27.376752853393555, "global_step": 530261, "epoch": 6388} {"train_loss": -27.189123153686523, "global_step": 530262, "epoch": 6388} {"train_loss": -27.27424430847168, "global_step": 530263, "epoch": 6388} {"train_loss": -27.343555450439453, "global_step": 530264, "epoch": 6388} {"train_loss": -27.61677360534668, "global_step": 530265, "epoch": 6388} {"train_loss": -27.40662956237793, "global_step": 530266, "epoch": 6388} {"train_loss": -27.628162384033203, "global_step": 530267, "epoch": 6388} {"train_loss": -27.352405548095703, "global_step": 530268, "epoch": 6388} {"train_loss": -27.081594467163086, "global_step": 530269, "epoch": 6388} {"train_loss": -26.79322624206543, "global_step": 530270, "epoch": 6388} {"train_loss": -27.024831771850586, "global_step": 530271, "epoch": 6388} {"train_loss": -27.971332550048828, "global_step": 530272, "epoch": 6388} {"train_loss": -27.567096710205078, "global_step": 530273, "epoch": 6388} {"train_loss": -27.236143112182617, "global_step": 530274, "epoch": 6388} {"train_loss": -27.4205322265625, "global_step": 530275, "epoch": 6388} {"train_loss": -27.919052124023438, "global_step": 530276, "epoch": 6388} {"train_loss": -27.450244903564453, "global_step": 530277, "epoch": 6388} {"train_loss": -27.597402572631836, "global_step": 530278, "epoch": 6388} {"train_loss": -27.621967315673828, "global_step": 530279, "epoch": 6388} {"train_loss": -27.7430477142334, "global_step": 530280, "epoch": 6388} {"train_loss": -27.37624168395996, "global_step": 530281, "epoch": 6388} {"train_loss": -27.60684585571289, "global_step": 530282, "epoch": 6388} {"train_loss": -27.699848175048828, "global_step": 530283, "epoch": 6388} {"train_loss": -27.7108097076416, "global_step": 530284, "epoch": 6388} {"train_loss": -27.92084312438965, "global_step": 530285, "epoch": 6388} {"train_loss": -27.464639571775873, "global_step": 530286, "epoch": 6388, "val_loss": 6548418.0} {"train_loss": -27.022619247436523, "global_step": 530287, "epoch": 6389} {"train_loss": -26.66717529296875, "global_step": 530288, "epoch": 6389} {"train_loss": -25.661609649658203, "global_step": 530289, "epoch": 6389} {"train_loss": -26.36829948425293, "global_step": 530290, "epoch": 6389} {"train_loss": -26.887451171875, "global_step": 530291, "epoch": 6389} {"train_loss": -26.659936904907227, "global_step": 530292, "epoch": 6389} {"train_loss": -27.57000732421875, "global_step": 530293, "epoch": 6389} {"train_loss": -26.500640869140625, "global_step": 530294, "epoch": 6389} {"train_loss": -27.275070190429688, "global_step": 530295, "epoch": 6389} {"train_loss": -26.909032821655273, "global_step": 530296, "epoch": 6389} {"train_loss": -27.122278213500977, "global_step": 530297, "epoch": 6389} {"train_loss": -27.04656410217285, "global_step": 530298, "epoch": 6389} {"train_loss": -27.012537002563477, "global_step": 530299, "epoch": 6389} {"train_loss": -27.1203556060791, "global_step": 530300, "epoch": 6389} {"train_loss": -27.43212890625, "global_step": 530301, "epoch": 6389} {"train_loss": -27.1419734954834, "global_step": 530302, "epoch": 6389} {"train_loss": -27.122913360595703, "global_step": 530303, "epoch": 6389} {"train_loss": -26.930206298828125, "global_step": 530304, "epoch": 6389} {"train_loss": -26.957263946533203, "global_step": 530305, "epoch": 6389} {"train_loss": -27.926227569580078, "global_step": 530306, "epoch": 6389} {"train_loss": -27.19780921936035, "global_step": 530307, "epoch": 6389} {"train_loss": -27.470630645751953, "global_step": 530308, "epoch": 6389} {"train_loss": -27.22853660583496, "global_step": 530309, "epoch": 6389} {"train_loss": -27.402679443359375, "global_step": 530310, "epoch": 6389} {"train_loss": -27.552978515625, "global_step": 530311, "epoch": 6389} {"train_loss": -27.450292587280273, "global_step": 530312, "epoch": 6389} {"train_loss": -27.29373550415039, "global_step": 530313, "epoch": 6389} {"train_loss": -27.359527587890625, "global_step": 530314, "epoch": 6389} {"train_loss": -27.77652359008789, "global_step": 530315, "epoch": 6389} {"train_loss": -27.363819122314453, "global_step": 530316, "epoch": 6389} {"train_loss": -27.368085861206055, "global_step": 530317, "epoch": 6389} {"train_loss": -27.619253158569336, "global_step": 530318, "epoch": 6389} {"train_loss": -27.664403915405273, "global_step": 530319, "epoch": 6389} {"train_loss": -27.826704025268555, "global_step": 530320, "epoch": 6389} {"train_loss": -27.12200355529785, "global_step": 530321, "epoch": 6389} {"train_loss": -27.3997859954834, "global_step": 530322, "epoch": 6389} {"train_loss": -27.26773452758789, "global_step": 530323, "epoch": 6389} {"train_loss": -27.48554801940918, "global_step": 530324, "epoch": 6389} {"train_loss": -27.76739501953125, "global_step": 530325, "epoch": 6389} {"train_loss": -27.781991958618164, "global_step": 530326, "epoch": 6389} {"train_loss": -27.510175704956055, "global_step": 530327, "epoch": 6389} {"train_loss": -27.766637802124023, "global_step": 530328, "epoch": 6389} {"train_loss": -27.883771896362305, "global_step": 530329, "epoch": 6389} {"train_loss": -27.654590606689453, "global_step": 530330, "epoch": 6389} {"train_loss": -27.439123153686523, "global_step": 530331, "epoch": 6389} {"train_loss": -27.675031661987305, "global_step": 530332, "epoch": 6389} {"train_loss": -27.879003524780273, "global_step": 530333, "epoch": 6389} {"train_loss": -27.539031982421875, "global_step": 530334, "epoch": 6389} {"train_loss": -27.2978458404541, "global_step": 530335, "epoch": 6389} {"train_loss": -27.314727783203125, "global_step": 530336, "epoch": 6389} {"train_loss": -27.4841251373291, "global_step": 530337, "epoch": 6389} {"train_loss": -28.002614974975586, "global_step": 530338, "epoch": 6389} {"train_loss": -27.788131713867188, "global_step": 530339, "epoch": 6389} {"train_loss": -27.5585994720459, "global_step": 530340, "epoch": 6389} {"train_loss": -27.74396324157715, "global_step": 530341, "epoch": 6389} {"train_loss": -27.69544792175293, "global_step": 530342, "epoch": 6389} {"train_loss": -27.622480392456055, "global_step": 530343, "epoch": 6389} {"train_loss": -27.628803253173828, "global_step": 530344, "epoch": 6389} {"train_loss": -27.913888931274414, "global_step": 530345, "epoch": 6389} {"train_loss": -27.832712173461914, "global_step": 530346, "epoch": 6389} {"train_loss": -27.148944854736328, "global_step": 530347, "epoch": 6389} {"train_loss": -27.75861930847168, "global_step": 530348, "epoch": 6389} {"train_loss": -27.812952041625977, "global_step": 530349, "epoch": 6389} {"train_loss": -28.162389755249023, "global_step": 530350, "epoch": 6389} {"train_loss": -27.665929794311523, "global_step": 530351, "epoch": 6389} {"train_loss": -27.52190589904785, "global_step": 530352, "epoch": 6389} {"train_loss": -27.438756942749023, "global_step": 530353, "epoch": 6389} {"train_loss": -27.750614166259766, "global_step": 530354, "epoch": 6389} {"train_loss": -27.27595329284668, "global_step": 530355, "epoch": 6389} {"train_loss": -27.435239791870117, "global_step": 530356, "epoch": 6389} {"train_loss": -27.891773223876953, "global_step": 530357, "epoch": 6389} {"train_loss": -27.49271583557129, "global_step": 530358, "epoch": 6389} {"train_loss": -27.44032859802246, "global_step": 530359, "epoch": 6389} {"train_loss": -27.753087997436523, "global_step": 530360, "epoch": 6389} {"train_loss": -28.33230972290039, "global_step": 530361, "epoch": 6389} {"train_loss": -27.584875106811523, "global_step": 530362, "epoch": 6389} {"train_loss": -27.843402862548828, "global_step": 530363, "epoch": 6389} {"train_loss": -27.792043685913086, "global_step": 530364, "epoch": 6389} {"train_loss": -27.534284591674805, "global_step": 530365, "epoch": 6389} {"train_loss": -27.48993492126465, "global_step": 530366, "epoch": 6389} {"train_loss": -27.88385581970215, "global_step": 530367, "epoch": 6389} {"train_loss": -27.51849937438965, "global_step": 530368, "epoch": 6389} {"train_loss": -27.454446470881084, "global_step": 530369, "epoch": 6389, "val_loss": 6689468.0} {"train_loss": -26.51324462890625, "global_step": 530370, "epoch": 6390} {"train_loss": -25.827167510986328, "global_step": 530371, "epoch": 6390} {"train_loss": -26.13343620300293, "global_step": 530372, "epoch": 6390} {"train_loss": -26.421728134155273, "global_step": 530373, "epoch": 6390} {"train_loss": -26.163537979125977, "global_step": 530374, "epoch": 6390} {"train_loss": -26.420063018798828, "global_step": 530375, "epoch": 6390} {"train_loss": -26.1147403717041, "global_step": 530376, "epoch": 6390} {"train_loss": -27.14605712890625, "global_step": 530377, "epoch": 6390} {"train_loss": -26.240835189819336, "global_step": 530378, "epoch": 6390} {"train_loss": -26.946426391601562, "global_step": 530379, "epoch": 6390} {"train_loss": -26.657154083251953, "global_step": 530380, "epoch": 6390} {"train_loss": -26.730152130126953, "global_step": 530381, "epoch": 6390} {"train_loss": -26.811573028564453, "global_step": 530382, "epoch": 6390} {"train_loss": -26.7119083404541, "global_step": 530383, "epoch": 6390} {"train_loss": -26.880950927734375, "global_step": 530384, "epoch": 6390} {"train_loss": -27.12885856628418, "global_step": 530385, "epoch": 6390} {"train_loss": -27.109695434570312, "global_step": 530386, "epoch": 6390} {"train_loss": -26.8139591217041, "global_step": 530387, "epoch": 6390} {"train_loss": -27.094745635986328, "global_step": 530388, "epoch": 6390} {"train_loss": -27.125598907470703, "global_step": 530389, "epoch": 6390} {"train_loss": -27.18381690979004, "global_step": 530390, "epoch": 6390} {"train_loss": -27.121231079101562, "global_step": 530391, "epoch": 6390} {"train_loss": -27.40009880065918, "global_step": 530392, "epoch": 6390} {"train_loss": -27.266620635986328, "global_step": 530393, "epoch": 6390} {"train_loss": -26.97258949279785, "global_step": 530394, "epoch": 6390} {"train_loss": -26.959033966064453, "global_step": 530395, "epoch": 6390} {"train_loss": -27.6862735748291, "global_step": 530396, "epoch": 6390} {"train_loss": -27.463638305664062, "global_step": 530397, "epoch": 6390} {"train_loss": -27.572952270507812, "global_step": 530398, "epoch": 6390} {"train_loss": -27.3847713470459, "global_step": 530399, "epoch": 6390} {"train_loss": -27.41646385192871, "global_step": 530400, "epoch": 6390} {"train_loss": -27.154417037963867, "global_step": 530401, "epoch": 6390} {"train_loss": -27.51279067993164, "global_step": 530402, "epoch": 6390} {"train_loss": -27.091754913330078, "global_step": 530403, "epoch": 6390} {"train_loss": -27.66315269470215, "global_step": 530404, "epoch": 6390} {"train_loss": -27.63918113708496, "global_step": 530405, "epoch": 6390} {"train_loss": -27.552417755126953, "global_step": 530406, "epoch": 6390} {"train_loss": -27.616804122924805, "global_step": 530407, "epoch": 6390} {"train_loss": -27.534290313720703, "global_step": 530408, "epoch": 6390} {"train_loss": -27.9635009765625, "global_step": 530409, "epoch": 6390} {"train_loss": -27.761316299438477, "global_step": 530410, "epoch": 6390} {"train_loss": -27.87862205505371, "global_step": 530411, "epoch": 6390} {"train_loss": -27.956323623657227, "global_step": 530412, "epoch": 6390} {"train_loss": -27.43691062927246, "global_step": 530413, "epoch": 6390} {"train_loss": -27.3604736328125, "global_step": 530414, "epoch": 6390} {"train_loss": -27.630374908447266, "global_step": 530415, "epoch": 6390} {"train_loss": -27.607065200805664, "global_step": 530416, "epoch": 6390} {"train_loss": -27.092731475830078, "global_step": 530417, "epoch": 6390} {"train_loss": -27.75274085998535, "global_step": 530418, "epoch": 6390} {"train_loss": -27.693790435791016, "global_step": 530419, "epoch": 6390} {"train_loss": -27.53240394592285, "global_step": 530420, "epoch": 6390} {"train_loss": -27.775135040283203, "global_step": 530421, "epoch": 6390} {"train_loss": -27.48723793029785, "global_step": 530422, "epoch": 6390} {"train_loss": -27.844263076782227, "global_step": 530423, "epoch": 6390} {"train_loss": -27.683197021484375, "global_step": 530424, "epoch": 6390} {"train_loss": -27.68732261657715, "global_step": 530425, "epoch": 6390} {"train_loss": -27.62330436706543, "global_step": 530426, "epoch": 6390} {"train_loss": -27.669687271118164, "global_step": 530427, "epoch": 6390} {"train_loss": -27.7147274017334, "global_step": 530428, "epoch": 6390} {"train_loss": -27.27659034729004, "global_step": 530429, "epoch": 6390} {"train_loss": -27.050947189331055, "global_step": 530430, "epoch": 6390} {"train_loss": -27.459211349487305, "global_step": 530431, "epoch": 6390} {"train_loss": -27.55280876159668, "global_step": 530432, "epoch": 6390} {"train_loss": -27.825620651245117, "global_step": 530433, "epoch": 6390} {"train_loss": -27.293445587158203, "global_step": 530434, "epoch": 6390} {"train_loss": -27.1391658782959, "global_step": 530435, "epoch": 6390} {"train_loss": -27.571775436401367, "global_step": 530436, "epoch": 6390} {"train_loss": -27.303909301757812, "global_step": 530437, "epoch": 6390} {"train_loss": -27.25327491760254, "global_step": 530438, "epoch": 6390} {"train_loss": -27.604429244995117, "global_step": 530439, "epoch": 6390} {"train_loss": -27.80535316467285, "global_step": 530440, "epoch": 6390} {"train_loss": -27.43048095703125, "global_step": 530441, "epoch": 6390} {"train_loss": -27.35086441040039, "global_step": 530442, "epoch": 6390} {"train_loss": -27.92889404296875, "global_step": 530443, "epoch": 6390} {"train_loss": -27.689224243164062, "global_step": 530444, "epoch": 6390} {"train_loss": -27.844955444335938, "global_step": 530445, "epoch": 6390} {"train_loss": -27.68976402282715, "global_step": 530446, "epoch": 6390} {"train_loss": -27.545124053955078, "global_step": 530447, "epoch": 6390} {"train_loss": -27.69679069519043, "global_step": 530448, "epoch": 6390} {"train_loss": -27.558399200439453, "global_step": 530449, "epoch": 6390} {"train_loss": -27.717178344726562, "global_step": 530450, "epoch": 6390} {"train_loss": -27.428632736206055, "global_step": 530451, "epoch": 6390} {"train_loss": -27.31100546595562, "global_step": 530452, "epoch": 6390, "val_loss": 6441046.0} {"train_loss": -26.30126953125, "global_step": 530453, "epoch": 6391} {"train_loss": -26.925474166870117, "global_step": 530454, "epoch": 6391} {"train_loss": -26.90157127380371, "global_step": 530455, "epoch": 6391} {"train_loss": -26.687515258789062, "global_step": 530456, "epoch": 6391} {"train_loss": -27.132665634155273, "global_step": 530457, "epoch": 6391} {"train_loss": -27.078638076782227, "global_step": 530458, "epoch": 6391} {"train_loss": -26.925739288330078, "global_step": 530459, "epoch": 6391} {"train_loss": -27.462560653686523, "global_step": 530460, "epoch": 6391} {"train_loss": -27.046293258666992, "global_step": 530461, "epoch": 6391} {"train_loss": -26.999845504760742, "global_step": 530462, "epoch": 6391} {"train_loss": -27.494962692260742, "global_step": 530463, "epoch": 6391} {"train_loss": -27.469526290893555, "global_step": 530464, "epoch": 6391} {"train_loss": -27.058252334594727, "global_step": 530465, "epoch": 6391} {"train_loss": -27.10027503967285, "global_step": 530466, "epoch": 6391} {"train_loss": -27.0938777923584, "global_step": 530467, "epoch": 6391} {"train_loss": -27.07806396484375, "global_step": 530468, "epoch": 6391} {"train_loss": -27.344497680664062, "global_step": 530469, "epoch": 6391} {"train_loss": -27.2485294342041, "global_step": 530470, "epoch": 6391} {"train_loss": -27.677640914916992, "global_step": 530471, "epoch": 6391} {"train_loss": -27.147247314453125, "global_step": 530472, "epoch": 6391} {"train_loss": -27.83859634399414, "global_step": 530473, "epoch": 6391} {"train_loss": -26.99675941467285, "global_step": 530474, "epoch": 6391} {"train_loss": -27.6127986907959, "global_step": 530475, "epoch": 6391} {"train_loss": -27.456159591674805, "global_step": 530476, "epoch": 6391} {"train_loss": -27.646636962890625, "global_step": 530477, "epoch": 6391} {"train_loss": -27.213865280151367, "global_step": 530478, "epoch": 6391} {"train_loss": -27.86935806274414, "global_step": 530479, "epoch": 6391} {"train_loss": -27.70709800720215, "global_step": 530480, "epoch": 6391} {"train_loss": -27.807636260986328, "global_step": 530481, "epoch": 6391} {"train_loss": -27.5194034576416, "global_step": 530482, "epoch": 6391} {"train_loss": -27.596485137939453, "global_step": 530483, "epoch": 6391} {"train_loss": -28.233198165893555, "global_step": 530484, "epoch": 6391} {"train_loss": -27.689008712768555, "global_step": 530485, "epoch": 6391} {"train_loss": -27.426074981689453, "global_step": 530486, "epoch": 6391} {"train_loss": -27.5145263671875, "global_step": 530487, "epoch": 6391} {"train_loss": -27.47809410095215, "global_step": 530488, "epoch": 6391} {"train_loss": -27.816532135009766, "global_step": 530489, "epoch": 6391} {"train_loss": -27.64310073852539, "global_step": 530490, "epoch": 6391} {"train_loss": -27.636083602905273, "global_step": 530491, "epoch": 6391} {"train_loss": -27.918476104736328, "global_step": 530492, "epoch": 6391} {"train_loss": -27.43276023864746, "global_step": 530493, "epoch": 6391} {"train_loss": -27.584238052368164, "global_step": 530494, "epoch": 6391} {"train_loss": -27.59596061706543, "global_step": 530495, "epoch": 6391} {"train_loss": -27.925939559936523, "global_step": 530496, "epoch": 6391} {"train_loss": -27.568944931030273, "global_step": 530497, "epoch": 6391} {"train_loss": -27.247241973876953, "global_step": 530498, "epoch": 6391} {"train_loss": -27.857908248901367, "global_step": 530499, "epoch": 6391} {"train_loss": -28.005231857299805, "global_step": 530500, "epoch": 6391} {"train_loss": -27.4815616607666, "global_step": 530501, "epoch": 6391} {"train_loss": -27.65143394470215, "global_step": 530502, "epoch": 6391} {"train_loss": -27.82159423828125, "global_step": 530503, "epoch": 6391} {"train_loss": -27.772491455078125, "global_step": 530504, "epoch": 6391} {"train_loss": -28.216901779174805, "global_step": 530505, "epoch": 6391} {"train_loss": -27.87653160095215, "global_step": 530506, "epoch": 6391} {"train_loss": -27.076309204101562, "global_step": 530507, "epoch": 6391} {"train_loss": -26.838031768798828, "global_step": 530508, "epoch": 6391} {"train_loss": -26.945646286010742, "global_step": 530509, "epoch": 6391} {"train_loss": -27.279586791992188, "global_step": 530510, "epoch": 6391} {"train_loss": -27.359277725219727, "global_step": 530511, "epoch": 6391} {"train_loss": -27.55018424987793, "global_step": 530512, "epoch": 6391} {"train_loss": -26.95704460144043, "global_step": 530513, "epoch": 6391} {"train_loss": -27.139158248901367, "global_step": 530514, "epoch": 6391} {"train_loss": -27.2213077545166, "global_step": 530515, "epoch": 6391} {"train_loss": -27.67205238342285, "global_step": 530516, "epoch": 6391} {"train_loss": -27.75489616394043, "global_step": 530517, "epoch": 6391} {"train_loss": -27.479700088500977, "global_step": 530518, "epoch": 6391} {"train_loss": -27.414113998413086, "global_step": 530519, "epoch": 6391} {"train_loss": -27.064680099487305, "global_step": 530520, "epoch": 6391} {"train_loss": -27.645557403564453, "global_step": 530521, "epoch": 6391} {"train_loss": -27.355731964111328, "global_step": 530522, "epoch": 6391} {"train_loss": -27.374591827392578, "global_step": 530523, "epoch": 6391} {"train_loss": -27.549158096313477, "global_step": 530524, "epoch": 6391} {"train_loss": -27.62546730041504, "global_step": 530525, "epoch": 6391} {"train_loss": -27.682910919189453, "global_step": 530526, "epoch": 6391} {"train_loss": -27.4372501373291, "global_step": 530527, "epoch": 6391} {"train_loss": -27.758804321289062, "global_step": 530528, "epoch": 6391} {"train_loss": -27.50046157836914, "global_step": 530529, "epoch": 6391} {"train_loss": -28.06951332092285, "global_step": 530530, "epoch": 6391} {"train_loss": -27.5222225189209, "global_step": 530531, "epoch": 6391} {"train_loss": -27.56485939025879, "global_step": 530532, "epoch": 6391} {"train_loss": -27.324481964111328, "global_step": 530533, "epoch": 6391} {"train_loss": -27.923730850219727, "global_step": 530534, "epoch": 6391} {"train_loss": -27.46395527023867, "global_step": 530535, "epoch": 6391, "val_loss": 6474308.0} {"train_loss": -26.771757125854492, "global_step": 530536, "epoch": 6392} {"train_loss": -27.502099990844727, "global_step": 530537, "epoch": 6392} {"train_loss": -26.982370376586914, "global_step": 530538, "epoch": 6392} {"train_loss": -27.266937255859375, "global_step": 530539, "epoch": 6392} {"train_loss": -27.334997177124023, "global_step": 530540, "epoch": 6392} {"train_loss": -27.072967529296875, "global_step": 530541, "epoch": 6392} {"train_loss": -26.755842208862305, "global_step": 530542, "epoch": 6392} {"train_loss": -27.13746452331543, "global_step": 530543, "epoch": 6392} {"train_loss": -27.464496612548828, "global_step": 530544, "epoch": 6392} {"train_loss": -27.38311195373535, "global_step": 530545, "epoch": 6392} {"train_loss": -27.10493278503418, "global_step": 530546, "epoch": 6392} {"train_loss": -27.0242977142334, "global_step": 530547, "epoch": 6392} {"train_loss": -27.5640811920166, "global_step": 530548, "epoch": 6392} {"train_loss": -27.373632431030273, "global_step": 530549, "epoch": 6392} {"train_loss": -27.47235679626465, "global_step": 530550, "epoch": 6392} {"train_loss": -27.5759220123291, "global_step": 530551, "epoch": 6392} {"train_loss": -27.347211837768555, "global_step": 530552, "epoch": 6392} {"train_loss": -27.848682403564453, "global_step": 530553, "epoch": 6392} {"train_loss": -27.093219757080078, "global_step": 530554, "epoch": 6392} {"train_loss": -27.094898223876953, "global_step": 530555, "epoch": 6392} {"train_loss": -27.593708038330078, "global_step": 530556, "epoch": 6392} {"train_loss": -27.650089263916016, "global_step": 530557, "epoch": 6392} {"train_loss": -27.568470001220703, "global_step": 530558, "epoch": 6392} {"train_loss": -27.404890060424805, "global_step": 530559, "epoch": 6392} {"train_loss": -27.34705924987793, "global_step": 530560, "epoch": 6392} {"train_loss": -27.5506591796875, "global_step": 530561, "epoch": 6392} {"train_loss": -27.91180419921875, "global_step": 530562, "epoch": 6392} {"train_loss": -27.320016860961914, "global_step": 530563, "epoch": 6392} {"train_loss": -27.318384170532227, "global_step": 530564, "epoch": 6392} {"train_loss": -27.9018497467041, "global_step": 530565, "epoch": 6392} {"train_loss": -27.514020919799805, "global_step": 530566, "epoch": 6392} {"train_loss": -27.408111572265625, "global_step": 530567, "epoch": 6392} {"train_loss": -27.548023223876953, "global_step": 530568, "epoch": 6392} {"train_loss": -27.555957794189453, "global_step": 530569, "epoch": 6392} {"train_loss": -27.514118194580078, "global_step": 530570, "epoch": 6392} {"train_loss": -27.180755615234375, "global_step": 530571, "epoch": 6392} {"train_loss": -27.260862350463867, "global_step": 530572, "epoch": 6392} {"train_loss": -28.02400779724121, "global_step": 530573, "epoch": 6392} {"train_loss": -27.82142448425293, "global_step": 530574, "epoch": 6392} {"train_loss": -27.549299240112305, "global_step": 530575, "epoch": 6392} {"train_loss": -27.34527587890625, "global_step": 530576, "epoch": 6392} {"train_loss": -27.58465003967285, "global_step": 530577, "epoch": 6392} {"train_loss": -27.53775405883789, "global_step": 530578, "epoch": 6392} {"train_loss": -28.095911026000977, "global_step": 530579, "epoch": 6392} {"train_loss": -27.657062530517578, "global_step": 530580, "epoch": 6392} {"train_loss": -27.61751365661621, "global_step": 530581, "epoch": 6392} {"train_loss": -27.162464141845703, "global_step": 530582, "epoch": 6392} {"train_loss": -27.336572647094727, "global_step": 530583, "epoch": 6392} {"train_loss": -27.580997467041016, "global_step": 530584, "epoch": 6392} {"train_loss": -27.471357345581055, "global_step": 530585, "epoch": 6392} {"train_loss": -27.752063751220703, "global_step": 530586, "epoch": 6392} {"train_loss": -27.21150779724121, "global_step": 530587, "epoch": 6392} {"train_loss": -27.675323486328125, "global_step": 530588, "epoch": 6392} {"train_loss": -27.678577423095703, "global_step": 530589, "epoch": 6392} {"train_loss": -27.755475997924805, "global_step": 530590, "epoch": 6392} {"train_loss": -27.4084529876709, "global_step": 530591, "epoch": 6392} {"train_loss": -27.483121871948242, "global_step": 530592, "epoch": 6392} {"train_loss": -27.69291114807129, "global_step": 530593, "epoch": 6392} {"train_loss": -27.463071823120117, "global_step": 530594, "epoch": 6392} {"train_loss": -27.646223068237305, "global_step": 530595, "epoch": 6392} {"train_loss": -27.57869529724121, "global_step": 530596, "epoch": 6392} {"train_loss": -28.049833297729492, "global_step": 530597, "epoch": 6392} {"train_loss": -27.51741600036621, "global_step": 530598, "epoch": 6392} {"train_loss": -27.504119873046875, "global_step": 530599, "epoch": 6392} {"train_loss": -28.1031551361084, "global_step": 530600, "epoch": 6392} {"train_loss": -27.99920654296875, "global_step": 530601, "epoch": 6392} {"train_loss": -28.049102783203125, "global_step": 530602, "epoch": 6392} {"train_loss": -28.067825317382812, "global_step": 530603, "epoch": 6392} {"train_loss": -27.65472984313965, "global_step": 530604, "epoch": 6392} {"train_loss": -27.730255126953125, "global_step": 530605, "epoch": 6392} {"train_loss": -27.62415885925293, "global_step": 530606, "epoch": 6392} {"train_loss": -27.76666831970215, "global_step": 530607, "epoch": 6392} {"train_loss": -27.843717575073242, "global_step": 530608, "epoch": 6392} {"train_loss": -27.732135772705078, "global_step": 530609, "epoch": 6392} {"train_loss": -27.671127319335938, "global_step": 530610, "epoch": 6392} {"train_loss": -27.389516830444336, "global_step": 530611, "epoch": 6392} {"train_loss": -27.39149284362793, "global_step": 530612, "epoch": 6392} {"train_loss": -27.735916137695312, "global_step": 530613, "epoch": 6392} {"train_loss": -27.461679458618164, "global_step": 530614, "epoch": 6392} {"train_loss": -27.844846725463867, "global_step": 530615, "epoch": 6392} {"train_loss": -27.82158851623535, "global_step": 530616, "epoch": 6392} {"train_loss": -27.910938262939453, "global_step": 530617, "epoch": 6392} {"train_loss": -27.528317692768145, "global_step": 530618, "epoch": 6392, "val_loss": 6494677.0} {"train_loss": -26.03900718688965, "global_step": 530619, "epoch": 6393} {"train_loss": -25.653573989868164, "global_step": 530620, "epoch": 6393} {"train_loss": -25.97471046447754, "global_step": 530621, "epoch": 6393} {"train_loss": -26.646631240844727, "global_step": 530622, "epoch": 6393} {"train_loss": -26.421466827392578, "global_step": 530623, "epoch": 6393} {"train_loss": -26.00029945373535, "global_step": 530624, "epoch": 6393} {"train_loss": -26.924087524414062, "global_step": 530625, "epoch": 6393} {"train_loss": -26.76102066040039, "global_step": 530626, "epoch": 6393} {"train_loss": -26.827316284179688, "global_step": 530627, "epoch": 6393} {"train_loss": -27.197240829467773, "global_step": 530628, "epoch": 6393} {"train_loss": -26.85576820373535, "global_step": 530629, "epoch": 6393} {"train_loss": -27.231550216674805, "global_step": 530630, "epoch": 6393} {"train_loss": -27.136091232299805, "global_step": 530631, "epoch": 6393} {"train_loss": -27.440946578979492, "global_step": 530632, "epoch": 6393} {"train_loss": -26.96044921875, "global_step": 530633, "epoch": 6393} {"train_loss": -26.89834976196289, "global_step": 530634, "epoch": 6393} {"train_loss": -27.077198028564453, "global_step": 530635, "epoch": 6393} {"train_loss": -27.16803550720215, "global_step": 530636, "epoch": 6393} {"train_loss": -26.836210250854492, "global_step": 530637, "epoch": 6393} {"train_loss": -26.87030029296875, "global_step": 530638, "epoch": 6393} {"train_loss": -27.640897750854492, "global_step": 530639, "epoch": 6393} {"train_loss": -27.046247482299805, "global_step": 530640, "epoch": 6393} {"train_loss": -27.226621627807617, "global_step": 530641, "epoch": 6393} {"train_loss": -27.276321411132812, "global_step": 530642, "epoch": 6393} {"train_loss": -27.50653076171875, "global_step": 530643, "epoch": 6393} {"train_loss": -26.99222183227539, "global_step": 530644, "epoch": 6393} {"train_loss": -26.95285987854004, "global_step": 530645, "epoch": 6393} {"train_loss": -27.347898483276367, "global_step": 530646, "epoch": 6393} {"train_loss": -27.460254669189453, "global_step": 530647, "epoch": 6393} {"train_loss": -27.547712326049805, "global_step": 530648, "epoch": 6393} {"train_loss": -27.67105484008789, "global_step": 530649, "epoch": 6393} {"train_loss": -27.384424209594727, "global_step": 530650, "epoch": 6393} {"train_loss": -27.583515167236328, "global_step": 530651, "epoch": 6393} {"train_loss": -27.564233779907227, "global_step": 530652, "epoch": 6393} {"train_loss": -27.757246017456055, "global_step": 530653, "epoch": 6393} {"train_loss": -27.97307777404785, "global_step": 530654, "epoch": 6393} {"train_loss": -27.618127822875977, "global_step": 530655, "epoch": 6393} {"train_loss": -27.409582138061523, "global_step": 530656, "epoch": 6393} {"train_loss": -27.797510147094727, "global_step": 530657, "epoch": 6393} {"train_loss": -27.326282501220703, "global_step": 530658, "epoch": 6393} {"train_loss": -27.923233032226562, "global_step": 530659, "epoch": 6393} {"train_loss": -27.715192794799805, "global_step": 530660, "epoch": 6393} {"train_loss": -27.442941665649414, "global_step": 530661, "epoch": 6393} {"train_loss": -27.637741088867188, "global_step": 530662, "epoch": 6393} {"train_loss": -27.84942054748535, "global_step": 530663, "epoch": 6393} {"train_loss": -27.840009689331055, "global_step": 530664, "epoch": 6393} {"train_loss": -28.152069091796875, "global_step": 530665, "epoch": 6393} {"train_loss": -27.73505210876465, "global_step": 530666, "epoch": 6393} {"train_loss": -27.617206573486328, "global_step": 530667, "epoch": 6393} {"train_loss": -27.740676879882812, "global_step": 530668, "epoch": 6393} {"train_loss": -27.803668975830078, "global_step": 530669, "epoch": 6393} {"train_loss": -27.75227165222168, "global_step": 530670, "epoch": 6393} {"train_loss": -27.690282821655273, "global_step": 530671, "epoch": 6393} {"train_loss": -28.1419677734375, "global_step": 530672, "epoch": 6393} {"train_loss": -28.04424476623535, "global_step": 530673, "epoch": 6393} {"train_loss": -28.155141830444336, "global_step": 530674, "epoch": 6393} {"train_loss": -27.513671875, "global_step": 530675, "epoch": 6393} {"train_loss": -28.170429229736328, "global_step": 530676, "epoch": 6393} {"train_loss": -27.7199764251709, "global_step": 530677, "epoch": 6393} {"train_loss": -27.96443748474121, "global_step": 530678, "epoch": 6393} {"train_loss": -27.98691749572754, "global_step": 530679, "epoch": 6393} {"train_loss": -27.567813873291016, "global_step": 530680, "epoch": 6393} {"train_loss": -27.570199966430664, "global_step": 530681, "epoch": 6393} {"train_loss": -27.48514747619629, "global_step": 530682, "epoch": 6393} {"train_loss": -27.340545654296875, "global_step": 530683, "epoch": 6393} {"train_loss": -27.802404403686523, "global_step": 530684, "epoch": 6393} {"train_loss": -27.617521286010742, "global_step": 530685, "epoch": 6393} {"train_loss": -27.266550064086914, "global_step": 530686, "epoch": 6393} {"train_loss": -27.41586685180664, "global_step": 530687, "epoch": 6393} {"train_loss": -27.75115394592285, "global_step": 530688, "epoch": 6393} {"train_loss": -27.53704833984375, "global_step": 530689, "epoch": 6393} {"train_loss": -27.208709716796875, "global_step": 530690, "epoch": 6393} {"train_loss": -27.744831085205078, "global_step": 530691, "epoch": 6393} {"train_loss": -27.381811141967773, "global_step": 530692, "epoch": 6393} {"train_loss": -27.491445541381836, "global_step": 530693, "epoch": 6393} {"train_loss": -27.504261016845703, "global_step": 530694, "epoch": 6393} {"train_loss": -27.65566062927246, "global_step": 530695, "epoch": 6393} {"train_loss": -27.1384334564209, "global_step": 530696, "epoch": 6393} {"train_loss": -27.701873779296875, "global_step": 530697, "epoch": 6393} {"train_loss": -27.561025619506836, "global_step": 530698, "epoch": 6393} {"train_loss": -27.609939575195312, "global_step": 530699, "epoch": 6393} {"train_loss": -27.806264877319336, "global_step": 530700, "epoch": 6393} {"train_loss": -27.376426880618176, "global_step": 530701, "epoch": 6393, "val_loss": 6518840.0} {"train_loss": -27.184850692749023, "global_step": 530702, "epoch": 6394} {"train_loss": -26.764392852783203, "global_step": 530703, "epoch": 6394} {"train_loss": -27.1043701171875, "global_step": 530704, "epoch": 6394} {"train_loss": -26.708328247070312, "global_step": 530705, "epoch": 6394} {"train_loss": -27.325651168823242, "global_step": 530706, "epoch": 6394} {"train_loss": -27.23004150390625, "global_step": 530707, "epoch": 6394} {"train_loss": -27.506637573242188, "global_step": 530708, "epoch": 6394} {"train_loss": -27.097620010375977, "global_step": 530709, "epoch": 6394} {"train_loss": -27.102697372436523, "global_step": 530710, "epoch": 6394} {"train_loss": -27.1724796295166, "global_step": 530711, "epoch": 6394} {"train_loss": -27.223886489868164, "global_step": 530712, "epoch": 6394} {"train_loss": -27.13959312438965, "global_step": 530713, "epoch": 6394} {"train_loss": -27.0698299407959, "global_step": 530714, "epoch": 6394} {"train_loss": -27.131805419921875, "global_step": 530715, "epoch": 6394} {"train_loss": -27.35389518737793, "global_step": 530716, "epoch": 6394} {"train_loss": -27.794219970703125, "global_step": 530717, "epoch": 6394} {"train_loss": -27.52644157409668, "global_step": 530718, "epoch": 6394} {"train_loss": -27.228046417236328, "global_step": 530719, "epoch": 6394} {"train_loss": -27.395299911499023, "global_step": 530720, "epoch": 6394} {"train_loss": -27.545703887939453, "global_step": 530721, "epoch": 6394} {"train_loss": -27.942474365234375, "global_step": 530722, "epoch": 6394} {"train_loss": -27.45819091796875, "global_step": 530723, "epoch": 6394} {"train_loss": -27.1135311126709, "global_step": 530724, "epoch": 6394} {"train_loss": -27.54022789001465, "global_step": 530725, "epoch": 6394} {"train_loss": -27.33147621154785, "global_step": 530726, "epoch": 6394} {"train_loss": -27.62379264831543, "global_step": 530727, "epoch": 6394} {"train_loss": -27.8513126373291, "global_step": 530728, "epoch": 6394} {"train_loss": -27.470006942749023, "global_step": 530729, "epoch": 6394} {"train_loss": -27.71396827697754, "global_step": 530730, "epoch": 6394} {"train_loss": -27.66973876953125, "global_step": 530731, "epoch": 6394} {"train_loss": -27.871341705322266, "global_step": 530732, "epoch": 6394} {"train_loss": -27.526626586914062, "global_step": 530733, "epoch": 6394} {"train_loss": -27.323993682861328, "global_step": 530734, "epoch": 6394} {"train_loss": -27.65701675415039, "global_step": 530735, "epoch": 6394} {"train_loss": -27.74679946899414, "global_step": 530736, "epoch": 6394} {"train_loss": -27.706928253173828, "global_step": 530737, "epoch": 6394} {"train_loss": -27.484634399414062, "global_step": 530738, "epoch": 6394} {"train_loss": -27.843109130859375, "global_step": 530739, "epoch": 6394} {"train_loss": -27.49702262878418, "global_step": 530740, "epoch": 6394} {"train_loss": -27.521554946899414, "global_step": 530741, "epoch": 6394} {"train_loss": -27.9964656829834, "global_step": 530742, "epoch": 6394} {"train_loss": -27.675525665283203, "global_step": 530743, "epoch": 6394} {"train_loss": -27.653949737548828, "global_step": 530744, "epoch": 6394} {"train_loss": -27.911956787109375, "global_step": 530745, "epoch": 6394} {"train_loss": -27.781641006469727, "global_step": 530746, "epoch": 6394} {"train_loss": -27.664337158203125, "global_step": 530747, "epoch": 6394} {"train_loss": -28.00886344909668, "global_step": 530748, "epoch": 6394} {"train_loss": -27.413854598999023, "global_step": 530749, "epoch": 6394} {"train_loss": -27.737329483032227, "global_step": 530750, "epoch": 6394} {"train_loss": -27.724912643432617, "global_step": 530751, "epoch": 6394} {"train_loss": -27.93929100036621, "global_step": 530752, "epoch": 6394} {"train_loss": -27.271072387695312, "global_step": 530753, "epoch": 6394} {"train_loss": -27.749265670776367, "global_step": 530754, "epoch": 6394} {"train_loss": -27.864459991455078, "global_step": 530755, "epoch": 6394} {"train_loss": -27.856298446655273, "global_step": 530756, "epoch": 6394} {"train_loss": -27.51178550720215, "global_step": 530757, "epoch": 6394} {"train_loss": -27.58245277404785, "global_step": 530758, "epoch": 6394} {"train_loss": -27.7773380279541, "global_step": 530759, "epoch": 6394} {"train_loss": -27.516759872436523, "global_step": 530760, "epoch": 6394} {"train_loss": -27.66983413696289, "global_step": 530761, "epoch": 6394} {"train_loss": -28.17595863342285, "global_step": 530762, "epoch": 6394} {"train_loss": -27.684309005737305, "global_step": 530763, "epoch": 6394} {"train_loss": -27.689178466796875, "global_step": 530764, "epoch": 6394} {"train_loss": -27.736480712890625, "global_step": 530765, "epoch": 6394} {"train_loss": -27.649539947509766, "global_step": 530766, "epoch": 6394} {"train_loss": -27.905902862548828, "global_step": 530767, "epoch": 6394} {"train_loss": -27.5599365234375, "global_step": 530768, "epoch": 6394} {"train_loss": -27.645893096923828, "global_step": 530769, "epoch": 6394} {"train_loss": -27.447452545166016, "global_step": 530770, "epoch": 6394} {"train_loss": -27.658313751220703, "global_step": 530771, "epoch": 6394} {"train_loss": -27.690671920776367, "global_step": 530772, "epoch": 6394} {"train_loss": -27.675922393798828, "global_step": 530773, "epoch": 6394} {"train_loss": -27.623138427734375, "global_step": 530774, "epoch": 6394} {"train_loss": -27.648263931274414, "global_step": 530775, "epoch": 6394} {"train_loss": -27.792367935180664, "global_step": 530776, "epoch": 6394} {"train_loss": -27.7364444732666, "global_step": 530777, "epoch": 6394} {"train_loss": -27.97956657409668, "global_step": 530778, "epoch": 6394} {"train_loss": -27.622425079345703, "global_step": 530779, "epoch": 6394} {"train_loss": -27.97370719909668, "global_step": 530780, "epoch": 6394} {"train_loss": -27.522674560546875, "global_step": 530781, "epoch": 6394} {"train_loss": -27.314971923828125, "global_step": 530782, "epoch": 6394} {"train_loss": -27.753101348876953, "global_step": 530783, "epoch": 6394} {"train_loss": -27.564780108899956, "global_step": 530784, "epoch": 6394, "val_loss": 6476960.5} {"train_loss": -26.736663818359375, "global_step": 530785, "epoch": 6395} {"train_loss": -26.185779571533203, "global_step": 530786, "epoch": 6395} {"train_loss": -26.369070053100586, "global_step": 530787, "epoch": 6395} {"train_loss": -27.271900177001953, "global_step": 530788, "epoch": 6395} {"train_loss": -26.210107803344727, "global_step": 530789, "epoch": 6395} {"train_loss": -26.380117416381836, "global_step": 530790, "epoch": 6395} {"train_loss": -26.460050582885742, "global_step": 530791, "epoch": 6395} {"train_loss": -26.278488159179688, "global_step": 530792, "epoch": 6395} {"train_loss": -26.966455459594727, "global_step": 530793, "epoch": 6395} {"train_loss": -26.432477951049805, "global_step": 530794, "epoch": 6395} {"train_loss": -26.90715980529785, "global_step": 530795, "epoch": 6395} {"train_loss": -26.497100830078125, "global_step": 530796, "epoch": 6395} {"train_loss": -26.847925186157227, "global_step": 530797, "epoch": 6395} {"train_loss": -27.072187423706055, "global_step": 530798, "epoch": 6395} {"train_loss": -26.3215389251709, "global_step": 530799, "epoch": 6395} {"train_loss": -26.973785400390625, "global_step": 530800, "epoch": 6395} {"train_loss": -26.996185302734375, "global_step": 530801, "epoch": 6395} {"train_loss": -27.24098014831543, "global_step": 530802, "epoch": 6395} {"train_loss": -27.2390193939209, "global_step": 530803, "epoch": 6395} {"train_loss": -26.79585075378418, "global_step": 530804, "epoch": 6395} {"train_loss": -27.26434326171875, "global_step": 530805, "epoch": 6395} {"train_loss": -26.986648559570312, "global_step": 530806, "epoch": 6395} {"train_loss": -27.31524658203125, "global_step": 530807, "epoch": 6395} {"train_loss": -27.245161056518555, "global_step": 530808, "epoch": 6395} {"train_loss": -27.305469512939453, "global_step": 530809, "epoch": 6395} {"train_loss": -27.42896842956543, "global_step": 530810, "epoch": 6395} {"train_loss": -27.249759674072266, "global_step": 530811, "epoch": 6395} {"train_loss": -26.99346351623535, "global_step": 530812, "epoch": 6395} {"train_loss": -27.537199020385742, "global_step": 530813, "epoch": 6395} {"train_loss": -27.21652603149414, "global_step": 530814, "epoch": 6395} {"train_loss": -27.47499656677246, "global_step": 530815, "epoch": 6395} {"train_loss": -27.51975440979004, "global_step": 530816, "epoch": 6395} {"train_loss": -27.3895263671875, "global_step": 530817, "epoch": 6395} {"train_loss": -27.53546142578125, "global_step": 530818, "epoch": 6395} {"train_loss": -27.499591827392578, "global_step": 530819, "epoch": 6395} {"train_loss": -27.64593505859375, "global_step": 530820, "epoch": 6395} {"train_loss": -27.723926544189453, "global_step": 530821, "epoch": 6395} {"train_loss": -27.799579620361328, "global_step": 530822, "epoch": 6395} {"train_loss": -27.638090133666992, "global_step": 530823, "epoch": 6395} {"train_loss": -27.625213623046875, "global_step": 530824, "epoch": 6395} {"train_loss": -27.780073165893555, "global_step": 530825, "epoch": 6395} {"train_loss": -27.74810791015625, "global_step": 530826, "epoch": 6395} {"train_loss": -27.56068992614746, "global_step": 530827, "epoch": 6395} {"train_loss": -27.96435546875, "global_step": 530828, "epoch": 6395} {"train_loss": -27.584278106689453, "global_step": 530829, "epoch": 6395} {"train_loss": -28.062353134155273, "global_step": 530830, "epoch": 6395} {"train_loss": -27.83782958984375, "global_step": 530831, "epoch": 6395} {"train_loss": -27.94744300842285, "global_step": 530832, "epoch": 6395} {"train_loss": -27.81624412536621, "global_step": 530833, "epoch": 6395} {"train_loss": -27.94540786743164, "global_step": 530834, "epoch": 6395} {"train_loss": -28.04024314880371, "global_step": 530835, "epoch": 6395} {"train_loss": -27.75836753845215, "global_step": 530836, "epoch": 6395} {"train_loss": -27.37113380432129, "global_step": 530837, "epoch": 6395} {"train_loss": -27.54937744140625, "global_step": 530838, "epoch": 6395} {"train_loss": -27.57942008972168, "global_step": 530839, "epoch": 6395} {"train_loss": -28.069793701171875, "global_step": 530840, "epoch": 6395} {"train_loss": -27.59712028503418, "global_step": 530841, "epoch": 6395} {"train_loss": -27.619558334350586, "global_step": 530842, "epoch": 6395} {"train_loss": -28.061246871948242, "global_step": 530843, "epoch": 6395} {"train_loss": -27.52569580078125, "global_step": 530844, "epoch": 6395} {"train_loss": -27.42510986328125, "global_step": 530845, "epoch": 6395} {"train_loss": -27.342065811157227, "global_step": 530846, "epoch": 6395} {"train_loss": -27.4029541015625, "global_step": 530847, "epoch": 6395} {"train_loss": -27.478208541870117, "global_step": 530848, "epoch": 6395} {"train_loss": -27.1301212310791, "global_step": 530849, "epoch": 6395} {"train_loss": -27.395038604736328, "global_step": 530850, "epoch": 6395} {"train_loss": -26.795846939086914, "global_step": 530851, "epoch": 6395} {"train_loss": -27.55293083190918, "global_step": 530852, "epoch": 6395} {"train_loss": -27.189367294311523, "global_step": 530853, "epoch": 6395} {"train_loss": -27.155054092407227, "global_step": 530854, "epoch": 6395} {"train_loss": -27.523883819580078, "global_step": 530855, "epoch": 6395} {"train_loss": -27.5062313079834, "global_step": 530856, "epoch": 6395} {"train_loss": -27.441457748413086, "global_step": 530857, "epoch": 6395} {"train_loss": -27.49928855895996, "global_step": 530858, "epoch": 6395} {"train_loss": -27.442731857299805, "global_step": 530859, "epoch": 6395} {"train_loss": -27.822580337524414, "global_step": 530860, "epoch": 6395} {"train_loss": -27.3026123046875, "global_step": 530861, "epoch": 6395} {"train_loss": -27.891103744506836, "global_step": 530862, "epoch": 6395} {"train_loss": -27.777896881103516, "global_step": 530863, "epoch": 6395} {"train_loss": -27.549962997436523, "global_step": 530864, "epoch": 6395} {"train_loss": -27.390710830688477, "global_step": 530865, "epoch": 6395} {"train_loss": -27.76325035095215, "global_step": 530866, "epoch": 6395} {"train_loss": -27.338079130793194, "global_step": 530867, "epoch": 6395, "val_loss": 6536693.0} {"train_loss": -27.330774307250977, "global_step": 530868, "epoch": 6396} {"train_loss": -26.645782470703125, "global_step": 530869, "epoch": 6396} {"train_loss": -26.136276245117188, "global_step": 530870, "epoch": 6396} {"train_loss": -25.52577018737793, "global_step": 530871, "epoch": 6396} {"train_loss": -25.716205596923828, "global_step": 530872, "epoch": 6396} {"train_loss": -27.048669815063477, "global_step": 530873, "epoch": 6396} {"train_loss": -26.933706283569336, "global_step": 530874, "epoch": 6396} {"train_loss": -26.669687271118164, "global_step": 530875, "epoch": 6396} {"train_loss": -27.20768165588379, "global_step": 530876, "epoch": 6396} {"train_loss": -26.900501251220703, "global_step": 530877, "epoch": 6396} {"train_loss": -27.013031005859375, "global_step": 530878, "epoch": 6396} {"train_loss": -27.2005558013916, "global_step": 530879, "epoch": 6396} {"train_loss": -27.08868408203125, "global_step": 530880, "epoch": 6396} {"train_loss": -27.055622100830078, "global_step": 530881, "epoch": 6396} {"train_loss": -26.960779190063477, "global_step": 530882, "epoch": 6396} {"train_loss": -27.613677978515625, "global_step": 530883, "epoch": 6396} {"train_loss": -27.341140747070312, "global_step": 530884, "epoch": 6396} {"train_loss": -27.629072189331055, "global_step": 530885, "epoch": 6396} {"train_loss": -27.477802276611328, "global_step": 530886, "epoch": 6396} {"train_loss": -27.427978515625, "global_step": 530887, "epoch": 6396} {"train_loss": -27.515705108642578, "global_step": 530888, "epoch": 6396} {"train_loss": -27.418554306030273, "global_step": 530889, "epoch": 6396} {"train_loss": -27.326501846313477, "global_step": 530890, "epoch": 6396} {"train_loss": -27.444700241088867, "global_step": 530891, "epoch": 6396} {"train_loss": -27.812238693237305, "global_step": 530892, "epoch": 6396} {"train_loss": -27.611845016479492, "global_step": 530893, "epoch": 6396} {"train_loss": -27.473962783813477, "global_step": 530894, "epoch": 6396} {"train_loss": -27.690580368041992, "global_step": 530895, "epoch": 6396} {"train_loss": -27.632110595703125, "global_step": 530896, "epoch": 6396} {"train_loss": -28.164899826049805, "global_step": 530897, "epoch": 6396} {"train_loss": -27.671659469604492, "global_step": 530898, "epoch": 6396} {"train_loss": -27.49973487854004, "global_step": 530899, "epoch": 6396} {"train_loss": -27.779647827148438, "global_step": 530900, "epoch": 6396} {"train_loss": -27.83394432067871, "global_step": 530901, "epoch": 6396} {"train_loss": -27.588428497314453, "global_step": 530902, "epoch": 6396} {"train_loss": -28.153085708618164, "global_step": 530903, "epoch": 6396} {"train_loss": -27.892318725585938, "global_step": 530904, "epoch": 6396} {"train_loss": -27.717985153198242, "global_step": 530905, "epoch": 6396} {"train_loss": -27.2619571685791, "global_step": 530906, "epoch": 6396} {"train_loss": -27.64653968811035, "global_step": 530907, "epoch": 6396} {"train_loss": -27.5148983001709, "global_step": 530908, "epoch": 6396} {"train_loss": -28.20936393737793, "global_step": 530909, "epoch": 6396} {"train_loss": -27.84650993347168, "global_step": 530910, "epoch": 6396} {"train_loss": -27.462554931640625, "global_step": 530911, "epoch": 6396} {"train_loss": -27.66985511779785, "global_step": 530912, "epoch": 6396} {"train_loss": -27.573740005493164, "global_step": 530913, "epoch": 6396} {"train_loss": -27.182477951049805, "global_step": 530914, "epoch": 6396} {"train_loss": -27.96510887145996, "global_step": 530915, "epoch": 6396} {"train_loss": -27.334735870361328, "global_step": 530916, "epoch": 6396} {"train_loss": -27.683393478393555, "global_step": 530917, "epoch": 6396} {"train_loss": -27.542341232299805, "global_step": 530918, "epoch": 6396} {"train_loss": -27.60198974609375, "global_step": 530919, "epoch": 6396} {"train_loss": -27.248950958251953, "global_step": 530920, "epoch": 6396} {"train_loss": -27.473346710205078, "global_step": 530921, "epoch": 6396} {"train_loss": -27.82988929748535, "global_step": 530922, "epoch": 6396} {"train_loss": -27.603485107421875, "global_step": 530923, "epoch": 6396} {"train_loss": -27.5128231048584, "global_step": 530924, "epoch": 6396} {"train_loss": -27.739225387573242, "global_step": 530925, "epoch": 6396} {"train_loss": -27.50807762145996, "global_step": 530926, "epoch": 6396} {"train_loss": -27.966266632080078, "global_step": 530927, "epoch": 6396} {"train_loss": -27.58403968811035, "global_step": 530928, "epoch": 6396} {"train_loss": -27.50604248046875, "global_step": 530929, "epoch": 6396} {"train_loss": -27.580259323120117, "global_step": 530930, "epoch": 6396} {"train_loss": -27.7058162689209, "global_step": 530931, "epoch": 6396} {"train_loss": -27.283187866210938, "global_step": 530932, "epoch": 6396} {"train_loss": -27.44378662109375, "global_step": 530933, "epoch": 6396} {"train_loss": -28.025836944580078, "global_step": 530934, "epoch": 6396} {"train_loss": -27.9190616607666, "global_step": 530935, "epoch": 6396} {"train_loss": -27.596433639526367, "global_step": 530936, "epoch": 6396} {"train_loss": -27.84865379333496, "global_step": 530937, "epoch": 6396} {"train_loss": -27.839160919189453, "global_step": 530938, "epoch": 6396} {"train_loss": -27.79615592956543, "global_step": 530939, "epoch": 6396} {"train_loss": -28.181686401367188, "global_step": 530940, "epoch": 6396} {"train_loss": -28.133350372314453, "global_step": 530941, "epoch": 6396} {"train_loss": -27.61440086364746, "global_step": 530942, "epoch": 6396} {"train_loss": -27.904455184936523, "global_step": 530943, "epoch": 6396} {"train_loss": -27.80328369140625, "global_step": 530944, "epoch": 6396} {"train_loss": -27.921070098876953, "global_step": 530945, "epoch": 6396} {"train_loss": -27.925519943237305, "global_step": 530946, "epoch": 6396} {"train_loss": -27.682653427124023, "global_step": 530947, "epoch": 6396} {"train_loss": -27.66986656188965, "global_step": 530948, "epoch": 6396} {"train_loss": -27.69780921936035, "global_step": 530949, "epoch": 6396} {"train_loss": -27.508322658309016, "global_step": 530950, "epoch": 6396, "val_loss": 6440882.0} {"train_loss": -25.937881469726562, "global_step": 530951, "epoch": 6397} {"train_loss": -25.741336822509766, "global_step": 530952, "epoch": 6397} {"train_loss": -26.376386642456055, "global_step": 530953, "epoch": 6397} {"train_loss": -26.952863693237305, "global_step": 530954, "epoch": 6397} {"train_loss": -26.546070098876953, "global_step": 530955, "epoch": 6397} {"train_loss": -26.037328720092773, "global_step": 530956, "epoch": 6397} {"train_loss": -27.355411529541016, "global_step": 530957, "epoch": 6397} {"train_loss": -26.2384090423584, "global_step": 530958, "epoch": 6397} {"train_loss": -26.8099422454834, "global_step": 530959, "epoch": 6397} {"train_loss": -26.800739288330078, "global_step": 530960, "epoch": 6397} {"train_loss": -27.15406608581543, "global_step": 530961, "epoch": 6397} {"train_loss": -26.840229034423828, "global_step": 530962, "epoch": 6397} {"train_loss": -27.1707763671875, "global_step": 530963, "epoch": 6397} {"train_loss": -27.32903480529785, "global_step": 530964, "epoch": 6397} {"train_loss": -27.13362693786621, "global_step": 530965, "epoch": 6397} {"train_loss": -27.41814613342285, "global_step": 530966, "epoch": 6397} {"train_loss": -27.665246963500977, "global_step": 530967, "epoch": 6397} {"train_loss": -27.120656967163086, "global_step": 530968, "epoch": 6397} {"train_loss": -27.66448974609375, "global_step": 530969, "epoch": 6397} {"train_loss": -27.23520278930664, "global_step": 530970, "epoch": 6397} {"train_loss": -27.395679473876953, "global_step": 530971, "epoch": 6397} {"train_loss": -27.536697387695312, "global_step": 530972, "epoch": 6397} {"train_loss": -27.415449142456055, "global_step": 530973, "epoch": 6397} {"train_loss": -27.473175048828125, "global_step": 530974, "epoch": 6397} {"train_loss": -27.354434967041016, "global_step": 530975, "epoch": 6397} {"train_loss": -27.448028564453125, "global_step": 530976, "epoch": 6397} {"train_loss": -27.361318588256836, "global_step": 530977, "epoch": 6397} {"train_loss": -27.530393600463867, "global_step": 530978, "epoch": 6397} {"train_loss": -27.440093994140625, "global_step": 530979, "epoch": 6397} {"train_loss": -27.480457305908203, "global_step": 530980, "epoch": 6397} {"train_loss": -27.626361846923828, "global_step": 530981, "epoch": 6397} {"train_loss": -27.951496124267578, "global_step": 530982, "epoch": 6397} {"train_loss": -27.877561569213867, "global_step": 530983, "epoch": 6397} {"train_loss": -27.57891845703125, "global_step": 530984, "epoch": 6397} {"train_loss": -27.76136589050293, "global_step": 530985, "epoch": 6397} {"train_loss": -27.89637565612793, "global_step": 530986, "epoch": 6397} {"train_loss": -27.82793617248535, "global_step": 530987, "epoch": 6397} {"train_loss": -27.355066299438477, "global_step": 530988, "epoch": 6397} {"train_loss": -28.044599533081055, "global_step": 530989, "epoch": 6397} {"train_loss": -27.2076416015625, "global_step": 530990, "epoch": 6397} {"train_loss": -27.78413200378418, "global_step": 530991, "epoch": 6397} {"train_loss": -27.822187423706055, "global_step": 530992, "epoch": 6397} {"train_loss": -27.86014747619629, "global_step": 530993, "epoch": 6397} {"train_loss": -28.16131591796875, "global_step": 530994, "epoch": 6397} {"train_loss": -27.833608627319336, "global_step": 530995, "epoch": 6397} {"train_loss": -27.556760787963867, "global_step": 530996, "epoch": 6397} {"train_loss": -27.36968421936035, "global_step": 530997, "epoch": 6397} {"train_loss": -27.773223876953125, "global_step": 530998, "epoch": 6397} {"train_loss": -28.02119255065918, "global_step": 530999, "epoch": 6397} {"train_loss": -27.813817977905273, "global_step": 531000, "epoch": 6397} {"train_loss": -27.563983917236328, "global_step": 531001, "epoch": 6397} {"train_loss": -27.51724624633789, "global_step": 531002, "epoch": 6397} {"train_loss": -27.597318649291992, "global_step": 531003, "epoch": 6397} {"train_loss": -27.836023330688477, "global_step": 531004, "epoch": 6397} {"train_loss": -27.89898109436035, "global_step": 531005, "epoch": 6397} {"train_loss": -28.071577072143555, "global_step": 531006, "epoch": 6397} {"train_loss": -27.8807373046875, "global_step": 531007, "epoch": 6397} {"train_loss": -27.591827392578125, "global_step": 531008, "epoch": 6397} {"train_loss": -27.733245849609375, "global_step": 531009, "epoch": 6397} {"train_loss": -27.864749908447266, "global_step": 531010, "epoch": 6397} {"train_loss": -27.707080841064453, "global_step": 531011, "epoch": 6397} {"train_loss": -27.59136390686035, "global_step": 531012, "epoch": 6397} {"train_loss": -27.709930419921875, "global_step": 531013, "epoch": 6397} {"train_loss": -28.375944137573242, "global_step": 531014, "epoch": 6397} {"train_loss": -27.775650024414062, "global_step": 531015, "epoch": 6397} {"train_loss": -27.84457778930664, "global_step": 531016, "epoch": 6397} {"train_loss": -27.632709503173828, "global_step": 531017, "epoch": 6397} {"train_loss": -27.590490341186523, "global_step": 531018, "epoch": 6397} {"train_loss": -26.681427001953125, "global_step": 531019, "epoch": 6397} {"train_loss": -25.90919303894043, "global_step": 531020, "epoch": 6397} {"train_loss": -23.56658935546875, "global_step": 531021, "epoch": 6397} {"train_loss": -24.058246612548828, "global_step": 531022, "epoch": 6397} {"train_loss": -26.850976943969727, "global_step": 531023, "epoch": 6397} {"train_loss": -26.61891746520996, "global_step": 531024, "epoch": 6397} {"train_loss": -26.881467819213867, "global_step": 531025, "epoch": 6397} {"train_loss": -26.338422775268555, "global_step": 531026, "epoch": 6397} {"train_loss": -27.046384811401367, "global_step": 531027, "epoch": 6397} {"train_loss": -26.569650650024414, "global_step": 531028, "epoch": 6397} {"train_loss": -26.577863693237305, "global_step": 531029, "epoch": 6397} {"train_loss": -26.912139892578125, "global_step": 531030, "epoch": 6397} {"train_loss": -27.157840728759766, "global_step": 531031, "epoch": 6397} {"train_loss": -26.809127807617188, "global_step": 531032, "epoch": 6397} {"train_loss": -27.253193751875177, "global_step": 531033, "epoch": 6397, "val_loss": 6575044.5} {"train_loss": -25.788818359375, "global_step": 531034, "epoch": 6398} {"train_loss": -26.251663208007812, "global_step": 531035, "epoch": 6398} {"train_loss": -26.246862411499023, "global_step": 531036, "epoch": 6398} {"train_loss": -26.235488891601562, "global_step": 531037, "epoch": 6398} {"train_loss": -26.17914390563965, "global_step": 531038, "epoch": 6398} {"train_loss": -26.340198516845703, "global_step": 531039, "epoch": 6398} {"train_loss": -26.643798828125, "global_step": 531040, "epoch": 6398} {"train_loss": -26.701711654663086, "global_step": 531041, "epoch": 6398} {"train_loss": -26.44634437561035, "global_step": 531042, "epoch": 6398} {"train_loss": -26.397830963134766, "global_step": 531043, "epoch": 6398} {"train_loss": -26.66141128540039, "global_step": 531044, "epoch": 6398} {"train_loss": -26.8852481842041, "global_step": 531045, "epoch": 6398} {"train_loss": -26.932172775268555, "global_step": 531046, "epoch": 6398} {"train_loss": -26.603565216064453, "global_step": 531047, "epoch": 6398} {"train_loss": -26.756311416625977, "global_step": 531048, "epoch": 6398} {"train_loss": -27.075170516967773, "global_step": 531049, "epoch": 6398} {"train_loss": -26.71296501159668, "global_step": 531050, "epoch": 6398} {"train_loss": -26.89934730529785, "global_step": 531051, "epoch": 6398} {"train_loss": -26.865802764892578, "global_step": 531052, "epoch": 6398} {"train_loss": -26.977819442749023, "global_step": 531053, "epoch": 6398} {"train_loss": -27.129657745361328, "global_step": 531054, "epoch": 6398} {"train_loss": -27.10516357421875, "global_step": 531055, "epoch": 6398} {"train_loss": -26.842702865600586, "global_step": 531056, "epoch": 6398} {"train_loss": -27.101825714111328, "global_step": 531057, "epoch": 6398} {"train_loss": -26.90675163269043, "global_step": 531058, "epoch": 6398} {"train_loss": -27.167531967163086, "global_step": 531059, "epoch": 6398} {"train_loss": -26.94365882873535, "global_step": 531060, "epoch": 6398} {"train_loss": -27.01456069946289, "global_step": 531061, "epoch": 6398} {"train_loss": -27.697784423828125, "global_step": 531062, "epoch": 6398} {"train_loss": -27.370010375976562, "global_step": 531063, "epoch": 6398} {"train_loss": -27.612558364868164, "global_step": 531064, "epoch": 6398} {"train_loss": -27.415130615234375, "global_step": 531065, "epoch": 6398} {"train_loss": -27.505481719970703, "global_step": 531066, "epoch": 6398} {"train_loss": -27.550384521484375, "global_step": 531067, "epoch": 6398} {"train_loss": -27.41426658630371, "global_step": 531068, "epoch": 6398} {"train_loss": -27.554794311523438, "global_step": 531069, "epoch": 6398} {"train_loss": -27.755828857421875, "global_step": 531070, "epoch": 6398} {"train_loss": -27.626678466796875, "global_step": 531071, "epoch": 6398} {"train_loss": -27.80866050720215, "global_step": 531072, "epoch": 6398} {"train_loss": -27.791748046875, "global_step": 531073, "epoch": 6398} {"train_loss": -27.646081924438477, "global_step": 531074, "epoch": 6398} {"train_loss": -27.486770629882812, "global_step": 531075, "epoch": 6398} {"train_loss": -27.764373779296875, "global_step": 531076, "epoch": 6398} {"train_loss": -28.024612426757812, "global_step": 531077, "epoch": 6398} {"train_loss": -27.425649642944336, "global_step": 531078, "epoch": 6398} {"train_loss": -27.3325252532959, "global_step": 531079, "epoch": 6398} {"train_loss": -27.923080444335938, "global_step": 531080, "epoch": 6398} {"train_loss": -27.430347442626953, "global_step": 531081, "epoch": 6398} {"train_loss": -27.967798233032227, "global_step": 531082, "epoch": 6398} {"train_loss": -27.559301376342773, "global_step": 531083, "epoch": 6398} {"train_loss": -27.623416900634766, "global_step": 531084, "epoch": 6398} {"train_loss": -27.4890079498291, "global_step": 531085, "epoch": 6398} {"train_loss": -27.556232452392578, "global_step": 531086, "epoch": 6398} {"train_loss": -27.897220611572266, "global_step": 531087, "epoch": 6398} {"train_loss": -27.6123104095459, "global_step": 531088, "epoch": 6398} {"train_loss": -27.398529052734375, "global_step": 531089, "epoch": 6398} {"train_loss": -27.3426456451416, "global_step": 531090, "epoch": 6398} {"train_loss": -27.965543746948242, "global_step": 531091, "epoch": 6398} {"train_loss": -27.457258224487305, "global_step": 531092, "epoch": 6398} {"train_loss": -27.36065673828125, "global_step": 531093, "epoch": 6398} {"train_loss": -27.829360961914062, "global_step": 531094, "epoch": 6398} {"train_loss": -27.663320541381836, "global_step": 531095, "epoch": 6398} {"train_loss": -28.015424728393555, "global_step": 531096, "epoch": 6398} {"train_loss": -27.405187606811523, "global_step": 531097, "epoch": 6398} {"train_loss": -27.32877540588379, "global_step": 531098, "epoch": 6398} {"train_loss": -27.33746337890625, "global_step": 531099, "epoch": 6398} {"train_loss": -27.5007381439209, "global_step": 531100, "epoch": 6398} {"train_loss": -27.405099868774414, "global_step": 531101, "epoch": 6398} {"train_loss": -27.328617095947266, "global_step": 531102, "epoch": 6398} {"train_loss": -27.878332138061523, "global_step": 531103, "epoch": 6398} {"train_loss": -27.38309669494629, "global_step": 531104, "epoch": 6398} {"train_loss": -27.658899307250977, "global_step": 531105, "epoch": 6398} {"train_loss": -27.63962745666504, "global_step": 531106, "epoch": 6398} {"train_loss": -28.32566261291504, "global_step": 531107, "epoch": 6398} {"train_loss": -27.55555534362793, "global_step": 531108, "epoch": 6398} {"train_loss": -27.71392822265625, "global_step": 531109, "epoch": 6398} {"train_loss": -27.780988693237305, "global_step": 531110, "epoch": 6398} {"train_loss": -27.6018123626709, "global_step": 531111, "epoch": 6398} {"train_loss": -27.521987915039062, "global_step": 531112, "epoch": 6398} {"train_loss": -27.697265625, "global_step": 531113, "epoch": 6398} {"train_loss": -27.703933715820312, "global_step": 531114, "epoch": 6398} {"train_loss": -27.60225486755371, "global_step": 531115, "epoch": 6398} {"train_loss": -27.30883715526167, "global_step": 531116, "epoch": 6398, "val_loss": 6456475.0} {"train_loss": -27.5479793548584, "global_step": 531117, "epoch": 6399} {"train_loss": -27.520002365112305, "global_step": 531118, "epoch": 6399} {"train_loss": -27.45267677307129, "global_step": 531119, "epoch": 6399} {"train_loss": -27.306604385375977, "global_step": 531120, "epoch": 6399} {"train_loss": -27.273767471313477, "global_step": 531121, "epoch": 6399} {"train_loss": -27.7484188079834, "global_step": 531122, "epoch": 6399} {"train_loss": -27.5352725982666, "global_step": 531123, "epoch": 6399} {"train_loss": -27.462873458862305, "global_step": 531124, "epoch": 6399} {"train_loss": -27.576574325561523, "global_step": 531125, "epoch": 6399} {"train_loss": -27.483783721923828, "global_step": 531126, "epoch": 6399} {"train_loss": -27.406362533569336, "global_step": 531127, "epoch": 6399} {"train_loss": -27.740142822265625, "global_step": 531128, "epoch": 6399} {"train_loss": -27.706573486328125, "global_step": 531129, "epoch": 6399} {"train_loss": -27.54530906677246, "global_step": 531130, "epoch": 6399} {"train_loss": -27.2485408782959, "global_step": 531131, "epoch": 6399} {"train_loss": -27.22730827331543, "global_step": 531132, "epoch": 6399} {"train_loss": -27.160490036010742, "global_step": 531133, "epoch": 6399} {"train_loss": -27.815811157226562, "global_step": 531134, "epoch": 6399} {"train_loss": -27.806751251220703, "global_step": 531135, "epoch": 6399} {"train_loss": -27.75054931640625, "global_step": 531136, "epoch": 6399} {"train_loss": -27.494647979736328, "global_step": 531137, "epoch": 6399} {"train_loss": -27.781513214111328, "global_step": 531138, "epoch": 6399} {"train_loss": -27.181568145751953, "global_step": 531139, "epoch": 6399} {"train_loss": -27.525983810424805, "global_step": 531140, "epoch": 6399} {"train_loss": -27.65338706970215, "global_step": 531141, "epoch": 6399} {"train_loss": -27.36094093322754, "global_step": 531142, "epoch": 6399} {"train_loss": -27.293659210205078, "global_step": 531143, "epoch": 6399} {"train_loss": -27.475540161132812, "global_step": 531144, "epoch": 6399} {"train_loss": -27.258026123046875, "global_step": 531145, "epoch": 6399} {"train_loss": -27.573150634765625, "global_step": 531146, "epoch": 6399} {"train_loss": -27.533349990844727, "global_step": 531147, "epoch": 6399} {"train_loss": -27.529132843017578, "global_step": 531148, "epoch": 6399} {"train_loss": -27.923664093017578, "global_step": 531149, "epoch": 6399} {"train_loss": -27.71502685546875, "global_step": 531150, "epoch": 6399} {"train_loss": -27.61237907409668, "global_step": 531151, "epoch": 6399} {"train_loss": -27.81476402282715, "global_step": 531152, "epoch": 6399} {"train_loss": -27.910114288330078, "global_step": 531153, "epoch": 6399} {"train_loss": -27.6001033782959, "global_step": 531154, "epoch": 6399} {"train_loss": -27.248743057250977, "global_step": 531155, "epoch": 6399} {"train_loss": -27.7460880279541, "global_step": 531156, "epoch": 6399} {"train_loss": -27.6978702545166, "global_step": 531157, "epoch": 6399} {"train_loss": -27.55033302307129, "global_step": 531158, "epoch": 6399} {"train_loss": -28.09902000427246, "global_step": 531159, "epoch": 6399} {"train_loss": -27.8178653717041, "global_step": 531160, "epoch": 6399} {"train_loss": -27.756305694580078, "global_step": 531161, "epoch": 6399} {"train_loss": -27.521350860595703, "global_step": 531162, "epoch": 6399} {"train_loss": -27.533334732055664, "global_step": 531163, "epoch": 6399} {"train_loss": -27.896244049072266, "global_step": 531164, "epoch": 6399} {"train_loss": -27.927648544311523, "global_step": 531165, "epoch": 6399} {"train_loss": -27.766387939453125, "global_step": 531166, "epoch": 6399} {"train_loss": -27.688974380493164, "global_step": 531167, "epoch": 6399} {"train_loss": -27.665485382080078, "global_step": 531168, "epoch": 6399} {"train_loss": -27.754932403564453, "global_step": 531169, "epoch": 6399} {"train_loss": -27.739246368408203, "global_step": 531170, "epoch": 6399} {"train_loss": -27.815439224243164, "global_step": 531171, "epoch": 6399} {"train_loss": -27.526508331298828, "global_step": 531172, "epoch": 6399} {"train_loss": -27.658050537109375, "global_step": 531173, "epoch": 6399} {"train_loss": -27.80082130432129, "global_step": 531174, "epoch": 6399} {"train_loss": -27.552255630493164, "global_step": 531175, "epoch": 6399} {"train_loss": -27.901691436767578, "global_step": 531176, "epoch": 6399} {"train_loss": -27.893146514892578, "global_step": 531177, "epoch": 6399} {"train_loss": -27.568470001220703, "global_step": 531178, "epoch": 6399} {"train_loss": -27.60782241821289, "global_step": 531179, "epoch": 6399} {"train_loss": -27.633630752563477, "global_step": 531180, "epoch": 6399} {"train_loss": -27.52179527282715, "global_step": 531181, "epoch": 6399} {"train_loss": -27.85615348815918, "global_step": 531182, "epoch": 6399} {"train_loss": -28.098264694213867, "global_step": 531183, "epoch": 6399} {"train_loss": -27.573888778686523, "global_step": 531184, "epoch": 6399} {"train_loss": -27.814468383789062, "global_step": 531185, "epoch": 6399} {"train_loss": -27.6857967376709, "global_step": 531186, "epoch": 6399} {"train_loss": -27.778717041015625, "global_step": 531187, "epoch": 6399} {"train_loss": -27.828048706054688, "global_step": 531188, "epoch": 6399} {"train_loss": -27.818714141845703, "global_step": 531189, "epoch": 6399} {"train_loss": -27.74915885925293, "global_step": 531190, "epoch": 6399} {"train_loss": -27.865224838256836, "global_step": 531191, "epoch": 6399} {"train_loss": -27.517744064331055, "global_step": 531192, "epoch": 6399} {"train_loss": -27.716516494750977, "global_step": 531193, "epoch": 6399} {"train_loss": -27.817890167236328, "global_step": 531194, "epoch": 6399} {"train_loss": -27.64971923828125, "global_step": 531195, "epoch": 6399} {"train_loss": -27.452054977416992, "global_step": 531196, "epoch": 6399} {"train_loss": -27.0888614654541, "global_step": 531197, "epoch": 6399} {"train_loss": -26.766559600830078, "global_step": 531198, "epoch": 6399} {"train_loss": -27.604816115046123, "global_step": 531199, "epoch": 6399, "val_loss": 6420042.0} {"train_loss": -26.4075870513916, "global_step": 531200, "epoch": 6400} {"train_loss": -26.271148681640625, "global_step": 531201, "epoch": 6400} {"train_loss": -26.425424575805664, "global_step": 531202, "epoch": 6400} {"train_loss": -26.443628311157227, "global_step": 531203, "epoch": 6400} {"train_loss": -26.565689086914062, "global_step": 531204, "epoch": 6400} {"train_loss": -26.780027389526367, "global_step": 531205, "epoch": 6400} {"train_loss": -26.828125, "global_step": 531206, "epoch": 6400} {"train_loss": -26.63203239440918, "global_step": 531207, "epoch": 6400} {"train_loss": -26.971027374267578, "global_step": 531208, "epoch": 6400} {"train_loss": -27.090560913085938, "global_step": 531209, "epoch": 6400} {"train_loss": -26.833829879760742, "global_step": 531210, "epoch": 6400} {"train_loss": -26.692310333251953, "global_step": 531211, "epoch": 6400} {"train_loss": -26.159337997436523, "global_step": 531212, "epoch": 6400} {"train_loss": -26.884418487548828, "global_step": 531213, "epoch": 6400} {"train_loss": -26.95704460144043, "global_step": 531214, "epoch": 6400} {"train_loss": -27.252782821655273, "global_step": 531215, "epoch": 6400} {"train_loss": -27.466968536376953, "global_step": 531216, "epoch": 6400} {"train_loss": -26.97578239440918, "global_step": 531217, "epoch": 6400} {"train_loss": -27.17487144470215, "global_step": 531218, "epoch": 6400} {"train_loss": -27.336990356445312, "global_step": 531219, "epoch": 6400} {"train_loss": -27.4736385345459, "global_step": 531220, "epoch": 6400} {"train_loss": -26.954450607299805, "global_step": 531221, "epoch": 6400} {"train_loss": -27.38642692565918, "global_step": 531222, "epoch": 6400} {"train_loss": -27.191797256469727, "global_step": 531223, "epoch": 6400} {"train_loss": -27.537694931030273, "global_step": 531224, "epoch": 6400} {"train_loss": -27.362585067749023, "global_step": 531225, "epoch": 6400} {"train_loss": -27.2283935546875, "global_step": 531226, "epoch": 6400} {"train_loss": -27.390216827392578, "global_step": 531227, "epoch": 6400} {"train_loss": -27.243789672851562, "global_step": 531228, "epoch": 6400} {"train_loss": -27.553613662719727, "global_step": 531229, "epoch": 6400} {"train_loss": -27.04204750061035, "global_step": 531230, "epoch": 6400} {"train_loss": -27.52540397644043, "global_step": 531231, "epoch": 6400} {"train_loss": -27.82024574279785, "global_step": 531232, "epoch": 6400} {"train_loss": -27.188018798828125, "global_step": 531233, "epoch": 6400} {"train_loss": -27.15374755859375, "global_step": 531234, "epoch": 6400} {"train_loss": -27.27972984313965, "global_step": 531235, "epoch": 6400} {"train_loss": -27.397537231445312, "global_step": 531236, "epoch": 6400} {"train_loss": -27.715961456298828, "global_step": 531237, "epoch": 6400} {"train_loss": -27.201162338256836, "global_step": 531238, "epoch": 6400} {"train_loss": -27.503690719604492, "global_step": 531239, "epoch": 6400} {"train_loss": -27.41305923461914, "global_step": 531240, "epoch": 6400} {"train_loss": -27.602161407470703, "global_step": 531241, "epoch": 6400} {"train_loss": -27.641225814819336, "global_step": 531242, "epoch": 6400} {"train_loss": -27.617828369140625, "global_step": 531243, "epoch": 6400} {"train_loss": -27.702991485595703, "global_step": 531244, "epoch": 6400} {"train_loss": -28.0316219329834, "global_step": 531245, "epoch": 6400} {"train_loss": -27.654890060424805, "global_step": 531246, "epoch": 6400} {"train_loss": -27.505456924438477, "global_step": 531247, "epoch": 6400} {"train_loss": -27.659133911132812, "global_step": 531248, "epoch": 6400} {"train_loss": -28.13484001159668, "global_step": 531249, "epoch": 6400} {"train_loss": -27.45526123046875, "global_step": 531250, "epoch": 6400} {"train_loss": -27.616437911987305, "global_step": 531251, "epoch": 6400} {"train_loss": -27.763931274414062, "global_step": 531252, "epoch": 6400} {"train_loss": -27.705524444580078, "global_step": 531253, "epoch": 6400} {"train_loss": -27.594226837158203, "global_step": 531254, "epoch": 6400} {"train_loss": -27.751270294189453, "global_step": 531255, "epoch": 6400} {"train_loss": -27.57649040222168, "global_step": 531256, "epoch": 6400} {"train_loss": -27.704456329345703, "global_step": 531257, "epoch": 6400} {"train_loss": -27.6646728515625, "global_step": 531258, "epoch": 6400} {"train_loss": -27.9003963470459, "global_step": 531259, "epoch": 6400} {"train_loss": -27.713092803955078, "global_step": 531260, "epoch": 6400} {"train_loss": -27.121204376220703, "global_step": 531261, "epoch": 6400} {"train_loss": -27.59124755859375, "global_step": 531262, "epoch": 6400} {"train_loss": -27.876596450805664, "global_step": 531263, "epoch": 6400} {"train_loss": -27.62005043029785, "global_step": 531264, "epoch": 6400} {"train_loss": -27.2314510345459, "global_step": 531265, "epoch": 6400} {"train_loss": -27.56671714782715, "global_step": 531266, "epoch": 6400} {"train_loss": -27.99397087097168, "global_step": 531267, "epoch": 6400} {"train_loss": -27.288894653320312, "global_step": 531268, "epoch": 6400} {"train_loss": -27.53369140625, "global_step": 531269, "epoch": 6400} {"train_loss": -27.92452049255371, "global_step": 531270, "epoch": 6400} {"train_loss": -27.943328857421875, "global_step": 531271, "epoch": 6400} {"train_loss": -27.61359214782715, "global_step": 531272, "epoch": 6400} {"train_loss": -27.461584091186523, "global_step": 531273, "epoch": 6400} {"train_loss": -27.625446319580078, "global_step": 531274, "epoch": 6400} {"train_loss": -27.75705909729004, "global_step": 531275, "epoch": 6400} {"train_loss": -27.336999893188477, "global_step": 531276, "epoch": 6400} {"train_loss": -27.27120018005371, "global_step": 531277, "epoch": 6400} {"train_loss": -27.398406982421875, "global_step": 531278, "epoch": 6400} {"train_loss": -27.326995849609375, "global_step": 531279, "epoch": 6400} {"train_loss": -27.206411361694336, "global_step": 531280, "epoch": 6400} {"train_loss": -27.125131607055664, "global_step": 531281, "epoch": 6400} {"train_loss": -27.35263286728457, "global_step": 531282, "epoch": 6400, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.5, "test/mean_score": 0.8636363636363636, "val_loss": 6445970.0} {"train_loss": -24.378583908081055, "global_step": 531283, "epoch": 6401} {"train_loss": -25.1059513092041, "global_step": 531284, "epoch": 6401} {"train_loss": -24.613431930541992, "global_step": 531285, "epoch": 6401} {"train_loss": -25.722442626953125, "global_step": 531286, "epoch": 6401} {"train_loss": -24.775493621826172, "global_step": 531287, "epoch": 6401} {"train_loss": -25.808460235595703, "global_step": 531288, "epoch": 6401} {"train_loss": -25.6028995513916, "global_step": 531289, "epoch": 6401} {"train_loss": -26.05731773376465, "global_step": 531290, "epoch": 6401} {"train_loss": -25.96990966796875, "global_step": 531291, "epoch": 6401} {"train_loss": -26.10330581665039, "global_step": 531292, "epoch": 6401} {"train_loss": -26.001144409179688, "global_step": 531293, "epoch": 6401} {"train_loss": -26.216413497924805, "global_step": 531294, "epoch": 6401} {"train_loss": -26.479055404663086, "global_step": 531295, "epoch": 6401} {"train_loss": -26.244489669799805, "global_step": 531296, "epoch": 6401} {"train_loss": -26.46845054626465, "global_step": 531297, "epoch": 6401} {"train_loss": -26.318115234375, "global_step": 531298, "epoch": 6401} {"train_loss": -26.268362045288086, "global_step": 531299, "epoch": 6401} {"train_loss": -26.496978759765625, "global_step": 531300, "epoch": 6401} {"train_loss": -26.423954010009766, "global_step": 531301, "epoch": 6401} {"train_loss": -26.750585556030273, "global_step": 531302, "epoch": 6401} {"train_loss": -26.70435905456543, "global_step": 531303, "epoch": 6401} {"train_loss": -26.5499210357666, "global_step": 531304, "epoch": 6401} {"train_loss": -26.4930362701416, "global_step": 531305, "epoch": 6401} {"train_loss": -26.24806785583496, "global_step": 531306, "epoch": 6401} {"train_loss": -26.272552490234375, "global_step": 531307, "epoch": 6401} {"train_loss": -26.802270889282227, "global_step": 531308, "epoch": 6401} {"train_loss": -27.088598251342773, "global_step": 531309, "epoch": 6401} {"train_loss": -26.637556076049805, "global_step": 531310, "epoch": 6401} {"train_loss": -26.908771514892578, "global_step": 531311, "epoch": 6401} {"train_loss": -27.070947647094727, "global_step": 531312, "epoch": 6401} {"train_loss": -26.941024780273438, "global_step": 531313, "epoch": 6401} {"train_loss": -26.662342071533203, "global_step": 531314, "epoch": 6401} {"train_loss": -27.256200790405273, "global_step": 531315, "epoch": 6401} {"train_loss": -27.23553466796875, "global_step": 531316, "epoch": 6401} {"train_loss": -27.215560913085938, "global_step": 531317, "epoch": 6401} {"train_loss": -27.206348419189453, "global_step": 531318, "epoch": 6401} {"train_loss": -27.623416900634766, "global_step": 531319, "epoch": 6401} {"train_loss": -27.127527236938477, "global_step": 531320, "epoch": 6401} {"train_loss": -27.507877349853516, "global_step": 531321, "epoch": 6401} {"train_loss": -26.6820068359375, "global_step": 531322, "epoch": 6401} {"train_loss": -27.5614070892334, "global_step": 531323, "epoch": 6401} {"train_loss": -27.107099533081055, "global_step": 531324, "epoch": 6401} {"train_loss": -27.649642944335938, "global_step": 531325, "epoch": 6401} {"train_loss": -27.404462814331055, "global_step": 531326, "epoch": 6401} {"train_loss": -26.94342041015625, "global_step": 531327, "epoch": 6401} {"train_loss": -27.49395179748535, "global_step": 531328, "epoch": 6401} {"train_loss": -27.34964942932129, "global_step": 531329, "epoch": 6401} {"train_loss": -27.59686279296875, "global_step": 531330, "epoch": 6401} {"train_loss": -27.32172203063965, "global_step": 531331, "epoch": 6401} {"train_loss": -27.431615829467773, "global_step": 531332, "epoch": 6401} {"train_loss": -27.292715072631836, "global_step": 531333, "epoch": 6401} {"train_loss": -27.636524200439453, "global_step": 531334, "epoch": 6401} {"train_loss": -27.9613094329834, "global_step": 531335, "epoch": 6401} {"train_loss": -27.338977813720703, "global_step": 531336, "epoch": 6401} {"train_loss": -27.839075088500977, "global_step": 531337, "epoch": 6401} {"train_loss": -27.712827682495117, "global_step": 531338, "epoch": 6401} {"train_loss": -27.777502059936523, "global_step": 531339, "epoch": 6401} {"train_loss": -27.660703659057617, "global_step": 531340, "epoch": 6401} {"train_loss": -27.82929039001465, "global_step": 531341, "epoch": 6401} {"train_loss": -27.70365333557129, "global_step": 531342, "epoch": 6401} {"train_loss": -27.684980392456055, "global_step": 531343, "epoch": 6401} {"train_loss": -27.501733779907227, "global_step": 531344, "epoch": 6401} {"train_loss": -27.844207763671875, "global_step": 531345, "epoch": 6401} {"train_loss": -27.484628677368164, "global_step": 531346, "epoch": 6401} {"train_loss": -27.942956924438477, "global_step": 531347, "epoch": 6401} {"train_loss": -27.9269962310791, "global_step": 531348, "epoch": 6401} {"train_loss": -27.426666259765625, "global_step": 531349, "epoch": 6401} {"train_loss": -27.95301628112793, "global_step": 531350, "epoch": 6401} {"train_loss": -27.703702926635742, "global_step": 531351, "epoch": 6401} {"train_loss": -27.571258544921875, "global_step": 531352, "epoch": 6401} {"train_loss": -27.64618492126465, "global_step": 531353, "epoch": 6401} {"train_loss": -27.914716720581055, "global_step": 531354, "epoch": 6401} {"train_loss": -27.903013229370117, "global_step": 531355, "epoch": 6401} {"train_loss": -27.445959091186523, "global_step": 531356, "epoch": 6401} {"train_loss": -27.707260131835938, "global_step": 531357, "epoch": 6401} {"train_loss": -27.245874404907227, "global_step": 531358, "epoch": 6401} {"train_loss": -28.002277374267578, "global_step": 531359, "epoch": 6401} {"train_loss": -27.174362182617188, "global_step": 531360, "epoch": 6401} {"train_loss": -27.495349884033203, "global_step": 531361, "epoch": 6401} {"train_loss": -27.05120277404785, "global_step": 531362, "epoch": 6401} {"train_loss": -26.87637710571289, "global_step": 531363, "epoch": 6401} {"train_loss": -27.412290573120117, "global_step": 531364, "epoch": 6401} {"train_loss": -27.013912017086902, "global_step": 531365, "epoch": 6401, "val_loss": 6449421.5} {"train_loss": -25.22545051574707, "global_step": 531366, "epoch": 6402} {"train_loss": -26.663496017456055, "global_step": 531367, "epoch": 6402} {"train_loss": -25.763504028320312, "global_step": 531368, "epoch": 6402} {"train_loss": -26.3428955078125, "global_step": 531369, "epoch": 6402} {"train_loss": -25.791223526000977, "global_step": 531370, "epoch": 6402} {"train_loss": -26.493764877319336, "global_step": 531371, "epoch": 6402} {"train_loss": -26.251144409179688, "global_step": 531372, "epoch": 6402} {"train_loss": -26.505035400390625, "global_step": 531373, "epoch": 6402} {"train_loss": -26.52242088317871, "global_step": 531374, "epoch": 6402} {"train_loss": -26.700916290283203, "global_step": 531375, "epoch": 6402} {"train_loss": -26.47670555114746, "global_step": 531376, "epoch": 6402} {"train_loss": -26.891958236694336, "global_step": 531377, "epoch": 6402} {"train_loss": -26.89229393005371, "global_step": 531378, "epoch": 6402} {"train_loss": -26.629125595092773, "global_step": 531379, "epoch": 6402} {"train_loss": -27.183927536010742, "global_step": 531380, "epoch": 6402} {"train_loss": -26.965803146362305, "global_step": 531381, "epoch": 6402} {"train_loss": -27.060102462768555, "global_step": 531382, "epoch": 6402} {"train_loss": -27.19124412536621, "global_step": 531383, "epoch": 6402} {"train_loss": -27.056299209594727, "global_step": 531384, "epoch": 6402} {"train_loss": -26.907974243164062, "global_step": 531385, "epoch": 6402} {"train_loss": -27.241199493408203, "global_step": 531386, "epoch": 6402} {"train_loss": -27.205352783203125, "global_step": 531387, "epoch": 6402} {"train_loss": -27.113737106323242, "global_step": 531388, "epoch": 6402} {"train_loss": -27.348920822143555, "global_step": 531389, "epoch": 6402} {"train_loss": -27.282331466674805, "global_step": 531390, "epoch": 6402} {"train_loss": -27.36512565612793, "global_step": 531391, "epoch": 6402} {"train_loss": -27.512983322143555, "global_step": 531392, "epoch": 6402} {"train_loss": -27.097919464111328, "global_step": 531393, "epoch": 6402} {"train_loss": -26.852880477905273, "global_step": 531394, "epoch": 6402} {"train_loss": -27.206375122070312, "global_step": 531395, "epoch": 6402} {"train_loss": -27.314619064331055, "global_step": 531396, "epoch": 6402} {"train_loss": -27.53080177307129, "global_step": 531397, "epoch": 6402} {"train_loss": -27.45501136779785, "global_step": 531398, "epoch": 6402} {"train_loss": -27.240249633789062, "global_step": 531399, "epoch": 6402} {"train_loss": -27.208206176757812, "global_step": 531400, "epoch": 6402} {"train_loss": -27.713336944580078, "global_step": 531401, "epoch": 6402} {"train_loss": -27.2755069732666, "global_step": 531402, "epoch": 6402} {"train_loss": -27.519514083862305, "global_step": 531403, "epoch": 6402} {"train_loss": -27.26230812072754, "global_step": 531404, "epoch": 6402} {"train_loss": -27.66266441345215, "global_step": 531405, "epoch": 6402} {"train_loss": -27.5519962310791, "global_step": 531406, "epoch": 6402} {"train_loss": -27.47722816467285, "global_step": 531407, "epoch": 6402} {"train_loss": -27.619733810424805, "global_step": 531408, "epoch": 6402} {"train_loss": -27.5787353515625, "global_step": 531409, "epoch": 6402} {"train_loss": -27.777923583984375, "global_step": 531410, "epoch": 6402} {"train_loss": -27.35297203063965, "global_step": 531411, "epoch": 6402} {"train_loss": -27.54779052734375, "global_step": 531412, "epoch": 6402} {"train_loss": -27.755273818969727, "global_step": 531413, "epoch": 6402} {"train_loss": -27.630834579467773, "global_step": 531414, "epoch": 6402} {"train_loss": -27.391626358032227, "global_step": 531415, "epoch": 6402} {"train_loss": -27.85454750061035, "global_step": 531416, "epoch": 6402} {"train_loss": -27.496366500854492, "global_step": 531417, "epoch": 6402} {"train_loss": -27.90028190612793, "global_step": 531418, "epoch": 6402} {"train_loss": -27.567001342773438, "global_step": 531419, "epoch": 6402} {"train_loss": -27.941802978515625, "global_step": 531420, "epoch": 6402} {"train_loss": -27.518512725830078, "global_step": 531421, "epoch": 6402} {"train_loss": -27.689254760742188, "global_step": 531422, "epoch": 6402} {"train_loss": -27.346511840820312, "global_step": 531423, "epoch": 6402} {"train_loss": -27.851057052612305, "global_step": 531424, "epoch": 6402} {"train_loss": -27.5551700592041, "global_step": 531425, "epoch": 6402} {"train_loss": -27.768545150756836, "global_step": 531426, "epoch": 6402} {"train_loss": -27.780532836914062, "global_step": 531427, "epoch": 6402} {"train_loss": -27.61512565612793, "global_step": 531428, "epoch": 6402} {"train_loss": -27.44890785217285, "global_step": 531429, "epoch": 6402} {"train_loss": -27.47970962524414, "global_step": 531430, "epoch": 6402} {"train_loss": -27.797582626342773, "global_step": 531431, "epoch": 6402} {"train_loss": -27.66644287109375, "global_step": 531432, "epoch": 6402} {"train_loss": -27.58102798461914, "global_step": 531433, "epoch": 6402} {"train_loss": -27.31829261779785, "global_step": 531434, "epoch": 6402} {"train_loss": -27.691686630249023, "global_step": 531435, "epoch": 6402} {"train_loss": -27.54453468322754, "global_step": 531436, "epoch": 6402} {"train_loss": -27.293426513671875, "global_step": 531437, "epoch": 6402} {"train_loss": -27.52951431274414, "global_step": 531438, "epoch": 6402} {"train_loss": -27.503204345703125, "global_step": 531439, "epoch": 6402} {"train_loss": -27.618408203125, "global_step": 531440, "epoch": 6402} {"train_loss": -27.770368576049805, "global_step": 531441, "epoch": 6402} {"train_loss": -27.44484519958496, "global_step": 531442, "epoch": 6402} {"train_loss": -27.348119735717773, "global_step": 531443, "epoch": 6402} {"train_loss": -27.441022872924805, "global_step": 531444, "epoch": 6402} {"train_loss": -27.860748291015625, "global_step": 531445, "epoch": 6402} {"train_loss": -27.766347885131836, "global_step": 531446, "epoch": 6402} {"train_loss": -27.60947036743164, "global_step": 531447, "epoch": 6402} {"train_loss": -27.289355978908308, "global_step": 531448, "epoch": 6402, "val_loss": 6504898.5} {"train_loss": -27.533620834350586, "global_step": 531449, "epoch": 6403} {"train_loss": -26.935083389282227, "global_step": 531450, "epoch": 6403} {"train_loss": -26.782745361328125, "global_step": 531451, "epoch": 6403} {"train_loss": -26.852115631103516, "global_step": 531452, "epoch": 6403} {"train_loss": -27.149930953979492, "global_step": 531453, "epoch": 6403} {"train_loss": -27.110294342041016, "global_step": 531454, "epoch": 6403} {"train_loss": -27.498706817626953, "global_step": 531455, "epoch": 6403} {"train_loss": -27.3269100189209, "global_step": 531456, "epoch": 6403} {"train_loss": -27.682281494140625, "global_step": 531457, "epoch": 6403} {"train_loss": -27.2813663482666, "global_step": 531458, "epoch": 6403} {"train_loss": -27.131000518798828, "global_step": 531459, "epoch": 6403} {"train_loss": -27.740331649780273, "global_step": 531460, "epoch": 6403} {"train_loss": -27.293725967407227, "global_step": 531461, "epoch": 6403} {"train_loss": -27.2840576171875, "global_step": 531462, "epoch": 6403} {"train_loss": -27.316877365112305, "global_step": 531463, "epoch": 6403} {"train_loss": -27.641387939453125, "global_step": 531464, "epoch": 6403} {"train_loss": -27.36911964416504, "global_step": 531465, "epoch": 6403} {"train_loss": -27.470855712890625, "global_step": 531466, "epoch": 6403} {"train_loss": -27.273447036743164, "global_step": 531467, "epoch": 6403} {"train_loss": -27.43988609313965, "global_step": 531468, "epoch": 6403} {"train_loss": -27.398792266845703, "global_step": 531469, "epoch": 6403} {"train_loss": -27.52338981628418, "global_step": 531470, "epoch": 6403} {"train_loss": -27.477075576782227, "global_step": 531471, "epoch": 6403} {"train_loss": -27.64853286743164, "global_step": 531472, "epoch": 6403} {"train_loss": -27.6143798828125, "global_step": 531473, "epoch": 6403} {"train_loss": -27.951923370361328, "global_step": 531474, "epoch": 6403} {"train_loss": -27.474817276000977, "global_step": 531475, "epoch": 6403} {"train_loss": -28.038349151611328, "global_step": 531476, "epoch": 6403} {"train_loss": -27.604787826538086, "global_step": 531477, "epoch": 6403} {"train_loss": -27.54774284362793, "global_step": 531478, "epoch": 6403} {"train_loss": -27.76953125, "global_step": 531479, "epoch": 6403} {"train_loss": -27.477203369140625, "global_step": 531480, "epoch": 6403} {"train_loss": -27.556562423706055, "global_step": 531481, "epoch": 6403} {"train_loss": -27.300718307495117, "global_step": 531482, "epoch": 6403} {"train_loss": -27.67990493774414, "global_step": 531483, "epoch": 6403} {"train_loss": -27.601160049438477, "global_step": 531484, "epoch": 6403} {"train_loss": -27.821226119995117, "global_step": 531485, "epoch": 6403} {"train_loss": -27.74667739868164, "global_step": 531486, "epoch": 6403} {"train_loss": -27.851123809814453, "global_step": 531487, "epoch": 6403} {"train_loss": -27.284448623657227, "global_step": 531488, "epoch": 6403} {"train_loss": -27.530227661132812, "global_step": 531489, "epoch": 6403} {"train_loss": -27.3248233795166, "global_step": 531490, "epoch": 6403} {"train_loss": -27.78215980529785, "global_step": 531491, "epoch": 6403} {"train_loss": -27.890424728393555, "global_step": 531492, "epoch": 6403} {"train_loss": -27.715742111206055, "global_step": 531493, "epoch": 6403} {"train_loss": -27.37281608581543, "global_step": 531494, "epoch": 6403} {"train_loss": -27.70831871032715, "global_step": 531495, "epoch": 6403} {"train_loss": -27.364282608032227, "global_step": 531496, "epoch": 6403} {"train_loss": -27.32728385925293, "global_step": 531497, "epoch": 6403} {"train_loss": -27.682958602905273, "global_step": 531498, "epoch": 6403} {"train_loss": -27.143402099609375, "global_step": 531499, "epoch": 6403} {"train_loss": -26.833032608032227, "global_step": 531500, "epoch": 6403} {"train_loss": -27.4681453704834, "global_step": 531501, "epoch": 6403} {"train_loss": -27.6834774017334, "global_step": 531502, "epoch": 6403} {"train_loss": -27.21634864807129, "global_step": 531503, "epoch": 6403} {"train_loss": -27.225698471069336, "global_step": 531504, "epoch": 6403} {"train_loss": -27.702932357788086, "global_step": 531505, "epoch": 6403} {"train_loss": -27.063562393188477, "global_step": 531506, "epoch": 6403} {"train_loss": -27.425373077392578, "global_step": 531507, "epoch": 6403} {"train_loss": -27.439544677734375, "global_step": 531508, "epoch": 6403} {"train_loss": -27.453994750976562, "global_step": 531509, "epoch": 6403} {"train_loss": -27.56695556640625, "global_step": 531510, "epoch": 6403} {"train_loss": -27.382492065429688, "global_step": 531511, "epoch": 6403} {"train_loss": -27.445133209228516, "global_step": 531512, "epoch": 6403} {"train_loss": -27.36519432067871, "global_step": 531513, "epoch": 6403} {"train_loss": -27.147504806518555, "global_step": 531514, "epoch": 6403} {"train_loss": -27.384504318237305, "global_step": 531515, "epoch": 6403} {"train_loss": -26.962553024291992, "global_step": 531516, "epoch": 6403} {"train_loss": -27.803058624267578, "global_step": 531517, "epoch": 6403} {"train_loss": -26.800439834594727, "global_step": 531518, "epoch": 6403} {"train_loss": -26.91184425354004, "global_step": 531519, "epoch": 6403} {"train_loss": -27.624801635742188, "global_step": 531520, "epoch": 6403} {"train_loss": -26.98428726196289, "global_step": 531521, "epoch": 6403} {"train_loss": -27.305707931518555, "global_step": 531522, "epoch": 6403} {"train_loss": -27.38897132873535, "global_step": 531523, "epoch": 6403} {"train_loss": -27.2657413482666, "global_step": 531524, "epoch": 6403} {"train_loss": -27.437726974487305, "global_step": 531525, "epoch": 6403} {"train_loss": -27.725061416625977, "global_step": 531526, "epoch": 6403} {"train_loss": -27.515186309814453, "global_step": 531527, "epoch": 6403} {"train_loss": -27.513959884643555, "global_step": 531528, "epoch": 6403} {"train_loss": -27.568775177001953, "global_step": 531529, "epoch": 6403} {"train_loss": -28.04629898071289, "global_step": 531530, "epoch": 6403} {"train_loss": -27.462427392063372, "global_step": 531531, "epoch": 6403, "val_loss": 6511109.5} {"train_loss": -27.250431060791016, "global_step": 531532, "epoch": 6404} {"train_loss": -27.003210067749023, "global_step": 531533, "epoch": 6404} {"train_loss": -26.823963165283203, "global_step": 531534, "epoch": 6404} {"train_loss": -27.004140853881836, "global_step": 531535, "epoch": 6404} {"train_loss": -26.96198844909668, "global_step": 531536, "epoch": 6404} {"train_loss": -26.940570831298828, "global_step": 531537, "epoch": 6404} {"train_loss": -26.849828720092773, "global_step": 531538, "epoch": 6404} {"train_loss": -27.52292251586914, "global_step": 531539, "epoch": 6404} {"train_loss": -27.04925537109375, "global_step": 531540, "epoch": 6404} {"train_loss": -27.65241813659668, "global_step": 531541, "epoch": 6404} {"train_loss": -26.772851943969727, "global_step": 531542, "epoch": 6404} {"train_loss": -27.27632713317871, "global_step": 531543, "epoch": 6404} {"train_loss": -27.418994903564453, "global_step": 531544, "epoch": 6404} {"train_loss": -27.27744483947754, "global_step": 531545, "epoch": 6404} {"train_loss": -27.445392608642578, "global_step": 531546, "epoch": 6404} {"train_loss": -27.4571475982666, "global_step": 531547, "epoch": 6404} {"train_loss": -27.31494140625, "global_step": 531548, "epoch": 6404} {"train_loss": -27.43097496032715, "global_step": 531549, "epoch": 6404} {"train_loss": -26.947742462158203, "global_step": 531550, "epoch": 6404} {"train_loss": -27.430713653564453, "global_step": 531551, "epoch": 6404} {"train_loss": -27.387784957885742, "global_step": 531552, "epoch": 6404} {"train_loss": -27.402786254882812, "global_step": 531553, "epoch": 6404} {"train_loss": -27.414419174194336, "global_step": 531554, "epoch": 6404} {"train_loss": -27.52515983581543, "global_step": 531555, "epoch": 6404} {"train_loss": -27.571853637695312, "global_step": 531556, "epoch": 6404} {"train_loss": -27.174579620361328, "global_step": 531557, "epoch": 6404} {"train_loss": -27.21600914001465, "global_step": 531558, "epoch": 6404} {"train_loss": -27.13177490234375, "global_step": 531559, "epoch": 6404} {"train_loss": -27.4642276763916, "global_step": 531560, "epoch": 6404} {"train_loss": -27.51759147644043, "global_step": 531561, "epoch": 6404} {"train_loss": -27.55691909790039, "global_step": 531562, "epoch": 6404} {"train_loss": -27.57492446899414, "global_step": 531563, "epoch": 6404} {"train_loss": -27.361722946166992, "global_step": 531564, "epoch": 6404} {"train_loss": -27.54498863220215, "global_step": 531565, "epoch": 6404} {"train_loss": -27.32747459411621, "global_step": 531566, "epoch": 6404} {"train_loss": -27.7618465423584, "global_step": 531567, "epoch": 6404} {"train_loss": -27.242263793945312, "global_step": 531568, "epoch": 6404} {"train_loss": -27.0637264251709, "global_step": 531569, "epoch": 6404} {"train_loss": -27.48335075378418, "global_step": 531570, "epoch": 6404} {"train_loss": -27.522964477539062, "global_step": 531571, "epoch": 6404} {"train_loss": -27.337186813354492, "global_step": 531572, "epoch": 6404} {"train_loss": -27.619550704956055, "global_step": 531573, "epoch": 6404} {"train_loss": -27.8298397064209, "global_step": 531574, "epoch": 6404} {"train_loss": -27.373228073120117, "global_step": 531575, "epoch": 6404} {"train_loss": -26.890050888061523, "global_step": 531576, "epoch": 6404} {"train_loss": -27.49407386779785, "global_step": 531577, "epoch": 6404} {"train_loss": -27.77937126159668, "global_step": 531578, "epoch": 6404} {"train_loss": -27.37969398498535, "global_step": 531579, "epoch": 6404} {"train_loss": -27.642919540405273, "global_step": 531580, "epoch": 6404} {"train_loss": -27.402917861938477, "global_step": 531581, "epoch": 6404} {"train_loss": -27.50396728515625, "global_step": 531582, "epoch": 6404} {"train_loss": -27.844629287719727, "global_step": 531583, "epoch": 6404} {"train_loss": -27.61720085144043, "global_step": 531584, "epoch": 6404} {"train_loss": -27.44001579284668, "global_step": 531585, "epoch": 6404} {"train_loss": -27.618284225463867, "global_step": 531586, "epoch": 6404} {"train_loss": -27.490934371948242, "global_step": 531587, "epoch": 6404} {"train_loss": -27.59212303161621, "global_step": 531588, "epoch": 6404} {"train_loss": -28.0154972076416, "global_step": 531589, "epoch": 6404} {"train_loss": -27.745946884155273, "global_step": 531590, "epoch": 6404} {"train_loss": -27.94732666015625, "global_step": 531591, "epoch": 6404} {"train_loss": -27.434112548828125, "global_step": 531592, "epoch": 6404} {"train_loss": -27.669340133666992, "global_step": 531593, "epoch": 6404} {"train_loss": -27.666828155517578, "global_step": 531594, "epoch": 6404} {"train_loss": -27.462909698486328, "global_step": 531595, "epoch": 6404} {"train_loss": -27.883520126342773, "global_step": 531596, "epoch": 6404} {"train_loss": -27.862539291381836, "global_step": 531597, "epoch": 6404} {"train_loss": -27.73052406311035, "global_step": 531598, "epoch": 6404} {"train_loss": -27.778839111328125, "global_step": 531599, "epoch": 6404} {"train_loss": -27.892797470092773, "global_step": 531600, "epoch": 6404} {"train_loss": -27.691120147705078, "global_step": 531601, "epoch": 6404} {"train_loss": -27.9172306060791, "global_step": 531602, "epoch": 6404} {"train_loss": -27.848722457885742, "global_step": 531603, "epoch": 6404} {"train_loss": -27.642908096313477, "global_step": 531604, "epoch": 6404} {"train_loss": -28.181781768798828, "global_step": 531605, "epoch": 6404} {"train_loss": -27.532062530517578, "global_step": 531606, "epoch": 6404} {"train_loss": -27.437305450439453, "global_step": 531607, "epoch": 6404} {"train_loss": -27.062469482421875, "global_step": 531608, "epoch": 6404} {"train_loss": -24.991371154785156, "global_step": 531609, "epoch": 6404} {"train_loss": -24.232954025268555, "global_step": 531610, "epoch": 6404} {"train_loss": -25.57822608947754, "global_step": 531611, "epoch": 6404} {"train_loss": -25.962406158447266, "global_step": 531612, "epoch": 6404} {"train_loss": -26.701879501342773, "global_step": 531613, "epoch": 6404} {"train_loss": -27.323669042931982, "global_step": 531614, "epoch": 6404, "val_loss": 6553742.5} {"train_loss": -24.428565979003906, "global_step": 531615, "epoch": 6405} {"train_loss": -25.31647300720215, "global_step": 531616, "epoch": 6405} {"train_loss": -25.456716537475586, "global_step": 531617, "epoch": 6405} {"train_loss": -24.895797729492188, "global_step": 531618, "epoch": 6405} {"train_loss": -25.6297550201416, "global_step": 531619, "epoch": 6405} {"train_loss": -24.844892501831055, "global_step": 531620, "epoch": 6405} {"train_loss": -26.115095138549805, "global_step": 531621, "epoch": 6405} {"train_loss": -25.68885612487793, "global_step": 531622, "epoch": 6405} {"train_loss": -26.219257354736328, "global_step": 531623, "epoch": 6405} {"train_loss": -26.033771514892578, "global_step": 531624, "epoch": 6405} {"train_loss": -26.05714225769043, "global_step": 531625, "epoch": 6405} {"train_loss": -25.865076065063477, "global_step": 531626, "epoch": 6405} {"train_loss": -26.2525577545166, "global_step": 531627, "epoch": 6405} {"train_loss": -26.16461181640625, "global_step": 531628, "epoch": 6405} {"train_loss": -26.051366806030273, "global_step": 531629, "epoch": 6405} {"train_loss": -26.293684005737305, "global_step": 531630, "epoch": 6405} {"train_loss": -26.8167781829834, "global_step": 531631, "epoch": 6405} {"train_loss": -26.310476303100586, "global_step": 531632, "epoch": 6405} {"train_loss": -26.26615333557129, "global_step": 531633, "epoch": 6405} {"train_loss": -27.034198760986328, "global_step": 531634, "epoch": 6405} {"train_loss": -26.811105728149414, "global_step": 531635, "epoch": 6405} {"train_loss": -26.24151039123535, "global_step": 531636, "epoch": 6405} {"train_loss": -26.712482452392578, "global_step": 531637, "epoch": 6405} {"train_loss": -26.882410049438477, "global_step": 531638, "epoch": 6405} {"train_loss": -27.06768798828125, "global_step": 531639, "epoch": 6405} {"train_loss": -26.5704402923584, "global_step": 531640, "epoch": 6405} {"train_loss": -26.9140682220459, "global_step": 531641, "epoch": 6405} {"train_loss": -26.59967041015625, "global_step": 531642, "epoch": 6405} {"train_loss": -27.09479331970215, "global_step": 531643, "epoch": 6405} {"train_loss": -26.057086944580078, "global_step": 531644, "epoch": 6405} {"train_loss": -26.98015785217285, "global_step": 531645, "epoch": 6405} {"train_loss": -27.093286514282227, "global_step": 531646, "epoch": 6405} {"train_loss": -27.237934112548828, "global_step": 531647, "epoch": 6405} {"train_loss": -27.229719161987305, "global_step": 531648, "epoch": 6405} {"train_loss": -27.646625518798828, "global_step": 531649, "epoch": 6405} {"train_loss": -27.152307510375977, "global_step": 531650, "epoch": 6405} {"train_loss": -27.34878921508789, "global_step": 531651, "epoch": 6405} {"train_loss": -27.222476959228516, "global_step": 531652, "epoch": 6405} {"train_loss": -27.358251571655273, "global_step": 531653, "epoch": 6405} {"train_loss": -27.517728805541992, "global_step": 531654, "epoch": 6405} {"train_loss": -27.37039566040039, "global_step": 531655, "epoch": 6405} {"train_loss": -27.484106063842773, "global_step": 531656, "epoch": 6405} {"train_loss": -27.914875030517578, "global_step": 531657, "epoch": 6405} {"train_loss": -27.006452560424805, "global_step": 531658, "epoch": 6405} {"train_loss": -27.226917266845703, "global_step": 531659, "epoch": 6405} {"train_loss": -27.639562606811523, "global_step": 531660, "epoch": 6405} {"train_loss": -27.329330444335938, "global_step": 531661, "epoch": 6405} {"train_loss": -27.150543212890625, "global_step": 531662, "epoch": 6405} {"train_loss": -27.530012130737305, "global_step": 531663, "epoch": 6405} {"train_loss": -27.402896881103516, "global_step": 531664, "epoch": 6405} {"train_loss": -27.399301528930664, "global_step": 531665, "epoch": 6405} {"train_loss": -27.130329132080078, "global_step": 531666, "epoch": 6405} {"train_loss": -27.62790870666504, "global_step": 531667, "epoch": 6405} {"train_loss": -27.284820556640625, "global_step": 531668, "epoch": 6405} {"train_loss": -27.49677085876465, "global_step": 531669, "epoch": 6405} {"train_loss": -27.631153106689453, "global_step": 531670, "epoch": 6405} {"train_loss": -27.889204025268555, "global_step": 531671, "epoch": 6405} {"train_loss": -27.634174346923828, "global_step": 531672, "epoch": 6405} {"train_loss": -27.8521785736084, "global_step": 531673, "epoch": 6405} {"train_loss": -27.763019561767578, "global_step": 531674, "epoch": 6405} {"train_loss": -27.58881187438965, "global_step": 531675, "epoch": 6405} {"train_loss": -27.63054847717285, "global_step": 531676, "epoch": 6405} {"train_loss": -27.7255916595459, "global_step": 531677, "epoch": 6405} {"train_loss": -27.80938148498535, "global_step": 531678, "epoch": 6405} {"train_loss": -27.799198150634766, "global_step": 531679, "epoch": 6405} {"train_loss": -27.77695655822754, "global_step": 531680, "epoch": 6405} {"train_loss": -27.53228187561035, "global_step": 531681, "epoch": 6405} {"train_loss": -27.476430892944336, "global_step": 531682, "epoch": 6405} {"train_loss": -27.846698760986328, "global_step": 531683, "epoch": 6405} {"train_loss": -27.780517578125, "global_step": 531684, "epoch": 6405} {"train_loss": -27.35650062561035, "global_step": 531685, "epoch": 6405} {"train_loss": -27.750471115112305, "global_step": 531686, "epoch": 6405} {"train_loss": -28.003894805908203, "global_step": 531687, "epoch": 6405} {"train_loss": -27.541519165039062, "global_step": 531688, "epoch": 6405} {"train_loss": -28.42364501953125, "global_step": 531689, "epoch": 6405} {"train_loss": -27.750885009765625, "global_step": 531690, "epoch": 6405} {"train_loss": -27.64393424987793, "global_step": 531691, "epoch": 6405} {"train_loss": -27.65606689453125, "global_step": 531692, "epoch": 6405} {"train_loss": -27.923355102539062, "global_step": 531693, "epoch": 6405} {"train_loss": -27.62556266784668, "global_step": 531694, "epoch": 6405} {"train_loss": -27.95413589477539, "global_step": 531695, "epoch": 6405} {"train_loss": -27.62626075744629, "global_step": 531696, "epoch": 6405} {"train_loss": -27.029493125088244, "global_step": 531697, "epoch": 6405, "val_loss": 6391260.0} {"train_loss": -26.892120361328125, "global_step": 531698, "epoch": 6406} {"train_loss": -25.794605255126953, "global_step": 531699, "epoch": 6406} {"train_loss": -26.26812171936035, "global_step": 531700, "epoch": 6406} {"train_loss": -25.41129493713379, "global_step": 531701, "epoch": 6406} {"train_loss": -26.392791748046875, "global_step": 531702, "epoch": 6406} {"train_loss": -26.316503524780273, "global_step": 531703, "epoch": 6406} {"train_loss": -26.250244140625, "global_step": 531704, "epoch": 6406} {"train_loss": -26.682071685791016, "global_step": 531705, "epoch": 6406} {"train_loss": -25.295795440673828, "global_step": 531706, "epoch": 6406} {"train_loss": -26.31043815612793, "global_step": 531707, "epoch": 6406} {"train_loss": -26.788923263549805, "global_step": 531708, "epoch": 6406} {"train_loss": -26.852319717407227, "global_step": 531709, "epoch": 6406} {"train_loss": -26.790876388549805, "global_step": 531710, "epoch": 6406} {"train_loss": -27.0655574798584, "global_step": 531711, "epoch": 6406} {"train_loss": -26.279943466186523, "global_step": 531712, "epoch": 6406} {"train_loss": -27.094480514526367, "global_step": 531713, "epoch": 6406} {"train_loss": -26.904905319213867, "global_step": 531714, "epoch": 6406} {"train_loss": -26.790342330932617, "global_step": 531715, "epoch": 6406} {"train_loss": -27.360132217407227, "global_step": 531716, "epoch": 6406} {"train_loss": -26.821191787719727, "global_step": 531717, "epoch": 6406} {"train_loss": -26.8905029296875, "global_step": 531718, "epoch": 6406} {"train_loss": -27.375843048095703, "global_step": 531719, "epoch": 6406} {"train_loss": -27.208829879760742, "global_step": 531720, "epoch": 6406} {"train_loss": -27.227025985717773, "global_step": 531721, "epoch": 6406} {"train_loss": -27.520776748657227, "global_step": 531722, "epoch": 6406} {"train_loss": -27.22833251953125, "global_step": 531723, "epoch": 6406} {"train_loss": -27.3367919921875, "global_step": 531724, "epoch": 6406} {"train_loss": -27.547143936157227, "global_step": 531725, "epoch": 6406} {"train_loss": -27.468671798706055, "global_step": 531726, "epoch": 6406} {"train_loss": -27.429243087768555, "global_step": 531727, "epoch": 6406} {"train_loss": -27.488901138305664, "global_step": 531728, "epoch": 6406} {"train_loss": -27.652851104736328, "global_step": 531729, "epoch": 6406} {"train_loss": -27.161603927612305, "global_step": 531730, "epoch": 6406} {"train_loss": -27.215137481689453, "global_step": 531731, "epoch": 6406} {"train_loss": -27.552749633789062, "global_step": 531732, "epoch": 6406} {"train_loss": -27.69268798828125, "global_step": 531733, "epoch": 6406} {"train_loss": -27.901996612548828, "global_step": 531734, "epoch": 6406} {"train_loss": -27.706653594970703, "global_step": 531735, "epoch": 6406} {"train_loss": -27.567264556884766, "global_step": 531736, "epoch": 6406} {"train_loss": -27.4539737701416, "global_step": 531737, "epoch": 6406} {"train_loss": -27.19757080078125, "global_step": 531738, "epoch": 6406} {"train_loss": -27.458337783813477, "global_step": 531739, "epoch": 6406} {"train_loss": -28.22943115234375, "global_step": 531740, "epoch": 6406} {"train_loss": -27.755725860595703, "global_step": 531741, "epoch": 6406} {"train_loss": -27.473453521728516, "global_step": 531742, "epoch": 6406} {"train_loss": -27.5582218170166, "global_step": 531743, "epoch": 6406} {"train_loss": -27.75026512145996, "global_step": 531744, "epoch": 6406} {"train_loss": -27.788406372070312, "global_step": 531745, "epoch": 6406} {"train_loss": -27.730676651000977, "global_step": 531746, "epoch": 6406} {"train_loss": -27.552160263061523, "global_step": 531747, "epoch": 6406} {"train_loss": -27.799673080444336, "global_step": 531748, "epoch": 6406} {"train_loss": -27.837743759155273, "global_step": 531749, "epoch": 6406} {"train_loss": -27.949018478393555, "global_step": 531750, "epoch": 6406} {"train_loss": -27.948047637939453, "global_step": 531751, "epoch": 6406} {"train_loss": -27.736658096313477, "global_step": 531752, "epoch": 6406} {"train_loss": -27.85175132751465, "global_step": 531753, "epoch": 6406} {"train_loss": -27.78730583190918, "global_step": 531754, "epoch": 6406} {"train_loss": -28.059656143188477, "global_step": 531755, "epoch": 6406} {"train_loss": -27.830163955688477, "global_step": 531756, "epoch": 6406} {"train_loss": -27.830175399780273, "global_step": 531757, "epoch": 6406} {"train_loss": -27.430622100830078, "global_step": 531758, "epoch": 6406} {"train_loss": -27.745691299438477, "global_step": 531759, "epoch": 6406} {"train_loss": -27.980545043945312, "global_step": 531760, "epoch": 6406} {"train_loss": -27.7679443359375, "global_step": 531761, "epoch": 6406} {"train_loss": -28.02460289001465, "global_step": 531762, "epoch": 6406} {"train_loss": -28.070667266845703, "global_step": 531763, "epoch": 6406} {"train_loss": -28.022192001342773, "global_step": 531764, "epoch": 6406} {"train_loss": -27.89040184020996, "global_step": 531765, "epoch": 6406} {"train_loss": -27.97088050842285, "global_step": 531766, "epoch": 6406} {"train_loss": -27.830224990844727, "global_step": 531767, "epoch": 6406} {"train_loss": -27.750883102416992, "global_step": 531768, "epoch": 6406} {"train_loss": -27.094770431518555, "global_step": 531769, "epoch": 6406} {"train_loss": -27.543821334838867, "global_step": 531770, "epoch": 6406} {"train_loss": -27.875640869140625, "global_step": 531771, "epoch": 6406} {"train_loss": -27.58441162109375, "global_step": 531772, "epoch": 6406} {"train_loss": -27.138702392578125, "global_step": 531773, "epoch": 6406} {"train_loss": -26.869958877563477, "global_step": 531774, "epoch": 6406} {"train_loss": -27.582050323486328, "global_step": 531775, "epoch": 6406} {"train_loss": -27.349084854125977, "global_step": 531776, "epoch": 6406} {"train_loss": -27.060657501220703, "global_step": 531777, "epoch": 6406} {"train_loss": -27.053171157836914, "global_step": 531778, "epoch": 6406} {"train_loss": -27.31121826171875, "global_step": 531779, "epoch": 6406} {"train_loss": -27.327388786407838, "global_step": 531780, "epoch": 6406, "val_loss": 6475365.0} {"train_loss": -25.603063583374023, "global_step": 531781, "epoch": 6407} {"train_loss": -26.386926651000977, "global_step": 531782, "epoch": 6407} {"train_loss": -27.26576042175293, "global_step": 531783, "epoch": 6407} {"train_loss": -26.359655380249023, "global_step": 531784, "epoch": 6407} {"train_loss": -26.870813369750977, "global_step": 531785, "epoch": 6407} {"train_loss": -25.842493057250977, "global_step": 531786, "epoch": 6407} {"train_loss": -26.73370361328125, "global_step": 531787, "epoch": 6407} {"train_loss": -26.267419815063477, "global_step": 531788, "epoch": 6407} {"train_loss": -27.32578468322754, "global_step": 531789, "epoch": 6407} {"train_loss": -27.040319442749023, "global_step": 531790, "epoch": 6407} {"train_loss": -26.887393951416016, "global_step": 531791, "epoch": 6407} {"train_loss": -27.516956329345703, "global_step": 531792, "epoch": 6407} {"train_loss": -26.95657730102539, "global_step": 531793, "epoch": 6407} {"train_loss": -27.247461318969727, "global_step": 531794, "epoch": 6407} {"train_loss": -27.18136978149414, "global_step": 531795, "epoch": 6407} {"train_loss": -26.999292373657227, "global_step": 531796, "epoch": 6407} {"train_loss": -27.611713409423828, "global_step": 531797, "epoch": 6407} {"train_loss": -27.128793716430664, "global_step": 531798, "epoch": 6407} {"train_loss": -27.591394424438477, "global_step": 531799, "epoch": 6407} {"train_loss": -27.0084285736084, "global_step": 531800, "epoch": 6407} {"train_loss": -27.26546287536621, "global_step": 531801, "epoch": 6407} {"train_loss": -27.050405502319336, "global_step": 531802, "epoch": 6407} {"train_loss": -27.501256942749023, "global_step": 531803, "epoch": 6407} {"train_loss": -27.733753204345703, "global_step": 531804, "epoch": 6407} {"train_loss": -27.216089248657227, "global_step": 531805, "epoch": 6407} {"train_loss": -27.61683464050293, "global_step": 531806, "epoch": 6407} {"train_loss": -27.464984893798828, "global_step": 531807, "epoch": 6407} {"train_loss": -27.4711856842041, "global_step": 531808, "epoch": 6407} {"train_loss": -27.386144638061523, "global_step": 531809, "epoch": 6407} {"train_loss": -27.576696395874023, "global_step": 531810, "epoch": 6407} {"train_loss": -27.313159942626953, "global_step": 531811, "epoch": 6407} {"train_loss": -27.495437622070312, "global_step": 531812, "epoch": 6407} {"train_loss": -27.584869384765625, "global_step": 531813, "epoch": 6407} {"train_loss": -27.575366973876953, "global_step": 531814, "epoch": 6407} {"train_loss": -27.63958168029785, "global_step": 531815, "epoch": 6407} {"train_loss": -27.456283569335938, "global_step": 531816, "epoch": 6407} {"train_loss": -27.693811416625977, "global_step": 531817, "epoch": 6407} {"train_loss": -27.606525421142578, "global_step": 531818, "epoch": 6407} {"train_loss": -27.524625778198242, "global_step": 531819, "epoch": 6407} {"train_loss": -27.578100204467773, "global_step": 531820, "epoch": 6407} {"train_loss": -27.705820083618164, "global_step": 531821, "epoch": 6407} {"train_loss": -27.470020294189453, "global_step": 531822, "epoch": 6407} {"train_loss": -27.781330108642578, "global_step": 531823, "epoch": 6407} {"train_loss": -27.803964614868164, "global_step": 531824, "epoch": 6407} {"train_loss": -27.806640625, "global_step": 531825, "epoch": 6407} {"train_loss": -27.62934684753418, "global_step": 531826, "epoch": 6407} {"train_loss": -27.333179473876953, "global_step": 531827, "epoch": 6407} {"train_loss": -27.46034049987793, "global_step": 531828, "epoch": 6407} {"train_loss": -27.496301651000977, "global_step": 531829, "epoch": 6407} {"train_loss": -27.63433265686035, "global_step": 531830, "epoch": 6407} {"train_loss": -27.47623634338379, "global_step": 531831, "epoch": 6407} {"train_loss": -27.68948745727539, "global_step": 531832, "epoch": 6407} {"train_loss": -27.755115509033203, "global_step": 531833, "epoch": 6407} {"train_loss": -27.689865112304688, "global_step": 531834, "epoch": 6407} {"train_loss": -27.983718872070312, "global_step": 531835, "epoch": 6407} {"train_loss": -27.80841064453125, "global_step": 531836, "epoch": 6407} {"train_loss": -27.77992820739746, "global_step": 531837, "epoch": 6407} {"train_loss": -27.6086368560791, "global_step": 531838, "epoch": 6407} {"train_loss": -27.4792423248291, "global_step": 531839, "epoch": 6407} {"train_loss": -27.42865562438965, "global_step": 531840, "epoch": 6407} {"train_loss": -27.67522621154785, "global_step": 531841, "epoch": 6407} {"train_loss": -27.552392959594727, "global_step": 531842, "epoch": 6407} {"train_loss": -27.70516014099121, "global_step": 531843, "epoch": 6407} {"train_loss": -27.68779945373535, "global_step": 531844, "epoch": 6407} {"train_loss": -27.29953956604004, "global_step": 531845, "epoch": 6407} {"train_loss": -27.713769912719727, "global_step": 531846, "epoch": 6407} {"train_loss": -27.48392105102539, "global_step": 531847, "epoch": 6407} {"train_loss": -27.65753173828125, "global_step": 531848, "epoch": 6407} {"train_loss": -27.385828018188477, "global_step": 531849, "epoch": 6407} {"train_loss": -27.6619930267334, "global_step": 531850, "epoch": 6407} {"train_loss": -27.55057716369629, "global_step": 531851, "epoch": 6407} {"train_loss": -28.041715621948242, "global_step": 531852, "epoch": 6407} {"train_loss": -27.852956771850586, "global_step": 531853, "epoch": 6407} {"train_loss": -27.714624404907227, "global_step": 531854, "epoch": 6407} {"train_loss": -27.843097686767578, "global_step": 531855, "epoch": 6407} {"train_loss": -27.991729736328125, "global_step": 531856, "epoch": 6407} {"train_loss": -28.03028678894043, "global_step": 531857, "epoch": 6407} {"train_loss": -27.74775505065918, "global_step": 531858, "epoch": 6407} {"train_loss": -27.7593994140625, "global_step": 531859, "epoch": 6407} {"train_loss": -27.7499942779541, "global_step": 531860, "epoch": 6407} {"train_loss": -27.721899032592773, "global_step": 531861, "epoch": 6407} {"train_loss": -27.588254928588867, "global_step": 531862, "epoch": 6407} {"train_loss": -27.43917584706502, "global_step": 531863, "epoch": 6407, "val_loss": 6456540.5} {"train_loss": -27.77752685546875, "global_step": 531864, "epoch": 6408} {"train_loss": -27.40936851501465, "global_step": 531865, "epoch": 6408} {"train_loss": -28.06943130493164, "global_step": 531866, "epoch": 6408} {"train_loss": -27.527862548828125, "global_step": 531867, "epoch": 6408} {"train_loss": -27.525531768798828, "global_step": 531868, "epoch": 6408} {"train_loss": -27.565353393554688, "global_step": 531869, "epoch": 6408} {"train_loss": -27.52837562561035, "global_step": 531870, "epoch": 6408} {"train_loss": -27.30439567565918, "global_step": 531871, "epoch": 6408} {"train_loss": -27.456287384033203, "global_step": 531872, "epoch": 6408} {"train_loss": -27.232715606689453, "global_step": 531873, "epoch": 6408} {"train_loss": -27.76679801940918, "global_step": 531874, "epoch": 6408} {"train_loss": -27.782766342163086, "global_step": 531875, "epoch": 6408} {"train_loss": -27.520538330078125, "global_step": 531876, "epoch": 6408} {"train_loss": -27.527963638305664, "global_step": 531877, "epoch": 6408} {"train_loss": -27.333200454711914, "global_step": 531878, "epoch": 6408} {"train_loss": -27.40768814086914, "global_step": 531879, "epoch": 6408} {"train_loss": -27.36819839477539, "global_step": 531880, "epoch": 6408} {"train_loss": -27.056396484375, "global_step": 531881, "epoch": 6408} {"train_loss": -27.038787841796875, "global_step": 531882, "epoch": 6408} {"train_loss": -27.337726593017578, "global_step": 531883, "epoch": 6408} {"train_loss": -27.5828914642334, "global_step": 531884, "epoch": 6408} {"train_loss": -27.3245849609375, "global_step": 531885, "epoch": 6408} {"train_loss": -27.3947811126709, "global_step": 531886, "epoch": 6408} {"train_loss": -27.356311798095703, "global_step": 531887, "epoch": 6408} {"train_loss": -27.312152862548828, "global_step": 531888, "epoch": 6408} {"train_loss": -27.05112648010254, "global_step": 531889, "epoch": 6408} {"train_loss": -27.275836944580078, "global_step": 531890, "epoch": 6408} {"train_loss": -27.167341232299805, "global_step": 531891, "epoch": 6408} {"train_loss": -27.725778579711914, "global_step": 531892, "epoch": 6408} {"train_loss": -27.366437911987305, "global_step": 531893, "epoch": 6408} {"train_loss": -27.24118423461914, "global_step": 531894, "epoch": 6408} {"train_loss": -27.59168815612793, "global_step": 531895, "epoch": 6408} {"train_loss": -27.353885650634766, "global_step": 531896, "epoch": 6408} {"train_loss": -27.68109130859375, "global_step": 531897, "epoch": 6408} {"train_loss": -27.62702751159668, "global_step": 531898, "epoch": 6408} {"train_loss": -27.111236572265625, "global_step": 531899, "epoch": 6408} {"train_loss": -27.448139190673828, "global_step": 531900, "epoch": 6408} {"train_loss": -27.852848052978516, "global_step": 531901, "epoch": 6408} {"train_loss": -27.461301803588867, "global_step": 531902, "epoch": 6408} {"train_loss": -27.871353149414062, "global_step": 531903, "epoch": 6408} {"train_loss": -27.659650802612305, "global_step": 531904, "epoch": 6408} {"train_loss": -27.667890548706055, "global_step": 531905, "epoch": 6408} {"train_loss": -27.73297691345215, "global_step": 531906, "epoch": 6408} {"train_loss": -28.03557777404785, "global_step": 531907, "epoch": 6408} {"train_loss": -28.068029403686523, "global_step": 531908, "epoch": 6408} {"train_loss": -27.936176300048828, "global_step": 531909, "epoch": 6408} {"train_loss": -27.736297607421875, "global_step": 531910, "epoch": 6408} {"train_loss": -27.559738159179688, "global_step": 531911, "epoch": 6408} {"train_loss": -27.587127685546875, "global_step": 531912, "epoch": 6408} {"train_loss": -27.669147491455078, "global_step": 531913, "epoch": 6408} {"train_loss": -27.635547637939453, "global_step": 531914, "epoch": 6408} {"train_loss": -27.773996353149414, "global_step": 531915, "epoch": 6408} {"train_loss": -27.408262252807617, "global_step": 531916, "epoch": 6408} {"train_loss": -27.492151260375977, "global_step": 531917, "epoch": 6408} {"train_loss": -27.983295440673828, "global_step": 531918, "epoch": 6408} {"train_loss": -27.846174240112305, "global_step": 531919, "epoch": 6408} {"train_loss": -27.75217056274414, "global_step": 531920, "epoch": 6408} {"train_loss": -27.783761978149414, "global_step": 531921, "epoch": 6408} {"train_loss": -27.906625747680664, "global_step": 531922, "epoch": 6408} {"train_loss": -27.5606632232666, "global_step": 531923, "epoch": 6408} {"train_loss": -27.828886032104492, "global_step": 531924, "epoch": 6408} {"train_loss": -27.673938751220703, "global_step": 531925, "epoch": 6408} {"train_loss": -27.875396728515625, "global_step": 531926, "epoch": 6408} {"train_loss": -27.612817764282227, "global_step": 531927, "epoch": 6408} {"train_loss": -27.43992042541504, "global_step": 531928, "epoch": 6408} {"train_loss": -27.86634635925293, "global_step": 531929, "epoch": 6408} {"train_loss": -27.64613914489746, "global_step": 531930, "epoch": 6408} {"train_loss": -27.551971435546875, "global_step": 531931, "epoch": 6408} {"train_loss": -28.20475196838379, "global_step": 531932, "epoch": 6408} {"train_loss": -27.749357223510742, "global_step": 531933, "epoch": 6408} {"train_loss": -27.815866470336914, "global_step": 531934, "epoch": 6408} {"train_loss": -27.76423454284668, "global_step": 531935, "epoch": 6408} {"train_loss": -27.370697021484375, "global_step": 531936, "epoch": 6408} {"train_loss": -27.53729248046875, "global_step": 531937, "epoch": 6408} {"train_loss": -27.19406509399414, "global_step": 531938, "epoch": 6408} {"train_loss": -27.444482803344727, "global_step": 531939, "epoch": 6408} {"train_loss": -26.938373565673828, "global_step": 531940, "epoch": 6408} {"train_loss": -26.917728424072266, "global_step": 531941, "epoch": 6408} {"train_loss": -27.90824317932129, "global_step": 531942, "epoch": 6408} {"train_loss": -27.85205078125, "global_step": 531943, "epoch": 6408} {"train_loss": -27.257715225219727, "global_step": 531944, "epoch": 6408} {"train_loss": -27.2146053314209, "global_step": 531945, "epoch": 6408} {"train_loss": -27.553514549531133, "global_step": 531946, "epoch": 6408, "val_loss": 6447219.5} {"train_loss": -26.148242950439453, "global_step": 531947, "epoch": 6409} {"train_loss": -26.270742416381836, "global_step": 531948, "epoch": 6409} {"train_loss": -27.379209518432617, "global_step": 531949, "epoch": 6409} {"train_loss": -26.995777130126953, "global_step": 531950, "epoch": 6409} {"train_loss": -27.144617080688477, "global_step": 531951, "epoch": 6409} {"train_loss": -27.330310821533203, "global_step": 531952, "epoch": 6409} {"train_loss": -27.31772804260254, "global_step": 531953, "epoch": 6409} {"train_loss": -26.904041290283203, "global_step": 531954, "epoch": 6409} {"train_loss": -27.421003341674805, "global_step": 531955, "epoch": 6409} {"train_loss": -27.231719970703125, "global_step": 531956, "epoch": 6409} {"train_loss": -27.3211612701416, "global_step": 531957, "epoch": 6409} {"train_loss": -27.164636611938477, "global_step": 531958, "epoch": 6409} {"train_loss": -27.168781280517578, "global_step": 531959, "epoch": 6409} {"train_loss": -27.60371208190918, "global_step": 531960, "epoch": 6409} {"train_loss": -27.43851661682129, "global_step": 531961, "epoch": 6409} {"train_loss": -27.505945205688477, "global_step": 531962, "epoch": 6409} {"train_loss": -27.549631118774414, "global_step": 531963, "epoch": 6409} {"train_loss": -27.3065185546875, "global_step": 531964, "epoch": 6409} {"train_loss": -27.255578994750977, "global_step": 531965, "epoch": 6409} {"train_loss": -26.961490631103516, "global_step": 531966, "epoch": 6409} {"train_loss": -27.4716854095459, "global_step": 531967, "epoch": 6409} {"train_loss": -27.38043212890625, "global_step": 531968, "epoch": 6409} {"train_loss": -27.357501983642578, "global_step": 531969, "epoch": 6409} {"train_loss": -27.46956443786621, "global_step": 531970, "epoch": 6409} {"train_loss": -27.5178279876709, "global_step": 531971, "epoch": 6409} {"train_loss": -27.24967384338379, "global_step": 531972, "epoch": 6409} {"train_loss": -27.385435104370117, "global_step": 531973, "epoch": 6409} {"train_loss": -27.772138595581055, "global_step": 531974, "epoch": 6409} {"train_loss": -27.618549346923828, "global_step": 531975, "epoch": 6409} {"train_loss": -27.97333335876465, "global_step": 531976, "epoch": 6409} {"train_loss": -27.288251876831055, "global_step": 531977, "epoch": 6409} {"train_loss": -28.023046493530273, "global_step": 531978, "epoch": 6409} {"train_loss": -27.535070419311523, "global_step": 531979, "epoch": 6409} {"train_loss": -27.46221351623535, "global_step": 531980, "epoch": 6409} {"train_loss": -27.669052124023438, "global_step": 531981, "epoch": 6409} {"train_loss": -28.054594039916992, "global_step": 531982, "epoch": 6409} {"train_loss": -28.008136749267578, "global_step": 531983, "epoch": 6409} {"train_loss": -27.9321346282959, "global_step": 531984, "epoch": 6409} {"train_loss": -27.674184799194336, "global_step": 531985, "epoch": 6409} {"train_loss": -27.81208610534668, "global_step": 531986, "epoch": 6409} {"train_loss": -27.802270889282227, "global_step": 531987, "epoch": 6409} {"train_loss": -27.73174476623535, "global_step": 531988, "epoch": 6409} {"train_loss": -27.700658798217773, "global_step": 531989, "epoch": 6409} {"train_loss": -27.804601669311523, "global_step": 531990, "epoch": 6409} {"train_loss": -28.019397735595703, "global_step": 531991, "epoch": 6409} {"train_loss": -27.710407257080078, "global_step": 531992, "epoch": 6409} {"train_loss": -27.86798095703125, "global_step": 531993, "epoch": 6409} {"train_loss": -27.672321319580078, "global_step": 531994, "epoch": 6409} {"train_loss": -27.845779418945312, "global_step": 531995, "epoch": 6409} {"train_loss": -27.523712158203125, "global_step": 531996, "epoch": 6409} {"train_loss": -27.517139434814453, "global_step": 531997, "epoch": 6409} {"train_loss": -27.88982582092285, "global_step": 531998, "epoch": 6409} {"train_loss": -27.593769073486328, "global_step": 531999, "epoch": 6409} {"train_loss": -27.515033721923828, "global_step": 532000, "epoch": 6409} {"train_loss": -27.72516441345215, "global_step": 532001, "epoch": 6409} {"train_loss": -27.677783966064453, "global_step": 532002, "epoch": 6409} {"train_loss": -27.487689971923828, "global_step": 532003, "epoch": 6409} {"train_loss": -27.425138473510742, "global_step": 532004, "epoch": 6409} {"train_loss": -27.517292022705078, "global_step": 532005, "epoch": 6409} {"train_loss": -27.6083927154541, "global_step": 532006, "epoch": 6409} {"train_loss": -27.122039794921875, "global_step": 532007, "epoch": 6409} {"train_loss": -27.649372100830078, "global_step": 532008, "epoch": 6409} {"train_loss": -27.62240982055664, "global_step": 532009, "epoch": 6409} {"train_loss": -27.60320472717285, "global_step": 532010, "epoch": 6409} {"train_loss": -27.675094604492188, "global_step": 532011, "epoch": 6409} {"train_loss": -27.814380645751953, "global_step": 532012, "epoch": 6409} {"train_loss": -27.593585968017578, "global_step": 532013, "epoch": 6409} {"train_loss": -27.149200439453125, "global_step": 532014, "epoch": 6409} {"train_loss": -27.488489151000977, "global_step": 532015, "epoch": 6409} {"train_loss": -27.653858184814453, "global_step": 532016, "epoch": 6409} {"train_loss": -27.371051788330078, "global_step": 532017, "epoch": 6409} {"train_loss": -27.393253326416016, "global_step": 532018, "epoch": 6409} {"train_loss": -27.846052169799805, "global_step": 532019, "epoch": 6409} {"train_loss": -27.47222328186035, "global_step": 532020, "epoch": 6409} {"train_loss": -27.62140464782715, "global_step": 532021, "epoch": 6409} {"train_loss": -28.190336227416992, "global_step": 532022, "epoch": 6409} {"train_loss": -27.4522647857666, "global_step": 532023, "epoch": 6409} {"train_loss": -27.58908462524414, "global_step": 532024, "epoch": 6409} {"train_loss": -27.65662956237793, "global_step": 532025, "epoch": 6409} {"train_loss": -27.389020919799805, "global_step": 532026, "epoch": 6409} {"train_loss": -27.536298751831055, "global_step": 532027, "epoch": 6409} {"train_loss": -27.25030517578125, "global_step": 532028, "epoch": 6409} {"train_loss": -27.50896522797734, "global_step": 532029, "epoch": 6409, "val_loss": 6495794.0} {"train_loss": -26.342954635620117, "global_step": 532030, "epoch": 6410} {"train_loss": -27.104949951171875, "global_step": 532031, "epoch": 6410} {"train_loss": -26.123371124267578, "global_step": 532032, "epoch": 6410} {"train_loss": -26.774755477905273, "global_step": 532033, "epoch": 6410} {"train_loss": -26.949399948120117, "global_step": 532034, "epoch": 6410} {"train_loss": -27.064050674438477, "global_step": 532035, "epoch": 6410} {"train_loss": -26.812915802001953, "global_step": 532036, "epoch": 6410} {"train_loss": -26.6960506439209, "global_step": 532037, "epoch": 6410} {"train_loss": -26.707229614257812, "global_step": 532038, "epoch": 6410} {"train_loss": -26.747623443603516, "global_step": 532039, "epoch": 6410} {"train_loss": -26.640613555908203, "global_step": 532040, "epoch": 6410} {"train_loss": -26.988622665405273, "global_step": 532041, "epoch": 6410} {"train_loss": -26.596418380737305, "global_step": 532042, "epoch": 6410} {"train_loss": -26.794401168823242, "global_step": 532043, "epoch": 6410} {"train_loss": -27.135120391845703, "global_step": 532044, "epoch": 6410} {"train_loss": -27.0859432220459, "global_step": 532045, "epoch": 6410} {"train_loss": -26.80890464782715, "global_step": 532046, "epoch": 6410} {"train_loss": -27.279943466186523, "global_step": 532047, "epoch": 6410} {"train_loss": -27.144678115844727, "global_step": 532048, "epoch": 6410} {"train_loss": -27.417205810546875, "global_step": 532049, "epoch": 6410} {"train_loss": -27.196874618530273, "global_step": 532050, "epoch": 6410} {"train_loss": -27.334142684936523, "global_step": 532051, "epoch": 6410} {"train_loss": -27.287734985351562, "global_step": 532052, "epoch": 6410} {"train_loss": -27.056177139282227, "global_step": 532053, "epoch": 6410} {"train_loss": -27.591955184936523, "global_step": 532054, "epoch": 6410} {"train_loss": -27.12546157836914, "global_step": 532055, "epoch": 6410} {"train_loss": -27.363849639892578, "global_step": 532056, "epoch": 6410} {"train_loss": -27.056686401367188, "global_step": 532057, "epoch": 6410} {"train_loss": -27.572179794311523, "global_step": 532058, "epoch": 6410} {"train_loss": -27.178098678588867, "global_step": 532059, "epoch": 6410} {"train_loss": -27.713186264038086, "global_step": 532060, "epoch": 6410} {"train_loss": -27.493762969970703, "global_step": 532061, "epoch": 6410} {"train_loss": -27.643360137939453, "global_step": 532062, "epoch": 6410} {"train_loss": -27.322311401367188, "global_step": 532063, "epoch": 6410} {"train_loss": -27.502954483032227, "global_step": 532064, "epoch": 6410} {"train_loss": -27.5865421295166, "global_step": 532065, "epoch": 6410} {"train_loss": -27.475141525268555, "global_step": 532066, "epoch": 6410} {"train_loss": -27.689062118530273, "global_step": 532067, "epoch": 6410} {"train_loss": -27.599206924438477, "global_step": 532068, "epoch": 6410} {"train_loss": -27.55439567565918, "global_step": 532069, "epoch": 6410} {"train_loss": -27.53773307800293, "global_step": 532070, "epoch": 6410} {"train_loss": -27.11517333984375, "global_step": 532071, "epoch": 6410} {"train_loss": -27.360422134399414, "global_step": 532072, "epoch": 6410} {"train_loss": -27.627904891967773, "global_step": 532073, "epoch": 6410} {"train_loss": -27.504491806030273, "global_step": 532074, "epoch": 6410} {"train_loss": -27.62166404724121, "global_step": 532075, "epoch": 6410} {"train_loss": -28.039823532104492, "global_step": 532076, "epoch": 6410} {"train_loss": -27.81593132019043, "global_step": 532077, "epoch": 6410} {"train_loss": -27.849105834960938, "global_step": 532078, "epoch": 6410} {"train_loss": -27.4151554107666, "global_step": 532079, "epoch": 6410} {"train_loss": -27.875097274780273, "global_step": 532080, "epoch": 6410} {"train_loss": -27.570709228515625, "global_step": 532081, "epoch": 6410} {"train_loss": -27.78093910217285, "global_step": 532082, "epoch": 6410} {"train_loss": -27.85422706604004, "global_step": 532083, "epoch": 6410} {"train_loss": -27.79239845275879, "global_step": 532084, "epoch": 6410} {"train_loss": -27.861291885375977, "global_step": 532085, "epoch": 6410} {"train_loss": -27.87403678894043, "global_step": 532086, "epoch": 6410} {"train_loss": -27.5718994140625, "global_step": 532087, "epoch": 6410} {"train_loss": -27.738927841186523, "global_step": 532088, "epoch": 6410} {"train_loss": -27.636159896850586, "global_step": 532089, "epoch": 6410} {"train_loss": -27.64339256286621, "global_step": 532090, "epoch": 6410} {"train_loss": -26.730451583862305, "global_step": 532091, "epoch": 6410} {"train_loss": -27.103931427001953, "global_step": 532092, "epoch": 6410} {"train_loss": -26.842823028564453, "global_step": 532093, "epoch": 6410} {"train_loss": -27.5468692779541, "global_step": 532094, "epoch": 6410} {"train_loss": -27.886991500854492, "global_step": 532095, "epoch": 6410} {"train_loss": -27.09002113342285, "global_step": 532096, "epoch": 6410} {"train_loss": -27.768644332885742, "global_step": 532097, "epoch": 6410} {"train_loss": -27.326889038085938, "global_step": 532098, "epoch": 6410} {"train_loss": -27.51905632019043, "global_step": 532099, "epoch": 6410} {"train_loss": -27.55805015563965, "global_step": 532100, "epoch": 6410} {"train_loss": -27.274816513061523, "global_step": 532101, "epoch": 6410} {"train_loss": -27.252172470092773, "global_step": 532102, "epoch": 6410} {"train_loss": -27.652191162109375, "global_step": 532103, "epoch": 6410} {"train_loss": -27.705854415893555, "global_step": 532104, "epoch": 6410} {"train_loss": -27.357690811157227, "global_step": 532105, "epoch": 6410} {"train_loss": -27.604429244995117, "global_step": 532106, "epoch": 6410} {"train_loss": -27.417804718017578, "global_step": 532107, "epoch": 6410} {"train_loss": -28.20611000061035, "global_step": 532108, "epoch": 6410} {"train_loss": -27.454198837280273, "global_step": 532109, "epoch": 6410} {"train_loss": -27.619977951049805, "global_step": 532110, "epoch": 6410} {"train_loss": -27.157712936401367, "global_step": 532111, "epoch": 6410} {"train_loss": -27.3431820467294, "global_step": 532112, "epoch": 6410, "val_loss": 6424739.0} {"train_loss": -27.18586540222168, "global_step": 532113, "epoch": 6411} {"train_loss": -27.077972412109375, "global_step": 532114, "epoch": 6411} {"train_loss": -27.337156295776367, "global_step": 532115, "epoch": 6411} {"train_loss": -27.153608322143555, "global_step": 532116, "epoch": 6411} {"train_loss": -27.072803497314453, "global_step": 532117, "epoch": 6411} {"train_loss": -27.063053131103516, "global_step": 532118, "epoch": 6411} {"train_loss": -27.302215576171875, "global_step": 532119, "epoch": 6411} {"train_loss": -27.109710693359375, "global_step": 532120, "epoch": 6411} {"train_loss": -26.76611328125, "global_step": 532121, "epoch": 6411} {"train_loss": -26.905139923095703, "global_step": 532122, "epoch": 6411} {"train_loss": -27.649999618530273, "global_step": 532123, "epoch": 6411} {"train_loss": -27.346975326538086, "global_step": 532124, "epoch": 6411} {"train_loss": -27.554306030273438, "global_step": 532125, "epoch": 6411} {"train_loss": -27.435333251953125, "global_step": 532126, "epoch": 6411} {"train_loss": -27.068267822265625, "global_step": 532127, "epoch": 6411} {"train_loss": -27.303293228149414, "global_step": 532128, "epoch": 6411} {"train_loss": -27.330713272094727, "global_step": 532129, "epoch": 6411} {"train_loss": -27.483198165893555, "global_step": 532130, "epoch": 6411} {"train_loss": -27.300434112548828, "global_step": 532131, "epoch": 6411} {"train_loss": -27.452062606811523, "global_step": 532132, "epoch": 6411} {"train_loss": -27.4371337890625, "global_step": 532133, "epoch": 6411} {"train_loss": -27.74375343322754, "global_step": 532134, "epoch": 6411} {"train_loss": -27.72067642211914, "global_step": 532135, "epoch": 6411} {"train_loss": -27.1739444732666, "global_step": 532136, "epoch": 6411} {"train_loss": -27.934228897094727, "global_step": 532137, "epoch": 6411} {"train_loss": -27.87147331237793, "global_step": 532138, "epoch": 6411} {"train_loss": -27.728424072265625, "global_step": 532139, "epoch": 6411} {"train_loss": -27.58103370666504, "global_step": 532140, "epoch": 6411} {"train_loss": -27.747648239135742, "global_step": 532141, "epoch": 6411} {"train_loss": -27.81039810180664, "global_step": 532142, "epoch": 6411} {"train_loss": -27.932209014892578, "global_step": 532143, "epoch": 6411} {"train_loss": -27.41523551940918, "global_step": 532144, "epoch": 6411} {"train_loss": -27.70869255065918, "global_step": 532145, "epoch": 6411} {"train_loss": -27.3411808013916, "global_step": 532146, "epoch": 6411} {"train_loss": -27.95159339904785, "global_step": 532147, "epoch": 6411} {"train_loss": -27.572153091430664, "global_step": 532148, "epoch": 6411} {"train_loss": -27.86734962463379, "global_step": 532149, "epoch": 6411} {"train_loss": -27.882123947143555, "global_step": 532150, "epoch": 6411} {"train_loss": -27.735136032104492, "global_step": 532151, "epoch": 6411} {"train_loss": -27.825729370117188, "global_step": 532152, "epoch": 6411} {"train_loss": -27.66729164123535, "global_step": 532153, "epoch": 6411} {"train_loss": -28.17420768737793, "global_step": 532154, "epoch": 6411} {"train_loss": -27.9453125, "global_step": 532155, "epoch": 6411} {"train_loss": -27.555795669555664, "global_step": 532156, "epoch": 6411} {"train_loss": -27.86700439453125, "global_step": 532157, "epoch": 6411} {"train_loss": -27.57156753540039, "global_step": 532158, "epoch": 6411} {"train_loss": -27.521575927734375, "global_step": 532159, "epoch": 6411} {"train_loss": -27.8627986907959, "global_step": 532160, "epoch": 6411} {"train_loss": -27.630544662475586, "global_step": 532161, "epoch": 6411} {"train_loss": -27.6964168548584, "global_step": 532162, "epoch": 6411} {"train_loss": -27.858551025390625, "global_step": 532163, "epoch": 6411} {"train_loss": -27.70379066467285, "global_step": 532164, "epoch": 6411} {"train_loss": -27.758441925048828, "global_step": 532165, "epoch": 6411} {"train_loss": -27.853422164916992, "global_step": 532166, "epoch": 6411} {"train_loss": -27.522192001342773, "global_step": 532167, "epoch": 6411} {"train_loss": -26.644351959228516, "global_step": 532168, "epoch": 6411} {"train_loss": -26.838977813720703, "global_step": 532169, "epoch": 6411} {"train_loss": -27.296497344970703, "global_step": 532170, "epoch": 6411} {"train_loss": -27.432758331298828, "global_step": 532171, "epoch": 6411} {"train_loss": -26.77773094177246, "global_step": 532172, "epoch": 6411} {"train_loss": -27.243377685546875, "global_step": 532173, "epoch": 6411} {"train_loss": -27.30781364440918, "global_step": 532174, "epoch": 6411} {"train_loss": -27.196889877319336, "global_step": 532175, "epoch": 6411} {"train_loss": -27.156787872314453, "global_step": 532176, "epoch": 6411} {"train_loss": -27.694982528686523, "global_step": 532177, "epoch": 6411} {"train_loss": -27.6346492767334, "global_step": 532178, "epoch": 6411} {"train_loss": -27.359546661376953, "global_step": 532179, "epoch": 6411} {"train_loss": -27.626379013061523, "global_step": 532180, "epoch": 6411} {"train_loss": -27.476856231689453, "global_step": 532181, "epoch": 6411} {"train_loss": -27.34647560119629, "global_step": 532182, "epoch": 6411} {"train_loss": -27.79831314086914, "global_step": 532183, "epoch": 6411} {"train_loss": -27.418350219726562, "global_step": 532184, "epoch": 6411} {"train_loss": -27.664011001586914, "global_step": 532185, "epoch": 6411} {"train_loss": -27.602920532226562, "global_step": 532186, "epoch": 6411} {"train_loss": -27.486541748046875, "global_step": 532187, "epoch": 6411} {"train_loss": -27.720325469970703, "global_step": 532188, "epoch": 6411} {"train_loss": -27.47003173828125, "global_step": 532189, "epoch": 6411} {"train_loss": -27.342105865478516, "global_step": 532190, "epoch": 6411} {"train_loss": -27.4208927154541, "global_step": 532191, "epoch": 6411} {"train_loss": -27.479822158813477, "global_step": 532192, "epoch": 6411} {"train_loss": -27.5097713470459, "global_step": 532193, "epoch": 6411} {"train_loss": -27.499414443969727, "global_step": 532194, "epoch": 6411} {"train_loss": -27.501577813941314, "global_step": 532195, "epoch": 6411, "val_loss": 6488593.0} {"train_loss": -27.221765518188477, "global_step": 532196, "epoch": 6412} {"train_loss": -27.359851837158203, "global_step": 532197, "epoch": 6412} {"train_loss": -27.334537506103516, "global_step": 532198, "epoch": 6412} {"train_loss": -27.23111915588379, "global_step": 532199, "epoch": 6412} {"train_loss": -27.098800659179688, "global_step": 532200, "epoch": 6412} {"train_loss": -27.332265853881836, "global_step": 532201, "epoch": 6412} {"train_loss": -27.154748916625977, "global_step": 532202, "epoch": 6412} {"train_loss": -27.400415420532227, "global_step": 532203, "epoch": 6412} {"train_loss": -27.393232345581055, "global_step": 532204, "epoch": 6412} {"train_loss": -27.295642852783203, "global_step": 532205, "epoch": 6412} {"train_loss": -27.419452667236328, "global_step": 532206, "epoch": 6412} {"train_loss": -27.127843856811523, "global_step": 532207, "epoch": 6412} {"train_loss": -27.54304313659668, "global_step": 532208, "epoch": 6412} {"train_loss": -27.11441993713379, "global_step": 532209, "epoch": 6412} {"train_loss": -27.10611915588379, "global_step": 532210, "epoch": 6412} {"train_loss": -27.3072566986084, "global_step": 532211, "epoch": 6412} {"train_loss": -27.091299057006836, "global_step": 532212, "epoch": 6412} {"train_loss": -27.431018829345703, "global_step": 532213, "epoch": 6412} {"train_loss": -27.52425193786621, "global_step": 532214, "epoch": 6412} {"train_loss": -27.44059181213379, "global_step": 532215, "epoch": 6412} {"train_loss": -27.80034828186035, "global_step": 532216, "epoch": 6412} {"train_loss": -27.760278701782227, "global_step": 532217, "epoch": 6412} {"train_loss": -27.723363876342773, "global_step": 532218, "epoch": 6412} {"train_loss": -27.526594161987305, "global_step": 532219, "epoch": 6412} {"train_loss": -27.592514038085938, "global_step": 532220, "epoch": 6412} {"train_loss": -27.585020065307617, "global_step": 532221, "epoch": 6412} {"train_loss": -27.496734619140625, "global_step": 532222, "epoch": 6412} {"train_loss": -27.547765731811523, "global_step": 532223, "epoch": 6412} {"train_loss": -27.860708236694336, "global_step": 532224, "epoch": 6412} {"train_loss": -27.419879913330078, "global_step": 532225, "epoch": 6412} {"train_loss": -27.6464786529541, "global_step": 532226, "epoch": 6412} {"train_loss": -27.55425453186035, "global_step": 532227, "epoch": 6412} {"train_loss": -27.689661026000977, "global_step": 532228, "epoch": 6412} {"train_loss": -26.966882705688477, "global_step": 532229, "epoch": 6412} {"train_loss": -27.12489891052246, "global_step": 532230, "epoch": 6412} {"train_loss": -26.793777465820312, "global_step": 532231, "epoch": 6412} {"train_loss": -27.826868057250977, "global_step": 532232, "epoch": 6412} {"train_loss": -27.94769287109375, "global_step": 532233, "epoch": 6412} {"train_loss": -27.192001342773438, "global_step": 532234, "epoch": 6412} {"train_loss": -26.903766632080078, "global_step": 532235, "epoch": 6412} {"train_loss": -27.573932647705078, "global_step": 532236, "epoch": 6412} {"train_loss": -27.847455978393555, "global_step": 532237, "epoch": 6412} {"train_loss": -27.36577796936035, "global_step": 532238, "epoch": 6412} {"train_loss": -27.659839630126953, "global_step": 532239, "epoch": 6412} {"train_loss": -27.440662384033203, "global_step": 532240, "epoch": 6412} {"train_loss": -27.318674087524414, "global_step": 532241, "epoch": 6412} {"train_loss": -27.660547256469727, "global_step": 532242, "epoch": 6412} {"train_loss": -27.552459716796875, "global_step": 532243, "epoch": 6412} {"train_loss": -27.74188232421875, "global_step": 532244, "epoch": 6412} {"train_loss": -27.56867027282715, "global_step": 532245, "epoch": 6412} {"train_loss": -27.83184242248535, "global_step": 532246, "epoch": 6412} {"train_loss": -27.449411392211914, "global_step": 532247, "epoch": 6412} {"train_loss": -27.708587646484375, "global_step": 532248, "epoch": 6412} {"train_loss": -27.433645248413086, "global_step": 532249, "epoch": 6412} {"train_loss": -27.395055770874023, "global_step": 532250, "epoch": 6412} {"train_loss": -27.439672470092773, "global_step": 532251, "epoch": 6412} {"train_loss": -27.859283447265625, "global_step": 532252, "epoch": 6412} {"train_loss": -27.714618682861328, "global_step": 532253, "epoch": 6412} {"train_loss": -27.978546142578125, "global_step": 532254, "epoch": 6412} {"train_loss": -27.739089965820312, "global_step": 532255, "epoch": 6412} {"train_loss": -27.746875762939453, "global_step": 532256, "epoch": 6412} {"train_loss": -27.892242431640625, "global_step": 532257, "epoch": 6412} {"train_loss": -27.7819881439209, "global_step": 532258, "epoch": 6412} {"train_loss": -27.409940719604492, "global_step": 532259, "epoch": 6412} {"train_loss": -28.077301025390625, "global_step": 532260, "epoch": 6412} {"train_loss": -27.842670440673828, "global_step": 532261, "epoch": 6412} {"train_loss": -27.904504776000977, "global_step": 532262, "epoch": 6412} {"train_loss": -27.6252384185791, "global_step": 532263, "epoch": 6412} {"train_loss": -27.087690353393555, "global_step": 532264, "epoch": 6412} {"train_loss": -27.272024154663086, "global_step": 532265, "epoch": 6412} {"train_loss": -27.34808349609375, "global_step": 532266, "epoch": 6412} {"train_loss": -27.622055053710938, "global_step": 532267, "epoch": 6412} {"train_loss": -27.467496871948242, "global_step": 532268, "epoch": 6412} {"train_loss": -27.63197898864746, "global_step": 532269, "epoch": 6412} {"train_loss": -28.12782096862793, "global_step": 532270, "epoch": 6412} {"train_loss": -27.70729637145996, "global_step": 532271, "epoch": 6412} {"train_loss": -27.625818252563477, "global_step": 532272, "epoch": 6412} {"train_loss": -27.968032836914062, "global_step": 532273, "epoch": 6412} {"train_loss": -27.897607803344727, "global_step": 532274, "epoch": 6412} {"train_loss": -27.76936912536621, "global_step": 532275, "epoch": 6412} {"train_loss": -27.726154327392578, "global_step": 532276, "epoch": 6412} {"train_loss": -27.894500732421875, "global_step": 532277, "epoch": 6412} {"train_loss": -27.544387541621564, "global_step": 532278, "epoch": 6412, "val_loss": 6547653.0} {"train_loss": -27.108585357666016, "global_step": 532279, "epoch": 6413} {"train_loss": -27.0583438873291, "global_step": 532280, "epoch": 6413} {"train_loss": -27.01079750061035, "global_step": 532281, "epoch": 6413} {"train_loss": -26.96013832092285, "global_step": 532282, "epoch": 6413} {"train_loss": -26.663740158081055, "global_step": 532283, "epoch": 6413} {"train_loss": -26.974878311157227, "global_step": 532284, "epoch": 6413} {"train_loss": -27.49281883239746, "global_step": 532285, "epoch": 6413} {"train_loss": -26.978002548217773, "global_step": 532286, "epoch": 6413} {"train_loss": -27.275909423828125, "global_step": 532287, "epoch": 6413} {"train_loss": -27.27161979675293, "global_step": 532288, "epoch": 6413} {"train_loss": -27.381742477416992, "global_step": 532289, "epoch": 6413} {"train_loss": -27.314167022705078, "global_step": 532290, "epoch": 6413} {"train_loss": -27.505659103393555, "global_step": 532291, "epoch": 6413} {"train_loss": -26.734363555908203, "global_step": 532292, "epoch": 6413} {"train_loss": -27.128509521484375, "global_step": 532293, "epoch": 6413} {"train_loss": -27.41658592224121, "global_step": 532294, "epoch": 6413} {"train_loss": -27.35736083984375, "global_step": 532295, "epoch": 6413} {"train_loss": -27.17696189880371, "global_step": 532296, "epoch": 6413} {"train_loss": -27.64167594909668, "global_step": 532297, "epoch": 6413} {"train_loss": -27.74713134765625, "global_step": 532298, "epoch": 6413} {"train_loss": -27.894498825073242, "global_step": 532299, "epoch": 6413} {"train_loss": -27.549774169921875, "global_step": 532300, "epoch": 6413} {"train_loss": -27.871850967407227, "global_step": 532301, "epoch": 6413} {"train_loss": -27.64542579650879, "global_step": 532302, "epoch": 6413} {"train_loss": -27.846288681030273, "global_step": 532303, "epoch": 6413} {"train_loss": -27.40252685546875, "global_step": 532304, "epoch": 6413} {"train_loss": -27.63876724243164, "global_step": 532305, "epoch": 6413} {"train_loss": -27.37396812438965, "global_step": 532306, "epoch": 6413} {"train_loss": -27.528812408447266, "global_step": 532307, "epoch": 6413} {"train_loss": -27.42474365234375, "global_step": 532308, "epoch": 6413} {"train_loss": -27.548913955688477, "global_step": 532309, "epoch": 6413} {"train_loss": -27.4266357421875, "global_step": 532310, "epoch": 6413} {"train_loss": -27.458053588867188, "global_step": 532311, "epoch": 6413} {"train_loss": -27.55421257019043, "global_step": 532312, "epoch": 6413} {"train_loss": -27.7813777923584, "global_step": 532313, "epoch": 6413} {"train_loss": -27.59027671813965, "global_step": 532314, "epoch": 6413} {"train_loss": -27.90126609802246, "global_step": 532315, "epoch": 6413} {"train_loss": -27.748327255249023, "global_step": 532316, "epoch": 6413} {"train_loss": -27.828832626342773, "global_step": 532317, "epoch": 6413} {"train_loss": -28.112146377563477, "global_step": 532318, "epoch": 6413} {"train_loss": -27.281946182250977, "global_step": 532319, "epoch": 6413} {"train_loss": -27.310321807861328, "global_step": 532320, "epoch": 6413} {"train_loss": -27.856552124023438, "global_step": 532321, "epoch": 6413} {"train_loss": -27.903165817260742, "global_step": 532322, "epoch": 6413} {"train_loss": -27.601398468017578, "global_step": 532323, "epoch": 6413} {"train_loss": -27.452123641967773, "global_step": 532324, "epoch": 6413} {"train_loss": -26.994577407836914, "global_step": 532325, "epoch": 6413} {"train_loss": -27.123884201049805, "global_step": 532326, "epoch": 6413} {"train_loss": -27.46125602722168, "global_step": 532327, "epoch": 6413} {"train_loss": -27.347427368164062, "global_step": 532328, "epoch": 6413} {"train_loss": -27.25861930847168, "global_step": 532329, "epoch": 6413} {"train_loss": -27.50010108947754, "global_step": 532330, "epoch": 6413} {"train_loss": -27.73468017578125, "global_step": 532331, "epoch": 6413} {"train_loss": -27.396228790283203, "global_step": 532332, "epoch": 6413} {"train_loss": -27.380048751831055, "global_step": 532333, "epoch": 6413} {"train_loss": -27.957563400268555, "global_step": 532334, "epoch": 6413} {"train_loss": -27.528400421142578, "global_step": 532335, "epoch": 6413} {"train_loss": -27.8439884185791, "global_step": 532336, "epoch": 6413} {"train_loss": -27.882749557495117, "global_step": 532337, "epoch": 6413} {"train_loss": -27.487060546875, "global_step": 532338, "epoch": 6413} {"train_loss": -27.803586959838867, "global_step": 532339, "epoch": 6413} {"train_loss": -27.572052001953125, "global_step": 532340, "epoch": 6413} {"train_loss": -27.296051025390625, "global_step": 532341, "epoch": 6413} {"train_loss": -28.0268497467041, "global_step": 532342, "epoch": 6413} {"train_loss": -27.713285446166992, "global_step": 532343, "epoch": 6413} {"train_loss": -27.783740997314453, "global_step": 532344, "epoch": 6413} {"train_loss": -27.741947174072266, "global_step": 532345, "epoch": 6413} {"train_loss": -27.476287841796875, "global_step": 532346, "epoch": 6413} {"train_loss": -27.958698272705078, "global_step": 532347, "epoch": 6413} {"train_loss": -27.941884994506836, "global_step": 532348, "epoch": 6413} {"train_loss": -28.055688858032227, "global_step": 532349, "epoch": 6413} {"train_loss": -27.853750228881836, "global_step": 532350, "epoch": 6413} {"train_loss": -27.445432662963867, "global_step": 532351, "epoch": 6413} {"train_loss": -26.629663467407227, "global_step": 532352, "epoch": 6413} {"train_loss": -26.437299728393555, "global_step": 532353, "epoch": 6413} {"train_loss": -26.83342933654785, "global_step": 532354, "epoch": 6413} {"train_loss": -27.14175796508789, "global_step": 532355, "epoch": 6413} {"train_loss": -27.291067123413086, "global_step": 532356, "epoch": 6413} {"train_loss": -26.460554122924805, "global_step": 532357, "epoch": 6413} {"train_loss": -27.448266983032227, "global_step": 532358, "epoch": 6413} {"train_loss": -27.30084800720215, "global_step": 532359, "epoch": 6413} {"train_loss": -27.023456573486328, "global_step": 532360, "epoch": 6413} {"train_loss": -27.439558258975843, "global_step": 532361, "epoch": 6413, "val_loss": 6575761.5} {"train_loss": -26.59688377380371, "global_step": 532362, "epoch": 6414} {"train_loss": -26.688159942626953, "global_step": 532363, "epoch": 6414} {"train_loss": -27.144468307495117, "global_step": 532364, "epoch": 6414} {"train_loss": -26.856077194213867, "global_step": 532365, "epoch": 6414} {"train_loss": -26.89592933654785, "global_step": 532366, "epoch": 6414} {"train_loss": -26.905426025390625, "global_step": 532367, "epoch": 6414} {"train_loss": -27.5250244140625, "global_step": 532368, "epoch": 6414} {"train_loss": -26.869672775268555, "global_step": 532369, "epoch": 6414} {"train_loss": -27.261640548706055, "global_step": 532370, "epoch": 6414} {"train_loss": -27.203052520751953, "global_step": 532371, "epoch": 6414} {"train_loss": -26.9468936920166, "global_step": 532372, "epoch": 6414} {"train_loss": -27.244873046875, "global_step": 532373, "epoch": 6414} {"train_loss": -27.348478317260742, "global_step": 532374, "epoch": 6414} {"train_loss": -27.470916748046875, "global_step": 532375, "epoch": 6414} {"train_loss": -27.476642608642578, "global_step": 532376, "epoch": 6414} {"train_loss": -27.096460342407227, "global_step": 532377, "epoch": 6414} {"train_loss": -27.4449520111084, "global_step": 532378, "epoch": 6414} {"train_loss": -27.3660945892334, "global_step": 532379, "epoch": 6414} {"train_loss": -27.284088134765625, "global_step": 532380, "epoch": 6414} {"train_loss": -27.369287490844727, "global_step": 532381, "epoch": 6414} {"train_loss": -27.55243492126465, "global_step": 532382, "epoch": 6414} {"train_loss": -27.711469650268555, "global_step": 532383, "epoch": 6414} {"train_loss": -27.563207626342773, "global_step": 532384, "epoch": 6414} {"train_loss": -27.3862247467041, "global_step": 532385, "epoch": 6414} {"train_loss": -27.879369735717773, "global_step": 532386, "epoch": 6414} {"train_loss": -27.745786666870117, "global_step": 532387, "epoch": 6414} {"train_loss": -27.447790145874023, "global_step": 532388, "epoch": 6414} {"train_loss": -27.4521427154541, "global_step": 532389, "epoch": 6414} {"train_loss": -27.44086265563965, "global_step": 532390, "epoch": 6414} {"train_loss": -27.854787826538086, "global_step": 532391, "epoch": 6414} {"train_loss": -27.76565933227539, "global_step": 532392, "epoch": 6414} {"train_loss": -28.006561279296875, "global_step": 532393, "epoch": 6414} {"train_loss": -27.8112735748291, "global_step": 532394, "epoch": 6414} {"train_loss": -27.875732421875, "global_step": 532395, "epoch": 6414} {"train_loss": -28.0918025970459, "global_step": 532396, "epoch": 6414} {"train_loss": -27.822357177734375, "global_step": 532397, "epoch": 6414} {"train_loss": -27.240140914916992, "global_step": 532398, "epoch": 6414} {"train_loss": -27.627553939819336, "global_step": 532399, "epoch": 6414} {"train_loss": -27.5283145904541, "global_step": 532400, "epoch": 6414} {"train_loss": -27.572473526000977, "global_step": 532401, "epoch": 6414} {"train_loss": -28.183307647705078, "global_step": 532402, "epoch": 6414} {"train_loss": -27.818359375, "global_step": 532403, "epoch": 6414} {"train_loss": -27.474609375, "global_step": 532404, "epoch": 6414} {"train_loss": -27.58479118347168, "global_step": 532405, "epoch": 6414} {"train_loss": -27.273462295532227, "global_step": 532406, "epoch": 6414} {"train_loss": -28.05206871032715, "global_step": 532407, "epoch": 6414} {"train_loss": -27.434003829956055, "global_step": 532408, "epoch": 6414} {"train_loss": -27.465925216674805, "global_step": 532409, "epoch": 6414} {"train_loss": -28.03273582458496, "global_step": 532410, "epoch": 6414} {"train_loss": -27.520587921142578, "global_step": 532411, "epoch": 6414} {"train_loss": -27.980710983276367, "global_step": 532412, "epoch": 6414} {"train_loss": -27.569334030151367, "global_step": 532413, "epoch": 6414} {"train_loss": -27.803136825561523, "global_step": 532414, "epoch": 6414} {"train_loss": -27.871957778930664, "global_step": 532415, "epoch": 6414} {"train_loss": -27.899641036987305, "global_step": 532416, "epoch": 6414} {"train_loss": -27.67774772644043, "global_step": 532417, "epoch": 6414} {"train_loss": -27.83746910095215, "global_step": 532418, "epoch": 6414} {"train_loss": -27.61614418029785, "global_step": 532419, "epoch": 6414} {"train_loss": -27.493427276611328, "global_step": 532420, "epoch": 6414} {"train_loss": -27.172271728515625, "global_step": 532421, "epoch": 6414} {"train_loss": -27.169849395751953, "global_step": 532422, "epoch": 6414} {"train_loss": -27.989240646362305, "global_step": 532423, "epoch": 6414} {"train_loss": -27.33802604675293, "global_step": 532424, "epoch": 6414} {"train_loss": -27.718082427978516, "global_step": 532425, "epoch": 6414} {"train_loss": -28.048017501831055, "global_step": 532426, "epoch": 6414} {"train_loss": -27.74171257019043, "global_step": 532427, "epoch": 6414} {"train_loss": -27.3535099029541, "global_step": 532428, "epoch": 6414} {"train_loss": -28.087818145751953, "global_step": 532429, "epoch": 6414} {"train_loss": -27.539499282836914, "global_step": 532430, "epoch": 6414} {"train_loss": -27.284107208251953, "global_step": 532431, "epoch": 6414} {"train_loss": -28.04180908203125, "global_step": 532432, "epoch": 6414} {"train_loss": -27.19146156311035, "global_step": 532433, "epoch": 6414} {"train_loss": -27.243438720703125, "global_step": 532434, "epoch": 6414} {"train_loss": -26.725910186767578, "global_step": 532435, "epoch": 6414} {"train_loss": -27.697772979736328, "global_step": 532436, "epoch": 6414} {"train_loss": -27.445388793945312, "global_step": 532437, "epoch": 6414} {"train_loss": -27.940221786499023, "global_step": 532438, "epoch": 6414} {"train_loss": -27.5780086517334, "global_step": 532439, "epoch": 6414} {"train_loss": -27.570449829101562, "global_step": 532440, "epoch": 6414} {"train_loss": -27.724716186523438, "global_step": 532441, "epoch": 6414} {"train_loss": -27.55991554260254, "global_step": 532442, "epoch": 6414} {"train_loss": -27.71784019470215, "global_step": 532443, "epoch": 6414} {"train_loss": -27.52462364104857, "global_step": 532444, "epoch": 6414, "val_loss": 6592328.0} {"train_loss": -27.456823348999023, "global_step": 532445, "epoch": 6415} {"train_loss": -26.629453659057617, "global_step": 532446, "epoch": 6415} {"train_loss": -26.53788185119629, "global_step": 532447, "epoch": 6415} {"train_loss": -26.63018226623535, "global_step": 532448, "epoch": 6415} {"train_loss": -26.494037628173828, "global_step": 532449, "epoch": 6415} {"train_loss": -26.916996002197266, "global_step": 532450, "epoch": 6415} {"train_loss": -25.834646224975586, "global_step": 532451, "epoch": 6415} {"train_loss": -26.418447494506836, "global_step": 532452, "epoch": 6415} {"train_loss": -26.79725456237793, "global_step": 532453, "epoch": 6415} {"train_loss": -26.723785400390625, "global_step": 532454, "epoch": 6415} {"train_loss": -26.497770309448242, "global_step": 532455, "epoch": 6415} {"train_loss": -27.307483673095703, "global_step": 532456, "epoch": 6415} {"train_loss": -26.570287704467773, "global_step": 532457, "epoch": 6415} {"train_loss": -27.234619140625, "global_step": 532458, "epoch": 6415} {"train_loss": -26.748212814331055, "global_step": 532459, "epoch": 6415} {"train_loss": -26.967853546142578, "global_step": 532460, "epoch": 6415} {"train_loss": -26.867151260375977, "global_step": 532461, "epoch": 6415} {"train_loss": -27.20833396911621, "global_step": 532462, "epoch": 6415} {"train_loss": -26.945096969604492, "global_step": 532463, "epoch": 6415} {"train_loss": -27.064807891845703, "global_step": 532464, "epoch": 6415} {"train_loss": -27.1971435546875, "global_step": 532465, "epoch": 6415} {"train_loss": -26.742780685424805, "global_step": 532466, "epoch": 6415} {"train_loss": -27.164785385131836, "global_step": 532467, "epoch": 6415} {"train_loss": -26.933883666992188, "global_step": 532468, "epoch": 6415} {"train_loss": -26.995691299438477, "global_step": 532469, "epoch": 6415} {"train_loss": -27.362516403198242, "global_step": 532470, "epoch": 6415} {"train_loss": -27.286518096923828, "global_step": 532471, "epoch": 6415} {"train_loss": -27.164108276367188, "global_step": 532472, "epoch": 6415} {"train_loss": -27.725431442260742, "global_step": 532473, "epoch": 6415} {"train_loss": -27.467390060424805, "global_step": 532474, "epoch": 6415} {"train_loss": -27.30137062072754, "global_step": 532475, "epoch": 6415} {"train_loss": -27.271717071533203, "global_step": 532476, "epoch": 6415} {"train_loss": -27.313745498657227, "global_step": 532477, "epoch": 6415} {"train_loss": -27.611530303955078, "global_step": 532478, "epoch": 6415} {"train_loss": -27.35126304626465, "global_step": 532479, "epoch": 6415} {"train_loss": -27.486242294311523, "global_step": 532480, "epoch": 6415} {"train_loss": -27.547595977783203, "global_step": 532481, "epoch": 6415} {"train_loss": -27.817768096923828, "global_step": 532482, "epoch": 6415} {"train_loss": -27.41619873046875, "global_step": 532483, "epoch": 6415} {"train_loss": -27.08847999572754, "global_step": 532484, "epoch": 6415} {"train_loss": -27.84003257751465, "global_step": 532485, "epoch": 6415} {"train_loss": -27.20094871520996, "global_step": 532486, "epoch": 6415} {"train_loss": -27.71613121032715, "global_step": 532487, "epoch": 6415} {"train_loss": -27.723529815673828, "global_step": 532488, "epoch": 6415} {"train_loss": -27.44170570373535, "global_step": 532489, "epoch": 6415} {"train_loss": -27.582738876342773, "global_step": 532490, "epoch": 6415} {"train_loss": -27.607812881469727, "global_step": 532491, "epoch": 6415} {"train_loss": -27.394092559814453, "global_step": 532492, "epoch": 6415} {"train_loss": -27.667621612548828, "global_step": 532493, "epoch": 6415} {"train_loss": -27.60761070251465, "global_step": 532494, "epoch": 6415} {"train_loss": -27.667631149291992, "global_step": 532495, "epoch": 6415} {"train_loss": -27.834827423095703, "global_step": 532496, "epoch": 6415} {"train_loss": -27.56204605102539, "global_step": 532497, "epoch": 6415} {"train_loss": -27.50288200378418, "global_step": 532498, "epoch": 6415} {"train_loss": -27.67164421081543, "global_step": 532499, "epoch": 6415} {"train_loss": -27.960803985595703, "global_step": 532500, "epoch": 6415} {"train_loss": -27.89057731628418, "global_step": 532501, "epoch": 6415} {"train_loss": -27.639495849609375, "global_step": 532502, "epoch": 6415} {"train_loss": -27.521345138549805, "global_step": 532503, "epoch": 6415} {"train_loss": -27.425321578979492, "global_step": 532504, "epoch": 6415} {"train_loss": -27.811262130737305, "global_step": 532505, "epoch": 6415} {"train_loss": -27.92936134338379, "global_step": 532506, "epoch": 6415} {"train_loss": -27.991321563720703, "global_step": 532507, "epoch": 6415} {"train_loss": -27.931903839111328, "global_step": 532508, "epoch": 6415} {"train_loss": -27.845312118530273, "global_step": 532509, "epoch": 6415} {"train_loss": -27.33908462524414, "global_step": 532510, "epoch": 6415} {"train_loss": -27.661054611206055, "global_step": 532511, "epoch": 6415} {"train_loss": -27.7391414642334, "global_step": 532512, "epoch": 6415} {"train_loss": -27.574934005737305, "global_step": 532513, "epoch": 6415} {"train_loss": -27.5810489654541, "global_step": 532514, "epoch": 6415} {"train_loss": -27.79901695251465, "global_step": 532515, "epoch": 6415} {"train_loss": -28.113325119018555, "global_step": 532516, "epoch": 6415} {"train_loss": -28.01739501953125, "global_step": 532517, "epoch": 6415} {"train_loss": -27.68671226501465, "global_step": 532518, "epoch": 6415} {"train_loss": -27.781579971313477, "global_step": 532519, "epoch": 6415} {"train_loss": -27.838220596313477, "global_step": 532520, "epoch": 6415} {"train_loss": -27.7276611328125, "global_step": 532521, "epoch": 6415} {"train_loss": -27.630094528198242, "global_step": 532522, "epoch": 6415} {"train_loss": -27.987354278564453, "global_step": 532523, "epoch": 6415} {"train_loss": -28.06085777282715, "global_step": 532524, "epoch": 6415} {"train_loss": -27.690927505493164, "global_step": 532525, "epoch": 6415} {"train_loss": -28.04578971862793, "global_step": 532526, "epoch": 6415} {"train_loss": -27.414052963256836, "global_step": 532527, "epoch": 6415, "val_loss": 6631462.0} {"train_loss": -27.139860153198242, "global_step": 532528, "epoch": 6416} {"train_loss": -27.690073013305664, "global_step": 532529, "epoch": 6416} {"train_loss": -27.410114288330078, "global_step": 532530, "epoch": 6416} {"train_loss": -27.451141357421875, "global_step": 532531, "epoch": 6416} {"train_loss": -27.19166374206543, "global_step": 532532, "epoch": 6416} {"train_loss": -27.208484649658203, "global_step": 532533, "epoch": 6416} {"train_loss": -26.994001388549805, "global_step": 532534, "epoch": 6416} {"train_loss": -26.626745223999023, "global_step": 532535, "epoch": 6416} {"train_loss": -24.518325805664062, "global_step": 532536, "epoch": 6416} {"train_loss": -26.21160316467285, "global_step": 532537, "epoch": 6416} {"train_loss": -27.08554458618164, "global_step": 532538, "epoch": 6416} {"train_loss": -26.249780654907227, "global_step": 532539, "epoch": 6416} {"train_loss": -25.058635711669922, "global_step": 532540, "epoch": 6416} {"train_loss": -26.666921615600586, "global_step": 532541, "epoch": 6416} {"train_loss": -26.06538200378418, "global_step": 532542, "epoch": 6416} {"train_loss": -26.220462799072266, "global_step": 532543, "epoch": 6416} {"train_loss": -26.734277725219727, "global_step": 532544, "epoch": 6416} {"train_loss": -26.19254493713379, "global_step": 532545, "epoch": 6416} {"train_loss": -26.60335350036621, "global_step": 532546, "epoch": 6416} {"train_loss": -27.19087028503418, "global_step": 532547, "epoch": 6416} {"train_loss": -26.41694450378418, "global_step": 532548, "epoch": 6416} {"train_loss": -26.933820724487305, "global_step": 532549, "epoch": 6416} {"train_loss": -26.41424560546875, "global_step": 532550, "epoch": 6416} {"train_loss": -26.924331665039062, "global_step": 532551, "epoch": 6416} {"train_loss": -27.007354736328125, "global_step": 532552, "epoch": 6416} {"train_loss": -27.533802032470703, "global_step": 532553, "epoch": 6416} {"train_loss": -26.951736450195312, "global_step": 532554, "epoch": 6416} {"train_loss": -27.201688766479492, "global_step": 532555, "epoch": 6416} {"train_loss": -27.077436447143555, "global_step": 532556, "epoch": 6416} {"train_loss": -26.80606460571289, "global_step": 532557, "epoch": 6416} {"train_loss": -27.396574020385742, "global_step": 532558, "epoch": 6416} {"train_loss": -26.77419090270996, "global_step": 532559, "epoch": 6416} {"train_loss": -26.9422664642334, "global_step": 532560, "epoch": 6416} {"train_loss": -27.109603881835938, "global_step": 532561, "epoch": 6416} {"train_loss": -27.317975997924805, "global_step": 532562, "epoch": 6416} {"train_loss": -27.4482364654541, "global_step": 532563, "epoch": 6416} {"train_loss": -26.9144229888916, "global_step": 532564, "epoch": 6416} {"train_loss": -27.64349365234375, "global_step": 532565, "epoch": 6416} {"train_loss": -27.0227108001709, "global_step": 532566, "epoch": 6416} {"train_loss": -27.141809463500977, "global_step": 532567, "epoch": 6416} {"train_loss": -27.33180046081543, "global_step": 532568, "epoch": 6416} {"train_loss": -27.234827041625977, "global_step": 532569, "epoch": 6416} {"train_loss": -27.59321403503418, "global_step": 532570, "epoch": 6416} {"train_loss": -27.513568878173828, "global_step": 532571, "epoch": 6416} {"train_loss": -27.287250518798828, "global_step": 532572, "epoch": 6416} {"train_loss": -27.773548126220703, "global_step": 532573, "epoch": 6416} {"train_loss": -27.60536003112793, "global_step": 532574, "epoch": 6416} {"train_loss": -27.598724365234375, "global_step": 532575, "epoch": 6416} {"train_loss": -27.50199317932129, "global_step": 532576, "epoch": 6416} {"train_loss": -27.712726593017578, "global_step": 532577, "epoch": 6416} {"train_loss": -27.89011573791504, "global_step": 532578, "epoch": 6416} {"train_loss": -27.53468132019043, "global_step": 532579, "epoch": 6416} {"train_loss": -28.112960815429688, "global_step": 532580, "epoch": 6416} {"train_loss": -27.852432250976562, "global_step": 532581, "epoch": 6416} {"train_loss": -27.990787506103516, "global_step": 532582, "epoch": 6416} {"train_loss": -27.81561279296875, "global_step": 532583, "epoch": 6416} {"train_loss": -27.782012939453125, "global_step": 532584, "epoch": 6416} {"train_loss": -27.555683135986328, "global_step": 532585, "epoch": 6416} {"train_loss": -27.56743812561035, "global_step": 532586, "epoch": 6416} {"train_loss": -27.82893943786621, "global_step": 532587, "epoch": 6416} {"train_loss": -27.900623321533203, "global_step": 532588, "epoch": 6416} {"train_loss": -28.159460067749023, "global_step": 532589, "epoch": 6416} {"train_loss": -28.028955459594727, "global_step": 532590, "epoch": 6416} {"train_loss": -28.227802276611328, "global_step": 532591, "epoch": 6416} {"train_loss": -27.899463653564453, "global_step": 532592, "epoch": 6416} {"train_loss": -27.673797607421875, "global_step": 532593, "epoch": 6416} {"train_loss": -27.797510147094727, "global_step": 532594, "epoch": 6416} {"train_loss": -27.886768341064453, "global_step": 532595, "epoch": 6416} {"train_loss": -27.515649795532227, "global_step": 532596, "epoch": 6416} {"train_loss": -27.84171485900879, "global_step": 532597, "epoch": 6416} {"train_loss": -27.945270538330078, "global_step": 532598, "epoch": 6416} {"train_loss": -27.75934410095215, "global_step": 532599, "epoch": 6416} {"train_loss": -27.705373764038086, "global_step": 532600, "epoch": 6416} {"train_loss": -27.740589141845703, "global_step": 532601, "epoch": 6416} {"train_loss": -28.056854248046875, "global_step": 532602, "epoch": 6416} {"train_loss": -28.22039222717285, "global_step": 532603, "epoch": 6416} {"train_loss": -27.834278106689453, "global_step": 532604, "epoch": 6416} {"train_loss": -27.637739181518555, "global_step": 532605, "epoch": 6416} {"train_loss": -27.429981231689453, "global_step": 532606, "epoch": 6416} {"train_loss": -27.67268943786621, "global_step": 532607, "epoch": 6416} {"train_loss": -27.813739776611328, "global_step": 532608, "epoch": 6416} {"train_loss": -27.757965087890625, "global_step": 532609, "epoch": 6416} {"train_loss": -27.30583301222468, "global_step": 532610, "epoch": 6416, "val_loss": 6545247.0} {"train_loss": -26.03559684753418, "global_step": 532611, "epoch": 6417} {"train_loss": -25.210798263549805, "global_step": 532612, "epoch": 6417} {"train_loss": -23.61115837097168, "global_step": 532613, "epoch": 6417} {"train_loss": -26.091140747070312, "global_step": 532614, "epoch": 6417} {"train_loss": -26.5212345123291, "global_step": 532615, "epoch": 6417} {"train_loss": -26.26007652282715, "global_step": 532616, "epoch": 6417} {"train_loss": -26.850000381469727, "global_step": 532617, "epoch": 6417} {"train_loss": -26.509870529174805, "global_step": 532618, "epoch": 6417} {"train_loss": -26.71820640563965, "global_step": 532619, "epoch": 6417} {"train_loss": -27.056753158569336, "global_step": 532620, "epoch": 6417} {"train_loss": -26.855859756469727, "global_step": 532621, "epoch": 6417} {"train_loss": -26.730009078979492, "global_step": 532622, "epoch": 6417} {"train_loss": -26.8436336517334, "global_step": 532623, "epoch": 6417} {"train_loss": -26.595062255859375, "global_step": 532624, "epoch": 6417} {"train_loss": -27.272390365600586, "global_step": 532625, "epoch": 6417} {"train_loss": -26.892868041992188, "global_step": 532626, "epoch": 6417} {"train_loss": -27.253314971923828, "global_step": 532627, "epoch": 6417} {"train_loss": -27.02199363708496, "global_step": 532628, "epoch": 6417} {"train_loss": -26.45478630065918, "global_step": 532629, "epoch": 6417} {"train_loss": -27.001296997070312, "global_step": 532630, "epoch": 6417} {"train_loss": -27.094701766967773, "global_step": 532631, "epoch": 6417} {"train_loss": -26.969099044799805, "global_step": 532632, "epoch": 6417} {"train_loss": -27.279855728149414, "global_step": 532633, "epoch": 6417} {"train_loss": -27.37689781188965, "global_step": 532634, "epoch": 6417} {"train_loss": -27.14959144592285, "global_step": 532635, "epoch": 6417} {"train_loss": -27.072586059570312, "global_step": 532636, "epoch": 6417} {"train_loss": -27.443958282470703, "global_step": 532637, "epoch": 6417} {"train_loss": -26.9521484375, "global_step": 532638, "epoch": 6417} {"train_loss": -27.28192138671875, "global_step": 532639, "epoch": 6417} {"train_loss": -27.213459014892578, "global_step": 532640, "epoch": 6417} {"train_loss": -27.478961944580078, "global_step": 532641, "epoch": 6417} {"train_loss": -27.4427490234375, "global_step": 532642, "epoch": 6417} {"train_loss": -26.822439193725586, "global_step": 532643, "epoch": 6417} {"train_loss": -27.783939361572266, "global_step": 532644, "epoch": 6417} {"train_loss": -27.21856117248535, "global_step": 532645, "epoch": 6417} {"train_loss": -27.486129760742188, "global_step": 532646, "epoch": 6417} {"train_loss": -26.759443283081055, "global_step": 532647, "epoch": 6417} {"train_loss": -27.53456687927246, "global_step": 532648, "epoch": 6417} {"train_loss": -27.200408935546875, "global_step": 532649, "epoch": 6417} {"train_loss": -27.45172691345215, "global_step": 532650, "epoch": 6417} {"train_loss": -27.431808471679688, "global_step": 532651, "epoch": 6417} {"train_loss": -27.410831451416016, "global_step": 532652, "epoch": 6417} {"train_loss": -27.447412490844727, "global_step": 532653, "epoch": 6417} {"train_loss": -27.85581398010254, "global_step": 532654, "epoch": 6417} {"train_loss": -27.4945125579834, "global_step": 532655, "epoch": 6417} {"train_loss": -27.403234481811523, "global_step": 532656, "epoch": 6417} {"train_loss": -27.866546630859375, "global_step": 532657, "epoch": 6417} {"train_loss": -27.444931030273438, "global_step": 532658, "epoch": 6417} {"train_loss": -27.797765731811523, "global_step": 532659, "epoch": 6417} {"train_loss": -27.68629264831543, "global_step": 532660, "epoch": 6417} {"train_loss": -27.32607078552246, "global_step": 532661, "epoch": 6417} {"train_loss": -27.603225708007812, "global_step": 532662, "epoch": 6417} {"train_loss": -27.668350219726562, "global_step": 532663, "epoch": 6417} {"train_loss": -27.57339859008789, "global_step": 532664, "epoch": 6417} {"train_loss": -27.596948623657227, "global_step": 532665, "epoch": 6417} {"train_loss": -27.63006019592285, "global_step": 532666, "epoch": 6417} {"train_loss": -27.915069580078125, "global_step": 532667, "epoch": 6417} {"train_loss": -27.64788818359375, "global_step": 532668, "epoch": 6417} {"train_loss": -26.988554000854492, "global_step": 532669, "epoch": 6417} {"train_loss": -27.780658721923828, "global_step": 532670, "epoch": 6417} {"train_loss": -27.75360679626465, "global_step": 532671, "epoch": 6417} {"train_loss": -27.628034591674805, "global_step": 532672, "epoch": 6417} {"train_loss": -27.44045066833496, "global_step": 532673, "epoch": 6417} {"train_loss": -27.59562110900879, "global_step": 532674, "epoch": 6417} {"train_loss": -27.3281192779541, "global_step": 532675, "epoch": 6417} {"train_loss": -27.156143188476562, "global_step": 532676, "epoch": 6417} {"train_loss": -26.992298126220703, "global_step": 532677, "epoch": 6417} {"train_loss": -26.632211685180664, "global_step": 532678, "epoch": 6417} {"train_loss": -27.975717544555664, "global_step": 532679, "epoch": 6417} {"train_loss": -27.75111198425293, "global_step": 532680, "epoch": 6417} {"train_loss": -27.81367301940918, "global_step": 532681, "epoch": 6417} {"train_loss": -27.70111656188965, "global_step": 532682, "epoch": 6417} {"train_loss": -27.5339298248291, "global_step": 532683, "epoch": 6417} {"train_loss": -27.861799240112305, "global_step": 532684, "epoch": 6417} {"train_loss": -27.466894149780273, "global_step": 532685, "epoch": 6417} {"train_loss": -27.651046752929688, "global_step": 532686, "epoch": 6417} {"train_loss": -27.442541122436523, "global_step": 532687, "epoch": 6417} {"train_loss": -27.347761154174805, "global_step": 532688, "epoch": 6417} {"train_loss": -27.853010177612305, "global_step": 532689, "epoch": 6417} {"train_loss": -27.92242431640625, "global_step": 532690, "epoch": 6417} {"train_loss": -27.396442413330078, "global_step": 532691, "epoch": 6417} {"train_loss": -27.47931480407715, "global_step": 532692, "epoch": 6417} {"train_loss": -27.234779357910156, "global_step": 532693, "epoch": 6417, "val_loss": 6565096.5} {"train_loss": -27.216623306274414, "global_step": 532694, "epoch": 6418} {"train_loss": -26.281064987182617, "global_step": 532695, "epoch": 6418} {"train_loss": -26.680532455444336, "global_step": 532696, "epoch": 6418} {"train_loss": -27.22150230407715, "global_step": 532697, "epoch": 6418} {"train_loss": -26.44329261779785, "global_step": 532698, "epoch": 6418} {"train_loss": -26.912353515625, "global_step": 532699, "epoch": 6418} {"train_loss": -27.283124923706055, "global_step": 532700, "epoch": 6418} {"train_loss": -26.98752212524414, "global_step": 532701, "epoch": 6418} {"train_loss": -27.288654327392578, "global_step": 532702, "epoch": 6418} {"train_loss": -27.068252563476562, "global_step": 532703, "epoch": 6418} {"train_loss": -26.857070922851562, "global_step": 532704, "epoch": 6418} {"train_loss": -27.408966064453125, "global_step": 532705, "epoch": 6418} {"train_loss": -26.8980712890625, "global_step": 532706, "epoch": 6418} {"train_loss": -27.279165267944336, "global_step": 532707, "epoch": 6418} {"train_loss": -27.291330337524414, "global_step": 532708, "epoch": 6418} {"train_loss": -27.257230758666992, "global_step": 532709, "epoch": 6418} {"train_loss": -27.227130889892578, "global_step": 532710, "epoch": 6418} {"train_loss": -27.134008407592773, "global_step": 532711, "epoch": 6418} {"train_loss": -27.149560928344727, "global_step": 532712, "epoch": 6418} {"train_loss": -27.402118682861328, "global_step": 532713, "epoch": 6418} {"train_loss": -27.345813751220703, "global_step": 532714, "epoch": 6418} {"train_loss": -26.988391876220703, "global_step": 532715, "epoch": 6418} {"train_loss": -27.70233726501465, "global_step": 532716, "epoch": 6418} {"train_loss": -27.20355224609375, "global_step": 532717, "epoch": 6418} {"train_loss": -27.528335571289062, "global_step": 532718, "epoch": 6418} {"train_loss": -27.43413734436035, "global_step": 532719, "epoch": 6418} {"train_loss": -27.082422256469727, "global_step": 532720, "epoch": 6418} {"train_loss": -27.44744873046875, "global_step": 532721, "epoch": 6418} {"train_loss": -27.579374313354492, "global_step": 532722, "epoch": 6418} {"train_loss": -27.487585067749023, "global_step": 532723, "epoch": 6418} {"train_loss": -27.049762725830078, "global_step": 532724, "epoch": 6418} {"train_loss": -27.5064640045166, "global_step": 532725, "epoch": 6418} {"train_loss": -27.567724227905273, "global_step": 532726, "epoch": 6418} {"train_loss": -27.850088119506836, "global_step": 532727, "epoch": 6418} {"train_loss": -27.4609317779541, "global_step": 532728, "epoch": 6418} {"train_loss": -27.5903263092041, "global_step": 532729, "epoch": 6418} {"train_loss": -27.553882598876953, "global_step": 532730, "epoch": 6418} {"train_loss": -27.664459228515625, "global_step": 532731, "epoch": 6418} {"train_loss": -27.364521026611328, "global_step": 532732, "epoch": 6418} {"train_loss": -27.328903198242188, "global_step": 532733, "epoch": 6418} {"train_loss": -27.543405532836914, "global_step": 532734, "epoch": 6418} {"train_loss": -27.43043327331543, "global_step": 532735, "epoch": 6418} {"train_loss": -27.4094295501709, "global_step": 532736, "epoch": 6418} {"train_loss": -27.85525894165039, "global_step": 532737, "epoch": 6418} {"train_loss": -27.88471031188965, "global_step": 532738, "epoch": 6418} {"train_loss": -27.682287216186523, "global_step": 532739, "epoch": 6418} {"train_loss": -27.91309928894043, "global_step": 532740, "epoch": 6418} {"train_loss": -27.77705192565918, "global_step": 532741, "epoch": 6418} {"train_loss": -27.55837059020996, "global_step": 532742, "epoch": 6418} {"train_loss": -27.73784828186035, "global_step": 532743, "epoch": 6418} {"train_loss": -27.40046501159668, "global_step": 532744, "epoch": 6418} {"train_loss": -28.058557510375977, "global_step": 532745, "epoch": 6418} {"train_loss": -27.556116104125977, "global_step": 532746, "epoch": 6418} {"train_loss": -27.95045280456543, "global_step": 532747, "epoch": 6418} {"train_loss": -27.725299835205078, "global_step": 532748, "epoch": 6418} {"train_loss": -27.853839874267578, "global_step": 532749, "epoch": 6418} {"train_loss": -27.679508209228516, "global_step": 532750, "epoch": 6418} {"train_loss": -27.439619064331055, "global_step": 532751, "epoch": 6418} {"train_loss": -27.636823654174805, "global_step": 532752, "epoch": 6418} {"train_loss": -27.580785751342773, "global_step": 532753, "epoch": 6418} {"train_loss": -27.436859130859375, "global_step": 532754, "epoch": 6418} {"train_loss": -27.151248931884766, "global_step": 532755, "epoch": 6418} {"train_loss": -27.413776397705078, "global_step": 532756, "epoch": 6418} {"train_loss": -27.855016708374023, "global_step": 532757, "epoch": 6418} {"train_loss": -27.43462562561035, "global_step": 532758, "epoch": 6418} {"train_loss": -26.987213134765625, "global_step": 532759, "epoch": 6418} {"train_loss": -26.895038604736328, "global_step": 532760, "epoch": 6418} {"train_loss": -26.985687255859375, "global_step": 532761, "epoch": 6418} {"train_loss": -27.38775634765625, "global_step": 532762, "epoch": 6418} {"train_loss": -27.449329376220703, "global_step": 532763, "epoch": 6418} {"train_loss": -27.330429077148438, "global_step": 532764, "epoch": 6418} {"train_loss": -26.948490142822266, "global_step": 532765, "epoch": 6418} {"train_loss": -27.904996871948242, "global_step": 532766, "epoch": 6418} {"train_loss": -27.590301513671875, "global_step": 532767, "epoch": 6418} {"train_loss": -27.246301651000977, "global_step": 532768, "epoch": 6418} {"train_loss": -27.52918815612793, "global_step": 532769, "epoch": 6418} {"train_loss": -27.637739181518555, "global_step": 532770, "epoch": 6418} {"train_loss": -27.579212188720703, "global_step": 532771, "epoch": 6418} {"train_loss": -27.78797721862793, "global_step": 532772, "epoch": 6418} {"train_loss": -27.5721492767334, "global_step": 532773, "epoch": 6418} {"train_loss": -27.791763305664062, "global_step": 532774, "epoch": 6418} {"train_loss": -27.60223960876465, "global_step": 532775, "epoch": 6418} {"train_loss": -27.40070090236434, "global_step": 532776, "epoch": 6418, "val_loss": 6479239.5} {"train_loss": -27.15655517578125, "global_step": 532777, "epoch": 6419} {"train_loss": -27.257843017578125, "global_step": 532778, "epoch": 6419} {"train_loss": -27.07450294494629, "global_step": 532779, "epoch": 6419} {"train_loss": -27.15045738220215, "global_step": 532780, "epoch": 6419} {"train_loss": -27.346662521362305, "global_step": 532781, "epoch": 6419} {"train_loss": -27.053335189819336, "global_step": 532782, "epoch": 6419} {"train_loss": -27.3255558013916, "global_step": 532783, "epoch": 6419} {"train_loss": -27.562488555908203, "global_step": 532784, "epoch": 6419} {"train_loss": -27.6472110748291, "global_step": 532785, "epoch": 6419} {"train_loss": -27.646453857421875, "global_step": 532786, "epoch": 6419} {"train_loss": -27.48917579650879, "global_step": 532787, "epoch": 6419} {"train_loss": -27.454776763916016, "global_step": 532788, "epoch": 6419} {"train_loss": -27.016708374023438, "global_step": 532789, "epoch": 6419} {"train_loss": -27.630056381225586, "global_step": 532790, "epoch": 6419} {"train_loss": -27.229766845703125, "global_step": 532791, "epoch": 6419} {"train_loss": -27.363508224487305, "global_step": 532792, "epoch": 6419} {"train_loss": -27.733295440673828, "global_step": 532793, "epoch": 6419} {"train_loss": -27.470081329345703, "global_step": 532794, "epoch": 6419} {"train_loss": -27.678857803344727, "global_step": 532795, "epoch": 6419} {"train_loss": -27.6922664642334, "global_step": 532796, "epoch": 6419} {"train_loss": -27.9362735748291, "global_step": 532797, "epoch": 6419} {"train_loss": -27.991724014282227, "global_step": 532798, "epoch": 6419} {"train_loss": -27.331439971923828, "global_step": 532799, "epoch": 6419} {"train_loss": -27.336868286132812, "global_step": 532800, "epoch": 6419} {"train_loss": -27.905736923217773, "global_step": 532801, "epoch": 6419} {"train_loss": -27.738691329956055, "global_step": 532802, "epoch": 6419} {"train_loss": -27.964527130126953, "global_step": 532803, "epoch": 6419} {"train_loss": -27.530364990234375, "global_step": 532804, "epoch": 6419} {"train_loss": -27.512908935546875, "global_step": 532805, "epoch": 6419} {"train_loss": -27.768850326538086, "global_step": 532806, "epoch": 6419} {"train_loss": -27.4262752532959, "global_step": 532807, "epoch": 6419} {"train_loss": -27.408483505249023, "global_step": 532808, "epoch": 6419} {"train_loss": -27.928770065307617, "global_step": 532809, "epoch": 6419} {"train_loss": -27.34553337097168, "global_step": 532810, "epoch": 6419} {"train_loss": -27.86968421936035, "global_step": 532811, "epoch": 6419} {"train_loss": -27.60284423828125, "global_step": 532812, "epoch": 6419} {"train_loss": -27.256284713745117, "global_step": 532813, "epoch": 6419} {"train_loss": -27.99578285217285, "global_step": 532814, "epoch": 6419} {"train_loss": -27.861835479736328, "global_step": 532815, "epoch": 6419} {"train_loss": -27.3592586517334, "global_step": 532816, "epoch": 6419} {"train_loss": -27.522693634033203, "global_step": 532817, "epoch": 6419} {"train_loss": -28.012313842773438, "global_step": 532818, "epoch": 6419} {"train_loss": -27.469669342041016, "global_step": 532819, "epoch": 6419} {"train_loss": -27.628189086914062, "global_step": 532820, "epoch": 6419} {"train_loss": -27.5860595703125, "global_step": 532821, "epoch": 6419} {"train_loss": -27.815820693969727, "global_step": 532822, "epoch": 6419} {"train_loss": -27.290639877319336, "global_step": 532823, "epoch": 6419} {"train_loss": -27.905858993530273, "global_step": 532824, "epoch": 6419} {"train_loss": -28.067916870117188, "global_step": 532825, "epoch": 6419} {"train_loss": -27.892333984375, "global_step": 532826, "epoch": 6419} {"train_loss": -27.637338638305664, "global_step": 532827, "epoch": 6419} {"train_loss": -27.505712509155273, "global_step": 532828, "epoch": 6419} {"train_loss": -27.463117599487305, "global_step": 532829, "epoch": 6419} {"train_loss": -27.35395622253418, "global_step": 532830, "epoch": 6419} {"train_loss": -27.676929473876953, "global_step": 532831, "epoch": 6419} {"train_loss": -27.508869171142578, "global_step": 532832, "epoch": 6419} {"train_loss": -27.423297882080078, "global_step": 532833, "epoch": 6419} {"train_loss": -27.09734535217285, "global_step": 532834, "epoch": 6419} {"train_loss": -27.357873916625977, "global_step": 532835, "epoch": 6419} {"train_loss": -26.972814559936523, "global_step": 532836, "epoch": 6419} {"train_loss": -27.24603271484375, "global_step": 532837, "epoch": 6419} {"train_loss": -27.11530113220215, "global_step": 532838, "epoch": 6419} {"train_loss": -27.5804500579834, "global_step": 532839, "epoch": 6419} {"train_loss": -27.5738525390625, "global_step": 532840, "epoch": 6419} {"train_loss": -27.66815185546875, "global_step": 532841, "epoch": 6419} {"train_loss": -27.409677505493164, "global_step": 532842, "epoch": 6419} {"train_loss": -27.493371963500977, "global_step": 532843, "epoch": 6419} {"train_loss": -27.71430778503418, "global_step": 532844, "epoch": 6419} {"train_loss": -27.09963035583496, "global_step": 532845, "epoch": 6419} {"train_loss": -27.871686935424805, "global_step": 532846, "epoch": 6419} {"train_loss": -27.771265029907227, "global_step": 532847, "epoch": 6419} {"train_loss": -27.856983184814453, "global_step": 532848, "epoch": 6419} {"train_loss": -27.571216583251953, "global_step": 532849, "epoch": 6419} {"train_loss": -27.30686378479004, "global_step": 532850, "epoch": 6419} {"train_loss": -27.80986976623535, "global_step": 532851, "epoch": 6419} {"train_loss": -27.527257919311523, "global_step": 532852, "epoch": 6419} {"train_loss": -27.575790405273438, "global_step": 532853, "epoch": 6419} {"train_loss": -27.430444717407227, "global_step": 532854, "epoch": 6419} {"train_loss": -27.699493408203125, "global_step": 532855, "epoch": 6419} {"train_loss": -27.53130531311035, "global_step": 532856, "epoch": 6419} {"train_loss": -27.836349487304688, "global_step": 532857, "epoch": 6419} {"train_loss": -28.023488998413086, "global_step": 532858, "epoch": 6419} {"train_loss": -27.545262325240905, "global_step": 532859, "epoch": 6419, "val_loss": 6540783.5} {"train_loss": -26.077972412109375, "global_step": 532860, "epoch": 6420} {"train_loss": -26.348957061767578, "global_step": 532861, "epoch": 6420} {"train_loss": -26.989301681518555, "global_step": 532862, "epoch": 6420} {"train_loss": -27.01972007751465, "global_step": 532863, "epoch": 6420} {"train_loss": -26.529809951782227, "global_step": 532864, "epoch": 6420} {"train_loss": -26.806257247924805, "global_step": 532865, "epoch": 6420} {"train_loss": -26.7511043548584, "global_step": 532866, "epoch": 6420} {"train_loss": -26.778188705444336, "global_step": 532867, "epoch": 6420} {"train_loss": -26.9141845703125, "global_step": 532868, "epoch": 6420} {"train_loss": -27.132070541381836, "global_step": 532869, "epoch": 6420} {"train_loss": -27.27825355529785, "global_step": 532870, "epoch": 6420} {"train_loss": -27.543981552124023, "global_step": 532871, "epoch": 6420} {"train_loss": -26.847370147705078, "global_step": 532872, "epoch": 6420} {"train_loss": -27.381961822509766, "global_step": 532873, "epoch": 6420} {"train_loss": -27.228565216064453, "global_step": 532874, "epoch": 6420} {"train_loss": -27.16179847717285, "global_step": 532875, "epoch": 6420} {"train_loss": -27.484907150268555, "global_step": 532876, "epoch": 6420} {"train_loss": -27.3559627532959, "global_step": 532877, "epoch": 6420} {"train_loss": -27.849334716796875, "global_step": 532878, "epoch": 6420} {"train_loss": -27.3155460357666, "global_step": 532879, "epoch": 6420} {"train_loss": -27.336933135986328, "global_step": 532880, "epoch": 6420} {"train_loss": -27.421598434448242, "global_step": 532881, "epoch": 6420} {"train_loss": -27.108585357666016, "global_step": 532882, "epoch": 6420} {"train_loss": -27.560901641845703, "global_step": 532883, "epoch": 6420} {"train_loss": -27.892730712890625, "global_step": 532884, "epoch": 6420} {"train_loss": -27.300262451171875, "global_step": 532885, "epoch": 6420} {"train_loss": -27.90264892578125, "global_step": 532886, "epoch": 6420} {"train_loss": -27.480224609375, "global_step": 532887, "epoch": 6420} {"train_loss": -27.542455673217773, "global_step": 532888, "epoch": 6420} {"train_loss": -27.76755714416504, "global_step": 532889, "epoch": 6420} {"train_loss": -27.520496368408203, "global_step": 532890, "epoch": 6420} {"train_loss": -27.61610221862793, "global_step": 532891, "epoch": 6420} {"train_loss": -27.287982940673828, "global_step": 532892, "epoch": 6420} {"train_loss": -28.00799560546875, "global_step": 532893, "epoch": 6420} {"train_loss": -27.41596031188965, "global_step": 532894, "epoch": 6420} {"train_loss": -27.634815216064453, "global_step": 532895, "epoch": 6420} {"train_loss": -27.713972091674805, "global_step": 532896, "epoch": 6420} {"train_loss": -27.3825740814209, "global_step": 532897, "epoch": 6420} {"train_loss": -27.6291446685791, "global_step": 532898, "epoch": 6420} {"train_loss": -27.861862182617188, "global_step": 532899, "epoch": 6420} {"train_loss": -27.654281616210938, "global_step": 532900, "epoch": 6420} {"train_loss": -27.892822265625, "global_step": 532901, "epoch": 6420} {"train_loss": -27.757038116455078, "global_step": 532902, "epoch": 6420} {"train_loss": -27.989612579345703, "global_step": 532903, "epoch": 6420} {"train_loss": -27.988630294799805, "global_step": 532904, "epoch": 6420} {"train_loss": -27.744298934936523, "global_step": 532905, "epoch": 6420} {"train_loss": -27.451435089111328, "global_step": 532906, "epoch": 6420} {"train_loss": -27.605762481689453, "global_step": 532907, "epoch": 6420} {"train_loss": -27.63495445251465, "global_step": 532908, "epoch": 6420} {"train_loss": -27.35590934753418, "global_step": 532909, "epoch": 6420} {"train_loss": -27.658288955688477, "global_step": 532910, "epoch": 6420} {"train_loss": -27.899099349975586, "global_step": 532911, "epoch": 6420} {"train_loss": -27.667316436767578, "global_step": 532912, "epoch": 6420} {"train_loss": -27.546772003173828, "global_step": 532913, "epoch": 6420} {"train_loss": -27.863927841186523, "global_step": 532914, "epoch": 6420} {"train_loss": -27.699813842773438, "global_step": 532915, "epoch": 6420} {"train_loss": -27.81982421875, "global_step": 532916, "epoch": 6420} {"train_loss": -27.620351791381836, "global_step": 532917, "epoch": 6420} {"train_loss": -27.08601951599121, "global_step": 532918, "epoch": 6420} {"train_loss": -26.931604385375977, "global_step": 532919, "epoch": 6420} {"train_loss": -26.751419067382812, "global_step": 532920, "epoch": 6420} {"train_loss": -27.692935943603516, "global_step": 532921, "epoch": 6420} {"train_loss": -27.599035263061523, "global_step": 532922, "epoch": 6420} {"train_loss": -27.518268585205078, "global_step": 532923, "epoch": 6420} {"train_loss": -27.805150985717773, "global_step": 532924, "epoch": 6420} {"train_loss": -27.714269638061523, "global_step": 532925, "epoch": 6420} {"train_loss": -27.469120025634766, "global_step": 532926, "epoch": 6420} {"train_loss": -27.529285430908203, "global_step": 532927, "epoch": 6420} {"train_loss": -27.624433517456055, "global_step": 532928, "epoch": 6420} {"train_loss": -27.734394073486328, "global_step": 532929, "epoch": 6420} {"train_loss": -27.4443302154541, "global_step": 532930, "epoch": 6420} {"train_loss": -27.759016036987305, "global_step": 532931, "epoch": 6420} {"train_loss": -27.882568359375, "global_step": 532932, "epoch": 6420} {"train_loss": -27.71748161315918, "global_step": 532933, "epoch": 6420} {"train_loss": -28.000507354736328, "global_step": 532934, "epoch": 6420} {"train_loss": -27.7957820892334, "global_step": 532935, "epoch": 6420} {"train_loss": -27.58575439453125, "global_step": 532936, "epoch": 6420} {"train_loss": -27.832717895507812, "global_step": 532937, "epoch": 6420} {"train_loss": -27.586408615112305, "global_step": 532938, "epoch": 6420} {"train_loss": -27.220050811767578, "global_step": 532939, "epoch": 6420} {"train_loss": -27.822559356689453, "global_step": 532940, "epoch": 6420} {"train_loss": -27.6591796875, "global_step": 532941, "epoch": 6420} {"train_loss": -27.480322918259954, "global_step": 532942, "epoch": 6420, "val_loss": 6525369.0} {"train_loss": -27.41678810119629, "global_step": 532943, "epoch": 6421} {"train_loss": -27.089279174804688, "global_step": 532944, "epoch": 6421} {"train_loss": -27.48880386352539, "global_step": 532945, "epoch": 6421} {"train_loss": -27.19611930847168, "global_step": 532946, "epoch": 6421} {"train_loss": -27.021146774291992, "global_step": 532947, "epoch": 6421} {"train_loss": -27.0115966796875, "global_step": 532948, "epoch": 6421} {"train_loss": -27.273893356323242, "global_step": 532949, "epoch": 6421} {"train_loss": -27.3737850189209, "global_step": 532950, "epoch": 6421} {"train_loss": -27.76363182067871, "global_step": 532951, "epoch": 6421} {"train_loss": -26.94875144958496, "global_step": 532952, "epoch": 6421} {"train_loss": -27.461755752563477, "global_step": 532953, "epoch": 6421} {"train_loss": -27.430496215820312, "global_step": 532954, "epoch": 6421} {"train_loss": -27.35999870300293, "global_step": 532955, "epoch": 6421} {"train_loss": -27.64954948425293, "global_step": 532956, "epoch": 6421} {"train_loss": -27.36635398864746, "global_step": 532957, "epoch": 6421} {"train_loss": -27.580636978149414, "global_step": 532958, "epoch": 6421} {"train_loss": -27.55205726623535, "global_step": 532959, "epoch": 6421} {"train_loss": -27.116973876953125, "global_step": 532960, "epoch": 6421} {"train_loss": -28.085901260375977, "global_step": 532961, "epoch": 6421} {"train_loss": -27.263513565063477, "global_step": 532962, "epoch": 6421} {"train_loss": -27.392988204956055, "global_step": 532963, "epoch": 6421} {"train_loss": -27.202362060546875, "global_step": 532964, "epoch": 6421} {"train_loss": -27.6484317779541, "global_step": 532965, "epoch": 6421} {"train_loss": -27.2698917388916, "global_step": 532966, "epoch": 6421} {"train_loss": -27.383398056030273, "global_step": 532967, "epoch": 6421} {"train_loss": -27.62837028503418, "global_step": 532968, "epoch": 6421} {"train_loss": -27.455463409423828, "global_step": 532969, "epoch": 6421} {"train_loss": -27.255823135375977, "global_step": 532970, "epoch": 6421} {"train_loss": -27.91998863220215, "global_step": 532971, "epoch": 6421} {"train_loss": -27.361188888549805, "global_step": 532972, "epoch": 6421} {"train_loss": -27.78313636779785, "global_step": 532973, "epoch": 6421} {"train_loss": -27.614566802978516, "global_step": 532974, "epoch": 6421} {"train_loss": -27.55670738220215, "global_step": 532975, "epoch": 6421} {"train_loss": -27.9776611328125, "global_step": 532976, "epoch": 6421} {"train_loss": -27.8793888092041, "global_step": 532977, "epoch": 6421} {"train_loss": -27.52109718322754, "global_step": 532978, "epoch": 6421} {"train_loss": -27.724639892578125, "global_step": 532979, "epoch": 6421} {"train_loss": -27.788619995117188, "global_step": 532980, "epoch": 6421} {"train_loss": -27.87566566467285, "global_step": 532981, "epoch": 6421} {"train_loss": -27.279773712158203, "global_step": 532982, "epoch": 6421} {"train_loss": -27.620405197143555, "global_step": 532983, "epoch": 6421} {"train_loss": -27.78167724609375, "global_step": 532984, "epoch": 6421} {"train_loss": -27.427310943603516, "global_step": 532985, "epoch": 6421} {"train_loss": -27.653059005737305, "global_step": 532986, "epoch": 6421} {"train_loss": -27.569904327392578, "global_step": 532987, "epoch": 6421} {"train_loss": -28.05108642578125, "global_step": 532988, "epoch": 6421} {"train_loss": -27.97210693359375, "global_step": 532989, "epoch": 6421} {"train_loss": -27.508329391479492, "global_step": 532990, "epoch": 6421} {"train_loss": -27.336393356323242, "global_step": 532991, "epoch": 6421} {"train_loss": -27.49416160583496, "global_step": 532992, "epoch": 6421} {"train_loss": -27.796493530273438, "global_step": 532993, "epoch": 6421} {"train_loss": -27.37739372253418, "global_step": 532994, "epoch": 6421} {"train_loss": -27.669797897338867, "global_step": 532995, "epoch": 6421} {"train_loss": -27.540441513061523, "global_step": 532996, "epoch": 6421} {"train_loss": -27.379383087158203, "global_step": 532997, "epoch": 6421} {"train_loss": -27.717023849487305, "global_step": 532998, "epoch": 6421} {"train_loss": -27.474210739135742, "global_step": 532999, "epoch": 6421} {"train_loss": -27.157001495361328, "global_step": 533000, "epoch": 6421} {"train_loss": -27.028396606445312, "global_step": 533001, "epoch": 6421} {"train_loss": -26.891632080078125, "global_step": 533002, "epoch": 6421} {"train_loss": -27.248645782470703, "global_step": 533003, "epoch": 6421} {"train_loss": -27.758703231811523, "global_step": 533004, "epoch": 6421} {"train_loss": -27.41943359375, "global_step": 533005, "epoch": 6421} {"train_loss": -27.189685821533203, "global_step": 533006, "epoch": 6421} {"train_loss": -27.626367568969727, "global_step": 533007, "epoch": 6421} {"train_loss": -27.8334903717041, "global_step": 533008, "epoch": 6421} {"train_loss": -27.497098922729492, "global_step": 533009, "epoch": 6421} {"train_loss": -27.492956161499023, "global_step": 533010, "epoch": 6421} {"train_loss": -27.311628341674805, "global_step": 533011, "epoch": 6421} {"train_loss": -27.615070343017578, "global_step": 533012, "epoch": 6421} {"train_loss": -27.659475326538086, "global_step": 533013, "epoch": 6421} {"train_loss": -27.660858154296875, "global_step": 533014, "epoch": 6421} {"train_loss": -27.530744552612305, "global_step": 533015, "epoch": 6421} {"train_loss": -27.748144149780273, "global_step": 533016, "epoch": 6421} {"train_loss": -27.733015060424805, "global_step": 533017, "epoch": 6421} {"train_loss": -27.732589721679688, "global_step": 533018, "epoch": 6421} {"train_loss": -27.413434982299805, "global_step": 533019, "epoch": 6421} {"train_loss": -27.52484703063965, "global_step": 533020, "epoch": 6421} {"train_loss": -27.259719848632812, "global_step": 533021, "epoch": 6421} {"train_loss": -27.51336669921875, "global_step": 533022, "epoch": 6421} {"train_loss": -27.208892822265625, "global_step": 533023, "epoch": 6421} {"train_loss": -27.13848876953125, "global_step": 533024, "epoch": 6421} {"train_loss": -27.490117130509343, "global_step": 533025, "epoch": 6421, "val_loss": 6469150.0} {"train_loss": -27.022174835205078, "global_step": 533026, "epoch": 6422} {"train_loss": -26.275598526000977, "global_step": 533027, "epoch": 6422} {"train_loss": -26.62583351135254, "global_step": 533028, "epoch": 6422} {"train_loss": -25.389684677124023, "global_step": 533029, "epoch": 6422} {"train_loss": -25.7200870513916, "global_step": 533030, "epoch": 6422} {"train_loss": -27.1002197265625, "global_step": 533031, "epoch": 6422} {"train_loss": -25.881973266601562, "global_step": 533032, "epoch": 6422} {"train_loss": -26.3284912109375, "global_step": 533033, "epoch": 6422} {"train_loss": -26.778345108032227, "global_step": 533034, "epoch": 6422} {"train_loss": -26.236669540405273, "global_step": 533035, "epoch": 6422} {"train_loss": -26.820600509643555, "global_step": 533036, "epoch": 6422} {"train_loss": -26.679914474487305, "global_step": 533037, "epoch": 6422} {"train_loss": -26.654138565063477, "global_step": 533038, "epoch": 6422} {"train_loss": -27.00765037536621, "global_step": 533039, "epoch": 6422} {"train_loss": -27.05877685546875, "global_step": 533040, "epoch": 6422} {"train_loss": -26.564727783203125, "global_step": 533041, "epoch": 6422} {"train_loss": -27.055194854736328, "global_step": 533042, "epoch": 6422} {"train_loss": -27.16071891784668, "global_step": 533043, "epoch": 6422} {"train_loss": -27.013168334960938, "global_step": 533044, "epoch": 6422} {"train_loss": -26.908544540405273, "global_step": 533045, "epoch": 6422} {"train_loss": -26.80921745300293, "global_step": 533046, "epoch": 6422} {"train_loss": -27.264795303344727, "global_step": 533047, "epoch": 6422} {"train_loss": -27.318038940429688, "global_step": 533048, "epoch": 6422} {"train_loss": -27.03285026550293, "global_step": 533049, "epoch": 6422} {"train_loss": -27.245361328125, "global_step": 533050, "epoch": 6422} {"train_loss": -27.508554458618164, "global_step": 533051, "epoch": 6422} {"train_loss": -27.375741958618164, "global_step": 533052, "epoch": 6422} {"train_loss": -27.50575065612793, "global_step": 533053, "epoch": 6422} {"train_loss": -27.31879997253418, "global_step": 533054, "epoch": 6422} {"train_loss": -27.210729598999023, "global_step": 533055, "epoch": 6422} {"train_loss": -27.27322769165039, "global_step": 533056, "epoch": 6422} {"train_loss": -27.492124557495117, "global_step": 533057, "epoch": 6422} {"train_loss": -27.946685791015625, "global_step": 533058, "epoch": 6422} {"train_loss": -27.367191314697266, "global_step": 533059, "epoch": 6422} {"train_loss": -27.481611251831055, "global_step": 533060, "epoch": 6422} {"train_loss": -27.45261573791504, "global_step": 533061, "epoch": 6422} {"train_loss": -27.579187393188477, "global_step": 533062, "epoch": 6422} {"train_loss": -27.430089950561523, "global_step": 533063, "epoch": 6422} {"train_loss": -27.879404067993164, "global_step": 533064, "epoch": 6422} {"train_loss": -27.570587158203125, "global_step": 533065, "epoch": 6422} {"train_loss": -27.49672508239746, "global_step": 533066, "epoch": 6422} {"train_loss": -27.695154190063477, "global_step": 533067, "epoch": 6422} {"train_loss": -27.76153564453125, "global_step": 533068, "epoch": 6422} {"train_loss": -27.82105827331543, "global_step": 533069, "epoch": 6422} {"train_loss": -27.657093048095703, "global_step": 533070, "epoch": 6422} {"train_loss": -28.20979118347168, "global_step": 533071, "epoch": 6422} {"train_loss": -27.564443588256836, "global_step": 533072, "epoch": 6422} {"train_loss": -27.708698272705078, "global_step": 533073, "epoch": 6422} {"train_loss": -27.469369888305664, "global_step": 533074, "epoch": 6422} {"train_loss": -27.641590118408203, "global_step": 533075, "epoch": 6422} {"train_loss": -27.966903686523438, "global_step": 533076, "epoch": 6422} {"train_loss": -27.532882690429688, "global_step": 533077, "epoch": 6422} {"train_loss": -27.75556755065918, "global_step": 533078, "epoch": 6422} {"train_loss": -28.123212814331055, "global_step": 533079, "epoch": 6422} {"train_loss": -27.576557159423828, "global_step": 533080, "epoch": 6422} {"train_loss": -28.140491485595703, "global_step": 533081, "epoch": 6422} {"train_loss": -27.857044219970703, "global_step": 533082, "epoch": 6422} {"train_loss": -27.865259170532227, "global_step": 533083, "epoch": 6422} {"train_loss": -27.792530059814453, "global_step": 533084, "epoch": 6422} {"train_loss": -27.809803009033203, "global_step": 533085, "epoch": 6422} {"train_loss": -27.8613338470459, "global_step": 533086, "epoch": 6422} {"train_loss": -27.375669479370117, "global_step": 533087, "epoch": 6422} {"train_loss": -27.619403839111328, "global_step": 533088, "epoch": 6422} {"train_loss": -27.6768856048584, "global_step": 533089, "epoch": 6422} {"train_loss": -27.41629409790039, "global_step": 533090, "epoch": 6422} {"train_loss": -27.112485885620117, "global_step": 533091, "epoch": 6422} {"train_loss": -27.443592071533203, "global_step": 533092, "epoch": 6422} {"train_loss": -27.48148536682129, "global_step": 533093, "epoch": 6422} {"train_loss": -27.670551300048828, "global_step": 533094, "epoch": 6422} {"train_loss": -27.8270320892334, "global_step": 533095, "epoch": 6422} {"train_loss": -27.898712158203125, "global_step": 533096, "epoch": 6422} {"train_loss": -27.68691062927246, "global_step": 533097, "epoch": 6422} {"train_loss": -27.744367599487305, "global_step": 533098, "epoch": 6422} {"train_loss": -27.4674015045166, "global_step": 533099, "epoch": 6422} {"train_loss": -27.500532150268555, "global_step": 533100, "epoch": 6422} {"train_loss": -27.716337203979492, "global_step": 533101, "epoch": 6422} {"train_loss": -27.269058227539062, "global_step": 533102, "epoch": 6422} {"train_loss": -27.371509552001953, "global_step": 533103, "epoch": 6422} {"train_loss": -27.567350387573242, "global_step": 533104, "epoch": 6422} {"train_loss": -27.697324752807617, "global_step": 533105, "epoch": 6422} {"train_loss": -27.656909942626953, "global_step": 533106, "epoch": 6422} {"train_loss": -27.57252311706543, "global_step": 533107, "epoch": 6422} {"train_loss": -27.33896432439965, "global_step": 533108, "epoch": 6422, "val_loss": 6519916.0} {"train_loss": -26.38054847717285, "global_step": 533109, "epoch": 6423} {"train_loss": -26.217981338500977, "global_step": 533110, "epoch": 6423} {"train_loss": -26.93018913269043, "global_step": 533111, "epoch": 6423} {"train_loss": -26.210163116455078, "global_step": 533112, "epoch": 6423} {"train_loss": -26.253498077392578, "global_step": 533113, "epoch": 6423} {"train_loss": -26.179920196533203, "global_step": 533114, "epoch": 6423} {"train_loss": -26.055831909179688, "global_step": 533115, "epoch": 6423} {"train_loss": -26.510120391845703, "global_step": 533116, "epoch": 6423} {"train_loss": -26.36036491394043, "global_step": 533117, "epoch": 6423} {"train_loss": -26.848697662353516, "global_step": 533118, "epoch": 6423} {"train_loss": -26.591232299804688, "global_step": 533119, "epoch": 6423} {"train_loss": -27.142658233642578, "global_step": 533120, "epoch": 6423} {"train_loss": -26.89566993713379, "global_step": 533121, "epoch": 6423} {"train_loss": -27.094236373901367, "global_step": 533122, "epoch": 6423} {"train_loss": -26.74529457092285, "global_step": 533123, "epoch": 6423} {"train_loss": -27.223413467407227, "global_step": 533124, "epoch": 6423} {"train_loss": -26.831945419311523, "global_step": 533125, "epoch": 6423} {"train_loss": -27.425134658813477, "global_step": 533126, "epoch": 6423} {"train_loss": -27.12363624572754, "global_step": 533127, "epoch": 6423} {"train_loss": -26.940031051635742, "global_step": 533128, "epoch": 6423} {"train_loss": -27.000904083251953, "global_step": 533129, "epoch": 6423} {"train_loss": -27.322391510009766, "global_step": 533130, "epoch": 6423} {"train_loss": -27.0598201751709, "global_step": 533131, "epoch": 6423} {"train_loss": -27.242267608642578, "global_step": 533132, "epoch": 6423} {"train_loss": -27.0371036529541, "global_step": 533133, "epoch": 6423} {"train_loss": -26.889556884765625, "global_step": 533134, "epoch": 6423} {"train_loss": -27.455556869506836, "global_step": 533135, "epoch": 6423} {"train_loss": -27.26615333557129, "global_step": 533136, "epoch": 6423} {"train_loss": -27.200536727905273, "global_step": 533137, "epoch": 6423} {"train_loss": -27.245655059814453, "global_step": 533138, "epoch": 6423} {"train_loss": -26.81391716003418, "global_step": 533139, "epoch": 6423} {"train_loss": -27.53244972229004, "global_step": 533140, "epoch": 6423} {"train_loss": -27.649707794189453, "global_step": 533141, "epoch": 6423} {"train_loss": -27.44794273376465, "global_step": 533142, "epoch": 6423} {"train_loss": -27.538984298706055, "global_step": 533143, "epoch": 6423} {"train_loss": -27.5460262298584, "global_step": 533144, "epoch": 6423} {"train_loss": -27.4398136138916, "global_step": 533145, "epoch": 6423} {"train_loss": -27.97395133972168, "global_step": 533146, "epoch": 6423} {"train_loss": -27.418073654174805, "global_step": 533147, "epoch": 6423} {"train_loss": -27.496356964111328, "global_step": 533148, "epoch": 6423} {"train_loss": -27.967493057250977, "global_step": 533149, "epoch": 6423} {"train_loss": -27.547571182250977, "global_step": 533150, "epoch": 6423} {"train_loss": -27.28986930847168, "global_step": 533151, "epoch": 6423} {"train_loss": -27.628690719604492, "global_step": 533152, "epoch": 6423} {"train_loss": -27.609975814819336, "global_step": 533153, "epoch": 6423} {"train_loss": -27.697851181030273, "global_step": 533154, "epoch": 6423} {"train_loss": -27.370630264282227, "global_step": 533155, "epoch": 6423} {"train_loss": -27.779315948486328, "global_step": 533156, "epoch": 6423} {"train_loss": -27.65276527404785, "global_step": 533157, "epoch": 6423} {"train_loss": -27.768598556518555, "global_step": 533158, "epoch": 6423} {"train_loss": -27.886322021484375, "global_step": 533159, "epoch": 6423} {"train_loss": -27.506277084350586, "global_step": 533160, "epoch": 6423} {"train_loss": -27.9194278717041, "global_step": 533161, "epoch": 6423} {"train_loss": -27.51398277282715, "global_step": 533162, "epoch": 6423} {"train_loss": -27.8409481048584, "global_step": 533163, "epoch": 6423} {"train_loss": -27.758691787719727, "global_step": 533164, "epoch": 6423} {"train_loss": -28.040119171142578, "global_step": 533165, "epoch": 6423} {"train_loss": -27.960662841796875, "global_step": 533166, "epoch": 6423} {"train_loss": -27.855863571166992, "global_step": 533167, "epoch": 6423} {"train_loss": -28.001184463500977, "global_step": 533168, "epoch": 6423} {"train_loss": -27.796375274658203, "global_step": 533169, "epoch": 6423} {"train_loss": -27.6780948638916, "global_step": 533170, "epoch": 6423} {"train_loss": -28.244384765625, "global_step": 533171, "epoch": 6423} {"train_loss": -27.91285514831543, "global_step": 533172, "epoch": 6423} {"train_loss": -27.9370059967041, "global_step": 533173, "epoch": 6423} {"train_loss": -27.393707275390625, "global_step": 533174, "epoch": 6423} {"train_loss": -27.441816329956055, "global_step": 533175, "epoch": 6423} {"train_loss": -27.91895866394043, "global_step": 533176, "epoch": 6423} {"train_loss": -27.668537139892578, "global_step": 533177, "epoch": 6423} {"train_loss": -27.18815040588379, "global_step": 533178, "epoch": 6423} {"train_loss": -27.68183708190918, "global_step": 533179, "epoch": 6423} {"train_loss": -27.784809112548828, "global_step": 533180, "epoch": 6423} {"train_loss": -27.429000854492188, "global_step": 533181, "epoch": 6423} {"train_loss": -27.760513305664062, "global_step": 533182, "epoch": 6423} {"train_loss": -27.604907989501953, "global_step": 533183, "epoch": 6423} {"train_loss": -27.704193115234375, "global_step": 533184, "epoch": 6423} {"train_loss": -27.79408073425293, "global_step": 533185, "epoch": 6423} {"train_loss": -28.054229736328125, "global_step": 533186, "epoch": 6423} {"train_loss": -27.71904945373535, "global_step": 533187, "epoch": 6423} {"train_loss": -27.903064727783203, "global_step": 533188, "epoch": 6423} {"train_loss": -27.129392623901367, "global_step": 533189, "epoch": 6423} {"train_loss": -27.542871475219727, "global_step": 533190, "epoch": 6423} {"train_loss": -27.375429727944983, "global_step": 533191, "epoch": 6423, "val_loss": 6499391.0} {"train_loss": -27.75953483581543, "global_step": 533192, "epoch": 6424} {"train_loss": -27.417211532592773, "global_step": 533193, "epoch": 6424} {"train_loss": -27.439014434814453, "global_step": 533194, "epoch": 6424} {"train_loss": -27.27386474609375, "global_step": 533195, "epoch": 6424} {"train_loss": -27.461023330688477, "global_step": 533196, "epoch": 6424} {"train_loss": -27.209314346313477, "global_step": 533197, "epoch": 6424} {"train_loss": -27.220111846923828, "global_step": 533198, "epoch": 6424} {"train_loss": -27.323638916015625, "global_step": 533199, "epoch": 6424} {"train_loss": -27.10871696472168, "global_step": 533200, "epoch": 6424} {"train_loss": -27.21478271484375, "global_step": 533201, "epoch": 6424} {"train_loss": -27.413999557495117, "global_step": 533202, "epoch": 6424} {"train_loss": -27.140050888061523, "global_step": 533203, "epoch": 6424} {"train_loss": -27.75518798828125, "global_step": 533204, "epoch": 6424} {"train_loss": -27.130447387695312, "global_step": 533205, "epoch": 6424} {"train_loss": -27.479963302612305, "global_step": 533206, "epoch": 6424} {"train_loss": -27.1180419921875, "global_step": 533207, "epoch": 6424} {"train_loss": -27.286970138549805, "global_step": 533208, "epoch": 6424} {"train_loss": -27.292423248291016, "global_step": 533209, "epoch": 6424} {"train_loss": -27.499011993408203, "global_step": 533210, "epoch": 6424} {"train_loss": -27.65113639831543, "global_step": 533211, "epoch": 6424} {"train_loss": -27.87506103515625, "global_step": 533212, "epoch": 6424} {"train_loss": -27.57472038269043, "global_step": 533213, "epoch": 6424} {"train_loss": -27.57136344909668, "global_step": 533214, "epoch": 6424} {"train_loss": -27.889480590820312, "global_step": 533215, "epoch": 6424} {"train_loss": -27.637479782104492, "global_step": 533216, "epoch": 6424} {"train_loss": -27.499387741088867, "global_step": 533217, "epoch": 6424} {"train_loss": -28.063451766967773, "global_step": 533218, "epoch": 6424} {"train_loss": -27.44761085510254, "global_step": 533219, "epoch": 6424} {"train_loss": -27.556671142578125, "global_step": 533220, "epoch": 6424} {"train_loss": -27.9138126373291, "global_step": 533221, "epoch": 6424} {"train_loss": -27.77142333984375, "global_step": 533222, "epoch": 6424} {"train_loss": -27.42502212524414, "global_step": 533223, "epoch": 6424} {"train_loss": -27.84211540222168, "global_step": 533224, "epoch": 6424} {"train_loss": -27.975513458251953, "global_step": 533225, "epoch": 6424} {"train_loss": -27.355060577392578, "global_step": 533226, "epoch": 6424} {"train_loss": -27.97566032409668, "global_step": 533227, "epoch": 6424} {"train_loss": -27.794540405273438, "global_step": 533228, "epoch": 6424} {"train_loss": -27.602407455444336, "global_step": 533229, "epoch": 6424} {"train_loss": -27.572507858276367, "global_step": 533230, "epoch": 6424} {"train_loss": -27.44715690612793, "global_step": 533231, "epoch": 6424} {"train_loss": -27.65229606628418, "global_step": 533232, "epoch": 6424} {"train_loss": -27.796018600463867, "global_step": 533233, "epoch": 6424} {"train_loss": -27.947839736938477, "global_step": 533234, "epoch": 6424} {"train_loss": -27.487262725830078, "global_step": 533235, "epoch": 6424} {"train_loss": -27.808530807495117, "global_step": 533236, "epoch": 6424} {"train_loss": -27.46906852722168, "global_step": 533237, "epoch": 6424} {"train_loss": -27.661945343017578, "global_step": 533238, "epoch": 6424} {"train_loss": -28.157184600830078, "global_step": 533239, "epoch": 6424} {"train_loss": -27.606016159057617, "global_step": 533240, "epoch": 6424} {"train_loss": -27.65226173400879, "global_step": 533241, "epoch": 6424} {"train_loss": -27.69346046447754, "global_step": 533242, "epoch": 6424} {"train_loss": -27.856189727783203, "global_step": 533243, "epoch": 6424} {"train_loss": -27.95037269592285, "global_step": 533244, "epoch": 6424} {"train_loss": -27.989301681518555, "global_step": 533245, "epoch": 6424} {"train_loss": -27.527374267578125, "global_step": 533246, "epoch": 6424} {"train_loss": -27.776874542236328, "global_step": 533247, "epoch": 6424} {"train_loss": -27.563390731811523, "global_step": 533248, "epoch": 6424} {"train_loss": -27.90472412109375, "global_step": 533249, "epoch": 6424} {"train_loss": -27.668622970581055, "global_step": 533250, "epoch": 6424} {"train_loss": -27.760650634765625, "global_step": 533251, "epoch": 6424} {"train_loss": -27.839292526245117, "global_step": 533252, "epoch": 6424} {"train_loss": -27.891752243041992, "global_step": 533253, "epoch": 6424} {"train_loss": -27.585758209228516, "global_step": 533254, "epoch": 6424} {"train_loss": -27.68596839904785, "global_step": 533255, "epoch": 6424} {"train_loss": -27.56097412109375, "global_step": 533256, "epoch": 6424} {"train_loss": -27.8468074798584, "global_step": 533257, "epoch": 6424} {"train_loss": -27.66839599609375, "global_step": 533258, "epoch": 6424} {"train_loss": -27.740314483642578, "global_step": 533259, "epoch": 6424} {"train_loss": -27.510950088500977, "global_step": 533260, "epoch": 6424} {"train_loss": -28.051191329956055, "global_step": 533261, "epoch": 6424} {"train_loss": -27.720947265625, "global_step": 533262, "epoch": 6424} {"train_loss": -27.976306915283203, "global_step": 533263, "epoch": 6424} {"train_loss": -27.702238082885742, "global_step": 533264, "epoch": 6424} {"train_loss": -27.61916160583496, "global_step": 533265, "epoch": 6424} {"train_loss": -27.584203720092773, "global_step": 533266, "epoch": 6424} {"train_loss": -27.6165714263916, "global_step": 533267, "epoch": 6424} {"train_loss": -27.739118576049805, "global_step": 533268, "epoch": 6424} {"train_loss": -28.057098388671875, "global_step": 533269, "epoch": 6424} {"train_loss": -27.518878936767578, "global_step": 533270, "epoch": 6424} {"train_loss": -27.526229858398438, "global_step": 533271, "epoch": 6424} {"train_loss": -27.25922966003418, "global_step": 533272, "epoch": 6424} {"train_loss": -27.276535034179688, "global_step": 533273, "epoch": 6424} {"train_loss": -27.621083822595068, "global_step": 533274, "epoch": 6424, "val_loss": 6493746.0} {"train_loss": -26.9549617767334, "global_step": 533275, "epoch": 6425} {"train_loss": -24.773773193359375, "global_step": 533276, "epoch": 6425} {"train_loss": -24.407169342041016, "global_step": 533277, "epoch": 6425} {"train_loss": -27.0422420501709, "global_step": 533278, "epoch": 6425} {"train_loss": -26.25996208190918, "global_step": 533279, "epoch": 6425} {"train_loss": -26.460981369018555, "global_step": 533280, "epoch": 6425} {"train_loss": -27.104999542236328, "global_step": 533281, "epoch": 6425} {"train_loss": -27.030420303344727, "global_step": 533282, "epoch": 6425} {"train_loss": -26.8382625579834, "global_step": 533283, "epoch": 6425} {"train_loss": -26.51016616821289, "global_step": 533284, "epoch": 6425} {"train_loss": -27.062000274658203, "global_step": 533285, "epoch": 6425} {"train_loss": -26.798603057861328, "global_step": 533286, "epoch": 6425} {"train_loss": -26.637475967407227, "global_step": 533287, "epoch": 6425} {"train_loss": -26.79545021057129, "global_step": 533288, "epoch": 6425} {"train_loss": -26.86199951171875, "global_step": 533289, "epoch": 6425} {"train_loss": -27.414026260375977, "global_step": 533290, "epoch": 6425} {"train_loss": -27.585718154907227, "global_step": 533291, "epoch": 6425} {"train_loss": -26.9365234375, "global_step": 533292, "epoch": 6425} {"train_loss": -27.288930892944336, "global_step": 533293, "epoch": 6425} {"train_loss": -27.029998779296875, "global_step": 533294, "epoch": 6425} {"train_loss": -27.038267135620117, "global_step": 533295, "epoch": 6425} {"train_loss": -27.424758911132812, "global_step": 533296, "epoch": 6425} {"train_loss": -27.71942138671875, "global_step": 533297, "epoch": 6425} {"train_loss": -27.4116268157959, "global_step": 533298, "epoch": 6425} {"train_loss": -27.653928756713867, "global_step": 533299, "epoch": 6425} {"train_loss": -27.44854164123535, "global_step": 533300, "epoch": 6425} {"train_loss": -27.30960464477539, "global_step": 533301, "epoch": 6425} {"train_loss": -27.31396484375, "global_step": 533302, "epoch": 6425} {"train_loss": -27.512210845947266, "global_step": 533303, "epoch": 6425} {"train_loss": -27.981897354125977, "global_step": 533304, "epoch": 6425} {"train_loss": -27.363849639892578, "global_step": 533305, "epoch": 6425} {"train_loss": -27.283660888671875, "global_step": 533306, "epoch": 6425} {"train_loss": -27.65288734436035, "global_step": 533307, "epoch": 6425} {"train_loss": -27.866626739501953, "global_step": 533308, "epoch": 6425} {"train_loss": -27.634262084960938, "global_step": 533309, "epoch": 6425} {"train_loss": -27.4868106842041, "global_step": 533310, "epoch": 6425} {"train_loss": -27.51873779296875, "global_step": 533311, "epoch": 6425} {"train_loss": -27.43732261657715, "global_step": 533312, "epoch": 6425} {"train_loss": -27.4208927154541, "global_step": 533313, "epoch": 6425} {"train_loss": -27.68302345275879, "global_step": 533314, "epoch": 6425} {"train_loss": -27.574298858642578, "global_step": 533315, "epoch": 6425} {"train_loss": -27.76226234436035, "global_step": 533316, "epoch": 6425} {"train_loss": -27.907989501953125, "global_step": 533317, "epoch": 6425} {"train_loss": -27.580060958862305, "global_step": 533318, "epoch": 6425} {"train_loss": -28.042383193969727, "global_step": 533319, "epoch": 6425} {"train_loss": -27.773651123046875, "global_step": 533320, "epoch": 6425} {"train_loss": -28.0236759185791, "global_step": 533321, "epoch": 6425} {"train_loss": -27.745105743408203, "global_step": 533322, "epoch": 6425} {"train_loss": -27.628376007080078, "global_step": 533323, "epoch": 6425} {"train_loss": -27.724822998046875, "global_step": 533324, "epoch": 6425} {"train_loss": -28.182559967041016, "global_step": 533325, "epoch": 6425} {"train_loss": -28.077619552612305, "global_step": 533326, "epoch": 6425} {"train_loss": -28.197797775268555, "global_step": 533327, "epoch": 6425} {"train_loss": -27.5063533782959, "global_step": 533328, "epoch": 6425} {"train_loss": -27.32061767578125, "global_step": 533329, "epoch": 6425} {"train_loss": -26.551883697509766, "global_step": 533330, "epoch": 6425} {"train_loss": -26.007373809814453, "global_step": 533331, "epoch": 6425} {"train_loss": -24.36366844177246, "global_step": 533332, "epoch": 6425} {"train_loss": -24.859882354736328, "global_step": 533333, "epoch": 6425} {"train_loss": -26.56036376953125, "global_step": 533334, "epoch": 6425} {"train_loss": -25.383991241455078, "global_step": 533335, "epoch": 6425} {"train_loss": -26.65577507019043, "global_step": 533336, "epoch": 6425} {"train_loss": -25.962377548217773, "global_step": 533337, "epoch": 6425} {"train_loss": -26.954792022705078, "global_step": 533338, "epoch": 6425} {"train_loss": -26.612417221069336, "global_step": 533339, "epoch": 6425} {"train_loss": -26.366165161132812, "global_step": 533340, "epoch": 6425} {"train_loss": -27.107858657836914, "global_step": 533341, "epoch": 6425} {"train_loss": -26.695959091186523, "global_step": 533342, "epoch": 6425} {"train_loss": -26.844839096069336, "global_step": 533343, "epoch": 6425} {"train_loss": -26.878097534179688, "global_step": 533344, "epoch": 6425} {"train_loss": -26.87604331970215, "global_step": 533345, "epoch": 6425} {"train_loss": -27.376089096069336, "global_step": 533346, "epoch": 6425} {"train_loss": -27.18512535095215, "global_step": 533347, "epoch": 6425} {"train_loss": -27.139280319213867, "global_step": 533348, "epoch": 6425} {"train_loss": -27.11883544921875, "global_step": 533349, "epoch": 6425} {"train_loss": -27.240264892578125, "global_step": 533350, "epoch": 6425} {"train_loss": -26.917545318603516, "global_step": 533351, "epoch": 6425} {"train_loss": -27.41718864440918, "global_step": 533352, "epoch": 6425} {"train_loss": -27.129114151000977, "global_step": 533353, "epoch": 6425} {"train_loss": -27.5494441986084, "global_step": 533354, "epoch": 6425} {"train_loss": -27.405588150024414, "global_step": 533355, "epoch": 6425} {"train_loss": -27.3559627532959, "global_step": 533356, "epoch": 6425} {"train_loss": -27.090061946087573, "global_step": 533357, "epoch": 6425, "val_loss": 6580298.0} {"train_loss": -27.39839744567871, "global_step": 533358, "epoch": 6426} {"train_loss": -27.325620651245117, "global_step": 533359, "epoch": 6426} {"train_loss": -27.255048751831055, "global_step": 533360, "epoch": 6426} {"train_loss": -27.088459014892578, "global_step": 533361, "epoch": 6426} {"train_loss": -27.164426803588867, "global_step": 533362, "epoch": 6426} {"train_loss": -27.18556785583496, "global_step": 533363, "epoch": 6426} {"train_loss": -26.90227699279785, "global_step": 533364, "epoch": 6426} {"train_loss": -27.055952072143555, "global_step": 533365, "epoch": 6426} {"train_loss": -27.185392379760742, "global_step": 533366, "epoch": 6426} {"train_loss": -26.955835342407227, "global_step": 533367, "epoch": 6426} {"train_loss": -27.378265380859375, "global_step": 533368, "epoch": 6426} {"train_loss": -27.34637451171875, "global_step": 533369, "epoch": 6426} {"train_loss": -27.335412979125977, "global_step": 533370, "epoch": 6426} {"train_loss": -27.50823974609375, "global_step": 533371, "epoch": 6426} {"train_loss": -27.249677658081055, "global_step": 533372, "epoch": 6426} {"train_loss": -27.338281631469727, "global_step": 533373, "epoch": 6426} {"train_loss": -26.926538467407227, "global_step": 533374, "epoch": 6426} {"train_loss": -27.4460506439209, "global_step": 533375, "epoch": 6426} {"train_loss": -27.54303550720215, "global_step": 533376, "epoch": 6426} {"train_loss": -27.502609252929688, "global_step": 533377, "epoch": 6426} {"train_loss": -27.821802139282227, "global_step": 533378, "epoch": 6426} {"train_loss": -27.71005630493164, "global_step": 533379, "epoch": 6426} {"train_loss": -27.518102645874023, "global_step": 533380, "epoch": 6426} {"train_loss": -27.608694076538086, "global_step": 533381, "epoch": 6426} {"train_loss": -27.629281997680664, "global_step": 533382, "epoch": 6426} {"train_loss": -27.5752010345459, "global_step": 533383, "epoch": 6426} {"train_loss": -27.849328994750977, "global_step": 533384, "epoch": 6426} {"train_loss": -27.713409423828125, "global_step": 533385, "epoch": 6426} {"train_loss": -28.016427993774414, "global_step": 533386, "epoch": 6426} {"train_loss": -27.310461044311523, "global_step": 533387, "epoch": 6426} {"train_loss": -27.578022003173828, "global_step": 533388, "epoch": 6426} {"train_loss": -27.509382247924805, "global_step": 533389, "epoch": 6426} {"train_loss": -27.2876033782959, "global_step": 533390, "epoch": 6426} {"train_loss": -27.8760986328125, "global_step": 533391, "epoch": 6426} {"train_loss": -27.90740394592285, "global_step": 533392, "epoch": 6426} {"train_loss": -27.617338180541992, "global_step": 533393, "epoch": 6426} {"train_loss": -27.67535972595215, "global_step": 533394, "epoch": 6426} {"train_loss": -27.204458236694336, "global_step": 533395, "epoch": 6426} {"train_loss": -27.599990844726562, "global_step": 533396, "epoch": 6426} {"train_loss": -27.30817222595215, "global_step": 533397, "epoch": 6426} {"train_loss": -27.45857048034668, "global_step": 533398, "epoch": 6426} {"train_loss": -27.819080352783203, "global_step": 533399, "epoch": 6426} {"train_loss": -27.857681274414062, "global_step": 533400, "epoch": 6426} {"train_loss": -27.54414176940918, "global_step": 533401, "epoch": 6426} {"train_loss": -27.794925689697266, "global_step": 533402, "epoch": 6426} {"train_loss": -27.797351837158203, "global_step": 533403, "epoch": 6426} {"train_loss": -27.982410430908203, "global_step": 533404, "epoch": 6426} {"train_loss": -27.553359985351562, "global_step": 533405, "epoch": 6426} {"train_loss": -28.229461669921875, "global_step": 533406, "epoch": 6426} {"train_loss": -27.931676864624023, "global_step": 533407, "epoch": 6426} {"train_loss": -27.655134201049805, "global_step": 533408, "epoch": 6426} {"train_loss": -27.907093048095703, "global_step": 533409, "epoch": 6426} {"train_loss": -27.8460693359375, "global_step": 533410, "epoch": 6426} {"train_loss": -27.692218780517578, "global_step": 533411, "epoch": 6426} {"train_loss": -27.496564865112305, "global_step": 533412, "epoch": 6426} {"train_loss": -27.81553077697754, "global_step": 533413, "epoch": 6426} {"train_loss": -27.687671661376953, "global_step": 533414, "epoch": 6426} {"train_loss": -27.387907028198242, "global_step": 533415, "epoch": 6426} {"train_loss": -27.780670166015625, "global_step": 533416, "epoch": 6426} {"train_loss": -27.799291610717773, "global_step": 533417, "epoch": 6426} {"train_loss": -27.78143310546875, "global_step": 533418, "epoch": 6426} {"train_loss": -27.93183708190918, "global_step": 533419, "epoch": 6426} {"train_loss": -27.38361167907715, "global_step": 533420, "epoch": 6426} {"train_loss": -27.434011459350586, "global_step": 533421, "epoch": 6426} {"train_loss": -27.81348991394043, "global_step": 533422, "epoch": 6426} {"train_loss": -28.05767822265625, "global_step": 533423, "epoch": 6426} {"train_loss": -27.8449649810791, "global_step": 533424, "epoch": 6426} {"train_loss": -27.743528366088867, "global_step": 533425, "epoch": 6426} {"train_loss": -27.100757598876953, "global_step": 533426, "epoch": 6426} {"train_loss": -27.667633056640625, "global_step": 533427, "epoch": 6426} {"train_loss": -27.7087345123291, "global_step": 533428, "epoch": 6426} {"train_loss": -27.413801193237305, "global_step": 533429, "epoch": 6426} {"train_loss": -27.17414665222168, "global_step": 533430, "epoch": 6426} {"train_loss": -27.54749870300293, "global_step": 533431, "epoch": 6426} {"train_loss": -27.44562339782715, "global_step": 533432, "epoch": 6426} {"train_loss": -27.68896484375, "global_step": 533433, "epoch": 6426} {"train_loss": -27.388660430908203, "global_step": 533434, "epoch": 6426} {"train_loss": -27.217050552368164, "global_step": 533435, "epoch": 6426} {"train_loss": -27.397565841674805, "global_step": 533436, "epoch": 6426} {"train_loss": -27.79532814025879, "global_step": 533437, "epoch": 6426} {"train_loss": -27.91916275024414, "global_step": 533438, "epoch": 6426} {"train_loss": -27.699583053588867, "global_step": 533439, "epoch": 6426} {"train_loss": -27.56284437983869, "global_step": 533440, "epoch": 6426, "val_loss": 6536442.0} {"train_loss": -27.10169792175293, "global_step": 533441, "epoch": 6427} {"train_loss": -27.540090560913086, "global_step": 533442, "epoch": 6427} {"train_loss": -27.143665313720703, "global_step": 533443, "epoch": 6427} {"train_loss": -27.213642120361328, "global_step": 533444, "epoch": 6427} {"train_loss": -27.293701171875, "global_step": 533445, "epoch": 6427} {"train_loss": -26.97747802734375, "global_step": 533446, "epoch": 6427} {"train_loss": -27.51300048828125, "global_step": 533447, "epoch": 6427} {"train_loss": -26.937170028686523, "global_step": 533448, "epoch": 6427} {"train_loss": -27.41303062438965, "global_step": 533449, "epoch": 6427} {"train_loss": -27.69561195373535, "global_step": 533450, "epoch": 6427} {"train_loss": -27.427114486694336, "global_step": 533451, "epoch": 6427} {"train_loss": -27.13593101501465, "global_step": 533452, "epoch": 6427} {"train_loss": -27.23374366760254, "global_step": 533453, "epoch": 6427} {"train_loss": -27.456144332885742, "global_step": 533454, "epoch": 6427} {"train_loss": -27.5670108795166, "global_step": 533455, "epoch": 6427} {"train_loss": -27.424917221069336, "global_step": 533456, "epoch": 6427} {"train_loss": -27.99749755859375, "global_step": 533457, "epoch": 6427} {"train_loss": -26.96841812133789, "global_step": 533458, "epoch": 6427} {"train_loss": -27.451440811157227, "global_step": 533459, "epoch": 6427} {"train_loss": -27.289823532104492, "global_step": 533460, "epoch": 6427} {"train_loss": -27.046478271484375, "global_step": 533461, "epoch": 6427} {"train_loss": -27.366003036499023, "global_step": 533462, "epoch": 6427} {"train_loss": -27.2728214263916, "global_step": 533463, "epoch": 6427} {"train_loss": -27.307270050048828, "global_step": 533464, "epoch": 6427} {"train_loss": -27.655935287475586, "global_step": 533465, "epoch": 6427} {"train_loss": -27.564916610717773, "global_step": 533466, "epoch": 6427} {"train_loss": -27.512231826782227, "global_step": 533467, "epoch": 6427} {"train_loss": -27.813505172729492, "global_step": 533468, "epoch": 6427} {"train_loss": -27.639379501342773, "global_step": 533469, "epoch": 6427} {"train_loss": -27.45672607421875, "global_step": 533470, "epoch": 6427} {"train_loss": -27.722314834594727, "global_step": 533471, "epoch": 6427} {"train_loss": -27.55854606628418, "global_step": 533472, "epoch": 6427} {"train_loss": -27.495758056640625, "global_step": 533473, "epoch": 6427} {"train_loss": -27.561328887939453, "global_step": 533474, "epoch": 6427} {"train_loss": -28.06776237487793, "global_step": 533475, "epoch": 6427} {"train_loss": -27.635217666625977, "global_step": 533476, "epoch": 6427} {"train_loss": -28.082685470581055, "global_step": 533477, "epoch": 6427} {"train_loss": -27.279104232788086, "global_step": 533478, "epoch": 6427} {"train_loss": -27.776580810546875, "global_step": 533479, "epoch": 6427} {"train_loss": -27.693710327148438, "global_step": 533480, "epoch": 6427} {"train_loss": -27.9703426361084, "global_step": 533481, "epoch": 6427} {"train_loss": -27.524328231811523, "global_step": 533482, "epoch": 6427} {"train_loss": -27.692590713500977, "global_step": 533483, "epoch": 6427} {"train_loss": -27.544164657592773, "global_step": 533484, "epoch": 6427} {"train_loss": -27.991369247436523, "global_step": 533485, "epoch": 6427} {"train_loss": -27.790576934814453, "global_step": 533486, "epoch": 6427} {"train_loss": -27.688053131103516, "global_step": 533487, "epoch": 6427} {"train_loss": -28.152387619018555, "global_step": 533488, "epoch": 6427} {"train_loss": -27.98406410217285, "global_step": 533489, "epoch": 6427} {"train_loss": -27.52777099609375, "global_step": 533490, "epoch": 6427} {"train_loss": -27.456165313720703, "global_step": 533491, "epoch": 6427} {"train_loss": -27.410358428955078, "global_step": 533492, "epoch": 6427} {"train_loss": -27.824365615844727, "global_step": 533493, "epoch": 6427} {"train_loss": -27.75251579284668, "global_step": 533494, "epoch": 6427} {"train_loss": -27.675312042236328, "global_step": 533495, "epoch": 6427} {"train_loss": -27.902002334594727, "global_step": 533496, "epoch": 6427} {"train_loss": -27.80440330505371, "global_step": 533497, "epoch": 6427} {"train_loss": -27.91825294494629, "global_step": 533498, "epoch": 6427} {"train_loss": -27.426965713500977, "global_step": 533499, "epoch": 6427} {"train_loss": -27.25642204284668, "global_step": 533500, "epoch": 6427} {"train_loss": -27.390396118164062, "global_step": 533501, "epoch": 6427} {"train_loss": -27.113006591796875, "global_step": 533502, "epoch": 6427} {"train_loss": -27.42656898498535, "global_step": 533503, "epoch": 6427} {"train_loss": -27.67400550842285, "global_step": 533504, "epoch": 6427} {"train_loss": -27.727582931518555, "global_step": 533505, "epoch": 6427} {"train_loss": -27.50927734375, "global_step": 533506, "epoch": 6427} {"train_loss": -27.849756240844727, "global_step": 533507, "epoch": 6427} {"train_loss": -27.132843017578125, "global_step": 533508, "epoch": 6427} {"train_loss": -27.7131290435791, "global_step": 533509, "epoch": 6427} {"train_loss": -27.436307907104492, "global_step": 533510, "epoch": 6427} {"train_loss": -27.3718318939209, "global_step": 533511, "epoch": 6427} {"train_loss": -27.603178024291992, "global_step": 533512, "epoch": 6427} {"train_loss": -27.431188583374023, "global_step": 533513, "epoch": 6427} {"train_loss": -27.7769718170166, "global_step": 533514, "epoch": 6427} {"train_loss": -27.608869552612305, "global_step": 533515, "epoch": 6427} {"train_loss": -27.558984756469727, "global_step": 533516, "epoch": 6427} {"train_loss": -27.463056564331055, "global_step": 533517, "epoch": 6427} {"train_loss": -27.61728858947754, "global_step": 533518, "epoch": 6427} {"train_loss": -27.662702560424805, "global_step": 533519, "epoch": 6427} {"train_loss": -27.860593795776367, "global_step": 533520, "epoch": 6427} {"train_loss": -27.724075317382812, "global_step": 533521, "epoch": 6427} {"train_loss": -27.771459579467773, "global_step": 533522, "epoch": 6427} {"train_loss": -27.55493927001953, "global_step": 533523, "epoch": 6427, "val_loss": 6473384.0} {"train_loss": -26.555646896362305, "global_step": 533524, "epoch": 6428} {"train_loss": -25.719146728515625, "global_step": 533525, "epoch": 6428} {"train_loss": -26.720661163330078, "global_step": 533526, "epoch": 6428} {"train_loss": -26.77821159362793, "global_step": 533527, "epoch": 6428} {"train_loss": -26.845495223999023, "global_step": 533528, "epoch": 6428} {"train_loss": -27.043197631835938, "global_step": 533529, "epoch": 6428} {"train_loss": -26.681806564331055, "global_step": 533530, "epoch": 6428} {"train_loss": -26.62227439880371, "global_step": 533531, "epoch": 6428} {"train_loss": -27.456439971923828, "global_step": 533532, "epoch": 6428} {"train_loss": -27.299474716186523, "global_step": 533533, "epoch": 6428} {"train_loss": -27.136194229125977, "global_step": 533534, "epoch": 6428} {"train_loss": -27.21731948852539, "global_step": 533535, "epoch": 6428} {"train_loss": -27.32390785217285, "global_step": 533536, "epoch": 6428} {"train_loss": -26.924213409423828, "global_step": 533537, "epoch": 6428} {"train_loss": -27.609289169311523, "global_step": 533538, "epoch": 6428} {"train_loss": -27.048969268798828, "global_step": 533539, "epoch": 6428} {"train_loss": -27.374059677124023, "global_step": 533540, "epoch": 6428} {"train_loss": -27.231094360351562, "global_step": 533541, "epoch": 6428} {"train_loss": -27.352752685546875, "global_step": 533542, "epoch": 6428} {"train_loss": -27.3938045501709, "global_step": 533543, "epoch": 6428} {"train_loss": -27.330890655517578, "global_step": 533544, "epoch": 6428} {"train_loss": -27.66285514831543, "global_step": 533545, "epoch": 6428} {"train_loss": -27.383771896362305, "global_step": 533546, "epoch": 6428} {"train_loss": -27.515775680541992, "global_step": 533547, "epoch": 6428} {"train_loss": -27.28080177307129, "global_step": 533548, "epoch": 6428} {"train_loss": -27.380956649780273, "global_step": 533549, "epoch": 6428} {"train_loss": -27.249637603759766, "global_step": 533550, "epoch": 6428} {"train_loss": -27.292530059814453, "global_step": 533551, "epoch": 6428} {"train_loss": -27.759021759033203, "global_step": 533552, "epoch": 6428} {"train_loss": -27.701416015625, "global_step": 533553, "epoch": 6428} {"train_loss": -27.127294540405273, "global_step": 533554, "epoch": 6428} {"train_loss": -27.4821834564209, "global_step": 533555, "epoch": 6428} {"train_loss": -27.581525802612305, "global_step": 533556, "epoch": 6428} {"train_loss": -27.309858322143555, "global_step": 533557, "epoch": 6428} {"train_loss": -27.415761947631836, "global_step": 533558, "epoch": 6428} {"train_loss": -27.092573165893555, "global_step": 533559, "epoch": 6428} {"train_loss": -27.822874069213867, "global_step": 533560, "epoch": 6428} {"train_loss": -27.56504249572754, "global_step": 533561, "epoch": 6428} {"train_loss": -27.887235641479492, "global_step": 533562, "epoch": 6428} {"train_loss": -27.914426803588867, "global_step": 533563, "epoch": 6428} {"train_loss": -27.468189239501953, "global_step": 533564, "epoch": 6428} {"train_loss": -27.492406845092773, "global_step": 533565, "epoch": 6428} {"train_loss": -27.51482582092285, "global_step": 533566, "epoch": 6428} {"train_loss": -27.79180335998535, "global_step": 533567, "epoch": 6428} {"train_loss": -27.511524200439453, "global_step": 533568, "epoch": 6428} {"train_loss": -27.828702926635742, "global_step": 533569, "epoch": 6428} {"train_loss": -27.792409896850586, "global_step": 533570, "epoch": 6428} {"train_loss": -27.683948516845703, "global_step": 533571, "epoch": 6428} {"train_loss": -27.627410888671875, "global_step": 533572, "epoch": 6428} {"train_loss": -27.539575576782227, "global_step": 533573, "epoch": 6428} {"train_loss": -27.62139320373535, "global_step": 533574, "epoch": 6428} {"train_loss": -27.895811080932617, "global_step": 533575, "epoch": 6428} {"train_loss": -27.30353355407715, "global_step": 533576, "epoch": 6428} {"train_loss": -27.833576202392578, "global_step": 533577, "epoch": 6428} {"train_loss": -26.958906173706055, "global_step": 533578, "epoch": 6428} {"train_loss": -27.809797286987305, "global_step": 533579, "epoch": 6428} {"train_loss": -27.1117000579834, "global_step": 533580, "epoch": 6428} {"train_loss": -27.5206356048584, "global_step": 533581, "epoch": 6428} {"train_loss": -27.413110733032227, "global_step": 533582, "epoch": 6428} {"train_loss": -27.5283145904541, "global_step": 533583, "epoch": 6428} {"train_loss": -27.671802520751953, "global_step": 533584, "epoch": 6428} {"train_loss": -27.607837677001953, "global_step": 533585, "epoch": 6428} {"train_loss": -27.796295166015625, "global_step": 533586, "epoch": 6428} {"train_loss": -27.73927116394043, "global_step": 533587, "epoch": 6428} {"train_loss": -27.51698112487793, "global_step": 533588, "epoch": 6428} {"train_loss": -27.9620304107666, "global_step": 533589, "epoch": 6428} {"train_loss": -27.79837417602539, "global_step": 533590, "epoch": 6428} {"train_loss": -27.41533851623535, "global_step": 533591, "epoch": 6428} {"train_loss": -27.705078125, "global_step": 533592, "epoch": 6428} {"train_loss": -27.27532958984375, "global_step": 533593, "epoch": 6428} {"train_loss": -27.29461097717285, "global_step": 533594, "epoch": 6428} {"train_loss": -27.46412467956543, "global_step": 533595, "epoch": 6428} {"train_loss": -27.505773544311523, "global_step": 533596, "epoch": 6428} {"train_loss": -27.63046646118164, "global_step": 533597, "epoch": 6428} {"train_loss": -27.464475631713867, "global_step": 533598, "epoch": 6428} {"train_loss": -27.392240524291992, "global_step": 533599, "epoch": 6428} {"train_loss": -27.31414222717285, "global_step": 533600, "epoch": 6428} {"train_loss": -27.664844512939453, "global_step": 533601, "epoch": 6428} {"train_loss": -27.841337203979492, "global_step": 533602, "epoch": 6428} {"train_loss": -27.58794593811035, "global_step": 533603, "epoch": 6428} {"train_loss": -27.4333553314209, "global_step": 533604, "epoch": 6428} {"train_loss": -27.829519271850586, "global_step": 533605, "epoch": 6428} {"train_loss": -27.418597186904357, "global_step": 533606, "epoch": 6428, "val_loss": 6495107.0} {"train_loss": -27.196653366088867, "global_step": 533607, "epoch": 6429} {"train_loss": -26.21697425842285, "global_step": 533608, "epoch": 6429} {"train_loss": -26.033212661743164, "global_step": 533609, "epoch": 6429} {"train_loss": -26.870298385620117, "global_step": 533610, "epoch": 6429} {"train_loss": -26.91817283630371, "global_step": 533611, "epoch": 6429} {"train_loss": -26.77060317993164, "global_step": 533612, "epoch": 6429} {"train_loss": -27.154489517211914, "global_step": 533613, "epoch": 6429} {"train_loss": -27.24001121520996, "global_step": 533614, "epoch": 6429} {"train_loss": -26.865156173706055, "global_step": 533615, "epoch": 6429} {"train_loss": -27.06926918029785, "global_step": 533616, "epoch": 6429} {"train_loss": -27.476520538330078, "global_step": 533617, "epoch": 6429} {"train_loss": -27.200254440307617, "global_step": 533618, "epoch": 6429} {"train_loss": -27.290746688842773, "global_step": 533619, "epoch": 6429} {"train_loss": -27.1353816986084, "global_step": 533620, "epoch": 6429} {"train_loss": -27.080305099487305, "global_step": 533621, "epoch": 6429} {"train_loss": -26.76521110534668, "global_step": 533622, "epoch": 6429} {"train_loss": -27.10968017578125, "global_step": 533623, "epoch": 6429} {"train_loss": -27.508655548095703, "global_step": 533624, "epoch": 6429} {"train_loss": -27.669143676757812, "global_step": 533625, "epoch": 6429} {"train_loss": -26.975156784057617, "global_step": 533626, "epoch": 6429} {"train_loss": -27.4669246673584, "global_step": 533627, "epoch": 6429} {"train_loss": -27.421600341796875, "global_step": 533628, "epoch": 6429} {"train_loss": -27.409616470336914, "global_step": 533629, "epoch": 6429} {"train_loss": -27.60773277282715, "global_step": 533630, "epoch": 6429} {"train_loss": -27.505619049072266, "global_step": 533631, "epoch": 6429} {"train_loss": -27.3542537689209, "global_step": 533632, "epoch": 6429} {"train_loss": -27.374835968017578, "global_step": 533633, "epoch": 6429} {"train_loss": -27.177209854125977, "global_step": 533634, "epoch": 6429} {"train_loss": -27.59937858581543, "global_step": 533635, "epoch": 6429} {"train_loss": -27.347455978393555, "global_step": 533636, "epoch": 6429} {"train_loss": -26.92719841003418, "global_step": 533637, "epoch": 6429} {"train_loss": -26.543161392211914, "global_step": 533638, "epoch": 6429} {"train_loss": -27.181528091430664, "global_step": 533639, "epoch": 6429} {"train_loss": -27.894458770751953, "global_step": 533640, "epoch": 6429} {"train_loss": -27.581457138061523, "global_step": 533641, "epoch": 6429} {"train_loss": -27.722333908081055, "global_step": 533642, "epoch": 6429} {"train_loss": -27.555023193359375, "global_step": 533643, "epoch": 6429} {"train_loss": -27.909692764282227, "global_step": 533644, "epoch": 6429} {"train_loss": -27.53862953186035, "global_step": 533645, "epoch": 6429} {"train_loss": -27.41845703125, "global_step": 533646, "epoch": 6429} {"train_loss": -27.516498565673828, "global_step": 533647, "epoch": 6429} {"train_loss": -27.35662269592285, "global_step": 533648, "epoch": 6429} {"train_loss": -27.468061447143555, "global_step": 533649, "epoch": 6429} {"train_loss": -27.7902774810791, "global_step": 533650, "epoch": 6429} {"train_loss": -27.633996963500977, "global_step": 533651, "epoch": 6429} {"train_loss": -27.746326446533203, "global_step": 533652, "epoch": 6429} {"train_loss": -27.55019187927246, "global_step": 533653, "epoch": 6429} {"train_loss": -27.60601234436035, "global_step": 533654, "epoch": 6429} {"train_loss": -27.822961807250977, "global_step": 533655, "epoch": 6429} {"train_loss": -27.625940322875977, "global_step": 533656, "epoch": 6429} {"train_loss": -27.90244483947754, "global_step": 533657, "epoch": 6429} {"train_loss": -28.076200485229492, "global_step": 533658, "epoch": 6429} {"train_loss": -28.15130043029785, "global_step": 533659, "epoch": 6429} {"train_loss": -27.900592803955078, "global_step": 533660, "epoch": 6429} {"train_loss": -27.869131088256836, "global_step": 533661, "epoch": 6429} {"train_loss": -27.577905654907227, "global_step": 533662, "epoch": 6429} {"train_loss": -28.058752059936523, "global_step": 533663, "epoch": 6429} {"train_loss": -27.97626304626465, "global_step": 533664, "epoch": 6429} {"train_loss": -27.8450984954834, "global_step": 533665, "epoch": 6429} {"train_loss": -27.698606491088867, "global_step": 533666, "epoch": 6429} {"train_loss": -27.452777862548828, "global_step": 533667, "epoch": 6429} {"train_loss": -27.411151885986328, "global_step": 533668, "epoch": 6429} {"train_loss": -27.782459259033203, "global_step": 533669, "epoch": 6429} {"train_loss": -27.46315574645996, "global_step": 533670, "epoch": 6429} {"train_loss": -27.61647605895996, "global_step": 533671, "epoch": 6429} {"train_loss": -27.515649795532227, "global_step": 533672, "epoch": 6429} {"train_loss": -27.542036056518555, "global_step": 533673, "epoch": 6429} {"train_loss": -27.454132080078125, "global_step": 533674, "epoch": 6429} {"train_loss": -27.3552188873291, "global_step": 533675, "epoch": 6429} {"train_loss": -26.786426544189453, "global_step": 533676, "epoch": 6429} {"train_loss": -26.5772705078125, "global_step": 533677, "epoch": 6429} {"train_loss": -27.253076553344727, "global_step": 533678, "epoch": 6429} {"train_loss": -27.510961532592773, "global_step": 533679, "epoch": 6429} {"train_loss": -27.051889419555664, "global_step": 533680, "epoch": 6429} {"train_loss": -27.357587814331055, "global_step": 533681, "epoch": 6429} {"train_loss": -27.40769386291504, "global_step": 533682, "epoch": 6429} {"train_loss": -27.542682647705078, "global_step": 533683, "epoch": 6429} {"train_loss": -27.392751693725586, "global_step": 533684, "epoch": 6429} {"train_loss": -27.623764038085938, "global_step": 533685, "epoch": 6429} {"train_loss": -27.819595336914062, "global_step": 533686, "epoch": 6429} {"train_loss": -27.873197555541992, "global_step": 533687, "epoch": 6429} {"train_loss": -27.42886734008789, "global_step": 533688, "epoch": 6429} {"train_loss": -27.39387698345874, "global_step": 533689, "epoch": 6429, "val_loss": 6546799.0} {"train_loss": -27.282392501831055, "global_step": 533690, "epoch": 6430} {"train_loss": -26.9382381439209, "global_step": 533691, "epoch": 6430} {"train_loss": -27.218921661376953, "global_step": 533692, "epoch": 6430} {"train_loss": -26.957956314086914, "global_step": 533693, "epoch": 6430} {"train_loss": -27.32466697692871, "global_step": 533694, "epoch": 6430} {"train_loss": -27.311843872070312, "global_step": 533695, "epoch": 6430} {"train_loss": -26.74762535095215, "global_step": 533696, "epoch": 6430} {"train_loss": -27.29315185546875, "global_step": 533697, "epoch": 6430} {"train_loss": -27.0603084564209, "global_step": 533698, "epoch": 6430} {"train_loss": -27.7445011138916, "global_step": 533699, "epoch": 6430} {"train_loss": -27.555206298828125, "global_step": 533700, "epoch": 6430} {"train_loss": -27.37162208557129, "global_step": 533701, "epoch": 6430} {"train_loss": -27.02800941467285, "global_step": 533702, "epoch": 6430} {"train_loss": -27.091421127319336, "global_step": 533703, "epoch": 6430} {"train_loss": -27.305744171142578, "global_step": 533704, "epoch": 6430} {"train_loss": -27.62929344177246, "global_step": 533705, "epoch": 6430} {"train_loss": -27.537389755249023, "global_step": 533706, "epoch": 6430} {"train_loss": -27.526107788085938, "global_step": 533707, "epoch": 6430} {"train_loss": -27.812414169311523, "global_step": 533708, "epoch": 6430} {"train_loss": -27.15740966796875, "global_step": 533709, "epoch": 6430} {"train_loss": -27.341291427612305, "global_step": 533710, "epoch": 6430} {"train_loss": -27.3819580078125, "global_step": 533711, "epoch": 6430} {"train_loss": -27.29725456237793, "global_step": 533712, "epoch": 6430} {"train_loss": -27.672101974487305, "global_step": 533713, "epoch": 6430} {"train_loss": -27.730695724487305, "global_step": 533714, "epoch": 6430} {"train_loss": -27.700138092041016, "global_step": 533715, "epoch": 6430} {"train_loss": -27.5915470123291, "global_step": 533716, "epoch": 6430} {"train_loss": -27.44003677368164, "global_step": 533717, "epoch": 6430} {"train_loss": -27.6781005859375, "global_step": 533718, "epoch": 6430} {"train_loss": -27.413944244384766, "global_step": 533719, "epoch": 6430} {"train_loss": -27.755361557006836, "global_step": 533720, "epoch": 6430} {"train_loss": -27.37387466430664, "global_step": 533721, "epoch": 6430} {"train_loss": -27.74933433532715, "global_step": 533722, "epoch": 6430} {"train_loss": -27.55982780456543, "global_step": 533723, "epoch": 6430} {"train_loss": -27.558507919311523, "global_step": 533724, "epoch": 6430} {"train_loss": -27.505212783813477, "global_step": 533725, "epoch": 6430} {"train_loss": -27.60614585876465, "global_step": 533726, "epoch": 6430} {"train_loss": -27.787384033203125, "global_step": 533727, "epoch": 6430} {"train_loss": -27.58430290222168, "global_step": 533728, "epoch": 6430} {"train_loss": -27.758167266845703, "global_step": 533729, "epoch": 6430} {"train_loss": -27.648441314697266, "global_step": 533730, "epoch": 6430} {"train_loss": -27.946842193603516, "global_step": 533731, "epoch": 6430} {"train_loss": -28.03571891784668, "global_step": 533732, "epoch": 6430} {"train_loss": -27.842823028564453, "global_step": 533733, "epoch": 6430} {"train_loss": -27.90772819519043, "global_step": 533734, "epoch": 6430} {"train_loss": -27.95612144470215, "global_step": 533735, "epoch": 6430} {"train_loss": -27.4346866607666, "global_step": 533736, "epoch": 6430} {"train_loss": -27.691608428955078, "global_step": 533737, "epoch": 6430} {"train_loss": -28.056167602539062, "global_step": 533738, "epoch": 6430} {"train_loss": -27.72040367126465, "global_step": 533739, "epoch": 6430} {"train_loss": -27.750232696533203, "global_step": 533740, "epoch": 6430} {"train_loss": -27.69929313659668, "global_step": 533741, "epoch": 6430} {"train_loss": -27.543928146362305, "global_step": 533742, "epoch": 6430} {"train_loss": -27.884435653686523, "global_step": 533743, "epoch": 6430} {"train_loss": -28.025415420532227, "global_step": 533744, "epoch": 6430} {"train_loss": -27.585973739624023, "global_step": 533745, "epoch": 6430} {"train_loss": -27.914819717407227, "global_step": 533746, "epoch": 6430} {"train_loss": -27.73540687561035, "global_step": 533747, "epoch": 6430} {"train_loss": -27.75357437133789, "global_step": 533748, "epoch": 6430} {"train_loss": -27.651105880737305, "global_step": 533749, "epoch": 6430} {"train_loss": -27.84954833984375, "global_step": 533750, "epoch": 6430} {"train_loss": -27.674787521362305, "global_step": 533751, "epoch": 6430} {"train_loss": -27.24517822265625, "global_step": 533752, "epoch": 6430} {"train_loss": -27.40524673461914, "global_step": 533753, "epoch": 6430} {"train_loss": -27.35776138305664, "global_step": 533754, "epoch": 6430} {"train_loss": -27.79340171813965, "global_step": 533755, "epoch": 6430} {"train_loss": -27.224512100219727, "global_step": 533756, "epoch": 6430} {"train_loss": -27.50373649597168, "global_step": 533757, "epoch": 6430} {"train_loss": -27.635168075561523, "global_step": 533758, "epoch": 6430} {"train_loss": -27.468997955322266, "global_step": 533759, "epoch": 6430} {"train_loss": -27.470361709594727, "global_step": 533760, "epoch": 6430} {"train_loss": -28.154159545898438, "global_step": 533761, "epoch": 6430} {"train_loss": -27.40761375427246, "global_step": 533762, "epoch": 6430} {"train_loss": -27.53910255432129, "global_step": 533763, "epoch": 6430} {"train_loss": -27.629898071289062, "global_step": 533764, "epoch": 6430} {"train_loss": -27.380048751831055, "global_step": 533765, "epoch": 6430} {"train_loss": -27.76832389831543, "global_step": 533766, "epoch": 6430} {"train_loss": -27.775243759155273, "global_step": 533767, "epoch": 6430} {"train_loss": -27.751117706298828, "global_step": 533768, "epoch": 6430} {"train_loss": -27.403949737548828, "global_step": 533769, "epoch": 6430} {"train_loss": -27.290449142456055, "global_step": 533770, "epoch": 6430} {"train_loss": -27.531763076782227, "global_step": 533771, "epoch": 6430} {"train_loss": -27.576851350715362, "global_step": 533772, "epoch": 6430, "val_loss": 6588017.0} {"train_loss": -25.081560134887695, "global_step": 533773, "epoch": 6431} {"train_loss": -25.247730255126953, "global_step": 533774, "epoch": 6431} {"train_loss": -24.624555587768555, "global_step": 533775, "epoch": 6431} {"train_loss": -26.80623435974121, "global_step": 533776, "epoch": 6431} {"train_loss": -26.240020751953125, "global_step": 533777, "epoch": 6431} {"train_loss": -25.789295196533203, "global_step": 533778, "epoch": 6431} {"train_loss": -26.66725730895996, "global_step": 533779, "epoch": 6431} {"train_loss": -26.113269805908203, "global_step": 533780, "epoch": 6431} {"train_loss": -26.95306968688965, "global_step": 533781, "epoch": 6431} {"train_loss": -26.619821548461914, "global_step": 533782, "epoch": 6431} {"train_loss": -26.914060592651367, "global_step": 533783, "epoch": 6431} {"train_loss": -26.774023056030273, "global_step": 533784, "epoch": 6431} {"train_loss": -27.01227378845215, "global_step": 533785, "epoch": 6431} {"train_loss": -26.23137855529785, "global_step": 533786, "epoch": 6431} {"train_loss": -27.33721923828125, "global_step": 533787, "epoch": 6431} {"train_loss": -26.950265884399414, "global_step": 533788, "epoch": 6431} {"train_loss": -27.144794464111328, "global_step": 533789, "epoch": 6431} {"train_loss": -26.988245010375977, "global_step": 533790, "epoch": 6431} {"train_loss": -26.83539390563965, "global_step": 533791, "epoch": 6431} {"train_loss": -26.859790802001953, "global_step": 533792, "epoch": 6431} {"train_loss": -27.165191650390625, "global_step": 533793, "epoch": 6431} {"train_loss": -27.118728637695312, "global_step": 533794, "epoch": 6431} {"train_loss": -26.819034576416016, "global_step": 533795, "epoch": 6431} {"train_loss": -27.30303382873535, "global_step": 533796, "epoch": 6431} {"train_loss": -27.530725479125977, "global_step": 533797, "epoch": 6431} {"train_loss": -27.33538818359375, "global_step": 533798, "epoch": 6431} {"train_loss": -26.862451553344727, "global_step": 533799, "epoch": 6431} {"train_loss": -27.261371612548828, "global_step": 533800, "epoch": 6431} {"train_loss": -27.394052505493164, "global_step": 533801, "epoch": 6431} {"train_loss": -27.1981258392334, "global_step": 533802, "epoch": 6431} {"train_loss": -27.4183349609375, "global_step": 533803, "epoch": 6431} {"train_loss": -27.953611373901367, "global_step": 533804, "epoch": 6431} {"train_loss": -27.360549926757812, "global_step": 533805, "epoch": 6431} {"train_loss": -27.50787353515625, "global_step": 533806, "epoch": 6431} {"train_loss": -27.51837158203125, "global_step": 533807, "epoch": 6431} {"train_loss": -27.46516990661621, "global_step": 533808, "epoch": 6431} {"train_loss": -27.760547637939453, "global_step": 533809, "epoch": 6431} {"train_loss": -27.283178329467773, "global_step": 533810, "epoch": 6431} {"train_loss": -27.668989181518555, "global_step": 533811, "epoch": 6431} {"train_loss": -27.625965118408203, "global_step": 533812, "epoch": 6431} {"train_loss": -27.760709762573242, "global_step": 533813, "epoch": 6431} {"train_loss": -27.409738540649414, "global_step": 533814, "epoch": 6431} {"train_loss": -27.414596557617188, "global_step": 533815, "epoch": 6431} {"train_loss": -27.608783721923828, "global_step": 533816, "epoch": 6431} {"train_loss": -27.622602462768555, "global_step": 533817, "epoch": 6431} {"train_loss": -27.705204010009766, "global_step": 533818, "epoch": 6431} {"train_loss": -27.703603744506836, "global_step": 533819, "epoch": 6431} {"train_loss": -27.682147979736328, "global_step": 533820, "epoch": 6431} {"train_loss": -27.063077926635742, "global_step": 533821, "epoch": 6431} {"train_loss": -27.335966110229492, "global_step": 533822, "epoch": 6431} {"train_loss": -27.749347686767578, "global_step": 533823, "epoch": 6431} {"train_loss": -27.87526512145996, "global_step": 533824, "epoch": 6431} {"train_loss": -27.49196434020996, "global_step": 533825, "epoch": 6431} {"train_loss": -27.886001586914062, "global_step": 533826, "epoch": 6431} {"train_loss": -27.820453643798828, "global_step": 533827, "epoch": 6431} {"train_loss": -27.38727378845215, "global_step": 533828, "epoch": 6431} {"train_loss": -27.447296142578125, "global_step": 533829, "epoch": 6431} {"train_loss": -27.617380142211914, "global_step": 533830, "epoch": 6431} {"train_loss": -27.60015296936035, "global_step": 533831, "epoch": 6431} {"train_loss": -27.289825439453125, "global_step": 533832, "epoch": 6431} {"train_loss": -27.188100814819336, "global_step": 533833, "epoch": 6431} {"train_loss": -27.78683853149414, "global_step": 533834, "epoch": 6431} {"train_loss": -27.770578384399414, "global_step": 533835, "epoch": 6431} {"train_loss": -27.7543888092041, "global_step": 533836, "epoch": 6431} {"train_loss": -27.57148551940918, "global_step": 533837, "epoch": 6431} {"train_loss": -27.671979904174805, "global_step": 533838, "epoch": 6431} {"train_loss": -27.547351837158203, "global_step": 533839, "epoch": 6431} {"train_loss": -27.8268985748291, "global_step": 533840, "epoch": 6431} {"train_loss": -27.47515869140625, "global_step": 533841, "epoch": 6431} {"train_loss": -27.52044105529785, "global_step": 533842, "epoch": 6431} {"train_loss": -27.980016708374023, "global_step": 533843, "epoch": 6431} {"train_loss": -27.51287841796875, "global_step": 533844, "epoch": 6431} {"train_loss": -27.53303337097168, "global_step": 533845, "epoch": 6431} {"train_loss": -27.716115951538086, "global_step": 533846, "epoch": 6431} {"train_loss": -27.54828453063965, "global_step": 533847, "epoch": 6431} {"train_loss": -27.8160457611084, "global_step": 533848, "epoch": 6431} {"train_loss": -27.779699325561523, "global_step": 533849, "epoch": 6431} {"train_loss": -27.714649200439453, "global_step": 533850, "epoch": 6431} {"train_loss": -28.00201416015625, "global_step": 533851, "epoch": 6431} {"train_loss": -27.712873458862305, "global_step": 533852, "epoch": 6431} {"train_loss": -27.4498291015625, "global_step": 533853, "epoch": 6431} {"train_loss": -27.6500301361084, "global_step": 533854, "epoch": 6431} {"train_loss": -27.274839240384388, "global_step": 533855, "epoch": 6431, "val_loss": 6504077.0} {"train_loss": -27.047033309936523, "global_step": 533856, "epoch": 6432} {"train_loss": -26.242328643798828, "global_step": 533857, "epoch": 6432} {"train_loss": -26.869739532470703, "global_step": 533858, "epoch": 6432} {"train_loss": -27.04718017578125, "global_step": 533859, "epoch": 6432} {"train_loss": -26.728967666625977, "global_step": 533860, "epoch": 6432} {"train_loss": -27.180713653564453, "global_step": 533861, "epoch": 6432} {"train_loss": -26.909265518188477, "global_step": 533862, "epoch": 6432} {"train_loss": -26.64105796813965, "global_step": 533863, "epoch": 6432} {"train_loss": -26.936185836791992, "global_step": 533864, "epoch": 6432} {"train_loss": -27.34030532836914, "global_step": 533865, "epoch": 6432} {"train_loss": -27.366559982299805, "global_step": 533866, "epoch": 6432} {"train_loss": -27.501758575439453, "global_step": 533867, "epoch": 6432} {"train_loss": -27.17683219909668, "global_step": 533868, "epoch": 6432} {"train_loss": -27.581878662109375, "global_step": 533869, "epoch": 6432} {"train_loss": -26.95440673828125, "global_step": 533870, "epoch": 6432} {"train_loss": -27.393142700195312, "global_step": 533871, "epoch": 6432} {"train_loss": -27.42530632019043, "global_step": 533872, "epoch": 6432} {"train_loss": -27.408117294311523, "global_step": 533873, "epoch": 6432} {"train_loss": -27.56475830078125, "global_step": 533874, "epoch": 6432} {"train_loss": -27.213104248046875, "global_step": 533875, "epoch": 6432} {"train_loss": -27.57015037536621, "global_step": 533876, "epoch": 6432} {"train_loss": -27.6387882232666, "global_step": 533877, "epoch": 6432} {"train_loss": -27.224273681640625, "global_step": 533878, "epoch": 6432} {"train_loss": -27.57106590270996, "global_step": 533879, "epoch": 6432} {"train_loss": -27.57667350769043, "global_step": 533880, "epoch": 6432} {"train_loss": -27.672958374023438, "global_step": 533881, "epoch": 6432} {"train_loss": -27.2886905670166, "global_step": 533882, "epoch": 6432} {"train_loss": -27.896072387695312, "global_step": 533883, "epoch": 6432} {"train_loss": -27.55830955505371, "global_step": 533884, "epoch": 6432} {"train_loss": -27.55856704711914, "global_step": 533885, "epoch": 6432} {"train_loss": -27.56281852722168, "global_step": 533886, "epoch": 6432} {"train_loss": -27.598913192749023, "global_step": 533887, "epoch": 6432} {"train_loss": -27.6204833984375, "global_step": 533888, "epoch": 6432} {"train_loss": -27.575305938720703, "global_step": 533889, "epoch": 6432} {"train_loss": -27.79522705078125, "global_step": 533890, "epoch": 6432} {"train_loss": -27.716501235961914, "global_step": 533891, "epoch": 6432} {"train_loss": -27.642786026000977, "global_step": 533892, "epoch": 6432} {"train_loss": -27.730010986328125, "global_step": 533893, "epoch": 6432} {"train_loss": -27.84122657775879, "global_step": 533894, "epoch": 6432} {"train_loss": -27.75543212890625, "global_step": 533895, "epoch": 6432} {"train_loss": -27.822677612304688, "global_step": 533896, "epoch": 6432} {"train_loss": -27.705678939819336, "global_step": 533897, "epoch": 6432} {"train_loss": -27.699878692626953, "global_step": 533898, "epoch": 6432} {"train_loss": -27.780059814453125, "global_step": 533899, "epoch": 6432} {"train_loss": -27.281696319580078, "global_step": 533900, "epoch": 6432} {"train_loss": -27.30356788635254, "global_step": 533901, "epoch": 6432} {"train_loss": -27.55816650390625, "global_step": 533902, "epoch": 6432} {"train_loss": -27.693891525268555, "global_step": 533903, "epoch": 6432} {"train_loss": -27.482715606689453, "global_step": 533904, "epoch": 6432} {"train_loss": -27.844213485717773, "global_step": 533905, "epoch": 6432} {"train_loss": -27.848745346069336, "global_step": 533906, "epoch": 6432} {"train_loss": -27.816940307617188, "global_step": 533907, "epoch": 6432} {"train_loss": -27.11403465270996, "global_step": 533908, "epoch": 6432} {"train_loss": -27.696802139282227, "global_step": 533909, "epoch": 6432} {"train_loss": -27.445255279541016, "global_step": 533910, "epoch": 6432} {"train_loss": -27.632583618164062, "global_step": 533911, "epoch": 6432} {"train_loss": -27.54107093811035, "global_step": 533912, "epoch": 6432} {"train_loss": -28.046789169311523, "global_step": 533913, "epoch": 6432} {"train_loss": -27.439624786376953, "global_step": 533914, "epoch": 6432} {"train_loss": -27.09650230407715, "global_step": 533915, "epoch": 6432} {"train_loss": -27.2929630279541, "global_step": 533916, "epoch": 6432} {"train_loss": -27.41343116760254, "global_step": 533917, "epoch": 6432} {"train_loss": -27.491357803344727, "global_step": 533918, "epoch": 6432} {"train_loss": -27.47670555114746, "global_step": 533919, "epoch": 6432} {"train_loss": -27.418689727783203, "global_step": 533920, "epoch": 6432} {"train_loss": -27.376447677612305, "global_step": 533921, "epoch": 6432} {"train_loss": -27.379240036010742, "global_step": 533922, "epoch": 6432} {"train_loss": -27.311750411987305, "global_step": 533923, "epoch": 6432} {"train_loss": -27.928476333618164, "global_step": 533924, "epoch": 6432} {"train_loss": -27.535749435424805, "global_step": 533925, "epoch": 6432} {"train_loss": -26.833459854125977, "global_step": 533926, "epoch": 6432} {"train_loss": -27.332305908203125, "global_step": 533927, "epoch": 6432} {"train_loss": -27.897205352783203, "global_step": 533928, "epoch": 6432} {"train_loss": -27.23663330078125, "global_step": 533929, "epoch": 6432} {"train_loss": -27.481393814086914, "global_step": 533930, "epoch": 6432} {"train_loss": -27.56129264831543, "global_step": 533931, "epoch": 6432} {"train_loss": -27.520339965820312, "global_step": 533932, "epoch": 6432} {"train_loss": -27.17268180847168, "global_step": 533933, "epoch": 6432} {"train_loss": -27.747604370117188, "global_step": 533934, "epoch": 6432} {"train_loss": -27.51775550842285, "global_step": 533935, "epoch": 6432} {"train_loss": -27.44874382019043, "global_step": 533936, "epoch": 6432} {"train_loss": -27.786579132080078, "global_step": 533937, "epoch": 6432} {"train_loss": -27.46176774817777, "global_step": 533938, "epoch": 6432, "val_loss": 6562049.0} {"train_loss": -27.526647567749023, "global_step": 533939, "epoch": 6433} {"train_loss": -27.20599365234375, "global_step": 533940, "epoch": 6433} {"train_loss": -27.680898666381836, "global_step": 533941, "epoch": 6433} {"train_loss": -27.349836349487305, "global_step": 533942, "epoch": 6433} {"train_loss": -27.422956466674805, "global_step": 533943, "epoch": 6433} {"train_loss": -27.65523338317871, "global_step": 533944, "epoch": 6433} {"train_loss": -27.339496612548828, "global_step": 533945, "epoch": 6433} {"train_loss": -27.04481315612793, "global_step": 533946, "epoch": 6433} {"train_loss": -27.690229415893555, "global_step": 533947, "epoch": 6433} {"train_loss": -27.485578536987305, "global_step": 533948, "epoch": 6433} {"train_loss": -27.455032348632812, "global_step": 533949, "epoch": 6433} {"train_loss": -27.317777633666992, "global_step": 533950, "epoch": 6433} {"train_loss": -27.294940948486328, "global_step": 533951, "epoch": 6433} {"train_loss": -27.86895751953125, "global_step": 533952, "epoch": 6433} {"train_loss": -27.20065689086914, "global_step": 533953, "epoch": 6433} {"train_loss": -27.467260360717773, "global_step": 533954, "epoch": 6433} {"train_loss": -27.330652236938477, "global_step": 533955, "epoch": 6433} {"train_loss": -27.276243209838867, "global_step": 533956, "epoch": 6433} {"train_loss": -27.70765495300293, "global_step": 533957, "epoch": 6433} {"train_loss": -27.460538864135742, "global_step": 533958, "epoch": 6433} {"train_loss": -27.765625, "global_step": 533959, "epoch": 6433} {"train_loss": -27.598058700561523, "global_step": 533960, "epoch": 6433} {"train_loss": -27.35713768005371, "global_step": 533961, "epoch": 6433} {"train_loss": -27.70694351196289, "global_step": 533962, "epoch": 6433} {"train_loss": -27.432050704956055, "global_step": 533963, "epoch": 6433} {"train_loss": -27.394445419311523, "global_step": 533964, "epoch": 6433} {"train_loss": -27.932636260986328, "global_step": 533965, "epoch": 6433} {"train_loss": -27.3570556640625, "global_step": 533966, "epoch": 6433} {"train_loss": -27.543302536010742, "global_step": 533967, "epoch": 6433} {"train_loss": -27.706323623657227, "global_step": 533968, "epoch": 6433} {"train_loss": -27.232227325439453, "global_step": 533969, "epoch": 6433} {"train_loss": -27.71331787109375, "global_step": 533970, "epoch": 6433} {"train_loss": -27.04144287109375, "global_step": 533971, "epoch": 6433} {"train_loss": -27.681385040283203, "global_step": 533972, "epoch": 6433} {"train_loss": -27.485538482666016, "global_step": 533973, "epoch": 6433} {"train_loss": -27.48923683166504, "global_step": 533974, "epoch": 6433} {"train_loss": -27.7966251373291, "global_step": 533975, "epoch": 6433} {"train_loss": -27.421234130859375, "global_step": 533976, "epoch": 6433} {"train_loss": -27.968460083007812, "global_step": 533977, "epoch": 6433} {"train_loss": -27.360971450805664, "global_step": 533978, "epoch": 6433} {"train_loss": -27.885913848876953, "global_step": 533979, "epoch": 6433} {"train_loss": -27.808368682861328, "global_step": 533980, "epoch": 6433} {"train_loss": -27.625106811523438, "global_step": 533981, "epoch": 6433} {"train_loss": -27.689838409423828, "global_step": 533982, "epoch": 6433} {"train_loss": -27.85968589782715, "global_step": 533983, "epoch": 6433} {"train_loss": -27.668176651000977, "global_step": 533984, "epoch": 6433} {"train_loss": -27.4493408203125, "global_step": 533985, "epoch": 6433} {"train_loss": -27.84332275390625, "global_step": 533986, "epoch": 6433} {"train_loss": -27.558155059814453, "global_step": 533987, "epoch": 6433} {"train_loss": -27.69166374206543, "global_step": 533988, "epoch": 6433} {"train_loss": -27.923416137695312, "global_step": 533989, "epoch": 6433} {"train_loss": -27.3602237701416, "global_step": 533990, "epoch": 6433} {"train_loss": -27.98345375061035, "global_step": 533991, "epoch": 6433} {"train_loss": -27.860525131225586, "global_step": 533992, "epoch": 6433} {"train_loss": -27.86116600036621, "global_step": 533993, "epoch": 6433} {"train_loss": -27.1854305267334, "global_step": 533994, "epoch": 6433} {"train_loss": -27.405725479125977, "global_step": 533995, "epoch": 6433} {"train_loss": -27.279571533203125, "global_step": 533996, "epoch": 6433} {"train_loss": -27.636611938476562, "global_step": 533997, "epoch": 6433} {"train_loss": -27.45692253112793, "global_step": 533998, "epoch": 6433} {"train_loss": -27.561100006103516, "global_step": 533999, "epoch": 6433} {"train_loss": -27.739673614501953, "global_step": 534000, "epoch": 6433} {"train_loss": -27.692651748657227, "global_step": 534001, "epoch": 6433} {"train_loss": -27.787841796875, "global_step": 534002, "epoch": 6433} {"train_loss": -27.4959774017334, "global_step": 534003, "epoch": 6433} {"train_loss": -27.509496688842773, "global_step": 534004, "epoch": 6433} {"train_loss": -27.70608901977539, "global_step": 534005, "epoch": 6433} {"train_loss": -27.974679946899414, "global_step": 534006, "epoch": 6433} {"train_loss": -27.718524932861328, "global_step": 534007, "epoch": 6433} {"train_loss": -28.092145919799805, "global_step": 534008, "epoch": 6433} {"train_loss": -27.675159454345703, "global_step": 534009, "epoch": 6433} {"train_loss": -27.481897354125977, "global_step": 534010, "epoch": 6433} {"train_loss": -27.618982315063477, "global_step": 534011, "epoch": 6433} {"train_loss": -27.863922119140625, "global_step": 534012, "epoch": 6433} {"train_loss": -27.46919059753418, "global_step": 534013, "epoch": 6433} {"train_loss": -27.713125228881836, "global_step": 534014, "epoch": 6433} {"train_loss": -27.751134872436523, "global_step": 534015, "epoch": 6433} {"train_loss": -27.870513916015625, "global_step": 534016, "epoch": 6433} {"train_loss": -27.607797622680664, "global_step": 534017, "epoch": 6433} {"train_loss": -27.551746368408203, "global_step": 534018, "epoch": 6433} {"train_loss": -27.31648826599121, "global_step": 534019, "epoch": 6433} {"train_loss": -27.080047607421875, "global_step": 534020, "epoch": 6433} {"train_loss": -27.57007787313806, "global_step": 534021, "epoch": 6433, "val_loss": 6503516.0} {"train_loss": -24.38478660583496, "global_step": 534022, "epoch": 6434} {"train_loss": -23.69422721862793, "global_step": 534023, "epoch": 6434} {"train_loss": -26.56963539123535, "global_step": 534024, "epoch": 6434} {"train_loss": -25.710607528686523, "global_step": 534025, "epoch": 6434} {"train_loss": -25.933629989624023, "global_step": 534026, "epoch": 6434} {"train_loss": -26.12039566040039, "global_step": 534027, "epoch": 6434} {"train_loss": -26.43438720703125, "global_step": 534028, "epoch": 6434} {"train_loss": -26.060773849487305, "global_step": 534029, "epoch": 6434} {"train_loss": -26.842987060546875, "global_step": 534030, "epoch": 6434} {"train_loss": -26.094755172729492, "global_step": 534031, "epoch": 6434} {"train_loss": -26.495763778686523, "global_step": 534032, "epoch": 6434} {"train_loss": -26.344161987304688, "global_step": 534033, "epoch": 6434} {"train_loss": -26.23099136352539, "global_step": 534034, "epoch": 6434} {"train_loss": -26.805469512939453, "global_step": 534035, "epoch": 6434} {"train_loss": -26.32158851623535, "global_step": 534036, "epoch": 6434} {"train_loss": -26.747739791870117, "global_step": 534037, "epoch": 6434} {"train_loss": -26.832456588745117, "global_step": 534038, "epoch": 6434} {"train_loss": -26.530139923095703, "global_step": 534039, "epoch": 6434} {"train_loss": -26.77914810180664, "global_step": 534040, "epoch": 6434} {"train_loss": -27.209980010986328, "global_step": 534041, "epoch": 6434} {"train_loss": -26.86818504333496, "global_step": 534042, "epoch": 6434} {"train_loss": -27.011520385742188, "global_step": 534043, "epoch": 6434} {"train_loss": -27.07757568359375, "global_step": 534044, "epoch": 6434} {"train_loss": -27.12749671936035, "global_step": 534045, "epoch": 6434} {"train_loss": -26.887720108032227, "global_step": 534046, "epoch": 6434} {"train_loss": -27.1270694732666, "global_step": 534047, "epoch": 6434} {"train_loss": -26.97833824157715, "global_step": 534048, "epoch": 6434} {"train_loss": -26.953388214111328, "global_step": 534049, "epoch": 6434} {"train_loss": -27.187814712524414, "global_step": 534050, "epoch": 6434} {"train_loss": -27.429431915283203, "global_step": 534051, "epoch": 6434} {"train_loss": -26.9445743560791, "global_step": 534052, "epoch": 6434} {"train_loss": -27.327716827392578, "global_step": 534053, "epoch": 6434} {"train_loss": -27.1700382232666, "global_step": 534054, "epoch": 6434} {"train_loss": -27.57419204711914, "global_step": 534055, "epoch": 6434} {"train_loss": -27.169178009033203, "global_step": 534056, "epoch": 6434} {"train_loss": -27.678823471069336, "global_step": 534057, "epoch": 6434} {"train_loss": -27.4199275970459, "global_step": 534058, "epoch": 6434} {"train_loss": -27.215106964111328, "global_step": 534059, "epoch": 6434} {"train_loss": -27.746984481811523, "global_step": 534060, "epoch": 6434} {"train_loss": -27.648496627807617, "global_step": 534061, "epoch": 6434} {"train_loss": -27.213581085205078, "global_step": 534062, "epoch": 6434} {"train_loss": -27.657514572143555, "global_step": 534063, "epoch": 6434} {"train_loss": -27.691879272460938, "global_step": 534064, "epoch": 6434} {"train_loss": -27.217721939086914, "global_step": 534065, "epoch": 6434} {"train_loss": -27.737096786499023, "global_step": 534066, "epoch": 6434} {"train_loss": -27.974340438842773, "global_step": 534067, "epoch": 6434} {"train_loss": -27.682416915893555, "global_step": 534068, "epoch": 6434} {"train_loss": -27.58539390563965, "global_step": 534069, "epoch": 6434} {"train_loss": -27.907794952392578, "global_step": 534070, "epoch": 6434} {"train_loss": -27.895965576171875, "global_step": 534071, "epoch": 6434} {"train_loss": -28.2408504486084, "global_step": 534072, "epoch": 6434} {"train_loss": -27.478946685791016, "global_step": 534073, "epoch": 6434} {"train_loss": -27.868276596069336, "global_step": 534074, "epoch": 6434} {"train_loss": -27.867414474487305, "global_step": 534075, "epoch": 6434} {"train_loss": -27.682220458984375, "global_step": 534076, "epoch": 6434} {"train_loss": -27.80132484436035, "global_step": 534077, "epoch": 6434} {"train_loss": -27.745737075805664, "global_step": 534078, "epoch": 6434} {"train_loss": -27.7730712890625, "global_step": 534079, "epoch": 6434} {"train_loss": -27.61004638671875, "global_step": 534080, "epoch": 6434} {"train_loss": -27.77748680114746, "global_step": 534081, "epoch": 6434} {"train_loss": -27.759748458862305, "global_step": 534082, "epoch": 6434} {"train_loss": -27.422042846679688, "global_step": 534083, "epoch": 6434} {"train_loss": -27.486988067626953, "global_step": 534084, "epoch": 6434} {"train_loss": -27.7796688079834, "global_step": 534085, "epoch": 6434} {"train_loss": -27.879074096679688, "global_step": 534086, "epoch": 6434} {"train_loss": -27.809350967407227, "global_step": 534087, "epoch": 6434} {"train_loss": -27.61971092224121, "global_step": 534088, "epoch": 6434} {"train_loss": -27.578693389892578, "global_step": 534089, "epoch": 6434} {"train_loss": -27.47357177734375, "global_step": 534090, "epoch": 6434} {"train_loss": -27.556238174438477, "global_step": 534091, "epoch": 6434} {"train_loss": -27.67685890197754, "global_step": 534092, "epoch": 6434} {"train_loss": -27.858448028564453, "global_step": 534093, "epoch": 6434} {"train_loss": -27.89805030822754, "global_step": 534094, "epoch": 6434} {"train_loss": -27.973859786987305, "global_step": 534095, "epoch": 6434} {"train_loss": -27.585779190063477, "global_step": 534096, "epoch": 6434} {"train_loss": -27.652013778686523, "global_step": 534097, "epoch": 6434} {"train_loss": -27.674365997314453, "global_step": 534098, "epoch": 6434} {"train_loss": -27.7080020904541, "global_step": 534099, "epoch": 6434} {"train_loss": -27.705808639526367, "global_step": 534100, "epoch": 6434} {"train_loss": -27.668859481811523, "global_step": 534101, "epoch": 6434} {"train_loss": -27.59556007385254, "global_step": 534102, "epoch": 6434} {"train_loss": -27.83180046081543, "global_step": 534103, "epoch": 6434} {"train_loss": -27.200529236391365, "global_step": 534104, "epoch": 6434, "val_loss": 6552935.5} {"train_loss": -27.426427841186523, "global_step": 534105, "epoch": 6435} {"train_loss": -27.30777359008789, "global_step": 534106, "epoch": 6435} {"train_loss": -27.678747177124023, "global_step": 534107, "epoch": 6435} {"train_loss": -27.568267822265625, "global_step": 534108, "epoch": 6435} {"train_loss": -26.985132217407227, "global_step": 534109, "epoch": 6435} {"train_loss": -26.95374870300293, "global_step": 534110, "epoch": 6435} {"train_loss": -27.3859920501709, "global_step": 534111, "epoch": 6435} {"train_loss": -26.865514755249023, "global_step": 534112, "epoch": 6435} {"train_loss": -27.1251163482666, "global_step": 534113, "epoch": 6435} {"train_loss": -26.549604415893555, "global_step": 534114, "epoch": 6435} {"train_loss": -26.6221923828125, "global_step": 534115, "epoch": 6435} {"train_loss": -26.852497100830078, "global_step": 534116, "epoch": 6435} {"train_loss": -27.36353874206543, "global_step": 534117, "epoch": 6435} {"train_loss": -27.095617294311523, "global_step": 534118, "epoch": 6435} {"train_loss": -27.18292236328125, "global_step": 534119, "epoch": 6435} {"train_loss": -27.27520751953125, "global_step": 534120, "epoch": 6435} {"train_loss": -27.10418128967285, "global_step": 534121, "epoch": 6435} {"train_loss": -27.1397647857666, "global_step": 534122, "epoch": 6435} {"train_loss": -27.258197784423828, "global_step": 534123, "epoch": 6435} {"train_loss": -27.155059814453125, "global_step": 534124, "epoch": 6435} {"train_loss": -27.15900993347168, "global_step": 534125, "epoch": 6435} {"train_loss": -27.511571884155273, "global_step": 534126, "epoch": 6435} {"train_loss": -27.345468521118164, "global_step": 534127, "epoch": 6435} {"train_loss": -27.524280548095703, "global_step": 534128, "epoch": 6435} {"train_loss": -27.73345375061035, "global_step": 534129, "epoch": 6435} {"train_loss": -27.415979385375977, "global_step": 534130, "epoch": 6435} {"train_loss": -27.4478759765625, "global_step": 534131, "epoch": 6435} {"train_loss": -27.193161010742188, "global_step": 534132, "epoch": 6435} {"train_loss": -27.792749404907227, "global_step": 534133, "epoch": 6435} {"train_loss": -27.977750778198242, "global_step": 534134, "epoch": 6435} {"train_loss": -27.58633804321289, "global_step": 534135, "epoch": 6435} {"train_loss": -27.345678329467773, "global_step": 534136, "epoch": 6435} {"train_loss": -27.573593139648438, "global_step": 534137, "epoch": 6435} {"train_loss": -27.5379638671875, "global_step": 534138, "epoch": 6435} {"train_loss": -27.500320434570312, "global_step": 534139, "epoch": 6435} {"train_loss": -27.466291427612305, "global_step": 534140, "epoch": 6435} {"train_loss": -27.827295303344727, "global_step": 534141, "epoch": 6435} {"train_loss": -27.655981063842773, "global_step": 534142, "epoch": 6435} {"train_loss": -27.522052764892578, "global_step": 534143, "epoch": 6435} {"train_loss": -27.362262725830078, "global_step": 534144, "epoch": 6435} {"train_loss": -27.58918571472168, "global_step": 534145, "epoch": 6435} {"train_loss": -27.690753936767578, "global_step": 534146, "epoch": 6435} {"train_loss": -27.79229164123535, "global_step": 534147, "epoch": 6435} {"train_loss": -27.4431209564209, "global_step": 534148, "epoch": 6435} {"train_loss": -27.763809204101562, "global_step": 534149, "epoch": 6435} {"train_loss": -27.90500831604004, "global_step": 534150, "epoch": 6435} {"train_loss": -27.710834503173828, "global_step": 534151, "epoch": 6435} {"train_loss": -27.78388786315918, "global_step": 534152, "epoch": 6435} {"train_loss": -27.7570858001709, "global_step": 534153, "epoch": 6435} {"train_loss": -27.983190536499023, "global_step": 534154, "epoch": 6435} {"train_loss": -27.60392189025879, "global_step": 534155, "epoch": 6435} {"train_loss": -27.7497615814209, "global_step": 534156, "epoch": 6435} {"train_loss": -27.660871505737305, "global_step": 534157, "epoch": 6435} {"train_loss": -27.96866798400879, "global_step": 534158, "epoch": 6435} {"train_loss": -27.763479232788086, "global_step": 534159, "epoch": 6435} {"train_loss": -27.738508224487305, "global_step": 534160, "epoch": 6435} {"train_loss": -27.9168701171875, "global_step": 534161, "epoch": 6435} {"train_loss": -27.979711532592773, "global_step": 534162, "epoch": 6435} {"train_loss": -27.604663848876953, "global_step": 534163, "epoch": 6435} {"train_loss": -27.5900821685791, "global_step": 534164, "epoch": 6435} {"train_loss": -27.964191436767578, "global_step": 534165, "epoch": 6435} {"train_loss": -27.747827529907227, "global_step": 534166, "epoch": 6435} {"train_loss": -27.726703643798828, "global_step": 534167, "epoch": 6435} {"train_loss": -27.698362350463867, "global_step": 534168, "epoch": 6435} {"train_loss": -27.584976196289062, "global_step": 534169, "epoch": 6435} {"train_loss": -27.799985885620117, "global_step": 534170, "epoch": 6435} {"train_loss": -27.55902099609375, "global_step": 534171, "epoch": 6435} {"train_loss": -28.00385856628418, "global_step": 534172, "epoch": 6435} {"train_loss": -28.075138092041016, "global_step": 534173, "epoch": 6435} {"train_loss": -28.200042724609375, "global_step": 534174, "epoch": 6435} {"train_loss": -27.61929702758789, "global_step": 534175, "epoch": 6435} {"train_loss": -27.847198486328125, "global_step": 534176, "epoch": 6435} {"train_loss": -27.4931697845459, "global_step": 534177, "epoch": 6435} {"train_loss": -27.89777183532715, "global_step": 534178, "epoch": 6435} {"train_loss": -27.896942138671875, "global_step": 534179, "epoch": 6435} {"train_loss": -27.692480087280273, "global_step": 534180, "epoch": 6435} {"train_loss": -27.86264991760254, "global_step": 534181, "epoch": 6435} {"train_loss": -27.653650283813477, "global_step": 534182, "epoch": 6435} {"train_loss": -27.43946647644043, "global_step": 534183, "epoch": 6435} {"train_loss": -27.3028621673584, "global_step": 534184, "epoch": 6435} {"train_loss": -26.748132705688477, "global_step": 534185, "epoch": 6435} {"train_loss": -25.64143180847168, "global_step": 534186, "epoch": 6435} {"train_loss": -27.48860138582896, "global_step": 534187, "epoch": 6435, "val_loss": 6512632.0} {"train_loss": -25.964115142822266, "global_step": 534188, "epoch": 6436} {"train_loss": -26.14259147644043, "global_step": 534189, "epoch": 6436} {"train_loss": -26.422714233398438, "global_step": 534190, "epoch": 6436} {"train_loss": -25.825910568237305, "global_step": 534191, "epoch": 6436} {"train_loss": -26.28360939025879, "global_step": 534192, "epoch": 6436} {"train_loss": -26.52753257751465, "global_step": 534193, "epoch": 6436} {"train_loss": -26.646503448486328, "global_step": 534194, "epoch": 6436} {"train_loss": -26.291645050048828, "global_step": 534195, "epoch": 6436} {"train_loss": -26.876272201538086, "global_step": 534196, "epoch": 6436} {"train_loss": -26.349411010742188, "global_step": 534197, "epoch": 6436} {"train_loss": -26.61138916015625, "global_step": 534198, "epoch": 6436} {"train_loss": -26.917688369750977, "global_step": 534199, "epoch": 6436} {"train_loss": -27.017353057861328, "global_step": 534200, "epoch": 6436} {"train_loss": -27.005640029907227, "global_step": 534201, "epoch": 6436} {"train_loss": -26.77886962890625, "global_step": 534202, "epoch": 6436} {"train_loss": -27.19942283630371, "global_step": 534203, "epoch": 6436} {"train_loss": -27.265411376953125, "global_step": 534204, "epoch": 6436} {"train_loss": -26.901227951049805, "global_step": 534205, "epoch": 6436} {"train_loss": -26.699176788330078, "global_step": 534206, "epoch": 6436} {"train_loss": -27.114511489868164, "global_step": 534207, "epoch": 6436} {"train_loss": -27.449216842651367, "global_step": 534208, "epoch": 6436} {"train_loss": -27.139997482299805, "global_step": 534209, "epoch": 6436} {"train_loss": -27.073719024658203, "global_step": 534210, "epoch": 6436} {"train_loss": -27.119665145874023, "global_step": 534211, "epoch": 6436} {"train_loss": -27.45416259765625, "global_step": 534212, "epoch": 6436} {"train_loss": -27.239795684814453, "global_step": 534213, "epoch": 6436} {"train_loss": -27.002771377563477, "global_step": 534214, "epoch": 6436} {"train_loss": -27.12644386291504, "global_step": 534215, "epoch": 6436} {"train_loss": -27.425567626953125, "global_step": 534216, "epoch": 6436} {"train_loss": -27.3924503326416, "global_step": 534217, "epoch": 6436} {"train_loss": -26.944665908813477, "global_step": 534218, "epoch": 6436} {"train_loss": -27.1517333984375, "global_step": 534219, "epoch": 6436} {"train_loss": -27.35955810546875, "global_step": 534220, "epoch": 6436} {"train_loss": -27.462194442749023, "global_step": 534221, "epoch": 6436} {"train_loss": -27.182409286499023, "global_step": 534222, "epoch": 6436} {"train_loss": -27.307371139526367, "global_step": 534223, "epoch": 6436} {"train_loss": -27.66840934753418, "global_step": 534224, "epoch": 6436} {"train_loss": -27.3426570892334, "global_step": 534225, "epoch": 6436} {"train_loss": -27.327850341796875, "global_step": 534226, "epoch": 6436} {"train_loss": -27.71221923828125, "global_step": 534227, "epoch": 6436} {"train_loss": -27.68253517150879, "global_step": 534228, "epoch": 6436} {"train_loss": -27.378015518188477, "global_step": 534229, "epoch": 6436} {"train_loss": -27.358346939086914, "global_step": 534230, "epoch": 6436} {"train_loss": -27.868505477905273, "global_step": 534231, "epoch": 6436} {"train_loss": -27.4658145904541, "global_step": 534232, "epoch": 6436} {"train_loss": -27.903303146362305, "global_step": 534233, "epoch": 6436} {"train_loss": -27.93320655822754, "global_step": 534234, "epoch": 6436} {"train_loss": -27.723196029663086, "global_step": 534235, "epoch": 6436} {"train_loss": -27.840185165405273, "global_step": 534236, "epoch": 6436} {"train_loss": -28.101831436157227, "global_step": 534237, "epoch": 6436} {"train_loss": -27.973804473876953, "global_step": 534238, "epoch": 6436} {"train_loss": -27.500476837158203, "global_step": 534239, "epoch": 6436} {"train_loss": -27.97772216796875, "global_step": 534240, "epoch": 6436} {"train_loss": -27.423070907592773, "global_step": 534241, "epoch": 6436} {"train_loss": -27.61370277404785, "global_step": 534242, "epoch": 6436} {"train_loss": -27.72466468811035, "global_step": 534243, "epoch": 6436} {"train_loss": -27.50543785095215, "global_step": 534244, "epoch": 6436} {"train_loss": -27.811193466186523, "global_step": 534245, "epoch": 6436} {"train_loss": -28.13629150390625, "global_step": 534246, "epoch": 6436} {"train_loss": -27.973657608032227, "global_step": 534247, "epoch": 6436} {"train_loss": -27.31731605529785, "global_step": 534248, "epoch": 6436} {"train_loss": -28.025033950805664, "global_step": 534249, "epoch": 6436} {"train_loss": -27.762165069580078, "global_step": 534250, "epoch": 6436} {"train_loss": -27.54755973815918, "global_step": 534251, "epoch": 6436} {"train_loss": -27.8511962890625, "global_step": 534252, "epoch": 6436} {"train_loss": -27.79799461364746, "global_step": 534253, "epoch": 6436} {"train_loss": -27.721601486206055, "global_step": 534254, "epoch": 6436} {"train_loss": -28.02497673034668, "global_step": 534255, "epoch": 6436} {"train_loss": -27.867938995361328, "global_step": 534256, "epoch": 6436} {"train_loss": -27.505414962768555, "global_step": 534257, "epoch": 6436} {"train_loss": -27.10369873046875, "global_step": 534258, "epoch": 6436} {"train_loss": -27.308652877807617, "global_step": 534259, "epoch": 6436} {"train_loss": -26.76291275024414, "global_step": 534260, "epoch": 6436} {"train_loss": -26.311365127563477, "global_step": 534261, "epoch": 6436} {"train_loss": -27.15484046936035, "global_step": 534262, "epoch": 6436} {"train_loss": -27.336959838867188, "global_step": 534263, "epoch": 6436} {"train_loss": -27.270700454711914, "global_step": 534264, "epoch": 6436} {"train_loss": -27.491575241088867, "global_step": 534265, "epoch": 6436} {"train_loss": -27.382795333862305, "global_step": 534266, "epoch": 6436} {"train_loss": -27.827960968017578, "global_step": 534267, "epoch": 6436} {"train_loss": -26.95623779296875, "global_step": 534268, "epoch": 6436} {"train_loss": -27.565099716186523, "global_step": 534269, "epoch": 6436} {"train_loss": -27.293324137308513, "global_step": 534270, "epoch": 6436, "val_loss": 6551631.0} {"train_loss": -27.08436393737793, "global_step": 534271, "epoch": 6437} {"train_loss": -26.88128662109375, "global_step": 534272, "epoch": 6437} {"train_loss": -26.529205322265625, "global_step": 534273, "epoch": 6437} {"train_loss": -26.654172897338867, "global_step": 534274, "epoch": 6437} {"train_loss": -27.033111572265625, "global_step": 534275, "epoch": 6437} {"train_loss": -26.96186637878418, "global_step": 534276, "epoch": 6437} {"train_loss": -26.971942901611328, "global_step": 534277, "epoch": 6437} {"train_loss": -27.140613555908203, "global_step": 534278, "epoch": 6437} {"train_loss": -27.436599731445312, "global_step": 534279, "epoch": 6437} {"train_loss": -27.3972225189209, "global_step": 534280, "epoch": 6437} {"train_loss": -27.076807022094727, "global_step": 534281, "epoch": 6437} {"train_loss": -27.328937530517578, "global_step": 534282, "epoch": 6437} {"train_loss": -27.10406494140625, "global_step": 534283, "epoch": 6437} {"train_loss": -27.185916900634766, "global_step": 534284, "epoch": 6437} {"train_loss": -27.352985382080078, "global_step": 534285, "epoch": 6437} {"train_loss": -27.5211238861084, "global_step": 534286, "epoch": 6437} {"train_loss": -27.1412410736084, "global_step": 534287, "epoch": 6437} {"train_loss": -27.421783447265625, "global_step": 534288, "epoch": 6437} {"train_loss": -27.192066192626953, "global_step": 534289, "epoch": 6437} {"train_loss": -27.116443634033203, "global_step": 534290, "epoch": 6437} {"train_loss": -27.667081832885742, "global_step": 534291, "epoch": 6437} {"train_loss": -27.298303604125977, "global_step": 534292, "epoch": 6437} {"train_loss": -27.38844108581543, "global_step": 534293, "epoch": 6437} {"train_loss": -27.850927352905273, "global_step": 534294, "epoch": 6437} {"train_loss": -27.693506240844727, "global_step": 534295, "epoch": 6437} {"train_loss": -27.545642852783203, "global_step": 534296, "epoch": 6437} {"train_loss": -27.62904167175293, "global_step": 534297, "epoch": 6437} {"train_loss": -27.881549835205078, "global_step": 534298, "epoch": 6437} {"train_loss": -27.764633178710938, "global_step": 534299, "epoch": 6437} {"train_loss": -27.7991943359375, "global_step": 534300, "epoch": 6437} {"train_loss": -27.57158851623535, "global_step": 534301, "epoch": 6437} {"train_loss": -27.7828311920166, "global_step": 534302, "epoch": 6437} {"train_loss": -27.857328414916992, "global_step": 534303, "epoch": 6437} {"train_loss": -27.771589279174805, "global_step": 534304, "epoch": 6437} {"train_loss": -27.550342559814453, "global_step": 534305, "epoch": 6437} {"train_loss": -27.36056900024414, "global_step": 534306, "epoch": 6437} {"train_loss": -27.567249298095703, "global_step": 534307, "epoch": 6437} {"train_loss": -27.754730224609375, "global_step": 534308, "epoch": 6437} {"train_loss": -27.606393814086914, "global_step": 534309, "epoch": 6437} {"train_loss": -27.525693893432617, "global_step": 534310, "epoch": 6437} {"train_loss": -27.796283721923828, "global_step": 534311, "epoch": 6437} {"train_loss": -28.000585556030273, "global_step": 534312, "epoch": 6437} {"train_loss": -27.599206924438477, "global_step": 534313, "epoch": 6437} {"train_loss": -27.63932228088379, "global_step": 534314, "epoch": 6437} {"train_loss": -27.62098503112793, "global_step": 534315, "epoch": 6437} {"train_loss": -27.78144645690918, "global_step": 534316, "epoch": 6437} {"train_loss": -27.6101131439209, "global_step": 534317, "epoch": 6437} {"train_loss": -27.862852096557617, "global_step": 534318, "epoch": 6437} {"train_loss": -27.669052124023438, "global_step": 534319, "epoch": 6437} {"train_loss": -27.98126220703125, "global_step": 534320, "epoch": 6437} {"train_loss": -27.8017635345459, "global_step": 534321, "epoch": 6437} {"train_loss": -27.59284019470215, "global_step": 534322, "epoch": 6437} {"train_loss": -27.99125099182129, "global_step": 534323, "epoch": 6437} {"train_loss": -27.647871017456055, "global_step": 534324, "epoch": 6437} {"train_loss": -27.566259384155273, "global_step": 534325, "epoch": 6437} {"train_loss": -27.281234741210938, "global_step": 534326, "epoch": 6437} {"train_loss": -27.392873764038086, "global_step": 534327, "epoch": 6437} {"train_loss": -27.1097354888916, "global_step": 534328, "epoch": 6437} {"train_loss": -27.20631980895996, "global_step": 534329, "epoch": 6437} {"train_loss": -27.606525421142578, "global_step": 534330, "epoch": 6437} {"train_loss": -27.953577041625977, "global_step": 534331, "epoch": 6437} {"train_loss": -27.950719833374023, "global_step": 534332, "epoch": 6437} {"train_loss": -27.778329849243164, "global_step": 534333, "epoch": 6437} {"train_loss": -27.64328384399414, "global_step": 534334, "epoch": 6437} {"train_loss": -27.850446701049805, "global_step": 534335, "epoch": 6437} {"train_loss": -27.76746940612793, "global_step": 534336, "epoch": 6437} {"train_loss": -27.66790771484375, "global_step": 534337, "epoch": 6437} {"train_loss": -27.75971794128418, "global_step": 534338, "epoch": 6437} {"train_loss": -27.734777450561523, "global_step": 534339, "epoch": 6437} {"train_loss": -27.676349639892578, "global_step": 534340, "epoch": 6437} {"train_loss": -28.061315536499023, "global_step": 534341, "epoch": 6437} {"train_loss": -27.70900535583496, "global_step": 534342, "epoch": 6437} {"train_loss": -27.7857666015625, "global_step": 534343, "epoch": 6437} {"train_loss": -27.462329864501953, "global_step": 534344, "epoch": 6437} {"train_loss": -27.748205184936523, "global_step": 534345, "epoch": 6437} {"train_loss": -27.7598876953125, "global_step": 534346, "epoch": 6437} {"train_loss": -27.677534103393555, "global_step": 534347, "epoch": 6437} {"train_loss": -27.107955932617188, "global_step": 534348, "epoch": 6437} {"train_loss": -27.17145347595215, "global_step": 534349, "epoch": 6437} {"train_loss": -27.154142379760742, "global_step": 534350, "epoch": 6437} {"train_loss": -27.265043258666992, "global_step": 534351, "epoch": 6437} {"train_loss": -28.230741500854492, "global_step": 534352, "epoch": 6437} {"train_loss": -27.532123312892683, "global_step": 534353, "epoch": 6437, "val_loss": 6540668.5} {"train_loss": -27.379602432250977, "global_step": 534354, "epoch": 6438} {"train_loss": -26.890310287475586, "global_step": 534355, "epoch": 6438} {"train_loss": -27.25129508972168, "global_step": 534356, "epoch": 6438} {"train_loss": -26.933002471923828, "global_step": 534357, "epoch": 6438} {"train_loss": -26.88210105895996, "global_step": 534358, "epoch": 6438} {"train_loss": -27.341779708862305, "global_step": 534359, "epoch": 6438} {"train_loss": -27.162405014038086, "global_step": 534360, "epoch": 6438} {"train_loss": -27.427871704101562, "global_step": 534361, "epoch": 6438} {"train_loss": -26.888080596923828, "global_step": 534362, "epoch": 6438} {"train_loss": -26.501834869384766, "global_step": 534363, "epoch": 6438} {"train_loss": -27.058801651000977, "global_step": 534364, "epoch": 6438} {"train_loss": -27.16864013671875, "global_step": 534365, "epoch": 6438} {"train_loss": -27.0347957611084, "global_step": 534366, "epoch": 6438} {"train_loss": -27.21600914001465, "global_step": 534367, "epoch": 6438} {"train_loss": -26.975549697875977, "global_step": 534368, "epoch": 6438} {"train_loss": -27.142648696899414, "global_step": 534369, "epoch": 6438} {"train_loss": -27.37912368774414, "global_step": 534370, "epoch": 6438} {"train_loss": -26.980810165405273, "global_step": 534371, "epoch": 6438} {"train_loss": -27.4268798828125, "global_step": 534372, "epoch": 6438} {"train_loss": -27.377426147460938, "global_step": 534373, "epoch": 6438} {"train_loss": -27.05377769470215, "global_step": 534374, "epoch": 6438} {"train_loss": -26.929092407226562, "global_step": 534375, "epoch": 6438} {"train_loss": -27.110280990600586, "global_step": 534376, "epoch": 6438} {"train_loss": -27.52324867248535, "global_step": 534377, "epoch": 6438} {"train_loss": -27.340795516967773, "global_step": 534378, "epoch": 6438} {"train_loss": -26.9564151763916, "global_step": 534379, "epoch": 6438} {"train_loss": -27.241809844970703, "global_step": 534380, "epoch": 6438} {"train_loss": -27.42380714416504, "global_step": 534381, "epoch": 6438} {"train_loss": -27.543811798095703, "global_step": 534382, "epoch": 6438} {"train_loss": -27.439666748046875, "global_step": 534383, "epoch": 6438} {"train_loss": -27.226972579956055, "global_step": 534384, "epoch": 6438} {"train_loss": -27.826932907104492, "global_step": 534385, "epoch": 6438} {"train_loss": -27.34796142578125, "global_step": 534386, "epoch": 6438} {"train_loss": -27.25703239440918, "global_step": 534387, "epoch": 6438} {"train_loss": -27.892847061157227, "global_step": 534388, "epoch": 6438} {"train_loss": -27.753238677978516, "global_step": 534389, "epoch": 6438} {"train_loss": -27.74932289123535, "global_step": 534390, "epoch": 6438} {"train_loss": -27.618820190429688, "global_step": 534391, "epoch": 6438} {"train_loss": -27.784635543823242, "global_step": 534392, "epoch": 6438} {"train_loss": -27.251760482788086, "global_step": 534393, "epoch": 6438} {"train_loss": -27.568115234375, "global_step": 534394, "epoch": 6438} {"train_loss": -27.524442672729492, "global_step": 534395, "epoch": 6438} {"train_loss": -27.28606605529785, "global_step": 534396, "epoch": 6438} {"train_loss": -27.25284767150879, "global_step": 534397, "epoch": 6438} {"train_loss": -27.612695693969727, "global_step": 534398, "epoch": 6438} {"train_loss": -27.79278564453125, "global_step": 534399, "epoch": 6438} {"train_loss": -27.793100357055664, "global_step": 534400, "epoch": 6438} {"train_loss": -27.538537979125977, "global_step": 534401, "epoch": 6438} {"train_loss": -27.42620849609375, "global_step": 534402, "epoch": 6438} {"train_loss": -27.597326278686523, "global_step": 534403, "epoch": 6438} {"train_loss": -27.85235595703125, "global_step": 534404, "epoch": 6438} {"train_loss": -27.45892906188965, "global_step": 534405, "epoch": 6438} {"train_loss": -27.512104034423828, "global_step": 534406, "epoch": 6438} {"train_loss": -27.356388092041016, "global_step": 534407, "epoch": 6438} {"train_loss": -27.45387077331543, "global_step": 534408, "epoch": 6438} {"train_loss": -27.686201095581055, "global_step": 534409, "epoch": 6438} {"train_loss": -27.496850967407227, "global_step": 534410, "epoch": 6438} {"train_loss": -27.92557716369629, "global_step": 534411, "epoch": 6438} {"train_loss": -27.786413192749023, "global_step": 534412, "epoch": 6438} {"train_loss": -27.790674209594727, "global_step": 534413, "epoch": 6438} {"train_loss": -27.592344284057617, "global_step": 534414, "epoch": 6438} {"train_loss": -27.58978271484375, "global_step": 534415, "epoch": 6438} {"train_loss": -27.926435470581055, "global_step": 534416, "epoch": 6438} {"train_loss": -27.716053009033203, "global_step": 534417, "epoch": 6438} {"train_loss": -27.83231544494629, "global_step": 534418, "epoch": 6438} {"train_loss": -27.50269889831543, "global_step": 534419, "epoch": 6438} {"train_loss": -27.25326919555664, "global_step": 534420, "epoch": 6438} {"train_loss": -27.77542495727539, "global_step": 534421, "epoch": 6438} {"train_loss": -27.771331787109375, "global_step": 534422, "epoch": 6438} {"train_loss": -27.583906173706055, "global_step": 534423, "epoch": 6438} {"train_loss": -27.72330093383789, "global_step": 534424, "epoch": 6438} {"train_loss": -27.77969741821289, "global_step": 534425, "epoch": 6438} {"train_loss": -27.766559600830078, "global_step": 534426, "epoch": 6438} {"train_loss": -27.707122802734375, "global_step": 534427, "epoch": 6438} {"train_loss": -27.3354434967041, "global_step": 534428, "epoch": 6438} {"train_loss": -26.909286499023438, "global_step": 534429, "epoch": 6438} {"train_loss": -27.299840927124023, "global_step": 534430, "epoch": 6438} {"train_loss": -27.642566680908203, "global_step": 534431, "epoch": 6438} {"train_loss": -27.164228439331055, "global_step": 534432, "epoch": 6438} {"train_loss": -27.08326530456543, "global_step": 534433, "epoch": 6438} {"train_loss": -27.524860382080078, "global_step": 534434, "epoch": 6438} {"train_loss": -27.53085708618164, "global_step": 534435, "epoch": 6438} {"train_loss": -27.427010501723693, "global_step": 534436, "epoch": 6438, "val_loss": 6581613.0} {"train_loss": -25.926496505737305, "global_step": 534437, "epoch": 6439} {"train_loss": -26.591394424438477, "global_step": 534438, "epoch": 6439} {"train_loss": -26.983762741088867, "global_step": 534439, "epoch": 6439} {"train_loss": -26.226720809936523, "global_step": 534440, "epoch": 6439} {"train_loss": -26.425466537475586, "global_step": 534441, "epoch": 6439} {"train_loss": -27.134845733642578, "global_step": 534442, "epoch": 6439} {"train_loss": -26.0157413482666, "global_step": 534443, "epoch": 6439} {"train_loss": -26.967679977416992, "global_step": 534444, "epoch": 6439} {"train_loss": -26.800275802612305, "global_step": 534445, "epoch": 6439} {"train_loss": -26.69866371154785, "global_step": 534446, "epoch": 6439} {"train_loss": -27.182209014892578, "global_step": 534447, "epoch": 6439} {"train_loss": -26.830259323120117, "global_step": 534448, "epoch": 6439} {"train_loss": -27.418371200561523, "global_step": 534449, "epoch": 6439} {"train_loss": -27.209924697875977, "global_step": 534450, "epoch": 6439} {"train_loss": -27.112323760986328, "global_step": 534451, "epoch": 6439} {"train_loss": -27.15771484375, "global_step": 534452, "epoch": 6439} {"train_loss": -27.45703125, "global_step": 534453, "epoch": 6439} {"train_loss": -27.390466690063477, "global_step": 534454, "epoch": 6439} {"train_loss": -26.9561824798584, "global_step": 534455, "epoch": 6439} {"train_loss": -27.22786521911621, "global_step": 534456, "epoch": 6439} {"train_loss": -27.422473907470703, "global_step": 534457, "epoch": 6439} {"train_loss": -26.972213745117188, "global_step": 534458, "epoch": 6439} {"train_loss": -27.124418258666992, "global_step": 534459, "epoch": 6439} {"train_loss": -26.90732765197754, "global_step": 534460, "epoch": 6439} {"train_loss": -27.690631866455078, "global_step": 534461, "epoch": 6439} {"train_loss": -27.25998306274414, "global_step": 534462, "epoch": 6439} {"train_loss": -27.425189971923828, "global_step": 534463, "epoch": 6439} {"train_loss": -27.40675926208496, "global_step": 534464, "epoch": 6439} {"train_loss": -27.245742797851562, "global_step": 534465, "epoch": 6439} {"train_loss": -27.298315048217773, "global_step": 534466, "epoch": 6439} {"train_loss": -27.499011993408203, "global_step": 534467, "epoch": 6439} {"train_loss": -27.4981632232666, "global_step": 534468, "epoch": 6439} {"train_loss": -27.782499313354492, "global_step": 534469, "epoch": 6439} {"train_loss": -27.689611434936523, "global_step": 534470, "epoch": 6439} {"train_loss": -27.754865646362305, "global_step": 534471, "epoch": 6439} {"train_loss": -27.72883415222168, "global_step": 534472, "epoch": 6439} {"train_loss": -28.0037899017334, "global_step": 534473, "epoch": 6439} {"train_loss": -27.64753532409668, "global_step": 534474, "epoch": 6439} {"train_loss": -27.416431427001953, "global_step": 534475, "epoch": 6439} {"train_loss": -27.68208122253418, "global_step": 534476, "epoch": 6439} {"train_loss": -27.349292755126953, "global_step": 534477, "epoch": 6439} {"train_loss": -27.444660186767578, "global_step": 534478, "epoch": 6439} {"train_loss": -27.770034790039062, "global_step": 534479, "epoch": 6439} {"train_loss": -27.829421997070312, "global_step": 534480, "epoch": 6439} {"train_loss": -27.573257446289062, "global_step": 534481, "epoch": 6439} {"train_loss": -27.59284782409668, "global_step": 534482, "epoch": 6439} {"train_loss": -27.31306266784668, "global_step": 534483, "epoch": 6439} {"train_loss": -27.553144454956055, "global_step": 534484, "epoch": 6439} {"train_loss": -27.835798263549805, "global_step": 534485, "epoch": 6439} {"train_loss": -27.747303009033203, "global_step": 534486, "epoch": 6439} {"train_loss": -27.658161163330078, "global_step": 534487, "epoch": 6439} {"train_loss": -27.966794967651367, "global_step": 534488, "epoch": 6439} {"train_loss": -27.82712173461914, "global_step": 534489, "epoch": 6439} {"train_loss": -27.90167808532715, "global_step": 534490, "epoch": 6439} {"train_loss": -27.39910316467285, "global_step": 534491, "epoch": 6439} {"train_loss": -27.72478675842285, "global_step": 534492, "epoch": 6439} {"train_loss": -27.538562774658203, "global_step": 534493, "epoch": 6439} {"train_loss": -27.92409324645996, "global_step": 534494, "epoch": 6439} {"train_loss": -27.948272705078125, "global_step": 534495, "epoch": 6439} {"train_loss": -27.738672256469727, "global_step": 534496, "epoch": 6439} {"train_loss": -27.7542724609375, "global_step": 534497, "epoch": 6439} {"train_loss": -27.948572158813477, "global_step": 534498, "epoch": 6439} {"train_loss": -28.418127059936523, "global_step": 534499, "epoch": 6439} {"train_loss": -27.759323120117188, "global_step": 534500, "epoch": 6439} {"train_loss": -27.437280654907227, "global_step": 534501, "epoch": 6439} {"train_loss": -26.707294464111328, "global_step": 534502, "epoch": 6439} {"train_loss": -26.5460147857666, "global_step": 534503, "epoch": 6439} {"train_loss": -26.812332153320312, "global_step": 534504, "epoch": 6439} {"train_loss": -27.01796531677246, "global_step": 534505, "epoch": 6439} {"train_loss": -27.69552993774414, "global_step": 534506, "epoch": 6439} {"train_loss": -27.47117042541504, "global_step": 534507, "epoch": 6439} {"train_loss": -27.1693172454834, "global_step": 534508, "epoch": 6439} {"train_loss": -27.49171257019043, "global_step": 534509, "epoch": 6439} {"train_loss": -27.680089950561523, "global_step": 534510, "epoch": 6439} {"train_loss": -27.054243087768555, "global_step": 534511, "epoch": 6439} {"train_loss": -27.32535743713379, "global_step": 534512, "epoch": 6439} {"train_loss": -27.240392684936523, "global_step": 534513, "epoch": 6439} {"train_loss": -26.806751251220703, "global_step": 534514, "epoch": 6439} {"train_loss": -27.277027130126953, "global_step": 534515, "epoch": 6439} {"train_loss": -27.6453857421875, "global_step": 534516, "epoch": 6439} {"train_loss": -27.108251571655273, "global_step": 534517, "epoch": 6439} {"train_loss": -26.818161010742188, "global_step": 534518, "epoch": 6439} {"train_loss": -27.33798008654491, "global_step": 534519, "epoch": 6439, "val_loss": 6657078.0} {"train_loss": -26.803159713745117, "global_step": 534520, "epoch": 6440} {"train_loss": -26.579730987548828, "global_step": 534521, "epoch": 6440} {"train_loss": -26.714941024780273, "global_step": 534522, "epoch": 6440} {"train_loss": -26.989110946655273, "global_step": 534523, "epoch": 6440} {"train_loss": -26.0401611328125, "global_step": 534524, "epoch": 6440} {"train_loss": -27.059967041015625, "global_step": 534525, "epoch": 6440} {"train_loss": -26.03419303894043, "global_step": 534526, "epoch": 6440} {"train_loss": -27.049909591674805, "global_step": 534527, "epoch": 6440} {"train_loss": -26.953857421875, "global_step": 534528, "epoch": 6440} {"train_loss": -26.41973304748535, "global_step": 534529, "epoch": 6440} {"train_loss": -26.977853775024414, "global_step": 534530, "epoch": 6440} {"train_loss": -26.648040771484375, "global_step": 534531, "epoch": 6440} {"train_loss": -27.19880485534668, "global_step": 534532, "epoch": 6440} {"train_loss": -26.563318252563477, "global_step": 534533, "epoch": 6440} {"train_loss": -27.030841827392578, "global_step": 534534, "epoch": 6440} {"train_loss": -27.4894962310791, "global_step": 534535, "epoch": 6440} {"train_loss": -27.192392349243164, "global_step": 534536, "epoch": 6440} {"train_loss": -27.185422897338867, "global_step": 534537, "epoch": 6440} {"train_loss": -27.532794952392578, "global_step": 534538, "epoch": 6440} {"train_loss": -27.268198013305664, "global_step": 534539, "epoch": 6440} {"train_loss": -27.60222816467285, "global_step": 534540, "epoch": 6440} {"train_loss": -27.195953369140625, "global_step": 534541, "epoch": 6440} {"train_loss": -27.274703979492188, "global_step": 534542, "epoch": 6440} {"train_loss": -27.16011619567871, "global_step": 534543, "epoch": 6440} {"train_loss": -27.45380210876465, "global_step": 534544, "epoch": 6440} {"train_loss": -27.606189727783203, "global_step": 534545, "epoch": 6440} {"train_loss": -27.674304962158203, "global_step": 534546, "epoch": 6440} {"train_loss": -27.20928955078125, "global_step": 534547, "epoch": 6440} {"train_loss": -27.859527587890625, "global_step": 534548, "epoch": 6440} {"train_loss": -27.4566593170166, "global_step": 534549, "epoch": 6440} {"train_loss": -27.239078521728516, "global_step": 534550, "epoch": 6440} {"train_loss": -27.559585571289062, "global_step": 534551, "epoch": 6440} {"train_loss": -27.617176055908203, "global_step": 534552, "epoch": 6440} {"train_loss": -27.519794464111328, "global_step": 534553, "epoch": 6440} {"train_loss": -27.706029891967773, "global_step": 534554, "epoch": 6440} {"train_loss": -27.704267501831055, "global_step": 534555, "epoch": 6440} {"train_loss": -27.979154586791992, "global_step": 534556, "epoch": 6440} {"train_loss": -27.91375732421875, "global_step": 534557, "epoch": 6440} {"train_loss": -27.665973663330078, "global_step": 534558, "epoch": 6440} {"train_loss": -27.284137725830078, "global_step": 534559, "epoch": 6440} {"train_loss": -27.83027458190918, "global_step": 534560, "epoch": 6440} {"train_loss": -27.582202911376953, "global_step": 534561, "epoch": 6440} {"train_loss": -27.32512855529785, "global_step": 534562, "epoch": 6440} {"train_loss": -27.542285919189453, "global_step": 534563, "epoch": 6440} {"train_loss": -27.412342071533203, "global_step": 534564, "epoch": 6440} {"train_loss": -27.500463485717773, "global_step": 534565, "epoch": 6440} {"train_loss": -27.68096923828125, "global_step": 534566, "epoch": 6440} {"train_loss": -27.974035263061523, "global_step": 534567, "epoch": 6440} {"train_loss": -28.023025512695312, "global_step": 534568, "epoch": 6440} {"train_loss": -27.738866806030273, "global_step": 534569, "epoch": 6440} {"train_loss": -27.8847713470459, "global_step": 534570, "epoch": 6440} {"train_loss": -27.637832641601562, "global_step": 534571, "epoch": 6440} {"train_loss": -27.191543579101562, "global_step": 534572, "epoch": 6440} {"train_loss": -27.408191680908203, "global_step": 534573, "epoch": 6440} {"train_loss": -27.933347702026367, "global_step": 534574, "epoch": 6440} {"train_loss": -27.89192008972168, "global_step": 534575, "epoch": 6440} {"train_loss": -27.502004623413086, "global_step": 534576, "epoch": 6440} {"train_loss": -27.466415405273438, "global_step": 534577, "epoch": 6440} {"train_loss": -27.651870727539062, "global_step": 534578, "epoch": 6440} {"train_loss": -27.428302764892578, "global_step": 534579, "epoch": 6440} {"train_loss": -27.5754337310791, "global_step": 534580, "epoch": 6440} {"train_loss": -27.38068199157715, "global_step": 534581, "epoch": 6440} {"train_loss": -27.484790802001953, "global_step": 534582, "epoch": 6440} {"train_loss": -27.568161010742188, "global_step": 534583, "epoch": 6440} {"train_loss": -27.332077026367188, "global_step": 534584, "epoch": 6440} {"train_loss": -27.712421417236328, "global_step": 534585, "epoch": 6440} {"train_loss": -27.79969596862793, "global_step": 534586, "epoch": 6440} {"train_loss": -27.718555450439453, "global_step": 534587, "epoch": 6440} {"train_loss": -27.65976905822754, "global_step": 534588, "epoch": 6440} {"train_loss": -27.688343048095703, "global_step": 534589, "epoch": 6440} {"train_loss": -27.776905059814453, "global_step": 534590, "epoch": 6440} {"train_loss": -27.42793083190918, "global_step": 534591, "epoch": 6440} {"train_loss": -27.797178268432617, "global_step": 534592, "epoch": 6440} {"train_loss": -28.034469604492188, "global_step": 534593, "epoch": 6440} {"train_loss": -28.044788360595703, "global_step": 534594, "epoch": 6440} {"train_loss": -27.54917335510254, "global_step": 534595, "epoch": 6440} {"train_loss": -27.8503360748291, "global_step": 534596, "epoch": 6440} {"train_loss": -27.597116470336914, "global_step": 534597, "epoch": 6440} {"train_loss": -27.37813377380371, "global_step": 534598, "epoch": 6440} {"train_loss": -27.49708366394043, "global_step": 534599, "epoch": 6440} {"train_loss": -27.839441299438477, "global_step": 534600, "epoch": 6440} {"train_loss": -27.736408233642578, "global_step": 534601, "epoch": 6440} {"train_loss": -27.415657824780567, "global_step": 534602, "epoch": 6440, "val_loss": 6591155.5} {"train_loss": -26.382186889648438, "global_step": 534603, "epoch": 6441} {"train_loss": -25.177963256835938, "global_step": 534604, "epoch": 6441} {"train_loss": -26.48343276977539, "global_step": 534605, "epoch": 6441} {"train_loss": -26.681171417236328, "global_step": 534606, "epoch": 6441} {"train_loss": -26.038665771484375, "global_step": 534607, "epoch": 6441} {"train_loss": -27.134428024291992, "global_step": 534608, "epoch": 6441} {"train_loss": -26.666351318359375, "global_step": 534609, "epoch": 6441} {"train_loss": -26.580636978149414, "global_step": 534610, "epoch": 6441} {"train_loss": -26.807830810546875, "global_step": 534611, "epoch": 6441} {"train_loss": -26.837650299072266, "global_step": 534612, "epoch": 6441} {"train_loss": -27.179840087890625, "global_step": 534613, "epoch": 6441} {"train_loss": -26.7463321685791, "global_step": 534614, "epoch": 6441} {"train_loss": -27.224933624267578, "global_step": 534615, "epoch": 6441} {"train_loss": -27.114355087280273, "global_step": 534616, "epoch": 6441} {"train_loss": -27.263269424438477, "global_step": 534617, "epoch": 6441} {"train_loss": -27.070392608642578, "global_step": 534618, "epoch": 6441} {"train_loss": -27.129913330078125, "global_step": 534619, "epoch": 6441} {"train_loss": -27.18915367126465, "global_step": 534620, "epoch": 6441} {"train_loss": -27.237995147705078, "global_step": 534621, "epoch": 6441} {"train_loss": -26.8878173828125, "global_step": 534622, "epoch": 6441} {"train_loss": -27.1470890045166, "global_step": 534623, "epoch": 6441} {"train_loss": -27.415048599243164, "global_step": 534624, "epoch": 6441} {"train_loss": -27.33137321472168, "global_step": 534625, "epoch": 6441} {"train_loss": -27.197980880737305, "global_step": 534626, "epoch": 6441} {"train_loss": -27.4139347076416, "global_step": 534627, "epoch": 6441} {"train_loss": -27.742345809936523, "global_step": 534628, "epoch": 6441} {"train_loss": -27.381025314331055, "global_step": 534629, "epoch": 6441} {"train_loss": -27.918848037719727, "global_step": 534630, "epoch": 6441} {"train_loss": -27.615705490112305, "global_step": 534631, "epoch": 6441} {"train_loss": -27.717315673828125, "global_step": 534632, "epoch": 6441} {"train_loss": -27.724206924438477, "global_step": 534633, "epoch": 6441} {"train_loss": -27.565656661987305, "global_step": 534634, "epoch": 6441} {"train_loss": -27.805007934570312, "global_step": 534635, "epoch": 6441} {"train_loss": -27.618915557861328, "global_step": 534636, "epoch": 6441} {"train_loss": -27.530975341796875, "global_step": 534637, "epoch": 6441} {"train_loss": -27.802478790283203, "global_step": 534638, "epoch": 6441} {"train_loss": -28.054874420166016, "global_step": 534639, "epoch": 6441} {"train_loss": -28.19720458984375, "global_step": 534640, "epoch": 6441} {"train_loss": -27.755109786987305, "global_step": 534641, "epoch": 6441} {"train_loss": -27.95685386657715, "global_step": 534642, "epoch": 6441} {"train_loss": -27.529504776000977, "global_step": 534643, "epoch": 6441} {"train_loss": -26.964139938354492, "global_step": 534644, "epoch": 6441} {"train_loss": -27.301578521728516, "global_step": 534645, "epoch": 6441} {"train_loss": -27.49295425415039, "global_step": 534646, "epoch": 6441} {"train_loss": -27.439075469970703, "global_step": 534647, "epoch": 6441} {"train_loss": -27.4169921875, "global_step": 534648, "epoch": 6441} {"train_loss": -27.81831932067871, "global_step": 534649, "epoch": 6441} {"train_loss": -27.42658805847168, "global_step": 534650, "epoch": 6441} {"train_loss": -27.416296005249023, "global_step": 534651, "epoch": 6441} {"train_loss": -27.5056095123291, "global_step": 534652, "epoch": 6441} {"train_loss": -27.911832809448242, "global_step": 534653, "epoch": 6441} {"train_loss": -27.28061866760254, "global_step": 534654, "epoch": 6441} {"train_loss": -27.614492416381836, "global_step": 534655, "epoch": 6441} {"train_loss": -27.968366622924805, "global_step": 534656, "epoch": 6441} {"train_loss": -27.640207290649414, "global_step": 534657, "epoch": 6441} {"train_loss": -27.390396118164062, "global_step": 534658, "epoch": 6441} {"train_loss": -27.666608810424805, "global_step": 534659, "epoch": 6441} {"train_loss": -27.835968017578125, "global_step": 534660, "epoch": 6441} {"train_loss": -27.618139266967773, "global_step": 534661, "epoch": 6441} {"train_loss": -27.860126495361328, "global_step": 534662, "epoch": 6441} {"train_loss": -27.991958618164062, "global_step": 534663, "epoch": 6441} {"train_loss": -27.918527603149414, "global_step": 534664, "epoch": 6441} {"train_loss": -27.427322387695312, "global_step": 534665, "epoch": 6441} {"train_loss": -27.897653579711914, "global_step": 534666, "epoch": 6441} {"train_loss": -28.02469253540039, "global_step": 534667, "epoch": 6441} {"train_loss": -27.901309967041016, "global_step": 534668, "epoch": 6441} {"train_loss": -27.90326499938965, "global_step": 534669, "epoch": 6441} {"train_loss": -27.70033073425293, "global_step": 534670, "epoch": 6441} {"train_loss": -27.72565269470215, "global_step": 534671, "epoch": 6441} {"train_loss": -28.07016372680664, "global_step": 534672, "epoch": 6441} {"train_loss": -27.937896728515625, "global_step": 534673, "epoch": 6441} {"train_loss": -27.468067169189453, "global_step": 534674, "epoch": 6441} {"train_loss": -27.56068229675293, "global_step": 534675, "epoch": 6441} {"train_loss": -27.73944664001465, "global_step": 534676, "epoch": 6441} {"train_loss": -27.464492797851562, "global_step": 534677, "epoch": 6441} {"train_loss": -27.553836822509766, "global_step": 534678, "epoch": 6441} {"train_loss": -27.448486328125, "global_step": 534679, "epoch": 6441} {"train_loss": -27.48969841003418, "global_step": 534680, "epoch": 6441} {"train_loss": -27.339704513549805, "global_step": 534681, "epoch": 6441} {"train_loss": -27.4172306060791, "global_step": 534682, "epoch": 6441} {"train_loss": -27.6035099029541, "global_step": 534683, "epoch": 6441} {"train_loss": -27.57557487487793, "global_step": 534684, "epoch": 6441} {"train_loss": -27.41924285888672, "global_step": 534685, "epoch": 6441, "val_loss": 6612310.0} {"train_loss": -27.079221725463867, "global_step": 534686, "epoch": 6442} {"train_loss": -26.706029891967773, "global_step": 534687, "epoch": 6442} {"train_loss": -26.794574737548828, "global_step": 534688, "epoch": 6442} {"train_loss": -26.8789119720459, "global_step": 534689, "epoch": 6442} {"train_loss": -27.110809326171875, "global_step": 534690, "epoch": 6442} {"train_loss": -26.922183990478516, "global_step": 534691, "epoch": 6442} {"train_loss": -26.787363052368164, "global_step": 534692, "epoch": 6442} {"train_loss": -26.84274673461914, "global_step": 534693, "epoch": 6442} {"train_loss": -27.234052658081055, "global_step": 534694, "epoch": 6442} {"train_loss": -26.517292022705078, "global_step": 534695, "epoch": 6442} {"train_loss": -26.939239501953125, "global_step": 534696, "epoch": 6442} {"train_loss": -27.43916130065918, "global_step": 534697, "epoch": 6442} {"train_loss": -27.205915451049805, "global_step": 534698, "epoch": 6442} {"train_loss": -27.06207275390625, "global_step": 534699, "epoch": 6442} {"train_loss": -26.882795333862305, "global_step": 534700, "epoch": 6442} {"train_loss": -26.94917106628418, "global_step": 534701, "epoch": 6442} {"train_loss": -27.238895416259766, "global_step": 534702, "epoch": 6442} {"train_loss": -27.228546142578125, "global_step": 534703, "epoch": 6442} {"train_loss": -27.412490844726562, "global_step": 534704, "epoch": 6442} {"train_loss": -27.548755645751953, "global_step": 534705, "epoch": 6442} {"train_loss": -27.154096603393555, "global_step": 534706, "epoch": 6442} {"train_loss": -27.20142936706543, "global_step": 534707, "epoch": 6442} {"train_loss": -27.641565322875977, "global_step": 534708, "epoch": 6442} {"train_loss": -27.433408737182617, "global_step": 534709, "epoch": 6442} {"train_loss": -27.769983291625977, "global_step": 534710, "epoch": 6442} {"train_loss": -27.323862075805664, "global_step": 534711, "epoch": 6442} {"train_loss": -27.498456954956055, "global_step": 534712, "epoch": 6442} {"train_loss": -27.410541534423828, "global_step": 534713, "epoch": 6442} {"train_loss": -27.441177368164062, "global_step": 534714, "epoch": 6442} {"train_loss": -27.547988891601562, "global_step": 534715, "epoch": 6442} {"train_loss": -27.151248931884766, "global_step": 534716, "epoch": 6442} {"train_loss": -27.292465209960938, "global_step": 534717, "epoch": 6442} {"train_loss": -27.31574821472168, "global_step": 534718, "epoch": 6442} {"train_loss": -27.618408203125, "global_step": 534719, "epoch": 6442} {"train_loss": -27.74618911743164, "global_step": 534720, "epoch": 6442} {"train_loss": -27.781747817993164, "global_step": 534721, "epoch": 6442} {"train_loss": -27.435245513916016, "global_step": 534722, "epoch": 6442} {"train_loss": -27.805938720703125, "global_step": 534723, "epoch": 6442} {"train_loss": -27.72016716003418, "global_step": 534724, "epoch": 6442} {"train_loss": -27.559280395507812, "global_step": 534725, "epoch": 6442} {"train_loss": -27.787683486938477, "global_step": 534726, "epoch": 6442} {"train_loss": -27.63262367248535, "global_step": 534727, "epoch": 6442} {"train_loss": -27.761754989624023, "global_step": 534728, "epoch": 6442} {"train_loss": -27.92255210876465, "global_step": 534729, "epoch": 6442} {"train_loss": -27.580835342407227, "global_step": 534730, "epoch": 6442} {"train_loss": -27.83909034729004, "global_step": 534731, "epoch": 6442} {"train_loss": -27.7043399810791, "global_step": 534732, "epoch": 6442} {"train_loss": -27.59356117248535, "global_step": 534733, "epoch": 6442} {"train_loss": -27.752338409423828, "global_step": 534734, "epoch": 6442} {"train_loss": -27.6329288482666, "global_step": 534735, "epoch": 6442} {"train_loss": -27.6641788482666, "global_step": 534736, "epoch": 6442} {"train_loss": -27.444351196289062, "global_step": 534737, "epoch": 6442} {"train_loss": -27.532459259033203, "global_step": 534738, "epoch": 6442} {"train_loss": -27.799163818359375, "global_step": 534739, "epoch": 6442} {"train_loss": -27.842878341674805, "global_step": 534740, "epoch": 6442} {"train_loss": -27.344196319580078, "global_step": 534741, "epoch": 6442} {"train_loss": -27.129545211791992, "global_step": 534742, "epoch": 6442} {"train_loss": -27.339645385742188, "global_step": 534743, "epoch": 6442} {"train_loss": -27.503082275390625, "global_step": 534744, "epoch": 6442} {"train_loss": -27.230716705322266, "global_step": 534745, "epoch": 6442} {"train_loss": -27.62299156188965, "global_step": 534746, "epoch": 6442} {"train_loss": -27.62934684753418, "global_step": 534747, "epoch": 6442} {"train_loss": -27.604232788085938, "global_step": 534748, "epoch": 6442} {"train_loss": -27.982589721679688, "global_step": 534749, "epoch": 6442} {"train_loss": -27.84950828552246, "global_step": 534750, "epoch": 6442} {"train_loss": -27.488727569580078, "global_step": 534751, "epoch": 6442} {"train_loss": -28.114688873291016, "global_step": 534752, "epoch": 6442} {"train_loss": -27.277982711791992, "global_step": 534753, "epoch": 6442} {"train_loss": -27.17412757873535, "global_step": 534754, "epoch": 6442} {"train_loss": -26.250394821166992, "global_step": 534755, "epoch": 6442} {"train_loss": -26.713703155517578, "global_step": 534756, "epoch": 6442} {"train_loss": -26.737775802612305, "global_step": 534757, "epoch": 6442} {"train_loss": -27.6814022064209, "global_step": 534758, "epoch": 6442} {"train_loss": -26.84014892578125, "global_step": 534759, "epoch": 6442} {"train_loss": -26.8276424407959, "global_step": 534760, "epoch": 6442} {"train_loss": -27.027868270874023, "global_step": 534761, "epoch": 6442} {"train_loss": -27.507720947265625, "global_step": 534762, "epoch": 6442} {"train_loss": -27.053735733032227, "global_step": 534763, "epoch": 6442} {"train_loss": -27.47039794921875, "global_step": 534764, "epoch": 6442} {"train_loss": -27.69520378112793, "global_step": 534765, "epoch": 6442} {"train_loss": -27.106367111206055, "global_step": 534766, "epoch": 6442} {"train_loss": -27.686664581298828, "global_step": 534767, "epoch": 6442} {"train_loss": -27.36633277801146, "global_step": 534768, "epoch": 6442, "val_loss": 6541474.5} {"train_loss": -27.232070922851562, "global_step": 534769, "epoch": 6443} {"train_loss": -26.795446395874023, "global_step": 534770, "epoch": 6443} {"train_loss": -27.1409969329834, "global_step": 534771, "epoch": 6443} {"train_loss": -27.216825485229492, "global_step": 534772, "epoch": 6443} {"train_loss": -26.819244384765625, "global_step": 534773, "epoch": 6443} {"train_loss": -27.40952491760254, "global_step": 534774, "epoch": 6443} {"train_loss": -27.2054443359375, "global_step": 534775, "epoch": 6443} {"train_loss": -27.112396240234375, "global_step": 534776, "epoch": 6443} {"train_loss": -27.318286895751953, "global_step": 534777, "epoch": 6443} {"train_loss": -27.630258560180664, "global_step": 534778, "epoch": 6443} {"train_loss": -27.427152633666992, "global_step": 534779, "epoch": 6443} {"train_loss": -27.611669540405273, "global_step": 534780, "epoch": 6443} {"train_loss": -27.455366134643555, "global_step": 534781, "epoch": 6443} {"train_loss": -27.20431900024414, "global_step": 534782, "epoch": 6443} {"train_loss": -27.503986358642578, "global_step": 534783, "epoch": 6443} {"train_loss": -27.48162269592285, "global_step": 534784, "epoch": 6443} {"train_loss": -27.278600692749023, "global_step": 534785, "epoch": 6443} {"train_loss": -27.405445098876953, "global_step": 534786, "epoch": 6443} {"train_loss": -27.59824562072754, "global_step": 534787, "epoch": 6443} {"train_loss": -27.78028678894043, "global_step": 534788, "epoch": 6443} {"train_loss": -27.84932518005371, "global_step": 534789, "epoch": 6443} {"train_loss": -27.90799903869629, "global_step": 534790, "epoch": 6443} {"train_loss": -27.771921157836914, "global_step": 534791, "epoch": 6443} {"train_loss": -27.748443603515625, "global_step": 534792, "epoch": 6443} {"train_loss": -27.910160064697266, "global_step": 534793, "epoch": 6443} {"train_loss": -27.706064224243164, "global_step": 534794, "epoch": 6443} {"train_loss": -27.944074630737305, "global_step": 534795, "epoch": 6443} {"train_loss": -27.483579635620117, "global_step": 534796, "epoch": 6443} {"train_loss": -28.017013549804688, "global_step": 534797, "epoch": 6443} {"train_loss": -27.78167724609375, "global_step": 534798, "epoch": 6443} {"train_loss": -27.750019073486328, "global_step": 534799, "epoch": 6443} {"train_loss": -27.652851104736328, "global_step": 534800, "epoch": 6443} {"train_loss": -27.89130210876465, "global_step": 534801, "epoch": 6443} {"train_loss": -27.948495864868164, "global_step": 534802, "epoch": 6443} {"train_loss": -27.643756866455078, "global_step": 534803, "epoch": 6443} {"train_loss": -27.857385635375977, "global_step": 534804, "epoch": 6443} {"train_loss": -27.713531494140625, "global_step": 534805, "epoch": 6443} {"train_loss": -27.329486846923828, "global_step": 534806, "epoch": 6443} {"train_loss": -27.328876495361328, "global_step": 534807, "epoch": 6443} {"train_loss": -27.5759220123291, "global_step": 534808, "epoch": 6443} {"train_loss": -27.590274810791016, "global_step": 534809, "epoch": 6443} {"train_loss": -27.27594566345215, "global_step": 534810, "epoch": 6443} {"train_loss": -27.3691349029541, "global_step": 534811, "epoch": 6443} {"train_loss": -27.74275779724121, "global_step": 534812, "epoch": 6443} {"train_loss": -27.94086265563965, "global_step": 534813, "epoch": 6443} {"train_loss": -27.29798698425293, "global_step": 534814, "epoch": 6443} {"train_loss": -27.193708419799805, "global_step": 534815, "epoch": 6443} {"train_loss": -27.186071395874023, "global_step": 534816, "epoch": 6443} {"train_loss": -27.168893814086914, "global_step": 534817, "epoch": 6443} {"train_loss": -27.40052604675293, "global_step": 534818, "epoch": 6443} {"train_loss": -27.733997344970703, "global_step": 534819, "epoch": 6443} {"train_loss": -27.70184898376465, "global_step": 534820, "epoch": 6443} {"train_loss": -27.46185302734375, "global_step": 534821, "epoch": 6443} {"train_loss": -27.58186149597168, "global_step": 534822, "epoch": 6443} {"train_loss": -27.7421875, "global_step": 534823, "epoch": 6443} {"train_loss": -27.290151596069336, "global_step": 534824, "epoch": 6443} {"train_loss": -27.522876739501953, "global_step": 534825, "epoch": 6443} {"train_loss": -28.231403350830078, "global_step": 534826, "epoch": 6443} {"train_loss": -27.196063995361328, "global_step": 534827, "epoch": 6443} {"train_loss": -27.684553146362305, "global_step": 534828, "epoch": 6443} {"train_loss": -27.85028648376465, "global_step": 534829, "epoch": 6443} {"train_loss": -28.00146484375, "global_step": 534830, "epoch": 6443} {"train_loss": -27.680997848510742, "global_step": 534831, "epoch": 6443} {"train_loss": -27.30803871154785, "global_step": 534832, "epoch": 6443} {"train_loss": -27.912261962890625, "global_step": 534833, "epoch": 6443} {"train_loss": -27.44744873046875, "global_step": 534834, "epoch": 6443} {"train_loss": -28.105106353759766, "global_step": 534835, "epoch": 6443} {"train_loss": -28.157928466796875, "global_step": 534836, "epoch": 6443} {"train_loss": -27.6924991607666, "global_step": 534837, "epoch": 6443} {"train_loss": -27.651533126831055, "global_step": 534838, "epoch": 6443} {"train_loss": -27.746612548828125, "global_step": 534839, "epoch": 6443} {"train_loss": -27.69270133972168, "global_step": 534840, "epoch": 6443} {"train_loss": -27.373077392578125, "global_step": 534841, "epoch": 6443} {"train_loss": -27.76589012145996, "global_step": 534842, "epoch": 6443} {"train_loss": -27.383947372436523, "global_step": 534843, "epoch": 6443} {"train_loss": -27.683271408081055, "global_step": 534844, "epoch": 6443} {"train_loss": -27.809789657592773, "global_step": 534845, "epoch": 6443} {"train_loss": -27.414594650268555, "global_step": 534846, "epoch": 6443} {"train_loss": -27.614654541015625, "global_step": 534847, "epoch": 6443} {"train_loss": -27.73052978515625, "global_step": 534848, "epoch": 6443} {"train_loss": -27.498355865478516, "global_step": 534849, "epoch": 6443} {"train_loss": -27.324460983276367, "global_step": 534850, "epoch": 6443} {"train_loss": -27.56495705570083, "global_step": 534851, "epoch": 6443, "val_loss": 6490611.5} {"train_loss": -23.31479263305664, "global_step": 534852, "epoch": 6444} {"train_loss": -22.271879196166992, "global_step": 534853, "epoch": 6444} {"train_loss": -26.031768798828125, "global_step": 534854, "epoch": 6444} {"train_loss": -24.966466903686523, "global_step": 534855, "epoch": 6444} {"train_loss": -26.079486846923828, "global_step": 534856, "epoch": 6444} {"train_loss": -25.269437789916992, "global_step": 534857, "epoch": 6444} {"train_loss": -26.485675811767578, "global_step": 534858, "epoch": 6444} {"train_loss": -26.17465591430664, "global_step": 534859, "epoch": 6444} {"train_loss": -26.298126220703125, "global_step": 534860, "epoch": 6444} {"train_loss": -26.575244903564453, "global_step": 534861, "epoch": 6444} {"train_loss": -26.62798500061035, "global_step": 534862, "epoch": 6444} {"train_loss": -26.740636825561523, "global_step": 534863, "epoch": 6444} {"train_loss": -26.538312911987305, "global_step": 534864, "epoch": 6444} {"train_loss": -26.632034301757812, "global_step": 534865, "epoch": 6444} {"train_loss": -26.946063995361328, "global_step": 534866, "epoch": 6444} {"train_loss": -26.518482208251953, "global_step": 534867, "epoch": 6444} {"train_loss": -26.934232711791992, "global_step": 534868, "epoch": 6444} {"train_loss": -26.962610244750977, "global_step": 534869, "epoch": 6444} {"train_loss": -26.955371856689453, "global_step": 534870, "epoch": 6444} {"train_loss": -26.7325439453125, "global_step": 534871, "epoch": 6444} {"train_loss": -26.756357192993164, "global_step": 534872, "epoch": 6444} {"train_loss": -27.0623722076416, "global_step": 534873, "epoch": 6444} {"train_loss": -26.968618392944336, "global_step": 534874, "epoch": 6444} {"train_loss": -26.849740982055664, "global_step": 534875, "epoch": 6444} {"train_loss": -27.173370361328125, "global_step": 534876, "epoch": 6444} {"train_loss": -27.19166374206543, "global_step": 534877, "epoch": 6444} {"train_loss": -27.322851181030273, "global_step": 534878, "epoch": 6444} {"train_loss": -27.073535919189453, "global_step": 534879, "epoch": 6444} {"train_loss": -26.9744815826416, "global_step": 534880, "epoch": 6444} {"train_loss": -27.450571060180664, "global_step": 534881, "epoch": 6444} {"train_loss": -27.265216827392578, "global_step": 534882, "epoch": 6444} {"train_loss": -27.5966796875, "global_step": 534883, "epoch": 6444} {"train_loss": -27.294574737548828, "global_step": 534884, "epoch": 6444} {"train_loss": -27.316364288330078, "global_step": 534885, "epoch": 6444} {"train_loss": -27.006927490234375, "global_step": 534886, "epoch": 6444} {"train_loss": -27.155866622924805, "global_step": 534887, "epoch": 6444} {"train_loss": -27.403249740600586, "global_step": 534888, "epoch": 6444} {"train_loss": -27.345306396484375, "global_step": 534889, "epoch": 6444} {"train_loss": -27.350324630737305, "global_step": 534890, "epoch": 6444} {"train_loss": -27.48480796813965, "global_step": 534891, "epoch": 6444} {"train_loss": -26.99329948425293, "global_step": 534892, "epoch": 6444} {"train_loss": -27.302377700805664, "global_step": 534893, "epoch": 6444} {"train_loss": -27.425390243530273, "global_step": 534894, "epoch": 6444} {"train_loss": -26.999731063842773, "global_step": 534895, "epoch": 6444} {"train_loss": -27.626394271850586, "global_step": 534896, "epoch": 6444} {"train_loss": -27.318225860595703, "global_step": 534897, "epoch": 6444} {"train_loss": -27.34107780456543, "global_step": 534898, "epoch": 6444} {"train_loss": -27.518789291381836, "global_step": 534899, "epoch": 6444} {"train_loss": -27.79632568359375, "global_step": 534900, "epoch": 6444} {"train_loss": -27.554519653320312, "global_step": 534901, "epoch": 6444} {"train_loss": -27.58754539489746, "global_step": 534902, "epoch": 6444} {"train_loss": -27.458723068237305, "global_step": 534903, "epoch": 6444} {"train_loss": -27.6359920501709, "global_step": 534904, "epoch": 6444} {"train_loss": -27.5082950592041, "global_step": 534905, "epoch": 6444} {"train_loss": -27.7687931060791, "global_step": 534906, "epoch": 6444} {"train_loss": -27.419921875, "global_step": 534907, "epoch": 6444} {"train_loss": -27.600696563720703, "global_step": 534908, "epoch": 6444} {"train_loss": -27.15045166015625, "global_step": 534909, "epoch": 6444} {"train_loss": -27.67303466796875, "global_step": 534910, "epoch": 6444} {"train_loss": -27.86528968811035, "global_step": 534911, "epoch": 6444} {"train_loss": -27.59698486328125, "global_step": 534912, "epoch": 6444} {"train_loss": -28.03598976135254, "global_step": 534913, "epoch": 6444} {"train_loss": -27.331787109375, "global_step": 534914, "epoch": 6444} {"train_loss": -27.099470138549805, "global_step": 534915, "epoch": 6444} {"train_loss": -27.2366943359375, "global_step": 534916, "epoch": 6444} {"train_loss": -27.452646255493164, "global_step": 534917, "epoch": 6444} {"train_loss": -27.234304428100586, "global_step": 534918, "epoch": 6444} {"train_loss": -27.16819190979004, "global_step": 534919, "epoch": 6444} {"train_loss": -27.6593017578125, "global_step": 534920, "epoch": 6444} {"train_loss": -27.350812911987305, "global_step": 534921, "epoch": 6444} {"train_loss": -27.53657341003418, "global_step": 534922, "epoch": 6444} {"train_loss": -27.532819747924805, "global_step": 534923, "epoch": 6444} {"train_loss": -27.30512046813965, "global_step": 534924, "epoch": 6444} {"train_loss": -27.459278106689453, "global_step": 534925, "epoch": 6444} {"train_loss": -27.51861572265625, "global_step": 534926, "epoch": 6444} {"train_loss": -27.032407760620117, "global_step": 534927, "epoch": 6444} {"train_loss": -27.3931827545166, "global_step": 534928, "epoch": 6444} {"train_loss": -27.543508529663086, "global_step": 534929, "epoch": 6444} {"train_loss": -27.65394401550293, "global_step": 534930, "epoch": 6444} {"train_loss": -27.403242111206055, "global_step": 534931, "epoch": 6444} {"train_loss": -27.7631778717041, "global_step": 534932, "epoch": 6444} {"train_loss": -27.6037654876709, "global_step": 534933, "epoch": 6444} {"train_loss": -27.058342991105047, "global_step": 534934, "epoch": 6444, "val_loss": 6528962.0} {"train_loss": -24.364395141601562, "global_step": 534935, "epoch": 6445} {"train_loss": -24.82352638244629, "global_step": 534936, "epoch": 6445} {"train_loss": -27.2658748626709, "global_step": 534937, "epoch": 6445} {"train_loss": -26.214624404907227, "global_step": 534938, "epoch": 6445} {"train_loss": -27.10027503967285, "global_step": 534939, "epoch": 6445} {"train_loss": -25.672544479370117, "global_step": 534940, "epoch": 6445} {"train_loss": -26.9075870513916, "global_step": 534941, "epoch": 6445} {"train_loss": -26.681562423706055, "global_step": 534942, "epoch": 6445} {"train_loss": -26.559356689453125, "global_step": 534943, "epoch": 6445} {"train_loss": -26.226428985595703, "global_step": 534944, "epoch": 6445} {"train_loss": -26.436811447143555, "global_step": 534945, "epoch": 6445} {"train_loss": -27.032644271850586, "global_step": 534946, "epoch": 6445} {"train_loss": -27.094751358032227, "global_step": 534947, "epoch": 6445} {"train_loss": -26.6295166015625, "global_step": 534948, "epoch": 6445} {"train_loss": -26.68477439880371, "global_step": 534949, "epoch": 6445} {"train_loss": -27.250532150268555, "global_step": 534950, "epoch": 6445} {"train_loss": -26.679182052612305, "global_step": 534951, "epoch": 6445} {"train_loss": -27.282806396484375, "global_step": 534952, "epoch": 6445} {"train_loss": -27.174283981323242, "global_step": 534953, "epoch": 6445} {"train_loss": -26.741559982299805, "global_step": 534954, "epoch": 6445} {"train_loss": -26.807056427001953, "global_step": 534955, "epoch": 6445} {"train_loss": -27.3964786529541, "global_step": 534956, "epoch": 6445} {"train_loss": -27.240436553955078, "global_step": 534957, "epoch": 6445} {"train_loss": -26.98215675354004, "global_step": 534958, "epoch": 6445} {"train_loss": -27.360004425048828, "global_step": 534959, "epoch": 6445} {"train_loss": -27.38970947265625, "global_step": 534960, "epoch": 6445} {"train_loss": -27.436670303344727, "global_step": 534961, "epoch": 6445} {"train_loss": -27.237506866455078, "global_step": 534962, "epoch": 6445} {"train_loss": -27.29499626159668, "global_step": 534963, "epoch": 6445} {"train_loss": -27.463302612304688, "global_step": 534964, "epoch": 6445} {"train_loss": -27.67412757873535, "global_step": 534965, "epoch": 6445} {"train_loss": -27.216327667236328, "global_step": 534966, "epoch": 6445} {"train_loss": -27.609893798828125, "global_step": 534967, "epoch": 6445} {"train_loss": -27.517236709594727, "global_step": 534968, "epoch": 6445} {"train_loss": -27.857715606689453, "global_step": 534969, "epoch": 6445} {"train_loss": -27.445114135742188, "global_step": 534970, "epoch": 6445} {"train_loss": -27.338550567626953, "global_step": 534971, "epoch": 6445} {"train_loss": -27.5512752532959, "global_step": 534972, "epoch": 6445} {"train_loss": -27.55206871032715, "global_step": 534973, "epoch": 6445} {"train_loss": -27.744403839111328, "global_step": 534974, "epoch": 6445} {"train_loss": -27.444318771362305, "global_step": 534975, "epoch": 6445} {"train_loss": -27.36105728149414, "global_step": 534976, "epoch": 6445} {"train_loss": -27.508880615234375, "global_step": 534977, "epoch": 6445} {"train_loss": -27.818439483642578, "global_step": 534978, "epoch": 6445} {"train_loss": -27.846359252929688, "global_step": 534979, "epoch": 6445} {"train_loss": -27.165863037109375, "global_step": 534980, "epoch": 6445} {"train_loss": -27.982751846313477, "global_step": 534981, "epoch": 6445} {"train_loss": -27.713748931884766, "global_step": 534982, "epoch": 6445} {"train_loss": -27.744237899780273, "global_step": 534983, "epoch": 6445} {"train_loss": -27.910184860229492, "global_step": 534984, "epoch": 6445} {"train_loss": -27.36712646484375, "global_step": 534985, "epoch": 6445} {"train_loss": -27.703155517578125, "global_step": 534986, "epoch": 6445} {"train_loss": -27.91543960571289, "global_step": 534987, "epoch": 6445} {"train_loss": -27.982099533081055, "global_step": 534988, "epoch": 6445} {"train_loss": -27.9727783203125, "global_step": 534989, "epoch": 6445} {"train_loss": -27.51806640625, "global_step": 534990, "epoch": 6445} {"train_loss": -27.543100357055664, "global_step": 534991, "epoch": 6445} {"train_loss": -27.652973175048828, "global_step": 534992, "epoch": 6445} {"train_loss": -28.01056480407715, "global_step": 534993, "epoch": 6445} {"train_loss": -27.319171905517578, "global_step": 534994, "epoch": 6445} {"train_loss": -27.5870418548584, "global_step": 534995, "epoch": 6445} {"train_loss": -27.495807647705078, "global_step": 534996, "epoch": 6445} {"train_loss": -27.5810489654541, "global_step": 534997, "epoch": 6445} {"train_loss": -27.68366050720215, "global_step": 534998, "epoch": 6445} {"train_loss": -27.595401763916016, "global_step": 534999, "epoch": 6445} {"train_loss": -27.4034366607666, "global_step": 535000, "epoch": 6445} {"train_loss": -27.658313751220703, "global_step": 535001, "epoch": 6445} {"train_loss": -27.961227416992188, "global_step": 535002, "epoch": 6445} {"train_loss": -27.609268188476562, "global_step": 535003, "epoch": 6445} {"train_loss": -27.621484756469727, "global_step": 535004, "epoch": 6445} {"train_loss": -28.0223331451416, "global_step": 535005, "epoch": 6445} {"train_loss": -27.76513671875, "global_step": 535006, "epoch": 6445} {"train_loss": -27.8968563079834, "global_step": 535007, "epoch": 6445} {"train_loss": -27.976667404174805, "global_step": 535008, "epoch": 6445} {"train_loss": -27.98062515258789, "global_step": 535009, "epoch": 6445} {"train_loss": -27.90549087524414, "global_step": 535010, "epoch": 6445} {"train_loss": -27.612165451049805, "global_step": 535011, "epoch": 6445} {"train_loss": -27.63020133972168, "global_step": 535012, "epoch": 6445} {"train_loss": -28.055633544921875, "global_step": 535013, "epoch": 6445} {"train_loss": -27.88728141784668, "global_step": 535014, "epoch": 6445} {"train_loss": -27.793420791625977, "global_step": 535015, "epoch": 6445} {"train_loss": -27.65810203552246, "global_step": 535016, "epoch": 6445} {"train_loss": -27.329973979168628, "global_step": 535017, "epoch": 6445, "val_loss": 6564319.0} {"train_loss": -27.44849967956543, "global_step": 535018, "epoch": 6446} {"train_loss": -27.17905044555664, "global_step": 535019, "epoch": 6446} {"train_loss": -27.627826690673828, "global_step": 535020, "epoch": 6446} {"train_loss": -27.496374130249023, "global_step": 535021, "epoch": 6446} {"train_loss": -27.355926513671875, "global_step": 535022, "epoch": 6446} {"train_loss": -27.650848388671875, "global_step": 535023, "epoch": 6446} {"train_loss": -27.621084213256836, "global_step": 535024, "epoch": 6446} {"train_loss": -27.30561637878418, "global_step": 535025, "epoch": 6446} {"train_loss": -27.257959365844727, "global_step": 535026, "epoch": 6446} {"train_loss": -27.387226104736328, "global_step": 535027, "epoch": 6446} {"train_loss": -27.5240535736084, "global_step": 535028, "epoch": 6446} {"train_loss": -27.30414390563965, "global_step": 535029, "epoch": 6446} {"train_loss": -27.637042999267578, "global_step": 535030, "epoch": 6446} {"train_loss": -27.594282150268555, "global_step": 535031, "epoch": 6446} {"train_loss": -27.787860870361328, "global_step": 535032, "epoch": 6446} {"train_loss": -27.692108154296875, "global_step": 535033, "epoch": 6446} {"train_loss": -27.536039352416992, "global_step": 535034, "epoch": 6446} {"train_loss": -27.7503719329834, "global_step": 535035, "epoch": 6446} {"train_loss": -27.756128311157227, "global_step": 535036, "epoch": 6446} {"train_loss": -27.595355987548828, "global_step": 535037, "epoch": 6446} {"train_loss": -27.91461753845215, "global_step": 535038, "epoch": 6446} {"train_loss": -27.564279556274414, "global_step": 535039, "epoch": 6446} {"train_loss": -27.86089515686035, "global_step": 535040, "epoch": 6446} {"train_loss": -27.698339462280273, "global_step": 535041, "epoch": 6446} {"train_loss": -27.646411895751953, "global_step": 535042, "epoch": 6446} {"train_loss": -27.73927116394043, "global_step": 535043, "epoch": 6446} {"train_loss": -27.747419357299805, "global_step": 535044, "epoch": 6446} {"train_loss": -27.745563507080078, "global_step": 535045, "epoch": 6446} {"train_loss": -27.921167373657227, "global_step": 535046, "epoch": 6446} {"train_loss": -27.623126983642578, "global_step": 535047, "epoch": 6446} {"train_loss": -27.92353630065918, "global_step": 535048, "epoch": 6446} {"train_loss": -27.83098793029785, "global_step": 535049, "epoch": 6446} {"train_loss": -27.70575523376465, "global_step": 535050, "epoch": 6446} {"train_loss": -27.879003524780273, "global_step": 535051, "epoch": 6446} {"train_loss": -27.15069580078125, "global_step": 535052, "epoch": 6446} {"train_loss": -27.762845993041992, "global_step": 535053, "epoch": 6446} {"train_loss": -27.328479766845703, "global_step": 535054, "epoch": 6446} {"train_loss": -27.92612075805664, "global_step": 535055, "epoch": 6446} {"train_loss": -27.016590118408203, "global_step": 535056, "epoch": 6446} {"train_loss": -27.53919792175293, "global_step": 535057, "epoch": 6446} {"train_loss": -27.457794189453125, "global_step": 535058, "epoch": 6446} {"train_loss": -27.46620750427246, "global_step": 535059, "epoch": 6446} {"train_loss": -27.19028663635254, "global_step": 535060, "epoch": 6446} {"train_loss": -27.66627311706543, "global_step": 535061, "epoch": 6446} {"train_loss": -27.603271484375, "global_step": 535062, "epoch": 6446} {"train_loss": -27.53865623474121, "global_step": 535063, "epoch": 6446} {"train_loss": -27.6866397857666, "global_step": 535064, "epoch": 6446} {"train_loss": -27.44253921508789, "global_step": 535065, "epoch": 6446} {"train_loss": -27.598501205444336, "global_step": 535066, "epoch": 6446} {"train_loss": -27.532285690307617, "global_step": 535067, "epoch": 6446} {"train_loss": -27.278181076049805, "global_step": 535068, "epoch": 6446} {"train_loss": -27.790699005126953, "global_step": 535069, "epoch": 6446} {"train_loss": -27.48423194885254, "global_step": 535070, "epoch": 6446} {"train_loss": -27.350238800048828, "global_step": 535071, "epoch": 6446} {"train_loss": -27.386035919189453, "global_step": 535072, "epoch": 6446} {"train_loss": -27.595510482788086, "global_step": 535073, "epoch": 6446} {"train_loss": -27.512786865234375, "global_step": 535074, "epoch": 6446} {"train_loss": -27.275724411010742, "global_step": 535075, "epoch": 6446} {"train_loss": -27.07317543029785, "global_step": 535076, "epoch": 6446} {"train_loss": -27.535070419311523, "global_step": 535077, "epoch": 6446} {"train_loss": -27.484338760375977, "global_step": 535078, "epoch": 6446} {"train_loss": -27.46030044555664, "global_step": 535079, "epoch": 6446} {"train_loss": -27.57404899597168, "global_step": 535080, "epoch": 6446} {"train_loss": -27.656208038330078, "global_step": 535081, "epoch": 6446} {"train_loss": -27.36517906188965, "global_step": 535082, "epoch": 6446} {"train_loss": -27.91010856628418, "global_step": 535083, "epoch": 6446} {"train_loss": -27.652952194213867, "global_step": 535084, "epoch": 6446} {"train_loss": -27.752344131469727, "global_step": 535085, "epoch": 6446} {"train_loss": -27.562915802001953, "global_step": 535086, "epoch": 6446} {"train_loss": -27.841358184814453, "global_step": 535087, "epoch": 6446} {"train_loss": -27.76950454711914, "global_step": 535088, "epoch": 6446} {"train_loss": -27.619556427001953, "global_step": 535089, "epoch": 6446} {"train_loss": -27.700672149658203, "global_step": 535090, "epoch": 6446} {"train_loss": -27.57477378845215, "global_step": 535091, "epoch": 6446} {"train_loss": -27.799428939819336, "global_step": 535092, "epoch": 6446} {"train_loss": -27.905902862548828, "global_step": 535093, "epoch": 6446} {"train_loss": -27.7176456451416, "global_step": 535094, "epoch": 6446} {"train_loss": -27.382734298706055, "global_step": 535095, "epoch": 6446} {"train_loss": -27.854171752929688, "global_step": 535096, "epoch": 6446} {"train_loss": -27.68060874938965, "global_step": 535097, "epoch": 6446} {"train_loss": -27.774072647094727, "global_step": 535098, "epoch": 6446} {"train_loss": -27.921594619750977, "global_step": 535099, "epoch": 6446} {"train_loss": -27.592688089393707, "global_step": 535100, "epoch": 6446, "val_loss": 6509646.0} {"train_loss": -27.482986450195312, "global_step": 535101, "epoch": 6447} {"train_loss": -26.383386611938477, "global_step": 535102, "epoch": 6447} {"train_loss": -25.295480728149414, "global_step": 535103, "epoch": 6447} {"train_loss": -25.80109214782715, "global_step": 535104, "epoch": 6447} {"train_loss": -26.881011962890625, "global_step": 535105, "epoch": 6447} {"train_loss": -26.979894638061523, "global_step": 535106, "epoch": 6447} {"train_loss": -27.207242965698242, "global_step": 535107, "epoch": 6447} {"train_loss": -26.778303146362305, "global_step": 535108, "epoch": 6447} {"train_loss": -27.33918571472168, "global_step": 535109, "epoch": 6447} {"train_loss": -27.18111228942871, "global_step": 535110, "epoch": 6447} {"train_loss": -26.635101318359375, "global_step": 535111, "epoch": 6447} {"train_loss": -26.99476432800293, "global_step": 535112, "epoch": 6447} {"train_loss": -27.206466674804688, "global_step": 535113, "epoch": 6447} {"train_loss": -27.265966415405273, "global_step": 535114, "epoch": 6447} {"train_loss": -27.2211971282959, "global_step": 535115, "epoch": 6447} {"train_loss": -27.38116455078125, "global_step": 535116, "epoch": 6447} {"train_loss": -27.188108444213867, "global_step": 535117, "epoch": 6447} {"train_loss": -27.574970245361328, "global_step": 535118, "epoch": 6447} {"train_loss": -27.10713768005371, "global_step": 535119, "epoch": 6447} {"train_loss": -27.34629249572754, "global_step": 535120, "epoch": 6447} {"train_loss": -27.56005859375, "global_step": 535121, "epoch": 6447} {"train_loss": -27.214887619018555, "global_step": 535122, "epoch": 6447} {"train_loss": -26.950571060180664, "global_step": 535123, "epoch": 6447} {"train_loss": -27.709060668945312, "global_step": 535124, "epoch": 6447} {"train_loss": -27.3869571685791, "global_step": 535125, "epoch": 6447} {"train_loss": -27.5317440032959, "global_step": 535126, "epoch": 6447} {"train_loss": -27.809906005859375, "global_step": 535127, "epoch": 6447} {"train_loss": -27.636371612548828, "global_step": 535128, "epoch": 6447} {"train_loss": -27.421186447143555, "global_step": 535129, "epoch": 6447} {"train_loss": -27.12293815612793, "global_step": 535130, "epoch": 6447} {"train_loss": -27.409780502319336, "global_step": 535131, "epoch": 6447} {"train_loss": -27.592853546142578, "global_step": 535132, "epoch": 6447} {"train_loss": -27.748388290405273, "global_step": 535133, "epoch": 6447} {"train_loss": -27.535245895385742, "global_step": 535134, "epoch": 6447} {"train_loss": -27.37183952331543, "global_step": 535135, "epoch": 6447} {"train_loss": -27.625349044799805, "global_step": 535136, "epoch": 6447} {"train_loss": -27.943801879882812, "global_step": 535137, "epoch": 6447} {"train_loss": -27.797382354736328, "global_step": 535138, "epoch": 6447} {"train_loss": -27.73480796813965, "global_step": 535139, "epoch": 6447} {"train_loss": -27.60079002380371, "global_step": 535140, "epoch": 6447} {"train_loss": -27.65523338317871, "global_step": 535141, "epoch": 6447} {"train_loss": -28.061826705932617, "global_step": 535142, "epoch": 6447} {"train_loss": -27.300134658813477, "global_step": 535143, "epoch": 6447} {"train_loss": -27.722692489624023, "global_step": 535144, "epoch": 6447} {"train_loss": -27.960607528686523, "global_step": 535145, "epoch": 6447} {"train_loss": -27.917327880859375, "global_step": 535146, "epoch": 6447} {"train_loss": -27.520679473876953, "global_step": 535147, "epoch": 6447} {"train_loss": -27.433713912963867, "global_step": 535148, "epoch": 6447} {"train_loss": -27.66950798034668, "global_step": 535149, "epoch": 6447} {"train_loss": -27.73163414001465, "global_step": 535150, "epoch": 6447} {"train_loss": -27.87969970703125, "global_step": 535151, "epoch": 6447} {"train_loss": -27.817197799682617, "global_step": 535152, "epoch": 6447} {"train_loss": -27.761133193969727, "global_step": 535153, "epoch": 6447} {"train_loss": -27.795806884765625, "global_step": 535154, "epoch": 6447} {"train_loss": -27.571577072143555, "global_step": 535155, "epoch": 6447} {"train_loss": -27.630420684814453, "global_step": 535156, "epoch": 6447} {"train_loss": -27.734344482421875, "global_step": 535157, "epoch": 6447} {"train_loss": -27.495864868164062, "global_step": 535158, "epoch": 6447} {"train_loss": -27.736724853515625, "global_step": 535159, "epoch": 6447} {"train_loss": -27.278722763061523, "global_step": 535160, "epoch": 6447} {"train_loss": -27.596179962158203, "global_step": 535161, "epoch": 6447} {"train_loss": -27.9243221282959, "global_step": 535162, "epoch": 6447} {"train_loss": -27.385244369506836, "global_step": 535163, "epoch": 6447} {"train_loss": -27.989395141601562, "global_step": 535164, "epoch": 6447} {"train_loss": -27.569934844970703, "global_step": 535165, "epoch": 6447} {"train_loss": -27.87518310546875, "global_step": 535166, "epoch": 6447} {"train_loss": -27.65083122253418, "global_step": 535167, "epoch": 6447} {"train_loss": -27.446802139282227, "global_step": 535168, "epoch": 6447} {"train_loss": -27.399885177612305, "global_step": 535169, "epoch": 6447} {"train_loss": -27.944873809814453, "global_step": 535170, "epoch": 6447} {"train_loss": -27.14313316345215, "global_step": 535171, "epoch": 6447} {"train_loss": -27.649377822875977, "global_step": 535172, "epoch": 6447} {"train_loss": -26.945417404174805, "global_step": 535173, "epoch": 6447} {"train_loss": -27.089893341064453, "global_step": 535174, "epoch": 6447} {"train_loss": -27.793725967407227, "global_step": 535175, "epoch": 6447} {"train_loss": -28.028654098510742, "global_step": 535176, "epoch": 6447} {"train_loss": -26.89310073852539, "global_step": 535177, "epoch": 6447} {"train_loss": -27.522628784179688, "global_step": 535178, "epoch": 6447} {"train_loss": -27.224750518798828, "global_step": 535179, "epoch": 6447} {"train_loss": -27.416616439819336, "global_step": 535180, "epoch": 6447} {"train_loss": -27.60321044921875, "global_step": 535181, "epoch": 6447} {"train_loss": -27.338653564453125, "global_step": 535182, "epoch": 6447} {"train_loss": -27.431836989988764, "global_step": 535183, "epoch": 6447, "val_loss": 6673779.0} {"train_loss": -26.393827438354492, "global_step": 535184, "epoch": 6448} {"train_loss": -25.918954849243164, "global_step": 535185, "epoch": 6448} {"train_loss": -26.271970748901367, "global_step": 535186, "epoch": 6448} {"train_loss": -25.7409725189209, "global_step": 535187, "epoch": 6448} {"train_loss": -26.83102798461914, "global_step": 535188, "epoch": 6448} {"train_loss": -26.401874542236328, "global_step": 535189, "epoch": 6448} {"train_loss": -26.345834732055664, "global_step": 535190, "epoch": 6448} {"train_loss": -26.76275634765625, "global_step": 535191, "epoch": 6448} {"train_loss": -26.521045684814453, "global_step": 535192, "epoch": 6448} {"train_loss": -26.678211212158203, "global_step": 535193, "epoch": 6448} {"train_loss": -26.72576332092285, "global_step": 535194, "epoch": 6448} {"train_loss": -26.808856964111328, "global_step": 535195, "epoch": 6448} {"train_loss": -27.349365234375, "global_step": 535196, "epoch": 6448} {"train_loss": -27.060382843017578, "global_step": 535197, "epoch": 6448} {"train_loss": -27.117605209350586, "global_step": 535198, "epoch": 6448} {"train_loss": -27.07952308654785, "global_step": 535199, "epoch": 6448} {"train_loss": -27.294111251831055, "global_step": 535200, "epoch": 6448} {"train_loss": -26.952604293823242, "global_step": 535201, "epoch": 6448} {"train_loss": -27.164159774780273, "global_step": 535202, "epoch": 6448} {"train_loss": -27.061237335205078, "global_step": 535203, "epoch": 6448} {"train_loss": -26.948352813720703, "global_step": 535204, "epoch": 6448} {"train_loss": -27.572736740112305, "global_step": 535205, "epoch": 6448} {"train_loss": -27.03910255432129, "global_step": 535206, "epoch": 6448} {"train_loss": -27.04052734375, "global_step": 535207, "epoch": 6448} {"train_loss": -27.33180046081543, "global_step": 535208, "epoch": 6448} {"train_loss": -27.30972671508789, "global_step": 535209, "epoch": 6448} {"train_loss": -27.4450626373291, "global_step": 535210, "epoch": 6448} {"train_loss": -27.516828536987305, "global_step": 535211, "epoch": 6448} {"train_loss": -27.449817657470703, "global_step": 535212, "epoch": 6448} {"train_loss": -27.0802001953125, "global_step": 535213, "epoch": 6448} {"train_loss": -27.436838150024414, "global_step": 535214, "epoch": 6448} {"train_loss": -27.546131134033203, "global_step": 535215, "epoch": 6448} {"train_loss": -27.58479118347168, "global_step": 535216, "epoch": 6448} {"train_loss": -27.99848747253418, "global_step": 535217, "epoch": 6448} {"train_loss": -27.476593017578125, "global_step": 535218, "epoch": 6448} {"train_loss": -27.5367488861084, "global_step": 535219, "epoch": 6448} {"train_loss": -27.914560317993164, "global_step": 535220, "epoch": 6448} {"train_loss": -27.607807159423828, "global_step": 535221, "epoch": 6448} {"train_loss": -27.868078231811523, "global_step": 535222, "epoch": 6448} {"train_loss": -27.77176284790039, "global_step": 535223, "epoch": 6448} {"train_loss": -27.645126342773438, "global_step": 535224, "epoch": 6448} {"train_loss": -27.766103744506836, "global_step": 535225, "epoch": 6448} {"train_loss": -27.608076095581055, "global_step": 535226, "epoch": 6448} {"train_loss": -27.844345092773438, "global_step": 535227, "epoch": 6448} {"train_loss": -28.099536895751953, "global_step": 535228, "epoch": 6448} {"train_loss": -27.772520065307617, "global_step": 535229, "epoch": 6448} {"train_loss": -27.73386573791504, "global_step": 535230, "epoch": 6448} {"train_loss": -27.6125545501709, "global_step": 535231, "epoch": 6448} {"train_loss": -27.883939743041992, "global_step": 535232, "epoch": 6448} {"train_loss": -27.819177627563477, "global_step": 535233, "epoch": 6448} {"train_loss": -27.5538272857666, "global_step": 535234, "epoch": 6448} {"train_loss": -27.878583908081055, "global_step": 535235, "epoch": 6448} {"train_loss": -27.705921173095703, "global_step": 535236, "epoch": 6448} {"train_loss": -27.859724044799805, "global_step": 535237, "epoch": 6448} {"train_loss": -27.729389190673828, "global_step": 535238, "epoch": 6448} {"train_loss": -27.92513084411621, "global_step": 535239, "epoch": 6448} {"train_loss": -27.932783126831055, "global_step": 535240, "epoch": 6448} {"train_loss": -28.168909072875977, "global_step": 535241, "epoch": 6448} {"train_loss": -27.988866806030273, "global_step": 535242, "epoch": 6448} {"train_loss": -27.66350746154785, "global_step": 535243, "epoch": 6448} {"train_loss": -28.136667251586914, "global_step": 535244, "epoch": 6448} {"train_loss": -27.726545333862305, "global_step": 535245, "epoch": 6448} {"train_loss": -27.35902976989746, "global_step": 535246, "epoch": 6448} {"train_loss": -27.897321701049805, "global_step": 535247, "epoch": 6448} {"train_loss": -27.83401870727539, "global_step": 535248, "epoch": 6448} {"train_loss": -27.950927734375, "global_step": 535249, "epoch": 6448} {"train_loss": -27.74419593811035, "global_step": 535250, "epoch": 6448} {"train_loss": -27.848270416259766, "global_step": 535251, "epoch": 6448} {"train_loss": -27.735483169555664, "global_step": 535252, "epoch": 6448} {"train_loss": -28.000934600830078, "global_step": 535253, "epoch": 6448} {"train_loss": -28.001361846923828, "global_step": 535254, "epoch": 6448} {"train_loss": -27.624738693237305, "global_step": 535255, "epoch": 6448} {"train_loss": -28.039093017578125, "global_step": 535256, "epoch": 6448} {"train_loss": -27.66798973083496, "global_step": 535257, "epoch": 6448} {"train_loss": -27.464889526367188, "global_step": 535258, "epoch": 6448} {"train_loss": -28.07242774963379, "global_step": 535259, "epoch": 6448} {"train_loss": -27.288976669311523, "global_step": 535260, "epoch": 6448} {"train_loss": -27.221832275390625, "global_step": 535261, "epoch": 6448} {"train_loss": -26.899051666259766, "global_step": 535262, "epoch": 6448} {"train_loss": -27.281827926635742, "global_step": 535263, "epoch": 6448} {"train_loss": -27.669416427612305, "global_step": 535264, "epoch": 6448} {"train_loss": -27.491941452026367, "global_step": 535265, "epoch": 6448} {"train_loss": -27.422074145581348, "global_step": 535266, "epoch": 6448, "val_loss": 6486917.0} {"train_loss": -27.654071807861328, "global_step": 535267, "epoch": 6449} {"train_loss": -27.348846435546875, "global_step": 535268, "epoch": 6449} {"train_loss": -26.76020622253418, "global_step": 535269, "epoch": 6449} {"train_loss": -27.54473876953125, "global_step": 535270, "epoch": 6449} {"train_loss": -27.64165687561035, "global_step": 535271, "epoch": 6449} {"train_loss": -27.12601661682129, "global_step": 535272, "epoch": 6449} {"train_loss": -26.779956817626953, "global_step": 535273, "epoch": 6449} {"train_loss": -27.591339111328125, "global_step": 535274, "epoch": 6449} {"train_loss": -27.00569725036621, "global_step": 535275, "epoch": 6449} {"train_loss": -27.0506534576416, "global_step": 535276, "epoch": 6449} {"train_loss": -27.354419708251953, "global_step": 535277, "epoch": 6449} {"train_loss": -26.828760147094727, "global_step": 535278, "epoch": 6449} {"train_loss": -27.132604598999023, "global_step": 535279, "epoch": 6449} {"train_loss": -27.632368087768555, "global_step": 535280, "epoch": 6449} {"train_loss": -27.053974151611328, "global_step": 535281, "epoch": 6449} {"train_loss": -27.922855377197266, "global_step": 535282, "epoch": 6449} {"train_loss": -27.56507682800293, "global_step": 535283, "epoch": 6449} {"train_loss": -27.425155639648438, "global_step": 535284, "epoch": 6449} {"train_loss": -28.0162410736084, "global_step": 535285, "epoch": 6449} {"train_loss": -27.514291763305664, "global_step": 535286, "epoch": 6449} {"train_loss": -27.506439208984375, "global_step": 535287, "epoch": 6449} {"train_loss": -27.3887882232666, "global_step": 535288, "epoch": 6449} {"train_loss": -27.270282745361328, "global_step": 535289, "epoch": 6449} {"train_loss": -27.2957763671875, "global_step": 535290, "epoch": 6449} {"train_loss": -27.116872787475586, "global_step": 535291, "epoch": 6449} {"train_loss": -27.665912628173828, "global_step": 535292, "epoch": 6449} {"train_loss": -27.597869873046875, "global_step": 535293, "epoch": 6449} {"train_loss": -27.518310546875, "global_step": 535294, "epoch": 6449} {"train_loss": -27.940114974975586, "global_step": 535295, "epoch": 6449} {"train_loss": -27.695905685424805, "global_step": 535296, "epoch": 6449} {"train_loss": -27.528745651245117, "global_step": 535297, "epoch": 6449} {"train_loss": -27.4115047454834, "global_step": 535298, "epoch": 6449} {"train_loss": -27.457778930664062, "global_step": 535299, "epoch": 6449} {"train_loss": -27.6766414642334, "global_step": 535300, "epoch": 6449} {"train_loss": -27.989084243774414, "global_step": 535301, "epoch": 6449} {"train_loss": -27.484210968017578, "global_step": 535302, "epoch": 6449} {"train_loss": -27.8497314453125, "global_step": 535303, "epoch": 6449} {"train_loss": -27.590070724487305, "global_step": 535304, "epoch": 6449} {"train_loss": -27.399011611938477, "global_step": 535305, "epoch": 6449} {"train_loss": -27.684789657592773, "global_step": 535306, "epoch": 6449} {"train_loss": -27.5225830078125, "global_step": 535307, "epoch": 6449} {"train_loss": -27.66605567932129, "global_step": 535308, "epoch": 6449} {"train_loss": -27.49494743347168, "global_step": 535309, "epoch": 6449} {"train_loss": -27.761219024658203, "global_step": 535310, "epoch": 6449} {"train_loss": -27.74201774597168, "global_step": 535311, "epoch": 6449} {"train_loss": -27.775365829467773, "global_step": 535312, "epoch": 6449} {"train_loss": -27.183401107788086, "global_step": 535313, "epoch": 6449} {"train_loss": -27.223981857299805, "global_step": 535314, "epoch": 6449} {"train_loss": -27.369760513305664, "global_step": 535315, "epoch": 6449} {"train_loss": -27.679086685180664, "global_step": 535316, "epoch": 6449} {"train_loss": -27.736011505126953, "global_step": 535317, "epoch": 6449} {"train_loss": -27.767393112182617, "global_step": 535318, "epoch": 6449} {"train_loss": -27.36163902282715, "global_step": 535319, "epoch": 6449} {"train_loss": -27.83721923828125, "global_step": 535320, "epoch": 6449} {"train_loss": -27.408832550048828, "global_step": 535321, "epoch": 6449} {"train_loss": -27.416351318359375, "global_step": 535322, "epoch": 6449} {"train_loss": -27.49357032775879, "global_step": 535323, "epoch": 6449} {"train_loss": -27.747262954711914, "global_step": 535324, "epoch": 6449} {"train_loss": -27.901935577392578, "global_step": 535325, "epoch": 6449} {"train_loss": -27.662954330444336, "global_step": 535326, "epoch": 6449} {"train_loss": -27.279462814331055, "global_step": 535327, "epoch": 6449} {"train_loss": -27.463363647460938, "global_step": 535328, "epoch": 6449} {"train_loss": -27.268310546875, "global_step": 535329, "epoch": 6449} {"train_loss": -27.549726486206055, "global_step": 535330, "epoch": 6449} {"train_loss": -27.61604118347168, "global_step": 535331, "epoch": 6449} {"train_loss": -27.682016372680664, "global_step": 535332, "epoch": 6449} {"train_loss": -27.76045036315918, "global_step": 535333, "epoch": 6449} {"train_loss": -27.59765625, "global_step": 535334, "epoch": 6449} {"train_loss": -27.439090728759766, "global_step": 535335, "epoch": 6449} {"train_loss": -27.735315322875977, "global_step": 535336, "epoch": 6449} {"train_loss": -27.379352569580078, "global_step": 535337, "epoch": 6449} {"train_loss": -27.750051498413086, "global_step": 535338, "epoch": 6449} {"train_loss": -27.44891357421875, "global_step": 535339, "epoch": 6449} {"train_loss": -27.38028335571289, "global_step": 535340, "epoch": 6449} {"train_loss": -27.658374786376953, "global_step": 535341, "epoch": 6449} {"train_loss": -27.514936447143555, "global_step": 535342, "epoch": 6449} {"train_loss": -27.9514102935791, "global_step": 535343, "epoch": 6449} {"train_loss": -27.9797420501709, "global_step": 535344, "epoch": 6449} {"train_loss": -27.742170333862305, "global_step": 535345, "epoch": 6449} {"train_loss": -27.84064292907715, "global_step": 535346, "epoch": 6449} {"train_loss": -27.232166290283203, "global_step": 535347, "epoch": 6449} {"train_loss": -27.080184936523438, "global_step": 535348, "epoch": 6449} {"train_loss": -27.50640593379377, "global_step": 535349, "epoch": 6449, "val_loss": 6476896.0} {"train_loss": -25.098623275756836, "global_step": 535350, "epoch": 6450} {"train_loss": -24.315265655517578, "global_step": 535351, "epoch": 6450} {"train_loss": -25.947162628173828, "global_step": 535352, "epoch": 6450} {"train_loss": -26.38044548034668, "global_step": 535353, "epoch": 6450} {"train_loss": -25.802082061767578, "global_step": 535354, "epoch": 6450} {"train_loss": -26.848739624023438, "global_step": 535355, "epoch": 6450} {"train_loss": -25.83133888244629, "global_step": 535356, "epoch": 6450} {"train_loss": -26.779876708984375, "global_step": 535357, "epoch": 6450} {"train_loss": -26.658803939819336, "global_step": 535358, "epoch": 6450} {"train_loss": -26.96441078186035, "global_step": 535359, "epoch": 6450} {"train_loss": -26.763113021850586, "global_step": 535360, "epoch": 6450} {"train_loss": -27.225666046142578, "global_step": 535361, "epoch": 6450} {"train_loss": -26.709796905517578, "global_step": 535362, "epoch": 6450} {"train_loss": -27.23209571838379, "global_step": 535363, "epoch": 6450} {"train_loss": -26.9249267578125, "global_step": 535364, "epoch": 6450} {"train_loss": -27.022024154663086, "global_step": 535365, "epoch": 6450} {"train_loss": -26.895410537719727, "global_step": 535366, "epoch": 6450} {"train_loss": -26.897825241088867, "global_step": 535367, "epoch": 6450} {"train_loss": -26.715290069580078, "global_step": 535368, "epoch": 6450} {"train_loss": -26.959259033203125, "global_step": 535369, "epoch": 6450} {"train_loss": -27.739538192749023, "global_step": 535370, "epoch": 6450} {"train_loss": -26.97625160217285, "global_step": 535371, "epoch": 6450} {"train_loss": -27.275747299194336, "global_step": 535372, "epoch": 6450} {"train_loss": -27.141172409057617, "global_step": 535373, "epoch": 6450} {"train_loss": -27.481916427612305, "global_step": 535374, "epoch": 6450} {"train_loss": -27.372802734375, "global_step": 535375, "epoch": 6450} {"train_loss": -27.114667892456055, "global_step": 535376, "epoch": 6450} {"train_loss": -27.555517196655273, "global_step": 535377, "epoch": 6450} {"train_loss": -27.29026222229004, "global_step": 535378, "epoch": 6450} {"train_loss": -27.53968620300293, "global_step": 535379, "epoch": 6450} {"train_loss": -27.529987335205078, "global_step": 535380, "epoch": 6450} {"train_loss": -27.379592895507812, "global_step": 535381, "epoch": 6450} {"train_loss": -27.152530670166016, "global_step": 535382, "epoch": 6450} {"train_loss": -27.599531173706055, "global_step": 535383, "epoch": 6450} {"train_loss": -27.59657096862793, "global_step": 535384, "epoch": 6450} {"train_loss": -27.869150161743164, "global_step": 535385, "epoch": 6450} {"train_loss": -27.6563720703125, "global_step": 535386, "epoch": 6450} {"train_loss": -27.563199996948242, "global_step": 535387, "epoch": 6450} {"train_loss": -27.791479110717773, "global_step": 535388, "epoch": 6450} {"train_loss": -27.480756759643555, "global_step": 535389, "epoch": 6450} {"train_loss": -27.510223388671875, "global_step": 535390, "epoch": 6450} {"train_loss": -27.537221908569336, "global_step": 535391, "epoch": 6450} {"train_loss": -27.751089096069336, "global_step": 535392, "epoch": 6450} {"train_loss": -27.626453399658203, "global_step": 535393, "epoch": 6450} {"train_loss": -27.752471923828125, "global_step": 535394, "epoch": 6450} {"train_loss": -27.789295196533203, "global_step": 535395, "epoch": 6450} {"train_loss": -28.04669189453125, "global_step": 535396, "epoch": 6450} {"train_loss": -27.565509796142578, "global_step": 535397, "epoch": 6450} {"train_loss": -27.87412452697754, "global_step": 535398, "epoch": 6450} {"train_loss": -28.004236221313477, "global_step": 535399, "epoch": 6450} {"train_loss": -27.70867919921875, "global_step": 535400, "epoch": 6450} {"train_loss": -27.826339721679688, "global_step": 535401, "epoch": 6450} {"train_loss": -27.980009078979492, "global_step": 535402, "epoch": 6450} {"train_loss": -27.678024291992188, "global_step": 535403, "epoch": 6450} {"train_loss": -27.785608291625977, "global_step": 535404, "epoch": 6450} {"train_loss": -27.894269943237305, "global_step": 535405, "epoch": 6450} {"train_loss": -28.20751953125, "global_step": 535406, "epoch": 6450} {"train_loss": -27.976791381835938, "global_step": 535407, "epoch": 6450} {"train_loss": -27.900754928588867, "global_step": 535408, "epoch": 6450} {"train_loss": -27.92718505859375, "global_step": 535409, "epoch": 6450} {"train_loss": -27.19529151916504, "global_step": 535410, "epoch": 6450} {"train_loss": -26.767507553100586, "global_step": 535411, "epoch": 6450} {"train_loss": -24.727487564086914, "global_step": 535412, "epoch": 6450} {"train_loss": -23.233631134033203, "global_step": 535413, "epoch": 6450} {"train_loss": -24.891809463500977, "global_step": 535414, "epoch": 6450} {"train_loss": -25.46723747253418, "global_step": 535415, "epoch": 6450} {"train_loss": -25.014389038085938, "global_step": 535416, "epoch": 6450} {"train_loss": -26.54961585998535, "global_step": 535417, "epoch": 6450} {"train_loss": -25.7723331451416, "global_step": 535418, "epoch": 6450} {"train_loss": -26.824689865112305, "global_step": 535419, "epoch": 6450} {"train_loss": -26.240041732788086, "global_step": 535420, "epoch": 6450} {"train_loss": -26.86407470703125, "global_step": 535421, "epoch": 6450} {"train_loss": -26.50885009765625, "global_step": 535422, "epoch": 6450} {"train_loss": -26.8373966217041, "global_step": 535423, "epoch": 6450} {"train_loss": -26.564178466796875, "global_step": 535424, "epoch": 6450} {"train_loss": -26.8990421295166, "global_step": 535425, "epoch": 6450} {"train_loss": -26.775299072265625, "global_step": 535426, "epoch": 6450} {"train_loss": -27.031667709350586, "global_step": 535427, "epoch": 6450} {"train_loss": -27.330244064331055, "global_step": 535428, "epoch": 6450} {"train_loss": -27.29412269592285, "global_step": 535429, "epoch": 6450} {"train_loss": -26.988300323486328, "global_step": 535430, "epoch": 6450} {"train_loss": -26.99711036682129, "global_step": 535431, "epoch": 6450} {"train_loss": -27.00834313358169, "global_step": 535432, "epoch": 6450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 6470158.0} {"train_loss": -26.825056076049805, "global_step": 535433, "epoch": 6451} {"train_loss": -26.991199493408203, "global_step": 535434, "epoch": 6451} {"train_loss": -26.838214874267578, "global_step": 535435, "epoch": 6451} {"train_loss": -26.76991844177246, "global_step": 535436, "epoch": 6451} {"train_loss": -27.051258087158203, "global_step": 535437, "epoch": 6451} {"train_loss": -26.72568702697754, "global_step": 535438, "epoch": 6451} {"train_loss": -26.826080322265625, "global_step": 535439, "epoch": 6451} {"train_loss": -26.606765747070312, "global_step": 535440, "epoch": 6451} {"train_loss": -27.065174102783203, "global_step": 535441, "epoch": 6451} {"train_loss": -27.19776725769043, "global_step": 535442, "epoch": 6451} {"train_loss": -27.134557723999023, "global_step": 535443, "epoch": 6451} {"train_loss": -27.198974609375, "global_step": 535444, "epoch": 6451} {"train_loss": -27.38214111328125, "global_step": 535445, "epoch": 6451} {"train_loss": -27.05422019958496, "global_step": 535446, "epoch": 6451} {"train_loss": -27.423749923706055, "global_step": 535447, "epoch": 6451} {"train_loss": -27.4982852935791, "global_step": 535448, "epoch": 6451} {"train_loss": -27.36431884765625, "global_step": 535449, "epoch": 6451} {"train_loss": -27.438047409057617, "global_step": 535450, "epoch": 6451} {"train_loss": -27.240095138549805, "global_step": 535451, "epoch": 6451} {"train_loss": -27.360559463500977, "global_step": 535452, "epoch": 6451} {"train_loss": -27.111984252929688, "global_step": 535453, "epoch": 6451} {"train_loss": -27.489349365234375, "global_step": 535454, "epoch": 6451} {"train_loss": -27.241016387939453, "global_step": 535455, "epoch": 6451} {"train_loss": -27.734872817993164, "global_step": 535456, "epoch": 6451} {"train_loss": -27.471418380737305, "global_step": 535457, "epoch": 6451} {"train_loss": -27.49299430847168, "global_step": 535458, "epoch": 6451} {"train_loss": -27.581045150756836, "global_step": 535459, "epoch": 6451} {"train_loss": -27.793121337890625, "global_step": 535460, "epoch": 6451} {"train_loss": -27.890277862548828, "global_step": 535461, "epoch": 6451} {"train_loss": -27.709257125854492, "global_step": 535462, "epoch": 6451} {"train_loss": -27.5015811920166, "global_step": 535463, "epoch": 6451} {"train_loss": -27.5323429107666, "global_step": 535464, "epoch": 6451} {"train_loss": -27.691869735717773, "global_step": 535465, "epoch": 6451} {"train_loss": -27.71160316467285, "global_step": 535466, "epoch": 6451} {"train_loss": -27.420629501342773, "global_step": 535467, "epoch": 6451} {"train_loss": -27.906667709350586, "global_step": 535468, "epoch": 6451} {"train_loss": -27.447736740112305, "global_step": 535469, "epoch": 6451} {"train_loss": -28.086978912353516, "global_step": 535470, "epoch": 6451} {"train_loss": -27.78773307800293, "global_step": 535471, "epoch": 6451} {"train_loss": -27.51946449279785, "global_step": 535472, "epoch": 6451} {"train_loss": -27.83343505859375, "global_step": 535473, "epoch": 6451} {"train_loss": -27.83485221862793, "global_step": 535474, "epoch": 6451} {"train_loss": -27.573514938354492, "global_step": 535475, "epoch": 6451} {"train_loss": -27.589197158813477, "global_step": 535476, "epoch": 6451} {"train_loss": -27.82025718688965, "global_step": 535477, "epoch": 6451} {"train_loss": -27.207509994506836, "global_step": 535478, "epoch": 6451} {"train_loss": -28.00103187561035, "global_step": 535479, "epoch": 6451} {"train_loss": -27.633955001831055, "global_step": 535480, "epoch": 6451} {"train_loss": -27.68399429321289, "global_step": 535481, "epoch": 6451} {"train_loss": -27.639089584350586, "global_step": 535482, "epoch": 6451} {"train_loss": -27.740283966064453, "global_step": 535483, "epoch": 6451} {"train_loss": -27.45121192932129, "global_step": 535484, "epoch": 6451} {"train_loss": -27.655460357666016, "global_step": 535485, "epoch": 6451} {"train_loss": -27.761144638061523, "global_step": 535486, "epoch": 6451} {"train_loss": -27.487722396850586, "global_step": 535487, "epoch": 6451} {"train_loss": -27.309375762939453, "global_step": 535488, "epoch": 6451} {"train_loss": -27.501632690429688, "global_step": 535489, "epoch": 6451} {"train_loss": -27.267169952392578, "global_step": 535490, "epoch": 6451} {"train_loss": -27.530195236206055, "global_step": 535491, "epoch": 6451} {"train_loss": -28.01630973815918, "global_step": 535492, "epoch": 6451} {"train_loss": -27.625690460205078, "global_step": 535493, "epoch": 6451} {"train_loss": -27.337209701538086, "global_step": 535494, "epoch": 6451} {"train_loss": -27.542661666870117, "global_step": 535495, "epoch": 6451} {"train_loss": -28.024145126342773, "global_step": 535496, "epoch": 6451} {"train_loss": -27.868017196655273, "global_step": 535497, "epoch": 6451} {"train_loss": -27.429981231689453, "global_step": 535498, "epoch": 6451} {"train_loss": -27.83717918395996, "global_step": 535499, "epoch": 6451} {"train_loss": -27.740203857421875, "global_step": 535500, "epoch": 6451} {"train_loss": -27.538110733032227, "global_step": 535501, "epoch": 6451} {"train_loss": -27.660400390625, "global_step": 535502, "epoch": 6451} {"train_loss": -27.673307418823242, "global_step": 535503, "epoch": 6451} {"train_loss": -27.583881378173828, "global_step": 535504, "epoch": 6451} {"train_loss": -27.675561904907227, "global_step": 535505, "epoch": 6451} {"train_loss": -27.45896339416504, "global_step": 535506, "epoch": 6451} {"train_loss": -27.934560775756836, "global_step": 535507, "epoch": 6451} {"train_loss": -27.284460067749023, "global_step": 535508, "epoch": 6451} {"train_loss": -27.818817138671875, "global_step": 535509, "epoch": 6451} {"train_loss": -27.982288360595703, "global_step": 535510, "epoch": 6451} {"train_loss": -27.731962203979492, "global_step": 535511, "epoch": 6451} {"train_loss": -27.716861724853516, "global_step": 535512, "epoch": 6451} {"train_loss": -27.86163330078125, "global_step": 535513, "epoch": 6451} {"train_loss": -28.089008331298828, "global_step": 535514, "epoch": 6451} {"train_loss": -27.518597177712316, "global_step": 535515, "epoch": 6451, "val_loss": 6400199.0} {"train_loss": -27.241668701171875, "global_step": 535516, "epoch": 6452} {"train_loss": -26.915374755859375, "global_step": 535517, "epoch": 6452} {"train_loss": -27.021215438842773, "global_step": 535518, "epoch": 6452} {"train_loss": -27.0550594329834, "global_step": 535519, "epoch": 6452} {"train_loss": -26.50669288635254, "global_step": 535520, "epoch": 6452} {"train_loss": -27.424097061157227, "global_step": 535521, "epoch": 6452} {"train_loss": -26.91385841369629, "global_step": 535522, "epoch": 6452} {"train_loss": -27.08234977722168, "global_step": 535523, "epoch": 6452} {"train_loss": -27.06863784790039, "global_step": 535524, "epoch": 6452} {"train_loss": -27.4708194732666, "global_step": 535525, "epoch": 6452} {"train_loss": -27.490848541259766, "global_step": 535526, "epoch": 6452} {"train_loss": -27.237781524658203, "global_step": 535527, "epoch": 6452} {"train_loss": -27.074081420898438, "global_step": 535528, "epoch": 6452} {"train_loss": -27.16229248046875, "global_step": 535529, "epoch": 6452} {"train_loss": -27.56135368347168, "global_step": 535530, "epoch": 6452} {"train_loss": -27.609586715698242, "global_step": 535531, "epoch": 6452} {"train_loss": -27.488378524780273, "global_step": 535532, "epoch": 6452} {"train_loss": -27.72267723083496, "global_step": 535533, "epoch": 6452} {"train_loss": -27.300649642944336, "global_step": 535534, "epoch": 6452} {"train_loss": -27.679248809814453, "global_step": 535535, "epoch": 6452} {"train_loss": -27.411285400390625, "global_step": 535536, "epoch": 6452} {"train_loss": -27.097946166992188, "global_step": 535537, "epoch": 6452} {"train_loss": -27.635486602783203, "global_step": 535538, "epoch": 6452} {"train_loss": -27.53195571899414, "global_step": 535539, "epoch": 6452} {"train_loss": -27.827123641967773, "global_step": 535540, "epoch": 6452} {"train_loss": -27.485776901245117, "global_step": 535541, "epoch": 6452} {"train_loss": -27.701099395751953, "global_step": 535542, "epoch": 6452} {"train_loss": -27.652618408203125, "global_step": 535543, "epoch": 6452} {"train_loss": -27.6905574798584, "global_step": 535544, "epoch": 6452} {"train_loss": -27.51324462890625, "global_step": 535545, "epoch": 6452} {"train_loss": -27.500158309936523, "global_step": 535546, "epoch": 6452} {"train_loss": -27.69361686706543, "global_step": 535547, "epoch": 6452} {"train_loss": -27.83616065979004, "global_step": 535548, "epoch": 6452} {"train_loss": -27.6214542388916, "global_step": 535549, "epoch": 6452} {"train_loss": -27.599781036376953, "global_step": 535550, "epoch": 6452} {"train_loss": -27.8104248046875, "global_step": 535551, "epoch": 6452} {"train_loss": -28.028539657592773, "global_step": 535552, "epoch": 6452} {"train_loss": -27.660907745361328, "global_step": 535553, "epoch": 6452} {"train_loss": -27.589202880859375, "global_step": 535554, "epoch": 6452} {"train_loss": -27.507801055908203, "global_step": 535555, "epoch": 6452} {"train_loss": -27.5963191986084, "global_step": 535556, "epoch": 6452} {"train_loss": -28.137678146362305, "global_step": 535557, "epoch": 6452} {"train_loss": -27.67885398864746, "global_step": 535558, "epoch": 6452} {"train_loss": -27.574323654174805, "global_step": 535559, "epoch": 6452} {"train_loss": -27.436079025268555, "global_step": 535560, "epoch": 6452} {"train_loss": -27.904455184936523, "global_step": 535561, "epoch": 6452} {"train_loss": -27.77377700805664, "global_step": 535562, "epoch": 6452} {"train_loss": -27.904172897338867, "global_step": 535563, "epoch": 6452} {"train_loss": -28.0020694732666, "global_step": 535564, "epoch": 6452} {"train_loss": -27.868549346923828, "global_step": 535565, "epoch": 6452} {"train_loss": -27.912857055664062, "global_step": 535566, "epoch": 6452} {"train_loss": -27.542377471923828, "global_step": 535567, "epoch": 6452} {"train_loss": -26.951618194580078, "global_step": 535568, "epoch": 6452} {"train_loss": -28.09963035583496, "global_step": 535569, "epoch": 6452} {"train_loss": -27.746145248413086, "global_step": 535570, "epoch": 6452} {"train_loss": -27.678369522094727, "global_step": 535571, "epoch": 6452} {"train_loss": -27.535181045532227, "global_step": 535572, "epoch": 6452} {"train_loss": -27.5703067779541, "global_step": 535573, "epoch": 6452} {"train_loss": -27.80449867248535, "global_step": 535574, "epoch": 6452} {"train_loss": -27.377639770507812, "global_step": 535575, "epoch": 6452} {"train_loss": -27.368927001953125, "global_step": 535576, "epoch": 6452} {"train_loss": -27.869647979736328, "global_step": 535577, "epoch": 6452} {"train_loss": -27.3323974609375, "global_step": 535578, "epoch": 6452} {"train_loss": -27.579181671142578, "global_step": 535579, "epoch": 6452} {"train_loss": -27.75982666015625, "global_step": 535580, "epoch": 6452} {"train_loss": -27.723867416381836, "global_step": 535581, "epoch": 6452} {"train_loss": -27.47348403930664, "global_step": 535582, "epoch": 6452} {"train_loss": -27.90488624572754, "global_step": 535583, "epoch": 6452} {"train_loss": -27.660663604736328, "global_step": 535584, "epoch": 6452} {"train_loss": -27.5195369720459, "global_step": 535585, "epoch": 6452} {"train_loss": -27.756103515625, "global_step": 535586, "epoch": 6452} {"train_loss": -27.720556259155273, "global_step": 535587, "epoch": 6452} {"train_loss": -27.783374786376953, "global_step": 535588, "epoch": 6452} {"train_loss": -27.693124771118164, "global_step": 535589, "epoch": 6452} {"train_loss": -27.669958114624023, "global_step": 535590, "epoch": 6452} {"train_loss": -27.69269371032715, "global_step": 535591, "epoch": 6452} {"train_loss": -27.5830020904541, "global_step": 535592, "epoch": 6452} {"train_loss": -27.472272872924805, "global_step": 535593, "epoch": 6452} {"train_loss": -27.73968505859375, "global_step": 535594, "epoch": 6452} {"train_loss": -27.4399471282959, "global_step": 535595, "epoch": 6452} {"train_loss": -27.4494686126709, "global_step": 535596, "epoch": 6452} {"train_loss": -27.510608673095703, "global_step": 535597, "epoch": 6452} {"train_loss": -27.56165713574513, "global_step": 535598, "epoch": 6452, "val_loss": 6456117.5} {"train_loss": -26.903594970703125, "global_step": 535599, "epoch": 6453} {"train_loss": -24.96582794189453, "global_step": 535600, "epoch": 6453} {"train_loss": -24.04054832458496, "global_step": 535601, "epoch": 6453} {"train_loss": -25.26545524597168, "global_step": 535602, "epoch": 6453} {"train_loss": -27.014957427978516, "global_step": 535603, "epoch": 6453} {"train_loss": -26.174219131469727, "global_step": 535604, "epoch": 6453} {"train_loss": -26.551572799682617, "global_step": 535605, "epoch": 6453} {"train_loss": -26.060407638549805, "global_step": 535606, "epoch": 6453} {"train_loss": -26.836252212524414, "global_step": 535607, "epoch": 6453} {"train_loss": -26.515228271484375, "global_step": 535608, "epoch": 6453} {"train_loss": -26.816984176635742, "global_step": 535609, "epoch": 6453} {"train_loss": -26.516742706298828, "global_step": 535610, "epoch": 6453} {"train_loss": -26.70796012878418, "global_step": 535611, "epoch": 6453} {"train_loss": -27.090646743774414, "global_step": 535612, "epoch": 6453} {"train_loss": -26.74934196472168, "global_step": 535613, "epoch": 6453} {"train_loss": -27.0185546875, "global_step": 535614, "epoch": 6453} {"train_loss": -27.10772705078125, "global_step": 535615, "epoch": 6453} {"train_loss": -26.7698974609375, "global_step": 535616, "epoch": 6453} {"train_loss": -27.130939483642578, "global_step": 535617, "epoch": 6453} {"train_loss": -27.055322647094727, "global_step": 535618, "epoch": 6453} {"train_loss": -27.400012969970703, "global_step": 535619, "epoch": 6453} {"train_loss": -27.378278732299805, "global_step": 535620, "epoch": 6453} {"train_loss": -27.009817123413086, "global_step": 535621, "epoch": 6453} {"train_loss": -27.155698776245117, "global_step": 535622, "epoch": 6453} {"train_loss": -27.300058364868164, "global_step": 535623, "epoch": 6453} {"train_loss": -27.198444366455078, "global_step": 535624, "epoch": 6453} {"train_loss": -27.462644577026367, "global_step": 535625, "epoch": 6453} {"train_loss": -27.174991607666016, "global_step": 535626, "epoch": 6453} {"train_loss": -27.309741973876953, "global_step": 535627, "epoch": 6453} {"train_loss": -27.327436447143555, "global_step": 535628, "epoch": 6453} {"train_loss": -27.147851943969727, "global_step": 535629, "epoch": 6453} {"train_loss": -27.744531631469727, "global_step": 535630, "epoch": 6453} {"train_loss": -27.12006950378418, "global_step": 535631, "epoch": 6453} {"train_loss": -27.145313262939453, "global_step": 535632, "epoch": 6453} {"train_loss": -27.2546443939209, "global_step": 535633, "epoch": 6453} {"train_loss": -27.36524772644043, "global_step": 535634, "epoch": 6453} {"train_loss": -27.509286880493164, "global_step": 535635, "epoch": 6453} {"train_loss": -27.525732040405273, "global_step": 535636, "epoch": 6453} {"train_loss": -27.15327262878418, "global_step": 535637, "epoch": 6453} {"train_loss": -27.38101577758789, "global_step": 535638, "epoch": 6453} {"train_loss": -27.09871482849121, "global_step": 535639, "epoch": 6453} {"train_loss": -27.368799209594727, "global_step": 535640, "epoch": 6453} {"train_loss": -27.44573974609375, "global_step": 535641, "epoch": 6453} {"train_loss": -27.42962074279785, "global_step": 535642, "epoch": 6453} {"train_loss": -27.644241333007812, "global_step": 535643, "epoch": 6453} {"train_loss": -27.282581329345703, "global_step": 535644, "epoch": 6453} {"train_loss": -27.493986129760742, "global_step": 535645, "epoch": 6453} {"train_loss": -27.58837890625, "global_step": 535646, "epoch": 6453} {"train_loss": -27.969640731811523, "global_step": 535647, "epoch": 6453} {"train_loss": -27.97849464416504, "global_step": 535648, "epoch": 6453} {"train_loss": -27.627649307250977, "global_step": 535649, "epoch": 6453} {"train_loss": -27.993728637695312, "global_step": 535650, "epoch": 6453} {"train_loss": -27.96735191345215, "global_step": 535651, "epoch": 6453} {"train_loss": -27.868000030517578, "global_step": 535652, "epoch": 6453} {"train_loss": -28.004064559936523, "global_step": 535653, "epoch": 6453} {"train_loss": -27.876020431518555, "global_step": 535654, "epoch": 6453} {"train_loss": -27.758970260620117, "global_step": 535655, "epoch": 6453} {"train_loss": -28.067005157470703, "global_step": 535656, "epoch": 6453} {"train_loss": -27.821115493774414, "global_step": 535657, "epoch": 6453} {"train_loss": -28.02656364440918, "global_step": 535658, "epoch": 6453} {"train_loss": -27.820026397705078, "global_step": 535659, "epoch": 6453} {"train_loss": -27.763036727905273, "global_step": 535660, "epoch": 6453} {"train_loss": -28.07729148864746, "global_step": 535661, "epoch": 6453} {"train_loss": -27.743072509765625, "global_step": 535662, "epoch": 6453} {"train_loss": -27.76800537109375, "global_step": 535663, "epoch": 6453} {"train_loss": -27.526611328125, "global_step": 535664, "epoch": 6453} {"train_loss": -27.23219108581543, "global_step": 535665, "epoch": 6453} {"train_loss": -27.858388900756836, "global_step": 535666, "epoch": 6453} {"train_loss": -27.976423263549805, "global_step": 535667, "epoch": 6453} {"train_loss": -27.331623077392578, "global_step": 535668, "epoch": 6453} {"train_loss": -28.006942749023438, "global_step": 535669, "epoch": 6453} {"train_loss": -27.851428985595703, "global_step": 535670, "epoch": 6453} {"train_loss": -27.84601402282715, "global_step": 535671, "epoch": 6453} {"train_loss": -27.6992130279541, "global_step": 535672, "epoch": 6453} {"train_loss": -27.60501480102539, "global_step": 535673, "epoch": 6453} {"train_loss": -27.66497802734375, "global_step": 535674, "epoch": 6453} {"train_loss": -27.781360626220703, "global_step": 535675, "epoch": 6453} {"train_loss": -27.373291015625, "global_step": 535676, "epoch": 6453} {"train_loss": -27.66536521911621, "global_step": 535677, "epoch": 6453} {"train_loss": -27.806549072265625, "global_step": 535678, "epoch": 6453} {"train_loss": -27.767240524291992, "global_step": 535679, "epoch": 6453} {"train_loss": -27.824941635131836, "global_step": 535680, "epoch": 6453} {"train_loss": -27.323851872639484, "global_step": 535681, "epoch": 6453, "val_loss": 6438565.0} {"train_loss": -27.08210563659668, "global_step": 535682, "epoch": 6454} {"train_loss": -26.836517333984375, "global_step": 535683, "epoch": 6454} {"train_loss": -26.906896591186523, "global_step": 535684, "epoch": 6454} {"train_loss": -26.840696334838867, "global_step": 535685, "epoch": 6454} {"train_loss": -27.342548370361328, "global_step": 535686, "epoch": 6454} {"train_loss": -26.73927879333496, "global_step": 535687, "epoch": 6454} {"train_loss": -27.23335075378418, "global_step": 535688, "epoch": 6454} {"train_loss": -26.832120895385742, "global_step": 535689, "epoch": 6454} {"train_loss": -26.970600128173828, "global_step": 535690, "epoch": 6454} {"train_loss": -27.447256088256836, "global_step": 535691, "epoch": 6454} {"train_loss": -27.459564208984375, "global_step": 535692, "epoch": 6454} {"train_loss": -27.09938621520996, "global_step": 535693, "epoch": 6454} {"train_loss": -27.684356689453125, "global_step": 535694, "epoch": 6454} {"train_loss": -27.19337272644043, "global_step": 535695, "epoch": 6454} {"train_loss": -27.359088897705078, "global_step": 535696, "epoch": 6454} {"train_loss": -27.527786254882812, "global_step": 535697, "epoch": 6454} {"train_loss": -27.110736846923828, "global_step": 535698, "epoch": 6454} {"train_loss": -27.27003288269043, "global_step": 535699, "epoch": 6454} {"train_loss": -27.292556762695312, "global_step": 535700, "epoch": 6454} {"train_loss": -27.061553955078125, "global_step": 535701, "epoch": 6454} {"train_loss": -27.239652633666992, "global_step": 535702, "epoch": 6454} {"train_loss": -27.346837997436523, "global_step": 535703, "epoch": 6454} {"train_loss": -27.525419235229492, "global_step": 535704, "epoch": 6454} {"train_loss": -27.395374298095703, "global_step": 535705, "epoch": 6454} {"train_loss": -27.746479034423828, "global_step": 535706, "epoch": 6454} {"train_loss": -27.8809871673584, "global_step": 535707, "epoch": 6454} {"train_loss": -27.84588623046875, "global_step": 535708, "epoch": 6454} {"train_loss": -27.754846572875977, "global_step": 535709, "epoch": 6454} {"train_loss": -27.508756637573242, "global_step": 535710, "epoch": 6454} {"train_loss": -27.850183486938477, "global_step": 535711, "epoch": 6454} {"train_loss": -27.66021728515625, "global_step": 535712, "epoch": 6454} {"train_loss": -27.69573402404785, "global_step": 535713, "epoch": 6454} {"train_loss": -27.4816837310791, "global_step": 535714, "epoch": 6454} {"train_loss": -27.672271728515625, "global_step": 535715, "epoch": 6454} {"train_loss": -27.488554000854492, "global_step": 535716, "epoch": 6454} {"train_loss": -27.6589298248291, "global_step": 535717, "epoch": 6454} {"train_loss": -27.463302612304688, "global_step": 535718, "epoch": 6454} {"train_loss": -27.328031539916992, "global_step": 535719, "epoch": 6454} {"train_loss": -27.726327896118164, "global_step": 535720, "epoch": 6454} {"train_loss": -27.939844131469727, "global_step": 535721, "epoch": 6454} {"train_loss": -27.435331344604492, "global_step": 535722, "epoch": 6454} {"train_loss": -27.8724422454834, "global_step": 535723, "epoch": 6454} {"train_loss": -27.557281494140625, "global_step": 535724, "epoch": 6454} {"train_loss": -27.680089950561523, "global_step": 535725, "epoch": 6454} {"train_loss": -27.755878448486328, "global_step": 535726, "epoch": 6454} {"train_loss": -27.80647850036621, "global_step": 535727, "epoch": 6454} {"train_loss": -27.799673080444336, "global_step": 535728, "epoch": 6454} {"train_loss": -27.673925399780273, "global_step": 535729, "epoch": 6454} {"train_loss": -28.012598037719727, "global_step": 535730, "epoch": 6454} {"train_loss": -27.805383682250977, "global_step": 535731, "epoch": 6454} {"train_loss": -27.89174461364746, "global_step": 535732, "epoch": 6454} {"train_loss": -27.871252059936523, "global_step": 535733, "epoch": 6454} {"train_loss": -27.631061553955078, "global_step": 535734, "epoch": 6454} {"train_loss": -27.95703125, "global_step": 535735, "epoch": 6454} {"train_loss": -27.54568862915039, "global_step": 535736, "epoch": 6454} {"train_loss": -27.49268913269043, "global_step": 535737, "epoch": 6454} {"train_loss": -27.905309677124023, "global_step": 535738, "epoch": 6454} {"train_loss": -27.477161407470703, "global_step": 535739, "epoch": 6454} {"train_loss": -27.658740997314453, "global_step": 535740, "epoch": 6454} {"train_loss": -27.82929039001465, "global_step": 535741, "epoch": 6454} {"train_loss": -27.49056053161621, "global_step": 535742, "epoch": 6454} {"train_loss": -27.921234130859375, "global_step": 535743, "epoch": 6454} {"train_loss": -27.582660675048828, "global_step": 535744, "epoch": 6454} {"train_loss": -27.95285987854004, "global_step": 535745, "epoch": 6454} {"train_loss": -27.8637638092041, "global_step": 535746, "epoch": 6454} {"train_loss": -27.501340866088867, "global_step": 535747, "epoch": 6454} {"train_loss": -27.774866104125977, "global_step": 535748, "epoch": 6454} {"train_loss": -27.959808349609375, "global_step": 535749, "epoch": 6454} {"train_loss": -28.162811279296875, "global_step": 535750, "epoch": 6454} {"train_loss": -27.83322525024414, "global_step": 535751, "epoch": 6454} {"train_loss": -27.51397705078125, "global_step": 535752, "epoch": 6454} {"train_loss": -27.638525009155273, "global_step": 535753, "epoch": 6454} {"train_loss": -27.747333526611328, "global_step": 535754, "epoch": 6454} {"train_loss": -28.026153564453125, "global_step": 535755, "epoch": 6454} {"train_loss": -27.8164119720459, "global_step": 535756, "epoch": 6454} {"train_loss": -27.95000648498535, "global_step": 535757, "epoch": 6454} {"train_loss": -27.848352432250977, "global_step": 535758, "epoch": 6454} {"train_loss": -27.702362060546875, "global_step": 535759, "epoch": 6454} {"train_loss": -27.45063591003418, "global_step": 535760, "epoch": 6454} {"train_loss": -27.46427345275879, "global_step": 535761, "epoch": 6454} {"train_loss": -27.680219650268555, "global_step": 535762, "epoch": 6454} {"train_loss": -27.8677921295166, "global_step": 535763, "epoch": 6454} {"train_loss": -27.58284837653838, "global_step": 535764, "epoch": 6454, "val_loss": 6467085.5} {"train_loss": -27.20216178894043, "global_step": 535765, "epoch": 6455} {"train_loss": -27.363739013671875, "global_step": 535766, "epoch": 6455} {"train_loss": -27.35247802734375, "global_step": 535767, "epoch": 6455} {"train_loss": -27.063501358032227, "global_step": 535768, "epoch": 6455} {"train_loss": -27.489410400390625, "global_step": 535769, "epoch": 6455} {"train_loss": -27.72784423828125, "global_step": 535770, "epoch": 6455} {"train_loss": -27.194766998291016, "global_step": 535771, "epoch": 6455} {"train_loss": -27.281286239624023, "global_step": 535772, "epoch": 6455} {"train_loss": -27.272220611572266, "global_step": 535773, "epoch": 6455} {"train_loss": -27.107038497924805, "global_step": 535774, "epoch": 6455} {"train_loss": -27.305932998657227, "global_step": 535775, "epoch": 6455} {"train_loss": -26.9005126953125, "global_step": 535776, "epoch": 6455} {"train_loss": -27.08810806274414, "global_step": 535777, "epoch": 6455} {"train_loss": -27.249191284179688, "global_step": 535778, "epoch": 6455} {"train_loss": -27.42232322692871, "global_step": 535779, "epoch": 6455} {"train_loss": -27.166675567626953, "global_step": 535780, "epoch": 6455} {"train_loss": -27.48854637145996, "global_step": 535781, "epoch": 6455} {"train_loss": -27.4512882232666, "global_step": 535782, "epoch": 6455} {"train_loss": -27.87841796875, "global_step": 535783, "epoch": 6455} {"train_loss": -27.751676559448242, "global_step": 535784, "epoch": 6455} {"train_loss": -26.8536319732666, "global_step": 535785, "epoch": 6455} {"train_loss": -27.433135986328125, "global_step": 535786, "epoch": 6455} {"train_loss": -27.188955307006836, "global_step": 535787, "epoch": 6455} {"train_loss": -26.993545532226562, "global_step": 535788, "epoch": 6455} {"train_loss": -27.753742218017578, "global_step": 535789, "epoch": 6455} {"train_loss": -27.098535537719727, "global_step": 535790, "epoch": 6455} {"train_loss": -27.642919540405273, "global_step": 535791, "epoch": 6455} {"train_loss": -27.251300811767578, "global_step": 535792, "epoch": 6455} {"train_loss": -27.300817489624023, "global_step": 535793, "epoch": 6455} {"train_loss": -27.5379638671875, "global_step": 535794, "epoch": 6455} {"train_loss": -27.49546241760254, "global_step": 535795, "epoch": 6455} {"train_loss": -27.600690841674805, "global_step": 535796, "epoch": 6455} {"train_loss": -27.512693405151367, "global_step": 535797, "epoch": 6455} {"train_loss": -27.545217514038086, "global_step": 535798, "epoch": 6455} {"train_loss": -27.414274215698242, "global_step": 535799, "epoch": 6455} {"train_loss": -27.534955978393555, "global_step": 535800, "epoch": 6455} {"train_loss": -27.545948028564453, "global_step": 535801, "epoch": 6455} {"train_loss": -27.362096786499023, "global_step": 535802, "epoch": 6455} {"train_loss": -27.724872589111328, "global_step": 535803, "epoch": 6455} {"train_loss": -27.309152603149414, "global_step": 535804, "epoch": 6455} {"train_loss": -27.633636474609375, "global_step": 535805, "epoch": 6455} {"train_loss": -27.698698043823242, "global_step": 535806, "epoch": 6455} {"train_loss": -27.302087783813477, "global_step": 535807, "epoch": 6455} {"train_loss": -28.220243453979492, "global_step": 535808, "epoch": 6455} {"train_loss": -27.818403244018555, "global_step": 535809, "epoch": 6455} {"train_loss": -27.75007438659668, "global_step": 535810, "epoch": 6455} {"train_loss": -27.647985458374023, "global_step": 535811, "epoch": 6455} {"train_loss": -28.1326904296875, "global_step": 535812, "epoch": 6455} {"train_loss": -27.916339874267578, "global_step": 535813, "epoch": 6455} {"train_loss": -27.841266632080078, "global_step": 535814, "epoch": 6455} {"train_loss": -28.000675201416016, "global_step": 535815, "epoch": 6455} {"train_loss": -27.419103622436523, "global_step": 535816, "epoch": 6455} {"train_loss": -28.21107292175293, "global_step": 535817, "epoch": 6455} {"train_loss": -27.56513023376465, "global_step": 535818, "epoch": 6455} {"train_loss": -27.996397018432617, "global_step": 535819, "epoch": 6455} {"train_loss": -27.662357330322266, "global_step": 535820, "epoch": 6455} {"train_loss": -28.125024795532227, "global_step": 535821, "epoch": 6455} {"train_loss": -27.715442657470703, "global_step": 535822, "epoch": 6455} {"train_loss": -27.549741744995117, "global_step": 535823, "epoch": 6455} {"train_loss": -27.811264038085938, "global_step": 535824, "epoch": 6455} {"train_loss": -27.489288330078125, "global_step": 535825, "epoch": 6455} {"train_loss": -27.50678825378418, "global_step": 535826, "epoch": 6455} {"train_loss": -27.87627601623535, "global_step": 535827, "epoch": 6455} {"train_loss": -27.799787521362305, "global_step": 535828, "epoch": 6455} {"train_loss": -28.043577194213867, "global_step": 535829, "epoch": 6455} {"train_loss": -27.8106746673584, "global_step": 535830, "epoch": 6455} {"train_loss": -27.771713256835938, "global_step": 535831, "epoch": 6455} {"train_loss": -27.528959274291992, "global_step": 535832, "epoch": 6455} {"train_loss": -27.487018585205078, "global_step": 535833, "epoch": 6455} {"train_loss": -27.402145385742188, "global_step": 535834, "epoch": 6455} {"train_loss": -28.066665649414062, "global_step": 535835, "epoch": 6455} {"train_loss": -28.105213165283203, "global_step": 535836, "epoch": 6455} {"train_loss": -27.567340850830078, "global_step": 535837, "epoch": 6455} {"train_loss": -27.637680053710938, "global_step": 535838, "epoch": 6455} {"train_loss": -27.497610092163086, "global_step": 535839, "epoch": 6455} {"train_loss": -27.07820701599121, "global_step": 535840, "epoch": 6455} {"train_loss": -27.89751625061035, "global_step": 535841, "epoch": 6455} {"train_loss": -27.690053939819336, "global_step": 535842, "epoch": 6455} {"train_loss": -27.71355628967285, "global_step": 535843, "epoch": 6455} {"train_loss": -27.536853790283203, "global_step": 535844, "epoch": 6455} {"train_loss": -27.630292892456055, "global_step": 535845, "epoch": 6455} {"train_loss": -27.57675552368164, "global_step": 535846, "epoch": 6455} {"train_loss": -27.54394565720156, "global_step": 535847, "epoch": 6455, "val_loss": 6448419.0} {"train_loss": -27.27032470703125, "global_step": 535848, "epoch": 6456} {"train_loss": -27.313459396362305, "global_step": 535849, "epoch": 6456} {"train_loss": -26.9996395111084, "global_step": 535850, "epoch": 6456} {"train_loss": -27.658496856689453, "global_step": 535851, "epoch": 6456} {"train_loss": -27.199071884155273, "global_step": 535852, "epoch": 6456} {"train_loss": -27.02324867248535, "global_step": 535853, "epoch": 6456} {"train_loss": -27.2088623046875, "global_step": 535854, "epoch": 6456} {"train_loss": -27.204349517822266, "global_step": 535855, "epoch": 6456} {"train_loss": -27.713712692260742, "global_step": 535856, "epoch": 6456} {"train_loss": -27.397817611694336, "global_step": 535857, "epoch": 6456} {"train_loss": -27.75830078125, "global_step": 535858, "epoch": 6456} {"train_loss": -27.435760498046875, "global_step": 535859, "epoch": 6456} {"train_loss": -27.123779296875, "global_step": 535860, "epoch": 6456} {"train_loss": -27.2099552154541, "global_step": 535861, "epoch": 6456} {"train_loss": -27.739349365234375, "global_step": 535862, "epoch": 6456} {"train_loss": -27.124954223632812, "global_step": 535863, "epoch": 6456} {"train_loss": -27.38311195373535, "global_step": 535864, "epoch": 6456} {"train_loss": -27.63494300842285, "global_step": 535865, "epoch": 6456} {"train_loss": -27.810993194580078, "global_step": 535866, "epoch": 6456} {"train_loss": -27.891605377197266, "global_step": 535867, "epoch": 6456} {"train_loss": -27.963132858276367, "global_step": 535868, "epoch": 6456} {"train_loss": -27.8257999420166, "global_step": 535869, "epoch": 6456} {"train_loss": -27.44571876525879, "global_step": 535870, "epoch": 6456} {"train_loss": -28.01617431640625, "global_step": 535871, "epoch": 6456} {"train_loss": -27.819900512695312, "global_step": 535872, "epoch": 6456} {"train_loss": -27.599689483642578, "global_step": 535873, "epoch": 6456} {"train_loss": -27.576623916625977, "global_step": 535874, "epoch": 6456} {"train_loss": -27.53791618347168, "global_step": 535875, "epoch": 6456} {"train_loss": -27.60306739807129, "global_step": 535876, "epoch": 6456} {"train_loss": -28.04610252380371, "global_step": 535877, "epoch": 6456} {"train_loss": -27.717639923095703, "global_step": 535878, "epoch": 6456} {"train_loss": -27.637319564819336, "global_step": 535879, "epoch": 6456} {"train_loss": -28.020109176635742, "global_step": 535880, "epoch": 6456} {"train_loss": -27.871337890625, "global_step": 535881, "epoch": 6456} {"train_loss": -27.75933265686035, "global_step": 535882, "epoch": 6456} {"train_loss": -27.925283432006836, "global_step": 535883, "epoch": 6456} {"train_loss": -27.9807186126709, "global_step": 535884, "epoch": 6456} {"train_loss": -27.935129165649414, "global_step": 535885, "epoch": 6456} {"train_loss": -27.89240837097168, "global_step": 535886, "epoch": 6456} {"train_loss": -27.64426040649414, "global_step": 535887, "epoch": 6456} {"train_loss": -27.792959213256836, "global_step": 535888, "epoch": 6456} {"train_loss": -27.61440086364746, "global_step": 535889, "epoch": 6456} {"train_loss": -27.6806583404541, "global_step": 535890, "epoch": 6456} {"train_loss": -27.662153244018555, "global_step": 535891, "epoch": 6456} {"train_loss": -27.377538681030273, "global_step": 535892, "epoch": 6456} {"train_loss": -27.4189453125, "global_step": 535893, "epoch": 6456} {"train_loss": -27.609039306640625, "global_step": 535894, "epoch": 6456} {"train_loss": -27.37704849243164, "global_step": 535895, "epoch": 6456} {"train_loss": -27.773801803588867, "global_step": 535896, "epoch": 6456} {"train_loss": -27.883758544921875, "global_step": 535897, "epoch": 6456} {"train_loss": -27.72991943359375, "global_step": 535898, "epoch": 6456} {"train_loss": -27.3577880859375, "global_step": 535899, "epoch": 6456} {"train_loss": -27.331396102905273, "global_step": 535900, "epoch": 6456} {"train_loss": -27.147863388061523, "global_step": 535901, "epoch": 6456} {"train_loss": -27.39713478088379, "global_step": 535902, "epoch": 6456} {"train_loss": -27.681894302368164, "global_step": 535903, "epoch": 6456} {"train_loss": -27.554052352905273, "global_step": 535904, "epoch": 6456} {"train_loss": -27.598413467407227, "global_step": 535905, "epoch": 6456} {"train_loss": -27.8617000579834, "global_step": 535906, "epoch": 6456} {"train_loss": -27.639698028564453, "global_step": 535907, "epoch": 6456} {"train_loss": -27.294448852539062, "global_step": 535908, "epoch": 6456} {"train_loss": -27.538671493530273, "global_step": 535909, "epoch": 6456} {"train_loss": -27.0128173828125, "global_step": 535910, "epoch": 6456} {"train_loss": -27.33173179626465, "global_step": 535911, "epoch": 6456} {"train_loss": -27.786468505859375, "global_step": 535912, "epoch": 6456} {"train_loss": -27.325048446655273, "global_step": 535913, "epoch": 6456} {"train_loss": -27.354663848876953, "global_step": 535914, "epoch": 6456} {"train_loss": -27.736988067626953, "global_step": 535915, "epoch": 6456} {"train_loss": -27.786426544189453, "global_step": 535916, "epoch": 6456} {"train_loss": -27.63252067565918, "global_step": 535917, "epoch": 6456} {"train_loss": -27.577411651611328, "global_step": 535918, "epoch": 6456} {"train_loss": -27.772428512573242, "global_step": 535919, "epoch": 6456} {"train_loss": -27.940526962280273, "global_step": 535920, "epoch": 6456} {"train_loss": -27.4029483795166, "global_step": 535921, "epoch": 6456} {"train_loss": -27.514606475830078, "global_step": 535922, "epoch": 6456} {"train_loss": -27.459142684936523, "global_step": 535923, "epoch": 6456} {"train_loss": -27.619836807250977, "global_step": 535924, "epoch": 6456} {"train_loss": -27.53086280822754, "global_step": 535925, "epoch": 6456} {"train_loss": -26.9836368560791, "global_step": 535926, "epoch": 6456} {"train_loss": -27.628284454345703, "global_step": 535927, "epoch": 6456} {"train_loss": -27.756086349487305, "global_step": 535928, "epoch": 6456} {"train_loss": -27.49462890625, "global_step": 535929, "epoch": 6456} {"train_loss": -27.569604505975562, "global_step": 535930, "epoch": 6456, "val_loss": 6415510.5} {"train_loss": -27.308759689331055, "global_step": 535931, "epoch": 6457} {"train_loss": -27.164213180541992, "global_step": 535932, "epoch": 6457} {"train_loss": -27.236719131469727, "global_step": 535933, "epoch": 6457} {"train_loss": -27.12287712097168, "global_step": 535934, "epoch": 6457} {"train_loss": -27.152698516845703, "global_step": 535935, "epoch": 6457} {"train_loss": -27.07013511657715, "global_step": 535936, "epoch": 6457} {"train_loss": -26.990320205688477, "global_step": 535937, "epoch": 6457} {"train_loss": -27.40669059753418, "global_step": 535938, "epoch": 6457} {"train_loss": -27.841400146484375, "global_step": 535939, "epoch": 6457} {"train_loss": -27.307477951049805, "global_step": 535940, "epoch": 6457} {"train_loss": -27.246068954467773, "global_step": 535941, "epoch": 6457} {"train_loss": -27.365997314453125, "global_step": 535942, "epoch": 6457} {"train_loss": -27.64072036743164, "global_step": 535943, "epoch": 6457} {"train_loss": -27.870208740234375, "global_step": 535944, "epoch": 6457} {"train_loss": -27.298315048217773, "global_step": 535945, "epoch": 6457} {"train_loss": -27.42268943786621, "global_step": 535946, "epoch": 6457} {"train_loss": -27.297086715698242, "global_step": 535947, "epoch": 6457} {"train_loss": -27.38404655456543, "global_step": 535948, "epoch": 6457} {"train_loss": -27.390579223632812, "global_step": 535949, "epoch": 6457} {"train_loss": -27.601093292236328, "global_step": 535950, "epoch": 6457} {"train_loss": -27.94122886657715, "global_step": 535951, "epoch": 6457} {"train_loss": -27.153594970703125, "global_step": 535952, "epoch": 6457} {"train_loss": -27.625341415405273, "global_step": 535953, "epoch": 6457} {"train_loss": -27.03049659729004, "global_step": 535954, "epoch": 6457} {"train_loss": -27.8011474609375, "global_step": 535955, "epoch": 6457} {"train_loss": -27.605005264282227, "global_step": 535956, "epoch": 6457} {"train_loss": -27.584264755249023, "global_step": 535957, "epoch": 6457} {"train_loss": -27.50837516784668, "global_step": 535958, "epoch": 6457} {"train_loss": -27.37179946899414, "global_step": 535959, "epoch": 6457} {"train_loss": -27.64851951599121, "global_step": 535960, "epoch": 6457} {"train_loss": -27.6735782623291, "global_step": 535961, "epoch": 6457} {"train_loss": -27.770980834960938, "global_step": 535962, "epoch": 6457} {"train_loss": -27.72955322265625, "global_step": 535963, "epoch": 6457} {"train_loss": -27.578161239624023, "global_step": 535964, "epoch": 6457} {"train_loss": -27.799224853515625, "global_step": 535965, "epoch": 6457} {"train_loss": -28.118017196655273, "global_step": 535966, "epoch": 6457} {"train_loss": -27.684350967407227, "global_step": 535967, "epoch": 6457} {"train_loss": -27.720783233642578, "global_step": 535968, "epoch": 6457} {"train_loss": -27.69441795349121, "global_step": 535969, "epoch": 6457} {"train_loss": -27.729185104370117, "global_step": 535970, "epoch": 6457} {"train_loss": -27.49079704284668, "global_step": 535971, "epoch": 6457} {"train_loss": -27.652057647705078, "global_step": 535972, "epoch": 6457} {"train_loss": -27.791461944580078, "global_step": 535973, "epoch": 6457} {"train_loss": -27.788776397705078, "global_step": 535974, "epoch": 6457} {"train_loss": -27.638214111328125, "global_step": 535975, "epoch": 6457} {"train_loss": -27.930633544921875, "global_step": 535976, "epoch": 6457} {"train_loss": -27.52585792541504, "global_step": 535977, "epoch": 6457} {"train_loss": -27.050994873046875, "global_step": 535978, "epoch": 6457} {"train_loss": -26.794843673706055, "global_step": 535979, "epoch": 6457} {"train_loss": -26.498762130737305, "global_step": 535980, "epoch": 6457} {"train_loss": -25.118223190307617, "global_step": 535981, "epoch": 6457} {"train_loss": -24.881540298461914, "global_step": 535982, "epoch": 6457} {"train_loss": -26.890243530273438, "global_step": 535983, "epoch": 6457} {"train_loss": -27.288217544555664, "global_step": 535984, "epoch": 6457} {"train_loss": -26.656808853149414, "global_step": 535985, "epoch": 6457} {"train_loss": -27.0306396484375, "global_step": 535986, "epoch": 6457} {"train_loss": -27.02836036682129, "global_step": 535987, "epoch": 6457} {"train_loss": -27.11910057067871, "global_step": 535988, "epoch": 6457} {"train_loss": -27.199569702148438, "global_step": 535989, "epoch": 6457} {"train_loss": -27.287763595581055, "global_step": 535990, "epoch": 6457} {"train_loss": -26.97235107421875, "global_step": 535991, "epoch": 6457} {"train_loss": -27.3510684967041, "global_step": 535992, "epoch": 6457} {"train_loss": -27.23341941833496, "global_step": 535993, "epoch": 6457} {"train_loss": -27.08926773071289, "global_step": 535994, "epoch": 6457} {"train_loss": -27.4644775390625, "global_step": 535995, "epoch": 6457} {"train_loss": -27.284082412719727, "global_step": 535996, "epoch": 6457} {"train_loss": -27.7386531829834, "global_step": 535997, "epoch": 6457} {"train_loss": -27.239151000976562, "global_step": 535998, "epoch": 6457} {"train_loss": -27.619230270385742, "global_step": 535999, "epoch": 6457} {"train_loss": -27.249631881713867, "global_step": 536000, "epoch": 6457} {"train_loss": -27.494592666625977, "global_step": 536001, "epoch": 6457} {"train_loss": -27.7154483795166, "global_step": 536002, "epoch": 6457} {"train_loss": -27.14508056640625, "global_step": 536003, "epoch": 6457} {"train_loss": -27.206562042236328, "global_step": 536004, "epoch": 6457} {"train_loss": -27.360822677612305, "global_step": 536005, "epoch": 6457} {"train_loss": -27.732086181640625, "global_step": 536006, "epoch": 6457} {"train_loss": -27.405424118041992, "global_step": 536007, "epoch": 6457} {"train_loss": -27.71771240234375, "global_step": 536008, "epoch": 6457} {"train_loss": -27.736474990844727, "global_step": 536009, "epoch": 6457} {"train_loss": -27.826080322265625, "global_step": 536010, "epoch": 6457} {"train_loss": -27.6649227142334, "global_step": 536011, "epoch": 6457} {"train_loss": -27.569616317749023, "global_step": 536012, "epoch": 6457} {"train_loss": -27.37952703452972, "global_step": 536013, "epoch": 6457, "val_loss": 6485652.0} {"train_loss": -27.469104766845703, "global_step": 536014, "epoch": 6458} {"train_loss": -27.028722763061523, "global_step": 536015, "epoch": 6458} {"train_loss": -27.16922378540039, "global_step": 536016, "epoch": 6458} {"train_loss": -27.622833251953125, "global_step": 536017, "epoch": 6458} {"train_loss": -26.80817985534668, "global_step": 536018, "epoch": 6458} {"train_loss": -27.040746688842773, "global_step": 536019, "epoch": 6458} {"train_loss": -26.957538604736328, "global_step": 536020, "epoch": 6458} {"train_loss": -27.38427734375, "global_step": 536021, "epoch": 6458} {"train_loss": -27.470006942749023, "global_step": 536022, "epoch": 6458} {"train_loss": -26.898502349853516, "global_step": 536023, "epoch": 6458} {"train_loss": -27.375232696533203, "global_step": 536024, "epoch": 6458} {"train_loss": -27.049673080444336, "global_step": 536025, "epoch": 6458} {"train_loss": -27.471221923828125, "global_step": 536026, "epoch": 6458} {"train_loss": -27.573331832885742, "global_step": 536027, "epoch": 6458} {"train_loss": -27.571685791015625, "global_step": 536028, "epoch": 6458} {"train_loss": -27.348651885986328, "global_step": 536029, "epoch": 6458} {"train_loss": -27.922107696533203, "global_step": 536030, "epoch": 6458} {"train_loss": -27.75800132751465, "global_step": 536031, "epoch": 6458} {"train_loss": -27.4561710357666, "global_step": 536032, "epoch": 6458} {"train_loss": -27.389068603515625, "global_step": 536033, "epoch": 6458} {"train_loss": -27.47068214416504, "global_step": 536034, "epoch": 6458} {"train_loss": -27.511001586914062, "global_step": 536035, "epoch": 6458} {"train_loss": -27.644672393798828, "global_step": 536036, "epoch": 6458} {"train_loss": -27.490055084228516, "global_step": 536037, "epoch": 6458} {"train_loss": -27.603952407836914, "global_step": 536038, "epoch": 6458} {"train_loss": -27.654478073120117, "global_step": 536039, "epoch": 6458} {"train_loss": -27.504674911499023, "global_step": 536040, "epoch": 6458} {"train_loss": -27.625219345092773, "global_step": 536041, "epoch": 6458} {"train_loss": -27.70526123046875, "global_step": 536042, "epoch": 6458} {"train_loss": -27.555944442749023, "global_step": 536043, "epoch": 6458} {"train_loss": -27.37664794921875, "global_step": 536044, "epoch": 6458} {"train_loss": -27.43182945251465, "global_step": 536045, "epoch": 6458} {"train_loss": -27.596332550048828, "global_step": 536046, "epoch": 6458} {"train_loss": -27.552072525024414, "global_step": 536047, "epoch": 6458} {"train_loss": -28.1400089263916, "global_step": 536048, "epoch": 6458} {"train_loss": -27.644269943237305, "global_step": 536049, "epoch": 6458} {"train_loss": -27.712583541870117, "global_step": 536050, "epoch": 6458} {"train_loss": -27.8367919921875, "global_step": 536051, "epoch": 6458} {"train_loss": -27.81446647644043, "global_step": 536052, "epoch": 6458} {"train_loss": -27.837228775024414, "global_step": 536053, "epoch": 6458} {"train_loss": -27.584278106689453, "global_step": 536054, "epoch": 6458} {"train_loss": -28.109601974487305, "global_step": 536055, "epoch": 6458} {"train_loss": -27.986083984375, "global_step": 536056, "epoch": 6458} {"train_loss": -27.917829513549805, "global_step": 536057, "epoch": 6458} {"train_loss": -27.8765926361084, "global_step": 536058, "epoch": 6458} {"train_loss": -27.50702476501465, "global_step": 536059, "epoch": 6458} {"train_loss": -28.149267196655273, "global_step": 536060, "epoch": 6458} {"train_loss": -28.10858154296875, "global_step": 536061, "epoch": 6458} {"train_loss": -27.764026641845703, "global_step": 536062, "epoch": 6458} {"train_loss": -27.8378963470459, "global_step": 536063, "epoch": 6458} {"train_loss": -27.682340621948242, "global_step": 536064, "epoch": 6458} {"train_loss": -27.5797119140625, "global_step": 536065, "epoch": 6458} {"train_loss": -27.939184188842773, "global_step": 536066, "epoch": 6458} {"train_loss": -27.642419815063477, "global_step": 536067, "epoch": 6458} {"train_loss": -27.705625534057617, "global_step": 536068, "epoch": 6458} {"train_loss": -27.77947425842285, "global_step": 536069, "epoch": 6458} {"train_loss": -27.441267013549805, "global_step": 536070, "epoch": 6458} {"train_loss": -28.020483016967773, "global_step": 536071, "epoch": 6458} {"train_loss": -27.636091232299805, "global_step": 536072, "epoch": 6458} {"train_loss": -28.014463424682617, "global_step": 536073, "epoch": 6458} {"train_loss": -28.18320655822754, "global_step": 536074, "epoch": 6458} {"train_loss": -27.630359649658203, "global_step": 536075, "epoch": 6458} {"train_loss": -27.8487606048584, "global_step": 536076, "epoch": 6458} {"train_loss": -27.405324935913086, "global_step": 536077, "epoch": 6458} {"train_loss": -27.678485870361328, "global_step": 536078, "epoch": 6458} {"train_loss": -27.897205352783203, "global_step": 536079, "epoch": 6458} {"train_loss": -27.7537899017334, "global_step": 536080, "epoch": 6458} {"train_loss": -27.807239532470703, "global_step": 536081, "epoch": 6458} {"train_loss": -27.73081398010254, "global_step": 536082, "epoch": 6458} {"train_loss": -27.77712059020996, "global_step": 536083, "epoch": 6458} {"train_loss": -27.835651397705078, "global_step": 536084, "epoch": 6458} {"train_loss": -27.92060661315918, "global_step": 536085, "epoch": 6458} {"train_loss": -28.016889572143555, "global_step": 536086, "epoch": 6458} {"train_loss": -27.781980514526367, "global_step": 536087, "epoch": 6458} {"train_loss": -27.959476470947266, "global_step": 536088, "epoch": 6458} {"train_loss": -27.868947982788086, "global_step": 536089, "epoch": 6458} {"train_loss": -27.83100700378418, "global_step": 536090, "epoch": 6458} {"train_loss": -27.73654556274414, "global_step": 536091, "epoch": 6458} {"train_loss": -27.29926109313965, "global_step": 536092, "epoch": 6458} {"train_loss": -26.843198776245117, "global_step": 536093, "epoch": 6458} {"train_loss": -27.37847900390625, "global_step": 536094, "epoch": 6458} {"train_loss": -27.374242782592773, "global_step": 536095, "epoch": 6458} {"train_loss": -27.614048670573407, "global_step": 536096, "epoch": 6458, "val_loss": 6613706.0} {"train_loss": -25.596323013305664, "global_step": 536097, "epoch": 6459} {"train_loss": -25.137981414794922, "global_step": 536098, "epoch": 6459} {"train_loss": -24.835241317749023, "global_step": 536099, "epoch": 6459} {"train_loss": -26.305896759033203, "global_step": 536100, "epoch": 6459} {"train_loss": -26.252704620361328, "global_step": 536101, "epoch": 6459} {"train_loss": -26.596189498901367, "global_step": 536102, "epoch": 6459} {"train_loss": -26.680994033813477, "global_step": 536103, "epoch": 6459} {"train_loss": -26.001611709594727, "global_step": 536104, "epoch": 6459} {"train_loss": -26.143789291381836, "global_step": 536105, "epoch": 6459} {"train_loss": -26.576990127563477, "global_step": 536106, "epoch": 6459} {"train_loss": -26.871610641479492, "global_step": 536107, "epoch": 6459} {"train_loss": -26.73536491394043, "global_step": 536108, "epoch": 6459} {"train_loss": -26.95142936706543, "global_step": 536109, "epoch": 6459} {"train_loss": -27.231048583984375, "global_step": 536110, "epoch": 6459} {"train_loss": -27.342864990234375, "global_step": 536111, "epoch": 6459} {"train_loss": -27.032922744750977, "global_step": 536112, "epoch": 6459} {"train_loss": -27.06056022644043, "global_step": 536113, "epoch": 6459} {"train_loss": -27.495275497436523, "global_step": 536114, "epoch": 6459} {"train_loss": -26.969776153564453, "global_step": 536115, "epoch": 6459} {"train_loss": -27.00128173828125, "global_step": 536116, "epoch": 6459} {"train_loss": -27.186498641967773, "global_step": 536117, "epoch": 6459} {"train_loss": -27.66847038269043, "global_step": 536118, "epoch": 6459} {"train_loss": -27.285192489624023, "global_step": 536119, "epoch": 6459} {"train_loss": -27.303211212158203, "global_step": 536120, "epoch": 6459} {"train_loss": -27.68744468688965, "global_step": 536121, "epoch": 6459} {"train_loss": -27.28390884399414, "global_step": 536122, "epoch": 6459} {"train_loss": -27.226728439331055, "global_step": 536123, "epoch": 6459} {"train_loss": -27.237329483032227, "global_step": 536124, "epoch": 6459} {"train_loss": -27.62935447692871, "global_step": 536125, "epoch": 6459} {"train_loss": -27.130136489868164, "global_step": 536126, "epoch": 6459} {"train_loss": -27.24299430847168, "global_step": 536127, "epoch": 6459} {"train_loss": -27.399038314819336, "global_step": 536128, "epoch": 6459} {"train_loss": -27.565031051635742, "global_step": 536129, "epoch": 6459} {"train_loss": -27.526288986206055, "global_step": 536130, "epoch": 6459} {"train_loss": -27.58307456970215, "global_step": 536131, "epoch": 6459} {"train_loss": -27.642602920532227, "global_step": 536132, "epoch": 6459} {"train_loss": -27.804107666015625, "global_step": 536133, "epoch": 6459} {"train_loss": -27.5128116607666, "global_step": 536134, "epoch": 6459} {"train_loss": -27.7774658203125, "global_step": 536135, "epoch": 6459} {"train_loss": -28.08013916015625, "global_step": 536136, "epoch": 6459} {"train_loss": -27.767730712890625, "global_step": 536137, "epoch": 6459} {"train_loss": -27.825916290283203, "global_step": 536138, "epoch": 6459} {"train_loss": -27.840259552001953, "global_step": 536139, "epoch": 6459} {"train_loss": -27.925445556640625, "global_step": 536140, "epoch": 6459} {"train_loss": -27.32558250427246, "global_step": 536141, "epoch": 6459} {"train_loss": -27.964588165283203, "global_step": 536142, "epoch": 6459} {"train_loss": -28.09284782409668, "global_step": 536143, "epoch": 6459} {"train_loss": -28.081195831298828, "global_step": 536144, "epoch": 6459} {"train_loss": -27.97098731994629, "global_step": 536145, "epoch": 6459} {"train_loss": -27.65226173400879, "global_step": 536146, "epoch": 6459} {"train_loss": -28.0218563079834, "global_step": 536147, "epoch": 6459} {"train_loss": -28.037561416625977, "global_step": 536148, "epoch": 6459} {"train_loss": -28.144636154174805, "global_step": 536149, "epoch": 6459} {"train_loss": -27.871658325195312, "global_step": 536150, "epoch": 6459} {"train_loss": -28.133222579956055, "global_step": 536151, "epoch": 6459} {"train_loss": -27.727203369140625, "global_step": 536152, "epoch": 6459} {"train_loss": -28.062292098999023, "global_step": 536153, "epoch": 6459} {"train_loss": -27.88982582092285, "global_step": 536154, "epoch": 6459} {"train_loss": -27.7519474029541, "global_step": 536155, "epoch": 6459} {"train_loss": -27.775558471679688, "global_step": 536156, "epoch": 6459} {"train_loss": -27.702497482299805, "global_step": 536157, "epoch": 6459} {"train_loss": -27.706649780273438, "global_step": 536158, "epoch": 6459} {"train_loss": -27.680917739868164, "global_step": 536159, "epoch": 6459} {"train_loss": -28.209716796875, "global_step": 536160, "epoch": 6459} {"train_loss": -27.753713607788086, "global_step": 536161, "epoch": 6459} {"train_loss": -27.813125610351562, "global_step": 536162, "epoch": 6459} {"train_loss": -27.621368408203125, "global_step": 536163, "epoch": 6459} {"train_loss": -27.992706298828125, "global_step": 536164, "epoch": 6459} {"train_loss": -27.663211822509766, "global_step": 536165, "epoch": 6459} {"train_loss": -27.929052352905273, "global_step": 536166, "epoch": 6459} {"train_loss": -27.18855094909668, "global_step": 536167, "epoch": 6459} {"train_loss": -27.094970703125, "global_step": 536168, "epoch": 6459} {"train_loss": -27.582014083862305, "global_step": 536169, "epoch": 6459} {"train_loss": -27.12506103515625, "global_step": 536170, "epoch": 6459} {"train_loss": -26.958831787109375, "global_step": 536171, "epoch": 6459} {"train_loss": -26.663394927978516, "global_step": 536172, "epoch": 6459} {"train_loss": -27.239383697509766, "global_step": 536173, "epoch": 6459} {"train_loss": -27.41855812072754, "global_step": 536174, "epoch": 6459} {"train_loss": -27.260150909423828, "global_step": 536175, "epoch": 6459} {"train_loss": -26.67933464050293, "global_step": 536176, "epoch": 6459} {"train_loss": -27.125051498413086, "global_step": 536177, "epoch": 6459} {"train_loss": -27.897974014282227, "global_step": 536178, "epoch": 6459} {"train_loss": -27.336691155491106, "global_step": 536179, "epoch": 6459, "val_loss": 6517429.0} {"train_loss": -25.79786491394043, "global_step": 536180, "epoch": 6460} {"train_loss": -26.204309463500977, "global_step": 536181, "epoch": 6460} {"train_loss": -26.598535537719727, "global_step": 536182, "epoch": 6460} {"train_loss": -26.297210693359375, "global_step": 536183, "epoch": 6460} {"train_loss": -26.842376708984375, "global_step": 536184, "epoch": 6460} {"train_loss": -26.446752548217773, "global_step": 536185, "epoch": 6460} {"train_loss": -26.794647216796875, "global_step": 536186, "epoch": 6460} {"train_loss": -27.12843132019043, "global_step": 536187, "epoch": 6460} {"train_loss": -27.06780433654785, "global_step": 536188, "epoch": 6460} {"train_loss": -27.015588760375977, "global_step": 536189, "epoch": 6460} {"train_loss": -26.895055770874023, "global_step": 536190, "epoch": 6460} {"train_loss": -27.26947021484375, "global_step": 536191, "epoch": 6460} {"train_loss": -27.30278968811035, "global_step": 536192, "epoch": 6460} {"train_loss": -27.152997970581055, "global_step": 536193, "epoch": 6460} {"train_loss": -27.131927490234375, "global_step": 536194, "epoch": 6460} {"train_loss": -27.093189239501953, "global_step": 536195, "epoch": 6460} {"train_loss": -27.257598876953125, "global_step": 536196, "epoch": 6460} {"train_loss": -27.487106323242188, "global_step": 536197, "epoch": 6460} {"train_loss": -27.508014678955078, "global_step": 536198, "epoch": 6460} {"train_loss": -27.567676544189453, "global_step": 536199, "epoch": 6460} {"train_loss": -27.253055572509766, "global_step": 536200, "epoch": 6460} {"train_loss": -27.843297958374023, "global_step": 536201, "epoch": 6460} {"train_loss": -27.41118812561035, "global_step": 536202, "epoch": 6460} {"train_loss": -27.53476333618164, "global_step": 536203, "epoch": 6460} {"train_loss": -27.7203369140625, "global_step": 536204, "epoch": 6460} {"train_loss": -27.27388572692871, "global_step": 536205, "epoch": 6460} {"train_loss": -27.1886043548584, "global_step": 536206, "epoch": 6460} {"train_loss": -27.559656143188477, "global_step": 536207, "epoch": 6460} {"train_loss": -27.460376739501953, "global_step": 536208, "epoch": 6460} {"train_loss": -27.562549591064453, "global_step": 536209, "epoch": 6460} {"train_loss": -27.72165298461914, "global_step": 536210, "epoch": 6460} {"train_loss": -27.719486236572266, "global_step": 536211, "epoch": 6460} {"train_loss": -27.440235137939453, "global_step": 536212, "epoch": 6460} {"train_loss": -27.734975814819336, "global_step": 536213, "epoch": 6460} {"train_loss": -27.979206085205078, "global_step": 536214, "epoch": 6460} {"train_loss": -27.91827392578125, "global_step": 536215, "epoch": 6460} {"train_loss": -27.808197021484375, "global_step": 536216, "epoch": 6460} {"train_loss": -27.878217697143555, "global_step": 536217, "epoch": 6460} {"train_loss": -27.8320369720459, "global_step": 536218, "epoch": 6460} {"train_loss": -28.0510311126709, "global_step": 536219, "epoch": 6460} {"train_loss": -27.565061569213867, "global_step": 536220, "epoch": 6460} {"train_loss": -27.583051681518555, "global_step": 536221, "epoch": 6460} {"train_loss": -27.402179718017578, "global_step": 536222, "epoch": 6460} {"train_loss": -27.7331485748291, "global_step": 536223, "epoch": 6460} {"train_loss": -28.026514053344727, "global_step": 536224, "epoch": 6460} {"train_loss": -27.718175888061523, "global_step": 536225, "epoch": 6460} {"train_loss": -27.6929874420166, "global_step": 536226, "epoch": 6460} {"train_loss": -27.7265567779541, "global_step": 536227, "epoch": 6460} {"train_loss": -27.999114990234375, "global_step": 536228, "epoch": 6460} {"train_loss": -27.949064254760742, "global_step": 536229, "epoch": 6460} {"train_loss": -27.28034019470215, "global_step": 536230, "epoch": 6460} {"train_loss": -27.740427017211914, "global_step": 536231, "epoch": 6460} {"train_loss": -28.028247833251953, "global_step": 536232, "epoch": 6460} {"train_loss": -27.808074951171875, "global_step": 536233, "epoch": 6460} {"train_loss": -27.6066951751709, "global_step": 536234, "epoch": 6460} {"train_loss": -27.504865646362305, "global_step": 536235, "epoch": 6460} {"train_loss": -27.524906158447266, "global_step": 536236, "epoch": 6460} {"train_loss": -27.75178337097168, "global_step": 536237, "epoch": 6460} {"train_loss": -27.143274307250977, "global_step": 536238, "epoch": 6460} {"train_loss": -27.496610641479492, "global_step": 536239, "epoch": 6460} {"train_loss": -27.66187858581543, "global_step": 536240, "epoch": 6460} {"train_loss": -27.874975204467773, "global_step": 536241, "epoch": 6460} {"train_loss": -27.98333168029785, "global_step": 536242, "epoch": 6460} {"train_loss": -27.839176177978516, "global_step": 536243, "epoch": 6460} {"train_loss": -27.828998565673828, "global_step": 536244, "epoch": 6460} {"train_loss": -27.865365982055664, "global_step": 536245, "epoch": 6460} {"train_loss": -27.255542755126953, "global_step": 536246, "epoch": 6460} {"train_loss": -27.481184005737305, "global_step": 536247, "epoch": 6460} {"train_loss": -27.361454010009766, "global_step": 536248, "epoch": 6460} {"train_loss": -27.740270614624023, "global_step": 536249, "epoch": 6460} {"train_loss": -27.8129940032959, "global_step": 536250, "epoch": 6460} {"train_loss": -28.033666610717773, "global_step": 536251, "epoch": 6460} {"train_loss": -27.463590621948242, "global_step": 536252, "epoch": 6460} {"train_loss": -27.34063148498535, "global_step": 536253, "epoch": 6460} {"train_loss": -27.41973304748535, "global_step": 536254, "epoch": 6460} {"train_loss": -27.709264755249023, "global_step": 536255, "epoch": 6460} {"train_loss": -27.281766891479492, "global_step": 536256, "epoch": 6460} {"train_loss": -27.732681274414062, "global_step": 536257, "epoch": 6460} {"train_loss": -27.838327407836914, "global_step": 536258, "epoch": 6460} {"train_loss": -27.488494873046875, "global_step": 536259, "epoch": 6460} {"train_loss": -27.46685218811035, "global_step": 536260, "epoch": 6460} {"train_loss": -27.67270278930664, "global_step": 536261, "epoch": 6460} {"train_loss": -27.484346205929675, "global_step": 536262, "epoch": 6460, "val_loss": 6542524.5} {"train_loss": -27.139453887939453, "global_step": 536263, "epoch": 6461} {"train_loss": -27.773435592651367, "global_step": 536264, "epoch": 6461} {"train_loss": -27.2419490814209, "global_step": 536265, "epoch": 6461} {"train_loss": -27.280109405517578, "global_step": 536266, "epoch": 6461} {"train_loss": -27.24283790588379, "global_step": 536267, "epoch": 6461} {"train_loss": -27.037403106689453, "global_step": 536268, "epoch": 6461} {"train_loss": -27.177204132080078, "global_step": 536269, "epoch": 6461} {"train_loss": -27.046655654907227, "global_step": 536270, "epoch": 6461} {"train_loss": -27.429279327392578, "global_step": 536271, "epoch": 6461} {"train_loss": -27.191099166870117, "global_step": 536272, "epoch": 6461} {"train_loss": -26.964929580688477, "global_step": 536273, "epoch": 6461} {"train_loss": -27.22977066040039, "global_step": 536274, "epoch": 6461} {"train_loss": -27.341094970703125, "global_step": 536275, "epoch": 6461} {"train_loss": -27.558109283447266, "global_step": 536276, "epoch": 6461} {"train_loss": -27.083572387695312, "global_step": 536277, "epoch": 6461} {"train_loss": -27.399127960205078, "global_step": 536278, "epoch": 6461} {"train_loss": -27.722610473632812, "global_step": 536279, "epoch": 6461} {"train_loss": -27.400415420532227, "global_step": 536280, "epoch": 6461} {"train_loss": -27.260862350463867, "global_step": 536281, "epoch": 6461} {"train_loss": -27.19635009765625, "global_step": 536282, "epoch": 6461} {"train_loss": -27.508630752563477, "global_step": 536283, "epoch": 6461} {"train_loss": -27.547494888305664, "global_step": 536284, "epoch": 6461} {"train_loss": -27.624540328979492, "global_step": 536285, "epoch": 6461} {"train_loss": -27.3165283203125, "global_step": 536286, "epoch": 6461} {"train_loss": -27.68890380859375, "global_step": 536287, "epoch": 6461} {"train_loss": -27.478748321533203, "global_step": 536288, "epoch": 6461} {"train_loss": -27.770605087280273, "global_step": 536289, "epoch": 6461} {"train_loss": -28.237451553344727, "global_step": 536290, "epoch": 6461} {"train_loss": -27.715681076049805, "global_step": 536291, "epoch": 6461} {"train_loss": -27.719877243041992, "global_step": 536292, "epoch": 6461} {"train_loss": -27.97450065612793, "global_step": 536293, "epoch": 6461} {"train_loss": -27.88254737854004, "global_step": 536294, "epoch": 6461} {"train_loss": -27.821094512939453, "global_step": 536295, "epoch": 6461} {"train_loss": -27.623016357421875, "global_step": 536296, "epoch": 6461} {"train_loss": -27.840681076049805, "global_step": 536297, "epoch": 6461} {"train_loss": -27.589096069335938, "global_step": 536298, "epoch": 6461} {"train_loss": -27.748544692993164, "global_step": 536299, "epoch": 6461} {"train_loss": -27.430404663085938, "global_step": 536300, "epoch": 6461} {"train_loss": -27.660552978515625, "global_step": 536301, "epoch": 6461} {"train_loss": -27.91522789001465, "global_step": 536302, "epoch": 6461} {"train_loss": -27.795089721679688, "global_step": 536303, "epoch": 6461} {"train_loss": -27.48982810974121, "global_step": 536304, "epoch": 6461} {"train_loss": -27.6705322265625, "global_step": 536305, "epoch": 6461} {"train_loss": -27.937957763671875, "global_step": 536306, "epoch": 6461} {"train_loss": -27.91461753845215, "global_step": 536307, "epoch": 6461} {"train_loss": -27.590246200561523, "global_step": 536308, "epoch": 6461} {"train_loss": -27.975616455078125, "global_step": 536309, "epoch": 6461} {"train_loss": -28.033124923706055, "global_step": 536310, "epoch": 6461} {"train_loss": -27.798370361328125, "global_step": 536311, "epoch": 6461} {"train_loss": -27.716175079345703, "global_step": 536312, "epoch": 6461} {"train_loss": -27.929651260375977, "global_step": 536313, "epoch": 6461} {"train_loss": -27.683679580688477, "global_step": 536314, "epoch": 6461} {"train_loss": -27.54517936706543, "global_step": 536315, "epoch": 6461} {"train_loss": -27.107507705688477, "global_step": 536316, "epoch": 6461} {"train_loss": -27.615018844604492, "global_step": 536317, "epoch": 6461} {"train_loss": -28.028074264526367, "global_step": 536318, "epoch": 6461} {"train_loss": -27.771453857421875, "global_step": 536319, "epoch": 6461} {"train_loss": -27.592756271362305, "global_step": 536320, "epoch": 6461} {"train_loss": -27.57406997680664, "global_step": 536321, "epoch": 6461} {"train_loss": -27.7421932220459, "global_step": 536322, "epoch": 6461} {"train_loss": -27.445087432861328, "global_step": 536323, "epoch": 6461} {"train_loss": -27.8121337890625, "global_step": 536324, "epoch": 6461} {"train_loss": -27.63484001159668, "global_step": 536325, "epoch": 6461} {"train_loss": -27.178924560546875, "global_step": 536326, "epoch": 6461} {"train_loss": -27.644330978393555, "global_step": 536327, "epoch": 6461} {"train_loss": -27.07929801940918, "global_step": 536328, "epoch": 6461} {"train_loss": -27.579639434814453, "global_step": 536329, "epoch": 6461} {"train_loss": -27.255285263061523, "global_step": 536330, "epoch": 6461} {"train_loss": -27.851398468017578, "global_step": 536331, "epoch": 6461} {"train_loss": -27.083911895751953, "global_step": 536332, "epoch": 6461} {"train_loss": -27.41864585876465, "global_step": 536333, "epoch": 6461} {"train_loss": -27.846853256225586, "global_step": 536334, "epoch": 6461} {"train_loss": -27.301589965820312, "global_step": 536335, "epoch": 6461} {"train_loss": -27.409093856811523, "global_step": 536336, "epoch": 6461} {"train_loss": -27.48687744140625, "global_step": 536337, "epoch": 6461} {"train_loss": -27.0789794921875, "global_step": 536338, "epoch": 6461} {"train_loss": -27.325170516967773, "global_step": 536339, "epoch": 6461} {"train_loss": -27.34956169128418, "global_step": 536340, "epoch": 6461} {"train_loss": -27.44991111755371, "global_step": 536341, "epoch": 6461} {"train_loss": -28.019018173217773, "global_step": 536342, "epoch": 6461} {"train_loss": -27.1602725982666, "global_step": 536343, "epoch": 6461} {"train_loss": -27.275049209594727, "global_step": 536344, "epoch": 6461} {"train_loss": -27.537050568913838, "global_step": 536345, "epoch": 6461, "val_loss": 6438874.0} {"train_loss": -25.210403442382812, "global_step": 536346, "epoch": 6462} {"train_loss": -26.31513786315918, "global_step": 536347, "epoch": 6462} {"train_loss": -27.42360496520996, "global_step": 536348, "epoch": 6462} {"train_loss": -26.785913467407227, "global_step": 536349, "epoch": 6462} {"train_loss": -26.3182430267334, "global_step": 536350, "epoch": 6462} {"train_loss": -26.683109283447266, "global_step": 536351, "epoch": 6462} {"train_loss": -26.81719970703125, "global_step": 536352, "epoch": 6462} {"train_loss": -26.366621017456055, "global_step": 536353, "epoch": 6462} {"train_loss": -26.2869930267334, "global_step": 536354, "epoch": 6462} {"train_loss": -26.986713409423828, "global_step": 536355, "epoch": 6462} {"train_loss": -26.433691024780273, "global_step": 536356, "epoch": 6462} {"train_loss": -27.37479019165039, "global_step": 536357, "epoch": 6462} {"train_loss": -26.725732803344727, "global_step": 536358, "epoch": 6462} {"train_loss": -27.07037925720215, "global_step": 536359, "epoch": 6462} {"train_loss": -26.876510620117188, "global_step": 536360, "epoch": 6462} {"train_loss": -26.95850944519043, "global_step": 536361, "epoch": 6462} {"train_loss": -27.12769889831543, "global_step": 536362, "epoch": 6462} {"train_loss": -27.173925399780273, "global_step": 536363, "epoch": 6462} {"train_loss": -26.899572372436523, "global_step": 536364, "epoch": 6462} {"train_loss": -27.36651611328125, "global_step": 536365, "epoch": 6462} {"train_loss": -27.353748321533203, "global_step": 536366, "epoch": 6462} {"train_loss": -27.406524658203125, "global_step": 536367, "epoch": 6462} {"train_loss": -27.189929962158203, "global_step": 536368, "epoch": 6462} {"train_loss": -27.329925537109375, "global_step": 536369, "epoch": 6462} {"train_loss": -27.3607177734375, "global_step": 536370, "epoch": 6462} {"train_loss": -27.322851181030273, "global_step": 536371, "epoch": 6462} {"train_loss": -27.63837242126465, "global_step": 536372, "epoch": 6462} {"train_loss": -27.89501953125, "global_step": 536373, "epoch": 6462} {"train_loss": -27.251911163330078, "global_step": 536374, "epoch": 6462} {"train_loss": -27.240259170532227, "global_step": 536375, "epoch": 6462} {"train_loss": -27.509069442749023, "global_step": 536376, "epoch": 6462} {"train_loss": -27.5432186126709, "global_step": 536377, "epoch": 6462} {"train_loss": -28.0068416595459, "global_step": 536378, "epoch": 6462} {"train_loss": -27.448413848876953, "global_step": 536379, "epoch": 6462} {"train_loss": -27.49116325378418, "global_step": 536380, "epoch": 6462} {"train_loss": -27.678714752197266, "global_step": 536381, "epoch": 6462} {"train_loss": -27.646554946899414, "global_step": 536382, "epoch": 6462} {"train_loss": -27.620548248291016, "global_step": 536383, "epoch": 6462} {"train_loss": -27.693761825561523, "global_step": 536384, "epoch": 6462} {"train_loss": -27.55281639099121, "global_step": 536385, "epoch": 6462} {"train_loss": -27.495758056640625, "global_step": 536386, "epoch": 6462} {"train_loss": -27.82307243347168, "global_step": 536387, "epoch": 6462} {"train_loss": -27.48565101623535, "global_step": 536388, "epoch": 6462} {"train_loss": -27.563779830932617, "global_step": 536389, "epoch": 6462} {"train_loss": -27.82541275024414, "global_step": 536390, "epoch": 6462} {"train_loss": -27.690326690673828, "global_step": 536391, "epoch": 6462} {"train_loss": -27.8289737701416, "global_step": 536392, "epoch": 6462} {"train_loss": -28.2242488861084, "global_step": 536393, "epoch": 6462} {"train_loss": -27.79233169555664, "global_step": 536394, "epoch": 6462} {"train_loss": -28.040502548217773, "global_step": 536395, "epoch": 6462} {"train_loss": -27.842605590820312, "global_step": 536396, "epoch": 6462} {"train_loss": -27.946399688720703, "global_step": 536397, "epoch": 6462} {"train_loss": -28.315488815307617, "global_step": 536398, "epoch": 6462} {"train_loss": -27.85831069946289, "global_step": 536399, "epoch": 6462} {"train_loss": -27.889448165893555, "global_step": 536400, "epoch": 6462} {"train_loss": -27.5823974609375, "global_step": 536401, "epoch": 6462} {"train_loss": -27.59050941467285, "global_step": 536402, "epoch": 6462} {"train_loss": -27.532400131225586, "global_step": 536403, "epoch": 6462} {"train_loss": -27.77099609375, "global_step": 536404, "epoch": 6462} {"train_loss": -27.717945098876953, "global_step": 536405, "epoch": 6462} {"train_loss": -27.789892196655273, "global_step": 536406, "epoch": 6462} {"train_loss": -27.818567276000977, "global_step": 536407, "epoch": 6462} {"train_loss": -28.14227294921875, "global_step": 536408, "epoch": 6462} {"train_loss": -28.07089614868164, "global_step": 536409, "epoch": 6462} {"train_loss": -28.200759887695312, "global_step": 536410, "epoch": 6462} {"train_loss": -28.120319366455078, "global_step": 536411, "epoch": 6462} {"train_loss": -28.017236709594727, "global_step": 536412, "epoch": 6462} {"train_loss": -27.224096298217773, "global_step": 536413, "epoch": 6462} {"train_loss": -27.27536964416504, "global_step": 536414, "epoch": 6462} {"train_loss": -27.52507972717285, "global_step": 536415, "epoch": 6462} {"train_loss": -27.22100830078125, "global_step": 536416, "epoch": 6462} {"train_loss": -27.1727352142334, "global_step": 536417, "epoch": 6462} {"train_loss": -27.75984001159668, "global_step": 536418, "epoch": 6462} {"train_loss": -27.535932540893555, "global_step": 536419, "epoch": 6462} {"train_loss": -26.91803550720215, "global_step": 536420, "epoch": 6462} {"train_loss": -27.455717086791992, "global_step": 536421, "epoch": 6462} {"train_loss": -27.267715454101562, "global_step": 536422, "epoch": 6462} {"train_loss": -27.392230987548828, "global_step": 536423, "epoch": 6462} {"train_loss": -27.712860107421875, "global_step": 536424, "epoch": 6462} {"train_loss": -27.553791046142578, "global_step": 536425, "epoch": 6462} {"train_loss": -27.7061710357666, "global_step": 536426, "epoch": 6462} {"train_loss": -27.677173614501953, "global_step": 536427, "epoch": 6462} {"train_loss": -27.42507169332849, "global_step": 536428, "epoch": 6462, "val_loss": 6436256.5} {"train_loss": -26.97698402404785, "global_step": 536429, "epoch": 6463} {"train_loss": -27.0378360748291, "global_step": 536430, "epoch": 6463} {"train_loss": -27.25555992126465, "global_step": 536431, "epoch": 6463} {"train_loss": -27.102258682250977, "global_step": 536432, "epoch": 6463} {"train_loss": -27.052783966064453, "global_step": 536433, "epoch": 6463} {"train_loss": -27.42209815979004, "global_step": 536434, "epoch": 6463} {"train_loss": -27.5255126953125, "global_step": 536435, "epoch": 6463} {"train_loss": -27.382856369018555, "global_step": 536436, "epoch": 6463} {"train_loss": -27.24947166442871, "global_step": 536437, "epoch": 6463} {"train_loss": -27.546064376831055, "global_step": 536438, "epoch": 6463} {"train_loss": -27.044763565063477, "global_step": 536439, "epoch": 6463} {"train_loss": -27.382160186767578, "global_step": 536440, "epoch": 6463} {"train_loss": -27.529138565063477, "global_step": 536441, "epoch": 6463} {"train_loss": -27.06890869140625, "global_step": 536442, "epoch": 6463} {"train_loss": -27.594812393188477, "global_step": 536443, "epoch": 6463} {"train_loss": -27.59602165222168, "global_step": 536444, "epoch": 6463} {"train_loss": -27.479887008666992, "global_step": 536445, "epoch": 6463} {"train_loss": -27.424203872680664, "global_step": 536446, "epoch": 6463} {"train_loss": -27.58479118347168, "global_step": 536447, "epoch": 6463} {"train_loss": -27.745441436767578, "global_step": 536448, "epoch": 6463} {"train_loss": -27.796560287475586, "global_step": 536449, "epoch": 6463} {"train_loss": -27.690658569335938, "global_step": 536450, "epoch": 6463} {"train_loss": -27.3885440826416, "global_step": 536451, "epoch": 6463} {"train_loss": -27.6846923828125, "global_step": 536452, "epoch": 6463} {"train_loss": -27.800893783569336, "global_step": 536453, "epoch": 6463} {"train_loss": -27.411041259765625, "global_step": 536454, "epoch": 6463} {"train_loss": -27.45062828063965, "global_step": 536455, "epoch": 6463} {"train_loss": -27.8159122467041, "global_step": 536456, "epoch": 6463} {"train_loss": -27.787750244140625, "global_step": 536457, "epoch": 6463} {"train_loss": -27.78605079650879, "global_step": 536458, "epoch": 6463} {"train_loss": -27.501834869384766, "global_step": 536459, "epoch": 6463} {"train_loss": -27.872772216796875, "global_step": 536460, "epoch": 6463} {"train_loss": -27.819189071655273, "global_step": 536461, "epoch": 6463} {"train_loss": -27.506311416625977, "global_step": 536462, "epoch": 6463} {"train_loss": -27.674543380737305, "global_step": 536463, "epoch": 6463} {"train_loss": -27.59235954284668, "global_step": 536464, "epoch": 6463} {"train_loss": -27.79424476623535, "global_step": 536465, "epoch": 6463} {"train_loss": -28.196725845336914, "global_step": 536466, "epoch": 6463} {"train_loss": -27.79896354675293, "global_step": 536467, "epoch": 6463} {"train_loss": -27.56646728515625, "global_step": 536468, "epoch": 6463} {"train_loss": -28.1041259765625, "global_step": 536469, "epoch": 6463} {"train_loss": -27.69906997680664, "global_step": 536470, "epoch": 6463} {"train_loss": -27.713165283203125, "global_step": 536471, "epoch": 6463} {"train_loss": -27.847620010375977, "global_step": 536472, "epoch": 6463} {"train_loss": -27.395145416259766, "global_step": 536473, "epoch": 6463} {"train_loss": -28.193531036376953, "global_step": 536474, "epoch": 6463} {"train_loss": -27.830280303955078, "global_step": 536475, "epoch": 6463} {"train_loss": -28.0993595123291, "global_step": 536476, "epoch": 6463} {"train_loss": -27.808313369750977, "global_step": 536477, "epoch": 6463} {"train_loss": -27.602075576782227, "global_step": 536478, "epoch": 6463} {"train_loss": -27.806058883666992, "global_step": 536479, "epoch": 6463} {"train_loss": -27.340442657470703, "global_step": 536480, "epoch": 6463} {"train_loss": -27.64348793029785, "global_step": 536481, "epoch": 6463} {"train_loss": -27.448749542236328, "global_step": 536482, "epoch": 6463} {"train_loss": -27.980955123901367, "global_step": 536483, "epoch": 6463} {"train_loss": -27.344934463500977, "global_step": 536484, "epoch": 6463} {"train_loss": -26.757413864135742, "global_step": 536485, "epoch": 6463} {"train_loss": -25.898223876953125, "global_step": 536486, "epoch": 6463} {"train_loss": -26.75916862487793, "global_step": 536487, "epoch": 6463} {"train_loss": -27.595285415649414, "global_step": 536488, "epoch": 6463} {"train_loss": -27.34590721130371, "global_step": 536489, "epoch": 6463} {"train_loss": -27.0472469329834, "global_step": 536490, "epoch": 6463} {"train_loss": -27.218900680541992, "global_step": 536491, "epoch": 6463} {"train_loss": -26.760257720947266, "global_step": 536492, "epoch": 6463} {"train_loss": -27.37616539001465, "global_step": 536493, "epoch": 6463} {"train_loss": -26.793378829956055, "global_step": 536494, "epoch": 6463} {"train_loss": -27.25321388244629, "global_step": 536495, "epoch": 6463} {"train_loss": -27.59205436706543, "global_step": 536496, "epoch": 6463} {"train_loss": -27.00857925415039, "global_step": 536497, "epoch": 6463} {"train_loss": -27.44597816467285, "global_step": 536498, "epoch": 6463} {"train_loss": -26.985702514648438, "global_step": 536499, "epoch": 6463} {"train_loss": -27.1389217376709, "global_step": 536500, "epoch": 6463} {"train_loss": -27.363428115844727, "global_step": 536501, "epoch": 6463} {"train_loss": -27.23296546936035, "global_step": 536502, "epoch": 6463} {"train_loss": -27.314956665039062, "global_step": 536503, "epoch": 6463} {"train_loss": -27.4990177154541, "global_step": 536504, "epoch": 6463} {"train_loss": -27.466516494750977, "global_step": 536505, "epoch": 6463} {"train_loss": -27.638696670532227, "global_step": 536506, "epoch": 6463} {"train_loss": -27.060394287109375, "global_step": 536507, "epoch": 6463} {"train_loss": -27.66639518737793, "global_step": 536508, "epoch": 6463} {"train_loss": -27.500707626342773, "global_step": 536509, "epoch": 6463} {"train_loss": -27.484811782836914, "global_step": 536510, "epoch": 6463} {"train_loss": -27.453059644584197, "global_step": 536511, "epoch": 6463, "val_loss": 6514217.0} {"train_loss": -26.75152015686035, "global_step": 536512, "epoch": 6464} {"train_loss": -26.231369018554688, "global_step": 536513, "epoch": 6464} {"train_loss": -27.4688663482666, "global_step": 536514, "epoch": 6464} {"train_loss": -26.661771774291992, "global_step": 536515, "epoch": 6464} {"train_loss": -27.2207088470459, "global_step": 536516, "epoch": 6464} {"train_loss": -27.18643569946289, "global_step": 536517, "epoch": 6464} {"train_loss": -26.755950927734375, "global_step": 536518, "epoch": 6464} {"train_loss": -27.22230339050293, "global_step": 536519, "epoch": 6464} {"train_loss": -26.961048126220703, "global_step": 536520, "epoch": 6464} {"train_loss": -27.174650192260742, "global_step": 536521, "epoch": 6464} {"train_loss": -27.371078491210938, "global_step": 536522, "epoch": 6464} {"train_loss": -27.087244033813477, "global_step": 536523, "epoch": 6464} {"train_loss": -27.641845703125, "global_step": 536524, "epoch": 6464} {"train_loss": -26.916662216186523, "global_step": 536525, "epoch": 6464} {"train_loss": -27.22150230407715, "global_step": 536526, "epoch": 6464} {"train_loss": -27.429922103881836, "global_step": 536527, "epoch": 6464} {"train_loss": -27.56452751159668, "global_step": 536528, "epoch": 6464} {"train_loss": -27.259662628173828, "global_step": 536529, "epoch": 6464} {"train_loss": -27.28548240661621, "global_step": 536530, "epoch": 6464} {"train_loss": -27.483732223510742, "global_step": 536531, "epoch": 6464} {"train_loss": -27.589841842651367, "global_step": 536532, "epoch": 6464} {"train_loss": -27.431415557861328, "global_step": 536533, "epoch": 6464} {"train_loss": -27.4456844329834, "global_step": 536534, "epoch": 6464} {"train_loss": -27.723180770874023, "global_step": 536535, "epoch": 6464} {"train_loss": -27.375696182250977, "global_step": 536536, "epoch": 6464} {"train_loss": -27.69593620300293, "global_step": 536537, "epoch": 6464} {"train_loss": -27.56540298461914, "global_step": 536538, "epoch": 6464} {"train_loss": -27.469745635986328, "global_step": 536539, "epoch": 6464} {"train_loss": -27.596759796142578, "global_step": 536540, "epoch": 6464} {"train_loss": -27.709863662719727, "global_step": 536541, "epoch": 6464} {"train_loss": -27.70961570739746, "global_step": 536542, "epoch": 6464} {"train_loss": -27.948028564453125, "global_step": 536543, "epoch": 6464} {"train_loss": -27.534595489501953, "global_step": 536544, "epoch": 6464} {"train_loss": -27.849328994750977, "global_step": 536545, "epoch": 6464} {"train_loss": -27.583938598632812, "global_step": 536546, "epoch": 6464} {"train_loss": -27.936100006103516, "global_step": 536547, "epoch": 6464} {"train_loss": -27.457111358642578, "global_step": 536548, "epoch": 6464} {"train_loss": -27.579757690429688, "global_step": 536549, "epoch": 6464} {"train_loss": -27.35133934020996, "global_step": 536550, "epoch": 6464} {"train_loss": -27.819440841674805, "global_step": 536551, "epoch": 6464} {"train_loss": -27.786468505859375, "global_step": 536552, "epoch": 6464} {"train_loss": -27.73811149597168, "global_step": 536553, "epoch": 6464} {"train_loss": -27.53546142578125, "global_step": 536554, "epoch": 6464} {"train_loss": -28.19353675842285, "global_step": 536555, "epoch": 6464} {"train_loss": -27.798114776611328, "global_step": 536556, "epoch": 6464} {"train_loss": -27.53055763244629, "global_step": 536557, "epoch": 6464} {"train_loss": -27.655649185180664, "global_step": 536558, "epoch": 6464} {"train_loss": -27.758569717407227, "global_step": 536559, "epoch": 6464} {"train_loss": -27.778898239135742, "global_step": 536560, "epoch": 6464} {"train_loss": -27.92060661315918, "global_step": 536561, "epoch": 6464} {"train_loss": -27.724023818969727, "global_step": 536562, "epoch": 6464} {"train_loss": -28.04059410095215, "global_step": 536563, "epoch": 6464} {"train_loss": -27.83251953125, "global_step": 536564, "epoch": 6464} {"train_loss": -27.606597900390625, "global_step": 536565, "epoch": 6464} {"train_loss": -27.538959503173828, "global_step": 536566, "epoch": 6464} {"train_loss": -27.84486198425293, "global_step": 536567, "epoch": 6464} {"train_loss": -27.85663414001465, "global_step": 536568, "epoch": 6464} {"train_loss": -27.946203231811523, "global_step": 536569, "epoch": 6464} {"train_loss": -27.79351234436035, "global_step": 536570, "epoch": 6464} {"train_loss": -27.8886775970459, "global_step": 536571, "epoch": 6464} {"train_loss": -27.8436336517334, "global_step": 536572, "epoch": 6464} {"train_loss": -27.570261001586914, "global_step": 536573, "epoch": 6464} {"train_loss": -27.8040828704834, "global_step": 536574, "epoch": 6464} {"train_loss": -27.486190795898438, "global_step": 536575, "epoch": 6464} {"train_loss": -27.51954460144043, "global_step": 536576, "epoch": 6464} {"train_loss": -27.178762435913086, "global_step": 536577, "epoch": 6464} {"train_loss": -26.85344886779785, "global_step": 536578, "epoch": 6464} {"train_loss": -25.937665939331055, "global_step": 536579, "epoch": 6464} {"train_loss": -25.02089500427246, "global_step": 536580, "epoch": 6464} {"train_loss": -24.535568237304688, "global_step": 536581, "epoch": 6464} {"train_loss": -25.01883316040039, "global_step": 536582, "epoch": 6464} {"train_loss": -26.826196670532227, "global_step": 536583, "epoch": 6464} {"train_loss": -26.536895751953125, "global_step": 536584, "epoch": 6464} {"train_loss": -26.622644424438477, "global_step": 536585, "epoch": 6464} {"train_loss": -26.76773452758789, "global_step": 536586, "epoch": 6464} {"train_loss": -26.987018585205078, "global_step": 536587, "epoch": 6464} {"train_loss": -26.83835220336914, "global_step": 536588, "epoch": 6464} {"train_loss": -27.124435424804688, "global_step": 536589, "epoch": 6464} {"train_loss": -26.55573081970215, "global_step": 536590, "epoch": 6464} {"train_loss": -27.233266830444336, "global_step": 536591, "epoch": 6464} {"train_loss": -27.322778701782227, "global_step": 536592, "epoch": 6464} {"train_loss": -27.04823112487793, "global_step": 536593, "epoch": 6464} {"train_loss": -27.301731776042157, "global_step": 536594, "epoch": 6464, "val_loss": 6500329.0} {"train_loss": -26.763294219970703, "global_step": 536595, "epoch": 6465} {"train_loss": -26.402456283569336, "global_step": 536596, "epoch": 6465} {"train_loss": -26.351842880249023, "global_step": 536597, "epoch": 6465} {"train_loss": -27.07044792175293, "global_step": 536598, "epoch": 6465} {"train_loss": -26.72614860534668, "global_step": 536599, "epoch": 6465} {"train_loss": -27.249897003173828, "global_step": 536600, "epoch": 6465} {"train_loss": -26.32052993774414, "global_step": 536601, "epoch": 6465} {"train_loss": -27.155548095703125, "global_step": 536602, "epoch": 6465} {"train_loss": -26.966089248657227, "global_step": 536603, "epoch": 6465} {"train_loss": -26.667694091796875, "global_step": 536604, "epoch": 6465} {"train_loss": -26.903522491455078, "global_step": 536605, "epoch": 6465} {"train_loss": -26.264698028564453, "global_step": 536606, "epoch": 6465} {"train_loss": -26.744556427001953, "global_step": 536607, "epoch": 6465} {"train_loss": -26.92669677734375, "global_step": 536608, "epoch": 6465} {"train_loss": -27.173480987548828, "global_step": 536609, "epoch": 6465} {"train_loss": -27.144880294799805, "global_step": 536610, "epoch": 6465} {"train_loss": -27.172643661499023, "global_step": 536611, "epoch": 6465} {"train_loss": -27.6776123046875, "global_step": 536612, "epoch": 6465} {"train_loss": -27.263153076171875, "global_step": 536613, "epoch": 6465} {"train_loss": -27.061527252197266, "global_step": 536614, "epoch": 6465} {"train_loss": -27.491851806640625, "global_step": 536615, "epoch": 6465} {"train_loss": -27.365009307861328, "global_step": 536616, "epoch": 6465} {"train_loss": -27.132139205932617, "global_step": 536617, "epoch": 6465} {"train_loss": -27.421655654907227, "global_step": 536618, "epoch": 6465} {"train_loss": -27.259723663330078, "global_step": 536619, "epoch": 6465} {"train_loss": -27.314258575439453, "global_step": 536620, "epoch": 6465} {"train_loss": -27.410598754882812, "global_step": 536621, "epoch": 6465} {"train_loss": -27.4126033782959, "global_step": 536622, "epoch": 6465} {"train_loss": -27.72905921936035, "global_step": 536623, "epoch": 6465} {"train_loss": -27.667856216430664, "global_step": 536624, "epoch": 6465} {"train_loss": -27.484756469726562, "global_step": 536625, "epoch": 6465} {"train_loss": -27.749258041381836, "global_step": 536626, "epoch": 6465} {"train_loss": -27.312427520751953, "global_step": 536627, "epoch": 6465} {"train_loss": -27.36216163635254, "global_step": 536628, "epoch": 6465} {"train_loss": -27.643115997314453, "global_step": 536629, "epoch": 6465} {"train_loss": -27.676929473876953, "global_step": 536630, "epoch": 6465} {"train_loss": -27.516077041625977, "global_step": 536631, "epoch": 6465} {"train_loss": -27.87066078186035, "global_step": 536632, "epoch": 6465} {"train_loss": -27.659423828125, "global_step": 536633, "epoch": 6465} {"train_loss": -27.700286865234375, "global_step": 536634, "epoch": 6465} {"train_loss": -27.8431453704834, "global_step": 536635, "epoch": 6465} {"train_loss": -27.6928768157959, "global_step": 536636, "epoch": 6465} {"train_loss": -27.722126007080078, "global_step": 536637, "epoch": 6465} {"train_loss": -27.876333236694336, "global_step": 536638, "epoch": 6465} {"train_loss": -27.818387985229492, "global_step": 536639, "epoch": 6465} {"train_loss": -27.609786987304688, "global_step": 536640, "epoch": 6465} {"train_loss": -27.338790893554688, "global_step": 536641, "epoch": 6465} {"train_loss": -27.756027221679688, "global_step": 536642, "epoch": 6465} {"train_loss": -27.756366729736328, "global_step": 536643, "epoch": 6465} {"train_loss": -28.148971557617188, "global_step": 536644, "epoch": 6465} {"train_loss": -27.861013412475586, "global_step": 536645, "epoch": 6465} {"train_loss": -27.87079429626465, "global_step": 536646, "epoch": 6465} {"train_loss": -27.72696876525879, "global_step": 536647, "epoch": 6465} {"train_loss": -27.85825538635254, "global_step": 536648, "epoch": 6465} {"train_loss": -28.15583610534668, "global_step": 536649, "epoch": 6465} {"train_loss": -27.728139877319336, "global_step": 536650, "epoch": 6465} {"train_loss": -27.710962295532227, "global_step": 536651, "epoch": 6465} {"train_loss": -27.81691551208496, "global_step": 536652, "epoch": 6465} {"train_loss": -27.45587158203125, "global_step": 536653, "epoch": 6465} {"train_loss": -27.717992782592773, "global_step": 536654, "epoch": 6465} {"train_loss": -27.7406063079834, "global_step": 536655, "epoch": 6465} {"train_loss": -27.683456420898438, "global_step": 536656, "epoch": 6465} {"train_loss": -27.7781982421875, "global_step": 536657, "epoch": 6465} {"train_loss": -27.605276107788086, "global_step": 536658, "epoch": 6465} {"train_loss": -27.688018798828125, "global_step": 536659, "epoch": 6465} {"train_loss": -28.027820587158203, "global_step": 536660, "epoch": 6465} {"train_loss": -27.189115524291992, "global_step": 536661, "epoch": 6465} {"train_loss": -27.782669067382812, "global_step": 536662, "epoch": 6465} {"train_loss": -27.924177169799805, "global_step": 536663, "epoch": 6465} {"train_loss": -27.923694610595703, "global_step": 536664, "epoch": 6465} {"train_loss": -28.073923110961914, "global_step": 536665, "epoch": 6465} {"train_loss": -27.569660186767578, "global_step": 536666, "epoch": 6465} {"train_loss": -27.772932052612305, "global_step": 536667, "epoch": 6465} {"train_loss": -27.533536911010742, "global_step": 536668, "epoch": 6465} {"train_loss": -27.468713760375977, "global_step": 536669, "epoch": 6465} {"train_loss": -27.966796875, "global_step": 536670, "epoch": 6465} {"train_loss": -27.497724533081055, "global_step": 536671, "epoch": 6465} {"train_loss": -27.611621856689453, "global_step": 536672, "epoch": 6465} {"train_loss": -28.0406436920166, "global_step": 536673, "epoch": 6465} {"train_loss": -27.712675094604492, "global_step": 536674, "epoch": 6465} {"train_loss": -27.615522384643555, "global_step": 536675, "epoch": 6465} {"train_loss": -27.584564208984375, "global_step": 536676, "epoch": 6465} {"train_loss": -27.47792453076466, "global_step": 536677, "epoch": 6465, "val_loss": 6471885.0} {"train_loss": -26.88319206237793, "global_step": 536678, "epoch": 6466} {"train_loss": -26.52545166015625, "global_step": 536679, "epoch": 6466} {"train_loss": -26.051620483398438, "global_step": 536680, "epoch": 6466} {"train_loss": -26.720422744750977, "global_step": 536681, "epoch": 6466} {"train_loss": -26.823993682861328, "global_step": 536682, "epoch": 6466} {"train_loss": -26.401824951171875, "global_step": 536683, "epoch": 6466} {"train_loss": -26.963666915893555, "global_step": 536684, "epoch": 6466} {"train_loss": -26.989416122436523, "global_step": 536685, "epoch": 6466} {"train_loss": -27.282743453979492, "global_step": 536686, "epoch": 6466} {"train_loss": -26.1412296295166, "global_step": 536687, "epoch": 6466} {"train_loss": -26.450916290283203, "global_step": 536688, "epoch": 6466} {"train_loss": -26.391977310180664, "global_step": 536689, "epoch": 6466} {"train_loss": -26.573095321655273, "global_step": 536690, "epoch": 6466} {"train_loss": -27.102365493774414, "global_step": 536691, "epoch": 6466} {"train_loss": -26.733442306518555, "global_step": 536692, "epoch": 6466} {"train_loss": -27.054615020751953, "global_step": 536693, "epoch": 6466} {"train_loss": -26.66375732421875, "global_step": 536694, "epoch": 6466} {"train_loss": -27.132434844970703, "global_step": 536695, "epoch": 6466} {"train_loss": -26.7734317779541, "global_step": 536696, "epoch": 6466} {"train_loss": -27.253019332885742, "global_step": 536697, "epoch": 6466} {"train_loss": -27.205121994018555, "global_step": 536698, "epoch": 6466} {"train_loss": -26.752161026000977, "global_step": 536699, "epoch": 6466} {"train_loss": -27.315637588500977, "global_step": 536700, "epoch": 6466} {"train_loss": -27.442358016967773, "global_step": 536701, "epoch": 6466} {"train_loss": -27.343524932861328, "global_step": 536702, "epoch": 6466} {"train_loss": -26.955347061157227, "global_step": 536703, "epoch": 6466} {"train_loss": -27.232864379882812, "global_step": 536704, "epoch": 6466} {"train_loss": -27.12896156311035, "global_step": 536705, "epoch": 6466} {"train_loss": -27.201452255249023, "global_step": 536706, "epoch": 6466} {"train_loss": -27.754438400268555, "global_step": 536707, "epoch": 6466} {"train_loss": -27.257970809936523, "global_step": 536708, "epoch": 6466} {"train_loss": -27.785568237304688, "global_step": 536709, "epoch": 6466} {"train_loss": -27.437280654907227, "global_step": 536710, "epoch": 6466} {"train_loss": -27.44314956665039, "global_step": 536711, "epoch": 6466} {"train_loss": -27.1846866607666, "global_step": 536712, "epoch": 6466} {"train_loss": -27.737585067749023, "global_step": 536713, "epoch": 6466} {"train_loss": -27.486190795898438, "global_step": 536714, "epoch": 6466} {"train_loss": -27.581073760986328, "global_step": 536715, "epoch": 6466} {"train_loss": -27.58338737487793, "global_step": 536716, "epoch": 6466} {"train_loss": -27.408477783203125, "global_step": 536717, "epoch": 6466} {"train_loss": -27.659570693969727, "global_step": 536718, "epoch": 6466} {"train_loss": -27.506458282470703, "global_step": 536719, "epoch": 6466} {"train_loss": -27.64703369140625, "global_step": 536720, "epoch": 6466} {"train_loss": -27.558828353881836, "global_step": 536721, "epoch": 6466} {"train_loss": -27.755130767822266, "global_step": 536722, "epoch": 6466} {"train_loss": -28.09614372253418, "global_step": 536723, "epoch": 6466} {"train_loss": -27.875940322875977, "global_step": 536724, "epoch": 6466} {"train_loss": -27.756946563720703, "global_step": 536725, "epoch": 6466} {"train_loss": -27.62701988220215, "global_step": 536726, "epoch": 6466} {"train_loss": -27.953800201416016, "global_step": 536727, "epoch": 6466} {"train_loss": -27.965656280517578, "global_step": 536728, "epoch": 6466} {"train_loss": -27.537572860717773, "global_step": 536729, "epoch": 6466} {"train_loss": -27.737873077392578, "global_step": 536730, "epoch": 6466} {"train_loss": -27.348785400390625, "global_step": 536731, "epoch": 6466} {"train_loss": -28.33216667175293, "global_step": 536732, "epoch": 6466} {"train_loss": -27.61639404296875, "global_step": 536733, "epoch": 6466} {"train_loss": -27.844884872436523, "global_step": 536734, "epoch": 6466} {"train_loss": -27.791141510009766, "global_step": 536735, "epoch": 6466} {"train_loss": -28.009252548217773, "global_step": 536736, "epoch": 6466} {"train_loss": -27.891855239868164, "global_step": 536737, "epoch": 6466} {"train_loss": -27.82159423828125, "global_step": 536738, "epoch": 6466} {"train_loss": -26.873748779296875, "global_step": 536739, "epoch": 6466} {"train_loss": -28.25240135192871, "global_step": 536740, "epoch": 6466} {"train_loss": -27.171798706054688, "global_step": 536741, "epoch": 6466} {"train_loss": -27.45880699157715, "global_step": 536742, "epoch": 6466} {"train_loss": -27.577375411987305, "global_step": 536743, "epoch": 6466} {"train_loss": -27.44575309753418, "global_step": 536744, "epoch": 6466} {"train_loss": -27.8662052154541, "global_step": 536745, "epoch": 6466} {"train_loss": -27.439599990844727, "global_step": 536746, "epoch": 6466} {"train_loss": -27.78545570373535, "global_step": 536747, "epoch": 6466} {"train_loss": -27.382104873657227, "global_step": 536748, "epoch": 6466} {"train_loss": -27.32916259765625, "global_step": 536749, "epoch": 6466} {"train_loss": -27.89959144592285, "global_step": 536750, "epoch": 6466} {"train_loss": -27.511266708374023, "global_step": 536751, "epoch": 6466} {"train_loss": -27.35261344909668, "global_step": 536752, "epoch": 6466} {"train_loss": -27.575841903686523, "global_step": 536753, "epoch": 6466} {"train_loss": -27.614013671875, "global_step": 536754, "epoch": 6466} {"train_loss": -27.7625789642334, "global_step": 536755, "epoch": 6466} {"train_loss": -27.60686683654785, "global_step": 536756, "epoch": 6466} {"train_loss": -27.520893096923828, "global_step": 536757, "epoch": 6466} {"train_loss": -27.66290855407715, "global_step": 536758, "epoch": 6466} {"train_loss": -27.52728271484375, "global_step": 536759, "epoch": 6466} {"train_loss": -27.37685362114964, "global_step": 536760, "epoch": 6466, "val_loss": 6469463.0} {"train_loss": -26.784765243530273, "global_step": 536761, "epoch": 6467} {"train_loss": -26.525156021118164, "global_step": 536762, "epoch": 6467} {"train_loss": -26.503808975219727, "global_step": 536763, "epoch": 6467} {"train_loss": -27.215566635131836, "global_step": 536764, "epoch": 6467} {"train_loss": -27.117191314697266, "global_step": 536765, "epoch": 6467} {"train_loss": -27.0025577545166, "global_step": 536766, "epoch": 6467} {"train_loss": -27.199386596679688, "global_step": 536767, "epoch": 6467} {"train_loss": -27.269079208374023, "global_step": 536768, "epoch": 6467} {"train_loss": -27.115890502929688, "global_step": 536769, "epoch": 6467} {"train_loss": -27.477191925048828, "global_step": 536770, "epoch": 6467} {"train_loss": -26.9473819732666, "global_step": 536771, "epoch": 6467} {"train_loss": -27.627721786499023, "global_step": 536772, "epoch": 6467} {"train_loss": -26.971221923828125, "global_step": 536773, "epoch": 6467} {"train_loss": -27.383956909179688, "global_step": 536774, "epoch": 6467} {"train_loss": -27.529890060424805, "global_step": 536775, "epoch": 6467} {"train_loss": -27.690305709838867, "global_step": 536776, "epoch": 6467} {"train_loss": -27.570499420166016, "global_step": 536777, "epoch": 6467} {"train_loss": -27.242095947265625, "global_step": 536778, "epoch": 6467} {"train_loss": -27.129779815673828, "global_step": 536779, "epoch": 6467} {"train_loss": -27.407682418823242, "global_step": 536780, "epoch": 6467} {"train_loss": -27.50971794128418, "global_step": 536781, "epoch": 6467} {"train_loss": -27.1154842376709, "global_step": 536782, "epoch": 6467} {"train_loss": -27.288135528564453, "global_step": 536783, "epoch": 6467} {"train_loss": -26.952112197875977, "global_step": 536784, "epoch": 6467} {"train_loss": -27.348377227783203, "global_step": 536785, "epoch": 6467} {"train_loss": -27.180496215820312, "global_step": 536786, "epoch": 6467} {"train_loss": -27.418073654174805, "global_step": 536787, "epoch": 6467} {"train_loss": -27.540618896484375, "global_step": 536788, "epoch": 6467} {"train_loss": -27.26753044128418, "global_step": 536789, "epoch": 6467} {"train_loss": -27.487091064453125, "global_step": 536790, "epoch": 6467} {"train_loss": -27.296905517578125, "global_step": 536791, "epoch": 6467} {"train_loss": -27.511133193969727, "global_step": 536792, "epoch": 6467} {"train_loss": -27.405200958251953, "global_step": 536793, "epoch": 6467} {"train_loss": -27.4583683013916, "global_step": 536794, "epoch": 6467} {"train_loss": -27.738683700561523, "global_step": 536795, "epoch": 6467} {"train_loss": -27.606199264526367, "global_step": 536796, "epoch": 6467} {"train_loss": -27.409902572631836, "global_step": 536797, "epoch": 6467} {"train_loss": -27.827991485595703, "global_step": 536798, "epoch": 6467} {"train_loss": -27.48556900024414, "global_step": 536799, "epoch": 6467} {"train_loss": -27.52364158630371, "global_step": 536800, "epoch": 6467} {"train_loss": -27.730993270874023, "global_step": 536801, "epoch": 6467} {"train_loss": -27.934738159179688, "global_step": 536802, "epoch": 6467} {"train_loss": -27.849939346313477, "global_step": 536803, "epoch": 6467} {"train_loss": -27.955963134765625, "global_step": 536804, "epoch": 6467} {"train_loss": -28.04437828063965, "global_step": 536805, "epoch": 6467} {"train_loss": -27.912763595581055, "global_step": 536806, "epoch": 6467} {"train_loss": -27.437238693237305, "global_step": 536807, "epoch": 6467} {"train_loss": -27.405065536499023, "global_step": 536808, "epoch": 6467} {"train_loss": -27.571212768554688, "global_step": 536809, "epoch": 6467} {"train_loss": -27.466379165649414, "global_step": 536810, "epoch": 6467} {"train_loss": -27.7637882232666, "global_step": 536811, "epoch": 6467} {"train_loss": -27.711750030517578, "global_step": 536812, "epoch": 6467} {"train_loss": -27.429901123046875, "global_step": 536813, "epoch": 6467} {"train_loss": -27.337528228759766, "global_step": 536814, "epoch": 6467} {"train_loss": -27.715620040893555, "global_step": 536815, "epoch": 6467} {"train_loss": -27.931615829467773, "global_step": 536816, "epoch": 6467} {"train_loss": -27.431848526000977, "global_step": 536817, "epoch": 6467} {"train_loss": -27.896453857421875, "global_step": 536818, "epoch": 6467} {"train_loss": -27.654809951782227, "global_step": 536819, "epoch": 6467} {"train_loss": -27.805469512939453, "global_step": 536820, "epoch": 6467} {"train_loss": -27.58139991760254, "global_step": 536821, "epoch": 6467} {"train_loss": -27.638402938842773, "global_step": 536822, "epoch": 6467} {"train_loss": -27.727584838867188, "global_step": 536823, "epoch": 6467} {"train_loss": -27.321308135986328, "global_step": 536824, "epoch": 6467} {"train_loss": -27.86503028869629, "global_step": 536825, "epoch": 6467} {"train_loss": -27.71454429626465, "global_step": 536826, "epoch": 6467} {"train_loss": -27.460927963256836, "global_step": 536827, "epoch": 6467} {"train_loss": -27.65113639831543, "global_step": 536828, "epoch": 6467} {"train_loss": -28.006006240844727, "global_step": 536829, "epoch": 6467} {"train_loss": -27.696271896362305, "global_step": 536830, "epoch": 6467} {"train_loss": -27.706518173217773, "global_step": 536831, "epoch": 6467} {"train_loss": -27.556631088256836, "global_step": 536832, "epoch": 6467} {"train_loss": -27.905685424804688, "global_step": 536833, "epoch": 6467} {"train_loss": -27.628812789916992, "global_step": 536834, "epoch": 6467} {"train_loss": -27.68202781677246, "global_step": 536835, "epoch": 6467} {"train_loss": -27.64385986328125, "global_step": 536836, "epoch": 6467} {"train_loss": -27.968189239501953, "global_step": 536837, "epoch": 6467} {"train_loss": -27.844999313354492, "global_step": 536838, "epoch": 6467} {"train_loss": -27.968097686767578, "global_step": 536839, "epoch": 6467} {"train_loss": -27.5109920501709, "global_step": 536840, "epoch": 6467} {"train_loss": -27.552968978881836, "global_step": 536841, "epoch": 6467} {"train_loss": -27.818567276000977, "global_step": 536842, "epoch": 6467} {"train_loss": -27.514661398278662, "global_step": 536843, "epoch": 6467, "val_loss": 6485052.5} {"train_loss": -27.240453720092773, "global_step": 536844, "epoch": 6468} {"train_loss": -26.9371395111084, "global_step": 536845, "epoch": 6468} {"train_loss": -27.242862701416016, "global_step": 536846, "epoch": 6468} {"train_loss": -26.950592041015625, "global_step": 536847, "epoch": 6468} {"train_loss": -27.884424209594727, "global_step": 536848, "epoch": 6468} {"train_loss": -27.113712310791016, "global_step": 536849, "epoch": 6468} {"train_loss": -27.541980743408203, "global_step": 536850, "epoch": 6468} {"train_loss": -27.752685546875, "global_step": 536851, "epoch": 6468} {"train_loss": -27.226593017578125, "global_step": 536852, "epoch": 6468} {"train_loss": -27.489904403686523, "global_step": 536853, "epoch": 6468} {"train_loss": -27.613759994506836, "global_step": 536854, "epoch": 6468} {"train_loss": -27.546142578125, "global_step": 536855, "epoch": 6468} {"train_loss": -27.278562545776367, "global_step": 536856, "epoch": 6468} {"train_loss": -27.068647384643555, "global_step": 536857, "epoch": 6468} {"train_loss": -27.271148681640625, "global_step": 536858, "epoch": 6468} {"train_loss": -27.36829948425293, "global_step": 536859, "epoch": 6468} {"train_loss": -27.876331329345703, "global_step": 536860, "epoch": 6468} {"train_loss": -27.208829879760742, "global_step": 536861, "epoch": 6468} {"train_loss": -27.364730834960938, "global_step": 536862, "epoch": 6468} {"train_loss": -27.608930587768555, "global_step": 536863, "epoch": 6468} {"train_loss": -27.465301513671875, "global_step": 536864, "epoch": 6468} {"train_loss": -27.390670776367188, "global_step": 536865, "epoch": 6468} {"train_loss": -28.047773361206055, "global_step": 536866, "epoch": 6468} {"train_loss": -27.53667640686035, "global_step": 536867, "epoch": 6468} {"train_loss": -27.509939193725586, "global_step": 536868, "epoch": 6468} {"train_loss": -27.590940475463867, "global_step": 536869, "epoch": 6468} {"train_loss": -27.72056007385254, "global_step": 536870, "epoch": 6468} {"train_loss": -27.598928451538086, "global_step": 536871, "epoch": 6468} {"train_loss": -27.397958755493164, "global_step": 536872, "epoch": 6468} {"train_loss": -27.508153915405273, "global_step": 536873, "epoch": 6468} {"train_loss": -27.904264450073242, "global_step": 536874, "epoch": 6468} {"train_loss": -27.99945640563965, "global_step": 536875, "epoch": 6468} {"train_loss": -27.879125595092773, "global_step": 536876, "epoch": 6468} {"train_loss": -27.85361099243164, "global_step": 536877, "epoch": 6468} {"train_loss": -28.01502799987793, "global_step": 536878, "epoch": 6468} {"train_loss": -27.63232421875, "global_step": 536879, "epoch": 6468} {"train_loss": -27.770538330078125, "global_step": 536880, "epoch": 6468} {"train_loss": -27.729969024658203, "global_step": 536881, "epoch": 6468} {"train_loss": -27.751657485961914, "global_step": 536882, "epoch": 6468} {"train_loss": -27.62286376953125, "global_step": 536883, "epoch": 6468} {"train_loss": -27.801801681518555, "global_step": 536884, "epoch": 6468} {"train_loss": -27.382659912109375, "global_step": 536885, "epoch": 6468} {"train_loss": -27.884435653686523, "global_step": 536886, "epoch": 6468} {"train_loss": -28.06658363342285, "global_step": 536887, "epoch": 6468} {"train_loss": -27.63347816467285, "global_step": 536888, "epoch": 6468} {"train_loss": -27.498517990112305, "global_step": 536889, "epoch": 6468} {"train_loss": -27.3514461517334, "global_step": 536890, "epoch": 6468} {"train_loss": -27.22150230407715, "global_step": 536891, "epoch": 6468} {"train_loss": -27.40803337097168, "global_step": 536892, "epoch": 6468} {"train_loss": -27.317914962768555, "global_step": 536893, "epoch": 6468} {"train_loss": -27.339811325073242, "global_step": 536894, "epoch": 6468} {"train_loss": -27.54221534729004, "global_step": 536895, "epoch": 6468} {"train_loss": -27.589853286743164, "global_step": 536896, "epoch": 6468} {"train_loss": -27.23714256286621, "global_step": 536897, "epoch": 6468} {"train_loss": -28.048513412475586, "global_step": 536898, "epoch": 6468} {"train_loss": -27.737411499023438, "global_step": 536899, "epoch": 6468} {"train_loss": -27.485492706298828, "global_step": 536900, "epoch": 6468} {"train_loss": -27.53924560546875, "global_step": 536901, "epoch": 6468} {"train_loss": -27.720056533813477, "global_step": 536902, "epoch": 6468} {"train_loss": -27.73585319519043, "global_step": 536903, "epoch": 6468} {"train_loss": -27.268091201782227, "global_step": 536904, "epoch": 6468} {"train_loss": -27.81882667541504, "global_step": 536905, "epoch": 6468} {"train_loss": -27.444604873657227, "global_step": 536906, "epoch": 6468} {"train_loss": -27.655792236328125, "global_step": 536907, "epoch": 6468} {"train_loss": -27.511991500854492, "global_step": 536908, "epoch": 6468} {"train_loss": -27.494937896728516, "global_step": 536909, "epoch": 6468} {"train_loss": -28.00689125061035, "global_step": 536910, "epoch": 6468} {"train_loss": -27.639928817749023, "global_step": 536911, "epoch": 6468} {"train_loss": -27.843799591064453, "global_step": 536912, "epoch": 6468} {"train_loss": -27.951629638671875, "global_step": 536913, "epoch": 6468} {"train_loss": -27.88701820373535, "global_step": 536914, "epoch": 6468} {"train_loss": -27.601957321166992, "global_step": 536915, "epoch": 6468} {"train_loss": -28.012075424194336, "global_step": 536916, "epoch": 6468} {"train_loss": -27.751983642578125, "global_step": 536917, "epoch": 6468} {"train_loss": -27.746259689331055, "global_step": 536918, "epoch": 6468} {"train_loss": -27.881567001342773, "global_step": 536919, "epoch": 6468} {"train_loss": -27.690093994140625, "global_step": 536920, "epoch": 6468} {"train_loss": -27.653045654296875, "global_step": 536921, "epoch": 6468} {"train_loss": -27.883569717407227, "global_step": 536922, "epoch": 6468} {"train_loss": -27.912857055664062, "global_step": 536923, "epoch": 6468} {"train_loss": -27.72002601623535, "global_step": 536924, "epoch": 6468} {"train_loss": -27.983915328979492, "global_step": 536925, "epoch": 6468} {"train_loss": -27.59733742403697, "global_step": 536926, "epoch": 6468, "val_loss": 6445096.0} {"train_loss": -27.428024291992188, "global_step": 536927, "epoch": 6469} {"train_loss": -27.221487045288086, "global_step": 536928, "epoch": 6469} {"train_loss": -27.546716690063477, "global_step": 536929, "epoch": 6469} {"train_loss": -27.07623291015625, "global_step": 536930, "epoch": 6469} {"train_loss": -27.510623931884766, "global_step": 536931, "epoch": 6469} {"train_loss": -27.704254150390625, "global_step": 536932, "epoch": 6469} {"train_loss": -26.787189483642578, "global_step": 536933, "epoch": 6469} {"train_loss": -26.425413131713867, "global_step": 536934, "epoch": 6469} {"train_loss": -27.17005729675293, "global_step": 536935, "epoch": 6469} {"train_loss": -27.39923095703125, "global_step": 536936, "epoch": 6469} {"train_loss": -27.621191024780273, "global_step": 536937, "epoch": 6469} {"train_loss": -27.059045791625977, "global_step": 536938, "epoch": 6469} {"train_loss": -27.111249923706055, "global_step": 536939, "epoch": 6469} {"train_loss": -27.33925437927246, "global_step": 536940, "epoch": 6469} {"train_loss": -27.43409538269043, "global_step": 536941, "epoch": 6469} {"train_loss": -27.485671997070312, "global_step": 536942, "epoch": 6469} {"train_loss": -27.700754165649414, "global_step": 536943, "epoch": 6469} {"train_loss": -27.563690185546875, "global_step": 536944, "epoch": 6469} {"train_loss": -27.463720321655273, "global_step": 536945, "epoch": 6469} {"train_loss": -27.666593551635742, "global_step": 536946, "epoch": 6469} {"train_loss": -27.49090576171875, "global_step": 536947, "epoch": 6469} {"train_loss": -27.74541664123535, "global_step": 536948, "epoch": 6469} {"train_loss": -27.51663589477539, "global_step": 536949, "epoch": 6469} {"train_loss": -27.591938018798828, "global_step": 536950, "epoch": 6469} {"train_loss": -27.821191787719727, "global_step": 536951, "epoch": 6469} {"train_loss": -27.441181182861328, "global_step": 536952, "epoch": 6469} {"train_loss": -27.429920196533203, "global_step": 536953, "epoch": 6469} {"train_loss": -27.831756591796875, "global_step": 536954, "epoch": 6469} {"train_loss": -28.113977432250977, "global_step": 536955, "epoch": 6469} {"train_loss": -27.573394775390625, "global_step": 536956, "epoch": 6469} {"train_loss": -27.574609756469727, "global_step": 536957, "epoch": 6469} {"train_loss": -27.709089279174805, "global_step": 536958, "epoch": 6469} {"train_loss": -27.84999656677246, "global_step": 536959, "epoch": 6469} {"train_loss": -27.551807403564453, "global_step": 536960, "epoch": 6469} {"train_loss": -27.914472579956055, "global_step": 536961, "epoch": 6469} {"train_loss": -27.913095474243164, "global_step": 536962, "epoch": 6469} {"train_loss": -27.57236671447754, "global_step": 536963, "epoch": 6469} {"train_loss": -27.65384292602539, "global_step": 536964, "epoch": 6469} {"train_loss": -27.7806396484375, "global_step": 536965, "epoch": 6469} {"train_loss": -27.822101593017578, "global_step": 536966, "epoch": 6469} {"train_loss": -27.614013671875, "global_step": 536967, "epoch": 6469} {"train_loss": -27.673391342163086, "global_step": 536968, "epoch": 6469} {"train_loss": -27.95771598815918, "global_step": 536969, "epoch": 6469} {"train_loss": -27.7033748626709, "global_step": 536970, "epoch": 6469} {"train_loss": -27.870588302612305, "global_step": 536971, "epoch": 6469} {"train_loss": -27.646764755249023, "global_step": 536972, "epoch": 6469} {"train_loss": -28.004953384399414, "global_step": 536973, "epoch": 6469} {"train_loss": -27.837249755859375, "global_step": 536974, "epoch": 6469} {"train_loss": -27.97580909729004, "global_step": 536975, "epoch": 6469} {"train_loss": -27.978525161743164, "global_step": 536976, "epoch": 6469} {"train_loss": -27.88629722595215, "global_step": 536977, "epoch": 6469} {"train_loss": -27.877490997314453, "global_step": 536978, "epoch": 6469} {"train_loss": -27.831256866455078, "global_step": 536979, "epoch": 6469} {"train_loss": -27.928991317749023, "global_step": 536980, "epoch": 6469} {"train_loss": -27.876752853393555, "global_step": 536981, "epoch": 6469} {"train_loss": -28.0135498046875, "global_step": 536982, "epoch": 6469} {"train_loss": -27.839599609375, "global_step": 536983, "epoch": 6469} {"train_loss": -27.778533935546875, "global_step": 536984, "epoch": 6469} {"train_loss": -27.871000289916992, "global_step": 536985, "epoch": 6469} {"train_loss": -27.929901123046875, "global_step": 536986, "epoch": 6469} {"train_loss": -27.426828384399414, "global_step": 536987, "epoch": 6469} {"train_loss": -27.863800048828125, "global_step": 536988, "epoch": 6469} {"train_loss": -27.18897819519043, "global_step": 536989, "epoch": 6469} {"train_loss": -27.247406005859375, "global_step": 536990, "epoch": 6469} {"train_loss": -26.92886734008789, "global_step": 536991, "epoch": 6469} {"train_loss": -27.091379165649414, "global_step": 536992, "epoch": 6469} {"train_loss": -27.164960861206055, "global_step": 536993, "epoch": 6469} {"train_loss": -26.959692001342773, "global_step": 536994, "epoch": 6469} {"train_loss": -26.582239151000977, "global_step": 536995, "epoch": 6469} {"train_loss": -27.277088165283203, "global_step": 536996, "epoch": 6469} {"train_loss": -27.4805850982666, "global_step": 536997, "epoch": 6469} {"train_loss": -26.896636962890625, "global_step": 536998, "epoch": 6469} {"train_loss": -26.47896385192871, "global_step": 536999, "epoch": 6469} {"train_loss": -27.430700302124023, "global_step": 537000, "epoch": 6469} {"train_loss": -27.329492568969727, "global_step": 537001, "epoch": 6469} {"train_loss": -27.240869522094727, "global_step": 537002, "epoch": 6469} {"train_loss": -27.41875648498535, "global_step": 537003, "epoch": 6469} {"train_loss": -27.484851837158203, "global_step": 537004, "epoch": 6469} {"train_loss": -27.3548526763916, "global_step": 537005, "epoch": 6469} {"train_loss": -27.230321884155273, "global_step": 537006, "epoch": 6469} {"train_loss": -27.492727279663086, "global_step": 537007, "epoch": 6469} {"train_loss": -27.356298446655273, "global_step": 537008, "epoch": 6469} {"train_loss": -27.512246442128376, "global_step": 537009, "epoch": 6469, "val_loss": 6435329.5} {"train_loss": -27.568347930908203, "global_step": 537010, "epoch": 6470} {"train_loss": -27.325326919555664, "global_step": 537011, "epoch": 6470} {"train_loss": -27.31964683532715, "global_step": 537012, "epoch": 6470} {"train_loss": -27.389450073242188, "global_step": 537013, "epoch": 6470} {"train_loss": -27.19122886657715, "global_step": 537014, "epoch": 6470} {"train_loss": -27.461435317993164, "global_step": 537015, "epoch": 6470} {"train_loss": -27.596542358398438, "global_step": 537016, "epoch": 6470} {"train_loss": -27.126371383666992, "global_step": 537017, "epoch": 6470} {"train_loss": -27.762243270874023, "global_step": 537018, "epoch": 6470} {"train_loss": -27.46644401550293, "global_step": 537019, "epoch": 6470} {"train_loss": -27.643146514892578, "global_step": 537020, "epoch": 6470} {"train_loss": -27.35056495666504, "global_step": 537021, "epoch": 6470} {"train_loss": -27.460376739501953, "global_step": 537022, "epoch": 6470} {"train_loss": -27.3048038482666, "global_step": 537023, "epoch": 6470} {"train_loss": -27.58461570739746, "global_step": 537024, "epoch": 6470} {"train_loss": -27.259552001953125, "global_step": 537025, "epoch": 6470} {"train_loss": -27.36154556274414, "global_step": 537026, "epoch": 6470} {"train_loss": -27.467493057250977, "global_step": 537027, "epoch": 6470} {"train_loss": -27.288923263549805, "global_step": 537028, "epoch": 6470} {"train_loss": -27.982397079467773, "global_step": 537029, "epoch": 6470} {"train_loss": -27.392602920532227, "global_step": 537030, "epoch": 6470} {"train_loss": -27.54969596862793, "global_step": 537031, "epoch": 6470} {"train_loss": -27.611190795898438, "global_step": 537032, "epoch": 6470} {"train_loss": -27.761220932006836, "global_step": 537033, "epoch": 6470} {"train_loss": -27.73798179626465, "global_step": 537034, "epoch": 6470} {"train_loss": -27.885900497436523, "global_step": 537035, "epoch": 6470} {"train_loss": -27.903318405151367, "global_step": 537036, "epoch": 6470} {"train_loss": -28.086957931518555, "global_step": 537037, "epoch": 6470} {"train_loss": -27.732969284057617, "global_step": 537038, "epoch": 6470} {"train_loss": -27.533660888671875, "global_step": 537039, "epoch": 6470} {"train_loss": -28.192718505859375, "global_step": 537040, "epoch": 6470} {"train_loss": -28.00262451171875, "global_step": 537041, "epoch": 6470} {"train_loss": -27.776004791259766, "global_step": 537042, "epoch": 6470} {"train_loss": -27.921100616455078, "global_step": 537043, "epoch": 6470} {"train_loss": -27.643735885620117, "global_step": 537044, "epoch": 6470} {"train_loss": -27.522235870361328, "global_step": 537045, "epoch": 6470} {"train_loss": -27.429025650024414, "global_step": 537046, "epoch": 6470} {"train_loss": -27.399137496948242, "global_step": 537047, "epoch": 6470} {"train_loss": -27.88870620727539, "global_step": 537048, "epoch": 6470} {"train_loss": -28.064258575439453, "global_step": 537049, "epoch": 6470} {"train_loss": -27.664220809936523, "global_step": 537050, "epoch": 6470} {"train_loss": -27.399961471557617, "global_step": 537051, "epoch": 6470} {"train_loss": -28.239501953125, "global_step": 537052, "epoch": 6470} {"train_loss": -27.532428741455078, "global_step": 537053, "epoch": 6470} {"train_loss": -27.86000633239746, "global_step": 537054, "epoch": 6470} {"train_loss": -27.493789672851562, "global_step": 537055, "epoch": 6470} {"train_loss": -27.763463973999023, "global_step": 537056, "epoch": 6470} {"train_loss": -27.73211097717285, "global_step": 537057, "epoch": 6470} {"train_loss": -27.49749755859375, "global_step": 537058, "epoch": 6470} {"train_loss": -27.772613525390625, "global_step": 537059, "epoch": 6470} {"train_loss": -27.496850967407227, "global_step": 537060, "epoch": 6470} {"train_loss": -27.90534782409668, "global_step": 537061, "epoch": 6470} {"train_loss": -27.678058624267578, "global_step": 537062, "epoch": 6470} {"train_loss": -27.466352462768555, "global_step": 537063, "epoch": 6470} {"train_loss": -27.785114288330078, "global_step": 537064, "epoch": 6470} {"train_loss": -27.645193099975586, "global_step": 537065, "epoch": 6470} {"train_loss": -27.047637939453125, "global_step": 537066, "epoch": 6470} {"train_loss": -27.755041122436523, "global_step": 537067, "epoch": 6470} {"train_loss": -27.983352661132812, "global_step": 537068, "epoch": 6470} {"train_loss": -27.496475219726562, "global_step": 537069, "epoch": 6470} {"train_loss": -27.591064453125, "global_step": 537070, "epoch": 6470} {"train_loss": -27.389083862304688, "global_step": 537071, "epoch": 6470} {"train_loss": -27.068273544311523, "global_step": 537072, "epoch": 6470} {"train_loss": -27.51798439025879, "global_step": 537073, "epoch": 6470} {"train_loss": -27.648115158081055, "global_step": 537074, "epoch": 6470} {"train_loss": -27.87347984313965, "global_step": 537075, "epoch": 6470} {"train_loss": -27.76837158203125, "global_step": 537076, "epoch": 6470} {"train_loss": -28.243762969970703, "global_step": 537077, "epoch": 6470} {"train_loss": -27.956012725830078, "global_step": 537078, "epoch": 6470} {"train_loss": -27.125141143798828, "global_step": 537079, "epoch": 6470} {"train_loss": -27.756906509399414, "global_step": 537080, "epoch": 6470} {"train_loss": -28.153894424438477, "global_step": 537081, "epoch": 6470} {"train_loss": -27.741804122924805, "global_step": 537082, "epoch": 6470} {"train_loss": -27.718042373657227, "global_step": 537083, "epoch": 6470} {"train_loss": -27.8154239654541, "global_step": 537084, "epoch": 6470} {"train_loss": -27.83698844909668, "global_step": 537085, "epoch": 6470} {"train_loss": -28.0118465423584, "global_step": 537086, "epoch": 6470} {"train_loss": -27.680866241455078, "global_step": 537087, "epoch": 6470} {"train_loss": -27.669675827026367, "global_step": 537088, "epoch": 6470} {"train_loss": -28.031030654907227, "global_step": 537089, "epoch": 6470} {"train_loss": -26.85611343383789, "global_step": 537090, "epoch": 6470} {"train_loss": -27.531280517578125, "global_step": 537091, "epoch": 6470} {"train_loss": -27.65078553808741, "global_step": 537092, "epoch": 6470, "val_loss": 6525905.0} {"train_loss": -25.182151794433594, "global_step": 537093, "epoch": 6471} {"train_loss": -23.391557693481445, "global_step": 537094, "epoch": 6471} {"train_loss": -26.374008178710938, "global_step": 537095, "epoch": 6471} {"train_loss": -25.958541870117188, "global_step": 537096, "epoch": 6471} {"train_loss": -26.080780029296875, "global_step": 537097, "epoch": 6471} {"train_loss": -26.0574951171875, "global_step": 537098, "epoch": 6471} {"train_loss": -26.0241756439209, "global_step": 537099, "epoch": 6471} {"train_loss": -26.46759033203125, "global_step": 537100, "epoch": 6471} {"train_loss": -26.45142936706543, "global_step": 537101, "epoch": 6471} {"train_loss": -26.614179611206055, "global_step": 537102, "epoch": 6471} {"train_loss": -26.37896156311035, "global_step": 537103, "epoch": 6471} {"train_loss": -26.986526489257812, "global_step": 537104, "epoch": 6471} {"train_loss": -26.637216567993164, "global_step": 537105, "epoch": 6471} {"train_loss": -26.87415885925293, "global_step": 537106, "epoch": 6471} {"train_loss": -26.857526779174805, "global_step": 537107, "epoch": 6471} {"train_loss": -26.90866470336914, "global_step": 537108, "epoch": 6471} {"train_loss": -26.942890167236328, "global_step": 537109, "epoch": 6471} {"train_loss": -26.83905601501465, "global_step": 537110, "epoch": 6471} {"train_loss": -27.108158111572266, "global_step": 537111, "epoch": 6471} {"train_loss": -26.867151260375977, "global_step": 537112, "epoch": 6471} {"train_loss": -27.038558959960938, "global_step": 537113, "epoch": 6471} {"train_loss": -27.158960342407227, "global_step": 537114, "epoch": 6471} {"train_loss": -27.111465454101562, "global_step": 537115, "epoch": 6471} {"train_loss": -27.666852951049805, "global_step": 537116, "epoch": 6471} {"train_loss": -27.226455688476562, "global_step": 537117, "epoch": 6471} {"train_loss": -27.2307186126709, "global_step": 537118, "epoch": 6471} {"train_loss": -27.1248836517334, "global_step": 537119, "epoch": 6471} {"train_loss": -27.627050399780273, "global_step": 537120, "epoch": 6471} {"train_loss": -27.155561447143555, "global_step": 537121, "epoch": 6471} {"train_loss": -27.22437858581543, "global_step": 537122, "epoch": 6471} {"train_loss": -27.5333309173584, "global_step": 537123, "epoch": 6471} {"train_loss": -27.595081329345703, "global_step": 537124, "epoch": 6471} {"train_loss": -27.2329158782959, "global_step": 537125, "epoch": 6471} {"train_loss": -27.136062622070312, "global_step": 537126, "epoch": 6471} {"train_loss": -27.2824649810791, "global_step": 537127, "epoch": 6471} {"train_loss": -27.7536563873291, "global_step": 537128, "epoch": 6471} {"train_loss": -27.180957794189453, "global_step": 537129, "epoch": 6471} {"train_loss": -27.279800415039062, "global_step": 537130, "epoch": 6471} {"train_loss": -27.598514556884766, "global_step": 537131, "epoch": 6471} {"train_loss": -27.391284942626953, "global_step": 537132, "epoch": 6471} {"train_loss": -27.66531753540039, "global_step": 537133, "epoch": 6471} {"train_loss": -27.435583114624023, "global_step": 537134, "epoch": 6471} {"train_loss": -27.3660888671875, "global_step": 537135, "epoch": 6471} {"train_loss": -27.6815185546875, "global_step": 537136, "epoch": 6471} {"train_loss": -27.51141929626465, "global_step": 537137, "epoch": 6471} {"train_loss": -28.161258697509766, "global_step": 537138, "epoch": 6471} {"train_loss": -27.37948989868164, "global_step": 537139, "epoch": 6471} {"train_loss": -27.701276779174805, "global_step": 537140, "epoch": 6471} {"train_loss": -27.601383209228516, "global_step": 537141, "epoch": 6471} {"train_loss": -28.047513961791992, "global_step": 537142, "epoch": 6471} {"train_loss": -27.741260528564453, "global_step": 537143, "epoch": 6471} {"train_loss": -27.651803970336914, "global_step": 537144, "epoch": 6471} {"train_loss": -27.825042724609375, "global_step": 537145, "epoch": 6471} {"train_loss": -27.69586181640625, "global_step": 537146, "epoch": 6471} {"train_loss": -27.611066818237305, "global_step": 537147, "epoch": 6471} {"train_loss": -27.672016143798828, "global_step": 537148, "epoch": 6471} {"train_loss": -27.758441925048828, "global_step": 537149, "epoch": 6471} {"train_loss": -27.530227661132812, "global_step": 537150, "epoch": 6471} {"train_loss": -27.899328231811523, "global_step": 537151, "epoch": 6471} {"train_loss": -28.04729652404785, "global_step": 537152, "epoch": 6471} {"train_loss": -27.963743209838867, "global_step": 537153, "epoch": 6471} {"train_loss": -28.10792350769043, "global_step": 537154, "epoch": 6471} {"train_loss": -28.074634552001953, "global_step": 537155, "epoch": 6471} {"train_loss": -27.913898468017578, "global_step": 537156, "epoch": 6471} {"train_loss": -27.90485191345215, "global_step": 537157, "epoch": 6471} {"train_loss": -27.92634391784668, "global_step": 537158, "epoch": 6471} {"train_loss": -27.96430015563965, "global_step": 537159, "epoch": 6471} {"train_loss": -28.43472671508789, "global_step": 537160, "epoch": 6471} {"train_loss": -27.501386642456055, "global_step": 537161, "epoch": 6471} {"train_loss": -27.692489624023438, "global_step": 537162, "epoch": 6471} {"train_loss": -27.28285026550293, "global_step": 537163, "epoch": 6471} {"train_loss": -28.013233184814453, "global_step": 537164, "epoch": 6471} {"train_loss": -27.817413330078125, "global_step": 537165, "epoch": 6471} {"train_loss": -27.26422691345215, "global_step": 537166, "epoch": 6471} {"train_loss": -26.711191177368164, "global_step": 537167, "epoch": 6471} {"train_loss": -26.678312301635742, "global_step": 537168, "epoch": 6471} {"train_loss": -27.63153076171875, "global_step": 537169, "epoch": 6471} {"train_loss": -27.23213005065918, "global_step": 537170, "epoch": 6471} {"train_loss": -27.656396865844727, "global_step": 537171, "epoch": 6471} {"train_loss": -27.486312866210938, "global_step": 537172, "epoch": 6471} {"train_loss": -27.279504776000977, "global_step": 537173, "epoch": 6471} {"train_loss": -27.78132438659668, "global_step": 537174, "epoch": 6471} {"train_loss": -27.254916501332477, "global_step": 537175, "epoch": 6471, "val_loss": 6472854.0} {"train_loss": -26.295379638671875, "global_step": 537176, "epoch": 6472} {"train_loss": -26.670337677001953, "global_step": 537177, "epoch": 6472} {"train_loss": -26.539031982421875, "global_step": 537178, "epoch": 6472} {"train_loss": -27.078336715698242, "global_step": 537179, "epoch": 6472} {"train_loss": -26.4014949798584, "global_step": 537180, "epoch": 6472} {"train_loss": -26.64161491394043, "global_step": 537181, "epoch": 6472} {"train_loss": -26.914295196533203, "global_step": 537182, "epoch": 6472} {"train_loss": -26.952808380126953, "global_step": 537183, "epoch": 6472} {"train_loss": -26.858020782470703, "global_step": 537184, "epoch": 6472} {"train_loss": -26.83462905883789, "global_step": 537185, "epoch": 6472} {"train_loss": -26.49952507019043, "global_step": 537186, "epoch": 6472} {"train_loss": -26.844196319580078, "global_step": 537187, "epoch": 6472} {"train_loss": -26.845569610595703, "global_step": 537188, "epoch": 6472} {"train_loss": -26.531049728393555, "global_step": 537189, "epoch": 6472} {"train_loss": -27.063617706298828, "global_step": 537190, "epoch": 6472} {"train_loss": -27.29425621032715, "global_step": 537191, "epoch": 6472} {"train_loss": -27.337970733642578, "global_step": 537192, "epoch": 6472} {"train_loss": -27.2481632232666, "global_step": 537193, "epoch": 6472} {"train_loss": -27.33672523498535, "global_step": 537194, "epoch": 6472} {"train_loss": -26.92616081237793, "global_step": 537195, "epoch": 6472} {"train_loss": -27.17621421813965, "global_step": 537196, "epoch": 6472} {"train_loss": -27.634078979492188, "global_step": 537197, "epoch": 6472} {"train_loss": -27.435199737548828, "global_step": 537198, "epoch": 6472} {"train_loss": -27.241134643554688, "global_step": 537199, "epoch": 6472} {"train_loss": -27.50180435180664, "global_step": 537200, "epoch": 6472} {"train_loss": -27.582656860351562, "global_step": 537201, "epoch": 6472} {"train_loss": -27.476184844970703, "global_step": 537202, "epoch": 6472} {"train_loss": -27.468982696533203, "global_step": 537203, "epoch": 6472} {"train_loss": -27.19704246520996, "global_step": 537204, "epoch": 6472} {"train_loss": -27.52762794494629, "global_step": 537205, "epoch": 6472} {"train_loss": -27.900304794311523, "global_step": 537206, "epoch": 6472} {"train_loss": -27.61905860900879, "global_step": 537207, "epoch": 6472} {"train_loss": -27.679141998291016, "global_step": 537208, "epoch": 6472} {"train_loss": -27.767480850219727, "global_step": 537209, "epoch": 6472} {"train_loss": -27.620895385742188, "global_step": 537210, "epoch": 6472} {"train_loss": -27.99212074279785, "global_step": 537211, "epoch": 6472} {"train_loss": -28.056854248046875, "global_step": 537212, "epoch": 6472} {"train_loss": -27.85479164123535, "global_step": 537213, "epoch": 6472} {"train_loss": -27.952655792236328, "global_step": 537214, "epoch": 6472} {"train_loss": -28.008508682250977, "global_step": 537215, "epoch": 6472} {"train_loss": -27.884679794311523, "global_step": 537216, "epoch": 6472} {"train_loss": -27.824024200439453, "global_step": 537217, "epoch": 6472} {"train_loss": -27.51454734802246, "global_step": 537218, "epoch": 6472} {"train_loss": -27.978824615478516, "global_step": 537219, "epoch": 6472} {"train_loss": -27.776214599609375, "global_step": 537220, "epoch": 6472} {"train_loss": -27.69403648376465, "global_step": 537221, "epoch": 6472} {"train_loss": -27.439727783203125, "global_step": 537222, "epoch": 6472} {"train_loss": -27.2278995513916, "global_step": 537223, "epoch": 6472} {"train_loss": -27.6608943939209, "global_step": 537224, "epoch": 6472} {"train_loss": -27.373498916625977, "global_step": 537225, "epoch": 6472} {"train_loss": -27.695178985595703, "global_step": 537226, "epoch": 6472} {"train_loss": -28.15797996520996, "global_step": 537227, "epoch": 6472} {"train_loss": -27.8889102935791, "global_step": 537228, "epoch": 6472} {"train_loss": -27.40952491760254, "global_step": 537229, "epoch": 6472} {"train_loss": -27.997610092163086, "global_step": 537230, "epoch": 6472} {"train_loss": -27.700214385986328, "global_step": 537231, "epoch": 6472} {"train_loss": -27.879743576049805, "global_step": 537232, "epoch": 6472} {"train_loss": -27.8238468170166, "global_step": 537233, "epoch": 6472} {"train_loss": -27.831714630126953, "global_step": 537234, "epoch": 6472} {"train_loss": -27.656713485717773, "global_step": 537235, "epoch": 6472} {"train_loss": -27.3609561920166, "global_step": 537236, "epoch": 6472} {"train_loss": -27.4996280670166, "global_step": 537237, "epoch": 6472} {"train_loss": -27.594404220581055, "global_step": 537238, "epoch": 6472} {"train_loss": -27.99603271484375, "global_step": 537239, "epoch": 6472} {"train_loss": -27.55405616760254, "global_step": 537240, "epoch": 6472} {"train_loss": -27.906330108642578, "global_step": 537241, "epoch": 6472} {"train_loss": -27.68577003479004, "global_step": 537242, "epoch": 6472} {"train_loss": -28.195188522338867, "global_step": 537243, "epoch": 6472} {"train_loss": -27.917932510375977, "global_step": 537244, "epoch": 6472} {"train_loss": -28.02484130859375, "global_step": 537245, "epoch": 6472} {"train_loss": -27.721786499023438, "global_step": 537246, "epoch": 6472} {"train_loss": -27.729482650756836, "global_step": 537247, "epoch": 6472} {"train_loss": -27.646169662475586, "global_step": 537248, "epoch": 6472} {"train_loss": -27.686420440673828, "global_step": 537249, "epoch": 6472} {"train_loss": -27.669803619384766, "global_step": 537250, "epoch": 6472} {"train_loss": -27.369543075561523, "global_step": 537251, "epoch": 6472} {"train_loss": -28.027585983276367, "global_step": 537252, "epoch": 6472} {"train_loss": -27.916568756103516, "global_step": 537253, "epoch": 6472} {"train_loss": -27.77898597717285, "global_step": 537254, "epoch": 6472} {"train_loss": -27.898771286010742, "global_step": 537255, "epoch": 6472} {"train_loss": -27.40154457092285, "global_step": 537256, "epoch": 6472} {"train_loss": -27.76991081237793, "global_step": 537257, "epoch": 6472} {"train_loss": -27.498111127370812, "global_step": 537258, "epoch": 6472, "val_loss": 6484843.0} {"train_loss": -27.116727828979492, "global_step": 537259, "epoch": 6473} {"train_loss": -25.22084617614746, "global_step": 537260, "epoch": 6473} {"train_loss": -24.005157470703125, "global_step": 537261, "epoch": 6473} {"train_loss": -26.717864990234375, "global_step": 537262, "epoch": 6473} {"train_loss": -26.013574600219727, "global_step": 537263, "epoch": 6473} {"train_loss": -26.41163444519043, "global_step": 537264, "epoch": 6473} {"train_loss": -26.133197784423828, "global_step": 537265, "epoch": 6473} {"train_loss": -26.216394424438477, "global_step": 537266, "epoch": 6473} {"train_loss": -26.953842163085938, "global_step": 537267, "epoch": 6473} {"train_loss": -26.739765167236328, "global_step": 537268, "epoch": 6473} {"train_loss": -26.742578506469727, "global_step": 537269, "epoch": 6473} {"train_loss": -26.886600494384766, "global_step": 537270, "epoch": 6473} {"train_loss": -26.646081924438477, "global_step": 537271, "epoch": 6473} {"train_loss": -26.991403579711914, "global_step": 537272, "epoch": 6473} {"train_loss": -26.98917007446289, "global_step": 537273, "epoch": 6473} {"train_loss": -27.086395263671875, "global_step": 537274, "epoch": 6473} {"train_loss": -26.87578773498535, "global_step": 537275, "epoch": 6473} {"train_loss": -27.140625, "global_step": 537276, "epoch": 6473} {"train_loss": -27.07771110534668, "global_step": 537277, "epoch": 6473} {"train_loss": -27.233551025390625, "global_step": 537278, "epoch": 6473} {"train_loss": -27.254718780517578, "global_step": 537279, "epoch": 6473} {"train_loss": -27.0656795501709, "global_step": 537280, "epoch": 6473} {"train_loss": -27.204944610595703, "global_step": 537281, "epoch": 6473} {"train_loss": -27.387680053710938, "global_step": 537282, "epoch": 6473} {"train_loss": -27.4627742767334, "global_step": 537283, "epoch": 6473} {"train_loss": -27.204864501953125, "global_step": 537284, "epoch": 6473} {"train_loss": -27.653961181640625, "global_step": 537285, "epoch": 6473} {"train_loss": -27.2670955657959, "global_step": 537286, "epoch": 6473} {"train_loss": -27.396453857421875, "global_step": 537287, "epoch": 6473} {"train_loss": -27.30999183654785, "global_step": 537288, "epoch": 6473} {"train_loss": -27.25250816345215, "global_step": 537289, "epoch": 6473} {"train_loss": -28.055728912353516, "global_step": 537290, "epoch": 6473} {"train_loss": -27.217132568359375, "global_step": 537291, "epoch": 6473} {"train_loss": -27.531097412109375, "global_step": 537292, "epoch": 6473} {"train_loss": -27.805770874023438, "global_step": 537293, "epoch": 6473} {"train_loss": -27.44182777404785, "global_step": 537294, "epoch": 6473} {"train_loss": -27.207569122314453, "global_step": 537295, "epoch": 6473} {"train_loss": -27.872217178344727, "global_step": 537296, "epoch": 6473} {"train_loss": -27.544641494750977, "global_step": 537297, "epoch": 6473} {"train_loss": -27.71026039123535, "global_step": 537298, "epoch": 6473} {"train_loss": -27.484670639038086, "global_step": 537299, "epoch": 6473} {"train_loss": -27.77581214904785, "global_step": 537300, "epoch": 6473} {"train_loss": -27.83815574645996, "global_step": 537301, "epoch": 6473} {"train_loss": -27.687213897705078, "global_step": 537302, "epoch": 6473} {"train_loss": -27.943286895751953, "global_step": 537303, "epoch": 6473} {"train_loss": -27.919214248657227, "global_step": 537304, "epoch": 6473} {"train_loss": -27.484989166259766, "global_step": 537305, "epoch": 6473} {"train_loss": -27.811182022094727, "global_step": 537306, "epoch": 6473} {"train_loss": -27.6988525390625, "global_step": 537307, "epoch": 6473} {"train_loss": -27.792448043823242, "global_step": 537308, "epoch": 6473} {"train_loss": -27.964282989501953, "global_step": 537309, "epoch": 6473} {"train_loss": -27.946638107299805, "global_step": 537310, "epoch": 6473} {"train_loss": -27.9947452545166, "global_step": 537311, "epoch": 6473} {"train_loss": -27.73826026916504, "global_step": 537312, "epoch": 6473} {"train_loss": -27.81446647644043, "global_step": 537313, "epoch": 6473} {"train_loss": -27.958356857299805, "global_step": 537314, "epoch": 6473} {"train_loss": -27.58512306213379, "global_step": 537315, "epoch": 6473} {"train_loss": -28.140735626220703, "global_step": 537316, "epoch": 6473} {"train_loss": -27.82208251953125, "global_step": 537317, "epoch": 6473} {"train_loss": -27.95021629333496, "global_step": 537318, "epoch": 6473} {"train_loss": -27.732269287109375, "global_step": 537319, "epoch": 6473} {"train_loss": -27.96286964416504, "global_step": 537320, "epoch": 6473} {"train_loss": -27.796649932861328, "global_step": 537321, "epoch": 6473} {"train_loss": -27.295255661010742, "global_step": 537322, "epoch": 6473} {"train_loss": -27.24639320373535, "global_step": 537323, "epoch": 6473} {"train_loss": -27.831815719604492, "global_step": 537324, "epoch": 6473} {"train_loss": -27.7285213470459, "global_step": 537325, "epoch": 6473} {"train_loss": -27.90101432800293, "global_step": 537326, "epoch": 6473} {"train_loss": -27.758169174194336, "global_step": 537327, "epoch": 6473} {"train_loss": -27.6809024810791, "global_step": 537328, "epoch": 6473} {"train_loss": -27.96305274963379, "global_step": 537329, "epoch": 6473} {"train_loss": -27.810867309570312, "global_step": 537330, "epoch": 6473} {"train_loss": -28.070539474487305, "global_step": 537331, "epoch": 6473} {"train_loss": -27.835962295532227, "global_step": 537332, "epoch": 6473} {"train_loss": -28.103185653686523, "global_step": 537333, "epoch": 6473} {"train_loss": -27.668594360351562, "global_step": 537334, "epoch": 6473} {"train_loss": -28.12681007385254, "global_step": 537335, "epoch": 6473} {"train_loss": -27.76389503479004, "global_step": 537336, "epoch": 6473} {"train_loss": -27.720754623413086, "global_step": 537337, "epoch": 6473} {"train_loss": -27.955663681030273, "global_step": 537338, "epoch": 6473} {"train_loss": -27.71197509765625, "global_step": 537339, "epoch": 6473} {"train_loss": -28.067901611328125, "global_step": 537340, "epoch": 6473} {"train_loss": -27.441822695444866, "global_step": 537341, "epoch": 6473, "val_loss": 6428243.0} {"train_loss": -27.020309448242188, "global_step": 537342, "epoch": 6474} {"train_loss": -26.818796157836914, "global_step": 537343, "epoch": 6474} {"train_loss": -26.164525985717773, "global_step": 537344, "epoch": 6474} {"train_loss": -27.373584747314453, "global_step": 537345, "epoch": 6474} {"train_loss": -27.666187286376953, "global_step": 537346, "epoch": 6474} {"train_loss": -27.4658145904541, "global_step": 537347, "epoch": 6474} {"train_loss": -27.37318992614746, "global_step": 537348, "epoch": 6474} {"train_loss": -27.78139305114746, "global_step": 537349, "epoch": 6474} {"train_loss": -27.587202072143555, "global_step": 537350, "epoch": 6474} {"train_loss": -27.028364181518555, "global_step": 537351, "epoch": 6474} {"train_loss": -27.377700805664062, "global_step": 537352, "epoch": 6474} {"train_loss": -27.396106719970703, "global_step": 537353, "epoch": 6474} {"train_loss": -27.31695556640625, "global_step": 537354, "epoch": 6474} {"train_loss": -27.728612899780273, "global_step": 537355, "epoch": 6474} {"train_loss": -27.459003448486328, "global_step": 537356, "epoch": 6474} {"train_loss": -27.54072380065918, "global_step": 537357, "epoch": 6474} {"train_loss": -27.91282081604004, "global_step": 537358, "epoch": 6474} {"train_loss": -27.6207218170166, "global_step": 537359, "epoch": 6474} {"train_loss": -27.635028839111328, "global_step": 537360, "epoch": 6474} {"train_loss": -27.61750602722168, "global_step": 537361, "epoch": 6474} {"train_loss": -27.43408203125, "global_step": 537362, "epoch": 6474} {"train_loss": -27.505069732666016, "global_step": 537363, "epoch": 6474} {"train_loss": -27.602842330932617, "global_step": 537364, "epoch": 6474} {"train_loss": -27.359516143798828, "global_step": 537365, "epoch": 6474} {"train_loss": -27.759756088256836, "global_step": 537366, "epoch": 6474} {"train_loss": -27.891345977783203, "global_step": 537367, "epoch": 6474} {"train_loss": -27.654571533203125, "global_step": 537368, "epoch": 6474} {"train_loss": -27.392297744750977, "global_step": 537369, "epoch": 6474} {"train_loss": -27.901229858398438, "global_step": 537370, "epoch": 6474} {"train_loss": -27.54388999938965, "global_step": 537371, "epoch": 6474} {"train_loss": -27.982213973999023, "global_step": 537372, "epoch": 6474} {"train_loss": -28.02182388305664, "global_step": 537373, "epoch": 6474} {"train_loss": -27.863935470581055, "global_step": 537374, "epoch": 6474} {"train_loss": -27.63214683532715, "global_step": 537375, "epoch": 6474} {"train_loss": -27.864673614501953, "global_step": 537376, "epoch": 6474} {"train_loss": -27.67352867126465, "global_step": 537377, "epoch": 6474} {"train_loss": -28.02777671813965, "global_step": 537378, "epoch": 6474} {"train_loss": -27.7620792388916, "global_step": 537379, "epoch": 6474} {"train_loss": -27.565214157104492, "global_step": 537380, "epoch": 6474} {"train_loss": -27.980560302734375, "global_step": 537381, "epoch": 6474} {"train_loss": -27.555479049682617, "global_step": 537382, "epoch": 6474} {"train_loss": -27.749181747436523, "global_step": 537383, "epoch": 6474} {"train_loss": -27.29078483581543, "global_step": 537384, "epoch": 6474} {"train_loss": -27.96283531188965, "global_step": 537385, "epoch": 6474} {"train_loss": -27.6285343170166, "global_step": 537386, "epoch": 6474} {"train_loss": -27.427534103393555, "global_step": 537387, "epoch": 6474} {"train_loss": -27.615097045898438, "global_step": 537388, "epoch": 6474} {"train_loss": -27.759784698486328, "global_step": 537389, "epoch": 6474} {"train_loss": -27.769750595092773, "global_step": 537390, "epoch": 6474} {"train_loss": -27.865447998046875, "global_step": 537391, "epoch": 6474} {"train_loss": -28.0139217376709, "global_step": 537392, "epoch": 6474} {"train_loss": -27.961273193359375, "global_step": 537393, "epoch": 6474} {"train_loss": -27.993183135986328, "global_step": 537394, "epoch": 6474} {"train_loss": -27.65875244140625, "global_step": 537395, "epoch": 6474} {"train_loss": -27.710205078125, "global_step": 537396, "epoch": 6474} {"train_loss": -27.830942153930664, "global_step": 537397, "epoch": 6474} {"train_loss": -27.844640731811523, "global_step": 537398, "epoch": 6474} {"train_loss": -27.5552978515625, "global_step": 537399, "epoch": 6474} {"train_loss": -27.84682273864746, "global_step": 537400, "epoch": 6474} {"train_loss": -28.066024780273438, "global_step": 537401, "epoch": 6474} {"train_loss": -27.861408233642578, "global_step": 537402, "epoch": 6474} {"train_loss": -27.682626724243164, "global_step": 537403, "epoch": 6474} {"train_loss": -27.59683609008789, "global_step": 537404, "epoch": 6474} {"train_loss": -27.67569923400879, "global_step": 537405, "epoch": 6474} {"train_loss": -27.925283432006836, "global_step": 537406, "epoch": 6474} {"train_loss": -28.01893424987793, "global_step": 537407, "epoch": 6474} {"train_loss": -27.64215087890625, "global_step": 537408, "epoch": 6474} {"train_loss": -27.89833641052246, "global_step": 537409, "epoch": 6474} {"train_loss": -27.6499080657959, "global_step": 537410, "epoch": 6474} {"train_loss": -27.914709091186523, "global_step": 537411, "epoch": 6474} {"train_loss": -27.61934471130371, "global_step": 537412, "epoch": 6474} {"train_loss": -27.299640655517578, "global_step": 537413, "epoch": 6474} {"train_loss": -27.136371612548828, "global_step": 537414, "epoch": 6474} {"train_loss": -26.94287109375, "global_step": 537415, "epoch": 6474} {"train_loss": -27.143646240234375, "global_step": 537416, "epoch": 6474} {"train_loss": -27.143163681030273, "global_step": 537417, "epoch": 6474} {"train_loss": -27.582746505737305, "global_step": 537418, "epoch": 6474} {"train_loss": -27.37542724609375, "global_step": 537419, "epoch": 6474} {"train_loss": -27.153722763061523, "global_step": 537420, "epoch": 6474} {"train_loss": -27.466510772705078, "global_step": 537421, "epoch": 6474} {"train_loss": -27.6895694732666, "global_step": 537422, "epoch": 6474} {"train_loss": -27.22893714904785, "global_step": 537423, "epoch": 6474} {"train_loss": -27.596535418407026, "global_step": 537424, "epoch": 6474, "val_loss": 6368033.5} {"train_loss": -26.78277587890625, "global_step": 537425, "epoch": 6475} {"train_loss": -27.19113540649414, "global_step": 537426, "epoch": 6475} {"train_loss": -27.338903427124023, "global_step": 537427, "epoch": 6475} {"train_loss": -26.80547523498535, "global_step": 537428, "epoch": 6475} {"train_loss": -26.849645614624023, "global_step": 537429, "epoch": 6475} {"train_loss": -26.495344161987305, "global_step": 537430, "epoch": 6475} {"train_loss": -27.108295440673828, "global_step": 537431, "epoch": 6475} {"train_loss": -27.241546630859375, "global_step": 537432, "epoch": 6475} {"train_loss": -26.88162612915039, "global_step": 537433, "epoch": 6475} {"train_loss": -27.07611083984375, "global_step": 537434, "epoch": 6475} {"train_loss": -27.38982582092285, "global_step": 537435, "epoch": 6475} {"train_loss": -27.377561569213867, "global_step": 537436, "epoch": 6475} {"train_loss": -27.022647857666016, "global_step": 537437, "epoch": 6475} {"train_loss": -26.56183433532715, "global_step": 537438, "epoch": 6475} {"train_loss": -26.275609970092773, "global_step": 537439, "epoch": 6475} {"train_loss": -27.523229598999023, "global_step": 537440, "epoch": 6475} {"train_loss": -26.615148544311523, "global_step": 537441, "epoch": 6475} {"train_loss": -27.466567993164062, "global_step": 537442, "epoch": 6475} {"train_loss": -27.071149826049805, "global_step": 537443, "epoch": 6475} {"train_loss": -27.1304988861084, "global_step": 537444, "epoch": 6475} {"train_loss": -27.349273681640625, "global_step": 537445, "epoch": 6475} {"train_loss": -27.122976303100586, "global_step": 537446, "epoch": 6475} {"train_loss": -27.390775680541992, "global_step": 537447, "epoch": 6475} {"train_loss": -27.453052520751953, "global_step": 537448, "epoch": 6475} {"train_loss": -27.52618408203125, "global_step": 537449, "epoch": 6475} {"train_loss": -27.34844398498535, "global_step": 537450, "epoch": 6475} {"train_loss": -27.69171714782715, "global_step": 537451, "epoch": 6475} {"train_loss": -27.535573959350586, "global_step": 537452, "epoch": 6475} {"train_loss": -27.329809188842773, "global_step": 537453, "epoch": 6475} {"train_loss": -27.524417877197266, "global_step": 537454, "epoch": 6475} {"train_loss": -27.569873809814453, "global_step": 537455, "epoch": 6475} {"train_loss": -27.327802658081055, "global_step": 537456, "epoch": 6475} {"train_loss": -27.728748321533203, "global_step": 537457, "epoch": 6475} {"train_loss": -27.54404640197754, "global_step": 537458, "epoch": 6475} {"train_loss": -27.694318771362305, "global_step": 537459, "epoch": 6475} {"train_loss": -27.600305557250977, "global_step": 537460, "epoch": 6475} {"train_loss": -27.690805435180664, "global_step": 537461, "epoch": 6475} {"train_loss": -27.647932052612305, "global_step": 537462, "epoch": 6475} {"train_loss": -27.422887802124023, "global_step": 537463, "epoch": 6475} {"train_loss": -27.5667724609375, "global_step": 537464, "epoch": 6475} {"train_loss": -27.51556396484375, "global_step": 537465, "epoch": 6475} {"train_loss": -27.822126388549805, "global_step": 537466, "epoch": 6475} {"train_loss": -27.565587997436523, "global_step": 537467, "epoch": 6475} {"train_loss": -27.423368453979492, "global_step": 537468, "epoch": 6475} {"train_loss": -27.79852294921875, "global_step": 537469, "epoch": 6475} {"train_loss": -27.174997329711914, "global_step": 537470, "epoch": 6475} {"train_loss": -27.72408103942871, "global_step": 537471, "epoch": 6475} {"train_loss": -27.7471981048584, "global_step": 537472, "epoch": 6475} {"train_loss": -27.802587509155273, "global_step": 537473, "epoch": 6475} {"train_loss": -27.71441078186035, "global_step": 537474, "epoch": 6475} {"train_loss": -27.674402236938477, "global_step": 537475, "epoch": 6475} {"train_loss": -27.557952880859375, "global_step": 537476, "epoch": 6475} {"train_loss": -27.9913387298584, "global_step": 537477, "epoch": 6475} {"train_loss": -27.66724967956543, "global_step": 537478, "epoch": 6475} {"train_loss": -27.511199951171875, "global_step": 537479, "epoch": 6475} {"train_loss": -27.738662719726562, "global_step": 537480, "epoch": 6475} {"train_loss": -27.492996215820312, "global_step": 537481, "epoch": 6475} {"train_loss": -27.812103271484375, "global_step": 537482, "epoch": 6475} {"train_loss": -28.028711318969727, "global_step": 537483, "epoch": 6475} {"train_loss": -27.840417861938477, "global_step": 537484, "epoch": 6475} {"train_loss": -28.349462509155273, "global_step": 537485, "epoch": 6475} {"train_loss": -27.858530044555664, "global_step": 537486, "epoch": 6475} {"train_loss": -27.696569442749023, "global_step": 537487, "epoch": 6475} {"train_loss": -27.54864501953125, "global_step": 537488, "epoch": 6475} {"train_loss": -27.77899742126465, "global_step": 537489, "epoch": 6475} {"train_loss": -27.936450958251953, "global_step": 537490, "epoch": 6475} {"train_loss": -28.070051193237305, "global_step": 537491, "epoch": 6475} {"train_loss": -27.4797306060791, "global_step": 537492, "epoch": 6475} {"train_loss": -27.74774742126465, "global_step": 537493, "epoch": 6475} {"train_loss": -27.518939971923828, "global_step": 537494, "epoch": 6475} {"train_loss": -27.97623634338379, "global_step": 537495, "epoch": 6475} {"train_loss": -27.67484474182129, "global_step": 537496, "epoch": 6475} {"train_loss": -28.026004791259766, "global_step": 537497, "epoch": 6475} {"train_loss": -27.758893966674805, "global_step": 537498, "epoch": 6475} {"train_loss": -27.919921875, "global_step": 537499, "epoch": 6475} {"train_loss": -27.814624786376953, "global_step": 537500, "epoch": 6475} {"train_loss": -27.463464736938477, "global_step": 537501, "epoch": 6475} {"train_loss": -27.42352867126465, "global_step": 537502, "epoch": 6475} {"train_loss": -27.619165420532227, "global_step": 537503, "epoch": 6475} {"train_loss": -27.583084106445312, "global_step": 537504, "epoch": 6475} {"train_loss": -27.618661880493164, "global_step": 537505, "epoch": 6475} {"train_loss": -27.273578643798828, "global_step": 537506, "epoch": 6475} {"train_loss": -27.494477076702807, "global_step": 537507, "epoch": 6475, "val_loss": 6417283.5} {"train_loss": -26.4899845123291, "global_step": 537508, "epoch": 6476} {"train_loss": -26.91153335571289, "global_step": 537509, "epoch": 6476} {"train_loss": -26.361066818237305, "global_step": 537510, "epoch": 6476} {"train_loss": -27.2736873626709, "global_step": 537511, "epoch": 6476} {"train_loss": -26.581892013549805, "global_step": 537512, "epoch": 6476} {"train_loss": -26.920679092407227, "global_step": 537513, "epoch": 6476} {"train_loss": -27.052804946899414, "global_step": 537514, "epoch": 6476} {"train_loss": -27.0037841796875, "global_step": 537515, "epoch": 6476} {"train_loss": -27.25860023498535, "global_step": 537516, "epoch": 6476} {"train_loss": -26.99375343322754, "global_step": 537517, "epoch": 6476} {"train_loss": -26.491857528686523, "global_step": 537518, "epoch": 6476} {"train_loss": -26.83684730529785, "global_step": 537519, "epoch": 6476} {"train_loss": -27.240234375, "global_step": 537520, "epoch": 6476} {"train_loss": -27.18716812133789, "global_step": 537521, "epoch": 6476} {"train_loss": -27.242666244506836, "global_step": 537522, "epoch": 6476} {"train_loss": -27.484710693359375, "global_step": 537523, "epoch": 6476} {"train_loss": -26.857315063476562, "global_step": 537524, "epoch": 6476} {"train_loss": -27.36054801940918, "global_step": 537525, "epoch": 6476} {"train_loss": -27.439096450805664, "global_step": 537526, "epoch": 6476} {"train_loss": -27.1468448638916, "global_step": 537527, "epoch": 6476} {"train_loss": -27.4424991607666, "global_step": 537528, "epoch": 6476} {"train_loss": -27.054147720336914, "global_step": 537529, "epoch": 6476} {"train_loss": -27.033283233642578, "global_step": 537530, "epoch": 6476} {"train_loss": -27.38605308532715, "global_step": 537531, "epoch": 6476} {"train_loss": -27.2106990814209, "global_step": 537532, "epoch": 6476} {"train_loss": -27.283374786376953, "global_step": 537533, "epoch": 6476} {"train_loss": -27.30181884765625, "global_step": 537534, "epoch": 6476} {"train_loss": -27.6032657623291, "global_step": 537535, "epoch": 6476} {"train_loss": -27.472265243530273, "global_step": 537536, "epoch": 6476} {"train_loss": -27.72967529296875, "global_step": 537537, "epoch": 6476} {"train_loss": -27.375659942626953, "global_step": 537538, "epoch": 6476} {"train_loss": -27.40582847595215, "global_step": 537539, "epoch": 6476} {"train_loss": -27.740253448486328, "global_step": 537540, "epoch": 6476} {"train_loss": -27.558286666870117, "global_step": 537541, "epoch": 6476} {"train_loss": -27.586820602416992, "global_step": 537542, "epoch": 6476} {"train_loss": -27.70307731628418, "global_step": 537543, "epoch": 6476} {"train_loss": -27.65308952331543, "global_step": 537544, "epoch": 6476} {"train_loss": -27.594690322875977, "global_step": 537545, "epoch": 6476} {"train_loss": -27.62506103515625, "global_step": 537546, "epoch": 6476} {"train_loss": -27.505598068237305, "global_step": 537547, "epoch": 6476} {"train_loss": -27.68863868713379, "global_step": 537548, "epoch": 6476} {"train_loss": -27.56709861755371, "global_step": 537549, "epoch": 6476} {"train_loss": -27.94243812561035, "global_step": 537550, "epoch": 6476} {"train_loss": -27.7530460357666, "global_step": 537551, "epoch": 6476} {"train_loss": -27.7901611328125, "global_step": 537552, "epoch": 6476} {"train_loss": -27.79249382019043, "global_step": 537553, "epoch": 6476} {"train_loss": -28.145177841186523, "global_step": 537554, "epoch": 6476} {"train_loss": -27.806812286376953, "global_step": 537555, "epoch": 6476} {"train_loss": -27.620336532592773, "global_step": 537556, "epoch": 6476} {"train_loss": -27.946340560913086, "global_step": 537557, "epoch": 6476} {"train_loss": -27.90053367614746, "global_step": 537558, "epoch": 6476} {"train_loss": -27.6494197845459, "global_step": 537559, "epoch": 6476} {"train_loss": -27.52324867248535, "global_step": 537560, "epoch": 6476} {"train_loss": -27.83108901977539, "global_step": 537561, "epoch": 6476} {"train_loss": -27.78838539123535, "global_step": 537562, "epoch": 6476} {"train_loss": -28.051288604736328, "global_step": 537563, "epoch": 6476} {"train_loss": -27.99248695373535, "global_step": 537564, "epoch": 6476} {"train_loss": -27.703292846679688, "global_step": 537565, "epoch": 6476} {"train_loss": -28.023900985717773, "global_step": 537566, "epoch": 6476} {"train_loss": -27.559141159057617, "global_step": 537567, "epoch": 6476} {"train_loss": -27.82612419128418, "global_step": 537568, "epoch": 6476} {"train_loss": -28.120452880859375, "global_step": 537569, "epoch": 6476} {"train_loss": -27.92812156677246, "global_step": 537570, "epoch": 6476} {"train_loss": -27.751646041870117, "global_step": 537571, "epoch": 6476} {"train_loss": -27.406110763549805, "global_step": 537572, "epoch": 6476} {"train_loss": -27.101215362548828, "global_step": 537573, "epoch": 6476} {"train_loss": -27.593748092651367, "global_step": 537574, "epoch": 6476} {"train_loss": -27.90500259399414, "global_step": 537575, "epoch": 6476} {"train_loss": -27.350605010986328, "global_step": 537576, "epoch": 6476} {"train_loss": -27.505456924438477, "global_step": 537577, "epoch": 6476} {"train_loss": -27.797269821166992, "global_step": 537578, "epoch": 6476} {"train_loss": -27.635456085205078, "global_step": 537579, "epoch": 6476} {"train_loss": -27.77638053894043, "global_step": 537580, "epoch": 6476} {"train_loss": -27.433008193969727, "global_step": 537581, "epoch": 6476} {"train_loss": -27.226133346557617, "global_step": 537582, "epoch": 6476} {"train_loss": -26.888843536376953, "global_step": 537583, "epoch": 6476} {"train_loss": -27.35357666015625, "global_step": 537584, "epoch": 6476} {"train_loss": -27.285192489624023, "global_step": 537585, "epoch": 6476} {"train_loss": -27.93214988708496, "global_step": 537586, "epoch": 6476} {"train_loss": -27.072484970092773, "global_step": 537587, "epoch": 6476} {"train_loss": -28.01449966430664, "global_step": 537588, "epoch": 6476} {"train_loss": -27.5274600982666, "global_step": 537589, "epoch": 6476} {"train_loss": -27.48333241566118, "global_step": 537590, "epoch": 6476, "val_loss": 6446265.0} {"train_loss": -27.054113388061523, "global_step": 537591, "epoch": 6477} {"train_loss": -27.157520294189453, "global_step": 537592, "epoch": 6477} {"train_loss": -27.146894454956055, "global_step": 537593, "epoch": 6477} {"train_loss": -27.691389083862305, "global_step": 537594, "epoch": 6477} {"train_loss": -27.285919189453125, "global_step": 537595, "epoch": 6477} {"train_loss": -27.279272079467773, "global_step": 537596, "epoch": 6477} {"train_loss": -27.502294540405273, "global_step": 537597, "epoch": 6477} {"train_loss": -27.08745765686035, "global_step": 537598, "epoch": 6477} {"train_loss": -27.66339111328125, "global_step": 537599, "epoch": 6477} {"train_loss": -27.492645263671875, "global_step": 537600, "epoch": 6477} {"train_loss": -27.221359252929688, "global_step": 537601, "epoch": 6477} {"train_loss": -27.575626373291016, "global_step": 537602, "epoch": 6477} {"train_loss": -27.423391342163086, "global_step": 537603, "epoch": 6477} {"train_loss": -27.49749755859375, "global_step": 537604, "epoch": 6477} {"train_loss": -27.515729904174805, "global_step": 537605, "epoch": 6477} {"train_loss": -27.221174240112305, "global_step": 537606, "epoch": 6477} {"train_loss": -27.498743057250977, "global_step": 537607, "epoch": 6477} {"train_loss": -27.725177764892578, "global_step": 537608, "epoch": 6477} {"train_loss": -27.661041259765625, "global_step": 537609, "epoch": 6477} {"train_loss": -27.424823760986328, "global_step": 537610, "epoch": 6477} {"train_loss": -27.86262321472168, "global_step": 537611, "epoch": 6477} {"train_loss": -27.532995223999023, "global_step": 537612, "epoch": 6477} {"train_loss": -27.863309860229492, "global_step": 537613, "epoch": 6477} {"train_loss": -27.798315048217773, "global_step": 537614, "epoch": 6477} {"train_loss": -27.724639892578125, "global_step": 537615, "epoch": 6477} {"train_loss": -27.60151481628418, "global_step": 537616, "epoch": 6477} {"train_loss": -27.80842399597168, "global_step": 537617, "epoch": 6477} {"train_loss": -27.75043296813965, "global_step": 537618, "epoch": 6477} {"train_loss": -27.83987808227539, "global_step": 537619, "epoch": 6477} {"train_loss": -27.890562057495117, "global_step": 537620, "epoch": 6477} {"train_loss": -27.71921157836914, "global_step": 537621, "epoch": 6477} {"train_loss": -27.54377555847168, "global_step": 537622, "epoch": 6477} {"train_loss": -27.583480834960938, "global_step": 537623, "epoch": 6477} {"train_loss": -27.76267433166504, "global_step": 537624, "epoch": 6477} {"train_loss": -27.005237579345703, "global_step": 537625, "epoch": 6477} {"train_loss": -27.34330177307129, "global_step": 537626, "epoch": 6477} {"train_loss": -26.924325942993164, "global_step": 537627, "epoch": 6477} {"train_loss": -27.049396514892578, "global_step": 537628, "epoch": 6477} {"train_loss": -27.1978759765625, "global_step": 537629, "epoch": 6477} {"train_loss": -27.740802764892578, "global_step": 537630, "epoch": 6477} {"train_loss": -27.697607040405273, "global_step": 537631, "epoch": 6477} {"train_loss": -27.898761749267578, "global_step": 537632, "epoch": 6477} {"train_loss": -27.549468994140625, "global_step": 537633, "epoch": 6477} {"train_loss": -27.83503532409668, "global_step": 537634, "epoch": 6477} {"train_loss": -27.908710479736328, "global_step": 537635, "epoch": 6477} {"train_loss": -27.96453857421875, "global_step": 537636, "epoch": 6477} {"train_loss": -27.7955322265625, "global_step": 537637, "epoch": 6477} {"train_loss": -27.90622901916504, "global_step": 537638, "epoch": 6477} {"train_loss": -27.65740394592285, "global_step": 537639, "epoch": 6477} {"train_loss": -28.32806396484375, "global_step": 537640, "epoch": 6477} {"train_loss": -27.645370483398438, "global_step": 537641, "epoch": 6477} {"train_loss": -27.757055282592773, "global_step": 537642, "epoch": 6477} {"train_loss": -27.51691246032715, "global_step": 537643, "epoch": 6477} {"train_loss": -27.375030517578125, "global_step": 537644, "epoch": 6477} {"train_loss": -28.058319091796875, "global_step": 537645, "epoch": 6477} {"train_loss": -27.544818878173828, "global_step": 537646, "epoch": 6477} {"train_loss": -27.59852409362793, "global_step": 537647, "epoch": 6477} {"train_loss": -27.94703483581543, "global_step": 537648, "epoch": 6477} {"train_loss": -27.618146896362305, "global_step": 537649, "epoch": 6477} {"train_loss": -27.585651397705078, "global_step": 537650, "epoch": 6477} {"train_loss": -27.663496017456055, "global_step": 537651, "epoch": 6477} {"train_loss": -27.81685447692871, "global_step": 537652, "epoch": 6477} {"train_loss": -27.581029891967773, "global_step": 537653, "epoch": 6477} {"train_loss": -27.845645904541016, "global_step": 537654, "epoch": 6477} {"train_loss": -27.877634048461914, "global_step": 537655, "epoch": 6477} {"train_loss": -28.02728843688965, "global_step": 537656, "epoch": 6477} {"train_loss": -27.971288681030273, "global_step": 537657, "epoch": 6477} {"train_loss": -27.52604103088379, "global_step": 537658, "epoch": 6477} {"train_loss": -27.63632583618164, "global_step": 537659, "epoch": 6477} {"train_loss": -28.001007080078125, "global_step": 537660, "epoch": 6477} {"train_loss": -28.160375595092773, "global_step": 537661, "epoch": 6477} {"train_loss": -27.819660186767578, "global_step": 537662, "epoch": 6477} {"train_loss": -27.663227081298828, "global_step": 537663, "epoch": 6477} {"train_loss": -27.29912757873535, "global_step": 537664, "epoch": 6477} {"train_loss": -26.409748077392578, "global_step": 537665, "epoch": 6477} {"train_loss": -26.714811325073242, "global_step": 537666, "epoch": 6477} {"train_loss": -27.567724227905273, "global_step": 537667, "epoch": 6477} {"train_loss": -27.16346549987793, "global_step": 537668, "epoch": 6477} {"train_loss": -26.6024169921875, "global_step": 537669, "epoch": 6477} {"train_loss": -26.51272964477539, "global_step": 537670, "epoch": 6477} {"train_loss": -26.48910903930664, "global_step": 537671, "epoch": 6477} {"train_loss": -26.197778701782227, "global_step": 537672, "epoch": 6477} {"train_loss": -27.513564443013752, "global_step": 537673, "epoch": 6477, "val_loss": 6430286.0} {"train_loss": -25.898426055908203, "global_step": 537674, "epoch": 6478} {"train_loss": -26.162353515625, "global_step": 537675, "epoch": 6478} {"train_loss": -26.37372398376465, "global_step": 537676, "epoch": 6478} {"train_loss": -26.15484046936035, "global_step": 537677, "epoch": 6478} {"train_loss": -26.59893226623535, "global_step": 537678, "epoch": 6478} {"train_loss": -26.310474395751953, "global_step": 537679, "epoch": 6478} {"train_loss": -26.905517578125, "global_step": 537680, "epoch": 6478} {"train_loss": -26.408048629760742, "global_step": 537681, "epoch": 6478} {"train_loss": -26.842514038085938, "global_step": 537682, "epoch": 6478} {"train_loss": -26.742023468017578, "global_step": 537683, "epoch": 6478} {"train_loss": -26.585676193237305, "global_step": 537684, "epoch": 6478} {"train_loss": -26.340917587280273, "global_step": 537685, "epoch": 6478} {"train_loss": -26.817108154296875, "global_step": 537686, "epoch": 6478} {"train_loss": -26.84244155883789, "global_step": 537687, "epoch": 6478} {"train_loss": -26.697118759155273, "global_step": 537688, "epoch": 6478} {"train_loss": -27.29217529296875, "global_step": 537689, "epoch": 6478} {"train_loss": -27.35523796081543, "global_step": 537690, "epoch": 6478} {"train_loss": -26.8861083984375, "global_step": 537691, "epoch": 6478} {"train_loss": -27.32512855529785, "global_step": 537692, "epoch": 6478} {"train_loss": -26.940427780151367, "global_step": 537693, "epoch": 6478} {"train_loss": -26.989490509033203, "global_step": 537694, "epoch": 6478} {"train_loss": -27.32421875, "global_step": 537695, "epoch": 6478} {"train_loss": -27.347015380859375, "global_step": 537696, "epoch": 6478} {"train_loss": -27.43857765197754, "global_step": 537697, "epoch": 6478} {"train_loss": -27.435134887695312, "global_step": 537698, "epoch": 6478} {"train_loss": -27.111907958984375, "global_step": 537699, "epoch": 6478} {"train_loss": -27.307214736938477, "global_step": 537700, "epoch": 6478} {"train_loss": -27.374530792236328, "global_step": 537701, "epoch": 6478} {"train_loss": -27.6263370513916, "global_step": 537702, "epoch": 6478} {"train_loss": -27.511335372924805, "global_step": 537703, "epoch": 6478} {"train_loss": -27.304479598999023, "global_step": 537704, "epoch": 6478} {"train_loss": -27.794004440307617, "global_step": 537705, "epoch": 6478} {"train_loss": -27.376310348510742, "global_step": 537706, "epoch": 6478} {"train_loss": -27.624755859375, "global_step": 537707, "epoch": 6478} {"train_loss": -27.198530197143555, "global_step": 537708, "epoch": 6478} {"train_loss": -27.61404800415039, "global_step": 537709, "epoch": 6478} {"train_loss": -27.766427993774414, "global_step": 537710, "epoch": 6478} {"train_loss": -27.355976104736328, "global_step": 537711, "epoch": 6478} {"train_loss": -27.784696578979492, "global_step": 537712, "epoch": 6478} {"train_loss": -27.26513671875, "global_step": 537713, "epoch": 6478} {"train_loss": -27.550373077392578, "global_step": 537714, "epoch": 6478} {"train_loss": -27.526830673217773, "global_step": 537715, "epoch": 6478} {"train_loss": -27.207107543945312, "global_step": 537716, "epoch": 6478} {"train_loss": -27.326162338256836, "global_step": 537717, "epoch": 6478} {"train_loss": -27.82132911682129, "global_step": 537718, "epoch": 6478} {"train_loss": -27.386886596679688, "global_step": 537719, "epoch": 6478} {"train_loss": -27.539602279663086, "global_step": 537720, "epoch": 6478} {"train_loss": -27.732654571533203, "global_step": 537721, "epoch": 6478} {"train_loss": -27.604978561401367, "global_step": 537722, "epoch": 6478} {"train_loss": -27.466632843017578, "global_step": 537723, "epoch": 6478} {"train_loss": -27.747222900390625, "global_step": 537724, "epoch": 6478} {"train_loss": -27.890792846679688, "global_step": 537725, "epoch": 6478} {"train_loss": -27.958866119384766, "global_step": 537726, "epoch": 6478} {"train_loss": -27.883804321289062, "global_step": 537727, "epoch": 6478} {"train_loss": -27.545812606811523, "global_step": 537728, "epoch": 6478} {"train_loss": -27.206518173217773, "global_step": 537729, "epoch": 6478} {"train_loss": -27.250701904296875, "global_step": 537730, "epoch": 6478} {"train_loss": -27.73333168029785, "global_step": 537731, "epoch": 6478} {"train_loss": -27.723066329956055, "global_step": 537732, "epoch": 6478} {"train_loss": -27.537139892578125, "global_step": 537733, "epoch": 6478} {"train_loss": -27.806676864624023, "global_step": 537734, "epoch": 6478} {"train_loss": -27.665546417236328, "global_step": 537735, "epoch": 6478} {"train_loss": -28.07843017578125, "global_step": 537736, "epoch": 6478} {"train_loss": -27.806970596313477, "global_step": 537737, "epoch": 6478} {"train_loss": -27.5760498046875, "global_step": 537738, "epoch": 6478} {"train_loss": -27.613306045532227, "global_step": 537739, "epoch": 6478} {"train_loss": -27.742923736572266, "global_step": 537740, "epoch": 6478} {"train_loss": -27.539289474487305, "global_step": 537741, "epoch": 6478} {"train_loss": -27.856149673461914, "global_step": 537742, "epoch": 6478} {"train_loss": -27.372766494750977, "global_step": 537743, "epoch": 6478} {"train_loss": -27.465192794799805, "global_step": 537744, "epoch": 6478} {"train_loss": -27.508529663085938, "global_step": 537745, "epoch": 6478} {"train_loss": -27.609949111938477, "global_step": 537746, "epoch": 6478} {"train_loss": -27.57105827331543, "global_step": 537747, "epoch": 6478} {"train_loss": -27.974706649780273, "global_step": 537748, "epoch": 6478} {"train_loss": -27.8825626373291, "global_step": 537749, "epoch": 6478} {"train_loss": -27.821704864501953, "global_step": 537750, "epoch": 6478} {"train_loss": -27.417434692382812, "global_step": 537751, "epoch": 6478} {"train_loss": -27.72165298461914, "global_step": 537752, "epoch": 6478} {"train_loss": -27.951095581054688, "global_step": 537753, "epoch": 6478} {"train_loss": -28.04766273498535, "global_step": 537754, "epoch": 6478} {"train_loss": -27.69243812561035, "global_step": 537755, "epoch": 6478} {"train_loss": -27.371264285351856, "global_step": 537756, "epoch": 6478, "val_loss": 6496226.0} {"train_loss": -27.064197540283203, "global_step": 537757, "epoch": 6479} {"train_loss": -26.575204849243164, "global_step": 537758, "epoch": 6479} {"train_loss": -26.448944091796875, "global_step": 537759, "epoch": 6479} {"train_loss": -26.788923263549805, "global_step": 537760, "epoch": 6479} {"train_loss": -26.7185001373291, "global_step": 537761, "epoch": 6479} {"train_loss": -26.552459716796875, "global_step": 537762, "epoch": 6479} {"train_loss": -26.98042869567871, "global_step": 537763, "epoch": 6479} {"train_loss": -26.779905319213867, "global_step": 537764, "epoch": 6479} {"train_loss": -27.02776527404785, "global_step": 537765, "epoch": 6479} {"train_loss": -27.09638023376465, "global_step": 537766, "epoch": 6479} {"train_loss": -27.133649826049805, "global_step": 537767, "epoch": 6479} {"train_loss": -27.00244140625, "global_step": 537768, "epoch": 6479} {"train_loss": -27.196943283081055, "global_step": 537769, "epoch": 6479} {"train_loss": -26.725101470947266, "global_step": 537770, "epoch": 6479} {"train_loss": -27.187612533569336, "global_step": 537771, "epoch": 6479} {"train_loss": -27.458759307861328, "global_step": 537772, "epoch": 6479} {"train_loss": -27.294559478759766, "global_step": 537773, "epoch": 6479} {"train_loss": -27.1142635345459, "global_step": 537774, "epoch": 6479} {"train_loss": -27.3367919921875, "global_step": 537775, "epoch": 6479} {"train_loss": -27.008787155151367, "global_step": 537776, "epoch": 6479} {"train_loss": -27.376745223999023, "global_step": 537777, "epoch": 6479} {"train_loss": -27.488183975219727, "global_step": 537778, "epoch": 6479} {"train_loss": -27.225751876831055, "global_step": 537779, "epoch": 6479} {"train_loss": -27.4969482421875, "global_step": 537780, "epoch": 6479} {"train_loss": -27.48517417907715, "global_step": 537781, "epoch": 6479} {"train_loss": -27.50855827331543, "global_step": 537782, "epoch": 6479} {"train_loss": -26.997053146362305, "global_step": 537783, "epoch": 6479} {"train_loss": -27.53767204284668, "global_step": 537784, "epoch": 6479} {"train_loss": -27.392993927001953, "global_step": 537785, "epoch": 6479} {"train_loss": -27.445880889892578, "global_step": 537786, "epoch": 6479} {"train_loss": -27.506885528564453, "global_step": 537787, "epoch": 6479} {"train_loss": -27.683557510375977, "global_step": 537788, "epoch": 6479} {"train_loss": -27.676990509033203, "global_step": 537789, "epoch": 6479} {"train_loss": -27.786102294921875, "global_step": 537790, "epoch": 6479} {"train_loss": -27.42510986328125, "global_step": 537791, "epoch": 6479} {"train_loss": -27.715662002563477, "global_step": 537792, "epoch": 6479} {"train_loss": -27.6192626953125, "global_step": 537793, "epoch": 6479} {"train_loss": -27.737470626831055, "global_step": 537794, "epoch": 6479} {"train_loss": -27.914758682250977, "global_step": 537795, "epoch": 6479} {"train_loss": -27.620563507080078, "global_step": 537796, "epoch": 6479} {"train_loss": -27.5799617767334, "global_step": 537797, "epoch": 6479} {"train_loss": -27.56898307800293, "global_step": 537798, "epoch": 6479} {"train_loss": -27.845733642578125, "global_step": 537799, "epoch": 6479} {"train_loss": -27.72245216369629, "global_step": 537800, "epoch": 6479} {"train_loss": -27.661609649658203, "global_step": 537801, "epoch": 6479} {"train_loss": -27.87064552307129, "global_step": 537802, "epoch": 6479} {"train_loss": -27.46286392211914, "global_step": 537803, "epoch": 6479} {"train_loss": -27.818347930908203, "global_step": 537804, "epoch": 6479} {"train_loss": -27.841028213500977, "global_step": 537805, "epoch": 6479} {"train_loss": -27.798797607421875, "global_step": 537806, "epoch": 6479} {"train_loss": -27.81162452697754, "global_step": 537807, "epoch": 6479} {"train_loss": -27.73687171936035, "global_step": 537808, "epoch": 6479} {"train_loss": -27.8955020904541, "global_step": 537809, "epoch": 6479} {"train_loss": -27.579076766967773, "global_step": 537810, "epoch": 6479} {"train_loss": -27.632226943969727, "global_step": 537811, "epoch": 6479} {"train_loss": -28.01959228515625, "global_step": 537812, "epoch": 6479} {"train_loss": -27.828466415405273, "global_step": 537813, "epoch": 6479} {"train_loss": -27.93364906311035, "global_step": 537814, "epoch": 6479} {"train_loss": -27.994226455688477, "global_step": 537815, "epoch": 6479} {"train_loss": -27.921483993530273, "global_step": 537816, "epoch": 6479} {"train_loss": -28.082294464111328, "global_step": 537817, "epoch": 6479} {"train_loss": -27.793766021728516, "global_step": 537818, "epoch": 6479} {"train_loss": -28.095260620117188, "global_step": 537819, "epoch": 6479} {"train_loss": -27.89447021484375, "global_step": 537820, "epoch": 6479} {"train_loss": -28.08182716369629, "global_step": 537821, "epoch": 6479} {"train_loss": -28.0463809967041, "global_step": 537822, "epoch": 6479} {"train_loss": -28.331445693969727, "global_step": 537823, "epoch": 6479} {"train_loss": -27.649194717407227, "global_step": 537824, "epoch": 6479} {"train_loss": -28.086801528930664, "global_step": 537825, "epoch": 6479} {"train_loss": -27.695714950561523, "global_step": 537826, "epoch": 6479} {"train_loss": -28.188657760620117, "global_step": 537827, "epoch": 6479} {"train_loss": -27.755475997924805, "global_step": 537828, "epoch": 6479} {"train_loss": -28.0428466796875, "global_step": 537829, "epoch": 6479} {"train_loss": -27.97028160095215, "global_step": 537830, "epoch": 6479} {"train_loss": -27.892074584960938, "global_step": 537831, "epoch": 6479} {"train_loss": -27.888227462768555, "global_step": 537832, "epoch": 6479} {"train_loss": -27.679365158081055, "global_step": 537833, "epoch": 6479} {"train_loss": -27.720067977905273, "global_step": 537834, "epoch": 6479} {"train_loss": -27.49448585510254, "global_step": 537835, "epoch": 6479} {"train_loss": -27.91156005859375, "global_step": 537836, "epoch": 6479} {"train_loss": -27.618377685546875, "global_step": 537837, "epoch": 6479} {"train_loss": -26.635522842407227, "global_step": 537838, "epoch": 6479} {"train_loss": -27.50058863536421, "global_step": 537839, "epoch": 6479, "val_loss": 6398446.0} {"train_loss": -24.685258865356445, "global_step": 537840, "epoch": 6480} {"train_loss": -23.574432373046875, "global_step": 537841, "epoch": 6480} {"train_loss": -24.643293380737305, "global_step": 537842, "epoch": 6480} {"train_loss": -22.358922958374023, "global_step": 537843, "epoch": 6480} {"train_loss": -24.566883087158203, "global_step": 537844, "epoch": 6480} {"train_loss": -24.412595748901367, "global_step": 537845, "epoch": 6480} {"train_loss": -24.94454002380371, "global_step": 537846, "epoch": 6480} {"train_loss": -25.323978424072266, "global_step": 537847, "epoch": 6480} {"train_loss": -25.895069122314453, "global_step": 537848, "epoch": 6480} {"train_loss": -25.41675567626953, "global_step": 537849, "epoch": 6480} {"train_loss": -25.79640007019043, "global_step": 537850, "epoch": 6480} {"train_loss": -25.585264205932617, "global_step": 537851, "epoch": 6480} {"train_loss": -25.954355239868164, "global_step": 537852, "epoch": 6480} {"train_loss": -25.760650634765625, "global_step": 537853, "epoch": 6480} {"train_loss": -25.673721313476562, "global_step": 537854, "epoch": 6480} {"train_loss": -25.74651527404785, "global_step": 537855, "epoch": 6480} {"train_loss": -26.305866241455078, "global_step": 537856, "epoch": 6480} {"train_loss": -26.075702667236328, "global_step": 537857, "epoch": 6480} {"train_loss": -25.76580238342285, "global_step": 537858, "epoch": 6480} {"train_loss": -26.6188907623291, "global_step": 537859, "epoch": 6480} {"train_loss": -26.20344352722168, "global_step": 537860, "epoch": 6480} {"train_loss": -26.29631996154785, "global_step": 537861, "epoch": 6480} {"train_loss": -26.0738525390625, "global_step": 537862, "epoch": 6480} {"train_loss": -26.653417587280273, "global_step": 537863, "epoch": 6480} {"train_loss": -25.97535514831543, "global_step": 537864, "epoch": 6480} {"train_loss": -26.605213165283203, "global_step": 537865, "epoch": 6480} {"train_loss": -26.51055335998535, "global_step": 537866, "epoch": 6480} {"train_loss": -26.380212783813477, "global_step": 537867, "epoch": 6480} {"train_loss": -26.252355575561523, "global_step": 537868, "epoch": 6480} {"train_loss": -26.84153175354004, "global_step": 537869, "epoch": 6480} {"train_loss": -26.795001983642578, "global_step": 537870, "epoch": 6480} {"train_loss": -26.591596603393555, "global_step": 537871, "epoch": 6480} {"train_loss": -26.518218994140625, "global_step": 537872, "epoch": 6480} {"train_loss": -26.810083389282227, "global_step": 537873, "epoch": 6480} {"train_loss": -26.583837509155273, "global_step": 537874, "epoch": 6480} {"train_loss": -27.106983184814453, "global_step": 537875, "epoch": 6480} {"train_loss": -26.734359741210938, "global_step": 537876, "epoch": 6480} {"train_loss": -27.088958740234375, "global_step": 537877, "epoch": 6480} {"train_loss": -27.0617618560791, "global_step": 537878, "epoch": 6480} {"train_loss": -27.193939208984375, "global_step": 537879, "epoch": 6480} {"train_loss": -26.906469345092773, "global_step": 537880, "epoch": 6480} {"train_loss": -26.878400802612305, "global_step": 537881, "epoch": 6480} {"train_loss": -27.018203735351562, "global_step": 537882, "epoch": 6480} {"train_loss": -27.038944244384766, "global_step": 537883, "epoch": 6480} {"train_loss": -27.169879913330078, "global_step": 537884, "epoch": 6480} {"train_loss": -27.2279052734375, "global_step": 537885, "epoch": 6480} {"train_loss": -27.19923210144043, "global_step": 537886, "epoch": 6480} {"train_loss": -27.213972091674805, "global_step": 537887, "epoch": 6480} {"train_loss": -26.97646141052246, "global_step": 537888, "epoch": 6480} {"train_loss": -27.568084716796875, "global_step": 537889, "epoch": 6480} {"train_loss": -27.00905418395996, "global_step": 537890, "epoch": 6480} {"train_loss": -27.396215438842773, "global_step": 537891, "epoch": 6480} {"train_loss": -27.55390739440918, "global_step": 537892, "epoch": 6480} {"train_loss": -27.55072021484375, "global_step": 537893, "epoch": 6480} {"train_loss": -27.274124145507812, "global_step": 537894, "epoch": 6480} {"train_loss": -27.528457641601562, "global_step": 537895, "epoch": 6480} {"train_loss": -27.73066520690918, "global_step": 537896, "epoch": 6480} {"train_loss": -27.626529693603516, "global_step": 537897, "epoch": 6480} {"train_loss": -27.187646865844727, "global_step": 537898, "epoch": 6480} {"train_loss": -27.60807228088379, "global_step": 537899, "epoch": 6480} {"train_loss": -27.387502670288086, "global_step": 537900, "epoch": 6480} {"train_loss": -27.493682861328125, "global_step": 537901, "epoch": 6480} {"train_loss": -27.652896881103516, "global_step": 537902, "epoch": 6480} {"train_loss": -27.75750732421875, "global_step": 537903, "epoch": 6480} {"train_loss": -27.520984649658203, "global_step": 537904, "epoch": 6480} {"train_loss": -27.56202507019043, "global_step": 537905, "epoch": 6480} {"train_loss": -27.81882095336914, "global_step": 537906, "epoch": 6480} {"train_loss": -27.806232452392578, "global_step": 537907, "epoch": 6480} {"train_loss": -27.724079132080078, "global_step": 537908, "epoch": 6480} {"train_loss": -27.946399688720703, "global_step": 537909, "epoch": 6480} {"train_loss": -27.763227462768555, "global_step": 537910, "epoch": 6480} {"train_loss": -27.514026641845703, "global_step": 537911, "epoch": 6480} {"train_loss": -27.8568058013916, "global_step": 537912, "epoch": 6480} {"train_loss": -27.6553955078125, "global_step": 537913, "epoch": 6480} {"train_loss": -27.528671264648438, "global_step": 537914, "epoch": 6480} {"train_loss": -27.611042022705078, "global_step": 537915, "epoch": 6480} {"train_loss": -27.56251335144043, "global_step": 537916, "epoch": 6480} {"train_loss": -27.495588302612305, "global_step": 537917, "epoch": 6480} {"train_loss": -27.515228271484375, "global_step": 537918, "epoch": 6480} {"train_loss": -27.819135665893555, "global_step": 537919, "epoch": 6480} {"train_loss": -27.3565731048584, "global_step": 537920, "epoch": 6480} {"train_loss": -27.60456657409668, "global_step": 537921, "epoch": 6480} {"train_loss": -26.731385288468328, "global_step": 537922, "epoch": 6480, "val_loss": 6466643.0} {"train_loss": -27.029037475585938, "global_step": 537923, "epoch": 6481} {"train_loss": -26.692480087280273, "global_step": 537924, "epoch": 6481} {"train_loss": -27.30427360534668, "global_step": 537925, "epoch": 6481} {"train_loss": -27.075925827026367, "global_step": 537926, "epoch": 6481} {"train_loss": -26.53546142578125, "global_step": 537927, "epoch": 6481} {"train_loss": -27.217487335205078, "global_step": 537928, "epoch": 6481} {"train_loss": -27.137866973876953, "global_step": 537929, "epoch": 6481} {"train_loss": -26.71719741821289, "global_step": 537930, "epoch": 6481} {"train_loss": -27.161441802978516, "global_step": 537931, "epoch": 6481} {"train_loss": -26.26215934753418, "global_step": 537932, "epoch": 6481} {"train_loss": -26.8509578704834, "global_step": 537933, "epoch": 6481} {"train_loss": -26.994672775268555, "global_step": 537934, "epoch": 6481} {"train_loss": -26.82328224182129, "global_step": 537935, "epoch": 6481} {"train_loss": -27.23292350769043, "global_step": 537936, "epoch": 6481} {"train_loss": -27.049856185913086, "global_step": 537937, "epoch": 6481} {"train_loss": -27.1762752532959, "global_step": 537938, "epoch": 6481} {"train_loss": -27.365278244018555, "global_step": 537939, "epoch": 6481} {"train_loss": -27.146223068237305, "global_step": 537940, "epoch": 6481} {"train_loss": -27.60675621032715, "global_step": 537941, "epoch": 6481} {"train_loss": -27.380353927612305, "global_step": 537942, "epoch": 6481} {"train_loss": -27.557214736938477, "global_step": 537943, "epoch": 6481} {"train_loss": -27.52093505859375, "global_step": 537944, "epoch": 6481} {"train_loss": -27.401229858398438, "global_step": 537945, "epoch": 6481} {"train_loss": -27.261962890625, "global_step": 537946, "epoch": 6481} {"train_loss": -27.27363395690918, "global_step": 537947, "epoch": 6481} {"train_loss": -27.685556411743164, "global_step": 537948, "epoch": 6481} {"train_loss": -27.153512954711914, "global_step": 537949, "epoch": 6481} {"train_loss": -27.28898048400879, "global_step": 537950, "epoch": 6481} {"train_loss": -27.193777084350586, "global_step": 537951, "epoch": 6481} {"train_loss": -27.717920303344727, "global_step": 537952, "epoch": 6481} {"train_loss": -27.023290634155273, "global_step": 537953, "epoch": 6481} {"train_loss": -27.656696319580078, "global_step": 537954, "epoch": 6481} {"train_loss": -27.399206161499023, "global_step": 537955, "epoch": 6481} {"train_loss": -27.84278678894043, "global_step": 537956, "epoch": 6481} {"train_loss": -27.426040649414062, "global_step": 537957, "epoch": 6481} {"train_loss": -27.760196685791016, "global_step": 537958, "epoch": 6481} {"train_loss": -27.531400680541992, "global_step": 537959, "epoch": 6481} {"train_loss": -27.522113800048828, "global_step": 537960, "epoch": 6481} {"train_loss": -27.566747665405273, "global_step": 537961, "epoch": 6481} {"train_loss": -27.664154052734375, "global_step": 537962, "epoch": 6481} {"train_loss": -27.613019943237305, "global_step": 537963, "epoch": 6481} {"train_loss": -27.80674171447754, "global_step": 537964, "epoch": 6481} {"train_loss": -27.892597198486328, "global_step": 537965, "epoch": 6481} {"train_loss": -27.586318969726562, "global_step": 537966, "epoch": 6481} {"train_loss": -27.784963607788086, "global_step": 537967, "epoch": 6481} {"train_loss": -27.994211196899414, "global_step": 537968, "epoch": 6481} {"train_loss": -27.709091186523438, "global_step": 537969, "epoch": 6481} {"train_loss": -27.82440757751465, "global_step": 537970, "epoch": 6481} {"train_loss": -28.023212432861328, "global_step": 537971, "epoch": 6481} {"train_loss": -27.905303955078125, "global_step": 537972, "epoch": 6481} {"train_loss": -27.646772384643555, "global_step": 537973, "epoch": 6481} {"train_loss": -27.38116455078125, "global_step": 537974, "epoch": 6481} {"train_loss": -27.644041061401367, "global_step": 537975, "epoch": 6481} {"train_loss": -27.779706954956055, "global_step": 537976, "epoch": 6481} {"train_loss": -28.089584350585938, "global_step": 537977, "epoch": 6481} {"train_loss": -27.613779067993164, "global_step": 537978, "epoch": 6481} {"train_loss": -27.661420822143555, "global_step": 537979, "epoch": 6481} {"train_loss": -27.89188575744629, "global_step": 537980, "epoch": 6481} {"train_loss": -27.775836944580078, "global_step": 537981, "epoch": 6481} {"train_loss": -27.845264434814453, "global_step": 537982, "epoch": 6481} {"train_loss": -27.521392822265625, "global_step": 537983, "epoch": 6481} {"train_loss": -27.760635375976562, "global_step": 537984, "epoch": 6481} {"train_loss": -27.718231201171875, "global_step": 537985, "epoch": 6481} {"train_loss": -27.915952682495117, "global_step": 537986, "epoch": 6481} {"train_loss": -27.891117095947266, "global_step": 537987, "epoch": 6481} {"train_loss": -27.651086807250977, "global_step": 537988, "epoch": 6481} {"train_loss": -27.752389907836914, "global_step": 537989, "epoch": 6481} {"train_loss": -27.781513214111328, "global_step": 537990, "epoch": 6481} {"train_loss": -27.588153839111328, "global_step": 537991, "epoch": 6481} {"train_loss": -28.107587814331055, "global_step": 537992, "epoch": 6481} {"train_loss": -27.675952911376953, "global_step": 537993, "epoch": 6481} {"train_loss": -28.054325103759766, "global_step": 537994, "epoch": 6481} {"train_loss": -27.369720458984375, "global_step": 537995, "epoch": 6481} {"train_loss": -27.574384689331055, "global_step": 537996, "epoch": 6481} {"train_loss": -28.1723575592041, "global_step": 537997, "epoch": 6481} {"train_loss": -27.01725196838379, "global_step": 537998, "epoch": 6481} {"train_loss": -27.10110855102539, "global_step": 537999, "epoch": 6481} {"train_loss": -27.31171226501465, "global_step": 538000, "epoch": 6481} {"train_loss": -27.745452880859375, "global_step": 538001, "epoch": 6481} {"train_loss": -27.665943145751953, "global_step": 538002, "epoch": 6481} {"train_loss": -27.57275390625, "global_step": 538003, "epoch": 6481} {"train_loss": -27.702600479125977, "global_step": 538004, "epoch": 6481} {"train_loss": -27.506179878510626, "global_step": 538005, "epoch": 6481, "val_loss": 6420792.0} {"train_loss": -25.718347549438477, "global_step": 538006, "epoch": 6482} {"train_loss": -26.061254501342773, "global_step": 538007, "epoch": 6482} {"train_loss": -27.087263107299805, "global_step": 538008, "epoch": 6482} {"train_loss": -26.526187896728516, "global_step": 538009, "epoch": 6482} {"train_loss": -26.651586532592773, "global_step": 538010, "epoch": 6482} {"train_loss": -26.859088897705078, "global_step": 538011, "epoch": 6482} {"train_loss": -26.60572624206543, "global_step": 538012, "epoch": 6482} {"train_loss": -26.778310775756836, "global_step": 538013, "epoch": 6482} {"train_loss": -26.647247314453125, "global_step": 538014, "epoch": 6482} {"train_loss": -26.589298248291016, "global_step": 538015, "epoch": 6482} {"train_loss": -26.641132354736328, "global_step": 538016, "epoch": 6482} {"train_loss": -26.970706939697266, "global_step": 538017, "epoch": 6482} {"train_loss": -26.975067138671875, "global_step": 538018, "epoch": 6482} {"train_loss": -26.910669326782227, "global_step": 538019, "epoch": 6482} {"train_loss": -26.866907119750977, "global_step": 538020, "epoch": 6482} {"train_loss": -27.214920043945312, "global_step": 538021, "epoch": 6482} {"train_loss": -27.062238693237305, "global_step": 538022, "epoch": 6482} {"train_loss": -26.90154457092285, "global_step": 538023, "epoch": 6482} {"train_loss": -27.021636962890625, "global_step": 538024, "epoch": 6482} {"train_loss": -27.022491455078125, "global_step": 538025, "epoch": 6482} {"train_loss": -27.579547882080078, "global_step": 538026, "epoch": 6482} {"train_loss": -27.073577880859375, "global_step": 538027, "epoch": 6482} {"train_loss": -26.970935821533203, "global_step": 538028, "epoch": 6482} {"train_loss": -27.41424560546875, "global_step": 538029, "epoch": 6482} {"train_loss": -27.469684600830078, "global_step": 538030, "epoch": 6482} {"train_loss": -27.593637466430664, "global_step": 538031, "epoch": 6482} {"train_loss": -27.20538902282715, "global_step": 538032, "epoch": 6482} {"train_loss": -26.754125595092773, "global_step": 538033, "epoch": 6482} {"train_loss": -27.622812271118164, "global_step": 538034, "epoch": 6482} {"train_loss": -27.195531845092773, "global_step": 538035, "epoch": 6482} {"train_loss": -27.39118003845215, "global_step": 538036, "epoch": 6482} {"train_loss": -27.584508895874023, "global_step": 538037, "epoch": 6482} {"train_loss": -27.310760498046875, "global_step": 538038, "epoch": 6482} {"train_loss": -27.5002498626709, "global_step": 538039, "epoch": 6482} {"train_loss": -27.86216163635254, "global_step": 538040, "epoch": 6482} {"train_loss": -27.520498275756836, "global_step": 538041, "epoch": 6482} {"train_loss": -27.291234970092773, "global_step": 538042, "epoch": 6482} {"train_loss": -27.4224910736084, "global_step": 538043, "epoch": 6482} {"train_loss": -27.422353744506836, "global_step": 538044, "epoch": 6482} {"train_loss": -27.7714786529541, "global_step": 538045, "epoch": 6482} {"train_loss": -27.54718017578125, "global_step": 538046, "epoch": 6482} {"train_loss": -27.79034423828125, "global_step": 538047, "epoch": 6482} {"train_loss": -27.6605224609375, "global_step": 538048, "epoch": 6482} {"train_loss": -27.43060302734375, "global_step": 538049, "epoch": 6482} {"train_loss": -27.722339630126953, "global_step": 538050, "epoch": 6482} {"train_loss": -27.75103187561035, "global_step": 538051, "epoch": 6482} {"train_loss": -27.76654052734375, "global_step": 538052, "epoch": 6482} {"train_loss": -27.851194381713867, "global_step": 538053, "epoch": 6482} {"train_loss": -27.651687622070312, "global_step": 538054, "epoch": 6482} {"train_loss": -27.857425689697266, "global_step": 538055, "epoch": 6482} {"train_loss": -27.836389541625977, "global_step": 538056, "epoch": 6482} {"train_loss": -27.71856689453125, "global_step": 538057, "epoch": 6482} {"train_loss": -27.73238182067871, "global_step": 538058, "epoch": 6482} {"train_loss": -27.926095962524414, "global_step": 538059, "epoch": 6482} {"train_loss": -27.71973991394043, "global_step": 538060, "epoch": 6482} {"train_loss": -27.949844360351562, "global_step": 538061, "epoch": 6482} {"train_loss": -27.9678955078125, "global_step": 538062, "epoch": 6482} {"train_loss": -27.730010986328125, "global_step": 538063, "epoch": 6482} {"train_loss": -27.633955001831055, "global_step": 538064, "epoch": 6482} {"train_loss": -28.21748161315918, "global_step": 538065, "epoch": 6482} {"train_loss": -27.553857803344727, "global_step": 538066, "epoch": 6482} {"train_loss": -27.91543960571289, "global_step": 538067, "epoch": 6482} {"train_loss": -27.86090087890625, "global_step": 538068, "epoch": 6482} {"train_loss": -28.255096435546875, "global_step": 538069, "epoch": 6482} {"train_loss": -27.859846115112305, "global_step": 538070, "epoch": 6482} {"train_loss": -27.829639434814453, "global_step": 538071, "epoch": 6482} {"train_loss": -27.79304313659668, "global_step": 538072, "epoch": 6482} {"train_loss": -28.045522689819336, "global_step": 538073, "epoch": 6482} {"train_loss": -27.6684627532959, "global_step": 538074, "epoch": 6482} {"train_loss": -27.869491577148438, "global_step": 538075, "epoch": 6482} {"train_loss": -27.608915328979492, "global_step": 538076, "epoch": 6482} {"train_loss": -27.7476806640625, "global_step": 538077, "epoch": 6482} {"train_loss": -27.756738662719727, "global_step": 538078, "epoch": 6482} {"train_loss": -27.7015380859375, "global_step": 538079, "epoch": 6482} {"train_loss": -27.278959274291992, "global_step": 538080, "epoch": 6482} {"train_loss": -28.0203914642334, "global_step": 538081, "epoch": 6482} {"train_loss": -28.397796630859375, "global_step": 538082, "epoch": 6482} {"train_loss": -27.57500648498535, "global_step": 538083, "epoch": 6482} {"train_loss": -27.496265411376953, "global_step": 538084, "epoch": 6482} {"train_loss": -27.632797241210938, "global_step": 538085, "epoch": 6482} {"train_loss": -27.677932739257812, "global_step": 538086, "epoch": 6482} {"train_loss": -27.71442222595215, "global_step": 538087, "epoch": 6482} {"train_loss": -27.432777634586195, "global_step": 538088, "epoch": 6482, "val_loss": 6489073.0} {"train_loss": -26.37112808227539, "global_step": 538089, "epoch": 6483} {"train_loss": -26.97382926940918, "global_step": 538090, "epoch": 6483} {"train_loss": -26.8608455657959, "global_step": 538091, "epoch": 6483} {"train_loss": -27.181869506835938, "global_step": 538092, "epoch": 6483} {"train_loss": -27.041671752929688, "global_step": 538093, "epoch": 6483} {"train_loss": -27.579273223876953, "global_step": 538094, "epoch": 6483} {"train_loss": -26.523345947265625, "global_step": 538095, "epoch": 6483} {"train_loss": -27.030344009399414, "global_step": 538096, "epoch": 6483} {"train_loss": -27.35219383239746, "global_step": 538097, "epoch": 6483} {"train_loss": -27.28714370727539, "global_step": 538098, "epoch": 6483} {"train_loss": -27.438074111938477, "global_step": 538099, "epoch": 6483} {"train_loss": -26.948989868164062, "global_step": 538100, "epoch": 6483} {"train_loss": -27.254093170166016, "global_step": 538101, "epoch": 6483} {"train_loss": -27.129602432250977, "global_step": 538102, "epoch": 6483} {"train_loss": -27.02796745300293, "global_step": 538103, "epoch": 6483} {"train_loss": -27.728168487548828, "global_step": 538104, "epoch": 6483} {"train_loss": -27.384504318237305, "global_step": 538105, "epoch": 6483} {"train_loss": -27.423358917236328, "global_step": 538106, "epoch": 6483} {"train_loss": -27.39544105529785, "global_step": 538107, "epoch": 6483} {"train_loss": -27.105772018432617, "global_step": 538108, "epoch": 6483} {"train_loss": -27.426427841186523, "global_step": 538109, "epoch": 6483} {"train_loss": -27.496179580688477, "global_step": 538110, "epoch": 6483} {"train_loss": -27.57352066040039, "global_step": 538111, "epoch": 6483} {"train_loss": -27.33734130859375, "global_step": 538112, "epoch": 6483} {"train_loss": -27.80255126953125, "global_step": 538113, "epoch": 6483} {"train_loss": -27.501123428344727, "global_step": 538114, "epoch": 6483} {"train_loss": -27.490203857421875, "global_step": 538115, "epoch": 6483} {"train_loss": -27.37233543395996, "global_step": 538116, "epoch": 6483} {"train_loss": -27.56415367126465, "global_step": 538117, "epoch": 6483} {"train_loss": -27.187753677368164, "global_step": 538118, "epoch": 6483} {"train_loss": -27.690465927124023, "global_step": 538119, "epoch": 6483} {"train_loss": -27.57000160217285, "global_step": 538120, "epoch": 6483} {"train_loss": -27.63043785095215, "global_step": 538121, "epoch": 6483} {"train_loss": -27.535064697265625, "global_step": 538122, "epoch": 6483} {"train_loss": -26.934247970581055, "global_step": 538123, "epoch": 6483} {"train_loss": -27.863073348999023, "global_step": 538124, "epoch": 6483} {"train_loss": -27.8682861328125, "global_step": 538125, "epoch": 6483} {"train_loss": -27.69585609436035, "global_step": 538126, "epoch": 6483} {"train_loss": -27.95595359802246, "global_step": 538127, "epoch": 6483} {"train_loss": -27.65687370300293, "global_step": 538128, "epoch": 6483} {"train_loss": -27.819610595703125, "global_step": 538129, "epoch": 6483} {"train_loss": -27.7536563873291, "global_step": 538130, "epoch": 6483} {"train_loss": -27.274694442749023, "global_step": 538131, "epoch": 6483} {"train_loss": -27.616668701171875, "global_step": 538132, "epoch": 6483} {"train_loss": -27.845703125, "global_step": 538133, "epoch": 6483} {"train_loss": -27.612768173217773, "global_step": 538134, "epoch": 6483} {"train_loss": -27.911191940307617, "global_step": 538135, "epoch": 6483} {"train_loss": -27.50592041015625, "global_step": 538136, "epoch": 6483} {"train_loss": -27.981292724609375, "global_step": 538137, "epoch": 6483} {"train_loss": -27.428424835205078, "global_step": 538138, "epoch": 6483} {"train_loss": -27.350217819213867, "global_step": 538139, "epoch": 6483} {"train_loss": -27.460615158081055, "global_step": 538140, "epoch": 6483} {"train_loss": -27.78656578063965, "global_step": 538141, "epoch": 6483} {"train_loss": -27.35320472717285, "global_step": 538142, "epoch": 6483} {"train_loss": -27.316974639892578, "global_step": 538143, "epoch": 6483} {"train_loss": -27.66108512878418, "global_step": 538144, "epoch": 6483} {"train_loss": -27.291791915893555, "global_step": 538145, "epoch": 6483} {"train_loss": -27.437149047851562, "global_step": 538146, "epoch": 6483} {"train_loss": -26.845539093017578, "global_step": 538147, "epoch": 6483} {"train_loss": -27.262277603149414, "global_step": 538148, "epoch": 6483} {"train_loss": -27.350553512573242, "global_step": 538149, "epoch": 6483} {"train_loss": -27.035491943359375, "global_step": 538150, "epoch": 6483} {"train_loss": -27.7114200592041, "global_step": 538151, "epoch": 6483} {"train_loss": -27.85671043395996, "global_step": 538152, "epoch": 6483} {"train_loss": -27.388721466064453, "global_step": 538153, "epoch": 6483} {"train_loss": -27.01834487915039, "global_step": 538154, "epoch": 6483} {"train_loss": -27.12750816345215, "global_step": 538155, "epoch": 6483} {"train_loss": -27.723846435546875, "global_step": 538156, "epoch": 6483} {"train_loss": -27.155420303344727, "global_step": 538157, "epoch": 6483} {"train_loss": -27.37959098815918, "global_step": 538158, "epoch": 6483} {"train_loss": -27.261579513549805, "global_step": 538159, "epoch": 6483} {"train_loss": -27.79304313659668, "global_step": 538160, "epoch": 6483} {"train_loss": -27.305374145507812, "global_step": 538161, "epoch": 6483} {"train_loss": -27.87813377380371, "global_step": 538162, "epoch": 6483} {"train_loss": -27.428579330444336, "global_step": 538163, "epoch": 6483} {"train_loss": -27.673816680908203, "global_step": 538164, "epoch": 6483} {"train_loss": -27.920440673828125, "global_step": 538165, "epoch": 6483} {"train_loss": -27.7066707611084, "global_step": 538166, "epoch": 6483} {"train_loss": -27.91965675354004, "global_step": 538167, "epoch": 6483} {"train_loss": -27.719013214111328, "global_step": 538168, "epoch": 6483} {"train_loss": -27.731098175048828, "global_step": 538169, "epoch": 6483} {"train_loss": -27.62200355529785, "global_step": 538170, "epoch": 6483} {"train_loss": -27.449316737163496, "global_step": 538171, "epoch": 6483, "val_loss": 6462662.0} {"train_loss": -27.005136489868164, "global_step": 538172, "epoch": 6484} {"train_loss": -27.30805015563965, "global_step": 538173, "epoch": 6484} {"train_loss": -27.017545700073242, "global_step": 538174, "epoch": 6484} {"train_loss": -27.483922958374023, "global_step": 538175, "epoch": 6484} {"train_loss": -27.21160888671875, "global_step": 538176, "epoch": 6484} {"train_loss": -27.810333251953125, "global_step": 538177, "epoch": 6484} {"train_loss": -27.510343551635742, "global_step": 538178, "epoch": 6484} {"train_loss": -27.602094650268555, "global_step": 538179, "epoch": 6484} {"train_loss": -27.379547119140625, "global_step": 538180, "epoch": 6484} {"train_loss": -27.445371627807617, "global_step": 538181, "epoch": 6484} {"train_loss": -27.271621704101562, "global_step": 538182, "epoch": 6484} {"train_loss": -27.55568504333496, "global_step": 538183, "epoch": 6484} {"train_loss": -27.26971435546875, "global_step": 538184, "epoch": 6484} {"train_loss": -27.675939559936523, "global_step": 538185, "epoch": 6484} {"train_loss": -27.26409912109375, "global_step": 538186, "epoch": 6484} {"train_loss": -27.16069984436035, "global_step": 538187, "epoch": 6484} {"train_loss": -27.067493438720703, "global_step": 538188, "epoch": 6484} {"train_loss": -27.20831871032715, "global_step": 538189, "epoch": 6484} {"train_loss": -27.4724178314209, "global_step": 538190, "epoch": 6484} {"train_loss": -27.684640884399414, "global_step": 538191, "epoch": 6484} {"train_loss": -27.254108428955078, "global_step": 538192, "epoch": 6484} {"train_loss": -27.539779663085938, "global_step": 538193, "epoch": 6484} {"train_loss": -27.315561294555664, "global_step": 538194, "epoch": 6484} {"train_loss": -27.919952392578125, "global_step": 538195, "epoch": 6484} {"train_loss": -27.422819137573242, "global_step": 538196, "epoch": 6484} {"train_loss": -26.973691940307617, "global_step": 538197, "epoch": 6484} {"train_loss": -27.024377822875977, "global_step": 538198, "epoch": 6484} {"train_loss": -27.112722396850586, "global_step": 538199, "epoch": 6484} {"train_loss": -26.86463737487793, "global_step": 538200, "epoch": 6484} {"train_loss": -26.999570846557617, "global_step": 538201, "epoch": 6484} {"train_loss": -27.54365348815918, "global_step": 538202, "epoch": 6484} {"train_loss": -27.604848861694336, "global_step": 538203, "epoch": 6484} {"train_loss": -27.644805908203125, "global_step": 538204, "epoch": 6484} {"train_loss": -27.56280517578125, "global_step": 538205, "epoch": 6484} {"train_loss": -27.294601440429688, "global_step": 538206, "epoch": 6484} {"train_loss": -27.47601890563965, "global_step": 538207, "epoch": 6484} {"train_loss": -27.625791549682617, "global_step": 538208, "epoch": 6484} {"train_loss": -27.288074493408203, "global_step": 538209, "epoch": 6484} {"train_loss": -27.63997459411621, "global_step": 538210, "epoch": 6484} {"train_loss": -27.244409561157227, "global_step": 538211, "epoch": 6484} {"train_loss": -27.741445541381836, "global_step": 538212, "epoch": 6484} {"train_loss": -27.578649520874023, "global_step": 538213, "epoch": 6484} {"train_loss": -27.62495231628418, "global_step": 538214, "epoch": 6484} {"train_loss": -28.07065200805664, "global_step": 538215, "epoch": 6484} {"train_loss": -27.74506950378418, "global_step": 538216, "epoch": 6484} {"train_loss": -27.6314640045166, "global_step": 538217, "epoch": 6484} {"train_loss": -27.613922119140625, "global_step": 538218, "epoch": 6484} {"train_loss": -27.627674102783203, "global_step": 538219, "epoch": 6484} {"train_loss": -27.701398849487305, "global_step": 538220, "epoch": 6484} {"train_loss": -27.579822540283203, "global_step": 538221, "epoch": 6484} {"train_loss": -27.727951049804688, "global_step": 538222, "epoch": 6484} {"train_loss": -27.7286319732666, "global_step": 538223, "epoch": 6484} {"train_loss": -27.8156795501709, "global_step": 538224, "epoch": 6484} {"train_loss": -27.778600692749023, "global_step": 538225, "epoch": 6484} {"train_loss": -27.77106285095215, "global_step": 538226, "epoch": 6484} {"train_loss": -27.6965274810791, "global_step": 538227, "epoch": 6484} {"train_loss": -27.99065589904785, "global_step": 538228, "epoch": 6484} {"train_loss": -27.6474552154541, "global_step": 538229, "epoch": 6484} {"train_loss": -27.744903564453125, "global_step": 538230, "epoch": 6484} {"train_loss": -27.795923233032227, "global_step": 538231, "epoch": 6484} {"train_loss": -28.0279598236084, "global_step": 538232, "epoch": 6484} {"train_loss": -27.635242462158203, "global_step": 538233, "epoch": 6484} {"train_loss": -27.571887969970703, "global_step": 538234, "epoch": 6484} {"train_loss": -27.958688735961914, "global_step": 538235, "epoch": 6484} {"train_loss": -27.371244430541992, "global_step": 538236, "epoch": 6484} {"train_loss": -27.634384155273438, "global_step": 538237, "epoch": 6484} {"train_loss": -27.773603439331055, "global_step": 538238, "epoch": 6484} {"train_loss": -28.100255966186523, "global_step": 538239, "epoch": 6484} {"train_loss": -27.757083892822266, "global_step": 538240, "epoch": 6484} {"train_loss": -27.613800048828125, "global_step": 538241, "epoch": 6484} {"train_loss": -27.937957763671875, "global_step": 538242, "epoch": 6484} {"train_loss": -27.272872924804688, "global_step": 538243, "epoch": 6484} {"train_loss": -27.962614059448242, "global_step": 538244, "epoch": 6484} {"train_loss": -27.700057983398438, "global_step": 538245, "epoch": 6484} {"train_loss": -27.913116455078125, "global_step": 538246, "epoch": 6484} {"train_loss": -27.856191635131836, "global_step": 538247, "epoch": 6484} {"train_loss": -27.975034713745117, "global_step": 538248, "epoch": 6484} {"train_loss": -27.870044708251953, "global_step": 538249, "epoch": 6484} {"train_loss": -27.914474487304688, "global_step": 538250, "epoch": 6484} {"train_loss": -27.886371612548828, "global_step": 538251, "epoch": 6484} {"train_loss": -28.141523361206055, "global_step": 538252, "epoch": 6484} {"train_loss": -27.365955352783203, "global_step": 538253, "epoch": 6484} {"train_loss": -27.564261631793286, "global_step": 538254, "epoch": 6484, "val_loss": 6502648.5} {"train_loss": -26.54412269592285, "global_step": 538255, "epoch": 6485} {"train_loss": -25.71124267578125, "global_step": 538256, "epoch": 6485} {"train_loss": -26.534955978393555, "global_step": 538257, "epoch": 6485} {"train_loss": -26.911407470703125, "global_step": 538258, "epoch": 6485} {"train_loss": -26.722326278686523, "global_step": 538259, "epoch": 6485} {"train_loss": -26.302160263061523, "global_step": 538260, "epoch": 6485} {"train_loss": -27.157102584838867, "global_step": 538261, "epoch": 6485} {"train_loss": -26.98089599609375, "global_step": 538262, "epoch": 6485} {"train_loss": -27.103322982788086, "global_step": 538263, "epoch": 6485} {"train_loss": -27.116058349609375, "global_step": 538264, "epoch": 6485} {"train_loss": -26.84527015686035, "global_step": 538265, "epoch": 6485} {"train_loss": -27.141565322875977, "global_step": 538266, "epoch": 6485} {"train_loss": -26.49189567565918, "global_step": 538267, "epoch": 6485} {"train_loss": -27.423110961914062, "global_step": 538268, "epoch": 6485} {"train_loss": -26.943201065063477, "global_step": 538269, "epoch": 6485} {"train_loss": -26.9169864654541, "global_step": 538270, "epoch": 6485} {"train_loss": -27.328784942626953, "global_step": 538271, "epoch": 6485} {"train_loss": -27.56390953063965, "global_step": 538272, "epoch": 6485} {"train_loss": -26.893522262573242, "global_step": 538273, "epoch": 6485} {"train_loss": -27.637908935546875, "global_step": 538274, "epoch": 6485} {"train_loss": -27.753070831298828, "global_step": 538275, "epoch": 6485} {"train_loss": -27.303930282592773, "global_step": 538276, "epoch": 6485} {"train_loss": -27.696027755737305, "global_step": 538277, "epoch": 6485} {"train_loss": -27.166614532470703, "global_step": 538278, "epoch": 6485} {"train_loss": -27.207395553588867, "global_step": 538279, "epoch": 6485} {"train_loss": -27.40130043029785, "global_step": 538280, "epoch": 6485} {"train_loss": -27.309661865234375, "global_step": 538281, "epoch": 6485} {"train_loss": -27.560346603393555, "global_step": 538282, "epoch": 6485} {"train_loss": -27.669193267822266, "global_step": 538283, "epoch": 6485} {"train_loss": -27.367862701416016, "global_step": 538284, "epoch": 6485} {"train_loss": -27.63568687438965, "global_step": 538285, "epoch": 6485} {"train_loss": -27.685943603515625, "global_step": 538286, "epoch": 6485} {"train_loss": -27.47586441040039, "global_step": 538287, "epoch": 6485} {"train_loss": -27.96591567993164, "global_step": 538288, "epoch": 6485} {"train_loss": -27.86048698425293, "global_step": 538289, "epoch": 6485} {"train_loss": -27.74835205078125, "global_step": 538290, "epoch": 6485} {"train_loss": -27.948989868164062, "global_step": 538291, "epoch": 6485} {"train_loss": -27.647907257080078, "global_step": 538292, "epoch": 6485} {"train_loss": -28.016677856445312, "global_step": 538293, "epoch": 6485} {"train_loss": -27.378192901611328, "global_step": 538294, "epoch": 6485} {"train_loss": -27.836679458618164, "global_step": 538295, "epoch": 6485} {"train_loss": -27.370227813720703, "global_step": 538296, "epoch": 6485} {"train_loss": -27.873748779296875, "global_step": 538297, "epoch": 6485} {"train_loss": -27.82459831237793, "global_step": 538298, "epoch": 6485} {"train_loss": -27.91852378845215, "global_step": 538299, "epoch": 6485} {"train_loss": -27.591917037963867, "global_step": 538300, "epoch": 6485} {"train_loss": -27.819808959960938, "global_step": 538301, "epoch": 6485} {"train_loss": -27.98752212524414, "global_step": 538302, "epoch": 6485} {"train_loss": -27.778644561767578, "global_step": 538303, "epoch": 6485} {"train_loss": -28.0712890625, "global_step": 538304, "epoch": 6485} {"train_loss": -27.51813316345215, "global_step": 538305, "epoch": 6485} {"train_loss": -27.650548934936523, "global_step": 538306, "epoch": 6485} {"train_loss": -27.659433364868164, "global_step": 538307, "epoch": 6485} {"train_loss": -27.569400787353516, "global_step": 538308, "epoch": 6485} {"train_loss": -27.557836532592773, "global_step": 538309, "epoch": 6485} {"train_loss": -27.615802764892578, "global_step": 538310, "epoch": 6485} {"train_loss": -27.949207305908203, "global_step": 538311, "epoch": 6485} {"train_loss": -27.459796905517578, "global_step": 538312, "epoch": 6485} {"train_loss": -27.932249069213867, "global_step": 538313, "epoch": 6485} {"train_loss": -27.72952651977539, "global_step": 538314, "epoch": 6485} {"train_loss": -27.74228286743164, "global_step": 538315, "epoch": 6485} {"train_loss": -27.932723999023438, "global_step": 538316, "epoch": 6485} {"train_loss": -27.412694931030273, "global_step": 538317, "epoch": 6485} {"train_loss": -27.64460563659668, "global_step": 538318, "epoch": 6485} {"train_loss": -27.68096923828125, "global_step": 538319, "epoch": 6485} {"train_loss": -27.591217041015625, "global_step": 538320, "epoch": 6485} {"train_loss": -27.64931297302246, "global_step": 538321, "epoch": 6485} {"train_loss": -27.6744327545166, "global_step": 538322, "epoch": 6485} {"train_loss": -28.048187255859375, "global_step": 538323, "epoch": 6485} {"train_loss": -27.775867462158203, "global_step": 538324, "epoch": 6485} {"train_loss": -27.56251335144043, "global_step": 538325, "epoch": 6485} {"train_loss": -27.853912353515625, "global_step": 538326, "epoch": 6485} {"train_loss": -27.911123275756836, "global_step": 538327, "epoch": 6485} {"train_loss": -27.58709716796875, "global_step": 538328, "epoch": 6485} {"train_loss": -27.424341201782227, "global_step": 538329, "epoch": 6485} {"train_loss": -27.728458404541016, "global_step": 538330, "epoch": 6485} {"train_loss": -27.754846572875977, "global_step": 538331, "epoch": 6485} {"train_loss": -27.696796417236328, "global_step": 538332, "epoch": 6485} {"train_loss": -27.693252563476562, "global_step": 538333, "epoch": 6485} {"train_loss": -27.717294692993164, "global_step": 538334, "epoch": 6485} {"train_loss": -27.64594078063965, "global_step": 538335, "epoch": 6485} {"train_loss": -27.159530639648438, "global_step": 538336, "epoch": 6485} {"train_loss": -27.46253680033856, "global_step": 538337, "epoch": 6485, "val_loss": 6464212.0} {"train_loss": -26.84409523010254, "global_step": 538338, "epoch": 6486} {"train_loss": -27.247058868408203, "global_step": 538339, "epoch": 6486} {"train_loss": -27.015670776367188, "global_step": 538340, "epoch": 6486} {"train_loss": -26.70099449157715, "global_step": 538341, "epoch": 6486} {"train_loss": -27.3326473236084, "global_step": 538342, "epoch": 6486} {"train_loss": -27.49005126953125, "global_step": 538343, "epoch": 6486} {"train_loss": -26.165674209594727, "global_step": 538344, "epoch": 6486} {"train_loss": -26.992048263549805, "global_step": 538345, "epoch": 6486} {"train_loss": -26.904539108276367, "global_step": 538346, "epoch": 6486} {"train_loss": -27.418277740478516, "global_step": 538347, "epoch": 6486} {"train_loss": -27.42975425720215, "global_step": 538348, "epoch": 6486} {"train_loss": -27.39119529724121, "global_step": 538349, "epoch": 6486} {"train_loss": -27.18562126159668, "global_step": 538350, "epoch": 6486} {"train_loss": -27.171539306640625, "global_step": 538351, "epoch": 6486} {"train_loss": -27.332889556884766, "global_step": 538352, "epoch": 6486} {"train_loss": -27.08827018737793, "global_step": 538353, "epoch": 6486} {"train_loss": -27.245502471923828, "global_step": 538354, "epoch": 6486} {"train_loss": -27.50404167175293, "global_step": 538355, "epoch": 6486} {"train_loss": -27.77947998046875, "global_step": 538356, "epoch": 6486} {"train_loss": -27.741910934448242, "global_step": 538357, "epoch": 6486} {"train_loss": -27.80084228515625, "global_step": 538358, "epoch": 6486} {"train_loss": -27.427942276000977, "global_step": 538359, "epoch": 6486} {"train_loss": -27.444921493530273, "global_step": 538360, "epoch": 6486} {"train_loss": -27.780426025390625, "global_step": 538361, "epoch": 6486} {"train_loss": -27.74830436706543, "global_step": 538362, "epoch": 6486} {"train_loss": -27.733495712280273, "global_step": 538363, "epoch": 6486} {"train_loss": -27.930246353149414, "global_step": 538364, "epoch": 6486} {"train_loss": -27.17585563659668, "global_step": 538365, "epoch": 6486} {"train_loss": -27.57672691345215, "global_step": 538366, "epoch": 6486} {"train_loss": -27.821069717407227, "global_step": 538367, "epoch": 6486} {"train_loss": -27.754186630249023, "global_step": 538368, "epoch": 6486} {"train_loss": -27.8455753326416, "global_step": 538369, "epoch": 6486} {"train_loss": -27.843481063842773, "global_step": 538370, "epoch": 6486} {"train_loss": -27.81154441833496, "global_step": 538371, "epoch": 6486} {"train_loss": -27.720380783081055, "global_step": 538372, "epoch": 6486} {"train_loss": -27.6846981048584, "global_step": 538373, "epoch": 6486} {"train_loss": -27.66770362854004, "global_step": 538374, "epoch": 6486} {"train_loss": -27.544422149658203, "global_step": 538375, "epoch": 6486} {"train_loss": -27.638397216796875, "global_step": 538376, "epoch": 6486} {"train_loss": -27.903284072875977, "global_step": 538377, "epoch": 6486} {"train_loss": -27.911346435546875, "global_step": 538378, "epoch": 6486} {"train_loss": -27.42987632751465, "global_step": 538379, "epoch": 6486} {"train_loss": -27.7487735748291, "global_step": 538380, "epoch": 6486} {"train_loss": -27.574682235717773, "global_step": 538381, "epoch": 6486} {"train_loss": -27.4486026763916, "global_step": 538382, "epoch": 6486} {"train_loss": -27.84284019470215, "global_step": 538383, "epoch": 6486} {"train_loss": -27.45193862915039, "global_step": 538384, "epoch": 6486} {"train_loss": -27.901260375976562, "global_step": 538385, "epoch": 6486} {"train_loss": -27.60841178894043, "global_step": 538386, "epoch": 6486} {"train_loss": -27.724477767944336, "global_step": 538387, "epoch": 6486} {"train_loss": -27.701812744140625, "global_step": 538388, "epoch": 6486} {"train_loss": -27.52734375, "global_step": 538389, "epoch": 6486} {"train_loss": -27.75251579284668, "global_step": 538390, "epoch": 6486} {"train_loss": -27.95130729675293, "global_step": 538391, "epoch": 6486} {"train_loss": -27.979658126831055, "global_step": 538392, "epoch": 6486} {"train_loss": -27.60761070251465, "global_step": 538393, "epoch": 6486} {"train_loss": -27.782257080078125, "global_step": 538394, "epoch": 6486} {"train_loss": -27.793691635131836, "global_step": 538395, "epoch": 6486} {"train_loss": -27.57586669921875, "global_step": 538396, "epoch": 6486} {"train_loss": -27.712635040283203, "global_step": 538397, "epoch": 6486} {"train_loss": -28.05930519104004, "global_step": 538398, "epoch": 6486} {"train_loss": -28.027647018432617, "global_step": 538399, "epoch": 6486} {"train_loss": -27.87957763671875, "global_step": 538400, "epoch": 6486} {"train_loss": -27.670185089111328, "global_step": 538401, "epoch": 6486} {"train_loss": -27.722089767456055, "global_step": 538402, "epoch": 6486} {"train_loss": -27.707000732421875, "global_step": 538403, "epoch": 6486} {"train_loss": -27.91242790222168, "global_step": 538404, "epoch": 6486} {"train_loss": -27.322891235351562, "global_step": 538405, "epoch": 6486} {"train_loss": -27.7144832611084, "global_step": 538406, "epoch": 6486} {"train_loss": -27.875959396362305, "global_step": 538407, "epoch": 6486} {"train_loss": -27.604541778564453, "global_step": 538408, "epoch": 6486} {"train_loss": -27.17462730407715, "global_step": 538409, "epoch": 6486} {"train_loss": -27.233137130737305, "global_step": 538410, "epoch": 6486} {"train_loss": -27.19952964782715, "global_step": 538411, "epoch": 6486} {"train_loss": -27.287601470947266, "global_step": 538412, "epoch": 6486} {"train_loss": -27.563220977783203, "global_step": 538413, "epoch": 6486} {"train_loss": -26.990386962890625, "global_step": 538414, "epoch": 6486} {"train_loss": -27.360706329345703, "global_step": 538415, "epoch": 6486} {"train_loss": -27.653589248657227, "global_step": 538416, "epoch": 6486} {"train_loss": -27.55156898498535, "global_step": 538417, "epoch": 6486} {"train_loss": -27.597919464111328, "global_step": 538418, "epoch": 6486} {"train_loss": -27.614477157592773, "global_step": 538419, "epoch": 6486} {"train_loss": -27.5500396590635, "global_step": 538420, "epoch": 6486, "val_loss": 6492323.0} {"train_loss": -26.921920776367188, "global_step": 538421, "epoch": 6487} {"train_loss": -27.48223304748535, "global_step": 538422, "epoch": 6487} {"train_loss": -27.41619873046875, "global_step": 538423, "epoch": 6487} {"train_loss": -27.22196388244629, "global_step": 538424, "epoch": 6487} {"train_loss": -27.210784912109375, "global_step": 538425, "epoch": 6487} {"train_loss": -27.531070709228516, "global_step": 538426, "epoch": 6487} {"train_loss": -27.0937442779541, "global_step": 538427, "epoch": 6487} {"train_loss": -27.012149810791016, "global_step": 538428, "epoch": 6487} {"train_loss": -26.944965362548828, "global_step": 538429, "epoch": 6487} {"train_loss": -27.235809326171875, "global_step": 538430, "epoch": 6487} {"train_loss": -27.53706169128418, "global_step": 538431, "epoch": 6487} {"train_loss": -27.034326553344727, "global_step": 538432, "epoch": 6487} {"train_loss": -27.720081329345703, "global_step": 538433, "epoch": 6487} {"train_loss": -26.938446044921875, "global_step": 538434, "epoch": 6487} {"train_loss": -27.675451278686523, "global_step": 538435, "epoch": 6487} {"train_loss": -27.30960464477539, "global_step": 538436, "epoch": 6487} {"train_loss": -27.113019943237305, "global_step": 538437, "epoch": 6487} {"train_loss": -27.70380210876465, "global_step": 538438, "epoch": 6487} {"train_loss": -27.383167266845703, "global_step": 538439, "epoch": 6487} {"train_loss": -27.431537628173828, "global_step": 538440, "epoch": 6487} {"train_loss": -27.199512481689453, "global_step": 538441, "epoch": 6487} {"train_loss": -27.626462936401367, "global_step": 538442, "epoch": 6487} {"train_loss": -27.793607711791992, "global_step": 538443, "epoch": 6487} {"train_loss": -27.355655670166016, "global_step": 538444, "epoch": 6487} {"train_loss": -27.722156524658203, "global_step": 538445, "epoch": 6487} {"train_loss": -27.63765525817871, "global_step": 538446, "epoch": 6487} {"train_loss": -27.319019317626953, "global_step": 538447, "epoch": 6487} {"train_loss": -27.656097412109375, "global_step": 538448, "epoch": 6487} {"train_loss": -27.617664337158203, "global_step": 538449, "epoch": 6487} {"train_loss": -27.610143661499023, "global_step": 538450, "epoch": 6487} {"train_loss": -27.640472412109375, "global_step": 538451, "epoch": 6487} {"train_loss": -27.627243041992188, "global_step": 538452, "epoch": 6487} {"train_loss": -27.985265731811523, "global_step": 538453, "epoch": 6487} {"train_loss": -27.4016056060791, "global_step": 538454, "epoch": 6487} {"train_loss": -27.457914352416992, "global_step": 538455, "epoch": 6487} {"train_loss": -27.717010498046875, "global_step": 538456, "epoch": 6487} {"train_loss": -27.698150634765625, "global_step": 538457, "epoch": 6487} {"train_loss": -27.605573654174805, "global_step": 538458, "epoch": 6487} {"train_loss": -27.54874038696289, "global_step": 538459, "epoch": 6487} {"train_loss": -27.71088981628418, "global_step": 538460, "epoch": 6487} {"train_loss": -27.42658042907715, "global_step": 538461, "epoch": 6487} {"train_loss": -27.680526733398438, "global_step": 538462, "epoch": 6487} {"train_loss": -27.848224639892578, "global_step": 538463, "epoch": 6487} {"train_loss": -27.975812911987305, "global_step": 538464, "epoch": 6487} {"train_loss": -27.22725486755371, "global_step": 538465, "epoch": 6487} {"train_loss": -27.4794979095459, "global_step": 538466, "epoch": 6487} {"train_loss": -27.884496688842773, "global_step": 538467, "epoch": 6487} {"train_loss": -27.6035213470459, "global_step": 538468, "epoch": 6487} {"train_loss": -27.79561424255371, "global_step": 538469, "epoch": 6487} {"train_loss": -27.824377059936523, "global_step": 538470, "epoch": 6487} {"train_loss": -27.940046310424805, "global_step": 538471, "epoch": 6487} {"train_loss": -27.511981964111328, "global_step": 538472, "epoch": 6487} {"train_loss": -27.827856063842773, "global_step": 538473, "epoch": 6487} {"train_loss": -27.94698143005371, "global_step": 538474, "epoch": 6487} {"train_loss": -27.601953506469727, "global_step": 538475, "epoch": 6487} {"train_loss": -27.90204429626465, "global_step": 538476, "epoch": 6487} {"train_loss": -27.43387222290039, "global_step": 538477, "epoch": 6487} {"train_loss": -27.63887596130371, "global_step": 538478, "epoch": 6487} {"train_loss": -27.40803337097168, "global_step": 538479, "epoch": 6487} {"train_loss": -27.566030502319336, "global_step": 538480, "epoch": 6487} {"train_loss": -27.444494247436523, "global_step": 538481, "epoch": 6487} {"train_loss": -27.41914176940918, "global_step": 538482, "epoch": 6487} {"train_loss": -27.62847900390625, "global_step": 538483, "epoch": 6487} {"train_loss": -27.991607666015625, "global_step": 538484, "epoch": 6487} {"train_loss": -27.899137496948242, "global_step": 538485, "epoch": 6487} {"train_loss": -27.258697509765625, "global_step": 538486, "epoch": 6487} {"train_loss": -27.7816162109375, "global_step": 538487, "epoch": 6487} {"train_loss": -27.59565544128418, "global_step": 538488, "epoch": 6487} {"train_loss": -27.986486434936523, "global_step": 538489, "epoch": 6487} {"train_loss": -27.465429306030273, "global_step": 538490, "epoch": 6487} {"train_loss": -27.49761390686035, "global_step": 538491, "epoch": 6487} {"train_loss": -27.98896598815918, "global_step": 538492, "epoch": 6487} {"train_loss": -27.786380767822266, "global_step": 538493, "epoch": 6487} {"train_loss": -27.4251766204834, "global_step": 538494, "epoch": 6487} {"train_loss": -27.7520694732666, "global_step": 538495, "epoch": 6487} {"train_loss": -27.397058486938477, "global_step": 538496, "epoch": 6487} {"train_loss": -27.504444122314453, "global_step": 538497, "epoch": 6487} {"train_loss": -27.349857330322266, "global_step": 538498, "epoch": 6487} {"train_loss": -27.528181076049805, "global_step": 538499, "epoch": 6487} {"train_loss": -27.7572078704834, "global_step": 538500, "epoch": 6487} {"train_loss": -27.167102813720703, "global_step": 538501, "epoch": 6487} {"train_loss": -27.344776153564453, "global_step": 538502, "epoch": 6487} {"train_loss": -27.558436589068677, "global_step": 538503, "epoch": 6487, "val_loss": 6447782.0} {"train_loss": -27.282934188842773, "global_step": 538504, "epoch": 6488} {"train_loss": -26.390625, "global_step": 538505, "epoch": 6488} {"train_loss": -26.916034698486328, "global_step": 538506, "epoch": 6488} {"train_loss": -26.566816329956055, "global_step": 538507, "epoch": 6488} {"train_loss": -27.114032745361328, "global_step": 538508, "epoch": 6488} {"train_loss": -26.893178939819336, "global_step": 538509, "epoch": 6488} {"train_loss": -26.57389259338379, "global_step": 538510, "epoch": 6488} {"train_loss": -27.074188232421875, "global_step": 538511, "epoch": 6488} {"train_loss": -26.74658203125, "global_step": 538512, "epoch": 6488} {"train_loss": -27.169599533081055, "global_step": 538513, "epoch": 6488} {"train_loss": -27.1262149810791, "global_step": 538514, "epoch": 6488} {"train_loss": -27.207386016845703, "global_step": 538515, "epoch": 6488} {"train_loss": -26.73583984375, "global_step": 538516, "epoch": 6488} {"train_loss": -27.392688751220703, "global_step": 538517, "epoch": 6488} {"train_loss": -26.92998695373535, "global_step": 538518, "epoch": 6488} {"train_loss": -26.84377098083496, "global_step": 538519, "epoch": 6488} {"train_loss": -27.365554809570312, "global_step": 538520, "epoch": 6488} {"train_loss": -27.47718620300293, "global_step": 538521, "epoch": 6488} {"train_loss": -27.750722885131836, "global_step": 538522, "epoch": 6488} {"train_loss": -27.278833389282227, "global_step": 538523, "epoch": 6488} {"train_loss": -27.063526153564453, "global_step": 538524, "epoch": 6488} {"train_loss": -27.618818283081055, "global_step": 538525, "epoch": 6488} {"train_loss": -27.69146156311035, "global_step": 538526, "epoch": 6488} {"train_loss": -27.20538902282715, "global_step": 538527, "epoch": 6488} {"train_loss": -27.68793296813965, "global_step": 538528, "epoch": 6488} {"train_loss": -27.469385147094727, "global_step": 538529, "epoch": 6488} {"train_loss": -27.48079490661621, "global_step": 538530, "epoch": 6488} {"train_loss": -27.873748779296875, "global_step": 538531, "epoch": 6488} {"train_loss": -27.40134620666504, "global_step": 538532, "epoch": 6488} {"train_loss": -27.518756866455078, "global_step": 538533, "epoch": 6488} {"train_loss": -27.598947525024414, "global_step": 538534, "epoch": 6488} {"train_loss": -27.42994499206543, "global_step": 538535, "epoch": 6488} {"train_loss": -27.383161544799805, "global_step": 538536, "epoch": 6488} {"train_loss": -27.746112823486328, "global_step": 538537, "epoch": 6488} {"train_loss": -27.83954429626465, "global_step": 538538, "epoch": 6488} {"train_loss": -28.113311767578125, "global_step": 538539, "epoch": 6488} {"train_loss": -27.64789390563965, "global_step": 538540, "epoch": 6488} {"train_loss": -28.021711349487305, "global_step": 538541, "epoch": 6488} {"train_loss": -27.93534278869629, "global_step": 538542, "epoch": 6488} {"train_loss": -27.926748275756836, "global_step": 538543, "epoch": 6488} {"train_loss": -27.585830688476562, "global_step": 538544, "epoch": 6488} {"train_loss": -28.061054229736328, "global_step": 538545, "epoch": 6488} {"train_loss": -28.077802658081055, "global_step": 538546, "epoch": 6488} {"train_loss": -28.160160064697266, "global_step": 538547, "epoch": 6488} {"train_loss": -27.880512237548828, "global_step": 538548, "epoch": 6488} {"train_loss": -27.716161727905273, "global_step": 538549, "epoch": 6488} {"train_loss": -27.84394645690918, "global_step": 538550, "epoch": 6488} {"train_loss": -28.073150634765625, "global_step": 538551, "epoch": 6488} {"train_loss": -27.573007583618164, "global_step": 538552, "epoch": 6488} {"train_loss": -27.625349044799805, "global_step": 538553, "epoch": 6488} {"train_loss": -28.081247329711914, "global_step": 538554, "epoch": 6488} {"train_loss": -27.709253311157227, "global_step": 538555, "epoch": 6488} {"train_loss": -27.660913467407227, "global_step": 538556, "epoch": 6488} {"train_loss": -27.577381134033203, "global_step": 538557, "epoch": 6488} {"train_loss": -26.87636375427246, "global_step": 538558, "epoch": 6488} {"train_loss": -27.005512237548828, "global_step": 538559, "epoch": 6488} {"train_loss": -26.54829216003418, "global_step": 538560, "epoch": 6488} {"train_loss": -26.14866065979004, "global_step": 538561, "epoch": 6488} {"train_loss": -27.39499855041504, "global_step": 538562, "epoch": 6488} {"train_loss": -27.202680587768555, "global_step": 538563, "epoch": 6488} {"train_loss": -27.04132080078125, "global_step": 538564, "epoch": 6488} {"train_loss": -27.56689453125, "global_step": 538565, "epoch": 6488} {"train_loss": -27.02716064453125, "global_step": 538566, "epoch": 6488} {"train_loss": -27.650787353515625, "global_step": 538567, "epoch": 6488} {"train_loss": -27.168060302734375, "global_step": 538568, "epoch": 6488} {"train_loss": -27.84754753112793, "global_step": 538569, "epoch": 6488} {"train_loss": -27.412214279174805, "global_step": 538570, "epoch": 6488} {"train_loss": -27.806354522705078, "global_step": 538571, "epoch": 6488} {"train_loss": -27.552398681640625, "global_step": 538572, "epoch": 6488} {"train_loss": -27.797082901000977, "global_step": 538573, "epoch": 6488} {"train_loss": -27.76262855529785, "global_step": 538574, "epoch": 6488} {"train_loss": -27.341922760009766, "global_step": 538575, "epoch": 6488} {"train_loss": -27.38568687438965, "global_step": 538576, "epoch": 6488} {"train_loss": -27.567127227783203, "global_step": 538577, "epoch": 6488} {"train_loss": -27.559478759765625, "global_step": 538578, "epoch": 6488} {"train_loss": -27.68732261657715, "global_step": 538579, "epoch": 6488} {"train_loss": -27.52247428894043, "global_step": 538580, "epoch": 6488} {"train_loss": -27.27105140686035, "global_step": 538581, "epoch": 6488} {"train_loss": -27.519662857055664, "global_step": 538582, "epoch": 6488} {"train_loss": -27.707483291625977, "global_step": 538583, "epoch": 6488} {"train_loss": -27.820758819580078, "global_step": 538584, "epoch": 6488} {"train_loss": -27.461750030517578, "global_step": 538585, "epoch": 6488} {"train_loss": -27.4447715023914, "global_step": 538586, "epoch": 6488, "val_loss": 6492375.5} {"train_loss": -27.111799240112305, "global_step": 538587, "epoch": 6489} {"train_loss": -27.123388290405273, "global_step": 538588, "epoch": 6489} {"train_loss": -27.47403335571289, "global_step": 538589, "epoch": 6489} {"train_loss": -27.521839141845703, "global_step": 538590, "epoch": 6489} {"train_loss": -27.01051902770996, "global_step": 538591, "epoch": 6489} {"train_loss": -27.0189151763916, "global_step": 538592, "epoch": 6489} {"train_loss": -27.526784896850586, "global_step": 538593, "epoch": 6489} {"train_loss": -27.363916397094727, "global_step": 538594, "epoch": 6489} {"train_loss": -27.250930786132812, "global_step": 538595, "epoch": 6489} {"train_loss": -27.453277587890625, "global_step": 538596, "epoch": 6489} {"train_loss": -27.76983642578125, "global_step": 538597, "epoch": 6489} {"train_loss": -27.856657028198242, "global_step": 538598, "epoch": 6489} {"train_loss": -27.034570693969727, "global_step": 538599, "epoch": 6489} {"train_loss": -27.74054527282715, "global_step": 538600, "epoch": 6489} {"train_loss": -27.236663818359375, "global_step": 538601, "epoch": 6489} {"train_loss": -27.705657958984375, "global_step": 538602, "epoch": 6489} {"train_loss": -27.44679069519043, "global_step": 538603, "epoch": 6489} {"train_loss": -27.638784408569336, "global_step": 538604, "epoch": 6489} {"train_loss": -27.581939697265625, "global_step": 538605, "epoch": 6489} {"train_loss": -27.609027862548828, "global_step": 538606, "epoch": 6489} {"train_loss": -27.819604873657227, "global_step": 538607, "epoch": 6489} {"train_loss": -27.60822105407715, "global_step": 538608, "epoch": 6489} {"train_loss": -27.52448081970215, "global_step": 538609, "epoch": 6489} {"train_loss": -27.566619873046875, "global_step": 538610, "epoch": 6489} {"train_loss": -27.75284767150879, "global_step": 538611, "epoch": 6489} {"train_loss": -27.539569854736328, "global_step": 538612, "epoch": 6489} {"train_loss": -27.687009811401367, "global_step": 538613, "epoch": 6489} {"train_loss": -27.503782272338867, "global_step": 538614, "epoch": 6489} {"train_loss": -28.00516128540039, "global_step": 538615, "epoch": 6489} {"train_loss": -27.698749542236328, "global_step": 538616, "epoch": 6489} {"train_loss": -27.52593994140625, "global_step": 538617, "epoch": 6489} {"train_loss": -27.85987663269043, "global_step": 538618, "epoch": 6489} {"train_loss": -27.70489501953125, "global_step": 538619, "epoch": 6489} {"train_loss": -27.603403091430664, "global_step": 538620, "epoch": 6489} {"train_loss": -27.933332443237305, "global_step": 538621, "epoch": 6489} {"train_loss": -27.5926513671875, "global_step": 538622, "epoch": 6489} {"train_loss": -27.66362953186035, "global_step": 538623, "epoch": 6489} {"train_loss": -27.595861434936523, "global_step": 538624, "epoch": 6489} {"train_loss": -27.65875244140625, "global_step": 538625, "epoch": 6489} {"train_loss": -27.54488182067871, "global_step": 538626, "epoch": 6489} {"train_loss": -27.70196533203125, "global_step": 538627, "epoch": 6489} {"train_loss": -27.527082443237305, "global_step": 538628, "epoch": 6489} {"train_loss": -27.522235870361328, "global_step": 538629, "epoch": 6489} {"train_loss": -27.539533615112305, "global_step": 538630, "epoch": 6489} {"train_loss": -27.37721824645996, "global_step": 538631, "epoch": 6489} {"train_loss": -27.417266845703125, "global_step": 538632, "epoch": 6489} {"train_loss": -27.59868812561035, "global_step": 538633, "epoch": 6489} {"train_loss": -27.509763717651367, "global_step": 538634, "epoch": 6489} {"train_loss": -27.685901641845703, "global_step": 538635, "epoch": 6489} {"train_loss": -27.483463287353516, "global_step": 538636, "epoch": 6489} {"train_loss": -27.5949764251709, "global_step": 538637, "epoch": 6489} {"train_loss": -27.991071701049805, "global_step": 538638, "epoch": 6489} {"train_loss": -27.607221603393555, "global_step": 538639, "epoch": 6489} {"train_loss": -27.35833168029785, "global_step": 538640, "epoch": 6489} {"train_loss": -27.49061393737793, "global_step": 538641, "epoch": 6489} {"train_loss": -26.556074142456055, "global_step": 538642, "epoch": 6489} {"train_loss": -26.318653106689453, "global_step": 538643, "epoch": 6489} {"train_loss": -27.585708618164062, "global_step": 538644, "epoch": 6489} {"train_loss": -27.410846710205078, "global_step": 538645, "epoch": 6489} {"train_loss": -27.874317169189453, "global_step": 538646, "epoch": 6489} {"train_loss": -27.273956298828125, "global_step": 538647, "epoch": 6489} {"train_loss": -27.58136558532715, "global_step": 538648, "epoch": 6489} {"train_loss": -27.830474853515625, "global_step": 538649, "epoch": 6489} {"train_loss": -27.27880859375, "global_step": 538650, "epoch": 6489} {"train_loss": -27.703351974487305, "global_step": 538651, "epoch": 6489} {"train_loss": -27.3983211517334, "global_step": 538652, "epoch": 6489} {"train_loss": -27.607160568237305, "global_step": 538653, "epoch": 6489} {"train_loss": -27.820676803588867, "global_step": 538654, "epoch": 6489} {"train_loss": -27.724414825439453, "global_step": 538655, "epoch": 6489} {"train_loss": -27.703168869018555, "global_step": 538656, "epoch": 6489} {"train_loss": -27.91632080078125, "global_step": 538657, "epoch": 6489} {"train_loss": -27.729455947875977, "global_step": 538658, "epoch": 6489} {"train_loss": -27.59858512878418, "global_step": 538659, "epoch": 6489} {"train_loss": -27.713184356689453, "global_step": 538660, "epoch": 6489} {"train_loss": -27.57061195373535, "global_step": 538661, "epoch": 6489} {"train_loss": -27.67108154296875, "global_step": 538662, "epoch": 6489} {"train_loss": -27.711944580078125, "global_step": 538663, "epoch": 6489} {"train_loss": -27.537336349487305, "global_step": 538664, "epoch": 6489} {"train_loss": -27.847370147705078, "global_step": 538665, "epoch": 6489} {"train_loss": -27.663305282592773, "global_step": 538666, "epoch": 6489} {"train_loss": -27.45084571838379, "global_step": 538667, "epoch": 6489} {"train_loss": -27.40142822265625, "global_step": 538668, "epoch": 6489} {"train_loss": -27.53943461682423, "global_step": 538669, "epoch": 6489, "val_loss": 6461859.5} {"train_loss": -27.507043838500977, "global_step": 538670, "epoch": 6490} {"train_loss": -27.68804359436035, "global_step": 538671, "epoch": 6490} {"train_loss": -27.100309371948242, "global_step": 538672, "epoch": 6490} {"train_loss": -27.626977920532227, "global_step": 538673, "epoch": 6490} {"train_loss": -27.1098690032959, "global_step": 538674, "epoch": 6490} {"train_loss": -26.93446159362793, "global_step": 538675, "epoch": 6490} {"train_loss": -27.285083770751953, "global_step": 538676, "epoch": 6490} {"train_loss": -27.0693416595459, "global_step": 538677, "epoch": 6490} {"train_loss": -27.40836524963379, "global_step": 538678, "epoch": 6490} {"train_loss": -27.33579444885254, "global_step": 538679, "epoch": 6490} {"train_loss": -27.626834869384766, "global_step": 538680, "epoch": 6490} {"train_loss": -27.800992965698242, "global_step": 538681, "epoch": 6490} {"train_loss": -27.167205810546875, "global_step": 538682, "epoch": 6490} {"train_loss": -27.64859962463379, "global_step": 538683, "epoch": 6490} {"train_loss": -27.57460594177246, "global_step": 538684, "epoch": 6490} {"train_loss": -27.37380027770996, "global_step": 538685, "epoch": 6490} {"train_loss": -27.41141128540039, "global_step": 538686, "epoch": 6490} {"train_loss": -27.63628578186035, "global_step": 538687, "epoch": 6490} {"train_loss": -27.370075225830078, "global_step": 538688, "epoch": 6490} {"train_loss": -27.359861373901367, "global_step": 538689, "epoch": 6490} {"train_loss": -27.734411239624023, "global_step": 538690, "epoch": 6490} {"train_loss": -27.7387752532959, "global_step": 538691, "epoch": 6490} {"train_loss": -27.64619255065918, "global_step": 538692, "epoch": 6490} {"train_loss": -27.91583824157715, "global_step": 538693, "epoch": 6490} {"train_loss": -27.69775390625, "global_step": 538694, "epoch": 6490} {"train_loss": -27.7981014251709, "global_step": 538695, "epoch": 6490} {"train_loss": -27.704315185546875, "global_step": 538696, "epoch": 6490} {"train_loss": -27.29833984375, "global_step": 538697, "epoch": 6490} {"train_loss": -27.74359130859375, "global_step": 538698, "epoch": 6490} {"train_loss": -27.477985382080078, "global_step": 538699, "epoch": 6490} {"train_loss": -27.788227081298828, "global_step": 538700, "epoch": 6490} {"train_loss": -27.809452056884766, "global_step": 538701, "epoch": 6490} {"train_loss": -27.40321159362793, "global_step": 538702, "epoch": 6490} {"train_loss": -27.724515914916992, "global_step": 538703, "epoch": 6490} {"train_loss": -27.927637100219727, "global_step": 538704, "epoch": 6490} {"train_loss": -27.363662719726562, "global_step": 538705, "epoch": 6490} {"train_loss": -27.806421279907227, "global_step": 538706, "epoch": 6490} {"train_loss": -27.874494552612305, "global_step": 538707, "epoch": 6490} {"train_loss": -27.796079635620117, "global_step": 538708, "epoch": 6490} {"train_loss": -28.1882266998291, "global_step": 538709, "epoch": 6490} {"train_loss": -27.751605987548828, "global_step": 538710, "epoch": 6490} {"train_loss": -27.288801193237305, "global_step": 538711, "epoch": 6490} {"train_loss": -27.808765411376953, "global_step": 538712, "epoch": 6490} {"train_loss": -27.34014892578125, "global_step": 538713, "epoch": 6490} {"train_loss": -27.74471092224121, "global_step": 538714, "epoch": 6490} {"train_loss": -27.7094669342041, "global_step": 538715, "epoch": 6490} {"train_loss": -27.577856063842773, "global_step": 538716, "epoch": 6490} {"train_loss": -27.337438583374023, "global_step": 538717, "epoch": 6490} {"train_loss": -27.604297637939453, "global_step": 538718, "epoch": 6490} {"train_loss": -27.702362060546875, "global_step": 538719, "epoch": 6490} {"train_loss": -27.725116729736328, "global_step": 538720, "epoch": 6490} {"train_loss": -27.677717208862305, "global_step": 538721, "epoch": 6490} {"train_loss": -27.514142990112305, "global_step": 538722, "epoch": 6490} {"train_loss": -27.470701217651367, "global_step": 538723, "epoch": 6490} {"train_loss": -27.897659301757812, "global_step": 538724, "epoch": 6490} {"train_loss": -27.58514976501465, "global_step": 538725, "epoch": 6490} {"train_loss": -28.065616607666016, "global_step": 538726, "epoch": 6490} {"train_loss": -27.320068359375, "global_step": 538727, "epoch": 6490} {"train_loss": -27.857961654663086, "global_step": 538728, "epoch": 6490} {"train_loss": -27.60455322265625, "global_step": 538729, "epoch": 6490} {"train_loss": -27.468488693237305, "global_step": 538730, "epoch": 6490} {"train_loss": -27.261016845703125, "global_step": 538731, "epoch": 6490} {"train_loss": -27.165536880493164, "global_step": 538732, "epoch": 6490} {"train_loss": -26.372053146362305, "global_step": 538733, "epoch": 6490} {"train_loss": -26.327472686767578, "global_step": 538734, "epoch": 6490} {"train_loss": -26.632986068725586, "global_step": 538735, "epoch": 6490} {"train_loss": -26.781768798828125, "global_step": 538736, "epoch": 6490} {"train_loss": -26.710485458374023, "global_step": 538737, "epoch": 6490} {"train_loss": -27.065479278564453, "global_step": 538738, "epoch": 6490} {"train_loss": -27.40949058532715, "global_step": 538739, "epoch": 6490} {"train_loss": -26.992340087890625, "global_step": 538740, "epoch": 6490} {"train_loss": -27.31892204284668, "global_step": 538741, "epoch": 6490} {"train_loss": -27.429285049438477, "global_step": 538742, "epoch": 6490} {"train_loss": -27.396982192993164, "global_step": 538743, "epoch": 6490} {"train_loss": -27.490100860595703, "global_step": 538744, "epoch": 6490} {"train_loss": -27.750802993774414, "global_step": 538745, "epoch": 6490} {"train_loss": -27.37689208984375, "global_step": 538746, "epoch": 6490} {"train_loss": -27.37836265563965, "global_step": 538747, "epoch": 6490} {"train_loss": -27.729028701782227, "global_step": 538748, "epoch": 6490} {"train_loss": -27.696231842041016, "global_step": 538749, "epoch": 6490} {"train_loss": -27.673730850219727, "global_step": 538750, "epoch": 6490} {"train_loss": -27.563596725463867, "global_step": 538751, "epoch": 6490} {"train_loss": -27.48362534304699, "global_step": 538752, "epoch": 6490, "val_loss": 6439192.0} {"train_loss": -26.99338150024414, "global_step": 538753, "epoch": 6491} {"train_loss": -27.282672882080078, "global_step": 538754, "epoch": 6491} {"train_loss": -27.414264678955078, "global_step": 538755, "epoch": 6491} {"train_loss": -27.315784454345703, "global_step": 538756, "epoch": 6491} {"train_loss": -26.989810943603516, "global_step": 538757, "epoch": 6491} {"train_loss": -27.44013023376465, "global_step": 538758, "epoch": 6491} {"train_loss": -27.60841178894043, "global_step": 538759, "epoch": 6491} {"train_loss": -27.498035430908203, "global_step": 538760, "epoch": 6491} {"train_loss": -27.140869140625, "global_step": 538761, "epoch": 6491} {"train_loss": -27.480154037475586, "global_step": 538762, "epoch": 6491} {"train_loss": -27.607166290283203, "global_step": 538763, "epoch": 6491} {"train_loss": -27.7447509765625, "global_step": 538764, "epoch": 6491} {"train_loss": -27.380340576171875, "global_step": 538765, "epoch": 6491} {"train_loss": -27.5469970703125, "global_step": 538766, "epoch": 6491} {"train_loss": -27.434894561767578, "global_step": 538767, "epoch": 6491} {"train_loss": -27.724536895751953, "global_step": 538768, "epoch": 6491} {"train_loss": -27.43890953063965, "global_step": 538769, "epoch": 6491} {"train_loss": -27.63702964782715, "global_step": 538770, "epoch": 6491} {"train_loss": -27.84815788269043, "global_step": 538771, "epoch": 6491} {"train_loss": -27.785520553588867, "global_step": 538772, "epoch": 6491} {"train_loss": -28.1385555267334, "global_step": 538773, "epoch": 6491} {"train_loss": -27.487375259399414, "global_step": 538774, "epoch": 6491} {"train_loss": -27.74755859375, "global_step": 538775, "epoch": 6491} {"train_loss": -27.733808517456055, "global_step": 538776, "epoch": 6491} {"train_loss": -27.83700942993164, "global_step": 538777, "epoch": 6491} {"train_loss": -27.494312286376953, "global_step": 538778, "epoch": 6491} {"train_loss": -27.8470401763916, "global_step": 538779, "epoch": 6491} {"train_loss": -27.92896842956543, "global_step": 538780, "epoch": 6491} {"train_loss": -27.7126407623291, "global_step": 538781, "epoch": 6491} {"train_loss": -27.935016632080078, "global_step": 538782, "epoch": 6491} {"train_loss": -27.541723251342773, "global_step": 538783, "epoch": 6491} {"train_loss": -28.07325553894043, "global_step": 538784, "epoch": 6491} {"train_loss": -27.8746337890625, "global_step": 538785, "epoch": 6491} {"train_loss": -28.15048599243164, "global_step": 538786, "epoch": 6491} {"train_loss": -28.124570846557617, "global_step": 538787, "epoch": 6491} {"train_loss": -27.81292724609375, "global_step": 538788, "epoch": 6491} {"train_loss": -28.071762084960938, "global_step": 538789, "epoch": 6491} {"train_loss": -27.55130958557129, "global_step": 538790, "epoch": 6491} {"train_loss": -28.134719848632812, "global_step": 538791, "epoch": 6491} {"train_loss": -27.792760848999023, "global_step": 538792, "epoch": 6491} {"train_loss": -28.03647804260254, "global_step": 538793, "epoch": 6491} {"train_loss": -28.00018310546875, "global_step": 538794, "epoch": 6491} {"train_loss": -27.773534774780273, "global_step": 538795, "epoch": 6491} {"train_loss": -27.51875114440918, "global_step": 538796, "epoch": 6491} {"train_loss": -27.41412353515625, "global_step": 538797, "epoch": 6491} {"train_loss": -27.47287940979004, "global_step": 538798, "epoch": 6491} {"train_loss": -27.467985153198242, "global_step": 538799, "epoch": 6491} {"train_loss": -27.429738998413086, "global_step": 538800, "epoch": 6491} {"train_loss": -27.596094131469727, "global_step": 538801, "epoch": 6491} {"train_loss": -27.97674560546875, "global_step": 538802, "epoch": 6491} {"train_loss": -28.019821166992188, "global_step": 538803, "epoch": 6491} {"train_loss": -27.976444244384766, "global_step": 538804, "epoch": 6491} {"train_loss": -27.643583297729492, "global_step": 538805, "epoch": 6491} {"train_loss": -27.892669677734375, "global_step": 538806, "epoch": 6491} {"train_loss": -27.760974884033203, "global_step": 538807, "epoch": 6491} {"train_loss": -27.47840690612793, "global_step": 538808, "epoch": 6491} {"train_loss": -27.771421432495117, "global_step": 538809, "epoch": 6491} {"train_loss": -27.6760196685791, "global_step": 538810, "epoch": 6491} {"train_loss": -27.80950355529785, "global_step": 538811, "epoch": 6491} {"train_loss": -27.43202018737793, "global_step": 538812, "epoch": 6491} {"train_loss": -27.658573150634766, "global_step": 538813, "epoch": 6491} {"train_loss": -28.133695602416992, "global_step": 538814, "epoch": 6491} {"train_loss": -27.95269775390625, "global_step": 538815, "epoch": 6491} {"train_loss": -27.41938591003418, "global_step": 538816, "epoch": 6491} {"train_loss": -27.5849666595459, "global_step": 538817, "epoch": 6491} {"train_loss": -28.247037887573242, "global_step": 538818, "epoch": 6491} {"train_loss": -27.5460205078125, "global_step": 538819, "epoch": 6491} {"train_loss": -27.25604820251465, "global_step": 538820, "epoch": 6491} {"train_loss": -27.05171012878418, "global_step": 538821, "epoch": 6491} {"train_loss": -27.11957359313965, "global_step": 538822, "epoch": 6491} {"train_loss": -27.499128341674805, "global_step": 538823, "epoch": 6491} {"train_loss": -26.95057487487793, "global_step": 538824, "epoch": 6491} {"train_loss": -27.6304931640625, "global_step": 538825, "epoch": 6491} {"train_loss": -27.735883712768555, "global_step": 538826, "epoch": 6491} {"train_loss": -27.536081314086914, "global_step": 538827, "epoch": 6491} {"train_loss": -27.70135498046875, "global_step": 538828, "epoch": 6491} {"train_loss": -26.805145263671875, "global_step": 538829, "epoch": 6491} {"train_loss": -26.941425323486328, "global_step": 538830, "epoch": 6491} {"train_loss": -27.4987735748291, "global_step": 538831, "epoch": 6491} {"train_loss": -27.171466827392578, "global_step": 538832, "epoch": 6491} {"train_loss": -26.85724449157715, "global_step": 538833, "epoch": 6491} {"train_loss": -27.1291561126709, "global_step": 538834, "epoch": 6491} {"train_loss": -27.620054750557404, "global_step": 538835, "epoch": 6491, "val_loss": 6544394.0} {"train_loss": -27.1002254486084, "global_step": 538836, "epoch": 6492} {"train_loss": -26.45218849182129, "global_step": 538837, "epoch": 6492} {"train_loss": -27.10675621032715, "global_step": 538838, "epoch": 6492} {"train_loss": -26.738330841064453, "global_step": 538839, "epoch": 6492} {"train_loss": -26.442916870117188, "global_step": 538840, "epoch": 6492} {"train_loss": -26.98073387145996, "global_step": 538841, "epoch": 6492} {"train_loss": -27.006988525390625, "global_step": 538842, "epoch": 6492} {"train_loss": -27.431859970092773, "global_step": 538843, "epoch": 6492} {"train_loss": -27.567453384399414, "global_step": 538844, "epoch": 6492} {"train_loss": -27.0206241607666, "global_step": 538845, "epoch": 6492} {"train_loss": -26.898298263549805, "global_step": 538846, "epoch": 6492} {"train_loss": -26.9622859954834, "global_step": 538847, "epoch": 6492} {"train_loss": -27.099241256713867, "global_step": 538848, "epoch": 6492} {"train_loss": -27.43678092956543, "global_step": 538849, "epoch": 6492} {"train_loss": -27.48480224609375, "global_step": 538850, "epoch": 6492} {"train_loss": -27.463048934936523, "global_step": 538851, "epoch": 6492} {"train_loss": -27.336210250854492, "global_step": 538852, "epoch": 6492} {"train_loss": -27.388471603393555, "global_step": 538853, "epoch": 6492} {"train_loss": -27.48486328125, "global_step": 538854, "epoch": 6492} {"train_loss": -27.462787628173828, "global_step": 538855, "epoch": 6492} {"train_loss": -27.06764793395996, "global_step": 538856, "epoch": 6492} {"train_loss": -27.499536514282227, "global_step": 538857, "epoch": 6492} {"train_loss": -27.958539962768555, "global_step": 538858, "epoch": 6492} {"train_loss": -27.477191925048828, "global_step": 538859, "epoch": 6492} {"train_loss": -27.5462589263916, "global_step": 538860, "epoch": 6492} {"train_loss": -27.758304595947266, "global_step": 538861, "epoch": 6492} {"train_loss": -28.016752243041992, "global_step": 538862, "epoch": 6492} {"train_loss": -27.86713218688965, "global_step": 538863, "epoch": 6492} {"train_loss": -27.456884384155273, "global_step": 538864, "epoch": 6492} {"train_loss": -27.397174835205078, "global_step": 538865, "epoch": 6492} {"train_loss": -27.510562896728516, "global_step": 538866, "epoch": 6492} {"train_loss": -27.70290184020996, "global_step": 538867, "epoch": 6492} {"train_loss": -27.350046157836914, "global_step": 538868, "epoch": 6492} {"train_loss": -27.773374557495117, "global_step": 538869, "epoch": 6492} {"train_loss": -27.878087997436523, "global_step": 538870, "epoch": 6492} {"train_loss": -27.873620986938477, "global_step": 538871, "epoch": 6492} {"train_loss": -28.17399024963379, "global_step": 538872, "epoch": 6492} {"train_loss": -28.39190101623535, "global_step": 538873, "epoch": 6492} {"train_loss": -27.65412712097168, "global_step": 538874, "epoch": 6492} {"train_loss": -28.064910888671875, "global_step": 538875, "epoch": 6492} {"train_loss": -28.148883819580078, "global_step": 538876, "epoch": 6492} {"train_loss": -28.000274658203125, "global_step": 538877, "epoch": 6492} {"train_loss": -27.869482040405273, "global_step": 538878, "epoch": 6492} {"train_loss": -27.698200225830078, "global_step": 538879, "epoch": 6492} {"train_loss": -28.01481056213379, "global_step": 538880, "epoch": 6492} {"train_loss": -27.601720809936523, "global_step": 538881, "epoch": 6492} {"train_loss": -27.599777221679688, "global_step": 538882, "epoch": 6492} {"train_loss": -27.328693389892578, "global_step": 538883, "epoch": 6492} {"train_loss": -27.536636352539062, "global_step": 538884, "epoch": 6492} {"train_loss": -27.387298583984375, "global_step": 538885, "epoch": 6492} {"train_loss": -27.923730850219727, "global_step": 538886, "epoch": 6492} {"train_loss": -27.575366973876953, "global_step": 538887, "epoch": 6492} {"train_loss": -27.93868064880371, "global_step": 538888, "epoch": 6492} {"train_loss": -28.03712272644043, "global_step": 538889, "epoch": 6492} {"train_loss": -27.615076065063477, "global_step": 538890, "epoch": 6492} {"train_loss": -27.931488037109375, "global_step": 538891, "epoch": 6492} {"train_loss": -27.502628326416016, "global_step": 538892, "epoch": 6492} {"train_loss": -26.948104858398438, "global_step": 538893, "epoch": 6492} {"train_loss": -27.439895629882812, "global_step": 538894, "epoch": 6492} {"train_loss": -28.112226486206055, "global_step": 538895, "epoch": 6492} {"train_loss": -27.676992416381836, "global_step": 538896, "epoch": 6492} {"train_loss": -27.28521728515625, "global_step": 538897, "epoch": 6492} {"train_loss": -27.78631019592285, "global_step": 538898, "epoch": 6492} {"train_loss": -27.95978355407715, "global_step": 538899, "epoch": 6492} {"train_loss": -27.9471492767334, "global_step": 538900, "epoch": 6492} {"train_loss": -27.643728256225586, "global_step": 538901, "epoch": 6492} {"train_loss": -27.4197998046875, "global_step": 538902, "epoch": 6492} {"train_loss": -27.592660903930664, "global_step": 538903, "epoch": 6492} {"train_loss": -27.8995418548584, "global_step": 538904, "epoch": 6492} {"train_loss": -27.563749313354492, "global_step": 538905, "epoch": 6492} {"train_loss": -27.50714111328125, "global_step": 538906, "epoch": 6492} {"train_loss": -27.411596298217773, "global_step": 538907, "epoch": 6492} {"train_loss": -27.321929931640625, "global_step": 538908, "epoch": 6492} {"train_loss": -27.787139892578125, "global_step": 538909, "epoch": 6492} {"train_loss": -28.05427360534668, "global_step": 538910, "epoch": 6492} {"train_loss": -27.619016647338867, "global_step": 538911, "epoch": 6492} {"train_loss": -27.895421981811523, "global_step": 538912, "epoch": 6492} {"train_loss": -27.747976303100586, "global_step": 538913, "epoch": 6492} {"train_loss": -27.560277938842773, "global_step": 538914, "epoch": 6492} {"train_loss": -27.897964477539062, "global_step": 538915, "epoch": 6492} {"train_loss": -27.749860763549805, "global_step": 538916, "epoch": 6492} {"train_loss": -27.894880294799805, "global_step": 538917, "epoch": 6492} {"train_loss": -27.547389340687946, "global_step": 538918, "epoch": 6492, "val_loss": 6463034.0} {"train_loss": -27.436359405517578, "global_step": 538919, "epoch": 6493} {"train_loss": -27.328296661376953, "global_step": 538920, "epoch": 6493} {"train_loss": -26.82549476623535, "global_step": 538921, "epoch": 6493} {"train_loss": -27.28541374206543, "global_step": 538922, "epoch": 6493} {"train_loss": -27.6011905670166, "global_step": 538923, "epoch": 6493} {"train_loss": -27.0422420501709, "global_step": 538924, "epoch": 6493} {"train_loss": -27.358259201049805, "global_step": 538925, "epoch": 6493} {"train_loss": -27.077131271362305, "global_step": 538926, "epoch": 6493} {"train_loss": -26.957624435424805, "global_step": 538927, "epoch": 6493} {"train_loss": -28.033065795898438, "global_step": 538928, "epoch": 6493} {"train_loss": -27.638671875, "global_step": 538929, "epoch": 6493} {"train_loss": -27.537677764892578, "global_step": 538930, "epoch": 6493} {"train_loss": -27.253942489624023, "global_step": 538931, "epoch": 6493} {"train_loss": -27.544431686401367, "global_step": 538932, "epoch": 6493} {"train_loss": -27.37945556640625, "global_step": 538933, "epoch": 6493} {"train_loss": -27.510623931884766, "global_step": 538934, "epoch": 6493} {"train_loss": -27.518659591674805, "global_step": 538935, "epoch": 6493} {"train_loss": -27.459115982055664, "global_step": 538936, "epoch": 6493} {"train_loss": -27.60831069946289, "global_step": 538937, "epoch": 6493} {"train_loss": -27.837696075439453, "global_step": 538938, "epoch": 6493} {"train_loss": -27.64377212524414, "global_step": 538939, "epoch": 6493} {"train_loss": -27.658063888549805, "global_step": 538940, "epoch": 6493} {"train_loss": -27.614667892456055, "global_step": 538941, "epoch": 6493} {"train_loss": -27.517526626586914, "global_step": 538942, "epoch": 6493} {"train_loss": -27.456201553344727, "global_step": 538943, "epoch": 6493} {"train_loss": -28.10654640197754, "global_step": 538944, "epoch": 6493} {"train_loss": -27.729705810546875, "global_step": 538945, "epoch": 6493} {"train_loss": -27.660675048828125, "global_step": 538946, "epoch": 6493} {"train_loss": -27.376102447509766, "global_step": 538947, "epoch": 6493} {"train_loss": -27.45576286315918, "global_step": 538948, "epoch": 6493} {"train_loss": -27.675556182861328, "global_step": 538949, "epoch": 6493} {"train_loss": -28.0141544342041, "global_step": 538950, "epoch": 6493} {"train_loss": -27.721220016479492, "global_step": 538951, "epoch": 6493} {"train_loss": -27.82917594909668, "global_step": 538952, "epoch": 6493} {"train_loss": -27.58552360534668, "global_step": 538953, "epoch": 6493} {"train_loss": -27.949087142944336, "global_step": 538954, "epoch": 6493} {"train_loss": -27.773040771484375, "global_step": 538955, "epoch": 6493} {"train_loss": -27.662160873413086, "global_step": 538956, "epoch": 6493} {"train_loss": -28.2388858795166, "global_step": 538957, "epoch": 6493} {"train_loss": -27.53952980041504, "global_step": 538958, "epoch": 6493} {"train_loss": -27.9289608001709, "global_step": 538959, "epoch": 6493} {"train_loss": -27.841827392578125, "global_step": 538960, "epoch": 6493} {"train_loss": -27.391874313354492, "global_step": 538961, "epoch": 6493} {"train_loss": -27.7764949798584, "global_step": 538962, "epoch": 6493} {"train_loss": -27.532489776611328, "global_step": 538963, "epoch": 6493} {"train_loss": -27.54799461364746, "global_step": 538964, "epoch": 6493} {"train_loss": -27.369617462158203, "global_step": 538965, "epoch": 6493} {"train_loss": -27.0069522857666, "global_step": 538966, "epoch": 6493} {"train_loss": -26.768268585205078, "global_step": 538967, "epoch": 6493} {"train_loss": -26.9341983795166, "global_step": 538968, "epoch": 6493} {"train_loss": -27.3820743560791, "global_step": 538969, "epoch": 6493} {"train_loss": -27.1508731842041, "global_step": 538970, "epoch": 6493} {"train_loss": -27.694883346557617, "global_step": 538971, "epoch": 6493} {"train_loss": -27.30254554748535, "global_step": 538972, "epoch": 6493} {"train_loss": -27.029190063476562, "global_step": 538973, "epoch": 6493} {"train_loss": -27.119916915893555, "global_step": 538974, "epoch": 6493} {"train_loss": -27.2840518951416, "global_step": 538975, "epoch": 6493} {"train_loss": -27.380273818969727, "global_step": 538976, "epoch": 6493} {"train_loss": -27.517852783203125, "global_step": 538977, "epoch": 6493} {"train_loss": -27.875104904174805, "global_step": 538978, "epoch": 6493} {"train_loss": -27.711963653564453, "global_step": 538979, "epoch": 6493} {"train_loss": -27.5893497467041, "global_step": 538980, "epoch": 6493} {"train_loss": -27.524511337280273, "global_step": 538981, "epoch": 6493} {"train_loss": -27.511646270751953, "global_step": 538982, "epoch": 6493} {"train_loss": -27.706928253173828, "global_step": 538983, "epoch": 6493} {"train_loss": -27.57366371154785, "global_step": 538984, "epoch": 6493} {"train_loss": -27.878448486328125, "global_step": 538985, "epoch": 6493} {"train_loss": -27.965551376342773, "global_step": 538986, "epoch": 6493} {"train_loss": -27.950422286987305, "global_step": 538987, "epoch": 6493} {"train_loss": -27.995832443237305, "global_step": 538988, "epoch": 6493} {"train_loss": -27.781187057495117, "global_step": 538989, "epoch": 6493} {"train_loss": -27.650442123413086, "global_step": 538990, "epoch": 6493} {"train_loss": -27.9295597076416, "global_step": 538991, "epoch": 6493} {"train_loss": -27.61749839782715, "global_step": 538992, "epoch": 6493} {"train_loss": -27.837095260620117, "global_step": 538993, "epoch": 6493} {"train_loss": -27.974023818969727, "global_step": 538994, "epoch": 6493} {"train_loss": -27.700204849243164, "global_step": 538995, "epoch": 6493} {"train_loss": -27.53389549255371, "global_step": 538996, "epoch": 6493} {"train_loss": -27.743322372436523, "global_step": 538997, "epoch": 6493} {"train_loss": -27.462926864624023, "global_step": 538998, "epoch": 6493} {"train_loss": -28.1241455078125, "global_step": 538999, "epoch": 6493} {"train_loss": -27.520099639892578, "global_step": 539000, "epoch": 6493} {"train_loss": -27.58382094050028, "global_step": 539001, "epoch": 6493, "val_loss": 6471329.0} {"train_loss": -27.1231632232666, "global_step": 539002, "epoch": 6494} {"train_loss": -27.193805694580078, "global_step": 539003, "epoch": 6494} {"train_loss": -27.90070915222168, "global_step": 539004, "epoch": 6494} {"train_loss": -27.501585006713867, "global_step": 539005, "epoch": 6494} {"train_loss": -27.446517944335938, "global_step": 539006, "epoch": 6494} {"train_loss": -27.551610946655273, "global_step": 539007, "epoch": 6494} {"train_loss": -27.585187911987305, "global_step": 539008, "epoch": 6494} {"train_loss": -27.25067138671875, "global_step": 539009, "epoch": 6494} {"train_loss": -27.586462020874023, "global_step": 539010, "epoch": 6494} {"train_loss": -27.591238021850586, "global_step": 539011, "epoch": 6494} {"train_loss": -27.941553115844727, "global_step": 539012, "epoch": 6494} {"train_loss": -27.216644287109375, "global_step": 539013, "epoch": 6494} {"train_loss": -27.5875301361084, "global_step": 539014, "epoch": 6494} {"train_loss": -27.365732192993164, "global_step": 539015, "epoch": 6494} {"train_loss": -27.38486099243164, "global_step": 539016, "epoch": 6494} {"train_loss": -27.274930953979492, "global_step": 539017, "epoch": 6494} {"train_loss": -27.759531021118164, "global_step": 539018, "epoch": 6494} {"train_loss": -27.9431095123291, "global_step": 539019, "epoch": 6494} {"train_loss": -27.311620712280273, "global_step": 539020, "epoch": 6494} {"train_loss": -27.566699981689453, "global_step": 539021, "epoch": 6494} {"train_loss": -27.584104537963867, "global_step": 539022, "epoch": 6494} {"train_loss": -27.670608520507812, "global_step": 539023, "epoch": 6494} {"train_loss": -27.317052841186523, "global_step": 539024, "epoch": 6494} {"train_loss": -27.943939208984375, "global_step": 539025, "epoch": 6494} {"train_loss": -27.829334259033203, "global_step": 539026, "epoch": 6494} {"train_loss": -27.840900421142578, "global_step": 539027, "epoch": 6494} {"train_loss": -27.691259384155273, "global_step": 539028, "epoch": 6494} {"train_loss": -27.77369499206543, "global_step": 539029, "epoch": 6494} {"train_loss": -27.770282745361328, "global_step": 539030, "epoch": 6494} {"train_loss": -27.924285888671875, "global_step": 539031, "epoch": 6494} {"train_loss": -27.826404571533203, "global_step": 539032, "epoch": 6494} {"train_loss": -27.48160743713379, "global_step": 539033, "epoch": 6494} {"train_loss": -27.68686294555664, "global_step": 539034, "epoch": 6494} {"train_loss": -27.534406661987305, "global_step": 539035, "epoch": 6494} {"train_loss": -27.6278076171875, "global_step": 539036, "epoch": 6494} {"train_loss": -27.93373680114746, "global_step": 539037, "epoch": 6494} {"train_loss": -27.968957901000977, "global_step": 539038, "epoch": 6494} {"train_loss": -27.81879234313965, "global_step": 539039, "epoch": 6494} {"train_loss": -27.505096435546875, "global_step": 539040, "epoch": 6494} {"train_loss": -27.827611923217773, "global_step": 539041, "epoch": 6494} {"train_loss": -27.7196044921875, "global_step": 539042, "epoch": 6494} {"train_loss": -27.569751739501953, "global_step": 539043, "epoch": 6494} {"train_loss": -27.521947860717773, "global_step": 539044, "epoch": 6494} {"train_loss": -27.49904441833496, "global_step": 539045, "epoch": 6494} {"train_loss": -27.798114776611328, "global_step": 539046, "epoch": 6494} {"train_loss": -27.61983299255371, "global_step": 539047, "epoch": 6494} {"train_loss": -27.51862907409668, "global_step": 539048, "epoch": 6494} {"train_loss": -27.9571590423584, "global_step": 539049, "epoch": 6494} {"train_loss": -27.924619674682617, "global_step": 539050, "epoch": 6494} {"train_loss": -27.460371017456055, "global_step": 539051, "epoch": 6494} {"train_loss": -27.478546142578125, "global_step": 539052, "epoch": 6494} {"train_loss": -27.539764404296875, "global_step": 539053, "epoch": 6494} {"train_loss": -27.55499267578125, "global_step": 539054, "epoch": 6494} {"train_loss": -27.53594398498535, "global_step": 539055, "epoch": 6494} {"train_loss": -27.308801651000977, "global_step": 539056, "epoch": 6494} {"train_loss": -27.23517417907715, "global_step": 539057, "epoch": 6494} {"train_loss": -27.3959903717041, "global_step": 539058, "epoch": 6494} {"train_loss": -27.28626823425293, "global_step": 539059, "epoch": 6494} {"train_loss": -26.994604110717773, "global_step": 539060, "epoch": 6494} {"train_loss": -27.348974227905273, "global_step": 539061, "epoch": 6494} {"train_loss": -27.14069175720215, "global_step": 539062, "epoch": 6494} {"train_loss": -27.512441635131836, "global_step": 539063, "epoch": 6494} {"train_loss": -27.363332748413086, "global_step": 539064, "epoch": 6494} {"train_loss": -27.560504913330078, "global_step": 539065, "epoch": 6494} {"train_loss": -27.41346549987793, "global_step": 539066, "epoch": 6494} {"train_loss": -27.6348934173584, "global_step": 539067, "epoch": 6494} {"train_loss": -27.683080673217773, "global_step": 539068, "epoch": 6494} {"train_loss": -27.763507843017578, "global_step": 539069, "epoch": 6494} {"train_loss": -27.47930908203125, "global_step": 539070, "epoch": 6494} {"train_loss": -27.59425163269043, "global_step": 539071, "epoch": 6494} {"train_loss": -27.74456214904785, "global_step": 539072, "epoch": 6494} {"train_loss": -27.553564071655273, "global_step": 539073, "epoch": 6494} {"train_loss": -27.640655517578125, "global_step": 539074, "epoch": 6494} {"train_loss": -27.733081817626953, "global_step": 539075, "epoch": 6494} {"train_loss": -27.70586585998535, "global_step": 539076, "epoch": 6494} {"train_loss": -27.993520736694336, "global_step": 539077, "epoch": 6494} {"train_loss": -27.591211318969727, "global_step": 539078, "epoch": 6494} {"train_loss": -27.596826553344727, "global_step": 539079, "epoch": 6494} {"train_loss": -28.09272575378418, "global_step": 539080, "epoch": 6494} {"train_loss": -28.0120906829834, "global_step": 539081, "epoch": 6494} {"train_loss": -27.549169540405273, "global_step": 539082, "epoch": 6494} {"train_loss": -27.952619552612305, "global_step": 539083, "epoch": 6494} {"train_loss": -27.608806058584925, "global_step": 539084, "epoch": 6494, "val_loss": 6439188.0} {"train_loss": -26.66279411315918, "global_step": 539085, "epoch": 6495} {"train_loss": -27.018888473510742, "global_step": 539086, "epoch": 6495} {"train_loss": -27.573362350463867, "global_step": 539087, "epoch": 6495} {"train_loss": -27.4818058013916, "global_step": 539088, "epoch": 6495} {"train_loss": -27.06671142578125, "global_step": 539089, "epoch": 6495} {"train_loss": -27.158863067626953, "global_step": 539090, "epoch": 6495} {"train_loss": -27.52372169494629, "global_step": 539091, "epoch": 6495} {"train_loss": -27.25494956970215, "global_step": 539092, "epoch": 6495} {"train_loss": -27.469884872436523, "global_step": 539093, "epoch": 6495} {"train_loss": -27.53739356994629, "global_step": 539094, "epoch": 6495} {"train_loss": -27.122272491455078, "global_step": 539095, "epoch": 6495} {"train_loss": -27.38620376586914, "global_step": 539096, "epoch": 6495} {"train_loss": -27.629499435424805, "global_step": 539097, "epoch": 6495} {"train_loss": -27.422504425048828, "global_step": 539098, "epoch": 6495} {"train_loss": -27.35091209411621, "global_step": 539099, "epoch": 6495} {"train_loss": -27.625080108642578, "global_step": 539100, "epoch": 6495} {"train_loss": -27.848291397094727, "global_step": 539101, "epoch": 6495} {"train_loss": -27.524534225463867, "global_step": 539102, "epoch": 6495} {"train_loss": -28.03474235534668, "global_step": 539103, "epoch": 6495} {"train_loss": -27.43505859375, "global_step": 539104, "epoch": 6495} {"train_loss": -27.630918502807617, "global_step": 539105, "epoch": 6495} {"train_loss": -27.46356773376465, "global_step": 539106, "epoch": 6495} {"train_loss": -27.686386108398438, "global_step": 539107, "epoch": 6495} {"train_loss": -27.746225357055664, "global_step": 539108, "epoch": 6495} {"train_loss": -27.849857330322266, "global_step": 539109, "epoch": 6495} {"train_loss": -27.418201446533203, "global_step": 539110, "epoch": 6495} {"train_loss": -27.845722198486328, "global_step": 539111, "epoch": 6495} {"train_loss": -27.41986656188965, "global_step": 539112, "epoch": 6495} {"train_loss": -27.742828369140625, "global_step": 539113, "epoch": 6495} {"train_loss": -27.91156005859375, "global_step": 539114, "epoch": 6495} {"train_loss": -27.613300323486328, "global_step": 539115, "epoch": 6495} {"train_loss": -27.525665283203125, "global_step": 539116, "epoch": 6495} {"train_loss": -27.95416831970215, "global_step": 539117, "epoch": 6495} {"train_loss": -27.58087158203125, "global_step": 539118, "epoch": 6495} {"train_loss": -27.797040939331055, "global_step": 539119, "epoch": 6495} {"train_loss": -27.884435653686523, "global_step": 539120, "epoch": 6495} {"train_loss": -27.825408935546875, "global_step": 539121, "epoch": 6495} {"train_loss": -27.85906410217285, "global_step": 539122, "epoch": 6495} {"train_loss": -27.729171752929688, "global_step": 539123, "epoch": 6495} {"train_loss": -27.90778923034668, "global_step": 539124, "epoch": 6495} {"train_loss": -27.80148696899414, "global_step": 539125, "epoch": 6495} {"train_loss": -27.511335372924805, "global_step": 539126, "epoch": 6495} {"train_loss": -27.558761596679688, "global_step": 539127, "epoch": 6495} {"train_loss": -27.929365158081055, "global_step": 539128, "epoch": 6495} {"train_loss": -27.541349411010742, "global_step": 539129, "epoch": 6495} {"train_loss": -27.677642822265625, "global_step": 539130, "epoch": 6495} {"train_loss": -27.63091468811035, "global_step": 539131, "epoch": 6495} {"train_loss": -27.845001220703125, "global_step": 539132, "epoch": 6495} {"train_loss": -27.667682647705078, "global_step": 539133, "epoch": 6495} {"train_loss": -27.846485137939453, "global_step": 539134, "epoch": 6495} {"train_loss": -27.68145179748535, "global_step": 539135, "epoch": 6495} {"train_loss": -27.22218894958496, "global_step": 539136, "epoch": 6495} {"train_loss": -27.632965087890625, "global_step": 539137, "epoch": 6495} {"train_loss": -27.83540153503418, "global_step": 539138, "epoch": 6495} {"train_loss": -27.847900390625, "global_step": 539139, "epoch": 6495} {"train_loss": -27.498138427734375, "global_step": 539140, "epoch": 6495} {"train_loss": -27.809402465820312, "global_step": 539141, "epoch": 6495} {"train_loss": -27.3614444732666, "global_step": 539142, "epoch": 6495} {"train_loss": -27.1409912109375, "global_step": 539143, "epoch": 6495} {"train_loss": -26.993810653686523, "global_step": 539144, "epoch": 6495} {"train_loss": -26.79005241394043, "global_step": 539145, "epoch": 6495} {"train_loss": -27.447723388671875, "global_step": 539146, "epoch": 6495} {"train_loss": -27.542224884033203, "global_step": 539147, "epoch": 6495} {"train_loss": -27.09430503845215, "global_step": 539148, "epoch": 6495} {"train_loss": -27.493627548217773, "global_step": 539149, "epoch": 6495} {"train_loss": -27.545318603515625, "global_step": 539150, "epoch": 6495} {"train_loss": -27.381107330322266, "global_step": 539151, "epoch": 6495} {"train_loss": -27.530187606811523, "global_step": 539152, "epoch": 6495} {"train_loss": -27.110797882080078, "global_step": 539153, "epoch": 6495} {"train_loss": -27.1839656829834, "global_step": 539154, "epoch": 6495} {"train_loss": -27.448745727539062, "global_step": 539155, "epoch": 6495} {"train_loss": -27.342926025390625, "global_step": 539156, "epoch": 6495} {"train_loss": -27.54281997680664, "global_step": 539157, "epoch": 6495} {"train_loss": -27.595922470092773, "global_step": 539158, "epoch": 6495} {"train_loss": -27.190536499023438, "global_step": 539159, "epoch": 6495} {"train_loss": -27.457733154296875, "global_step": 539160, "epoch": 6495} {"train_loss": -27.352161407470703, "global_step": 539161, "epoch": 6495} {"train_loss": -27.35175132751465, "global_step": 539162, "epoch": 6495} {"train_loss": -27.254241943359375, "global_step": 539163, "epoch": 6495} {"train_loss": -27.670995712280273, "global_step": 539164, "epoch": 6495} {"train_loss": -27.388702392578125, "global_step": 539165, "epoch": 6495} {"train_loss": -27.366308212280273, "global_step": 539166, "epoch": 6495} {"train_loss": -27.529145252273743, "global_step": 539167, "epoch": 6495, "val_loss": 6510795.0} {"train_loss": -26.9454288482666, "global_step": 539168, "epoch": 6496} {"train_loss": -26.9488582611084, "global_step": 539169, "epoch": 6496} {"train_loss": -26.940704345703125, "global_step": 539170, "epoch": 6496} {"train_loss": -26.87458610534668, "global_step": 539171, "epoch": 6496} {"train_loss": -26.6238956451416, "global_step": 539172, "epoch": 6496} {"train_loss": -27.633075714111328, "global_step": 539173, "epoch": 6496} {"train_loss": -26.89927101135254, "global_step": 539174, "epoch": 6496} {"train_loss": -27.052343368530273, "global_step": 539175, "epoch": 6496} {"train_loss": -27.6473445892334, "global_step": 539176, "epoch": 6496} {"train_loss": -27.359567642211914, "global_step": 539177, "epoch": 6496} {"train_loss": -26.887924194335938, "global_step": 539178, "epoch": 6496} {"train_loss": -27.262836456298828, "global_step": 539179, "epoch": 6496} {"train_loss": -26.978973388671875, "global_step": 539180, "epoch": 6496} {"train_loss": -27.21381187438965, "global_step": 539181, "epoch": 6496} {"train_loss": -27.416147232055664, "global_step": 539182, "epoch": 6496} {"train_loss": -27.492151260375977, "global_step": 539183, "epoch": 6496} {"train_loss": -27.43647575378418, "global_step": 539184, "epoch": 6496} {"train_loss": -27.39411735534668, "global_step": 539185, "epoch": 6496} {"train_loss": -27.44305419921875, "global_step": 539186, "epoch": 6496} {"train_loss": -27.449726104736328, "global_step": 539187, "epoch": 6496} {"train_loss": -27.338897705078125, "global_step": 539188, "epoch": 6496} {"train_loss": -27.435522079467773, "global_step": 539189, "epoch": 6496} {"train_loss": -27.3841495513916, "global_step": 539190, "epoch": 6496} {"train_loss": -27.65517234802246, "global_step": 539191, "epoch": 6496} {"train_loss": -27.157583236694336, "global_step": 539192, "epoch": 6496} {"train_loss": -27.485401153564453, "global_step": 539193, "epoch": 6496} {"train_loss": -27.445819854736328, "global_step": 539194, "epoch": 6496} {"train_loss": -27.746564865112305, "global_step": 539195, "epoch": 6496} {"train_loss": -27.446212768554688, "global_step": 539196, "epoch": 6496} {"train_loss": -28.02606201171875, "global_step": 539197, "epoch": 6496} {"train_loss": -27.5344181060791, "global_step": 539198, "epoch": 6496} {"train_loss": -27.665241241455078, "global_step": 539199, "epoch": 6496} {"train_loss": -28.211252212524414, "global_step": 539200, "epoch": 6496} {"train_loss": -27.6806640625, "global_step": 539201, "epoch": 6496} {"train_loss": -27.705915451049805, "global_step": 539202, "epoch": 6496} {"train_loss": -27.94780921936035, "global_step": 539203, "epoch": 6496} {"train_loss": -27.595693588256836, "global_step": 539204, "epoch": 6496} {"train_loss": -27.493209838867188, "global_step": 539205, "epoch": 6496} {"train_loss": -27.677642822265625, "global_step": 539206, "epoch": 6496} {"train_loss": -27.554004669189453, "global_step": 539207, "epoch": 6496} {"train_loss": -27.435239791870117, "global_step": 539208, "epoch": 6496} {"train_loss": -27.87275505065918, "global_step": 539209, "epoch": 6496} {"train_loss": -27.626951217651367, "global_step": 539210, "epoch": 6496} {"train_loss": -27.7703800201416, "global_step": 539211, "epoch": 6496} {"train_loss": -27.945343017578125, "global_step": 539212, "epoch": 6496} {"train_loss": -27.69024085998535, "global_step": 539213, "epoch": 6496} {"train_loss": -28.046127319335938, "global_step": 539214, "epoch": 6496} {"train_loss": -27.6368350982666, "global_step": 539215, "epoch": 6496} {"train_loss": -27.709930419921875, "global_step": 539216, "epoch": 6496} {"train_loss": -27.9077091217041, "global_step": 539217, "epoch": 6496} {"train_loss": -27.77033805847168, "global_step": 539218, "epoch": 6496} {"train_loss": -27.689599990844727, "global_step": 539219, "epoch": 6496} {"train_loss": -28.014997482299805, "global_step": 539220, "epoch": 6496} {"train_loss": -27.382413864135742, "global_step": 539221, "epoch": 6496} {"train_loss": -27.714330673217773, "global_step": 539222, "epoch": 6496} {"train_loss": -27.93166160583496, "global_step": 539223, "epoch": 6496} {"train_loss": -27.348783493041992, "global_step": 539224, "epoch": 6496} {"train_loss": -27.585468292236328, "global_step": 539225, "epoch": 6496} {"train_loss": -27.69454002380371, "global_step": 539226, "epoch": 6496} {"train_loss": -27.466907501220703, "global_step": 539227, "epoch": 6496} {"train_loss": -27.8377628326416, "global_step": 539228, "epoch": 6496} {"train_loss": -28.006744384765625, "global_step": 539229, "epoch": 6496} {"train_loss": -27.614049911499023, "global_step": 539230, "epoch": 6496} {"train_loss": -27.50809669494629, "global_step": 539231, "epoch": 6496} {"train_loss": -27.699234008789062, "global_step": 539232, "epoch": 6496} {"train_loss": -27.675756454467773, "global_step": 539233, "epoch": 6496} {"train_loss": -27.692508697509766, "global_step": 539234, "epoch": 6496} {"train_loss": -27.37403678894043, "global_step": 539235, "epoch": 6496} {"train_loss": -27.418502807617188, "global_step": 539236, "epoch": 6496} {"train_loss": -27.6596622467041, "global_step": 539237, "epoch": 6496} {"train_loss": -27.673782348632812, "global_step": 539238, "epoch": 6496} {"train_loss": -27.282669067382812, "global_step": 539239, "epoch": 6496} {"train_loss": -27.489919662475586, "global_step": 539240, "epoch": 6496} {"train_loss": -28.01032066345215, "global_step": 539241, "epoch": 6496} {"train_loss": -27.864233016967773, "global_step": 539242, "epoch": 6496} {"train_loss": -27.74946403503418, "global_step": 539243, "epoch": 6496} {"train_loss": -27.42826271057129, "global_step": 539244, "epoch": 6496} {"train_loss": -27.217498779296875, "global_step": 539245, "epoch": 6496} {"train_loss": -27.702178955078125, "global_step": 539246, "epoch": 6496} {"train_loss": -27.34760093688965, "global_step": 539247, "epoch": 6496} {"train_loss": -27.75111961364746, "global_step": 539248, "epoch": 6496} {"train_loss": -27.863218307495117, "global_step": 539249, "epoch": 6496} {"train_loss": -27.55311800485634, "global_step": 539250, "epoch": 6496, "val_loss": 6442631.5} {"train_loss": -27.481643676757812, "global_step": 539251, "epoch": 6497} {"train_loss": -27.024511337280273, "global_step": 539252, "epoch": 6497} {"train_loss": -27.430282592773438, "global_step": 539253, "epoch": 6497} {"train_loss": -26.940048217773438, "global_step": 539254, "epoch": 6497} {"train_loss": -27.206769943237305, "global_step": 539255, "epoch": 6497} {"train_loss": -26.67947769165039, "global_step": 539256, "epoch": 6497} {"train_loss": -27.178924560546875, "global_step": 539257, "epoch": 6497} {"train_loss": -27.527362823486328, "global_step": 539258, "epoch": 6497} {"train_loss": -26.950794219970703, "global_step": 539259, "epoch": 6497} {"train_loss": -27.211374282836914, "global_step": 539260, "epoch": 6497} {"train_loss": -27.59955406188965, "global_step": 539261, "epoch": 6497} {"train_loss": -27.321292877197266, "global_step": 539262, "epoch": 6497} {"train_loss": -26.777307510375977, "global_step": 539263, "epoch": 6497} {"train_loss": -27.306058883666992, "global_step": 539264, "epoch": 6497} {"train_loss": -27.348682403564453, "global_step": 539265, "epoch": 6497} {"train_loss": -27.426603317260742, "global_step": 539266, "epoch": 6497} {"train_loss": -27.601709365844727, "global_step": 539267, "epoch": 6497} {"train_loss": -27.56340980529785, "global_step": 539268, "epoch": 6497} {"train_loss": -27.571014404296875, "global_step": 539269, "epoch": 6497} {"train_loss": -27.573522567749023, "global_step": 539270, "epoch": 6497} {"train_loss": -27.734394073486328, "global_step": 539271, "epoch": 6497} {"train_loss": -27.467121124267578, "global_step": 539272, "epoch": 6497} {"train_loss": -27.409345626831055, "global_step": 539273, "epoch": 6497} {"train_loss": -27.461706161499023, "global_step": 539274, "epoch": 6497} {"train_loss": -27.95815086364746, "global_step": 539275, "epoch": 6497} {"train_loss": -27.58795166015625, "global_step": 539276, "epoch": 6497} {"train_loss": -27.77907371520996, "global_step": 539277, "epoch": 6497} {"train_loss": -27.803503036499023, "global_step": 539278, "epoch": 6497} {"train_loss": -27.9041690826416, "global_step": 539279, "epoch": 6497} {"train_loss": -27.354816436767578, "global_step": 539280, "epoch": 6497} {"train_loss": -27.945043563842773, "global_step": 539281, "epoch": 6497} {"train_loss": -27.4407958984375, "global_step": 539282, "epoch": 6497} {"train_loss": -27.69268798828125, "global_step": 539283, "epoch": 6497} {"train_loss": -27.49053382873535, "global_step": 539284, "epoch": 6497} {"train_loss": -27.708112716674805, "global_step": 539285, "epoch": 6497} {"train_loss": -27.848804473876953, "global_step": 539286, "epoch": 6497} {"train_loss": -27.55694007873535, "global_step": 539287, "epoch": 6497} {"train_loss": -27.3614444732666, "global_step": 539288, "epoch": 6497} {"train_loss": -27.7271728515625, "global_step": 539289, "epoch": 6497} {"train_loss": -27.7733154296875, "global_step": 539290, "epoch": 6497} {"train_loss": -27.78472328186035, "global_step": 539291, "epoch": 6497} {"train_loss": -27.63600730895996, "global_step": 539292, "epoch": 6497} {"train_loss": -27.65413475036621, "global_step": 539293, "epoch": 6497} {"train_loss": -27.921859741210938, "global_step": 539294, "epoch": 6497} {"train_loss": -27.860410690307617, "global_step": 539295, "epoch": 6497} {"train_loss": -27.887723922729492, "global_step": 539296, "epoch": 6497} {"train_loss": -28.089155197143555, "global_step": 539297, "epoch": 6497} {"train_loss": -27.9093017578125, "global_step": 539298, "epoch": 6497} {"train_loss": -27.4506893157959, "global_step": 539299, "epoch": 6497} {"train_loss": -27.64375114440918, "global_step": 539300, "epoch": 6497} {"train_loss": -27.753820419311523, "global_step": 539301, "epoch": 6497} {"train_loss": -27.934629440307617, "global_step": 539302, "epoch": 6497} {"train_loss": -27.988666534423828, "global_step": 539303, "epoch": 6497} {"train_loss": -28.072004318237305, "global_step": 539304, "epoch": 6497} {"train_loss": -28.022266387939453, "global_step": 539305, "epoch": 6497} {"train_loss": -27.825382232666016, "global_step": 539306, "epoch": 6497} {"train_loss": -27.511510848999023, "global_step": 539307, "epoch": 6497} {"train_loss": -27.996662139892578, "global_step": 539308, "epoch": 6497} {"train_loss": -27.59657859802246, "global_step": 539309, "epoch": 6497} {"train_loss": -28.104578018188477, "global_step": 539310, "epoch": 6497} {"train_loss": -27.37445640563965, "global_step": 539311, "epoch": 6497} {"train_loss": -28.106220245361328, "global_step": 539312, "epoch": 6497} {"train_loss": -27.856374740600586, "global_step": 539313, "epoch": 6497} {"train_loss": -27.503202438354492, "global_step": 539314, "epoch": 6497} {"train_loss": -27.474416732788086, "global_step": 539315, "epoch": 6497} {"train_loss": -27.341238021850586, "global_step": 539316, "epoch": 6497} {"train_loss": -27.1243839263916, "global_step": 539317, "epoch": 6497} {"train_loss": -26.95258140563965, "global_step": 539318, "epoch": 6497} {"train_loss": -27.62546157836914, "global_step": 539319, "epoch": 6497} {"train_loss": -27.9099063873291, "global_step": 539320, "epoch": 6497} {"train_loss": -27.74539566040039, "global_step": 539321, "epoch": 6497} {"train_loss": -27.4699764251709, "global_step": 539322, "epoch": 6497} {"train_loss": -27.115890502929688, "global_step": 539323, "epoch": 6497} {"train_loss": -27.517744064331055, "global_step": 539324, "epoch": 6497} {"train_loss": -27.098981857299805, "global_step": 539325, "epoch": 6497} {"train_loss": -26.698835372924805, "global_step": 539326, "epoch": 6497} {"train_loss": -27.193044662475586, "global_step": 539327, "epoch": 6497} {"train_loss": -27.508014678955078, "global_step": 539328, "epoch": 6497} {"train_loss": -27.330615997314453, "global_step": 539329, "epoch": 6497} {"train_loss": -27.040563583374023, "global_step": 539330, "epoch": 6497} {"train_loss": -26.70136833190918, "global_step": 539331, "epoch": 6497} {"train_loss": -27.458166122436523, "global_step": 539332, "epoch": 6497} {"train_loss": -27.52285281721368, "global_step": 539333, "epoch": 6497, "val_loss": 6467142.0} {"train_loss": -27.1453800201416, "global_step": 539334, "epoch": 6498} {"train_loss": -26.678787231445312, "global_step": 539335, "epoch": 6498} {"train_loss": -25.62885093688965, "global_step": 539336, "epoch": 6498} {"train_loss": -26.2137393951416, "global_step": 539337, "epoch": 6498} {"train_loss": -26.730518341064453, "global_step": 539338, "epoch": 6498} {"train_loss": -26.2490177154541, "global_step": 539339, "epoch": 6498} {"train_loss": -27.24416160583496, "global_step": 539340, "epoch": 6498} {"train_loss": -26.72781753540039, "global_step": 539341, "epoch": 6498} {"train_loss": -26.96868324279785, "global_step": 539342, "epoch": 6498} {"train_loss": -27.25156021118164, "global_step": 539343, "epoch": 6498} {"train_loss": -26.93268394470215, "global_step": 539344, "epoch": 6498} {"train_loss": -27.1712589263916, "global_step": 539345, "epoch": 6498} {"train_loss": -27.467864990234375, "global_step": 539346, "epoch": 6498} {"train_loss": -26.83967399597168, "global_step": 539347, "epoch": 6498} {"train_loss": -26.878854751586914, "global_step": 539348, "epoch": 6498} {"train_loss": -27.299407958984375, "global_step": 539349, "epoch": 6498} {"train_loss": -27.05084800720215, "global_step": 539350, "epoch": 6498} {"train_loss": -27.698068618774414, "global_step": 539351, "epoch": 6498} {"train_loss": -27.34798240661621, "global_step": 539352, "epoch": 6498} {"train_loss": -27.465185165405273, "global_step": 539353, "epoch": 6498} {"train_loss": -27.30097007751465, "global_step": 539354, "epoch": 6498} {"train_loss": -27.110172271728516, "global_step": 539355, "epoch": 6498} {"train_loss": -27.309345245361328, "global_step": 539356, "epoch": 6498} {"train_loss": -27.236282348632812, "global_step": 539357, "epoch": 6498} {"train_loss": -27.408227920532227, "global_step": 539358, "epoch": 6498} {"train_loss": -27.46587562561035, "global_step": 539359, "epoch": 6498} {"train_loss": -27.562036514282227, "global_step": 539360, "epoch": 6498} {"train_loss": -27.716794967651367, "global_step": 539361, "epoch": 6498} {"train_loss": -27.612268447875977, "global_step": 539362, "epoch": 6498} {"train_loss": -27.550094604492188, "global_step": 539363, "epoch": 6498} {"train_loss": -27.480566024780273, "global_step": 539364, "epoch": 6498} {"train_loss": -27.599863052368164, "global_step": 539365, "epoch": 6498} {"train_loss": -27.4503231048584, "global_step": 539366, "epoch": 6498} {"train_loss": -27.607587814331055, "global_step": 539367, "epoch": 6498} {"train_loss": -27.256505966186523, "global_step": 539368, "epoch": 6498} {"train_loss": -27.533252716064453, "global_step": 539369, "epoch": 6498} {"train_loss": -27.672855377197266, "global_step": 539370, "epoch": 6498} {"train_loss": -27.736387252807617, "global_step": 539371, "epoch": 6498} {"train_loss": -27.713581085205078, "global_step": 539372, "epoch": 6498} {"train_loss": -27.692794799804688, "global_step": 539373, "epoch": 6498} {"train_loss": -27.70771598815918, "global_step": 539374, "epoch": 6498} {"train_loss": -27.819320678710938, "global_step": 539375, "epoch": 6498} {"train_loss": -27.868127822875977, "global_step": 539376, "epoch": 6498} {"train_loss": -28.20148277282715, "global_step": 539377, "epoch": 6498} {"train_loss": -27.762414932250977, "global_step": 539378, "epoch": 6498} {"train_loss": -27.972375869750977, "global_step": 539379, "epoch": 6498} {"train_loss": -27.618940353393555, "global_step": 539380, "epoch": 6498} {"train_loss": -27.8861083984375, "global_step": 539381, "epoch": 6498} {"train_loss": -27.82416343688965, "global_step": 539382, "epoch": 6498} {"train_loss": -27.7266845703125, "global_step": 539383, "epoch": 6498} {"train_loss": -27.816059112548828, "global_step": 539384, "epoch": 6498} {"train_loss": -27.772750854492188, "global_step": 539385, "epoch": 6498} {"train_loss": -27.626270294189453, "global_step": 539386, "epoch": 6498} {"train_loss": -27.58107566833496, "global_step": 539387, "epoch": 6498} {"train_loss": -26.658649444580078, "global_step": 539388, "epoch": 6498} {"train_loss": -27.591718673706055, "global_step": 539389, "epoch": 6498} {"train_loss": -27.440032958984375, "global_step": 539390, "epoch": 6498} {"train_loss": -27.59090232849121, "global_step": 539391, "epoch": 6498} {"train_loss": -27.38103675842285, "global_step": 539392, "epoch": 6498} {"train_loss": -27.590381622314453, "global_step": 539393, "epoch": 6498} {"train_loss": -27.400165557861328, "global_step": 539394, "epoch": 6498} {"train_loss": -27.4084529876709, "global_step": 539395, "epoch": 6498} {"train_loss": -27.734891891479492, "global_step": 539396, "epoch": 6498} {"train_loss": -27.39544105529785, "global_step": 539397, "epoch": 6498} {"train_loss": -27.26325798034668, "global_step": 539398, "epoch": 6498} {"train_loss": -27.59236717224121, "global_step": 539399, "epoch": 6498} {"train_loss": -27.715259552001953, "global_step": 539400, "epoch": 6498} {"train_loss": -27.923864364624023, "global_step": 539401, "epoch": 6498} {"train_loss": -28.001890182495117, "global_step": 539402, "epoch": 6498} {"train_loss": -27.669118881225586, "global_step": 539403, "epoch": 6498} {"train_loss": -27.619596481323242, "global_step": 539404, "epoch": 6498} {"train_loss": -27.7316951751709, "global_step": 539405, "epoch": 6498} {"train_loss": -27.755966186523438, "global_step": 539406, "epoch": 6498} {"train_loss": -27.503509521484375, "global_step": 539407, "epoch": 6498} {"train_loss": -28.02577018737793, "global_step": 539408, "epoch": 6498} {"train_loss": -27.859323501586914, "global_step": 539409, "epoch": 6498} {"train_loss": -27.41766929626465, "global_step": 539410, "epoch": 6498} {"train_loss": -27.93703269958496, "global_step": 539411, "epoch": 6498} {"train_loss": -27.653711318969727, "global_step": 539412, "epoch": 6498} {"train_loss": -27.789037704467773, "global_step": 539413, "epoch": 6498} {"train_loss": -27.879541397094727, "global_step": 539414, "epoch": 6498} {"train_loss": -27.915454864501953, "global_step": 539415, "epoch": 6498} {"train_loss": -27.476999443697643, "global_step": 539416, "epoch": 6498, "val_loss": 6480639.0} {"train_loss": -26.9689998626709, "global_step": 539417, "epoch": 6499} {"train_loss": -26.500629425048828, "global_step": 539418, "epoch": 6499} {"train_loss": -25.68000602722168, "global_step": 539419, "epoch": 6499} {"train_loss": -26.14008140563965, "global_step": 539420, "epoch": 6499} {"train_loss": -27.678495407104492, "global_step": 539421, "epoch": 6499} {"train_loss": -26.41619300842285, "global_step": 539422, "epoch": 6499} {"train_loss": -27.217344284057617, "global_step": 539423, "epoch": 6499} {"train_loss": -27.14142417907715, "global_step": 539424, "epoch": 6499} {"train_loss": -27.48914909362793, "global_step": 539425, "epoch": 6499} {"train_loss": -27.192764282226562, "global_step": 539426, "epoch": 6499} {"train_loss": -27.29020118713379, "global_step": 539427, "epoch": 6499} {"train_loss": -27.4464168548584, "global_step": 539428, "epoch": 6499} {"train_loss": -27.304601669311523, "global_step": 539429, "epoch": 6499} {"train_loss": -26.889495849609375, "global_step": 539430, "epoch": 6499} {"train_loss": -27.44232749938965, "global_step": 539431, "epoch": 6499} {"train_loss": -27.46931266784668, "global_step": 539432, "epoch": 6499} {"train_loss": -27.634992599487305, "global_step": 539433, "epoch": 6499} {"train_loss": -27.493566513061523, "global_step": 539434, "epoch": 6499} {"train_loss": -27.397977828979492, "global_step": 539435, "epoch": 6499} {"train_loss": -27.68220329284668, "global_step": 539436, "epoch": 6499} {"train_loss": -26.936792373657227, "global_step": 539437, "epoch": 6499} {"train_loss": -27.48773765563965, "global_step": 539438, "epoch": 6499} {"train_loss": -27.428516387939453, "global_step": 539439, "epoch": 6499} {"train_loss": -27.50973892211914, "global_step": 539440, "epoch": 6499} {"train_loss": -27.591995239257812, "global_step": 539441, "epoch": 6499} {"train_loss": -27.56422996520996, "global_step": 539442, "epoch": 6499} {"train_loss": -27.371267318725586, "global_step": 539443, "epoch": 6499} {"train_loss": -27.65289878845215, "global_step": 539444, "epoch": 6499} {"train_loss": -27.08147621154785, "global_step": 539445, "epoch": 6499} {"train_loss": -27.527862548828125, "global_step": 539446, "epoch": 6499} {"train_loss": -28.203475952148438, "global_step": 539447, "epoch": 6499} {"train_loss": -27.6897029876709, "global_step": 539448, "epoch": 6499} {"train_loss": -27.7183837890625, "global_step": 539449, "epoch": 6499} {"train_loss": -27.20796775817871, "global_step": 539450, "epoch": 6499} {"train_loss": -27.786487579345703, "global_step": 539451, "epoch": 6499} {"train_loss": -27.846479415893555, "global_step": 539452, "epoch": 6499} {"train_loss": -27.39447021484375, "global_step": 539453, "epoch": 6499} {"train_loss": -27.758209228515625, "global_step": 539454, "epoch": 6499} {"train_loss": -27.713560104370117, "global_step": 539455, "epoch": 6499} {"train_loss": -27.6423282623291, "global_step": 539456, "epoch": 6499} {"train_loss": -27.365570068359375, "global_step": 539457, "epoch": 6499} {"train_loss": -27.923355102539062, "global_step": 539458, "epoch": 6499} {"train_loss": -27.52479362487793, "global_step": 539459, "epoch": 6499} {"train_loss": -27.362548828125, "global_step": 539460, "epoch": 6499} {"train_loss": -26.736480712890625, "global_step": 539461, "epoch": 6499} {"train_loss": -27.03658103942871, "global_step": 539462, "epoch": 6499} {"train_loss": -27.71462059020996, "global_step": 539463, "epoch": 6499} {"train_loss": -27.402952194213867, "global_step": 539464, "epoch": 6499} {"train_loss": -26.8960018157959, "global_step": 539465, "epoch": 6499} {"train_loss": -27.221927642822266, "global_step": 539466, "epoch": 6499} {"train_loss": -27.298673629760742, "global_step": 539467, "epoch": 6499} {"train_loss": -27.238916397094727, "global_step": 539468, "epoch": 6499} {"train_loss": -27.54730796813965, "global_step": 539469, "epoch": 6499} {"train_loss": -27.054656982421875, "global_step": 539470, "epoch": 6499} {"train_loss": -27.47027587890625, "global_step": 539471, "epoch": 6499} {"train_loss": -27.57484245300293, "global_step": 539472, "epoch": 6499} {"train_loss": -27.06145668029785, "global_step": 539473, "epoch": 6499} {"train_loss": -27.458112716674805, "global_step": 539474, "epoch": 6499} {"train_loss": -27.2255916595459, "global_step": 539475, "epoch": 6499} {"train_loss": -27.489988327026367, "global_step": 539476, "epoch": 6499} {"train_loss": -27.827503204345703, "global_step": 539477, "epoch": 6499} {"train_loss": -27.548608779907227, "global_step": 539478, "epoch": 6499} {"train_loss": -27.413427352905273, "global_step": 539479, "epoch": 6499} {"train_loss": -27.561304092407227, "global_step": 539480, "epoch": 6499} {"train_loss": -27.808176040649414, "global_step": 539481, "epoch": 6499} {"train_loss": -27.358245849609375, "global_step": 539482, "epoch": 6499} {"train_loss": -27.800567626953125, "global_step": 539483, "epoch": 6499} {"train_loss": -27.707000732421875, "global_step": 539484, "epoch": 6499} {"train_loss": -27.28903579711914, "global_step": 539485, "epoch": 6499} {"train_loss": -27.851871490478516, "global_step": 539486, "epoch": 6499} {"train_loss": -27.5430965423584, "global_step": 539487, "epoch": 6499} {"train_loss": -27.500463485717773, "global_step": 539488, "epoch": 6499} {"train_loss": -27.759567260742188, "global_step": 539489, "epoch": 6499} {"train_loss": -27.77875328063965, "global_step": 539490, "epoch": 6499} {"train_loss": -27.746259689331055, "global_step": 539491, "epoch": 6499} {"train_loss": -27.323444366455078, "global_step": 539492, "epoch": 6499} {"train_loss": -27.452743530273438, "global_step": 539493, "epoch": 6499} {"train_loss": -27.842884063720703, "global_step": 539494, "epoch": 6499} {"train_loss": -27.771713256835938, "global_step": 539495, "epoch": 6499} {"train_loss": -27.442123413085938, "global_step": 539496, "epoch": 6499} {"train_loss": -27.257461547851562, "global_step": 539497, "epoch": 6499} {"train_loss": -27.662952423095703, "global_step": 539498, "epoch": 6499} {"train_loss": -27.417401509112622, "global_step": 539499, "epoch": 6499, "val_loss": 6435393.0} {"train_loss": -27.389739990234375, "global_step": 539500, "epoch": 6500} {"train_loss": -27.669830322265625, "global_step": 539501, "epoch": 6500} {"train_loss": -27.67289161682129, "global_step": 539502, "epoch": 6500} {"train_loss": -27.56049919128418, "global_step": 539503, "epoch": 6500} {"train_loss": -27.607437133789062, "global_step": 539504, "epoch": 6500} {"train_loss": -27.44952392578125, "global_step": 539505, "epoch": 6500} {"train_loss": -27.07139015197754, "global_step": 539506, "epoch": 6500} {"train_loss": -27.44807243347168, "global_step": 539507, "epoch": 6500} {"train_loss": -27.770944595336914, "global_step": 539508, "epoch": 6500} {"train_loss": -27.5497989654541, "global_step": 539509, "epoch": 6500} {"train_loss": -27.25812339782715, "global_step": 539510, "epoch": 6500} {"train_loss": -27.75274658203125, "global_step": 539511, "epoch": 6500} {"train_loss": -27.650976181030273, "global_step": 539512, "epoch": 6500} {"train_loss": -27.768640518188477, "global_step": 539513, "epoch": 6500} {"train_loss": -27.601287841796875, "global_step": 539514, "epoch": 6500} {"train_loss": -27.48341941833496, "global_step": 539515, "epoch": 6500} {"train_loss": -27.37274742126465, "global_step": 539516, "epoch": 6500} {"train_loss": -27.824676513671875, "global_step": 539517, "epoch": 6500} {"train_loss": -27.277734756469727, "global_step": 539518, "epoch": 6500} {"train_loss": -27.929752349853516, "global_step": 539519, "epoch": 6500} {"train_loss": -27.61256217956543, "global_step": 539520, "epoch": 6500} {"train_loss": -27.413105010986328, "global_step": 539521, "epoch": 6500} {"train_loss": -27.54726219177246, "global_step": 539522, "epoch": 6500} {"train_loss": -27.669042587280273, "global_step": 539523, "epoch": 6500} {"train_loss": -27.6789493560791, "global_step": 539524, "epoch": 6500} {"train_loss": -27.919422149658203, "global_step": 539525, "epoch": 6500} {"train_loss": -27.5416316986084, "global_step": 539526, "epoch": 6500} {"train_loss": -27.5252685546875, "global_step": 539527, "epoch": 6500} {"train_loss": -27.54159927368164, "global_step": 539528, "epoch": 6500} {"train_loss": -27.821805953979492, "global_step": 539529, "epoch": 6500} {"train_loss": -27.777372360229492, "global_step": 539530, "epoch": 6500} {"train_loss": -27.887250900268555, "global_step": 539531, "epoch": 6500} {"train_loss": -28.096546173095703, "global_step": 539532, "epoch": 6500} {"train_loss": -27.6593074798584, "global_step": 539533, "epoch": 6500} {"train_loss": -27.68052101135254, "global_step": 539534, "epoch": 6500} {"train_loss": -27.773645401000977, "global_step": 539535, "epoch": 6500} {"train_loss": -28.1878719329834, "global_step": 539536, "epoch": 6500} {"train_loss": -27.670700073242188, "global_step": 539537, "epoch": 6500} {"train_loss": -27.121274948120117, "global_step": 539538, "epoch": 6500} {"train_loss": -27.714435577392578, "global_step": 539539, "epoch": 6500} {"train_loss": -27.574758529663086, "global_step": 539540, "epoch": 6500} {"train_loss": -27.6762752532959, "global_step": 539541, "epoch": 6500} {"train_loss": -28.0822696685791, "global_step": 539542, "epoch": 6500} {"train_loss": -27.4278564453125, "global_step": 539543, "epoch": 6500} {"train_loss": -27.971323013305664, "global_step": 539544, "epoch": 6500} {"train_loss": -27.9566707611084, "global_step": 539545, "epoch": 6500} {"train_loss": -27.952177047729492, "global_step": 539546, "epoch": 6500} {"train_loss": -27.631031036376953, "global_step": 539547, "epoch": 6500} {"train_loss": -27.087430953979492, "global_step": 539548, "epoch": 6500} {"train_loss": -26.88697624206543, "global_step": 539549, "epoch": 6500} {"train_loss": -26.401782989501953, "global_step": 539550, "epoch": 6500} {"train_loss": -26.530481338500977, "global_step": 539551, "epoch": 6500} {"train_loss": -26.442113876342773, "global_step": 539552, "epoch": 6500} {"train_loss": -27.696874618530273, "global_step": 539553, "epoch": 6500} {"train_loss": -27.497573852539062, "global_step": 539554, "epoch": 6500} {"train_loss": -27.400421142578125, "global_step": 539555, "epoch": 6500} {"train_loss": -27.453962326049805, "global_step": 539556, "epoch": 6500} {"train_loss": -27.31894874572754, "global_step": 539557, "epoch": 6500} {"train_loss": -27.597463607788086, "global_step": 539558, "epoch": 6500} {"train_loss": -27.21402931213379, "global_step": 539559, "epoch": 6500} {"train_loss": -27.637784957885742, "global_step": 539560, "epoch": 6500} {"train_loss": -27.32840919494629, "global_step": 539561, "epoch": 6500} {"train_loss": -27.689722061157227, "global_step": 539562, "epoch": 6500} {"train_loss": -27.5467586517334, "global_step": 539563, "epoch": 6500} {"train_loss": -27.459522247314453, "global_step": 539564, "epoch": 6500} {"train_loss": -27.579498291015625, "global_step": 539565, "epoch": 6500} {"train_loss": -27.371601104736328, "global_step": 539566, "epoch": 6500} {"train_loss": -27.43806266784668, "global_step": 539567, "epoch": 6500} {"train_loss": -27.737287521362305, "global_step": 539568, "epoch": 6500} {"train_loss": -27.477304458618164, "global_step": 539569, "epoch": 6500} {"train_loss": -27.51861572265625, "global_step": 539570, "epoch": 6500} {"train_loss": -27.428058624267578, "global_step": 539571, "epoch": 6500} {"train_loss": -27.6756649017334, "global_step": 539572, "epoch": 6500} {"train_loss": -27.651647567749023, "global_step": 539573, "epoch": 6500} {"train_loss": -27.48004722595215, "global_step": 539574, "epoch": 6500} {"train_loss": -27.684614181518555, "global_step": 539575, "epoch": 6500} {"train_loss": -27.8857479095459, "global_step": 539576, "epoch": 6500} {"train_loss": -27.720001220703125, "global_step": 539577, "epoch": 6500} {"train_loss": -27.59160804748535, "global_step": 539578, "epoch": 6500} {"train_loss": -27.601415634155273, "global_step": 539579, "epoch": 6500} {"train_loss": -27.79664421081543, "global_step": 539580, "epoch": 6500} {"train_loss": -27.93390464782715, "global_step": 539581, "epoch": 6500} {"train_loss": -27.582928462200854, "global_step": 539582, "epoch": 6500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6471360.0} {"train_loss": -27.57708168029785, "global_step": 539583, "epoch": 6501} {"train_loss": -27.05940818786621, "global_step": 539584, "epoch": 6501} {"train_loss": -27.357885360717773, "global_step": 539585, "epoch": 6501} {"train_loss": -27.42719841003418, "global_step": 539586, "epoch": 6501} {"train_loss": -27.2824764251709, "global_step": 539587, "epoch": 6501} {"train_loss": -26.787900924682617, "global_step": 539588, "epoch": 6501} {"train_loss": -26.70844078063965, "global_step": 539589, "epoch": 6501} {"train_loss": -27.355182647705078, "global_step": 539590, "epoch": 6501} {"train_loss": -27.5194034576416, "global_step": 539591, "epoch": 6501} {"train_loss": -27.22149658203125, "global_step": 539592, "epoch": 6501} {"train_loss": -27.66437339782715, "global_step": 539593, "epoch": 6501} {"train_loss": -27.225122451782227, "global_step": 539594, "epoch": 6501} {"train_loss": -27.648941040039062, "global_step": 539595, "epoch": 6501} {"train_loss": -27.30402946472168, "global_step": 539596, "epoch": 6501} {"train_loss": -27.041772842407227, "global_step": 539597, "epoch": 6501} {"train_loss": -27.20081901550293, "global_step": 539598, "epoch": 6501} {"train_loss": -27.9422550201416, "global_step": 539599, "epoch": 6501} {"train_loss": -27.28759765625, "global_step": 539600, "epoch": 6501} {"train_loss": -27.466108322143555, "global_step": 539601, "epoch": 6501} {"train_loss": -27.47359275817871, "global_step": 539602, "epoch": 6501} {"train_loss": -27.70098304748535, "global_step": 539603, "epoch": 6501} {"train_loss": -27.233732223510742, "global_step": 539604, "epoch": 6501} {"train_loss": -27.370702743530273, "global_step": 539605, "epoch": 6501} {"train_loss": -27.519485473632812, "global_step": 539606, "epoch": 6501} {"train_loss": -27.52361488342285, "global_step": 539607, "epoch": 6501} {"train_loss": -27.719913482666016, "global_step": 539608, "epoch": 6501} {"train_loss": -27.80512046813965, "global_step": 539609, "epoch": 6501} {"train_loss": -27.410358428955078, "global_step": 539610, "epoch": 6501} {"train_loss": -27.78986167907715, "global_step": 539611, "epoch": 6501} {"train_loss": -27.944379806518555, "global_step": 539612, "epoch": 6501} {"train_loss": -27.622709274291992, "global_step": 539613, "epoch": 6501} {"train_loss": -27.7260684967041, "global_step": 539614, "epoch": 6501} {"train_loss": -27.4632568359375, "global_step": 539615, "epoch": 6501} {"train_loss": -27.19529151916504, "global_step": 539616, "epoch": 6501} {"train_loss": -27.840147018432617, "global_step": 539617, "epoch": 6501} {"train_loss": -27.75480079650879, "global_step": 539618, "epoch": 6501} {"train_loss": -27.576858520507812, "global_step": 539619, "epoch": 6501} {"train_loss": -27.469802856445312, "global_step": 539620, "epoch": 6501} {"train_loss": -27.35479736328125, "global_step": 539621, "epoch": 6501} {"train_loss": -27.395788192749023, "global_step": 539622, "epoch": 6501} {"train_loss": -27.672082901000977, "global_step": 539623, "epoch": 6501} {"train_loss": -27.919403076171875, "global_step": 539624, "epoch": 6501} {"train_loss": -27.67374038696289, "global_step": 539625, "epoch": 6501} {"train_loss": -27.784442901611328, "global_step": 539626, "epoch": 6501} {"train_loss": -27.9340877532959, "global_step": 539627, "epoch": 6501} {"train_loss": -27.74494743347168, "global_step": 539628, "epoch": 6501} {"train_loss": -27.71634292602539, "global_step": 539629, "epoch": 6501} {"train_loss": -27.97858238220215, "global_step": 539630, "epoch": 6501} {"train_loss": -27.254209518432617, "global_step": 539631, "epoch": 6501} {"train_loss": -27.963300704956055, "global_step": 539632, "epoch": 6501} {"train_loss": -27.803619384765625, "global_step": 539633, "epoch": 6501} {"train_loss": -27.836750030517578, "global_step": 539634, "epoch": 6501} {"train_loss": -27.746265411376953, "global_step": 539635, "epoch": 6501} {"train_loss": -27.905048370361328, "global_step": 539636, "epoch": 6501} {"train_loss": -27.692169189453125, "global_step": 539637, "epoch": 6501} {"train_loss": -27.89870262145996, "global_step": 539638, "epoch": 6501} {"train_loss": -27.6353702545166, "global_step": 539639, "epoch": 6501} {"train_loss": -27.739612579345703, "global_step": 539640, "epoch": 6501} {"train_loss": -27.86478042602539, "global_step": 539641, "epoch": 6501} {"train_loss": -27.162982940673828, "global_step": 539642, "epoch": 6501} {"train_loss": -27.602645874023438, "global_step": 539643, "epoch": 6501} {"train_loss": -27.527929306030273, "global_step": 539644, "epoch": 6501} {"train_loss": -27.921600341796875, "global_step": 539645, "epoch": 6501} {"train_loss": -27.493871688842773, "global_step": 539646, "epoch": 6501} {"train_loss": -27.276647567749023, "global_step": 539647, "epoch": 6501} {"train_loss": -27.7758731842041, "global_step": 539648, "epoch": 6501} {"train_loss": -27.597997665405273, "global_step": 539649, "epoch": 6501} {"train_loss": -27.920486450195312, "global_step": 539650, "epoch": 6501} {"train_loss": -27.479156494140625, "global_step": 539651, "epoch": 6501} {"train_loss": -27.740650177001953, "global_step": 539652, "epoch": 6501} {"train_loss": -27.8395938873291, "global_step": 539653, "epoch": 6501} {"train_loss": -27.693204879760742, "global_step": 539654, "epoch": 6501} {"train_loss": -27.667768478393555, "global_step": 539655, "epoch": 6501} {"train_loss": -27.84516716003418, "global_step": 539656, "epoch": 6501} {"train_loss": -28.04437255859375, "global_step": 539657, "epoch": 6501} {"train_loss": -27.674177169799805, "global_step": 539658, "epoch": 6501} {"train_loss": -27.681127548217773, "global_step": 539659, "epoch": 6501} {"train_loss": -27.370996475219727, "global_step": 539660, "epoch": 6501} {"train_loss": -27.869129180908203, "global_step": 539661, "epoch": 6501} {"train_loss": -27.664474487304688, "global_step": 539662, "epoch": 6501} {"train_loss": -27.754993438720703, "global_step": 539663, "epoch": 6501} {"train_loss": -27.439428329467773, "global_step": 539664, "epoch": 6501} {"train_loss": -27.58942911998335, "global_step": 539665, "epoch": 6501, "val_loss": 6485069.0} {"train_loss": -27.485891342163086, "global_step": 539666, "epoch": 6502} {"train_loss": -26.543079376220703, "global_step": 539667, "epoch": 6502} {"train_loss": -25.53194236755371, "global_step": 539668, "epoch": 6502} {"train_loss": -26.08603858947754, "global_step": 539669, "epoch": 6502} {"train_loss": -26.214954376220703, "global_step": 539670, "epoch": 6502} {"train_loss": -26.79087257385254, "global_step": 539671, "epoch": 6502} {"train_loss": -27.169504165649414, "global_step": 539672, "epoch": 6502} {"train_loss": -26.8030948638916, "global_step": 539673, "epoch": 6502} {"train_loss": -26.909521102905273, "global_step": 539674, "epoch": 6502} {"train_loss": -27.42313003540039, "global_step": 539675, "epoch": 6502} {"train_loss": -27.33070182800293, "global_step": 539676, "epoch": 6502} {"train_loss": -27.265365600585938, "global_step": 539677, "epoch": 6502} {"train_loss": -27.47319984436035, "global_step": 539678, "epoch": 6502} {"train_loss": -26.86528968811035, "global_step": 539679, "epoch": 6502} {"train_loss": -27.51661491394043, "global_step": 539680, "epoch": 6502} {"train_loss": -27.65718650817871, "global_step": 539681, "epoch": 6502} {"train_loss": -27.527423858642578, "global_step": 539682, "epoch": 6502} {"train_loss": -27.608966827392578, "global_step": 539683, "epoch": 6502} {"train_loss": -27.608707427978516, "global_step": 539684, "epoch": 6502} {"train_loss": -27.019392013549805, "global_step": 539685, "epoch": 6502} {"train_loss": -27.428964614868164, "global_step": 539686, "epoch": 6502} {"train_loss": -27.192209243774414, "global_step": 539687, "epoch": 6502} {"train_loss": -27.642078399658203, "global_step": 539688, "epoch": 6502} {"train_loss": -27.049924850463867, "global_step": 539689, "epoch": 6502} {"train_loss": -27.749555587768555, "global_step": 539690, "epoch": 6502} {"train_loss": -27.399133682250977, "global_step": 539691, "epoch": 6502} {"train_loss": -27.53204345703125, "global_step": 539692, "epoch": 6502} {"train_loss": -27.467941284179688, "global_step": 539693, "epoch": 6502} {"train_loss": -27.7291259765625, "global_step": 539694, "epoch": 6502} {"train_loss": -27.48533058166504, "global_step": 539695, "epoch": 6502} {"train_loss": -27.604007720947266, "global_step": 539696, "epoch": 6502} {"train_loss": -27.761676788330078, "global_step": 539697, "epoch": 6502} {"train_loss": -27.834684371948242, "global_step": 539698, "epoch": 6502} {"train_loss": -27.489002227783203, "global_step": 539699, "epoch": 6502} {"train_loss": -27.564666748046875, "global_step": 539700, "epoch": 6502} {"train_loss": -27.72833251953125, "global_step": 539701, "epoch": 6502} {"train_loss": -27.6632137298584, "global_step": 539702, "epoch": 6502} {"train_loss": -27.400821685791016, "global_step": 539703, "epoch": 6502} {"train_loss": -27.51246452331543, "global_step": 539704, "epoch": 6502} {"train_loss": -27.66278648376465, "global_step": 539705, "epoch": 6502} {"train_loss": -27.754779815673828, "global_step": 539706, "epoch": 6502} {"train_loss": -27.712865829467773, "global_step": 539707, "epoch": 6502} {"train_loss": -27.619565963745117, "global_step": 539708, "epoch": 6502} {"train_loss": -27.90717124938965, "global_step": 539709, "epoch": 6502} {"train_loss": -27.7643985748291, "global_step": 539710, "epoch": 6502} {"train_loss": -27.52817153930664, "global_step": 539711, "epoch": 6502} {"train_loss": -28.07573890686035, "global_step": 539712, "epoch": 6502} {"train_loss": -28.0032901763916, "global_step": 539713, "epoch": 6502} {"train_loss": -28.131635665893555, "global_step": 539714, "epoch": 6502} {"train_loss": -27.733306884765625, "global_step": 539715, "epoch": 6502} {"train_loss": -27.87177085876465, "global_step": 539716, "epoch": 6502} {"train_loss": -27.803632736206055, "global_step": 539717, "epoch": 6502} {"train_loss": -27.73664665222168, "global_step": 539718, "epoch": 6502} {"train_loss": -27.387954711914062, "global_step": 539719, "epoch": 6502} {"train_loss": -27.883590698242188, "global_step": 539720, "epoch": 6502} {"train_loss": -27.71331214904785, "global_step": 539721, "epoch": 6502} {"train_loss": -27.7443904876709, "global_step": 539722, "epoch": 6502} {"train_loss": -27.45222282409668, "global_step": 539723, "epoch": 6502} {"train_loss": -27.247766494750977, "global_step": 539724, "epoch": 6502} {"train_loss": -27.249496459960938, "global_step": 539725, "epoch": 6502} {"train_loss": -27.704389572143555, "global_step": 539726, "epoch": 6502} {"train_loss": -28.02115821838379, "global_step": 539727, "epoch": 6502} {"train_loss": -27.566797256469727, "global_step": 539728, "epoch": 6502} {"train_loss": -27.118518829345703, "global_step": 539729, "epoch": 6502} {"train_loss": -27.722747802734375, "global_step": 539730, "epoch": 6502} {"train_loss": -27.728925704956055, "global_step": 539731, "epoch": 6502} {"train_loss": -27.96455955505371, "global_step": 539732, "epoch": 6502} {"train_loss": -28.18012809753418, "global_step": 539733, "epoch": 6502} {"train_loss": -27.292734146118164, "global_step": 539734, "epoch": 6502} {"train_loss": -27.589502334594727, "global_step": 539735, "epoch": 6502} {"train_loss": -27.489124298095703, "global_step": 539736, "epoch": 6502} {"train_loss": -27.873937606811523, "global_step": 539737, "epoch": 6502} {"train_loss": -27.3546085357666, "global_step": 539738, "epoch": 6502} {"train_loss": -27.549015045166016, "global_step": 539739, "epoch": 6502} {"train_loss": -27.515966415405273, "global_step": 539740, "epoch": 6502} {"train_loss": -27.4080867767334, "global_step": 539741, "epoch": 6502} {"train_loss": -27.846988677978516, "global_step": 539742, "epoch": 6502} {"train_loss": -27.736541748046875, "global_step": 539743, "epoch": 6502} {"train_loss": -27.662281036376953, "global_step": 539744, "epoch": 6502} {"train_loss": -27.730085372924805, "global_step": 539745, "epoch": 6502} {"train_loss": -27.605436325073242, "global_step": 539746, "epoch": 6502} {"train_loss": -28.08970069885254, "global_step": 539747, "epoch": 6502} {"train_loss": -27.516055302447583, "global_step": 539748, "epoch": 6502, "val_loss": 6410386.0} {"train_loss": -25.624902725219727, "global_step": 539749, "epoch": 6503} {"train_loss": -26.689441680908203, "global_step": 539750, "epoch": 6503} {"train_loss": -26.1452579498291, "global_step": 539751, "epoch": 6503} {"train_loss": -26.689697265625, "global_step": 539752, "epoch": 6503} {"train_loss": -26.743255615234375, "global_step": 539753, "epoch": 6503} {"train_loss": -26.575895309448242, "global_step": 539754, "epoch": 6503} {"train_loss": -27.28102684020996, "global_step": 539755, "epoch": 6503} {"train_loss": -26.401077270507812, "global_step": 539756, "epoch": 6503} {"train_loss": -26.765378952026367, "global_step": 539757, "epoch": 6503} {"train_loss": -27.148263931274414, "global_step": 539758, "epoch": 6503} {"train_loss": -26.724090576171875, "global_step": 539759, "epoch": 6503} {"train_loss": -27.266056060791016, "global_step": 539760, "epoch": 6503} {"train_loss": -26.851566314697266, "global_step": 539761, "epoch": 6503} {"train_loss": -27.023651123046875, "global_step": 539762, "epoch": 6503} {"train_loss": -27.60672950744629, "global_step": 539763, "epoch": 6503} {"train_loss": -27.01212501525879, "global_step": 539764, "epoch": 6503} {"train_loss": -27.26025390625, "global_step": 539765, "epoch": 6503} {"train_loss": -27.362905502319336, "global_step": 539766, "epoch": 6503} {"train_loss": -27.31989097595215, "global_step": 539767, "epoch": 6503} {"train_loss": -26.956287384033203, "global_step": 539768, "epoch": 6503} {"train_loss": -27.3353214263916, "global_step": 539769, "epoch": 6503} {"train_loss": -27.296483993530273, "global_step": 539770, "epoch": 6503} {"train_loss": -27.526952743530273, "global_step": 539771, "epoch": 6503} {"train_loss": -27.63286781311035, "global_step": 539772, "epoch": 6503} {"train_loss": -27.67609214782715, "global_step": 539773, "epoch": 6503} {"train_loss": -27.66999626159668, "global_step": 539774, "epoch": 6503} {"train_loss": -27.706623077392578, "global_step": 539775, "epoch": 6503} {"train_loss": -27.663623809814453, "global_step": 539776, "epoch": 6503} {"train_loss": -27.758453369140625, "global_step": 539777, "epoch": 6503} {"train_loss": -27.846242904663086, "global_step": 539778, "epoch": 6503} {"train_loss": -27.304264068603516, "global_step": 539779, "epoch": 6503} {"train_loss": -27.579015731811523, "global_step": 539780, "epoch": 6503} {"train_loss": -27.69923210144043, "global_step": 539781, "epoch": 6503} {"train_loss": -27.790075302124023, "global_step": 539782, "epoch": 6503} {"train_loss": -27.650266647338867, "global_step": 539783, "epoch": 6503} {"train_loss": -27.572555541992188, "global_step": 539784, "epoch": 6503} {"train_loss": -27.575979232788086, "global_step": 539785, "epoch": 6503} {"train_loss": -27.779809951782227, "global_step": 539786, "epoch": 6503} {"train_loss": -27.70063591003418, "global_step": 539787, "epoch": 6503} {"train_loss": -27.76698112487793, "global_step": 539788, "epoch": 6503} {"train_loss": -27.691558837890625, "global_step": 539789, "epoch": 6503} {"train_loss": -27.574844360351562, "global_step": 539790, "epoch": 6503} {"train_loss": -27.661365509033203, "global_step": 539791, "epoch": 6503} {"train_loss": -27.772790908813477, "global_step": 539792, "epoch": 6503} {"train_loss": -27.62399673461914, "global_step": 539793, "epoch": 6503} {"train_loss": -27.54202651977539, "global_step": 539794, "epoch": 6503} {"train_loss": -27.715045928955078, "global_step": 539795, "epoch": 6503} {"train_loss": -27.56442642211914, "global_step": 539796, "epoch": 6503} {"train_loss": -28.051837921142578, "global_step": 539797, "epoch": 6503} {"train_loss": -27.87367820739746, "global_step": 539798, "epoch": 6503} {"train_loss": -27.355478286743164, "global_step": 539799, "epoch": 6503} {"train_loss": -27.507741928100586, "global_step": 539800, "epoch": 6503} {"train_loss": -27.8027400970459, "global_step": 539801, "epoch": 6503} {"train_loss": -28.110641479492188, "global_step": 539802, "epoch": 6503} {"train_loss": -27.555631637573242, "global_step": 539803, "epoch": 6503} {"train_loss": -27.63633155822754, "global_step": 539804, "epoch": 6503} {"train_loss": -27.951623916625977, "global_step": 539805, "epoch": 6503} {"train_loss": -27.907855987548828, "global_step": 539806, "epoch": 6503} {"train_loss": -27.733015060424805, "global_step": 539807, "epoch": 6503} {"train_loss": -27.37064552307129, "global_step": 539808, "epoch": 6503} {"train_loss": -27.415170669555664, "global_step": 539809, "epoch": 6503} {"train_loss": -27.357227325439453, "global_step": 539810, "epoch": 6503} {"train_loss": -27.577051162719727, "global_step": 539811, "epoch": 6503} {"train_loss": -27.902191162109375, "global_step": 539812, "epoch": 6503} {"train_loss": -27.61532974243164, "global_step": 539813, "epoch": 6503} {"train_loss": -27.457611083984375, "global_step": 539814, "epoch": 6503} {"train_loss": -27.3623104095459, "global_step": 539815, "epoch": 6503} {"train_loss": -27.463109970092773, "global_step": 539816, "epoch": 6503} {"train_loss": -27.904972076416016, "global_step": 539817, "epoch": 6503} {"train_loss": -27.62983512878418, "global_step": 539818, "epoch": 6503} {"train_loss": -27.8350772857666, "global_step": 539819, "epoch": 6503} {"train_loss": -27.607025146484375, "global_step": 539820, "epoch": 6503} {"train_loss": -27.708066940307617, "global_step": 539821, "epoch": 6503} {"train_loss": -27.605594635009766, "global_step": 539822, "epoch": 6503} {"train_loss": -27.514759063720703, "global_step": 539823, "epoch": 6503} {"train_loss": -27.427160263061523, "global_step": 539824, "epoch": 6503} {"train_loss": -27.018508911132812, "global_step": 539825, "epoch": 6503} {"train_loss": -27.188520431518555, "global_step": 539826, "epoch": 6503} {"train_loss": -27.299182891845703, "global_step": 539827, "epoch": 6503} {"train_loss": -27.223913192749023, "global_step": 539828, "epoch": 6503} {"train_loss": -27.431814193725586, "global_step": 539829, "epoch": 6503} {"train_loss": -27.823902130126953, "global_step": 539830, "epoch": 6503} {"train_loss": -27.431765705706127, "global_step": 539831, "epoch": 6503, "val_loss": 6457414.0} {"train_loss": -26.88262939453125, "global_step": 539832, "epoch": 6504} {"train_loss": -27.036758422851562, "global_step": 539833, "epoch": 6504} {"train_loss": -27.1085147857666, "global_step": 539834, "epoch": 6504} {"train_loss": -27.2416934967041, "global_step": 539835, "epoch": 6504} {"train_loss": -26.784223556518555, "global_step": 539836, "epoch": 6504} {"train_loss": -27.35834312438965, "global_step": 539837, "epoch": 6504} {"train_loss": -27.02225685119629, "global_step": 539838, "epoch": 6504} {"train_loss": -27.115249633789062, "global_step": 539839, "epoch": 6504} {"train_loss": -27.686182022094727, "global_step": 539840, "epoch": 6504} {"train_loss": -26.918201446533203, "global_step": 539841, "epoch": 6504} {"train_loss": -27.25050163269043, "global_step": 539842, "epoch": 6504} {"train_loss": -27.224822998046875, "global_step": 539843, "epoch": 6504} {"train_loss": -27.531387329101562, "global_step": 539844, "epoch": 6504} {"train_loss": -27.494964599609375, "global_step": 539845, "epoch": 6504} {"train_loss": -27.741147994995117, "global_step": 539846, "epoch": 6504} {"train_loss": -27.661121368408203, "global_step": 539847, "epoch": 6504} {"train_loss": -27.71259880065918, "global_step": 539848, "epoch": 6504} {"train_loss": -27.916412353515625, "global_step": 539849, "epoch": 6504} {"train_loss": -27.77304458618164, "global_step": 539850, "epoch": 6504} {"train_loss": -27.393232345581055, "global_step": 539851, "epoch": 6504} {"train_loss": -27.30914878845215, "global_step": 539852, "epoch": 6504} {"train_loss": -27.81304359436035, "global_step": 539853, "epoch": 6504} {"train_loss": -27.357437133789062, "global_step": 539854, "epoch": 6504} {"train_loss": -27.46877098083496, "global_step": 539855, "epoch": 6504} {"train_loss": -27.493940353393555, "global_step": 539856, "epoch": 6504} {"train_loss": -27.493154525756836, "global_step": 539857, "epoch": 6504} {"train_loss": -27.60334587097168, "global_step": 539858, "epoch": 6504} {"train_loss": -28.046167373657227, "global_step": 539859, "epoch": 6504} {"train_loss": -27.907913208007812, "global_step": 539860, "epoch": 6504} {"train_loss": -27.7550106048584, "global_step": 539861, "epoch": 6504} {"train_loss": -27.844587326049805, "global_step": 539862, "epoch": 6504} {"train_loss": -27.729089736938477, "global_step": 539863, "epoch": 6504} {"train_loss": -27.574909210205078, "global_step": 539864, "epoch": 6504} {"train_loss": -27.854267120361328, "global_step": 539865, "epoch": 6504} {"train_loss": -27.73408317565918, "global_step": 539866, "epoch": 6504} {"train_loss": -27.37005615234375, "global_step": 539867, "epoch": 6504} {"train_loss": -28.041120529174805, "global_step": 539868, "epoch": 6504} {"train_loss": -27.822690963745117, "global_step": 539869, "epoch": 6504} {"train_loss": -27.5490779876709, "global_step": 539870, "epoch": 6504} {"train_loss": -27.859222412109375, "global_step": 539871, "epoch": 6504} {"train_loss": -27.817291259765625, "global_step": 539872, "epoch": 6504} {"train_loss": -27.615142822265625, "global_step": 539873, "epoch": 6504} {"train_loss": -27.970123291015625, "global_step": 539874, "epoch": 6504} {"train_loss": -27.878087997436523, "global_step": 539875, "epoch": 6504} {"train_loss": -27.97256851196289, "global_step": 539876, "epoch": 6504} {"train_loss": -27.541147232055664, "global_step": 539877, "epoch": 6504} {"train_loss": -28.084043502807617, "global_step": 539878, "epoch": 6504} {"train_loss": -27.77117347717285, "global_step": 539879, "epoch": 6504} {"train_loss": -27.682886123657227, "global_step": 539880, "epoch": 6504} {"train_loss": -27.240182876586914, "global_step": 539881, "epoch": 6504} {"train_loss": -27.460805892944336, "global_step": 539882, "epoch": 6504} {"train_loss": -27.6413516998291, "global_step": 539883, "epoch": 6504} {"train_loss": -27.609909057617188, "global_step": 539884, "epoch": 6504} {"train_loss": -27.392242431640625, "global_step": 539885, "epoch": 6504} {"train_loss": -27.551074981689453, "global_step": 539886, "epoch": 6504} {"train_loss": -27.2836856842041, "global_step": 539887, "epoch": 6504} {"train_loss": -27.02264404296875, "global_step": 539888, "epoch": 6504} {"train_loss": -26.106348037719727, "global_step": 539889, "epoch": 6504} {"train_loss": -27.292041778564453, "global_step": 539890, "epoch": 6504} {"train_loss": -27.74370765686035, "global_step": 539891, "epoch": 6504} {"train_loss": -27.193395614624023, "global_step": 539892, "epoch": 6504} {"train_loss": -27.28346824645996, "global_step": 539893, "epoch": 6504} {"train_loss": -27.53076171875, "global_step": 539894, "epoch": 6504} {"train_loss": -27.457223892211914, "global_step": 539895, "epoch": 6504} {"train_loss": -27.513168334960938, "global_step": 539896, "epoch": 6504} {"train_loss": -27.440185546875, "global_step": 539897, "epoch": 6504} {"train_loss": -27.46969985961914, "global_step": 539898, "epoch": 6504} {"train_loss": -27.41607666015625, "global_step": 539899, "epoch": 6504} {"train_loss": -28.01479148864746, "global_step": 539900, "epoch": 6504} {"train_loss": -27.653722763061523, "global_step": 539901, "epoch": 6504} {"train_loss": -27.63655662536621, "global_step": 539902, "epoch": 6504} {"train_loss": -27.976598739624023, "global_step": 539903, "epoch": 6504} {"train_loss": -27.72047233581543, "global_step": 539904, "epoch": 6504} {"train_loss": -27.625722885131836, "global_step": 539905, "epoch": 6504} {"train_loss": -27.566125869750977, "global_step": 539906, "epoch": 6504} {"train_loss": -27.727880477905273, "global_step": 539907, "epoch": 6504} {"train_loss": -27.62342643737793, "global_step": 539908, "epoch": 6504} {"train_loss": -27.758102416992188, "global_step": 539909, "epoch": 6504} {"train_loss": -27.947004318237305, "global_step": 539910, "epoch": 6504} {"train_loss": -27.321359634399414, "global_step": 539911, "epoch": 6504} {"train_loss": -27.550439834594727, "global_step": 539912, "epoch": 6504} {"train_loss": -27.614501953125, "global_step": 539913, "epoch": 6504} {"train_loss": -27.558583500873613, "global_step": 539914, "epoch": 6504, "val_loss": 6435412.0} {"train_loss": -27.02679443359375, "global_step": 539915, "epoch": 6505} {"train_loss": -27.052724838256836, "global_step": 539916, "epoch": 6505} {"train_loss": -27.054685592651367, "global_step": 539917, "epoch": 6505} {"train_loss": -27.372900009155273, "global_step": 539918, "epoch": 6505} {"train_loss": -27.59724998474121, "global_step": 539919, "epoch": 6505} {"train_loss": -27.456974029541016, "global_step": 539920, "epoch": 6505} {"train_loss": -27.06255531311035, "global_step": 539921, "epoch": 6505} {"train_loss": -27.629150390625, "global_step": 539922, "epoch": 6505} {"train_loss": -27.46695327758789, "global_step": 539923, "epoch": 6505} {"train_loss": -27.527753829956055, "global_step": 539924, "epoch": 6505} {"train_loss": -27.403064727783203, "global_step": 539925, "epoch": 6505} {"train_loss": -27.275604248046875, "global_step": 539926, "epoch": 6505} {"train_loss": -27.34079933166504, "global_step": 539927, "epoch": 6505} {"train_loss": -27.814044952392578, "global_step": 539928, "epoch": 6505} {"train_loss": -27.473388671875, "global_step": 539929, "epoch": 6505} {"train_loss": -27.51615333557129, "global_step": 539930, "epoch": 6505} {"train_loss": -27.77268409729004, "global_step": 539931, "epoch": 6505} {"train_loss": -27.920225143432617, "global_step": 539932, "epoch": 6505} {"train_loss": -27.458887100219727, "global_step": 539933, "epoch": 6505} {"train_loss": -27.248260498046875, "global_step": 539934, "epoch": 6505} {"train_loss": -27.928892135620117, "global_step": 539935, "epoch": 6505} {"train_loss": -27.598697662353516, "global_step": 539936, "epoch": 6505} {"train_loss": -27.679346084594727, "global_step": 539937, "epoch": 6505} {"train_loss": -27.7489013671875, "global_step": 539938, "epoch": 6505} {"train_loss": -28.096546173095703, "global_step": 539939, "epoch": 6505} {"train_loss": -27.813114166259766, "global_step": 539940, "epoch": 6505} {"train_loss": -27.615070343017578, "global_step": 539941, "epoch": 6505} {"train_loss": -27.26068115234375, "global_step": 539942, "epoch": 6505} {"train_loss": -28.18939208984375, "global_step": 539943, "epoch": 6505} {"train_loss": -27.689802169799805, "global_step": 539944, "epoch": 6505} {"train_loss": -27.513111114501953, "global_step": 539945, "epoch": 6505} {"train_loss": -27.528417587280273, "global_step": 539946, "epoch": 6505} {"train_loss": -27.33296012878418, "global_step": 539947, "epoch": 6505} {"train_loss": -27.864526748657227, "global_step": 539948, "epoch": 6505} {"train_loss": -27.80923843383789, "global_step": 539949, "epoch": 6505} {"train_loss": -27.444467544555664, "global_step": 539950, "epoch": 6505} {"train_loss": -27.7982120513916, "global_step": 539951, "epoch": 6505} {"train_loss": -28.19471549987793, "global_step": 539952, "epoch": 6505} {"train_loss": -27.885156631469727, "global_step": 539953, "epoch": 6505} {"train_loss": -27.650104522705078, "global_step": 539954, "epoch": 6505} {"train_loss": -27.42066764831543, "global_step": 539955, "epoch": 6505} {"train_loss": -27.79029655456543, "global_step": 539956, "epoch": 6505} {"train_loss": -27.89151382446289, "global_step": 539957, "epoch": 6505} {"train_loss": -27.573354721069336, "global_step": 539958, "epoch": 6505} {"train_loss": -27.605697631835938, "global_step": 539959, "epoch": 6505} {"train_loss": -26.7702693939209, "global_step": 539960, "epoch": 6505} {"train_loss": -25.99773597717285, "global_step": 539961, "epoch": 6505} {"train_loss": -27.217208862304688, "global_step": 539962, "epoch": 6505} {"train_loss": -27.6126651763916, "global_step": 539963, "epoch": 6505} {"train_loss": -27.037389755249023, "global_step": 539964, "epoch": 6505} {"train_loss": -27.08831214904785, "global_step": 539965, "epoch": 6505} {"train_loss": -28.0080509185791, "global_step": 539966, "epoch": 6505} {"train_loss": -27.52825355529785, "global_step": 539967, "epoch": 6505} {"train_loss": -27.707883834838867, "global_step": 539968, "epoch": 6505} {"train_loss": -27.544580459594727, "global_step": 539969, "epoch": 6505} {"train_loss": -27.419025421142578, "global_step": 539970, "epoch": 6505} {"train_loss": -27.5886287689209, "global_step": 539971, "epoch": 6505} {"train_loss": -27.481637954711914, "global_step": 539972, "epoch": 6505} {"train_loss": -27.471805572509766, "global_step": 539973, "epoch": 6505} {"train_loss": -27.69191551208496, "global_step": 539974, "epoch": 6505} {"train_loss": -27.711130142211914, "global_step": 539975, "epoch": 6505} {"train_loss": -27.670682907104492, "global_step": 539976, "epoch": 6505} {"train_loss": -27.70087242126465, "global_step": 539977, "epoch": 6505} {"train_loss": -27.945011138916016, "global_step": 539978, "epoch": 6505} {"train_loss": -27.304845809936523, "global_step": 539979, "epoch": 6505} {"train_loss": -27.68964195251465, "global_step": 539980, "epoch": 6505} {"train_loss": -28.010074615478516, "global_step": 539981, "epoch": 6505} {"train_loss": -27.767072677612305, "global_step": 539982, "epoch": 6505} {"train_loss": -28.03253746032715, "global_step": 539983, "epoch": 6505} {"train_loss": -27.70316505432129, "global_step": 539984, "epoch": 6505} {"train_loss": -27.634008407592773, "global_step": 539985, "epoch": 6505} {"train_loss": -27.4622859954834, "global_step": 539986, "epoch": 6505} {"train_loss": -27.195104598999023, "global_step": 539987, "epoch": 6505} {"train_loss": -27.51494789123535, "global_step": 539988, "epoch": 6505} {"train_loss": -27.453338623046875, "global_step": 539989, "epoch": 6505} {"train_loss": -27.563125610351562, "global_step": 539990, "epoch": 6505} {"train_loss": -27.894210815429688, "global_step": 539991, "epoch": 6505} {"train_loss": -27.40164566040039, "global_step": 539992, "epoch": 6505} {"train_loss": -27.468774795532227, "global_step": 539993, "epoch": 6505} {"train_loss": -27.764759063720703, "global_step": 539994, "epoch": 6505} {"train_loss": -27.99249839782715, "global_step": 539995, "epoch": 6505} {"train_loss": -27.394861221313477, "global_step": 539996, "epoch": 6505} {"train_loss": -27.558604619589197, "global_step": 539997, "epoch": 6505, "val_loss": 6494003.5} {"train_loss": -26.97028160095215, "global_step": 539998, "epoch": 6506} {"train_loss": -26.212072372436523, "global_step": 539999, "epoch": 6506} {"train_loss": -26.80783462524414, "global_step": 540000, "epoch": 6506} {"train_loss": -26.814847946166992, "global_step": 540001, "epoch": 6506} {"train_loss": -27.445215225219727, "global_step": 540002, "epoch": 6506} {"train_loss": -26.03763198852539, "global_step": 540003, "epoch": 6506} {"train_loss": -26.84783363342285, "global_step": 540004, "epoch": 6506} {"train_loss": -27.08636474609375, "global_step": 540005, "epoch": 6506} {"train_loss": -26.835895538330078, "global_step": 540006, "epoch": 6506} {"train_loss": -27.04096794128418, "global_step": 540007, "epoch": 6506} {"train_loss": -27.13715171813965, "global_step": 540008, "epoch": 6506} {"train_loss": -27.07928466796875, "global_step": 540009, "epoch": 6506} {"train_loss": -27.092700958251953, "global_step": 540010, "epoch": 6506} {"train_loss": -27.06503677368164, "global_step": 540011, "epoch": 6506} {"train_loss": -27.275760650634766, "global_step": 540012, "epoch": 6506} {"train_loss": -27.4290714263916, "global_step": 540013, "epoch": 6506} {"train_loss": -27.530075073242188, "global_step": 540014, "epoch": 6506} {"train_loss": -27.118427276611328, "global_step": 540015, "epoch": 6506} {"train_loss": -27.489736557006836, "global_step": 540016, "epoch": 6506} {"train_loss": -27.02718162536621, "global_step": 540017, "epoch": 6506} {"train_loss": -27.438953399658203, "global_step": 540018, "epoch": 6506} {"train_loss": -27.6688175201416, "global_step": 540019, "epoch": 6506} {"train_loss": -27.721548080444336, "global_step": 540020, "epoch": 6506} {"train_loss": -27.536483764648438, "global_step": 540021, "epoch": 6506} {"train_loss": -27.46034812927246, "global_step": 540022, "epoch": 6506} {"train_loss": -27.46712303161621, "global_step": 540023, "epoch": 6506} {"train_loss": -27.66226577758789, "global_step": 540024, "epoch": 6506} {"train_loss": -27.84699058532715, "global_step": 540025, "epoch": 6506} {"train_loss": -28.026386260986328, "global_step": 540026, "epoch": 6506} {"train_loss": -28.066564559936523, "global_step": 540027, "epoch": 6506} {"train_loss": -27.419025421142578, "global_step": 540028, "epoch": 6506} {"train_loss": -27.3052921295166, "global_step": 540029, "epoch": 6506} {"train_loss": -27.308988571166992, "global_step": 540030, "epoch": 6506} {"train_loss": -27.80197525024414, "global_step": 540031, "epoch": 6506} {"train_loss": -27.778600692749023, "global_step": 540032, "epoch": 6506} {"train_loss": -27.589508056640625, "global_step": 540033, "epoch": 6506} {"train_loss": -27.121267318725586, "global_step": 540034, "epoch": 6506} {"train_loss": -27.696521759033203, "global_step": 540035, "epoch": 6506} {"train_loss": -27.520587921142578, "global_step": 540036, "epoch": 6506} {"train_loss": -27.36921501159668, "global_step": 540037, "epoch": 6506} {"train_loss": -27.633163452148438, "global_step": 540038, "epoch": 6506} {"train_loss": -27.917938232421875, "global_step": 540039, "epoch": 6506} {"train_loss": -27.531103134155273, "global_step": 540040, "epoch": 6506} {"train_loss": -27.903966903686523, "global_step": 540041, "epoch": 6506} {"train_loss": -27.978864669799805, "global_step": 540042, "epoch": 6506} {"train_loss": -27.661603927612305, "global_step": 540043, "epoch": 6506} {"train_loss": -27.6850643157959, "global_step": 540044, "epoch": 6506} {"train_loss": -27.92206382751465, "global_step": 540045, "epoch": 6506} {"train_loss": -28.145605087280273, "global_step": 540046, "epoch": 6506} {"train_loss": -27.440460205078125, "global_step": 540047, "epoch": 6506} {"train_loss": -27.70119285583496, "global_step": 540048, "epoch": 6506} {"train_loss": -27.49372673034668, "global_step": 540049, "epoch": 6506} {"train_loss": -27.63153648376465, "global_step": 540050, "epoch": 6506} {"train_loss": -27.8472900390625, "global_step": 540051, "epoch": 6506} {"train_loss": -27.678049087524414, "global_step": 540052, "epoch": 6506} {"train_loss": -27.8024959564209, "global_step": 540053, "epoch": 6506} {"train_loss": -27.251047134399414, "global_step": 540054, "epoch": 6506} {"train_loss": -27.528919219970703, "global_step": 540055, "epoch": 6506} {"train_loss": -27.636402130126953, "global_step": 540056, "epoch": 6506} {"train_loss": -27.800718307495117, "global_step": 540057, "epoch": 6506} {"train_loss": -27.321823120117188, "global_step": 540058, "epoch": 6506} {"train_loss": -27.575672149658203, "global_step": 540059, "epoch": 6506} {"train_loss": -27.37885856628418, "global_step": 540060, "epoch": 6506} {"train_loss": -27.923574447631836, "global_step": 540061, "epoch": 6506} {"train_loss": -27.495594024658203, "global_step": 540062, "epoch": 6506} {"train_loss": -27.46305274963379, "global_step": 540063, "epoch": 6506} {"train_loss": -27.430593490600586, "global_step": 540064, "epoch": 6506} {"train_loss": -27.751953125, "global_step": 540065, "epoch": 6506} {"train_loss": -27.388952255249023, "global_step": 540066, "epoch": 6506} {"train_loss": -27.555438995361328, "global_step": 540067, "epoch": 6506} {"train_loss": -27.775726318359375, "global_step": 540068, "epoch": 6506} {"train_loss": -28.11958885192871, "global_step": 540069, "epoch": 6506} {"train_loss": -27.668798446655273, "global_step": 540070, "epoch": 6506} {"train_loss": -27.632705688476562, "global_step": 540071, "epoch": 6506} {"train_loss": -27.562646865844727, "global_step": 540072, "epoch": 6506} {"train_loss": -27.935626983642578, "global_step": 540073, "epoch": 6506} {"train_loss": -27.333871841430664, "global_step": 540074, "epoch": 6506} {"train_loss": -27.677473068237305, "global_step": 540075, "epoch": 6506} {"train_loss": -27.609210968017578, "global_step": 540076, "epoch": 6506} {"train_loss": -27.552753448486328, "global_step": 540077, "epoch": 6506} {"train_loss": -27.776416778564453, "global_step": 540078, "epoch": 6506} {"train_loss": -27.943099975585938, "global_step": 540079, "epoch": 6506} {"train_loss": -27.50544313637607, "global_step": 540080, "epoch": 6506, "val_loss": 6453679.0} {"train_loss": -26.805334091186523, "global_step": 540081, "epoch": 6507} {"train_loss": -26.615095138549805, "global_step": 540082, "epoch": 6507} {"train_loss": -27.005268096923828, "global_step": 540083, "epoch": 6507} {"train_loss": -26.89759635925293, "global_step": 540084, "epoch": 6507} {"train_loss": -27.364063262939453, "global_step": 540085, "epoch": 6507} {"train_loss": -26.779626846313477, "global_step": 540086, "epoch": 6507} {"train_loss": -26.879621505737305, "global_step": 540087, "epoch": 6507} {"train_loss": -27.098037719726562, "global_step": 540088, "epoch": 6507} {"train_loss": -26.9771671295166, "global_step": 540089, "epoch": 6507} {"train_loss": -27.1693115234375, "global_step": 540090, "epoch": 6507} {"train_loss": -27.440900802612305, "global_step": 540091, "epoch": 6507} {"train_loss": -27.056201934814453, "global_step": 540092, "epoch": 6507} {"train_loss": -27.263565063476562, "global_step": 540093, "epoch": 6507} {"train_loss": -27.556798934936523, "global_step": 540094, "epoch": 6507} {"train_loss": -27.477859497070312, "global_step": 540095, "epoch": 6507} {"train_loss": -27.695240020751953, "global_step": 540096, "epoch": 6507} {"train_loss": -27.342710494995117, "global_step": 540097, "epoch": 6507} {"train_loss": -27.17070960998535, "global_step": 540098, "epoch": 6507} {"train_loss": -27.672321319580078, "global_step": 540099, "epoch": 6507} {"train_loss": -27.24784278869629, "global_step": 540100, "epoch": 6507} {"train_loss": -27.4942569732666, "global_step": 540101, "epoch": 6507} {"train_loss": -27.493331909179688, "global_step": 540102, "epoch": 6507} {"train_loss": -27.72174072265625, "global_step": 540103, "epoch": 6507} {"train_loss": -27.846561431884766, "global_step": 540104, "epoch": 6507} {"train_loss": -27.627002716064453, "global_step": 540105, "epoch": 6507} {"train_loss": -27.75636100769043, "global_step": 540106, "epoch": 6507} {"train_loss": -27.683637619018555, "global_step": 540107, "epoch": 6507} {"train_loss": -27.623395919799805, "global_step": 540108, "epoch": 6507} {"train_loss": -27.729719161987305, "global_step": 540109, "epoch": 6507} {"train_loss": -28.09027671813965, "global_step": 540110, "epoch": 6507} {"train_loss": -27.701629638671875, "global_step": 540111, "epoch": 6507} {"train_loss": -27.695301055908203, "global_step": 540112, "epoch": 6507} {"train_loss": -27.768957138061523, "global_step": 540113, "epoch": 6507} {"train_loss": -27.750574111938477, "global_step": 540114, "epoch": 6507} {"train_loss": -27.7409725189209, "global_step": 540115, "epoch": 6507} {"train_loss": -27.810962677001953, "global_step": 540116, "epoch": 6507} {"train_loss": -27.642459869384766, "global_step": 540117, "epoch": 6507} {"train_loss": -28.02033042907715, "global_step": 540118, "epoch": 6507} {"train_loss": -27.589130401611328, "global_step": 540119, "epoch": 6507} {"train_loss": -28.04078483581543, "global_step": 540120, "epoch": 6507} {"train_loss": -27.81009292602539, "global_step": 540121, "epoch": 6507} {"train_loss": -28.050275802612305, "global_step": 540122, "epoch": 6507} {"train_loss": -28.182645797729492, "global_step": 540123, "epoch": 6507} {"train_loss": -27.83076286315918, "global_step": 540124, "epoch": 6507} {"train_loss": -27.57093620300293, "global_step": 540125, "epoch": 6507} {"train_loss": -27.74187660217285, "global_step": 540126, "epoch": 6507} {"train_loss": -27.8790225982666, "global_step": 540127, "epoch": 6507} {"train_loss": -27.83197593688965, "global_step": 540128, "epoch": 6507} {"train_loss": -27.58432388305664, "global_step": 540129, "epoch": 6507} {"train_loss": -27.76597023010254, "global_step": 540130, "epoch": 6507} {"train_loss": -27.613996505737305, "global_step": 540131, "epoch": 6507} {"train_loss": -27.77410888671875, "global_step": 540132, "epoch": 6507} {"train_loss": -27.65182876586914, "global_step": 540133, "epoch": 6507} {"train_loss": -27.597936630249023, "global_step": 540134, "epoch": 6507} {"train_loss": -27.8875732421875, "global_step": 540135, "epoch": 6507} {"train_loss": -27.609296798706055, "global_step": 540136, "epoch": 6507} {"train_loss": -27.723373413085938, "global_step": 540137, "epoch": 6507} {"train_loss": -27.251447677612305, "global_step": 540138, "epoch": 6507} {"train_loss": -27.55537223815918, "global_step": 540139, "epoch": 6507} {"train_loss": -27.28363037109375, "global_step": 540140, "epoch": 6507} {"train_loss": -27.310104370117188, "global_step": 540141, "epoch": 6507} {"train_loss": -27.71976661682129, "global_step": 540142, "epoch": 6507} {"train_loss": -27.81683921813965, "global_step": 540143, "epoch": 6507} {"train_loss": -27.48712158203125, "global_step": 540144, "epoch": 6507} {"train_loss": -27.38361167907715, "global_step": 540145, "epoch": 6507} {"train_loss": -27.78948974609375, "global_step": 540146, "epoch": 6507} {"train_loss": -27.715152740478516, "global_step": 540147, "epoch": 6507} {"train_loss": -27.68891716003418, "global_step": 540148, "epoch": 6507} {"train_loss": -27.885406494140625, "global_step": 540149, "epoch": 6507} {"train_loss": -27.727697372436523, "global_step": 540150, "epoch": 6507} {"train_loss": -27.740528106689453, "global_step": 540151, "epoch": 6507} {"train_loss": -27.753957748413086, "global_step": 540152, "epoch": 6507} {"train_loss": -27.95956802368164, "global_step": 540153, "epoch": 6507} {"train_loss": -27.64203453063965, "global_step": 540154, "epoch": 6507} {"train_loss": -27.46416664123535, "global_step": 540155, "epoch": 6507} {"train_loss": -27.575550079345703, "global_step": 540156, "epoch": 6507} {"train_loss": -27.58636474609375, "global_step": 540157, "epoch": 6507} {"train_loss": -27.5047664642334, "global_step": 540158, "epoch": 6507} {"train_loss": -27.555761337280273, "global_step": 540159, "epoch": 6507} {"train_loss": -28.1395320892334, "global_step": 540160, "epoch": 6507} {"train_loss": -27.9086856842041, "global_step": 540161, "epoch": 6507} {"train_loss": -27.81377601623535, "global_step": 540162, "epoch": 6507} {"train_loss": -27.58418788680111, "global_step": 540163, "epoch": 6507, "val_loss": 6466102.0} {"train_loss": -27.280710220336914, "global_step": 540164, "epoch": 6508} {"train_loss": -27.1398983001709, "global_step": 540165, "epoch": 6508} {"train_loss": -27.560449600219727, "global_step": 540166, "epoch": 6508} {"train_loss": -27.372974395751953, "global_step": 540167, "epoch": 6508} {"train_loss": -27.228342056274414, "global_step": 540168, "epoch": 6508} {"train_loss": -27.612348556518555, "global_step": 540169, "epoch": 6508} {"train_loss": -27.418109893798828, "global_step": 540170, "epoch": 6508} {"train_loss": -27.689992904663086, "global_step": 540171, "epoch": 6508} {"train_loss": -27.400333404541016, "global_step": 540172, "epoch": 6508} {"train_loss": -27.516845703125, "global_step": 540173, "epoch": 6508} {"train_loss": -27.45551872253418, "global_step": 540174, "epoch": 6508} {"train_loss": -27.399595260620117, "global_step": 540175, "epoch": 6508} {"train_loss": -27.121337890625, "global_step": 540176, "epoch": 6508} {"train_loss": -27.55045509338379, "global_step": 540177, "epoch": 6508} {"train_loss": -27.76325035095215, "global_step": 540178, "epoch": 6508} {"train_loss": -27.71150016784668, "global_step": 540179, "epoch": 6508} {"train_loss": -27.403167724609375, "global_step": 540180, "epoch": 6508} {"train_loss": -27.766027450561523, "global_step": 540181, "epoch": 6508} {"train_loss": -27.741540908813477, "global_step": 540182, "epoch": 6508} {"train_loss": -27.7921085357666, "global_step": 540183, "epoch": 6508} {"train_loss": -27.781326293945312, "global_step": 540184, "epoch": 6508} {"train_loss": -27.777490615844727, "global_step": 540185, "epoch": 6508} {"train_loss": -27.80527114868164, "global_step": 540186, "epoch": 6508} {"train_loss": -27.652801513671875, "global_step": 540187, "epoch": 6508} {"train_loss": -27.794065475463867, "global_step": 540188, "epoch": 6508} {"train_loss": -27.79835319519043, "global_step": 540189, "epoch": 6508} {"train_loss": -28.149982452392578, "global_step": 540190, "epoch": 6508} {"train_loss": -27.583831787109375, "global_step": 540191, "epoch": 6508} {"train_loss": -28.060163497924805, "global_step": 540192, "epoch": 6508} {"train_loss": -27.584951400756836, "global_step": 540193, "epoch": 6508} {"train_loss": -27.899255752563477, "global_step": 540194, "epoch": 6508} {"train_loss": -28.02949333190918, "global_step": 540195, "epoch": 6508} {"train_loss": -28.036962509155273, "global_step": 540196, "epoch": 6508} {"train_loss": -27.85491943359375, "global_step": 540197, "epoch": 6508} {"train_loss": -28.06612205505371, "global_step": 540198, "epoch": 6508} {"train_loss": -27.533802032470703, "global_step": 540199, "epoch": 6508} {"train_loss": -27.32657814025879, "global_step": 540200, "epoch": 6508} {"train_loss": -27.458566665649414, "global_step": 540201, "epoch": 6508} {"train_loss": -27.674474716186523, "global_step": 540202, "epoch": 6508} {"train_loss": -27.472492218017578, "global_step": 540203, "epoch": 6508} {"train_loss": -27.781875610351562, "global_step": 540204, "epoch": 6508} {"train_loss": -27.698745727539062, "global_step": 540205, "epoch": 6508} {"train_loss": -27.34663200378418, "global_step": 540206, "epoch": 6508} {"train_loss": -27.79424476623535, "global_step": 540207, "epoch": 6508} {"train_loss": -27.942249298095703, "global_step": 540208, "epoch": 6508} {"train_loss": -27.43904685974121, "global_step": 540209, "epoch": 6508} {"train_loss": -27.34358024597168, "global_step": 540210, "epoch": 6508} {"train_loss": -28.120792388916016, "global_step": 540211, "epoch": 6508} {"train_loss": -27.51093864440918, "global_step": 540212, "epoch": 6508} {"train_loss": -27.622190475463867, "global_step": 540213, "epoch": 6508} {"train_loss": -27.375396728515625, "global_step": 540214, "epoch": 6508} {"train_loss": -27.603961944580078, "global_step": 540215, "epoch": 6508} {"train_loss": -27.7608699798584, "global_step": 540216, "epoch": 6508} {"train_loss": -27.7880916595459, "global_step": 540217, "epoch": 6508} {"train_loss": -27.665735244750977, "global_step": 540218, "epoch": 6508} {"train_loss": -27.377685546875, "global_step": 540219, "epoch": 6508} {"train_loss": -27.694412231445312, "global_step": 540220, "epoch": 6508} {"train_loss": -27.10589599609375, "global_step": 540221, "epoch": 6508} {"train_loss": -27.557973861694336, "global_step": 540222, "epoch": 6508} {"train_loss": -27.127836227416992, "global_step": 540223, "epoch": 6508} {"train_loss": -27.924604415893555, "global_step": 540224, "epoch": 6508} {"train_loss": -27.569921493530273, "global_step": 540225, "epoch": 6508} {"train_loss": -27.582433700561523, "global_step": 540226, "epoch": 6508} {"train_loss": -27.348712921142578, "global_step": 540227, "epoch": 6508} {"train_loss": -27.695606231689453, "global_step": 540228, "epoch": 6508} {"train_loss": -27.88606071472168, "global_step": 540229, "epoch": 6508} {"train_loss": -27.376117706298828, "global_step": 540230, "epoch": 6508} {"train_loss": -27.700220108032227, "global_step": 540231, "epoch": 6508} {"train_loss": -27.675573348999023, "global_step": 540232, "epoch": 6508} {"train_loss": -27.58564567565918, "global_step": 540233, "epoch": 6508} {"train_loss": -27.88514518737793, "global_step": 540234, "epoch": 6508} {"train_loss": -27.562000274658203, "global_step": 540235, "epoch": 6508} {"train_loss": -27.551406860351562, "global_step": 540236, "epoch": 6508} {"train_loss": -27.475555419921875, "global_step": 540237, "epoch": 6508} {"train_loss": -28.04680824279785, "global_step": 540238, "epoch": 6508} {"train_loss": -27.72393226623535, "global_step": 540239, "epoch": 6508} {"train_loss": -27.92142677307129, "global_step": 540240, "epoch": 6508} {"train_loss": -27.839996337890625, "global_step": 540241, "epoch": 6508} {"train_loss": -28.090625762939453, "global_step": 540242, "epoch": 6508} {"train_loss": -27.76966667175293, "global_step": 540243, "epoch": 6508} {"train_loss": -27.562833786010742, "global_step": 540244, "epoch": 6508} {"train_loss": -27.49517822265625, "global_step": 540245, "epoch": 6508} {"train_loss": -27.632525731282062, "global_step": 540246, "epoch": 6508, "val_loss": 6521990.5} {"train_loss": -26.792394638061523, "global_step": 540247, "epoch": 6509} {"train_loss": -25.254913330078125, "global_step": 540248, "epoch": 6509} {"train_loss": -23.827688217163086, "global_step": 540249, "epoch": 6509} {"train_loss": -26.577375411987305, "global_step": 540250, "epoch": 6509} {"train_loss": -27.28211784362793, "global_step": 540251, "epoch": 6509} {"train_loss": -26.64510154724121, "global_step": 540252, "epoch": 6509} {"train_loss": -27.098230361938477, "global_step": 540253, "epoch": 6509} {"train_loss": -26.862951278686523, "global_step": 540254, "epoch": 6509} {"train_loss": -27.065692901611328, "global_step": 540255, "epoch": 6509} {"train_loss": -27.31781578063965, "global_step": 540256, "epoch": 6509} {"train_loss": -27.477161407470703, "global_step": 540257, "epoch": 6509} {"train_loss": -27.28702735900879, "global_step": 540258, "epoch": 6509} {"train_loss": -27.092493057250977, "global_step": 540259, "epoch": 6509} {"train_loss": -27.550567626953125, "global_step": 540260, "epoch": 6509} {"train_loss": -27.414960861206055, "global_step": 540261, "epoch": 6509} {"train_loss": -27.091482162475586, "global_step": 540262, "epoch": 6509} {"train_loss": -27.28382682800293, "global_step": 540263, "epoch": 6509} {"train_loss": -27.270496368408203, "global_step": 540264, "epoch": 6509} {"train_loss": -27.528791427612305, "global_step": 540265, "epoch": 6509} {"train_loss": -27.70474624633789, "global_step": 540266, "epoch": 6509} {"train_loss": -27.780447006225586, "global_step": 540267, "epoch": 6509} {"train_loss": -27.5642032623291, "global_step": 540268, "epoch": 6509} {"train_loss": -27.825231552124023, "global_step": 540269, "epoch": 6509} {"train_loss": -27.409093856811523, "global_step": 540270, "epoch": 6509} {"train_loss": -27.46864891052246, "global_step": 540271, "epoch": 6509} {"train_loss": -27.53919792175293, "global_step": 540272, "epoch": 6509} {"train_loss": -27.51666831970215, "global_step": 540273, "epoch": 6509} {"train_loss": -27.7231388092041, "global_step": 540274, "epoch": 6509} {"train_loss": -27.48794937133789, "global_step": 540275, "epoch": 6509} {"train_loss": -27.23786735534668, "global_step": 540276, "epoch": 6509} {"train_loss": -27.65095329284668, "global_step": 540277, "epoch": 6509} {"train_loss": -27.42217445373535, "global_step": 540278, "epoch": 6509} {"train_loss": -27.682117462158203, "global_step": 540279, "epoch": 6509} {"train_loss": -27.621618270874023, "global_step": 540280, "epoch": 6509} {"train_loss": -27.753849029541016, "global_step": 540281, "epoch": 6509} {"train_loss": -27.60542869567871, "global_step": 540282, "epoch": 6509} {"train_loss": -27.472900390625, "global_step": 540283, "epoch": 6509} {"train_loss": -27.876813888549805, "global_step": 540284, "epoch": 6509} {"train_loss": -27.9771671295166, "global_step": 540285, "epoch": 6509} {"train_loss": -27.64473533630371, "global_step": 540286, "epoch": 6509} {"train_loss": -27.37933349609375, "global_step": 540287, "epoch": 6509} {"train_loss": -26.645776748657227, "global_step": 540288, "epoch": 6509} {"train_loss": -27.020404815673828, "global_step": 540289, "epoch": 6509} {"train_loss": -27.33246421813965, "global_step": 540290, "epoch": 6509} {"train_loss": -26.243032455444336, "global_step": 540291, "epoch": 6509} {"train_loss": -27.26813316345215, "global_step": 540292, "epoch": 6509} {"train_loss": -27.14155387878418, "global_step": 540293, "epoch": 6509} {"train_loss": -26.787036895751953, "global_step": 540294, "epoch": 6509} {"train_loss": -26.894025802612305, "global_step": 540295, "epoch": 6509} {"train_loss": -26.882282257080078, "global_step": 540296, "epoch": 6509} {"train_loss": -27.26685905456543, "global_step": 540297, "epoch": 6509} {"train_loss": -26.787378311157227, "global_step": 540298, "epoch": 6509} {"train_loss": -27.429616928100586, "global_step": 540299, "epoch": 6509} {"train_loss": -27.13815689086914, "global_step": 540300, "epoch": 6509} {"train_loss": -27.795400619506836, "global_step": 540301, "epoch": 6509} {"train_loss": -27.37754249572754, "global_step": 540302, "epoch": 6509} {"train_loss": -27.125165939331055, "global_step": 540303, "epoch": 6509} {"train_loss": -27.36785888671875, "global_step": 540304, "epoch": 6509} {"train_loss": -27.121030807495117, "global_step": 540305, "epoch": 6509} {"train_loss": -27.3970947265625, "global_step": 540306, "epoch": 6509} {"train_loss": -27.255155563354492, "global_step": 540307, "epoch": 6509} {"train_loss": -27.2719669342041, "global_step": 540308, "epoch": 6509} {"train_loss": -27.5074462890625, "global_step": 540309, "epoch": 6509} {"train_loss": -27.731918334960938, "global_step": 540310, "epoch": 6509} {"train_loss": -27.386816024780273, "global_step": 540311, "epoch": 6509} {"train_loss": -27.790176391601562, "global_step": 540312, "epoch": 6509} {"train_loss": -27.338891983032227, "global_step": 540313, "epoch": 6509} {"train_loss": -27.334171295166016, "global_step": 540314, "epoch": 6509} {"train_loss": -27.637556076049805, "global_step": 540315, "epoch": 6509} {"train_loss": -27.355121612548828, "global_step": 540316, "epoch": 6509} {"train_loss": -27.673114776611328, "global_step": 540317, "epoch": 6509} {"train_loss": -27.42795753479004, "global_step": 540318, "epoch": 6509} {"train_loss": -27.59629249572754, "global_step": 540319, "epoch": 6509} {"train_loss": -27.432947158813477, "global_step": 540320, "epoch": 6509} {"train_loss": -27.75697898864746, "global_step": 540321, "epoch": 6509} {"train_loss": -27.64515495300293, "global_step": 540322, "epoch": 6509} {"train_loss": -27.84331703186035, "global_step": 540323, "epoch": 6509} {"train_loss": -27.586572647094727, "global_step": 540324, "epoch": 6509} {"train_loss": -27.2165584564209, "global_step": 540325, "epoch": 6509} {"train_loss": -27.4680118560791, "global_step": 540326, "epoch": 6509} {"train_loss": -27.85688591003418, "global_step": 540327, "epoch": 6509} {"train_loss": -27.724456787109375, "global_step": 540328, "epoch": 6509} {"train_loss": -27.319176754319525, "global_step": 540329, "epoch": 6509, "val_loss": 6521760.5} {"train_loss": -25.84153175354004, "global_step": 540330, "epoch": 6510} {"train_loss": -25.797840118408203, "global_step": 540331, "epoch": 6510} {"train_loss": -26.6171932220459, "global_step": 540332, "epoch": 6510} {"train_loss": -26.28313636779785, "global_step": 540333, "epoch": 6510} {"train_loss": -26.444061279296875, "global_step": 540334, "epoch": 6510} {"train_loss": -27.049463272094727, "global_step": 540335, "epoch": 6510} {"train_loss": -26.383569717407227, "global_step": 540336, "epoch": 6510} {"train_loss": -26.96070671081543, "global_step": 540337, "epoch": 6510} {"train_loss": -25.899169921875, "global_step": 540338, "epoch": 6510} {"train_loss": -26.515256881713867, "global_step": 540339, "epoch": 6510} {"train_loss": -26.9295597076416, "global_step": 540340, "epoch": 6510} {"train_loss": -27.072372436523438, "global_step": 540341, "epoch": 6510} {"train_loss": -26.49273681640625, "global_step": 540342, "epoch": 6510} {"train_loss": -27.170856475830078, "global_step": 540343, "epoch": 6510} {"train_loss": -27.20998191833496, "global_step": 540344, "epoch": 6510} {"train_loss": -26.78371238708496, "global_step": 540345, "epoch": 6510} {"train_loss": -27.54886245727539, "global_step": 540346, "epoch": 6510} {"train_loss": -26.800302505493164, "global_step": 540347, "epoch": 6510} {"train_loss": -27.151823043823242, "global_step": 540348, "epoch": 6510} {"train_loss": -27.301807403564453, "global_step": 540349, "epoch": 6510} {"train_loss": -27.226104736328125, "global_step": 540350, "epoch": 6510} {"train_loss": -26.764150619506836, "global_step": 540351, "epoch": 6510} {"train_loss": -27.357975006103516, "global_step": 540352, "epoch": 6510} {"train_loss": -27.26797866821289, "global_step": 540353, "epoch": 6510} {"train_loss": -27.460935592651367, "global_step": 540354, "epoch": 6510} {"train_loss": -27.219690322875977, "global_step": 540355, "epoch": 6510} {"train_loss": -27.162092208862305, "global_step": 540356, "epoch": 6510} {"train_loss": -27.46778678894043, "global_step": 540357, "epoch": 6510} {"train_loss": -27.748554229736328, "global_step": 540358, "epoch": 6510} {"train_loss": -27.184356689453125, "global_step": 540359, "epoch": 6510} {"train_loss": -27.56292152404785, "global_step": 540360, "epoch": 6510} {"train_loss": -27.346166610717773, "global_step": 540361, "epoch": 6510} {"train_loss": -27.75605583190918, "global_step": 540362, "epoch": 6510} {"train_loss": -27.555265426635742, "global_step": 540363, "epoch": 6510} {"train_loss": -27.58429527282715, "global_step": 540364, "epoch": 6510} {"train_loss": -27.80144691467285, "global_step": 540365, "epoch": 6510} {"train_loss": -27.893640518188477, "global_step": 540366, "epoch": 6510} {"train_loss": -27.938684463500977, "global_step": 540367, "epoch": 6510} {"train_loss": -27.656660079956055, "global_step": 540368, "epoch": 6510} {"train_loss": -27.874231338500977, "global_step": 540369, "epoch": 6510} {"train_loss": -27.718795776367188, "global_step": 540370, "epoch": 6510} {"train_loss": -27.659381866455078, "global_step": 540371, "epoch": 6510} {"train_loss": -27.831317901611328, "global_step": 540372, "epoch": 6510} {"train_loss": -28.130767822265625, "global_step": 540373, "epoch": 6510} {"train_loss": -28.138492584228516, "global_step": 540374, "epoch": 6510} {"train_loss": -28.195587158203125, "global_step": 540375, "epoch": 6510} {"train_loss": -27.84665298461914, "global_step": 540376, "epoch": 6510} {"train_loss": -27.73499870300293, "global_step": 540377, "epoch": 6510} {"train_loss": -27.84650993347168, "global_step": 540378, "epoch": 6510} {"train_loss": -27.70318031311035, "global_step": 540379, "epoch": 6510} {"train_loss": -28.207311630249023, "global_step": 540380, "epoch": 6510} {"train_loss": -27.35101318359375, "global_step": 540381, "epoch": 6510} {"train_loss": -27.321685791015625, "global_step": 540382, "epoch": 6510} {"train_loss": -27.827667236328125, "global_step": 540383, "epoch": 6510} {"train_loss": -27.899770736694336, "global_step": 540384, "epoch": 6510} {"train_loss": -27.656721115112305, "global_step": 540385, "epoch": 6510} {"train_loss": -27.7528133392334, "global_step": 540386, "epoch": 6510} {"train_loss": -27.615339279174805, "global_step": 540387, "epoch": 6510} {"train_loss": -28.039474487304688, "global_step": 540388, "epoch": 6510} {"train_loss": -27.7850341796875, "global_step": 540389, "epoch": 6510} {"train_loss": -28.15384292602539, "global_step": 540390, "epoch": 6510} {"train_loss": -27.803455352783203, "global_step": 540391, "epoch": 6510} {"train_loss": -27.948352813720703, "global_step": 540392, "epoch": 6510} {"train_loss": -27.98223876953125, "global_step": 540393, "epoch": 6510} {"train_loss": -27.71133804321289, "global_step": 540394, "epoch": 6510} {"train_loss": -27.7103328704834, "global_step": 540395, "epoch": 6510} {"train_loss": -27.311527252197266, "global_step": 540396, "epoch": 6510} {"train_loss": -27.242877960205078, "global_step": 540397, "epoch": 6510} {"train_loss": -27.991592407226562, "global_step": 540398, "epoch": 6510} {"train_loss": -27.56661033630371, "global_step": 540399, "epoch": 6510} {"train_loss": -27.799551010131836, "global_step": 540400, "epoch": 6510} {"train_loss": -27.70952796936035, "global_step": 540401, "epoch": 6510} {"train_loss": -27.67402458190918, "global_step": 540402, "epoch": 6510} {"train_loss": -27.479644775390625, "global_step": 540403, "epoch": 6510} {"train_loss": -27.641714096069336, "global_step": 540404, "epoch": 6510} {"train_loss": -28.207599639892578, "global_step": 540405, "epoch": 6510} {"train_loss": -27.7069091796875, "global_step": 540406, "epoch": 6510} {"train_loss": -27.891382217407227, "global_step": 540407, "epoch": 6510} {"train_loss": -27.91529655456543, "global_step": 540408, "epoch": 6510} {"train_loss": -27.63448143005371, "global_step": 540409, "epoch": 6510} {"train_loss": -27.623762130737305, "global_step": 540410, "epoch": 6510} {"train_loss": -27.7639217376709, "global_step": 540411, "epoch": 6510} {"train_loss": -27.450923529015967, "global_step": 540412, "epoch": 6510, "val_loss": 6547947.0} {"train_loss": -26.524343490600586, "global_step": 540413, "epoch": 6511} {"train_loss": -25.719818115234375, "global_step": 540414, "epoch": 6511} {"train_loss": -26.874032974243164, "global_step": 540415, "epoch": 6511} {"train_loss": -26.914052963256836, "global_step": 540416, "epoch": 6511} {"train_loss": -26.29009437561035, "global_step": 540417, "epoch": 6511} {"train_loss": -26.448780059814453, "global_step": 540418, "epoch": 6511} {"train_loss": -26.32844352722168, "global_step": 540419, "epoch": 6511} {"train_loss": -25.973081588745117, "global_step": 540420, "epoch": 6511} {"train_loss": -26.576719284057617, "global_step": 540421, "epoch": 6511} {"train_loss": -26.428510665893555, "global_step": 540422, "epoch": 6511} {"train_loss": -26.949283599853516, "global_step": 540423, "epoch": 6511} {"train_loss": -26.42020034790039, "global_step": 540424, "epoch": 6511} {"train_loss": -26.724103927612305, "global_step": 540425, "epoch": 6511} {"train_loss": -27.23529624938965, "global_step": 540426, "epoch": 6511} {"train_loss": -27.362186431884766, "global_step": 540427, "epoch": 6511} {"train_loss": -27.44805908203125, "global_step": 540428, "epoch": 6511} {"train_loss": -27.13818359375, "global_step": 540429, "epoch": 6511} {"train_loss": -27.277877807617188, "global_step": 540430, "epoch": 6511} {"train_loss": -26.970556259155273, "global_step": 540431, "epoch": 6511} {"train_loss": -27.43635368347168, "global_step": 540432, "epoch": 6511} {"train_loss": -27.383758544921875, "global_step": 540433, "epoch": 6511} {"train_loss": -27.213333129882812, "global_step": 540434, "epoch": 6511} {"train_loss": -27.34651756286621, "global_step": 540435, "epoch": 6511} {"train_loss": -27.67927360534668, "global_step": 540436, "epoch": 6511} {"train_loss": -27.733747482299805, "global_step": 540437, "epoch": 6511} {"train_loss": -27.307783126831055, "global_step": 540438, "epoch": 6511} {"train_loss": -27.325244903564453, "global_step": 540439, "epoch": 6511} {"train_loss": -27.32061767578125, "global_step": 540440, "epoch": 6511} {"train_loss": -27.712743759155273, "global_step": 540441, "epoch": 6511} {"train_loss": -27.7446346282959, "global_step": 540442, "epoch": 6511} {"train_loss": -27.648590087890625, "global_step": 540443, "epoch": 6511} {"train_loss": -27.41200828552246, "global_step": 540444, "epoch": 6511} {"train_loss": -27.630268096923828, "global_step": 540445, "epoch": 6511} {"train_loss": -27.389272689819336, "global_step": 540446, "epoch": 6511} {"train_loss": -27.21673011779785, "global_step": 540447, "epoch": 6511} {"train_loss": -27.781641006469727, "global_step": 540448, "epoch": 6511} {"train_loss": -27.67518424987793, "global_step": 540449, "epoch": 6511} {"train_loss": -27.649993896484375, "global_step": 540450, "epoch": 6511} {"train_loss": -28.14466667175293, "global_step": 540451, "epoch": 6511} {"train_loss": -27.878149032592773, "global_step": 540452, "epoch": 6511} {"train_loss": -27.830183029174805, "global_step": 540453, "epoch": 6511} {"train_loss": -27.988739013671875, "global_step": 540454, "epoch": 6511} {"train_loss": -27.87763786315918, "global_step": 540455, "epoch": 6511} {"train_loss": -27.75008201599121, "global_step": 540456, "epoch": 6511} {"train_loss": -27.7454833984375, "global_step": 540457, "epoch": 6511} {"train_loss": -27.805591583251953, "global_step": 540458, "epoch": 6511} {"train_loss": -28.172033309936523, "global_step": 540459, "epoch": 6511} {"train_loss": -27.996307373046875, "global_step": 540460, "epoch": 6511} {"train_loss": -27.751514434814453, "global_step": 540461, "epoch": 6511} {"train_loss": -27.911609649658203, "global_step": 540462, "epoch": 6511} {"train_loss": -27.960424423217773, "global_step": 540463, "epoch": 6511} {"train_loss": -27.722198486328125, "global_step": 540464, "epoch": 6511} {"train_loss": -27.99386978149414, "global_step": 540465, "epoch": 6511} {"train_loss": -27.87579917907715, "global_step": 540466, "epoch": 6511} {"train_loss": -28.231470108032227, "global_step": 540467, "epoch": 6511} {"train_loss": -27.704864501953125, "global_step": 540468, "epoch": 6511} {"train_loss": -27.798294067382812, "global_step": 540469, "epoch": 6511} {"train_loss": -27.791763305664062, "global_step": 540470, "epoch": 6511} {"train_loss": -27.763198852539062, "global_step": 540471, "epoch": 6511} {"train_loss": -27.97108268737793, "global_step": 540472, "epoch": 6511} {"train_loss": -27.610340118408203, "global_step": 540473, "epoch": 6511} {"train_loss": -26.92453384399414, "global_step": 540474, "epoch": 6511} {"train_loss": -27.001602172851562, "global_step": 540475, "epoch": 6511} {"train_loss": -27.36121940612793, "global_step": 540476, "epoch": 6511} {"train_loss": -27.41896629333496, "global_step": 540477, "epoch": 6511} {"train_loss": -27.55419921875, "global_step": 540478, "epoch": 6511} {"train_loss": -27.890308380126953, "global_step": 540479, "epoch": 6511} {"train_loss": -27.689863204956055, "global_step": 540480, "epoch": 6511} {"train_loss": -27.644088745117188, "global_step": 540481, "epoch": 6511} {"train_loss": -27.974414825439453, "global_step": 540482, "epoch": 6511} {"train_loss": -27.682714462280273, "global_step": 540483, "epoch": 6511} {"train_loss": -28.155853271484375, "global_step": 540484, "epoch": 6511} {"train_loss": -27.7928409576416, "global_step": 540485, "epoch": 6511} {"train_loss": -27.576019287109375, "global_step": 540486, "epoch": 6511} {"train_loss": -27.963062286376953, "global_step": 540487, "epoch": 6511} {"train_loss": -27.502309799194336, "global_step": 540488, "epoch": 6511} {"train_loss": -27.624303817749023, "global_step": 540489, "epoch": 6511} {"train_loss": -27.758203506469727, "global_step": 540490, "epoch": 6511} {"train_loss": -27.694730758666992, "global_step": 540491, "epoch": 6511} {"train_loss": -27.49842643737793, "global_step": 540492, "epoch": 6511} {"train_loss": -27.388538360595703, "global_step": 540493, "epoch": 6511} {"train_loss": -26.749963760375977, "global_step": 540494, "epoch": 6511} {"train_loss": -27.45208122069577, "global_step": 540495, "epoch": 6511, "val_loss": 6525470.0} {"train_loss": -26.7092227935791, "global_step": 540496, "epoch": 6512} {"train_loss": -23.112897872924805, "global_step": 540497, "epoch": 6512} {"train_loss": -21.977453231811523, "global_step": 540498, "epoch": 6512} {"train_loss": -26.113067626953125, "global_step": 540499, "epoch": 6512} {"train_loss": -25.209672927856445, "global_step": 540500, "epoch": 6512} {"train_loss": -25.409456253051758, "global_step": 540501, "epoch": 6512} {"train_loss": -25.59442710876465, "global_step": 540502, "epoch": 6512} {"train_loss": -26.539764404296875, "global_step": 540503, "epoch": 6512} {"train_loss": -26.24956703186035, "global_step": 540504, "epoch": 6512} {"train_loss": -26.63789176940918, "global_step": 540505, "epoch": 6512} {"train_loss": -26.821231842041016, "global_step": 540506, "epoch": 6512} {"train_loss": -25.938648223876953, "global_step": 540507, "epoch": 6512} {"train_loss": -26.927473068237305, "global_step": 540508, "epoch": 6512} {"train_loss": -26.903554916381836, "global_step": 540509, "epoch": 6512} {"train_loss": -26.719724655151367, "global_step": 540510, "epoch": 6512} {"train_loss": -26.564855575561523, "global_step": 540511, "epoch": 6512} {"train_loss": -26.857410430908203, "global_step": 540512, "epoch": 6512} {"train_loss": -26.901081085205078, "global_step": 540513, "epoch": 6512} {"train_loss": -26.84547996520996, "global_step": 540514, "epoch": 6512} {"train_loss": -27.140378952026367, "global_step": 540515, "epoch": 6512} {"train_loss": -26.93610954284668, "global_step": 540516, "epoch": 6512} {"train_loss": -27.18855094909668, "global_step": 540517, "epoch": 6512} {"train_loss": -27.078596115112305, "global_step": 540518, "epoch": 6512} {"train_loss": -27.04910659790039, "global_step": 540519, "epoch": 6512} {"train_loss": -27.300458908081055, "global_step": 540520, "epoch": 6512} {"train_loss": -27.16810417175293, "global_step": 540521, "epoch": 6512} {"train_loss": -27.1331844329834, "global_step": 540522, "epoch": 6512} {"train_loss": -27.28912353515625, "global_step": 540523, "epoch": 6512} {"train_loss": -26.72085952758789, "global_step": 540524, "epoch": 6512} {"train_loss": -26.939300537109375, "global_step": 540525, "epoch": 6512} {"train_loss": -27.23516845703125, "global_step": 540526, "epoch": 6512} {"train_loss": -27.017988204956055, "global_step": 540527, "epoch": 6512} {"train_loss": -27.509550094604492, "global_step": 540528, "epoch": 6512} {"train_loss": -27.465728759765625, "global_step": 540529, "epoch": 6512} {"train_loss": -27.1661319732666, "global_step": 540530, "epoch": 6512} {"train_loss": -27.150955200195312, "global_step": 540531, "epoch": 6512} {"train_loss": -27.303770065307617, "global_step": 540532, "epoch": 6512} {"train_loss": -27.680639266967773, "global_step": 540533, "epoch": 6512} {"train_loss": -27.522876739501953, "global_step": 540534, "epoch": 6512} {"train_loss": -27.550647735595703, "global_step": 540535, "epoch": 6512} {"train_loss": -27.78230094909668, "global_step": 540536, "epoch": 6512} {"train_loss": -27.882221221923828, "global_step": 540537, "epoch": 6512} {"train_loss": -27.7805118560791, "global_step": 540538, "epoch": 6512} {"train_loss": -27.836502075195312, "global_step": 540539, "epoch": 6512} {"train_loss": -27.726099014282227, "global_step": 540540, "epoch": 6512} {"train_loss": -27.82935905456543, "global_step": 540541, "epoch": 6512} {"train_loss": -27.60101890563965, "global_step": 540542, "epoch": 6512} {"train_loss": -27.71866226196289, "global_step": 540543, "epoch": 6512} {"train_loss": -27.806379318237305, "global_step": 540544, "epoch": 6512} {"train_loss": -27.724884033203125, "global_step": 540545, "epoch": 6512} {"train_loss": -27.518564224243164, "global_step": 540546, "epoch": 6512} {"train_loss": -27.537153244018555, "global_step": 540547, "epoch": 6512} {"train_loss": -27.55314064025879, "global_step": 540548, "epoch": 6512} {"train_loss": -28.09572410583496, "global_step": 540549, "epoch": 6512} {"train_loss": -27.710901260375977, "global_step": 540550, "epoch": 6512} {"train_loss": -27.965864181518555, "global_step": 540551, "epoch": 6512} {"train_loss": -27.62513542175293, "global_step": 540552, "epoch": 6512} {"train_loss": -27.61799430847168, "global_step": 540553, "epoch": 6512} {"train_loss": -27.932086944580078, "global_step": 540554, "epoch": 6512} {"train_loss": -27.87163734436035, "global_step": 540555, "epoch": 6512} {"train_loss": -27.809595108032227, "global_step": 540556, "epoch": 6512} {"train_loss": -27.728139877319336, "global_step": 540557, "epoch": 6512} {"train_loss": -28.38694190979004, "global_step": 540558, "epoch": 6512} {"train_loss": -28.004911422729492, "global_step": 540559, "epoch": 6512} {"train_loss": -27.588998794555664, "global_step": 540560, "epoch": 6512} {"train_loss": -27.605749130249023, "global_step": 540561, "epoch": 6512} {"train_loss": -27.511016845703125, "global_step": 540562, "epoch": 6512} {"train_loss": -27.29217529296875, "global_step": 540563, "epoch": 6512} {"train_loss": -27.544544219970703, "global_step": 540564, "epoch": 6512} {"train_loss": -27.99225425720215, "global_step": 540565, "epoch": 6512} {"train_loss": -27.635217666625977, "global_step": 540566, "epoch": 6512} {"train_loss": -27.83984375, "global_step": 540567, "epoch": 6512} {"train_loss": -27.40573501586914, "global_step": 540568, "epoch": 6512} {"train_loss": -27.7011661529541, "global_step": 540569, "epoch": 6512} {"train_loss": -27.71099281311035, "global_step": 540570, "epoch": 6512} {"train_loss": -27.3610782623291, "global_step": 540571, "epoch": 6512} {"train_loss": -27.81597328186035, "global_step": 540572, "epoch": 6512} {"train_loss": -27.79139518737793, "global_step": 540573, "epoch": 6512} {"train_loss": -27.75322914123535, "global_step": 540574, "epoch": 6512} {"train_loss": -27.472436904907227, "global_step": 540575, "epoch": 6512} {"train_loss": -27.405471801757812, "global_step": 540576, "epoch": 6512} {"train_loss": -27.514368057250977, "global_step": 540577, "epoch": 6512} {"train_loss": -27.170855372785084, "global_step": 540578, "epoch": 6512, "val_loss": 6524722.0} {"train_loss": -26.87299919128418, "global_step": 540579, "epoch": 6513} {"train_loss": -26.506818771362305, "global_step": 540580, "epoch": 6513} {"train_loss": -27.141523361206055, "global_step": 540581, "epoch": 6513} {"train_loss": -27.07216453552246, "global_step": 540582, "epoch": 6513} {"train_loss": -27.5628662109375, "global_step": 540583, "epoch": 6513} {"train_loss": -27.30849266052246, "global_step": 540584, "epoch": 6513} {"train_loss": -27.088642120361328, "global_step": 540585, "epoch": 6513} {"train_loss": -27.014062881469727, "global_step": 540586, "epoch": 6513} {"train_loss": -27.27723503112793, "global_step": 540587, "epoch": 6513} {"train_loss": -27.619421005249023, "global_step": 540588, "epoch": 6513} {"train_loss": -27.48090934753418, "global_step": 540589, "epoch": 6513} {"train_loss": -27.118757247924805, "global_step": 540590, "epoch": 6513} {"train_loss": -27.521543502807617, "global_step": 540591, "epoch": 6513} {"train_loss": -27.67103385925293, "global_step": 540592, "epoch": 6513} {"train_loss": -27.3026123046875, "global_step": 540593, "epoch": 6513} {"train_loss": -27.71624183654785, "global_step": 540594, "epoch": 6513} {"train_loss": -27.500577926635742, "global_step": 540595, "epoch": 6513} {"train_loss": -27.32756996154785, "global_step": 540596, "epoch": 6513} {"train_loss": -28.106189727783203, "global_step": 540597, "epoch": 6513} {"train_loss": -27.508865356445312, "global_step": 540598, "epoch": 6513} {"train_loss": -27.791519165039062, "global_step": 540599, "epoch": 6513} {"train_loss": -27.62933349609375, "global_step": 540600, "epoch": 6513} {"train_loss": -27.625980377197266, "global_step": 540601, "epoch": 6513} {"train_loss": -27.605945587158203, "global_step": 540602, "epoch": 6513} {"train_loss": -27.623340606689453, "global_step": 540603, "epoch": 6513} {"train_loss": -27.06167984008789, "global_step": 540604, "epoch": 6513} {"train_loss": -27.28666114807129, "global_step": 540605, "epoch": 6513} {"train_loss": -27.37507438659668, "global_step": 540606, "epoch": 6513} {"train_loss": -27.51997184753418, "global_step": 540607, "epoch": 6513} {"train_loss": -27.413928985595703, "global_step": 540608, "epoch": 6513} {"train_loss": -27.639423370361328, "global_step": 540609, "epoch": 6513} {"train_loss": -27.77618980407715, "global_step": 540610, "epoch": 6513} {"train_loss": -27.347412109375, "global_step": 540611, "epoch": 6513} {"train_loss": -27.18824577331543, "global_step": 540612, "epoch": 6513} {"train_loss": -27.626361846923828, "global_step": 540613, "epoch": 6513} {"train_loss": -27.600757598876953, "global_step": 540614, "epoch": 6513} {"train_loss": -27.47206687927246, "global_step": 540615, "epoch": 6513} {"train_loss": -27.904224395751953, "global_step": 540616, "epoch": 6513} {"train_loss": -27.933324813842773, "global_step": 540617, "epoch": 6513} {"train_loss": -27.473474502563477, "global_step": 540618, "epoch": 6513} {"train_loss": -27.682886123657227, "global_step": 540619, "epoch": 6513} {"train_loss": -27.34193992614746, "global_step": 540620, "epoch": 6513} {"train_loss": -27.779260635375977, "global_step": 540621, "epoch": 6513} {"train_loss": -27.89580726623535, "global_step": 540622, "epoch": 6513} {"train_loss": -27.42510986328125, "global_step": 540623, "epoch": 6513} {"train_loss": -27.457061767578125, "global_step": 540624, "epoch": 6513} {"train_loss": -27.80234146118164, "global_step": 540625, "epoch": 6513} {"train_loss": -27.7525634765625, "global_step": 540626, "epoch": 6513} {"train_loss": -27.396657943725586, "global_step": 540627, "epoch": 6513} {"train_loss": -27.8299617767334, "global_step": 540628, "epoch": 6513} {"train_loss": -27.805866241455078, "global_step": 540629, "epoch": 6513} {"train_loss": -27.98179054260254, "global_step": 540630, "epoch": 6513} {"train_loss": -27.368396759033203, "global_step": 540631, "epoch": 6513} {"train_loss": -27.515308380126953, "global_step": 540632, "epoch": 6513} {"train_loss": -27.53412437438965, "global_step": 540633, "epoch": 6513} {"train_loss": -27.251327514648438, "global_step": 540634, "epoch": 6513} {"train_loss": -27.390119552612305, "global_step": 540635, "epoch": 6513} {"train_loss": -27.397668838500977, "global_step": 540636, "epoch": 6513} {"train_loss": -27.315221786499023, "global_step": 540637, "epoch": 6513} {"train_loss": -27.663837432861328, "global_step": 540638, "epoch": 6513} {"train_loss": -27.444915771484375, "global_step": 540639, "epoch": 6513} {"train_loss": -27.6093692779541, "global_step": 540640, "epoch": 6513} {"train_loss": -27.466480255126953, "global_step": 540641, "epoch": 6513} {"train_loss": -27.803991317749023, "global_step": 540642, "epoch": 6513} {"train_loss": -27.87775993347168, "global_step": 540643, "epoch": 6513} {"train_loss": -27.504993438720703, "global_step": 540644, "epoch": 6513} {"train_loss": -27.970117568969727, "global_step": 540645, "epoch": 6513} {"train_loss": -27.960718154907227, "global_step": 540646, "epoch": 6513} {"train_loss": -27.776334762573242, "global_step": 540647, "epoch": 6513} {"train_loss": -27.795286178588867, "global_step": 540648, "epoch": 6513} {"train_loss": -27.772974014282227, "global_step": 540649, "epoch": 6513} {"train_loss": -27.716161727905273, "global_step": 540650, "epoch": 6513} {"train_loss": -27.843469619750977, "global_step": 540651, "epoch": 6513} {"train_loss": -27.612394332885742, "global_step": 540652, "epoch": 6513} {"train_loss": -27.750024795532227, "global_step": 540653, "epoch": 6513} {"train_loss": -28.044824600219727, "global_step": 540654, "epoch": 6513} {"train_loss": -27.841028213500977, "global_step": 540655, "epoch": 6513} {"train_loss": -27.740238189697266, "global_step": 540656, "epoch": 6513} {"train_loss": -27.637592315673828, "global_step": 540657, "epoch": 6513} {"train_loss": -28.123950958251953, "global_step": 540658, "epoch": 6513} {"train_loss": -27.708770751953125, "global_step": 540659, "epoch": 6513} {"train_loss": -27.534442901611328, "global_step": 540660, "epoch": 6513} {"train_loss": -27.5563110903085, "global_step": 540661, "epoch": 6513, "val_loss": 6480935.0} {"train_loss": -26.936506271362305, "global_step": 540662, "epoch": 6514} {"train_loss": -26.481571197509766, "global_step": 540663, "epoch": 6514} {"train_loss": -26.394001007080078, "global_step": 540664, "epoch": 6514} {"train_loss": -27.100112915039062, "global_step": 540665, "epoch": 6514} {"train_loss": -26.312864303588867, "global_step": 540666, "epoch": 6514} {"train_loss": -26.86439323425293, "global_step": 540667, "epoch": 6514} {"train_loss": -27.09177589416504, "global_step": 540668, "epoch": 6514} {"train_loss": -26.8472843170166, "global_step": 540669, "epoch": 6514} {"train_loss": -27.04180908203125, "global_step": 540670, "epoch": 6514} {"train_loss": -27.493244171142578, "global_step": 540671, "epoch": 6514} {"train_loss": -27.18778419494629, "global_step": 540672, "epoch": 6514} {"train_loss": -26.760488510131836, "global_step": 540673, "epoch": 6514} {"train_loss": -27.21787452697754, "global_step": 540674, "epoch": 6514} {"train_loss": -27.32356071472168, "global_step": 540675, "epoch": 6514} {"train_loss": -27.27146339416504, "global_step": 540676, "epoch": 6514} {"train_loss": -27.239850997924805, "global_step": 540677, "epoch": 6514} {"train_loss": -27.43412208557129, "global_step": 540678, "epoch": 6514} {"train_loss": -27.261999130249023, "global_step": 540679, "epoch": 6514} {"train_loss": -27.153974533081055, "global_step": 540680, "epoch": 6514} {"train_loss": -27.4211368560791, "global_step": 540681, "epoch": 6514} {"train_loss": -26.87637710571289, "global_step": 540682, "epoch": 6514} {"train_loss": -27.18808937072754, "global_step": 540683, "epoch": 6514} {"train_loss": -27.72950553894043, "global_step": 540684, "epoch": 6514} {"train_loss": -27.36456871032715, "global_step": 540685, "epoch": 6514} {"train_loss": -27.559667587280273, "global_step": 540686, "epoch": 6514} {"train_loss": -27.824838638305664, "global_step": 540687, "epoch": 6514} {"train_loss": -27.5473575592041, "global_step": 540688, "epoch": 6514} {"train_loss": -27.57330894470215, "global_step": 540689, "epoch": 6514} {"train_loss": -28.0199031829834, "global_step": 540690, "epoch": 6514} {"train_loss": -27.569799423217773, "global_step": 540691, "epoch": 6514} {"train_loss": -27.668228149414062, "global_step": 540692, "epoch": 6514} {"train_loss": -27.755924224853516, "global_step": 540693, "epoch": 6514} {"train_loss": -27.85321044921875, "global_step": 540694, "epoch": 6514} {"train_loss": -28.130563735961914, "global_step": 540695, "epoch": 6514} {"train_loss": -27.382007598876953, "global_step": 540696, "epoch": 6514} {"train_loss": -27.921003341674805, "global_step": 540697, "epoch": 6514} {"train_loss": -27.7524471282959, "global_step": 540698, "epoch": 6514} {"train_loss": -27.48457145690918, "global_step": 540699, "epoch": 6514} {"train_loss": -27.598114013671875, "global_step": 540700, "epoch": 6514} {"train_loss": -27.896442413330078, "global_step": 540701, "epoch": 6514} {"train_loss": -27.806325912475586, "global_step": 540702, "epoch": 6514} {"train_loss": -28.02808952331543, "global_step": 540703, "epoch": 6514} {"train_loss": -27.93521499633789, "global_step": 540704, "epoch": 6514} {"train_loss": -27.897672653198242, "global_step": 540705, "epoch": 6514} {"train_loss": -27.760089874267578, "global_step": 540706, "epoch": 6514} {"train_loss": -28.02141761779785, "global_step": 540707, "epoch": 6514} {"train_loss": -27.717716217041016, "global_step": 540708, "epoch": 6514} {"train_loss": -27.983551025390625, "global_step": 540709, "epoch": 6514} {"train_loss": -28.006732940673828, "global_step": 540710, "epoch": 6514} {"train_loss": -27.867963790893555, "global_step": 540711, "epoch": 6514} {"train_loss": -27.819799423217773, "global_step": 540712, "epoch": 6514} {"train_loss": -28.203739166259766, "global_step": 540713, "epoch": 6514} {"train_loss": -27.960065841674805, "global_step": 540714, "epoch": 6514} {"train_loss": -27.4659366607666, "global_step": 540715, "epoch": 6514} {"train_loss": -27.688756942749023, "global_step": 540716, "epoch": 6514} {"train_loss": -27.729461669921875, "global_step": 540717, "epoch": 6514} {"train_loss": -27.936323165893555, "global_step": 540718, "epoch": 6514} {"train_loss": -27.94508171081543, "global_step": 540719, "epoch": 6514} {"train_loss": -27.493701934814453, "global_step": 540720, "epoch": 6514} {"train_loss": -27.715280532836914, "global_step": 540721, "epoch": 6514} {"train_loss": -27.692136764526367, "global_step": 540722, "epoch": 6514} {"train_loss": -27.601673126220703, "global_step": 540723, "epoch": 6514} {"train_loss": -27.271072387695312, "global_step": 540724, "epoch": 6514} {"train_loss": -28.02077293395996, "global_step": 540725, "epoch": 6514} {"train_loss": -28.09284019470215, "global_step": 540726, "epoch": 6514} {"train_loss": -28.10968017578125, "global_step": 540727, "epoch": 6514} {"train_loss": -27.940921783447266, "global_step": 540728, "epoch": 6514} {"train_loss": -27.683164596557617, "global_step": 540729, "epoch": 6514} {"train_loss": -27.5759220123291, "global_step": 540730, "epoch": 6514} {"train_loss": -28.079572677612305, "global_step": 540731, "epoch": 6514} {"train_loss": -27.691181182861328, "global_step": 540732, "epoch": 6514} {"train_loss": -27.87830924987793, "global_step": 540733, "epoch": 6514} {"train_loss": -27.8414363861084, "global_step": 540734, "epoch": 6514} {"train_loss": -27.513341903686523, "global_step": 540735, "epoch": 6514} {"train_loss": -27.0906982421875, "global_step": 540736, "epoch": 6514} {"train_loss": -27.178150177001953, "global_step": 540737, "epoch": 6514} {"train_loss": -27.306432723999023, "global_step": 540738, "epoch": 6514} {"train_loss": -27.174896240234375, "global_step": 540739, "epoch": 6514} {"train_loss": -27.672168731689453, "global_step": 540740, "epoch": 6514} {"train_loss": -27.439252853393555, "global_step": 540741, "epoch": 6514} {"train_loss": -27.48529624938965, "global_step": 540742, "epoch": 6514} {"train_loss": -27.92926025390625, "global_step": 540743, "epoch": 6514} {"train_loss": -27.530762821794994, "global_step": 540744, "epoch": 6514, "val_loss": 6496551.0} {"train_loss": -27.186676025390625, "global_step": 540745, "epoch": 6515} {"train_loss": -27.295984268188477, "global_step": 540746, "epoch": 6515} {"train_loss": -27.309814453125, "global_step": 540747, "epoch": 6515} {"train_loss": -27.416976928710938, "global_step": 540748, "epoch": 6515} {"train_loss": -27.288345336914062, "global_step": 540749, "epoch": 6515} {"train_loss": -27.455596923828125, "global_step": 540750, "epoch": 6515} {"train_loss": -27.10869789123535, "global_step": 540751, "epoch": 6515} {"train_loss": -27.4798583984375, "global_step": 540752, "epoch": 6515} {"train_loss": -27.34112548828125, "global_step": 540753, "epoch": 6515} {"train_loss": -27.31268310546875, "global_step": 540754, "epoch": 6515} {"train_loss": -27.579370498657227, "global_step": 540755, "epoch": 6515} {"train_loss": -27.443090438842773, "global_step": 540756, "epoch": 6515} {"train_loss": -27.51228904724121, "global_step": 540757, "epoch": 6515} {"train_loss": -27.499937057495117, "global_step": 540758, "epoch": 6515} {"train_loss": -27.57151222229004, "global_step": 540759, "epoch": 6515} {"train_loss": -27.478870391845703, "global_step": 540760, "epoch": 6515} {"train_loss": -27.341339111328125, "global_step": 540761, "epoch": 6515} {"train_loss": -27.54141616821289, "global_step": 540762, "epoch": 6515} {"train_loss": -27.614896774291992, "global_step": 540763, "epoch": 6515} {"train_loss": -27.58497428894043, "global_step": 540764, "epoch": 6515} {"train_loss": -27.20130729675293, "global_step": 540765, "epoch": 6515} {"train_loss": -27.682870864868164, "global_step": 540766, "epoch": 6515} {"train_loss": -27.507638931274414, "global_step": 540767, "epoch": 6515} {"train_loss": -27.710163116455078, "global_step": 540768, "epoch": 6515} {"train_loss": -27.523218154907227, "global_step": 540769, "epoch": 6515} {"train_loss": -27.452356338500977, "global_step": 540770, "epoch": 6515} {"train_loss": -27.419584274291992, "global_step": 540771, "epoch": 6515} {"train_loss": -27.37869644165039, "global_step": 540772, "epoch": 6515} {"train_loss": -27.85675621032715, "global_step": 540773, "epoch": 6515} {"train_loss": -27.773351669311523, "global_step": 540774, "epoch": 6515} {"train_loss": -27.51239585876465, "global_step": 540775, "epoch": 6515} {"train_loss": -27.7178897857666, "global_step": 540776, "epoch": 6515} {"train_loss": -28.153369903564453, "global_step": 540777, "epoch": 6515} {"train_loss": -27.792184829711914, "global_step": 540778, "epoch": 6515} {"train_loss": -27.6217098236084, "global_step": 540779, "epoch": 6515} {"train_loss": -27.53936767578125, "global_step": 540780, "epoch": 6515} {"train_loss": -27.469480514526367, "global_step": 540781, "epoch": 6515} {"train_loss": -27.7393798828125, "global_step": 540782, "epoch": 6515} {"train_loss": -27.60011100769043, "global_step": 540783, "epoch": 6515} {"train_loss": -27.695098876953125, "global_step": 540784, "epoch": 6515} {"train_loss": -27.76220703125, "global_step": 540785, "epoch": 6515} {"train_loss": -27.942441940307617, "global_step": 540786, "epoch": 6515} {"train_loss": -28.055105209350586, "global_step": 540787, "epoch": 6515} {"train_loss": -28.106952667236328, "global_step": 540788, "epoch": 6515} {"train_loss": -27.556995391845703, "global_step": 540789, "epoch": 6515} {"train_loss": -27.3245906829834, "global_step": 540790, "epoch": 6515} {"train_loss": -27.2585506439209, "global_step": 540791, "epoch": 6515} {"train_loss": -28.035266876220703, "global_step": 540792, "epoch": 6515} {"train_loss": -28.142675399780273, "global_step": 540793, "epoch": 6515} {"train_loss": -27.759170532226562, "global_step": 540794, "epoch": 6515} {"train_loss": -27.519180297851562, "global_step": 540795, "epoch": 6515} {"train_loss": -27.791418075561523, "global_step": 540796, "epoch": 6515} {"train_loss": -27.20118522644043, "global_step": 540797, "epoch": 6515} {"train_loss": -27.652780532836914, "global_step": 540798, "epoch": 6515} {"train_loss": -27.7913875579834, "global_step": 540799, "epoch": 6515} {"train_loss": -27.70098304748535, "global_step": 540800, "epoch": 6515} {"train_loss": -27.874622344970703, "global_step": 540801, "epoch": 6515} {"train_loss": -27.6373348236084, "global_step": 540802, "epoch": 6515} {"train_loss": -27.942678451538086, "global_step": 540803, "epoch": 6515} {"train_loss": -27.425769805908203, "global_step": 540804, "epoch": 6515} {"train_loss": -27.75758171081543, "global_step": 540805, "epoch": 6515} {"train_loss": -27.677967071533203, "global_step": 540806, "epoch": 6515} {"train_loss": -27.794315338134766, "global_step": 540807, "epoch": 6515} {"train_loss": -27.601781845092773, "global_step": 540808, "epoch": 6515} {"train_loss": -27.247709274291992, "global_step": 540809, "epoch": 6515} {"train_loss": -27.552534103393555, "global_step": 540810, "epoch": 6515} {"train_loss": -27.81906509399414, "global_step": 540811, "epoch": 6515} {"train_loss": -27.625686645507812, "global_step": 540812, "epoch": 6515} {"train_loss": -27.317514419555664, "global_step": 540813, "epoch": 6515} {"train_loss": -27.458343505859375, "global_step": 540814, "epoch": 6515} {"train_loss": -28.12784767150879, "global_step": 540815, "epoch": 6515} {"train_loss": -27.33650016784668, "global_step": 540816, "epoch": 6515} {"train_loss": -27.727643966674805, "global_step": 540817, "epoch": 6515} {"train_loss": -27.667713165283203, "global_step": 540818, "epoch": 6515} {"train_loss": -27.70016860961914, "global_step": 540819, "epoch": 6515} {"train_loss": -27.6672306060791, "global_step": 540820, "epoch": 6515} {"train_loss": -27.43829917907715, "global_step": 540821, "epoch": 6515} {"train_loss": -27.83670997619629, "global_step": 540822, "epoch": 6515} {"train_loss": -27.736413955688477, "global_step": 540823, "epoch": 6515} {"train_loss": -27.513763427734375, "global_step": 540824, "epoch": 6515} {"train_loss": -27.917158126831055, "global_step": 540825, "epoch": 6515} {"train_loss": -27.796051025390625, "global_step": 540826, "epoch": 6515} {"train_loss": -27.6095990789942, "global_step": 540827, "epoch": 6515, "val_loss": 6511770.0} {"train_loss": -26.9291934967041, "global_step": 540828, "epoch": 6516} {"train_loss": -27.18861198425293, "global_step": 540829, "epoch": 6516} {"train_loss": -26.993701934814453, "global_step": 540830, "epoch": 6516} {"train_loss": -27.503925323486328, "global_step": 540831, "epoch": 6516} {"train_loss": -26.82857322692871, "global_step": 540832, "epoch": 6516} {"train_loss": -27.385709762573242, "global_step": 540833, "epoch": 6516} {"train_loss": -27.267751693725586, "global_step": 540834, "epoch": 6516} {"train_loss": -27.025434494018555, "global_step": 540835, "epoch": 6516} {"train_loss": -26.911352157592773, "global_step": 540836, "epoch": 6516} {"train_loss": -27.260480880737305, "global_step": 540837, "epoch": 6516} {"train_loss": -27.829435348510742, "global_step": 540838, "epoch": 6516} {"train_loss": -27.4240665435791, "global_step": 540839, "epoch": 6516} {"train_loss": -27.300973892211914, "global_step": 540840, "epoch": 6516} {"train_loss": -27.528583526611328, "global_step": 540841, "epoch": 6516} {"train_loss": -27.167455673217773, "global_step": 540842, "epoch": 6516} {"train_loss": -27.656545639038086, "global_step": 540843, "epoch": 6516} {"train_loss": -27.360578536987305, "global_step": 540844, "epoch": 6516} {"train_loss": -27.73734474182129, "global_step": 540845, "epoch": 6516} {"train_loss": -27.468769073486328, "global_step": 540846, "epoch": 6516} {"train_loss": -27.68372917175293, "global_step": 540847, "epoch": 6516} {"train_loss": -27.24371337890625, "global_step": 540848, "epoch": 6516} {"train_loss": -27.704679489135742, "global_step": 540849, "epoch": 6516} {"train_loss": -27.63149070739746, "global_step": 540850, "epoch": 6516} {"train_loss": -27.47324562072754, "global_step": 540851, "epoch": 6516} {"train_loss": -27.53271484375, "global_step": 540852, "epoch": 6516} {"train_loss": -27.74896240234375, "global_step": 540853, "epoch": 6516} {"train_loss": -27.446081161499023, "global_step": 540854, "epoch": 6516} {"train_loss": -27.414051055908203, "global_step": 540855, "epoch": 6516} {"train_loss": -27.639007568359375, "global_step": 540856, "epoch": 6516} {"train_loss": -27.762863159179688, "global_step": 540857, "epoch": 6516} {"train_loss": -27.5340576171875, "global_step": 540858, "epoch": 6516} {"train_loss": -27.515979766845703, "global_step": 540859, "epoch": 6516} {"train_loss": -27.80561637878418, "global_step": 540860, "epoch": 6516} {"train_loss": -27.7387638092041, "global_step": 540861, "epoch": 6516} {"train_loss": -27.488361358642578, "global_step": 540862, "epoch": 6516} {"train_loss": -27.587631225585938, "global_step": 540863, "epoch": 6516} {"train_loss": -27.972509384155273, "global_step": 540864, "epoch": 6516} {"train_loss": -27.81097412109375, "global_step": 540865, "epoch": 6516} {"train_loss": -27.81878089904785, "global_step": 540866, "epoch": 6516} {"train_loss": -27.84735679626465, "global_step": 540867, "epoch": 6516} {"train_loss": -27.785253524780273, "global_step": 540868, "epoch": 6516} {"train_loss": -27.721405029296875, "global_step": 540869, "epoch": 6516} {"train_loss": -27.8035945892334, "global_step": 540870, "epoch": 6516} {"train_loss": -28.45279884338379, "global_step": 540871, "epoch": 6516} {"train_loss": -28.00314712524414, "global_step": 540872, "epoch": 6516} {"train_loss": -27.578718185424805, "global_step": 540873, "epoch": 6516} {"train_loss": -27.850500106811523, "global_step": 540874, "epoch": 6516} {"train_loss": -27.678064346313477, "global_step": 540875, "epoch": 6516} {"train_loss": -27.5502872467041, "global_step": 540876, "epoch": 6516} {"train_loss": -27.41131019592285, "global_step": 540877, "epoch": 6516} {"train_loss": -27.752485275268555, "global_step": 540878, "epoch": 6516} {"train_loss": -28.048614501953125, "global_step": 540879, "epoch": 6516} {"train_loss": -27.61573600769043, "global_step": 540880, "epoch": 6516} {"train_loss": -27.726581573486328, "global_step": 540881, "epoch": 6516} {"train_loss": -27.64947509765625, "global_step": 540882, "epoch": 6516} {"train_loss": -27.824542999267578, "global_step": 540883, "epoch": 6516} {"train_loss": -27.6054744720459, "global_step": 540884, "epoch": 6516} {"train_loss": -27.521100997924805, "global_step": 540885, "epoch": 6516} {"train_loss": -26.987674713134766, "global_step": 540886, "epoch": 6516} {"train_loss": -26.92136573791504, "global_step": 540887, "epoch": 6516} {"train_loss": -28.119375228881836, "global_step": 540888, "epoch": 6516} {"train_loss": -27.7291202545166, "global_step": 540889, "epoch": 6516} {"train_loss": -27.73075294494629, "global_step": 540890, "epoch": 6516} {"train_loss": -27.478118896484375, "global_step": 540891, "epoch": 6516} {"train_loss": -27.599609375, "global_step": 540892, "epoch": 6516} {"train_loss": -26.640756607055664, "global_step": 540893, "epoch": 6516} {"train_loss": -26.95680809020996, "global_step": 540894, "epoch": 6516} {"train_loss": -27.693439483642578, "global_step": 540895, "epoch": 6516} {"train_loss": -27.716726303100586, "global_step": 540896, "epoch": 6516} {"train_loss": -27.003625869750977, "global_step": 540897, "epoch": 6516} {"train_loss": -27.500707626342773, "global_step": 540898, "epoch": 6516} {"train_loss": -26.85107421875, "global_step": 540899, "epoch": 6516} {"train_loss": -27.443099975585938, "global_step": 540900, "epoch": 6516} {"train_loss": -27.491912841796875, "global_step": 540901, "epoch": 6516} {"train_loss": -27.104511260986328, "global_step": 540902, "epoch": 6516} {"train_loss": -27.380945205688477, "global_step": 540903, "epoch": 6516} {"train_loss": -27.07086753845215, "global_step": 540904, "epoch": 6516} {"train_loss": -27.5094051361084, "global_step": 540905, "epoch": 6516} {"train_loss": -27.300155639648438, "global_step": 540906, "epoch": 6516} {"train_loss": -27.295373916625977, "global_step": 540907, "epoch": 6516} {"train_loss": -27.62689208984375, "global_step": 540908, "epoch": 6516} {"train_loss": -27.519351959228516, "global_step": 540909, "epoch": 6516} {"train_loss": -27.53325464639319, "global_step": 540910, "epoch": 6516, "val_loss": 6469505.0} {"train_loss": -27.324161529541016, "global_step": 540911, "epoch": 6517} {"train_loss": -27.276037216186523, "global_step": 540912, "epoch": 6517} {"train_loss": -27.48040199279785, "global_step": 540913, "epoch": 6517} {"train_loss": -27.368383407592773, "global_step": 540914, "epoch": 6517} {"train_loss": -27.47810173034668, "global_step": 540915, "epoch": 6517} {"train_loss": -27.354764938354492, "global_step": 540916, "epoch": 6517} {"train_loss": -27.569156646728516, "global_step": 540917, "epoch": 6517} {"train_loss": -27.45005226135254, "global_step": 540918, "epoch": 6517} {"train_loss": -27.98956298828125, "global_step": 540919, "epoch": 6517} {"train_loss": -27.439056396484375, "global_step": 540920, "epoch": 6517} {"train_loss": -27.702423095703125, "global_step": 540921, "epoch": 6517} {"train_loss": -27.551870346069336, "global_step": 540922, "epoch": 6517} {"train_loss": -27.734628677368164, "global_step": 540923, "epoch": 6517} {"train_loss": -27.415164947509766, "global_step": 540924, "epoch": 6517} {"train_loss": -27.543432235717773, "global_step": 540925, "epoch": 6517} {"train_loss": -27.42633056640625, "global_step": 540926, "epoch": 6517} {"train_loss": -27.276636123657227, "global_step": 540927, "epoch": 6517} {"train_loss": -27.49968910217285, "global_step": 540928, "epoch": 6517} {"train_loss": -27.542682647705078, "global_step": 540929, "epoch": 6517} {"train_loss": -27.61529541015625, "global_step": 540930, "epoch": 6517} {"train_loss": -27.4349365234375, "global_step": 540931, "epoch": 6517} {"train_loss": -27.823780059814453, "global_step": 540932, "epoch": 6517} {"train_loss": -27.500091552734375, "global_step": 540933, "epoch": 6517} {"train_loss": -27.788333892822266, "global_step": 540934, "epoch": 6517} {"train_loss": -27.75355339050293, "global_step": 540935, "epoch": 6517} {"train_loss": -28.0474853515625, "global_step": 540936, "epoch": 6517} {"train_loss": -27.669095993041992, "global_step": 540937, "epoch": 6517} {"train_loss": -27.811304092407227, "global_step": 540938, "epoch": 6517} {"train_loss": -27.70472526550293, "global_step": 540939, "epoch": 6517} {"train_loss": -27.431339263916016, "global_step": 540940, "epoch": 6517} {"train_loss": -27.906476974487305, "global_step": 540941, "epoch": 6517} {"train_loss": -27.47621726989746, "global_step": 540942, "epoch": 6517} {"train_loss": -27.8991641998291, "global_step": 540943, "epoch": 6517} {"train_loss": -27.989532470703125, "global_step": 540944, "epoch": 6517} {"train_loss": -27.84235191345215, "global_step": 540945, "epoch": 6517} {"train_loss": -28.072406768798828, "global_step": 540946, "epoch": 6517} {"train_loss": -27.682056427001953, "global_step": 540947, "epoch": 6517} {"train_loss": -27.917333602905273, "global_step": 540948, "epoch": 6517} {"train_loss": -27.680200576782227, "global_step": 540949, "epoch": 6517} {"train_loss": -28.18622398376465, "global_step": 540950, "epoch": 6517} {"train_loss": -27.8940486907959, "global_step": 540951, "epoch": 6517} {"train_loss": -28.12598991394043, "global_step": 540952, "epoch": 6517} {"train_loss": -27.8010196685791, "global_step": 540953, "epoch": 6517} {"train_loss": -27.1518611907959, "global_step": 540954, "epoch": 6517} {"train_loss": -27.797727584838867, "global_step": 540955, "epoch": 6517} {"train_loss": -27.91065788269043, "global_step": 540956, "epoch": 6517} {"train_loss": -28.040271759033203, "global_step": 540957, "epoch": 6517} {"train_loss": -27.437911987304688, "global_step": 540958, "epoch": 6517} {"train_loss": -27.4221134185791, "global_step": 540959, "epoch": 6517} {"train_loss": -27.23954200744629, "global_step": 540960, "epoch": 6517} {"train_loss": -27.532629013061523, "global_step": 540961, "epoch": 6517} {"train_loss": -27.475568771362305, "global_step": 540962, "epoch": 6517} {"train_loss": -27.636138916015625, "global_step": 540963, "epoch": 6517} {"train_loss": -28.221139907836914, "global_step": 540964, "epoch": 6517} {"train_loss": -27.441022872924805, "global_step": 540965, "epoch": 6517} {"train_loss": -27.783191680908203, "global_step": 540966, "epoch": 6517} {"train_loss": -28.029499053955078, "global_step": 540967, "epoch": 6517} {"train_loss": -27.694501876831055, "global_step": 540968, "epoch": 6517} {"train_loss": -27.55814552307129, "global_step": 540969, "epoch": 6517} {"train_loss": -27.788434982299805, "global_step": 540970, "epoch": 6517} {"train_loss": -27.75611686706543, "global_step": 540971, "epoch": 6517} {"train_loss": -27.156036376953125, "global_step": 540972, "epoch": 6517} {"train_loss": -27.41880226135254, "global_step": 540973, "epoch": 6517} {"train_loss": -27.006574630737305, "global_step": 540974, "epoch": 6517} {"train_loss": -27.601675033569336, "global_step": 540975, "epoch": 6517} {"train_loss": -27.775304794311523, "global_step": 540976, "epoch": 6517} {"train_loss": -27.70612144470215, "global_step": 540977, "epoch": 6517} {"train_loss": -27.318283081054688, "global_step": 540978, "epoch": 6517} {"train_loss": -27.7191104888916, "global_step": 540979, "epoch": 6517} {"train_loss": -27.4599666595459, "global_step": 540980, "epoch": 6517} {"train_loss": -27.450489044189453, "global_step": 540981, "epoch": 6517} {"train_loss": -27.471969604492188, "global_step": 540982, "epoch": 6517} {"train_loss": -27.186832427978516, "global_step": 540983, "epoch": 6517} {"train_loss": -27.920446395874023, "global_step": 540984, "epoch": 6517} {"train_loss": -27.76780128479004, "global_step": 540985, "epoch": 6517} {"train_loss": -27.85523796081543, "global_step": 540986, "epoch": 6517} {"train_loss": -28.083539962768555, "global_step": 540987, "epoch": 6517} {"train_loss": -27.836353302001953, "global_step": 540988, "epoch": 6517} {"train_loss": -27.874408721923828, "global_step": 540989, "epoch": 6517} {"train_loss": -27.826007843017578, "global_step": 540990, "epoch": 6517} {"train_loss": -27.509002685546875, "global_step": 540991, "epoch": 6517} {"train_loss": -27.73969078063965, "global_step": 540992, "epoch": 6517} {"train_loss": -27.658781534217926, "global_step": 540993, "epoch": 6517, "val_loss": 6444991.0} {"train_loss": -27.17168617248535, "global_step": 540994, "epoch": 6518} {"train_loss": -27.499256134033203, "global_step": 540995, "epoch": 6518} {"train_loss": -26.9267578125, "global_step": 540996, "epoch": 6518} {"train_loss": -27.250263214111328, "global_step": 540997, "epoch": 6518} {"train_loss": -27.460851669311523, "global_step": 540998, "epoch": 6518} {"train_loss": -27.482202529907227, "global_step": 540999, "epoch": 6518} {"train_loss": -27.605255126953125, "global_step": 541000, "epoch": 6518} {"train_loss": -27.46796226501465, "global_step": 541001, "epoch": 6518} {"train_loss": -27.62166404724121, "global_step": 541002, "epoch": 6518} {"train_loss": -27.42034912109375, "global_step": 541003, "epoch": 6518} {"train_loss": -27.804773330688477, "global_step": 541004, "epoch": 6518} {"train_loss": -27.6054744720459, "global_step": 541005, "epoch": 6518} {"train_loss": -27.93794822692871, "global_step": 541006, "epoch": 6518} {"train_loss": -27.4952449798584, "global_step": 541007, "epoch": 6518} {"train_loss": -27.13030433654785, "global_step": 541008, "epoch": 6518} {"train_loss": -27.271961212158203, "global_step": 541009, "epoch": 6518} {"train_loss": -27.374347686767578, "global_step": 541010, "epoch": 6518} {"train_loss": -27.603958129882812, "global_step": 541011, "epoch": 6518} {"train_loss": -27.2988338470459, "global_step": 541012, "epoch": 6518} {"train_loss": -27.606155395507812, "global_step": 541013, "epoch": 6518} {"train_loss": -27.560535430908203, "global_step": 541014, "epoch": 6518} {"train_loss": -27.71454429626465, "global_step": 541015, "epoch": 6518} {"train_loss": -27.382587432861328, "global_step": 541016, "epoch": 6518} {"train_loss": -27.803937911987305, "global_step": 541017, "epoch": 6518} {"train_loss": -27.86321449279785, "global_step": 541018, "epoch": 6518} {"train_loss": -28.02715492248535, "global_step": 541019, "epoch": 6518} {"train_loss": -27.50235939025879, "global_step": 541020, "epoch": 6518} {"train_loss": -28.04060173034668, "global_step": 541021, "epoch": 6518} {"train_loss": -27.58216667175293, "global_step": 541022, "epoch": 6518} {"train_loss": -27.90266227722168, "global_step": 541023, "epoch": 6518} {"train_loss": -27.89754295349121, "global_step": 541024, "epoch": 6518} {"train_loss": -27.897680282592773, "global_step": 541025, "epoch": 6518} {"train_loss": -27.62925148010254, "global_step": 541026, "epoch": 6518} {"train_loss": -28.034605026245117, "global_step": 541027, "epoch": 6518} {"train_loss": -27.98966407775879, "global_step": 541028, "epoch": 6518} {"train_loss": -27.868085861206055, "global_step": 541029, "epoch": 6518} {"train_loss": -27.63811683654785, "global_step": 541030, "epoch": 6518} {"train_loss": -27.806676864624023, "global_step": 541031, "epoch": 6518} {"train_loss": -27.80720329284668, "global_step": 541032, "epoch": 6518} {"train_loss": -28.064462661743164, "global_step": 541033, "epoch": 6518} {"train_loss": -27.928258895874023, "global_step": 541034, "epoch": 6518} {"train_loss": -27.74995994567871, "global_step": 541035, "epoch": 6518} {"train_loss": -27.970703125, "global_step": 541036, "epoch": 6518} {"train_loss": -27.647958755493164, "global_step": 541037, "epoch": 6518} {"train_loss": -27.38673210144043, "global_step": 541038, "epoch": 6518} {"train_loss": -28.248199462890625, "global_step": 541039, "epoch": 6518} {"train_loss": -27.924341201782227, "global_step": 541040, "epoch": 6518} {"train_loss": -27.588165283203125, "global_step": 541041, "epoch": 6518} {"train_loss": -27.720382690429688, "global_step": 541042, "epoch": 6518} {"train_loss": -27.413694381713867, "global_step": 541043, "epoch": 6518} {"train_loss": -27.581151962280273, "global_step": 541044, "epoch": 6518} {"train_loss": -27.480093002319336, "global_step": 541045, "epoch": 6518} {"train_loss": -27.77980613708496, "global_step": 541046, "epoch": 6518} {"train_loss": -27.62041664123535, "global_step": 541047, "epoch": 6518} {"train_loss": -27.894317626953125, "global_step": 541048, "epoch": 6518} {"train_loss": -27.484373092651367, "global_step": 541049, "epoch": 6518} {"train_loss": -27.288549423217773, "global_step": 541050, "epoch": 6518} {"train_loss": -28.0124454498291, "global_step": 541051, "epoch": 6518} {"train_loss": -27.834247589111328, "global_step": 541052, "epoch": 6518} {"train_loss": -27.550058364868164, "global_step": 541053, "epoch": 6518} {"train_loss": -27.620508193969727, "global_step": 541054, "epoch": 6518} {"train_loss": -27.87017822265625, "global_step": 541055, "epoch": 6518} {"train_loss": -27.504186630249023, "global_step": 541056, "epoch": 6518} {"train_loss": -27.8231258392334, "global_step": 541057, "epoch": 6518} {"train_loss": -27.539703369140625, "global_step": 541058, "epoch": 6518} {"train_loss": -27.5235595703125, "global_step": 541059, "epoch": 6518} {"train_loss": -27.95810317993164, "global_step": 541060, "epoch": 6518} {"train_loss": -27.671045303344727, "global_step": 541061, "epoch": 6518} {"train_loss": -27.51837730407715, "global_step": 541062, "epoch": 6518} {"train_loss": -27.13226318359375, "global_step": 541063, "epoch": 6518} {"train_loss": -27.36832618713379, "global_step": 541064, "epoch": 6518} {"train_loss": -27.500268936157227, "global_step": 541065, "epoch": 6518} {"train_loss": -27.496789932250977, "global_step": 541066, "epoch": 6518} {"train_loss": -27.454238891601562, "global_step": 541067, "epoch": 6518} {"train_loss": -27.48870849609375, "global_step": 541068, "epoch": 6518} {"train_loss": -27.424774169921875, "global_step": 541069, "epoch": 6518} {"train_loss": -27.4763126373291, "global_step": 541070, "epoch": 6518} {"train_loss": -27.66460609436035, "global_step": 541071, "epoch": 6518} {"train_loss": -27.77021598815918, "global_step": 541072, "epoch": 6518} {"train_loss": -27.595422744750977, "global_step": 541073, "epoch": 6518} {"train_loss": -26.734272003173828, "global_step": 541074, "epoch": 6518} {"train_loss": -27.61492347717285, "global_step": 541075, "epoch": 6518} {"train_loss": -27.614354282976635, "global_step": 541076, "epoch": 6518, "val_loss": 6389043.0} {"train_loss": -26.818078994750977, "global_step": 541077, "epoch": 6519} {"train_loss": -27.10233497619629, "global_step": 541078, "epoch": 6519} {"train_loss": -27.41302490234375, "global_step": 541079, "epoch": 6519} {"train_loss": -26.91936683654785, "global_step": 541080, "epoch": 6519} {"train_loss": -27.46900749206543, "global_step": 541081, "epoch": 6519} {"train_loss": -27.011762619018555, "global_step": 541082, "epoch": 6519} {"train_loss": -26.9638729095459, "global_step": 541083, "epoch": 6519} {"train_loss": -27.08966636657715, "global_step": 541084, "epoch": 6519} {"train_loss": -27.35186767578125, "global_step": 541085, "epoch": 6519} {"train_loss": -27.1814022064209, "global_step": 541086, "epoch": 6519} {"train_loss": -27.01264762878418, "global_step": 541087, "epoch": 6519} {"train_loss": -27.325361251831055, "global_step": 541088, "epoch": 6519} {"train_loss": -27.18036460876465, "global_step": 541089, "epoch": 6519} {"train_loss": -27.25006103515625, "global_step": 541090, "epoch": 6519} {"train_loss": -27.113534927368164, "global_step": 541091, "epoch": 6519} {"train_loss": -27.255468368530273, "global_step": 541092, "epoch": 6519} {"train_loss": -27.774829864501953, "global_step": 541093, "epoch": 6519} {"train_loss": -27.2465763092041, "global_step": 541094, "epoch": 6519} {"train_loss": -27.734655380249023, "global_step": 541095, "epoch": 6519} {"train_loss": -27.5426025390625, "global_step": 541096, "epoch": 6519} {"train_loss": -27.99833106994629, "global_step": 541097, "epoch": 6519} {"train_loss": -27.433897018432617, "global_step": 541098, "epoch": 6519} {"train_loss": -27.745105743408203, "global_step": 541099, "epoch": 6519} {"train_loss": -27.4105281829834, "global_step": 541100, "epoch": 6519} {"train_loss": -27.704626083374023, "global_step": 541101, "epoch": 6519} {"train_loss": -27.760028839111328, "global_step": 541102, "epoch": 6519} {"train_loss": -27.703222274780273, "global_step": 541103, "epoch": 6519} {"train_loss": -27.833948135375977, "global_step": 541104, "epoch": 6519} {"train_loss": -27.596149444580078, "global_step": 541105, "epoch": 6519} {"train_loss": -27.874814987182617, "global_step": 541106, "epoch": 6519} {"train_loss": -27.60138511657715, "global_step": 541107, "epoch": 6519} {"train_loss": -27.671045303344727, "global_step": 541108, "epoch": 6519} {"train_loss": -27.69892692565918, "global_step": 541109, "epoch": 6519} {"train_loss": -27.42511558532715, "global_step": 541110, "epoch": 6519} {"train_loss": -27.775222778320312, "global_step": 541111, "epoch": 6519} {"train_loss": -27.883615493774414, "global_step": 541112, "epoch": 6519} {"train_loss": -27.742273330688477, "global_step": 541113, "epoch": 6519} {"train_loss": -28.23076820373535, "global_step": 541114, "epoch": 6519} {"train_loss": -27.822345733642578, "global_step": 541115, "epoch": 6519} {"train_loss": -27.770605087280273, "global_step": 541116, "epoch": 6519} {"train_loss": -27.974536895751953, "global_step": 541117, "epoch": 6519} {"train_loss": -27.642114639282227, "global_step": 541118, "epoch": 6519} {"train_loss": -27.44562339782715, "global_step": 541119, "epoch": 6519} {"train_loss": -27.7493896484375, "global_step": 541120, "epoch": 6519} {"train_loss": -27.731094360351562, "global_step": 541121, "epoch": 6519} {"train_loss": -28.045316696166992, "global_step": 541122, "epoch": 6519} {"train_loss": -27.765735626220703, "global_step": 541123, "epoch": 6519} {"train_loss": -27.898712158203125, "global_step": 541124, "epoch": 6519} {"train_loss": -27.967151641845703, "global_step": 541125, "epoch": 6519} {"train_loss": -27.73524284362793, "global_step": 541126, "epoch": 6519} {"train_loss": -27.809600830078125, "global_step": 541127, "epoch": 6519} {"train_loss": -27.790679931640625, "global_step": 541128, "epoch": 6519} {"train_loss": -27.63877296447754, "global_step": 541129, "epoch": 6519} {"train_loss": -27.264142990112305, "global_step": 541130, "epoch": 6519} {"train_loss": -26.689481735229492, "global_step": 541131, "epoch": 6519} {"train_loss": -26.600290298461914, "global_step": 541132, "epoch": 6519} {"train_loss": -27.3649959564209, "global_step": 541133, "epoch": 6519} {"train_loss": -27.802961349487305, "global_step": 541134, "epoch": 6519} {"train_loss": -27.426040649414062, "global_step": 541135, "epoch": 6519} {"train_loss": -27.363101959228516, "global_step": 541136, "epoch": 6519} {"train_loss": -28.0523738861084, "global_step": 541137, "epoch": 6519} {"train_loss": -27.371997833251953, "global_step": 541138, "epoch": 6519} {"train_loss": -27.790739059448242, "global_step": 541139, "epoch": 6519} {"train_loss": -27.924442291259766, "global_step": 541140, "epoch": 6519} {"train_loss": -27.70830726623535, "global_step": 541141, "epoch": 6519} {"train_loss": -27.8726749420166, "global_step": 541142, "epoch": 6519} {"train_loss": -27.888202667236328, "global_step": 541143, "epoch": 6519} {"train_loss": -27.310657501220703, "global_step": 541144, "epoch": 6519} {"train_loss": -27.84590721130371, "global_step": 541145, "epoch": 6519} {"train_loss": -27.662023544311523, "global_step": 541146, "epoch": 6519} {"train_loss": -27.912723541259766, "global_step": 541147, "epoch": 6519} {"train_loss": -27.68267250061035, "global_step": 541148, "epoch": 6519} {"train_loss": -28.016143798828125, "global_step": 541149, "epoch": 6519} {"train_loss": -27.714496612548828, "global_step": 541150, "epoch": 6519} {"train_loss": -27.718597412109375, "global_step": 541151, "epoch": 6519} {"train_loss": -27.5030517578125, "global_step": 541152, "epoch": 6519} {"train_loss": -27.69179344177246, "global_step": 541153, "epoch": 6519} {"train_loss": -27.502893447875977, "global_step": 541154, "epoch": 6519} {"train_loss": -28.072479248046875, "global_step": 541155, "epoch": 6519} {"train_loss": -27.714475631713867, "global_step": 541156, "epoch": 6519} {"train_loss": -27.70577049255371, "global_step": 541157, "epoch": 6519} {"train_loss": -27.524694442749023, "global_step": 541158, "epoch": 6519} {"train_loss": -27.605040630662298, "global_step": 541159, "epoch": 6519, "val_loss": 6343331.5} {"train_loss": -27.143152236938477, "global_step": 541160, "epoch": 6520} {"train_loss": -26.466135025024414, "global_step": 541161, "epoch": 6520} {"train_loss": -26.91077995300293, "global_step": 541162, "epoch": 6520} {"train_loss": -27.569263458251953, "global_step": 541163, "epoch": 6520} {"train_loss": -26.53696060180664, "global_step": 541164, "epoch": 6520} {"train_loss": -26.799726486206055, "global_step": 541165, "epoch": 6520} {"train_loss": -26.273975372314453, "global_step": 541166, "epoch": 6520} {"train_loss": -26.981958389282227, "global_step": 541167, "epoch": 6520} {"train_loss": -26.85576820373535, "global_step": 541168, "epoch": 6520} {"train_loss": -26.90390968322754, "global_step": 541169, "epoch": 6520} {"train_loss": -26.826007843017578, "global_step": 541170, "epoch": 6520} {"train_loss": -27.685285568237305, "global_step": 541171, "epoch": 6520} {"train_loss": -27.033832550048828, "global_step": 541172, "epoch": 6520} {"train_loss": -27.718347549438477, "global_step": 541173, "epoch": 6520} {"train_loss": -27.6981258392334, "global_step": 541174, "epoch": 6520} {"train_loss": -27.256195068359375, "global_step": 541175, "epoch": 6520} {"train_loss": -27.716604232788086, "global_step": 541176, "epoch": 6520} {"train_loss": -27.408674240112305, "global_step": 541177, "epoch": 6520} {"train_loss": -27.616514205932617, "global_step": 541178, "epoch": 6520} {"train_loss": -27.5352840423584, "global_step": 541179, "epoch": 6520} {"train_loss": -27.7176513671875, "global_step": 541180, "epoch": 6520} {"train_loss": -27.4935245513916, "global_step": 541181, "epoch": 6520} {"train_loss": -27.4094181060791, "global_step": 541182, "epoch": 6520} {"train_loss": -27.926000595092773, "global_step": 541183, "epoch": 6520} {"train_loss": -27.432111740112305, "global_step": 541184, "epoch": 6520} {"train_loss": -27.778629302978516, "global_step": 541185, "epoch": 6520} {"train_loss": -27.88083267211914, "global_step": 541186, "epoch": 6520} {"train_loss": -27.939258575439453, "global_step": 541187, "epoch": 6520} {"train_loss": -27.825592041015625, "global_step": 541188, "epoch": 6520} {"train_loss": -27.846012115478516, "global_step": 541189, "epoch": 6520} {"train_loss": -27.591827392578125, "global_step": 541190, "epoch": 6520} {"train_loss": -27.731252670288086, "global_step": 541191, "epoch": 6520} {"train_loss": -28.099796295166016, "global_step": 541192, "epoch": 6520} {"train_loss": -27.806604385375977, "global_step": 541193, "epoch": 6520} {"train_loss": -27.871973037719727, "global_step": 541194, "epoch": 6520} {"train_loss": -27.600072860717773, "global_step": 541195, "epoch": 6520} {"train_loss": -28.226852416992188, "global_step": 541196, "epoch": 6520} {"train_loss": -28.235864639282227, "global_step": 541197, "epoch": 6520} {"train_loss": -27.597116470336914, "global_step": 541198, "epoch": 6520} {"train_loss": -27.678049087524414, "global_step": 541199, "epoch": 6520} {"train_loss": -27.81586265563965, "global_step": 541200, "epoch": 6520} {"train_loss": -27.61756706237793, "global_step": 541201, "epoch": 6520} {"train_loss": -27.435657501220703, "global_step": 541202, "epoch": 6520} {"train_loss": -27.06365394592285, "global_step": 541203, "epoch": 6520} {"train_loss": -27.22842788696289, "global_step": 541204, "epoch": 6520} {"train_loss": -27.369367599487305, "global_step": 541205, "epoch": 6520} {"train_loss": -28.0324764251709, "global_step": 541206, "epoch": 6520} {"train_loss": -27.39080810546875, "global_step": 541207, "epoch": 6520} {"train_loss": -27.758275985717773, "global_step": 541208, "epoch": 6520} {"train_loss": -27.26009178161621, "global_step": 541209, "epoch": 6520} {"train_loss": -27.92608642578125, "global_step": 541210, "epoch": 6520} {"train_loss": -28.05253028869629, "global_step": 541211, "epoch": 6520} {"train_loss": -27.612573623657227, "global_step": 541212, "epoch": 6520} {"train_loss": -27.786725997924805, "global_step": 541213, "epoch": 6520} {"train_loss": -27.744924545288086, "global_step": 541214, "epoch": 6520} {"train_loss": -27.55316162109375, "global_step": 541215, "epoch": 6520} {"train_loss": -27.517871856689453, "global_step": 541216, "epoch": 6520} {"train_loss": -27.985248565673828, "global_step": 541217, "epoch": 6520} {"train_loss": -28.031003952026367, "global_step": 541218, "epoch": 6520} {"train_loss": -27.54244041442871, "global_step": 541219, "epoch": 6520} {"train_loss": -27.98041343688965, "global_step": 541220, "epoch": 6520} {"train_loss": -28.199079513549805, "global_step": 541221, "epoch": 6520} {"train_loss": -27.864383697509766, "global_step": 541222, "epoch": 6520} {"train_loss": -27.55314064025879, "global_step": 541223, "epoch": 6520} {"train_loss": -27.858991622924805, "global_step": 541224, "epoch": 6520} {"train_loss": -27.596439361572266, "global_step": 541225, "epoch": 6520} {"train_loss": -27.46693992614746, "global_step": 541226, "epoch": 6520} {"train_loss": -27.204700469970703, "global_step": 541227, "epoch": 6520} {"train_loss": -27.74371910095215, "global_step": 541228, "epoch": 6520} {"train_loss": -27.56448745727539, "global_step": 541229, "epoch": 6520} {"train_loss": -27.421091079711914, "global_step": 541230, "epoch": 6520} {"train_loss": -27.286359786987305, "global_step": 541231, "epoch": 6520} {"train_loss": -26.884382247924805, "global_step": 541232, "epoch": 6520} {"train_loss": -27.24957275390625, "global_step": 541233, "epoch": 6520} {"train_loss": -27.47002601623535, "global_step": 541234, "epoch": 6520} {"train_loss": -27.769962310791016, "global_step": 541235, "epoch": 6520} {"train_loss": -27.50038719177246, "global_step": 541236, "epoch": 6520} {"train_loss": -27.52947998046875, "global_step": 541237, "epoch": 6520} {"train_loss": -27.46213150024414, "global_step": 541238, "epoch": 6520} {"train_loss": -27.8189640045166, "global_step": 541239, "epoch": 6520} {"train_loss": -27.887908935546875, "global_step": 541240, "epoch": 6520} {"train_loss": -27.371732711791992, "global_step": 541241, "epoch": 6520} {"train_loss": -27.524858635592174, "global_step": 541242, "epoch": 6520, "val_loss": 6490723.0} {"train_loss": -27.372085571289062, "global_step": 541243, "epoch": 6521} {"train_loss": -27.46930503845215, "global_step": 541244, "epoch": 6521} {"train_loss": -27.079181671142578, "global_step": 541245, "epoch": 6521} {"train_loss": -26.923694610595703, "global_step": 541246, "epoch": 6521} {"train_loss": -27.2182674407959, "global_step": 541247, "epoch": 6521} {"train_loss": -27.41269874572754, "global_step": 541248, "epoch": 6521} {"train_loss": -26.678150177001953, "global_step": 541249, "epoch": 6521} {"train_loss": -27.123891830444336, "global_step": 541250, "epoch": 6521} {"train_loss": -26.92803955078125, "global_step": 541251, "epoch": 6521} {"train_loss": -27.394575119018555, "global_step": 541252, "epoch": 6521} {"train_loss": -27.106952667236328, "global_step": 541253, "epoch": 6521} {"train_loss": -27.184539794921875, "global_step": 541254, "epoch": 6521} {"train_loss": -27.868854522705078, "global_step": 541255, "epoch": 6521} {"train_loss": -27.663049697875977, "global_step": 541256, "epoch": 6521} {"train_loss": -27.626529693603516, "global_step": 541257, "epoch": 6521} {"train_loss": -27.209753036499023, "global_step": 541258, "epoch": 6521} {"train_loss": -27.51410484313965, "global_step": 541259, "epoch": 6521} {"train_loss": -27.007354736328125, "global_step": 541260, "epoch": 6521} {"train_loss": -27.455215454101562, "global_step": 541261, "epoch": 6521} {"train_loss": -27.404890060424805, "global_step": 541262, "epoch": 6521} {"train_loss": -27.75044059753418, "global_step": 541263, "epoch": 6521} {"train_loss": -27.429380416870117, "global_step": 541264, "epoch": 6521} {"train_loss": -27.610105514526367, "global_step": 541265, "epoch": 6521} {"train_loss": -27.798908233642578, "global_step": 541266, "epoch": 6521} {"train_loss": -27.371564865112305, "global_step": 541267, "epoch": 6521} {"train_loss": -27.58683204650879, "global_step": 541268, "epoch": 6521} {"train_loss": -27.507612228393555, "global_step": 541269, "epoch": 6521} {"train_loss": -27.599164962768555, "global_step": 541270, "epoch": 6521} {"train_loss": -27.79010581970215, "global_step": 541271, "epoch": 6521} {"train_loss": -27.77223777770996, "global_step": 541272, "epoch": 6521} {"train_loss": -27.44089126586914, "global_step": 541273, "epoch": 6521} {"train_loss": -27.23878288269043, "global_step": 541274, "epoch": 6521} {"train_loss": -27.416309356689453, "global_step": 541275, "epoch": 6521} {"train_loss": -27.435810089111328, "global_step": 541276, "epoch": 6521} {"train_loss": -27.6844539642334, "global_step": 541277, "epoch": 6521} {"train_loss": -27.69183921813965, "global_step": 541278, "epoch": 6521} {"train_loss": -28.071287155151367, "global_step": 541279, "epoch": 6521} {"train_loss": -27.832611083984375, "global_step": 541280, "epoch": 6521} {"train_loss": -27.802209854125977, "global_step": 541281, "epoch": 6521} {"train_loss": -28.001953125, "global_step": 541282, "epoch": 6521} {"train_loss": -27.78590202331543, "global_step": 541283, "epoch": 6521} {"train_loss": -27.69475746154785, "global_step": 541284, "epoch": 6521} {"train_loss": -27.8419246673584, "global_step": 541285, "epoch": 6521} {"train_loss": -27.762561798095703, "global_step": 541286, "epoch": 6521} {"train_loss": -27.654556274414062, "global_step": 541287, "epoch": 6521} {"train_loss": -27.78472328186035, "global_step": 541288, "epoch": 6521} {"train_loss": -27.542810440063477, "global_step": 541289, "epoch": 6521} {"train_loss": -27.862197875976562, "global_step": 541290, "epoch": 6521} {"train_loss": -27.676904678344727, "global_step": 541291, "epoch": 6521} {"train_loss": -27.499378204345703, "global_step": 541292, "epoch": 6521} {"train_loss": -27.546192169189453, "global_step": 541293, "epoch": 6521} {"train_loss": -27.80994987487793, "global_step": 541294, "epoch": 6521} {"train_loss": -28.078479766845703, "global_step": 541295, "epoch": 6521} {"train_loss": -28.237945556640625, "global_step": 541296, "epoch": 6521} {"train_loss": -27.83942985534668, "global_step": 541297, "epoch": 6521} {"train_loss": -27.908666610717773, "global_step": 541298, "epoch": 6521} {"train_loss": -27.9925537109375, "global_step": 541299, "epoch": 6521} {"train_loss": -27.945175170898438, "global_step": 541300, "epoch": 6521} {"train_loss": -27.893692016601562, "global_step": 541301, "epoch": 6521} {"train_loss": -28.242828369140625, "global_step": 541302, "epoch": 6521} {"train_loss": -28.09222984313965, "global_step": 541303, "epoch": 6521} {"train_loss": -27.334142684936523, "global_step": 541304, "epoch": 6521} {"train_loss": -27.601037979125977, "global_step": 541305, "epoch": 6521} {"train_loss": -27.416772842407227, "global_step": 541306, "epoch": 6521} {"train_loss": -27.26824951171875, "global_step": 541307, "epoch": 6521} {"train_loss": -26.60377311706543, "global_step": 541308, "epoch": 6521} {"train_loss": -26.272964477539062, "global_step": 541309, "epoch": 6521} {"train_loss": -25.98853874206543, "global_step": 541310, "epoch": 6521} {"train_loss": -27.531787872314453, "global_step": 541311, "epoch": 6521} {"train_loss": -26.38136100769043, "global_step": 541312, "epoch": 6521} {"train_loss": -26.68830680847168, "global_step": 541313, "epoch": 6521} {"train_loss": -27.613433837890625, "global_step": 541314, "epoch": 6521} {"train_loss": -27.27010154724121, "global_step": 541315, "epoch": 6521} {"train_loss": -27.04217529296875, "global_step": 541316, "epoch": 6521} {"train_loss": -27.633188247680664, "global_step": 541317, "epoch": 6521} {"train_loss": -26.978559494018555, "global_step": 541318, "epoch": 6521} {"train_loss": -27.17860221862793, "global_step": 541319, "epoch": 6521} {"train_loss": -26.821481704711914, "global_step": 541320, "epoch": 6521} {"train_loss": -27.161487579345703, "global_step": 541321, "epoch": 6521} {"train_loss": -27.292236328125, "global_step": 541322, "epoch": 6521} {"train_loss": -27.468830108642578, "global_step": 541323, "epoch": 6521} {"train_loss": -27.641300201416016, "global_step": 541324, "epoch": 6521} {"train_loss": -27.46642882565418, "global_step": 541325, "epoch": 6521, "val_loss": 6418017.0} {"train_loss": -27.12458610534668, "global_step": 541326, "epoch": 6522} {"train_loss": -26.742694854736328, "global_step": 541327, "epoch": 6522} {"train_loss": -27.086790084838867, "global_step": 541328, "epoch": 6522} {"train_loss": -26.909809112548828, "global_step": 541329, "epoch": 6522} {"train_loss": -27.15531349182129, "global_step": 541330, "epoch": 6522} {"train_loss": -26.913043975830078, "global_step": 541331, "epoch": 6522} {"train_loss": -26.7211971282959, "global_step": 541332, "epoch": 6522} {"train_loss": -26.974035263061523, "global_step": 541333, "epoch": 6522} {"train_loss": -27.314966201782227, "global_step": 541334, "epoch": 6522} {"train_loss": -27.318561553955078, "global_step": 541335, "epoch": 6522} {"train_loss": -27.29688835144043, "global_step": 541336, "epoch": 6522} {"train_loss": -27.00959587097168, "global_step": 541337, "epoch": 6522} {"train_loss": -27.449268341064453, "global_step": 541338, "epoch": 6522} {"train_loss": -26.997333526611328, "global_step": 541339, "epoch": 6522} {"train_loss": -27.29902458190918, "global_step": 541340, "epoch": 6522} {"train_loss": -27.083160400390625, "global_step": 541341, "epoch": 6522} {"train_loss": -27.300800323486328, "global_step": 541342, "epoch": 6522} {"train_loss": -27.486846923828125, "global_step": 541343, "epoch": 6522} {"train_loss": -27.2990779876709, "global_step": 541344, "epoch": 6522} {"train_loss": -27.736902236938477, "global_step": 541345, "epoch": 6522} {"train_loss": -27.507360458374023, "global_step": 541346, "epoch": 6522} {"train_loss": -27.552566528320312, "global_step": 541347, "epoch": 6522} {"train_loss": -27.84791374206543, "global_step": 541348, "epoch": 6522} {"train_loss": -27.32154655456543, "global_step": 541349, "epoch": 6522} {"train_loss": -27.613555908203125, "global_step": 541350, "epoch": 6522} {"train_loss": -27.725845336914062, "global_step": 541351, "epoch": 6522} {"train_loss": -27.528018951416016, "global_step": 541352, "epoch": 6522} {"train_loss": -27.715335845947266, "global_step": 541353, "epoch": 6522} {"train_loss": -27.640226364135742, "global_step": 541354, "epoch": 6522} {"train_loss": -27.67207145690918, "global_step": 541355, "epoch": 6522} {"train_loss": -27.678821563720703, "global_step": 541356, "epoch": 6522} {"train_loss": -27.927509307861328, "global_step": 541357, "epoch": 6522} {"train_loss": -27.36216163635254, "global_step": 541358, "epoch": 6522} {"train_loss": -27.9113712310791, "global_step": 541359, "epoch": 6522} {"train_loss": -27.749713897705078, "global_step": 541360, "epoch": 6522} {"train_loss": -27.945205688476562, "global_step": 541361, "epoch": 6522} {"train_loss": -27.65777587890625, "global_step": 541362, "epoch": 6522} {"train_loss": -28.31121826171875, "global_step": 541363, "epoch": 6522} {"train_loss": -27.636398315429688, "global_step": 541364, "epoch": 6522} {"train_loss": -27.432790756225586, "global_step": 541365, "epoch": 6522} {"train_loss": -27.3729190826416, "global_step": 541366, "epoch": 6522} {"train_loss": -27.94447135925293, "global_step": 541367, "epoch": 6522} {"train_loss": -27.752405166625977, "global_step": 541368, "epoch": 6522} {"train_loss": -27.957916259765625, "global_step": 541369, "epoch": 6522} {"train_loss": -27.90973472595215, "global_step": 541370, "epoch": 6522} {"train_loss": -27.73699951171875, "global_step": 541371, "epoch": 6522} {"train_loss": -27.899810791015625, "global_step": 541372, "epoch": 6522} {"train_loss": -28.010406494140625, "global_step": 541373, "epoch": 6522} {"train_loss": -28.00375747680664, "global_step": 541374, "epoch": 6522} {"train_loss": -27.89661979675293, "global_step": 541375, "epoch": 6522} {"train_loss": -27.966400146484375, "global_step": 541376, "epoch": 6522} {"train_loss": -27.651525497436523, "global_step": 541377, "epoch": 6522} {"train_loss": -27.67439079284668, "global_step": 541378, "epoch": 6522} {"train_loss": -27.936132431030273, "global_step": 541379, "epoch": 6522} {"train_loss": -27.928274154663086, "global_step": 541380, "epoch": 6522} {"train_loss": -27.747058868408203, "global_step": 541381, "epoch": 6522} {"train_loss": -27.77847671508789, "global_step": 541382, "epoch": 6522} {"train_loss": -27.845535278320312, "global_step": 541383, "epoch": 6522} {"train_loss": -27.6372013092041, "global_step": 541384, "epoch": 6522} {"train_loss": -28.080286026000977, "global_step": 541385, "epoch": 6522} {"train_loss": -28.024982452392578, "global_step": 541386, "epoch": 6522} {"train_loss": -28.0429630279541, "global_step": 541387, "epoch": 6522} {"train_loss": -27.912668228149414, "global_step": 541388, "epoch": 6522} {"train_loss": -27.801794052124023, "global_step": 541389, "epoch": 6522} {"train_loss": -27.92677116394043, "global_step": 541390, "epoch": 6522} {"train_loss": -28.016626358032227, "global_step": 541391, "epoch": 6522} {"train_loss": -27.67302894592285, "global_step": 541392, "epoch": 6522} {"train_loss": -28.017751693725586, "global_step": 541393, "epoch": 6522} {"train_loss": -27.631811141967773, "global_step": 541394, "epoch": 6522} {"train_loss": -27.91852378845215, "global_step": 541395, "epoch": 6522} {"train_loss": -28.2255916595459, "global_step": 541396, "epoch": 6522} {"train_loss": -27.94742774963379, "global_step": 541397, "epoch": 6522} {"train_loss": -28.071640014648438, "global_step": 541398, "epoch": 6522} {"train_loss": -28.02777671813965, "global_step": 541399, "epoch": 6522} {"train_loss": -27.989593505859375, "global_step": 541400, "epoch": 6522} {"train_loss": -27.790403366088867, "global_step": 541401, "epoch": 6522} {"train_loss": -27.6522159576416, "global_step": 541402, "epoch": 6522} {"train_loss": -27.906375885009766, "global_step": 541403, "epoch": 6522} {"train_loss": -27.5327205657959, "global_step": 541404, "epoch": 6522} {"train_loss": -27.70730972290039, "global_step": 541405, "epoch": 6522} {"train_loss": -27.26618003845215, "global_step": 541406, "epoch": 6522} {"train_loss": -27.83430290222168, "global_step": 541407, "epoch": 6522} {"train_loss": -27.643775526299535, "global_step": 541408, "epoch": 6522, "val_loss": 6503442.0} {"train_loss": -27.650854110717773, "global_step": 541409, "epoch": 6523} {"train_loss": -27.11248779296875, "global_step": 541410, "epoch": 6523} {"train_loss": -26.615325927734375, "global_step": 541411, "epoch": 6523} {"train_loss": -26.32123374938965, "global_step": 541412, "epoch": 6523} {"train_loss": -26.937305450439453, "global_step": 541413, "epoch": 6523} {"train_loss": -27.17731285095215, "global_step": 541414, "epoch": 6523} {"train_loss": -27.11421775817871, "global_step": 541415, "epoch": 6523} {"train_loss": -26.845117568969727, "global_step": 541416, "epoch": 6523} {"train_loss": -26.897424697875977, "global_step": 541417, "epoch": 6523} {"train_loss": -27.042285919189453, "global_step": 541418, "epoch": 6523} {"train_loss": -26.626657485961914, "global_step": 541419, "epoch": 6523} {"train_loss": -26.981231689453125, "global_step": 541420, "epoch": 6523} {"train_loss": -27.36490249633789, "global_step": 541421, "epoch": 6523} {"train_loss": -27.28927993774414, "global_step": 541422, "epoch": 6523} {"train_loss": -27.541458129882812, "global_step": 541423, "epoch": 6523} {"train_loss": -27.0343017578125, "global_step": 541424, "epoch": 6523} {"train_loss": -27.08980369567871, "global_step": 541425, "epoch": 6523} {"train_loss": -27.2836856842041, "global_step": 541426, "epoch": 6523} {"train_loss": -27.171594619750977, "global_step": 541427, "epoch": 6523} {"train_loss": -27.23505210876465, "global_step": 541428, "epoch": 6523} {"train_loss": -27.473224639892578, "global_step": 541429, "epoch": 6523} {"train_loss": -27.17032814025879, "global_step": 541430, "epoch": 6523} {"train_loss": -27.347930908203125, "global_step": 541431, "epoch": 6523} {"train_loss": -27.365020751953125, "global_step": 541432, "epoch": 6523} {"train_loss": -27.3387508392334, "global_step": 541433, "epoch": 6523} {"train_loss": -27.16837501525879, "global_step": 541434, "epoch": 6523} {"train_loss": -27.792455673217773, "global_step": 541435, "epoch": 6523} {"train_loss": -27.525558471679688, "global_step": 541436, "epoch": 6523} {"train_loss": -27.7315731048584, "global_step": 541437, "epoch": 6523} {"train_loss": -27.53504753112793, "global_step": 541438, "epoch": 6523} {"train_loss": -27.74326515197754, "global_step": 541439, "epoch": 6523} {"train_loss": -27.476978302001953, "global_step": 541440, "epoch": 6523} {"train_loss": -27.721012115478516, "global_step": 541441, "epoch": 6523} {"train_loss": -27.526548385620117, "global_step": 541442, "epoch": 6523} {"train_loss": -27.512964248657227, "global_step": 541443, "epoch": 6523} {"train_loss": -27.8272705078125, "global_step": 541444, "epoch": 6523} {"train_loss": -27.88129234313965, "global_step": 541445, "epoch": 6523} {"train_loss": -27.404653549194336, "global_step": 541446, "epoch": 6523} {"train_loss": -27.9948787689209, "global_step": 541447, "epoch": 6523} {"train_loss": -28.07269859313965, "global_step": 541448, "epoch": 6523} {"train_loss": -28.01247215270996, "global_step": 541449, "epoch": 6523} {"train_loss": -27.388595581054688, "global_step": 541450, "epoch": 6523} {"train_loss": -27.824909210205078, "global_step": 541451, "epoch": 6523} {"train_loss": -27.575605392456055, "global_step": 541452, "epoch": 6523} {"train_loss": -27.81571388244629, "global_step": 541453, "epoch": 6523} {"train_loss": -27.866418838500977, "global_step": 541454, "epoch": 6523} {"train_loss": -27.754989624023438, "global_step": 541455, "epoch": 6523} {"train_loss": -27.86919593811035, "global_step": 541456, "epoch": 6523} {"train_loss": -27.890106201171875, "global_step": 541457, "epoch": 6523} {"train_loss": -27.860034942626953, "global_step": 541458, "epoch": 6523} {"train_loss": -27.86337661743164, "global_step": 541459, "epoch": 6523} {"train_loss": -27.626678466796875, "global_step": 541460, "epoch": 6523} {"train_loss": -28.272916793823242, "global_step": 541461, "epoch": 6523} {"train_loss": -27.935394287109375, "global_step": 541462, "epoch": 6523} {"train_loss": -27.142868041992188, "global_step": 541463, "epoch": 6523} {"train_loss": -27.867340087890625, "global_step": 541464, "epoch": 6523} {"train_loss": -27.778894424438477, "global_step": 541465, "epoch": 6523} {"train_loss": -28.004077911376953, "global_step": 541466, "epoch": 6523} {"train_loss": -27.814529418945312, "global_step": 541467, "epoch": 6523} {"train_loss": -27.919462203979492, "global_step": 541468, "epoch": 6523} {"train_loss": -27.689346313476562, "global_step": 541469, "epoch": 6523} {"train_loss": -28.02811050415039, "global_step": 541470, "epoch": 6523} {"train_loss": -27.810287475585938, "global_step": 541471, "epoch": 6523} {"train_loss": -28.130374908447266, "global_step": 541472, "epoch": 6523} {"train_loss": -27.8435001373291, "global_step": 541473, "epoch": 6523} {"train_loss": -27.845474243164062, "global_step": 541474, "epoch": 6523} {"train_loss": -27.908924102783203, "global_step": 541475, "epoch": 6523} {"train_loss": -27.459787368774414, "global_step": 541476, "epoch": 6523} {"train_loss": -27.1474552154541, "global_step": 541477, "epoch": 6523} {"train_loss": -26.732858657836914, "global_step": 541478, "epoch": 6523} {"train_loss": -26.205631256103516, "global_step": 541479, "epoch": 6523} {"train_loss": -26.63129997253418, "global_step": 541480, "epoch": 6523} {"train_loss": -27.03883171081543, "global_step": 541481, "epoch": 6523} {"train_loss": -27.415063858032227, "global_step": 541482, "epoch": 6523} {"train_loss": -26.71681022644043, "global_step": 541483, "epoch": 6523} {"train_loss": -27.505908966064453, "global_step": 541484, "epoch": 6523} {"train_loss": -27.896142959594727, "global_step": 541485, "epoch": 6523} {"train_loss": -27.342609405517578, "global_step": 541486, "epoch": 6523} {"train_loss": -27.391986846923828, "global_step": 541487, "epoch": 6523} {"train_loss": -27.322265625, "global_step": 541488, "epoch": 6523} {"train_loss": -27.34541130065918, "global_step": 541489, "epoch": 6523} {"train_loss": -27.60821533203125, "global_step": 541490, "epoch": 6523} {"train_loss": -27.462520323603986, "global_step": 541491, "epoch": 6523, "val_loss": 6454701.0} {"train_loss": -24.561504364013672, "global_step": 541492, "epoch": 6524} {"train_loss": -23.40711784362793, "global_step": 541493, "epoch": 6524} {"train_loss": -27.005664825439453, "global_step": 541494, "epoch": 6524} {"train_loss": -26.475187301635742, "global_step": 541495, "epoch": 6524} {"train_loss": -26.422048568725586, "global_step": 541496, "epoch": 6524} {"train_loss": -26.51759147644043, "global_step": 541497, "epoch": 6524} {"train_loss": -26.5140438079834, "global_step": 541498, "epoch": 6524} {"train_loss": -25.893030166625977, "global_step": 541499, "epoch": 6524} {"train_loss": -26.97821617126465, "global_step": 541500, "epoch": 6524} {"train_loss": -26.745471954345703, "global_step": 541501, "epoch": 6524} {"train_loss": -26.9249267578125, "global_step": 541502, "epoch": 6524} {"train_loss": -27.003162384033203, "global_step": 541503, "epoch": 6524} {"train_loss": -27.020288467407227, "global_step": 541504, "epoch": 6524} {"train_loss": -26.912139892578125, "global_step": 541505, "epoch": 6524} {"train_loss": -26.928638458251953, "global_step": 541506, "epoch": 6524} {"train_loss": -27.048709869384766, "global_step": 541507, "epoch": 6524} {"train_loss": -26.80879020690918, "global_step": 541508, "epoch": 6524} {"train_loss": -26.872817993164062, "global_step": 541509, "epoch": 6524} {"train_loss": -27.275842666625977, "global_step": 541510, "epoch": 6524} {"train_loss": -27.069875717163086, "global_step": 541511, "epoch": 6524} {"train_loss": -27.116369247436523, "global_step": 541512, "epoch": 6524} {"train_loss": -27.779815673828125, "global_step": 541513, "epoch": 6524} {"train_loss": -27.361377716064453, "global_step": 541514, "epoch": 6524} {"train_loss": -27.545618057250977, "global_step": 541515, "epoch": 6524} {"train_loss": -27.639875411987305, "global_step": 541516, "epoch": 6524} {"train_loss": -26.9094181060791, "global_step": 541517, "epoch": 6524} {"train_loss": -27.90921974182129, "global_step": 541518, "epoch": 6524} {"train_loss": -27.289579391479492, "global_step": 541519, "epoch": 6524} {"train_loss": -27.05085563659668, "global_step": 541520, "epoch": 6524} {"train_loss": -27.62784194946289, "global_step": 541521, "epoch": 6524} {"train_loss": -27.48431968688965, "global_step": 541522, "epoch": 6524} {"train_loss": -27.387372970581055, "global_step": 541523, "epoch": 6524} {"train_loss": -27.464523315429688, "global_step": 541524, "epoch": 6524} {"train_loss": -27.5545711517334, "global_step": 541525, "epoch": 6524} {"train_loss": -27.79681968688965, "global_step": 541526, "epoch": 6524} {"train_loss": -27.79705238342285, "global_step": 541527, "epoch": 6524} {"train_loss": -27.794214248657227, "global_step": 541528, "epoch": 6524} {"train_loss": -28.11628532409668, "global_step": 541529, "epoch": 6524} {"train_loss": -27.69623374938965, "global_step": 541530, "epoch": 6524} {"train_loss": -27.607629776000977, "global_step": 541531, "epoch": 6524} {"train_loss": -27.59629249572754, "global_step": 541532, "epoch": 6524} {"train_loss": -27.668752670288086, "global_step": 541533, "epoch": 6524} {"train_loss": -27.324665069580078, "global_step": 541534, "epoch": 6524} {"train_loss": -27.7977237701416, "global_step": 541535, "epoch": 6524} {"train_loss": -27.985441207885742, "global_step": 541536, "epoch": 6524} {"train_loss": -27.671972274780273, "global_step": 541537, "epoch": 6524} {"train_loss": -27.957548141479492, "global_step": 541538, "epoch": 6524} {"train_loss": -27.629968643188477, "global_step": 541539, "epoch": 6524} {"train_loss": -28.054235458374023, "global_step": 541540, "epoch": 6524} {"train_loss": -27.547128677368164, "global_step": 541541, "epoch": 6524} {"train_loss": -27.897321701049805, "global_step": 541542, "epoch": 6524} {"train_loss": -27.873554229736328, "global_step": 541543, "epoch": 6524} {"train_loss": -27.680374145507812, "global_step": 541544, "epoch": 6524} {"train_loss": -28.051172256469727, "global_step": 541545, "epoch": 6524} {"train_loss": -27.6477108001709, "global_step": 541546, "epoch": 6524} {"train_loss": -27.410009384155273, "global_step": 541547, "epoch": 6524} {"train_loss": -27.524255752563477, "global_step": 541548, "epoch": 6524} {"train_loss": -27.539691925048828, "global_step": 541549, "epoch": 6524} {"train_loss": -27.070600509643555, "global_step": 541550, "epoch": 6524} {"train_loss": -26.945871353149414, "global_step": 541551, "epoch": 6524} {"train_loss": -27.443693161010742, "global_step": 541552, "epoch": 6524} {"train_loss": -27.612241744995117, "global_step": 541553, "epoch": 6524} {"train_loss": -27.86285400390625, "global_step": 541554, "epoch": 6524} {"train_loss": -27.510894775390625, "global_step": 541555, "epoch": 6524} {"train_loss": -27.230178833007812, "global_step": 541556, "epoch": 6524} {"train_loss": -27.154205322265625, "global_step": 541557, "epoch": 6524} {"train_loss": -27.64613914489746, "global_step": 541558, "epoch": 6524} {"train_loss": -27.922931671142578, "global_step": 541559, "epoch": 6524} {"train_loss": -27.61042594909668, "global_step": 541560, "epoch": 6524} {"train_loss": -27.485342025756836, "global_step": 541561, "epoch": 6524} {"train_loss": -27.5386962890625, "global_step": 541562, "epoch": 6524} {"train_loss": -28.120960235595703, "global_step": 541563, "epoch": 6524} {"train_loss": -28.045087814331055, "global_step": 541564, "epoch": 6524} {"train_loss": -27.877248764038086, "global_step": 541565, "epoch": 6524} {"train_loss": -27.935546875, "global_step": 541566, "epoch": 6524} {"train_loss": -27.594602584838867, "global_step": 541567, "epoch": 6524} {"train_loss": -28.180892944335938, "global_step": 541568, "epoch": 6524} {"train_loss": -27.78643226623535, "global_step": 541569, "epoch": 6524} {"train_loss": -27.625669479370117, "global_step": 541570, "epoch": 6524} {"train_loss": -27.687726974487305, "global_step": 541571, "epoch": 6524} {"train_loss": -27.792160034179688, "global_step": 541572, "epoch": 6524} {"train_loss": -27.32612419128418, "global_step": 541573, "epoch": 6524} {"train_loss": -27.342929771147578, "global_step": 541574, "epoch": 6524, "val_loss": 6319543.5} {"train_loss": -27.04774284362793, "global_step": 541575, "epoch": 6525} {"train_loss": -25.330698013305664, "global_step": 541576, "epoch": 6525} {"train_loss": -26.287221908569336, "global_step": 541577, "epoch": 6525} {"train_loss": -26.903188705444336, "global_step": 541578, "epoch": 6525} {"train_loss": -26.517017364501953, "global_step": 541579, "epoch": 6525} {"train_loss": -26.16737174987793, "global_step": 541580, "epoch": 6525} {"train_loss": -26.60400390625, "global_step": 541581, "epoch": 6525} {"train_loss": -26.777624130249023, "global_step": 541582, "epoch": 6525} {"train_loss": -27.082860946655273, "global_step": 541583, "epoch": 6525} {"train_loss": -26.894193649291992, "global_step": 541584, "epoch": 6525} {"train_loss": -26.997411727905273, "global_step": 541585, "epoch": 6525} {"train_loss": -27.06662368774414, "global_step": 541586, "epoch": 6525} {"train_loss": -27.1026668548584, "global_step": 541587, "epoch": 6525} {"train_loss": -27.09429931640625, "global_step": 541588, "epoch": 6525} {"train_loss": -27.234506607055664, "global_step": 541589, "epoch": 6525} {"train_loss": -27.249740600585938, "global_step": 541590, "epoch": 6525} {"train_loss": -27.121158599853516, "global_step": 541591, "epoch": 6525} {"train_loss": -27.347400665283203, "global_step": 541592, "epoch": 6525} {"train_loss": -27.089765548706055, "global_step": 541593, "epoch": 6525} {"train_loss": -27.568557739257812, "global_step": 541594, "epoch": 6525} {"train_loss": -27.31056022644043, "global_step": 541595, "epoch": 6525} {"train_loss": -27.266199111938477, "global_step": 541596, "epoch": 6525} {"train_loss": -27.391942977905273, "global_step": 541597, "epoch": 6525} {"train_loss": -27.3122615814209, "global_step": 541598, "epoch": 6525} {"train_loss": -27.282485961914062, "global_step": 541599, "epoch": 6525} {"train_loss": -27.698740005493164, "global_step": 541600, "epoch": 6525} {"train_loss": -27.683013916015625, "global_step": 541601, "epoch": 6525} {"train_loss": -28.00140380859375, "global_step": 541602, "epoch": 6525} {"train_loss": -27.579153060913086, "global_step": 541603, "epoch": 6525} {"train_loss": -27.4606876373291, "global_step": 541604, "epoch": 6525} {"train_loss": -27.814544677734375, "global_step": 541605, "epoch": 6525} {"train_loss": -27.801984786987305, "global_step": 541606, "epoch": 6525} {"train_loss": -27.47271156311035, "global_step": 541607, "epoch": 6525} {"train_loss": -27.710575103759766, "global_step": 541608, "epoch": 6525} {"train_loss": -27.712188720703125, "global_step": 541609, "epoch": 6525} {"train_loss": -27.712249755859375, "global_step": 541610, "epoch": 6525} {"train_loss": -27.6417293548584, "global_step": 541611, "epoch": 6525} {"train_loss": -27.983068466186523, "global_step": 541612, "epoch": 6525} {"train_loss": -27.814783096313477, "global_step": 541613, "epoch": 6525} {"train_loss": -27.84075927734375, "global_step": 541614, "epoch": 6525} {"train_loss": -27.710119247436523, "global_step": 541615, "epoch": 6525} {"train_loss": -27.7612361907959, "global_step": 541616, "epoch": 6525} {"train_loss": -27.871408462524414, "global_step": 541617, "epoch": 6525} {"train_loss": -28.19269371032715, "global_step": 541618, "epoch": 6525} {"train_loss": -27.869909286499023, "global_step": 541619, "epoch": 6525} {"train_loss": -27.720794677734375, "global_step": 541620, "epoch": 6525} {"train_loss": -27.820486068725586, "global_step": 541621, "epoch": 6525} {"train_loss": -27.984601974487305, "global_step": 541622, "epoch": 6525} {"train_loss": -27.3753719329834, "global_step": 541623, "epoch": 6525} {"train_loss": -27.721424102783203, "global_step": 541624, "epoch": 6525} {"train_loss": -27.281660079956055, "global_step": 541625, "epoch": 6525} {"train_loss": -26.168127059936523, "global_step": 541626, "epoch": 6525} {"train_loss": -25.17254066467285, "global_step": 541627, "epoch": 6525} {"train_loss": -26.510969161987305, "global_step": 541628, "epoch": 6525} {"train_loss": -27.134366989135742, "global_step": 541629, "epoch": 6525} {"train_loss": -26.734756469726562, "global_step": 541630, "epoch": 6525} {"train_loss": -26.886005401611328, "global_step": 541631, "epoch": 6525} {"train_loss": -27.22014808654785, "global_step": 541632, "epoch": 6525} {"train_loss": -26.76679039001465, "global_step": 541633, "epoch": 6525} {"train_loss": -27.662799835205078, "global_step": 541634, "epoch": 6525} {"train_loss": -26.56243324279785, "global_step": 541635, "epoch": 6525} {"train_loss": -27.510955810546875, "global_step": 541636, "epoch": 6525} {"train_loss": -27.16057777404785, "global_step": 541637, "epoch": 6525} {"train_loss": -27.405248641967773, "global_step": 541638, "epoch": 6525} {"train_loss": -27.27398109436035, "global_step": 541639, "epoch": 6525} {"train_loss": -27.16644859313965, "global_step": 541640, "epoch": 6525} {"train_loss": -26.919910430908203, "global_step": 541641, "epoch": 6525} {"train_loss": -27.489505767822266, "global_step": 541642, "epoch": 6525} {"train_loss": -27.672012329101562, "global_step": 541643, "epoch": 6525} {"train_loss": -27.395282745361328, "global_step": 541644, "epoch": 6525} {"train_loss": -27.8944091796875, "global_step": 541645, "epoch": 6525} {"train_loss": -26.923095703125, "global_step": 541646, "epoch": 6525} {"train_loss": -27.411426544189453, "global_step": 541647, "epoch": 6525} {"train_loss": -27.288110733032227, "global_step": 541648, "epoch": 6525} {"train_loss": -27.776580810546875, "global_step": 541649, "epoch": 6525} {"train_loss": -27.755722045898438, "global_step": 541650, "epoch": 6525} {"train_loss": -27.608671188354492, "global_step": 541651, "epoch": 6525} {"train_loss": -27.323749542236328, "global_step": 541652, "epoch": 6525} {"train_loss": -27.967565536499023, "global_step": 541653, "epoch": 6525} {"train_loss": -27.763137817382812, "global_step": 541654, "epoch": 6525} {"train_loss": -28.03281593322754, "global_step": 541655, "epoch": 6525} {"train_loss": -28.007612228393555, "global_step": 541656, "epoch": 6525} {"train_loss": -27.331644012267333, "global_step": 541657, "epoch": 6525, "val_loss": 6397618.5} {"train_loss": -27.438337326049805, "global_step": 541658, "epoch": 6526} {"train_loss": -27.619070053100586, "global_step": 541659, "epoch": 6526} {"train_loss": -27.303577423095703, "global_step": 541660, "epoch": 6526} {"train_loss": -27.71665382385254, "global_step": 541661, "epoch": 6526} {"train_loss": -27.2811222076416, "global_step": 541662, "epoch": 6526} {"train_loss": -27.196950912475586, "global_step": 541663, "epoch": 6526} {"train_loss": -27.46598243713379, "global_step": 541664, "epoch": 6526} {"train_loss": -27.196598052978516, "global_step": 541665, "epoch": 6526} {"train_loss": -27.17323112487793, "global_step": 541666, "epoch": 6526} {"train_loss": -27.154916763305664, "global_step": 541667, "epoch": 6526} {"train_loss": -27.7285099029541, "global_step": 541668, "epoch": 6526} {"train_loss": -27.01161003112793, "global_step": 541669, "epoch": 6526} {"train_loss": -27.625934600830078, "global_step": 541670, "epoch": 6526} {"train_loss": -27.422765731811523, "global_step": 541671, "epoch": 6526} {"train_loss": -27.403162002563477, "global_step": 541672, "epoch": 6526} {"train_loss": -27.41461181640625, "global_step": 541673, "epoch": 6526} {"train_loss": -27.587186813354492, "global_step": 541674, "epoch": 6526} {"train_loss": -27.689558029174805, "global_step": 541675, "epoch": 6526} {"train_loss": -27.68597412109375, "global_step": 541676, "epoch": 6526} {"train_loss": -27.636749267578125, "global_step": 541677, "epoch": 6526} {"train_loss": -27.38816261291504, "global_step": 541678, "epoch": 6526} {"train_loss": -27.6785831451416, "global_step": 541679, "epoch": 6526} {"train_loss": -28.106000900268555, "global_step": 541680, "epoch": 6526} {"train_loss": -27.566370010375977, "global_step": 541681, "epoch": 6526} {"train_loss": -27.603229522705078, "global_step": 541682, "epoch": 6526} {"train_loss": -27.662033081054688, "global_step": 541683, "epoch": 6526} {"train_loss": -27.605804443359375, "global_step": 541684, "epoch": 6526} {"train_loss": -27.63527488708496, "global_step": 541685, "epoch": 6526} {"train_loss": -27.748952865600586, "global_step": 541686, "epoch": 6526} {"train_loss": -27.674331665039062, "global_step": 541687, "epoch": 6526} {"train_loss": -27.666898727416992, "global_step": 541688, "epoch": 6526} {"train_loss": -27.518762588500977, "global_step": 541689, "epoch": 6526} {"train_loss": -28.061254501342773, "global_step": 541690, "epoch": 6526} {"train_loss": -27.701383590698242, "global_step": 541691, "epoch": 6526} {"train_loss": -28.014556884765625, "global_step": 541692, "epoch": 6526} {"train_loss": -27.810956954956055, "global_step": 541693, "epoch": 6526} {"train_loss": -28.158445358276367, "global_step": 541694, "epoch": 6526} {"train_loss": -27.60980224609375, "global_step": 541695, "epoch": 6526} {"train_loss": -28.14263916015625, "global_step": 541696, "epoch": 6526} {"train_loss": -28.097309112548828, "global_step": 541697, "epoch": 6526} {"train_loss": -28.02869987487793, "global_step": 541698, "epoch": 6526} {"train_loss": -28.266382217407227, "global_step": 541699, "epoch": 6526} {"train_loss": -27.731313705444336, "global_step": 541700, "epoch": 6526} {"train_loss": -28.16375160217285, "global_step": 541701, "epoch": 6526} {"train_loss": -27.91242027282715, "global_step": 541702, "epoch": 6526} {"train_loss": -27.918115615844727, "global_step": 541703, "epoch": 6526} {"train_loss": -28.18390464782715, "global_step": 541704, "epoch": 6526} {"train_loss": -27.808996200561523, "global_step": 541705, "epoch": 6526} {"train_loss": -27.497617721557617, "global_step": 541706, "epoch": 6526} {"train_loss": -27.60797119140625, "global_step": 541707, "epoch": 6526} {"train_loss": -27.260610580444336, "global_step": 541708, "epoch": 6526} {"train_loss": -27.30706787109375, "global_step": 541709, "epoch": 6526} {"train_loss": -27.063745498657227, "global_step": 541710, "epoch": 6526} {"train_loss": -27.489398956298828, "global_step": 541711, "epoch": 6526} {"train_loss": -27.919965744018555, "global_step": 541712, "epoch": 6526} {"train_loss": -27.301755905151367, "global_step": 541713, "epoch": 6526} {"train_loss": -27.508161544799805, "global_step": 541714, "epoch": 6526} {"train_loss": -27.735401153564453, "global_step": 541715, "epoch": 6526} {"train_loss": -27.253467559814453, "global_step": 541716, "epoch": 6526} {"train_loss": -27.379261016845703, "global_step": 541717, "epoch": 6526} {"train_loss": -27.410888671875, "global_step": 541718, "epoch": 6526} {"train_loss": -27.470260620117188, "global_step": 541719, "epoch": 6526} {"train_loss": -27.437353134155273, "global_step": 541720, "epoch": 6526} {"train_loss": -27.486291885375977, "global_step": 541721, "epoch": 6526} {"train_loss": -27.553380966186523, "global_step": 541722, "epoch": 6526} {"train_loss": -27.537189483642578, "global_step": 541723, "epoch": 6526} {"train_loss": -27.09071922302246, "global_step": 541724, "epoch": 6526} {"train_loss": -27.5522403717041, "global_step": 541725, "epoch": 6526} {"train_loss": -27.657804489135742, "global_step": 541726, "epoch": 6526} {"train_loss": -27.6859073638916, "global_step": 541727, "epoch": 6526} {"train_loss": -27.522235870361328, "global_step": 541728, "epoch": 6526} {"train_loss": -27.446680068969727, "global_step": 541729, "epoch": 6526} {"train_loss": -27.442886352539062, "global_step": 541730, "epoch": 6526} {"train_loss": -27.837202072143555, "global_step": 541731, "epoch": 6526} {"train_loss": -27.332202911376953, "global_step": 541732, "epoch": 6526} {"train_loss": -27.2303466796875, "global_step": 541733, "epoch": 6526} {"train_loss": -27.607379913330078, "global_step": 541734, "epoch": 6526} {"train_loss": -27.6803035736084, "global_step": 541735, "epoch": 6526} {"train_loss": -27.3868408203125, "global_step": 541736, "epoch": 6526} {"train_loss": -27.86330223083496, "global_step": 541737, "epoch": 6526} {"train_loss": -27.494504928588867, "global_step": 541738, "epoch": 6526} {"train_loss": -27.64031982421875, "global_step": 541739, "epoch": 6526} {"train_loss": -27.598048566335656, "global_step": 541740, "epoch": 6526, "val_loss": 6360454.0} {"train_loss": -27.1175479888916, "global_step": 541741, "epoch": 6527} {"train_loss": -27.178754806518555, "global_step": 541742, "epoch": 6527} {"train_loss": -27.082843780517578, "global_step": 541743, "epoch": 6527} {"train_loss": -26.72675895690918, "global_step": 541744, "epoch": 6527} {"train_loss": -26.902740478515625, "global_step": 541745, "epoch": 6527} {"train_loss": -26.620319366455078, "global_step": 541746, "epoch": 6527} {"train_loss": -27.25430679321289, "global_step": 541747, "epoch": 6527} {"train_loss": -26.640857696533203, "global_step": 541748, "epoch": 6527} {"train_loss": -27.396528244018555, "global_step": 541749, "epoch": 6527} {"train_loss": -27.02229118347168, "global_step": 541750, "epoch": 6527} {"train_loss": -27.52543067932129, "global_step": 541751, "epoch": 6527} {"train_loss": -27.338409423828125, "global_step": 541752, "epoch": 6527} {"train_loss": -26.9928035736084, "global_step": 541753, "epoch": 6527} {"train_loss": -27.24753189086914, "global_step": 541754, "epoch": 6527} {"train_loss": -26.819494247436523, "global_step": 541755, "epoch": 6527} {"train_loss": -27.1353759765625, "global_step": 541756, "epoch": 6527} {"train_loss": -27.241724014282227, "global_step": 541757, "epoch": 6527} {"train_loss": -27.307357788085938, "global_step": 541758, "epoch": 6527} {"train_loss": -27.342981338500977, "global_step": 541759, "epoch": 6527} {"train_loss": -27.384580612182617, "global_step": 541760, "epoch": 6527} {"train_loss": -27.593957901000977, "global_step": 541761, "epoch": 6527} {"train_loss": -27.067174911499023, "global_step": 541762, "epoch": 6527} {"train_loss": -27.441986083984375, "global_step": 541763, "epoch": 6527} {"train_loss": -27.22116470336914, "global_step": 541764, "epoch": 6527} {"train_loss": -27.30454444885254, "global_step": 541765, "epoch": 6527} {"train_loss": -27.65601921081543, "global_step": 541766, "epoch": 6527} {"train_loss": -27.730819702148438, "global_step": 541767, "epoch": 6527} {"train_loss": -27.515634536743164, "global_step": 541768, "epoch": 6527} {"train_loss": -27.83133888244629, "global_step": 541769, "epoch": 6527} {"train_loss": -27.491933822631836, "global_step": 541770, "epoch": 6527} {"train_loss": -27.63397789001465, "global_step": 541771, "epoch": 6527} {"train_loss": -27.72177505493164, "global_step": 541772, "epoch": 6527} {"train_loss": -27.884267807006836, "global_step": 541773, "epoch": 6527} {"train_loss": -27.49167251586914, "global_step": 541774, "epoch": 6527} {"train_loss": -27.77655029296875, "global_step": 541775, "epoch": 6527} {"train_loss": -28.105777740478516, "global_step": 541776, "epoch": 6527} {"train_loss": -27.588342666625977, "global_step": 541777, "epoch": 6527} {"train_loss": -27.7197265625, "global_step": 541778, "epoch": 6527} {"train_loss": -28.014490127563477, "global_step": 541779, "epoch": 6527} {"train_loss": -27.3708438873291, "global_step": 541780, "epoch": 6527} {"train_loss": -27.944440841674805, "global_step": 541781, "epoch": 6527} {"train_loss": -28.14777183532715, "global_step": 541782, "epoch": 6527} {"train_loss": -27.962514877319336, "global_step": 541783, "epoch": 6527} {"train_loss": -27.67536735534668, "global_step": 541784, "epoch": 6527} {"train_loss": -27.67054557800293, "global_step": 541785, "epoch": 6527} {"train_loss": -27.52748680114746, "global_step": 541786, "epoch": 6527} {"train_loss": -27.27215003967285, "global_step": 541787, "epoch": 6527} {"train_loss": -27.26911735534668, "global_step": 541788, "epoch": 6527} {"train_loss": -27.198230743408203, "global_step": 541789, "epoch": 6527} {"train_loss": -27.63569450378418, "global_step": 541790, "epoch": 6527} {"train_loss": -27.772418975830078, "global_step": 541791, "epoch": 6527} {"train_loss": -27.595117568969727, "global_step": 541792, "epoch": 6527} {"train_loss": -27.621551513671875, "global_step": 541793, "epoch": 6527} {"train_loss": -27.38458251953125, "global_step": 541794, "epoch": 6527} {"train_loss": -27.722564697265625, "global_step": 541795, "epoch": 6527} {"train_loss": -27.596088409423828, "global_step": 541796, "epoch": 6527} {"train_loss": -27.47377586364746, "global_step": 541797, "epoch": 6527} {"train_loss": -28.075773239135742, "global_step": 541798, "epoch": 6527} {"train_loss": -28.1624698638916, "global_step": 541799, "epoch": 6527} {"train_loss": -27.8572998046875, "global_step": 541800, "epoch": 6527} {"train_loss": -27.677274703979492, "global_step": 541801, "epoch": 6527} {"train_loss": -27.625280380249023, "global_step": 541802, "epoch": 6527} {"train_loss": -27.631671905517578, "global_step": 541803, "epoch": 6527} {"train_loss": -27.4244384765625, "global_step": 541804, "epoch": 6527} {"train_loss": -27.543806076049805, "global_step": 541805, "epoch": 6527} {"train_loss": -27.799015045166016, "global_step": 541806, "epoch": 6527} {"train_loss": -27.193838119506836, "global_step": 541807, "epoch": 6527} {"train_loss": -27.71826171875, "global_step": 541808, "epoch": 6527} {"train_loss": -27.794849395751953, "global_step": 541809, "epoch": 6527} {"train_loss": -27.817899703979492, "global_step": 541810, "epoch": 6527} {"train_loss": -27.671072006225586, "global_step": 541811, "epoch": 6527} {"train_loss": -27.74578285217285, "global_step": 541812, "epoch": 6527} {"train_loss": -27.67437744140625, "global_step": 541813, "epoch": 6527} {"train_loss": -27.81068229675293, "global_step": 541814, "epoch": 6527} {"train_loss": -27.41841697692871, "global_step": 541815, "epoch": 6527} {"train_loss": -27.392492294311523, "global_step": 541816, "epoch": 6527} {"train_loss": -27.5855770111084, "global_step": 541817, "epoch": 6527} {"train_loss": -27.770933151245117, "global_step": 541818, "epoch": 6527} {"train_loss": -27.786169052124023, "global_step": 541819, "epoch": 6527} {"train_loss": -27.745405197143555, "global_step": 541820, "epoch": 6527} {"train_loss": -27.45096778869629, "global_step": 541821, "epoch": 6527} {"train_loss": -27.382465362548828, "global_step": 541822, "epoch": 6527} {"train_loss": -27.505953685346856, "global_step": 541823, "epoch": 6527, "val_loss": 6500297.0} {"train_loss": -25.8034725189209, "global_step": 541824, "epoch": 6528} {"train_loss": -24.609375, "global_step": 541825, "epoch": 6528} {"train_loss": -27.300312042236328, "global_step": 541826, "epoch": 6528} {"train_loss": -26.251596450805664, "global_step": 541827, "epoch": 6528} {"train_loss": -26.29688835144043, "global_step": 541828, "epoch": 6528} {"train_loss": -27.5433349609375, "global_step": 541829, "epoch": 6528} {"train_loss": -26.729307174682617, "global_step": 541830, "epoch": 6528} {"train_loss": -26.922718048095703, "global_step": 541831, "epoch": 6528} {"train_loss": -27.074573516845703, "global_step": 541832, "epoch": 6528} {"train_loss": -27.584028244018555, "global_step": 541833, "epoch": 6528} {"train_loss": -27.6445255279541, "global_step": 541834, "epoch": 6528} {"train_loss": -27.12725830078125, "global_step": 541835, "epoch": 6528} {"train_loss": -27.408050537109375, "global_step": 541836, "epoch": 6528} {"train_loss": -27.047412872314453, "global_step": 541837, "epoch": 6528} {"train_loss": -27.074560165405273, "global_step": 541838, "epoch": 6528} {"train_loss": -27.19672203063965, "global_step": 541839, "epoch": 6528} {"train_loss": -27.37226676940918, "global_step": 541840, "epoch": 6528} {"train_loss": -27.01490592956543, "global_step": 541841, "epoch": 6528} {"train_loss": -27.27054214477539, "global_step": 541842, "epoch": 6528} {"train_loss": -27.003589630126953, "global_step": 541843, "epoch": 6528} {"train_loss": -27.550827026367188, "global_step": 541844, "epoch": 6528} {"train_loss": -27.2716007232666, "global_step": 541845, "epoch": 6528} {"train_loss": -27.471288681030273, "global_step": 541846, "epoch": 6528} {"train_loss": -27.259796142578125, "global_step": 541847, "epoch": 6528} {"train_loss": -27.6081485748291, "global_step": 541848, "epoch": 6528} {"train_loss": -27.7320499420166, "global_step": 541849, "epoch": 6528} {"train_loss": -27.680444717407227, "global_step": 541850, "epoch": 6528} {"train_loss": -27.364688873291016, "global_step": 541851, "epoch": 6528} {"train_loss": -27.607879638671875, "global_step": 541852, "epoch": 6528} {"train_loss": -27.794235229492188, "global_step": 541853, "epoch": 6528} {"train_loss": -27.76556968688965, "global_step": 541854, "epoch": 6528} {"train_loss": -27.654754638671875, "global_step": 541855, "epoch": 6528} {"train_loss": -27.290363311767578, "global_step": 541856, "epoch": 6528} {"train_loss": -27.515775680541992, "global_step": 541857, "epoch": 6528} {"train_loss": -27.683792114257812, "global_step": 541858, "epoch": 6528} {"train_loss": -27.58045768737793, "global_step": 541859, "epoch": 6528} {"train_loss": -27.733997344970703, "global_step": 541860, "epoch": 6528} {"train_loss": -27.43816566467285, "global_step": 541861, "epoch": 6528} {"train_loss": -27.752063751220703, "global_step": 541862, "epoch": 6528} {"train_loss": -27.442358016967773, "global_step": 541863, "epoch": 6528} {"train_loss": -27.779245376586914, "global_step": 541864, "epoch": 6528} {"train_loss": -27.55265235900879, "global_step": 541865, "epoch": 6528} {"train_loss": -27.162240982055664, "global_step": 541866, "epoch": 6528} {"train_loss": -27.512189865112305, "global_step": 541867, "epoch": 6528} {"train_loss": -27.6671199798584, "global_step": 541868, "epoch": 6528} {"train_loss": -27.422483444213867, "global_step": 541869, "epoch": 6528} {"train_loss": -27.681081771850586, "global_step": 541870, "epoch": 6528} {"train_loss": -27.652576446533203, "global_step": 541871, "epoch": 6528} {"train_loss": -27.52972984313965, "global_step": 541872, "epoch": 6528} {"train_loss": -27.630929946899414, "global_step": 541873, "epoch": 6528} {"train_loss": -27.28387451171875, "global_step": 541874, "epoch": 6528} {"train_loss": -27.39607048034668, "global_step": 541875, "epoch": 6528} {"train_loss": -27.380056381225586, "global_step": 541876, "epoch": 6528} {"train_loss": -27.17671775817871, "global_step": 541877, "epoch": 6528} {"train_loss": -27.200790405273438, "global_step": 541878, "epoch": 6528} {"train_loss": -26.5269775390625, "global_step": 541879, "epoch": 6528} {"train_loss": -26.8472957611084, "global_step": 541880, "epoch": 6528} {"train_loss": -27.6893310546875, "global_step": 541881, "epoch": 6528} {"train_loss": -26.834674835205078, "global_step": 541882, "epoch": 6528} {"train_loss": -27.052289962768555, "global_step": 541883, "epoch": 6528} {"train_loss": -27.161619186401367, "global_step": 541884, "epoch": 6528} {"train_loss": -27.181928634643555, "global_step": 541885, "epoch": 6528} {"train_loss": -27.33503532409668, "global_step": 541886, "epoch": 6528} {"train_loss": -27.10433006286621, "global_step": 541887, "epoch": 6528} {"train_loss": -27.799036026000977, "global_step": 541888, "epoch": 6528} {"train_loss": -27.056806564331055, "global_step": 541889, "epoch": 6528} {"train_loss": -27.677453994750977, "global_step": 541890, "epoch": 6528} {"train_loss": -27.217309951782227, "global_step": 541891, "epoch": 6528} {"train_loss": -27.654050827026367, "global_step": 541892, "epoch": 6528} {"train_loss": -26.783710479736328, "global_step": 541893, "epoch": 6528} {"train_loss": -27.33585548400879, "global_step": 541894, "epoch": 6528} {"train_loss": -27.14072036743164, "global_step": 541895, "epoch": 6528} {"train_loss": -27.397979736328125, "global_step": 541896, "epoch": 6528} {"train_loss": -27.093250274658203, "global_step": 541897, "epoch": 6528} {"train_loss": -27.414037704467773, "global_step": 541898, "epoch": 6528} {"train_loss": -27.29566764831543, "global_step": 541899, "epoch": 6528} {"train_loss": -27.56960105895996, "global_step": 541900, "epoch": 6528} {"train_loss": -27.730070114135742, "global_step": 541901, "epoch": 6528} {"train_loss": -27.72652244567871, "global_step": 541902, "epoch": 6528} {"train_loss": -27.34547233581543, "global_step": 541903, "epoch": 6528} {"train_loss": -27.832782745361328, "global_step": 541904, "epoch": 6528} {"train_loss": -27.76398277282715, "global_step": 541905, "epoch": 6528} {"train_loss": -27.316471099853516, "global_step": 541906, "epoch": 6528, "val_loss": 6480184.0} {"train_loss": -27.24875259399414, "global_step": 541907, "epoch": 6529} {"train_loss": -26.805212020874023, "global_step": 541908, "epoch": 6529} {"train_loss": -27.360815048217773, "global_step": 541909, "epoch": 6529} {"train_loss": -26.70099449157715, "global_step": 541910, "epoch": 6529} {"train_loss": -27.458362579345703, "global_step": 541911, "epoch": 6529} {"train_loss": -27.328107833862305, "global_step": 541912, "epoch": 6529} {"train_loss": -27.160070419311523, "global_step": 541913, "epoch": 6529} {"train_loss": -27.263952255249023, "global_step": 541914, "epoch": 6529} {"train_loss": -27.09549331665039, "global_step": 541915, "epoch": 6529} {"train_loss": -27.211767196655273, "global_step": 541916, "epoch": 6529} {"train_loss": -27.335840225219727, "global_step": 541917, "epoch": 6529} {"train_loss": -27.643524169921875, "global_step": 541918, "epoch": 6529} {"train_loss": -27.289392471313477, "global_step": 541919, "epoch": 6529} {"train_loss": -27.331501007080078, "global_step": 541920, "epoch": 6529} {"train_loss": -27.720136642456055, "global_step": 541921, "epoch": 6529} {"train_loss": -27.700016021728516, "global_step": 541922, "epoch": 6529} {"train_loss": -27.599424362182617, "global_step": 541923, "epoch": 6529} {"train_loss": -27.8072452545166, "global_step": 541924, "epoch": 6529} {"train_loss": -27.073514938354492, "global_step": 541925, "epoch": 6529} {"train_loss": -27.87615394592285, "global_step": 541926, "epoch": 6529} {"train_loss": -27.5519962310791, "global_step": 541927, "epoch": 6529} {"train_loss": -27.762622833251953, "global_step": 541928, "epoch": 6529} {"train_loss": -28.03513526916504, "global_step": 541929, "epoch": 6529} {"train_loss": -27.738910675048828, "global_step": 541930, "epoch": 6529} {"train_loss": -27.77937126159668, "global_step": 541931, "epoch": 6529} {"train_loss": -27.73902702331543, "global_step": 541932, "epoch": 6529} {"train_loss": -27.601032257080078, "global_step": 541933, "epoch": 6529} {"train_loss": -28.0223388671875, "global_step": 541934, "epoch": 6529} {"train_loss": -27.888227462768555, "global_step": 541935, "epoch": 6529} {"train_loss": -27.988988876342773, "global_step": 541936, "epoch": 6529} {"train_loss": -28.01472282409668, "global_step": 541937, "epoch": 6529} {"train_loss": -27.748462677001953, "global_step": 541938, "epoch": 6529} {"train_loss": -27.922693252563477, "global_step": 541939, "epoch": 6529} {"train_loss": -27.637048721313477, "global_step": 541940, "epoch": 6529} {"train_loss": -27.72648048400879, "global_step": 541941, "epoch": 6529} {"train_loss": -28.001590728759766, "global_step": 541942, "epoch": 6529} {"train_loss": -27.841205596923828, "global_step": 541943, "epoch": 6529} {"train_loss": -27.803823471069336, "global_step": 541944, "epoch": 6529} {"train_loss": -27.655506134033203, "global_step": 541945, "epoch": 6529} {"train_loss": -27.915674209594727, "global_step": 541946, "epoch": 6529} {"train_loss": -27.522104263305664, "global_step": 541947, "epoch": 6529} {"train_loss": -27.6656551361084, "global_step": 541948, "epoch": 6529} {"train_loss": -27.917516708374023, "global_step": 541949, "epoch": 6529} {"train_loss": -27.564706802368164, "global_step": 541950, "epoch": 6529} {"train_loss": -27.875940322875977, "global_step": 541951, "epoch": 6529} {"train_loss": -27.73761558532715, "global_step": 541952, "epoch": 6529} {"train_loss": -28.1216983795166, "global_step": 541953, "epoch": 6529} {"train_loss": -28.10577964782715, "global_step": 541954, "epoch": 6529} {"train_loss": -27.59720802307129, "global_step": 541955, "epoch": 6529} {"train_loss": -27.235082626342773, "global_step": 541956, "epoch": 6529} {"train_loss": -27.8782958984375, "global_step": 541957, "epoch": 6529} {"train_loss": -27.83087158203125, "global_step": 541958, "epoch": 6529} {"train_loss": -27.54606056213379, "global_step": 541959, "epoch": 6529} {"train_loss": -27.76877212524414, "global_step": 541960, "epoch": 6529} {"train_loss": -27.727130889892578, "global_step": 541961, "epoch": 6529} {"train_loss": -27.872730255126953, "global_step": 541962, "epoch": 6529} {"train_loss": -27.702518463134766, "global_step": 541963, "epoch": 6529} {"train_loss": -27.908985137939453, "global_step": 541964, "epoch": 6529} {"train_loss": -27.81440544128418, "global_step": 541965, "epoch": 6529} {"train_loss": -28.2590274810791, "global_step": 541966, "epoch": 6529} {"train_loss": -27.57282066345215, "global_step": 541967, "epoch": 6529} {"train_loss": -27.442245483398438, "global_step": 541968, "epoch": 6529} {"train_loss": -27.95220947265625, "global_step": 541969, "epoch": 6529} {"train_loss": -27.69282341003418, "global_step": 541970, "epoch": 6529} {"train_loss": -27.616254806518555, "global_step": 541971, "epoch": 6529} {"train_loss": -27.63041114807129, "global_step": 541972, "epoch": 6529} {"train_loss": -27.687397003173828, "global_step": 541973, "epoch": 6529} {"train_loss": -27.769012451171875, "global_step": 541974, "epoch": 6529} {"train_loss": -27.9882869720459, "global_step": 541975, "epoch": 6529} {"train_loss": -27.697040557861328, "global_step": 541976, "epoch": 6529} {"train_loss": -28.05527687072754, "global_step": 541977, "epoch": 6529} {"train_loss": -28.037200927734375, "global_step": 541978, "epoch": 6529} {"train_loss": -27.477746963500977, "global_step": 541979, "epoch": 6529} {"train_loss": -27.479272842407227, "global_step": 541980, "epoch": 6529} {"train_loss": -27.816009521484375, "global_step": 541981, "epoch": 6529} {"train_loss": -27.591150283813477, "global_step": 541982, "epoch": 6529} {"train_loss": -27.55702018737793, "global_step": 541983, "epoch": 6529} {"train_loss": -27.394506454467773, "global_step": 541984, "epoch": 6529} {"train_loss": -27.563934326171875, "global_step": 541985, "epoch": 6529} {"train_loss": -28.135114669799805, "global_step": 541986, "epoch": 6529} {"train_loss": -27.632116317749023, "global_step": 541987, "epoch": 6529} {"train_loss": -27.79656982421875, "global_step": 541988, "epoch": 6529} {"train_loss": -27.671571111104573, "global_step": 541989, "epoch": 6529, "val_loss": 6497915.0} {"train_loss": -26.619800567626953, "global_step": 541990, "epoch": 6530} {"train_loss": -27.130048751831055, "global_step": 541991, "epoch": 6530} {"train_loss": -27.135334014892578, "global_step": 541992, "epoch": 6530} {"train_loss": -26.799535751342773, "global_step": 541993, "epoch": 6530} {"train_loss": -27.240453720092773, "global_step": 541994, "epoch": 6530} {"train_loss": -26.630796432495117, "global_step": 541995, "epoch": 6530} {"train_loss": -26.9005184173584, "global_step": 541996, "epoch": 6530} {"train_loss": -26.83049964904785, "global_step": 541997, "epoch": 6530} {"train_loss": -27.133075714111328, "global_step": 541998, "epoch": 6530} {"train_loss": -27.044824600219727, "global_step": 541999, "epoch": 6530} {"train_loss": -26.963727951049805, "global_step": 542000, "epoch": 6530} {"train_loss": -27.098785400390625, "global_step": 542001, "epoch": 6530} {"train_loss": -26.751821517944336, "global_step": 542002, "epoch": 6530} {"train_loss": -27.066442489624023, "global_step": 542003, "epoch": 6530} {"train_loss": -26.500043869018555, "global_step": 542004, "epoch": 6530} {"train_loss": -27.123701095581055, "global_step": 542005, "epoch": 6530} {"train_loss": -26.641382217407227, "global_step": 542006, "epoch": 6530} {"train_loss": -27.256122589111328, "global_step": 542007, "epoch": 6530} {"train_loss": -27.25428581237793, "global_step": 542008, "epoch": 6530} {"train_loss": -26.790424346923828, "global_step": 542009, "epoch": 6530} {"train_loss": -27.35321617126465, "global_step": 542010, "epoch": 6530} {"train_loss": -27.1142578125, "global_step": 542011, "epoch": 6530} {"train_loss": -27.317590713500977, "global_step": 542012, "epoch": 6530} {"train_loss": -27.4790096282959, "global_step": 542013, "epoch": 6530} {"train_loss": -26.857473373413086, "global_step": 542014, "epoch": 6530} {"train_loss": -27.023361206054688, "global_step": 542015, "epoch": 6530} {"train_loss": -27.593219757080078, "global_step": 542016, "epoch": 6530} {"train_loss": -27.500822067260742, "global_step": 542017, "epoch": 6530} {"train_loss": -27.117401123046875, "global_step": 542018, "epoch": 6530} {"train_loss": -27.220794677734375, "global_step": 542019, "epoch": 6530} {"train_loss": -27.380191802978516, "global_step": 542020, "epoch": 6530} {"train_loss": -27.666412353515625, "global_step": 542021, "epoch": 6530} {"train_loss": -27.8023681640625, "global_step": 542022, "epoch": 6530} {"train_loss": -27.49530029296875, "global_step": 542023, "epoch": 6530} {"train_loss": -27.886066436767578, "global_step": 542024, "epoch": 6530} {"train_loss": -27.300073623657227, "global_step": 542025, "epoch": 6530} {"train_loss": -27.489370346069336, "global_step": 542026, "epoch": 6530} {"train_loss": -26.97529411315918, "global_step": 542027, "epoch": 6530} {"train_loss": -27.0819091796875, "global_step": 542028, "epoch": 6530} {"train_loss": -27.654836654663086, "global_step": 542029, "epoch": 6530} {"train_loss": -27.446680068969727, "global_step": 542030, "epoch": 6530} {"train_loss": -27.367223739624023, "global_step": 542031, "epoch": 6530} {"train_loss": -27.646820068359375, "global_step": 542032, "epoch": 6530} {"train_loss": -27.37635612487793, "global_step": 542033, "epoch": 6530} {"train_loss": -27.75514030456543, "global_step": 542034, "epoch": 6530} {"train_loss": -27.6814022064209, "global_step": 542035, "epoch": 6530} {"train_loss": -27.411596298217773, "global_step": 542036, "epoch": 6530} {"train_loss": -27.3717098236084, "global_step": 542037, "epoch": 6530} {"train_loss": -27.537872314453125, "global_step": 542038, "epoch": 6530} {"train_loss": -27.533527374267578, "global_step": 542039, "epoch": 6530} {"train_loss": -27.163623809814453, "global_step": 542040, "epoch": 6530} {"train_loss": -27.681396484375, "global_step": 542041, "epoch": 6530} {"train_loss": -27.4615421295166, "global_step": 542042, "epoch": 6530} {"train_loss": -28.043994903564453, "global_step": 542043, "epoch": 6530} {"train_loss": -28.007919311523438, "global_step": 542044, "epoch": 6530} {"train_loss": -27.23115348815918, "global_step": 542045, "epoch": 6530} {"train_loss": -27.61431312561035, "global_step": 542046, "epoch": 6530} {"train_loss": -27.95839500427246, "global_step": 542047, "epoch": 6530} {"train_loss": -27.760786056518555, "global_step": 542048, "epoch": 6530} {"train_loss": -27.75629234313965, "global_step": 542049, "epoch": 6530} {"train_loss": -27.476221084594727, "global_step": 542050, "epoch": 6530} {"train_loss": -27.454498291015625, "global_step": 542051, "epoch": 6530} {"train_loss": -27.66180419921875, "global_step": 542052, "epoch": 6530} {"train_loss": -27.67059898376465, "global_step": 542053, "epoch": 6530} {"train_loss": -27.585834503173828, "global_step": 542054, "epoch": 6530} {"train_loss": -27.757230758666992, "global_step": 542055, "epoch": 6530} {"train_loss": -27.706491470336914, "global_step": 542056, "epoch": 6530} {"train_loss": -27.73549461364746, "global_step": 542057, "epoch": 6530} {"train_loss": -27.613052368164062, "global_step": 542058, "epoch": 6530} {"train_loss": -27.966339111328125, "global_step": 542059, "epoch": 6530} {"train_loss": -27.728811264038086, "global_step": 542060, "epoch": 6530} {"train_loss": -27.299407958984375, "global_step": 542061, "epoch": 6530} {"train_loss": -27.68707847595215, "global_step": 542062, "epoch": 6530} {"train_loss": -27.832040786743164, "global_step": 542063, "epoch": 6530} {"train_loss": -27.738157272338867, "global_step": 542064, "epoch": 6530} {"train_loss": -27.772485733032227, "global_step": 542065, "epoch": 6530} {"train_loss": -27.81558609008789, "global_step": 542066, "epoch": 6530} {"train_loss": -28.327178955078125, "global_step": 542067, "epoch": 6530} {"train_loss": -27.67885398864746, "global_step": 542068, "epoch": 6530} {"train_loss": -27.94818115234375, "global_step": 542069, "epoch": 6530} {"train_loss": -27.950448989868164, "global_step": 542070, "epoch": 6530} {"train_loss": -27.95557975769043, "global_step": 542071, "epoch": 6530} {"train_loss": -27.423475242522827, "global_step": 542072, "epoch": 6530, "val_loss": 6438972.0} {"train_loss": -27.507511138916016, "global_step": 542073, "epoch": 6531} {"train_loss": -27.132862091064453, "global_step": 542074, "epoch": 6531} {"train_loss": -27.025354385375977, "global_step": 542075, "epoch": 6531} {"train_loss": -27.358320236206055, "global_step": 542076, "epoch": 6531} {"train_loss": -27.992212295532227, "global_step": 542077, "epoch": 6531} {"train_loss": -27.265546798706055, "global_step": 542078, "epoch": 6531} {"train_loss": -26.74468994140625, "global_step": 542079, "epoch": 6531} {"train_loss": -26.88462257385254, "global_step": 542080, "epoch": 6531} {"train_loss": -27.429641723632812, "global_step": 542081, "epoch": 6531} {"train_loss": -26.899938583374023, "global_step": 542082, "epoch": 6531} {"train_loss": -27.018896102905273, "global_step": 542083, "epoch": 6531} {"train_loss": -27.467914581298828, "global_step": 542084, "epoch": 6531} {"train_loss": -27.06694984436035, "global_step": 542085, "epoch": 6531} {"train_loss": -27.429248809814453, "global_step": 542086, "epoch": 6531} {"train_loss": -27.39105796813965, "global_step": 542087, "epoch": 6531} {"train_loss": -27.42976951599121, "global_step": 542088, "epoch": 6531} {"train_loss": -27.496246337890625, "global_step": 542089, "epoch": 6531} {"train_loss": -27.54798698425293, "global_step": 542090, "epoch": 6531} {"train_loss": -27.723291397094727, "global_step": 542091, "epoch": 6531} {"train_loss": -27.7886905670166, "global_step": 542092, "epoch": 6531} {"train_loss": -27.657052993774414, "global_step": 542093, "epoch": 6531} {"train_loss": -27.788135528564453, "global_step": 542094, "epoch": 6531} {"train_loss": -27.859375, "global_step": 542095, "epoch": 6531} {"train_loss": -27.790876388549805, "global_step": 542096, "epoch": 6531} {"train_loss": -27.6957950592041, "global_step": 542097, "epoch": 6531} {"train_loss": -27.45364761352539, "global_step": 542098, "epoch": 6531} {"train_loss": -27.693506240844727, "global_step": 542099, "epoch": 6531} {"train_loss": -27.480504989624023, "global_step": 542100, "epoch": 6531} {"train_loss": -27.472681045532227, "global_step": 542101, "epoch": 6531} {"train_loss": -27.823373794555664, "global_step": 542102, "epoch": 6531} {"train_loss": -27.679595947265625, "global_step": 542103, "epoch": 6531} {"train_loss": -27.815505981445312, "global_step": 542104, "epoch": 6531} {"train_loss": -27.382062911987305, "global_step": 542105, "epoch": 6531} {"train_loss": -27.765695571899414, "global_step": 542106, "epoch": 6531} {"train_loss": -27.68855094909668, "global_step": 542107, "epoch": 6531} {"train_loss": -27.739776611328125, "global_step": 542108, "epoch": 6531} {"train_loss": -27.573596954345703, "global_step": 542109, "epoch": 6531} {"train_loss": -27.701772689819336, "global_step": 542110, "epoch": 6531} {"train_loss": -27.775135040283203, "global_step": 542111, "epoch": 6531} {"train_loss": -27.445316314697266, "global_step": 542112, "epoch": 6531} {"train_loss": -27.373687744140625, "global_step": 542113, "epoch": 6531} {"train_loss": -27.45623779296875, "global_step": 542114, "epoch": 6531} {"train_loss": -27.7525577545166, "global_step": 542115, "epoch": 6531} {"train_loss": -27.413068771362305, "global_step": 542116, "epoch": 6531} {"train_loss": -27.544042587280273, "global_step": 542117, "epoch": 6531} {"train_loss": -27.582233428955078, "global_step": 542118, "epoch": 6531} {"train_loss": -28.069272994995117, "global_step": 542119, "epoch": 6531} {"train_loss": -27.65066909790039, "global_step": 542120, "epoch": 6531} {"train_loss": -27.85492515563965, "global_step": 542121, "epoch": 6531} {"train_loss": -27.733844757080078, "global_step": 542122, "epoch": 6531} {"train_loss": -27.85040855407715, "global_step": 542123, "epoch": 6531} {"train_loss": -27.80719566345215, "global_step": 542124, "epoch": 6531} {"train_loss": -27.856290817260742, "global_step": 542125, "epoch": 6531} {"train_loss": -27.528661727905273, "global_step": 542126, "epoch": 6531} {"train_loss": -27.766529083251953, "global_step": 542127, "epoch": 6531} {"train_loss": -27.71388816833496, "global_step": 542128, "epoch": 6531} {"train_loss": -27.980178833007812, "global_step": 542129, "epoch": 6531} {"train_loss": -27.78777503967285, "global_step": 542130, "epoch": 6531} {"train_loss": -27.951248168945312, "global_step": 542131, "epoch": 6531} {"train_loss": -28.369638442993164, "global_step": 542132, "epoch": 6531} {"train_loss": -27.675079345703125, "global_step": 542133, "epoch": 6531} {"train_loss": -27.66790199279785, "global_step": 542134, "epoch": 6531} {"train_loss": -27.670007705688477, "global_step": 542135, "epoch": 6531} {"train_loss": -27.661054611206055, "global_step": 542136, "epoch": 6531} {"train_loss": -27.695032119750977, "global_step": 542137, "epoch": 6531} {"train_loss": -27.820032119750977, "global_step": 542138, "epoch": 6531} {"train_loss": -27.550695419311523, "global_step": 542139, "epoch": 6531} {"train_loss": -27.804126739501953, "global_step": 542140, "epoch": 6531} {"train_loss": -27.4591007232666, "global_step": 542141, "epoch": 6531} {"train_loss": -27.58447265625, "global_step": 542142, "epoch": 6531} {"train_loss": -27.427228927612305, "global_step": 542143, "epoch": 6531} {"train_loss": -26.94757080078125, "global_step": 542144, "epoch": 6531} {"train_loss": -26.300928115844727, "global_step": 542145, "epoch": 6531} {"train_loss": -27.41391944885254, "global_step": 542146, "epoch": 6531} {"train_loss": -27.8973445892334, "global_step": 542147, "epoch": 6531} {"train_loss": -27.155139923095703, "global_step": 542148, "epoch": 6531} {"train_loss": -27.33721351623535, "global_step": 542149, "epoch": 6531} {"train_loss": -27.679677963256836, "global_step": 542150, "epoch": 6531} {"train_loss": -27.697080612182617, "global_step": 542151, "epoch": 6531} {"train_loss": -27.28144645690918, "global_step": 542152, "epoch": 6531} {"train_loss": -27.442615509033203, "global_step": 542153, "epoch": 6531} {"train_loss": -27.62639808654785, "global_step": 542154, "epoch": 6531} {"train_loss": -27.5662389088826, "global_step": 542155, "epoch": 6531, "val_loss": 6442879.5} {"train_loss": -26.590545654296875, "global_step": 542156, "epoch": 6532} {"train_loss": -27.4978084564209, "global_step": 542157, "epoch": 6532} {"train_loss": -26.466541290283203, "global_step": 542158, "epoch": 6532} {"train_loss": -27.05317497253418, "global_step": 542159, "epoch": 6532} {"train_loss": -26.378314971923828, "global_step": 542160, "epoch": 6532} {"train_loss": -27.070941925048828, "global_step": 542161, "epoch": 6532} {"train_loss": -26.76814079284668, "global_step": 542162, "epoch": 6532} {"train_loss": -27.40230369567871, "global_step": 542163, "epoch": 6532} {"train_loss": -26.61579704284668, "global_step": 542164, "epoch": 6532} {"train_loss": -26.9986572265625, "global_step": 542165, "epoch": 6532} {"train_loss": -27.202880859375, "global_step": 542166, "epoch": 6532} {"train_loss": -26.980438232421875, "global_step": 542167, "epoch": 6532} {"train_loss": -27.13654899597168, "global_step": 542168, "epoch": 6532} {"train_loss": -26.951919555664062, "global_step": 542169, "epoch": 6532} {"train_loss": -26.790058135986328, "global_step": 542170, "epoch": 6532} {"train_loss": -27.32435417175293, "global_step": 542171, "epoch": 6532} {"train_loss": -26.76605796813965, "global_step": 542172, "epoch": 6532} {"train_loss": -26.85365867614746, "global_step": 542173, "epoch": 6532} {"train_loss": -27.005126953125, "global_step": 542174, "epoch": 6532} {"train_loss": -27.169240951538086, "global_step": 542175, "epoch": 6532} {"train_loss": -27.232135772705078, "global_step": 542176, "epoch": 6532} {"train_loss": -27.40813636779785, "global_step": 542177, "epoch": 6532} {"train_loss": -26.911645889282227, "global_step": 542178, "epoch": 6532} {"train_loss": -27.732091903686523, "global_step": 542179, "epoch": 6532} {"train_loss": -27.28864860534668, "global_step": 542180, "epoch": 6532} {"train_loss": -27.41069984436035, "global_step": 542181, "epoch": 6532} {"train_loss": -27.420978546142578, "global_step": 542182, "epoch": 6532} {"train_loss": -27.467395782470703, "global_step": 542183, "epoch": 6532} {"train_loss": -27.468046188354492, "global_step": 542184, "epoch": 6532} {"train_loss": -27.587955474853516, "global_step": 542185, "epoch": 6532} {"train_loss": -27.363828659057617, "global_step": 542186, "epoch": 6532} {"train_loss": -27.653274536132812, "global_step": 542187, "epoch": 6532} {"train_loss": -27.8865909576416, "global_step": 542188, "epoch": 6532} {"train_loss": -27.97367286682129, "global_step": 542189, "epoch": 6532} {"train_loss": -27.528106689453125, "global_step": 542190, "epoch": 6532} {"train_loss": -27.817794799804688, "global_step": 542191, "epoch": 6532} {"train_loss": -27.863794326782227, "global_step": 542192, "epoch": 6532} {"train_loss": -27.770523071289062, "global_step": 542193, "epoch": 6532} {"train_loss": -27.444726943969727, "global_step": 542194, "epoch": 6532} {"train_loss": -28.108549118041992, "global_step": 542195, "epoch": 6532} {"train_loss": -27.830137252807617, "global_step": 542196, "epoch": 6532} {"train_loss": -28.138654708862305, "global_step": 542197, "epoch": 6532} {"train_loss": -27.51288414001465, "global_step": 542198, "epoch": 6532} {"train_loss": -28.059814453125, "global_step": 542199, "epoch": 6532} {"train_loss": -27.558536529541016, "global_step": 542200, "epoch": 6532} {"train_loss": -27.713708877563477, "global_step": 542201, "epoch": 6532} {"train_loss": -27.733240127563477, "global_step": 542202, "epoch": 6532} {"train_loss": -27.771886825561523, "global_step": 542203, "epoch": 6532} {"train_loss": -28.03436279296875, "global_step": 542204, "epoch": 6532} {"train_loss": -27.864709854125977, "global_step": 542205, "epoch": 6532} {"train_loss": -27.85479736328125, "global_step": 542206, "epoch": 6532} {"train_loss": -27.84500503540039, "global_step": 542207, "epoch": 6532} {"train_loss": -27.4622802734375, "global_step": 542208, "epoch": 6532} {"train_loss": -28.05878257751465, "global_step": 542209, "epoch": 6532} {"train_loss": -27.637317657470703, "global_step": 542210, "epoch": 6532} {"train_loss": -27.747556686401367, "global_step": 542211, "epoch": 6532} {"train_loss": -28.038671493530273, "global_step": 542212, "epoch": 6532} {"train_loss": -27.628437042236328, "global_step": 542213, "epoch": 6532} {"train_loss": -27.720876693725586, "global_step": 542214, "epoch": 6532} {"train_loss": -27.24358558654785, "global_step": 542215, "epoch": 6532} {"train_loss": -27.542890548706055, "global_step": 542216, "epoch": 6532} {"train_loss": -27.925357818603516, "global_step": 542217, "epoch": 6532} {"train_loss": -27.83503532409668, "global_step": 542218, "epoch": 6532} {"train_loss": -27.708723068237305, "global_step": 542219, "epoch": 6532} {"train_loss": -27.575885772705078, "global_step": 542220, "epoch": 6532} {"train_loss": -28.023157119750977, "global_step": 542221, "epoch": 6532} {"train_loss": -27.78765296936035, "global_step": 542222, "epoch": 6532} {"train_loss": -27.847827911376953, "global_step": 542223, "epoch": 6532} {"train_loss": -27.476255416870117, "global_step": 542224, "epoch": 6532} {"train_loss": -27.176374435424805, "global_step": 542225, "epoch": 6532} {"train_loss": -27.078582763671875, "global_step": 542226, "epoch": 6532} {"train_loss": -27.155210494995117, "global_step": 542227, "epoch": 6532} {"train_loss": -27.58989906311035, "global_step": 542228, "epoch": 6532} {"train_loss": -27.530710220336914, "global_step": 542229, "epoch": 6532} {"train_loss": -27.2800235748291, "global_step": 542230, "epoch": 6532} {"train_loss": -27.635251998901367, "global_step": 542231, "epoch": 6532} {"train_loss": -27.711118698120117, "global_step": 542232, "epoch": 6532} {"train_loss": -27.167118072509766, "global_step": 542233, "epoch": 6532} {"train_loss": -27.644775390625, "global_step": 542234, "epoch": 6532} {"train_loss": -28.098346710205078, "global_step": 542235, "epoch": 6532} {"train_loss": -27.54197120666504, "global_step": 542236, "epoch": 6532} {"train_loss": -27.575321197509766, "global_step": 542237, "epoch": 6532} {"train_loss": -27.475794458963787, "global_step": 542238, "epoch": 6532, "val_loss": 6425521.0} {"train_loss": -27.1514892578125, "global_step": 542239, "epoch": 6533} {"train_loss": -27.249948501586914, "global_step": 542240, "epoch": 6533} {"train_loss": -27.383630752563477, "global_step": 542241, "epoch": 6533} {"train_loss": -27.42976188659668, "global_step": 542242, "epoch": 6533} {"train_loss": -27.265762329101562, "global_step": 542243, "epoch": 6533} {"train_loss": -27.57069206237793, "global_step": 542244, "epoch": 6533} {"train_loss": -27.48090171813965, "global_step": 542245, "epoch": 6533} {"train_loss": -27.40925407409668, "global_step": 542246, "epoch": 6533} {"train_loss": -27.49261474609375, "global_step": 542247, "epoch": 6533} {"train_loss": -27.801044464111328, "global_step": 542248, "epoch": 6533} {"train_loss": -27.423948287963867, "global_step": 542249, "epoch": 6533} {"train_loss": -27.27778434753418, "global_step": 542250, "epoch": 6533} {"train_loss": -27.26323890686035, "global_step": 542251, "epoch": 6533} {"train_loss": -27.19373893737793, "global_step": 542252, "epoch": 6533} {"train_loss": -27.255374908447266, "global_step": 542253, "epoch": 6533} {"train_loss": -27.168445587158203, "global_step": 542254, "epoch": 6533} {"train_loss": -27.568872451782227, "global_step": 542255, "epoch": 6533} {"train_loss": -27.76075553894043, "global_step": 542256, "epoch": 6533} {"train_loss": -27.522363662719727, "global_step": 542257, "epoch": 6533} {"train_loss": -27.320165634155273, "global_step": 542258, "epoch": 6533} {"train_loss": -28.007001876831055, "global_step": 542259, "epoch": 6533} {"train_loss": -27.65223503112793, "global_step": 542260, "epoch": 6533} {"train_loss": -27.6096248626709, "global_step": 542261, "epoch": 6533} {"train_loss": -27.788354873657227, "global_step": 542262, "epoch": 6533} {"train_loss": -27.66129493713379, "global_step": 542263, "epoch": 6533} {"train_loss": -28.114133834838867, "global_step": 542264, "epoch": 6533} {"train_loss": -27.830488204956055, "global_step": 542265, "epoch": 6533} {"train_loss": -27.53730583190918, "global_step": 542266, "epoch": 6533} {"train_loss": -27.47303581237793, "global_step": 542267, "epoch": 6533} {"train_loss": -27.458730697631836, "global_step": 542268, "epoch": 6533} {"train_loss": -27.999082565307617, "global_step": 542269, "epoch": 6533} {"train_loss": -27.887975692749023, "global_step": 542270, "epoch": 6533} {"train_loss": -27.583898544311523, "global_step": 542271, "epoch": 6533} {"train_loss": -27.73836326599121, "global_step": 542272, "epoch": 6533} {"train_loss": -28.05759620666504, "global_step": 542273, "epoch": 6533} {"train_loss": -27.993606567382812, "global_step": 542274, "epoch": 6533} {"train_loss": -28.07330894470215, "global_step": 542275, "epoch": 6533} {"train_loss": -27.88368034362793, "global_step": 542276, "epoch": 6533} {"train_loss": -28.177337646484375, "global_step": 542277, "epoch": 6533} {"train_loss": -27.85382080078125, "global_step": 542278, "epoch": 6533} {"train_loss": -27.67097282409668, "global_step": 542279, "epoch": 6533} {"train_loss": -28.026447296142578, "global_step": 542280, "epoch": 6533} {"train_loss": -27.616092681884766, "global_step": 542281, "epoch": 6533} {"train_loss": -27.78143882751465, "global_step": 542282, "epoch": 6533} {"train_loss": -27.801437377929688, "global_step": 542283, "epoch": 6533} {"train_loss": -27.30305290222168, "global_step": 542284, "epoch": 6533} {"train_loss": -27.386022567749023, "global_step": 542285, "epoch": 6533} {"train_loss": -26.76338005065918, "global_step": 542286, "epoch": 6533} {"train_loss": -27.35828971862793, "global_step": 542287, "epoch": 6533} {"train_loss": -27.55523681640625, "global_step": 542288, "epoch": 6533} {"train_loss": -27.753173828125, "global_step": 542289, "epoch": 6533} {"train_loss": -27.87794303894043, "global_step": 542290, "epoch": 6533} {"train_loss": -27.54102897644043, "global_step": 542291, "epoch": 6533} {"train_loss": -27.214282989501953, "global_step": 542292, "epoch": 6533} {"train_loss": -27.48056983947754, "global_step": 542293, "epoch": 6533} {"train_loss": -27.582380294799805, "global_step": 542294, "epoch": 6533} {"train_loss": -27.725854873657227, "global_step": 542295, "epoch": 6533} {"train_loss": -27.294370651245117, "global_step": 542296, "epoch": 6533} {"train_loss": -27.65420913696289, "global_step": 542297, "epoch": 6533} {"train_loss": -27.623794555664062, "global_step": 542298, "epoch": 6533} {"train_loss": -28.1328182220459, "global_step": 542299, "epoch": 6533} {"train_loss": -27.44093132019043, "global_step": 542300, "epoch": 6533} {"train_loss": -27.640104293823242, "global_step": 542301, "epoch": 6533} {"train_loss": -27.347875595092773, "global_step": 542302, "epoch": 6533} {"train_loss": -27.753509521484375, "global_step": 542303, "epoch": 6533} {"train_loss": -27.66790771484375, "global_step": 542304, "epoch": 6533} {"train_loss": -27.806562423706055, "global_step": 542305, "epoch": 6533} {"train_loss": -27.844419479370117, "global_step": 542306, "epoch": 6533} {"train_loss": -27.673261642456055, "global_step": 542307, "epoch": 6533} {"train_loss": -27.782827377319336, "global_step": 542308, "epoch": 6533} {"train_loss": -27.753864288330078, "global_step": 542309, "epoch": 6533} {"train_loss": -27.723169326782227, "global_step": 542310, "epoch": 6533} {"train_loss": -27.51970863342285, "global_step": 542311, "epoch": 6533} {"train_loss": -27.882110595703125, "global_step": 542312, "epoch": 6533} {"train_loss": -28.122522354125977, "global_step": 542313, "epoch": 6533} {"train_loss": -27.593244552612305, "global_step": 542314, "epoch": 6533} {"train_loss": -27.891881942749023, "global_step": 542315, "epoch": 6533} {"train_loss": -27.761783599853516, "global_step": 542316, "epoch": 6533} {"train_loss": -28.2783260345459, "global_step": 542317, "epoch": 6533} {"train_loss": -28.208520889282227, "global_step": 542318, "epoch": 6533} {"train_loss": -27.91022300720215, "global_step": 542319, "epoch": 6533} {"train_loss": -27.977346420288086, "global_step": 542320, "epoch": 6533} {"train_loss": -27.65415166372276, "global_step": 542321, "epoch": 6533, "val_loss": 6507400.0} {"train_loss": -27.68490982055664, "global_step": 542322, "epoch": 6534} {"train_loss": -27.678333282470703, "global_step": 542323, "epoch": 6534} {"train_loss": -27.527679443359375, "global_step": 542324, "epoch": 6534} {"train_loss": -27.06263542175293, "global_step": 542325, "epoch": 6534} {"train_loss": -27.450428009033203, "global_step": 542326, "epoch": 6534} {"train_loss": -27.50801658630371, "global_step": 542327, "epoch": 6534} {"train_loss": -27.539560317993164, "global_step": 542328, "epoch": 6534} {"train_loss": -27.770294189453125, "global_step": 542329, "epoch": 6534} {"train_loss": -27.40620231628418, "global_step": 542330, "epoch": 6534} {"train_loss": -27.802444458007812, "global_step": 542331, "epoch": 6534} {"train_loss": -27.257678985595703, "global_step": 542332, "epoch": 6534} {"train_loss": -27.2717227935791, "global_step": 542333, "epoch": 6534} {"train_loss": -27.14947509765625, "global_step": 542334, "epoch": 6534} {"train_loss": -27.612232208251953, "global_step": 542335, "epoch": 6534} {"train_loss": -27.552845001220703, "global_step": 542336, "epoch": 6534} {"train_loss": -27.392908096313477, "global_step": 542337, "epoch": 6534} {"train_loss": -27.404972076416016, "global_step": 542338, "epoch": 6534} {"train_loss": -26.864675521850586, "global_step": 542339, "epoch": 6534} {"train_loss": -27.633392333984375, "global_step": 542340, "epoch": 6534} {"train_loss": -27.187030792236328, "global_step": 542341, "epoch": 6534} {"train_loss": -27.521350860595703, "global_step": 542342, "epoch": 6534} {"train_loss": -27.883031845092773, "global_step": 542343, "epoch": 6534} {"train_loss": -27.16779136657715, "global_step": 542344, "epoch": 6534} {"train_loss": -27.206226348876953, "global_step": 542345, "epoch": 6534} {"train_loss": -27.515884399414062, "global_step": 542346, "epoch": 6534} {"train_loss": -27.14312171936035, "global_step": 542347, "epoch": 6534} {"train_loss": -27.33551597595215, "global_step": 542348, "epoch": 6534} {"train_loss": -27.3375244140625, "global_step": 542349, "epoch": 6534} {"train_loss": -27.645246505737305, "global_step": 542350, "epoch": 6534} {"train_loss": -27.094757080078125, "global_step": 542351, "epoch": 6534} {"train_loss": -27.966150283813477, "global_step": 542352, "epoch": 6534} {"train_loss": -27.324975967407227, "global_step": 542353, "epoch": 6534} {"train_loss": -27.781091690063477, "global_step": 542354, "epoch": 6534} {"train_loss": -27.244550704956055, "global_step": 542355, "epoch": 6534} {"train_loss": -27.571842193603516, "global_step": 542356, "epoch": 6534} {"train_loss": -27.819629669189453, "global_step": 542357, "epoch": 6534} {"train_loss": -27.437902450561523, "global_step": 542358, "epoch": 6534} {"train_loss": -27.25201988220215, "global_step": 542359, "epoch": 6534} {"train_loss": -27.613052368164062, "global_step": 542360, "epoch": 6534} {"train_loss": -28.106281280517578, "global_step": 542361, "epoch": 6534} {"train_loss": -27.85637855529785, "global_step": 542362, "epoch": 6534} {"train_loss": -27.88800048828125, "global_step": 542363, "epoch": 6534} {"train_loss": -27.80079460144043, "global_step": 542364, "epoch": 6534} {"train_loss": -27.858854293823242, "global_step": 542365, "epoch": 6534} {"train_loss": -27.791528701782227, "global_step": 542366, "epoch": 6534} {"train_loss": -27.418363571166992, "global_step": 542367, "epoch": 6534} {"train_loss": -27.754682540893555, "global_step": 542368, "epoch": 6534} {"train_loss": -27.670568466186523, "global_step": 542369, "epoch": 6534} {"train_loss": -27.590576171875, "global_step": 542370, "epoch": 6534} {"train_loss": -28.101627349853516, "global_step": 542371, "epoch": 6534} {"train_loss": -27.81580924987793, "global_step": 542372, "epoch": 6534} {"train_loss": -27.788867950439453, "global_step": 542373, "epoch": 6534} {"train_loss": -27.951242446899414, "global_step": 542374, "epoch": 6534} {"train_loss": -27.636396408081055, "global_step": 542375, "epoch": 6534} {"train_loss": -27.839750289916992, "global_step": 542376, "epoch": 6534} {"train_loss": -27.61927604675293, "global_step": 542377, "epoch": 6534} {"train_loss": -27.499658584594727, "global_step": 542378, "epoch": 6534} {"train_loss": -27.893890380859375, "global_step": 542379, "epoch": 6534} {"train_loss": -27.8726863861084, "global_step": 542380, "epoch": 6534} {"train_loss": -28.00482177734375, "global_step": 542381, "epoch": 6534} {"train_loss": -27.620777130126953, "global_step": 542382, "epoch": 6534} {"train_loss": -27.387582778930664, "global_step": 542383, "epoch": 6534} {"train_loss": -27.8282413482666, "global_step": 542384, "epoch": 6534} {"train_loss": -27.875518798828125, "global_step": 542385, "epoch": 6534} {"train_loss": -27.507776260375977, "global_step": 542386, "epoch": 6534} {"train_loss": -27.400495529174805, "global_step": 542387, "epoch": 6534} {"train_loss": -27.566625595092773, "global_step": 542388, "epoch": 6534} {"train_loss": -27.860626220703125, "global_step": 542389, "epoch": 6534} {"train_loss": -27.39094352722168, "global_step": 542390, "epoch": 6534} {"train_loss": -27.544031143188477, "global_step": 542391, "epoch": 6534} {"train_loss": -27.350828170776367, "global_step": 542392, "epoch": 6534} {"train_loss": -27.562442779541016, "global_step": 542393, "epoch": 6534} {"train_loss": -27.798431396484375, "global_step": 542394, "epoch": 6534} {"train_loss": -27.266347885131836, "global_step": 542395, "epoch": 6534} {"train_loss": -28.045642852783203, "global_step": 542396, "epoch": 6534} {"train_loss": -27.6905460357666, "global_step": 542397, "epoch": 6534} {"train_loss": -27.45484733581543, "global_step": 542398, "epoch": 6534} {"train_loss": -27.943262100219727, "global_step": 542399, "epoch": 6534} {"train_loss": -27.471887588500977, "global_step": 542400, "epoch": 6534} {"train_loss": -27.369190216064453, "global_step": 542401, "epoch": 6534} {"train_loss": -27.463544845581055, "global_step": 542402, "epoch": 6534} {"train_loss": -27.248334884643555, "global_step": 542403, "epoch": 6534} {"train_loss": -27.56264854339232, "global_step": 542404, "epoch": 6534, "val_loss": 6465240.0} {"train_loss": -26.125959396362305, "global_step": 542405, "epoch": 6535} {"train_loss": -24.81891441345215, "global_step": 542406, "epoch": 6535} {"train_loss": -25.33416175842285, "global_step": 542407, "epoch": 6535} {"train_loss": -26.77984619140625, "global_step": 542408, "epoch": 6535} {"train_loss": -26.0205020904541, "global_step": 542409, "epoch": 6535} {"train_loss": -26.840036392211914, "global_step": 542410, "epoch": 6535} {"train_loss": -26.343717575073242, "global_step": 542411, "epoch": 6535} {"train_loss": -26.78742790222168, "global_step": 542412, "epoch": 6535} {"train_loss": -26.883548736572266, "global_step": 542413, "epoch": 6535} {"train_loss": -26.49741554260254, "global_step": 542414, "epoch": 6535} {"train_loss": -27.28799819946289, "global_step": 542415, "epoch": 6535} {"train_loss": -26.995086669921875, "global_step": 542416, "epoch": 6535} {"train_loss": -27.12088966369629, "global_step": 542417, "epoch": 6535} {"train_loss": -27.13067054748535, "global_step": 542418, "epoch": 6535} {"train_loss": -27.006750106811523, "global_step": 542419, "epoch": 6535} {"train_loss": -27.204925537109375, "global_step": 542420, "epoch": 6535} {"train_loss": -27.21746253967285, "global_step": 542421, "epoch": 6535} {"train_loss": -26.916259765625, "global_step": 542422, "epoch": 6535} {"train_loss": -27.21457290649414, "global_step": 542423, "epoch": 6535} {"train_loss": -27.45503044128418, "global_step": 542424, "epoch": 6535} {"train_loss": -27.268484115600586, "global_step": 542425, "epoch": 6535} {"train_loss": -27.456592559814453, "global_step": 542426, "epoch": 6535} {"train_loss": -27.508432388305664, "global_step": 542427, "epoch": 6535} {"train_loss": -27.278656005859375, "global_step": 542428, "epoch": 6535} {"train_loss": -27.49906349182129, "global_step": 542429, "epoch": 6535} {"train_loss": -27.022241592407227, "global_step": 542430, "epoch": 6535} {"train_loss": -27.22922706604004, "global_step": 542431, "epoch": 6535} {"train_loss": -27.486181259155273, "global_step": 542432, "epoch": 6535} {"train_loss": -27.3610782623291, "global_step": 542433, "epoch": 6535} {"train_loss": -27.3736629486084, "global_step": 542434, "epoch": 6535} {"train_loss": -27.732751846313477, "global_step": 542435, "epoch": 6535} {"train_loss": -27.152379989624023, "global_step": 542436, "epoch": 6535} {"train_loss": -27.224384307861328, "global_step": 542437, "epoch": 6535} {"train_loss": -27.278478622436523, "global_step": 542438, "epoch": 6535} {"train_loss": -27.6758975982666, "global_step": 542439, "epoch": 6535} {"train_loss": -27.558914184570312, "global_step": 542440, "epoch": 6535} {"train_loss": -27.746261596679688, "global_step": 542441, "epoch": 6535} {"train_loss": -27.574726104736328, "global_step": 542442, "epoch": 6535} {"train_loss": -27.676862716674805, "global_step": 542443, "epoch": 6535} {"train_loss": -27.37139320373535, "global_step": 542444, "epoch": 6535} {"train_loss": -27.626708984375, "global_step": 542445, "epoch": 6535} {"train_loss": -27.346755981445312, "global_step": 542446, "epoch": 6535} {"train_loss": -27.71388053894043, "global_step": 542447, "epoch": 6535} {"train_loss": -27.6615047454834, "global_step": 542448, "epoch": 6535} {"train_loss": -27.94964027404785, "global_step": 542449, "epoch": 6535} {"train_loss": -27.906076431274414, "global_step": 542450, "epoch": 6535} {"train_loss": -27.692052841186523, "global_step": 542451, "epoch": 6535} {"train_loss": -27.773298263549805, "global_step": 542452, "epoch": 6535} {"train_loss": -27.952442169189453, "global_step": 542453, "epoch": 6535} {"train_loss": -27.515302658081055, "global_step": 542454, "epoch": 6535} {"train_loss": -27.81925392150879, "global_step": 542455, "epoch": 6535} {"train_loss": -27.5194034576416, "global_step": 542456, "epoch": 6535} {"train_loss": -27.9472713470459, "global_step": 542457, "epoch": 6535} {"train_loss": -27.916858673095703, "global_step": 542458, "epoch": 6535} {"train_loss": -28.08635902404785, "global_step": 542459, "epoch": 6535} {"train_loss": -27.3787841796875, "global_step": 542460, "epoch": 6535} {"train_loss": -27.595754623413086, "global_step": 542461, "epoch": 6535} {"train_loss": -27.69053077697754, "global_step": 542462, "epoch": 6535} {"train_loss": -27.749954223632812, "global_step": 542463, "epoch": 6535} {"train_loss": -27.646265029907227, "global_step": 542464, "epoch": 6535} {"train_loss": -28.250934600830078, "global_step": 542465, "epoch": 6535} {"train_loss": -27.666004180908203, "global_step": 542466, "epoch": 6535} {"train_loss": -27.71023941040039, "global_step": 542467, "epoch": 6535} {"train_loss": -28.057819366455078, "global_step": 542468, "epoch": 6535} {"train_loss": -27.919620513916016, "global_step": 542469, "epoch": 6535} {"train_loss": -28.081892013549805, "global_step": 542470, "epoch": 6535} {"train_loss": -27.759557723999023, "global_step": 542471, "epoch": 6535} {"train_loss": -28.12293815612793, "global_step": 542472, "epoch": 6535} {"train_loss": -27.957977294921875, "global_step": 542473, "epoch": 6535} {"train_loss": -27.958881378173828, "global_step": 542474, "epoch": 6535} {"train_loss": -27.878686904907227, "global_step": 542475, "epoch": 6535} {"train_loss": -28.06220054626465, "global_step": 542476, "epoch": 6535} {"train_loss": -27.9835147857666, "global_step": 542477, "epoch": 6535} {"train_loss": -27.888219833374023, "global_step": 542478, "epoch": 6535} {"train_loss": -27.927515029907227, "global_step": 542479, "epoch": 6535} {"train_loss": -28.29220962524414, "global_step": 542480, "epoch": 6535} {"train_loss": -28.03436851501465, "global_step": 542481, "epoch": 6535} {"train_loss": -27.36505699157715, "global_step": 542482, "epoch": 6535} {"train_loss": -27.809345245361328, "global_step": 542483, "epoch": 6535} {"train_loss": -27.444019317626953, "global_step": 542484, "epoch": 6535} {"train_loss": -27.33380699157715, "global_step": 542485, "epoch": 6535} {"train_loss": -27.394922256469727, "global_step": 542486, "epoch": 6535} {"train_loss": -27.452160088412732, "global_step": 542487, "epoch": 6535, "val_loss": 6506632.0} {"train_loss": -25.755945205688477, "global_step": 542488, "epoch": 6536} {"train_loss": -25.14298439025879, "global_step": 542489, "epoch": 6536} {"train_loss": -24.199010848999023, "global_step": 542490, "epoch": 6536} {"train_loss": -26.048908233642578, "global_step": 542491, "epoch": 6536} {"train_loss": -25.533214569091797, "global_step": 542492, "epoch": 6536} {"train_loss": -26.675952911376953, "global_step": 542493, "epoch": 6536} {"train_loss": -25.96462059020996, "global_step": 542494, "epoch": 6536} {"train_loss": -26.04377555847168, "global_step": 542495, "epoch": 6536} {"train_loss": -26.545347213745117, "global_step": 542496, "epoch": 6536} {"train_loss": -26.63531494140625, "global_step": 542497, "epoch": 6536} {"train_loss": -26.496870040893555, "global_step": 542498, "epoch": 6536} {"train_loss": -27.063512802124023, "global_step": 542499, "epoch": 6536} {"train_loss": -26.738449096679688, "global_step": 542500, "epoch": 6536} {"train_loss": -26.97039222717285, "global_step": 542501, "epoch": 6536} {"train_loss": -26.7763729095459, "global_step": 542502, "epoch": 6536} {"train_loss": -26.993398666381836, "global_step": 542503, "epoch": 6536} {"train_loss": -26.804548263549805, "global_step": 542504, "epoch": 6536} {"train_loss": -26.8128662109375, "global_step": 542505, "epoch": 6536} {"train_loss": -26.773422241210938, "global_step": 542506, "epoch": 6536} {"train_loss": -27.073734283447266, "global_step": 542507, "epoch": 6536} {"train_loss": -27.030126571655273, "global_step": 542508, "epoch": 6536} {"train_loss": -27.108570098876953, "global_step": 542509, "epoch": 6536} {"train_loss": -26.61478042602539, "global_step": 542510, "epoch": 6536} {"train_loss": -27.043249130249023, "global_step": 542511, "epoch": 6536} {"train_loss": -27.281808853149414, "global_step": 542512, "epoch": 6536} {"train_loss": -26.99090576171875, "global_step": 542513, "epoch": 6536} {"train_loss": -26.942712783813477, "global_step": 542514, "epoch": 6536} {"train_loss": -27.0247802734375, "global_step": 542515, "epoch": 6536} {"train_loss": -27.094160079956055, "global_step": 542516, "epoch": 6536} {"train_loss": -27.060949325561523, "global_step": 542517, "epoch": 6536} {"train_loss": -27.480823516845703, "global_step": 542518, "epoch": 6536} {"train_loss": -27.444583892822266, "global_step": 542519, "epoch": 6536} {"train_loss": -27.544891357421875, "global_step": 542520, "epoch": 6536} {"train_loss": -27.197040557861328, "global_step": 542521, "epoch": 6536} {"train_loss": -27.37261962890625, "global_step": 542522, "epoch": 6536} {"train_loss": -27.5543155670166, "global_step": 542523, "epoch": 6536} {"train_loss": -27.402206420898438, "global_step": 542524, "epoch": 6536} {"train_loss": -27.715839385986328, "global_step": 542525, "epoch": 6536} {"train_loss": -27.3746395111084, "global_step": 542526, "epoch": 6536} {"train_loss": -27.50917625427246, "global_step": 542527, "epoch": 6536} {"train_loss": -27.72760581970215, "global_step": 542528, "epoch": 6536} {"train_loss": -27.84608268737793, "global_step": 542529, "epoch": 6536} {"train_loss": -27.613996505737305, "global_step": 542530, "epoch": 6536} {"train_loss": -27.475818634033203, "global_step": 542531, "epoch": 6536} {"train_loss": -27.41449546813965, "global_step": 542532, "epoch": 6536} {"train_loss": -27.564756393432617, "global_step": 542533, "epoch": 6536} {"train_loss": -27.370304107666016, "global_step": 542534, "epoch": 6536} {"train_loss": -27.804489135742188, "global_step": 542535, "epoch": 6536} {"train_loss": -27.631139755249023, "global_step": 542536, "epoch": 6536} {"train_loss": -27.801971435546875, "global_step": 542537, "epoch": 6536} {"train_loss": -28.105838775634766, "global_step": 542538, "epoch": 6536} {"train_loss": -27.661619186401367, "global_step": 542539, "epoch": 6536} {"train_loss": -27.825098037719727, "global_step": 542540, "epoch": 6536} {"train_loss": -27.329126358032227, "global_step": 542541, "epoch": 6536} {"train_loss": -27.942480087280273, "global_step": 542542, "epoch": 6536} {"train_loss": -27.94475746154785, "global_step": 542543, "epoch": 6536} {"train_loss": -27.96607780456543, "global_step": 542544, "epoch": 6536} {"train_loss": -28.072484970092773, "global_step": 542545, "epoch": 6536} {"train_loss": -28.16110610961914, "global_step": 542546, "epoch": 6536} {"train_loss": -27.50483512878418, "global_step": 542547, "epoch": 6536} {"train_loss": -27.84248924255371, "global_step": 542548, "epoch": 6536} {"train_loss": -27.68751335144043, "global_step": 542549, "epoch": 6536} {"train_loss": -27.884723663330078, "global_step": 542550, "epoch": 6536} {"train_loss": -27.37885093688965, "global_step": 542551, "epoch": 6536} {"train_loss": -27.070281982421875, "global_step": 542552, "epoch": 6536} {"train_loss": -27.434919357299805, "global_step": 542553, "epoch": 6536} {"train_loss": -27.408832550048828, "global_step": 542554, "epoch": 6536} {"train_loss": -26.857763290405273, "global_step": 542555, "epoch": 6536} {"train_loss": -27.335113525390625, "global_step": 542556, "epoch": 6536} {"train_loss": -27.093215942382812, "global_step": 542557, "epoch": 6536} {"train_loss": -27.6697998046875, "global_step": 542558, "epoch": 6536} {"train_loss": -27.13142204284668, "global_step": 542559, "epoch": 6536} {"train_loss": -27.33909034729004, "global_step": 542560, "epoch": 6536} {"train_loss": -27.327396392822266, "global_step": 542561, "epoch": 6536} {"train_loss": -27.354297637939453, "global_step": 542562, "epoch": 6536} {"train_loss": -27.40821647644043, "global_step": 542563, "epoch": 6536} {"train_loss": -27.652801513671875, "global_step": 542564, "epoch": 6536} {"train_loss": -27.36686134338379, "global_step": 542565, "epoch": 6536} {"train_loss": -27.826730728149414, "global_step": 542566, "epoch": 6536} {"train_loss": -27.818899154663086, "global_step": 542567, "epoch": 6536} {"train_loss": -27.609365463256836, "global_step": 542568, "epoch": 6536} {"train_loss": -27.37733268737793, "global_step": 542569, "epoch": 6536} {"train_loss": -27.197971091212995, "global_step": 542570, "epoch": 6536, "val_loss": 6599524.0} {"train_loss": -27.66826820373535, "global_step": 542571, "epoch": 6537} {"train_loss": -27.206151962280273, "global_step": 542572, "epoch": 6537} {"train_loss": -26.70624351501465, "global_step": 542573, "epoch": 6537} {"train_loss": -27.105960845947266, "global_step": 542574, "epoch": 6537} {"train_loss": -27.203479766845703, "global_step": 542575, "epoch": 6537} {"train_loss": -27.407651901245117, "global_step": 542576, "epoch": 6537} {"train_loss": -27.186649322509766, "global_step": 542577, "epoch": 6537} {"train_loss": -27.3184757232666, "global_step": 542578, "epoch": 6537} {"train_loss": -26.81610679626465, "global_step": 542579, "epoch": 6537} {"train_loss": -27.255619049072266, "global_step": 542580, "epoch": 6537} {"train_loss": -26.793136596679688, "global_step": 542581, "epoch": 6537} {"train_loss": -26.91744041442871, "global_step": 542582, "epoch": 6537} {"train_loss": -27.57911491394043, "global_step": 542583, "epoch": 6537} {"train_loss": -27.69600486755371, "global_step": 542584, "epoch": 6537} {"train_loss": -27.401870727539062, "global_step": 542585, "epoch": 6537} {"train_loss": -27.361974716186523, "global_step": 542586, "epoch": 6537} {"train_loss": -27.374658584594727, "global_step": 542587, "epoch": 6537} {"train_loss": -27.361297607421875, "global_step": 542588, "epoch": 6537} {"train_loss": -27.40254020690918, "global_step": 542589, "epoch": 6537} {"train_loss": -27.428176879882812, "global_step": 542590, "epoch": 6537} {"train_loss": -27.480188369750977, "global_step": 542591, "epoch": 6537} {"train_loss": -27.5982666015625, "global_step": 542592, "epoch": 6537} {"train_loss": -27.7178955078125, "global_step": 542593, "epoch": 6537} {"train_loss": -27.71857261657715, "global_step": 542594, "epoch": 6537} {"train_loss": -27.246448516845703, "global_step": 542595, "epoch": 6537} {"train_loss": -27.574970245361328, "global_step": 542596, "epoch": 6537} {"train_loss": -27.85892105102539, "global_step": 542597, "epoch": 6537} {"train_loss": -27.720853805541992, "global_step": 542598, "epoch": 6537} {"train_loss": -27.925067901611328, "global_step": 542599, "epoch": 6537} {"train_loss": -27.616352081298828, "global_step": 542600, "epoch": 6537} {"train_loss": -27.982519149780273, "global_step": 542601, "epoch": 6537} {"train_loss": -27.83200454711914, "global_step": 542602, "epoch": 6537} {"train_loss": -27.875696182250977, "global_step": 542603, "epoch": 6537} {"train_loss": -28.01911735534668, "global_step": 542604, "epoch": 6537} {"train_loss": -27.71016502380371, "global_step": 542605, "epoch": 6537} {"train_loss": -27.918508529663086, "global_step": 542606, "epoch": 6537} {"train_loss": -27.53797721862793, "global_step": 542607, "epoch": 6537} {"train_loss": -27.928075790405273, "global_step": 542608, "epoch": 6537} {"train_loss": -27.4743709564209, "global_step": 542609, "epoch": 6537} {"train_loss": -27.831945419311523, "global_step": 542610, "epoch": 6537} {"train_loss": -27.541976928710938, "global_step": 542611, "epoch": 6537} {"train_loss": -27.738012313842773, "global_step": 542612, "epoch": 6537} {"train_loss": -28.039480209350586, "global_step": 542613, "epoch": 6537} {"train_loss": -27.826129913330078, "global_step": 542614, "epoch": 6537} {"train_loss": -28.043867111206055, "global_step": 542615, "epoch": 6537} {"train_loss": -27.61838722229004, "global_step": 542616, "epoch": 6537} {"train_loss": -27.7091064453125, "global_step": 542617, "epoch": 6537} {"train_loss": -28.16205406188965, "global_step": 542618, "epoch": 6537} {"train_loss": -27.998281478881836, "global_step": 542619, "epoch": 6537} {"train_loss": -27.752294540405273, "global_step": 542620, "epoch": 6537} {"train_loss": -27.970600128173828, "global_step": 542621, "epoch": 6537} {"train_loss": -27.69046974182129, "global_step": 542622, "epoch": 6537} {"train_loss": -28.035364151000977, "global_step": 542623, "epoch": 6537} {"train_loss": -28.023828506469727, "global_step": 542624, "epoch": 6537} {"train_loss": -28.44821548461914, "global_step": 542625, "epoch": 6537} {"train_loss": -27.637601852416992, "global_step": 542626, "epoch": 6537} {"train_loss": -27.682485580444336, "global_step": 542627, "epoch": 6537} {"train_loss": -27.8510684967041, "global_step": 542628, "epoch": 6537} {"train_loss": -28.213546752929688, "global_step": 542629, "epoch": 6537} {"train_loss": -27.636518478393555, "global_step": 542630, "epoch": 6537} {"train_loss": -26.517786026000977, "global_step": 542631, "epoch": 6537} {"train_loss": -27.641021728515625, "global_step": 542632, "epoch": 6537} {"train_loss": -27.68617820739746, "global_step": 542633, "epoch": 6537} {"train_loss": -27.11032485961914, "global_step": 542634, "epoch": 6537} {"train_loss": -27.197834014892578, "global_step": 542635, "epoch": 6537} {"train_loss": -26.934309005737305, "global_step": 542636, "epoch": 6537} {"train_loss": -27.193561553955078, "global_step": 542637, "epoch": 6537} {"train_loss": -27.751916885375977, "global_step": 542638, "epoch": 6537} {"train_loss": -27.56403923034668, "global_step": 542639, "epoch": 6537} {"train_loss": -27.64584732055664, "global_step": 542640, "epoch": 6537} {"train_loss": -27.29768943786621, "global_step": 542641, "epoch": 6537} {"train_loss": -27.755084991455078, "global_step": 542642, "epoch": 6537} {"train_loss": -27.35382080078125, "global_step": 542643, "epoch": 6537} {"train_loss": -27.348724365234375, "global_step": 542644, "epoch": 6537} {"train_loss": -27.522781372070312, "global_step": 542645, "epoch": 6537} {"train_loss": -27.437891006469727, "global_step": 542646, "epoch": 6537} {"train_loss": -27.307052612304688, "global_step": 542647, "epoch": 6537} {"train_loss": -27.304996490478516, "global_step": 542648, "epoch": 6537} {"train_loss": -27.184814453125, "global_step": 542649, "epoch": 6537} {"train_loss": -27.392698287963867, "global_step": 542650, "epoch": 6537} {"train_loss": -26.8937931060791, "global_step": 542651, "epoch": 6537} {"train_loss": -27.336719512939453, "global_step": 542652, "epoch": 6537} {"train_loss": -27.53568906669157, "global_step": 542653, "epoch": 6537, "val_loss": 6531563.5} {"train_loss": -26.445037841796875, "global_step": 542654, "epoch": 6538} {"train_loss": -26.560699462890625, "global_step": 542655, "epoch": 6538} {"train_loss": -26.825727462768555, "global_step": 542656, "epoch": 6538} {"train_loss": -26.990875244140625, "global_step": 542657, "epoch": 6538} {"train_loss": -26.80840492248535, "global_step": 542658, "epoch": 6538} {"train_loss": -26.83404541015625, "global_step": 542659, "epoch": 6538} {"train_loss": -27.48968505859375, "global_step": 542660, "epoch": 6538} {"train_loss": -27.059362411499023, "global_step": 542661, "epoch": 6538} {"train_loss": -27.024564743041992, "global_step": 542662, "epoch": 6538} {"train_loss": -27.162109375, "global_step": 542663, "epoch": 6538} {"train_loss": -26.76239585876465, "global_step": 542664, "epoch": 6538} {"train_loss": -27.218271255493164, "global_step": 542665, "epoch": 6538} {"train_loss": -27.214889526367188, "global_step": 542666, "epoch": 6538} {"train_loss": -27.428312301635742, "global_step": 542667, "epoch": 6538} {"train_loss": -27.127912521362305, "global_step": 542668, "epoch": 6538} {"train_loss": -27.463226318359375, "global_step": 542669, "epoch": 6538} {"train_loss": -27.427549362182617, "global_step": 542670, "epoch": 6538} {"train_loss": -27.346044540405273, "global_step": 542671, "epoch": 6538} {"train_loss": -27.319177627563477, "global_step": 542672, "epoch": 6538} {"train_loss": -27.04360008239746, "global_step": 542673, "epoch": 6538} {"train_loss": -27.05376625061035, "global_step": 542674, "epoch": 6538} {"train_loss": -27.617691040039062, "global_step": 542675, "epoch": 6538} {"train_loss": -27.533248901367188, "global_step": 542676, "epoch": 6538} {"train_loss": -27.75994300842285, "global_step": 542677, "epoch": 6538} {"train_loss": -27.545392990112305, "global_step": 542678, "epoch": 6538} {"train_loss": -27.710128784179688, "global_step": 542679, "epoch": 6538} {"train_loss": -27.53647232055664, "global_step": 542680, "epoch": 6538} {"train_loss": -27.742431640625, "global_step": 542681, "epoch": 6538} {"train_loss": -27.54123306274414, "global_step": 542682, "epoch": 6538} {"train_loss": -27.703359603881836, "global_step": 542683, "epoch": 6538} {"train_loss": -27.437824249267578, "global_step": 542684, "epoch": 6538} {"train_loss": -27.978824615478516, "global_step": 542685, "epoch": 6538} {"train_loss": -27.652587890625, "global_step": 542686, "epoch": 6538} {"train_loss": -27.807239532470703, "global_step": 542687, "epoch": 6538} {"train_loss": -27.6314754486084, "global_step": 542688, "epoch": 6538} {"train_loss": -27.972997665405273, "global_step": 542689, "epoch": 6538} {"train_loss": -27.822345733642578, "global_step": 542690, "epoch": 6538} {"train_loss": -28.07038688659668, "global_step": 542691, "epoch": 6538} {"train_loss": -27.709253311157227, "global_step": 542692, "epoch": 6538} {"train_loss": -28.144628524780273, "global_step": 542693, "epoch": 6538} {"train_loss": -27.46942710876465, "global_step": 542694, "epoch": 6538} {"train_loss": -27.95462417602539, "global_step": 542695, "epoch": 6538} {"train_loss": -27.572891235351562, "global_step": 542696, "epoch": 6538} {"train_loss": -27.882726669311523, "global_step": 542697, "epoch": 6538} {"train_loss": -27.53473472595215, "global_step": 542698, "epoch": 6538} {"train_loss": -28.1112003326416, "global_step": 542699, "epoch": 6538} {"train_loss": -27.69365882873535, "global_step": 542700, "epoch": 6538} {"train_loss": -27.972869873046875, "global_step": 542701, "epoch": 6538} {"train_loss": -27.79120445251465, "global_step": 542702, "epoch": 6538} {"train_loss": -27.438745498657227, "global_step": 542703, "epoch": 6538} {"train_loss": -27.4919376373291, "global_step": 542704, "epoch": 6538} {"train_loss": -27.998685836791992, "global_step": 542705, "epoch": 6538} {"train_loss": -28.095849990844727, "global_step": 542706, "epoch": 6538} {"train_loss": -27.421676635742188, "global_step": 542707, "epoch": 6538} {"train_loss": -27.489429473876953, "global_step": 542708, "epoch": 6538} {"train_loss": -27.911712646484375, "global_step": 542709, "epoch": 6538} {"train_loss": -28.139490127563477, "global_step": 542710, "epoch": 6538} {"train_loss": -27.276357650756836, "global_step": 542711, "epoch": 6538} {"train_loss": -27.82537841796875, "global_step": 542712, "epoch": 6538} {"train_loss": -27.49921989440918, "global_step": 542713, "epoch": 6538} {"train_loss": -27.33705711364746, "global_step": 542714, "epoch": 6538} {"train_loss": -27.678970336914062, "global_step": 542715, "epoch": 6538} {"train_loss": -27.56317138671875, "global_step": 542716, "epoch": 6538} {"train_loss": -27.2677059173584, "global_step": 542717, "epoch": 6538} {"train_loss": -27.555938720703125, "global_step": 542718, "epoch": 6538} {"train_loss": -27.595874786376953, "global_step": 542719, "epoch": 6538} {"train_loss": -27.7072811126709, "global_step": 542720, "epoch": 6538} {"train_loss": -27.4814510345459, "global_step": 542721, "epoch": 6538} {"train_loss": -27.517196655273438, "global_step": 542722, "epoch": 6538} {"train_loss": -27.82525062561035, "global_step": 542723, "epoch": 6538} {"train_loss": -27.831268310546875, "global_step": 542724, "epoch": 6538} {"train_loss": -27.74128532409668, "global_step": 542725, "epoch": 6538} {"train_loss": -27.83180046081543, "global_step": 542726, "epoch": 6538} {"train_loss": -27.824390411376953, "global_step": 542727, "epoch": 6538} {"train_loss": -27.854948043823242, "global_step": 542728, "epoch": 6538} {"train_loss": -27.832244873046875, "global_step": 542729, "epoch": 6538} {"train_loss": -27.507938385009766, "global_step": 542730, "epoch": 6538} {"train_loss": -27.814722061157227, "global_step": 542731, "epoch": 6538} {"train_loss": -27.870288848876953, "global_step": 542732, "epoch": 6538} {"train_loss": -27.75174331665039, "global_step": 542733, "epoch": 6538} {"train_loss": -28.128408432006836, "global_step": 542734, "epoch": 6538} {"train_loss": -27.452665328979492, "global_step": 542735, "epoch": 6538} {"train_loss": -27.55866172514766, "global_step": 542736, "epoch": 6538, "val_loss": 6507123.5} {"train_loss": -27.043670654296875, "global_step": 542737, "epoch": 6539} {"train_loss": -27.279504776000977, "global_step": 542738, "epoch": 6539} {"train_loss": -26.862213134765625, "global_step": 542739, "epoch": 6539} {"train_loss": -27.358068466186523, "global_step": 542740, "epoch": 6539} {"train_loss": -27.065649032592773, "global_step": 542741, "epoch": 6539} {"train_loss": -27.2675724029541, "global_step": 542742, "epoch": 6539} {"train_loss": -26.93494987487793, "global_step": 542743, "epoch": 6539} {"train_loss": -27.66635513305664, "global_step": 542744, "epoch": 6539} {"train_loss": -27.282068252563477, "global_step": 542745, "epoch": 6539} {"train_loss": -27.14239501953125, "global_step": 542746, "epoch": 6539} {"train_loss": -27.2502498626709, "global_step": 542747, "epoch": 6539} {"train_loss": -27.43413734436035, "global_step": 542748, "epoch": 6539} {"train_loss": -27.3377628326416, "global_step": 542749, "epoch": 6539} {"train_loss": -27.623056411743164, "global_step": 542750, "epoch": 6539} {"train_loss": -27.123991012573242, "global_step": 542751, "epoch": 6539} {"train_loss": -27.78647804260254, "global_step": 542752, "epoch": 6539} {"train_loss": -27.708942413330078, "global_step": 542753, "epoch": 6539} {"train_loss": -27.5157527923584, "global_step": 542754, "epoch": 6539} {"train_loss": -27.045026779174805, "global_step": 542755, "epoch": 6539} {"train_loss": -27.65728759765625, "global_step": 542756, "epoch": 6539} {"train_loss": -27.561023712158203, "global_step": 542757, "epoch": 6539} {"train_loss": -27.89045524597168, "global_step": 542758, "epoch": 6539} {"train_loss": -27.682758331298828, "global_step": 542759, "epoch": 6539} {"train_loss": -27.723663330078125, "global_step": 542760, "epoch": 6539} {"train_loss": -27.92476463317871, "global_step": 542761, "epoch": 6539} {"train_loss": -27.3391170501709, "global_step": 542762, "epoch": 6539} {"train_loss": -27.710620880126953, "global_step": 542763, "epoch": 6539} {"train_loss": -27.604373931884766, "global_step": 542764, "epoch": 6539} {"train_loss": -27.839475631713867, "global_step": 542765, "epoch": 6539} {"train_loss": -27.542236328125, "global_step": 542766, "epoch": 6539} {"train_loss": -27.594587326049805, "global_step": 542767, "epoch": 6539} {"train_loss": -27.31021499633789, "global_step": 542768, "epoch": 6539} {"train_loss": -27.50287437438965, "global_step": 542769, "epoch": 6539} {"train_loss": -27.77919578552246, "global_step": 542770, "epoch": 6539} {"train_loss": -27.507556915283203, "global_step": 542771, "epoch": 6539} {"train_loss": -27.61085319519043, "global_step": 542772, "epoch": 6539} {"train_loss": -27.504011154174805, "global_step": 542773, "epoch": 6539} {"train_loss": -28.097614288330078, "global_step": 542774, "epoch": 6539} {"train_loss": -27.854507446289062, "global_step": 542775, "epoch": 6539} {"train_loss": -27.958389282226562, "global_step": 542776, "epoch": 6539} {"train_loss": -27.964374542236328, "global_step": 542777, "epoch": 6539} {"train_loss": -27.727008819580078, "global_step": 542778, "epoch": 6539} {"train_loss": -27.58416748046875, "global_step": 542779, "epoch": 6539} {"train_loss": -27.61785888671875, "global_step": 542780, "epoch": 6539} {"train_loss": -27.819299697875977, "global_step": 542781, "epoch": 6539} {"train_loss": -27.749204635620117, "global_step": 542782, "epoch": 6539} {"train_loss": -28.02359390258789, "global_step": 542783, "epoch": 6539} {"train_loss": -27.95057487487793, "global_step": 542784, "epoch": 6539} {"train_loss": -27.6047306060791, "global_step": 542785, "epoch": 6539} {"train_loss": -27.970977783203125, "global_step": 542786, "epoch": 6539} {"train_loss": -28.006017684936523, "global_step": 542787, "epoch": 6539} {"train_loss": -28.0743350982666, "global_step": 542788, "epoch": 6539} {"train_loss": -27.651214599609375, "global_step": 542789, "epoch": 6539} {"train_loss": -27.698572158813477, "global_step": 542790, "epoch": 6539} {"train_loss": -28.153234481811523, "global_step": 542791, "epoch": 6539} {"train_loss": -27.15458106994629, "global_step": 542792, "epoch": 6539} {"train_loss": -27.278018951416016, "global_step": 542793, "epoch": 6539} {"train_loss": -27.541105270385742, "global_step": 542794, "epoch": 6539} {"train_loss": -27.580121994018555, "global_step": 542795, "epoch": 6539} {"train_loss": -27.83169937133789, "global_step": 542796, "epoch": 6539} {"train_loss": -27.855670928955078, "global_step": 542797, "epoch": 6539} {"train_loss": -27.50807762145996, "global_step": 542798, "epoch": 6539} {"train_loss": -28.13112449645996, "global_step": 542799, "epoch": 6539} {"train_loss": -27.640844345092773, "global_step": 542800, "epoch": 6539} {"train_loss": -27.8617000579834, "global_step": 542801, "epoch": 6539} {"train_loss": -27.61628532409668, "global_step": 542802, "epoch": 6539} {"train_loss": -27.70362663269043, "global_step": 542803, "epoch": 6539} {"train_loss": -27.820154190063477, "global_step": 542804, "epoch": 6539} {"train_loss": -27.33965492248535, "global_step": 542805, "epoch": 6539} {"train_loss": -27.974409103393555, "global_step": 542806, "epoch": 6539} {"train_loss": -27.505407333374023, "global_step": 542807, "epoch": 6539} {"train_loss": -27.9382381439209, "global_step": 542808, "epoch": 6539} {"train_loss": -27.97751808166504, "global_step": 542809, "epoch": 6539} {"train_loss": -27.774682998657227, "global_step": 542810, "epoch": 6539} {"train_loss": -27.999235153198242, "global_step": 542811, "epoch": 6539} {"train_loss": -27.579389572143555, "global_step": 542812, "epoch": 6539} {"train_loss": -27.6141357421875, "global_step": 542813, "epoch": 6539} {"train_loss": -27.933805465698242, "global_step": 542814, "epoch": 6539} {"train_loss": -28.026208877563477, "global_step": 542815, "epoch": 6539} {"train_loss": -27.57154655456543, "global_step": 542816, "epoch": 6539} {"train_loss": -27.73969841003418, "global_step": 542817, "epoch": 6539} {"train_loss": -27.840192794799805, "global_step": 542818, "epoch": 6539} {"train_loss": -27.61846625086773, "global_step": 542819, "epoch": 6539, "val_loss": 6521014.0} {"train_loss": -27.472888946533203, "global_step": 542820, "epoch": 6540} {"train_loss": -26.594715118408203, "global_step": 542821, "epoch": 6540} {"train_loss": -26.660139083862305, "global_step": 542822, "epoch": 6540} {"train_loss": -27.27362632751465, "global_step": 542823, "epoch": 6540} {"train_loss": -27.40620994567871, "global_step": 542824, "epoch": 6540} {"train_loss": -27.147607803344727, "global_step": 542825, "epoch": 6540} {"train_loss": -27.140949249267578, "global_step": 542826, "epoch": 6540} {"train_loss": -27.43665885925293, "global_step": 542827, "epoch": 6540} {"train_loss": -26.998075485229492, "global_step": 542828, "epoch": 6540} {"train_loss": -27.573184967041016, "global_step": 542829, "epoch": 6540} {"train_loss": -27.117862701416016, "global_step": 542830, "epoch": 6540} {"train_loss": -27.37052345275879, "global_step": 542831, "epoch": 6540} {"train_loss": -27.261749267578125, "global_step": 542832, "epoch": 6540} {"train_loss": -27.5396671295166, "global_step": 542833, "epoch": 6540} {"train_loss": -27.316497802734375, "global_step": 542834, "epoch": 6540} {"train_loss": -27.535247802734375, "global_step": 542835, "epoch": 6540} {"train_loss": -27.155029296875, "global_step": 542836, "epoch": 6540} {"train_loss": -27.43863868713379, "global_step": 542837, "epoch": 6540} {"train_loss": -27.334766387939453, "global_step": 542838, "epoch": 6540} {"train_loss": -26.8818302154541, "global_step": 542839, "epoch": 6540} {"train_loss": -27.198511123657227, "global_step": 542840, "epoch": 6540} {"train_loss": -27.23409080505371, "global_step": 542841, "epoch": 6540} {"train_loss": -27.10593605041504, "global_step": 542842, "epoch": 6540} {"train_loss": -27.316328048706055, "global_step": 542843, "epoch": 6540} {"train_loss": -27.304779052734375, "global_step": 542844, "epoch": 6540} {"train_loss": -27.307666778564453, "global_step": 542845, "epoch": 6540} {"train_loss": -27.265165328979492, "global_step": 542846, "epoch": 6540} {"train_loss": -27.33687400817871, "global_step": 542847, "epoch": 6540} {"train_loss": -27.78583335876465, "global_step": 542848, "epoch": 6540} {"train_loss": -27.613128662109375, "global_step": 542849, "epoch": 6540} {"train_loss": -27.689905166625977, "global_step": 542850, "epoch": 6540} {"train_loss": -27.611831665039062, "global_step": 542851, "epoch": 6540} {"train_loss": -27.594867706298828, "global_step": 542852, "epoch": 6540} {"train_loss": -27.358983993530273, "global_step": 542853, "epoch": 6540} {"train_loss": -27.559127807617188, "global_step": 542854, "epoch": 6540} {"train_loss": -27.734342575073242, "global_step": 542855, "epoch": 6540} {"train_loss": -27.68770408630371, "global_step": 542856, "epoch": 6540} {"train_loss": -27.545923233032227, "global_step": 542857, "epoch": 6540} {"train_loss": -27.457563400268555, "global_step": 542858, "epoch": 6540} {"train_loss": -27.47210121154785, "global_step": 542859, "epoch": 6540} {"train_loss": -27.71223258972168, "global_step": 542860, "epoch": 6540} {"train_loss": -27.34832191467285, "global_step": 542861, "epoch": 6540} {"train_loss": -28.059555053710938, "global_step": 542862, "epoch": 6540} {"train_loss": -27.658187866210938, "global_step": 542863, "epoch": 6540} {"train_loss": -27.563282012939453, "global_step": 542864, "epoch": 6540} {"train_loss": -27.74580192565918, "global_step": 542865, "epoch": 6540} {"train_loss": -27.40093421936035, "global_step": 542866, "epoch": 6540} {"train_loss": -27.497236251831055, "global_step": 542867, "epoch": 6540} {"train_loss": -27.243879318237305, "global_step": 542868, "epoch": 6540} {"train_loss": -27.988142013549805, "global_step": 542869, "epoch": 6540} {"train_loss": -27.314807891845703, "global_step": 542870, "epoch": 6540} {"train_loss": -27.324819564819336, "global_step": 542871, "epoch": 6540} {"train_loss": -27.813940048217773, "global_step": 542872, "epoch": 6540} {"train_loss": -27.93552017211914, "global_step": 542873, "epoch": 6540} {"train_loss": -27.948026657104492, "global_step": 542874, "epoch": 6540} {"train_loss": -27.579126358032227, "global_step": 542875, "epoch": 6540} {"train_loss": -27.854339599609375, "global_step": 542876, "epoch": 6540} {"train_loss": -27.40439224243164, "global_step": 542877, "epoch": 6540} {"train_loss": -27.685291290283203, "global_step": 542878, "epoch": 6540} {"train_loss": -27.64552116394043, "global_step": 542879, "epoch": 6540} {"train_loss": -27.63983726501465, "global_step": 542880, "epoch": 6540} {"train_loss": -27.77027702331543, "global_step": 542881, "epoch": 6540} {"train_loss": -27.521347045898438, "global_step": 542882, "epoch": 6540} {"train_loss": -27.784942626953125, "global_step": 542883, "epoch": 6540} {"train_loss": -27.630416870117188, "global_step": 542884, "epoch": 6540} {"train_loss": -27.86094093322754, "global_step": 542885, "epoch": 6540} {"train_loss": -27.857837677001953, "global_step": 542886, "epoch": 6540} {"train_loss": -28.01388931274414, "global_step": 542887, "epoch": 6540} {"train_loss": -27.915475845336914, "global_step": 542888, "epoch": 6540} {"train_loss": -27.900060653686523, "global_step": 542889, "epoch": 6540} {"train_loss": -27.885467529296875, "global_step": 542890, "epoch": 6540} {"train_loss": -27.815587997436523, "global_step": 542891, "epoch": 6540} {"train_loss": -27.89460563659668, "global_step": 542892, "epoch": 6540} {"train_loss": -28.127368927001953, "global_step": 542893, "epoch": 6540} {"train_loss": -27.716449737548828, "global_step": 542894, "epoch": 6540} {"train_loss": -27.784137725830078, "global_step": 542895, "epoch": 6540} {"train_loss": -27.312891006469727, "global_step": 542896, "epoch": 6540} {"train_loss": -26.932058334350586, "global_step": 542897, "epoch": 6540} {"train_loss": -27.44484519958496, "global_step": 542898, "epoch": 6540} {"train_loss": -27.84136962890625, "global_step": 542899, "epoch": 6540} {"train_loss": -26.94219970703125, "global_step": 542900, "epoch": 6540} {"train_loss": -26.56117057800293, "global_step": 542901, "epoch": 6540} {"train_loss": -27.487562386386365, "global_step": 542902, "epoch": 6540, "val_loss": 6562174.0} {"train_loss": -27.2147216796875, "global_step": 542903, "epoch": 6541} {"train_loss": -26.92609977722168, "global_step": 542904, "epoch": 6541} {"train_loss": -27.066518783569336, "global_step": 542905, "epoch": 6541} {"train_loss": -26.300174713134766, "global_step": 542906, "epoch": 6541} {"train_loss": -26.363433837890625, "global_step": 542907, "epoch": 6541} {"train_loss": -26.570371627807617, "global_step": 542908, "epoch": 6541} {"train_loss": -26.921024322509766, "global_step": 542909, "epoch": 6541} {"train_loss": -26.972623825073242, "global_step": 542910, "epoch": 6541} {"train_loss": -27.002050399780273, "global_step": 542911, "epoch": 6541} {"train_loss": -27.349889755249023, "global_step": 542912, "epoch": 6541} {"train_loss": -27.034574508666992, "global_step": 542913, "epoch": 6541} {"train_loss": -27.353931427001953, "global_step": 542914, "epoch": 6541} {"train_loss": -27.18134880065918, "global_step": 542915, "epoch": 6541} {"train_loss": -27.309507369995117, "global_step": 542916, "epoch": 6541} {"train_loss": -26.936079025268555, "global_step": 542917, "epoch": 6541} {"train_loss": -27.57810401916504, "global_step": 542918, "epoch": 6541} {"train_loss": -27.256982803344727, "global_step": 542919, "epoch": 6541} {"train_loss": -27.548974990844727, "global_step": 542920, "epoch": 6541} {"train_loss": -27.159570693969727, "global_step": 542921, "epoch": 6541} {"train_loss": -27.266529083251953, "global_step": 542922, "epoch": 6541} {"train_loss": -27.079761505126953, "global_step": 542923, "epoch": 6541} {"train_loss": -27.53912925720215, "global_step": 542924, "epoch": 6541} {"train_loss": -27.757604598999023, "global_step": 542925, "epoch": 6541} {"train_loss": -27.477575302124023, "global_step": 542926, "epoch": 6541} {"train_loss": -27.869718551635742, "global_step": 542927, "epoch": 6541} {"train_loss": -27.728925704956055, "global_step": 542928, "epoch": 6541} {"train_loss": -27.664941787719727, "global_step": 542929, "epoch": 6541} {"train_loss": -27.62660026550293, "global_step": 542930, "epoch": 6541} {"train_loss": -27.14862060546875, "global_step": 542931, "epoch": 6541} {"train_loss": -27.653379440307617, "global_step": 542932, "epoch": 6541} {"train_loss": -27.55716896057129, "global_step": 542933, "epoch": 6541} {"train_loss": -27.6823787689209, "global_step": 542934, "epoch": 6541} {"train_loss": -27.705625534057617, "global_step": 542935, "epoch": 6541} {"train_loss": -27.830585479736328, "global_step": 542936, "epoch": 6541} {"train_loss": -27.824752807617188, "global_step": 542937, "epoch": 6541} {"train_loss": -27.593732833862305, "global_step": 542938, "epoch": 6541} {"train_loss": -27.8179874420166, "global_step": 542939, "epoch": 6541} {"train_loss": -27.8103084564209, "global_step": 542940, "epoch": 6541} {"train_loss": -27.664047241210938, "global_step": 542941, "epoch": 6541} {"train_loss": -28.01991844177246, "global_step": 542942, "epoch": 6541} {"train_loss": -27.740991592407227, "global_step": 542943, "epoch": 6541} {"train_loss": -27.680585861206055, "global_step": 542944, "epoch": 6541} {"train_loss": -27.51971435546875, "global_step": 542945, "epoch": 6541} {"train_loss": -27.822906494140625, "global_step": 542946, "epoch": 6541} {"train_loss": -27.677331924438477, "global_step": 542947, "epoch": 6541} {"train_loss": -27.420825958251953, "global_step": 542948, "epoch": 6541} {"train_loss": -27.688892364501953, "global_step": 542949, "epoch": 6541} {"train_loss": -28.10030174255371, "global_step": 542950, "epoch": 6541} {"train_loss": -27.5423526763916, "global_step": 542951, "epoch": 6541} {"train_loss": -27.977231979370117, "global_step": 542952, "epoch": 6541} {"train_loss": -28.124921798706055, "global_step": 542953, "epoch": 6541} {"train_loss": -27.64063835144043, "global_step": 542954, "epoch": 6541} {"train_loss": -27.77984619140625, "global_step": 542955, "epoch": 6541} {"train_loss": -28.043912887573242, "global_step": 542956, "epoch": 6541} {"train_loss": -27.7740421295166, "global_step": 542957, "epoch": 6541} {"train_loss": -27.541357040405273, "global_step": 542958, "epoch": 6541} {"train_loss": -27.833820343017578, "global_step": 542959, "epoch": 6541} {"train_loss": -28.130842208862305, "global_step": 542960, "epoch": 6541} {"train_loss": -28.006851196289062, "global_step": 542961, "epoch": 6541} {"train_loss": -28.218509674072266, "global_step": 542962, "epoch": 6541} {"train_loss": -27.897674560546875, "global_step": 542963, "epoch": 6541} {"train_loss": -27.454160690307617, "global_step": 542964, "epoch": 6541} {"train_loss": -27.37664794921875, "global_step": 542965, "epoch": 6541} {"train_loss": -27.6917667388916, "global_step": 542966, "epoch": 6541} {"train_loss": -28.060171127319336, "global_step": 542967, "epoch": 6541} {"train_loss": -27.608367919921875, "global_step": 542968, "epoch": 6541} {"train_loss": -27.970401763916016, "global_step": 542969, "epoch": 6541} {"train_loss": -27.59574317932129, "global_step": 542970, "epoch": 6541} {"train_loss": -28.061994552612305, "global_step": 542971, "epoch": 6541} {"train_loss": -27.568994522094727, "global_step": 542972, "epoch": 6541} {"train_loss": -27.78034782409668, "global_step": 542973, "epoch": 6541} {"train_loss": -27.576339721679688, "global_step": 542974, "epoch": 6541} {"train_loss": -27.32659339904785, "global_step": 542975, "epoch": 6541} {"train_loss": -27.3699893951416, "global_step": 542976, "epoch": 6541} {"train_loss": -27.69350242614746, "global_step": 542977, "epoch": 6541} {"train_loss": -27.269123077392578, "global_step": 542978, "epoch": 6541} {"train_loss": -27.04193115234375, "global_step": 542979, "epoch": 6541} {"train_loss": -27.292646408081055, "global_step": 542980, "epoch": 6541} {"train_loss": -27.53570556640625, "global_step": 542981, "epoch": 6541} {"train_loss": -27.309961318969727, "global_step": 542982, "epoch": 6541} {"train_loss": -27.183795928955078, "global_step": 542983, "epoch": 6541} {"train_loss": -27.534143447875977, "global_step": 542984, "epoch": 6541} {"train_loss": -27.514794315200255, "global_step": 542985, "epoch": 6541, "val_loss": 6490910.0} {"train_loss": -26.67536735534668, "global_step": 542986, "epoch": 6542} {"train_loss": -26.19939613342285, "global_step": 542987, "epoch": 6542} {"train_loss": -26.35584831237793, "global_step": 542988, "epoch": 6542} {"train_loss": -26.743289947509766, "global_step": 542989, "epoch": 6542} {"train_loss": -27.094324111938477, "global_step": 542990, "epoch": 6542} {"train_loss": -26.880857467651367, "global_step": 542991, "epoch": 6542} {"train_loss": -26.726789474487305, "global_step": 542992, "epoch": 6542} {"train_loss": -27.24484634399414, "global_step": 542993, "epoch": 6542} {"train_loss": -26.8220272064209, "global_step": 542994, "epoch": 6542} {"train_loss": -27.29501724243164, "global_step": 542995, "epoch": 6542} {"train_loss": -27.264240264892578, "global_step": 542996, "epoch": 6542} {"train_loss": -27.03875160217285, "global_step": 542997, "epoch": 6542} {"train_loss": -26.9647216796875, "global_step": 542998, "epoch": 6542} {"train_loss": -27.368017196655273, "global_step": 542999, "epoch": 6542} {"train_loss": -27.19011878967285, "global_step": 543000, "epoch": 6542} {"train_loss": -27.1878719329834, "global_step": 543001, "epoch": 6542} {"train_loss": -27.48406410217285, "global_step": 543002, "epoch": 6542} {"train_loss": -27.628137588500977, "global_step": 543003, "epoch": 6542} {"train_loss": -27.735448837280273, "global_step": 543004, "epoch": 6542} {"train_loss": -27.57386589050293, "global_step": 543005, "epoch": 6542} {"train_loss": -27.77692985534668, "global_step": 543006, "epoch": 6542} {"train_loss": -27.657739639282227, "global_step": 543007, "epoch": 6542} {"train_loss": -27.73046875, "global_step": 543008, "epoch": 6542} {"train_loss": -27.111597061157227, "global_step": 543009, "epoch": 6542} {"train_loss": -27.212482452392578, "global_step": 543010, "epoch": 6542} {"train_loss": -27.33099937438965, "global_step": 543011, "epoch": 6542} {"train_loss": -27.84259605407715, "global_step": 543012, "epoch": 6542} {"train_loss": -27.663196563720703, "global_step": 543013, "epoch": 6542} {"train_loss": -27.79493522644043, "global_step": 543014, "epoch": 6542} {"train_loss": -27.49091911315918, "global_step": 543015, "epoch": 6542} {"train_loss": -28.276844024658203, "global_step": 543016, "epoch": 6542} {"train_loss": -27.53861427307129, "global_step": 543017, "epoch": 6542} {"train_loss": -27.65094566345215, "global_step": 543018, "epoch": 6542} {"train_loss": -27.828887939453125, "global_step": 543019, "epoch": 6542} {"train_loss": -28.072086334228516, "global_step": 543020, "epoch": 6542} {"train_loss": -27.60039710998535, "global_step": 543021, "epoch": 6542} {"train_loss": -27.633569717407227, "global_step": 543022, "epoch": 6542} {"train_loss": -27.94406509399414, "global_step": 543023, "epoch": 6542} {"train_loss": -27.853422164916992, "global_step": 543024, "epoch": 6542} {"train_loss": -27.71552085876465, "global_step": 543025, "epoch": 6542} {"train_loss": -27.875396728515625, "global_step": 543026, "epoch": 6542} {"train_loss": -27.812530517578125, "global_step": 543027, "epoch": 6542} {"train_loss": -28.020002365112305, "global_step": 543028, "epoch": 6542} {"train_loss": -27.98674964904785, "global_step": 543029, "epoch": 6542} {"train_loss": -27.700977325439453, "global_step": 543030, "epoch": 6542} {"train_loss": -27.31366539001465, "global_step": 543031, "epoch": 6542} {"train_loss": -27.93352699279785, "global_step": 543032, "epoch": 6542} {"train_loss": -27.702878952026367, "global_step": 543033, "epoch": 6542} {"train_loss": -27.722919464111328, "global_step": 543034, "epoch": 6542} {"train_loss": -28.047109603881836, "global_step": 543035, "epoch": 6542} {"train_loss": -28.1549015045166, "global_step": 543036, "epoch": 6542} {"train_loss": -27.723865509033203, "global_step": 543037, "epoch": 6542} {"train_loss": -28.174835205078125, "global_step": 543038, "epoch": 6542} {"train_loss": -28.347248077392578, "global_step": 543039, "epoch": 6542} {"train_loss": -27.60188102722168, "global_step": 543040, "epoch": 6542} {"train_loss": -27.64521598815918, "global_step": 543041, "epoch": 6542} {"train_loss": -27.554502487182617, "global_step": 543042, "epoch": 6542} {"train_loss": -27.611862182617188, "global_step": 543043, "epoch": 6542} {"train_loss": -27.869781494140625, "global_step": 543044, "epoch": 6542} {"train_loss": -27.643787384033203, "global_step": 543045, "epoch": 6542} {"train_loss": -27.62738037109375, "global_step": 543046, "epoch": 6542} {"train_loss": -27.776172637939453, "global_step": 543047, "epoch": 6542} {"train_loss": -27.395200729370117, "global_step": 543048, "epoch": 6542} {"train_loss": -27.905820846557617, "global_step": 543049, "epoch": 6542} {"train_loss": -27.493520736694336, "global_step": 543050, "epoch": 6542} {"train_loss": -27.70710563659668, "global_step": 543051, "epoch": 6542} {"train_loss": -27.781354904174805, "global_step": 543052, "epoch": 6542} {"train_loss": -27.58342933654785, "global_step": 543053, "epoch": 6542} {"train_loss": -27.6566162109375, "global_step": 543054, "epoch": 6542} {"train_loss": -27.455331802368164, "global_step": 543055, "epoch": 6542} {"train_loss": -27.639684677124023, "global_step": 543056, "epoch": 6542} {"train_loss": -27.533050537109375, "global_step": 543057, "epoch": 6542} {"train_loss": -27.47731590270996, "global_step": 543058, "epoch": 6542} {"train_loss": -27.766935348510742, "global_step": 543059, "epoch": 6542} {"train_loss": -27.724628448486328, "global_step": 543060, "epoch": 6542} {"train_loss": -27.33740234375, "global_step": 543061, "epoch": 6542} {"train_loss": -27.67063331604004, "global_step": 543062, "epoch": 6542} {"train_loss": -27.472721099853516, "global_step": 543063, "epoch": 6542} {"train_loss": -27.700376510620117, "global_step": 543064, "epoch": 6542} {"train_loss": -27.27027702331543, "global_step": 543065, "epoch": 6542} {"train_loss": -27.125762939453125, "global_step": 543066, "epoch": 6542} {"train_loss": -26.866437911987305, "global_step": 543067, "epoch": 6542} {"train_loss": -27.541928187910333, "global_step": 543068, "epoch": 6542, "val_loss": 6524874.0} {"train_loss": -26.7565860748291, "global_step": 543069, "epoch": 6543} {"train_loss": -26.48846435546875, "global_step": 543070, "epoch": 6543} {"train_loss": -27.6329345703125, "global_step": 543071, "epoch": 6543} {"train_loss": -26.992395401000977, "global_step": 543072, "epoch": 6543} {"train_loss": -26.682025909423828, "global_step": 543073, "epoch": 6543} {"train_loss": -27.46306800842285, "global_step": 543074, "epoch": 6543} {"train_loss": -26.47450828552246, "global_step": 543075, "epoch": 6543} {"train_loss": -27.202917098999023, "global_step": 543076, "epoch": 6543} {"train_loss": -26.87237548828125, "global_step": 543077, "epoch": 6543} {"train_loss": -27.092641830444336, "global_step": 543078, "epoch": 6543} {"train_loss": -26.959299087524414, "global_step": 543079, "epoch": 6543} {"train_loss": -27.116729736328125, "global_step": 543080, "epoch": 6543} {"train_loss": -27.51263999938965, "global_step": 543081, "epoch": 6543} {"train_loss": -27.09425163269043, "global_step": 543082, "epoch": 6543} {"train_loss": -27.251611709594727, "global_step": 543083, "epoch": 6543} {"train_loss": -27.376760482788086, "global_step": 543084, "epoch": 6543} {"train_loss": -27.379026412963867, "global_step": 543085, "epoch": 6543} {"train_loss": -27.43671226501465, "global_step": 543086, "epoch": 6543} {"train_loss": -27.27366065979004, "global_step": 543087, "epoch": 6543} {"train_loss": -27.589771270751953, "global_step": 543088, "epoch": 6543} {"train_loss": -27.28435707092285, "global_step": 543089, "epoch": 6543} {"train_loss": -27.615447998046875, "global_step": 543090, "epoch": 6543} {"train_loss": -27.34010124206543, "global_step": 543091, "epoch": 6543} {"train_loss": -27.135766983032227, "global_step": 543092, "epoch": 6543} {"train_loss": -27.38421630859375, "global_step": 543093, "epoch": 6543} {"train_loss": -27.497360229492188, "global_step": 543094, "epoch": 6543} {"train_loss": -27.674575805664062, "global_step": 543095, "epoch": 6543} {"train_loss": -27.578229904174805, "global_step": 543096, "epoch": 6543} {"train_loss": -27.726318359375, "global_step": 543097, "epoch": 6543} {"train_loss": -27.619653701782227, "global_step": 543098, "epoch": 6543} {"train_loss": -27.268041610717773, "global_step": 543099, "epoch": 6543} {"train_loss": -27.62876319885254, "global_step": 543100, "epoch": 6543} {"train_loss": -27.7164249420166, "global_step": 543101, "epoch": 6543} {"train_loss": -27.54819107055664, "global_step": 543102, "epoch": 6543} {"train_loss": -27.781509399414062, "global_step": 543103, "epoch": 6543} {"train_loss": -27.454198837280273, "global_step": 543104, "epoch": 6543} {"train_loss": -27.48505210876465, "global_step": 543105, "epoch": 6543} {"train_loss": -27.98606300354004, "global_step": 543106, "epoch": 6543} {"train_loss": -27.86797523498535, "global_step": 543107, "epoch": 6543} {"train_loss": -27.505598068237305, "global_step": 543108, "epoch": 6543} {"train_loss": -28.024641036987305, "global_step": 543109, "epoch": 6543} {"train_loss": -27.66897964477539, "global_step": 543110, "epoch": 6543} {"train_loss": -27.903045654296875, "global_step": 543111, "epoch": 6543} {"train_loss": -28.128772735595703, "global_step": 543112, "epoch": 6543} {"train_loss": -27.764822006225586, "global_step": 543113, "epoch": 6543} {"train_loss": -27.72364616394043, "global_step": 543114, "epoch": 6543} {"train_loss": -27.503263473510742, "global_step": 543115, "epoch": 6543} {"train_loss": -27.837018966674805, "global_step": 543116, "epoch": 6543} {"train_loss": -28.1217098236084, "global_step": 543117, "epoch": 6543} {"train_loss": -27.9527530670166, "global_step": 543118, "epoch": 6543} {"train_loss": -27.78785514831543, "global_step": 543119, "epoch": 6543} {"train_loss": -27.86787223815918, "global_step": 543120, "epoch": 6543} {"train_loss": -27.014394760131836, "global_step": 543121, "epoch": 6543} {"train_loss": -26.829120635986328, "global_step": 543122, "epoch": 6543} {"train_loss": -25.681140899658203, "global_step": 543123, "epoch": 6543} {"train_loss": -25.670989990234375, "global_step": 543124, "epoch": 6543} {"train_loss": -27.03830337524414, "global_step": 543125, "epoch": 6543} {"train_loss": -27.316808700561523, "global_step": 543126, "epoch": 6543} {"train_loss": -26.942895889282227, "global_step": 543127, "epoch": 6543} {"train_loss": -27.265539169311523, "global_step": 543128, "epoch": 6543} {"train_loss": -27.440948486328125, "global_step": 543129, "epoch": 6543} {"train_loss": -27.337305068969727, "global_step": 543130, "epoch": 6543} {"train_loss": -27.6792049407959, "global_step": 543131, "epoch": 6543} {"train_loss": -27.241727828979492, "global_step": 543132, "epoch": 6543} {"train_loss": -27.420337677001953, "global_step": 543133, "epoch": 6543} {"train_loss": -27.10546875, "global_step": 543134, "epoch": 6543} {"train_loss": -27.516027450561523, "global_step": 543135, "epoch": 6543} {"train_loss": -27.34376335144043, "global_step": 543136, "epoch": 6543} {"train_loss": -27.612319946289062, "global_step": 543137, "epoch": 6543} {"train_loss": -27.071760177612305, "global_step": 543138, "epoch": 6543} {"train_loss": -27.622100830078125, "global_step": 543139, "epoch": 6543} {"train_loss": -27.554773330688477, "global_step": 543140, "epoch": 6543} {"train_loss": -27.083209991455078, "global_step": 543141, "epoch": 6543} {"train_loss": -27.660207748413086, "global_step": 543142, "epoch": 6543} {"train_loss": -27.44081687927246, "global_step": 543143, "epoch": 6543} {"train_loss": -27.652063369750977, "global_step": 543144, "epoch": 6543} {"train_loss": -27.559885025024414, "global_step": 543145, "epoch": 6543} {"train_loss": -27.09575843811035, "global_step": 543146, "epoch": 6543} {"train_loss": -27.465576171875, "global_step": 543147, "epoch": 6543} {"train_loss": -27.130615234375, "global_step": 543148, "epoch": 6543} {"train_loss": -27.672086715698242, "global_step": 543149, "epoch": 6543} {"train_loss": -27.775510787963867, "global_step": 543150, "epoch": 6543} {"train_loss": -27.403427215943854, "global_step": 543151, "epoch": 6543, "val_loss": 6487605.0} {"train_loss": -27.000146865844727, "global_step": 543152, "epoch": 6544} {"train_loss": -26.977441787719727, "global_step": 543153, "epoch": 6544} {"train_loss": -26.484434127807617, "global_step": 543154, "epoch": 6544} {"train_loss": -27.11760902404785, "global_step": 543155, "epoch": 6544} {"train_loss": -26.938379287719727, "global_step": 543156, "epoch": 6544} {"train_loss": -26.887128829956055, "global_step": 543157, "epoch": 6544} {"train_loss": -26.95466423034668, "global_step": 543158, "epoch": 6544} {"train_loss": -27.541913986206055, "global_step": 543159, "epoch": 6544} {"train_loss": -27.186243057250977, "global_step": 543160, "epoch": 6544} {"train_loss": -27.389245986938477, "global_step": 543161, "epoch": 6544} {"train_loss": -27.639759063720703, "global_step": 543162, "epoch": 6544} {"train_loss": -26.953046798706055, "global_step": 543163, "epoch": 6544} {"train_loss": -27.2819881439209, "global_step": 543164, "epoch": 6544} {"train_loss": -27.56165885925293, "global_step": 543165, "epoch": 6544} {"train_loss": -27.240232467651367, "global_step": 543166, "epoch": 6544} {"train_loss": -27.58564567565918, "global_step": 543167, "epoch": 6544} {"train_loss": -27.662906646728516, "global_step": 543168, "epoch": 6544} {"train_loss": -27.669103622436523, "global_step": 543169, "epoch": 6544} {"train_loss": -27.657690048217773, "global_step": 543170, "epoch": 6544} {"train_loss": -27.697162628173828, "global_step": 543171, "epoch": 6544} {"train_loss": -27.357929229736328, "global_step": 543172, "epoch": 6544} {"train_loss": -27.4419002532959, "global_step": 543173, "epoch": 6544} {"train_loss": -27.539697647094727, "global_step": 543174, "epoch": 6544} {"train_loss": -27.6972599029541, "global_step": 543175, "epoch": 6544} {"train_loss": -27.691516876220703, "global_step": 543176, "epoch": 6544} {"train_loss": -27.950897216796875, "global_step": 543177, "epoch": 6544} {"train_loss": -27.767948150634766, "global_step": 543178, "epoch": 6544} {"train_loss": -27.706960678100586, "global_step": 543179, "epoch": 6544} {"train_loss": -27.37080955505371, "global_step": 543180, "epoch": 6544} {"train_loss": -27.753808975219727, "global_step": 543181, "epoch": 6544} {"train_loss": -27.775293350219727, "global_step": 543182, "epoch": 6544} {"train_loss": -27.728260040283203, "global_step": 543183, "epoch": 6544} {"train_loss": -27.635168075561523, "global_step": 543184, "epoch": 6544} {"train_loss": -28.25714111328125, "global_step": 543185, "epoch": 6544} {"train_loss": -27.571508407592773, "global_step": 543186, "epoch": 6544} {"train_loss": -27.549856185913086, "global_step": 543187, "epoch": 6544} {"train_loss": -27.72043800354004, "global_step": 543188, "epoch": 6544} {"train_loss": -28.085363388061523, "global_step": 543189, "epoch": 6544} {"train_loss": -27.921628952026367, "global_step": 543190, "epoch": 6544} {"train_loss": -27.64228630065918, "global_step": 543191, "epoch": 6544} {"train_loss": -27.948583602905273, "global_step": 543192, "epoch": 6544} {"train_loss": -27.622365951538086, "global_step": 543193, "epoch": 6544} {"train_loss": -27.458402633666992, "global_step": 543194, "epoch": 6544} {"train_loss": -27.8315372467041, "global_step": 543195, "epoch": 6544} {"train_loss": -27.8007755279541, "global_step": 543196, "epoch": 6544} {"train_loss": -27.757694244384766, "global_step": 543197, "epoch": 6544} {"train_loss": -27.45782470703125, "global_step": 543198, "epoch": 6544} {"train_loss": -27.675460815429688, "global_step": 543199, "epoch": 6544} {"train_loss": -27.698902130126953, "global_step": 543200, "epoch": 6544} {"train_loss": -27.775930404663086, "global_step": 543201, "epoch": 6544} {"train_loss": -27.6353702545166, "global_step": 543202, "epoch": 6544} {"train_loss": -27.836088180541992, "global_step": 543203, "epoch": 6544} {"train_loss": -28.053180694580078, "global_step": 543204, "epoch": 6544} {"train_loss": -27.667240142822266, "global_step": 543205, "epoch": 6544} {"train_loss": -27.667367935180664, "global_step": 543206, "epoch": 6544} {"train_loss": -27.729398727416992, "global_step": 543207, "epoch": 6544} {"train_loss": -27.919553756713867, "global_step": 543208, "epoch": 6544} {"train_loss": -27.802749633789062, "global_step": 543209, "epoch": 6544} {"train_loss": -27.768579483032227, "global_step": 543210, "epoch": 6544} {"train_loss": -28.268491744995117, "global_step": 543211, "epoch": 6544} {"train_loss": -27.818939208984375, "global_step": 543212, "epoch": 6544} {"train_loss": -27.466283798217773, "global_step": 543213, "epoch": 6544} {"train_loss": -27.592731475830078, "global_step": 543214, "epoch": 6544} {"train_loss": -27.547672271728516, "global_step": 543215, "epoch": 6544} {"train_loss": -27.243682861328125, "global_step": 543216, "epoch": 6544} {"train_loss": -27.70208740234375, "global_step": 543217, "epoch": 6544} {"train_loss": -27.623706817626953, "global_step": 543218, "epoch": 6544} {"train_loss": -27.686628341674805, "global_step": 543219, "epoch": 6544} {"train_loss": -27.771825790405273, "global_step": 543220, "epoch": 6544} {"train_loss": -27.461612701416016, "global_step": 543221, "epoch": 6544} {"train_loss": -27.593778610229492, "global_step": 543222, "epoch": 6544} {"train_loss": -27.8532772064209, "global_step": 543223, "epoch": 6544} {"train_loss": -27.896764755249023, "global_step": 543224, "epoch": 6544} {"train_loss": -28.0931339263916, "global_step": 543225, "epoch": 6544} {"train_loss": -27.7518310546875, "global_step": 543226, "epoch": 6544} {"train_loss": -27.912933349609375, "global_step": 543227, "epoch": 6544} {"train_loss": -27.81866455078125, "global_step": 543228, "epoch": 6544} {"train_loss": -27.6934814453125, "global_step": 543229, "epoch": 6544} {"train_loss": -27.783405303955078, "global_step": 543230, "epoch": 6544} {"train_loss": -27.715137481689453, "global_step": 543231, "epoch": 6544} {"train_loss": -27.88555908203125, "global_step": 543232, "epoch": 6544} {"train_loss": -27.457319259643555, "global_step": 543233, "epoch": 6544} {"train_loss": -27.62485092806529, "global_step": 543234, "epoch": 6544, "val_loss": 6511732.5} {"train_loss": -27.36720085144043, "global_step": 543235, "epoch": 6545} {"train_loss": -26.55611228942871, "global_step": 543236, "epoch": 6545} {"train_loss": -26.52626609802246, "global_step": 543237, "epoch": 6545} {"train_loss": -27.21467399597168, "global_step": 543238, "epoch": 6545} {"train_loss": -27.34894371032715, "global_step": 543239, "epoch": 6545} {"train_loss": -27.655874252319336, "global_step": 543240, "epoch": 6545} {"train_loss": -27.46681022644043, "global_step": 543241, "epoch": 6545} {"train_loss": -27.52601432800293, "global_step": 543242, "epoch": 6545} {"train_loss": -27.603717803955078, "global_step": 543243, "epoch": 6545} {"train_loss": -27.422155380249023, "global_step": 543244, "epoch": 6545} {"train_loss": -27.761838912963867, "global_step": 543245, "epoch": 6545} {"train_loss": -27.564016342163086, "global_step": 543246, "epoch": 6545} {"train_loss": -27.507177352905273, "global_step": 543247, "epoch": 6545} {"train_loss": -27.39692497253418, "global_step": 543248, "epoch": 6545} {"train_loss": -27.420759201049805, "global_step": 543249, "epoch": 6545} {"train_loss": -27.566253662109375, "global_step": 543250, "epoch": 6545} {"train_loss": -26.911218643188477, "global_step": 543251, "epoch": 6545} {"train_loss": -27.483457565307617, "global_step": 543252, "epoch": 6545} {"train_loss": -27.207046508789062, "global_step": 543253, "epoch": 6545} {"train_loss": -27.793867111206055, "global_step": 543254, "epoch": 6545} {"train_loss": -27.916522979736328, "global_step": 543255, "epoch": 6545} {"train_loss": -27.51264762878418, "global_step": 543256, "epoch": 6545} {"train_loss": -27.375776290893555, "global_step": 543257, "epoch": 6545} {"train_loss": -27.550662994384766, "global_step": 543258, "epoch": 6545} {"train_loss": -27.024322509765625, "global_step": 543259, "epoch": 6545} {"train_loss": -27.626073837280273, "global_step": 543260, "epoch": 6545} {"train_loss": -28.079010009765625, "global_step": 543261, "epoch": 6545} {"train_loss": -27.412992477416992, "global_step": 543262, "epoch": 6545} {"train_loss": -27.477380752563477, "global_step": 543263, "epoch": 6545} {"train_loss": -27.683591842651367, "global_step": 543264, "epoch": 6545} {"train_loss": -27.577444076538086, "global_step": 543265, "epoch": 6545} {"train_loss": -27.5671329498291, "global_step": 543266, "epoch": 6545} {"train_loss": -27.502233505249023, "global_step": 543267, "epoch": 6545} {"train_loss": -27.97722816467285, "global_step": 543268, "epoch": 6545} {"train_loss": -27.649316787719727, "global_step": 543269, "epoch": 6545} {"train_loss": -27.557510375976562, "global_step": 543270, "epoch": 6545} {"train_loss": -27.659149169921875, "global_step": 543271, "epoch": 6545} {"train_loss": -27.48268699645996, "global_step": 543272, "epoch": 6545} {"train_loss": -27.70985221862793, "global_step": 543273, "epoch": 6545} {"train_loss": -27.330078125, "global_step": 543274, "epoch": 6545} {"train_loss": -27.76388931274414, "global_step": 543275, "epoch": 6545} {"train_loss": -28.058435440063477, "global_step": 543276, "epoch": 6545} {"train_loss": -27.726598739624023, "global_step": 543277, "epoch": 6545} {"train_loss": -28.39322853088379, "global_step": 543278, "epoch": 6545} {"train_loss": -27.70557975769043, "global_step": 543279, "epoch": 6545} {"train_loss": -28.013050079345703, "global_step": 543280, "epoch": 6545} {"train_loss": -27.800769805908203, "global_step": 543281, "epoch": 6545} {"train_loss": -27.887527465820312, "global_step": 543282, "epoch": 6545} {"train_loss": -27.731042861938477, "global_step": 543283, "epoch": 6545} {"train_loss": -27.962827682495117, "global_step": 543284, "epoch": 6545} {"train_loss": -27.76923942565918, "global_step": 543285, "epoch": 6545} {"train_loss": -27.7921085357666, "global_step": 543286, "epoch": 6545} {"train_loss": -28.144245147705078, "global_step": 543287, "epoch": 6545} {"train_loss": -27.854284286499023, "global_step": 543288, "epoch": 6545} {"train_loss": -27.64396095275879, "global_step": 543289, "epoch": 6545} {"train_loss": -27.35770606994629, "global_step": 543290, "epoch": 6545} {"train_loss": -27.738046646118164, "global_step": 543291, "epoch": 6545} {"train_loss": -27.711151123046875, "global_step": 543292, "epoch": 6545} {"train_loss": -27.40096092224121, "global_step": 543293, "epoch": 6545} {"train_loss": -27.757389068603516, "global_step": 543294, "epoch": 6545} {"train_loss": -27.325550079345703, "global_step": 543295, "epoch": 6545} {"train_loss": -27.08270835876465, "global_step": 543296, "epoch": 6545} {"train_loss": -27.554794311523438, "global_step": 543297, "epoch": 6545} {"train_loss": -27.34104347229004, "global_step": 543298, "epoch": 6545} {"train_loss": -27.605915069580078, "global_step": 543299, "epoch": 6545} {"train_loss": -27.591012954711914, "global_step": 543300, "epoch": 6545} {"train_loss": -27.562780380249023, "global_step": 543301, "epoch": 6545} {"train_loss": -27.49128532409668, "global_step": 543302, "epoch": 6545} {"train_loss": -27.770139694213867, "global_step": 543303, "epoch": 6545} {"train_loss": -27.391529083251953, "global_step": 543304, "epoch": 6545} {"train_loss": -27.727725982666016, "global_step": 543305, "epoch": 6545} {"train_loss": -27.847686767578125, "global_step": 543306, "epoch": 6545} {"train_loss": -27.92807388305664, "global_step": 543307, "epoch": 6545} {"train_loss": -27.88697624206543, "global_step": 543308, "epoch": 6545} {"train_loss": -28.18596839904785, "global_step": 543309, "epoch": 6545} {"train_loss": -27.658954620361328, "global_step": 543310, "epoch": 6545} {"train_loss": -28.056732177734375, "global_step": 543311, "epoch": 6545} {"train_loss": -27.935474395751953, "global_step": 543312, "epoch": 6545} {"train_loss": -27.929889678955078, "global_step": 543313, "epoch": 6545} {"train_loss": -27.69101333618164, "global_step": 543314, "epoch": 6545} {"train_loss": -27.73968505859375, "global_step": 543315, "epoch": 6545} {"train_loss": -27.864622116088867, "global_step": 543316, "epoch": 6545} {"train_loss": -27.622282235019178, "global_step": 543317, "epoch": 6545, "val_loss": 6507015.5} {"train_loss": -27.187559127807617, "global_step": 543318, "epoch": 6546} {"train_loss": -27.469650268554688, "global_step": 543319, "epoch": 6546} {"train_loss": -26.95802879333496, "global_step": 543320, "epoch": 6546} {"train_loss": -27.542938232421875, "global_step": 543321, "epoch": 6546} {"train_loss": -27.63079261779785, "global_step": 543322, "epoch": 6546} {"train_loss": -27.605005264282227, "global_step": 543323, "epoch": 6546} {"train_loss": -27.7567081451416, "global_step": 543324, "epoch": 6546} {"train_loss": -27.88227653503418, "global_step": 543325, "epoch": 6546} {"train_loss": -27.59919548034668, "global_step": 543326, "epoch": 6546} {"train_loss": -27.77964210510254, "global_step": 543327, "epoch": 6546} {"train_loss": -27.59663200378418, "global_step": 543328, "epoch": 6546} {"train_loss": -27.797046661376953, "global_step": 543329, "epoch": 6546} {"train_loss": -27.55439567565918, "global_step": 543330, "epoch": 6546} {"train_loss": -27.525604248046875, "global_step": 543331, "epoch": 6546} {"train_loss": -27.78180503845215, "global_step": 543332, "epoch": 6546} {"train_loss": -27.184675216674805, "global_step": 543333, "epoch": 6546} {"train_loss": -27.57404136657715, "global_step": 543334, "epoch": 6546} {"train_loss": -27.793048858642578, "global_step": 543335, "epoch": 6546} {"train_loss": -27.684965133666992, "global_step": 543336, "epoch": 6546} {"train_loss": -27.42365074157715, "global_step": 543337, "epoch": 6546} {"train_loss": -27.6400203704834, "global_step": 543338, "epoch": 6546} {"train_loss": -27.919767379760742, "global_step": 543339, "epoch": 6546} {"train_loss": -27.328632354736328, "global_step": 543340, "epoch": 6546} {"train_loss": -27.650379180908203, "global_step": 543341, "epoch": 6546} {"train_loss": -27.243330001831055, "global_step": 543342, "epoch": 6546} {"train_loss": -27.4328556060791, "global_step": 543343, "epoch": 6546} {"train_loss": -27.2667236328125, "global_step": 543344, "epoch": 6546} {"train_loss": -27.691211700439453, "global_step": 543345, "epoch": 6546} {"train_loss": -27.453094482421875, "global_step": 543346, "epoch": 6546} {"train_loss": -27.660018920898438, "global_step": 543347, "epoch": 6546} {"train_loss": -27.423643112182617, "global_step": 543348, "epoch": 6546} {"train_loss": -28.016088485717773, "global_step": 543349, "epoch": 6546} {"train_loss": -27.77850914001465, "global_step": 543350, "epoch": 6546} {"train_loss": -27.9952335357666, "global_step": 543351, "epoch": 6546} {"train_loss": -27.673675537109375, "global_step": 543352, "epoch": 6546} {"train_loss": -27.486865997314453, "global_step": 543353, "epoch": 6546} {"train_loss": -27.34315299987793, "global_step": 543354, "epoch": 6546} {"train_loss": -28.01337242126465, "global_step": 543355, "epoch": 6546} {"train_loss": -27.7830753326416, "global_step": 543356, "epoch": 6546} {"train_loss": -27.936471939086914, "global_step": 543357, "epoch": 6546} {"train_loss": -27.733510971069336, "global_step": 543358, "epoch": 6546} {"train_loss": -27.686758041381836, "global_step": 543359, "epoch": 6546} {"train_loss": -27.54558753967285, "global_step": 543360, "epoch": 6546} {"train_loss": -27.9002685546875, "global_step": 543361, "epoch": 6546} {"train_loss": -27.825199127197266, "global_step": 543362, "epoch": 6546} {"train_loss": -28.048486709594727, "global_step": 543363, "epoch": 6546} {"train_loss": -27.643781661987305, "global_step": 543364, "epoch": 6546} {"train_loss": -28.418882369995117, "global_step": 543365, "epoch": 6546} {"train_loss": -27.93659782409668, "global_step": 543366, "epoch": 6546} {"train_loss": -27.893457412719727, "global_step": 543367, "epoch": 6546} {"train_loss": -27.708709716796875, "global_step": 543368, "epoch": 6546} {"train_loss": -27.636005401611328, "global_step": 543369, "epoch": 6546} {"train_loss": -27.9306697845459, "global_step": 543370, "epoch": 6546} {"train_loss": -27.518552780151367, "global_step": 543371, "epoch": 6546} {"train_loss": -27.770984649658203, "global_step": 543372, "epoch": 6546} {"train_loss": -27.278772354125977, "global_step": 543373, "epoch": 6546} {"train_loss": -27.231098175048828, "global_step": 543374, "epoch": 6546} {"train_loss": -27.01850700378418, "global_step": 543375, "epoch": 6546} {"train_loss": -27.074121475219727, "global_step": 543376, "epoch": 6546} {"train_loss": -27.360273361206055, "global_step": 543377, "epoch": 6546} {"train_loss": -27.63327980041504, "global_step": 543378, "epoch": 6546} {"train_loss": -27.3442440032959, "global_step": 543379, "epoch": 6546} {"train_loss": -27.409595489501953, "global_step": 543380, "epoch": 6546} {"train_loss": -27.77603530883789, "global_step": 543381, "epoch": 6546} {"train_loss": -27.672565460205078, "global_step": 543382, "epoch": 6546} {"train_loss": -27.174915313720703, "global_step": 543383, "epoch": 6546} {"train_loss": -26.94953727722168, "global_step": 543384, "epoch": 6546} {"train_loss": -27.629358291625977, "global_step": 543385, "epoch": 6546} {"train_loss": -27.732694625854492, "global_step": 543386, "epoch": 6546} {"train_loss": -27.92424964904785, "global_step": 543387, "epoch": 6546} {"train_loss": -27.9486026763916, "global_step": 543388, "epoch": 6546} {"train_loss": -27.53901481628418, "global_step": 543389, "epoch": 6546} {"train_loss": -27.061920166015625, "global_step": 543390, "epoch": 6546} {"train_loss": -27.902250289916992, "global_step": 543391, "epoch": 6546} {"train_loss": -27.480331420898438, "global_step": 543392, "epoch": 6546} {"train_loss": -27.588544845581055, "global_step": 543393, "epoch": 6546} {"train_loss": -28.022153854370117, "global_step": 543394, "epoch": 6546} {"train_loss": -27.759424209594727, "global_step": 543395, "epoch": 6546} {"train_loss": -27.551361083984375, "global_step": 543396, "epoch": 6546} {"train_loss": -27.650320053100586, "global_step": 543397, "epoch": 6546} {"train_loss": -27.554828643798828, "global_step": 543398, "epoch": 6546} {"train_loss": -27.54627799987793, "global_step": 543399, "epoch": 6546} {"train_loss": -27.617007473865186, "global_step": 543400, "epoch": 6546, "val_loss": 6496947.0} {"train_loss": -27.103178024291992, "global_step": 543401, "epoch": 6547} {"train_loss": -27.37088394165039, "global_step": 543402, "epoch": 6547} {"train_loss": -27.451034545898438, "global_step": 543403, "epoch": 6547} {"train_loss": -27.15290641784668, "global_step": 543404, "epoch": 6547} {"train_loss": -27.43525505065918, "global_step": 543405, "epoch": 6547} {"train_loss": -27.242572784423828, "global_step": 543406, "epoch": 6547} {"train_loss": -27.169342041015625, "global_step": 543407, "epoch": 6547} {"train_loss": -27.419641494750977, "global_step": 543408, "epoch": 6547} {"train_loss": -27.423938751220703, "global_step": 543409, "epoch": 6547} {"train_loss": -27.471059799194336, "global_step": 543410, "epoch": 6547} {"train_loss": -27.2427921295166, "global_step": 543411, "epoch": 6547} {"train_loss": -27.404987335205078, "global_step": 543412, "epoch": 6547} {"train_loss": -27.444303512573242, "global_step": 543413, "epoch": 6547} {"train_loss": -27.459369659423828, "global_step": 543414, "epoch": 6547} {"train_loss": -27.391403198242188, "global_step": 543415, "epoch": 6547} {"train_loss": -27.6881046295166, "global_step": 543416, "epoch": 6547} {"train_loss": -27.73408317565918, "global_step": 543417, "epoch": 6547} {"train_loss": -27.59064292907715, "global_step": 543418, "epoch": 6547} {"train_loss": -27.659093856811523, "global_step": 543419, "epoch": 6547} {"train_loss": -27.698606491088867, "global_step": 543420, "epoch": 6547} {"train_loss": -27.39104652404785, "global_step": 543421, "epoch": 6547} {"train_loss": -27.98536491394043, "global_step": 543422, "epoch": 6547} {"train_loss": -27.356555938720703, "global_step": 543423, "epoch": 6547} {"train_loss": -27.66826820373535, "global_step": 543424, "epoch": 6547} {"train_loss": -27.75554847717285, "global_step": 543425, "epoch": 6547} {"train_loss": -27.692325592041016, "global_step": 543426, "epoch": 6547} {"train_loss": -28.05380630493164, "global_step": 543427, "epoch": 6547} {"train_loss": -28.03887367248535, "global_step": 543428, "epoch": 6547} {"train_loss": -27.516387939453125, "global_step": 543429, "epoch": 6547} {"train_loss": -27.687793731689453, "global_step": 543430, "epoch": 6547} {"train_loss": -28.07098960876465, "global_step": 543431, "epoch": 6547} {"train_loss": -27.603927612304688, "global_step": 543432, "epoch": 6547} {"train_loss": -27.57815933227539, "global_step": 543433, "epoch": 6547} {"train_loss": -27.870187759399414, "global_step": 543434, "epoch": 6547} {"train_loss": -27.620615005493164, "global_step": 543435, "epoch": 6547} {"train_loss": -27.754911422729492, "global_step": 543436, "epoch": 6547} {"train_loss": -27.859724044799805, "global_step": 543437, "epoch": 6547} {"train_loss": -27.64497184753418, "global_step": 543438, "epoch": 6547} {"train_loss": -27.62371253967285, "global_step": 543439, "epoch": 6547} {"train_loss": -27.925872802734375, "global_step": 543440, "epoch": 6547} {"train_loss": -27.917465209960938, "global_step": 543441, "epoch": 6547} {"train_loss": -27.532835006713867, "global_step": 543442, "epoch": 6547} {"train_loss": -27.947132110595703, "global_step": 543443, "epoch": 6547} {"train_loss": -28.13238525390625, "global_step": 543444, "epoch": 6547} {"train_loss": -27.63824462890625, "global_step": 543445, "epoch": 6547} {"train_loss": -27.795856475830078, "global_step": 543446, "epoch": 6547} {"train_loss": -27.740589141845703, "global_step": 543447, "epoch": 6547} {"train_loss": -27.801593780517578, "global_step": 543448, "epoch": 6547} {"train_loss": -28.115097045898438, "global_step": 543449, "epoch": 6547} {"train_loss": -27.479938507080078, "global_step": 543450, "epoch": 6547} {"train_loss": -27.570911407470703, "global_step": 543451, "epoch": 6547} {"train_loss": -27.942153930664062, "global_step": 543452, "epoch": 6547} {"train_loss": -27.632080078125, "global_step": 543453, "epoch": 6547} {"train_loss": -27.906171798706055, "global_step": 543454, "epoch": 6547} {"train_loss": -28.057987213134766, "global_step": 543455, "epoch": 6547} {"train_loss": -27.471847534179688, "global_step": 543456, "epoch": 6547} {"train_loss": -27.96563148498535, "global_step": 543457, "epoch": 6547} {"train_loss": -27.549518585205078, "global_step": 543458, "epoch": 6547} {"train_loss": -27.651824951171875, "global_step": 543459, "epoch": 6547} {"train_loss": -27.45045280456543, "global_step": 543460, "epoch": 6547} {"train_loss": -27.753997802734375, "global_step": 543461, "epoch": 6547} {"train_loss": -27.589139938354492, "global_step": 543462, "epoch": 6547} {"train_loss": -27.43214225769043, "global_step": 543463, "epoch": 6547} {"train_loss": -27.465606689453125, "global_step": 543464, "epoch": 6547} {"train_loss": -27.536108016967773, "global_step": 543465, "epoch": 6547} {"train_loss": -27.72198486328125, "global_step": 543466, "epoch": 6547} {"train_loss": -27.725622177124023, "global_step": 543467, "epoch": 6547} {"train_loss": -27.866897583007812, "global_step": 543468, "epoch": 6547} {"train_loss": -27.78680992126465, "global_step": 543469, "epoch": 6547} {"train_loss": -27.548675537109375, "global_step": 543470, "epoch": 6547} {"train_loss": -26.751373291015625, "global_step": 543471, "epoch": 6547} {"train_loss": -27.125486373901367, "global_step": 543472, "epoch": 6547} {"train_loss": -27.61141014099121, "global_step": 543473, "epoch": 6547} {"train_loss": -27.895483016967773, "global_step": 543474, "epoch": 6547} {"train_loss": -27.427610397338867, "global_step": 543475, "epoch": 6547} {"train_loss": -27.601903915405273, "global_step": 543476, "epoch": 6547} {"train_loss": -27.464893341064453, "global_step": 543477, "epoch": 6547} {"train_loss": -27.73736572265625, "global_step": 543478, "epoch": 6547} {"train_loss": -27.607336044311523, "global_step": 543479, "epoch": 6547} {"train_loss": -27.842823028564453, "global_step": 543480, "epoch": 6547} {"train_loss": -27.959924697875977, "global_step": 543481, "epoch": 6547} {"train_loss": -27.766376495361328, "global_step": 543482, "epoch": 6547} {"train_loss": -27.62633342053517, "global_step": 543483, "epoch": 6547, "val_loss": 6534554.0} {"train_loss": -27.086652755737305, "global_step": 543484, "epoch": 6548} {"train_loss": -26.732166290283203, "global_step": 543485, "epoch": 6548} {"train_loss": -26.921396255493164, "global_step": 543486, "epoch": 6548} {"train_loss": -27.11358070373535, "global_step": 543487, "epoch": 6548} {"train_loss": -27.042724609375, "global_step": 543488, "epoch": 6548} {"train_loss": -26.82916831970215, "global_step": 543489, "epoch": 6548} {"train_loss": -26.6356201171875, "global_step": 543490, "epoch": 6548} {"train_loss": -27.78719139099121, "global_step": 543491, "epoch": 6548} {"train_loss": -27.05293846130371, "global_step": 543492, "epoch": 6548} {"train_loss": -26.975248336791992, "global_step": 543493, "epoch": 6548} {"train_loss": -26.887781143188477, "global_step": 543494, "epoch": 6548} {"train_loss": -26.550668716430664, "global_step": 543495, "epoch": 6548} {"train_loss": -26.95204734802246, "global_step": 543496, "epoch": 6548} {"train_loss": -27.296329498291016, "global_step": 543497, "epoch": 6548} {"train_loss": -27.245426177978516, "global_step": 543498, "epoch": 6548} {"train_loss": -26.885847091674805, "global_step": 543499, "epoch": 6548} {"train_loss": -27.11138343811035, "global_step": 543500, "epoch": 6548} {"train_loss": -27.849172592163086, "global_step": 543501, "epoch": 6548} {"train_loss": -27.239582061767578, "global_step": 543502, "epoch": 6548} {"train_loss": -27.259963989257812, "global_step": 543503, "epoch": 6548} {"train_loss": -27.409286499023438, "global_step": 543504, "epoch": 6548} {"train_loss": -26.957731246948242, "global_step": 543505, "epoch": 6548} {"train_loss": -27.26011085510254, "global_step": 543506, "epoch": 6548} {"train_loss": -27.239103317260742, "global_step": 543507, "epoch": 6548} {"train_loss": -27.482635498046875, "global_step": 543508, "epoch": 6548} {"train_loss": -27.334213256835938, "global_step": 543509, "epoch": 6548} {"train_loss": -27.452917098999023, "global_step": 543510, "epoch": 6548} {"train_loss": -27.381423950195312, "global_step": 543511, "epoch": 6548} {"train_loss": -27.4183349609375, "global_step": 543512, "epoch": 6548} {"train_loss": -27.432849884033203, "global_step": 543513, "epoch": 6548} {"train_loss": -27.319746017456055, "global_step": 543514, "epoch": 6548} {"train_loss": -27.51997184753418, "global_step": 543515, "epoch": 6548} {"train_loss": -27.773956298828125, "global_step": 543516, "epoch": 6548} {"train_loss": -27.747852325439453, "global_step": 543517, "epoch": 6548} {"train_loss": -27.588775634765625, "global_step": 543518, "epoch": 6548} {"train_loss": -27.583707809448242, "global_step": 543519, "epoch": 6548} {"train_loss": -27.8857364654541, "global_step": 543520, "epoch": 6548} {"train_loss": -27.37210464477539, "global_step": 543521, "epoch": 6548} {"train_loss": -27.059803009033203, "global_step": 543522, "epoch": 6548} {"train_loss": -27.667505264282227, "global_step": 543523, "epoch": 6548} {"train_loss": -27.928735733032227, "global_step": 543524, "epoch": 6548} {"train_loss": -27.40228271484375, "global_step": 543525, "epoch": 6548} {"train_loss": -27.722091674804688, "global_step": 543526, "epoch": 6548} {"train_loss": -27.71099281311035, "global_step": 543527, "epoch": 6548} {"train_loss": -27.506559371948242, "global_step": 543528, "epoch": 6548} {"train_loss": -27.834009170532227, "global_step": 543529, "epoch": 6548} {"train_loss": -27.771595001220703, "global_step": 543530, "epoch": 6548} {"train_loss": -27.975202560424805, "global_step": 543531, "epoch": 6548} {"train_loss": -27.618261337280273, "global_step": 543532, "epoch": 6548} {"train_loss": -27.853530883789062, "global_step": 543533, "epoch": 6548} {"train_loss": -27.608753204345703, "global_step": 543534, "epoch": 6548} {"train_loss": -27.482751846313477, "global_step": 543535, "epoch": 6548} {"train_loss": -27.821247100830078, "global_step": 543536, "epoch": 6548} {"train_loss": -27.570775985717773, "global_step": 543537, "epoch": 6548} {"train_loss": -27.76031494140625, "global_step": 543538, "epoch": 6548} {"train_loss": -27.67524528503418, "global_step": 543539, "epoch": 6548} {"train_loss": -27.79665184020996, "global_step": 543540, "epoch": 6548} {"train_loss": -27.78677749633789, "global_step": 543541, "epoch": 6548} {"train_loss": -27.524343490600586, "global_step": 543542, "epoch": 6548} {"train_loss": -27.847949981689453, "global_step": 543543, "epoch": 6548} {"train_loss": -27.66202735900879, "global_step": 543544, "epoch": 6548} {"train_loss": -27.855634689331055, "global_step": 543545, "epoch": 6548} {"train_loss": -28.116119384765625, "global_step": 543546, "epoch": 6548} {"train_loss": -27.963590621948242, "global_step": 543547, "epoch": 6548} {"train_loss": -28.00834083557129, "global_step": 543548, "epoch": 6548} {"train_loss": -28.021886825561523, "global_step": 543549, "epoch": 6548} {"train_loss": -27.748554229736328, "global_step": 543550, "epoch": 6548} {"train_loss": -27.204635620117188, "global_step": 543551, "epoch": 6548} {"train_loss": -27.076444625854492, "global_step": 543552, "epoch": 6548} {"train_loss": -27.25465202331543, "global_step": 543553, "epoch": 6548} {"train_loss": -27.1186466217041, "global_step": 543554, "epoch": 6548} {"train_loss": -27.08351707458496, "global_step": 543555, "epoch": 6548} {"train_loss": -27.78179359436035, "global_step": 543556, "epoch": 6548} {"train_loss": -27.723875045776367, "global_step": 543557, "epoch": 6548} {"train_loss": -27.67879295349121, "global_step": 543558, "epoch": 6548} {"train_loss": -27.844635009765625, "global_step": 543559, "epoch": 6548} {"train_loss": -27.61990737915039, "global_step": 543560, "epoch": 6548} {"train_loss": -27.7667179107666, "global_step": 543561, "epoch": 6548} {"train_loss": -27.51495933532715, "global_step": 543562, "epoch": 6548} {"train_loss": -27.783435821533203, "global_step": 543563, "epoch": 6548} {"train_loss": -27.908979415893555, "global_step": 543564, "epoch": 6548} {"train_loss": -27.50577735900879, "global_step": 543565, "epoch": 6548} {"train_loss": -27.47367355622441, "global_step": 543566, "epoch": 6548, "val_loss": 6515327.5} {"train_loss": -27.402484893798828, "global_step": 543567, "epoch": 6549} {"train_loss": -27.175537109375, "global_step": 543568, "epoch": 6549} {"train_loss": -26.857778549194336, "global_step": 543569, "epoch": 6549} {"train_loss": -27.144840240478516, "global_step": 543570, "epoch": 6549} {"train_loss": -27.1573486328125, "global_step": 543571, "epoch": 6549} {"train_loss": -27.141584396362305, "global_step": 543572, "epoch": 6549} {"train_loss": -27.341876983642578, "global_step": 543573, "epoch": 6549} {"train_loss": -27.194507598876953, "global_step": 543574, "epoch": 6549} {"train_loss": -27.285730361938477, "global_step": 543575, "epoch": 6549} {"train_loss": -27.21894645690918, "global_step": 543576, "epoch": 6549} {"train_loss": -27.200284957885742, "global_step": 543577, "epoch": 6549} {"train_loss": -27.3319034576416, "global_step": 543578, "epoch": 6549} {"train_loss": -27.344512939453125, "global_step": 543579, "epoch": 6549} {"train_loss": -27.91754722595215, "global_step": 543580, "epoch": 6549} {"train_loss": -26.928991317749023, "global_step": 543581, "epoch": 6549} {"train_loss": -27.421283721923828, "global_step": 543582, "epoch": 6549} {"train_loss": -27.870868682861328, "global_step": 543583, "epoch": 6549} {"train_loss": -27.371601104736328, "global_step": 543584, "epoch": 6549} {"train_loss": -27.395648956298828, "global_step": 543585, "epoch": 6549} {"train_loss": -27.58638572692871, "global_step": 543586, "epoch": 6549} {"train_loss": -27.421422958374023, "global_step": 543587, "epoch": 6549} {"train_loss": -27.736108779907227, "global_step": 543588, "epoch": 6549} {"train_loss": -27.38490104675293, "global_step": 543589, "epoch": 6549} {"train_loss": -27.404712677001953, "global_step": 543590, "epoch": 6549} {"train_loss": -27.35895347595215, "global_step": 543591, "epoch": 6549} {"train_loss": -27.516845703125, "global_step": 543592, "epoch": 6549} {"train_loss": -27.230192184448242, "global_step": 543593, "epoch": 6549} {"train_loss": -27.930484771728516, "global_step": 543594, "epoch": 6549} {"train_loss": -27.406835556030273, "global_step": 543595, "epoch": 6549} {"train_loss": -27.60345458984375, "global_step": 543596, "epoch": 6549} {"train_loss": -27.179977416992188, "global_step": 543597, "epoch": 6549} {"train_loss": -27.396326065063477, "global_step": 543598, "epoch": 6549} {"train_loss": -27.65423583984375, "global_step": 543599, "epoch": 6549} {"train_loss": -27.965444564819336, "global_step": 543600, "epoch": 6549} {"train_loss": -27.68255043029785, "global_step": 543601, "epoch": 6549} {"train_loss": -27.952680587768555, "global_step": 543602, "epoch": 6549} {"train_loss": -27.827396392822266, "global_step": 543603, "epoch": 6549} {"train_loss": -27.53017234802246, "global_step": 543604, "epoch": 6549} {"train_loss": -27.8018741607666, "global_step": 543605, "epoch": 6549} {"train_loss": -27.58272361755371, "global_step": 543606, "epoch": 6549} {"train_loss": -27.67311668395996, "global_step": 543607, "epoch": 6549} {"train_loss": -27.948049545288086, "global_step": 543608, "epoch": 6549} {"train_loss": -27.394515991210938, "global_step": 543609, "epoch": 6549} {"train_loss": -27.578718185424805, "global_step": 543610, "epoch": 6549} {"train_loss": -27.738683700561523, "global_step": 543611, "epoch": 6549} {"train_loss": -27.981428146362305, "global_step": 543612, "epoch": 6549} {"train_loss": -27.511632919311523, "global_step": 543613, "epoch": 6549} {"train_loss": -27.858861923217773, "global_step": 543614, "epoch": 6549} {"train_loss": -27.748016357421875, "global_step": 543615, "epoch": 6549} {"train_loss": -27.96489906311035, "global_step": 543616, "epoch": 6549} {"train_loss": -27.56024169921875, "global_step": 543617, "epoch": 6549} {"train_loss": -28.1796932220459, "global_step": 543618, "epoch": 6549} {"train_loss": -27.724533081054688, "global_step": 543619, "epoch": 6549} {"train_loss": -27.766630172729492, "global_step": 543620, "epoch": 6549} {"train_loss": -27.725812911987305, "global_step": 543621, "epoch": 6549} {"train_loss": -27.839704513549805, "global_step": 543622, "epoch": 6549} {"train_loss": -28.02242088317871, "global_step": 543623, "epoch": 6549} {"train_loss": -27.921567916870117, "global_step": 543624, "epoch": 6549} {"train_loss": -27.878950119018555, "global_step": 543625, "epoch": 6549} {"train_loss": -27.389362335205078, "global_step": 543626, "epoch": 6549} {"train_loss": -27.1893310546875, "global_step": 543627, "epoch": 6549} {"train_loss": -27.49922752380371, "global_step": 543628, "epoch": 6549} {"train_loss": -27.6816463470459, "global_step": 543629, "epoch": 6549} {"train_loss": -27.672611236572266, "global_step": 543630, "epoch": 6549} {"train_loss": -27.431598663330078, "global_step": 543631, "epoch": 6549} {"train_loss": -27.373090744018555, "global_step": 543632, "epoch": 6549} {"train_loss": -27.654434204101562, "global_step": 543633, "epoch": 6549} {"train_loss": -27.264780044555664, "global_step": 543634, "epoch": 6549} {"train_loss": -27.889118194580078, "global_step": 543635, "epoch": 6549} {"train_loss": -27.714147567749023, "global_step": 543636, "epoch": 6549} {"train_loss": -27.095443725585938, "global_step": 543637, "epoch": 6549} {"train_loss": -27.346027374267578, "global_step": 543638, "epoch": 6549} {"train_loss": -27.50153923034668, "global_step": 543639, "epoch": 6549} {"train_loss": -27.690099716186523, "global_step": 543640, "epoch": 6549} {"train_loss": -27.311786651611328, "global_step": 543641, "epoch": 6549} {"train_loss": -27.42474937438965, "global_step": 543642, "epoch": 6549} {"train_loss": -27.331037521362305, "global_step": 543643, "epoch": 6549} {"train_loss": -27.50653076171875, "global_step": 543644, "epoch": 6549} {"train_loss": -27.25199317932129, "global_step": 543645, "epoch": 6549} {"train_loss": -27.1401424407959, "global_step": 543646, "epoch": 6549} {"train_loss": -27.65475845336914, "global_step": 543647, "epoch": 6549} {"train_loss": -27.680282592773438, "global_step": 543648, "epoch": 6549} {"train_loss": -27.5437160859625, "global_step": 543649, "epoch": 6549, "val_loss": 6545195.0} {"train_loss": -27.35748863220215, "global_step": 543650, "epoch": 6550} {"train_loss": -27.545124053955078, "global_step": 543651, "epoch": 6550} {"train_loss": -27.3306941986084, "global_step": 543652, "epoch": 6550} {"train_loss": -27.282499313354492, "global_step": 543653, "epoch": 6550} {"train_loss": -27.0030460357666, "global_step": 543654, "epoch": 6550} {"train_loss": -26.83213233947754, "global_step": 543655, "epoch": 6550} {"train_loss": -27.02638053894043, "global_step": 543656, "epoch": 6550} {"train_loss": -26.900836944580078, "global_step": 543657, "epoch": 6550} {"train_loss": -27.536731719970703, "global_step": 543658, "epoch": 6550} {"train_loss": -27.550085067749023, "global_step": 543659, "epoch": 6550} {"train_loss": -27.6817626953125, "global_step": 543660, "epoch": 6550} {"train_loss": -27.564817428588867, "global_step": 543661, "epoch": 6550} {"train_loss": -27.61167335510254, "global_step": 543662, "epoch": 6550} {"train_loss": -27.52212905883789, "global_step": 543663, "epoch": 6550} {"train_loss": -27.188140869140625, "global_step": 543664, "epoch": 6550} {"train_loss": -27.322738647460938, "global_step": 543665, "epoch": 6550} {"train_loss": -28.043701171875, "global_step": 543666, "epoch": 6550} {"train_loss": -27.47248649597168, "global_step": 543667, "epoch": 6550} {"train_loss": -27.389989852905273, "global_step": 543668, "epoch": 6550} {"train_loss": -27.485265731811523, "global_step": 543669, "epoch": 6550} {"train_loss": -27.57966423034668, "global_step": 543670, "epoch": 6550} {"train_loss": -27.975421905517578, "global_step": 543671, "epoch": 6550} {"train_loss": -27.622638702392578, "global_step": 543672, "epoch": 6550} {"train_loss": -27.65219497680664, "global_step": 543673, "epoch": 6550} {"train_loss": -27.482288360595703, "global_step": 543674, "epoch": 6550} {"train_loss": -27.714862823486328, "global_step": 543675, "epoch": 6550} {"train_loss": -27.840646743774414, "global_step": 543676, "epoch": 6550} {"train_loss": -27.273107528686523, "global_step": 543677, "epoch": 6550} {"train_loss": -27.649091720581055, "global_step": 543678, "epoch": 6550} {"train_loss": -27.810333251953125, "global_step": 543679, "epoch": 6550} {"train_loss": -27.880237579345703, "global_step": 543680, "epoch": 6550} {"train_loss": -27.9630184173584, "global_step": 543681, "epoch": 6550} {"train_loss": -27.72904396057129, "global_step": 543682, "epoch": 6550} {"train_loss": -27.468616485595703, "global_step": 543683, "epoch": 6550} {"train_loss": -27.959857940673828, "global_step": 543684, "epoch": 6550} {"train_loss": -27.47211265563965, "global_step": 543685, "epoch": 6550} {"train_loss": -27.431304931640625, "global_step": 543686, "epoch": 6550} {"train_loss": -27.38919448852539, "global_step": 543687, "epoch": 6550} {"train_loss": -27.1419677734375, "global_step": 543688, "epoch": 6550} {"train_loss": -27.900238037109375, "global_step": 543689, "epoch": 6550} {"train_loss": -27.489221572875977, "global_step": 543690, "epoch": 6550} {"train_loss": -27.45831298828125, "global_step": 543691, "epoch": 6550} {"train_loss": -27.57997703552246, "global_step": 543692, "epoch": 6550} {"train_loss": -27.834095001220703, "global_step": 543693, "epoch": 6550} {"train_loss": -27.748029708862305, "global_step": 543694, "epoch": 6550} {"train_loss": -28.059955596923828, "global_step": 543695, "epoch": 6550} {"train_loss": -27.69160270690918, "global_step": 543696, "epoch": 6550} {"train_loss": -27.46476173400879, "global_step": 543697, "epoch": 6550} {"train_loss": -27.662281036376953, "global_step": 543698, "epoch": 6550} {"train_loss": -27.32407569885254, "global_step": 543699, "epoch": 6550} {"train_loss": -27.39130973815918, "global_step": 543700, "epoch": 6550} {"train_loss": -27.415815353393555, "global_step": 543701, "epoch": 6550} {"train_loss": -27.528173446655273, "global_step": 543702, "epoch": 6550} {"train_loss": -27.859821319580078, "global_step": 543703, "epoch": 6550} {"train_loss": -27.738758087158203, "global_step": 543704, "epoch": 6550} {"train_loss": -27.427942276000977, "global_step": 543705, "epoch": 6550} {"train_loss": -28.01179313659668, "global_step": 543706, "epoch": 6550} {"train_loss": -27.67424964904785, "global_step": 543707, "epoch": 6550} {"train_loss": -27.762470245361328, "global_step": 543708, "epoch": 6550} {"train_loss": -27.341611862182617, "global_step": 543709, "epoch": 6550} {"train_loss": -27.098859786987305, "global_step": 543710, "epoch": 6550} {"train_loss": -27.1004581451416, "global_step": 543711, "epoch": 6550} {"train_loss": -26.88681411743164, "global_step": 543712, "epoch": 6550} {"train_loss": -26.84187126159668, "global_step": 543713, "epoch": 6550} {"train_loss": -26.57367515563965, "global_step": 543714, "epoch": 6550} {"train_loss": -27.088947296142578, "global_step": 543715, "epoch": 6550} {"train_loss": -28.061914443969727, "global_step": 543716, "epoch": 6550} {"train_loss": -27.509368896484375, "global_step": 543717, "epoch": 6550} {"train_loss": -27.47906494140625, "global_step": 543718, "epoch": 6550} {"train_loss": -27.66912841796875, "global_step": 543719, "epoch": 6550} {"train_loss": -27.26712989807129, "global_step": 543720, "epoch": 6550} {"train_loss": -27.148941040039062, "global_step": 543721, "epoch": 6550} {"train_loss": -27.88374900817871, "global_step": 543722, "epoch": 6550} {"train_loss": -27.31390380859375, "global_step": 543723, "epoch": 6550} {"train_loss": -27.426549911499023, "global_step": 543724, "epoch": 6550} {"train_loss": -27.780515670776367, "global_step": 543725, "epoch": 6550} {"train_loss": -27.437124252319336, "global_step": 543726, "epoch": 6550} {"train_loss": -27.502958297729492, "global_step": 543727, "epoch": 6550} {"train_loss": -27.34683609008789, "global_step": 543728, "epoch": 6550} {"train_loss": -27.915847778320312, "global_step": 543729, "epoch": 6550} {"train_loss": -27.421728134155273, "global_step": 543730, "epoch": 6550} {"train_loss": -27.88492202758789, "global_step": 543731, "epoch": 6550} {"train_loss": -27.49914854118623, "global_step": 543732, "epoch": 6550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6643798.0} {"train_loss": -27.191146850585938, "global_step": 543733, "epoch": 6551} {"train_loss": -27.48756980895996, "global_step": 543734, "epoch": 6551} {"train_loss": -27.65779685974121, "global_step": 543735, "epoch": 6551} {"train_loss": -27.6085262298584, "global_step": 543736, "epoch": 6551} {"train_loss": -27.812604904174805, "global_step": 543737, "epoch": 6551} {"train_loss": -27.676651000976562, "global_step": 543738, "epoch": 6551} {"train_loss": -27.638166427612305, "global_step": 543739, "epoch": 6551} {"train_loss": -27.555835723876953, "global_step": 543740, "epoch": 6551} {"train_loss": -27.5688533782959, "global_step": 543741, "epoch": 6551} {"train_loss": -27.575763702392578, "global_step": 543742, "epoch": 6551} {"train_loss": -27.765424728393555, "global_step": 543743, "epoch": 6551} {"train_loss": -27.84273338317871, "global_step": 543744, "epoch": 6551} {"train_loss": -27.382282257080078, "global_step": 543745, "epoch": 6551} {"train_loss": -27.57562255859375, "global_step": 543746, "epoch": 6551} {"train_loss": -27.646936416625977, "global_step": 543747, "epoch": 6551} {"train_loss": -27.431278228759766, "global_step": 543748, "epoch": 6551} {"train_loss": -27.688146591186523, "global_step": 543749, "epoch": 6551} {"train_loss": -27.87506103515625, "global_step": 543750, "epoch": 6551} {"train_loss": -27.59588623046875, "global_step": 543751, "epoch": 6551} {"train_loss": -27.274511337280273, "global_step": 543752, "epoch": 6551} {"train_loss": -27.775989532470703, "global_step": 543753, "epoch": 6551} {"train_loss": -27.867773056030273, "global_step": 543754, "epoch": 6551} {"train_loss": -28.2705020904541, "global_step": 543755, "epoch": 6551} {"train_loss": -27.584638595581055, "global_step": 543756, "epoch": 6551} {"train_loss": -27.636856079101562, "global_step": 543757, "epoch": 6551} {"train_loss": -27.4886417388916, "global_step": 543758, "epoch": 6551} {"train_loss": -27.194751739501953, "global_step": 543759, "epoch": 6551} {"train_loss": -27.381338119506836, "global_step": 543760, "epoch": 6551} {"train_loss": -27.69508171081543, "global_step": 543761, "epoch": 6551} {"train_loss": -27.7286376953125, "global_step": 543762, "epoch": 6551} {"train_loss": -27.355756759643555, "global_step": 543763, "epoch": 6551} {"train_loss": -27.941146850585938, "global_step": 543764, "epoch": 6551} {"train_loss": -27.743921279907227, "global_step": 543765, "epoch": 6551} {"train_loss": -27.69775390625, "global_step": 543766, "epoch": 6551} {"train_loss": -27.827362060546875, "global_step": 543767, "epoch": 6551} {"train_loss": -27.428119659423828, "global_step": 543768, "epoch": 6551} {"train_loss": -27.415918350219727, "global_step": 543769, "epoch": 6551} {"train_loss": -27.582792282104492, "global_step": 543770, "epoch": 6551} {"train_loss": -27.167524337768555, "global_step": 543771, "epoch": 6551} {"train_loss": -27.14890480041504, "global_step": 543772, "epoch": 6551} {"train_loss": -27.4727725982666, "global_step": 543773, "epoch": 6551} {"train_loss": -27.61954116821289, "global_step": 543774, "epoch": 6551} {"train_loss": -27.790863037109375, "global_step": 543775, "epoch": 6551} {"train_loss": -27.7078800201416, "global_step": 543776, "epoch": 6551} {"train_loss": -27.34943962097168, "global_step": 543777, "epoch": 6551} {"train_loss": -27.82590675354004, "global_step": 543778, "epoch": 6551} {"train_loss": -27.6430721282959, "global_step": 543779, "epoch": 6551} {"train_loss": -27.673933029174805, "global_step": 543780, "epoch": 6551} {"train_loss": -27.616199493408203, "global_step": 543781, "epoch": 6551} {"train_loss": -27.620481491088867, "global_step": 543782, "epoch": 6551} {"train_loss": -27.46522331237793, "global_step": 543783, "epoch": 6551} {"train_loss": -27.846708297729492, "global_step": 543784, "epoch": 6551} {"train_loss": -27.56415367126465, "global_step": 543785, "epoch": 6551} {"train_loss": -27.649404525756836, "global_step": 543786, "epoch": 6551} {"train_loss": -27.55976676940918, "global_step": 543787, "epoch": 6551} {"train_loss": -27.902969360351562, "global_step": 543788, "epoch": 6551} {"train_loss": -28.03098487854004, "global_step": 543789, "epoch": 6551} {"train_loss": -27.88327407836914, "global_step": 543790, "epoch": 6551} {"train_loss": -27.51582145690918, "global_step": 543791, "epoch": 6551} {"train_loss": -27.355926513671875, "global_step": 543792, "epoch": 6551} {"train_loss": -27.304426193237305, "global_step": 543793, "epoch": 6551} {"train_loss": -27.710180282592773, "global_step": 543794, "epoch": 6551} {"train_loss": -27.373580932617188, "global_step": 543795, "epoch": 6551} {"train_loss": -27.31747817993164, "global_step": 543796, "epoch": 6551} {"train_loss": -27.172504425048828, "global_step": 543797, "epoch": 6551} {"train_loss": -27.112585067749023, "global_step": 543798, "epoch": 6551} {"train_loss": -27.129043579101562, "global_step": 543799, "epoch": 6551} {"train_loss": -27.75977897644043, "global_step": 543800, "epoch": 6551} {"train_loss": -27.76511573791504, "global_step": 543801, "epoch": 6551} {"train_loss": -27.63287353515625, "global_step": 543802, "epoch": 6551} {"train_loss": -27.708744049072266, "global_step": 543803, "epoch": 6551} {"train_loss": -27.898609161376953, "global_step": 543804, "epoch": 6551} {"train_loss": -27.933629989624023, "global_step": 543805, "epoch": 6551} {"train_loss": -27.213735580444336, "global_step": 543806, "epoch": 6551} {"train_loss": -27.785144805908203, "global_step": 543807, "epoch": 6551} {"train_loss": -27.6112060546875, "global_step": 543808, "epoch": 6551} {"train_loss": -27.4423885345459, "global_step": 543809, "epoch": 6551} {"train_loss": -27.848926544189453, "global_step": 543810, "epoch": 6551} {"train_loss": -27.612157821655273, "global_step": 543811, "epoch": 6551} {"train_loss": -27.4503173828125, "global_step": 543812, "epoch": 6551} {"train_loss": -27.631128311157227, "global_step": 543813, "epoch": 6551} {"train_loss": -27.5383358001709, "global_step": 543814, "epoch": 6551} {"train_loss": -27.595428581697394, "global_step": 543815, "epoch": 6551, "val_loss": 6497444.0} {"train_loss": -27.127431869506836, "global_step": 543816, "epoch": 6552} {"train_loss": -26.667896270751953, "global_step": 543817, "epoch": 6552} {"train_loss": -26.737119674682617, "global_step": 543818, "epoch": 6552} {"train_loss": -27.46430015563965, "global_step": 543819, "epoch": 6552} {"train_loss": -26.816091537475586, "global_step": 543820, "epoch": 6552} {"train_loss": -25.942026138305664, "global_step": 543821, "epoch": 6552} {"train_loss": -26.78400230407715, "global_step": 543822, "epoch": 6552} {"train_loss": -27.490758895874023, "global_step": 543823, "epoch": 6552} {"train_loss": -25.677465438842773, "global_step": 543824, "epoch": 6552} {"train_loss": -26.851959228515625, "global_step": 543825, "epoch": 6552} {"train_loss": -26.4512939453125, "global_step": 543826, "epoch": 6552} {"train_loss": -26.676374435424805, "global_step": 543827, "epoch": 6552} {"train_loss": -26.729150772094727, "global_step": 543828, "epoch": 6552} {"train_loss": -27.459003448486328, "global_step": 543829, "epoch": 6552} {"train_loss": -26.94000244140625, "global_step": 543830, "epoch": 6552} {"train_loss": -26.967924118041992, "global_step": 543831, "epoch": 6552} {"train_loss": -26.850507736206055, "global_step": 543832, "epoch": 6552} {"train_loss": -27.125585556030273, "global_step": 543833, "epoch": 6552} {"train_loss": -26.92287254333496, "global_step": 543834, "epoch": 6552} {"train_loss": -27.4080753326416, "global_step": 543835, "epoch": 6552} {"train_loss": -26.896772384643555, "global_step": 543836, "epoch": 6552} {"train_loss": -27.15399742126465, "global_step": 543837, "epoch": 6552} {"train_loss": -27.174535751342773, "global_step": 543838, "epoch": 6552} {"train_loss": -26.839956283569336, "global_step": 543839, "epoch": 6552} {"train_loss": -27.238672256469727, "global_step": 543840, "epoch": 6552} {"train_loss": -27.02247428894043, "global_step": 543841, "epoch": 6552} {"train_loss": -27.181936264038086, "global_step": 543842, "epoch": 6552} {"train_loss": -27.586944580078125, "global_step": 543843, "epoch": 6552} {"train_loss": -27.018117904663086, "global_step": 543844, "epoch": 6552} {"train_loss": -27.1993465423584, "global_step": 543845, "epoch": 6552} {"train_loss": -27.344038009643555, "global_step": 543846, "epoch": 6552} {"train_loss": -27.28192138671875, "global_step": 543847, "epoch": 6552} {"train_loss": -27.325180053710938, "global_step": 543848, "epoch": 6552} {"train_loss": -27.28215980529785, "global_step": 543849, "epoch": 6552} {"train_loss": -28.097915649414062, "global_step": 543850, "epoch": 6552} {"train_loss": -27.472049713134766, "global_step": 543851, "epoch": 6552} {"train_loss": -27.322736740112305, "global_step": 543852, "epoch": 6552} {"train_loss": -27.334375381469727, "global_step": 543853, "epoch": 6552} {"train_loss": -27.629547119140625, "global_step": 543854, "epoch": 6552} {"train_loss": -27.697553634643555, "global_step": 543855, "epoch": 6552} {"train_loss": -27.655820846557617, "global_step": 543856, "epoch": 6552} {"train_loss": -27.411117553710938, "global_step": 543857, "epoch": 6552} {"train_loss": -27.5194149017334, "global_step": 543858, "epoch": 6552} {"train_loss": -27.667346954345703, "global_step": 543859, "epoch": 6552} {"train_loss": -27.707483291625977, "global_step": 543860, "epoch": 6552} {"train_loss": -27.958770751953125, "global_step": 543861, "epoch": 6552} {"train_loss": -27.730268478393555, "global_step": 543862, "epoch": 6552} {"train_loss": -28.011953353881836, "global_step": 543863, "epoch": 6552} {"train_loss": -27.91179847717285, "global_step": 543864, "epoch": 6552} {"train_loss": -27.6948184967041, "global_step": 543865, "epoch": 6552} {"train_loss": -27.618253707885742, "global_step": 543866, "epoch": 6552} {"train_loss": -27.8700008392334, "global_step": 543867, "epoch": 6552} {"train_loss": -27.790027618408203, "global_step": 543868, "epoch": 6552} {"train_loss": -27.779630661010742, "global_step": 543869, "epoch": 6552} {"train_loss": -28.03993034362793, "global_step": 543870, "epoch": 6552} {"train_loss": -27.607297897338867, "global_step": 543871, "epoch": 6552} {"train_loss": -27.806060791015625, "global_step": 543872, "epoch": 6552} {"train_loss": -27.709522247314453, "global_step": 543873, "epoch": 6552} {"train_loss": -27.778339385986328, "global_step": 543874, "epoch": 6552} {"train_loss": -27.708301544189453, "global_step": 543875, "epoch": 6552} {"train_loss": -28.03973960876465, "global_step": 543876, "epoch": 6552} {"train_loss": -27.7633056640625, "global_step": 543877, "epoch": 6552} {"train_loss": -27.939477920532227, "global_step": 543878, "epoch": 6552} {"train_loss": -27.747156143188477, "global_step": 543879, "epoch": 6552} {"train_loss": -28.093708038330078, "global_step": 543880, "epoch": 6552} {"train_loss": -28.030195236206055, "global_step": 543881, "epoch": 6552} {"train_loss": -27.792709350585938, "global_step": 543882, "epoch": 6552} {"train_loss": -27.96522331237793, "global_step": 543883, "epoch": 6552} {"train_loss": -27.659818649291992, "global_step": 543884, "epoch": 6552} {"train_loss": -27.897205352783203, "global_step": 543885, "epoch": 6552} {"train_loss": -27.875558853149414, "global_step": 543886, "epoch": 6552} {"train_loss": -27.89369010925293, "global_step": 543887, "epoch": 6552} {"train_loss": -27.71172523498535, "global_step": 543888, "epoch": 6552} {"train_loss": -27.952884674072266, "global_step": 543889, "epoch": 6552} {"train_loss": -27.4498348236084, "global_step": 543890, "epoch": 6552} {"train_loss": -27.8298397064209, "global_step": 543891, "epoch": 6552} {"train_loss": -27.9389591217041, "global_step": 543892, "epoch": 6552} {"train_loss": -27.570871353149414, "global_step": 543893, "epoch": 6552} {"train_loss": -27.295019149780273, "global_step": 543894, "epoch": 6552} {"train_loss": -27.3926944732666, "global_step": 543895, "epoch": 6552} {"train_loss": -27.5533390045166, "global_step": 543896, "epoch": 6552} {"train_loss": -27.38075065612793, "global_step": 543897, "epoch": 6552} {"train_loss": -27.4293166930417, "global_step": 543898, "epoch": 6552, "val_loss": 6610010.0} {"train_loss": -26.703622817993164, "global_step": 543899, "epoch": 6553} {"train_loss": -25.544761657714844, "global_step": 543900, "epoch": 6553} {"train_loss": -26.38567543029785, "global_step": 543901, "epoch": 6553} {"train_loss": -26.535144805908203, "global_step": 543902, "epoch": 6553} {"train_loss": -27.285064697265625, "global_step": 543903, "epoch": 6553} {"train_loss": -27.468246459960938, "global_step": 543904, "epoch": 6553} {"train_loss": -27.095600128173828, "global_step": 543905, "epoch": 6553} {"train_loss": -26.8226261138916, "global_step": 543906, "epoch": 6553} {"train_loss": -27.073062896728516, "global_step": 543907, "epoch": 6553} {"train_loss": -26.88728141784668, "global_step": 543908, "epoch": 6553} {"train_loss": -26.994714736938477, "global_step": 543909, "epoch": 6553} {"train_loss": -27.198827743530273, "global_step": 543910, "epoch": 6553} {"train_loss": -27.597015380859375, "global_step": 543911, "epoch": 6553} {"train_loss": -27.24871253967285, "global_step": 543912, "epoch": 6553} {"train_loss": -27.843658447265625, "global_step": 543913, "epoch": 6553} {"train_loss": -27.388397216796875, "global_step": 543914, "epoch": 6553} {"train_loss": -27.42963218688965, "global_step": 543915, "epoch": 6553} {"train_loss": -27.6634578704834, "global_step": 543916, "epoch": 6553} {"train_loss": -27.589801788330078, "global_step": 543917, "epoch": 6553} {"train_loss": -27.149276733398438, "global_step": 543918, "epoch": 6553} {"train_loss": -27.438236236572266, "global_step": 543919, "epoch": 6553} {"train_loss": -27.51167106628418, "global_step": 543920, "epoch": 6553} {"train_loss": -27.588642120361328, "global_step": 543921, "epoch": 6553} {"train_loss": -27.597875595092773, "global_step": 543922, "epoch": 6553} {"train_loss": -27.430051803588867, "global_step": 543923, "epoch": 6553} {"train_loss": -27.181894302368164, "global_step": 543924, "epoch": 6553} {"train_loss": -27.4876708984375, "global_step": 543925, "epoch": 6553} {"train_loss": -27.552183151245117, "global_step": 543926, "epoch": 6553} {"train_loss": -27.671178817749023, "global_step": 543927, "epoch": 6553} {"train_loss": -27.837329864501953, "global_step": 543928, "epoch": 6553} {"train_loss": -27.965478897094727, "global_step": 543929, "epoch": 6553} {"train_loss": -27.62824058532715, "global_step": 543930, "epoch": 6553} {"train_loss": -27.750577926635742, "global_step": 543931, "epoch": 6553} {"train_loss": -27.806562423706055, "global_step": 543932, "epoch": 6553} {"train_loss": -27.58243751525879, "global_step": 543933, "epoch": 6553} {"train_loss": -28.170969009399414, "global_step": 543934, "epoch": 6553} {"train_loss": -27.770893096923828, "global_step": 543935, "epoch": 6553} {"train_loss": -27.878849029541016, "global_step": 543936, "epoch": 6553} {"train_loss": -27.511579513549805, "global_step": 543937, "epoch": 6553} {"train_loss": -27.548532485961914, "global_step": 543938, "epoch": 6553} {"train_loss": -27.796478271484375, "global_step": 543939, "epoch": 6553} {"train_loss": -27.95452880859375, "global_step": 543940, "epoch": 6553} {"train_loss": -27.894941329956055, "global_step": 543941, "epoch": 6553} {"train_loss": -27.66009521484375, "global_step": 543942, "epoch": 6553} {"train_loss": -27.754003524780273, "global_step": 543943, "epoch": 6553} {"train_loss": -27.809904098510742, "global_step": 543944, "epoch": 6553} {"train_loss": -27.801477432250977, "global_step": 543945, "epoch": 6553} {"train_loss": -27.744375228881836, "global_step": 543946, "epoch": 6553} {"train_loss": -27.83259391784668, "global_step": 543947, "epoch": 6553} {"train_loss": -27.813125610351562, "global_step": 543948, "epoch": 6553} {"train_loss": -27.945993423461914, "global_step": 543949, "epoch": 6553} {"train_loss": -27.806631088256836, "global_step": 543950, "epoch": 6553} {"train_loss": -27.92156982421875, "global_step": 543951, "epoch": 6553} {"train_loss": -27.345996856689453, "global_step": 543952, "epoch": 6553} {"train_loss": -27.900197982788086, "global_step": 543953, "epoch": 6553} {"train_loss": -27.643802642822266, "global_step": 543954, "epoch": 6553} {"train_loss": -27.69907569885254, "global_step": 543955, "epoch": 6553} {"train_loss": -27.860090255737305, "global_step": 543956, "epoch": 6553} {"train_loss": -27.719207763671875, "global_step": 543957, "epoch": 6553} {"train_loss": -27.611682891845703, "global_step": 543958, "epoch": 6553} {"train_loss": -27.902082443237305, "global_step": 543959, "epoch": 6553} {"train_loss": -27.748462677001953, "global_step": 543960, "epoch": 6553} {"train_loss": -28.001134872436523, "global_step": 543961, "epoch": 6553} {"train_loss": -28.209692001342773, "global_step": 543962, "epoch": 6553} {"train_loss": -27.603647232055664, "global_step": 543963, "epoch": 6553} {"train_loss": -27.695653915405273, "global_step": 543964, "epoch": 6553} {"train_loss": -27.54591178894043, "global_step": 543965, "epoch": 6553} {"train_loss": -28.05328369140625, "global_step": 543966, "epoch": 6553} {"train_loss": -27.9024715423584, "global_step": 543967, "epoch": 6553} {"train_loss": -27.634552001953125, "global_step": 543968, "epoch": 6553} {"train_loss": -27.795120239257812, "global_step": 543969, "epoch": 6553} {"train_loss": -27.456607818603516, "global_step": 543970, "epoch": 6553} {"train_loss": -26.647979736328125, "global_step": 543971, "epoch": 6553} {"train_loss": -25.736352920532227, "global_step": 543972, "epoch": 6553} {"train_loss": -25.15716552734375, "global_step": 543973, "epoch": 6553} {"train_loss": -27.13051414489746, "global_step": 543974, "epoch": 6553} {"train_loss": -26.95758056640625, "global_step": 543975, "epoch": 6553} {"train_loss": -26.680295944213867, "global_step": 543976, "epoch": 6553} {"train_loss": -27.042205810546875, "global_step": 543977, "epoch": 6553} {"train_loss": -27.128662109375, "global_step": 543978, "epoch": 6553} {"train_loss": -26.823486328125, "global_step": 543979, "epoch": 6553} {"train_loss": -27.5252628326416, "global_step": 543980, "epoch": 6553} {"train_loss": -27.46197911917445, "global_step": 543981, "epoch": 6553, "val_loss": 6574184.0} {"train_loss": -26.51846694946289, "global_step": 543982, "epoch": 6554} {"train_loss": -27.036813735961914, "global_step": 543983, "epoch": 6554} {"train_loss": -26.5987606048584, "global_step": 543984, "epoch": 6554} {"train_loss": -27.33746337890625, "global_step": 543985, "epoch": 6554} {"train_loss": -26.53834342956543, "global_step": 543986, "epoch": 6554} {"train_loss": -27.04414176940918, "global_step": 543987, "epoch": 6554} {"train_loss": -27.17572593688965, "global_step": 543988, "epoch": 6554} {"train_loss": -27.19648551940918, "global_step": 543989, "epoch": 6554} {"train_loss": -27.133960723876953, "global_step": 543990, "epoch": 6554} {"train_loss": -26.9886531829834, "global_step": 543991, "epoch": 6554} {"train_loss": -27.247791290283203, "global_step": 543992, "epoch": 6554} {"train_loss": -26.905561447143555, "global_step": 543993, "epoch": 6554} {"train_loss": -27.093311309814453, "global_step": 543994, "epoch": 6554} {"train_loss": -26.903797149658203, "global_step": 543995, "epoch": 6554} {"train_loss": -27.348432540893555, "global_step": 543996, "epoch": 6554} {"train_loss": -27.159027099609375, "global_step": 543997, "epoch": 6554} {"train_loss": -27.34552001953125, "global_step": 543998, "epoch": 6554} {"train_loss": -27.24750328063965, "global_step": 543999, "epoch": 6554} {"train_loss": -27.555871963500977, "global_step": 544000, "epoch": 6554} {"train_loss": -26.954557418823242, "global_step": 544001, "epoch": 6554} {"train_loss": -27.643280029296875, "global_step": 544002, "epoch": 6554} {"train_loss": -27.275426864624023, "global_step": 544003, "epoch": 6554} {"train_loss": -27.2771053314209, "global_step": 544004, "epoch": 6554} {"train_loss": -27.168283462524414, "global_step": 544005, "epoch": 6554} {"train_loss": -27.36569595336914, "global_step": 544006, "epoch": 6554} {"train_loss": -27.528913497924805, "global_step": 544007, "epoch": 6554} {"train_loss": -27.681869506835938, "global_step": 544008, "epoch": 6554} {"train_loss": -27.552845001220703, "global_step": 544009, "epoch": 6554} {"train_loss": -27.822601318359375, "global_step": 544010, "epoch": 6554} {"train_loss": -27.63392448425293, "global_step": 544011, "epoch": 6554} {"train_loss": -27.821035385131836, "global_step": 544012, "epoch": 6554} {"train_loss": -27.650033950805664, "global_step": 544013, "epoch": 6554} {"train_loss": -27.502124786376953, "global_step": 544014, "epoch": 6554} {"train_loss": -27.702558517456055, "global_step": 544015, "epoch": 6554} {"train_loss": -27.64459228515625, "global_step": 544016, "epoch": 6554} {"train_loss": -27.72945213317871, "global_step": 544017, "epoch": 6554} {"train_loss": -27.866174697875977, "global_step": 544018, "epoch": 6554} {"train_loss": -27.89242935180664, "global_step": 544019, "epoch": 6554} {"train_loss": -27.88807487487793, "global_step": 544020, "epoch": 6554} {"train_loss": -27.923566818237305, "global_step": 544021, "epoch": 6554} {"train_loss": -27.4970703125, "global_step": 544022, "epoch": 6554} {"train_loss": -28.162012100219727, "global_step": 544023, "epoch": 6554} {"train_loss": -27.589187622070312, "global_step": 544024, "epoch": 6554} {"train_loss": -27.769315719604492, "global_step": 544025, "epoch": 6554} {"train_loss": -27.5270938873291, "global_step": 544026, "epoch": 6554} {"train_loss": -28.050153732299805, "global_step": 544027, "epoch": 6554} {"train_loss": -27.637760162353516, "global_step": 544028, "epoch": 6554} {"train_loss": -27.689985275268555, "global_step": 544029, "epoch": 6554} {"train_loss": -27.698352813720703, "global_step": 544030, "epoch": 6554} {"train_loss": -27.898313522338867, "global_step": 544031, "epoch": 6554} {"train_loss": -27.783910751342773, "global_step": 544032, "epoch": 6554} {"train_loss": -27.711145401000977, "global_step": 544033, "epoch": 6554} {"train_loss": -27.945056915283203, "global_step": 544034, "epoch": 6554} {"train_loss": -27.579788208007812, "global_step": 544035, "epoch": 6554} {"train_loss": -27.784223556518555, "global_step": 544036, "epoch": 6554} {"train_loss": -28.126148223876953, "global_step": 544037, "epoch": 6554} {"train_loss": -27.472644805908203, "global_step": 544038, "epoch": 6554} {"train_loss": -27.724584579467773, "global_step": 544039, "epoch": 6554} {"train_loss": -27.58807945251465, "global_step": 544040, "epoch": 6554} {"train_loss": -28.197357177734375, "global_step": 544041, "epoch": 6554} {"train_loss": -28.113195419311523, "global_step": 544042, "epoch": 6554} {"train_loss": -28.010684967041016, "global_step": 544043, "epoch": 6554} {"train_loss": -27.76344108581543, "global_step": 544044, "epoch": 6554} {"train_loss": -27.88697624206543, "global_step": 544045, "epoch": 6554} {"train_loss": -27.645587921142578, "global_step": 544046, "epoch": 6554} {"train_loss": -27.8754940032959, "global_step": 544047, "epoch": 6554} {"train_loss": -27.47781753540039, "global_step": 544048, "epoch": 6554} {"train_loss": -27.856184005737305, "global_step": 544049, "epoch": 6554} {"train_loss": -28.081180572509766, "global_step": 544050, "epoch": 6554} {"train_loss": -28.01120948791504, "global_step": 544051, "epoch": 6554} {"train_loss": -27.273792266845703, "global_step": 544052, "epoch": 6554} {"train_loss": -27.53985023498535, "global_step": 544053, "epoch": 6554} {"train_loss": -27.648035049438477, "global_step": 544054, "epoch": 6554} {"train_loss": -27.50098991394043, "global_step": 544055, "epoch": 6554} {"train_loss": -27.02813720703125, "global_step": 544056, "epoch": 6554} {"train_loss": -26.68653678894043, "global_step": 544057, "epoch": 6554} {"train_loss": -27.950531005859375, "global_step": 544058, "epoch": 6554} {"train_loss": -27.37653923034668, "global_step": 544059, "epoch": 6554} {"train_loss": -27.444019317626953, "global_step": 544060, "epoch": 6554} {"train_loss": -26.86246681213379, "global_step": 544061, "epoch": 6554} {"train_loss": -27.166845321655273, "global_step": 544062, "epoch": 6554} {"train_loss": -27.552692413330078, "global_step": 544063, "epoch": 6554} {"train_loss": -27.502312648727234, "global_step": 544064, "epoch": 6554, "val_loss": 6604688.5} {"train_loss": -26.30645179748535, "global_step": 544065, "epoch": 6555} {"train_loss": -26.931293487548828, "global_step": 544066, "epoch": 6555} {"train_loss": -27.1375732421875, "global_step": 544067, "epoch": 6555} {"train_loss": -26.138751983642578, "global_step": 544068, "epoch": 6555} {"train_loss": -27.38296890258789, "global_step": 544069, "epoch": 6555} {"train_loss": -27.06962013244629, "global_step": 544070, "epoch": 6555} {"train_loss": -27.17121696472168, "global_step": 544071, "epoch": 6555} {"train_loss": -26.745513916015625, "global_step": 544072, "epoch": 6555} {"train_loss": -27.41570472717285, "global_step": 544073, "epoch": 6555} {"train_loss": -27.13850212097168, "global_step": 544074, "epoch": 6555} {"train_loss": -27.409887313842773, "global_step": 544075, "epoch": 6555} {"train_loss": -27.1705322265625, "global_step": 544076, "epoch": 6555} {"train_loss": -27.275495529174805, "global_step": 544077, "epoch": 6555} {"train_loss": -27.17420768737793, "global_step": 544078, "epoch": 6555} {"train_loss": -27.19840431213379, "global_step": 544079, "epoch": 6555} {"train_loss": -27.326879501342773, "global_step": 544080, "epoch": 6555} {"train_loss": -27.244192123413086, "global_step": 544081, "epoch": 6555} {"train_loss": -27.45191764831543, "global_step": 544082, "epoch": 6555} {"train_loss": -27.49395179748535, "global_step": 544083, "epoch": 6555} {"train_loss": -27.6195125579834, "global_step": 544084, "epoch": 6555} {"train_loss": -27.81744956970215, "global_step": 544085, "epoch": 6555} {"train_loss": -27.374439239501953, "global_step": 544086, "epoch": 6555} {"train_loss": -27.53369140625, "global_step": 544087, "epoch": 6555} {"train_loss": -27.63434410095215, "global_step": 544088, "epoch": 6555} {"train_loss": -27.74538230895996, "global_step": 544089, "epoch": 6555} {"train_loss": -27.48019790649414, "global_step": 544090, "epoch": 6555} {"train_loss": -27.635162353515625, "global_step": 544091, "epoch": 6555} {"train_loss": -27.828222274780273, "global_step": 544092, "epoch": 6555} {"train_loss": -27.497913360595703, "global_step": 544093, "epoch": 6555} {"train_loss": -27.77044677734375, "global_step": 544094, "epoch": 6555} {"train_loss": -27.944000244140625, "global_step": 544095, "epoch": 6555} {"train_loss": -27.77370262145996, "global_step": 544096, "epoch": 6555} {"train_loss": -27.726734161376953, "global_step": 544097, "epoch": 6555} {"train_loss": -28.100543975830078, "global_step": 544098, "epoch": 6555} {"train_loss": -27.71713638305664, "global_step": 544099, "epoch": 6555} {"train_loss": -27.929218292236328, "global_step": 544100, "epoch": 6555} {"train_loss": -27.613061904907227, "global_step": 544101, "epoch": 6555} {"train_loss": -28.21329116821289, "global_step": 544102, "epoch": 6555} {"train_loss": -27.761032104492188, "global_step": 544103, "epoch": 6555} {"train_loss": -27.558242797851562, "global_step": 544104, "epoch": 6555} {"train_loss": -27.62627601623535, "global_step": 544105, "epoch": 6555} {"train_loss": -27.62447166442871, "global_step": 544106, "epoch": 6555} {"train_loss": -28.397632598876953, "global_step": 544107, "epoch": 6555} {"train_loss": -28.10740089416504, "global_step": 544108, "epoch": 6555} {"train_loss": -27.88258171081543, "global_step": 544109, "epoch": 6555} {"train_loss": -27.969181060791016, "global_step": 544110, "epoch": 6555} {"train_loss": -27.997455596923828, "global_step": 544111, "epoch": 6555} {"train_loss": -28.096899032592773, "global_step": 544112, "epoch": 6555} {"train_loss": -27.689489364624023, "global_step": 544113, "epoch": 6555} {"train_loss": -27.570825576782227, "global_step": 544114, "epoch": 6555} {"train_loss": -27.650815963745117, "global_step": 544115, "epoch": 6555} {"train_loss": -27.99106788635254, "global_step": 544116, "epoch": 6555} {"train_loss": -28.103809356689453, "global_step": 544117, "epoch": 6555} {"train_loss": -28.034448623657227, "global_step": 544118, "epoch": 6555} {"train_loss": -27.566843032836914, "global_step": 544119, "epoch": 6555} {"train_loss": -27.035505294799805, "global_step": 544120, "epoch": 6555} {"train_loss": -26.907384872436523, "global_step": 544121, "epoch": 6555} {"train_loss": -27.153522491455078, "global_step": 544122, "epoch": 6555} {"train_loss": -27.449111938476562, "global_step": 544123, "epoch": 6555} {"train_loss": -27.324979782104492, "global_step": 544124, "epoch": 6555} {"train_loss": -27.816808700561523, "global_step": 544125, "epoch": 6555} {"train_loss": -27.299957275390625, "global_step": 544126, "epoch": 6555} {"train_loss": -27.410720825195312, "global_step": 544127, "epoch": 6555} {"train_loss": -27.218942642211914, "global_step": 544128, "epoch": 6555} {"train_loss": -27.614526748657227, "global_step": 544129, "epoch": 6555} {"train_loss": -28.118122100830078, "global_step": 544130, "epoch": 6555} {"train_loss": -27.567981719970703, "global_step": 544131, "epoch": 6555} {"train_loss": -27.47853660583496, "global_step": 544132, "epoch": 6555} {"train_loss": -27.34469985961914, "global_step": 544133, "epoch": 6555} {"train_loss": -27.844404220581055, "global_step": 544134, "epoch": 6555} {"train_loss": -27.553375244140625, "global_step": 544135, "epoch": 6555} {"train_loss": -27.6475830078125, "global_step": 544136, "epoch": 6555} {"train_loss": -27.585546493530273, "global_step": 544137, "epoch": 6555} {"train_loss": -27.6160945892334, "global_step": 544138, "epoch": 6555} {"train_loss": -27.33249282836914, "global_step": 544139, "epoch": 6555} {"train_loss": -27.461029052734375, "global_step": 544140, "epoch": 6555} {"train_loss": -27.447452545166016, "global_step": 544141, "epoch": 6555} {"train_loss": -27.23011589050293, "global_step": 544142, "epoch": 6555} {"train_loss": -27.93129539489746, "global_step": 544143, "epoch": 6555} {"train_loss": -27.452777862548828, "global_step": 544144, "epoch": 6555} {"train_loss": -27.35744285583496, "global_step": 544145, "epoch": 6555} {"train_loss": -27.497995376586914, "global_step": 544146, "epoch": 6555} {"train_loss": -27.522836960941913, "global_step": 544147, "epoch": 6555, "val_loss": 6547114.5} {"train_loss": -26.974964141845703, "global_step": 544148, "epoch": 6556} {"train_loss": -27.066614151000977, "global_step": 544149, "epoch": 6556} {"train_loss": -27.026477813720703, "global_step": 544150, "epoch": 6556} {"train_loss": -26.975061416625977, "global_step": 544151, "epoch": 6556} {"train_loss": -27.181440353393555, "global_step": 544152, "epoch": 6556} {"train_loss": -27.373233795166016, "global_step": 544153, "epoch": 6556} {"train_loss": -27.1350154876709, "global_step": 544154, "epoch": 6556} {"train_loss": -27.016895294189453, "global_step": 544155, "epoch": 6556} {"train_loss": -27.278900146484375, "global_step": 544156, "epoch": 6556} {"train_loss": -27.12092399597168, "global_step": 544157, "epoch": 6556} {"train_loss": -26.80837059020996, "global_step": 544158, "epoch": 6556} {"train_loss": -27.3377685546875, "global_step": 544159, "epoch": 6556} {"train_loss": -27.276611328125, "global_step": 544160, "epoch": 6556} {"train_loss": -27.41999626159668, "global_step": 544161, "epoch": 6556} {"train_loss": -27.12542724609375, "global_step": 544162, "epoch": 6556} {"train_loss": -27.386377334594727, "global_step": 544163, "epoch": 6556} {"train_loss": -27.67767333984375, "global_step": 544164, "epoch": 6556} {"train_loss": -27.312952041625977, "global_step": 544165, "epoch": 6556} {"train_loss": -27.277570724487305, "global_step": 544166, "epoch": 6556} {"train_loss": -27.678802490234375, "global_step": 544167, "epoch": 6556} {"train_loss": -27.65913200378418, "global_step": 544168, "epoch": 6556} {"train_loss": -27.619552612304688, "global_step": 544169, "epoch": 6556} {"train_loss": -27.833637237548828, "global_step": 544170, "epoch": 6556} {"train_loss": -27.135425567626953, "global_step": 544171, "epoch": 6556} {"train_loss": -27.4442138671875, "global_step": 544172, "epoch": 6556} {"train_loss": -27.494770050048828, "global_step": 544173, "epoch": 6556} {"train_loss": -27.693832397460938, "global_step": 544174, "epoch": 6556} {"train_loss": -27.76556396484375, "global_step": 544175, "epoch": 6556} {"train_loss": -27.654312133789062, "global_step": 544176, "epoch": 6556} {"train_loss": -27.861730575561523, "global_step": 544177, "epoch": 6556} {"train_loss": -27.822431564331055, "global_step": 544178, "epoch": 6556} {"train_loss": -27.373767852783203, "global_step": 544179, "epoch": 6556} {"train_loss": -27.843088150024414, "global_step": 544180, "epoch": 6556} {"train_loss": -27.740270614624023, "global_step": 544181, "epoch": 6556} {"train_loss": -27.618194580078125, "global_step": 544182, "epoch": 6556} {"train_loss": -27.572925567626953, "global_step": 544183, "epoch": 6556} {"train_loss": -28.002927780151367, "global_step": 544184, "epoch": 6556} {"train_loss": -27.50007438659668, "global_step": 544185, "epoch": 6556} {"train_loss": -27.912982940673828, "global_step": 544186, "epoch": 6556} {"train_loss": -27.550739288330078, "global_step": 544187, "epoch": 6556} {"train_loss": -28.14716911315918, "global_step": 544188, "epoch": 6556} {"train_loss": -27.62074089050293, "global_step": 544189, "epoch": 6556} {"train_loss": -27.621631622314453, "global_step": 544190, "epoch": 6556} {"train_loss": -27.90151023864746, "global_step": 544191, "epoch": 6556} {"train_loss": -27.751325607299805, "global_step": 544192, "epoch": 6556} {"train_loss": -27.834226608276367, "global_step": 544193, "epoch": 6556} {"train_loss": -27.998371124267578, "global_step": 544194, "epoch": 6556} {"train_loss": -28.066797256469727, "global_step": 544195, "epoch": 6556} {"train_loss": -28.021167755126953, "global_step": 544196, "epoch": 6556} {"train_loss": -28.128625869750977, "global_step": 544197, "epoch": 6556} {"train_loss": -28.07720947265625, "global_step": 544198, "epoch": 6556} {"train_loss": -27.85561180114746, "global_step": 544199, "epoch": 6556} {"train_loss": -27.89313316345215, "global_step": 544200, "epoch": 6556} {"train_loss": -28.316852569580078, "global_step": 544201, "epoch": 6556} {"train_loss": -27.472257614135742, "global_step": 544202, "epoch": 6556} {"train_loss": -28.093469619750977, "global_step": 544203, "epoch": 6556} {"train_loss": -27.425851821899414, "global_step": 544204, "epoch": 6556} {"train_loss": -27.90450096130371, "global_step": 544205, "epoch": 6556} {"train_loss": -28.06026268005371, "global_step": 544206, "epoch": 6556} {"train_loss": -27.63111686706543, "global_step": 544207, "epoch": 6556} {"train_loss": -27.9417724609375, "global_step": 544208, "epoch": 6556} {"train_loss": -27.362548828125, "global_step": 544209, "epoch": 6556} {"train_loss": -27.7584285736084, "global_step": 544210, "epoch": 6556} {"train_loss": -27.55191421508789, "global_step": 544211, "epoch": 6556} {"train_loss": -27.755239486694336, "global_step": 544212, "epoch": 6556} {"train_loss": -27.602094650268555, "global_step": 544213, "epoch": 6556} {"train_loss": -27.90185546875, "global_step": 544214, "epoch": 6556} {"train_loss": -27.386798858642578, "global_step": 544215, "epoch": 6556} {"train_loss": -27.485797882080078, "global_step": 544216, "epoch": 6556} {"train_loss": -27.746793746948242, "global_step": 544217, "epoch": 6556} {"train_loss": -27.747243881225586, "global_step": 544218, "epoch": 6556} {"train_loss": -27.6622314453125, "global_step": 544219, "epoch": 6556} {"train_loss": -27.190099716186523, "global_step": 544220, "epoch": 6556} {"train_loss": -26.202741622924805, "global_step": 544221, "epoch": 6556} {"train_loss": -26.105762481689453, "global_step": 544222, "epoch": 6556} {"train_loss": -27.049457550048828, "global_step": 544223, "epoch": 6556} {"train_loss": -27.36923599243164, "global_step": 544224, "epoch": 6556} {"train_loss": -26.53431510925293, "global_step": 544225, "epoch": 6556} {"train_loss": -26.45608901977539, "global_step": 544226, "epoch": 6556} {"train_loss": -27.63629722595215, "global_step": 544227, "epoch": 6556} {"train_loss": -26.811132431030273, "global_step": 544228, "epoch": 6556} {"train_loss": -27.052480697631836, "global_step": 544229, "epoch": 6556} {"train_loss": -27.5285272023764, "global_step": 544230, "epoch": 6556, "val_loss": 6615266.0} {"train_loss": -26.120025634765625, "global_step": 544231, "epoch": 6557} {"train_loss": -26.92647361755371, "global_step": 544232, "epoch": 6557} {"train_loss": -26.729888916015625, "global_step": 544233, "epoch": 6557} {"train_loss": -26.91965675354004, "global_step": 544234, "epoch": 6557} {"train_loss": -26.7098388671875, "global_step": 544235, "epoch": 6557} {"train_loss": -27.03415870666504, "global_step": 544236, "epoch": 6557} {"train_loss": -26.967792510986328, "global_step": 544237, "epoch": 6557} {"train_loss": -26.96648597717285, "global_step": 544238, "epoch": 6557} {"train_loss": -26.78590202331543, "global_step": 544239, "epoch": 6557} {"train_loss": -27.263147354125977, "global_step": 544240, "epoch": 6557} {"train_loss": -27.35926628112793, "global_step": 544241, "epoch": 6557} {"train_loss": -27.163625717163086, "global_step": 544242, "epoch": 6557} {"train_loss": -26.774890899658203, "global_step": 544243, "epoch": 6557} {"train_loss": -27.03702163696289, "global_step": 544244, "epoch": 6557} {"train_loss": -27.282934188842773, "global_step": 544245, "epoch": 6557} {"train_loss": -26.955642700195312, "global_step": 544246, "epoch": 6557} {"train_loss": -27.467676162719727, "global_step": 544247, "epoch": 6557} {"train_loss": -27.329086303710938, "global_step": 544248, "epoch": 6557} {"train_loss": -27.245824813842773, "global_step": 544249, "epoch": 6557} {"train_loss": -27.293359756469727, "global_step": 544250, "epoch": 6557} {"train_loss": -27.37201499938965, "global_step": 544251, "epoch": 6557} {"train_loss": -27.309951782226562, "global_step": 544252, "epoch": 6557} {"train_loss": -27.693403244018555, "global_step": 544253, "epoch": 6557} {"train_loss": -27.743545532226562, "global_step": 544254, "epoch": 6557} {"train_loss": -27.569046020507812, "global_step": 544255, "epoch": 6557} {"train_loss": -27.289716720581055, "global_step": 544256, "epoch": 6557} {"train_loss": -27.314132690429688, "global_step": 544257, "epoch": 6557} {"train_loss": -27.3674373626709, "global_step": 544258, "epoch": 6557} {"train_loss": -27.52252769470215, "global_step": 544259, "epoch": 6557} {"train_loss": -27.62713623046875, "global_step": 544260, "epoch": 6557} {"train_loss": -27.652311325073242, "global_step": 544261, "epoch": 6557} {"train_loss": -27.640424728393555, "global_step": 544262, "epoch": 6557} {"train_loss": -27.791492462158203, "global_step": 544263, "epoch": 6557} {"train_loss": -27.871850967407227, "global_step": 544264, "epoch": 6557} {"train_loss": -27.68293571472168, "global_step": 544265, "epoch": 6557} {"train_loss": -27.913293838500977, "global_step": 544266, "epoch": 6557} {"train_loss": -27.4221134185791, "global_step": 544267, "epoch": 6557} {"train_loss": -28.084232330322266, "global_step": 544268, "epoch": 6557} {"train_loss": -27.555652618408203, "global_step": 544269, "epoch": 6557} {"train_loss": -27.58391761779785, "global_step": 544270, "epoch": 6557} {"train_loss": -27.816068649291992, "global_step": 544271, "epoch": 6557} {"train_loss": -27.675968170166016, "global_step": 544272, "epoch": 6557} {"train_loss": -27.99709129333496, "global_step": 544273, "epoch": 6557} {"train_loss": -27.55266761779785, "global_step": 544274, "epoch": 6557} {"train_loss": -27.974246978759766, "global_step": 544275, "epoch": 6557} {"train_loss": -28.106231689453125, "global_step": 544276, "epoch": 6557} {"train_loss": -28.022809982299805, "global_step": 544277, "epoch": 6557} {"train_loss": -27.94052505493164, "global_step": 544278, "epoch": 6557} {"train_loss": -27.587690353393555, "global_step": 544279, "epoch": 6557} {"train_loss": -28.051782608032227, "global_step": 544280, "epoch": 6557} {"train_loss": -27.86842918395996, "global_step": 544281, "epoch": 6557} {"train_loss": -27.991788864135742, "global_step": 544282, "epoch": 6557} {"train_loss": -28.08846092224121, "global_step": 544283, "epoch": 6557} {"train_loss": -27.80182456970215, "global_step": 544284, "epoch": 6557} {"train_loss": -28.077810287475586, "global_step": 544285, "epoch": 6557} {"train_loss": -27.809356689453125, "global_step": 544286, "epoch": 6557} {"train_loss": -27.789731979370117, "global_step": 544287, "epoch": 6557} {"train_loss": -28.25762367248535, "global_step": 544288, "epoch": 6557} {"train_loss": -28.342004776000977, "global_step": 544289, "epoch": 6557} {"train_loss": -27.90846061706543, "global_step": 544290, "epoch": 6557} {"train_loss": -27.854644775390625, "global_step": 544291, "epoch": 6557} {"train_loss": -27.8966121673584, "global_step": 544292, "epoch": 6557} {"train_loss": -28.121601104736328, "global_step": 544293, "epoch": 6557} {"train_loss": -27.723352432250977, "global_step": 544294, "epoch": 6557} {"train_loss": -28.00946617126465, "global_step": 544295, "epoch": 6557} {"train_loss": -27.705778121948242, "global_step": 544296, "epoch": 6557} {"train_loss": -28.110870361328125, "global_step": 544297, "epoch": 6557} {"train_loss": -27.693357467651367, "global_step": 544298, "epoch": 6557} {"train_loss": -27.890884399414062, "global_step": 544299, "epoch": 6557} {"train_loss": -28.126630783081055, "global_step": 544300, "epoch": 6557} {"train_loss": -28.11675453186035, "global_step": 544301, "epoch": 6557} {"train_loss": -27.722620010375977, "global_step": 544302, "epoch": 6557} {"train_loss": -27.857885360717773, "global_step": 544303, "epoch": 6557} {"train_loss": -27.289880752563477, "global_step": 544304, "epoch": 6557} {"train_loss": -27.306604385375977, "global_step": 544305, "epoch": 6557} {"train_loss": -26.704242706298828, "global_step": 544306, "epoch": 6557} {"train_loss": -25.744522094726562, "global_step": 544307, "epoch": 6557} {"train_loss": -25.31470489501953, "global_step": 544308, "epoch": 6557} {"train_loss": -26.9217529296875, "global_step": 544309, "epoch": 6557} {"train_loss": -26.9887638092041, "global_step": 544310, "epoch": 6557} {"train_loss": -26.27558708190918, "global_step": 544311, "epoch": 6557} {"train_loss": -27.429065704345703, "global_step": 544312, "epoch": 6557} {"train_loss": -27.500060598534272, "global_step": 544313, "epoch": 6557, "val_loss": 6607136.0} {"train_loss": -24.88945198059082, "global_step": 544314, "epoch": 6558} {"train_loss": -25.22673988342285, "global_step": 544315, "epoch": 6558} {"train_loss": -24.669797897338867, "global_step": 544316, "epoch": 6558} {"train_loss": -25.74310874938965, "global_step": 544317, "epoch": 6558} {"train_loss": -25.208765029907227, "global_step": 544318, "epoch": 6558} {"train_loss": -25.77174186706543, "global_step": 544319, "epoch": 6558} {"train_loss": -25.828643798828125, "global_step": 544320, "epoch": 6558} {"train_loss": -26.06019401550293, "global_step": 544321, "epoch": 6558} {"train_loss": -25.647756576538086, "global_step": 544322, "epoch": 6558} {"train_loss": -26.271591186523438, "global_step": 544323, "epoch": 6558} {"train_loss": -25.506296157836914, "global_step": 544324, "epoch": 6558} {"train_loss": -26.424488067626953, "global_step": 544325, "epoch": 6558} {"train_loss": -26.14584732055664, "global_step": 544326, "epoch": 6558} {"train_loss": -26.21224021911621, "global_step": 544327, "epoch": 6558} {"train_loss": -26.38880729675293, "global_step": 544328, "epoch": 6558} {"train_loss": -26.261754989624023, "global_step": 544329, "epoch": 6558} {"train_loss": -26.159265518188477, "global_step": 544330, "epoch": 6558} {"train_loss": -26.587677001953125, "global_step": 544331, "epoch": 6558} {"train_loss": -26.395898818969727, "global_step": 544332, "epoch": 6558} {"train_loss": -26.59543228149414, "global_step": 544333, "epoch": 6558} {"train_loss": -26.55059814453125, "global_step": 544334, "epoch": 6558} {"train_loss": -26.267423629760742, "global_step": 544335, "epoch": 6558} {"train_loss": -26.468656539916992, "global_step": 544336, "epoch": 6558} {"train_loss": -26.78213882446289, "global_step": 544337, "epoch": 6558} {"train_loss": -27.064558029174805, "global_step": 544338, "epoch": 6558} {"train_loss": -26.864398956298828, "global_step": 544339, "epoch": 6558} {"train_loss": -27.186298370361328, "global_step": 544340, "epoch": 6558} {"train_loss": -26.905517578125, "global_step": 544341, "epoch": 6558} {"train_loss": -27.088693618774414, "global_step": 544342, "epoch": 6558} {"train_loss": -27.141447067260742, "global_step": 544343, "epoch": 6558} {"train_loss": -26.788694381713867, "global_step": 544344, "epoch": 6558} {"train_loss": -27.2615909576416, "global_step": 544345, "epoch": 6558} {"train_loss": -26.79083824157715, "global_step": 544346, "epoch": 6558} {"train_loss": -27.195825576782227, "global_step": 544347, "epoch": 6558} {"train_loss": -27.18583106994629, "global_step": 544348, "epoch": 6558} {"train_loss": -27.132415771484375, "global_step": 544349, "epoch": 6558} {"train_loss": -27.026769638061523, "global_step": 544350, "epoch": 6558} {"train_loss": -27.383352279663086, "global_step": 544351, "epoch": 6558} {"train_loss": -27.506546020507812, "global_step": 544352, "epoch": 6558} {"train_loss": -27.44672966003418, "global_step": 544353, "epoch": 6558} {"train_loss": -27.8964900970459, "global_step": 544354, "epoch": 6558} {"train_loss": -27.495288848876953, "global_step": 544355, "epoch": 6558} {"train_loss": -27.56134033203125, "global_step": 544356, "epoch": 6558} {"train_loss": -27.6789493560791, "global_step": 544357, "epoch": 6558} {"train_loss": -27.674484252929688, "global_step": 544358, "epoch": 6558} {"train_loss": -27.635498046875, "global_step": 544359, "epoch": 6558} {"train_loss": -27.76949119567871, "global_step": 544360, "epoch": 6558} {"train_loss": -27.692432403564453, "global_step": 544361, "epoch": 6558} {"train_loss": -27.636249542236328, "global_step": 544362, "epoch": 6558} {"train_loss": -27.811813354492188, "global_step": 544363, "epoch": 6558} {"train_loss": -27.58577537536621, "global_step": 544364, "epoch": 6558} {"train_loss": -27.522953033447266, "global_step": 544365, "epoch": 6558} {"train_loss": -27.37128257751465, "global_step": 544366, "epoch": 6558} {"train_loss": -27.53972816467285, "global_step": 544367, "epoch": 6558} {"train_loss": -27.653579711914062, "global_step": 544368, "epoch": 6558} {"train_loss": -27.673547744750977, "global_step": 544369, "epoch": 6558} {"train_loss": -27.56951332092285, "global_step": 544370, "epoch": 6558} {"train_loss": -27.893695831298828, "global_step": 544371, "epoch": 6558} {"train_loss": -27.562658309936523, "global_step": 544372, "epoch": 6558} {"train_loss": -27.455795288085938, "global_step": 544373, "epoch": 6558} {"train_loss": -27.912214279174805, "global_step": 544374, "epoch": 6558} {"train_loss": -27.793073654174805, "global_step": 544375, "epoch": 6558} {"train_loss": -27.90984535217285, "global_step": 544376, "epoch": 6558} {"train_loss": -27.767837524414062, "global_step": 544377, "epoch": 6558} {"train_loss": -27.69391441345215, "global_step": 544378, "epoch": 6558} {"train_loss": -27.85980796813965, "global_step": 544379, "epoch": 6558} {"train_loss": -27.653085708618164, "global_step": 544380, "epoch": 6558} {"train_loss": -27.6028995513916, "global_step": 544381, "epoch": 6558} {"train_loss": -27.40992546081543, "global_step": 544382, "epoch": 6558} {"train_loss": -27.663965225219727, "global_step": 544383, "epoch": 6558} {"train_loss": -27.787755966186523, "global_step": 544384, "epoch": 6558} {"train_loss": -27.76197624206543, "global_step": 544385, "epoch": 6558} {"train_loss": -27.862638473510742, "global_step": 544386, "epoch": 6558} {"train_loss": -27.95381736755371, "global_step": 544387, "epoch": 6558} {"train_loss": -27.770709991455078, "global_step": 544388, "epoch": 6558} {"train_loss": -27.43179702758789, "global_step": 544389, "epoch": 6558} {"train_loss": -27.94380760192871, "global_step": 544390, "epoch": 6558} {"train_loss": -28.028121948242188, "global_step": 544391, "epoch": 6558} {"train_loss": -28.111892700195312, "global_step": 544392, "epoch": 6558} {"train_loss": -27.955503463745117, "global_step": 544393, "epoch": 6558} {"train_loss": -27.592498779296875, "global_step": 544394, "epoch": 6558} {"train_loss": -27.759565353393555, "global_step": 544395, "epoch": 6558} {"train_loss": -27.113527137112904, "global_step": 544396, "epoch": 6558, "val_loss": 6690506.0} {"train_loss": -26.489395141601562, "global_step": 544397, "epoch": 6559} {"train_loss": -27.197107315063477, "global_step": 544398, "epoch": 6559} {"train_loss": -27.148303985595703, "global_step": 544399, "epoch": 6559} {"train_loss": -27.016189575195312, "global_step": 544400, "epoch": 6559} {"train_loss": -26.254987716674805, "global_step": 544401, "epoch": 6559} {"train_loss": -27.311986923217773, "global_step": 544402, "epoch": 6559} {"train_loss": -26.79071617126465, "global_step": 544403, "epoch": 6559} {"train_loss": -27.40570640563965, "global_step": 544404, "epoch": 6559} {"train_loss": -26.974231719970703, "global_step": 544405, "epoch": 6559} {"train_loss": -26.92364501953125, "global_step": 544406, "epoch": 6559} {"train_loss": -27.185678482055664, "global_step": 544407, "epoch": 6559} {"train_loss": -27.398523330688477, "global_step": 544408, "epoch": 6559} {"train_loss": -27.064672470092773, "global_step": 544409, "epoch": 6559} {"train_loss": -26.694732666015625, "global_step": 544410, "epoch": 6559} {"train_loss": -27.260589599609375, "global_step": 544411, "epoch": 6559} {"train_loss": -27.501346588134766, "global_step": 544412, "epoch": 6559} {"train_loss": -26.86561393737793, "global_step": 544413, "epoch": 6559} {"train_loss": -26.91904067993164, "global_step": 544414, "epoch": 6559} {"train_loss": -27.512540817260742, "global_step": 544415, "epoch": 6559} {"train_loss": -27.052473068237305, "global_step": 544416, "epoch": 6559} {"train_loss": -27.41510009765625, "global_step": 544417, "epoch": 6559} {"train_loss": -27.5329647064209, "global_step": 544418, "epoch": 6559} {"train_loss": -27.655242919921875, "global_step": 544419, "epoch": 6559} {"train_loss": -27.50676918029785, "global_step": 544420, "epoch": 6559} {"train_loss": -27.585851669311523, "global_step": 544421, "epoch": 6559} {"train_loss": -27.471277236938477, "global_step": 544422, "epoch": 6559} {"train_loss": -27.65926170349121, "global_step": 544423, "epoch": 6559} {"train_loss": -27.170333862304688, "global_step": 544424, "epoch": 6559} {"train_loss": -27.751956939697266, "global_step": 544425, "epoch": 6559} {"train_loss": -27.443429946899414, "global_step": 544426, "epoch": 6559} {"train_loss": -27.452707290649414, "global_step": 544427, "epoch": 6559} {"train_loss": -27.49908447265625, "global_step": 544428, "epoch": 6559} {"train_loss": -27.469945907592773, "global_step": 544429, "epoch": 6559} {"train_loss": -27.79719352722168, "global_step": 544430, "epoch": 6559} {"train_loss": -27.392642974853516, "global_step": 544431, "epoch": 6559} {"train_loss": -27.831384658813477, "global_step": 544432, "epoch": 6559} {"train_loss": -27.559528350830078, "global_step": 544433, "epoch": 6559} {"train_loss": -27.75245475769043, "global_step": 544434, "epoch": 6559} {"train_loss": -27.667997360229492, "global_step": 544435, "epoch": 6559} {"train_loss": -27.530654907226562, "global_step": 544436, "epoch": 6559} {"train_loss": -27.660131454467773, "global_step": 544437, "epoch": 6559} {"train_loss": -27.847829818725586, "global_step": 544438, "epoch": 6559} {"train_loss": -27.498126983642578, "global_step": 544439, "epoch": 6559} {"train_loss": -27.851184844970703, "global_step": 544440, "epoch": 6559} {"train_loss": -27.43524742126465, "global_step": 544441, "epoch": 6559} {"train_loss": -27.54438591003418, "global_step": 544442, "epoch": 6559} {"train_loss": -27.96595573425293, "global_step": 544443, "epoch": 6559} {"train_loss": -27.330480575561523, "global_step": 544444, "epoch": 6559} {"train_loss": -28.017898559570312, "global_step": 544445, "epoch": 6559} {"train_loss": -27.922555923461914, "global_step": 544446, "epoch": 6559} {"train_loss": -27.93820571899414, "global_step": 544447, "epoch": 6559} {"train_loss": -27.897436141967773, "global_step": 544448, "epoch": 6559} {"train_loss": -27.857946395874023, "global_step": 544449, "epoch": 6559} {"train_loss": -27.7973690032959, "global_step": 544450, "epoch": 6559} {"train_loss": -27.645944595336914, "global_step": 544451, "epoch": 6559} {"train_loss": -27.800601959228516, "global_step": 544452, "epoch": 6559} {"train_loss": -27.913105010986328, "global_step": 544453, "epoch": 6559} {"train_loss": -28.095001220703125, "global_step": 544454, "epoch": 6559} {"train_loss": -27.739261627197266, "global_step": 544455, "epoch": 6559} {"train_loss": -27.753305435180664, "global_step": 544456, "epoch": 6559} {"train_loss": -27.45697021484375, "global_step": 544457, "epoch": 6559} {"train_loss": -27.7777042388916, "global_step": 544458, "epoch": 6559} {"train_loss": -28.188159942626953, "global_step": 544459, "epoch": 6559} {"train_loss": -27.909292221069336, "global_step": 544460, "epoch": 6559} {"train_loss": -27.764923095703125, "global_step": 544461, "epoch": 6559} {"train_loss": -27.792844772338867, "global_step": 544462, "epoch": 6559} {"train_loss": -27.758466720581055, "global_step": 544463, "epoch": 6559} {"train_loss": -27.959081649780273, "global_step": 544464, "epoch": 6559} {"train_loss": -27.979684829711914, "global_step": 544465, "epoch": 6559} {"train_loss": -27.798337936401367, "global_step": 544466, "epoch": 6559} {"train_loss": -28.139209747314453, "global_step": 544467, "epoch": 6559} {"train_loss": -27.851255416870117, "global_step": 544468, "epoch": 6559} {"train_loss": -27.924579620361328, "global_step": 544469, "epoch": 6559} {"train_loss": -28.02729606628418, "global_step": 544470, "epoch": 6559} {"train_loss": -27.76386070251465, "global_step": 544471, "epoch": 6559} {"train_loss": -27.958356857299805, "global_step": 544472, "epoch": 6559} {"train_loss": -27.861743927001953, "global_step": 544473, "epoch": 6559} {"train_loss": -28.04725456237793, "global_step": 544474, "epoch": 6559} {"train_loss": -28.075586318969727, "global_step": 544475, "epoch": 6559} {"train_loss": -27.996662139892578, "global_step": 544476, "epoch": 6559} {"train_loss": -27.979833602905273, "global_step": 544477, "epoch": 6559} {"train_loss": -27.46027183532715, "global_step": 544478, "epoch": 6559} {"train_loss": -27.570558226252178, "global_step": 544479, "epoch": 6559, "val_loss": 6500300.0} {"train_loss": -27.308734893798828, "global_step": 544480, "epoch": 6560} {"train_loss": -26.801319122314453, "global_step": 544481, "epoch": 6560} {"train_loss": -26.358489990234375, "global_step": 544482, "epoch": 6560} {"train_loss": -26.422407150268555, "global_step": 544483, "epoch": 6560} {"train_loss": -26.038583755493164, "global_step": 544484, "epoch": 6560} {"train_loss": -26.4205265045166, "global_step": 544485, "epoch": 6560} {"train_loss": -26.76032829284668, "global_step": 544486, "epoch": 6560} {"train_loss": -27.129133224487305, "global_step": 544487, "epoch": 6560} {"train_loss": -26.78689956665039, "global_step": 544488, "epoch": 6560} {"train_loss": -26.864133834838867, "global_step": 544489, "epoch": 6560} {"train_loss": -27.159748077392578, "global_step": 544490, "epoch": 6560} {"train_loss": -26.989490509033203, "global_step": 544491, "epoch": 6560} {"train_loss": -27.164731979370117, "global_step": 544492, "epoch": 6560} {"train_loss": -27.272602081298828, "global_step": 544493, "epoch": 6560} {"train_loss": -27.350385665893555, "global_step": 544494, "epoch": 6560} {"train_loss": -27.457229614257812, "global_step": 544495, "epoch": 6560} {"train_loss": -27.263111114501953, "global_step": 544496, "epoch": 6560} {"train_loss": -27.30803871154785, "global_step": 544497, "epoch": 6560} {"train_loss": -27.33738136291504, "global_step": 544498, "epoch": 6560} {"train_loss": -27.348173141479492, "global_step": 544499, "epoch": 6560} {"train_loss": -27.467945098876953, "global_step": 544500, "epoch": 6560} {"train_loss": -27.561864852905273, "global_step": 544501, "epoch": 6560} {"train_loss": -27.340534210205078, "global_step": 544502, "epoch": 6560} {"train_loss": -27.529693603515625, "global_step": 544503, "epoch": 6560} {"train_loss": -27.417585372924805, "global_step": 544504, "epoch": 6560} {"train_loss": -27.223743438720703, "global_step": 544505, "epoch": 6560} {"train_loss": -27.11627769470215, "global_step": 544506, "epoch": 6560} {"train_loss": -27.520893096923828, "global_step": 544507, "epoch": 6560} {"train_loss": -27.055408477783203, "global_step": 544508, "epoch": 6560} {"train_loss": -27.63327980041504, "global_step": 544509, "epoch": 6560} {"train_loss": -27.55417823791504, "global_step": 544510, "epoch": 6560} {"train_loss": -27.754730224609375, "global_step": 544511, "epoch": 6560} {"train_loss": -27.46198844909668, "global_step": 544512, "epoch": 6560} {"train_loss": -27.45954704284668, "global_step": 544513, "epoch": 6560} {"train_loss": -27.470495223999023, "global_step": 544514, "epoch": 6560} {"train_loss": -27.535980224609375, "global_step": 544515, "epoch": 6560} {"train_loss": -27.3757266998291, "global_step": 544516, "epoch": 6560} {"train_loss": -27.685260772705078, "global_step": 544517, "epoch": 6560} {"train_loss": -27.7198429107666, "global_step": 544518, "epoch": 6560} {"train_loss": -27.457275390625, "global_step": 544519, "epoch": 6560} {"train_loss": -27.748249053955078, "global_step": 544520, "epoch": 6560} {"train_loss": -27.9433536529541, "global_step": 544521, "epoch": 6560} {"train_loss": -27.69292640686035, "global_step": 544522, "epoch": 6560} {"train_loss": -27.44380760192871, "global_step": 544523, "epoch": 6560} {"train_loss": -27.623029708862305, "global_step": 544524, "epoch": 6560} {"train_loss": -27.62762451171875, "global_step": 544525, "epoch": 6560} {"train_loss": -28.021747589111328, "global_step": 544526, "epoch": 6560} {"train_loss": -27.9769344329834, "global_step": 544527, "epoch": 6560} {"train_loss": -28.062366485595703, "global_step": 544528, "epoch": 6560} {"train_loss": -27.784574508666992, "global_step": 544529, "epoch": 6560} {"train_loss": -27.653003692626953, "global_step": 544530, "epoch": 6560} {"train_loss": -27.676477432250977, "global_step": 544531, "epoch": 6560} {"train_loss": -27.63791847229004, "global_step": 544532, "epoch": 6560} {"train_loss": -27.93171501159668, "global_step": 544533, "epoch": 6560} {"train_loss": -27.78080177307129, "global_step": 544534, "epoch": 6560} {"train_loss": -27.56964683532715, "global_step": 544535, "epoch": 6560} {"train_loss": -28.158004760742188, "global_step": 544536, "epoch": 6560} {"train_loss": -27.347509384155273, "global_step": 544537, "epoch": 6560} {"train_loss": -27.785608291625977, "global_step": 544538, "epoch": 6560} {"train_loss": -27.052005767822266, "global_step": 544539, "epoch": 6560} {"train_loss": -25.946704864501953, "global_step": 544540, "epoch": 6560} {"train_loss": -24.05485725402832, "global_step": 544541, "epoch": 6560} {"train_loss": -25.586986541748047, "global_step": 544542, "epoch": 6560} {"train_loss": -26.964466094970703, "global_step": 544543, "epoch": 6560} {"train_loss": -25.70859146118164, "global_step": 544544, "epoch": 6560} {"train_loss": -27.401870727539062, "global_step": 544545, "epoch": 6560} {"train_loss": -26.20395851135254, "global_step": 544546, "epoch": 6560} {"train_loss": -27.663965225219727, "global_step": 544547, "epoch": 6560} {"train_loss": -26.896448135375977, "global_step": 544548, "epoch": 6560} {"train_loss": -26.73952293395996, "global_step": 544549, "epoch": 6560} {"train_loss": -27.329010009765625, "global_step": 544550, "epoch": 6560} {"train_loss": -27.208938598632812, "global_step": 544551, "epoch": 6560} {"train_loss": -27.3664493560791, "global_step": 544552, "epoch": 6560} {"train_loss": -27.494842529296875, "global_step": 544553, "epoch": 6560} {"train_loss": -27.6590633392334, "global_step": 544554, "epoch": 6560} {"train_loss": -27.366064071655273, "global_step": 544555, "epoch": 6560} {"train_loss": -27.32573890686035, "global_step": 544556, "epoch": 6560} {"train_loss": -27.671377182006836, "global_step": 544557, "epoch": 6560} {"train_loss": -27.605066299438477, "global_step": 544558, "epoch": 6560} {"train_loss": -27.28486442565918, "global_step": 544559, "epoch": 6560} {"train_loss": -27.19069480895996, "global_step": 544560, "epoch": 6560} {"train_loss": -27.295637130737305, "global_step": 544561, "epoch": 6560} {"train_loss": -27.25190693499094, "global_step": 544562, "epoch": 6560, "val_loss": 6546712.0} {"train_loss": -26.769498825073242, "global_step": 544563, "epoch": 6561} {"train_loss": -26.77703857421875, "global_step": 544564, "epoch": 6561} {"train_loss": -27.408533096313477, "global_step": 544565, "epoch": 6561} {"train_loss": -26.164701461791992, "global_step": 544566, "epoch": 6561} {"train_loss": -25.925434112548828, "global_step": 544567, "epoch": 6561} {"train_loss": -25.824600219726562, "global_step": 544568, "epoch": 6561} {"train_loss": -26.8094482421875, "global_step": 544569, "epoch": 6561} {"train_loss": -26.771636962890625, "global_step": 544570, "epoch": 6561} {"train_loss": -26.569665908813477, "global_step": 544571, "epoch": 6561} {"train_loss": -27.029077529907227, "global_step": 544572, "epoch": 6561} {"train_loss": -26.947662353515625, "global_step": 544573, "epoch": 6561} {"train_loss": -27.222858428955078, "global_step": 544574, "epoch": 6561} {"train_loss": -27.242816925048828, "global_step": 544575, "epoch": 6561} {"train_loss": -26.9348087310791, "global_step": 544576, "epoch": 6561} {"train_loss": -27.16586685180664, "global_step": 544577, "epoch": 6561} {"train_loss": -27.147470474243164, "global_step": 544578, "epoch": 6561} {"train_loss": -27.266565322875977, "global_step": 544579, "epoch": 6561} {"train_loss": -27.368946075439453, "global_step": 544580, "epoch": 6561} {"train_loss": -27.1683406829834, "global_step": 544581, "epoch": 6561} {"train_loss": -27.473804473876953, "global_step": 544582, "epoch": 6561} {"train_loss": -26.911481857299805, "global_step": 544583, "epoch": 6561} {"train_loss": -27.590747833251953, "global_step": 544584, "epoch": 6561} {"train_loss": -27.53696632385254, "global_step": 544585, "epoch": 6561} {"train_loss": -26.806549072265625, "global_step": 544586, "epoch": 6561} {"train_loss": -27.459348678588867, "global_step": 544587, "epoch": 6561} {"train_loss": -27.07588768005371, "global_step": 544588, "epoch": 6561} {"train_loss": -27.504764556884766, "global_step": 544589, "epoch": 6561} {"train_loss": -27.504154205322266, "global_step": 544590, "epoch": 6561} {"train_loss": -27.438562393188477, "global_step": 544591, "epoch": 6561} {"train_loss": -28.017683029174805, "global_step": 544592, "epoch": 6561} {"train_loss": -27.43544578552246, "global_step": 544593, "epoch": 6561} {"train_loss": -27.6776123046875, "global_step": 544594, "epoch": 6561} {"train_loss": -27.349271774291992, "global_step": 544595, "epoch": 6561} {"train_loss": -27.445587158203125, "global_step": 544596, "epoch": 6561} {"train_loss": -27.493087768554688, "global_step": 544597, "epoch": 6561} {"train_loss": -27.608718872070312, "global_step": 544598, "epoch": 6561} {"train_loss": -27.829898834228516, "global_step": 544599, "epoch": 6561} {"train_loss": -27.372262954711914, "global_step": 544600, "epoch": 6561} {"train_loss": -27.885391235351562, "global_step": 544601, "epoch": 6561} {"train_loss": -27.574689865112305, "global_step": 544602, "epoch": 6561} {"train_loss": -27.67447853088379, "global_step": 544603, "epoch": 6561} {"train_loss": -27.51508140563965, "global_step": 544604, "epoch": 6561} {"train_loss": -28.133655548095703, "global_step": 544605, "epoch": 6561} {"train_loss": -27.836612701416016, "global_step": 544606, "epoch": 6561} {"train_loss": -27.864850997924805, "global_step": 544607, "epoch": 6561} {"train_loss": -27.86213493347168, "global_step": 544608, "epoch": 6561} {"train_loss": -27.557315826416016, "global_step": 544609, "epoch": 6561} {"train_loss": -27.762109756469727, "global_step": 544610, "epoch": 6561} {"train_loss": -27.93561363220215, "global_step": 544611, "epoch": 6561} {"train_loss": -27.58246421813965, "global_step": 544612, "epoch": 6561} {"train_loss": -28.0218505859375, "global_step": 544613, "epoch": 6561} {"train_loss": -27.887638092041016, "global_step": 544614, "epoch": 6561} {"train_loss": -27.63840103149414, "global_step": 544615, "epoch": 6561} {"train_loss": -27.668203353881836, "global_step": 544616, "epoch": 6561} {"train_loss": -27.55368995666504, "global_step": 544617, "epoch": 6561} {"train_loss": -27.238962173461914, "global_step": 544618, "epoch": 6561} {"train_loss": -27.25459861755371, "global_step": 544619, "epoch": 6561} {"train_loss": -27.029462814331055, "global_step": 544620, "epoch": 6561} {"train_loss": -26.53891372680664, "global_step": 544621, "epoch": 6561} {"train_loss": -26.521183013916016, "global_step": 544622, "epoch": 6561} {"train_loss": -27.4555721282959, "global_step": 544623, "epoch": 6561} {"train_loss": -27.55653190612793, "global_step": 544624, "epoch": 6561} {"train_loss": -26.91301918029785, "global_step": 544625, "epoch": 6561} {"train_loss": -26.773059844970703, "global_step": 544626, "epoch": 6561} {"train_loss": -27.14727210998535, "global_step": 544627, "epoch": 6561} {"train_loss": -26.352842330932617, "global_step": 544628, "epoch": 6561} {"train_loss": -26.801776885986328, "global_step": 544629, "epoch": 6561} {"train_loss": -27.172657012939453, "global_step": 544630, "epoch": 6561} {"train_loss": -27.157703399658203, "global_step": 544631, "epoch": 6561} {"train_loss": -26.814605712890625, "global_step": 544632, "epoch": 6561} {"train_loss": -27.127853393554688, "global_step": 544633, "epoch": 6561} {"train_loss": -26.85235023498535, "global_step": 544634, "epoch": 6561} {"train_loss": -27.07501220703125, "global_step": 544635, "epoch": 6561} {"train_loss": -27.159900665283203, "global_step": 544636, "epoch": 6561} {"train_loss": -27.421436309814453, "global_step": 544637, "epoch": 6561} {"train_loss": -26.835830688476562, "global_step": 544638, "epoch": 6561} {"train_loss": -27.120283126831055, "global_step": 544639, "epoch": 6561} {"train_loss": -27.12481689453125, "global_step": 544640, "epoch": 6561} {"train_loss": -27.39617919921875, "global_step": 544641, "epoch": 6561} {"train_loss": -27.196186065673828, "global_step": 544642, "epoch": 6561} {"train_loss": -27.57583999633789, "global_step": 544643, "epoch": 6561} {"train_loss": -27.580291748046875, "global_step": 544644, "epoch": 6561} {"train_loss": -27.251506138996906, "global_step": 544645, "epoch": 6561, "val_loss": 6539353.5} {"train_loss": -25.591890335083008, "global_step": 544646, "epoch": 6562} {"train_loss": -24.561201095581055, "global_step": 544647, "epoch": 6562} {"train_loss": -24.719669342041016, "global_step": 544648, "epoch": 6562} {"train_loss": -24.71415138244629, "global_step": 544649, "epoch": 6562} {"train_loss": -25.082340240478516, "global_step": 544650, "epoch": 6562} {"train_loss": -26.259817123413086, "global_step": 544651, "epoch": 6562} {"train_loss": -26.43269157409668, "global_step": 544652, "epoch": 6562} {"train_loss": -26.754932403564453, "global_step": 544653, "epoch": 6562} {"train_loss": -26.869342803955078, "global_step": 544654, "epoch": 6562} {"train_loss": -26.425373077392578, "global_step": 544655, "epoch": 6562} {"train_loss": -26.506696701049805, "global_step": 544656, "epoch": 6562} {"train_loss": -26.372968673706055, "global_step": 544657, "epoch": 6562} {"train_loss": -26.238666534423828, "global_step": 544658, "epoch": 6562} {"train_loss": -26.8382511138916, "global_step": 544659, "epoch": 6562} {"train_loss": -26.44840431213379, "global_step": 544660, "epoch": 6562} {"train_loss": -26.81647300720215, "global_step": 544661, "epoch": 6562} {"train_loss": -26.79903221130371, "global_step": 544662, "epoch": 6562} {"train_loss": -27.251056671142578, "global_step": 544663, "epoch": 6562} {"train_loss": -26.9537353515625, "global_step": 544664, "epoch": 6562} {"train_loss": -26.897125244140625, "global_step": 544665, "epoch": 6562} {"train_loss": -27.131925582885742, "global_step": 544666, "epoch": 6562} {"train_loss": -27.53626823425293, "global_step": 544667, "epoch": 6562} {"train_loss": -27.0280704498291, "global_step": 544668, "epoch": 6562} {"train_loss": -26.954687118530273, "global_step": 544669, "epoch": 6562} {"train_loss": -27.354904174804688, "global_step": 544670, "epoch": 6562} {"train_loss": -26.581405639648438, "global_step": 544671, "epoch": 6562} {"train_loss": -27.21820640563965, "global_step": 544672, "epoch": 6562} {"train_loss": -27.52128028869629, "global_step": 544673, "epoch": 6562} {"train_loss": -27.302419662475586, "global_step": 544674, "epoch": 6562} {"train_loss": -27.24384117126465, "global_step": 544675, "epoch": 6562} {"train_loss": -27.353164672851562, "global_step": 544676, "epoch": 6562} {"train_loss": -27.2821044921875, "global_step": 544677, "epoch": 6562} {"train_loss": -27.428970336914062, "global_step": 544678, "epoch": 6562} {"train_loss": -27.5908260345459, "global_step": 544679, "epoch": 6562} {"train_loss": -27.471298217773438, "global_step": 544680, "epoch": 6562} {"train_loss": -26.986433029174805, "global_step": 544681, "epoch": 6562} {"train_loss": -27.401321411132812, "global_step": 544682, "epoch": 6562} {"train_loss": -27.5122127532959, "global_step": 544683, "epoch": 6562} {"train_loss": -27.06196403503418, "global_step": 544684, "epoch": 6562} {"train_loss": -27.540176391601562, "global_step": 544685, "epoch": 6562} {"train_loss": -27.345144271850586, "global_step": 544686, "epoch": 6562} {"train_loss": -27.517566680908203, "global_step": 544687, "epoch": 6562} {"train_loss": -27.552358627319336, "global_step": 544688, "epoch": 6562} {"train_loss": -27.14935874938965, "global_step": 544689, "epoch": 6562} {"train_loss": -27.5831356048584, "global_step": 544690, "epoch": 6562} {"train_loss": -27.7972469329834, "global_step": 544691, "epoch": 6562} {"train_loss": -27.631397247314453, "global_step": 544692, "epoch": 6562} {"train_loss": -27.919458389282227, "global_step": 544693, "epoch": 6562} {"train_loss": -27.6663818359375, "global_step": 544694, "epoch": 6562} {"train_loss": -27.605682373046875, "global_step": 544695, "epoch": 6562} {"train_loss": -27.86885643005371, "global_step": 544696, "epoch": 6562} {"train_loss": -27.406766891479492, "global_step": 544697, "epoch": 6562} {"train_loss": -27.79860496520996, "global_step": 544698, "epoch": 6562} {"train_loss": -27.572843551635742, "global_step": 544699, "epoch": 6562} {"train_loss": -27.3815975189209, "global_step": 544700, "epoch": 6562} {"train_loss": -27.896717071533203, "global_step": 544701, "epoch": 6562} {"train_loss": -27.34075927734375, "global_step": 544702, "epoch": 6562} {"train_loss": -27.769378662109375, "global_step": 544703, "epoch": 6562} {"train_loss": -28.01797866821289, "global_step": 544704, "epoch": 6562} {"train_loss": -27.81268882751465, "global_step": 544705, "epoch": 6562} {"train_loss": -27.840246200561523, "global_step": 544706, "epoch": 6562} {"train_loss": -27.8304386138916, "global_step": 544707, "epoch": 6562} {"train_loss": -27.662094116210938, "global_step": 544708, "epoch": 6562} {"train_loss": -27.53021812438965, "global_step": 544709, "epoch": 6562} {"train_loss": -27.82634925842285, "global_step": 544710, "epoch": 6562} {"train_loss": -27.72784423828125, "global_step": 544711, "epoch": 6562} {"train_loss": -27.81219482421875, "global_step": 544712, "epoch": 6562} {"train_loss": -27.54802894592285, "global_step": 544713, "epoch": 6562} {"train_loss": -27.581090927124023, "global_step": 544714, "epoch": 6562} {"train_loss": -27.924795150756836, "global_step": 544715, "epoch": 6562} {"train_loss": -27.74799156188965, "global_step": 544716, "epoch": 6562} {"train_loss": -27.330707550048828, "global_step": 544717, "epoch": 6562} {"train_loss": -27.354639053344727, "global_step": 544718, "epoch": 6562} {"train_loss": -27.489370346069336, "global_step": 544719, "epoch": 6562} {"train_loss": -27.96119499206543, "global_step": 544720, "epoch": 6562} {"train_loss": -27.692829132080078, "global_step": 544721, "epoch": 6562} {"train_loss": -27.7766056060791, "global_step": 544722, "epoch": 6562} {"train_loss": -27.43402099609375, "global_step": 544723, "epoch": 6562} {"train_loss": -27.73563003540039, "global_step": 544724, "epoch": 6562} {"train_loss": -27.520116806030273, "global_step": 544725, "epoch": 6562} {"train_loss": -27.594253540039062, "global_step": 544726, "epoch": 6562} {"train_loss": -27.83047866821289, "global_step": 544727, "epoch": 6562} {"train_loss": -27.218175681240588, "global_step": 544728, "epoch": 6562, "val_loss": 6575868.5} {"train_loss": -27.207813262939453, "global_step": 544729, "epoch": 6563} {"train_loss": -27.26161766052246, "global_step": 544730, "epoch": 6563} {"train_loss": -27.143598556518555, "global_step": 544731, "epoch": 6563} {"train_loss": -26.376163482666016, "global_step": 544732, "epoch": 6563} {"train_loss": -26.060693740844727, "global_step": 544733, "epoch": 6563} {"train_loss": -26.371007919311523, "global_step": 544734, "epoch": 6563} {"train_loss": -26.449310302734375, "global_step": 544735, "epoch": 6563} {"train_loss": -26.54090690612793, "global_step": 544736, "epoch": 6563} {"train_loss": -26.517309188842773, "global_step": 544737, "epoch": 6563} {"train_loss": -26.66997718811035, "global_step": 544738, "epoch": 6563} {"train_loss": -27.19062614440918, "global_step": 544739, "epoch": 6563} {"train_loss": -27.243946075439453, "global_step": 544740, "epoch": 6563} {"train_loss": -26.976552963256836, "global_step": 544741, "epoch": 6563} {"train_loss": -26.9488468170166, "global_step": 544742, "epoch": 6563} {"train_loss": -27.117292404174805, "global_step": 544743, "epoch": 6563} {"train_loss": -27.23346519470215, "global_step": 544744, "epoch": 6563} {"train_loss": -27.063169479370117, "global_step": 544745, "epoch": 6563} {"train_loss": -27.114465713500977, "global_step": 544746, "epoch": 6563} {"train_loss": -27.091100692749023, "global_step": 544747, "epoch": 6563} {"train_loss": -27.1068058013916, "global_step": 544748, "epoch": 6563} {"train_loss": -27.178998947143555, "global_step": 544749, "epoch": 6563} {"train_loss": -27.369129180908203, "global_step": 544750, "epoch": 6563} {"train_loss": -27.39729118347168, "global_step": 544751, "epoch": 6563} {"train_loss": -27.264753341674805, "global_step": 544752, "epoch": 6563} {"train_loss": -27.525970458984375, "global_step": 544753, "epoch": 6563} {"train_loss": -27.693044662475586, "global_step": 544754, "epoch": 6563} {"train_loss": -27.348905563354492, "global_step": 544755, "epoch": 6563} {"train_loss": -27.831790924072266, "global_step": 544756, "epoch": 6563} {"train_loss": -27.657209396362305, "global_step": 544757, "epoch": 6563} {"train_loss": -27.564191818237305, "global_step": 544758, "epoch": 6563} {"train_loss": -27.396747589111328, "global_step": 544759, "epoch": 6563} {"train_loss": -27.595666885375977, "global_step": 544760, "epoch": 6563} {"train_loss": -27.626073837280273, "global_step": 544761, "epoch": 6563} {"train_loss": -28.2048282623291, "global_step": 544762, "epoch": 6563} {"train_loss": -27.507049560546875, "global_step": 544763, "epoch": 6563} {"train_loss": -27.613916397094727, "global_step": 544764, "epoch": 6563} {"train_loss": -27.636627197265625, "global_step": 544765, "epoch": 6563} {"train_loss": -27.789030075073242, "global_step": 544766, "epoch": 6563} {"train_loss": -27.8890380859375, "global_step": 544767, "epoch": 6563} {"train_loss": -27.581647872924805, "global_step": 544768, "epoch": 6563} {"train_loss": -27.67254638671875, "global_step": 544769, "epoch": 6563} {"train_loss": -27.8936710357666, "global_step": 544770, "epoch": 6563} {"train_loss": -27.596837997436523, "global_step": 544771, "epoch": 6563} {"train_loss": -27.81452751159668, "global_step": 544772, "epoch": 6563} {"train_loss": -27.52488136291504, "global_step": 544773, "epoch": 6563} {"train_loss": -27.6501522064209, "global_step": 544774, "epoch": 6563} {"train_loss": -27.862613677978516, "global_step": 544775, "epoch": 6563} {"train_loss": -27.82831382751465, "global_step": 544776, "epoch": 6563} {"train_loss": -28.0416202545166, "global_step": 544777, "epoch": 6563} {"train_loss": -27.851511001586914, "global_step": 544778, "epoch": 6563} {"train_loss": -28.0869083404541, "global_step": 544779, "epoch": 6563} {"train_loss": -27.937314987182617, "global_step": 544780, "epoch": 6563} {"train_loss": -27.940954208374023, "global_step": 544781, "epoch": 6563} {"train_loss": -27.898305892944336, "global_step": 544782, "epoch": 6563} {"train_loss": -28.32568359375, "global_step": 544783, "epoch": 6563} {"train_loss": -27.783178329467773, "global_step": 544784, "epoch": 6563} {"train_loss": -27.488433837890625, "global_step": 544785, "epoch": 6563} {"train_loss": -27.78742027282715, "global_step": 544786, "epoch": 6563} {"train_loss": -27.66871452331543, "global_step": 544787, "epoch": 6563} {"train_loss": -27.510923385620117, "global_step": 544788, "epoch": 6563} {"train_loss": -27.181684494018555, "global_step": 544789, "epoch": 6563} {"train_loss": -26.777149200439453, "global_step": 544790, "epoch": 6563} {"train_loss": -27.58711051940918, "global_step": 544791, "epoch": 6563} {"train_loss": -27.781896591186523, "global_step": 544792, "epoch": 6563} {"train_loss": -27.261383056640625, "global_step": 544793, "epoch": 6563} {"train_loss": -27.52387809753418, "global_step": 544794, "epoch": 6563} {"train_loss": -27.166522979736328, "global_step": 544795, "epoch": 6563} {"train_loss": -27.27475929260254, "global_step": 544796, "epoch": 6563} {"train_loss": -27.594013214111328, "global_step": 544797, "epoch": 6563} {"train_loss": -27.27545738220215, "global_step": 544798, "epoch": 6563} {"train_loss": -26.902090072631836, "global_step": 544799, "epoch": 6563} {"train_loss": -26.97743797302246, "global_step": 544800, "epoch": 6563} {"train_loss": -26.876699447631836, "global_step": 544801, "epoch": 6563} {"train_loss": -27.4101505279541, "global_step": 544802, "epoch": 6563} {"train_loss": -27.925413131713867, "global_step": 544803, "epoch": 6563} {"train_loss": -27.532596588134766, "global_step": 544804, "epoch": 6563} {"train_loss": -27.040283203125, "global_step": 544805, "epoch": 6563} {"train_loss": -27.5657901763916, "global_step": 544806, "epoch": 6563} {"train_loss": -27.419269561767578, "global_step": 544807, "epoch": 6563} {"train_loss": -27.448881149291992, "global_step": 544808, "epoch": 6563} {"train_loss": -27.675724029541016, "global_step": 544809, "epoch": 6563} {"train_loss": -27.724201202392578, "global_step": 544810, "epoch": 6563} {"train_loss": -27.409485391823644, "global_step": 544811, "epoch": 6563, "val_loss": 6588331.0} {"train_loss": -26.666961669921875, "global_step": 544812, "epoch": 6564} {"train_loss": -26.124601364135742, "global_step": 544813, "epoch": 6564} {"train_loss": -26.792566299438477, "global_step": 544814, "epoch": 6564} {"train_loss": -26.35956382751465, "global_step": 544815, "epoch": 6564} {"train_loss": -26.827606201171875, "global_step": 544816, "epoch": 6564} {"train_loss": -26.44133949279785, "global_step": 544817, "epoch": 6564} {"train_loss": -26.980239868164062, "global_step": 544818, "epoch": 6564} {"train_loss": -27.043298721313477, "global_step": 544819, "epoch": 6564} {"train_loss": -27.254186630249023, "global_step": 544820, "epoch": 6564} {"train_loss": -27.074365615844727, "global_step": 544821, "epoch": 6564} {"train_loss": -27.075353622436523, "global_step": 544822, "epoch": 6564} {"train_loss": -27.1157283782959, "global_step": 544823, "epoch": 6564} {"train_loss": -26.954010009765625, "global_step": 544824, "epoch": 6564} {"train_loss": -27.064529418945312, "global_step": 544825, "epoch": 6564} {"train_loss": -27.210058212280273, "global_step": 544826, "epoch": 6564} {"train_loss": -27.348947525024414, "global_step": 544827, "epoch": 6564} {"train_loss": -27.605356216430664, "global_step": 544828, "epoch": 6564} {"train_loss": -27.19956398010254, "global_step": 544829, "epoch": 6564} {"train_loss": -27.534292221069336, "global_step": 544830, "epoch": 6564} {"train_loss": -27.266260147094727, "global_step": 544831, "epoch": 6564} {"train_loss": -27.402637481689453, "global_step": 544832, "epoch": 6564} {"train_loss": -27.298810958862305, "global_step": 544833, "epoch": 6564} {"train_loss": -27.528730392456055, "global_step": 544834, "epoch": 6564} {"train_loss": -27.303150177001953, "global_step": 544835, "epoch": 6564} {"train_loss": -27.590057373046875, "global_step": 544836, "epoch": 6564} {"train_loss": -27.57854652404785, "global_step": 544837, "epoch": 6564} {"train_loss": -27.30917739868164, "global_step": 544838, "epoch": 6564} {"train_loss": -27.571741104125977, "global_step": 544839, "epoch": 6564} {"train_loss": -27.551965713500977, "global_step": 544840, "epoch": 6564} {"train_loss": -27.505386352539062, "global_step": 544841, "epoch": 6564} {"train_loss": -27.227664947509766, "global_step": 544842, "epoch": 6564} {"train_loss": -27.476043701171875, "global_step": 544843, "epoch": 6564} {"train_loss": -27.327239990234375, "global_step": 544844, "epoch": 6564} {"train_loss": -27.32340431213379, "global_step": 544845, "epoch": 6564} {"train_loss": -27.76641845703125, "global_step": 544846, "epoch": 6564} {"train_loss": -27.159713745117188, "global_step": 544847, "epoch": 6564} {"train_loss": -27.389759063720703, "global_step": 544848, "epoch": 6564} {"train_loss": -27.95304298400879, "global_step": 544849, "epoch": 6564} {"train_loss": -27.458703994750977, "global_step": 544850, "epoch": 6564} {"train_loss": -27.428348541259766, "global_step": 544851, "epoch": 6564} {"train_loss": -27.828245162963867, "global_step": 544852, "epoch": 6564} {"train_loss": -27.60163688659668, "global_step": 544853, "epoch": 6564} {"train_loss": -27.61757469177246, "global_step": 544854, "epoch": 6564} {"train_loss": -27.891469955444336, "global_step": 544855, "epoch": 6564} {"train_loss": -27.62298011779785, "global_step": 544856, "epoch": 6564} {"train_loss": -27.67694091796875, "global_step": 544857, "epoch": 6564} {"train_loss": -27.757232666015625, "global_step": 544858, "epoch": 6564} {"train_loss": -28.090900421142578, "global_step": 544859, "epoch": 6564} {"train_loss": -27.988956451416016, "global_step": 544860, "epoch": 6564} {"train_loss": -27.759174346923828, "global_step": 544861, "epoch": 6564} {"train_loss": -27.84754753112793, "global_step": 544862, "epoch": 6564} {"train_loss": -27.985218048095703, "global_step": 544863, "epoch": 6564} {"train_loss": -27.834409713745117, "global_step": 544864, "epoch": 6564} {"train_loss": -27.586029052734375, "global_step": 544865, "epoch": 6564} {"train_loss": -27.799814224243164, "global_step": 544866, "epoch": 6564} {"train_loss": -27.700464248657227, "global_step": 544867, "epoch": 6564} {"train_loss": -27.3956241607666, "global_step": 544868, "epoch": 6564} {"train_loss": -27.62674331665039, "global_step": 544869, "epoch": 6564} {"train_loss": -27.778156280517578, "global_step": 544870, "epoch": 6564} {"train_loss": -27.8851318359375, "global_step": 544871, "epoch": 6564} {"train_loss": -27.843313217163086, "global_step": 544872, "epoch": 6564} {"train_loss": -27.835630416870117, "global_step": 544873, "epoch": 6564} {"train_loss": -27.61590576171875, "global_step": 544874, "epoch": 6564} {"train_loss": -27.50542640686035, "global_step": 544875, "epoch": 6564} {"train_loss": -27.459857940673828, "global_step": 544876, "epoch": 6564} {"train_loss": -27.427404403686523, "global_step": 544877, "epoch": 6564} {"train_loss": -27.629032135009766, "global_step": 544878, "epoch": 6564} {"train_loss": -27.788211822509766, "global_step": 544879, "epoch": 6564} {"train_loss": -27.649906158447266, "global_step": 544880, "epoch": 6564} {"train_loss": -27.308725357055664, "global_step": 544881, "epoch": 6564} {"train_loss": -27.549535751342773, "global_step": 544882, "epoch": 6564} {"train_loss": -28.113794326782227, "global_step": 544883, "epoch": 6564} {"train_loss": -28.24386978149414, "global_step": 544884, "epoch": 6564} {"train_loss": -27.75819206237793, "global_step": 544885, "epoch": 6564} {"train_loss": -27.491256713867188, "global_step": 544886, "epoch": 6564} {"train_loss": -27.926925659179688, "global_step": 544887, "epoch": 6564} {"train_loss": -27.76861572265625, "global_step": 544888, "epoch": 6564} {"train_loss": -27.38555335998535, "global_step": 544889, "epoch": 6564} {"train_loss": -27.63325309753418, "global_step": 544890, "epoch": 6564} {"train_loss": -27.679523468017578, "global_step": 544891, "epoch": 6564} {"train_loss": -27.985855102539062, "global_step": 544892, "epoch": 6564} {"train_loss": -27.995325088500977, "global_step": 544893, "epoch": 6564} {"train_loss": -27.4899781928005, "global_step": 544894, "epoch": 6564, "val_loss": 6615190.0} {"train_loss": -27.5429744720459, "global_step": 544895, "epoch": 6565} {"train_loss": -27.500537872314453, "global_step": 544896, "epoch": 6565} {"train_loss": -27.412694931030273, "global_step": 544897, "epoch": 6565} {"train_loss": -27.535160064697266, "global_step": 544898, "epoch": 6565} {"train_loss": -27.248550415039062, "global_step": 544899, "epoch": 6565} {"train_loss": -27.23101234436035, "global_step": 544900, "epoch": 6565} {"train_loss": -26.973987579345703, "global_step": 544901, "epoch": 6565} {"train_loss": -26.8249454498291, "global_step": 544902, "epoch": 6565} {"train_loss": -27.597864151000977, "global_step": 544903, "epoch": 6565} {"train_loss": -26.913339614868164, "global_step": 544904, "epoch": 6565} {"train_loss": -26.619043350219727, "global_step": 544905, "epoch": 6565} {"train_loss": -27.35922622680664, "global_step": 544906, "epoch": 6565} {"train_loss": -27.413684844970703, "global_step": 544907, "epoch": 6565} {"train_loss": -27.471607208251953, "global_step": 544908, "epoch": 6565} {"train_loss": -26.89777183532715, "global_step": 544909, "epoch": 6565} {"train_loss": -27.094213485717773, "global_step": 544910, "epoch": 6565} {"train_loss": -27.401533126831055, "global_step": 544911, "epoch": 6565} {"train_loss": -27.608978271484375, "global_step": 544912, "epoch": 6565} {"train_loss": -27.266294479370117, "global_step": 544913, "epoch": 6565} {"train_loss": -27.357446670532227, "global_step": 544914, "epoch": 6565} {"train_loss": -27.819726943969727, "global_step": 544915, "epoch": 6565} {"train_loss": -27.320470809936523, "global_step": 544916, "epoch": 6565} {"train_loss": -27.779876708984375, "global_step": 544917, "epoch": 6565} {"train_loss": -27.487043380737305, "global_step": 544918, "epoch": 6565} {"train_loss": -27.439916610717773, "global_step": 544919, "epoch": 6565} {"train_loss": -28.111474990844727, "global_step": 544920, "epoch": 6565} {"train_loss": -27.554471969604492, "global_step": 544921, "epoch": 6565} {"train_loss": -27.953893661499023, "global_step": 544922, "epoch": 6565} {"train_loss": -27.60855484008789, "global_step": 544923, "epoch": 6565} {"train_loss": -27.74249267578125, "global_step": 544924, "epoch": 6565} {"train_loss": -27.634061813354492, "global_step": 544925, "epoch": 6565} {"train_loss": -28.03460693359375, "global_step": 544926, "epoch": 6565} {"train_loss": -27.90384292602539, "global_step": 544927, "epoch": 6565} {"train_loss": -27.504547119140625, "global_step": 544928, "epoch": 6565} {"train_loss": -27.89129638671875, "global_step": 544929, "epoch": 6565} {"train_loss": -28.013671875, "global_step": 544930, "epoch": 6565} {"train_loss": -27.604816436767578, "global_step": 544931, "epoch": 6565} {"train_loss": -27.839452743530273, "global_step": 544932, "epoch": 6565} {"train_loss": -27.741907119750977, "global_step": 544933, "epoch": 6565} {"train_loss": -27.6337890625, "global_step": 544934, "epoch": 6565} {"train_loss": -27.857275009155273, "global_step": 544935, "epoch": 6565} {"train_loss": -27.74912452697754, "global_step": 544936, "epoch": 6565} {"train_loss": -27.663293838500977, "global_step": 544937, "epoch": 6565} {"train_loss": -27.791173934936523, "global_step": 544938, "epoch": 6565} {"train_loss": -27.82105827331543, "global_step": 544939, "epoch": 6565} {"train_loss": -27.8944034576416, "global_step": 544940, "epoch": 6565} {"train_loss": -27.539520263671875, "global_step": 544941, "epoch": 6565} {"train_loss": -27.858112335205078, "global_step": 544942, "epoch": 6565} {"train_loss": -27.754302978515625, "global_step": 544943, "epoch": 6565} {"train_loss": -28.52166748046875, "global_step": 544944, "epoch": 6565} {"train_loss": -28.027286529541016, "global_step": 544945, "epoch": 6565} {"train_loss": -27.489721298217773, "global_step": 544946, "epoch": 6565} {"train_loss": -27.844852447509766, "global_step": 544947, "epoch": 6565} {"train_loss": -27.664167404174805, "global_step": 544948, "epoch": 6565} {"train_loss": -27.74344825744629, "global_step": 544949, "epoch": 6565} {"train_loss": -27.506174087524414, "global_step": 544950, "epoch": 6565} {"train_loss": -27.506399154663086, "global_step": 544951, "epoch": 6565} {"train_loss": -27.4750919342041, "global_step": 544952, "epoch": 6565} {"train_loss": -28.06549644470215, "global_step": 544953, "epoch": 6565} {"train_loss": -27.842016220092773, "global_step": 544954, "epoch": 6565} {"train_loss": -27.2373046875, "global_step": 544955, "epoch": 6565} {"train_loss": -27.732492446899414, "global_step": 544956, "epoch": 6565} {"train_loss": -27.688358306884766, "global_step": 544957, "epoch": 6565} {"train_loss": -27.69768714904785, "global_step": 544958, "epoch": 6565} {"train_loss": -27.684301376342773, "global_step": 544959, "epoch": 6565} {"train_loss": -27.9517879486084, "global_step": 544960, "epoch": 6565} {"train_loss": -27.950098037719727, "global_step": 544961, "epoch": 6565} {"train_loss": -28.0430850982666, "global_step": 544962, "epoch": 6565} {"train_loss": -27.747100830078125, "global_step": 544963, "epoch": 6565} {"train_loss": -27.786182403564453, "global_step": 544964, "epoch": 6565} {"train_loss": -27.91926383972168, "global_step": 544965, "epoch": 6565} {"train_loss": -27.88115882873535, "global_step": 544966, "epoch": 6565} {"train_loss": -27.807031631469727, "global_step": 544967, "epoch": 6565} {"train_loss": -28.086023330688477, "global_step": 544968, "epoch": 6565} {"train_loss": -27.794179916381836, "global_step": 544969, "epoch": 6565} {"train_loss": -27.730926513671875, "global_step": 544970, "epoch": 6565} {"train_loss": -28.152631759643555, "global_step": 544971, "epoch": 6565} {"train_loss": -27.682050704956055, "global_step": 544972, "epoch": 6565} {"train_loss": -27.387638092041016, "global_step": 544973, "epoch": 6565} {"train_loss": -27.835424423217773, "global_step": 544974, "epoch": 6565} {"train_loss": -27.251127243041992, "global_step": 544975, "epoch": 6565} {"train_loss": -27.70339012145996, "global_step": 544976, "epoch": 6565} {"train_loss": -27.642223978617107, "global_step": 544977, "epoch": 6565, "val_loss": 6563195.0} {"train_loss": -26.559375762939453, "global_step": 544978, "epoch": 6566} {"train_loss": -25.287382125854492, "global_step": 544979, "epoch": 6566} {"train_loss": -24.821802139282227, "global_step": 544980, "epoch": 6566} {"train_loss": -25.65126609802246, "global_step": 544981, "epoch": 6566} {"train_loss": -26.271377563476562, "global_step": 544982, "epoch": 6566} {"train_loss": -27.133275985717773, "global_step": 544983, "epoch": 6566} {"train_loss": -26.502044677734375, "global_step": 544984, "epoch": 6566} {"train_loss": -26.350723266601562, "global_step": 544985, "epoch": 6566} {"train_loss": -26.779340744018555, "global_step": 544986, "epoch": 6566} {"train_loss": -26.776357650756836, "global_step": 544987, "epoch": 6566} {"train_loss": -26.939838409423828, "global_step": 544988, "epoch": 6566} {"train_loss": -27.375308990478516, "global_step": 544989, "epoch": 6566} {"train_loss": -27.189416885375977, "global_step": 544990, "epoch": 6566} {"train_loss": -26.8515567779541, "global_step": 544991, "epoch": 6566} {"train_loss": -26.8522891998291, "global_step": 544992, "epoch": 6566} {"train_loss": -27.54037857055664, "global_step": 544993, "epoch": 6566} {"train_loss": -27.130537033081055, "global_step": 544994, "epoch": 6566} {"train_loss": -27.586210250854492, "global_step": 544995, "epoch": 6566} {"train_loss": -27.251134872436523, "global_step": 544996, "epoch": 6566} {"train_loss": -27.2804012298584, "global_step": 544997, "epoch": 6566} {"train_loss": -27.638540267944336, "global_step": 544998, "epoch": 6566} {"train_loss": -27.41875648498535, "global_step": 544999, "epoch": 6566} {"train_loss": -27.558151245117188, "global_step": 545000, "epoch": 6566} {"train_loss": -27.554479598999023, "global_step": 545001, "epoch": 6566} {"train_loss": -27.53199577331543, "global_step": 545002, "epoch": 6566} {"train_loss": -27.781049728393555, "global_step": 545003, "epoch": 6566} {"train_loss": -27.519489288330078, "global_step": 545004, "epoch": 6566} {"train_loss": -27.700820922851562, "global_step": 545005, "epoch": 6566} {"train_loss": -27.5263729095459, "global_step": 545006, "epoch": 6566} {"train_loss": -27.768451690673828, "global_step": 545007, "epoch": 6566} {"train_loss": -27.538671493530273, "global_step": 545008, "epoch": 6566} {"train_loss": -27.863500595092773, "global_step": 545009, "epoch": 6566} {"train_loss": -27.959259033203125, "global_step": 545010, "epoch": 6566} {"train_loss": -28.07771110534668, "global_step": 545011, "epoch": 6566} {"train_loss": -27.710538864135742, "global_step": 545012, "epoch": 6566} {"train_loss": -27.81231689453125, "global_step": 545013, "epoch": 6566} {"train_loss": -27.70254898071289, "global_step": 545014, "epoch": 6566} {"train_loss": -28.142797470092773, "global_step": 545015, "epoch": 6566} {"train_loss": -27.633895874023438, "global_step": 545016, "epoch": 6566} {"train_loss": -27.81476402282715, "global_step": 545017, "epoch": 6566} {"train_loss": -27.792560577392578, "global_step": 545018, "epoch": 6566} {"train_loss": -27.911359786987305, "global_step": 545019, "epoch": 6566} {"train_loss": -27.796579360961914, "global_step": 545020, "epoch": 6566} {"train_loss": -28.295495986938477, "global_step": 545021, "epoch": 6566} {"train_loss": -27.652124404907227, "global_step": 545022, "epoch": 6566} {"train_loss": -27.4724178314209, "global_step": 545023, "epoch": 6566} {"train_loss": -27.697355270385742, "global_step": 545024, "epoch": 6566} {"train_loss": -27.91644287109375, "global_step": 545025, "epoch": 6566} {"train_loss": -27.76938819885254, "global_step": 545026, "epoch": 6566} {"train_loss": -27.88421630859375, "global_step": 545027, "epoch": 6566} {"train_loss": -27.954288482666016, "global_step": 545028, "epoch": 6566} {"train_loss": -27.659833908081055, "global_step": 545029, "epoch": 6566} {"train_loss": -28.07452964782715, "global_step": 545030, "epoch": 6566} {"train_loss": -28.083282470703125, "global_step": 545031, "epoch": 6566} {"train_loss": -27.76618766784668, "global_step": 545032, "epoch": 6566} {"train_loss": -27.88809585571289, "global_step": 545033, "epoch": 6566} {"train_loss": -27.59724998474121, "global_step": 545034, "epoch": 6566} {"train_loss": -28.10527992248535, "global_step": 545035, "epoch": 6566} {"train_loss": -27.41969108581543, "global_step": 545036, "epoch": 6566} {"train_loss": -27.627887725830078, "global_step": 545037, "epoch": 6566} {"train_loss": -27.72621726989746, "global_step": 545038, "epoch": 6566} {"train_loss": -27.6229190826416, "global_step": 545039, "epoch": 6566} {"train_loss": -27.657318115234375, "global_step": 545040, "epoch": 6566} {"train_loss": -27.656085968017578, "global_step": 545041, "epoch": 6566} {"train_loss": -27.784814834594727, "global_step": 545042, "epoch": 6566} {"train_loss": -28.0373477935791, "global_step": 545043, "epoch": 6566} {"train_loss": -27.605777740478516, "global_step": 545044, "epoch": 6566} {"train_loss": -27.718774795532227, "global_step": 545045, "epoch": 6566} {"train_loss": -27.605304718017578, "global_step": 545046, "epoch": 6566} {"train_loss": -27.8710880279541, "global_step": 545047, "epoch": 6566} {"train_loss": -27.93902015686035, "global_step": 545048, "epoch": 6566} {"train_loss": -27.75748634338379, "global_step": 545049, "epoch": 6566} {"train_loss": -27.339258193969727, "global_step": 545050, "epoch": 6566} {"train_loss": -27.427139282226562, "global_step": 545051, "epoch": 6566} {"train_loss": -27.351789474487305, "global_step": 545052, "epoch": 6566} {"train_loss": -26.74812889099121, "global_step": 545053, "epoch": 6566} {"train_loss": -26.66550636291504, "global_step": 545054, "epoch": 6566} {"train_loss": -27.226160049438477, "global_step": 545055, "epoch": 6566} {"train_loss": -27.943115234375, "global_step": 545056, "epoch": 6566} {"train_loss": -27.514392852783203, "global_step": 545057, "epoch": 6566} {"train_loss": -27.169408798217773, "global_step": 545058, "epoch": 6566} {"train_loss": -27.58623695373535, "global_step": 545059, "epoch": 6566} {"train_loss": -27.437610373439558, "global_step": 545060, "epoch": 6566, "val_loss": 6615313.0} {"train_loss": -27.0306339263916, "global_step": 545061, "epoch": 6567} {"train_loss": -27.00337791442871, "global_step": 545062, "epoch": 6567} {"train_loss": -27.527740478515625, "global_step": 545063, "epoch": 6567} {"train_loss": -27.12306022644043, "global_step": 545064, "epoch": 6567} {"train_loss": -27.077056884765625, "global_step": 545065, "epoch": 6567} {"train_loss": -27.18320655822754, "global_step": 545066, "epoch": 6567} {"train_loss": -27.3635311126709, "global_step": 545067, "epoch": 6567} {"train_loss": -26.9589900970459, "global_step": 545068, "epoch": 6567} {"train_loss": -27.493682861328125, "global_step": 545069, "epoch": 6567} {"train_loss": -27.10530662536621, "global_step": 545070, "epoch": 6567} {"train_loss": -27.25324058532715, "global_step": 545071, "epoch": 6567} {"train_loss": -27.303369522094727, "global_step": 545072, "epoch": 6567} {"train_loss": -27.746774673461914, "global_step": 545073, "epoch": 6567} {"train_loss": -27.507654190063477, "global_step": 545074, "epoch": 6567} {"train_loss": -27.51041030883789, "global_step": 545075, "epoch": 6567} {"train_loss": -27.64865493774414, "global_step": 545076, "epoch": 6567} {"train_loss": -27.72505760192871, "global_step": 545077, "epoch": 6567} {"train_loss": -28.083332061767578, "global_step": 545078, "epoch": 6567} {"train_loss": -27.157257080078125, "global_step": 545079, "epoch": 6567} {"train_loss": -27.78558921813965, "global_step": 545080, "epoch": 6567} {"train_loss": -27.842731475830078, "global_step": 545081, "epoch": 6567} {"train_loss": -27.96986198425293, "global_step": 545082, "epoch": 6567} {"train_loss": -28.03622817993164, "global_step": 545083, "epoch": 6567} {"train_loss": -28.028867721557617, "global_step": 545084, "epoch": 6567} {"train_loss": -27.797582626342773, "global_step": 545085, "epoch": 6567} {"train_loss": -27.606138229370117, "global_step": 545086, "epoch": 6567} {"train_loss": -27.617355346679688, "global_step": 545087, "epoch": 6567} {"train_loss": -27.778295516967773, "global_step": 545088, "epoch": 6567} {"train_loss": -27.73105812072754, "global_step": 545089, "epoch": 6567} {"train_loss": -27.8171443939209, "global_step": 545090, "epoch": 6567} {"train_loss": -27.952930450439453, "global_step": 545091, "epoch": 6567} {"train_loss": -27.633569717407227, "global_step": 545092, "epoch": 6567} {"train_loss": -27.709991455078125, "global_step": 545093, "epoch": 6567} {"train_loss": -27.819705963134766, "global_step": 545094, "epoch": 6567} {"train_loss": -27.509571075439453, "global_step": 545095, "epoch": 6567} {"train_loss": -27.4371337890625, "global_step": 545096, "epoch": 6567} {"train_loss": -27.9962215423584, "global_step": 545097, "epoch": 6567} {"train_loss": -27.614917755126953, "global_step": 545098, "epoch": 6567} {"train_loss": -27.827823638916016, "global_step": 545099, "epoch": 6567} {"train_loss": -28.195022583007812, "global_step": 545100, "epoch": 6567} {"train_loss": -27.651874542236328, "global_step": 545101, "epoch": 6567} {"train_loss": -27.81745719909668, "global_step": 545102, "epoch": 6567} {"train_loss": -27.8809757232666, "global_step": 545103, "epoch": 6567} {"train_loss": -27.69508934020996, "global_step": 545104, "epoch": 6567} {"train_loss": -27.94964027404785, "global_step": 545105, "epoch": 6567} {"train_loss": -27.773319244384766, "global_step": 545106, "epoch": 6567} {"train_loss": -27.49102210998535, "global_step": 545107, "epoch": 6567} {"train_loss": -27.77703857421875, "global_step": 545108, "epoch": 6567} {"train_loss": -27.952228546142578, "global_step": 545109, "epoch": 6567} {"train_loss": -27.81048011779785, "global_step": 545110, "epoch": 6567} {"train_loss": -27.915042877197266, "global_step": 545111, "epoch": 6567} {"train_loss": -27.85981559753418, "global_step": 545112, "epoch": 6567} {"train_loss": -28.11040687561035, "global_step": 545113, "epoch": 6567} {"train_loss": -27.433130264282227, "global_step": 545114, "epoch": 6567} {"train_loss": -27.5161075592041, "global_step": 545115, "epoch": 6567} {"train_loss": -27.674707412719727, "global_step": 545116, "epoch": 6567} {"train_loss": -27.59491539001465, "global_step": 545117, "epoch": 6567} {"train_loss": -28.005273818969727, "global_step": 545118, "epoch": 6567} {"train_loss": -28.062744140625, "global_step": 545119, "epoch": 6567} {"train_loss": -27.810577392578125, "global_step": 545120, "epoch": 6567} {"train_loss": -27.567663192749023, "global_step": 545121, "epoch": 6567} {"train_loss": -27.60400390625, "global_step": 545122, "epoch": 6567} {"train_loss": -28.01797866821289, "global_step": 545123, "epoch": 6567} {"train_loss": -27.765897750854492, "global_step": 545124, "epoch": 6567} {"train_loss": -27.5191593170166, "global_step": 545125, "epoch": 6567} {"train_loss": -26.86797523498535, "global_step": 545126, "epoch": 6567} {"train_loss": -26.4699764251709, "global_step": 545127, "epoch": 6567} {"train_loss": -26.899417877197266, "global_step": 545128, "epoch": 6567} {"train_loss": -27.992572784423828, "global_step": 545129, "epoch": 6567} {"train_loss": -27.3582763671875, "global_step": 545130, "epoch": 6567} {"train_loss": -27.412128448486328, "global_step": 545131, "epoch": 6567} {"train_loss": -26.96700096130371, "global_step": 545132, "epoch": 6567} {"train_loss": -27.948108673095703, "global_step": 545133, "epoch": 6567} {"train_loss": -27.575361251831055, "global_step": 545134, "epoch": 6567} {"train_loss": -27.7780818939209, "global_step": 545135, "epoch": 6567} {"train_loss": -27.710865020751953, "global_step": 545136, "epoch": 6567} {"train_loss": -27.26859474182129, "global_step": 545137, "epoch": 6567} {"train_loss": -27.35186767578125, "global_step": 545138, "epoch": 6567} {"train_loss": -27.644254684448242, "global_step": 545139, "epoch": 6567} {"train_loss": -27.81233024597168, "global_step": 545140, "epoch": 6567} {"train_loss": -27.027612686157227, "global_step": 545141, "epoch": 6567} {"train_loss": -27.61274528503418, "global_step": 545142, "epoch": 6567} {"train_loss": -27.601327160754835, "global_step": 545143, "epoch": 6567, "val_loss": 6620551.0} {"train_loss": -27.409814834594727, "global_step": 545144, "epoch": 6568} {"train_loss": -27.650068283081055, "global_step": 545145, "epoch": 6568} {"train_loss": -27.584989547729492, "global_step": 545146, "epoch": 6568} {"train_loss": -27.79334831237793, "global_step": 545147, "epoch": 6568} {"train_loss": -27.404560089111328, "global_step": 545148, "epoch": 6568} {"train_loss": -27.38348960876465, "global_step": 545149, "epoch": 6568} {"train_loss": -27.268264770507812, "global_step": 545150, "epoch": 6568} {"train_loss": -27.45362663269043, "global_step": 545151, "epoch": 6568} {"train_loss": -27.778076171875, "global_step": 545152, "epoch": 6568} {"train_loss": -27.639596939086914, "global_step": 545153, "epoch": 6568} {"train_loss": -27.275121688842773, "global_step": 545154, "epoch": 6568} {"train_loss": -28.044382095336914, "global_step": 545155, "epoch": 6568} {"train_loss": -27.565631866455078, "global_step": 545156, "epoch": 6568} {"train_loss": -27.435882568359375, "global_step": 545157, "epoch": 6568} {"train_loss": -27.77886962890625, "global_step": 545158, "epoch": 6568} {"train_loss": -27.205617904663086, "global_step": 545159, "epoch": 6568} {"train_loss": -27.972028732299805, "global_step": 545160, "epoch": 6568} {"train_loss": -27.498188018798828, "global_step": 545161, "epoch": 6568} {"train_loss": -27.710535049438477, "global_step": 545162, "epoch": 6568} {"train_loss": -27.7318058013916, "global_step": 545163, "epoch": 6568} {"train_loss": -27.690053939819336, "global_step": 545164, "epoch": 6568} {"train_loss": -27.7269229888916, "global_step": 545165, "epoch": 6568} {"train_loss": -27.78794288635254, "global_step": 545166, "epoch": 6568} {"train_loss": -27.482404708862305, "global_step": 545167, "epoch": 6568} {"train_loss": -27.913818359375, "global_step": 545168, "epoch": 6568} {"train_loss": -27.67840576171875, "global_step": 545169, "epoch": 6568} {"train_loss": -27.8796443939209, "global_step": 545170, "epoch": 6568} {"train_loss": -27.515583038330078, "global_step": 545171, "epoch": 6568} {"train_loss": -27.687162399291992, "global_step": 545172, "epoch": 6568} {"train_loss": -27.682641983032227, "global_step": 545173, "epoch": 6568} {"train_loss": -27.71294593811035, "global_step": 545174, "epoch": 6568} {"train_loss": -27.88177490234375, "global_step": 545175, "epoch": 6568} {"train_loss": -27.989171981811523, "global_step": 545176, "epoch": 6568} {"train_loss": -27.624258041381836, "global_step": 545177, "epoch": 6568} {"train_loss": -27.781415939331055, "global_step": 545178, "epoch": 6568} {"train_loss": -27.712936401367188, "global_step": 545179, "epoch": 6568} {"train_loss": -28.099740982055664, "global_step": 545180, "epoch": 6568} {"train_loss": -28.0009765625, "global_step": 545181, "epoch": 6568} {"train_loss": -27.80328369140625, "global_step": 545182, "epoch": 6568} {"train_loss": -27.5777645111084, "global_step": 545183, "epoch": 6568} {"train_loss": -27.224943161010742, "global_step": 545184, "epoch": 6568} {"train_loss": -26.531641006469727, "global_step": 545185, "epoch": 6568} {"train_loss": -26.815387725830078, "global_step": 545186, "epoch": 6568} {"train_loss": -27.94268798828125, "global_step": 545187, "epoch": 6568} {"train_loss": -27.26944923400879, "global_step": 545188, "epoch": 6568} {"train_loss": -27.344196319580078, "global_step": 545189, "epoch": 6568} {"train_loss": -27.583349227905273, "global_step": 545190, "epoch": 6568} {"train_loss": -27.476125717163086, "global_step": 545191, "epoch": 6568} {"train_loss": -27.679197311401367, "global_step": 545192, "epoch": 6568} {"train_loss": -27.393457412719727, "global_step": 545193, "epoch": 6568} {"train_loss": -27.455251693725586, "global_step": 545194, "epoch": 6568} {"train_loss": -27.285781860351562, "global_step": 545195, "epoch": 6568} {"train_loss": -27.762678146362305, "global_step": 545196, "epoch": 6568} {"train_loss": -26.935611724853516, "global_step": 545197, "epoch": 6568} {"train_loss": -27.8964900970459, "global_step": 545198, "epoch": 6568} {"train_loss": -27.5466251373291, "global_step": 545199, "epoch": 6568} {"train_loss": -27.574995040893555, "global_step": 545200, "epoch": 6568} {"train_loss": -27.600000381469727, "global_step": 545201, "epoch": 6568} {"train_loss": -27.750574111938477, "global_step": 545202, "epoch": 6568} {"train_loss": -27.360599517822266, "global_step": 545203, "epoch": 6568} {"train_loss": -27.6328067779541, "global_step": 545204, "epoch": 6568} {"train_loss": -27.49579429626465, "global_step": 545205, "epoch": 6568} {"train_loss": -27.516544342041016, "global_step": 545206, "epoch": 6568} {"train_loss": -27.437896728515625, "global_step": 545207, "epoch": 6568} {"train_loss": -27.165287017822266, "global_step": 545208, "epoch": 6568} {"train_loss": -27.638416290283203, "global_step": 545209, "epoch": 6568} {"train_loss": -27.61065101623535, "global_step": 545210, "epoch": 6568} {"train_loss": -27.657678604125977, "global_step": 545211, "epoch": 6568} {"train_loss": -27.57843589782715, "global_step": 545212, "epoch": 6568} {"train_loss": -27.407611846923828, "global_step": 545213, "epoch": 6568} {"train_loss": -27.935094833374023, "global_step": 545214, "epoch": 6568} {"train_loss": -27.842700958251953, "global_step": 545215, "epoch": 6568} {"train_loss": -27.889190673828125, "global_step": 545216, "epoch": 6568} {"train_loss": -27.886554718017578, "global_step": 545217, "epoch": 6568} {"train_loss": -27.525543212890625, "global_step": 545218, "epoch": 6568} {"train_loss": -27.890872955322266, "global_step": 545219, "epoch": 6568} {"train_loss": -27.48219108581543, "global_step": 545220, "epoch": 6568} {"train_loss": -27.4957332611084, "global_step": 545221, "epoch": 6568} {"train_loss": -27.880964279174805, "global_step": 545222, "epoch": 6568} {"train_loss": -28.072772979736328, "global_step": 545223, "epoch": 6568} {"train_loss": -27.703292846679688, "global_step": 545224, "epoch": 6568} {"train_loss": -28.003183364868164, "global_step": 545225, "epoch": 6568} {"train_loss": -27.607872147157966, "global_step": 545226, "epoch": 6568, "val_loss": 6549032.0} {"train_loss": -27.841222763061523, "global_step": 545227, "epoch": 6569} {"train_loss": -27.714258193969727, "global_step": 545228, "epoch": 6569} {"train_loss": -27.551786422729492, "global_step": 545229, "epoch": 6569} {"train_loss": -27.694446563720703, "global_step": 545230, "epoch": 6569} {"train_loss": -27.72648048400879, "global_step": 545231, "epoch": 6569} {"train_loss": -27.662580490112305, "global_step": 545232, "epoch": 6569} {"train_loss": -27.2235050201416, "global_step": 545233, "epoch": 6569} {"train_loss": -27.83827018737793, "global_step": 545234, "epoch": 6569} {"train_loss": -27.916385650634766, "global_step": 545235, "epoch": 6569} {"train_loss": -27.76276969909668, "global_step": 545236, "epoch": 6569} {"train_loss": -27.4322509765625, "global_step": 545237, "epoch": 6569} {"train_loss": -27.760068893432617, "global_step": 545238, "epoch": 6569} {"train_loss": -27.733991622924805, "global_step": 545239, "epoch": 6569} {"train_loss": -27.939844131469727, "global_step": 545240, "epoch": 6569} {"train_loss": -27.762372970581055, "global_step": 545241, "epoch": 6569} {"train_loss": -27.154870986938477, "global_step": 545242, "epoch": 6569} {"train_loss": -27.177595138549805, "global_step": 545243, "epoch": 6569} {"train_loss": -27.15791130065918, "global_step": 545244, "epoch": 6569} {"train_loss": -28.09003257751465, "global_step": 545245, "epoch": 6569} {"train_loss": -27.87105369567871, "global_step": 545246, "epoch": 6569} {"train_loss": -27.588394165039062, "global_step": 545247, "epoch": 6569} {"train_loss": -27.590173721313477, "global_step": 545248, "epoch": 6569} {"train_loss": -27.592023849487305, "global_step": 545249, "epoch": 6569} {"train_loss": -27.927331924438477, "global_step": 545250, "epoch": 6569} {"train_loss": -27.960214614868164, "global_step": 545251, "epoch": 6569} {"train_loss": -27.83216667175293, "global_step": 545252, "epoch": 6569} {"train_loss": -27.83223533630371, "global_step": 545253, "epoch": 6569} {"train_loss": -27.80423927307129, "global_step": 545254, "epoch": 6569} {"train_loss": -27.63605308532715, "global_step": 545255, "epoch": 6569} {"train_loss": -27.781946182250977, "global_step": 545256, "epoch": 6569} {"train_loss": -27.91340446472168, "global_step": 545257, "epoch": 6569} {"train_loss": -28.047414779663086, "global_step": 545258, "epoch": 6569} {"train_loss": -27.8127384185791, "global_step": 545259, "epoch": 6569} {"train_loss": -27.58194351196289, "global_step": 545260, "epoch": 6569} {"train_loss": -27.63325309753418, "global_step": 545261, "epoch": 6569} {"train_loss": -27.78887367248535, "global_step": 545262, "epoch": 6569} {"train_loss": -27.932188034057617, "global_step": 545263, "epoch": 6569} {"train_loss": -27.72736167907715, "global_step": 545264, "epoch": 6569} {"train_loss": -28.014270782470703, "global_step": 545265, "epoch": 6569} {"train_loss": -27.679868698120117, "global_step": 545266, "epoch": 6569} {"train_loss": -27.74853515625, "global_step": 545267, "epoch": 6569} {"train_loss": -27.570295333862305, "global_step": 545268, "epoch": 6569} {"train_loss": -27.649261474609375, "global_step": 545269, "epoch": 6569} {"train_loss": -27.496417999267578, "global_step": 545270, "epoch": 6569} {"train_loss": -27.8963680267334, "global_step": 545271, "epoch": 6569} {"train_loss": -27.83736228942871, "global_step": 545272, "epoch": 6569} {"train_loss": -27.510602951049805, "global_step": 545273, "epoch": 6569} {"train_loss": -27.84063148498535, "global_step": 545274, "epoch": 6569} {"train_loss": -28.009973526000977, "global_step": 545275, "epoch": 6569} {"train_loss": -27.699237823486328, "global_step": 545276, "epoch": 6569} {"train_loss": -27.152618408203125, "global_step": 545277, "epoch": 6569} {"train_loss": -27.779233932495117, "global_step": 545278, "epoch": 6569} {"train_loss": -27.9439754486084, "global_step": 545279, "epoch": 6569} {"train_loss": -27.907617568969727, "global_step": 545280, "epoch": 6569} {"train_loss": -27.693445205688477, "global_step": 545281, "epoch": 6569} {"train_loss": -27.95016860961914, "global_step": 545282, "epoch": 6569} {"train_loss": -27.791213989257812, "global_step": 545283, "epoch": 6569} {"train_loss": -28.2797908782959, "global_step": 545284, "epoch": 6569} {"train_loss": -27.534011840820312, "global_step": 545285, "epoch": 6569} {"train_loss": -27.81992530822754, "global_step": 545286, "epoch": 6569} {"train_loss": -27.371856689453125, "global_step": 545287, "epoch": 6569} {"train_loss": -27.421863555908203, "global_step": 545288, "epoch": 6569} {"train_loss": -27.9316349029541, "global_step": 545289, "epoch": 6569} {"train_loss": -27.705724716186523, "global_step": 545290, "epoch": 6569} {"train_loss": -27.876571655273438, "global_step": 545291, "epoch": 6569} {"train_loss": -27.93161392211914, "global_step": 545292, "epoch": 6569} {"train_loss": -28.022079467773438, "global_step": 545293, "epoch": 6569} {"train_loss": -27.943872451782227, "global_step": 545294, "epoch": 6569} {"train_loss": -27.685754776000977, "global_step": 545295, "epoch": 6569} {"train_loss": -27.68706703186035, "global_step": 545296, "epoch": 6569} {"train_loss": -27.609180450439453, "global_step": 545297, "epoch": 6569} {"train_loss": -27.7453670501709, "global_step": 545298, "epoch": 6569} {"train_loss": -27.70120620727539, "global_step": 545299, "epoch": 6569} {"train_loss": -27.903949737548828, "global_step": 545300, "epoch": 6569} {"train_loss": -28.023359298706055, "global_step": 545301, "epoch": 6569} {"train_loss": -27.204681396484375, "global_step": 545302, "epoch": 6569} {"train_loss": -27.118423461914062, "global_step": 545303, "epoch": 6569} {"train_loss": -26.584705352783203, "global_step": 545304, "epoch": 6569} {"train_loss": -26.74738883972168, "global_step": 545305, "epoch": 6569} {"train_loss": -27.824005126953125, "global_step": 545306, "epoch": 6569} {"train_loss": -26.788000106811523, "global_step": 545307, "epoch": 6569} {"train_loss": -27.543066024780273, "global_step": 545308, "epoch": 6569} {"train_loss": -27.697286628815064, "global_step": 545309, "epoch": 6569, "val_loss": 6556852.0} {"train_loss": -27.452184677124023, "global_step": 545310, "epoch": 6570} {"train_loss": -26.90961265563965, "global_step": 545311, "epoch": 6570} {"train_loss": -27.367895126342773, "global_step": 545312, "epoch": 6570} {"train_loss": -26.860614776611328, "global_step": 545313, "epoch": 6570} {"train_loss": -26.66552734375, "global_step": 545314, "epoch": 6570} {"train_loss": -27.254926681518555, "global_step": 545315, "epoch": 6570} {"train_loss": -27.042993545532227, "global_step": 545316, "epoch": 6570} {"train_loss": -27.509296417236328, "global_step": 545317, "epoch": 6570} {"train_loss": -27.231191635131836, "global_step": 545318, "epoch": 6570} {"train_loss": -27.1767578125, "global_step": 545319, "epoch": 6570} {"train_loss": -26.932470321655273, "global_step": 545320, "epoch": 6570} {"train_loss": -27.187910079956055, "global_step": 545321, "epoch": 6570} {"train_loss": -27.1987247467041, "global_step": 545322, "epoch": 6570} {"train_loss": -27.06036376953125, "global_step": 545323, "epoch": 6570} {"train_loss": -27.312915802001953, "global_step": 545324, "epoch": 6570} {"train_loss": -27.055646896362305, "global_step": 545325, "epoch": 6570} {"train_loss": -27.452316284179688, "global_step": 545326, "epoch": 6570} {"train_loss": -27.382116317749023, "global_step": 545327, "epoch": 6570} {"train_loss": -27.5942325592041, "global_step": 545328, "epoch": 6570} {"train_loss": -27.315969467163086, "global_step": 545329, "epoch": 6570} {"train_loss": -27.316404342651367, "global_step": 545330, "epoch": 6570} {"train_loss": -27.48541831970215, "global_step": 545331, "epoch": 6570} {"train_loss": -27.87049674987793, "global_step": 545332, "epoch": 6570} {"train_loss": -27.79974365234375, "global_step": 545333, "epoch": 6570} {"train_loss": -27.432626724243164, "global_step": 545334, "epoch": 6570} {"train_loss": -27.702728271484375, "global_step": 545335, "epoch": 6570} {"train_loss": -27.186933517456055, "global_step": 545336, "epoch": 6570} {"train_loss": -27.725385665893555, "global_step": 545337, "epoch": 6570} {"train_loss": -27.653966903686523, "global_step": 545338, "epoch": 6570} {"train_loss": -27.2083797454834, "global_step": 545339, "epoch": 6570} {"train_loss": -27.544946670532227, "global_step": 545340, "epoch": 6570} {"train_loss": -27.687747955322266, "global_step": 545341, "epoch": 6570} {"train_loss": -27.563207626342773, "global_step": 545342, "epoch": 6570} {"train_loss": -27.82511329650879, "global_step": 545343, "epoch": 6570} {"train_loss": -27.585416793823242, "global_step": 545344, "epoch": 6570} {"train_loss": -27.6932430267334, "global_step": 545345, "epoch": 6570} {"train_loss": -27.611658096313477, "global_step": 545346, "epoch": 6570} {"train_loss": -27.414417266845703, "global_step": 545347, "epoch": 6570} {"train_loss": -27.64023208618164, "global_step": 545348, "epoch": 6570} {"train_loss": -27.748016357421875, "global_step": 545349, "epoch": 6570} {"train_loss": -28.059049606323242, "global_step": 545350, "epoch": 6570} {"train_loss": -27.897626876831055, "global_step": 545351, "epoch": 6570} {"train_loss": -28.02727699279785, "global_step": 545352, "epoch": 6570} {"train_loss": -27.683141708374023, "global_step": 545353, "epoch": 6570} {"train_loss": -27.922277450561523, "global_step": 545354, "epoch": 6570} {"train_loss": -27.61744499206543, "global_step": 545355, "epoch": 6570} {"train_loss": -27.804487228393555, "global_step": 545356, "epoch": 6570} {"train_loss": -27.64056396484375, "global_step": 545357, "epoch": 6570} {"train_loss": -27.615100860595703, "global_step": 545358, "epoch": 6570} {"train_loss": -27.945173263549805, "global_step": 545359, "epoch": 6570} {"train_loss": -27.842147827148438, "global_step": 545360, "epoch": 6570} {"train_loss": -28.1839656829834, "global_step": 545361, "epoch": 6570} {"train_loss": -27.676300048828125, "global_step": 545362, "epoch": 6570} {"train_loss": -27.8857421875, "global_step": 545363, "epoch": 6570} {"train_loss": -27.9566707611084, "global_step": 545364, "epoch": 6570} {"train_loss": -27.663990020751953, "global_step": 545365, "epoch": 6570} {"train_loss": -27.859848022460938, "global_step": 545366, "epoch": 6570} {"train_loss": -27.9311466217041, "global_step": 545367, "epoch": 6570} {"train_loss": -27.907445907592773, "global_step": 545368, "epoch": 6570} {"train_loss": -27.855321884155273, "global_step": 545369, "epoch": 6570} {"train_loss": -28.170852661132812, "global_step": 545370, "epoch": 6570} {"train_loss": -28.023229598999023, "global_step": 545371, "epoch": 6570} {"train_loss": -27.846038818359375, "global_step": 545372, "epoch": 6570} {"train_loss": -28.03607177734375, "global_step": 545373, "epoch": 6570} {"train_loss": -27.784086227416992, "global_step": 545374, "epoch": 6570} {"train_loss": -27.990985870361328, "global_step": 545375, "epoch": 6570} {"train_loss": -27.761402130126953, "global_step": 545376, "epoch": 6570} {"train_loss": -27.70562744140625, "global_step": 545377, "epoch": 6570} {"train_loss": -27.665576934814453, "global_step": 545378, "epoch": 6570} {"train_loss": -27.525632858276367, "global_step": 545379, "epoch": 6570} {"train_loss": -26.834430694580078, "global_step": 545380, "epoch": 6570} {"train_loss": -26.626251220703125, "global_step": 545381, "epoch": 6570} {"train_loss": -27.41398048400879, "global_step": 545382, "epoch": 6570} {"train_loss": -27.73760986328125, "global_step": 545383, "epoch": 6570} {"train_loss": -27.433124542236328, "global_step": 545384, "epoch": 6570} {"train_loss": -27.222736358642578, "global_step": 545385, "epoch": 6570} {"train_loss": -27.259016036987305, "global_step": 545386, "epoch": 6570} {"train_loss": -27.762420654296875, "global_step": 545387, "epoch": 6570} {"train_loss": -27.45102310180664, "global_step": 545388, "epoch": 6570} {"train_loss": -27.7327880859375, "global_step": 545389, "epoch": 6570} {"train_loss": -27.29522705078125, "global_step": 545390, "epoch": 6570} {"train_loss": -27.258758544921875, "global_step": 545391, "epoch": 6570} {"train_loss": -27.54428095989917, "global_step": 545392, "epoch": 6570, "val_loss": 6547236.0} {"train_loss": -24.54908561706543, "global_step": 545393, "epoch": 6571} {"train_loss": -23.549739837646484, "global_step": 545394, "epoch": 6571} {"train_loss": -26.3474178314209, "global_step": 545395, "epoch": 6571} {"train_loss": -25.775068283081055, "global_step": 545396, "epoch": 6571} {"train_loss": -25.803226470947266, "global_step": 545397, "epoch": 6571} {"train_loss": -26.425268173217773, "global_step": 545398, "epoch": 6571} {"train_loss": -24.613256454467773, "global_step": 545399, "epoch": 6571} {"train_loss": -26.732580184936523, "global_step": 545400, "epoch": 6571} {"train_loss": -26.033588409423828, "global_step": 545401, "epoch": 6571} {"train_loss": -26.530353546142578, "global_step": 545402, "epoch": 6571} {"train_loss": -26.797555923461914, "global_step": 545403, "epoch": 6571} {"train_loss": -27.050012588500977, "global_step": 545404, "epoch": 6571} {"train_loss": -26.66216468811035, "global_step": 545405, "epoch": 6571} {"train_loss": -27.063947677612305, "global_step": 545406, "epoch": 6571} {"train_loss": -26.97650718688965, "global_step": 545407, "epoch": 6571} {"train_loss": -27.01987648010254, "global_step": 545408, "epoch": 6571} {"train_loss": -26.93892478942871, "global_step": 545409, "epoch": 6571} {"train_loss": -26.46932029724121, "global_step": 545410, "epoch": 6571} {"train_loss": -27.41094970703125, "global_step": 545411, "epoch": 6571} {"train_loss": -27.274377822875977, "global_step": 545412, "epoch": 6571} {"train_loss": -26.782209396362305, "global_step": 545413, "epoch": 6571} {"train_loss": -27.165735244750977, "global_step": 545414, "epoch": 6571} {"train_loss": -27.066879272460938, "global_step": 545415, "epoch": 6571} {"train_loss": -27.445178985595703, "global_step": 545416, "epoch": 6571} {"train_loss": -27.29180335998535, "global_step": 545417, "epoch": 6571} {"train_loss": -27.226154327392578, "global_step": 545418, "epoch": 6571} {"train_loss": -27.433124542236328, "global_step": 545419, "epoch": 6571} {"train_loss": -27.4384765625, "global_step": 545420, "epoch": 6571} {"train_loss": -27.28628921508789, "global_step": 545421, "epoch": 6571} {"train_loss": -26.907123565673828, "global_step": 545422, "epoch": 6571} {"train_loss": -27.496295928955078, "global_step": 545423, "epoch": 6571} {"train_loss": -27.38728141784668, "global_step": 545424, "epoch": 6571} {"train_loss": -27.846023559570312, "global_step": 545425, "epoch": 6571} {"train_loss": -27.422388076782227, "global_step": 545426, "epoch": 6571} {"train_loss": -27.719018936157227, "global_step": 545427, "epoch": 6571} {"train_loss": -27.425207138061523, "global_step": 545428, "epoch": 6571} {"train_loss": -27.608484268188477, "global_step": 545429, "epoch": 6571} {"train_loss": -27.730010986328125, "global_step": 545430, "epoch": 6571} {"train_loss": -27.684839248657227, "global_step": 545431, "epoch": 6571} {"train_loss": -27.750946044921875, "global_step": 545432, "epoch": 6571} {"train_loss": -27.268524169921875, "global_step": 545433, "epoch": 6571} {"train_loss": -27.558218002319336, "global_step": 545434, "epoch": 6571} {"train_loss": -27.726285934448242, "global_step": 545435, "epoch": 6571} {"train_loss": -27.502613067626953, "global_step": 545436, "epoch": 6571} {"train_loss": -27.963092803955078, "global_step": 545437, "epoch": 6571} {"train_loss": -27.562591552734375, "global_step": 545438, "epoch": 6571} {"train_loss": -27.3723087310791, "global_step": 545439, "epoch": 6571} {"train_loss": -27.75312614440918, "global_step": 545440, "epoch": 6571} {"train_loss": -27.29694938659668, "global_step": 545441, "epoch": 6571} {"train_loss": -27.410993576049805, "global_step": 545442, "epoch": 6571} {"train_loss": -27.444263458251953, "global_step": 545443, "epoch": 6571} {"train_loss": -27.52487564086914, "global_step": 545444, "epoch": 6571} {"train_loss": -27.648746490478516, "global_step": 545445, "epoch": 6571} {"train_loss": -27.735931396484375, "global_step": 545446, "epoch": 6571} {"train_loss": -27.23602867126465, "global_step": 545447, "epoch": 6571} {"train_loss": -27.73036003112793, "global_step": 545448, "epoch": 6571} {"train_loss": -27.706085205078125, "global_step": 545449, "epoch": 6571} {"train_loss": -27.68406105041504, "global_step": 545450, "epoch": 6571} {"train_loss": -27.661306381225586, "global_step": 545451, "epoch": 6571} {"train_loss": -27.624658584594727, "global_step": 545452, "epoch": 6571} {"train_loss": -27.540063858032227, "global_step": 545453, "epoch": 6571} {"train_loss": -27.5747013092041, "global_step": 545454, "epoch": 6571} {"train_loss": -27.534605026245117, "global_step": 545455, "epoch": 6571} {"train_loss": -27.737817764282227, "global_step": 545456, "epoch": 6571} {"train_loss": -27.730146408081055, "global_step": 545457, "epoch": 6571} {"train_loss": -27.59516716003418, "global_step": 545458, "epoch": 6571} {"train_loss": -27.576154708862305, "global_step": 545459, "epoch": 6571} {"train_loss": -27.399505615234375, "global_step": 545460, "epoch": 6571} {"train_loss": -27.567663192749023, "global_step": 545461, "epoch": 6571} {"train_loss": -27.706953048706055, "global_step": 545462, "epoch": 6571} {"train_loss": -27.576995849609375, "global_step": 545463, "epoch": 6571} {"train_loss": -27.541187286376953, "global_step": 545464, "epoch": 6571} {"train_loss": -27.611957550048828, "global_step": 545465, "epoch": 6571} {"train_loss": -27.602476119995117, "global_step": 545466, "epoch": 6571} {"train_loss": -27.894575119018555, "global_step": 545467, "epoch": 6571} {"train_loss": -27.714466094970703, "global_step": 545468, "epoch": 6571} {"train_loss": -27.943729400634766, "global_step": 545469, "epoch": 6571} {"train_loss": -27.86053466796875, "global_step": 545470, "epoch": 6571} {"train_loss": -27.432504653930664, "global_step": 545471, "epoch": 6571} {"train_loss": -27.66888427734375, "global_step": 545472, "epoch": 6571} {"train_loss": -27.607885360717773, "global_step": 545473, "epoch": 6571} {"train_loss": -27.829748153686523, "global_step": 545474, "epoch": 6571} {"train_loss": -27.252291208290192, "global_step": 545475, "epoch": 6571, "val_loss": 6616561.0} {"train_loss": -26.899215698242188, "global_step": 545476, "epoch": 6572} {"train_loss": -26.78865623474121, "global_step": 545477, "epoch": 6572} {"train_loss": -26.63148307800293, "global_step": 545478, "epoch": 6572} {"train_loss": -26.8505916595459, "global_step": 545479, "epoch": 6572} {"train_loss": -27.225305557250977, "global_step": 545480, "epoch": 6572} {"train_loss": -26.615570068359375, "global_step": 545481, "epoch": 6572} {"train_loss": -27.119266510009766, "global_step": 545482, "epoch": 6572} {"train_loss": -27.403573989868164, "global_step": 545483, "epoch": 6572} {"train_loss": -27.15081787109375, "global_step": 545484, "epoch": 6572} {"train_loss": -26.966245651245117, "global_step": 545485, "epoch": 6572} {"train_loss": -27.54056167602539, "global_step": 545486, "epoch": 6572} {"train_loss": -27.33334732055664, "global_step": 545487, "epoch": 6572} {"train_loss": -27.111713409423828, "global_step": 545488, "epoch": 6572} {"train_loss": -27.388132095336914, "global_step": 545489, "epoch": 6572} {"train_loss": -27.640790939331055, "global_step": 545490, "epoch": 6572} {"train_loss": -27.131567001342773, "global_step": 545491, "epoch": 6572} {"train_loss": -27.37696647644043, "global_step": 545492, "epoch": 6572} {"train_loss": -27.45684814453125, "global_step": 545493, "epoch": 6572} {"train_loss": -26.97950553894043, "global_step": 545494, "epoch": 6572} {"train_loss": -27.505460739135742, "global_step": 545495, "epoch": 6572} {"train_loss": -27.22515869140625, "global_step": 545496, "epoch": 6572} {"train_loss": -27.358753204345703, "global_step": 545497, "epoch": 6572} {"train_loss": -27.32370948791504, "global_step": 545498, "epoch": 6572} {"train_loss": -27.422901153564453, "global_step": 545499, "epoch": 6572} {"train_loss": -27.445575714111328, "global_step": 545500, "epoch": 6572} {"train_loss": -27.70761489868164, "global_step": 545501, "epoch": 6572} {"train_loss": -27.332189559936523, "global_step": 545502, "epoch": 6572} {"train_loss": -27.657428741455078, "global_step": 545503, "epoch": 6572} {"train_loss": -27.535480499267578, "global_step": 545504, "epoch": 6572} {"train_loss": -27.71644401550293, "global_step": 545505, "epoch": 6572} {"train_loss": -27.532949447631836, "global_step": 545506, "epoch": 6572} {"train_loss": -27.86708641052246, "global_step": 545507, "epoch": 6572} {"train_loss": -27.340600967407227, "global_step": 545508, "epoch": 6572} {"train_loss": -27.431203842163086, "global_step": 545509, "epoch": 6572} {"train_loss": -27.775312423706055, "global_step": 545510, "epoch": 6572} {"train_loss": -28.079498291015625, "global_step": 545511, "epoch": 6572} {"train_loss": -27.8795166015625, "global_step": 545512, "epoch": 6572} {"train_loss": -27.89350700378418, "global_step": 545513, "epoch": 6572} {"train_loss": -27.330530166625977, "global_step": 545514, "epoch": 6572} {"train_loss": -27.534652709960938, "global_step": 545515, "epoch": 6572} {"train_loss": -27.857574462890625, "global_step": 545516, "epoch": 6572} {"train_loss": -27.806241989135742, "global_step": 545517, "epoch": 6572} {"train_loss": -27.79278564453125, "global_step": 545518, "epoch": 6572} {"train_loss": -27.847326278686523, "global_step": 545519, "epoch": 6572} {"train_loss": -27.877939224243164, "global_step": 545520, "epoch": 6572} {"train_loss": -28.16883659362793, "global_step": 545521, "epoch": 6572} {"train_loss": -27.587228775024414, "global_step": 545522, "epoch": 6572} {"train_loss": -27.57476234436035, "global_step": 545523, "epoch": 6572} {"train_loss": -28.061145782470703, "global_step": 545524, "epoch": 6572} {"train_loss": -27.59925651550293, "global_step": 545525, "epoch": 6572} {"train_loss": -27.94099235534668, "global_step": 545526, "epoch": 6572} {"train_loss": -28.109350204467773, "global_step": 545527, "epoch": 6572} {"train_loss": -27.627918243408203, "global_step": 545528, "epoch": 6572} {"train_loss": -27.507333755493164, "global_step": 545529, "epoch": 6572} {"train_loss": -27.7365779876709, "global_step": 545530, "epoch": 6572} {"train_loss": -27.471960067749023, "global_step": 545531, "epoch": 6572} {"train_loss": -27.795074462890625, "global_step": 545532, "epoch": 6572} {"train_loss": -27.388778686523438, "global_step": 545533, "epoch": 6572} {"train_loss": -27.46013832092285, "global_step": 545534, "epoch": 6572} {"train_loss": -28.01508903503418, "global_step": 545535, "epoch": 6572} {"train_loss": -27.73154067993164, "global_step": 545536, "epoch": 6572} {"train_loss": -27.579572677612305, "global_step": 545537, "epoch": 6572} {"train_loss": -27.815786361694336, "global_step": 545538, "epoch": 6572} {"train_loss": -27.72968864440918, "global_step": 545539, "epoch": 6572} {"train_loss": -27.35822105407715, "global_step": 545540, "epoch": 6572} {"train_loss": -27.9276180267334, "global_step": 545541, "epoch": 6572} {"train_loss": -28.02255630493164, "global_step": 545542, "epoch": 6572} {"train_loss": -27.384078979492188, "global_step": 545543, "epoch": 6572} {"train_loss": -27.746896743774414, "global_step": 545544, "epoch": 6572} {"train_loss": -28.18897819519043, "global_step": 545545, "epoch": 6572} {"train_loss": -27.676706314086914, "global_step": 545546, "epoch": 6572} {"train_loss": -27.595762252807617, "global_step": 545547, "epoch": 6572} {"train_loss": -28.014114379882812, "global_step": 545548, "epoch": 6572} {"train_loss": -27.680200576782227, "global_step": 545549, "epoch": 6572} {"train_loss": -27.69544792175293, "global_step": 545550, "epoch": 6572} {"train_loss": -27.682600021362305, "global_step": 545551, "epoch": 6572} {"train_loss": -27.971160888671875, "global_step": 545552, "epoch": 6572} {"train_loss": -28.184955596923828, "global_step": 545553, "epoch": 6572} {"train_loss": -27.866418838500977, "global_step": 545554, "epoch": 6572} {"train_loss": -27.63238525390625, "global_step": 545555, "epoch": 6572} {"train_loss": -27.72834587097168, "global_step": 545556, "epoch": 6572} {"train_loss": -27.804956436157227, "global_step": 545557, "epoch": 6572} {"train_loss": -27.57125077764672, "global_step": 545558, "epoch": 6572, "val_loss": 6598307.0} {"train_loss": -27.36659812927246, "global_step": 545559, "epoch": 6573} {"train_loss": -27.288496017456055, "global_step": 545560, "epoch": 6573} {"train_loss": -27.16963768005371, "global_step": 545561, "epoch": 6573} {"train_loss": -27.25921630859375, "global_step": 545562, "epoch": 6573} {"train_loss": -27.531293869018555, "global_step": 545563, "epoch": 6573} {"train_loss": -27.13083839416504, "global_step": 545564, "epoch": 6573} {"train_loss": -27.299488067626953, "global_step": 545565, "epoch": 6573} {"train_loss": -27.195663452148438, "global_step": 545566, "epoch": 6573} {"train_loss": -27.42636489868164, "global_step": 545567, "epoch": 6573} {"train_loss": -27.3262939453125, "global_step": 545568, "epoch": 6573} {"train_loss": -27.206756591796875, "global_step": 545569, "epoch": 6573} {"train_loss": -27.415674209594727, "global_step": 545570, "epoch": 6573} {"train_loss": -27.224899291992188, "global_step": 545571, "epoch": 6573} {"train_loss": -27.041004180908203, "global_step": 545572, "epoch": 6573} {"train_loss": -26.990009307861328, "global_step": 545573, "epoch": 6573} {"train_loss": -27.205408096313477, "global_step": 545574, "epoch": 6573} {"train_loss": -27.50465202331543, "global_step": 545575, "epoch": 6573} {"train_loss": -27.4332332611084, "global_step": 545576, "epoch": 6573} {"train_loss": -27.099878311157227, "global_step": 545577, "epoch": 6573} {"train_loss": -27.59018325805664, "global_step": 545578, "epoch": 6573} {"train_loss": -27.704050064086914, "global_step": 545579, "epoch": 6573} {"train_loss": -27.36294937133789, "global_step": 545580, "epoch": 6573} {"train_loss": -27.6769962310791, "global_step": 545581, "epoch": 6573} {"train_loss": -27.19684410095215, "global_step": 545582, "epoch": 6573} {"train_loss": -27.163557052612305, "global_step": 545583, "epoch": 6573} {"train_loss": -27.778234481811523, "global_step": 545584, "epoch": 6573} {"train_loss": -27.5517578125, "global_step": 545585, "epoch": 6573} {"train_loss": -27.586822509765625, "global_step": 545586, "epoch": 6573} {"train_loss": -27.721420288085938, "global_step": 545587, "epoch": 6573} {"train_loss": -27.354333877563477, "global_step": 545588, "epoch": 6573} {"train_loss": -27.248804092407227, "global_step": 545589, "epoch": 6573} {"train_loss": -27.745080947875977, "global_step": 545590, "epoch": 6573} {"train_loss": -27.62489128112793, "global_step": 545591, "epoch": 6573} {"train_loss": -27.979551315307617, "global_step": 545592, "epoch": 6573} {"train_loss": -27.83785057067871, "global_step": 545593, "epoch": 6573} {"train_loss": -27.724096298217773, "global_step": 545594, "epoch": 6573} {"train_loss": -27.900922775268555, "global_step": 545595, "epoch": 6573} {"train_loss": -27.97562599182129, "global_step": 545596, "epoch": 6573} {"train_loss": -27.61203384399414, "global_step": 545597, "epoch": 6573} {"train_loss": -27.710290908813477, "global_step": 545598, "epoch": 6573} {"train_loss": -27.635828018188477, "global_step": 545599, "epoch": 6573} {"train_loss": -27.58028221130371, "global_step": 545600, "epoch": 6573} {"train_loss": -27.72515296936035, "global_step": 545601, "epoch": 6573} {"train_loss": -27.755334854125977, "global_step": 545602, "epoch": 6573} {"train_loss": -28.00595474243164, "global_step": 545603, "epoch": 6573} {"train_loss": -27.987018585205078, "global_step": 545604, "epoch": 6573} {"train_loss": -28.207386016845703, "global_step": 545605, "epoch": 6573} {"train_loss": -27.85614585876465, "global_step": 545606, "epoch": 6573} {"train_loss": -27.569660186767578, "global_step": 545607, "epoch": 6573} {"train_loss": -27.817413330078125, "global_step": 545608, "epoch": 6573} {"train_loss": -27.77573585510254, "global_step": 545609, "epoch": 6573} {"train_loss": -28.095914840698242, "global_step": 545610, "epoch": 6573} {"train_loss": -28.11578369140625, "global_step": 545611, "epoch": 6573} {"train_loss": -28.084604263305664, "global_step": 545612, "epoch": 6573} {"train_loss": -28.203588485717773, "global_step": 545613, "epoch": 6573} {"train_loss": -28.021329879760742, "global_step": 545614, "epoch": 6573} {"train_loss": -27.99930763244629, "global_step": 545615, "epoch": 6573} {"train_loss": -28.261823654174805, "global_step": 545616, "epoch": 6573} {"train_loss": -28.22784996032715, "global_step": 545617, "epoch": 6573} {"train_loss": -27.7061710357666, "global_step": 545618, "epoch": 6573} {"train_loss": -27.694091796875, "global_step": 545619, "epoch": 6573} {"train_loss": -27.401899337768555, "global_step": 545620, "epoch": 6573} {"train_loss": -27.92664909362793, "global_step": 545621, "epoch": 6573} {"train_loss": -28.087377548217773, "global_step": 545622, "epoch": 6573} {"train_loss": -27.97284507751465, "global_step": 545623, "epoch": 6573} {"train_loss": -27.76727867126465, "global_step": 545624, "epoch": 6573} {"train_loss": -27.47113609313965, "global_step": 545625, "epoch": 6573} {"train_loss": -27.513410568237305, "global_step": 545626, "epoch": 6573} {"train_loss": -27.27362060546875, "global_step": 545627, "epoch": 6573} {"train_loss": -27.545642852783203, "global_step": 545628, "epoch": 6573} {"train_loss": -26.95926856994629, "global_step": 545629, "epoch": 6573} {"train_loss": -26.85493278503418, "global_step": 545630, "epoch": 6573} {"train_loss": -26.67822265625, "global_step": 545631, "epoch": 6573} {"train_loss": -26.435714721679688, "global_step": 545632, "epoch": 6573} {"train_loss": -27.064624786376953, "global_step": 545633, "epoch": 6573} {"train_loss": -27.61568260192871, "global_step": 545634, "epoch": 6573} {"train_loss": -27.356998443603516, "global_step": 545635, "epoch": 6573} {"train_loss": -27.227508544921875, "global_step": 545636, "epoch": 6573} {"train_loss": -27.312103271484375, "global_step": 545637, "epoch": 6573} {"train_loss": -27.834325790405273, "global_step": 545638, "epoch": 6573} {"train_loss": -27.518875122070312, "global_step": 545639, "epoch": 6573} {"train_loss": -27.640167236328125, "global_step": 545640, "epoch": 6573} {"train_loss": -27.573359064308995, "global_step": 545641, "epoch": 6573, "val_loss": 6632048.0} {"train_loss": -27.028501510620117, "global_step": 545642, "epoch": 6574} {"train_loss": -27.269819259643555, "global_step": 545643, "epoch": 6574} {"train_loss": -27.282934188842773, "global_step": 545644, "epoch": 6574} {"train_loss": -27.133764266967773, "global_step": 545645, "epoch": 6574} {"train_loss": -27.009418487548828, "global_step": 545646, "epoch": 6574} {"train_loss": -27.76340103149414, "global_step": 545647, "epoch": 6574} {"train_loss": -26.95611000061035, "global_step": 545648, "epoch": 6574} {"train_loss": -27.20588493347168, "global_step": 545649, "epoch": 6574} {"train_loss": -27.11859130859375, "global_step": 545650, "epoch": 6574} {"train_loss": -26.961755752563477, "global_step": 545651, "epoch": 6574} {"train_loss": -27.05215835571289, "global_step": 545652, "epoch": 6574} {"train_loss": -27.2281436920166, "global_step": 545653, "epoch": 6574} {"train_loss": -27.31363296508789, "global_step": 545654, "epoch": 6574} {"train_loss": -27.180225372314453, "global_step": 545655, "epoch": 6574} {"train_loss": -27.37689208984375, "global_step": 545656, "epoch": 6574} {"train_loss": -27.6044921875, "global_step": 545657, "epoch": 6574} {"train_loss": -27.617521286010742, "global_step": 545658, "epoch": 6574} {"train_loss": -27.176828384399414, "global_step": 545659, "epoch": 6574} {"train_loss": -27.1546688079834, "global_step": 545660, "epoch": 6574} {"train_loss": -27.404844284057617, "global_step": 545661, "epoch": 6574} {"train_loss": -27.738874435424805, "global_step": 545662, "epoch": 6574} {"train_loss": -27.666431427001953, "global_step": 545663, "epoch": 6574} {"train_loss": -27.5828800201416, "global_step": 545664, "epoch": 6574} {"train_loss": -27.518091201782227, "global_step": 545665, "epoch": 6574} {"train_loss": -27.586090087890625, "global_step": 545666, "epoch": 6574} {"train_loss": -27.367589950561523, "global_step": 545667, "epoch": 6574} {"train_loss": -27.75040626525879, "global_step": 545668, "epoch": 6574} {"train_loss": -28.108057022094727, "global_step": 545669, "epoch": 6574} {"train_loss": -27.5184268951416, "global_step": 545670, "epoch": 6574} {"train_loss": -27.72368812561035, "global_step": 545671, "epoch": 6574} {"train_loss": -27.558181762695312, "global_step": 545672, "epoch": 6574} {"train_loss": -27.73712730407715, "global_step": 545673, "epoch": 6574} {"train_loss": -27.680774688720703, "global_step": 545674, "epoch": 6574} {"train_loss": -27.718463897705078, "global_step": 545675, "epoch": 6574} {"train_loss": -27.900699615478516, "global_step": 545676, "epoch": 6574} {"train_loss": -27.846912384033203, "global_step": 545677, "epoch": 6574} {"train_loss": -27.9188232421875, "global_step": 545678, "epoch": 6574} {"train_loss": -27.680856704711914, "global_step": 545679, "epoch": 6574} {"train_loss": -27.791397094726562, "global_step": 545680, "epoch": 6574} {"train_loss": -27.645771026611328, "global_step": 545681, "epoch": 6574} {"train_loss": -27.66448974609375, "global_step": 545682, "epoch": 6574} {"train_loss": -27.91932487487793, "global_step": 545683, "epoch": 6574} {"train_loss": -28.077178955078125, "global_step": 545684, "epoch": 6574} {"train_loss": -28.143728256225586, "global_step": 545685, "epoch": 6574} {"train_loss": -28.1627140045166, "global_step": 545686, "epoch": 6574} {"train_loss": -27.932287216186523, "global_step": 545687, "epoch": 6574} {"train_loss": -27.422210693359375, "global_step": 545688, "epoch": 6574} {"train_loss": -28.004962921142578, "global_step": 545689, "epoch": 6574} {"train_loss": -28.11464500427246, "global_step": 545690, "epoch": 6574} {"train_loss": -27.8182373046875, "global_step": 545691, "epoch": 6574} {"train_loss": -27.605932235717773, "global_step": 545692, "epoch": 6574} {"train_loss": -28.021209716796875, "global_step": 545693, "epoch": 6574} {"train_loss": -27.679718017578125, "global_step": 545694, "epoch": 6574} {"train_loss": -27.634729385375977, "global_step": 545695, "epoch": 6574} {"train_loss": -28.190839767456055, "global_step": 545696, "epoch": 6574} {"train_loss": -27.763080596923828, "global_step": 545697, "epoch": 6574} {"train_loss": -27.54770851135254, "global_step": 545698, "epoch": 6574} {"train_loss": -27.8090763092041, "global_step": 545699, "epoch": 6574} {"train_loss": -27.172561645507812, "global_step": 545700, "epoch": 6574} {"train_loss": -27.408567428588867, "global_step": 545701, "epoch": 6574} {"train_loss": -27.581104278564453, "global_step": 545702, "epoch": 6574} {"train_loss": -27.327198028564453, "global_step": 545703, "epoch": 6574} {"train_loss": -27.404010772705078, "global_step": 545704, "epoch": 6574} {"train_loss": -27.06267738342285, "global_step": 545705, "epoch": 6574} {"train_loss": -27.47100257873535, "global_step": 545706, "epoch": 6574} {"train_loss": -27.47627067565918, "global_step": 545707, "epoch": 6574} {"train_loss": -27.279682159423828, "global_step": 545708, "epoch": 6574} {"train_loss": -27.526859283447266, "global_step": 545709, "epoch": 6574} {"train_loss": -27.395368576049805, "global_step": 545710, "epoch": 6574} {"train_loss": -27.226255416870117, "global_step": 545711, "epoch": 6574} {"train_loss": -27.77545166015625, "global_step": 545712, "epoch": 6574} {"train_loss": -27.712209701538086, "global_step": 545713, "epoch": 6574} {"train_loss": -27.420013427734375, "global_step": 545714, "epoch": 6574} {"train_loss": -27.114871978759766, "global_step": 545715, "epoch": 6574} {"train_loss": -27.9152889251709, "global_step": 545716, "epoch": 6574} {"train_loss": -27.737518310546875, "global_step": 545717, "epoch": 6574} {"train_loss": -27.790136337280273, "global_step": 545718, "epoch": 6574} {"train_loss": -27.656524658203125, "global_step": 545719, "epoch": 6574} {"train_loss": -27.89215087890625, "global_step": 545720, "epoch": 6574} {"train_loss": -27.938278198242188, "global_step": 545721, "epoch": 6574} {"train_loss": -27.699560165405273, "global_step": 545722, "epoch": 6574} {"train_loss": -27.909046173095703, "global_step": 545723, "epoch": 6574} {"train_loss": -27.59585070322795, "global_step": 545724, "epoch": 6574, "val_loss": 6619444.0} {"train_loss": -27.043537139892578, "global_step": 545725, "epoch": 6575} {"train_loss": -26.97369956970215, "global_step": 545726, "epoch": 6575} {"train_loss": -27.058502197265625, "global_step": 545727, "epoch": 6575} {"train_loss": -26.925912857055664, "global_step": 545728, "epoch": 6575} {"train_loss": -26.841665267944336, "global_step": 545729, "epoch": 6575} {"train_loss": -27.11591148376465, "global_step": 545730, "epoch": 6575} {"train_loss": -27.0367431640625, "global_step": 545731, "epoch": 6575} {"train_loss": -26.690704345703125, "global_step": 545732, "epoch": 6575} {"train_loss": -27.097442626953125, "global_step": 545733, "epoch": 6575} {"train_loss": -27.185449600219727, "global_step": 545734, "epoch": 6575} {"train_loss": -27.191822052001953, "global_step": 545735, "epoch": 6575} {"train_loss": -27.56467056274414, "global_step": 545736, "epoch": 6575} {"train_loss": -27.172266006469727, "global_step": 545737, "epoch": 6575} {"train_loss": -27.1437931060791, "global_step": 545738, "epoch": 6575} {"train_loss": -27.264862060546875, "global_step": 545739, "epoch": 6575} {"train_loss": -27.397235870361328, "global_step": 545740, "epoch": 6575} {"train_loss": -27.31329917907715, "global_step": 545741, "epoch": 6575} {"train_loss": -27.513940811157227, "global_step": 545742, "epoch": 6575} {"train_loss": -27.74940299987793, "global_step": 545743, "epoch": 6575} {"train_loss": -27.46990966796875, "global_step": 545744, "epoch": 6575} {"train_loss": -27.723602294921875, "global_step": 545745, "epoch": 6575} {"train_loss": -27.1429500579834, "global_step": 545746, "epoch": 6575} {"train_loss": -27.46564292907715, "global_step": 545747, "epoch": 6575} {"train_loss": -27.253767013549805, "global_step": 545748, "epoch": 6575} {"train_loss": -27.299972534179688, "global_step": 545749, "epoch": 6575} {"train_loss": -27.359350204467773, "global_step": 545750, "epoch": 6575} {"train_loss": -27.937570571899414, "global_step": 545751, "epoch": 6575} {"train_loss": -27.680830001831055, "global_step": 545752, "epoch": 6575} {"train_loss": -27.77601432800293, "global_step": 545753, "epoch": 6575} {"train_loss": -27.508947372436523, "global_step": 545754, "epoch": 6575} {"train_loss": -27.86099624633789, "global_step": 545755, "epoch": 6575} {"train_loss": -27.513599395751953, "global_step": 545756, "epoch": 6575} {"train_loss": -27.503686904907227, "global_step": 545757, "epoch": 6575} {"train_loss": -27.334980010986328, "global_step": 545758, "epoch": 6575} {"train_loss": -27.701385498046875, "global_step": 545759, "epoch": 6575} {"train_loss": -27.45292091369629, "global_step": 545760, "epoch": 6575} {"train_loss": -27.457550048828125, "global_step": 545761, "epoch": 6575} {"train_loss": -27.667938232421875, "global_step": 545762, "epoch": 6575} {"train_loss": -27.907331466674805, "global_step": 545763, "epoch": 6575} {"train_loss": -27.956327438354492, "global_step": 545764, "epoch": 6575} {"train_loss": -27.81357192993164, "global_step": 545765, "epoch": 6575} {"train_loss": -27.710657119750977, "global_step": 545766, "epoch": 6575} {"train_loss": -27.832782745361328, "global_step": 545767, "epoch": 6575} {"train_loss": -28.10955810546875, "global_step": 545768, "epoch": 6575} {"train_loss": -27.814926147460938, "global_step": 545769, "epoch": 6575} {"train_loss": -28.053937911987305, "global_step": 545770, "epoch": 6575} {"train_loss": -27.941370010375977, "global_step": 545771, "epoch": 6575} {"train_loss": -27.462182998657227, "global_step": 545772, "epoch": 6575} {"train_loss": -27.7944393157959, "global_step": 545773, "epoch": 6575} {"train_loss": -28.053186416625977, "global_step": 545774, "epoch": 6575} {"train_loss": -27.64798927307129, "global_step": 545775, "epoch": 6575} {"train_loss": -28.224451065063477, "global_step": 545776, "epoch": 6575} {"train_loss": -27.889429092407227, "global_step": 545777, "epoch": 6575} {"train_loss": -27.799779891967773, "global_step": 545778, "epoch": 6575} {"train_loss": -27.62823486328125, "global_step": 545779, "epoch": 6575} {"train_loss": -27.665084838867188, "global_step": 545780, "epoch": 6575} {"train_loss": -27.870670318603516, "global_step": 545781, "epoch": 6575} {"train_loss": -27.895856857299805, "global_step": 545782, "epoch": 6575} {"train_loss": -27.54681396484375, "global_step": 545783, "epoch": 6575} {"train_loss": -27.77899169921875, "global_step": 545784, "epoch": 6575} {"train_loss": -28.11323356628418, "global_step": 545785, "epoch": 6575} {"train_loss": -28.179630279541016, "global_step": 545786, "epoch": 6575} {"train_loss": -27.57990074157715, "global_step": 545787, "epoch": 6575} {"train_loss": -27.57147216796875, "global_step": 545788, "epoch": 6575} {"train_loss": -27.920690536499023, "global_step": 545789, "epoch": 6575} {"train_loss": -27.782922744750977, "global_step": 545790, "epoch": 6575} {"train_loss": -27.943883895874023, "global_step": 545791, "epoch": 6575} {"train_loss": -27.860187530517578, "global_step": 545792, "epoch": 6575} {"train_loss": -27.754016876220703, "global_step": 545793, "epoch": 6575} {"train_loss": -27.58613395690918, "global_step": 545794, "epoch": 6575} {"train_loss": -27.618188858032227, "global_step": 545795, "epoch": 6575} {"train_loss": -27.417524337768555, "global_step": 545796, "epoch": 6575} {"train_loss": -27.48394203186035, "global_step": 545797, "epoch": 6575} {"train_loss": -27.551977157592773, "global_step": 545798, "epoch": 6575} {"train_loss": -27.998579025268555, "global_step": 545799, "epoch": 6575} {"train_loss": -27.657733917236328, "global_step": 545800, "epoch": 6575} {"train_loss": -26.963708877563477, "global_step": 545801, "epoch": 6575} {"train_loss": -26.6012020111084, "global_step": 545802, "epoch": 6575} {"train_loss": -27.566736221313477, "global_step": 545803, "epoch": 6575} {"train_loss": -27.442541122436523, "global_step": 545804, "epoch": 6575} {"train_loss": -27.11970329284668, "global_step": 545805, "epoch": 6575} {"train_loss": -27.508636474609375, "global_step": 545806, "epoch": 6575} {"train_loss": -27.53872866802905, "global_step": 545807, "epoch": 6575, "val_loss": 6465136.0} {"train_loss": -25.284854888916016, "global_step": 545808, "epoch": 6576} {"train_loss": -25.71857261657715, "global_step": 545809, "epoch": 6576} {"train_loss": -26.37092399597168, "global_step": 545810, "epoch": 6576} {"train_loss": -25.649642944335938, "global_step": 545811, "epoch": 6576} {"train_loss": -26.367847442626953, "global_step": 545812, "epoch": 6576} {"train_loss": -26.07808494567871, "global_step": 545813, "epoch": 6576} {"train_loss": -26.632184982299805, "global_step": 545814, "epoch": 6576} {"train_loss": -26.981067657470703, "global_step": 545815, "epoch": 6576} {"train_loss": -27.228412628173828, "global_step": 545816, "epoch": 6576} {"train_loss": -26.895832061767578, "global_step": 545817, "epoch": 6576} {"train_loss": -26.971235275268555, "global_step": 545818, "epoch": 6576} {"train_loss": -26.955204010009766, "global_step": 545819, "epoch": 6576} {"train_loss": -26.996875762939453, "global_step": 545820, "epoch": 6576} {"train_loss": -26.9953670501709, "global_step": 545821, "epoch": 6576} {"train_loss": -27.065799713134766, "global_step": 545822, "epoch": 6576} {"train_loss": -26.95963478088379, "global_step": 545823, "epoch": 6576} {"train_loss": -26.998456954956055, "global_step": 545824, "epoch": 6576} {"train_loss": -27.567792892456055, "global_step": 545825, "epoch": 6576} {"train_loss": -27.073652267456055, "global_step": 545826, "epoch": 6576} {"train_loss": -27.586105346679688, "global_step": 545827, "epoch": 6576} {"train_loss": -27.10157585144043, "global_step": 545828, "epoch": 6576} {"train_loss": -27.000629425048828, "global_step": 545829, "epoch": 6576} {"train_loss": -27.221240997314453, "global_step": 545830, "epoch": 6576} {"train_loss": -27.25201416015625, "global_step": 545831, "epoch": 6576} {"train_loss": -27.15073585510254, "global_step": 545832, "epoch": 6576} {"train_loss": -27.430438995361328, "global_step": 545833, "epoch": 6576} {"train_loss": -27.502553939819336, "global_step": 545834, "epoch": 6576} {"train_loss": -27.754941940307617, "global_step": 545835, "epoch": 6576} {"train_loss": -27.7391300201416, "global_step": 545836, "epoch": 6576} {"train_loss": -27.61305809020996, "global_step": 545837, "epoch": 6576} {"train_loss": -27.546295166015625, "global_step": 545838, "epoch": 6576} {"train_loss": -27.47809410095215, "global_step": 545839, "epoch": 6576} {"train_loss": -27.769006729125977, "global_step": 545840, "epoch": 6576} {"train_loss": -27.560443878173828, "global_step": 545841, "epoch": 6576} {"train_loss": -27.422475814819336, "global_step": 545842, "epoch": 6576} {"train_loss": -27.6780948638916, "global_step": 545843, "epoch": 6576} {"train_loss": -27.712158203125, "global_step": 545844, "epoch": 6576} {"train_loss": -28.054401397705078, "global_step": 545845, "epoch": 6576} {"train_loss": -27.67059898376465, "global_step": 545846, "epoch": 6576} {"train_loss": -27.801849365234375, "global_step": 545847, "epoch": 6576} {"train_loss": -27.42275047302246, "global_step": 545848, "epoch": 6576} {"train_loss": -27.806522369384766, "global_step": 545849, "epoch": 6576} {"train_loss": -27.817060470581055, "global_step": 545850, "epoch": 6576} {"train_loss": -27.91046142578125, "global_step": 545851, "epoch": 6576} {"train_loss": -27.483457565307617, "global_step": 545852, "epoch": 6576} {"train_loss": -27.743406295776367, "global_step": 545853, "epoch": 6576} {"train_loss": -27.9976806640625, "global_step": 545854, "epoch": 6576} {"train_loss": -27.876386642456055, "global_step": 545855, "epoch": 6576} {"train_loss": -27.807714462280273, "global_step": 545856, "epoch": 6576} {"train_loss": -27.72361183166504, "global_step": 545857, "epoch": 6576} {"train_loss": -27.71150016784668, "global_step": 545858, "epoch": 6576} {"train_loss": -28.140369415283203, "global_step": 545859, "epoch": 6576} {"train_loss": -28.19028663635254, "global_step": 545860, "epoch": 6576} {"train_loss": -27.991479873657227, "global_step": 545861, "epoch": 6576} {"train_loss": -27.689794540405273, "global_step": 545862, "epoch": 6576} {"train_loss": -27.754058837890625, "global_step": 545863, "epoch": 6576} {"train_loss": -27.67536735534668, "global_step": 545864, "epoch": 6576} {"train_loss": -27.572179794311523, "global_step": 545865, "epoch": 6576} {"train_loss": -27.975040435791016, "global_step": 545866, "epoch": 6576} {"train_loss": -27.920490264892578, "global_step": 545867, "epoch": 6576} {"train_loss": -28.139942169189453, "global_step": 545868, "epoch": 6576} {"train_loss": -27.92270278930664, "global_step": 545869, "epoch": 6576} {"train_loss": -28.167097091674805, "global_step": 545870, "epoch": 6576} {"train_loss": -27.801435470581055, "global_step": 545871, "epoch": 6576} {"train_loss": -28.2103214263916, "global_step": 545872, "epoch": 6576} {"train_loss": -27.6007137298584, "global_step": 545873, "epoch": 6576} {"train_loss": -27.845544815063477, "global_step": 545874, "epoch": 6576} {"train_loss": -27.80428123474121, "global_step": 545875, "epoch": 6576} {"train_loss": -27.606952667236328, "global_step": 545876, "epoch": 6576} {"train_loss": -27.620336532592773, "global_step": 545877, "epoch": 6576} {"train_loss": -27.9959659576416, "global_step": 545878, "epoch": 6576} {"train_loss": -28.071542739868164, "global_step": 545879, "epoch": 6576} {"train_loss": -27.67339515686035, "global_step": 545880, "epoch": 6576} {"train_loss": -27.55045509338379, "global_step": 545881, "epoch": 6576} {"train_loss": -27.594873428344727, "global_step": 545882, "epoch": 6576} {"train_loss": -27.7415828704834, "global_step": 545883, "epoch": 6576} {"train_loss": -27.837472915649414, "global_step": 545884, "epoch": 6576} {"train_loss": -27.433469772338867, "global_step": 545885, "epoch": 6576} {"train_loss": -27.5484676361084, "global_step": 545886, "epoch": 6576} {"train_loss": -27.697900772094727, "global_step": 545887, "epoch": 6576} {"train_loss": -27.61577796936035, "global_step": 545888, "epoch": 6576} {"train_loss": -27.268972396850586, "global_step": 545889, "epoch": 6576} {"train_loss": -27.469801431678864, "global_step": 545890, "epoch": 6576, "val_loss": 6594801.0} {"train_loss": -24.991147994995117, "global_step": 545891, "epoch": 6577} {"train_loss": -24.04066276550293, "global_step": 545892, "epoch": 6577} {"train_loss": -25.15362548828125, "global_step": 545893, "epoch": 6577} {"train_loss": -26.336395263671875, "global_step": 545894, "epoch": 6577} {"train_loss": -26.359588623046875, "global_step": 545895, "epoch": 6577} {"train_loss": -26.524707794189453, "global_step": 545896, "epoch": 6577} {"train_loss": -26.604379653930664, "global_step": 545897, "epoch": 6577} {"train_loss": -26.867307662963867, "global_step": 545898, "epoch": 6577} {"train_loss": -26.87098503112793, "global_step": 545899, "epoch": 6577} {"train_loss": -27.300495147705078, "global_step": 545900, "epoch": 6577} {"train_loss": -27.1064510345459, "global_step": 545901, "epoch": 6577} {"train_loss": -26.936878204345703, "global_step": 545902, "epoch": 6577} {"train_loss": -27.04298210144043, "global_step": 545903, "epoch": 6577} {"train_loss": -26.89161491394043, "global_step": 545904, "epoch": 6577} {"train_loss": -27.277313232421875, "global_step": 545905, "epoch": 6577} {"train_loss": -27.354413986206055, "global_step": 545906, "epoch": 6577} {"train_loss": -27.328237533569336, "global_step": 545907, "epoch": 6577} {"train_loss": -27.316741943359375, "global_step": 545908, "epoch": 6577} {"train_loss": -27.526702880859375, "global_step": 545909, "epoch": 6577} {"train_loss": -27.178680419921875, "global_step": 545910, "epoch": 6577} {"train_loss": -27.026813507080078, "global_step": 545911, "epoch": 6577} {"train_loss": -27.411828994750977, "global_step": 545912, "epoch": 6577} {"train_loss": -27.103515625, "global_step": 545913, "epoch": 6577} {"train_loss": -27.34531021118164, "global_step": 545914, "epoch": 6577} {"train_loss": -27.0071964263916, "global_step": 545915, "epoch": 6577} {"train_loss": -27.343393325805664, "global_step": 545916, "epoch": 6577} {"train_loss": -28.197412490844727, "global_step": 545917, "epoch": 6577} {"train_loss": -27.24210548400879, "global_step": 545918, "epoch": 6577} {"train_loss": -27.36311149597168, "global_step": 545919, "epoch": 6577} {"train_loss": -27.44867515563965, "global_step": 545920, "epoch": 6577} {"train_loss": -27.563201904296875, "global_step": 545921, "epoch": 6577} {"train_loss": -27.65034294128418, "global_step": 545922, "epoch": 6577} {"train_loss": -27.271093368530273, "global_step": 545923, "epoch": 6577} {"train_loss": -27.27864646911621, "global_step": 545924, "epoch": 6577} {"train_loss": -28.004056930541992, "global_step": 545925, "epoch": 6577} {"train_loss": -27.772428512573242, "global_step": 545926, "epoch": 6577} {"train_loss": -28.017179489135742, "global_step": 545927, "epoch": 6577} {"train_loss": -27.814817428588867, "global_step": 545928, "epoch": 6577} {"train_loss": -27.590255737304688, "global_step": 545929, "epoch": 6577} {"train_loss": -27.487289428710938, "global_step": 545930, "epoch": 6577} {"train_loss": -27.777124404907227, "global_step": 545931, "epoch": 6577} {"train_loss": -27.618453979492188, "global_step": 545932, "epoch": 6577} {"train_loss": -27.904638290405273, "global_step": 545933, "epoch": 6577} {"train_loss": -27.868494033813477, "global_step": 545934, "epoch": 6577} {"train_loss": -27.372589111328125, "global_step": 545935, "epoch": 6577} {"train_loss": -27.531946182250977, "global_step": 545936, "epoch": 6577} {"train_loss": -27.9141845703125, "global_step": 545937, "epoch": 6577} {"train_loss": -27.745208740234375, "global_step": 545938, "epoch": 6577} {"train_loss": -27.728601455688477, "global_step": 545939, "epoch": 6577} {"train_loss": -27.971240997314453, "global_step": 545940, "epoch": 6577} {"train_loss": -27.497594833374023, "global_step": 545941, "epoch": 6577} {"train_loss": -27.902210235595703, "global_step": 545942, "epoch": 6577} {"train_loss": -27.490461349487305, "global_step": 545943, "epoch": 6577} {"train_loss": -27.727985382080078, "global_step": 545944, "epoch": 6577} {"train_loss": -27.793466567993164, "global_step": 545945, "epoch": 6577} {"train_loss": -28.045026779174805, "global_step": 545946, "epoch": 6577} {"train_loss": -27.997228622436523, "global_step": 545947, "epoch": 6577} {"train_loss": -28.172576904296875, "global_step": 545948, "epoch": 6577} {"train_loss": -28.091611862182617, "global_step": 545949, "epoch": 6577} {"train_loss": -28.18585205078125, "global_step": 545950, "epoch": 6577} {"train_loss": -28.132709503173828, "global_step": 545951, "epoch": 6577} {"train_loss": -27.890933990478516, "global_step": 545952, "epoch": 6577} {"train_loss": -28.18821144104004, "global_step": 545953, "epoch": 6577} {"train_loss": -27.85877799987793, "global_step": 545954, "epoch": 6577} {"train_loss": -27.96722984313965, "global_step": 545955, "epoch": 6577} {"train_loss": -27.977798461914062, "global_step": 545956, "epoch": 6577} {"train_loss": -27.99989128112793, "global_step": 545957, "epoch": 6577} {"train_loss": -27.942663192749023, "global_step": 545958, "epoch": 6577} {"train_loss": -28.02207374572754, "global_step": 545959, "epoch": 6577} {"train_loss": -27.926298141479492, "global_step": 545960, "epoch": 6577} {"train_loss": -27.737817764282227, "global_step": 545961, "epoch": 6577} {"train_loss": -27.340978622436523, "global_step": 545962, "epoch": 6577} {"train_loss": -27.68341064453125, "global_step": 545963, "epoch": 6577} {"train_loss": -27.6588191986084, "global_step": 545964, "epoch": 6577} {"train_loss": -28.116565704345703, "global_step": 545965, "epoch": 6577} {"train_loss": -27.881555557250977, "global_step": 545966, "epoch": 6577} {"train_loss": -27.822568893432617, "global_step": 545967, "epoch": 6577} {"train_loss": -27.566638946533203, "global_step": 545968, "epoch": 6577} {"train_loss": -28.002655029296875, "global_step": 545969, "epoch": 6577} {"train_loss": -27.827960968017578, "global_step": 545970, "epoch": 6577} {"train_loss": -27.7073917388916, "global_step": 545971, "epoch": 6577} {"train_loss": -27.340717315673828, "global_step": 545972, "epoch": 6577} {"train_loss": -27.449501956801818, "global_step": 545973, "epoch": 6577, "val_loss": 6599887.0} {"train_loss": -27.637332916259766, "global_step": 545974, "epoch": 6578} {"train_loss": -26.96441650390625, "global_step": 545975, "epoch": 6578} {"train_loss": -26.42044448852539, "global_step": 545976, "epoch": 6578} {"train_loss": -26.624088287353516, "global_step": 545977, "epoch": 6578} {"train_loss": -26.661956787109375, "global_step": 545978, "epoch": 6578} {"train_loss": -27.0372314453125, "global_step": 545979, "epoch": 6578} {"train_loss": -26.764734268188477, "global_step": 545980, "epoch": 6578} {"train_loss": -27.14971923828125, "global_step": 545981, "epoch": 6578} {"train_loss": -26.503894805908203, "global_step": 545982, "epoch": 6578} {"train_loss": -27.413625717163086, "global_step": 545983, "epoch": 6578} {"train_loss": -26.7869873046875, "global_step": 545984, "epoch": 6578} {"train_loss": -26.728458404541016, "global_step": 545985, "epoch": 6578} {"train_loss": -26.642194747924805, "global_step": 545986, "epoch": 6578} {"train_loss": -27.0438232421875, "global_step": 545987, "epoch": 6578} {"train_loss": -26.631677627563477, "global_step": 545988, "epoch": 6578} {"train_loss": -27.03053855895996, "global_step": 545989, "epoch": 6578} {"train_loss": -27.382904052734375, "global_step": 545990, "epoch": 6578} {"train_loss": -27.22541618347168, "global_step": 545991, "epoch": 6578} {"train_loss": -26.91473388671875, "global_step": 545992, "epoch": 6578} {"train_loss": -27.021833419799805, "global_step": 545993, "epoch": 6578} {"train_loss": -27.333852767944336, "global_step": 545994, "epoch": 6578} {"train_loss": -26.05171012878418, "global_step": 545995, "epoch": 6578} {"train_loss": -27.008596420288086, "global_step": 545996, "epoch": 6578} {"train_loss": -27.05756950378418, "global_step": 545997, "epoch": 6578} {"train_loss": -27.0328426361084, "global_step": 545998, "epoch": 6578} {"train_loss": -27.1085147857666, "global_step": 545999, "epoch": 6578} {"train_loss": -27.392913818359375, "global_step": 546000, "epoch": 6578} {"train_loss": -27.016021728515625, "global_step": 546001, "epoch": 6578} {"train_loss": -27.324298858642578, "global_step": 546002, "epoch": 6578} {"train_loss": -27.280319213867188, "global_step": 546003, "epoch": 6578} {"train_loss": -27.486021041870117, "global_step": 546004, "epoch": 6578} {"train_loss": -27.364639282226562, "global_step": 546005, "epoch": 6578} {"train_loss": -27.665658950805664, "global_step": 546006, "epoch": 6578} {"train_loss": -27.21927261352539, "global_step": 546007, "epoch": 6578} {"train_loss": -27.575429916381836, "global_step": 546008, "epoch": 6578} {"train_loss": -27.39002799987793, "global_step": 546009, "epoch": 6578} {"train_loss": -27.609830856323242, "global_step": 546010, "epoch": 6578} {"train_loss": -27.8671932220459, "global_step": 546011, "epoch": 6578} {"train_loss": -27.46923828125, "global_step": 546012, "epoch": 6578} {"train_loss": -27.55696678161621, "global_step": 546013, "epoch": 6578} {"train_loss": -27.7210693359375, "global_step": 546014, "epoch": 6578} {"train_loss": -27.64728355407715, "global_step": 546015, "epoch": 6578} {"train_loss": -27.500335693359375, "global_step": 546016, "epoch": 6578} {"train_loss": -27.6772403717041, "global_step": 546017, "epoch": 6578} {"train_loss": -27.829071044921875, "global_step": 546018, "epoch": 6578} {"train_loss": -27.7222900390625, "global_step": 546019, "epoch": 6578} {"train_loss": -27.587722778320312, "global_step": 546020, "epoch": 6578} {"train_loss": -27.891462326049805, "global_step": 546021, "epoch": 6578} {"train_loss": -27.902379989624023, "global_step": 546022, "epoch": 6578} {"train_loss": -27.889318466186523, "global_step": 546023, "epoch": 6578} {"train_loss": -28.146991729736328, "global_step": 546024, "epoch": 6578} {"train_loss": -27.549423217773438, "global_step": 546025, "epoch": 6578} {"train_loss": -27.610992431640625, "global_step": 546026, "epoch": 6578} {"train_loss": -28.092254638671875, "global_step": 546027, "epoch": 6578} {"train_loss": -27.70229148864746, "global_step": 546028, "epoch": 6578} {"train_loss": -27.76125144958496, "global_step": 546029, "epoch": 6578} {"train_loss": -27.807968139648438, "global_step": 546030, "epoch": 6578} {"train_loss": -28.140899658203125, "global_step": 546031, "epoch": 6578} {"train_loss": -27.657184600830078, "global_step": 546032, "epoch": 6578} {"train_loss": -27.963727951049805, "global_step": 546033, "epoch": 6578} {"train_loss": -27.799819946289062, "global_step": 546034, "epoch": 6578} {"train_loss": -28.093305587768555, "global_step": 546035, "epoch": 6578} {"train_loss": -27.870939254760742, "global_step": 546036, "epoch": 6578} {"train_loss": -27.831384658813477, "global_step": 546037, "epoch": 6578} {"train_loss": -27.516199111938477, "global_step": 546038, "epoch": 6578} {"train_loss": -27.541921615600586, "global_step": 546039, "epoch": 6578} {"train_loss": -27.589740753173828, "global_step": 546040, "epoch": 6578} {"train_loss": -27.945953369140625, "global_step": 546041, "epoch": 6578} {"train_loss": -27.782312393188477, "global_step": 546042, "epoch": 6578} {"train_loss": -27.602588653564453, "global_step": 546043, "epoch": 6578} {"train_loss": -27.808917999267578, "global_step": 546044, "epoch": 6578} {"train_loss": -27.80842399597168, "global_step": 546045, "epoch": 6578} {"train_loss": -27.677143096923828, "global_step": 546046, "epoch": 6578} {"train_loss": -27.95307731628418, "global_step": 546047, "epoch": 6578} {"train_loss": -27.78753089904785, "global_step": 546048, "epoch": 6578} {"train_loss": -26.4044189453125, "global_step": 546049, "epoch": 6578} {"train_loss": -25.65155601501465, "global_step": 546050, "epoch": 6578} {"train_loss": -26.431415557861328, "global_step": 546051, "epoch": 6578} {"train_loss": -24.555091857910156, "global_step": 546052, "epoch": 6578} {"train_loss": -25.692167282104492, "global_step": 546053, "epoch": 6578} {"train_loss": -27.412485122680664, "global_step": 546054, "epoch": 6578} {"train_loss": -25.42431640625, "global_step": 546055, "epoch": 6578} {"train_loss": -27.285314789737562, "global_step": 546056, "epoch": 6578, "val_loss": 6694839.0} {"train_loss": -25.9062557220459, "global_step": 546057, "epoch": 6579} {"train_loss": -26.2368221282959, "global_step": 546058, "epoch": 6579} {"train_loss": -26.11269187927246, "global_step": 546059, "epoch": 6579} {"train_loss": -26.377655029296875, "global_step": 546060, "epoch": 6579} {"train_loss": -26.83731460571289, "global_step": 546061, "epoch": 6579} {"train_loss": -26.779834747314453, "global_step": 546062, "epoch": 6579} {"train_loss": -26.744531631469727, "global_step": 546063, "epoch": 6579} {"train_loss": -26.601789474487305, "global_step": 546064, "epoch": 6579} {"train_loss": -26.925695419311523, "global_step": 546065, "epoch": 6579} {"train_loss": -26.932241439819336, "global_step": 546066, "epoch": 6579} {"train_loss": -26.66025161743164, "global_step": 546067, "epoch": 6579} {"train_loss": -26.776254653930664, "global_step": 546068, "epoch": 6579} {"train_loss": -27.0498046875, "global_step": 546069, "epoch": 6579} {"train_loss": -26.96673011779785, "global_step": 546070, "epoch": 6579} {"train_loss": -27.151498794555664, "global_step": 546071, "epoch": 6579} {"train_loss": -26.88909912109375, "global_step": 546072, "epoch": 6579} {"train_loss": -26.957462310791016, "global_step": 546073, "epoch": 6579} {"train_loss": -27.384328842163086, "global_step": 546074, "epoch": 6579} {"train_loss": -26.981409072875977, "global_step": 546075, "epoch": 6579} {"train_loss": -27.21156883239746, "global_step": 546076, "epoch": 6579} {"train_loss": -27.3595027923584, "global_step": 546077, "epoch": 6579} {"train_loss": -27.331968307495117, "global_step": 546078, "epoch": 6579} {"train_loss": -27.093719482421875, "global_step": 546079, "epoch": 6579} {"train_loss": -27.191736221313477, "global_step": 546080, "epoch": 6579} {"train_loss": -27.24837303161621, "global_step": 546081, "epoch": 6579} {"train_loss": -27.71731948852539, "global_step": 546082, "epoch": 6579} {"train_loss": -27.563129425048828, "global_step": 546083, "epoch": 6579} {"train_loss": -27.240528106689453, "global_step": 546084, "epoch": 6579} {"train_loss": -27.44624137878418, "global_step": 546085, "epoch": 6579} {"train_loss": -27.552457809448242, "global_step": 546086, "epoch": 6579} {"train_loss": -27.31495475769043, "global_step": 546087, "epoch": 6579} {"train_loss": -27.693517684936523, "global_step": 546088, "epoch": 6579} {"train_loss": -27.450759887695312, "global_step": 546089, "epoch": 6579} {"train_loss": -27.521764755249023, "global_step": 546090, "epoch": 6579} {"train_loss": -27.80319595336914, "global_step": 546091, "epoch": 6579} {"train_loss": -27.55132484436035, "global_step": 546092, "epoch": 6579} {"train_loss": -27.819320678710938, "global_step": 546093, "epoch": 6579} {"train_loss": -27.701038360595703, "global_step": 546094, "epoch": 6579} {"train_loss": -27.79253578186035, "global_step": 546095, "epoch": 6579} {"train_loss": -27.81532096862793, "global_step": 546096, "epoch": 6579} {"train_loss": -27.994647979736328, "global_step": 546097, "epoch": 6579} {"train_loss": -28.059223175048828, "global_step": 546098, "epoch": 6579} {"train_loss": -27.69768714904785, "global_step": 546099, "epoch": 6579} {"train_loss": -28.07478141784668, "global_step": 546100, "epoch": 6579} {"train_loss": -27.5738468170166, "global_step": 546101, "epoch": 6579} {"train_loss": -27.47757339477539, "global_step": 546102, "epoch": 6579} {"train_loss": -27.660287857055664, "global_step": 546103, "epoch": 6579} {"train_loss": -27.80810546875, "global_step": 546104, "epoch": 6579} {"train_loss": -27.48444175720215, "global_step": 546105, "epoch": 6579} {"train_loss": -28.016122817993164, "global_step": 546106, "epoch": 6579} {"train_loss": -27.875385284423828, "global_step": 546107, "epoch": 6579} {"train_loss": -27.847135543823242, "global_step": 546108, "epoch": 6579} {"train_loss": -27.896814346313477, "global_step": 546109, "epoch": 6579} {"train_loss": -27.984628677368164, "global_step": 546110, "epoch": 6579} {"train_loss": -27.843229293823242, "global_step": 546111, "epoch": 6579} {"train_loss": -27.94935417175293, "global_step": 546112, "epoch": 6579} {"train_loss": -28.043212890625, "global_step": 546113, "epoch": 6579} {"train_loss": -28.250730514526367, "global_step": 546114, "epoch": 6579} {"train_loss": -28.098905563354492, "global_step": 546115, "epoch": 6579} {"train_loss": -28.265552520751953, "global_step": 546116, "epoch": 6579} {"train_loss": -27.179479598999023, "global_step": 546117, "epoch": 6579} {"train_loss": -27.12677574157715, "global_step": 546118, "epoch": 6579} {"train_loss": -27.375112533569336, "global_step": 546119, "epoch": 6579} {"train_loss": -28.041645050048828, "global_step": 546120, "epoch": 6579} {"train_loss": -27.679624557495117, "global_step": 546121, "epoch": 6579} {"train_loss": -27.3941707611084, "global_step": 546122, "epoch": 6579} {"train_loss": -27.7470760345459, "global_step": 546123, "epoch": 6579} {"train_loss": -27.467437744140625, "global_step": 546124, "epoch": 6579} {"train_loss": -27.60601806640625, "global_step": 546125, "epoch": 6579} {"train_loss": -27.67230796813965, "global_step": 546126, "epoch": 6579} {"train_loss": -27.34272575378418, "global_step": 546127, "epoch": 6579} {"train_loss": -27.523344039916992, "global_step": 546128, "epoch": 6579} {"train_loss": -26.96381950378418, "global_step": 546129, "epoch": 6579} {"train_loss": -27.12019920349121, "global_step": 546130, "epoch": 6579} {"train_loss": -27.504682540893555, "global_step": 546131, "epoch": 6579} {"train_loss": -27.322790145874023, "global_step": 546132, "epoch": 6579} {"train_loss": -27.17311668395996, "global_step": 546133, "epoch": 6579} {"train_loss": -27.6140079498291, "global_step": 546134, "epoch": 6579} {"train_loss": -27.63956069946289, "global_step": 546135, "epoch": 6579} {"train_loss": -27.369190216064453, "global_step": 546136, "epoch": 6579} {"train_loss": -28.18610191345215, "global_step": 546137, "epoch": 6579} {"train_loss": -27.738256454467773, "global_step": 546138, "epoch": 6579} {"train_loss": -27.411634950752717, "global_step": 546139, "epoch": 6579, "val_loss": 6576871.5} {"train_loss": -27.311059951782227, "global_step": 546140, "epoch": 6580} {"train_loss": -27.129241943359375, "global_step": 546141, "epoch": 6580} {"train_loss": -26.914535522460938, "global_step": 546142, "epoch": 6580} {"train_loss": -27.36371421813965, "global_step": 546143, "epoch": 6580} {"train_loss": -27.003036499023438, "global_step": 546144, "epoch": 6580} {"train_loss": -26.877059936523438, "global_step": 546145, "epoch": 6580} {"train_loss": -26.951221466064453, "global_step": 546146, "epoch": 6580} {"train_loss": -27.242050170898438, "global_step": 546147, "epoch": 6580} {"train_loss": -27.150732040405273, "global_step": 546148, "epoch": 6580} {"train_loss": -26.877002716064453, "global_step": 546149, "epoch": 6580} {"train_loss": -27.04888343811035, "global_step": 546150, "epoch": 6580} {"train_loss": -27.247211456298828, "global_step": 546151, "epoch": 6580} {"train_loss": -27.333423614501953, "global_step": 546152, "epoch": 6580} {"train_loss": -27.461257934570312, "global_step": 546153, "epoch": 6580} {"train_loss": -27.069116592407227, "global_step": 546154, "epoch": 6580} {"train_loss": -27.568634033203125, "global_step": 546155, "epoch": 6580} {"train_loss": -27.41973876953125, "global_step": 546156, "epoch": 6580} {"train_loss": -27.34735679626465, "global_step": 546157, "epoch": 6580} {"train_loss": -27.357349395751953, "global_step": 546158, "epoch": 6580} {"train_loss": -26.957611083984375, "global_step": 546159, "epoch": 6580} {"train_loss": -27.4166316986084, "global_step": 546160, "epoch": 6580} {"train_loss": -27.752365112304688, "global_step": 546161, "epoch": 6580} {"train_loss": -27.051715850830078, "global_step": 546162, "epoch": 6580} {"train_loss": -27.850677490234375, "global_step": 546163, "epoch": 6580} {"train_loss": -27.59638786315918, "global_step": 546164, "epoch": 6580} {"train_loss": -27.335962295532227, "global_step": 546165, "epoch": 6580} {"train_loss": -27.48822593688965, "global_step": 546166, "epoch": 6580} {"train_loss": -27.647634506225586, "global_step": 546167, "epoch": 6580} {"train_loss": -27.620792388916016, "global_step": 546168, "epoch": 6580} {"train_loss": -27.50263786315918, "global_step": 546169, "epoch": 6580} {"train_loss": -27.72332191467285, "global_step": 546170, "epoch": 6580} {"train_loss": -27.73030662536621, "global_step": 546171, "epoch": 6580} {"train_loss": -27.934799194335938, "global_step": 546172, "epoch": 6580} {"train_loss": -27.650724411010742, "global_step": 546173, "epoch": 6580} {"train_loss": -28.049283981323242, "global_step": 546174, "epoch": 6580} {"train_loss": -27.909687042236328, "global_step": 546175, "epoch": 6580} {"train_loss": -27.6416072845459, "global_step": 546176, "epoch": 6580} {"train_loss": -27.650836944580078, "global_step": 546177, "epoch": 6580} {"train_loss": -27.434417724609375, "global_step": 546178, "epoch": 6580} {"train_loss": -27.662275314331055, "global_step": 546179, "epoch": 6580} {"train_loss": -27.74346923828125, "global_step": 546180, "epoch": 6580} {"train_loss": -27.62666130065918, "global_step": 546181, "epoch": 6580} {"train_loss": -27.8864803314209, "global_step": 546182, "epoch": 6580} {"train_loss": -27.78092384338379, "global_step": 546183, "epoch": 6580} {"train_loss": -27.555994033813477, "global_step": 546184, "epoch": 6580} {"train_loss": -27.64577293395996, "global_step": 546185, "epoch": 6580} {"train_loss": -27.753591537475586, "global_step": 546186, "epoch": 6580} {"train_loss": -27.877500534057617, "global_step": 546187, "epoch": 6580} {"train_loss": -28.04486083984375, "global_step": 546188, "epoch": 6580} {"train_loss": -27.262319564819336, "global_step": 546189, "epoch": 6580} {"train_loss": -27.600793838500977, "global_step": 546190, "epoch": 6580} {"train_loss": -27.86740493774414, "global_step": 546191, "epoch": 6580} {"train_loss": -28.01651382446289, "global_step": 546192, "epoch": 6580} {"train_loss": -27.454395294189453, "global_step": 546193, "epoch": 6580} {"train_loss": -27.527490615844727, "global_step": 546194, "epoch": 6580} {"train_loss": -27.9483585357666, "global_step": 546195, "epoch": 6580} {"train_loss": -27.241785049438477, "global_step": 546196, "epoch": 6580} {"train_loss": -27.368677139282227, "global_step": 546197, "epoch": 6580} {"train_loss": -27.794065475463867, "global_step": 546198, "epoch": 6580} {"train_loss": -27.58820152282715, "global_step": 546199, "epoch": 6580} {"train_loss": -27.884145736694336, "global_step": 546200, "epoch": 6580} {"train_loss": -27.283966064453125, "global_step": 546201, "epoch": 6580} {"train_loss": -27.670591354370117, "global_step": 546202, "epoch": 6580} {"train_loss": -27.809436798095703, "global_step": 546203, "epoch": 6580} {"train_loss": -27.54388427734375, "global_step": 546204, "epoch": 6580} {"train_loss": -27.789886474609375, "global_step": 546205, "epoch": 6580} {"train_loss": -27.398046493530273, "global_step": 546206, "epoch": 6580} {"train_loss": -27.773839950561523, "global_step": 546207, "epoch": 6580} {"train_loss": -27.883203506469727, "global_step": 546208, "epoch": 6580} {"train_loss": -27.62604331970215, "global_step": 546209, "epoch": 6580} {"train_loss": -28.005252838134766, "global_step": 546210, "epoch": 6580} {"train_loss": -27.745044708251953, "global_step": 546211, "epoch": 6580} {"train_loss": -27.737958908081055, "global_step": 546212, "epoch": 6580} {"train_loss": -27.71661949157715, "global_step": 546213, "epoch": 6580} {"train_loss": -28.20880699157715, "global_step": 546214, "epoch": 6580} {"train_loss": -27.581098556518555, "global_step": 546215, "epoch": 6580} {"train_loss": -27.97720718383789, "global_step": 546216, "epoch": 6580} {"train_loss": -27.404834747314453, "global_step": 546217, "epoch": 6580} {"train_loss": -27.427900314331055, "global_step": 546218, "epoch": 6580} {"train_loss": -27.12139320373535, "global_step": 546219, "epoch": 6580} {"train_loss": -27.42108154296875, "global_step": 546220, "epoch": 6580} {"train_loss": -27.960681915283203, "global_step": 546221, "epoch": 6580} {"train_loss": -27.561654240252025, "global_step": 546222, "epoch": 6580, "val_loss": 6600737.0} {"train_loss": -27.836883544921875, "global_step": 546223, "epoch": 6581} {"train_loss": -28.05328941345215, "global_step": 546224, "epoch": 6581} {"train_loss": -27.679407119750977, "global_step": 546225, "epoch": 6581} {"train_loss": -27.72931480407715, "global_step": 546226, "epoch": 6581} {"train_loss": -27.313940048217773, "global_step": 546227, "epoch": 6581} {"train_loss": -27.564916610717773, "global_step": 546228, "epoch": 6581} {"train_loss": -27.381372451782227, "global_step": 546229, "epoch": 6581} {"train_loss": -27.44087791442871, "global_step": 546230, "epoch": 6581} {"train_loss": -27.68191909790039, "global_step": 546231, "epoch": 6581} {"train_loss": -27.397750854492188, "global_step": 546232, "epoch": 6581} {"train_loss": -27.46357536315918, "global_step": 546233, "epoch": 6581} {"train_loss": -27.282072067260742, "global_step": 546234, "epoch": 6581} {"train_loss": -27.60914421081543, "global_step": 546235, "epoch": 6581} {"train_loss": -28.0555477142334, "global_step": 546236, "epoch": 6581} {"train_loss": -27.386682510375977, "global_step": 546237, "epoch": 6581} {"train_loss": -27.47071647644043, "global_step": 546238, "epoch": 6581} {"train_loss": -27.35618019104004, "global_step": 546239, "epoch": 6581} {"train_loss": -27.392322540283203, "global_step": 546240, "epoch": 6581} {"train_loss": -27.630695343017578, "global_step": 546241, "epoch": 6581} {"train_loss": -27.563886642456055, "global_step": 546242, "epoch": 6581} {"train_loss": -27.3267879486084, "global_step": 546243, "epoch": 6581} {"train_loss": -27.45635414123535, "global_step": 546244, "epoch": 6581} {"train_loss": -27.74494743347168, "global_step": 546245, "epoch": 6581} {"train_loss": -27.177213668823242, "global_step": 546246, "epoch": 6581} {"train_loss": -26.9939022064209, "global_step": 546247, "epoch": 6581} {"train_loss": -26.608539581298828, "global_step": 546248, "epoch": 6581} {"train_loss": -28.11539649963379, "global_step": 546249, "epoch": 6581} {"train_loss": -27.26584815979004, "global_step": 546250, "epoch": 6581} {"train_loss": -26.890005111694336, "global_step": 546251, "epoch": 6581} {"train_loss": -27.287296295166016, "global_step": 546252, "epoch": 6581} {"train_loss": -26.780736923217773, "global_step": 546253, "epoch": 6581} {"train_loss": -27.424161911010742, "global_step": 546254, "epoch": 6581} {"train_loss": -27.235889434814453, "global_step": 546255, "epoch": 6581} {"train_loss": -27.13311767578125, "global_step": 546256, "epoch": 6581} {"train_loss": -27.15558433532715, "global_step": 546257, "epoch": 6581} {"train_loss": -27.24140739440918, "global_step": 546258, "epoch": 6581} {"train_loss": -27.32376480102539, "global_step": 546259, "epoch": 6581} {"train_loss": -27.58603858947754, "global_step": 546260, "epoch": 6581} {"train_loss": -27.442657470703125, "global_step": 546261, "epoch": 6581} {"train_loss": -27.5039119720459, "global_step": 546262, "epoch": 6581} {"train_loss": -27.35281753540039, "global_step": 546263, "epoch": 6581} {"train_loss": -27.249317169189453, "global_step": 546264, "epoch": 6581} {"train_loss": -27.202539443969727, "global_step": 546265, "epoch": 6581} {"train_loss": -27.472753524780273, "global_step": 546266, "epoch": 6581} {"train_loss": -27.299482345581055, "global_step": 546267, "epoch": 6581} {"train_loss": -27.64697265625, "global_step": 546268, "epoch": 6581} {"train_loss": -27.62293815612793, "global_step": 546269, "epoch": 6581} {"train_loss": -27.524770736694336, "global_step": 546270, "epoch": 6581} {"train_loss": -27.83694839477539, "global_step": 546271, "epoch": 6581} {"train_loss": -27.56940269470215, "global_step": 546272, "epoch": 6581} {"train_loss": -27.8164119720459, "global_step": 546273, "epoch": 6581} {"train_loss": -27.601221084594727, "global_step": 546274, "epoch": 6581} {"train_loss": -27.2897891998291, "global_step": 546275, "epoch": 6581} {"train_loss": -27.81902503967285, "global_step": 546276, "epoch": 6581} {"train_loss": -27.84305763244629, "global_step": 546277, "epoch": 6581} {"train_loss": -27.59344482421875, "global_step": 546278, "epoch": 6581} {"train_loss": -27.575651168823242, "global_step": 546279, "epoch": 6581} {"train_loss": -27.416589736938477, "global_step": 546280, "epoch": 6581} {"train_loss": -27.994964599609375, "global_step": 546281, "epoch": 6581} {"train_loss": -27.665470123291016, "global_step": 546282, "epoch": 6581} {"train_loss": -27.63454246520996, "global_step": 546283, "epoch": 6581} {"train_loss": -27.9542236328125, "global_step": 546284, "epoch": 6581} {"train_loss": -27.782318115234375, "global_step": 546285, "epoch": 6581} {"train_loss": -28.03798484802246, "global_step": 546286, "epoch": 6581} {"train_loss": -27.920429229736328, "global_step": 546287, "epoch": 6581} {"train_loss": -27.57779312133789, "global_step": 546288, "epoch": 6581} {"train_loss": -27.77520751953125, "global_step": 546289, "epoch": 6581} {"train_loss": -28.06829261779785, "global_step": 546290, "epoch": 6581} {"train_loss": -27.8609676361084, "global_step": 546291, "epoch": 6581} {"train_loss": -28.155118942260742, "global_step": 546292, "epoch": 6581} {"train_loss": -27.656415939331055, "global_step": 546293, "epoch": 6581} {"train_loss": -27.7176570892334, "global_step": 546294, "epoch": 6581} {"train_loss": -28.12127113342285, "global_step": 546295, "epoch": 6581} {"train_loss": -27.910673141479492, "global_step": 546296, "epoch": 6581} {"train_loss": -27.927860260009766, "global_step": 546297, "epoch": 6581} {"train_loss": -27.832487106323242, "global_step": 546298, "epoch": 6581} {"train_loss": -27.7720890045166, "global_step": 546299, "epoch": 6581} {"train_loss": -27.477380752563477, "global_step": 546300, "epoch": 6581} {"train_loss": -27.185760498046875, "global_step": 546301, "epoch": 6581} {"train_loss": -26.885589599609375, "global_step": 546302, "epoch": 6581} {"train_loss": -26.43010902404785, "global_step": 546303, "epoch": 6581} {"train_loss": -26.6323184967041, "global_step": 546304, "epoch": 6581} {"train_loss": -27.521058714533428, "global_step": 546305, "epoch": 6581, "val_loss": 6664220.0} {"train_loss": -26.944482803344727, "global_step": 546306, "epoch": 6582} {"train_loss": -26.66104507446289, "global_step": 546307, "epoch": 6582} {"train_loss": -26.275861740112305, "global_step": 546308, "epoch": 6582} {"train_loss": -26.402942657470703, "global_step": 546309, "epoch": 6582} {"train_loss": -26.74344825744629, "global_step": 546310, "epoch": 6582} {"train_loss": -26.7663631439209, "global_step": 546311, "epoch": 6582} {"train_loss": -26.782306671142578, "global_step": 546312, "epoch": 6582} {"train_loss": -27.41265869140625, "global_step": 546313, "epoch": 6582} {"train_loss": -26.999746322631836, "global_step": 546314, "epoch": 6582} {"train_loss": -26.8974666595459, "global_step": 546315, "epoch": 6582} {"train_loss": -27.16204261779785, "global_step": 546316, "epoch": 6582} {"train_loss": -27.1171932220459, "global_step": 546317, "epoch": 6582} {"train_loss": -27.157339096069336, "global_step": 546318, "epoch": 6582} {"train_loss": -27.386449813842773, "global_step": 546319, "epoch": 6582} {"train_loss": -27.10956382751465, "global_step": 546320, "epoch": 6582} {"train_loss": -27.378650665283203, "global_step": 546321, "epoch": 6582} {"train_loss": -27.32901382446289, "global_step": 546322, "epoch": 6582} {"train_loss": -27.294769287109375, "global_step": 546323, "epoch": 6582} {"train_loss": -27.130151748657227, "global_step": 546324, "epoch": 6582} {"train_loss": -27.756067276000977, "global_step": 546325, "epoch": 6582} {"train_loss": -27.724088668823242, "global_step": 546326, "epoch": 6582} {"train_loss": -27.31442642211914, "global_step": 546327, "epoch": 6582} {"train_loss": -27.69269371032715, "global_step": 546328, "epoch": 6582} {"train_loss": -27.51531410217285, "global_step": 546329, "epoch": 6582} {"train_loss": -27.433685302734375, "global_step": 546330, "epoch": 6582} {"train_loss": -27.333967208862305, "global_step": 546331, "epoch": 6582} {"train_loss": -27.522993087768555, "global_step": 546332, "epoch": 6582} {"train_loss": -27.71225357055664, "global_step": 546333, "epoch": 6582} {"train_loss": -27.303369522094727, "global_step": 546334, "epoch": 6582} {"train_loss": -27.758451461791992, "global_step": 546335, "epoch": 6582} {"train_loss": -27.563283920288086, "global_step": 546336, "epoch": 6582} {"train_loss": -27.677160263061523, "global_step": 546337, "epoch": 6582} {"train_loss": -27.632055282592773, "global_step": 546338, "epoch": 6582} {"train_loss": -27.65533447265625, "global_step": 546339, "epoch": 6582} {"train_loss": -27.80755615234375, "global_step": 546340, "epoch": 6582} {"train_loss": -27.803421020507812, "global_step": 546341, "epoch": 6582} {"train_loss": -27.319761276245117, "global_step": 546342, "epoch": 6582} {"train_loss": -27.5145320892334, "global_step": 546343, "epoch": 6582} {"train_loss": -27.793004989624023, "global_step": 546344, "epoch": 6582} {"train_loss": -27.856882095336914, "global_step": 546345, "epoch": 6582} {"train_loss": -27.672809600830078, "global_step": 546346, "epoch": 6582} {"train_loss": -27.580419540405273, "global_step": 546347, "epoch": 6582} {"train_loss": -27.79192543029785, "global_step": 546348, "epoch": 6582} {"train_loss": -27.597640991210938, "global_step": 546349, "epoch": 6582} {"train_loss": -27.863683700561523, "global_step": 546350, "epoch": 6582} {"train_loss": -28.095829010009766, "global_step": 546351, "epoch": 6582} {"train_loss": -27.876541137695312, "global_step": 546352, "epoch": 6582} {"train_loss": -27.64253807067871, "global_step": 546353, "epoch": 6582} {"train_loss": -27.78365135192871, "global_step": 546354, "epoch": 6582} {"train_loss": -27.681554794311523, "global_step": 546355, "epoch": 6582} {"train_loss": -27.945159912109375, "global_step": 546356, "epoch": 6582} {"train_loss": -28.072113037109375, "global_step": 546357, "epoch": 6582} {"train_loss": -27.857345581054688, "global_step": 546358, "epoch": 6582} {"train_loss": -27.88482093811035, "global_step": 546359, "epoch": 6582} {"train_loss": -27.883642196655273, "global_step": 546360, "epoch": 6582} {"train_loss": -27.410877227783203, "global_step": 546361, "epoch": 6582} {"train_loss": -27.822834014892578, "global_step": 546362, "epoch": 6582} {"train_loss": -28.0848445892334, "global_step": 546363, "epoch": 6582} {"train_loss": -27.87150001525879, "global_step": 546364, "epoch": 6582} {"train_loss": -27.799774169921875, "global_step": 546365, "epoch": 6582} {"train_loss": -28.025686264038086, "global_step": 546366, "epoch": 6582} {"train_loss": -27.67213249206543, "global_step": 546367, "epoch": 6582} {"train_loss": -27.53511619567871, "global_step": 546368, "epoch": 6582} {"train_loss": -27.996503829956055, "global_step": 546369, "epoch": 6582} {"train_loss": -27.896818161010742, "global_step": 546370, "epoch": 6582} {"train_loss": -27.9294490814209, "global_step": 546371, "epoch": 6582} {"train_loss": -27.62167739868164, "global_step": 546372, "epoch": 6582} {"train_loss": -27.74847412109375, "global_step": 546373, "epoch": 6582} {"train_loss": -27.43367576599121, "global_step": 546374, "epoch": 6582} {"train_loss": -27.404211044311523, "global_step": 546375, "epoch": 6582} {"train_loss": -27.65045166015625, "global_step": 546376, "epoch": 6582} {"train_loss": -27.8149471282959, "global_step": 546377, "epoch": 6582} {"train_loss": -28.192602157592773, "global_step": 546378, "epoch": 6582} {"train_loss": -27.885839462280273, "global_step": 546379, "epoch": 6582} {"train_loss": -27.434045791625977, "global_step": 546380, "epoch": 6582} {"train_loss": -26.983617782592773, "global_step": 546381, "epoch": 6582} {"train_loss": -26.258955001831055, "global_step": 546382, "epoch": 6582} {"train_loss": -25.055973052978516, "global_step": 546383, "epoch": 6582} {"train_loss": -23.19462013244629, "global_step": 546384, "epoch": 6582} {"train_loss": -25.646398544311523, "global_step": 546385, "epoch": 6582} {"train_loss": -26.994220733642578, "global_step": 546386, "epoch": 6582} {"train_loss": -26.026987075805664, "global_step": 546387, "epoch": 6582} {"train_loss": -27.380144877606128, "global_step": 546388, "epoch": 6582, "val_loss": 6614556.0} {"train_loss": -26.54188346862793, "global_step": 546389, "epoch": 6583} {"train_loss": -26.6510009765625, "global_step": 546390, "epoch": 6583} {"train_loss": -26.89395523071289, "global_step": 546391, "epoch": 6583} {"train_loss": -27.070032119750977, "global_step": 546392, "epoch": 6583} {"train_loss": -26.209497451782227, "global_step": 546393, "epoch": 6583} {"train_loss": -26.742284774780273, "global_step": 546394, "epoch": 6583} {"train_loss": -26.622800827026367, "global_step": 546395, "epoch": 6583} {"train_loss": -26.6129150390625, "global_step": 546396, "epoch": 6583} {"train_loss": -26.417743682861328, "global_step": 546397, "epoch": 6583} {"train_loss": -27.02774429321289, "global_step": 546398, "epoch": 6583} {"train_loss": -27.1801815032959, "global_step": 546399, "epoch": 6583} {"train_loss": -26.879669189453125, "global_step": 546400, "epoch": 6583} {"train_loss": -26.7499942779541, "global_step": 546401, "epoch": 6583} {"train_loss": -26.53143882751465, "global_step": 546402, "epoch": 6583} {"train_loss": -27.115081787109375, "global_step": 546403, "epoch": 6583} {"train_loss": -26.929792404174805, "global_step": 546404, "epoch": 6583} {"train_loss": -27.03253173828125, "global_step": 546405, "epoch": 6583} {"train_loss": -26.954381942749023, "global_step": 546406, "epoch": 6583} {"train_loss": -27.2581787109375, "global_step": 546407, "epoch": 6583} {"train_loss": -26.918256759643555, "global_step": 546408, "epoch": 6583} {"train_loss": -27.382394790649414, "global_step": 546409, "epoch": 6583} {"train_loss": -27.369199752807617, "global_step": 546410, "epoch": 6583} {"train_loss": -27.09221839904785, "global_step": 546411, "epoch": 6583} {"train_loss": -27.051008224487305, "global_step": 546412, "epoch": 6583} {"train_loss": -26.87346839904785, "global_step": 546413, "epoch": 6583} {"train_loss": -27.514245986938477, "global_step": 546414, "epoch": 6583} {"train_loss": -27.669513702392578, "global_step": 546415, "epoch": 6583} {"train_loss": -27.32806968688965, "global_step": 546416, "epoch": 6583} {"train_loss": -27.293561935424805, "global_step": 546417, "epoch": 6583} {"train_loss": -27.482879638671875, "global_step": 546418, "epoch": 6583} {"train_loss": -27.18170166015625, "global_step": 546419, "epoch": 6583} {"train_loss": -27.1851806640625, "global_step": 546420, "epoch": 6583} {"train_loss": -27.361204147338867, "global_step": 546421, "epoch": 6583} {"train_loss": -27.536422729492188, "global_step": 546422, "epoch": 6583} {"train_loss": -27.310529708862305, "global_step": 546423, "epoch": 6583} {"train_loss": -27.50522232055664, "global_step": 546424, "epoch": 6583} {"train_loss": -27.764984130859375, "global_step": 546425, "epoch": 6583} {"train_loss": -27.44659423828125, "global_step": 546426, "epoch": 6583} {"train_loss": -27.545190811157227, "global_step": 546427, "epoch": 6583} {"train_loss": -27.731765747070312, "global_step": 546428, "epoch": 6583} {"train_loss": -27.626483917236328, "global_step": 546429, "epoch": 6583} {"train_loss": -27.164077758789062, "global_step": 546430, "epoch": 6583} {"train_loss": -27.586755752563477, "global_step": 546431, "epoch": 6583} {"train_loss": -27.91578483581543, "global_step": 546432, "epoch": 6583} {"train_loss": -27.607702255249023, "global_step": 546433, "epoch": 6583} {"train_loss": -27.6674861907959, "global_step": 546434, "epoch": 6583} {"train_loss": -27.32941246032715, "global_step": 546435, "epoch": 6583} {"train_loss": -27.560943603515625, "global_step": 546436, "epoch": 6583} {"train_loss": -27.310022354125977, "global_step": 546437, "epoch": 6583} {"train_loss": -27.8752384185791, "global_step": 546438, "epoch": 6583} {"train_loss": -27.676895141601562, "global_step": 546439, "epoch": 6583} {"train_loss": -27.90301513671875, "global_step": 546440, "epoch": 6583} {"train_loss": -27.625219345092773, "global_step": 546441, "epoch": 6583} {"train_loss": -27.63650894165039, "global_step": 546442, "epoch": 6583} {"train_loss": -27.6417236328125, "global_step": 546443, "epoch": 6583} {"train_loss": -27.60906982421875, "global_step": 546444, "epoch": 6583} {"train_loss": -27.585058212280273, "global_step": 546445, "epoch": 6583} {"train_loss": -27.507715225219727, "global_step": 546446, "epoch": 6583} {"train_loss": -27.573505401611328, "global_step": 546447, "epoch": 6583} {"train_loss": -28.053115844726562, "global_step": 546448, "epoch": 6583} {"train_loss": -27.7110538482666, "global_step": 546449, "epoch": 6583} {"train_loss": -27.401941299438477, "global_step": 546450, "epoch": 6583} {"train_loss": -28.002042770385742, "global_step": 546451, "epoch": 6583} {"train_loss": -27.709243774414062, "global_step": 546452, "epoch": 6583} {"train_loss": -27.975101470947266, "global_step": 546453, "epoch": 6583} {"train_loss": -27.60137939453125, "global_step": 546454, "epoch": 6583} {"train_loss": -27.464574813842773, "global_step": 546455, "epoch": 6583} {"train_loss": -27.23594093322754, "global_step": 546456, "epoch": 6583} {"train_loss": -27.8502254486084, "global_step": 546457, "epoch": 6583} {"train_loss": -28.099334716796875, "global_step": 546458, "epoch": 6583} {"train_loss": -27.566699981689453, "global_step": 546459, "epoch": 6583} {"train_loss": -27.6527099609375, "global_step": 546460, "epoch": 6583} {"train_loss": -27.843292236328125, "global_step": 546461, "epoch": 6583} {"train_loss": -27.52729606628418, "global_step": 546462, "epoch": 6583} {"train_loss": -27.642547607421875, "global_step": 546463, "epoch": 6583} {"train_loss": -27.876605987548828, "global_step": 546464, "epoch": 6583} {"train_loss": -28.102069854736328, "global_step": 546465, "epoch": 6583} {"train_loss": -27.85749626159668, "global_step": 546466, "epoch": 6583} {"train_loss": -27.82368278503418, "global_step": 546467, "epoch": 6583} {"train_loss": -28.162137985229492, "global_step": 546468, "epoch": 6583} {"train_loss": -27.850940704345703, "global_step": 546469, "epoch": 6583} {"train_loss": -27.968408584594727, "global_step": 546470, "epoch": 6583} {"train_loss": -27.404909019010613, "global_step": 546471, "epoch": 6583, "val_loss": 6599996.0} {"train_loss": -27.059961318969727, "global_step": 546472, "epoch": 6584} {"train_loss": -27.1250057220459, "global_step": 546473, "epoch": 6584} {"train_loss": -27.25446891784668, "global_step": 546474, "epoch": 6584} {"train_loss": -27.20562171936035, "global_step": 546475, "epoch": 6584} {"train_loss": -27.140674591064453, "global_step": 546476, "epoch": 6584} {"train_loss": -27.374082565307617, "global_step": 546477, "epoch": 6584} {"train_loss": -27.37314224243164, "global_step": 546478, "epoch": 6584} {"train_loss": -27.261768341064453, "global_step": 546479, "epoch": 6584} {"train_loss": -27.21051597595215, "global_step": 546480, "epoch": 6584} {"train_loss": -27.38093376159668, "global_step": 546481, "epoch": 6584} {"train_loss": -27.39154624938965, "global_step": 546482, "epoch": 6584} {"train_loss": -27.812042236328125, "global_step": 546483, "epoch": 6584} {"train_loss": -27.367969512939453, "global_step": 546484, "epoch": 6584} {"train_loss": -27.4801025390625, "global_step": 546485, "epoch": 6584} {"train_loss": -27.84950065612793, "global_step": 546486, "epoch": 6584} {"train_loss": -27.4728946685791, "global_step": 546487, "epoch": 6584} {"train_loss": -27.614837646484375, "global_step": 546488, "epoch": 6584} {"train_loss": -27.673114776611328, "global_step": 546489, "epoch": 6584} {"train_loss": -27.67864418029785, "global_step": 546490, "epoch": 6584} {"train_loss": -27.43341636657715, "global_step": 546491, "epoch": 6584} {"train_loss": -28.029449462890625, "global_step": 546492, "epoch": 6584} {"train_loss": -27.31556510925293, "global_step": 546493, "epoch": 6584} {"train_loss": -27.45893669128418, "global_step": 546494, "epoch": 6584} {"train_loss": -27.649377822875977, "global_step": 546495, "epoch": 6584} {"train_loss": -27.854263305664062, "global_step": 546496, "epoch": 6584} {"train_loss": -27.6098690032959, "global_step": 546497, "epoch": 6584} {"train_loss": -27.615619659423828, "global_step": 546498, "epoch": 6584} {"train_loss": -27.855228424072266, "global_step": 546499, "epoch": 6584} {"train_loss": -27.26325798034668, "global_step": 546500, "epoch": 6584} {"train_loss": -27.5856990814209, "global_step": 546501, "epoch": 6584} {"train_loss": -27.858545303344727, "global_step": 546502, "epoch": 6584} {"train_loss": -27.50140953063965, "global_step": 546503, "epoch": 6584} {"train_loss": -28.058752059936523, "global_step": 546504, "epoch": 6584} {"train_loss": -27.936542510986328, "global_step": 546505, "epoch": 6584} {"train_loss": -27.837400436401367, "global_step": 546506, "epoch": 6584} {"train_loss": -28.029211044311523, "global_step": 546507, "epoch": 6584} {"train_loss": -27.48395347595215, "global_step": 546508, "epoch": 6584} {"train_loss": -27.62766456604004, "global_step": 546509, "epoch": 6584} {"train_loss": -27.301864624023438, "global_step": 546510, "epoch": 6584} {"train_loss": -27.886474609375, "global_step": 546511, "epoch": 6584} {"train_loss": -27.60088539123535, "global_step": 546512, "epoch": 6584} {"train_loss": -27.557661056518555, "global_step": 546513, "epoch": 6584} {"train_loss": -27.792102813720703, "global_step": 546514, "epoch": 6584} {"train_loss": -28.00225830078125, "global_step": 546515, "epoch": 6584} {"train_loss": -27.916183471679688, "global_step": 546516, "epoch": 6584} {"train_loss": -27.874134063720703, "global_step": 546517, "epoch": 6584} {"train_loss": -28.345157623291016, "global_step": 546518, "epoch": 6584} {"train_loss": -27.75288200378418, "global_step": 546519, "epoch": 6584} {"train_loss": -27.7579345703125, "global_step": 546520, "epoch": 6584} {"train_loss": -27.668323516845703, "global_step": 546521, "epoch": 6584} {"train_loss": -27.897863388061523, "global_step": 546522, "epoch": 6584} {"train_loss": -27.658090591430664, "global_step": 546523, "epoch": 6584} {"train_loss": -27.53138542175293, "global_step": 546524, "epoch": 6584} {"train_loss": -27.679906845092773, "global_step": 546525, "epoch": 6584} {"train_loss": -27.773487091064453, "global_step": 546526, "epoch": 6584} {"train_loss": -27.716388702392578, "global_step": 546527, "epoch": 6584} {"train_loss": -27.689956665039062, "global_step": 546528, "epoch": 6584} {"train_loss": -27.92637062072754, "global_step": 546529, "epoch": 6584} {"train_loss": -28.115324020385742, "global_step": 546530, "epoch": 6584} {"train_loss": -27.75482177734375, "global_step": 546531, "epoch": 6584} {"train_loss": -28.03860855102539, "global_step": 546532, "epoch": 6584} {"train_loss": -27.5921688079834, "global_step": 546533, "epoch": 6584} {"train_loss": -27.627851486206055, "global_step": 546534, "epoch": 6584} {"train_loss": -27.493606567382812, "global_step": 546535, "epoch": 6584} {"train_loss": -28.087753295898438, "global_step": 546536, "epoch": 6584} {"train_loss": -27.737415313720703, "global_step": 546537, "epoch": 6584} {"train_loss": -27.3111515045166, "global_step": 546538, "epoch": 6584} {"train_loss": -27.491567611694336, "global_step": 546539, "epoch": 6584} {"train_loss": -27.816755294799805, "global_step": 546540, "epoch": 6584} {"train_loss": -27.79862403869629, "global_step": 546541, "epoch": 6584} {"train_loss": -27.84320068359375, "global_step": 546542, "epoch": 6584} {"train_loss": -27.662351608276367, "global_step": 546543, "epoch": 6584} {"train_loss": -27.95802116394043, "global_step": 546544, "epoch": 6584} {"train_loss": -28.119962692260742, "global_step": 546545, "epoch": 6584} {"train_loss": -27.9793758392334, "global_step": 546546, "epoch": 6584} {"train_loss": -27.826597213745117, "global_step": 546547, "epoch": 6584} {"train_loss": -27.643930435180664, "global_step": 546548, "epoch": 6584} {"train_loss": -27.791461944580078, "global_step": 546549, "epoch": 6584} {"train_loss": -28.078474044799805, "global_step": 546550, "epoch": 6584} {"train_loss": -28.089975357055664, "global_step": 546551, "epoch": 6584} {"train_loss": -27.66560935974121, "global_step": 546552, "epoch": 6584} {"train_loss": -28.010007858276367, "global_step": 546553, "epoch": 6584} {"train_loss": -27.68460806881089, "global_step": 546554, "epoch": 6584, "val_loss": 6644302.0} {"train_loss": -26.617069244384766, "global_step": 546555, "epoch": 6585} {"train_loss": -27.083276748657227, "global_step": 546556, "epoch": 6585} {"train_loss": -26.26442527770996, "global_step": 546557, "epoch": 6585} {"train_loss": -26.361135482788086, "global_step": 546558, "epoch": 6585} {"train_loss": -26.805810928344727, "global_step": 546559, "epoch": 6585} {"train_loss": -26.81648063659668, "global_step": 546560, "epoch": 6585} {"train_loss": -27.16718101501465, "global_step": 546561, "epoch": 6585} {"train_loss": -27.13701820373535, "global_step": 546562, "epoch": 6585} {"train_loss": -27.26161766052246, "global_step": 546563, "epoch": 6585} {"train_loss": -27.103168487548828, "global_step": 546564, "epoch": 6585} {"train_loss": -26.906051635742188, "global_step": 546565, "epoch": 6585} {"train_loss": -27.37502098083496, "global_step": 546566, "epoch": 6585} {"train_loss": -27.180988311767578, "global_step": 546567, "epoch": 6585} {"train_loss": -27.2167911529541, "global_step": 546568, "epoch": 6585} {"train_loss": -27.360212326049805, "global_step": 546569, "epoch": 6585} {"train_loss": -27.374603271484375, "global_step": 546570, "epoch": 6585} {"train_loss": -27.319522857666016, "global_step": 546571, "epoch": 6585} {"train_loss": -27.23334312438965, "global_step": 546572, "epoch": 6585} {"train_loss": -27.1650447845459, "global_step": 546573, "epoch": 6585} {"train_loss": -26.82431411743164, "global_step": 546574, "epoch": 6585} {"train_loss": -27.409387588500977, "global_step": 546575, "epoch": 6585} {"train_loss": -27.65582847595215, "global_step": 546576, "epoch": 6585} {"train_loss": -27.312137603759766, "global_step": 546577, "epoch": 6585} {"train_loss": -27.266828536987305, "global_step": 546578, "epoch": 6585} {"train_loss": -27.66046714782715, "global_step": 546579, "epoch": 6585} {"train_loss": -27.887609481811523, "global_step": 546580, "epoch": 6585} {"train_loss": -27.592954635620117, "global_step": 546581, "epoch": 6585} {"train_loss": -28.056745529174805, "global_step": 546582, "epoch": 6585} {"train_loss": -27.238632202148438, "global_step": 546583, "epoch": 6585} {"train_loss": -27.667999267578125, "global_step": 546584, "epoch": 6585} {"train_loss": -27.56254005432129, "global_step": 546585, "epoch": 6585} {"train_loss": -27.740283966064453, "global_step": 546586, "epoch": 6585} {"train_loss": -27.673852920532227, "global_step": 546587, "epoch": 6585} {"train_loss": -27.088891983032227, "global_step": 546588, "epoch": 6585} {"train_loss": -27.682586669921875, "global_step": 546589, "epoch": 6585} {"train_loss": -27.989582061767578, "global_step": 546590, "epoch": 6585} {"train_loss": -27.5839900970459, "global_step": 546591, "epoch": 6585} {"train_loss": -27.626859664916992, "global_step": 546592, "epoch": 6585} {"train_loss": -27.670331954956055, "global_step": 546593, "epoch": 6585} {"train_loss": -27.88321876525879, "global_step": 546594, "epoch": 6585} {"train_loss": -28.16456413269043, "global_step": 546595, "epoch": 6585} {"train_loss": -27.577590942382812, "global_step": 546596, "epoch": 6585} {"train_loss": -27.940887451171875, "global_step": 546597, "epoch": 6585} {"train_loss": -27.827367782592773, "global_step": 546598, "epoch": 6585} {"train_loss": -27.86972999572754, "global_step": 546599, "epoch": 6585} {"train_loss": -27.657302856445312, "global_step": 546600, "epoch": 6585} {"train_loss": -27.27533531188965, "global_step": 546601, "epoch": 6585} {"train_loss": -27.625104904174805, "global_step": 546602, "epoch": 6585} {"train_loss": -27.70574951171875, "global_step": 546603, "epoch": 6585} {"train_loss": -27.66053581237793, "global_step": 546604, "epoch": 6585} {"train_loss": -27.823974609375, "global_step": 546605, "epoch": 6585} {"train_loss": -27.86345863342285, "global_step": 546606, "epoch": 6585} {"train_loss": -27.930471420288086, "global_step": 546607, "epoch": 6585} {"train_loss": -27.581100463867188, "global_step": 546608, "epoch": 6585} {"train_loss": -27.47394371032715, "global_step": 546609, "epoch": 6585} {"train_loss": -27.803625106811523, "global_step": 546610, "epoch": 6585} {"train_loss": -27.713281631469727, "global_step": 546611, "epoch": 6585} {"train_loss": -27.396839141845703, "global_step": 546612, "epoch": 6585} {"train_loss": -27.819965362548828, "global_step": 546613, "epoch": 6585} {"train_loss": -28.269296646118164, "global_step": 546614, "epoch": 6585} {"train_loss": -27.4180965423584, "global_step": 546615, "epoch": 6585} {"train_loss": -27.471235275268555, "global_step": 546616, "epoch": 6585} {"train_loss": -27.497772216796875, "global_step": 546617, "epoch": 6585} {"train_loss": -27.424779891967773, "global_step": 546618, "epoch": 6585} {"train_loss": -27.753488540649414, "global_step": 546619, "epoch": 6585} {"train_loss": -27.9692440032959, "global_step": 546620, "epoch": 6585} {"train_loss": -27.903959274291992, "global_step": 546621, "epoch": 6585} {"train_loss": -27.4939022064209, "global_step": 546622, "epoch": 6585} {"train_loss": -27.9605770111084, "global_step": 546623, "epoch": 6585} {"train_loss": -27.728546142578125, "global_step": 546624, "epoch": 6585} {"train_loss": -27.7020320892334, "global_step": 546625, "epoch": 6585} {"train_loss": -27.4052677154541, "global_step": 546626, "epoch": 6585} {"train_loss": -27.653074264526367, "global_step": 546627, "epoch": 6585} {"train_loss": -27.92449951171875, "global_step": 546628, "epoch": 6585} {"train_loss": -27.759763717651367, "global_step": 546629, "epoch": 6585} {"train_loss": -28.030561447143555, "global_step": 546630, "epoch": 6585} {"train_loss": -27.685638427734375, "global_step": 546631, "epoch": 6585} {"train_loss": -27.5311336517334, "global_step": 546632, "epoch": 6585} {"train_loss": -27.835840225219727, "global_step": 546633, "epoch": 6585} {"train_loss": -27.786970138549805, "global_step": 546634, "epoch": 6585} {"train_loss": -27.90616226196289, "global_step": 546635, "epoch": 6585} {"train_loss": -28.464054107666016, "global_step": 546636, "epoch": 6585} {"train_loss": -27.54402084810188, "global_step": 546637, "epoch": 6585, "val_loss": 6569590.0} {"train_loss": -26.974225997924805, "global_step": 546638, "epoch": 6586} {"train_loss": -27.266834259033203, "global_step": 546639, "epoch": 6586} {"train_loss": -27.412424087524414, "global_step": 546640, "epoch": 6586} {"train_loss": -27.361257553100586, "global_step": 546641, "epoch": 6586} {"train_loss": -27.720197677612305, "global_step": 546642, "epoch": 6586} {"train_loss": -27.604034423828125, "global_step": 546643, "epoch": 6586} {"train_loss": -27.42424964904785, "global_step": 546644, "epoch": 6586} {"train_loss": -27.854150772094727, "global_step": 546645, "epoch": 6586} {"train_loss": -28.05756187438965, "global_step": 546646, "epoch": 6586} {"train_loss": -27.775461196899414, "global_step": 546647, "epoch": 6586} {"train_loss": -27.188095092773438, "global_step": 546648, "epoch": 6586} {"train_loss": -27.227750778198242, "global_step": 546649, "epoch": 6586} {"train_loss": -27.678319931030273, "global_step": 546650, "epoch": 6586} {"train_loss": -28.042768478393555, "global_step": 546651, "epoch": 6586} {"train_loss": -27.667943954467773, "global_step": 546652, "epoch": 6586} {"train_loss": -27.6580867767334, "global_step": 546653, "epoch": 6586} {"train_loss": -27.61020851135254, "global_step": 546654, "epoch": 6586} {"train_loss": -27.624713897705078, "global_step": 546655, "epoch": 6586} {"train_loss": -27.827619552612305, "global_step": 546656, "epoch": 6586} {"train_loss": -27.8826847076416, "global_step": 546657, "epoch": 6586} {"train_loss": -27.46978187561035, "global_step": 546658, "epoch": 6586} {"train_loss": -28.013427734375, "global_step": 546659, "epoch": 6586} {"train_loss": -27.825885772705078, "global_step": 546660, "epoch": 6586} {"train_loss": -27.61417579650879, "global_step": 546661, "epoch": 6586} {"train_loss": -27.630359649658203, "global_step": 546662, "epoch": 6586} {"train_loss": -27.68132972717285, "global_step": 546663, "epoch": 6586} {"train_loss": -27.515369415283203, "global_step": 546664, "epoch": 6586} {"train_loss": -27.784269332885742, "global_step": 546665, "epoch": 6586} {"train_loss": -27.52967643737793, "global_step": 546666, "epoch": 6586} {"train_loss": -27.820846557617188, "global_step": 546667, "epoch": 6586} {"train_loss": -27.4249210357666, "global_step": 546668, "epoch": 6586} {"train_loss": -27.441450119018555, "global_step": 546669, "epoch": 6586} {"train_loss": -27.53851318359375, "global_step": 546670, "epoch": 6586} {"train_loss": -27.39632225036621, "global_step": 546671, "epoch": 6586} {"train_loss": -27.86233901977539, "global_step": 546672, "epoch": 6586} {"train_loss": -27.569446563720703, "global_step": 546673, "epoch": 6586} {"train_loss": -27.74757194519043, "global_step": 546674, "epoch": 6586} {"train_loss": -27.7332820892334, "global_step": 546675, "epoch": 6586} {"train_loss": -27.680667877197266, "global_step": 546676, "epoch": 6586} {"train_loss": -27.645620346069336, "global_step": 546677, "epoch": 6586} {"train_loss": -27.99114990234375, "global_step": 546678, "epoch": 6586} {"train_loss": -27.97747802734375, "global_step": 546679, "epoch": 6586} {"train_loss": -27.94182777404785, "global_step": 546680, "epoch": 6586} {"train_loss": -28.14755630493164, "global_step": 546681, "epoch": 6586} {"train_loss": -27.95855712890625, "global_step": 546682, "epoch": 6586} {"train_loss": -27.58194923400879, "global_step": 546683, "epoch": 6586} {"train_loss": -27.99830436706543, "global_step": 546684, "epoch": 6586} {"train_loss": -27.708951950073242, "global_step": 546685, "epoch": 6586} {"train_loss": -28.154829025268555, "global_step": 546686, "epoch": 6586} {"train_loss": -27.654760360717773, "global_step": 546687, "epoch": 6586} {"train_loss": -27.926538467407227, "global_step": 546688, "epoch": 6586} {"train_loss": -28.06265640258789, "global_step": 546689, "epoch": 6586} {"train_loss": -27.8904972076416, "global_step": 546690, "epoch": 6586} {"train_loss": -27.618839263916016, "global_step": 546691, "epoch": 6586} {"train_loss": -27.45844841003418, "global_step": 546692, "epoch": 6586} {"train_loss": -27.46185302734375, "global_step": 546693, "epoch": 6586} {"train_loss": -27.706777572631836, "global_step": 546694, "epoch": 6586} {"train_loss": -27.893301010131836, "global_step": 546695, "epoch": 6586} {"train_loss": -27.491592407226562, "global_step": 546696, "epoch": 6586} {"train_loss": -26.85029411315918, "global_step": 546697, "epoch": 6586} {"train_loss": -26.426939010620117, "global_step": 546698, "epoch": 6586} {"train_loss": -27.3499698638916, "global_step": 546699, "epoch": 6586} {"train_loss": -27.45594596862793, "global_step": 546700, "epoch": 6586} {"train_loss": -27.189619064331055, "global_step": 546701, "epoch": 6586} {"train_loss": -27.2603702545166, "global_step": 546702, "epoch": 6586} {"train_loss": -26.785633087158203, "global_step": 546703, "epoch": 6586} {"train_loss": -27.400861740112305, "global_step": 546704, "epoch": 6586} {"train_loss": -27.750051498413086, "global_step": 546705, "epoch": 6586} {"train_loss": -27.7297420501709, "global_step": 546706, "epoch": 6586} {"train_loss": -27.147205352783203, "global_step": 546707, "epoch": 6586} {"train_loss": -27.299835205078125, "global_step": 546708, "epoch": 6586} {"train_loss": -27.745941162109375, "global_step": 546709, "epoch": 6586} {"train_loss": -27.65580177307129, "global_step": 546710, "epoch": 6586} {"train_loss": -27.426837921142578, "global_step": 546711, "epoch": 6586} {"train_loss": -27.65069007873535, "global_step": 546712, "epoch": 6586} {"train_loss": -27.40077781677246, "global_step": 546713, "epoch": 6586} {"train_loss": -27.377710342407227, "global_step": 546714, "epoch": 6586} {"train_loss": -27.06511878967285, "global_step": 546715, "epoch": 6586} {"train_loss": -26.909048080444336, "global_step": 546716, "epoch": 6586} {"train_loss": -27.1069278717041, "global_step": 546717, "epoch": 6586} {"train_loss": -27.618146896362305, "global_step": 546718, "epoch": 6586} {"train_loss": -27.50690269470215, "global_step": 546719, "epoch": 6586} {"train_loss": -27.559169401605445, "global_step": 546720, "epoch": 6586, "val_loss": 6634180.5} {"train_loss": -25.392562866210938, "global_step": 546721, "epoch": 6587} {"train_loss": -26.458948135375977, "global_step": 546722, "epoch": 6587} {"train_loss": -26.48896598815918, "global_step": 546723, "epoch": 6587} {"train_loss": -25.817066192626953, "global_step": 546724, "epoch": 6587} {"train_loss": -26.895389556884766, "global_step": 546725, "epoch": 6587} {"train_loss": -26.1730899810791, "global_step": 546726, "epoch": 6587} {"train_loss": -27.030317306518555, "global_step": 546727, "epoch": 6587} {"train_loss": -26.03765296936035, "global_step": 546728, "epoch": 6587} {"train_loss": -26.85879898071289, "global_step": 546729, "epoch": 6587} {"train_loss": -26.6779727935791, "global_step": 546730, "epoch": 6587} {"train_loss": -26.86524772644043, "global_step": 546731, "epoch": 6587} {"train_loss": -27.071897506713867, "global_step": 546732, "epoch": 6587} {"train_loss": -26.823450088500977, "global_step": 546733, "epoch": 6587} {"train_loss": -27.136987686157227, "global_step": 546734, "epoch": 6587} {"train_loss": -27.120197296142578, "global_step": 546735, "epoch": 6587} {"train_loss": -27.264432907104492, "global_step": 546736, "epoch": 6587} {"train_loss": -27.1592960357666, "global_step": 546737, "epoch": 6587} {"train_loss": -27.26283073425293, "global_step": 546738, "epoch": 6587} {"train_loss": -26.858646392822266, "global_step": 546739, "epoch": 6587} {"train_loss": -27.598546981811523, "global_step": 546740, "epoch": 6587} {"train_loss": -27.466251373291016, "global_step": 546741, "epoch": 6587} {"train_loss": -27.670385360717773, "global_step": 546742, "epoch": 6587} {"train_loss": -27.614852905273438, "global_step": 546743, "epoch": 6587} {"train_loss": -27.64557456970215, "global_step": 546744, "epoch": 6587} {"train_loss": -27.582197189331055, "global_step": 546745, "epoch": 6587} {"train_loss": -27.382761001586914, "global_step": 546746, "epoch": 6587} {"train_loss": -27.381498336791992, "global_step": 546747, "epoch": 6587} {"train_loss": -27.3627986907959, "global_step": 546748, "epoch": 6587} {"train_loss": -27.48847007751465, "global_step": 546749, "epoch": 6587} {"train_loss": -27.519262313842773, "global_step": 546750, "epoch": 6587} {"train_loss": -27.57484245300293, "global_step": 546751, "epoch": 6587} {"train_loss": -27.2338809967041, "global_step": 546752, "epoch": 6587} {"train_loss": -27.79676628112793, "global_step": 546753, "epoch": 6587} {"train_loss": -27.65924644470215, "global_step": 546754, "epoch": 6587} {"train_loss": -27.621551513671875, "global_step": 546755, "epoch": 6587} {"train_loss": -27.998754501342773, "global_step": 546756, "epoch": 6587} {"train_loss": -27.94045066833496, "global_step": 546757, "epoch": 6587} {"train_loss": -27.474287033081055, "global_step": 546758, "epoch": 6587} {"train_loss": -27.72601890563965, "global_step": 546759, "epoch": 6587} {"train_loss": -27.766504287719727, "global_step": 546760, "epoch": 6587} {"train_loss": -27.5784854888916, "global_step": 546761, "epoch": 6587} {"train_loss": -27.764875411987305, "global_step": 546762, "epoch": 6587} {"train_loss": -27.8515682220459, "global_step": 546763, "epoch": 6587} {"train_loss": -27.418292999267578, "global_step": 546764, "epoch": 6587} {"train_loss": -27.545129776000977, "global_step": 546765, "epoch": 6587} {"train_loss": -27.88888931274414, "global_step": 546766, "epoch": 6587} {"train_loss": -28.018125534057617, "global_step": 546767, "epoch": 6587} {"train_loss": -28.154470443725586, "global_step": 546768, "epoch": 6587} {"train_loss": -27.90349769592285, "global_step": 546769, "epoch": 6587} {"train_loss": -27.751489639282227, "global_step": 546770, "epoch": 6587} {"train_loss": -27.6978759765625, "global_step": 546771, "epoch": 6587} {"train_loss": -27.36736488342285, "global_step": 546772, "epoch": 6587} {"train_loss": -27.17596435546875, "global_step": 546773, "epoch": 6587} {"train_loss": -27.689441680908203, "global_step": 546774, "epoch": 6587} {"train_loss": -27.500146865844727, "global_step": 546775, "epoch": 6587} {"train_loss": -27.603809356689453, "global_step": 546776, "epoch": 6587} {"train_loss": -27.514408111572266, "global_step": 546777, "epoch": 6587} {"train_loss": -27.510101318359375, "global_step": 546778, "epoch": 6587} {"train_loss": -26.8636531829834, "global_step": 546779, "epoch": 6587} {"train_loss": -27.601245880126953, "global_step": 546780, "epoch": 6587} {"train_loss": -27.627609252929688, "global_step": 546781, "epoch": 6587} {"train_loss": -27.745153427124023, "global_step": 546782, "epoch": 6587} {"train_loss": -27.82649803161621, "global_step": 546783, "epoch": 6587} {"train_loss": -27.588672637939453, "global_step": 546784, "epoch": 6587} {"train_loss": -27.105548858642578, "global_step": 546785, "epoch": 6587} {"train_loss": -27.81532096862793, "global_step": 546786, "epoch": 6587} {"train_loss": -27.502094268798828, "global_step": 546787, "epoch": 6587} {"train_loss": -27.849836349487305, "global_step": 546788, "epoch": 6587} {"train_loss": -28.1545352935791, "global_step": 546789, "epoch": 6587} {"train_loss": -27.635547637939453, "global_step": 546790, "epoch": 6587} {"train_loss": -27.7999210357666, "global_step": 546791, "epoch": 6587} {"train_loss": -27.487934112548828, "global_step": 546792, "epoch": 6587} {"train_loss": -28.05220603942871, "global_step": 546793, "epoch": 6587} {"train_loss": -27.864700317382812, "global_step": 546794, "epoch": 6587} {"train_loss": -27.874876022338867, "global_step": 546795, "epoch": 6587} {"train_loss": -27.818683624267578, "global_step": 546796, "epoch": 6587} {"train_loss": -27.7484130859375, "global_step": 546797, "epoch": 6587} {"train_loss": -27.86726188659668, "global_step": 546798, "epoch": 6587} {"train_loss": -27.605558395385742, "global_step": 546799, "epoch": 6587} {"train_loss": -27.94622802734375, "global_step": 546800, "epoch": 6587} {"train_loss": -28.0496826171875, "global_step": 546801, "epoch": 6587} {"train_loss": -27.9595890045166, "global_step": 546802, "epoch": 6587} {"train_loss": -27.428844153162945, "global_step": 546803, "epoch": 6587, "val_loss": 6469278.0} {"train_loss": -27.052038192749023, "global_step": 546804, "epoch": 6588} {"train_loss": -26.84906005859375, "global_step": 546805, "epoch": 6588} {"train_loss": -27.233118057250977, "global_step": 546806, "epoch": 6588} {"train_loss": -27.274133682250977, "global_step": 546807, "epoch": 6588} {"train_loss": -27.423791885375977, "global_step": 546808, "epoch": 6588} {"train_loss": -27.557575225830078, "global_step": 546809, "epoch": 6588} {"train_loss": -27.409833908081055, "global_step": 546810, "epoch": 6588} {"train_loss": -27.428760528564453, "global_step": 546811, "epoch": 6588} {"train_loss": -27.596471786499023, "global_step": 546812, "epoch": 6588} {"train_loss": -27.817548751831055, "global_step": 546813, "epoch": 6588} {"train_loss": -27.3112850189209, "global_step": 546814, "epoch": 6588} {"train_loss": -27.556034088134766, "global_step": 546815, "epoch": 6588} {"train_loss": -27.6715087890625, "global_step": 546816, "epoch": 6588} {"train_loss": -27.492324829101562, "global_step": 546817, "epoch": 6588} {"train_loss": -27.339130401611328, "global_step": 546818, "epoch": 6588} {"train_loss": -27.644941329956055, "global_step": 546819, "epoch": 6588} {"train_loss": -27.76095962524414, "global_step": 546820, "epoch": 6588} {"train_loss": -27.203088760375977, "global_step": 546821, "epoch": 6588} {"train_loss": -27.580060958862305, "global_step": 546822, "epoch": 6588} {"train_loss": -27.708051681518555, "global_step": 546823, "epoch": 6588} {"train_loss": -27.548185348510742, "global_step": 546824, "epoch": 6588} {"train_loss": -27.584918975830078, "global_step": 546825, "epoch": 6588} {"train_loss": -27.891279220581055, "global_step": 546826, "epoch": 6588} {"train_loss": -27.434650421142578, "global_step": 546827, "epoch": 6588} {"train_loss": -27.783008575439453, "global_step": 546828, "epoch": 6588} {"train_loss": -27.73431968688965, "global_step": 546829, "epoch": 6588} {"train_loss": -27.716581344604492, "global_step": 546830, "epoch": 6588} {"train_loss": -27.6249942779541, "global_step": 546831, "epoch": 6588} {"train_loss": -27.402973175048828, "global_step": 546832, "epoch": 6588} {"train_loss": -27.397628784179688, "global_step": 546833, "epoch": 6588} {"train_loss": -27.72022819519043, "global_step": 546834, "epoch": 6588} {"train_loss": -28.0201358795166, "global_step": 546835, "epoch": 6588} {"train_loss": -27.876041412353516, "global_step": 546836, "epoch": 6588} {"train_loss": -27.977399826049805, "global_step": 546837, "epoch": 6588} {"train_loss": -27.654165267944336, "global_step": 546838, "epoch": 6588} {"train_loss": -27.83831787109375, "global_step": 546839, "epoch": 6588} {"train_loss": -27.97393226623535, "global_step": 546840, "epoch": 6588} {"train_loss": -27.740137100219727, "global_step": 546841, "epoch": 6588} {"train_loss": -27.779882431030273, "global_step": 546842, "epoch": 6588} {"train_loss": -27.943561553955078, "global_step": 546843, "epoch": 6588} {"train_loss": -27.96973991394043, "global_step": 546844, "epoch": 6588} {"train_loss": -28.12786865234375, "global_step": 546845, "epoch": 6588} {"train_loss": -27.500537872314453, "global_step": 546846, "epoch": 6588} {"train_loss": -27.9638671875, "global_step": 546847, "epoch": 6588} {"train_loss": -27.948410034179688, "global_step": 546848, "epoch": 6588} {"train_loss": -27.954303741455078, "global_step": 546849, "epoch": 6588} {"train_loss": -27.58154296875, "global_step": 546850, "epoch": 6588} {"train_loss": -27.378131866455078, "global_step": 546851, "epoch": 6588} {"train_loss": -26.78346061706543, "global_step": 546852, "epoch": 6588} {"train_loss": -26.921478271484375, "global_step": 546853, "epoch": 6588} {"train_loss": -27.662994384765625, "global_step": 546854, "epoch": 6588} {"train_loss": -27.80707359313965, "global_step": 546855, "epoch": 6588} {"train_loss": -27.72125244140625, "global_step": 546856, "epoch": 6588} {"train_loss": -27.925256729125977, "global_step": 546857, "epoch": 6588} {"train_loss": -27.823291778564453, "global_step": 546858, "epoch": 6588} {"train_loss": -27.606159210205078, "global_step": 546859, "epoch": 6588} {"train_loss": -27.627477645874023, "global_step": 546860, "epoch": 6588} {"train_loss": -28.001569747924805, "global_step": 546861, "epoch": 6588} {"train_loss": -27.487829208374023, "global_step": 546862, "epoch": 6588} {"train_loss": -27.4161319732666, "global_step": 546863, "epoch": 6588} {"train_loss": -27.40506362915039, "global_step": 546864, "epoch": 6588} {"train_loss": -27.573444366455078, "global_step": 546865, "epoch": 6588} {"train_loss": -27.878625869750977, "global_step": 546866, "epoch": 6588} {"train_loss": -27.498132705688477, "global_step": 546867, "epoch": 6588} {"train_loss": -27.77215003967285, "global_step": 546868, "epoch": 6588} {"train_loss": -27.841421127319336, "global_step": 546869, "epoch": 6588} {"train_loss": -27.605682373046875, "global_step": 546870, "epoch": 6588} {"train_loss": -27.955810546875, "global_step": 546871, "epoch": 6588} {"train_loss": -27.72327995300293, "global_step": 546872, "epoch": 6588} {"train_loss": -27.93099021911621, "global_step": 546873, "epoch": 6588} {"train_loss": -27.80208396911621, "global_step": 546874, "epoch": 6588} {"train_loss": -27.78385353088379, "global_step": 546875, "epoch": 6588} {"train_loss": -28.130041122436523, "global_step": 546876, "epoch": 6588} {"train_loss": -27.968225479125977, "global_step": 546877, "epoch": 6588} {"train_loss": -28.343358993530273, "global_step": 546878, "epoch": 6588} {"train_loss": -27.602951049804688, "global_step": 546879, "epoch": 6588} {"train_loss": -27.9805850982666, "global_step": 546880, "epoch": 6588} {"train_loss": -27.976720809936523, "global_step": 546881, "epoch": 6588} {"train_loss": -27.674560546875, "global_step": 546882, "epoch": 6588} {"train_loss": -27.603378295898438, "global_step": 546883, "epoch": 6588} {"train_loss": -27.755155563354492, "global_step": 546884, "epoch": 6588} {"train_loss": -27.340362548828125, "global_step": 546885, "epoch": 6588} {"train_loss": -27.66370012673987, "global_step": 546886, "epoch": 6588, "val_loss": 6576371.0} {"train_loss": -27.362060546875, "global_step": 546887, "epoch": 6589} {"train_loss": -26.127363204956055, "global_step": 546888, "epoch": 6589} {"train_loss": -25.03499984741211, "global_step": 546889, "epoch": 6589} {"train_loss": -25.52878761291504, "global_step": 546890, "epoch": 6589} {"train_loss": -26.7296085357666, "global_step": 546891, "epoch": 6589} {"train_loss": -27.40976333618164, "global_step": 546892, "epoch": 6589} {"train_loss": -26.56361198425293, "global_step": 546893, "epoch": 6589} {"train_loss": -27.270706176757812, "global_step": 546894, "epoch": 6589} {"train_loss": -26.88701820373535, "global_step": 546895, "epoch": 6589} {"train_loss": -27.010284423828125, "global_step": 546896, "epoch": 6589} {"train_loss": -26.700422286987305, "global_step": 546897, "epoch": 6589} {"train_loss": -27.488849639892578, "global_step": 546898, "epoch": 6589} {"train_loss": -27.109130859375, "global_step": 546899, "epoch": 6589} {"train_loss": -27.23566246032715, "global_step": 546900, "epoch": 6589} {"train_loss": -27.3057804107666, "global_step": 546901, "epoch": 6589} {"train_loss": -27.054288864135742, "global_step": 546902, "epoch": 6589} {"train_loss": -27.3247127532959, "global_step": 546903, "epoch": 6589} {"train_loss": -27.41533851623535, "global_step": 546904, "epoch": 6589} {"train_loss": -27.274900436401367, "global_step": 546905, "epoch": 6589} {"train_loss": -27.64619255065918, "global_step": 546906, "epoch": 6589} {"train_loss": -27.50299072265625, "global_step": 546907, "epoch": 6589} {"train_loss": -27.320743560791016, "global_step": 546908, "epoch": 6589} {"train_loss": -27.40406608581543, "global_step": 546909, "epoch": 6589} {"train_loss": -27.027158737182617, "global_step": 546910, "epoch": 6589} {"train_loss": -27.70728874206543, "global_step": 546911, "epoch": 6589} {"train_loss": -27.336469650268555, "global_step": 546912, "epoch": 6589} {"train_loss": -28.032358169555664, "global_step": 546913, "epoch": 6589} {"train_loss": -27.425939559936523, "global_step": 546914, "epoch": 6589} {"train_loss": -27.644306182861328, "global_step": 546915, "epoch": 6589} {"train_loss": -27.565540313720703, "global_step": 546916, "epoch": 6589} {"train_loss": -27.524444580078125, "global_step": 546917, "epoch": 6589} {"train_loss": -27.717960357666016, "global_step": 546918, "epoch": 6589} {"train_loss": -27.602441787719727, "global_step": 546919, "epoch": 6589} {"train_loss": -27.5446720123291, "global_step": 546920, "epoch": 6589} {"train_loss": -27.774396896362305, "global_step": 546921, "epoch": 6589} {"train_loss": -27.8236083984375, "global_step": 546922, "epoch": 6589} {"train_loss": -27.504575729370117, "global_step": 546923, "epoch": 6589} {"train_loss": -27.707141876220703, "global_step": 546924, "epoch": 6589} {"train_loss": -27.852136611938477, "global_step": 546925, "epoch": 6589} {"train_loss": -27.7969913482666, "global_step": 546926, "epoch": 6589} {"train_loss": -27.766286849975586, "global_step": 546927, "epoch": 6589} {"train_loss": -27.84942054748535, "global_step": 546928, "epoch": 6589} {"train_loss": -27.751941680908203, "global_step": 546929, "epoch": 6589} {"train_loss": -27.891279220581055, "global_step": 546930, "epoch": 6589} {"train_loss": -27.839147567749023, "global_step": 546931, "epoch": 6589} {"train_loss": -27.768884658813477, "global_step": 546932, "epoch": 6589} {"train_loss": -27.710498809814453, "global_step": 546933, "epoch": 6589} {"train_loss": -28.12471580505371, "global_step": 546934, "epoch": 6589} {"train_loss": -28.045251846313477, "global_step": 546935, "epoch": 6589} {"train_loss": -27.945053100585938, "global_step": 546936, "epoch": 6589} {"train_loss": -27.686573028564453, "global_step": 546937, "epoch": 6589} {"train_loss": -27.97037696838379, "global_step": 546938, "epoch": 6589} {"train_loss": -27.609296798706055, "global_step": 546939, "epoch": 6589} {"train_loss": -27.841638565063477, "global_step": 546940, "epoch": 6589} {"train_loss": -27.639753341674805, "global_step": 546941, "epoch": 6589} {"train_loss": -28.062332153320312, "global_step": 546942, "epoch": 6589} {"train_loss": -27.9794979095459, "global_step": 546943, "epoch": 6589} {"train_loss": -27.780624389648438, "global_step": 546944, "epoch": 6589} {"train_loss": -27.577991485595703, "global_step": 546945, "epoch": 6589} {"train_loss": -27.642362594604492, "global_step": 546946, "epoch": 6589} {"train_loss": -28.278491973876953, "global_step": 546947, "epoch": 6589} {"train_loss": -27.623910903930664, "global_step": 546948, "epoch": 6589} {"train_loss": -27.88299560546875, "global_step": 546949, "epoch": 6589} {"train_loss": -27.66322898864746, "global_step": 546950, "epoch": 6589} {"train_loss": -27.73223304748535, "global_step": 546951, "epoch": 6589} {"train_loss": -27.853620529174805, "global_step": 546952, "epoch": 6589} {"train_loss": -27.46907615661621, "global_step": 546953, "epoch": 6589} {"train_loss": -27.915679931640625, "global_step": 546954, "epoch": 6589} {"train_loss": -28.02308464050293, "global_step": 546955, "epoch": 6589} {"train_loss": -27.983383178710938, "global_step": 546956, "epoch": 6589} {"train_loss": -27.715606689453125, "global_step": 546957, "epoch": 6589} {"train_loss": -27.995447158813477, "global_step": 546958, "epoch": 6589} {"train_loss": -27.284881591796875, "global_step": 546959, "epoch": 6589} {"train_loss": -27.9537410736084, "global_step": 546960, "epoch": 6589} {"train_loss": -27.223052978515625, "global_step": 546961, "epoch": 6589} {"train_loss": -27.686933517456055, "global_step": 546962, "epoch": 6589} {"train_loss": -27.929147720336914, "global_step": 546963, "epoch": 6589} {"train_loss": -27.979461669921875, "global_step": 546964, "epoch": 6589} {"train_loss": -27.49911880493164, "global_step": 546965, "epoch": 6589} {"train_loss": -27.97381591796875, "global_step": 546966, "epoch": 6589} {"train_loss": -27.61655044555664, "global_step": 546967, "epoch": 6589} {"train_loss": -27.88709831237793, "global_step": 546968, "epoch": 6589} {"train_loss": -27.53815074139331, "global_step": 546969, "epoch": 6589, "val_loss": 6588795.5} {"train_loss": -27.110931396484375, "global_step": 546970, "epoch": 6590} {"train_loss": -26.27532386779785, "global_step": 546971, "epoch": 6590} {"train_loss": -25.938236236572266, "global_step": 546972, "epoch": 6590} {"train_loss": -25.472732543945312, "global_step": 546973, "epoch": 6590} {"train_loss": -25.459314346313477, "global_step": 546974, "epoch": 6590} {"train_loss": -26.9133358001709, "global_step": 546975, "epoch": 6590} {"train_loss": -26.27579689025879, "global_step": 546976, "epoch": 6590} {"train_loss": -26.894269943237305, "global_step": 546977, "epoch": 6590} {"train_loss": -26.85114097595215, "global_step": 546978, "epoch": 6590} {"train_loss": -27.47125816345215, "global_step": 546979, "epoch": 6590} {"train_loss": -26.95987319946289, "global_step": 546980, "epoch": 6590} {"train_loss": -26.95166015625, "global_step": 546981, "epoch": 6590} {"train_loss": -26.990142822265625, "global_step": 546982, "epoch": 6590} {"train_loss": -26.994775772094727, "global_step": 546983, "epoch": 6590} {"train_loss": -27.18451499938965, "global_step": 546984, "epoch": 6590} {"train_loss": -27.049753189086914, "global_step": 546985, "epoch": 6590} {"train_loss": -27.17291831970215, "global_step": 546986, "epoch": 6590} {"train_loss": -27.364215850830078, "global_step": 546987, "epoch": 6590} {"train_loss": -27.38185691833496, "global_step": 546988, "epoch": 6590} {"train_loss": -27.559579849243164, "global_step": 546989, "epoch": 6590} {"train_loss": -27.40203285217285, "global_step": 546990, "epoch": 6590} {"train_loss": -27.432905197143555, "global_step": 546991, "epoch": 6590} {"train_loss": -27.772449493408203, "global_step": 546992, "epoch": 6590} {"train_loss": -26.9658145904541, "global_step": 546993, "epoch": 6590} {"train_loss": -27.312414169311523, "global_step": 546994, "epoch": 6590} {"train_loss": -27.655685424804688, "global_step": 546995, "epoch": 6590} {"train_loss": -27.634504318237305, "global_step": 546996, "epoch": 6590} {"train_loss": -27.49407958984375, "global_step": 546997, "epoch": 6590} {"train_loss": -27.68587303161621, "global_step": 546998, "epoch": 6590} {"train_loss": -27.663415908813477, "global_step": 546999, "epoch": 6590} {"train_loss": -27.771894454956055, "global_step": 547000, "epoch": 6590} {"train_loss": -27.62127113342285, "global_step": 547001, "epoch": 6590} {"train_loss": -27.504688262939453, "global_step": 547002, "epoch": 6590} {"train_loss": -27.76190185546875, "global_step": 547003, "epoch": 6590} {"train_loss": -27.640247344970703, "global_step": 547004, "epoch": 6590} {"train_loss": -27.839506149291992, "global_step": 547005, "epoch": 6590} {"train_loss": -27.719131469726562, "global_step": 547006, "epoch": 6590} {"train_loss": -27.462186813354492, "global_step": 547007, "epoch": 6590} {"train_loss": -28.025543212890625, "global_step": 547008, "epoch": 6590} {"train_loss": -27.56036949157715, "global_step": 547009, "epoch": 6590} {"train_loss": -27.418371200561523, "global_step": 547010, "epoch": 6590} {"train_loss": -28.069644927978516, "global_step": 547011, "epoch": 6590} {"train_loss": -27.64887809753418, "global_step": 547012, "epoch": 6590} {"train_loss": -27.782678604125977, "global_step": 547013, "epoch": 6590} {"train_loss": -27.66798210144043, "global_step": 547014, "epoch": 6590} {"train_loss": -27.86948013305664, "global_step": 547015, "epoch": 6590} {"train_loss": -27.84539794921875, "global_step": 547016, "epoch": 6590} {"train_loss": -28.008243560791016, "global_step": 547017, "epoch": 6590} {"train_loss": -27.656965255737305, "global_step": 547018, "epoch": 6590} {"train_loss": -27.979114532470703, "global_step": 547019, "epoch": 6590} {"train_loss": -27.634113311767578, "global_step": 547020, "epoch": 6590} {"train_loss": -27.956602096557617, "global_step": 547021, "epoch": 6590} {"train_loss": -27.816207885742188, "global_step": 547022, "epoch": 6590} {"train_loss": -27.892438888549805, "global_step": 547023, "epoch": 6590} {"train_loss": -28.156513214111328, "global_step": 547024, "epoch": 6590} {"train_loss": -27.8143310546875, "global_step": 547025, "epoch": 6590} {"train_loss": -27.841833114624023, "global_step": 547026, "epoch": 6590} {"train_loss": -28.0531063079834, "global_step": 547027, "epoch": 6590} {"train_loss": -27.7997989654541, "global_step": 547028, "epoch": 6590} {"train_loss": -28.082172393798828, "global_step": 547029, "epoch": 6590} {"train_loss": -28.18769645690918, "global_step": 547030, "epoch": 6590} {"train_loss": -27.98202896118164, "global_step": 547031, "epoch": 6590} {"train_loss": -27.552356719970703, "global_step": 547032, "epoch": 6590} {"train_loss": -28.12660026550293, "global_step": 547033, "epoch": 6590} {"train_loss": -27.537267684936523, "global_step": 547034, "epoch": 6590} {"train_loss": -27.617589950561523, "global_step": 547035, "epoch": 6590} {"train_loss": -27.527862548828125, "global_step": 547036, "epoch": 6590} {"train_loss": -28.006315231323242, "global_step": 547037, "epoch": 6590} {"train_loss": -27.501209259033203, "global_step": 547038, "epoch": 6590} {"train_loss": -27.624414443969727, "global_step": 547039, "epoch": 6590} {"train_loss": -27.794336318969727, "global_step": 547040, "epoch": 6590} {"train_loss": -27.731748580932617, "global_step": 547041, "epoch": 6590} {"train_loss": -27.380905151367188, "global_step": 547042, "epoch": 6590} {"train_loss": -27.41339111328125, "global_step": 547043, "epoch": 6590} {"train_loss": -27.21445083618164, "global_step": 547044, "epoch": 6590} {"train_loss": -27.732202529907227, "global_step": 547045, "epoch": 6590} {"train_loss": -27.69843101501465, "global_step": 547046, "epoch": 6590} {"train_loss": -27.899030685424805, "global_step": 547047, "epoch": 6590} {"train_loss": -27.382200241088867, "global_step": 547048, "epoch": 6590} {"train_loss": -27.8761043548584, "global_step": 547049, "epoch": 6590} {"train_loss": -27.51242446899414, "global_step": 547050, "epoch": 6590} {"train_loss": -27.62470817565918, "global_step": 547051, "epoch": 6590} {"train_loss": -27.5004407124347, "global_step": 547052, "epoch": 6590, "val_loss": 6543611.0} {"train_loss": -26.988636016845703, "global_step": 547053, "epoch": 6591} {"train_loss": -27.228199005126953, "global_step": 547054, "epoch": 6591} {"train_loss": -27.13604736328125, "global_step": 547055, "epoch": 6591} {"train_loss": -27.40866470336914, "global_step": 547056, "epoch": 6591} {"train_loss": -27.24225425720215, "global_step": 547057, "epoch": 6591} {"train_loss": -27.37822914123535, "global_step": 547058, "epoch": 6591} {"train_loss": -27.242752075195312, "global_step": 547059, "epoch": 6591} {"train_loss": -27.32549476623535, "global_step": 547060, "epoch": 6591} {"train_loss": -27.204504013061523, "global_step": 547061, "epoch": 6591} {"train_loss": -27.243886947631836, "global_step": 547062, "epoch": 6591} {"train_loss": -27.3786678314209, "global_step": 547063, "epoch": 6591} {"train_loss": -27.31855583190918, "global_step": 547064, "epoch": 6591} {"train_loss": -27.351987838745117, "global_step": 547065, "epoch": 6591} {"train_loss": -27.306121826171875, "global_step": 547066, "epoch": 6591} {"train_loss": -27.227895736694336, "global_step": 547067, "epoch": 6591} {"train_loss": -27.239368438720703, "global_step": 547068, "epoch": 6591} {"train_loss": -27.77972412109375, "global_step": 547069, "epoch": 6591} {"train_loss": -27.407068252563477, "global_step": 547070, "epoch": 6591} {"train_loss": -27.190261840820312, "global_step": 547071, "epoch": 6591} {"train_loss": -27.8896427154541, "global_step": 547072, "epoch": 6591} {"train_loss": -27.417434692382812, "global_step": 547073, "epoch": 6591} {"train_loss": -27.69410514831543, "global_step": 547074, "epoch": 6591} {"train_loss": -27.22980308532715, "global_step": 547075, "epoch": 6591} {"train_loss": -27.3863468170166, "global_step": 547076, "epoch": 6591} {"train_loss": -27.59107780456543, "global_step": 547077, "epoch": 6591} {"train_loss": -27.7182674407959, "global_step": 547078, "epoch": 6591} {"train_loss": -27.70037841796875, "global_step": 547079, "epoch": 6591} {"train_loss": -27.60092544555664, "global_step": 547080, "epoch": 6591} {"train_loss": -27.878644943237305, "global_step": 547081, "epoch": 6591} {"train_loss": -27.628881454467773, "global_step": 547082, "epoch": 6591} {"train_loss": -27.7551326751709, "global_step": 547083, "epoch": 6591} {"train_loss": -27.532529830932617, "global_step": 547084, "epoch": 6591} {"train_loss": -27.813405990600586, "global_step": 547085, "epoch": 6591} {"train_loss": -27.554981231689453, "global_step": 547086, "epoch": 6591} {"train_loss": -27.629959106445312, "global_step": 547087, "epoch": 6591} {"train_loss": -27.633255004882812, "global_step": 547088, "epoch": 6591} {"train_loss": -27.348529815673828, "global_step": 547089, "epoch": 6591} {"train_loss": -27.69186782836914, "global_step": 547090, "epoch": 6591} {"train_loss": -27.878671646118164, "global_step": 547091, "epoch": 6591} {"train_loss": -27.367237091064453, "global_step": 547092, "epoch": 6591} {"train_loss": -27.75349235534668, "global_step": 547093, "epoch": 6591} {"train_loss": -27.510787963867188, "global_step": 547094, "epoch": 6591} {"train_loss": -27.839563369750977, "global_step": 547095, "epoch": 6591} {"train_loss": -27.7054500579834, "global_step": 547096, "epoch": 6591} {"train_loss": -28.042654037475586, "global_step": 547097, "epoch": 6591} {"train_loss": -27.737653732299805, "global_step": 547098, "epoch": 6591} {"train_loss": -27.277673721313477, "global_step": 547099, "epoch": 6591} {"train_loss": -27.739408493041992, "global_step": 547100, "epoch": 6591} {"train_loss": -28.289779663085938, "global_step": 547101, "epoch": 6591} {"train_loss": -28.00693702697754, "global_step": 547102, "epoch": 6591} {"train_loss": -27.56776237487793, "global_step": 547103, "epoch": 6591} {"train_loss": -27.724695205688477, "global_step": 547104, "epoch": 6591} {"train_loss": -27.73939323425293, "global_step": 547105, "epoch": 6591} {"train_loss": -27.98394775390625, "global_step": 547106, "epoch": 6591} {"train_loss": -27.986902236938477, "global_step": 547107, "epoch": 6591} {"train_loss": -28.038049697875977, "global_step": 547108, "epoch": 6591} {"train_loss": -27.001386642456055, "global_step": 547109, "epoch": 6591} {"train_loss": -27.431549072265625, "global_step": 547110, "epoch": 6591} {"train_loss": -27.976171493530273, "global_step": 547111, "epoch": 6591} {"train_loss": -27.115711212158203, "global_step": 547112, "epoch": 6591} {"train_loss": -26.887928009033203, "global_step": 547113, "epoch": 6591} {"train_loss": -27.554920196533203, "global_step": 547114, "epoch": 6591} {"train_loss": -26.9327392578125, "global_step": 547115, "epoch": 6591} {"train_loss": -27.71900749206543, "global_step": 547116, "epoch": 6591} {"train_loss": -27.699819564819336, "global_step": 547117, "epoch": 6591} {"train_loss": -27.51275062561035, "global_step": 547118, "epoch": 6591} {"train_loss": -27.30450439453125, "global_step": 547119, "epoch": 6591} {"train_loss": -27.713001251220703, "global_step": 547120, "epoch": 6591} {"train_loss": -27.55446434020996, "global_step": 547121, "epoch": 6591} {"train_loss": -27.752683639526367, "global_step": 547122, "epoch": 6591} {"train_loss": -27.5562686920166, "global_step": 547123, "epoch": 6591} {"train_loss": -27.531497955322266, "global_step": 547124, "epoch": 6591} {"train_loss": -27.84766960144043, "global_step": 547125, "epoch": 6591} {"train_loss": -27.584308624267578, "global_step": 547126, "epoch": 6591} {"train_loss": -27.240819931030273, "global_step": 547127, "epoch": 6591} {"train_loss": -27.7594051361084, "global_step": 547128, "epoch": 6591} {"train_loss": -27.66940689086914, "global_step": 547129, "epoch": 6591} {"train_loss": -27.559186935424805, "global_step": 547130, "epoch": 6591} {"train_loss": -27.923969268798828, "global_step": 547131, "epoch": 6591} {"train_loss": -27.89996337890625, "global_step": 547132, "epoch": 6591} {"train_loss": -27.609567642211914, "global_step": 547133, "epoch": 6591} {"train_loss": -27.859256744384766, "global_step": 547134, "epoch": 6591} {"train_loss": -27.550307262374695, "global_step": 547135, "epoch": 6591, "val_loss": 6565812.5} {"train_loss": -27.825042724609375, "global_step": 547136, "epoch": 6592} {"train_loss": -27.7484188079834, "global_step": 547137, "epoch": 6592} {"train_loss": -27.78424072265625, "global_step": 547138, "epoch": 6592} {"train_loss": -27.371826171875, "global_step": 547139, "epoch": 6592} {"train_loss": -27.215543746948242, "global_step": 547140, "epoch": 6592} {"train_loss": -27.420028686523438, "global_step": 547141, "epoch": 6592} {"train_loss": -27.51102638244629, "global_step": 547142, "epoch": 6592} {"train_loss": -27.734832763671875, "global_step": 547143, "epoch": 6592} {"train_loss": -27.689422607421875, "global_step": 547144, "epoch": 6592} {"train_loss": -27.754514694213867, "global_step": 547145, "epoch": 6592} {"train_loss": -27.350778579711914, "global_step": 547146, "epoch": 6592} {"train_loss": -27.8425350189209, "global_step": 547147, "epoch": 6592} {"train_loss": -27.344018936157227, "global_step": 547148, "epoch": 6592} {"train_loss": -27.552703857421875, "global_step": 547149, "epoch": 6592} {"train_loss": -27.64564323425293, "global_step": 547150, "epoch": 6592} {"train_loss": -27.435937881469727, "global_step": 547151, "epoch": 6592} {"train_loss": -27.429479598999023, "global_step": 547152, "epoch": 6592} {"train_loss": -27.737085342407227, "global_step": 547153, "epoch": 6592} {"train_loss": -27.6281795501709, "global_step": 547154, "epoch": 6592} {"train_loss": -27.812543869018555, "global_step": 547155, "epoch": 6592} {"train_loss": -27.735464096069336, "global_step": 547156, "epoch": 6592} {"train_loss": -27.684234619140625, "global_step": 547157, "epoch": 6592} {"train_loss": -27.498193740844727, "global_step": 547158, "epoch": 6592} {"train_loss": -27.463937759399414, "global_step": 547159, "epoch": 6592} {"train_loss": -27.565649032592773, "global_step": 547160, "epoch": 6592} {"train_loss": -27.380023956298828, "global_step": 547161, "epoch": 6592} {"train_loss": -27.469099044799805, "global_step": 547162, "epoch": 6592} {"train_loss": -27.246728897094727, "global_step": 547163, "epoch": 6592} {"train_loss": -27.514196395874023, "global_step": 547164, "epoch": 6592} {"train_loss": -27.293384552001953, "global_step": 547165, "epoch": 6592} {"train_loss": -27.804452896118164, "global_step": 547166, "epoch": 6592} {"train_loss": -27.912830352783203, "global_step": 547167, "epoch": 6592} {"train_loss": -27.992008209228516, "global_step": 547168, "epoch": 6592} {"train_loss": -27.588287353515625, "global_step": 547169, "epoch": 6592} {"train_loss": -27.84809684753418, "global_step": 547170, "epoch": 6592} {"train_loss": -28.014297485351562, "global_step": 547171, "epoch": 6592} {"train_loss": -28.063852310180664, "global_step": 547172, "epoch": 6592} {"train_loss": -27.610355377197266, "global_step": 547173, "epoch": 6592} {"train_loss": -27.963367462158203, "global_step": 547174, "epoch": 6592} {"train_loss": -27.572467803955078, "global_step": 547175, "epoch": 6592} {"train_loss": -27.536436080932617, "global_step": 547176, "epoch": 6592} {"train_loss": -27.680810928344727, "global_step": 547177, "epoch": 6592} {"train_loss": -28.06465721130371, "global_step": 547178, "epoch": 6592} {"train_loss": -27.72108268737793, "global_step": 547179, "epoch": 6592} {"train_loss": -27.735137939453125, "global_step": 547180, "epoch": 6592} {"train_loss": -28.334814071655273, "global_step": 547181, "epoch": 6592} {"train_loss": -28.195417404174805, "global_step": 547182, "epoch": 6592} {"train_loss": -27.883787155151367, "global_step": 547183, "epoch": 6592} {"train_loss": -27.933393478393555, "global_step": 547184, "epoch": 6592} {"train_loss": -28.031280517578125, "global_step": 547185, "epoch": 6592} {"train_loss": -28.04306411743164, "global_step": 547186, "epoch": 6592} {"train_loss": -28.110044479370117, "global_step": 547187, "epoch": 6592} {"train_loss": -28.02227783203125, "global_step": 547188, "epoch": 6592} {"train_loss": -27.668500900268555, "global_step": 547189, "epoch": 6592} {"train_loss": -28.20762062072754, "global_step": 547190, "epoch": 6592} {"train_loss": -27.705657958984375, "global_step": 547191, "epoch": 6592} {"train_loss": -27.8002986907959, "global_step": 547192, "epoch": 6592} {"train_loss": -27.618032455444336, "global_step": 547193, "epoch": 6592} {"train_loss": -27.90254020690918, "global_step": 547194, "epoch": 6592} {"train_loss": -27.65546226501465, "global_step": 547195, "epoch": 6592} {"train_loss": -27.416706085205078, "global_step": 547196, "epoch": 6592} {"train_loss": -27.42024803161621, "global_step": 547197, "epoch": 6592} {"train_loss": -27.4211368560791, "global_step": 547198, "epoch": 6592} {"train_loss": -27.870996475219727, "global_step": 547199, "epoch": 6592} {"train_loss": -27.5533447265625, "global_step": 547200, "epoch": 6592} {"train_loss": -28.05217933654785, "global_step": 547201, "epoch": 6592} {"train_loss": -27.7585391998291, "global_step": 547202, "epoch": 6592} {"train_loss": -27.31353187561035, "global_step": 547203, "epoch": 6592} {"train_loss": -27.020843505859375, "global_step": 547204, "epoch": 6592} {"train_loss": -27.076568603515625, "global_step": 547205, "epoch": 6592} {"train_loss": -27.690505981445312, "global_step": 547206, "epoch": 6592} {"train_loss": -27.841543197631836, "global_step": 547207, "epoch": 6592} {"train_loss": -27.173192977905273, "global_step": 547208, "epoch": 6592} {"train_loss": -27.90070152282715, "global_step": 547209, "epoch": 6592} {"train_loss": -27.185117721557617, "global_step": 547210, "epoch": 6592} {"train_loss": -27.696033477783203, "global_step": 547211, "epoch": 6592} {"train_loss": -27.593841552734375, "global_step": 547212, "epoch": 6592} {"train_loss": -26.9591121673584, "global_step": 547213, "epoch": 6592} {"train_loss": -27.440353393554688, "global_step": 547214, "epoch": 6592} {"train_loss": -27.565229415893555, "global_step": 547215, "epoch": 6592} {"train_loss": -28.098281860351562, "global_step": 547216, "epoch": 6592} {"train_loss": -27.560455322265625, "global_step": 547217, "epoch": 6592} {"train_loss": -27.658687246851173, "global_step": 547218, "epoch": 6592, "val_loss": 6580684.5} {"train_loss": -27.13982582092285, "global_step": 547219, "epoch": 6593} {"train_loss": -27.643457412719727, "global_step": 547220, "epoch": 6593} {"train_loss": -27.0812931060791, "global_step": 547221, "epoch": 6593} {"train_loss": -27.50543212890625, "global_step": 547222, "epoch": 6593} {"train_loss": -27.081623077392578, "global_step": 547223, "epoch": 6593} {"train_loss": -27.204105377197266, "global_step": 547224, "epoch": 6593} {"train_loss": -27.638532638549805, "global_step": 547225, "epoch": 6593} {"train_loss": -27.698745727539062, "global_step": 547226, "epoch": 6593} {"train_loss": -27.505172729492188, "global_step": 547227, "epoch": 6593} {"train_loss": -27.429885864257812, "global_step": 547228, "epoch": 6593} {"train_loss": -27.747421264648438, "global_step": 547229, "epoch": 6593} {"train_loss": -27.36726951599121, "global_step": 547230, "epoch": 6593} {"train_loss": -27.292417526245117, "global_step": 547231, "epoch": 6593} {"train_loss": -27.33011817932129, "global_step": 547232, "epoch": 6593} {"train_loss": -27.382038116455078, "global_step": 547233, "epoch": 6593} {"train_loss": -27.410993576049805, "global_step": 547234, "epoch": 6593} {"train_loss": -27.6551570892334, "global_step": 547235, "epoch": 6593} {"train_loss": -27.82166862487793, "global_step": 547236, "epoch": 6593} {"train_loss": -27.444416046142578, "global_step": 547237, "epoch": 6593} {"train_loss": -27.612537384033203, "global_step": 547238, "epoch": 6593} {"train_loss": -27.489538192749023, "global_step": 547239, "epoch": 6593} {"train_loss": -27.477142333984375, "global_step": 547240, "epoch": 6593} {"train_loss": -27.6744384765625, "global_step": 547241, "epoch": 6593} {"train_loss": -27.3037166595459, "global_step": 547242, "epoch": 6593} {"train_loss": -27.979272842407227, "global_step": 547243, "epoch": 6593} {"train_loss": -27.6908016204834, "global_step": 547244, "epoch": 6593} {"train_loss": -27.846059799194336, "global_step": 547245, "epoch": 6593} {"train_loss": -28.05765724182129, "global_step": 547246, "epoch": 6593} {"train_loss": -27.76187515258789, "global_step": 547247, "epoch": 6593} {"train_loss": -27.894590377807617, "global_step": 547248, "epoch": 6593} {"train_loss": -27.71124839782715, "global_step": 547249, "epoch": 6593} {"train_loss": -27.756322860717773, "global_step": 547250, "epoch": 6593} {"train_loss": -27.550052642822266, "global_step": 547251, "epoch": 6593} {"train_loss": -27.8761043548584, "global_step": 547252, "epoch": 6593} {"train_loss": -28.093984603881836, "global_step": 547253, "epoch": 6593} {"train_loss": -27.663721084594727, "global_step": 547254, "epoch": 6593} {"train_loss": -27.90882682800293, "global_step": 547255, "epoch": 6593} {"train_loss": -27.942371368408203, "global_step": 547256, "epoch": 6593} {"train_loss": -28.03982925415039, "global_step": 547257, "epoch": 6593} {"train_loss": -27.93141746520996, "global_step": 547258, "epoch": 6593} {"train_loss": -27.622180938720703, "global_step": 547259, "epoch": 6593} {"train_loss": -28.0469913482666, "global_step": 547260, "epoch": 6593} {"train_loss": -27.833911895751953, "global_step": 547261, "epoch": 6593} {"train_loss": -27.53446388244629, "global_step": 547262, "epoch": 6593} {"train_loss": -27.485578536987305, "global_step": 547263, "epoch": 6593} {"train_loss": -28.105558395385742, "global_step": 547264, "epoch": 6593} {"train_loss": -27.884641647338867, "global_step": 547265, "epoch": 6593} {"train_loss": -27.4671688079834, "global_step": 547266, "epoch": 6593} {"train_loss": -27.73907470703125, "global_step": 547267, "epoch": 6593} {"train_loss": -27.78277015686035, "global_step": 547268, "epoch": 6593} {"train_loss": -27.9851016998291, "global_step": 547269, "epoch": 6593} {"train_loss": -27.896045684814453, "global_step": 547270, "epoch": 6593} {"train_loss": -27.731678009033203, "global_step": 547271, "epoch": 6593} {"train_loss": -27.5842227935791, "global_step": 547272, "epoch": 6593} {"train_loss": -27.960580825805664, "global_step": 547273, "epoch": 6593} {"train_loss": -27.82545280456543, "global_step": 547274, "epoch": 6593} {"train_loss": -27.496313095092773, "global_step": 547275, "epoch": 6593} {"train_loss": -27.81060791015625, "global_step": 547276, "epoch": 6593} {"train_loss": -27.47027587890625, "global_step": 547277, "epoch": 6593} {"train_loss": -27.829084396362305, "global_step": 547278, "epoch": 6593} {"train_loss": -28.038776397705078, "global_step": 547279, "epoch": 6593} {"train_loss": -27.638105392456055, "global_step": 547280, "epoch": 6593} {"train_loss": -27.625228881835938, "global_step": 547281, "epoch": 6593} {"train_loss": -27.473474502563477, "global_step": 547282, "epoch": 6593} {"train_loss": -27.7291202545166, "global_step": 547283, "epoch": 6593} {"train_loss": -28.033105850219727, "global_step": 547284, "epoch": 6593} {"train_loss": -27.849496841430664, "global_step": 547285, "epoch": 6593} {"train_loss": -27.632688522338867, "global_step": 547286, "epoch": 6593} {"train_loss": -27.49452781677246, "global_step": 547287, "epoch": 6593} {"train_loss": -27.86855125427246, "global_step": 547288, "epoch": 6593} {"train_loss": -27.8659725189209, "global_step": 547289, "epoch": 6593} {"train_loss": -27.52027702331543, "global_step": 547290, "epoch": 6593} {"train_loss": -27.98575782775879, "global_step": 547291, "epoch": 6593} {"train_loss": -27.62921714782715, "global_step": 547292, "epoch": 6593} {"train_loss": -27.949182510375977, "global_step": 547293, "epoch": 6593} {"train_loss": -27.798511505126953, "global_step": 547294, "epoch": 6593} {"train_loss": -27.802392959594727, "global_step": 547295, "epoch": 6593} {"train_loss": -28.100751876831055, "global_step": 547296, "epoch": 6593} {"train_loss": -27.930343627929688, "global_step": 547297, "epoch": 6593} {"train_loss": -28.05838394165039, "global_step": 547298, "epoch": 6593} {"train_loss": -27.670764923095703, "global_step": 547299, "epoch": 6593} {"train_loss": -27.436323165893555, "global_step": 547300, "epoch": 6593} {"train_loss": -27.701104037732964, "global_step": 547301, "epoch": 6593, "val_loss": 6607447.0} {"train_loss": -26.876379013061523, "global_step": 547302, "epoch": 6594} {"train_loss": -26.674274444580078, "global_step": 547303, "epoch": 6594} {"train_loss": -26.803442001342773, "global_step": 547304, "epoch": 6594} {"train_loss": -27.200590133666992, "global_step": 547305, "epoch": 6594} {"train_loss": -27.26778221130371, "global_step": 547306, "epoch": 6594} {"train_loss": -26.960113525390625, "global_step": 547307, "epoch": 6594} {"train_loss": -27.01295280456543, "global_step": 547308, "epoch": 6594} {"train_loss": -27.368366241455078, "global_step": 547309, "epoch": 6594} {"train_loss": -27.238203048706055, "global_step": 547310, "epoch": 6594} {"train_loss": -26.7814998626709, "global_step": 547311, "epoch": 6594} {"train_loss": -26.92449951171875, "global_step": 547312, "epoch": 6594} {"train_loss": -27.3194580078125, "global_step": 547313, "epoch": 6594} {"train_loss": -27.195356369018555, "global_step": 547314, "epoch": 6594} {"train_loss": -27.307897567749023, "global_step": 547315, "epoch": 6594} {"train_loss": -27.15846824645996, "global_step": 547316, "epoch": 6594} {"train_loss": -27.0673828125, "global_step": 547317, "epoch": 6594} {"train_loss": -27.406208038330078, "global_step": 547318, "epoch": 6594} {"train_loss": -27.40272331237793, "global_step": 547319, "epoch": 6594} {"train_loss": -27.324918746948242, "global_step": 547320, "epoch": 6594} {"train_loss": -26.965208053588867, "global_step": 547321, "epoch": 6594} {"train_loss": -27.224302291870117, "global_step": 547322, "epoch": 6594} {"train_loss": -27.53564453125, "global_step": 547323, "epoch": 6594} {"train_loss": -27.498931884765625, "global_step": 547324, "epoch": 6594} {"train_loss": -27.374561309814453, "global_step": 547325, "epoch": 6594} {"train_loss": -27.472742080688477, "global_step": 547326, "epoch": 6594} {"train_loss": -27.4212703704834, "global_step": 547327, "epoch": 6594} {"train_loss": -27.398208618164062, "global_step": 547328, "epoch": 6594} {"train_loss": -27.72647476196289, "global_step": 547329, "epoch": 6594} {"train_loss": -27.52337074279785, "global_step": 547330, "epoch": 6594} {"train_loss": -27.793365478515625, "global_step": 547331, "epoch": 6594} {"train_loss": -27.660924911499023, "global_step": 547332, "epoch": 6594} {"train_loss": -28.020355224609375, "global_step": 547333, "epoch": 6594} {"train_loss": -27.799482345581055, "global_step": 547334, "epoch": 6594} {"train_loss": -27.851882934570312, "global_step": 547335, "epoch": 6594} {"train_loss": -27.886281967163086, "global_step": 547336, "epoch": 6594} {"train_loss": -27.788122177124023, "global_step": 547337, "epoch": 6594} {"train_loss": -27.767126083374023, "global_step": 547338, "epoch": 6594} {"train_loss": -27.955957412719727, "global_step": 547339, "epoch": 6594} {"train_loss": -27.9044132232666, "global_step": 547340, "epoch": 6594} {"train_loss": -27.864154815673828, "global_step": 547341, "epoch": 6594} {"train_loss": -27.815723419189453, "global_step": 547342, "epoch": 6594} {"train_loss": -28.280729293823242, "global_step": 547343, "epoch": 6594} {"train_loss": -27.710147857666016, "global_step": 547344, "epoch": 6594} {"train_loss": -27.754871368408203, "global_step": 547345, "epoch": 6594} {"train_loss": -28.0556697845459, "global_step": 547346, "epoch": 6594} {"train_loss": -27.820035934448242, "global_step": 547347, "epoch": 6594} {"train_loss": -27.78866958618164, "global_step": 547348, "epoch": 6594} {"train_loss": -27.858945846557617, "global_step": 547349, "epoch": 6594} {"train_loss": -27.709888458251953, "global_step": 547350, "epoch": 6594} {"train_loss": -28.10184669494629, "global_step": 547351, "epoch": 6594} {"train_loss": -27.8284969329834, "global_step": 547352, "epoch": 6594} {"train_loss": -27.861536026000977, "global_step": 547353, "epoch": 6594} {"train_loss": -27.812366485595703, "global_step": 547354, "epoch": 6594} {"train_loss": -27.950387954711914, "global_step": 547355, "epoch": 6594} {"train_loss": -27.759252548217773, "global_step": 547356, "epoch": 6594} {"train_loss": -27.803695678710938, "global_step": 547357, "epoch": 6594} {"train_loss": -27.732086181640625, "global_step": 547358, "epoch": 6594} {"train_loss": -27.607080459594727, "global_step": 547359, "epoch": 6594} {"train_loss": -28.188146591186523, "global_step": 547360, "epoch": 6594} {"train_loss": -28.12628173828125, "global_step": 547361, "epoch": 6594} {"train_loss": -28.11846923828125, "global_step": 547362, "epoch": 6594} {"train_loss": -27.79542350769043, "global_step": 547363, "epoch": 6594} {"train_loss": -27.850255966186523, "global_step": 547364, "epoch": 6594} {"train_loss": -28.181304931640625, "global_step": 547365, "epoch": 6594} {"train_loss": -27.640562057495117, "global_step": 547366, "epoch": 6594} {"train_loss": -27.816694259643555, "global_step": 547367, "epoch": 6594} {"train_loss": -27.647205352783203, "global_step": 547368, "epoch": 6594} {"train_loss": -26.900577545166016, "global_step": 547369, "epoch": 6594} {"train_loss": -25.943195343017578, "global_step": 547370, "epoch": 6594} {"train_loss": -26.02882194519043, "global_step": 547371, "epoch": 6594} {"train_loss": -26.554691314697266, "global_step": 547372, "epoch": 6594} {"train_loss": -26.58574867248535, "global_step": 547373, "epoch": 6594} {"train_loss": -26.157394409179688, "global_step": 547374, "epoch": 6594} {"train_loss": -26.706787109375, "global_step": 547375, "epoch": 6594} {"train_loss": -26.957931518554688, "global_step": 547376, "epoch": 6594} {"train_loss": -26.96332359313965, "global_step": 547377, "epoch": 6594} {"train_loss": -26.786731719970703, "global_step": 547378, "epoch": 6594} {"train_loss": -27.063232421875, "global_step": 547379, "epoch": 6594} {"train_loss": -27.69819450378418, "global_step": 547380, "epoch": 6594} {"train_loss": -27.267053604125977, "global_step": 547381, "epoch": 6594} {"train_loss": -27.450910568237305, "global_step": 547382, "epoch": 6594} {"train_loss": -27.602941513061523, "global_step": 547383, "epoch": 6594} {"train_loss": -27.449630323662817, "global_step": 547384, "epoch": 6594, "val_loss": 6597768.0} {"train_loss": -27.315942764282227, "global_step": 547385, "epoch": 6595} {"train_loss": -26.7735538482666, "global_step": 547386, "epoch": 6595} {"train_loss": -26.90581703186035, "global_step": 547387, "epoch": 6595} {"train_loss": -26.735315322875977, "global_step": 547388, "epoch": 6595} {"train_loss": -27.067533493041992, "global_step": 547389, "epoch": 6595} {"train_loss": -27.1669979095459, "global_step": 547390, "epoch": 6595} {"train_loss": -27.40778160095215, "global_step": 547391, "epoch": 6595} {"train_loss": -26.669843673706055, "global_step": 547392, "epoch": 6595} {"train_loss": -26.940235137939453, "global_step": 547393, "epoch": 6595} {"train_loss": -27.078176498413086, "global_step": 547394, "epoch": 6595} {"train_loss": -27.2462215423584, "global_step": 547395, "epoch": 6595} {"train_loss": -27.295896530151367, "global_step": 547396, "epoch": 6595} {"train_loss": -27.21079444885254, "global_step": 547397, "epoch": 6595} {"train_loss": -27.21952247619629, "global_step": 547398, "epoch": 6595} {"train_loss": -27.53741455078125, "global_step": 547399, "epoch": 6595} {"train_loss": -27.147781372070312, "global_step": 547400, "epoch": 6595} {"train_loss": -27.42146110534668, "global_step": 547401, "epoch": 6595} {"train_loss": -27.3618221282959, "global_step": 547402, "epoch": 6595} {"train_loss": -27.4324893951416, "global_step": 547403, "epoch": 6595} {"train_loss": -27.470739364624023, "global_step": 547404, "epoch": 6595} {"train_loss": -27.206058502197266, "global_step": 547405, "epoch": 6595} {"train_loss": -27.286087036132812, "global_step": 547406, "epoch": 6595} {"train_loss": -27.630212783813477, "global_step": 547407, "epoch": 6595} {"train_loss": -27.067371368408203, "global_step": 547408, "epoch": 6595} {"train_loss": -27.64533042907715, "global_step": 547409, "epoch": 6595} {"train_loss": -27.629150390625, "global_step": 547410, "epoch": 6595} {"train_loss": -27.709630966186523, "global_step": 547411, "epoch": 6595} {"train_loss": -27.86720085144043, "global_step": 547412, "epoch": 6595} {"train_loss": -27.334070205688477, "global_step": 547413, "epoch": 6595} {"train_loss": -27.68792724609375, "global_step": 547414, "epoch": 6595} {"train_loss": -27.83877944946289, "global_step": 547415, "epoch": 6595} {"train_loss": -27.425495147705078, "global_step": 547416, "epoch": 6595} {"train_loss": -27.831317901611328, "global_step": 547417, "epoch": 6595} {"train_loss": -27.725467681884766, "global_step": 547418, "epoch": 6595} {"train_loss": -27.605701446533203, "global_step": 547419, "epoch": 6595} {"train_loss": -27.690521240234375, "global_step": 547420, "epoch": 6595} {"train_loss": -27.754703521728516, "global_step": 547421, "epoch": 6595} {"train_loss": -27.488981246948242, "global_step": 547422, "epoch": 6595} {"train_loss": -27.987516403198242, "global_step": 547423, "epoch": 6595} {"train_loss": -27.743993759155273, "global_step": 547424, "epoch": 6595} {"train_loss": -27.8916072845459, "global_step": 547425, "epoch": 6595} {"train_loss": -27.997602462768555, "global_step": 547426, "epoch": 6595} {"train_loss": -28.17876625061035, "global_step": 547427, "epoch": 6595} {"train_loss": -27.703821182250977, "global_step": 547428, "epoch": 6595} {"train_loss": -27.93963623046875, "global_step": 547429, "epoch": 6595} {"train_loss": -27.803512573242188, "global_step": 547430, "epoch": 6595} {"train_loss": -27.987646102905273, "global_step": 547431, "epoch": 6595} {"train_loss": -28.118396759033203, "global_step": 547432, "epoch": 6595} {"train_loss": -28.106525421142578, "global_step": 547433, "epoch": 6595} {"train_loss": -28.02805519104004, "global_step": 547434, "epoch": 6595} {"train_loss": -27.7586669921875, "global_step": 547435, "epoch": 6595} {"train_loss": -27.5135555267334, "global_step": 547436, "epoch": 6595} {"train_loss": -27.72821044921875, "global_step": 547437, "epoch": 6595} {"train_loss": -27.880414962768555, "global_step": 547438, "epoch": 6595} {"train_loss": -28.12518310546875, "global_step": 547439, "epoch": 6595} {"train_loss": -27.939239501953125, "global_step": 547440, "epoch": 6595} {"train_loss": -27.3704776763916, "global_step": 547441, "epoch": 6595} {"train_loss": -27.706958770751953, "global_step": 547442, "epoch": 6595} {"train_loss": -27.657123565673828, "global_step": 547443, "epoch": 6595} {"train_loss": -27.59983253479004, "global_step": 547444, "epoch": 6595} {"train_loss": -27.515640258789062, "global_step": 547445, "epoch": 6595} {"train_loss": -27.801029205322266, "global_step": 547446, "epoch": 6595} {"train_loss": -28.1387996673584, "global_step": 547447, "epoch": 6595} {"train_loss": -27.930450439453125, "global_step": 547448, "epoch": 6595} {"train_loss": -27.79376220703125, "global_step": 547449, "epoch": 6595} {"train_loss": -28.010419845581055, "global_step": 547450, "epoch": 6595} {"train_loss": -27.60359001159668, "global_step": 547451, "epoch": 6595} {"train_loss": -27.53546714782715, "global_step": 547452, "epoch": 6595} {"train_loss": -27.86328125, "global_step": 547453, "epoch": 6595} {"train_loss": -27.57489013671875, "global_step": 547454, "epoch": 6595} {"train_loss": -28.291852951049805, "global_step": 547455, "epoch": 6595} {"train_loss": -27.90643310546875, "global_step": 547456, "epoch": 6595} {"train_loss": -27.31611442565918, "global_step": 547457, "epoch": 6595} {"train_loss": -28.128345489501953, "global_step": 547458, "epoch": 6595} {"train_loss": -28.26714515686035, "global_step": 547459, "epoch": 6595} {"train_loss": -27.690229415893555, "global_step": 547460, "epoch": 6595} {"train_loss": -27.72794532775879, "global_step": 547461, "epoch": 6595} {"train_loss": -28.050918579101562, "global_step": 547462, "epoch": 6595} {"train_loss": -27.42822265625, "global_step": 547463, "epoch": 6595} {"train_loss": -27.48262596130371, "global_step": 547464, "epoch": 6595} {"train_loss": -28.0128116607666, "global_step": 547465, "epoch": 6595} {"train_loss": -27.620349884033203, "global_step": 547466, "epoch": 6595} {"train_loss": -27.624364692044544, "global_step": 547467, "epoch": 6595, "val_loss": 6590621.5} {"train_loss": -26.741607666015625, "global_step": 547468, "epoch": 6596} {"train_loss": -26.049047470092773, "global_step": 547469, "epoch": 6596} {"train_loss": -25.94557762145996, "global_step": 547470, "epoch": 6596} {"train_loss": -27.129932403564453, "global_step": 547471, "epoch": 6596} {"train_loss": -26.29456901550293, "global_step": 547472, "epoch": 6596} {"train_loss": -25.905954360961914, "global_step": 547473, "epoch": 6596} {"train_loss": -26.888181686401367, "global_step": 547474, "epoch": 6596} {"train_loss": -27.1633358001709, "global_step": 547475, "epoch": 6596} {"train_loss": -27.219467163085938, "global_step": 547476, "epoch": 6596} {"train_loss": -27.04673194885254, "global_step": 547477, "epoch": 6596} {"train_loss": -27.13991355895996, "global_step": 547478, "epoch": 6596} {"train_loss": -27.157230377197266, "global_step": 547479, "epoch": 6596} {"train_loss": -26.722442626953125, "global_step": 547480, "epoch": 6596} {"train_loss": -27.08277702331543, "global_step": 547481, "epoch": 6596} {"train_loss": -27.36077880859375, "global_step": 547482, "epoch": 6596} {"train_loss": -27.018117904663086, "global_step": 547483, "epoch": 6596} {"train_loss": -27.493545532226562, "global_step": 547484, "epoch": 6596} {"train_loss": -27.272897720336914, "global_step": 547485, "epoch": 6596} {"train_loss": -27.006208419799805, "global_step": 547486, "epoch": 6596} {"train_loss": -27.542072296142578, "global_step": 547487, "epoch": 6596} {"train_loss": -27.5770263671875, "global_step": 547488, "epoch": 6596} {"train_loss": -26.861799240112305, "global_step": 547489, "epoch": 6596} {"train_loss": -27.232595443725586, "global_step": 547490, "epoch": 6596} {"train_loss": -27.2901611328125, "global_step": 547491, "epoch": 6596} {"train_loss": -27.714950561523438, "global_step": 547492, "epoch": 6596} {"train_loss": -27.73073387145996, "global_step": 547493, "epoch": 6596} {"train_loss": -27.361652374267578, "global_step": 547494, "epoch": 6596} {"train_loss": -27.54340934753418, "global_step": 547495, "epoch": 6596} {"train_loss": -27.702661514282227, "global_step": 547496, "epoch": 6596} {"train_loss": -27.558195114135742, "global_step": 547497, "epoch": 6596} {"train_loss": -27.7525691986084, "global_step": 547498, "epoch": 6596} {"train_loss": -27.919904708862305, "global_step": 547499, "epoch": 6596} {"train_loss": -27.560285568237305, "global_step": 547500, "epoch": 6596} {"train_loss": -27.772537231445312, "global_step": 547501, "epoch": 6596} {"train_loss": -27.549962997436523, "global_step": 547502, "epoch": 6596} {"train_loss": -27.96504020690918, "global_step": 547503, "epoch": 6596} {"train_loss": -27.5285701751709, "global_step": 547504, "epoch": 6596} {"train_loss": -27.92670249938965, "global_step": 547505, "epoch": 6596} {"train_loss": -27.792448043823242, "global_step": 547506, "epoch": 6596} {"train_loss": -27.84113883972168, "global_step": 547507, "epoch": 6596} {"train_loss": -27.851093292236328, "global_step": 547508, "epoch": 6596} {"train_loss": -27.678699493408203, "global_step": 547509, "epoch": 6596} {"train_loss": -27.7544002532959, "global_step": 547510, "epoch": 6596} {"train_loss": -27.817752838134766, "global_step": 547511, "epoch": 6596} {"train_loss": -28.06939697265625, "global_step": 547512, "epoch": 6596} {"train_loss": -27.657373428344727, "global_step": 547513, "epoch": 6596} {"train_loss": -27.87977409362793, "global_step": 547514, "epoch": 6596} {"train_loss": -27.749515533447266, "global_step": 547515, "epoch": 6596} {"train_loss": -27.9101505279541, "global_step": 547516, "epoch": 6596} {"train_loss": -27.892169952392578, "global_step": 547517, "epoch": 6596} {"train_loss": -27.566425323486328, "global_step": 547518, "epoch": 6596} {"train_loss": -27.852008819580078, "global_step": 547519, "epoch": 6596} {"train_loss": -28.122671127319336, "global_step": 547520, "epoch": 6596} {"train_loss": -27.521411895751953, "global_step": 547521, "epoch": 6596} {"train_loss": -27.852294921875, "global_step": 547522, "epoch": 6596} {"train_loss": -27.83536148071289, "global_step": 547523, "epoch": 6596} {"train_loss": -27.681852340698242, "global_step": 547524, "epoch": 6596} {"train_loss": -27.82724380493164, "global_step": 547525, "epoch": 6596} {"train_loss": -27.61402702331543, "global_step": 547526, "epoch": 6596} {"train_loss": -28.0733699798584, "global_step": 547527, "epoch": 6596} {"train_loss": -27.540388107299805, "global_step": 547528, "epoch": 6596} {"train_loss": -27.595396041870117, "global_step": 547529, "epoch": 6596} {"train_loss": -27.682397842407227, "global_step": 547530, "epoch": 6596} {"train_loss": -27.78839111328125, "global_step": 547531, "epoch": 6596} {"train_loss": -27.82716178894043, "global_step": 547532, "epoch": 6596} {"train_loss": -27.601795196533203, "global_step": 547533, "epoch": 6596} {"train_loss": -27.8001766204834, "global_step": 547534, "epoch": 6596} {"train_loss": -27.8946533203125, "global_step": 547535, "epoch": 6596} {"train_loss": -27.71038246154785, "global_step": 547536, "epoch": 6596} {"train_loss": -27.290512084960938, "global_step": 547537, "epoch": 6596} {"train_loss": -27.370080947875977, "global_step": 547538, "epoch": 6596} {"train_loss": -28.14728355407715, "global_step": 547539, "epoch": 6596} {"train_loss": -27.998687744140625, "global_step": 547540, "epoch": 6596} {"train_loss": -27.676923751831055, "global_step": 547541, "epoch": 6596} {"train_loss": -27.79583168029785, "global_step": 547542, "epoch": 6596} {"train_loss": -28.194761276245117, "global_step": 547543, "epoch": 6596} {"train_loss": -27.626922607421875, "global_step": 547544, "epoch": 6596} {"train_loss": -27.80354881286621, "global_step": 547545, "epoch": 6596} {"train_loss": -27.582914352416992, "global_step": 547546, "epoch": 6596} {"train_loss": -27.861143112182617, "global_step": 547547, "epoch": 6596} {"train_loss": -27.285175323486328, "global_step": 547548, "epoch": 6596} {"train_loss": -27.514057159423828, "global_step": 547549, "epoch": 6596} {"train_loss": -27.526609995278967, "global_step": 547550, "epoch": 6596, "val_loss": 6631021.0} {"train_loss": -27.103681564331055, "global_step": 547551, "epoch": 6597} {"train_loss": -27.649768829345703, "global_step": 547552, "epoch": 6597} {"train_loss": -27.081525802612305, "global_step": 547553, "epoch": 6597} {"train_loss": -27.002897262573242, "global_step": 547554, "epoch": 6597} {"train_loss": -27.104528427124023, "global_step": 547555, "epoch": 6597} {"train_loss": -27.4228515625, "global_step": 547556, "epoch": 6597} {"train_loss": -27.227087020874023, "global_step": 547557, "epoch": 6597} {"train_loss": -27.249963760375977, "global_step": 547558, "epoch": 6597} {"train_loss": -27.209625244140625, "global_step": 547559, "epoch": 6597} {"train_loss": -26.7357234954834, "global_step": 547560, "epoch": 6597} {"train_loss": -27.41486930847168, "global_step": 547561, "epoch": 6597} {"train_loss": -27.0142879486084, "global_step": 547562, "epoch": 6597} {"train_loss": -27.33009147644043, "global_step": 547563, "epoch": 6597} {"train_loss": -27.468103408813477, "global_step": 547564, "epoch": 6597} {"train_loss": -27.4824275970459, "global_step": 547565, "epoch": 6597} {"train_loss": -27.278839111328125, "global_step": 547566, "epoch": 6597} {"train_loss": -27.542957305908203, "global_step": 547567, "epoch": 6597} {"train_loss": -27.793670654296875, "global_step": 547568, "epoch": 6597} {"train_loss": -27.731475830078125, "global_step": 547569, "epoch": 6597} {"train_loss": -27.7869873046875, "global_step": 547570, "epoch": 6597} {"train_loss": -27.734668731689453, "global_step": 547571, "epoch": 6597} {"train_loss": -27.432676315307617, "global_step": 547572, "epoch": 6597} {"train_loss": -27.313825607299805, "global_step": 547573, "epoch": 6597} {"train_loss": -27.72767448425293, "global_step": 547574, "epoch": 6597} {"train_loss": -27.922697067260742, "global_step": 547575, "epoch": 6597} {"train_loss": -27.601806640625, "global_step": 547576, "epoch": 6597} {"train_loss": -27.555042266845703, "global_step": 547577, "epoch": 6597} {"train_loss": -27.820837020874023, "global_step": 547578, "epoch": 6597} {"train_loss": -27.64426040649414, "global_step": 547579, "epoch": 6597} {"train_loss": -27.597936630249023, "global_step": 547580, "epoch": 6597} {"train_loss": -27.69880485534668, "global_step": 547581, "epoch": 6597} {"train_loss": -27.74261474609375, "global_step": 547582, "epoch": 6597} {"train_loss": -27.272790908813477, "global_step": 547583, "epoch": 6597} {"train_loss": -27.14544677734375, "global_step": 547584, "epoch": 6597} {"train_loss": -27.584701538085938, "global_step": 547585, "epoch": 6597} {"train_loss": -27.566991806030273, "global_step": 547586, "epoch": 6597} {"train_loss": -27.43357276916504, "global_step": 547587, "epoch": 6597} {"train_loss": -27.587141036987305, "global_step": 547588, "epoch": 6597} {"train_loss": -27.544233322143555, "global_step": 547589, "epoch": 6597} {"train_loss": -27.788293838500977, "global_step": 547590, "epoch": 6597} {"train_loss": -27.60357093811035, "global_step": 547591, "epoch": 6597} {"train_loss": -27.653308868408203, "global_step": 547592, "epoch": 6597} {"train_loss": -27.627134323120117, "global_step": 547593, "epoch": 6597} {"train_loss": -27.53127098083496, "global_step": 547594, "epoch": 6597} {"train_loss": -27.980878829956055, "global_step": 547595, "epoch": 6597} {"train_loss": -27.96329689025879, "global_step": 547596, "epoch": 6597} {"train_loss": -27.4808292388916, "global_step": 547597, "epoch": 6597} {"train_loss": -27.434680938720703, "global_step": 547598, "epoch": 6597} {"train_loss": -27.781705856323242, "global_step": 547599, "epoch": 6597} {"train_loss": -27.526315689086914, "global_step": 547600, "epoch": 6597} {"train_loss": -27.73602294921875, "global_step": 547601, "epoch": 6597} {"train_loss": -27.685840606689453, "global_step": 547602, "epoch": 6597} {"train_loss": -27.6829891204834, "global_step": 547603, "epoch": 6597} {"train_loss": -27.837018966674805, "global_step": 547604, "epoch": 6597} {"train_loss": -27.763296127319336, "global_step": 547605, "epoch": 6597} {"train_loss": -27.758569717407227, "global_step": 547606, "epoch": 6597} {"train_loss": -28.0006046295166, "global_step": 547607, "epoch": 6597} {"train_loss": -27.77825355529785, "global_step": 547608, "epoch": 6597} {"train_loss": -27.740610122680664, "global_step": 547609, "epoch": 6597} {"train_loss": -27.7154541015625, "global_step": 547610, "epoch": 6597} {"train_loss": -27.477081298828125, "global_step": 547611, "epoch": 6597} {"train_loss": -27.98978614807129, "global_step": 547612, "epoch": 6597} {"train_loss": -27.7501277923584, "global_step": 547613, "epoch": 6597} {"train_loss": -27.676986694335938, "global_step": 547614, "epoch": 6597} {"train_loss": -27.78369140625, "global_step": 547615, "epoch": 6597} {"train_loss": -27.720617294311523, "global_step": 547616, "epoch": 6597} {"train_loss": -27.873926162719727, "global_step": 547617, "epoch": 6597} {"train_loss": -27.326099395751953, "global_step": 547618, "epoch": 6597} {"train_loss": -27.68694496154785, "global_step": 547619, "epoch": 6597} {"train_loss": -27.373456954956055, "global_step": 547620, "epoch": 6597} {"train_loss": -27.933385848999023, "global_step": 547621, "epoch": 6597} {"train_loss": -27.586902618408203, "global_step": 547622, "epoch": 6597} {"train_loss": -27.477142333984375, "global_step": 547623, "epoch": 6597} {"train_loss": -27.864181518554688, "global_step": 547624, "epoch": 6597} {"train_loss": -27.735193252563477, "global_step": 547625, "epoch": 6597} {"train_loss": -28.012975692749023, "global_step": 547626, "epoch": 6597} {"train_loss": -27.822967529296875, "global_step": 547627, "epoch": 6597} {"train_loss": -27.998971939086914, "global_step": 547628, "epoch": 6597} {"train_loss": -27.469640731811523, "global_step": 547629, "epoch": 6597} {"train_loss": -27.818456649780273, "global_step": 547630, "epoch": 6597} {"train_loss": -28.103879928588867, "global_step": 547631, "epoch": 6597} {"train_loss": -27.557514190673828, "global_step": 547632, "epoch": 6597} {"train_loss": -27.55930273216891, "global_step": 547633, "epoch": 6597, "val_loss": 6547237.5} {"train_loss": -25.92091178894043, "global_step": 547634, "epoch": 6598} {"train_loss": -26.463932037353516, "global_step": 547635, "epoch": 6598} {"train_loss": -25.920068740844727, "global_step": 547636, "epoch": 6598} {"train_loss": -24.183218002319336, "global_step": 547637, "epoch": 6598} {"train_loss": -26.66473388671875, "global_step": 547638, "epoch": 6598} {"train_loss": -26.29474449157715, "global_step": 547639, "epoch": 6598} {"train_loss": -26.417194366455078, "global_step": 547640, "epoch": 6598} {"train_loss": -25.90992546081543, "global_step": 547641, "epoch": 6598} {"train_loss": -26.987014770507812, "global_step": 547642, "epoch": 6598} {"train_loss": -26.622970581054688, "global_step": 547643, "epoch": 6598} {"train_loss": -26.695877075195312, "global_step": 547644, "epoch": 6598} {"train_loss": -27.125898361206055, "global_step": 547645, "epoch": 6598} {"train_loss": -26.50809669494629, "global_step": 547646, "epoch": 6598} {"train_loss": -27.271711349487305, "global_step": 547647, "epoch": 6598} {"train_loss": -27.152816772460938, "global_step": 547648, "epoch": 6598} {"train_loss": -27.236738204956055, "global_step": 547649, "epoch": 6598} {"train_loss": -27.008121490478516, "global_step": 547650, "epoch": 6598} {"train_loss": -27.282743453979492, "global_step": 547651, "epoch": 6598} {"train_loss": -27.365354537963867, "global_step": 547652, "epoch": 6598} {"train_loss": -27.01381492614746, "global_step": 547653, "epoch": 6598} {"train_loss": -27.4934139251709, "global_step": 547654, "epoch": 6598} {"train_loss": -27.164844512939453, "global_step": 547655, "epoch": 6598} {"train_loss": -27.07651710510254, "global_step": 547656, "epoch": 6598} {"train_loss": -27.499792098999023, "global_step": 547657, "epoch": 6598} {"train_loss": -27.839111328125, "global_step": 547658, "epoch": 6598} {"train_loss": -27.498504638671875, "global_step": 547659, "epoch": 6598} {"train_loss": -27.146589279174805, "global_step": 547660, "epoch": 6598} {"train_loss": -27.757238388061523, "global_step": 547661, "epoch": 6598} {"train_loss": -27.509357452392578, "global_step": 547662, "epoch": 6598} {"train_loss": -27.571653366088867, "global_step": 547663, "epoch": 6598} {"train_loss": -27.59701919555664, "global_step": 547664, "epoch": 6598} {"train_loss": -27.646345138549805, "global_step": 547665, "epoch": 6598} {"train_loss": -27.526275634765625, "global_step": 547666, "epoch": 6598} {"train_loss": -27.510343551635742, "global_step": 547667, "epoch": 6598} {"train_loss": -27.866743087768555, "global_step": 547668, "epoch": 6598} {"train_loss": -26.987783432006836, "global_step": 547669, "epoch": 6598} {"train_loss": -27.4936466217041, "global_step": 547670, "epoch": 6598} {"train_loss": -27.39580726623535, "global_step": 547671, "epoch": 6598} {"train_loss": -26.9035587310791, "global_step": 547672, "epoch": 6598} {"train_loss": -27.1820125579834, "global_step": 547673, "epoch": 6598} {"train_loss": -27.6605167388916, "global_step": 547674, "epoch": 6598} {"train_loss": -27.526416778564453, "global_step": 547675, "epoch": 6598} {"train_loss": -27.839588165283203, "global_step": 547676, "epoch": 6598} {"train_loss": -27.001331329345703, "global_step": 547677, "epoch": 6598} {"train_loss": -27.35532569885254, "global_step": 547678, "epoch": 6598} {"train_loss": -27.399255752563477, "global_step": 547679, "epoch": 6598} {"train_loss": -27.520645141601562, "global_step": 547680, "epoch": 6598} {"train_loss": -27.429523468017578, "global_step": 547681, "epoch": 6598} {"train_loss": -27.88360595703125, "global_step": 547682, "epoch": 6598} {"train_loss": -27.27460289001465, "global_step": 547683, "epoch": 6598} {"train_loss": -27.27570152282715, "global_step": 547684, "epoch": 6598} {"train_loss": -27.786087036132812, "global_step": 547685, "epoch": 6598} {"train_loss": -27.48354148864746, "global_step": 547686, "epoch": 6598} {"train_loss": -27.767364501953125, "global_step": 547687, "epoch": 6598} {"train_loss": -27.50362205505371, "global_step": 547688, "epoch": 6598} {"train_loss": -27.616424560546875, "global_step": 547689, "epoch": 6598} {"train_loss": -27.73345375061035, "global_step": 547690, "epoch": 6598} {"train_loss": -27.738555908203125, "global_step": 547691, "epoch": 6598} {"train_loss": -27.699249267578125, "global_step": 547692, "epoch": 6598} {"train_loss": -27.462299346923828, "global_step": 547693, "epoch": 6598} {"train_loss": -27.6245059967041, "global_step": 547694, "epoch": 6598} {"train_loss": -27.947662353515625, "global_step": 547695, "epoch": 6598} {"train_loss": -27.576618194580078, "global_step": 547696, "epoch": 6598} {"train_loss": -27.389204025268555, "global_step": 547697, "epoch": 6598} {"train_loss": -27.7333984375, "global_step": 547698, "epoch": 6598} {"train_loss": -27.75381851196289, "global_step": 547699, "epoch": 6598} {"train_loss": -27.335662841796875, "global_step": 547700, "epoch": 6598} {"train_loss": -27.76123046875, "global_step": 547701, "epoch": 6598} {"train_loss": -27.67706298828125, "global_step": 547702, "epoch": 6598} {"train_loss": -27.805444717407227, "global_step": 547703, "epoch": 6598} {"train_loss": -27.83355712890625, "global_step": 547704, "epoch": 6598} {"train_loss": -27.922651290893555, "global_step": 547705, "epoch": 6598} {"train_loss": -27.6240291595459, "global_step": 547706, "epoch": 6598} {"train_loss": -27.918750762939453, "global_step": 547707, "epoch": 6598} {"train_loss": -27.841970443725586, "global_step": 547708, "epoch": 6598} {"train_loss": -27.945966720581055, "global_step": 547709, "epoch": 6598} {"train_loss": -27.777191162109375, "global_step": 547710, "epoch": 6598} {"train_loss": -27.829818725585938, "global_step": 547711, "epoch": 6598} {"train_loss": -28.065876007080078, "global_step": 547712, "epoch": 6598} {"train_loss": -27.917444229125977, "global_step": 547713, "epoch": 6598} {"train_loss": -28.107831954956055, "global_step": 547714, "epoch": 6598} {"train_loss": -27.906707763671875, "global_step": 547715, "epoch": 6598} {"train_loss": -27.33527075526226, "global_step": 547716, "epoch": 6598, "val_loss": 6570576.0} {"train_loss": -26.992034912109375, "global_step": 547717, "epoch": 6599} {"train_loss": -26.21660804748535, "global_step": 547718, "epoch": 6599} {"train_loss": -26.693450927734375, "global_step": 547719, "epoch": 6599} {"train_loss": -27.77833366394043, "global_step": 547720, "epoch": 6599} {"train_loss": -27.593896865844727, "global_step": 547721, "epoch": 6599} {"train_loss": -27.191556930541992, "global_step": 547722, "epoch": 6599} {"train_loss": -27.433258056640625, "global_step": 547723, "epoch": 6599} {"train_loss": -27.021997451782227, "global_step": 547724, "epoch": 6599} {"train_loss": -27.366907119750977, "global_step": 547725, "epoch": 6599} {"train_loss": -27.32062339782715, "global_step": 547726, "epoch": 6599} {"train_loss": -27.934789657592773, "global_step": 547727, "epoch": 6599} {"train_loss": -27.5301513671875, "global_step": 547728, "epoch": 6599} {"train_loss": -27.638202667236328, "global_step": 547729, "epoch": 6599} {"train_loss": -27.485456466674805, "global_step": 547730, "epoch": 6599} {"train_loss": -27.99408531188965, "global_step": 547731, "epoch": 6599} {"train_loss": -27.576644897460938, "global_step": 547732, "epoch": 6599} {"train_loss": -27.74028968811035, "global_step": 547733, "epoch": 6599} {"train_loss": -27.81806755065918, "global_step": 547734, "epoch": 6599} {"train_loss": -27.874975204467773, "global_step": 547735, "epoch": 6599} {"train_loss": -27.48528480529785, "global_step": 547736, "epoch": 6599} {"train_loss": -27.51165199279785, "global_step": 547737, "epoch": 6599} {"train_loss": -27.235815048217773, "global_step": 547738, "epoch": 6599} {"train_loss": -27.771772384643555, "global_step": 547739, "epoch": 6599} {"train_loss": -27.370405197143555, "global_step": 547740, "epoch": 6599} {"train_loss": -27.668930053710938, "global_step": 547741, "epoch": 6599} {"train_loss": -27.620162963867188, "global_step": 547742, "epoch": 6599} {"train_loss": -27.810556411743164, "global_step": 547743, "epoch": 6599} {"train_loss": -27.991735458374023, "global_step": 547744, "epoch": 6599} {"train_loss": -27.9555606842041, "global_step": 547745, "epoch": 6599} {"train_loss": -27.9527645111084, "global_step": 547746, "epoch": 6599} {"train_loss": -27.94895362854004, "global_step": 547747, "epoch": 6599} {"train_loss": -28.08100700378418, "global_step": 547748, "epoch": 6599} {"train_loss": -27.68683433532715, "global_step": 547749, "epoch": 6599} {"train_loss": -28.003202438354492, "global_step": 547750, "epoch": 6599} {"train_loss": -27.780370712280273, "global_step": 547751, "epoch": 6599} {"train_loss": -27.44951820373535, "global_step": 547752, "epoch": 6599} {"train_loss": -28.107254028320312, "global_step": 547753, "epoch": 6599} {"train_loss": -27.6937198638916, "global_step": 547754, "epoch": 6599} {"train_loss": -27.8135929107666, "global_step": 547755, "epoch": 6599} {"train_loss": -27.472864151000977, "global_step": 547756, "epoch": 6599} {"train_loss": -27.878198623657227, "global_step": 547757, "epoch": 6599} {"train_loss": -27.822269439697266, "global_step": 547758, "epoch": 6599} {"train_loss": -27.903547286987305, "global_step": 547759, "epoch": 6599} {"train_loss": -27.672895431518555, "global_step": 547760, "epoch": 6599} {"train_loss": -27.644062042236328, "global_step": 547761, "epoch": 6599} {"train_loss": -27.863723754882812, "global_step": 547762, "epoch": 6599} {"train_loss": -27.99883460998535, "global_step": 547763, "epoch": 6599} {"train_loss": -27.742856979370117, "global_step": 547764, "epoch": 6599} {"train_loss": -27.69742774963379, "global_step": 547765, "epoch": 6599} {"train_loss": -27.738195419311523, "global_step": 547766, "epoch": 6599} {"train_loss": -27.387969970703125, "global_step": 547767, "epoch": 6599} {"train_loss": -27.594770431518555, "global_step": 547768, "epoch": 6599} {"train_loss": -28.007862091064453, "global_step": 547769, "epoch": 6599} {"train_loss": -27.770315170288086, "global_step": 547770, "epoch": 6599} {"train_loss": -27.746353149414062, "global_step": 547771, "epoch": 6599} {"train_loss": -27.930866241455078, "global_step": 547772, "epoch": 6599} {"train_loss": -28.023099899291992, "global_step": 547773, "epoch": 6599} {"train_loss": -27.308563232421875, "global_step": 547774, "epoch": 6599} {"train_loss": -27.65292739868164, "global_step": 547775, "epoch": 6599} {"train_loss": -27.4938907623291, "global_step": 547776, "epoch": 6599} {"train_loss": -27.640363693237305, "global_step": 547777, "epoch": 6599} {"train_loss": -28.211618423461914, "global_step": 547778, "epoch": 6599} {"train_loss": -27.663915634155273, "global_step": 547779, "epoch": 6599} {"train_loss": -27.634754180908203, "global_step": 547780, "epoch": 6599} {"train_loss": -27.380340576171875, "global_step": 547781, "epoch": 6599} {"train_loss": -27.539886474609375, "global_step": 547782, "epoch": 6599} {"train_loss": -27.79779624938965, "global_step": 547783, "epoch": 6599} {"train_loss": -27.43219566345215, "global_step": 547784, "epoch": 6599} {"train_loss": -27.841276168823242, "global_step": 547785, "epoch": 6599} {"train_loss": -27.5887508392334, "global_step": 547786, "epoch": 6599} {"train_loss": -27.644149780273438, "global_step": 547787, "epoch": 6599} {"train_loss": -27.673871994018555, "global_step": 547788, "epoch": 6599} {"train_loss": -27.910329818725586, "global_step": 547789, "epoch": 6599} {"train_loss": -27.626922607421875, "global_step": 547790, "epoch": 6599} {"train_loss": -27.906982421875, "global_step": 547791, "epoch": 6599} {"train_loss": -27.174890518188477, "global_step": 547792, "epoch": 6599} {"train_loss": -27.561185836791992, "global_step": 547793, "epoch": 6599} {"train_loss": -27.594547271728516, "global_step": 547794, "epoch": 6599} {"train_loss": -27.958209991455078, "global_step": 547795, "epoch": 6599} {"train_loss": -27.7322940826416, "global_step": 547796, "epoch": 6599} {"train_loss": -27.670934677124023, "global_step": 547797, "epoch": 6599} {"train_loss": -27.46705436706543, "global_step": 547798, "epoch": 6599} {"train_loss": -27.66209990719715, "global_step": 547799, "epoch": 6599, "val_loss": 6567251.0} {"train_loss": -26.79416847229004, "global_step": 547800, "epoch": 6600} {"train_loss": -25.46729850769043, "global_step": 547801, "epoch": 6600} {"train_loss": -26.450885772705078, "global_step": 547802, "epoch": 6600} {"train_loss": -25.47960662841797, "global_step": 547803, "epoch": 6600} {"train_loss": -26.714704513549805, "global_step": 547804, "epoch": 6600} {"train_loss": -27.082284927368164, "global_step": 547805, "epoch": 6600} {"train_loss": -26.5079288482666, "global_step": 547806, "epoch": 6600} {"train_loss": -27.101917266845703, "global_step": 547807, "epoch": 6600} {"train_loss": -26.443374633789062, "global_step": 547808, "epoch": 6600} {"train_loss": -27.1922607421875, "global_step": 547809, "epoch": 6600} {"train_loss": -26.86820411682129, "global_step": 547810, "epoch": 6600} {"train_loss": -26.92116355895996, "global_step": 547811, "epoch": 6600} {"train_loss": -26.807336807250977, "global_step": 547812, "epoch": 6600} {"train_loss": -27.347702026367188, "global_step": 547813, "epoch": 6600} {"train_loss": -27.14871597290039, "global_step": 547814, "epoch": 6600} {"train_loss": -27.255905151367188, "global_step": 547815, "epoch": 6600} {"train_loss": -27.080066680908203, "global_step": 547816, "epoch": 6600} {"train_loss": -26.983963012695312, "global_step": 547817, "epoch": 6600} {"train_loss": -27.088397979736328, "global_step": 547818, "epoch": 6600} {"train_loss": -27.29878807067871, "global_step": 547819, "epoch": 6600} {"train_loss": -27.469501495361328, "global_step": 547820, "epoch": 6600} {"train_loss": -27.342763900756836, "global_step": 547821, "epoch": 6600} {"train_loss": -27.548416137695312, "global_step": 547822, "epoch": 6600} {"train_loss": -27.55691909790039, "global_step": 547823, "epoch": 6600} {"train_loss": -27.147064208984375, "global_step": 547824, "epoch": 6600} {"train_loss": -27.08033561706543, "global_step": 547825, "epoch": 6600} {"train_loss": -27.487546920776367, "global_step": 547826, "epoch": 6600} {"train_loss": -27.468368530273438, "global_step": 547827, "epoch": 6600} {"train_loss": -27.457883834838867, "global_step": 547828, "epoch": 6600} {"train_loss": -27.602914810180664, "global_step": 547829, "epoch": 6600} {"train_loss": -27.585554122924805, "global_step": 547830, "epoch": 6600} {"train_loss": -27.699506759643555, "global_step": 547831, "epoch": 6600} {"train_loss": -27.549365997314453, "global_step": 547832, "epoch": 6600} {"train_loss": -27.78156852722168, "global_step": 547833, "epoch": 6600} {"train_loss": -27.606470108032227, "global_step": 547834, "epoch": 6600} {"train_loss": -27.71820068359375, "global_step": 547835, "epoch": 6600} {"train_loss": -27.723163604736328, "global_step": 547836, "epoch": 6600} {"train_loss": -27.466217041015625, "global_step": 547837, "epoch": 6600} {"train_loss": -27.925735473632812, "global_step": 547838, "epoch": 6600} {"train_loss": -27.8490047454834, "global_step": 547839, "epoch": 6600} {"train_loss": -27.727033615112305, "global_step": 547840, "epoch": 6600} {"train_loss": -27.925886154174805, "global_step": 547841, "epoch": 6600} {"train_loss": -28.019445419311523, "global_step": 547842, "epoch": 6600} {"train_loss": -27.779056549072266, "global_step": 547843, "epoch": 6600} {"train_loss": -28.032642364501953, "global_step": 547844, "epoch": 6600} {"train_loss": -27.916040420532227, "global_step": 547845, "epoch": 6600} {"train_loss": -27.594141006469727, "global_step": 547846, "epoch": 6600} {"train_loss": -27.99981689453125, "global_step": 547847, "epoch": 6600} {"train_loss": -27.97580337524414, "global_step": 547848, "epoch": 6600} {"train_loss": -28.1772403717041, "global_step": 547849, "epoch": 6600} {"train_loss": -27.55877685546875, "global_step": 547850, "epoch": 6600} {"train_loss": -27.891616821289062, "global_step": 547851, "epoch": 6600} {"train_loss": -28.1873836517334, "global_step": 547852, "epoch": 6600} {"train_loss": -27.85687828063965, "global_step": 547853, "epoch": 6600} {"train_loss": -27.801313400268555, "global_step": 547854, "epoch": 6600} {"train_loss": -28.0148868560791, "global_step": 547855, "epoch": 6600} {"train_loss": -28.075946807861328, "global_step": 547856, "epoch": 6600} {"train_loss": -28.35053825378418, "global_step": 547857, "epoch": 6600} {"train_loss": -27.853376388549805, "global_step": 547858, "epoch": 6600} {"train_loss": -27.819074630737305, "global_step": 547859, "epoch": 6600} {"train_loss": -27.846975326538086, "global_step": 547860, "epoch": 6600} {"train_loss": -27.68195152282715, "global_step": 547861, "epoch": 6600} {"train_loss": -27.823917388916016, "global_step": 547862, "epoch": 6600} {"train_loss": -28.083728790283203, "global_step": 547863, "epoch": 6600} {"train_loss": -28.064926147460938, "global_step": 547864, "epoch": 6600} {"train_loss": -27.780126571655273, "global_step": 547865, "epoch": 6600} {"train_loss": -28.18451499938965, "global_step": 547866, "epoch": 6600} {"train_loss": -28.10310173034668, "global_step": 547867, "epoch": 6600} {"train_loss": -28.03620719909668, "global_step": 547868, "epoch": 6600} {"train_loss": -27.808923721313477, "global_step": 547869, "epoch": 6600} {"train_loss": -27.7824764251709, "global_step": 547870, "epoch": 6600} {"train_loss": -27.918237686157227, "global_step": 547871, "epoch": 6600} {"train_loss": -27.949182510375977, "global_step": 547872, "epoch": 6600} {"train_loss": -27.620471954345703, "global_step": 547873, "epoch": 6600} {"train_loss": -27.749006271362305, "global_step": 547874, "epoch": 6600} {"train_loss": -27.761144638061523, "global_step": 547875, "epoch": 6600} {"train_loss": -27.604354858398438, "global_step": 547876, "epoch": 6600} {"train_loss": -26.941160202026367, "global_step": 547877, "epoch": 6600} {"train_loss": -26.977598190307617, "global_step": 547878, "epoch": 6600} {"train_loss": -26.615835189819336, "global_step": 547879, "epoch": 6600} {"train_loss": -27.10342788696289, "global_step": 547880, "epoch": 6600} {"train_loss": -27.669635772705078, "global_step": 547881, "epoch": 6600} {"train_loss": -27.50744690952531, "global_step": 547882, "epoch": 6600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6535329.0} {"train_loss": -26.240468978881836, "global_step": 547883, "epoch": 6601} {"train_loss": -26.356155395507812, "global_step": 547884, "epoch": 6601} {"train_loss": -26.557708740234375, "global_step": 547885, "epoch": 6601} {"train_loss": -26.638120651245117, "global_step": 547886, "epoch": 6601} {"train_loss": -26.688623428344727, "global_step": 547887, "epoch": 6601} {"train_loss": -26.422788619995117, "global_step": 547888, "epoch": 6601} {"train_loss": -26.531009674072266, "global_step": 547889, "epoch": 6601} {"train_loss": -26.501047134399414, "global_step": 547890, "epoch": 6601} {"train_loss": -26.67874526977539, "global_step": 547891, "epoch": 6601} {"train_loss": -26.423288345336914, "global_step": 547892, "epoch": 6601} {"train_loss": -26.209264755249023, "global_step": 547893, "epoch": 6601} {"train_loss": -26.896331787109375, "global_step": 547894, "epoch": 6601} {"train_loss": -26.845930099487305, "global_step": 547895, "epoch": 6601} {"train_loss": -27.00935173034668, "global_step": 547896, "epoch": 6601} {"train_loss": -26.79424476623535, "global_step": 547897, "epoch": 6601} {"train_loss": -26.675851821899414, "global_step": 547898, "epoch": 6601} {"train_loss": -27.196186065673828, "global_step": 547899, "epoch": 6601} {"train_loss": -27.098682403564453, "global_step": 547900, "epoch": 6601} {"train_loss": -27.17658042907715, "global_step": 547901, "epoch": 6601} {"train_loss": -27.25209617614746, "global_step": 547902, "epoch": 6601} {"train_loss": -27.163068771362305, "global_step": 547903, "epoch": 6601} {"train_loss": -27.096261978149414, "global_step": 547904, "epoch": 6601} {"train_loss": -27.4954833984375, "global_step": 547905, "epoch": 6601} {"train_loss": -26.920740127563477, "global_step": 547906, "epoch": 6601} {"train_loss": -27.17047691345215, "global_step": 547907, "epoch": 6601} {"train_loss": -27.03033447265625, "global_step": 547908, "epoch": 6601} {"train_loss": -27.25233268737793, "global_step": 547909, "epoch": 6601} {"train_loss": -27.528379440307617, "global_step": 547910, "epoch": 6601} {"train_loss": -27.739917755126953, "global_step": 547911, "epoch": 6601} {"train_loss": -27.24786376953125, "global_step": 547912, "epoch": 6601} {"train_loss": -27.168506622314453, "global_step": 547913, "epoch": 6601} {"train_loss": -27.489334106445312, "global_step": 547914, "epoch": 6601} {"train_loss": -27.46461296081543, "global_step": 547915, "epoch": 6601} {"train_loss": -27.306873321533203, "global_step": 547916, "epoch": 6601} {"train_loss": -27.33877944946289, "global_step": 547917, "epoch": 6601} {"train_loss": -27.232192993164062, "global_step": 547918, "epoch": 6601} {"train_loss": -27.79127311706543, "global_step": 547919, "epoch": 6601} {"train_loss": -27.2353515625, "global_step": 547920, "epoch": 6601} {"train_loss": -27.829553604125977, "global_step": 547921, "epoch": 6601} {"train_loss": -27.68788719177246, "global_step": 547922, "epoch": 6601} {"train_loss": -27.992074966430664, "global_step": 547923, "epoch": 6601} {"train_loss": -27.727319717407227, "global_step": 547924, "epoch": 6601} {"train_loss": -27.78521728515625, "global_step": 547925, "epoch": 6601} {"train_loss": -27.909414291381836, "global_step": 547926, "epoch": 6601} {"train_loss": -27.544422149658203, "global_step": 547927, "epoch": 6601} {"train_loss": -27.498687744140625, "global_step": 547928, "epoch": 6601} {"train_loss": -27.70210075378418, "global_step": 547929, "epoch": 6601} {"train_loss": -28.07622718811035, "global_step": 547930, "epoch": 6601} {"train_loss": -27.835834503173828, "global_step": 547931, "epoch": 6601} {"train_loss": -28.126392364501953, "global_step": 547932, "epoch": 6601} {"train_loss": -27.791339874267578, "global_step": 547933, "epoch": 6601} {"train_loss": -27.655292510986328, "global_step": 547934, "epoch": 6601} {"train_loss": -28.03301429748535, "global_step": 547935, "epoch": 6601} {"train_loss": -27.546823501586914, "global_step": 547936, "epoch": 6601} {"train_loss": -28.10479736328125, "global_step": 547937, "epoch": 6601} {"train_loss": -27.83304786682129, "global_step": 547938, "epoch": 6601} {"train_loss": -27.554197311401367, "global_step": 547939, "epoch": 6601} {"train_loss": -27.86634635925293, "global_step": 547940, "epoch": 6601} {"train_loss": -27.70611572265625, "global_step": 547941, "epoch": 6601} {"train_loss": -27.70244789123535, "global_step": 547942, "epoch": 6601} {"train_loss": -27.95505142211914, "global_step": 547943, "epoch": 6601} {"train_loss": -27.798974990844727, "global_step": 547944, "epoch": 6601} {"train_loss": -28.183263778686523, "global_step": 547945, "epoch": 6601} {"train_loss": -27.441864013671875, "global_step": 547946, "epoch": 6601} {"train_loss": -27.877511978149414, "global_step": 547947, "epoch": 6601} {"train_loss": -28.251569747924805, "global_step": 547948, "epoch": 6601} {"train_loss": -28.038578033447266, "global_step": 547949, "epoch": 6601} {"train_loss": -28.146366119384766, "global_step": 547950, "epoch": 6601} {"train_loss": -27.372785568237305, "global_step": 547951, "epoch": 6601} {"train_loss": -27.22352409362793, "global_step": 547952, "epoch": 6601} {"train_loss": -27.114355087280273, "global_step": 547953, "epoch": 6601} {"train_loss": -27.633441925048828, "global_step": 547954, "epoch": 6601} {"train_loss": -27.964691162109375, "global_step": 547955, "epoch": 6601} {"train_loss": -26.941791534423828, "global_step": 547956, "epoch": 6601} {"train_loss": -26.9088191986084, "global_step": 547957, "epoch": 6601} {"train_loss": -27.783939361572266, "global_step": 547958, "epoch": 6601} {"train_loss": -27.27467155456543, "global_step": 547959, "epoch": 6601} {"train_loss": -27.535358428955078, "global_step": 547960, "epoch": 6601} {"train_loss": -27.83707046508789, "global_step": 547961, "epoch": 6601} {"train_loss": -27.65327262878418, "global_step": 547962, "epoch": 6601} {"train_loss": -27.443225860595703, "global_step": 547963, "epoch": 6601} {"train_loss": -27.43338394165039, "global_step": 547964, "epoch": 6601} {"train_loss": -27.38663461983922, "global_step": 547965, "epoch": 6601, "val_loss": 6532696.0} {"train_loss": -26.0814208984375, "global_step": 547966, "epoch": 6602} {"train_loss": -25.265073776245117, "global_step": 547967, "epoch": 6602} {"train_loss": -25.55243682861328, "global_step": 547968, "epoch": 6602} {"train_loss": -24.621536254882812, "global_step": 547969, "epoch": 6602} {"train_loss": -25.93674659729004, "global_step": 547970, "epoch": 6602} {"train_loss": -25.5228214263916, "global_step": 547971, "epoch": 6602} {"train_loss": -25.633258819580078, "global_step": 547972, "epoch": 6602} {"train_loss": -25.45208168029785, "global_step": 547973, "epoch": 6602} {"train_loss": -26.088916778564453, "global_step": 547974, "epoch": 6602} {"train_loss": -26.102685928344727, "global_step": 547975, "epoch": 6602} {"train_loss": -25.962860107421875, "global_step": 547976, "epoch": 6602} {"train_loss": -27.008981704711914, "global_step": 547977, "epoch": 6602} {"train_loss": -25.886648178100586, "global_step": 547978, "epoch": 6602} {"train_loss": -26.596343994140625, "global_step": 547979, "epoch": 6602} {"train_loss": -26.7906436920166, "global_step": 547980, "epoch": 6602} {"train_loss": -26.73797035217285, "global_step": 547981, "epoch": 6602} {"train_loss": -26.894556045532227, "global_step": 547982, "epoch": 6602} {"train_loss": -26.446121215820312, "global_step": 547983, "epoch": 6602} {"train_loss": -27.11612892150879, "global_step": 547984, "epoch": 6602} {"train_loss": -26.767972946166992, "global_step": 547985, "epoch": 6602} {"train_loss": -26.419666290283203, "global_step": 547986, "epoch": 6602} {"train_loss": -27.042617797851562, "global_step": 547987, "epoch": 6602} {"train_loss": -26.775842666625977, "global_step": 547988, "epoch": 6602} {"train_loss": -26.910877227783203, "global_step": 547989, "epoch": 6602} {"train_loss": -26.662158966064453, "global_step": 547990, "epoch": 6602} {"train_loss": -27.268299102783203, "global_step": 547991, "epoch": 6602} {"train_loss": -26.903335571289062, "global_step": 547992, "epoch": 6602} {"train_loss": -27.326065063476562, "global_step": 547993, "epoch": 6602} {"train_loss": -27.015066146850586, "global_step": 547994, "epoch": 6602} {"train_loss": -27.142059326171875, "global_step": 547995, "epoch": 6602} {"train_loss": -27.1610164642334, "global_step": 547996, "epoch": 6602} {"train_loss": -27.204669952392578, "global_step": 547997, "epoch": 6602} {"train_loss": -27.53769302368164, "global_step": 547998, "epoch": 6602} {"train_loss": -27.360095977783203, "global_step": 547999, "epoch": 6602} {"train_loss": -27.22547721862793, "global_step": 548000, "epoch": 6602} {"train_loss": -27.396228790283203, "global_step": 548001, "epoch": 6602} {"train_loss": -27.78095817565918, "global_step": 548002, "epoch": 6602} {"train_loss": -27.387451171875, "global_step": 548003, "epoch": 6602} {"train_loss": -27.802570343017578, "global_step": 548004, "epoch": 6602} {"train_loss": -27.8005428314209, "global_step": 548005, "epoch": 6602} {"train_loss": -27.346662521362305, "global_step": 548006, "epoch": 6602} {"train_loss": -27.553394317626953, "global_step": 548007, "epoch": 6602} {"train_loss": -27.349853515625, "global_step": 548008, "epoch": 6602} {"train_loss": -27.722599029541016, "global_step": 548009, "epoch": 6602} {"train_loss": -27.523853302001953, "global_step": 548010, "epoch": 6602} {"train_loss": -27.722980499267578, "global_step": 548011, "epoch": 6602} {"train_loss": -27.521398544311523, "global_step": 548012, "epoch": 6602} {"train_loss": -27.581457138061523, "global_step": 548013, "epoch": 6602} {"train_loss": -28.16548728942871, "global_step": 548014, "epoch": 6602} {"train_loss": -27.40386962890625, "global_step": 548015, "epoch": 6602} {"train_loss": -27.57187843322754, "global_step": 548016, "epoch": 6602} {"train_loss": -27.88507080078125, "global_step": 548017, "epoch": 6602} {"train_loss": -27.848834991455078, "global_step": 548018, "epoch": 6602} {"train_loss": -28.135679244995117, "global_step": 548019, "epoch": 6602} {"train_loss": -27.704580307006836, "global_step": 548020, "epoch": 6602} {"train_loss": -27.927570343017578, "global_step": 548021, "epoch": 6602} {"train_loss": -27.797826766967773, "global_step": 548022, "epoch": 6602} {"train_loss": -27.78144645690918, "global_step": 548023, "epoch": 6602} {"train_loss": -27.896581649780273, "global_step": 548024, "epoch": 6602} {"train_loss": -27.85881996154785, "global_step": 548025, "epoch": 6602} {"train_loss": -27.679105758666992, "global_step": 548026, "epoch": 6602} {"train_loss": -27.885757446289062, "global_step": 548027, "epoch": 6602} {"train_loss": -27.954511642456055, "global_step": 548028, "epoch": 6602} {"train_loss": -28.118804931640625, "global_step": 548029, "epoch": 6602} {"train_loss": -27.891366958618164, "global_step": 548030, "epoch": 6602} {"train_loss": -27.876256942749023, "global_step": 548031, "epoch": 6602} {"train_loss": -27.812971115112305, "global_step": 548032, "epoch": 6602} {"train_loss": -27.93646812438965, "global_step": 548033, "epoch": 6602} {"train_loss": -27.8271484375, "global_step": 548034, "epoch": 6602} {"train_loss": -27.676252365112305, "global_step": 548035, "epoch": 6602} {"train_loss": -27.667102813720703, "global_step": 548036, "epoch": 6602} {"train_loss": -27.80681800842285, "global_step": 548037, "epoch": 6602} {"train_loss": -27.856367111206055, "global_step": 548038, "epoch": 6602} {"train_loss": -28.1849308013916, "global_step": 548039, "epoch": 6602} {"train_loss": -28.043212890625, "global_step": 548040, "epoch": 6602} {"train_loss": -27.760034561157227, "global_step": 548041, "epoch": 6602} {"train_loss": -28.086841583251953, "global_step": 548042, "epoch": 6602} {"train_loss": -28.06808853149414, "global_step": 548043, "epoch": 6602} {"train_loss": -28.117136001586914, "global_step": 548044, "epoch": 6602} {"train_loss": -27.908716201782227, "global_step": 548045, "epoch": 6602} {"train_loss": -28.036880493164062, "global_step": 548046, "epoch": 6602} {"train_loss": -28.30634880065918, "global_step": 548047, "epoch": 6602} {"train_loss": -27.28017763344638, "global_step": 548048, "epoch": 6602, "val_loss": 6541491.0} {"train_loss": -26.786718368530273, "global_step": 548049, "epoch": 6603} {"train_loss": -26.868600845336914, "global_step": 548050, "epoch": 6603} {"train_loss": -27.54216957092285, "global_step": 548051, "epoch": 6603} {"train_loss": -27.14946937561035, "global_step": 548052, "epoch": 6603} {"train_loss": -27.496381759643555, "global_step": 548053, "epoch": 6603} {"train_loss": -26.69107437133789, "global_step": 548054, "epoch": 6603} {"train_loss": -25.90130043029785, "global_step": 548055, "epoch": 6603} {"train_loss": -25.835248947143555, "global_step": 548056, "epoch": 6603} {"train_loss": -26.47382164001465, "global_step": 548057, "epoch": 6603} {"train_loss": -26.955402374267578, "global_step": 548058, "epoch": 6603} {"train_loss": -27.1910343170166, "global_step": 548059, "epoch": 6603} {"train_loss": -26.88899040222168, "global_step": 548060, "epoch": 6603} {"train_loss": -27.184179306030273, "global_step": 548061, "epoch": 6603} {"train_loss": -27.347610473632812, "global_step": 548062, "epoch": 6603} {"train_loss": -27.184492111206055, "global_step": 548063, "epoch": 6603} {"train_loss": -26.986806869506836, "global_step": 548064, "epoch": 6603} {"train_loss": -27.37176513671875, "global_step": 548065, "epoch": 6603} {"train_loss": -26.989013671875, "global_step": 548066, "epoch": 6603} {"train_loss": -27.16695213317871, "global_step": 548067, "epoch": 6603} {"train_loss": -27.724918365478516, "global_step": 548068, "epoch": 6603} {"train_loss": -27.326007843017578, "global_step": 548069, "epoch": 6603} {"train_loss": -27.31587791442871, "global_step": 548070, "epoch": 6603} {"train_loss": -27.620023727416992, "global_step": 548071, "epoch": 6603} {"train_loss": -27.416677474975586, "global_step": 548072, "epoch": 6603} {"train_loss": -27.68115234375, "global_step": 548073, "epoch": 6603} {"train_loss": -27.735382080078125, "global_step": 548074, "epoch": 6603} {"train_loss": -27.259496688842773, "global_step": 548075, "epoch": 6603} {"train_loss": -27.610462188720703, "global_step": 548076, "epoch": 6603} {"train_loss": -27.6877498626709, "global_step": 548077, "epoch": 6603} {"train_loss": -27.6324462890625, "global_step": 548078, "epoch": 6603} {"train_loss": -27.77412223815918, "global_step": 548079, "epoch": 6603} {"train_loss": -27.49390983581543, "global_step": 548080, "epoch": 6603} {"train_loss": -27.868885040283203, "global_step": 548081, "epoch": 6603} {"train_loss": -27.856595993041992, "global_step": 548082, "epoch": 6603} {"train_loss": -28.038888931274414, "global_step": 548083, "epoch": 6603} {"train_loss": -27.826969146728516, "global_step": 548084, "epoch": 6603} {"train_loss": -27.9168758392334, "global_step": 548085, "epoch": 6603} {"train_loss": -28.118616104125977, "global_step": 548086, "epoch": 6603} {"train_loss": -27.97027015686035, "global_step": 548087, "epoch": 6603} {"train_loss": -27.648609161376953, "global_step": 548088, "epoch": 6603} {"train_loss": -27.702478408813477, "global_step": 548089, "epoch": 6603} {"train_loss": -27.586084365844727, "global_step": 548090, "epoch": 6603} {"train_loss": -27.880102157592773, "global_step": 548091, "epoch": 6603} {"train_loss": -27.695127487182617, "global_step": 548092, "epoch": 6603} {"train_loss": -27.8841552734375, "global_step": 548093, "epoch": 6603} {"train_loss": -28.038070678710938, "global_step": 548094, "epoch": 6603} {"train_loss": -27.724058151245117, "global_step": 548095, "epoch": 6603} {"train_loss": -27.855676651000977, "global_step": 548096, "epoch": 6603} {"train_loss": -27.67426109313965, "global_step": 548097, "epoch": 6603} {"train_loss": -28.013193130493164, "global_step": 548098, "epoch": 6603} {"train_loss": -27.80938720703125, "global_step": 548099, "epoch": 6603} {"train_loss": -27.66705894470215, "global_step": 548100, "epoch": 6603} {"train_loss": -27.6761531829834, "global_step": 548101, "epoch": 6603} {"train_loss": -27.918685913085938, "global_step": 548102, "epoch": 6603} {"train_loss": -27.92649269104004, "global_step": 548103, "epoch": 6603} {"train_loss": -27.829084396362305, "global_step": 548104, "epoch": 6603} {"train_loss": -27.766942977905273, "global_step": 548105, "epoch": 6603} {"train_loss": -27.24627685546875, "global_step": 548106, "epoch": 6603} {"train_loss": -27.52320671081543, "global_step": 548107, "epoch": 6603} {"train_loss": -27.966251373291016, "global_step": 548108, "epoch": 6603} {"train_loss": -27.896961212158203, "global_step": 548109, "epoch": 6603} {"train_loss": -28.00092124938965, "global_step": 548110, "epoch": 6603} {"train_loss": -27.798559188842773, "global_step": 548111, "epoch": 6603} {"train_loss": -27.703632354736328, "global_step": 548112, "epoch": 6603} {"train_loss": -27.58835792541504, "global_step": 548113, "epoch": 6603} {"train_loss": -27.491514205932617, "global_step": 548114, "epoch": 6603} {"train_loss": -27.60101890563965, "global_step": 548115, "epoch": 6603} {"train_loss": -27.818714141845703, "global_step": 548116, "epoch": 6603} {"train_loss": -27.632068634033203, "global_step": 548117, "epoch": 6603} {"train_loss": -28.003881454467773, "global_step": 548118, "epoch": 6603} {"train_loss": -27.936965942382812, "global_step": 548119, "epoch": 6603} {"train_loss": -27.721332550048828, "global_step": 548120, "epoch": 6603} {"train_loss": -27.900970458984375, "global_step": 548121, "epoch": 6603} {"train_loss": -28.003406524658203, "global_step": 548122, "epoch": 6603} {"train_loss": -27.929243087768555, "global_step": 548123, "epoch": 6603} {"train_loss": -28.301864624023438, "global_step": 548124, "epoch": 6603} {"train_loss": -28.118627548217773, "global_step": 548125, "epoch": 6603} {"train_loss": -27.949777603149414, "global_step": 548126, "epoch": 6603} {"train_loss": -27.79290771484375, "global_step": 548127, "epoch": 6603} {"train_loss": -27.86405372619629, "global_step": 548128, "epoch": 6603} {"train_loss": -27.794958114624023, "global_step": 548129, "epoch": 6603} {"train_loss": -27.574209213256836, "global_step": 548130, "epoch": 6603} {"train_loss": -27.597463607788086, "global_step": 548131, "epoch": 6603, "val_loss": 6588196.0} {"train_loss": -26.834247589111328, "global_step": 548132, "epoch": 6604} {"train_loss": -27.30647850036621, "global_step": 548133, "epoch": 6604} {"train_loss": -26.508642196655273, "global_step": 548134, "epoch": 6604} {"train_loss": -27.35675048828125, "global_step": 548135, "epoch": 6604} {"train_loss": -26.537139892578125, "global_step": 548136, "epoch": 6604} {"train_loss": -26.77329444885254, "global_step": 548137, "epoch": 6604} {"train_loss": -26.965576171875, "global_step": 548138, "epoch": 6604} {"train_loss": -27.18293571472168, "global_step": 548139, "epoch": 6604} {"train_loss": -27.20303726196289, "global_step": 548140, "epoch": 6604} {"train_loss": -26.58696937561035, "global_step": 548141, "epoch": 6604} {"train_loss": -26.7464542388916, "global_step": 548142, "epoch": 6604} {"train_loss": -27.38080406188965, "global_step": 548143, "epoch": 6604} {"train_loss": -27.13445472717285, "global_step": 548144, "epoch": 6604} {"train_loss": -26.943021774291992, "global_step": 548145, "epoch": 6604} {"train_loss": -27.520246505737305, "global_step": 548146, "epoch": 6604} {"train_loss": -27.270740509033203, "global_step": 548147, "epoch": 6604} {"train_loss": -27.44733238220215, "global_step": 548148, "epoch": 6604} {"train_loss": -27.1060791015625, "global_step": 548149, "epoch": 6604} {"train_loss": -27.325841903686523, "global_step": 548150, "epoch": 6604} {"train_loss": -27.4105224609375, "global_step": 548151, "epoch": 6604} {"train_loss": -27.473865509033203, "global_step": 548152, "epoch": 6604} {"train_loss": -27.3109073638916, "global_step": 548153, "epoch": 6604} {"train_loss": -27.317331314086914, "global_step": 548154, "epoch": 6604} {"train_loss": -27.509557723999023, "global_step": 548155, "epoch": 6604} {"train_loss": -27.851282119750977, "global_step": 548156, "epoch": 6604} {"train_loss": -27.686960220336914, "global_step": 548157, "epoch": 6604} {"train_loss": -27.459989547729492, "global_step": 548158, "epoch": 6604} {"train_loss": -27.75347900390625, "global_step": 548159, "epoch": 6604} {"train_loss": -27.758594512939453, "global_step": 548160, "epoch": 6604} {"train_loss": -27.56633949279785, "global_step": 548161, "epoch": 6604} {"train_loss": -27.188323974609375, "global_step": 548162, "epoch": 6604} {"train_loss": -27.32892417907715, "global_step": 548163, "epoch": 6604} {"train_loss": -27.62628746032715, "global_step": 548164, "epoch": 6604} {"train_loss": -27.8935546875, "global_step": 548165, "epoch": 6604} {"train_loss": -27.924102783203125, "global_step": 548166, "epoch": 6604} {"train_loss": -27.731002807617188, "global_step": 548167, "epoch": 6604} {"train_loss": -27.569122314453125, "global_step": 548168, "epoch": 6604} {"train_loss": -27.494342803955078, "global_step": 548169, "epoch": 6604} {"train_loss": -27.622100830078125, "global_step": 548170, "epoch": 6604} {"train_loss": -27.83112907409668, "global_step": 548171, "epoch": 6604} {"train_loss": -27.85355567932129, "global_step": 548172, "epoch": 6604} {"train_loss": -28.15915870666504, "global_step": 548173, "epoch": 6604} {"train_loss": -27.983505249023438, "global_step": 548174, "epoch": 6604} {"train_loss": -27.879369735717773, "global_step": 548175, "epoch": 6604} {"train_loss": -27.963781356811523, "global_step": 548176, "epoch": 6604} {"train_loss": -27.70562744140625, "global_step": 548177, "epoch": 6604} {"train_loss": -27.93436050415039, "global_step": 548178, "epoch": 6604} {"train_loss": -28.03057289123535, "global_step": 548179, "epoch": 6604} {"train_loss": -27.95832633972168, "global_step": 548180, "epoch": 6604} {"train_loss": -28.0190372467041, "global_step": 548181, "epoch": 6604} {"train_loss": -27.85951042175293, "global_step": 548182, "epoch": 6604} {"train_loss": -27.6259708404541, "global_step": 548183, "epoch": 6604} {"train_loss": -28.2409610748291, "global_step": 548184, "epoch": 6604} {"train_loss": -27.7160701751709, "global_step": 548185, "epoch": 6604} {"train_loss": -28.071781158447266, "global_step": 548186, "epoch": 6604} {"train_loss": -27.7814998626709, "global_step": 548187, "epoch": 6604} {"train_loss": -27.539310455322266, "global_step": 548188, "epoch": 6604} {"train_loss": -27.802814483642578, "global_step": 548189, "epoch": 6604} {"train_loss": -27.72650718688965, "global_step": 548190, "epoch": 6604} {"train_loss": -27.274078369140625, "global_step": 548191, "epoch": 6604} {"train_loss": -27.42542839050293, "global_step": 548192, "epoch": 6604} {"train_loss": -27.65081787109375, "global_step": 548193, "epoch": 6604} {"train_loss": -27.9096736907959, "global_step": 548194, "epoch": 6604} {"train_loss": -28.022506713867188, "global_step": 548195, "epoch": 6604} {"train_loss": -27.818464279174805, "global_step": 548196, "epoch": 6604} {"train_loss": -27.587087631225586, "global_step": 548197, "epoch": 6604} {"train_loss": -27.930622100830078, "global_step": 548198, "epoch": 6604} {"train_loss": -28.079303741455078, "global_step": 548199, "epoch": 6604} {"train_loss": -27.992902755737305, "global_step": 548200, "epoch": 6604} {"train_loss": -27.83936882019043, "global_step": 548201, "epoch": 6604} {"train_loss": -27.895360946655273, "global_step": 548202, "epoch": 6604} {"train_loss": -27.790149688720703, "global_step": 548203, "epoch": 6604} {"train_loss": -27.89398765563965, "global_step": 548204, "epoch": 6604} {"train_loss": -27.701404571533203, "global_step": 548205, "epoch": 6604} {"train_loss": -27.870473861694336, "global_step": 548206, "epoch": 6604} {"train_loss": -27.745290756225586, "global_step": 548207, "epoch": 6604} {"train_loss": -27.711612701416016, "global_step": 548208, "epoch": 6604} {"train_loss": -27.639265060424805, "global_step": 548209, "epoch": 6604} {"train_loss": -27.877338409423828, "global_step": 548210, "epoch": 6604} {"train_loss": -27.810163497924805, "global_step": 548211, "epoch": 6604} {"train_loss": -28.09210205078125, "global_step": 548212, "epoch": 6604} {"train_loss": -27.68646240234375, "global_step": 548213, "epoch": 6604} {"train_loss": -27.614412974162274, "global_step": 548214, "epoch": 6604, "val_loss": 6604861.0} {"train_loss": -27.54717445373535, "global_step": 548215, "epoch": 6605} {"train_loss": -27.455045700073242, "global_step": 548216, "epoch": 6605} {"train_loss": -27.711292266845703, "global_step": 548217, "epoch": 6605} {"train_loss": -27.58945083618164, "global_step": 548218, "epoch": 6605} {"train_loss": -27.785165786743164, "global_step": 548219, "epoch": 6605} {"train_loss": -27.44403648376465, "global_step": 548220, "epoch": 6605} {"train_loss": -27.46729850769043, "global_step": 548221, "epoch": 6605} {"train_loss": -27.709280014038086, "global_step": 548222, "epoch": 6605} {"train_loss": -27.70709228515625, "global_step": 548223, "epoch": 6605} {"train_loss": -27.45123291015625, "global_step": 548224, "epoch": 6605} {"train_loss": -27.516326904296875, "global_step": 548225, "epoch": 6605} {"train_loss": -27.094593048095703, "global_step": 548226, "epoch": 6605} {"train_loss": -27.581893920898438, "global_step": 548227, "epoch": 6605} {"train_loss": -27.406494140625, "global_step": 548228, "epoch": 6605} {"train_loss": -27.214513778686523, "global_step": 548229, "epoch": 6605} {"train_loss": -27.721052169799805, "global_step": 548230, "epoch": 6605} {"train_loss": -27.6354923248291, "global_step": 548231, "epoch": 6605} {"train_loss": -27.3273983001709, "global_step": 548232, "epoch": 6605} {"train_loss": -27.442785263061523, "global_step": 548233, "epoch": 6605} {"train_loss": -27.652318954467773, "global_step": 548234, "epoch": 6605} {"train_loss": -27.133398056030273, "global_step": 548235, "epoch": 6605} {"train_loss": -28.017059326171875, "global_step": 548236, "epoch": 6605} {"train_loss": -27.606033325195312, "global_step": 548237, "epoch": 6605} {"train_loss": -27.93063735961914, "global_step": 548238, "epoch": 6605} {"train_loss": -27.15958023071289, "global_step": 548239, "epoch": 6605} {"train_loss": -27.997528076171875, "global_step": 548240, "epoch": 6605} {"train_loss": -27.658023834228516, "global_step": 548241, "epoch": 6605} {"train_loss": -27.570281982421875, "global_step": 548242, "epoch": 6605} {"train_loss": -27.447057723999023, "global_step": 548243, "epoch": 6605} {"train_loss": -27.7904052734375, "global_step": 548244, "epoch": 6605} {"train_loss": -27.6875057220459, "global_step": 548245, "epoch": 6605} {"train_loss": -27.557336807250977, "global_step": 548246, "epoch": 6605} {"train_loss": -27.589818954467773, "global_step": 548247, "epoch": 6605} {"train_loss": -27.78995132446289, "global_step": 548248, "epoch": 6605} {"train_loss": -27.78033447265625, "global_step": 548249, "epoch": 6605} {"train_loss": -27.580249786376953, "global_step": 548250, "epoch": 6605} {"train_loss": -27.795202255249023, "global_step": 548251, "epoch": 6605} {"train_loss": -27.988733291625977, "global_step": 548252, "epoch": 6605} {"train_loss": -27.962848663330078, "global_step": 548253, "epoch": 6605} {"train_loss": -27.45069694519043, "global_step": 548254, "epoch": 6605} {"train_loss": -27.935556411743164, "global_step": 548255, "epoch": 6605} {"train_loss": -27.746931076049805, "global_step": 548256, "epoch": 6605} {"train_loss": -27.442407608032227, "global_step": 548257, "epoch": 6605} {"train_loss": -27.591466903686523, "global_step": 548258, "epoch": 6605} {"train_loss": -27.564603805541992, "global_step": 548259, "epoch": 6605} {"train_loss": -27.80763053894043, "global_step": 548260, "epoch": 6605} {"train_loss": -27.8394832611084, "global_step": 548261, "epoch": 6605} {"train_loss": -27.134286880493164, "global_step": 548262, "epoch": 6605} {"train_loss": -27.501434326171875, "global_step": 548263, "epoch": 6605} {"train_loss": -27.559589385986328, "global_step": 548264, "epoch": 6605} {"train_loss": -27.504470825195312, "global_step": 548265, "epoch": 6605} {"train_loss": -27.299726486206055, "global_step": 548266, "epoch": 6605} {"train_loss": -27.537580490112305, "global_step": 548267, "epoch": 6605} {"train_loss": -27.438573837280273, "global_step": 548268, "epoch": 6605} {"train_loss": -27.155399322509766, "global_step": 548269, "epoch": 6605} {"train_loss": -27.668899536132812, "global_step": 548270, "epoch": 6605} {"train_loss": -27.329975128173828, "global_step": 548271, "epoch": 6605} {"train_loss": -27.793415069580078, "global_step": 548272, "epoch": 6605} {"train_loss": -27.621671676635742, "global_step": 548273, "epoch": 6605} {"train_loss": -27.594812393188477, "global_step": 548274, "epoch": 6605} {"train_loss": -27.89995765686035, "global_step": 548275, "epoch": 6605} {"train_loss": -27.45198631286621, "global_step": 548276, "epoch": 6605} {"train_loss": -27.54102897644043, "global_step": 548277, "epoch": 6605} {"train_loss": -27.77594566345215, "global_step": 548278, "epoch": 6605} {"train_loss": -27.696619033813477, "global_step": 548279, "epoch": 6605} {"train_loss": -27.238300323486328, "global_step": 548280, "epoch": 6605} {"train_loss": -27.76893424987793, "global_step": 548281, "epoch": 6605} {"train_loss": -27.660449981689453, "global_step": 548282, "epoch": 6605} {"train_loss": -27.814411163330078, "global_step": 548283, "epoch": 6605} {"train_loss": -27.4051570892334, "global_step": 548284, "epoch": 6605} {"train_loss": -27.93031883239746, "global_step": 548285, "epoch": 6605} {"train_loss": -27.75660514831543, "global_step": 548286, "epoch": 6605} {"train_loss": -27.752538681030273, "global_step": 548287, "epoch": 6605} {"train_loss": -27.459501266479492, "global_step": 548288, "epoch": 6605} {"train_loss": -27.95612907409668, "global_step": 548289, "epoch": 6605} {"train_loss": -27.684432983398438, "global_step": 548290, "epoch": 6605} {"train_loss": -27.739652633666992, "global_step": 548291, "epoch": 6605} {"train_loss": -27.79144287109375, "global_step": 548292, "epoch": 6605} {"train_loss": -27.412321090698242, "global_step": 548293, "epoch": 6605} {"train_loss": -28.053043365478516, "global_step": 548294, "epoch": 6605} {"train_loss": -27.77655029296875, "global_step": 548295, "epoch": 6605} {"train_loss": -27.71076011657715, "global_step": 548296, "epoch": 6605} {"train_loss": -27.626889837793556, "global_step": 548297, "epoch": 6605, "val_loss": 6564556.0} {"train_loss": -27.351980209350586, "global_step": 548298, "epoch": 6606} {"train_loss": -26.868070602416992, "global_step": 548299, "epoch": 6606} {"train_loss": -27.311864852905273, "global_step": 548300, "epoch": 6606} {"train_loss": -27.419483184814453, "global_step": 548301, "epoch": 6606} {"train_loss": -27.217721939086914, "global_step": 548302, "epoch": 6606} {"train_loss": -27.59173011779785, "global_step": 548303, "epoch": 6606} {"train_loss": -26.9357967376709, "global_step": 548304, "epoch": 6606} {"train_loss": -27.486865997314453, "global_step": 548305, "epoch": 6606} {"train_loss": -27.28663444519043, "global_step": 548306, "epoch": 6606} {"train_loss": -27.125446319580078, "global_step": 548307, "epoch": 6606} {"train_loss": -27.67738914489746, "global_step": 548308, "epoch": 6606} {"train_loss": -26.876928329467773, "global_step": 548309, "epoch": 6606} {"train_loss": -27.803457260131836, "global_step": 548310, "epoch": 6606} {"train_loss": -27.392011642456055, "global_step": 548311, "epoch": 6606} {"train_loss": -27.6799373626709, "global_step": 548312, "epoch": 6606} {"train_loss": -27.06449317932129, "global_step": 548313, "epoch": 6606} {"train_loss": -27.48121452331543, "global_step": 548314, "epoch": 6606} {"train_loss": -27.853803634643555, "global_step": 548315, "epoch": 6606} {"train_loss": -27.392261505126953, "global_step": 548316, "epoch": 6606} {"train_loss": -27.453628540039062, "global_step": 548317, "epoch": 6606} {"train_loss": -27.360654830932617, "global_step": 548318, "epoch": 6606} {"train_loss": -27.64377784729004, "global_step": 548319, "epoch": 6606} {"train_loss": -27.870147705078125, "global_step": 548320, "epoch": 6606} {"train_loss": -27.423725128173828, "global_step": 548321, "epoch": 6606} {"train_loss": -27.498804092407227, "global_step": 548322, "epoch": 6606} {"train_loss": -27.873489379882812, "global_step": 548323, "epoch": 6606} {"train_loss": -27.895029067993164, "global_step": 548324, "epoch": 6606} {"train_loss": -27.711444854736328, "global_step": 548325, "epoch": 6606} {"train_loss": -27.794904708862305, "global_step": 548326, "epoch": 6606} {"train_loss": -27.299468994140625, "global_step": 548327, "epoch": 6606} {"train_loss": -28.093358993530273, "global_step": 548328, "epoch": 6606} {"train_loss": -27.752912521362305, "global_step": 548329, "epoch": 6606} {"train_loss": -27.429433822631836, "global_step": 548330, "epoch": 6606} {"train_loss": -27.821945190429688, "global_step": 548331, "epoch": 6606} {"train_loss": -27.2731876373291, "global_step": 548332, "epoch": 6606} {"train_loss": -27.485788345336914, "global_step": 548333, "epoch": 6606} {"train_loss": -27.632104873657227, "global_step": 548334, "epoch": 6606} {"train_loss": -27.71225929260254, "global_step": 548335, "epoch": 6606} {"train_loss": -27.68819236755371, "global_step": 548336, "epoch": 6606} {"train_loss": -27.694822311401367, "global_step": 548337, "epoch": 6606} {"train_loss": -27.628345489501953, "global_step": 548338, "epoch": 6606} {"train_loss": -27.610509872436523, "global_step": 548339, "epoch": 6606} {"train_loss": -27.825254440307617, "global_step": 548340, "epoch": 6606} {"train_loss": -27.76874351501465, "global_step": 548341, "epoch": 6606} {"train_loss": -27.559675216674805, "global_step": 548342, "epoch": 6606} {"train_loss": -27.93863868713379, "global_step": 548343, "epoch": 6606} {"train_loss": -27.961811065673828, "global_step": 548344, "epoch": 6606} {"train_loss": -27.77667236328125, "global_step": 548345, "epoch": 6606} {"train_loss": -27.45977210998535, "global_step": 548346, "epoch": 6606} {"train_loss": -27.586450576782227, "global_step": 548347, "epoch": 6606} {"train_loss": -27.543798446655273, "global_step": 548348, "epoch": 6606} {"train_loss": -27.965377807617188, "global_step": 548349, "epoch": 6606} {"train_loss": -27.786331176757812, "global_step": 548350, "epoch": 6606} {"train_loss": -27.795734405517578, "global_step": 548351, "epoch": 6606} {"train_loss": -27.863584518432617, "global_step": 548352, "epoch": 6606} {"train_loss": -27.490015029907227, "global_step": 548353, "epoch": 6606} {"train_loss": -27.728612899780273, "global_step": 548354, "epoch": 6606} {"train_loss": -28.083173751831055, "global_step": 548355, "epoch": 6606} {"train_loss": -27.94989013671875, "global_step": 548356, "epoch": 6606} {"train_loss": -27.951629638671875, "global_step": 548357, "epoch": 6606} {"train_loss": -27.652185440063477, "global_step": 548358, "epoch": 6606} {"train_loss": -27.63018226623535, "global_step": 548359, "epoch": 6606} {"train_loss": -27.736572265625, "global_step": 548360, "epoch": 6606} {"train_loss": -28.239133834838867, "global_step": 548361, "epoch": 6606} {"train_loss": -27.750415802001953, "global_step": 548362, "epoch": 6606} {"train_loss": -27.689361572265625, "global_step": 548363, "epoch": 6606} {"train_loss": -27.74969482421875, "global_step": 548364, "epoch": 6606} {"train_loss": -27.483280181884766, "global_step": 548365, "epoch": 6606} {"train_loss": -27.60576820373535, "global_step": 548366, "epoch": 6606} {"train_loss": -28.05051612854004, "global_step": 548367, "epoch": 6606} {"train_loss": -27.8406982421875, "global_step": 548368, "epoch": 6606} {"train_loss": -27.891071319580078, "global_step": 548369, "epoch": 6606} {"train_loss": -27.369077682495117, "global_step": 548370, "epoch": 6606} {"train_loss": -27.46278190612793, "global_step": 548371, "epoch": 6606} {"train_loss": -27.91077995300293, "global_step": 548372, "epoch": 6606} {"train_loss": -27.85584831237793, "global_step": 548373, "epoch": 6606} {"train_loss": -27.51837158203125, "global_step": 548374, "epoch": 6606} {"train_loss": -27.512470245361328, "global_step": 548375, "epoch": 6606} {"train_loss": -28.048877716064453, "global_step": 548376, "epoch": 6606} {"train_loss": -27.77593994140625, "global_step": 548377, "epoch": 6606} {"train_loss": -27.501937866210938, "global_step": 548378, "epoch": 6606} {"train_loss": -27.485395431518555, "global_step": 548379, "epoch": 6606} {"train_loss": -27.61495631574148, "global_step": 548380, "epoch": 6606, "val_loss": 6588870.0} {"train_loss": -26.8178768157959, "global_step": 548381, "epoch": 6607} {"train_loss": -26.04043960571289, "global_step": 548382, "epoch": 6607} {"train_loss": -26.85369300842285, "global_step": 548383, "epoch": 6607} {"train_loss": -26.64274024963379, "global_step": 548384, "epoch": 6607} {"train_loss": -26.507099151611328, "global_step": 548385, "epoch": 6607} {"train_loss": -27.15227699279785, "global_step": 548386, "epoch": 6607} {"train_loss": -26.6341552734375, "global_step": 548387, "epoch": 6607} {"train_loss": -26.79132652282715, "global_step": 548388, "epoch": 6607} {"train_loss": -27.193073272705078, "global_step": 548389, "epoch": 6607} {"train_loss": -26.8212947845459, "global_step": 548390, "epoch": 6607} {"train_loss": -27.14798927307129, "global_step": 548391, "epoch": 6607} {"train_loss": -26.886564254760742, "global_step": 548392, "epoch": 6607} {"train_loss": -27.147628784179688, "global_step": 548393, "epoch": 6607} {"train_loss": -27.572345733642578, "global_step": 548394, "epoch": 6607} {"train_loss": -27.0076904296875, "global_step": 548395, "epoch": 6607} {"train_loss": -27.080549240112305, "global_step": 548396, "epoch": 6607} {"train_loss": -27.25007438659668, "global_step": 548397, "epoch": 6607} {"train_loss": -26.7220516204834, "global_step": 548398, "epoch": 6607} {"train_loss": -26.9254150390625, "global_step": 548399, "epoch": 6607} {"train_loss": -27.21394157409668, "global_step": 548400, "epoch": 6607} {"train_loss": -27.321935653686523, "global_step": 548401, "epoch": 6607} {"train_loss": -27.551355361938477, "global_step": 548402, "epoch": 6607} {"train_loss": -27.39422607421875, "global_step": 548403, "epoch": 6607} {"train_loss": -27.29701805114746, "global_step": 548404, "epoch": 6607} {"train_loss": -27.63490867614746, "global_step": 548405, "epoch": 6607} {"train_loss": -27.419538497924805, "global_step": 548406, "epoch": 6607} {"train_loss": -27.592557907104492, "global_step": 548407, "epoch": 6607} {"train_loss": -27.50579261779785, "global_step": 548408, "epoch": 6607} {"train_loss": -27.42231559753418, "global_step": 548409, "epoch": 6607} {"train_loss": -27.27610206604004, "global_step": 548410, "epoch": 6607} {"train_loss": -27.621734619140625, "global_step": 548411, "epoch": 6607} {"train_loss": -27.691192626953125, "global_step": 548412, "epoch": 6607} {"train_loss": -27.46915626525879, "global_step": 548413, "epoch": 6607} {"train_loss": -27.523151397705078, "global_step": 548414, "epoch": 6607} {"train_loss": -27.4100284576416, "global_step": 548415, "epoch": 6607} {"train_loss": -27.6782283782959, "global_step": 548416, "epoch": 6607} {"train_loss": -27.53324317932129, "global_step": 548417, "epoch": 6607} {"train_loss": -27.586074829101562, "global_step": 548418, "epoch": 6607} {"train_loss": -27.76356315612793, "global_step": 548419, "epoch": 6607} {"train_loss": -28.061429977416992, "global_step": 548420, "epoch": 6607} {"train_loss": -27.757291793823242, "global_step": 548421, "epoch": 6607} {"train_loss": -27.8275146484375, "global_step": 548422, "epoch": 6607} {"train_loss": -28.526580810546875, "global_step": 548423, "epoch": 6607} {"train_loss": -27.6724853515625, "global_step": 548424, "epoch": 6607} {"train_loss": -28.1307430267334, "global_step": 548425, "epoch": 6607} {"train_loss": -27.443958282470703, "global_step": 548426, "epoch": 6607} {"train_loss": -27.503997802734375, "global_step": 548427, "epoch": 6607} {"train_loss": -27.825336456298828, "global_step": 548428, "epoch": 6607} {"train_loss": -27.76252555847168, "global_step": 548429, "epoch": 6607} {"train_loss": -27.75184440612793, "global_step": 548430, "epoch": 6607} {"train_loss": -27.842737197875977, "global_step": 548431, "epoch": 6607} {"train_loss": -27.898183822631836, "global_step": 548432, "epoch": 6607} {"train_loss": -27.920307159423828, "global_step": 548433, "epoch": 6607} {"train_loss": -27.812057495117188, "global_step": 548434, "epoch": 6607} {"train_loss": -28.096460342407227, "global_step": 548435, "epoch": 6607} {"train_loss": -28.10674476623535, "global_step": 548436, "epoch": 6607} {"train_loss": -27.9664306640625, "global_step": 548437, "epoch": 6607} {"train_loss": -28.27048683166504, "global_step": 548438, "epoch": 6607} {"train_loss": -27.65523338317871, "global_step": 548439, "epoch": 6607} {"train_loss": -27.87967300415039, "global_step": 548440, "epoch": 6607} {"train_loss": -27.651525497436523, "global_step": 548441, "epoch": 6607} {"train_loss": -28.054738998413086, "global_step": 548442, "epoch": 6607} {"train_loss": -27.71143913269043, "global_step": 548443, "epoch": 6607} {"train_loss": -27.828176498413086, "global_step": 548444, "epoch": 6607} {"train_loss": -27.803211212158203, "global_step": 548445, "epoch": 6607} {"train_loss": -27.442209243774414, "global_step": 548446, "epoch": 6607} {"train_loss": -27.827322006225586, "global_step": 548447, "epoch": 6607} {"train_loss": -28.063222885131836, "global_step": 548448, "epoch": 6607} {"train_loss": -28.261667251586914, "global_step": 548449, "epoch": 6607} {"train_loss": -27.8170166015625, "global_step": 548450, "epoch": 6607} {"train_loss": -27.1685848236084, "global_step": 548451, "epoch": 6607} {"train_loss": -25.717634201049805, "global_step": 548452, "epoch": 6607} {"train_loss": -25.42975616455078, "global_step": 548453, "epoch": 6607} {"train_loss": -26.683374404907227, "global_step": 548454, "epoch": 6607} {"train_loss": -27.40662956237793, "global_step": 548455, "epoch": 6607} {"train_loss": -26.950992584228516, "global_step": 548456, "epoch": 6607} {"train_loss": -27.466007232666016, "global_step": 548457, "epoch": 6607} {"train_loss": -27.177326202392578, "global_step": 548458, "epoch": 6607} {"train_loss": -27.615890502929688, "global_step": 548459, "epoch": 6607} {"train_loss": -27.408300399780273, "global_step": 548460, "epoch": 6607} {"train_loss": -27.01075553894043, "global_step": 548461, "epoch": 6607} {"train_loss": -27.3541316986084, "global_step": 548462, "epoch": 6607} {"train_loss": -27.429354104651026, "global_step": 548463, "epoch": 6607, "val_loss": 6605210.0} {"train_loss": -26.865737915039062, "global_step": 548464, "epoch": 6608} {"train_loss": -26.058996200561523, "global_step": 548465, "epoch": 6608} {"train_loss": -26.81891441345215, "global_step": 548466, "epoch": 6608} {"train_loss": -26.655841827392578, "global_step": 548467, "epoch": 6608} {"train_loss": -26.55061912536621, "global_step": 548468, "epoch": 6608} {"train_loss": -26.99476432800293, "global_step": 548469, "epoch": 6608} {"train_loss": -26.500974655151367, "global_step": 548470, "epoch": 6608} {"train_loss": -26.95591163635254, "global_step": 548471, "epoch": 6608} {"train_loss": -27.021955490112305, "global_step": 548472, "epoch": 6608} {"train_loss": -27.215621948242188, "global_step": 548473, "epoch": 6608} {"train_loss": -26.951139450073242, "global_step": 548474, "epoch": 6608} {"train_loss": -27.203359603881836, "global_step": 548475, "epoch": 6608} {"train_loss": -27.43413734436035, "global_step": 548476, "epoch": 6608} {"train_loss": -26.76484489440918, "global_step": 548477, "epoch": 6608} {"train_loss": -27.13948631286621, "global_step": 548478, "epoch": 6608} {"train_loss": -26.939453125, "global_step": 548479, "epoch": 6608} {"train_loss": -26.87234878540039, "global_step": 548480, "epoch": 6608} {"train_loss": -27.40400505065918, "global_step": 548481, "epoch": 6608} {"train_loss": -27.54303550720215, "global_step": 548482, "epoch": 6608} {"train_loss": -27.2445068359375, "global_step": 548483, "epoch": 6608} {"train_loss": -27.50253677368164, "global_step": 548484, "epoch": 6608} {"train_loss": -27.24393653869629, "global_step": 548485, "epoch": 6608} {"train_loss": -27.732257843017578, "global_step": 548486, "epoch": 6608} {"train_loss": -26.980255126953125, "global_step": 548487, "epoch": 6608} {"train_loss": -27.601917266845703, "global_step": 548488, "epoch": 6608} {"train_loss": -27.70693016052246, "global_step": 548489, "epoch": 6608} {"train_loss": -27.619216918945312, "global_step": 548490, "epoch": 6608} {"train_loss": -27.471099853515625, "global_step": 548491, "epoch": 6608} {"train_loss": -27.422529220581055, "global_step": 548492, "epoch": 6608} {"train_loss": -27.2225399017334, "global_step": 548493, "epoch": 6608} {"train_loss": -28.13703727722168, "global_step": 548494, "epoch": 6608} {"train_loss": -27.56629753112793, "global_step": 548495, "epoch": 6608} {"train_loss": -27.804126739501953, "global_step": 548496, "epoch": 6608} {"train_loss": -27.87139320373535, "global_step": 548497, "epoch": 6608} {"train_loss": -27.677961349487305, "global_step": 548498, "epoch": 6608} {"train_loss": -27.67767906188965, "global_step": 548499, "epoch": 6608} {"train_loss": -27.38344383239746, "global_step": 548500, "epoch": 6608} {"train_loss": -27.44052505493164, "global_step": 548501, "epoch": 6608} {"train_loss": -27.7027587890625, "global_step": 548502, "epoch": 6608} {"train_loss": -27.73379898071289, "global_step": 548503, "epoch": 6608} {"train_loss": -27.811323165893555, "global_step": 548504, "epoch": 6608} {"train_loss": -27.911951065063477, "global_step": 548505, "epoch": 6608} {"train_loss": -27.677581787109375, "global_step": 548506, "epoch": 6608} {"train_loss": -27.923583984375, "global_step": 548507, "epoch": 6608} {"train_loss": -27.77286720275879, "global_step": 548508, "epoch": 6608} {"train_loss": -27.84966468811035, "global_step": 548509, "epoch": 6608} {"train_loss": -27.722869873046875, "global_step": 548510, "epoch": 6608} {"train_loss": -27.99407386779785, "global_step": 548511, "epoch": 6608} {"train_loss": -28.113428115844727, "global_step": 548512, "epoch": 6608} {"train_loss": -28.238142013549805, "global_step": 548513, "epoch": 6608} {"train_loss": -27.874237060546875, "global_step": 548514, "epoch": 6608} {"train_loss": -28.054046630859375, "global_step": 548515, "epoch": 6608} {"train_loss": -28.2443790435791, "global_step": 548516, "epoch": 6608} {"train_loss": -27.783111572265625, "global_step": 548517, "epoch": 6608} {"train_loss": -27.873275756835938, "global_step": 548518, "epoch": 6608} {"train_loss": -27.955825805664062, "global_step": 548519, "epoch": 6608} {"train_loss": -27.5632266998291, "global_step": 548520, "epoch": 6608} {"train_loss": -28.007394790649414, "global_step": 548521, "epoch": 6608} {"train_loss": -28.037982940673828, "global_step": 548522, "epoch": 6608} {"train_loss": -27.60089683532715, "global_step": 548523, "epoch": 6608} {"train_loss": -27.738935470581055, "global_step": 548524, "epoch": 6608} {"train_loss": -27.655256271362305, "global_step": 548525, "epoch": 6608} {"train_loss": -27.498737335205078, "global_step": 548526, "epoch": 6608} {"train_loss": -27.53802490234375, "global_step": 548527, "epoch": 6608} {"train_loss": -27.472639083862305, "global_step": 548528, "epoch": 6608} {"train_loss": -27.307519912719727, "global_step": 548529, "epoch": 6608} {"train_loss": -26.899778366088867, "global_step": 548530, "epoch": 6608} {"train_loss": -26.834918975830078, "global_step": 548531, "epoch": 6608} {"train_loss": -27.738122940063477, "global_step": 548532, "epoch": 6608} {"train_loss": -27.5545711517334, "global_step": 548533, "epoch": 6608} {"train_loss": -27.229110717773438, "global_step": 548534, "epoch": 6608} {"train_loss": -27.628559112548828, "global_step": 548535, "epoch": 6608} {"train_loss": -27.54718589782715, "global_step": 548536, "epoch": 6608} {"train_loss": -26.993499755859375, "global_step": 548537, "epoch": 6608} {"train_loss": -27.314453125, "global_step": 548538, "epoch": 6608} {"train_loss": -27.126562118530273, "global_step": 548539, "epoch": 6608} {"train_loss": -27.770130157470703, "global_step": 548540, "epoch": 6608} {"train_loss": -27.546171188354492, "global_step": 548541, "epoch": 6608} {"train_loss": -27.79450798034668, "global_step": 548542, "epoch": 6608} {"train_loss": -27.966222763061523, "global_step": 548543, "epoch": 6608} {"train_loss": -27.56766128540039, "global_step": 548544, "epoch": 6608} {"train_loss": -27.79853630065918, "global_step": 548545, "epoch": 6608} {"train_loss": -27.468093136706983, "global_step": 548546, "epoch": 6608, "val_loss": 6629011.0} {"train_loss": -26.69951820373535, "global_step": 548547, "epoch": 6609} {"train_loss": -25.627161026000977, "global_step": 548548, "epoch": 6609} {"train_loss": -26.459583282470703, "global_step": 548549, "epoch": 6609} {"train_loss": -26.56818962097168, "global_step": 548550, "epoch": 6609} {"train_loss": -26.663068771362305, "global_step": 548551, "epoch": 6609} {"train_loss": -26.6340274810791, "global_step": 548552, "epoch": 6609} {"train_loss": -26.46036720275879, "global_step": 548553, "epoch": 6609} {"train_loss": -26.86097526550293, "global_step": 548554, "epoch": 6609} {"train_loss": -26.87247657775879, "global_step": 548555, "epoch": 6609} {"train_loss": -27.393064498901367, "global_step": 548556, "epoch": 6609} {"train_loss": -26.645841598510742, "global_step": 548557, "epoch": 6609} {"train_loss": -27.231876373291016, "global_step": 548558, "epoch": 6609} {"train_loss": -27.219192504882812, "global_step": 548559, "epoch": 6609} {"train_loss": -27.089569091796875, "global_step": 548560, "epoch": 6609} {"train_loss": -27.14800453186035, "global_step": 548561, "epoch": 6609} {"train_loss": -27.564416885375977, "global_step": 548562, "epoch": 6609} {"train_loss": -27.38437271118164, "global_step": 548563, "epoch": 6609} {"train_loss": -27.21968650817871, "global_step": 548564, "epoch": 6609} {"train_loss": -27.322301864624023, "global_step": 548565, "epoch": 6609} {"train_loss": -27.303709030151367, "global_step": 548566, "epoch": 6609} {"train_loss": -27.65793800354004, "global_step": 548567, "epoch": 6609} {"train_loss": -27.599477767944336, "global_step": 548568, "epoch": 6609} {"train_loss": -27.3903751373291, "global_step": 548569, "epoch": 6609} {"train_loss": -27.604904174804688, "global_step": 548570, "epoch": 6609} {"train_loss": -27.34168815612793, "global_step": 548571, "epoch": 6609} {"train_loss": -27.5316219329834, "global_step": 548572, "epoch": 6609} {"train_loss": -27.7359561920166, "global_step": 548573, "epoch": 6609} {"train_loss": -27.486968994140625, "global_step": 548574, "epoch": 6609} {"train_loss": -27.34758949279785, "global_step": 548575, "epoch": 6609} {"train_loss": -27.673620223999023, "global_step": 548576, "epoch": 6609} {"train_loss": -27.544981002807617, "global_step": 548577, "epoch": 6609} {"train_loss": -28.1553897857666, "global_step": 548578, "epoch": 6609} {"train_loss": -27.292739868164062, "global_step": 548579, "epoch": 6609} {"train_loss": -27.251428604125977, "global_step": 548580, "epoch": 6609} {"train_loss": -27.91226577758789, "global_step": 548581, "epoch": 6609} {"train_loss": -27.610944747924805, "global_step": 548582, "epoch": 6609} {"train_loss": -27.5440673828125, "global_step": 548583, "epoch": 6609} {"train_loss": -28.13344383239746, "global_step": 548584, "epoch": 6609} {"train_loss": -27.466516494750977, "global_step": 548585, "epoch": 6609} {"train_loss": -27.48395347595215, "global_step": 548586, "epoch": 6609} {"train_loss": -28.09327507019043, "global_step": 548587, "epoch": 6609} {"train_loss": -27.979022979736328, "global_step": 548588, "epoch": 6609} {"train_loss": -28.009490966796875, "global_step": 548589, "epoch": 6609} {"train_loss": -27.851032257080078, "global_step": 548590, "epoch": 6609} {"train_loss": -27.45516014099121, "global_step": 548591, "epoch": 6609} {"train_loss": -28.235004425048828, "global_step": 548592, "epoch": 6609} {"train_loss": -27.981769561767578, "global_step": 548593, "epoch": 6609} {"train_loss": -27.93863296508789, "global_step": 548594, "epoch": 6609} {"train_loss": -27.80509376525879, "global_step": 548595, "epoch": 6609} {"train_loss": -27.878494262695312, "global_step": 548596, "epoch": 6609} {"train_loss": -28.029937744140625, "global_step": 548597, "epoch": 6609} {"train_loss": -27.563556671142578, "global_step": 548598, "epoch": 6609} {"train_loss": -27.94428062438965, "global_step": 548599, "epoch": 6609} {"train_loss": -27.629175186157227, "global_step": 548600, "epoch": 6609} {"train_loss": -28.066396713256836, "global_step": 548601, "epoch": 6609} {"train_loss": -28.07200050354004, "global_step": 548602, "epoch": 6609} {"train_loss": -27.914426803588867, "global_step": 548603, "epoch": 6609} {"train_loss": -27.756444931030273, "global_step": 548604, "epoch": 6609} {"train_loss": -28.074628829956055, "global_step": 548605, "epoch": 6609} {"train_loss": -27.931188583374023, "global_step": 548606, "epoch": 6609} {"train_loss": -27.800519943237305, "global_step": 548607, "epoch": 6609} {"train_loss": -27.980335235595703, "global_step": 548608, "epoch": 6609} {"train_loss": -27.24744987487793, "global_step": 548609, "epoch": 6609} {"train_loss": -27.2316951751709, "global_step": 548610, "epoch": 6609} {"train_loss": -27.4943790435791, "global_step": 548611, "epoch": 6609} {"train_loss": -27.742544174194336, "global_step": 548612, "epoch": 6609} {"train_loss": -27.99543571472168, "global_step": 548613, "epoch": 6609} {"train_loss": -27.440839767456055, "global_step": 548614, "epoch": 6609} {"train_loss": -27.315465927124023, "global_step": 548615, "epoch": 6609} {"train_loss": -27.694684982299805, "global_step": 548616, "epoch": 6609} {"train_loss": -27.805591583251953, "global_step": 548617, "epoch": 6609} {"train_loss": -27.8469181060791, "global_step": 548618, "epoch": 6609} {"train_loss": -27.940046310424805, "global_step": 548619, "epoch": 6609} {"train_loss": -28.00519371032715, "global_step": 548620, "epoch": 6609} {"train_loss": -28.087665557861328, "global_step": 548621, "epoch": 6609} {"train_loss": -28.020009994506836, "global_step": 548622, "epoch": 6609} {"train_loss": -27.511838912963867, "global_step": 548623, "epoch": 6609} {"train_loss": -27.682233810424805, "global_step": 548624, "epoch": 6609} {"train_loss": -27.754077911376953, "global_step": 548625, "epoch": 6609} {"train_loss": -28.18421745300293, "global_step": 548626, "epoch": 6609} {"train_loss": -27.559240341186523, "global_step": 548627, "epoch": 6609} {"train_loss": -27.750635147094727, "global_step": 548628, "epoch": 6609} {"train_loss": -27.548258103520038, "global_step": 548629, "epoch": 6609, "val_loss": 6576437.0} {"train_loss": -26.931243896484375, "global_step": 548630, "epoch": 6610} {"train_loss": -25.8149471282959, "global_step": 548631, "epoch": 6610} {"train_loss": -25.575475692749023, "global_step": 548632, "epoch": 6610} {"train_loss": -26.569982528686523, "global_step": 548633, "epoch": 6610} {"train_loss": -26.4476261138916, "global_step": 548634, "epoch": 6610} {"train_loss": -27.04618263244629, "global_step": 548635, "epoch": 6610} {"train_loss": -27.03577995300293, "global_step": 548636, "epoch": 6610} {"train_loss": -26.536840438842773, "global_step": 548637, "epoch": 6610} {"train_loss": -27.164960861206055, "global_step": 548638, "epoch": 6610} {"train_loss": -27.127548217773438, "global_step": 548639, "epoch": 6610} {"train_loss": -27.111175537109375, "global_step": 548640, "epoch": 6610} {"train_loss": -27.265033721923828, "global_step": 548641, "epoch": 6610} {"train_loss": -26.628767013549805, "global_step": 548642, "epoch": 6610} {"train_loss": -26.97222328186035, "global_step": 548643, "epoch": 6610} {"train_loss": -26.677534103393555, "global_step": 548644, "epoch": 6610} {"train_loss": -27.1163272857666, "global_step": 548645, "epoch": 6610} {"train_loss": -26.6787052154541, "global_step": 548646, "epoch": 6610} {"train_loss": -27.379791259765625, "global_step": 548647, "epoch": 6610} {"train_loss": -26.842512130737305, "global_step": 548648, "epoch": 6610} {"train_loss": -27.416837692260742, "global_step": 548649, "epoch": 6610} {"train_loss": -27.180072784423828, "global_step": 548650, "epoch": 6610} {"train_loss": -27.283185958862305, "global_step": 548651, "epoch": 6610} {"train_loss": -27.061208724975586, "global_step": 548652, "epoch": 6610} {"train_loss": -26.84456443786621, "global_step": 548653, "epoch": 6610} {"train_loss": -27.21973991394043, "global_step": 548654, "epoch": 6610} {"train_loss": -27.38605308532715, "global_step": 548655, "epoch": 6610} {"train_loss": -27.618305206298828, "global_step": 548656, "epoch": 6610} {"train_loss": -27.14242935180664, "global_step": 548657, "epoch": 6610} {"train_loss": -27.270374298095703, "global_step": 548658, "epoch": 6610} {"train_loss": -27.131927490234375, "global_step": 548659, "epoch": 6610} {"train_loss": -27.198413848876953, "global_step": 548660, "epoch": 6610} {"train_loss": -27.478042602539062, "global_step": 548661, "epoch": 6610} {"train_loss": -27.498319625854492, "global_step": 548662, "epoch": 6610} {"train_loss": -27.594030380249023, "global_step": 548663, "epoch": 6610} {"train_loss": -27.41733169555664, "global_step": 548664, "epoch": 6610} {"train_loss": -27.503095626831055, "global_step": 548665, "epoch": 6610} {"train_loss": -27.609216690063477, "global_step": 548666, "epoch": 6610} {"train_loss": -27.273191452026367, "global_step": 548667, "epoch": 6610} {"train_loss": -27.415658950805664, "global_step": 548668, "epoch": 6610} {"train_loss": -27.728078842163086, "global_step": 548669, "epoch": 6610} {"train_loss": -27.64594078063965, "global_step": 548670, "epoch": 6610} {"train_loss": -27.359312057495117, "global_step": 548671, "epoch": 6610} {"train_loss": -27.8187198638916, "global_step": 548672, "epoch": 6610} {"train_loss": -27.507587432861328, "global_step": 548673, "epoch": 6610} {"train_loss": -27.75162124633789, "global_step": 548674, "epoch": 6610} {"train_loss": -27.982559204101562, "global_step": 548675, "epoch": 6610} {"train_loss": -27.716297149658203, "global_step": 548676, "epoch": 6610} {"train_loss": -27.774744033813477, "global_step": 548677, "epoch": 6610} {"train_loss": -27.726776123046875, "global_step": 548678, "epoch": 6610} {"train_loss": -27.998395919799805, "global_step": 548679, "epoch": 6610} {"train_loss": -27.8155517578125, "global_step": 548680, "epoch": 6610} {"train_loss": -28.116153717041016, "global_step": 548681, "epoch": 6610} {"train_loss": -27.953067779541016, "global_step": 548682, "epoch": 6610} {"train_loss": -28.00275993347168, "global_step": 548683, "epoch": 6610} {"train_loss": -27.732269287109375, "global_step": 548684, "epoch": 6610} {"train_loss": -28.095901489257812, "global_step": 548685, "epoch": 6610} {"train_loss": -28.3076171875, "global_step": 548686, "epoch": 6610} {"train_loss": -28.113256454467773, "global_step": 548687, "epoch": 6610} {"train_loss": -27.566614151000977, "global_step": 548688, "epoch": 6610} {"train_loss": -27.84812355041504, "global_step": 548689, "epoch": 6610} {"train_loss": -28.153045654296875, "global_step": 548690, "epoch": 6610} {"train_loss": -27.794126510620117, "global_step": 548691, "epoch": 6610} {"train_loss": -27.869281768798828, "global_step": 548692, "epoch": 6610} {"train_loss": -28.217071533203125, "global_step": 548693, "epoch": 6610} {"train_loss": -27.661035537719727, "global_step": 548694, "epoch": 6610} {"train_loss": -27.976093292236328, "global_step": 548695, "epoch": 6610} {"train_loss": -27.99464225769043, "global_step": 548696, "epoch": 6610} {"train_loss": -27.818103790283203, "global_step": 548697, "epoch": 6610} {"train_loss": -27.666772842407227, "global_step": 548698, "epoch": 6610} {"train_loss": -27.810348510742188, "global_step": 548699, "epoch": 6610} {"train_loss": -28.066852569580078, "global_step": 548700, "epoch": 6610} {"train_loss": -27.9936580657959, "global_step": 548701, "epoch": 6610} {"train_loss": -27.890287399291992, "global_step": 548702, "epoch": 6610} {"train_loss": -27.8448429107666, "global_step": 548703, "epoch": 6610} {"train_loss": -27.940475463867188, "global_step": 548704, "epoch": 6610} {"train_loss": -28.239912033081055, "global_step": 548705, "epoch": 6610} {"train_loss": -28.046064376831055, "global_step": 548706, "epoch": 6610} {"train_loss": -27.9130916595459, "global_step": 548707, "epoch": 6610} {"train_loss": -27.891706466674805, "global_step": 548708, "epoch": 6610} {"train_loss": -27.97238540649414, "global_step": 548709, "epoch": 6610} {"train_loss": -27.494068145751953, "global_step": 548710, "epoch": 6610} {"train_loss": -27.47641372680664, "global_step": 548711, "epoch": 6610} {"train_loss": -27.48345735848668, "global_step": 548712, "epoch": 6610, "val_loss": 6592924.5} {"train_loss": -25.688474655151367, "global_step": 548713, "epoch": 6611} {"train_loss": -23.119230270385742, "global_step": 548714, "epoch": 6611} {"train_loss": -22.867050170898438, "global_step": 548715, "epoch": 6611} {"train_loss": -25.357728958129883, "global_step": 548716, "epoch": 6611} {"train_loss": -26.489770889282227, "global_step": 548717, "epoch": 6611} {"train_loss": -26.228010177612305, "global_step": 548718, "epoch": 6611} {"train_loss": -26.330408096313477, "global_step": 548719, "epoch": 6611} {"train_loss": -26.5076904296875, "global_step": 548720, "epoch": 6611} {"train_loss": -26.041406631469727, "global_step": 548721, "epoch": 6611} {"train_loss": -27.101409912109375, "global_step": 548722, "epoch": 6611} {"train_loss": -26.652658462524414, "global_step": 548723, "epoch": 6611} {"train_loss": -26.4027099609375, "global_step": 548724, "epoch": 6611} {"train_loss": -27.28260612487793, "global_step": 548725, "epoch": 6611} {"train_loss": -27.165313720703125, "global_step": 548726, "epoch": 6611} {"train_loss": -26.709869384765625, "global_step": 548727, "epoch": 6611} {"train_loss": -26.983142852783203, "global_step": 548728, "epoch": 6611} {"train_loss": -26.9071044921875, "global_step": 548729, "epoch": 6611} {"train_loss": -27.03017234802246, "global_step": 548730, "epoch": 6611} {"train_loss": -27.19843864440918, "global_step": 548731, "epoch": 6611} {"train_loss": -27.2935848236084, "global_step": 548732, "epoch": 6611} {"train_loss": -26.811939239501953, "global_step": 548733, "epoch": 6611} {"train_loss": -27.635522842407227, "global_step": 548734, "epoch": 6611} {"train_loss": -27.484350204467773, "global_step": 548735, "epoch": 6611} {"train_loss": -26.8810977935791, "global_step": 548736, "epoch": 6611} {"train_loss": -27.741682052612305, "global_step": 548737, "epoch": 6611} {"train_loss": -27.399999618530273, "global_step": 548738, "epoch": 6611} {"train_loss": -27.445302963256836, "global_step": 548739, "epoch": 6611} {"train_loss": -27.134052276611328, "global_step": 548740, "epoch": 6611} {"train_loss": -27.2224178314209, "global_step": 548741, "epoch": 6611} {"train_loss": -27.19415855407715, "global_step": 548742, "epoch": 6611} {"train_loss": -27.442991256713867, "global_step": 548743, "epoch": 6611} {"train_loss": -27.31697654724121, "global_step": 548744, "epoch": 6611} {"train_loss": -27.6014461517334, "global_step": 548745, "epoch": 6611} {"train_loss": -27.259851455688477, "global_step": 548746, "epoch": 6611} {"train_loss": -27.59490394592285, "global_step": 548747, "epoch": 6611} {"train_loss": -27.446441650390625, "global_step": 548748, "epoch": 6611} {"train_loss": -27.659011840820312, "global_step": 548749, "epoch": 6611} {"train_loss": -27.570026397705078, "global_step": 548750, "epoch": 6611} {"train_loss": -28.00453758239746, "global_step": 548751, "epoch": 6611} {"train_loss": -27.541406631469727, "global_step": 548752, "epoch": 6611} {"train_loss": -27.679859161376953, "global_step": 548753, "epoch": 6611} {"train_loss": -27.3470401763916, "global_step": 548754, "epoch": 6611} {"train_loss": -27.985382080078125, "global_step": 548755, "epoch": 6611} {"train_loss": -27.407541275024414, "global_step": 548756, "epoch": 6611} {"train_loss": -27.83509635925293, "global_step": 548757, "epoch": 6611} {"train_loss": -27.622516632080078, "global_step": 548758, "epoch": 6611} {"train_loss": -27.8468017578125, "global_step": 548759, "epoch": 6611} {"train_loss": -27.65168571472168, "global_step": 548760, "epoch": 6611} {"train_loss": -27.825027465820312, "global_step": 548761, "epoch": 6611} {"train_loss": -27.874921798706055, "global_step": 548762, "epoch": 6611} {"train_loss": -27.3979549407959, "global_step": 548763, "epoch": 6611} {"train_loss": -27.93060302734375, "global_step": 548764, "epoch": 6611} {"train_loss": -27.76722526550293, "global_step": 548765, "epoch": 6611} {"train_loss": -28.165857315063477, "global_step": 548766, "epoch": 6611} {"train_loss": -28.132787704467773, "global_step": 548767, "epoch": 6611} {"train_loss": -27.648828506469727, "global_step": 548768, "epoch": 6611} {"train_loss": -27.882923126220703, "global_step": 548769, "epoch": 6611} {"train_loss": -27.81830406188965, "global_step": 548770, "epoch": 6611} {"train_loss": -28.1387939453125, "global_step": 548771, "epoch": 6611} {"train_loss": -27.84547996520996, "global_step": 548772, "epoch": 6611} {"train_loss": -27.44549560546875, "global_step": 548773, "epoch": 6611} {"train_loss": -27.90755271911621, "global_step": 548774, "epoch": 6611} {"train_loss": -27.634180068969727, "global_step": 548775, "epoch": 6611} {"train_loss": -27.478412628173828, "global_step": 548776, "epoch": 6611} {"train_loss": -27.80136489868164, "global_step": 548777, "epoch": 6611} {"train_loss": -27.489953994750977, "global_step": 548778, "epoch": 6611} {"train_loss": -28.037195205688477, "global_step": 548779, "epoch": 6611} {"train_loss": -27.149152755737305, "global_step": 548780, "epoch": 6611} {"train_loss": -27.33512306213379, "global_step": 548781, "epoch": 6611} {"train_loss": -27.442703247070312, "global_step": 548782, "epoch": 6611} {"train_loss": -27.655744552612305, "global_step": 548783, "epoch": 6611} {"train_loss": -27.552661895751953, "global_step": 548784, "epoch": 6611} {"train_loss": -27.701505661010742, "global_step": 548785, "epoch": 6611} {"train_loss": -27.67178726196289, "global_step": 548786, "epoch": 6611} {"train_loss": -27.814889907836914, "global_step": 548787, "epoch": 6611} {"train_loss": -27.628768920898438, "global_step": 548788, "epoch": 6611} {"train_loss": -27.81683921813965, "global_step": 548789, "epoch": 6611} {"train_loss": -27.6009521484375, "global_step": 548790, "epoch": 6611} {"train_loss": -27.859786987304688, "global_step": 548791, "epoch": 6611} {"train_loss": -27.786670684814453, "global_step": 548792, "epoch": 6611} {"train_loss": -27.8991641998291, "global_step": 548793, "epoch": 6611} {"train_loss": -27.776981353759766, "global_step": 548794, "epoch": 6611} {"train_loss": -27.284991298813416, "global_step": 548795, "epoch": 6611, "val_loss": 6620651.0} {"train_loss": -25.629568099975586, "global_step": 548796, "epoch": 6612} {"train_loss": -25.2160701751709, "global_step": 548797, "epoch": 6612} {"train_loss": -26.489057540893555, "global_step": 548798, "epoch": 6612} {"train_loss": -25.65309715270996, "global_step": 548799, "epoch": 6612} {"train_loss": -26.424055099487305, "global_step": 548800, "epoch": 6612} {"train_loss": -26.334997177124023, "global_step": 548801, "epoch": 6612} {"train_loss": -26.833723068237305, "global_step": 548802, "epoch": 6612} {"train_loss": -26.710147857666016, "global_step": 548803, "epoch": 6612} {"train_loss": -26.3632755279541, "global_step": 548804, "epoch": 6612} {"train_loss": -26.673664093017578, "global_step": 548805, "epoch": 6612} {"train_loss": -27.02227210998535, "global_step": 548806, "epoch": 6612} {"train_loss": -26.7059383392334, "global_step": 548807, "epoch": 6612} {"train_loss": -26.649444580078125, "global_step": 548808, "epoch": 6612} {"train_loss": -26.880895614624023, "global_step": 548809, "epoch": 6612} {"train_loss": -26.651700973510742, "global_step": 548810, "epoch": 6612} {"train_loss": -26.691579818725586, "global_step": 548811, "epoch": 6612} {"train_loss": -27.02704429626465, "global_step": 548812, "epoch": 6612} {"train_loss": -27.200666427612305, "global_step": 548813, "epoch": 6612} {"train_loss": -27.15728187561035, "global_step": 548814, "epoch": 6612} {"train_loss": -27.030033111572266, "global_step": 548815, "epoch": 6612} {"train_loss": -27.323904037475586, "global_step": 548816, "epoch": 6612} {"train_loss": -27.219823837280273, "global_step": 548817, "epoch": 6612} {"train_loss": -27.34099769592285, "global_step": 548818, "epoch": 6612} {"train_loss": -27.610177993774414, "global_step": 548819, "epoch": 6612} {"train_loss": -26.978952407836914, "global_step": 548820, "epoch": 6612} {"train_loss": -27.538700103759766, "global_step": 548821, "epoch": 6612} {"train_loss": -27.244693756103516, "global_step": 548822, "epoch": 6612} {"train_loss": -27.23723793029785, "global_step": 548823, "epoch": 6612} {"train_loss": -27.271970748901367, "global_step": 548824, "epoch": 6612} {"train_loss": -27.361652374267578, "global_step": 548825, "epoch": 6612} {"train_loss": -27.31141471862793, "global_step": 548826, "epoch": 6612} {"train_loss": -27.2235107421875, "global_step": 548827, "epoch": 6612} {"train_loss": -27.826181411743164, "global_step": 548828, "epoch": 6612} {"train_loss": -27.4251708984375, "global_step": 548829, "epoch": 6612} {"train_loss": -27.324146270751953, "global_step": 548830, "epoch": 6612} {"train_loss": -27.51771354675293, "global_step": 548831, "epoch": 6612} {"train_loss": -27.513696670532227, "global_step": 548832, "epoch": 6612} {"train_loss": -27.668256759643555, "global_step": 548833, "epoch": 6612} {"train_loss": -28.2728328704834, "global_step": 548834, "epoch": 6612} {"train_loss": -27.56348991394043, "global_step": 548835, "epoch": 6612} {"train_loss": -27.884206771850586, "global_step": 548836, "epoch": 6612} {"train_loss": -27.749555587768555, "global_step": 548837, "epoch": 6612} {"train_loss": -27.707006454467773, "global_step": 548838, "epoch": 6612} {"train_loss": -27.6811580657959, "global_step": 548839, "epoch": 6612} {"train_loss": -27.43910789489746, "global_step": 548840, "epoch": 6612} {"train_loss": -27.740915298461914, "global_step": 548841, "epoch": 6612} {"train_loss": -27.839181900024414, "global_step": 548842, "epoch": 6612} {"train_loss": -28.052099227905273, "global_step": 548843, "epoch": 6612} {"train_loss": -27.847930908203125, "global_step": 548844, "epoch": 6612} {"train_loss": -27.92588233947754, "global_step": 548845, "epoch": 6612} {"train_loss": -27.83967399597168, "global_step": 548846, "epoch": 6612} {"train_loss": -28.036178588867188, "global_step": 548847, "epoch": 6612} {"train_loss": -27.938745498657227, "global_step": 548848, "epoch": 6612} {"train_loss": -27.508712768554688, "global_step": 548849, "epoch": 6612} {"train_loss": -27.850927352905273, "global_step": 548850, "epoch": 6612} {"train_loss": -27.54023551940918, "global_step": 548851, "epoch": 6612} {"train_loss": -27.8259334564209, "global_step": 548852, "epoch": 6612} {"train_loss": -28.078577041625977, "global_step": 548853, "epoch": 6612} {"train_loss": -27.873838424682617, "global_step": 548854, "epoch": 6612} {"train_loss": -28.006824493408203, "global_step": 548855, "epoch": 6612} {"train_loss": -27.99432373046875, "global_step": 548856, "epoch": 6612} {"train_loss": -27.94647789001465, "global_step": 548857, "epoch": 6612} {"train_loss": -27.768661499023438, "global_step": 548858, "epoch": 6612} {"train_loss": -27.786468505859375, "global_step": 548859, "epoch": 6612} {"train_loss": -27.9086971282959, "global_step": 548860, "epoch": 6612} {"train_loss": -27.914657592773438, "global_step": 548861, "epoch": 6612} {"train_loss": -27.991785049438477, "global_step": 548862, "epoch": 6612} {"train_loss": -28.066373825073242, "global_step": 548863, "epoch": 6612} {"train_loss": -27.31245231628418, "global_step": 548864, "epoch": 6612} {"train_loss": -27.631702423095703, "global_step": 548865, "epoch": 6612} {"train_loss": -27.912145614624023, "global_step": 548866, "epoch": 6612} {"train_loss": -27.955402374267578, "global_step": 548867, "epoch": 6612} {"train_loss": -27.741613388061523, "global_step": 548868, "epoch": 6612} {"train_loss": -27.708066940307617, "global_step": 548869, "epoch": 6612} {"train_loss": -27.158771514892578, "global_step": 548870, "epoch": 6612} {"train_loss": -27.69124412536621, "global_step": 548871, "epoch": 6612} {"train_loss": -27.618438720703125, "global_step": 548872, "epoch": 6612} {"train_loss": -27.899688720703125, "global_step": 548873, "epoch": 6612} {"train_loss": -28.018665313720703, "global_step": 548874, "epoch": 6612} {"train_loss": -27.6362361907959, "global_step": 548875, "epoch": 6612} {"train_loss": -27.997638702392578, "global_step": 548876, "epoch": 6612} {"train_loss": -28.1602840423584, "global_step": 548877, "epoch": 6612} {"train_loss": -27.436105751129517, "global_step": 548878, "epoch": 6612, "val_loss": 6563833.0} {"train_loss": -26.800878524780273, "global_step": 548879, "epoch": 6613} {"train_loss": -26.494409561157227, "global_step": 548880, "epoch": 6613} {"train_loss": -26.9013671875, "global_step": 548881, "epoch": 6613} {"train_loss": -27.572187423706055, "global_step": 548882, "epoch": 6613} {"train_loss": -26.254810333251953, "global_step": 548883, "epoch": 6613} {"train_loss": -27.050540924072266, "global_step": 548884, "epoch": 6613} {"train_loss": -26.683652877807617, "global_step": 548885, "epoch": 6613} {"train_loss": -26.495304107666016, "global_step": 548886, "epoch": 6613} {"train_loss": -26.68879508972168, "global_step": 548887, "epoch": 6613} {"train_loss": -27.385852813720703, "global_step": 548888, "epoch": 6613} {"train_loss": -26.963064193725586, "global_step": 548889, "epoch": 6613} {"train_loss": -27.39597511291504, "global_step": 548890, "epoch": 6613} {"train_loss": -27.0042781829834, "global_step": 548891, "epoch": 6613} {"train_loss": -26.9845027923584, "global_step": 548892, "epoch": 6613} {"train_loss": -27.363744735717773, "global_step": 548893, "epoch": 6613} {"train_loss": -27.30610466003418, "global_step": 548894, "epoch": 6613} {"train_loss": -27.8188419342041, "global_step": 548895, "epoch": 6613} {"train_loss": -27.560155868530273, "global_step": 548896, "epoch": 6613} {"train_loss": -27.4754695892334, "global_step": 548897, "epoch": 6613} {"train_loss": -27.48493003845215, "global_step": 548898, "epoch": 6613} {"train_loss": -27.627344131469727, "global_step": 548899, "epoch": 6613} {"train_loss": -28.059431076049805, "global_step": 548900, "epoch": 6613} {"train_loss": -27.445627212524414, "global_step": 548901, "epoch": 6613} {"train_loss": -27.695348739624023, "global_step": 548902, "epoch": 6613} {"train_loss": -27.521825790405273, "global_step": 548903, "epoch": 6613} {"train_loss": -28.28082847595215, "global_step": 548904, "epoch": 6613} {"train_loss": -27.793073654174805, "global_step": 548905, "epoch": 6613} {"train_loss": -27.937414169311523, "global_step": 548906, "epoch": 6613} {"train_loss": -27.9920711517334, "global_step": 548907, "epoch": 6613} {"train_loss": -27.650806427001953, "global_step": 548908, "epoch": 6613} {"train_loss": -27.576215744018555, "global_step": 548909, "epoch": 6613} {"train_loss": -27.91045570373535, "global_step": 548910, "epoch": 6613} {"train_loss": -27.835004806518555, "global_step": 548911, "epoch": 6613} {"train_loss": -27.670654296875, "global_step": 548912, "epoch": 6613} {"train_loss": -27.901472091674805, "global_step": 548913, "epoch": 6613} {"train_loss": -28.298187255859375, "global_step": 548914, "epoch": 6613} {"train_loss": -28.111631393432617, "global_step": 548915, "epoch": 6613} {"train_loss": -27.920501708984375, "global_step": 548916, "epoch": 6613} {"train_loss": -27.618778228759766, "global_step": 548917, "epoch": 6613} {"train_loss": -28.069738388061523, "global_step": 548918, "epoch": 6613} {"train_loss": -28.002552032470703, "global_step": 548919, "epoch": 6613} {"train_loss": -28.099048614501953, "global_step": 548920, "epoch": 6613} {"train_loss": -28.0596866607666, "global_step": 548921, "epoch": 6613} {"train_loss": -28.178380966186523, "global_step": 548922, "epoch": 6613} {"train_loss": -27.785852432250977, "global_step": 548923, "epoch": 6613} {"train_loss": -27.963178634643555, "global_step": 548924, "epoch": 6613} {"train_loss": -28.360584259033203, "global_step": 548925, "epoch": 6613} {"train_loss": -28.29509925842285, "global_step": 548926, "epoch": 6613} {"train_loss": -27.822864532470703, "global_step": 548927, "epoch": 6613} {"train_loss": -28.0383243560791, "global_step": 548928, "epoch": 6613} {"train_loss": -27.750598907470703, "global_step": 548929, "epoch": 6613} {"train_loss": -28.135053634643555, "global_step": 548930, "epoch": 6613} {"train_loss": -28.25629997253418, "global_step": 548931, "epoch": 6613} {"train_loss": -27.683252334594727, "global_step": 548932, "epoch": 6613} {"train_loss": -27.957441329956055, "global_step": 548933, "epoch": 6613} {"train_loss": -27.839643478393555, "global_step": 548934, "epoch": 6613} {"train_loss": -27.926679611206055, "global_step": 548935, "epoch": 6613} {"train_loss": -27.79969596862793, "global_step": 548936, "epoch": 6613} {"train_loss": -28.0844669342041, "global_step": 548937, "epoch": 6613} {"train_loss": -28.18670654296875, "global_step": 548938, "epoch": 6613} {"train_loss": -27.7520694732666, "global_step": 548939, "epoch": 6613} {"train_loss": -27.90228843688965, "global_step": 548940, "epoch": 6613} {"train_loss": -27.859045028686523, "global_step": 548941, "epoch": 6613} {"train_loss": -27.70553970336914, "global_step": 548942, "epoch": 6613} {"train_loss": -27.467092514038086, "global_step": 548943, "epoch": 6613} {"train_loss": -26.633222579956055, "global_step": 548944, "epoch": 6613} {"train_loss": -25.918874740600586, "global_step": 548945, "epoch": 6613} {"train_loss": -26.385787963867188, "global_step": 548946, "epoch": 6613} {"train_loss": -26.982934951782227, "global_step": 548947, "epoch": 6613} {"train_loss": -27.0030574798584, "global_step": 548948, "epoch": 6613} {"train_loss": -26.911090850830078, "global_step": 548949, "epoch": 6613} {"train_loss": -26.960678100585938, "global_step": 548950, "epoch": 6613} {"train_loss": -26.79913902282715, "global_step": 548951, "epoch": 6613} {"train_loss": -26.978857040405273, "global_step": 548952, "epoch": 6613} {"train_loss": -27.0803165435791, "global_step": 548953, "epoch": 6613} {"train_loss": -27.058135986328125, "global_step": 548954, "epoch": 6613} {"train_loss": -27.47891616821289, "global_step": 548955, "epoch": 6613} {"train_loss": -27.162641525268555, "global_step": 548956, "epoch": 6613} {"train_loss": -27.556604385375977, "global_step": 548957, "epoch": 6613} {"train_loss": -27.470050811767578, "global_step": 548958, "epoch": 6613} {"train_loss": -27.172199249267578, "global_step": 548959, "epoch": 6613} {"train_loss": -27.271759033203125, "global_step": 548960, "epoch": 6613} {"train_loss": -27.526517132678663, "global_step": 548961, "epoch": 6613, "val_loss": 6594857.0} {"train_loss": -27.017948150634766, "global_step": 548962, "epoch": 6614} {"train_loss": -26.37843132019043, "global_step": 548963, "epoch": 6614} {"train_loss": -27.01124382019043, "global_step": 548964, "epoch": 6614} {"train_loss": -26.728574752807617, "global_step": 548965, "epoch": 6614} {"train_loss": -26.932373046875, "global_step": 548966, "epoch": 6614} {"train_loss": -27.251501083374023, "global_step": 548967, "epoch": 6614} {"train_loss": -26.79841423034668, "global_step": 548968, "epoch": 6614} {"train_loss": -26.675012588500977, "global_step": 548969, "epoch": 6614} {"train_loss": -27.223255157470703, "global_step": 548970, "epoch": 6614} {"train_loss": -27.294147491455078, "global_step": 548971, "epoch": 6614} {"train_loss": -27.4766902923584, "global_step": 548972, "epoch": 6614} {"train_loss": -27.23939323425293, "global_step": 548973, "epoch": 6614} {"train_loss": -27.008817672729492, "global_step": 548974, "epoch": 6614} {"train_loss": -27.4830379486084, "global_step": 548975, "epoch": 6614} {"train_loss": -27.3330078125, "global_step": 548976, "epoch": 6614} {"train_loss": -27.304828643798828, "global_step": 548977, "epoch": 6614} {"train_loss": -27.52469825744629, "global_step": 548978, "epoch": 6614} {"train_loss": -27.04168128967285, "global_step": 548979, "epoch": 6614} {"train_loss": -27.4713134765625, "global_step": 548980, "epoch": 6614} {"train_loss": -27.322528839111328, "global_step": 548981, "epoch": 6614} {"train_loss": -27.579437255859375, "global_step": 548982, "epoch": 6614} {"train_loss": -27.60112953186035, "global_step": 548983, "epoch": 6614} {"train_loss": -27.518720626831055, "global_step": 548984, "epoch": 6614} {"train_loss": -27.967472076416016, "global_step": 548985, "epoch": 6614} {"train_loss": -27.332067489624023, "global_step": 548986, "epoch": 6614} {"train_loss": -27.782251358032227, "global_step": 548987, "epoch": 6614} {"train_loss": -27.795103073120117, "global_step": 548988, "epoch": 6614} {"train_loss": -27.677108764648438, "global_step": 548989, "epoch": 6614} {"train_loss": -27.73322868347168, "global_step": 548990, "epoch": 6614} {"train_loss": -27.581623077392578, "global_step": 548991, "epoch": 6614} {"train_loss": -27.670194625854492, "global_step": 548992, "epoch": 6614} {"train_loss": -27.40479850769043, "global_step": 548993, "epoch": 6614} {"train_loss": -27.970319747924805, "global_step": 548994, "epoch": 6614} {"train_loss": -28.182836532592773, "global_step": 548995, "epoch": 6614} {"train_loss": -27.708826065063477, "global_step": 548996, "epoch": 6614} {"train_loss": -27.441181182861328, "global_step": 548997, "epoch": 6614} {"train_loss": -27.76007652282715, "global_step": 548998, "epoch": 6614} {"train_loss": -27.356021881103516, "global_step": 548999, "epoch": 6614} {"train_loss": -27.75583839416504, "global_step": 549000, "epoch": 6614} {"train_loss": -27.559497833251953, "global_step": 549001, "epoch": 6614} {"train_loss": -27.93292236328125, "global_step": 549002, "epoch": 6614} {"train_loss": -27.40363883972168, "global_step": 549003, "epoch": 6614} {"train_loss": -27.435565948486328, "global_step": 549004, "epoch": 6614} {"train_loss": -27.74982261657715, "global_step": 549005, "epoch": 6614} {"train_loss": -27.638883590698242, "global_step": 549006, "epoch": 6614} {"train_loss": -27.388574600219727, "global_step": 549007, "epoch": 6614} {"train_loss": -28.074054718017578, "global_step": 549008, "epoch": 6614} {"train_loss": -27.55140495300293, "global_step": 549009, "epoch": 6614} {"train_loss": -27.9498291015625, "global_step": 549010, "epoch": 6614} {"train_loss": -27.875417709350586, "global_step": 549011, "epoch": 6614} {"train_loss": -27.633108139038086, "global_step": 549012, "epoch": 6614} {"train_loss": -28.193927764892578, "global_step": 549013, "epoch": 6614} {"train_loss": -27.94040870666504, "global_step": 549014, "epoch": 6614} {"train_loss": -27.6395206451416, "global_step": 549015, "epoch": 6614} {"train_loss": -27.747100830078125, "global_step": 549016, "epoch": 6614} {"train_loss": -27.698911666870117, "global_step": 549017, "epoch": 6614} {"train_loss": -27.848825454711914, "global_step": 549018, "epoch": 6614} {"train_loss": -27.32708168029785, "global_step": 549019, "epoch": 6614} {"train_loss": -27.76453971862793, "global_step": 549020, "epoch": 6614} {"train_loss": -27.678375244140625, "global_step": 549021, "epoch": 6614} {"train_loss": -27.859617233276367, "global_step": 549022, "epoch": 6614} {"train_loss": -27.6629581451416, "global_step": 549023, "epoch": 6614} {"train_loss": -27.703994750976562, "global_step": 549024, "epoch": 6614} {"train_loss": -27.887256622314453, "global_step": 549025, "epoch": 6614} {"train_loss": -27.807764053344727, "global_step": 549026, "epoch": 6614} {"train_loss": -28.038349151611328, "global_step": 549027, "epoch": 6614} {"train_loss": -27.746503829956055, "global_step": 549028, "epoch": 6614} {"train_loss": -27.707727432250977, "global_step": 549029, "epoch": 6614} {"train_loss": -27.996978759765625, "global_step": 549030, "epoch": 6614} {"train_loss": -28.041452407836914, "global_step": 549031, "epoch": 6614} {"train_loss": -27.852893829345703, "global_step": 549032, "epoch": 6614} {"train_loss": -27.78522300720215, "global_step": 549033, "epoch": 6614} {"train_loss": -27.765043258666992, "global_step": 549034, "epoch": 6614} {"train_loss": -27.62811851501465, "global_step": 549035, "epoch": 6614} {"train_loss": -27.867467880249023, "global_step": 549036, "epoch": 6614} {"train_loss": -27.718841552734375, "global_step": 549037, "epoch": 6614} {"train_loss": -27.665693283081055, "global_step": 549038, "epoch": 6614} {"train_loss": -27.75925064086914, "global_step": 549039, "epoch": 6614} {"train_loss": -27.81962013244629, "global_step": 549040, "epoch": 6614} {"train_loss": -27.822641372680664, "global_step": 549041, "epoch": 6614} {"train_loss": -27.60834312438965, "global_step": 549042, "epoch": 6614} {"train_loss": -27.370635986328125, "global_step": 549043, "epoch": 6614} {"train_loss": -27.56993447728904, "global_step": 549044, "epoch": 6614, "val_loss": 6562856.0} {"train_loss": -27.739328384399414, "global_step": 549045, "epoch": 6615} {"train_loss": -27.5732364654541, "global_step": 549046, "epoch": 6615} {"train_loss": -27.5585880279541, "global_step": 549047, "epoch": 6615} {"train_loss": -27.238269805908203, "global_step": 549048, "epoch": 6615} {"train_loss": -27.390188217163086, "global_step": 549049, "epoch": 6615} {"train_loss": -27.398035049438477, "global_step": 549050, "epoch": 6615} {"train_loss": -27.681509017944336, "global_step": 549051, "epoch": 6615} {"train_loss": -27.377777099609375, "global_step": 549052, "epoch": 6615} {"train_loss": -27.39605712890625, "global_step": 549053, "epoch": 6615} {"train_loss": -27.600854873657227, "global_step": 549054, "epoch": 6615} {"train_loss": -27.285327911376953, "global_step": 549055, "epoch": 6615} {"train_loss": -26.948408126831055, "global_step": 549056, "epoch": 6615} {"train_loss": -27.088104248046875, "global_step": 549057, "epoch": 6615} {"train_loss": -27.207529067993164, "global_step": 549058, "epoch": 6615} {"train_loss": -26.960046768188477, "global_step": 549059, "epoch": 6615} {"train_loss": -27.732580184936523, "global_step": 549060, "epoch": 6615} {"train_loss": -27.171527862548828, "global_step": 549061, "epoch": 6615} {"train_loss": -27.60676383972168, "global_step": 549062, "epoch": 6615} {"train_loss": -27.122827529907227, "global_step": 549063, "epoch": 6615} {"train_loss": -27.572595596313477, "global_step": 549064, "epoch": 6615} {"train_loss": -27.648273468017578, "global_step": 549065, "epoch": 6615} {"train_loss": -27.89601707458496, "global_step": 549066, "epoch": 6615} {"train_loss": -27.480487823486328, "global_step": 549067, "epoch": 6615} {"train_loss": -27.802734375, "global_step": 549068, "epoch": 6615} {"train_loss": -27.487211227416992, "global_step": 549069, "epoch": 6615} {"train_loss": -27.70716667175293, "global_step": 549070, "epoch": 6615} {"train_loss": -27.544727325439453, "global_step": 549071, "epoch": 6615} {"train_loss": -27.61026382446289, "global_step": 549072, "epoch": 6615} {"train_loss": -27.32008934020996, "global_step": 549073, "epoch": 6615} {"train_loss": -27.5577392578125, "global_step": 549074, "epoch": 6615} {"train_loss": -27.839324951171875, "global_step": 549075, "epoch": 6615} {"train_loss": -27.684661865234375, "global_step": 549076, "epoch": 6615} {"train_loss": -27.575489044189453, "global_step": 549077, "epoch": 6615} {"train_loss": -27.55177879333496, "global_step": 549078, "epoch": 6615} {"train_loss": -27.69097328186035, "global_step": 549079, "epoch": 6615} {"train_loss": -27.510578155517578, "global_step": 549080, "epoch": 6615} {"train_loss": -27.764490127563477, "global_step": 549081, "epoch": 6615} {"train_loss": -27.588016510009766, "global_step": 549082, "epoch": 6615} {"train_loss": -27.261281967163086, "global_step": 549083, "epoch": 6615} {"train_loss": -27.510950088500977, "global_step": 549084, "epoch": 6615} {"train_loss": -27.816797256469727, "global_step": 549085, "epoch": 6615} {"train_loss": -27.736352920532227, "global_step": 549086, "epoch": 6615} {"train_loss": -27.836017608642578, "global_step": 549087, "epoch": 6615} {"train_loss": -27.671194076538086, "global_step": 549088, "epoch": 6615} {"train_loss": -27.848230361938477, "global_step": 549089, "epoch": 6615} {"train_loss": -27.634687423706055, "global_step": 549090, "epoch": 6615} {"train_loss": -27.683279037475586, "global_step": 549091, "epoch": 6615} {"train_loss": -27.555877685546875, "global_step": 549092, "epoch": 6615} {"train_loss": -27.846479415893555, "global_step": 549093, "epoch": 6615} {"train_loss": -27.99151611328125, "global_step": 549094, "epoch": 6615} {"train_loss": -28.032148361206055, "global_step": 549095, "epoch": 6615} {"train_loss": -27.90113639831543, "global_step": 549096, "epoch": 6615} {"train_loss": -28.1375732421875, "global_step": 549097, "epoch": 6615} {"train_loss": -27.327131271362305, "global_step": 549098, "epoch": 6615} {"train_loss": -27.78767967224121, "global_step": 549099, "epoch": 6615} {"train_loss": -27.828855514526367, "global_step": 549100, "epoch": 6615} {"train_loss": -28.046911239624023, "global_step": 549101, "epoch": 6615} {"train_loss": -27.84152603149414, "global_step": 549102, "epoch": 6615} {"train_loss": -27.96393394470215, "global_step": 549103, "epoch": 6615} {"train_loss": -28.182043075561523, "global_step": 549104, "epoch": 6615} {"train_loss": -27.665573120117188, "global_step": 549105, "epoch": 6615} {"train_loss": -28.0105037689209, "global_step": 549106, "epoch": 6615} {"train_loss": -27.916244506835938, "global_step": 549107, "epoch": 6615} {"train_loss": -27.501789093017578, "global_step": 549108, "epoch": 6615} {"train_loss": -27.578031539916992, "global_step": 549109, "epoch": 6615} {"train_loss": -27.43580436706543, "global_step": 549110, "epoch": 6615} {"train_loss": -27.638904571533203, "global_step": 549111, "epoch": 6615} {"train_loss": -27.61281394958496, "global_step": 549112, "epoch": 6615} {"train_loss": -27.661474227905273, "global_step": 549113, "epoch": 6615} {"train_loss": -28.260400772094727, "global_step": 549114, "epoch": 6615} {"train_loss": -27.6551513671875, "global_step": 549115, "epoch": 6615} {"train_loss": -27.807661056518555, "global_step": 549116, "epoch": 6615} {"train_loss": -27.298192977905273, "global_step": 549117, "epoch": 6615} {"train_loss": -27.7675838470459, "global_step": 549118, "epoch": 6615} {"train_loss": -27.929906845092773, "global_step": 549119, "epoch": 6615} {"train_loss": -27.280303955078125, "global_step": 549120, "epoch": 6615} {"train_loss": -27.53228187561035, "global_step": 549121, "epoch": 6615} {"train_loss": -27.364042282104492, "global_step": 549122, "epoch": 6615} {"train_loss": -27.4508056640625, "global_step": 549123, "epoch": 6615} {"train_loss": -27.522241592407227, "global_step": 549124, "epoch": 6615} {"train_loss": -27.22511100769043, "global_step": 549125, "epoch": 6615} {"train_loss": -27.54859733581543, "global_step": 549126, "epoch": 6615} {"train_loss": -27.6135202430817, "global_step": 549127, "epoch": 6615, "val_loss": 6454347.5} {"train_loss": -23.400766372680664, "global_step": 549128, "epoch": 6616} {"train_loss": -22.011014938354492, "global_step": 549129, "epoch": 6616} {"train_loss": -26.46589469909668, "global_step": 549130, "epoch": 6616} {"train_loss": -23.64516258239746, "global_step": 549131, "epoch": 6616} {"train_loss": -26.333683013916016, "global_step": 549132, "epoch": 6616} {"train_loss": -24.872892379760742, "global_step": 549133, "epoch": 6616} {"train_loss": -24.931608200073242, "global_step": 549134, "epoch": 6616} {"train_loss": -26.31344985961914, "global_step": 549135, "epoch": 6616} {"train_loss": -25.789350509643555, "global_step": 549136, "epoch": 6616} {"train_loss": -25.64276695251465, "global_step": 549137, "epoch": 6616} {"train_loss": -26.13212013244629, "global_step": 549138, "epoch": 6616} {"train_loss": -26.301389694213867, "global_step": 549139, "epoch": 6616} {"train_loss": -25.808149337768555, "global_step": 549140, "epoch": 6616} {"train_loss": -26.181188583374023, "global_step": 549141, "epoch": 6616} {"train_loss": -26.328893661499023, "global_step": 549142, "epoch": 6616} {"train_loss": -26.671873092651367, "global_step": 549143, "epoch": 6616} {"train_loss": -26.446866989135742, "global_step": 549144, "epoch": 6616} {"train_loss": -26.77558708190918, "global_step": 549145, "epoch": 6616} {"train_loss": -26.834182739257812, "global_step": 549146, "epoch": 6616} {"train_loss": -26.912572860717773, "global_step": 549147, "epoch": 6616} {"train_loss": -26.352436065673828, "global_step": 549148, "epoch": 6616} {"train_loss": -26.6005802154541, "global_step": 549149, "epoch": 6616} {"train_loss": -26.690216064453125, "global_step": 549150, "epoch": 6616} {"train_loss": -26.64939308166504, "global_step": 549151, "epoch": 6616} {"train_loss": -26.910358428955078, "global_step": 549152, "epoch": 6616} {"train_loss": -27.166635513305664, "global_step": 549153, "epoch": 6616} {"train_loss": -27.001495361328125, "global_step": 549154, "epoch": 6616} {"train_loss": -26.928007125854492, "global_step": 549155, "epoch": 6616} {"train_loss": -27.194189071655273, "global_step": 549156, "epoch": 6616} {"train_loss": -27.127771377563477, "global_step": 549157, "epoch": 6616} {"train_loss": -27.34186363220215, "global_step": 549158, "epoch": 6616} {"train_loss": -27.03094482421875, "global_step": 549159, "epoch": 6616} {"train_loss": -26.961889266967773, "global_step": 549160, "epoch": 6616} {"train_loss": -27.0063533782959, "global_step": 549161, "epoch": 6616} {"train_loss": -27.04903221130371, "global_step": 549162, "epoch": 6616} {"train_loss": -27.19829750061035, "global_step": 549163, "epoch": 6616} {"train_loss": -27.277801513671875, "global_step": 549164, "epoch": 6616} {"train_loss": -27.35409927368164, "global_step": 549165, "epoch": 6616} {"train_loss": -26.961780548095703, "global_step": 549166, "epoch": 6616} {"train_loss": -27.290979385375977, "global_step": 549167, "epoch": 6616} {"train_loss": -27.044721603393555, "global_step": 549168, "epoch": 6616} {"train_loss": -27.500574111938477, "global_step": 549169, "epoch": 6616} {"train_loss": -27.65753746032715, "global_step": 549170, "epoch": 6616} {"train_loss": -27.664228439331055, "global_step": 549171, "epoch": 6616} {"train_loss": -27.738325119018555, "global_step": 549172, "epoch": 6616} {"train_loss": -27.37055015563965, "global_step": 549173, "epoch": 6616} {"train_loss": -27.722187042236328, "global_step": 549174, "epoch": 6616} {"train_loss": -27.614837646484375, "global_step": 549175, "epoch": 6616} {"train_loss": -27.25502586364746, "global_step": 549176, "epoch": 6616} {"train_loss": -27.50421142578125, "global_step": 549177, "epoch": 6616} {"train_loss": -27.6844539642334, "global_step": 549178, "epoch": 6616} {"train_loss": -27.451475143432617, "global_step": 549179, "epoch": 6616} {"train_loss": -27.88751792907715, "global_step": 549180, "epoch": 6616} {"train_loss": -27.62061882019043, "global_step": 549181, "epoch": 6616} {"train_loss": -27.874210357666016, "global_step": 549182, "epoch": 6616} {"train_loss": -27.642866134643555, "global_step": 549183, "epoch": 6616} {"train_loss": -27.575475692749023, "global_step": 549184, "epoch": 6616} {"train_loss": -27.79351234436035, "global_step": 549185, "epoch": 6616} {"train_loss": -27.618749618530273, "global_step": 549186, "epoch": 6616} {"train_loss": -27.927021026611328, "global_step": 549187, "epoch": 6616} {"train_loss": -27.47515296936035, "global_step": 549188, "epoch": 6616} {"train_loss": -27.949539184570312, "global_step": 549189, "epoch": 6616} {"train_loss": -28.10601806640625, "global_step": 549190, "epoch": 6616} {"train_loss": -27.923114776611328, "global_step": 549191, "epoch": 6616} {"train_loss": -27.990467071533203, "global_step": 549192, "epoch": 6616} {"train_loss": -27.48135757446289, "global_step": 549193, "epoch": 6616} {"train_loss": -27.777423858642578, "global_step": 549194, "epoch": 6616} {"train_loss": -27.87725830078125, "global_step": 549195, "epoch": 6616} {"train_loss": -27.72239112854004, "global_step": 549196, "epoch": 6616} {"train_loss": -27.525266647338867, "global_step": 549197, "epoch": 6616} {"train_loss": -28.009450912475586, "global_step": 549198, "epoch": 6616} {"train_loss": -28.00172233581543, "global_step": 549199, "epoch": 6616} {"train_loss": -27.838666915893555, "global_step": 549200, "epoch": 6616} {"train_loss": -28.03260612487793, "global_step": 549201, "epoch": 6616} {"train_loss": -28.031696319580078, "global_step": 549202, "epoch": 6616} {"train_loss": -28.12994956970215, "global_step": 549203, "epoch": 6616} {"train_loss": -27.490758895874023, "global_step": 549204, "epoch": 6616} {"train_loss": -27.84808349609375, "global_step": 549205, "epoch": 6616} {"train_loss": -28.090356826782227, "global_step": 549206, "epoch": 6616} {"train_loss": -27.808216094970703, "global_step": 549207, "epoch": 6616} {"train_loss": -27.675634384155273, "global_step": 549208, "epoch": 6616} {"train_loss": -27.134546279907227, "global_step": 549209, "epoch": 6616} {"train_loss": -27.031884457691607, "global_step": 549210, "epoch": 6616, "val_loss": 6507355.0} {"train_loss": -22.905975341796875, "global_step": 549211, "epoch": 6617} {"train_loss": -24.780811309814453, "global_step": 549212, "epoch": 6617} {"train_loss": -25.049245834350586, "global_step": 549213, "epoch": 6617} {"train_loss": -24.733524322509766, "global_step": 549214, "epoch": 6617} {"train_loss": -26.02362060546875, "global_step": 549215, "epoch": 6617} {"train_loss": -25.103778839111328, "global_step": 549216, "epoch": 6617} {"train_loss": -25.328643798828125, "global_step": 549217, "epoch": 6617} {"train_loss": -26.213855743408203, "global_step": 549218, "epoch": 6617} {"train_loss": -24.8205509185791, "global_step": 549219, "epoch": 6617} {"train_loss": -26.33710289001465, "global_step": 549220, "epoch": 6617} {"train_loss": -25.918140411376953, "global_step": 549221, "epoch": 6617} {"train_loss": -26.46523094177246, "global_step": 549222, "epoch": 6617} {"train_loss": -26.56537437438965, "global_step": 549223, "epoch": 6617} {"train_loss": -26.730682373046875, "global_step": 549224, "epoch": 6617} {"train_loss": -26.37359046936035, "global_step": 549225, "epoch": 6617} {"train_loss": -26.443445205688477, "global_step": 549226, "epoch": 6617} {"train_loss": -26.849964141845703, "global_step": 549227, "epoch": 6617} {"train_loss": -26.225738525390625, "global_step": 549228, "epoch": 6617} {"train_loss": -26.483264923095703, "global_step": 549229, "epoch": 6617} {"train_loss": -27.014511108398438, "global_step": 549230, "epoch": 6617} {"train_loss": -26.360919952392578, "global_step": 549231, "epoch": 6617} {"train_loss": -26.595550537109375, "global_step": 549232, "epoch": 6617} {"train_loss": -26.775976181030273, "global_step": 549233, "epoch": 6617} {"train_loss": -26.897302627563477, "global_step": 549234, "epoch": 6617} {"train_loss": -26.88599967956543, "global_step": 549235, "epoch": 6617} {"train_loss": -27.10723876953125, "global_step": 549236, "epoch": 6617} {"train_loss": -26.712316513061523, "global_step": 549237, "epoch": 6617} {"train_loss": -26.928741455078125, "global_step": 549238, "epoch": 6617} {"train_loss": -26.731653213500977, "global_step": 549239, "epoch": 6617} {"train_loss": -27.200489044189453, "global_step": 549240, "epoch": 6617} {"train_loss": -27.080677032470703, "global_step": 549241, "epoch": 6617} {"train_loss": -27.240890502929688, "global_step": 549242, "epoch": 6617} {"train_loss": -26.798725128173828, "global_step": 549243, "epoch": 6617} {"train_loss": -27.031391143798828, "global_step": 549244, "epoch": 6617} {"train_loss": -27.351917266845703, "global_step": 549245, "epoch": 6617} {"train_loss": -27.37820816040039, "global_step": 549246, "epoch": 6617} {"train_loss": -27.21803855895996, "global_step": 549247, "epoch": 6617} {"train_loss": -26.92384147644043, "global_step": 549248, "epoch": 6617} {"train_loss": -27.296630859375, "global_step": 549249, "epoch": 6617} {"train_loss": -27.04787254333496, "global_step": 549250, "epoch": 6617} {"train_loss": -27.542877197265625, "global_step": 549251, "epoch": 6617} {"train_loss": -27.645978927612305, "global_step": 549252, "epoch": 6617} {"train_loss": -27.58676528930664, "global_step": 549253, "epoch": 6617} {"train_loss": -27.40715980529785, "global_step": 549254, "epoch": 6617} {"train_loss": -27.615264892578125, "global_step": 549255, "epoch": 6617} {"train_loss": -26.946640014648438, "global_step": 549256, "epoch": 6617} {"train_loss": -27.606611251831055, "global_step": 549257, "epoch": 6617} {"train_loss": -27.840051651000977, "global_step": 549258, "epoch": 6617} {"train_loss": -27.612722396850586, "global_step": 549259, "epoch": 6617} {"train_loss": -27.450454711914062, "global_step": 549260, "epoch": 6617} {"train_loss": -27.542348861694336, "global_step": 549261, "epoch": 6617} {"train_loss": -27.81805419921875, "global_step": 549262, "epoch": 6617} {"train_loss": -27.35165786743164, "global_step": 549263, "epoch": 6617} {"train_loss": -27.54143714904785, "global_step": 549264, "epoch": 6617} {"train_loss": -27.35127067565918, "global_step": 549265, "epoch": 6617} {"train_loss": -27.630298614501953, "global_step": 549266, "epoch": 6617} {"train_loss": -27.6090145111084, "global_step": 549267, "epoch": 6617} {"train_loss": -27.524097442626953, "global_step": 549268, "epoch": 6617} {"train_loss": -27.60723876953125, "global_step": 549269, "epoch": 6617} {"train_loss": -27.486677169799805, "global_step": 549270, "epoch": 6617} {"train_loss": -28.026336669921875, "global_step": 549271, "epoch": 6617} {"train_loss": -27.3283634185791, "global_step": 549272, "epoch": 6617} {"train_loss": -27.822011947631836, "global_step": 549273, "epoch": 6617} {"train_loss": -27.14021110534668, "global_step": 549274, "epoch": 6617} {"train_loss": -27.910863876342773, "global_step": 549275, "epoch": 6617} {"train_loss": -27.6555233001709, "global_step": 549276, "epoch": 6617} {"train_loss": -27.854482650756836, "global_step": 549277, "epoch": 6617} {"train_loss": -27.780309677124023, "global_step": 549278, "epoch": 6617} {"train_loss": -27.675617218017578, "global_step": 549279, "epoch": 6617} {"train_loss": -27.857975006103516, "global_step": 549280, "epoch": 6617} {"train_loss": -27.496992111206055, "global_step": 549281, "epoch": 6617} {"train_loss": -27.553424835205078, "global_step": 549282, "epoch": 6617} {"train_loss": -27.808027267456055, "global_step": 549283, "epoch": 6617} {"train_loss": -28.08982276916504, "global_step": 549284, "epoch": 6617} {"train_loss": -27.643741607666016, "global_step": 549285, "epoch": 6617} {"train_loss": -27.836231231689453, "global_step": 549286, "epoch": 6617} {"train_loss": -27.619970321655273, "global_step": 549287, "epoch": 6617} {"train_loss": -27.8525390625, "global_step": 549288, "epoch": 6617} {"train_loss": -27.877111434936523, "global_step": 549289, "epoch": 6617} {"train_loss": -27.381439208984375, "global_step": 549290, "epoch": 6617} {"train_loss": -27.87839698791504, "global_step": 549291, "epoch": 6617} {"train_loss": -27.94095802307129, "global_step": 549292, "epoch": 6617} {"train_loss": -27.043461282569243, "global_step": 549293, "epoch": 6617, "val_loss": 6555194.5} {"train_loss": -27.389942169189453, "global_step": 549294, "epoch": 6618} {"train_loss": -26.784107208251953, "global_step": 549295, "epoch": 6618} {"train_loss": -26.91794776916504, "global_step": 549296, "epoch": 6618} {"train_loss": -27.285724639892578, "global_step": 549297, "epoch": 6618} {"train_loss": -26.903411865234375, "global_step": 549298, "epoch": 6618} {"train_loss": -26.980976104736328, "global_step": 549299, "epoch": 6618} {"train_loss": -27.5263614654541, "global_step": 549300, "epoch": 6618} {"train_loss": -26.950437545776367, "global_step": 549301, "epoch": 6618} {"train_loss": -27.579809188842773, "global_step": 549302, "epoch": 6618} {"train_loss": -27.613956451416016, "global_step": 549303, "epoch": 6618} {"train_loss": -27.107303619384766, "global_step": 549304, "epoch": 6618} {"train_loss": -27.511255264282227, "global_step": 549305, "epoch": 6618} {"train_loss": -27.456369400024414, "global_step": 549306, "epoch": 6618} {"train_loss": -27.489307403564453, "global_step": 549307, "epoch": 6618} {"train_loss": -27.79359245300293, "global_step": 549308, "epoch": 6618} {"train_loss": -27.143463134765625, "global_step": 549309, "epoch": 6618} {"train_loss": -27.64142417907715, "global_step": 549310, "epoch": 6618} {"train_loss": -27.183191299438477, "global_step": 549311, "epoch": 6618} {"train_loss": -27.76676368713379, "global_step": 549312, "epoch": 6618} {"train_loss": -27.30464744567871, "global_step": 549313, "epoch": 6618} {"train_loss": -27.669647216796875, "global_step": 549314, "epoch": 6618} {"train_loss": -27.471847534179688, "global_step": 549315, "epoch": 6618} {"train_loss": -27.245328903198242, "global_step": 549316, "epoch": 6618} {"train_loss": -27.455036163330078, "global_step": 549317, "epoch": 6618} {"train_loss": -27.62749671936035, "global_step": 549318, "epoch": 6618} {"train_loss": -27.383588790893555, "global_step": 549319, "epoch": 6618} {"train_loss": -27.4405517578125, "global_step": 549320, "epoch": 6618} {"train_loss": -27.507587432861328, "global_step": 549321, "epoch": 6618} {"train_loss": -27.822668075561523, "global_step": 549322, "epoch": 6618} {"train_loss": -27.290058135986328, "global_step": 549323, "epoch": 6618} {"train_loss": -27.913599014282227, "global_step": 549324, "epoch": 6618} {"train_loss": -28.038904190063477, "global_step": 549325, "epoch": 6618} {"train_loss": -27.697925567626953, "global_step": 549326, "epoch": 6618} {"train_loss": -27.610218048095703, "global_step": 549327, "epoch": 6618} {"train_loss": -27.8533992767334, "global_step": 549328, "epoch": 6618} {"train_loss": -28.12931251525879, "global_step": 549329, "epoch": 6618} {"train_loss": -27.70931053161621, "global_step": 549330, "epoch": 6618} {"train_loss": -27.78057861328125, "global_step": 549331, "epoch": 6618} {"train_loss": -27.975576400756836, "global_step": 549332, "epoch": 6618} {"train_loss": -28.060277938842773, "global_step": 549333, "epoch": 6618} {"train_loss": -27.729589462280273, "global_step": 549334, "epoch": 6618} {"train_loss": -28.144794464111328, "global_step": 549335, "epoch": 6618} {"train_loss": -27.673437118530273, "global_step": 549336, "epoch": 6618} {"train_loss": -27.64776039123535, "global_step": 549337, "epoch": 6618} {"train_loss": -27.713422775268555, "global_step": 549338, "epoch": 6618} {"train_loss": -28.18793296813965, "global_step": 549339, "epoch": 6618} {"train_loss": -27.76104164123535, "global_step": 549340, "epoch": 6618} {"train_loss": -27.76163101196289, "global_step": 549341, "epoch": 6618} {"train_loss": -28.16041374206543, "global_step": 549342, "epoch": 6618} {"train_loss": -28.217634201049805, "global_step": 549343, "epoch": 6618} {"train_loss": -27.64910316467285, "global_step": 549344, "epoch": 6618} {"train_loss": -28.178363800048828, "global_step": 549345, "epoch": 6618} {"train_loss": -27.910398483276367, "global_step": 549346, "epoch": 6618} {"train_loss": -27.634540557861328, "global_step": 549347, "epoch": 6618} {"train_loss": -27.986478805541992, "global_step": 549348, "epoch": 6618} {"train_loss": -27.79292106628418, "global_step": 549349, "epoch": 6618} {"train_loss": -27.7764949798584, "global_step": 549350, "epoch": 6618} {"train_loss": -27.79554557800293, "global_step": 549351, "epoch": 6618} {"train_loss": -28.377426147460938, "global_step": 549352, "epoch": 6618} {"train_loss": -28.034650802612305, "global_step": 549353, "epoch": 6618} {"train_loss": -27.58477783203125, "global_step": 549354, "epoch": 6618} {"train_loss": -28.296772003173828, "global_step": 549355, "epoch": 6618} {"train_loss": -27.715295791625977, "global_step": 549356, "epoch": 6618} {"train_loss": -28.088666915893555, "global_step": 549357, "epoch": 6618} {"train_loss": -27.960474014282227, "global_step": 549358, "epoch": 6618} {"train_loss": -27.745161056518555, "global_step": 549359, "epoch": 6618} {"train_loss": -27.73798942565918, "global_step": 549360, "epoch": 6618} {"train_loss": -27.475305557250977, "global_step": 549361, "epoch": 6618} {"train_loss": -27.89715576171875, "global_step": 549362, "epoch": 6618} {"train_loss": -27.66806983947754, "global_step": 549363, "epoch": 6618} {"train_loss": -27.916217803955078, "global_step": 549364, "epoch": 6618} {"train_loss": -28.150100708007812, "global_step": 549365, "epoch": 6618} {"train_loss": -27.74725914001465, "global_step": 549366, "epoch": 6618} {"train_loss": -27.88178062438965, "global_step": 549367, "epoch": 6618} {"train_loss": -27.747390747070312, "global_step": 549368, "epoch": 6618} {"train_loss": -27.8585147857666, "global_step": 549369, "epoch": 6618} {"train_loss": -27.579069137573242, "global_step": 549370, "epoch": 6618} {"train_loss": -27.928869247436523, "global_step": 549371, "epoch": 6618} {"train_loss": -27.192768096923828, "global_step": 549372, "epoch": 6618} {"train_loss": -27.95911979675293, "global_step": 549373, "epoch": 6618} {"train_loss": -27.92498207092285, "global_step": 549374, "epoch": 6618} {"train_loss": -27.26885986328125, "global_step": 549375, "epoch": 6618} {"train_loss": -27.6605631357216, "global_step": 549376, "epoch": 6618, "val_loss": 6581413.0} {"train_loss": -26.260345458984375, "global_step": 549377, "epoch": 6619} {"train_loss": -25.320499420166016, "global_step": 549378, "epoch": 6619} {"train_loss": -25.369165420532227, "global_step": 549379, "epoch": 6619} {"train_loss": -26.2593936920166, "global_step": 549380, "epoch": 6619} {"train_loss": -26.835657119750977, "global_step": 549381, "epoch": 6619} {"train_loss": -25.851835250854492, "global_step": 549382, "epoch": 6619} {"train_loss": -26.586328506469727, "global_step": 549383, "epoch": 6619} {"train_loss": -25.80353355407715, "global_step": 549384, "epoch": 6619} {"train_loss": -25.383136749267578, "global_step": 549385, "epoch": 6619} {"train_loss": -26.530292510986328, "global_step": 549386, "epoch": 6619} {"train_loss": -26.407825469970703, "global_step": 549387, "epoch": 6619} {"train_loss": -26.719409942626953, "global_step": 549388, "epoch": 6619} {"train_loss": -26.642541885375977, "global_step": 549389, "epoch": 6619} {"train_loss": -26.78492546081543, "global_step": 549390, "epoch": 6619} {"train_loss": -27.146652221679688, "global_step": 549391, "epoch": 6619} {"train_loss": -27.16651725769043, "global_step": 549392, "epoch": 6619} {"train_loss": -26.60563087463379, "global_step": 549393, "epoch": 6619} {"train_loss": -27.255090713500977, "global_step": 549394, "epoch": 6619} {"train_loss": -26.69710350036621, "global_step": 549395, "epoch": 6619} {"train_loss": -26.984540939331055, "global_step": 549396, "epoch": 6619} {"train_loss": -27.01531982421875, "global_step": 549397, "epoch": 6619} {"train_loss": -27.294584274291992, "global_step": 549398, "epoch": 6619} {"train_loss": -27.103778839111328, "global_step": 549399, "epoch": 6619} {"train_loss": -27.559309005737305, "global_step": 549400, "epoch": 6619} {"train_loss": -27.14893913269043, "global_step": 549401, "epoch": 6619} {"train_loss": -27.297815322875977, "global_step": 549402, "epoch": 6619} {"train_loss": -27.142637252807617, "global_step": 549403, "epoch": 6619} {"train_loss": -27.230945587158203, "global_step": 549404, "epoch": 6619} {"train_loss": -27.316986083984375, "global_step": 549405, "epoch": 6619} {"train_loss": -27.282812118530273, "global_step": 549406, "epoch": 6619} {"train_loss": -27.447895050048828, "global_step": 549407, "epoch": 6619} {"train_loss": -27.491165161132812, "global_step": 549408, "epoch": 6619} {"train_loss": -27.857023239135742, "global_step": 549409, "epoch": 6619} {"train_loss": -27.480091094970703, "global_step": 549410, "epoch": 6619} {"train_loss": -27.265100479125977, "global_step": 549411, "epoch": 6619} {"train_loss": -27.56980323791504, "global_step": 549412, "epoch": 6619} {"train_loss": -27.496084213256836, "global_step": 549413, "epoch": 6619} {"train_loss": -27.71497917175293, "global_step": 549414, "epoch": 6619} {"train_loss": -27.6455135345459, "global_step": 549415, "epoch": 6619} {"train_loss": -27.58707618713379, "global_step": 549416, "epoch": 6619} {"train_loss": -27.534351348876953, "global_step": 549417, "epoch": 6619} {"train_loss": -27.583667755126953, "global_step": 549418, "epoch": 6619} {"train_loss": -27.66162109375, "global_step": 549419, "epoch": 6619} {"train_loss": -27.55475425720215, "global_step": 549420, "epoch": 6619} {"train_loss": -27.823339462280273, "global_step": 549421, "epoch": 6619} {"train_loss": -27.789575576782227, "global_step": 549422, "epoch": 6619} {"train_loss": -27.782928466796875, "global_step": 549423, "epoch": 6619} {"train_loss": -27.504199981689453, "global_step": 549424, "epoch": 6619} {"train_loss": -27.9139404296875, "global_step": 549425, "epoch": 6619} {"train_loss": -27.76588249206543, "global_step": 549426, "epoch": 6619} {"train_loss": -27.822412490844727, "global_step": 549427, "epoch": 6619} {"train_loss": -27.880634307861328, "global_step": 549428, "epoch": 6619} {"train_loss": -28.285907745361328, "global_step": 549429, "epoch": 6619} {"train_loss": -27.955835342407227, "global_step": 549430, "epoch": 6619} {"train_loss": -27.84742546081543, "global_step": 549431, "epoch": 6619} {"train_loss": -27.790821075439453, "global_step": 549432, "epoch": 6619} {"train_loss": -27.89701271057129, "global_step": 549433, "epoch": 6619} {"train_loss": -28.028400421142578, "global_step": 549434, "epoch": 6619} {"train_loss": -27.82984733581543, "global_step": 549435, "epoch": 6619} {"train_loss": -27.735828399658203, "global_step": 549436, "epoch": 6619} {"train_loss": -28.08255386352539, "global_step": 549437, "epoch": 6619} {"train_loss": -27.7879695892334, "global_step": 549438, "epoch": 6619} {"train_loss": -27.79786491394043, "global_step": 549439, "epoch": 6619} {"train_loss": -28.029834747314453, "global_step": 549440, "epoch": 6619} {"train_loss": -28.177845001220703, "global_step": 549441, "epoch": 6619} {"train_loss": -28.087554931640625, "global_step": 549442, "epoch": 6619} {"train_loss": -27.8707275390625, "global_step": 549443, "epoch": 6619} {"train_loss": -27.66620445251465, "global_step": 549444, "epoch": 6619} {"train_loss": -28.0728816986084, "global_step": 549445, "epoch": 6619} {"train_loss": -27.81134033203125, "global_step": 549446, "epoch": 6619} {"train_loss": -28.1024112701416, "global_step": 549447, "epoch": 6619} {"train_loss": -27.8043270111084, "global_step": 549448, "epoch": 6619} {"train_loss": -27.791797637939453, "global_step": 549449, "epoch": 6619} {"train_loss": -28.0676326751709, "global_step": 549450, "epoch": 6619} {"train_loss": -27.6761417388916, "global_step": 549451, "epoch": 6619} {"train_loss": -27.692371368408203, "global_step": 549452, "epoch": 6619} {"train_loss": -27.98408317565918, "global_step": 549453, "epoch": 6619} {"train_loss": -28.17568016052246, "global_step": 549454, "epoch": 6619} {"train_loss": -27.748748779296875, "global_step": 549455, "epoch": 6619} {"train_loss": -27.98097801208496, "global_step": 549456, "epoch": 6619} {"train_loss": -27.823272705078125, "global_step": 549457, "epoch": 6619} {"train_loss": -27.51252555847168, "global_step": 549458, "epoch": 6619} {"train_loss": -27.399490310485106, "global_step": 549459, "epoch": 6619, "val_loss": 6494331.0} {"train_loss": -26.858041763305664, "global_step": 549460, "epoch": 6620} {"train_loss": -26.523101806640625, "global_step": 549461, "epoch": 6620} {"train_loss": -26.264379501342773, "global_step": 549462, "epoch": 6620} {"train_loss": -25.570005416870117, "global_step": 549463, "epoch": 6620} {"train_loss": -26.451467514038086, "global_step": 549464, "epoch": 6620} {"train_loss": -26.170272827148438, "global_step": 549465, "epoch": 6620} {"train_loss": -26.952295303344727, "global_step": 549466, "epoch": 6620} {"train_loss": -26.918380737304688, "global_step": 549467, "epoch": 6620} {"train_loss": -26.8764591217041, "global_step": 549468, "epoch": 6620} {"train_loss": -26.809234619140625, "global_step": 549469, "epoch": 6620} {"train_loss": -26.961181640625, "global_step": 549470, "epoch": 6620} {"train_loss": -26.86806297302246, "global_step": 549471, "epoch": 6620} {"train_loss": -27.01594352722168, "global_step": 549472, "epoch": 6620} {"train_loss": -27.235111236572266, "global_step": 549473, "epoch": 6620} {"train_loss": -27.331247329711914, "global_step": 549474, "epoch": 6620} {"train_loss": -27.0312557220459, "global_step": 549475, "epoch": 6620} {"train_loss": -26.752246856689453, "global_step": 549476, "epoch": 6620} {"train_loss": -27.402313232421875, "global_step": 549477, "epoch": 6620} {"train_loss": -27.08396339416504, "global_step": 549478, "epoch": 6620} {"train_loss": -27.203649520874023, "global_step": 549479, "epoch": 6620} {"train_loss": -27.493066787719727, "global_step": 549480, "epoch": 6620} {"train_loss": -26.747146606445312, "global_step": 549481, "epoch": 6620} {"train_loss": -27.110015869140625, "global_step": 549482, "epoch": 6620} {"train_loss": -26.912595748901367, "global_step": 549483, "epoch": 6620} {"train_loss": -27.463546752929688, "global_step": 549484, "epoch": 6620} {"train_loss": -27.59681510925293, "global_step": 549485, "epoch": 6620} {"train_loss": -27.64484214782715, "global_step": 549486, "epoch": 6620} {"train_loss": -27.778289794921875, "global_step": 549487, "epoch": 6620} {"train_loss": -27.534170150756836, "global_step": 549488, "epoch": 6620} {"train_loss": -27.35359001159668, "global_step": 549489, "epoch": 6620} {"train_loss": -27.21441650390625, "global_step": 549490, "epoch": 6620} {"train_loss": -27.38494873046875, "global_step": 549491, "epoch": 6620} {"train_loss": -27.816547393798828, "global_step": 549492, "epoch": 6620} {"train_loss": -27.22157096862793, "global_step": 549493, "epoch": 6620} {"train_loss": -27.912626266479492, "global_step": 549494, "epoch": 6620} {"train_loss": -27.51496696472168, "global_step": 549495, "epoch": 6620} {"train_loss": -27.7403507232666, "global_step": 549496, "epoch": 6620} {"train_loss": -27.643295288085938, "global_step": 549497, "epoch": 6620} {"train_loss": -27.481281280517578, "global_step": 549498, "epoch": 6620} {"train_loss": -27.803693771362305, "global_step": 549499, "epoch": 6620} {"train_loss": -27.809833526611328, "global_step": 549500, "epoch": 6620} {"train_loss": -27.46319007873535, "global_step": 549501, "epoch": 6620} {"train_loss": -27.93006706237793, "global_step": 549502, "epoch": 6620} {"train_loss": -27.5407657623291, "global_step": 549503, "epoch": 6620} {"train_loss": -27.730422973632812, "global_step": 549504, "epoch": 6620} {"train_loss": -27.618366241455078, "global_step": 549505, "epoch": 6620} {"train_loss": -27.89661979675293, "global_step": 549506, "epoch": 6620} {"train_loss": -27.712848663330078, "global_step": 549507, "epoch": 6620} {"train_loss": -28.071353912353516, "global_step": 549508, "epoch": 6620} {"train_loss": -27.926761627197266, "global_step": 549509, "epoch": 6620} {"train_loss": -27.952672958374023, "global_step": 549510, "epoch": 6620} {"train_loss": -27.898954391479492, "global_step": 549511, "epoch": 6620} {"train_loss": -27.7043514251709, "global_step": 549512, "epoch": 6620} {"train_loss": -28.027368545532227, "global_step": 549513, "epoch": 6620} {"train_loss": -28.026716232299805, "global_step": 549514, "epoch": 6620} {"train_loss": -28.117462158203125, "global_step": 549515, "epoch": 6620} {"train_loss": -28.04701805114746, "global_step": 549516, "epoch": 6620} {"train_loss": -28.007892608642578, "global_step": 549517, "epoch": 6620} {"train_loss": -27.530920028686523, "global_step": 549518, "epoch": 6620} {"train_loss": -27.768207550048828, "global_step": 549519, "epoch": 6620} {"train_loss": -27.9427547454834, "global_step": 549520, "epoch": 6620} {"train_loss": -28.026227951049805, "global_step": 549521, "epoch": 6620} {"train_loss": -27.963483810424805, "global_step": 549522, "epoch": 6620} {"train_loss": -28.074295043945312, "global_step": 549523, "epoch": 6620} {"train_loss": -27.943695068359375, "global_step": 549524, "epoch": 6620} {"train_loss": -27.57484245300293, "global_step": 549525, "epoch": 6620} {"train_loss": -27.962158203125, "global_step": 549526, "epoch": 6620} {"train_loss": -27.7584228515625, "global_step": 549527, "epoch": 6620} {"train_loss": -27.583480834960938, "global_step": 549528, "epoch": 6620} {"train_loss": -27.715543746948242, "global_step": 549529, "epoch": 6620} {"train_loss": -28.410449981689453, "global_step": 549530, "epoch": 6620} {"train_loss": -27.37823486328125, "global_step": 549531, "epoch": 6620} {"train_loss": -27.118494033813477, "global_step": 549532, "epoch": 6620} {"train_loss": -26.66902732849121, "global_step": 549533, "epoch": 6620} {"train_loss": -27.176095962524414, "global_step": 549534, "epoch": 6620} {"train_loss": -28.113784790039062, "global_step": 549535, "epoch": 6620} {"train_loss": -27.643644332885742, "global_step": 549536, "epoch": 6620} {"train_loss": -27.3216609954834, "global_step": 549537, "epoch": 6620} {"train_loss": -27.844343185424805, "global_step": 549538, "epoch": 6620} {"train_loss": -27.506505966186523, "global_step": 549539, "epoch": 6620} {"train_loss": -27.457136154174805, "global_step": 549540, "epoch": 6620} {"train_loss": -27.44418716430664, "global_step": 549541, "epoch": 6620} {"train_loss": -27.45974821067718, "global_step": 549542, "epoch": 6620, "val_loss": 6434575.0} {"train_loss": -27.453632354736328, "global_step": 549543, "epoch": 6621} {"train_loss": -27.377166748046875, "global_step": 549544, "epoch": 6621} {"train_loss": -27.332128524780273, "global_step": 549545, "epoch": 6621} {"train_loss": -27.33222007751465, "global_step": 549546, "epoch": 6621} {"train_loss": -27.447961807250977, "global_step": 549547, "epoch": 6621} {"train_loss": -27.30792808532715, "global_step": 549548, "epoch": 6621} {"train_loss": -27.632553100585938, "global_step": 549549, "epoch": 6621} {"train_loss": -27.81568717956543, "global_step": 549550, "epoch": 6621} {"train_loss": -27.502477645874023, "global_step": 549551, "epoch": 6621} {"train_loss": -27.718481063842773, "global_step": 549552, "epoch": 6621} {"train_loss": -27.561323165893555, "global_step": 549553, "epoch": 6621} {"train_loss": -27.53510093688965, "global_step": 549554, "epoch": 6621} {"train_loss": -27.39957046508789, "global_step": 549555, "epoch": 6621} {"train_loss": -27.37209129333496, "global_step": 549556, "epoch": 6621} {"train_loss": -27.462682723999023, "global_step": 549557, "epoch": 6621} {"train_loss": -27.783695220947266, "global_step": 549558, "epoch": 6621} {"train_loss": -27.7789363861084, "global_step": 549559, "epoch": 6621} {"train_loss": -27.845487594604492, "global_step": 549560, "epoch": 6621} {"train_loss": -27.597522735595703, "global_step": 549561, "epoch": 6621} {"train_loss": -28.04615592956543, "global_step": 549562, "epoch": 6621} {"train_loss": -27.52937889099121, "global_step": 549563, "epoch": 6621} {"train_loss": -27.73724937438965, "global_step": 549564, "epoch": 6621} {"train_loss": -27.51708984375, "global_step": 549565, "epoch": 6621} {"train_loss": -27.447370529174805, "global_step": 549566, "epoch": 6621} {"train_loss": -27.046253204345703, "global_step": 549567, "epoch": 6621} {"train_loss": -27.2622013092041, "global_step": 549568, "epoch": 6621} {"train_loss": -27.516834259033203, "global_step": 549569, "epoch": 6621} {"train_loss": -27.617544174194336, "global_step": 549570, "epoch": 6621} {"train_loss": -27.744565963745117, "global_step": 549571, "epoch": 6621} {"train_loss": -27.860885620117188, "global_step": 549572, "epoch": 6621} {"train_loss": -27.70438003540039, "global_step": 549573, "epoch": 6621} {"train_loss": -27.839197158813477, "global_step": 549574, "epoch": 6621} {"train_loss": -27.917551040649414, "global_step": 549575, "epoch": 6621} {"train_loss": -27.858129501342773, "global_step": 549576, "epoch": 6621} {"train_loss": -27.83335304260254, "global_step": 549577, "epoch": 6621} {"train_loss": -28.14192008972168, "global_step": 549578, "epoch": 6621} {"train_loss": -27.646055221557617, "global_step": 549579, "epoch": 6621} {"train_loss": -28.023313522338867, "global_step": 549580, "epoch": 6621} {"train_loss": -27.752893447875977, "global_step": 549581, "epoch": 6621} {"train_loss": -27.44813346862793, "global_step": 549582, "epoch": 6621} {"train_loss": -27.639211654663086, "global_step": 549583, "epoch": 6621} {"train_loss": -27.89348793029785, "global_step": 549584, "epoch": 6621} {"train_loss": -27.6635684967041, "global_step": 549585, "epoch": 6621} {"train_loss": -27.55647087097168, "global_step": 549586, "epoch": 6621} {"train_loss": -27.821990966796875, "global_step": 549587, "epoch": 6621} {"train_loss": -27.979406356811523, "global_step": 549588, "epoch": 6621} {"train_loss": -27.8033504486084, "global_step": 549589, "epoch": 6621} {"train_loss": -27.822187423706055, "global_step": 549590, "epoch": 6621} {"train_loss": -27.70452308654785, "global_step": 549591, "epoch": 6621} {"train_loss": -27.876569747924805, "global_step": 549592, "epoch": 6621} {"train_loss": -27.755334854125977, "global_step": 549593, "epoch": 6621} {"train_loss": -27.765039443969727, "global_step": 549594, "epoch": 6621} {"train_loss": -27.889577865600586, "global_step": 549595, "epoch": 6621} {"train_loss": -27.821218490600586, "global_step": 549596, "epoch": 6621} {"train_loss": -27.90980339050293, "global_step": 549597, "epoch": 6621} {"train_loss": -27.965072631835938, "global_step": 549598, "epoch": 6621} {"train_loss": -27.8792667388916, "global_step": 549599, "epoch": 6621} {"train_loss": -27.858495712280273, "global_step": 549600, "epoch": 6621} {"train_loss": -27.708789825439453, "global_step": 549601, "epoch": 6621} {"train_loss": -27.875768661499023, "global_step": 549602, "epoch": 6621} {"train_loss": -27.778417587280273, "global_step": 549603, "epoch": 6621} {"train_loss": -28.305988311767578, "global_step": 549604, "epoch": 6621} {"train_loss": -28.021177291870117, "global_step": 549605, "epoch": 6621} {"train_loss": -27.694171905517578, "global_step": 549606, "epoch": 6621} {"train_loss": -27.8330078125, "global_step": 549607, "epoch": 6621} {"train_loss": -27.748687744140625, "global_step": 549608, "epoch": 6621} {"train_loss": -28.106281280517578, "global_step": 549609, "epoch": 6621} {"train_loss": -27.709918975830078, "global_step": 549610, "epoch": 6621} {"train_loss": -27.804645538330078, "global_step": 549611, "epoch": 6621} {"train_loss": -27.62593650817871, "global_step": 549612, "epoch": 6621} {"train_loss": -28.063159942626953, "global_step": 549613, "epoch": 6621} {"train_loss": -27.62782859802246, "global_step": 549614, "epoch": 6621} {"train_loss": -28.024417877197266, "global_step": 549615, "epoch": 6621} {"train_loss": -27.6835994720459, "global_step": 549616, "epoch": 6621} {"train_loss": -27.8173770904541, "global_step": 549617, "epoch": 6621} {"train_loss": -27.8238525390625, "global_step": 549618, "epoch": 6621} {"train_loss": -27.5180606842041, "global_step": 549619, "epoch": 6621} {"train_loss": -28.136993408203125, "global_step": 549620, "epoch": 6621} {"train_loss": -27.99091911315918, "global_step": 549621, "epoch": 6621} {"train_loss": -27.640249252319336, "global_step": 549622, "epoch": 6621} {"train_loss": -27.929428100585938, "global_step": 549623, "epoch": 6621} {"train_loss": -27.778289794921875, "global_step": 549624, "epoch": 6621} {"train_loss": -27.730868925531226, "global_step": 549625, "epoch": 6621, "val_loss": 6342198.0} {"train_loss": -27.267032623291016, "global_step": 549626, "epoch": 6622} {"train_loss": -26.589696884155273, "global_step": 549627, "epoch": 6622} {"train_loss": -26.720550537109375, "global_step": 549628, "epoch": 6622} {"train_loss": -26.78773307800293, "global_step": 549629, "epoch": 6622} {"train_loss": -27.158849716186523, "global_step": 549630, "epoch": 6622} {"train_loss": -26.2993221282959, "global_step": 549631, "epoch": 6622} {"train_loss": -26.15665054321289, "global_step": 549632, "epoch": 6622} {"train_loss": -26.86299705505371, "global_step": 549633, "epoch": 6622} {"train_loss": -26.68462562561035, "global_step": 549634, "epoch": 6622} {"train_loss": -27.095111846923828, "global_step": 549635, "epoch": 6622} {"train_loss": -26.7255859375, "global_step": 549636, "epoch": 6622} {"train_loss": -27.158374786376953, "global_step": 549637, "epoch": 6622} {"train_loss": -26.711963653564453, "global_step": 549638, "epoch": 6622} {"train_loss": -26.859914779663086, "global_step": 549639, "epoch": 6622} {"train_loss": -27.230283737182617, "global_step": 549640, "epoch": 6622} {"train_loss": -26.885351181030273, "global_step": 549641, "epoch": 6622} {"train_loss": -27.51539421081543, "global_step": 549642, "epoch": 6622} {"train_loss": -27.43084716796875, "global_step": 549643, "epoch": 6622} {"train_loss": -27.123571395874023, "global_step": 549644, "epoch": 6622} {"train_loss": -27.409162521362305, "global_step": 549645, "epoch": 6622} {"train_loss": -27.346216201782227, "global_step": 549646, "epoch": 6622} {"train_loss": -27.465864181518555, "global_step": 549647, "epoch": 6622} {"train_loss": -27.4931640625, "global_step": 549648, "epoch": 6622} {"train_loss": -27.6341552734375, "global_step": 549649, "epoch": 6622} {"train_loss": -27.45694923400879, "global_step": 549650, "epoch": 6622} {"train_loss": -27.616260528564453, "global_step": 549651, "epoch": 6622} {"train_loss": -27.8096981048584, "global_step": 549652, "epoch": 6622} {"train_loss": -27.248706817626953, "global_step": 549653, "epoch": 6622} {"train_loss": -27.53907585144043, "global_step": 549654, "epoch": 6622} {"train_loss": -27.647480010986328, "global_step": 549655, "epoch": 6622} {"train_loss": -27.648605346679688, "global_step": 549656, "epoch": 6622} {"train_loss": -27.896484375, "global_step": 549657, "epoch": 6622} {"train_loss": -27.423070907592773, "global_step": 549658, "epoch": 6622} {"train_loss": -27.7336483001709, "global_step": 549659, "epoch": 6622} {"train_loss": -27.498701095581055, "global_step": 549660, "epoch": 6622} {"train_loss": -27.574493408203125, "global_step": 549661, "epoch": 6622} {"train_loss": -27.81391716003418, "global_step": 549662, "epoch": 6622} {"train_loss": -27.696033477783203, "global_step": 549663, "epoch": 6622} {"train_loss": -27.76411247253418, "global_step": 549664, "epoch": 6622} {"train_loss": -27.669239044189453, "global_step": 549665, "epoch": 6622} {"train_loss": -27.927886962890625, "global_step": 549666, "epoch": 6622} {"train_loss": -27.801496505737305, "global_step": 549667, "epoch": 6622} {"train_loss": -28.0945987701416, "global_step": 549668, "epoch": 6622} {"train_loss": -28.215192794799805, "global_step": 549669, "epoch": 6622} {"train_loss": -27.512048721313477, "global_step": 549670, "epoch": 6622} {"train_loss": -28.223388671875, "global_step": 549671, "epoch": 6622} {"train_loss": -27.9247989654541, "global_step": 549672, "epoch": 6622} {"train_loss": -27.673547744750977, "global_step": 549673, "epoch": 6622} {"train_loss": -27.981918334960938, "global_step": 549674, "epoch": 6622} {"train_loss": -27.58466148376465, "global_step": 549675, "epoch": 6622} {"train_loss": -28.107421875, "global_step": 549676, "epoch": 6622} {"train_loss": -28.189136505126953, "global_step": 549677, "epoch": 6622} {"train_loss": -27.799835205078125, "global_step": 549678, "epoch": 6622} {"train_loss": -27.605138778686523, "global_step": 549679, "epoch": 6622} {"train_loss": -27.748083114624023, "global_step": 549680, "epoch": 6622} {"train_loss": -27.9139461517334, "global_step": 549681, "epoch": 6622} {"train_loss": -28.30447769165039, "global_step": 549682, "epoch": 6622} {"train_loss": -27.714338302612305, "global_step": 549683, "epoch": 6622} {"train_loss": -27.442825317382812, "global_step": 549684, "epoch": 6622} {"train_loss": -27.479578018188477, "global_step": 549685, "epoch": 6622} {"train_loss": -27.847021102905273, "global_step": 549686, "epoch": 6622} {"train_loss": -27.542661666870117, "global_step": 549687, "epoch": 6622} {"train_loss": -27.798095703125, "global_step": 549688, "epoch": 6622} {"train_loss": -27.933286666870117, "global_step": 549689, "epoch": 6622} {"train_loss": -27.869165420532227, "global_step": 549690, "epoch": 6622} {"train_loss": -27.680633544921875, "global_step": 549691, "epoch": 6622} {"train_loss": -27.783864974975586, "global_step": 549692, "epoch": 6622} {"train_loss": -27.865360260009766, "global_step": 549693, "epoch": 6622} {"train_loss": -27.923261642456055, "global_step": 549694, "epoch": 6622} {"train_loss": -28.1524715423584, "global_step": 549695, "epoch": 6622} {"train_loss": -27.6822509765625, "global_step": 549696, "epoch": 6622} {"train_loss": -27.844289779663086, "global_step": 549697, "epoch": 6622} {"train_loss": -27.74678611755371, "global_step": 549698, "epoch": 6622} {"train_loss": -27.970022201538086, "global_step": 549699, "epoch": 6622} {"train_loss": -27.77349853515625, "global_step": 549700, "epoch": 6622} {"train_loss": -28.16400146484375, "global_step": 549701, "epoch": 6622} {"train_loss": -27.822118759155273, "global_step": 549702, "epoch": 6622} {"train_loss": -27.71497917175293, "global_step": 549703, "epoch": 6622} {"train_loss": -27.832677841186523, "global_step": 549704, "epoch": 6622} {"train_loss": -27.974517822265625, "global_step": 549705, "epoch": 6622} {"train_loss": -28.07826805114746, "global_step": 549706, "epoch": 6622} {"train_loss": -28.16486167907715, "global_step": 549707, "epoch": 6622} {"train_loss": -27.571321648287487, "global_step": 549708, "epoch": 6622, "val_loss": 6538067.0} {"train_loss": -25.591230392456055, "global_step": 549709, "epoch": 6623} {"train_loss": -19.866687774658203, "global_step": 549710, "epoch": 6623} {"train_loss": -17.121068954467773, "global_step": 549711, "epoch": 6623} {"train_loss": -25.910263061523438, "global_step": 549712, "epoch": 6623} {"train_loss": -22.073869705200195, "global_step": 549713, "epoch": 6623} {"train_loss": -26.078725814819336, "global_step": 549714, "epoch": 6623} {"train_loss": -23.309768676757812, "global_step": 549715, "epoch": 6623} {"train_loss": -25.459823608398438, "global_step": 549716, "epoch": 6623} {"train_loss": -25.287063598632812, "global_step": 549717, "epoch": 6623} {"train_loss": -26.074909210205078, "global_step": 549718, "epoch": 6623} {"train_loss": -24.80762481689453, "global_step": 549719, "epoch": 6623} {"train_loss": -25.6085262298584, "global_step": 549720, "epoch": 6623} {"train_loss": -26.260761260986328, "global_step": 549721, "epoch": 6623} {"train_loss": -25.977277755737305, "global_step": 549722, "epoch": 6623} {"train_loss": -25.008766174316406, "global_step": 549723, "epoch": 6623} {"train_loss": -26.193166732788086, "global_step": 549724, "epoch": 6623} {"train_loss": -26.028940200805664, "global_step": 549725, "epoch": 6623} {"train_loss": -26.073352813720703, "global_step": 549726, "epoch": 6623} {"train_loss": -26.07783317565918, "global_step": 549727, "epoch": 6623} {"train_loss": -26.4765567779541, "global_step": 549728, "epoch": 6623} {"train_loss": -26.113208770751953, "global_step": 549729, "epoch": 6623} {"train_loss": -26.69513511657715, "global_step": 549730, "epoch": 6623} {"train_loss": -26.61445426940918, "global_step": 549731, "epoch": 6623} {"train_loss": -26.47296142578125, "global_step": 549732, "epoch": 6623} {"train_loss": -26.55208396911621, "global_step": 549733, "epoch": 6623} {"train_loss": -26.4631290435791, "global_step": 549734, "epoch": 6623} {"train_loss": -26.570810317993164, "global_step": 549735, "epoch": 6623} {"train_loss": -26.562255859375, "global_step": 549736, "epoch": 6623} {"train_loss": -26.87405776977539, "global_step": 549737, "epoch": 6623} {"train_loss": -26.904342651367188, "global_step": 549738, "epoch": 6623} {"train_loss": -27.119434356689453, "global_step": 549739, "epoch": 6623} {"train_loss": -26.841421127319336, "global_step": 549740, "epoch": 6623} {"train_loss": -26.78385353088379, "global_step": 549741, "epoch": 6623} {"train_loss": -27.026880264282227, "global_step": 549742, "epoch": 6623} {"train_loss": -26.958051681518555, "global_step": 549743, "epoch": 6623} {"train_loss": -27.022659301757812, "global_step": 549744, "epoch": 6623} {"train_loss": -26.965499877929688, "global_step": 549745, "epoch": 6623} {"train_loss": -27.191761016845703, "global_step": 549746, "epoch": 6623} {"train_loss": -27.26881217956543, "global_step": 549747, "epoch": 6623} {"train_loss": -27.55569839477539, "global_step": 549748, "epoch": 6623} {"train_loss": -27.126117706298828, "global_step": 549749, "epoch": 6623} {"train_loss": -27.285329818725586, "global_step": 549750, "epoch": 6623} {"train_loss": -27.092992782592773, "global_step": 549751, "epoch": 6623} {"train_loss": -27.601964950561523, "global_step": 549752, "epoch": 6623} {"train_loss": -27.51381492614746, "global_step": 549753, "epoch": 6623} {"train_loss": -27.260910034179688, "global_step": 549754, "epoch": 6623} {"train_loss": -27.284591674804688, "global_step": 549755, "epoch": 6623} {"train_loss": -27.115386962890625, "global_step": 549756, "epoch": 6623} {"train_loss": -27.278661727905273, "global_step": 549757, "epoch": 6623} {"train_loss": -27.136768341064453, "global_step": 549758, "epoch": 6623} {"train_loss": -27.175119400024414, "global_step": 549759, "epoch": 6623} {"train_loss": -27.256271362304688, "global_step": 549760, "epoch": 6623} {"train_loss": -27.33915138244629, "global_step": 549761, "epoch": 6623} {"train_loss": -27.443586349487305, "global_step": 549762, "epoch": 6623} {"train_loss": -27.317764282226562, "global_step": 549763, "epoch": 6623} {"train_loss": -27.02662467956543, "global_step": 549764, "epoch": 6623} {"train_loss": -27.46918296813965, "global_step": 549765, "epoch": 6623} {"train_loss": -27.792224884033203, "global_step": 549766, "epoch": 6623} {"train_loss": -28.014677047729492, "global_step": 549767, "epoch": 6623} {"train_loss": -27.479246139526367, "global_step": 549768, "epoch": 6623} {"train_loss": -27.60597038269043, "global_step": 549769, "epoch": 6623} {"train_loss": -27.619535446166992, "global_step": 549770, "epoch": 6623} {"train_loss": -27.54117774963379, "global_step": 549771, "epoch": 6623} {"train_loss": -27.39643669128418, "global_step": 549772, "epoch": 6623} {"train_loss": -27.786666870117188, "global_step": 549773, "epoch": 6623} {"train_loss": -28.057910919189453, "global_step": 549774, "epoch": 6623} {"train_loss": -27.917261123657227, "global_step": 549775, "epoch": 6623} {"train_loss": -27.496545791625977, "global_step": 549776, "epoch": 6623} {"train_loss": -27.60517692565918, "global_step": 549777, "epoch": 6623} {"train_loss": -27.767776489257812, "global_step": 549778, "epoch": 6623} {"train_loss": -27.72499656677246, "global_step": 549779, "epoch": 6623} {"train_loss": -27.188562393188477, "global_step": 549780, "epoch": 6623} {"train_loss": -27.73176383972168, "global_step": 549781, "epoch": 6623} {"train_loss": -27.864721298217773, "global_step": 549782, "epoch": 6623} {"train_loss": -27.872833251953125, "global_step": 549783, "epoch": 6623} {"train_loss": -27.607385635375977, "global_step": 549784, "epoch": 6623} {"train_loss": -27.2663516998291, "global_step": 549785, "epoch": 6623} {"train_loss": -27.533666610717773, "global_step": 549786, "epoch": 6623} {"train_loss": -27.681116104125977, "global_step": 549787, "epoch": 6623} {"train_loss": -28.155994415283203, "global_step": 549788, "epoch": 6623} {"train_loss": -28.23700523376465, "global_step": 549789, "epoch": 6623} {"train_loss": -27.570026397705078, "global_step": 549790, "epoch": 6623} {"train_loss": -26.714980826320417, "global_step": 549791, "epoch": 6623, "val_loss": 6690931.0} {"train_loss": -27.133441925048828, "global_step": 549792, "epoch": 6624} {"train_loss": -26.403518676757812, "global_step": 549793, "epoch": 6624} {"train_loss": -27.4466495513916, "global_step": 549794, "epoch": 6624} {"train_loss": -27.318307876586914, "global_step": 549795, "epoch": 6624} {"train_loss": -26.919118881225586, "global_step": 549796, "epoch": 6624} {"train_loss": -26.87055778503418, "global_step": 549797, "epoch": 6624} {"train_loss": -26.81829261779785, "global_step": 549798, "epoch": 6624} {"train_loss": -27.498289108276367, "global_step": 549799, "epoch": 6624} {"train_loss": -27.181201934814453, "global_step": 549800, "epoch": 6624} {"train_loss": -27.61822509765625, "global_step": 549801, "epoch": 6624} {"train_loss": -27.406524658203125, "global_step": 549802, "epoch": 6624} {"train_loss": -26.872913360595703, "global_step": 549803, "epoch": 6624} {"train_loss": -27.411117553710938, "global_step": 549804, "epoch": 6624} {"train_loss": -27.193845748901367, "global_step": 549805, "epoch": 6624} {"train_loss": -27.3144474029541, "global_step": 549806, "epoch": 6624} {"train_loss": -27.58656883239746, "global_step": 549807, "epoch": 6624} {"train_loss": -27.082914352416992, "global_step": 549808, "epoch": 6624} {"train_loss": -27.284992218017578, "global_step": 549809, "epoch": 6624} {"train_loss": -27.151081085205078, "global_step": 549810, "epoch": 6624} {"train_loss": -27.332605361938477, "global_step": 549811, "epoch": 6624} {"train_loss": -27.94928550720215, "global_step": 549812, "epoch": 6624} {"train_loss": -27.530059814453125, "global_step": 549813, "epoch": 6624} {"train_loss": -27.406591415405273, "global_step": 549814, "epoch": 6624} {"train_loss": -27.307336807250977, "global_step": 549815, "epoch": 6624} {"train_loss": -27.886289596557617, "global_step": 549816, "epoch": 6624} {"train_loss": -27.82564353942871, "global_step": 549817, "epoch": 6624} {"train_loss": -27.69140625, "global_step": 549818, "epoch": 6624} {"train_loss": -27.678592681884766, "global_step": 549819, "epoch": 6624} {"train_loss": -27.2734317779541, "global_step": 549820, "epoch": 6624} {"train_loss": -27.576496124267578, "global_step": 549821, "epoch": 6624} {"train_loss": -27.647506713867188, "global_step": 549822, "epoch": 6624} {"train_loss": -27.806976318359375, "global_step": 549823, "epoch": 6624} {"train_loss": -27.701068878173828, "global_step": 549824, "epoch": 6624} {"train_loss": -27.454687118530273, "global_step": 549825, "epoch": 6624} {"train_loss": -27.759937286376953, "global_step": 549826, "epoch": 6624} {"train_loss": -27.368026733398438, "global_step": 549827, "epoch": 6624} {"train_loss": -27.778223037719727, "global_step": 549828, "epoch": 6624} {"train_loss": -27.853925704956055, "global_step": 549829, "epoch": 6624} {"train_loss": -27.744001388549805, "global_step": 549830, "epoch": 6624} {"train_loss": -27.778766632080078, "global_step": 549831, "epoch": 6624} {"train_loss": -27.5300350189209, "global_step": 549832, "epoch": 6624} {"train_loss": -27.910531997680664, "global_step": 549833, "epoch": 6624} {"train_loss": -27.5803279876709, "global_step": 549834, "epoch": 6624} {"train_loss": -27.6806583404541, "global_step": 549835, "epoch": 6624} {"train_loss": -27.958948135375977, "global_step": 549836, "epoch": 6624} {"train_loss": -27.874082565307617, "global_step": 549837, "epoch": 6624} {"train_loss": -27.777114868164062, "global_step": 549838, "epoch": 6624} {"train_loss": -28.134021759033203, "global_step": 549839, "epoch": 6624} {"train_loss": -27.8662109375, "global_step": 549840, "epoch": 6624} {"train_loss": -27.640562057495117, "global_step": 549841, "epoch": 6624} {"train_loss": -27.70248794555664, "global_step": 549842, "epoch": 6624} {"train_loss": -27.516422271728516, "global_step": 549843, "epoch": 6624} {"train_loss": -27.466312408447266, "global_step": 549844, "epoch": 6624} {"train_loss": -27.68995475769043, "global_step": 549845, "epoch": 6624} {"train_loss": -27.74028968811035, "global_step": 549846, "epoch": 6624} {"train_loss": -28.120670318603516, "global_step": 549847, "epoch": 6624} {"train_loss": -27.651559829711914, "global_step": 549848, "epoch": 6624} {"train_loss": -27.84663200378418, "global_step": 549849, "epoch": 6624} {"train_loss": -27.805566787719727, "global_step": 549850, "epoch": 6624} {"train_loss": -27.5053768157959, "global_step": 549851, "epoch": 6624} {"train_loss": -27.56451988220215, "global_step": 549852, "epoch": 6624} {"train_loss": -27.565908432006836, "global_step": 549853, "epoch": 6624} {"train_loss": -27.768651962280273, "global_step": 549854, "epoch": 6624} {"train_loss": -27.765640258789062, "global_step": 549855, "epoch": 6624} {"train_loss": -27.7172794342041, "global_step": 549856, "epoch": 6624} {"train_loss": -28.000802993774414, "global_step": 549857, "epoch": 6624} {"train_loss": -27.734922409057617, "global_step": 549858, "epoch": 6624} {"train_loss": -27.913888931274414, "global_step": 549859, "epoch": 6624} {"train_loss": -27.335952758789062, "global_step": 549860, "epoch": 6624} {"train_loss": -27.93341636657715, "global_step": 549861, "epoch": 6624} {"train_loss": -27.749990463256836, "global_step": 549862, "epoch": 6624} {"train_loss": -27.804672241210938, "global_step": 549863, "epoch": 6624} {"train_loss": -28.186832427978516, "global_step": 549864, "epoch": 6624} {"train_loss": -27.887847900390625, "global_step": 549865, "epoch": 6624} {"train_loss": -27.949054718017578, "global_step": 549866, "epoch": 6624} {"train_loss": -27.764989852905273, "global_step": 549867, "epoch": 6624} {"train_loss": -27.796064376831055, "global_step": 549868, "epoch": 6624} {"train_loss": -27.88873863220215, "global_step": 549869, "epoch": 6624} {"train_loss": -28.304824829101562, "global_step": 549870, "epoch": 6624} {"train_loss": -27.78260612487793, "global_step": 549871, "epoch": 6624} {"train_loss": -27.9626407623291, "global_step": 549872, "epoch": 6624} {"train_loss": -27.701032638549805, "global_step": 549873, "epoch": 6624} {"train_loss": -27.611393641276532, "global_step": 549874, "epoch": 6624, "val_loss": 6559935.0} {"train_loss": -27.194686889648438, "global_step": 549875, "epoch": 6625} {"train_loss": -27.215742111206055, "global_step": 549876, "epoch": 6625} {"train_loss": -27.297327041625977, "global_step": 549877, "epoch": 6625} {"train_loss": -26.981739044189453, "global_step": 549878, "epoch": 6625} {"train_loss": -27.179401397705078, "global_step": 549879, "epoch": 6625} {"train_loss": -26.974353790283203, "global_step": 549880, "epoch": 6625} {"train_loss": -27.290668487548828, "global_step": 549881, "epoch": 6625} {"train_loss": -27.196348190307617, "global_step": 549882, "epoch": 6625} {"train_loss": -27.30096435546875, "global_step": 549883, "epoch": 6625} {"train_loss": -27.119998931884766, "global_step": 549884, "epoch": 6625} {"train_loss": -27.0042781829834, "global_step": 549885, "epoch": 6625} {"train_loss": -27.810260772705078, "global_step": 549886, "epoch": 6625} {"train_loss": -27.070816040039062, "global_step": 549887, "epoch": 6625} {"train_loss": -27.33595848083496, "global_step": 549888, "epoch": 6625} {"train_loss": -27.079687118530273, "global_step": 549889, "epoch": 6625} {"train_loss": -27.644805908203125, "global_step": 549890, "epoch": 6625} {"train_loss": -27.400930404663086, "global_step": 549891, "epoch": 6625} {"train_loss": -27.624866485595703, "global_step": 549892, "epoch": 6625} {"train_loss": -27.941064834594727, "global_step": 549893, "epoch": 6625} {"train_loss": -27.809173583984375, "global_step": 549894, "epoch": 6625} {"train_loss": -27.637537002563477, "global_step": 549895, "epoch": 6625} {"train_loss": -27.683271408081055, "global_step": 549896, "epoch": 6625} {"train_loss": -27.878026962280273, "global_step": 549897, "epoch": 6625} {"train_loss": -27.691389083862305, "global_step": 549898, "epoch": 6625} {"train_loss": -27.87255859375, "global_step": 549899, "epoch": 6625} {"train_loss": -27.86722183227539, "global_step": 549900, "epoch": 6625} {"train_loss": -27.933551788330078, "global_step": 549901, "epoch": 6625} {"train_loss": -27.622684478759766, "global_step": 549902, "epoch": 6625} {"train_loss": -27.66936683654785, "global_step": 549903, "epoch": 6625} {"train_loss": -27.68994140625, "global_step": 549904, "epoch": 6625} {"train_loss": -28.0255184173584, "global_step": 549905, "epoch": 6625} {"train_loss": -27.5720157623291, "global_step": 549906, "epoch": 6625} {"train_loss": -27.895994186401367, "global_step": 549907, "epoch": 6625} {"train_loss": -27.6680965423584, "global_step": 549908, "epoch": 6625} {"train_loss": -28.038496017456055, "global_step": 549909, "epoch": 6625} {"train_loss": -28.014822006225586, "global_step": 549910, "epoch": 6625} {"train_loss": -27.938791275024414, "global_step": 549911, "epoch": 6625} {"train_loss": -27.275711059570312, "global_step": 549912, "epoch": 6625} {"train_loss": -28.29697036743164, "global_step": 549913, "epoch": 6625} {"train_loss": -27.694116592407227, "global_step": 549914, "epoch": 6625} {"train_loss": -27.962146759033203, "global_step": 549915, "epoch": 6625} {"train_loss": -28.080270767211914, "global_step": 549916, "epoch": 6625} {"train_loss": -28.018583297729492, "global_step": 549917, "epoch": 6625} {"train_loss": -27.734373092651367, "global_step": 549918, "epoch": 6625} {"train_loss": -27.688079833984375, "global_step": 549919, "epoch": 6625} {"train_loss": -27.702259063720703, "global_step": 549920, "epoch": 6625} {"train_loss": -27.748046875, "global_step": 549921, "epoch": 6625} {"train_loss": -28.030241012573242, "global_step": 549922, "epoch": 6625} {"train_loss": -27.80900001525879, "global_step": 549923, "epoch": 6625} {"train_loss": -27.951007843017578, "global_step": 549924, "epoch": 6625} {"train_loss": -27.842504501342773, "global_step": 549925, "epoch": 6625} {"train_loss": -27.637115478515625, "global_step": 549926, "epoch": 6625} {"train_loss": -28.067352294921875, "global_step": 549927, "epoch": 6625} {"train_loss": -27.908048629760742, "global_step": 549928, "epoch": 6625} {"train_loss": -28.19378089904785, "global_step": 549929, "epoch": 6625} {"train_loss": -27.911291122436523, "global_step": 549930, "epoch": 6625} {"train_loss": -27.679645538330078, "global_step": 549931, "epoch": 6625} {"train_loss": -28.030370712280273, "global_step": 549932, "epoch": 6625} {"train_loss": -27.606374740600586, "global_step": 549933, "epoch": 6625} {"train_loss": -27.742462158203125, "global_step": 549934, "epoch": 6625} {"train_loss": -27.581756591796875, "global_step": 549935, "epoch": 6625} {"train_loss": -26.403045654296875, "global_step": 549936, "epoch": 6625} {"train_loss": -23.594449996948242, "global_step": 549937, "epoch": 6625} {"train_loss": -22.71006965637207, "global_step": 549938, "epoch": 6625} {"train_loss": -27.072036743164062, "global_step": 549939, "epoch": 6625} {"train_loss": -25.582334518432617, "global_step": 549940, "epoch": 6625} {"train_loss": -27.04300880432129, "global_step": 549941, "epoch": 6625} {"train_loss": -25.838581085205078, "global_step": 549942, "epoch": 6625} {"train_loss": -27.22224235534668, "global_step": 549943, "epoch": 6625} {"train_loss": -26.48589515686035, "global_step": 549944, "epoch": 6625} {"train_loss": -26.829015731811523, "global_step": 549945, "epoch": 6625} {"train_loss": -26.87721824645996, "global_step": 549946, "epoch": 6625} {"train_loss": -27.089954376220703, "global_step": 549947, "epoch": 6625} {"train_loss": -26.665454864501953, "global_step": 549948, "epoch": 6625} {"train_loss": -27.030975341796875, "global_step": 549949, "epoch": 6625} {"train_loss": -26.866918563842773, "global_step": 549950, "epoch": 6625} {"train_loss": -26.626041412353516, "global_step": 549951, "epoch": 6625} {"train_loss": -27.221546173095703, "global_step": 549952, "epoch": 6625} {"train_loss": -27.308807373046875, "global_step": 549953, "epoch": 6625} {"train_loss": -26.7208251953125, "global_step": 549954, "epoch": 6625} {"train_loss": -27.47051429748535, "global_step": 549955, "epoch": 6625} {"train_loss": -27.577438354492188, "global_step": 549956, "epoch": 6625} {"train_loss": -27.364331946315534, "global_step": 549957, "epoch": 6625, "val_loss": 6611454.0} {"train_loss": -26.410776138305664, "global_step": 549958, "epoch": 6626} {"train_loss": -26.475324630737305, "global_step": 549959, "epoch": 6626} {"train_loss": -27.38441276550293, "global_step": 549960, "epoch": 6626} {"train_loss": -27.239835739135742, "global_step": 549961, "epoch": 6626} {"train_loss": -26.867395401000977, "global_step": 549962, "epoch": 6626} {"train_loss": -27.067169189453125, "global_step": 549963, "epoch": 6626} {"train_loss": -27.373477935791016, "global_step": 549964, "epoch": 6626} {"train_loss": -26.86128807067871, "global_step": 549965, "epoch": 6626} {"train_loss": -27.238554000854492, "global_step": 549966, "epoch": 6626} {"train_loss": -26.994596481323242, "global_step": 549967, "epoch": 6626} {"train_loss": -27.178192138671875, "global_step": 549968, "epoch": 6626} {"train_loss": -27.04438591003418, "global_step": 549969, "epoch": 6626} {"train_loss": -27.131610870361328, "global_step": 549970, "epoch": 6626} {"train_loss": -27.47779655456543, "global_step": 549971, "epoch": 6626} {"train_loss": -27.504316329956055, "global_step": 549972, "epoch": 6626} {"train_loss": -27.6849365234375, "global_step": 549973, "epoch": 6626} {"train_loss": -27.452688217163086, "global_step": 549974, "epoch": 6626} {"train_loss": -27.432178497314453, "global_step": 549975, "epoch": 6626} {"train_loss": -27.674108505249023, "global_step": 549976, "epoch": 6626} {"train_loss": -27.327960968017578, "global_step": 549977, "epoch": 6626} {"train_loss": -27.5982723236084, "global_step": 549978, "epoch": 6626} {"train_loss": -27.412628173828125, "global_step": 549979, "epoch": 6626} {"train_loss": -27.77557945251465, "global_step": 549980, "epoch": 6626} {"train_loss": -27.624298095703125, "global_step": 549981, "epoch": 6626} {"train_loss": -27.442432403564453, "global_step": 549982, "epoch": 6626} {"train_loss": -27.307077407836914, "global_step": 549983, "epoch": 6626} {"train_loss": -27.474470138549805, "global_step": 549984, "epoch": 6626} {"train_loss": -27.779943466186523, "global_step": 549985, "epoch": 6626} {"train_loss": -27.544702529907227, "global_step": 549986, "epoch": 6626} {"train_loss": -27.6830997467041, "global_step": 549987, "epoch": 6626} {"train_loss": -27.741559982299805, "global_step": 549988, "epoch": 6626} {"train_loss": -27.604522705078125, "global_step": 549989, "epoch": 6626} {"train_loss": -27.65199851989746, "global_step": 549990, "epoch": 6626} {"train_loss": -27.651020050048828, "global_step": 549991, "epoch": 6626} {"train_loss": -27.525482177734375, "global_step": 549992, "epoch": 6626} {"train_loss": -27.668790817260742, "global_step": 549993, "epoch": 6626} {"train_loss": -27.45867347717285, "global_step": 549994, "epoch": 6626} {"train_loss": -27.366968154907227, "global_step": 549995, "epoch": 6626} {"train_loss": -27.495832443237305, "global_step": 549996, "epoch": 6626} {"train_loss": -27.6112060546875, "global_step": 549997, "epoch": 6626} {"train_loss": -27.813831329345703, "global_step": 549998, "epoch": 6626} {"train_loss": -27.571985244750977, "global_step": 549999, "epoch": 6626} {"train_loss": -27.556182861328125, "global_step": 550000, "epoch": 6626} {"train_loss": -27.815555572509766, "global_step": 550001, "epoch": 6626} {"train_loss": -27.499267578125, "global_step": 550002, "epoch": 6626} {"train_loss": -27.85648536682129, "global_step": 550003, "epoch": 6626} {"train_loss": -28.072357177734375, "global_step": 550004, "epoch": 6626} {"train_loss": -27.635278701782227, "global_step": 550005, "epoch": 6626} {"train_loss": -28.089160919189453, "global_step": 550006, "epoch": 6626} {"train_loss": -28.032697677612305, "global_step": 550007, "epoch": 6626} {"train_loss": -27.92164421081543, "global_step": 550008, "epoch": 6626} {"train_loss": -28.23395347595215, "global_step": 550009, "epoch": 6626} {"train_loss": -27.693439483642578, "global_step": 550010, "epoch": 6626} {"train_loss": -27.642847061157227, "global_step": 550011, "epoch": 6626} {"train_loss": -28.151010513305664, "global_step": 550012, "epoch": 6626} {"train_loss": -27.64013671875, "global_step": 550013, "epoch": 6626} {"train_loss": -27.8050479888916, "global_step": 550014, "epoch": 6626} {"train_loss": -27.638214111328125, "global_step": 550015, "epoch": 6626} {"train_loss": -27.712743759155273, "global_step": 550016, "epoch": 6626} {"train_loss": -27.661361694335938, "global_step": 550017, "epoch": 6626} {"train_loss": -27.737354278564453, "global_step": 550018, "epoch": 6626} {"train_loss": -27.997745513916016, "global_step": 550019, "epoch": 6626} {"train_loss": -27.760650634765625, "global_step": 550020, "epoch": 6626} {"train_loss": -28.002790451049805, "global_step": 550021, "epoch": 6626} {"train_loss": -28.01002311706543, "global_step": 550022, "epoch": 6626} {"train_loss": -28.10041618347168, "global_step": 550023, "epoch": 6626} {"train_loss": -28.058868408203125, "global_step": 550024, "epoch": 6626} {"train_loss": -27.489246368408203, "global_step": 550025, "epoch": 6626} {"train_loss": -27.570425033569336, "global_step": 550026, "epoch": 6626} {"train_loss": -27.871734619140625, "global_step": 550027, "epoch": 6626} {"train_loss": -27.997095108032227, "global_step": 550028, "epoch": 6626} {"train_loss": -27.8330078125, "global_step": 550029, "epoch": 6626} {"train_loss": -27.590116500854492, "global_step": 550030, "epoch": 6626} {"train_loss": -28.073444366455078, "global_step": 550031, "epoch": 6626} {"train_loss": -27.664234161376953, "global_step": 550032, "epoch": 6626} {"train_loss": -27.949960708618164, "global_step": 550033, "epoch": 6626} {"train_loss": -27.91277503967285, "global_step": 550034, "epoch": 6626} {"train_loss": -27.52143669128418, "global_step": 550035, "epoch": 6626} {"train_loss": -27.60858726501465, "global_step": 550036, "epoch": 6626} {"train_loss": -27.7178897857666, "global_step": 550037, "epoch": 6626} {"train_loss": -27.717008590698242, "global_step": 550038, "epoch": 6626} {"train_loss": -27.948272705078125, "global_step": 550039, "epoch": 6626} {"train_loss": -27.589292641145637, "global_step": 550040, "epoch": 6626, "val_loss": 6615048.5} {"train_loss": -26.793542861938477, "global_step": 550041, "epoch": 6627} {"train_loss": -26.510095596313477, "global_step": 550042, "epoch": 6627} {"train_loss": -26.525999069213867, "global_step": 550043, "epoch": 6627} {"train_loss": -26.756763458251953, "global_step": 550044, "epoch": 6627} {"train_loss": -27.47821617126465, "global_step": 550045, "epoch": 6627} {"train_loss": -26.09697914123535, "global_step": 550046, "epoch": 6627} {"train_loss": -27.155776977539062, "global_step": 550047, "epoch": 6627} {"train_loss": -27.154300689697266, "global_step": 550048, "epoch": 6627} {"train_loss": -27.194339752197266, "global_step": 550049, "epoch": 6627} {"train_loss": -26.95612144470215, "global_step": 550050, "epoch": 6627} {"train_loss": -26.99932861328125, "global_step": 550051, "epoch": 6627} {"train_loss": -27.20416259765625, "global_step": 550052, "epoch": 6627} {"train_loss": -26.993383407592773, "global_step": 550053, "epoch": 6627} {"train_loss": -27.46013832092285, "global_step": 550054, "epoch": 6627} {"train_loss": -27.513586044311523, "global_step": 550055, "epoch": 6627} {"train_loss": -27.294721603393555, "global_step": 550056, "epoch": 6627} {"train_loss": -27.544921875, "global_step": 550057, "epoch": 6627} {"train_loss": -27.29056739807129, "global_step": 550058, "epoch": 6627} {"train_loss": -27.283557891845703, "global_step": 550059, "epoch": 6627} {"train_loss": -27.091962814331055, "global_step": 550060, "epoch": 6627} {"train_loss": -27.49857521057129, "global_step": 550061, "epoch": 6627} {"train_loss": -27.120691299438477, "global_step": 550062, "epoch": 6627} {"train_loss": -27.24277114868164, "global_step": 550063, "epoch": 6627} {"train_loss": -27.618946075439453, "global_step": 550064, "epoch": 6627} {"train_loss": -27.433521270751953, "global_step": 550065, "epoch": 6627} {"train_loss": -27.39837646484375, "global_step": 550066, "epoch": 6627} {"train_loss": -27.8341007232666, "global_step": 550067, "epoch": 6627} {"train_loss": -27.401952743530273, "global_step": 550068, "epoch": 6627} {"train_loss": -27.926130294799805, "global_step": 550069, "epoch": 6627} {"train_loss": -27.765867233276367, "global_step": 550070, "epoch": 6627} {"train_loss": -27.6041316986084, "global_step": 550071, "epoch": 6627} {"train_loss": -27.60761833190918, "global_step": 550072, "epoch": 6627} {"train_loss": -27.516122817993164, "global_step": 550073, "epoch": 6627} {"train_loss": -27.955387115478516, "global_step": 550074, "epoch": 6627} {"train_loss": -27.794031143188477, "global_step": 550075, "epoch": 6627} {"train_loss": -27.85260009765625, "global_step": 550076, "epoch": 6627} {"train_loss": -27.734750747680664, "global_step": 550077, "epoch": 6627} {"train_loss": -27.5341796875, "global_step": 550078, "epoch": 6627} {"train_loss": -27.335485458374023, "global_step": 550079, "epoch": 6627} {"train_loss": -27.35382080078125, "global_step": 550080, "epoch": 6627} {"train_loss": -27.623022079467773, "global_step": 550081, "epoch": 6627} {"train_loss": -27.74736976623535, "global_step": 550082, "epoch": 6627} {"train_loss": -27.78755760192871, "global_step": 550083, "epoch": 6627} {"train_loss": -27.944604873657227, "global_step": 550084, "epoch": 6627} {"train_loss": -27.837934494018555, "global_step": 550085, "epoch": 6627} {"train_loss": -27.637598037719727, "global_step": 550086, "epoch": 6627} {"train_loss": -28.150190353393555, "global_step": 550087, "epoch": 6627} {"train_loss": -27.8612003326416, "global_step": 550088, "epoch": 6627} {"train_loss": -27.722869873046875, "global_step": 550089, "epoch": 6627} {"train_loss": -28.20941162109375, "global_step": 550090, "epoch": 6627} {"train_loss": -27.583276748657227, "global_step": 550091, "epoch": 6627} {"train_loss": -27.896060943603516, "global_step": 550092, "epoch": 6627} {"train_loss": -27.72157096862793, "global_step": 550093, "epoch": 6627} {"train_loss": -27.53203773498535, "global_step": 550094, "epoch": 6627} {"train_loss": -27.928918838500977, "global_step": 550095, "epoch": 6627} {"train_loss": -28.0574893951416, "global_step": 550096, "epoch": 6627} {"train_loss": -27.808462142944336, "global_step": 550097, "epoch": 6627} {"train_loss": -27.722021102905273, "global_step": 550098, "epoch": 6627} {"train_loss": -27.91033363342285, "global_step": 550099, "epoch": 6627} {"train_loss": -27.17231559753418, "global_step": 550100, "epoch": 6627} {"train_loss": -27.508588790893555, "global_step": 550101, "epoch": 6627} {"train_loss": -27.30472183227539, "global_step": 550102, "epoch": 6627} {"train_loss": -27.55879020690918, "global_step": 550103, "epoch": 6627} {"train_loss": -27.371198654174805, "global_step": 550104, "epoch": 6627} {"train_loss": -27.21000099182129, "global_step": 550105, "epoch": 6627} {"train_loss": -27.7028751373291, "global_step": 550106, "epoch": 6627} {"train_loss": -27.7497615814209, "global_step": 550107, "epoch": 6627} {"train_loss": -27.259902954101562, "global_step": 550108, "epoch": 6627} {"train_loss": -27.798038482666016, "global_step": 550109, "epoch": 6627} {"train_loss": -27.825424194335938, "global_step": 550110, "epoch": 6627} {"train_loss": -27.3723201751709, "global_step": 550111, "epoch": 6627} {"train_loss": -27.827802658081055, "global_step": 550112, "epoch": 6627} {"train_loss": -27.884267807006836, "global_step": 550113, "epoch": 6627} {"train_loss": -27.491043090820312, "global_step": 550114, "epoch": 6627} {"train_loss": -27.647825241088867, "global_step": 550115, "epoch": 6627} {"train_loss": -27.637311935424805, "global_step": 550116, "epoch": 6627} {"train_loss": -27.761035919189453, "global_step": 550117, "epoch": 6627} {"train_loss": -27.708484649658203, "global_step": 550118, "epoch": 6627} {"train_loss": -27.85686683654785, "global_step": 550119, "epoch": 6627} {"train_loss": -27.819150924682617, "global_step": 550120, "epoch": 6627} {"train_loss": -28.19943618774414, "global_step": 550121, "epoch": 6627} {"train_loss": -27.79506492614746, "global_step": 550122, "epoch": 6627} {"train_loss": -27.529381832444525, "global_step": 550123, "epoch": 6627, "val_loss": 6556219.0} {"train_loss": -27.36829948425293, "global_step": 550124, "epoch": 6628} {"train_loss": -27.461578369140625, "global_step": 550125, "epoch": 6628} {"train_loss": -27.049030303955078, "global_step": 550126, "epoch": 6628} {"train_loss": -27.68836784362793, "global_step": 550127, "epoch": 6628} {"train_loss": -26.821582794189453, "global_step": 550128, "epoch": 6628} {"train_loss": -27.40641212463379, "global_step": 550129, "epoch": 6628} {"train_loss": -27.561243057250977, "global_step": 550130, "epoch": 6628} {"train_loss": -27.023054122924805, "global_step": 550131, "epoch": 6628} {"train_loss": -27.180662155151367, "global_step": 550132, "epoch": 6628} {"train_loss": -27.812658309936523, "global_step": 550133, "epoch": 6628} {"train_loss": -27.391910552978516, "global_step": 550134, "epoch": 6628} {"train_loss": -27.56662368774414, "global_step": 550135, "epoch": 6628} {"train_loss": -27.34869384765625, "global_step": 550136, "epoch": 6628} {"train_loss": -27.913166046142578, "global_step": 550137, "epoch": 6628} {"train_loss": -27.419586181640625, "global_step": 550138, "epoch": 6628} {"train_loss": -27.47121238708496, "global_step": 550139, "epoch": 6628} {"train_loss": -27.667993545532227, "global_step": 550140, "epoch": 6628} {"train_loss": -27.429962158203125, "global_step": 550141, "epoch": 6628} {"train_loss": -27.861310958862305, "global_step": 550142, "epoch": 6628} {"train_loss": -27.5343017578125, "global_step": 550143, "epoch": 6628} {"train_loss": -27.6024227142334, "global_step": 550144, "epoch": 6628} {"train_loss": -27.57622718811035, "global_step": 550145, "epoch": 6628} {"train_loss": -27.255353927612305, "global_step": 550146, "epoch": 6628} {"train_loss": -27.65399169921875, "global_step": 550147, "epoch": 6628} {"train_loss": -27.845441818237305, "global_step": 550148, "epoch": 6628} {"train_loss": -27.54141616821289, "global_step": 550149, "epoch": 6628} {"train_loss": -27.669336318969727, "global_step": 550150, "epoch": 6628} {"train_loss": -27.78070640563965, "global_step": 550151, "epoch": 6628} {"train_loss": -27.8581600189209, "global_step": 550152, "epoch": 6628} {"train_loss": -27.90424156188965, "global_step": 550153, "epoch": 6628} {"train_loss": -27.509618759155273, "global_step": 550154, "epoch": 6628} {"train_loss": -27.623260498046875, "global_step": 550155, "epoch": 6628} {"train_loss": -27.8808650970459, "global_step": 550156, "epoch": 6628} {"train_loss": -27.523977279663086, "global_step": 550157, "epoch": 6628} {"train_loss": -27.951345443725586, "global_step": 550158, "epoch": 6628} {"train_loss": -28.144702911376953, "global_step": 550159, "epoch": 6628} {"train_loss": -28.07306480407715, "global_step": 550160, "epoch": 6628} {"train_loss": -27.655542373657227, "global_step": 550161, "epoch": 6628} {"train_loss": -27.645187377929688, "global_step": 550162, "epoch": 6628} {"train_loss": -27.664587020874023, "global_step": 550163, "epoch": 6628} {"train_loss": -27.545886993408203, "global_step": 550164, "epoch": 6628} {"train_loss": -27.849166870117188, "global_step": 550165, "epoch": 6628} {"train_loss": -27.7734432220459, "global_step": 550166, "epoch": 6628} {"train_loss": -28.198331832885742, "global_step": 550167, "epoch": 6628} {"train_loss": -27.490863800048828, "global_step": 550168, "epoch": 6628} {"train_loss": -27.8459529876709, "global_step": 550169, "epoch": 6628} {"train_loss": -28.2204532623291, "global_step": 550170, "epoch": 6628} {"train_loss": -27.914936065673828, "global_step": 550171, "epoch": 6628} {"train_loss": -27.874807357788086, "global_step": 550172, "epoch": 6628} {"train_loss": -27.75068473815918, "global_step": 550173, "epoch": 6628} {"train_loss": -28.050390243530273, "global_step": 550174, "epoch": 6628} {"train_loss": -27.817169189453125, "global_step": 550175, "epoch": 6628} {"train_loss": -27.077442169189453, "global_step": 550176, "epoch": 6628} {"train_loss": -27.987451553344727, "global_step": 550177, "epoch": 6628} {"train_loss": -27.752761840820312, "global_step": 550178, "epoch": 6628} {"train_loss": -27.732452392578125, "global_step": 550179, "epoch": 6628} {"train_loss": -27.752347946166992, "global_step": 550180, "epoch": 6628} {"train_loss": -27.1379337310791, "global_step": 550181, "epoch": 6628} {"train_loss": -27.4991455078125, "global_step": 550182, "epoch": 6628} {"train_loss": -27.310346603393555, "global_step": 550183, "epoch": 6628} {"train_loss": -27.457050323486328, "global_step": 550184, "epoch": 6628} {"train_loss": -27.527099609375, "global_step": 550185, "epoch": 6628} {"train_loss": -26.71695899963379, "global_step": 550186, "epoch": 6628} {"train_loss": -27.81671714782715, "global_step": 550187, "epoch": 6628} {"train_loss": -27.43534278869629, "global_step": 550188, "epoch": 6628} {"train_loss": -27.47327995300293, "global_step": 550189, "epoch": 6628} {"train_loss": -27.466772079467773, "global_step": 550190, "epoch": 6628} {"train_loss": -27.73828125, "global_step": 550191, "epoch": 6628} {"train_loss": -27.257022857666016, "global_step": 550192, "epoch": 6628} {"train_loss": -27.389789581298828, "global_step": 550193, "epoch": 6628} {"train_loss": -27.499469757080078, "global_step": 550194, "epoch": 6628} {"train_loss": -27.718128204345703, "global_step": 550195, "epoch": 6628} {"train_loss": -27.7878475189209, "global_step": 550196, "epoch": 6628} {"train_loss": -27.237836837768555, "global_step": 550197, "epoch": 6628} {"train_loss": -28.076770782470703, "global_step": 550198, "epoch": 6628} {"train_loss": -27.595020294189453, "global_step": 550199, "epoch": 6628} {"train_loss": -27.451709747314453, "global_step": 550200, "epoch": 6628} {"train_loss": -27.35271644592285, "global_step": 550201, "epoch": 6628} {"train_loss": -27.76059913635254, "global_step": 550202, "epoch": 6628} {"train_loss": -27.549823760986328, "global_step": 550203, "epoch": 6628} {"train_loss": -27.65069580078125, "global_step": 550204, "epoch": 6628} {"train_loss": -27.325519561767578, "global_step": 550205, "epoch": 6628} {"train_loss": -27.60086227325072, "global_step": 550206, "epoch": 6628, "val_loss": 6628095.0} {"train_loss": -27.363439559936523, "global_step": 550207, "epoch": 6629} {"train_loss": -27.19292640686035, "global_step": 550208, "epoch": 6629} {"train_loss": -26.989185333251953, "global_step": 550209, "epoch": 6629} {"train_loss": -27.16868019104004, "global_step": 550210, "epoch": 6629} {"train_loss": -27.66969871520996, "global_step": 550211, "epoch": 6629} {"train_loss": -27.158239364624023, "global_step": 550212, "epoch": 6629} {"train_loss": -27.42669677734375, "global_step": 550213, "epoch": 6629} {"train_loss": -27.520618438720703, "global_step": 550214, "epoch": 6629} {"train_loss": -27.7187442779541, "global_step": 550215, "epoch": 6629} {"train_loss": -27.25927734375, "global_step": 550216, "epoch": 6629} {"train_loss": -26.671838760375977, "global_step": 550217, "epoch": 6629} {"train_loss": -26.775100708007812, "global_step": 550218, "epoch": 6629} {"train_loss": -27.3922176361084, "global_step": 550219, "epoch": 6629} {"train_loss": -27.19276237487793, "global_step": 550220, "epoch": 6629} {"train_loss": -27.457178115844727, "global_step": 550221, "epoch": 6629} {"train_loss": -27.776168823242188, "global_step": 550222, "epoch": 6629} {"train_loss": -27.68268394470215, "global_step": 550223, "epoch": 6629} {"train_loss": -27.01723289489746, "global_step": 550224, "epoch": 6629} {"train_loss": -27.04585838317871, "global_step": 550225, "epoch": 6629} {"train_loss": -27.462604522705078, "global_step": 550226, "epoch": 6629} {"train_loss": -27.22536277770996, "global_step": 550227, "epoch": 6629} {"train_loss": -27.605154037475586, "global_step": 550228, "epoch": 6629} {"train_loss": -27.329254150390625, "global_step": 550229, "epoch": 6629} {"train_loss": -27.508865356445312, "global_step": 550230, "epoch": 6629} {"train_loss": -27.433902740478516, "global_step": 550231, "epoch": 6629} {"train_loss": -27.942142486572266, "global_step": 550232, "epoch": 6629} {"train_loss": -27.878896713256836, "global_step": 550233, "epoch": 6629} {"train_loss": -27.560510635375977, "global_step": 550234, "epoch": 6629} {"train_loss": -27.2401180267334, "global_step": 550235, "epoch": 6629} {"train_loss": -27.488052368164062, "global_step": 550236, "epoch": 6629} {"train_loss": -27.612035751342773, "global_step": 550237, "epoch": 6629} {"train_loss": -27.688785552978516, "global_step": 550238, "epoch": 6629} {"train_loss": -27.19691276550293, "global_step": 550239, "epoch": 6629} {"train_loss": -27.68975830078125, "global_step": 550240, "epoch": 6629} {"train_loss": -27.466001510620117, "global_step": 550241, "epoch": 6629} {"train_loss": -27.847761154174805, "global_step": 550242, "epoch": 6629} {"train_loss": -27.796789169311523, "global_step": 550243, "epoch": 6629} {"train_loss": -27.885950088500977, "global_step": 550244, "epoch": 6629} {"train_loss": -27.645954132080078, "global_step": 550245, "epoch": 6629} {"train_loss": -28.05597496032715, "global_step": 550246, "epoch": 6629} {"train_loss": -27.902328491210938, "global_step": 550247, "epoch": 6629} {"train_loss": -27.735013961791992, "global_step": 550248, "epoch": 6629} {"train_loss": -27.617475509643555, "global_step": 550249, "epoch": 6629} {"train_loss": -27.944543838500977, "global_step": 550250, "epoch": 6629} {"train_loss": -27.8640193939209, "global_step": 550251, "epoch": 6629} {"train_loss": -27.90536880493164, "global_step": 550252, "epoch": 6629} {"train_loss": -27.37640380859375, "global_step": 550253, "epoch": 6629} {"train_loss": -28.041494369506836, "global_step": 550254, "epoch": 6629} {"train_loss": -27.55222511291504, "global_step": 550255, "epoch": 6629} {"train_loss": -27.883441925048828, "global_step": 550256, "epoch": 6629} {"train_loss": -28.103689193725586, "global_step": 550257, "epoch": 6629} {"train_loss": -27.573139190673828, "global_step": 550258, "epoch": 6629} {"train_loss": -27.636621475219727, "global_step": 550259, "epoch": 6629} {"train_loss": -27.833826065063477, "global_step": 550260, "epoch": 6629} {"train_loss": -27.691858291625977, "global_step": 550261, "epoch": 6629} {"train_loss": -28.204275131225586, "global_step": 550262, "epoch": 6629} {"train_loss": -28.1008243560791, "global_step": 550263, "epoch": 6629} {"train_loss": -27.616607666015625, "global_step": 550264, "epoch": 6629} {"train_loss": -27.507465362548828, "global_step": 550265, "epoch": 6629} {"train_loss": -27.379117965698242, "global_step": 550266, "epoch": 6629} {"train_loss": -27.431760787963867, "global_step": 550267, "epoch": 6629} {"train_loss": -27.816076278686523, "global_step": 550268, "epoch": 6629} {"train_loss": -27.66594886779785, "global_step": 550269, "epoch": 6629} {"train_loss": -27.84817886352539, "global_step": 550270, "epoch": 6629} {"train_loss": -27.70380210876465, "global_step": 550271, "epoch": 6629} {"train_loss": -27.559402465820312, "global_step": 550272, "epoch": 6629} {"train_loss": -27.702253341674805, "global_step": 550273, "epoch": 6629} {"train_loss": -27.640689849853516, "global_step": 550274, "epoch": 6629} {"train_loss": -27.62928581237793, "global_step": 550275, "epoch": 6629} {"train_loss": -27.791065216064453, "global_step": 550276, "epoch": 6629} {"train_loss": -27.20476722717285, "global_step": 550277, "epoch": 6629} {"train_loss": -27.6483097076416, "global_step": 550278, "epoch": 6629} {"train_loss": -27.6380672454834, "global_step": 550279, "epoch": 6629} {"train_loss": -27.486291885375977, "global_step": 550280, "epoch": 6629} {"train_loss": -27.84345817565918, "global_step": 550281, "epoch": 6629} {"train_loss": -27.656675338745117, "global_step": 550282, "epoch": 6629} {"train_loss": -27.694482803344727, "global_step": 550283, "epoch": 6629} {"train_loss": -27.566165924072266, "global_step": 550284, "epoch": 6629} {"train_loss": -27.509326934814453, "global_step": 550285, "epoch": 6629} {"train_loss": -27.58938980102539, "global_step": 550286, "epoch": 6629} {"train_loss": -28.021230697631836, "global_step": 550287, "epoch": 6629} {"train_loss": -27.61604118347168, "global_step": 550288, "epoch": 6629} {"train_loss": -27.605982102543475, "global_step": 550289, "epoch": 6629, "val_loss": 6696263.5} {"train_loss": -27.029891967773438, "global_step": 550290, "epoch": 6630} {"train_loss": -26.397253036499023, "global_step": 550291, "epoch": 6630} {"train_loss": -27.253326416015625, "global_step": 550292, "epoch": 6630} {"train_loss": -27.3582820892334, "global_step": 550293, "epoch": 6630} {"train_loss": -27.0914249420166, "global_step": 550294, "epoch": 6630} {"train_loss": -27.351057052612305, "global_step": 550295, "epoch": 6630} {"train_loss": -27.269989013671875, "global_step": 550296, "epoch": 6630} {"train_loss": -27.26270866394043, "global_step": 550297, "epoch": 6630} {"train_loss": -27.567367553710938, "global_step": 550298, "epoch": 6630} {"train_loss": -27.444726943969727, "global_step": 550299, "epoch": 6630} {"train_loss": -27.364599227905273, "global_step": 550300, "epoch": 6630} {"train_loss": -27.48520851135254, "global_step": 550301, "epoch": 6630} {"train_loss": -27.59870719909668, "global_step": 550302, "epoch": 6630} {"train_loss": -27.60433006286621, "global_step": 550303, "epoch": 6630} {"train_loss": -27.5316104888916, "global_step": 550304, "epoch": 6630} {"train_loss": -27.580158233642578, "global_step": 550305, "epoch": 6630} {"train_loss": -27.42474365234375, "global_step": 550306, "epoch": 6630} {"train_loss": -27.199127197265625, "global_step": 550307, "epoch": 6630} {"train_loss": -27.475711822509766, "global_step": 550308, "epoch": 6630} {"train_loss": -27.574827194213867, "global_step": 550309, "epoch": 6630} {"train_loss": -27.887853622436523, "global_step": 550310, "epoch": 6630} {"train_loss": -27.184003829956055, "global_step": 550311, "epoch": 6630} {"train_loss": -27.361364364624023, "global_step": 550312, "epoch": 6630} {"train_loss": -27.1245059967041, "global_step": 550313, "epoch": 6630} {"train_loss": -27.778411865234375, "global_step": 550314, "epoch": 6630} {"train_loss": -27.465576171875, "global_step": 550315, "epoch": 6630} {"train_loss": -27.842878341674805, "global_step": 550316, "epoch": 6630} {"train_loss": -27.84150505065918, "global_step": 550317, "epoch": 6630} {"train_loss": -27.495025634765625, "global_step": 550318, "epoch": 6630} {"train_loss": -27.558319091796875, "global_step": 550319, "epoch": 6630} {"train_loss": -27.883092880249023, "global_step": 550320, "epoch": 6630} {"train_loss": -27.813568115234375, "global_step": 550321, "epoch": 6630} {"train_loss": -28.00971031188965, "global_step": 550322, "epoch": 6630} {"train_loss": -27.945438385009766, "global_step": 550323, "epoch": 6630} {"train_loss": -27.705957412719727, "global_step": 550324, "epoch": 6630} {"train_loss": -27.727127075195312, "global_step": 550325, "epoch": 6630} {"train_loss": -27.727130889892578, "global_step": 550326, "epoch": 6630} {"train_loss": -27.651187896728516, "global_step": 550327, "epoch": 6630} {"train_loss": -27.719614028930664, "global_step": 550328, "epoch": 6630} {"train_loss": -27.614044189453125, "global_step": 550329, "epoch": 6630} {"train_loss": -27.939313888549805, "global_step": 550330, "epoch": 6630} {"train_loss": -27.62396812438965, "global_step": 550331, "epoch": 6630} {"train_loss": -27.972930908203125, "global_step": 550332, "epoch": 6630} {"train_loss": -28.119775772094727, "global_step": 550333, "epoch": 6630} {"train_loss": -27.253570556640625, "global_step": 550334, "epoch": 6630} {"train_loss": -27.921157836914062, "global_step": 550335, "epoch": 6630} {"train_loss": -27.856298446655273, "global_step": 550336, "epoch": 6630} {"train_loss": -27.76751708984375, "global_step": 550337, "epoch": 6630} {"train_loss": -27.761850357055664, "global_step": 550338, "epoch": 6630} {"train_loss": -27.65389060974121, "global_step": 550339, "epoch": 6630} {"train_loss": -28.083316802978516, "global_step": 550340, "epoch": 6630} {"train_loss": -28.074460983276367, "global_step": 550341, "epoch": 6630} {"train_loss": -27.98579216003418, "global_step": 550342, "epoch": 6630} {"train_loss": -27.850143432617188, "global_step": 550343, "epoch": 6630} {"train_loss": -27.8769588470459, "global_step": 550344, "epoch": 6630} {"train_loss": -27.574161529541016, "global_step": 550345, "epoch": 6630} {"train_loss": -27.920347213745117, "global_step": 550346, "epoch": 6630} {"train_loss": -27.995969772338867, "global_step": 550347, "epoch": 6630} {"train_loss": -27.97932243347168, "global_step": 550348, "epoch": 6630} {"train_loss": -27.54493522644043, "global_step": 550349, "epoch": 6630} {"train_loss": -27.5371150970459, "global_step": 550350, "epoch": 6630} {"train_loss": -27.4532527923584, "global_step": 550351, "epoch": 6630} {"train_loss": -27.291534423828125, "global_step": 550352, "epoch": 6630} {"train_loss": -27.553537368774414, "global_step": 550353, "epoch": 6630} {"train_loss": -27.905736923217773, "global_step": 550354, "epoch": 6630} {"train_loss": -27.928083419799805, "global_step": 550355, "epoch": 6630} {"train_loss": -28.06435203552246, "global_step": 550356, "epoch": 6630} {"train_loss": -27.702131271362305, "global_step": 550357, "epoch": 6630} {"train_loss": -28.40582847595215, "global_step": 550358, "epoch": 6630} {"train_loss": -28.15656089782715, "global_step": 550359, "epoch": 6630} {"train_loss": -28.0018310546875, "global_step": 550360, "epoch": 6630} {"train_loss": -27.67816162109375, "global_step": 550361, "epoch": 6630} {"train_loss": -27.743457794189453, "global_step": 550362, "epoch": 6630} {"train_loss": -28.06424903869629, "global_step": 550363, "epoch": 6630} {"train_loss": -27.308837890625, "global_step": 550364, "epoch": 6630} {"train_loss": -27.78462028503418, "global_step": 550365, "epoch": 6630} {"train_loss": -27.795703887939453, "global_step": 550366, "epoch": 6630} {"train_loss": -27.54791831970215, "global_step": 550367, "epoch": 6630} {"train_loss": -27.54248046875, "global_step": 550368, "epoch": 6630} {"train_loss": -27.49930191040039, "global_step": 550369, "epoch": 6630} {"train_loss": -27.80475425720215, "global_step": 550370, "epoch": 6630} {"train_loss": -27.802270889282227, "global_step": 550371, "epoch": 6630} {"train_loss": -27.654182640902967, "global_step": 550372, "epoch": 6630, "val_loss": 6733426.0} {"train_loss": -28.020370483398438, "global_step": 550373, "epoch": 6631} {"train_loss": -27.792280197143555, "global_step": 550374, "epoch": 6631} {"train_loss": -27.198486328125, "global_step": 550375, "epoch": 6631} {"train_loss": -27.590368270874023, "global_step": 550376, "epoch": 6631} {"train_loss": -27.36221694946289, "global_step": 550377, "epoch": 6631} {"train_loss": -28.124235153198242, "global_step": 550378, "epoch": 6631} {"train_loss": -27.539718627929688, "global_step": 550379, "epoch": 6631} {"train_loss": -27.2928466796875, "global_step": 550380, "epoch": 6631} {"train_loss": -27.226160049438477, "global_step": 550381, "epoch": 6631} {"train_loss": -27.698673248291016, "global_step": 550382, "epoch": 6631} {"train_loss": -27.32430076599121, "global_step": 550383, "epoch": 6631} {"train_loss": -27.531604766845703, "global_step": 550384, "epoch": 6631} {"train_loss": -27.61625099182129, "global_step": 550385, "epoch": 6631} {"train_loss": -27.911237716674805, "global_step": 550386, "epoch": 6631} {"train_loss": -26.99586296081543, "global_step": 550387, "epoch": 6631} {"train_loss": -27.14784812927246, "global_step": 550388, "epoch": 6631} {"train_loss": -27.68025016784668, "global_step": 550389, "epoch": 6631} {"train_loss": -27.79144859313965, "global_step": 550390, "epoch": 6631} {"train_loss": -27.690643310546875, "global_step": 550391, "epoch": 6631} {"train_loss": -27.4613094329834, "global_step": 550392, "epoch": 6631} {"train_loss": -27.5469913482666, "global_step": 550393, "epoch": 6631} {"train_loss": -27.96781349182129, "global_step": 550394, "epoch": 6631} {"train_loss": -28.013381958007812, "global_step": 550395, "epoch": 6631} {"train_loss": -27.859882354736328, "global_step": 550396, "epoch": 6631} {"train_loss": -27.49334716796875, "global_step": 550397, "epoch": 6631} {"train_loss": -27.715402603149414, "global_step": 550398, "epoch": 6631} {"train_loss": -27.467700958251953, "global_step": 550399, "epoch": 6631} {"train_loss": -27.993732452392578, "global_step": 550400, "epoch": 6631} {"train_loss": -27.80621910095215, "global_step": 550401, "epoch": 6631} {"train_loss": -27.92091941833496, "global_step": 550402, "epoch": 6631} {"train_loss": -28.17291831970215, "global_step": 550403, "epoch": 6631} {"train_loss": -28.151966094970703, "global_step": 550404, "epoch": 6631} {"train_loss": -28.199613571166992, "global_step": 550405, "epoch": 6631} {"train_loss": -27.92704200744629, "global_step": 550406, "epoch": 6631} {"train_loss": -27.898181915283203, "global_step": 550407, "epoch": 6631} {"train_loss": -27.823795318603516, "global_step": 550408, "epoch": 6631} {"train_loss": -27.9361572265625, "global_step": 550409, "epoch": 6631} {"train_loss": -27.695831298828125, "global_step": 550410, "epoch": 6631} {"train_loss": -27.803197860717773, "global_step": 550411, "epoch": 6631} {"train_loss": -27.484134674072266, "global_step": 550412, "epoch": 6631} {"train_loss": -27.830677032470703, "global_step": 550413, "epoch": 6631} {"train_loss": -27.890066146850586, "global_step": 550414, "epoch": 6631} {"train_loss": -28.076587677001953, "global_step": 550415, "epoch": 6631} {"train_loss": -27.779708862304688, "global_step": 550416, "epoch": 6631} {"train_loss": -27.65984535217285, "global_step": 550417, "epoch": 6631} {"train_loss": -27.608932495117188, "global_step": 550418, "epoch": 6631} {"train_loss": -27.606128692626953, "global_step": 550419, "epoch": 6631} {"train_loss": -27.597864151000977, "global_step": 550420, "epoch": 6631} {"train_loss": -27.524688720703125, "global_step": 550421, "epoch": 6631} {"train_loss": -27.539525985717773, "global_step": 550422, "epoch": 6631} {"train_loss": -27.43317222595215, "global_step": 550423, "epoch": 6631} {"train_loss": -27.628198623657227, "global_step": 550424, "epoch": 6631} {"train_loss": -27.673704147338867, "global_step": 550425, "epoch": 6631} {"train_loss": -27.65166664123535, "global_step": 550426, "epoch": 6631} {"train_loss": -27.595117568969727, "global_step": 550427, "epoch": 6631} {"train_loss": -27.226816177368164, "global_step": 550428, "epoch": 6631} {"train_loss": -27.516666412353516, "global_step": 550429, "epoch": 6631} {"train_loss": -27.76966667175293, "global_step": 550430, "epoch": 6631} {"train_loss": -27.66537857055664, "global_step": 550431, "epoch": 6631} {"train_loss": -27.40155029296875, "global_step": 550432, "epoch": 6631} {"train_loss": -27.56110954284668, "global_step": 550433, "epoch": 6631} {"train_loss": -27.3223819732666, "global_step": 550434, "epoch": 6631} {"train_loss": -27.8267765045166, "global_step": 550435, "epoch": 6631} {"train_loss": -27.530227661132812, "global_step": 550436, "epoch": 6631} {"train_loss": -27.708402633666992, "global_step": 550437, "epoch": 6631} {"train_loss": -27.965429306030273, "global_step": 550438, "epoch": 6631} {"train_loss": -27.509521484375, "global_step": 550439, "epoch": 6631} {"train_loss": -27.75739097595215, "global_step": 550440, "epoch": 6631} {"train_loss": -27.5499324798584, "global_step": 550441, "epoch": 6631} {"train_loss": -27.887176513671875, "global_step": 550442, "epoch": 6631} {"train_loss": -27.7379150390625, "global_step": 550443, "epoch": 6631} {"train_loss": -28.228469848632812, "global_step": 550444, "epoch": 6631} {"train_loss": -27.525907516479492, "global_step": 550445, "epoch": 6631} {"train_loss": -27.806726455688477, "global_step": 550446, "epoch": 6631} {"train_loss": -27.641489028930664, "global_step": 550447, "epoch": 6631} {"train_loss": -28.031728744506836, "global_step": 550448, "epoch": 6631} {"train_loss": -27.636917114257812, "global_step": 550449, "epoch": 6631} {"train_loss": -27.658246994018555, "global_step": 550450, "epoch": 6631} {"train_loss": -28.106237411499023, "global_step": 550451, "epoch": 6631} {"train_loss": -27.515100479125977, "global_step": 550452, "epoch": 6631} {"train_loss": -27.850439071655273, "global_step": 550453, "epoch": 6631} {"train_loss": -27.91962242126465, "global_step": 550454, "epoch": 6631} {"train_loss": -27.675157937658838, "global_step": 550455, "epoch": 6631, "val_loss": 6711103.5} {"train_loss": -26.85799217224121, "global_step": 550456, "epoch": 6632} {"train_loss": -26.242334365844727, "global_step": 550457, "epoch": 6632} {"train_loss": -26.50778579711914, "global_step": 550458, "epoch": 6632} {"train_loss": -27.084848403930664, "global_step": 550459, "epoch": 6632} {"train_loss": -26.001333236694336, "global_step": 550460, "epoch": 6632} {"train_loss": -26.97714614868164, "global_step": 550461, "epoch": 6632} {"train_loss": -26.632980346679688, "global_step": 550462, "epoch": 6632} {"train_loss": -26.56892967224121, "global_step": 550463, "epoch": 6632} {"train_loss": -26.585662841796875, "global_step": 550464, "epoch": 6632} {"train_loss": -27.288013458251953, "global_step": 550465, "epoch": 6632} {"train_loss": -27.30216407775879, "global_step": 550466, "epoch": 6632} {"train_loss": -27.108388900756836, "global_step": 550467, "epoch": 6632} {"train_loss": -27.27496910095215, "global_step": 550468, "epoch": 6632} {"train_loss": -26.572874069213867, "global_step": 550469, "epoch": 6632} {"train_loss": -27.533172607421875, "global_step": 550470, "epoch": 6632} {"train_loss": -27.0119686126709, "global_step": 550471, "epoch": 6632} {"train_loss": -27.157424926757812, "global_step": 550472, "epoch": 6632} {"train_loss": -26.941293716430664, "global_step": 550473, "epoch": 6632} {"train_loss": -27.0797176361084, "global_step": 550474, "epoch": 6632} {"train_loss": -27.258209228515625, "global_step": 550475, "epoch": 6632} {"train_loss": -27.593534469604492, "global_step": 550476, "epoch": 6632} {"train_loss": -27.351318359375, "global_step": 550477, "epoch": 6632} {"train_loss": -27.346240997314453, "global_step": 550478, "epoch": 6632} {"train_loss": -27.505640029907227, "global_step": 550479, "epoch": 6632} {"train_loss": -27.47397232055664, "global_step": 550480, "epoch": 6632} {"train_loss": -28.042911529541016, "global_step": 550481, "epoch": 6632} {"train_loss": -27.33880615234375, "global_step": 550482, "epoch": 6632} {"train_loss": -27.689254760742188, "global_step": 550483, "epoch": 6632} {"train_loss": -27.68475341796875, "global_step": 550484, "epoch": 6632} {"train_loss": -27.559030532836914, "global_step": 550485, "epoch": 6632} {"train_loss": -27.519214630126953, "global_step": 550486, "epoch": 6632} {"train_loss": -27.817907333374023, "global_step": 550487, "epoch": 6632} {"train_loss": -27.718297958374023, "global_step": 550488, "epoch": 6632} {"train_loss": -27.583120346069336, "global_step": 550489, "epoch": 6632} {"train_loss": -27.591169357299805, "global_step": 550490, "epoch": 6632} {"train_loss": -27.89337158203125, "global_step": 550491, "epoch": 6632} {"train_loss": -27.63214111328125, "global_step": 550492, "epoch": 6632} {"train_loss": -27.780414581298828, "global_step": 550493, "epoch": 6632} {"train_loss": -27.729999542236328, "global_step": 550494, "epoch": 6632} {"train_loss": -27.99403190612793, "global_step": 550495, "epoch": 6632} {"train_loss": -27.8896541595459, "global_step": 550496, "epoch": 6632} {"train_loss": -27.767337799072266, "global_step": 550497, "epoch": 6632} {"train_loss": -27.981592178344727, "global_step": 550498, "epoch": 6632} {"train_loss": -27.751026153564453, "global_step": 550499, "epoch": 6632} {"train_loss": -27.645109176635742, "global_step": 550500, "epoch": 6632} {"train_loss": -27.364856719970703, "global_step": 550501, "epoch": 6632} {"train_loss": -27.9989070892334, "global_step": 550502, "epoch": 6632} {"train_loss": -27.644201278686523, "global_step": 550503, "epoch": 6632} {"train_loss": -27.960861206054688, "global_step": 550504, "epoch": 6632} {"train_loss": -27.93580436706543, "global_step": 550505, "epoch": 6632} {"train_loss": -28.062925338745117, "global_step": 550506, "epoch": 6632} {"train_loss": -27.76894187927246, "global_step": 550507, "epoch": 6632} {"train_loss": -27.725086212158203, "global_step": 550508, "epoch": 6632} {"train_loss": -28.141382217407227, "global_step": 550509, "epoch": 6632} {"train_loss": -27.852285385131836, "global_step": 550510, "epoch": 6632} {"train_loss": -27.74690055847168, "global_step": 550511, "epoch": 6632} {"train_loss": -27.49310302734375, "global_step": 550512, "epoch": 6632} {"train_loss": -27.69142723083496, "global_step": 550513, "epoch": 6632} {"train_loss": -27.931751251220703, "global_step": 550514, "epoch": 6632} {"train_loss": -27.834457397460938, "global_step": 550515, "epoch": 6632} {"train_loss": -27.489206314086914, "global_step": 550516, "epoch": 6632} {"train_loss": -27.8007869720459, "global_step": 550517, "epoch": 6632} {"train_loss": -28.159759521484375, "global_step": 550518, "epoch": 6632} {"train_loss": -27.932525634765625, "global_step": 550519, "epoch": 6632} {"train_loss": -27.601789474487305, "global_step": 550520, "epoch": 6632} {"train_loss": -27.797504425048828, "global_step": 550521, "epoch": 6632} {"train_loss": -27.72190284729004, "global_step": 550522, "epoch": 6632} {"train_loss": -27.446561813354492, "global_step": 550523, "epoch": 6632} {"train_loss": -27.372802734375, "global_step": 550524, "epoch": 6632} {"train_loss": -27.7733154296875, "global_step": 550525, "epoch": 6632} {"train_loss": -28.01953125, "global_step": 550526, "epoch": 6632} {"train_loss": -27.773900985717773, "global_step": 550527, "epoch": 6632} {"train_loss": -27.994007110595703, "global_step": 550528, "epoch": 6632} {"train_loss": -27.978368759155273, "global_step": 550529, "epoch": 6632} {"train_loss": -27.80316734313965, "global_step": 550530, "epoch": 6632} {"train_loss": -28.325220108032227, "global_step": 550531, "epoch": 6632} {"train_loss": -28.013952255249023, "global_step": 550532, "epoch": 6632} {"train_loss": -27.894128799438477, "global_step": 550533, "epoch": 6632} {"train_loss": -27.8546085357666, "global_step": 550534, "epoch": 6632} {"train_loss": -27.69306755065918, "global_step": 550535, "epoch": 6632} {"train_loss": -27.676427841186523, "global_step": 550536, "epoch": 6632} {"train_loss": -27.6337890625, "global_step": 550537, "epoch": 6632} {"train_loss": -27.546957061951417, "global_step": 550538, "epoch": 6632, "val_loss": 6701683.0} {"train_loss": -27.1509952545166, "global_step": 550539, "epoch": 6633} {"train_loss": -26.16196632385254, "global_step": 550540, "epoch": 6633} {"train_loss": -26.1644344329834, "global_step": 550541, "epoch": 6633} {"train_loss": -27.281082153320312, "global_step": 550542, "epoch": 6633} {"train_loss": -27.286802291870117, "global_step": 550543, "epoch": 6633} {"train_loss": -26.7387752532959, "global_step": 550544, "epoch": 6633} {"train_loss": -27.406110763549805, "global_step": 550545, "epoch": 6633} {"train_loss": -26.79383659362793, "global_step": 550546, "epoch": 6633} {"train_loss": -27.28580093383789, "global_step": 550547, "epoch": 6633} {"train_loss": -27.138086318969727, "global_step": 550548, "epoch": 6633} {"train_loss": -27.416181564331055, "global_step": 550549, "epoch": 6633} {"train_loss": -27.10365867614746, "global_step": 550550, "epoch": 6633} {"train_loss": -27.219533920288086, "global_step": 550551, "epoch": 6633} {"train_loss": -26.871931076049805, "global_step": 550552, "epoch": 6633} {"train_loss": -27.37977409362793, "global_step": 550553, "epoch": 6633} {"train_loss": -26.928394317626953, "global_step": 550554, "epoch": 6633} {"train_loss": -27.546518325805664, "global_step": 550555, "epoch": 6633} {"train_loss": -27.164106369018555, "global_step": 550556, "epoch": 6633} {"train_loss": -27.570667266845703, "global_step": 550557, "epoch": 6633} {"train_loss": -26.990808486938477, "global_step": 550558, "epoch": 6633} {"train_loss": -27.272619247436523, "global_step": 550559, "epoch": 6633} {"train_loss": -27.47686195373535, "global_step": 550560, "epoch": 6633} {"train_loss": -27.234272003173828, "global_step": 550561, "epoch": 6633} {"train_loss": -27.456953048706055, "global_step": 550562, "epoch": 6633} {"train_loss": -27.632282257080078, "global_step": 550563, "epoch": 6633} {"train_loss": -27.96500587463379, "global_step": 550564, "epoch": 6633} {"train_loss": -27.793766021728516, "global_step": 550565, "epoch": 6633} {"train_loss": -27.734643936157227, "global_step": 550566, "epoch": 6633} {"train_loss": -27.37018394470215, "global_step": 550567, "epoch": 6633} {"train_loss": -27.666858673095703, "global_step": 550568, "epoch": 6633} {"train_loss": -27.74077796936035, "global_step": 550569, "epoch": 6633} {"train_loss": -28.244232177734375, "global_step": 550570, "epoch": 6633} {"train_loss": -27.564157485961914, "global_step": 550571, "epoch": 6633} {"train_loss": -27.823286056518555, "global_step": 550572, "epoch": 6633} {"train_loss": -27.839628219604492, "global_step": 550573, "epoch": 6633} {"train_loss": -27.746076583862305, "global_step": 550574, "epoch": 6633} {"train_loss": -27.652463912963867, "global_step": 550575, "epoch": 6633} {"train_loss": -28.068899154663086, "global_step": 550576, "epoch": 6633} {"train_loss": -27.8970890045166, "global_step": 550577, "epoch": 6633} {"train_loss": -27.4605770111084, "global_step": 550578, "epoch": 6633} {"train_loss": -28.055286407470703, "global_step": 550579, "epoch": 6633} {"train_loss": -27.590621948242188, "global_step": 550580, "epoch": 6633} {"train_loss": -27.74025535583496, "global_step": 550581, "epoch": 6633} {"train_loss": -27.753400802612305, "global_step": 550582, "epoch": 6633} {"train_loss": -27.799728393554688, "global_step": 550583, "epoch": 6633} {"train_loss": -27.84174919128418, "global_step": 550584, "epoch": 6633} {"train_loss": -28.01865005493164, "global_step": 550585, "epoch": 6633} {"train_loss": -27.447601318359375, "global_step": 550586, "epoch": 6633} {"train_loss": -27.797449111938477, "global_step": 550587, "epoch": 6633} {"train_loss": -27.93953514099121, "global_step": 550588, "epoch": 6633} {"train_loss": -27.651708602905273, "global_step": 550589, "epoch": 6633} {"train_loss": -27.672327041625977, "global_step": 550590, "epoch": 6633} {"train_loss": -27.50750732421875, "global_step": 550591, "epoch": 6633} {"train_loss": -27.853626251220703, "global_step": 550592, "epoch": 6633} {"train_loss": -28.112585067749023, "global_step": 550593, "epoch": 6633} {"train_loss": -27.952804565429688, "global_step": 550594, "epoch": 6633} {"train_loss": -27.783309936523438, "global_step": 550595, "epoch": 6633} {"train_loss": -27.770612716674805, "global_step": 550596, "epoch": 6633} {"train_loss": -27.895843505859375, "global_step": 550597, "epoch": 6633} {"train_loss": -28.198760986328125, "global_step": 550598, "epoch": 6633} {"train_loss": -27.897552490234375, "global_step": 550599, "epoch": 6633} {"train_loss": -27.899362564086914, "global_step": 550600, "epoch": 6633} {"train_loss": -27.785913467407227, "global_step": 550601, "epoch": 6633} {"train_loss": -27.473413467407227, "global_step": 550602, "epoch": 6633} {"train_loss": -27.78512954711914, "global_step": 550603, "epoch": 6633} {"train_loss": -28.10100746154785, "global_step": 550604, "epoch": 6633} {"train_loss": -27.85694694519043, "global_step": 550605, "epoch": 6633} {"train_loss": -27.842147827148438, "global_step": 550606, "epoch": 6633} {"train_loss": -28.359516143798828, "global_step": 550607, "epoch": 6633} {"train_loss": -27.879499435424805, "global_step": 550608, "epoch": 6633} {"train_loss": -27.92603874206543, "global_step": 550609, "epoch": 6633} {"train_loss": -27.930028915405273, "global_step": 550610, "epoch": 6633} {"train_loss": -28.458545684814453, "global_step": 550611, "epoch": 6633} {"train_loss": -27.730146408081055, "global_step": 550612, "epoch": 6633} {"train_loss": -28.08201026916504, "global_step": 550613, "epoch": 6633} {"train_loss": -28.0924129486084, "global_step": 550614, "epoch": 6633} {"train_loss": -27.911069869995117, "global_step": 550615, "epoch": 6633} {"train_loss": -27.892730712890625, "global_step": 550616, "epoch": 6633} {"train_loss": -28.054838180541992, "global_step": 550617, "epoch": 6633} {"train_loss": -27.77522087097168, "global_step": 550618, "epoch": 6633} {"train_loss": -27.6715145111084, "global_step": 550619, "epoch": 6633} {"train_loss": -27.450244903564453, "global_step": 550620, "epoch": 6633} {"train_loss": -27.63891224688794, "global_step": 550621, "epoch": 6633, "val_loss": 6726983.0} {"train_loss": -24.967899322509766, "global_step": 550622, "epoch": 6634} {"train_loss": -20.768383026123047, "global_step": 550623, "epoch": 6634} {"train_loss": -25.82427978515625, "global_step": 550624, "epoch": 6634} {"train_loss": -24.157062530517578, "global_step": 550625, "epoch": 6634} {"train_loss": -24.89035987854004, "global_step": 550626, "epoch": 6634} {"train_loss": -25.62125015258789, "global_step": 550627, "epoch": 6634} {"train_loss": -25.14487075805664, "global_step": 550628, "epoch": 6634} {"train_loss": -25.56633186340332, "global_step": 550629, "epoch": 6634} {"train_loss": -26.133203506469727, "global_step": 550630, "epoch": 6634} {"train_loss": -25.365467071533203, "global_step": 550631, "epoch": 6634} {"train_loss": -26.068729400634766, "global_step": 550632, "epoch": 6634} {"train_loss": -26.6717586517334, "global_step": 550633, "epoch": 6634} {"train_loss": -26.546417236328125, "global_step": 550634, "epoch": 6634} {"train_loss": -25.914356231689453, "global_step": 550635, "epoch": 6634} {"train_loss": -26.838769912719727, "global_step": 550636, "epoch": 6634} {"train_loss": -26.36590003967285, "global_step": 550637, "epoch": 6634} {"train_loss": -26.815641403198242, "global_step": 550638, "epoch": 6634} {"train_loss": -26.666595458984375, "global_step": 550639, "epoch": 6634} {"train_loss": -26.416351318359375, "global_step": 550640, "epoch": 6634} {"train_loss": -26.603147506713867, "global_step": 550641, "epoch": 6634} {"train_loss": -26.638425827026367, "global_step": 550642, "epoch": 6634} {"train_loss": -26.66598892211914, "global_step": 550643, "epoch": 6634} {"train_loss": -26.7314395904541, "global_step": 550644, "epoch": 6634} {"train_loss": -26.8028564453125, "global_step": 550645, "epoch": 6634} {"train_loss": -26.770627975463867, "global_step": 550646, "epoch": 6634} {"train_loss": -27.048730850219727, "global_step": 550647, "epoch": 6634} {"train_loss": -27.081323623657227, "global_step": 550648, "epoch": 6634} {"train_loss": -26.98960304260254, "global_step": 550649, "epoch": 6634} {"train_loss": -27.12506675720215, "global_step": 550650, "epoch": 6634} {"train_loss": -27.455774307250977, "global_step": 550651, "epoch": 6634} {"train_loss": -27.14162254333496, "global_step": 550652, "epoch": 6634} {"train_loss": -27.287124633789062, "global_step": 550653, "epoch": 6634} {"train_loss": -27.124969482421875, "global_step": 550654, "epoch": 6634} {"train_loss": -27.420185089111328, "global_step": 550655, "epoch": 6634} {"train_loss": -27.309497833251953, "global_step": 550656, "epoch": 6634} {"train_loss": -27.109418869018555, "global_step": 550657, "epoch": 6634} {"train_loss": -27.13956642150879, "global_step": 550658, "epoch": 6634} {"train_loss": -27.280670166015625, "global_step": 550659, "epoch": 6634} {"train_loss": -27.270252227783203, "global_step": 550660, "epoch": 6634} {"train_loss": -27.67660903930664, "global_step": 550661, "epoch": 6634} {"train_loss": -27.167377471923828, "global_step": 550662, "epoch": 6634} {"train_loss": -27.227880477905273, "global_step": 550663, "epoch": 6634} {"train_loss": -27.38588523864746, "global_step": 550664, "epoch": 6634} {"train_loss": -27.201648712158203, "global_step": 550665, "epoch": 6634} {"train_loss": -27.30575942993164, "global_step": 550666, "epoch": 6634} {"train_loss": -26.9554500579834, "global_step": 550667, "epoch": 6634} {"train_loss": -27.67633628845215, "global_step": 550668, "epoch": 6634} {"train_loss": -27.613489151000977, "global_step": 550669, "epoch": 6634} {"train_loss": -27.63625144958496, "global_step": 550670, "epoch": 6634} {"train_loss": -27.739404678344727, "global_step": 550671, "epoch": 6634} {"train_loss": -27.352725982666016, "global_step": 550672, "epoch": 6634} {"train_loss": -27.77553367614746, "global_step": 550673, "epoch": 6634} {"train_loss": -27.426206588745117, "global_step": 550674, "epoch": 6634} {"train_loss": -27.61393165588379, "global_step": 550675, "epoch": 6634} {"train_loss": -27.533796310424805, "global_step": 550676, "epoch": 6634} {"train_loss": -27.699533462524414, "global_step": 550677, "epoch": 6634} {"train_loss": -27.424585342407227, "global_step": 550678, "epoch": 6634} {"train_loss": -27.604202270507812, "global_step": 550679, "epoch": 6634} {"train_loss": -27.848371505737305, "global_step": 550680, "epoch": 6634} {"train_loss": -27.50087547302246, "global_step": 550681, "epoch": 6634} {"train_loss": -27.769428253173828, "global_step": 550682, "epoch": 6634} {"train_loss": -27.463659286499023, "global_step": 550683, "epoch": 6634} {"train_loss": -27.730499267578125, "global_step": 550684, "epoch": 6634} {"train_loss": -27.524616241455078, "global_step": 550685, "epoch": 6634} {"train_loss": -27.703298568725586, "global_step": 550686, "epoch": 6634} {"train_loss": -27.730871200561523, "global_step": 550687, "epoch": 6634} {"train_loss": -27.904132843017578, "global_step": 550688, "epoch": 6634} {"train_loss": -27.95118522644043, "global_step": 550689, "epoch": 6634} {"train_loss": -28.146533966064453, "global_step": 550690, "epoch": 6634} {"train_loss": -27.984806060791016, "global_step": 550691, "epoch": 6634} {"train_loss": -28.0250186920166, "global_step": 550692, "epoch": 6634} {"train_loss": -28.0030517578125, "global_step": 550693, "epoch": 6634} {"train_loss": -27.793445587158203, "global_step": 550694, "epoch": 6634} {"train_loss": -27.60700798034668, "global_step": 550695, "epoch": 6634} {"train_loss": -27.769712448120117, "global_step": 550696, "epoch": 6634} {"train_loss": -28.101058959960938, "global_step": 550697, "epoch": 6634} {"train_loss": -27.68757438659668, "global_step": 550698, "epoch": 6634} {"train_loss": -27.616193771362305, "global_step": 550699, "epoch": 6634} {"train_loss": -28.03659439086914, "global_step": 550700, "epoch": 6634} {"train_loss": -27.615222930908203, "global_step": 550701, "epoch": 6634} {"train_loss": -27.78907585144043, "global_step": 550702, "epoch": 6634} {"train_loss": -27.902362823486328, "global_step": 550703, "epoch": 6634} {"train_loss": -27.04073749680117, "global_step": 550704, "epoch": 6634, "val_loss": 6743330.5} {"train_loss": -27.081884384155273, "global_step": 550705, "epoch": 6635} {"train_loss": -25.453649520874023, "global_step": 550706, "epoch": 6635} {"train_loss": -25.827573776245117, "global_step": 550707, "epoch": 6635} {"train_loss": -26.455047607421875, "global_step": 550708, "epoch": 6635} {"train_loss": -26.65028190612793, "global_step": 550709, "epoch": 6635} {"train_loss": -27.121076583862305, "global_step": 550710, "epoch": 6635} {"train_loss": -26.795486450195312, "global_step": 550711, "epoch": 6635} {"train_loss": -27.00750160217285, "global_step": 550712, "epoch": 6635} {"train_loss": -26.719501495361328, "global_step": 550713, "epoch": 6635} {"train_loss": -27.044849395751953, "global_step": 550714, "epoch": 6635} {"train_loss": -27.326416015625, "global_step": 550715, "epoch": 6635} {"train_loss": -26.6823673248291, "global_step": 550716, "epoch": 6635} {"train_loss": -27.458845138549805, "global_step": 550717, "epoch": 6635} {"train_loss": -27.31967544555664, "global_step": 550718, "epoch": 6635} {"train_loss": -27.030393600463867, "global_step": 550719, "epoch": 6635} {"train_loss": -26.91278076171875, "global_step": 550720, "epoch": 6635} {"train_loss": -27.042343139648438, "global_step": 550721, "epoch": 6635} {"train_loss": -27.521697998046875, "global_step": 550722, "epoch": 6635} {"train_loss": -27.472431182861328, "global_step": 550723, "epoch": 6635} {"train_loss": -27.385831832885742, "global_step": 550724, "epoch": 6635} {"train_loss": -27.559589385986328, "global_step": 550725, "epoch": 6635} {"train_loss": -27.19868278503418, "global_step": 550726, "epoch": 6635} {"train_loss": -27.581836700439453, "global_step": 550727, "epoch": 6635} {"train_loss": -27.40799331665039, "global_step": 550728, "epoch": 6635} {"train_loss": -27.304410934448242, "global_step": 550729, "epoch": 6635} {"train_loss": -27.5676326751709, "global_step": 550730, "epoch": 6635} {"train_loss": -27.373884201049805, "global_step": 550731, "epoch": 6635} {"train_loss": -27.34927749633789, "global_step": 550732, "epoch": 6635} {"train_loss": -27.69720458984375, "global_step": 550733, "epoch": 6635} {"train_loss": -27.284042358398438, "global_step": 550734, "epoch": 6635} {"train_loss": -27.260419845581055, "global_step": 550735, "epoch": 6635} {"train_loss": -27.363361358642578, "global_step": 550736, "epoch": 6635} {"train_loss": -27.620941162109375, "global_step": 550737, "epoch": 6635} {"train_loss": -27.80868911743164, "global_step": 550738, "epoch": 6635} {"train_loss": -27.850805282592773, "global_step": 550739, "epoch": 6635} {"train_loss": -27.4742431640625, "global_step": 550740, "epoch": 6635} {"train_loss": -27.824460983276367, "global_step": 550741, "epoch": 6635} {"train_loss": -27.713598251342773, "global_step": 550742, "epoch": 6635} {"train_loss": -27.97224998474121, "global_step": 550743, "epoch": 6635} {"train_loss": -27.521026611328125, "global_step": 550744, "epoch": 6635} {"train_loss": -27.6237735748291, "global_step": 550745, "epoch": 6635} {"train_loss": -27.79615592956543, "global_step": 550746, "epoch": 6635} {"train_loss": -27.61271095275879, "global_step": 550747, "epoch": 6635} {"train_loss": -27.95745849609375, "global_step": 550748, "epoch": 6635} {"train_loss": -27.707672119140625, "global_step": 550749, "epoch": 6635} {"train_loss": -28.121158599853516, "global_step": 550750, "epoch": 6635} {"train_loss": -27.987762451171875, "global_step": 550751, "epoch": 6635} {"train_loss": -28.03419303894043, "global_step": 550752, "epoch": 6635} {"train_loss": -27.923547744750977, "global_step": 550753, "epoch": 6635} {"train_loss": -27.674671173095703, "global_step": 550754, "epoch": 6635} {"train_loss": -27.79848289489746, "global_step": 550755, "epoch": 6635} {"train_loss": -28.145471572875977, "global_step": 550756, "epoch": 6635} {"train_loss": -28.092121124267578, "global_step": 550757, "epoch": 6635} {"train_loss": -27.7923526763916, "global_step": 550758, "epoch": 6635} {"train_loss": -27.6597900390625, "global_step": 550759, "epoch": 6635} {"train_loss": -27.712121963500977, "global_step": 550760, "epoch": 6635} {"train_loss": -27.986286163330078, "global_step": 550761, "epoch": 6635} {"train_loss": -27.490015029907227, "global_step": 550762, "epoch": 6635} {"train_loss": -27.430084228515625, "global_step": 550763, "epoch": 6635} {"train_loss": -27.69793701171875, "global_step": 550764, "epoch": 6635} {"train_loss": -27.480688095092773, "global_step": 550765, "epoch": 6635} {"train_loss": -27.908065795898438, "global_step": 550766, "epoch": 6635} {"train_loss": -28.013086318969727, "global_step": 550767, "epoch": 6635} {"train_loss": -27.756671905517578, "global_step": 550768, "epoch": 6635} {"train_loss": -27.73493003845215, "global_step": 550769, "epoch": 6635} {"train_loss": -27.984790802001953, "global_step": 550770, "epoch": 6635} {"train_loss": -27.705169677734375, "global_step": 550771, "epoch": 6635} {"train_loss": -27.669937133789062, "global_step": 550772, "epoch": 6635} {"train_loss": -28.173200607299805, "global_step": 550773, "epoch": 6635} {"train_loss": -28.069746017456055, "global_step": 550774, "epoch": 6635} {"train_loss": -27.661497116088867, "global_step": 550775, "epoch": 6635} {"train_loss": -27.823942184448242, "global_step": 550776, "epoch": 6635} {"train_loss": -27.93934440612793, "global_step": 550777, "epoch": 6635} {"train_loss": -27.74261474609375, "global_step": 550778, "epoch": 6635} {"train_loss": -27.649017333984375, "global_step": 550779, "epoch": 6635} {"train_loss": -27.929128646850586, "global_step": 550780, "epoch": 6635} {"train_loss": -27.9877986907959, "global_step": 550781, "epoch": 6635} {"train_loss": -28.126333236694336, "global_step": 550782, "epoch": 6635} {"train_loss": -27.762601852416992, "global_step": 550783, "epoch": 6635} {"train_loss": -27.687536239624023, "global_step": 550784, "epoch": 6635} {"train_loss": -27.704986572265625, "global_step": 550785, "epoch": 6635} {"train_loss": -27.65510368347168, "global_step": 550786, "epoch": 6635} {"train_loss": -27.53024071383189, "global_step": 550787, "epoch": 6635, "val_loss": 6673614.0} {"train_loss": -26.952661514282227, "global_step": 550788, "epoch": 6636} {"train_loss": -27.299365997314453, "global_step": 550789, "epoch": 6636} {"train_loss": -26.96439552307129, "global_step": 550790, "epoch": 6636} {"train_loss": -26.95379066467285, "global_step": 550791, "epoch": 6636} {"train_loss": -26.885467529296875, "global_step": 550792, "epoch": 6636} {"train_loss": -26.60589599609375, "global_step": 550793, "epoch": 6636} {"train_loss": -26.156949996948242, "global_step": 550794, "epoch": 6636} {"train_loss": -26.965497970581055, "global_step": 550795, "epoch": 6636} {"train_loss": -26.814132690429688, "global_step": 550796, "epoch": 6636} {"train_loss": -26.42978858947754, "global_step": 550797, "epoch": 6636} {"train_loss": -27.177804946899414, "global_step": 550798, "epoch": 6636} {"train_loss": -26.806188583374023, "global_step": 550799, "epoch": 6636} {"train_loss": -27.063650131225586, "global_step": 550800, "epoch": 6636} {"train_loss": -26.438220977783203, "global_step": 550801, "epoch": 6636} {"train_loss": -26.769216537475586, "global_step": 550802, "epoch": 6636} {"train_loss": -27.18423843383789, "global_step": 550803, "epoch": 6636} {"train_loss": -26.8533935546875, "global_step": 550804, "epoch": 6636} {"train_loss": -27.049713134765625, "global_step": 550805, "epoch": 6636} {"train_loss": -27.021108627319336, "global_step": 550806, "epoch": 6636} {"train_loss": -27.259571075439453, "global_step": 550807, "epoch": 6636} {"train_loss": -27.37598991394043, "global_step": 550808, "epoch": 6636} {"train_loss": -26.975061416625977, "global_step": 550809, "epoch": 6636} {"train_loss": -27.0393009185791, "global_step": 550810, "epoch": 6636} {"train_loss": -27.55706787109375, "global_step": 550811, "epoch": 6636} {"train_loss": -27.55499839782715, "global_step": 550812, "epoch": 6636} {"train_loss": -27.233417510986328, "global_step": 550813, "epoch": 6636} {"train_loss": -27.172964096069336, "global_step": 550814, "epoch": 6636} {"train_loss": -27.6648006439209, "global_step": 550815, "epoch": 6636} {"train_loss": -27.078723907470703, "global_step": 550816, "epoch": 6636} {"train_loss": -27.62007713317871, "global_step": 550817, "epoch": 6636} {"train_loss": -27.67840576171875, "global_step": 550818, "epoch": 6636} {"train_loss": -27.569555282592773, "global_step": 550819, "epoch": 6636} {"train_loss": -27.654600143432617, "global_step": 550820, "epoch": 6636} {"train_loss": -27.22772789001465, "global_step": 550821, "epoch": 6636} {"train_loss": -27.50617027282715, "global_step": 550822, "epoch": 6636} {"train_loss": -27.201797485351562, "global_step": 550823, "epoch": 6636} {"train_loss": -27.85248374938965, "global_step": 550824, "epoch": 6636} {"train_loss": -27.895780563354492, "global_step": 550825, "epoch": 6636} {"train_loss": -27.430423736572266, "global_step": 550826, "epoch": 6636} {"train_loss": -27.835004806518555, "global_step": 550827, "epoch": 6636} {"train_loss": -27.736005783081055, "global_step": 550828, "epoch": 6636} {"train_loss": -27.485767364501953, "global_step": 550829, "epoch": 6636} {"train_loss": -27.601612091064453, "global_step": 550830, "epoch": 6636} {"train_loss": -27.888593673706055, "global_step": 550831, "epoch": 6636} {"train_loss": -27.77398109436035, "global_step": 550832, "epoch": 6636} {"train_loss": -28.060129165649414, "global_step": 550833, "epoch": 6636} {"train_loss": -27.8204288482666, "global_step": 550834, "epoch": 6636} {"train_loss": -27.666833877563477, "global_step": 550835, "epoch": 6636} {"train_loss": -28.08257484436035, "global_step": 550836, "epoch": 6636} {"train_loss": -27.325439453125, "global_step": 550837, "epoch": 6636} {"train_loss": -27.793058395385742, "global_step": 550838, "epoch": 6636} {"train_loss": -27.525381088256836, "global_step": 550839, "epoch": 6636} {"train_loss": -28.018640518188477, "global_step": 550840, "epoch": 6636} {"train_loss": -27.57260513305664, "global_step": 550841, "epoch": 6636} {"train_loss": -27.71894645690918, "global_step": 550842, "epoch": 6636} {"train_loss": -28.014062881469727, "global_step": 550843, "epoch": 6636} {"train_loss": -28.354248046875, "global_step": 550844, "epoch": 6636} {"train_loss": -28.041950225830078, "global_step": 550845, "epoch": 6636} {"train_loss": -27.972883224487305, "global_step": 550846, "epoch": 6636} {"train_loss": -27.807708740234375, "global_step": 550847, "epoch": 6636} {"train_loss": -27.5223331451416, "global_step": 550848, "epoch": 6636} {"train_loss": -27.95270347595215, "global_step": 550849, "epoch": 6636} {"train_loss": -27.8952579498291, "global_step": 550850, "epoch": 6636} {"train_loss": -27.690271377563477, "global_step": 550851, "epoch": 6636} {"train_loss": -27.780780792236328, "global_step": 550852, "epoch": 6636} {"train_loss": -27.704980850219727, "global_step": 550853, "epoch": 6636} {"train_loss": -27.832672119140625, "global_step": 550854, "epoch": 6636} {"train_loss": -28.138086318969727, "global_step": 550855, "epoch": 6636} {"train_loss": -27.733489990234375, "global_step": 550856, "epoch": 6636} {"train_loss": -27.54072380065918, "global_step": 550857, "epoch": 6636} {"train_loss": -27.947574615478516, "global_step": 550858, "epoch": 6636} {"train_loss": -27.792882919311523, "global_step": 550859, "epoch": 6636} {"train_loss": -28.008642196655273, "global_step": 550860, "epoch": 6636} {"train_loss": -27.619409561157227, "global_step": 550861, "epoch": 6636} {"train_loss": -28.1273193359375, "global_step": 550862, "epoch": 6636} {"train_loss": -27.922779083251953, "global_step": 550863, "epoch": 6636} {"train_loss": -27.7423038482666, "global_step": 550864, "epoch": 6636} {"train_loss": -28.079877853393555, "global_step": 550865, "epoch": 6636} {"train_loss": -27.882617950439453, "global_step": 550866, "epoch": 6636} {"train_loss": -27.799108505249023, "global_step": 550867, "epoch": 6636} {"train_loss": -27.808197021484375, "global_step": 550868, "epoch": 6636} {"train_loss": -27.931081771850586, "global_step": 550869, "epoch": 6636} {"train_loss": -27.50523666014154, "global_step": 550870, "epoch": 6636, "val_loss": 6575692.5} {"train_loss": -27.545454025268555, "global_step": 550871, "epoch": 6637} {"train_loss": -26.850915908813477, "global_step": 550872, "epoch": 6637} {"train_loss": -26.48297119140625, "global_step": 550873, "epoch": 6637} {"train_loss": -26.695459365844727, "global_step": 550874, "epoch": 6637} {"train_loss": -26.4349365234375, "global_step": 550875, "epoch": 6637} {"train_loss": -27.875625610351562, "global_step": 550876, "epoch": 6637} {"train_loss": -27.475595474243164, "global_step": 550877, "epoch": 6637} {"train_loss": -26.728595733642578, "global_step": 550878, "epoch": 6637} {"train_loss": -27.011310577392578, "global_step": 550879, "epoch": 6637} {"train_loss": -27.34096336364746, "global_step": 550880, "epoch": 6637} {"train_loss": -27.239349365234375, "global_step": 550881, "epoch": 6637} {"train_loss": -27.190900802612305, "global_step": 550882, "epoch": 6637} {"train_loss": -27.644433975219727, "global_step": 550883, "epoch": 6637} {"train_loss": -27.569778442382812, "global_step": 550884, "epoch": 6637} {"train_loss": -27.519506454467773, "global_step": 550885, "epoch": 6637} {"train_loss": -27.487897872924805, "global_step": 550886, "epoch": 6637} {"train_loss": -27.72120475769043, "global_step": 550887, "epoch": 6637} {"train_loss": -27.733856201171875, "global_step": 550888, "epoch": 6637} {"train_loss": -27.543048858642578, "global_step": 550889, "epoch": 6637} {"train_loss": -27.497907638549805, "global_step": 550890, "epoch": 6637} {"train_loss": -27.9731388092041, "global_step": 550891, "epoch": 6637} {"train_loss": -27.500280380249023, "global_step": 550892, "epoch": 6637} {"train_loss": -27.573883056640625, "global_step": 550893, "epoch": 6637} {"train_loss": -27.6210994720459, "global_step": 550894, "epoch": 6637} {"train_loss": -27.551361083984375, "global_step": 550895, "epoch": 6637} {"train_loss": -27.54840660095215, "global_step": 550896, "epoch": 6637} {"train_loss": -27.5836238861084, "global_step": 550897, "epoch": 6637} {"train_loss": -27.52499771118164, "global_step": 550898, "epoch": 6637} {"train_loss": -27.667341232299805, "global_step": 550899, "epoch": 6637} {"train_loss": -27.713638305664062, "global_step": 550900, "epoch": 6637} {"train_loss": -27.65439796447754, "global_step": 550901, "epoch": 6637} {"train_loss": -27.828413009643555, "global_step": 550902, "epoch": 6637} {"train_loss": -27.88423728942871, "global_step": 550903, "epoch": 6637} {"train_loss": -27.808813095092773, "global_step": 550904, "epoch": 6637} {"train_loss": -27.624439239501953, "global_step": 550905, "epoch": 6637} {"train_loss": -27.743200302124023, "global_step": 550906, "epoch": 6637} {"train_loss": -27.72012710571289, "global_step": 550907, "epoch": 6637} {"train_loss": -27.929401397705078, "global_step": 550908, "epoch": 6637} {"train_loss": -27.862836837768555, "global_step": 550909, "epoch": 6637} {"train_loss": -27.905012130737305, "global_step": 550910, "epoch": 6637} {"train_loss": -27.807565689086914, "global_step": 550911, "epoch": 6637} {"train_loss": -27.973052978515625, "global_step": 550912, "epoch": 6637} {"train_loss": -27.86785316467285, "global_step": 550913, "epoch": 6637} {"train_loss": -27.488500595092773, "global_step": 550914, "epoch": 6637} {"train_loss": -27.892541885375977, "global_step": 550915, "epoch": 6637} {"train_loss": -27.870702743530273, "global_step": 550916, "epoch": 6637} {"train_loss": -28.145681381225586, "global_step": 550917, "epoch": 6637} {"train_loss": -27.980093002319336, "global_step": 550918, "epoch": 6637} {"train_loss": -27.749221801757812, "global_step": 550919, "epoch": 6637} {"train_loss": -27.850080490112305, "global_step": 550920, "epoch": 6637} {"train_loss": -27.611591339111328, "global_step": 550921, "epoch": 6637} {"train_loss": -26.961536407470703, "global_step": 550922, "epoch": 6637} {"train_loss": -26.5224552154541, "global_step": 550923, "epoch": 6637} {"train_loss": -26.608795166015625, "global_step": 550924, "epoch": 6637} {"train_loss": -27.30463218688965, "global_step": 550925, "epoch": 6637} {"train_loss": -27.44720458984375, "global_step": 550926, "epoch": 6637} {"train_loss": -27.43377685546875, "global_step": 550927, "epoch": 6637} {"train_loss": -27.45839500427246, "global_step": 550928, "epoch": 6637} {"train_loss": -27.581567764282227, "global_step": 550929, "epoch": 6637} {"train_loss": -27.61182975769043, "global_step": 550930, "epoch": 6637} {"train_loss": -27.842416763305664, "global_step": 550931, "epoch": 6637} {"train_loss": -27.662378311157227, "global_step": 550932, "epoch": 6637} {"train_loss": -27.47053337097168, "global_step": 550933, "epoch": 6637} {"train_loss": -27.925506591796875, "global_step": 550934, "epoch": 6637} {"train_loss": -27.357282638549805, "global_step": 550935, "epoch": 6637} {"train_loss": -27.266834259033203, "global_step": 550936, "epoch": 6637} {"train_loss": -27.30459976196289, "global_step": 550937, "epoch": 6637} {"train_loss": -27.661712646484375, "global_step": 550938, "epoch": 6637} {"train_loss": -27.642316818237305, "global_step": 550939, "epoch": 6637} {"train_loss": -27.6075382232666, "global_step": 550940, "epoch": 6637} {"train_loss": -28.175689697265625, "global_step": 550941, "epoch": 6637} {"train_loss": -27.62269401550293, "global_step": 550942, "epoch": 6637} {"train_loss": -27.889036178588867, "global_step": 550943, "epoch": 6637} {"train_loss": -27.346439361572266, "global_step": 550944, "epoch": 6637} {"train_loss": -27.943851470947266, "global_step": 550945, "epoch": 6637} {"train_loss": -27.55398941040039, "global_step": 550946, "epoch": 6637} {"train_loss": -27.732086181640625, "global_step": 550947, "epoch": 6637} {"train_loss": -27.773710250854492, "global_step": 550948, "epoch": 6637} {"train_loss": -27.527685165405273, "global_step": 550949, "epoch": 6637} {"train_loss": -27.593154907226562, "global_step": 550950, "epoch": 6637} {"train_loss": -27.506078720092773, "global_step": 550951, "epoch": 6637} {"train_loss": -28.148712158203125, "global_step": 550952, "epoch": 6637} {"train_loss": -27.533604265695594, "global_step": 550953, "epoch": 6637, "val_loss": 6538030.0} {"train_loss": -26.786298751831055, "global_step": 550954, "epoch": 6638} {"train_loss": -27.363590240478516, "global_step": 550955, "epoch": 6638} {"train_loss": -27.243635177612305, "global_step": 550956, "epoch": 6638} {"train_loss": -26.6800594329834, "global_step": 550957, "epoch": 6638} {"train_loss": -26.81278419494629, "global_step": 550958, "epoch": 6638} {"train_loss": -27.459735870361328, "global_step": 550959, "epoch": 6638} {"train_loss": -27.185611724853516, "global_step": 550960, "epoch": 6638} {"train_loss": -26.705718994140625, "global_step": 550961, "epoch": 6638} {"train_loss": -27.693531036376953, "global_step": 550962, "epoch": 6638} {"train_loss": -27.401899337768555, "global_step": 550963, "epoch": 6638} {"train_loss": -27.539661407470703, "global_step": 550964, "epoch": 6638} {"train_loss": -27.262826919555664, "global_step": 550965, "epoch": 6638} {"train_loss": -27.288503646850586, "global_step": 550966, "epoch": 6638} {"train_loss": -27.244781494140625, "global_step": 550967, "epoch": 6638} {"train_loss": -27.697021484375, "global_step": 550968, "epoch": 6638} {"train_loss": -27.29608726501465, "global_step": 550969, "epoch": 6638} {"train_loss": -27.670934677124023, "global_step": 550970, "epoch": 6638} {"train_loss": -27.842267990112305, "global_step": 550971, "epoch": 6638} {"train_loss": -27.334308624267578, "global_step": 550972, "epoch": 6638} {"train_loss": -27.94382095336914, "global_step": 550973, "epoch": 6638} {"train_loss": -27.295379638671875, "global_step": 550974, "epoch": 6638} {"train_loss": -27.609037399291992, "global_step": 550975, "epoch": 6638} {"train_loss": -27.716806411743164, "global_step": 550976, "epoch": 6638} {"train_loss": -27.610193252563477, "global_step": 550977, "epoch": 6638} {"train_loss": -27.895475387573242, "global_step": 550978, "epoch": 6638} {"train_loss": -27.685626983642578, "global_step": 550979, "epoch": 6638} {"train_loss": -27.78302001953125, "global_step": 550980, "epoch": 6638} {"train_loss": -27.46149253845215, "global_step": 550981, "epoch": 6638} {"train_loss": -27.94965171813965, "global_step": 550982, "epoch": 6638} {"train_loss": -27.70696449279785, "global_step": 550983, "epoch": 6638} {"train_loss": -27.5134220123291, "global_step": 550984, "epoch": 6638} {"train_loss": -27.52716636657715, "global_step": 550985, "epoch": 6638} {"train_loss": -27.540943145751953, "global_step": 550986, "epoch": 6638} {"train_loss": -27.990087509155273, "global_step": 550987, "epoch": 6638} {"train_loss": -27.923383712768555, "global_step": 550988, "epoch": 6638} {"train_loss": -27.883747100830078, "global_step": 550989, "epoch": 6638} {"train_loss": -27.39093589782715, "global_step": 550990, "epoch": 6638} {"train_loss": -27.755529403686523, "global_step": 550991, "epoch": 6638} {"train_loss": -27.773977279663086, "global_step": 550992, "epoch": 6638} {"train_loss": -27.697351455688477, "global_step": 550993, "epoch": 6638} {"train_loss": -27.39204216003418, "global_step": 550994, "epoch": 6638} {"train_loss": -27.938861846923828, "global_step": 550995, "epoch": 6638} {"train_loss": -28.062580108642578, "global_step": 550996, "epoch": 6638} {"train_loss": -27.767578125, "global_step": 550997, "epoch": 6638} {"train_loss": -27.920059204101562, "global_step": 550998, "epoch": 6638} {"train_loss": -28.13886070251465, "global_step": 550999, "epoch": 6638} {"train_loss": -28.10853385925293, "global_step": 551000, "epoch": 6638} {"train_loss": -27.724756240844727, "global_step": 551001, "epoch": 6638} {"train_loss": -27.389806747436523, "global_step": 551002, "epoch": 6638} {"train_loss": -27.57758140563965, "global_step": 551003, "epoch": 6638} {"train_loss": -27.617919921875, "global_step": 551004, "epoch": 6638} {"train_loss": -27.208972930908203, "global_step": 551005, "epoch": 6638} {"train_loss": -27.121627807617188, "global_step": 551006, "epoch": 6638} {"train_loss": -27.262853622436523, "global_step": 551007, "epoch": 6638} {"train_loss": -27.83269691467285, "global_step": 551008, "epoch": 6638} {"train_loss": -27.644947052001953, "global_step": 551009, "epoch": 6638} {"train_loss": -27.56422233581543, "global_step": 551010, "epoch": 6638} {"train_loss": -27.563201904296875, "global_step": 551011, "epoch": 6638} {"train_loss": -27.708707809448242, "global_step": 551012, "epoch": 6638} {"train_loss": -27.966989517211914, "global_step": 551013, "epoch": 6638} {"train_loss": -27.247711181640625, "global_step": 551014, "epoch": 6638} {"train_loss": -27.614261627197266, "global_step": 551015, "epoch": 6638} {"train_loss": -27.91278648376465, "global_step": 551016, "epoch": 6638} {"train_loss": -27.461889266967773, "global_step": 551017, "epoch": 6638} {"train_loss": -27.5114803314209, "global_step": 551018, "epoch": 6638} {"train_loss": -27.811416625976562, "global_step": 551019, "epoch": 6638} {"train_loss": -27.544164657592773, "global_step": 551020, "epoch": 6638} {"train_loss": -27.061811447143555, "global_step": 551021, "epoch": 6638} {"train_loss": -27.317707061767578, "global_step": 551022, "epoch": 6638} {"train_loss": -27.60651206970215, "global_step": 551023, "epoch": 6638} {"train_loss": -27.902441024780273, "global_step": 551024, "epoch": 6638} {"train_loss": -27.344160079956055, "global_step": 551025, "epoch": 6638} {"train_loss": -27.923049926757812, "global_step": 551026, "epoch": 6638} {"train_loss": -27.45916175842285, "global_step": 551027, "epoch": 6638} {"train_loss": -27.544164657592773, "global_step": 551028, "epoch": 6638} {"train_loss": -27.54084587097168, "global_step": 551029, "epoch": 6638} {"train_loss": -27.791616439819336, "global_step": 551030, "epoch": 6638} {"train_loss": -27.71632957458496, "global_step": 551031, "epoch": 6638} {"train_loss": -27.537220001220703, "global_step": 551032, "epoch": 6638} {"train_loss": -28.02882194519043, "global_step": 551033, "epoch": 6638} {"train_loss": -27.52020835876465, "global_step": 551034, "epoch": 6638} {"train_loss": -27.683923721313477, "global_step": 551035, "epoch": 6638} {"train_loss": -27.56551140474986, "global_step": 551036, "epoch": 6638, "val_loss": 6480409.5} {"train_loss": -26.8704891204834, "global_step": 551037, "epoch": 6639} {"train_loss": -27.063989639282227, "global_step": 551038, "epoch": 6639} {"train_loss": -26.881000518798828, "global_step": 551039, "epoch": 6639} {"train_loss": -27.06983757019043, "global_step": 551040, "epoch": 6639} {"train_loss": -27.171045303344727, "global_step": 551041, "epoch": 6639} {"train_loss": -27.343555450439453, "global_step": 551042, "epoch": 6639} {"train_loss": -27.623361587524414, "global_step": 551043, "epoch": 6639} {"train_loss": -27.441221237182617, "global_step": 551044, "epoch": 6639} {"train_loss": -27.345178604125977, "global_step": 551045, "epoch": 6639} {"train_loss": -27.095367431640625, "global_step": 551046, "epoch": 6639} {"train_loss": -27.548730850219727, "global_step": 551047, "epoch": 6639} {"train_loss": -27.302494049072266, "global_step": 551048, "epoch": 6639} {"train_loss": -27.4483699798584, "global_step": 551049, "epoch": 6639} {"train_loss": -27.383935928344727, "global_step": 551050, "epoch": 6639} {"train_loss": -27.181318283081055, "global_step": 551051, "epoch": 6639} {"train_loss": -27.487329483032227, "global_step": 551052, "epoch": 6639} {"train_loss": -28.08277702331543, "global_step": 551053, "epoch": 6639} {"train_loss": -27.505170822143555, "global_step": 551054, "epoch": 6639} {"train_loss": -27.463964462280273, "global_step": 551055, "epoch": 6639} {"train_loss": -27.2562198638916, "global_step": 551056, "epoch": 6639} {"train_loss": -27.753986358642578, "global_step": 551057, "epoch": 6639} {"train_loss": -27.491010665893555, "global_step": 551058, "epoch": 6639} {"train_loss": -27.511112213134766, "global_step": 551059, "epoch": 6639} {"train_loss": -27.603784561157227, "global_step": 551060, "epoch": 6639} {"train_loss": -27.640338897705078, "global_step": 551061, "epoch": 6639} {"train_loss": -27.385427474975586, "global_step": 551062, "epoch": 6639} {"train_loss": -27.532611846923828, "global_step": 551063, "epoch": 6639} {"train_loss": -27.633203506469727, "global_step": 551064, "epoch": 6639} {"train_loss": -27.390430450439453, "global_step": 551065, "epoch": 6639} {"train_loss": -27.683530807495117, "global_step": 551066, "epoch": 6639} {"train_loss": -27.667938232421875, "global_step": 551067, "epoch": 6639} {"train_loss": -27.80549430847168, "global_step": 551068, "epoch": 6639} {"train_loss": -27.760589599609375, "global_step": 551069, "epoch": 6639} {"train_loss": -27.747961044311523, "global_step": 551070, "epoch": 6639} {"train_loss": -27.989765167236328, "global_step": 551071, "epoch": 6639} {"train_loss": -27.465015411376953, "global_step": 551072, "epoch": 6639} {"train_loss": -27.51555824279785, "global_step": 551073, "epoch": 6639} {"train_loss": -27.738645553588867, "global_step": 551074, "epoch": 6639} {"train_loss": -27.552839279174805, "global_step": 551075, "epoch": 6639} {"train_loss": -27.839078903198242, "global_step": 551076, "epoch": 6639} {"train_loss": -27.780960083007812, "global_step": 551077, "epoch": 6639} {"train_loss": -27.69502067565918, "global_step": 551078, "epoch": 6639} {"train_loss": -27.860864639282227, "global_step": 551079, "epoch": 6639} {"train_loss": -27.57877540588379, "global_step": 551080, "epoch": 6639} {"train_loss": -27.711029052734375, "global_step": 551081, "epoch": 6639} {"train_loss": -27.821319580078125, "global_step": 551082, "epoch": 6639} {"train_loss": -28.02015495300293, "global_step": 551083, "epoch": 6639} {"train_loss": -27.907642364501953, "global_step": 551084, "epoch": 6639} {"train_loss": -27.5056095123291, "global_step": 551085, "epoch": 6639} {"train_loss": -27.85077476501465, "global_step": 551086, "epoch": 6639} {"train_loss": -28.20830726623535, "global_step": 551087, "epoch": 6639} {"train_loss": -28.00242042541504, "global_step": 551088, "epoch": 6639} {"train_loss": -27.97565269470215, "global_step": 551089, "epoch": 6639} {"train_loss": -27.899768829345703, "global_step": 551090, "epoch": 6639} {"train_loss": -27.9074649810791, "global_step": 551091, "epoch": 6639} {"train_loss": -27.262319564819336, "global_step": 551092, "epoch": 6639} {"train_loss": -27.923898696899414, "global_step": 551093, "epoch": 6639} {"train_loss": -27.852569580078125, "global_step": 551094, "epoch": 6639} {"train_loss": -27.71278190612793, "global_step": 551095, "epoch": 6639} {"train_loss": -27.754072189331055, "global_step": 551096, "epoch": 6639} {"train_loss": -27.891515731811523, "global_step": 551097, "epoch": 6639} {"train_loss": -27.809051513671875, "global_step": 551098, "epoch": 6639} {"train_loss": -27.89405632019043, "global_step": 551099, "epoch": 6639} {"train_loss": -27.88117790222168, "global_step": 551100, "epoch": 6639} {"train_loss": -27.790679931640625, "global_step": 551101, "epoch": 6639} {"train_loss": -27.829303741455078, "global_step": 551102, "epoch": 6639} {"train_loss": -27.857421875, "global_step": 551103, "epoch": 6639} {"train_loss": -27.95347023010254, "global_step": 551104, "epoch": 6639} {"train_loss": -28.030628204345703, "global_step": 551105, "epoch": 6639} {"train_loss": -27.93116569519043, "global_step": 551106, "epoch": 6639} {"train_loss": -27.61954116821289, "global_step": 551107, "epoch": 6639} {"train_loss": -27.97088623046875, "global_step": 551108, "epoch": 6639} {"train_loss": -27.518064498901367, "global_step": 551109, "epoch": 6639} {"train_loss": -27.82915687561035, "global_step": 551110, "epoch": 6639} {"train_loss": -28.2341251373291, "global_step": 551111, "epoch": 6639} {"train_loss": -28.615589141845703, "global_step": 551112, "epoch": 6639} {"train_loss": -28.03472900390625, "global_step": 551113, "epoch": 6639} {"train_loss": -27.654356002807617, "global_step": 551114, "epoch": 6639} {"train_loss": -28.241836547851562, "global_step": 551115, "epoch": 6639} {"train_loss": -27.56464958190918, "global_step": 551116, "epoch": 6639} {"train_loss": -28.270065307617188, "global_step": 551117, "epoch": 6639} {"train_loss": -27.86149024963379, "global_step": 551118, "epoch": 6639} {"train_loss": -27.68102843502918, "global_step": 551119, "epoch": 6639, "val_loss": 6485871.0} {"train_loss": -27.579132080078125, "global_step": 551120, "epoch": 6640} {"train_loss": -27.533720016479492, "global_step": 551121, "epoch": 6640} {"train_loss": -27.428674697875977, "global_step": 551122, "epoch": 6640} {"train_loss": -27.080829620361328, "global_step": 551123, "epoch": 6640} {"train_loss": -27.117740631103516, "global_step": 551124, "epoch": 6640} {"train_loss": -27.26796531677246, "global_step": 551125, "epoch": 6640} {"train_loss": -27.238412857055664, "global_step": 551126, "epoch": 6640} {"train_loss": -27.520856857299805, "global_step": 551127, "epoch": 6640} {"train_loss": -27.8190860748291, "global_step": 551128, "epoch": 6640} {"train_loss": -27.6155948638916, "global_step": 551129, "epoch": 6640} {"train_loss": -27.800933837890625, "global_step": 551130, "epoch": 6640} {"train_loss": -27.126394271850586, "global_step": 551131, "epoch": 6640} {"train_loss": -27.88849449157715, "global_step": 551132, "epoch": 6640} {"train_loss": -27.630542755126953, "global_step": 551133, "epoch": 6640} {"train_loss": -27.55525016784668, "global_step": 551134, "epoch": 6640} {"train_loss": -27.531702041625977, "global_step": 551135, "epoch": 6640} {"train_loss": -27.476057052612305, "global_step": 551136, "epoch": 6640} {"train_loss": -27.725194931030273, "global_step": 551137, "epoch": 6640} {"train_loss": -27.455936431884766, "global_step": 551138, "epoch": 6640} {"train_loss": -27.718862533569336, "global_step": 551139, "epoch": 6640} {"train_loss": -27.87751579284668, "global_step": 551140, "epoch": 6640} {"train_loss": -27.990331649780273, "global_step": 551141, "epoch": 6640} {"train_loss": -27.466449737548828, "global_step": 551142, "epoch": 6640} {"train_loss": -28.004968643188477, "global_step": 551143, "epoch": 6640} {"train_loss": -27.47749137878418, "global_step": 551144, "epoch": 6640} {"train_loss": -27.49114418029785, "global_step": 551145, "epoch": 6640} {"train_loss": -27.911365509033203, "global_step": 551146, "epoch": 6640} {"train_loss": -27.442432403564453, "global_step": 551147, "epoch": 6640} {"train_loss": -27.687353134155273, "global_step": 551148, "epoch": 6640} {"train_loss": -27.8870849609375, "global_step": 551149, "epoch": 6640} {"train_loss": -27.862014770507812, "global_step": 551150, "epoch": 6640} {"train_loss": -27.717432022094727, "global_step": 551151, "epoch": 6640} {"train_loss": -27.924264907836914, "global_step": 551152, "epoch": 6640} {"train_loss": -27.6962947845459, "global_step": 551153, "epoch": 6640} {"train_loss": -27.80712890625, "global_step": 551154, "epoch": 6640} {"train_loss": -27.315601348876953, "global_step": 551155, "epoch": 6640} {"train_loss": -27.73060417175293, "global_step": 551156, "epoch": 6640} {"train_loss": -28.005178451538086, "global_step": 551157, "epoch": 6640} {"train_loss": -27.665149688720703, "global_step": 551158, "epoch": 6640} {"train_loss": -27.87702751159668, "global_step": 551159, "epoch": 6640} {"train_loss": -27.895009994506836, "global_step": 551160, "epoch": 6640} {"train_loss": -27.54815101623535, "global_step": 551161, "epoch": 6640} {"train_loss": -27.833600997924805, "global_step": 551162, "epoch": 6640} {"train_loss": -27.90167236328125, "global_step": 551163, "epoch": 6640} {"train_loss": -27.65595817565918, "global_step": 551164, "epoch": 6640} {"train_loss": -27.64948844909668, "global_step": 551165, "epoch": 6640} {"train_loss": -27.64797019958496, "global_step": 551166, "epoch": 6640} {"train_loss": -28.16595458984375, "global_step": 551167, "epoch": 6640} {"train_loss": -27.637731552124023, "global_step": 551168, "epoch": 6640} {"train_loss": -27.56548500061035, "global_step": 551169, "epoch": 6640} {"train_loss": -27.508909225463867, "global_step": 551170, "epoch": 6640} {"train_loss": -27.360692977905273, "global_step": 551171, "epoch": 6640} {"train_loss": -27.789106369018555, "global_step": 551172, "epoch": 6640} {"train_loss": -27.648618698120117, "global_step": 551173, "epoch": 6640} {"train_loss": -27.357587814331055, "global_step": 551174, "epoch": 6640} {"train_loss": -27.605558395385742, "global_step": 551175, "epoch": 6640} {"train_loss": -27.73615074157715, "global_step": 551176, "epoch": 6640} {"train_loss": -27.5032958984375, "global_step": 551177, "epoch": 6640} {"train_loss": -28.02570915222168, "global_step": 551178, "epoch": 6640} {"train_loss": -27.657459259033203, "global_step": 551179, "epoch": 6640} {"train_loss": -27.468969345092773, "global_step": 551180, "epoch": 6640} {"train_loss": -27.385177612304688, "global_step": 551181, "epoch": 6640} {"train_loss": -27.327341079711914, "global_step": 551182, "epoch": 6640} {"train_loss": -27.473968505859375, "global_step": 551183, "epoch": 6640} {"train_loss": -27.481672286987305, "global_step": 551184, "epoch": 6640} {"train_loss": -27.523914337158203, "global_step": 551185, "epoch": 6640} {"train_loss": -27.4737491607666, "global_step": 551186, "epoch": 6640} {"train_loss": -27.61897087097168, "global_step": 551187, "epoch": 6640} {"train_loss": -27.484704971313477, "global_step": 551188, "epoch": 6640} {"train_loss": -28.085676193237305, "global_step": 551189, "epoch": 6640} {"train_loss": -27.473066329956055, "global_step": 551190, "epoch": 6640} {"train_loss": -27.69654655456543, "global_step": 551191, "epoch": 6640} {"train_loss": -27.72675895690918, "global_step": 551192, "epoch": 6640} {"train_loss": -27.819183349609375, "global_step": 551193, "epoch": 6640} {"train_loss": -27.95045280456543, "global_step": 551194, "epoch": 6640} {"train_loss": -27.545373916625977, "global_step": 551195, "epoch": 6640} {"train_loss": -27.636627197265625, "global_step": 551196, "epoch": 6640} {"train_loss": -27.6315860748291, "global_step": 551197, "epoch": 6640} {"train_loss": -27.7574405670166, "global_step": 551198, "epoch": 6640} {"train_loss": -27.978612899780273, "global_step": 551199, "epoch": 6640} {"train_loss": -27.47113609313965, "global_step": 551200, "epoch": 6640} {"train_loss": -27.683340072631836, "global_step": 551201, "epoch": 6640} {"train_loss": -27.636795181825935, "global_step": 551202, "epoch": 6640, "val_loss": 6492652.5} {"train_loss": -27.095184326171875, "global_step": 551203, "epoch": 6641} {"train_loss": -26.612531661987305, "global_step": 551204, "epoch": 6641} {"train_loss": -27.505573272705078, "global_step": 551205, "epoch": 6641} {"train_loss": -26.943267822265625, "global_step": 551206, "epoch": 6641} {"train_loss": -27.569076538085938, "global_step": 551207, "epoch": 6641} {"train_loss": -27.48505973815918, "global_step": 551208, "epoch": 6641} {"train_loss": -27.383453369140625, "global_step": 551209, "epoch": 6641} {"train_loss": -27.563980102539062, "global_step": 551210, "epoch": 6641} {"train_loss": -26.882516860961914, "global_step": 551211, "epoch": 6641} {"train_loss": -27.371692657470703, "global_step": 551212, "epoch": 6641} {"train_loss": -27.44915771484375, "global_step": 551213, "epoch": 6641} {"train_loss": -27.093738555908203, "global_step": 551214, "epoch": 6641} {"train_loss": -27.40201759338379, "global_step": 551215, "epoch": 6641} {"train_loss": -27.28814697265625, "global_step": 551216, "epoch": 6641} {"train_loss": -27.2042179107666, "global_step": 551217, "epoch": 6641} {"train_loss": -27.662256240844727, "global_step": 551218, "epoch": 6641} {"train_loss": -27.300678253173828, "global_step": 551219, "epoch": 6641} {"train_loss": -27.237985610961914, "global_step": 551220, "epoch": 6641} {"train_loss": -27.602340698242188, "global_step": 551221, "epoch": 6641} {"train_loss": -27.655805587768555, "global_step": 551222, "epoch": 6641} {"train_loss": -27.974395751953125, "global_step": 551223, "epoch": 6641} {"train_loss": -27.48682975769043, "global_step": 551224, "epoch": 6641} {"train_loss": -27.733362197875977, "global_step": 551225, "epoch": 6641} {"train_loss": -27.73027992248535, "global_step": 551226, "epoch": 6641} {"train_loss": -27.65593910217285, "global_step": 551227, "epoch": 6641} {"train_loss": -27.711963653564453, "global_step": 551228, "epoch": 6641} {"train_loss": -28.10107421875, "global_step": 551229, "epoch": 6641} {"train_loss": -27.66851234436035, "global_step": 551230, "epoch": 6641} {"train_loss": -28.092138290405273, "global_step": 551231, "epoch": 6641} {"train_loss": -27.913074493408203, "global_step": 551232, "epoch": 6641} {"train_loss": -27.91514015197754, "global_step": 551233, "epoch": 6641} {"train_loss": -28.03925132751465, "global_step": 551234, "epoch": 6641} {"train_loss": -27.69989585876465, "global_step": 551235, "epoch": 6641} {"train_loss": -27.540740966796875, "global_step": 551236, "epoch": 6641} {"train_loss": -27.694746017456055, "global_step": 551237, "epoch": 6641} {"train_loss": -27.50477409362793, "global_step": 551238, "epoch": 6641} {"train_loss": -27.7470703125, "global_step": 551239, "epoch": 6641} {"train_loss": -27.77167320251465, "global_step": 551240, "epoch": 6641} {"train_loss": -27.638105392456055, "global_step": 551241, "epoch": 6641} {"train_loss": -28.03092384338379, "global_step": 551242, "epoch": 6641} {"train_loss": -27.718664169311523, "global_step": 551243, "epoch": 6641} {"train_loss": -27.67414665222168, "global_step": 551244, "epoch": 6641} {"train_loss": -27.6637020111084, "global_step": 551245, "epoch": 6641} {"train_loss": -27.68043327331543, "global_step": 551246, "epoch": 6641} {"train_loss": -27.455785751342773, "global_step": 551247, "epoch": 6641} {"train_loss": -27.63587760925293, "global_step": 551248, "epoch": 6641} {"train_loss": -27.92291259765625, "global_step": 551249, "epoch": 6641} {"train_loss": -27.880807876586914, "global_step": 551250, "epoch": 6641} {"train_loss": -27.911161422729492, "global_step": 551251, "epoch": 6641} {"train_loss": -27.602453231811523, "global_step": 551252, "epoch": 6641} {"train_loss": -27.52593994140625, "global_step": 551253, "epoch": 6641} {"train_loss": -27.952844619750977, "global_step": 551254, "epoch": 6641} {"train_loss": -27.746747970581055, "global_step": 551255, "epoch": 6641} {"train_loss": -27.8701114654541, "global_step": 551256, "epoch": 6641} {"train_loss": -27.55391502380371, "global_step": 551257, "epoch": 6641} {"train_loss": -27.73089027404785, "global_step": 551258, "epoch": 6641} {"train_loss": -27.846765518188477, "global_step": 551259, "epoch": 6641} {"train_loss": -27.795978546142578, "global_step": 551260, "epoch": 6641} {"train_loss": -27.741052627563477, "global_step": 551261, "epoch": 6641} {"train_loss": -27.500244140625, "global_step": 551262, "epoch": 6641} {"train_loss": -27.939472198486328, "global_step": 551263, "epoch": 6641} {"train_loss": -27.818836212158203, "global_step": 551264, "epoch": 6641} {"train_loss": -27.607135772705078, "global_step": 551265, "epoch": 6641} {"train_loss": -28.331741333007812, "global_step": 551266, "epoch": 6641} {"train_loss": -27.867544174194336, "global_step": 551267, "epoch": 6641} {"train_loss": -27.937711715698242, "global_step": 551268, "epoch": 6641} {"train_loss": -27.881521224975586, "global_step": 551269, "epoch": 6641} {"train_loss": -27.849767684936523, "global_step": 551270, "epoch": 6641} {"train_loss": -28.10323143005371, "global_step": 551271, "epoch": 6641} {"train_loss": -27.839752197265625, "global_step": 551272, "epoch": 6641} {"train_loss": -27.625635147094727, "global_step": 551273, "epoch": 6641} {"train_loss": -27.928882598876953, "global_step": 551274, "epoch": 6641} {"train_loss": -27.81618309020996, "global_step": 551275, "epoch": 6641} {"train_loss": -28.069446563720703, "global_step": 551276, "epoch": 6641} {"train_loss": -27.725305557250977, "global_step": 551277, "epoch": 6641} {"train_loss": -27.7783145904541, "global_step": 551278, "epoch": 6641} {"train_loss": -27.701929092407227, "global_step": 551279, "epoch": 6641} {"train_loss": -27.71877098083496, "global_step": 551280, "epoch": 6641} {"train_loss": -27.869522094726562, "global_step": 551281, "epoch": 6641} {"train_loss": -27.520679473876953, "global_step": 551282, "epoch": 6641} {"train_loss": -27.451440811157227, "global_step": 551283, "epoch": 6641} {"train_loss": -27.599018096923828, "global_step": 551284, "epoch": 6641} {"train_loss": -27.659883131463843, "global_step": 551285, "epoch": 6641, "val_loss": 6459825.0} {"train_loss": -26.14222526550293, "global_step": 551286, "epoch": 6642} {"train_loss": -27.240966796875, "global_step": 551287, "epoch": 6642} {"train_loss": -26.816787719726562, "global_step": 551288, "epoch": 6642} {"train_loss": -26.649206161499023, "global_step": 551289, "epoch": 6642} {"train_loss": -27.12229347229004, "global_step": 551290, "epoch": 6642} {"train_loss": -27.134000778198242, "global_step": 551291, "epoch": 6642} {"train_loss": -26.843408584594727, "global_step": 551292, "epoch": 6642} {"train_loss": -27.240198135375977, "global_step": 551293, "epoch": 6642} {"train_loss": -27.136444091796875, "global_step": 551294, "epoch": 6642} {"train_loss": -27.257465362548828, "global_step": 551295, "epoch": 6642} {"train_loss": -27.016019821166992, "global_step": 551296, "epoch": 6642} {"train_loss": -27.007429122924805, "global_step": 551297, "epoch": 6642} {"train_loss": -27.136198043823242, "global_step": 551298, "epoch": 6642} {"train_loss": -27.28104019165039, "global_step": 551299, "epoch": 6642} {"train_loss": -27.49151039123535, "global_step": 551300, "epoch": 6642} {"train_loss": -27.442724227905273, "global_step": 551301, "epoch": 6642} {"train_loss": -27.405378341674805, "global_step": 551302, "epoch": 6642} {"train_loss": -27.43951416015625, "global_step": 551303, "epoch": 6642} {"train_loss": -27.472875595092773, "global_step": 551304, "epoch": 6642} {"train_loss": -27.547101974487305, "global_step": 551305, "epoch": 6642} {"train_loss": -27.087879180908203, "global_step": 551306, "epoch": 6642} {"train_loss": -27.21234703063965, "global_step": 551307, "epoch": 6642} {"train_loss": -27.74481201171875, "global_step": 551308, "epoch": 6642} {"train_loss": -27.47918701171875, "global_step": 551309, "epoch": 6642} {"train_loss": -27.705951690673828, "global_step": 551310, "epoch": 6642} {"train_loss": -27.217330932617188, "global_step": 551311, "epoch": 6642} {"train_loss": -27.9515438079834, "global_step": 551312, "epoch": 6642} {"train_loss": -27.3387451171875, "global_step": 551313, "epoch": 6642} {"train_loss": -27.417016983032227, "global_step": 551314, "epoch": 6642} {"train_loss": -26.9293270111084, "global_step": 551315, "epoch": 6642} {"train_loss": -28.01673698425293, "global_step": 551316, "epoch": 6642} {"train_loss": -27.694631576538086, "global_step": 551317, "epoch": 6642} {"train_loss": -27.509647369384766, "global_step": 551318, "epoch": 6642} {"train_loss": -27.8740234375, "global_step": 551319, "epoch": 6642} {"train_loss": -27.749250411987305, "global_step": 551320, "epoch": 6642} {"train_loss": -27.696796417236328, "global_step": 551321, "epoch": 6642} {"train_loss": -27.548254013061523, "global_step": 551322, "epoch": 6642} {"train_loss": -27.5546932220459, "global_step": 551323, "epoch": 6642} {"train_loss": -27.853485107421875, "global_step": 551324, "epoch": 6642} {"train_loss": -27.46027946472168, "global_step": 551325, "epoch": 6642} {"train_loss": -27.835737228393555, "global_step": 551326, "epoch": 6642} {"train_loss": -27.37894630432129, "global_step": 551327, "epoch": 6642} {"train_loss": -27.506591796875, "global_step": 551328, "epoch": 6642} {"train_loss": -27.652790069580078, "global_step": 551329, "epoch": 6642} {"train_loss": -27.46784782409668, "global_step": 551330, "epoch": 6642} {"train_loss": -28.3033504486084, "global_step": 551331, "epoch": 6642} {"train_loss": -27.990686416625977, "global_step": 551332, "epoch": 6642} {"train_loss": -27.696258544921875, "global_step": 551333, "epoch": 6642} {"train_loss": -27.538442611694336, "global_step": 551334, "epoch": 6642} {"train_loss": -28.185510635375977, "global_step": 551335, "epoch": 6642} {"train_loss": -27.821186065673828, "global_step": 551336, "epoch": 6642} {"train_loss": -27.770971298217773, "global_step": 551337, "epoch": 6642} {"train_loss": -27.791217803955078, "global_step": 551338, "epoch": 6642} {"train_loss": -27.997207641601562, "global_step": 551339, "epoch": 6642} {"train_loss": -27.518640518188477, "global_step": 551340, "epoch": 6642} {"train_loss": -27.88094139099121, "global_step": 551341, "epoch": 6642} {"train_loss": -27.29438591003418, "global_step": 551342, "epoch": 6642} {"train_loss": -27.436508178710938, "global_step": 551343, "epoch": 6642} {"train_loss": -27.702112197875977, "global_step": 551344, "epoch": 6642} {"train_loss": -27.83939552307129, "global_step": 551345, "epoch": 6642} {"train_loss": -27.710718154907227, "global_step": 551346, "epoch": 6642} {"train_loss": -27.842166900634766, "global_step": 551347, "epoch": 6642} {"train_loss": -27.8865909576416, "global_step": 551348, "epoch": 6642} {"train_loss": -28.00311851501465, "global_step": 551349, "epoch": 6642} {"train_loss": -27.829010009765625, "global_step": 551350, "epoch": 6642} {"train_loss": -27.7163143157959, "global_step": 551351, "epoch": 6642} {"train_loss": -27.68052101135254, "global_step": 551352, "epoch": 6642} {"train_loss": -27.651472091674805, "global_step": 551353, "epoch": 6642} {"train_loss": -28.073566436767578, "global_step": 551354, "epoch": 6642} {"train_loss": -28.019290924072266, "global_step": 551355, "epoch": 6642} {"train_loss": -27.93238639831543, "global_step": 551356, "epoch": 6642} {"train_loss": -27.92795181274414, "global_step": 551357, "epoch": 6642} {"train_loss": -28.026065826416016, "global_step": 551358, "epoch": 6642} {"train_loss": -27.959320068359375, "global_step": 551359, "epoch": 6642} {"train_loss": -27.790424346923828, "global_step": 551360, "epoch": 6642} {"train_loss": -27.891355514526367, "global_step": 551361, "epoch": 6642} {"train_loss": -27.8416748046875, "global_step": 551362, "epoch": 6642} {"train_loss": -27.6299991607666, "global_step": 551363, "epoch": 6642} {"train_loss": -27.993505477905273, "global_step": 551364, "epoch": 6642} {"train_loss": -27.488630294799805, "global_step": 551365, "epoch": 6642} {"train_loss": -27.853397369384766, "global_step": 551366, "epoch": 6642} {"train_loss": -27.896133422851562, "global_step": 551367, "epoch": 6642} {"train_loss": -27.56095578297075, "global_step": 551368, "epoch": 6642, "val_loss": 6615313.0} {"train_loss": -26.436725616455078, "global_step": 551369, "epoch": 6643} {"train_loss": -25.7314453125, "global_step": 551370, "epoch": 6643} {"train_loss": -26.96233558654785, "global_step": 551371, "epoch": 6643} {"train_loss": -26.678787231445312, "global_step": 551372, "epoch": 6643} {"train_loss": -26.814380645751953, "global_step": 551373, "epoch": 6643} {"train_loss": -26.39728355407715, "global_step": 551374, "epoch": 6643} {"train_loss": -26.68927574157715, "global_step": 551375, "epoch": 6643} {"train_loss": -26.848587036132812, "global_step": 551376, "epoch": 6643} {"train_loss": -26.665512084960938, "global_step": 551377, "epoch": 6643} {"train_loss": -27.001026153564453, "global_step": 551378, "epoch": 6643} {"train_loss": -27.219512939453125, "global_step": 551379, "epoch": 6643} {"train_loss": -26.810382843017578, "global_step": 551380, "epoch": 6643} {"train_loss": -27.239530563354492, "global_step": 551381, "epoch": 6643} {"train_loss": -26.878387451171875, "global_step": 551382, "epoch": 6643} {"train_loss": -27.19614028930664, "global_step": 551383, "epoch": 6643} {"train_loss": -26.926809310913086, "global_step": 551384, "epoch": 6643} {"train_loss": -27.4918212890625, "global_step": 551385, "epoch": 6643} {"train_loss": -27.290525436401367, "global_step": 551386, "epoch": 6643} {"train_loss": -27.168638229370117, "global_step": 551387, "epoch": 6643} {"train_loss": -27.5584716796875, "global_step": 551388, "epoch": 6643} {"train_loss": -27.3680419921875, "global_step": 551389, "epoch": 6643} {"train_loss": -27.29493522644043, "global_step": 551390, "epoch": 6643} {"train_loss": -27.212018966674805, "global_step": 551391, "epoch": 6643} {"train_loss": -27.30769157409668, "global_step": 551392, "epoch": 6643} {"train_loss": -27.108489990234375, "global_step": 551393, "epoch": 6643} {"train_loss": -27.428693771362305, "global_step": 551394, "epoch": 6643} {"train_loss": -27.857080459594727, "global_step": 551395, "epoch": 6643} {"train_loss": -27.600879669189453, "global_step": 551396, "epoch": 6643} {"train_loss": -27.58465576171875, "global_step": 551397, "epoch": 6643} {"train_loss": -27.667444229125977, "global_step": 551398, "epoch": 6643} {"train_loss": -27.708251953125, "global_step": 551399, "epoch": 6643} {"train_loss": -27.6568546295166, "global_step": 551400, "epoch": 6643} {"train_loss": -27.6618709564209, "global_step": 551401, "epoch": 6643} {"train_loss": -27.370691299438477, "global_step": 551402, "epoch": 6643} {"train_loss": -27.779682159423828, "global_step": 551403, "epoch": 6643} {"train_loss": -27.52911376953125, "global_step": 551404, "epoch": 6643} {"train_loss": -27.865835189819336, "global_step": 551405, "epoch": 6643} {"train_loss": -27.859638214111328, "global_step": 551406, "epoch": 6643} {"train_loss": -27.73554039001465, "global_step": 551407, "epoch": 6643} {"train_loss": -27.90970230102539, "global_step": 551408, "epoch": 6643} {"train_loss": -28.212549209594727, "global_step": 551409, "epoch": 6643} {"train_loss": -27.997943878173828, "global_step": 551410, "epoch": 6643} {"train_loss": -27.840978622436523, "global_step": 551411, "epoch": 6643} {"train_loss": -27.812763214111328, "global_step": 551412, "epoch": 6643} {"train_loss": -27.976926803588867, "global_step": 551413, "epoch": 6643} {"train_loss": -28.18500328063965, "global_step": 551414, "epoch": 6643} {"train_loss": -28.02178382873535, "global_step": 551415, "epoch": 6643} {"train_loss": -28.320425033569336, "global_step": 551416, "epoch": 6643} {"train_loss": -28.277713775634766, "global_step": 551417, "epoch": 6643} {"train_loss": -28.113388061523438, "global_step": 551418, "epoch": 6643} {"train_loss": -27.864532470703125, "global_step": 551419, "epoch": 6643} {"train_loss": -27.97639274597168, "global_step": 551420, "epoch": 6643} {"train_loss": -27.69585609436035, "global_step": 551421, "epoch": 6643} {"train_loss": -27.832468032836914, "global_step": 551422, "epoch": 6643} {"train_loss": -27.970905303955078, "global_step": 551423, "epoch": 6643} {"train_loss": -28.01409912109375, "global_step": 551424, "epoch": 6643} {"train_loss": -28.133270263671875, "global_step": 551425, "epoch": 6643} {"train_loss": -28.108457565307617, "global_step": 551426, "epoch": 6643} {"train_loss": -27.746509552001953, "global_step": 551427, "epoch": 6643} {"train_loss": -27.520587921142578, "global_step": 551428, "epoch": 6643} {"train_loss": -27.81682777404785, "global_step": 551429, "epoch": 6643} {"train_loss": -27.522510528564453, "global_step": 551430, "epoch": 6643} {"train_loss": -27.708288192749023, "global_step": 551431, "epoch": 6643} {"train_loss": -27.9422550201416, "global_step": 551432, "epoch": 6643} {"train_loss": -27.431140899658203, "global_step": 551433, "epoch": 6643} {"train_loss": -27.402469635009766, "global_step": 551434, "epoch": 6643} {"train_loss": -27.342819213867188, "global_step": 551435, "epoch": 6643} {"train_loss": -27.217823028564453, "global_step": 551436, "epoch": 6643} {"train_loss": -27.291427612304688, "global_step": 551437, "epoch": 6643} {"train_loss": -27.605382919311523, "global_step": 551438, "epoch": 6643} {"train_loss": -27.896154403686523, "global_step": 551439, "epoch": 6643} {"train_loss": -27.676193237304688, "global_step": 551440, "epoch": 6643} {"train_loss": -27.533838272094727, "global_step": 551441, "epoch": 6643} {"train_loss": -27.4160213470459, "global_step": 551442, "epoch": 6643} {"train_loss": -27.643712997436523, "global_step": 551443, "epoch": 6643} {"train_loss": -27.607202529907227, "global_step": 551444, "epoch": 6643} {"train_loss": -27.694982528686523, "global_step": 551445, "epoch": 6643} {"train_loss": -27.761411666870117, "global_step": 551446, "epoch": 6643} {"train_loss": -27.85445213317871, "global_step": 551447, "epoch": 6643} {"train_loss": -27.817468643188477, "global_step": 551448, "epoch": 6643} {"train_loss": -27.9755859375, "global_step": 551449, "epoch": 6643} {"train_loss": -27.80812644958496, "global_step": 551450, "epoch": 6643} {"train_loss": -27.53689439612699, "global_step": 551451, "epoch": 6643, "val_loss": 6634426.5} {"train_loss": -26.802839279174805, "global_step": 551452, "epoch": 6644} {"train_loss": -25.39008140563965, "global_step": 551453, "epoch": 6644} {"train_loss": -25.65439224243164, "global_step": 551454, "epoch": 6644} {"train_loss": -27.573917388916016, "global_step": 551455, "epoch": 6644} {"train_loss": -25.161027908325195, "global_step": 551456, "epoch": 6644} {"train_loss": -26.751935958862305, "global_step": 551457, "epoch": 6644} {"train_loss": -27.091842651367188, "global_step": 551458, "epoch": 6644} {"train_loss": -26.76615333557129, "global_step": 551459, "epoch": 6644} {"train_loss": -26.95509147644043, "global_step": 551460, "epoch": 6644} {"train_loss": -27.340103149414062, "global_step": 551461, "epoch": 6644} {"train_loss": -26.87482261657715, "global_step": 551462, "epoch": 6644} {"train_loss": -26.991500854492188, "global_step": 551463, "epoch": 6644} {"train_loss": -27.249603271484375, "global_step": 551464, "epoch": 6644} {"train_loss": -27.279937744140625, "global_step": 551465, "epoch": 6644} {"train_loss": -27.57252311706543, "global_step": 551466, "epoch": 6644} {"train_loss": -27.043689727783203, "global_step": 551467, "epoch": 6644} {"train_loss": -27.4515380859375, "global_step": 551468, "epoch": 6644} {"train_loss": -27.034687042236328, "global_step": 551469, "epoch": 6644} {"train_loss": -27.236982345581055, "global_step": 551470, "epoch": 6644} {"train_loss": -27.75310707092285, "global_step": 551471, "epoch": 6644} {"train_loss": -27.3699951171875, "global_step": 551472, "epoch": 6644} {"train_loss": -27.473779678344727, "global_step": 551473, "epoch": 6644} {"train_loss": -27.178937911987305, "global_step": 551474, "epoch": 6644} {"train_loss": -27.388959884643555, "global_step": 551475, "epoch": 6644} {"train_loss": -27.516010284423828, "global_step": 551476, "epoch": 6644} {"train_loss": -27.528974533081055, "global_step": 551477, "epoch": 6644} {"train_loss": -27.425159454345703, "global_step": 551478, "epoch": 6644} {"train_loss": -27.37032127380371, "global_step": 551479, "epoch": 6644} {"train_loss": -27.60450553894043, "global_step": 551480, "epoch": 6644} {"train_loss": -27.721420288085938, "global_step": 551481, "epoch": 6644} {"train_loss": -27.627288818359375, "global_step": 551482, "epoch": 6644} {"train_loss": -27.2916316986084, "global_step": 551483, "epoch": 6644} {"train_loss": -27.771162033081055, "global_step": 551484, "epoch": 6644} {"train_loss": -27.74823570251465, "global_step": 551485, "epoch": 6644} {"train_loss": -27.085474014282227, "global_step": 551486, "epoch": 6644} {"train_loss": -27.970495223999023, "global_step": 551487, "epoch": 6644} {"train_loss": -27.751789093017578, "global_step": 551488, "epoch": 6644} {"train_loss": -27.753543853759766, "global_step": 551489, "epoch": 6644} {"train_loss": -27.694320678710938, "global_step": 551490, "epoch": 6644} {"train_loss": -27.827686309814453, "global_step": 551491, "epoch": 6644} {"train_loss": -27.16937255859375, "global_step": 551492, "epoch": 6644} {"train_loss": -27.6527042388916, "global_step": 551493, "epoch": 6644} {"train_loss": -27.614349365234375, "global_step": 551494, "epoch": 6644} {"train_loss": -27.93454933166504, "global_step": 551495, "epoch": 6644} {"train_loss": -27.372385025024414, "global_step": 551496, "epoch": 6644} {"train_loss": -27.601781845092773, "global_step": 551497, "epoch": 6644} {"train_loss": -27.972497940063477, "global_step": 551498, "epoch": 6644} {"train_loss": -27.841108322143555, "global_step": 551499, "epoch": 6644} {"train_loss": -27.950891494750977, "global_step": 551500, "epoch": 6644} {"train_loss": -28.008153915405273, "global_step": 551501, "epoch": 6644} {"train_loss": -27.6495418548584, "global_step": 551502, "epoch": 6644} {"train_loss": -28.228153228759766, "global_step": 551503, "epoch": 6644} {"train_loss": -27.73663330078125, "global_step": 551504, "epoch": 6644} {"train_loss": -27.984949111938477, "global_step": 551505, "epoch": 6644} {"train_loss": -28.102087020874023, "global_step": 551506, "epoch": 6644} {"train_loss": -27.902883529663086, "global_step": 551507, "epoch": 6644} {"train_loss": -27.952747344970703, "global_step": 551508, "epoch": 6644} {"train_loss": -28.014301300048828, "global_step": 551509, "epoch": 6644} {"train_loss": -28.222448348999023, "global_step": 551510, "epoch": 6644} {"train_loss": -27.81304931640625, "global_step": 551511, "epoch": 6644} {"train_loss": -28.147663116455078, "global_step": 551512, "epoch": 6644} {"train_loss": -27.864709854125977, "global_step": 551513, "epoch": 6644} {"train_loss": -27.86176109313965, "global_step": 551514, "epoch": 6644} {"train_loss": -28.293317794799805, "global_step": 551515, "epoch": 6644} {"train_loss": -27.933767318725586, "global_step": 551516, "epoch": 6644} {"train_loss": -27.9619083404541, "global_step": 551517, "epoch": 6644} {"train_loss": -28.081531524658203, "global_step": 551518, "epoch": 6644} {"train_loss": -28.082727432250977, "global_step": 551519, "epoch": 6644} {"train_loss": -28.004180908203125, "global_step": 551520, "epoch": 6644} {"train_loss": -28.126028060913086, "global_step": 551521, "epoch": 6644} {"train_loss": -27.56340980529785, "global_step": 551522, "epoch": 6644} {"train_loss": -28.13348388671875, "global_step": 551523, "epoch": 6644} {"train_loss": -28.150068283081055, "global_step": 551524, "epoch": 6644} {"train_loss": -27.552656173706055, "global_step": 551525, "epoch": 6644} {"train_loss": -27.41542625427246, "global_step": 551526, "epoch": 6644} {"train_loss": -27.48018455505371, "global_step": 551527, "epoch": 6644} {"train_loss": -28.014963150024414, "global_step": 551528, "epoch": 6644} {"train_loss": -27.713117599487305, "global_step": 551529, "epoch": 6644} {"train_loss": -27.717151641845703, "global_step": 551530, "epoch": 6644} {"train_loss": -27.766538619995117, "global_step": 551531, "epoch": 6644} {"train_loss": -27.49896240234375, "global_step": 551532, "epoch": 6644} {"train_loss": -27.989049911499023, "global_step": 551533, "epoch": 6644} {"train_loss": -27.553357135818665, "global_step": 551534, "epoch": 6644, "val_loss": 6643168.0} {"train_loss": -26.85956382751465, "global_step": 551535, "epoch": 6645} {"train_loss": -26.57301139831543, "global_step": 551536, "epoch": 6645} {"train_loss": -26.9052734375, "global_step": 551537, "epoch": 6645} {"train_loss": -26.80722427368164, "global_step": 551538, "epoch": 6645} {"train_loss": -27.112476348876953, "global_step": 551539, "epoch": 6645} {"train_loss": -26.5782527923584, "global_step": 551540, "epoch": 6645} {"train_loss": -26.707406997680664, "global_step": 551541, "epoch": 6645} {"train_loss": -27.22846031188965, "global_step": 551542, "epoch": 6645} {"train_loss": -27.073841094970703, "global_step": 551543, "epoch": 6645} {"train_loss": -27.009313583374023, "global_step": 551544, "epoch": 6645} {"train_loss": -27.465009689331055, "global_step": 551545, "epoch": 6645} {"train_loss": -26.87858009338379, "global_step": 551546, "epoch": 6645} {"train_loss": -27.781213760375977, "global_step": 551547, "epoch": 6645} {"train_loss": -27.402088165283203, "global_step": 551548, "epoch": 6645} {"train_loss": -27.581378936767578, "global_step": 551549, "epoch": 6645} {"train_loss": -27.598485946655273, "global_step": 551550, "epoch": 6645} {"train_loss": -27.398340225219727, "global_step": 551551, "epoch": 6645} {"train_loss": -27.661563873291016, "global_step": 551552, "epoch": 6645} {"train_loss": -27.45026969909668, "global_step": 551553, "epoch": 6645} {"train_loss": -27.717681884765625, "global_step": 551554, "epoch": 6645} {"train_loss": -27.377424240112305, "global_step": 551555, "epoch": 6645} {"train_loss": -27.81513023376465, "global_step": 551556, "epoch": 6645} {"train_loss": -27.287372589111328, "global_step": 551557, "epoch": 6645} {"train_loss": -27.371301651000977, "global_step": 551558, "epoch": 6645} {"train_loss": -27.556232452392578, "global_step": 551559, "epoch": 6645} {"train_loss": -27.624013900756836, "global_step": 551560, "epoch": 6645} {"train_loss": -27.482816696166992, "global_step": 551561, "epoch": 6645} {"train_loss": -27.621265411376953, "global_step": 551562, "epoch": 6645} {"train_loss": -28.02556800842285, "global_step": 551563, "epoch": 6645} {"train_loss": -27.65400505065918, "global_step": 551564, "epoch": 6645} {"train_loss": -27.67780113220215, "global_step": 551565, "epoch": 6645} {"train_loss": -27.834980010986328, "global_step": 551566, "epoch": 6645} {"train_loss": -28.013355255126953, "global_step": 551567, "epoch": 6645} {"train_loss": -27.693359375, "global_step": 551568, "epoch": 6645} {"train_loss": -27.778242111206055, "global_step": 551569, "epoch": 6645} {"train_loss": -27.757461547851562, "global_step": 551570, "epoch": 6645} {"train_loss": -27.536651611328125, "global_step": 551571, "epoch": 6645} {"train_loss": -27.776721954345703, "global_step": 551572, "epoch": 6645} {"train_loss": -27.566015243530273, "global_step": 551573, "epoch": 6645} {"train_loss": -27.6027774810791, "global_step": 551574, "epoch": 6645} {"train_loss": -27.729507446289062, "global_step": 551575, "epoch": 6645} {"train_loss": -27.750051498413086, "global_step": 551576, "epoch": 6645} {"train_loss": -27.401071548461914, "global_step": 551577, "epoch": 6645} {"train_loss": -27.675825119018555, "global_step": 551578, "epoch": 6645} {"train_loss": -27.443357467651367, "global_step": 551579, "epoch": 6645} {"train_loss": -27.460342407226562, "global_step": 551580, "epoch": 6645} {"train_loss": -27.757720947265625, "global_step": 551581, "epoch": 6645} {"train_loss": -27.916584014892578, "global_step": 551582, "epoch": 6645} {"train_loss": -27.349319458007812, "global_step": 551583, "epoch": 6645} {"train_loss": -27.328723907470703, "global_step": 551584, "epoch": 6645} {"train_loss": -27.812524795532227, "global_step": 551585, "epoch": 6645} {"train_loss": -27.77608299255371, "global_step": 551586, "epoch": 6645} {"train_loss": -27.456995010375977, "global_step": 551587, "epoch": 6645} {"train_loss": -27.40134620666504, "global_step": 551588, "epoch": 6645} {"train_loss": -27.33660888671875, "global_step": 551589, "epoch": 6645} {"train_loss": -27.203582763671875, "global_step": 551590, "epoch": 6645} {"train_loss": -27.828052520751953, "global_step": 551591, "epoch": 6645} {"train_loss": -27.858203887939453, "global_step": 551592, "epoch": 6645} {"train_loss": -27.613683700561523, "global_step": 551593, "epoch": 6645} {"train_loss": -27.8144474029541, "global_step": 551594, "epoch": 6645} {"train_loss": -27.82862663269043, "global_step": 551595, "epoch": 6645} {"train_loss": -27.670515060424805, "global_step": 551596, "epoch": 6645} {"train_loss": -27.970718383789062, "global_step": 551597, "epoch": 6645} {"train_loss": -27.701465606689453, "global_step": 551598, "epoch": 6645} {"train_loss": -27.875925064086914, "global_step": 551599, "epoch": 6645} {"train_loss": -28.2083683013916, "global_step": 551600, "epoch": 6645} {"train_loss": -27.516260147094727, "global_step": 551601, "epoch": 6645} {"train_loss": -27.91069984436035, "global_step": 551602, "epoch": 6645} {"train_loss": -27.807336807250977, "global_step": 551603, "epoch": 6645} {"train_loss": -27.627349853515625, "global_step": 551604, "epoch": 6645} {"train_loss": -27.834745407104492, "global_step": 551605, "epoch": 6645} {"train_loss": -27.65801429748535, "global_step": 551606, "epoch": 6645} {"train_loss": -27.854806900024414, "global_step": 551607, "epoch": 6645} {"train_loss": -27.772144317626953, "global_step": 551608, "epoch": 6645} {"train_loss": -27.908985137939453, "global_step": 551609, "epoch": 6645} {"train_loss": -27.826797485351562, "global_step": 551610, "epoch": 6645} {"train_loss": -27.57402992248535, "global_step": 551611, "epoch": 6645} {"train_loss": -27.4901180267334, "global_step": 551612, "epoch": 6645} {"train_loss": -27.537464141845703, "global_step": 551613, "epoch": 6645} {"train_loss": -27.8317928314209, "global_step": 551614, "epoch": 6645} {"train_loss": -27.831323623657227, "global_step": 551615, "epoch": 6645} {"train_loss": -27.58771324157715, "global_step": 551616, "epoch": 6645} {"train_loss": -27.550513233046935, "global_step": 551617, "epoch": 6645, "val_loss": 6655297.5} {"train_loss": -26.93598747253418, "global_step": 551618, "epoch": 6646} {"train_loss": -27.269882202148438, "global_step": 551619, "epoch": 6646} {"train_loss": -27.53299331665039, "global_step": 551620, "epoch": 6646} {"train_loss": -26.834253311157227, "global_step": 551621, "epoch": 6646} {"train_loss": -26.394372940063477, "global_step": 551622, "epoch": 6646} {"train_loss": -27.130552291870117, "global_step": 551623, "epoch": 6646} {"train_loss": -27.687463760375977, "global_step": 551624, "epoch": 6646} {"train_loss": -27.0523738861084, "global_step": 551625, "epoch": 6646} {"train_loss": -28.063766479492188, "global_step": 551626, "epoch": 6646} {"train_loss": -27.560638427734375, "global_step": 551627, "epoch": 6646} {"train_loss": -27.36539077758789, "global_step": 551628, "epoch": 6646} {"train_loss": -27.52734375, "global_step": 551629, "epoch": 6646} {"train_loss": -27.44587516784668, "global_step": 551630, "epoch": 6646} {"train_loss": -27.520004272460938, "global_step": 551631, "epoch": 6646} {"train_loss": -27.663251876831055, "global_step": 551632, "epoch": 6646} {"train_loss": -27.457290649414062, "global_step": 551633, "epoch": 6646} {"train_loss": -27.308378219604492, "global_step": 551634, "epoch": 6646} {"train_loss": -27.577350616455078, "global_step": 551635, "epoch": 6646} {"train_loss": -27.77263832092285, "global_step": 551636, "epoch": 6646} {"train_loss": -27.327468872070312, "global_step": 551637, "epoch": 6646} {"train_loss": -27.482955932617188, "global_step": 551638, "epoch": 6646} {"train_loss": -27.361358642578125, "global_step": 551639, "epoch": 6646} {"train_loss": -27.390884399414062, "global_step": 551640, "epoch": 6646} {"train_loss": -27.48589515686035, "global_step": 551641, "epoch": 6646} {"train_loss": -27.501562118530273, "global_step": 551642, "epoch": 6646} {"train_loss": -27.529340744018555, "global_step": 551643, "epoch": 6646} {"train_loss": -27.00617790222168, "global_step": 551644, "epoch": 6646} {"train_loss": -27.65667724609375, "global_step": 551645, "epoch": 6646} {"train_loss": -27.651905059814453, "global_step": 551646, "epoch": 6646} {"train_loss": -27.789020538330078, "global_step": 551647, "epoch": 6646} {"train_loss": -27.75787353515625, "global_step": 551648, "epoch": 6646} {"train_loss": -27.58974266052246, "global_step": 551649, "epoch": 6646} {"train_loss": -27.6190128326416, "global_step": 551650, "epoch": 6646} {"train_loss": -27.530927658081055, "global_step": 551651, "epoch": 6646} {"train_loss": -27.555774688720703, "global_step": 551652, "epoch": 6646} {"train_loss": -28.014087677001953, "global_step": 551653, "epoch": 6646} {"train_loss": -27.586669921875, "global_step": 551654, "epoch": 6646} {"train_loss": -27.450117111206055, "global_step": 551655, "epoch": 6646} {"train_loss": -27.683828353881836, "global_step": 551656, "epoch": 6646} {"train_loss": -27.974323272705078, "global_step": 551657, "epoch": 6646} {"train_loss": -27.468732833862305, "global_step": 551658, "epoch": 6646} {"train_loss": -27.772125244140625, "global_step": 551659, "epoch": 6646} {"train_loss": -27.56702995300293, "global_step": 551660, "epoch": 6646} {"train_loss": -27.523696899414062, "global_step": 551661, "epoch": 6646} {"train_loss": -27.52579689025879, "global_step": 551662, "epoch": 6646} {"train_loss": -27.330413818359375, "global_step": 551663, "epoch": 6646} {"train_loss": -27.85965347290039, "global_step": 551664, "epoch": 6646} {"train_loss": -27.586881637573242, "global_step": 551665, "epoch": 6646} {"train_loss": -27.6698055267334, "global_step": 551666, "epoch": 6646} {"train_loss": -27.72096061706543, "global_step": 551667, "epoch": 6646} {"train_loss": -27.51889419555664, "global_step": 551668, "epoch": 6646} {"train_loss": -27.867727279663086, "global_step": 551669, "epoch": 6646} {"train_loss": -28.228185653686523, "global_step": 551670, "epoch": 6646} {"train_loss": -27.71121597290039, "global_step": 551671, "epoch": 6646} {"train_loss": -27.5733642578125, "global_step": 551672, "epoch": 6646} {"train_loss": -27.991403579711914, "global_step": 551673, "epoch": 6646} {"train_loss": -27.714847564697266, "global_step": 551674, "epoch": 6646} {"train_loss": -27.606992721557617, "global_step": 551675, "epoch": 6646} {"train_loss": -27.75443458557129, "global_step": 551676, "epoch": 6646} {"train_loss": -27.81812858581543, "global_step": 551677, "epoch": 6646} {"train_loss": -27.992691040039062, "global_step": 551678, "epoch": 6646} {"train_loss": -27.577863693237305, "global_step": 551679, "epoch": 6646} {"train_loss": -27.719404220581055, "global_step": 551680, "epoch": 6646} {"train_loss": -27.83833122253418, "global_step": 551681, "epoch": 6646} {"train_loss": -27.925504684448242, "global_step": 551682, "epoch": 6646} {"train_loss": -27.76149559020996, "global_step": 551683, "epoch": 6646} {"train_loss": -27.578832626342773, "global_step": 551684, "epoch": 6646} {"train_loss": -27.946775436401367, "global_step": 551685, "epoch": 6646} {"train_loss": -28.160449981689453, "global_step": 551686, "epoch": 6646} {"train_loss": -27.577899932861328, "global_step": 551687, "epoch": 6646} {"train_loss": -27.70905876159668, "global_step": 551688, "epoch": 6646} {"train_loss": -27.80460548400879, "global_step": 551689, "epoch": 6646} {"train_loss": -27.287656784057617, "global_step": 551690, "epoch": 6646} {"train_loss": -27.839563369750977, "global_step": 551691, "epoch": 6646} {"train_loss": -27.747283935546875, "global_step": 551692, "epoch": 6646} {"train_loss": -27.646671295166016, "global_step": 551693, "epoch": 6646} {"train_loss": -27.648954391479492, "global_step": 551694, "epoch": 6646} {"train_loss": -27.996374130249023, "global_step": 551695, "epoch": 6646} {"train_loss": -28.258447647094727, "global_step": 551696, "epoch": 6646} {"train_loss": -28.022573471069336, "global_step": 551697, "epoch": 6646} {"train_loss": -27.746429443359375, "global_step": 551698, "epoch": 6646} {"train_loss": -27.499921798706055, "global_step": 551699, "epoch": 6646} {"train_loss": -27.618229762617364, "global_step": 551700, "epoch": 6646, "val_loss": 6698405.0} {"train_loss": -27.5020694732666, "global_step": 551701, "epoch": 6647} {"train_loss": -26.9702205657959, "global_step": 551702, "epoch": 6647} {"train_loss": -26.43329429626465, "global_step": 551703, "epoch": 6647} {"train_loss": -27.38154411315918, "global_step": 551704, "epoch": 6647} {"train_loss": -27.306791305541992, "global_step": 551705, "epoch": 6647} {"train_loss": -27.094654083251953, "global_step": 551706, "epoch": 6647} {"train_loss": -27.414525985717773, "global_step": 551707, "epoch": 6647} {"train_loss": -27.147602081298828, "global_step": 551708, "epoch": 6647} {"train_loss": -27.298608779907227, "global_step": 551709, "epoch": 6647} {"train_loss": -27.598127365112305, "global_step": 551710, "epoch": 6647} {"train_loss": -27.20814323425293, "global_step": 551711, "epoch": 6647} {"train_loss": -27.421615600585938, "global_step": 551712, "epoch": 6647} {"train_loss": -27.568695068359375, "global_step": 551713, "epoch": 6647} {"train_loss": -27.428573608398438, "global_step": 551714, "epoch": 6647} {"train_loss": -27.078428268432617, "global_step": 551715, "epoch": 6647} {"train_loss": -27.545730590820312, "global_step": 551716, "epoch": 6647} {"train_loss": -27.462339401245117, "global_step": 551717, "epoch": 6647} {"train_loss": -27.528783798217773, "global_step": 551718, "epoch": 6647} {"train_loss": -27.56216812133789, "global_step": 551719, "epoch": 6647} {"train_loss": -27.755451202392578, "global_step": 551720, "epoch": 6647} {"train_loss": -27.541288375854492, "global_step": 551721, "epoch": 6647} {"train_loss": -27.53165054321289, "global_step": 551722, "epoch": 6647} {"train_loss": -27.364917755126953, "global_step": 551723, "epoch": 6647} {"train_loss": -27.736719131469727, "global_step": 551724, "epoch": 6647} {"train_loss": -27.58928871154785, "global_step": 551725, "epoch": 6647} {"train_loss": -27.800275802612305, "global_step": 551726, "epoch": 6647} {"train_loss": -27.48528480529785, "global_step": 551727, "epoch": 6647} {"train_loss": -27.704437255859375, "global_step": 551728, "epoch": 6647} {"train_loss": -27.87424659729004, "global_step": 551729, "epoch": 6647} {"train_loss": -27.87590980529785, "global_step": 551730, "epoch": 6647} {"train_loss": -27.6772403717041, "global_step": 551731, "epoch": 6647} {"train_loss": -27.690570831298828, "global_step": 551732, "epoch": 6647} {"train_loss": -27.997949600219727, "global_step": 551733, "epoch": 6647} {"train_loss": -27.496479034423828, "global_step": 551734, "epoch": 6647} {"train_loss": -27.94291114807129, "global_step": 551735, "epoch": 6647} {"train_loss": -27.736661911010742, "global_step": 551736, "epoch": 6647} {"train_loss": -27.9604434967041, "global_step": 551737, "epoch": 6647} {"train_loss": -28.006494522094727, "global_step": 551738, "epoch": 6647} {"train_loss": -27.764997482299805, "global_step": 551739, "epoch": 6647} {"train_loss": -27.725439071655273, "global_step": 551740, "epoch": 6647} {"train_loss": -27.740644454956055, "global_step": 551741, "epoch": 6647} {"train_loss": -27.867202758789062, "global_step": 551742, "epoch": 6647} {"train_loss": -27.8428897857666, "global_step": 551743, "epoch": 6647} {"train_loss": -27.70277214050293, "global_step": 551744, "epoch": 6647} {"train_loss": -27.788007736206055, "global_step": 551745, "epoch": 6647} {"train_loss": -27.846649169921875, "global_step": 551746, "epoch": 6647} {"train_loss": -27.974903106689453, "global_step": 551747, "epoch": 6647} {"train_loss": -27.92142105102539, "global_step": 551748, "epoch": 6647} {"train_loss": -27.52508544921875, "global_step": 551749, "epoch": 6647} {"train_loss": -27.843250274658203, "global_step": 551750, "epoch": 6647} {"train_loss": -27.848962783813477, "global_step": 551751, "epoch": 6647} {"train_loss": -27.669662475585938, "global_step": 551752, "epoch": 6647} {"train_loss": -27.846485137939453, "global_step": 551753, "epoch": 6647} {"train_loss": -27.65058708190918, "global_step": 551754, "epoch": 6647} {"train_loss": -27.7590389251709, "global_step": 551755, "epoch": 6647} {"train_loss": -27.76247215270996, "global_step": 551756, "epoch": 6647} {"train_loss": -27.654434204101562, "global_step": 551757, "epoch": 6647} {"train_loss": -27.741979598999023, "global_step": 551758, "epoch": 6647} {"train_loss": -27.812814712524414, "global_step": 551759, "epoch": 6647} {"train_loss": -28.055707931518555, "global_step": 551760, "epoch": 6647} {"train_loss": -27.7043514251709, "global_step": 551761, "epoch": 6647} {"train_loss": -27.715988159179688, "global_step": 551762, "epoch": 6647} {"train_loss": -27.472686767578125, "global_step": 551763, "epoch": 6647} {"train_loss": -27.723251342773438, "global_step": 551764, "epoch": 6647} {"train_loss": -27.604578018188477, "global_step": 551765, "epoch": 6647} {"train_loss": -27.605417251586914, "global_step": 551766, "epoch": 6647} {"train_loss": -27.673242568969727, "global_step": 551767, "epoch": 6647} {"train_loss": -27.57624626159668, "global_step": 551768, "epoch": 6647} {"train_loss": -27.900033950805664, "global_step": 551769, "epoch": 6647} {"train_loss": -27.6589412689209, "global_step": 551770, "epoch": 6647} {"train_loss": -27.892675399780273, "global_step": 551771, "epoch": 6647} {"train_loss": -28.098682403564453, "global_step": 551772, "epoch": 6647} {"train_loss": -28.041715621948242, "global_step": 551773, "epoch": 6647} {"train_loss": -27.913679122924805, "global_step": 551774, "epoch": 6647} {"train_loss": -27.600940704345703, "global_step": 551775, "epoch": 6647} {"train_loss": -27.59999656677246, "global_step": 551776, "epoch": 6647} {"train_loss": -27.793195724487305, "global_step": 551777, "epoch": 6647} {"train_loss": -27.86542320251465, "global_step": 551778, "epoch": 6647} {"train_loss": -27.87322998046875, "global_step": 551779, "epoch": 6647} {"train_loss": -27.949569702148438, "global_step": 551780, "epoch": 6647} {"train_loss": -27.6312198638916, "global_step": 551781, "epoch": 6647} {"train_loss": -27.712629318237305, "global_step": 551782, "epoch": 6647} {"train_loss": -27.65616127381842, "global_step": 551783, "epoch": 6647, "val_loss": 6711296.0} {"train_loss": -26.744848251342773, "global_step": 551784, "epoch": 6648} {"train_loss": -27.31131362915039, "global_step": 551785, "epoch": 6648} {"train_loss": -27.300159454345703, "global_step": 551786, "epoch": 6648} {"train_loss": -27.129419326782227, "global_step": 551787, "epoch": 6648} {"train_loss": -27.127395629882812, "global_step": 551788, "epoch": 6648} {"train_loss": -27.377355575561523, "global_step": 551789, "epoch": 6648} {"train_loss": -27.080488204956055, "global_step": 551790, "epoch": 6648} {"train_loss": -27.39168357849121, "global_step": 551791, "epoch": 6648} {"train_loss": -27.366668701171875, "global_step": 551792, "epoch": 6648} {"train_loss": -27.160907745361328, "global_step": 551793, "epoch": 6648} {"train_loss": -27.414093017578125, "global_step": 551794, "epoch": 6648} {"train_loss": -27.386571884155273, "global_step": 551795, "epoch": 6648} {"train_loss": -27.505956649780273, "global_step": 551796, "epoch": 6648} {"train_loss": -27.386783599853516, "global_step": 551797, "epoch": 6648} {"train_loss": -27.413745880126953, "global_step": 551798, "epoch": 6648} {"train_loss": -27.85810661315918, "global_step": 551799, "epoch": 6648} {"train_loss": -27.597187042236328, "global_step": 551800, "epoch": 6648} {"train_loss": -27.113269805908203, "global_step": 551801, "epoch": 6648} {"train_loss": -27.873991012573242, "global_step": 551802, "epoch": 6648} {"train_loss": -27.688688278198242, "global_step": 551803, "epoch": 6648} {"train_loss": -27.70943260192871, "global_step": 551804, "epoch": 6648} {"train_loss": -27.513019561767578, "global_step": 551805, "epoch": 6648} {"train_loss": -27.537200927734375, "global_step": 551806, "epoch": 6648} {"train_loss": -27.589208602905273, "global_step": 551807, "epoch": 6648} {"train_loss": -28.056745529174805, "global_step": 551808, "epoch": 6648} {"train_loss": -27.563400268554688, "global_step": 551809, "epoch": 6648} {"train_loss": -27.76951026916504, "global_step": 551810, "epoch": 6648} {"train_loss": -27.614179611206055, "global_step": 551811, "epoch": 6648} {"train_loss": -27.588232040405273, "global_step": 551812, "epoch": 6648} {"train_loss": -27.937284469604492, "global_step": 551813, "epoch": 6648} {"train_loss": -28.069746017456055, "global_step": 551814, "epoch": 6648} {"train_loss": -27.477182388305664, "global_step": 551815, "epoch": 6648} {"train_loss": -28.078006744384766, "global_step": 551816, "epoch": 6648} {"train_loss": -27.86594009399414, "global_step": 551817, "epoch": 6648} {"train_loss": -27.7156982421875, "global_step": 551818, "epoch": 6648} {"train_loss": -27.757848739624023, "global_step": 551819, "epoch": 6648} {"train_loss": -27.99151611328125, "global_step": 551820, "epoch": 6648} {"train_loss": -27.959003448486328, "global_step": 551821, "epoch": 6648} {"train_loss": -28.07051658630371, "global_step": 551822, "epoch": 6648} {"train_loss": -27.86496925354004, "global_step": 551823, "epoch": 6648} {"train_loss": -27.85849380493164, "global_step": 551824, "epoch": 6648} {"train_loss": -27.599882125854492, "global_step": 551825, "epoch": 6648} {"train_loss": -27.699560165405273, "global_step": 551826, "epoch": 6648} {"train_loss": -27.942520141601562, "global_step": 551827, "epoch": 6648} {"train_loss": -28.213232040405273, "global_step": 551828, "epoch": 6648} {"train_loss": -28.022192001342773, "global_step": 551829, "epoch": 6648} {"train_loss": -28.135534286499023, "global_step": 551830, "epoch": 6648} {"train_loss": -27.601581573486328, "global_step": 551831, "epoch": 6648} {"train_loss": -27.90777015686035, "global_step": 551832, "epoch": 6648} {"train_loss": -28.030622482299805, "global_step": 551833, "epoch": 6648} {"train_loss": -27.789962768554688, "global_step": 551834, "epoch": 6648} {"train_loss": -27.838775634765625, "global_step": 551835, "epoch": 6648} {"train_loss": -28.0731201171875, "global_step": 551836, "epoch": 6648} {"train_loss": -27.7486629486084, "global_step": 551837, "epoch": 6648} {"train_loss": -27.787954330444336, "global_step": 551838, "epoch": 6648} {"train_loss": -27.231496810913086, "global_step": 551839, "epoch": 6648} {"train_loss": -27.87177848815918, "global_step": 551840, "epoch": 6648} {"train_loss": -27.894977569580078, "global_step": 551841, "epoch": 6648} {"train_loss": -27.528478622436523, "global_step": 551842, "epoch": 6648} {"train_loss": -27.805206298828125, "global_step": 551843, "epoch": 6648} {"train_loss": -27.40633201599121, "global_step": 551844, "epoch": 6648} {"train_loss": -27.713788986206055, "global_step": 551845, "epoch": 6648} {"train_loss": -27.51218605041504, "global_step": 551846, "epoch": 6648} {"train_loss": -27.624866485595703, "global_step": 551847, "epoch": 6648} {"train_loss": -27.740753173828125, "global_step": 551848, "epoch": 6648} {"train_loss": -27.809667587280273, "global_step": 551849, "epoch": 6648} {"train_loss": -27.897541046142578, "global_step": 551850, "epoch": 6648} {"train_loss": -27.596160888671875, "global_step": 551851, "epoch": 6648} {"train_loss": -27.490957260131836, "global_step": 551852, "epoch": 6648} {"train_loss": -27.556781768798828, "global_step": 551853, "epoch": 6648} {"train_loss": -27.6656436920166, "global_step": 551854, "epoch": 6648} {"train_loss": -27.23187255859375, "global_step": 551855, "epoch": 6648} {"train_loss": -27.256921768188477, "global_step": 551856, "epoch": 6648} {"train_loss": -27.227249145507812, "global_step": 551857, "epoch": 6648} {"train_loss": -26.73830223083496, "global_step": 551858, "epoch": 6648} {"train_loss": -26.473554611206055, "global_step": 551859, "epoch": 6648} {"train_loss": -27.41669273376465, "global_step": 551860, "epoch": 6648} {"train_loss": -27.6152286529541, "global_step": 551861, "epoch": 6648} {"train_loss": -27.68108558654785, "global_step": 551862, "epoch": 6648} {"train_loss": -27.529067993164062, "global_step": 551863, "epoch": 6648} {"train_loss": -27.60003089904785, "global_step": 551864, "epoch": 6648} {"train_loss": -27.304540634155273, "global_step": 551865, "epoch": 6648} {"train_loss": -27.60420128236334, "global_step": 551866, "epoch": 6648, "val_loss": 6764137.0} {"train_loss": -27.371374130249023, "global_step": 551867, "epoch": 6649} {"train_loss": -26.117416381835938, "global_step": 551868, "epoch": 6649} {"train_loss": -26.887365341186523, "global_step": 551869, "epoch": 6649} {"train_loss": -27.193273544311523, "global_step": 551870, "epoch": 6649} {"train_loss": -26.80274772644043, "global_step": 551871, "epoch": 6649} {"train_loss": -26.858861923217773, "global_step": 551872, "epoch": 6649} {"train_loss": -26.601043701171875, "global_step": 551873, "epoch": 6649} {"train_loss": -26.649564743041992, "global_step": 551874, "epoch": 6649} {"train_loss": -27.012678146362305, "global_step": 551875, "epoch": 6649} {"train_loss": -27.322046279907227, "global_step": 551876, "epoch": 6649} {"train_loss": -27.152149200439453, "global_step": 551877, "epoch": 6649} {"train_loss": -27.51712417602539, "global_step": 551878, "epoch": 6649} {"train_loss": -26.972803115844727, "global_step": 551879, "epoch": 6649} {"train_loss": -27.521575927734375, "global_step": 551880, "epoch": 6649} {"train_loss": -27.14335060119629, "global_step": 551881, "epoch": 6649} {"train_loss": -27.333789825439453, "global_step": 551882, "epoch": 6649} {"train_loss": -27.309356689453125, "global_step": 551883, "epoch": 6649} {"train_loss": -27.376468658447266, "global_step": 551884, "epoch": 6649} {"train_loss": -27.28266716003418, "global_step": 551885, "epoch": 6649} {"train_loss": -27.417835235595703, "global_step": 551886, "epoch": 6649} {"train_loss": -27.55811882019043, "global_step": 551887, "epoch": 6649} {"train_loss": -27.05384635925293, "global_step": 551888, "epoch": 6649} {"train_loss": -27.462696075439453, "global_step": 551889, "epoch": 6649} {"train_loss": -27.5273380279541, "global_step": 551890, "epoch": 6649} {"train_loss": -27.835769653320312, "global_step": 551891, "epoch": 6649} {"train_loss": -27.433380126953125, "global_step": 551892, "epoch": 6649} {"train_loss": -27.332935333251953, "global_step": 551893, "epoch": 6649} {"train_loss": -27.9377384185791, "global_step": 551894, "epoch": 6649} {"train_loss": -27.637903213500977, "global_step": 551895, "epoch": 6649} {"train_loss": -27.81715202331543, "global_step": 551896, "epoch": 6649} {"train_loss": -27.487918853759766, "global_step": 551897, "epoch": 6649} {"train_loss": -27.91879653930664, "global_step": 551898, "epoch": 6649} {"train_loss": -27.9700927734375, "global_step": 551899, "epoch": 6649} {"train_loss": -27.86785888671875, "global_step": 551900, "epoch": 6649} {"train_loss": -27.78200340270996, "global_step": 551901, "epoch": 6649} {"train_loss": -27.82867431640625, "global_step": 551902, "epoch": 6649} {"train_loss": -27.831378936767578, "global_step": 551903, "epoch": 6649} {"train_loss": -27.938695907592773, "global_step": 551904, "epoch": 6649} {"train_loss": -28.050317764282227, "global_step": 551905, "epoch": 6649} {"train_loss": -27.7131404876709, "global_step": 551906, "epoch": 6649} {"train_loss": -27.552831649780273, "global_step": 551907, "epoch": 6649} {"train_loss": -28.114871978759766, "global_step": 551908, "epoch": 6649} {"train_loss": -28.051074981689453, "global_step": 551909, "epoch": 6649} {"train_loss": -27.9235897064209, "global_step": 551910, "epoch": 6649} {"train_loss": -27.84392738342285, "global_step": 551911, "epoch": 6649} {"train_loss": -27.9396915435791, "global_step": 551912, "epoch": 6649} {"train_loss": -27.565601348876953, "global_step": 551913, "epoch": 6649} {"train_loss": -28.17244529724121, "global_step": 551914, "epoch": 6649} {"train_loss": -27.733091354370117, "global_step": 551915, "epoch": 6649} {"train_loss": -27.871429443359375, "global_step": 551916, "epoch": 6649} {"train_loss": -27.885900497436523, "global_step": 551917, "epoch": 6649} {"train_loss": -27.734771728515625, "global_step": 551918, "epoch": 6649} {"train_loss": -27.888870239257812, "global_step": 551919, "epoch": 6649} {"train_loss": -27.761661529541016, "global_step": 551920, "epoch": 6649} {"train_loss": -27.83795738220215, "global_step": 551921, "epoch": 6649} {"train_loss": -28.06476402282715, "global_step": 551922, "epoch": 6649} {"train_loss": -27.628015518188477, "global_step": 551923, "epoch": 6649} {"train_loss": -28.121356964111328, "global_step": 551924, "epoch": 6649} {"train_loss": -27.68793296813965, "global_step": 551925, "epoch": 6649} {"train_loss": -27.798749923706055, "global_step": 551926, "epoch": 6649} {"train_loss": -28.047321319580078, "global_step": 551927, "epoch": 6649} {"train_loss": -27.816802978515625, "global_step": 551928, "epoch": 6649} {"train_loss": -28.009363174438477, "global_step": 551929, "epoch": 6649} {"train_loss": -27.390701293945312, "global_step": 551930, "epoch": 6649} {"train_loss": -27.9450740814209, "global_step": 551931, "epoch": 6649} {"train_loss": -27.792280197143555, "global_step": 551932, "epoch": 6649} {"train_loss": -27.40742301940918, "global_step": 551933, "epoch": 6649} {"train_loss": -28.02524757385254, "global_step": 551934, "epoch": 6649} {"train_loss": -28.124853134155273, "global_step": 551935, "epoch": 6649} {"train_loss": -27.95912742614746, "global_step": 551936, "epoch": 6649} {"train_loss": -27.484155654907227, "global_step": 551937, "epoch": 6649} {"train_loss": -27.2564640045166, "global_step": 551938, "epoch": 6649} {"train_loss": -27.165807723999023, "global_step": 551939, "epoch": 6649} {"train_loss": -27.221302032470703, "global_step": 551940, "epoch": 6649} {"train_loss": -27.78925895690918, "global_step": 551941, "epoch": 6649} {"train_loss": -27.385700225830078, "global_step": 551942, "epoch": 6649} {"train_loss": -27.483642578125, "global_step": 551943, "epoch": 6649} {"train_loss": -26.978137969970703, "global_step": 551944, "epoch": 6649} {"train_loss": -27.87274169921875, "global_step": 551945, "epoch": 6649} {"train_loss": -27.438825607299805, "global_step": 551946, "epoch": 6649} {"train_loss": -27.81434440612793, "global_step": 551947, "epoch": 6649} {"train_loss": -27.35041618347168, "global_step": 551948, "epoch": 6649} {"train_loss": -27.583426372114435, "global_step": 551949, "epoch": 6649, "val_loss": 6693705.0} {"train_loss": -27.071317672729492, "global_step": 551950, "epoch": 6650} {"train_loss": -27.415067672729492, "global_step": 551951, "epoch": 6650} {"train_loss": -27.41457176208496, "global_step": 551952, "epoch": 6650} {"train_loss": -26.715429306030273, "global_step": 551953, "epoch": 6650} {"train_loss": -27.282367706298828, "global_step": 551954, "epoch": 6650} {"train_loss": -27.440887451171875, "global_step": 551955, "epoch": 6650} {"train_loss": -26.890216827392578, "global_step": 551956, "epoch": 6650} {"train_loss": -27.456317901611328, "global_step": 551957, "epoch": 6650} {"train_loss": -27.082162857055664, "global_step": 551958, "epoch": 6650} {"train_loss": -27.442846298217773, "global_step": 551959, "epoch": 6650} {"train_loss": -27.25547218322754, "global_step": 551960, "epoch": 6650} {"train_loss": -27.400054931640625, "global_step": 551961, "epoch": 6650} {"train_loss": -27.39466667175293, "global_step": 551962, "epoch": 6650} {"train_loss": -27.3262996673584, "global_step": 551963, "epoch": 6650} {"train_loss": -27.618366241455078, "global_step": 551964, "epoch": 6650} {"train_loss": -27.298837661743164, "global_step": 551965, "epoch": 6650} {"train_loss": -27.502180099487305, "global_step": 551966, "epoch": 6650} {"train_loss": -27.688364028930664, "global_step": 551967, "epoch": 6650} {"train_loss": -27.965051651000977, "global_step": 551968, "epoch": 6650} {"train_loss": -27.490758895874023, "global_step": 551969, "epoch": 6650} {"train_loss": -27.224374771118164, "global_step": 551970, "epoch": 6650} {"train_loss": -27.429229736328125, "global_step": 551971, "epoch": 6650} {"train_loss": -27.54721450805664, "global_step": 551972, "epoch": 6650} {"train_loss": -27.4050350189209, "global_step": 551973, "epoch": 6650} {"train_loss": -27.426898956298828, "global_step": 551974, "epoch": 6650} {"train_loss": -27.785572052001953, "global_step": 551975, "epoch": 6650} {"train_loss": -27.9910945892334, "global_step": 551976, "epoch": 6650} {"train_loss": -27.658700942993164, "global_step": 551977, "epoch": 6650} {"train_loss": -27.307662963867188, "global_step": 551978, "epoch": 6650} {"train_loss": -27.573394775390625, "global_step": 551979, "epoch": 6650} {"train_loss": -27.490392684936523, "global_step": 551980, "epoch": 6650} {"train_loss": -27.663455963134766, "global_step": 551981, "epoch": 6650} {"train_loss": -27.3726863861084, "global_step": 551982, "epoch": 6650} {"train_loss": -27.903736114501953, "global_step": 551983, "epoch": 6650} {"train_loss": -27.750974655151367, "global_step": 551984, "epoch": 6650} {"train_loss": -27.790979385375977, "global_step": 551985, "epoch": 6650} {"train_loss": -27.707687377929688, "global_step": 551986, "epoch": 6650} {"train_loss": -27.8078556060791, "global_step": 551987, "epoch": 6650} {"train_loss": -27.96723747253418, "global_step": 551988, "epoch": 6650} {"train_loss": -27.804168701171875, "global_step": 551989, "epoch": 6650} {"train_loss": -27.87306785583496, "global_step": 551990, "epoch": 6650} {"train_loss": -27.96149253845215, "global_step": 551991, "epoch": 6650} {"train_loss": -27.64883804321289, "global_step": 551992, "epoch": 6650} {"train_loss": -27.757116317749023, "global_step": 551993, "epoch": 6650} {"train_loss": -27.774473190307617, "global_step": 551994, "epoch": 6650} {"train_loss": -27.935773849487305, "global_step": 551995, "epoch": 6650} {"train_loss": -27.971769332885742, "global_step": 551996, "epoch": 6650} {"train_loss": -27.594833374023438, "global_step": 551997, "epoch": 6650} {"train_loss": -27.784622192382812, "global_step": 551998, "epoch": 6650} {"train_loss": -27.449920654296875, "global_step": 551999, "epoch": 6650} {"train_loss": -27.9422664642334, "global_step": 552000, "epoch": 6650} {"train_loss": -27.91315269470215, "global_step": 552001, "epoch": 6650} {"train_loss": -27.587238311767578, "global_step": 552002, "epoch": 6650} {"train_loss": -27.74189567565918, "global_step": 552003, "epoch": 6650} {"train_loss": -27.77886390686035, "global_step": 552004, "epoch": 6650} {"train_loss": -27.652624130249023, "global_step": 552005, "epoch": 6650} {"train_loss": -27.950809478759766, "global_step": 552006, "epoch": 6650} {"train_loss": -27.63996696472168, "global_step": 552007, "epoch": 6650} {"train_loss": -27.716405868530273, "global_step": 552008, "epoch": 6650} {"train_loss": -27.407184600830078, "global_step": 552009, "epoch": 6650} {"train_loss": -27.71469497680664, "global_step": 552010, "epoch": 6650} {"train_loss": -27.84320068359375, "global_step": 552011, "epoch": 6650} {"train_loss": -27.557031631469727, "global_step": 552012, "epoch": 6650} {"train_loss": -27.582794189453125, "global_step": 552013, "epoch": 6650} {"train_loss": -27.789520263671875, "global_step": 552014, "epoch": 6650} {"train_loss": -27.638751983642578, "global_step": 552015, "epoch": 6650} {"train_loss": -27.727874755859375, "global_step": 552016, "epoch": 6650} {"train_loss": -27.044843673706055, "global_step": 552017, "epoch": 6650} {"train_loss": -27.24267578125, "global_step": 552018, "epoch": 6650} {"train_loss": -27.192548751831055, "global_step": 552019, "epoch": 6650} {"train_loss": -27.505298614501953, "global_step": 552020, "epoch": 6650} {"train_loss": -27.904218673706055, "global_step": 552021, "epoch": 6650} {"train_loss": -27.6370906829834, "global_step": 552022, "epoch": 6650} {"train_loss": -27.59917640686035, "global_step": 552023, "epoch": 6650} {"train_loss": -27.672433853149414, "global_step": 552024, "epoch": 6650} {"train_loss": -27.91144371032715, "global_step": 552025, "epoch": 6650} {"train_loss": -27.42822265625, "global_step": 552026, "epoch": 6650} {"train_loss": -27.643051147460938, "global_step": 552027, "epoch": 6650} {"train_loss": -27.7398624420166, "global_step": 552028, "epoch": 6650} {"train_loss": -27.574350357055664, "global_step": 552029, "epoch": 6650} {"train_loss": -27.806005477905273, "global_step": 552030, "epoch": 6650} {"train_loss": -27.774917602539062, "global_step": 552031, "epoch": 6650} {"train_loss": -27.585655120481928, "global_step": 552032, "epoch": 6650, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8181818181818182, "val_loss": 6653133.0} {"train_loss": -26.0479793548584, "global_step": 552033, "epoch": 6651} {"train_loss": -26.279279708862305, "global_step": 552034, "epoch": 6651} {"train_loss": -27.17215919494629, "global_step": 552035, "epoch": 6651} {"train_loss": -27.451251983642578, "global_step": 552036, "epoch": 6651} {"train_loss": -27.147668838500977, "global_step": 552037, "epoch": 6651} {"train_loss": -27.348743438720703, "global_step": 552038, "epoch": 6651} {"train_loss": -27.601926803588867, "global_step": 552039, "epoch": 6651} {"train_loss": -27.29920768737793, "global_step": 552040, "epoch": 6651} {"train_loss": -27.293649673461914, "global_step": 552041, "epoch": 6651} {"train_loss": -27.247547149658203, "global_step": 552042, "epoch": 6651} {"train_loss": -26.957380294799805, "global_step": 552043, "epoch": 6651} {"train_loss": -27.467472076416016, "global_step": 552044, "epoch": 6651} {"train_loss": -27.271961212158203, "global_step": 552045, "epoch": 6651} {"train_loss": -27.469635009765625, "global_step": 552046, "epoch": 6651} {"train_loss": -27.579877853393555, "global_step": 552047, "epoch": 6651} {"train_loss": -27.24091911315918, "global_step": 552048, "epoch": 6651} {"train_loss": -27.468530654907227, "global_step": 552049, "epoch": 6651} {"train_loss": -27.588748931884766, "global_step": 552050, "epoch": 6651} {"train_loss": -27.886096954345703, "global_step": 552051, "epoch": 6651} {"train_loss": -27.65614128112793, "global_step": 552052, "epoch": 6651} {"train_loss": -27.647611618041992, "global_step": 552053, "epoch": 6651} {"train_loss": -27.605670928955078, "global_step": 552054, "epoch": 6651} {"train_loss": -27.692459106445312, "global_step": 552055, "epoch": 6651} {"train_loss": -27.470067977905273, "global_step": 552056, "epoch": 6651} {"train_loss": -27.422657012939453, "global_step": 552057, "epoch": 6651} {"train_loss": -27.38443946838379, "global_step": 552058, "epoch": 6651} {"train_loss": -27.4713191986084, "global_step": 552059, "epoch": 6651} {"train_loss": -27.804594039916992, "global_step": 552060, "epoch": 6651} {"train_loss": -27.968358993530273, "global_step": 552061, "epoch": 6651} {"train_loss": -27.31424331665039, "global_step": 552062, "epoch": 6651} {"train_loss": -27.585586547851562, "global_step": 552063, "epoch": 6651} {"train_loss": -27.669843673706055, "global_step": 552064, "epoch": 6651} {"train_loss": -27.653614044189453, "global_step": 552065, "epoch": 6651} {"train_loss": -27.5035343170166, "global_step": 552066, "epoch": 6651} {"train_loss": -27.727325439453125, "global_step": 552067, "epoch": 6651} {"train_loss": -27.341718673706055, "global_step": 552068, "epoch": 6651} {"train_loss": -27.414432525634766, "global_step": 552069, "epoch": 6651} {"train_loss": -27.745670318603516, "global_step": 552070, "epoch": 6651} {"train_loss": -27.867841720581055, "global_step": 552071, "epoch": 6651} {"train_loss": -28.08988380432129, "global_step": 552072, "epoch": 6651} {"train_loss": -27.894128799438477, "global_step": 552073, "epoch": 6651} {"train_loss": -27.677474975585938, "global_step": 552074, "epoch": 6651} {"train_loss": -27.975025177001953, "global_step": 552075, "epoch": 6651} {"train_loss": -27.9389591217041, "global_step": 552076, "epoch": 6651} {"train_loss": -27.709583282470703, "global_step": 552077, "epoch": 6651} {"train_loss": -28.091577529907227, "global_step": 552078, "epoch": 6651} {"train_loss": -28.07341957092285, "global_step": 552079, "epoch": 6651} {"train_loss": -27.71058464050293, "global_step": 552080, "epoch": 6651} {"train_loss": -27.94944190979004, "global_step": 552081, "epoch": 6651} {"train_loss": -27.843618392944336, "global_step": 552082, "epoch": 6651} {"train_loss": -27.717931747436523, "global_step": 552083, "epoch": 6651} {"train_loss": -27.89448356628418, "global_step": 552084, "epoch": 6651} {"train_loss": -27.9913272857666, "global_step": 552085, "epoch": 6651} {"train_loss": -27.988195419311523, "global_step": 552086, "epoch": 6651} {"train_loss": -27.9034481048584, "global_step": 552087, "epoch": 6651} {"train_loss": -27.960264205932617, "global_step": 552088, "epoch": 6651} {"train_loss": -27.848648071289062, "global_step": 552089, "epoch": 6651} {"train_loss": -27.564451217651367, "global_step": 552090, "epoch": 6651} {"train_loss": -28.034870147705078, "global_step": 552091, "epoch": 6651} {"train_loss": -28.27467918395996, "global_step": 552092, "epoch": 6651} {"train_loss": -28.203794479370117, "global_step": 552093, "epoch": 6651} {"train_loss": -28.085620880126953, "global_step": 552094, "epoch": 6651} {"train_loss": -27.43207359313965, "global_step": 552095, "epoch": 6651} {"train_loss": -27.303319931030273, "global_step": 552096, "epoch": 6651} {"train_loss": -26.89691734313965, "global_step": 552097, "epoch": 6651} {"train_loss": -26.377241134643555, "global_step": 552098, "epoch": 6651} {"train_loss": -25.883087158203125, "global_step": 552099, "epoch": 6651} {"train_loss": -27.072900772094727, "global_step": 552100, "epoch": 6651} {"train_loss": -27.497907638549805, "global_step": 552101, "epoch": 6651} {"train_loss": -27.63343620300293, "global_step": 552102, "epoch": 6651} {"train_loss": -27.24439811706543, "global_step": 552103, "epoch": 6651} {"train_loss": -27.5646915435791, "global_step": 552104, "epoch": 6651} {"train_loss": -27.62909507751465, "global_step": 552105, "epoch": 6651} {"train_loss": -27.5015869140625, "global_step": 552106, "epoch": 6651} {"train_loss": -27.368356704711914, "global_step": 552107, "epoch": 6651} {"train_loss": -27.677356719970703, "global_step": 552108, "epoch": 6651} {"train_loss": -27.716144561767578, "global_step": 552109, "epoch": 6651} {"train_loss": -27.583404541015625, "global_step": 552110, "epoch": 6651} {"train_loss": -27.61277198791504, "global_step": 552111, "epoch": 6651} {"train_loss": -27.564355850219727, "global_step": 552112, "epoch": 6651} {"train_loss": -27.774099349975586, "global_step": 552113, "epoch": 6651} {"train_loss": -27.63795280456543, "global_step": 552114, "epoch": 6651} {"train_loss": -27.567313251725164, "global_step": 552115, "epoch": 6651, "val_loss": 6678909.0} {"train_loss": -27.519134521484375, "global_step": 552116, "epoch": 6652} {"train_loss": -27.315876007080078, "global_step": 552117, "epoch": 6652} {"train_loss": -27.290369033813477, "global_step": 552118, "epoch": 6652} {"train_loss": -26.6207218170166, "global_step": 552119, "epoch": 6652} {"train_loss": -27.368534088134766, "global_step": 552120, "epoch": 6652} {"train_loss": -26.798629760742188, "global_step": 552121, "epoch": 6652} {"train_loss": -27.129474639892578, "global_step": 552122, "epoch": 6652} {"train_loss": -27.258258819580078, "global_step": 552123, "epoch": 6652} {"train_loss": -27.401123046875, "global_step": 552124, "epoch": 6652} {"train_loss": -27.343835830688477, "global_step": 552125, "epoch": 6652} {"train_loss": -27.684894561767578, "global_step": 552126, "epoch": 6652} {"train_loss": -27.402158737182617, "global_step": 552127, "epoch": 6652} {"train_loss": -27.36395835876465, "global_step": 552128, "epoch": 6652} {"train_loss": -27.571552276611328, "global_step": 552129, "epoch": 6652} {"train_loss": -27.535968780517578, "global_step": 552130, "epoch": 6652} {"train_loss": -27.26090431213379, "global_step": 552131, "epoch": 6652} {"train_loss": -27.45966148376465, "global_step": 552132, "epoch": 6652} {"train_loss": -27.689594268798828, "global_step": 552133, "epoch": 6652} {"train_loss": -27.609411239624023, "global_step": 552134, "epoch": 6652} {"train_loss": -27.69209098815918, "global_step": 552135, "epoch": 6652} {"train_loss": -27.72796630859375, "global_step": 552136, "epoch": 6652} {"train_loss": -27.323591232299805, "global_step": 552137, "epoch": 6652} {"train_loss": -27.855224609375, "global_step": 552138, "epoch": 6652} {"train_loss": -27.859527587890625, "global_step": 552139, "epoch": 6652} {"train_loss": -27.8795166015625, "global_step": 552140, "epoch": 6652} {"train_loss": -28.06146240234375, "global_step": 552141, "epoch": 6652} {"train_loss": -27.978656768798828, "global_step": 552142, "epoch": 6652} {"train_loss": -27.497684478759766, "global_step": 552143, "epoch": 6652} {"train_loss": -28.087390899658203, "global_step": 552144, "epoch": 6652} {"train_loss": -28.10451316833496, "global_step": 552145, "epoch": 6652} {"train_loss": -27.85567283630371, "global_step": 552146, "epoch": 6652} {"train_loss": -28.202789306640625, "global_step": 552147, "epoch": 6652} {"train_loss": -27.7265567779541, "global_step": 552148, "epoch": 6652} {"train_loss": -27.926965713500977, "global_step": 552149, "epoch": 6652} {"train_loss": -27.818130493164062, "global_step": 552150, "epoch": 6652} {"train_loss": -28.095508575439453, "global_step": 552151, "epoch": 6652} {"train_loss": -28.07834815979004, "global_step": 552152, "epoch": 6652} {"train_loss": -27.9209041595459, "global_step": 552153, "epoch": 6652} {"train_loss": -27.79438591003418, "global_step": 552154, "epoch": 6652} {"train_loss": -27.7575626373291, "global_step": 552155, "epoch": 6652} {"train_loss": -27.776769638061523, "global_step": 552156, "epoch": 6652} {"train_loss": -27.977991104125977, "global_step": 552157, "epoch": 6652} {"train_loss": -27.9547176361084, "global_step": 552158, "epoch": 6652} {"train_loss": -27.985488891601562, "global_step": 552159, "epoch": 6652} {"train_loss": -28.282785415649414, "global_step": 552160, "epoch": 6652} {"train_loss": -28.02338981628418, "global_step": 552161, "epoch": 6652} {"train_loss": -27.683629989624023, "global_step": 552162, "epoch": 6652} {"train_loss": -28.137863159179688, "global_step": 552163, "epoch": 6652} {"train_loss": -27.930389404296875, "global_step": 552164, "epoch": 6652} {"train_loss": -27.974340438842773, "global_step": 552165, "epoch": 6652} {"train_loss": -27.730243682861328, "global_step": 552166, "epoch": 6652} {"train_loss": -28.132858276367188, "global_step": 552167, "epoch": 6652} {"train_loss": -27.677398681640625, "global_step": 552168, "epoch": 6652} {"train_loss": -27.950223922729492, "global_step": 552169, "epoch": 6652} {"train_loss": -28.146930694580078, "global_step": 552170, "epoch": 6652} {"train_loss": -27.954076766967773, "global_step": 552171, "epoch": 6652} {"train_loss": -28.11740493774414, "global_step": 552172, "epoch": 6652} {"train_loss": -28.154544830322266, "global_step": 552173, "epoch": 6652} {"train_loss": -27.9711971282959, "global_step": 552174, "epoch": 6652} {"train_loss": -27.682722091674805, "global_step": 552175, "epoch": 6652} {"train_loss": -27.80628776550293, "global_step": 552176, "epoch": 6652} {"train_loss": -27.859771728515625, "global_step": 552177, "epoch": 6652} {"train_loss": -27.963972091674805, "global_step": 552178, "epoch": 6652} {"train_loss": -27.706750869750977, "global_step": 552179, "epoch": 6652} {"train_loss": -27.621856689453125, "global_step": 552180, "epoch": 6652} {"train_loss": -27.480148315429688, "global_step": 552181, "epoch": 6652} {"train_loss": -27.612852096557617, "global_step": 552182, "epoch": 6652} {"train_loss": -27.259180068969727, "global_step": 552183, "epoch": 6652} {"train_loss": -27.34202003479004, "global_step": 552184, "epoch": 6652} {"train_loss": -27.4910945892334, "global_step": 552185, "epoch": 6652} {"train_loss": -27.842199325561523, "global_step": 552186, "epoch": 6652} {"train_loss": -27.685888290405273, "global_step": 552187, "epoch": 6652} {"train_loss": -27.56617546081543, "global_step": 552188, "epoch": 6652} {"train_loss": -27.56536865234375, "global_step": 552189, "epoch": 6652} {"train_loss": -27.778234481811523, "global_step": 552190, "epoch": 6652} {"train_loss": -27.5834903717041, "global_step": 552191, "epoch": 6652} {"train_loss": -27.886398315429688, "global_step": 552192, "epoch": 6652} {"train_loss": -28.219587326049805, "global_step": 552193, "epoch": 6652} {"train_loss": -27.650897979736328, "global_step": 552194, "epoch": 6652} {"train_loss": -27.754995346069336, "global_step": 552195, "epoch": 6652} {"train_loss": -27.67621421813965, "global_step": 552196, "epoch": 6652} {"train_loss": -27.48151969909668, "global_step": 552197, "epoch": 6652} {"train_loss": -27.73240319217544, "global_step": 552198, "epoch": 6652, "val_loss": 6653233.0} {"train_loss": -27.298511505126953, "global_step": 552199, "epoch": 6653} {"train_loss": -27.01443862915039, "global_step": 552200, "epoch": 6653} {"train_loss": -27.2202205657959, "global_step": 552201, "epoch": 6653} {"train_loss": -26.95538330078125, "global_step": 552202, "epoch": 6653} {"train_loss": -27.562314987182617, "global_step": 552203, "epoch": 6653} {"train_loss": -27.07899284362793, "global_step": 552204, "epoch": 6653} {"train_loss": -27.487552642822266, "global_step": 552205, "epoch": 6653} {"train_loss": -27.186071395874023, "global_step": 552206, "epoch": 6653} {"train_loss": -27.46552085876465, "global_step": 552207, "epoch": 6653} {"train_loss": -27.601484298706055, "global_step": 552208, "epoch": 6653} {"train_loss": -27.45379638671875, "global_step": 552209, "epoch": 6653} {"train_loss": -27.30059242248535, "global_step": 552210, "epoch": 6653} {"train_loss": -27.5275821685791, "global_step": 552211, "epoch": 6653} {"train_loss": -27.392148971557617, "global_step": 552212, "epoch": 6653} {"train_loss": -27.563251495361328, "global_step": 552213, "epoch": 6653} {"train_loss": -27.428815841674805, "global_step": 552214, "epoch": 6653} {"train_loss": -27.497726440429688, "global_step": 552215, "epoch": 6653} {"train_loss": -27.78627586364746, "global_step": 552216, "epoch": 6653} {"train_loss": -27.335676193237305, "global_step": 552217, "epoch": 6653} {"train_loss": -27.593957901000977, "global_step": 552218, "epoch": 6653} {"train_loss": -27.6641902923584, "global_step": 552219, "epoch": 6653} {"train_loss": -27.2842960357666, "global_step": 552220, "epoch": 6653} {"train_loss": -27.951269149780273, "global_step": 552221, "epoch": 6653} {"train_loss": -27.4781436920166, "global_step": 552222, "epoch": 6653} {"train_loss": -27.53131103515625, "global_step": 552223, "epoch": 6653} {"train_loss": -27.470361709594727, "global_step": 552224, "epoch": 6653} {"train_loss": -27.829809188842773, "global_step": 552225, "epoch": 6653} {"train_loss": -27.818622589111328, "global_step": 552226, "epoch": 6653} {"train_loss": -27.690170288085938, "global_step": 552227, "epoch": 6653} {"train_loss": -27.631689071655273, "global_step": 552228, "epoch": 6653} {"train_loss": -27.567846298217773, "global_step": 552229, "epoch": 6653} {"train_loss": -27.398488998413086, "global_step": 552230, "epoch": 6653} {"train_loss": -27.490758895874023, "global_step": 552231, "epoch": 6653} {"train_loss": -27.978595733642578, "global_step": 552232, "epoch": 6653} {"train_loss": -27.5715274810791, "global_step": 552233, "epoch": 6653} {"train_loss": -27.705854415893555, "global_step": 552234, "epoch": 6653} {"train_loss": -27.987415313720703, "global_step": 552235, "epoch": 6653} {"train_loss": -27.37338638305664, "global_step": 552236, "epoch": 6653} {"train_loss": -28.07297706604004, "global_step": 552237, "epoch": 6653} {"train_loss": -28.103986740112305, "global_step": 552238, "epoch": 6653} {"train_loss": -27.685989379882812, "global_step": 552239, "epoch": 6653} {"train_loss": -27.642786026000977, "global_step": 552240, "epoch": 6653} {"train_loss": -27.81281089782715, "global_step": 552241, "epoch": 6653} {"train_loss": -28.15054702758789, "global_step": 552242, "epoch": 6653} {"train_loss": -27.6353816986084, "global_step": 552243, "epoch": 6653} {"train_loss": -27.71868896484375, "global_step": 552244, "epoch": 6653} {"train_loss": -28.01090431213379, "global_step": 552245, "epoch": 6653} {"train_loss": -28.223302841186523, "global_step": 552246, "epoch": 6653} {"train_loss": -27.65850830078125, "global_step": 552247, "epoch": 6653} {"train_loss": -27.705739974975586, "global_step": 552248, "epoch": 6653} {"train_loss": -28.09576988220215, "global_step": 552249, "epoch": 6653} {"train_loss": -27.51767349243164, "global_step": 552250, "epoch": 6653} {"train_loss": -28.171140670776367, "global_step": 552251, "epoch": 6653} {"train_loss": -27.7178897857666, "global_step": 552252, "epoch": 6653} {"train_loss": -27.651336669921875, "global_step": 552253, "epoch": 6653} {"train_loss": -27.851160049438477, "global_step": 552254, "epoch": 6653} {"train_loss": -27.85529899597168, "global_step": 552255, "epoch": 6653} {"train_loss": -27.754499435424805, "global_step": 552256, "epoch": 6653} {"train_loss": -27.460988998413086, "global_step": 552257, "epoch": 6653} {"train_loss": -27.137378692626953, "global_step": 552258, "epoch": 6653} {"train_loss": -27.320600509643555, "global_step": 552259, "epoch": 6653} {"train_loss": -27.986230850219727, "global_step": 552260, "epoch": 6653} {"train_loss": -27.525400161743164, "global_step": 552261, "epoch": 6653} {"train_loss": -27.245147705078125, "global_step": 552262, "epoch": 6653} {"train_loss": -27.282516479492188, "global_step": 552263, "epoch": 6653} {"train_loss": -27.655454635620117, "global_step": 552264, "epoch": 6653} {"train_loss": -27.77190589904785, "global_step": 552265, "epoch": 6653} {"train_loss": -27.309646606445312, "global_step": 552266, "epoch": 6653} {"train_loss": -27.89434814453125, "global_step": 552267, "epoch": 6653} {"train_loss": -27.794179916381836, "global_step": 552268, "epoch": 6653} {"train_loss": -27.379165649414062, "global_step": 552269, "epoch": 6653} {"train_loss": -27.53564453125, "global_step": 552270, "epoch": 6653} {"train_loss": -27.712406158447266, "global_step": 552271, "epoch": 6653} {"train_loss": -27.579700469970703, "global_step": 552272, "epoch": 6653} {"train_loss": -27.8549747467041, "global_step": 552273, "epoch": 6653} {"train_loss": -27.68135643005371, "global_step": 552274, "epoch": 6653} {"train_loss": -27.9342041015625, "global_step": 552275, "epoch": 6653} {"train_loss": -27.654132843017578, "global_step": 552276, "epoch": 6653} {"train_loss": -27.84486198425293, "global_step": 552277, "epoch": 6653} {"train_loss": -28.043903350830078, "global_step": 552278, "epoch": 6653} {"train_loss": -27.701074600219727, "global_step": 552279, "epoch": 6653} {"train_loss": -28.000349044799805, "global_step": 552280, "epoch": 6653} {"train_loss": -27.61366212224386, "global_step": 552281, "epoch": 6653, "val_loss": 6641060.0} {"train_loss": -27.1324462890625, "global_step": 552282, "epoch": 6654} {"train_loss": -27.477767944335938, "global_step": 552283, "epoch": 6654} {"train_loss": -26.84528923034668, "global_step": 552284, "epoch": 6654} {"train_loss": -27.36958122253418, "global_step": 552285, "epoch": 6654} {"train_loss": -27.201704025268555, "global_step": 552286, "epoch": 6654} {"train_loss": -27.508737564086914, "global_step": 552287, "epoch": 6654} {"train_loss": -27.2088623046875, "global_step": 552288, "epoch": 6654} {"train_loss": -27.534610748291016, "global_step": 552289, "epoch": 6654} {"train_loss": -27.427701950073242, "global_step": 552290, "epoch": 6654} {"train_loss": -27.206329345703125, "global_step": 552291, "epoch": 6654} {"train_loss": -27.584341049194336, "global_step": 552292, "epoch": 6654} {"train_loss": -27.122669219970703, "global_step": 552293, "epoch": 6654} {"train_loss": -27.350317001342773, "global_step": 552294, "epoch": 6654} {"train_loss": -27.348102569580078, "global_step": 552295, "epoch": 6654} {"train_loss": -27.424413681030273, "global_step": 552296, "epoch": 6654} {"train_loss": -27.346654891967773, "global_step": 552297, "epoch": 6654} {"train_loss": -27.498279571533203, "global_step": 552298, "epoch": 6654} {"train_loss": -27.801660537719727, "global_step": 552299, "epoch": 6654} {"train_loss": -27.3477725982666, "global_step": 552300, "epoch": 6654} {"train_loss": -27.52418327331543, "global_step": 552301, "epoch": 6654} {"train_loss": -27.785303115844727, "global_step": 552302, "epoch": 6654} {"train_loss": -27.794031143188477, "global_step": 552303, "epoch": 6654} {"train_loss": -27.53448486328125, "global_step": 552304, "epoch": 6654} {"train_loss": -27.676130294799805, "global_step": 552305, "epoch": 6654} {"train_loss": -28.005970001220703, "global_step": 552306, "epoch": 6654} {"train_loss": -27.814542770385742, "global_step": 552307, "epoch": 6654} {"train_loss": -27.810327529907227, "global_step": 552308, "epoch": 6654} {"train_loss": -27.831567764282227, "global_step": 552309, "epoch": 6654} {"train_loss": -28.075658798217773, "global_step": 552310, "epoch": 6654} {"train_loss": -27.937040328979492, "global_step": 552311, "epoch": 6654} {"train_loss": -27.738983154296875, "global_step": 552312, "epoch": 6654} {"train_loss": -27.848691940307617, "global_step": 552313, "epoch": 6654} {"train_loss": -27.905996322631836, "global_step": 552314, "epoch": 6654} {"train_loss": -27.70100975036621, "global_step": 552315, "epoch": 6654} {"train_loss": -27.541311264038086, "global_step": 552316, "epoch": 6654} {"train_loss": -27.485702514648438, "global_step": 552317, "epoch": 6654} {"train_loss": -27.289148330688477, "global_step": 552318, "epoch": 6654} {"train_loss": -27.29347038269043, "global_step": 552319, "epoch": 6654} {"train_loss": -27.561542510986328, "global_step": 552320, "epoch": 6654} {"train_loss": -28.029645919799805, "global_step": 552321, "epoch": 6654} {"train_loss": -27.646848678588867, "global_step": 552322, "epoch": 6654} {"train_loss": -27.322702407836914, "global_step": 552323, "epoch": 6654} {"train_loss": -27.716629028320312, "global_step": 552324, "epoch": 6654} {"train_loss": -27.711837768554688, "global_step": 552325, "epoch": 6654} {"train_loss": -27.85806655883789, "global_step": 552326, "epoch": 6654} {"train_loss": -27.774396896362305, "global_step": 552327, "epoch": 6654} {"train_loss": -27.883813858032227, "global_step": 552328, "epoch": 6654} {"train_loss": -27.859113693237305, "global_step": 552329, "epoch": 6654} {"train_loss": -27.777036666870117, "global_step": 552330, "epoch": 6654} {"train_loss": -28.005573272705078, "global_step": 552331, "epoch": 6654} {"train_loss": -27.791025161743164, "global_step": 552332, "epoch": 6654} {"train_loss": -27.81298828125, "global_step": 552333, "epoch": 6654} {"train_loss": -27.652746200561523, "global_step": 552334, "epoch": 6654} {"train_loss": -27.4924373626709, "global_step": 552335, "epoch": 6654} {"train_loss": -27.3739070892334, "global_step": 552336, "epoch": 6654} {"train_loss": -28.049591064453125, "global_step": 552337, "epoch": 6654} {"train_loss": -27.68670082092285, "global_step": 552338, "epoch": 6654} {"train_loss": -27.8113956451416, "global_step": 552339, "epoch": 6654} {"train_loss": -27.938806533813477, "global_step": 552340, "epoch": 6654} {"train_loss": -27.635330200195312, "global_step": 552341, "epoch": 6654} {"train_loss": -27.896087646484375, "global_step": 552342, "epoch": 6654} {"train_loss": -27.770227432250977, "global_step": 552343, "epoch": 6654} {"train_loss": -27.74808120727539, "global_step": 552344, "epoch": 6654} {"train_loss": -27.597976684570312, "global_step": 552345, "epoch": 6654} {"train_loss": -27.521686553955078, "global_step": 552346, "epoch": 6654} {"train_loss": -27.659610748291016, "global_step": 552347, "epoch": 6654} {"train_loss": -27.675861358642578, "global_step": 552348, "epoch": 6654} {"train_loss": -27.763336181640625, "global_step": 552349, "epoch": 6654} {"train_loss": -28.030248641967773, "global_step": 552350, "epoch": 6654} {"train_loss": -28.177183151245117, "global_step": 552351, "epoch": 6654} {"train_loss": -27.92616081237793, "global_step": 552352, "epoch": 6654} {"train_loss": -27.62750244140625, "global_step": 552353, "epoch": 6654} {"train_loss": -27.860422134399414, "global_step": 552354, "epoch": 6654} {"train_loss": -27.83013343811035, "global_step": 552355, "epoch": 6654} {"train_loss": -27.401220321655273, "global_step": 552356, "epoch": 6654} {"train_loss": -27.740018844604492, "global_step": 552357, "epoch": 6654} {"train_loss": -27.294666290283203, "global_step": 552358, "epoch": 6654} {"train_loss": -27.302936553955078, "global_step": 552359, "epoch": 6654} {"train_loss": -27.47882652282715, "global_step": 552360, "epoch": 6654} {"train_loss": -27.6591854095459, "global_step": 552361, "epoch": 6654} {"train_loss": -28.087997436523438, "global_step": 552362, "epoch": 6654} {"train_loss": -27.6101131439209, "global_step": 552363, "epoch": 6654} {"train_loss": -27.6359760100583, "global_step": 552364, "epoch": 6654, "val_loss": 6658248.0} {"train_loss": -27.339330673217773, "global_step": 552365, "epoch": 6655} {"train_loss": -27.242673873901367, "global_step": 552366, "epoch": 6655} {"train_loss": -27.27679443359375, "global_step": 552367, "epoch": 6655} {"train_loss": -27.366321563720703, "global_step": 552368, "epoch": 6655} {"train_loss": -27.58070182800293, "global_step": 552369, "epoch": 6655} {"train_loss": -27.597620010375977, "global_step": 552370, "epoch": 6655} {"train_loss": -27.251996994018555, "global_step": 552371, "epoch": 6655} {"train_loss": -27.585025787353516, "global_step": 552372, "epoch": 6655} {"train_loss": -27.684310913085938, "global_step": 552373, "epoch": 6655} {"train_loss": -27.19585609436035, "global_step": 552374, "epoch": 6655} {"train_loss": -27.13698387145996, "global_step": 552375, "epoch": 6655} {"train_loss": -27.32563591003418, "global_step": 552376, "epoch": 6655} {"train_loss": -27.21006202697754, "global_step": 552377, "epoch": 6655} {"train_loss": -27.781116485595703, "global_step": 552378, "epoch": 6655} {"train_loss": -27.101333618164062, "global_step": 552379, "epoch": 6655} {"train_loss": -27.569660186767578, "global_step": 552380, "epoch": 6655} {"train_loss": -27.19353675842285, "global_step": 552381, "epoch": 6655} {"train_loss": -27.385190963745117, "global_step": 552382, "epoch": 6655} {"train_loss": -27.5601863861084, "global_step": 552383, "epoch": 6655} {"train_loss": -27.40924644470215, "global_step": 552384, "epoch": 6655} {"train_loss": -27.75282096862793, "global_step": 552385, "epoch": 6655} {"train_loss": -27.563568115234375, "global_step": 552386, "epoch": 6655} {"train_loss": -27.784101486206055, "global_step": 552387, "epoch": 6655} {"train_loss": -27.555959701538086, "global_step": 552388, "epoch": 6655} {"train_loss": -27.794586181640625, "global_step": 552389, "epoch": 6655} {"train_loss": -27.964155197143555, "global_step": 552390, "epoch": 6655} {"train_loss": -27.720386505126953, "global_step": 552391, "epoch": 6655} {"train_loss": -27.808258056640625, "global_step": 552392, "epoch": 6655} {"train_loss": -27.43463706970215, "global_step": 552393, "epoch": 6655} {"train_loss": -27.49104118347168, "global_step": 552394, "epoch": 6655} {"train_loss": -28.188098907470703, "global_step": 552395, "epoch": 6655} {"train_loss": -27.916879653930664, "global_step": 552396, "epoch": 6655} {"train_loss": -27.978897094726562, "global_step": 552397, "epoch": 6655} {"train_loss": -28.17376708984375, "global_step": 552398, "epoch": 6655} {"train_loss": -27.785730361938477, "global_step": 552399, "epoch": 6655} {"train_loss": -28.087324142456055, "global_step": 552400, "epoch": 6655} {"train_loss": -27.913848876953125, "global_step": 552401, "epoch": 6655} {"train_loss": -27.957538604736328, "global_step": 552402, "epoch": 6655} {"train_loss": -27.46571159362793, "global_step": 552403, "epoch": 6655} {"train_loss": -27.9288272857666, "global_step": 552404, "epoch": 6655} {"train_loss": -27.957975387573242, "global_step": 552405, "epoch": 6655} {"train_loss": -27.94083595275879, "global_step": 552406, "epoch": 6655} {"train_loss": -28.005781173706055, "global_step": 552407, "epoch": 6655} {"train_loss": -28.126392364501953, "global_step": 552408, "epoch": 6655} {"train_loss": -28.20478630065918, "global_step": 552409, "epoch": 6655} {"train_loss": -28.11215591430664, "global_step": 552410, "epoch": 6655} {"train_loss": -27.78449058532715, "global_step": 552411, "epoch": 6655} {"train_loss": -27.44940757751465, "global_step": 552412, "epoch": 6655} {"train_loss": -27.574934005737305, "global_step": 552413, "epoch": 6655} {"train_loss": -27.8511962890625, "global_step": 552414, "epoch": 6655} {"train_loss": -27.384790420532227, "global_step": 552415, "epoch": 6655} {"train_loss": -27.332250595092773, "global_step": 552416, "epoch": 6655} {"train_loss": -28.159748077392578, "global_step": 552417, "epoch": 6655} {"train_loss": -27.6250057220459, "global_step": 552418, "epoch": 6655} {"train_loss": -27.673954010009766, "global_step": 552419, "epoch": 6655} {"train_loss": -27.625537872314453, "global_step": 552420, "epoch": 6655} {"train_loss": -27.966909408569336, "global_step": 552421, "epoch": 6655} {"train_loss": -27.6552791595459, "global_step": 552422, "epoch": 6655} {"train_loss": -27.4998722076416, "global_step": 552423, "epoch": 6655} {"train_loss": -27.650775909423828, "global_step": 552424, "epoch": 6655} {"train_loss": -27.489013671875, "global_step": 552425, "epoch": 6655} {"train_loss": -27.5697078704834, "global_step": 552426, "epoch": 6655} {"train_loss": -27.616941452026367, "global_step": 552427, "epoch": 6655} {"train_loss": -27.76222038269043, "global_step": 552428, "epoch": 6655} {"train_loss": -27.699878692626953, "global_step": 552429, "epoch": 6655} {"train_loss": -27.668806076049805, "global_step": 552430, "epoch": 6655} {"train_loss": -27.59794044494629, "global_step": 552431, "epoch": 6655} {"train_loss": -27.537017822265625, "global_step": 552432, "epoch": 6655} {"train_loss": -27.18112564086914, "global_step": 552433, "epoch": 6655} {"train_loss": -26.561588287353516, "global_step": 552434, "epoch": 6655} {"train_loss": -26.353429794311523, "global_step": 552435, "epoch": 6655} {"train_loss": -26.96869468688965, "global_step": 552436, "epoch": 6655} {"train_loss": -27.458932876586914, "global_step": 552437, "epoch": 6655} {"train_loss": -27.35430335998535, "global_step": 552438, "epoch": 6655} {"train_loss": -27.158863067626953, "global_step": 552439, "epoch": 6655} {"train_loss": -27.41385269165039, "global_step": 552440, "epoch": 6655} {"train_loss": -27.1707706451416, "global_step": 552441, "epoch": 6655} {"train_loss": -27.742517471313477, "global_step": 552442, "epoch": 6655} {"train_loss": -27.516326904296875, "global_step": 552443, "epoch": 6655} {"train_loss": -27.481372833251953, "global_step": 552444, "epoch": 6655} {"train_loss": -27.518857955932617, "global_step": 552445, "epoch": 6655} {"train_loss": -27.923803329467773, "global_step": 552446, "epoch": 6655} {"train_loss": -27.573087416499494, "global_step": 552447, "epoch": 6655, "val_loss": 6566815.0} {"train_loss": -27.152877807617188, "global_step": 552448, "epoch": 6656} {"train_loss": -27.251800537109375, "global_step": 552449, "epoch": 6656} {"train_loss": -27.093976974487305, "global_step": 552450, "epoch": 6656} {"train_loss": -26.9741268157959, "global_step": 552451, "epoch": 6656} {"train_loss": -26.853260040283203, "global_step": 552452, "epoch": 6656} {"train_loss": -27.2217960357666, "global_step": 552453, "epoch": 6656} {"train_loss": -27.543659210205078, "global_step": 552454, "epoch": 6656} {"train_loss": -27.102827072143555, "global_step": 552455, "epoch": 6656} {"train_loss": -27.211414337158203, "global_step": 552456, "epoch": 6656} {"train_loss": -27.632282257080078, "global_step": 552457, "epoch": 6656} {"train_loss": -27.492475509643555, "global_step": 552458, "epoch": 6656} {"train_loss": -27.23333168029785, "global_step": 552459, "epoch": 6656} {"train_loss": -27.612049102783203, "global_step": 552460, "epoch": 6656} {"train_loss": -27.44362449645996, "global_step": 552461, "epoch": 6656} {"train_loss": -27.57037353515625, "global_step": 552462, "epoch": 6656} {"train_loss": -27.023340225219727, "global_step": 552463, "epoch": 6656} {"train_loss": -27.415206909179688, "global_step": 552464, "epoch": 6656} {"train_loss": -27.311527252197266, "global_step": 552465, "epoch": 6656} {"train_loss": -27.55292320251465, "global_step": 552466, "epoch": 6656} {"train_loss": -27.988788604736328, "global_step": 552467, "epoch": 6656} {"train_loss": -27.671918869018555, "global_step": 552468, "epoch": 6656} {"train_loss": -27.5787353515625, "global_step": 552469, "epoch": 6656} {"train_loss": -27.658872604370117, "global_step": 552470, "epoch": 6656} {"train_loss": -27.812047958374023, "global_step": 552471, "epoch": 6656} {"train_loss": -27.606124877929688, "global_step": 552472, "epoch": 6656} {"train_loss": -27.76856803894043, "global_step": 552473, "epoch": 6656} {"train_loss": -27.755390167236328, "global_step": 552474, "epoch": 6656} {"train_loss": -27.966238021850586, "global_step": 552475, "epoch": 6656} {"train_loss": -27.892684936523438, "global_step": 552476, "epoch": 6656} {"train_loss": -27.84808349609375, "global_step": 552477, "epoch": 6656} {"train_loss": -27.820117950439453, "global_step": 552478, "epoch": 6656} {"train_loss": -27.702213287353516, "global_step": 552479, "epoch": 6656} {"train_loss": -27.579975128173828, "global_step": 552480, "epoch": 6656} {"train_loss": -27.560815811157227, "global_step": 552481, "epoch": 6656} {"train_loss": -27.9603214263916, "global_step": 552482, "epoch": 6656} {"train_loss": -27.722875595092773, "global_step": 552483, "epoch": 6656} {"train_loss": -27.88384437561035, "global_step": 552484, "epoch": 6656} {"train_loss": -27.759668350219727, "global_step": 552485, "epoch": 6656} {"train_loss": -28.386157989501953, "global_step": 552486, "epoch": 6656} {"train_loss": -28.2624568939209, "global_step": 552487, "epoch": 6656} {"train_loss": -27.783472061157227, "global_step": 552488, "epoch": 6656} {"train_loss": -27.788604736328125, "global_step": 552489, "epoch": 6656} {"train_loss": -27.84917640686035, "global_step": 552490, "epoch": 6656} {"train_loss": -27.5672664642334, "global_step": 552491, "epoch": 6656} {"train_loss": -27.89325523376465, "global_step": 552492, "epoch": 6656} {"train_loss": -27.739978790283203, "global_step": 552493, "epoch": 6656} {"train_loss": -27.767438888549805, "global_step": 552494, "epoch": 6656} {"train_loss": -28.06165885925293, "global_step": 552495, "epoch": 6656} {"train_loss": -27.918277740478516, "global_step": 552496, "epoch": 6656} {"train_loss": -27.450510025024414, "global_step": 552497, "epoch": 6656} {"train_loss": -27.707672119140625, "global_step": 552498, "epoch": 6656} {"train_loss": -27.033111572265625, "global_step": 552499, "epoch": 6656} {"train_loss": -27.079370498657227, "global_step": 552500, "epoch": 6656} {"train_loss": -27.604272842407227, "global_step": 552501, "epoch": 6656} {"train_loss": -27.8640193939209, "global_step": 552502, "epoch": 6656} {"train_loss": -27.273468017578125, "global_step": 552503, "epoch": 6656} {"train_loss": -27.294599533081055, "global_step": 552504, "epoch": 6656} {"train_loss": -27.44679069519043, "global_step": 552505, "epoch": 6656} {"train_loss": -27.539098739624023, "global_step": 552506, "epoch": 6656} {"train_loss": -27.523359298706055, "global_step": 552507, "epoch": 6656} {"train_loss": -27.712121963500977, "global_step": 552508, "epoch": 6656} {"train_loss": -27.561552047729492, "global_step": 552509, "epoch": 6656} {"train_loss": -27.69093132019043, "global_step": 552510, "epoch": 6656} {"train_loss": -27.59326171875, "global_step": 552511, "epoch": 6656} {"train_loss": -27.723220825195312, "global_step": 552512, "epoch": 6656} {"train_loss": -27.84817886352539, "global_step": 552513, "epoch": 6656} {"train_loss": -27.468164443969727, "global_step": 552514, "epoch": 6656} {"train_loss": -28.019678115844727, "global_step": 552515, "epoch": 6656} {"train_loss": -27.526464462280273, "global_step": 552516, "epoch": 6656} {"train_loss": -27.9332332611084, "global_step": 552517, "epoch": 6656} {"train_loss": -28.1025447845459, "global_step": 552518, "epoch": 6656} {"train_loss": -27.6861629486084, "global_step": 552519, "epoch": 6656} {"train_loss": -27.8663272857666, "global_step": 552520, "epoch": 6656} {"train_loss": -27.652099609375, "global_step": 552521, "epoch": 6656} {"train_loss": -27.805648803710938, "global_step": 552522, "epoch": 6656} {"train_loss": -27.65154457092285, "global_step": 552523, "epoch": 6656} {"train_loss": -28.1682186126709, "global_step": 552524, "epoch": 6656} {"train_loss": -27.85342788696289, "global_step": 552525, "epoch": 6656} {"train_loss": -27.765722274780273, "global_step": 552526, "epoch": 6656} {"train_loss": -27.761280059814453, "global_step": 552527, "epoch": 6656} {"train_loss": -27.437885284423828, "global_step": 552528, "epoch": 6656} {"train_loss": -27.70843505859375, "global_step": 552529, "epoch": 6656} {"train_loss": -27.622957045773425, "global_step": 552530, "epoch": 6656, "val_loss": 6663985.5} {"train_loss": -27.262426376342773, "global_step": 552531, "epoch": 6657} {"train_loss": -27.0566349029541, "global_step": 552532, "epoch": 6657} {"train_loss": -26.553205490112305, "global_step": 552533, "epoch": 6657} {"train_loss": -26.07346534729004, "global_step": 552534, "epoch": 6657} {"train_loss": -25.988361358642578, "global_step": 552535, "epoch": 6657} {"train_loss": -27.009906768798828, "global_step": 552536, "epoch": 6657} {"train_loss": -27.435546875, "global_step": 552537, "epoch": 6657} {"train_loss": -26.96014404296875, "global_step": 552538, "epoch": 6657} {"train_loss": -27.231359481811523, "global_step": 552539, "epoch": 6657} {"train_loss": -26.58985710144043, "global_step": 552540, "epoch": 6657} {"train_loss": -27.00868034362793, "global_step": 552541, "epoch": 6657} {"train_loss": -27.163572311401367, "global_step": 552542, "epoch": 6657} {"train_loss": -27.460973739624023, "global_step": 552543, "epoch": 6657} {"train_loss": -27.38104248046875, "global_step": 552544, "epoch": 6657} {"train_loss": -27.52345085144043, "global_step": 552545, "epoch": 6657} {"train_loss": -27.646108627319336, "global_step": 552546, "epoch": 6657} {"train_loss": -27.3057918548584, "global_step": 552547, "epoch": 6657} {"train_loss": -27.542882919311523, "global_step": 552548, "epoch": 6657} {"train_loss": -27.423126220703125, "global_step": 552549, "epoch": 6657} {"train_loss": -27.576141357421875, "global_step": 552550, "epoch": 6657} {"train_loss": -27.765546798706055, "global_step": 552551, "epoch": 6657} {"train_loss": -27.521459579467773, "global_step": 552552, "epoch": 6657} {"train_loss": -27.713537216186523, "global_step": 552553, "epoch": 6657} {"train_loss": -27.89527702331543, "global_step": 552554, "epoch": 6657} {"train_loss": -27.476993560791016, "global_step": 552555, "epoch": 6657} {"train_loss": -27.696353912353516, "global_step": 552556, "epoch": 6657} {"train_loss": -27.3193416595459, "global_step": 552557, "epoch": 6657} {"train_loss": -27.78187370300293, "global_step": 552558, "epoch": 6657} {"train_loss": -27.875654220581055, "global_step": 552559, "epoch": 6657} {"train_loss": -28.03420066833496, "global_step": 552560, "epoch": 6657} {"train_loss": -27.837514877319336, "global_step": 552561, "epoch": 6657} {"train_loss": -27.767166137695312, "global_step": 552562, "epoch": 6657} {"train_loss": -27.779672622680664, "global_step": 552563, "epoch": 6657} {"train_loss": -27.841480255126953, "global_step": 552564, "epoch": 6657} {"train_loss": -27.62548828125, "global_step": 552565, "epoch": 6657} {"train_loss": -27.86952018737793, "global_step": 552566, "epoch": 6657} {"train_loss": -28.112140655517578, "global_step": 552567, "epoch": 6657} {"train_loss": -27.68722915649414, "global_step": 552568, "epoch": 6657} {"train_loss": -28.059326171875, "global_step": 552569, "epoch": 6657} {"train_loss": -27.85761070251465, "global_step": 552570, "epoch": 6657} {"train_loss": -27.53839683532715, "global_step": 552571, "epoch": 6657} {"train_loss": -27.91548728942871, "global_step": 552572, "epoch": 6657} {"train_loss": -27.399518966674805, "global_step": 552573, "epoch": 6657} {"train_loss": -27.389404296875, "global_step": 552574, "epoch": 6657} {"train_loss": -27.43828773498535, "global_step": 552575, "epoch": 6657} {"train_loss": -28.039352416992188, "global_step": 552576, "epoch": 6657} {"train_loss": -27.356733322143555, "global_step": 552577, "epoch": 6657} {"train_loss": -27.634063720703125, "global_step": 552578, "epoch": 6657} {"train_loss": -27.320615768432617, "global_step": 552579, "epoch": 6657} {"train_loss": -27.378311157226562, "global_step": 552580, "epoch": 6657} {"train_loss": -27.220495223999023, "global_step": 552581, "epoch": 6657} {"train_loss": -27.642812728881836, "global_step": 552582, "epoch": 6657} {"train_loss": -28.5395565032959, "global_step": 552583, "epoch": 6657} {"train_loss": -27.377273559570312, "global_step": 552584, "epoch": 6657} {"train_loss": -27.890995025634766, "global_step": 552585, "epoch": 6657} {"train_loss": -27.7087345123291, "global_step": 552586, "epoch": 6657} {"train_loss": -27.388280868530273, "global_step": 552587, "epoch": 6657} {"train_loss": -27.53577995300293, "global_step": 552588, "epoch": 6657} {"train_loss": -27.655288696289062, "global_step": 552589, "epoch": 6657} {"train_loss": -27.60989761352539, "global_step": 552590, "epoch": 6657} {"train_loss": -27.933013916015625, "global_step": 552591, "epoch": 6657} {"train_loss": -27.900693893432617, "global_step": 552592, "epoch": 6657} {"train_loss": -27.868200302124023, "global_step": 552593, "epoch": 6657} {"train_loss": -27.58033561706543, "global_step": 552594, "epoch": 6657} {"train_loss": -27.87289810180664, "global_step": 552595, "epoch": 6657} {"train_loss": -27.495386123657227, "global_step": 552596, "epoch": 6657} {"train_loss": -27.60968589782715, "global_step": 552597, "epoch": 6657} {"train_loss": -27.71803092956543, "global_step": 552598, "epoch": 6657} {"train_loss": -27.958709716796875, "global_step": 552599, "epoch": 6657} {"train_loss": -27.74141502380371, "global_step": 552600, "epoch": 6657} {"train_loss": -27.822559356689453, "global_step": 552601, "epoch": 6657} {"train_loss": -27.834487915039062, "global_step": 552602, "epoch": 6657} {"train_loss": -28.118600845336914, "global_step": 552603, "epoch": 6657} {"train_loss": -27.78725242614746, "global_step": 552604, "epoch": 6657} {"train_loss": -27.734472274780273, "global_step": 552605, "epoch": 6657} {"train_loss": -28.248703002929688, "global_step": 552606, "epoch": 6657} {"train_loss": -27.641803741455078, "global_step": 552607, "epoch": 6657} {"train_loss": -27.71522331237793, "global_step": 552608, "epoch": 6657} {"train_loss": -27.832101821899414, "global_step": 552609, "epoch": 6657} {"train_loss": -27.668115615844727, "global_step": 552610, "epoch": 6657} {"train_loss": -27.666305541992188, "global_step": 552611, "epoch": 6657} {"train_loss": -27.18216896057129, "global_step": 552612, "epoch": 6657} {"train_loss": -27.565664705023707, "global_step": 552613, "epoch": 6657, "val_loss": 6673482.0} {"train_loss": -27.702871322631836, "global_step": 552614, "epoch": 6658} {"train_loss": -26.461652755737305, "global_step": 552615, "epoch": 6658} {"train_loss": -26.76239013671875, "global_step": 552616, "epoch": 6658} {"train_loss": -27.194799423217773, "global_step": 552617, "epoch": 6658} {"train_loss": -26.11516761779785, "global_step": 552618, "epoch": 6658} {"train_loss": -27.017765045166016, "global_step": 552619, "epoch": 6658} {"train_loss": -26.7865047454834, "global_step": 552620, "epoch": 6658} {"train_loss": -26.5943603515625, "global_step": 552621, "epoch": 6658} {"train_loss": -26.539737701416016, "global_step": 552622, "epoch": 6658} {"train_loss": -26.9129581451416, "global_step": 552623, "epoch": 6658} {"train_loss": -27.005945205688477, "global_step": 552624, "epoch": 6658} {"train_loss": -27.20184326171875, "global_step": 552625, "epoch": 6658} {"train_loss": -27.409835815429688, "global_step": 552626, "epoch": 6658} {"train_loss": -27.3538761138916, "global_step": 552627, "epoch": 6658} {"train_loss": -26.906024932861328, "global_step": 552628, "epoch": 6658} {"train_loss": -27.398605346679688, "global_step": 552629, "epoch": 6658} {"train_loss": -26.852014541625977, "global_step": 552630, "epoch": 6658} {"train_loss": -27.39800453186035, "global_step": 552631, "epoch": 6658} {"train_loss": -26.9555721282959, "global_step": 552632, "epoch": 6658} {"train_loss": -27.154775619506836, "global_step": 552633, "epoch": 6658} {"train_loss": -26.855087280273438, "global_step": 552634, "epoch": 6658} {"train_loss": -27.0765380859375, "global_step": 552635, "epoch": 6658} {"train_loss": -27.584339141845703, "global_step": 552636, "epoch": 6658} {"train_loss": -27.402973175048828, "global_step": 552637, "epoch": 6658} {"train_loss": -27.221418380737305, "global_step": 552638, "epoch": 6658} {"train_loss": -27.765745162963867, "global_step": 552639, "epoch": 6658} {"train_loss": -27.752416610717773, "global_step": 552640, "epoch": 6658} {"train_loss": -27.61260986328125, "global_step": 552641, "epoch": 6658} {"train_loss": -27.3709716796875, "global_step": 552642, "epoch": 6658} {"train_loss": -27.522314071655273, "global_step": 552643, "epoch": 6658} {"train_loss": -27.20111083984375, "global_step": 552644, "epoch": 6658} {"train_loss": -27.68332862854004, "global_step": 552645, "epoch": 6658} {"train_loss": -27.48712730407715, "global_step": 552646, "epoch": 6658} {"train_loss": -27.662572860717773, "global_step": 552647, "epoch": 6658} {"train_loss": -27.73386001586914, "global_step": 552648, "epoch": 6658} {"train_loss": -27.77544593811035, "global_step": 552649, "epoch": 6658} {"train_loss": -27.454303741455078, "global_step": 552650, "epoch": 6658} {"train_loss": -27.797880172729492, "global_step": 552651, "epoch": 6658} {"train_loss": -27.68869400024414, "global_step": 552652, "epoch": 6658} {"train_loss": -27.495548248291016, "global_step": 552653, "epoch": 6658} {"train_loss": -27.287622451782227, "global_step": 552654, "epoch": 6658} {"train_loss": -27.577322006225586, "global_step": 552655, "epoch": 6658} {"train_loss": -27.904468536376953, "global_step": 552656, "epoch": 6658} {"train_loss": -27.101287841796875, "global_step": 552657, "epoch": 6658} {"train_loss": -27.925352096557617, "global_step": 552658, "epoch": 6658} {"train_loss": -27.757307052612305, "global_step": 552659, "epoch": 6658} {"train_loss": -27.441198348999023, "global_step": 552660, "epoch": 6658} {"train_loss": -27.0600528717041, "global_step": 552661, "epoch": 6658} {"train_loss": -27.862268447875977, "global_step": 552662, "epoch": 6658} {"train_loss": -27.712890625, "global_step": 552663, "epoch": 6658} {"train_loss": -27.318510055541992, "global_step": 552664, "epoch": 6658} {"train_loss": -27.416242599487305, "global_step": 552665, "epoch": 6658} {"train_loss": -27.63678550720215, "global_step": 552666, "epoch": 6658} {"train_loss": -27.425424575805664, "global_step": 552667, "epoch": 6658} {"train_loss": -27.37507438659668, "global_step": 552668, "epoch": 6658} {"train_loss": -27.09307861328125, "global_step": 552669, "epoch": 6658} {"train_loss": -27.765125274658203, "global_step": 552670, "epoch": 6658} {"train_loss": -27.597980499267578, "global_step": 552671, "epoch": 6658} {"train_loss": -27.032180786132812, "global_step": 552672, "epoch": 6658} {"train_loss": -27.737646102905273, "global_step": 552673, "epoch": 6658} {"train_loss": -27.430362701416016, "global_step": 552674, "epoch": 6658} {"train_loss": -27.78736686706543, "global_step": 552675, "epoch": 6658} {"train_loss": -27.877172470092773, "global_step": 552676, "epoch": 6658} {"train_loss": -28.016315460205078, "global_step": 552677, "epoch": 6658} {"train_loss": -27.8629207611084, "global_step": 552678, "epoch": 6658} {"train_loss": -27.725507736206055, "global_step": 552679, "epoch": 6658} {"train_loss": -27.916385650634766, "global_step": 552680, "epoch": 6658} {"train_loss": -27.937265396118164, "global_step": 552681, "epoch": 6658} {"train_loss": -27.82480812072754, "global_step": 552682, "epoch": 6658} {"train_loss": -27.89298439025879, "global_step": 552683, "epoch": 6658} {"train_loss": -28.02566909790039, "global_step": 552684, "epoch": 6658} {"train_loss": -28.141401290893555, "global_step": 552685, "epoch": 6658} {"train_loss": -27.76564598083496, "global_step": 552686, "epoch": 6658} {"train_loss": -27.571813583374023, "global_step": 552687, "epoch": 6658} {"train_loss": -27.955347061157227, "global_step": 552688, "epoch": 6658} {"train_loss": -27.709333419799805, "global_step": 552689, "epoch": 6658} {"train_loss": -27.796255111694336, "global_step": 552690, "epoch": 6658} {"train_loss": -27.631086349487305, "global_step": 552691, "epoch": 6658} {"train_loss": -27.817346572875977, "global_step": 552692, "epoch": 6658} {"train_loss": -28.14236831665039, "global_step": 552693, "epoch": 6658} {"train_loss": -27.744840621948242, "global_step": 552694, "epoch": 6658} {"train_loss": -28.262155532836914, "global_step": 552695, "epoch": 6658} {"train_loss": -27.4855464108019, "global_step": 552696, "epoch": 6658, "val_loss": 6693568.5} {"train_loss": -27.141036987304688, "global_step": 552697, "epoch": 6659} {"train_loss": -26.81781005859375, "global_step": 552698, "epoch": 6659} {"train_loss": -25.74237060546875, "global_step": 552699, "epoch": 6659} {"train_loss": -25.231399536132812, "global_step": 552700, "epoch": 6659} {"train_loss": -26.17439842224121, "global_step": 552701, "epoch": 6659} {"train_loss": -26.806182861328125, "global_step": 552702, "epoch": 6659} {"train_loss": -25.961896896362305, "global_step": 552703, "epoch": 6659} {"train_loss": -26.93048095703125, "global_step": 552704, "epoch": 6659} {"train_loss": -26.32386589050293, "global_step": 552705, "epoch": 6659} {"train_loss": -27.40301513671875, "global_step": 552706, "epoch": 6659} {"train_loss": -26.6646671295166, "global_step": 552707, "epoch": 6659} {"train_loss": -26.98065185546875, "global_step": 552708, "epoch": 6659} {"train_loss": -26.903257369995117, "global_step": 552709, "epoch": 6659} {"train_loss": -27.36029624938965, "global_step": 552710, "epoch": 6659} {"train_loss": -27.1726131439209, "global_step": 552711, "epoch": 6659} {"train_loss": -27.651044845581055, "global_step": 552712, "epoch": 6659} {"train_loss": -26.918350219726562, "global_step": 552713, "epoch": 6659} {"train_loss": -27.306379318237305, "global_step": 552714, "epoch": 6659} {"train_loss": -27.380979537963867, "global_step": 552715, "epoch": 6659} {"train_loss": -27.51079750061035, "global_step": 552716, "epoch": 6659} {"train_loss": -27.23794937133789, "global_step": 552717, "epoch": 6659} {"train_loss": -27.57440185546875, "global_step": 552718, "epoch": 6659} {"train_loss": -27.294891357421875, "global_step": 552719, "epoch": 6659} {"train_loss": -27.56165885925293, "global_step": 552720, "epoch": 6659} {"train_loss": -27.293249130249023, "global_step": 552721, "epoch": 6659} {"train_loss": -27.675928115844727, "global_step": 552722, "epoch": 6659} {"train_loss": -27.41763687133789, "global_step": 552723, "epoch": 6659} {"train_loss": -27.785669326782227, "global_step": 552724, "epoch": 6659} {"train_loss": -27.449853897094727, "global_step": 552725, "epoch": 6659} {"train_loss": -27.556360244750977, "global_step": 552726, "epoch": 6659} {"train_loss": -27.444116592407227, "global_step": 552727, "epoch": 6659} {"train_loss": -27.563989639282227, "global_step": 552728, "epoch": 6659} {"train_loss": -27.791522979736328, "global_step": 552729, "epoch": 6659} {"train_loss": -27.393524169921875, "global_step": 552730, "epoch": 6659} {"train_loss": -27.47810173034668, "global_step": 552731, "epoch": 6659} {"train_loss": -27.879230499267578, "global_step": 552732, "epoch": 6659} {"train_loss": -27.477493286132812, "global_step": 552733, "epoch": 6659} {"train_loss": -27.797704696655273, "global_step": 552734, "epoch": 6659} {"train_loss": -27.960983276367188, "global_step": 552735, "epoch": 6659} {"train_loss": -27.581806182861328, "global_step": 552736, "epoch": 6659} {"train_loss": -28.067840576171875, "global_step": 552737, "epoch": 6659} {"train_loss": -27.869794845581055, "global_step": 552738, "epoch": 6659} {"train_loss": -27.609363555908203, "global_step": 552739, "epoch": 6659} {"train_loss": -27.879169464111328, "global_step": 552740, "epoch": 6659} {"train_loss": -27.89727783203125, "global_step": 552741, "epoch": 6659} {"train_loss": -27.665246963500977, "global_step": 552742, "epoch": 6659} {"train_loss": -27.948429107666016, "global_step": 552743, "epoch": 6659} {"train_loss": -27.919382095336914, "global_step": 552744, "epoch": 6659} {"train_loss": -28.086023330688477, "global_step": 552745, "epoch": 6659} {"train_loss": -27.80924415588379, "global_step": 552746, "epoch": 6659} {"train_loss": -27.92069435119629, "global_step": 552747, "epoch": 6659} {"train_loss": -27.85328483581543, "global_step": 552748, "epoch": 6659} {"train_loss": -28.15577507019043, "global_step": 552749, "epoch": 6659} {"train_loss": -27.825632095336914, "global_step": 552750, "epoch": 6659} {"train_loss": -27.564804077148438, "global_step": 552751, "epoch": 6659} {"train_loss": -27.817941665649414, "global_step": 552752, "epoch": 6659} {"train_loss": -27.9466552734375, "global_step": 552753, "epoch": 6659} {"train_loss": -28.045700073242188, "global_step": 552754, "epoch": 6659} {"train_loss": -27.599124908447266, "global_step": 552755, "epoch": 6659} {"train_loss": -27.513126373291016, "global_step": 552756, "epoch": 6659} {"train_loss": -27.619863510131836, "global_step": 552757, "epoch": 6659} {"train_loss": -28.035573959350586, "global_step": 552758, "epoch": 6659} {"train_loss": -27.811487197875977, "global_step": 552759, "epoch": 6659} {"train_loss": -27.824756622314453, "global_step": 552760, "epoch": 6659} {"train_loss": -28.125354766845703, "global_step": 552761, "epoch": 6659} {"train_loss": -27.6646785736084, "global_step": 552762, "epoch": 6659} {"train_loss": -27.451879501342773, "global_step": 552763, "epoch": 6659} {"train_loss": -28.006439208984375, "global_step": 552764, "epoch": 6659} {"train_loss": -28.043493270874023, "global_step": 552765, "epoch": 6659} {"train_loss": -27.72027015686035, "global_step": 552766, "epoch": 6659} {"train_loss": -27.98554801940918, "global_step": 552767, "epoch": 6659} {"train_loss": -27.74798583984375, "global_step": 552768, "epoch": 6659} {"train_loss": -27.372894287109375, "global_step": 552769, "epoch": 6659} {"train_loss": -27.491437911987305, "global_step": 552770, "epoch": 6659} {"train_loss": -27.782773971557617, "global_step": 552771, "epoch": 6659} {"train_loss": -27.787229537963867, "global_step": 552772, "epoch": 6659} {"train_loss": -27.51897621154785, "global_step": 552773, "epoch": 6659} {"train_loss": -27.870813369750977, "global_step": 552774, "epoch": 6659} {"train_loss": -28.24469566345215, "global_step": 552775, "epoch": 6659} {"train_loss": -27.74468421936035, "global_step": 552776, "epoch": 6659} {"train_loss": -27.592212677001953, "global_step": 552777, "epoch": 6659} {"train_loss": -27.857257843017578, "global_step": 552778, "epoch": 6659} {"train_loss": -27.511182991855115, "global_step": 552779, "epoch": 6659, "val_loss": 6665259.0} {"train_loss": -27.109378814697266, "global_step": 552780, "epoch": 6660} {"train_loss": -27.226476669311523, "global_step": 552781, "epoch": 6660} {"train_loss": -27.4025936126709, "global_step": 552782, "epoch": 6660} {"train_loss": -27.27335548400879, "global_step": 552783, "epoch": 6660} {"train_loss": -27.828723907470703, "global_step": 552784, "epoch": 6660} {"train_loss": -27.264097213745117, "global_step": 552785, "epoch": 6660} {"train_loss": -27.497943878173828, "global_step": 552786, "epoch": 6660} {"train_loss": -27.393476486206055, "global_step": 552787, "epoch": 6660} {"train_loss": -27.3443546295166, "global_step": 552788, "epoch": 6660} {"train_loss": -27.684064865112305, "global_step": 552789, "epoch": 6660} {"train_loss": -27.1583309173584, "global_step": 552790, "epoch": 6660} {"train_loss": -27.422407150268555, "global_step": 552791, "epoch": 6660} {"train_loss": -27.293792724609375, "global_step": 552792, "epoch": 6660} {"train_loss": -27.881086349487305, "global_step": 552793, "epoch": 6660} {"train_loss": -27.621137619018555, "global_step": 552794, "epoch": 6660} {"train_loss": -27.626422882080078, "global_step": 552795, "epoch": 6660} {"train_loss": -27.280073165893555, "global_step": 552796, "epoch": 6660} {"train_loss": -27.760961532592773, "global_step": 552797, "epoch": 6660} {"train_loss": -27.646366119384766, "global_step": 552798, "epoch": 6660} {"train_loss": -27.907413482666016, "global_step": 552799, "epoch": 6660} {"train_loss": -27.601978302001953, "global_step": 552800, "epoch": 6660} {"train_loss": -27.748294830322266, "global_step": 552801, "epoch": 6660} {"train_loss": -27.797794342041016, "global_step": 552802, "epoch": 6660} {"train_loss": -27.733007431030273, "global_step": 552803, "epoch": 6660} {"train_loss": -27.784332275390625, "global_step": 552804, "epoch": 6660} {"train_loss": -27.511905670166016, "global_step": 552805, "epoch": 6660} {"train_loss": -27.984228134155273, "global_step": 552806, "epoch": 6660} {"train_loss": -27.850723266601562, "global_step": 552807, "epoch": 6660} {"train_loss": -27.81428337097168, "global_step": 552808, "epoch": 6660} {"train_loss": -27.905675888061523, "global_step": 552809, "epoch": 6660} {"train_loss": -27.961383819580078, "global_step": 552810, "epoch": 6660} {"train_loss": -27.75758171081543, "global_step": 552811, "epoch": 6660} {"train_loss": -27.99390983581543, "global_step": 552812, "epoch": 6660} {"train_loss": -27.802783966064453, "global_step": 552813, "epoch": 6660} {"train_loss": -27.557531356811523, "global_step": 552814, "epoch": 6660} {"train_loss": -28.16290855407715, "global_step": 552815, "epoch": 6660} {"train_loss": -28.01895523071289, "global_step": 552816, "epoch": 6660} {"train_loss": -27.66753578186035, "global_step": 552817, "epoch": 6660} {"train_loss": -27.719196319580078, "global_step": 552818, "epoch": 6660} {"train_loss": -27.924274444580078, "global_step": 552819, "epoch": 6660} {"train_loss": -27.891773223876953, "global_step": 552820, "epoch": 6660} {"train_loss": -27.86380386352539, "global_step": 552821, "epoch": 6660} {"train_loss": -27.52483558654785, "global_step": 552822, "epoch": 6660} {"train_loss": -27.91560173034668, "global_step": 552823, "epoch": 6660} {"train_loss": -28.027862548828125, "global_step": 552824, "epoch": 6660} {"train_loss": -28.011709213256836, "global_step": 552825, "epoch": 6660} {"train_loss": -27.977888107299805, "global_step": 552826, "epoch": 6660} {"train_loss": -27.841949462890625, "global_step": 552827, "epoch": 6660} {"train_loss": -28.300073623657227, "global_step": 552828, "epoch": 6660} {"train_loss": -27.707788467407227, "global_step": 552829, "epoch": 6660} {"train_loss": -28.104867935180664, "global_step": 552830, "epoch": 6660} {"train_loss": -27.532209396362305, "global_step": 552831, "epoch": 6660} {"train_loss": -27.8656005859375, "global_step": 552832, "epoch": 6660} {"train_loss": -27.32683753967285, "global_step": 552833, "epoch": 6660} {"train_loss": -27.748565673828125, "global_step": 552834, "epoch": 6660} {"train_loss": -27.635812759399414, "global_step": 552835, "epoch": 6660} {"train_loss": -28.1024169921875, "global_step": 552836, "epoch": 6660} {"train_loss": -27.54237937927246, "global_step": 552837, "epoch": 6660} {"train_loss": -27.3244686126709, "global_step": 552838, "epoch": 6660} {"train_loss": -26.904678344726562, "global_step": 552839, "epoch": 6660} {"train_loss": -27.524005889892578, "global_step": 552840, "epoch": 6660} {"train_loss": -27.794204711914062, "global_step": 552841, "epoch": 6660} {"train_loss": -27.361209869384766, "global_step": 552842, "epoch": 6660} {"train_loss": -27.128192901611328, "global_step": 552843, "epoch": 6660} {"train_loss": -27.675006866455078, "global_step": 552844, "epoch": 6660} {"train_loss": -27.8721866607666, "global_step": 552845, "epoch": 6660} {"train_loss": -27.605792999267578, "global_step": 552846, "epoch": 6660} {"train_loss": -27.03348731994629, "global_step": 552847, "epoch": 6660} {"train_loss": -27.392419815063477, "global_step": 552848, "epoch": 6660} {"train_loss": -27.754602432250977, "global_step": 552849, "epoch": 6660} {"train_loss": -27.78761863708496, "global_step": 552850, "epoch": 6660} {"train_loss": -27.46661376953125, "global_step": 552851, "epoch": 6660} {"train_loss": -27.7769718170166, "global_step": 552852, "epoch": 6660} {"train_loss": -27.87689208984375, "global_step": 552853, "epoch": 6660} {"train_loss": -27.67032814025879, "global_step": 552854, "epoch": 6660} {"train_loss": -27.509235382080078, "global_step": 552855, "epoch": 6660} {"train_loss": -27.70572280883789, "global_step": 552856, "epoch": 6660} {"train_loss": -27.713729858398438, "global_step": 552857, "epoch": 6660} {"train_loss": -27.782928466796875, "global_step": 552858, "epoch": 6660} {"train_loss": -27.998371124267578, "global_step": 552859, "epoch": 6660} {"train_loss": -27.901220321655273, "global_step": 552860, "epoch": 6660} {"train_loss": -28.07623863220215, "global_step": 552861, "epoch": 6660} {"train_loss": -27.68865302671869, "global_step": 552862, "epoch": 6660, "val_loss": 6630374.5} {"train_loss": -27.5604248046875, "global_step": 552863, "epoch": 6661} {"train_loss": -27.558454513549805, "global_step": 552864, "epoch": 6661} {"train_loss": -27.864973068237305, "global_step": 552865, "epoch": 6661} {"train_loss": -27.210407257080078, "global_step": 552866, "epoch": 6661} {"train_loss": -27.39777183532715, "global_step": 552867, "epoch": 6661} {"train_loss": -27.714059829711914, "global_step": 552868, "epoch": 6661} {"train_loss": -27.393890380859375, "global_step": 552869, "epoch": 6661} {"train_loss": -27.37862205505371, "global_step": 552870, "epoch": 6661} {"train_loss": -27.73370933532715, "global_step": 552871, "epoch": 6661} {"train_loss": -27.64796257019043, "global_step": 552872, "epoch": 6661} {"train_loss": -27.497222900390625, "global_step": 552873, "epoch": 6661} {"train_loss": -27.920827865600586, "global_step": 552874, "epoch": 6661} {"train_loss": -27.85344886779785, "global_step": 552875, "epoch": 6661} {"train_loss": -27.958240509033203, "global_step": 552876, "epoch": 6661} {"train_loss": -27.416595458984375, "global_step": 552877, "epoch": 6661} {"train_loss": -27.467939376831055, "global_step": 552878, "epoch": 6661} {"train_loss": -27.559911727905273, "global_step": 552879, "epoch": 6661} {"train_loss": -27.72712516784668, "global_step": 552880, "epoch": 6661} {"train_loss": -27.93364906311035, "global_step": 552881, "epoch": 6661} {"train_loss": -27.415435791015625, "global_step": 552882, "epoch": 6661} {"train_loss": -27.3242130279541, "global_step": 552883, "epoch": 6661} {"train_loss": -27.5827579498291, "global_step": 552884, "epoch": 6661} {"train_loss": -27.612207412719727, "global_step": 552885, "epoch": 6661} {"train_loss": -27.648839950561523, "global_step": 552886, "epoch": 6661} {"train_loss": -27.7329044342041, "global_step": 552887, "epoch": 6661} {"train_loss": -27.873037338256836, "global_step": 552888, "epoch": 6661} {"train_loss": -28.0332088470459, "global_step": 552889, "epoch": 6661} {"train_loss": -27.75929832458496, "global_step": 552890, "epoch": 6661} {"train_loss": -27.86563491821289, "global_step": 552891, "epoch": 6661} {"train_loss": -27.767431259155273, "global_step": 552892, "epoch": 6661} {"train_loss": -27.772567749023438, "global_step": 552893, "epoch": 6661} {"train_loss": -27.648725509643555, "global_step": 552894, "epoch": 6661} {"train_loss": -27.573225021362305, "global_step": 552895, "epoch": 6661} {"train_loss": -27.798431396484375, "global_step": 552896, "epoch": 6661} {"train_loss": -27.560150146484375, "global_step": 552897, "epoch": 6661} {"train_loss": -27.59521484375, "global_step": 552898, "epoch": 6661} {"train_loss": -27.888208389282227, "global_step": 552899, "epoch": 6661} {"train_loss": -27.887348175048828, "global_step": 552900, "epoch": 6661} {"train_loss": -27.769323348999023, "global_step": 552901, "epoch": 6661} {"train_loss": -27.641462326049805, "global_step": 552902, "epoch": 6661} {"train_loss": -27.747440338134766, "global_step": 552903, "epoch": 6661} {"train_loss": -27.70697021484375, "global_step": 552904, "epoch": 6661} {"train_loss": -28.031036376953125, "global_step": 552905, "epoch": 6661} {"train_loss": -27.85712242126465, "global_step": 552906, "epoch": 6661} {"train_loss": -27.923078536987305, "global_step": 552907, "epoch": 6661} {"train_loss": -27.922155380249023, "global_step": 552908, "epoch": 6661} {"train_loss": -28.25323486328125, "global_step": 552909, "epoch": 6661} {"train_loss": -27.852148056030273, "global_step": 552910, "epoch": 6661} {"train_loss": -27.782079696655273, "global_step": 552911, "epoch": 6661} {"train_loss": -28.305652618408203, "global_step": 552912, "epoch": 6661} {"train_loss": -27.686965942382812, "global_step": 552913, "epoch": 6661} {"train_loss": -27.8071231842041, "global_step": 552914, "epoch": 6661} {"train_loss": -27.699432373046875, "global_step": 552915, "epoch": 6661} {"train_loss": -27.648096084594727, "global_step": 552916, "epoch": 6661} {"train_loss": -27.72956657409668, "global_step": 552917, "epoch": 6661} {"train_loss": -27.80742835998535, "global_step": 552918, "epoch": 6661} {"train_loss": -28.063032150268555, "global_step": 552919, "epoch": 6661} {"train_loss": -27.718856811523438, "global_step": 552920, "epoch": 6661} {"train_loss": -27.412281036376953, "global_step": 552921, "epoch": 6661} {"train_loss": -27.3409366607666, "global_step": 552922, "epoch": 6661} {"train_loss": -27.506555557250977, "global_step": 552923, "epoch": 6661} {"train_loss": -28.331546783447266, "global_step": 552924, "epoch": 6661} {"train_loss": -27.369474411010742, "global_step": 552925, "epoch": 6661} {"train_loss": -27.612548828125, "global_step": 552926, "epoch": 6661} {"train_loss": -27.54011344909668, "global_step": 552927, "epoch": 6661} {"train_loss": -27.842222213745117, "global_step": 552928, "epoch": 6661} {"train_loss": -27.20068359375, "global_step": 552929, "epoch": 6661} {"train_loss": -27.388029098510742, "global_step": 552930, "epoch": 6661} {"train_loss": -27.5330753326416, "global_step": 552931, "epoch": 6661} {"train_loss": -27.458845138549805, "global_step": 552932, "epoch": 6661} {"train_loss": -27.354328155517578, "global_step": 552933, "epoch": 6661} {"train_loss": -27.42024040222168, "global_step": 552934, "epoch": 6661} {"train_loss": -27.620075225830078, "global_step": 552935, "epoch": 6661} {"train_loss": -27.434040069580078, "global_step": 552936, "epoch": 6661} {"train_loss": -27.832996368408203, "global_step": 552937, "epoch": 6661} {"train_loss": -27.295740127563477, "global_step": 552938, "epoch": 6661} {"train_loss": -27.586929321289062, "global_step": 552939, "epoch": 6661} {"train_loss": -27.46982765197754, "global_step": 552940, "epoch": 6661} {"train_loss": -27.704864501953125, "global_step": 552941, "epoch": 6661} {"train_loss": -27.655603408813477, "global_step": 552942, "epoch": 6661} {"train_loss": -27.8116512298584, "global_step": 552943, "epoch": 6661} {"train_loss": -28.088119506835938, "global_step": 552944, "epoch": 6661} {"train_loss": -27.673989996852644, "global_step": 552945, "epoch": 6661, "val_loss": 6584604.0} {"train_loss": -27.23648452758789, "global_step": 552946, "epoch": 6662} {"train_loss": -26.731403350830078, "global_step": 552947, "epoch": 6662} {"train_loss": -26.706134796142578, "global_step": 552948, "epoch": 6662} {"train_loss": -27.558679580688477, "global_step": 552949, "epoch": 6662} {"train_loss": -27.36075210571289, "global_step": 552950, "epoch": 6662} {"train_loss": -26.970916748046875, "global_step": 552951, "epoch": 6662} {"train_loss": -27.515857696533203, "global_step": 552952, "epoch": 6662} {"train_loss": -27.613910675048828, "global_step": 552953, "epoch": 6662} {"train_loss": -27.246728897094727, "global_step": 552954, "epoch": 6662} {"train_loss": -27.513525009155273, "global_step": 552955, "epoch": 6662} {"train_loss": -27.3428897857666, "global_step": 552956, "epoch": 6662} {"train_loss": -27.77601432800293, "global_step": 552957, "epoch": 6662} {"train_loss": -27.88258171081543, "global_step": 552958, "epoch": 6662} {"train_loss": -27.5838680267334, "global_step": 552959, "epoch": 6662} {"train_loss": -27.75678825378418, "global_step": 552960, "epoch": 6662} {"train_loss": -27.549753189086914, "global_step": 552961, "epoch": 6662} {"train_loss": -27.242755889892578, "global_step": 552962, "epoch": 6662} {"train_loss": -28.15815544128418, "global_step": 552963, "epoch": 6662} {"train_loss": -27.64655113220215, "global_step": 552964, "epoch": 6662} {"train_loss": -27.65728759765625, "global_step": 552965, "epoch": 6662} {"train_loss": -27.800369262695312, "global_step": 552966, "epoch": 6662} {"train_loss": -28.16937255859375, "global_step": 552967, "epoch": 6662} {"train_loss": -27.72432518005371, "global_step": 552968, "epoch": 6662} {"train_loss": -27.848480224609375, "global_step": 552969, "epoch": 6662} {"train_loss": -28.01765251159668, "global_step": 552970, "epoch": 6662} {"train_loss": -27.886014938354492, "global_step": 552971, "epoch": 6662} {"train_loss": -27.868371963500977, "global_step": 552972, "epoch": 6662} {"train_loss": -28.130895614624023, "global_step": 552973, "epoch": 6662} {"train_loss": -27.890125274658203, "global_step": 552974, "epoch": 6662} {"train_loss": -27.953907012939453, "global_step": 552975, "epoch": 6662} {"train_loss": -27.76654052734375, "global_step": 552976, "epoch": 6662} {"train_loss": -27.76969337463379, "global_step": 552977, "epoch": 6662} {"train_loss": -27.718427658081055, "global_step": 552978, "epoch": 6662} {"train_loss": -27.87198257446289, "global_step": 552979, "epoch": 6662} {"train_loss": -27.875518798828125, "global_step": 552980, "epoch": 6662} {"train_loss": -28.090869903564453, "global_step": 552981, "epoch": 6662} {"train_loss": -27.902652740478516, "global_step": 552982, "epoch": 6662} {"train_loss": -27.655609130859375, "global_step": 552983, "epoch": 6662} {"train_loss": -28.015918731689453, "global_step": 552984, "epoch": 6662} {"train_loss": -27.920501708984375, "global_step": 552985, "epoch": 6662} {"train_loss": -28.0147647857666, "global_step": 552986, "epoch": 6662} {"train_loss": -27.697629928588867, "global_step": 552987, "epoch": 6662} {"train_loss": -28.2193546295166, "global_step": 552988, "epoch": 6662} {"train_loss": -27.8886775970459, "global_step": 552989, "epoch": 6662} {"train_loss": -27.7218017578125, "global_step": 552990, "epoch": 6662} {"train_loss": -27.87752342224121, "global_step": 552991, "epoch": 6662} {"train_loss": -28.16292381286621, "global_step": 552992, "epoch": 6662} {"train_loss": -28.341703414916992, "global_step": 552993, "epoch": 6662} {"train_loss": -28.076034545898438, "global_step": 552994, "epoch": 6662} {"train_loss": -27.90403175354004, "global_step": 552995, "epoch": 6662} {"train_loss": -28.21430778503418, "global_step": 552996, "epoch": 6662} {"train_loss": -27.759876251220703, "global_step": 552997, "epoch": 6662} {"train_loss": -27.75166893005371, "global_step": 552998, "epoch": 6662} {"train_loss": -27.761005401611328, "global_step": 552999, "epoch": 6662} {"train_loss": -27.978246688842773, "global_step": 553000, "epoch": 6662} {"train_loss": -28.062097549438477, "global_step": 553001, "epoch": 6662} {"train_loss": -27.629608154296875, "global_step": 553002, "epoch": 6662} {"train_loss": -27.7766170501709, "global_step": 553003, "epoch": 6662} {"train_loss": -27.820758819580078, "global_step": 553004, "epoch": 6662} {"train_loss": -27.8558349609375, "global_step": 553005, "epoch": 6662} {"train_loss": -27.62159538269043, "global_step": 553006, "epoch": 6662} {"train_loss": -27.245716094970703, "global_step": 553007, "epoch": 6662} {"train_loss": -27.912405014038086, "global_step": 553008, "epoch": 6662} {"train_loss": -27.98414421081543, "global_step": 553009, "epoch": 6662} {"train_loss": -27.82404899597168, "global_step": 553010, "epoch": 6662} {"train_loss": -27.9591007232666, "global_step": 553011, "epoch": 6662} {"train_loss": -27.60308837890625, "global_step": 553012, "epoch": 6662} {"train_loss": -27.761383056640625, "global_step": 553013, "epoch": 6662} {"train_loss": -27.698705673217773, "global_step": 553014, "epoch": 6662} {"train_loss": -27.517786026000977, "global_step": 553015, "epoch": 6662} {"train_loss": -27.54534912109375, "global_step": 553016, "epoch": 6662} {"train_loss": -27.40994644165039, "global_step": 553017, "epoch": 6662} {"train_loss": -27.24237060546875, "global_step": 553018, "epoch": 6662} {"train_loss": -27.26806640625, "global_step": 553019, "epoch": 6662} {"train_loss": -27.46721839904785, "global_step": 553020, "epoch": 6662} {"train_loss": -27.638137817382812, "global_step": 553021, "epoch": 6662} {"train_loss": -27.4770565032959, "global_step": 553022, "epoch": 6662} {"train_loss": -27.62925148010254, "global_step": 553023, "epoch": 6662} {"train_loss": -27.97515869140625, "global_step": 553024, "epoch": 6662} {"train_loss": -27.4053897857666, "global_step": 553025, "epoch": 6662} {"train_loss": -27.518789291381836, "global_step": 553026, "epoch": 6662} {"train_loss": -27.833478927612305, "global_step": 553027, "epoch": 6662} {"train_loss": -27.72314499085208, "global_step": 553028, "epoch": 6662, "val_loss": 6742332.0} {"train_loss": -27.061994552612305, "global_step": 553029, "epoch": 6663} {"train_loss": -26.9528751373291, "global_step": 553030, "epoch": 6663} {"train_loss": -27.213720321655273, "global_step": 553031, "epoch": 6663} {"train_loss": -26.67188835144043, "global_step": 553032, "epoch": 6663} {"train_loss": -26.867603302001953, "global_step": 553033, "epoch": 6663} {"train_loss": -27.137861251831055, "global_step": 553034, "epoch": 6663} {"train_loss": -27.243268966674805, "global_step": 553035, "epoch": 6663} {"train_loss": -27.486326217651367, "global_step": 553036, "epoch": 6663} {"train_loss": -27.280750274658203, "global_step": 553037, "epoch": 6663} {"train_loss": -27.552417755126953, "global_step": 553038, "epoch": 6663} {"train_loss": -27.302387237548828, "global_step": 553039, "epoch": 6663} {"train_loss": -27.328351974487305, "global_step": 553040, "epoch": 6663} {"train_loss": -27.320249557495117, "global_step": 553041, "epoch": 6663} {"train_loss": -27.395421981811523, "global_step": 553042, "epoch": 6663} {"train_loss": -27.40087890625, "global_step": 553043, "epoch": 6663} {"train_loss": -27.841760635375977, "global_step": 553044, "epoch": 6663} {"train_loss": -27.04197120666504, "global_step": 553045, "epoch": 6663} {"train_loss": -27.463048934936523, "global_step": 553046, "epoch": 6663} {"train_loss": -27.475934982299805, "global_step": 553047, "epoch": 6663} {"train_loss": -27.708093643188477, "global_step": 553048, "epoch": 6663} {"train_loss": -27.62933921813965, "global_step": 553049, "epoch": 6663} {"train_loss": -27.743488311767578, "global_step": 553050, "epoch": 6663} {"train_loss": -27.819568634033203, "global_step": 553051, "epoch": 6663} {"train_loss": -27.543354034423828, "global_step": 553052, "epoch": 6663} {"train_loss": -27.816574096679688, "global_step": 553053, "epoch": 6663} {"train_loss": -27.669647216796875, "global_step": 553054, "epoch": 6663} {"train_loss": -27.489700317382812, "global_step": 553055, "epoch": 6663} {"train_loss": -27.772306442260742, "global_step": 553056, "epoch": 6663} {"train_loss": -27.4859561920166, "global_step": 553057, "epoch": 6663} {"train_loss": -27.550058364868164, "global_step": 553058, "epoch": 6663} {"train_loss": -27.499454498291016, "global_step": 553059, "epoch": 6663} {"train_loss": -27.97759437561035, "global_step": 553060, "epoch": 6663} {"train_loss": -28.106054306030273, "global_step": 553061, "epoch": 6663} {"train_loss": -27.75437355041504, "global_step": 553062, "epoch": 6663} {"train_loss": -27.710416793823242, "global_step": 553063, "epoch": 6663} {"train_loss": -27.569211959838867, "global_step": 553064, "epoch": 6663} {"train_loss": -27.832265853881836, "global_step": 553065, "epoch": 6663} {"train_loss": -27.769805908203125, "global_step": 553066, "epoch": 6663} {"train_loss": -28.085559844970703, "global_step": 553067, "epoch": 6663} {"train_loss": -27.74130630493164, "global_step": 553068, "epoch": 6663} {"train_loss": -27.67984390258789, "global_step": 553069, "epoch": 6663} {"train_loss": -27.588123321533203, "global_step": 553070, "epoch": 6663} {"train_loss": -27.924808502197266, "global_step": 553071, "epoch": 6663} {"train_loss": -27.580490112304688, "global_step": 553072, "epoch": 6663} {"train_loss": -28.00172233581543, "global_step": 553073, "epoch": 6663} {"train_loss": -27.93292808532715, "global_step": 553074, "epoch": 6663} {"train_loss": -28.023008346557617, "global_step": 553075, "epoch": 6663} {"train_loss": -27.726306915283203, "global_step": 553076, "epoch": 6663} {"train_loss": -27.89350700378418, "global_step": 553077, "epoch": 6663} {"train_loss": -27.88022232055664, "global_step": 553078, "epoch": 6663} {"train_loss": -28.152753829956055, "global_step": 553079, "epoch": 6663} {"train_loss": -28.062702178955078, "global_step": 553080, "epoch": 6663} {"train_loss": -27.985492706298828, "global_step": 553081, "epoch": 6663} {"train_loss": -28.066938400268555, "global_step": 553082, "epoch": 6663} {"train_loss": -28.1654109954834, "global_step": 553083, "epoch": 6663} {"train_loss": -28.384077072143555, "global_step": 553084, "epoch": 6663} {"train_loss": -27.93983268737793, "global_step": 553085, "epoch": 6663} {"train_loss": -28.02899742126465, "global_step": 553086, "epoch": 6663} {"train_loss": -27.73036003112793, "global_step": 553087, "epoch": 6663} {"train_loss": -27.81526756286621, "global_step": 553088, "epoch": 6663} {"train_loss": -26.885923385620117, "global_step": 553089, "epoch": 6663} {"train_loss": -25.237348556518555, "global_step": 553090, "epoch": 6663} {"train_loss": -24.9573917388916, "global_step": 553091, "epoch": 6663} {"train_loss": -25.907791137695312, "global_step": 553092, "epoch": 6663} {"train_loss": -26.393033981323242, "global_step": 553093, "epoch": 6663} {"train_loss": -26.70173454284668, "global_step": 553094, "epoch": 6663} {"train_loss": -27.373437881469727, "global_step": 553095, "epoch": 6663} {"train_loss": -26.466583251953125, "global_step": 553096, "epoch": 6663} {"train_loss": -27.42695426940918, "global_step": 553097, "epoch": 6663} {"train_loss": -26.9366455078125, "global_step": 553098, "epoch": 6663} {"train_loss": -27.22675132751465, "global_step": 553099, "epoch": 6663} {"train_loss": -27.057891845703125, "global_step": 553100, "epoch": 6663} {"train_loss": -27.336706161499023, "global_step": 553101, "epoch": 6663} {"train_loss": -27.08637046813965, "global_step": 553102, "epoch": 6663} {"train_loss": -27.160703659057617, "global_step": 553103, "epoch": 6663} {"train_loss": -27.654998779296875, "global_step": 553104, "epoch": 6663} {"train_loss": -27.50634765625, "global_step": 553105, "epoch": 6663} {"train_loss": -27.18338394165039, "global_step": 553106, "epoch": 6663} {"train_loss": -27.50897789001465, "global_step": 553107, "epoch": 6663} {"train_loss": -27.54897117614746, "global_step": 553108, "epoch": 6663} {"train_loss": -27.2271785736084, "global_step": 553109, "epoch": 6663} {"train_loss": -27.36716079711914, "global_step": 553110, "epoch": 6663} {"train_loss": -27.457889143242895, "global_step": 553111, "epoch": 6663, "val_loss": 6680743.0} {"train_loss": -27.347944259643555, "global_step": 553112, "epoch": 6664} {"train_loss": -27.012197494506836, "global_step": 553113, "epoch": 6664} {"train_loss": -27.243375778198242, "global_step": 553114, "epoch": 6664} {"train_loss": -27.271833419799805, "global_step": 553115, "epoch": 6664} {"train_loss": -27.24287223815918, "global_step": 553116, "epoch": 6664} {"train_loss": -27.744110107421875, "global_step": 553117, "epoch": 6664} {"train_loss": -27.08197593688965, "global_step": 553118, "epoch": 6664} {"train_loss": -27.474822998046875, "global_step": 553119, "epoch": 6664} {"train_loss": -27.6095027923584, "global_step": 553120, "epoch": 6664} {"train_loss": -27.69173240661621, "global_step": 553121, "epoch": 6664} {"train_loss": -27.561609268188477, "global_step": 553122, "epoch": 6664} {"train_loss": -27.53519630432129, "global_step": 553123, "epoch": 6664} {"train_loss": -27.712512969970703, "global_step": 553124, "epoch": 6664} {"train_loss": -27.712100982666016, "global_step": 553125, "epoch": 6664} {"train_loss": -27.78070640563965, "global_step": 553126, "epoch": 6664} {"train_loss": -28.03877067565918, "global_step": 553127, "epoch": 6664} {"train_loss": -27.2689266204834, "global_step": 553128, "epoch": 6664} {"train_loss": -27.491897583007812, "global_step": 553129, "epoch": 6664} {"train_loss": -27.757123947143555, "global_step": 553130, "epoch": 6664} {"train_loss": -27.37055778503418, "global_step": 553131, "epoch": 6664} {"train_loss": -27.888507843017578, "global_step": 553132, "epoch": 6664} {"train_loss": -27.711292266845703, "global_step": 553133, "epoch": 6664} {"train_loss": -27.362323760986328, "global_step": 553134, "epoch": 6664} {"train_loss": -27.94439697265625, "global_step": 553135, "epoch": 6664} {"train_loss": -27.595930099487305, "global_step": 553136, "epoch": 6664} {"train_loss": -27.914783477783203, "global_step": 553137, "epoch": 6664} {"train_loss": -28.044538497924805, "global_step": 553138, "epoch": 6664} {"train_loss": -27.785531997680664, "global_step": 553139, "epoch": 6664} {"train_loss": -27.987287521362305, "global_step": 553140, "epoch": 6664} {"train_loss": -28.0377140045166, "global_step": 553141, "epoch": 6664} {"train_loss": -27.90640640258789, "global_step": 553142, "epoch": 6664} {"train_loss": -27.9288272857666, "global_step": 553143, "epoch": 6664} {"train_loss": -27.946027755737305, "global_step": 553144, "epoch": 6664} {"train_loss": -27.968915939331055, "global_step": 553145, "epoch": 6664} {"train_loss": -27.86636734008789, "global_step": 553146, "epoch": 6664} {"train_loss": -27.574609756469727, "global_step": 553147, "epoch": 6664} {"train_loss": -28.272003173828125, "global_step": 553148, "epoch": 6664} {"train_loss": -28.09345054626465, "global_step": 553149, "epoch": 6664} {"train_loss": -28.123504638671875, "global_step": 553150, "epoch": 6664} {"train_loss": -27.46697425842285, "global_step": 553151, "epoch": 6664} {"train_loss": -27.694263458251953, "global_step": 553152, "epoch": 6664} {"train_loss": -27.919586181640625, "global_step": 553153, "epoch": 6664} {"train_loss": -27.50992202758789, "global_step": 553154, "epoch": 6664} {"train_loss": -28.09332275390625, "global_step": 553155, "epoch": 6664} {"train_loss": -27.649465560913086, "global_step": 553156, "epoch": 6664} {"train_loss": -27.722925186157227, "global_step": 553157, "epoch": 6664} {"train_loss": -27.80854606628418, "global_step": 553158, "epoch": 6664} {"train_loss": -27.675870895385742, "global_step": 553159, "epoch": 6664} {"train_loss": -28.102161407470703, "global_step": 553160, "epoch": 6664} {"train_loss": -27.607126235961914, "global_step": 553161, "epoch": 6664} {"train_loss": -27.836523056030273, "global_step": 553162, "epoch": 6664} {"train_loss": -27.47528648376465, "global_step": 553163, "epoch": 6664} {"train_loss": -27.23225212097168, "global_step": 553164, "epoch": 6664} {"train_loss": -27.617633819580078, "global_step": 553165, "epoch": 6664} {"train_loss": -27.514923095703125, "global_step": 553166, "epoch": 6664} {"train_loss": -27.818073272705078, "global_step": 553167, "epoch": 6664} {"train_loss": -27.51641845703125, "global_step": 553168, "epoch": 6664} {"train_loss": -27.564380645751953, "global_step": 553169, "epoch": 6664} {"train_loss": -27.78389549255371, "global_step": 553170, "epoch": 6664} {"train_loss": -27.594934463500977, "global_step": 553171, "epoch": 6664} {"train_loss": -27.341718673706055, "global_step": 553172, "epoch": 6664} {"train_loss": -28.146799087524414, "global_step": 553173, "epoch": 6664} {"train_loss": -27.693115234375, "global_step": 553174, "epoch": 6664} {"train_loss": -28.0349063873291, "global_step": 553175, "epoch": 6664} {"train_loss": -27.77760887145996, "global_step": 553176, "epoch": 6664} {"train_loss": -27.514022827148438, "global_step": 553177, "epoch": 6664} {"train_loss": -27.746082305908203, "global_step": 553178, "epoch": 6664} {"train_loss": -28.073062896728516, "global_step": 553179, "epoch": 6664} {"train_loss": -27.59375, "global_step": 553180, "epoch": 6664} {"train_loss": -27.811803817749023, "global_step": 553181, "epoch": 6664} {"train_loss": -28.04022216796875, "global_step": 553182, "epoch": 6664} {"train_loss": -27.70361328125, "global_step": 553183, "epoch": 6664} {"train_loss": -27.78754997253418, "global_step": 553184, "epoch": 6664} {"train_loss": -27.639673233032227, "global_step": 553185, "epoch": 6664} {"train_loss": -27.981237411499023, "global_step": 553186, "epoch": 6664} {"train_loss": -27.693639755249023, "global_step": 553187, "epoch": 6664} {"train_loss": -27.578399658203125, "global_step": 553188, "epoch": 6664} {"train_loss": -27.382431030273438, "global_step": 553189, "epoch": 6664} {"train_loss": -27.178564071655273, "global_step": 553190, "epoch": 6664} {"train_loss": -27.225080490112305, "global_step": 553191, "epoch": 6664} {"train_loss": -27.07196617126465, "global_step": 553192, "epoch": 6664} {"train_loss": -27.520145416259766, "global_step": 553193, "epoch": 6664} {"train_loss": -27.688271694872753, "global_step": 553194, "epoch": 6664, "val_loss": 6669152.5} {"train_loss": -27.03346061706543, "global_step": 553195, "epoch": 6665} {"train_loss": -26.626508712768555, "global_step": 553196, "epoch": 6665} {"train_loss": -26.695669174194336, "global_step": 553197, "epoch": 6665} {"train_loss": -26.688278198242188, "global_step": 553198, "epoch": 6665} {"train_loss": -27.12653923034668, "global_step": 553199, "epoch": 6665} {"train_loss": -27.126129150390625, "global_step": 553200, "epoch": 6665} {"train_loss": -27.0896053314209, "global_step": 553201, "epoch": 6665} {"train_loss": -26.934995651245117, "global_step": 553202, "epoch": 6665} {"train_loss": -27.55694580078125, "global_step": 553203, "epoch": 6665} {"train_loss": -26.797067642211914, "global_step": 553204, "epoch": 6665} {"train_loss": -26.730072021484375, "global_step": 553205, "epoch": 6665} {"train_loss": -27.46213722229004, "global_step": 553206, "epoch": 6665} {"train_loss": -27.896503448486328, "global_step": 553207, "epoch": 6665} {"train_loss": -27.57293128967285, "global_step": 553208, "epoch": 6665} {"train_loss": -27.405324935913086, "global_step": 553209, "epoch": 6665} {"train_loss": -27.287927627563477, "global_step": 553210, "epoch": 6665} {"train_loss": -27.418624877929688, "global_step": 553211, "epoch": 6665} {"train_loss": -27.449634552001953, "global_step": 553212, "epoch": 6665} {"train_loss": -27.440582275390625, "global_step": 553213, "epoch": 6665} {"train_loss": -27.729337692260742, "global_step": 553214, "epoch": 6665} {"train_loss": -27.749731063842773, "global_step": 553215, "epoch": 6665} {"train_loss": -27.807880401611328, "global_step": 553216, "epoch": 6665} {"train_loss": -27.604419708251953, "global_step": 553217, "epoch": 6665} {"train_loss": -27.678022384643555, "global_step": 553218, "epoch": 6665} {"train_loss": -27.652135848999023, "global_step": 553219, "epoch": 6665} {"train_loss": -27.4849910736084, "global_step": 553220, "epoch": 6665} {"train_loss": -27.652597427368164, "global_step": 553221, "epoch": 6665} {"train_loss": -27.7695255279541, "global_step": 553222, "epoch": 6665} {"train_loss": -27.860742568969727, "global_step": 553223, "epoch": 6665} {"train_loss": -27.783527374267578, "global_step": 553224, "epoch": 6665} {"train_loss": -27.533842086791992, "global_step": 553225, "epoch": 6665} {"train_loss": -27.94001579284668, "global_step": 553226, "epoch": 6665} {"train_loss": -27.47486686706543, "global_step": 553227, "epoch": 6665} {"train_loss": -28.069250106811523, "global_step": 553228, "epoch": 6665} {"train_loss": -27.49837303161621, "global_step": 553229, "epoch": 6665} {"train_loss": -27.983911514282227, "global_step": 553230, "epoch": 6665} {"train_loss": -27.446075439453125, "global_step": 553231, "epoch": 6665} {"train_loss": -27.885589599609375, "global_step": 553232, "epoch": 6665} {"train_loss": -27.572721481323242, "global_step": 553233, "epoch": 6665} {"train_loss": -27.733306884765625, "global_step": 553234, "epoch": 6665} {"train_loss": -27.77851676940918, "global_step": 553235, "epoch": 6665} {"train_loss": -27.380456924438477, "global_step": 553236, "epoch": 6665} {"train_loss": -27.8080997467041, "global_step": 553237, "epoch": 6665} {"train_loss": -27.87529945373535, "global_step": 553238, "epoch": 6665} {"train_loss": -27.76838493347168, "global_step": 553239, "epoch": 6665} {"train_loss": -27.957965850830078, "global_step": 553240, "epoch": 6665} {"train_loss": -27.887231826782227, "global_step": 553241, "epoch": 6665} {"train_loss": -27.734344482421875, "global_step": 553242, "epoch": 6665} {"train_loss": -27.7636661529541, "global_step": 553243, "epoch": 6665} {"train_loss": -27.61749267578125, "global_step": 553244, "epoch": 6665} {"train_loss": -27.31884765625, "global_step": 553245, "epoch": 6665} {"train_loss": -27.625274658203125, "global_step": 553246, "epoch": 6665} {"train_loss": -27.32000160217285, "global_step": 553247, "epoch": 6665} {"train_loss": -27.619140625, "global_step": 553248, "epoch": 6665} {"train_loss": -27.85145378112793, "global_step": 553249, "epoch": 6665} {"train_loss": -27.373157501220703, "global_step": 553250, "epoch": 6665} {"train_loss": -27.694049835205078, "global_step": 553251, "epoch": 6665} {"train_loss": -27.52199363708496, "global_step": 553252, "epoch": 6665} {"train_loss": -27.743011474609375, "global_step": 553253, "epoch": 6665} {"train_loss": -27.570087432861328, "global_step": 553254, "epoch": 6665} {"train_loss": -27.356674194335938, "global_step": 553255, "epoch": 6665} {"train_loss": -27.91657829284668, "global_step": 553256, "epoch": 6665} {"train_loss": -28.05116081237793, "global_step": 553257, "epoch": 6665} {"train_loss": -27.475549697875977, "global_step": 553258, "epoch": 6665} {"train_loss": -27.7271728515625, "global_step": 553259, "epoch": 6665} {"train_loss": -27.5377140045166, "global_step": 553260, "epoch": 6665} {"train_loss": -27.869565963745117, "global_step": 553261, "epoch": 6665} {"train_loss": -27.48187828063965, "global_step": 553262, "epoch": 6665} {"train_loss": -27.617414474487305, "global_step": 553263, "epoch": 6665} {"train_loss": -27.417646408081055, "global_step": 553264, "epoch": 6665} {"train_loss": -27.75892448425293, "global_step": 553265, "epoch": 6665} {"train_loss": -27.65643310546875, "global_step": 553266, "epoch": 6665} {"train_loss": -27.73947525024414, "global_step": 553267, "epoch": 6665} {"train_loss": -27.41015625, "global_step": 553268, "epoch": 6665} {"train_loss": -27.5324764251709, "global_step": 553269, "epoch": 6665} {"train_loss": -27.928375244140625, "global_step": 553270, "epoch": 6665} {"train_loss": -27.424901962280273, "global_step": 553271, "epoch": 6665} {"train_loss": -27.497882843017578, "global_step": 553272, "epoch": 6665} {"train_loss": -26.936079025268555, "global_step": 553273, "epoch": 6665} {"train_loss": -27.07245445251465, "global_step": 553274, "epoch": 6665} {"train_loss": -27.7439022064209, "global_step": 553275, "epoch": 6665} {"train_loss": -27.910572052001953, "global_step": 553276, "epoch": 6665} {"train_loss": -27.541555335722773, "global_step": 553277, "epoch": 6665, "val_loss": 6660270.0} {"train_loss": -27.67822265625, "global_step": 553278, "epoch": 6666} {"train_loss": -27.428878784179688, "global_step": 553279, "epoch": 6666} {"train_loss": -27.333181381225586, "global_step": 553280, "epoch": 6666} {"train_loss": -27.16777992248535, "global_step": 553281, "epoch": 6666} {"train_loss": -26.91280174255371, "global_step": 553282, "epoch": 6666} {"train_loss": -27.72408103942871, "global_step": 553283, "epoch": 6666} {"train_loss": -27.07625389099121, "global_step": 553284, "epoch": 6666} {"train_loss": -27.230005264282227, "global_step": 553285, "epoch": 6666} {"train_loss": -27.00233268737793, "global_step": 553286, "epoch": 6666} {"train_loss": -26.7197265625, "global_step": 553287, "epoch": 6666} {"train_loss": -27.279897689819336, "global_step": 553288, "epoch": 6666} {"train_loss": -27.052997589111328, "global_step": 553289, "epoch": 6666} {"train_loss": -27.09486198425293, "global_step": 553290, "epoch": 6666} {"train_loss": -27.557586669921875, "global_step": 553291, "epoch": 6666} {"train_loss": -27.40665054321289, "global_step": 553292, "epoch": 6666} {"train_loss": -27.64763832092285, "global_step": 553293, "epoch": 6666} {"train_loss": -27.271625518798828, "global_step": 553294, "epoch": 6666} {"train_loss": -27.718677520751953, "global_step": 553295, "epoch": 6666} {"train_loss": -27.304229736328125, "global_step": 553296, "epoch": 6666} {"train_loss": -27.56072425842285, "global_step": 553297, "epoch": 6666} {"train_loss": -27.20486831665039, "global_step": 553298, "epoch": 6666} {"train_loss": -27.7578125, "global_step": 553299, "epoch": 6666} {"train_loss": -27.425596237182617, "global_step": 553300, "epoch": 6666} {"train_loss": -27.822622299194336, "global_step": 553301, "epoch": 6666} {"train_loss": -27.52665138244629, "global_step": 553302, "epoch": 6666} {"train_loss": -27.552295684814453, "global_step": 553303, "epoch": 6666} {"train_loss": -27.728580474853516, "global_step": 553304, "epoch": 6666} {"train_loss": -27.539987564086914, "global_step": 553305, "epoch": 6666} {"train_loss": -27.593896865844727, "global_step": 553306, "epoch": 6666} {"train_loss": -27.65435791015625, "global_step": 553307, "epoch": 6666} {"train_loss": -27.59195899963379, "global_step": 553308, "epoch": 6666} {"train_loss": -27.553693771362305, "global_step": 553309, "epoch": 6666} {"train_loss": -27.653467178344727, "global_step": 553310, "epoch": 6666} {"train_loss": -27.440906524658203, "global_step": 553311, "epoch": 6666} {"train_loss": -27.459020614624023, "global_step": 553312, "epoch": 6666} {"train_loss": -27.697607040405273, "global_step": 553313, "epoch": 6666} {"train_loss": -27.773727416992188, "global_step": 553314, "epoch": 6666} {"train_loss": -27.6782283782959, "global_step": 553315, "epoch": 6666} {"train_loss": -27.414779663085938, "global_step": 553316, "epoch": 6666} {"train_loss": -27.68499183654785, "global_step": 553317, "epoch": 6666} {"train_loss": -27.579004287719727, "global_step": 553318, "epoch": 6666} {"train_loss": -27.579252243041992, "global_step": 553319, "epoch": 6666} {"train_loss": -28.073163986206055, "global_step": 553320, "epoch": 6666} {"train_loss": -27.82874870300293, "global_step": 553321, "epoch": 6666} {"train_loss": -27.72809410095215, "global_step": 553322, "epoch": 6666} {"train_loss": -27.66337013244629, "global_step": 553323, "epoch": 6666} {"train_loss": -27.82895278930664, "global_step": 553324, "epoch": 6666} {"train_loss": -28.174406051635742, "global_step": 553325, "epoch": 6666} {"train_loss": -27.773468017578125, "global_step": 553326, "epoch": 6666} {"train_loss": -27.774824142456055, "global_step": 553327, "epoch": 6666} {"train_loss": -27.776153564453125, "global_step": 553328, "epoch": 6666} {"train_loss": -27.446081161499023, "global_step": 553329, "epoch": 6666} {"train_loss": -27.85120964050293, "global_step": 553330, "epoch": 6666} {"train_loss": -27.99041748046875, "global_step": 553331, "epoch": 6666} {"train_loss": -27.741785049438477, "global_step": 553332, "epoch": 6666} {"train_loss": -27.926923751831055, "global_step": 553333, "epoch": 6666} {"train_loss": -27.773380279541016, "global_step": 553334, "epoch": 6666} {"train_loss": -27.45631217956543, "global_step": 553335, "epoch": 6666} {"train_loss": -27.808664321899414, "global_step": 553336, "epoch": 6666} {"train_loss": -28.00027847290039, "global_step": 553337, "epoch": 6666} {"train_loss": -27.571456909179688, "global_step": 553338, "epoch": 6666} {"train_loss": -27.80756950378418, "global_step": 553339, "epoch": 6666} {"train_loss": -27.698673248291016, "global_step": 553340, "epoch": 6666} {"train_loss": -27.37750244140625, "global_step": 553341, "epoch": 6666} {"train_loss": -27.825550079345703, "global_step": 553342, "epoch": 6666} {"train_loss": -27.44611167907715, "global_step": 553343, "epoch": 6666} {"train_loss": -27.27487564086914, "global_step": 553344, "epoch": 6666} {"train_loss": -27.40753173828125, "global_step": 553345, "epoch": 6666} {"train_loss": -27.899612426757812, "global_step": 553346, "epoch": 6666} {"train_loss": -27.300769805908203, "global_step": 553347, "epoch": 6666} {"train_loss": -27.337661743164062, "global_step": 553348, "epoch": 6666} {"train_loss": -27.6149959564209, "global_step": 553349, "epoch": 6666} {"train_loss": -27.407764434814453, "global_step": 553350, "epoch": 6666} {"train_loss": -27.927932739257812, "global_step": 553351, "epoch": 6666} {"train_loss": -27.56715202331543, "global_step": 553352, "epoch": 6666} {"train_loss": -27.531539916992188, "global_step": 553353, "epoch": 6666} {"train_loss": -27.402515411376953, "global_step": 553354, "epoch": 6666} {"train_loss": -27.809396743774414, "global_step": 553355, "epoch": 6666} {"train_loss": -27.54375648498535, "global_step": 553356, "epoch": 6666} {"train_loss": -28.202116012573242, "global_step": 553357, "epoch": 6666} {"train_loss": -27.558218002319336, "global_step": 553358, "epoch": 6666} {"train_loss": -27.66749382019043, "global_step": 553359, "epoch": 6666} {"train_loss": -27.584268317165144, "global_step": 553360, "epoch": 6666, "val_loss": 6572795.0} {"train_loss": -26.311725616455078, "global_step": 553361, "epoch": 6667} {"train_loss": -26.593902587890625, "global_step": 553362, "epoch": 6667} {"train_loss": -27.054906845092773, "global_step": 553363, "epoch": 6667} {"train_loss": -26.760339736938477, "global_step": 553364, "epoch": 6667} {"train_loss": -26.46352195739746, "global_step": 553365, "epoch": 6667} {"train_loss": -26.695636749267578, "global_step": 553366, "epoch": 6667} {"train_loss": -27.228134155273438, "global_step": 553367, "epoch": 6667} {"train_loss": -26.947019577026367, "global_step": 553368, "epoch": 6667} {"train_loss": -27.38738441467285, "global_step": 553369, "epoch": 6667} {"train_loss": -27.051803588867188, "global_step": 553370, "epoch": 6667} {"train_loss": -26.687580108642578, "global_step": 553371, "epoch": 6667} {"train_loss": -26.923959732055664, "global_step": 553372, "epoch": 6667} {"train_loss": -27.318470001220703, "global_step": 553373, "epoch": 6667} {"train_loss": -26.7123966217041, "global_step": 553374, "epoch": 6667} {"train_loss": -27.30254554748535, "global_step": 553375, "epoch": 6667} {"train_loss": -27.22712516784668, "global_step": 553376, "epoch": 6667} {"train_loss": -27.484777450561523, "global_step": 553377, "epoch": 6667} {"train_loss": -27.1105899810791, "global_step": 553378, "epoch": 6667} {"train_loss": -27.707477569580078, "global_step": 553379, "epoch": 6667} {"train_loss": -27.484289169311523, "global_step": 553380, "epoch": 6667} {"train_loss": -27.12251091003418, "global_step": 553381, "epoch": 6667} {"train_loss": -27.579374313354492, "global_step": 553382, "epoch": 6667} {"train_loss": -27.522281646728516, "global_step": 553383, "epoch": 6667} {"train_loss": -27.65534782409668, "global_step": 553384, "epoch": 6667} {"train_loss": -27.261865615844727, "global_step": 553385, "epoch": 6667} {"train_loss": -27.62196159362793, "global_step": 553386, "epoch": 6667} {"train_loss": -27.261615753173828, "global_step": 553387, "epoch": 6667} {"train_loss": -27.638315200805664, "global_step": 553388, "epoch": 6667} {"train_loss": -27.093610763549805, "global_step": 553389, "epoch": 6667} {"train_loss": -27.230030059814453, "global_step": 553390, "epoch": 6667} {"train_loss": -27.456083297729492, "global_step": 553391, "epoch": 6667} {"train_loss": -27.809036254882812, "global_step": 553392, "epoch": 6667} {"train_loss": -27.672163009643555, "global_step": 553393, "epoch": 6667} {"train_loss": -28.11134147644043, "global_step": 553394, "epoch": 6667} {"train_loss": -27.723196029663086, "global_step": 553395, "epoch": 6667} {"train_loss": -27.63776206970215, "global_step": 553396, "epoch": 6667} {"train_loss": -27.622812271118164, "global_step": 553397, "epoch": 6667} {"train_loss": -27.558374404907227, "global_step": 553398, "epoch": 6667} {"train_loss": -27.833057403564453, "global_step": 553399, "epoch": 6667} {"train_loss": -27.67872428894043, "global_step": 553400, "epoch": 6667} {"train_loss": -27.920886993408203, "global_step": 553401, "epoch": 6667} {"train_loss": -27.748159408569336, "global_step": 553402, "epoch": 6667} {"train_loss": -27.959304809570312, "global_step": 553403, "epoch": 6667} {"train_loss": -27.649341583251953, "global_step": 553404, "epoch": 6667} {"train_loss": -27.35687828063965, "global_step": 553405, "epoch": 6667} {"train_loss": -27.900842666625977, "global_step": 553406, "epoch": 6667} {"train_loss": -27.795682907104492, "global_step": 553407, "epoch": 6667} {"train_loss": -27.725671768188477, "global_step": 553408, "epoch": 6667} {"train_loss": -28.042469024658203, "global_step": 553409, "epoch": 6667} {"train_loss": -27.915876388549805, "global_step": 553410, "epoch": 6667} {"train_loss": -27.631610870361328, "global_step": 553411, "epoch": 6667} {"train_loss": -28.035009384155273, "global_step": 553412, "epoch": 6667} {"train_loss": -28.076215744018555, "global_step": 553413, "epoch": 6667} {"train_loss": -27.811771392822266, "global_step": 553414, "epoch": 6667} {"train_loss": -27.915515899658203, "global_step": 553415, "epoch": 6667} {"train_loss": -28.040130615234375, "global_step": 553416, "epoch": 6667} {"train_loss": -28.088672637939453, "global_step": 553417, "epoch": 6667} {"train_loss": -27.845678329467773, "global_step": 553418, "epoch": 6667} {"train_loss": -28.203876495361328, "global_step": 553419, "epoch": 6667} {"train_loss": -27.826200485229492, "global_step": 553420, "epoch": 6667} {"train_loss": -27.83713722229004, "global_step": 553421, "epoch": 6667} {"train_loss": -28.207910537719727, "global_step": 553422, "epoch": 6667} {"train_loss": -27.826353073120117, "global_step": 553423, "epoch": 6667} {"train_loss": -27.91790771484375, "global_step": 553424, "epoch": 6667} {"train_loss": -28.004215240478516, "global_step": 553425, "epoch": 6667} {"train_loss": -27.492361068725586, "global_step": 553426, "epoch": 6667} {"train_loss": -27.521442413330078, "global_step": 553427, "epoch": 6667} {"train_loss": -27.665634155273438, "global_step": 553428, "epoch": 6667} {"train_loss": -28.057239532470703, "global_step": 553429, "epoch": 6667} {"train_loss": -27.47977066040039, "global_step": 553430, "epoch": 6667} {"train_loss": -27.625646591186523, "global_step": 553431, "epoch": 6667} {"train_loss": -28.0692195892334, "global_step": 553432, "epoch": 6667} {"train_loss": -27.9169864654541, "global_step": 553433, "epoch": 6667} {"train_loss": -27.7288818359375, "global_step": 553434, "epoch": 6667} {"train_loss": -27.656940460205078, "global_step": 553435, "epoch": 6667} {"train_loss": -28.026941299438477, "global_step": 553436, "epoch": 6667} {"train_loss": -28.030975341796875, "global_step": 553437, "epoch": 6667} {"train_loss": -27.899641036987305, "global_step": 553438, "epoch": 6667} {"train_loss": -28.155431747436523, "global_step": 553439, "epoch": 6667} {"train_loss": -27.95804786682129, "global_step": 553440, "epoch": 6667} {"train_loss": -27.994068145751953, "global_step": 553441, "epoch": 6667} {"train_loss": -27.550260543823242, "global_step": 553442, "epoch": 6667} {"train_loss": -27.577190123408673, "global_step": 553443, "epoch": 6667, "val_loss": 6613209.0} {"train_loss": -27.05340576171875, "global_step": 553444, "epoch": 6668} {"train_loss": -26.932859420776367, "global_step": 553445, "epoch": 6668} {"train_loss": -27.339643478393555, "global_step": 553446, "epoch": 6668} {"train_loss": -26.852237701416016, "global_step": 553447, "epoch": 6668} {"train_loss": -27.117589950561523, "global_step": 553448, "epoch": 6668} {"train_loss": -26.890182495117188, "global_step": 553449, "epoch": 6668} {"train_loss": -27.31369400024414, "global_step": 553450, "epoch": 6668} {"train_loss": -26.95269775390625, "global_step": 553451, "epoch": 6668} {"train_loss": -27.23713493347168, "global_step": 553452, "epoch": 6668} {"train_loss": -26.80243492126465, "global_step": 553453, "epoch": 6668} {"train_loss": -26.810190200805664, "global_step": 553454, "epoch": 6668} {"train_loss": -27.05372428894043, "global_step": 553455, "epoch": 6668} {"train_loss": -27.46575355529785, "global_step": 553456, "epoch": 6668} {"train_loss": -27.177499771118164, "global_step": 553457, "epoch": 6668} {"train_loss": -27.60614013671875, "global_step": 553458, "epoch": 6668} {"train_loss": -26.597257614135742, "global_step": 553459, "epoch": 6668} {"train_loss": -27.175220489501953, "global_step": 553460, "epoch": 6668} {"train_loss": -27.683277130126953, "global_step": 553461, "epoch": 6668} {"train_loss": -27.496625900268555, "global_step": 553462, "epoch": 6668} {"train_loss": -27.325010299682617, "global_step": 553463, "epoch": 6668} {"train_loss": -27.537317276000977, "global_step": 553464, "epoch": 6668} {"train_loss": -27.44325828552246, "global_step": 553465, "epoch": 6668} {"train_loss": -27.689102172851562, "global_step": 553466, "epoch": 6668} {"train_loss": -27.707305908203125, "global_step": 553467, "epoch": 6668} {"train_loss": -27.28241539001465, "global_step": 553468, "epoch": 6668} {"train_loss": -27.156936645507812, "global_step": 553469, "epoch": 6668} {"train_loss": -27.88563346862793, "global_step": 553470, "epoch": 6668} {"train_loss": -27.438024520874023, "global_step": 553471, "epoch": 6668} {"train_loss": -27.868789672851562, "global_step": 553472, "epoch": 6668} {"train_loss": -27.612878799438477, "global_step": 553473, "epoch": 6668} {"train_loss": -27.4705810546875, "global_step": 553474, "epoch": 6668} {"train_loss": -27.593061447143555, "global_step": 553475, "epoch": 6668} {"train_loss": -27.50412368774414, "global_step": 553476, "epoch": 6668} {"train_loss": -27.91657829284668, "global_step": 553477, "epoch": 6668} {"train_loss": -27.62994384765625, "global_step": 553478, "epoch": 6668} {"train_loss": -28.238126754760742, "global_step": 553479, "epoch": 6668} {"train_loss": -27.7825870513916, "global_step": 553480, "epoch": 6668} {"train_loss": -27.66510009765625, "global_step": 553481, "epoch": 6668} {"train_loss": -27.31516456604004, "global_step": 553482, "epoch": 6668} {"train_loss": -27.570560455322266, "global_step": 553483, "epoch": 6668} {"train_loss": -27.641193389892578, "global_step": 553484, "epoch": 6668} {"train_loss": -27.478925704956055, "global_step": 553485, "epoch": 6668} {"train_loss": -27.69753074645996, "global_step": 553486, "epoch": 6668} {"train_loss": -27.984912872314453, "global_step": 553487, "epoch": 6668} {"train_loss": -28.043609619140625, "global_step": 553488, "epoch": 6668} {"train_loss": -27.732160568237305, "global_step": 553489, "epoch": 6668} {"train_loss": -28.178268432617188, "global_step": 553490, "epoch": 6668} {"train_loss": -27.64348793029785, "global_step": 553491, "epoch": 6668} {"train_loss": -27.249393463134766, "global_step": 553492, "epoch": 6668} {"train_loss": -27.8457088470459, "global_step": 553493, "epoch": 6668} {"train_loss": -27.318212509155273, "global_step": 553494, "epoch": 6668} {"train_loss": -27.752038955688477, "global_step": 553495, "epoch": 6668} {"train_loss": -27.73160743713379, "global_step": 553496, "epoch": 6668} {"train_loss": -27.580549240112305, "global_step": 553497, "epoch": 6668} {"train_loss": -28.0085506439209, "global_step": 553498, "epoch": 6668} {"train_loss": -27.71369743347168, "global_step": 553499, "epoch": 6668} {"train_loss": -28.09549331665039, "global_step": 553500, "epoch": 6668} {"train_loss": -27.40714454650879, "global_step": 553501, "epoch": 6668} {"train_loss": -27.74703025817871, "global_step": 553502, "epoch": 6668} {"train_loss": -27.84246253967285, "global_step": 553503, "epoch": 6668} {"train_loss": -27.813322067260742, "global_step": 553504, "epoch": 6668} {"train_loss": -27.915958404541016, "global_step": 553505, "epoch": 6668} {"train_loss": -27.92766761779785, "global_step": 553506, "epoch": 6668} {"train_loss": -27.905582427978516, "global_step": 553507, "epoch": 6668} {"train_loss": -27.908878326416016, "global_step": 553508, "epoch": 6668} {"train_loss": -27.938425064086914, "global_step": 553509, "epoch": 6668} {"train_loss": -27.921295166015625, "global_step": 553510, "epoch": 6668} {"train_loss": -27.974760055541992, "global_step": 553511, "epoch": 6668} {"train_loss": -28.027952194213867, "global_step": 553512, "epoch": 6668} {"train_loss": -27.793243408203125, "global_step": 553513, "epoch": 6668} {"train_loss": -27.855554580688477, "global_step": 553514, "epoch": 6668} {"train_loss": -27.613311767578125, "global_step": 553515, "epoch": 6668} {"train_loss": -27.668176651000977, "global_step": 553516, "epoch": 6668} {"train_loss": -28.00417137145996, "global_step": 553517, "epoch": 6668} {"train_loss": -28.07313346862793, "global_step": 553518, "epoch": 6668} {"train_loss": -27.920312881469727, "global_step": 553519, "epoch": 6668} {"train_loss": -27.917966842651367, "global_step": 553520, "epoch": 6668} {"train_loss": -27.7390079498291, "global_step": 553521, "epoch": 6668} {"train_loss": -27.740285873413086, "global_step": 553522, "epoch": 6668} {"train_loss": -27.732248306274414, "global_step": 553523, "epoch": 6668} {"train_loss": -27.93336296081543, "global_step": 553524, "epoch": 6668} {"train_loss": -27.674406051635742, "global_step": 553525, "epoch": 6668} {"train_loss": -27.58431338114911, "global_step": 553526, "epoch": 6668, "val_loss": 6633388.5} {"train_loss": -27.1706485748291, "global_step": 553527, "epoch": 6669} {"train_loss": -27.277814865112305, "global_step": 553528, "epoch": 6669} {"train_loss": -28.031278610229492, "global_step": 553529, "epoch": 6669} {"train_loss": -27.159439086914062, "global_step": 553530, "epoch": 6669} {"train_loss": -27.104360580444336, "global_step": 553531, "epoch": 6669} {"train_loss": -27.385541915893555, "global_step": 553532, "epoch": 6669} {"train_loss": -27.16456413269043, "global_step": 553533, "epoch": 6669} {"train_loss": -27.266223907470703, "global_step": 553534, "epoch": 6669} {"train_loss": -27.49036979675293, "global_step": 553535, "epoch": 6669} {"train_loss": -27.43242835998535, "global_step": 553536, "epoch": 6669} {"train_loss": -27.723920822143555, "global_step": 553537, "epoch": 6669} {"train_loss": -27.289037704467773, "global_step": 553538, "epoch": 6669} {"train_loss": -27.176008224487305, "global_step": 553539, "epoch": 6669} {"train_loss": -27.82257080078125, "global_step": 553540, "epoch": 6669} {"train_loss": -27.687307357788086, "global_step": 553541, "epoch": 6669} {"train_loss": -27.664688110351562, "global_step": 553542, "epoch": 6669} {"train_loss": -27.831470489501953, "global_step": 553543, "epoch": 6669} {"train_loss": -27.81159019470215, "global_step": 553544, "epoch": 6669} {"train_loss": -27.678991317749023, "global_step": 553545, "epoch": 6669} {"train_loss": -27.772382736206055, "global_step": 553546, "epoch": 6669} {"train_loss": -27.45026969909668, "global_step": 553547, "epoch": 6669} {"train_loss": -27.686914443969727, "global_step": 553548, "epoch": 6669} {"train_loss": -27.694808959960938, "global_step": 553549, "epoch": 6669} {"train_loss": -27.680124282836914, "global_step": 553550, "epoch": 6669} {"train_loss": -27.536340713500977, "global_step": 553551, "epoch": 6669} {"train_loss": -27.41651725769043, "global_step": 553552, "epoch": 6669} {"train_loss": -27.347156524658203, "global_step": 553553, "epoch": 6669} {"train_loss": -27.730199813842773, "global_step": 553554, "epoch": 6669} {"train_loss": -28.05378532409668, "global_step": 553555, "epoch": 6669} {"train_loss": -27.387170791625977, "global_step": 553556, "epoch": 6669} {"train_loss": -27.85468101501465, "global_step": 553557, "epoch": 6669} {"train_loss": -27.58211326599121, "global_step": 553558, "epoch": 6669} {"train_loss": -27.3039493560791, "global_step": 553559, "epoch": 6669} {"train_loss": -27.88825035095215, "global_step": 553560, "epoch": 6669} {"train_loss": -27.89179801940918, "global_step": 553561, "epoch": 6669} {"train_loss": -27.74640464782715, "global_step": 553562, "epoch": 6669} {"train_loss": -27.987058639526367, "global_step": 553563, "epoch": 6669} {"train_loss": -27.55182456970215, "global_step": 553564, "epoch": 6669} {"train_loss": -27.909717559814453, "global_step": 553565, "epoch": 6669} {"train_loss": -27.69129753112793, "global_step": 553566, "epoch": 6669} {"train_loss": -28.000463485717773, "global_step": 553567, "epoch": 6669} {"train_loss": -27.786252975463867, "global_step": 553568, "epoch": 6669} {"train_loss": -27.876977920532227, "global_step": 553569, "epoch": 6669} {"train_loss": -27.540258407592773, "global_step": 553570, "epoch": 6669} {"train_loss": -27.22611427307129, "global_step": 553571, "epoch": 6669} {"train_loss": -27.39238929748535, "global_step": 553572, "epoch": 6669} {"train_loss": -28.091156005859375, "global_step": 553573, "epoch": 6669} {"train_loss": -27.597753524780273, "global_step": 553574, "epoch": 6669} {"train_loss": -27.741735458374023, "global_step": 553575, "epoch": 6669} {"train_loss": -27.7603759765625, "global_step": 553576, "epoch": 6669} {"train_loss": -28.092742919921875, "global_step": 553577, "epoch": 6669} {"train_loss": -27.6634464263916, "global_step": 553578, "epoch": 6669} {"train_loss": -27.7030029296875, "global_step": 553579, "epoch": 6669} {"train_loss": -27.82881736755371, "global_step": 553580, "epoch": 6669} {"train_loss": -27.741352081298828, "global_step": 553581, "epoch": 6669} {"train_loss": -27.679004669189453, "global_step": 553582, "epoch": 6669} {"train_loss": -27.83608055114746, "global_step": 553583, "epoch": 6669} {"train_loss": -27.4407958984375, "global_step": 553584, "epoch": 6669} {"train_loss": -27.451135635375977, "global_step": 553585, "epoch": 6669} {"train_loss": -27.733142852783203, "global_step": 553586, "epoch": 6669} {"train_loss": -27.63399314880371, "global_step": 553587, "epoch": 6669} {"train_loss": -27.807621002197266, "global_step": 553588, "epoch": 6669} {"train_loss": -27.76612663269043, "global_step": 553589, "epoch": 6669} {"train_loss": -27.729883193969727, "global_step": 553590, "epoch": 6669} {"train_loss": -27.541793823242188, "global_step": 553591, "epoch": 6669} {"train_loss": -28.05824851989746, "global_step": 553592, "epoch": 6669} {"train_loss": -27.635013580322266, "global_step": 553593, "epoch": 6669} {"train_loss": -27.799884796142578, "global_step": 553594, "epoch": 6669} {"train_loss": -27.554290771484375, "global_step": 553595, "epoch": 6669} {"train_loss": -27.5495662689209, "global_step": 553596, "epoch": 6669} {"train_loss": -27.405309677124023, "global_step": 553597, "epoch": 6669} {"train_loss": -27.288562774658203, "global_step": 553598, "epoch": 6669} {"train_loss": -27.687009811401367, "global_step": 553599, "epoch": 6669} {"train_loss": -27.451440811157227, "global_step": 553600, "epoch": 6669} {"train_loss": -27.71233558654785, "global_step": 553601, "epoch": 6669} {"train_loss": -27.481908798217773, "global_step": 553602, "epoch": 6669} {"train_loss": -27.4577579498291, "global_step": 553603, "epoch": 6669} {"train_loss": -28.12544059753418, "global_step": 553604, "epoch": 6669} {"train_loss": -27.59255027770996, "global_step": 553605, "epoch": 6669} {"train_loss": -27.424671173095703, "global_step": 553606, "epoch": 6669} {"train_loss": -27.7952938079834, "global_step": 553607, "epoch": 6669} {"train_loss": -27.85565185546875, "global_step": 553608, "epoch": 6669} {"train_loss": -27.628015058586396, "global_step": 553609, "epoch": 6669, "val_loss": 6550886.5} {"train_loss": -26.824872970581055, "global_step": 553610, "epoch": 6670} {"train_loss": -25.928876876831055, "global_step": 553611, "epoch": 6670} {"train_loss": -26.35479164123535, "global_step": 553612, "epoch": 6670} {"train_loss": -26.72340202331543, "global_step": 553613, "epoch": 6670} {"train_loss": -27.403640747070312, "global_step": 553614, "epoch": 6670} {"train_loss": -27.191455841064453, "global_step": 553615, "epoch": 6670} {"train_loss": -27.128143310546875, "global_step": 553616, "epoch": 6670} {"train_loss": -27.625171661376953, "global_step": 553617, "epoch": 6670} {"train_loss": -27.12017250061035, "global_step": 553618, "epoch": 6670} {"train_loss": -27.439971923828125, "global_step": 553619, "epoch": 6670} {"train_loss": -27.294662475585938, "global_step": 553620, "epoch": 6670} {"train_loss": -27.343381881713867, "global_step": 553621, "epoch": 6670} {"train_loss": -27.473529815673828, "global_step": 553622, "epoch": 6670} {"train_loss": -27.6049861907959, "global_step": 553623, "epoch": 6670} {"train_loss": -27.68878746032715, "global_step": 553624, "epoch": 6670} {"train_loss": -27.792245864868164, "global_step": 553625, "epoch": 6670} {"train_loss": -26.8551025390625, "global_step": 553626, "epoch": 6670} {"train_loss": -27.578805923461914, "global_step": 553627, "epoch": 6670} {"train_loss": -27.359085083007812, "global_step": 553628, "epoch": 6670} {"train_loss": -27.639188766479492, "global_step": 553629, "epoch": 6670} {"train_loss": -27.789670944213867, "global_step": 553630, "epoch": 6670} {"train_loss": -27.843708038330078, "global_step": 553631, "epoch": 6670} {"train_loss": -27.735233306884766, "global_step": 553632, "epoch": 6670} {"train_loss": -27.750171661376953, "global_step": 553633, "epoch": 6670} {"train_loss": -27.570432662963867, "global_step": 553634, "epoch": 6670} {"train_loss": -28.024765014648438, "global_step": 553635, "epoch": 6670} {"train_loss": -27.878141403198242, "global_step": 553636, "epoch": 6670} {"train_loss": -27.679767608642578, "global_step": 553637, "epoch": 6670} {"train_loss": -27.848493576049805, "global_step": 553638, "epoch": 6670} {"train_loss": -28.029020309448242, "global_step": 553639, "epoch": 6670} {"train_loss": -27.66023063659668, "global_step": 553640, "epoch": 6670} {"train_loss": -27.741886138916016, "global_step": 553641, "epoch": 6670} {"train_loss": -28.006881713867188, "global_step": 553642, "epoch": 6670} {"train_loss": -27.844436645507812, "global_step": 553643, "epoch": 6670} {"train_loss": -27.865896224975586, "global_step": 553644, "epoch": 6670} {"train_loss": -27.679845809936523, "global_step": 553645, "epoch": 6670} {"train_loss": -27.45292091369629, "global_step": 553646, "epoch": 6670} {"train_loss": -27.753559112548828, "global_step": 553647, "epoch": 6670} {"train_loss": -27.92388343811035, "global_step": 553648, "epoch": 6670} {"train_loss": -28.225299835205078, "global_step": 553649, "epoch": 6670} {"train_loss": -27.865381240844727, "global_step": 553650, "epoch": 6670} {"train_loss": -27.7574462890625, "global_step": 553651, "epoch": 6670} {"train_loss": -28.00530433654785, "global_step": 553652, "epoch": 6670} {"train_loss": -28.009357452392578, "global_step": 553653, "epoch": 6670} {"train_loss": -28.025678634643555, "global_step": 553654, "epoch": 6670} {"train_loss": -28.33365249633789, "global_step": 553655, "epoch": 6670} {"train_loss": -27.745466232299805, "global_step": 553656, "epoch": 6670} {"train_loss": -28.018798828125, "global_step": 553657, "epoch": 6670} {"train_loss": -27.909936904907227, "global_step": 553658, "epoch": 6670} {"train_loss": -27.96799659729004, "global_step": 553659, "epoch": 6670} {"train_loss": -27.911264419555664, "global_step": 553660, "epoch": 6670} {"train_loss": -27.64173698425293, "global_step": 553661, "epoch": 6670} {"train_loss": -27.907583236694336, "global_step": 553662, "epoch": 6670} {"train_loss": -26.9948673248291, "global_step": 553663, "epoch": 6670} {"train_loss": -27.421192169189453, "global_step": 553664, "epoch": 6670} {"train_loss": -26.344030380249023, "global_step": 553665, "epoch": 6670} {"train_loss": -26.44675636291504, "global_step": 553666, "epoch": 6670} {"train_loss": -26.722599029541016, "global_step": 553667, "epoch": 6670} {"train_loss": -26.91987419128418, "global_step": 553668, "epoch": 6670} {"train_loss": -27.468229293823242, "global_step": 553669, "epoch": 6670} {"train_loss": -27.30573081970215, "global_step": 553670, "epoch": 6670} {"train_loss": -27.306140899658203, "global_step": 553671, "epoch": 6670} {"train_loss": -27.400251388549805, "global_step": 553672, "epoch": 6670} {"train_loss": -27.722503662109375, "global_step": 553673, "epoch": 6670} {"train_loss": -27.941822052001953, "global_step": 553674, "epoch": 6670} {"train_loss": -27.628711700439453, "global_step": 553675, "epoch": 6670} {"train_loss": -27.629148483276367, "global_step": 553676, "epoch": 6670} {"train_loss": -27.361785888671875, "global_step": 553677, "epoch": 6670} {"train_loss": -27.661359786987305, "global_step": 553678, "epoch": 6670} {"train_loss": -27.622900009155273, "global_step": 553679, "epoch": 6670} {"train_loss": -27.549484252929688, "global_step": 553680, "epoch": 6670} {"train_loss": -27.695545196533203, "global_step": 553681, "epoch": 6670} {"train_loss": -27.82148551940918, "global_step": 553682, "epoch": 6670} {"train_loss": -27.99933433532715, "global_step": 553683, "epoch": 6670} {"train_loss": -27.337610244750977, "global_step": 553684, "epoch": 6670} {"train_loss": -27.534194946289062, "global_step": 553685, "epoch": 6670} {"train_loss": -27.6485652923584, "global_step": 553686, "epoch": 6670} {"train_loss": -27.922748565673828, "global_step": 553687, "epoch": 6670} {"train_loss": -27.8076114654541, "global_step": 553688, "epoch": 6670} {"train_loss": -27.948328018188477, "global_step": 553689, "epoch": 6670} {"train_loss": -27.746234893798828, "global_step": 553690, "epoch": 6670} {"train_loss": -27.611047744750977, "global_step": 553691, "epoch": 6670} {"train_loss": -27.556900621896766, "global_step": 553692, "epoch": 6670, "val_loss": 6598382.0} {"train_loss": -27.700153350830078, "global_step": 553693, "epoch": 6671} {"train_loss": -27.2539119720459, "global_step": 553694, "epoch": 6671} {"train_loss": -27.589385986328125, "global_step": 553695, "epoch": 6671} {"train_loss": -27.524206161499023, "global_step": 553696, "epoch": 6671} {"train_loss": -27.3836727142334, "global_step": 553697, "epoch": 6671} {"train_loss": -27.499622344970703, "global_step": 553698, "epoch": 6671} {"train_loss": -27.399677276611328, "global_step": 553699, "epoch": 6671} {"train_loss": -27.575103759765625, "global_step": 553700, "epoch": 6671} {"train_loss": -27.506744384765625, "global_step": 553701, "epoch": 6671} {"train_loss": -27.661865234375, "global_step": 553702, "epoch": 6671} {"train_loss": -27.631580352783203, "global_step": 553703, "epoch": 6671} {"train_loss": -27.482410430908203, "global_step": 553704, "epoch": 6671} {"train_loss": -27.12428092956543, "global_step": 553705, "epoch": 6671} {"train_loss": -27.387496948242188, "global_step": 553706, "epoch": 6671} {"train_loss": -27.676984786987305, "global_step": 553707, "epoch": 6671} {"train_loss": -27.247655868530273, "global_step": 553708, "epoch": 6671} {"train_loss": -27.506122589111328, "global_step": 553709, "epoch": 6671} {"train_loss": -27.887609481811523, "global_step": 553710, "epoch": 6671} {"train_loss": -27.654462814331055, "global_step": 553711, "epoch": 6671} {"train_loss": -27.64960289001465, "global_step": 553712, "epoch": 6671} {"train_loss": -27.70654296875, "global_step": 553713, "epoch": 6671} {"train_loss": -27.63909912109375, "global_step": 553714, "epoch": 6671} {"train_loss": -27.596288681030273, "global_step": 553715, "epoch": 6671} {"train_loss": -28.08253288269043, "global_step": 553716, "epoch": 6671} {"train_loss": -27.850177764892578, "global_step": 553717, "epoch": 6671} {"train_loss": -27.99915885925293, "global_step": 553718, "epoch": 6671} {"train_loss": -28.012012481689453, "global_step": 553719, "epoch": 6671} {"train_loss": -27.717151641845703, "global_step": 553720, "epoch": 6671} {"train_loss": -28.212482452392578, "global_step": 553721, "epoch": 6671} {"train_loss": -27.62346839904785, "global_step": 553722, "epoch": 6671} {"train_loss": -27.97181510925293, "global_step": 553723, "epoch": 6671} {"train_loss": -27.825571060180664, "global_step": 553724, "epoch": 6671} {"train_loss": -28.257314682006836, "global_step": 553725, "epoch": 6671} {"train_loss": -27.646560668945312, "global_step": 553726, "epoch": 6671} {"train_loss": -27.759565353393555, "global_step": 553727, "epoch": 6671} {"train_loss": -27.894744873046875, "global_step": 553728, "epoch": 6671} {"train_loss": -28.0864200592041, "global_step": 553729, "epoch": 6671} {"train_loss": -28.156652450561523, "global_step": 553730, "epoch": 6671} {"train_loss": -27.838119506835938, "global_step": 553731, "epoch": 6671} {"train_loss": -27.61529541015625, "global_step": 553732, "epoch": 6671} {"train_loss": -27.3023681640625, "global_step": 553733, "epoch": 6671} {"train_loss": -26.923009872436523, "global_step": 553734, "epoch": 6671} {"train_loss": -25.799488067626953, "global_step": 553735, "epoch": 6671} {"train_loss": -25.849109649658203, "global_step": 553736, "epoch": 6671} {"train_loss": -26.687986373901367, "global_step": 553737, "epoch": 6671} {"train_loss": -26.462854385375977, "global_step": 553738, "epoch": 6671} {"train_loss": -26.727981567382812, "global_step": 553739, "epoch": 6671} {"train_loss": -26.40728187561035, "global_step": 553740, "epoch": 6671} {"train_loss": -27.03505516052246, "global_step": 553741, "epoch": 6671} {"train_loss": -26.735143661499023, "global_step": 553742, "epoch": 6671} {"train_loss": -26.982990264892578, "global_step": 553743, "epoch": 6671} {"train_loss": -26.940885543823242, "global_step": 553744, "epoch": 6671} {"train_loss": -27.42923355102539, "global_step": 553745, "epoch": 6671} {"train_loss": -27.120752334594727, "global_step": 553746, "epoch": 6671} {"train_loss": -26.97163200378418, "global_step": 553747, "epoch": 6671} {"train_loss": -27.035486221313477, "global_step": 553748, "epoch": 6671} {"train_loss": -27.28488540649414, "global_step": 553749, "epoch": 6671} {"train_loss": -27.328001022338867, "global_step": 553750, "epoch": 6671} {"train_loss": -27.272275924682617, "global_step": 553751, "epoch": 6671} {"train_loss": -26.882614135742188, "global_step": 553752, "epoch": 6671} {"train_loss": -27.23569107055664, "global_step": 553753, "epoch": 6671} {"train_loss": -27.349048614501953, "global_step": 553754, "epoch": 6671} {"train_loss": -27.35528564453125, "global_step": 553755, "epoch": 6671} {"train_loss": -27.46211051940918, "global_step": 553756, "epoch": 6671} {"train_loss": -27.70582389831543, "global_step": 553757, "epoch": 6671} {"train_loss": -27.678821563720703, "global_step": 553758, "epoch": 6671} {"train_loss": -27.08342933654785, "global_step": 553759, "epoch": 6671} {"train_loss": -27.557544708251953, "global_step": 553760, "epoch": 6671} {"train_loss": -27.52052116394043, "global_step": 553761, "epoch": 6671} {"train_loss": -27.27402687072754, "global_step": 553762, "epoch": 6671} {"train_loss": -27.368879318237305, "global_step": 553763, "epoch": 6671} {"train_loss": -27.643402099609375, "global_step": 553764, "epoch": 6671} {"train_loss": -27.79644775390625, "global_step": 553765, "epoch": 6671} {"train_loss": -27.8084659576416, "global_step": 553766, "epoch": 6671} {"train_loss": -27.8757381439209, "global_step": 553767, "epoch": 6671} {"train_loss": -27.388463973999023, "global_step": 553768, "epoch": 6671} {"train_loss": -27.52349853515625, "global_step": 553769, "epoch": 6671} {"train_loss": -27.719648361206055, "global_step": 553770, "epoch": 6671} {"train_loss": -27.814924240112305, "global_step": 553771, "epoch": 6671} {"train_loss": -28.156558990478516, "global_step": 553772, "epoch": 6671} {"train_loss": -27.45530128479004, "global_step": 553773, "epoch": 6671} {"train_loss": -27.907855987548828, "global_step": 553774, "epoch": 6671} {"train_loss": -27.466076793440852, "global_step": 553775, "epoch": 6671, "val_loss": 6465450.0} {"train_loss": -26.979572296142578, "global_step": 553776, "epoch": 6672} {"train_loss": -27.276203155517578, "global_step": 553777, "epoch": 6672} {"train_loss": -27.365442276000977, "global_step": 553778, "epoch": 6672} {"train_loss": -26.8930606842041, "global_step": 553779, "epoch": 6672} {"train_loss": -27.524734497070312, "global_step": 553780, "epoch": 6672} {"train_loss": -27.32923698425293, "global_step": 553781, "epoch": 6672} {"train_loss": -27.619443893432617, "global_step": 553782, "epoch": 6672} {"train_loss": -27.494672775268555, "global_step": 553783, "epoch": 6672} {"train_loss": -27.4858341217041, "global_step": 553784, "epoch": 6672} {"train_loss": -27.509937286376953, "global_step": 553785, "epoch": 6672} {"train_loss": -27.45977210998535, "global_step": 553786, "epoch": 6672} {"train_loss": -27.30695152282715, "global_step": 553787, "epoch": 6672} {"train_loss": -27.177642822265625, "global_step": 553788, "epoch": 6672} {"train_loss": -27.72047233581543, "global_step": 553789, "epoch": 6672} {"train_loss": -27.626256942749023, "global_step": 553790, "epoch": 6672} {"train_loss": -27.850820541381836, "global_step": 553791, "epoch": 6672} {"train_loss": -27.803775787353516, "global_step": 553792, "epoch": 6672} {"train_loss": -27.361337661743164, "global_step": 553793, "epoch": 6672} {"train_loss": -27.23321533203125, "global_step": 553794, "epoch": 6672} {"train_loss": -27.707422256469727, "global_step": 553795, "epoch": 6672} {"train_loss": -27.841794967651367, "global_step": 553796, "epoch": 6672} {"train_loss": -27.915746688842773, "global_step": 553797, "epoch": 6672} {"train_loss": -27.63654136657715, "global_step": 553798, "epoch": 6672} {"train_loss": -27.57984733581543, "global_step": 553799, "epoch": 6672} {"train_loss": -27.80735206604004, "global_step": 553800, "epoch": 6672} {"train_loss": -28.080738067626953, "global_step": 553801, "epoch": 6672} {"train_loss": -28.028186798095703, "global_step": 553802, "epoch": 6672} {"train_loss": -27.70867347717285, "global_step": 553803, "epoch": 6672} {"train_loss": -27.7921085357666, "global_step": 553804, "epoch": 6672} {"train_loss": -27.929513931274414, "global_step": 553805, "epoch": 6672} {"train_loss": -28.003070831298828, "global_step": 553806, "epoch": 6672} {"train_loss": -27.722867965698242, "global_step": 553807, "epoch": 6672} {"train_loss": -27.916723251342773, "global_step": 553808, "epoch": 6672} {"train_loss": -27.706298828125, "global_step": 553809, "epoch": 6672} {"train_loss": -27.599233627319336, "global_step": 553810, "epoch": 6672} {"train_loss": -27.61469841003418, "global_step": 553811, "epoch": 6672} {"train_loss": -27.6885929107666, "global_step": 553812, "epoch": 6672} {"train_loss": -27.996564865112305, "global_step": 553813, "epoch": 6672} {"train_loss": -27.858184814453125, "global_step": 553814, "epoch": 6672} {"train_loss": -27.752399444580078, "global_step": 553815, "epoch": 6672} {"train_loss": -27.41794204711914, "global_step": 553816, "epoch": 6672} {"train_loss": -27.686857223510742, "global_step": 553817, "epoch": 6672} {"train_loss": -27.69135856628418, "global_step": 553818, "epoch": 6672} {"train_loss": -27.84209632873535, "global_step": 553819, "epoch": 6672} {"train_loss": -27.59388542175293, "global_step": 553820, "epoch": 6672} {"train_loss": -27.649038314819336, "global_step": 553821, "epoch": 6672} {"train_loss": -27.56534194946289, "global_step": 553822, "epoch": 6672} {"train_loss": -27.874225616455078, "global_step": 553823, "epoch": 6672} {"train_loss": -27.489383697509766, "global_step": 553824, "epoch": 6672} {"train_loss": -27.56117057800293, "global_step": 553825, "epoch": 6672} {"train_loss": -27.18851089477539, "global_step": 553826, "epoch": 6672} {"train_loss": -27.752866744995117, "global_step": 553827, "epoch": 6672} {"train_loss": -27.802881240844727, "global_step": 553828, "epoch": 6672} {"train_loss": -27.92341423034668, "global_step": 553829, "epoch": 6672} {"train_loss": -27.3544864654541, "global_step": 553830, "epoch": 6672} {"train_loss": -28.155424118041992, "global_step": 553831, "epoch": 6672} {"train_loss": -28.121912002563477, "global_step": 553832, "epoch": 6672} {"train_loss": -27.8781795501709, "global_step": 553833, "epoch": 6672} {"train_loss": -28.105737686157227, "global_step": 553834, "epoch": 6672} {"train_loss": -27.878950119018555, "global_step": 553835, "epoch": 6672} {"train_loss": -27.614004135131836, "global_step": 553836, "epoch": 6672} {"train_loss": -27.964496612548828, "global_step": 553837, "epoch": 6672} {"train_loss": -28.14484214782715, "global_step": 553838, "epoch": 6672} {"train_loss": -27.72833251953125, "global_step": 553839, "epoch": 6672} {"train_loss": -28.081268310546875, "global_step": 553840, "epoch": 6672} {"train_loss": -27.992572784423828, "global_step": 553841, "epoch": 6672} {"train_loss": -27.8424129486084, "global_step": 553842, "epoch": 6672} {"train_loss": -27.7431697845459, "global_step": 553843, "epoch": 6672} {"train_loss": -28.000797271728516, "global_step": 553844, "epoch": 6672} {"train_loss": -27.7669620513916, "global_step": 553845, "epoch": 6672} {"train_loss": -27.92865562438965, "global_step": 553846, "epoch": 6672} {"train_loss": -27.967519760131836, "global_step": 553847, "epoch": 6672} {"train_loss": -27.798019409179688, "global_step": 553848, "epoch": 6672} {"train_loss": -28.289648056030273, "global_step": 553849, "epoch": 6672} {"train_loss": -28.20586585998535, "global_step": 553850, "epoch": 6672} {"train_loss": -28.055591583251953, "global_step": 553851, "epoch": 6672} {"train_loss": -28.297582626342773, "global_step": 553852, "epoch": 6672} {"train_loss": -27.75897789001465, "global_step": 553853, "epoch": 6672} {"train_loss": -27.967453002929688, "global_step": 553854, "epoch": 6672} {"train_loss": -27.93523597717285, "global_step": 553855, "epoch": 6672} {"train_loss": -27.7672061920166, "global_step": 553856, "epoch": 6672} {"train_loss": -27.47010612487793, "global_step": 553857, "epoch": 6672} {"train_loss": -27.716679285807782, "global_step": 553858, "epoch": 6672, "val_loss": 6570277.5} {"train_loss": -27.124603271484375, "global_step": 553859, "epoch": 6673} {"train_loss": -26.9328556060791, "global_step": 553860, "epoch": 6673} {"train_loss": -27.041645050048828, "global_step": 553861, "epoch": 6673} {"train_loss": -26.29831886291504, "global_step": 553862, "epoch": 6673} {"train_loss": -26.30659294128418, "global_step": 553863, "epoch": 6673} {"train_loss": -26.70380210876465, "global_step": 553864, "epoch": 6673} {"train_loss": -27.207019805908203, "global_step": 553865, "epoch": 6673} {"train_loss": -26.72199058532715, "global_step": 553866, "epoch": 6673} {"train_loss": -27.16718864440918, "global_step": 553867, "epoch": 6673} {"train_loss": -27.295568466186523, "global_step": 553868, "epoch": 6673} {"train_loss": -26.960662841796875, "global_step": 553869, "epoch": 6673} {"train_loss": -27.6461181640625, "global_step": 553870, "epoch": 6673} {"train_loss": -26.86652946472168, "global_step": 553871, "epoch": 6673} {"train_loss": -27.45452308654785, "global_step": 553872, "epoch": 6673} {"train_loss": -27.36174964904785, "global_step": 553873, "epoch": 6673} {"train_loss": -27.09714126586914, "global_step": 553874, "epoch": 6673} {"train_loss": -27.263843536376953, "global_step": 553875, "epoch": 6673} {"train_loss": -26.92535400390625, "global_step": 553876, "epoch": 6673} {"train_loss": -27.434650421142578, "global_step": 553877, "epoch": 6673} {"train_loss": -27.02606201171875, "global_step": 553878, "epoch": 6673} {"train_loss": -27.392847061157227, "global_step": 553879, "epoch": 6673} {"train_loss": -27.572301864624023, "global_step": 553880, "epoch": 6673} {"train_loss": -27.3477840423584, "global_step": 553881, "epoch": 6673} {"train_loss": -27.80804443359375, "global_step": 553882, "epoch": 6673} {"train_loss": -27.26764488220215, "global_step": 553883, "epoch": 6673} {"train_loss": -27.382551193237305, "global_step": 553884, "epoch": 6673} {"train_loss": -27.652021408081055, "global_step": 553885, "epoch": 6673} {"train_loss": -27.63270378112793, "global_step": 553886, "epoch": 6673} {"train_loss": -27.707752227783203, "global_step": 553887, "epoch": 6673} {"train_loss": -27.756872177124023, "global_step": 553888, "epoch": 6673} {"train_loss": -27.789541244506836, "global_step": 553889, "epoch": 6673} {"train_loss": -27.90516471862793, "global_step": 553890, "epoch": 6673} {"train_loss": -27.501270294189453, "global_step": 553891, "epoch": 6673} {"train_loss": -27.725446701049805, "global_step": 553892, "epoch": 6673} {"train_loss": -27.520654678344727, "global_step": 553893, "epoch": 6673} {"train_loss": -27.598098754882812, "global_step": 553894, "epoch": 6673} {"train_loss": -27.52064323425293, "global_step": 553895, "epoch": 6673} {"train_loss": -27.680875778198242, "global_step": 553896, "epoch": 6673} {"train_loss": -27.552942276000977, "global_step": 553897, "epoch": 6673} {"train_loss": -27.8815860748291, "global_step": 553898, "epoch": 6673} {"train_loss": -27.68841552734375, "global_step": 553899, "epoch": 6673} {"train_loss": -27.917749404907227, "global_step": 553900, "epoch": 6673} {"train_loss": -27.860517501831055, "global_step": 553901, "epoch": 6673} {"train_loss": -27.653417587280273, "global_step": 553902, "epoch": 6673} {"train_loss": -27.64299964904785, "global_step": 553903, "epoch": 6673} {"train_loss": -27.666217803955078, "global_step": 553904, "epoch": 6673} {"train_loss": -27.3580322265625, "global_step": 553905, "epoch": 6673} {"train_loss": -27.71441650390625, "global_step": 553906, "epoch": 6673} {"train_loss": -27.472043991088867, "global_step": 553907, "epoch": 6673} {"train_loss": -28.0502872467041, "global_step": 553908, "epoch": 6673} {"train_loss": -27.981653213500977, "global_step": 553909, "epoch": 6673} {"train_loss": -27.91851806640625, "global_step": 553910, "epoch": 6673} {"train_loss": -27.66434669494629, "global_step": 553911, "epoch": 6673} {"train_loss": -27.970050811767578, "global_step": 553912, "epoch": 6673} {"train_loss": -28.313079833984375, "global_step": 553913, "epoch": 6673} {"train_loss": -27.662729263305664, "global_step": 553914, "epoch": 6673} {"train_loss": -27.823904037475586, "global_step": 553915, "epoch": 6673} {"train_loss": -28.133777618408203, "global_step": 553916, "epoch": 6673} {"train_loss": -27.440357208251953, "global_step": 553917, "epoch": 6673} {"train_loss": -27.36809730529785, "global_step": 553918, "epoch": 6673} {"train_loss": -27.461883544921875, "global_step": 553919, "epoch": 6673} {"train_loss": -27.745086669921875, "global_step": 553920, "epoch": 6673} {"train_loss": -27.53412437438965, "global_step": 553921, "epoch": 6673} {"train_loss": -27.9177303314209, "global_step": 553922, "epoch": 6673} {"train_loss": -27.8887996673584, "global_step": 553923, "epoch": 6673} {"train_loss": -27.826251983642578, "global_step": 553924, "epoch": 6673} {"train_loss": -27.394027709960938, "global_step": 553925, "epoch": 6673} {"train_loss": -27.7302188873291, "global_step": 553926, "epoch": 6673} {"train_loss": -27.406396865844727, "global_step": 553927, "epoch": 6673} {"train_loss": -27.992101669311523, "global_step": 553928, "epoch": 6673} {"train_loss": -27.70863914489746, "global_step": 553929, "epoch": 6673} {"train_loss": -27.677515029907227, "global_step": 553930, "epoch": 6673} {"train_loss": -27.64777946472168, "global_step": 553931, "epoch": 6673} {"train_loss": -27.76328468322754, "global_step": 553932, "epoch": 6673} {"train_loss": -27.78261375427246, "global_step": 553933, "epoch": 6673} {"train_loss": -28.10443687438965, "global_step": 553934, "epoch": 6673} {"train_loss": -27.67963981628418, "global_step": 553935, "epoch": 6673} {"train_loss": -27.923227310180664, "global_step": 553936, "epoch": 6673} {"train_loss": -27.40372657775879, "global_step": 553937, "epoch": 6673} {"train_loss": -27.984729766845703, "global_step": 553938, "epoch": 6673} {"train_loss": -27.88408851623535, "global_step": 553939, "epoch": 6673} {"train_loss": -27.823322296142578, "global_step": 553940, "epoch": 6673} {"train_loss": -27.545547370451043, "global_step": 553941, "epoch": 6673, "val_loss": 6593353.0} {"train_loss": -27.419620513916016, "global_step": 553942, "epoch": 6674} {"train_loss": -27.41521644592285, "global_step": 553943, "epoch": 6674} {"train_loss": -27.3714542388916, "global_step": 553944, "epoch": 6674} {"train_loss": -27.696027755737305, "global_step": 553945, "epoch": 6674} {"train_loss": -27.042234420776367, "global_step": 553946, "epoch": 6674} {"train_loss": -27.22446060180664, "global_step": 553947, "epoch": 6674} {"train_loss": -27.061115264892578, "global_step": 553948, "epoch": 6674} {"train_loss": -27.54767417907715, "global_step": 553949, "epoch": 6674} {"train_loss": -27.3175106048584, "global_step": 553950, "epoch": 6674} {"train_loss": -27.271121978759766, "global_step": 553951, "epoch": 6674} {"train_loss": -27.152286529541016, "global_step": 553952, "epoch": 6674} {"train_loss": -27.561201095581055, "global_step": 553953, "epoch": 6674} {"train_loss": -27.516828536987305, "global_step": 553954, "epoch": 6674} {"train_loss": -27.564611434936523, "global_step": 553955, "epoch": 6674} {"train_loss": -27.27313232421875, "global_step": 553956, "epoch": 6674} {"train_loss": -28.0310115814209, "global_step": 553957, "epoch": 6674} {"train_loss": -27.380090713500977, "global_step": 553958, "epoch": 6674} {"train_loss": -27.19342613220215, "global_step": 553959, "epoch": 6674} {"train_loss": -27.463842391967773, "global_step": 553960, "epoch": 6674} {"train_loss": -27.947317123413086, "global_step": 553961, "epoch": 6674} {"train_loss": -27.576353073120117, "global_step": 553962, "epoch": 6674} {"train_loss": -27.152576446533203, "global_step": 553963, "epoch": 6674} {"train_loss": -27.959197998046875, "global_step": 553964, "epoch": 6674} {"train_loss": -27.725208282470703, "global_step": 553965, "epoch": 6674} {"train_loss": -27.6926326751709, "global_step": 553966, "epoch": 6674} {"train_loss": -27.800336837768555, "global_step": 553967, "epoch": 6674} {"train_loss": -27.817792892456055, "global_step": 553968, "epoch": 6674} {"train_loss": -27.52587890625, "global_step": 553969, "epoch": 6674} {"train_loss": -27.650495529174805, "global_step": 553970, "epoch": 6674} {"train_loss": -27.744592666625977, "global_step": 553971, "epoch": 6674} {"train_loss": -27.708271026611328, "global_step": 553972, "epoch": 6674} {"train_loss": -27.867786407470703, "global_step": 553973, "epoch": 6674} {"train_loss": -27.629892349243164, "global_step": 553974, "epoch": 6674} {"train_loss": -27.829755783081055, "global_step": 553975, "epoch": 6674} {"train_loss": -27.961822509765625, "global_step": 553976, "epoch": 6674} {"train_loss": -27.784269332885742, "global_step": 553977, "epoch": 6674} {"train_loss": -27.71048927307129, "global_step": 553978, "epoch": 6674} {"train_loss": -28.11907386779785, "global_step": 553979, "epoch": 6674} {"train_loss": -27.8065242767334, "global_step": 553980, "epoch": 6674} {"train_loss": -27.79737663269043, "global_step": 553981, "epoch": 6674} {"train_loss": -28.070585250854492, "global_step": 553982, "epoch": 6674} {"train_loss": -27.5993709564209, "global_step": 553983, "epoch": 6674} {"train_loss": -28.49018669128418, "global_step": 553984, "epoch": 6674} {"train_loss": -28.048492431640625, "global_step": 553985, "epoch": 6674} {"train_loss": -28.039220809936523, "global_step": 553986, "epoch": 6674} {"train_loss": -28.026941299438477, "global_step": 553987, "epoch": 6674} {"train_loss": -28.1374454498291, "global_step": 553988, "epoch": 6674} {"train_loss": -27.883466720581055, "global_step": 553989, "epoch": 6674} {"train_loss": -27.82887840270996, "global_step": 553990, "epoch": 6674} {"train_loss": -27.934850692749023, "global_step": 553991, "epoch": 6674} {"train_loss": -27.528446197509766, "global_step": 553992, "epoch": 6674} {"train_loss": -27.2482852935791, "global_step": 553993, "epoch": 6674} {"train_loss": -26.650278091430664, "global_step": 553994, "epoch": 6674} {"train_loss": -27.099546432495117, "global_step": 553995, "epoch": 6674} {"train_loss": -27.408527374267578, "global_step": 553996, "epoch": 6674} {"train_loss": -27.845930099487305, "global_step": 553997, "epoch": 6674} {"train_loss": -27.123783111572266, "global_step": 553998, "epoch": 6674} {"train_loss": -27.356542587280273, "global_step": 553999, "epoch": 6674} {"train_loss": -27.1057186126709, "global_step": 554000, "epoch": 6674} {"train_loss": -27.384931564331055, "global_step": 554001, "epoch": 6674} {"train_loss": -27.658145904541016, "global_step": 554002, "epoch": 6674} {"train_loss": -27.487598419189453, "global_step": 554003, "epoch": 6674} {"train_loss": -27.470746994018555, "global_step": 554004, "epoch": 6674} {"train_loss": -27.500900268554688, "global_step": 554005, "epoch": 6674} {"train_loss": -27.455795288085938, "global_step": 554006, "epoch": 6674} {"train_loss": -27.949560165405273, "global_step": 554007, "epoch": 6674} {"train_loss": -27.86793327331543, "global_step": 554008, "epoch": 6674} {"train_loss": -27.512216567993164, "global_step": 554009, "epoch": 6674} {"train_loss": -27.550195693969727, "global_step": 554010, "epoch": 6674} {"train_loss": -27.296875, "global_step": 554011, "epoch": 6674} {"train_loss": -27.593305587768555, "global_step": 554012, "epoch": 6674} {"train_loss": -28.1796875, "global_step": 554013, "epoch": 6674} {"train_loss": -27.758956909179688, "global_step": 554014, "epoch": 6674} {"train_loss": -27.40899085998535, "global_step": 554015, "epoch": 6674} {"train_loss": -27.789356231689453, "global_step": 554016, "epoch": 6674} {"train_loss": -27.839452743530273, "global_step": 554017, "epoch": 6674} {"train_loss": -27.41462516784668, "global_step": 554018, "epoch": 6674} {"train_loss": -27.101537704467773, "global_step": 554019, "epoch": 6674} {"train_loss": -28.032514572143555, "global_step": 554020, "epoch": 6674} {"train_loss": -27.70490837097168, "global_step": 554021, "epoch": 6674} {"train_loss": -27.873178482055664, "global_step": 554022, "epoch": 6674} {"train_loss": -27.752124786376953, "global_step": 554023, "epoch": 6674} {"train_loss": -27.62147703515478, "global_step": 554024, "epoch": 6674, "val_loss": 6527937.0} {"train_loss": -26.533660888671875, "global_step": 554025, "epoch": 6675} {"train_loss": -25.26129913330078, "global_step": 554026, "epoch": 6675} {"train_loss": -26.557025909423828, "global_step": 554027, "epoch": 6675} {"train_loss": -26.208789825439453, "global_step": 554028, "epoch": 6675} {"train_loss": -26.192758560180664, "global_step": 554029, "epoch": 6675} {"train_loss": -26.6258487701416, "global_step": 554030, "epoch": 6675} {"train_loss": -26.498554229736328, "global_step": 554031, "epoch": 6675} {"train_loss": -26.62323570251465, "global_step": 554032, "epoch": 6675} {"train_loss": -26.257598876953125, "global_step": 554033, "epoch": 6675} {"train_loss": -26.860742568969727, "global_step": 554034, "epoch": 6675} {"train_loss": -27.25031089782715, "global_step": 554035, "epoch": 6675} {"train_loss": -26.854766845703125, "global_step": 554036, "epoch": 6675} {"train_loss": -27.192142486572266, "global_step": 554037, "epoch": 6675} {"train_loss": -27.111026763916016, "global_step": 554038, "epoch": 6675} {"train_loss": -27.324604034423828, "global_step": 554039, "epoch": 6675} {"train_loss": -26.79526710510254, "global_step": 554040, "epoch": 6675} {"train_loss": -27.13275146484375, "global_step": 554041, "epoch": 6675} {"train_loss": -27.533222198486328, "global_step": 554042, "epoch": 6675} {"train_loss": -27.273340225219727, "global_step": 554043, "epoch": 6675} {"train_loss": -27.36231803894043, "global_step": 554044, "epoch": 6675} {"train_loss": -27.70134925842285, "global_step": 554045, "epoch": 6675} {"train_loss": -27.433679580688477, "global_step": 554046, "epoch": 6675} {"train_loss": -27.48258399963379, "global_step": 554047, "epoch": 6675} {"train_loss": -27.169702529907227, "global_step": 554048, "epoch": 6675} {"train_loss": -27.342737197875977, "global_step": 554049, "epoch": 6675} {"train_loss": -27.690509796142578, "global_step": 554050, "epoch": 6675} {"train_loss": -27.444355010986328, "global_step": 554051, "epoch": 6675} {"train_loss": -26.99464225769043, "global_step": 554052, "epoch": 6675} {"train_loss": -27.19305419921875, "global_step": 554053, "epoch": 6675} {"train_loss": -27.762678146362305, "global_step": 554054, "epoch": 6675} {"train_loss": -27.679779052734375, "global_step": 554055, "epoch": 6675} {"train_loss": -27.4464168548584, "global_step": 554056, "epoch": 6675} {"train_loss": -27.7368221282959, "global_step": 554057, "epoch": 6675} {"train_loss": -27.667829513549805, "global_step": 554058, "epoch": 6675} {"train_loss": -27.65592384338379, "global_step": 554059, "epoch": 6675} {"train_loss": -27.68057632446289, "global_step": 554060, "epoch": 6675} {"train_loss": -27.487268447875977, "global_step": 554061, "epoch": 6675} {"train_loss": -28.1583309173584, "global_step": 554062, "epoch": 6675} {"train_loss": -27.455469131469727, "global_step": 554063, "epoch": 6675} {"train_loss": -27.641653060913086, "global_step": 554064, "epoch": 6675} {"train_loss": -27.651330947875977, "global_step": 554065, "epoch": 6675} {"train_loss": -27.533796310424805, "global_step": 554066, "epoch": 6675} {"train_loss": -27.76569175720215, "global_step": 554067, "epoch": 6675} {"train_loss": -27.735355377197266, "global_step": 554068, "epoch": 6675} {"train_loss": -27.488866806030273, "global_step": 554069, "epoch": 6675} {"train_loss": -27.784223556518555, "global_step": 554070, "epoch": 6675} {"train_loss": -28.268722534179688, "global_step": 554071, "epoch": 6675} {"train_loss": -27.56072425842285, "global_step": 554072, "epoch": 6675} {"train_loss": -27.630807876586914, "global_step": 554073, "epoch": 6675} {"train_loss": -28.29847526550293, "global_step": 554074, "epoch": 6675} {"train_loss": -27.637969970703125, "global_step": 554075, "epoch": 6675} {"train_loss": -27.659208297729492, "global_step": 554076, "epoch": 6675} {"train_loss": -27.54446792602539, "global_step": 554077, "epoch": 6675} {"train_loss": -27.790878295898438, "global_step": 554078, "epoch": 6675} {"train_loss": -27.570531845092773, "global_step": 554079, "epoch": 6675} {"train_loss": -27.8261775970459, "global_step": 554080, "epoch": 6675} {"train_loss": -27.8638858795166, "global_step": 554081, "epoch": 6675} {"train_loss": -27.176502227783203, "global_step": 554082, "epoch": 6675} {"train_loss": -28.301177978515625, "global_step": 554083, "epoch": 6675} {"train_loss": -27.577783584594727, "global_step": 554084, "epoch": 6675} {"train_loss": -27.820484161376953, "global_step": 554085, "epoch": 6675} {"train_loss": -27.966459274291992, "global_step": 554086, "epoch": 6675} {"train_loss": -27.868732452392578, "global_step": 554087, "epoch": 6675} {"train_loss": -27.899600982666016, "global_step": 554088, "epoch": 6675} {"train_loss": -27.93756103515625, "global_step": 554089, "epoch": 6675} {"train_loss": -27.863876342773438, "global_step": 554090, "epoch": 6675} {"train_loss": -27.352705001831055, "global_step": 554091, "epoch": 6675} {"train_loss": -27.48736000061035, "global_step": 554092, "epoch": 6675} {"train_loss": -27.885421752929688, "global_step": 554093, "epoch": 6675} {"train_loss": -27.717639923095703, "global_step": 554094, "epoch": 6675} {"train_loss": -27.07269859313965, "global_step": 554095, "epoch": 6675} {"train_loss": -27.19854736328125, "global_step": 554096, "epoch": 6675} {"train_loss": -27.8316650390625, "global_step": 554097, "epoch": 6675} {"train_loss": -27.07876968383789, "global_step": 554098, "epoch": 6675} {"train_loss": -27.89841651916504, "global_step": 554099, "epoch": 6675} {"train_loss": -27.326480865478516, "global_step": 554100, "epoch": 6675} {"train_loss": -27.765207290649414, "global_step": 554101, "epoch": 6675} {"train_loss": -27.649322509765625, "global_step": 554102, "epoch": 6675} {"train_loss": -27.490835189819336, "global_step": 554103, "epoch": 6675} {"train_loss": -27.492572784423828, "global_step": 554104, "epoch": 6675} {"train_loss": -27.904743194580078, "global_step": 554105, "epoch": 6675} {"train_loss": -27.34115982055664, "global_step": 554106, "epoch": 6675} {"train_loss": -27.41214106456343, "global_step": 554107, "epoch": 6675, "val_loss": 6509818.0} {"train_loss": -27.24300193786621, "global_step": 554108, "epoch": 6676} {"train_loss": -26.4411563873291, "global_step": 554109, "epoch": 6676} {"train_loss": -26.435083389282227, "global_step": 554110, "epoch": 6676} {"train_loss": -27.06135368347168, "global_step": 554111, "epoch": 6676} {"train_loss": -26.6897029876709, "global_step": 554112, "epoch": 6676} {"train_loss": -27.192413330078125, "global_step": 554113, "epoch": 6676} {"train_loss": -27.039464950561523, "global_step": 554114, "epoch": 6676} {"train_loss": -26.92998695373535, "global_step": 554115, "epoch": 6676} {"train_loss": -26.81792640686035, "global_step": 554116, "epoch": 6676} {"train_loss": -27.208282470703125, "global_step": 554117, "epoch": 6676} {"train_loss": -26.875646591186523, "global_step": 554118, "epoch": 6676} {"train_loss": -26.75825309753418, "global_step": 554119, "epoch": 6676} {"train_loss": -27.226957321166992, "global_step": 554120, "epoch": 6676} {"train_loss": -27.479833602905273, "global_step": 554121, "epoch": 6676} {"train_loss": -27.255361557006836, "global_step": 554122, "epoch": 6676} {"train_loss": -26.81135368347168, "global_step": 554123, "epoch": 6676} {"train_loss": -27.292877197265625, "global_step": 554124, "epoch": 6676} {"train_loss": -27.033994674682617, "global_step": 554125, "epoch": 6676} {"train_loss": -27.30735206604004, "global_step": 554126, "epoch": 6676} {"train_loss": -27.32594108581543, "global_step": 554127, "epoch": 6676} {"train_loss": -27.455036163330078, "global_step": 554128, "epoch": 6676} {"train_loss": -27.52423667907715, "global_step": 554129, "epoch": 6676} {"train_loss": -27.715402603149414, "global_step": 554130, "epoch": 6676} {"train_loss": -27.681976318359375, "global_step": 554131, "epoch": 6676} {"train_loss": -27.5068302154541, "global_step": 554132, "epoch": 6676} {"train_loss": -27.460615158081055, "global_step": 554133, "epoch": 6676} {"train_loss": -27.326309204101562, "global_step": 554134, "epoch": 6676} {"train_loss": -27.9100399017334, "global_step": 554135, "epoch": 6676} {"train_loss": -27.857080459594727, "global_step": 554136, "epoch": 6676} {"train_loss": -27.730581283569336, "global_step": 554137, "epoch": 6676} {"train_loss": -28.058944702148438, "global_step": 554138, "epoch": 6676} {"train_loss": -27.7584171295166, "global_step": 554139, "epoch": 6676} {"train_loss": -27.948440551757812, "global_step": 554140, "epoch": 6676} {"train_loss": -27.765579223632812, "global_step": 554141, "epoch": 6676} {"train_loss": -27.80691909790039, "global_step": 554142, "epoch": 6676} {"train_loss": -27.81199073791504, "global_step": 554143, "epoch": 6676} {"train_loss": -27.64887046813965, "global_step": 554144, "epoch": 6676} {"train_loss": -28.0478515625, "global_step": 554145, "epoch": 6676} {"train_loss": -28.088138580322266, "global_step": 554146, "epoch": 6676} {"train_loss": -27.88703727722168, "global_step": 554147, "epoch": 6676} {"train_loss": -28.023746490478516, "global_step": 554148, "epoch": 6676} {"train_loss": -27.90185546875, "global_step": 554149, "epoch": 6676} {"train_loss": -28.12946128845215, "global_step": 554150, "epoch": 6676} {"train_loss": -28.183874130249023, "global_step": 554151, "epoch": 6676} {"train_loss": -27.929304122924805, "global_step": 554152, "epoch": 6676} {"train_loss": -28.054121017456055, "global_step": 554153, "epoch": 6676} {"train_loss": -28.0969181060791, "global_step": 554154, "epoch": 6676} {"train_loss": -28.058258056640625, "global_step": 554155, "epoch": 6676} {"train_loss": -27.48451805114746, "global_step": 554156, "epoch": 6676} {"train_loss": -27.94769287109375, "global_step": 554157, "epoch": 6676} {"train_loss": -27.976160049438477, "global_step": 554158, "epoch": 6676} {"train_loss": -27.617237091064453, "global_step": 554159, "epoch": 6676} {"train_loss": -27.6522274017334, "global_step": 554160, "epoch": 6676} {"train_loss": -28.482046127319336, "global_step": 554161, "epoch": 6676} {"train_loss": -27.538843154907227, "global_step": 554162, "epoch": 6676} {"train_loss": -27.714160919189453, "global_step": 554163, "epoch": 6676} {"train_loss": -27.864965438842773, "global_step": 554164, "epoch": 6676} {"train_loss": -27.94287109375, "global_step": 554165, "epoch": 6676} {"train_loss": -26.763486862182617, "global_step": 554166, "epoch": 6676} {"train_loss": -27.490528106689453, "global_step": 554167, "epoch": 6676} {"train_loss": -27.1402530670166, "global_step": 554168, "epoch": 6676} {"train_loss": -26.99853515625, "global_step": 554169, "epoch": 6676} {"train_loss": -27.017744064331055, "global_step": 554170, "epoch": 6676} {"train_loss": -26.84055519104004, "global_step": 554171, "epoch": 6676} {"train_loss": -27.109760284423828, "global_step": 554172, "epoch": 6676} {"train_loss": -27.504108428955078, "global_step": 554173, "epoch": 6676} {"train_loss": -27.286640167236328, "global_step": 554174, "epoch": 6676} {"train_loss": -27.930622100830078, "global_step": 554175, "epoch": 6676} {"train_loss": -27.473758697509766, "global_step": 554176, "epoch": 6676} {"train_loss": -27.596466064453125, "global_step": 554177, "epoch": 6676} {"train_loss": -27.401899337768555, "global_step": 554178, "epoch": 6676} {"train_loss": -27.516971588134766, "global_step": 554179, "epoch": 6676} {"train_loss": -27.6654109954834, "global_step": 554180, "epoch": 6676} {"train_loss": -27.38993263244629, "global_step": 554181, "epoch": 6676} {"train_loss": -27.827594757080078, "global_step": 554182, "epoch": 6676} {"train_loss": -27.839269638061523, "global_step": 554183, "epoch": 6676} {"train_loss": -27.42803955078125, "global_step": 554184, "epoch": 6676} {"train_loss": -27.1925106048584, "global_step": 554185, "epoch": 6676} {"train_loss": -27.472061157226562, "global_step": 554186, "epoch": 6676} {"train_loss": -27.600873947143555, "global_step": 554187, "epoch": 6676} {"train_loss": -27.549518585205078, "global_step": 554188, "epoch": 6676} {"train_loss": -27.266931533813477, "global_step": 554189, "epoch": 6676} {"train_loss": -27.505613441926887, "global_step": 554190, "epoch": 6676, "val_loss": 6552765.0} {"train_loss": -27.127460479736328, "global_step": 554191, "epoch": 6677} {"train_loss": -27.735319137573242, "global_step": 554192, "epoch": 6677} {"train_loss": -27.058822631835938, "global_step": 554193, "epoch": 6677} {"train_loss": -27.585865020751953, "global_step": 554194, "epoch": 6677} {"train_loss": -27.56459617614746, "global_step": 554195, "epoch": 6677} {"train_loss": -27.480344772338867, "global_step": 554196, "epoch": 6677} {"train_loss": -27.588438034057617, "global_step": 554197, "epoch": 6677} {"train_loss": -27.395986557006836, "global_step": 554198, "epoch": 6677} {"train_loss": -27.966053009033203, "global_step": 554199, "epoch": 6677} {"train_loss": -27.496936798095703, "global_step": 554200, "epoch": 6677} {"train_loss": -27.598743438720703, "global_step": 554201, "epoch": 6677} {"train_loss": -27.680418014526367, "global_step": 554202, "epoch": 6677} {"train_loss": -27.742645263671875, "global_step": 554203, "epoch": 6677} {"train_loss": -27.664602279663086, "global_step": 554204, "epoch": 6677} {"train_loss": -27.761184692382812, "global_step": 554205, "epoch": 6677} {"train_loss": -28.046850204467773, "global_step": 554206, "epoch": 6677} {"train_loss": -27.624835968017578, "global_step": 554207, "epoch": 6677} {"train_loss": -27.801939010620117, "global_step": 554208, "epoch": 6677} {"train_loss": -28.09834098815918, "global_step": 554209, "epoch": 6677} {"train_loss": -27.673261642456055, "global_step": 554210, "epoch": 6677} {"train_loss": -27.429853439331055, "global_step": 554211, "epoch": 6677} {"train_loss": -27.935443878173828, "global_step": 554212, "epoch": 6677} {"train_loss": -27.83208656311035, "global_step": 554213, "epoch": 6677} {"train_loss": -28.029590606689453, "global_step": 554214, "epoch": 6677} {"train_loss": -27.86310386657715, "global_step": 554215, "epoch": 6677} {"train_loss": -27.879058837890625, "global_step": 554216, "epoch": 6677} {"train_loss": -27.746118545532227, "global_step": 554217, "epoch": 6677} {"train_loss": -28.2124080657959, "global_step": 554218, "epoch": 6677} {"train_loss": -28.126752853393555, "global_step": 554219, "epoch": 6677} {"train_loss": -28.016265869140625, "global_step": 554220, "epoch": 6677} {"train_loss": -27.831750869750977, "global_step": 554221, "epoch": 6677} {"train_loss": -27.626306533813477, "global_step": 554222, "epoch": 6677} {"train_loss": -27.827295303344727, "global_step": 554223, "epoch": 6677} {"train_loss": -28.08649253845215, "global_step": 554224, "epoch": 6677} {"train_loss": -27.482257843017578, "global_step": 554225, "epoch": 6677} {"train_loss": -27.765186309814453, "global_step": 554226, "epoch": 6677} {"train_loss": -27.74481773376465, "global_step": 554227, "epoch": 6677} {"train_loss": -27.841535568237305, "global_step": 554228, "epoch": 6677} {"train_loss": -27.929712295532227, "global_step": 554229, "epoch": 6677} {"train_loss": -27.8041934967041, "global_step": 554230, "epoch": 6677} {"train_loss": -27.846878051757812, "global_step": 554231, "epoch": 6677} {"train_loss": -27.822925567626953, "global_step": 554232, "epoch": 6677} {"train_loss": -28.22334098815918, "global_step": 554233, "epoch": 6677} {"train_loss": -27.99659538269043, "global_step": 554234, "epoch": 6677} {"train_loss": -28.223730087280273, "global_step": 554235, "epoch": 6677} {"train_loss": -27.4600772857666, "global_step": 554236, "epoch": 6677} {"train_loss": -27.840784072875977, "global_step": 554237, "epoch": 6677} {"train_loss": -28.045764923095703, "global_step": 554238, "epoch": 6677} {"train_loss": -27.6058349609375, "global_step": 554239, "epoch": 6677} {"train_loss": -28.16476821899414, "global_step": 554240, "epoch": 6677} {"train_loss": -27.87684440612793, "global_step": 554241, "epoch": 6677} {"train_loss": -27.687177658081055, "global_step": 554242, "epoch": 6677} {"train_loss": -27.800933837890625, "global_step": 554243, "epoch": 6677} {"train_loss": -27.566852569580078, "global_step": 554244, "epoch": 6677} {"train_loss": -27.810413360595703, "global_step": 554245, "epoch": 6677} {"train_loss": -27.96656608581543, "global_step": 554246, "epoch": 6677} {"train_loss": -27.85584831237793, "global_step": 554247, "epoch": 6677} {"train_loss": -27.783496856689453, "global_step": 554248, "epoch": 6677} {"train_loss": -27.669315338134766, "global_step": 554249, "epoch": 6677} {"train_loss": -28.03570556640625, "global_step": 554250, "epoch": 6677} {"train_loss": -27.917516708374023, "global_step": 554251, "epoch": 6677} {"train_loss": -27.424274444580078, "global_step": 554252, "epoch": 6677} {"train_loss": -27.609418869018555, "global_step": 554253, "epoch": 6677} {"train_loss": -27.733097076416016, "global_step": 554254, "epoch": 6677} {"train_loss": -27.975584030151367, "global_step": 554255, "epoch": 6677} {"train_loss": -27.4791202545166, "global_step": 554256, "epoch": 6677} {"train_loss": -27.986343383789062, "global_step": 554257, "epoch": 6677} {"train_loss": -27.469263076782227, "global_step": 554258, "epoch": 6677} {"train_loss": -27.686935424804688, "global_step": 554259, "epoch": 6677} {"train_loss": -27.693090438842773, "global_step": 554260, "epoch": 6677} {"train_loss": -27.3802490234375, "global_step": 554261, "epoch": 6677} {"train_loss": -27.5030517578125, "global_step": 554262, "epoch": 6677} {"train_loss": -27.704757690429688, "global_step": 554263, "epoch": 6677} {"train_loss": -27.790761947631836, "global_step": 554264, "epoch": 6677} {"train_loss": -27.726470947265625, "global_step": 554265, "epoch": 6677} {"train_loss": -27.408849716186523, "global_step": 554266, "epoch": 6677} {"train_loss": -27.71516227722168, "global_step": 554267, "epoch": 6677} {"train_loss": -27.584003448486328, "global_step": 554268, "epoch": 6677} {"train_loss": -27.605443954467773, "global_step": 554269, "epoch": 6677} {"train_loss": -27.94439697265625, "global_step": 554270, "epoch": 6677} {"train_loss": -27.730024337768555, "global_step": 554271, "epoch": 6677} {"train_loss": -28.040943145751953, "global_step": 554272, "epoch": 6677} {"train_loss": -27.75913360319942, "global_step": 554273, "epoch": 6677, "val_loss": 6623680.0} {"train_loss": -27.3692684173584, "global_step": 554274, "epoch": 6678} {"train_loss": -27.191024780273438, "global_step": 554275, "epoch": 6678} {"train_loss": -27.23626136779785, "global_step": 554276, "epoch": 6678} {"train_loss": -26.93946647644043, "global_step": 554277, "epoch": 6678} {"train_loss": -27.454736709594727, "global_step": 554278, "epoch": 6678} {"train_loss": -27.637048721313477, "global_step": 554279, "epoch": 6678} {"train_loss": -27.32196044921875, "global_step": 554280, "epoch": 6678} {"train_loss": -26.905872344970703, "global_step": 554281, "epoch": 6678} {"train_loss": -27.178638458251953, "global_step": 554282, "epoch": 6678} {"train_loss": -27.47047233581543, "global_step": 554283, "epoch": 6678} {"train_loss": -27.32063102722168, "global_step": 554284, "epoch": 6678} {"train_loss": -27.654333114624023, "global_step": 554285, "epoch": 6678} {"train_loss": -27.669973373413086, "global_step": 554286, "epoch": 6678} {"train_loss": -27.487476348876953, "global_step": 554287, "epoch": 6678} {"train_loss": -27.4567813873291, "global_step": 554288, "epoch": 6678} {"train_loss": -27.548288345336914, "global_step": 554289, "epoch": 6678} {"train_loss": -27.633087158203125, "global_step": 554290, "epoch": 6678} {"train_loss": -27.295948028564453, "global_step": 554291, "epoch": 6678} {"train_loss": -27.447294235229492, "global_step": 554292, "epoch": 6678} {"train_loss": -27.491138458251953, "global_step": 554293, "epoch": 6678} {"train_loss": -27.487075805664062, "global_step": 554294, "epoch": 6678} {"train_loss": -27.476404190063477, "global_step": 554295, "epoch": 6678} {"train_loss": -27.73402976989746, "global_step": 554296, "epoch": 6678} {"train_loss": -27.312641143798828, "global_step": 554297, "epoch": 6678} {"train_loss": -27.608661651611328, "global_step": 554298, "epoch": 6678} {"train_loss": -27.6682071685791, "global_step": 554299, "epoch": 6678} {"train_loss": -27.567230224609375, "global_step": 554300, "epoch": 6678} {"train_loss": -27.286334991455078, "global_step": 554301, "epoch": 6678} {"train_loss": -27.779678344726562, "global_step": 554302, "epoch": 6678} {"train_loss": -27.715681076049805, "global_step": 554303, "epoch": 6678} {"train_loss": -27.765085220336914, "global_step": 554304, "epoch": 6678} {"train_loss": -27.7018985748291, "global_step": 554305, "epoch": 6678} {"train_loss": -27.73026466369629, "global_step": 554306, "epoch": 6678} {"train_loss": -27.808996200561523, "global_step": 554307, "epoch": 6678} {"train_loss": -27.70063591003418, "global_step": 554308, "epoch": 6678} {"train_loss": -27.83607292175293, "global_step": 554309, "epoch": 6678} {"train_loss": -27.8804988861084, "global_step": 554310, "epoch": 6678} {"train_loss": -27.824676513671875, "global_step": 554311, "epoch": 6678} {"train_loss": -27.833099365234375, "global_step": 554312, "epoch": 6678} {"train_loss": -27.654401779174805, "global_step": 554313, "epoch": 6678} {"train_loss": -28.02997398376465, "global_step": 554314, "epoch": 6678} {"train_loss": -27.653066635131836, "global_step": 554315, "epoch": 6678} {"train_loss": -27.888975143432617, "global_step": 554316, "epoch": 6678} {"train_loss": -27.354297637939453, "global_step": 554317, "epoch": 6678} {"train_loss": -28.032093048095703, "global_step": 554318, "epoch": 6678} {"train_loss": -27.9831600189209, "global_step": 554319, "epoch": 6678} {"train_loss": -27.56525230407715, "global_step": 554320, "epoch": 6678} {"train_loss": -27.410968780517578, "global_step": 554321, "epoch": 6678} {"train_loss": -27.758935928344727, "global_step": 554322, "epoch": 6678} {"train_loss": -27.76021385192871, "global_step": 554323, "epoch": 6678} {"train_loss": -27.747516632080078, "global_step": 554324, "epoch": 6678} {"train_loss": -27.8344783782959, "global_step": 554325, "epoch": 6678} {"train_loss": -27.810775756835938, "global_step": 554326, "epoch": 6678} {"train_loss": -27.61982536315918, "global_step": 554327, "epoch": 6678} {"train_loss": -27.80604362487793, "global_step": 554328, "epoch": 6678} {"train_loss": -27.984119415283203, "global_step": 554329, "epoch": 6678} {"train_loss": -27.364673614501953, "global_step": 554330, "epoch": 6678} {"train_loss": -27.987844467163086, "global_step": 554331, "epoch": 6678} {"train_loss": -27.80669593811035, "global_step": 554332, "epoch": 6678} {"train_loss": -27.833356857299805, "global_step": 554333, "epoch": 6678} {"train_loss": -27.833112716674805, "global_step": 554334, "epoch": 6678} {"train_loss": -28.30317497253418, "global_step": 554335, "epoch": 6678} {"train_loss": -28.300464630126953, "global_step": 554336, "epoch": 6678} {"train_loss": -27.634122848510742, "global_step": 554337, "epoch": 6678} {"train_loss": -27.988861083984375, "global_step": 554338, "epoch": 6678} {"train_loss": -28.072561264038086, "global_step": 554339, "epoch": 6678} {"train_loss": -28.20942497253418, "global_step": 554340, "epoch": 6678} {"train_loss": -27.791330337524414, "global_step": 554341, "epoch": 6678} {"train_loss": -27.653900146484375, "global_step": 554342, "epoch": 6678} {"train_loss": -27.732574462890625, "global_step": 554343, "epoch": 6678} {"train_loss": -27.71213150024414, "global_step": 554344, "epoch": 6678} {"train_loss": -28.095996856689453, "global_step": 554345, "epoch": 6678} {"train_loss": -27.942529678344727, "global_step": 554346, "epoch": 6678} {"train_loss": -27.878305435180664, "global_step": 554347, "epoch": 6678} {"train_loss": -27.9016170501709, "global_step": 554348, "epoch": 6678} {"train_loss": -27.742658615112305, "global_step": 554349, "epoch": 6678} {"train_loss": -27.865514755249023, "global_step": 554350, "epoch": 6678} {"train_loss": -27.8197021484375, "global_step": 554351, "epoch": 6678} {"train_loss": -27.96535301208496, "global_step": 554352, "epoch": 6678} {"train_loss": -27.570905685424805, "global_step": 554353, "epoch": 6678} {"train_loss": -27.857257843017578, "global_step": 554354, "epoch": 6678} {"train_loss": -27.234113693237305, "global_step": 554355, "epoch": 6678} {"train_loss": -27.65757684822542, "global_step": 554356, "epoch": 6678, "val_loss": 6636886.0} {"train_loss": -22.47287368774414, "global_step": 554357, "epoch": 6679} {"train_loss": -24.08807373046875, "global_step": 554358, "epoch": 6679} {"train_loss": -25.148962020874023, "global_step": 554359, "epoch": 6679} {"train_loss": -24.150333404541016, "global_step": 554360, "epoch": 6679} {"train_loss": -25.283567428588867, "global_step": 554361, "epoch": 6679} {"train_loss": -25.648242950439453, "global_step": 554362, "epoch": 6679} {"train_loss": -24.801481246948242, "global_step": 554363, "epoch": 6679} {"train_loss": -26.387592315673828, "global_step": 554364, "epoch": 6679} {"train_loss": -26.38232421875, "global_step": 554365, "epoch": 6679} {"train_loss": -26.038232803344727, "global_step": 554366, "epoch": 6679} {"train_loss": -25.801725387573242, "global_step": 554367, "epoch": 6679} {"train_loss": -26.384906768798828, "global_step": 554368, "epoch": 6679} {"train_loss": -26.719924926757812, "global_step": 554369, "epoch": 6679} {"train_loss": -26.20755958557129, "global_step": 554370, "epoch": 6679} {"train_loss": -26.368167877197266, "global_step": 554371, "epoch": 6679} {"train_loss": -26.7047176361084, "global_step": 554372, "epoch": 6679} {"train_loss": -26.765043258666992, "global_step": 554373, "epoch": 6679} {"train_loss": -26.596654891967773, "global_step": 554374, "epoch": 6679} {"train_loss": -26.73919105529785, "global_step": 554375, "epoch": 6679} {"train_loss": -26.619470596313477, "global_step": 554376, "epoch": 6679} {"train_loss": -26.24835205078125, "global_step": 554377, "epoch": 6679} {"train_loss": -26.69475746154785, "global_step": 554378, "epoch": 6679} {"train_loss": -26.418537139892578, "global_step": 554379, "epoch": 6679} {"train_loss": -26.73005485534668, "global_step": 554380, "epoch": 6679} {"train_loss": -26.490949630737305, "global_step": 554381, "epoch": 6679} {"train_loss": -26.60589027404785, "global_step": 554382, "epoch": 6679} {"train_loss": -26.55109214782715, "global_step": 554383, "epoch": 6679} {"train_loss": -26.71213150024414, "global_step": 554384, "epoch": 6679} {"train_loss": -26.77593994140625, "global_step": 554385, "epoch": 6679} {"train_loss": -26.992523193359375, "global_step": 554386, "epoch": 6679} {"train_loss": -26.76018714904785, "global_step": 554387, "epoch": 6679} {"train_loss": -27.035329818725586, "global_step": 554388, "epoch": 6679} {"train_loss": -26.96906852722168, "global_step": 554389, "epoch": 6679} {"train_loss": -27.160083770751953, "global_step": 554390, "epoch": 6679} {"train_loss": -27.17659568786621, "global_step": 554391, "epoch": 6679} {"train_loss": -26.74024772644043, "global_step": 554392, "epoch": 6679} {"train_loss": -26.813690185546875, "global_step": 554393, "epoch": 6679} {"train_loss": -27.196807861328125, "global_step": 554394, "epoch": 6679} {"train_loss": -27.376300811767578, "global_step": 554395, "epoch": 6679} {"train_loss": -27.0440731048584, "global_step": 554396, "epoch": 6679} {"train_loss": -27.23432731628418, "global_step": 554397, "epoch": 6679} {"train_loss": -27.31886100769043, "global_step": 554398, "epoch": 6679} {"train_loss": -27.409454345703125, "global_step": 554399, "epoch": 6679} {"train_loss": -27.178625106811523, "global_step": 554400, "epoch": 6679} {"train_loss": -27.543292999267578, "global_step": 554401, "epoch": 6679} {"train_loss": -27.128198623657227, "global_step": 554402, "epoch": 6679} {"train_loss": -27.719013214111328, "global_step": 554403, "epoch": 6679} {"train_loss": -27.370319366455078, "global_step": 554404, "epoch": 6679} {"train_loss": -27.29367446899414, "global_step": 554405, "epoch": 6679} {"train_loss": -27.441741943359375, "global_step": 554406, "epoch": 6679} {"train_loss": -27.480146408081055, "global_step": 554407, "epoch": 6679} {"train_loss": -27.630115509033203, "global_step": 554408, "epoch": 6679} {"train_loss": -27.823261260986328, "global_step": 554409, "epoch": 6679} {"train_loss": -27.541400909423828, "global_step": 554410, "epoch": 6679} {"train_loss": -27.7968692779541, "global_step": 554411, "epoch": 6679} {"train_loss": -27.772512435913086, "global_step": 554412, "epoch": 6679} {"train_loss": -27.624738693237305, "global_step": 554413, "epoch": 6679} {"train_loss": -27.6368408203125, "global_step": 554414, "epoch": 6679} {"train_loss": -27.456689834594727, "global_step": 554415, "epoch": 6679} {"train_loss": -28.329212188720703, "global_step": 554416, "epoch": 6679} {"train_loss": -27.949188232421875, "global_step": 554417, "epoch": 6679} {"train_loss": -27.679107666015625, "global_step": 554418, "epoch": 6679} {"train_loss": -27.872943878173828, "global_step": 554419, "epoch": 6679} {"train_loss": -27.977216720581055, "global_step": 554420, "epoch": 6679} {"train_loss": -27.9403133392334, "global_step": 554421, "epoch": 6679} {"train_loss": -27.650558471679688, "global_step": 554422, "epoch": 6679} {"train_loss": -27.544696807861328, "global_step": 554423, "epoch": 6679} {"train_loss": -28.05586051940918, "global_step": 554424, "epoch": 6679} {"train_loss": -27.58820915222168, "global_step": 554425, "epoch": 6679} {"train_loss": -27.631887435913086, "global_step": 554426, "epoch": 6679} {"train_loss": -27.616153717041016, "global_step": 554427, "epoch": 6679} {"train_loss": -27.494138717651367, "global_step": 554428, "epoch": 6679} {"train_loss": -27.704715728759766, "global_step": 554429, "epoch": 6679} {"train_loss": -28.121923446655273, "global_step": 554430, "epoch": 6679} {"train_loss": -28.00441551208496, "global_step": 554431, "epoch": 6679} {"train_loss": -27.731664657592773, "global_step": 554432, "epoch": 6679} {"train_loss": -27.27596092224121, "global_step": 554433, "epoch": 6679} {"train_loss": -27.4847469329834, "global_step": 554434, "epoch": 6679} {"train_loss": -27.429244995117188, "global_step": 554435, "epoch": 6679} {"train_loss": -28.034149169921875, "global_step": 554436, "epoch": 6679} {"train_loss": -27.569486618041992, "global_step": 554437, "epoch": 6679} {"train_loss": -27.757299423217773, "global_step": 554438, "epoch": 6679} {"train_loss": -26.98986370592232, "global_step": 554439, "epoch": 6679, "val_loss": 6516786.5} {"train_loss": -27.454727172851562, "global_step": 554440, "epoch": 6680} {"train_loss": -27.9435977935791, "global_step": 554441, "epoch": 6680} {"train_loss": -27.857580184936523, "global_step": 554442, "epoch": 6680} {"train_loss": -28.024145126342773, "global_step": 554443, "epoch": 6680} {"train_loss": -27.765350341796875, "global_step": 554444, "epoch": 6680} {"train_loss": -27.63909339904785, "global_step": 554445, "epoch": 6680} {"train_loss": -27.83319091796875, "global_step": 554446, "epoch": 6680} {"train_loss": -27.457809448242188, "global_step": 554447, "epoch": 6680} {"train_loss": -27.90597915649414, "global_step": 554448, "epoch": 6680} {"train_loss": -28.343992233276367, "global_step": 554449, "epoch": 6680} {"train_loss": -27.68158531188965, "global_step": 554450, "epoch": 6680} {"train_loss": -27.859603881835938, "global_step": 554451, "epoch": 6680} {"train_loss": -27.78366470336914, "global_step": 554452, "epoch": 6680} {"train_loss": -27.61481285095215, "global_step": 554453, "epoch": 6680} {"train_loss": -27.28926658630371, "global_step": 554454, "epoch": 6680} {"train_loss": -27.46625328063965, "global_step": 554455, "epoch": 6680} {"train_loss": -27.743988037109375, "global_step": 554456, "epoch": 6680} {"train_loss": -27.29798698425293, "global_step": 554457, "epoch": 6680} {"train_loss": -27.640817642211914, "global_step": 554458, "epoch": 6680} {"train_loss": -27.65277671813965, "global_step": 554459, "epoch": 6680} {"train_loss": -27.71185874938965, "global_step": 554460, "epoch": 6680} {"train_loss": -27.69061279296875, "global_step": 554461, "epoch": 6680} {"train_loss": -27.41316795349121, "global_step": 554462, "epoch": 6680} {"train_loss": -27.765775680541992, "global_step": 554463, "epoch": 6680} {"train_loss": -27.837848663330078, "global_step": 554464, "epoch": 6680} {"train_loss": -27.52945327758789, "global_step": 554465, "epoch": 6680} {"train_loss": -27.454437255859375, "global_step": 554466, "epoch": 6680} {"train_loss": -28.077335357666016, "global_step": 554467, "epoch": 6680} {"train_loss": -27.93448257446289, "global_step": 554468, "epoch": 6680} {"train_loss": -27.791400909423828, "global_step": 554469, "epoch": 6680} {"train_loss": -27.83418846130371, "global_step": 554470, "epoch": 6680} {"train_loss": -27.89642333984375, "global_step": 554471, "epoch": 6680} {"train_loss": -28.022314071655273, "global_step": 554472, "epoch": 6680} {"train_loss": -27.97574806213379, "global_step": 554473, "epoch": 6680} {"train_loss": -28.052534103393555, "global_step": 554474, "epoch": 6680} {"train_loss": -28.027286529541016, "global_step": 554475, "epoch": 6680} {"train_loss": -27.47885513305664, "global_step": 554476, "epoch": 6680} {"train_loss": -27.598188400268555, "global_step": 554477, "epoch": 6680} {"train_loss": -27.31658363342285, "global_step": 554478, "epoch": 6680} {"train_loss": -26.86094093322754, "global_step": 554479, "epoch": 6680} {"train_loss": -27.57672691345215, "global_step": 554480, "epoch": 6680} {"train_loss": -28.052343368530273, "global_step": 554481, "epoch": 6680} {"train_loss": -27.58538246154785, "global_step": 554482, "epoch": 6680} {"train_loss": -27.4663028717041, "global_step": 554483, "epoch": 6680} {"train_loss": -27.481983184814453, "global_step": 554484, "epoch": 6680} {"train_loss": -27.430707931518555, "global_step": 554485, "epoch": 6680} {"train_loss": -27.937719345092773, "global_step": 554486, "epoch": 6680} {"train_loss": -27.69776725769043, "global_step": 554487, "epoch": 6680} {"train_loss": -27.71809196472168, "global_step": 554488, "epoch": 6680} {"train_loss": -28.115570068359375, "global_step": 554489, "epoch": 6680} {"train_loss": -28.120075225830078, "global_step": 554490, "epoch": 6680} {"train_loss": -27.839202880859375, "global_step": 554491, "epoch": 6680} {"train_loss": -27.894214630126953, "global_step": 554492, "epoch": 6680} {"train_loss": -27.89674949645996, "global_step": 554493, "epoch": 6680} {"train_loss": -28.0638370513916, "global_step": 554494, "epoch": 6680} {"train_loss": -27.93694496154785, "global_step": 554495, "epoch": 6680} {"train_loss": -27.690088272094727, "global_step": 554496, "epoch": 6680} {"train_loss": -27.80219841003418, "global_step": 554497, "epoch": 6680} {"train_loss": -28.167325973510742, "global_step": 554498, "epoch": 6680} {"train_loss": -27.962753295898438, "global_step": 554499, "epoch": 6680} {"train_loss": -27.6951904296875, "global_step": 554500, "epoch": 6680} {"train_loss": -27.770776748657227, "global_step": 554501, "epoch": 6680} {"train_loss": -28.106576919555664, "global_step": 554502, "epoch": 6680} {"train_loss": -27.880826950073242, "global_step": 554503, "epoch": 6680} {"train_loss": -28.021215438842773, "global_step": 554504, "epoch": 6680} {"train_loss": -28.1392822265625, "global_step": 554505, "epoch": 6680} {"train_loss": -27.802453994750977, "global_step": 554506, "epoch": 6680} {"train_loss": -27.798084259033203, "global_step": 554507, "epoch": 6680} {"train_loss": -27.68177604675293, "global_step": 554508, "epoch": 6680} {"train_loss": -27.8878173828125, "global_step": 554509, "epoch": 6680} {"train_loss": -28.22284507751465, "global_step": 554510, "epoch": 6680} {"train_loss": -27.886327743530273, "global_step": 554511, "epoch": 6680} {"train_loss": -27.949499130249023, "global_step": 554512, "epoch": 6680} {"train_loss": -28.006641387939453, "global_step": 554513, "epoch": 6680} {"train_loss": -28.040700912475586, "global_step": 554514, "epoch": 6680} {"train_loss": -27.872690200805664, "global_step": 554515, "epoch": 6680} {"train_loss": -27.25244140625, "global_step": 554516, "epoch": 6680} {"train_loss": -27.353546142578125, "global_step": 554517, "epoch": 6680} {"train_loss": -27.419843673706055, "global_step": 554518, "epoch": 6680} {"train_loss": -27.27776527404785, "global_step": 554519, "epoch": 6680} {"train_loss": -28.147628784179688, "global_step": 554520, "epoch": 6680} {"train_loss": -27.693586349487305, "global_step": 554521, "epoch": 6680} {"train_loss": -27.778551699167274, "global_step": 554522, "epoch": 6680, "val_loss": 6522927.5} {"train_loss": -20.980960845947266, "global_step": 554523, "epoch": 6681} {"train_loss": -22.06233787536621, "global_step": 554524, "epoch": 6681} {"train_loss": -21.785037994384766, "global_step": 554525, "epoch": 6681} {"train_loss": -22.202211380004883, "global_step": 554526, "epoch": 6681} {"train_loss": -23.097890853881836, "global_step": 554527, "epoch": 6681} {"train_loss": -23.4260196685791, "global_step": 554528, "epoch": 6681} {"train_loss": -23.99838638305664, "global_step": 554529, "epoch": 6681} {"train_loss": -24.958242416381836, "global_step": 554530, "epoch": 6681} {"train_loss": -24.777494430541992, "global_step": 554531, "epoch": 6681} {"train_loss": -24.295570373535156, "global_step": 554532, "epoch": 6681} {"train_loss": -24.79531478881836, "global_step": 554533, "epoch": 6681} {"train_loss": -25.116052627563477, "global_step": 554534, "epoch": 6681} {"train_loss": -25.51512336730957, "global_step": 554535, "epoch": 6681} {"train_loss": -25.273723602294922, "global_step": 554536, "epoch": 6681} {"train_loss": -25.163373947143555, "global_step": 554537, "epoch": 6681} {"train_loss": -25.36183738708496, "global_step": 554538, "epoch": 6681} {"train_loss": -25.821063995361328, "global_step": 554539, "epoch": 6681} {"train_loss": -25.572397232055664, "global_step": 554540, "epoch": 6681} {"train_loss": -25.72035789489746, "global_step": 554541, "epoch": 6681} {"train_loss": -25.939502716064453, "global_step": 554542, "epoch": 6681} {"train_loss": -25.56831169128418, "global_step": 554543, "epoch": 6681} {"train_loss": -26.171539306640625, "global_step": 554544, "epoch": 6681} {"train_loss": -25.62959098815918, "global_step": 554545, "epoch": 6681} {"train_loss": -25.860559463500977, "global_step": 554546, "epoch": 6681} {"train_loss": -25.809850692749023, "global_step": 554547, "epoch": 6681} {"train_loss": -26.266448974609375, "global_step": 554548, "epoch": 6681} {"train_loss": -26.3232421875, "global_step": 554549, "epoch": 6681} {"train_loss": -26.215269088745117, "global_step": 554550, "epoch": 6681} {"train_loss": -26.379621505737305, "global_step": 554551, "epoch": 6681} {"train_loss": -26.224506378173828, "global_step": 554552, "epoch": 6681} {"train_loss": -26.648101806640625, "global_step": 554553, "epoch": 6681} {"train_loss": -26.2979679107666, "global_step": 554554, "epoch": 6681} {"train_loss": -26.64070701599121, "global_step": 554555, "epoch": 6681} {"train_loss": -26.533552169799805, "global_step": 554556, "epoch": 6681} {"train_loss": -26.69695472717285, "global_step": 554557, "epoch": 6681} {"train_loss": -26.657764434814453, "global_step": 554558, "epoch": 6681} {"train_loss": -26.810623168945312, "global_step": 554559, "epoch": 6681} {"train_loss": -26.817930221557617, "global_step": 554560, "epoch": 6681} {"train_loss": -26.822956085205078, "global_step": 554561, "epoch": 6681} {"train_loss": -27.077472686767578, "global_step": 554562, "epoch": 6681} {"train_loss": -26.989124298095703, "global_step": 554563, "epoch": 6681} {"train_loss": -26.712432861328125, "global_step": 554564, "epoch": 6681} {"train_loss": -27.09744644165039, "global_step": 554565, "epoch": 6681} {"train_loss": -27.365554809570312, "global_step": 554566, "epoch": 6681} {"train_loss": -27.416736602783203, "global_step": 554567, "epoch": 6681} {"train_loss": -27.111785888671875, "global_step": 554568, "epoch": 6681} {"train_loss": -26.9025821685791, "global_step": 554569, "epoch": 6681} {"train_loss": -27.052875518798828, "global_step": 554570, "epoch": 6681} {"train_loss": -27.399560928344727, "global_step": 554571, "epoch": 6681} {"train_loss": -26.9968318939209, "global_step": 554572, "epoch": 6681} {"train_loss": -27.1490421295166, "global_step": 554573, "epoch": 6681} {"train_loss": -27.38205909729004, "global_step": 554574, "epoch": 6681} {"train_loss": -26.930402755737305, "global_step": 554575, "epoch": 6681} {"train_loss": -27.435110092163086, "global_step": 554576, "epoch": 6681} {"train_loss": -27.382131576538086, "global_step": 554577, "epoch": 6681} {"train_loss": -27.194177627563477, "global_step": 554578, "epoch": 6681} {"train_loss": -27.51265525817871, "global_step": 554579, "epoch": 6681} {"train_loss": -27.384780883789062, "global_step": 554580, "epoch": 6681} {"train_loss": -27.766132354736328, "global_step": 554581, "epoch": 6681} {"train_loss": -27.440168380737305, "global_step": 554582, "epoch": 6681} {"train_loss": -27.47784423828125, "global_step": 554583, "epoch": 6681} {"train_loss": -27.78314781188965, "global_step": 554584, "epoch": 6681} {"train_loss": -27.472097396850586, "global_step": 554585, "epoch": 6681} {"train_loss": -27.561294555664062, "global_step": 554586, "epoch": 6681} {"train_loss": -27.383466720581055, "global_step": 554587, "epoch": 6681} {"train_loss": -27.979822158813477, "global_step": 554588, "epoch": 6681} {"train_loss": -27.360198974609375, "global_step": 554589, "epoch": 6681} {"train_loss": -27.81483268737793, "global_step": 554590, "epoch": 6681} {"train_loss": -27.64276123046875, "global_step": 554591, "epoch": 6681} {"train_loss": -27.665876388549805, "global_step": 554592, "epoch": 6681} {"train_loss": -27.87554931640625, "global_step": 554593, "epoch": 6681} {"train_loss": -27.22564125061035, "global_step": 554594, "epoch": 6681} {"train_loss": -27.76820182800293, "global_step": 554595, "epoch": 6681} {"train_loss": -27.954092025756836, "global_step": 554596, "epoch": 6681} {"train_loss": -27.613388061523438, "global_step": 554597, "epoch": 6681} {"train_loss": -27.7614803314209, "global_step": 554598, "epoch": 6681} {"train_loss": -27.423974990844727, "global_step": 554599, "epoch": 6681} {"train_loss": -27.844858169555664, "global_step": 554600, "epoch": 6681} {"train_loss": -27.930601119995117, "global_step": 554601, "epoch": 6681} {"train_loss": -27.603912353515625, "global_step": 554602, "epoch": 6681} {"train_loss": -27.65717887878418, "global_step": 554603, "epoch": 6681} {"train_loss": -27.2742919921875, "global_step": 554604, "epoch": 6681} {"train_loss": -26.430760900658296, "global_step": 554605, "epoch": 6681, "val_loss": 6626877.5} {"train_loss": -26.72259521484375, "global_step": 554606, "epoch": 6682} {"train_loss": -27.193349838256836, "global_step": 554607, "epoch": 6682} {"train_loss": -26.37880516052246, "global_step": 554608, "epoch": 6682} {"train_loss": -25.80666160583496, "global_step": 554609, "epoch": 6682} {"train_loss": -26.2293758392334, "global_step": 554610, "epoch": 6682} {"train_loss": -26.565765380859375, "global_step": 554611, "epoch": 6682} {"train_loss": -27.020782470703125, "global_step": 554612, "epoch": 6682} {"train_loss": -26.66999626159668, "global_step": 554613, "epoch": 6682} {"train_loss": -26.894926071166992, "global_step": 554614, "epoch": 6682} {"train_loss": -27.000812530517578, "global_step": 554615, "epoch": 6682} {"train_loss": -27.00634765625, "global_step": 554616, "epoch": 6682} {"train_loss": -26.799468994140625, "global_step": 554617, "epoch": 6682} {"train_loss": -26.41851234436035, "global_step": 554618, "epoch": 6682} {"train_loss": -26.87763786315918, "global_step": 554619, "epoch": 6682} {"train_loss": -27.3039493560791, "global_step": 554620, "epoch": 6682} {"train_loss": -26.999719619750977, "global_step": 554621, "epoch": 6682} {"train_loss": -27.053211212158203, "global_step": 554622, "epoch": 6682} {"train_loss": -27.148962020874023, "global_step": 554623, "epoch": 6682} {"train_loss": -27.02924156188965, "global_step": 554624, "epoch": 6682} {"train_loss": -27.51468276977539, "global_step": 554625, "epoch": 6682} {"train_loss": -27.63409996032715, "global_step": 554626, "epoch": 6682} {"train_loss": -27.45090103149414, "global_step": 554627, "epoch": 6682} {"train_loss": -27.286426544189453, "global_step": 554628, "epoch": 6682} {"train_loss": -27.419050216674805, "global_step": 554629, "epoch": 6682} {"train_loss": -27.384016036987305, "global_step": 554630, "epoch": 6682} {"train_loss": -27.746814727783203, "global_step": 554631, "epoch": 6682} {"train_loss": -27.488988876342773, "global_step": 554632, "epoch": 6682} {"train_loss": -27.421375274658203, "global_step": 554633, "epoch": 6682} {"train_loss": -27.675153732299805, "global_step": 554634, "epoch": 6682} {"train_loss": -27.666824340820312, "global_step": 554635, "epoch": 6682} {"train_loss": -27.429046630859375, "global_step": 554636, "epoch": 6682} {"train_loss": -27.67243003845215, "global_step": 554637, "epoch": 6682} {"train_loss": -27.7932186126709, "global_step": 554638, "epoch": 6682} {"train_loss": -27.437753677368164, "global_step": 554639, "epoch": 6682} {"train_loss": -27.653776168823242, "global_step": 554640, "epoch": 6682} {"train_loss": -27.724267959594727, "global_step": 554641, "epoch": 6682} {"train_loss": -27.864355087280273, "global_step": 554642, "epoch": 6682} {"train_loss": -27.564533233642578, "global_step": 554643, "epoch": 6682} {"train_loss": -27.535913467407227, "global_step": 554644, "epoch": 6682} {"train_loss": -27.932281494140625, "global_step": 554645, "epoch": 6682} {"train_loss": -28.277246475219727, "global_step": 554646, "epoch": 6682} {"train_loss": -27.904220581054688, "global_step": 554647, "epoch": 6682} {"train_loss": -27.488515853881836, "global_step": 554648, "epoch": 6682} {"train_loss": -27.782703399658203, "global_step": 554649, "epoch": 6682} {"train_loss": -27.602325439453125, "global_step": 554650, "epoch": 6682} {"train_loss": -28.264179229736328, "global_step": 554651, "epoch": 6682} {"train_loss": -27.895343780517578, "global_step": 554652, "epoch": 6682} {"train_loss": -27.788373947143555, "global_step": 554653, "epoch": 6682} {"train_loss": -27.683454513549805, "global_step": 554654, "epoch": 6682} {"train_loss": -27.79473876953125, "global_step": 554655, "epoch": 6682} {"train_loss": -27.965890884399414, "global_step": 554656, "epoch": 6682} {"train_loss": -27.89032554626465, "global_step": 554657, "epoch": 6682} {"train_loss": -28.299137115478516, "global_step": 554658, "epoch": 6682} {"train_loss": -27.54541015625, "global_step": 554659, "epoch": 6682} {"train_loss": -27.579360961914062, "global_step": 554660, "epoch": 6682} {"train_loss": -27.862119674682617, "global_step": 554661, "epoch": 6682} {"train_loss": -28.012256622314453, "global_step": 554662, "epoch": 6682} {"train_loss": -27.585180282592773, "global_step": 554663, "epoch": 6682} {"train_loss": -28.196577072143555, "global_step": 554664, "epoch": 6682} {"train_loss": -27.236373901367188, "global_step": 554665, "epoch": 6682} {"train_loss": -27.86001968383789, "global_step": 554666, "epoch": 6682} {"train_loss": -27.322010040283203, "global_step": 554667, "epoch": 6682} {"train_loss": -27.6752986907959, "global_step": 554668, "epoch": 6682} {"train_loss": -27.43902015686035, "global_step": 554669, "epoch": 6682} {"train_loss": -27.806249618530273, "global_step": 554670, "epoch": 6682} {"train_loss": -27.838226318359375, "global_step": 554671, "epoch": 6682} {"train_loss": -27.51191520690918, "global_step": 554672, "epoch": 6682} {"train_loss": -28.07892417907715, "global_step": 554673, "epoch": 6682} {"train_loss": -27.993927001953125, "global_step": 554674, "epoch": 6682} {"train_loss": -27.823225021362305, "global_step": 554675, "epoch": 6682} {"train_loss": -27.902790069580078, "global_step": 554676, "epoch": 6682} {"train_loss": -27.649066925048828, "global_step": 554677, "epoch": 6682} {"train_loss": -27.67432975769043, "global_step": 554678, "epoch": 6682} {"train_loss": -27.226301193237305, "global_step": 554679, "epoch": 6682} {"train_loss": -26.97075843811035, "global_step": 554680, "epoch": 6682} {"train_loss": -27.7687931060791, "global_step": 554681, "epoch": 6682} {"train_loss": -28.090417861938477, "global_step": 554682, "epoch": 6682} {"train_loss": -27.6021671295166, "global_step": 554683, "epoch": 6682} {"train_loss": -27.4285831451416, "global_step": 554684, "epoch": 6682} {"train_loss": -27.60135269165039, "global_step": 554685, "epoch": 6682} {"train_loss": -27.899982452392578, "global_step": 554686, "epoch": 6682} {"train_loss": -27.3881893157959, "global_step": 554687, "epoch": 6682} {"train_loss": -27.498513853693584, "global_step": 554688, "epoch": 6682, "val_loss": 6682241.5} {"train_loss": -27.019886016845703, "global_step": 554689, "epoch": 6683} {"train_loss": -25.971744537353516, "global_step": 554690, "epoch": 6683} {"train_loss": -27.410192489624023, "global_step": 554691, "epoch": 6683} {"train_loss": -27.012426376342773, "global_step": 554692, "epoch": 6683} {"train_loss": -26.772933959960938, "global_step": 554693, "epoch": 6683} {"train_loss": -27.06373405456543, "global_step": 554694, "epoch": 6683} {"train_loss": -27.16300392150879, "global_step": 554695, "epoch": 6683} {"train_loss": -27.17486572265625, "global_step": 554696, "epoch": 6683} {"train_loss": -26.684497833251953, "global_step": 554697, "epoch": 6683} {"train_loss": -27.286314010620117, "global_step": 554698, "epoch": 6683} {"train_loss": -27.237966537475586, "global_step": 554699, "epoch": 6683} {"train_loss": -27.595678329467773, "global_step": 554700, "epoch": 6683} {"train_loss": -27.353656768798828, "global_step": 554701, "epoch": 6683} {"train_loss": -27.3680419921875, "global_step": 554702, "epoch": 6683} {"train_loss": -27.349355697631836, "global_step": 554703, "epoch": 6683} {"train_loss": -27.336944580078125, "global_step": 554704, "epoch": 6683} {"train_loss": -27.33974266052246, "global_step": 554705, "epoch": 6683} {"train_loss": -27.53182029724121, "global_step": 554706, "epoch": 6683} {"train_loss": -27.516254425048828, "global_step": 554707, "epoch": 6683} {"train_loss": -27.698339462280273, "global_step": 554708, "epoch": 6683} {"train_loss": -27.73211097717285, "global_step": 554709, "epoch": 6683} {"train_loss": -27.383405685424805, "global_step": 554710, "epoch": 6683} {"train_loss": -27.888355255126953, "global_step": 554711, "epoch": 6683} {"train_loss": -27.809925079345703, "global_step": 554712, "epoch": 6683} {"train_loss": -27.547637939453125, "global_step": 554713, "epoch": 6683} {"train_loss": -27.907541275024414, "global_step": 554714, "epoch": 6683} {"train_loss": -27.73128318786621, "global_step": 554715, "epoch": 6683} {"train_loss": -27.8419189453125, "global_step": 554716, "epoch": 6683} {"train_loss": -27.675535202026367, "global_step": 554717, "epoch": 6683} {"train_loss": -27.692142486572266, "global_step": 554718, "epoch": 6683} {"train_loss": -27.65966796875, "global_step": 554719, "epoch": 6683} {"train_loss": -27.67877769470215, "global_step": 554720, "epoch": 6683} {"train_loss": -27.583288192749023, "global_step": 554721, "epoch": 6683} {"train_loss": -27.885740280151367, "global_step": 554722, "epoch": 6683} {"train_loss": -27.72820472717285, "global_step": 554723, "epoch": 6683} {"train_loss": -27.63870620727539, "global_step": 554724, "epoch": 6683} {"train_loss": -27.81549644470215, "global_step": 554725, "epoch": 6683} {"train_loss": -27.752161026000977, "global_step": 554726, "epoch": 6683} {"train_loss": -27.61800193786621, "global_step": 554727, "epoch": 6683} {"train_loss": -28.021484375, "global_step": 554728, "epoch": 6683} {"train_loss": -27.757654190063477, "global_step": 554729, "epoch": 6683} {"train_loss": -27.91798210144043, "global_step": 554730, "epoch": 6683} {"train_loss": -27.986743927001953, "global_step": 554731, "epoch": 6683} {"train_loss": -27.843521118164062, "global_step": 554732, "epoch": 6683} {"train_loss": -28.019123077392578, "global_step": 554733, "epoch": 6683} {"train_loss": -27.94622802734375, "global_step": 554734, "epoch": 6683} {"train_loss": -28.012487411499023, "global_step": 554735, "epoch": 6683} {"train_loss": -27.9298152923584, "global_step": 554736, "epoch": 6683} {"train_loss": -27.691503524780273, "global_step": 554737, "epoch": 6683} {"train_loss": -27.90142250061035, "global_step": 554738, "epoch": 6683} {"train_loss": -27.525766372680664, "global_step": 554739, "epoch": 6683} {"train_loss": -28.030160903930664, "global_step": 554740, "epoch": 6683} {"train_loss": -27.6734619140625, "global_step": 554741, "epoch": 6683} {"train_loss": -27.35976219177246, "global_step": 554742, "epoch": 6683} {"train_loss": -27.445173263549805, "global_step": 554743, "epoch": 6683} {"train_loss": -28.028364181518555, "global_step": 554744, "epoch": 6683} {"train_loss": -27.870716094970703, "global_step": 554745, "epoch": 6683} {"train_loss": -27.325117111206055, "global_step": 554746, "epoch": 6683} {"train_loss": -27.4875545501709, "global_step": 554747, "epoch": 6683} {"train_loss": -27.74457359313965, "global_step": 554748, "epoch": 6683} {"train_loss": -27.844390869140625, "global_step": 554749, "epoch": 6683} {"train_loss": -27.78242301940918, "global_step": 554750, "epoch": 6683} {"train_loss": -27.71943473815918, "global_step": 554751, "epoch": 6683} {"train_loss": -27.64763832092285, "global_step": 554752, "epoch": 6683} {"train_loss": -27.848737716674805, "global_step": 554753, "epoch": 6683} {"train_loss": -27.83314323425293, "global_step": 554754, "epoch": 6683} {"train_loss": -27.637048721313477, "global_step": 554755, "epoch": 6683} {"train_loss": -27.951196670532227, "global_step": 554756, "epoch": 6683} {"train_loss": -27.73331642150879, "global_step": 554757, "epoch": 6683} {"train_loss": -27.58893394470215, "global_step": 554758, "epoch": 6683} {"train_loss": -27.599145889282227, "global_step": 554759, "epoch": 6683} {"train_loss": -27.901630401611328, "global_step": 554760, "epoch": 6683} {"train_loss": -27.87373161315918, "global_step": 554761, "epoch": 6683} {"train_loss": -27.809356689453125, "global_step": 554762, "epoch": 6683} {"train_loss": -27.646942138671875, "global_step": 554763, "epoch": 6683} {"train_loss": -27.74016761779785, "global_step": 554764, "epoch": 6683} {"train_loss": -27.965253829956055, "global_step": 554765, "epoch": 6683} {"train_loss": -27.836523056030273, "global_step": 554766, "epoch": 6683} {"train_loss": -28.088422775268555, "global_step": 554767, "epoch": 6683} {"train_loss": -27.760705947875977, "global_step": 554768, "epoch": 6683} {"train_loss": -27.785919189453125, "global_step": 554769, "epoch": 6683} {"train_loss": -27.738489151000977, "global_step": 554770, "epoch": 6683} {"train_loss": -27.63376638113734, "global_step": 554771, "epoch": 6683, "val_loss": 6670674.0} {"train_loss": -27.790119171142578, "global_step": 554772, "epoch": 6684} {"train_loss": -27.400360107421875, "global_step": 554773, "epoch": 6684} {"train_loss": -27.4963321685791, "global_step": 554774, "epoch": 6684} {"train_loss": -26.9613037109375, "global_step": 554775, "epoch": 6684} {"train_loss": -27.35767936706543, "global_step": 554776, "epoch": 6684} {"train_loss": -26.999725341796875, "global_step": 554777, "epoch": 6684} {"train_loss": -27.38865089416504, "global_step": 554778, "epoch": 6684} {"train_loss": -27.34132957458496, "global_step": 554779, "epoch": 6684} {"train_loss": -26.9000186920166, "global_step": 554780, "epoch": 6684} {"train_loss": -27.100141525268555, "global_step": 554781, "epoch": 6684} {"train_loss": -27.548654556274414, "global_step": 554782, "epoch": 6684} {"train_loss": -27.388967514038086, "global_step": 554783, "epoch": 6684} {"train_loss": -27.152860641479492, "global_step": 554784, "epoch": 6684} {"train_loss": -27.33064079284668, "global_step": 554785, "epoch": 6684} {"train_loss": -27.43182373046875, "global_step": 554786, "epoch": 6684} {"train_loss": -27.4914608001709, "global_step": 554787, "epoch": 6684} {"train_loss": -27.350156784057617, "global_step": 554788, "epoch": 6684} {"train_loss": -27.813827514648438, "global_step": 554789, "epoch": 6684} {"train_loss": -27.4564208984375, "global_step": 554790, "epoch": 6684} {"train_loss": -27.6207218170166, "global_step": 554791, "epoch": 6684} {"train_loss": -27.063140869140625, "global_step": 554792, "epoch": 6684} {"train_loss": -27.4512939453125, "global_step": 554793, "epoch": 6684} {"train_loss": -27.750629425048828, "global_step": 554794, "epoch": 6684} {"train_loss": -27.917469024658203, "global_step": 554795, "epoch": 6684} {"train_loss": -27.32240867614746, "global_step": 554796, "epoch": 6684} {"train_loss": -28.1315860748291, "global_step": 554797, "epoch": 6684} {"train_loss": -27.936582565307617, "global_step": 554798, "epoch": 6684} {"train_loss": -27.5687198638916, "global_step": 554799, "epoch": 6684} {"train_loss": -27.3902645111084, "global_step": 554800, "epoch": 6684} {"train_loss": -27.357467651367188, "global_step": 554801, "epoch": 6684} {"train_loss": -27.787174224853516, "global_step": 554802, "epoch": 6684} {"train_loss": -27.777673721313477, "global_step": 554803, "epoch": 6684} {"train_loss": -27.916589736938477, "global_step": 554804, "epoch": 6684} {"train_loss": -27.391590118408203, "global_step": 554805, "epoch": 6684} {"train_loss": -27.4511775970459, "global_step": 554806, "epoch": 6684} {"train_loss": -27.860626220703125, "global_step": 554807, "epoch": 6684} {"train_loss": -27.806970596313477, "global_step": 554808, "epoch": 6684} {"train_loss": -27.777753829956055, "global_step": 554809, "epoch": 6684} {"train_loss": -27.67792320251465, "global_step": 554810, "epoch": 6684} {"train_loss": -27.82265281677246, "global_step": 554811, "epoch": 6684} {"train_loss": -27.833038330078125, "global_step": 554812, "epoch": 6684} {"train_loss": -27.8359375, "global_step": 554813, "epoch": 6684} {"train_loss": -27.7100887298584, "global_step": 554814, "epoch": 6684} {"train_loss": -28.035812377929688, "global_step": 554815, "epoch": 6684} {"train_loss": -28.106531143188477, "global_step": 554816, "epoch": 6684} {"train_loss": -27.973575592041016, "global_step": 554817, "epoch": 6684} {"train_loss": -27.590524673461914, "global_step": 554818, "epoch": 6684} {"train_loss": -28.208450317382812, "global_step": 554819, "epoch": 6684} {"train_loss": -27.97478675842285, "global_step": 554820, "epoch": 6684} {"train_loss": -28.192676544189453, "global_step": 554821, "epoch": 6684} {"train_loss": -28.242727279663086, "global_step": 554822, "epoch": 6684} {"train_loss": -27.981689453125, "global_step": 554823, "epoch": 6684} {"train_loss": -27.981916427612305, "global_step": 554824, "epoch": 6684} {"train_loss": -28.078882217407227, "global_step": 554825, "epoch": 6684} {"train_loss": -28.205169677734375, "global_step": 554826, "epoch": 6684} {"train_loss": -27.907546997070312, "global_step": 554827, "epoch": 6684} {"train_loss": -27.62093162536621, "global_step": 554828, "epoch": 6684} {"train_loss": -28.19087028503418, "global_step": 554829, "epoch": 6684} {"train_loss": -28.30022621154785, "global_step": 554830, "epoch": 6684} {"train_loss": -28.05893898010254, "global_step": 554831, "epoch": 6684} {"train_loss": -28.109527587890625, "global_step": 554832, "epoch": 6684} {"train_loss": -27.953638076782227, "global_step": 554833, "epoch": 6684} {"train_loss": -28.284927368164062, "global_step": 554834, "epoch": 6684} {"train_loss": -28.190622329711914, "global_step": 554835, "epoch": 6684} {"train_loss": -28.37632179260254, "global_step": 554836, "epoch": 6684} {"train_loss": -28.20708656311035, "global_step": 554837, "epoch": 6684} {"train_loss": -28.56125831604004, "global_step": 554838, "epoch": 6684} {"train_loss": -27.826913833618164, "global_step": 554839, "epoch": 6684} {"train_loss": -27.590686798095703, "global_step": 554840, "epoch": 6684} {"train_loss": -27.20074462890625, "global_step": 554841, "epoch": 6684} {"train_loss": -27.02090835571289, "global_step": 554842, "epoch": 6684} {"train_loss": -26.323699951171875, "global_step": 554843, "epoch": 6684} {"train_loss": -26.33740234375, "global_step": 554844, "epoch": 6684} {"train_loss": -26.011754989624023, "global_step": 554845, "epoch": 6684} {"train_loss": -25.477428436279297, "global_step": 554846, "epoch": 6684} {"train_loss": -26.80362319946289, "global_step": 554847, "epoch": 6684} {"train_loss": -27.275068283081055, "global_step": 554848, "epoch": 6684} {"train_loss": -26.725128173828125, "global_step": 554849, "epoch": 6684} {"train_loss": -27.26088523864746, "global_step": 554850, "epoch": 6684} {"train_loss": -27.19376564025879, "global_step": 554851, "epoch": 6684} {"train_loss": -27.5145320892334, "global_step": 554852, "epoch": 6684} {"train_loss": -26.718524932861328, "global_step": 554853, "epoch": 6684} {"train_loss": -27.582268266792756, "global_step": 554854, "epoch": 6684, "val_loss": 6750190.0} {"train_loss": -26.438901901245117, "global_step": 554855, "epoch": 6685} {"train_loss": -25.047290802001953, "global_step": 554856, "epoch": 6685} {"train_loss": -26.834074020385742, "global_step": 554857, "epoch": 6685} {"train_loss": -26.190479278564453, "global_step": 554858, "epoch": 6685} {"train_loss": -26.458206176757812, "global_step": 554859, "epoch": 6685} {"train_loss": -26.4437313079834, "global_step": 554860, "epoch": 6685} {"train_loss": -26.47188377380371, "global_step": 554861, "epoch": 6685} {"train_loss": -26.24476432800293, "global_step": 554862, "epoch": 6685} {"train_loss": -26.88547134399414, "global_step": 554863, "epoch": 6685} {"train_loss": -26.390832901000977, "global_step": 554864, "epoch": 6685} {"train_loss": -26.862913131713867, "global_step": 554865, "epoch": 6685} {"train_loss": -26.681509017944336, "global_step": 554866, "epoch": 6685} {"train_loss": -26.641326904296875, "global_step": 554867, "epoch": 6685} {"train_loss": -26.95429039001465, "global_step": 554868, "epoch": 6685} {"train_loss": -26.906848907470703, "global_step": 554869, "epoch": 6685} {"train_loss": -26.874984741210938, "global_step": 554870, "epoch": 6685} {"train_loss": -27.09834861755371, "global_step": 554871, "epoch": 6685} {"train_loss": -27.485464096069336, "global_step": 554872, "epoch": 6685} {"train_loss": -27.122638702392578, "global_step": 554873, "epoch": 6685} {"train_loss": -26.834177017211914, "global_step": 554874, "epoch": 6685} {"train_loss": -27.060943603515625, "global_step": 554875, "epoch": 6685} {"train_loss": -27.367462158203125, "global_step": 554876, "epoch": 6685} {"train_loss": -27.318525314331055, "global_step": 554877, "epoch": 6685} {"train_loss": -27.210641860961914, "global_step": 554878, "epoch": 6685} {"train_loss": -27.65227699279785, "global_step": 554879, "epoch": 6685} {"train_loss": -27.352527618408203, "global_step": 554880, "epoch": 6685} {"train_loss": -27.344038009643555, "global_step": 554881, "epoch": 6685} {"train_loss": -27.22024917602539, "global_step": 554882, "epoch": 6685} {"train_loss": -27.374481201171875, "global_step": 554883, "epoch": 6685} {"train_loss": -27.590566635131836, "global_step": 554884, "epoch": 6685} {"train_loss": -27.30122184753418, "global_step": 554885, "epoch": 6685} {"train_loss": -27.43379020690918, "global_step": 554886, "epoch": 6685} {"train_loss": -27.302001953125, "global_step": 554887, "epoch": 6685} {"train_loss": -27.60393714904785, "global_step": 554888, "epoch": 6685} {"train_loss": -27.619144439697266, "global_step": 554889, "epoch": 6685} {"train_loss": -27.018552780151367, "global_step": 554890, "epoch": 6685} {"train_loss": -27.235815048217773, "global_step": 554891, "epoch": 6685} {"train_loss": -27.46213150024414, "global_step": 554892, "epoch": 6685} {"train_loss": -27.783660888671875, "global_step": 554893, "epoch": 6685} {"train_loss": -28.041980743408203, "global_step": 554894, "epoch": 6685} {"train_loss": -27.982885360717773, "global_step": 554895, "epoch": 6685} {"train_loss": -27.11419105529785, "global_step": 554896, "epoch": 6685} {"train_loss": -27.534088134765625, "global_step": 554897, "epoch": 6685} {"train_loss": -27.7101993560791, "global_step": 554898, "epoch": 6685} {"train_loss": -27.965463638305664, "global_step": 554899, "epoch": 6685} {"train_loss": -27.978437423706055, "global_step": 554900, "epoch": 6685} {"train_loss": -27.552719116210938, "global_step": 554901, "epoch": 6685} {"train_loss": -27.758411407470703, "global_step": 554902, "epoch": 6685} {"train_loss": -27.570571899414062, "global_step": 554903, "epoch": 6685} {"train_loss": -27.620227813720703, "global_step": 554904, "epoch": 6685} {"train_loss": -28.203378677368164, "global_step": 554905, "epoch": 6685} {"train_loss": -27.903295516967773, "global_step": 554906, "epoch": 6685} {"train_loss": -28.01383399963379, "global_step": 554907, "epoch": 6685} {"train_loss": -27.76331901550293, "global_step": 554908, "epoch": 6685} {"train_loss": -28.02756690979004, "global_step": 554909, "epoch": 6685} {"train_loss": -27.7590389251709, "global_step": 554910, "epoch": 6685} {"train_loss": -27.953367233276367, "global_step": 554911, "epoch": 6685} {"train_loss": -28.089874267578125, "global_step": 554912, "epoch": 6685} {"train_loss": -28.016742706298828, "global_step": 554913, "epoch": 6685} {"train_loss": -27.773962020874023, "global_step": 554914, "epoch": 6685} {"train_loss": -27.4136962890625, "global_step": 554915, "epoch": 6685} {"train_loss": -27.75412940979004, "global_step": 554916, "epoch": 6685} {"train_loss": -27.661977767944336, "global_step": 554917, "epoch": 6685} {"train_loss": -27.865758895874023, "global_step": 554918, "epoch": 6685} {"train_loss": -27.92005729675293, "global_step": 554919, "epoch": 6685} {"train_loss": -27.7799129486084, "global_step": 554920, "epoch": 6685} {"train_loss": -27.8482666015625, "global_step": 554921, "epoch": 6685} {"train_loss": -27.672910690307617, "global_step": 554922, "epoch": 6685} {"train_loss": -27.742963790893555, "global_step": 554923, "epoch": 6685} {"train_loss": -27.780881881713867, "global_step": 554924, "epoch": 6685} {"train_loss": -27.7615909576416, "global_step": 554925, "epoch": 6685} {"train_loss": -27.778369903564453, "global_step": 554926, "epoch": 6685} {"train_loss": -27.41952896118164, "global_step": 554927, "epoch": 6685} {"train_loss": -27.769819259643555, "global_step": 554928, "epoch": 6685} {"train_loss": -27.980804443359375, "global_step": 554929, "epoch": 6685} {"train_loss": -28.019311904907227, "global_step": 554930, "epoch": 6685} {"train_loss": -27.95099449157715, "global_step": 554931, "epoch": 6685} {"train_loss": -28.016672134399414, "global_step": 554932, "epoch": 6685} {"train_loss": -27.567861557006836, "global_step": 554933, "epoch": 6685} {"train_loss": -27.720361709594727, "global_step": 554934, "epoch": 6685} {"train_loss": -28.155841827392578, "global_step": 554935, "epoch": 6685} {"train_loss": -28.170989990234375, "global_step": 554936, "epoch": 6685} {"train_loss": -27.431382420551348, "global_step": 554937, "epoch": 6685, "val_loss": 6646237.0} {"train_loss": -25.915868759155273, "global_step": 554938, "epoch": 6686} {"train_loss": -25.377531051635742, "global_step": 554939, "epoch": 6686} {"train_loss": -27.32105827331543, "global_step": 554940, "epoch": 6686} {"train_loss": -24.24335289001465, "global_step": 554941, "epoch": 6686} {"train_loss": -26.54328727722168, "global_step": 554942, "epoch": 6686} {"train_loss": -25.753870010375977, "global_step": 554943, "epoch": 6686} {"train_loss": -27.303455352783203, "global_step": 554944, "epoch": 6686} {"train_loss": -26.171594619750977, "global_step": 554945, "epoch": 6686} {"train_loss": -27.231088638305664, "global_step": 554946, "epoch": 6686} {"train_loss": -26.78394889831543, "global_step": 554947, "epoch": 6686} {"train_loss": -26.69207763671875, "global_step": 554948, "epoch": 6686} {"train_loss": -27.122167587280273, "global_step": 554949, "epoch": 6686} {"train_loss": -27.040912628173828, "global_step": 554950, "epoch": 6686} {"train_loss": -26.43191909790039, "global_step": 554951, "epoch": 6686} {"train_loss": -27.251081466674805, "global_step": 554952, "epoch": 6686} {"train_loss": -27.186323165893555, "global_step": 554953, "epoch": 6686} {"train_loss": -27.258228302001953, "global_step": 554954, "epoch": 6686} {"train_loss": -27.232608795166016, "global_step": 554955, "epoch": 6686} {"train_loss": -27.455829620361328, "global_step": 554956, "epoch": 6686} {"train_loss": -26.998029708862305, "global_step": 554957, "epoch": 6686} {"train_loss": -27.41796875, "global_step": 554958, "epoch": 6686} {"train_loss": -26.848791122436523, "global_step": 554959, "epoch": 6686} {"train_loss": -26.985010147094727, "global_step": 554960, "epoch": 6686} {"train_loss": -27.44060707092285, "global_step": 554961, "epoch": 6686} {"train_loss": -27.085729598999023, "global_step": 554962, "epoch": 6686} {"train_loss": -27.27520751953125, "global_step": 554963, "epoch": 6686} {"train_loss": -27.066192626953125, "global_step": 554964, "epoch": 6686} {"train_loss": -27.47904396057129, "global_step": 554965, "epoch": 6686} {"train_loss": -27.43890953063965, "global_step": 554966, "epoch": 6686} {"train_loss": -27.418598175048828, "global_step": 554967, "epoch": 6686} {"train_loss": -27.406787872314453, "global_step": 554968, "epoch": 6686} {"train_loss": -27.7690372467041, "global_step": 554969, "epoch": 6686} {"train_loss": -27.062152862548828, "global_step": 554970, "epoch": 6686} {"train_loss": -27.40620231628418, "global_step": 554971, "epoch": 6686} {"train_loss": -27.45856285095215, "global_step": 554972, "epoch": 6686} {"train_loss": -27.258874893188477, "global_step": 554973, "epoch": 6686} {"train_loss": -27.5019588470459, "global_step": 554974, "epoch": 6686} {"train_loss": -27.52483558654785, "global_step": 554975, "epoch": 6686} {"train_loss": -27.550878524780273, "global_step": 554976, "epoch": 6686} {"train_loss": -27.922937393188477, "global_step": 554977, "epoch": 6686} {"train_loss": -27.66936683654785, "global_step": 554978, "epoch": 6686} {"train_loss": -27.37955665588379, "global_step": 554979, "epoch": 6686} {"train_loss": -27.583332061767578, "global_step": 554980, "epoch": 6686} {"train_loss": -27.819726943969727, "global_step": 554981, "epoch": 6686} {"train_loss": -27.7825927734375, "global_step": 554982, "epoch": 6686} {"train_loss": -27.8455867767334, "global_step": 554983, "epoch": 6686} {"train_loss": -27.97710609436035, "global_step": 554984, "epoch": 6686} {"train_loss": -27.72525978088379, "global_step": 554985, "epoch": 6686} {"train_loss": -27.491138458251953, "global_step": 554986, "epoch": 6686} {"train_loss": -27.65419578552246, "global_step": 554987, "epoch": 6686} {"train_loss": -28.0537109375, "global_step": 554988, "epoch": 6686} {"train_loss": -27.732254028320312, "global_step": 554989, "epoch": 6686} {"train_loss": -27.75662612915039, "global_step": 554990, "epoch": 6686} {"train_loss": -27.704870223999023, "global_step": 554991, "epoch": 6686} {"train_loss": -26.770660400390625, "global_step": 554992, "epoch": 6686} {"train_loss": -26.478010177612305, "global_step": 554993, "epoch": 6686} {"train_loss": -26.4525089263916, "global_step": 554994, "epoch": 6686} {"train_loss": -27.4744873046875, "global_step": 554995, "epoch": 6686} {"train_loss": -27.713947296142578, "global_step": 554996, "epoch": 6686} {"train_loss": -27.146574020385742, "global_step": 554997, "epoch": 6686} {"train_loss": -27.726205825805664, "global_step": 554998, "epoch": 6686} {"train_loss": -27.183923721313477, "global_step": 554999, "epoch": 6686} {"train_loss": -27.61280632019043, "global_step": 555000, "epoch": 6686} {"train_loss": -27.600360870361328, "global_step": 555001, "epoch": 6686} {"train_loss": -27.46923828125, "global_step": 555002, "epoch": 6686} {"train_loss": -27.70967674255371, "global_step": 555003, "epoch": 6686} {"train_loss": -27.900495529174805, "global_step": 555004, "epoch": 6686} {"train_loss": -27.519977569580078, "global_step": 555005, "epoch": 6686} {"train_loss": -27.492752075195312, "global_step": 555006, "epoch": 6686} {"train_loss": -27.7639102935791, "global_step": 555007, "epoch": 6686} {"train_loss": -27.638635635375977, "global_step": 555008, "epoch": 6686} {"train_loss": -27.195343017578125, "global_step": 555009, "epoch": 6686} {"train_loss": -27.381393432617188, "global_step": 555010, "epoch": 6686} {"train_loss": -27.61496353149414, "global_step": 555011, "epoch": 6686} {"train_loss": -27.14064598083496, "global_step": 555012, "epoch": 6686} {"train_loss": -27.513952255249023, "global_step": 555013, "epoch": 6686} {"train_loss": -27.26236343383789, "global_step": 555014, "epoch": 6686} {"train_loss": -27.370132446289062, "global_step": 555015, "epoch": 6686} {"train_loss": -27.338544845581055, "global_step": 555016, "epoch": 6686} {"train_loss": -27.248708724975586, "global_step": 555017, "epoch": 6686} {"train_loss": -27.7125186920166, "global_step": 555018, "epoch": 6686} {"train_loss": -27.569686889648438, "global_step": 555019, "epoch": 6686} {"train_loss": -27.263732542474585, "global_step": 555020, "epoch": 6686, "val_loss": 6670503.5} {"train_loss": -26.54163932800293, "global_step": 555021, "epoch": 6687} {"train_loss": -26.765594482421875, "global_step": 555022, "epoch": 6687} {"train_loss": -26.520536422729492, "global_step": 555023, "epoch": 6687} {"train_loss": -26.746618270874023, "global_step": 555024, "epoch": 6687} {"train_loss": -26.7314510345459, "global_step": 555025, "epoch": 6687} {"train_loss": -27.333209991455078, "global_step": 555026, "epoch": 6687} {"train_loss": -26.97969627380371, "global_step": 555027, "epoch": 6687} {"train_loss": -27.181955337524414, "global_step": 555028, "epoch": 6687} {"train_loss": -27.039167404174805, "global_step": 555029, "epoch": 6687} {"train_loss": -27.15932273864746, "global_step": 555030, "epoch": 6687} {"train_loss": -26.94923210144043, "global_step": 555031, "epoch": 6687} {"train_loss": -27.210920333862305, "global_step": 555032, "epoch": 6687} {"train_loss": -27.126483917236328, "global_step": 555033, "epoch": 6687} {"train_loss": -27.30924415588379, "global_step": 555034, "epoch": 6687} {"train_loss": -27.613744735717773, "global_step": 555035, "epoch": 6687} {"train_loss": -27.637771606445312, "global_step": 555036, "epoch": 6687} {"train_loss": -27.382009506225586, "global_step": 555037, "epoch": 6687} {"train_loss": -27.348474502563477, "global_step": 555038, "epoch": 6687} {"train_loss": -27.389341354370117, "global_step": 555039, "epoch": 6687} {"train_loss": -27.032007217407227, "global_step": 555040, "epoch": 6687} {"train_loss": -27.89436912536621, "global_step": 555041, "epoch": 6687} {"train_loss": -27.26631736755371, "global_step": 555042, "epoch": 6687} {"train_loss": -27.503437042236328, "global_step": 555043, "epoch": 6687} {"train_loss": -28.071088790893555, "global_step": 555044, "epoch": 6687} {"train_loss": -27.603612899780273, "global_step": 555045, "epoch": 6687} {"train_loss": -27.73343276977539, "global_step": 555046, "epoch": 6687} {"train_loss": -27.639694213867188, "global_step": 555047, "epoch": 6687} {"train_loss": -27.901403427124023, "global_step": 555048, "epoch": 6687} {"train_loss": -27.634307861328125, "global_step": 555049, "epoch": 6687} {"train_loss": -27.600248336791992, "global_step": 555050, "epoch": 6687} {"train_loss": -27.709686279296875, "global_step": 555051, "epoch": 6687} {"train_loss": -27.693140029907227, "global_step": 555052, "epoch": 6687} {"train_loss": -27.572406768798828, "global_step": 555053, "epoch": 6687} {"train_loss": -28.154987335205078, "global_step": 555054, "epoch": 6687} {"train_loss": -27.998926162719727, "global_step": 555055, "epoch": 6687} {"train_loss": -27.302682876586914, "global_step": 555056, "epoch": 6687} {"train_loss": -27.99407386779785, "global_step": 555057, "epoch": 6687} {"train_loss": -27.888036727905273, "global_step": 555058, "epoch": 6687} {"train_loss": -28.008228302001953, "global_step": 555059, "epoch": 6687} {"train_loss": -27.788288116455078, "global_step": 555060, "epoch": 6687} {"train_loss": -27.871946334838867, "global_step": 555061, "epoch": 6687} {"train_loss": -27.878616333007812, "global_step": 555062, "epoch": 6687} {"train_loss": -28.0087890625, "global_step": 555063, "epoch": 6687} {"train_loss": -28.079059600830078, "global_step": 555064, "epoch": 6687} {"train_loss": -27.86394691467285, "global_step": 555065, "epoch": 6687} {"train_loss": -28.058130264282227, "global_step": 555066, "epoch": 6687} {"train_loss": -28.229284286499023, "global_step": 555067, "epoch": 6687} {"train_loss": -28.183820724487305, "global_step": 555068, "epoch": 6687} {"train_loss": -27.978164672851562, "global_step": 555069, "epoch": 6687} {"train_loss": -27.770109176635742, "global_step": 555070, "epoch": 6687} {"train_loss": -28.004302978515625, "global_step": 555071, "epoch": 6687} {"train_loss": -27.98388671875, "global_step": 555072, "epoch": 6687} {"train_loss": -27.933979034423828, "global_step": 555073, "epoch": 6687} {"train_loss": -28.235448837280273, "global_step": 555074, "epoch": 6687} {"train_loss": -27.76666831970215, "global_step": 555075, "epoch": 6687} {"train_loss": -27.914478302001953, "global_step": 555076, "epoch": 6687} {"train_loss": -28.038101196289062, "global_step": 555077, "epoch": 6687} {"train_loss": -27.793607711791992, "global_step": 555078, "epoch": 6687} {"train_loss": -28.3419189453125, "global_step": 555079, "epoch": 6687} {"train_loss": -27.953458786010742, "global_step": 555080, "epoch": 6687} {"train_loss": -27.478647232055664, "global_step": 555081, "epoch": 6687} {"train_loss": -27.716882705688477, "global_step": 555082, "epoch": 6687} {"train_loss": -27.463083267211914, "global_step": 555083, "epoch": 6687} {"train_loss": -27.364227294921875, "global_step": 555084, "epoch": 6687} {"train_loss": -27.4012508392334, "global_step": 555085, "epoch": 6687} {"train_loss": -27.011682510375977, "global_step": 555086, "epoch": 6687} {"train_loss": -27.02044105529785, "global_step": 555087, "epoch": 6687} {"train_loss": -27.708036422729492, "global_step": 555088, "epoch": 6687} {"train_loss": -28.052988052368164, "global_step": 555089, "epoch": 6687} {"train_loss": -27.2279052734375, "global_step": 555090, "epoch": 6687} {"train_loss": -27.372425079345703, "global_step": 555091, "epoch": 6687} {"train_loss": -27.777191162109375, "global_step": 555092, "epoch": 6687} {"train_loss": -27.557565689086914, "global_step": 555093, "epoch": 6687} {"train_loss": -27.930784225463867, "global_step": 555094, "epoch": 6687} {"train_loss": -27.828948974609375, "global_step": 555095, "epoch": 6687} {"train_loss": -28.101144790649414, "global_step": 555096, "epoch": 6687} {"train_loss": -27.179990768432617, "global_step": 555097, "epoch": 6687} {"train_loss": -27.8079833984375, "global_step": 555098, "epoch": 6687} {"train_loss": -27.722681045532227, "global_step": 555099, "epoch": 6687} {"train_loss": -27.973636627197266, "global_step": 555100, "epoch": 6687} {"train_loss": -27.820119857788086, "global_step": 555101, "epoch": 6687} {"train_loss": -27.6127872467041, "global_step": 555102, "epoch": 6687} {"train_loss": -27.608112381165284, "global_step": 555103, "epoch": 6687, "val_loss": 6556355.0} {"train_loss": -27.38813591003418, "global_step": 555104, "epoch": 6688} {"train_loss": -27.31355857849121, "global_step": 555105, "epoch": 6688} {"train_loss": -27.115894317626953, "global_step": 555106, "epoch": 6688} {"train_loss": -27.121824264526367, "global_step": 555107, "epoch": 6688} {"train_loss": -27.235376358032227, "global_step": 555108, "epoch": 6688} {"train_loss": -27.25282096862793, "global_step": 555109, "epoch": 6688} {"train_loss": -27.061811447143555, "global_step": 555110, "epoch": 6688} {"train_loss": -27.19961929321289, "global_step": 555111, "epoch": 6688} {"train_loss": -27.204181671142578, "global_step": 555112, "epoch": 6688} {"train_loss": -27.413837432861328, "global_step": 555113, "epoch": 6688} {"train_loss": -27.372604370117188, "global_step": 555114, "epoch": 6688} {"train_loss": -27.12064552307129, "global_step": 555115, "epoch": 6688} {"train_loss": -27.3887939453125, "global_step": 555116, "epoch": 6688} {"train_loss": -27.372802734375, "global_step": 555117, "epoch": 6688} {"train_loss": -27.202756881713867, "global_step": 555118, "epoch": 6688} {"train_loss": -27.442840576171875, "global_step": 555119, "epoch": 6688} {"train_loss": -27.774738311767578, "global_step": 555120, "epoch": 6688} {"train_loss": -27.566986083984375, "global_step": 555121, "epoch": 6688} {"train_loss": -27.30313491821289, "global_step": 555122, "epoch": 6688} {"train_loss": -27.412128448486328, "global_step": 555123, "epoch": 6688} {"train_loss": -27.254013061523438, "global_step": 555124, "epoch": 6688} {"train_loss": -28.07666015625, "global_step": 555125, "epoch": 6688} {"train_loss": -27.605331420898438, "global_step": 555126, "epoch": 6688} {"train_loss": -27.58892822265625, "global_step": 555127, "epoch": 6688} {"train_loss": -27.9191951751709, "global_step": 555128, "epoch": 6688} {"train_loss": -27.514799118041992, "global_step": 555129, "epoch": 6688} {"train_loss": -27.830411911010742, "global_step": 555130, "epoch": 6688} {"train_loss": -27.538116455078125, "global_step": 555131, "epoch": 6688} {"train_loss": -27.513320922851562, "global_step": 555132, "epoch": 6688} {"train_loss": -27.9141845703125, "global_step": 555133, "epoch": 6688} {"train_loss": -27.747604370117188, "global_step": 555134, "epoch": 6688} {"train_loss": -27.51857566833496, "global_step": 555135, "epoch": 6688} {"train_loss": -27.84559440612793, "global_step": 555136, "epoch": 6688} {"train_loss": -27.620389938354492, "global_step": 555137, "epoch": 6688} {"train_loss": -27.669485092163086, "global_step": 555138, "epoch": 6688} {"train_loss": -27.70037841796875, "global_step": 555139, "epoch": 6688} {"train_loss": -27.595190048217773, "global_step": 555140, "epoch": 6688} {"train_loss": -27.69636344909668, "global_step": 555141, "epoch": 6688} {"train_loss": -27.849721908569336, "global_step": 555142, "epoch": 6688} {"train_loss": -27.676427841186523, "global_step": 555143, "epoch": 6688} {"train_loss": -27.78444480895996, "global_step": 555144, "epoch": 6688} {"train_loss": -27.992053985595703, "global_step": 555145, "epoch": 6688} {"train_loss": -27.985977172851562, "global_step": 555146, "epoch": 6688} {"train_loss": -28.189228057861328, "global_step": 555147, "epoch": 6688} {"train_loss": -27.927717208862305, "global_step": 555148, "epoch": 6688} {"train_loss": -27.853260040283203, "global_step": 555149, "epoch": 6688} {"train_loss": -27.86572265625, "global_step": 555150, "epoch": 6688} {"train_loss": -27.764652252197266, "global_step": 555151, "epoch": 6688} {"train_loss": -28.027372360229492, "global_step": 555152, "epoch": 6688} {"train_loss": -27.99053955078125, "global_step": 555153, "epoch": 6688} {"train_loss": -27.968481063842773, "global_step": 555154, "epoch": 6688} {"train_loss": -28.17477798461914, "global_step": 555155, "epoch": 6688} {"train_loss": -27.790664672851562, "global_step": 555156, "epoch": 6688} {"train_loss": -27.5493221282959, "global_step": 555157, "epoch": 6688} {"train_loss": -27.3326416015625, "global_step": 555158, "epoch": 6688} {"train_loss": -26.7744083404541, "global_step": 555159, "epoch": 6688} {"train_loss": -27.054784774780273, "global_step": 555160, "epoch": 6688} {"train_loss": -27.536331176757812, "global_step": 555161, "epoch": 6688} {"train_loss": -27.6253662109375, "global_step": 555162, "epoch": 6688} {"train_loss": -27.54865074157715, "global_step": 555163, "epoch": 6688} {"train_loss": -27.557178497314453, "global_step": 555164, "epoch": 6688} {"train_loss": -27.575565338134766, "global_step": 555165, "epoch": 6688} {"train_loss": -27.5565185546875, "global_step": 555166, "epoch": 6688} {"train_loss": -28.04244041442871, "global_step": 555167, "epoch": 6688} {"train_loss": -27.674823760986328, "global_step": 555168, "epoch": 6688} {"train_loss": -27.561664581298828, "global_step": 555169, "epoch": 6688} {"train_loss": -28.032958984375, "global_step": 555170, "epoch": 6688} {"train_loss": -27.6044979095459, "global_step": 555171, "epoch": 6688} {"train_loss": -27.97246742248535, "global_step": 555172, "epoch": 6688} {"train_loss": -27.74000358581543, "global_step": 555173, "epoch": 6688} {"train_loss": -27.72500991821289, "global_step": 555174, "epoch": 6688} {"train_loss": -27.6375675201416, "global_step": 555175, "epoch": 6688} {"train_loss": -28.12993812561035, "global_step": 555176, "epoch": 6688} {"train_loss": -27.799848556518555, "global_step": 555177, "epoch": 6688} {"train_loss": -27.929716110229492, "global_step": 555178, "epoch": 6688} {"train_loss": -27.957311630249023, "global_step": 555179, "epoch": 6688} {"train_loss": -27.9758358001709, "global_step": 555180, "epoch": 6688} {"train_loss": -27.81635856628418, "global_step": 555181, "epoch": 6688} {"train_loss": -27.808210372924805, "global_step": 555182, "epoch": 6688} {"train_loss": -27.56833267211914, "global_step": 555183, "epoch": 6688} {"train_loss": -27.699655532836914, "global_step": 555184, "epoch": 6688} {"train_loss": -28.159772872924805, "global_step": 555185, "epoch": 6688} {"train_loss": -27.647646317999047, "global_step": 555186, "epoch": 6688, "val_loss": 6451230.0} {"train_loss": -27.11463737487793, "global_step": 555187, "epoch": 6689} {"train_loss": -27.493627548217773, "global_step": 555188, "epoch": 6689} {"train_loss": -27.026092529296875, "global_step": 555189, "epoch": 6689} {"train_loss": -27.130273818969727, "global_step": 555190, "epoch": 6689} {"train_loss": -27.2143611907959, "global_step": 555191, "epoch": 6689} {"train_loss": -27.70843505859375, "global_step": 555192, "epoch": 6689} {"train_loss": -27.29611587524414, "global_step": 555193, "epoch": 6689} {"train_loss": -27.55755615234375, "global_step": 555194, "epoch": 6689} {"train_loss": -27.770416259765625, "global_step": 555195, "epoch": 6689} {"train_loss": -27.075239181518555, "global_step": 555196, "epoch": 6689} {"train_loss": -27.555957794189453, "global_step": 555197, "epoch": 6689} {"train_loss": -27.063018798828125, "global_step": 555198, "epoch": 6689} {"train_loss": -27.079633712768555, "global_step": 555199, "epoch": 6689} {"train_loss": -27.669187545776367, "global_step": 555200, "epoch": 6689} {"train_loss": -27.039052963256836, "global_step": 555201, "epoch": 6689} {"train_loss": -27.696928024291992, "global_step": 555202, "epoch": 6689} {"train_loss": -27.319074630737305, "global_step": 555203, "epoch": 6689} {"train_loss": -27.86445426940918, "global_step": 555204, "epoch": 6689} {"train_loss": -27.682653427124023, "global_step": 555205, "epoch": 6689} {"train_loss": -27.892663955688477, "global_step": 555206, "epoch": 6689} {"train_loss": -27.388233184814453, "global_step": 555207, "epoch": 6689} {"train_loss": -27.96595573425293, "global_step": 555208, "epoch": 6689} {"train_loss": -27.7724552154541, "global_step": 555209, "epoch": 6689} {"train_loss": -27.755966186523438, "global_step": 555210, "epoch": 6689} {"train_loss": -27.855056762695312, "global_step": 555211, "epoch": 6689} {"train_loss": -27.35320472717285, "global_step": 555212, "epoch": 6689} {"train_loss": -28.219274520874023, "global_step": 555213, "epoch": 6689} {"train_loss": -27.48597526550293, "global_step": 555214, "epoch": 6689} {"train_loss": -27.547637939453125, "global_step": 555215, "epoch": 6689} {"train_loss": -27.52308464050293, "global_step": 555216, "epoch": 6689} {"train_loss": -27.468551635742188, "global_step": 555217, "epoch": 6689} {"train_loss": -27.781896591186523, "global_step": 555218, "epoch": 6689} {"train_loss": -27.79178237915039, "global_step": 555219, "epoch": 6689} {"train_loss": -27.670883178710938, "global_step": 555220, "epoch": 6689} {"train_loss": -27.952835083007812, "global_step": 555221, "epoch": 6689} {"train_loss": -27.817520141601562, "global_step": 555222, "epoch": 6689} {"train_loss": -27.807941436767578, "global_step": 555223, "epoch": 6689} {"train_loss": -27.8016300201416, "global_step": 555224, "epoch": 6689} {"train_loss": -27.750579833984375, "global_step": 555225, "epoch": 6689} {"train_loss": -27.825864791870117, "global_step": 555226, "epoch": 6689} {"train_loss": -27.429738998413086, "global_step": 555227, "epoch": 6689} {"train_loss": -27.73099136352539, "global_step": 555228, "epoch": 6689} {"train_loss": -27.778600692749023, "global_step": 555229, "epoch": 6689} {"train_loss": -27.479379653930664, "global_step": 555230, "epoch": 6689} {"train_loss": -28.15459632873535, "global_step": 555231, "epoch": 6689} {"train_loss": -27.671253204345703, "global_step": 555232, "epoch": 6689} {"train_loss": -27.879535675048828, "global_step": 555233, "epoch": 6689} {"train_loss": -27.888498306274414, "global_step": 555234, "epoch": 6689} {"train_loss": -27.844282150268555, "global_step": 555235, "epoch": 6689} {"train_loss": -27.722808837890625, "global_step": 555236, "epoch": 6689} {"train_loss": -27.763723373413086, "global_step": 555237, "epoch": 6689} {"train_loss": -27.308135986328125, "global_step": 555238, "epoch": 6689} {"train_loss": -27.841552734375, "global_step": 555239, "epoch": 6689} {"train_loss": -27.832233428955078, "global_step": 555240, "epoch": 6689} {"train_loss": -27.9666805267334, "global_step": 555241, "epoch": 6689} {"train_loss": -27.821624755859375, "global_step": 555242, "epoch": 6689} {"train_loss": -27.66217613220215, "global_step": 555243, "epoch": 6689} {"train_loss": -27.988203048706055, "global_step": 555244, "epoch": 6689} {"train_loss": -27.6464900970459, "global_step": 555245, "epoch": 6689} {"train_loss": -27.463916778564453, "global_step": 555246, "epoch": 6689} {"train_loss": -28.095922470092773, "global_step": 555247, "epoch": 6689} {"train_loss": -27.665332794189453, "global_step": 555248, "epoch": 6689} {"train_loss": -28.186248779296875, "global_step": 555249, "epoch": 6689} {"train_loss": -27.826953887939453, "global_step": 555250, "epoch": 6689} {"train_loss": -27.791473388671875, "global_step": 555251, "epoch": 6689} {"train_loss": -27.52652931213379, "global_step": 555252, "epoch": 6689} {"train_loss": -28.031585693359375, "global_step": 555253, "epoch": 6689} {"train_loss": -27.621835708618164, "global_step": 555254, "epoch": 6689} {"train_loss": -27.816303253173828, "global_step": 555255, "epoch": 6689} {"train_loss": -27.530731201171875, "global_step": 555256, "epoch": 6689} {"train_loss": -28.01743507385254, "global_step": 555257, "epoch": 6689} {"train_loss": -27.8673095703125, "global_step": 555258, "epoch": 6689} {"train_loss": -27.715717315673828, "global_step": 555259, "epoch": 6689} {"train_loss": -27.66487693786621, "global_step": 555260, "epoch": 6689} {"train_loss": -27.8585262298584, "global_step": 555261, "epoch": 6689} {"train_loss": -27.874723434448242, "global_step": 555262, "epoch": 6689} {"train_loss": -27.86720085144043, "global_step": 555263, "epoch": 6689} {"train_loss": -27.41558837890625, "global_step": 555264, "epoch": 6689} {"train_loss": -27.89556884765625, "global_step": 555265, "epoch": 6689} {"train_loss": -27.857620239257812, "global_step": 555266, "epoch": 6689} {"train_loss": -27.43292808532715, "global_step": 555267, "epoch": 6689} {"train_loss": -27.32623863220215, "global_step": 555268, "epoch": 6689} {"train_loss": -27.673872752361987, "global_step": 555269, "epoch": 6689, "val_loss": 6440688.5} {"train_loss": -26.800949096679688, "global_step": 555270, "epoch": 6690} {"train_loss": -26.620487213134766, "global_step": 555271, "epoch": 6690} {"train_loss": -26.276941299438477, "global_step": 555272, "epoch": 6690} {"train_loss": -25.841602325439453, "global_step": 555273, "epoch": 6690} {"train_loss": -26.988224029541016, "global_step": 555274, "epoch": 6690} {"train_loss": -26.547107696533203, "global_step": 555275, "epoch": 6690} {"train_loss": -26.085113525390625, "global_step": 555276, "epoch": 6690} {"train_loss": -27.143335342407227, "global_step": 555277, "epoch": 6690} {"train_loss": -27.286651611328125, "global_step": 555278, "epoch": 6690} {"train_loss": -27.11089515686035, "global_step": 555279, "epoch": 6690} {"train_loss": -27.27422523498535, "global_step": 555280, "epoch": 6690} {"train_loss": -27.180822372436523, "global_step": 555281, "epoch": 6690} {"train_loss": -26.971784591674805, "global_step": 555282, "epoch": 6690} {"train_loss": -27.46034049987793, "global_step": 555283, "epoch": 6690} {"train_loss": -27.237350463867188, "global_step": 555284, "epoch": 6690} {"train_loss": -27.340890884399414, "global_step": 555285, "epoch": 6690} {"train_loss": -27.721384048461914, "global_step": 555286, "epoch": 6690} {"train_loss": -27.494739532470703, "global_step": 555287, "epoch": 6690} {"train_loss": -27.431976318359375, "global_step": 555288, "epoch": 6690} {"train_loss": -27.37811851501465, "global_step": 555289, "epoch": 6690} {"train_loss": -27.429731369018555, "global_step": 555290, "epoch": 6690} {"train_loss": -27.561111450195312, "global_step": 555291, "epoch": 6690} {"train_loss": -27.243253707885742, "global_step": 555292, "epoch": 6690} {"train_loss": -27.631811141967773, "global_step": 555293, "epoch": 6690} {"train_loss": -27.603759765625, "global_step": 555294, "epoch": 6690} {"train_loss": -27.99969482421875, "global_step": 555295, "epoch": 6690} {"train_loss": -27.43866539001465, "global_step": 555296, "epoch": 6690} {"train_loss": -27.490463256835938, "global_step": 555297, "epoch": 6690} {"train_loss": -27.61097526550293, "global_step": 555298, "epoch": 6690} {"train_loss": -27.6606502532959, "global_step": 555299, "epoch": 6690} {"train_loss": -27.632246017456055, "global_step": 555300, "epoch": 6690} {"train_loss": -27.5709171295166, "global_step": 555301, "epoch": 6690} {"train_loss": -27.68665885925293, "global_step": 555302, "epoch": 6690} {"train_loss": -27.611719131469727, "global_step": 555303, "epoch": 6690} {"train_loss": -27.793231964111328, "global_step": 555304, "epoch": 6690} {"train_loss": -27.561080932617188, "global_step": 555305, "epoch": 6690} {"train_loss": -27.73769187927246, "global_step": 555306, "epoch": 6690} {"train_loss": -27.685205459594727, "global_step": 555307, "epoch": 6690} {"train_loss": -27.851552963256836, "global_step": 555308, "epoch": 6690} {"train_loss": -27.84563636779785, "global_step": 555309, "epoch": 6690} {"train_loss": -28.10359764099121, "global_step": 555310, "epoch": 6690} {"train_loss": -27.64322853088379, "global_step": 555311, "epoch": 6690} {"train_loss": -28.017292022705078, "global_step": 555312, "epoch": 6690} {"train_loss": -27.998945236206055, "global_step": 555313, "epoch": 6690} {"train_loss": -27.612165451049805, "global_step": 555314, "epoch": 6690} {"train_loss": -27.92205810546875, "global_step": 555315, "epoch": 6690} {"train_loss": -27.887481689453125, "global_step": 555316, "epoch": 6690} {"train_loss": -27.8013916015625, "global_step": 555317, "epoch": 6690} {"train_loss": -27.882217407226562, "global_step": 555318, "epoch": 6690} {"train_loss": -27.615650177001953, "global_step": 555319, "epoch": 6690} {"train_loss": -27.88092613220215, "global_step": 555320, "epoch": 6690} {"train_loss": -27.75983238220215, "global_step": 555321, "epoch": 6690} {"train_loss": -27.485727310180664, "global_step": 555322, "epoch": 6690} {"train_loss": -27.778379440307617, "global_step": 555323, "epoch": 6690} {"train_loss": -27.986988067626953, "global_step": 555324, "epoch": 6690} {"train_loss": -27.77259635925293, "global_step": 555325, "epoch": 6690} {"train_loss": -27.777151107788086, "global_step": 555326, "epoch": 6690} {"train_loss": -27.87920570373535, "global_step": 555327, "epoch": 6690} {"train_loss": -27.943439483642578, "global_step": 555328, "epoch": 6690} {"train_loss": -28.249048233032227, "global_step": 555329, "epoch": 6690} {"train_loss": -28.298416137695312, "global_step": 555330, "epoch": 6690} {"train_loss": -27.96497917175293, "global_step": 555331, "epoch": 6690} {"train_loss": -27.882925033569336, "global_step": 555332, "epoch": 6690} {"train_loss": -28.38947105407715, "global_step": 555333, "epoch": 6690} {"train_loss": -28.2081298828125, "global_step": 555334, "epoch": 6690} {"train_loss": -27.952972412109375, "global_step": 555335, "epoch": 6690} {"train_loss": -28.1345157623291, "global_step": 555336, "epoch": 6690} {"train_loss": -28.257699966430664, "global_step": 555337, "epoch": 6690} {"train_loss": -27.71510124206543, "global_step": 555338, "epoch": 6690} {"train_loss": -27.61372184753418, "global_step": 555339, "epoch": 6690} {"train_loss": -27.7539005279541, "global_step": 555340, "epoch": 6690} {"train_loss": -27.903182983398438, "global_step": 555341, "epoch": 6690} {"train_loss": -27.822113037109375, "global_step": 555342, "epoch": 6690} {"train_loss": -27.305206298828125, "global_step": 555343, "epoch": 6690} {"train_loss": -27.147430419921875, "global_step": 555344, "epoch": 6690} {"train_loss": -27.69886589050293, "global_step": 555345, "epoch": 6690} {"train_loss": -27.252431869506836, "global_step": 555346, "epoch": 6690} {"train_loss": -27.962560653686523, "global_step": 555347, "epoch": 6690} {"train_loss": -27.24989128112793, "global_step": 555348, "epoch": 6690} {"train_loss": -28.394824981689453, "global_step": 555349, "epoch": 6690} {"train_loss": -27.824071884155273, "global_step": 555350, "epoch": 6690} {"train_loss": -27.553543090820312, "global_step": 555351, "epoch": 6690} {"train_loss": -27.599171420177782, "global_step": 555352, "epoch": 6690, "val_loss": 6469093.0} {"train_loss": -27.438861846923828, "global_step": 555353, "epoch": 6691} {"train_loss": -27.18830680847168, "global_step": 555354, "epoch": 6691} {"train_loss": -27.322589874267578, "global_step": 555355, "epoch": 6691} {"train_loss": -27.205114364624023, "global_step": 555356, "epoch": 6691} {"train_loss": -27.13864517211914, "global_step": 555357, "epoch": 6691} {"train_loss": -26.984832763671875, "global_step": 555358, "epoch": 6691} {"train_loss": -27.42121696472168, "global_step": 555359, "epoch": 6691} {"train_loss": -27.111658096313477, "global_step": 555360, "epoch": 6691} {"train_loss": -27.51551628112793, "global_step": 555361, "epoch": 6691} {"train_loss": -27.061437606811523, "global_step": 555362, "epoch": 6691} {"train_loss": -27.08746910095215, "global_step": 555363, "epoch": 6691} {"train_loss": -27.35188102722168, "global_step": 555364, "epoch": 6691} {"train_loss": -27.847198486328125, "global_step": 555365, "epoch": 6691} {"train_loss": -27.59939956665039, "global_step": 555366, "epoch": 6691} {"train_loss": -27.335224151611328, "global_step": 555367, "epoch": 6691} {"train_loss": -27.689340591430664, "global_step": 555368, "epoch": 6691} {"train_loss": -27.513105392456055, "global_step": 555369, "epoch": 6691} {"train_loss": -27.409997940063477, "global_step": 555370, "epoch": 6691} {"train_loss": -28.127506256103516, "global_step": 555371, "epoch": 6691} {"train_loss": -27.659793853759766, "global_step": 555372, "epoch": 6691} {"train_loss": -27.81683921813965, "global_step": 555373, "epoch": 6691} {"train_loss": -27.621448516845703, "global_step": 555374, "epoch": 6691} {"train_loss": -27.64625358581543, "global_step": 555375, "epoch": 6691} {"train_loss": -27.76847267150879, "global_step": 555376, "epoch": 6691} {"train_loss": -27.610218048095703, "global_step": 555377, "epoch": 6691} {"train_loss": -27.967187881469727, "global_step": 555378, "epoch": 6691} {"train_loss": -27.534332275390625, "global_step": 555379, "epoch": 6691} {"train_loss": -28.132787704467773, "global_step": 555380, "epoch": 6691} {"train_loss": -27.72562599182129, "global_step": 555381, "epoch": 6691} {"train_loss": -27.6781005859375, "global_step": 555382, "epoch": 6691} {"train_loss": -27.431385040283203, "global_step": 555383, "epoch": 6691} {"train_loss": -27.95685386657715, "global_step": 555384, "epoch": 6691} {"train_loss": -27.6956729888916, "global_step": 555385, "epoch": 6691} {"train_loss": -28.276447296142578, "global_step": 555386, "epoch": 6691} {"train_loss": -27.840152740478516, "global_step": 555387, "epoch": 6691} {"train_loss": -27.680994033813477, "global_step": 555388, "epoch": 6691} {"train_loss": -27.854467391967773, "global_step": 555389, "epoch": 6691} {"train_loss": -27.57244300842285, "global_step": 555390, "epoch": 6691} {"train_loss": -27.789432525634766, "global_step": 555391, "epoch": 6691} {"train_loss": -28.09560203552246, "global_step": 555392, "epoch": 6691} {"train_loss": -27.86140251159668, "global_step": 555393, "epoch": 6691} {"train_loss": -27.978424072265625, "global_step": 555394, "epoch": 6691} {"train_loss": -28.17768669128418, "global_step": 555395, "epoch": 6691} {"train_loss": -27.673322677612305, "global_step": 555396, "epoch": 6691} {"train_loss": -28.04803466796875, "global_step": 555397, "epoch": 6691} {"train_loss": -27.625045776367188, "global_step": 555398, "epoch": 6691} {"train_loss": -27.900146484375, "global_step": 555399, "epoch": 6691} {"train_loss": -27.743528366088867, "global_step": 555400, "epoch": 6691} {"train_loss": -27.809507369995117, "global_step": 555401, "epoch": 6691} {"train_loss": -27.867557525634766, "global_step": 555402, "epoch": 6691} {"train_loss": -27.85160255432129, "global_step": 555403, "epoch": 6691} {"train_loss": -27.6993408203125, "global_step": 555404, "epoch": 6691} {"train_loss": -27.48145866394043, "global_step": 555405, "epoch": 6691} {"train_loss": -26.883747100830078, "global_step": 555406, "epoch": 6691} {"train_loss": -27.206445693969727, "global_step": 555407, "epoch": 6691} {"train_loss": -27.434585571289062, "global_step": 555408, "epoch": 6691} {"train_loss": -27.519208908081055, "global_step": 555409, "epoch": 6691} {"train_loss": -27.579721450805664, "global_step": 555410, "epoch": 6691} {"train_loss": -27.41230583190918, "global_step": 555411, "epoch": 6691} {"train_loss": -27.623388290405273, "global_step": 555412, "epoch": 6691} {"train_loss": -27.40850257873535, "global_step": 555413, "epoch": 6691} {"train_loss": -27.353437423706055, "global_step": 555414, "epoch": 6691} {"train_loss": -27.45977210998535, "global_step": 555415, "epoch": 6691} {"train_loss": -27.519052505493164, "global_step": 555416, "epoch": 6691} {"train_loss": -27.25211524963379, "global_step": 555417, "epoch": 6691} {"train_loss": -27.331344604492188, "global_step": 555418, "epoch": 6691} {"train_loss": -27.856481552124023, "global_step": 555419, "epoch": 6691} {"train_loss": -27.556812286376953, "global_step": 555420, "epoch": 6691} {"train_loss": -27.911869049072266, "global_step": 555421, "epoch": 6691} {"train_loss": -27.733274459838867, "global_step": 555422, "epoch": 6691} {"train_loss": -27.68735694885254, "global_step": 555423, "epoch": 6691} {"train_loss": -27.848791122436523, "global_step": 555424, "epoch": 6691} {"train_loss": -27.82156753540039, "global_step": 555425, "epoch": 6691} {"train_loss": -27.591110229492188, "global_step": 555426, "epoch": 6691} {"train_loss": -27.76850700378418, "global_step": 555427, "epoch": 6691} {"train_loss": -28.06305503845215, "global_step": 555428, "epoch": 6691} {"train_loss": -27.597366333007812, "global_step": 555429, "epoch": 6691} {"train_loss": -27.6337833404541, "global_step": 555430, "epoch": 6691} {"train_loss": -27.812368392944336, "global_step": 555431, "epoch": 6691} {"train_loss": -27.94672203063965, "global_step": 555432, "epoch": 6691} {"train_loss": -27.903934478759766, "global_step": 555433, "epoch": 6691} {"train_loss": -28.084014892578125, "global_step": 555434, "epoch": 6691} {"train_loss": -27.631291010293616, "global_step": 555435, "epoch": 6691, "val_loss": 6429676.0} {"train_loss": -26.886083602905273, "global_step": 555436, "epoch": 6692} {"train_loss": -27.37079429626465, "global_step": 555437, "epoch": 6692} {"train_loss": -27.704345703125, "global_step": 555438, "epoch": 6692} {"train_loss": -27.61683464050293, "global_step": 555439, "epoch": 6692} {"train_loss": -27.547672271728516, "global_step": 555440, "epoch": 6692} {"train_loss": -27.524465560913086, "global_step": 555441, "epoch": 6692} {"train_loss": -27.086660385131836, "global_step": 555442, "epoch": 6692} {"train_loss": -27.361194610595703, "global_step": 555443, "epoch": 6692} {"train_loss": -27.2186336517334, "global_step": 555444, "epoch": 6692} {"train_loss": -27.704126358032227, "global_step": 555445, "epoch": 6692} {"train_loss": -27.185251235961914, "global_step": 555446, "epoch": 6692} {"train_loss": -27.392353057861328, "global_step": 555447, "epoch": 6692} {"train_loss": -27.858976364135742, "global_step": 555448, "epoch": 6692} {"train_loss": -27.471572875976562, "global_step": 555449, "epoch": 6692} {"train_loss": -27.27781105041504, "global_step": 555450, "epoch": 6692} {"train_loss": -27.148975372314453, "global_step": 555451, "epoch": 6692} {"train_loss": -27.358383178710938, "global_step": 555452, "epoch": 6692} {"train_loss": -27.076812744140625, "global_step": 555453, "epoch": 6692} {"train_loss": -27.431970596313477, "global_step": 555454, "epoch": 6692} {"train_loss": -27.92207908630371, "global_step": 555455, "epoch": 6692} {"train_loss": -27.680164337158203, "global_step": 555456, "epoch": 6692} {"train_loss": -27.55779457092285, "global_step": 555457, "epoch": 6692} {"train_loss": -27.66358757019043, "global_step": 555458, "epoch": 6692} {"train_loss": -27.817602157592773, "global_step": 555459, "epoch": 6692} {"train_loss": -27.47002601623535, "global_step": 555460, "epoch": 6692} {"train_loss": -27.736902236938477, "global_step": 555461, "epoch": 6692} {"train_loss": -27.60563087463379, "global_step": 555462, "epoch": 6692} {"train_loss": -27.726089477539062, "global_step": 555463, "epoch": 6692} {"train_loss": -27.46002769470215, "global_step": 555464, "epoch": 6692} {"train_loss": -27.66567039489746, "global_step": 555465, "epoch": 6692} {"train_loss": -27.728443145751953, "global_step": 555466, "epoch": 6692} {"train_loss": -27.663644790649414, "global_step": 555467, "epoch": 6692} {"train_loss": -27.72989845275879, "global_step": 555468, "epoch": 6692} {"train_loss": -27.86231803894043, "global_step": 555469, "epoch": 6692} {"train_loss": -27.69659423828125, "global_step": 555470, "epoch": 6692} {"train_loss": -27.986209869384766, "global_step": 555471, "epoch": 6692} {"train_loss": -28.229583740234375, "global_step": 555472, "epoch": 6692} {"train_loss": -28.143564224243164, "global_step": 555473, "epoch": 6692} {"train_loss": -27.709333419799805, "global_step": 555474, "epoch": 6692} {"train_loss": -27.760828018188477, "global_step": 555475, "epoch": 6692} {"train_loss": -28.146320343017578, "global_step": 555476, "epoch": 6692} {"train_loss": -27.924062728881836, "global_step": 555477, "epoch": 6692} {"train_loss": -28.038049697875977, "global_step": 555478, "epoch": 6692} {"train_loss": -27.910749435424805, "global_step": 555479, "epoch": 6692} {"train_loss": -27.84766960144043, "global_step": 555480, "epoch": 6692} {"train_loss": -27.954792022705078, "global_step": 555481, "epoch": 6692} {"train_loss": -27.7252254486084, "global_step": 555482, "epoch": 6692} {"train_loss": -27.574201583862305, "global_step": 555483, "epoch": 6692} {"train_loss": -27.759674072265625, "global_step": 555484, "epoch": 6692} {"train_loss": -28.00265884399414, "global_step": 555485, "epoch": 6692} {"train_loss": -28.022668838500977, "global_step": 555486, "epoch": 6692} {"train_loss": -28.299819946289062, "global_step": 555487, "epoch": 6692} {"train_loss": -27.752466201782227, "global_step": 555488, "epoch": 6692} {"train_loss": -27.93012046813965, "global_step": 555489, "epoch": 6692} {"train_loss": -28.044946670532227, "global_step": 555490, "epoch": 6692} {"train_loss": -27.817533493041992, "global_step": 555491, "epoch": 6692} {"train_loss": -27.966833114624023, "global_step": 555492, "epoch": 6692} {"train_loss": -28.269306182861328, "global_step": 555493, "epoch": 6692} {"train_loss": -28.0125789642334, "global_step": 555494, "epoch": 6692} {"train_loss": -28.1685848236084, "global_step": 555495, "epoch": 6692} {"train_loss": -27.856098175048828, "global_step": 555496, "epoch": 6692} {"train_loss": -27.88616371154785, "global_step": 555497, "epoch": 6692} {"train_loss": -26.548084259033203, "global_step": 555498, "epoch": 6692} {"train_loss": -24.993486404418945, "global_step": 555499, "epoch": 6692} {"train_loss": -25.1186580657959, "global_step": 555500, "epoch": 6692} {"train_loss": -25.8033504486084, "global_step": 555501, "epoch": 6692} {"train_loss": -26.659570693969727, "global_step": 555502, "epoch": 6692} {"train_loss": -26.910276412963867, "global_step": 555503, "epoch": 6692} {"train_loss": -26.983129501342773, "global_step": 555504, "epoch": 6692} {"train_loss": -27.24432945251465, "global_step": 555505, "epoch": 6692} {"train_loss": -27.293787002563477, "global_step": 555506, "epoch": 6692} {"train_loss": -27.425745010375977, "global_step": 555507, "epoch": 6692} {"train_loss": -27.43601417541504, "global_step": 555508, "epoch": 6692} {"train_loss": -27.35365104675293, "global_step": 555509, "epoch": 6692} {"train_loss": -27.44358253479004, "global_step": 555510, "epoch": 6692} {"train_loss": -27.67499351501465, "global_step": 555511, "epoch": 6692} {"train_loss": -27.48365592956543, "global_step": 555512, "epoch": 6692} {"train_loss": -27.37168312072754, "global_step": 555513, "epoch": 6692} {"train_loss": -27.656965255737305, "global_step": 555514, "epoch": 6692} {"train_loss": -27.254735946655273, "global_step": 555515, "epoch": 6692} {"train_loss": -27.34918785095215, "global_step": 555516, "epoch": 6692} {"train_loss": -27.578964233398438, "global_step": 555517, "epoch": 6692} {"train_loss": -27.526461842548418, "global_step": 555518, "epoch": 6692, "val_loss": 6368133.0} {"train_loss": -26.963855743408203, "global_step": 555519, "epoch": 6693} {"train_loss": -27.580041885375977, "global_step": 555520, "epoch": 6693} {"train_loss": -27.080902099609375, "global_step": 555521, "epoch": 6693} {"train_loss": -27.078083038330078, "global_step": 555522, "epoch": 6693} {"train_loss": -27.509077072143555, "global_step": 555523, "epoch": 6693} {"train_loss": -27.33253288269043, "global_step": 555524, "epoch": 6693} {"train_loss": -27.620529174804688, "global_step": 555525, "epoch": 6693} {"train_loss": -27.023181915283203, "global_step": 555526, "epoch": 6693} {"train_loss": -27.496952056884766, "global_step": 555527, "epoch": 6693} {"train_loss": -27.418439865112305, "global_step": 555528, "epoch": 6693} {"train_loss": -26.992298126220703, "global_step": 555529, "epoch": 6693} {"train_loss": -27.606769561767578, "global_step": 555530, "epoch": 6693} {"train_loss": -27.215375900268555, "global_step": 555531, "epoch": 6693} {"train_loss": -27.50697898864746, "global_step": 555532, "epoch": 6693} {"train_loss": -27.54201316833496, "global_step": 555533, "epoch": 6693} {"train_loss": -27.41644287109375, "global_step": 555534, "epoch": 6693} {"train_loss": -27.878747940063477, "global_step": 555535, "epoch": 6693} {"train_loss": -27.454391479492188, "global_step": 555536, "epoch": 6693} {"train_loss": -27.285388946533203, "global_step": 555537, "epoch": 6693} {"train_loss": -27.374753952026367, "global_step": 555538, "epoch": 6693} {"train_loss": -27.483495712280273, "global_step": 555539, "epoch": 6693} {"train_loss": -27.641759872436523, "global_step": 555540, "epoch": 6693} {"train_loss": -27.581777572631836, "global_step": 555541, "epoch": 6693} {"train_loss": -27.80427360534668, "global_step": 555542, "epoch": 6693} {"train_loss": -27.704669952392578, "global_step": 555543, "epoch": 6693} {"train_loss": -27.564197540283203, "global_step": 555544, "epoch": 6693} {"train_loss": -27.865652084350586, "global_step": 555545, "epoch": 6693} {"train_loss": -27.245351791381836, "global_step": 555546, "epoch": 6693} {"train_loss": -27.8345947265625, "global_step": 555547, "epoch": 6693} {"train_loss": -27.454572677612305, "global_step": 555548, "epoch": 6693} {"train_loss": -27.735265731811523, "global_step": 555549, "epoch": 6693} {"train_loss": -27.654422760009766, "global_step": 555550, "epoch": 6693} {"train_loss": -27.643644332885742, "global_step": 555551, "epoch": 6693} {"train_loss": -27.7373046875, "global_step": 555552, "epoch": 6693} {"train_loss": -27.833478927612305, "global_step": 555553, "epoch": 6693} {"train_loss": -27.636316299438477, "global_step": 555554, "epoch": 6693} {"train_loss": -27.54676628112793, "global_step": 555555, "epoch": 6693} {"train_loss": -28.08424186706543, "global_step": 555556, "epoch": 6693} {"train_loss": -27.6510009765625, "global_step": 555557, "epoch": 6693} {"train_loss": -28.099287033081055, "global_step": 555558, "epoch": 6693} {"train_loss": -27.89874839782715, "global_step": 555559, "epoch": 6693} {"train_loss": -27.727224349975586, "global_step": 555560, "epoch": 6693} {"train_loss": -27.675586700439453, "global_step": 555561, "epoch": 6693} {"train_loss": -27.96046257019043, "global_step": 555562, "epoch": 6693} {"train_loss": -28.019729614257812, "global_step": 555563, "epoch": 6693} {"train_loss": -27.761926651000977, "global_step": 555564, "epoch": 6693} {"train_loss": -27.95491600036621, "global_step": 555565, "epoch": 6693} {"train_loss": -27.7889404296875, "global_step": 555566, "epoch": 6693} {"train_loss": -27.99318504333496, "global_step": 555567, "epoch": 6693} {"train_loss": -27.981760025024414, "global_step": 555568, "epoch": 6693} {"train_loss": -28.075422286987305, "global_step": 555569, "epoch": 6693} {"train_loss": -27.928497314453125, "global_step": 555570, "epoch": 6693} {"train_loss": -27.800683975219727, "global_step": 555571, "epoch": 6693} {"train_loss": -27.7440185546875, "global_step": 555572, "epoch": 6693} {"train_loss": -27.644622802734375, "global_step": 555573, "epoch": 6693} {"train_loss": -27.523290634155273, "global_step": 555574, "epoch": 6693} {"train_loss": -27.6273193359375, "global_step": 555575, "epoch": 6693} {"train_loss": -27.369003295898438, "global_step": 555576, "epoch": 6693} {"train_loss": -27.722570419311523, "global_step": 555577, "epoch": 6693} {"train_loss": -27.76116943359375, "global_step": 555578, "epoch": 6693} {"train_loss": -27.73117446899414, "global_step": 555579, "epoch": 6693} {"train_loss": -27.886194229125977, "global_step": 555580, "epoch": 6693} {"train_loss": -27.83013343811035, "global_step": 555581, "epoch": 6693} {"train_loss": -27.87550163269043, "global_step": 555582, "epoch": 6693} {"train_loss": -28.00481605529785, "global_step": 555583, "epoch": 6693} {"train_loss": -28.071441650390625, "global_step": 555584, "epoch": 6693} {"train_loss": -27.993921279907227, "global_step": 555585, "epoch": 6693} {"train_loss": -27.62748146057129, "global_step": 555586, "epoch": 6693} {"train_loss": -27.8980712890625, "global_step": 555587, "epoch": 6693} {"train_loss": -27.929243087768555, "global_step": 555588, "epoch": 6693} {"train_loss": -28.382293701171875, "global_step": 555589, "epoch": 6693} {"train_loss": -27.732725143432617, "global_step": 555590, "epoch": 6693} {"train_loss": -27.86427879333496, "global_step": 555591, "epoch": 6693} {"train_loss": -27.820287704467773, "global_step": 555592, "epoch": 6693} {"train_loss": -28.07464599609375, "global_step": 555593, "epoch": 6693} {"train_loss": -28.35719108581543, "global_step": 555594, "epoch": 6693} {"train_loss": -27.537525177001953, "global_step": 555595, "epoch": 6693} {"train_loss": -27.659534454345703, "global_step": 555596, "epoch": 6693} {"train_loss": -27.424030303955078, "global_step": 555597, "epoch": 6693} {"train_loss": -27.752676010131836, "global_step": 555598, "epoch": 6693} {"train_loss": -27.732892990112305, "global_step": 555599, "epoch": 6693} {"train_loss": -27.52784538269043, "global_step": 555600, "epoch": 6693} {"train_loss": -27.669301389211633, "global_step": 555601, "epoch": 6693, "val_loss": 6406871.0} {"train_loss": -27.684972763061523, "global_step": 555602, "epoch": 6694} {"train_loss": -27.747159957885742, "global_step": 555603, "epoch": 6694} {"train_loss": -27.13522720336914, "global_step": 555604, "epoch": 6694} {"train_loss": -27.854883193969727, "global_step": 555605, "epoch": 6694} {"train_loss": -27.629425048828125, "global_step": 555606, "epoch": 6694} {"train_loss": -27.459182739257812, "global_step": 555607, "epoch": 6694} {"train_loss": -27.4361629486084, "global_step": 555608, "epoch": 6694} {"train_loss": -27.5338134765625, "global_step": 555609, "epoch": 6694} {"train_loss": -27.752317428588867, "global_step": 555610, "epoch": 6694} {"train_loss": -27.6428279876709, "global_step": 555611, "epoch": 6694} {"train_loss": -27.73911476135254, "global_step": 555612, "epoch": 6694} {"train_loss": -27.6846866607666, "global_step": 555613, "epoch": 6694} {"train_loss": -27.514570236206055, "global_step": 555614, "epoch": 6694} {"train_loss": -27.83112144470215, "global_step": 555615, "epoch": 6694} {"train_loss": -28.011877059936523, "global_step": 555616, "epoch": 6694} {"train_loss": -27.899093627929688, "global_step": 555617, "epoch": 6694} {"train_loss": -27.31235694885254, "global_step": 555618, "epoch": 6694} {"train_loss": -27.713687896728516, "global_step": 555619, "epoch": 6694} {"train_loss": -27.586400985717773, "global_step": 555620, "epoch": 6694} {"train_loss": -27.496723175048828, "global_step": 555621, "epoch": 6694} {"train_loss": -27.766454696655273, "global_step": 555622, "epoch": 6694} {"train_loss": -27.856603622436523, "global_step": 555623, "epoch": 6694} {"train_loss": -27.756986618041992, "global_step": 555624, "epoch": 6694} {"train_loss": -27.701404571533203, "global_step": 555625, "epoch": 6694} {"train_loss": -27.564178466796875, "global_step": 555626, "epoch": 6694} {"train_loss": -27.781091690063477, "global_step": 555627, "epoch": 6694} {"train_loss": -27.790578842163086, "global_step": 555628, "epoch": 6694} {"train_loss": -27.773193359375, "global_step": 555629, "epoch": 6694} {"train_loss": -27.876554489135742, "global_step": 555630, "epoch": 6694} {"train_loss": -28.044281005859375, "global_step": 555631, "epoch": 6694} {"train_loss": -27.858190536499023, "global_step": 555632, "epoch": 6694} {"train_loss": -27.266128540039062, "global_step": 555633, "epoch": 6694} {"train_loss": -27.448637008666992, "global_step": 555634, "epoch": 6694} {"train_loss": -27.090497970581055, "global_step": 555635, "epoch": 6694} {"train_loss": -26.91206932067871, "global_step": 555636, "epoch": 6694} {"train_loss": -27.608905792236328, "global_step": 555637, "epoch": 6694} {"train_loss": -27.861425399780273, "global_step": 555638, "epoch": 6694} {"train_loss": -26.805845260620117, "global_step": 555639, "epoch": 6694} {"train_loss": -27.5704288482666, "global_step": 555640, "epoch": 6694} {"train_loss": -27.557498931884766, "global_step": 555641, "epoch": 6694} {"train_loss": -27.26032829284668, "global_step": 555642, "epoch": 6694} {"train_loss": -27.420501708984375, "global_step": 555643, "epoch": 6694} {"train_loss": -27.7761173248291, "global_step": 555644, "epoch": 6694} {"train_loss": -26.933679580688477, "global_step": 555645, "epoch": 6694} {"train_loss": -27.50429344177246, "global_step": 555646, "epoch": 6694} {"train_loss": -27.386524200439453, "global_step": 555647, "epoch": 6694} {"train_loss": -27.7132511138916, "global_step": 555648, "epoch": 6694} {"train_loss": -27.05314064025879, "global_step": 555649, "epoch": 6694} {"train_loss": -27.34629249572754, "global_step": 555650, "epoch": 6694} {"train_loss": -27.528156280517578, "global_step": 555651, "epoch": 6694} {"train_loss": -27.611066818237305, "global_step": 555652, "epoch": 6694} {"train_loss": -27.743194580078125, "global_step": 555653, "epoch": 6694} {"train_loss": -27.685617446899414, "global_step": 555654, "epoch": 6694} {"train_loss": -27.981937408447266, "global_step": 555655, "epoch": 6694} {"train_loss": -27.78549575805664, "global_step": 555656, "epoch": 6694} {"train_loss": -27.5277099609375, "global_step": 555657, "epoch": 6694} {"train_loss": -27.992944717407227, "global_step": 555658, "epoch": 6694} {"train_loss": -27.693546295166016, "global_step": 555659, "epoch": 6694} {"train_loss": -27.982046127319336, "global_step": 555660, "epoch": 6694} {"train_loss": -28.26177978515625, "global_step": 555661, "epoch": 6694} {"train_loss": -28.05366325378418, "global_step": 555662, "epoch": 6694} {"train_loss": -28.17527198791504, "global_step": 555663, "epoch": 6694} {"train_loss": -28.042327880859375, "global_step": 555664, "epoch": 6694} {"train_loss": -27.675312042236328, "global_step": 555665, "epoch": 6694} {"train_loss": -28.05946922302246, "global_step": 555666, "epoch": 6694} {"train_loss": -27.784759521484375, "global_step": 555667, "epoch": 6694} {"train_loss": -27.764774322509766, "global_step": 555668, "epoch": 6694} {"train_loss": -28.192218780517578, "global_step": 555669, "epoch": 6694} {"train_loss": -27.712879180908203, "global_step": 555670, "epoch": 6694} {"train_loss": -27.755918502807617, "global_step": 555671, "epoch": 6694} {"train_loss": -27.90964698791504, "global_step": 555672, "epoch": 6694} {"train_loss": -28.051076889038086, "global_step": 555673, "epoch": 6694} {"train_loss": -27.805002212524414, "global_step": 555674, "epoch": 6694} {"train_loss": -27.88608741760254, "global_step": 555675, "epoch": 6694} {"train_loss": -27.819955825805664, "global_step": 555676, "epoch": 6694} {"train_loss": -27.83733558654785, "global_step": 555677, "epoch": 6694} {"train_loss": -28.1867733001709, "global_step": 555678, "epoch": 6694} {"train_loss": -27.410263061523438, "global_step": 555679, "epoch": 6694} {"train_loss": -28.111328125, "global_step": 555680, "epoch": 6694} {"train_loss": -27.850494384765625, "global_step": 555681, "epoch": 6694} {"train_loss": -28.028776168823242, "global_step": 555682, "epoch": 6694} {"train_loss": -27.393198013305664, "global_step": 555683, "epoch": 6694} {"train_loss": -27.692351605518756, "global_step": 555684, "epoch": 6694, "val_loss": 6427857.0} {"train_loss": -27.613290786743164, "global_step": 555685, "epoch": 6695} {"train_loss": -26.946887969970703, "global_step": 555686, "epoch": 6695} {"train_loss": -25.438016891479492, "global_step": 555687, "epoch": 6695} {"train_loss": -23.84842872619629, "global_step": 555688, "epoch": 6695} {"train_loss": -25.638355255126953, "global_step": 555689, "epoch": 6695} {"train_loss": -27.210968017578125, "global_step": 555690, "epoch": 6695} {"train_loss": -26.49066162109375, "global_step": 555691, "epoch": 6695} {"train_loss": -27.264066696166992, "global_step": 555692, "epoch": 6695} {"train_loss": -26.947265625, "global_step": 555693, "epoch": 6695} {"train_loss": -27.175214767456055, "global_step": 555694, "epoch": 6695} {"train_loss": -26.87367057800293, "global_step": 555695, "epoch": 6695} {"train_loss": -27.252716064453125, "global_step": 555696, "epoch": 6695} {"train_loss": -27.175939559936523, "global_step": 555697, "epoch": 6695} {"train_loss": -26.662067413330078, "global_step": 555698, "epoch": 6695} {"train_loss": -27.574304580688477, "global_step": 555699, "epoch": 6695} {"train_loss": -27.223861694335938, "global_step": 555700, "epoch": 6695} {"train_loss": -27.14951515197754, "global_step": 555701, "epoch": 6695} {"train_loss": -27.167524337768555, "global_step": 555702, "epoch": 6695} {"train_loss": -27.531457901000977, "global_step": 555703, "epoch": 6695} {"train_loss": -27.360321044921875, "global_step": 555704, "epoch": 6695} {"train_loss": -27.00784683227539, "global_step": 555705, "epoch": 6695} {"train_loss": -27.37652015686035, "global_step": 555706, "epoch": 6695} {"train_loss": -27.45196533203125, "global_step": 555707, "epoch": 6695} {"train_loss": -27.491943359375, "global_step": 555708, "epoch": 6695} {"train_loss": -27.47857666015625, "global_step": 555709, "epoch": 6695} {"train_loss": -27.33981704711914, "global_step": 555710, "epoch": 6695} {"train_loss": -27.25721549987793, "global_step": 555711, "epoch": 6695} {"train_loss": -27.2009334564209, "global_step": 555712, "epoch": 6695} {"train_loss": -27.602258682250977, "global_step": 555713, "epoch": 6695} {"train_loss": -27.173227310180664, "global_step": 555714, "epoch": 6695} {"train_loss": -27.281301498413086, "global_step": 555715, "epoch": 6695} {"train_loss": -27.298755645751953, "global_step": 555716, "epoch": 6695} {"train_loss": -27.596054077148438, "global_step": 555717, "epoch": 6695} {"train_loss": -27.68183708190918, "global_step": 555718, "epoch": 6695} {"train_loss": -27.68391227722168, "global_step": 555719, "epoch": 6695} {"train_loss": -27.436389923095703, "global_step": 555720, "epoch": 6695} {"train_loss": -27.600051879882812, "global_step": 555721, "epoch": 6695} {"train_loss": -27.352649688720703, "global_step": 555722, "epoch": 6695} {"train_loss": -27.49755859375, "global_step": 555723, "epoch": 6695} {"train_loss": -28.0039119720459, "global_step": 555724, "epoch": 6695} {"train_loss": -27.58967399597168, "global_step": 555725, "epoch": 6695} {"train_loss": -27.325576782226562, "global_step": 555726, "epoch": 6695} {"train_loss": -27.3539981842041, "global_step": 555727, "epoch": 6695} {"train_loss": -27.7237491607666, "global_step": 555728, "epoch": 6695} {"train_loss": -27.340850830078125, "global_step": 555729, "epoch": 6695} {"train_loss": -27.5170841217041, "global_step": 555730, "epoch": 6695} {"train_loss": -28.044296264648438, "global_step": 555731, "epoch": 6695} {"train_loss": -27.694181442260742, "global_step": 555732, "epoch": 6695} {"train_loss": -27.96807289123535, "global_step": 555733, "epoch": 6695} {"train_loss": -28.08698844909668, "global_step": 555734, "epoch": 6695} {"train_loss": -27.594648361206055, "global_step": 555735, "epoch": 6695} {"train_loss": -27.489294052124023, "global_step": 555736, "epoch": 6695} {"train_loss": -27.936803817749023, "global_step": 555737, "epoch": 6695} {"train_loss": -27.628286361694336, "global_step": 555738, "epoch": 6695} {"train_loss": -27.779804229736328, "global_step": 555739, "epoch": 6695} {"train_loss": -28.079147338867188, "global_step": 555740, "epoch": 6695} {"train_loss": -27.81702995300293, "global_step": 555741, "epoch": 6695} {"train_loss": -27.975879669189453, "global_step": 555742, "epoch": 6695} {"train_loss": -27.66669273376465, "global_step": 555743, "epoch": 6695} {"train_loss": -27.581775665283203, "global_step": 555744, "epoch": 6695} {"train_loss": -27.511310577392578, "global_step": 555745, "epoch": 6695} {"train_loss": -27.468597412109375, "global_step": 555746, "epoch": 6695} {"train_loss": -27.238187789916992, "global_step": 555747, "epoch": 6695} {"train_loss": -27.505701065063477, "global_step": 555748, "epoch": 6695} {"train_loss": -27.370014190673828, "global_step": 555749, "epoch": 6695} {"train_loss": -27.754486083984375, "global_step": 555750, "epoch": 6695} {"train_loss": -28.13006019592285, "global_step": 555751, "epoch": 6695} {"train_loss": -28.248090744018555, "global_step": 555752, "epoch": 6695} {"train_loss": -27.362720489501953, "global_step": 555753, "epoch": 6695} {"train_loss": -27.489599227905273, "global_step": 555754, "epoch": 6695} {"train_loss": -27.79866600036621, "global_step": 555755, "epoch": 6695} {"train_loss": -27.769437789916992, "global_step": 555756, "epoch": 6695} {"train_loss": -28.113317489624023, "global_step": 555757, "epoch": 6695} {"train_loss": -27.956073760986328, "global_step": 555758, "epoch": 6695} {"train_loss": -28.081588745117188, "global_step": 555759, "epoch": 6695} {"train_loss": -28.003820419311523, "global_step": 555760, "epoch": 6695} {"train_loss": -27.883319854736328, "global_step": 555761, "epoch": 6695} {"train_loss": -27.984725952148438, "global_step": 555762, "epoch": 6695} {"train_loss": -28.04721450805664, "global_step": 555763, "epoch": 6695} {"train_loss": -27.915258407592773, "global_step": 555764, "epoch": 6695} {"train_loss": -27.946796417236328, "global_step": 555765, "epoch": 6695} {"train_loss": -28.0610408782959, "global_step": 555766, "epoch": 6695} {"train_loss": -27.44576111759048, "global_step": 555767, "epoch": 6695, "val_loss": 6420906.0} {"train_loss": -26.989233016967773, "global_step": 555768, "epoch": 6696} {"train_loss": -25.387060165405273, "global_step": 555769, "epoch": 6696} {"train_loss": -26.699726104736328, "global_step": 555770, "epoch": 6696} {"train_loss": -26.66156578063965, "global_step": 555771, "epoch": 6696} {"train_loss": -26.130985260009766, "global_step": 555772, "epoch": 6696} {"train_loss": -27.010908126831055, "global_step": 555773, "epoch": 6696} {"train_loss": -26.39276123046875, "global_step": 555774, "epoch": 6696} {"train_loss": -26.82118797302246, "global_step": 555775, "epoch": 6696} {"train_loss": -27.216989517211914, "global_step": 555776, "epoch": 6696} {"train_loss": -26.782318115234375, "global_step": 555777, "epoch": 6696} {"train_loss": -27.01593589782715, "global_step": 555778, "epoch": 6696} {"train_loss": -27.06243896484375, "global_step": 555779, "epoch": 6696} {"train_loss": -27.174686431884766, "global_step": 555780, "epoch": 6696} {"train_loss": -26.85519790649414, "global_step": 555781, "epoch": 6696} {"train_loss": -27.37129020690918, "global_step": 555782, "epoch": 6696} {"train_loss": -27.442548751831055, "global_step": 555783, "epoch": 6696} {"train_loss": -27.479711532592773, "global_step": 555784, "epoch": 6696} {"train_loss": -27.466861724853516, "global_step": 555785, "epoch": 6696} {"train_loss": -27.370275497436523, "global_step": 555786, "epoch": 6696} {"train_loss": -27.52500343322754, "global_step": 555787, "epoch": 6696} {"train_loss": -27.48667335510254, "global_step": 555788, "epoch": 6696} {"train_loss": -27.580005645751953, "global_step": 555789, "epoch": 6696} {"train_loss": -27.684757232666016, "global_step": 555790, "epoch": 6696} {"train_loss": -27.444822311401367, "global_step": 555791, "epoch": 6696} {"train_loss": -27.91663932800293, "global_step": 555792, "epoch": 6696} {"train_loss": -27.56825065612793, "global_step": 555793, "epoch": 6696} {"train_loss": -28.001672744750977, "global_step": 555794, "epoch": 6696} {"train_loss": -27.519628524780273, "global_step": 555795, "epoch": 6696} {"train_loss": -27.858600616455078, "global_step": 555796, "epoch": 6696} {"train_loss": -27.43320655822754, "global_step": 555797, "epoch": 6696} {"train_loss": -27.59220314025879, "global_step": 555798, "epoch": 6696} {"train_loss": -27.2515811920166, "global_step": 555799, "epoch": 6696} {"train_loss": -28.21186637878418, "global_step": 555800, "epoch": 6696} {"train_loss": -27.8156795501709, "global_step": 555801, "epoch": 6696} {"train_loss": -27.540048599243164, "global_step": 555802, "epoch": 6696} {"train_loss": -27.8543758392334, "global_step": 555803, "epoch": 6696} {"train_loss": -27.859472274780273, "global_step": 555804, "epoch": 6696} {"train_loss": -27.838571548461914, "global_step": 555805, "epoch": 6696} {"train_loss": -27.598981857299805, "global_step": 555806, "epoch": 6696} {"train_loss": -27.84930992126465, "global_step": 555807, "epoch": 6696} {"train_loss": -27.71270751953125, "global_step": 555808, "epoch": 6696} {"train_loss": -27.646472930908203, "global_step": 555809, "epoch": 6696} {"train_loss": -27.80672264099121, "global_step": 555810, "epoch": 6696} {"train_loss": -27.723739624023438, "global_step": 555811, "epoch": 6696} {"train_loss": -28.0114803314209, "global_step": 555812, "epoch": 6696} {"train_loss": -27.77437400817871, "global_step": 555813, "epoch": 6696} {"train_loss": -27.8121395111084, "global_step": 555814, "epoch": 6696} {"train_loss": -27.73020362854004, "global_step": 555815, "epoch": 6696} {"train_loss": -27.627172470092773, "global_step": 555816, "epoch": 6696} {"train_loss": -27.928791046142578, "global_step": 555817, "epoch": 6696} {"train_loss": -27.29861831665039, "global_step": 555818, "epoch": 6696} {"train_loss": -27.30083656311035, "global_step": 555819, "epoch": 6696} {"train_loss": -27.84157371520996, "global_step": 555820, "epoch": 6696} {"train_loss": -28.1134090423584, "global_step": 555821, "epoch": 6696} {"train_loss": -28.05451011657715, "global_step": 555822, "epoch": 6696} {"train_loss": -27.72086524963379, "global_step": 555823, "epoch": 6696} {"train_loss": -28.178516387939453, "global_step": 555824, "epoch": 6696} {"train_loss": -27.611963272094727, "global_step": 555825, "epoch": 6696} {"train_loss": -27.662084579467773, "global_step": 555826, "epoch": 6696} {"train_loss": -27.8394832611084, "global_step": 555827, "epoch": 6696} {"train_loss": -28.091699600219727, "global_step": 555828, "epoch": 6696} {"train_loss": -27.832860946655273, "global_step": 555829, "epoch": 6696} {"train_loss": -28.133634567260742, "global_step": 555830, "epoch": 6696} {"train_loss": -28.005075454711914, "global_step": 555831, "epoch": 6696} {"train_loss": -27.774335861206055, "global_step": 555832, "epoch": 6696} {"train_loss": -27.44930076599121, "global_step": 555833, "epoch": 6696} {"train_loss": -27.902372360229492, "global_step": 555834, "epoch": 6696} {"train_loss": -27.740036010742188, "global_step": 555835, "epoch": 6696} {"train_loss": -28.1160831451416, "global_step": 555836, "epoch": 6696} {"train_loss": -28.045856475830078, "global_step": 555837, "epoch": 6696} {"train_loss": -27.780630111694336, "global_step": 555838, "epoch": 6696} {"train_loss": -27.99519157409668, "global_step": 555839, "epoch": 6696} {"train_loss": -28.060998916625977, "global_step": 555840, "epoch": 6696} {"train_loss": -27.907323837280273, "global_step": 555841, "epoch": 6696} {"train_loss": -27.705469131469727, "global_step": 555842, "epoch": 6696} {"train_loss": -27.77753257751465, "global_step": 555843, "epoch": 6696} {"train_loss": -28.009052276611328, "global_step": 555844, "epoch": 6696} {"train_loss": -27.841405868530273, "global_step": 555845, "epoch": 6696} {"train_loss": -27.52338218688965, "global_step": 555846, "epoch": 6696} {"train_loss": -27.62653923034668, "global_step": 555847, "epoch": 6696} {"train_loss": -27.596410751342773, "global_step": 555848, "epoch": 6696} {"train_loss": -27.631555557250977, "global_step": 555849, "epoch": 6696} {"train_loss": -27.554080848234246, "global_step": 555850, "epoch": 6696, "val_loss": 6404862.5} {"train_loss": -26.740936279296875, "global_step": 555851, "epoch": 6697} {"train_loss": -26.948877334594727, "global_step": 555852, "epoch": 6697} {"train_loss": -26.979938507080078, "global_step": 555853, "epoch": 6697} {"train_loss": -27.551645278930664, "global_step": 555854, "epoch": 6697} {"train_loss": -27.706838607788086, "global_step": 555855, "epoch": 6697} {"train_loss": -27.222980499267578, "global_step": 555856, "epoch": 6697} {"train_loss": -27.6772403717041, "global_step": 555857, "epoch": 6697} {"train_loss": -27.358800888061523, "global_step": 555858, "epoch": 6697} {"train_loss": -27.461780548095703, "global_step": 555859, "epoch": 6697} {"train_loss": -27.47733497619629, "global_step": 555860, "epoch": 6697} {"train_loss": -27.756250381469727, "global_step": 555861, "epoch": 6697} {"train_loss": -27.383604049682617, "global_step": 555862, "epoch": 6697} {"train_loss": -27.73312759399414, "global_step": 555863, "epoch": 6697} {"train_loss": -27.446582794189453, "global_step": 555864, "epoch": 6697} {"train_loss": -27.451196670532227, "global_step": 555865, "epoch": 6697} {"train_loss": -27.36714744567871, "global_step": 555866, "epoch": 6697} {"train_loss": -27.905807495117188, "global_step": 555867, "epoch": 6697} {"train_loss": -27.61297607421875, "global_step": 555868, "epoch": 6697} {"train_loss": -27.95709228515625, "global_step": 555869, "epoch": 6697} {"train_loss": -27.444807052612305, "global_step": 555870, "epoch": 6697} {"train_loss": -27.730316162109375, "global_step": 555871, "epoch": 6697} {"train_loss": -28.093870162963867, "global_step": 555872, "epoch": 6697} {"train_loss": -27.689306259155273, "global_step": 555873, "epoch": 6697} {"train_loss": -27.879669189453125, "global_step": 555874, "epoch": 6697} {"train_loss": -27.960296630859375, "global_step": 555875, "epoch": 6697} {"train_loss": -27.670276641845703, "global_step": 555876, "epoch": 6697} {"train_loss": -27.710800170898438, "global_step": 555877, "epoch": 6697} {"train_loss": -27.6544246673584, "global_step": 555878, "epoch": 6697} {"train_loss": -27.84186363220215, "global_step": 555879, "epoch": 6697} {"train_loss": -27.42432975769043, "global_step": 555880, "epoch": 6697} {"train_loss": -27.817523956298828, "global_step": 555881, "epoch": 6697} {"train_loss": -28.035863876342773, "global_step": 555882, "epoch": 6697} {"train_loss": -28.20639991760254, "global_step": 555883, "epoch": 6697} {"train_loss": -28.007110595703125, "global_step": 555884, "epoch": 6697} {"train_loss": -27.879606246948242, "global_step": 555885, "epoch": 6697} {"train_loss": -27.920618057250977, "global_step": 555886, "epoch": 6697} {"train_loss": -27.910144805908203, "global_step": 555887, "epoch": 6697} {"train_loss": -28.224462509155273, "global_step": 555888, "epoch": 6697} {"train_loss": -27.90626335144043, "global_step": 555889, "epoch": 6697} {"train_loss": -28.23349952697754, "global_step": 555890, "epoch": 6697} {"train_loss": -27.81119728088379, "global_step": 555891, "epoch": 6697} {"train_loss": -27.73687744140625, "global_step": 555892, "epoch": 6697} {"train_loss": -28.188032150268555, "global_step": 555893, "epoch": 6697} {"train_loss": -27.479001998901367, "global_step": 555894, "epoch": 6697} {"train_loss": -28.074689865112305, "global_step": 555895, "epoch": 6697} {"train_loss": -28.170148849487305, "global_step": 555896, "epoch": 6697} {"train_loss": -27.872594833374023, "global_step": 555897, "epoch": 6697} {"train_loss": -27.728452682495117, "global_step": 555898, "epoch": 6697} {"train_loss": -27.599884033203125, "global_step": 555899, "epoch": 6697} {"train_loss": -27.82364845275879, "global_step": 555900, "epoch": 6697} {"train_loss": -27.5909423828125, "global_step": 555901, "epoch": 6697} {"train_loss": -27.66015625, "global_step": 555902, "epoch": 6697} {"train_loss": -27.610137939453125, "global_step": 555903, "epoch": 6697} {"train_loss": -27.147708892822266, "global_step": 555904, "epoch": 6697} {"train_loss": -27.138456344604492, "global_step": 555905, "epoch": 6697} {"train_loss": -27.288379669189453, "global_step": 555906, "epoch": 6697} {"train_loss": -28.272125244140625, "global_step": 555907, "epoch": 6697} {"train_loss": -27.573566436767578, "global_step": 555908, "epoch": 6697} {"train_loss": -27.011199951171875, "global_step": 555909, "epoch": 6697} {"train_loss": -27.330474853515625, "global_step": 555910, "epoch": 6697} {"train_loss": -27.8288631439209, "global_step": 555911, "epoch": 6697} {"train_loss": -27.866636276245117, "global_step": 555912, "epoch": 6697} {"train_loss": -27.663999557495117, "global_step": 555913, "epoch": 6697} {"train_loss": -27.75626564025879, "global_step": 555914, "epoch": 6697} {"train_loss": -27.742446899414062, "global_step": 555915, "epoch": 6697} {"train_loss": -27.65340232849121, "global_step": 555916, "epoch": 6697} {"train_loss": -27.7907657623291, "global_step": 555917, "epoch": 6697} {"train_loss": -27.447479248046875, "global_step": 555918, "epoch": 6697} {"train_loss": -28.071359634399414, "global_step": 555919, "epoch": 6697} {"train_loss": -27.964345932006836, "global_step": 555920, "epoch": 6697} {"train_loss": -27.496931076049805, "global_step": 555921, "epoch": 6697} {"train_loss": -27.56415367126465, "global_step": 555922, "epoch": 6697} {"train_loss": -27.90768814086914, "global_step": 555923, "epoch": 6697} {"train_loss": -27.411046981811523, "global_step": 555924, "epoch": 6697} {"train_loss": -27.92460060119629, "global_step": 555925, "epoch": 6697} {"train_loss": -27.59673500061035, "global_step": 555926, "epoch": 6697} {"train_loss": -27.581571578979492, "global_step": 555927, "epoch": 6697} {"train_loss": -27.414831161499023, "global_step": 555928, "epoch": 6697} {"train_loss": -27.966217041015625, "global_step": 555929, "epoch": 6697} {"train_loss": -27.32330322265625, "global_step": 555930, "epoch": 6697} {"train_loss": -27.52327537536621, "global_step": 555931, "epoch": 6697} {"train_loss": -27.689367294311523, "global_step": 555932, "epoch": 6697} {"train_loss": -27.684256680040473, "global_step": 555933, "epoch": 6697, "val_loss": 6450184.0} {"train_loss": -27.258758544921875, "global_step": 555934, "epoch": 6698} {"train_loss": -26.563953399658203, "global_step": 555935, "epoch": 6698} {"train_loss": -27.3291015625, "global_step": 555936, "epoch": 6698} {"train_loss": -27.20440673828125, "global_step": 555937, "epoch": 6698} {"train_loss": -27.216665267944336, "global_step": 555938, "epoch": 6698} {"train_loss": -26.95448112487793, "global_step": 555939, "epoch": 6698} {"train_loss": -27.453027725219727, "global_step": 555940, "epoch": 6698} {"train_loss": -27.496734619140625, "global_step": 555941, "epoch": 6698} {"train_loss": -27.384033203125, "global_step": 555942, "epoch": 6698} {"train_loss": -27.669652938842773, "global_step": 555943, "epoch": 6698} {"train_loss": -27.381616592407227, "global_step": 555944, "epoch": 6698} {"train_loss": -27.986982345581055, "global_step": 555945, "epoch": 6698} {"train_loss": -27.830366134643555, "global_step": 555946, "epoch": 6698} {"train_loss": -27.54587173461914, "global_step": 555947, "epoch": 6698} {"train_loss": -27.349491119384766, "global_step": 555948, "epoch": 6698} {"train_loss": -27.662647247314453, "global_step": 555949, "epoch": 6698} {"train_loss": -27.499364852905273, "global_step": 555950, "epoch": 6698} {"train_loss": -27.35743522644043, "global_step": 555951, "epoch": 6698} {"train_loss": -27.52071189880371, "global_step": 555952, "epoch": 6698} {"train_loss": -27.597700119018555, "global_step": 555953, "epoch": 6698} {"train_loss": -27.67061424255371, "global_step": 555954, "epoch": 6698} {"train_loss": -27.685516357421875, "global_step": 555955, "epoch": 6698} {"train_loss": -27.590280532836914, "global_step": 555956, "epoch": 6698} {"train_loss": -27.6911678314209, "global_step": 555957, "epoch": 6698} {"train_loss": -27.60169792175293, "global_step": 555958, "epoch": 6698} {"train_loss": -27.48821449279785, "global_step": 555959, "epoch": 6698} {"train_loss": -27.524045944213867, "global_step": 555960, "epoch": 6698} {"train_loss": -27.9980411529541, "global_step": 555961, "epoch": 6698} {"train_loss": -27.84524917602539, "global_step": 555962, "epoch": 6698} {"train_loss": -27.935958862304688, "global_step": 555963, "epoch": 6698} {"train_loss": -28.04469871520996, "global_step": 555964, "epoch": 6698} {"train_loss": -27.7515869140625, "global_step": 555965, "epoch": 6698} {"train_loss": -27.82122802734375, "global_step": 555966, "epoch": 6698} {"train_loss": -27.99566650390625, "global_step": 555967, "epoch": 6698} {"train_loss": -27.927276611328125, "global_step": 555968, "epoch": 6698} {"train_loss": -27.41805076599121, "global_step": 555969, "epoch": 6698} {"train_loss": -27.5079402923584, "global_step": 555970, "epoch": 6698} {"train_loss": -27.922876358032227, "global_step": 555971, "epoch": 6698} {"train_loss": -27.92441749572754, "global_step": 555972, "epoch": 6698} {"train_loss": -27.478342056274414, "global_step": 555973, "epoch": 6698} {"train_loss": -27.980512619018555, "global_step": 555974, "epoch": 6698} {"train_loss": -27.904541015625, "global_step": 555975, "epoch": 6698} {"train_loss": -27.899457931518555, "global_step": 555976, "epoch": 6698} {"train_loss": -27.749963760375977, "global_step": 555977, "epoch": 6698} {"train_loss": -27.69111442565918, "global_step": 555978, "epoch": 6698} {"train_loss": -27.62116813659668, "global_step": 555979, "epoch": 6698} {"train_loss": -27.984235763549805, "global_step": 555980, "epoch": 6698} {"train_loss": -27.813573837280273, "global_step": 555981, "epoch": 6698} {"train_loss": -27.82423210144043, "global_step": 555982, "epoch": 6698} {"train_loss": -27.507923126220703, "global_step": 555983, "epoch": 6698} {"train_loss": -27.55328369140625, "global_step": 555984, "epoch": 6698} {"train_loss": -27.748083114624023, "global_step": 555985, "epoch": 6698} {"train_loss": -27.945993423461914, "global_step": 555986, "epoch": 6698} {"train_loss": -27.94443130493164, "global_step": 555987, "epoch": 6698} {"train_loss": -27.621387481689453, "global_step": 555988, "epoch": 6698} {"train_loss": -27.633533477783203, "global_step": 555989, "epoch": 6698} {"train_loss": -27.6697998046875, "global_step": 555990, "epoch": 6698} {"train_loss": -27.68995475769043, "global_step": 555991, "epoch": 6698} {"train_loss": -27.856916427612305, "global_step": 555992, "epoch": 6698} {"train_loss": -27.665327072143555, "global_step": 555993, "epoch": 6698} {"train_loss": -27.75737953186035, "global_step": 555994, "epoch": 6698} {"train_loss": -27.325336456298828, "global_step": 555995, "epoch": 6698} {"train_loss": -27.3544979095459, "global_step": 555996, "epoch": 6698} {"train_loss": -27.880142211914062, "global_step": 555997, "epoch": 6698} {"train_loss": -27.6854248046875, "global_step": 555998, "epoch": 6698} {"train_loss": -27.495275497436523, "global_step": 555999, "epoch": 6698} {"train_loss": -27.209735870361328, "global_step": 556000, "epoch": 6698} {"train_loss": -27.848596572875977, "global_step": 556001, "epoch": 6698} {"train_loss": -27.780282974243164, "global_step": 556002, "epoch": 6698} {"train_loss": -27.518524169921875, "global_step": 556003, "epoch": 6698} {"train_loss": -27.371673583984375, "global_step": 556004, "epoch": 6698} {"train_loss": -27.734067916870117, "global_step": 556005, "epoch": 6698} {"train_loss": -28.149097442626953, "global_step": 556006, "epoch": 6698} {"train_loss": -27.688440322875977, "global_step": 556007, "epoch": 6698} {"train_loss": -27.68048095703125, "global_step": 556008, "epoch": 6698} {"train_loss": -28.20735740661621, "global_step": 556009, "epoch": 6698} {"train_loss": -27.886810302734375, "global_step": 556010, "epoch": 6698} {"train_loss": -27.87078857421875, "global_step": 556011, "epoch": 6698} {"train_loss": -27.79046058654785, "global_step": 556012, "epoch": 6698} {"train_loss": -27.652240753173828, "global_step": 556013, "epoch": 6698} {"train_loss": -28.024566650390625, "global_step": 556014, "epoch": 6698} {"train_loss": -27.744665145874023, "global_step": 556015, "epoch": 6698} {"train_loss": -27.653539220970796, "global_step": 556016, "epoch": 6698, "val_loss": 6423781.0} {"train_loss": -25.664403915405273, "global_step": 556017, "epoch": 6699} {"train_loss": -24.52090835571289, "global_step": 556018, "epoch": 6699} {"train_loss": -26.797683715820312, "global_step": 556019, "epoch": 6699} {"train_loss": -26.789213180541992, "global_step": 556020, "epoch": 6699} {"train_loss": -26.643936157226562, "global_step": 556021, "epoch": 6699} {"train_loss": -27.065509796142578, "global_step": 556022, "epoch": 6699} {"train_loss": -27.130231857299805, "global_step": 556023, "epoch": 6699} {"train_loss": -26.952198028564453, "global_step": 556024, "epoch": 6699} {"train_loss": -27.310489654541016, "global_step": 556025, "epoch": 6699} {"train_loss": -27.18975830078125, "global_step": 556026, "epoch": 6699} {"train_loss": -27.163288116455078, "global_step": 556027, "epoch": 6699} {"train_loss": -27.1751766204834, "global_step": 556028, "epoch": 6699} {"train_loss": -26.885955810546875, "global_step": 556029, "epoch": 6699} {"train_loss": -27.090421676635742, "global_step": 556030, "epoch": 6699} {"train_loss": -27.02577781677246, "global_step": 556031, "epoch": 6699} {"train_loss": -27.243549346923828, "global_step": 556032, "epoch": 6699} {"train_loss": -27.337697982788086, "global_step": 556033, "epoch": 6699} {"train_loss": -27.519031524658203, "global_step": 556034, "epoch": 6699} {"train_loss": -27.687259674072266, "global_step": 556035, "epoch": 6699} {"train_loss": -27.069538116455078, "global_step": 556036, "epoch": 6699} {"train_loss": -27.96625328063965, "global_step": 556037, "epoch": 6699} {"train_loss": -27.337020874023438, "global_step": 556038, "epoch": 6699} {"train_loss": -27.143142700195312, "global_step": 556039, "epoch": 6699} {"train_loss": -27.401325225830078, "global_step": 556040, "epoch": 6699} {"train_loss": -27.622785568237305, "global_step": 556041, "epoch": 6699} {"train_loss": -27.3934268951416, "global_step": 556042, "epoch": 6699} {"train_loss": -27.7825870513916, "global_step": 556043, "epoch": 6699} {"train_loss": -27.691787719726562, "global_step": 556044, "epoch": 6699} {"train_loss": -27.580236434936523, "global_step": 556045, "epoch": 6699} {"train_loss": -27.444257736206055, "global_step": 556046, "epoch": 6699} {"train_loss": -27.546127319335938, "global_step": 556047, "epoch": 6699} {"train_loss": -27.779315948486328, "global_step": 556048, "epoch": 6699} {"train_loss": -27.551807403564453, "global_step": 556049, "epoch": 6699} {"train_loss": -27.78083610534668, "global_step": 556050, "epoch": 6699} {"train_loss": -27.834070205688477, "global_step": 556051, "epoch": 6699} {"train_loss": -27.939228057861328, "global_step": 556052, "epoch": 6699} {"train_loss": -27.717756271362305, "global_step": 556053, "epoch": 6699} {"train_loss": -27.8904972076416, "global_step": 556054, "epoch": 6699} {"train_loss": -27.704193115234375, "global_step": 556055, "epoch": 6699} {"train_loss": -27.650379180908203, "global_step": 556056, "epoch": 6699} {"train_loss": -27.908618927001953, "global_step": 556057, "epoch": 6699} {"train_loss": -27.75221061706543, "global_step": 556058, "epoch": 6699} {"train_loss": -27.88166618347168, "global_step": 556059, "epoch": 6699} {"train_loss": -28.3599853515625, "global_step": 556060, "epoch": 6699} {"train_loss": -28.084165573120117, "global_step": 556061, "epoch": 6699} {"train_loss": -28.151172637939453, "global_step": 556062, "epoch": 6699} {"train_loss": -27.769681930541992, "global_step": 556063, "epoch": 6699} {"train_loss": -27.820377349853516, "global_step": 556064, "epoch": 6699} {"train_loss": -27.651493072509766, "global_step": 556065, "epoch": 6699} {"train_loss": -27.289600372314453, "global_step": 556066, "epoch": 6699} {"train_loss": -27.62821388244629, "global_step": 556067, "epoch": 6699} {"train_loss": -27.712371826171875, "global_step": 556068, "epoch": 6699} {"train_loss": -27.618871688842773, "global_step": 556069, "epoch": 6699} {"train_loss": -27.9417781829834, "global_step": 556070, "epoch": 6699} {"train_loss": -27.863370895385742, "global_step": 556071, "epoch": 6699} {"train_loss": -27.29743003845215, "global_step": 556072, "epoch": 6699} {"train_loss": -27.378461837768555, "global_step": 556073, "epoch": 6699} {"train_loss": -27.466333389282227, "global_step": 556074, "epoch": 6699} {"train_loss": -27.98420524597168, "global_step": 556075, "epoch": 6699} {"train_loss": -27.458160400390625, "global_step": 556076, "epoch": 6699} {"train_loss": -27.7460994720459, "global_step": 556077, "epoch": 6699} {"train_loss": -27.005584716796875, "global_step": 556078, "epoch": 6699} {"train_loss": -27.71346092224121, "global_step": 556079, "epoch": 6699} {"train_loss": -27.393171310424805, "global_step": 556080, "epoch": 6699} {"train_loss": -27.234399795532227, "global_step": 556081, "epoch": 6699} {"train_loss": -27.706884384155273, "global_step": 556082, "epoch": 6699} {"train_loss": -27.516809463500977, "global_step": 556083, "epoch": 6699} {"train_loss": -27.654077529907227, "global_step": 556084, "epoch": 6699} {"train_loss": -27.70857048034668, "global_step": 556085, "epoch": 6699} {"train_loss": -27.910261154174805, "global_step": 556086, "epoch": 6699} {"train_loss": -27.721586227416992, "global_step": 556087, "epoch": 6699} {"train_loss": -27.701339721679688, "global_step": 556088, "epoch": 6699} {"train_loss": -27.949445724487305, "global_step": 556089, "epoch": 6699} {"train_loss": -27.626556396484375, "global_step": 556090, "epoch": 6699} {"train_loss": -27.868499755859375, "global_step": 556091, "epoch": 6699} {"train_loss": -27.69013786315918, "global_step": 556092, "epoch": 6699} {"train_loss": -28.02850914001465, "global_step": 556093, "epoch": 6699} {"train_loss": -27.7977294921875, "global_step": 556094, "epoch": 6699} {"train_loss": -27.836002349853516, "global_step": 556095, "epoch": 6699} {"train_loss": -27.81304931640625, "global_step": 556096, "epoch": 6699} {"train_loss": -28.054346084594727, "global_step": 556097, "epoch": 6699} {"train_loss": -28.160276412963867, "global_step": 556098, "epoch": 6699} {"train_loss": -27.50616873316018, "global_step": 556099, "epoch": 6699, "val_loss": 6410354.0} {"train_loss": -27.689743041992188, "global_step": 556100, "epoch": 6700} {"train_loss": -28.009923934936523, "global_step": 556101, "epoch": 6700} {"train_loss": -27.627368927001953, "global_step": 556102, "epoch": 6700} {"train_loss": -27.83365821838379, "global_step": 556103, "epoch": 6700} {"train_loss": -28.027124404907227, "global_step": 556104, "epoch": 6700} {"train_loss": -27.148468017578125, "global_step": 556105, "epoch": 6700} {"train_loss": -27.753498077392578, "global_step": 556106, "epoch": 6700} {"train_loss": -27.424789428710938, "global_step": 556107, "epoch": 6700} {"train_loss": -28.081769943237305, "global_step": 556108, "epoch": 6700} {"train_loss": -27.4169921875, "global_step": 556109, "epoch": 6700} {"train_loss": -27.712717056274414, "global_step": 556110, "epoch": 6700} {"train_loss": -27.83076286315918, "global_step": 556111, "epoch": 6700} {"train_loss": -27.35873794555664, "global_step": 556112, "epoch": 6700} {"train_loss": -28.074010848999023, "global_step": 556113, "epoch": 6700} {"train_loss": -27.73837661743164, "global_step": 556114, "epoch": 6700} {"train_loss": -27.81586265563965, "global_step": 556115, "epoch": 6700} {"train_loss": -28.011091232299805, "global_step": 556116, "epoch": 6700} {"train_loss": -27.548736572265625, "global_step": 556117, "epoch": 6700} {"train_loss": -27.842416763305664, "global_step": 556118, "epoch": 6700} {"train_loss": -27.998876571655273, "global_step": 556119, "epoch": 6700} {"train_loss": -27.80902099609375, "global_step": 556120, "epoch": 6700} {"train_loss": -27.577123641967773, "global_step": 556121, "epoch": 6700} {"train_loss": -27.62060546875, "global_step": 556122, "epoch": 6700} {"train_loss": -27.5535831451416, "global_step": 556123, "epoch": 6700} {"train_loss": -27.511581420898438, "global_step": 556124, "epoch": 6700} {"train_loss": -27.59344482421875, "global_step": 556125, "epoch": 6700} {"train_loss": -27.880056381225586, "global_step": 556126, "epoch": 6700} {"train_loss": -27.301898956298828, "global_step": 556127, "epoch": 6700} {"train_loss": -27.4835262298584, "global_step": 556128, "epoch": 6700} {"train_loss": -28.2944393157959, "global_step": 556129, "epoch": 6700} {"train_loss": -27.730331420898438, "global_step": 556130, "epoch": 6700} {"train_loss": -27.65500831604004, "global_step": 556131, "epoch": 6700} {"train_loss": -28.075780868530273, "global_step": 556132, "epoch": 6700} {"train_loss": -27.872268676757812, "global_step": 556133, "epoch": 6700} {"train_loss": -27.651968002319336, "global_step": 556134, "epoch": 6700} {"train_loss": -27.99335289001465, "global_step": 556135, "epoch": 6700} {"train_loss": -27.816770553588867, "global_step": 556136, "epoch": 6700} {"train_loss": -27.66401481628418, "global_step": 556137, "epoch": 6700} {"train_loss": -27.39034080505371, "global_step": 556138, "epoch": 6700} {"train_loss": -27.593338012695312, "global_step": 556139, "epoch": 6700} {"train_loss": -27.80791664123535, "global_step": 556140, "epoch": 6700} {"train_loss": -27.52554702758789, "global_step": 556141, "epoch": 6700} {"train_loss": -27.703519821166992, "global_step": 556142, "epoch": 6700} {"train_loss": -27.70868492126465, "global_step": 556143, "epoch": 6700} {"train_loss": -27.799413681030273, "global_step": 556144, "epoch": 6700} {"train_loss": -27.324405670166016, "global_step": 556145, "epoch": 6700} {"train_loss": -27.601974487304688, "global_step": 556146, "epoch": 6700} {"train_loss": -27.8339900970459, "global_step": 556147, "epoch": 6700} {"train_loss": -27.779706954956055, "global_step": 556148, "epoch": 6700} {"train_loss": -27.62336540222168, "global_step": 556149, "epoch": 6700} {"train_loss": -28.062152862548828, "global_step": 556150, "epoch": 6700} {"train_loss": -27.812427520751953, "global_step": 556151, "epoch": 6700} {"train_loss": -27.93621826171875, "global_step": 556152, "epoch": 6700} {"train_loss": -28.03251075744629, "global_step": 556153, "epoch": 6700} {"train_loss": -27.530914306640625, "global_step": 556154, "epoch": 6700} {"train_loss": -27.53260612487793, "global_step": 556155, "epoch": 6700} {"train_loss": -27.307748794555664, "global_step": 556156, "epoch": 6700} {"train_loss": -27.47900390625, "global_step": 556157, "epoch": 6700} {"train_loss": -27.828109741210938, "global_step": 556158, "epoch": 6700} {"train_loss": -27.816486358642578, "global_step": 556159, "epoch": 6700} {"train_loss": -27.9800968170166, "global_step": 556160, "epoch": 6700} {"train_loss": -27.953229904174805, "global_step": 556161, "epoch": 6700} {"train_loss": -27.565107345581055, "global_step": 556162, "epoch": 6700} {"train_loss": -27.717273712158203, "global_step": 556163, "epoch": 6700} {"train_loss": -27.977249145507812, "global_step": 556164, "epoch": 6700} {"train_loss": -27.791507720947266, "global_step": 556165, "epoch": 6700} {"train_loss": -28.063358306884766, "global_step": 556166, "epoch": 6700} {"train_loss": -27.993335723876953, "global_step": 556167, "epoch": 6700} {"train_loss": -27.956018447875977, "global_step": 556168, "epoch": 6700} {"train_loss": -27.738510131835938, "global_step": 556169, "epoch": 6700} {"train_loss": -27.98577308654785, "global_step": 556170, "epoch": 6700} {"train_loss": -27.767749786376953, "global_step": 556171, "epoch": 6700} {"train_loss": -28.054418563842773, "global_step": 556172, "epoch": 6700} {"train_loss": -27.450586318969727, "global_step": 556173, "epoch": 6700} {"train_loss": -27.48213005065918, "global_step": 556174, "epoch": 6700} {"train_loss": -27.970563888549805, "global_step": 556175, "epoch": 6700} {"train_loss": -27.460540771484375, "global_step": 556176, "epoch": 6700} {"train_loss": -27.434284210205078, "global_step": 556177, "epoch": 6700} {"train_loss": -27.75762939453125, "global_step": 556178, "epoch": 6700} {"train_loss": -27.45253562927246, "global_step": 556179, "epoch": 6700} {"train_loss": -27.66254997253418, "global_step": 556180, "epoch": 6700} {"train_loss": -27.85304069519043, "global_step": 556181, "epoch": 6700} {"train_loss": -27.714442126722222, "global_step": 556182, "epoch": 6700, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.8181818181818182, "val_loss": 6411473.5} {"train_loss": -27.260730743408203, "global_step": 556183, "epoch": 6701} {"train_loss": -25.299510955810547, "global_step": 556184, "epoch": 6701} {"train_loss": -25.453046798706055, "global_step": 556185, "epoch": 6701} {"train_loss": -24.24207878112793, "global_step": 556186, "epoch": 6701} {"train_loss": -25.876317977905273, "global_step": 556187, "epoch": 6701} {"train_loss": -26.7303524017334, "global_step": 556188, "epoch": 6701} {"train_loss": -26.235990524291992, "global_step": 556189, "epoch": 6701} {"train_loss": -26.723180770874023, "global_step": 556190, "epoch": 6701} {"train_loss": -26.386234283447266, "global_step": 556191, "epoch": 6701} {"train_loss": -26.675878524780273, "global_step": 556192, "epoch": 6701} {"train_loss": -26.73868179321289, "global_step": 556193, "epoch": 6701} {"train_loss": -26.697223663330078, "global_step": 556194, "epoch": 6701} {"train_loss": -26.777185440063477, "global_step": 556195, "epoch": 6701} {"train_loss": -27.016138076782227, "global_step": 556196, "epoch": 6701} {"train_loss": -26.6355037689209, "global_step": 556197, "epoch": 6701} {"train_loss": -26.73712158203125, "global_step": 556198, "epoch": 6701} {"train_loss": -27.037750244140625, "global_step": 556199, "epoch": 6701} {"train_loss": -27.36295509338379, "global_step": 556200, "epoch": 6701} {"train_loss": -27.021331787109375, "global_step": 556201, "epoch": 6701} {"train_loss": -27.313032150268555, "global_step": 556202, "epoch": 6701} {"train_loss": -27.164854049682617, "global_step": 556203, "epoch": 6701} {"train_loss": -27.18732261657715, "global_step": 556204, "epoch": 6701} {"train_loss": -27.2022705078125, "global_step": 556205, "epoch": 6701} {"train_loss": -27.102270126342773, "global_step": 556206, "epoch": 6701} {"train_loss": -27.6108455657959, "global_step": 556207, "epoch": 6701} {"train_loss": -27.1038818359375, "global_step": 556208, "epoch": 6701} {"train_loss": -27.33247184753418, "global_step": 556209, "epoch": 6701} {"train_loss": -27.269439697265625, "global_step": 556210, "epoch": 6701} {"train_loss": -27.1382999420166, "global_step": 556211, "epoch": 6701} {"train_loss": -27.336889266967773, "global_step": 556212, "epoch": 6701} {"train_loss": -27.53901481628418, "global_step": 556213, "epoch": 6701} {"train_loss": -27.62295913696289, "global_step": 556214, "epoch": 6701} {"train_loss": -27.921594619750977, "global_step": 556215, "epoch": 6701} {"train_loss": -27.5338191986084, "global_step": 556216, "epoch": 6701} {"train_loss": -27.3349666595459, "global_step": 556217, "epoch": 6701} {"train_loss": -27.715229034423828, "global_step": 556218, "epoch": 6701} {"train_loss": -27.208608627319336, "global_step": 556219, "epoch": 6701} {"train_loss": -27.420108795166016, "global_step": 556220, "epoch": 6701} {"train_loss": -27.273426055908203, "global_step": 556221, "epoch": 6701} {"train_loss": -27.675769805908203, "global_step": 556222, "epoch": 6701} {"train_loss": -27.599964141845703, "global_step": 556223, "epoch": 6701} {"train_loss": -27.443960189819336, "global_step": 556224, "epoch": 6701} {"train_loss": -27.405027389526367, "global_step": 556225, "epoch": 6701} {"train_loss": -27.77569007873535, "global_step": 556226, "epoch": 6701} {"train_loss": -27.441165924072266, "global_step": 556227, "epoch": 6701} {"train_loss": -27.66534423828125, "global_step": 556228, "epoch": 6701} {"train_loss": -27.884750366210938, "global_step": 556229, "epoch": 6701} {"train_loss": -27.928760528564453, "global_step": 556230, "epoch": 6701} {"train_loss": -27.934118270874023, "global_step": 556231, "epoch": 6701} {"train_loss": -27.807804107666016, "global_step": 556232, "epoch": 6701} {"train_loss": -27.81939697265625, "global_step": 556233, "epoch": 6701} {"train_loss": -27.786334991455078, "global_step": 556234, "epoch": 6701} {"train_loss": -28.201765060424805, "global_step": 556235, "epoch": 6701} {"train_loss": -28.043197631835938, "global_step": 556236, "epoch": 6701} {"train_loss": -27.733570098876953, "global_step": 556237, "epoch": 6701} {"train_loss": -27.8814697265625, "global_step": 556238, "epoch": 6701} {"train_loss": -28.063526153564453, "global_step": 556239, "epoch": 6701} {"train_loss": -27.735584259033203, "global_step": 556240, "epoch": 6701} {"train_loss": -28.270421981811523, "global_step": 556241, "epoch": 6701} {"train_loss": -27.794702529907227, "global_step": 556242, "epoch": 6701} {"train_loss": -27.856464385986328, "global_step": 556243, "epoch": 6701} {"train_loss": -27.78660011291504, "global_step": 556244, "epoch": 6701} {"train_loss": -28.282012939453125, "global_step": 556245, "epoch": 6701} {"train_loss": -27.99127197265625, "global_step": 556246, "epoch": 6701} {"train_loss": -27.707509994506836, "global_step": 556247, "epoch": 6701} {"train_loss": -27.67595863342285, "global_step": 556248, "epoch": 6701} {"train_loss": -27.386289596557617, "global_step": 556249, "epoch": 6701} {"train_loss": -27.714208602905273, "global_step": 556250, "epoch": 6701} {"train_loss": -27.787921905517578, "global_step": 556251, "epoch": 6701} {"train_loss": -27.9366397857666, "global_step": 556252, "epoch": 6701} {"train_loss": -27.67926025390625, "global_step": 556253, "epoch": 6701} {"train_loss": -27.84956169128418, "global_step": 556254, "epoch": 6701} {"train_loss": -27.665924072265625, "global_step": 556255, "epoch": 6701} {"train_loss": -27.6531982421875, "global_step": 556256, "epoch": 6701} {"train_loss": -27.859540939331055, "global_step": 556257, "epoch": 6701} {"train_loss": -27.588266372680664, "global_step": 556258, "epoch": 6701} {"train_loss": -27.920934677124023, "global_step": 556259, "epoch": 6701} {"train_loss": -27.842056274414062, "global_step": 556260, "epoch": 6701} {"train_loss": -27.83160400390625, "global_step": 556261, "epoch": 6701} {"train_loss": -27.61688232421875, "global_step": 556262, "epoch": 6701} {"train_loss": -27.553632736206055, "global_step": 556263, "epoch": 6701} {"train_loss": -27.46245765686035, "global_step": 556264, "epoch": 6701} {"train_loss": -27.3949777074607, "global_step": 556265, "epoch": 6701, "val_loss": 6396499.5} {"train_loss": -27.92226219177246, "global_step": 556266, "epoch": 6702} {"train_loss": -27.39681053161621, "global_step": 556267, "epoch": 6702} {"train_loss": -27.295637130737305, "global_step": 556268, "epoch": 6702} {"train_loss": -27.59771728515625, "global_step": 556269, "epoch": 6702} {"train_loss": -27.408945083618164, "global_step": 556270, "epoch": 6702} {"train_loss": -27.309406280517578, "global_step": 556271, "epoch": 6702} {"train_loss": -27.52008628845215, "global_step": 556272, "epoch": 6702} {"train_loss": -27.672414779663086, "global_step": 556273, "epoch": 6702} {"train_loss": -27.208301544189453, "global_step": 556274, "epoch": 6702} {"train_loss": -27.5468692779541, "global_step": 556275, "epoch": 6702} {"train_loss": -27.3399715423584, "global_step": 556276, "epoch": 6702} {"train_loss": -27.748804092407227, "global_step": 556277, "epoch": 6702} {"train_loss": -27.9169979095459, "global_step": 556278, "epoch": 6702} {"train_loss": -27.68397331237793, "global_step": 556279, "epoch": 6702} {"train_loss": -27.529651641845703, "global_step": 556280, "epoch": 6702} {"train_loss": -27.49553871154785, "global_step": 556281, "epoch": 6702} {"train_loss": -27.707624435424805, "global_step": 556282, "epoch": 6702} {"train_loss": -27.937177658081055, "global_step": 556283, "epoch": 6702} {"train_loss": -27.956867218017578, "global_step": 556284, "epoch": 6702} {"train_loss": -27.848941802978516, "global_step": 556285, "epoch": 6702} {"train_loss": -27.702747344970703, "global_step": 556286, "epoch": 6702} {"train_loss": -27.90390968322754, "global_step": 556287, "epoch": 6702} {"train_loss": -28.008081436157227, "global_step": 556288, "epoch": 6702} {"train_loss": -27.647733688354492, "global_step": 556289, "epoch": 6702} {"train_loss": -27.704870223999023, "global_step": 556290, "epoch": 6702} {"train_loss": -27.6657772064209, "global_step": 556291, "epoch": 6702} {"train_loss": -27.8309268951416, "global_step": 556292, "epoch": 6702} {"train_loss": -27.716211318969727, "global_step": 556293, "epoch": 6702} {"train_loss": -27.900623321533203, "global_step": 556294, "epoch": 6702} {"train_loss": -28.084562301635742, "global_step": 556295, "epoch": 6702} {"train_loss": -27.855924606323242, "global_step": 556296, "epoch": 6702} {"train_loss": -27.5991268157959, "global_step": 556297, "epoch": 6702} {"train_loss": -27.80974769592285, "global_step": 556298, "epoch": 6702} {"train_loss": -27.810758590698242, "global_step": 556299, "epoch": 6702} {"train_loss": -27.173242568969727, "global_step": 556300, "epoch": 6702} {"train_loss": -27.918060302734375, "global_step": 556301, "epoch": 6702} {"train_loss": -27.731826782226562, "global_step": 556302, "epoch": 6702} {"train_loss": -27.8724365234375, "global_step": 556303, "epoch": 6702} {"train_loss": -27.733840942382812, "global_step": 556304, "epoch": 6702} {"train_loss": -27.829395294189453, "global_step": 556305, "epoch": 6702} {"train_loss": -28.049604415893555, "global_step": 556306, "epoch": 6702} {"train_loss": -28.03681755065918, "global_step": 556307, "epoch": 6702} {"train_loss": -28.046545028686523, "global_step": 556308, "epoch": 6702} {"train_loss": -27.6307373046875, "global_step": 556309, "epoch": 6702} {"train_loss": -27.624387741088867, "global_step": 556310, "epoch": 6702} {"train_loss": -27.572031021118164, "global_step": 556311, "epoch": 6702} {"train_loss": -27.796003341674805, "global_step": 556312, "epoch": 6702} {"train_loss": -27.850385665893555, "global_step": 556313, "epoch": 6702} {"train_loss": -27.58672523498535, "global_step": 556314, "epoch": 6702} {"train_loss": -27.61773109436035, "global_step": 556315, "epoch": 6702} {"train_loss": -28.03790855407715, "global_step": 556316, "epoch": 6702} {"train_loss": -27.54937171936035, "global_step": 556317, "epoch": 6702} {"train_loss": -27.606903076171875, "global_step": 556318, "epoch": 6702} {"train_loss": -27.90863037109375, "global_step": 556319, "epoch": 6702} {"train_loss": -27.920927047729492, "global_step": 556320, "epoch": 6702} {"train_loss": -27.915754318237305, "global_step": 556321, "epoch": 6702} {"train_loss": -27.857364654541016, "global_step": 556322, "epoch": 6702} {"train_loss": -27.628559112548828, "global_step": 556323, "epoch": 6702} {"train_loss": -27.852985382080078, "global_step": 556324, "epoch": 6702} {"train_loss": -27.754186630249023, "global_step": 556325, "epoch": 6702} {"train_loss": -27.526657104492188, "global_step": 556326, "epoch": 6702} {"train_loss": -27.771326065063477, "global_step": 556327, "epoch": 6702} {"train_loss": -27.902374267578125, "global_step": 556328, "epoch": 6702} {"train_loss": -28.00079345703125, "global_step": 556329, "epoch": 6702} {"train_loss": -27.662189483642578, "global_step": 556330, "epoch": 6702} {"train_loss": -27.69753074645996, "global_step": 556331, "epoch": 6702} {"train_loss": -28.10146141052246, "global_step": 556332, "epoch": 6702} {"train_loss": -28.16729736328125, "global_step": 556333, "epoch": 6702} {"train_loss": -27.13262939453125, "global_step": 556334, "epoch": 6702} {"train_loss": -27.714614868164062, "global_step": 556335, "epoch": 6702} {"train_loss": -27.99903678894043, "global_step": 556336, "epoch": 6702} {"train_loss": -28.07699966430664, "global_step": 556337, "epoch": 6702} {"train_loss": -27.699878692626953, "global_step": 556338, "epoch": 6702} {"train_loss": -27.47645378112793, "global_step": 556339, "epoch": 6702} {"train_loss": -27.45035171508789, "global_step": 556340, "epoch": 6702} {"train_loss": -27.158279418945312, "global_step": 556341, "epoch": 6702} {"train_loss": -27.706256866455078, "global_step": 556342, "epoch": 6702} {"train_loss": -27.44675636291504, "global_step": 556343, "epoch": 6702} {"train_loss": -27.435688018798828, "global_step": 556344, "epoch": 6702} {"train_loss": -27.5220947265625, "global_step": 556345, "epoch": 6702} {"train_loss": -27.641422271728516, "global_step": 556346, "epoch": 6702} {"train_loss": -27.440122604370117, "global_step": 556347, "epoch": 6702} {"train_loss": -27.716453460325678, "global_step": 556348, "epoch": 6702, "val_loss": 6375315.0} {"train_loss": -26.923419952392578, "global_step": 556349, "epoch": 6703} {"train_loss": -26.80951499938965, "global_step": 556350, "epoch": 6703} {"train_loss": -26.679187774658203, "global_step": 556351, "epoch": 6703} {"train_loss": -27.216632843017578, "global_step": 556352, "epoch": 6703} {"train_loss": -27.02726173400879, "global_step": 556353, "epoch": 6703} {"train_loss": -26.800153732299805, "global_step": 556354, "epoch": 6703} {"train_loss": -27.494403839111328, "global_step": 556355, "epoch": 6703} {"train_loss": -27.07382583618164, "global_step": 556356, "epoch": 6703} {"train_loss": -26.608890533447266, "global_step": 556357, "epoch": 6703} {"train_loss": -27.150848388671875, "global_step": 556358, "epoch": 6703} {"train_loss": -27.559934616088867, "global_step": 556359, "epoch": 6703} {"train_loss": -27.763687133789062, "global_step": 556360, "epoch": 6703} {"train_loss": -27.158466339111328, "global_step": 556361, "epoch": 6703} {"train_loss": -27.42115592956543, "global_step": 556362, "epoch": 6703} {"train_loss": -27.321918487548828, "global_step": 556363, "epoch": 6703} {"train_loss": -27.845245361328125, "global_step": 556364, "epoch": 6703} {"train_loss": -27.646198272705078, "global_step": 556365, "epoch": 6703} {"train_loss": -27.604755401611328, "global_step": 556366, "epoch": 6703} {"train_loss": -27.690189361572266, "global_step": 556367, "epoch": 6703} {"train_loss": -27.59297752380371, "global_step": 556368, "epoch": 6703} {"train_loss": -27.522907257080078, "global_step": 556369, "epoch": 6703} {"train_loss": -27.68487548828125, "global_step": 556370, "epoch": 6703} {"train_loss": -27.908294677734375, "global_step": 556371, "epoch": 6703} {"train_loss": -27.683568954467773, "global_step": 556372, "epoch": 6703} {"train_loss": -27.878772735595703, "global_step": 556373, "epoch": 6703} {"train_loss": -27.63710594177246, "global_step": 556374, "epoch": 6703} {"train_loss": -27.8786678314209, "global_step": 556375, "epoch": 6703} {"train_loss": -28.13285255432129, "global_step": 556376, "epoch": 6703} {"train_loss": -27.91969108581543, "global_step": 556377, "epoch": 6703} {"train_loss": -28.1669921875, "global_step": 556378, "epoch": 6703} {"train_loss": -27.99163818359375, "global_step": 556379, "epoch": 6703} {"train_loss": -27.504541397094727, "global_step": 556380, "epoch": 6703} {"train_loss": -28.06488037109375, "global_step": 556381, "epoch": 6703} {"train_loss": -28.002002716064453, "global_step": 556382, "epoch": 6703} {"train_loss": -27.706390380859375, "global_step": 556383, "epoch": 6703} {"train_loss": -28.219640731811523, "global_step": 556384, "epoch": 6703} {"train_loss": -27.98084831237793, "global_step": 556385, "epoch": 6703} {"train_loss": -28.214696884155273, "global_step": 556386, "epoch": 6703} {"train_loss": -27.71892738342285, "global_step": 556387, "epoch": 6703} {"train_loss": -27.9843692779541, "global_step": 556388, "epoch": 6703} {"train_loss": -28.011106491088867, "global_step": 556389, "epoch": 6703} {"train_loss": -27.917245864868164, "global_step": 556390, "epoch": 6703} {"train_loss": -27.695493698120117, "global_step": 556391, "epoch": 6703} {"train_loss": -28.08955192565918, "global_step": 556392, "epoch": 6703} {"train_loss": -28.09083366394043, "global_step": 556393, "epoch": 6703} {"train_loss": -27.912805557250977, "global_step": 556394, "epoch": 6703} {"train_loss": -28.240447998046875, "global_step": 556395, "epoch": 6703} {"train_loss": -27.933582305908203, "global_step": 556396, "epoch": 6703} {"train_loss": -27.999948501586914, "global_step": 556397, "epoch": 6703} {"train_loss": -27.87384605407715, "global_step": 556398, "epoch": 6703} {"train_loss": -28.115646362304688, "global_step": 556399, "epoch": 6703} {"train_loss": -28.050537109375, "global_step": 556400, "epoch": 6703} {"train_loss": -27.796756744384766, "global_step": 556401, "epoch": 6703} {"train_loss": -27.758569717407227, "global_step": 556402, "epoch": 6703} {"train_loss": -27.539722442626953, "global_step": 556403, "epoch": 6703} {"train_loss": -27.253833770751953, "global_step": 556404, "epoch": 6703} {"train_loss": -27.671466827392578, "global_step": 556405, "epoch": 6703} {"train_loss": -27.8590087890625, "global_step": 556406, "epoch": 6703} {"train_loss": -27.9139404296875, "global_step": 556407, "epoch": 6703} {"train_loss": -27.966419219970703, "global_step": 556408, "epoch": 6703} {"train_loss": -27.5747127532959, "global_step": 556409, "epoch": 6703} {"train_loss": -27.592878341674805, "global_step": 556410, "epoch": 6703} {"train_loss": -27.865848541259766, "global_step": 556411, "epoch": 6703} {"train_loss": -27.48931884765625, "global_step": 556412, "epoch": 6703} {"train_loss": -27.47212791442871, "global_step": 556413, "epoch": 6703} {"train_loss": -27.741668701171875, "global_step": 556414, "epoch": 6703} {"train_loss": -27.947813034057617, "global_step": 556415, "epoch": 6703} {"train_loss": -27.880624771118164, "global_step": 556416, "epoch": 6703} {"train_loss": -27.850830078125, "global_step": 556417, "epoch": 6703} {"train_loss": -27.844385147094727, "global_step": 556418, "epoch": 6703} {"train_loss": -27.7523136138916, "global_step": 556419, "epoch": 6703} {"train_loss": -27.674665451049805, "global_step": 556420, "epoch": 6703} {"train_loss": -27.791778564453125, "global_step": 556421, "epoch": 6703} {"train_loss": -28.129453659057617, "global_step": 556422, "epoch": 6703} {"train_loss": -27.79031753540039, "global_step": 556423, "epoch": 6703} {"train_loss": -27.69391441345215, "global_step": 556424, "epoch": 6703} {"train_loss": -27.75514030456543, "global_step": 556425, "epoch": 6703} {"train_loss": -28.120420455932617, "global_step": 556426, "epoch": 6703} {"train_loss": -27.759363174438477, "global_step": 556427, "epoch": 6703} {"train_loss": -27.798276901245117, "global_step": 556428, "epoch": 6703} {"train_loss": -27.622589111328125, "global_step": 556429, "epoch": 6703} {"train_loss": -27.09486961364746, "global_step": 556430, "epoch": 6703} {"train_loss": -27.71376161690218, "global_step": 556431, "epoch": 6703, "val_loss": 6496176.0} {"train_loss": -26.868927001953125, "global_step": 556432, "epoch": 6704} {"train_loss": -25.40010643005371, "global_step": 556433, "epoch": 6704} {"train_loss": -24.935386657714844, "global_step": 556434, "epoch": 6704} {"train_loss": -25.975255966186523, "global_step": 556435, "epoch": 6704} {"train_loss": -26.867935180664062, "global_step": 556436, "epoch": 6704} {"train_loss": -25.261184692382812, "global_step": 556437, "epoch": 6704} {"train_loss": -27.2793025970459, "global_step": 556438, "epoch": 6704} {"train_loss": -26.174280166625977, "global_step": 556439, "epoch": 6704} {"train_loss": -26.662841796875, "global_step": 556440, "epoch": 6704} {"train_loss": -26.351638793945312, "global_step": 556441, "epoch": 6704} {"train_loss": -26.980377197265625, "global_step": 556442, "epoch": 6704} {"train_loss": -26.578842163085938, "global_step": 556443, "epoch": 6704} {"train_loss": -26.68121337890625, "global_step": 556444, "epoch": 6704} {"train_loss": -26.805225372314453, "global_step": 556445, "epoch": 6704} {"train_loss": -26.335905075073242, "global_step": 556446, "epoch": 6704} {"train_loss": -27.263818740844727, "global_step": 556447, "epoch": 6704} {"train_loss": -26.9312686920166, "global_step": 556448, "epoch": 6704} {"train_loss": -27.25886344909668, "global_step": 556449, "epoch": 6704} {"train_loss": -27.534753799438477, "global_step": 556450, "epoch": 6704} {"train_loss": -27.154748916625977, "global_step": 556451, "epoch": 6704} {"train_loss": -27.254638671875, "global_step": 556452, "epoch": 6704} {"train_loss": -26.65230369567871, "global_step": 556453, "epoch": 6704} {"train_loss": -27.20942497253418, "global_step": 556454, "epoch": 6704} {"train_loss": -27.3087158203125, "global_step": 556455, "epoch": 6704} {"train_loss": -27.587308883666992, "global_step": 556456, "epoch": 6704} {"train_loss": -27.161640167236328, "global_step": 556457, "epoch": 6704} {"train_loss": -27.62571144104004, "global_step": 556458, "epoch": 6704} {"train_loss": -27.061786651611328, "global_step": 556459, "epoch": 6704} {"train_loss": -27.239856719970703, "global_step": 556460, "epoch": 6704} {"train_loss": -27.519168853759766, "global_step": 556461, "epoch": 6704} {"train_loss": -27.453857421875, "global_step": 556462, "epoch": 6704} {"train_loss": -27.284046173095703, "global_step": 556463, "epoch": 6704} {"train_loss": -27.383527755737305, "global_step": 556464, "epoch": 6704} {"train_loss": -27.585840225219727, "global_step": 556465, "epoch": 6704} {"train_loss": -27.364734649658203, "global_step": 556466, "epoch": 6704} {"train_loss": -27.843433380126953, "global_step": 556467, "epoch": 6704} {"train_loss": -27.642974853515625, "global_step": 556468, "epoch": 6704} {"train_loss": -28.030542373657227, "global_step": 556469, "epoch": 6704} {"train_loss": -27.547943115234375, "global_step": 556470, "epoch": 6704} {"train_loss": -27.65278434753418, "global_step": 556471, "epoch": 6704} {"train_loss": -27.727828979492188, "global_step": 556472, "epoch": 6704} {"train_loss": -27.765302658081055, "global_step": 556473, "epoch": 6704} {"train_loss": -27.465972900390625, "global_step": 556474, "epoch": 6704} {"train_loss": -28.057662963867188, "global_step": 556475, "epoch": 6704} {"train_loss": -27.791303634643555, "global_step": 556476, "epoch": 6704} {"train_loss": -28.11451530456543, "global_step": 556477, "epoch": 6704} {"train_loss": -27.874176025390625, "global_step": 556478, "epoch": 6704} {"train_loss": -28.010028839111328, "global_step": 556479, "epoch": 6704} {"train_loss": -28.162683486938477, "global_step": 556480, "epoch": 6704} {"train_loss": -27.948293685913086, "global_step": 556481, "epoch": 6704} {"train_loss": -27.855972290039062, "global_step": 556482, "epoch": 6704} {"train_loss": -27.6983699798584, "global_step": 556483, "epoch": 6704} {"train_loss": -27.762670516967773, "global_step": 556484, "epoch": 6704} {"train_loss": -28.111661911010742, "global_step": 556485, "epoch": 6704} {"train_loss": -27.98842430114746, "global_step": 556486, "epoch": 6704} {"train_loss": -27.94870376586914, "global_step": 556487, "epoch": 6704} {"train_loss": -27.871686935424805, "global_step": 556488, "epoch": 6704} {"train_loss": -27.962392807006836, "global_step": 556489, "epoch": 6704} {"train_loss": -27.855207443237305, "global_step": 556490, "epoch": 6704} {"train_loss": -27.679487228393555, "global_step": 556491, "epoch": 6704} {"train_loss": -27.475875854492188, "global_step": 556492, "epoch": 6704} {"train_loss": -27.708398818969727, "global_step": 556493, "epoch": 6704} {"train_loss": -27.908939361572266, "global_step": 556494, "epoch": 6704} {"train_loss": -27.9848575592041, "global_step": 556495, "epoch": 6704} {"train_loss": -27.799793243408203, "global_step": 556496, "epoch": 6704} {"train_loss": -27.784351348876953, "global_step": 556497, "epoch": 6704} {"train_loss": -27.78614616394043, "global_step": 556498, "epoch": 6704} {"train_loss": -28.053787231445312, "global_step": 556499, "epoch": 6704} {"train_loss": -27.7622127532959, "global_step": 556500, "epoch": 6704} {"train_loss": -28.01540184020996, "global_step": 556501, "epoch": 6704} {"train_loss": -27.535614013671875, "global_step": 556502, "epoch": 6704} {"train_loss": -27.85162353515625, "global_step": 556503, "epoch": 6704} {"train_loss": -27.800954818725586, "global_step": 556504, "epoch": 6704} {"train_loss": -28.033533096313477, "global_step": 556505, "epoch": 6704} {"train_loss": -27.9229679107666, "global_step": 556506, "epoch": 6704} {"train_loss": -27.903547286987305, "global_step": 556507, "epoch": 6704} {"train_loss": -27.502674102783203, "global_step": 556508, "epoch": 6704} {"train_loss": -26.399337768554688, "global_step": 556509, "epoch": 6704} {"train_loss": -22.790454864501953, "global_step": 556510, "epoch": 6704} {"train_loss": -18.831666946411133, "global_step": 556511, "epoch": 6704} {"train_loss": -26.385223388671875, "global_step": 556512, "epoch": 6704} {"train_loss": -24.475488662719727, "global_step": 556513, "epoch": 6704} {"train_loss": -27.171838484614728, "global_step": 556514, "epoch": 6704, "val_loss": 6463885.0} {"train_loss": -23.376264572143555, "global_step": 556515, "epoch": 6705} {"train_loss": -25.85120964050293, "global_step": 556516, "epoch": 6705} {"train_loss": -25.407958984375, "global_step": 556517, "epoch": 6705} {"train_loss": -24.08405113220215, "global_step": 556518, "epoch": 6705} {"train_loss": -25.906158447265625, "global_step": 556519, "epoch": 6705} {"train_loss": -25.510496139526367, "global_step": 556520, "epoch": 6705} {"train_loss": -25.35343360900879, "global_step": 556521, "epoch": 6705} {"train_loss": -25.83977699279785, "global_step": 556522, "epoch": 6705} {"train_loss": -26.692834854125977, "global_step": 556523, "epoch": 6705} {"train_loss": -26.28468132019043, "global_step": 556524, "epoch": 6705} {"train_loss": -26.038135528564453, "global_step": 556525, "epoch": 6705} {"train_loss": -26.157306671142578, "global_step": 556526, "epoch": 6705} {"train_loss": -26.40142250061035, "global_step": 556527, "epoch": 6705} {"train_loss": -26.003677368164062, "global_step": 556528, "epoch": 6705} {"train_loss": -26.423383712768555, "global_step": 556529, "epoch": 6705} {"train_loss": -26.499755859375, "global_step": 556530, "epoch": 6705} {"train_loss": -26.304983139038086, "global_step": 556531, "epoch": 6705} {"train_loss": -26.62152671813965, "global_step": 556532, "epoch": 6705} {"train_loss": -26.68283462524414, "global_step": 556533, "epoch": 6705} {"train_loss": -26.60285758972168, "global_step": 556534, "epoch": 6705} {"train_loss": -27.09921646118164, "global_step": 556535, "epoch": 6705} {"train_loss": -26.62287712097168, "global_step": 556536, "epoch": 6705} {"train_loss": -26.56048011779785, "global_step": 556537, "epoch": 6705} {"train_loss": -26.7958927154541, "global_step": 556538, "epoch": 6705} {"train_loss": -27.38466453552246, "global_step": 556539, "epoch": 6705} {"train_loss": -26.96067237854004, "global_step": 556540, "epoch": 6705} {"train_loss": -26.71134376525879, "global_step": 556541, "epoch": 6705} {"train_loss": -27.261581420898438, "global_step": 556542, "epoch": 6705} {"train_loss": -26.771142959594727, "global_step": 556543, "epoch": 6705} {"train_loss": -27.2640323638916, "global_step": 556544, "epoch": 6705} {"train_loss": -27.280668258666992, "global_step": 556545, "epoch": 6705} {"train_loss": -27.454666137695312, "global_step": 556546, "epoch": 6705} {"train_loss": -26.846942901611328, "global_step": 556547, "epoch": 6705} {"train_loss": -26.779281616210938, "global_step": 556548, "epoch": 6705} {"train_loss": -27.860265731811523, "global_step": 556549, "epoch": 6705} {"train_loss": -27.320425033569336, "global_step": 556550, "epoch": 6705} {"train_loss": -27.3064022064209, "global_step": 556551, "epoch": 6705} {"train_loss": -27.36181640625, "global_step": 556552, "epoch": 6705} {"train_loss": -27.80779457092285, "global_step": 556553, "epoch": 6705} {"train_loss": -27.50718116760254, "global_step": 556554, "epoch": 6705} {"train_loss": -27.719022750854492, "global_step": 556555, "epoch": 6705} {"train_loss": -27.72564125061035, "global_step": 556556, "epoch": 6705} {"train_loss": -27.990915298461914, "global_step": 556557, "epoch": 6705} {"train_loss": -27.5418701171875, "global_step": 556558, "epoch": 6705} {"train_loss": -27.169097900390625, "global_step": 556559, "epoch": 6705} {"train_loss": -27.284011840820312, "global_step": 556560, "epoch": 6705} {"train_loss": -27.313520431518555, "global_step": 556561, "epoch": 6705} {"train_loss": -27.71039390563965, "global_step": 556562, "epoch": 6705} {"train_loss": -27.29326820373535, "global_step": 556563, "epoch": 6705} {"train_loss": -27.87994956970215, "global_step": 556564, "epoch": 6705} {"train_loss": -27.645492553710938, "global_step": 556565, "epoch": 6705} {"train_loss": -27.677865982055664, "global_step": 556566, "epoch": 6705} {"train_loss": -27.32801628112793, "global_step": 556567, "epoch": 6705} {"train_loss": -27.76645278930664, "global_step": 556568, "epoch": 6705} {"train_loss": -27.293603897094727, "global_step": 556569, "epoch": 6705} {"train_loss": -27.600210189819336, "global_step": 556570, "epoch": 6705} {"train_loss": -27.298248291015625, "global_step": 556571, "epoch": 6705} {"train_loss": -27.2950439453125, "global_step": 556572, "epoch": 6705} {"train_loss": -28.002197265625, "global_step": 556573, "epoch": 6705} {"train_loss": -27.774560928344727, "global_step": 556574, "epoch": 6705} {"train_loss": -27.565954208374023, "global_step": 556575, "epoch": 6705} {"train_loss": -27.68568992614746, "global_step": 556576, "epoch": 6705} {"train_loss": -27.55535316467285, "global_step": 556577, "epoch": 6705} {"train_loss": -27.691669464111328, "global_step": 556578, "epoch": 6705} {"train_loss": -27.37818717956543, "global_step": 556579, "epoch": 6705} {"train_loss": -27.821496963500977, "global_step": 556580, "epoch": 6705} {"train_loss": -27.731931686401367, "global_step": 556581, "epoch": 6705} {"train_loss": -27.292882919311523, "global_step": 556582, "epoch": 6705} {"train_loss": -27.703771591186523, "global_step": 556583, "epoch": 6705} {"train_loss": -27.77204704284668, "global_step": 556584, "epoch": 6705} {"train_loss": -27.583057403564453, "global_step": 556585, "epoch": 6705} {"train_loss": -27.362852096557617, "global_step": 556586, "epoch": 6705} {"train_loss": -27.620325088500977, "global_step": 556587, "epoch": 6705} {"train_loss": -28.04615592956543, "global_step": 556588, "epoch": 6705} {"train_loss": -27.804296493530273, "global_step": 556589, "epoch": 6705} {"train_loss": -27.87788200378418, "global_step": 556590, "epoch": 6705} {"train_loss": -27.830652236938477, "global_step": 556591, "epoch": 6705} {"train_loss": -27.8730411529541, "global_step": 556592, "epoch": 6705} {"train_loss": -27.129003524780273, "global_step": 556593, "epoch": 6705} {"train_loss": -28.065387725830078, "global_step": 556594, "epoch": 6705} {"train_loss": -27.980131149291992, "global_step": 556595, "epoch": 6705} {"train_loss": -27.97315788269043, "global_step": 556596, "epoch": 6705} {"train_loss": -27.092404951532203, "global_step": 556597, "epoch": 6705, "val_loss": 6395787.5} {"train_loss": -27.044052124023438, "global_step": 556598, "epoch": 6706} {"train_loss": -27.1101016998291, "global_step": 556599, "epoch": 6706} {"train_loss": -26.6660213470459, "global_step": 556600, "epoch": 6706} {"train_loss": -25.161762237548828, "global_step": 556601, "epoch": 6706} {"train_loss": -26.431121826171875, "global_step": 556602, "epoch": 6706} {"train_loss": -26.28977394104004, "global_step": 556603, "epoch": 6706} {"train_loss": -26.472455978393555, "global_step": 556604, "epoch": 6706} {"train_loss": -26.85149574279785, "global_step": 556605, "epoch": 6706} {"train_loss": -27.095870971679688, "global_step": 556606, "epoch": 6706} {"train_loss": -26.598352432250977, "global_step": 556607, "epoch": 6706} {"train_loss": -27.321561813354492, "global_step": 556608, "epoch": 6706} {"train_loss": -27.020959854125977, "global_step": 556609, "epoch": 6706} {"train_loss": -27.186323165893555, "global_step": 556610, "epoch": 6706} {"train_loss": -26.866987228393555, "global_step": 556611, "epoch": 6706} {"train_loss": -26.899494171142578, "global_step": 556612, "epoch": 6706} {"train_loss": -27.39668083190918, "global_step": 556613, "epoch": 6706} {"train_loss": -27.303022384643555, "global_step": 556614, "epoch": 6706} {"train_loss": -27.039133071899414, "global_step": 556615, "epoch": 6706} {"train_loss": -26.79422378540039, "global_step": 556616, "epoch": 6706} {"train_loss": -27.27359390258789, "global_step": 556617, "epoch": 6706} {"train_loss": -27.039337158203125, "global_step": 556618, "epoch": 6706} {"train_loss": -27.182165145874023, "global_step": 556619, "epoch": 6706} {"train_loss": -27.287622451782227, "global_step": 556620, "epoch": 6706} {"train_loss": -26.946691513061523, "global_step": 556621, "epoch": 6706} {"train_loss": -27.05372428894043, "global_step": 556622, "epoch": 6706} {"train_loss": -27.444625854492188, "global_step": 556623, "epoch": 6706} {"train_loss": -27.312292098999023, "global_step": 556624, "epoch": 6706} {"train_loss": -27.482669830322266, "global_step": 556625, "epoch": 6706} {"train_loss": -27.810047149658203, "global_step": 556626, "epoch": 6706} {"train_loss": -27.80946922302246, "global_step": 556627, "epoch": 6706} {"train_loss": -27.3376407623291, "global_step": 556628, "epoch": 6706} {"train_loss": -27.206256866455078, "global_step": 556629, "epoch": 6706} {"train_loss": -27.719436645507812, "global_step": 556630, "epoch": 6706} {"train_loss": -27.494552612304688, "global_step": 556631, "epoch": 6706} {"train_loss": -27.2841796875, "global_step": 556632, "epoch": 6706} {"train_loss": -27.50615882873535, "global_step": 556633, "epoch": 6706} {"train_loss": -27.74869728088379, "global_step": 556634, "epoch": 6706} {"train_loss": -27.110828399658203, "global_step": 556635, "epoch": 6706} {"train_loss": -27.609878540039062, "global_step": 556636, "epoch": 6706} {"train_loss": -27.660511016845703, "global_step": 556637, "epoch": 6706} {"train_loss": -27.745038986206055, "global_step": 556638, "epoch": 6706} {"train_loss": -27.829364776611328, "global_step": 556639, "epoch": 6706} {"train_loss": -27.71258544921875, "global_step": 556640, "epoch": 6706} {"train_loss": -27.70387077331543, "global_step": 556641, "epoch": 6706} {"train_loss": -27.791168212890625, "global_step": 556642, "epoch": 6706} {"train_loss": -27.832197189331055, "global_step": 556643, "epoch": 6706} {"train_loss": -27.763885498046875, "global_step": 556644, "epoch": 6706} {"train_loss": -27.852619171142578, "global_step": 556645, "epoch": 6706} {"train_loss": -28.298757553100586, "global_step": 556646, "epoch": 6706} {"train_loss": -27.73023796081543, "global_step": 556647, "epoch": 6706} {"train_loss": -27.75165367126465, "global_step": 556648, "epoch": 6706} {"train_loss": -27.9388484954834, "global_step": 556649, "epoch": 6706} {"train_loss": -27.82769775390625, "global_step": 556650, "epoch": 6706} {"train_loss": -27.8286075592041, "global_step": 556651, "epoch": 6706} {"train_loss": -27.697553634643555, "global_step": 556652, "epoch": 6706} {"train_loss": -27.689435958862305, "global_step": 556653, "epoch": 6706} {"train_loss": -28.054075241088867, "global_step": 556654, "epoch": 6706} {"train_loss": -28.1505069732666, "global_step": 556655, "epoch": 6706} {"train_loss": -27.68366813659668, "global_step": 556656, "epoch": 6706} {"train_loss": -27.909835815429688, "global_step": 556657, "epoch": 6706} {"train_loss": -27.74411392211914, "global_step": 556658, "epoch": 6706} {"train_loss": -27.876739501953125, "global_step": 556659, "epoch": 6706} {"train_loss": -28.092859268188477, "global_step": 556660, "epoch": 6706} {"train_loss": -27.782812118530273, "global_step": 556661, "epoch": 6706} {"train_loss": -27.825885772705078, "global_step": 556662, "epoch": 6706} {"train_loss": -27.953893661499023, "global_step": 556663, "epoch": 6706} {"train_loss": -27.573108673095703, "global_step": 556664, "epoch": 6706} {"train_loss": -27.39850425720215, "global_step": 556665, "epoch": 6706} {"train_loss": -28.10721778869629, "global_step": 556666, "epoch": 6706} {"train_loss": -27.83771324157715, "global_step": 556667, "epoch": 6706} {"train_loss": -27.983243942260742, "global_step": 556668, "epoch": 6706} {"train_loss": -27.5321044921875, "global_step": 556669, "epoch": 6706} {"train_loss": -27.77984619140625, "global_step": 556670, "epoch": 6706} {"train_loss": -27.780750274658203, "global_step": 556671, "epoch": 6706} {"train_loss": -27.99762535095215, "global_step": 556672, "epoch": 6706} {"train_loss": -28.126129150390625, "global_step": 556673, "epoch": 6706} {"train_loss": -27.85625648498535, "global_step": 556674, "epoch": 6706} {"train_loss": -27.8879451751709, "global_step": 556675, "epoch": 6706} {"train_loss": -28.25933265686035, "global_step": 556676, "epoch": 6706} {"train_loss": -27.35076904296875, "global_step": 556677, "epoch": 6706} {"train_loss": -27.95856285095215, "global_step": 556678, "epoch": 6706} {"train_loss": -27.622085571289062, "global_step": 556679, "epoch": 6706} {"train_loss": -27.48459473575454, "global_step": 556680, "epoch": 6706, "val_loss": 6558481.0} {"train_loss": -27.794055938720703, "global_step": 556681, "epoch": 6707} {"train_loss": -27.096548080444336, "global_step": 556682, "epoch": 6707} {"train_loss": -27.3631534576416, "global_step": 556683, "epoch": 6707} {"train_loss": -27.004535675048828, "global_step": 556684, "epoch": 6707} {"train_loss": -27.19361686706543, "global_step": 556685, "epoch": 6707} {"train_loss": -27.251148223876953, "global_step": 556686, "epoch": 6707} {"train_loss": -27.584802627563477, "global_step": 556687, "epoch": 6707} {"train_loss": -27.65448570251465, "global_step": 556688, "epoch": 6707} {"train_loss": -27.526580810546875, "global_step": 556689, "epoch": 6707} {"train_loss": -27.396137237548828, "global_step": 556690, "epoch": 6707} {"train_loss": -27.8623046875, "global_step": 556691, "epoch": 6707} {"train_loss": -27.734533309936523, "global_step": 556692, "epoch": 6707} {"train_loss": -27.757551193237305, "global_step": 556693, "epoch": 6707} {"train_loss": -27.7890567779541, "global_step": 556694, "epoch": 6707} {"train_loss": -27.76299476623535, "global_step": 556695, "epoch": 6707} {"train_loss": -27.77723503112793, "global_step": 556696, "epoch": 6707} {"train_loss": -27.693683624267578, "global_step": 556697, "epoch": 6707} {"train_loss": -27.8974552154541, "global_step": 556698, "epoch": 6707} {"train_loss": -27.6052188873291, "global_step": 556699, "epoch": 6707} {"train_loss": -27.445043563842773, "global_step": 556700, "epoch": 6707} {"train_loss": -28.074247360229492, "global_step": 556701, "epoch": 6707} {"train_loss": -27.73177146911621, "global_step": 556702, "epoch": 6707} {"train_loss": -27.744171142578125, "global_step": 556703, "epoch": 6707} {"train_loss": -27.905237197875977, "global_step": 556704, "epoch": 6707} {"train_loss": -27.62286376953125, "global_step": 556705, "epoch": 6707} {"train_loss": -27.84160804748535, "global_step": 556706, "epoch": 6707} {"train_loss": -27.721710205078125, "global_step": 556707, "epoch": 6707} {"train_loss": -28.1917667388916, "global_step": 556708, "epoch": 6707} {"train_loss": -27.483936309814453, "global_step": 556709, "epoch": 6707} {"train_loss": -27.57864761352539, "global_step": 556710, "epoch": 6707} {"train_loss": -28.031736373901367, "global_step": 556711, "epoch": 6707} {"train_loss": -27.741119384765625, "global_step": 556712, "epoch": 6707} {"train_loss": -27.74811363220215, "global_step": 556713, "epoch": 6707} {"train_loss": -27.59317398071289, "global_step": 556714, "epoch": 6707} {"train_loss": -28.0432186126709, "global_step": 556715, "epoch": 6707} {"train_loss": -27.8496036529541, "global_step": 556716, "epoch": 6707} {"train_loss": -27.99232292175293, "global_step": 556717, "epoch": 6707} {"train_loss": -27.641504287719727, "global_step": 556718, "epoch": 6707} {"train_loss": -27.698776245117188, "global_step": 556719, "epoch": 6707} {"train_loss": -27.53737449645996, "global_step": 556720, "epoch": 6707} {"train_loss": -28.0623836517334, "global_step": 556721, "epoch": 6707} {"train_loss": -27.68115234375, "global_step": 556722, "epoch": 6707} {"train_loss": -27.8311710357666, "global_step": 556723, "epoch": 6707} {"train_loss": -28.191370010375977, "global_step": 556724, "epoch": 6707} {"train_loss": -27.887969970703125, "global_step": 556725, "epoch": 6707} {"train_loss": -28.271162033081055, "global_step": 556726, "epoch": 6707} {"train_loss": -27.631200790405273, "global_step": 556727, "epoch": 6707} {"train_loss": -28.2716007232666, "global_step": 556728, "epoch": 6707} {"train_loss": -28.297149658203125, "global_step": 556729, "epoch": 6707} {"train_loss": -27.948139190673828, "global_step": 556730, "epoch": 6707} {"train_loss": -27.951934814453125, "global_step": 556731, "epoch": 6707} {"train_loss": -27.666412353515625, "global_step": 556732, "epoch": 6707} {"train_loss": -28.008222579956055, "global_step": 556733, "epoch": 6707} {"train_loss": -28.229568481445312, "global_step": 556734, "epoch": 6707} {"train_loss": -27.7646541595459, "global_step": 556735, "epoch": 6707} {"train_loss": -28.13062858581543, "global_step": 556736, "epoch": 6707} {"train_loss": -27.974451065063477, "global_step": 556737, "epoch": 6707} {"train_loss": -27.77931022644043, "global_step": 556738, "epoch": 6707} {"train_loss": -27.983245849609375, "global_step": 556739, "epoch": 6707} {"train_loss": -27.87701416015625, "global_step": 556740, "epoch": 6707} {"train_loss": -28.17612648010254, "global_step": 556741, "epoch": 6707} {"train_loss": -27.826292037963867, "global_step": 556742, "epoch": 6707} {"train_loss": -27.95148277282715, "global_step": 556743, "epoch": 6707} {"train_loss": -27.96537208557129, "global_step": 556744, "epoch": 6707} {"train_loss": -27.787572860717773, "global_step": 556745, "epoch": 6707} {"train_loss": -28.247556686401367, "global_step": 556746, "epoch": 6707} {"train_loss": -28.201459884643555, "global_step": 556747, "epoch": 6707} {"train_loss": -28.09095573425293, "global_step": 556748, "epoch": 6707} {"train_loss": -28.022083282470703, "global_step": 556749, "epoch": 6707} {"train_loss": -27.908716201782227, "global_step": 556750, "epoch": 6707} {"train_loss": -27.78498649597168, "global_step": 556751, "epoch": 6707} {"train_loss": -27.904376983642578, "global_step": 556752, "epoch": 6707} {"train_loss": -28.149810791015625, "global_step": 556753, "epoch": 6707} {"train_loss": -27.49188804626465, "global_step": 556754, "epoch": 6707} {"train_loss": -27.347305297851562, "global_step": 556755, "epoch": 6707} {"train_loss": -27.770063400268555, "global_step": 556756, "epoch": 6707} {"train_loss": -27.064544677734375, "global_step": 556757, "epoch": 6707} {"train_loss": -27.3055477142334, "global_step": 556758, "epoch": 6707} {"train_loss": -27.233081817626953, "global_step": 556759, "epoch": 6707} {"train_loss": -27.40069007873535, "global_step": 556760, "epoch": 6707} {"train_loss": -27.48982810974121, "global_step": 556761, "epoch": 6707} {"train_loss": -27.78095054626465, "global_step": 556762, "epoch": 6707} {"train_loss": -27.76630514213838, "global_step": 556763, "epoch": 6707, "val_loss": 6562516.0} {"train_loss": -25.808446884155273, "global_step": 556764, "epoch": 6708} {"train_loss": -26.814855575561523, "global_step": 556765, "epoch": 6708} {"train_loss": -26.823286056518555, "global_step": 556766, "epoch": 6708} {"train_loss": -26.438007354736328, "global_step": 556767, "epoch": 6708} {"train_loss": -26.64834976196289, "global_step": 556768, "epoch": 6708} {"train_loss": -26.191465377807617, "global_step": 556769, "epoch": 6708} {"train_loss": -27.07073974609375, "global_step": 556770, "epoch": 6708} {"train_loss": -26.340295791625977, "global_step": 556771, "epoch": 6708} {"train_loss": -26.914844512939453, "global_step": 556772, "epoch": 6708} {"train_loss": -26.934049606323242, "global_step": 556773, "epoch": 6708} {"train_loss": -27.29425048828125, "global_step": 556774, "epoch": 6708} {"train_loss": -27.044157028198242, "global_step": 556775, "epoch": 6708} {"train_loss": -26.972883224487305, "global_step": 556776, "epoch": 6708} {"train_loss": -27.127796173095703, "global_step": 556777, "epoch": 6708} {"train_loss": -27.27610206604004, "global_step": 556778, "epoch": 6708} {"train_loss": -27.137893676757812, "global_step": 556779, "epoch": 6708} {"train_loss": -27.5864200592041, "global_step": 556780, "epoch": 6708} {"train_loss": -27.26626968383789, "global_step": 556781, "epoch": 6708} {"train_loss": -27.163095474243164, "global_step": 556782, "epoch": 6708} {"train_loss": -27.784534454345703, "global_step": 556783, "epoch": 6708} {"train_loss": -27.1429443359375, "global_step": 556784, "epoch": 6708} {"train_loss": -27.401525497436523, "global_step": 556785, "epoch": 6708} {"train_loss": -27.232440948486328, "global_step": 556786, "epoch": 6708} {"train_loss": -27.548994064331055, "global_step": 556787, "epoch": 6708} {"train_loss": -27.509119033813477, "global_step": 556788, "epoch": 6708} {"train_loss": -27.82990074157715, "global_step": 556789, "epoch": 6708} {"train_loss": -27.71291160583496, "global_step": 556790, "epoch": 6708} {"train_loss": -27.49799919128418, "global_step": 556791, "epoch": 6708} {"train_loss": -28.029626846313477, "global_step": 556792, "epoch": 6708} {"train_loss": -27.5727596282959, "global_step": 556793, "epoch": 6708} {"train_loss": -27.535398483276367, "global_step": 556794, "epoch": 6708} {"train_loss": -27.578500747680664, "global_step": 556795, "epoch": 6708} {"train_loss": -27.78781509399414, "global_step": 556796, "epoch": 6708} {"train_loss": -28.01214027404785, "global_step": 556797, "epoch": 6708} {"train_loss": -27.445356369018555, "global_step": 556798, "epoch": 6708} {"train_loss": -27.70126724243164, "global_step": 556799, "epoch": 6708} {"train_loss": -27.907312393188477, "global_step": 556800, "epoch": 6708} {"train_loss": -27.882863998413086, "global_step": 556801, "epoch": 6708} {"train_loss": -27.972244262695312, "global_step": 556802, "epoch": 6708} {"train_loss": -27.855396270751953, "global_step": 556803, "epoch": 6708} {"train_loss": -27.857385635375977, "global_step": 556804, "epoch": 6708} {"train_loss": -27.91901969909668, "global_step": 556805, "epoch": 6708} {"train_loss": -27.980789184570312, "global_step": 556806, "epoch": 6708} {"train_loss": -27.82496452331543, "global_step": 556807, "epoch": 6708} {"train_loss": -27.6464786529541, "global_step": 556808, "epoch": 6708} {"train_loss": -28.023456573486328, "global_step": 556809, "epoch": 6708} {"train_loss": -27.862567901611328, "global_step": 556810, "epoch": 6708} {"train_loss": -27.921131134033203, "global_step": 556811, "epoch": 6708} {"train_loss": -27.728097915649414, "global_step": 556812, "epoch": 6708} {"train_loss": -27.888715744018555, "global_step": 556813, "epoch": 6708} {"train_loss": -27.5213565826416, "global_step": 556814, "epoch": 6708} {"train_loss": -27.6791934967041, "global_step": 556815, "epoch": 6708} {"train_loss": -28.31717872619629, "global_step": 556816, "epoch": 6708} {"train_loss": -27.68549919128418, "global_step": 556817, "epoch": 6708} {"train_loss": -27.79835319519043, "global_step": 556818, "epoch": 6708} {"train_loss": -27.506940841674805, "global_step": 556819, "epoch": 6708} {"train_loss": -28.055145263671875, "global_step": 556820, "epoch": 6708} {"train_loss": -28.159133911132812, "global_step": 556821, "epoch": 6708} {"train_loss": -27.643590927124023, "global_step": 556822, "epoch": 6708} {"train_loss": -27.7736759185791, "global_step": 556823, "epoch": 6708} {"train_loss": -27.893157958984375, "global_step": 556824, "epoch": 6708} {"train_loss": -27.8466796875, "global_step": 556825, "epoch": 6708} {"train_loss": -27.79534912109375, "global_step": 556826, "epoch": 6708} {"train_loss": -28.2056941986084, "global_step": 556827, "epoch": 6708} {"train_loss": -28.049991607666016, "global_step": 556828, "epoch": 6708} {"train_loss": -27.783594131469727, "global_step": 556829, "epoch": 6708} {"train_loss": -27.875080108642578, "global_step": 556830, "epoch": 6708} {"train_loss": -27.99539566040039, "global_step": 556831, "epoch": 6708} {"train_loss": -28.115863800048828, "global_step": 556832, "epoch": 6708} {"train_loss": -28.179956436157227, "global_step": 556833, "epoch": 6708} {"train_loss": -27.588165283203125, "global_step": 556834, "epoch": 6708} {"train_loss": -28.044301986694336, "global_step": 556835, "epoch": 6708} {"train_loss": -27.498777389526367, "global_step": 556836, "epoch": 6708} {"train_loss": -28.142194747924805, "global_step": 556837, "epoch": 6708} {"train_loss": -28.039411544799805, "global_step": 556838, "epoch": 6708} {"train_loss": -27.75394630432129, "global_step": 556839, "epoch": 6708} {"train_loss": -27.891305923461914, "global_step": 556840, "epoch": 6708} {"train_loss": -27.682266235351562, "global_step": 556841, "epoch": 6708} {"train_loss": -27.817956924438477, "global_step": 556842, "epoch": 6708} {"train_loss": -27.768014907836914, "global_step": 556843, "epoch": 6708} {"train_loss": -27.465784072875977, "global_step": 556844, "epoch": 6708} {"train_loss": -27.93662452697754, "global_step": 556845, "epoch": 6708} {"train_loss": -27.575350864824042, "global_step": 556846, "epoch": 6708, "val_loss": 6540925.5} {"train_loss": -27.308807373046875, "global_step": 556847, "epoch": 6709} {"train_loss": -27.17085838317871, "global_step": 556848, "epoch": 6709} {"train_loss": -26.69593620300293, "global_step": 556849, "epoch": 6709} {"train_loss": -26.43021583557129, "global_step": 556850, "epoch": 6709} {"train_loss": -25.116262435913086, "global_step": 556851, "epoch": 6709} {"train_loss": -24.935413360595703, "global_step": 556852, "epoch": 6709} {"train_loss": -25.4898738861084, "global_step": 556853, "epoch": 6709} {"train_loss": -27.1091365814209, "global_step": 556854, "epoch": 6709} {"train_loss": -26.104156494140625, "global_step": 556855, "epoch": 6709} {"train_loss": -26.1934757232666, "global_step": 556856, "epoch": 6709} {"train_loss": -26.93714714050293, "global_step": 556857, "epoch": 6709} {"train_loss": -26.46607780456543, "global_step": 556858, "epoch": 6709} {"train_loss": -27.076370239257812, "global_step": 556859, "epoch": 6709} {"train_loss": -26.518051147460938, "global_step": 556860, "epoch": 6709} {"train_loss": -27.215866088867188, "global_step": 556861, "epoch": 6709} {"train_loss": -26.655725479125977, "global_step": 556862, "epoch": 6709} {"train_loss": -27.174474716186523, "global_step": 556863, "epoch": 6709} {"train_loss": -26.689756393432617, "global_step": 556864, "epoch": 6709} {"train_loss": -27.336090087890625, "global_step": 556865, "epoch": 6709} {"train_loss": -27.322265625, "global_step": 556866, "epoch": 6709} {"train_loss": -27.06044578552246, "global_step": 556867, "epoch": 6709} {"train_loss": -27.23198890686035, "global_step": 556868, "epoch": 6709} {"train_loss": -27.499664306640625, "global_step": 556869, "epoch": 6709} {"train_loss": -27.314062118530273, "global_step": 556870, "epoch": 6709} {"train_loss": -27.2116641998291, "global_step": 556871, "epoch": 6709} {"train_loss": -27.129934310913086, "global_step": 556872, "epoch": 6709} {"train_loss": -27.192630767822266, "global_step": 556873, "epoch": 6709} {"train_loss": -27.58370018005371, "global_step": 556874, "epoch": 6709} {"train_loss": -27.525379180908203, "global_step": 556875, "epoch": 6709} {"train_loss": -27.16358757019043, "global_step": 556876, "epoch": 6709} {"train_loss": -27.66928482055664, "global_step": 556877, "epoch": 6709} {"train_loss": -27.808942794799805, "global_step": 556878, "epoch": 6709} {"train_loss": -27.551849365234375, "global_step": 556879, "epoch": 6709} {"train_loss": -27.572011947631836, "global_step": 556880, "epoch": 6709} {"train_loss": -27.991485595703125, "global_step": 556881, "epoch": 6709} {"train_loss": -27.37477684020996, "global_step": 556882, "epoch": 6709} {"train_loss": -27.509057998657227, "global_step": 556883, "epoch": 6709} {"train_loss": -27.859800338745117, "global_step": 556884, "epoch": 6709} {"train_loss": -27.964313507080078, "global_step": 556885, "epoch": 6709} {"train_loss": -27.598188400268555, "global_step": 556886, "epoch": 6709} {"train_loss": -27.680700302124023, "global_step": 556887, "epoch": 6709} {"train_loss": -27.864093780517578, "global_step": 556888, "epoch": 6709} {"train_loss": -27.795251846313477, "global_step": 556889, "epoch": 6709} {"train_loss": -27.59242057800293, "global_step": 556890, "epoch": 6709} {"train_loss": -27.760278701782227, "global_step": 556891, "epoch": 6709} {"train_loss": -27.457162857055664, "global_step": 556892, "epoch": 6709} {"train_loss": -27.844425201416016, "global_step": 556893, "epoch": 6709} {"train_loss": -27.7554874420166, "global_step": 556894, "epoch": 6709} {"train_loss": -28.0184383392334, "global_step": 556895, "epoch": 6709} {"train_loss": -27.890411376953125, "global_step": 556896, "epoch": 6709} {"train_loss": -27.75823974609375, "global_step": 556897, "epoch": 6709} {"train_loss": -28.15327262878418, "global_step": 556898, "epoch": 6709} {"train_loss": -27.845739364624023, "global_step": 556899, "epoch": 6709} {"train_loss": -27.90254020690918, "global_step": 556900, "epoch": 6709} {"train_loss": -27.9416446685791, "global_step": 556901, "epoch": 6709} {"train_loss": -27.966413497924805, "global_step": 556902, "epoch": 6709} {"train_loss": -27.819992065429688, "global_step": 556903, "epoch": 6709} {"train_loss": -28.24360466003418, "global_step": 556904, "epoch": 6709} {"train_loss": -28.08108901977539, "global_step": 556905, "epoch": 6709} {"train_loss": -28.091861724853516, "global_step": 556906, "epoch": 6709} {"train_loss": -27.876855850219727, "global_step": 556907, "epoch": 6709} {"train_loss": -28.222219467163086, "global_step": 556908, "epoch": 6709} {"train_loss": -27.951181411743164, "global_step": 556909, "epoch": 6709} {"train_loss": -28.129871368408203, "global_step": 556910, "epoch": 6709} {"train_loss": -27.793787002563477, "global_step": 556911, "epoch": 6709} {"train_loss": -27.666852951049805, "global_step": 556912, "epoch": 6709} {"train_loss": -27.609344482421875, "global_step": 556913, "epoch": 6709} {"train_loss": -28.31196403503418, "global_step": 556914, "epoch": 6709} {"train_loss": -27.470733642578125, "global_step": 556915, "epoch": 6709} {"train_loss": -27.277740478515625, "global_step": 556916, "epoch": 6709} {"train_loss": -27.776952743530273, "global_step": 556917, "epoch": 6709} {"train_loss": -27.654027938842773, "global_step": 556918, "epoch": 6709} {"train_loss": -28.021854400634766, "global_step": 556919, "epoch": 6709} {"train_loss": -27.770313262939453, "global_step": 556920, "epoch": 6709} {"train_loss": -27.728778839111328, "global_step": 556921, "epoch": 6709} {"train_loss": -27.68341064453125, "global_step": 556922, "epoch": 6709} {"train_loss": -27.8941650390625, "global_step": 556923, "epoch": 6709} {"train_loss": -28.02151870727539, "global_step": 556924, "epoch": 6709} {"train_loss": -27.58660888671875, "global_step": 556925, "epoch": 6709} {"train_loss": -27.89813232421875, "global_step": 556926, "epoch": 6709} {"train_loss": -27.90622329711914, "global_step": 556927, "epoch": 6709} {"train_loss": -28.229352951049805, "global_step": 556928, "epoch": 6709} {"train_loss": -27.468027022947748, "global_step": 556929, "epoch": 6709, "val_loss": 6523099.5} {"train_loss": -27.233423233032227, "global_step": 556930, "epoch": 6710} {"train_loss": -27.189146041870117, "global_step": 556931, "epoch": 6710} {"train_loss": -27.1964168548584, "global_step": 556932, "epoch": 6710} {"train_loss": -27.072406768798828, "global_step": 556933, "epoch": 6710} {"train_loss": -27.287397384643555, "global_step": 556934, "epoch": 6710} {"train_loss": -27.3963680267334, "global_step": 556935, "epoch": 6710} {"train_loss": -27.478063583374023, "global_step": 556936, "epoch": 6710} {"train_loss": -27.14845085144043, "global_step": 556937, "epoch": 6710} {"train_loss": -27.590290069580078, "global_step": 556938, "epoch": 6710} {"train_loss": -27.599994659423828, "global_step": 556939, "epoch": 6710} {"train_loss": -27.491302490234375, "global_step": 556940, "epoch": 6710} {"train_loss": -27.62593650817871, "global_step": 556941, "epoch": 6710} {"train_loss": -27.70261001586914, "global_step": 556942, "epoch": 6710} {"train_loss": -27.59307289123535, "global_step": 556943, "epoch": 6710} {"train_loss": -27.335372924804688, "global_step": 556944, "epoch": 6710} {"train_loss": -27.36519432067871, "global_step": 556945, "epoch": 6710} {"train_loss": -27.75836181640625, "global_step": 556946, "epoch": 6710} {"train_loss": -27.850126266479492, "global_step": 556947, "epoch": 6710} {"train_loss": -27.2536563873291, "global_step": 556948, "epoch": 6710} {"train_loss": -27.504919052124023, "global_step": 556949, "epoch": 6710} {"train_loss": -27.55951499938965, "global_step": 556950, "epoch": 6710} {"train_loss": -28.184301376342773, "global_step": 556951, "epoch": 6710} {"train_loss": -27.540851593017578, "global_step": 556952, "epoch": 6710} {"train_loss": -27.9072322845459, "global_step": 556953, "epoch": 6710} {"train_loss": -27.82850456237793, "global_step": 556954, "epoch": 6710} {"train_loss": -27.649871826171875, "global_step": 556955, "epoch": 6710} {"train_loss": -27.508268356323242, "global_step": 556956, "epoch": 6710} {"train_loss": -27.383832931518555, "global_step": 556957, "epoch": 6710} {"train_loss": -27.739593505859375, "global_step": 556958, "epoch": 6710} {"train_loss": -27.990447998046875, "global_step": 556959, "epoch": 6710} {"train_loss": -27.6923770904541, "global_step": 556960, "epoch": 6710} {"train_loss": -27.680252075195312, "global_step": 556961, "epoch": 6710} {"train_loss": -27.630664825439453, "global_step": 556962, "epoch": 6710} {"train_loss": -27.73284339904785, "global_step": 556963, "epoch": 6710} {"train_loss": -27.739721298217773, "global_step": 556964, "epoch": 6710} {"train_loss": -27.659448623657227, "global_step": 556965, "epoch": 6710} {"train_loss": -27.761682510375977, "global_step": 556966, "epoch": 6710} {"train_loss": -27.99274253845215, "global_step": 556967, "epoch": 6710} {"train_loss": -27.88189697265625, "global_step": 556968, "epoch": 6710} {"train_loss": -27.996557235717773, "global_step": 556969, "epoch": 6710} {"train_loss": -28.152740478515625, "global_step": 556970, "epoch": 6710} {"train_loss": -27.877548217773438, "global_step": 556971, "epoch": 6710} {"train_loss": -27.92022132873535, "global_step": 556972, "epoch": 6710} {"train_loss": -28.203678131103516, "global_step": 556973, "epoch": 6710} {"train_loss": -28.059616088867188, "global_step": 556974, "epoch": 6710} {"train_loss": -27.871915817260742, "global_step": 556975, "epoch": 6710} {"train_loss": -28.174238204956055, "global_step": 556976, "epoch": 6710} {"train_loss": -27.887372970581055, "global_step": 556977, "epoch": 6710} {"train_loss": -27.941516876220703, "global_step": 556978, "epoch": 6710} {"train_loss": -27.669116973876953, "global_step": 556979, "epoch": 6710} {"train_loss": -27.6713809967041, "global_step": 556980, "epoch": 6710} {"train_loss": -28.20954704284668, "global_step": 556981, "epoch": 6710} {"train_loss": -28.236913681030273, "global_step": 556982, "epoch": 6710} {"train_loss": -28.261869430541992, "global_step": 556983, "epoch": 6710} {"train_loss": -28.01692008972168, "global_step": 556984, "epoch": 6710} {"train_loss": -28.359943389892578, "global_step": 556985, "epoch": 6710} {"train_loss": -28.2225341796875, "global_step": 556986, "epoch": 6710} {"train_loss": -28.01822280883789, "global_step": 556987, "epoch": 6710} {"train_loss": -27.955963134765625, "global_step": 556988, "epoch": 6710} {"train_loss": -27.86376953125, "global_step": 556989, "epoch": 6710} {"train_loss": -28.032629013061523, "global_step": 556990, "epoch": 6710} {"train_loss": -27.81298828125, "global_step": 556991, "epoch": 6710} {"train_loss": -28.072620391845703, "global_step": 556992, "epoch": 6710} {"train_loss": -27.69717788696289, "global_step": 556993, "epoch": 6710} {"train_loss": -27.250080108642578, "global_step": 556994, "epoch": 6710} {"train_loss": -26.86996841430664, "global_step": 556995, "epoch": 6710} {"train_loss": -26.894577026367188, "global_step": 556996, "epoch": 6710} {"train_loss": -26.931360244750977, "global_step": 556997, "epoch": 6710} {"train_loss": -27.50046157836914, "global_step": 556998, "epoch": 6710} {"train_loss": -27.132476806640625, "global_step": 556999, "epoch": 6710} {"train_loss": -27.147119522094727, "global_step": 557000, "epoch": 6710} {"train_loss": -27.820295333862305, "global_step": 557001, "epoch": 6710} {"train_loss": -27.54081153869629, "global_step": 557002, "epoch": 6710} {"train_loss": -27.767105102539062, "global_step": 557003, "epoch": 6710} {"train_loss": -28.088911056518555, "global_step": 557004, "epoch": 6710} {"train_loss": -27.17804527282715, "global_step": 557005, "epoch": 6710} {"train_loss": -27.818134307861328, "global_step": 557006, "epoch": 6710} {"train_loss": -27.840412139892578, "global_step": 557007, "epoch": 6710} {"train_loss": -27.45330810546875, "global_step": 557008, "epoch": 6710} {"train_loss": -27.96584129333496, "global_step": 557009, "epoch": 6710} {"train_loss": -27.5819091796875, "global_step": 557010, "epoch": 6710} {"train_loss": -27.878162384033203, "global_step": 557011, "epoch": 6710} {"train_loss": -27.689552169248284, "global_step": 557012, "epoch": 6710, "val_loss": 6484337.0} {"train_loss": -27.1073055267334, "global_step": 557013, "epoch": 6711} {"train_loss": -26.483816146850586, "global_step": 557014, "epoch": 6711} {"train_loss": -26.996641159057617, "global_step": 557015, "epoch": 6711} {"train_loss": -26.69693374633789, "global_step": 557016, "epoch": 6711} {"train_loss": -26.717599868774414, "global_step": 557017, "epoch": 6711} {"train_loss": -26.827844619750977, "global_step": 557018, "epoch": 6711} {"train_loss": -26.528757095336914, "global_step": 557019, "epoch": 6711} {"train_loss": -26.56890296936035, "global_step": 557020, "epoch": 6711} {"train_loss": -27.4067440032959, "global_step": 557021, "epoch": 6711} {"train_loss": -27.092992782592773, "global_step": 557022, "epoch": 6711} {"train_loss": -27.1865177154541, "global_step": 557023, "epoch": 6711} {"train_loss": -26.94541358947754, "global_step": 557024, "epoch": 6711} {"train_loss": -27.07399559020996, "global_step": 557025, "epoch": 6711} {"train_loss": -26.832828521728516, "global_step": 557026, "epoch": 6711} {"train_loss": -26.94757080078125, "global_step": 557027, "epoch": 6711} {"train_loss": -27.070775985717773, "global_step": 557028, "epoch": 6711} {"train_loss": -27.585058212280273, "global_step": 557029, "epoch": 6711} {"train_loss": -27.32390785217285, "global_step": 557030, "epoch": 6711} {"train_loss": -27.188495635986328, "global_step": 557031, "epoch": 6711} {"train_loss": -27.335538864135742, "global_step": 557032, "epoch": 6711} {"train_loss": -27.670446395874023, "global_step": 557033, "epoch": 6711} {"train_loss": -27.480072021484375, "global_step": 557034, "epoch": 6711} {"train_loss": -27.68900489807129, "global_step": 557035, "epoch": 6711} {"train_loss": -27.56074333190918, "global_step": 557036, "epoch": 6711} {"train_loss": -27.0190486907959, "global_step": 557037, "epoch": 6711} {"train_loss": -28.016332626342773, "global_step": 557038, "epoch": 6711} {"train_loss": -27.67646598815918, "global_step": 557039, "epoch": 6711} {"train_loss": -27.58595085144043, "global_step": 557040, "epoch": 6711} {"train_loss": -27.516284942626953, "global_step": 557041, "epoch": 6711} {"train_loss": -27.59295654296875, "global_step": 557042, "epoch": 6711} {"train_loss": -27.932205200195312, "global_step": 557043, "epoch": 6711} {"train_loss": -27.242841720581055, "global_step": 557044, "epoch": 6711} {"train_loss": -27.780960083007812, "global_step": 557045, "epoch": 6711} {"train_loss": -27.923715591430664, "global_step": 557046, "epoch": 6711} {"train_loss": -27.9948673248291, "global_step": 557047, "epoch": 6711} {"train_loss": -27.870563507080078, "global_step": 557048, "epoch": 6711} {"train_loss": -27.89820671081543, "global_step": 557049, "epoch": 6711} {"train_loss": -27.85394287109375, "global_step": 557050, "epoch": 6711} {"train_loss": -27.731229782104492, "global_step": 557051, "epoch": 6711} {"train_loss": -28.318174362182617, "global_step": 557052, "epoch": 6711} {"train_loss": -27.901269912719727, "global_step": 557053, "epoch": 6711} {"train_loss": -27.862060546875, "global_step": 557054, "epoch": 6711} {"train_loss": -27.655492782592773, "global_step": 557055, "epoch": 6711} {"train_loss": -27.817489624023438, "global_step": 557056, "epoch": 6711} {"train_loss": -27.67341423034668, "global_step": 557057, "epoch": 6711} {"train_loss": -28.3398380279541, "global_step": 557058, "epoch": 6711} {"train_loss": -28.036514282226562, "global_step": 557059, "epoch": 6711} {"train_loss": -27.862213134765625, "global_step": 557060, "epoch": 6711} {"train_loss": -27.80097770690918, "global_step": 557061, "epoch": 6711} {"train_loss": -28.07562255859375, "global_step": 557062, "epoch": 6711} {"train_loss": -28.31378173828125, "global_step": 557063, "epoch": 6711} {"train_loss": -28.1518611907959, "global_step": 557064, "epoch": 6711} {"train_loss": -27.78508949279785, "global_step": 557065, "epoch": 6711} {"train_loss": -27.876798629760742, "global_step": 557066, "epoch": 6711} {"train_loss": -28.10721778869629, "global_step": 557067, "epoch": 6711} {"train_loss": -27.974140167236328, "global_step": 557068, "epoch": 6711} {"train_loss": -27.994861602783203, "global_step": 557069, "epoch": 6711} {"train_loss": -28.066608428955078, "global_step": 557070, "epoch": 6711} {"train_loss": -27.15572166442871, "global_step": 557071, "epoch": 6711} {"train_loss": -27.588953018188477, "global_step": 557072, "epoch": 6711} {"train_loss": -27.621402740478516, "global_step": 557073, "epoch": 6711} {"train_loss": -27.889448165893555, "global_step": 557074, "epoch": 6711} {"train_loss": -27.72199821472168, "global_step": 557075, "epoch": 6711} {"train_loss": -27.203643798828125, "global_step": 557076, "epoch": 6711} {"train_loss": -27.569690704345703, "global_step": 557077, "epoch": 6711} {"train_loss": -28.27984046936035, "global_step": 557078, "epoch": 6711} {"train_loss": -27.880512237548828, "global_step": 557079, "epoch": 6711} {"train_loss": -27.897680282592773, "global_step": 557080, "epoch": 6711} {"train_loss": -27.858905792236328, "global_step": 557081, "epoch": 6711} {"train_loss": -27.731353759765625, "global_step": 557082, "epoch": 6711} {"train_loss": -27.65082359313965, "global_step": 557083, "epoch": 6711} {"train_loss": -27.546483993530273, "global_step": 557084, "epoch": 6711} {"train_loss": -27.74725341796875, "global_step": 557085, "epoch": 6711} {"train_loss": -27.44440269470215, "global_step": 557086, "epoch": 6711} {"train_loss": -27.66523551940918, "global_step": 557087, "epoch": 6711} {"train_loss": -27.9664249420166, "global_step": 557088, "epoch": 6711} {"train_loss": -27.9571590423584, "global_step": 557089, "epoch": 6711} {"train_loss": -27.688201904296875, "global_step": 557090, "epoch": 6711} {"train_loss": -27.454242706298828, "global_step": 557091, "epoch": 6711} {"train_loss": -27.7775936126709, "global_step": 557092, "epoch": 6711} {"train_loss": -27.681045532226562, "global_step": 557093, "epoch": 6711} {"train_loss": -27.612476348876953, "global_step": 557094, "epoch": 6711} {"train_loss": -27.59297120427511, "global_step": 557095, "epoch": 6711, "val_loss": 6429610.5} {"train_loss": -26.69428062438965, "global_step": 557096, "epoch": 6712} {"train_loss": -26.979238510131836, "global_step": 557097, "epoch": 6712} {"train_loss": -26.772001266479492, "global_step": 557098, "epoch": 6712} {"train_loss": -26.999357223510742, "global_step": 557099, "epoch": 6712} {"train_loss": -27.382892608642578, "global_step": 557100, "epoch": 6712} {"train_loss": -26.781904220581055, "global_step": 557101, "epoch": 6712} {"train_loss": -27.008102416992188, "global_step": 557102, "epoch": 6712} {"train_loss": -27.240644454956055, "global_step": 557103, "epoch": 6712} {"train_loss": -26.858417510986328, "global_step": 557104, "epoch": 6712} {"train_loss": -27.371295928955078, "global_step": 557105, "epoch": 6712} {"train_loss": -27.452239990234375, "global_step": 557106, "epoch": 6712} {"train_loss": -27.12078857421875, "global_step": 557107, "epoch": 6712} {"train_loss": -27.477209091186523, "global_step": 557108, "epoch": 6712} {"train_loss": -27.270191192626953, "global_step": 557109, "epoch": 6712} {"train_loss": -27.45667839050293, "global_step": 557110, "epoch": 6712} {"train_loss": -27.7950439453125, "global_step": 557111, "epoch": 6712} {"train_loss": -27.14582633972168, "global_step": 557112, "epoch": 6712} {"train_loss": -27.217741012573242, "global_step": 557113, "epoch": 6712} {"train_loss": -27.6186580657959, "global_step": 557114, "epoch": 6712} {"train_loss": -27.477685928344727, "global_step": 557115, "epoch": 6712} {"train_loss": -27.437469482421875, "global_step": 557116, "epoch": 6712} {"train_loss": -27.691547393798828, "global_step": 557117, "epoch": 6712} {"train_loss": -27.413639068603516, "global_step": 557118, "epoch": 6712} {"train_loss": -27.75017738342285, "global_step": 557119, "epoch": 6712} {"train_loss": -27.67922019958496, "global_step": 557120, "epoch": 6712} {"train_loss": -27.389734268188477, "global_step": 557121, "epoch": 6712} {"train_loss": -27.558032989501953, "global_step": 557122, "epoch": 6712} {"train_loss": -27.57708740234375, "global_step": 557123, "epoch": 6712} {"train_loss": -27.485321044921875, "global_step": 557124, "epoch": 6712} {"train_loss": -27.492202758789062, "global_step": 557125, "epoch": 6712} {"train_loss": -27.594999313354492, "global_step": 557126, "epoch": 6712} {"train_loss": -27.422748565673828, "global_step": 557127, "epoch": 6712} {"train_loss": -27.386518478393555, "global_step": 557128, "epoch": 6712} {"train_loss": -27.613513946533203, "global_step": 557129, "epoch": 6712} {"train_loss": -27.8111515045166, "global_step": 557130, "epoch": 6712} {"train_loss": -28.180273056030273, "global_step": 557131, "epoch": 6712} {"train_loss": -27.462369918823242, "global_step": 557132, "epoch": 6712} {"train_loss": -28.002029418945312, "global_step": 557133, "epoch": 6712} {"train_loss": -27.792816162109375, "global_step": 557134, "epoch": 6712} {"train_loss": -27.821680068969727, "global_step": 557135, "epoch": 6712} {"train_loss": -27.619007110595703, "global_step": 557136, "epoch": 6712} {"train_loss": -27.838333129882812, "global_step": 557137, "epoch": 6712} {"train_loss": -28.026926040649414, "global_step": 557138, "epoch": 6712} {"train_loss": -27.91438865661621, "global_step": 557139, "epoch": 6712} {"train_loss": -28.24946403503418, "global_step": 557140, "epoch": 6712} {"train_loss": -27.642749786376953, "global_step": 557141, "epoch": 6712} {"train_loss": -28.011320114135742, "global_step": 557142, "epoch": 6712} {"train_loss": -27.979206085205078, "global_step": 557143, "epoch": 6712} {"train_loss": -27.860071182250977, "global_step": 557144, "epoch": 6712} {"train_loss": -27.6932430267334, "global_step": 557145, "epoch": 6712} {"train_loss": -27.78867530822754, "global_step": 557146, "epoch": 6712} {"train_loss": -27.85296630859375, "global_step": 557147, "epoch": 6712} {"train_loss": -28.340307235717773, "global_step": 557148, "epoch": 6712} {"train_loss": -27.664825439453125, "global_step": 557149, "epoch": 6712} {"train_loss": -27.98777198791504, "global_step": 557150, "epoch": 6712} {"train_loss": -28.257654190063477, "global_step": 557151, "epoch": 6712} {"train_loss": -27.74085807800293, "global_step": 557152, "epoch": 6712} {"train_loss": -28.040515899658203, "global_step": 557153, "epoch": 6712} {"train_loss": -27.606414794921875, "global_step": 557154, "epoch": 6712} {"train_loss": -27.5482120513916, "global_step": 557155, "epoch": 6712} {"train_loss": -27.893857955932617, "global_step": 557156, "epoch": 6712} {"train_loss": -27.36182975769043, "global_step": 557157, "epoch": 6712} {"train_loss": -28.12934684753418, "global_step": 557158, "epoch": 6712} {"train_loss": -27.794330596923828, "global_step": 557159, "epoch": 6712} {"train_loss": -27.814685821533203, "global_step": 557160, "epoch": 6712} {"train_loss": -27.8349666595459, "global_step": 557161, "epoch": 6712} {"train_loss": -27.334314346313477, "global_step": 557162, "epoch": 6712} {"train_loss": -27.51979637145996, "global_step": 557163, "epoch": 6712} {"train_loss": -27.788171768188477, "global_step": 557164, "epoch": 6712} {"train_loss": -27.978479385375977, "global_step": 557165, "epoch": 6712} {"train_loss": -27.484228134155273, "global_step": 557166, "epoch": 6712} {"train_loss": -27.835798263549805, "global_step": 557167, "epoch": 6712} {"train_loss": -27.659208297729492, "global_step": 557168, "epoch": 6712} {"train_loss": -27.602466583251953, "global_step": 557169, "epoch": 6712} {"train_loss": -27.654340744018555, "global_step": 557170, "epoch": 6712} {"train_loss": -27.95713233947754, "global_step": 557171, "epoch": 6712} {"train_loss": -27.576406478881836, "global_step": 557172, "epoch": 6712} {"train_loss": -27.590986251831055, "global_step": 557173, "epoch": 6712} {"train_loss": -27.745132446289062, "global_step": 557174, "epoch": 6712} {"train_loss": -27.591684341430664, "global_step": 557175, "epoch": 6712} {"train_loss": -27.67221450805664, "global_step": 557176, "epoch": 6712} {"train_loss": -27.817672729492188, "global_step": 557177, "epoch": 6712} {"train_loss": -27.60708569905844, "global_step": 557178, "epoch": 6712, "val_loss": 6499437.0} {"train_loss": -26.729084014892578, "global_step": 557179, "epoch": 6713} {"train_loss": -25.99033546447754, "global_step": 557180, "epoch": 6713} {"train_loss": -26.70505142211914, "global_step": 557181, "epoch": 6713} {"train_loss": -26.713092803955078, "global_step": 557182, "epoch": 6713} {"train_loss": -26.3795223236084, "global_step": 557183, "epoch": 6713} {"train_loss": -26.273603439331055, "global_step": 557184, "epoch": 6713} {"train_loss": -27.069433212280273, "global_step": 557185, "epoch": 6713} {"train_loss": -26.75172233581543, "global_step": 557186, "epoch": 6713} {"train_loss": -26.749439239501953, "global_step": 557187, "epoch": 6713} {"train_loss": -26.723669052124023, "global_step": 557188, "epoch": 6713} {"train_loss": -27.0660343170166, "global_step": 557189, "epoch": 6713} {"train_loss": -27.00214195251465, "global_step": 557190, "epoch": 6713} {"train_loss": -26.8358154296875, "global_step": 557191, "epoch": 6713} {"train_loss": -27.191360473632812, "global_step": 557192, "epoch": 6713} {"train_loss": -26.953327178955078, "global_step": 557193, "epoch": 6713} {"train_loss": -27.220190048217773, "global_step": 557194, "epoch": 6713} {"train_loss": -26.82512855529785, "global_step": 557195, "epoch": 6713} {"train_loss": -27.300342559814453, "global_step": 557196, "epoch": 6713} {"train_loss": -27.493244171142578, "global_step": 557197, "epoch": 6713} {"train_loss": -27.530811309814453, "global_step": 557198, "epoch": 6713} {"train_loss": -27.270536422729492, "global_step": 557199, "epoch": 6713} {"train_loss": -27.26584243774414, "global_step": 557200, "epoch": 6713} {"train_loss": -27.4626407623291, "global_step": 557201, "epoch": 6713} {"train_loss": -27.32258415222168, "global_step": 557202, "epoch": 6713} {"train_loss": -27.654254913330078, "global_step": 557203, "epoch": 6713} {"train_loss": -27.32294273376465, "global_step": 557204, "epoch": 6713} {"train_loss": -27.497604370117188, "global_step": 557205, "epoch": 6713} {"train_loss": -27.11777114868164, "global_step": 557206, "epoch": 6713} {"train_loss": -27.743284225463867, "global_step": 557207, "epoch": 6713} {"train_loss": -27.471704483032227, "global_step": 557208, "epoch": 6713} {"train_loss": -27.426315307617188, "global_step": 557209, "epoch": 6713} {"train_loss": -27.74068260192871, "global_step": 557210, "epoch": 6713} {"train_loss": -27.38875389099121, "global_step": 557211, "epoch": 6713} {"train_loss": -27.6307430267334, "global_step": 557212, "epoch": 6713} {"train_loss": -27.4620361328125, "global_step": 557213, "epoch": 6713} {"train_loss": -27.943561553955078, "global_step": 557214, "epoch": 6713} {"train_loss": -27.393476486206055, "global_step": 557215, "epoch": 6713} {"train_loss": -27.967670440673828, "global_step": 557216, "epoch": 6713} {"train_loss": -27.82624626159668, "global_step": 557217, "epoch": 6713} {"train_loss": -27.61097526550293, "global_step": 557218, "epoch": 6713} {"train_loss": -27.79107666015625, "global_step": 557219, "epoch": 6713} {"train_loss": -27.24676513671875, "global_step": 557220, "epoch": 6713} {"train_loss": -27.683378219604492, "global_step": 557221, "epoch": 6713} {"train_loss": -27.839841842651367, "global_step": 557222, "epoch": 6713} {"train_loss": -27.42789649963379, "global_step": 557223, "epoch": 6713} {"train_loss": -27.91729736328125, "global_step": 557224, "epoch": 6713} {"train_loss": -27.849287033081055, "global_step": 557225, "epoch": 6713} {"train_loss": -27.604938507080078, "global_step": 557226, "epoch": 6713} {"train_loss": -28.024906158447266, "global_step": 557227, "epoch": 6713} {"train_loss": -27.720489501953125, "global_step": 557228, "epoch": 6713} {"train_loss": -27.594640731811523, "global_step": 557229, "epoch": 6713} {"train_loss": -27.54978370666504, "global_step": 557230, "epoch": 6713} {"train_loss": -28.07960319519043, "global_step": 557231, "epoch": 6713} {"train_loss": -27.73128318786621, "global_step": 557232, "epoch": 6713} {"train_loss": -27.678964614868164, "global_step": 557233, "epoch": 6713} {"train_loss": -27.885547637939453, "global_step": 557234, "epoch": 6713} {"train_loss": -27.88838005065918, "global_step": 557235, "epoch": 6713} {"train_loss": -28.226011276245117, "global_step": 557236, "epoch": 6713} {"train_loss": -28.12518882751465, "global_step": 557237, "epoch": 6713} {"train_loss": -27.70527458190918, "global_step": 557238, "epoch": 6713} {"train_loss": -27.63417625427246, "global_step": 557239, "epoch": 6713} {"train_loss": -27.948028564453125, "global_step": 557240, "epoch": 6713} {"train_loss": -28.0947322845459, "global_step": 557241, "epoch": 6713} {"train_loss": -27.81180191040039, "global_step": 557242, "epoch": 6713} {"train_loss": -27.564105987548828, "global_step": 557243, "epoch": 6713} {"train_loss": -27.96135902404785, "global_step": 557244, "epoch": 6713} {"train_loss": -27.50897216796875, "global_step": 557245, "epoch": 6713} {"train_loss": -27.89982032775879, "global_step": 557246, "epoch": 6713} {"train_loss": -27.6304988861084, "global_step": 557247, "epoch": 6713} {"train_loss": -27.972814559936523, "global_step": 557248, "epoch": 6713} {"train_loss": -27.725250244140625, "global_step": 557249, "epoch": 6713} {"train_loss": -27.712045669555664, "global_step": 557250, "epoch": 6713} {"train_loss": -27.769458770751953, "global_step": 557251, "epoch": 6713} {"train_loss": -27.465774536132812, "global_step": 557252, "epoch": 6713} {"train_loss": -27.577199935913086, "global_step": 557253, "epoch": 6713} {"train_loss": -27.731891632080078, "global_step": 557254, "epoch": 6713} {"train_loss": -27.681493759155273, "global_step": 557255, "epoch": 6713} {"train_loss": -27.913084030151367, "global_step": 557256, "epoch": 6713} {"train_loss": -27.8426570892334, "global_step": 557257, "epoch": 6713} {"train_loss": -27.786252975463867, "global_step": 557258, "epoch": 6713} {"train_loss": -27.7645206451416, "global_step": 557259, "epoch": 6713} {"train_loss": -27.9350528717041, "global_step": 557260, "epoch": 6713} {"train_loss": -27.48949724220368, "global_step": 557261, "epoch": 6713, "val_loss": 6583695.0} {"train_loss": -26.991470336914062, "global_step": 557262, "epoch": 6714} {"train_loss": -26.774946212768555, "global_step": 557263, "epoch": 6714} {"train_loss": -26.692590713500977, "global_step": 557264, "epoch": 6714} {"train_loss": -26.9936466217041, "global_step": 557265, "epoch": 6714} {"train_loss": -26.96803855895996, "global_step": 557266, "epoch": 6714} {"train_loss": -26.5029239654541, "global_step": 557267, "epoch": 6714} {"train_loss": -27.322851181030273, "global_step": 557268, "epoch": 6714} {"train_loss": -27.154987335205078, "global_step": 557269, "epoch": 6714} {"train_loss": -27.3211669921875, "global_step": 557270, "epoch": 6714} {"train_loss": -27.440185546875, "global_step": 557271, "epoch": 6714} {"train_loss": -27.036426544189453, "global_step": 557272, "epoch": 6714} {"train_loss": -27.677265167236328, "global_step": 557273, "epoch": 6714} {"train_loss": -27.10104751586914, "global_step": 557274, "epoch": 6714} {"train_loss": -27.479480743408203, "global_step": 557275, "epoch": 6714} {"train_loss": -27.208646774291992, "global_step": 557276, "epoch": 6714} {"train_loss": -27.050100326538086, "global_step": 557277, "epoch": 6714} {"train_loss": -27.433151245117188, "global_step": 557278, "epoch": 6714} {"train_loss": -27.549097061157227, "global_step": 557279, "epoch": 6714} {"train_loss": -27.5538272857666, "global_step": 557280, "epoch": 6714} {"train_loss": -27.572179794311523, "global_step": 557281, "epoch": 6714} {"train_loss": -27.076129913330078, "global_step": 557282, "epoch": 6714} {"train_loss": -27.058490753173828, "global_step": 557283, "epoch": 6714} {"train_loss": -27.852323532104492, "global_step": 557284, "epoch": 6714} {"train_loss": -27.759428024291992, "global_step": 557285, "epoch": 6714} {"train_loss": -27.515039443969727, "global_step": 557286, "epoch": 6714} {"train_loss": -27.93896484375, "global_step": 557287, "epoch": 6714} {"train_loss": -27.905536651611328, "global_step": 557288, "epoch": 6714} {"train_loss": -27.735870361328125, "global_step": 557289, "epoch": 6714} {"train_loss": -27.585540771484375, "global_step": 557290, "epoch": 6714} {"train_loss": -27.577966690063477, "global_step": 557291, "epoch": 6714} {"train_loss": -27.696807861328125, "global_step": 557292, "epoch": 6714} {"train_loss": -27.914865493774414, "global_step": 557293, "epoch": 6714} {"train_loss": -28.004169464111328, "global_step": 557294, "epoch": 6714} {"train_loss": -27.726776123046875, "global_step": 557295, "epoch": 6714} {"train_loss": -27.83123779296875, "global_step": 557296, "epoch": 6714} {"train_loss": -27.63407325744629, "global_step": 557297, "epoch": 6714} {"train_loss": -27.683979034423828, "global_step": 557298, "epoch": 6714} {"train_loss": -27.953699111938477, "global_step": 557299, "epoch": 6714} {"train_loss": -27.85536003112793, "global_step": 557300, "epoch": 6714} {"train_loss": -27.721988677978516, "global_step": 557301, "epoch": 6714} {"train_loss": -28.13093376159668, "global_step": 557302, "epoch": 6714} {"train_loss": -27.7663631439209, "global_step": 557303, "epoch": 6714} {"train_loss": -27.8309383392334, "global_step": 557304, "epoch": 6714} {"train_loss": -27.582345962524414, "global_step": 557305, "epoch": 6714} {"train_loss": -27.804182052612305, "global_step": 557306, "epoch": 6714} {"train_loss": -28.101627349853516, "global_step": 557307, "epoch": 6714} {"train_loss": -27.815282821655273, "global_step": 557308, "epoch": 6714} {"train_loss": -28.313617706298828, "global_step": 557309, "epoch": 6714} {"train_loss": -27.789575576782227, "global_step": 557310, "epoch": 6714} {"train_loss": -27.702911376953125, "global_step": 557311, "epoch": 6714} {"train_loss": -28.090436935424805, "global_step": 557312, "epoch": 6714} {"train_loss": -27.91824722290039, "global_step": 557313, "epoch": 6714} {"train_loss": -27.841419219970703, "global_step": 557314, "epoch": 6714} {"train_loss": -27.639341354370117, "global_step": 557315, "epoch": 6714} {"train_loss": -28.143823623657227, "global_step": 557316, "epoch": 6714} {"train_loss": -27.726566314697266, "global_step": 557317, "epoch": 6714} {"train_loss": -27.816364288330078, "global_step": 557318, "epoch": 6714} {"train_loss": -27.719955444335938, "global_step": 557319, "epoch": 6714} {"train_loss": -27.497772216796875, "global_step": 557320, "epoch": 6714} {"train_loss": -27.8714656829834, "global_step": 557321, "epoch": 6714} {"train_loss": -28.04664421081543, "global_step": 557322, "epoch": 6714} {"train_loss": -27.77316665649414, "global_step": 557323, "epoch": 6714} {"train_loss": -28.03082847595215, "global_step": 557324, "epoch": 6714} {"train_loss": -27.805164337158203, "global_step": 557325, "epoch": 6714} {"train_loss": -27.130435943603516, "global_step": 557326, "epoch": 6714} {"train_loss": -27.884729385375977, "global_step": 557327, "epoch": 6714} {"train_loss": -27.89592933654785, "global_step": 557328, "epoch": 6714} {"train_loss": -27.099878311157227, "global_step": 557329, "epoch": 6714} {"train_loss": -27.493093490600586, "global_step": 557330, "epoch": 6714} {"train_loss": -27.5242977142334, "global_step": 557331, "epoch": 6714} {"train_loss": -27.41033363342285, "global_step": 557332, "epoch": 6714} {"train_loss": -27.631555557250977, "global_step": 557333, "epoch": 6714} {"train_loss": -27.10340690612793, "global_step": 557334, "epoch": 6714} {"train_loss": -26.326391220092773, "global_step": 557335, "epoch": 6714} {"train_loss": -25.69051170349121, "global_step": 557336, "epoch": 6714} {"train_loss": -25.8016414642334, "global_step": 557337, "epoch": 6714} {"train_loss": -27.29461669921875, "global_step": 557338, "epoch": 6714} {"train_loss": -27.092334747314453, "global_step": 557339, "epoch": 6714} {"train_loss": -26.372900009155273, "global_step": 557340, "epoch": 6714} {"train_loss": -26.67593765258789, "global_step": 557341, "epoch": 6714} {"train_loss": -27.061166763305664, "global_step": 557342, "epoch": 6714} {"train_loss": -26.765827178955078, "global_step": 557343, "epoch": 6714} {"train_loss": -27.47180835310235, "global_step": 557344, "epoch": 6714, "val_loss": 6507074.0} {"train_loss": -26.383955001831055, "global_step": 557345, "epoch": 6715} {"train_loss": -27.055707931518555, "global_step": 557346, "epoch": 6715} {"train_loss": -26.413400650024414, "global_step": 557347, "epoch": 6715} {"train_loss": -26.55694580078125, "global_step": 557348, "epoch": 6715} {"train_loss": -26.99835205078125, "global_step": 557349, "epoch": 6715} {"train_loss": -27.1047306060791, "global_step": 557350, "epoch": 6715} {"train_loss": -26.94952392578125, "global_step": 557351, "epoch": 6715} {"train_loss": -26.783384323120117, "global_step": 557352, "epoch": 6715} {"train_loss": -27.02766227722168, "global_step": 557353, "epoch": 6715} {"train_loss": -27.2302188873291, "global_step": 557354, "epoch": 6715} {"train_loss": -27.338071823120117, "global_step": 557355, "epoch": 6715} {"train_loss": -27.31430435180664, "global_step": 557356, "epoch": 6715} {"train_loss": -27.015851974487305, "global_step": 557357, "epoch": 6715} {"train_loss": -27.57513999938965, "global_step": 557358, "epoch": 6715} {"train_loss": -27.354642868041992, "global_step": 557359, "epoch": 6715} {"train_loss": -27.258020401000977, "global_step": 557360, "epoch": 6715} {"train_loss": -27.53564453125, "global_step": 557361, "epoch": 6715} {"train_loss": -27.154712677001953, "global_step": 557362, "epoch": 6715} {"train_loss": -27.709461212158203, "global_step": 557363, "epoch": 6715} {"train_loss": -27.509424209594727, "global_step": 557364, "epoch": 6715} {"train_loss": -27.649152755737305, "global_step": 557365, "epoch": 6715} {"train_loss": -27.941457748413086, "global_step": 557366, "epoch": 6715} {"train_loss": -27.511920928955078, "global_step": 557367, "epoch": 6715} {"train_loss": -27.466474533081055, "global_step": 557368, "epoch": 6715} {"train_loss": -27.3512020111084, "global_step": 557369, "epoch": 6715} {"train_loss": -27.59291648864746, "global_step": 557370, "epoch": 6715} {"train_loss": -27.766250610351562, "global_step": 557371, "epoch": 6715} {"train_loss": -27.50624656677246, "global_step": 557372, "epoch": 6715} {"train_loss": -27.68704605102539, "global_step": 557373, "epoch": 6715} {"train_loss": -27.728076934814453, "global_step": 557374, "epoch": 6715} {"train_loss": -27.461139678955078, "global_step": 557375, "epoch": 6715} {"train_loss": -27.805988311767578, "global_step": 557376, "epoch": 6715} {"train_loss": -27.586572647094727, "global_step": 557377, "epoch": 6715} {"train_loss": -27.55866050720215, "global_step": 557378, "epoch": 6715} {"train_loss": -28.10391616821289, "global_step": 557379, "epoch": 6715} {"train_loss": -28.118072509765625, "global_step": 557380, "epoch": 6715} {"train_loss": -27.732452392578125, "global_step": 557381, "epoch": 6715} {"train_loss": -28.103986740112305, "global_step": 557382, "epoch": 6715} {"train_loss": -28.140045166015625, "global_step": 557383, "epoch": 6715} {"train_loss": -27.795419692993164, "global_step": 557384, "epoch": 6715} {"train_loss": -28.043292999267578, "global_step": 557385, "epoch": 6715} {"train_loss": -27.648727416992188, "global_step": 557386, "epoch": 6715} {"train_loss": -27.517263412475586, "global_step": 557387, "epoch": 6715} {"train_loss": -27.747838973999023, "global_step": 557388, "epoch": 6715} {"train_loss": -27.806232452392578, "global_step": 557389, "epoch": 6715} {"train_loss": -28.096271514892578, "global_step": 557390, "epoch": 6715} {"train_loss": -27.966291427612305, "global_step": 557391, "epoch": 6715} {"train_loss": -27.79390525817871, "global_step": 557392, "epoch": 6715} {"train_loss": -27.740758895874023, "global_step": 557393, "epoch": 6715} {"train_loss": -27.744977951049805, "global_step": 557394, "epoch": 6715} {"train_loss": -27.70991325378418, "global_step": 557395, "epoch": 6715} {"train_loss": -28.05689811706543, "global_step": 557396, "epoch": 6715} {"train_loss": -28.140411376953125, "global_step": 557397, "epoch": 6715} {"train_loss": -27.87043571472168, "global_step": 557398, "epoch": 6715} {"train_loss": -27.98480796813965, "global_step": 557399, "epoch": 6715} {"train_loss": -27.827001571655273, "global_step": 557400, "epoch": 6715} {"train_loss": -27.895532608032227, "global_step": 557401, "epoch": 6715} {"train_loss": -28.03740882873535, "global_step": 557402, "epoch": 6715} {"train_loss": -28.10749626159668, "global_step": 557403, "epoch": 6715} {"train_loss": -27.94202995300293, "global_step": 557404, "epoch": 6715} {"train_loss": -27.9952392578125, "global_step": 557405, "epoch": 6715} {"train_loss": -28.086957931518555, "global_step": 557406, "epoch": 6715} {"train_loss": -28.211963653564453, "global_step": 557407, "epoch": 6715} {"train_loss": -27.920124053955078, "global_step": 557408, "epoch": 6715} {"train_loss": -27.978424072265625, "global_step": 557409, "epoch": 6715} {"train_loss": -28.29705810546875, "global_step": 557410, "epoch": 6715} {"train_loss": -27.950098037719727, "global_step": 557411, "epoch": 6715} {"train_loss": -27.93071937561035, "global_step": 557412, "epoch": 6715} {"train_loss": -27.889972686767578, "global_step": 557413, "epoch": 6715} {"train_loss": -28.051727294921875, "global_step": 557414, "epoch": 6715} {"train_loss": -28.3480224609375, "global_step": 557415, "epoch": 6715} {"train_loss": -28.022811889648438, "global_step": 557416, "epoch": 6715} {"train_loss": -27.833972930908203, "global_step": 557417, "epoch": 6715} {"train_loss": -28.046361923217773, "global_step": 557418, "epoch": 6715} {"train_loss": -27.757923126220703, "global_step": 557419, "epoch": 6715} {"train_loss": -27.515592575073242, "global_step": 557420, "epoch": 6715} {"train_loss": -27.632709503173828, "global_step": 557421, "epoch": 6715} {"train_loss": -27.020944595336914, "global_step": 557422, "epoch": 6715} {"train_loss": -26.432348251342773, "global_step": 557423, "epoch": 6715} {"train_loss": -26.9160213470459, "global_step": 557424, "epoch": 6715} {"train_loss": -27.485105514526367, "global_step": 557425, "epoch": 6715} {"train_loss": -27.07368278503418, "global_step": 557426, "epoch": 6715} {"train_loss": -27.60912152945277, "global_step": 557427, "epoch": 6715, "val_loss": 6501718.0} {"train_loss": -26.658639907836914, "global_step": 557428, "epoch": 6716} {"train_loss": -26.79548454284668, "global_step": 557429, "epoch": 6716} {"train_loss": -26.091495513916016, "global_step": 557430, "epoch": 6716} {"train_loss": -27.063068389892578, "global_step": 557431, "epoch": 6716} {"train_loss": -26.573272705078125, "global_step": 557432, "epoch": 6716} {"train_loss": -27.160425186157227, "global_step": 557433, "epoch": 6716} {"train_loss": -26.976825714111328, "global_step": 557434, "epoch": 6716} {"train_loss": -26.80201530456543, "global_step": 557435, "epoch": 6716} {"train_loss": -26.87611198425293, "global_step": 557436, "epoch": 6716} {"train_loss": -26.90827751159668, "global_step": 557437, "epoch": 6716} {"train_loss": -26.546842575073242, "global_step": 557438, "epoch": 6716} {"train_loss": -27.129968643188477, "global_step": 557439, "epoch": 6716} {"train_loss": -26.94540786743164, "global_step": 557440, "epoch": 6716} {"train_loss": -27.296533584594727, "global_step": 557441, "epoch": 6716} {"train_loss": -26.973661422729492, "global_step": 557442, "epoch": 6716} {"train_loss": -26.74880027770996, "global_step": 557443, "epoch": 6716} {"train_loss": -26.890369415283203, "global_step": 557444, "epoch": 6716} {"train_loss": -27.3082332611084, "global_step": 557445, "epoch": 6716} {"train_loss": -27.337121963500977, "global_step": 557446, "epoch": 6716} {"train_loss": -27.42584228515625, "global_step": 557447, "epoch": 6716} {"train_loss": -27.2674617767334, "global_step": 557448, "epoch": 6716} {"train_loss": -27.289648056030273, "global_step": 557449, "epoch": 6716} {"train_loss": -27.099042892456055, "global_step": 557450, "epoch": 6716} {"train_loss": -27.308917999267578, "global_step": 557451, "epoch": 6716} {"train_loss": -27.532672882080078, "global_step": 557452, "epoch": 6716} {"train_loss": -27.711669921875, "global_step": 557453, "epoch": 6716} {"train_loss": -27.4393367767334, "global_step": 557454, "epoch": 6716} {"train_loss": -27.450077056884766, "global_step": 557455, "epoch": 6716} {"train_loss": -27.508283615112305, "global_step": 557456, "epoch": 6716} {"train_loss": -27.3552303314209, "global_step": 557457, "epoch": 6716} {"train_loss": -27.610931396484375, "global_step": 557458, "epoch": 6716} {"train_loss": -27.545637130737305, "global_step": 557459, "epoch": 6716} {"train_loss": -27.72958755493164, "global_step": 557460, "epoch": 6716} {"train_loss": -27.555770874023438, "global_step": 557461, "epoch": 6716} {"train_loss": -27.620121002197266, "global_step": 557462, "epoch": 6716} {"train_loss": -28.03228759765625, "global_step": 557463, "epoch": 6716} {"train_loss": -27.9636173248291, "global_step": 557464, "epoch": 6716} {"train_loss": -27.994068145751953, "global_step": 557465, "epoch": 6716} {"train_loss": -27.70857810974121, "global_step": 557466, "epoch": 6716} {"train_loss": -28.013629913330078, "global_step": 557467, "epoch": 6716} {"train_loss": -27.58534049987793, "global_step": 557468, "epoch": 6716} {"train_loss": -27.88075828552246, "global_step": 557469, "epoch": 6716} {"train_loss": -27.718957901000977, "global_step": 557470, "epoch": 6716} {"train_loss": -27.582916259765625, "global_step": 557471, "epoch": 6716} {"train_loss": -27.581029891967773, "global_step": 557472, "epoch": 6716} {"train_loss": -27.784543991088867, "global_step": 557473, "epoch": 6716} {"train_loss": -27.688220977783203, "global_step": 557474, "epoch": 6716} {"train_loss": -28.134525299072266, "global_step": 557475, "epoch": 6716} {"train_loss": -28.02557945251465, "global_step": 557476, "epoch": 6716} {"train_loss": -27.5965633392334, "global_step": 557477, "epoch": 6716} {"train_loss": -28.122724533081055, "global_step": 557478, "epoch": 6716} {"train_loss": -28.034351348876953, "global_step": 557479, "epoch": 6716} {"train_loss": -27.921899795532227, "global_step": 557480, "epoch": 6716} {"train_loss": -27.717456817626953, "global_step": 557481, "epoch": 6716} {"train_loss": -27.943679809570312, "global_step": 557482, "epoch": 6716} {"train_loss": -28.141494750976562, "global_step": 557483, "epoch": 6716} {"train_loss": -28.26312255859375, "global_step": 557484, "epoch": 6716} {"train_loss": -28.032119750976562, "global_step": 557485, "epoch": 6716} {"train_loss": -27.9749698638916, "global_step": 557486, "epoch": 6716} {"train_loss": -27.832794189453125, "global_step": 557487, "epoch": 6716} {"train_loss": -27.622472763061523, "global_step": 557488, "epoch": 6716} {"train_loss": -27.87952995300293, "global_step": 557489, "epoch": 6716} {"train_loss": -28.089557647705078, "global_step": 557490, "epoch": 6716} {"train_loss": -27.755517959594727, "global_step": 557491, "epoch": 6716} {"train_loss": -28.051977157592773, "global_step": 557492, "epoch": 6716} {"train_loss": -28.411956787109375, "global_step": 557493, "epoch": 6716} {"train_loss": -27.70611000061035, "global_step": 557494, "epoch": 6716} {"train_loss": -27.948322296142578, "global_step": 557495, "epoch": 6716} {"train_loss": -27.816816329956055, "global_step": 557496, "epoch": 6716} {"train_loss": -28.054767608642578, "global_step": 557497, "epoch": 6716} {"train_loss": -27.67335319519043, "global_step": 557498, "epoch": 6716} {"train_loss": -27.762414932250977, "global_step": 557499, "epoch": 6716} {"train_loss": -28.135009765625, "global_step": 557500, "epoch": 6716} {"train_loss": -28.179513931274414, "global_step": 557501, "epoch": 6716} {"train_loss": -27.75166130065918, "global_step": 557502, "epoch": 6716} {"train_loss": -27.921131134033203, "global_step": 557503, "epoch": 6716} {"train_loss": -27.760711669921875, "global_step": 557504, "epoch": 6716} {"train_loss": -27.846296310424805, "global_step": 557505, "epoch": 6716} {"train_loss": -28.129566192626953, "global_step": 557506, "epoch": 6716} {"train_loss": -28.170812606811523, "global_step": 557507, "epoch": 6716} {"train_loss": -28.201766967773438, "global_step": 557508, "epoch": 6716} {"train_loss": -28.170612335205078, "global_step": 557509, "epoch": 6716} {"train_loss": -27.625681314123682, "global_step": 557510, "epoch": 6716, "val_loss": 6472080.0} {"train_loss": -27.34518814086914, "global_step": 557511, "epoch": 6717} {"train_loss": -27.388492584228516, "global_step": 557512, "epoch": 6717} {"train_loss": -27.285934448242188, "global_step": 557513, "epoch": 6717} {"train_loss": -26.791431427001953, "global_step": 557514, "epoch": 6717} {"train_loss": -25.599130630493164, "global_step": 557515, "epoch": 6717} {"train_loss": -25.11728858947754, "global_step": 557516, "epoch": 6717} {"train_loss": -26.2890625, "global_step": 557517, "epoch": 6717} {"train_loss": -25.88923454284668, "global_step": 557518, "epoch": 6717} {"train_loss": -25.602767944335938, "global_step": 557519, "epoch": 6717} {"train_loss": -26.23752212524414, "global_step": 557520, "epoch": 6717} {"train_loss": -25.493906021118164, "global_step": 557521, "epoch": 6717} {"train_loss": -26.484601974487305, "global_step": 557522, "epoch": 6717} {"train_loss": -25.940946578979492, "global_step": 557523, "epoch": 6717} {"train_loss": -26.558155059814453, "global_step": 557524, "epoch": 6717} {"train_loss": -26.413793563842773, "global_step": 557525, "epoch": 6717} {"train_loss": -26.57859230041504, "global_step": 557526, "epoch": 6717} {"train_loss": -26.4370059967041, "global_step": 557527, "epoch": 6717} {"train_loss": -27.051116943359375, "global_step": 557528, "epoch": 6717} {"train_loss": -26.77497673034668, "global_step": 557529, "epoch": 6717} {"train_loss": -26.966535568237305, "global_step": 557530, "epoch": 6717} {"train_loss": -27.054931640625, "global_step": 557531, "epoch": 6717} {"train_loss": -27.025333404541016, "global_step": 557532, "epoch": 6717} {"train_loss": -27.408283233642578, "global_step": 557533, "epoch": 6717} {"train_loss": -27.06599235534668, "global_step": 557534, "epoch": 6717} {"train_loss": -27.102951049804688, "global_step": 557535, "epoch": 6717} {"train_loss": -27.236743927001953, "global_step": 557536, "epoch": 6717} {"train_loss": -27.296588897705078, "global_step": 557537, "epoch": 6717} {"train_loss": -27.367813110351562, "global_step": 557538, "epoch": 6717} {"train_loss": -27.031055450439453, "global_step": 557539, "epoch": 6717} {"train_loss": -27.13421630859375, "global_step": 557540, "epoch": 6717} {"train_loss": -27.26491355895996, "global_step": 557541, "epoch": 6717} {"train_loss": -27.45515251159668, "global_step": 557542, "epoch": 6717} {"train_loss": -27.0905704498291, "global_step": 557543, "epoch": 6717} {"train_loss": -27.483047485351562, "global_step": 557544, "epoch": 6717} {"train_loss": -27.500446319580078, "global_step": 557545, "epoch": 6717} {"train_loss": -27.563074111938477, "global_step": 557546, "epoch": 6717} {"train_loss": -27.692707061767578, "global_step": 557547, "epoch": 6717} {"train_loss": -27.50917625427246, "global_step": 557548, "epoch": 6717} {"train_loss": -27.602069854736328, "global_step": 557549, "epoch": 6717} {"train_loss": -27.389089584350586, "global_step": 557550, "epoch": 6717} {"train_loss": -27.35536766052246, "global_step": 557551, "epoch": 6717} {"train_loss": -27.47881507873535, "global_step": 557552, "epoch": 6717} {"train_loss": -27.7060604095459, "global_step": 557553, "epoch": 6717} {"train_loss": -27.8941707611084, "global_step": 557554, "epoch": 6717} {"train_loss": -27.71588134765625, "global_step": 557555, "epoch": 6717} {"train_loss": -27.573530197143555, "global_step": 557556, "epoch": 6717} {"train_loss": -27.82373046875, "global_step": 557557, "epoch": 6717} {"train_loss": -27.957645416259766, "global_step": 557558, "epoch": 6717} {"train_loss": -27.57215690612793, "global_step": 557559, "epoch": 6717} {"train_loss": -27.88214683532715, "global_step": 557560, "epoch": 6717} {"train_loss": -27.72673988342285, "global_step": 557561, "epoch": 6717} {"train_loss": -27.9864559173584, "global_step": 557562, "epoch": 6717} {"train_loss": -27.731399536132812, "global_step": 557563, "epoch": 6717} {"train_loss": -27.591089248657227, "global_step": 557564, "epoch": 6717} {"train_loss": -27.697280883789062, "global_step": 557565, "epoch": 6717} {"train_loss": -27.821638107299805, "global_step": 557566, "epoch": 6717} {"train_loss": -27.840742111206055, "global_step": 557567, "epoch": 6717} {"train_loss": -27.906763076782227, "global_step": 557568, "epoch": 6717} {"train_loss": -27.897729873657227, "global_step": 557569, "epoch": 6717} {"train_loss": -27.758398056030273, "global_step": 557570, "epoch": 6717} {"train_loss": -28.32781410217285, "global_step": 557571, "epoch": 6717} {"train_loss": -27.98394775390625, "global_step": 557572, "epoch": 6717} {"train_loss": -27.898181915283203, "global_step": 557573, "epoch": 6717} {"train_loss": -28.162933349609375, "global_step": 557574, "epoch": 6717} {"train_loss": -28.26506996154785, "global_step": 557575, "epoch": 6717} {"train_loss": -27.907459259033203, "global_step": 557576, "epoch": 6717} {"train_loss": -28.361572265625, "global_step": 557577, "epoch": 6717} {"train_loss": -27.77789306640625, "global_step": 557578, "epoch": 6717} {"train_loss": -27.97391700744629, "global_step": 557579, "epoch": 6717} {"train_loss": -28.144269943237305, "global_step": 557580, "epoch": 6717} {"train_loss": -27.98223304748535, "global_step": 557581, "epoch": 6717} {"train_loss": -28.121809005737305, "global_step": 557582, "epoch": 6717} {"train_loss": -28.262420654296875, "global_step": 557583, "epoch": 6717} {"train_loss": -27.925344467163086, "global_step": 557584, "epoch": 6717} {"train_loss": -27.909656524658203, "global_step": 557585, "epoch": 6717} {"train_loss": -27.627904891967773, "global_step": 557586, "epoch": 6717} {"train_loss": -27.9212589263916, "global_step": 557587, "epoch": 6717} {"train_loss": -27.98626708984375, "global_step": 557588, "epoch": 6717} {"train_loss": -28.18868064880371, "global_step": 557589, "epoch": 6717} {"train_loss": -27.74875259399414, "global_step": 557590, "epoch": 6717} {"train_loss": -27.92181968688965, "global_step": 557591, "epoch": 6717} {"train_loss": -28.092443466186523, "global_step": 557592, "epoch": 6717} {"train_loss": -27.400787790137603, "global_step": 557593, "epoch": 6717, "val_loss": 6470375.0} {"train_loss": -27.43633460998535, "global_step": 557594, "epoch": 6718} {"train_loss": -27.099958419799805, "global_step": 557595, "epoch": 6718} {"train_loss": -27.5499267578125, "global_step": 557596, "epoch": 6718} {"train_loss": -27.46611976623535, "global_step": 557597, "epoch": 6718} {"train_loss": -27.401376724243164, "global_step": 557598, "epoch": 6718} {"train_loss": -27.200088500976562, "global_step": 557599, "epoch": 6718} {"train_loss": -27.336130142211914, "global_step": 557600, "epoch": 6718} {"train_loss": -27.894689559936523, "global_step": 557601, "epoch": 6718} {"train_loss": -27.619556427001953, "global_step": 557602, "epoch": 6718} {"train_loss": -26.995935440063477, "global_step": 557603, "epoch": 6718} {"train_loss": -27.956037521362305, "global_step": 557604, "epoch": 6718} {"train_loss": -27.460004806518555, "global_step": 557605, "epoch": 6718} {"train_loss": -27.595712661743164, "global_step": 557606, "epoch": 6718} {"train_loss": -26.750635147094727, "global_step": 557607, "epoch": 6718} {"train_loss": -27.64863395690918, "global_step": 557608, "epoch": 6718} {"train_loss": -27.884796142578125, "global_step": 557609, "epoch": 6718} {"train_loss": -27.587005615234375, "global_step": 557610, "epoch": 6718} {"train_loss": -27.54227638244629, "global_step": 557611, "epoch": 6718} {"train_loss": -27.584299087524414, "global_step": 557612, "epoch": 6718} {"train_loss": -27.89911460876465, "global_step": 557613, "epoch": 6718} {"train_loss": -27.830915451049805, "global_step": 557614, "epoch": 6718} {"train_loss": -27.9670352935791, "global_step": 557615, "epoch": 6718} {"train_loss": -27.383459091186523, "global_step": 557616, "epoch": 6718} {"train_loss": -27.539154052734375, "global_step": 557617, "epoch": 6718} {"train_loss": -27.520978927612305, "global_step": 557618, "epoch": 6718} {"train_loss": -27.68399429321289, "global_step": 557619, "epoch": 6718} {"train_loss": -27.71404457092285, "global_step": 557620, "epoch": 6718} {"train_loss": -27.806772232055664, "global_step": 557621, "epoch": 6718} {"train_loss": -27.899383544921875, "global_step": 557622, "epoch": 6718} {"train_loss": -27.538549423217773, "global_step": 557623, "epoch": 6718} {"train_loss": -28.087507247924805, "global_step": 557624, "epoch": 6718} {"train_loss": -27.732343673706055, "global_step": 557625, "epoch": 6718} {"train_loss": -27.877521514892578, "global_step": 557626, "epoch": 6718} {"train_loss": -27.845388412475586, "global_step": 557627, "epoch": 6718} {"train_loss": -27.810077667236328, "global_step": 557628, "epoch": 6718} {"train_loss": -28.06623649597168, "global_step": 557629, "epoch": 6718} {"train_loss": -27.94917106628418, "global_step": 557630, "epoch": 6718} {"train_loss": -27.800077438354492, "global_step": 557631, "epoch": 6718} {"train_loss": -27.64882469177246, "global_step": 557632, "epoch": 6718} {"train_loss": -27.89447593688965, "global_step": 557633, "epoch": 6718} {"train_loss": -27.475690841674805, "global_step": 557634, "epoch": 6718} {"train_loss": -27.810596466064453, "global_step": 557635, "epoch": 6718} {"train_loss": -27.6031551361084, "global_step": 557636, "epoch": 6718} {"train_loss": -28.218738555908203, "global_step": 557637, "epoch": 6718} {"train_loss": -27.60567283630371, "global_step": 557638, "epoch": 6718} {"train_loss": -27.905933380126953, "global_step": 557639, "epoch": 6718} {"train_loss": -27.455829620361328, "global_step": 557640, "epoch": 6718} {"train_loss": -27.82855224609375, "global_step": 557641, "epoch": 6718} {"train_loss": -27.853504180908203, "global_step": 557642, "epoch": 6718} {"train_loss": -27.713788986206055, "global_step": 557643, "epoch": 6718} {"train_loss": -27.738733291625977, "global_step": 557644, "epoch": 6718} {"train_loss": -27.76576042175293, "global_step": 557645, "epoch": 6718} {"train_loss": -28.035587310791016, "global_step": 557646, "epoch": 6718} {"train_loss": -27.698810577392578, "global_step": 557647, "epoch": 6718} {"train_loss": -27.76030921936035, "global_step": 557648, "epoch": 6718} {"train_loss": -27.800474166870117, "global_step": 557649, "epoch": 6718} {"train_loss": -28.147485733032227, "global_step": 557650, "epoch": 6718} {"train_loss": -28.188867568969727, "global_step": 557651, "epoch": 6718} {"train_loss": -27.45330810546875, "global_step": 557652, "epoch": 6718} {"train_loss": -27.449628829956055, "global_step": 557653, "epoch": 6718} {"train_loss": -27.413745880126953, "global_step": 557654, "epoch": 6718} {"train_loss": -27.925092697143555, "global_step": 557655, "epoch": 6718} {"train_loss": -27.269092559814453, "global_step": 557656, "epoch": 6718} {"train_loss": -27.053024291992188, "global_step": 557657, "epoch": 6718} {"train_loss": -27.598127365112305, "global_step": 557658, "epoch": 6718} {"train_loss": -27.53973388671875, "global_step": 557659, "epoch": 6718} {"train_loss": -26.748218536376953, "global_step": 557660, "epoch": 6718} {"train_loss": -26.945459365844727, "global_step": 557661, "epoch": 6718} {"train_loss": -27.82039451599121, "global_step": 557662, "epoch": 6718} {"train_loss": -27.5343074798584, "global_step": 557663, "epoch": 6718} {"train_loss": -27.395435333251953, "global_step": 557664, "epoch": 6718} {"train_loss": -27.328887939453125, "global_step": 557665, "epoch": 6718} {"train_loss": -27.6739559173584, "global_step": 557666, "epoch": 6718} {"train_loss": -27.352313995361328, "global_step": 557667, "epoch": 6718} {"train_loss": -27.359542846679688, "global_step": 557668, "epoch": 6718} {"train_loss": -27.641538619995117, "global_step": 557669, "epoch": 6718} {"train_loss": -27.324462890625, "global_step": 557670, "epoch": 6718} {"train_loss": -27.534534454345703, "global_step": 557671, "epoch": 6718} {"train_loss": -28.00836753845215, "global_step": 557672, "epoch": 6718} {"train_loss": -27.726953506469727, "global_step": 557673, "epoch": 6718} {"train_loss": -27.774505615234375, "global_step": 557674, "epoch": 6718} {"train_loss": -27.8535099029541, "global_step": 557675, "epoch": 6718} {"train_loss": -27.634204818541747, "global_step": 557676, "epoch": 6718, "val_loss": 6512534.5} {"train_loss": -27.350360870361328, "global_step": 557677, "epoch": 6719} {"train_loss": -26.696521759033203, "global_step": 557678, "epoch": 6719} {"train_loss": -27.109128952026367, "global_step": 557679, "epoch": 6719} {"train_loss": -26.781967163085938, "global_step": 557680, "epoch": 6719} {"train_loss": -26.974462509155273, "global_step": 557681, "epoch": 6719} {"train_loss": -27.163679122924805, "global_step": 557682, "epoch": 6719} {"train_loss": -27.67764663696289, "global_step": 557683, "epoch": 6719} {"train_loss": -27.097570419311523, "global_step": 557684, "epoch": 6719} {"train_loss": -27.399036407470703, "global_step": 557685, "epoch": 6719} {"train_loss": -27.3829345703125, "global_step": 557686, "epoch": 6719} {"train_loss": -26.86676025390625, "global_step": 557687, "epoch": 6719} {"train_loss": -27.417768478393555, "global_step": 557688, "epoch": 6719} {"train_loss": -27.4080810546875, "global_step": 557689, "epoch": 6719} {"train_loss": -27.179101943969727, "global_step": 557690, "epoch": 6719} {"train_loss": -27.487140655517578, "global_step": 557691, "epoch": 6719} {"train_loss": -27.035369873046875, "global_step": 557692, "epoch": 6719} {"train_loss": -27.261377334594727, "global_step": 557693, "epoch": 6719} {"train_loss": -27.425567626953125, "global_step": 557694, "epoch": 6719} {"train_loss": -27.421741485595703, "global_step": 557695, "epoch": 6719} {"train_loss": -27.494129180908203, "global_step": 557696, "epoch": 6719} {"train_loss": -27.35236930847168, "global_step": 557697, "epoch": 6719} {"train_loss": -27.58831214904785, "global_step": 557698, "epoch": 6719} {"train_loss": -27.63815689086914, "global_step": 557699, "epoch": 6719} {"train_loss": -27.27387046813965, "global_step": 557700, "epoch": 6719} {"train_loss": -27.343408584594727, "global_step": 557701, "epoch": 6719} {"train_loss": -27.484975814819336, "global_step": 557702, "epoch": 6719} {"train_loss": -27.503808975219727, "global_step": 557703, "epoch": 6719} {"train_loss": -27.552892684936523, "global_step": 557704, "epoch": 6719} {"train_loss": -27.78545570373535, "global_step": 557705, "epoch": 6719} {"train_loss": -27.647916793823242, "global_step": 557706, "epoch": 6719} {"train_loss": -27.599319458007812, "global_step": 557707, "epoch": 6719} {"train_loss": -28.067346572875977, "global_step": 557708, "epoch": 6719} {"train_loss": -27.37171745300293, "global_step": 557709, "epoch": 6719} {"train_loss": -28.273147583007812, "global_step": 557710, "epoch": 6719} {"train_loss": -27.745319366455078, "global_step": 557711, "epoch": 6719} {"train_loss": -27.609655380249023, "global_step": 557712, "epoch": 6719} {"train_loss": -27.82021141052246, "global_step": 557713, "epoch": 6719} {"train_loss": -27.775379180908203, "global_step": 557714, "epoch": 6719} {"train_loss": -27.70014762878418, "global_step": 557715, "epoch": 6719} {"train_loss": -27.79084587097168, "global_step": 557716, "epoch": 6719} {"train_loss": -28.228118896484375, "global_step": 557717, "epoch": 6719} {"train_loss": -27.5073299407959, "global_step": 557718, "epoch": 6719} {"train_loss": -27.707324981689453, "global_step": 557719, "epoch": 6719} {"train_loss": -27.251434326171875, "global_step": 557720, "epoch": 6719} {"train_loss": -27.85222816467285, "global_step": 557721, "epoch": 6719} {"train_loss": -27.656726837158203, "global_step": 557722, "epoch": 6719} {"train_loss": -28.037296295166016, "global_step": 557723, "epoch": 6719} {"train_loss": -28.12798500061035, "global_step": 557724, "epoch": 6719} {"train_loss": -28.309972763061523, "global_step": 557725, "epoch": 6719} {"train_loss": -27.886606216430664, "global_step": 557726, "epoch": 6719} {"train_loss": -27.912092208862305, "global_step": 557727, "epoch": 6719} {"train_loss": -27.624271392822266, "global_step": 557728, "epoch": 6719} {"train_loss": -28.147809982299805, "global_step": 557729, "epoch": 6719} {"train_loss": -27.705564498901367, "global_step": 557730, "epoch": 6719} {"train_loss": -28.14243507385254, "global_step": 557731, "epoch": 6719} {"train_loss": -28.30194664001465, "global_step": 557732, "epoch": 6719} {"train_loss": -27.996137619018555, "global_step": 557733, "epoch": 6719} {"train_loss": -28.214893341064453, "global_step": 557734, "epoch": 6719} {"train_loss": -27.7829532623291, "global_step": 557735, "epoch": 6719} {"train_loss": -27.645471572875977, "global_step": 557736, "epoch": 6719} {"train_loss": -28.19415855407715, "global_step": 557737, "epoch": 6719} {"train_loss": -27.80600357055664, "global_step": 557738, "epoch": 6719} {"train_loss": -27.917646408081055, "global_step": 557739, "epoch": 6719} {"train_loss": -27.744352340698242, "global_step": 557740, "epoch": 6719} {"train_loss": -27.94086265563965, "global_step": 557741, "epoch": 6719} {"train_loss": -27.603778839111328, "global_step": 557742, "epoch": 6719} {"train_loss": -28.126483917236328, "global_step": 557743, "epoch": 6719} {"train_loss": -28.12061882019043, "global_step": 557744, "epoch": 6719} {"train_loss": -28.184370040893555, "global_step": 557745, "epoch": 6719} {"train_loss": -27.99665641784668, "global_step": 557746, "epoch": 6719} {"train_loss": -27.443769454956055, "global_step": 557747, "epoch": 6719} {"train_loss": -27.8255558013916, "global_step": 557748, "epoch": 6719} {"train_loss": -28.119535446166992, "global_step": 557749, "epoch": 6719} {"train_loss": -27.801589965820312, "global_step": 557750, "epoch": 6719} {"train_loss": -27.94022560119629, "global_step": 557751, "epoch": 6719} {"train_loss": -28.139633178710938, "global_step": 557752, "epoch": 6719} {"train_loss": -27.946319580078125, "global_step": 557753, "epoch": 6719} {"train_loss": -27.488479614257812, "global_step": 557754, "epoch": 6719} {"train_loss": -27.824941635131836, "global_step": 557755, "epoch": 6719} {"train_loss": -27.858264923095703, "global_step": 557756, "epoch": 6719} {"train_loss": -28.044376373291016, "global_step": 557757, "epoch": 6719} {"train_loss": -27.926422119140625, "global_step": 557758, "epoch": 6719} {"train_loss": -27.695020882480115, "global_step": 557759, "epoch": 6719, "val_loss": 6520052.0} {"train_loss": -26.792688369750977, "global_step": 557760, "epoch": 6720} {"train_loss": -26.820295333862305, "global_step": 557761, "epoch": 6720} {"train_loss": -27.025930404663086, "global_step": 557762, "epoch": 6720} {"train_loss": -26.98395347595215, "global_step": 557763, "epoch": 6720} {"train_loss": -26.424854278564453, "global_step": 557764, "epoch": 6720} {"train_loss": -27.13393211364746, "global_step": 557765, "epoch": 6720} {"train_loss": -27.245452880859375, "global_step": 557766, "epoch": 6720} {"train_loss": -27.169296264648438, "global_step": 557767, "epoch": 6720} {"train_loss": -26.466476440429688, "global_step": 557768, "epoch": 6720} {"train_loss": -26.924060821533203, "global_step": 557769, "epoch": 6720} {"train_loss": -26.9847412109375, "global_step": 557770, "epoch": 6720} {"train_loss": -26.96466636657715, "global_step": 557771, "epoch": 6720} {"train_loss": -27.167097091674805, "global_step": 557772, "epoch": 6720} {"train_loss": -27.70432472229004, "global_step": 557773, "epoch": 6720} {"train_loss": -27.516321182250977, "global_step": 557774, "epoch": 6720} {"train_loss": -27.468595504760742, "global_step": 557775, "epoch": 6720} {"train_loss": -27.37837028503418, "global_step": 557776, "epoch": 6720} {"train_loss": -27.658267974853516, "global_step": 557777, "epoch": 6720} {"train_loss": -27.49897575378418, "global_step": 557778, "epoch": 6720} {"train_loss": -27.62129020690918, "global_step": 557779, "epoch": 6720} {"train_loss": -27.385822296142578, "global_step": 557780, "epoch": 6720} {"train_loss": -27.63762855529785, "global_step": 557781, "epoch": 6720} {"train_loss": -27.478595733642578, "global_step": 557782, "epoch": 6720} {"train_loss": -27.314001083374023, "global_step": 557783, "epoch": 6720} {"train_loss": -27.696191787719727, "global_step": 557784, "epoch": 6720} {"train_loss": -27.710498809814453, "global_step": 557785, "epoch": 6720} {"train_loss": -27.819965362548828, "global_step": 557786, "epoch": 6720} {"train_loss": -27.546396255493164, "global_step": 557787, "epoch": 6720} {"train_loss": -27.7525634765625, "global_step": 557788, "epoch": 6720} {"train_loss": -27.53291893005371, "global_step": 557789, "epoch": 6720} {"train_loss": -27.98404312133789, "global_step": 557790, "epoch": 6720} {"train_loss": -27.581811904907227, "global_step": 557791, "epoch": 6720} {"train_loss": -27.774511337280273, "global_step": 557792, "epoch": 6720} {"train_loss": -27.635679244995117, "global_step": 557793, "epoch": 6720} {"train_loss": -27.655027389526367, "global_step": 557794, "epoch": 6720} {"train_loss": -27.835742950439453, "global_step": 557795, "epoch": 6720} {"train_loss": -28.133115768432617, "global_step": 557796, "epoch": 6720} {"train_loss": -27.5839900970459, "global_step": 557797, "epoch": 6720} {"train_loss": -27.874073028564453, "global_step": 557798, "epoch": 6720} {"train_loss": -28.0955810546875, "global_step": 557799, "epoch": 6720} {"train_loss": -27.81243896484375, "global_step": 557800, "epoch": 6720} {"train_loss": -27.757253646850586, "global_step": 557801, "epoch": 6720} {"train_loss": -27.758214950561523, "global_step": 557802, "epoch": 6720} {"train_loss": -27.94880485534668, "global_step": 557803, "epoch": 6720} {"train_loss": -27.9638729095459, "global_step": 557804, "epoch": 6720} {"train_loss": -28.010129928588867, "global_step": 557805, "epoch": 6720} {"train_loss": -28.271371841430664, "global_step": 557806, "epoch": 6720} {"train_loss": -27.888158798217773, "global_step": 557807, "epoch": 6720} {"train_loss": -28.225866317749023, "global_step": 557808, "epoch": 6720} {"train_loss": -27.69929313659668, "global_step": 557809, "epoch": 6720} {"train_loss": -28.181060791015625, "global_step": 557810, "epoch": 6720} {"train_loss": -27.95831871032715, "global_step": 557811, "epoch": 6720} {"train_loss": -27.958356857299805, "global_step": 557812, "epoch": 6720} {"train_loss": -28.363019943237305, "global_step": 557813, "epoch": 6720} {"train_loss": -27.9774169921875, "global_step": 557814, "epoch": 6720} {"train_loss": -28.132822036743164, "global_step": 557815, "epoch": 6720} {"train_loss": -28.028064727783203, "global_step": 557816, "epoch": 6720} {"train_loss": -28.121267318725586, "global_step": 557817, "epoch": 6720} {"train_loss": -27.785696029663086, "global_step": 557818, "epoch": 6720} {"train_loss": -28.013477325439453, "global_step": 557819, "epoch": 6720} {"train_loss": -28.31492042541504, "global_step": 557820, "epoch": 6720} {"train_loss": -27.933385848999023, "global_step": 557821, "epoch": 6720} {"train_loss": -27.563674926757812, "global_step": 557822, "epoch": 6720} {"train_loss": -27.928266525268555, "global_step": 557823, "epoch": 6720} {"train_loss": -27.805288314819336, "global_step": 557824, "epoch": 6720} {"train_loss": -27.29871940612793, "global_step": 557825, "epoch": 6720} {"train_loss": -26.9936580657959, "global_step": 557826, "epoch": 6720} {"train_loss": -26.814334869384766, "global_step": 557827, "epoch": 6720} {"train_loss": -26.85264015197754, "global_step": 557828, "epoch": 6720} {"train_loss": -27.72965431213379, "global_step": 557829, "epoch": 6720} {"train_loss": -27.63165855407715, "global_step": 557830, "epoch": 6720} {"train_loss": -27.40398597717285, "global_step": 557831, "epoch": 6720} {"train_loss": -27.123615264892578, "global_step": 557832, "epoch": 6720} {"train_loss": -27.335437774658203, "global_step": 557833, "epoch": 6720} {"train_loss": -27.5990047454834, "global_step": 557834, "epoch": 6720} {"train_loss": -27.712305068969727, "global_step": 557835, "epoch": 6720} {"train_loss": -27.388355255126953, "global_step": 557836, "epoch": 6720} {"train_loss": -27.76300621032715, "global_step": 557837, "epoch": 6720} {"train_loss": -27.705020904541016, "global_step": 557838, "epoch": 6720} {"train_loss": -27.556650161743164, "global_step": 557839, "epoch": 6720} {"train_loss": -27.85603904724121, "global_step": 557840, "epoch": 6720} {"train_loss": -27.493494033813477, "global_step": 557841, "epoch": 6720} {"train_loss": -27.578734708119587, "global_step": 557842, "epoch": 6720, "val_loss": 6500231.0} {"train_loss": -27.364856719970703, "global_step": 557843, "epoch": 6721} {"train_loss": -27.76202964782715, "global_step": 557844, "epoch": 6721} {"train_loss": -27.185455322265625, "global_step": 557845, "epoch": 6721} {"train_loss": -27.711774826049805, "global_step": 557846, "epoch": 6721} {"train_loss": -27.16010856628418, "global_step": 557847, "epoch": 6721} {"train_loss": -27.287389755249023, "global_step": 557848, "epoch": 6721} {"train_loss": -27.224369049072266, "global_step": 557849, "epoch": 6721} {"train_loss": -27.51704216003418, "global_step": 557850, "epoch": 6721} {"train_loss": -27.373022079467773, "global_step": 557851, "epoch": 6721} {"train_loss": -27.340871810913086, "global_step": 557852, "epoch": 6721} {"train_loss": -27.807031631469727, "global_step": 557853, "epoch": 6721} {"train_loss": -27.455896377563477, "global_step": 557854, "epoch": 6721} {"train_loss": -27.7025089263916, "global_step": 557855, "epoch": 6721} {"train_loss": -27.259769439697266, "global_step": 557856, "epoch": 6721} {"train_loss": -27.3243350982666, "global_step": 557857, "epoch": 6721} {"train_loss": -27.609649658203125, "global_step": 557858, "epoch": 6721} {"train_loss": -27.09799575805664, "global_step": 557859, "epoch": 6721} {"train_loss": -27.24312400817871, "global_step": 557860, "epoch": 6721} {"train_loss": -27.844074249267578, "global_step": 557861, "epoch": 6721} {"train_loss": -27.352529525756836, "global_step": 557862, "epoch": 6721} {"train_loss": -27.52992820739746, "global_step": 557863, "epoch": 6721} {"train_loss": -27.307907104492188, "global_step": 557864, "epoch": 6721} {"train_loss": -27.2322940826416, "global_step": 557865, "epoch": 6721} {"train_loss": -27.634916305541992, "global_step": 557866, "epoch": 6721} {"train_loss": -27.64118003845215, "global_step": 557867, "epoch": 6721} {"train_loss": -27.543134689331055, "global_step": 557868, "epoch": 6721} {"train_loss": -27.908863067626953, "global_step": 557869, "epoch": 6721} {"train_loss": -27.498645782470703, "global_step": 557870, "epoch": 6721} {"train_loss": -27.704944610595703, "global_step": 557871, "epoch": 6721} {"train_loss": -27.698532104492188, "global_step": 557872, "epoch": 6721} {"train_loss": -27.47434425354004, "global_step": 557873, "epoch": 6721} {"train_loss": -27.8126163482666, "global_step": 557874, "epoch": 6721} {"train_loss": -27.419824600219727, "global_step": 557875, "epoch": 6721} {"train_loss": -28.106725692749023, "global_step": 557876, "epoch": 6721} {"train_loss": -27.580480575561523, "global_step": 557877, "epoch": 6721} {"train_loss": -27.598377227783203, "global_step": 557878, "epoch": 6721} {"train_loss": -27.870107650756836, "global_step": 557879, "epoch": 6721} {"train_loss": -27.712188720703125, "global_step": 557880, "epoch": 6721} {"train_loss": -27.9447021484375, "global_step": 557881, "epoch": 6721} {"train_loss": -27.97968864440918, "global_step": 557882, "epoch": 6721} {"train_loss": -27.896581649780273, "global_step": 557883, "epoch": 6721} {"train_loss": -27.777545928955078, "global_step": 557884, "epoch": 6721} {"train_loss": -27.84758949279785, "global_step": 557885, "epoch": 6721} {"train_loss": -27.651611328125, "global_step": 557886, "epoch": 6721} {"train_loss": -27.779409408569336, "global_step": 557887, "epoch": 6721} {"train_loss": -27.9372615814209, "global_step": 557888, "epoch": 6721} {"train_loss": -27.561141967773438, "global_step": 557889, "epoch": 6721} {"train_loss": -28.041345596313477, "global_step": 557890, "epoch": 6721} {"train_loss": -27.92622947692871, "global_step": 557891, "epoch": 6721} {"train_loss": -27.977502822875977, "global_step": 557892, "epoch": 6721} {"train_loss": -28.071218490600586, "global_step": 557893, "epoch": 6721} {"train_loss": -28.23404312133789, "global_step": 557894, "epoch": 6721} {"train_loss": -27.980667114257812, "global_step": 557895, "epoch": 6721} {"train_loss": -27.927387237548828, "global_step": 557896, "epoch": 6721} {"train_loss": -28.024946212768555, "global_step": 557897, "epoch": 6721} {"train_loss": -28.094247817993164, "global_step": 557898, "epoch": 6721} {"train_loss": -28.021076202392578, "global_step": 557899, "epoch": 6721} {"train_loss": -27.948755264282227, "global_step": 557900, "epoch": 6721} {"train_loss": -28.12941551208496, "global_step": 557901, "epoch": 6721} {"train_loss": -27.690149307250977, "global_step": 557902, "epoch": 6721} {"train_loss": -27.76910972595215, "global_step": 557903, "epoch": 6721} {"train_loss": -27.480573654174805, "global_step": 557904, "epoch": 6721} {"train_loss": -27.924213409423828, "global_step": 557905, "epoch": 6721} {"train_loss": -28.087888717651367, "global_step": 557906, "epoch": 6721} {"train_loss": -27.82996940612793, "global_step": 557907, "epoch": 6721} {"train_loss": -27.7379207611084, "global_step": 557908, "epoch": 6721} {"train_loss": -27.815046310424805, "global_step": 557909, "epoch": 6721} {"train_loss": -27.597482681274414, "global_step": 557910, "epoch": 6721} {"train_loss": -27.188928604125977, "global_step": 557911, "epoch": 6721} {"train_loss": -27.715682983398438, "global_step": 557912, "epoch": 6721} {"train_loss": -27.746641159057617, "global_step": 557913, "epoch": 6721} {"train_loss": -27.821563720703125, "global_step": 557914, "epoch": 6721} {"train_loss": -27.99769401550293, "global_step": 557915, "epoch": 6721} {"train_loss": -27.884973526000977, "global_step": 557916, "epoch": 6721} {"train_loss": -27.739301681518555, "global_step": 557917, "epoch": 6721} {"train_loss": -27.683454513549805, "global_step": 557918, "epoch": 6721} {"train_loss": -27.415363311767578, "global_step": 557919, "epoch": 6721} {"train_loss": -27.888708114624023, "global_step": 557920, "epoch": 6721} {"train_loss": -27.736753463745117, "global_step": 557921, "epoch": 6721} {"train_loss": -27.634740829467773, "global_step": 557922, "epoch": 6721} {"train_loss": -27.519912719726562, "global_step": 557923, "epoch": 6721} {"train_loss": -27.581836700439453, "global_step": 557924, "epoch": 6721} {"train_loss": -27.692397818507917, "global_step": 557925, "epoch": 6721, "val_loss": 6505879.5} {"train_loss": -27.45136833190918, "global_step": 557926, "epoch": 6722} {"train_loss": -27.082555770874023, "global_step": 557927, "epoch": 6722} {"train_loss": -26.99293327331543, "global_step": 557928, "epoch": 6722} {"train_loss": -27.2794189453125, "global_step": 557929, "epoch": 6722} {"train_loss": -27.50912857055664, "global_step": 557930, "epoch": 6722} {"train_loss": -27.53285026550293, "global_step": 557931, "epoch": 6722} {"train_loss": -27.174802780151367, "global_step": 557932, "epoch": 6722} {"train_loss": -27.457059860229492, "global_step": 557933, "epoch": 6722} {"train_loss": -27.26601219177246, "global_step": 557934, "epoch": 6722} {"train_loss": -27.417224884033203, "global_step": 557935, "epoch": 6722} {"train_loss": -27.613737106323242, "global_step": 557936, "epoch": 6722} {"train_loss": -27.51462745666504, "global_step": 557937, "epoch": 6722} {"train_loss": -27.7048282623291, "global_step": 557938, "epoch": 6722} {"train_loss": -27.531707763671875, "global_step": 557939, "epoch": 6722} {"train_loss": -27.623815536499023, "global_step": 557940, "epoch": 6722} {"train_loss": -27.860376358032227, "global_step": 557941, "epoch": 6722} {"train_loss": -27.659345626831055, "global_step": 557942, "epoch": 6722} {"train_loss": -27.820653915405273, "global_step": 557943, "epoch": 6722} {"train_loss": -27.812665939331055, "global_step": 557944, "epoch": 6722} {"train_loss": -27.66533851623535, "global_step": 557945, "epoch": 6722} {"train_loss": -27.83306884765625, "global_step": 557946, "epoch": 6722} {"train_loss": -27.841154098510742, "global_step": 557947, "epoch": 6722} {"train_loss": -27.917875289916992, "global_step": 557948, "epoch": 6722} {"train_loss": -28.1370906829834, "global_step": 557949, "epoch": 6722} {"train_loss": -27.4853515625, "global_step": 557950, "epoch": 6722} {"train_loss": -27.80964469909668, "global_step": 557951, "epoch": 6722} {"train_loss": -27.789886474609375, "global_step": 557952, "epoch": 6722} {"train_loss": -27.701074600219727, "global_step": 557953, "epoch": 6722} {"train_loss": -28.00531005859375, "global_step": 557954, "epoch": 6722} {"train_loss": -28.003467559814453, "global_step": 557955, "epoch": 6722} {"train_loss": -28.33540153503418, "global_step": 557956, "epoch": 6722} {"train_loss": -27.71539878845215, "global_step": 557957, "epoch": 6722} {"train_loss": -27.771406173706055, "global_step": 557958, "epoch": 6722} {"train_loss": -27.782861709594727, "global_step": 557959, "epoch": 6722} {"train_loss": -27.915491104125977, "global_step": 557960, "epoch": 6722} {"train_loss": -28.16998863220215, "global_step": 557961, "epoch": 6722} {"train_loss": -27.934497833251953, "global_step": 557962, "epoch": 6722} {"train_loss": -28.012475967407227, "global_step": 557963, "epoch": 6722} {"train_loss": -27.99652099609375, "global_step": 557964, "epoch": 6722} {"train_loss": -27.922760009765625, "global_step": 557965, "epoch": 6722} {"train_loss": -28.17439079284668, "global_step": 557966, "epoch": 6722} {"train_loss": -28.025686264038086, "global_step": 557967, "epoch": 6722} {"train_loss": -27.86673927307129, "global_step": 557968, "epoch": 6722} {"train_loss": -27.925992965698242, "global_step": 557969, "epoch": 6722} {"train_loss": -28.0465145111084, "global_step": 557970, "epoch": 6722} {"train_loss": -27.8502254486084, "global_step": 557971, "epoch": 6722} {"train_loss": -27.861806869506836, "global_step": 557972, "epoch": 6722} {"train_loss": -28.040729522705078, "global_step": 557973, "epoch": 6722} {"train_loss": -27.8631649017334, "global_step": 557974, "epoch": 6722} {"train_loss": -28.151443481445312, "global_step": 557975, "epoch": 6722} {"train_loss": -28.068817138671875, "global_step": 557976, "epoch": 6722} {"train_loss": -27.931249618530273, "global_step": 557977, "epoch": 6722} {"train_loss": -27.7880859375, "global_step": 557978, "epoch": 6722} {"train_loss": -27.974933624267578, "global_step": 557979, "epoch": 6722} {"train_loss": -27.918231964111328, "global_step": 557980, "epoch": 6722} {"train_loss": -27.584823608398438, "global_step": 557981, "epoch": 6722} {"train_loss": -27.46233558654785, "global_step": 557982, "epoch": 6722} {"train_loss": -27.0772762298584, "global_step": 557983, "epoch": 6722} {"train_loss": -27.3425350189209, "global_step": 557984, "epoch": 6722} {"train_loss": -27.39727210998535, "global_step": 557985, "epoch": 6722} {"train_loss": -27.81252098083496, "global_step": 557986, "epoch": 6722} {"train_loss": -27.822702407836914, "global_step": 557987, "epoch": 6722} {"train_loss": -28.044248580932617, "global_step": 557988, "epoch": 6722} {"train_loss": -27.933645248413086, "global_step": 557989, "epoch": 6722} {"train_loss": -27.706329345703125, "global_step": 557990, "epoch": 6722} {"train_loss": -27.617694854736328, "global_step": 557991, "epoch": 6722} {"train_loss": -26.296308517456055, "global_step": 557992, "epoch": 6722} {"train_loss": -26.10615348815918, "global_step": 557993, "epoch": 6722} {"train_loss": -27.23552894592285, "global_step": 557994, "epoch": 6722} {"train_loss": -27.62335777282715, "global_step": 557995, "epoch": 6722} {"train_loss": -27.457666397094727, "global_step": 557996, "epoch": 6722} {"train_loss": -27.09856605529785, "global_step": 557997, "epoch": 6722} {"train_loss": -27.331995010375977, "global_step": 557998, "epoch": 6722} {"train_loss": -27.48261833190918, "global_step": 557999, "epoch": 6722} {"train_loss": -27.660131454467773, "global_step": 558000, "epoch": 6722} {"train_loss": -27.147968292236328, "global_step": 558001, "epoch": 6722} {"train_loss": -27.578821182250977, "global_step": 558002, "epoch": 6722} {"train_loss": -27.33052635192871, "global_step": 558003, "epoch": 6722} {"train_loss": -27.004444122314453, "global_step": 558004, "epoch": 6722} {"train_loss": -27.541183471679688, "global_step": 558005, "epoch": 6722} {"train_loss": -27.54157066345215, "global_step": 558006, "epoch": 6722} {"train_loss": -27.513586044311523, "global_step": 558007, "epoch": 6722} {"train_loss": -27.636152681097926, "global_step": 558008, "epoch": 6722, "val_loss": 6477494.5} {"train_loss": -27.032392501831055, "global_step": 558009, "epoch": 6723} {"train_loss": -27.50071144104004, "global_step": 558010, "epoch": 6723} {"train_loss": -27.4312801361084, "global_step": 558011, "epoch": 6723} {"train_loss": -27.216983795166016, "global_step": 558012, "epoch": 6723} {"train_loss": -27.77338218688965, "global_step": 558013, "epoch": 6723} {"train_loss": -27.27350425720215, "global_step": 558014, "epoch": 6723} {"train_loss": -27.411605834960938, "global_step": 558015, "epoch": 6723} {"train_loss": -27.70000648498535, "global_step": 558016, "epoch": 6723} {"train_loss": -27.3193416595459, "global_step": 558017, "epoch": 6723} {"train_loss": -27.304706573486328, "global_step": 558018, "epoch": 6723} {"train_loss": -27.174732208251953, "global_step": 558019, "epoch": 6723} {"train_loss": -27.298131942749023, "global_step": 558020, "epoch": 6723} {"train_loss": -27.159086227416992, "global_step": 558021, "epoch": 6723} {"train_loss": -27.56092643737793, "global_step": 558022, "epoch": 6723} {"train_loss": -27.54506492614746, "global_step": 558023, "epoch": 6723} {"train_loss": -27.82405662536621, "global_step": 558024, "epoch": 6723} {"train_loss": -27.557361602783203, "global_step": 558025, "epoch": 6723} {"train_loss": -27.759626388549805, "global_step": 558026, "epoch": 6723} {"train_loss": -27.741262435913086, "global_step": 558027, "epoch": 6723} {"train_loss": -27.483755111694336, "global_step": 558028, "epoch": 6723} {"train_loss": -27.535505294799805, "global_step": 558029, "epoch": 6723} {"train_loss": -27.8230037689209, "global_step": 558030, "epoch": 6723} {"train_loss": -27.492029190063477, "global_step": 558031, "epoch": 6723} {"train_loss": -27.940977096557617, "global_step": 558032, "epoch": 6723} {"train_loss": -27.74720573425293, "global_step": 558033, "epoch": 6723} {"train_loss": -28.15399169921875, "global_step": 558034, "epoch": 6723} {"train_loss": -27.598102569580078, "global_step": 558035, "epoch": 6723} {"train_loss": -27.684656143188477, "global_step": 558036, "epoch": 6723} {"train_loss": -27.850858688354492, "global_step": 558037, "epoch": 6723} {"train_loss": -27.922948837280273, "global_step": 558038, "epoch": 6723} {"train_loss": -27.63872718811035, "global_step": 558039, "epoch": 6723} {"train_loss": -27.70005226135254, "global_step": 558040, "epoch": 6723} {"train_loss": -27.924055099487305, "global_step": 558041, "epoch": 6723} {"train_loss": -28.030792236328125, "global_step": 558042, "epoch": 6723} {"train_loss": -27.994993209838867, "global_step": 558043, "epoch": 6723} {"train_loss": -27.595706939697266, "global_step": 558044, "epoch": 6723} {"train_loss": -28.067968368530273, "global_step": 558045, "epoch": 6723} {"train_loss": -27.755584716796875, "global_step": 558046, "epoch": 6723} {"train_loss": -27.651901245117188, "global_step": 558047, "epoch": 6723} {"train_loss": -28.056079864501953, "global_step": 558048, "epoch": 6723} {"train_loss": -27.7691650390625, "global_step": 558049, "epoch": 6723} {"train_loss": -27.70650291442871, "global_step": 558050, "epoch": 6723} {"train_loss": -27.632781982421875, "global_step": 558051, "epoch": 6723} {"train_loss": -27.596960067749023, "global_step": 558052, "epoch": 6723} {"train_loss": -27.38702964782715, "global_step": 558053, "epoch": 6723} {"train_loss": -27.852453231811523, "global_step": 558054, "epoch": 6723} {"train_loss": -27.833984375, "global_step": 558055, "epoch": 6723} {"train_loss": -27.775516510009766, "global_step": 558056, "epoch": 6723} {"train_loss": -28.2128963470459, "global_step": 558057, "epoch": 6723} {"train_loss": -27.969812393188477, "global_step": 558058, "epoch": 6723} {"train_loss": -27.59515953063965, "global_step": 558059, "epoch": 6723} {"train_loss": -27.69699478149414, "global_step": 558060, "epoch": 6723} {"train_loss": -27.860504150390625, "global_step": 558061, "epoch": 6723} {"train_loss": -27.9791259765625, "global_step": 558062, "epoch": 6723} {"train_loss": -27.389495849609375, "global_step": 558063, "epoch": 6723} {"train_loss": -27.372272491455078, "global_step": 558064, "epoch": 6723} {"train_loss": -27.807626724243164, "global_step": 558065, "epoch": 6723} {"train_loss": -27.7359676361084, "global_step": 558066, "epoch": 6723} {"train_loss": -27.430683135986328, "global_step": 558067, "epoch": 6723} {"train_loss": -27.512449264526367, "global_step": 558068, "epoch": 6723} {"train_loss": -27.31501579284668, "global_step": 558069, "epoch": 6723} {"train_loss": -27.95745849609375, "global_step": 558070, "epoch": 6723} {"train_loss": -27.920461654663086, "global_step": 558071, "epoch": 6723} {"train_loss": -27.66431999206543, "global_step": 558072, "epoch": 6723} {"train_loss": -27.829721450805664, "global_step": 558073, "epoch": 6723} {"train_loss": -27.44061279296875, "global_step": 558074, "epoch": 6723} {"train_loss": -27.824682235717773, "global_step": 558075, "epoch": 6723} {"train_loss": -27.53852653503418, "global_step": 558076, "epoch": 6723} {"train_loss": -27.093494415283203, "global_step": 558077, "epoch": 6723} {"train_loss": -27.63985252380371, "global_step": 558078, "epoch": 6723} {"train_loss": -27.8775634765625, "global_step": 558079, "epoch": 6723} {"train_loss": -27.443761825561523, "global_step": 558080, "epoch": 6723} {"train_loss": -28.004568099975586, "global_step": 558081, "epoch": 6723} {"train_loss": -27.60602378845215, "global_step": 558082, "epoch": 6723} {"train_loss": -27.237302780151367, "global_step": 558083, "epoch": 6723} {"train_loss": -27.76104164123535, "global_step": 558084, "epoch": 6723} {"train_loss": -27.538482666015625, "global_step": 558085, "epoch": 6723} {"train_loss": -27.8608455657959, "global_step": 558086, "epoch": 6723} {"train_loss": -27.778547286987305, "global_step": 558087, "epoch": 6723} {"train_loss": -27.85140037536621, "global_step": 558088, "epoch": 6723} {"train_loss": -27.78974723815918, "global_step": 558089, "epoch": 6723} {"train_loss": -27.65778923034668, "global_step": 558090, "epoch": 6723} {"train_loss": -27.665113586977302, "global_step": 558091, "epoch": 6723, "val_loss": 6482682.0} {"train_loss": -26.010547637939453, "global_step": 558092, "epoch": 6724} {"train_loss": -27.7435359954834, "global_step": 558093, "epoch": 6724} {"train_loss": -27.37239646911621, "global_step": 558094, "epoch": 6724} {"train_loss": -27.245080947875977, "global_step": 558095, "epoch": 6724} {"train_loss": -27.377277374267578, "global_step": 558096, "epoch": 6724} {"train_loss": -26.95583152770996, "global_step": 558097, "epoch": 6724} {"train_loss": -27.51002311706543, "global_step": 558098, "epoch": 6724} {"train_loss": -27.170358657836914, "global_step": 558099, "epoch": 6724} {"train_loss": -27.321701049804688, "global_step": 558100, "epoch": 6724} {"train_loss": -26.996597290039062, "global_step": 558101, "epoch": 6724} {"train_loss": -27.639657974243164, "global_step": 558102, "epoch": 6724} {"train_loss": -27.53018569946289, "global_step": 558103, "epoch": 6724} {"train_loss": -27.423410415649414, "global_step": 558104, "epoch": 6724} {"train_loss": -27.699399948120117, "global_step": 558105, "epoch": 6724} {"train_loss": -27.53834342956543, "global_step": 558106, "epoch": 6724} {"train_loss": -27.459070205688477, "global_step": 558107, "epoch": 6724} {"train_loss": -27.232391357421875, "global_step": 558108, "epoch": 6724} {"train_loss": -27.52593421936035, "global_step": 558109, "epoch": 6724} {"train_loss": -27.594940185546875, "global_step": 558110, "epoch": 6724} {"train_loss": -27.53265380859375, "global_step": 558111, "epoch": 6724} {"train_loss": -27.64862632751465, "global_step": 558112, "epoch": 6724} {"train_loss": -27.719877243041992, "global_step": 558113, "epoch": 6724} {"train_loss": -27.701751708984375, "global_step": 558114, "epoch": 6724} {"train_loss": -27.488306045532227, "global_step": 558115, "epoch": 6724} {"train_loss": -27.614721298217773, "global_step": 558116, "epoch": 6724} {"train_loss": -27.640710830688477, "global_step": 558117, "epoch": 6724} {"train_loss": -27.925500869750977, "global_step": 558118, "epoch": 6724} {"train_loss": -27.82118034362793, "global_step": 558119, "epoch": 6724} {"train_loss": -27.935277938842773, "global_step": 558120, "epoch": 6724} {"train_loss": -27.963531494140625, "global_step": 558121, "epoch": 6724} {"train_loss": -28.01226234436035, "global_step": 558122, "epoch": 6724} {"train_loss": -27.77260398864746, "global_step": 558123, "epoch": 6724} {"train_loss": -27.576416015625, "global_step": 558124, "epoch": 6724} {"train_loss": -27.936124801635742, "global_step": 558125, "epoch": 6724} {"train_loss": -27.776464462280273, "global_step": 558126, "epoch": 6724} {"train_loss": -27.549362182617188, "global_step": 558127, "epoch": 6724} {"train_loss": -27.835493087768555, "global_step": 558128, "epoch": 6724} {"train_loss": -27.390501022338867, "global_step": 558129, "epoch": 6724} {"train_loss": -27.8171443939209, "global_step": 558130, "epoch": 6724} {"train_loss": -27.758304595947266, "global_step": 558131, "epoch": 6724} {"train_loss": -27.57661247253418, "global_step": 558132, "epoch": 6724} {"train_loss": -27.644763946533203, "global_step": 558133, "epoch": 6724} {"train_loss": -27.925506591796875, "global_step": 558134, "epoch": 6724} {"train_loss": -27.84159278869629, "global_step": 558135, "epoch": 6724} {"train_loss": -28.104373931884766, "global_step": 558136, "epoch": 6724} {"train_loss": -27.952157974243164, "global_step": 558137, "epoch": 6724} {"train_loss": -28.311695098876953, "global_step": 558138, "epoch": 6724} {"train_loss": -27.90152359008789, "global_step": 558139, "epoch": 6724} {"train_loss": -27.662622451782227, "global_step": 558140, "epoch": 6724} {"train_loss": -28.143634796142578, "global_step": 558141, "epoch": 6724} {"train_loss": -27.85847282409668, "global_step": 558142, "epoch": 6724} {"train_loss": -27.7808837890625, "global_step": 558143, "epoch": 6724} {"train_loss": -28.077468872070312, "global_step": 558144, "epoch": 6724} {"train_loss": -27.676279067993164, "global_step": 558145, "epoch": 6724} {"train_loss": -27.637426376342773, "global_step": 558146, "epoch": 6724} {"train_loss": -27.305219650268555, "global_step": 558147, "epoch": 6724} {"train_loss": -27.307209014892578, "global_step": 558148, "epoch": 6724} {"train_loss": -27.736347198486328, "global_step": 558149, "epoch": 6724} {"train_loss": -28.17191505432129, "global_step": 558150, "epoch": 6724} {"train_loss": -27.40826988220215, "global_step": 558151, "epoch": 6724} {"train_loss": -27.640918731689453, "global_step": 558152, "epoch": 6724} {"train_loss": -27.375402450561523, "global_step": 558153, "epoch": 6724} {"train_loss": -27.773229598999023, "global_step": 558154, "epoch": 6724} {"train_loss": -27.75593376159668, "global_step": 558155, "epoch": 6724} {"train_loss": -27.683746337890625, "global_step": 558156, "epoch": 6724} {"train_loss": -27.43988609313965, "global_step": 558157, "epoch": 6724} {"train_loss": -27.921934127807617, "global_step": 558158, "epoch": 6724} {"train_loss": -27.553741455078125, "global_step": 558159, "epoch": 6724} {"train_loss": -27.825910568237305, "global_step": 558160, "epoch": 6724} {"train_loss": -27.693180084228516, "global_step": 558161, "epoch": 6724} {"train_loss": -27.5192813873291, "global_step": 558162, "epoch": 6724} {"train_loss": -27.63348388671875, "global_step": 558163, "epoch": 6724} {"train_loss": -28.11445426940918, "global_step": 558164, "epoch": 6724} {"train_loss": -28.28006362915039, "global_step": 558165, "epoch": 6724} {"train_loss": -28.011524200439453, "global_step": 558166, "epoch": 6724} {"train_loss": -27.685998916625977, "global_step": 558167, "epoch": 6724} {"train_loss": -27.746707916259766, "global_step": 558168, "epoch": 6724} {"train_loss": -27.832090377807617, "global_step": 558169, "epoch": 6724} {"train_loss": -27.953256607055664, "global_step": 558170, "epoch": 6724} {"train_loss": -28.319793701171875, "global_step": 558171, "epoch": 6724} {"train_loss": -27.932727813720703, "global_step": 558172, "epoch": 6724} {"train_loss": -28.221832275390625, "global_step": 558173, "epoch": 6724} {"train_loss": -27.697213092482233, "global_step": 558174, "epoch": 6724, "val_loss": 6559482.0} {"train_loss": -27.292068481445312, "global_step": 558175, "epoch": 6725} {"train_loss": -26.153467178344727, "global_step": 558176, "epoch": 6725} {"train_loss": -27.865625381469727, "global_step": 558177, "epoch": 6725} {"train_loss": -27.080896377563477, "global_step": 558178, "epoch": 6725} {"train_loss": -27.49530601501465, "global_step": 558179, "epoch": 6725} {"train_loss": -26.934484481811523, "global_step": 558180, "epoch": 6725} {"train_loss": -27.682743072509766, "global_step": 558181, "epoch": 6725} {"train_loss": -26.93161964416504, "global_step": 558182, "epoch": 6725} {"train_loss": -27.7874698638916, "global_step": 558183, "epoch": 6725} {"train_loss": -27.227075576782227, "global_step": 558184, "epoch": 6725} {"train_loss": -27.281152725219727, "global_step": 558185, "epoch": 6725} {"train_loss": -27.106672286987305, "global_step": 558186, "epoch": 6725} {"train_loss": -27.357404708862305, "global_step": 558187, "epoch": 6725} {"train_loss": -27.46355628967285, "global_step": 558188, "epoch": 6725} {"train_loss": -27.292266845703125, "global_step": 558189, "epoch": 6725} {"train_loss": -27.465274810791016, "global_step": 558190, "epoch": 6725} {"train_loss": -27.5061092376709, "global_step": 558191, "epoch": 6725} {"train_loss": -27.391111373901367, "global_step": 558192, "epoch": 6725} {"train_loss": -27.547134399414062, "global_step": 558193, "epoch": 6725} {"train_loss": -27.531970977783203, "global_step": 558194, "epoch": 6725} {"train_loss": -27.608386993408203, "global_step": 558195, "epoch": 6725} {"train_loss": -27.12775230407715, "global_step": 558196, "epoch": 6725} {"train_loss": -27.806217193603516, "global_step": 558197, "epoch": 6725} {"train_loss": -27.221765518188477, "global_step": 558198, "epoch": 6725} {"train_loss": -26.999433517456055, "global_step": 558199, "epoch": 6725} {"train_loss": -27.673904418945312, "global_step": 558200, "epoch": 6725} {"train_loss": -27.60300064086914, "global_step": 558201, "epoch": 6725} {"train_loss": -27.619705200195312, "global_step": 558202, "epoch": 6725} {"train_loss": -27.88144302368164, "global_step": 558203, "epoch": 6725} {"train_loss": -27.581680297851562, "global_step": 558204, "epoch": 6725} {"train_loss": -27.8695068359375, "global_step": 558205, "epoch": 6725} {"train_loss": -27.776874542236328, "global_step": 558206, "epoch": 6725} {"train_loss": -27.58314323425293, "global_step": 558207, "epoch": 6725} {"train_loss": -27.62127685546875, "global_step": 558208, "epoch": 6725} {"train_loss": -27.441686630249023, "global_step": 558209, "epoch": 6725} {"train_loss": -27.37774658203125, "global_step": 558210, "epoch": 6725} {"train_loss": -27.638092041015625, "global_step": 558211, "epoch": 6725} {"train_loss": -27.558929443359375, "global_step": 558212, "epoch": 6725} {"train_loss": -27.302337646484375, "global_step": 558213, "epoch": 6725} {"train_loss": -27.622175216674805, "global_step": 558214, "epoch": 6725} {"train_loss": -27.837995529174805, "global_step": 558215, "epoch": 6725} {"train_loss": -27.95490837097168, "global_step": 558216, "epoch": 6725} {"train_loss": -27.91477394104004, "global_step": 558217, "epoch": 6725} {"train_loss": -27.9686222076416, "global_step": 558218, "epoch": 6725} {"train_loss": -27.68869972229004, "global_step": 558219, "epoch": 6725} {"train_loss": -27.67925453186035, "global_step": 558220, "epoch": 6725} {"train_loss": -27.52838134765625, "global_step": 558221, "epoch": 6725} {"train_loss": -27.843713760375977, "global_step": 558222, "epoch": 6725} {"train_loss": -27.710208892822266, "global_step": 558223, "epoch": 6725} {"train_loss": -27.840576171875, "global_step": 558224, "epoch": 6725} {"train_loss": -28.148221969604492, "global_step": 558225, "epoch": 6725} {"train_loss": -27.851974487304688, "global_step": 558226, "epoch": 6725} {"train_loss": -27.882970809936523, "global_step": 558227, "epoch": 6725} {"train_loss": -28.070547103881836, "global_step": 558228, "epoch": 6725} {"train_loss": -27.911828994750977, "global_step": 558229, "epoch": 6725} {"train_loss": -27.768213272094727, "global_step": 558230, "epoch": 6725} {"train_loss": -27.87839698791504, "global_step": 558231, "epoch": 6725} {"train_loss": -27.64497947692871, "global_step": 558232, "epoch": 6725} {"train_loss": -28.23569107055664, "global_step": 558233, "epoch": 6725} {"train_loss": -27.911535263061523, "global_step": 558234, "epoch": 6725} {"train_loss": -28.058542251586914, "global_step": 558235, "epoch": 6725} {"train_loss": -27.674936294555664, "global_step": 558236, "epoch": 6725} {"train_loss": -28.092626571655273, "global_step": 558237, "epoch": 6725} {"train_loss": -27.842138290405273, "global_step": 558238, "epoch": 6725} {"train_loss": -27.671655654907227, "global_step": 558239, "epoch": 6725} {"train_loss": -27.98298454284668, "global_step": 558240, "epoch": 6725} {"train_loss": -28.08949089050293, "global_step": 558241, "epoch": 6725} {"train_loss": -27.904714584350586, "global_step": 558242, "epoch": 6725} {"train_loss": -27.35527992248535, "global_step": 558243, "epoch": 6725} {"train_loss": -27.59174156188965, "global_step": 558244, "epoch": 6725} {"train_loss": -27.305301666259766, "global_step": 558245, "epoch": 6725} {"train_loss": -27.634740829467773, "global_step": 558246, "epoch": 6725} {"train_loss": -27.992807388305664, "global_step": 558247, "epoch": 6725} {"train_loss": -27.825855255126953, "global_step": 558248, "epoch": 6725} {"train_loss": -27.933191299438477, "global_step": 558249, "epoch": 6725} {"train_loss": -27.846975326538086, "global_step": 558250, "epoch": 6725} {"train_loss": -27.71912956237793, "global_step": 558251, "epoch": 6725} {"train_loss": -27.46136474609375, "global_step": 558252, "epoch": 6725} {"train_loss": -27.774459838867188, "global_step": 558253, "epoch": 6725} {"train_loss": -27.670425415039062, "global_step": 558254, "epoch": 6725} {"train_loss": -27.492660522460938, "global_step": 558255, "epoch": 6725} {"train_loss": -27.847936630249023, "global_step": 558256, "epoch": 6725} {"train_loss": -27.62400314606816, "global_step": 558257, "epoch": 6725, "val_loss": 6499484.0} {"train_loss": -27.824987411499023, "global_step": 558258, "epoch": 6726} {"train_loss": -27.435638427734375, "global_step": 558259, "epoch": 6726} {"train_loss": -27.67380142211914, "global_step": 558260, "epoch": 6726} {"train_loss": -27.830204010009766, "global_step": 558261, "epoch": 6726} {"train_loss": -27.457233428955078, "global_step": 558262, "epoch": 6726} {"train_loss": -27.773340225219727, "global_step": 558263, "epoch": 6726} {"train_loss": -27.203893661499023, "global_step": 558264, "epoch": 6726} {"train_loss": -27.48232078552246, "global_step": 558265, "epoch": 6726} {"train_loss": -27.5773868560791, "global_step": 558266, "epoch": 6726} {"train_loss": -27.580419540405273, "global_step": 558267, "epoch": 6726} {"train_loss": -27.50330924987793, "global_step": 558268, "epoch": 6726} {"train_loss": -27.93084716796875, "global_step": 558269, "epoch": 6726} {"train_loss": -27.312366485595703, "global_step": 558270, "epoch": 6726} {"train_loss": -27.469009399414062, "global_step": 558271, "epoch": 6726} {"train_loss": -27.7861385345459, "global_step": 558272, "epoch": 6726} {"train_loss": -27.87936782836914, "global_step": 558273, "epoch": 6726} {"train_loss": -27.46238136291504, "global_step": 558274, "epoch": 6726} {"train_loss": -27.322162628173828, "global_step": 558275, "epoch": 6726} {"train_loss": -27.641742706298828, "global_step": 558276, "epoch": 6726} {"train_loss": -27.30714225769043, "global_step": 558277, "epoch": 6726} {"train_loss": -27.616580963134766, "global_step": 558278, "epoch": 6726} {"train_loss": -27.397714614868164, "global_step": 558279, "epoch": 6726} {"train_loss": -27.36075210571289, "global_step": 558280, "epoch": 6726} {"train_loss": -27.39299964904785, "global_step": 558281, "epoch": 6726} {"train_loss": -27.690021514892578, "global_step": 558282, "epoch": 6726} {"train_loss": -27.428678512573242, "global_step": 558283, "epoch": 6726} {"train_loss": -27.733844757080078, "global_step": 558284, "epoch": 6726} {"train_loss": -27.856901168823242, "global_step": 558285, "epoch": 6726} {"train_loss": -27.7065486907959, "global_step": 558286, "epoch": 6726} {"train_loss": -27.5773983001709, "global_step": 558287, "epoch": 6726} {"train_loss": -27.48040771484375, "global_step": 558288, "epoch": 6726} {"train_loss": -28.067401885986328, "global_step": 558289, "epoch": 6726} {"train_loss": -27.95821189880371, "global_step": 558290, "epoch": 6726} {"train_loss": -27.585529327392578, "global_step": 558291, "epoch": 6726} {"train_loss": -27.76361083984375, "global_step": 558292, "epoch": 6726} {"train_loss": -27.797718048095703, "global_step": 558293, "epoch": 6726} {"train_loss": -27.57177734375, "global_step": 558294, "epoch": 6726} {"train_loss": -27.98089599609375, "global_step": 558295, "epoch": 6726} {"train_loss": -28.03663444519043, "global_step": 558296, "epoch": 6726} {"train_loss": -28.050268173217773, "global_step": 558297, "epoch": 6726} {"train_loss": -27.634618759155273, "global_step": 558298, "epoch": 6726} {"train_loss": -28.017175674438477, "global_step": 558299, "epoch": 6726} {"train_loss": -27.8857421875, "global_step": 558300, "epoch": 6726} {"train_loss": -27.74100112915039, "global_step": 558301, "epoch": 6726} {"train_loss": -27.989273071289062, "global_step": 558302, "epoch": 6726} {"train_loss": -28.0947322845459, "global_step": 558303, "epoch": 6726} {"train_loss": -27.625696182250977, "global_step": 558304, "epoch": 6726} {"train_loss": -28.246368408203125, "global_step": 558305, "epoch": 6726} {"train_loss": -28.282974243164062, "global_step": 558306, "epoch": 6726} {"train_loss": -28.052053451538086, "global_step": 558307, "epoch": 6726} {"train_loss": -27.97509765625, "global_step": 558308, "epoch": 6726} {"train_loss": -27.688711166381836, "global_step": 558309, "epoch": 6726} {"train_loss": -28.301721572875977, "global_step": 558310, "epoch": 6726} {"train_loss": -28.314970016479492, "global_step": 558311, "epoch": 6726} {"train_loss": -28.282337188720703, "global_step": 558312, "epoch": 6726} {"train_loss": -28.111303329467773, "global_step": 558313, "epoch": 6726} {"train_loss": -28.022180557250977, "global_step": 558314, "epoch": 6726} {"train_loss": -27.931594848632812, "global_step": 558315, "epoch": 6726} {"train_loss": -28.255603790283203, "global_step": 558316, "epoch": 6726} {"train_loss": -28.3929386138916, "global_step": 558317, "epoch": 6726} {"train_loss": -28.138269424438477, "global_step": 558318, "epoch": 6726} {"train_loss": -27.7871036529541, "global_step": 558319, "epoch": 6726} {"train_loss": -27.756671905517578, "global_step": 558320, "epoch": 6726} {"train_loss": -27.77435874938965, "global_step": 558321, "epoch": 6726} {"train_loss": -27.786222457885742, "global_step": 558322, "epoch": 6726} {"train_loss": -28.02186393737793, "global_step": 558323, "epoch": 6726} {"train_loss": -28.318174362182617, "global_step": 558324, "epoch": 6726} {"train_loss": -28.075515747070312, "global_step": 558325, "epoch": 6726} {"train_loss": -27.627538681030273, "global_step": 558326, "epoch": 6726} {"train_loss": -27.2281494140625, "global_step": 558327, "epoch": 6726} {"train_loss": -25.99294090270996, "global_step": 558328, "epoch": 6726} {"train_loss": -23.466650009155273, "global_step": 558329, "epoch": 6726} {"train_loss": -23.16155433654785, "global_step": 558330, "epoch": 6726} {"train_loss": -26.10602378845215, "global_step": 558331, "epoch": 6726} {"train_loss": -26.295392990112305, "global_step": 558332, "epoch": 6726} {"train_loss": -26.057819366455078, "global_step": 558333, "epoch": 6726} {"train_loss": -26.50104331970215, "global_step": 558334, "epoch": 6726} {"train_loss": -26.582361221313477, "global_step": 558335, "epoch": 6726} {"train_loss": -26.399145126342773, "global_step": 558336, "epoch": 6726} {"train_loss": -26.69832420349121, "global_step": 558337, "epoch": 6726} {"train_loss": -27.023828506469727, "global_step": 558338, "epoch": 6726} {"train_loss": -26.648731231689453, "global_step": 558339, "epoch": 6726} {"train_loss": -27.491564463420087, "global_step": 558340, "epoch": 6726, "val_loss": 6494848.0} {"train_loss": -25.953535079956055, "global_step": 558341, "epoch": 6727} {"train_loss": -26.314390182495117, "global_step": 558342, "epoch": 6727} {"train_loss": -26.32598304748535, "global_step": 558343, "epoch": 6727} {"train_loss": -26.137222290039062, "global_step": 558344, "epoch": 6727} {"train_loss": -26.35809326171875, "global_step": 558345, "epoch": 6727} {"train_loss": -26.567855834960938, "global_step": 558346, "epoch": 6727} {"train_loss": -26.56218910217285, "global_step": 558347, "epoch": 6727} {"train_loss": -26.255468368530273, "global_step": 558348, "epoch": 6727} {"train_loss": -26.878820419311523, "global_step": 558349, "epoch": 6727} {"train_loss": -26.609283447265625, "global_step": 558350, "epoch": 6727} {"train_loss": -26.772186279296875, "global_step": 558351, "epoch": 6727} {"train_loss": -26.870655059814453, "global_step": 558352, "epoch": 6727} {"train_loss": -27.04994010925293, "global_step": 558353, "epoch": 6727} {"train_loss": -26.96453857421875, "global_step": 558354, "epoch": 6727} {"train_loss": -26.894943237304688, "global_step": 558355, "epoch": 6727} {"train_loss": -27.195999145507812, "global_step": 558356, "epoch": 6727} {"train_loss": -26.8565673828125, "global_step": 558357, "epoch": 6727} {"train_loss": -26.855737686157227, "global_step": 558358, "epoch": 6727} {"train_loss": -27.016698837280273, "global_step": 558359, "epoch": 6727} {"train_loss": -27.40485191345215, "global_step": 558360, "epoch": 6727} {"train_loss": -27.330890655517578, "global_step": 558361, "epoch": 6727} {"train_loss": -27.02996253967285, "global_step": 558362, "epoch": 6727} {"train_loss": -26.956470489501953, "global_step": 558363, "epoch": 6727} {"train_loss": -27.59726333618164, "global_step": 558364, "epoch": 6727} {"train_loss": -27.32834243774414, "global_step": 558365, "epoch": 6727} {"train_loss": -27.577972412109375, "global_step": 558366, "epoch": 6727} {"train_loss": -27.675153732299805, "global_step": 558367, "epoch": 6727} {"train_loss": -27.510961532592773, "global_step": 558368, "epoch": 6727} {"train_loss": -27.607208251953125, "global_step": 558369, "epoch": 6727} {"train_loss": -27.444080352783203, "global_step": 558370, "epoch": 6727} {"train_loss": -27.542163848876953, "global_step": 558371, "epoch": 6727} {"train_loss": -27.541372299194336, "global_step": 558372, "epoch": 6727} {"train_loss": -27.528778076171875, "global_step": 558373, "epoch": 6727} {"train_loss": -27.172800064086914, "global_step": 558374, "epoch": 6727} {"train_loss": -27.67500114440918, "global_step": 558375, "epoch": 6727} {"train_loss": -27.80312156677246, "global_step": 558376, "epoch": 6727} {"train_loss": -27.873065948486328, "global_step": 558377, "epoch": 6727} {"train_loss": -27.71866798400879, "global_step": 558378, "epoch": 6727} {"train_loss": -27.296356201171875, "global_step": 558379, "epoch": 6727} {"train_loss": -27.843183517456055, "global_step": 558380, "epoch": 6727} {"train_loss": -27.66033363342285, "global_step": 558381, "epoch": 6727} {"train_loss": -28.034046173095703, "global_step": 558382, "epoch": 6727} {"train_loss": -27.994421005249023, "global_step": 558383, "epoch": 6727} {"train_loss": -28.127363204956055, "global_step": 558384, "epoch": 6727} {"train_loss": -27.496295928955078, "global_step": 558385, "epoch": 6727} {"train_loss": -28.037378311157227, "global_step": 558386, "epoch": 6727} {"train_loss": -27.862537384033203, "global_step": 558387, "epoch": 6727} {"train_loss": -27.88983726501465, "global_step": 558388, "epoch": 6727} {"train_loss": -27.99590492248535, "global_step": 558389, "epoch": 6727} {"train_loss": -27.99713134765625, "global_step": 558390, "epoch": 6727} {"train_loss": -27.85755729675293, "global_step": 558391, "epoch": 6727} {"train_loss": -27.886539459228516, "global_step": 558392, "epoch": 6727} {"train_loss": -28.074670791625977, "global_step": 558393, "epoch": 6727} {"train_loss": -27.91946792602539, "global_step": 558394, "epoch": 6727} {"train_loss": -27.760229110717773, "global_step": 558395, "epoch": 6727} {"train_loss": -27.839345932006836, "global_step": 558396, "epoch": 6727} {"train_loss": -27.726537704467773, "global_step": 558397, "epoch": 6727} {"train_loss": -27.91827392578125, "global_step": 558398, "epoch": 6727} {"train_loss": -27.530210494995117, "global_step": 558399, "epoch": 6727} {"train_loss": -27.627038955688477, "global_step": 558400, "epoch": 6727} {"train_loss": -27.463394165039062, "global_step": 558401, "epoch": 6727} {"train_loss": -28.26630973815918, "global_step": 558402, "epoch": 6727} {"train_loss": -27.7564754486084, "global_step": 558403, "epoch": 6727} {"train_loss": -27.7587890625, "global_step": 558404, "epoch": 6727} {"train_loss": -27.71291160583496, "global_step": 558405, "epoch": 6727} {"train_loss": -27.921213150024414, "global_step": 558406, "epoch": 6727} {"train_loss": -27.706602096557617, "global_step": 558407, "epoch": 6727} {"train_loss": -27.877674102783203, "global_step": 558408, "epoch": 6727} {"train_loss": -27.72051429748535, "global_step": 558409, "epoch": 6727} {"train_loss": -27.717010498046875, "global_step": 558410, "epoch": 6727} {"train_loss": -27.564382553100586, "global_step": 558411, "epoch": 6727} {"train_loss": -27.535724639892578, "global_step": 558412, "epoch": 6727} {"train_loss": -27.1329402923584, "global_step": 558413, "epoch": 6727} {"train_loss": -27.975671768188477, "global_step": 558414, "epoch": 6727} {"train_loss": -27.526586532592773, "global_step": 558415, "epoch": 6727} {"train_loss": -27.94495964050293, "global_step": 558416, "epoch": 6727} {"train_loss": -28.0080509185791, "global_step": 558417, "epoch": 6727} {"train_loss": -27.52924156188965, "global_step": 558418, "epoch": 6727} {"train_loss": -27.500436782836914, "global_step": 558419, "epoch": 6727} {"train_loss": -27.713109970092773, "global_step": 558420, "epoch": 6727} {"train_loss": -27.960947036743164, "global_step": 558421, "epoch": 6727} {"train_loss": -28.00461769104004, "global_step": 558422, "epoch": 6727} {"train_loss": -27.453468713415674, "global_step": 558423, "epoch": 6727, "val_loss": 6524385.0} {"train_loss": -25.963342666625977, "global_step": 558424, "epoch": 6728} {"train_loss": -25.35300064086914, "global_step": 558425, "epoch": 6728} {"train_loss": -26.463287353515625, "global_step": 558426, "epoch": 6728} {"train_loss": -26.091373443603516, "global_step": 558427, "epoch": 6728} {"train_loss": -27.054931640625, "global_step": 558428, "epoch": 6728} {"train_loss": -26.990585327148438, "global_step": 558429, "epoch": 6728} {"train_loss": -26.622604370117188, "global_step": 558430, "epoch": 6728} {"train_loss": -27.217578887939453, "global_step": 558431, "epoch": 6728} {"train_loss": -26.69512367248535, "global_step": 558432, "epoch": 6728} {"train_loss": -26.69150161743164, "global_step": 558433, "epoch": 6728} {"train_loss": -27.232824325561523, "global_step": 558434, "epoch": 6728} {"train_loss": -27.406965255737305, "global_step": 558435, "epoch": 6728} {"train_loss": -27.065683364868164, "global_step": 558436, "epoch": 6728} {"train_loss": -27.23309898376465, "global_step": 558437, "epoch": 6728} {"train_loss": -27.131662368774414, "global_step": 558438, "epoch": 6728} {"train_loss": -27.471118927001953, "global_step": 558439, "epoch": 6728} {"train_loss": -27.546335220336914, "global_step": 558440, "epoch": 6728} {"train_loss": -27.246992111206055, "global_step": 558441, "epoch": 6728} {"train_loss": -27.50614356994629, "global_step": 558442, "epoch": 6728} {"train_loss": -27.560285568237305, "global_step": 558443, "epoch": 6728} {"train_loss": -27.74539566040039, "global_step": 558444, "epoch": 6728} {"train_loss": -27.403959274291992, "global_step": 558445, "epoch": 6728} {"train_loss": -27.64893913269043, "global_step": 558446, "epoch": 6728} {"train_loss": -27.856821060180664, "global_step": 558447, "epoch": 6728} {"train_loss": -27.77008628845215, "global_step": 558448, "epoch": 6728} {"train_loss": -27.171634674072266, "global_step": 558449, "epoch": 6728} {"train_loss": -27.461103439331055, "global_step": 558450, "epoch": 6728} {"train_loss": -27.906843185424805, "global_step": 558451, "epoch": 6728} {"train_loss": -27.35467529296875, "global_step": 558452, "epoch": 6728} {"train_loss": -27.993432998657227, "global_step": 558453, "epoch": 6728} {"train_loss": -27.518369674682617, "global_step": 558454, "epoch": 6728} {"train_loss": -27.73908805847168, "global_step": 558455, "epoch": 6728} {"train_loss": -27.65650749206543, "global_step": 558456, "epoch": 6728} {"train_loss": -27.89630126953125, "global_step": 558457, "epoch": 6728} {"train_loss": -27.84736442565918, "global_step": 558458, "epoch": 6728} {"train_loss": -28.021472930908203, "global_step": 558459, "epoch": 6728} {"train_loss": -27.67728614807129, "global_step": 558460, "epoch": 6728} {"train_loss": -28.012908935546875, "global_step": 558461, "epoch": 6728} {"train_loss": -27.780431747436523, "global_step": 558462, "epoch": 6728} {"train_loss": -27.91298484802246, "global_step": 558463, "epoch": 6728} {"train_loss": -27.72378921508789, "global_step": 558464, "epoch": 6728} {"train_loss": -27.647653579711914, "global_step": 558465, "epoch": 6728} {"train_loss": -27.651824951171875, "global_step": 558466, "epoch": 6728} {"train_loss": -27.56674575805664, "global_step": 558467, "epoch": 6728} {"train_loss": -27.41543960571289, "global_step": 558468, "epoch": 6728} {"train_loss": -27.6350040435791, "global_step": 558469, "epoch": 6728} {"train_loss": -27.431806564331055, "global_step": 558470, "epoch": 6728} {"train_loss": -27.703271865844727, "global_step": 558471, "epoch": 6728} {"train_loss": -27.8465518951416, "global_step": 558472, "epoch": 6728} {"train_loss": -27.683349609375, "global_step": 558473, "epoch": 6728} {"train_loss": -27.940656661987305, "global_step": 558474, "epoch": 6728} {"train_loss": -28.036569595336914, "global_step": 558475, "epoch": 6728} {"train_loss": -27.942846298217773, "global_step": 558476, "epoch": 6728} {"train_loss": -27.862060546875, "global_step": 558477, "epoch": 6728} {"train_loss": -28.014240264892578, "global_step": 558478, "epoch": 6728} {"train_loss": -28.081024169921875, "global_step": 558479, "epoch": 6728} {"train_loss": -27.73655128479004, "global_step": 558480, "epoch": 6728} {"train_loss": -27.82682228088379, "global_step": 558481, "epoch": 6728} {"train_loss": -27.830490112304688, "global_step": 558482, "epoch": 6728} {"train_loss": -27.6452693939209, "global_step": 558483, "epoch": 6728} {"train_loss": -28.248615264892578, "global_step": 558484, "epoch": 6728} {"train_loss": -28.04596519470215, "global_step": 558485, "epoch": 6728} {"train_loss": -27.824970245361328, "global_step": 558486, "epoch": 6728} {"train_loss": -28.049604415893555, "global_step": 558487, "epoch": 6728} {"train_loss": -27.94892692565918, "global_step": 558488, "epoch": 6728} {"train_loss": -27.733240127563477, "global_step": 558489, "epoch": 6728} {"train_loss": -27.578216552734375, "global_step": 558490, "epoch": 6728} {"train_loss": -28.040637969970703, "global_step": 558491, "epoch": 6728} {"train_loss": -27.564865112304688, "global_step": 558492, "epoch": 6728} {"train_loss": -27.74476432800293, "global_step": 558493, "epoch": 6728} {"train_loss": -27.50587272644043, "global_step": 558494, "epoch": 6728} {"train_loss": -28.007612228393555, "global_step": 558495, "epoch": 6728} {"train_loss": -27.932876586914062, "global_step": 558496, "epoch": 6728} {"train_loss": -28.031991958618164, "global_step": 558497, "epoch": 6728} {"train_loss": -27.587499618530273, "global_step": 558498, "epoch": 6728} {"train_loss": -27.572345733642578, "global_step": 558499, "epoch": 6728} {"train_loss": -27.7733211517334, "global_step": 558500, "epoch": 6728} {"train_loss": -27.895246505737305, "global_step": 558501, "epoch": 6728} {"train_loss": -27.71370506286621, "global_step": 558502, "epoch": 6728} {"train_loss": -27.8433780670166, "global_step": 558503, "epoch": 6728} {"train_loss": -28.005634307861328, "global_step": 558504, "epoch": 6728} {"train_loss": -28.235584259033203, "global_step": 558505, "epoch": 6728} {"train_loss": -27.55431997919657, "global_step": 558506, "epoch": 6728, "val_loss": 6417910.0} {"train_loss": -25.05128288269043, "global_step": 558507, "epoch": 6729} {"train_loss": -25.602079391479492, "global_step": 558508, "epoch": 6729} {"train_loss": -25.871612548828125, "global_step": 558509, "epoch": 6729} {"train_loss": -26.533191680908203, "global_step": 558510, "epoch": 6729} {"train_loss": -25.227609634399414, "global_step": 558511, "epoch": 6729} {"train_loss": -26.02589988708496, "global_step": 558512, "epoch": 6729} {"train_loss": -25.737390518188477, "global_step": 558513, "epoch": 6729} {"train_loss": -25.896366119384766, "global_step": 558514, "epoch": 6729} {"train_loss": -26.09455680847168, "global_step": 558515, "epoch": 6729} {"train_loss": -26.779943466186523, "global_step": 558516, "epoch": 6729} {"train_loss": -26.374608993530273, "global_step": 558517, "epoch": 6729} {"train_loss": -26.262348175048828, "global_step": 558518, "epoch": 6729} {"train_loss": -26.328027725219727, "global_step": 558519, "epoch": 6729} {"train_loss": -26.75018310546875, "global_step": 558520, "epoch": 6729} {"train_loss": -26.740875244140625, "global_step": 558521, "epoch": 6729} {"train_loss": -26.422815322875977, "global_step": 558522, "epoch": 6729} {"train_loss": -26.773700714111328, "global_step": 558523, "epoch": 6729} {"train_loss": -26.851675033569336, "global_step": 558524, "epoch": 6729} {"train_loss": -26.941492080688477, "global_step": 558525, "epoch": 6729} {"train_loss": -26.7674560546875, "global_step": 558526, "epoch": 6729} {"train_loss": -26.864065170288086, "global_step": 558527, "epoch": 6729} {"train_loss": -27.04111099243164, "global_step": 558528, "epoch": 6729} {"train_loss": -26.977323532104492, "global_step": 558529, "epoch": 6729} {"train_loss": -26.751331329345703, "global_step": 558530, "epoch": 6729} {"train_loss": -27.170150756835938, "global_step": 558531, "epoch": 6729} {"train_loss": -27.410690307617188, "global_step": 558532, "epoch": 6729} {"train_loss": -27.328903198242188, "global_step": 558533, "epoch": 6729} {"train_loss": -27.458478927612305, "global_step": 558534, "epoch": 6729} {"train_loss": -27.157678604125977, "global_step": 558535, "epoch": 6729} {"train_loss": -27.45179557800293, "global_step": 558536, "epoch": 6729} {"train_loss": -27.552282333374023, "global_step": 558537, "epoch": 6729} {"train_loss": -27.332477569580078, "global_step": 558538, "epoch": 6729} {"train_loss": -27.320974349975586, "global_step": 558539, "epoch": 6729} {"train_loss": -27.224445343017578, "global_step": 558540, "epoch": 6729} {"train_loss": -27.37618064880371, "global_step": 558541, "epoch": 6729} {"train_loss": -27.140302658081055, "global_step": 558542, "epoch": 6729} {"train_loss": -27.518402099609375, "global_step": 558543, "epoch": 6729} {"train_loss": -27.557458877563477, "global_step": 558544, "epoch": 6729} {"train_loss": -27.487009048461914, "global_step": 558545, "epoch": 6729} {"train_loss": -26.926868438720703, "global_step": 558546, "epoch": 6729} {"train_loss": -27.52057456970215, "global_step": 558547, "epoch": 6729} {"train_loss": -27.66802978515625, "global_step": 558548, "epoch": 6729} {"train_loss": -27.941022872924805, "global_step": 558549, "epoch": 6729} {"train_loss": -27.622507095336914, "global_step": 558550, "epoch": 6729} {"train_loss": -27.9661808013916, "global_step": 558551, "epoch": 6729} {"train_loss": -27.939035415649414, "global_step": 558552, "epoch": 6729} {"train_loss": -27.90032958984375, "global_step": 558553, "epoch": 6729} {"train_loss": -27.698102951049805, "global_step": 558554, "epoch": 6729} {"train_loss": -27.51091957092285, "global_step": 558555, "epoch": 6729} {"train_loss": -27.637964248657227, "global_step": 558556, "epoch": 6729} {"train_loss": -27.664566040039062, "global_step": 558557, "epoch": 6729} {"train_loss": -27.803085327148438, "global_step": 558558, "epoch": 6729} {"train_loss": -27.679737091064453, "global_step": 558559, "epoch": 6729} {"train_loss": -27.94784927368164, "global_step": 558560, "epoch": 6729} {"train_loss": -28.013778686523438, "global_step": 558561, "epoch": 6729} {"train_loss": -28.205358505249023, "global_step": 558562, "epoch": 6729} {"train_loss": -28.05732536315918, "global_step": 558563, "epoch": 6729} {"train_loss": -27.917417526245117, "global_step": 558564, "epoch": 6729} {"train_loss": -28.673141479492188, "global_step": 558565, "epoch": 6729} {"train_loss": -27.826704025268555, "global_step": 558566, "epoch": 6729} {"train_loss": -27.769001007080078, "global_step": 558567, "epoch": 6729} {"train_loss": -28.227588653564453, "global_step": 558568, "epoch": 6729} {"train_loss": -27.957050323486328, "global_step": 558569, "epoch": 6729} {"train_loss": -27.716144561767578, "global_step": 558570, "epoch": 6729} {"train_loss": -27.97403907775879, "global_step": 558571, "epoch": 6729} {"train_loss": -27.834775924682617, "global_step": 558572, "epoch": 6729} {"train_loss": -27.9307804107666, "global_step": 558573, "epoch": 6729} {"train_loss": -27.768310546875, "global_step": 558574, "epoch": 6729} {"train_loss": -27.7603816986084, "global_step": 558575, "epoch": 6729} {"train_loss": -27.6252498626709, "global_step": 558576, "epoch": 6729} {"train_loss": -27.9993839263916, "global_step": 558577, "epoch": 6729} {"train_loss": -27.80616569519043, "global_step": 558578, "epoch": 6729} {"train_loss": -28.00250244140625, "global_step": 558579, "epoch": 6729} {"train_loss": -27.3271427154541, "global_step": 558580, "epoch": 6729} {"train_loss": -27.858383178710938, "global_step": 558581, "epoch": 6729} {"train_loss": -27.84686851501465, "global_step": 558582, "epoch": 6729} {"train_loss": -27.51361083984375, "global_step": 558583, "epoch": 6729} {"train_loss": -27.77471923828125, "global_step": 558584, "epoch": 6729} {"train_loss": -27.646499633789062, "global_step": 558585, "epoch": 6729} {"train_loss": -27.902502059936523, "global_step": 558586, "epoch": 6729} {"train_loss": -27.825424194335938, "global_step": 558587, "epoch": 6729} {"train_loss": -27.9791259765625, "global_step": 558588, "epoch": 6729} {"train_loss": -27.29604160354798, "global_step": 558589, "epoch": 6729, "val_loss": 6480516.5} {"train_loss": -25.82684898376465, "global_step": 558590, "epoch": 6730} {"train_loss": -23.81209945678711, "global_step": 558591, "epoch": 6730} {"train_loss": -23.297115325927734, "global_step": 558592, "epoch": 6730} {"train_loss": -25.935461044311523, "global_step": 558593, "epoch": 6730} {"train_loss": -26.43061637878418, "global_step": 558594, "epoch": 6730} {"train_loss": -25.360109329223633, "global_step": 558595, "epoch": 6730} {"train_loss": -27.0340576171875, "global_step": 558596, "epoch": 6730} {"train_loss": -26.491748809814453, "global_step": 558597, "epoch": 6730} {"train_loss": -26.620594024658203, "global_step": 558598, "epoch": 6730} {"train_loss": -26.300928115844727, "global_step": 558599, "epoch": 6730} {"train_loss": -26.914953231811523, "global_step": 558600, "epoch": 6730} {"train_loss": -26.752843856811523, "global_step": 558601, "epoch": 6730} {"train_loss": -27.047460556030273, "global_step": 558602, "epoch": 6730} {"train_loss": -26.995935440063477, "global_step": 558603, "epoch": 6730} {"train_loss": -26.865558624267578, "global_step": 558604, "epoch": 6730} {"train_loss": -27.20882225036621, "global_step": 558605, "epoch": 6730} {"train_loss": -27.15791130065918, "global_step": 558606, "epoch": 6730} {"train_loss": -27.367822647094727, "global_step": 558607, "epoch": 6730} {"train_loss": -27.22490882873535, "global_step": 558608, "epoch": 6730} {"train_loss": -26.913654327392578, "global_step": 558609, "epoch": 6730} {"train_loss": -27.418140411376953, "global_step": 558610, "epoch": 6730} {"train_loss": -27.57485008239746, "global_step": 558611, "epoch": 6730} {"train_loss": -27.64862632751465, "global_step": 558612, "epoch": 6730} {"train_loss": -26.978302001953125, "global_step": 558613, "epoch": 6730} {"train_loss": -27.387231826782227, "global_step": 558614, "epoch": 6730} {"train_loss": -27.4669189453125, "global_step": 558615, "epoch": 6730} {"train_loss": -27.491342544555664, "global_step": 558616, "epoch": 6730} {"train_loss": -27.902502059936523, "global_step": 558617, "epoch": 6730} {"train_loss": -27.90888786315918, "global_step": 558618, "epoch": 6730} {"train_loss": -28.037622451782227, "global_step": 558619, "epoch": 6730} {"train_loss": -27.6732177734375, "global_step": 558620, "epoch": 6730} {"train_loss": -27.919540405273438, "global_step": 558621, "epoch": 6730} {"train_loss": -27.687299728393555, "global_step": 558622, "epoch": 6730} {"train_loss": -27.80997657775879, "global_step": 558623, "epoch": 6730} {"train_loss": -27.62763786315918, "global_step": 558624, "epoch": 6730} {"train_loss": -27.84812355041504, "global_step": 558625, "epoch": 6730} {"train_loss": -27.665258407592773, "global_step": 558626, "epoch": 6730} {"train_loss": -27.704797744750977, "global_step": 558627, "epoch": 6730} {"train_loss": -27.5053653717041, "global_step": 558628, "epoch": 6730} {"train_loss": -27.820714950561523, "global_step": 558629, "epoch": 6730} {"train_loss": -27.844913482666016, "global_step": 558630, "epoch": 6730} {"train_loss": -27.902612686157227, "global_step": 558631, "epoch": 6730} {"train_loss": -28.047574996948242, "global_step": 558632, "epoch": 6730} {"train_loss": -27.555673599243164, "global_step": 558633, "epoch": 6730} {"train_loss": -27.973724365234375, "global_step": 558634, "epoch": 6730} {"train_loss": -27.697513580322266, "global_step": 558635, "epoch": 6730} {"train_loss": -27.691747665405273, "global_step": 558636, "epoch": 6730} {"train_loss": -27.904367446899414, "global_step": 558637, "epoch": 6730} {"train_loss": -27.821104049682617, "global_step": 558638, "epoch": 6730} {"train_loss": -28.0665225982666, "global_step": 558639, "epoch": 6730} {"train_loss": -27.747989654541016, "global_step": 558640, "epoch": 6730} {"train_loss": -27.750598907470703, "global_step": 558641, "epoch": 6730} {"train_loss": -27.898025512695312, "global_step": 558642, "epoch": 6730} {"train_loss": -27.973602294921875, "global_step": 558643, "epoch": 6730} {"train_loss": -27.578937530517578, "global_step": 558644, "epoch": 6730} {"train_loss": -27.933969497680664, "global_step": 558645, "epoch": 6730} {"train_loss": -28.107898712158203, "global_step": 558646, "epoch": 6730} {"train_loss": -27.949024200439453, "global_step": 558647, "epoch": 6730} {"train_loss": -27.859710693359375, "global_step": 558648, "epoch": 6730} {"train_loss": -27.645431518554688, "global_step": 558649, "epoch": 6730} {"train_loss": -28.163410186767578, "global_step": 558650, "epoch": 6730} {"train_loss": -27.956501007080078, "global_step": 558651, "epoch": 6730} {"train_loss": -27.968097686767578, "global_step": 558652, "epoch": 6730} {"train_loss": -27.874725341796875, "global_step": 558653, "epoch": 6730} {"train_loss": -27.869678497314453, "global_step": 558654, "epoch": 6730} {"train_loss": -27.821975708007812, "global_step": 558655, "epoch": 6730} {"train_loss": -28.065109252929688, "global_step": 558656, "epoch": 6730} {"train_loss": -28.167770385742188, "global_step": 558657, "epoch": 6730} {"train_loss": -28.012908935546875, "global_step": 558658, "epoch": 6730} {"train_loss": -28.130569458007812, "global_step": 558659, "epoch": 6730} {"train_loss": -27.700714111328125, "global_step": 558660, "epoch": 6730} {"train_loss": -27.87568473815918, "global_step": 558661, "epoch": 6730} {"train_loss": -27.388031005859375, "global_step": 558662, "epoch": 6730} {"train_loss": -27.840362548828125, "global_step": 558663, "epoch": 6730} {"train_loss": -28.019058227539062, "global_step": 558664, "epoch": 6730} {"train_loss": -27.887678146362305, "global_step": 558665, "epoch": 6730} {"train_loss": -27.813840866088867, "global_step": 558666, "epoch": 6730} {"train_loss": -27.79807472229004, "global_step": 558667, "epoch": 6730} {"train_loss": -28.058120727539062, "global_step": 558668, "epoch": 6730} {"train_loss": -27.608417510986328, "global_step": 558669, "epoch": 6730} {"train_loss": -28.13030433654785, "global_step": 558670, "epoch": 6730} {"train_loss": -27.799646377563477, "global_step": 558671, "epoch": 6730} {"train_loss": -27.461992677435816, "global_step": 558672, "epoch": 6730, "val_loss": 6481262.5} {"train_loss": -27.92046546936035, "global_step": 558673, "epoch": 6731} {"train_loss": -27.3454532623291, "global_step": 558674, "epoch": 6731} {"train_loss": -26.699705123901367, "global_step": 558675, "epoch": 6731} {"train_loss": -27.200742721557617, "global_step": 558676, "epoch": 6731} {"train_loss": -27.1939754486084, "global_step": 558677, "epoch": 6731} {"train_loss": -27.4516544342041, "global_step": 558678, "epoch": 6731} {"train_loss": -27.45743751525879, "global_step": 558679, "epoch": 6731} {"train_loss": -27.501867294311523, "global_step": 558680, "epoch": 6731} {"train_loss": -27.365589141845703, "global_step": 558681, "epoch": 6731} {"train_loss": -27.5413875579834, "global_step": 558682, "epoch": 6731} {"train_loss": -27.088804244995117, "global_step": 558683, "epoch": 6731} {"train_loss": -27.8210506439209, "global_step": 558684, "epoch": 6731} {"train_loss": -27.698835372924805, "global_step": 558685, "epoch": 6731} {"train_loss": -27.699176788330078, "global_step": 558686, "epoch": 6731} {"train_loss": -27.536890029907227, "global_step": 558687, "epoch": 6731} {"train_loss": -27.96124839782715, "global_step": 558688, "epoch": 6731} {"train_loss": -27.410877227783203, "global_step": 558689, "epoch": 6731} {"train_loss": -27.54532814025879, "global_step": 558690, "epoch": 6731} {"train_loss": -27.738330841064453, "global_step": 558691, "epoch": 6731} {"train_loss": -27.301380157470703, "global_step": 558692, "epoch": 6731} {"train_loss": -28.287012100219727, "global_step": 558693, "epoch": 6731} {"train_loss": -27.753631591796875, "global_step": 558694, "epoch": 6731} {"train_loss": -27.738813400268555, "global_step": 558695, "epoch": 6731} {"train_loss": -27.759796142578125, "global_step": 558696, "epoch": 6731} {"train_loss": -27.795698165893555, "global_step": 558697, "epoch": 6731} {"train_loss": -27.788415908813477, "global_step": 558698, "epoch": 6731} {"train_loss": -27.915191650390625, "global_step": 558699, "epoch": 6731} {"train_loss": -27.742786407470703, "global_step": 558700, "epoch": 6731} {"train_loss": -27.867938995361328, "global_step": 558701, "epoch": 6731} {"train_loss": -28.005212783813477, "global_step": 558702, "epoch": 6731} {"train_loss": -28.100418090820312, "global_step": 558703, "epoch": 6731} {"train_loss": -27.714923858642578, "global_step": 558704, "epoch": 6731} {"train_loss": -27.609161376953125, "global_step": 558705, "epoch": 6731} {"train_loss": -28.063251495361328, "global_step": 558706, "epoch": 6731} {"train_loss": -27.771331787109375, "global_step": 558707, "epoch": 6731} {"train_loss": -27.910058975219727, "global_step": 558708, "epoch": 6731} {"train_loss": -27.926191329956055, "global_step": 558709, "epoch": 6731} {"train_loss": -27.420087814331055, "global_step": 558710, "epoch": 6731} {"train_loss": -28.1666202545166, "global_step": 558711, "epoch": 6731} {"train_loss": -27.690601348876953, "global_step": 558712, "epoch": 6731} {"train_loss": -27.83344078063965, "global_step": 558713, "epoch": 6731} {"train_loss": -27.967029571533203, "global_step": 558714, "epoch": 6731} {"train_loss": -27.6462459564209, "global_step": 558715, "epoch": 6731} {"train_loss": -27.805883407592773, "global_step": 558716, "epoch": 6731} {"train_loss": -27.783954620361328, "global_step": 558717, "epoch": 6731} {"train_loss": -27.95943260192871, "global_step": 558718, "epoch": 6731} {"train_loss": -27.747114181518555, "global_step": 558719, "epoch": 6731} {"train_loss": -27.76740837097168, "global_step": 558720, "epoch": 6731} {"train_loss": -27.936716079711914, "global_step": 558721, "epoch": 6731} {"train_loss": -27.81415367126465, "global_step": 558722, "epoch": 6731} {"train_loss": -27.697858810424805, "global_step": 558723, "epoch": 6731} {"train_loss": -27.815948486328125, "global_step": 558724, "epoch": 6731} {"train_loss": -27.663818359375, "global_step": 558725, "epoch": 6731} {"train_loss": -27.997888565063477, "global_step": 558726, "epoch": 6731} {"train_loss": -27.16529655456543, "global_step": 558727, "epoch": 6731} {"train_loss": -27.7725772857666, "global_step": 558728, "epoch": 6731} {"train_loss": -27.91029930114746, "global_step": 558729, "epoch": 6731} {"train_loss": -28.195484161376953, "global_step": 558730, "epoch": 6731} {"train_loss": -27.685626983642578, "global_step": 558731, "epoch": 6731} {"train_loss": -27.844024658203125, "global_step": 558732, "epoch": 6731} {"train_loss": -28.274139404296875, "global_step": 558733, "epoch": 6731} {"train_loss": -27.67975425720215, "global_step": 558734, "epoch": 6731} {"train_loss": -27.586627960205078, "global_step": 558735, "epoch": 6731} {"train_loss": -27.820646286010742, "global_step": 558736, "epoch": 6731} {"train_loss": -28.03082275390625, "global_step": 558737, "epoch": 6731} {"train_loss": -27.999542236328125, "global_step": 558738, "epoch": 6731} {"train_loss": -28.003870010375977, "global_step": 558739, "epoch": 6731} {"train_loss": -28.113569259643555, "global_step": 558740, "epoch": 6731} {"train_loss": -27.93082618713379, "global_step": 558741, "epoch": 6731} {"train_loss": -27.592634201049805, "global_step": 558742, "epoch": 6731} {"train_loss": -28.120532989501953, "global_step": 558743, "epoch": 6731} {"train_loss": -27.868009567260742, "global_step": 558744, "epoch": 6731} {"train_loss": -28.056013107299805, "global_step": 558745, "epoch": 6731} {"train_loss": -28.139795303344727, "global_step": 558746, "epoch": 6731} {"train_loss": -28.02936363220215, "global_step": 558747, "epoch": 6731} {"train_loss": -27.865066528320312, "global_step": 558748, "epoch": 6731} {"train_loss": -27.974878311157227, "global_step": 558749, "epoch": 6731} {"train_loss": -27.69217300415039, "global_step": 558750, "epoch": 6731} {"train_loss": -27.429061889648438, "global_step": 558751, "epoch": 6731} {"train_loss": -26.61551856994629, "global_step": 558752, "epoch": 6731} {"train_loss": -26.64910316467285, "global_step": 558753, "epoch": 6731} {"train_loss": -27.5233154296875, "global_step": 558754, "epoch": 6731} {"train_loss": -27.72615246600415, "global_step": 558755, "epoch": 6731, "val_loss": 6610474.0} {"train_loss": -26.51934814453125, "global_step": 558756, "epoch": 6732} {"train_loss": -25.9151668548584, "global_step": 558757, "epoch": 6732} {"train_loss": -27.16717529296875, "global_step": 558758, "epoch": 6732} {"train_loss": -26.3150634765625, "global_step": 558759, "epoch": 6732} {"train_loss": -26.24759292602539, "global_step": 558760, "epoch": 6732} {"train_loss": -25.904830932617188, "global_step": 558761, "epoch": 6732} {"train_loss": -27.08233070373535, "global_step": 558762, "epoch": 6732} {"train_loss": -26.298812866210938, "global_step": 558763, "epoch": 6732} {"train_loss": -27.013214111328125, "global_step": 558764, "epoch": 6732} {"train_loss": -26.68318748474121, "global_step": 558765, "epoch": 6732} {"train_loss": -26.909494400024414, "global_step": 558766, "epoch": 6732} {"train_loss": -26.63065528869629, "global_step": 558767, "epoch": 6732} {"train_loss": -27.16998863220215, "global_step": 558768, "epoch": 6732} {"train_loss": -27.135055541992188, "global_step": 558769, "epoch": 6732} {"train_loss": -27.14692497253418, "global_step": 558770, "epoch": 6732} {"train_loss": -27.207223892211914, "global_step": 558771, "epoch": 6732} {"train_loss": -27.147741317749023, "global_step": 558772, "epoch": 6732} {"train_loss": -27.17304801940918, "global_step": 558773, "epoch": 6732} {"train_loss": -26.8037166595459, "global_step": 558774, "epoch": 6732} {"train_loss": -27.3361759185791, "global_step": 558775, "epoch": 6732} {"train_loss": -26.9733943939209, "global_step": 558776, "epoch": 6732} {"train_loss": -27.234582901000977, "global_step": 558777, "epoch": 6732} {"train_loss": -27.4688663482666, "global_step": 558778, "epoch": 6732} {"train_loss": -27.767675399780273, "global_step": 558779, "epoch": 6732} {"train_loss": -27.449050903320312, "global_step": 558780, "epoch": 6732} {"train_loss": -27.079833984375, "global_step": 558781, "epoch": 6732} {"train_loss": -27.173017501831055, "global_step": 558782, "epoch": 6732} {"train_loss": -27.491851806640625, "global_step": 558783, "epoch": 6732} {"train_loss": -27.216068267822266, "global_step": 558784, "epoch": 6732} {"train_loss": -27.71240234375, "global_step": 558785, "epoch": 6732} {"train_loss": -27.562192916870117, "global_step": 558786, "epoch": 6732} {"train_loss": -27.95371437072754, "global_step": 558787, "epoch": 6732} {"train_loss": -27.642688751220703, "global_step": 558788, "epoch": 6732} {"train_loss": -27.625028610229492, "global_step": 558789, "epoch": 6732} {"train_loss": -27.653650283813477, "global_step": 558790, "epoch": 6732} {"train_loss": -27.24932289123535, "global_step": 558791, "epoch": 6732} {"train_loss": -27.49859046936035, "global_step": 558792, "epoch": 6732} {"train_loss": -27.502334594726562, "global_step": 558793, "epoch": 6732} {"train_loss": -27.205398559570312, "global_step": 558794, "epoch": 6732} {"train_loss": -27.900558471679688, "global_step": 558795, "epoch": 6732} {"train_loss": -27.42596435546875, "global_step": 558796, "epoch": 6732} {"train_loss": -27.811145782470703, "global_step": 558797, "epoch": 6732} {"train_loss": -28.265344619750977, "global_step": 558798, "epoch": 6732} {"train_loss": -27.789457321166992, "global_step": 558799, "epoch": 6732} {"train_loss": -27.983427047729492, "global_step": 558800, "epoch": 6732} {"train_loss": -27.2061824798584, "global_step": 558801, "epoch": 6732} {"train_loss": -27.856903076171875, "global_step": 558802, "epoch": 6732} {"train_loss": -27.805877685546875, "global_step": 558803, "epoch": 6732} {"train_loss": -27.623727798461914, "global_step": 558804, "epoch": 6732} {"train_loss": -28.099721908569336, "global_step": 558805, "epoch": 6732} {"train_loss": -27.80463218688965, "global_step": 558806, "epoch": 6732} {"train_loss": -27.772811889648438, "global_step": 558807, "epoch": 6732} {"train_loss": -27.635568618774414, "global_step": 558808, "epoch": 6732} {"train_loss": -28.087299346923828, "global_step": 558809, "epoch": 6732} {"train_loss": -27.86237144470215, "global_step": 558810, "epoch": 6732} {"train_loss": -28.355920791625977, "global_step": 558811, "epoch": 6732} {"train_loss": -27.598194122314453, "global_step": 558812, "epoch": 6732} {"train_loss": -27.991308212280273, "global_step": 558813, "epoch": 6732} {"train_loss": -27.27878761291504, "global_step": 558814, "epoch": 6732} {"train_loss": -27.4577693939209, "global_step": 558815, "epoch": 6732} {"train_loss": -27.755680084228516, "global_step": 558816, "epoch": 6732} {"train_loss": -28.0908260345459, "global_step": 558817, "epoch": 6732} {"train_loss": -27.772418975830078, "global_step": 558818, "epoch": 6732} {"train_loss": -27.500823974609375, "global_step": 558819, "epoch": 6732} {"train_loss": -28.081708908081055, "global_step": 558820, "epoch": 6732} {"train_loss": -28.023242950439453, "global_step": 558821, "epoch": 6732} {"train_loss": -27.949308395385742, "global_step": 558822, "epoch": 6732} {"train_loss": -27.6466007232666, "global_step": 558823, "epoch": 6732} {"train_loss": -27.571027755737305, "global_step": 558824, "epoch": 6732} {"train_loss": -27.951725006103516, "global_step": 558825, "epoch": 6732} {"train_loss": -28.022003173828125, "global_step": 558826, "epoch": 6732} {"train_loss": -27.477874755859375, "global_step": 558827, "epoch": 6732} {"train_loss": -27.64910316467285, "global_step": 558828, "epoch": 6732} {"train_loss": -27.460355758666992, "global_step": 558829, "epoch": 6732} {"train_loss": -27.698644638061523, "global_step": 558830, "epoch": 6732} {"train_loss": -27.211380004882812, "global_step": 558831, "epoch": 6732} {"train_loss": -26.834762573242188, "global_step": 558832, "epoch": 6732} {"train_loss": -26.916784286499023, "global_step": 558833, "epoch": 6732} {"train_loss": -26.937164306640625, "global_step": 558834, "epoch": 6732} {"train_loss": -27.405426025390625, "global_step": 558835, "epoch": 6732} {"train_loss": -27.744123458862305, "global_step": 558836, "epoch": 6732} {"train_loss": -27.351734161376953, "global_step": 558837, "epoch": 6732} {"train_loss": -27.416027574654084, "global_step": 558838, "epoch": 6732, "val_loss": 6595021.0} {"train_loss": -27.898361206054688, "global_step": 558839, "epoch": 6733} {"train_loss": -27.544147491455078, "global_step": 558840, "epoch": 6733} {"train_loss": -27.324560165405273, "global_step": 558841, "epoch": 6733} {"train_loss": -27.348852157592773, "global_step": 558842, "epoch": 6733} {"train_loss": -27.75016212463379, "global_step": 558843, "epoch": 6733} {"train_loss": -27.413116455078125, "global_step": 558844, "epoch": 6733} {"train_loss": -27.463886260986328, "global_step": 558845, "epoch": 6733} {"train_loss": -27.434988021850586, "global_step": 558846, "epoch": 6733} {"train_loss": -27.719579696655273, "global_step": 558847, "epoch": 6733} {"train_loss": -27.130704879760742, "global_step": 558848, "epoch": 6733} {"train_loss": -27.22858238220215, "global_step": 558849, "epoch": 6733} {"train_loss": -27.317642211914062, "global_step": 558850, "epoch": 6733} {"train_loss": -27.82666015625, "global_step": 558851, "epoch": 6733} {"train_loss": -27.65668296813965, "global_step": 558852, "epoch": 6733} {"train_loss": -27.867456436157227, "global_step": 558853, "epoch": 6733} {"train_loss": -27.946781158447266, "global_step": 558854, "epoch": 6733} {"train_loss": -27.49090576171875, "global_step": 558855, "epoch": 6733} {"train_loss": -27.307876586914062, "global_step": 558856, "epoch": 6733} {"train_loss": -27.663421630859375, "global_step": 558857, "epoch": 6733} {"train_loss": -27.650663375854492, "global_step": 558858, "epoch": 6733} {"train_loss": -27.568445205688477, "global_step": 558859, "epoch": 6733} {"train_loss": -27.766727447509766, "global_step": 558860, "epoch": 6733} {"train_loss": -27.781295776367188, "global_step": 558861, "epoch": 6733} {"train_loss": -28.044178009033203, "global_step": 558862, "epoch": 6733} {"train_loss": -27.618757247924805, "global_step": 558863, "epoch": 6733} {"train_loss": -27.75082778930664, "global_step": 558864, "epoch": 6733} {"train_loss": -27.572650909423828, "global_step": 558865, "epoch": 6733} {"train_loss": -27.65923500061035, "global_step": 558866, "epoch": 6733} {"train_loss": -28.0548152923584, "global_step": 558867, "epoch": 6733} {"train_loss": -27.798086166381836, "global_step": 558868, "epoch": 6733} {"train_loss": -27.437545776367188, "global_step": 558869, "epoch": 6733} {"train_loss": -27.947589874267578, "global_step": 558870, "epoch": 6733} {"train_loss": -27.88691520690918, "global_step": 558871, "epoch": 6733} {"train_loss": -27.7371883392334, "global_step": 558872, "epoch": 6733} {"train_loss": -28.038183212280273, "global_step": 558873, "epoch": 6733} {"train_loss": -27.95564079284668, "global_step": 558874, "epoch": 6733} {"train_loss": -27.657913208007812, "global_step": 558875, "epoch": 6733} {"train_loss": -28.13818359375, "global_step": 558876, "epoch": 6733} {"train_loss": -27.68208885192871, "global_step": 558877, "epoch": 6733} {"train_loss": -27.73126220703125, "global_step": 558878, "epoch": 6733} {"train_loss": -27.80963134765625, "global_step": 558879, "epoch": 6733} {"train_loss": -27.9427547454834, "global_step": 558880, "epoch": 6733} {"train_loss": -27.618621826171875, "global_step": 558881, "epoch": 6733} {"train_loss": -28.254674911499023, "global_step": 558882, "epoch": 6733} {"train_loss": -28.137134552001953, "global_step": 558883, "epoch": 6733} {"train_loss": -28.050262451171875, "global_step": 558884, "epoch": 6733} {"train_loss": -27.791357040405273, "global_step": 558885, "epoch": 6733} {"train_loss": -27.881805419921875, "global_step": 558886, "epoch": 6733} {"train_loss": -27.800077438354492, "global_step": 558887, "epoch": 6733} {"train_loss": -27.59868812561035, "global_step": 558888, "epoch": 6733} {"train_loss": -28.177371978759766, "global_step": 558889, "epoch": 6733} {"train_loss": -27.960418701171875, "global_step": 558890, "epoch": 6733} {"train_loss": -28.152862548828125, "global_step": 558891, "epoch": 6733} {"train_loss": -27.8619327545166, "global_step": 558892, "epoch": 6733} {"train_loss": -27.56391716003418, "global_step": 558893, "epoch": 6733} {"train_loss": -27.940826416015625, "global_step": 558894, "epoch": 6733} {"train_loss": -27.943073272705078, "global_step": 558895, "epoch": 6733} {"train_loss": -27.388906478881836, "global_step": 558896, "epoch": 6733} {"train_loss": -27.47297477722168, "global_step": 558897, "epoch": 6733} {"train_loss": -27.67182731628418, "global_step": 558898, "epoch": 6733} {"train_loss": -27.613712310791016, "global_step": 558899, "epoch": 6733} {"train_loss": -27.745874404907227, "global_step": 558900, "epoch": 6733} {"train_loss": -27.52644920349121, "global_step": 558901, "epoch": 6733} {"train_loss": -27.383153915405273, "global_step": 558902, "epoch": 6733} {"train_loss": -27.651782989501953, "global_step": 558903, "epoch": 6733} {"train_loss": -27.55768394470215, "global_step": 558904, "epoch": 6733} {"train_loss": -27.45633316040039, "global_step": 558905, "epoch": 6733} {"train_loss": -28.08417320251465, "global_step": 558906, "epoch": 6733} {"train_loss": -27.753952026367188, "global_step": 558907, "epoch": 6733} {"train_loss": -27.904626846313477, "global_step": 558908, "epoch": 6733} {"train_loss": -27.928302764892578, "global_step": 558909, "epoch": 6733} {"train_loss": -27.8768253326416, "global_step": 558910, "epoch": 6733} {"train_loss": -28.1031436920166, "global_step": 558911, "epoch": 6733} {"train_loss": -28.05613136291504, "global_step": 558912, "epoch": 6733} {"train_loss": -27.57987403869629, "global_step": 558913, "epoch": 6733} {"train_loss": -27.944110870361328, "global_step": 558914, "epoch": 6733} {"train_loss": -27.75408935546875, "global_step": 558915, "epoch": 6733} {"train_loss": -28.05738639831543, "global_step": 558916, "epoch": 6733} {"train_loss": -28.109176635742188, "global_step": 558917, "epoch": 6733} {"train_loss": -28.06268310546875, "global_step": 558918, "epoch": 6733} {"train_loss": -27.695053100585938, "global_step": 558919, "epoch": 6733} {"train_loss": -27.839258193969727, "global_step": 558920, "epoch": 6733} {"train_loss": -27.753093926303357, "global_step": 558921, "epoch": 6733, "val_loss": 6626475.0} {"train_loss": -27.53278160095215, "global_step": 558922, "epoch": 6734} {"train_loss": -27.086652755737305, "global_step": 558923, "epoch": 6734} {"train_loss": -27.25617790222168, "global_step": 558924, "epoch": 6734} {"train_loss": -27.532684326171875, "global_step": 558925, "epoch": 6734} {"train_loss": -27.3207950592041, "global_step": 558926, "epoch": 6734} {"train_loss": -27.309473037719727, "global_step": 558927, "epoch": 6734} {"train_loss": -27.61676025390625, "global_step": 558928, "epoch": 6734} {"train_loss": -27.541391372680664, "global_step": 558929, "epoch": 6734} {"train_loss": -27.51807975769043, "global_step": 558930, "epoch": 6734} {"train_loss": -27.269643783569336, "global_step": 558931, "epoch": 6734} {"train_loss": -27.57828140258789, "global_step": 558932, "epoch": 6734} {"train_loss": -27.614355087280273, "global_step": 558933, "epoch": 6734} {"train_loss": -27.6705379486084, "global_step": 558934, "epoch": 6734} {"train_loss": -27.591400146484375, "global_step": 558935, "epoch": 6734} {"train_loss": -27.186994552612305, "global_step": 558936, "epoch": 6734} {"train_loss": -27.331024169921875, "global_step": 558937, "epoch": 6734} {"train_loss": -27.58024024963379, "global_step": 558938, "epoch": 6734} {"train_loss": -27.8740291595459, "global_step": 558939, "epoch": 6734} {"train_loss": -27.501386642456055, "global_step": 558940, "epoch": 6734} {"train_loss": -27.381072998046875, "global_step": 558941, "epoch": 6734} {"train_loss": -27.700366973876953, "global_step": 558942, "epoch": 6734} {"train_loss": -27.744165420532227, "global_step": 558943, "epoch": 6734} {"train_loss": -27.453351974487305, "global_step": 558944, "epoch": 6734} {"train_loss": -27.650659561157227, "global_step": 558945, "epoch": 6734} {"train_loss": -27.39447021484375, "global_step": 558946, "epoch": 6734} {"train_loss": -27.516738891601562, "global_step": 558947, "epoch": 6734} {"train_loss": -28.061853408813477, "global_step": 558948, "epoch": 6734} {"train_loss": -27.774465560913086, "global_step": 558949, "epoch": 6734} {"train_loss": -27.510812759399414, "global_step": 558950, "epoch": 6734} {"train_loss": -27.710357666015625, "global_step": 558951, "epoch": 6734} {"train_loss": -27.92609977722168, "global_step": 558952, "epoch": 6734} {"train_loss": -27.7685489654541, "global_step": 558953, "epoch": 6734} {"train_loss": -28.004064559936523, "global_step": 558954, "epoch": 6734} {"train_loss": -27.622282028198242, "global_step": 558955, "epoch": 6734} {"train_loss": -28.184843063354492, "global_step": 558956, "epoch": 6734} {"train_loss": -27.727285385131836, "global_step": 558957, "epoch": 6734} {"train_loss": -27.76154899597168, "global_step": 558958, "epoch": 6734} {"train_loss": -27.661596298217773, "global_step": 558959, "epoch": 6734} {"train_loss": -27.705398559570312, "global_step": 558960, "epoch": 6734} {"train_loss": -27.517337799072266, "global_step": 558961, "epoch": 6734} {"train_loss": -27.417560577392578, "global_step": 558962, "epoch": 6734} {"train_loss": -28.154211044311523, "global_step": 558963, "epoch": 6734} {"train_loss": -27.64063835144043, "global_step": 558964, "epoch": 6734} {"train_loss": -27.559911727905273, "global_step": 558965, "epoch": 6734} {"train_loss": -28.1185302734375, "global_step": 558966, "epoch": 6734} {"train_loss": -27.85676383972168, "global_step": 558967, "epoch": 6734} {"train_loss": -27.716699600219727, "global_step": 558968, "epoch": 6734} {"train_loss": -27.908288955688477, "global_step": 558969, "epoch": 6734} {"train_loss": -27.5439395904541, "global_step": 558970, "epoch": 6734} {"train_loss": -28.036422729492188, "global_step": 558971, "epoch": 6734} {"train_loss": -27.924909591674805, "global_step": 558972, "epoch": 6734} {"train_loss": -27.92603874206543, "global_step": 558973, "epoch": 6734} {"train_loss": -27.840835571289062, "global_step": 558974, "epoch": 6734} {"train_loss": -27.328662872314453, "global_step": 558975, "epoch": 6734} {"train_loss": -27.8345947265625, "global_step": 558976, "epoch": 6734} {"train_loss": -27.886762619018555, "global_step": 558977, "epoch": 6734} {"train_loss": -27.712854385375977, "global_step": 558978, "epoch": 6734} {"train_loss": -27.661151885986328, "global_step": 558979, "epoch": 6734} {"train_loss": -27.901777267456055, "global_step": 558980, "epoch": 6734} {"train_loss": -27.998388290405273, "global_step": 558981, "epoch": 6734} {"train_loss": -27.87320899963379, "global_step": 558982, "epoch": 6734} {"train_loss": -27.546030044555664, "global_step": 558983, "epoch": 6734} {"train_loss": -27.68461036682129, "global_step": 558984, "epoch": 6734} {"train_loss": -27.87835121154785, "global_step": 558985, "epoch": 6734} {"train_loss": -28.0921573638916, "global_step": 558986, "epoch": 6734} {"train_loss": -27.79510498046875, "global_step": 558987, "epoch": 6734} {"train_loss": -27.38275718688965, "global_step": 558988, "epoch": 6734} {"train_loss": -27.17713737487793, "global_step": 558989, "epoch": 6734} {"train_loss": -27.554162979125977, "global_step": 558990, "epoch": 6734} {"train_loss": -28.038022994995117, "global_step": 558991, "epoch": 6734} {"train_loss": -27.404804229736328, "global_step": 558992, "epoch": 6734} {"train_loss": -27.55707359313965, "global_step": 558993, "epoch": 6734} {"train_loss": -27.8620662689209, "global_step": 558994, "epoch": 6734} {"train_loss": -27.68438720703125, "global_step": 558995, "epoch": 6734} {"train_loss": -27.967620849609375, "global_step": 558996, "epoch": 6734} {"train_loss": -27.9263916015625, "global_step": 558997, "epoch": 6734} {"train_loss": -27.445575714111328, "global_step": 558998, "epoch": 6734} {"train_loss": -27.991439819335938, "global_step": 558999, "epoch": 6734} {"train_loss": -28.075231552124023, "global_step": 559000, "epoch": 6734} {"train_loss": -28.12006187438965, "global_step": 559001, "epoch": 6734} {"train_loss": -27.641698837280273, "global_step": 559002, "epoch": 6734} {"train_loss": -27.758955001831055, "global_step": 559003, "epoch": 6734} {"train_loss": -27.70296675900379, "global_step": 559004, "epoch": 6734, "val_loss": 6578610.0} {"train_loss": -26.54964256286621, "global_step": 559005, "epoch": 6735} {"train_loss": -26.8015079498291, "global_step": 559006, "epoch": 6735} {"train_loss": -27.380773544311523, "global_step": 559007, "epoch": 6735} {"train_loss": -27.325876235961914, "global_step": 559008, "epoch": 6735} {"train_loss": -27.232568740844727, "global_step": 559009, "epoch": 6735} {"train_loss": -27.312177658081055, "global_step": 559010, "epoch": 6735} {"train_loss": -27.489856719970703, "global_step": 559011, "epoch": 6735} {"train_loss": -27.372289657592773, "global_step": 559012, "epoch": 6735} {"train_loss": -27.095800399780273, "global_step": 559013, "epoch": 6735} {"train_loss": -27.396215438842773, "global_step": 559014, "epoch": 6735} {"train_loss": -27.255430221557617, "global_step": 559015, "epoch": 6735} {"train_loss": -27.41340446472168, "global_step": 559016, "epoch": 6735} {"train_loss": -27.676116943359375, "global_step": 559017, "epoch": 6735} {"train_loss": -27.945697784423828, "global_step": 559018, "epoch": 6735} {"train_loss": -27.320825576782227, "global_step": 559019, "epoch": 6735} {"train_loss": -28.285369873046875, "global_step": 559020, "epoch": 6735} {"train_loss": -27.687915802001953, "global_step": 559021, "epoch": 6735} {"train_loss": -27.476825714111328, "global_step": 559022, "epoch": 6735} {"train_loss": -27.77418327331543, "global_step": 559023, "epoch": 6735} {"train_loss": -27.42158317565918, "global_step": 559024, "epoch": 6735} {"train_loss": -27.496326446533203, "global_step": 559025, "epoch": 6735} {"train_loss": -27.74226951599121, "global_step": 559026, "epoch": 6735} {"train_loss": -28.011051177978516, "global_step": 559027, "epoch": 6735} {"train_loss": -27.701251983642578, "global_step": 559028, "epoch": 6735} {"train_loss": -27.939619064331055, "global_step": 559029, "epoch": 6735} {"train_loss": -27.92559814453125, "global_step": 559030, "epoch": 6735} {"train_loss": -28.183929443359375, "global_step": 559031, "epoch": 6735} {"train_loss": -27.45191764831543, "global_step": 559032, "epoch": 6735} {"train_loss": -27.629560470581055, "global_step": 559033, "epoch": 6735} {"train_loss": -27.994054794311523, "global_step": 559034, "epoch": 6735} {"train_loss": -27.80561637878418, "global_step": 559035, "epoch": 6735} {"train_loss": -28.28271484375, "global_step": 559036, "epoch": 6735} {"train_loss": -27.48707389831543, "global_step": 559037, "epoch": 6735} {"train_loss": -27.876569747924805, "global_step": 559038, "epoch": 6735} {"train_loss": -27.48654556274414, "global_step": 559039, "epoch": 6735} {"train_loss": -27.59760856628418, "global_step": 559040, "epoch": 6735} {"train_loss": -27.592803955078125, "global_step": 559041, "epoch": 6735} {"train_loss": -27.69244384765625, "global_step": 559042, "epoch": 6735} {"train_loss": -27.850360870361328, "global_step": 559043, "epoch": 6735} {"train_loss": -27.9892635345459, "global_step": 559044, "epoch": 6735} {"train_loss": -28.131946563720703, "global_step": 559045, "epoch": 6735} {"train_loss": -27.572065353393555, "global_step": 559046, "epoch": 6735} {"train_loss": -27.57084083557129, "global_step": 559047, "epoch": 6735} {"train_loss": -27.873188018798828, "global_step": 559048, "epoch": 6735} {"train_loss": -27.671117782592773, "global_step": 559049, "epoch": 6735} {"train_loss": -27.481815338134766, "global_step": 559050, "epoch": 6735} {"train_loss": -27.835309982299805, "global_step": 559051, "epoch": 6735} {"train_loss": -27.585418701171875, "global_step": 559052, "epoch": 6735} {"train_loss": -27.870187759399414, "global_step": 559053, "epoch": 6735} {"train_loss": -27.806598663330078, "global_step": 559054, "epoch": 6735} {"train_loss": -27.444250106811523, "global_step": 559055, "epoch": 6735} {"train_loss": -28.102590560913086, "global_step": 559056, "epoch": 6735} {"train_loss": -27.912067413330078, "global_step": 559057, "epoch": 6735} {"train_loss": -27.917829513549805, "global_step": 559058, "epoch": 6735} {"train_loss": -27.75368309020996, "global_step": 559059, "epoch": 6735} {"train_loss": -27.642791748046875, "global_step": 559060, "epoch": 6735} {"train_loss": -27.601612091064453, "global_step": 559061, "epoch": 6735} {"train_loss": -27.563251495361328, "global_step": 559062, "epoch": 6735} {"train_loss": -27.806493759155273, "global_step": 559063, "epoch": 6735} {"train_loss": -28.07472038269043, "global_step": 559064, "epoch": 6735} {"train_loss": -27.69658851623535, "global_step": 559065, "epoch": 6735} {"train_loss": -27.26873779296875, "global_step": 559066, "epoch": 6735} {"train_loss": -27.840961456298828, "global_step": 559067, "epoch": 6735} {"train_loss": -27.88886070251465, "global_step": 559068, "epoch": 6735} {"train_loss": -27.85243797302246, "global_step": 559069, "epoch": 6735} {"train_loss": -28.311777114868164, "global_step": 559070, "epoch": 6735} {"train_loss": -27.265899658203125, "global_step": 559071, "epoch": 6735} {"train_loss": -27.647348403930664, "global_step": 559072, "epoch": 6735} {"train_loss": -27.420501708984375, "global_step": 559073, "epoch": 6735} {"train_loss": -27.69550132751465, "global_step": 559074, "epoch": 6735} {"train_loss": -28.1568660736084, "global_step": 559075, "epoch": 6735} {"train_loss": -27.5612850189209, "global_step": 559076, "epoch": 6735} {"train_loss": -27.652057647705078, "global_step": 559077, "epoch": 6735} {"train_loss": -27.63654899597168, "global_step": 559078, "epoch": 6735} {"train_loss": -27.242847442626953, "global_step": 559079, "epoch": 6735} {"train_loss": -27.756689071655273, "global_step": 559080, "epoch": 6735} {"train_loss": -27.652713775634766, "global_step": 559081, "epoch": 6735} {"train_loss": -27.9223575592041, "global_step": 559082, "epoch": 6735} {"train_loss": -28.026874542236328, "global_step": 559083, "epoch": 6735} {"train_loss": -28.08479881286621, "global_step": 559084, "epoch": 6735} {"train_loss": -27.91852378845215, "global_step": 559085, "epoch": 6735} {"train_loss": -27.98712158203125, "global_step": 559086, "epoch": 6735} {"train_loss": -27.680083309311463, "global_step": 559087, "epoch": 6735, "val_loss": 6717461.0} {"train_loss": -25.87994384765625, "global_step": 559088, "epoch": 6736} {"train_loss": -26.098773956298828, "global_step": 559089, "epoch": 6736} {"train_loss": -26.20073890686035, "global_step": 559090, "epoch": 6736} {"train_loss": -26.273080825805664, "global_step": 559091, "epoch": 6736} {"train_loss": -26.140522003173828, "global_step": 559092, "epoch": 6736} {"train_loss": -26.755529403686523, "global_step": 559093, "epoch": 6736} {"train_loss": -26.231536865234375, "global_step": 559094, "epoch": 6736} {"train_loss": -26.415124893188477, "global_step": 559095, "epoch": 6736} {"train_loss": -27.11992835998535, "global_step": 559096, "epoch": 6736} {"train_loss": -26.839374542236328, "global_step": 559097, "epoch": 6736} {"train_loss": -26.914213180541992, "global_step": 559098, "epoch": 6736} {"train_loss": -26.623233795166016, "global_step": 559099, "epoch": 6736} {"train_loss": -27.28118324279785, "global_step": 559100, "epoch": 6736} {"train_loss": -27.429975509643555, "global_step": 559101, "epoch": 6736} {"train_loss": -27.33637046813965, "global_step": 559102, "epoch": 6736} {"train_loss": -27.246658325195312, "global_step": 559103, "epoch": 6736} {"train_loss": -27.354248046875, "global_step": 559104, "epoch": 6736} {"train_loss": -27.480453491210938, "global_step": 559105, "epoch": 6736} {"train_loss": -26.92132568359375, "global_step": 559106, "epoch": 6736} {"train_loss": -27.33652687072754, "global_step": 559107, "epoch": 6736} {"train_loss": -27.4522705078125, "global_step": 559108, "epoch": 6736} {"train_loss": -27.299942016601562, "global_step": 559109, "epoch": 6736} {"train_loss": -27.45509147644043, "global_step": 559110, "epoch": 6736} {"train_loss": -27.334394454956055, "global_step": 559111, "epoch": 6736} {"train_loss": -27.466596603393555, "global_step": 559112, "epoch": 6736} {"train_loss": -27.207082748413086, "global_step": 559113, "epoch": 6736} {"train_loss": -27.535802841186523, "global_step": 559114, "epoch": 6736} {"train_loss": -27.21973991394043, "global_step": 559115, "epoch": 6736} {"train_loss": -27.737152099609375, "global_step": 559116, "epoch": 6736} {"train_loss": -27.579498291015625, "global_step": 559117, "epoch": 6736} {"train_loss": -27.566144943237305, "global_step": 559118, "epoch": 6736} {"train_loss": -27.39716148376465, "global_step": 559119, "epoch": 6736} {"train_loss": -27.655241012573242, "global_step": 559120, "epoch": 6736} {"train_loss": -27.673648834228516, "global_step": 559121, "epoch": 6736} {"train_loss": -27.9884033203125, "global_step": 559122, "epoch": 6736} {"train_loss": -27.712995529174805, "global_step": 559123, "epoch": 6736} {"train_loss": -27.543241500854492, "global_step": 559124, "epoch": 6736} {"train_loss": -27.321786880493164, "global_step": 559125, "epoch": 6736} {"train_loss": -27.794036865234375, "global_step": 559126, "epoch": 6736} {"train_loss": -27.610944747924805, "global_step": 559127, "epoch": 6736} {"train_loss": -28.109750747680664, "global_step": 559128, "epoch": 6736} {"train_loss": -28.030073165893555, "global_step": 559129, "epoch": 6736} {"train_loss": -27.737882614135742, "global_step": 559130, "epoch": 6736} {"train_loss": -27.948450088500977, "global_step": 559131, "epoch": 6736} {"train_loss": -27.841867446899414, "global_step": 559132, "epoch": 6736} {"train_loss": -27.696643829345703, "global_step": 559133, "epoch": 6736} {"train_loss": -27.985593795776367, "global_step": 559134, "epoch": 6736} {"train_loss": -27.790576934814453, "global_step": 559135, "epoch": 6736} {"train_loss": -27.89239501953125, "global_step": 559136, "epoch": 6736} {"train_loss": -28.016651153564453, "global_step": 559137, "epoch": 6736} {"train_loss": -27.579919815063477, "global_step": 559138, "epoch": 6736} {"train_loss": -28.01824378967285, "global_step": 559139, "epoch": 6736} {"train_loss": -27.59297752380371, "global_step": 559140, "epoch": 6736} {"train_loss": -27.712772369384766, "global_step": 559141, "epoch": 6736} {"train_loss": -27.84309959411621, "global_step": 559142, "epoch": 6736} {"train_loss": -27.9849853515625, "global_step": 559143, "epoch": 6736} {"train_loss": -27.907581329345703, "global_step": 559144, "epoch": 6736} {"train_loss": -28.334150314331055, "global_step": 559145, "epoch": 6736} {"train_loss": -28.277301788330078, "global_step": 559146, "epoch": 6736} {"train_loss": -28.095062255859375, "global_step": 559147, "epoch": 6736} {"train_loss": -27.959487915039062, "global_step": 559148, "epoch": 6736} {"train_loss": -27.86395263671875, "global_step": 559149, "epoch": 6736} {"train_loss": -28.00307273864746, "global_step": 559150, "epoch": 6736} {"train_loss": -27.872037887573242, "global_step": 559151, "epoch": 6736} {"train_loss": -27.957788467407227, "global_step": 559152, "epoch": 6736} {"train_loss": -27.68059730529785, "global_step": 559153, "epoch": 6736} {"train_loss": -27.92864990234375, "global_step": 559154, "epoch": 6736} {"train_loss": -27.987470626831055, "global_step": 559155, "epoch": 6736} {"train_loss": -27.907785415649414, "global_step": 559156, "epoch": 6736} {"train_loss": -28.07086753845215, "global_step": 559157, "epoch": 6736} {"train_loss": -27.748441696166992, "global_step": 559158, "epoch": 6736} {"train_loss": -27.011524200439453, "global_step": 559159, "epoch": 6736} {"train_loss": -26.989215850830078, "global_step": 559160, "epoch": 6736} {"train_loss": -27.247182846069336, "global_step": 559161, "epoch": 6736} {"train_loss": -26.98712730407715, "global_step": 559162, "epoch": 6736} {"train_loss": -27.35943603515625, "global_step": 559163, "epoch": 6736} {"train_loss": -27.4578914642334, "global_step": 559164, "epoch": 6736} {"train_loss": -27.458499908447266, "global_step": 559165, "epoch": 6736} {"train_loss": -27.297351837158203, "global_step": 559166, "epoch": 6736} {"train_loss": -27.94293212890625, "global_step": 559167, "epoch": 6736} {"train_loss": -27.527570724487305, "global_step": 559168, "epoch": 6736} {"train_loss": -27.56391716003418, "global_step": 559169, "epoch": 6736} {"train_loss": -27.463610476758106, "global_step": 559170, "epoch": 6736, "val_loss": 6653085.0} {"train_loss": -27.307479858398438, "global_step": 559171, "epoch": 6737} {"train_loss": -27.0322322845459, "global_step": 559172, "epoch": 6737} {"train_loss": -26.871185302734375, "global_step": 559173, "epoch": 6737} {"train_loss": -27.07663917541504, "global_step": 559174, "epoch": 6737} {"train_loss": -27.32167625427246, "global_step": 559175, "epoch": 6737} {"train_loss": -26.7884464263916, "global_step": 559176, "epoch": 6737} {"train_loss": -27.765552520751953, "global_step": 559177, "epoch": 6737} {"train_loss": -27.277063369750977, "global_step": 559178, "epoch": 6737} {"train_loss": -27.36199951171875, "global_step": 559179, "epoch": 6737} {"train_loss": -27.419153213500977, "global_step": 559180, "epoch": 6737} {"train_loss": -27.64898109436035, "global_step": 559181, "epoch": 6737} {"train_loss": -27.322803497314453, "global_step": 559182, "epoch": 6737} {"train_loss": -27.289281845092773, "global_step": 559183, "epoch": 6737} {"train_loss": -27.299121856689453, "global_step": 559184, "epoch": 6737} {"train_loss": -27.40418815612793, "global_step": 559185, "epoch": 6737} {"train_loss": -27.62970542907715, "global_step": 559186, "epoch": 6737} {"train_loss": -27.865802764892578, "global_step": 559187, "epoch": 6737} {"train_loss": -27.6617431640625, "global_step": 559188, "epoch": 6737} {"train_loss": -27.9337215423584, "global_step": 559189, "epoch": 6737} {"train_loss": -27.064254760742188, "global_step": 559190, "epoch": 6737} {"train_loss": -27.68143653869629, "global_step": 559191, "epoch": 6737} {"train_loss": -27.806793212890625, "global_step": 559192, "epoch": 6737} {"train_loss": -27.780902862548828, "global_step": 559193, "epoch": 6737} {"train_loss": -27.56727409362793, "global_step": 559194, "epoch": 6737} {"train_loss": -27.739126205444336, "global_step": 559195, "epoch": 6737} {"train_loss": -27.8565673828125, "global_step": 559196, "epoch": 6737} {"train_loss": -28.11541175842285, "global_step": 559197, "epoch": 6737} {"train_loss": -27.549230575561523, "global_step": 559198, "epoch": 6737} {"train_loss": -27.4185848236084, "global_step": 559199, "epoch": 6737} {"train_loss": -28.12860107421875, "global_step": 559200, "epoch": 6737} {"train_loss": -27.843460083007812, "global_step": 559201, "epoch": 6737} {"train_loss": -27.87140464782715, "global_step": 559202, "epoch": 6737} {"train_loss": -27.797882080078125, "global_step": 559203, "epoch": 6737} {"train_loss": -27.971460342407227, "global_step": 559204, "epoch": 6737} {"train_loss": -27.952835083007812, "global_step": 559205, "epoch": 6737} {"train_loss": -27.597442626953125, "global_step": 559206, "epoch": 6737} {"train_loss": -28.392988204956055, "global_step": 559207, "epoch": 6737} {"train_loss": -28.150922775268555, "global_step": 559208, "epoch": 6737} {"train_loss": -27.959516525268555, "global_step": 559209, "epoch": 6737} {"train_loss": -28.2515811920166, "global_step": 559210, "epoch": 6737} {"train_loss": -27.868270874023438, "global_step": 559211, "epoch": 6737} {"train_loss": -27.985273361206055, "global_step": 559212, "epoch": 6737} {"train_loss": -27.825305938720703, "global_step": 559213, "epoch": 6737} {"train_loss": -28.5398006439209, "global_step": 559214, "epoch": 6737} {"train_loss": -27.7116756439209, "global_step": 559215, "epoch": 6737} {"train_loss": -27.409515380859375, "global_step": 559216, "epoch": 6737} {"train_loss": -26.539173126220703, "global_step": 559217, "epoch": 6737} {"train_loss": -26.380651473999023, "global_step": 559218, "epoch": 6737} {"train_loss": -27.14369773864746, "global_step": 559219, "epoch": 6737} {"train_loss": -27.908910751342773, "global_step": 559220, "epoch": 6737} {"train_loss": -27.048206329345703, "global_step": 559221, "epoch": 6737} {"train_loss": -27.25733757019043, "global_step": 559222, "epoch": 6737} {"train_loss": -27.441680908203125, "global_step": 559223, "epoch": 6737} {"train_loss": -27.603912353515625, "global_step": 559224, "epoch": 6737} {"train_loss": -27.742666244506836, "global_step": 559225, "epoch": 6737} {"train_loss": -27.317142486572266, "global_step": 559226, "epoch": 6737} {"train_loss": -28.216684341430664, "global_step": 559227, "epoch": 6737} {"train_loss": -27.568994522094727, "global_step": 559228, "epoch": 6737} {"train_loss": -27.812702178955078, "global_step": 559229, "epoch": 6737} {"train_loss": -27.61798095703125, "global_step": 559230, "epoch": 6737} {"train_loss": -27.928369522094727, "global_step": 559231, "epoch": 6737} {"train_loss": -27.848119735717773, "global_step": 559232, "epoch": 6737} {"train_loss": -27.491790771484375, "global_step": 559233, "epoch": 6737} {"train_loss": -27.036224365234375, "global_step": 559234, "epoch": 6737} {"train_loss": -27.530115127563477, "global_step": 559235, "epoch": 6737} {"train_loss": -27.69761085510254, "global_step": 559236, "epoch": 6737} {"train_loss": -27.1967716217041, "global_step": 559237, "epoch": 6737} {"train_loss": -27.375385284423828, "global_step": 559238, "epoch": 6737} {"train_loss": -28.014692306518555, "global_step": 559239, "epoch": 6737} {"train_loss": -27.957611083984375, "global_step": 559240, "epoch": 6737} {"train_loss": -27.803197860717773, "global_step": 559241, "epoch": 6737} {"train_loss": -27.648868560791016, "global_step": 559242, "epoch": 6737} {"train_loss": -28.019628524780273, "global_step": 559243, "epoch": 6737} {"train_loss": -28.0079345703125, "global_step": 559244, "epoch": 6737} {"train_loss": -27.46601676940918, "global_step": 559245, "epoch": 6737} {"train_loss": -27.5886287689209, "global_step": 559246, "epoch": 6737} {"train_loss": -27.866514205932617, "global_step": 559247, "epoch": 6737} {"train_loss": -27.752912521362305, "global_step": 559248, "epoch": 6737} {"train_loss": -27.818374633789062, "global_step": 559249, "epoch": 6737} {"train_loss": -27.972089767456055, "global_step": 559250, "epoch": 6737} {"train_loss": -28.22017478942871, "global_step": 559251, "epoch": 6737} {"train_loss": -28.030282974243164, "global_step": 559252, "epoch": 6737} {"train_loss": -27.64601948749588, "global_step": 559253, "epoch": 6737, "val_loss": 6575438.5} {"train_loss": -27.81104850769043, "global_step": 559254, "epoch": 6738} {"train_loss": -27.560522079467773, "global_step": 559255, "epoch": 6738} {"train_loss": -27.854450225830078, "global_step": 559256, "epoch": 6738} {"train_loss": -27.96124839782715, "global_step": 559257, "epoch": 6738} {"train_loss": -27.82074546813965, "global_step": 559258, "epoch": 6738} {"train_loss": -27.664886474609375, "global_step": 559259, "epoch": 6738} {"train_loss": -27.817296981811523, "global_step": 559260, "epoch": 6738} {"train_loss": -27.553190231323242, "global_step": 559261, "epoch": 6738} {"train_loss": -27.478992462158203, "global_step": 559262, "epoch": 6738} {"train_loss": -27.57958984375, "global_step": 559263, "epoch": 6738} {"train_loss": -27.51185417175293, "global_step": 559264, "epoch": 6738} {"train_loss": -27.915842056274414, "global_step": 559265, "epoch": 6738} {"train_loss": -27.473560333251953, "global_step": 559266, "epoch": 6738} {"train_loss": -27.38886070251465, "global_step": 559267, "epoch": 6738} {"train_loss": -27.831212997436523, "global_step": 559268, "epoch": 6738} {"train_loss": -27.996124267578125, "global_step": 559269, "epoch": 6738} {"train_loss": -27.692174911499023, "global_step": 559270, "epoch": 6738} {"train_loss": -27.85556983947754, "global_step": 559271, "epoch": 6738} {"train_loss": -27.792272567749023, "global_step": 559272, "epoch": 6738} {"train_loss": -27.73712158203125, "global_step": 559273, "epoch": 6738} {"train_loss": -27.987253189086914, "global_step": 559274, "epoch": 6738} {"train_loss": -27.78070640563965, "global_step": 559275, "epoch": 6738} {"train_loss": -28.02804946899414, "global_step": 559276, "epoch": 6738} {"train_loss": -28.047351837158203, "global_step": 559277, "epoch": 6738} {"train_loss": -27.968976974487305, "global_step": 559278, "epoch": 6738} {"train_loss": -27.90045166015625, "global_step": 559279, "epoch": 6738} {"train_loss": -28.35603141784668, "global_step": 559280, "epoch": 6738} {"train_loss": -27.756383895874023, "global_step": 559281, "epoch": 6738} {"train_loss": -27.90020179748535, "global_step": 559282, "epoch": 6738} {"train_loss": -27.779403686523438, "global_step": 559283, "epoch": 6738} {"train_loss": -28.046634674072266, "global_step": 559284, "epoch": 6738} {"train_loss": -28.02728843688965, "global_step": 559285, "epoch": 6738} {"train_loss": -27.70230484008789, "global_step": 559286, "epoch": 6738} {"train_loss": -27.850278854370117, "global_step": 559287, "epoch": 6738} {"train_loss": -27.96238136291504, "global_step": 559288, "epoch": 6738} {"train_loss": -27.633499145507812, "global_step": 559289, "epoch": 6738} {"train_loss": -28.253355026245117, "global_step": 559290, "epoch": 6738} {"train_loss": -28.06964111328125, "global_step": 559291, "epoch": 6738} {"train_loss": -27.857786178588867, "global_step": 559292, "epoch": 6738} {"train_loss": -28.073490142822266, "global_step": 559293, "epoch": 6738} {"train_loss": -27.789108276367188, "global_step": 559294, "epoch": 6738} {"train_loss": -28.161718368530273, "global_step": 559295, "epoch": 6738} {"train_loss": -28.009992599487305, "global_step": 559296, "epoch": 6738} {"train_loss": -28.135351181030273, "global_step": 559297, "epoch": 6738} {"train_loss": -28.053985595703125, "global_step": 559298, "epoch": 6738} {"train_loss": -27.645360946655273, "global_step": 559299, "epoch": 6738} {"train_loss": -27.97076416015625, "global_step": 559300, "epoch": 6738} {"train_loss": -28.0705623626709, "global_step": 559301, "epoch": 6738} {"train_loss": -28.25737953186035, "global_step": 559302, "epoch": 6738} {"train_loss": -27.870651245117188, "global_step": 559303, "epoch": 6738} {"train_loss": -27.916275024414062, "global_step": 559304, "epoch": 6738} {"train_loss": -27.990009307861328, "global_step": 559305, "epoch": 6738} {"train_loss": -27.896854400634766, "global_step": 559306, "epoch": 6738} {"train_loss": -27.600555419921875, "global_step": 559307, "epoch": 6738} {"train_loss": -27.7222957611084, "global_step": 559308, "epoch": 6738} {"train_loss": -27.485504150390625, "global_step": 559309, "epoch": 6738} {"train_loss": -27.75054931640625, "global_step": 559310, "epoch": 6738} {"train_loss": -28.310522079467773, "global_step": 559311, "epoch": 6738} {"train_loss": -28.008975982666016, "global_step": 559312, "epoch": 6738} {"train_loss": -28.0137882232666, "global_step": 559313, "epoch": 6738} {"train_loss": -27.648279190063477, "global_step": 559314, "epoch": 6738} {"train_loss": -27.242704391479492, "global_step": 559315, "epoch": 6738} {"train_loss": -27.228778839111328, "global_step": 559316, "epoch": 6738} {"train_loss": -27.585174560546875, "global_step": 559317, "epoch": 6738} {"train_loss": -28.043262481689453, "global_step": 559318, "epoch": 6738} {"train_loss": -28.280567169189453, "global_step": 559319, "epoch": 6738} {"train_loss": -27.744998931884766, "global_step": 559320, "epoch": 6738} {"train_loss": -27.51502799987793, "global_step": 559321, "epoch": 6738} {"train_loss": -27.455280303955078, "global_step": 559322, "epoch": 6738} {"train_loss": -27.679380416870117, "global_step": 559323, "epoch": 6738} {"train_loss": -27.2208251953125, "global_step": 559324, "epoch": 6738} {"train_loss": -27.67481803894043, "global_step": 559325, "epoch": 6738} {"train_loss": -27.717273712158203, "global_step": 559326, "epoch": 6738} {"train_loss": -27.538227081298828, "global_step": 559327, "epoch": 6738} {"train_loss": -27.68219566345215, "global_step": 559328, "epoch": 6738} {"train_loss": -27.531763076782227, "global_step": 559329, "epoch": 6738} {"train_loss": -27.54083251953125, "global_step": 559330, "epoch": 6738} {"train_loss": -27.498016357421875, "global_step": 559331, "epoch": 6738} {"train_loss": -27.645055770874023, "global_step": 559332, "epoch": 6738} {"train_loss": -27.646148681640625, "global_step": 559333, "epoch": 6738} {"train_loss": -27.39191246032715, "global_step": 559334, "epoch": 6738} {"train_loss": -27.762039184570312, "global_step": 559335, "epoch": 6738} {"train_loss": -27.781808439507543, "global_step": 559336, "epoch": 6738, "val_loss": 6536039.0} {"train_loss": -25.312931060791016, "global_step": 559337, "epoch": 6739} {"train_loss": -25.552780151367188, "global_step": 559338, "epoch": 6739} {"train_loss": -26.222888946533203, "global_step": 559339, "epoch": 6739} {"train_loss": -26.751083374023438, "global_step": 559340, "epoch": 6739} {"train_loss": -25.632007598876953, "global_step": 559341, "epoch": 6739} {"train_loss": -25.975629806518555, "global_step": 559342, "epoch": 6739} {"train_loss": -26.088287353515625, "global_step": 559343, "epoch": 6739} {"train_loss": -25.781173706054688, "global_step": 559344, "epoch": 6739} {"train_loss": -26.635650634765625, "global_step": 559345, "epoch": 6739} {"train_loss": -26.759552001953125, "global_step": 559346, "epoch": 6739} {"train_loss": -26.253372192382812, "global_step": 559347, "epoch": 6739} {"train_loss": -26.92829704284668, "global_step": 559348, "epoch": 6739} {"train_loss": -26.323139190673828, "global_step": 559349, "epoch": 6739} {"train_loss": -26.960037231445312, "global_step": 559350, "epoch": 6739} {"train_loss": -26.559789657592773, "global_step": 559351, "epoch": 6739} {"train_loss": -27.033679962158203, "global_step": 559352, "epoch": 6739} {"train_loss": -27.069971084594727, "global_step": 559353, "epoch": 6739} {"train_loss": -27.0767822265625, "global_step": 559354, "epoch": 6739} {"train_loss": -27.081884384155273, "global_step": 559355, "epoch": 6739} {"train_loss": -27.142175674438477, "global_step": 559356, "epoch": 6739} {"train_loss": -26.937030792236328, "global_step": 559357, "epoch": 6739} {"train_loss": -27.36872673034668, "global_step": 559358, "epoch": 6739} {"train_loss": -27.226755142211914, "global_step": 559359, "epoch": 6739} {"train_loss": -27.158935546875, "global_step": 559360, "epoch": 6739} {"train_loss": -27.4468994140625, "global_step": 559361, "epoch": 6739} {"train_loss": -27.451583862304688, "global_step": 559362, "epoch": 6739} {"train_loss": -27.607349395751953, "global_step": 559363, "epoch": 6739} {"train_loss": -27.589221954345703, "global_step": 559364, "epoch": 6739} {"train_loss": -27.379602432250977, "global_step": 559365, "epoch": 6739} {"train_loss": -27.568532943725586, "global_step": 559366, "epoch": 6739} {"train_loss": -27.50856590270996, "global_step": 559367, "epoch": 6739} {"train_loss": -27.669233322143555, "global_step": 559368, "epoch": 6739} {"train_loss": -27.549304962158203, "global_step": 559369, "epoch": 6739} {"train_loss": -27.66973876953125, "global_step": 559370, "epoch": 6739} {"train_loss": -27.736783981323242, "global_step": 559371, "epoch": 6739} {"train_loss": -27.460708618164062, "global_step": 559372, "epoch": 6739} {"train_loss": -27.759679794311523, "global_step": 559373, "epoch": 6739} {"train_loss": -27.594587326049805, "global_step": 559374, "epoch": 6739} {"train_loss": -28.128870010375977, "global_step": 559375, "epoch": 6739} {"train_loss": -27.568435668945312, "global_step": 559376, "epoch": 6739} {"train_loss": -27.626184463500977, "global_step": 559377, "epoch": 6739} {"train_loss": -27.678632736206055, "global_step": 559378, "epoch": 6739} {"train_loss": -27.923755645751953, "global_step": 559379, "epoch": 6739} {"train_loss": -27.831464767456055, "global_step": 559380, "epoch": 6739} {"train_loss": -27.570669174194336, "global_step": 559381, "epoch": 6739} {"train_loss": -27.95826530456543, "global_step": 559382, "epoch": 6739} {"train_loss": -27.902542114257812, "global_step": 559383, "epoch": 6739} {"train_loss": -28.07210350036621, "global_step": 559384, "epoch": 6739} {"train_loss": -28.06780433654785, "global_step": 559385, "epoch": 6739} {"train_loss": -27.958459854125977, "global_step": 559386, "epoch": 6739} {"train_loss": -27.772306442260742, "global_step": 559387, "epoch": 6739} {"train_loss": -28.113183975219727, "global_step": 559388, "epoch": 6739} {"train_loss": -27.918386459350586, "global_step": 559389, "epoch": 6739} {"train_loss": -27.990345001220703, "global_step": 559390, "epoch": 6739} {"train_loss": -27.548324584960938, "global_step": 559391, "epoch": 6739} {"train_loss": -27.937274932861328, "global_step": 559392, "epoch": 6739} {"train_loss": -27.97608757019043, "global_step": 559393, "epoch": 6739} {"train_loss": -27.813678741455078, "global_step": 559394, "epoch": 6739} {"train_loss": -27.380996704101562, "global_step": 559395, "epoch": 6739} {"train_loss": -27.194005966186523, "global_step": 559396, "epoch": 6739} {"train_loss": -26.541166305541992, "global_step": 559397, "epoch": 6739} {"train_loss": -26.576004028320312, "global_step": 559398, "epoch": 6739} {"train_loss": -27.31403923034668, "global_step": 559399, "epoch": 6739} {"train_loss": -27.755462646484375, "global_step": 559400, "epoch": 6739} {"train_loss": -27.84909439086914, "global_step": 559401, "epoch": 6739} {"train_loss": -27.604528427124023, "global_step": 559402, "epoch": 6739} {"train_loss": -27.36553382873535, "global_step": 559403, "epoch": 6739} {"train_loss": -27.994104385375977, "global_step": 559404, "epoch": 6739} {"train_loss": -27.7005672454834, "global_step": 559405, "epoch": 6739} {"train_loss": -27.27695655822754, "global_step": 559406, "epoch": 6739} {"train_loss": -27.792776107788086, "global_step": 559407, "epoch": 6739} {"train_loss": -27.515668869018555, "global_step": 559408, "epoch": 6739} {"train_loss": -27.649463653564453, "global_step": 559409, "epoch": 6739} {"train_loss": -27.673852920532227, "global_step": 559410, "epoch": 6739} {"train_loss": -27.7139835357666, "global_step": 559411, "epoch": 6739} {"train_loss": -27.91755485534668, "global_step": 559412, "epoch": 6739} {"train_loss": -27.32785415649414, "global_step": 559413, "epoch": 6739} {"train_loss": -27.792163848876953, "global_step": 559414, "epoch": 6739} {"train_loss": -27.86573600769043, "global_step": 559415, "epoch": 6739} {"train_loss": -27.6912899017334, "global_step": 559416, "epoch": 6739} {"train_loss": -27.798566818237305, "global_step": 559417, "epoch": 6739} {"train_loss": -27.482511520385742, "global_step": 559418, "epoch": 6739} {"train_loss": -27.335576827267566, "global_step": 559419, "epoch": 6739, "val_loss": 6579502.0} {"train_loss": -26.735382080078125, "global_step": 559420, "epoch": 6740} {"train_loss": -26.42365837097168, "global_step": 559421, "epoch": 6740} {"train_loss": -27.246490478515625, "global_step": 559422, "epoch": 6740} {"train_loss": -27.2174072265625, "global_step": 559423, "epoch": 6740} {"train_loss": -26.857009887695312, "global_step": 559424, "epoch": 6740} {"train_loss": -27.17133140563965, "global_step": 559425, "epoch": 6740} {"train_loss": -27.042022705078125, "global_step": 559426, "epoch": 6740} {"train_loss": -26.87430191040039, "global_step": 559427, "epoch": 6740} {"train_loss": -26.930200576782227, "global_step": 559428, "epoch": 6740} {"train_loss": -27.16852378845215, "global_step": 559429, "epoch": 6740} {"train_loss": -27.543893814086914, "global_step": 559430, "epoch": 6740} {"train_loss": -27.071884155273438, "global_step": 559431, "epoch": 6740} {"train_loss": -26.83343505859375, "global_step": 559432, "epoch": 6740} {"train_loss": -27.3653621673584, "global_step": 559433, "epoch": 6740} {"train_loss": -27.084949493408203, "global_step": 559434, "epoch": 6740} {"train_loss": -27.5158748626709, "global_step": 559435, "epoch": 6740} {"train_loss": -27.25543212890625, "global_step": 559436, "epoch": 6740} {"train_loss": -27.169279098510742, "global_step": 559437, "epoch": 6740} {"train_loss": -27.9550724029541, "global_step": 559438, "epoch": 6740} {"train_loss": -27.502948760986328, "global_step": 559439, "epoch": 6740} {"train_loss": -27.580738067626953, "global_step": 559440, "epoch": 6740} {"train_loss": -27.476245880126953, "global_step": 559441, "epoch": 6740} {"train_loss": -27.7812557220459, "global_step": 559442, "epoch": 6740} {"train_loss": -27.2722225189209, "global_step": 559443, "epoch": 6740} {"train_loss": -27.258886337280273, "global_step": 559444, "epoch": 6740} {"train_loss": -27.2728271484375, "global_step": 559445, "epoch": 6740} {"train_loss": -26.45944595336914, "global_step": 559446, "epoch": 6740} {"train_loss": -27.616943359375, "global_step": 559447, "epoch": 6740} {"train_loss": -26.4470157623291, "global_step": 559448, "epoch": 6740} {"train_loss": -27.5729923248291, "global_step": 559449, "epoch": 6740} {"train_loss": -27.535120010375977, "global_step": 559450, "epoch": 6740} {"train_loss": -27.628461837768555, "global_step": 559451, "epoch": 6740} {"train_loss": -27.738418579101562, "global_step": 559452, "epoch": 6740} {"train_loss": -27.499494552612305, "global_step": 559453, "epoch": 6740} {"train_loss": -27.800556182861328, "global_step": 559454, "epoch": 6740} {"train_loss": -27.724130630493164, "global_step": 559455, "epoch": 6740} {"train_loss": -27.60269546508789, "global_step": 559456, "epoch": 6740} {"train_loss": -27.538818359375, "global_step": 559457, "epoch": 6740} {"train_loss": -27.509098052978516, "global_step": 559458, "epoch": 6740} {"train_loss": -27.960086822509766, "global_step": 559459, "epoch": 6740} {"train_loss": -27.794605255126953, "global_step": 559460, "epoch": 6740} {"train_loss": -27.897052764892578, "global_step": 559461, "epoch": 6740} {"train_loss": -27.5467472076416, "global_step": 559462, "epoch": 6740} {"train_loss": -27.597614288330078, "global_step": 559463, "epoch": 6740} {"train_loss": -27.914905548095703, "global_step": 559464, "epoch": 6740} {"train_loss": -27.72566795349121, "global_step": 559465, "epoch": 6740} {"train_loss": -27.70050621032715, "global_step": 559466, "epoch": 6740} {"train_loss": -27.912857055664062, "global_step": 559467, "epoch": 6740} {"train_loss": -27.6531982421875, "global_step": 559468, "epoch": 6740} {"train_loss": -27.920255661010742, "global_step": 559469, "epoch": 6740} {"train_loss": -27.50925636291504, "global_step": 559470, "epoch": 6740} {"train_loss": -27.561981201171875, "global_step": 559471, "epoch": 6740} {"train_loss": -27.846609115600586, "global_step": 559472, "epoch": 6740} {"train_loss": -27.740934371948242, "global_step": 559473, "epoch": 6740} {"train_loss": -27.893890380859375, "global_step": 559474, "epoch": 6740} {"train_loss": -27.8643856048584, "global_step": 559475, "epoch": 6740} {"train_loss": -27.901763916015625, "global_step": 559476, "epoch": 6740} {"train_loss": -27.68634033203125, "global_step": 559477, "epoch": 6740} {"train_loss": -27.65449333190918, "global_step": 559478, "epoch": 6740} {"train_loss": -28.01934814453125, "global_step": 559479, "epoch": 6740} {"train_loss": -27.9527530670166, "global_step": 559480, "epoch": 6740} {"train_loss": -27.636682510375977, "global_step": 559481, "epoch": 6740} {"train_loss": -28.005563735961914, "global_step": 559482, "epoch": 6740} {"train_loss": -27.903736114501953, "global_step": 559483, "epoch": 6740} {"train_loss": -27.68548583984375, "global_step": 559484, "epoch": 6740} {"train_loss": -27.623748779296875, "global_step": 559485, "epoch": 6740} {"train_loss": -27.99796485900879, "global_step": 559486, "epoch": 6740} {"train_loss": -28.132740020751953, "global_step": 559487, "epoch": 6740} {"train_loss": -27.799579620361328, "global_step": 559488, "epoch": 6740} {"train_loss": -27.986194610595703, "global_step": 559489, "epoch": 6740} {"train_loss": -27.90723991394043, "global_step": 559490, "epoch": 6740} {"train_loss": -27.68507194519043, "global_step": 559491, "epoch": 6740} {"train_loss": -27.845823287963867, "global_step": 559492, "epoch": 6740} {"train_loss": -27.499988555908203, "global_step": 559493, "epoch": 6740} {"train_loss": -27.47039794921875, "global_step": 559494, "epoch": 6740} {"train_loss": -27.383468627929688, "global_step": 559495, "epoch": 6740} {"train_loss": -27.476240158081055, "global_step": 559496, "epoch": 6740} {"train_loss": -27.464506149291992, "global_step": 559497, "epoch": 6740} {"train_loss": -28.050525665283203, "global_step": 559498, "epoch": 6740} {"train_loss": -28.060333251953125, "global_step": 559499, "epoch": 6740} {"train_loss": -27.661718368530273, "global_step": 559500, "epoch": 6740} {"train_loss": -28.157062530517578, "global_step": 559501, "epoch": 6740} {"train_loss": -27.565700576966066, "global_step": 559502, "epoch": 6740, "val_loss": 6586403.0} {"train_loss": -25.777135848999023, "global_step": 559503, "epoch": 6741} {"train_loss": -26.20924186706543, "global_step": 559504, "epoch": 6741} {"train_loss": -26.68948745727539, "global_step": 559505, "epoch": 6741} {"train_loss": -26.972827911376953, "global_step": 559506, "epoch": 6741} {"train_loss": -25.466798782348633, "global_step": 559507, "epoch": 6741} {"train_loss": -26.27252769470215, "global_step": 559508, "epoch": 6741} {"train_loss": -27.181854248046875, "global_step": 559509, "epoch": 6741} {"train_loss": -27.24055290222168, "global_step": 559510, "epoch": 6741} {"train_loss": -25.928268432617188, "global_step": 559511, "epoch": 6741} {"train_loss": -27.060962677001953, "global_step": 559512, "epoch": 6741} {"train_loss": -27.151037216186523, "global_step": 559513, "epoch": 6741} {"train_loss": -27.4599666595459, "global_step": 559514, "epoch": 6741} {"train_loss": -27.299091339111328, "global_step": 559515, "epoch": 6741} {"train_loss": -27.128625869750977, "global_step": 559516, "epoch": 6741} {"train_loss": -26.9742488861084, "global_step": 559517, "epoch": 6741} {"train_loss": -27.462430953979492, "global_step": 559518, "epoch": 6741} {"train_loss": -27.254560470581055, "global_step": 559519, "epoch": 6741} {"train_loss": -27.241104125976562, "global_step": 559520, "epoch": 6741} {"train_loss": -27.771808624267578, "global_step": 559521, "epoch": 6741} {"train_loss": -27.607471466064453, "global_step": 559522, "epoch": 6741} {"train_loss": -27.38532829284668, "global_step": 559523, "epoch": 6741} {"train_loss": -26.856534957885742, "global_step": 559524, "epoch": 6741} {"train_loss": -27.183277130126953, "global_step": 559525, "epoch": 6741} {"train_loss": -27.554025650024414, "global_step": 559526, "epoch": 6741} {"train_loss": -27.273223876953125, "global_step": 559527, "epoch": 6741} {"train_loss": -27.12891960144043, "global_step": 559528, "epoch": 6741} {"train_loss": -27.412439346313477, "global_step": 559529, "epoch": 6741} {"train_loss": -27.9892635345459, "global_step": 559530, "epoch": 6741} {"train_loss": -27.406843185424805, "global_step": 559531, "epoch": 6741} {"train_loss": -27.866321563720703, "global_step": 559532, "epoch": 6741} {"train_loss": -27.831106185913086, "global_step": 559533, "epoch": 6741} {"train_loss": -27.371002197265625, "global_step": 559534, "epoch": 6741} {"train_loss": -27.563709259033203, "global_step": 559535, "epoch": 6741} {"train_loss": -27.7025146484375, "global_step": 559536, "epoch": 6741} {"train_loss": -27.461278915405273, "global_step": 559537, "epoch": 6741} {"train_loss": -27.381139755249023, "global_step": 559538, "epoch": 6741} {"train_loss": -27.95111083984375, "global_step": 559539, "epoch": 6741} {"train_loss": -27.5880069732666, "global_step": 559540, "epoch": 6741} {"train_loss": -27.505908966064453, "global_step": 559541, "epoch": 6741} {"train_loss": -27.968114852905273, "global_step": 559542, "epoch": 6741} {"train_loss": -27.475570678710938, "global_step": 559543, "epoch": 6741} {"train_loss": -27.49879264831543, "global_step": 559544, "epoch": 6741} {"train_loss": -27.9460391998291, "global_step": 559545, "epoch": 6741} {"train_loss": -27.9571475982666, "global_step": 559546, "epoch": 6741} {"train_loss": -27.73239517211914, "global_step": 559547, "epoch": 6741} {"train_loss": -28.198917388916016, "global_step": 559548, "epoch": 6741} {"train_loss": -27.739917755126953, "global_step": 559549, "epoch": 6741} {"train_loss": -27.73992347717285, "global_step": 559550, "epoch": 6741} {"train_loss": -27.70905113220215, "global_step": 559551, "epoch": 6741} {"train_loss": -27.575702667236328, "global_step": 559552, "epoch": 6741} {"train_loss": -27.55293846130371, "global_step": 559553, "epoch": 6741} {"train_loss": -27.7432918548584, "global_step": 559554, "epoch": 6741} {"train_loss": -27.8103084564209, "global_step": 559555, "epoch": 6741} {"train_loss": -28.163644790649414, "global_step": 559556, "epoch": 6741} {"train_loss": -27.360822677612305, "global_step": 559557, "epoch": 6741} {"train_loss": -27.589879989624023, "global_step": 559558, "epoch": 6741} {"train_loss": -27.255435943603516, "global_step": 559559, "epoch": 6741} {"train_loss": -27.711719512939453, "global_step": 559560, "epoch": 6741} {"train_loss": -27.44184684753418, "global_step": 559561, "epoch": 6741} {"train_loss": -27.736602783203125, "global_step": 559562, "epoch": 6741} {"train_loss": -27.421483993530273, "global_step": 559563, "epoch": 6741} {"train_loss": -27.567407608032227, "global_step": 559564, "epoch": 6741} {"train_loss": -26.862516403198242, "global_step": 559565, "epoch": 6741} {"train_loss": -27.70366859436035, "global_step": 559566, "epoch": 6741} {"train_loss": -27.093414306640625, "global_step": 559567, "epoch": 6741} {"train_loss": -27.6832275390625, "global_step": 559568, "epoch": 6741} {"train_loss": -27.613508224487305, "global_step": 559569, "epoch": 6741} {"train_loss": -27.80828285217285, "global_step": 559570, "epoch": 6741} {"train_loss": -28.00785255432129, "global_step": 559571, "epoch": 6741} {"train_loss": -27.64239501953125, "global_step": 559572, "epoch": 6741} {"train_loss": -27.753198623657227, "global_step": 559573, "epoch": 6741} {"train_loss": -27.81546974182129, "global_step": 559574, "epoch": 6741} {"train_loss": -27.529163360595703, "global_step": 559575, "epoch": 6741} {"train_loss": -27.86421012878418, "global_step": 559576, "epoch": 6741} {"train_loss": -27.789499282836914, "global_step": 559577, "epoch": 6741} {"train_loss": -27.4949951171875, "global_step": 559578, "epoch": 6741} {"train_loss": -27.935232162475586, "global_step": 559579, "epoch": 6741} {"train_loss": -27.741682052612305, "global_step": 559580, "epoch": 6741} {"train_loss": -27.87013816833496, "global_step": 559581, "epoch": 6741} {"train_loss": -27.849231719970703, "global_step": 559582, "epoch": 6741} {"train_loss": -27.68528175354004, "global_step": 559583, "epoch": 6741} {"train_loss": -27.91866111755371, "global_step": 559584, "epoch": 6741} {"train_loss": -27.460547527634954, "global_step": 559585, "epoch": 6741, "val_loss": 6373724.5} {"train_loss": -27.586200714111328, "global_step": 559586, "epoch": 6742} {"train_loss": -27.42396354675293, "global_step": 559587, "epoch": 6742} {"train_loss": -27.368427276611328, "global_step": 559588, "epoch": 6742} {"train_loss": -27.43192481994629, "global_step": 559589, "epoch": 6742} {"train_loss": -26.879392623901367, "global_step": 559590, "epoch": 6742} {"train_loss": -27.369470596313477, "global_step": 559591, "epoch": 6742} {"train_loss": -27.60292625427246, "global_step": 559592, "epoch": 6742} {"train_loss": -27.601057052612305, "global_step": 559593, "epoch": 6742} {"train_loss": -27.528406143188477, "global_step": 559594, "epoch": 6742} {"train_loss": -27.247425079345703, "global_step": 559595, "epoch": 6742} {"train_loss": -27.38062858581543, "global_step": 559596, "epoch": 6742} {"train_loss": -27.150556564331055, "global_step": 559597, "epoch": 6742} {"train_loss": -27.90740966796875, "global_step": 559598, "epoch": 6742} {"train_loss": -27.32989501953125, "global_step": 559599, "epoch": 6742} {"train_loss": -27.68024253845215, "global_step": 559600, "epoch": 6742} {"train_loss": -27.718122482299805, "global_step": 559601, "epoch": 6742} {"train_loss": -27.485483169555664, "global_step": 559602, "epoch": 6742} {"train_loss": -27.458908081054688, "global_step": 559603, "epoch": 6742} {"train_loss": -27.74140739440918, "global_step": 559604, "epoch": 6742} {"train_loss": -27.4280948638916, "global_step": 559605, "epoch": 6742} {"train_loss": -27.393415451049805, "global_step": 559606, "epoch": 6742} {"train_loss": -28.0252685546875, "global_step": 559607, "epoch": 6742} {"train_loss": -27.810720443725586, "global_step": 559608, "epoch": 6742} {"train_loss": -27.64515495300293, "global_step": 559609, "epoch": 6742} {"train_loss": -27.7163143157959, "global_step": 559610, "epoch": 6742} {"train_loss": -28.05988121032715, "global_step": 559611, "epoch": 6742} {"train_loss": -27.813831329345703, "global_step": 559612, "epoch": 6742} {"train_loss": -27.708349227905273, "global_step": 559613, "epoch": 6742} {"train_loss": -27.55282974243164, "global_step": 559614, "epoch": 6742} {"train_loss": -27.841581344604492, "global_step": 559615, "epoch": 6742} {"train_loss": -27.716054916381836, "global_step": 559616, "epoch": 6742} {"train_loss": -27.81743812561035, "global_step": 559617, "epoch": 6742} {"train_loss": -27.766754150390625, "global_step": 559618, "epoch": 6742} {"train_loss": -27.747589111328125, "global_step": 559619, "epoch": 6742} {"train_loss": -27.768325805664062, "global_step": 559620, "epoch": 6742} {"train_loss": -27.79383659362793, "global_step": 559621, "epoch": 6742} {"train_loss": -27.61567497253418, "global_step": 559622, "epoch": 6742} {"train_loss": -28.15461540222168, "global_step": 559623, "epoch": 6742} {"train_loss": -27.96112632751465, "global_step": 559624, "epoch": 6742} {"train_loss": -27.838586807250977, "global_step": 559625, "epoch": 6742} {"train_loss": -27.84319496154785, "global_step": 559626, "epoch": 6742} {"train_loss": -27.704771041870117, "global_step": 559627, "epoch": 6742} {"train_loss": -27.72498893737793, "global_step": 559628, "epoch": 6742} {"train_loss": -27.877471923828125, "global_step": 559629, "epoch": 6742} {"train_loss": -27.87302589416504, "global_step": 559630, "epoch": 6742} {"train_loss": -28.139814376831055, "global_step": 559631, "epoch": 6742} {"train_loss": -27.80738639831543, "global_step": 559632, "epoch": 6742} {"train_loss": -27.8387451171875, "global_step": 559633, "epoch": 6742} {"train_loss": -27.83258628845215, "global_step": 559634, "epoch": 6742} {"train_loss": -28.03376579284668, "global_step": 559635, "epoch": 6742} {"train_loss": -27.896137237548828, "global_step": 559636, "epoch": 6742} {"train_loss": -27.833160400390625, "global_step": 559637, "epoch": 6742} {"train_loss": -28.0517520904541, "global_step": 559638, "epoch": 6742} {"train_loss": -27.917821884155273, "global_step": 559639, "epoch": 6742} {"train_loss": -27.60113525390625, "global_step": 559640, "epoch": 6742} {"train_loss": -27.94827651977539, "global_step": 559641, "epoch": 6742} {"train_loss": -27.903583526611328, "global_step": 559642, "epoch": 6742} {"train_loss": -27.755130767822266, "global_step": 559643, "epoch": 6742} {"train_loss": -27.972091674804688, "global_step": 559644, "epoch": 6742} {"train_loss": -28.008237838745117, "global_step": 559645, "epoch": 6742} {"train_loss": -27.862009048461914, "global_step": 559646, "epoch": 6742} {"train_loss": -28.09794044494629, "global_step": 559647, "epoch": 6742} {"train_loss": -27.95795249938965, "global_step": 559648, "epoch": 6742} {"train_loss": -27.853208541870117, "global_step": 559649, "epoch": 6742} {"train_loss": -27.34016227722168, "global_step": 559650, "epoch": 6742} {"train_loss": -27.41910743713379, "global_step": 559651, "epoch": 6742} {"train_loss": -26.863937377929688, "global_step": 559652, "epoch": 6742} {"train_loss": -26.97930908203125, "global_step": 559653, "epoch": 6742} {"train_loss": -27.203195571899414, "global_step": 559654, "epoch": 6742} {"train_loss": -27.4600830078125, "global_step": 559655, "epoch": 6742} {"train_loss": -27.887134552001953, "global_step": 559656, "epoch": 6742} {"train_loss": -27.673664093017578, "global_step": 559657, "epoch": 6742} {"train_loss": -27.813581466674805, "global_step": 559658, "epoch": 6742} {"train_loss": -27.756011962890625, "global_step": 559659, "epoch": 6742} {"train_loss": -27.76161766052246, "global_step": 559660, "epoch": 6742} {"train_loss": -28.108844757080078, "global_step": 559661, "epoch": 6742} {"train_loss": -27.666366577148438, "global_step": 559662, "epoch": 6742} {"train_loss": -27.679706573486328, "global_step": 559663, "epoch": 6742} {"train_loss": -27.714170455932617, "global_step": 559664, "epoch": 6742} {"train_loss": -28.079853057861328, "global_step": 559665, "epoch": 6742} {"train_loss": -27.946887969970703, "global_step": 559666, "epoch": 6742} {"train_loss": -28.011581420898438, "global_step": 559667, "epoch": 6742} {"train_loss": -27.706896333809357, "global_step": 559668, "epoch": 6742, "val_loss": 6385584.0} {"train_loss": -27.37883949279785, "global_step": 559669, "epoch": 6743} {"train_loss": -26.58711051940918, "global_step": 559670, "epoch": 6743} {"train_loss": -27.165693283081055, "global_step": 559671, "epoch": 6743} {"train_loss": -26.84160804748535, "global_step": 559672, "epoch": 6743} {"train_loss": -27.3013973236084, "global_step": 559673, "epoch": 6743} {"train_loss": -27.589069366455078, "global_step": 559674, "epoch": 6743} {"train_loss": -27.085840225219727, "global_step": 559675, "epoch": 6743} {"train_loss": -27.130239486694336, "global_step": 559676, "epoch": 6743} {"train_loss": -27.157440185546875, "global_step": 559677, "epoch": 6743} {"train_loss": -27.21368408203125, "global_step": 559678, "epoch": 6743} {"train_loss": -27.174041748046875, "global_step": 559679, "epoch": 6743} {"train_loss": -27.600141525268555, "global_step": 559680, "epoch": 6743} {"train_loss": -27.1170654296875, "global_step": 559681, "epoch": 6743} {"train_loss": -27.367834091186523, "global_step": 559682, "epoch": 6743} {"train_loss": -27.632904052734375, "global_step": 559683, "epoch": 6743} {"train_loss": -27.13874626159668, "global_step": 559684, "epoch": 6743} {"train_loss": -27.41752052307129, "global_step": 559685, "epoch": 6743} {"train_loss": -27.797006607055664, "global_step": 559686, "epoch": 6743} {"train_loss": -27.241657257080078, "global_step": 559687, "epoch": 6743} {"train_loss": -27.352832794189453, "global_step": 559688, "epoch": 6743} {"train_loss": -27.744525909423828, "global_step": 559689, "epoch": 6743} {"train_loss": -27.7259578704834, "global_step": 559690, "epoch": 6743} {"train_loss": -27.4379825592041, "global_step": 559691, "epoch": 6743} {"train_loss": -27.376117706298828, "global_step": 559692, "epoch": 6743} {"train_loss": -27.27362060546875, "global_step": 559693, "epoch": 6743} {"train_loss": -27.764942169189453, "global_step": 559694, "epoch": 6743} {"train_loss": -27.481382369995117, "global_step": 559695, "epoch": 6743} {"train_loss": -27.395843505859375, "global_step": 559696, "epoch": 6743} {"train_loss": -27.79609489440918, "global_step": 559697, "epoch": 6743} {"train_loss": -27.65413475036621, "global_step": 559698, "epoch": 6743} {"train_loss": -27.568134307861328, "global_step": 559699, "epoch": 6743} {"train_loss": -27.38469886779785, "global_step": 559700, "epoch": 6743} {"train_loss": -27.58807945251465, "global_step": 559701, "epoch": 6743} {"train_loss": -27.343107223510742, "global_step": 559702, "epoch": 6743} {"train_loss": -27.477380752563477, "global_step": 559703, "epoch": 6743} {"train_loss": -27.736480712890625, "global_step": 559704, "epoch": 6743} {"train_loss": -27.803373336791992, "global_step": 559705, "epoch": 6743} {"train_loss": -27.982650756835938, "global_step": 559706, "epoch": 6743} {"train_loss": -27.69280433654785, "global_step": 559707, "epoch": 6743} {"train_loss": -28.112262725830078, "global_step": 559708, "epoch": 6743} {"train_loss": -28.24500846862793, "global_step": 559709, "epoch": 6743} {"train_loss": -27.821613311767578, "global_step": 559710, "epoch": 6743} {"train_loss": -27.85308837890625, "global_step": 559711, "epoch": 6743} {"train_loss": -27.74820327758789, "global_step": 559712, "epoch": 6743} {"train_loss": -27.68662452697754, "global_step": 559713, "epoch": 6743} {"train_loss": -27.642663955688477, "global_step": 559714, "epoch": 6743} {"train_loss": -27.422330856323242, "global_step": 559715, "epoch": 6743} {"train_loss": -27.816436767578125, "global_step": 559716, "epoch": 6743} {"train_loss": -28.07415199279785, "global_step": 559717, "epoch": 6743} {"train_loss": -28.291717529296875, "global_step": 559718, "epoch": 6743} {"train_loss": -27.8306827545166, "global_step": 559719, "epoch": 6743} {"train_loss": -27.623456954956055, "global_step": 559720, "epoch": 6743} {"train_loss": -27.827707290649414, "global_step": 559721, "epoch": 6743} {"train_loss": -27.8874568939209, "global_step": 559722, "epoch": 6743} {"train_loss": -28.04361343383789, "global_step": 559723, "epoch": 6743} {"train_loss": -27.21295738220215, "global_step": 559724, "epoch": 6743} {"train_loss": -27.82209587097168, "global_step": 559725, "epoch": 6743} {"train_loss": -27.599721908569336, "global_step": 559726, "epoch": 6743} {"train_loss": -27.588947296142578, "global_step": 559727, "epoch": 6743} {"train_loss": -27.29046630859375, "global_step": 559728, "epoch": 6743} {"train_loss": -27.923017501831055, "global_step": 559729, "epoch": 6743} {"train_loss": -27.692005157470703, "global_step": 559730, "epoch": 6743} {"train_loss": -28.022497177124023, "global_step": 559731, "epoch": 6743} {"train_loss": -28.063751220703125, "global_step": 559732, "epoch": 6743} {"train_loss": -27.75172233581543, "global_step": 559733, "epoch": 6743} {"train_loss": -27.8248291015625, "global_step": 559734, "epoch": 6743} {"train_loss": -27.715839385986328, "global_step": 559735, "epoch": 6743} {"train_loss": -27.787771224975586, "global_step": 559736, "epoch": 6743} {"train_loss": -28.113494873046875, "global_step": 559737, "epoch": 6743} {"train_loss": -28.1346435546875, "global_step": 559738, "epoch": 6743} {"train_loss": -27.9345760345459, "global_step": 559739, "epoch": 6743} {"train_loss": -27.75763511657715, "global_step": 559740, "epoch": 6743} {"train_loss": -28.247541427612305, "global_step": 559741, "epoch": 6743} {"train_loss": -28.14950942993164, "global_step": 559742, "epoch": 6743} {"train_loss": -28.078195571899414, "global_step": 559743, "epoch": 6743} {"train_loss": -27.8027286529541, "global_step": 559744, "epoch": 6743} {"train_loss": -27.867673873901367, "global_step": 559745, "epoch": 6743} {"train_loss": -27.770437240600586, "global_step": 559746, "epoch": 6743} {"train_loss": -27.258575439453125, "global_step": 559747, "epoch": 6743} {"train_loss": -26.6095027923584, "global_step": 559748, "epoch": 6743} {"train_loss": -26.958179473876953, "global_step": 559749, "epoch": 6743} {"train_loss": -27.52235984802246, "global_step": 559750, "epoch": 6743} {"train_loss": -27.619959842727845, "global_step": 559751, "epoch": 6743, "val_loss": 6400310.5} {"train_loss": -22.203161239624023, "global_step": 559752, "epoch": 6744} {"train_loss": -25.602542877197266, "global_step": 559753, "epoch": 6744} {"train_loss": -22.926074981689453, "global_step": 559754, "epoch": 6744} {"train_loss": -25.46918296813965, "global_step": 559755, "epoch": 6744} {"train_loss": -24.877906799316406, "global_step": 559756, "epoch": 6744} {"train_loss": -24.617855072021484, "global_step": 559757, "epoch": 6744} {"train_loss": -24.850358963012695, "global_step": 559758, "epoch": 6744} {"train_loss": -25.129987716674805, "global_step": 559759, "epoch": 6744} {"train_loss": -24.952407836914062, "global_step": 559760, "epoch": 6744} {"train_loss": -25.985824584960938, "global_step": 559761, "epoch": 6744} {"train_loss": -25.590425491333008, "global_step": 559762, "epoch": 6744} {"train_loss": -24.831729888916016, "global_step": 559763, "epoch": 6744} {"train_loss": -26.034317016601562, "global_step": 559764, "epoch": 6744} {"train_loss": -26.102075576782227, "global_step": 559765, "epoch": 6744} {"train_loss": -26.016767501831055, "global_step": 559766, "epoch": 6744} {"train_loss": -26.0673828125, "global_step": 559767, "epoch": 6744} {"train_loss": -26.29593276977539, "global_step": 559768, "epoch": 6744} {"train_loss": -26.136474609375, "global_step": 559769, "epoch": 6744} {"train_loss": -26.707813262939453, "global_step": 559770, "epoch": 6744} {"train_loss": -26.534284591674805, "global_step": 559771, "epoch": 6744} {"train_loss": -26.255475997924805, "global_step": 559772, "epoch": 6744} {"train_loss": -26.0954647064209, "global_step": 559773, "epoch": 6744} {"train_loss": -26.436969757080078, "global_step": 559774, "epoch": 6744} {"train_loss": -26.415246963500977, "global_step": 559775, "epoch": 6744} {"train_loss": -26.323434829711914, "global_step": 559776, "epoch": 6744} {"train_loss": -26.26631736755371, "global_step": 559777, "epoch": 6744} {"train_loss": -26.6263484954834, "global_step": 559778, "epoch": 6744} {"train_loss": -26.775501251220703, "global_step": 559779, "epoch": 6744} {"train_loss": -26.96229362487793, "global_step": 559780, "epoch": 6744} {"train_loss": -26.904190063476562, "global_step": 559781, "epoch": 6744} {"train_loss": -26.73095703125, "global_step": 559782, "epoch": 6744} {"train_loss": -26.93733024597168, "global_step": 559783, "epoch": 6744} {"train_loss": -27.01173210144043, "global_step": 559784, "epoch": 6744} {"train_loss": -26.846166610717773, "global_step": 559785, "epoch": 6744} {"train_loss": -26.798276901245117, "global_step": 559786, "epoch": 6744} {"train_loss": -26.53961181640625, "global_step": 559787, "epoch": 6744} {"train_loss": -27.277908325195312, "global_step": 559788, "epoch": 6744} {"train_loss": -27.0216064453125, "global_step": 559789, "epoch": 6744} {"train_loss": -27.076404571533203, "global_step": 559790, "epoch": 6744} {"train_loss": -26.970935821533203, "global_step": 559791, "epoch": 6744} {"train_loss": -26.612600326538086, "global_step": 559792, "epoch": 6744} {"train_loss": -26.862695693969727, "global_step": 559793, "epoch": 6744} {"train_loss": -27.093366622924805, "global_step": 559794, "epoch": 6744} {"train_loss": -27.184772491455078, "global_step": 559795, "epoch": 6744} {"train_loss": -27.06580924987793, "global_step": 559796, "epoch": 6744} {"train_loss": -27.199787139892578, "global_step": 559797, "epoch": 6744} {"train_loss": -26.909276962280273, "global_step": 559798, "epoch": 6744} {"train_loss": -27.326080322265625, "global_step": 559799, "epoch": 6744} {"train_loss": -27.48504638671875, "global_step": 559800, "epoch": 6744} {"train_loss": -27.406904220581055, "global_step": 559801, "epoch": 6744} {"train_loss": -27.655160903930664, "global_step": 559802, "epoch": 6744} {"train_loss": -27.645837783813477, "global_step": 559803, "epoch": 6744} {"train_loss": -27.75425148010254, "global_step": 559804, "epoch": 6744} {"train_loss": -27.885156631469727, "global_step": 559805, "epoch": 6744} {"train_loss": -27.221878051757812, "global_step": 559806, "epoch": 6744} {"train_loss": -27.733722686767578, "global_step": 559807, "epoch": 6744} {"train_loss": -27.52534294128418, "global_step": 559808, "epoch": 6744} {"train_loss": -27.59454917907715, "global_step": 559809, "epoch": 6744} {"train_loss": -27.75189781188965, "global_step": 559810, "epoch": 6744} {"train_loss": -27.4239501953125, "global_step": 559811, "epoch": 6744} {"train_loss": -27.564722061157227, "global_step": 559812, "epoch": 6744} {"train_loss": -27.591999053955078, "global_step": 559813, "epoch": 6744} {"train_loss": -27.507568359375, "global_step": 559814, "epoch": 6744} {"train_loss": -27.199085235595703, "global_step": 559815, "epoch": 6744} {"train_loss": -27.796960830688477, "global_step": 559816, "epoch": 6744} {"train_loss": -27.372039794921875, "global_step": 559817, "epoch": 6744} {"train_loss": -27.86200523376465, "global_step": 559818, "epoch": 6744} {"train_loss": -28.036428451538086, "global_step": 559819, "epoch": 6744} {"train_loss": -27.94733238220215, "global_step": 559820, "epoch": 6744} {"train_loss": -28.028289794921875, "global_step": 559821, "epoch": 6744} {"train_loss": -27.918292999267578, "global_step": 559822, "epoch": 6744} {"train_loss": -27.56451416015625, "global_step": 559823, "epoch": 6744} {"train_loss": -27.598539352416992, "global_step": 559824, "epoch": 6744} {"train_loss": -27.867528915405273, "global_step": 559825, "epoch": 6744} {"train_loss": -27.750625610351562, "global_step": 559826, "epoch": 6744} {"train_loss": -27.55289077758789, "global_step": 559827, "epoch": 6744} {"train_loss": -27.775060653686523, "global_step": 559828, "epoch": 6744} {"train_loss": -27.90756607055664, "global_step": 559829, "epoch": 6744} {"train_loss": -27.87251091003418, "global_step": 559830, "epoch": 6744} {"train_loss": -27.743682861328125, "global_step": 559831, "epoch": 6744} {"train_loss": -27.916580200195312, "global_step": 559832, "epoch": 6744} {"train_loss": -28.253183364868164, "global_step": 559833, "epoch": 6744} {"train_loss": -26.821849822998047, "global_step": 559834, "epoch": 6744, "val_loss": 6365771.5} {"train_loss": -27.095556259155273, "global_step": 559835, "epoch": 6745} {"train_loss": -27.405115127563477, "global_step": 559836, "epoch": 6745} {"train_loss": -27.47242546081543, "global_step": 559837, "epoch": 6745} {"train_loss": -27.388797760009766, "global_step": 559838, "epoch": 6745} {"train_loss": -27.285770416259766, "global_step": 559839, "epoch": 6745} {"train_loss": -27.092741012573242, "global_step": 559840, "epoch": 6745} {"train_loss": -27.817493438720703, "global_step": 559841, "epoch": 6745} {"train_loss": -27.096027374267578, "global_step": 559842, "epoch": 6745} {"train_loss": -27.188459396362305, "global_step": 559843, "epoch": 6745} {"train_loss": -27.733428955078125, "global_step": 559844, "epoch": 6745} {"train_loss": -27.6241397857666, "global_step": 559845, "epoch": 6745} {"train_loss": -27.4403076171875, "global_step": 559846, "epoch": 6745} {"train_loss": -27.478891372680664, "global_step": 559847, "epoch": 6745} {"train_loss": -27.540380477905273, "global_step": 559848, "epoch": 6745} {"train_loss": -27.904541015625, "global_step": 559849, "epoch": 6745} {"train_loss": -27.34284782409668, "global_step": 559850, "epoch": 6745} {"train_loss": -27.411264419555664, "global_step": 559851, "epoch": 6745} {"train_loss": -27.878692626953125, "global_step": 559852, "epoch": 6745} {"train_loss": -27.62066650390625, "global_step": 559853, "epoch": 6745} {"train_loss": -27.738967895507812, "global_step": 559854, "epoch": 6745} {"train_loss": -27.545654296875, "global_step": 559855, "epoch": 6745} {"train_loss": -27.377058029174805, "global_step": 559856, "epoch": 6745} {"train_loss": -27.59917640686035, "global_step": 559857, "epoch": 6745} {"train_loss": -27.507160186767578, "global_step": 559858, "epoch": 6745} {"train_loss": -27.838565826416016, "global_step": 559859, "epoch": 6745} {"train_loss": -27.894453048706055, "global_step": 559860, "epoch": 6745} {"train_loss": -27.83392333984375, "global_step": 559861, "epoch": 6745} {"train_loss": -27.916147232055664, "global_step": 559862, "epoch": 6745} {"train_loss": -27.997861862182617, "global_step": 559863, "epoch": 6745} {"train_loss": -28.107776641845703, "global_step": 559864, "epoch": 6745} {"train_loss": -28.00144386291504, "global_step": 559865, "epoch": 6745} {"train_loss": -27.967493057250977, "global_step": 559866, "epoch": 6745} {"train_loss": -28.10938835144043, "global_step": 559867, "epoch": 6745} {"train_loss": -28.250019073486328, "global_step": 559868, "epoch": 6745} {"train_loss": -27.71298599243164, "global_step": 559869, "epoch": 6745} {"train_loss": -27.86703872680664, "global_step": 559870, "epoch": 6745} {"train_loss": -27.96504783630371, "global_step": 559871, "epoch": 6745} {"train_loss": -27.916833877563477, "global_step": 559872, "epoch": 6745} {"train_loss": -27.732105255126953, "global_step": 559873, "epoch": 6745} {"train_loss": -28.22908592224121, "global_step": 559874, "epoch": 6745} {"train_loss": -27.9415340423584, "global_step": 559875, "epoch": 6745} {"train_loss": -28.223159790039062, "global_step": 559876, "epoch": 6745} {"train_loss": -28.4062442779541, "global_step": 559877, "epoch": 6745} {"train_loss": -28.04231834411621, "global_step": 559878, "epoch": 6745} {"train_loss": -28.270278930664062, "global_step": 559879, "epoch": 6745} {"train_loss": -28.34404945373535, "global_step": 559880, "epoch": 6745} {"train_loss": -28.249835968017578, "global_step": 559881, "epoch": 6745} {"train_loss": -28.029830932617188, "global_step": 559882, "epoch": 6745} {"train_loss": -28.001169204711914, "global_step": 559883, "epoch": 6745} {"train_loss": -28.081607818603516, "global_step": 559884, "epoch": 6745} {"train_loss": -27.685699462890625, "global_step": 559885, "epoch": 6745} {"train_loss": -27.95806884765625, "global_step": 559886, "epoch": 6745} {"train_loss": -28.1916561126709, "global_step": 559887, "epoch": 6745} {"train_loss": -28.157882690429688, "global_step": 559888, "epoch": 6745} {"train_loss": -27.8295841217041, "global_step": 559889, "epoch": 6745} {"train_loss": -27.749631881713867, "global_step": 559890, "epoch": 6745} {"train_loss": -28.049915313720703, "global_step": 559891, "epoch": 6745} {"train_loss": -27.979873657226562, "global_step": 559892, "epoch": 6745} {"train_loss": -27.849973678588867, "global_step": 559893, "epoch": 6745} {"train_loss": -27.847137451171875, "global_step": 559894, "epoch": 6745} {"train_loss": -27.647708892822266, "global_step": 559895, "epoch": 6745} {"train_loss": -27.58820915222168, "global_step": 559896, "epoch": 6745} {"train_loss": -27.66431999206543, "global_step": 559897, "epoch": 6745} {"train_loss": -27.0408878326416, "global_step": 559898, "epoch": 6745} {"train_loss": -27.077783584594727, "global_step": 559899, "epoch": 6745} {"train_loss": -26.712310791015625, "global_step": 559900, "epoch": 6745} {"train_loss": -27.050968170166016, "global_step": 559901, "epoch": 6745} {"train_loss": -27.85225486755371, "global_step": 559902, "epoch": 6745} {"train_loss": -27.152673721313477, "global_step": 559903, "epoch": 6745} {"train_loss": -27.393712997436523, "global_step": 559904, "epoch": 6745} {"train_loss": -27.05694580078125, "global_step": 559905, "epoch": 6745} {"train_loss": -27.195926666259766, "global_step": 559906, "epoch": 6745} {"train_loss": -27.755346298217773, "global_step": 559907, "epoch": 6745} {"train_loss": -27.241941452026367, "global_step": 559908, "epoch": 6745} {"train_loss": -27.711353302001953, "global_step": 559909, "epoch": 6745} {"train_loss": -27.386938095092773, "global_step": 559910, "epoch": 6745} {"train_loss": -27.578588485717773, "global_step": 559911, "epoch": 6745} {"train_loss": -27.515268325805664, "global_step": 559912, "epoch": 6745} {"train_loss": -27.589813232421875, "global_step": 559913, "epoch": 6745} {"train_loss": -27.293975830078125, "global_step": 559914, "epoch": 6745} {"train_loss": -27.443517684936523, "global_step": 559915, "epoch": 6745} {"train_loss": -27.511859893798828, "global_step": 559916, "epoch": 6745} {"train_loss": -27.682107098131294, "global_step": 559917, "epoch": 6745, "val_loss": 6361919.5} {"train_loss": -27.50615882873535, "global_step": 559918, "epoch": 6746} {"train_loss": -27.475446701049805, "global_step": 559919, "epoch": 6746} {"train_loss": -26.889062881469727, "global_step": 559920, "epoch": 6746} {"train_loss": -27.684057235717773, "global_step": 559921, "epoch": 6746} {"train_loss": -27.421911239624023, "global_step": 559922, "epoch": 6746} {"train_loss": -27.129430770874023, "global_step": 559923, "epoch": 6746} {"train_loss": -27.32734489440918, "global_step": 559924, "epoch": 6746} {"train_loss": -27.591327667236328, "global_step": 559925, "epoch": 6746} {"train_loss": -27.292957305908203, "global_step": 559926, "epoch": 6746} {"train_loss": -27.46259880065918, "global_step": 559927, "epoch": 6746} {"train_loss": -27.451940536499023, "global_step": 559928, "epoch": 6746} {"train_loss": -27.587371826171875, "global_step": 559929, "epoch": 6746} {"train_loss": -27.560718536376953, "global_step": 559930, "epoch": 6746} {"train_loss": -27.501026153564453, "global_step": 559931, "epoch": 6746} {"train_loss": -27.40138053894043, "global_step": 559932, "epoch": 6746} {"train_loss": -27.297916412353516, "global_step": 559933, "epoch": 6746} {"train_loss": -27.715499877929688, "global_step": 559934, "epoch": 6746} {"train_loss": -27.86451530456543, "global_step": 559935, "epoch": 6746} {"train_loss": -27.659088134765625, "global_step": 559936, "epoch": 6746} {"train_loss": -27.691736221313477, "global_step": 559937, "epoch": 6746} {"train_loss": -27.8673152923584, "global_step": 559938, "epoch": 6746} {"train_loss": -28.030994415283203, "global_step": 559939, "epoch": 6746} {"train_loss": -27.6525936126709, "global_step": 559940, "epoch": 6746} {"train_loss": -27.329931259155273, "global_step": 559941, "epoch": 6746} {"train_loss": -27.94846534729004, "global_step": 559942, "epoch": 6746} {"train_loss": -27.96943473815918, "global_step": 559943, "epoch": 6746} {"train_loss": -27.84979820251465, "global_step": 559944, "epoch": 6746} {"train_loss": -27.51578712463379, "global_step": 559945, "epoch": 6746} {"train_loss": -27.918720245361328, "global_step": 559946, "epoch": 6746} {"train_loss": -27.531946182250977, "global_step": 559947, "epoch": 6746} {"train_loss": -27.961034774780273, "global_step": 559948, "epoch": 6746} {"train_loss": -27.76653480529785, "global_step": 559949, "epoch": 6746} {"train_loss": -28.212385177612305, "global_step": 559950, "epoch": 6746} {"train_loss": -27.62605094909668, "global_step": 559951, "epoch": 6746} {"train_loss": -28.098800659179688, "global_step": 559952, "epoch": 6746} {"train_loss": -27.725183486938477, "global_step": 559953, "epoch": 6746} {"train_loss": -28.00823402404785, "global_step": 559954, "epoch": 6746} {"train_loss": -27.800552368164062, "global_step": 559955, "epoch": 6746} {"train_loss": -28.036151885986328, "global_step": 559956, "epoch": 6746} {"train_loss": -28.003101348876953, "global_step": 559957, "epoch": 6746} {"train_loss": -27.989896774291992, "global_step": 559958, "epoch": 6746} {"train_loss": -27.5022029876709, "global_step": 559959, "epoch": 6746} {"train_loss": -27.957706451416016, "global_step": 559960, "epoch": 6746} {"train_loss": -28.04383659362793, "global_step": 559961, "epoch": 6746} {"train_loss": -28.243000030517578, "global_step": 559962, "epoch": 6746} {"train_loss": -27.880680084228516, "global_step": 559963, "epoch": 6746} {"train_loss": -27.613327026367188, "global_step": 559964, "epoch": 6746} {"train_loss": -27.611677169799805, "global_step": 559965, "epoch": 6746} {"train_loss": -27.50174903869629, "global_step": 559966, "epoch": 6746} {"train_loss": -27.641321182250977, "global_step": 559967, "epoch": 6746} {"train_loss": -27.852685928344727, "global_step": 559968, "epoch": 6746} {"train_loss": -27.601322174072266, "global_step": 559969, "epoch": 6746} {"train_loss": -28.180007934570312, "global_step": 559970, "epoch": 6746} {"train_loss": -27.990345001220703, "global_step": 559971, "epoch": 6746} {"train_loss": -27.52237892150879, "global_step": 559972, "epoch": 6746} {"train_loss": -27.525405883789062, "global_step": 559973, "epoch": 6746} {"train_loss": -27.388843536376953, "global_step": 559974, "epoch": 6746} {"train_loss": -27.653213500976562, "global_step": 559975, "epoch": 6746} {"train_loss": -28.053298950195312, "global_step": 559976, "epoch": 6746} {"train_loss": -27.603515625, "global_step": 559977, "epoch": 6746} {"train_loss": -27.952722549438477, "global_step": 559978, "epoch": 6746} {"train_loss": -27.571380615234375, "global_step": 559979, "epoch": 6746} {"train_loss": -28.093420028686523, "global_step": 559980, "epoch": 6746} {"train_loss": -27.843122482299805, "global_step": 559981, "epoch": 6746} {"train_loss": -27.980737686157227, "global_step": 559982, "epoch": 6746} {"train_loss": -27.68191909790039, "global_step": 559983, "epoch": 6746} {"train_loss": -27.72882080078125, "global_step": 559984, "epoch": 6746} {"train_loss": -27.87322998046875, "global_step": 559985, "epoch": 6746} {"train_loss": -27.743940353393555, "global_step": 559986, "epoch": 6746} {"train_loss": -27.9613094329834, "global_step": 559987, "epoch": 6746} {"train_loss": -28.04314613342285, "global_step": 559988, "epoch": 6746} {"train_loss": -27.623022079467773, "global_step": 559989, "epoch": 6746} {"train_loss": -28.0687313079834, "global_step": 559990, "epoch": 6746} {"train_loss": -28.237653732299805, "global_step": 559991, "epoch": 6746} {"train_loss": -27.825037002563477, "global_step": 559992, "epoch": 6746} {"train_loss": -28.067785263061523, "global_step": 559993, "epoch": 6746} {"train_loss": -27.885608673095703, "global_step": 559994, "epoch": 6746} {"train_loss": -27.783721923828125, "global_step": 559995, "epoch": 6746} {"train_loss": -27.89347267150879, "global_step": 559996, "epoch": 6746} {"train_loss": -27.717975616455078, "global_step": 559997, "epoch": 6746} {"train_loss": -27.692651748657227, "global_step": 559998, "epoch": 6746} {"train_loss": -28.290517807006836, "global_step": 559999, "epoch": 6746} {"train_loss": -27.756503783076642, "global_step": 560000, "epoch": 6746, "val_loss": 6411775.0} {"train_loss": -25.6915283203125, "global_step": 560001, "epoch": 6747} {"train_loss": -24.548648834228516, "global_step": 560002, "epoch": 6747} {"train_loss": -23.24129295349121, "global_step": 560003, "epoch": 6747} {"train_loss": -26.259443283081055, "global_step": 560004, "epoch": 6747} {"train_loss": -26.314289093017578, "global_step": 560005, "epoch": 6747} {"train_loss": -25.912817001342773, "global_step": 560006, "epoch": 6747} {"train_loss": -26.34282875061035, "global_step": 560007, "epoch": 6747} {"train_loss": -26.1423282623291, "global_step": 560008, "epoch": 6747} {"train_loss": -26.22511100769043, "global_step": 560009, "epoch": 6747} {"train_loss": -27.004728317260742, "global_step": 560010, "epoch": 6747} {"train_loss": -26.798425674438477, "global_step": 560011, "epoch": 6747} {"train_loss": -26.527692794799805, "global_step": 560012, "epoch": 6747} {"train_loss": -27.247648239135742, "global_step": 560013, "epoch": 6747} {"train_loss": -26.7310791015625, "global_step": 560014, "epoch": 6747} {"train_loss": -26.587194442749023, "global_step": 560015, "epoch": 6747} {"train_loss": -27.181365966796875, "global_step": 560016, "epoch": 6747} {"train_loss": -26.6024169921875, "global_step": 560017, "epoch": 6747} {"train_loss": -26.89797019958496, "global_step": 560018, "epoch": 6747} {"train_loss": -27.194625854492188, "global_step": 560019, "epoch": 6747} {"train_loss": -27.294376373291016, "global_step": 560020, "epoch": 6747} {"train_loss": -26.575042724609375, "global_step": 560021, "epoch": 6747} {"train_loss": -27.13543128967285, "global_step": 560022, "epoch": 6747} {"train_loss": -27.208261489868164, "global_step": 560023, "epoch": 6747} {"train_loss": -27.056196212768555, "global_step": 560024, "epoch": 6747} {"train_loss": -27.06020164489746, "global_step": 560025, "epoch": 6747} {"train_loss": -27.451465606689453, "global_step": 560026, "epoch": 6747} {"train_loss": -27.126195907592773, "global_step": 560027, "epoch": 6747} {"train_loss": -27.48455238342285, "global_step": 560028, "epoch": 6747} {"train_loss": -27.096845626831055, "global_step": 560029, "epoch": 6747} {"train_loss": -27.00601577758789, "global_step": 560030, "epoch": 6747} {"train_loss": -27.59702491760254, "global_step": 560031, "epoch": 6747} {"train_loss": -27.760517120361328, "global_step": 560032, "epoch": 6747} {"train_loss": -27.635725021362305, "global_step": 560033, "epoch": 6747} {"train_loss": -27.4254207611084, "global_step": 560034, "epoch": 6747} {"train_loss": -27.54530143737793, "global_step": 560035, "epoch": 6747} {"train_loss": -27.772937774658203, "global_step": 560036, "epoch": 6747} {"train_loss": -27.304285049438477, "global_step": 560037, "epoch": 6747} {"train_loss": -27.362030029296875, "global_step": 560038, "epoch": 6747} {"train_loss": -27.736236572265625, "global_step": 560039, "epoch": 6747} {"train_loss": -28.1156063079834, "global_step": 560040, "epoch": 6747} {"train_loss": -27.933835983276367, "global_step": 560041, "epoch": 6747} {"train_loss": -27.588550567626953, "global_step": 560042, "epoch": 6747} {"train_loss": -27.427845001220703, "global_step": 560043, "epoch": 6747} {"train_loss": -27.768964767456055, "global_step": 560044, "epoch": 6747} {"train_loss": -27.712604522705078, "global_step": 560045, "epoch": 6747} {"train_loss": -27.457143783569336, "global_step": 560046, "epoch": 6747} {"train_loss": -27.459186553955078, "global_step": 560047, "epoch": 6747} {"train_loss": -27.29123306274414, "global_step": 560048, "epoch": 6747} {"train_loss": -27.669157028198242, "global_step": 560049, "epoch": 6747} {"train_loss": -28.28645133972168, "global_step": 560050, "epoch": 6747} {"train_loss": -27.840330123901367, "global_step": 560051, "epoch": 6747} {"train_loss": -27.714826583862305, "global_step": 560052, "epoch": 6747} {"train_loss": -27.1312313079834, "global_step": 560053, "epoch": 6747} {"train_loss": -26.766515731811523, "global_step": 560054, "epoch": 6747} {"train_loss": -27.089008331298828, "global_step": 560055, "epoch": 6747} {"train_loss": -27.586002349853516, "global_step": 560056, "epoch": 6747} {"train_loss": -27.726654052734375, "global_step": 560057, "epoch": 6747} {"train_loss": -27.044233322143555, "global_step": 560058, "epoch": 6747} {"train_loss": -27.64078712463379, "global_step": 560059, "epoch": 6747} {"train_loss": -27.570322036743164, "global_step": 560060, "epoch": 6747} {"train_loss": -27.601551055908203, "global_step": 560061, "epoch": 6747} {"train_loss": -27.79535484313965, "global_step": 560062, "epoch": 6747} {"train_loss": -27.999414443969727, "global_step": 560063, "epoch": 6747} {"train_loss": -27.76833152770996, "global_step": 560064, "epoch": 6747} {"train_loss": -27.622406005859375, "global_step": 560065, "epoch": 6747} {"train_loss": -27.641000747680664, "global_step": 560066, "epoch": 6747} {"train_loss": -28.031461715698242, "global_step": 560067, "epoch": 6747} {"train_loss": -27.84638786315918, "global_step": 560068, "epoch": 6747} {"train_loss": -27.92591667175293, "global_step": 560069, "epoch": 6747} {"train_loss": -27.6031436920166, "global_step": 560070, "epoch": 6747} {"train_loss": -28.11798667907715, "global_step": 560071, "epoch": 6747} {"train_loss": -27.8160400390625, "global_step": 560072, "epoch": 6747} {"train_loss": -27.50055503845215, "global_step": 560073, "epoch": 6747} {"train_loss": -27.79192543029785, "global_step": 560074, "epoch": 6747} {"train_loss": -28.05562400817871, "global_step": 560075, "epoch": 6747} {"train_loss": -27.859601974487305, "global_step": 560076, "epoch": 6747} {"train_loss": -27.94899559020996, "global_step": 560077, "epoch": 6747} {"train_loss": -27.810972213745117, "global_step": 560078, "epoch": 6747} {"train_loss": -27.816137313842773, "global_step": 560079, "epoch": 6747} {"train_loss": -27.736743927001953, "global_step": 560080, "epoch": 6747} {"train_loss": -27.774580001831055, "global_step": 560081, "epoch": 6747} {"train_loss": -27.655378341674805, "global_step": 560082, "epoch": 6747} {"train_loss": -27.263692947755377, "global_step": 560083, "epoch": 6747, "val_loss": 6366439.0} {"train_loss": -27.488061904907227, "global_step": 560084, "epoch": 6748} {"train_loss": -27.289997100830078, "global_step": 560085, "epoch": 6748} {"train_loss": -27.13126564025879, "global_step": 560086, "epoch": 6748} {"train_loss": -28.009931564331055, "global_step": 560087, "epoch": 6748} {"train_loss": -27.7225341796875, "global_step": 560088, "epoch": 6748} {"train_loss": -27.274658203125, "global_step": 560089, "epoch": 6748} {"train_loss": -27.533802032470703, "global_step": 560090, "epoch": 6748} {"train_loss": -27.882572174072266, "global_step": 560091, "epoch": 6748} {"train_loss": -27.67682456970215, "global_step": 560092, "epoch": 6748} {"train_loss": -27.302892684936523, "global_step": 560093, "epoch": 6748} {"train_loss": -27.1501407623291, "global_step": 560094, "epoch": 6748} {"train_loss": -27.8818359375, "global_step": 560095, "epoch": 6748} {"train_loss": -27.5172119140625, "global_step": 560096, "epoch": 6748} {"train_loss": -27.141510009765625, "global_step": 560097, "epoch": 6748} {"train_loss": -27.941564559936523, "global_step": 560098, "epoch": 6748} {"train_loss": -27.856847763061523, "global_step": 560099, "epoch": 6748} {"train_loss": -27.748762130737305, "global_step": 560100, "epoch": 6748} {"train_loss": -27.79884147644043, "global_step": 560101, "epoch": 6748} {"train_loss": -27.910009384155273, "global_step": 560102, "epoch": 6748} {"train_loss": -27.62830924987793, "global_step": 560103, "epoch": 6748} {"train_loss": -27.803207397460938, "global_step": 560104, "epoch": 6748} {"train_loss": -27.79598045349121, "global_step": 560105, "epoch": 6748} {"train_loss": -27.206384658813477, "global_step": 560106, "epoch": 6748} {"train_loss": -27.9311466217041, "global_step": 560107, "epoch": 6748} {"train_loss": -27.897287368774414, "global_step": 560108, "epoch": 6748} {"train_loss": -28.057758331298828, "global_step": 560109, "epoch": 6748} {"train_loss": -27.728469848632812, "global_step": 560110, "epoch": 6748} {"train_loss": -27.69795036315918, "global_step": 560111, "epoch": 6748} {"train_loss": -28.106082916259766, "global_step": 560112, "epoch": 6748} {"train_loss": -28.021398544311523, "global_step": 560113, "epoch": 6748} {"train_loss": -28.118560791015625, "global_step": 560114, "epoch": 6748} {"train_loss": -27.929828643798828, "global_step": 560115, "epoch": 6748} {"train_loss": -28.059680938720703, "global_step": 560116, "epoch": 6748} {"train_loss": -28.170068740844727, "global_step": 560117, "epoch": 6748} {"train_loss": -27.93623161315918, "global_step": 560118, "epoch": 6748} {"train_loss": -27.360733032226562, "global_step": 560119, "epoch": 6748} {"train_loss": -27.360143661499023, "global_step": 560120, "epoch": 6748} {"train_loss": -27.913557052612305, "global_step": 560121, "epoch": 6748} {"train_loss": -28.023168563842773, "global_step": 560122, "epoch": 6748} {"train_loss": -27.432117462158203, "global_step": 560123, "epoch": 6748} {"train_loss": -27.121267318725586, "global_step": 560124, "epoch": 6748} {"train_loss": -26.85495376586914, "global_step": 560125, "epoch": 6748} {"train_loss": -27.406681060791016, "global_step": 560126, "epoch": 6748} {"train_loss": -27.789011001586914, "global_step": 560127, "epoch": 6748} {"train_loss": -27.559406280517578, "global_step": 560128, "epoch": 6748} {"train_loss": -27.333852767944336, "global_step": 560129, "epoch": 6748} {"train_loss": -27.731077194213867, "global_step": 560130, "epoch": 6748} {"train_loss": -27.7337646484375, "global_step": 560131, "epoch": 6748} {"train_loss": -27.582544326782227, "global_step": 560132, "epoch": 6748} {"train_loss": -27.602127075195312, "global_step": 560133, "epoch": 6748} {"train_loss": -27.689367294311523, "global_step": 560134, "epoch": 6748} {"train_loss": -27.60702896118164, "global_step": 560135, "epoch": 6748} {"train_loss": -27.6665096282959, "global_step": 560136, "epoch": 6748} {"train_loss": -27.430078506469727, "global_step": 560137, "epoch": 6748} {"train_loss": -27.435789108276367, "global_step": 560138, "epoch": 6748} {"train_loss": -27.111358642578125, "global_step": 560139, "epoch": 6748} {"train_loss": -27.568302154541016, "global_step": 560140, "epoch": 6748} {"train_loss": -27.216840744018555, "global_step": 560141, "epoch": 6748} {"train_loss": -27.288801193237305, "global_step": 560142, "epoch": 6748} {"train_loss": -27.637451171875, "global_step": 560143, "epoch": 6748} {"train_loss": -27.642688751220703, "global_step": 560144, "epoch": 6748} {"train_loss": -28.084360122680664, "global_step": 560145, "epoch": 6748} {"train_loss": -27.659713745117188, "global_step": 560146, "epoch": 6748} {"train_loss": -27.684906005859375, "global_step": 560147, "epoch": 6748} {"train_loss": -27.616378784179688, "global_step": 560148, "epoch": 6748} {"train_loss": -27.568933486938477, "global_step": 560149, "epoch": 6748} {"train_loss": -27.705307006835938, "global_step": 560150, "epoch": 6748} {"train_loss": -27.61738395690918, "global_step": 560151, "epoch": 6748} {"train_loss": -27.63101577758789, "global_step": 560152, "epoch": 6748} {"train_loss": -27.908185958862305, "global_step": 560153, "epoch": 6748} {"train_loss": -28.021026611328125, "global_step": 560154, "epoch": 6748} {"train_loss": -28.012964248657227, "global_step": 560155, "epoch": 6748} {"train_loss": -27.819385528564453, "global_step": 560156, "epoch": 6748} {"train_loss": -27.805713653564453, "global_step": 560157, "epoch": 6748} {"train_loss": -28.254364013671875, "global_step": 560158, "epoch": 6748} {"train_loss": -28.030792236328125, "global_step": 560159, "epoch": 6748} {"train_loss": -28.020612716674805, "global_step": 560160, "epoch": 6748} {"train_loss": -28.34512710571289, "global_step": 560161, "epoch": 6748} {"train_loss": -28.04859733581543, "global_step": 560162, "epoch": 6748} {"train_loss": -27.864276885986328, "global_step": 560163, "epoch": 6748} {"train_loss": -27.82733726501465, "global_step": 560164, "epoch": 6748} {"train_loss": -28.02313232421875, "global_step": 560165, "epoch": 6748} {"train_loss": -27.688183910875434, "global_step": 560166, "epoch": 6748, "val_loss": 6315518.0} {"train_loss": -25.795560836791992, "global_step": 560167, "epoch": 6749} {"train_loss": -25.813751220703125, "global_step": 560168, "epoch": 6749} {"train_loss": -27.18636131286621, "global_step": 560169, "epoch": 6749} {"train_loss": -26.522123336791992, "global_step": 560170, "epoch": 6749} {"train_loss": -26.44144630432129, "global_step": 560171, "epoch": 6749} {"train_loss": -26.93976402282715, "global_step": 560172, "epoch": 6749} {"train_loss": -27.135961532592773, "global_step": 560173, "epoch": 6749} {"train_loss": -26.947492599487305, "global_step": 560174, "epoch": 6749} {"train_loss": -27.038801193237305, "global_step": 560175, "epoch": 6749} {"train_loss": -27.00014305114746, "global_step": 560176, "epoch": 6749} {"train_loss": -27.352548599243164, "global_step": 560177, "epoch": 6749} {"train_loss": -26.919937133789062, "global_step": 560178, "epoch": 6749} {"train_loss": -27.362689971923828, "global_step": 560179, "epoch": 6749} {"train_loss": -27.53110694885254, "global_step": 560180, "epoch": 6749} {"train_loss": -27.71687126159668, "global_step": 560181, "epoch": 6749} {"train_loss": -27.404279708862305, "global_step": 560182, "epoch": 6749} {"train_loss": -27.355731964111328, "global_step": 560183, "epoch": 6749} {"train_loss": -27.688446044921875, "global_step": 560184, "epoch": 6749} {"train_loss": -27.731510162353516, "global_step": 560185, "epoch": 6749} {"train_loss": -27.402359008789062, "global_step": 560186, "epoch": 6749} {"train_loss": -27.518115997314453, "global_step": 560187, "epoch": 6749} {"train_loss": -27.519689559936523, "global_step": 560188, "epoch": 6749} {"train_loss": -27.40484619140625, "global_step": 560189, "epoch": 6749} {"train_loss": -27.869897842407227, "global_step": 560190, "epoch": 6749} {"train_loss": -27.694995880126953, "global_step": 560191, "epoch": 6749} {"train_loss": -28.103713989257812, "global_step": 560192, "epoch": 6749} {"train_loss": -27.440420150756836, "global_step": 560193, "epoch": 6749} {"train_loss": -27.54514503479004, "global_step": 560194, "epoch": 6749} {"train_loss": -28.031391143798828, "global_step": 560195, "epoch": 6749} {"train_loss": -27.649688720703125, "global_step": 560196, "epoch": 6749} {"train_loss": -27.835041046142578, "global_step": 560197, "epoch": 6749} {"train_loss": -27.707935333251953, "global_step": 560198, "epoch": 6749} {"train_loss": -27.684955596923828, "global_step": 560199, "epoch": 6749} {"train_loss": -27.719146728515625, "global_step": 560200, "epoch": 6749} {"train_loss": -27.7874755859375, "global_step": 560201, "epoch": 6749} {"train_loss": -27.966033935546875, "global_step": 560202, "epoch": 6749} {"train_loss": -28.045948028564453, "global_step": 560203, "epoch": 6749} {"train_loss": -27.7320499420166, "global_step": 560204, "epoch": 6749} {"train_loss": -27.861576080322266, "global_step": 560205, "epoch": 6749} {"train_loss": -27.782201766967773, "global_step": 560206, "epoch": 6749} {"train_loss": -28.088714599609375, "global_step": 560207, "epoch": 6749} {"train_loss": -28.0578556060791, "global_step": 560208, "epoch": 6749} {"train_loss": -27.970449447631836, "global_step": 560209, "epoch": 6749} {"train_loss": -27.706409454345703, "global_step": 560210, "epoch": 6749} {"train_loss": -27.792011260986328, "global_step": 560211, "epoch": 6749} {"train_loss": -28.071081161499023, "global_step": 560212, "epoch": 6749} {"train_loss": -28.39006996154785, "global_step": 560213, "epoch": 6749} {"train_loss": -27.9515380859375, "global_step": 560214, "epoch": 6749} {"train_loss": -27.896484375, "global_step": 560215, "epoch": 6749} {"train_loss": -27.8529109954834, "global_step": 560216, "epoch": 6749} {"train_loss": -28.32390785217285, "global_step": 560217, "epoch": 6749} {"train_loss": -27.83146095275879, "global_step": 560218, "epoch": 6749} {"train_loss": -28.202808380126953, "global_step": 560219, "epoch": 6749} {"train_loss": -27.91244888305664, "global_step": 560220, "epoch": 6749} {"train_loss": -27.96906089782715, "global_step": 560221, "epoch": 6749} {"train_loss": -27.769744873046875, "global_step": 560222, "epoch": 6749} {"train_loss": -27.54638671875, "global_step": 560223, "epoch": 6749} {"train_loss": -27.7327938079834, "global_step": 560224, "epoch": 6749} {"train_loss": -27.59052085876465, "global_step": 560225, "epoch": 6749} {"train_loss": -26.81440544128418, "global_step": 560226, "epoch": 6749} {"train_loss": -26.2117977142334, "global_step": 560227, "epoch": 6749} {"train_loss": -24.942808151245117, "global_step": 560228, "epoch": 6749} {"train_loss": -26.509855270385742, "global_step": 560229, "epoch": 6749} {"train_loss": -27.824512481689453, "global_step": 560230, "epoch": 6749} {"train_loss": -26.816633224487305, "global_step": 560231, "epoch": 6749} {"train_loss": -27.04665184020996, "global_step": 560232, "epoch": 6749} {"train_loss": -27.05537223815918, "global_step": 560233, "epoch": 6749} {"train_loss": -27.17917251586914, "global_step": 560234, "epoch": 6749} {"train_loss": -27.651731491088867, "global_step": 560235, "epoch": 6749} {"train_loss": -27.331335067749023, "global_step": 560236, "epoch": 6749} {"train_loss": -27.229948043823242, "global_step": 560237, "epoch": 6749} {"train_loss": -27.806257247924805, "global_step": 560238, "epoch": 6749} {"train_loss": -27.646743774414062, "global_step": 560239, "epoch": 6749} {"train_loss": -27.233022689819336, "global_step": 560240, "epoch": 6749} {"train_loss": -27.802900314331055, "global_step": 560241, "epoch": 6749} {"train_loss": -27.415082931518555, "global_step": 560242, "epoch": 6749} {"train_loss": -27.424283981323242, "global_step": 560243, "epoch": 6749} {"train_loss": -27.555124282836914, "global_step": 560244, "epoch": 6749} {"train_loss": -27.51521110534668, "global_step": 560245, "epoch": 6749} {"train_loss": -27.59209632873535, "global_step": 560246, "epoch": 6749} {"train_loss": -27.392202377319336, "global_step": 560247, "epoch": 6749} {"train_loss": -27.465173721313477, "global_step": 560248, "epoch": 6749} {"train_loss": -27.469772269926874, "global_step": 560249, "epoch": 6749, "val_loss": 6359640.0} {"train_loss": -27.188678741455078, "global_step": 560250, "epoch": 6750} {"train_loss": -27.09174156188965, "global_step": 560251, "epoch": 6750} {"train_loss": -27.261890411376953, "global_step": 560252, "epoch": 6750} {"train_loss": -27.127195358276367, "global_step": 560253, "epoch": 6750} {"train_loss": -27.38152503967285, "global_step": 560254, "epoch": 6750} {"train_loss": -27.244443893432617, "global_step": 560255, "epoch": 6750} {"train_loss": -27.77277183532715, "global_step": 560256, "epoch": 6750} {"train_loss": -27.339025497436523, "global_step": 560257, "epoch": 6750} {"train_loss": -27.491559982299805, "global_step": 560258, "epoch": 6750} {"train_loss": -27.563037872314453, "global_step": 560259, "epoch": 6750} {"train_loss": -27.62076759338379, "global_step": 560260, "epoch": 6750} {"train_loss": -27.35541343688965, "global_step": 560261, "epoch": 6750} {"train_loss": -27.22638511657715, "global_step": 560262, "epoch": 6750} {"train_loss": -27.433826446533203, "global_step": 560263, "epoch": 6750} {"train_loss": -27.654821395874023, "global_step": 560264, "epoch": 6750} {"train_loss": -27.549041748046875, "global_step": 560265, "epoch": 6750} {"train_loss": -28.12457847595215, "global_step": 560266, "epoch": 6750} {"train_loss": -27.562286376953125, "global_step": 560267, "epoch": 6750} {"train_loss": -27.82753562927246, "global_step": 560268, "epoch": 6750} {"train_loss": -27.567157745361328, "global_step": 560269, "epoch": 6750} {"train_loss": -28.066635131835938, "global_step": 560270, "epoch": 6750} {"train_loss": -27.572574615478516, "global_step": 560271, "epoch": 6750} {"train_loss": -27.56150245666504, "global_step": 560272, "epoch": 6750} {"train_loss": -27.854711532592773, "global_step": 560273, "epoch": 6750} {"train_loss": -27.9056396484375, "global_step": 560274, "epoch": 6750} {"train_loss": -27.693098068237305, "global_step": 560275, "epoch": 6750} {"train_loss": -27.923486709594727, "global_step": 560276, "epoch": 6750} {"train_loss": -27.984161376953125, "global_step": 560277, "epoch": 6750} {"train_loss": -28.02631187438965, "global_step": 560278, "epoch": 6750} {"train_loss": -27.91318130493164, "global_step": 560279, "epoch": 6750} {"train_loss": -27.815351486206055, "global_step": 560280, "epoch": 6750} {"train_loss": -27.802331924438477, "global_step": 560281, "epoch": 6750} {"train_loss": -27.812625885009766, "global_step": 560282, "epoch": 6750} {"train_loss": -27.966949462890625, "global_step": 560283, "epoch": 6750} {"train_loss": -27.773778915405273, "global_step": 560284, "epoch": 6750} {"train_loss": -27.97552490234375, "global_step": 560285, "epoch": 6750} {"train_loss": -27.82318687438965, "global_step": 560286, "epoch": 6750} {"train_loss": -27.990966796875, "global_step": 560287, "epoch": 6750} {"train_loss": -28.073556900024414, "global_step": 560288, "epoch": 6750} {"train_loss": -27.64363670349121, "global_step": 560289, "epoch": 6750} {"train_loss": -28.010046005249023, "global_step": 560290, "epoch": 6750} {"train_loss": -27.794315338134766, "global_step": 560291, "epoch": 6750} {"train_loss": -28.143482208251953, "global_step": 560292, "epoch": 6750} {"train_loss": -27.7319278717041, "global_step": 560293, "epoch": 6750} {"train_loss": -27.983829498291016, "global_step": 560294, "epoch": 6750} {"train_loss": -27.714466094970703, "global_step": 560295, "epoch": 6750} {"train_loss": -28.030969619750977, "global_step": 560296, "epoch": 6750} {"train_loss": -28.016803741455078, "global_step": 560297, "epoch": 6750} {"train_loss": -27.79646873474121, "global_step": 560298, "epoch": 6750} {"train_loss": -27.86408042907715, "global_step": 560299, "epoch": 6750} {"train_loss": -27.8067684173584, "global_step": 560300, "epoch": 6750} {"train_loss": -27.40973472595215, "global_step": 560301, "epoch": 6750} {"train_loss": -27.3139591217041, "global_step": 560302, "epoch": 6750} {"train_loss": -27.582006454467773, "global_step": 560303, "epoch": 6750} {"train_loss": -27.908761978149414, "global_step": 560304, "epoch": 6750} {"train_loss": -28.049665451049805, "global_step": 560305, "epoch": 6750} {"train_loss": -27.835376739501953, "global_step": 560306, "epoch": 6750} {"train_loss": -27.807958602905273, "global_step": 560307, "epoch": 6750} {"train_loss": -28.0771427154541, "global_step": 560308, "epoch": 6750} {"train_loss": -27.75260353088379, "global_step": 560309, "epoch": 6750} {"train_loss": -28.013456344604492, "global_step": 560310, "epoch": 6750} {"train_loss": -27.8619384765625, "global_step": 560311, "epoch": 6750} {"train_loss": -28.026620864868164, "global_step": 560312, "epoch": 6750} {"train_loss": -27.92951774597168, "global_step": 560313, "epoch": 6750} {"train_loss": -27.73235511779785, "global_step": 560314, "epoch": 6750} {"train_loss": -27.92529296875, "global_step": 560315, "epoch": 6750} {"train_loss": -28.1041316986084, "global_step": 560316, "epoch": 6750} {"train_loss": -28.065610885620117, "global_step": 560317, "epoch": 6750} {"train_loss": -28.013147354125977, "global_step": 560318, "epoch": 6750} {"train_loss": -27.789459228515625, "global_step": 560319, "epoch": 6750} {"train_loss": -27.290170669555664, "global_step": 560320, "epoch": 6750} {"train_loss": -26.025623321533203, "global_step": 560321, "epoch": 6750} {"train_loss": -25.544912338256836, "global_step": 560322, "epoch": 6750} {"train_loss": -26.33403968811035, "global_step": 560323, "epoch": 6750} {"train_loss": -27.404775619506836, "global_step": 560324, "epoch": 6750} {"train_loss": -26.61737632751465, "global_step": 560325, "epoch": 6750} {"train_loss": -26.733596801757812, "global_step": 560326, "epoch": 6750} {"train_loss": -26.6590576171875, "global_step": 560327, "epoch": 6750} {"train_loss": -27.178552627563477, "global_step": 560328, "epoch": 6750} {"train_loss": -26.398456573486328, "global_step": 560329, "epoch": 6750} {"train_loss": -26.864288330078125, "global_step": 560330, "epoch": 6750} {"train_loss": -26.799665451049805, "global_step": 560331, "epoch": 6750} {"train_loss": -27.576972226062452, "global_step": 560332, "epoch": 6750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6433992.0} {"train_loss": -24.99342918395996, "global_step": 560333, "epoch": 6751} {"train_loss": -25.542301177978516, "global_step": 560334, "epoch": 6751} {"train_loss": -26.44883155822754, "global_step": 560335, "epoch": 6751} {"train_loss": -25.54420280456543, "global_step": 560336, "epoch": 6751} {"train_loss": -25.72723388671875, "global_step": 560337, "epoch": 6751} {"train_loss": -25.917524337768555, "global_step": 560338, "epoch": 6751} {"train_loss": -26.163644790649414, "global_step": 560339, "epoch": 6751} {"train_loss": -26.00644874572754, "global_step": 560340, "epoch": 6751} {"train_loss": -26.42105484008789, "global_step": 560341, "epoch": 6751} {"train_loss": -26.681396484375, "global_step": 560342, "epoch": 6751} {"train_loss": -26.34671401977539, "global_step": 560343, "epoch": 6751} {"train_loss": -26.446821212768555, "global_step": 560344, "epoch": 6751} {"train_loss": -26.52732276916504, "global_step": 560345, "epoch": 6751} {"train_loss": -26.795557022094727, "global_step": 560346, "epoch": 6751} {"train_loss": -26.672632217407227, "global_step": 560347, "epoch": 6751} {"train_loss": -26.440038681030273, "global_step": 560348, "epoch": 6751} {"train_loss": -26.790170669555664, "global_step": 560349, "epoch": 6751} {"train_loss": -26.740015029907227, "global_step": 560350, "epoch": 6751} {"train_loss": -26.719274520874023, "global_step": 560351, "epoch": 6751} {"train_loss": -27.5275936126709, "global_step": 560352, "epoch": 6751} {"train_loss": -27.260303497314453, "global_step": 560353, "epoch": 6751} {"train_loss": -26.71392822265625, "global_step": 560354, "epoch": 6751} {"train_loss": -27.196624755859375, "global_step": 560355, "epoch": 6751} {"train_loss": -27.194446563720703, "global_step": 560356, "epoch": 6751} {"train_loss": -27.24725914001465, "global_step": 560357, "epoch": 6751} {"train_loss": -27.045618057250977, "global_step": 560358, "epoch": 6751} {"train_loss": -27.279672622680664, "global_step": 560359, "epoch": 6751} {"train_loss": -27.259967803955078, "global_step": 560360, "epoch": 6751} {"train_loss": -27.3887939453125, "global_step": 560361, "epoch": 6751} {"train_loss": -27.38099479675293, "global_step": 560362, "epoch": 6751} {"train_loss": -27.542341232299805, "global_step": 560363, "epoch": 6751} {"train_loss": -27.269866943359375, "global_step": 560364, "epoch": 6751} {"train_loss": -27.250158309936523, "global_step": 560365, "epoch": 6751} {"train_loss": -28.29823112487793, "global_step": 560366, "epoch": 6751} {"train_loss": -27.359350204467773, "global_step": 560367, "epoch": 6751} {"train_loss": -27.54876136779785, "global_step": 560368, "epoch": 6751} {"train_loss": -27.73835563659668, "global_step": 560369, "epoch": 6751} {"train_loss": -27.274322509765625, "global_step": 560370, "epoch": 6751} {"train_loss": -27.878782272338867, "global_step": 560371, "epoch": 6751} {"train_loss": -27.424560546875, "global_step": 560372, "epoch": 6751} {"train_loss": -27.608911514282227, "global_step": 560373, "epoch": 6751} {"train_loss": -27.490751266479492, "global_step": 560374, "epoch": 6751} {"train_loss": -27.921865463256836, "global_step": 560375, "epoch": 6751} {"train_loss": -27.785985946655273, "global_step": 560376, "epoch": 6751} {"train_loss": -27.840167999267578, "global_step": 560377, "epoch": 6751} {"train_loss": -27.716760635375977, "global_step": 560378, "epoch": 6751} {"train_loss": -27.886701583862305, "global_step": 560379, "epoch": 6751} {"train_loss": -27.812780380249023, "global_step": 560380, "epoch": 6751} {"train_loss": -27.550138473510742, "global_step": 560381, "epoch": 6751} {"train_loss": -27.886890411376953, "global_step": 560382, "epoch": 6751} {"train_loss": -27.74265480041504, "global_step": 560383, "epoch": 6751} {"train_loss": -28.22303581237793, "global_step": 560384, "epoch": 6751} {"train_loss": -27.66742515563965, "global_step": 560385, "epoch": 6751} {"train_loss": -27.934240341186523, "global_step": 560386, "epoch": 6751} {"train_loss": -28.05733299255371, "global_step": 560387, "epoch": 6751} {"train_loss": -27.903955459594727, "global_step": 560388, "epoch": 6751} {"train_loss": -28.416873931884766, "global_step": 560389, "epoch": 6751} {"train_loss": -28.41090202331543, "global_step": 560390, "epoch": 6751} {"train_loss": -28.180383682250977, "global_step": 560391, "epoch": 6751} {"train_loss": -28.159931182861328, "global_step": 560392, "epoch": 6751} {"train_loss": -28.0379695892334, "global_step": 560393, "epoch": 6751} {"train_loss": -27.87273597717285, "global_step": 560394, "epoch": 6751} {"train_loss": -27.8209285736084, "global_step": 560395, "epoch": 6751} {"train_loss": -28.18983268737793, "global_step": 560396, "epoch": 6751} {"train_loss": -28.478485107421875, "global_step": 560397, "epoch": 6751} {"train_loss": -27.714935302734375, "global_step": 560398, "epoch": 6751} {"train_loss": -27.86860466003418, "global_step": 560399, "epoch": 6751} {"train_loss": -27.415252685546875, "global_step": 560400, "epoch": 6751} {"train_loss": -27.72519302368164, "global_step": 560401, "epoch": 6751} {"train_loss": -27.947528839111328, "global_step": 560402, "epoch": 6751} {"train_loss": -27.848251342773438, "global_step": 560403, "epoch": 6751} {"train_loss": -27.604724884033203, "global_step": 560404, "epoch": 6751} {"train_loss": -27.527734756469727, "global_step": 560405, "epoch": 6751} {"train_loss": -27.277454376220703, "global_step": 560406, "epoch": 6751} {"train_loss": -27.415441513061523, "global_step": 560407, "epoch": 6751} {"train_loss": -27.099035263061523, "global_step": 560408, "epoch": 6751} {"train_loss": -26.439300537109375, "global_step": 560409, "epoch": 6751} {"train_loss": -27.484479904174805, "global_step": 560410, "epoch": 6751} {"train_loss": -27.86030387878418, "global_step": 560411, "epoch": 6751} {"train_loss": -27.158588409423828, "global_step": 560412, "epoch": 6751} {"train_loss": -27.630924224853516, "global_step": 560413, "epoch": 6751} {"train_loss": -27.8685245513916, "global_step": 560414, "epoch": 6751} {"train_loss": -27.349263869136212, "global_step": 560415, "epoch": 6751, "val_loss": 6348981.0} {"train_loss": -26.760211944580078, "global_step": 560416, "epoch": 6752} {"train_loss": -25.244131088256836, "global_step": 560417, "epoch": 6752} {"train_loss": -25.85273551940918, "global_step": 560418, "epoch": 6752} {"train_loss": -26.807880401611328, "global_step": 560419, "epoch": 6752} {"train_loss": -26.562911987304688, "global_step": 560420, "epoch": 6752} {"train_loss": -26.89173698425293, "global_step": 560421, "epoch": 6752} {"train_loss": -26.492969512939453, "global_step": 560422, "epoch": 6752} {"train_loss": -26.9866886138916, "global_step": 560423, "epoch": 6752} {"train_loss": -26.68497657775879, "global_step": 560424, "epoch": 6752} {"train_loss": -26.812854766845703, "global_step": 560425, "epoch": 6752} {"train_loss": -26.867650985717773, "global_step": 560426, "epoch": 6752} {"train_loss": -27.565387725830078, "global_step": 560427, "epoch": 6752} {"train_loss": -26.969762802124023, "global_step": 560428, "epoch": 6752} {"train_loss": -27.19964027404785, "global_step": 560429, "epoch": 6752} {"train_loss": -27.142053604125977, "global_step": 560430, "epoch": 6752} {"train_loss": -27.242826461791992, "global_step": 560431, "epoch": 6752} {"train_loss": -27.11910057067871, "global_step": 560432, "epoch": 6752} {"train_loss": -27.295196533203125, "global_step": 560433, "epoch": 6752} {"train_loss": -27.473840713500977, "global_step": 560434, "epoch": 6752} {"train_loss": -27.326251983642578, "global_step": 560435, "epoch": 6752} {"train_loss": -27.300912857055664, "global_step": 560436, "epoch": 6752} {"train_loss": -27.5699462890625, "global_step": 560437, "epoch": 6752} {"train_loss": -27.521087646484375, "global_step": 560438, "epoch": 6752} {"train_loss": -27.815107345581055, "global_step": 560439, "epoch": 6752} {"train_loss": -27.6468505859375, "global_step": 560440, "epoch": 6752} {"train_loss": -27.397403717041016, "global_step": 560441, "epoch": 6752} {"train_loss": -27.746768951416016, "global_step": 560442, "epoch": 6752} {"train_loss": -27.749835968017578, "global_step": 560443, "epoch": 6752} {"train_loss": -27.453683853149414, "global_step": 560444, "epoch": 6752} {"train_loss": -27.37556266784668, "global_step": 560445, "epoch": 6752} {"train_loss": -27.916858673095703, "global_step": 560446, "epoch": 6752} {"train_loss": -27.66663932800293, "global_step": 560447, "epoch": 6752} {"train_loss": -27.53788185119629, "global_step": 560448, "epoch": 6752} {"train_loss": -27.742944717407227, "global_step": 560449, "epoch": 6752} {"train_loss": -28.1832332611084, "global_step": 560450, "epoch": 6752} {"train_loss": -27.565082550048828, "global_step": 560451, "epoch": 6752} {"train_loss": -27.5860652923584, "global_step": 560452, "epoch": 6752} {"train_loss": -27.339696884155273, "global_step": 560453, "epoch": 6752} {"train_loss": -27.70380210876465, "global_step": 560454, "epoch": 6752} {"train_loss": -27.456945419311523, "global_step": 560455, "epoch": 6752} {"train_loss": -27.653181076049805, "global_step": 560456, "epoch": 6752} {"train_loss": -27.95309829711914, "global_step": 560457, "epoch": 6752} {"train_loss": -27.899030685424805, "global_step": 560458, "epoch": 6752} {"train_loss": -27.810760498046875, "global_step": 560459, "epoch": 6752} {"train_loss": -28.155118942260742, "global_step": 560460, "epoch": 6752} {"train_loss": -27.637311935424805, "global_step": 560461, "epoch": 6752} {"train_loss": -27.923593521118164, "global_step": 560462, "epoch": 6752} {"train_loss": -27.935789108276367, "global_step": 560463, "epoch": 6752} {"train_loss": -27.8199405670166, "global_step": 560464, "epoch": 6752} {"train_loss": -28.038543701171875, "global_step": 560465, "epoch": 6752} {"train_loss": -27.68958854675293, "global_step": 560466, "epoch": 6752} {"train_loss": -28.190799713134766, "global_step": 560467, "epoch": 6752} {"train_loss": -27.78154945373535, "global_step": 560468, "epoch": 6752} {"train_loss": -27.91769790649414, "global_step": 560469, "epoch": 6752} {"train_loss": -28.20090103149414, "global_step": 560470, "epoch": 6752} {"train_loss": -27.88262939453125, "global_step": 560471, "epoch": 6752} {"train_loss": -28.01166343688965, "global_step": 560472, "epoch": 6752} {"train_loss": -27.560285568237305, "global_step": 560473, "epoch": 6752} {"train_loss": -27.964197158813477, "global_step": 560474, "epoch": 6752} {"train_loss": -27.969152450561523, "global_step": 560475, "epoch": 6752} {"train_loss": -28.145078659057617, "global_step": 560476, "epoch": 6752} {"train_loss": -27.6272029876709, "global_step": 560477, "epoch": 6752} {"train_loss": -27.092426300048828, "global_step": 560478, "epoch": 6752} {"train_loss": -26.65778923034668, "global_step": 560479, "epoch": 6752} {"train_loss": -27.557342529296875, "global_step": 560480, "epoch": 6752} {"train_loss": -28.05258560180664, "global_step": 560481, "epoch": 6752} {"train_loss": -28.059011459350586, "global_step": 560482, "epoch": 6752} {"train_loss": -27.947860717773438, "global_step": 560483, "epoch": 6752} {"train_loss": -27.75886344909668, "global_step": 560484, "epoch": 6752} {"train_loss": -27.87800407409668, "global_step": 560485, "epoch": 6752} {"train_loss": -27.79273796081543, "global_step": 560486, "epoch": 6752} {"train_loss": -27.943811416625977, "global_step": 560487, "epoch": 6752} {"train_loss": -27.897809982299805, "global_step": 560488, "epoch": 6752} {"train_loss": -27.949132919311523, "global_step": 560489, "epoch": 6752} {"train_loss": -27.698522567749023, "global_step": 560490, "epoch": 6752} {"train_loss": -27.721967697143555, "global_step": 560491, "epoch": 6752} {"train_loss": -27.804956436157227, "global_step": 560492, "epoch": 6752} {"train_loss": -27.993534088134766, "global_step": 560493, "epoch": 6752} {"train_loss": -27.998620986938477, "global_step": 560494, "epoch": 6752} {"train_loss": -27.937442779541016, "global_step": 560495, "epoch": 6752} {"train_loss": -28.01704216003418, "global_step": 560496, "epoch": 6752} {"train_loss": -28.068078994750977, "global_step": 560497, "epoch": 6752} {"train_loss": -27.551545683159887, "global_step": 560498, "epoch": 6752, "val_loss": 6387196.0} {"train_loss": -27.576797485351562, "global_step": 560499, "epoch": 6753} {"train_loss": -27.62604331970215, "global_step": 560500, "epoch": 6753} {"train_loss": -27.71982192993164, "global_step": 560501, "epoch": 6753} {"train_loss": -27.758588790893555, "global_step": 560502, "epoch": 6753} {"train_loss": -27.316558837890625, "global_step": 560503, "epoch": 6753} {"train_loss": -27.136701583862305, "global_step": 560504, "epoch": 6753} {"train_loss": -27.13645362854004, "global_step": 560505, "epoch": 6753} {"train_loss": -27.452550888061523, "global_step": 560506, "epoch": 6753} {"train_loss": -27.530441284179688, "global_step": 560507, "epoch": 6753} {"train_loss": -27.198537826538086, "global_step": 560508, "epoch": 6753} {"train_loss": -27.989171981811523, "global_step": 560509, "epoch": 6753} {"train_loss": -27.75272560119629, "global_step": 560510, "epoch": 6753} {"train_loss": -27.53268814086914, "global_step": 560511, "epoch": 6753} {"train_loss": -27.64960289001465, "global_step": 560512, "epoch": 6753} {"train_loss": -27.74881362915039, "global_step": 560513, "epoch": 6753} {"train_loss": -27.57806968688965, "global_step": 560514, "epoch": 6753} {"train_loss": -27.613224029541016, "global_step": 560515, "epoch": 6753} {"train_loss": -27.75428581237793, "global_step": 560516, "epoch": 6753} {"train_loss": -27.505416870117188, "global_step": 560517, "epoch": 6753} {"train_loss": -27.776708602905273, "global_step": 560518, "epoch": 6753} {"train_loss": -27.635303497314453, "global_step": 560519, "epoch": 6753} {"train_loss": -28.185791015625, "global_step": 560520, "epoch": 6753} {"train_loss": -28.185644149780273, "global_step": 560521, "epoch": 6753} {"train_loss": -27.87867546081543, "global_step": 560522, "epoch": 6753} {"train_loss": -27.742176055908203, "global_step": 560523, "epoch": 6753} {"train_loss": -27.70802116394043, "global_step": 560524, "epoch": 6753} {"train_loss": -27.820417404174805, "global_step": 560525, "epoch": 6753} {"train_loss": -28.106128692626953, "global_step": 560526, "epoch": 6753} {"train_loss": -27.894123077392578, "global_step": 560527, "epoch": 6753} {"train_loss": -27.929651260375977, "global_step": 560528, "epoch": 6753} {"train_loss": -28.18440818786621, "global_step": 560529, "epoch": 6753} {"train_loss": -28.117511749267578, "global_step": 560530, "epoch": 6753} {"train_loss": -27.701581954956055, "global_step": 560531, "epoch": 6753} {"train_loss": -27.768491744995117, "global_step": 560532, "epoch": 6753} {"train_loss": -28.095434188842773, "global_step": 560533, "epoch": 6753} {"train_loss": -27.806396484375, "global_step": 560534, "epoch": 6753} {"train_loss": -27.675830841064453, "global_step": 560535, "epoch": 6753} {"train_loss": -27.6800479888916, "global_step": 560536, "epoch": 6753} {"train_loss": -27.712127685546875, "global_step": 560537, "epoch": 6753} {"train_loss": -27.899396896362305, "global_step": 560538, "epoch": 6753} {"train_loss": -27.970449447631836, "global_step": 560539, "epoch": 6753} {"train_loss": -27.832386016845703, "global_step": 560540, "epoch": 6753} {"train_loss": -27.635461807250977, "global_step": 560541, "epoch": 6753} {"train_loss": -27.82421875, "global_step": 560542, "epoch": 6753} {"train_loss": -27.79428482055664, "global_step": 560543, "epoch": 6753} {"train_loss": -27.881887435913086, "global_step": 560544, "epoch": 6753} {"train_loss": -27.77608299255371, "global_step": 560545, "epoch": 6753} {"train_loss": -27.438940048217773, "global_step": 560546, "epoch": 6753} {"train_loss": -27.608915328979492, "global_step": 560547, "epoch": 6753} {"train_loss": -27.67782974243164, "global_step": 560548, "epoch": 6753} {"train_loss": -28.2836856842041, "global_step": 560549, "epoch": 6753} {"train_loss": -28.050052642822266, "global_step": 560550, "epoch": 6753} {"train_loss": -28.114044189453125, "global_step": 560551, "epoch": 6753} {"train_loss": -27.346296310424805, "global_step": 560552, "epoch": 6753} {"train_loss": -27.330942153930664, "global_step": 560553, "epoch": 6753} {"train_loss": -27.716459274291992, "global_step": 560554, "epoch": 6753} {"train_loss": -27.75874137878418, "global_step": 560555, "epoch": 6753} {"train_loss": -27.74755859375, "global_step": 560556, "epoch": 6753} {"train_loss": -27.5670108795166, "global_step": 560557, "epoch": 6753} {"train_loss": -27.640546798706055, "global_step": 560558, "epoch": 6753} {"train_loss": -27.947330474853516, "global_step": 560559, "epoch": 6753} {"train_loss": -27.6873722076416, "global_step": 560560, "epoch": 6753} {"train_loss": -27.636926651000977, "global_step": 560561, "epoch": 6753} {"train_loss": -27.701980590820312, "global_step": 560562, "epoch": 6753} {"train_loss": -27.565343856811523, "global_step": 560563, "epoch": 6753} {"train_loss": -27.94891357421875, "global_step": 560564, "epoch": 6753} {"train_loss": -27.599416732788086, "global_step": 560565, "epoch": 6753} {"train_loss": -27.055206298828125, "global_step": 560566, "epoch": 6753} {"train_loss": -27.88523292541504, "global_step": 560567, "epoch": 6753} {"train_loss": -27.56733512878418, "global_step": 560568, "epoch": 6753} {"train_loss": -27.228546142578125, "global_step": 560569, "epoch": 6753} {"train_loss": -28.03143882751465, "global_step": 560570, "epoch": 6753} {"train_loss": -27.247018814086914, "global_step": 560571, "epoch": 6753} {"train_loss": -27.798376083374023, "global_step": 560572, "epoch": 6753} {"train_loss": -27.831212997436523, "global_step": 560573, "epoch": 6753} {"train_loss": -27.470550537109375, "global_step": 560574, "epoch": 6753} {"train_loss": -27.554834365844727, "global_step": 560575, "epoch": 6753} {"train_loss": -27.5463924407959, "global_step": 560576, "epoch": 6753} {"train_loss": -27.693761825561523, "global_step": 560577, "epoch": 6753} {"train_loss": -27.582727432250977, "global_step": 560578, "epoch": 6753} {"train_loss": -27.59858512878418, "global_step": 560579, "epoch": 6753} {"train_loss": -27.393781661987305, "global_step": 560580, "epoch": 6753} {"train_loss": -27.710510966289473, "global_step": 560581, "epoch": 6753, "val_loss": 6312833.0} {"train_loss": -26.584253311157227, "global_step": 560582, "epoch": 6754} {"train_loss": -27.342208862304688, "global_step": 560583, "epoch": 6754} {"train_loss": -26.104429244995117, "global_step": 560584, "epoch": 6754} {"train_loss": -26.484058380126953, "global_step": 560585, "epoch": 6754} {"train_loss": -26.68592643737793, "global_step": 560586, "epoch": 6754} {"train_loss": -27.280744552612305, "global_step": 560587, "epoch": 6754} {"train_loss": -26.67670249938965, "global_step": 560588, "epoch": 6754} {"train_loss": -26.96040153503418, "global_step": 560589, "epoch": 6754} {"train_loss": -27.254236221313477, "global_step": 560590, "epoch": 6754} {"train_loss": -26.87749671936035, "global_step": 560591, "epoch": 6754} {"train_loss": -27.118072509765625, "global_step": 560592, "epoch": 6754} {"train_loss": -27.1652889251709, "global_step": 560593, "epoch": 6754} {"train_loss": -27.369001388549805, "global_step": 560594, "epoch": 6754} {"train_loss": -27.09392738342285, "global_step": 560595, "epoch": 6754} {"train_loss": -27.34498405456543, "global_step": 560596, "epoch": 6754} {"train_loss": -27.376331329345703, "global_step": 560597, "epoch": 6754} {"train_loss": -27.688257217407227, "global_step": 560598, "epoch": 6754} {"train_loss": -27.589008331298828, "global_step": 560599, "epoch": 6754} {"train_loss": -27.600101470947266, "global_step": 560600, "epoch": 6754} {"train_loss": -27.587005615234375, "global_step": 560601, "epoch": 6754} {"train_loss": -27.594852447509766, "global_step": 560602, "epoch": 6754} {"train_loss": -27.627826690673828, "global_step": 560603, "epoch": 6754} {"train_loss": -27.31800651550293, "global_step": 560604, "epoch": 6754} {"train_loss": -27.225854873657227, "global_step": 560605, "epoch": 6754} {"train_loss": -27.30495262145996, "global_step": 560606, "epoch": 6754} {"train_loss": -27.4527645111084, "global_step": 560607, "epoch": 6754} {"train_loss": -27.509735107421875, "global_step": 560608, "epoch": 6754} {"train_loss": -27.674381256103516, "global_step": 560609, "epoch": 6754} {"train_loss": -27.63704490661621, "global_step": 560610, "epoch": 6754} {"train_loss": -27.635711669921875, "global_step": 560611, "epoch": 6754} {"train_loss": -27.38970375061035, "global_step": 560612, "epoch": 6754} {"train_loss": -27.8426513671875, "global_step": 560613, "epoch": 6754} {"train_loss": -27.410757064819336, "global_step": 560614, "epoch": 6754} {"train_loss": -27.4656925201416, "global_step": 560615, "epoch": 6754} {"train_loss": -27.69080924987793, "global_step": 560616, "epoch": 6754} {"train_loss": -27.414947509765625, "global_step": 560617, "epoch": 6754} {"train_loss": -27.462295532226562, "global_step": 560618, "epoch": 6754} {"train_loss": -27.66119956970215, "global_step": 560619, "epoch": 6754} {"train_loss": -27.385883331298828, "global_step": 560620, "epoch": 6754} {"train_loss": -27.0968074798584, "global_step": 560621, "epoch": 6754} {"train_loss": -27.74835205078125, "global_step": 560622, "epoch": 6754} {"train_loss": -27.828704833984375, "global_step": 560623, "epoch": 6754} {"train_loss": -27.963315963745117, "global_step": 560624, "epoch": 6754} {"train_loss": -27.8631649017334, "global_step": 560625, "epoch": 6754} {"train_loss": -27.72327995300293, "global_step": 560626, "epoch": 6754} {"train_loss": -28.417255401611328, "global_step": 560627, "epoch": 6754} {"train_loss": -27.787240982055664, "global_step": 560628, "epoch": 6754} {"train_loss": -28.33930778503418, "global_step": 560629, "epoch": 6754} {"train_loss": -27.77228355407715, "global_step": 560630, "epoch": 6754} {"train_loss": -28.172449111938477, "global_step": 560631, "epoch": 6754} {"train_loss": -27.896076202392578, "global_step": 560632, "epoch": 6754} {"train_loss": -27.863723754882812, "global_step": 560633, "epoch": 6754} {"train_loss": -28.243528366088867, "global_step": 560634, "epoch": 6754} {"train_loss": -28.131677627563477, "global_step": 560635, "epoch": 6754} {"train_loss": -27.991662979125977, "global_step": 560636, "epoch": 6754} {"train_loss": -27.6746883392334, "global_step": 560637, "epoch": 6754} {"train_loss": -27.7537841796875, "global_step": 560638, "epoch": 6754} {"train_loss": -27.923059463500977, "global_step": 560639, "epoch": 6754} {"train_loss": -27.90693473815918, "global_step": 560640, "epoch": 6754} {"train_loss": -28.08968162536621, "global_step": 560641, "epoch": 6754} {"train_loss": -28.295806884765625, "global_step": 560642, "epoch": 6754} {"train_loss": -27.883764266967773, "global_step": 560643, "epoch": 6754} {"train_loss": -27.83310890197754, "global_step": 560644, "epoch": 6754} {"train_loss": -27.8007869720459, "global_step": 560645, "epoch": 6754} {"train_loss": -28.02973747253418, "global_step": 560646, "epoch": 6754} {"train_loss": -27.82171630859375, "global_step": 560647, "epoch": 6754} {"train_loss": -27.766448974609375, "global_step": 560648, "epoch": 6754} {"train_loss": -27.906970977783203, "global_step": 560649, "epoch": 6754} {"train_loss": -27.81537437438965, "global_step": 560650, "epoch": 6754} {"train_loss": -28.279468536376953, "global_step": 560651, "epoch": 6754} {"train_loss": -28.0750789642334, "global_step": 560652, "epoch": 6754} {"train_loss": -27.84014320373535, "global_step": 560653, "epoch": 6754} {"train_loss": -27.99544334411621, "global_step": 560654, "epoch": 6754} {"train_loss": -28.03870964050293, "global_step": 560655, "epoch": 6754} {"train_loss": -27.814651489257812, "global_step": 560656, "epoch": 6754} {"train_loss": -27.509695053100586, "global_step": 560657, "epoch": 6754} {"train_loss": -28.025251388549805, "global_step": 560658, "epoch": 6754} {"train_loss": -27.89460563659668, "global_step": 560659, "epoch": 6754} {"train_loss": -27.9538631439209, "global_step": 560660, "epoch": 6754} {"train_loss": -28.049713134765625, "global_step": 560661, "epoch": 6754} {"train_loss": -28.12896156311035, "global_step": 560662, "epoch": 6754} {"train_loss": -27.5113525390625, "global_step": 560663, "epoch": 6754} {"train_loss": -27.639917005975562, "global_step": 560664, "epoch": 6754, "val_loss": 6408953.5} {"train_loss": -26.599853515625, "global_step": 560665, "epoch": 6755} {"train_loss": -27.057098388671875, "global_step": 560666, "epoch": 6755} {"train_loss": -25.85210609436035, "global_step": 560667, "epoch": 6755} {"train_loss": -26.881696701049805, "global_step": 560668, "epoch": 6755} {"train_loss": -27.062986373901367, "global_step": 560669, "epoch": 6755} {"train_loss": -26.61773681640625, "global_step": 560670, "epoch": 6755} {"train_loss": -27.02247428894043, "global_step": 560671, "epoch": 6755} {"train_loss": -27.391210556030273, "global_step": 560672, "epoch": 6755} {"train_loss": -27.12898063659668, "global_step": 560673, "epoch": 6755} {"train_loss": -27.215429306030273, "global_step": 560674, "epoch": 6755} {"train_loss": -27.36652183532715, "global_step": 560675, "epoch": 6755} {"train_loss": -27.250593185424805, "global_step": 560676, "epoch": 6755} {"train_loss": -27.58546257019043, "global_step": 560677, "epoch": 6755} {"train_loss": -27.46917724609375, "global_step": 560678, "epoch": 6755} {"train_loss": -27.3864688873291, "global_step": 560679, "epoch": 6755} {"train_loss": -27.55859375, "global_step": 560680, "epoch": 6755} {"train_loss": -27.917219161987305, "global_step": 560681, "epoch": 6755} {"train_loss": -27.328540802001953, "global_step": 560682, "epoch": 6755} {"train_loss": -27.48634147644043, "global_step": 560683, "epoch": 6755} {"train_loss": -27.67024803161621, "global_step": 560684, "epoch": 6755} {"train_loss": -27.543256759643555, "global_step": 560685, "epoch": 6755} {"train_loss": -27.730701446533203, "global_step": 560686, "epoch": 6755} {"train_loss": -27.659982681274414, "global_step": 560687, "epoch": 6755} {"train_loss": -27.779224395751953, "global_step": 560688, "epoch": 6755} {"train_loss": -27.730127334594727, "global_step": 560689, "epoch": 6755} {"train_loss": -27.598602294921875, "global_step": 560690, "epoch": 6755} {"train_loss": -27.648395538330078, "global_step": 560691, "epoch": 6755} {"train_loss": -27.7963924407959, "global_step": 560692, "epoch": 6755} {"train_loss": -28.229206085205078, "global_step": 560693, "epoch": 6755} {"train_loss": -27.587202072143555, "global_step": 560694, "epoch": 6755} {"train_loss": -27.684194564819336, "global_step": 560695, "epoch": 6755} {"train_loss": -27.587305068969727, "global_step": 560696, "epoch": 6755} {"train_loss": -27.816930770874023, "global_step": 560697, "epoch": 6755} {"train_loss": -27.799976348876953, "global_step": 560698, "epoch": 6755} {"train_loss": -27.91025161743164, "global_step": 560699, "epoch": 6755} {"train_loss": -27.64453125, "global_step": 560700, "epoch": 6755} {"train_loss": -28.197998046875, "global_step": 560701, "epoch": 6755} {"train_loss": -27.756061553955078, "global_step": 560702, "epoch": 6755} {"train_loss": -27.631555557250977, "global_step": 560703, "epoch": 6755} {"train_loss": -27.917572021484375, "global_step": 560704, "epoch": 6755} {"train_loss": -28.08465003967285, "global_step": 560705, "epoch": 6755} {"train_loss": -27.793088912963867, "global_step": 560706, "epoch": 6755} {"train_loss": -27.329320907592773, "global_step": 560707, "epoch": 6755} {"train_loss": -27.914569854736328, "global_step": 560708, "epoch": 6755} {"train_loss": -27.901458740234375, "global_step": 560709, "epoch": 6755} {"train_loss": -27.7203369140625, "global_step": 560710, "epoch": 6755} {"train_loss": -28.133996963500977, "global_step": 560711, "epoch": 6755} {"train_loss": -28.047168731689453, "global_step": 560712, "epoch": 6755} {"train_loss": -27.61969566345215, "global_step": 560713, "epoch": 6755} {"train_loss": -28.106664657592773, "global_step": 560714, "epoch": 6755} {"train_loss": -27.9130802154541, "global_step": 560715, "epoch": 6755} {"train_loss": -27.978412628173828, "global_step": 560716, "epoch": 6755} {"train_loss": -28.16912269592285, "global_step": 560717, "epoch": 6755} {"train_loss": -27.756494522094727, "global_step": 560718, "epoch": 6755} {"train_loss": -27.879169464111328, "global_step": 560719, "epoch": 6755} {"train_loss": -27.903472900390625, "global_step": 560720, "epoch": 6755} {"train_loss": -27.935272216796875, "global_step": 560721, "epoch": 6755} {"train_loss": -27.83138084411621, "global_step": 560722, "epoch": 6755} {"train_loss": -27.599164962768555, "global_step": 560723, "epoch": 6755} {"train_loss": -28.036100387573242, "global_step": 560724, "epoch": 6755} {"train_loss": -27.970617294311523, "global_step": 560725, "epoch": 6755} {"train_loss": -27.75103759765625, "global_step": 560726, "epoch": 6755} {"train_loss": -27.757598876953125, "global_step": 560727, "epoch": 6755} {"train_loss": -27.77496337890625, "global_step": 560728, "epoch": 6755} {"train_loss": -27.35675048828125, "global_step": 560729, "epoch": 6755} {"train_loss": -27.770660400390625, "global_step": 560730, "epoch": 6755} {"train_loss": -28.036813735961914, "global_step": 560731, "epoch": 6755} {"train_loss": -27.938827514648438, "global_step": 560732, "epoch": 6755} {"train_loss": -27.777936935424805, "global_step": 560733, "epoch": 6755} {"train_loss": -27.322046279907227, "global_step": 560734, "epoch": 6755} {"train_loss": -27.758108139038086, "global_step": 560735, "epoch": 6755} {"train_loss": -27.876834869384766, "global_step": 560736, "epoch": 6755} {"train_loss": -27.7737979888916, "global_step": 560737, "epoch": 6755} {"train_loss": -27.5102596282959, "global_step": 560738, "epoch": 6755} {"train_loss": -27.671405792236328, "global_step": 560739, "epoch": 6755} {"train_loss": -27.743148803710938, "global_step": 560740, "epoch": 6755} {"train_loss": -26.994028091430664, "global_step": 560741, "epoch": 6755} {"train_loss": -26.855300903320312, "global_step": 560742, "epoch": 6755} {"train_loss": -28.123395919799805, "global_step": 560743, "epoch": 6755} {"train_loss": -27.950796127319336, "global_step": 560744, "epoch": 6755} {"train_loss": -27.68951988220215, "global_step": 560745, "epoch": 6755} {"train_loss": -27.96858787536621, "global_step": 560746, "epoch": 6755} {"train_loss": -27.621145662054957, "global_step": 560747, "epoch": 6755, "val_loss": 6403724.0} {"train_loss": -27.3330078125, "global_step": 560748, "epoch": 6756} {"train_loss": -27.559614181518555, "global_step": 560749, "epoch": 6756} {"train_loss": -27.380521774291992, "global_step": 560750, "epoch": 6756} {"train_loss": -27.618972778320312, "global_step": 560751, "epoch": 6756} {"train_loss": -27.1324405670166, "global_step": 560752, "epoch": 6756} {"train_loss": -26.983169555664062, "global_step": 560753, "epoch": 6756} {"train_loss": -27.41532325744629, "global_step": 560754, "epoch": 6756} {"train_loss": -26.949193954467773, "global_step": 560755, "epoch": 6756} {"train_loss": -27.670276641845703, "global_step": 560756, "epoch": 6756} {"train_loss": -27.196985244750977, "global_step": 560757, "epoch": 6756} {"train_loss": -27.4882869720459, "global_step": 560758, "epoch": 6756} {"train_loss": -27.345727920532227, "global_step": 560759, "epoch": 6756} {"train_loss": -27.568973541259766, "global_step": 560760, "epoch": 6756} {"train_loss": -27.466083526611328, "global_step": 560761, "epoch": 6756} {"train_loss": -27.637786865234375, "global_step": 560762, "epoch": 6756} {"train_loss": -27.757770538330078, "global_step": 560763, "epoch": 6756} {"train_loss": -27.71573257446289, "global_step": 560764, "epoch": 6756} {"train_loss": -27.72981071472168, "global_step": 560765, "epoch": 6756} {"train_loss": -27.421981811523438, "global_step": 560766, "epoch": 6756} {"train_loss": -27.486419677734375, "global_step": 560767, "epoch": 6756} {"train_loss": -27.579029083251953, "global_step": 560768, "epoch": 6756} {"train_loss": -27.652297973632812, "global_step": 560769, "epoch": 6756} {"train_loss": -27.78083610534668, "global_step": 560770, "epoch": 6756} {"train_loss": -27.463937759399414, "global_step": 560771, "epoch": 6756} {"train_loss": -27.93939781188965, "global_step": 560772, "epoch": 6756} {"train_loss": -28.12017250061035, "global_step": 560773, "epoch": 6756} {"train_loss": -27.7733154296875, "global_step": 560774, "epoch": 6756} {"train_loss": -27.882898330688477, "global_step": 560775, "epoch": 6756} {"train_loss": -27.758214950561523, "global_step": 560776, "epoch": 6756} {"train_loss": -27.830900192260742, "global_step": 560777, "epoch": 6756} {"train_loss": -27.559417724609375, "global_step": 560778, "epoch": 6756} {"train_loss": -27.847436904907227, "global_step": 560779, "epoch": 6756} {"train_loss": -27.579137802124023, "global_step": 560780, "epoch": 6756} {"train_loss": -27.925268173217773, "global_step": 560781, "epoch": 6756} {"train_loss": -27.943872451782227, "global_step": 560782, "epoch": 6756} {"train_loss": -27.893102645874023, "global_step": 560783, "epoch": 6756} {"train_loss": -27.702926635742188, "global_step": 560784, "epoch": 6756} {"train_loss": -27.533735275268555, "global_step": 560785, "epoch": 6756} {"train_loss": -27.63681983947754, "global_step": 560786, "epoch": 6756} {"train_loss": -27.98101234436035, "global_step": 560787, "epoch": 6756} {"train_loss": -27.789518356323242, "global_step": 560788, "epoch": 6756} {"train_loss": -27.991195678710938, "global_step": 560789, "epoch": 6756} {"train_loss": -27.588275909423828, "global_step": 560790, "epoch": 6756} {"train_loss": -28.09646987915039, "global_step": 560791, "epoch": 6756} {"train_loss": -27.981969833374023, "global_step": 560792, "epoch": 6756} {"train_loss": -28.058170318603516, "global_step": 560793, "epoch": 6756} {"train_loss": -27.847198486328125, "global_step": 560794, "epoch": 6756} {"train_loss": -27.77325439453125, "global_step": 560795, "epoch": 6756} {"train_loss": -28.118183135986328, "global_step": 560796, "epoch": 6756} {"train_loss": -28.120574951171875, "global_step": 560797, "epoch": 6756} {"train_loss": -28.053680419921875, "global_step": 560798, "epoch": 6756} {"train_loss": -28.3526668548584, "global_step": 560799, "epoch": 6756} {"train_loss": -28.086095809936523, "global_step": 560800, "epoch": 6756} {"train_loss": -28.05099868774414, "global_step": 560801, "epoch": 6756} {"train_loss": -27.91607093811035, "global_step": 560802, "epoch": 6756} {"train_loss": -27.999347686767578, "global_step": 560803, "epoch": 6756} {"train_loss": -27.980268478393555, "global_step": 560804, "epoch": 6756} {"train_loss": -28.013046264648438, "global_step": 560805, "epoch": 6756} {"train_loss": -28.172882080078125, "global_step": 560806, "epoch": 6756} {"train_loss": -27.423093795776367, "global_step": 560807, "epoch": 6756} {"train_loss": -27.899372100830078, "global_step": 560808, "epoch": 6756} {"train_loss": -27.45501136779785, "global_step": 560809, "epoch": 6756} {"train_loss": -27.222732543945312, "global_step": 560810, "epoch": 6756} {"train_loss": -26.53801918029785, "global_step": 560811, "epoch": 6756} {"train_loss": -27.097578048706055, "global_step": 560812, "epoch": 6756} {"train_loss": -27.341833114624023, "global_step": 560813, "epoch": 6756} {"train_loss": -27.590513229370117, "global_step": 560814, "epoch": 6756} {"train_loss": -26.934711456298828, "global_step": 560815, "epoch": 6756} {"train_loss": -27.492795944213867, "global_step": 560816, "epoch": 6756} {"train_loss": -27.616931915283203, "global_step": 560817, "epoch": 6756} {"train_loss": -27.4775447845459, "global_step": 560818, "epoch": 6756} {"train_loss": -27.290369033813477, "global_step": 560819, "epoch": 6756} {"train_loss": -27.526336669921875, "global_step": 560820, "epoch": 6756} {"train_loss": -27.442493438720703, "global_step": 560821, "epoch": 6756} {"train_loss": -27.697681427001953, "global_step": 560822, "epoch": 6756} {"train_loss": -27.728281021118164, "global_step": 560823, "epoch": 6756} {"train_loss": -27.60027503967285, "global_step": 560824, "epoch": 6756} {"train_loss": -27.806732177734375, "global_step": 560825, "epoch": 6756} {"train_loss": -27.5610408782959, "global_step": 560826, "epoch": 6756} {"train_loss": -27.756561279296875, "global_step": 560827, "epoch": 6756} {"train_loss": -27.667449951171875, "global_step": 560828, "epoch": 6756} {"train_loss": -27.917510986328125, "global_step": 560829, "epoch": 6756} {"train_loss": -27.65724981836526, "global_step": 560830, "epoch": 6756, "val_loss": 6369082.5} {"train_loss": -27.651309967041016, "global_step": 560831, "epoch": 6757} {"train_loss": -27.39344596862793, "global_step": 560832, "epoch": 6757} {"train_loss": -27.654773712158203, "global_step": 560833, "epoch": 6757} {"train_loss": -27.468143463134766, "global_step": 560834, "epoch": 6757} {"train_loss": -27.713830947875977, "global_step": 560835, "epoch": 6757} {"train_loss": -27.233474731445312, "global_step": 560836, "epoch": 6757} {"train_loss": -27.611328125, "global_step": 560837, "epoch": 6757} {"train_loss": -27.55458641052246, "global_step": 560838, "epoch": 6757} {"train_loss": -26.683012008666992, "global_step": 560839, "epoch": 6757} {"train_loss": -27.540014266967773, "global_step": 560840, "epoch": 6757} {"train_loss": -27.747228622436523, "global_step": 560841, "epoch": 6757} {"train_loss": -27.48419189453125, "global_step": 560842, "epoch": 6757} {"train_loss": -27.416004180908203, "global_step": 560843, "epoch": 6757} {"train_loss": -27.5993709564209, "global_step": 560844, "epoch": 6757} {"train_loss": -27.456445693969727, "global_step": 560845, "epoch": 6757} {"train_loss": -27.734058380126953, "global_step": 560846, "epoch": 6757} {"train_loss": -27.856292724609375, "global_step": 560847, "epoch": 6757} {"train_loss": -27.476552963256836, "global_step": 560848, "epoch": 6757} {"train_loss": -27.847448348999023, "global_step": 560849, "epoch": 6757} {"train_loss": -27.914525985717773, "global_step": 560850, "epoch": 6757} {"train_loss": -27.63166618347168, "global_step": 560851, "epoch": 6757} {"train_loss": -28.041196823120117, "global_step": 560852, "epoch": 6757} {"train_loss": -27.986997604370117, "global_step": 560853, "epoch": 6757} {"train_loss": -27.667387008666992, "global_step": 560854, "epoch": 6757} {"train_loss": -28.089801788330078, "global_step": 560855, "epoch": 6757} {"train_loss": -27.7384090423584, "global_step": 560856, "epoch": 6757} {"train_loss": -28.005542755126953, "global_step": 560857, "epoch": 6757} {"train_loss": -27.628936767578125, "global_step": 560858, "epoch": 6757} {"train_loss": -27.912612915039062, "global_step": 560859, "epoch": 6757} {"train_loss": -28.152023315429688, "global_step": 560860, "epoch": 6757} {"train_loss": -28.092071533203125, "global_step": 560861, "epoch": 6757} {"train_loss": -28.21051025390625, "global_step": 560862, "epoch": 6757} {"train_loss": -28.25080680847168, "global_step": 560863, "epoch": 6757} {"train_loss": -27.87041664123535, "global_step": 560864, "epoch": 6757} {"train_loss": -27.877573013305664, "global_step": 560865, "epoch": 6757} {"train_loss": -27.958044052124023, "global_step": 560866, "epoch": 6757} {"train_loss": -27.922494888305664, "global_step": 560867, "epoch": 6757} {"train_loss": -27.509998321533203, "global_step": 560868, "epoch": 6757} {"train_loss": -27.882566452026367, "global_step": 560869, "epoch": 6757} {"train_loss": -27.627899169921875, "global_step": 560870, "epoch": 6757} {"train_loss": -27.89628028869629, "global_step": 560871, "epoch": 6757} {"train_loss": -28.14031410217285, "global_step": 560872, "epoch": 6757} {"train_loss": -27.825037002563477, "global_step": 560873, "epoch": 6757} {"train_loss": -28.153533935546875, "global_step": 560874, "epoch": 6757} {"train_loss": -27.8845157623291, "global_step": 560875, "epoch": 6757} {"train_loss": -28.123523712158203, "global_step": 560876, "epoch": 6757} {"train_loss": -28.361509323120117, "global_step": 560877, "epoch": 6757} {"train_loss": -28.04047203063965, "global_step": 560878, "epoch": 6757} {"train_loss": -27.95831871032715, "global_step": 560879, "epoch": 6757} {"train_loss": -27.715784072875977, "global_step": 560880, "epoch": 6757} {"train_loss": -28.147485733032227, "global_step": 560881, "epoch": 6757} {"train_loss": -27.70867347717285, "global_step": 560882, "epoch": 6757} {"train_loss": -27.95252799987793, "global_step": 560883, "epoch": 6757} {"train_loss": -27.854040145874023, "global_step": 560884, "epoch": 6757} {"train_loss": -27.782007217407227, "global_step": 560885, "epoch": 6757} {"train_loss": -28.021326065063477, "global_step": 560886, "epoch": 6757} {"train_loss": -27.77618980407715, "global_step": 560887, "epoch": 6757} {"train_loss": -27.89029312133789, "global_step": 560888, "epoch": 6757} {"train_loss": -28.255685806274414, "global_step": 560889, "epoch": 6757} {"train_loss": -27.842309951782227, "global_step": 560890, "epoch": 6757} {"train_loss": -28.207794189453125, "global_step": 560891, "epoch": 6757} {"train_loss": -27.869144439697266, "global_step": 560892, "epoch": 6757} {"train_loss": -28.152917861938477, "global_step": 560893, "epoch": 6757} {"train_loss": -28.070417404174805, "global_step": 560894, "epoch": 6757} {"train_loss": -27.769073486328125, "global_step": 560895, "epoch": 6757} {"train_loss": -27.847379684448242, "global_step": 560896, "epoch": 6757} {"train_loss": -27.83538818359375, "global_step": 560897, "epoch": 6757} {"train_loss": -27.7598819732666, "global_step": 560898, "epoch": 6757} {"train_loss": -27.24262046813965, "global_step": 560899, "epoch": 6757} {"train_loss": -27.04915428161621, "global_step": 560900, "epoch": 6757} {"train_loss": -27.238677978515625, "global_step": 560901, "epoch": 6757} {"train_loss": -27.3599853515625, "global_step": 560902, "epoch": 6757} {"train_loss": -27.196121215820312, "global_step": 560903, "epoch": 6757} {"train_loss": -27.2780704498291, "global_step": 560904, "epoch": 6757} {"train_loss": -27.80548095703125, "global_step": 560905, "epoch": 6757} {"train_loss": -27.723743438720703, "global_step": 560906, "epoch": 6757} {"train_loss": -27.41643714904785, "global_step": 560907, "epoch": 6757} {"train_loss": -27.47681999206543, "global_step": 560908, "epoch": 6757} {"train_loss": -27.70395851135254, "global_step": 560909, "epoch": 6757} {"train_loss": -27.51838493347168, "global_step": 560910, "epoch": 6757} {"train_loss": -27.381610870361328, "global_step": 560911, "epoch": 6757} {"train_loss": -27.322284698486328, "global_step": 560912, "epoch": 6757} {"train_loss": -27.75377919300493, "global_step": 560913, "epoch": 6757, "val_loss": 6356491.5} {"train_loss": -26.96211051940918, "global_step": 560914, "epoch": 6758} {"train_loss": -26.920644760131836, "global_step": 560915, "epoch": 6758} {"train_loss": -27.096654891967773, "global_step": 560916, "epoch": 6758} {"train_loss": -26.920654296875, "global_step": 560917, "epoch": 6758} {"train_loss": -27.249038696289062, "global_step": 560918, "epoch": 6758} {"train_loss": -27.10102653503418, "global_step": 560919, "epoch": 6758} {"train_loss": -27.013418197631836, "global_step": 560920, "epoch": 6758} {"train_loss": -27.285938262939453, "global_step": 560921, "epoch": 6758} {"train_loss": -26.76397132873535, "global_step": 560922, "epoch": 6758} {"train_loss": -27.121612548828125, "global_step": 560923, "epoch": 6758} {"train_loss": -26.60464859008789, "global_step": 560924, "epoch": 6758} {"train_loss": -27.765716552734375, "global_step": 560925, "epoch": 6758} {"train_loss": -27.096372604370117, "global_step": 560926, "epoch": 6758} {"train_loss": -27.59328269958496, "global_step": 560927, "epoch": 6758} {"train_loss": -26.818103790283203, "global_step": 560928, "epoch": 6758} {"train_loss": -27.5924015045166, "global_step": 560929, "epoch": 6758} {"train_loss": -27.226760864257812, "global_step": 560930, "epoch": 6758} {"train_loss": -27.319379806518555, "global_step": 560931, "epoch": 6758} {"train_loss": -27.456541061401367, "global_step": 560932, "epoch": 6758} {"train_loss": -27.348651885986328, "global_step": 560933, "epoch": 6758} {"train_loss": -27.325042724609375, "global_step": 560934, "epoch": 6758} {"train_loss": -27.522247314453125, "global_step": 560935, "epoch": 6758} {"train_loss": -27.473703384399414, "global_step": 560936, "epoch": 6758} {"train_loss": -27.7721004486084, "global_step": 560937, "epoch": 6758} {"train_loss": -27.29851722717285, "global_step": 560938, "epoch": 6758} {"train_loss": -27.750946044921875, "global_step": 560939, "epoch": 6758} {"train_loss": -27.959747314453125, "global_step": 560940, "epoch": 6758} {"train_loss": -27.792652130126953, "global_step": 560941, "epoch": 6758} {"train_loss": -27.348743438720703, "global_step": 560942, "epoch": 6758} {"train_loss": -27.61503028869629, "global_step": 560943, "epoch": 6758} {"train_loss": -27.4119873046875, "global_step": 560944, "epoch": 6758} {"train_loss": -28.17445182800293, "global_step": 560945, "epoch": 6758} {"train_loss": -27.9102840423584, "global_step": 560946, "epoch": 6758} {"train_loss": -27.86572265625, "global_step": 560947, "epoch": 6758} {"train_loss": -27.827768325805664, "global_step": 560948, "epoch": 6758} {"train_loss": -27.64375114440918, "global_step": 560949, "epoch": 6758} {"train_loss": -27.867551803588867, "global_step": 560950, "epoch": 6758} {"train_loss": -27.402109146118164, "global_step": 560951, "epoch": 6758} {"train_loss": -28.048633575439453, "global_step": 560952, "epoch": 6758} {"train_loss": -27.990863800048828, "global_step": 560953, "epoch": 6758} {"train_loss": -28.049116134643555, "global_step": 560954, "epoch": 6758} {"train_loss": -28.0815486907959, "global_step": 560955, "epoch": 6758} {"train_loss": -27.278839111328125, "global_step": 560956, "epoch": 6758} {"train_loss": -28.058568954467773, "global_step": 560957, "epoch": 6758} {"train_loss": -27.643644332885742, "global_step": 560958, "epoch": 6758} {"train_loss": -27.620527267456055, "global_step": 560959, "epoch": 6758} {"train_loss": -27.789880752563477, "global_step": 560960, "epoch": 6758} {"train_loss": -28.1184024810791, "global_step": 560961, "epoch": 6758} {"train_loss": -28.14208984375, "global_step": 560962, "epoch": 6758} {"train_loss": -27.856185913085938, "global_step": 560963, "epoch": 6758} {"train_loss": -27.841766357421875, "global_step": 560964, "epoch": 6758} {"train_loss": -28.112638473510742, "global_step": 560965, "epoch": 6758} {"train_loss": -27.682241439819336, "global_step": 560966, "epoch": 6758} {"train_loss": -27.700986862182617, "global_step": 560967, "epoch": 6758} {"train_loss": -27.358610153198242, "global_step": 560968, "epoch": 6758} {"train_loss": -27.3364315032959, "global_step": 560969, "epoch": 6758} {"train_loss": -27.2178955078125, "global_step": 560970, "epoch": 6758} {"train_loss": -26.7109317779541, "global_step": 560971, "epoch": 6758} {"train_loss": -27.81441307067871, "global_step": 560972, "epoch": 6758} {"train_loss": -27.552734375, "global_step": 560973, "epoch": 6758} {"train_loss": -27.080453872680664, "global_step": 560974, "epoch": 6758} {"train_loss": -27.14011001586914, "global_step": 560975, "epoch": 6758} {"train_loss": -28.08310317993164, "global_step": 560976, "epoch": 6758} {"train_loss": -27.360761642456055, "global_step": 560977, "epoch": 6758} {"train_loss": -27.436506271362305, "global_step": 560978, "epoch": 6758} {"train_loss": -27.746261596679688, "global_step": 560979, "epoch": 6758} {"train_loss": -27.818418502807617, "global_step": 560980, "epoch": 6758} {"train_loss": -27.206884384155273, "global_step": 560981, "epoch": 6758} {"train_loss": -27.45340919494629, "global_step": 560982, "epoch": 6758} {"train_loss": -27.5877742767334, "global_step": 560983, "epoch": 6758} {"train_loss": -27.529447555541992, "global_step": 560984, "epoch": 6758} {"train_loss": -27.4028377532959, "global_step": 560985, "epoch": 6758} {"train_loss": -27.704517364501953, "global_step": 560986, "epoch": 6758} {"train_loss": -27.552032470703125, "global_step": 560987, "epoch": 6758} {"train_loss": -27.588788986206055, "global_step": 560988, "epoch": 6758} {"train_loss": -27.61737632751465, "global_step": 560989, "epoch": 6758} {"train_loss": -27.47199058532715, "global_step": 560990, "epoch": 6758} {"train_loss": -27.917020797729492, "global_step": 560991, "epoch": 6758} {"train_loss": -27.83123779296875, "global_step": 560992, "epoch": 6758} {"train_loss": -27.676191329956055, "global_step": 560993, "epoch": 6758} {"train_loss": -27.960248947143555, "global_step": 560994, "epoch": 6758} {"train_loss": -27.596206665039062, "global_step": 560995, "epoch": 6758} {"train_loss": -27.534361965685004, "global_step": 560996, "epoch": 6758, "val_loss": 6360173.0} {"train_loss": -27.35426902770996, "global_step": 560997, "epoch": 6759} {"train_loss": -27.28485107421875, "global_step": 560998, "epoch": 6759} {"train_loss": -27.537561416625977, "global_step": 560999, "epoch": 6759} {"train_loss": -27.57451820373535, "global_step": 561000, "epoch": 6759} {"train_loss": -27.5090274810791, "global_step": 561001, "epoch": 6759} {"train_loss": -27.578723907470703, "global_step": 561002, "epoch": 6759} {"train_loss": -27.83502769470215, "global_step": 561003, "epoch": 6759} {"train_loss": -27.74153709411621, "global_step": 561004, "epoch": 6759} {"train_loss": -27.45945167541504, "global_step": 561005, "epoch": 6759} {"train_loss": -27.319232940673828, "global_step": 561006, "epoch": 6759} {"train_loss": -27.602746963500977, "global_step": 561007, "epoch": 6759} {"train_loss": -27.62322998046875, "global_step": 561008, "epoch": 6759} {"train_loss": -27.55891227722168, "global_step": 561009, "epoch": 6759} {"train_loss": -27.428342819213867, "global_step": 561010, "epoch": 6759} {"train_loss": -27.894617080688477, "global_step": 561011, "epoch": 6759} {"train_loss": -27.9262638092041, "global_step": 561012, "epoch": 6759} {"train_loss": -27.19195556640625, "global_step": 561013, "epoch": 6759} {"train_loss": -27.52142333984375, "global_step": 561014, "epoch": 6759} {"train_loss": -27.966876983642578, "global_step": 561015, "epoch": 6759} {"train_loss": -28.0054988861084, "global_step": 561016, "epoch": 6759} {"train_loss": -27.292062759399414, "global_step": 561017, "epoch": 6759} {"train_loss": -27.580158233642578, "global_step": 561018, "epoch": 6759} {"train_loss": -27.982288360595703, "global_step": 561019, "epoch": 6759} {"train_loss": -27.33453941345215, "global_step": 561020, "epoch": 6759} {"train_loss": -28.17047119140625, "global_step": 561021, "epoch": 6759} {"train_loss": -27.62156105041504, "global_step": 561022, "epoch": 6759} {"train_loss": -27.114501953125, "global_step": 561023, "epoch": 6759} {"train_loss": -27.756540298461914, "global_step": 561024, "epoch": 6759} {"train_loss": -28.26508903503418, "global_step": 561025, "epoch": 6759} {"train_loss": -27.781614303588867, "global_step": 561026, "epoch": 6759} {"train_loss": -27.53826904296875, "global_step": 561027, "epoch": 6759} {"train_loss": -27.923776626586914, "global_step": 561028, "epoch": 6759} {"train_loss": -27.815732955932617, "global_step": 561029, "epoch": 6759} {"train_loss": -27.978784561157227, "global_step": 561030, "epoch": 6759} {"train_loss": -28.211181640625, "global_step": 561031, "epoch": 6759} {"train_loss": -27.695241928100586, "global_step": 561032, "epoch": 6759} {"train_loss": -27.834985733032227, "global_step": 561033, "epoch": 6759} {"train_loss": -27.786890029907227, "global_step": 561034, "epoch": 6759} {"train_loss": -27.88043785095215, "global_step": 561035, "epoch": 6759} {"train_loss": -27.8505916595459, "global_step": 561036, "epoch": 6759} {"train_loss": -27.84429931640625, "global_step": 561037, "epoch": 6759} {"train_loss": -27.800756454467773, "global_step": 561038, "epoch": 6759} {"train_loss": -27.94451332092285, "global_step": 561039, "epoch": 6759} {"train_loss": -27.880603790283203, "global_step": 561040, "epoch": 6759} {"train_loss": -28.250659942626953, "global_step": 561041, "epoch": 6759} {"train_loss": -27.7506046295166, "global_step": 561042, "epoch": 6759} {"train_loss": -27.819753646850586, "global_step": 561043, "epoch": 6759} {"train_loss": -28.02176284790039, "global_step": 561044, "epoch": 6759} {"train_loss": -27.548736572265625, "global_step": 561045, "epoch": 6759} {"train_loss": -28.133224487304688, "global_step": 561046, "epoch": 6759} {"train_loss": -27.50282096862793, "global_step": 561047, "epoch": 6759} {"train_loss": -27.32097816467285, "global_step": 561048, "epoch": 6759} {"train_loss": -27.335617065429688, "global_step": 561049, "epoch": 6759} {"train_loss": -27.938861846923828, "global_step": 561050, "epoch": 6759} {"train_loss": -27.987390518188477, "global_step": 561051, "epoch": 6759} {"train_loss": -27.761213302612305, "global_step": 561052, "epoch": 6759} {"train_loss": -28.1403865814209, "global_step": 561053, "epoch": 6759} {"train_loss": -27.629819869995117, "global_step": 561054, "epoch": 6759} {"train_loss": -27.997222900390625, "global_step": 561055, "epoch": 6759} {"train_loss": -27.550491333007812, "global_step": 561056, "epoch": 6759} {"train_loss": -27.863500595092773, "global_step": 561057, "epoch": 6759} {"train_loss": -27.81056022644043, "global_step": 561058, "epoch": 6759} {"train_loss": -27.68867301940918, "global_step": 561059, "epoch": 6759} {"train_loss": -27.671918869018555, "global_step": 561060, "epoch": 6759} {"train_loss": -27.714941024780273, "global_step": 561061, "epoch": 6759} {"train_loss": -27.51209831237793, "global_step": 561062, "epoch": 6759} {"train_loss": -27.361438751220703, "global_step": 561063, "epoch": 6759} {"train_loss": -27.83148193359375, "global_step": 561064, "epoch": 6759} {"train_loss": -26.946203231811523, "global_step": 561065, "epoch": 6759} {"train_loss": -27.131668090820312, "global_step": 561066, "epoch": 6759} {"train_loss": -27.91533851623535, "global_step": 561067, "epoch": 6759} {"train_loss": -27.856760025024414, "global_step": 561068, "epoch": 6759} {"train_loss": -27.746932983398438, "global_step": 561069, "epoch": 6759} {"train_loss": -27.102697372436523, "global_step": 561070, "epoch": 6759} {"train_loss": -28.133798599243164, "global_step": 561071, "epoch": 6759} {"train_loss": -27.813190460205078, "global_step": 561072, "epoch": 6759} {"train_loss": -28.05759048461914, "global_step": 561073, "epoch": 6759} {"train_loss": -27.916589736938477, "global_step": 561074, "epoch": 6759} {"train_loss": -27.677932739257812, "global_step": 561075, "epoch": 6759} {"train_loss": -27.88921546936035, "global_step": 561076, "epoch": 6759} {"train_loss": -27.53217887878418, "global_step": 561077, "epoch": 6759} {"train_loss": -27.68124771118164, "global_step": 561078, "epoch": 6759} {"train_loss": -27.691021034516485, "global_step": 561079, "epoch": 6759, "val_loss": 6403107.0} {"train_loss": -25.915210723876953, "global_step": 561080, "epoch": 6760} {"train_loss": -26.232580184936523, "global_step": 561081, "epoch": 6760} {"train_loss": -26.15130043029785, "global_step": 561082, "epoch": 6760} {"train_loss": -26.453800201416016, "global_step": 561083, "epoch": 6760} {"train_loss": -25.87175941467285, "global_step": 561084, "epoch": 6760} {"train_loss": -27.242116928100586, "global_step": 561085, "epoch": 6760} {"train_loss": -26.251422882080078, "global_step": 561086, "epoch": 6760} {"train_loss": -27.031452178955078, "global_step": 561087, "epoch": 6760} {"train_loss": -27.044723510742188, "global_step": 561088, "epoch": 6760} {"train_loss": -26.74074363708496, "global_step": 561089, "epoch": 6760} {"train_loss": -27.458118438720703, "global_step": 561090, "epoch": 6760} {"train_loss": -27.358335494995117, "global_step": 561091, "epoch": 6760} {"train_loss": -26.745954513549805, "global_step": 561092, "epoch": 6760} {"train_loss": -27.22199821472168, "global_step": 561093, "epoch": 6760} {"train_loss": -27.298675537109375, "global_step": 561094, "epoch": 6760} {"train_loss": -27.220123291015625, "global_step": 561095, "epoch": 6760} {"train_loss": -27.01247215270996, "global_step": 561096, "epoch": 6760} {"train_loss": -27.195480346679688, "global_step": 561097, "epoch": 6760} {"train_loss": -26.980825424194336, "global_step": 561098, "epoch": 6760} {"train_loss": -27.226598739624023, "global_step": 561099, "epoch": 6760} {"train_loss": -27.560728073120117, "global_step": 561100, "epoch": 6760} {"train_loss": -27.36787223815918, "global_step": 561101, "epoch": 6760} {"train_loss": -27.156036376953125, "global_step": 561102, "epoch": 6760} {"train_loss": -26.95186424255371, "global_step": 561103, "epoch": 6760} {"train_loss": -27.43256187438965, "global_step": 561104, "epoch": 6760} {"train_loss": -27.192922592163086, "global_step": 561105, "epoch": 6760} {"train_loss": -26.995410919189453, "global_step": 561106, "epoch": 6760} {"train_loss": -26.911691665649414, "global_step": 561107, "epoch": 6760} {"train_loss": -27.17720603942871, "global_step": 561108, "epoch": 6760} {"train_loss": -27.173608779907227, "global_step": 561109, "epoch": 6760} {"train_loss": -27.62823486328125, "global_step": 561110, "epoch": 6760} {"train_loss": -27.37395668029785, "global_step": 561111, "epoch": 6760} {"train_loss": -27.3840274810791, "global_step": 561112, "epoch": 6760} {"train_loss": -27.155826568603516, "global_step": 561113, "epoch": 6760} {"train_loss": -27.482711791992188, "global_step": 561114, "epoch": 6760} {"train_loss": -27.641637802124023, "global_step": 561115, "epoch": 6760} {"train_loss": -27.419843673706055, "global_step": 561116, "epoch": 6760} {"train_loss": -27.886188507080078, "global_step": 561117, "epoch": 6760} {"train_loss": -27.317218780517578, "global_step": 561118, "epoch": 6760} {"train_loss": -27.942895889282227, "global_step": 561119, "epoch": 6760} {"train_loss": -27.847320556640625, "global_step": 561120, "epoch": 6760} {"train_loss": -27.72538185119629, "global_step": 561121, "epoch": 6760} {"train_loss": -28.12017250061035, "global_step": 561122, "epoch": 6760} {"train_loss": -27.80341911315918, "global_step": 561123, "epoch": 6760} {"train_loss": -27.456817626953125, "global_step": 561124, "epoch": 6760} {"train_loss": -27.74212646484375, "global_step": 561125, "epoch": 6760} {"train_loss": -27.855085372924805, "global_step": 561126, "epoch": 6760} {"train_loss": -27.634119033813477, "global_step": 561127, "epoch": 6760} {"train_loss": -27.273679733276367, "global_step": 561128, "epoch": 6760} {"train_loss": -27.757299423217773, "global_step": 561129, "epoch": 6760} {"train_loss": -27.674102783203125, "global_step": 561130, "epoch": 6760} {"train_loss": -27.700855255126953, "global_step": 561131, "epoch": 6760} {"train_loss": -27.84726905822754, "global_step": 561132, "epoch": 6760} {"train_loss": -28.112747192382812, "global_step": 561133, "epoch": 6760} {"train_loss": -28.14206886291504, "global_step": 561134, "epoch": 6760} {"train_loss": -28.342391967773438, "global_step": 561135, "epoch": 6760} {"train_loss": -27.88612174987793, "global_step": 561136, "epoch": 6760} {"train_loss": -27.930145263671875, "global_step": 561137, "epoch": 6760} {"train_loss": -28.258726119995117, "global_step": 561138, "epoch": 6760} {"train_loss": -27.76889419555664, "global_step": 561139, "epoch": 6760} {"train_loss": -28.19455909729004, "global_step": 561140, "epoch": 6760} {"train_loss": -28.018728256225586, "global_step": 561141, "epoch": 6760} {"train_loss": -28.02117347717285, "global_step": 561142, "epoch": 6760} {"train_loss": -27.958663940429688, "global_step": 561143, "epoch": 6760} {"train_loss": -28.2392578125, "global_step": 561144, "epoch": 6760} {"train_loss": -28.46709632873535, "global_step": 561145, "epoch": 6760} {"train_loss": -28.131750106811523, "global_step": 561146, "epoch": 6760} {"train_loss": -27.807538986206055, "global_step": 561147, "epoch": 6760} {"train_loss": -27.497207641601562, "global_step": 561148, "epoch": 6760} {"train_loss": -27.801355361938477, "global_step": 561149, "epoch": 6760} {"train_loss": -28.134002685546875, "global_step": 561150, "epoch": 6760} {"train_loss": -27.949060440063477, "global_step": 561151, "epoch": 6760} {"train_loss": -27.66650390625, "global_step": 561152, "epoch": 6760} {"train_loss": -27.525165557861328, "global_step": 561153, "epoch": 6760} {"train_loss": -27.518476486206055, "global_step": 561154, "epoch": 6760} {"train_loss": -27.762853622436523, "global_step": 561155, "epoch": 6760} {"train_loss": -28.105382919311523, "global_step": 561156, "epoch": 6760} {"train_loss": -27.704761505126953, "global_step": 561157, "epoch": 6760} {"train_loss": -27.928869247436523, "global_step": 561158, "epoch": 6760} {"train_loss": -28.151350021362305, "global_step": 561159, "epoch": 6760} {"train_loss": -27.8582763671875, "global_step": 561160, "epoch": 6760} {"train_loss": -27.85980224609375, "global_step": 561161, "epoch": 6760} {"train_loss": -27.505384123468975, "global_step": 561162, "epoch": 6760, "val_loss": 6347513.0} {"train_loss": -27.10322380065918, "global_step": 561163, "epoch": 6761} {"train_loss": -26.748743057250977, "global_step": 561164, "epoch": 6761} {"train_loss": -26.789953231811523, "global_step": 561165, "epoch": 6761} {"train_loss": -27.2667236328125, "global_step": 561166, "epoch": 6761} {"train_loss": -26.732709884643555, "global_step": 561167, "epoch": 6761} {"train_loss": -27.5704402923584, "global_step": 561168, "epoch": 6761} {"train_loss": -27.1970157623291, "global_step": 561169, "epoch": 6761} {"train_loss": -27.78834342956543, "global_step": 561170, "epoch": 6761} {"train_loss": -27.57747459411621, "global_step": 561171, "epoch": 6761} {"train_loss": -27.39823341369629, "global_step": 561172, "epoch": 6761} {"train_loss": -27.92487907409668, "global_step": 561173, "epoch": 6761} {"train_loss": -27.396759033203125, "global_step": 561174, "epoch": 6761} {"train_loss": -27.642196655273438, "global_step": 561175, "epoch": 6761} {"train_loss": -27.470645904541016, "global_step": 561176, "epoch": 6761} {"train_loss": -27.513166427612305, "global_step": 561177, "epoch": 6761} {"train_loss": -27.650915145874023, "global_step": 561178, "epoch": 6761} {"train_loss": -27.885196685791016, "global_step": 561179, "epoch": 6761} {"train_loss": -27.0236759185791, "global_step": 561180, "epoch": 6761} {"train_loss": -27.88885498046875, "global_step": 561181, "epoch": 6761} {"train_loss": -27.376007080078125, "global_step": 561182, "epoch": 6761} {"train_loss": -27.240100860595703, "global_step": 561183, "epoch": 6761} {"train_loss": -27.7242374420166, "global_step": 561184, "epoch": 6761} {"train_loss": -27.592193603515625, "global_step": 561185, "epoch": 6761} {"train_loss": -27.842870712280273, "global_step": 561186, "epoch": 6761} {"train_loss": -27.793066024780273, "global_step": 561187, "epoch": 6761} {"train_loss": -27.53409767150879, "global_step": 561188, "epoch": 6761} {"train_loss": -27.34214210510254, "global_step": 561189, "epoch": 6761} {"train_loss": -27.694080352783203, "global_step": 561190, "epoch": 6761} {"train_loss": -27.756378173828125, "global_step": 561191, "epoch": 6761} {"train_loss": -27.81573486328125, "global_step": 561192, "epoch": 6761} {"train_loss": -27.910505294799805, "global_step": 561193, "epoch": 6761} {"train_loss": -27.804052352905273, "global_step": 561194, "epoch": 6761} {"train_loss": -27.94368553161621, "global_step": 561195, "epoch": 6761} {"train_loss": -27.8469181060791, "global_step": 561196, "epoch": 6761} {"train_loss": -27.983285903930664, "global_step": 561197, "epoch": 6761} {"train_loss": -27.786792755126953, "global_step": 561198, "epoch": 6761} {"train_loss": -27.741657257080078, "global_step": 561199, "epoch": 6761} {"train_loss": -28.1524600982666, "global_step": 561200, "epoch": 6761} {"train_loss": -27.783859252929688, "global_step": 561201, "epoch": 6761} {"train_loss": -27.588796615600586, "global_step": 561202, "epoch": 6761} {"train_loss": -28.01685905456543, "global_step": 561203, "epoch": 6761} {"train_loss": -27.754682540893555, "global_step": 561204, "epoch": 6761} {"train_loss": -27.938241958618164, "global_step": 561205, "epoch": 6761} {"train_loss": -27.800683975219727, "global_step": 561206, "epoch": 6761} {"train_loss": -27.644195556640625, "global_step": 561207, "epoch": 6761} {"train_loss": -27.69831657409668, "global_step": 561208, "epoch": 6761} {"train_loss": -27.74860191345215, "global_step": 561209, "epoch": 6761} {"train_loss": -27.734771728515625, "global_step": 561210, "epoch": 6761} {"train_loss": -27.830846786499023, "global_step": 561211, "epoch": 6761} {"train_loss": -27.67523765563965, "global_step": 561212, "epoch": 6761} {"train_loss": -27.8431396484375, "global_step": 561213, "epoch": 6761} {"train_loss": -27.814682006835938, "global_step": 561214, "epoch": 6761} {"train_loss": -28.07758140563965, "global_step": 561215, "epoch": 6761} {"train_loss": -27.8465518951416, "global_step": 561216, "epoch": 6761} {"train_loss": -27.876611709594727, "global_step": 561217, "epoch": 6761} {"train_loss": -27.859909057617188, "global_step": 561218, "epoch": 6761} {"train_loss": -28.169788360595703, "global_step": 561219, "epoch": 6761} {"train_loss": -27.54545021057129, "global_step": 561220, "epoch": 6761} {"train_loss": -28.12554359436035, "global_step": 561221, "epoch": 6761} {"train_loss": -27.608062744140625, "global_step": 561222, "epoch": 6761} {"train_loss": -27.926227569580078, "global_step": 561223, "epoch": 6761} {"train_loss": -27.4459285736084, "global_step": 561224, "epoch": 6761} {"train_loss": -27.792804718017578, "global_step": 561225, "epoch": 6761} {"train_loss": -27.6424560546875, "global_step": 561226, "epoch": 6761} {"train_loss": -27.641132354736328, "global_step": 561227, "epoch": 6761} {"train_loss": -27.620059967041016, "global_step": 561228, "epoch": 6761} {"train_loss": -27.069814682006836, "global_step": 561229, "epoch": 6761} {"train_loss": -27.67069435119629, "global_step": 561230, "epoch": 6761} {"train_loss": -27.840612411499023, "global_step": 561231, "epoch": 6761} {"train_loss": -27.354034423828125, "global_step": 561232, "epoch": 6761} {"train_loss": -27.131826400756836, "global_step": 561233, "epoch": 6761} {"train_loss": -27.513769149780273, "global_step": 561234, "epoch": 6761} {"train_loss": -28.193729400634766, "global_step": 561235, "epoch": 6761} {"train_loss": -27.361831665039062, "global_step": 561236, "epoch": 6761} {"train_loss": -28.021472930908203, "global_step": 561237, "epoch": 6761} {"train_loss": -27.889175415039062, "global_step": 561238, "epoch": 6761} {"train_loss": -27.82794189453125, "global_step": 561239, "epoch": 6761} {"train_loss": -27.81471061706543, "global_step": 561240, "epoch": 6761} {"train_loss": -28.048660278320312, "global_step": 561241, "epoch": 6761} {"train_loss": -27.8836727142334, "global_step": 561242, "epoch": 6761} {"train_loss": -27.78729248046875, "global_step": 561243, "epoch": 6761} {"train_loss": -28.1569766998291, "global_step": 561244, "epoch": 6761} {"train_loss": -27.68086378258395, "global_step": 561245, "epoch": 6761, "val_loss": 6372535.0} {"train_loss": -27.421781539916992, "global_step": 561246, "epoch": 6762} {"train_loss": -27.421463012695312, "global_step": 561247, "epoch": 6762} {"train_loss": -26.348493576049805, "global_step": 561248, "epoch": 6762} {"train_loss": -26.51179313659668, "global_step": 561249, "epoch": 6762} {"train_loss": -26.739044189453125, "global_step": 561250, "epoch": 6762} {"train_loss": -27.130517959594727, "global_step": 561251, "epoch": 6762} {"train_loss": -27.219894409179688, "global_step": 561252, "epoch": 6762} {"train_loss": -27.54506492614746, "global_step": 561253, "epoch": 6762} {"train_loss": -26.93635368347168, "global_step": 561254, "epoch": 6762} {"train_loss": -27.294971466064453, "global_step": 561255, "epoch": 6762} {"train_loss": -27.13412857055664, "global_step": 561256, "epoch": 6762} {"train_loss": -27.61468505859375, "global_step": 561257, "epoch": 6762} {"train_loss": -26.908613204956055, "global_step": 561258, "epoch": 6762} {"train_loss": -27.05726432800293, "global_step": 561259, "epoch": 6762} {"train_loss": -27.454370498657227, "global_step": 561260, "epoch": 6762} {"train_loss": -27.330636978149414, "global_step": 561261, "epoch": 6762} {"train_loss": -27.4912052154541, "global_step": 561262, "epoch": 6762} {"train_loss": -27.45534324645996, "global_step": 561263, "epoch": 6762} {"train_loss": -27.41267967224121, "global_step": 561264, "epoch": 6762} {"train_loss": -27.79904556274414, "global_step": 561265, "epoch": 6762} {"train_loss": -27.497802734375, "global_step": 561266, "epoch": 6762} {"train_loss": -27.572179794311523, "global_step": 561267, "epoch": 6762} {"train_loss": -27.39401626586914, "global_step": 561268, "epoch": 6762} {"train_loss": -28.176105499267578, "global_step": 561269, "epoch": 6762} {"train_loss": -27.5606632232666, "global_step": 561270, "epoch": 6762} {"train_loss": -27.561269760131836, "global_step": 561271, "epoch": 6762} {"train_loss": -27.522336959838867, "global_step": 561272, "epoch": 6762} {"train_loss": -28.001605987548828, "global_step": 561273, "epoch": 6762} {"train_loss": -27.715803146362305, "global_step": 561274, "epoch": 6762} {"train_loss": -28.003528594970703, "global_step": 561275, "epoch": 6762} {"train_loss": -27.821887969970703, "global_step": 561276, "epoch": 6762} {"train_loss": -27.62554931640625, "global_step": 561277, "epoch": 6762} {"train_loss": -27.560565948486328, "global_step": 561278, "epoch": 6762} {"train_loss": -27.657983779907227, "global_step": 561279, "epoch": 6762} {"train_loss": -27.813718795776367, "global_step": 561280, "epoch": 6762} {"train_loss": -27.583526611328125, "global_step": 561281, "epoch": 6762} {"train_loss": -27.5614070892334, "global_step": 561282, "epoch": 6762} {"train_loss": -27.4406681060791, "global_step": 561283, "epoch": 6762} {"train_loss": -27.736530303955078, "global_step": 561284, "epoch": 6762} {"train_loss": -27.58233070373535, "global_step": 561285, "epoch": 6762} {"train_loss": -27.5283145904541, "global_step": 561286, "epoch": 6762} {"train_loss": -27.502521514892578, "global_step": 561287, "epoch": 6762} {"train_loss": -27.72210121154785, "global_step": 561288, "epoch": 6762} {"train_loss": -28.119873046875, "global_step": 561289, "epoch": 6762} {"train_loss": -27.93747901916504, "global_step": 561290, "epoch": 6762} {"train_loss": -27.9420108795166, "global_step": 561291, "epoch": 6762} {"train_loss": -27.75005531311035, "global_step": 561292, "epoch": 6762} {"train_loss": -27.49488639831543, "global_step": 561293, "epoch": 6762} {"train_loss": -27.785924911499023, "global_step": 561294, "epoch": 6762} {"train_loss": -27.9259033203125, "global_step": 561295, "epoch": 6762} {"train_loss": -27.908466339111328, "global_step": 561296, "epoch": 6762} {"train_loss": -27.837873458862305, "global_step": 561297, "epoch": 6762} {"train_loss": -27.86079978942871, "global_step": 561298, "epoch": 6762} {"train_loss": -28.08921241760254, "global_step": 561299, "epoch": 6762} {"train_loss": -27.695951461791992, "global_step": 561300, "epoch": 6762} {"train_loss": -27.748926162719727, "global_step": 561301, "epoch": 6762} {"train_loss": -27.887155532836914, "global_step": 561302, "epoch": 6762} {"train_loss": -28.11223793029785, "global_step": 561303, "epoch": 6762} {"train_loss": -27.765100479125977, "global_step": 561304, "epoch": 6762} {"train_loss": -27.41416358947754, "global_step": 561305, "epoch": 6762} {"train_loss": -27.43143653869629, "global_step": 561306, "epoch": 6762} {"train_loss": -27.815778732299805, "global_step": 561307, "epoch": 6762} {"train_loss": -27.767362594604492, "global_step": 561308, "epoch": 6762} {"train_loss": -27.914356231689453, "global_step": 561309, "epoch": 6762} {"train_loss": -28.09853172302246, "global_step": 561310, "epoch": 6762} {"train_loss": -27.848073959350586, "global_step": 561311, "epoch": 6762} {"train_loss": -27.68362808227539, "global_step": 561312, "epoch": 6762} {"train_loss": -27.66240882873535, "global_step": 561313, "epoch": 6762} {"train_loss": -27.878217697143555, "global_step": 561314, "epoch": 6762} {"train_loss": -27.966821670532227, "global_step": 561315, "epoch": 6762} {"train_loss": -27.821762084960938, "global_step": 561316, "epoch": 6762} {"train_loss": -28.029067993164062, "global_step": 561317, "epoch": 6762} {"train_loss": -27.931472778320312, "global_step": 561318, "epoch": 6762} {"train_loss": -27.90085220336914, "global_step": 561319, "epoch": 6762} {"train_loss": -27.911893844604492, "global_step": 561320, "epoch": 6762} {"train_loss": -27.91019630432129, "global_step": 561321, "epoch": 6762} {"train_loss": -28.3289737701416, "global_step": 561322, "epoch": 6762} {"train_loss": -27.756010055541992, "global_step": 561323, "epoch": 6762} {"train_loss": -27.641321182250977, "global_step": 561324, "epoch": 6762} {"train_loss": -27.57172203063965, "global_step": 561325, "epoch": 6762} {"train_loss": -26.763263702392578, "global_step": 561326, "epoch": 6762} {"train_loss": -28.07354736328125, "global_step": 561327, "epoch": 6762} {"train_loss": -27.61834084844015, "global_step": 561328, "epoch": 6762, "val_loss": 6375944.0} {"train_loss": -26.609790802001953, "global_step": 561329, "epoch": 6763} {"train_loss": -26.438873291015625, "global_step": 561330, "epoch": 6763} {"train_loss": -26.65767478942871, "global_step": 561331, "epoch": 6763} {"train_loss": -26.972089767456055, "global_step": 561332, "epoch": 6763} {"train_loss": -26.560636520385742, "global_step": 561333, "epoch": 6763} {"train_loss": -26.53409194946289, "global_step": 561334, "epoch": 6763} {"train_loss": -26.950199127197266, "global_step": 561335, "epoch": 6763} {"train_loss": -27.288959503173828, "global_step": 561336, "epoch": 6763} {"train_loss": -26.797286987304688, "global_step": 561337, "epoch": 6763} {"train_loss": -27.35523796081543, "global_step": 561338, "epoch": 6763} {"train_loss": -26.91008949279785, "global_step": 561339, "epoch": 6763} {"train_loss": -27.33479881286621, "global_step": 561340, "epoch": 6763} {"train_loss": -27.270919799804688, "global_step": 561341, "epoch": 6763} {"train_loss": -27.611572265625, "global_step": 561342, "epoch": 6763} {"train_loss": -26.934024810791016, "global_step": 561343, "epoch": 6763} {"train_loss": -27.513853073120117, "global_step": 561344, "epoch": 6763} {"train_loss": -27.19414710998535, "global_step": 561345, "epoch": 6763} {"train_loss": -27.5830020904541, "global_step": 561346, "epoch": 6763} {"train_loss": -27.269132614135742, "global_step": 561347, "epoch": 6763} {"train_loss": -27.239999771118164, "global_step": 561348, "epoch": 6763} {"train_loss": -27.72796058654785, "global_step": 561349, "epoch": 6763} {"train_loss": -27.29253578186035, "global_step": 561350, "epoch": 6763} {"train_loss": -27.3090877532959, "global_step": 561351, "epoch": 6763} {"train_loss": -27.713857650756836, "global_step": 561352, "epoch": 6763} {"train_loss": -27.873950958251953, "global_step": 561353, "epoch": 6763} {"train_loss": -27.181686401367188, "global_step": 561354, "epoch": 6763} {"train_loss": -27.691267013549805, "global_step": 561355, "epoch": 6763} {"train_loss": -27.327289581298828, "global_step": 561356, "epoch": 6763} {"train_loss": -27.561466217041016, "global_step": 561357, "epoch": 6763} {"train_loss": -27.50935173034668, "global_step": 561358, "epoch": 6763} {"train_loss": -27.905981063842773, "global_step": 561359, "epoch": 6763} {"train_loss": -27.803302764892578, "global_step": 561360, "epoch": 6763} {"train_loss": -27.719022750854492, "global_step": 561361, "epoch": 6763} {"train_loss": -27.78842544555664, "global_step": 561362, "epoch": 6763} {"train_loss": -28.10264015197754, "global_step": 561363, "epoch": 6763} {"train_loss": -27.661893844604492, "global_step": 561364, "epoch": 6763} {"train_loss": -27.716064453125, "global_step": 561365, "epoch": 6763} {"train_loss": -27.64485740661621, "global_step": 561366, "epoch": 6763} {"train_loss": -27.860319137573242, "global_step": 561367, "epoch": 6763} {"train_loss": -27.734846115112305, "global_step": 561368, "epoch": 6763} {"train_loss": -27.596811294555664, "global_step": 561369, "epoch": 6763} {"train_loss": -28.175159454345703, "global_step": 561370, "epoch": 6763} {"train_loss": -27.697179794311523, "global_step": 561371, "epoch": 6763} {"train_loss": -27.857791900634766, "global_step": 561372, "epoch": 6763} {"train_loss": -28.026458740234375, "global_step": 561373, "epoch": 6763} {"train_loss": -28.064680099487305, "global_step": 561374, "epoch": 6763} {"train_loss": -27.947538375854492, "global_step": 561375, "epoch": 6763} {"train_loss": -27.78694725036621, "global_step": 561376, "epoch": 6763} {"train_loss": -28.2308292388916, "global_step": 561377, "epoch": 6763} {"train_loss": -27.945348739624023, "global_step": 561378, "epoch": 6763} {"train_loss": -28.010761260986328, "global_step": 561379, "epoch": 6763} {"train_loss": -27.6087646484375, "global_step": 561380, "epoch": 6763} {"train_loss": -27.7485408782959, "global_step": 561381, "epoch": 6763} {"train_loss": -27.89642906188965, "global_step": 561382, "epoch": 6763} {"train_loss": -27.7752742767334, "global_step": 561383, "epoch": 6763} {"train_loss": -27.941205978393555, "global_step": 561384, "epoch": 6763} {"train_loss": -27.77432632446289, "global_step": 561385, "epoch": 6763} {"train_loss": -27.21982765197754, "global_step": 561386, "epoch": 6763} {"train_loss": -27.863693237304688, "global_step": 561387, "epoch": 6763} {"train_loss": -28.013498306274414, "global_step": 561388, "epoch": 6763} {"train_loss": -27.72515296936035, "global_step": 561389, "epoch": 6763} {"train_loss": -28.10041618347168, "global_step": 561390, "epoch": 6763} {"train_loss": -27.5545711517334, "global_step": 561391, "epoch": 6763} {"train_loss": -28.163421630859375, "global_step": 561392, "epoch": 6763} {"train_loss": -27.6602725982666, "global_step": 561393, "epoch": 6763} {"train_loss": -27.699237823486328, "global_step": 561394, "epoch": 6763} {"train_loss": -27.942041397094727, "global_step": 561395, "epoch": 6763} {"train_loss": -27.881200790405273, "global_step": 561396, "epoch": 6763} {"train_loss": -28.174942016601562, "global_step": 561397, "epoch": 6763} {"train_loss": -27.869476318359375, "global_step": 561398, "epoch": 6763} {"train_loss": -28.168127059936523, "global_step": 561399, "epoch": 6763} {"train_loss": -27.795551300048828, "global_step": 561400, "epoch": 6763} {"train_loss": -27.93476676940918, "global_step": 561401, "epoch": 6763} {"train_loss": -27.970447540283203, "global_step": 561402, "epoch": 6763} {"train_loss": -27.640920639038086, "global_step": 561403, "epoch": 6763} {"train_loss": -27.87763023376465, "global_step": 561404, "epoch": 6763} {"train_loss": -27.729267120361328, "global_step": 561405, "epoch": 6763} {"train_loss": -28.098468780517578, "global_step": 561406, "epoch": 6763} {"train_loss": -28.013202667236328, "global_step": 561407, "epoch": 6763} {"train_loss": -27.7176456451416, "global_step": 561408, "epoch": 6763} {"train_loss": -27.906225204467773, "global_step": 561409, "epoch": 6763} {"train_loss": -27.932966232299805, "global_step": 561410, "epoch": 6763} {"train_loss": -27.61311425358416, "global_step": 561411, "epoch": 6763, "val_loss": 6499807.0} {"train_loss": -26.7802791595459, "global_step": 561412, "epoch": 6764} {"train_loss": -27.194982528686523, "global_step": 561413, "epoch": 6764} {"train_loss": -26.920129776000977, "global_step": 561414, "epoch": 6764} {"train_loss": -26.7855167388916, "global_step": 561415, "epoch": 6764} {"train_loss": -27.106277465820312, "global_step": 561416, "epoch": 6764} {"train_loss": -27.033300399780273, "global_step": 561417, "epoch": 6764} {"train_loss": -27.575559616088867, "global_step": 561418, "epoch": 6764} {"train_loss": -27.430633544921875, "global_step": 561419, "epoch": 6764} {"train_loss": -27.357513427734375, "global_step": 561420, "epoch": 6764} {"train_loss": -27.170801162719727, "global_step": 561421, "epoch": 6764} {"train_loss": -27.127836227416992, "global_step": 561422, "epoch": 6764} {"train_loss": -27.373062133789062, "global_step": 561423, "epoch": 6764} {"train_loss": -27.42824363708496, "global_step": 561424, "epoch": 6764} {"train_loss": -26.915420532226562, "global_step": 561425, "epoch": 6764} {"train_loss": -27.554523468017578, "global_step": 561426, "epoch": 6764} {"train_loss": -27.535200119018555, "global_step": 561427, "epoch": 6764} {"train_loss": -27.435739517211914, "global_step": 561428, "epoch": 6764} {"train_loss": -27.611295700073242, "global_step": 561429, "epoch": 6764} {"train_loss": -27.391448974609375, "global_step": 561430, "epoch": 6764} {"train_loss": -27.851240158081055, "global_step": 561431, "epoch": 6764} {"train_loss": -27.809850692749023, "global_step": 561432, "epoch": 6764} {"train_loss": -27.622699737548828, "global_step": 561433, "epoch": 6764} {"train_loss": -28.150516510009766, "global_step": 561434, "epoch": 6764} {"train_loss": -27.8011417388916, "global_step": 561435, "epoch": 6764} {"train_loss": -27.716760635375977, "global_step": 561436, "epoch": 6764} {"train_loss": -27.236984252929688, "global_step": 561437, "epoch": 6764} {"train_loss": -27.447418212890625, "global_step": 561438, "epoch": 6764} {"train_loss": -27.82575798034668, "global_step": 561439, "epoch": 6764} {"train_loss": -27.566577911376953, "global_step": 561440, "epoch": 6764} {"train_loss": -27.548355102539062, "global_step": 561441, "epoch": 6764} {"train_loss": -27.830841064453125, "global_step": 561442, "epoch": 6764} {"train_loss": -27.745824813842773, "global_step": 561443, "epoch": 6764} {"train_loss": -27.655994415283203, "global_step": 561444, "epoch": 6764} {"train_loss": -28.071088790893555, "global_step": 561445, "epoch": 6764} {"train_loss": -27.782941818237305, "global_step": 561446, "epoch": 6764} {"train_loss": -28.0406494140625, "global_step": 561447, "epoch": 6764} {"train_loss": -27.674036026000977, "global_step": 561448, "epoch": 6764} {"train_loss": -28.177961349487305, "global_step": 561449, "epoch": 6764} {"train_loss": -27.9748592376709, "global_step": 561450, "epoch": 6764} {"train_loss": -28.10553550720215, "global_step": 561451, "epoch": 6764} {"train_loss": -28.12060546875, "global_step": 561452, "epoch": 6764} {"train_loss": -28.08888816833496, "global_step": 561453, "epoch": 6764} {"train_loss": -28.12628173828125, "global_step": 561454, "epoch": 6764} {"train_loss": -27.9666748046875, "global_step": 561455, "epoch": 6764} {"train_loss": -28.059650421142578, "global_step": 561456, "epoch": 6764} {"train_loss": -27.882741928100586, "global_step": 561457, "epoch": 6764} {"train_loss": -27.892492294311523, "global_step": 561458, "epoch": 6764} {"train_loss": -28.086668014526367, "global_step": 561459, "epoch": 6764} {"train_loss": -27.68939208984375, "global_step": 561460, "epoch": 6764} {"train_loss": -28.1833438873291, "global_step": 561461, "epoch": 6764} {"train_loss": -27.85367202758789, "global_step": 561462, "epoch": 6764} {"train_loss": -27.982709884643555, "global_step": 561463, "epoch": 6764} {"train_loss": -27.87155532836914, "global_step": 561464, "epoch": 6764} {"train_loss": -27.665449142456055, "global_step": 561465, "epoch": 6764} {"train_loss": -27.896286010742188, "global_step": 561466, "epoch": 6764} {"train_loss": -27.828031539916992, "global_step": 561467, "epoch": 6764} {"train_loss": -27.511533737182617, "global_step": 561468, "epoch": 6764} {"train_loss": -27.22260856628418, "global_step": 561469, "epoch": 6764} {"train_loss": -27.358808517456055, "global_step": 561470, "epoch": 6764} {"train_loss": -26.74700355529785, "global_step": 561471, "epoch": 6764} {"train_loss": -26.450668334960938, "global_step": 561472, "epoch": 6764} {"train_loss": -26.429920196533203, "global_step": 561473, "epoch": 6764} {"train_loss": -27.32606315612793, "global_step": 561474, "epoch": 6764} {"train_loss": -27.704410552978516, "global_step": 561475, "epoch": 6764} {"train_loss": -26.70086097717285, "global_step": 561476, "epoch": 6764} {"train_loss": -27.755456924438477, "global_step": 561477, "epoch": 6764} {"train_loss": -27.59708595275879, "global_step": 561478, "epoch": 6764} {"train_loss": -27.71246337890625, "global_step": 561479, "epoch": 6764} {"train_loss": -27.29292106628418, "global_step": 561480, "epoch": 6764} {"train_loss": -27.79319190979004, "global_step": 561481, "epoch": 6764} {"train_loss": -27.32892417907715, "global_step": 561482, "epoch": 6764} {"train_loss": -27.660425186157227, "global_step": 561483, "epoch": 6764} {"train_loss": -27.58949851989746, "global_step": 561484, "epoch": 6764} {"train_loss": -27.933368682861328, "global_step": 561485, "epoch": 6764} {"train_loss": -27.886014938354492, "global_step": 561486, "epoch": 6764} {"train_loss": -27.810943603515625, "global_step": 561487, "epoch": 6764} {"train_loss": -27.589014053344727, "global_step": 561488, "epoch": 6764} {"train_loss": -27.801883697509766, "global_step": 561489, "epoch": 6764} {"train_loss": -27.967849731445312, "global_step": 561490, "epoch": 6764} {"train_loss": -27.92852210998535, "global_step": 561491, "epoch": 6764} {"train_loss": -27.62224769592285, "global_step": 561492, "epoch": 6764} {"train_loss": -27.281890869140625, "global_step": 561493, "epoch": 6764} {"train_loss": -27.613395369196514, "global_step": 561494, "epoch": 6764, "val_loss": 6453741.0} {"train_loss": -27.1490421295166, "global_step": 561495, "epoch": 6765} {"train_loss": -26.552783966064453, "global_step": 561496, "epoch": 6765} {"train_loss": -26.796247482299805, "global_step": 561497, "epoch": 6765} {"train_loss": -26.970752716064453, "global_step": 561498, "epoch": 6765} {"train_loss": -27.30718994140625, "global_step": 561499, "epoch": 6765} {"train_loss": -27.14470863342285, "global_step": 561500, "epoch": 6765} {"train_loss": -26.78252601623535, "global_step": 561501, "epoch": 6765} {"train_loss": -27.091672897338867, "global_step": 561502, "epoch": 6765} {"train_loss": -27.36048698425293, "global_step": 561503, "epoch": 6765} {"train_loss": -27.408645629882812, "global_step": 561504, "epoch": 6765} {"train_loss": -27.086801528930664, "global_step": 561505, "epoch": 6765} {"train_loss": -27.161848068237305, "global_step": 561506, "epoch": 6765} {"train_loss": -27.6195011138916, "global_step": 561507, "epoch": 6765} {"train_loss": -26.8510684967041, "global_step": 561508, "epoch": 6765} {"train_loss": -27.189680099487305, "global_step": 561509, "epoch": 6765} {"train_loss": -27.233091354370117, "global_step": 561510, "epoch": 6765} {"train_loss": -26.937238693237305, "global_step": 561511, "epoch": 6765} {"train_loss": -27.628576278686523, "global_step": 561512, "epoch": 6765} {"train_loss": -27.4867000579834, "global_step": 561513, "epoch": 6765} {"train_loss": -27.594696044921875, "global_step": 561514, "epoch": 6765} {"train_loss": -27.561176300048828, "global_step": 561515, "epoch": 6765} {"train_loss": -27.715967178344727, "global_step": 561516, "epoch": 6765} {"train_loss": -27.405126571655273, "global_step": 561517, "epoch": 6765} {"train_loss": -27.547534942626953, "global_step": 561518, "epoch": 6765} {"train_loss": -27.951324462890625, "global_step": 561519, "epoch": 6765} {"train_loss": -27.5048885345459, "global_step": 561520, "epoch": 6765} {"train_loss": -27.986780166625977, "global_step": 561521, "epoch": 6765} {"train_loss": -27.83221435546875, "global_step": 561522, "epoch": 6765} {"train_loss": -27.680490493774414, "global_step": 561523, "epoch": 6765} {"train_loss": -27.576208114624023, "global_step": 561524, "epoch": 6765} {"train_loss": -27.75189781188965, "global_step": 561525, "epoch": 6765} {"train_loss": -27.95285415649414, "global_step": 561526, "epoch": 6765} {"train_loss": -27.911954879760742, "global_step": 561527, "epoch": 6765} {"train_loss": -27.640661239624023, "global_step": 561528, "epoch": 6765} {"train_loss": -27.86089515686035, "global_step": 561529, "epoch": 6765} {"train_loss": -27.620346069335938, "global_step": 561530, "epoch": 6765} {"train_loss": -27.981870651245117, "global_step": 561531, "epoch": 6765} {"train_loss": -28.257688522338867, "global_step": 561532, "epoch": 6765} {"train_loss": -27.87117576599121, "global_step": 561533, "epoch": 6765} {"train_loss": -27.724853515625, "global_step": 561534, "epoch": 6765} {"train_loss": -28.151351928710938, "global_step": 561535, "epoch": 6765} {"train_loss": -27.78428077697754, "global_step": 561536, "epoch": 6765} {"train_loss": -27.863500595092773, "global_step": 561537, "epoch": 6765} {"train_loss": -27.871082305908203, "global_step": 561538, "epoch": 6765} {"train_loss": -27.704376220703125, "global_step": 561539, "epoch": 6765} {"train_loss": -27.94611930847168, "global_step": 561540, "epoch": 6765} {"train_loss": -28.06525230407715, "global_step": 561541, "epoch": 6765} {"train_loss": -27.859100341796875, "global_step": 561542, "epoch": 6765} {"train_loss": -27.566125869750977, "global_step": 561543, "epoch": 6765} {"train_loss": -28.15399742126465, "global_step": 561544, "epoch": 6765} {"train_loss": -27.855695724487305, "global_step": 561545, "epoch": 6765} {"train_loss": -28.2263240814209, "global_step": 561546, "epoch": 6765} {"train_loss": -28.119714736938477, "global_step": 561547, "epoch": 6765} {"train_loss": -28.03346061706543, "global_step": 561548, "epoch": 6765} {"train_loss": -27.88592529296875, "global_step": 561549, "epoch": 6765} {"train_loss": -28.02839469909668, "global_step": 561550, "epoch": 6765} {"train_loss": -27.792348861694336, "global_step": 561551, "epoch": 6765} {"train_loss": -27.954710006713867, "global_step": 561552, "epoch": 6765} {"train_loss": -27.93808364868164, "global_step": 561553, "epoch": 6765} {"train_loss": -27.263940811157227, "global_step": 561554, "epoch": 6765} {"train_loss": -26.513635635375977, "global_step": 561555, "epoch": 6765} {"train_loss": -27.602521896362305, "global_step": 561556, "epoch": 6765} {"train_loss": -27.941455841064453, "global_step": 561557, "epoch": 6765} {"train_loss": -27.778553009033203, "global_step": 561558, "epoch": 6765} {"train_loss": -27.342090606689453, "global_step": 561559, "epoch": 6765} {"train_loss": -27.36091423034668, "global_step": 561560, "epoch": 6765} {"train_loss": -27.200693130493164, "global_step": 561561, "epoch": 6765} {"train_loss": -27.40186882019043, "global_step": 561562, "epoch": 6765} {"train_loss": -27.94597816467285, "global_step": 561563, "epoch": 6765} {"train_loss": -27.625707626342773, "global_step": 561564, "epoch": 6765} {"train_loss": -28.078388214111328, "global_step": 561565, "epoch": 6765} {"train_loss": -27.855451583862305, "global_step": 561566, "epoch": 6765} {"train_loss": -27.703784942626953, "global_step": 561567, "epoch": 6765} {"train_loss": -27.374378204345703, "global_step": 561568, "epoch": 6765} {"train_loss": -28.067066192626953, "global_step": 561569, "epoch": 6765} {"train_loss": -27.016809463500977, "global_step": 561570, "epoch": 6765} {"train_loss": -27.43001365661621, "global_step": 561571, "epoch": 6765} {"train_loss": -27.797168731689453, "global_step": 561572, "epoch": 6765} {"train_loss": -27.228595733642578, "global_step": 561573, "epoch": 6765} {"train_loss": -27.577314376831055, "global_step": 561574, "epoch": 6765} {"train_loss": -27.477264404296875, "global_step": 561575, "epoch": 6765} {"train_loss": -27.715213775634766, "global_step": 561576, "epoch": 6765} {"train_loss": -27.612423080995857, "global_step": 561577, "epoch": 6765, "val_loss": 6433380.0} {"train_loss": -27.978759765625, "global_step": 561578, "epoch": 6766} {"train_loss": -27.954742431640625, "global_step": 561579, "epoch": 6766} {"train_loss": -27.534826278686523, "global_step": 561580, "epoch": 6766} {"train_loss": -27.34418296813965, "global_step": 561581, "epoch": 6766} {"train_loss": -27.606979370117188, "global_step": 561582, "epoch": 6766} {"train_loss": -27.721708297729492, "global_step": 561583, "epoch": 6766} {"train_loss": -27.791492462158203, "global_step": 561584, "epoch": 6766} {"train_loss": -28.06147575378418, "global_step": 561585, "epoch": 6766} {"train_loss": -27.68097496032715, "global_step": 561586, "epoch": 6766} {"train_loss": -27.682836532592773, "global_step": 561587, "epoch": 6766} {"train_loss": -27.488712310791016, "global_step": 561588, "epoch": 6766} {"train_loss": -27.630172729492188, "global_step": 561589, "epoch": 6766} {"train_loss": -27.8123722076416, "global_step": 561590, "epoch": 6766} {"train_loss": -27.83119773864746, "global_step": 561591, "epoch": 6766} {"train_loss": -27.290607452392578, "global_step": 561592, "epoch": 6766} {"train_loss": -27.293615341186523, "global_step": 561593, "epoch": 6766} {"train_loss": -27.790319442749023, "global_step": 561594, "epoch": 6766} {"train_loss": -27.90779685974121, "global_step": 561595, "epoch": 6766} {"train_loss": -27.989471435546875, "global_step": 561596, "epoch": 6766} {"train_loss": -27.49622917175293, "global_step": 561597, "epoch": 6766} {"train_loss": -27.54638671875, "global_step": 561598, "epoch": 6766} {"train_loss": -27.8743896484375, "global_step": 561599, "epoch": 6766} {"train_loss": -27.455717086791992, "global_step": 561600, "epoch": 6766} {"train_loss": -27.91259765625, "global_step": 561601, "epoch": 6766} {"train_loss": -27.46821403503418, "global_step": 561602, "epoch": 6766} {"train_loss": -27.37337303161621, "global_step": 561603, "epoch": 6766} {"train_loss": -27.54509925842285, "global_step": 561604, "epoch": 6766} {"train_loss": -28.076013565063477, "global_step": 561605, "epoch": 6766} {"train_loss": -27.113861083984375, "global_step": 561606, "epoch": 6766} {"train_loss": -27.93691062927246, "global_step": 561607, "epoch": 6766} {"train_loss": -27.340734481811523, "global_step": 561608, "epoch": 6766} {"train_loss": -27.597692489624023, "global_step": 561609, "epoch": 6766} {"train_loss": -27.63702964782715, "global_step": 561610, "epoch": 6766} {"train_loss": -28.031354904174805, "global_step": 561611, "epoch": 6766} {"train_loss": -28.052061080932617, "global_step": 561612, "epoch": 6766} {"train_loss": -27.9883975982666, "global_step": 561613, "epoch": 6766} {"train_loss": -27.833850860595703, "global_step": 561614, "epoch": 6766} {"train_loss": -28.17953872680664, "global_step": 561615, "epoch": 6766} {"train_loss": -28.1926326751709, "global_step": 561616, "epoch": 6766} {"train_loss": -27.846389770507812, "global_step": 561617, "epoch": 6766} {"train_loss": -27.876920700073242, "global_step": 561618, "epoch": 6766} {"train_loss": -27.766698837280273, "global_step": 561619, "epoch": 6766} {"train_loss": -27.70166015625, "global_step": 561620, "epoch": 6766} {"train_loss": -27.6669864654541, "global_step": 561621, "epoch": 6766} {"train_loss": -28.290109634399414, "global_step": 561622, "epoch": 6766} {"train_loss": -28.022296905517578, "global_step": 561623, "epoch": 6766} {"train_loss": -28.34393310546875, "global_step": 561624, "epoch": 6766} {"train_loss": -27.83489418029785, "global_step": 561625, "epoch": 6766} {"train_loss": -27.801239013671875, "global_step": 561626, "epoch": 6766} {"train_loss": -28.03403663635254, "global_step": 561627, "epoch": 6766} {"train_loss": -27.98406410217285, "global_step": 561628, "epoch": 6766} {"train_loss": -27.997882843017578, "global_step": 561629, "epoch": 6766} {"train_loss": -27.930707931518555, "global_step": 561630, "epoch": 6766} {"train_loss": -27.9182186126709, "global_step": 561631, "epoch": 6766} {"train_loss": -28.153076171875, "global_step": 561632, "epoch": 6766} {"train_loss": -28.198041915893555, "global_step": 561633, "epoch": 6766} {"train_loss": -27.754077911376953, "global_step": 561634, "epoch": 6766} {"train_loss": -28.04657554626465, "global_step": 561635, "epoch": 6766} {"train_loss": -27.960424423217773, "global_step": 561636, "epoch": 6766} {"train_loss": -27.692224502563477, "global_step": 561637, "epoch": 6766} {"train_loss": -27.563268661499023, "global_step": 561638, "epoch": 6766} {"train_loss": -27.83807373046875, "global_step": 561639, "epoch": 6766} {"train_loss": -27.906015396118164, "global_step": 561640, "epoch": 6766} {"train_loss": -27.07280921936035, "global_step": 561641, "epoch": 6766} {"train_loss": -27.512182235717773, "global_step": 561642, "epoch": 6766} {"train_loss": -27.936847686767578, "global_step": 561643, "epoch": 6766} {"train_loss": -27.769071578979492, "global_step": 561644, "epoch": 6766} {"train_loss": -27.28460693359375, "global_step": 561645, "epoch": 6766} {"train_loss": -27.692733764648438, "global_step": 561646, "epoch": 6766} {"train_loss": -27.70721435546875, "global_step": 561647, "epoch": 6766} {"train_loss": -28.390405654907227, "global_step": 561648, "epoch": 6766} {"train_loss": -27.964431762695312, "global_step": 561649, "epoch": 6766} {"train_loss": -27.330163955688477, "global_step": 561650, "epoch": 6766} {"train_loss": -27.63861083984375, "global_step": 561651, "epoch": 6766} {"train_loss": -27.555341720581055, "global_step": 561652, "epoch": 6766} {"train_loss": -27.470779418945312, "global_step": 561653, "epoch": 6766} {"train_loss": -27.698041915893555, "global_step": 561654, "epoch": 6766} {"train_loss": -27.591022491455078, "global_step": 561655, "epoch": 6766} {"train_loss": -27.757831573486328, "global_step": 561656, "epoch": 6766} {"train_loss": -27.65988540649414, "global_step": 561657, "epoch": 6766} {"train_loss": -27.94647216796875, "global_step": 561658, "epoch": 6766} {"train_loss": -28.020374298095703, "global_step": 561659, "epoch": 6766} {"train_loss": -27.7809560155294, "global_step": 561660, "epoch": 6766, "val_loss": 6433447.0} {"train_loss": -26.796873092651367, "global_step": 561661, "epoch": 6767} {"train_loss": -27.06292724609375, "global_step": 561662, "epoch": 6767} {"train_loss": -27.159879684448242, "global_step": 561663, "epoch": 6767} {"train_loss": -27.86077308654785, "global_step": 561664, "epoch": 6767} {"train_loss": -27.044519424438477, "global_step": 561665, "epoch": 6767} {"train_loss": -27.4781436920166, "global_step": 561666, "epoch": 6767} {"train_loss": -27.8159236907959, "global_step": 561667, "epoch": 6767} {"train_loss": -27.589059829711914, "global_step": 561668, "epoch": 6767} {"train_loss": -27.502710342407227, "global_step": 561669, "epoch": 6767} {"train_loss": -27.470773696899414, "global_step": 561670, "epoch": 6767} {"train_loss": -27.419544219970703, "global_step": 561671, "epoch": 6767} {"train_loss": -27.25027847290039, "global_step": 561672, "epoch": 6767} {"train_loss": -27.4057559967041, "global_step": 561673, "epoch": 6767} {"train_loss": -27.592212677001953, "global_step": 561674, "epoch": 6767} {"train_loss": -27.321136474609375, "global_step": 561675, "epoch": 6767} {"train_loss": -27.76376724243164, "global_step": 561676, "epoch": 6767} {"train_loss": -27.709869384765625, "global_step": 561677, "epoch": 6767} {"train_loss": -27.236459732055664, "global_step": 561678, "epoch": 6767} {"train_loss": -27.628360748291016, "global_step": 561679, "epoch": 6767} {"train_loss": -27.938846588134766, "global_step": 561680, "epoch": 6767} {"train_loss": -27.6389102935791, "global_step": 561681, "epoch": 6767} {"train_loss": -27.728986740112305, "global_step": 561682, "epoch": 6767} {"train_loss": -27.861881256103516, "global_step": 561683, "epoch": 6767} {"train_loss": -27.80640983581543, "global_step": 561684, "epoch": 6767} {"train_loss": -27.750165939331055, "global_step": 561685, "epoch": 6767} {"train_loss": -28.093902587890625, "global_step": 561686, "epoch": 6767} {"train_loss": -27.950958251953125, "global_step": 561687, "epoch": 6767} {"train_loss": -27.589139938354492, "global_step": 561688, "epoch": 6767} {"train_loss": -27.824146270751953, "global_step": 561689, "epoch": 6767} {"train_loss": -27.616485595703125, "global_step": 561690, "epoch": 6767} {"train_loss": -27.65833854675293, "global_step": 561691, "epoch": 6767} {"train_loss": -27.6370849609375, "global_step": 561692, "epoch": 6767} {"train_loss": -27.96378517150879, "global_step": 561693, "epoch": 6767} {"train_loss": -27.834552764892578, "global_step": 561694, "epoch": 6767} {"train_loss": -27.613300323486328, "global_step": 561695, "epoch": 6767} {"train_loss": -27.73658561706543, "global_step": 561696, "epoch": 6767} {"train_loss": -27.885526657104492, "global_step": 561697, "epoch": 6767} {"train_loss": -28.0958309173584, "global_step": 561698, "epoch": 6767} {"train_loss": -27.71407127380371, "global_step": 561699, "epoch": 6767} {"train_loss": -27.75605583190918, "global_step": 561700, "epoch": 6767} {"train_loss": -27.817462921142578, "global_step": 561701, "epoch": 6767} {"train_loss": -27.460615158081055, "global_step": 561702, "epoch": 6767} {"train_loss": -27.5374698638916, "global_step": 561703, "epoch": 6767} {"train_loss": -27.530668258666992, "global_step": 561704, "epoch": 6767} {"train_loss": -28.043720245361328, "global_step": 561705, "epoch": 6767} {"train_loss": -27.81658935546875, "global_step": 561706, "epoch": 6767} {"train_loss": -27.574377059936523, "global_step": 561707, "epoch": 6767} {"train_loss": -27.57496452331543, "global_step": 561708, "epoch": 6767} {"train_loss": -28.045047760009766, "global_step": 561709, "epoch": 6767} {"train_loss": -27.6671199798584, "global_step": 561710, "epoch": 6767} {"train_loss": -28.012943267822266, "global_step": 561711, "epoch": 6767} {"train_loss": -27.315631866455078, "global_step": 561712, "epoch": 6767} {"train_loss": -28.000030517578125, "global_step": 561713, "epoch": 6767} {"train_loss": -27.862207412719727, "global_step": 561714, "epoch": 6767} {"train_loss": -27.99567222595215, "global_step": 561715, "epoch": 6767} {"train_loss": -27.378437042236328, "global_step": 561716, "epoch": 6767} {"train_loss": -28.119464874267578, "global_step": 561717, "epoch": 6767} {"train_loss": -27.933395385742188, "global_step": 561718, "epoch": 6767} {"train_loss": -27.73919677734375, "global_step": 561719, "epoch": 6767} {"train_loss": -27.9353084564209, "global_step": 561720, "epoch": 6767} {"train_loss": -27.489538192749023, "global_step": 561721, "epoch": 6767} {"train_loss": -27.67840003967285, "global_step": 561722, "epoch": 6767} {"train_loss": -28.056421279907227, "global_step": 561723, "epoch": 6767} {"train_loss": -27.955846786499023, "global_step": 561724, "epoch": 6767} {"train_loss": -28.061681747436523, "global_step": 561725, "epoch": 6767} {"train_loss": -27.71808433532715, "global_step": 561726, "epoch": 6767} {"train_loss": -27.768848419189453, "global_step": 561727, "epoch": 6767} {"train_loss": -27.60310935974121, "global_step": 561728, "epoch": 6767} {"train_loss": -27.77381706237793, "global_step": 561729, "epoch": 6767} {"train_loss": -27.985822677612305, "global_step": 561730, "epoch": 6767} {"train_loss": -28.009204864501953, "global_step": 561731, "epoch": 6767} {"train_loss": -27.4829044342041, "global_step": 561732, "epoch": 6767} {"train_loss": -27.646625518798828, "global_step": 561733, "epoch": 6767} {"train_loss": -27.893463134765625, "global_step": 561734, "epoch": 6767} {"train_loss": -27.92236328125, "global_step": 561735, "epoch": 6767} {"train_loss": -27.699243545532227, "global_step": 561736, "epoch": 6767} {"train_loss": -27.708560943603516, "global_step": 561737, "epoch": 6767} {"train_loss": -27.855215072631836, "global_step": 561738, "epoch": 6767} {"train_loss": -27.570581436157227, "global_step": 561739, "epoch": 6767} {"train_loss": -27.587255477905273, "global_step": 561740, "epoch": 6767} {"train_loss": -27.872669219970703, "global_step": 561741, "epoch": 6767} {"train_loss": -27.955951690673828, "global_step": 561742, "epoch": 6767} {"train_loss": -27.705385805612586, "global_step": 561743, "epoch": 6767, "val_loss": 6435444.0} {"train_loss": -26.453458786010742, "global_step": 561744, "epoch": 6768} {"train_loss": -26.388456344604492, "global_step": 561745, "epoch": 6768} {"train_loss": -27.642196655273438, "global_step": 561746, "epoch": 6768} {"train_loss": -27.027734756469727, "global_step": 561747, "epoch": 6768} {"train_loss": -26.041601181030273, "global_step": 561748, "epoch": 6768} {"train_loss": -26.88739585876465, "global_step": 561749, "epoch": 6768} {"train_loss": -26.968677520751953, "global_step": 561750, "epoch": 6768} {"train_loss": -27.34125328063965, "global_step": 561751, "epoch": 6768} {"train_loss": -27.05232048034668, "global_step": 561752, "epoch": 6768} {"train_loss": -27.378326416015625, "global_step": 561753, "epoch": 6768} {"train_loss": -27.280630111694336, "global_step": 561754, "epoch": 6768} {"train_loss": -27.48810386657715, "global_step": 561755, "epoch": 6768} {"train_loss": -27.423603057861328, "global_step": 561756, "epoch": 6768} {"train_loss": -27.515119552612305, "global_step": 561757, "epoch": 6768} {"train_loss": -27.21368408203125, "global_step": 561758, "epoch": 6768} {"train_loss": -27.327856063842773, "global_step": 561759, "epoch": 6768} {"train_loss": -27.72979164123535, "global_step": 561760, "epoch": 6768} {"train_loss": -27.556610107421875, "global_step": 561761, "epoch": 6768} {"train_loss": -27.870853424072266, "global_step": 561762, "epoch": 6768} {"train_loss": -27.43375015258789, "global_step": 561763, "epoch": 6768} {"train_loss": -27.67987632751465, "global_step": 561764, "epoch": 6768} {"train_loss": -27.5402889251709, "global_step": 561765, "epoch": 6768} {"train_loss": -27.40912437438965, "global_step": 561766, "epoch": 6768} {"train_loss": -27.379648208618164, "global_step": 561767, "epoch": 6768} {"train_loss": -27.60639762878418, "global_step": 561768, "epoch": 6768} {"train_loss": -27.5617618560791, "global_step": 561769, "epoch": 6768} {"train_loss": -27.8580379486084, "global_step": 561770, "epoch": 6768} {"train_loss": -27.832860946655273, "global_step": 561771, "epoch": 6768} {"train_loss": -27.9677734375, "global_step": 561772, "epoch": 6768} {"train_loss": -27.672712326049805, "global_step": 561773, "epoch": 6768} {"train_loss": -27.785125732421875, "global_step": 561774, "epoch": 6768} {"train_loss": -27.675634384155273, "global_step": 561775, "epoch": 6768} {"train_loss": -27.94049644470215, "global_step": 561776, "epoch": 6768} {"train_loss": -27.83056640625, "global_step": 561777, "epoch": 6768} {"train_loss": -27.982776641845703, "global_step": 561778, "epoch": 6768} {"train_loss": -28.018558502197266, "global_step": 561779, "epoch": 6768} {"train_loss": -28.075300216674805, "global_step": 561780, "epoch": 6768} {"train_loss": -27.792959213256836, "global_step": 561781, "epoch": 6768} {"train_loss": -27.60206413269043, "global_step": 561782, "epoch": 6768} {"train_loss": -27.94952964782715, "global_step": 561783, "epoch": 6768} {"train_loss": -28.057361602783203, "global_step": 561784, "epoch": 6768} {"train_loss": -27.835718154907227, "global_step": 561785, "epoch": 6768} {"train_loss": -28.023962020874023, "global_step": 561786, "epoch": 6768} {"train_loss": -28.12066650390625, "global_step": 561787, "epoch": 6768} {"train_loss": -28.179059982299805, "global_step": 561788, "epoch": 6768} {"train_loss": -27.811559677124023, "global_step": 561789, "epoch": 6768} {"train_loss": -27.99903678894043, "global_step": 561790, "epoch": 6768} {"train_loss": -27.868314743041992, "global_step": 561791, "epoch": 6768} {"train_loss": -27.786344528198242, "global_step": 561792, "epoch": 6768} {"train_loss": -27.957605361938477, "global_step": 561793, "epoch": 6768} {"train_loss": -27.649076461791992, "global_step": 561794, "epoch": 6768} {"train_loss": -27.606678009033203, "global_step": 561795, "epoch": 6768} {"train_loss": -27.64127540588379, "global_step": 561796, "epoch": 6768} {"train_loss": -27.619169235229492, "global_step": 561797, "epoch": 6768} {"train_loss": -27.538562774658203, "global_step": 561798, "epoch": 6768} {"train_loss": -27.582311630249023, "global_step": 561799, "epoch": 6768} {"train_loss": -27.56275749206543, "global_step": 561800, "epoch": 6768} {"train_loss": -28.080469131469727, "global_step": 561801, "epoch": 6768} {"train_loss": -27.923383712768555, "global_step": 561802, "epoch": 6768} {"train_loss": -27.350454330444336, "global_step": 561803, "epoch": 6768} {"train_loss": -27.39923095703125, "global_step": 561804, "epoch": 6768} {"train_loss": -27.401905059814453, "global_step": 561805, "epoch": 6768} {"train_loss": -27.53970718383789, "global_step": 561806, "epoch": 6768} {"train_loss": -27.6874942779541, "global_step": 561807, "epoch": 6768} {"train_loss": -26.902189254760742, "global_step": 561808, "epoch": 6768} {"train_loss": -27.548730850219727, "global_step": 561809, "epoch": 6768} {"train_loss": -27.832061767578125, "global_step": 561810, "epoch": 6768} {"train_loss": -27.564661026000977, "global_step": 561811, "epoch": 6768} {"train_loss": -27.48737144470215, "global_step": 561812, "epoch": 6768} {"train_loss": -27.436527252197266, "global_step": 561813, "epoch": 6768} {"train_loss": -28.014307022094727, "global_step": 561814, "epoch": 6768} {"train_loss": -27.431472778320312, "global_step": 561815, "epoch": 6768} {"train_loss": -27.74531364440918, "global_step": 561816, "epoch": 6768} {"train_loss": -27.354156494140625, "global_step": 561817, "epoch": 6768} {"train_loss": -27.683019638061523, "global_step": 561818, "epoch": 6768} {"train_loss": -27.711395263671875, "global_step": 561819, "epoch": 6768} {"train_loss": -27.592687606811523, "global_step": 561820, "epoch": 6768} {"train_loss": -27.953189849853516, "global_step": 561821, "epoch": 6768} {"train_loss": -27.87473487854004, "global_step": 561822, "epoch": 6768} {"train_loss": -27.707666397094727, "global_step": 561823, "epoch": 6768} {"train_loss": -27.9956111907959, "global_step": 561824, "epoch": 6768} {"train_loss": -27.865964889526367, "global_step": 561825, "epoch": 6768} {"train_loss": -27.600558108594043, "global_step": 561826, "epoch": 6768, "val_loss": 6395938.0} {"train_loss": -27.214969635009766, "global_step": 561827, "epoch": 6769} {"train_loss": -27.6458797454834, "global_step": 561828, "epoch": 6769} {"train_loss": -27.79080581665039, "global_step": 561829, "epoch": 6769} {"train_loss": -27.78472328186035, "global_step": 561830, "epoch": 6769} {"train_loss": -27.578336715698242, "global_step": 561831, "epoch": 6769} {"train_loss": -28.02302360534668, "global_step": 561832, "epoch": 6769} {"train_loss": -28.03669548034668, "global_step": 561833, "epoch": 6769} {"train_loss": -27.925704956054688, "global_step": 561834, "epoch": 6769} {"train_loss": -27.708911895751953, "global_step": 561835, "epoch": 6769} {"train_loss": -27.763898849487305, "global_step": 561836, "epoch": 6769} {"train_loss": -27.833410263061523, "global_step": 561837, "epoch": 6769} {"train_loss": -27.828466415405273, "global_step": 561838, "epoch": 6769} {"train_loss": -27.84384536743164, "global_step": 561839, "epoch": 6769} {"train_loss": -27.578149795532227, "global_step": 561840, "epoch": 6769} {"train_loss": -28.011320114135742, "global_step": 561841, "epoch": 6769} {"train_loss": -27.825809478759766, "global_step": 561842, "epoch": 6769} {"train_loss": -27.7049617767334, "global_step": 561843, "epoch": 6769} {"train_loss": -27.654767990112305, "global_step": 561844, "epoch": 6769} {"train_loss": -28.152740478515625, "global_step": 561845, "epoch": 6769} {"train_loss": -28.016284942626953, "global_step": 561846, "epoch": 6769} {"train_loss": -27.779438018798828, "global_step": 561847, "epoch": 6769} {"train_loss": -28.166330337524414, "global_step": 561848, "epoch": 6769} {"train_loss": -27.91790771484375, "global_step": 561849, "epoch": 6769} {"train_loss": -28.051105499267578, "global_step": 561850, "epoch": 6769} {"train_loss": -27.91029167175293, "global_step": 561851, "epoch": 6769} {"train_loss": -27.86060905456543, "global_step": 561852, "epoch": 6769} {"train_loss": -27.854034423828125, "global_step": 561853, "epoch": 6769} {"train_loss": -27.715559005737305, "global_step": 561854, "epoch": 6769} {"train_loss": -28.013086318969727, "global_step": 561855, "epoch": 6769} {"train_loss": -27.828893661499023, "global_step": 561856, "epoch": 6769} {"train_loss": -27.94190788269043, "global_step": 561857, "epoch": 6769} {"train_loss": -27.952381134033203, "global_step": 561858, "epoch": 6769} {"train_loss": -27.847644805908203, "global_step": 561859, "epoch": 6769} {"train_loss": -27.859094619750977, "global_step": 561860, "epoch": 6769} {"train_loss": -27.670751571655273, "global_step": 561861, "epoch": 6769} {"train_loss": -27.417831420898438, "global_step": 561862, "epoch": 6769} {"train_loss": -27.76824378967285, "global_step": 561863, "epoch": 6769} {"train_loss": -27.742231369018555, "global_step": 561864, "epoch": 6769} {"train_loss": -28.035125732421875, "global_step": 561865, "epoch": 6769} {"train_loss": -27.484180450439453, "global_step": 561866, "epoch": 6769} {"train_loss": -27.64374351501465, "global_step": 561867, "epoch": 6769} {"train_loss": -27.2684268951416, "global_step": 561868, "epoch": 6769} {"train_loss": -27.65032386779785, "global_step": 561869, "epoch": 6769} {"train_loss": -27.981698989868164, "global_step": 561870, "epoch": 6769} {"train_loss": -27.654769897460938, "global_step": 561871, "epoch": 6769} {"train_loss": -27.501514434814453, "global_step": 561872, "epoch": 6769} {"train_loss": -27.529727935791016, "global_step": 561873, "epoch": 6769} {"train_loss": -27.908905029296875, "global_step": 561874, "epoch": 6769} {"train_loss": -27.951251983642578, "global_step": 561875, "epoch": 6769} {"train_loss": -27.399930953979492, "global_step": 561876, "epoch": 6769} {"train_loss": -27.80303382873535, "global_step": 561877, "epoch": 6769} {"train_loss": -27.88248062133789, "global_step": 561878, "epoch": 6769} {"train_loss": -27.772146224975586, "global_step": 561879, "epoch": 6769} {"train_loss": -27.481372833251953, "global_step": 561880, "epoch": 6769} {"train_loss": -27.88160514831543, "global_step": 561881, "epoch": 6769} {"train_loss": -27.833791732788086, "global_step": 561882, "epoch": 6769} {"train_loss": -27.773792266845703, "global_step": 561883, "epoch": 6769} {"train_loss": -27.811872482299805, "global_step": 561884, "epoch": 6769} {"train_loss": -27.682111740112305, "global_step": 561885, "epoch": 6769} {"train_loss": -27.773151397705078, "global_step": 561886, "epoch": 6769} {"train_loss": -27.821523666381836, "global_step": 561887, "epoch": 6769} {"train_loss": -28.145849227905273, "global_step": 561888, "epoch": 6769} {"train_loss": -27.680166244506836, "global_step": 561889, "epoch": 6769} {"train_loss": -27.406497955322266, "global_step": 561890, "epoch": 6769} {"train_loss": -27.563695907592773, "global_step": 561891, "epoch": 6769} {"train_loss": -27.91683006286621, "global_step": 561892, "epoch": 6769} {"train_loss": -27.740161895751953, "global_step": 561893, "epoch": 6769} {"train_loss": -27.839948654174805, "global_step": 561894, "epoch": 6769} {"train_loss": -27.51948356628418, "global_step": 561895, "epoch": 6769} {"train_loss": -28.031293869018555, "global_step": 561896, "epoch": 6769} {"train_loss": -27.86460304260254, "global_step": 561897, "epoch": 6769} {"train_loss": -28.027109146118164, "global_step": 561898, "epoch": 6769} {"train_loss": -27.6695613861084, "global_step": 561899, "epoch": 6769} {"train_loss": -27.882293701171875, "global_step": 561900, "epoch": 6769} {"train_loss": -28.071786880493164, "global_step": 561901, "epoch": 6769} {"train_loss": -28.124408721923828, "global_step": 561902, "epoch": 6769} {"train_loss": -27.997446060180664, "global_step": 561903, "epoch": 6769} {"train_loss": -28.171783447265625, "global_step": 561904, "epoch": 6769} {"train_loss": -27.919652938842773, "global_step": 561905, "epoch": 6769} {"train_loss": -28.122114181518555, "global_step": 561906, "epoch": 6769} {"train_loss": -27.558385848999023, "global_step": 561907, "epoch": 6769} {"train_loss": -28.072357177734375, "global_step": 561908, "epoch": 6769} {"train_loss": -27.786816102912628, "global_step": 561909, "epoch": 6769, "val_loss": 6389368.5} {"train_loss": -27.376672744750977, "global_step": 561910, "epoch": 6770} {"train_loss": -27.405658721923828, "global_step": 561911, "epoch": 6770} {"train_loss": -27.319534301757812, "global_step": 561912, "epoch": 6770} {"train_loss": -27.171228408813477, "global_step": 561913, "epoch": 6770} {"train_loss": -27.151782989501953, "global_step": 561914, "epoch": 6770} {"train_loss": -27.506208419799805, "global_step": 561915, "epoch": 6770} {"train_loss": -26.934019088745117, "global_step": 561916, "epoch": 6770} {"train_loss": -26.8422908782959, "global_step": 561917, "epoch": 6770} {"train_loss": -27.72316551208496, "global_step": 561918, "epoch": 6770} {"train_loss": -27.848474502563477, "global_step": 561919, "epoch": 6770} {"train_loss": -27.23661231994629, "global_step": 561920, "epoch": 6770} {"train_loss": -27.455350875854492, "global_step": 561921, "epoch": 6770} {"train_loss": -27.365619659423828, "global_step": 561922, "epoch": 6770} {"train_loss": -27.50483512878418, "global_step": 561923, "epoch": 6770} {"train_loss": -27.517560958862305, "global_step": 561924, "epoch": 6770} {"train_loss": -27.566980361938477, "global_step": 561925, "epoch": 6770} {"train_loss": -27.33876609802246, "global_step": 561926, "epoch": 6770} {"train_loss": -27.592206954956055, "global_step": 561927, "epoch": 6770} {"train_loss": -27.129892349243164, "global_step": 561928, "epoch": 6770} {"train_loss": -27.466419219970703, "global_step": 561929, "epoch": 6770} {"train_loss": -27.663782119750977, "global_step": 561930, "epoch": 6770} {"train_loss": -27.67462158203125, "global_step": 561931, "epoch": 6770} {"train_loss": -27.628097534179688, "global_step": 561932, "epoch": 6770} {"train_loss": -27.48492431640625, "global_step": 561933, "epoch": 6770} {"train_loss": -27.92438316345215, "global_step": 561934, "epoch": 6770} {"train_loss": -28.195016860961914, "global_step": 561935, "epoch": 6770} {"train_loss": -27.652856826782227, "global_step": 561936, "epoch": 6770} {"train_loss": -27.658374786376953, "global_step": 561937, "epoch": 6770} {"train_loss": -27.283666610717773, "global_step": 561938, "epoch": 6770} {"train_loss": -28.19843101501465, "global_step": 561939, "epoch": 6770} {"train_loss": -27.476856231689453, "global_step": 561940, "epoch": 6770} {"train_loss": -27.399124145507812, "global_step": 561941, "epoch": 6770} {"train_loss": -27.75319480895996, "global_step": 561942, "epoch": 6770} {"train_loss": -28.206430435180664, "global_step": 561943, "epoch": 6770} {"train_loss": -27.621252059936523, "global_step": 561944, "epoch": 6770} {"train_loss": -28.24212074279785, "global_step": 561945, "epoch": 6770} {"train_loss": -27.8164005279541, "global_step": 561946, "epoch": 6770} {"train_loss": -27.870498657226562, "global_step": 561947, "epoch": 6770} {"train_loss": -27.942163467407227, "global_step": 561948, "epoch": 6770} {"train_loss": -27.58977699279785, "global_step": 561949, "epoch": 6770} {"train_loss": -27.910614013671875, "global_step": 561950, "epoch": 6770} {"train_loss": -27.64032554626465, "global_step": 561951, "epoch": 6770} {"train_loss": -27.81410026550293, "global_step": 561952, "epoch": 6770} {"train_loss": -27.855993270874023, "global_step": 561953, "epoch": 6770} {"train_loss": -27.922107696533203, "global_step": 561954, "epoch": 6770} {"train_loss": -27.905719757080078, "global_step": 561955, "epoch": 6770} {"train_loss": -27.784311294555664, "global_step": 561956, "epoch": 6770} {"train_loss": -27.749603271484375, "global_step": 561957, "epoch": 6770} {"train_loss": -28.167078018188477, "global_step": 561958, "epoch": 6770} {"train_loss": -27.733112335205078, "global_step": 561959, "epoch": 6770} {"train_loss": -27.813873291015625, "global_step": 561960, "epoch": 6770} {"train_loss": -27.963525772094727, "global_step": 561961, "epoch": 6770} {"train_loss": -27.703893661499023, "global_step": 561962, "epoch": 6770} {"train_loss": -27.147748947143555, "global_step": 561963, "epoch": 6770} {"train_loss": -27.183155059814453, "global_step": 561964, "epoch": 6770} {"train_loss": -26.67156410217285, "global_step": 561965, "epoch": 6770} {"train_loss": -27.40138053894043, "global_step": 561966, "epoch": 6770} {"train_loss": -27.817977905273438, "global_step": 561967, "epoch": 6770} {"train_loss": -27.844024658203125, "global_step": 561968, "epoch": 6770} {"train_loss": -27.583160400390625, "global_step": 561969, "epoch": 6770} {"train_loss": -27.915674209594727, "global_step": 561970, "epoch": 6770} {"train_loss": -28.109079360961914, "global_step": 561971, "epoch": 6770} {"train_loss": -28.24017333984375, "global_step": 561972, "epoch": 6770} {"train_loss": -27.6569766998291, "global_step": 561973, "epoch": 6770} {"train_loss": -27.863540649414062, "global_step": 561974, "epoch": 6770} {"train_loss": -27.795541763305664, "global_step": 561975, "epoch": 6770} {"train_loss": -27.377248764038086, "global_step": 561976, "epoch": 6770} {"train_loss": -28.033788681030273, "global_step": 561977, "epoch": 6770} {"train_loss": -27.853851318359375, "global_step": 561978, "epoch": 6770} {"train_loss": -27.8062686920166, "global_step": 561979, "epoch": 6770} {"train_loss": -27.7827205657959, "global_step": 561980, "epoch": 6770} {"train_loss": -27.757858276367188, "global_step": 561981, "epoch": 6770} {"train_loss": -27.894804000854492, "global_step": 561982, "epoch": 6770} {"train_loss": -28.23236083984375, "global_step": 561983, "epoch": 6770} {"train_loss": -27.850555419921875, "global_step": 561984, "epoch": 6770} {"train_loss": -27.5228214263916, "global_step": 561985, "epoch": 6770} {"train_loss": -27.380008697509766, "global_step": 561986, "epoch": 6770} {"train_loss": -27.630695343017578, "global_step": 561987, "epoch": 6770} {"train_loss": -27.890501022338867, "global_step": 561988, "epoch": 6770} {"train_loss": -27.901960372924805, "global_step": 561989, "epoch": 6770} {"train_loss": -28.08607292175293, "global_step": 561990, "epoch": 6770} {"train_loss": -28.183887481689453, "global_step": 561991, "epoch": 6770} {"train_loss": -27.672326811824938, "global_step": 561992, "epoch": 6770, "val_loss": 6438583.0} {"train_loss": -27.76776695251465, "global_step": 561993, "epoch": 6771} {"train_loss": -27.55893898010254, "global_step": 561994, "epoch": 6771} {"train_loss": -27.686264038085938, "global_step": 561995, "epoch": 6771} {"train_loss": -27.362354278564453, "global_step": 561996, "epoch": 6771} {"train_loss": -27.22726821899414, "global_step": 561997, "epoch": 6771} {"train_loss": -27.6176815032959, "global_step": 561998, "epoch": 6771} {"train_loss": -27.310230255126953, "global_step": 561999, "epoch": 6771} {"train_loss": -27.82900047302246, "global_step": 562000, "epoch": 6771} {"train_loss": -27.819732666015625, "global_step": 562001, "epoch": 6771} {"train_loss": -27.527013778686523, "global_step": 562002, "epoch": 6771} {"train_loss": -27.391820907592773, "global_step": 562003, "epoch": 6771} {"train_loss": -27.573013305664062, "global_step": 562004, "epoch": 6771} {"train_loss": -27.429718017578125, "global_step": 562005, "epoch": 6771} {"train_loss": -27.551782608032227, "global_step": 562006, "epoch": 6771} {"train_loss": -27.771503448486328, "global_step": 562007, "epoch": 6771} {"train_loss": -27.683401107788086, "global_step": 562008, "epoch": 6771} {"train_loss": -27.583295822143555, "global_step": 562009, "epoch": 6771} {"train_loss": -27.879383087158203, "global_step": 562010, "epoch": 6771} {"train_loss": -27.779592514038086, "global_step": 562011, "epoch": 6771} {"train_loss": -27.627674102783203, "global_step": 562012, "epoch": 6771} {"train_loss": -27.769901275634766, "global_step": 562013, "epoch": 6771} {"train_loss": -27.669164657592773, "global_step": 562014, "epoch": 6771} {"train_loss": -27.710479736328125, "global_step": 562015, "epoch": 6771} {"train_loss": -27.25187110900879, "global_step": 562016, "epoch": 6771} {"train_loss": -27.830549240112305, "global_step": 562017, "epoch": 6771} {"train_loss": -27.424091339111328, "global_step": 562018, "epoch": 6771} {"train_loss": -27.4180965423584, "global_step": 562019, "epoch": 6771} {"train_loss": -27.53171730041504, "global_step": 562020, "epoch": 6771} {"train_loss": -27.757587432861328, "global_step": 562021, "epoch": 6771} {"train_loss": -27.94367027282715, "global_step": 562022, "epoch": 6771} {"train_loss": -27.717350006103516, "global_step": 562023, "epoch": 6771} {"train_loss": -27.50542640686035, "global_step": 562024, "epoch": 6771} {"train_loss": -27.54146385192871, "global_step": 562025, "epoch": 6771} {"train_loss": -28.10678482055664, "global_step": 562026, "epoch": 6771} {"train_loss": -27.4841251373291, "global_step": 562027, "epoch": 6771} {"train_loss": -27.746570587158203, "global_step": 562028, "epoch": 6771} {"train_loss": -28.154632568359375, "global_step": 562029, "epoch": 6771} {"train_loss": -27.616418838500977, "global_step": 562030, "epoch": 6771} {"train_loss": -27.752023696899414, "global_step": 562031, "epoch": 6771} {"train_loss": -27.97490882873535, "global_step": 562032, "epoch": 6771} {"train_loss": -27.78278923034668, "global_step": 562033, "epoch": 6771} {"train_loss": -27.633869171142578, "global_step": 562034, "epoch": 6771} {"train_loss": -27.98493766784668, "global_step": 562035, "epoch": 6771} {"train_loss": -27.713565826416016, "global_step": 562036, "epoch": 6771} {"train_loss": -27.720930099487305, "global_step": 562037, "epoch": 6771} {"train_loss": -28.05561637878418, "global_step": 562038, "epoch": 6771} {"train_loss": -27.793628692626953, "global_step": 562039, "epoch": 6771} {"train_loss": -27.953632354736328, "global_step": 562040, "epoch": 6771} {"train_loss": -27.907672882080078, "global_step": 562041, "epoch": 6771} {"train_loss": -27.883466720581055, "global_step": 562042, "epoch": 6771} {"train_loss": -28.35361671447754, "global_step": 562043, "epoch": 6771} {"train_loss": -28.003925323486328, "global_step": 562044, "epoch": 6771} {"train_loss": -27.932592391967773, "global_step": 562045, "epoch": 6771} {"train_loss": -27.857419967651367, "global_step": 562046, "epoch": 6771} {"train_loss": -27.369861602783203, "global_step": 562047, "epoch": 6771} {"train_loss": -27.557310104370117, "global_step": 562048, "epoch": 6771} {"train_loss": -27.4730224609375, "global_step": 562049, "epoch": 6771} {"train_loss": -27.968326568603516, "global_step": 562050, "epoch": 6771} {"train_loss": -28.182859420776367, "global_step": 562051, "epoch": 6771} {"train_loss": -27.88807487487793, "global_step": 562052, "epoch": 6771} {"train_loss": -27.880374908447266, "global_step": 562053, "epoch": 6771} {"train_loss": -28.080907821655273, "global_step": 562054, "epoch": 6771} {"train_loss": -27.574995040893555, "global_step": 562055, "epoch": 6771} {"train_loss": -27.8726749420166, "global_step": 562056, "epoch": 6771} {"train_loss": -27.421234130859375, "global_step": 562057, "epoch": 6771} {"train_loss": -27.413284301757812, "global_step": 562058, "epoch": 6771} {"train_loss": -27.8005428314209, "global_step": 562059, "epoch": 6771} {"train_loss": -27.486082077026367, "global_step": 562060, "epoch": 6771} {"train_loss": -27.750844955444336, "global_step": 562061, "epoch": 6771} {"train_loss": -27.78315544128418, "global_step": 562062, "epoch": 6771} {"train_loss": -27.840383529663086, "global_step": 562063, "epoch": 6771} {"train_loss": -27.516860961914062, "global_step": 562064, "epoch": 6771} {"train_loss": -28.079980850219727, "global_step": 562065, "epoch": 6771} {"train_loss": -27.67991065979004, "global_step": 562066, "epoch": 6771} {"train_loss": -27.24018669128418, "global_step": 562067, "epoch": 6771} {"train_loss": -27.48307228088379, "global_step": 562068, "epoch": 6771} {"train_loss": -27.3542423248291, "global_step": 562069, "epoch": 6771} {"train_loss": -27.7261962890625, "global_step": 562070, "epoch": 6771} {"train_loss": -27.680418014526367, "global_step": 562071, "epoch": 6771} {"train_loss": -27.72787857055664, "global_step": 562072, "epoch": 6771} {"train_loss": -27.748456954956055, "global_step": 562073, "epoch": 6771} {"train_loss": -27.811233520507812, "global_step": 562074, "epoch": 6771} {"train_loss": -27.7242379935391, "global_step": 562075, "epoch": 6771, "val_loss": 6359483.0} {"train_loss": -27.57151222229004, "global_step": 562076, "epoch": 6772} {"train_loss": -26.82879638671875, "global_step": 562077, "epoch": 6772} {"train_loss": -26.3503360748291, "global_step": 562078, "epoch": 6772} {"train_loss": -26.505781173706055, "global_step": 562079, "epoch": 6772} {"train_loss": -27.31220817565918, "global_step": 562080, "epoch": 6772} {"train_loss": -27.159509658813477, "global_step": 562081, "epoch": 6772} {"train_loss": -26.931549072265625, "global_step": 562082, "epoch": 6772} {"train_loss": -27.086029052734375, "global_step": 562083, "epoch": 6772} {"train_loss": -27.084552764892578, "global_step": 562084, "epoch": 6772} {"train_loss": -27.400182723999023, "global_step": 562085, "epoch": 6772} {"train_loss": -27.578699111938477, "global_step": 562086, "epoch": 6772} {"train_loss": -27.7077693939209, "global_step": 562087, "epoch": 6772} {"train_loss": -27.367034912109375, "global_step": 562088, "epoch": 6772} {"train_loss": -27.824079513549805, "global_step": 562089, "epoch": 6772} {"train_loss": -27.642621994018555, "global_step": 562090, "epoch": 6772} {"train_loss": -27.70159912109375, "global_step": 562091, "epoch": 6772} {"train_loss": -27.7318115234375, "global_step": 562092, "epoch": 6772} {"train_loss": -28.159311294555664, "global_step": 562093, "epoch": 6772} {"train_loss": -27.61128044128418, "global_step": 562094, "epoch": 6772} {"train_loss": -27.796253204345703, "global_step": 562095, "epoch": 6772} {"train_loss": -27.652027130126953, "global_step": 562096, "epoch": 6772} {"train_loss": -27.595487594604492, "global_step": 562097, "epoch": 6772} {"train_loss": -27.51946449279785, "global_step": 562098, "epoch": 6772} {"train_loss": -27.805789947509766, "global_step": 562099, "epoch": 6772} {"train_loss": -27.406843185424805, "global_step": 562100, "epoch": 6772} {"train_loss": -27.367862701416016, "global_step": 562101, "epoch": 6772} {"train_loss": -27.84912109375, "global_step": 562102, "epoch": 6772} {"train_loss": -27.845434188842773, "global_step": 562103, "epoch": 6772} {"train_loss": -28.171255111694336, "global_step": 562104, "epoch": 6772} {"train_loss": -27.938232421875, "global_step": 562105, "epoch": 6772} {"train_loss": -27.884429931640625, "global_step": 562106, "epoch": 6772} {"train_loss": -27.854333877563477, "global_step": 562107, "epoch": 6772} {"train_loss": -27.5751953125, "global_step": 562108, "epoch": 6772} {"train_loss": -28.213855743408203, "global_step": 562109, "epoch": 6772} {"train_loss": -27.97121238708496, "global_step": 562110, "epoch": 6772} {"train_loss": -28.225921630859375, "global_step": 562111, "epoch": 6772} {"train_loss": -28.106689453125, "global_step": 562112, "epoch": 6772} {"train_loss": -27.791868209838867, "global_step": 562113, "epoch": 6772} {"train_loss": -28.035425186157227, "global_step": 562114, "epoch": 6772} {"train_loss": -27.9249210357666, "global_step": 562115, "epoch": 6772} {"train_loss": -28.01031494140625, "global_step": 562116, "epoch": 6772} {"train_loss": -28.109766006469727, "global_step": 562117, "epoch": 6772} {"train_loss": -27.870258331298828, "global_step": 562118, "epoch": 6772} {"train_loss": -28.396398544311523, "global_step": 562119, "epoch": 6772} {"train_loss": -27.592548370361328, "global_step": 562120, "epoch": 6772} {"train_loss": -27.618061065673828, "global_step": 562121, "epoch": 6772} {"train_loss": -28.03278923034668, "global_step": 562122, "epoch": 6772} {"train_loss": -27.94508171081543, "global_step": 562123, "epoch": 6772} {"train_loss": -28.00439453125, "global_step": 562124, "epoch": 6772} {"train_loss": -27.798795700073242, "global_step": 562125, "epoch": 6772} {"train_loss": -27.93971061706543, "global_step": 562126, "epoch": 6772} {"train_loss": -28.13653564453125, "global_step": 562127, "epoch": 6772} {"train_loss": -28.01936149597168, "global_step": 562128, "epoch": 6772} {"train_loss": -27.6667423248291, "global_step": 562129, "epoch": 6772} {"train_loss": -27.821455001831055, "global_step": 562130, "epoch": 6772} {"train_loss": -28.19087028503418, "global_step": 562131, "epoch": 6772} {"train_loss": -27.523008346557617, "global_step": 562132, "epoch": 6772} {"train_loss": -27.391427993774414, "global_step": 562133, "epoch": 6772} {"train_loss": -27.95263671875, "global_step": 562134, "epoch": 6772} {"train_loss": -27.434341430664062, "global_step": 562135, "epoch": 6772} {"train_loss": -27.326879501342773, "global_step": 562136, "epoch": 6772} {"train_loss": -27.759084701538086, "global_step": 562137, "epoch": 6772} {"train_loss": -26.67144775390625, "global_step": 562138, "epoch": 6772} {"train_loss": -27.130435943603516, "global_step": 562139, "epoch": 6772} {"train_loss": -27.662824630737305, "global_step": 562140, "epoch": 6772} {"train_loss": -27.41282081604004, "global_step": 562141, "epoch": 6772} {"train_loss": -27.327178955078125, "global_step": 562142, "epoch": 6772} {"train_loss": -27.638525009155273, "global_step": 562143, "epoch": 6772} {"train_loss": -27.224897384643555, "global_step": 562144, "epoch": 6772} {"train_loss": -27.337039947509766, "global_step": 562145, "epoch": 6772} {"train_loss": -27.24696159362793, "global_step": 562146, "epoch": 6772} {"train_loss": -27.177352905273438, "global_step": 562147, "epoch": 6772} {"train_loss": -27.543241500854492, "global_step": 562148, "epoch": 6772} {"train_loss": -27.332990646362305, "global_step": 562149, "epoch": 6772} {"train_loss": -27.65325355529785, "global_step": 562150, "epoch": 6772} {"train_loss": -27.53131103515625, "global_step": 562151, "epoch": 6772} {"train_loss": -27.405054092407227, "global_step": 562152, "epoch": 6772} {"train_loss": -27.4570255279541, "global_step": 562153, "epoch": 6772} {"train_loss": -27.547712326049805, "global_step": 562154, "epoch": 6772} {"train_loss": -27.55560302734375, "global_step": 562155, "epoch": 6772} {"train_loss": -27.74555015563965, "global_step": 562156, "epoch": 6772} {"train_loss": -27.36346435546875, "global_step": 562157, "epoch": 6772} {"train_loss": -27.609148760876025, "global_step": 562158, "epoch": 6772, "val_loss": 6336028.0} {"train_loss": -27.34003257751465, "global_step": 562159, "epoch": 6773} {"train_loss": -27.484054565429688, "global_step": 562160, "epoch": 6773} {"train_loss": -27.40708351135254, "global_step": 562161, "epoch": 6773} {"train_loss": -27.7928409576416, "global_step": 562162, "epoch": 6773} {"train_loss": -27.52692222595215, "global_step": 562163, "epoch": 6773} {"train_loss": -27.613325119018555, "global_step": 562164, "epoch": 6773} {"train_loss": -27.629364013671875, "global_step": 562165, "epoch": 6773} {"train_loss": -27.38168716430664, "global_step": 562166, "epoch": 6773} {"train_loss": -27.426931381225586, "global_step": 562167, "epoch": 6773} {"train_loss": -27.25250244140625, "global_step": 562168, "epoch": 6773} {"train_loss": -27.74677085876465, "global_step": 562169, "epoch": 6773} {"train_loss": -27.6740779876709, "global_step": 562170, "epoch": 6773} {"train_loss": -27.685277938842773, "global_step": 562171, "epoch": 6773} {"train_loss": -27.867237091064453, "global_step": 562172, "epoch": 6773} {"train_loss": -27.415851593017578, "global_step": 562173, "epoch": 6773} {"train_loss": -27.857370376586914, "global_step": 562174, "epoch": 6773} {"train_loss": -27.762048721313477, "global_step": 562175, "epoch": 6773} {"train_loss": -27.749921798706055, "global_step": 562176, "epoch": 6773} {"train_loss": -27.823776245117188, "global_step": 562177, "epoch": 6773} {"train_loss": -27.842493057250977, "global_step": 562178, "epoch": 6773} {"train_loss": -27.89361000061035, "global_step": 562179, "epoch": 6773} {"train_loss": -27.934484481811523, "global_step": 562180, "epoch": 6773} {"train_loss": -27.824628829956055, "global_step": 562181, "epoch": 6773} {"train_loss": -27.90754508972168, "global_step": 562182, "epoch": 6773} {"train_loss": -27.407276153564453, "global_step": 562183, "epoch": 6773} {"train_loss": -27.759845733642578, "global_step": 562184, "epoch": 6773} {"train_loss": -27.520212173461914, "global_step": 562185, "epoch": 6773} {"train_loss": -27.3110408782959, "global_step": 562186, "epoch": 6773} {"train_loss": -27.37310218811035, "global_step": 562187, "epoch": 6773} {"train_loss": -27.663318634033203, "global_step": 562188, "epoch": 6773} {"train_loss": -27.644657135009766, "global_step": 562189, "epoch": 6773} {"train_loss": -27.813079833984375, "global_step": 562190, "epoch": 6773} {"train_loss": -28.239154815673828, "global_step": 562191, "epoch": 6773} {"train_loss": -27.70159912109375, "global_step": 562192, "epoch": 6773} {"train_loss": -27.673065185546875, "global_step": 562193, "epoch": 6773} {"train_loss": -27.533300399780273, "global_step": 562194, "epoch": 6773} {"train_loss": -27.539356231689453, "global_step": 562195, "epoch": 6773} {"train_loss": -27.89666175842285, "global_step": 562196, "epoch": 6773} {"train_loss": -27.777814865112305, "global_step": 562197, "epoch": 6773} {"train_loss": -27.6314697265625, "global_step": 562198, "epoch": 6773} {"train_loss": -28.195173263549805, "global_step": 562199, "epoch": 6773} {"train_loss": -28.04374122619629, "global_step": 562200, "epoch": 6773} {"train_loss": -27.942834854125977, "global_step": 562201, "epoch": 6773} {"train_loss": -27.997770309448242, "global_step": 562202, "epoch": 6773} {"train_loss": -28.156259536743164, "global_step": 562203, "epoch": 6773} {"train_loss": -28.141172409057617, "global_step": 562204, "epoch": 6773} {"train_loss": -27.5053653717041, "global_step": 562205, "epoch": 6773} {"train_loss": -28.16477394104004, "global_step": 562206, "epoch": 6773} {"train_loss": -27.8087158203125, "global_step": 562207, "epoch": 6773} {"train_loss": -27.866750717163086, "global_step": 562208, "epoch": 6773} {"train_loss": -27.951034545898438, "global_step": 562209, "epoch": 6773} {"train_loss": -27.61541175842285, "global_step": 562210, "epoch": 6773} {"train_loss": -28.119840621948242, "global_step": 562211, "epoch": 6773} {"train_loss": -27.451589584350586, "global_step": 562212, "epoch": 6773} {"train_loss": -28.1121883392334, "global_step": 562213, "epoch": 6773} {"train_loss": -28.077590942382812, "global_step": 562214, "epoch": 6773} {"train_loss": -27.85394859313965, "global_step": 562215, "epoch": 6773} {"train_loss": -28.0601749420166, "global_step": 562216, "epoch": 6773} {"train_loss": -28.187414169311523, "global_step": 562217, "epoch": 6773} {"train_loss": -27.795333862304688, "global_step": 562218, "epoch": 6773} {"train_loss": -27.9476375579834, "global_step": 562219, "epoch": 6773} {"train_loss": -27.845996856689453, "global_step": 562220, "epoch": 6773} {"train_loss": -27.676855087280273, "global_step": 562221, "epoch": 6773} {"train_loss": -27.883798599243164, "global_step": 562222, "epoch": 6773} {"train_loss": -28.1855525970459, "global_step": 562223, "epoch": 6773} {"train_loss": -27.762189865112305, "global_step": 562224, "epoch": 6773} {"train_loss": -27.969791412353516, "global_step": 562225, "epoch": 6773} {"train_loss": -27.557470321655273, "global_step": 562226, "epoch": 6773} {"train_loss": -27.3619441986084, "global_step": 562227, "epoch": 6773} {"train_loss": -27.476276397705078, "global_step": 562228, "epoch": 6773} {"train_loss": -27.33649253845215, "global_step": 562229, "epoch": 6773} {"train_loss": -27.8179874420166, "global_step": 562230, "epoch": 6773} {"train_loss": -28.088958740234375, "global_step": 562231, "epoch": 6773} {"train_loss": -27.746475219726562, "global_step": 562232, "epoch": 6773} {"train_loss": -28.067007064819336, "global_step": 562233, "epoch": 6773} {"train_loss": -27.939605712890625, "global_step": 562234, "epoch": 6773} {"train_loss": -27.528589248657227, "global_step": 562235, "epoch": 6773} {"train_loss": -27.975873947143555, "global_step": 562236, "epoch": 6773} {"train_loss": -28.21630859375, "global_step": 562237, "epoch": 6773} {"train_loss": -27.84189796447754, "global_step": 562238, "epoch": 6773} {"train_loss": -27.959054946899414, "global_step": 562239, "epoch": 6773} {"train_loss": -28.10715675354004, "global_step": 562240, "epoch": 6773} {"train_loss": -27.782557200236493, "global_step": 562241, "epoch": 6773, "val_loss": 6401884.0} {"train_loss": -27.46986198425293, "global_step": 562242, "epoch": 6774} {"train_loss": -27.803770065307617, "global_step": 562243, "epoch": 6774} {"train_loss": -27.07538414001465, "global_step": 562244, "epoch": 6774} {"train_loss": -27.624557495117188, "global_step": 562245, "epoch": 6774} {"train_loss": -27.897104263305664, "global_step": 562246, "epoch": 6774} {"train_loss": -27.21148681640625, "global_step": 562247, "epoch": 6774} {"train_loss": -27.034887313842773, "global_step": 562248, "epoch": 6774} {"train_loss": -27.010000228881836, "global_step": 562249, "epoch": 6774} {"train_loss": -27.68061637878418, "global_step": 562250, "epoch": 6774} {"train_loss": -27.258695602416992, "global_step": 562251, "epoch": 6774} {"train_loss": -27.717670440673828, "global_step": 562252, "epoch": 6774} {"train_loss": -27.353574752807617, "global_step": 562253, "epoch": 6774} {"train_loss": -27.196802139282227, "global_step": 562254, "epoch": 6774} {"train_loss": -27.16642189025879, "global_step": 562255, "epoch": 6774} {"train_loss": -27.759185791015625, "global_step": 562256, "epoch": 6774} {"train_loss": -27.784509658813477, "global_step": 562257, "epoch": 6774} {"train_loss": -27.557861328125, "global_step": 562258, "epoch": 6774} {"train_loss": -27.792943954467773, "global_step": 562259, "epoch": 6774} {"train_loss": -27.858808517456055, "global_step": 562260, "epoch": 6774} {"train_loss": -27.49191665649414, "global_step": 562261, "epoch": 6774} {"train_loss": -27.981616973876953, "global_step": 562262, "epoch": 6774} {"train_loss": -27.5505313873291, "global_step": 562263, "epoch": 6774} {"train_loss": -27.965988159179688, "global_step": 562264, "epoch": 6774} {"train_loss": -27.984943389892578, "global_step": 562265, "epoch": 6774} {"train_loss": -27.544736862182617, "global_step": 562266, "epoch": 6774} {"train_loss": -27.85100746154785, "global_step": 562267, "epoch": 6774} {"train_loss": -27.884174346923828, "global_step": 562268, "epoch": 6774} {"train_loss": -27.751361846923828, "global_step": 562269, "epoch": 6774} {"train_loss": -27.51362419128418, "global_step": 562270, "epoch": 6774} {"train_loss": -27.45623779296875, "global_step": 562271, "epoch": 6774} {"train_loss": -28.056076049804688, "global_step": 562272, "epoch": 6774} {"train_loss": -27.967487335205078, "global_step": 562273, "epoch": 6774} {"train_loss": -28.21759033203125, "global_step": 562274, "epoch": 6774} {"train_loss": -28.03143310546875, "global_step": 562275, "epoch": 6774} {"train_loss": -27.847919464111328, "global_step": 562276, "epoch": 6774} {"train_loss": -27.988794326782227, "global_step": 562277, "epoch": 6774} {"train_loss": -27.94757080078125, "global_step": 562278, "epoch": 6774} {"train_loss": -27.5956974029541, "global_step": 562279, "epoch": 6774} {"train_loss": -28.100263595581055, "global_step": 562280, "epoch": 6774} {"train_loss": -28.042144775390625, "global_step": 562281, "epoch": 6774} {"train_loss": -27.838964462280273, "global_step": 562282, "epoch": 6774} {"train_loss": -27.83696937561035, "global_step": 562283, "epoch": 6774} {"train_loss": -28.107946395874023, "global_step": 562284, "epoch": 6774} {"train_loss": -28.015607833862305, "global_step": 562285, "epoch": 6774} {"train_loss": -28.27802848815918, "global_step": 562286, "epoch": 6774} {"train_loss": -27.98956298828125, "global_step": 562287, "epoch": 6774} {"train_loss": -28.17250633239746, "global_step": 562288, "epoch": 6774} {"train_loss": -28.05002212524414, "global_step": 562289, "epoch": 6774} {"train_loss": -27.773046493530273, "global_step": 562290, "epoch": 6774} {"train_loss": -28.11767578125, "global_step": 562291, "epoch": 6774} {"train_loss": -27.9555606842041, "global_step": 562292, "epoch": 6774} {"train_loss": -27.584619522094727, "global_step": 562293, "epoch": 6774} {"train_loss": -27.547277450561523, "global_step": 562294, "epoch": 6774} {"train_loss": -27.786741256713867, "global_step": 562295, "epoch": 6774} {"train_loss": -27.936548233032227, "global_step": 562296, "epoch": 6774} {"train_loss": -27.972803115844727, "global_step": 562297, "epoch": 6774} {"train_loss": -27.96687889099121, "global_step": 562298, "epoch": 6774} {"train_loss": -27.675525665283203, "global_step": 562299, "epoch": 6774} {"train_loss": -27.738544464111328, "global_step": 562300, "epoch": 6774} {"train_loss": -27.6346492767334, "global_step": 562301, "epoch": 6774} {"train_loss": -27.767597198486328, "global_step": 562302, "epoch": 6774} {"train_loss": -27.769977569580078, "global_step": 562303, "epoch": 6774} {"train_loss": -27.792694091796875, "global_step": 562304, "epoch": 6774} {"train_loss": -27.910322189331055, "global_step": 562305, "epoch": 6774} {"train_loss": -27.48061180114746, "global_step": 562306, "epoch": 6774} {"train_loss": -28.009191513061523, "global_step": 562307, "epoch": 6774} {"train_loss": -27.564624786376953, "global_step": 562308, "epoch": 6774} {"train_loss": -27.779760360717773, "global_step": 562309, "epoch": 6774} {"train_loss": -27.551410675048828, "global_step": 562310, "epoch": 6774} {"train_loss": -27.88204002380371, "global_step": 562311, "epoch": 6774} {"train_loss": -27.44573974609375, "global_step": 562312, "epoch": 6774} {"train_loss": -27.794830322265625, "global_step": 562313, "epoch": 6774} {"train_loss": -27.267871856689453, "global_step": 562314, "epoch": 6774} {"train_loss": -27.692625045776367, "global_step": 562315, "epoch": 6774} {"train_loss": -27.949087142944336, "global_step": 562316, "epoch": 6774} {"train_loss": -27.4410343170166, "global_step": 562317, "epoch": 6774} {"train_loss": -27.273910522460938, "global_step": 562318, "epoch": 6774} {"train_loss": -28.000890731811523, "global_step": 562319, "epoch": 6774} {"train_loss": -27.846054077148438, "global_step": 562320, "epoch": 6774} {"train_loss": -27.479761123657227, "global_step": 562321, "epoch": 6774} {"train_loss": -27.505239486694336, "global_step": 562322, "epoch": 6774} {"train_loss": -27.771390914916992, "global_step": 562323, "epoch": 6774} {"train_loss": -27.74251836753753, "global_step": 562324, "epoch": 6774, "val_loss": 6450659.0} {"train_loss": -26.561935424804688, "global_step": 562325, "epoch": 6775} {"train_loss": -27.158193588256836, "global_step": 562326, "epoch": 6775} {"train_loss": -26.950469970703125, "global_step": 562327, "epoch": 6775} {"train_loss": -27.24382972717285, "global_step": 562328, "epoch": 6775} {"train_loss": -27.319507598876953, "global_step": 562329, "epoch": 6775} {"train_loss": -26.977252960205078, "global_step": 562330, "epoch": 6775} {"train_loss": -27.6934814453125, "global_step": 562331, "epoch": 6775} {"train_loss": -27.1852970123291, "global_step": 562332, "epoch": 6775} {"train_loss": -26.395343780517578, "global_step": 562333, "epoch": 6775} {"train_loss": -27.01434326171875, "global_step": 562334, "epoch": 6775} {"train_loss": -27.19318962097168, "global_step": 562335, "epoch": 6775} {"train_loss": -27.00227165222168, "global_step": 562336, "epoch": 6775} {"train_loss": -27.273542404174805, "global_step": 562337, "epoch": 6775} {"train_loss": -27.29062843322754, "global_step": 562338, "epoch": 6775} {"train_loss": -27.28610610961914, "global_step": 562339, "epoch": 6775} {"train_loss": -27.271581649780273, "global_step": 562340, "epoch": 6775} {"train_loss": -27.34126091003418, "global_step": 562341, "epoch": 6775} {"train_loss": -27.45344352722168, "global_step": 562342, "epoch": 6775} {"train_loss": -27.44607925415039, "global_step": 562343, "epoch": 6775} {"train_loss": -27.24234962463379, "global_step": 562344, "epoch": 6775} {"train_loss": -27.46943473815918, "global_step": 562345, "epoch": 6775} {"train_loss": -27.35310173034668, "global_step": 562346, "epoch": 6775} {"train_loss": -27.397449493408203, "global_step": 562347, "epoch": 6775} {"train_loss": -27.30682373046875, "global_step": 562348, "epoch": 6775} {"train_loss": -27.776819229125977, "global_step": 562349, "epoch": 6775} {"train_loss": -27.324705123901367, "global_step": 562350, "epoch": 6775} {"train_loss": -27.75619888305664, "global_step": 562351, "epoch": 6775} {"train_loss": -27.62421989440918, "global_step": 562352, "epoch": 6775} {"train_loss": -27.52723503112793, "global_step": 562353, "epoch": 6775} {"train_loss": -27.391061782836914, "global_step": 562354, "epoch": 6775} {"train_loss": -27.7399845123291, "global_step": 562355, "epoch": 6775} {"train_loss": -28.077014923095703, "global_step": 562356, "epoch": 6775} {"train_loss": -27.44618034362793, "global_step": 562357, "epoch": 6775} {"train_loss": -27.6575927734375, "global_step": 562358, "epoch": 6775} {"train_loss": -27.58680534362793, "global_step": 562359, "epoch": 6775} {"train_loss": -27.691558837890625, "global_step": 562360, "epoch": 6775} {"train_loss": -28.0186824798584, "global_step": 562361, "epoch": 6775} {"train_loss": -27.906591415405273, "global_step": 562362, "epoch": 6775} {"train_loss": -27.71856689453125, "global_step": 562363, "epoch": 6775} {"train_loss": -27.6104793548584, "global_step": 562364, "epoch": 6775} {"train_loss": -27.6412296295166, "global_step": 562365, "epoch": 6775} {"train_loss": -27.88735008239746, "global_step": 562366, "epoch": 6775} {"train_loss": -28.02557373046875, "global_step": 562367, "epoch": 6775} {"train_loss": -27.932544708251953, "global_step": 562368, "epoch": 6775} {"train_loss": -27.783788681030273, "global_step": 562369, "epoch": 6775} {"train_loss": -27.690656661987305, "global_step": 562370, "epoch": 6775} {"train_loss": -27.644445419311523, "global_step": 562371, "epoch": 6775} {"train_loss": -27.68513298034668, "global_step": 562372, "epoch": 6775} {"train_loss": -27.613794326782227, "global_step": 562373, "epoch": 6775} {"train_loss": -27.9384708404541, "global_step": 562374, "epoch": 6775} {"train_loss": -28.19858741760254, "global_step": 562375, "epoch": 6775} {"train_loss": -28.234643936157227, "global_step": 562376, "epoch": 6775} {"train_loss": -28.3881893157959, "global_step": 562377, "epoch": 6775} {"train_loss": -27.81061363220215, "global_step": 562378, "epoch": 6775} {"train_loss": -27.886011123657227, "global_step": 562379, "epoch": 6775} {"train_loss": -27.864715576171875, "global_step": 562380, "epoch": 6775} {"train_loss": -27.860660552978516, "global_step": 562381, "epoch": 6775} {"train_loss": -28.063526153564453, "global_step": 562382, "epoch": 6775} {"train_loss": -28.2936954498291, "global_step": 562383, "epoch": 6775} {"train_loss": -27.822317123413086, "global_step": 562384, "epoch": 6775} {"train_loss": -28.380630493164062, "global_step": 562385, "epoch": 6775} {"train_loss": -27.92389488220215, "global_step": 562386, "epoch": 6775} {"train_loss": -27.960830688476562, "global_step": 562387, "epoch": 6775} {"train_loss": -27.615507125854492, "global_step": 562388, "epoch": 6775} {"train_loss": -27.76417350769043, "global_step": 562389, "epoch": 6775} {"train_loss": -27.808048248291016, "global_step": 562390, "epoch": 6775} {"train_loss": -27.85687255859375, "global_step": 562391, "epoch": 6775} {"train_loss": -27.93976402282715, "global_step": 562392, "epoch": 6775} {"train_loss": -27.671743392944336, "global_step": 562393, "epoch": 6775} {"train_loss": -27.6871395111084, "global_step": 562394, "epoch": 6775} {"train_loss": -27.457929611206055, "global_step": 562395, "epoch": 6775} {"train_loss": -26.957157135009766, "global_step": 562396, "epoch": 6775} {"train_loss": -27.741979598999023, "global_step": 562397, "epoch": 6775} {"train_loss": -27.713117599487305, "global_step": 562398, "epoch": 6775} {"train_loss": -27.402616500854492, "global_step": 562399, "epoch": 6775} {"train_loss": -27.64106559753418, "global_step": 562400, "epoch": 6775} {"train_loss": -27.281055450439453, "global_step": 562401, "epoch": 6775} {"train_loss": -27.321744918823242, "global_step": 562402, "epoch": 6775} {"train_loss": -27.145139694213867, "global_step": 562403, "epoch": 6775} {"train_loss": -27.849811553955078, "global_step": 562404, "epoch": 6775} {"train_loss": -27.508771896362305, "global_step": 562405, "epoch": 6775} {"train_loss": -27.715606689453125, "global_step": 562406, "epoch": 6775} {"train_loss": -27.58661732041692, "global_step": 562407, "epoch": 6775, "val_loss": 6444562.0} {"train_loss": -27.4660587310791, "global_step": 562408, "epoch": 6776} {"train_loss": -26.190689086914062, "global_step": 562409, "epoch": 6776} {"train_loss": -27.0897274017334, "global_step": 562410, "epoch": 6776} {"train_loss": -26.721967697143555, "global_step": 562411, "epoch": 6776} {"train_loss": -27.160205841064453, "global_step": 562412, "epoch": 6776} {"train_loss": -27.071380615234375, "global_step": 562413, "epoch": 6776} {"train_loss": -27.301315307617188, "global_step": 562414, "epoch": 6776} {"train_loss": -26.957605361938477, "global_step": 562415, "epoch": 6776} {"train_loss": -27.508543014526367, "global_step": 562416, "epoch": 6776} {"train_loss": -27.003559112548828, "global_step": 562417, "epoch": 6776} {"train_loss": -27.288522720336914, "global_step": 562418, "epoch": 6776} {"train_loss": -27.558156967163086, "global_step": 562419, "epoch": 6776} {"train_loss": -27.54306983947754, "global_step": 562420, "epoch": 6776} {"train_loss": -27.317853927612305, "global_step": 562421, "epoch": 6776} {"train_loss": -27.65241813659668, "global_step": 562422, "epoch": 6776} {"train_loss": -27.2060604095459, "global_step": 562423, "epoch": 6776} {"train_loss": -27.080509185791016, "global_step": 562424, "epoch": 6776} {"train_loss": -27.394439697265625, "global_step": 562425, "epoch": 6776} {"train_loss": -27.45352554321289, "global_step": 562426, "epoch": 6776} {"train_loss": -27.4075984954834, "global_step": 562427, "epoch": 6776} {"train_loss": -26.861713409423828, "global_step": 562428, "epoch": 6776} {"train_loss": -27.442991256713867, "global_step": 562429, "epoch": 6776} {"train_loss": -27.544519424438477, "global_step": 562430, "epoch": 6776} {"train_loss": -27.425159454345703, "global_step": 562431, "epoch": 6776} {"train_loss": -27.558923721313477, "global_step": 562432, "epoch": 6776} {"train_loss": -27.355615615844727, "global_step": 562433, "epoch": 6776} {"train_loss": -27.963544845581055, "global_step": 562434, "epoch": 6776} {"train_loss": -27.524646759033203, "global_step": 562435, "epoch": 6776} {"train_loss": -27.49652099609375, "global_step": 562436, "epoch": 6776} {"train_loss": -27.637989044189453, "global_step": 562437, "epoch": 6776} {"train_loss": -27.384946823120117, "global_step": 562438, "epoch": 6776} {"train_loss": -27.2961368560791, "global_step": 562439, "epoch": 6776} {"train_loss": -27.990583419799805, "global_step": 562440, "epoch": 6776} {"train_loss": -27.45233726501465, "global_step": 562441, "epoch": 6776} {"train_loss": -27.71148109436035, "global_step": 562442, "epoch": 6776} {"train_loss": -27.820981979370117, "global_step": 562443, "epoch": 6776} {"train_loss": -28.1500186920166, "global_step": 562444, "epoch": 6776} {"train_loss": -27.817609786987305, "global_step": 562445, "epoch": 6776} {"train_loss": -27.45639991760254, "global_step": 562446, "epoch": 6776} {"train_loss": -27.97102928161621, "global_step": 562447, "epoch": 6776} {"train_loss": -27.70635414123535, "global_step": 562448, "epoch": 6776} {"train_loss": -27.446903228759766, "global_step": 562449, "epoch": 6776} {"train_loss": -27.3313045501709, "global_step": 562450, "epoch": 6776} {"train_loss": -27.731367111206055, "global_step": 562451, "epoch": 6776} {"train_loss": -27.440216064453125, "global_step": 562452, "epoch": 6776} {"train_loss": -28.141698837280273, "global_step": 562453, "epoch": 6776} {"train_loss": -27.84441566467285, "global_step": 562454, "epoch": 6776} {"train_loss": -28.18218421936035, "global_step": 562455, "epoch": 6776} {"train_loss": -28.10042381286621, "global_step": 562456, "epoch": 6776} {"train_loss": -27.796701431274414, "global_step": 562457, "epoch": 6776} {"train_loss": -28.026525497436523, "global_step": 562458, "epoch": 6776} {"train_loss": -28.10939598083496, "global_step": 562459, "epoch": 6776} {"train_loss": -27.68352699279785, "global_step": 562460, "epoch": 6776} {"train_loss": -27.813032150268555, "global_step": 562461, "epoch": 6776} {"train_loss": -27.7056827545166, "global_step": 562462, "epoch": 6776} {"train_loss": -27.88197135925293, "global_step": 562463, "epoch": 6776} {"train_loss": -27.600006103515625, "global_step": 562464, "epoch": 6776} {"train_loss": -28.060302734375, "global_step": 562465, "epoch": 6776} {"train_loss": -27.67291259765625, "global_step": 562466, "epoch": 6776} {"train_loss": -27.90604019165039, "global_step": 562467, "epoch": 6776} {"train_loss": -27.905298233032227, "global_step": 562468, "epoch": 6776} {"train_loss": -28.13154411315918, "global_step": 562469, "epoch": 6776} {"train_loss": -28.331867218017578, "global_step": 562470, "epoch": 6776} {"train_loss": -27.610151290893555, "global_step": 562471, "epoch": 6776} {"train_loss": -27.9412899017334, "global_step": 562472, "epoch": 6776} {"train_loss": -27.964160919189453, "global_step": 562473, "epoch": 6776} {"train_loss": -28.1390380859375, "global_step": 562474, "epoch": 6776} {"train_loss": -27.750030517578125, "global_step": 562475, "epoch": 6776} {"train_loss": -27.764942169189453, "global_step": 562476, "epoch": 6776} {"train_loss": -27.6868953704834, "global_step": 562477, "epoch": 6776} {"train_loss": -27.97294044494629, "global_step": 562478, "epoch": 6776} {"train_loss": -27.57669448852539, "global_step": 562479, "epoch": 6776} {"train_loss": -27.962894439697266, "global_step": 562480, "epoch": 6776} {"train_loss": -27.97562026977539, "global_step": 562481, "epoch": 6776} {"train_loss": -27.892053604125977, "global_step": 562482, "epoch": 6776} {"train_loss": -27.891172409057617, "global_step": 562483, "epoch": 6776} {"train_loss": -27.813222885131836, "global_step": 562484, "epoch": 6776} {"train_loss": -27.56764030456543, "global_step": 562485, "epoch": 6776} {"train_loss": -28.207258224487305, "global_step": 562486, "epoch": 6776} {"train_loss": -27.671350479125977, "global_step": 562487, "epoch": 6776} {"train_loss": -27.838516235351562, "global_step": 562488, "epoch": 6776} {"train_loss": -27.689380645751953, "global_step": 562489, "epoch": 6776} {"train_loss": -27.63477325439453, "global_step": 562490, "epoch": 6776, "val_loss": 6441098.0} {"train_loss": -27.540700912475586, "global_step": 562491, "epoch": 6777} {"train_loss": -27.183460235595703, "global_step": 562492, "epoch": 6777} {"train_loss": -27.222278594970703, "global_step": 562493, "epoch": 6777} {"train_loss": -27.199445724487305, "global_step": 562494, "epoch": 6777} {"train_loss": -27.60725212097168, "global_step": 562495, "epoch": 6777} {"train_loss": -27.556854248046875, "global_step": 562496, "epoch": 6777} {"train_loss": -27.783615112304688, "global_step": 562497, "epoch": 6777} {"train_loss": -27.358753204345703, "global_step": 562498, "epoch": 6777} {"train_loss": -27.458948135375977, "global_step": 562499, "epoch": 6777} {"train_loss": -27.72977638244629, "global_step": 562500, "epoch": 6777} {"train_loss": -27.452600479125977, "global_step": 562501, "epoch": 6777} {"train_loss": -27.509552001953125, "global_step": 562502, "epoch": 6777} {"train_loss": -27.47809410095215, "global_step": 562503, "epoch": 6777} {"train_loss": -27.588361740112305, "global_step": 562504, "epoch": 6777} {"train_loss": -28.074995040893555, "global_step": 562505, "epoch": 6777} {"train_loss": -27.55946159362793, "global_step": 562506, "epoch": 6777} {"train_loss": -27.600616455078125, "global_step": 562507, "epoch": 6777} {"train_loss": -27.436634063720703, "global_step": 562508, "epoch": 6777} {"train_loss": -27.869647979736328, "global_step": 562509, "epoch": 6777} {"train_loss": -27.691038131713867, "global_step": 562510, "epoch": 6777} {"train_loss": -27.849105834960938, "global_step": 562511, "epoch": 6777} {"train_loss": -27.9383487701416, "global_step": 562512, "epoch": 6777} {"train_loss": -27.846942901611328, "global_step": 562513, "epoch": 6777} {"train_loss": -27.761396408081055, "global_step": 562514, "epoch": 6777} {"train_loss": -27.91371726989746, "global_step": 562515, "epoch": 6777} {"train_loss": -27.764026641845703, "global_step": 562516, "epoch": 6777} {"train_loss": -27.581689834594727, "global_step": 562517, "epoch": 6777} {"train_loss": -27.767669677734375, "global_step": 562518, "epoch": 6777} {"train_loss": -28.009754180908203, "global_step": 562519, "epoch": 6777} {"train_loss": -27.706003189086914, "global_step": 562520, "epoch": 6777} {"train_loss": -27.78946304321289, "global_step": 562521, "epoch": 6777} {"train_loss": -28.1729793548584, "global_step": 562522, "epoch": 6777} {"train_loss": -27.762683868408203, "global_step": 562523, "epoch": 6777} {"train_loss": -27.630146026611328, "global_step": 562524, "epoch": 6777} {"train_loss": -27.833175659179688, "global_step": 562525, "epoch": 6777} {"train_loss": -28.1660099029541, "global_step": 562526, "epoch": 6777} {"train_loss": -28.32660484313965, "global_step": 562527, "epoch": 6777} {"train_loss": -28.098907470703125, "global_step": 562528, "epoch": 6777} {"train_loss": -27.76263427734375, "global_step": 562529, "epoch": 6777} {"train_loss": -28.005475997924805, "global_step": 562530, "epoch": 6777} {"train_loss": -27.642608642578125, "global_step": 562531, "epoch": 6777} {"train_loss": -28.022748947143555, "global_step": 562532, "epoch": 6777} {"train_loss": -27.921457290649414, "global_step": 562533, "epoch": 6777} {"train_loss": -27.97823143005371, "global_step": 562534, "epoch": 6777} {"train_loss": -27.83723258972168, "global_step": 562535, "epoch": 6777} {"train_loss": -27.949481964111328, "global_step": 562536, "epoch": 6777} {"train_loss": -27.980222702026367, "global_step": 562537, "epoch": 6777} {"train_loss": -27.621984481811523, "global_step": 562538, "epoch": 6777} {"train_loss": -27.913415908813477, "global_step": 562539, "epoch": 6777} {"train_loss": -28.074766159057617, "global_step": 562540, "epoch": 6777} {"train_loss": -27.60248374938965, "global_step": 562541, "epoch": 6777} {"train_loss": -27.72430419921875, "global_step": 562542, "epoch": 6777} {"train_loss": -27.624622344970703, "global_step": 562543, "epoch": 6777} {"train_loss": -27.278656005859375, "global_step": 562544, "epoch": 6777} {"train_loss": -27.007888793945312, "global_step": 562545, "epoch": 6777} {"train_loss": -26.822021484375, "global_step": 562546, "epoch": 6777} {"train_loss": -27.273456573486328, "global_step": 562547, "epoch": 6777} {"train_loss": -27.736530303955078, "global_step": 562548, "epoch": 6777} {"train_loss": -27.42547607421875, "global_step": 562549, "epoch": 6777} {"train_loss": -27.70643424987793, "global_step": 562550, "epoch": 6777} {"train_loss": -27.375158309936523, "global_step": 562551, "epoch": 6777} {"train_loss": -27.511632919311523, "global_step": 562552, "epoch": 6777} {"train_loss": -27.571882247924805, "global_step": 562553, "epoch": 6777} {"train_loss": -27.097375869750977, "global_step": 562554, "epoch": 6777} {"train_loss": -27.858814239501953, "global_step": 562555, "epoch": 6777} {"train_loss": -27.47121238708496, "global_step": 562556, "epoch": 6777} {"train_loss": -27.19559669494629, "global_step": 562557, "epoch": 6777} {"train_loss": -27.47853660583496, "global_step": 562558, "epoch": 6777} {"train_loss": -27.447269439697266, "global_step": 562559, "epoch": 6777} {"train_loss": -27.214832305908203, "global_step": 562560, "epoch": 6777} {"train_loss": -27.425573348999023, "global_step": 562561, "epoch": 6777} {"train_loss": -27.495441436767578, "global_step": 562562, "epoch": 6777} {"train_loss": -27.5887508392334, "global_step": 562563, "epoch": 6777} {"train_loss": -27.49356460571289, "global_step": 562564, "epoch": 6777} {"train_loss": -27.419111251831055, "global_step": 562565, "epoch": 6777} {"train_loss": -27.840229034423828, "global_step": 562566, "epoch": 6777} {"train_loss": -27.74921989440918, "global_step": 562567, "epoch": 6777} {"train_loss": -27.781713485717773, "global_step": 562568, "epoch": 6777} {"train_loss": -27.637283325195312, "global_step": 562569, "epoch": 6777} {"train_loss": -27.46807289123535, "global_step": 562570, "epoch": 6777} {"train_loss": -27.53602409362793, "global_step": 562571, "epoch": 6777} {"train_loss": -27.72258949279785, "global_step": 562572, "epoch": 6777} {"train_loss": -27.661956327507294, "global_step": 562573, "epoch": 6777, "val_loss": 6437470.0} {"train_loss": -27.5327205657959, "global_step": 562574, "epoch": 6778} {"train_loss": -27.23489761352539, "global_step": 562575, "epoch": 6778} {"train_loss": -27.601110458374023, "global_step": 562576, "epoch": 6778} {"train_loss": -27.697477340698242, "global_step": 562577, "epoch": 6778} {"train_loss": -27.689727783203125, "global_step": 562578, "epoch": 6778} {"train_loss": -27.866926193237305, "global_step": 562579, "epoch": 6778} {"train_loss": -27.45229148864746, "global_step": 562580, "epoch": 6778} {"train_loss": -27.654760360717773, "global_step": 562581, "epoch": 6778} {"train_loss": -27.31568717956543, "global_step": 562582, "epoch": 6778} {"train_loss": -28.01065444946289, "global_step": 562583, "epoch": 6778} {"train_loss": -27.94353675842285, "global_step": 562584, "epoch": 6778} {"train_loss": -27.85861587524414, "global_step": 562585, "epoch": 6778} {"train_loss": -27.787302017211914, "global_step": 562586, "epoch": 6778} {"train_loss": -27.794530868530273, "global_step": 562587, "epoch": 6778} {"train_loss": -27.860855102539062, "global_step": 562588, "epoch": 6778} {"train_loss": -27.8392276763916, "global_step": 562589, "epoch": 6778} {"train_loss": -27.937047958374023, "global_step": 562590, "epoch": 6778} {"train_loss": -28.029983520507812, "global_step": 562591, "epoch": 6778} {"train_loss": -27.650381088256836, "global_step": 562592, "epoch": 6778} {"train_loss": -27.764972686767578, "global_step": 562593, "epoch": 6778} {"train_loss": -27.777637481689453, "global_step": 562594, "epoch": 6778} {"train_loss": -28.197805404663086, "global_step": 562595, "epoch": 6778} {"train_loss": -28.0715274810791, "global_step": 562596, "epoch": 6778} {"train_loss": -27.902698516845703, "global_step": 562597, "epoch": 6778} {"train_loss": -27.649145126342773, "global_step": 562598, "epoch": 6778} {"train_loss": -27.569793701171875, "global_step": 562599, "epoch": 6778} {"train_loss": -28.15288734436035, "global_step": 562600, "epoch": 6778} {"train_loss": -28.16412353515625, "global_step": 562601, "epoch": 6778} {"train_loss": -28.126829147338867, "global_step": 562602, "epoch": 6778} {"train_loss": -28.1430606842041, "global_step": 562603, "epoch": 6778} {"train_loss": -27.67608070373535, "global_step": 562604, "epoch": 6778} {"train_loss": -28.31756591796875, "global_step": 562605, "epoch": 6778} {"train_loss": -27.854455947875977, "global_step": 562606, "epoch": 6778} {"train_loss": -27.70538330078125, "global_step": 562607, "epoch": 6778} {"train_loss": -28.064294815063477, "global_step": 562608, "epoch": 6778} {"train_loss": -27.670841217041016, "global_step": 562609, "epoch": 6778} {"train_loss": -27.81641960144043, "global_step": 562610, "epoch": 6778} {"train_loss": -28.092512130737305, "global_step": 562611, "epoch": 6778} {"train_loss": -27.931476593017578, "global_step": 562612, "epoch": 6778} {"train_loss": -27.98908042907715, "global_step": 562613, "epoch": 6778} {"train_loss": -27.85283851623535, "global_step": 562614, "epoch": 6778} {"train_loss": -27.579259872436523, "global_step": 562615, "epoch": 6778} {"train_loss": -27.941274642944336, "global_step": 562616, "epoch": 6778} {"train_loss": -27.8469295501709, "global_step": 562617, "epoch": 6778} {"train_loss": -27.702280044555664, "global_step": 562618, "epoch": 6778} {"train_loss": -27.716934204101562, "global_step": 562619, "epoch": 6778} {"train_loss": -27.70400047302246, "global_step": 562620, "epoch": 6778} {"train_loss": -27.674890518188477, "global_step": 562621, "epoch": 6778} {"train_loss": -28.066675186157227, "global_step": 562622, "epoch": 6778} {"train_loss": -27.63115882873535, "global_step": 562623, "epoch": 6778} {"train_loss": -27.67453956604004, "global_step": 562624, "epoch": 6778} {"train_loss": -27.88824462890625, "global_step": 562625, "epoch": 6778} {"train_loss": -27.841405868530273, "global_step": 562626, "epoch": 6778} {"train_loss": -27.99521827697754, "global_step": 562627, "epoch": 6778} {"train_loss": -27.63958740234375, "global_step": 562628, "epoch": 6778} {"train_loss": -27.6132755279541, "global_step": 562629, "epoch": 6778} {"train_loss": -27.742334365844727, "global_step": 562630, "epoch": 6778} {"train_loss": -28.066675186157227, "global_step": 562631, "epoch": 6778} {"train_loss": -27.855792999267578, "global_step": 562632, "epoch": 6778} {"train_loss": -27.478748321533203, "global_step": 562633, "epoch": 6778} {"train_loss": -27.0211238861084, "global_step": 562634, "epoch": 6778} {"train_loss": -27.14876365661621, "global_step": 562635, "epoch": 6778} {"train_loss": -28.13530921936035, "global_step": 562636, "epoch": 6778} {"train_loss": -27.285964965820312, "global_step": 562637, "epoch": 6778} {"train_loss": -26.21677017211914, "global_step": 562638, "epoch": 6778} {"train_loss": -27.519750595092773, "global_step": 562639, "epoch": 6778} {"train_loss": -27.528900146484375, "global_step": 562640, "epoch": 6778} {"train_loss": -27.2924861907959, "global_step": 562641, "epoch": 6778} {"train_loss": -27.52933692932129, "global_step": 562642, "epoch": 6778} {"train_loss": -27.657636642456055, "global_step": 562643, "epoch": 6778} {"train_loss": -27.757965087890625, "global_step": 562644, "epoch": 6778} {"train_loss": -27.585275650024414, "global_step": 562645, "epoch": 6778} {"train_loss": -27.492521286010742, "global_step": 562646, "epoch": 6778} {"train_loss": -27.874073028564453, "global_step": 562647, "epoch": 6778} {"train_loss": -27.5878963470459, "global_step": 562648, "epoch": 6778} {"train_loss": -27.38197898864746, "global_step": 562649, "epoch": 6778} {"train_loss": -27.830596923828125, "global_step": 562650, "epoch": 6778} {"train_loss": -27.75311279296875, "global_step": 562651, "epoch": 6778} {"train_loss": -27.44048500061035, "global_step": 562652, "epoch": 6778} {"train_loss": -27.51375389099121, "global_step": 562653, "epoch": 6778} {"train_loss": -27.470067977905273, "global_step": 562654, "epoch": 6778} {"train_loss": -27.827070236206055, "global_step": 562655, "epoch": 6778} {"train_loss": -27.73163942543857, "global_step": 562656, "epoch": 6778, "val_loss": 6463540.0} {"train_loss": -26.950977325439453, "global_step": 562657, "epoch": 6779} {"train_loss": -26.14967155456543, "global_step": 562658, "epoch": 6779} {"train_loss": -26.345325469970703, "global_step": 562659, "epoch": 6779} {"train_loss": -26.340036392211914, "global_step": 562660, "epoch": 6779} {"train_loss": -26.924453735351562, "global_step": 562661, "epoch": 6779} {"train_loss": -26.893285751342773, "global_step": 562662, "epoch": 6779} {"train_loss": -26.988483428955078, "global_step": 562663, "epoch": 6779} {"train_loss": -27.331253051757812, "global_step": 562664, "epoch": 6779} {"train_loss": -26.623876571655273, "global_step": 562665, "epoch": 6779} {"train_loss": -26.627660751342773, "global_step": 562666, "epoch": 6779} {"train_loss": -26.995777130126953, "global_step": 562667, "epoch": 6779} {"train_loss": -27.15264892578125, "global_step": 562668, "epoch": 6779} {"train_loss": -27.203216552734375, "global_step": 562669, "epoch": 6779} {"train_loss": -27.129730224609375, "global_step": 562670, "epoch": 6779} {"train_loss": -27.571645736694336, "global_step": 562671, "epoch": 6779} {"train_loss": -27.237409591674805, "global_step": 562672, "epoch": 6779} {"train_loss": -27.323486328125, "global_step": 562673, "epoch": 6779} {"train_loss": -27.645666122436523, "global_step": 562674, "epoch": 6779} {"train_loss": -27.153533935546875, "global_step": 562675, "epoch": 6779} {"train_loss": -27.08209800720215, "global_step": 562676, "epoch": 6779} {"train_loss": -27.35703468322754, "global_step": 562677, "epoch": 6779} {"train_loss": -27.51997947692871, "global_step": 562678, "epoch": 6779} {"train_loss": -27.59343910217285, "global_step": 562679, "epoch": 6779} {"train_loss": -27.227115631103516, "global_step": 562680, "epoch": 6779} {"train_loss": -27.359272003173828, "global_step": 562681, "epoch": 6779} {"train_loss": -28.10660743713379, "global_step": 562682, "epoch": 6779} {"train_loss": -27.4781494140625, "global_step": 562683, "epoch": 6779} {"train_loss": -27.537572860717773, "global_step": 562684, "epoch": 6779} {"train_loss": -27.836225509643555, "global_step": 562685, "epoch": 6779} {"train_loss": -28.032873153686523, "global_step": 562686, "epoch": 6779} {"train_loss": -27.785831451416016, "global_step": 562687, "epoch": 6779} {"train_loss": -27.88120460510254, "global_step": 562688, "epoch": 6779} {"train_loss": -27.787973403930664, "global_step": 562689, "epoch": 6779} {"train_loss": -28.107818603515625, "global_step": 562690, "epoch": 6779} {"train_loss": -27.9859676361084, "global_step": 562691, "epoch": 6779} {"train_loss": -27.708148956298828, "global_step": 562692, "epoch": 6779} {"train_loss": -28.01584815979004, "global_step": 562693, "epoch": 6779} {"train_loss": -27.829065322875977, "global_step": 562694, "epoch": 6779} {"train_loss": -27.89825439453125, "global_step": 562695, "epoch": 6779} {"train_loss": -27.966815948486328, "global_step": 562696, "epoch": 6779} {"train_loss": -27.8968563079834, "global_step": 562697, "epoch": 6779} {"train_loss": -27.92000389099121, "global_step": 562698, "epoch": 6779} {"train_loss": -28.073278427124023, "global_step": 562699, "epoch": 6779} {"train_loss": -28.036117553710938, "global_step": 562700, "epoch": 6779} {"train_loss": -27.51093101501465, "global_step": 562701, "epoch": 6779} {"train_loss": -28.145532608032227, "global_step": 562702, "epoch": 6779} {"train_loss": -27.5992488861084, "global_step": 562703, "epoch": 6779} {"train_loss": -27.745742797851562, "global_step": 562704, "epoch": 6779} {"train_loss": -27.93659019470215, "global_step": 562705, "epoch": 6779} {"train_loss": -27.8474178314209, "global_step": 562706, "epoch": 6779} {"train_loss": -27.943403244018555, "global_step": 562707, "epoch": 6779} {"train_loss": -28.112966537475586, "global_step": 562708, "epoch": 6779} {"train_loss": -27.874170303344727, "global_step": 562709, "epoch": 6779} {"train_loss": -27.9470272064209, "global_step": 562710, "epoch": 6779} {"train_loss": -28.144067764282227, "global_step": 562711, "epoch": 6779} {"train_loss": -27.990507125854492, "global_step": 562712, "epoch": 6779} {"train_loss": -28.28367042541504, "global_step": 562713, "epoch": 6779} {"train_loss": -27.877307891845703, "global_step": 562714, "epoch": 6779} {"train_loss": -27.86285972595215, "global_step": 562715, "epoch": 6779} {"train_loss": -27.82451820373535, "global_step": 562716, "epoch": 6779} {"train_loss": -27.73529052734375, "global_step": 562717, "epoch": 6779} {"train_loss": -28.358535766601562, "global_step": 562718, "epoch": 6779} {"train_loss": -27.62188148498535, "global_step": 562719, "epoch": 6779} {"train_loss": -27.57242202758789, "global_step": 562720, "epoch": 6779} {"train_loss": -27.378591537475586, "global_step": 562721, "epoch": 6779} {"train_loss": -27.134033203125, "global_step": 562722, "epoch": 6779} {"train_loss": -27.618011474609375, "global_step": 562723, "epoch": 6779} {"train_loss": -27.584613800048828, "global_step": 562724, "epoch": 6779} {"train_loss": -27.354938507080078, "global_step": 562725, "epoch": 6779} {"train_loss": -26.216955184936523, "global_step": 562726, "epoch": 6779} {"train_loss": -25.921064376831055, "global_step": 562727, "epoch": 6779} {"train_loss": -27.130041122436523, "global_step": 562728, "epoch": 6779} {"train_loss": -27.414182662963867, "global_step": 562729, "epoch": 6779} {"train_loss": -27.038461685180664, "global_step": 562730, "epoch": 6779} {"train_loss": -27.380264282226562, "global_step": 562731, "epoch": 6779} {"train_loss": -27.2905216217041, "global_step": 562732, "epoch": 6779} {"train_loss": -27.082372665405273, "global_step": 562733, "epoch": 6779} {"train_loss": -27.10422134399414, "global_step": 562734, "epoch": 6779} {"train_loss": -27.37339210510254, "global_step": 562735, "epoch": 6779} {"train_loss": -27.559890747070312, "global_step": 562736, "epoch": 6779} {"train_loss": -27.506994247436523, "global_step": 562737, "epoch": 6779} {"train_loss": -27.465070724487305, "global_step": 562738, "epoch": 6779} {"train_loss": -27.504866381725634, "global_step": 562739, "epoch": 6779, "val_loss": 6397400.0} {"train_loss": -26.257186889648438, "global_step": 562740, "epoch": 6780} {"train_loss": -26.97075843811035, "global_step": 562741, "epoch": 6780} {"train_loss": -26.728412628173828, "global_step": 562742, "epoch": 6780} {"train_loss": -26.7094783782959, "global_step": 562743, "epoch": 6780} {"train_loss": -26.447162628173828, "global_step": 562744, "epoch": 6780} {"train_loss": -27.344623565673828, "global_step": 562745, "epoch": 6780} {"train_loss": -27.03553581237793, "global_step": 562746, "epoch": 6780} {"train_loss": -27.017019271850586, "global_step": 562747, "epoch": 6780} {"train_loss": -27.214811325073242, "global_step": 562748, "epoch": 6780} {"train_loss": -26.950515747070312, "global_step": 562749, "epoch": 6780} {"train_loss": -27.097997665405273, "global_step": 562750, "epoch": 6780} {"train_loss": -27.374652862548828, "global_step": 562751, "epoch": 6780} {"train_loss": -27.477344512939453, "global_step": 562752, "epoch": 6780} {"train_loss": -26.648359298706055, "global_step": 562753, "epoch": 6780} {"train_loss": -27.424285888671875, "global_step": 562754, "epoch": 6780} {"train_loss": -27.773380279541016, "global_step": 562755, "epoch": 6780} {"train_loss": -27.314273834228516, "global_step": 562756, "epoch": 6780} {"train_loss": -26.90693473815918, "global_step": 562757, "epoch": 6780} {"train_loss": -27.557891845703125, "global_step": 562758, "epoch": 6780} {"train_loss": -27.492023468017578, "global_step": 562759, "epoch": 6780} {"train_loss": -27.366809844970703, "global_step": 562760, "epoch": 6780} {"train_loss": -27.61606788635254, "global_step": 562761, "epoch": 6780} {"train_loss": -27.478036880493164, "global_step": 562762, "epoch": 6780} {"train_loss": -27.84529685974121, "global_step": 562763, "epoch": 6780} {"train_loss": -27.543930053710938, "global_step": 562764, "epoch": 6780} {"train_loss": -27.60235023498535, "global_step": 562765, "epoch": 6780} {"train_loss": -27.57245445251465, "global_step": 562766, "epoch": 6780} {"train_loss": -27.496740341186523, "global_step": 562767, "epoch": 6780} {"train_loss": -27.930341720581055, "global_step": 562768, "epoch": 6780} {"train_loss": -27.3206787109375, "global_step": 562769, "epoch": 6780} {"train_loss": -27.86676597595215, "global_step": 562770, "epoch": 6780} {"train_loss": -27.79541015625, "global_step": 562771, "epoch": 6780} {"train_loss": -27.609106063842773, "global_step": 562772, "epoch": 6780} {"train_loss": -27.90388298034668, "global_step": 562773, "epoch": 6780} {"train_loss": -27.926984786987305, "global_step": 562774, "epoch": 6780} {"train_loss": -27.77435302734375, "global_step": 562775, "epoch": 6780} {"train_loss": -27.977197647094727, "global_step": 562776, "epoch": 6780} {"train_loss": -27.77886390686035, "global_step": 562777, "epoch": 6780} {"train_loss": -28.15015983581543, "global_step": 562778, "epoch": 6780} {"train_loss": -27.76163673400879, "global_step": 562779, "epoch": 6780} {"train_loss": -27.860166549682617, "global_step": 562780, "epoch": 6780} {"train_loss": -27.591999053955078, "global_step": 562781, "epoch": 6780} {"train_loss": -27.965932846069336, "global_step": 562782, "epoch": 6780} {"train_loss": -27.988605499267578, "global_step": 562783, "epoch": 6780} {"train_loss": -28.165231704711914, "global_step": 562784, "epoch": 6780} {"train_loss": -27.96079444885254, "global_step": 562785, "epoch": 6780} {"train_loss": -27.976282119750977, "global_step": 562786, "epoch": 6780} {"train_loss": -28.004058837890625, "global_step": 562787, "epoch": 6780} {"train_loss": -28.434118270874023, "global_step": 562788, "epoch": 6780} {"train_loss": -27.874771118164062, "global_step": 562789, "epoch": 6780} {"train_loss": -27.955678939819336, "global_step": 562790, "epoch": 6780} {"train_loss": -28.015655517578125, "global_step": 562791, "epoch": 6780} {"train_loss": -27.752965927124023, "global_step": 562792, "epoch": 6780} {"train_loss": -27.811532974243164, "global_step": 562793, "epoch": 6780} {"train_loss": -28.022613525390625, "global_step": 562794, "epoch": 6780} {"train_loss": -27.8781795501709, "global_step": 562795, "epoch": 6780} {"train_loss": -27.75886344909668, "global_step": 562796, "epoch": 6780} {"train_loss": -27.089658737182617, "global_step": 562797, "epoch": 6780} {"train_loss": -27.25800895690918, "global_step": 562798, "epoch": 6780} {"train_loss": -26.498929977416992, "global_step": 562799, "epoch": 6780} {"train_loss": -26.840408325195312, "global_step": 562800, "epoch": 6780} {"train_loss": -27.232519149780273, "global_step": 562801, "epoch": 6780} {"train_loss": -27.945993423461914, "global_step": 562802, "epoch": 6780} {"train_loss": -27.712888717651367, "global_step": 562803, "epoch": 6780} {"train_loss": -27.69386863708496, "global_step": 562804, "epoch": 6780} {"train_loss": -27.38214683532715, "global_step": 562805, "epoch": 6780} {"train_loss": -28.035980224609375, "global_step": 562806, "epoch": 6780} {"train_loss": -27.454395294189453, "global_step": 562807, "epoch": 6780} {"train_loss": -27.7799015045166, "global_step": 562808, "epoch": 6780} {"train_loss": -27.768747329711914, "global_step": 562809, "epoch": 6780} {"train_loss": -27.807523727416992, "global_step": 562810, "epoch": 6780} {"train_loss": -27.952301025390625, "global_step": 562811, "epoch": 6780} {"train_loss": -27.90347671508789, "global_step": 562812, "epoch": 6780} {"train_loss": -27.613264083862305, "global_step": 562813, "epoch": 6780} {"train_loss": -28.01857566833496, "global_step": 562814, "epoch": 6780} {"train_loss": -27.968000411987305, "global_step": 562815, "epoch": 6780} {"train_loss": -28.11537742614746, "global_step": 562816, "epoch": 6780} {"train_loss": -27.943023681640625, "global_step": 562817, "epoch": 6780} {"train_loss": -27.906835556030273, "global_step": 562818, "epoch": 6780} {"train_loss": -28.15191650390625, "global_step": 562819, "epoch": 6780} {"train_loss": -28.2031307220459, "global_step": 562820, "epoch": 6780} {"train_loss": -28.062421798706055, "global_step": 562821, "epoch": 6780} {"train_loss": -27.58974024761154, "global_step": 562822, "epoch": 6780, "val_loss": 6325198.0} {"train_loss": -27.34942054748535, "global_step": 562823, "epoch": 6781} {"train_loss": -27.071533203125, "global_step": 562824, "epoch": 6781} {"train_loss": -27.463459014892578, "global_step": 562825, "epoch": 6781} {"train_loss": -27.519994735717773, "global_step": 562826, "epoch": 6781} {"train_loss": -26.904739379882812, "global_step": 562827, "epoch": 6781} {"train_loss": -27.08928871154785, "global_step": 562828, "epoch": 6781} {"train_loss": -27.754501342773438, "global_step": 562829, "epoch": 6781} {"train_loss": -27.079431533813477, "global_step": 562830, "epoch": 6781} {"train_loss": -27.096832275390625, "global_step": 562831, "epoch": 6781} {"train_loss": -27.3492488861084, "global_step": 562832, "epoch": 6781} {"train_loss": -27.090717315673828, "global_step": 562833, "epoch": 6781} {"train_loss": -27.496686935424805, "global_step": 562834, "epoch": 6781} {"train_loss": -27.12714958190918, "global_step": 562835, "epoch": 6781} {"train_loss": -27.07268714904785, "global_step": 562836, "epoch": 6781} {"train_loss": -27.494781494140625, "global_step": 562837, "epoch": 6781} {"train_loss": -27.310657501220703, "global_step": 562838, "epoch": 6781} {"train_loss": -27.380109786987305, "global_step": 562839, "epoch": 6781} {"train_loss": -27.39308738708496, "global_step": 562840, "epoch": 6781} {"train_loss": -27.51081657409668, "global_step": 562841, "epoch": 6781} {"train_loss": -27.40335464477539, "global_step": 562842, "epoch": 6781} {"train_loss": -27.847461700439453, "global_step": 562843, "epoch": 6781} {"train_loss": -27.613683700561523, "global_step": 562844, "epoch": 6781} {"train_loss": -27.603473663330078, "global_step": 562845, "epoch": 6781} {"train_loss": -27.717222213745117, "global_step": 562846, "epoch": 6781} {"train_loss": -27.330371856689453, "global_step": 562847, "epoch": 6781} {"train_loss": -27.695783615112305, "global_step": 562848, "epoch": 6781} {"train_loss": -27.50115394592285, "global_step": 562849, "epoch": 6781} {"train_loss": -27.3699951171875, "global_step": 562850, "epoch": 6781} {"train_loss": -27.545434951782227, "global_step": 562851, "epoch": 6781} {"train_loss": -27.720251083374023, "global_step": 562852, "epoch": 6781} {"train_loss": -27.582212448120117, "global_step": 562853, "epoch": 6781} {"train_loss": -27.872882843017578, "global_step": 562854, "epoch": 6781} {"train_loss": -27.88241958618164, "global_step": 562855, "epoch": 6781} {"train_loss": -28.020618438720703, "global_step": 562856, "epoch": 6781} {"train_loss": -27.725446701049805, "global_step": 562857, "epoch": 6781} {"train_loss": -27.683048248291016, "global_step": 562858, "epoch": 6781} {"train_loss": -28.34254264831543, "global_step": 562859, "epoch": 6781} {"train_loss": -28.007421493530273, "global_step": 562860, "epoch": 6781} {"train_loss": -27.818334579467773, "global_step": 562861, "epoch": 6781} {"train_loss": -27.799407958984375, "global_step": 562862, "epoch": 6781} {"train_loss": -27.982725143432617, "global_step": 562863, "epoch": 6781} {"train_loss": -27.99395179748535, "global_step": 562864, "epoch": 6781} {"train_loss": -28.532012939453125, "global_step": 562865, "epoch": 6781} {"train_loss": -27.92329216003418, "global_step": 562866, "epoch": 6781} {"train_loss": -27.916540145874023, "global_step": 562867, "epoch": 6781} {"train_loss": -28.13006591796875, "global_step": 562868, "epoch": 6781} {"train_loss": -27.89678382873535, "global_step": 562869, "epoch": 6781} {"train_loss": -28.029767990112305, "global_step": 562870, "epoch": 6781} {"train_loss": -28.383955001831055, "global_step": 562871, "epoch": 6781} {"train_loss": -28.259662628173828, "global_step": 562872, "epoch": 6781} {"train_loss": -27.875158309936523, "global_step": 562873, "epoch": 6781} {"train_loss": -27.557126998901367, "global_step": 562874, "epoch": 6781} {"train_loss": -27.820959091186523, "global_step": 562875, "epoch": 6781} {"train_loss": -27.504348754882812, "global_step": 562876, "epoch": 6781} {"train_loss": -27.75723648071289, "global_step": 562877, "epoch": 6781} {"train_loss": -27.544214248657227, "global_step": 562878, "epoch": 6781} {"train_loss": -27.463306427001953, "global_step": 562879, "epoch": 6781} {"train_loss": -27.5888614654541, "global_step": 562880, "epoch": 6781} {"train_loss": -27.391111373901367, "global_step": 562881, "epoch": 6781} {"train_loss": -28.16986656188965, "global_step": 562882, "epoch": 6781} {"train_loss": -27.62921142578125, "global_step": 562883, "epoch": 6781} {"train_loss": -27.004011154174805, "global_step": 562884, "epoch": 6781} {"train_loss": -26.24591064453125, "global_step": 562885, "epoch": 6781} {"train_loss": -26.64689064025879, "global_step": 562886, "epoch": 6781} {"train_loss": -27.69927406311035, "global_step": 562887, "epoch": 6781} {"train_loss": -27.584136962890625, "global_step": 562888, "epoch": 6781} {"train_loss": -27.674306869506836, "global_step": 562889, "epoch": 6781} {"train_loss": -27.78533935546875, "global_step": 562890, "epoch": 6781} {"train_loss": -27.49647331237793, "global_step": 562891, "epoch": 6781} {"train_loss": -27.821826934814453, "global_step": 562892, "epoch": 6781} {"train_loss": -27.662185668945312, "global_step": 562893, "epoch": 6781} {"train_loss": -27.463285446166992, "global_step": 562894, "epoch": 6781} {"train_loss": -27.7243709564209, "global_step": 562895, "epoch": 6781} {"train_loss": -27.802701950073242, "global_step": 562896, "epoch": 6781} {"train_loss": -27.471847534179688, "global_step": 562897, "epoch": 6781} {"train_loss": -27.799543380737305, "global_step": 562898, "epoch": 6781} {"train_loss": -27.690113067626953, "global_step": 562899, "epoch": 6781} {"train_loss": -27.59814453125, "global_step": 562900, "epoch": 6781} {"train_loss": -27.577314376831055, "global_step": 562901, "epoch": 6781} {"train_loss": -27.85112953186035, "global_step": 562902, "epoch": 6781} {"train_loss": -27.87948989868164, "global_step": 562903, "epoch": 6781} {"train_loss": -27.889577865600586, "global_step": 562904, "epoch": 6781} {"train_loss": -27.609072053288838, "global_step": 562905, "epoch": 6781, "val_loss": 6395784.0} {"train_loss": -27.460269927978516, "global_step": 562906, "epoch": 6782} {"train_loss": -26.907459259033203, "global_step": 562907, "epoch": 6782} {"train_loss": -26.655847549438477, "global_step": 562908, "epoch": 6782} {"train_loss": -26.96209716796875, "global_step": 562909, "epoch": 6782} {"train_loss": -27.769779205322266, "global_step": 562910, "epoch": 6782} {"train_loss": -27.764928817749023, "global_step": 562911, "epoch": 6782} {"train_loss": -27.01093101501465, "global_step": 562912, "epoch": 6782} {"train_loss": -27.591583251953125, "global_step": 562913, "epoch": 6782} {"train_loss": -27.878814697265625, "global_step": 562914, "epoch": 6782} {"train_loss": -27.713363647460938, "global_step": 562915, "epoch": 6782} {"train_loss": -28.04876136779785, "global_step": 562916, "epoch": 6782} {"train_loss": -28.022531509399414, "global_step": 562917, "epoch": 6782} {"train_loss": -27.94439125061035, "global_step": 562918, "epoch": 6782} {"train_loss": -27.61671257019043, "global_step": 562919, "epoch": 6782} {"train_loss": -28.084796905517578, "global_step": 562920, "epoch": 6782} {"train_loss": -27.435712814331055, "global_step": 562921, "epoch": 6782} {"train_loss": -27.909643173217773, "global_step": 562922, "epoch": 6782} {"train_loss": -27.879491806030273, "global_step": 562923, "epoch": 6782} {"train_loss": -27.69952964782715, "global_step": 562924, "epoch": 6782} {"train_loss": -27.916833877563477, "global_step": 562925, "epoch": 6782} {"train_loss": -27.423574447631836, "global_step": 562926, "epoch": 6782} {"train_loss": -27.866682052612305, "global_step": 562927, "epoch": 6782} {"train_loss": -27.878223419189453, "global_step": 562928, "epoch": 6782} {"train_loss": -27.851781845092773, "global_step": 562929, "epoch": 6782} {"train_loss": -27.5733642578125, "global_step": 562930, "epoch": 6782} {"train_loss": -28.0328311920166, "global_step": 562931, "epoch": 6782} {"train_loss": -27.863800048828125, "global_step": 562932, "epoch": 6782} {"train_loss": -27.756616592407227, "global_step": 562933, "epoch": 6782} {"train_loss": -27.8560848236084, "global_step": 562934, "epoch": 6782} {"train_loss": -28.163467407226562, "global_step": 562935, "epoch": 6782} {"train_loss": -27.805389404296875, "global_step": 562936, "epoch": 6782} {"train_loss": -27.965646743774414, "global_step": 562937, "epoch": 6782} {"train_loss": -28.166563034057617, "global_step": 562938, "epoch": 6782} {"train_loss": -28.03765296936035, "global_step": 562939, "epoch": 6782} {"train_loss": -28.118457794189453, "global_step": 562940, "epoch": 6782} {"train_loss": -27.671283721923828, "global_step": 562941, "epoch": 6782} {"train_loss": -28.081958770751953, "global_step": 562942, "epoch": 6782} {"train_loss": -28.1895694732666, "global_step": 562943, "epoch": 6782} {"train_loss": -27.71630859375, "global_step": 562944, "epoch": 6782} {"train_loss": -27.999624252319336, "global_step": 562945, "epoch": 6782} {"train_loss": -27.495691299438477, "global_step": 562946, "epoch": 6782} {"train_loss": -27.861047744750977, "global_step": 562947, "epoch": 6782} {"train_loss": -27.4778995513916, "global_step": 562948, "epoch": 6782} {"train_loss": -27.44776725769043, "global_step": 562949, "epoch": 6782} {"train_loss": -27.607770919799805, "global_step": 562950, "epoch": 6782} {"train_loss": -27.925764083862305, "global_step": 562951, "epoch": 6782} {"train_loss": -28.100255966186523, "global_step": 562952, "epoch": 6782} {"train_loss": -28.090940475463867, "global_step": 562953, "epoch": 6782} {"train_loss": -27.808927536010742, "global_step": 562954, "epoch": 6782} {"train_loss": -27.921070098876953, "global_step": 562955, "epoch": 6782} {"train_loss": -28.012805938720703, "global_step": 562956, "epoch": 6782} {"train_loss": -27.717931747436523, "global_step": 562957, "epoch": 6782} {"train_loss": -27.565372467041016, "global_step": 562958, "epoch": 6782} {"train_loss": -27.88266372680664, "global_step": 562959, "epoch": 6782} {"train_loss": -27.934253692626953, "global_step": 562960, "epoch": 6782} {"train_loss": -27.689926147460938, "global_step": 562961, "epoch": 6782} {"train_loss": -27.850439071655273, "global_step": 562962, "epoch": 6782} {"train_loss": -27.925146102905273, "global_step": 562963, "epoch": 6782} {"train_loss": -28.291706085205078, "global_step": 562964, "epoch": 6782} {"train_loss": -27.67983055114746, "global_step": 562965, "epoch": 6782} {"train_loss": -27.950775146484375, "global_step": 562966, "epoch": 6782} {"train_loss": -27.81353187561035, "global_step": 562967, "epoch": 6782} {"train_loss": -27.8505859375, "global_step": 562968, "epoch": 6782} {"train_loss": -28.149158477783203, "global_step": 562969, "epoch": 6782} {"train_loss": -28.113889694213867, "global_step": 562970, "epoch": 6782} {"train_loss": -27.963764190673828, "global_step": 562971, "epoch": 6782} {"train_loss": -27.6934757232666, "global_step": 562972, "epoch": 6782} {"train_loss": -27.928518295288086, "global_step": 562973, "epoch": 6782} {"train_loss": -27.813373565673828, "global_step": 562974, "epoch": 6782} {"train_loss": -28.05365562438965, "global_step": 562975, "epoch": 6782} {"train_loss": -28.071943283081055, "global_step": 562976, "epoch": 6782} {"train_loss": -28.38518714904785, "global_step": 562977, "epoch": 6782} {"train_loss": -27.847314834594727, "global_step": 562978, "epoch": 6782} {"train_loss": -27.9007625579834, "global_step": 562979, "epoch": 6782} {"train_loss": -28.271774291992188, "global_step": 562980, "epoch": 6782} {"train_loss": -27.646276473999023, "global_step": 562981, "epoch": 6782} {"train_loss": -27.926025390625, "global_step": 562982, "epoch": 6782} {"train_loss": -27.537153244018555, "global_step": 562983, "epoch": 6782} {"train_loss": -27.648345947265625, "global_step": 562984, "epoch": 6782} {"train_loss": -27.9360294342041, "global_step": 562985, "epoch": 6782} {"train_loss": -27.781768798828125, "global_step": 562986, "epoch": 6782} {"train_loss": -27.7074031829834, "global_step": 562987, "epoch": 6782} {"train_loss": -27.81691951062306, "global_step": 562988, "epoch": 6782, "val_loss": 6461228.0} {"train_loss": -27.3504581451416, "global_step": 562989, "epoch": 6783} {"train_loss": -26.449722290039062, "global_step": 562990, "epoch": 6783} {"train_loss": -25.659992218017578, "global_step": 562991, "epoch": 6783} {"train_loss": -25.897476196289062, "global_step": 562992, "epoch": 6783} {"train_loss": -27.195642471313477, "global_step": 562993, "epoch": 6783} {"train_loss": -25.775541305541992, "global_step": 562994, "epoch": 6783} {"train_loss": -26.635009765625, "global_step": 562995, "epoch": 6783} {"train_loss": -26.36183738708496, "global_step": 562996, "epoch": 6783} {"train_loss": -26.798444747924805, "global_step": 562997, "epoch": 6783} {"train_loss": -26.7568302154541, "global_step": 562998, "epoch": 6783} {"train_loss": -26.617700576782227, "global_step": 562999, "epoch": 6783} {"train_loss": -26.6888427734375, "global_step": 563000, "epoch": 6783} {"train_loss": -26.777929306030273, "global_step": 563001, "epoch": 6783} {"train_loss": -26.898670196533203, "global_step": 563002, "epoch": 6783} {"train_loss": -26.591257095336914, "global_step": 563003, "epoch": 6783} {"train_loss": -27.153051376342773, "global_step": 563004, "epoch": 6783} {"train_loss": -26.99529457092285, "global_step": 563005, "epoch": 6783} {"train_loss": -27.13315200805664, "global_step": 563006, "epoch": 6783} {"train_loss": -26.864776611328125, "global_step": 563007, "epoch": 6783} {"train_loss": -27.40357780456543, "global_step": 563008, "epoch": 6783} {"train_loss": -27.42960548400879, "global_step": 563009, "epoch": 6783} {"train_loss": -27.12725830078125, "global_step": 563010, "epoch": 6783} {"train_loss": -27.31658935546875, "global_step": 563011, "epoch": 6783} {"train_loss": -27.113880157470703, "global_step": 563012, "epoch": 6783} {"train_loss": -27.0025691986084, "global_step": 563013, "epoch": 6783} {"train_loss": -27.379901885986328, "global_step": 563014, "epoch": 6783} {"train_loss": -27.306821823120117, "global_step": 563015, "epoch": 6783} {"train_loss": -27.199085235595703, "global_step": 563016, "epoch": 6783} {"train_loss": -27.18252944946289, "global_step": 563017, "epoch": 6783} {"train_loss": -27.48299217224121, "global_step": 563018, "epoch": 6783} {"train_loss": -27.353147506713867, "global_step": 563019, "epoch": 6783} {"train_loss": -27.07875633239746, "global_step": 563020, "epoch": 6783} {"train_loss": -27.401708602905273, "global_step": 563021, "epoch": 6783} {"train_loss": -27.66773796081543, "global_step": 563022, "epoch": 6783} {"train_loss": -27.463361740112305, "global_step": 563023, "epoch": 6783} {"train_loss": -27.877521514892578, "global_step": 563024, "epoch": 6783} {"train_loss": -27.521717071533203, "global_step": 563025, "epoch": 6783} {"train_loss": -27.708362579345703, "global_step": 563026, "epoch": 6783} {"train_loss": -27.406137466430664, "global_step": 563027, "epoch": 6783} {"train_loss": -27.27508544921875, "global_step": 563028, "epoch": 6783} {"train_loss": -27.88938331604004, "global_step": 563029, "epoch": 6783} {"train_loss": -27.67474937438965, "global_step": 563030, "epoch": 6783} {"train_loss": -27.676910400390625, "global_step": 563031, "epoch": 6783} {"train_loss": -27.596582412719727, "global_step": 563032, "epoch": 6783} {"train_loss": -28.164722442626953, "global_step": 563033, "epoch": 6783} {"train_loss": -27.808984756469727, "global_step": 563034, "epoch": 6783} {"train_loss": -27.764856338500977, "global_step": 563035, "epoch": 6783} {"train_loss": -28.273523330688477, "global_step": 563036, "epoch": 6783} {"train_loss": -28.059534072875977, "global_step": 563037, "epoch": 6783} {"train_loss": -27.926198959350586, "global_step": 563038, "epoch": 6783} {"train_loss": -27.721677780151367, "global_step": 563039, "epoch": 6783} {"train_loss": -27.86256217956543, "global_step": 563040, "epoch": 6783} {"train_loss": -27.962738037109375, "global_step": 563041, "epoch": 6783} {"train_loss": -27.78449821472168, "global_step": 563042, "epoch": 6783} {"train_loss": -27.602619171142578, "global_step": 563043, "epoch": 6783} {"train_loss": -27.73211097717285, "global_step": 563044, "epoch": 6783} {"train_loss": -27.641525268554688, "global_step": 563045, "epoch": 6783} {"train_loss": -27.958288192749023, "global_step": 563046, "epoch": 6783} {"train_loss": -28.196548461914062, "global_step": 563047, "epoch": 6783} {"train_loss": -27.863998413085938, "global_step": 563048, "epoch": 6783} {"train_loss": -27.607656478881836, "global_step": 563049, "epoch": 6783} {"train_loss": -27.387271881103516, "global_step": 563050, "epoch": 6783} {"train_loss": -27.510732650756836, "global_step": 563051, "epoch": 6783} {"train_loss": -27.80377197265625, "global_step": 563052, "epoch": 6783} {"train_loss": -27.823795318603516, "global_step": 563053, "epoch": 6783} {"train_loss": -27.6720027923584, "global_step": 563054, "epoch": 6783} {"train_loss": -27.337360382080078, "global_step": 563055, "epoch": 6783} {"train_loss": -28.361576080322266, "global_step": 563056, "epoch": 6783} {"train_loss": -27.66696548461914, "global_step": 563057, "epoch": 6783} {"train_loss": -28.015888214111328, "global_step": 563058, "epoch": 6783} {"train_loss": -27.838134765625, "global_step": 563059, "epoch": 6783} {"train_loss": -27.7799015045166, "global_step": 563060, "epoch": 6783} {"train_loss": -27.767114639282227, "global_step": 563061, "epoch": 6783} {"train_loss": -27.774139404296875, "global_step": 563062, "epoch": 6783} {"train_loss": -27.66602897644043, "global_step": 563063, "epoch": 6783} {"train_loss": -28.019330978393555, "global_step": 563064, "epoch": 6783} {"train_loss": -28.031530380249023, "global_step": 563065, "epoch": 6783} {"train_loss": -27.972156524658203, "global_step": 563066, "epoch": 6783} {"train_loss": -28.084943771362305, "global_step": 563067, "epoch": 6783} {"train_loss": -28.113073348999023, "global_step": 563068, "epoch": 6783} {"train_loss": -27.938520431518555, "global_step": 563069, "epoch": 6783} {"train_loss": -28.04795265197754, "global_step": 563070, "epoch": 6783} {"train_loss": -27.45559667104698, "global_step": 563071, "epoch": 6783, "val_loss": 6443866.5} {"train_loss": -27.7291316986084, "global_step": 563072, "epoch": 6784} {"train_loss": -27.72235679626465, "global_step": 563073, "epoch": 6784} {"train_loss": -27.40424156188965, "global_step": 563074, "epoch": 6784} {"train_loss": -27.303129196166992, "global_step": 563075, "epoch": 6784} {"train_loss": -27.12727928161621, "global_step": 563076, "epoch": 6784} {"train_loss": -27.812519073486328, "global_step": 563077, "epoch": 6784} {"train_loss": -27.142210006713867, "global_step": 563078, "epoch": 6784} {"train_loss": -26.79277992248535, "global_step": 563079, "epoch": 6784} {"train_loss": -27.57795524597168, "global_step": 563080, "epoch": 6784} {"train_loss": -27.068103790283203, "global_step": 563081, "epoch": 6784} {"train_loss": -27.554288864135742, "global_step": 563082, "epoch": 6784} {"train_loss": -27.373046875, "global_step": 563083, "epoch": 6784} {"train_loss": -27.3787841796875, "global_step": 563084, "epoch": 6784} {"train_loss": -28.092493057250977, "global_step": 563085, "epoch": 6784} {"train_loss": -27.618310928344727, "global_step": 563086, "epoch": 6784} {"train_loss": -27.728036880493164, "global_step": 563087, "epoch": 6784} {"train_loss": -27.552499771118164, "global_step": 563088, "epoch": 6784} {"train_loss": -27.4572696685791, "global_step": 563089, "epoch": 6784} {"train_loss": -27.20244789123535, "global_step": 563090, "epoch": 6784} {"train_loss": -27.717864990234375, "global_step": 563091, "epoch": 6784} {"train_loss": -27.617456436157227, "global_step": 563092, "epoch": 6784} {"train_loss": -27.4790096282959, "global_step": 563093, "epoch": 6784} {"train_loss": -27.494781494140625, "global_step": 563094, "epoch": 6784} {"train_loss": -27.886014938354492, "global_step": 563095, "epoch": 6784} {"train_loss": -27.6453914642334, "global_step": 563096, "epoch": 6784} {"train_loss": -27.667205810546875, "global_step": 563097, "epoch": 6784} {"train_loss": -27.798940658569336, "global_step": 563098, "epoch": 6784} {"train_loss": -27.83461570739746, "global_step": 563099, "epoch": 6784} {"train_loss": -27.81519889831543, "global_step": 563100, "epoch": 6784} {"train_loss": -28.014596939086914, "global_step": 563101, "epoch": 6784} {"train_loss": -27.946557998657227, "global_step": 563102, "epoch": 6784} {"train_loss": -27.82801628112793, "global_step": 563103, "epoch": 6784} {"train_loss": -27.704824447631836, "global_step": 563104, "epoch": 6784} {"train_loss": -27.908666610717773, "global_step": 563105, "epoch": 6784} {"train_loss": -27.727554321289062, "global_step": 563106, "epoch": 6784} {"train_loss": -27.805328369140625, "global_step": 563107, "epoch": 6784} {"train_loss": -28.003402709960938, "global_step": 563108, "epoch": 6784} {"train_loss": -27.641138076782227, "global_step": 563109, "epoch": 6784} {"train_loss": -27.986616134643555, "global_step": 563110, "epoch": 6784} {"train_loss": -27.872638702392578, "global_step": 563111, "epoch": 6784} {"train_loss": -28.072561264038086, "global_step": 563112, "epoch": 6784} {"train_loss": -27.406864166259766, "global_step": 563113, "epoch": 6784} {"train_loss": -27.634912490844727, "global_step": 563114, "epoch": 6784} {"train_loss": -28.151090621948242, "global_step": 563115, "epoch": 6784} {"train_loss": -27.9038028717041, "global_step": 563116, "epoch": 6784} {"train_loss": -27.87361717224121, "global_step": 563117, "epoch": 6784} {"train_loss": -28.007110595703125, "global_step": 563118, "epoch": 6784} {"train_loss": -28.070775985717773, "global_step": 563119, "epoch": 6784} {"train_loss": -27.944730758666992, "global_step": 563120, "epoch": 6784} {"train_loss": -27.84686279296875, "global_step": 563121, "epoch": 6784} {"train_loss": -27.785205841064453, "global_step": 563122, "epoch": 6784} {"train_loss": -27.843692779541016, "global_step": 563123, "epoch": 6784} {"train_loss": -28.330402374267578, "global_step": 563124, "epoch": 6784} {"train_loss": -28.20784568786621, "global_step": 563125, "epoch": 6784} {"train_loss": -28.159011840820312, "global_step": 563126, "epoch": 6784} {"train_loss": -27.889739990234375, "global_step": 563127, "epoch": 6784} {"train_loss": -27.64072036743164, "global_step": 563128, "epoch": 6784} {"train_loss": -27.938806533813477, "global_step": 563129, "epoch": 6784} {"train_loss": -28.221755981445312, "global_step": 563130, "epoch": 6784} {"train_loss": -27.458398818969727, "global_step": 563131, "epoch": 6784} {"train_loss": -27.593297958374023, "global_step": 563132, "epoch": 6784} {"train_loss": -27.137928009033203, "global_step": 563133, "epoch": 6784} {"train_loss": -27.352807998657227, "global_step": 563134, "epoch": 6784} {"train_loss": -27.597400665283203, "global_step": 563135, "epoch": 6784} {"train_loss": -27.996789932250977, "global_step": 563136, "epoch": 6784} {"train_loss": -27.63825035095215, "global_step": 563137, "epoch": 6784} {"train_loss": -28.007665634155273, "global_step": 563138, "epoch": 6784} {"train_loss": -27.434316635131836, "global_step": 563139, "epoch": 6784} {"train_loss": -28.040983200073242, "global_step": 563140, "epoch": 6784} {"train_loss": -28.152490615844727, "global_step": 563141, "epoch": 6784} {"train_loss": -27.831525802612305, "global_step": 563142, "epoch": 6784} {"train_loss": -27.651813507080078, "global_step": 563143, "epoch": 6784} {"train_loss": -27.895038604736328, "global_step": 563144, "epoch": 6784} {"train_loss": -27.854751586914062, "global_step": 563145, "epoch": 6784} {"train_loss": -27.669458389282227, "global_step": 563146, "epoch": 6784} {"train_loss": -27.974294662475586, "global_step": 563147, "epoch": 6784} {"train_loss": -27.795209884643555, "global_step": 563148, "epoch": 6784} {"train_loss": -27.794452667236328, "global_step": 563149, "epoch": 6784} {"train_loss": -27.162397384643555, "global_step": 563150, "epoch": 6784} {"train_loss": -26.98561668395996, "global_step": 563151, "epoch": 6784} {"train_loss": -25.670669555664062, "global_step": 563152, "epoch": 6784} {"train_loss": -25.087833404541016, "global_step": 563153, "epoch": 6784} {"train_loss": -27.64336172356663, "global_step": 563154, "epoch": 6784, "val_loss": 6472341.0} {"train_loss": -22.24627113342285, "global_step": 563155, "epoch": 6785} {"train_loss": -25.77229118347168, "global_step": 563156, "epoch": 6785} {"train_loss": -23.619382858276367, "global_step": 563157, "epoch": 6785} {"train_loss": -25.677413940429688, "global_step": 563158, "epoch": 6785} {"train_loss": -24.344900131225586, "global_step": 563159, "epoch": 6785} {"train_loss": -25.928327560424805, "global_step": 563160, "epoch": 6785} {"train_loss": -25.866987228393555, "global_step": 563161, "epoch": 6785} {"train_loss": -25.194019317626953, "global_step": 563162, "epoch": 6785} {"train_loss": -25.98243522644043, "global_step": 563163, "epoch": 6785} {"train_loss": -26.25640869140625, "global_step": 563164, "epoch": 6785} {"train_loss": -26.027587890625, "global_step": 563165, "epoch": 6785} {"train_loss": -26.017786026000977, "global_step": 563166, "epoch": 6785} {"train_loss": -26.560195922851562, "global_step": 563167, "epoch": 6785} {"train_loss": -26.21858787536621, "global_step": 563168, "epoch": 6785} {"train_loss": -26.395971298217773, "global_step": 563169, "epoch": 6785} {"train_loss": -26.476734161376953, "global_step": 563170, "epoch": 6785} {"train_loss": -26.552356719970703, "global_step": 563171, "epoch": 6785} {"train_loss": -27.064960479736328, "global_step": 563172, "epoch": 6785} {"train_loss": -26.567813873291016, "global_step": 563173, "epoch": 6785} {"train_loss": -26.5084285736084, "global_step": 563174, "epoch": 6785} {"train_loss": -26.48597526550293, "global_step": 563175, "epoch": 6785} {"train_loss": -26.605085372924805, "global_step": 563176, "epoch": 6785} {"train_loss": -27.19672203063965, "global_step": 563177, "epoch": 6785} {"train_loss": -27.083005905151367, "global_step": 563178, "epoch": 6785} {"train_loss": -27.039459228515625, "global_step": 563179, "epoch": 6785} {"train_loss": -27.061725616455078, "global_step": 563180, "epoch": 6785} {"train_loss": -27.116321563720703, "global_step": 563181, "epoch": 6785} {"train_loss": -26.874378204345703, "global_step": 563182, "epoch": 6785} {"train_loss": -26.946552276611328, "global_step": 563183, "epoch": 6785} {"train_loss": -27.067493438720703, "global_step": 563184, "epoch": 6785} {"train_loss": -27.17134666442871, "global_step": 563185, "epoch": 6785} {"train_loss": -27.013593673706055, "global_step": 563186, "epoch": 6785} {"train_loss": -27.257038116455078, "global_step": 563187, "epoch": 6785} {"train_loss": -27.042631149291992, "global_step": 563188, "epoch": 6785} {"train_loss": -27.442737579345703, "global_step": 563189, "epoch": 6785} {"train_loss": -27.017133712768555, "global_step": 563190, "epoch": 6785} {"train_loss": -26.974111557006836, "global_step": 563191, "epoch": 6785} {"train_loss": -27.16742515563965, "global_step": 563192, "epoch": 6785} {"train_loss": -27.561450958251953, "global_step": 563193, "epoch": 6785} {"train_loss": -27.408405303955078, "global_step": 563194, "epoch": 6785} {"train_loss": -27.296722412109375, "global_step": 563195, "epoch": 6785} {"train_loss": -27.307458877563477, "global_step": 563196, "epoch": 6785} {"train_loss": -27.42291831970215, "global_step": 563197, "epoch": 6785} {"train_loss": -27.5706787109375, "global_step": 563198, "epoch": 6785} {"train_loss": -27.3378963470459, "global_step": 563199, "epoch": 6785} {"train_loss": -27.667144775390625, "global_step": 563200, "epoch": 6785} {"train_loss": -27.24704933166504, "global_step": 563201, "epoch": 6785} {"train_loss": -27.52712059020996, "global_step": 563202, "epoch": 6785} {"train_loss": -27.497028350830078, "global_step": 563203, "epoch": 6785} {"train_loss": -27.938709259033203, "global_step": 563204, "epoch": 6785} {"train_loss": -27.388906478881836, "global_step": 563205, "epoch": 6785} {"train_loss": -27.620208740234375, "global_step": 563206, "epoch": 6785} {"train_loss": -27.37177085876465, "global_step": 563207, "epoch": 6785} {"train_loss": -27.872583389282227, "global_step": 563208, "epoch": 6785} {"train_loss": -27.6324405670166, "global_step": 563209, "epoch": 6785} {"train_loss": -27.954492568969727, "global_step": 563210, "epoch": 6785} {"train_loss": -27.760961532592773, "global_step": 563211, "epoch": 6785} {"train_loss": -27.69744873046875, "global_step": 563212, "epoch": 6785} {"train_loss": -27.75660514831543, "global_step": 563213, "epoch": 6785} {"train_loss": -27.560922622680664, "global_step": 563214, "epoch": 6785} {"train_loss": -27.988616943359375, "global_step": 563215, "epoch": 6785} {"train_loss": -27.862085342407227, "global_step": 563216, "epoch": 6785} {"train_loss": -27.7520809173584, "global_step": 563217, "epoch": 6785} {"train_loss": -28.130767822265625, "global_step": 563218, "epoch": 6785} {"train_loss": -27.83246421813965, "global_step": 563219, "epoch": 6785} {"train_loss": -27.96388053894043, "global_step": 563220, "epoch": 6785} {"train_loss": -27.706045150756836, "global_step": 563221, "epoch": 6785} {"train_loss": -28.05023765563965, "global_step": 563222, "epoch": 6785} {"train_loss": -27.51738929748535, "global_step": 563223, "epoch": 6785} {"train_loss": -27.468738555908203, "global_step": 563224, "epoch": 6785} {"train_loss": -27.237646102905273, "global_step": 563225, "epoch": 6785} {"train_loss": -27.102991104125977, "global_step": 563226, "epoch": 6785} {"train_loss": -27.15730857849121, "global_step": 563227, "epoch": 6785} {"train_loss": -27.034927368164062, "global_step": 563228, "epoch": 6785} {"train_loss": -27.551319122314453, "global_step": 563229, "epoch": 6785} {"train_loss": -27.870655059814453, "global_step": 563230, "epoch": 6785} {"train_loss": -27.485132217407227, "global_step": 563231, "epoch": 6785} {"train_loss": -27.33331298828125, "global_step": 563232, "epoch": 6785} {"train_loss": -27.249536514282227, "global_step": 563233, "epoch": 6785} {"train_loss": -27.522573471069336, "global_step": 563234, "epoch": 6785} {"train_loss": -27.6131649017334, "global_step": 563235, "epoch": 6785} {"train_loss": -27.687061309814453, "global_step": 563236, "epoch": 6785} {"train_loss": -27.00893199874694, "global_step": 563237, "epoch": 6785, "val_loss": 6392229.5} {"train_loss": -26.805078506469727, "global_step": 563238, "epoch": 6786} {"train_loss": -24.527055740356445, "global_step": 563239, "epoch": 6786} {"train_loss": -26.96013832092285, "global_step": 563240, "epoch": 6786} {"train_loss": -25.71577262878418, "global_step": 563241, "epoch": 6786} {"train_loss": -26.141698837280273, "global_step": 563242, "epoch": 6786} {"train_loss": -26.49639892578125, "global_step": 563243, "epoch": 6786} {"train_loss": -26.220144271850586, "global_step": 563244, "epoch": 6786} {"train_loss": -26.722135543823242, "global_step": 563245, "epoch": 6786} {"train_loss": -26.87942886352539, "global_step": 563246, "epoch": 6786} {"train_loss": -26.769287109375, "global_step": 563247, "epoch": 6786} {"train_loss": -26.574506759643555, "global_step": 563248, "epoch": 6786} {"train_loss": -26.800546646118164, "global_step": 563249, "epoch": 6786} {"train_loss": -26.95026969909668, "global_step": 563250, "epoch": 6786} {"train_loss": -27.289997100830078, "global_step": 563251, "epoch": 6786} {"train_loss": -26.84894371032715, "global_step": 563252, "epoch": 6786} {"train_loss": -27.706008911132812, "global_step": 563253, "epoch": 6786} {"train_loss": -27.041528701782227, "global_step": 563254, "epoch": 6786} {"train_loss": -27.050596237182617, "global_step": 563255, "epoch": 6786} {"train_loss": -27.047704696655273, "global_step": 563256, "epoch": 6786} {"train_loss": -27.265745162963867, "global_step": 563257, "epoch": 6786} {"train_loss": -27.20173454284668, "global_step": 563258, "epoch": 6786} {"train_loss": -27.54804039001465, "global_step": 563259, "epoch": 6786} {"train_loss": -27.44954490661621, "global_step": 563260, "epoch": 6786} {"train_loss": -27.305389404296875, "global_step": 563261, "epoch": 6786} {"train_loss": -27.20905876159668, "global_step": 563262, "epoch": 6786} {"train_loss": -27.63671875, "global_step": 563263, "epoch": 6786} {"train_loss": -27.328125, "global_step": 563264, "epoch": 6786} {"train_loss": -27.676074981689453, "global_step": 563265, "epoch": 6786} {"train_loss": -27.567218780517578, "global_step": 563266, "epoch": 6786} {"train_loss": -27.76483154296875, "global_step": 563267, "epoch": 6786} {"train_loss": -27.35353660583496, "global_step": 563268, "epoch": 6786} {"train_loss": -27.512332916259766, "global_step": 563269, "epoch": 6786} {"train_loss": -27.38800048828125, "global_step": 563270, "epoch": 6786} {"train_loss": -27.5320987701416, "global_step": 563271, "epoch": 6786} {"train_loss": -27.30531120300293, "global_step": 563272, "epoch": 6786} {"train_loss": -27.90400505065918, "global_step": 563273, "epoch": 6786} {"train_loss": -27.62638282775879, "global_step": 563274, "epoch": 6786} {"train_loss": -27.63051414489746, "global_step": 563275, "epoch": 6786} {"train_loss": -27.360509872436523, "global_step": 563276, "epoch": 6786} {"train_loss": -27.78797721862793, "global_step": 563277, "epoch": 6786} {"train_loss": -27.77198600769043, "global_step": 563278, "epoch": 6786} {"train_loss": -27.827245712280273, "global_step": 563279, "epoch": 6786} {"train_loss": -28.022687911987305, "global_step": 563280, "epoch": 6786} {"train_loss": -27.460474014282227, "global_step": 563281, "epoch": 6786} {"train_loss": -27.99556541442871, "global_step": 563282, "epoch": 6786} {"train_loss": -27.647720336914062, "global_step": 563283, "epoch": 6786} {"train_loss": -27.656949996948242, "global_step": 563284, "epoch": 6786} {"train_loss": -27.661457061767578, "global_step": 563285, "epoch": 6786} {"train_loss": -27.728012084960938, "global_step": 563286, "epoch": 6786} {"train_loss": -27.70527458190918, "global_step": 563287, "epoch": 6786} {"train_loss": -27.5938777923584, "global_step": 563288, "epoch": 6786} {"train_loss": -27.698226928710938, "global_step": 563289, "epoch": 6786} {"train_loss": -28.141767501831055, "global_step": 563290, "epoch": 6786} {"train_loss": -28.174833297729492, "global_step": 563291, "epoch": 6786} {"train_loss": -28.134204864501953, "global_step": 563292, "epoch": 6786} {"train_loss": -27.960195541381836, "global_step": 563293, "epoch": 6786} {"train_loss": -27.71938133239746, "global_step": 563294, "epoch": 6786} {"train_loss": -27.95169448852539, "global_step": 563295, "epoch": 6786} {"train_loss": -27.863525390625, "global_step": 563296, "epoch": 6786} {"train_loss": -28.04249382019043, "global_step": 563297, "epoch": 6786} {"train_loss": -27.979230880737305, "global_step": 563298, "epoch": 6786} {"train_loss": -28.297353744506836, "global_step": 563299, "epoch": 6786} {"train_loss": -27.743789672851562, "global_step": 563300, "epoch": 6786} {"train_loss": -27.7845516204834, "global_step": 563301, "epoch": 6786} {"train_loss": -27.758121490478516, "global_step": 563302, "epoch": 6786} {"train_loss": -28.106220245361328, "global_step": 563303, "epoch": 6786} {"train_loss": -28.0907039642334, "global_step": 563304, "epoch": 6786} {"train_loss": -28.156904220581055, "global_step": 563305, "epoch": 6786} {"train_loss": -28.16962242126465, "global_step": 563306, "epoch": 6786} {"train_loss": -27.81206703186035, "global_step": 563307, "epoch": 6786} {"train_loss": -27.96071434020996, "global_step": 563308, "epoch": 6786} {"train_loss": -28.01460075378418, "global_step": 563309, "epoch": 6786} {"train_loss": -28.101062774658203, "global_step": 563310, "epoch": 6786} {"train_loss": -28.03759765625, "global_step": 563311, "epoch": 6786} {"train_loss": -28.226184844970703, "global_step": 563312, "epoch": 6786} {"train_loss": -28.0731258392334, "global_step": 563313, "epoch": 6786} {"train_loss": -27.772933959960938, "global_step": 563314, "epoch": 6786} {"train_loss": -27.855701446533203, "global_step": 563315, "epoch": 6786} {"train_loss": -27.810760498046875, "global_step": 563316, "epoch": 6786} {"train_loss": -27.321516036987305, "global_step": 563317, "epoch": 6786} {"train_loss": -27.172636032104492, "global_step": 563318, "epoch": 6786} {"train_loss": -27.325183868408203, "global_step": 563319, "epoch": 6786} {"train_loss": -27.501168469348585, "global_step": 563320, "epoch": 6786, "val_loss": 6413493.5} {"train_loss": -26.799381256103516, "global_step": 563321, "epoch": 6787} {"train_loss": -25.791418075561523, "global_step": 563322, "epoch": 6787} {"train_loss": -27.114368438720703, "global_step": 563323, "epoch": 6787} {"train_loss": -26.34153175354004, "global_step": 563324, "epoch": 6787} {"train_loss": -26.747053146362305, "global_step": 563325, "epoch": 6787} {"train_loss": -26.67180824279785, "global_step": 563326, "epoch": 6787} {"train_loss": -27.21109962463379, "global_step": 563327, "epoch": 6787} {"train_loss": -26.920379638671875, "global_step": 563328, "epoch": 6787} {"train_loss": -27.697736740112305, "global_step": 563329, "epoch": 6787} {"train_loss": -26.5497989654541, "global_step": 563330, "epoch": 6787} {"train_loss": -27.72267723083496, "global_step": 563331, "epoch": 6787} {"train_loss": -27.27199363708496, "global_step": 563332, "epoch": 6787} {"train_loss": -27.47635269165039, "global_step": 563333, "epoch": 6787} {"train_loss": -27.47907066345215, "global_step": 563334, "epoch": 6787} {"train_loss": -27.48079490661621, "global_step": 563335, "epoch": 6787} {"train_loss": -27.44105339050293, "global_step": 563336, "epoch": 6787} {"train_loss": -27.45575523376465, "global_step": 563337, "epoch": 6787} {"train_loss": -27.859281539916992, "global_step": 563338, "epoch": 6787} {"train_loss": -27.61126136779785, "global_step": 563339, "epoch": 6787} {"train_loss": -27.1954345703125, "global_step": 563340, "epoch": 6787} {"train_loss": -27.692218780517578, "global_step": 563341, "epoch": 6787} {"train_loss": -27.49002456665039, "global_step": 563342, "epoch": 6787} {"train_loss": -27.439289093017578, "global_step": 563343, "epoch": 6787} {"train_loss": -27.628433227539062, "global_step": 563344, "epoch": 6787} {"train_loss": -28.026336669921875, "global_step": 563345, "epoch": 6787} {"train_loss": -27.98636817932129, "global_step": 563346, "epoch": 6787} {"train_loss": -27.982254028320312, "global_step": 563347, "epoch": 6787} {"train_loss": -27.766315460205078, "global_step": 563348, "epoch": 6787} {"train_loss": -27.60576820373535, "global_step": 563349, "epoch": 6787} {"train_loss": -27.50962257385254, "global_step": 563350, "epoch": 6787} {"train_loss": -27.855100631713867, "global_step": 563351, "epoch": 6787} {"train_loss": -27.736703872680664, "global_step": 563352, "epoch": 6787} {"train_loss": -27.620370864868164, "global_step": 563353, "epoch": 6787} {"train_loss": -28.01631736755371, "global_step": 563354, "epoch": 6787} {"train_loss": -27.658615112304688, "global_step": 563355, "epoch": 6787} {"train_loss": -27.48136329650879, "global_step": 563356, "epoch": 6787} {"train_loss": -27.45013999938965, "global_step": 563357, "epoch": 6787} {"train_loss": -27.790851593017578, "global_step": 563358, "epoch": 6787} {"train_loss": -28.06556510925293, "global_step": 563359, "epoch": 6787} {"train_loss": -27.918842315673828, "global_step": 563360, "epoch": 6787} {"train_loss": -27.922916412353516, "global_step": 563361, "epoch": 6787} {"train_loss": -27.62562370300293, "global_step": 563362, "epoch": 6787} {"train_loss": -27.778005599975586, "global_step": 563363, "epoch": 6787} {"train_loss": -27.752548217773438, "global_step": 563364, "epoch": 6787} {"train_loss": -27.863540649414062, "global_step": 563365, "epoch": 6787} {"train_loss": -27.914581298828125, "global_step": 563366, "epoch": 6787} {"train_loss": -28.223928451538086, "global_step": 563367, "epoch": 6787} {"train_loss": -27.91227149963379, "global_step": 563368, "epoch": 6787} {"train_loss": -27.505329132080078, "global_step": 563369, "epoch": 6787} {"train_loss": -28.119709014892578, "global_step": 563370, "epoch": 6787} {"train_loss": -27.81231689453125, "global_step": 563371, "epoch": 6787} {"train_loss": -27.936426162719727, "global_step": 563372, "epoch": 6787} {"train_loss": -27.834064483642578, "global_step": 563373, "epoch": 6787} {"train_loss": -27.88519287109375, "global_step": 563374, "epoch": 6787} {"train_loss": -28.198095321655273, "global_step": 563375, "epoch": 6787} {"train_loss": -28.3663387298584, "global_step": 563376, "epoch": 6787} {"train_loss": -27.930500030517578, "global_step": 563377, "epoch": 6787} {"train_loss": -28.037689208984375, "global_step": 563378, "epoch": 6787} {"train_loss": -27.993438720703125, "global_step": 563379, "epoch": 6787} {"train_loss": -28.23465919494629, "global_step": 563380, "epoch": 6787} {"train_loss": -28.045124053955078, "global_step": 563381, "epoch": 6787} {"train_loss": -27.563568115234375, "global_step": 563382, "epoch": 6787} {"train_loss": -27.745681762695312, "global_step": 563383, "epoch": 6787} {"train_loss": -27.95098876953125, "global_step": 563384, "epoch": 6787} {"train_loss": -28.2613525390625, "global_step": 563385, "epoch": 6787} {"train_loss": -27.766555786132812, "global_step": 563386, "epoch": 6787} {"train_loss": -27.733266830444336, "global_step": 563387, "epoch": 6787} {"train_loss": -28.21180534362793, "global_step": 563388, "epoch": 6787} {"train_loss": -27.922199249267578, "global_step": 563389, "epoch": 6787} {"train_loss": -28.1223201751709, "global_step": 563390, "epoch": 6787} {"train_loss": -28.171222686767578, "global_step": 563391, "epoch": 6787} {"train_loss": -28.375577926635742, "global_step": 563392, "epoch": 6787} {"train_loss": -27.843311309814453, "global_step": 563393, "epoch": 6787} {"train_loss": -27.928747177124023, "global_step": 563394, "epoch": 6787} {"train_loss": -27.7647647857666, "global_step": 563395, "epoch": 6787} {"train_loss": -28.162084579467773, "global_step": 563396, "epoch": 6787} {"train_loss": -27.8458309173584, "global_step": 563397, "epoch": 6787} {"train_loss": -27.771413803100586, "global_step": 563398, "epoch": 6787} {"train_loss": -27.3779354095459, "global_step": 563399, "epoch": 6787} {"train_loss": -27.024169921875, "global_step": 563400, "epoch": 6787} {"train_loss": -27.47429847717285, "global_step": 563401, "epoch": 6787} {"train_loss": -27.266462326049805, "global_step": 563402, "epoch": 6787} {"train_loss": -27.646226745053948, "global_step": 563403, "epoch": 6787, "val_loss": 6449292.0} {"train_loss": -26.7891845703125, "global_step": 563404, "epoch": 6788} {"train_loss": -26.001256942749023, "global_step": 563405, "epoch": 6788} {"train_loss": -26.4500675201416, "global_step": 563406, "epoch": 6788} {"train_loss": -26.8348388671875, "global_step": 563407, "epoch": 6788} {"train_loss": -26.75360679626465, "global_step": 563408, "epoch": 6788} {"train_loss": -27.266504287719727, "global_step": 563409, "epoch": 6788} {"train_loss": -26.838361740112305, "global_step": 563410, "epoch": 6788} {"train_loss": -26.793792724609375, "global_step": 563411, "epoch": 6788} {"train_loss": -27.222532272338867, "global_step": 563412, "epoch": 6788} {"train_loss": -26.819833755493164, "global_step": 563413, "epoch": 6788} {"train_loss": -26.9188175201416, "global_step": 563414, "epoch": 6788} {"train_loss": -27.025827407836914, "global_step": 563415, "epoch": 6788} {"train_loss": -26.97174644470215, "global_step": 563416, "epoch": 6788} {"train_loss": -26.892440795898438, "global_step": 563417, "epoch": 6788} {"train_loss": -27.606143951416016, "global_step": 563418, "epoch": 6788} {"train_loss": -26.811450958251953, "global_step": 563419, "epoch": 6788} {"train_loss": -27.47882652282715, "global_step": 563420, "epoch": 6788} {"train_loss": -27.070697784423828, "global_step": 563421, "epoch": 6788} {"train_loss": -26.979511260986328, "global_step": 563422, "epoch": 6788} {"train_loss": -27.3389892578125, "global_step": 563423, "epoch": 6788} {"train_loss": -27.228185653686523, "global_step": 563424, "epoch": 6788} {"train_loss": -27.206411361694336, "global_step": 563425, "epoch": 6788} {"train_loss": -27.143341064453125, "global_step": 563426, "epoch": 6788} {"train_loss": -27.505395889282227, "global_step": 563427, "epoch": 6788} {"train_loss": -27.53605079650879, "global_step": 563428, "epoch": 6788} {"train_loss": -27.35394287109375, "global_step": 563429, "epoch": 6788} {"train_loss": -27.899545669555664, "global_step": 563430, "epoch": 6788} {"train_loss": -27.52020835876465, "global_step": 563431, "epoch": 6788} {"train_loss": -27.399494171142578, "global_step": 563432, "epoch": 6788} {"train_loss": -27.50383949279785, "global_step": 563433, "epoch": 6788} {"train_loss": -27.87103271484375, "global_step": 563434, "epoch": 6788} {"train_loss": -27.62867546081543, "global_step": 563435, "epoch": 6788} {"train_loss": -27.918989181518555, "global_step": 563436, "epoch": 6788} {"train_loss": -27.774860382080078, "global_step": 563437, "epoch": 6788} {"train_loss": -28.04123306274414, "global_step": 563438, "epoch": 6788} {"train_loss": -27.685606002807617, "global_step": 563439, "epoch": 6788} {"train_loss": -27.907318115234375, "global_step": 563440, "epoch": 6788} {"train_loss": -28.049901962280273, "global_step": 563441, "epoch": 6788} {"train_loss": -27.664630889892578, "global_step": 563442, "epoch": 6788} {"train_loss": -27.797473907470703, "global_step": 563443, "epoch": 6788} {"train_loss": -27.703784942626953, "global_step": 563444, "epoch": 6788} {"train_loss": -27.87727928161621, "global_step": 563445, "epoch": 6788} {"train_loss": -27.461668014526367, "global_step": 563446, "epoch": 6788} {"train_loss": -27.36541748046875, "global_step": 563447, "epoch": 6788} {"train_loss": -27.713714599609375, "global_step": 563448, "epoch": 6788} {"train_loss": -28.177066802978516, "global_step": 563449, "epoch": 6788} {"train_loss": -28.105804443359375, "global_step": 563450, "epoch": 6788} {"train_loss": -27.71052360534668, "global_step": 563451, "epoch": 6788} {"train_loss": -27.800931930541992, "global_step": 563452, "epoch": 6788} {"train_loss": -28.01448631286621, "global_step": 563453, "epoch": 6788} {"train_loss": -27.818164825439453, "global_step": 563454, "epoch": 6788} {"train_loss": -28.1429443359375, "global_step": 563455, "epoch": 6788} {"train_loss": -27.401945114135742, "global_step": 563456, "epoch": 6788} {"train_loss": -27.771581649780273, "global_step": 563457, "epoch": 6788} {"train_loss": -28.045215606689453, "global_step": 563458, "epoch": 6788} {"train_loss": -27.935260772705078, "global_step": 563459, "epoch": 6788} {"train_loss": -28.497953414916992, "global_step": 563460, "epoch": 6788} {"train_loss": -27.973068237304688, "global_step": 563461, "epoch": 6788} {"train_loss": -27.949726104736328, "global_step": 563462, "epoch": 6788} {"train_loss": -27.7946834564209, "global_step": 563463, "epoch": 6788} {"train_loss": -28.014562606811523, "global_step": 563464, "epoch": 6788} {"train_loss": -28.077661514282227, "global_step": 563465, "epoch": 6788} {"train_loss": -28.12531089782715, "global_step": 563466, "epoch": 6788} {"train_loss": -27.72621726989746, "global_step": 563467, "epoch": 6788} {"train_loss": -27.758270263671875, "global_step": 563468, "epoch": 6788} {"train_loss": -27.882171630859375, "global_step": 563469, "epoch": 6788} {"train_loss": -27.9551944732666, "global_step": 563470, "epoch": 6788} {"train_loss": -27.66047477722168, "global_step": 563471, "epoch": 6788} {"train_loss": -27.95821189880371, "global_step": 563472, "epoch": 6788} {"train_loss": -27.92291831970215, "global_step": 563473, "epoch": 6788} {"train_loss": -27.95728874206543, "global_step": 563474, "epoch": 6788} {"train_loss": -27.16657066345215, "global_step": 563475, "epoch": 6788} {"train_loss": -27.01485252380371, "global_step": 563476, "epoch": 6788} {"train_loss": -26.4986515045166, "global_step": 563477, "epoch": 6788} {"train_loss": -27.441930770874023, "global_step": 563478, "epoch": 6788} {"train_loss": -27.687780380249023, "global_step": 563479, "epoch": 6788} {"train_loss": -27.279455184936523, "global_step": 563480, "epoch": 6788} {"train_loss": -27.85605239868164, "global_step": 563481, "epoch": 6788} {"train_loss": -28.26197624206543, "global_step": 563482, "epoch": 6788} {"train_loss": -27.84113121032715, "global_step": 563483, "epoch": 6788} {"train_loss": -27.866331100463867, "global_step": 563484, "epoch": 6788} {"train_loss": -27.290151596069336, "global_step": 563485, "epoch": 6788} {"train_loss": -27.53146042881242, "global_step": 563486, "epoch": 6788, "val_loss": 6417011.5} {"train_loss": -27.921920776367188, "global_step": 563487, "epoch": 6789} {"train_loss": -27.72831153869629, "global_step": 563488, "epoch": 6789} {"train_loss": -27.0281982421875, "global_step": 563489, "epoch": 6789} {"train_loss": -25.617298126220703, "global_step": 563490, "epoch": 6789} {"train_loss": -25.89857292175293, "global_step": 563491, "epoch": 6789} {"train_loss": -26.938928604125977, "global_step": 563492, "epoch": 6789} {"train_loss": -27.195438385009766, "global_step": 563493, "epoch": 6789} {"train_loss": -26.27365493774414, "global_step": 563494, "epoch": 6789} {"train_loss": -27.112903594970703, "global_step": 563495, "epoch": 6789} {"train_loss": -27.032629013061523, "global_step": 563496, "epoch": 6789} {"train_loss": -26.972700119018555, "global_step": 563497, "epoch": 6789} {"train_loss": -26.80584716796875, "global_step": 563498, "epoch": 6789} {"train_loss": -26.97304344177246, "global_step": 563499, "epoch": 6789} {"train_loss": -27.475744247436523, "global_step": 563500, "epoch": 6789} {"train_loss": -27.300785064697266, "global_step": 563501, "epoch": 6789} {"train_loss": -27.5909423828125, "global_step": 563502, "epoch": 6789} {"train_loss": -27.36456871032715, "global_step": 563503, "epoch": 6789} {"train_loss": -27.275846481323242, "global_step": 563504, "epoch": 6789} {"train_loss": -27.44207191467285, "global_step": 563505, "epoch": 6789} {"train_loss": -27.271467208862305, "global_step": 563506, "epoch": 6789} {"train_loss": -27.02642822265625, "global_step": 563507, "epoch": 6789} {"train_loss": -27.403564453125, "global_step": 563508, "epoch": 6789} {"train_loss": -27.411273956298828, "global_step": 563509, "epoch": 6789} {"train_loss": -27.207706451416016, "global_step": 563510, "epoch": 6789} {"train_loss": -27.35772705078125, "global_step": 563511, "epoch": 6789} {"train_loss": -27.723926544189453, "global_step": 563512, "epoch": 6789} {"train_loss": -27.62322998046875, "global_step": 563513, "epoch": 6789} {"train_loss": -27.453824996948242, "global_step": 563514, "epoch": 6789} {"train_loss": -27.481006622314453, "global_step": 563515, "epoch": 6789} {"train_loss": -27.718595504760742, "global_step": 563516, "epoch": 6789} {"train_loss": -27.54312515258789, "global_step": 563517, "epoch": 6789} {"train_loss": -27.768041610717773, "global_step": 563518, "epoch": 6789} {"train_loss": -27.628433227539062, "global_step": 563519, "epoch": 6789} {"train_loss": -27.526636123657227, "global_step": 563520, "epoch": 6789} {"train_loss": -27.807226181030273, "global_step": 563521, "epoch": 6789} {"train_loss": -27.848363876342773, "global_step": 563522, "epoch": 6789} {"train_loss": -27.723459243774414, "global_step": 563523, "epoch": 6789} {"train_loss": -27.8778076171875, "global_step": 563524, "epoch": 6789} {"train_loss": -27.96356773376465, "global_step": 563525, "epoch": 6789} {"train_loss": -27.874143600463867, "global_step": 563526, "epoch": 6789} {"train_loss": -27.67118263244629, "global_step": 563527, "epoch": 6789} {"train_loss": -27.96400260925293, "global_step": 563528, "epoch": 6789} {"train_loss": -27.4427547454834, "global_step": 563529, "epoch": 6789} {"train_loss": -28.05354881286621, "global_step": 563530, "epoch": 6789} {"train_loss": -27.96953773498535, "global_step": 563531, "epoch": 6789} {"train_loss": -27.885822296142578, "global_step": 563532, "epoch": 6789} {"train_loss": -27.895009994506836, "global_step": 563533, "epoch": 6789} {"train_loss": -28.11467933654785, "global_step": 563534, "epoch": 6789} {"train_loss": -27.60825538635254, "global_step": 563535, "epoch": 6789} {"train_loss": -28.09746742248535, "global_step": 563536, "epoch": 6789} {"train_loss": -28.141489028930664, "global_step": 563537, "epoch": 6789} {"train_loss": -27.804126739501953, "global_step": 563538, "epoch": 6789} {"train_loss": -28.200773239135742, "global_step": 563539, "epoch": 6789} {"train_loss": -27.702987670898438, "global_step": 563540, "epoch": 6789} {"train_loss": -27.953567504882812, "global_step": 563541, "epoch": 6789} {"train_loss": -27.926746368408203, "global_step": 563542, "epoch": 6789} {"train_loss": -28.235828399658203, "global_step": 563543, "epoch": 6789} {"train_loss": -27.493793487548828, "global_step": 563544, "epoch": 6789} {"train_loss": -28.088775634765625, "global_step": 563545, "epoch": 6789} {"train_loss": -27.820592880249023, "global_step": 563546, "epoch": 6789} {"train_loss": -28.16572380065918, "global_step": 563547, "epoch": 6789} {"train_loss": -27.79693603515625, "global_step": 563548, "epoch": 6789} {"train_loss": -28.04619789123535, "global_step": 563549, "epoch": 6789} {"train_loss": -28.139936447143555, "global_step": 563550, "epoch": 6789} {"train_loss": -28.12249755859375, "global_step": 563551, "epoch": 6789} {"train_loss": -27.75873374938965, "global_step": 563552, "epoch": 6789} {"train_loss": -28.23224449157715, "global_step": 563553, "epoch": 6789} {"train_loss": -27.540571212768555, "global_step": 563554, "epoch": 6789} {"train_loss": -27.93304443359375, "global_step": 563555, "epoch": 6789} {"train_loss": -28.225454330444336, "global_step": 563556, "epoch": 6789} {"train_loss": -28.304168701171875, "global_step": 563557, "epoch": 6789} {"train_loss": -28.303730010986328, "global_step": 563558, "epoch": 6789} {"train_loss": -27.857440948486328, "global_step": 563559, "epoch": 6789} {"train_loss": -27.992359161376953, "global_step": 563560, "epoch": 6789} {"train_loss": -27.944101333618164, "global_step": 563561, "epoch": 6789} {"train_loss": -27.689844131469727, "global_step": 563562, "epoch": 6789} {"train_loss": -27.794403076171875, "global_step": 563563, "epoch": 6789} {"train_loss": -27.704572677612305, "global_step": 563564, "epoch": 6789} {"train_loss": -27.762008666992188, "global_step": 563565, "epoch": 6789} {"train_loss": -27.652753829956055, "global_step": 563566, "epoch": 6789} {"train_loss": -27.786792755126953, "global_step": 563567, "epoch": 6789} {"train_loss": -27.861356735229492, "global_step": 563568, "epoch": 6789} {"train_loss": -27.630786849791747, "global_step": 563569, "epoch": 6789, "val_loss": 6440948.5} {"train_loss": -26.946115493774414, "global_step": 563570, "epoch": 6790} {"train_loss": -27.448530197143555, "global_step": 563571, "epoch": 6790} {"train_loss": -27.137683868408203, "global_step": 563572, "epoch": 6790} {"train_loss": -27.191162109375, "global_step": 563573, "epoch": 6790} {"train_loss": -27.61639404296875, "global_step": 563574, "epoch": 6790} {"train_loss": -27.034748077392578, "global_step": 563575, "epoch": 6790} {"train_loss": -27.251922607421875, "global_step": 563576, "epoch": 6790} {"train_loss": -27.26626968383789, "global_step": 563577, "epoch": 6790} {"train_loss": -27.114423751831055, "global_step": 563578, "epoch": 6790} {"train_loss": -27.46893310546875, "global_step": 563579, "epoch": 6790} {"train_loss": -27.71480369567871, "global_step": 563580, "epoch": 6790} {"train_loss": -27.661853790283203, "global_step": 563581, "epoch": 6790} {"train_loss": -27.650671005249023, "global_step": 563582, "epoch": 6790} {"train_loss": -27.608749389648438, "global_step": 563583, "epoch": 6790} {"train_loss": -27.35968017578125, "global_step": 563584, "epoch": 6790} {"train_loss": -28.075742721557617, "global_step": 563585, "epoch": 6790} {"train_loss": -27.681446075439453, "global_step": 563586, "epoch": 6790} {"train_loss": -27.721954345703125, "global_step": 563587, "epoch": 6790} {"train_loss": -27.762439727783203, "global_step": 563588, "epoch": 6790} {"train_loss": -27.75, "global_step": 563589, "epoch": 6790} {"train_loss": -27.734786987304688, "global_step": 563590, "epoch": 6790} {"train_loss": -27.983877182006836, "global_step": 563591, "epoch": 6790} {"train_loss": -27.684133529663086, "global_step": 563592, "epoch": 6790} {"train_loss": -27.495553970336914, "global_step": 563593, "epoch": 6790} {"train_loss": -27.87027359008789, "global_step": 563594, "epoch": 6790} {"train_loss": -27.848865509033203, "global_step": 563595, "epoch": 6790} {"train_loss": -27.867816925048828, "global_step": 563596, "epoch": 6790} {"train_loss": -28.001081466674805, "global_step": 563597, "epoch": 6790} {"train_loss": -28.010690689086914, "global_step": 563598, "epoch": 6790} {"train_loss": -27.8021297454834, "global_step": 563599, "epoch": 6790} {"train_loss": -27.817975997924805, "global_step": 563600, "epoch": 6790} {"train_loss": -28.0133056640625, "global_step": 563601, "epoch": 6790} {"train_loss": -28.033472061157227, "global_step": 563602, "epoch": 6790} {"train_loss": -28.224029541015625, "global_step": 563603, "epoch": 6790} {"train_loss": -27.947555541992188, "global_step": 563604, "epoch": 6790} {"train_loss": -27.618595123291016, "global_step": 563605, "epoch": 6790} {"train_loss": -27.71538734436035, "global_step": 563606, "epoch": 6790} {"train_loss": -28.1816463470459, "global_step": 563607, "epoch": 6790} {"train_loss": -27.57562828063965, "global_step": 563608, "epoch": 6790} {"train_loss": -27.850366592407227, "global_step": 563609, "epoch": 6790} {"train_loss": -28.214399337768555, "global_step": 563610, "epoch": 6790} {"train_loss": -28.247817993164062, "global_step": 563611, "epoch": 6790} {"train_loss": -27.555662155151367, "global_step": 563612, "epoch": 6790} {"train_loss": -28.047927856445312, "global_step": 563613, "epoch": 6790} {"train_loss": -27.747711181640625, "global_step": 563614, "epoch": 6790} {"train_loss": -28.176172256469727, "global_step": 563615, "epoch": 6790} {"train_loss": -27.92872428894043, "global_step": 563616, "epoch": 6790} {"train_loss": -28.05782127380371, "global_step": 563617, "epoch": 6790} {"train_loss": -28.048587799072266, "global_step": 563618, "epoch": 6790} {"train_loss": -27.537195205688477, "global_step": 563619, "epoch": 6790} {"train_loss": -28.125476837158203, "global_step": 563620, "epoch": 6790} {"train_loss": -28.20392417907715, "global_step": 563621, "epoch": 6790} {"train_loss": -27.98140525817871, "global_step": 563622, "epoch": 6790} {"train_loss": -27.7833194732666, "global_step": 563623, "epoch": 6790} {"train_loss": -27.333486557006836, "global_step": 563624, "epoch": 6790} {"train_loss": -26.660551071166992, "global_step": 563625, "epoch": 6790} {"train_loss": -26.40144157409668, "global_step": 563626, "epoch": 6790} {"train_loss": -27.59478759765625, "global_step": 563627, "epoch": 6790} {"train_loss": -27.636356353759766, "global_step": 563628, "epoch": 6790} {"train_loss": -27.35245704650879, "global_step": 563629, "epoch": 6790} {"train_loss": -27.8236026763916, "global_step": 563630, "epoch": 6790} {"train_loss": -27.403635025024414, "global_step": 563631, "epoch": 6790} {"train_loss": -27.766742706298828, "global_step": 563632, "epoch": 6790} {"train_loss": -26.762304306030273, "global_step": 563633, "epoch": 6790} {"train_loss": -26.696624755859375, "global_step": 563634, "epoch": 6790} {"train_loss": -26.897138595581055, "global_step": 563635, "epoch": 6790} {"train_loss": -26.8225040435791, "global_step": 563636, "epoch": 6790} {"train_loss": -27.6991024017334, "global_step": 563637, "epoch": 6790} {"train_loss": -27.474206924438477, "global_step": 563638, "epoch": 6790} {"train_loss": -26.93061637878418, "global_step": 563639, "epoch": 6790} {"train_loss": -27.240217208862305, "global_step": 563640, "epoch": 6790} {"train_loss": -27.160131454467773, "global_step": 563641, "epoch": 6790} {"train_loss": -27.194955825805664, "global_step": 563642, "epoch": 6790} {"train_loss": -27.326425552368164, "global_step": 563643, "epoch": 6790} {"train_loss": -27.717365264892578, "global_step": 563644, "epoch": 6790} {"train_loss": -27.561328887939453, "global_step": 563645, "epoch": 6790} {"train_loss": -27.577035903930664, "global_step": 563646, "epoch": 6790} {"train_loss": -27.362939834594727, "global_step": 563647, "epoch": 6790} {"train_loss": -27.51148796081543, "global_step": 563648, "epoch": 6790} {"train_loss": -27.224170684814453, "global_step": 563649, "epoch": 6790} {"train_loss": -27.71894645690918, "global_step": 563650, "epoch": 6790} {"train_loss": -27.683462142944336, "global_step": 563651, "epoch": 6790} {"train_loss": -27.584281852446406, "global_step": 563652, "epoch": 6790, "val_loss": 6413612.5} {"train_loss": -27.614343643188477, "global_step": 563653, "epoch": 6791} {"train_loss": -27.370685577392578, "global_step": 563654, "epoch": 6791} {"train_loss": -27.306543350219727, "global_step": 563655, "epoch": 6791} {"train_loss": -27.299665451049805, "global_step": 563656, "epoch": 6791} {"train_loss": -27.37515640258789, "global_step": 563657, "epoch": 6791} {"train_loss": -26.70413589477539, "global_step": 563658, "epoch": 6791} {"train_loss": -26.95026206970215, "global_step": 563659, "epoch": 6791} {"train_loss": -27.512786865234375, "global_step": 563660, "epoch": 6791} {"train_loss": -27.616519927978516, "global_step": 563661, "epoch": 6791} {"train_loss": -27.37784194946289, "global_step": 563662, "epoch": 6791} {"train_loss": -27.22515869140625, "global_step": 563663, "epoch": 6791} {"train_loss": -27.734390258789062, "global_step": 563664, "epoch": 6791} {"train_loss": -27.38331413269043, "global_step": 563665, "epoch": 6791} {"train_loss": -27.4715518951416, "global_step": 563666, "epoch": 6791} {"train_loss": -27.425893783569336, "global_step": 563667, "epoch": 6791} {"train_loss": -27.443838119506836, "global_step": 563668, "epoch": 6791} {"train_loss": -27.623035430908203, "global_step": 563669, "epoch": 6791} {"train_loss": -27.45611000061035, "global_step": 563670, "epoch": 6791} {"train_loss": -27.848901748657227, "global_step": 563671, "epoch": 6791} {"train_loss": -27.61116600036621, "global_step": 563672, "epoch": 6791} {"train_loss": -27.406457901000977, "global_step": 563673, "epoch": 6791} {"train_loss": -27.827728271484375, "global_step": 563674, "epoch": 6791} {"train_loss": -27.710912704467773, "global_step": 563675, "epoch": 6791} {"train_loss": -28.008380889892578, "global_step": 563676, "epoch": 6791} {"train_loss": -27.66180419921875, "global_step": 563677, "epoch": 6791} {"train_loss": -27.476581573486328, "global_step": 563678, "epoch": 6791} {"train_loss": -27.79815673828125, "global_step": 563679, "epoch": 6791} {"train_loss": -27.955564498901367, "global_step": 563680, "epoch": 6791} {"train_loss": -27.543792724609375, "global_step": 563681, "epoch": 6791} {"train_loss": -27.679458618164062, "global_step": 563682, "epoch": 6791} {"train_loss": -28.07876968383789, "global_step": 563683, "epoch": 6791} {"train_loss": -27.734731674194336, "global_step": 563684, "epoch": 6791} {"train_loss": -27.72879981994629, "global_step": 563685, "epoch": 6791} {"train_loss": -28.12708854675293, "global_step": 563686, "epoch": 6791} {"train_loss": -27.636249542236328, "global_step": 563687, "epoch": 6791} {"train_loss": -28.156763076782227, "global_step": 563688, "epoch": 6791} {"train_loss": -28.226215362548828, "global_step": 563689, "epoch": 6791} {"train_loss": -27.780569076538086, "global_step": 563690, "epoch": 6791} {"train_loss": -28.048053741455078, "global_step": 563691, "epoch": 6791} {"train_loss": -28.061084747314453, "global_step": 563692, "epoch": 6791} {"train_loss": -28.326391220092773, "global_step": 563693, "epoch": 6791} {"train_loss": -28.042606353759766, "global_step": 563694, "epoch": 6791} {"train_loss": -27.6871280670166, "global_step": 563695, "epoch": 6791} {"train_loss": -28.01173210144043, "global_step": 563696, "epoch": 6791} {"train_loss": -27.987262725830078, "global_step": 563697, "epoch": 6791} {"train_loss": -27.730615615844727, "global_step": 563698, "epoch": 6791} {"train_loss": -27.858478546142578, "global_step": 563699, "epoch": 6791} {"train_loss": -27.509443283081055, "global_step": 563700, "epoch": 6791} {"train_loss": -27.94454002380371, "global_step": 563701, "epoch": 6791} {"train_loss": -28.00116539001465, "global_step": 563702, "epoch": 6791} {"train_loss": -28.16847038269043, "global_step": 563703, "epoch": 6791} {"train_loss": -27.983844757080078, "global_step": 563704, "epoch": 6791} {"train_loss": -27.872013092041016, "global_step": 563705, "epoch": 6791} {"train_loss": -27.7320499420166, "global_step": 563706, "epoch": 6791} {"train_loss": -27.944355010986328, "global_step": 563707, "epoch": 6791} {"train_loss": -27.894681930541992, "global_step": 563708, "epoch": 6791} {"train_loss": -28.03143882751465, "global_step": 563709, "epoch": 6791} {"train_loss": -28.04010581970215, "global_step": 563710, "epoch": 6791} {"train_loss": -28.09295654296875, "global_step": 563711, "epoch": 6791} {"train_loss": -27.884204864501953, "global_step": 563712, "epoch": 6791} {"train_loss": -28.002538681030273, "global_step": 563713, "epoch": 6791} {"train_loss": -28.019689559936523, "global_step": 563714, "epoch": 6791} {"train_loss": -28.420307159423828, "global_step": 563715, "epoch": 6791} {"train_loss": -27.598834991455078, "global_step": 563716, "epoch": 6791} {"train_loss": -27.932449340820312, "global_step": 563717, "epoch": 6791} {"train_loss": -27.97608757019043, "global_step": 563718, "epoch": 6791} {"train_loss": -27.727325439453125, "global_step": 563719, "epoch": 6791} {"train_loss": -28.160877227783203, "global_step": 563720, "epoch": 6791} {"train_loss": -28.216394424438477, "global_step": 563721, "epoch": 6791} {"train_loss": -28.113983154296875, "global_step": 563722, "epoch": 6791} {"train_loss": -27.974653244018555, "global_step": 563723, "epoch": 6791} {"train_loss": -28.408491134643555, "global_step": 563724, "epoch": 6791} {"train_loss": -28.126724243164062, "global_step": 563725, "epoch": 6791} {"train_loss": -27.952518463134766, "global_step": 563726, "epoch": 6791} {"train_loss": -28.181018829345703, "global_step": 563727, "epoch": 6791} {"train_loss": -27.752927780151367, "global_step": 563728, "epoch": 6791} {"train_loss": -28.14033317565918, "global_step": 563729, "epoch": 6791} {"train_loss": -27.963178634643555, "global_step": 563730, "epoch": 6791} {"train_loss": -27.8861141204834, "global_step": 563731, "epoch": 6791} {"train_loss": -28.0303955078125, "global_step": 563732, "epoch": 6791} {"train_loss": -28.0895938873291, "global_step": 563733, "epoch": 6791} {"train_loss": -28.4445743560791, "global_step": 563734, "epoch": 6791} {"train_loss": -27.803956548851655, "global_step": 563735, "epoch": 6791, "val_loss": 6408545.0} {"train_loss": -26.71713638305664, "global_step": 563736, "epoch": 6792} {"train_loss": -27.119138717651367, "global_step": 563737, "epoch": 6792} {"train_loss": -26.707422256469727, "global_step": 563738, "epoch": 6792} {"train_loss": -25.765317916870117, "global_step": 563739, "epoch": 6792} {"train_loss": -25.929325103759766, "global_step": 563740, "epoch": 6792} {"train_loss": -25.942829132080078, "global_step": 563741, "epoch": 6792} {"train_loss": -26.499616622924805, "global_step": 563742, "epoch": 6792} {"train_loss": -26.709821701049805, "global_step": 563743, "epoch": 6792} {"train_loss": -26.967132568359375, "global_step": 563744, "epoch": 6792} {"train_loss": -26.895172119140625, "global_step": 563745, "epoch": 6792} {"train_loss": -27.187528610229492, "global_step": 563746, "epoch": 6792} {"train_loss": -26.56191062927246, "global_step": 563747, "epoch": 6792} {"train_loss": -27.012195587158203, "global_step": 563748, "epoch": 6792} {"train_loss": -27.246564865112305, "global_step": 563749, "epoch": 6792} {"train_loss": -27.1888427734375, "global_step": 563750, "epoch": 6792} {"train_loss": -27.6746883392334, "global_step": 563751, "epoch": 6792} {"train_loss": -26.99427604675293, "global_step": 563752, "epoch": 6792} {"train_loss": -27.493549346923828, "global_step": 563753, "epoch": 6792} {"train_loss": -27.125043869018555, "global_step": 563754, "epoch": 6792} {"train_loss": -27.612390518188477, "global_step": 563755, "epoch": 6792} {"train_loss": -27.386474609375, "global_step": 563756, "epoch": 6792} {"train_loss": -27.680490493774414, "global_step": 563757, "epoch": 6792} {"train_loss": -27.360937118530273, "global_step": 563758, "epoch": 6792} {"train_loss": -27.470060348510742, "global_step": 563759, "epoch": 6792} {"train_loss": -27.877416610717773, "global_step": 563760, "epoch": 6792} {"train_loss": -27.42378807067871, "global_step": 563761, "epoch": 6792} {"train_loss": -27.609573364257812, "global_step": 563762, "epoch": 6792} {"train_loss": -27.61732292175293, "global_step": 563763, "epoch": 6792} {"train_loss": -27.724950790405273, "global_step": 563764, "epoch": 6792} {"train_loss": -27.57259178161621, "global_step": 563765, "epoch": 6792} {"train_loss": -27.429035186767578, "global_step": 563766, "epoch": 6792} {"train_loss": -27.731210708618164, "global_step": 563767, "epoch": 6792} {"train_loss": -27.620193481445312, "global_step": 563768, "epoch": 6792} {"train_loss": -27.67913246154785, "global_step": 563769, "epoch": 6792} {"train_loss": -27.8046875, "global_step": 563770, "epoch": 6792} {"train_loss": -27.902099609375, "global_step": 563771, "epoch": 6792} {"train_loss": -27.9781436920166, "global_step": 563772, "epoch": 6792} {"train_loss": -27.803613662719727, "global_step": 563773, "epoch": 6792} {"train_loss": -27.88117790222168, "global_step": 563774, "epoch": 6792} {"train_loss": -27.47161865234375, "global_step": 563775, "epoch": 6792} {"train_loss": -27.689111709594727, "global_step": 563776, "epoch": 6792} {"train_loss": -27.627948760986328, "global_step": 563777, "epoch": 6792} {"train_loss": -27.81424331665039, "global_step": 563778, "epoch": 6792} {"train_loss": -27.800342559814453, "global_step": 563779, "epoch": 6792} {"train_loss": -27.77485466003418, "global_step": 563780, "epoch": 6792} {"train_loss": -27.75164794921875, "global_step": 563781, "epoch": 6792} {"train_loss": -28.14875602722168, "global_step": 563782, "epoch": 6792} {"train_loss": -28.016372680664062, "global_step": 563783, "epoch": 6792} {"train_loss": -27.806482315063477, "global_step": 563784, "epoch": 6792} {"train_loss": -27.770660400390625, "global_step": 563785, "epoch": 6792} {"train_loss": -27.940710067749023, "global_step": 563786, "epoch": 6792} {"train_loss": -28.055017471313477, "global_step": 563787, "epoch": 6792} {"train_loss": -27.799457550048828, "global_step": 563788, "epoch": 6792} {"train_loss": -27.984994888305664, "global_step": 563789, "epoch": 6792} {"train_loss": -28.072498321533203, "global_step": 563790, "epoch": 6792} {"train_loss": -28.22725486755371, "global_step": 563791, "epoch": 6792} {"train_loss": -27.881208419799805, "global_step": 563792, "epoch": 6792} {"train_loss": -28.187143325805664, "global_step": 563793, "epoch": 6792} {"train_loss": -28.35797119140625, "global_step": 563794, "epoch": 6792} {"train_loss": -27.952640533447266, "global_step": 563795, "epoch": 6792} {"train_loss": -28.059833526611328, "global_step": 563796, "epoch": 6792} {"train_loss": -28.256994247436523, "global_step": 563797, "epoch": 6792} {"train_loss": -28.082223892211914, "global_step": 563798, "epoch": 6792} {"train_loss": -27.67909049987793, "global_step": 563799, "epoch": 6792} {"train_loss": -27.784666061401367, "global_step": 563800, "epoch": 6792} {"train_loss": -27.993167877197266, "global_step": 563801, "epoch": 6792} {"train_loss": -27.95595359802246, "global_step": 563802, "epoch": 6792} {"train_loss": -28.340015411376953, "global_step": 563803, "epoch": 6792} {"train_loss": -28.138385772705078, "global_step": 563804, "epoch": 6792} {"train_loss": -28.144285202026367, "global_step": 563805, "epoch": 6792} {"train_loss": -27.82124137878418, "global_step": 563806, "epoch": 6792} {"train_loss": -27.56271743774414, "global_step": 563807, "epoch": 6792} {"train_loss": -27.15125846862793, "global_step": 563808, "epoch": 6792} {"train_loss": -27.676166534423828, "global_step": 563809, "epoch": 6792} {"train_loss": -27.09385108947754, "global_step": 563810, "epoch": 6792} {"train_loss": -27.381580352783203, "global_step": 563811, "epoch": 6792} {"train_loss": -27.235837936401367, "global_step": 563812, "epoch": 6792} {"train_loss": -27.411001205444336, "global_step": 563813, "epoch": 6792} {"train_loss": -27.37971305847168, "global_step": 563814, "epoch": 6792} {"train_loss": -27.898757934570312, "global_step": 563815, "epoch": 6792} {"train_loss": -27.536359786987305, "global_step": 563816, "epoch": 6792} {"train_loss": -27.2058162689209, "global_step": 563817, "epoch": 6792} {"train_loss": -27.560362069003553, "global_step": 563818, "epoch": 6792, "val_loss": 6497221.5} {"train_loss": -26.570703506469727, "global_step": 563819, "epoch": 6793} {"train_loss": -26.799365997314453, "global_step": 563820, "epoch": 6793} {"train_loss": -26.709699630737305, "global_step": 563821, "epoch": 6793} {"train_loss": -26.882129669189453, "global_step": 563822, "epoch": 6793} {"train_loss": -26.570438385009766, "global_step": 563823, "epoch": 6793} {"train_loss": -26.171817779541016, "global_step": 563824, "epoch": 6793} {"train_loss": -27.18084144592285, "global_step": 563825, "epoch": 6793} {"train_loss": -27.060626983642578, "global_step": 563826, "epoch": 6793} {"train_loss": -27.13779640197754, "global_step": 563827, "epoch": 6793} {"train_loss": -26.96632194519043, "global_step": 563828, "epoch": 6793} {"train_loss": -26.758392333984375, "global_step": 563829, "epoch": 6793} {"train_loss": -27.306325912475586, "global_step": 563830, "epoch": 6793} {"train_loss": -27.39595603942871, "global_step": 563831, "epoch": 6793} {"train_loss": -26.944015502929688, "global_step": 563832, "epoch": 6793} {"train_loss": -27.142181396484375, "global_step": 563833, "epoch": 6793} {"train_loss": -27.09771728515625, "global_step": 563834, "epoch": 6793} {"train_loss": -27.550573348999023, "global_step": 563835, "epoch": 6793} {"train_loss": -27.331317901611328, "global_step": 563836, "epoch": 6793} {"train_loss": -27.2935733795166, "global_step": 563837, "epoch": 6793} {"train_loss": -27.269550323486328, "global_step": 563838, "epoch": 6793} {"train_loss": -27.292760848999023, "global_step": 563839, "epoch": 6793} {"train_loss": -27.454986572265625, "global_step": 563840, "epoch": 6793} {"train_loss": -27.47705078125, "global_step": 563841, "epoch": 6793} {"train_loss": -27.44306755065918, "global_step": 563842, "epoch": 6793} {"train_loss": -27.61981773376465, "global_step": 563843, "epoch": 6793} {"train_loss": -27.78313636779785, "global_step": 563844, "epoch": 6793} {"train_loss": -27.431859970092773, "global_step": 563845, "epoch": 6793} {"train_loss": -27.604124069213867, "global_step": 563846, "epoch": 6793} {"train_loss": -27.78790855407715, "global_step": 563847, "epoch": 6793} {"train_loss": -27.839435577392578, "global_step": 563848, "epoch": 6793} {"train_loss": -27.534576416015625, "global_step": 563849, "epoch": 6793} {"train_loss": -27.503385543823242, "global_step": 563850, "epoch": 6793} {"train_loss": -27.585519790649414, "global_step": 563851, "epoch": 6793} {"train_loss": -27.751422882080078, "global_step": 563852, "epoch": 6793} {"train_loss": -28.00282096862793, "global_step": 563853, "epoch": 6793} {"train_loss": -27.897262573242188, "global_step": 563854, "epoch": 6793} {"train_loss": -28.052576065063477, "global_step": 563855, "epoch": 6793} {"train_loss": -27.93653678894043, "global_step": 563856, "epoch": 6793} {"train_loss": -27.96030616760254, "global_step": 563857, "epoch": 6793} {"train_loss": -28.0058536529541, "global_step": 563858, "epoch": 6793} {"train_loss": -27.901031494140625, "global_step": 563859, "epoch": 6793} {"train_loss": -27.94270133972168, "global_step": 563860, "epoch": 6793} {"train_loss": -28.12263298034668, "global_step": 563861, "epoch": 6793} {"train_loss": -27.679956436157227, "global_step": 563862, "epoch": 6793} {"train_loss": -27.796964645385742, "global_step": 563863, "epoch": 6793} {"train_loss": -27.797077178955078, "global_step": 563864, "epoch": 6793} {"train_loss": -27.932126998901367, "global_step": 563865, "epoch": 6793} {"train_loss": -27.664905548095703, "global_step": 563866, "epoch": 6793} {"train_loss": -28.231836318969727, "global_step": 563867, "epoch": 6793} {"train_loss": -27.7977352142334, "global_step": 563868, "epoch": 6793} {"train_loss": -28.434667587280273, "global_step": 563869, "epoch": 6793} {"train_loss": -27.629499435424805, "global_step": 563870, "epoch": 6793} {"train_loss": -27.669172286987305, "global_step": 563871, "epoch": 6793} {"train_loss": -27.990076065063477, "global_step": 563872, "epoch": 6793} {"train_loss": -27.768518447875977, "global_step": 563873, "epoch": 6793} {"train_loss": -27.961057662963867, "global_step": 563874, "epoch": 6793} {"train_loss": -27.8846492767334, "global_step": 563875, "epoch": 6793} {"train_loss": -28.08699607849121, "global_step": 563876, "epoch": 6793} {"train_loss": -27.74738883972168, "global_step": 563877, "epoch": 6793} {"train_loss": -28.0252628326416, "global_step": 563878, "epoch": 6793} {"train_loss": -28.184070587158203, "global_step": 563879, "epoch": 6793} {"train_loss": -27.839984893798828, "global_step": 563880, "epoch": 6793} {"train_loss": -27.848403930664062, "global_step": 563881, "epoch": 6793} {"train_loss": -28.020612716674805, "global_step": 563882, "epoch": 6793} {"train_loss": -27.644927978515625, "global_step": 563883, "epoch": 6793} {"train_loss": -27.810169219970703, "global_step": 563884, "epoch": 6793} {"train_loss": -28.058643341064453, "global_step": 563885, "epoch": 6793} {"train_loss": -28.003934860229492, "global_step": 563886, "epoch": 6793} {"train_loss": -27.77262306213379, "global_step": 563887, "epoch": 6793} {"train_loss": -27.907217025756836, "global_step": 563888, "epoch": 6793} {"train_loss": -28.004995346069336, "global_step": 563889, "epoch": 6793} {"train_loss": -28.310779571533203, "global_step": 563890, "epoch": 6793} {"train_loss": -27.804279327392578, "global_step": 563891, "epoch": 6793} {"train_loss": -27.752294540405273, "global_step": 563892, "epoch": 6793} {"train_loss": -27.9771728515625, "global_step": 563893, "epoch": 6793} {"train_loss": -27.680450439453125, "global_step": 563894, "epoch": 6793} {"train_loss": -27.548141479492188, "global_step": 563895, "epoch": 6793} {"train_loss": -27.854597091674805, "global_step": 563896, "epoch": 6793} {"train_loss": -27.636798858642578, "global_step": 563897, "epoch": 6793} {"train_loss": -27.86820411682129, "global_step": 563898, "epoch": 6793} {"train_loss": -28.215890884399414, "global_step": 563899, "epoch": 6793} {"train_loss": -27.97089195251465, "global_step": 563900, "epoch": 6793} {"train_loss": -27.634789202586713, "global_step": 563901, "epoch": 6793, "val_loss": 6493411.0} {"train_loss": -27.720386505126953, "global_step": 563902, "epoch": 6794} {"train_loss": -26.971649169921875, "global_step": 563903, "epoch": 6794} {"train_loss": -27.19561195373535, "global_step": 563904, "epoch": 6794} {"train_loss": -27.481521606445312, "global_step": 563905, "epoch": 6794} {"train_loss": -27.657703399658203, "global_step": 563906, "epoch": 6794} {"train_loss": -27.296539306640625, "global_step": 563907, "epoch": 6794} {"train_loss": -26.787656784057617, "global_step": 563908, "epoch": 6794} {"train_loss": -27.94353675842285, "global_step": 563909, "epoch": 6794} {"train_loss": -27.554798126220703, "global_step": 563910, "epoch": 6794} {"train_loss": -27.486160278320312, "global_step": 563911, "epoch": 6794} {"train_loss": -27.679868698120117, "global_step": 563912, "epoch": 6794} {"train_loss": -27.498315811157227, "global_step": 563913, "epoch": 6794} {"train_loss": -27.528076171875, "global_step": 563914, "epoch": 6794} {"train_loss": -27.538726806640625, "global_step": 563915, "epoch": 6794} {"train_loss": -27.284351348876953, "global_step": 563916, "epoch": 6794} {"train_loss": -27.86280632019043, "global_step": 563917, "epoch": 6794} {"train_loss": -27.559167861938477, "global_step": 563918, "epoch": 6794} {"train_loss": -27.581470489501953, "global_step": 563919, "epoch": 6794} {"train_loss": -27.379194259643555, "global_step": 563920, "epoch": 6794} {"train_loss": -27.4956111907959, "global_step": 563921, "epoch": 6794} {"train_loss": -27.42831802368164, "global_step": 563922, "epoch": 6794} {"train_loss": -28.11651611328125, "global_step": 563923, "epoch": 6794} {"train_loss": -27.64414405822754, "global_step": 563924, "epoch": 6794} {"train_loss": -27.935791015625, "global_step": 563925, "epoch": 6794} {"train_loss": -28.241016387939453, "global_step": 563926, "epoch": 6794} {"train_loss": -27.75040054321289, "global_step": 563927, "epoch": 6794} {"train_loss": -27.586166381835938, "global_step": 563928, "epoch": 6794} {"train_loss": -27.895740509033203, "global_step": 563929, "epoch": 6794} {"train_loss": -27.65117835998535, "global_step": 563930, "epoch": 6794} {"train_loss": -28.129230499267578, "global_step": 563931, "epoch": 6794} {"train_loss": -27.813323974609375, "global_step": 563932, "epoch": 6794} {"train_loss": -27.584314346313477, "global_step": 563933, "epoch": 6794} {"train_loss": -27.466644287109375, "global_step": 563934, "epoch": 6794} {"train_loss": -27.966161727905273, "global_step": 563935, "epoch": 6794} {"train_loss": -27.769983291625977, "global_step": 563936, "epoch": 6794} {"train_loss": -27.825515747070312, "global_step": 563937, "epoch": 6794} {"train_loss": -27.720678329467773, "global_step": 563938, "epoch": 6794} {"train_loss": -27.510290145874023, "global_step": 563939, "epoch": 6794} {"train_loss": -28.069671630859375, "global_step": 563940, "epoch": 6794} {"train_loss": -28.006601333618164, "global_step": 563941, "epoch": 6794} {"train_loss": -27.832355499267578, "global_step": 563942, "epoch": 6794} {"train_loss": -27.909408569335938, "global_step": 563943, "epoch": 6794} {"train_loss": -27.7127742767334, "global_step": 563944, "epoch": 6794} {"train_loss": -27.633691787719727, "global_step": 563945, "epoch": 6794} {"train_loss": -28.110462188720703, "global_step": 563946, "epoch": 6794} {"train_loss": -27.88031005859375, "global_step": 563947, "epoch": 6794} {"train_loss": -27.91483497619629, "global_step": 563948, "epoch": 6794} {"train_loss": -28.0089111328125, "global_step": 563949, "epoch": 6794} {"train_loss": -28.096546173095703, "global_step": 563950, "epoch": 6794} {"train_loss": -27.54456901550293, "global_step": 563951, "epoch": 6794} {"train_loss": -27.958337783813477, "global_step": 563952, "epoch": 6794} {"train_loss": -27.606348037719727, "global_step": 563953, "epoch": 6794} {"train_loss": -27.442304611206055, "global_step": 563954, "epoch": 6794} {"train_loss": -27.74045753479004, "global_step": 563955, "epoch": 6794} {"train_loss": -27.57966423034668, "global_step": 563956, "epoch": 6794} {"train_loss": -28.03312110900879, "global_step": 563957, "epoch": 6794} {"train_loss": -27.864904403686523, "global_step": 563958, "epoch": 6794} {"train_loss": -27.871479034423828, "global_step": 563959, "epoch": 6794} {"train_loss": -27.75925064086914, "global_step": 563960, "epoch": 6794} {"train_loss": -27.5760498046875, "global_step": 563961, "epoch": 6794} {"train_loss": -27.768939971923828, "global_step": 563962, "epoch": 6794} {"train_loss": -27.946706771850586, "global_step": 563963, "epoch": 6794} {"train_loss": -27.97882080078125, "global_step": 563964, "epoch": 6794} {"train_loss": -27.523046493530273, "global_step": 563965, "epoch": 6794} {"train_loss": -28.061609268188477, "global_step": 563966, "epoch": 6794} {"train_loss": -27.59684181213379, "global_step": 563967, "epoch": 6794} {"train_loss": -27.7275333404541, "global_step": 563968, "epoch": 6794} {"train_loss": -27.5936336517334, "global_step": 563969, "epoch": 6794} {"train_loss": -27.807214736938477, "global_step": 563970, "epoch": 6794} {"train_loss": -27.626300811767578, "global_step": 563971, "epoch": 6794} {"train_loss": -27.666128158569336, "global_step": 563972, "epoch": 6794} {"train_loss": -27.52103042602539, "global_step": 563973, "epoch": 6794} {"train_loss": -27.363306045532227, "global_step": 563974, "epoch": 6794} {"train_loss": -27.100488662719727, "global_step": 563975, "epoch": 6794} {"train_loss": -27.160852432250977, "global_step": 563976, "epoch": 6794} {"train_loss": -27.769140243530273, "global_step": 563977, "epoch": 6794} {"train_loss": -27.286579132080078, "global_step": 563978, "epoch": 6794} {"train_loss": -27.777374267578125, "global_step": 563979, "epoch": 6794} {"train_loss": -27.474435806274414, "global_step": 563980, "epoch": 6794} {"train_loss": -27.568206787109375, "global_step": 563981, "epoch": 6794} {"train_loss": -27.723474502563477, "global_step": 563982, "epoch": 6794} {"train_loss": -28.099567413330078, "global_step": 563983, "epoch": 6794} {"train_loss": -27.696302919502717, "global_step": 563984, "epoch": 6794, "val_loss": 6515790.5} {"train_loss": -27.228925704956055, "global_step": 563985, "epoch": 6795} {"train_loss": -27.28604507446289, "global_step": 563986, "epoch": 6795} {"train_loss": -27.411447525024414, "global_step": 563987, "epoch": 6795} {"train_loss": -27.503204345703125, "global_step": 563988, "epoch": 6795} {"train_loss": -27.427539825439453, "global_step": 563989, "epoch": 6795} {"train_loss": -27.463247299194336, "global_step": 563990, "epoch": 6795} {"train_loss": -27.26910972595215, "global_step": 563991, "epoch": 6795} {"train_loss": -27.233539581298828, "global_step": 563992, "epoch": 6795} {"train_loss": -27.147504806518555, "global_step": 563993, "epoch": 6795} {"train_loss": -27.11224937438965, "global_step": 563994, "epoch": 6795} {"train_loss": -27.51069450378418, "global_step": 563995, "epoch": 6795} {"train_loss": -27.475183486938477, "global_step": 563996, "epoch": 6795} {"train_loss": -27.50617790222168, "global_step": 563997, "epoch": 6795} {"train_loss": -27.684228897094727, "global_step": 563998, "epoch": 6795} {"train_loss": -27.4560604095459, "global_step": 563999, "epoch": 6795} {"train_loss": -27.267724990844727, "global_step": 564000, "epoch": 6795} {"train_loss": -27.49049186706543, "global_step": 564001, "epoch": 6795} {"train_loss": -27.592254638671875, "global_step": 564002, "epoch": 6795} {"train_loss": -27.826892852783203, "global_step": 564003, "epoch": 6795} {"train_loss": -27.660552978515625, "global_step": 564004, "epoch": 6795} {"train_loss": -27.631555557250977, "global_step": 564005, "epoch": 6795} {"train_loss": -27.530698776245117, "global_step": 564006, "epoch": 6795} {"train_loss": -27.722436904907227, "global_step": 564007, "epoch": 6795} {"train_loss": -27.409650802612305, "global_step": 564008, "epoch": 6795} {"train_loss": -27.42127799987793, "global_step": 564009, "epoch": 6795} {"train_loss": -27.87904167175293, "global_step": 564010, "epoch": 6795} {"train_loss": -27.627851486206055, "global_step": 564011, "epoch": 6795} {"train_loss": -27.483261108398438, "global_step": 564012, "epoch": 6795} {"train_loss": -27.297805786132812, "global_step": 564013, "epoch": 6795} {"train_loss": -27.871789932250977, "global_step": 564014, "epoch": 6795} {"train_loss": -27.5483341217041, "global_step": 564015, "epoch": 6795} {"train_loss": -27.919448852539062, "global_step": 564016, "epoch": 6795} {"train_loss": -27.97450065612793, "global_step": 564017, "epoch": 6795} {"train_loss": -28.180999755859375, "global_step": 564018, "epoch": 6795} {"train_loss": -28.063520431518555, "global_step": 564019, "epoch": 6795} {"train_loss": -27.76055908203125, "global_step": 564020, "epoch": 6795} {"train_loss": -27.973295211791992, "global_step": 564021, "epoch": 6795} {"train_loss": -27.59860610961914, "global_step": 564022, "epoch": 6795} {"train_loss": -28.0896053314209, "global_step": 564023, "epoch": 6795} {"train_loss": -27.9615421295166, "global_step": 564024, "epoch": 6795} {"train_loss": -27.90323257446289, "global_step": 564025, "epoch": 6795} {"train_loss": -27.650644302368164, "global_step": 564026, "epoch": 6795} {"train_loss": -27.835901260375977, "global_step": 564027, "epoch": 6795} {"train_loss": -28.121667861938477, "global_step": 564028, "epoch": 6795} {"train_loss": -27.714792251586914, "global_step": 564029, "epoch": 6795} {"train_loss": -27.573022842407227, "global_step": 564030, "epoch": 6795} {"train_loss": -28.087024688720703, "global_step": 564031, "epoch": 6795} {"train_loss": -28.05490493774414, "global_step": 564032, "epoch": 6795} {"train_loss": -27.961042404174805, "global_step": 564033, "epoch": 6795} {"train_loss": -28.046720504760742, "global_step": 564034, "epoch": 6795} {"train_loss": -28.420886993408203, "global_step": 564035, "epoch": 6795} {"train_loss": -28.073583602905273, "global_step": 564036, "epoch": 6795} {"train_loss": -28.152637481689453, "global_step": 564037, "epoch": 6795} {"train_loss": -28.06117057800293, "global_step": 564038, "epoch": 6795} {"train_loss": -27.786624908447266, "global_step": 564039, "epoch": 6795} {"train_loss": -28.12944984436035, "global_step": 564040, "epoch": 6795} {"train_loss": -28.056949615478516, "global_step": 564041, "epoch": 6795} {"train_loss": -28.226276397705078, "global_step": 564042, "epoch": 6795} {"train_loss": -28.05401039123535, "global_step": 564043, "epoch": 6795} {"train_loss": -28.207197189331055, "global_step": 564044, "epoch": 6795} {"train_loss": -27.717824935913086, "global_step": 564045, "epoch": 6795} {"train_loss": -27.330713272094727, "global_step": 564046, "epoch": 6795} {"train_loss": -27.183141708374023, "global_step": 564047, "epoch": 6795} {"train_loss": -26.559894561767578, "global_step": 564048, "epoch": 6795} {"train_loss": -26.1944522857666, "global_step": 564049, "epoch": 6795} {"train_loss": -25.050073623657227, "global_step": 564050, "epoch": 6795} {"train_loss": -26.549819946289062, "global_step": 564051, "epoch": 6795} {"train_loss": -25.987741470336914, "global_step": 564052, "epoch": 6795} {"train_loss": -26.2426700592041, "global_step": 564053, "epoch": 6795} {"train_loss": -27.362512588500977, "global_step": 564054, "epoch": 6795} {"train_loss": -27.19838523864746, "global_step": 564055, "epoch": 6795} {"train_loss": -27.167774200439453, "global_step": 564056, "epoch": 6795} {"train_loss": -27.1636962890625, "global_step": 564057, "epoch": 6795} {"train_loss": -27.38063621520996, "global_step": 564058, "epoch": 6795} {"train_loss": -27.320383071899414, "global_step": 564059, "epoch": 6795} {"train_loss": -27.408218383789062, "global_step": 564060, "epoch": 6795} {"train_loss": -27.031421661376953, "global_step": 564061, "epoch": 6795} {"train_loss": -27.192657470703125, "global_step": 564062, "epoch": 6795} {"train_loss": -27.395612716674805, "global_step": 564063, "epoch": 6795} {"train_loss": -27.56784439086914, "global_step": 564064, "epoch": 6795} {"train_loss": -27.437335968017578, "global_step": 564065, "epoch": 6795} {"train_loss": -27.133514404296875, "global_step": 564066, "epoch": 6795} {"train_loss": -27.549094924007555, "global_step": 564067, "epoch": 6795, "val_loss": 6480557.0} {"train_loss": -26.740478515625, "global_step": 564068, "epoch": 6796} {"train_loss": -26.89155387878418, "global_step": 564069, "epoch": 6796} {"train_loss": -26.6939754486084, "global_step": 564070, "epoch": 6796} {"train_loss": -27.215118408203125, "global_step": 564071, "epoch": 6796} {"train_loss": -27.17400550842285, "global_step": 564072, "epoch": 6796} {"train_loss": -27.295751571655273, "global_step": 564073, "epoch": 6796} {"train_loss": -26.948089599609375, "global_step": 564074, "epoch": 6796} {"train_loss": -27.464025497436523, "global_step": 564075, "epoch": 6796} {"train_loss": -27.055221557617188, "global_step": 564076, "epoch": 6796} {"train_loss": -27.354196548461914, "global_step": 564077, "epoch": 6796} {"train_loss": -27.304059982299805, "global_step": 564078, "epoch": 6796} {"train_loss": -27.208032608032227, "global_step": 564079, "epoch": 6796} {"train_loss": -26.831439971923828, "global_step": 564080, "epoch": 6796} {"train_loss": -27.722156524658203, "global_step": 564081, "epoch": 6796} {"train_loss": -27.344507217407227, "global_step": 564082, "epoch": 6796} {"train_loss": -27.56429100036621, "global_step": 564083, "epoch": 6796} {"train_loss": -27.66999626159668, "global_step": 564084, "epoch": 6796} {"train_loss": -27.29168701171875, "global_step": 564085, "epoch": 6796} {"train_loss": -27.854345321655273, "global_step": 564086, "epoch": 6796} {"train_loss": -27.521299362182617, "global_step": 564087, "epoch": 6796} {"train_loss": -27.655126571655273, "global_step": 564088, "epoch": 6796} {"train_loss": -27.677764892578125, "global_step": 564089, "epoch": 6796} {"train_loss": -27.763885498046875, "global_step": 564090, "epoch": 6796} {"train_loss": -27.904830932617188, "global_step": 564091, "epoch": 6796} {"train_loss": -27.863462448120117, "global_step": 564092, "epoch": 6796} {"train_loss": -27.854297637939453, "global_step": 564093, "epoch": 6796} {"train_loss": -27.66094398498535, "global_step": 564094, "epoch": 6796} {"train_loss": -27.808841705322266, "global_step": 564095, "epoch": 6796} {"train_loss": -28.106714248657227, "global_step": 564096, "epoch": 6796} {"train_loss": -27.802387237548828, "global_step": 564097, "epoch": 6796} {"train_loss": -28.04117774963379, "global_step": 564098, "epoch": 6796} {"train_loss": -27.700490951538086, "global_step": 564099, "epoch": 6796} {"train_loss": -27.734439849853516, "global_step": 564100, "epoch": 6796} {"train_loss": -28.391321182250977, "global_step": 564101, "epoch": 6796} {"train_loss": -28.1876220703125, "global_step": 564102, "epoch": 6796} {"train_loss": -27.944751739501953, "global_step": 564103, "epoch": 6796} {"train_loss": -27.937774658203125, "global_step": 564104, "epoch": 6796} {"train_loss": -28.154218673706055, "global_step": 564105, "epoch": 6796} {"train_loss": -28.0714111328125, "global_step": 564106, "epoch": 6796} {"train_loss": -28.174962997436523, "global_step": 564107, "epoch": 6796} {"train_loss": -28.065664291381836, "global_step": 564108, "epoch": 6796} {"train_loss": -27.95587730407715, "global_step": 564109, "epoch": 6796} {"train_loss": -27.73325538635254, "global_step": 564110, "epoch": 6796} {"train_loss": -27.82783317565918, "global_step": 564111, "epoch": 6796} {"train_loss": -27.82398796081543, "global_step": 564112, "epoch": 6796} {"train_loss": -27.924091339111328, "global_step": 564113, "epoch": 6796} {"train_loss": -27.94410514831543, "global_step": 564114, "epoch": 6796} {"train_loss": -27.603376388549805, "global_step": 564115, "epoch": 6796} {"train_loss": -27.964391708374023, "global_step": 564116, "epoch": 6796} {"train_loss": -27.603015899658203, "global_step": 564117, "epoch": 6796} {"train_loss": -27.976547241210938, "global_step": 564118, "epoch": 6796} {"train_loss": -27.847570419311523, "global_step": 564119, "epoch": 6796} {"train_loss": -28.102880477905273, "global_step": 564120, "epoch": 6796} {"train_loss": -27.666015625, "global_step": 564121, "epoch": 6796} {"train_loss": -27.74273681640625, "global_step": 564122, "epoch": 6796} {"train_loss": -27.948165893554688, "global_step": 564123, "epoch": 6796} {"train_loss": -28.200693130493164, "global_step": 564124, "epoch": 6796} {"train_loss": -27.94767189025879, "global_step": 564125, "epoch": 6796} {"train_loss": -27.967947006225586, "global_step": 564126, "epoch": 6796} {"train_loss": -27.849496841430664, "global_step": 564127, "epoch": 6796} {"train_loss": -27.73636817932129, "global_step": 564128, "epoch": 6796} {"train_loss": -28.202680587768555, "global_step": 564129, "epoch": 6796} {"train_loss": -27.78130531311035, "global_step": 564130, "epoch": 6796} {"train_loss": -28.063520431518555, "global_step": 564131, "epoch": 6796} {"train_loss": -27.852319717407227, "global_step": 564132, "epoch": 6796} {"train_loss": -28.15835952758789, "global_step": 564133, "epoch": 6796} {"train_loss": -27.878875732421875, "global_step": 564134, "epoch": 6796} {"train_loss": -28.296146392822266, "global_step": 564135, "epoch": 6796} {"train_loss": -27.649255752563477, "global_step": 564136, "epoch": 6796} {"train_loss": -28.212244033813477, "global_step": 564137, "epoch": 6796} {"train_loss": -27.731985092163086, "global_step": 564138, "epoch": 6796} {"train_loss": -27.754119873046875, "global_step": 564139, "epoch": 6796} {"train_loss": -27.5239200592041, "global_step": 564140, "epoch": 6796} {"train_loss": -27.512531280517578, "global_step": 564141, "epoch": 6796} {"train_loss": -27.7825984954834, "global_step": 564142, "epoch": 6796} {"train_loss": -28.110523223876953, "global_step": 564143, "epoch": 6796} {"train_loss": -27.938812255859375, "global_step": 564144, "epoch": 6796} {"train_loss": -27.973438262939453, "global_step": 564145, "epoch": 6796} {"train_loss": -28.056543350219727, "global_step": 564146, "epoch": 6796} {"train_loss": -27.81195068359375, "global_step": 564147, "epoch": 6796} {"train_loss": -28.118513107299805, "global_step": 564148, "epoch": 6796} {"train_loss": -28.173864364624023, "global_step": 564149, "epoch": 6796} {"train_loss": -27.765960532498646, "global_step": 564150, "epoch": 6796, "val_loss": 6460270.0} {"train_loss": -27.623336791992188, "global_step": 564151, "epoch": 6797} {"train_loss": -27.55384635925293, "global_step": 564152, "epoch": 6797} {"train_loss": -27.313739776611328, "global_step": 564153, "epoch": 6797} {"train_loss": -27.66963005065918, "global_step": 564154, "epoch": 6797} {"train_loss": -27.44195556640625, "global_step": 564155, "epoch": 6797} {"train_loss": -27.99933433532715, "global_step": 564156, "epoch": 6797} {"train_loss": -27.492462158203125, "global_step": 564157, "epoch": 6797} {"train_loss": -27.487857818603516, "global_step": 564158, "epoch": 6797} {"train_loss": -27.258752822875977, "global_step": 564159, "epoch": 6797} {"train_loss": -27.25714683532715, "global_step": 564160, "epoch": 6797} {"train_loss": -27.550764083862305, "global_step": 564161, "epoch": 6797} {"train_loss": -27.448139190673828, "global_step": 564162, "epoch": 6797} {"train_loss": -27.23296546936035, "global_step": 564163, "epoch": 6797} {"train_loss": -27.396814346313477, "global_step": 564164, "epoch": 6797} {"train_loss": -27.4729061126709, "global_step": 564165, "epoch": 6797} {"train_loss": -27.4552001953125, "global_step": 564166, "epoch": 6797} {"train_loss": -27.538776397705078, "global_step": 564167, "epoch": 6797} {"train_loss": -27.571447372436523, "global_step": 564168, "epoch": 6797} {"train_loss": -27.58907127380371, "global_step": 564169, "epoch": 6797} {"train_loss": -27.097753524780273, "global_step": 564170, "epoch": 6797} {"train_loss": -27.54986572265625, "global_step": 564171, "epoch": 6797} {"train_loss": -27.521154403686523, "global_step": 564172, "epoch": 6797} {"train_loss": -27.667346954345703, "global_step": 564173, "epoch": 6797} {"train_loss": -27.669973373413086, "global_step": 564174, "epoch": 6797} {"train_loss": -28.04646110534668, "global_step": 564175, "epoch": 6797} {"train_loss": -27.770227432250977, "global_step": 564176, "epoch": 6797} {"train_loss": -27.855926513671875, "global_step": 564177, "epoch": 6797} {"train_loss": -27.8044376373291, "global_step": 564178, "epoch": 6797} {"train_loss": -28.102649688720703, "global_step": 564179, "epoch": 6797} {"train_loss": -27.586048126220703, "global_step": 564180, "epoch": 6797} {"train_loss": -27.829797744750977, "global_step": 564181, "epoch": 6797} {"train_loss": -27.46756362915039, "global_step": 564182, "epoch": 6797} {"train_loss": -27.7627010345459, "global_step": 564183, "epoch": 6797} {"train_loss": -27.790937423706055, "global_step": 564184, "epoch": 6797} {"train_loss": -28.014328002929688, "global_step": 564185, "epoch": 6797} {"train_loss": -28.326358795166016, "global_step": 564186, "epoch": 6797} {"train_loss": -27.611408233642578, "global_step": 564187, "epoch": 6797} {"train_loss": -28.027297973632812, "global_step": 564188, "epoch": 6797} {"train_loss": -27.726160049438477, "global_step": 564189, "epoch": 6797} {"train_loss": -27.954736709594727, "global_step": 564190, "epoch": 6797} {"train_loss": -27.62298011779785, "global_step": 564191, "epoch": 6797} {"train_loss": -27.60877799987793, "global_step": 564192, "epoch": 6797} {"train_loss": -27.926511764526367, "global_step": 564193, "epoch": 6797} {"train_loss": -27.852548599243164, "global_step": 564194, "epoch": 6797} {"train_loss": -27.930877685546875, "global_step": 564195, "epoch": 6797} {"train_loss": -27.9859676361084, "global_step": 564196, "epoch": 6797} {"train_loss": -27.425140380859375, "global_step": 564197, "epoch": 6797} {"train_loss": -27.70501708984375, "global_step": 564198, "epoch": 6797} {"train_loss": -27.895721435546875, "global_step": 564199, "epoch": 6797} {"train_loss": -28.106781005859375, "global_step": 564200, "epoch": 6797} {"train_loss": -28.181608200073242, "global_step": 564201, "epoch": 6797} {"train_loss": -27.751501083374023, "global_step": 564202, "epoch": 6797} {"train_loss": -27.361328125, "global_step": 564203, "epoch": 6797} {"train_loss": -27.738468170166016, "global_step": 564204, "epoch": 6797} {"train_loss": -27.60940933227539, "global_step": 564205, "epoch": 6797} {"train_loss": -27.743024826049805, "global_step": 564206, "epoch": 6797} {"train_loss": -27.96146583557129, "global_step": 564207, "epoch": 6797} {"train_loss": -28.034250259399414, "global_step": 564208, "epoch": 6797} {"train_loss": -28.118576049804688, "global_step": 564209, "epoch": 6797} {"train_loss": -28.287342071533203, "global_step": 564210, "epoch": 6797} {"train_loss": -28.21367835998535, "global_step": 564211, "epoch": 6797} {"train_loss": -28.216947555541992, "global_step": 564212, "epoch": 6797} {"train_loss": -28.03680419921875, "global_step": 564213, "epoch": 6797} {"train_loss": -28.303075790405273, "global_step": 564214, "epoch": 6797} {"train_loss": -28.09174919128418, "global_step": 564215, "epoch": 6797} {"train_loss": -28.125593185424805, "global_step": 564216, "epoch": 6797} {"train_loss": -27.606155395507812, "global_step": 564217, "epoch": 6797} {"train_loss": -28.14483642578125, "global_step": 564218, "epoch": 6797} {"train_loss": -27.97542381286621, "global_step": 564219, "epoch": 6797} {"train_loss": -27.512531280517578, "global_step": 564220, "epoch": 6797} {"train_loss": -27.74079704284668, "global_step": 564221, "epoch": 6797} {"train_loss": -27.939218521118164, "global_step": 564222, "epoch": 6797} {"train_loss": -28.081424713134766, "global_step": 564223, "epoch": 6797} {"train_loss": -27.93438720703125, "global_step": 564224, "epoch": 6797} {"train_loss": -27.836668014526367, "global_step": 564225, "epoch": 6797} {"train_loss": -27.60162925720215, "global_step": 564226, "epoch": 6797} {"train_loss": -27.88824462890625, "global_step": 564227, "epoch": 6797} {"train_loss": -28.008432388305664, "global_step": 564228, "epoch": 6797} {"train_loss": -27.54583740234375, "global_step": 564229, "epoch": 6797} {"train_loss": -27.844181060791016, "global_step": 564230, "epoch": 6797} {"train_loss": -27.8558349609375, "global_step": 564231, "epoch": 6797} {"train_loss": -27.679004669189453, "global_step": 564232, "epoch": 6797} {"train_loss": -27.755605169089442, "global_step": 564233, "epoch": 6797, "val_loss": 6438532.5} {"train_loss": -27.06446647644043, "global_step": 564234, "epoch": 6798} {"train_loss": -26.58194923400879, "global_step": 564235, "epoch": 6798} {"train_loss": -27.297855377197266, "global_step": 564236, "epoch": 6798} {"train_loss": -26.930017471313477, "global_step": 564237, "epoch": 6798} {"train_loss": -26.785938262939453, "global_step": 564238, "epoch": 6798} {"train_loss": -27.546140670776367, "global_step": 564239, "epoch": 6798} {"train_loss": -27.11310386657715, "global_step": 564240, "epoch": 6798} {"train_loss": -27.268583297729492, "global_step": 564241, "epoch": 6798} {"train_loss": -26.847930908203125, "global_step": 564242, "epoch": 6798} {"train_loss": -27.507871627807617, "global_step": 564243, "epoch": 6798} {"train_loss": -27.214618682861328, "global_step": 564244, "epoch": 6798} {"train_loss": -26.985092163085938, "global_step": 564245, "epoch": 6798} {"train_loss": -27.396841049194336, "global_step": 564246, "epoch": 6798} {"train_loss": -27.169225692749023, "global_step": 564247, "epoch": 6798} {"train_loss": -27.4241943359375, "global_step": 564248, "epoch": 6798} {"train_loss": -27.48563003540039, "global_step": 564249, "epoch": 6798} {"train_loss": -26.934873580932617, "global_step": 564250, "epoch": 6798} {"train_loss": -27.463302612304688, "global_step": 564251, "epoch": 6798} {"train_loss": -27.577768325805664, "global_step": 564252, "epoch": 6798} {"train_loss": -27.426549911499023, "global_step": 564253, "epoch": 6798} {"train_loss": -27.451492309570312, "global_step": 564254, "epoch": 6798} {"train_loss": -27.62090492248535, "global_step": 564255, "epoch": 6798} {"train_loss": -27.64930534362793, "global_step": 564256, "epoch": 6798} {"train_loss": -27.008947372436523, "global_step": 564257, "epoch": 6798} {"train_loss": -27.246915817260742, "global_step": 564258, "epoch": 6798} {"train_loss": -27.939971923828125, "global_step": 564259, "epoch": 6798} {"train_loss": -27.76558494567871, "global_step": 564260, "epoch": 6798} {"train_loss": -27.622583389282227, "global_step": 564261, "epoch": 6798} {"train_loss": -27.819799423217773, "global_step": 564262, "epoch": 6798} {"train_loss": -27.894683837890625, "global_step": 564263, "epoch": 6798} {"train_loss": -27.604663848876953, "global_step": 564264, "epoch": 6798} {"train_loss": -27.777456283569336, "global_step": 564265, "epoch": 6798} {"train_loss": -27.805234909057617, "global_step": 564266, "epoch": 6798} {"train_loss": -27.540119171142578, "global_step": 564267, "epoch": 6798} {"train_loss": -27.505502700805664, "global_step": 564268, "epoch": 6798} {"train_loss": -27.882781982421875, "global_step": 564269, "epoch": 6798} {"train_loss": -28.05548095703125, "global_step": 564270, "epoch": 6798} {"train_loss": -27.866565704345703, "global_step": 564271, "epoch": 6798} {"train_loss": -27.653181076049805, "global_step": 564272, "epoch": 6798} {"train_loss": -27.707050323486328, "global_step": 564273, "epoch": 6798} {"train_loss": -27.907424926757812, "global_step": 564274, "epoch": 6798} {"train_loss": -28.026960372924805, "global_step": 564275, "epoch": 6798} {"train_loss": -27.84891128540039, "global_step": 564276, "epoch": 6798} {"train_loss": -27.979877471923828, "global_step": 564277, "epoch": 6798} {"train_loss": -27.69452476501465, "global_step": 564278, "epoch": 6798} {"train_loss": -28.17806053161621, "global_step": 564279, "epoch": 6798} {"train_loss": -28.084217071533203, "global_step": 564280, "epoch": 6798} {"train_loss": -27.945959091186523, "global_step": 564281, "epoch": 6798} {"train_loss": -27.95102310180664, "global_step": 564282, "epoch": 6798} {"train_loss": -27.783344268798828, "global_step": 564283, "epoch": 6798} {"train_loss": -27.86530876159668, "global_step": 564284, "epoch": 6798} {"train_loss": -27.865705490112305, "global_step": 564285, "epoch": 6798} {"train_loss": -27.49090003967285, "global_step": 564286, "epoch": 6798} {"train_loss": -27.922033309936523, "global_step": 564287, "epoch": 6798} {"train_loss": -27.583972930908203, "global_step": 564288, "epoch": 6798} {"train_loss": -27.81878089904785, "global_step": 564289, "epoch": 6798} {"train_loss": -28.220407485961914, "global_step": 564290, "epoch": 6798} {"train_loss": -28.181476593017578, "global_step": 564291, "epoch": 6798} {"train_loss": -27.606582641601562, "global_step": 564292, "epoch": 6798} {"train_loss": -28.02276611328125, "global_step": 564293, "epoch": 6798} {"train_loss": -27.903608322143555, "global_step": 564294, "epoch": 6798} {"train_loss": -27.961606979370117, "global_step": 564295, "epoch": 6798} {"train_loss": -28.207706451416016, "global_step": 564296, "epoch": 6798} {"train_loss": -28.097919464111328, "global_step": 564297, "epoch": 6798} {"train_loss": -27.4343204498291, "global_step": 564298, "epoch": 6798} {"train_loss": -27.93550682067871, "global_step": 564299, "epoch": 6798} {"train_loss": -28.19313621520996, "global_step": 564300, "epoch": 6798} {"train_loss": -28.174768447875977, "global_step": 564301, "epoch": 6798} {"train_loss": -27.824951171875, "global_step": 564302, "epoch": 6798} {"train_loss": -28.122526168823242, "global_step": 564303, "epoch": 6798} {"train_loss": -27.967700958251953, "global_step": 564304, "epoch": 6798} {"train_loss": -28.07508659362793, "global_step": 564305, "epoch": 6798} {"train_loss": -28.001264572143555, "global_step": 564306, "epoch": 6798} {"train_loss": -27.564481735229492, "global_step": 564307, "epoch": 6798} {"train_loss": -28.123037338256836, "global_step": 564308, "epoch": 6798} {"train_loss": -27.788312911987305, "global_step": 564309, "epoch": 6798} {"train_loss": -28.15301513671875, "global_step": 564310, "epoch": 6798} {"train_loss": -27.712692260742188, "global_step": 564311, "epoch": 6798} {"train_loss": -28.072925567626953, "global_step": 564312, "epoch": 6798} {"train_loss": -27.87188720703125, "global_step": 564313, "epoch": 6798} {"train_loss": -27.857879638671875, "global_step": 564314, "epoch": 6798} {"train_loss": -27.75360679626465, "global_step": 564315, "epoch": 6798} {"train_loss": -27.708279621170227, "global_step": 564316, "epoch": 6798, "val_loss": 6615808.0} {"train_loss": -23.823143005371094, "global_step": 564317, "epoch": 6799} {"train_loss": -22.539743423461914, "global_step": 564318, "epoch": 6799} {"train_loss": -25.218597412109375, "global_step": 564319, "epoch": 6799} {"train_loss": -22.473865509033203, "global_step": 564320, "epoch": 6799} {"train_loss": -23.98135757446289, "global_step": 564321, "epoch": 6799} {"train_loss": -25.801013946533203, "global_step": 564322, "epoch": 6799} {"train_loss": -24.6754093170166, "global_step": 564323, "epoch": 6799} {"train_loss": -25.88041114807129, "global_step": 564324, "epoch": 6799} {"train_loss": -25.5115909576416, "global_step": 564325, "epoch": 6799} {"train_loss": -25.441707611083984, "global_step": 564326, "epoch": 6799} {"train_loss": -26.337451934814453, "global_step": 564327, "epoch": 6799} {"train_loss": -26.09164810180664, "global_step": 564328, "epoch": 6799} {"train_loss": -26.1249942779541, "global_step": 564329, "epoch": 6799} {"train_loss": -26.076725006103516, "global_step": 564330, "epoch": 6799} {"train_loss": -26.67205238342285, "global_step": 564331, "epoch": 6799} {"train_loss": -26.39166259765625, "global_step": 564332, "epoch": 6799} {"train_loss": -26.883407592773438, "global_step": 564333, "epoch": 6799} {"train_loss": -26.82622718811035, "global_step": 564334, "epoch": 6799} {"train_loss": -26.64487075805664, "global_step": 564335, "epoch": 6799} {"train_loss": -26.73868179321289, "global_step": 564336, "epoch": 6799} {"train_loss": -26.50934410095215, "global_step": 564337, "epoch": 6799} {"train_loss": -26.631732940673828, "global_step": 564338, "epoch": 6799} {"train_loss": -26.53163719177246, "global_step": 564339, "epoch": 6799} {"train_loss": -27.07948875427246, "global_step": 564340, "epoch": 6799} {"train_loss": -26.740697860717773, "global_step": 564341, "epoch": 6799} {"train_loss": -27.018177032470703, "global_step": 564342, "epoch": 6799} {"train_loss": -27.000659942626953, "global_step": 564343, "epoch": 6799} {"train_loss": -26.75674819946289, "global_step": 564344, "epoch": 6799} {"train_loss": -26.93060302734375, "global_step": 564345, "epoch": 6799} {"train_loss": -27.215412139892578, "global_step": 564346, "epoch": 6799} {"train_loss": -27.109832763671875, "global_step": 564347, "epoch": 6799} {"train_loss": -26.933801651000977, "global_step": 564348, "epoch": 6799} {"train_loss": -27.18546485900879, "global_step": 564349, "epoch": 6799} {"train_loss": -27.076099395751953, "global_step": 564350, "epoch": 6799} {"train_loss": -27.521833419799805, "global_step": 564351, "epoch": 6799} {"train_loss": -27.139636993408203, "global_step": 564352, "epoch": 6799} {"train_loss": -27.354455947875977, "global_step": 564353, "epoch": 6799} {"train_loss": -27.02963638305664, "global_step": 564354, "epoch": 6799} {"train_loss": -26.993350982666016, "global_step": 564355, "epoch": 6799} {"train_loss": -27.39522361755371, "global_step": 564356, "epoch": 6799} {"train_loss": -27.407262802124023, "global_step": 564357, "epoch": 6799} {"train_loss": -27.640783309936523, "global_step": 564358, "epoch": 6799} {"train_loss": -27.376651763916016, "global_step": 564359, "epoch": 6799} {"train_loss": -27.307310104370117, "global_step": 564360, "epoch": 6799} {"train_loss": -27.23908805847168, "global_step": 564361, "epoch": 6799} {"train_loss": -27.67644691467285, "global_step": 564362, "epoch": 6799} {"train_loss": -27.488935470581055, "global_step": 564363, "epoch": 6799} {"train_loss": -27.344953536987305, "global_step": 564364, "epoch": 6799} {"train_loss": -27.626428604125977, "global_step": 564365, "epoch": 6799} {"train_loss": -28.1064453125, "global_step": 564366, "epoch": 6799} {"train_loss": -27.621917724609375, "global_step": 564367, "epoch": 6799} {"train_loss": -27.59345054626465, "global_step": 564368, "epoch": 6799} {"train_loss": -27.972726821899414, "global_step": 564369, "epoch": 6799} {"train_loss": -27.574188232421875, "global_step": 564370, "epoch": 6799} {"train_loss": -27.52515983581543, "global_step": 564371, "epoch": 6799} {"train_loss": -27.768310546875, "global_step": 564372, "epoch": 6799} {"train_loss": -27.70432472229004, "global_step": 564373, "epoch": 6799} {"train_loss": -27.929080963134766, "global_step": 564374, "epoch": 6799} {"train_loss": -28.067502975463867, "global_step": 564375, "epoch": 6799} {"train_loss": -27.733551025390625, "global_step": 564376, "epoch": 6799} {"train_loss": -27.897735595703125, "global_step": 564377, "epoch": 6799} {"train_loss": -27.924503326416016, "global_step": 564378, "epoch": 6799} {"train_loss": -27.962982177734375, "global_step": 564379, "epoch": 6799} {"train_loss": -28.036670684814453, "global_step": 564380, "epoch": 6799} {"train_loss": -27.899316787719727, "global_step": 564381, "epoch": 6799} {"train_loss": -28.10492515563965, "global_step": 564382, "epoch": 6799} {"train_loss": -27.83375358581543, "global_step": 564383, "epoch": 6799} {"train_loss": -28.00827980041504, "global_step": 564384, "epoch": 6799} {"train_loss": -27.96059226989746, "global_step": 564385, "epoch": 6799} {"train_loss": -28.01068687438965, "global_step": 564386, "epoch": 6799} {"train_loss": -28.004867553710938, "global_step": 564387, "epoch": 6799} {"train_loss": -28.175800323486328, "global_step": 564388, "epoch": 6799} {"train_loss": -28.209613800048828, "global_step": 564389, "epoch": 6799} {"train_loss": -28.104846954345703, "global_step": 564390, "epoch": 6799} {"train_loss": -27.70090675354004, "global_step": 564391, "epoch": 6799} {"train_loss": -27.903091430664062, "global_step": 564392, "epoch": 6799} {"train_loss": -27.851181030273438, "global_step": 564393, "epoch": 6799} {"train_loss": -27.116262435913086, "global_step": 564394, "epoch": 6799} {"train_loss": -27.071744918823242, "global_step": 564395, "epoch": 6799} {"train_loss": -26.9388427734375, "global_step": 564396, "epoch": 6799} {"train_loss": -26.96949577331543, "global_step": 564397, "epoch": 6799} {"train_loss": -27.286890029907227, "global_step": 564398, "epoch": 6799} {"train_loss": -27.00323079580284, "global_step": 564399, "epoch": 6799, "val_loss": 6594220.0} {"train_loss": -26.313522338867188, "global_step": 564400, "epoch": 6800} {"train_loss": -26.643789291381836, "global_step": 564401, "epoch": 6800} {"train_loss": -27.206567764282227, "global_step": 564402, "epoch": 6800} {"train_loss": -27.149030685424805, "global_step": 564403, "epoch": 6800} {"train_loss": -27.287006378173828, "global_step": 564404, "epoch": 6800} {"train_loss": -27.47651481628418, "global_step": 564405, "epoch": 6800} {"train_loss": -26.94034767150879, "global_step": 564406, "epoch": 6800} {"train_loss": -27.000137329101562, "global_step": 564407, "epoch": 6800} {"train_loss": -27.07048988342285, "global_step": 564408, "epoch": 6800} {"train_loss": -27.23955726623535, "global_step": 564409, "epoch": 6800} {"train_loss": -27.04715347290039, "global_step": 564410, "epoch": 6800} {"train_loss": -26.733657836914062, "global_step": 564411, "epoch": 6800} {"train_loss": -27.275238037109375, "global_step": 564412, "epoch": 6800} {"train_loss": -27.373870849609375, "global_step": 564413, "epoch": 6800} {"train_loss": -27.2327880859375, "global_step": 564414, "epoch": 6800} {"train_loss": -27.199188232421875, "global_step": 564415, "epoch": 6800} {"train_loss": -27.284082412719727, "global_step": 564416, "epoch": 6800} {"train_loss": -27.89845085144043, "global_step": 564417, "epoch": 6800} {"train_loss": -27.292255401611328, "global_step": 564418, "epoch": 6800} {"train_loss": -27.469268798828125, "global_step": 564419, "epoch": 6800} {"train_loss": -27.35727310180664, "global_step": 564420, "epoch": 6800} {"train_loss": -27.405258178710938, "global_step": 564421, "epoch": 6800} {"train_loss": -27.516998291015625, "global_step": 564422, "epoch": 6800} {"train_loss": -27.619068145751953, "global_step": 564423, "epoch": 6800} {"train_loss": -27.614017486572266, "global_step": 564424, "epoch": 6800} {"train_loss": -27.325681686401367, "global_step": 564425, "epoch": 6800} {"train_loss": -27.7670955657959, "global_step": 564426, "epoch": 6800} {"train_loss": -27.7185115814209, "global_step": 564427, "epoch": 6800} {"train_loss": -27.72772789001465, "global_step": 564428, "epoch": 6800} {"train_loss": -27.56574821472168, "global_step": 564429, "epoch": 6800} {"train_loss": -27.840707778930664, "global_step": 564430, "epoch": 6800} {"train_loss": -27.796899795532227, "global_step": 564431, "epoch": 6800} {"train_loss": -27.252033233642578, "global_step": 564432, "epoch": 6800} {"train_loss": -27.619184494018555, "global_step": 564433, "epoch": 6800} {"train_loss": -27.94769287109375, "global_step": 564434, "epoch": 6800} {"train_loss": -27.43336296081543, "global_step": 564435, "epoch": 6800} {"train_loss": -27.81995964050293, "global_step": 564436, "epoch": 6800} {"train_loss": -27.88504981994629, "global_step": 564437, "epoch": 6800} {"train_loss": -27.853225708007812, "global_step": 564438, "epoch": 6800} {"train_loss": -27.50766372680664, "global_step": 564439, "epoch": 6800} {"train_loss": -27.832685470581055, "global_step": 564440, "epoch": 6800} {"train_loss": -27.948514938354492, "global_step": 564441, "epoch": 6800} {"train_loss": -27.8820743560791, "global_step": 564442, "epoch": 6800} {"train_loss": -28.099781036376953, "global_step": 564443, "epoch": 6800} {"train_loss": -27.66228675842285, "global_step": 564444, "epoch": 6800} {"train_loss": -27.776901245117188, "global_step": 564445, "epoch": 6800} {"train_loss": -27.801984786987305, "global_step": 564446, "epoch": 6800} {"train_loss": -27.66092872619629, "global_step": 564447, "epoch": 6800} {"train_loss": -28.283405303955078, "global_step": 564448, "epoch": 6800} {"train_loss": -27.749881744384766, "global_step": 564449, "epoch": 6800} {"train_loss": -27.963211059570312, "global_step": 564450, "epoch": 6800} {"train_loss": -27.75909996032715, "global_step": 564451, "epoch": 6800} {"train_loss": -28.042306900024414, "global_step": 564452, "epoch": 6800} {"train_loss": -27.845945358276367, "global_step": 564453, "epoch": 6800} {"train_loss": -27.942779541015625, "global_step": 564454, "epoch": 6800} {"train_loss": -27.80042839050293, "global_step": 564455, "epoch": 6800} {"train_loss": -27.888906478881836, "global_step": 564456, "epoch": 6800} {"train_loss": -27.8199462890625, "global_step": 564457, "epoch": 6800} {"train_loss": -27.95558738708496, "global_step": 564458, "epoch": 6800} {"train_loss": -28.093008041381836, "global_step": 564459, "epoch": 6800} {"train_loss": -27.897436141967773, "global_step": 564460, "epoch": 6800} {"train_loss": -28.1462459564209, "global_step": 564461, "epoch": 6800} {"train_loss": -27.90522575378418, "global_step": 564462, "epoch": 6800} {"train_loss": -28.19949722290039, "global_step": 564463, "epoch": 6800} {"train_loss": -27.7633113861084, "global_step": 564464, "epoch": 6800} {"train_loss": -27.60638999938965, "global_step": 564465, "epoch": 6800} {"train_loss": -28.294158935546875, "global_step": 564466, "epoch": 6800} {"train_loss": -28.03473472595215, "global_step": 564467, "epoch": 6800} {"train_loss": -27.640249252319336, "global_step": 564468, "epoch": 6800} {"train_loss": -27.759063720703125, "global_step": 564469, "epoch": 6800} {"train_loss": -27.820819854736328, "global_step": 564470, "epoch": 6800} {"train_loss": -27.548404693603516, "global_step": 564471, "epoch": 6800} {"train_loss": -28.19520378112793, "global_step": 564472, "epoch": 6800} {"train_loss": -28.105335235595703, "global_step": 564473, "epoch": 6800} {"train_loss": -27.735532760620117, "global_step": 564474, "epoch": 6800} {"train_loss": -28.037694931030273, "global_step": 564475, "epoch": 6800} {"train_loss": -27.999469757080078, "global_step": 564476, "epoch": 6800} {"train_loss": -27.926136016845703, "global_step": 564477, "epoch": 6800} {"train_loss": -27.9073543548584, "global_step": 564478, "epoch": 6800} {"train_loss": -27.509809494018555, "global_step": 564479, "epoch": 6800} {"train_loss": -28.067785263061523, "global_step": 564480, "epoch": 6800} {"train_loss": -28.045377731323242, "global_step": 564481, "epoch": 6800} {"train_loss": -27.662952790777368, "global_step": 564482, "epoch": 6800, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6615657.0} {"train_loss": -27.843067169189453, "global_step": 564483, "epoch": 6801} {"train_loss": -26.95505142211914, "global_step": 564484, "epoch": 6801} {"train_loss": -26.20746421813965, "global_step": 564485, "epoch": 6801} {"train_loss": -25.7425479888916, "global_step": 564486, "epoch": 6801} {"train_loss": -26.59038734436035, "global_step": 564487, "epoch": 6801} {"train_loss": -27.82452392578125, "global_step": 564488, "epoch": 6801} {"train_loss": -26.476404190063477, "global_step": 564489, "epoch": 6801} {"train_loss": -27.5523624420166, "global_step": 564490, "epoch": 6801} {"train_loss": -27.260101318359375, "global_step": 564491, "epoch": 6801} {"train_loss": -27.21244239807129, "global_step": 564492, "epoch": 6801} {"train_loss": -26.725461959838867, "global_step": 564493, "epoch": 6801} {"train_loss": -27.572010040283203, "global_step": 564494, "epoch": 6801} {"train_loss": -27.432188034057617, "global_step": 564495, "epoch": 6801} {"train_loss": -27.290576934814453, "global_step": 564496, "epoch": 6801} {"train_loss": -27.128820419311523, "global_step": 564497, "epoch": 6801} {"train_loss": -27.223434448242188, "global_step": 564498, "epoch": 6801} {"train_loss": -26.861398696899414, "global_step": 564499, "epoch": 6801} {"train_loss": -27.533039093017578, "global_step": 564500, "epoch": 6801} {"train_loss": -27.536914825439453, "global_step": 564501, "epoch": 6801} {"train_loss": -27.44364356994629, "global_step": 564502, "epoch": 6801} {"train_loss": -27.259496688842773, "global_step": 564503, "epoch": 6801} {"train_loss": -27.593130111694336, "global_step": 564504, "epoch": 6801} {"train_loss": -27.271005630493164, "global_step": 564505, "epoch": 6801} {"train_loss": -27.50160026550293, "global_step": 564506, "epoch": 6801} {"train_loss": -27.6383113861084, "global_step": 564507, "epoch": 6801} {"train_loss": -27.322717666625977, "global_step": 564508, "epoch": 6801} {"train_loss": -27.70545768737793, "global_step": 564509, "epoch": 6801} {"train_loss": -27.720739364624023, "global_step": 564510, "epoch": 6801} {"train_loss": -27.6340274810791, "global_step": 564511, "epoch": 6801} {"train_loss": -27.88690757751465, "global_step": 564512, "epoch": 6801} {"train_loss": -27.737451553344727, "global_step": 564513, "epoch": 6801} {"train_loss": -27.44049644470215, "global_step": 564514, "epoch": 6801} {"train_loss": -27.699548721313477, "global_step": 564515, "epoch": 6801} {"train_loss": -27.57356834411621, "global_step": 564516, "epoch": 6801} {"train_loss": -27.625051498413086, "global_step": 564517, "epoch": 6801} {"train_loss": -27.821195602416992, "global_step": 564518, "epoch": 6801} {"train_loss": -27.546640396118164, "global_step": 564519, "epoch": 6801} {"train_loss": -27.975950241088867, "global_step": 564520, "epoch": 6801} {"train_loss": -27.666208267211914, "global_step": 564521, "epoch": 6801} {"train_loss": -28.00654411315918, "global_step": 564522, "epoch": 6801} {"train_loss": -27.75775718688965, "global_step": 564523, "epoch": 6801} {"train_loss": -27.807043075561523, "global_step": 564524, "epoch": 6801} {"train_loss": -27.6987247467041, "global_step": 564525, "epoch": 6801} {"train_loss": -28.098974227905273, "global_step": 564526, "epoch": 6801} {"train_loss": -27.838821411132812, "global_step": 564527, "epoch": 6801} {"train_loss": -28.06009292602539, "global_step": 564528, "epoch": 6801} {"train_loss": -27.929885864257812, "global_step": 564529, "epoch": 6801} {"train_loss": -28.152673721313477, "global_step": 564530, "epoch": 6801} {"train_loss": -27.908721923828125, "global_step": 564531, "epoch": 6801} {"train_loss": -28.138599395751953, "global_step": 564532, "epoch": 6801} {"train_loss": -27.7839412689209, "global_step": 564533, "epoch": 6801} {"train_loss": -27.70294189453125, "global_step": 564534, "epoch": 6801} {"train_loss": -28.47808837890625, "global_step": 564535, "epoch": 6801} {"train_loss": -27.786718368530273, "global_step": 564536, "epoch": 6801} {"train_loss": -28.136930465698242, "global_step": 564537, "epoch": 6801} {"train_loss": -28.105731964111328, "global_step": 564538, "epoch": 6801} {"train_loss": -27.9378662109375, "global_step": 564539, "epoch": 6801} {"train_loss": -28.196365356445312, "global_step": 564540, "epoch": 6801} {"train_loss": -27.848743438720703, "global_step": 564541, "epoch": 6801} {"train_loss": -27.992101669311523, "global_step": 564542, "epoch": 6801} {"train_loss": -28.005523681640625, "global_step": 564543, "epoch": 6801} {"train_loss": -28.179101943969727, "global_step": 564544, "epoch": 6801} {"train_loss": -28.1038875579834, "global_step": 564545, "epoch": 6801} {"train_loss": -28.04010581970215, "global_step": 564546, "epoch": 6801} {"train_loss": -28.324005126953125, "global_step": 564547, "epoch": 6801} {"train_loss": -27.87041664123535, "global_step": 564548, "epoch": 6801} {"train_loss": -27.918380737304688, "global_step": 564549, "epoch": 6801} {"train_loss": -28.05518913269043, "global_step": 564550, "epoch": 6801} {"train_loss": -28.21705436706543, "global_step": 564551, "epoch": 6801} {"train_loss": -28.00701904296875, "global_step": 564552, "epoch": 6801} {"train_loss": -27.71284294128418, "global_step": 564553, "epoch": 6801} {"train_loss": -28.273767471313477, "global_step": 564554, "epoch": 6801} {"train_loss": -27.712255477905273, "global_step": 564555, "epoch": 6801} {"train_loss": -28.19744300842285, "global_step": 564556, "epoch": 6801} {"train_loss": -28.08247184753418, "global_step": 564557, "epoch": 6801} {"train_loss": -27.6824951171875, "global_step": 564558, "epoch": 6801} {"train_loss": -28.07063102722168, "global_step": 564559, "epoch": 6801} {"train_loss": -28.116107940673828, "global_step": 564560, "epoch": 6801} {"train_loss": -27.875995635986328, "global_step": 564561, "epoch": 6801} {"train_loss": -27.966415405273438, "global_step": 564562, "epoch": 6801} {"train_loss": -27.832763671875, "global_step": 564563, "epoch": 6801} {"train_loss": -27.601715087890625, "global_step": 564564, "epoch": 6801} {"train_loss": -27.681251824620258, "global_step": 564565, "epoch": 6801, "val_loss": 6558848.0} {"train_loss": -27.651992797851562, "global_step": 564566, "epoch": 6802} {"train_loss": -26.758575439453125, "global_step": 564567, "epoch": 6802} {"train_loss": -26.23224449157715, "global_step": 564568, "epoch": 6802} {"train_loss": -26.343732833862305, "global_step": 564569, "epoch": 6802} {"train_loss": -27.16653823852539, "global_step": 564570, "epoch": 6802} {"train_loss": -26.740930557250977, "global_step": 564571, "epoch": 6802} {"train_loss": -26.86051368713379, "global_step": 564572, "epoch": 6802} {"train_loss": -27.474048614501953, "global_step": 564573, "epoch": 6802} {"train_loss": -27.072134017944336, "global_step": 564574, "epoch": 6802} {"train_loss": -27.876611709594727, "global_step": 564575, "epoch": 6802} {"train_loss": -27.220062255859375, "global_step": 564576, "epoch": 6802} {"train_loss": -27.13559341430664, "global_step": 564577, "epoch": 6802} {"train_loss": -26.92496109008789, "global_step": 564578, "epoch": 6802} {"train_loss": -27.383081436157227, "global_step": 564579, "epoch": 6802} {"train_loss": -27.248815536499023, "global_step": 564580, "epoch": 6802} {"train_loss": -27.506174087524414, "global_step": 564581, "epoch": 6802} {"train_loss": -27.4990234375, "global_step": 564582, "epoch": 6802} {"train_loss": -27.356643676757812, "global_step": 564583, "epoch": 6802} {"train_loss": -27.5220890045166, "global_step": 564584, "epoch": 6802} {"train_loss": -27.526782989501953, "global_step": 564585, "epoch": 6802} {"train_loss": -27.552021026611328, "global_step": 564586, "epoch": 6802} {"train_loss": -27.66497802734375, "global_step": 564587, "epoch": 6802} {"train_loss": -27.875778198242188, "global_step": 564588, "epoch": 6802} {"train_loss": -27.645063400268555, "global_step": 564589, "epoch": 6802} {"train_loss": -27.734390258789062, "global_step": 564590, "epoch": 6802} {"train_loss": -27.54424476623535, "global_step": 564591, "epoch": 6802} {"train_loss": -27.780256271362305, "global_step": 564592, "epoch": 6802} {"train_loss": -27.738962173461914, "global_step": 564593, "epoch": 6802} {"train_loss": -27.36990737915039, "global_step": 564594, "epoch": 6802} {"train_loss": -27.95526123046875, "global_step": 564595, "epoch": 6802} {"train_loss": -27.537817001342773, "global_step": 564596, "epoch": 6802} {"train_loss": -27.870742797851562, "global_step": 564597, "epoch": 6802} {"train_loss": -27.608184814453125, "global_step": 564598, "epoch": 6802} {"train_loss": -27.682220458984375, "global_step": 564599, "epoch": 6802} {"train_loss": -27.84705924987793, "global_step": 564600, "epoch": 6802} {"train_loss": -27.678287506103516, "global_step": 564601, "epoch": 6802} {"train_loss": -27.41225242614746, "global_step": 564602, "epoch": 6802} {"train_loss": -28.138879776000977, "global_step": 564603, "epoch": 6802} {"train_loss": -27.79792594909668, "global_step": 564604, "epoch": 6802} {"train_loss": -27.769317626953125, "global_step": 564605, "epoch": 6802} {"train_loss": -27.687458038330078, "global_step": 564606, "epoch": 6802} {"train_loss": -27.75341796875, "global_step": 564607, "epoch": 6802} {"train_loss": -27.960041046142578, "global_step": 564608, "epoch": 6802} {"train_loss": -27.500537872314453, "global_step": 564609, "epoch": 6802} {"train_loss": -28.214099884033203, "global_step": 564610, "epoch": 6802} {"train_loss": -27.690221786499023, "global_step": 564611, "epoch": 6802} {"train_loss": -28.1362361907959, "global_step": 564612, "epoch": 6802} {"train_loss": -27.69119644165039, "global_step": 564613, "epoch": 6802} {"train_loss": -27.54172134399414, "global_step": 564614, "epoch": 6802} {"train_loss": -27.6806640625, "global_step": 564615, "epoch": 6802} {"train_loss": -27.583480834960938, "global_step": 564616, "epoch": 6802} {"train_loss": -27.763416290283203, "global_step": 564617, "epoch": 6802} {"train_loss": -27.8317928314209, "global_step": 564618, "epoch": 6802} {"train_loss": -27.689313888549805, "global_step": 564619, "epoch": 6802} {"train_loss": -27.75469970703125, "global_step": 564620, "epoch": 6802} {"train_loss": -27.8184757232666, "global_step": 564621, "epoch": 6802} {"train_loss": -27.379592895507812, "global_step": 564622, "epoch": 6802} {"train_loss": -27.417505264282227, "global_step": 564623, "epoch": 6802} {"train_loss": -27.54463768005371, "global_step": 564624, "epoch": 6802} {"train_loss": -27.860502243041992, "global_step": 564625, "epoch": 6802} {"train_loss": -27.775421142578125, "global_step": 564626, "epoch": 6802} {"train_loss": -27.708450317382812, "global_step": 564627, "epoch": 6802} {"train_loss": -27.506940841674805, "global_step": 564628, "epoch": 6802} {"train_loss": -27.868310928344727, "global_step": 564629, "epoch": 6802} {"train_loss": -27.817489624023438, "global_step": 564630, "epoch": 6802} {"train_loss": -27.605443954467773, "global_step": 564631, "epoch": 6802} {"train_loss": -27.963163375854492, "global_step": 564632, "epoch": 6802} {"train_loss": -27.366058349609375, "global_step": 564633, "epoch": 6802} {"train_loss": -27.660993576049805, "global_step": 564634, "epoch": 6802} {"train_loss": -27.705915451049805, "global_step": 564635, "epoch": 6802} {"train_loss": -27.891956329345703, "global_step": 564636, "epoch": 6802} {"train_loss": -27.94343376159668, "global_step": 564637, "epoch": 6802} {"train_loss": -27.840057373046875, "global_step": 564638, "epoch": 6802} {"train_loss": -28.0904598236084, "global_step": 564639, "epoch": 6802} {"train_loss": -27.795331954956055, "global_step": 564640, "epoch": 6802} {"train_loss": -28.0339412689209, "global_step": 564641, "epoch": 6802} {"train_loss": -28.017133712768555, "global_step": 564642, "epoch": 6802} {"train_loss": -27.6424560546875, "global_step": 564643, "epoch": 6802} {"train_loss": -27.99049186706543, "global_step": 564644, "epoch": 6802} {"train_loss": -28.030990600585938, "global_step": 564645, "epoch": 6802} {"train_loss": -27.991729736328125, "global_step": 564646, "epoch": 6802} {"train_loss": -27.839923858642578, "global_step": 564647, "epoch": 6802} {"train_loss": -27.62233612336308, "global_step": 564648, "epoch": 6802, "val_loss": 6582042.0} {"train_loss": -26.9157657623291, "global_step": 564649, "epoch": 6803} {"train_loss": -26.637115478515625, "global_step": 564650, "epoch": 6803} {"train_loss": -27.281909942626953, "global_step": 564651, "epoch": 6803} {"train_loss": -27.07048988342285, "global_step": 564652, "epoch": 6803} {"train_loss": -26.829059600830078, "global_step": 564653, "epoch": 6803} {"train_loss": -27.10627555847168, "global_step": 564654, "epoch": 6803} {"train_loss": -27.43174171447754, "global_step": 564655, "epoch": 6803} {"train_loss": -27.358922958374023, "global_step": 564656, "epoch": 6803} {"train_loss": -27.515018463134766, "global_step": 564657, "epoch": 6803} {"train_loss": -27.308950424194336, "global_step": 564658, "epoch": 6803} {"train_loss": -27.527851104736328, "global_step": 564659, "epoch": 6803} {"train_loss": -27.5706844329834, "global_step": 564660, "epoch": 6803} {"train_loss": -27.63897132873535, "global_step": 564661, "epoch": 6803} {"train_loss": -27.3184757232666, "global_step": 564662, "epoch": 6803} {"train_loss": -27.567697525024414, "global_step": 564663, "epoch": 6803} {"train_loss": -27.767377853393555, "global_step": 564664, "epoch": 6803} {"train_loss": -27.90610694885254, "global_step": 564665, "epoch": 6803} {"train_loss": -27.790847778320312, "global_step": 564666, "epoch": 6803} {"train_loss": -27.660863876342773, "global_step": 564667, "epoch": 6803} {"train_loss": -27.658349990844727, "global_step": 564668, "epoch": 6803} {"train_loss": -27.85373878479004, "global_step": 564669, "epoch": 6803} {"train_loss": -27.620410919189453, "global_step": 564670, "epoch": 6803} {"train_loss": -27.507537841796875, "global_step": 564671, "epoch": 6803} {"train_loss": -27.841318130493164, "global_step": 564672, "epoch": 6803} {"train_loss": -27.474639892578125, "global_step": 564673, "epoch": 6803} {"train_loss": -27.90130043029785, "global_step": 564674, "epoch": 6803} {"train_loss": -27.762975692749023, "global_step": 564675, "epoch": 6803} {"train_loss": -27.892255783081055, "global_step": 564676, "epoch": 6803} {"train_loss": -28.097675323486328, "global_step": 564677, "epoch": 6803} {"train_loss": -28.182891845703125, "global_step": 564678, "epoch": 6803} {"train_loss": -27.544025421142578, "global_step": 564679, "epoch": 6803} {"train_loss": -27.9396915435791, "global_step": 564680, "epoch": 6803} {"train_loss": -28.02618408203125, "global_step": 564681, "epoch": 6803} {"train_loss": -27.692508697509766, "global_step": 564682, "epoch": 6803} {"train_loss": -28.2739200592041, "global_step": 564683, "epoch": 6803} {"train_loss": -27.976287841796875, "global_step": 564684, "epoch": 6803} {"train_loss": -28.080839157104492, "global_step": 564685, "epoch": 6803} {"train_loss": -28.03241539001465, "global_step": 564686, "epoch": 6803} {"train_loss": -27.8217716217041, "global_step": 564687, "epoch": 6803} {"train_loss": -28.134063720703125, "global_step": 564688, "epoch": 6803} {"train_loss": -27.777387619018555, "global_step": 564689, "epoch": 6803} {"train_loss": -28.000097274780273, "global_step": 564690, "epoch": 6803} {"train_loss": -27.953760147094727, "global_step": 564691, "epoch": 6803} {"train_loss": -28.572858810424805, "global_step": 564692, "epoch": 6803} {"train_loss": -27.627155303955078, "global_step": 564693, "epoch": 6803} {"train_loss": -27.721424102783203, "global_step": 564694, "epoch": 6803} {"train_loss": -27.798187255859375, "global_step": 564695, "epoch": 6803} {"train_loss": -27.53058433532715, "global_step": 564696, "epoch": 6803} {"train_loss": -27.966169357299805, "global_step": 564697, "epoch": 6803} {"train_loss": -27.648670196533203, "global_step": 564698, "epoch": 6803} {"train_loss": -27.8670654296875, "global_step": 564699, "epoch": 6803} {"train_loss": -27.653064727783203, "global_step": 564700, "epoch": 6803} {"train_loss": -28.134815216064453, "global_step": 564701, "epoch": 6803} {"train_loss": -27.929590225219727, "global_step": 564702, "epoch": 6803} {"train_loss": -27.829992294311523, "global_step": 564703, "epoch": 6803} {"train_loss": -27.64117431640625, "global_step": 564704, "epoch": 6803} {"train_loss": -27.4481143951416, "global_step": 564705, "epoch": 6803} {"train_loss": -27.817075729370117, "global_step": 564706, "epoch": 6803} {"train_loss": -28.243335723876953, "global_step": 564707, "epoch": 6803} {"train_loss": -27.295522689819336, "global_step": 564708, "epoch": 6803} {"train_loss": -27.20261001586914, "global_step": 564709, "epoch": 6803} {"train_loss": -28.02155876159668, "global_step": 564710, "epoch": 6803} {"train_loss": -27.75396156311035, "global_step": 564711, "epoch": 6803} {"train_loss": -27.630537033081055, "global_step": 564712, "epoch": 6803} {"train_loss": -27.784391403198242, "global_step": 564713, "epoch": 6803} {"train_loss": -27.524566650390625, "global_step": 564714, "epoch": 6803} {"train_loss": -28.079328536987305, "global_step": 564715, "epoch": 6803} {"train_loss": -27.666656494140625, "global_step": 564716, "epoch": 6803} {"train_loss": -28.08985710144043, "global_step": 564717, "epoch": 6803} {"train_loss": -27.6148738861084, "global_step": 564718, "epoch": 6803} {"train_loss": -27.897306442260742, "global_step": 564719, "epoch": 6803} {"train_loss": -27.942337036132812, "global_step": 564720, "epoch": 6803} {"train_loss": -28.005781173706055, "global_step": 564721, "epoch": 6803} {"train_loss": -27.694873809814453, "global_step": 564722, "epoch": 6803} {"train_loss": -27.4943790435791, "global_step": 564723, "epoch": 6803} {"train_loss": -28.053571701049805, "global_step": 564724, "epoch": 6803} {"train_loss": -27.561460494995117, "global_step": 564725, "epoch": 6803} {"train_loss": -28.01955223083496, "global_step": 564726, "epoch": 6803} {"train_loss": -27.689367294311523, "global_step": 564727, "epoch": 6803} {"train_loss": -27.4323673248291, "global_step": 564728, "epoch": 6803} {"train_loss": -27.62788200378418, "global_step": 564729, "epoch": 6803} {"train_loss": -28.211225509643555, "global_step": 564730, "epoch": 6803} {"train_loss": -27.713900554611023, "global_step": 564731, "epoch": 6803, "val_loss": 6597451.0} {"train_loss": -27.646484375, "global_step": 564732, "epoch": 6804} {"train_loss": -27.23182487487793, "global_step": 564733, "epoch": 6804} {"train_loss": -27.33479881286621, "global_step": 564734, "epoch": 6804} {"train_loss": -27.711750030517578, "global_step": 564735, "epoch": 6804} {"train_loss": -27.26556396484375, "global_step": 564736, "epoch": 6804} {"train_loss": -27.013532638549805, "global_step": 564737, "epoch": 6804} {"train_loss": -27.085275650024414, "global_step": 564738, "epoch": 6804} {"train_loss": -26.597131729125977, "global_step": 564739, "epoch": 6804} {"train_loss": -27.3909969329834, "global_step": 564740, "epoch": 6804} {"train_loss": -26.958999633789062, "global_step": 564741, "epoch": 6804} {"train_loss": -27.41057777404785, "global_step": 564742, "epoch": 6804} {"train_loss": -27.35500144958496, "global_step": 564743, "epoch": 6804} {"train_loss": -27.0643253326416, "global_step": 564744, "epoch": 6804} {"train_loss": -27.44111442565918, "global_step": 564745, "epoch": 6804} {"train_loss": -27.50288963317871, "global_step": 564746, "epoch": 6804} {"train_loss": -27.52565574645996, "global_step": 564747, "epoch": 6804} {"train_loss": -27.391630172729492, "global_step": 564748, "epoch": 6804} {"train_loss": -27.23883056640625, "global_step": 564749, "epoch": 6804} {"train_loss": -27.489465713500977, "global_step": 564750, "epoch": 6804} {"train_loss": -27.05085563659668, "global_step": 564751, "epoch": 6804} {"train_loss": -27.694242477416992, "global_step": 564752, "epoch": 6804} {"train_loss": -27.573232650756836, "global_step": 564753, "epoch": 6804} {"train_loss": -27.623779296875, "global_step": 564754, "epoch": 6804} {"train_loss": -27.125980377197266, "global_step": 564755, "epoch": 6804} {"train_loss": -27.714679718017578, "global_step": 564756, "epoch": 6804} {"train_loss": -27.745100021362305, "global_step": 564757, "epoch": 6804} {"train_loss": -27.59772300720215, "global_step": 564758, "epoch": 6804} {"train_loss": -27.7575740814209, "global_step": 564759, "epoch": 6804} {"train_loss": -27.662282943725586, "global_step": 564760, "epoch": 6804} {"train_loss": -27.73174476623535, "global_step": 564761, "epoch": 6804} {"train_loss": -27.589191436767578, "global_step": 564762, "epoch": 6804} {"train_loss": -27.787912368774414, "global_step": 564763, "epoch": 6804} {"train_loss": -27.921926498413086, "global_step": 564764, "epoch": 6804} {"train_loss": -27.2880916595459, "global_step": 564765, "epoch": 6804} {"train_loss": -27.34456443786621, "global_step": 564766, "epoch": 6804} {"train_loss": -27.650617599487305, "global_step": 564767, "epoch": 6804} {"train_loss": -28.117597579956055, "global_step": 564768, "epoch": 6804} {"train_loss": -27.856124877929688, "global_step": 564769, "epoch": 6804} {"train_loss": -27.782724380493164, "global_step": 564770, "epoch": 6804} {"train_loss": -27.35059928894043, "global_step": 564771, "epoch": 6804} {"train_loss": -27.255725860595703, "global_step": 564772, "epoch": 6804} {"train_loss": -28.013212203979492, "global_step": 564773, "epoch": 6804} {"train_loss": -27.685144424438477, "global_step": 564774, "epoch": 6804} {"train_loss": -27.54473876953125, "global_step": 564775, "epoch": 6804} {"train_loss": -27.580961227416992, "global_step": 564776, "epoch": 6804} {"train_loss": -27.968061447143555, "global_step": 564777, "epoch": 6804} {"train_loss": -27.620763778686523, "global_step": 564778, "epoch": 6804} {"train_loss": -27.919851303100586, "global_step": 564779, "epoch": 6804} {"train_loss": -27.694746017456055, "global_step": 564780, "epoch": 6804} {"train_loss": -27.583593368530273, "global_step": 564781, "epoch": 6804} {"train_loss": -28.075170516967773, "global_step": 564782, "epoch": 6804} {"train_loss": -27.842838287353516, "global_step": 564783, "epoch": 6804} {"train_loss": -28.21836280822754, "global_step": 564784, "epoch": 6804} {"train_loss": -28.193130493164062, "global_step": 564785, "epoch": 6804} {"train_loss": -27.92621421813965, "global_step": 564786, "epoch": 6804} {"train_loss": -27.83637046813965, "global_step": 564787, "epoch": 6804} {"train_loss": -28.322284698486328, "global_step": 564788, "epoch": 6804} {"train_loss": -28.286863327026367, "global_step": 564789, "epoch": 6804} {"train_loss": -28.019275665283203, "global_step": 564790, "epoch": 6804} {"train_loss": -27.941152572631836, "global_step": 564791, "epoch": 6804} {"train_loss": -28.11274528503418, "global_step": 564792, "epoch": 6804} {"train_loss": -27.908796310424805, "global_step": 564793, "epoch": 6804} {"train_loss": -27.675617218017578, "global_step": 564794, "epoch": 6804} {"train_loss": -27.679651260375977, "global_step": 564795, "epoch": 6804} {"train_loss": -27.859174728393555, "global_step": 564796, "epoch": 6804} {"train_loss": -27.793628692626953, "global_step": 564797, "epoch": 6804} {"train_loss": -27.95790672302246, "global_step": 564798, "epoch": 6804} {"train_loss": -28.038129806518555, "global_step": 564799, "epoch": 6804} {"train_loss": -27.929906845092773, "global_step": 564800, "epoch": 6804} {"train_loss": -27.9633846282959, "global_step": 564801, "epoch": 6804} {"train_loss": -28.040124893188477, "global_step": 564802, "epoch": 6804} {"train_loss": -27.90852165222168, "global_step": 564803, "epoch": 6804} {"train_loss": -28.09547233581543, "global_step": 564804, "epoch": 6804} {"train_loss": -28.201278686523438, "global_step": 564805, "epoch": 6804} {"train_loss": -28.00209617614746, "global_step": 564806, "epoch": 6804} {"train_loss": -27.761016845703125, "global_step": 564807, "epoch": 6804} {"train_loss": -27.832813262939453, "global_step": 564808, "epoch": 6804} {"train_loss": -28.289899826049805, "global_step": 564809, "epoch": 6804} {"train_loss": -28.170515060424805, "global_step": 564810, "epoch": 6804} {"train_loss": -28.14322280883789, "global_step": 564811, "epoch": 6804} {"train_loss": -27.710296630859375, "global_step": 564812, "epoch": 6804} {"train_loss": -27.83036231994629, "global_step": 564813, "epoch": 6804} {"train_loss": -27.69845176604857, "global_step": 564814, "epoch": 6804, "val_loss": 6730610.0} {"train_loss": -27.9242000579834, "global_step": 564815, "epoch": 6805} {"train_loss": -27.995634078979492, "global_step": 564816, "epoch": 6805} {"train_loss": -27.76603126525879, "global_step": 564817, "epoch": 6805} {"train_loss": -27.56306266784668, "global_step": 564818, "epoch": 6805} {"train_loss": -27.68995475769043, "global_step": 564819, "epoch": 6805} {"train_loss": -27.323379516601562, "global_step": 564820, "epoch": 6805} {"train_loss": -27.76141929626465, "global_step": 564821, "epoch": 6805} {"train_loss": -27.570005416870117, "global_step": 564822, "epoch": 6805} {"train_loss": -27.580413818359375, "global_step": 564823, "epoch": 6805} {"train_loss": -27.561330795288086, "global_step": 564824, "epoch": 6805} {"train_loss": -27.676477432250977, "global_step": 564825, "epoch": 6805} {"train_loss": -27.585723876953125, "global_step": 564826, "epoch": 6805} {"train_loss": -27.799884796142578, "global_step": 564827, "epoch": 6805} {"train_loss": -27.3856258392334, "global_step": 564828, "epoch": 6805} {"train_loss": -27.709171295166016, "global_step": 564829, "epoch": 6805} {"train_loss": -27.39275550842285, "global_step": 564830, "epoch": 6805} {"train_loss": -27.850900650024414, "global_step": 564831, "epoch": 6805} {"train_loss": -27.872846603393555, "global_step": 564832, "epoch": 6805} {"train_loss": -27.347448348999023, "global_step": 564833, "epoch": 6805} {"train_loss": -27.55194091796875, "global_step": 564834, "epoch": 6805} {"train_loss": -27.728803634643555, "global_step": 564835, "epoch": 6805} {"train_loss": -27.907489776611328, "global_step": 564836, "epoch": 6805} {"train_loss": -27.572172164916992, "global_step": 564837, "epoch": 6805} {"train_loss": -27.24017333984375, "global_step": 564838, "epoch": 6805} {"train_loss": -27.88272476196289, "global_step": 564839, "epoch": 6805} {"train_loss": -27.618444442749023, "global_step": 564840, "epoch": 6805} {"train_loss": -27.64666748046875, "global_step": 564841, "epoch": 6805} {"train_loss": -27.52850341796875, "global_step": 564842, "epoch": 6805} {"train_loss": -27.4062442779541, "global_step": 564843, "epoch": 6805} {"train_loss": -27.4165096282959, "global_step": 564844, "epoch": 6805} {"train_loss": -27.958471298217773, "global_step": 564845, "epoch": 6805} {"train_loss": -27.678136825561523, "global_step": 564846, "epoch": 6805} {"train_loss": -27.922433853149414, "global_step": 564847, "epoch": 6805} {"train_loss": -27.872669219970703, "global_step": 564848, "epoch": 6805} {"train_loss": -28.054391860961914, "global_step": 564849, "epoch": 6805} {"train_loss": -27.62384605407715, "global_step": 564850, "epoch": 6805} {"train_loss": -28.005706787109375, "global_step": 564851, "epoch": 6805} {"train_loss": -27.912429809570312, "global_step": 564852, "epoch": 6805} {"train_loss": -27.75074577331543, "global_step": 564853, "epoch": 6805} {"train_loss": -28.394750595092773, "global_step": 564854, "epoch": 6805} {"train_loss": -27.609130859375, "global_step": 564855, "epoch": 6805} {"train_loss": -27.7882022857666, "global_step": 564856, "epoch": 6805} {"train_loss": -27.833242416381836, "global_step": 564857, "epoch": 6805} {"train_loss": -27.748472213745117, "global_step": 564858, "epoch": 6805} {"train_loss": -27.719640731811523, "global_step": 564859, "epoch": 6805} {"train_loss": -27.78656578063965, "global_step": 564860, "epoch": 6805} {"train_loss": -28.147159576416016, "global_step": 564861, "epoch": 6805} {"train_loss": -27.99267578125, "global_step": 564862, "epoch": 6805} {"train_loss": -27.82075309753418, "global_step": 564863, "epoch": 6805} {"train_loss": -28.152729034423828, "global_step": 564864, "epoch": 6805} {"train_loss": -27.899017333984375, "global_step": 564865, "epoch": 6805} {"train_loss": -27.86663818359375, "global_step": 564866, "epoch": 6805} {"train_loss": -27.624868392944336, "global_step": 564867, "epoch": 6805} {"train_loss": -27.703296661376953, "global_step": 564868, "epoch": 6805} {"train_loss": -27.904571533203125, "global_step": 564869, "epoch": 6805} {"train_loss": -27.333688735961914, "global_step": 564870, "epoch": 6805} {"train_loss": -27.75250816345215, "global_step": 564871, "epoch": 6805} {"train_loss": -27.16493797302246, "global_step": 564872, "epoch": 6805} {"train_loss": -27.683774948120117, "global_step": 564873, "epoch": 6805} {"train_loss": -27.6242733001709, "global_step": 564874, "epoch": 6805} {"train_loss": -27.88020133972168, "global_step": 564875, "epoch": 6805} {"train_loss": -27.308231353759766, "global_step": 564876, "epoch": 6805} {"train_loss": -27.615270614624023, "global_step": 564877, "epoch": 6805} {"train_loss": -27.966114044189453, "global_step": 564878, "epoch": 6805} {"train_loss": -28.030324935913086, "global_step": 564879, "epoch": 6805} {"train_loss": -28.103429794311523, "global_step": 564880, "epoch": 6805} {"train_loss": -27.797101974487305, "global_step": 564881, "epoch": 6805} {"train_loss": -27.553831100463867, "global_step": 564882, "epoch": 6805} {"train_loss": -27.92835807800293, "global_step": 564883, "epoch": 6805} {"train_loss": -27.599380493164062, "global_step": 564884, "epoch": 6805} {"train_loss": -27.718149185180664, "global_step": 564885, "epoch": 6805} {"train_loss": -27.878971099853516, "global_step": 564886, "epoch": 6805} {"train_loss": -27.53969383239746, "global_step": 564887, "epoch": 6805} {"train_loss": -27.625019073486328, "global_step": 564888, "epoch": 6805} {"train_loss": -28.025846481323242, "global_step": 564889, "epoch": 6805} {"train_loss": -28.072620391845703, "global_step": 564890, "epoch": 6805} {"train_loss": -28.11520767211914, "global_step": 564891, "epoch": 6805} {"train_loss": -27.98793601989746, "global_step": 564892, "epoch": 6805} {"train_loss": -27.954639434814453, "global_step": 564893, "epoch": 6805} {"train_loss": -27.509326934814453, "global_step": 564894, "epoch": 6805} {"train_loss": -27.84525489807129, "global_step": 564895, "epoch": 6805} {"train_loss": -27.697546005249023, "global_step": 564896, "epoch": 6805} {"train_loss": -27.726410027009894, "global_step": 564897, "epoch": 6805, "val_loss": 6593930.0} {"train_loss": -27.35407066345215, "global_step": 564898, "epoch": 6806} {"train_loss": -27.35822105407715, "global_step": 564899, "epoch": 6806} {"train_loss": -27.614276885986328, "global_step": 564900, "epoch": 6806} {"train_loss": -27.729736328125, "global_step": 564901, "epoch": 6806} {"train_loss": -27.175207138061523, "global_step": 564902, "epoch": 6806} {"train_loss": -27.41364097595215, "global_step": 564903, "epoch": 6806} {"train_loss": -27.861494064331055, "global_step": 564904, "epoch": 6806} {"train_loss": -27.439990997314453, "global_step": 564905, "epoch": 6806} {"train_loss": -27.268753051757812, "global_step": 564906, "epoch": 6806} {"train_loss": -27.976964950561523, "global_step": 564907, "epoch": 6806} {"train_loss": -28.144927978515625, "global_step": 564908, "epoch": 6806} {"train_loss": -27.639942169189453, "global_step": 564909, "epoch": 6806} {"train_loss": -28.11957359313965, "global_step": 564910, "epoch": 6806} {"train_loss": -27.621313095092773, "global_step": 564911, "epoch": 6806} {"train_loss": -27.652542114257812, "global_step": 564912, "epoch": 6806} {"train_loss": -27.63407325744629, "global_step": 564913, "epoch": 6806} {"train_loss": -27.878345489501953, "global_step": 564914, "epoch": 6806} {"train_loss": -27.600385665893555, "global_step": 564915, "epoch": 6806} {"train_loss": -27.754194259643555, "global_step": 564916, "epoch": 6806} {"train_loss": -27.526655197143555, "global_step": 564917, "epoch": 6806} {"train_loss": -27.401599884033203, "global_step": 564918, "epoch": 6806} {"train_loss": -27.895456314086914, "global_step": 564919, "epoch": 6806} {"train_loss": -27.339216232299805, "global_step": 564920, "epoch": 6806} {"train_loss": -28.095672607421875, "global_step": 564921, "epoch": 6806} {"train_loss": -27.796710968017578, "global_step": 564922, "epoch": 6806} {"train_loss": -27.824176788330078, "global_step": 564923, "epoch": 6806} {"train_loss": -27.4820556640625, "global_step": 564924, "epoch": 6806} {"train_loss": -27.333402633666992, "global_step": 564925, "epoch": 6806} {"train_loss": -27.748523712158203, "global_step": 564926, "epoch": 6806} {"train_loss": -27.409839630126953, "global_step": 564927, "epoch": 6806} {"train_loss": -28.05878257751465, "global_step": 564928, "epoch": 6806} {"train_loss": -27.734115600585938, "global_step": 564929, "epoch": 6806} {"train_loss": -27.710407257080078, "global_step": 564930, "epoch": 6806} {"train_loss": -27.502944946289062, "global_step": 564931, "epoch": 6806} {"train_loss": -27.95263671875, "global_step": 564932, "epoch": 6806} {"train_loss": -27.8543758392334, "global_step": 564933, "epoch": 6806} {"train_loss": -27.337736129760742, "global_step": 564934, "epoch": 6806} {"train_loss": -27.272785186767578, "global_step": 564935, "epoch": 6806} {"train_loss": -27.786462783813477, "global_step": 564936, "epoch": 6806} {"train_loss": -27.804889678955078, "global_step": 564937, "epoch": 6806} {"train_loss": -27.980026245117188, "global_step": 564938, "epoch": 6806} {"train_loss": -27.842700958251953, "global_step": 564939, "epoch": 6806} {"train_loss": -27.488693237304688, "global_step": 564940, "epoch": 6806} {"train_loss": -27.888731002807617, "global_step": 564941, "epoch": 6806} {"train_loss": -27.82655143737793, "global_step": 564942, "epoch": 6806} {"train_loss": -27.92938804626465, "global_step": 564943, "epoch": 6806} {"train_loss": -27.625202178955078, "global_step": 564944, "epoch": 6806} {"train_loss": -27.90618896484375, "global_step": 564945, "epoch": 6806} {"train_loss": -27.79864501953125, "global_step": 564946, "epoch": 6806} {"train_loss": -28.0048828125, "global_step": 564947, "epoch": 6806} {"train_loss": -27.851404190063477, "global_step": 564948, "epoch": 6806} {"train_loss": -27.919727325439453, "global_step": 564949, "epoch": 6806} {"train_loss": -27.916513442993164, "global_step": 564950, "epoch": 6806} {"train_loss": -27.908472061157227, "global_step": 564951, "epoch": 6806} {"train_loss": -27.959735870361328, "global_step": 564952, "epoch": 6806} {"train_loss": -27.6953125, "global_step": 564953, "epoch": 6806} {"train_loss": -27.906982421875, "global_step": 564954, "epoch": 6806} {"train_loss": -27.7398624420166, "global_step": 564955, "epoch": 6806} {"train_loss": -27.779523849487305, "global_step": 564956, "epoch": 6806} {"train_loss": -27.918094635009766, "global_step": 564957, "epoch": 6806} {"train_loss": -28.030109405517578, "global_step": 564958, "epoch": 6806} {"train_loss": -27.853565216064453, "global_step": 564959, "epoch": 6806} {"train_loss": -27.958026885986328, "global_step": 564960, "epoch": 6806} {"train_loss": -28.1064453125, "global_step": 564961, "epoch": 6806} {"train_loss": -28.2028865814209, "global_step": 564962, "epoch": 6806} {"train_loss": -27.95484733581543, "global_step": 564963, "epoch": 6806} {"train_loss": -28.39914894104004, "global_step": 564964, "epoch": 6806} {"train_loss": -27.891992568969727, "global_step": 564965, "epoch": 6806} {"train_loss": -27.95990562438965, "global_step": 564966, "epoch": 6806} {"train_loss": -27.90846824645996, "global_step": 564967, "epoch": 6806} {"train_loss": -27.95951271057129, "global_step": 564968, "epoch": 6806} {"train_loss": -28.083560943603516, "global_step": 564969, "epoch": 6806} {"train_loss": -27.643030166625977, "global_step": 564970, "epoch": 6806} {"train_loss": -27.452442169189453, "global_step": 564971, "epoch": 6806} {"train_loss": -27.612146377563477, "global_step": 564972, "epoch": 6806} {"train_loss": -27.77362060546875, "global_step": 564973, "epoch": 6806} {"train_loss": -27.625797271728516, "global_step": 564974, "epoch": 6806} {"train_loss": -27.784704208374023, "global_step": 564975, "epoch": 6806} {"train_loss": -27.512765884399414, "global_step": 564976, "epoch": 6806} {"train_loss": -28.115528106689453, "global_step": 564977, "epoch": 6806} {"train_loss": -27.897689819335938, "global_step": 564978, "epoch": 6806} {"train_loss": -28.204954147338867, "global_step": 564979, "epoch": 6806} {"train_loss": -27.75974179463214, "global_step": 564980, "epoch": 6806, "val_loss": 6558433.5} {"train_loss": -26.770038604736328, "global_step": 564981, "epoch": 6807} {"train_loss": -26.826751708984375, "global_step": 564982, "epoch": 6807} {"train_loss": -26.908395767211914, "global_step": 564983, "epoch": 6807} {"train_loss": -27.527923583984375, "global_step": 564984, "epoch": 6807} {"train_loss": -26.364093780517578, "global_step": 564985, "epoch": 6807} {"train_loss": -27.289752960205078, "global_step": 564986, "epoch": 6807} {"train_loss": -27.39750099182129, "global_step": 564987, "epoch": 6807} {"train_loss": -26.88824462890625, "global_step": 564988, "epoch": 6807} {"train_loss": -27.24960708618164, "global_step": 564989, "epoch": 6807} {"train_loss": -26.939733505249023, "global_step": 564990, "epoch": 6807} {"train_loss": -27.319456100463867, "global_step": 564991, "epoch": 6807} {"train_loss": -27.027429580688477, "global_step": 564992, "epoch": 6807} {"train_loss": -27.22617530822754, "global_step": 564993, "epoch": 6807} {"train_loss": -27.673376083374023, "global_step": 564994, "epoch": 6807} {"train_loss": -27.336063385009766, "global_step": 564995, "epoch": 6807} {"train_loss": -27.4367618560791, "global_step": 564996, "epoch": 6807} {"train_loss": -27.598804473876953, "global_step": 564997, "epoch": 6807} {"train_loss": -27.293197631835938, "global_step": 564998, "epoch": 6807} {"train_loss": -27.1019287109375, "global_step": 564999, "epoch": 6807} {"train_loss": -27.46490478515625, "global_step": 565000, "epoch": 6807} {"train_loss": -27.3704891204834, "global_step": 565001, "epoch": 6807} {"train_loss": -27.42368507385254, "global_step": 565002, "epoch": 6807} {"train_loss": -27.05018424987793, "global_step": 565003, "epoch": 6807} {"train_loss": -27.55238151550293, "global_step": 565004, "epoch": 6807} {"train_loss": -27.53896141052246, "global_step": 565005, "epoch": 6807} {"train_loss": -27.381528854370117, "global_step": 565006, "epoch": 6807} {"train_loss": -27.421859741210938, "global_step": 565007, "epoch": 6807} {"train_loss": -27.60801124572754, "global_step": 565008, "epoch": 6807} {"train_loss": -27.410608291625977, "global_step": 565009, "epoch": 6807} {"train_loss": -27.377710342407227, "global_step": 565010, "epoch": 6807} {"train_loss": -27.618473052978516, "global_step": 565011, "epoch": 6807} {"train_loss": -27.7139835357666, "global_step": 565012, "epoch": 6807} {"train_loss": -27.47021484375, "global_step": 565013, "epoch": 6807} {"train_loss": -27.523761749267578, "global_step": 565014, "epoch": 6807} {"train_loss": -27.815710067749023, "global_step": 565015, "epoch": 6807} {"train_loss": -27.743066787719727, "global_step": 565016, "epoch": 6807} {"train_loss": -27.62940788269043, "global_step": 565017, "epoch": 6807} {"train_loss": -27.57253074645996, "global_step": 565018, "epoch": 6807} {"train_loss": -28.044836044311523, "global_step": 565019, "epoch": 6807} {"train_loss": -28.182498931884766, "global_step": 565020, "epoch": 6807} {"train_loss": -27.765111923217773, "global_step": 565021, "epoch": 6807} {"train_loss": -28.066396713256836, "global_step": 565022, "epoch": 6807} {"train_loss": -27.955617904663086, "global_step": 565023, "epoch": 6807} {"train_loss": -27.807401657104492, "global_step": 565024, "epoch": 6807} {"train_loss": -27.875028610229492, "global_step": 565025, "epoch": 6807} {"train_loss": -27.975244522094727, "global_step": 565026, "epoch": 6807} {"train_loss": -28.028079986572266, "global_step": 565027, "epoch": 6807} {"train_loss": -28.038389205932617, "global_step": 565028, "epoch": 6807} {"train_loss": -27.960250854492188, "global_step": 565029, "epoch": 6807} {"train_loss": -28.102697372436523, "global_step": 565030, "epoch": 6807} {"train_loss": -27.975051879882812, "global_step": 565031, "epoch": 6807} {"train_loss": -28.041828155517578, "global_step": 565032, "epoch": 6807} {"train_loss": -28.10822868347168, "global_step": 565033, "epoch": 6807} {"train_loss": -28.0208683013916, "global_step": 565034, "epoch": 6807} {"train_loss": -28.28464126586914, "global_step": 565035, "epoch": 6807} {"train_loss": -28.156085968017578, "global_step": 565036, "epoch": 6807} {"train_loss": -28.2888126373291, "global_step": 565037, "epoch": 6807} {"train_loss": -28.081165313720703, "global_step": 565038, "epoch": 6807} {"train_loss": -28.07612419128418, "global_step": 565039, "epoch": 6807} {"train_loss": -28.082712173461914, "global_step": 565040, "epoch": 6807} {"train_loss": -27.77667808532715, "global_step": 565041, "epoch": 6807} {"train_loss": -27.57272720336914, "global_step": 565042, "epoch": 6807} {"train_loss": -27.5562744140625, "global_step": 565043, "epoch": 6807} {"train_loss": -28.14095115661621, "global_step": 565044, "epoch": 6807} {"train_loss": -27.910873413085938, "global_step": 565045, "epoch": 6807} {"train_loss": -27.932947158813477, "global_step": 565046, "epoch": 6807} {"train_loss": -27.76405906677246, "global_step": 565047, "epoch": 6807} {"train_loss": -27.603931427001953, "global_step": 565048, "epoch": 6807} {"train_loss": -27.439966201782227, "global_step": 565049, "epoch": 6807} {"train_loss": -27.133779525756836, "global_step": 565050, "epoch": 6807} {"train_loss": -27.417266845703125, "global_step": 565051, "epoch": 6807} {"train_loss": -27.35955810546875, "global_step": 565052, "epoch": 6807} {"train_loss": -27.893177032470703, "global_step": 565053, "epoch": 6807} {"train_loss": -27.660343170166016, "global_step": 565054, "epoch": 6807} {"train_loss": -27.70355796813965, "global_step": 565055, "epoch": 6807} {"train_loss": -27.539142608642578, "global_step": 565056, "epoch": 6807} {"train_loss": -27.40218162536621, "global_step": 565057, "epoch": 6807} {"train_loss": -27.785552978515625, "global_step": 565058, "epoch": 6807} {"train_loss": -27.675207138061523, "global_step": 565059, "epoch": 6807} {"train_loss": -27.583633422851562, "global_step": 565060, "epoch": 6807} {"train_loss": -27.958221435546875, "global_step": 565061, "epoch": 6807} {"train_loss": -27.515949249267578, "global_step": 565062, "epoch": 6807} {"train_loss": -27.612346258508154, "global_step": 565063, "epoch": 6807, "val_loss": 6618812.0} {"train_loss": -27.17580223083496, "global_step": 565064, "epoch": 6808} {"train_loss": -27.456939697265625, "global_step": 565065, "epoch": 6808} {"train_loss": -27.636072158813477, "global_step": 565066, "epoch": 6808} {"train_loss": -27.489206314086914, "global_step": 565067, "epoch": 6808} {"train_loss": -27.61097526550293, "global_step": 565068, "epoch": 6808} {"train_loss": -27.600269317626953, "global_step": 565069, "epoch": 6808} {"train_loss": -28.021503448486328, "global_step": 565070, "epoch": 6808} {"train_loss": -27.828266143798828, "global_step": 565071, "epoch": 6808} {"train_loss": -27.39823341369629, "global_step": 565072, "epoch": 6808} {"train_loss": -27.791702270507812, "global_step": 565073, "epoch": 6808} {"train_loss": -27.69294548034668, "global_step": 565074, "epoch": 6808} {"train_loss": -27.65471839904785, "global_step": 565075, "epoch": 6808} {"train_loss": -27.836362838745117, "global_step": 565076, "epoch": 6808} {"train_loss": -27.8635311126709, "global_step": 565077, "epoch": 6808} {"train_loss": -27.73773193359375, "global_step": 565078, "epoch": 6808} {"train_loss": -27.671239852905273, "global_step": 565079, "epoch": 6808} {"train_loss": -27.548954010009766, "global_step": 565080, "epoch": 6808} {"train_loss": -27.799535751342773, "global_step": 565081, "epoch": 6808} {"train_loss": -27.614789962768555, "global_step": 565082, "epoch": 6808} {"train_loss": -27.56373405456543, "global_step": 565083, "epoch": 6808} {"train_loss": -27.95654296875, "global_step": 565084, "epoch": 6808} {"train_loss": -27.718515396118164, "global_step": 565085, "epoch": 6808} {"train_loss": -27.500873565673828, "global_step": 565086, "epoch": 6808} {"train_loss": -27.65010643005371, "global_step": 565087, "epoch": 6808} {"train_loss": -27.73581886291504, "global_step": 565088, "epoch": 6808} {"train_loss": -27.892343521118164, "global_step": 565089, "epoch": 6808} {"train_loss": -27.944015502929688, "global_step": 565090, "epoch": 6808} {"train_loss": -27.837635040283203, "global_step": 565091, "epoch": 6808} {"train_loss": -27.687625885009766, "global_step": 565092, "epoch": 6808} {"train_loss": -28.000638961791992, "global_step": 565093, "epoch": 6808} {"train_loss": -27.809680938720703, "global_step": 565094, "epoch": 6808} {"train_loss": -27.9446964263916, "global_step": 565095, "epoch": 6808} {"train_loss": -28.218000411987305, "global_step": 565096, "epoch": 6808} {"train_loss": -28.08228874206543, "global_step": 565097, "epoch": 6808} {"train_loss": -27.633596420288086, "global_step": 565098, "epoch": 6808} {"train_loss": -27.85321044921875, "global_step": 565099, "epoch": 6808} {"train_loss": -27.80191421508789, "global_step": 565100, "epoch": 6808} {"train_loss": -27.945220947265625, "global_step": 565101, "epoch": 6808} {"train_loss": -28.053674697875977, "global_step": 565102, "epoch": 6808} {"train_loss": -27.953479766845703, "global_step": 565103, "epoch": 6808} {"train_loss": -27.991987228393555, "global_step": 565104, "epoch": 6808} {"train_loss": -27.697128295898438, "global_step": 565105, "epoch": 6808} {"train_loss": -28.038888931274414, "global_step": 565106, "epoch": 6808} {"train_loss": -27.958011627197266, "global_step": 565107, "epoch": 6808} {"train_loss": -28.02594566345215, "global_step": 565108, "epoch": 6808} {"train_loss": -27.50308609008789, "global_step": 565109, "epoch": 6808} {"train_loss": -27.452192306518555, "global_step": 565110, "epoch": 6808} {"train_loss": -27.554584503173828, "global_step": 565111, "epoch": 6808} {"train_loss": -27.842344284057617, "global_step": 565112, "epoch": 6808} {"train_loss": -28.020862579345703, "global_step": 565113, "epoch": 6808} {"train_loss": -27.732254028320312, "global_step": 565114, "epoch": 6808} {"train_loss": -28.313282012939453, "global_step": 565115, "epoch": 6808} {"train_loss": -27.547088623046875, "global_step": 565116, "epoch": 6808} {"train_loss": -28.208044052124023, "global_step": 565117, "epoch": 6808} {"train_loss": -27.941024780273438, "global_step": 565118, "epoch": 6808} {"train_loss": -27.764789581298828, "global_step": 565119, "epoch": 6808} {"train_loss": -27.825326919555664, "global_step": 565120, "epoch": 6808} {"train_loss": -27.93096923828125, "global_step": 565121, "epoch": 6808} {"train_loss": -27.945133209228516, "global_step": 565122, "epoch": 6808} {"train_loss": -28.0729923248291, "global_step": 565123, "epoch": 6808} {"train_loss": -27.928396224975586, "global_step": 565124, "epoch": 6808} {"train_loss": -27.890167236328125, "global_step": 565125, "epoch": 6808} {"train_loss": -28.106430053710938, "global_step": 565126, "epoch": 6808} {"train_loss": -27.907215118408203, "global_step": 565127, "epoch": 6808} {"train_loss": -28.001880645751953, "global_step": 565128, "epoch": 6808} {"train_loss": -28.00062370300293, "global_step": 565129, "epoch": 6808} {"train_loss": -27.691946029663086, "global_step": 565130, "epoch": 6808} {"train_loss": -27.88596534729004, "global_step": 565131, "epoch": 6808} {"train_loss": -27.686920166015625, "global_step": 565132, "epoch": 6808} {"train_loss": -26.983274459838867, "global_step": 565133, "epoch": 6808} {"train_loss": -26.75345230102539, "global_step": 565134, "epoch": 6808} {"train_loss": -26.517047882080078, "global_step": 565135, "epoch": 6808} {"train_loss": -26.4724063873291, "global_step": 565136, "epoch": 6808} {"train_loss": -27.840341567993164, "global_step": 565137, "epoch": 6808} {"train_loss": -28.09797477722168, "global_step": 565138, "epoch": 6808} {"train_loss": -27.3799991607666, "global_step": 565139, "epoch": 6808} {"train_loss": -27.64478874206543, "global_step": 565140, "epoch": 6808} {"train_loss": -27.159513473510742, "global_step": 565141, "epoch": 6808} {"train_loss": -26.971820831298828, "global_step": 565142, "epoch": 6808} {"train_loss": -27.782678604125977, "global_step": 565143, "epoch": 6808} {"train_loss": -27.534818649291992, "global_step": 565144, "epoch": 6808} {"train_loss": -27.65264892578125, "global_step": 565145, "epoch": 6808} {"train_loss": -27.7025868749044, "global_step": 565146, "epoch": 6808, "val_loss": 6621982.0} {"train_loss": -27.195667266845703, "global_step": 565147, "epoch": 6809} {"train_loss": -27.87590980529785, "global_step": 565148, "epoch": 6809} {"train_loss": -27.264135360717773, "global_step": 565149, "epoch": 6809} {"train_loss": -25.6568603515625, "global_step": 565150, "epoch": 6809} {"train_loss": -27.730697631835938, "global_step": 565151, "epoch": 6809} {"train_loss": -26.800464630126953, "global_step": 565152, "epoch": 6809} {"train_loss": -27.378828048706055, "global_step": 565153, "epoch": 6809} {"train_loss": -26.87344741821289, "global_step": 565154, "epoch": 6809} {"train_loss": -26.979093551635742, "global_step": 565155, "epoch": 6809} {"train_loss": -26.903411865234375, "global_step": 565156, "epoch": 6809} {"train_loss": -27.242145538330078, "global_step": 565157, "epoch": 6809} {"train_loss": -26.905012130737305, "global_step": 565158, "epoch": 6809} {"train_loss": -27.118549346923828, "global_step": 565159, "epoch": 6809} {"train_loss": -27.4427433013916, "global_step": 565160, "epoch": 6809} {"train_loss": -27.35348892211914, "global_step": 565161, "epoch": 6809} {"train_loss": -27.303756713867188, "global_step": 565162, "epoch": 6809} {"train_loss": -27.4567813873291, "global_step": 565163, "epoch": 6809} {"train_loss": -27.698644638061523, "global_step": 565164, "epoch": 6809} {"train_loss": -27.091962814331055, "global_step": 565165, "epoch": 6809} {"train_loss": -27.44769287109375, "global_step": 565166, "epoch": 6809} {"train_loss": -27.169052124023438, "global_step": 565167, "epoch": 6809} {"train_loss": -27.630762100219727, "global_step": 565168, "epoch": 6809} {"train_loss": -27.79498863220215, "global_step": 565169, "epoch": 6809} {"train_loss": -27.84857749938965, "global_step": 565170, "epoch": 6809} {"train_loss": -27.54073143005371, "global_step": 565171, "epoch": 6809} {"train_loss": -27.681848526000977, "global_step": 565172, "epoch": 6809} {"train_loss": -27.561986923217773, "global_step": 565173, "epoch": 6809} {"train_loss": -27.571441650390625, "global_step": 565174, "epoch": 6809} {"train_loss": -28.159997940063477, "global_step": 565175, "epoch": 6809} {"train_loss": -27.44727897644043, "global_step": 565176, "epoch": 6809} {"train_loss": -27.72662925720215, "global_step": 565177, "epoch": 6809} {"train_loss": -27.87798500061035, "global_step": 565178, "epoch": 6809} {"train_loss": -27.83905029296875, "global_step": 565179, "epoch": 6809} {"train_loss": -27.444982528686523, "global_step": 565180, "epoch": 6809} {"train_loss": -28.048004150390625, "global_step": 565181, "epoch": 6809} {"train_loss": -27.566022872924805, "global_step": 565182, "epoch": 6809} {"train_loss": -27.518646240234375, "global_step": 565183, "epoch": 6809} {"train_loss": -27.981719970703125, "global_step": 565184, "epoch": 6809} {"train_loss": -27.706684112548828, "global_step": 565185, "epoch": 6809} {"train_loss": -28.14226722717285, "global_step": 565186, "epoch": 6809} {"train_loss": -27.720962524414062, "global_step": 565187, "epoch": 6809} {"train_loss": -27.805810928344727, "global_step": 565188, "epoch": 6809} {"train_loss": -27.954221725463867, "global_step": 565189, "epoch": 6809} {"train_loss": -27.919519424438477, "global_step": 565190, "epoch": 6809} {"train_loss": -28.15480613708496, "global_step": 565191, "epoch": 6809} {"train_loss": -28.0726375579834, "global_step": 565192, "epoch": 6809} {"train_loss": -28.08367919921875, "global_step": 565193, "epoch": 6809} {"train_loss": -27.568525314331055, "global_step": 565194, "epoch": 6809} {"train_loss": -27.975513458251953, "global_step": 565195, "epoch": 6809} {"train_loss": -28.092132568359375, "global_step": 565196, "epoch": 6809} {"train_loss": -28.07826042175293, "global_step": 565197, "epoch": 6809} {"train_loss": -28.064346313476562, "global_step": 565198, "epoch": 6809} {"train_loss": -27.882959365844727, "global_step": 565199, "epoch": 6809} {"train_loss": -27.659616470336914, "global_step": 565200, "epoch": 6809} {"train_loss": -27.8032169342041, "global_step": 565201, "epoch": 6809} {"train_loss": -28.11372184753418, "global_step": 565202, "epoch": 6809} {"train_loss": -28.3234920501709, "global_step": 565203, "epoch": 6809} {"train_loss": -27.611974716186523, "global_step": 565204, "epoch": 6809} {"train_loss": -27.978071212768555, "global_step": 565205, "epoch": 6809} {"train_loss": -27.87981605529785, "global_step": 565206, "epoch": 6809} {"train_loss": -28.150094985961914, "global_step": 565207, "epoch": 6809} {"train_loss": -27.866907119750977, "global_step": 565208, "epoch": 6809} {"train_loss": -28.270843505859375, "global_step": 565209, "epoch": 6809} {"train_loss": -28.1146183013916, "global_step": 565210, "epoch": 6809} {"train_loss": -28.1835994720459, "global_step": 565211, "epoch": 6809} {"train_loss": -28.607742309570312, "global_step": 565212, "epoch": 6809} {"train_loss": -27.926071166992188, "global_step": 565213, "epoch": 6809} {"train_loss": -27.882007598876953, "global_step": 565214, "epoch": 6809} {"train_loss": -28.033361434936523, "global_step": 565215, "epoch": 6809} {"train_loss": -27.646448135375977, "global_step": 565216, "epoch": 6809} {"train_loss": -27.55327796936035, "global_step": 565217, "epoch": 6809} {"train_loss": -27.89238929748535, "global_step": 565218, "epoch": 6809} {"train_loss": -27.8612060546875, "global_step": 565219, "epoch": 6809} {"train_loss": -28.082895278930664, "global_step": 565220, "epoch": 6809} {"train_loss": -27.392169952392578, "global_step": 565221, "epoch": 6809} {"train_loss": -27.50432777404785, "global_step": 565222, "epoch": 6809} {"train_loss": -27.331024169921875, "global_step": 565223, "epoch": 6809} {"train_loss": -27.847211837768555, "global_step": 565224, "epoch": 6809} {"train_loss": -28.002460479736328, "global_step": 565225, "epoch": 6809} {"train_loss": -27.92171287536621, "global_step": 565226, "epoch": 6809} {"train_loss": -27.85548210144043, "global_step": 565227, "epoch": 6809} {"train_loss": -27.6523380279541, "global_step": 565228, "epoch": 6809} {"train_loss": -27.68838866360216, "global_step": 565229, "epoch": 6809, "val_loss": 6640122.0} {"train_loss": -27.8778076171875, "global_step": 565230, "epoch": 6810} {"train_loss": -27.195148468017578, "global_step": 565231, "epoch": 6810} {"train_loss": -27.668792724609375, "global_step": 565232, "epoch": 6810} {"train_loss": -27.115331649780273, "global_step": 565233, "epoch": 6810} {"train_loss": -27.433643341064453, "global_step": 565234, "epoch": 6810} {"train_loss": -27.085920333862305, "global_step": 565235, "epoch": 6810} {"train_loss": -27.691396713256836, "global_step": 565236, "epoch": 6810} {"train_loss": -27.37665367126465, "global_step": 565237, "epoch": 6810} {"train_loss": -27.09357261657715, "global_step": 565238, "epoch": 6810} {"train_loss": -27.6865177154541, "global_step": 565239, "epoch": 6810} {"train_loss": -27.6602840423584, "global_step": 565240, "epoch": 6810} {"train_loss": -27.104101181030273, "global_step": 565241, "epoch": 6810} {"train_loss": -27.670576095581055, "global_step": 565242, "epoch": 6810} {"train_loss": -27.463659286499023, "global_step": 565243, "epoch": 6810} {"train_loss": -27.19943618774414, "global_step": 565244, "epoch": 6810} {"train_loss": -27.568557739257812, "global_step": 565245, "epoch": 6810} {"train_loss": -27.903284072875977, "global_step": 565246, "epoch": 6810} {"train_loss": -27.31488037109375, "global_step": 565247, "epoch": 6810} {"train_loss": -27.701196670532227, "global_step": 565248, "epoch": 6810} {"train_loss": -27.84579849243164, "global_step": 565249, "epoch": 6810} {"train_loss": -27.261722564697266, "global_step": 565250, "epoch": 6810} {"train_loss": -27.762975692749023, "global_step": 565251, "epoch": 6810} {"train_loss": -27.812952041625977, "global_step": 565252, "epoch": 6810} {"train_loss": -27.31736183166504, "global_step": 565253, "epoch": 6810} {"train_loss": -27.850574493408203, "global_step": 565254, "epoch": 6810} {"train_loss": -27.836475372314453, "global_step": 565255, "epoch": 6810} {"train_loss": -27.650060653686523, "global_step": 565256, "epoch": 6810} {"train_loss": -27.657575607299805, "global_step": 565257, "epoch": 6810} {"train_loss": -27.77595329284668, "global_step": 565258, "epoch": 6810} {"train_loss": -27.395837783813477, "global_step": 565259, "epoch": 6810} {"train_loss": -27.773426055908203, "global_step": 565260, "epoch": 6810} {"train_loss": -27.785627365112305, "global_step": 565261, "epoch": 6810} {"train_loss": -27.6668758392334, "global_step": 565262, "epoch": 6810} {"train_loss": -27.566801071166992, "global_step": 565263, "epoch": 6810} {"train_loss": -27.8206844329834, "global_step": 565264, "epoch": 6810} {"train_loss": -27.878711700439453, "global_step": 565265, "epoch": 6810} {"train_loss": -27.857519149780273, "global_step": 565266, "epoch": 6810} {"train_loss": -27.939748764038086, "global_step": 565267, "epoch": 6810} {"train_loss": -27.54603385925293, "global_step": 565268, "epoch": 6810} {"train_loss": -27.354480743408203, "global_step": 565269, "epoch": 6810} {"train_loss": -26.851348876953125, "global_step": 565270, "epoch": 6810} {"train_loss": -26.712661743164062, "global_step": 565271, "epoch": 6810} {"train_loss": -27.745685577392578, "global_step": 565272, "epoch": 6810} {"train_loss": -27.570667266845703, "global_step": 565273, "epoch": 6810} {"train_loss": -27.916372299194336, "global_step": 565274, "epoch": 6810} {"train_loss": -27.9718017578125, "global_step": 565275, "epoch": 6810} {"train_loss": -27.701074600219727, "global_step": 565276, "epoch": 6810} {"train_loss": -27.782377243041992, "global_step": 565277, "epoch": 6810} {"train_loss": -28.06906509399414, "global_step": 565278, "epoch": 6810} {"train_loss": -27.693944931030273, "global_step": 565279, "epoch": 6810} {"train_loss": -27.67359733581543, "global_step": 565280, "epoch": 6810} {"train_loss": -27.779760360717773, "global_step": 565281, "epoch": 6810} {"train_loss": -27.696884155273438, "global_step": 565282, "epoch": 6810} {"train_loss": -27.70420265197754, "global_step": 565283, "epoch": 6810} {"train_loss": -27.796279907226562, "global_step": 565284, "epoch": 6810} {"train_loss": -27.967853546142578, "global_step": 565285, "epoch": 6810} {"train_loss": -27.72039222717285, "global_step": 565286, "epoch": 6810} {"train_loss": -27.76311683654785, "global_step": 565287, "epoch": 6810} {"train_loss": -27.660892486572266, "global_step": 565288, "epoch": 6810} {"train_loss": -27.918798446655273, "global_step": 565289, "epoch": 6810} {"train_loss": -28.2044620513916, "global_step": 565290, "epoch": 6810} {"train_loss": -28.02530288696289, "global_step": 565291, "epoch": 6810} {"train_loss": -27.62213134765625, "global_step": 565292, "epoch": 6810} {"train_loss": -28.165771484375, "global_step": 565293, "epoch": 6810} {"train_loss": -27.930362701416016, "global_step": 565294, "epoch": 6810} {"train_loss": -28.1114559173584, "global_step": 565295, "epoch": 6810} {"train_loss": -27.9190616607666, "global_step": 565296, "epoch": 6810} {"train_loss": -27.74407958984375, "global_step": 565297, "epoch": 6810} {"train_loss": -27.56365966796875, "global_step": 565298, "epoch": 6810} {"train_loss": -27.96734046936035, "global_step": 565299, "epoch": 6810} {"train_loss": -27.9594669342041, "global_step": 565300, "epoch": 6810} {"train_loss": -28.186481475830078, "global_step": 565301, "epoch": 6810} {"train_loss": -28.213048934936523, "global_step": 565302, "epoch": 6810} {"train_loss": -27.747802734375, "global_step": 565303, "epoch": 6810} {"train_loss": -28.207056045532227, "global_step": 565304, "epoch": 6810} {"train_loss": -28.024816513061523, "global_step": 565305, "epoch": 6810} {"train_loss": -28.102588653564453, "global_step": 565306, "epoch": 6810} {"train_loss": -27.979135513305664, "global_step": 565307, "epoch": 6810} {"train_loss": -27.797866821289062, "global_step": 565308, "epoch": 6810} {"train_loss": -28.082502365112305, "global_step": 565309, "epoch": 6810} {"train_loss": -27.955066680908203, "global_step": 565310, "epoch": 6810} {"train_loss": -27.946508407592773, "global_step": 565311, "epoch": 6810} {"train_loss": -27.71857422518443, "global_step": 565312, "epoch": 6810, "val_loss": 6626297.0} {"train_loss": -27.073638916015625, "global_step": 565313, "epoch": 6811} {"train_loss": -25.5384521484375, "global_step": 565314, "epoch": 6811} {"train_loss": -24.1661434173584, "global_step": 565315, "epoch": 6811} {"train_loss": -25.00676155090332, "global_step": 565316, "epoch": 6811} {"train_loss": -26.920759201049805, "global_step": 565317, "epoch": 6811} {"train_loss": -26.383405685424805, "global_step": 565318, "epoch": 6811} {"train_loss": -25.989999771118164, "global_step": 565319, "epoch": 6811} {"train_loss": -27.30860710144043, "global_step": 565320, "epoch": 6811} {"train_loss": -26.460458755493164, "global_step": 565321, "epoch": 6811} {"train_loss": -27.60821533203125, "global_step": 565322, "epoch": 6811} {"train_loss": -26.39484977722168, "global_step": 565323, "epoch": 6811} {"train_loss": -26.85418701171875, "global_step": 565324, "epoch": 6811} {"train_loss": -26.96746253967285, "global_step": 565325, "epoch": 6811} {"train_loss": -27.15323829650879, "global_step": 565326, "epoch": 6811} {"train_loss": -27.436447143554688, "global_step": 565327, "epoch": 6811} {"train_loss": -27.083484649658203, "global_step": 565328, "epoch": 6811} {"train_loss": -27.184782028198242, "global_step": 565329, "epoch": 6811} {"train_loss": -27.282917022705078, "global_step": 565330, "epoch": 6811} {"train_loss": -27.567243576049805, "global_step": 565331, "epoch": 6811} {"train_loss": -27.532373428344727, "global_step": 565332, "epoch": 6811} {"train_loss": -27.26934814453125, "global_step": 565333, "epoch": 6811} {"train_loss": -27.077604293823242, "global_step": 565334, "epoch": 6811} {"train_loss": -27.5024471282959, "global_step": 565335, "epoch": 6811} {"train_loss": -27.254247665405273, "global_step": 565336, "epoch": 6811} {"train_loss": -27.72517204284668, "global_step": 565337, "epoch": 6811} {"train_loss": -27.447607040405273, "global_step": 565338, "epoch": 6811} {"train_loss": -27.56587028503418, "global_step": 565339, "epoch": 6811} {"train_loss": -28.042572021484375, "global_step": 565340, "epoch": 6811} {"train_loss": -27.563703536987305, "global_step": 565341, "epoch": 6811} {"train_loss": -27.693967819213867, "global_step": 565342, "epoch": 6811} {"train_loss": -27.686981201171875, "global_step": 565343, "epoch": 6811} {"train_loss": -27.636972427368164, "global_step": 565344, "epoch": 6811} {"train_loss": -27.548181533813477, "global_step": 565345, "epoch": 6811} {"train_loss": -27.936420440673828, "global_step": 565346, "epoch": 6811} {"train_loss": -27.551252365112305, "global_step": 565347, "epoch": 6811} {"train_loss": -27.903030395507812, "global_step": 565348, "epoch": 6811} {"train_loss": -28.084348678588867, "global_step": 565349, "epoch": 6811} {"train_loss": -27.753385543823242, "global_step": 565350, "epoch": 6811} {"train_loss": -27.72981834411621, "global_step": 565351, "epoch": 6811} {"train_loss": -27.483535766601562, "global_step": 565352, "epoch": 6811} {"train_loss": -28.105152130126953, "global_step": 565353, "epoch": 6811} {"train_loss": -27.74567985534668, "global_step": 565354, "epoch": 6811} {"train_loss": -27.997089385986328, "global_step": 565355, "epoch": 6811} {"train_loss": -27.839324951171875, "global_step": 565356, "epoch": 6811} {"train_loss": -27.91253662109375, "global_step": 565357, "epoch": 6811} {"train_loss": -28.167943954467773, "global_step": 565358, "epoch": 6811} {"train_loss": -28.094579696655273, "global_step": 565359, "epoch": 6811} {"train_loss": -28.036359786987305, "global_step": 565360, "epoch": 6811} {"train_loss": -28.092517852783203, "global_step": 565361, "epoch": 6811} {"train_loss": -28.198108673095703, "global_step": 565362, "epoch": 6811} {"train_loss": -28.253833770751953, "global_step": 565363, "epoch": 6811} {"train_loss": -28.14906120300293, "global_step": 565364, "epoch": 6811} {"train_loss": -28.009918212890625, "global_step": 565365, "epoch": 6811} {"train_loss": -27.721296310424805, "global_step": 565366, "epoch": 6811} {"train_loss": -28.023473739624023, "global_step": 565367, "epoch": 6811} {"train_loss": -28.055402755737305, "global_step": 565368, "epoch": 6811} {"train_loss": -28.08660888671875, "global_step": 565369, "epoch": 6811} {"train_loss": -28.14202308654785, "global_step": 565370, "epoch": 6811} {"train_loss": -28.03156852722168, "global_step": 565371, "epoch": 6811} {"train_loss": -27.8828182220459, "global_step": 565372, "epoch": 6811} {"train_loss": -27.962631225585938, "global_step": 565373, "epoch": 6811} {"train_loss": -28.028079986572266, "global_step": 565374, "epoch": 6811} {"train_loss": -28.35343360900879, "global_step": 565375, "epoch": 6811} {"train_loss": -28.185033798217773, "global_step": 565376, "epoch": 6811} {"train_loss": -28.293989181518555, "global_step": 565377, "epoch": 6811} {"train_loss": -28.064594268798828, "global_step": 565378, "epoch": 6811} {"train_loss": -28.01495933532715, "global_step": 565379, "epoch": 6811} {"train_loss": -27.780567169189453, "global_step": 565380, "epoch": 6811} {"train_loss": -27.607471466064453, "global_step": 565381, "epoch": 6811} {"train_loss": -27.462142944335938, "global_step": 565382, "epoch": 6811} {"train_loss": -27.664091110229492, "global_step": 565383, "epoch": 6811} {"train_loss": -27.319990158081055, "global_step": 565384, "epoch": 6811} {"train_loss": -27.80915641784668, "global_step": 565385, "epoch": 6811} {"train_loss": -27.547683715820312, "global_step": 565386, "epoch": 6811} {"train_loss": -26.690107345581055, "global_step": 565387, "epoch": 6811} {"train_loss": -27.081298828125, "global_step": 565388, "epoch": 6811} {"train_loss": -27.07269287109375, "global_step": 565389, "epoch": 6811} {"train_loss": -27.54302406311035, "global_step": 565390, "epoch": 6811} {"train_loss": -27.14409828186035, "global_step": 565391, "epoch": 6811} {"train_loss": -27.25349235534668, "global_step": 565392, "epoch": 6811} {"train_loss": -27.797103881835938, "global_step": 565393, "epoch": 6811} {"train_loss": -27.3690185546875, "global_step": 565394, "epoch": 6811} {"train_loss": -27.499359130859375, "global_step": 565395, "epoch": 6811, "val_loss": 6656705.5} {"train_loss": -26.329923629760742, "global_step": 565396, "epoch": 6812} {"train_loss": -27.247974395751953, "global_step": 565397, "epoch": 6812} {"train_loss": -27.130294799804688, "global_step": 565398, "epoch": 6812} {"train_loss": -26.151325225830078, "global_step": 565399, "epoch": 6812} {"train_loss": -27.20517921447754, "global_step": 565400, "epoch": 6812} {"train_loss": -26.54728126525879, "global_step": 565401, "epoch": 6812} {"train_loss": -27.10097312927246, "global_step": 565402, "epoch": 6812} {"train_loss": -26.75800895690918, "global_step": 565403, "epoch": 6812} {"train_loss": -27.061487197875977, "global_step": 565404, "epoch": 6812} {"train_loss": -27.05926513671875, "global_step": 565405, "epoch": 6812} {"train_loss": -26.784040451049805, "global_step": 565406, "epoch": 6812} {"train_loss": -27.002185821533203, "global_step": 565407, "epoch": 6812} {"train_loss": -26.641845703125, "global_step": 565408, "epoch": 6812} {"train_loss": -27.442264556884766, "global_step": 565409, "epoch": 6812} {"train_loss": -27.124555587768555, "global_step": 565410, "epoch": 6812} {"train_loss": -27.369586944580078, "global_step": 565411, "epoch": 6812} {"train_loss": -27.232879638671875, "global_step": 565412, "epoch": 6812} {"train_loss": -27.417098999023438, "global_step": 565413, "epoch": 6812} {"train_loss": -27.333881378173828, "global_step": 565414, "epoch": 6812} {"train_loss": -27.286828994750977, "global_step": 565415, "epoch": 6812} {"train_loss": -27.466690063476562, "global_step": 565416, "epoch": 6812} {"train_loss": -27.259145736694336, "global_step": 565417, "epoch": 6812} {"train_loss": -27.295398712158203, "global_step": 565418, "epoch": 6812} {"train_loss": -27.261877059936523, "global_step": 565419, "epoch": 6812} {"train_loss": -27.169940948486328, "global_step": 565420, "epoch": 6812} {"train_loss": -27.71258544921875, "global_step": 565421, "epoch": 6812} {"train_loss": -27.424570083618164, "global_step": 565422, "epoch": 6812} {"train_loss": -27.567106246948242, "global_step": 565423, "epoch": 6812} {"train_loss": -27.355688095092773, "global_step": 565424, "epoch": 6812} {"train_loss": -27.53921890258789, "global_step": 565425, "epoch": 6812} {"train_loss": -27.764062881469727, "global_step": 565426, "epoch": 6812} {"train_loss": -27.603713989257812, "global_step": 565427, "epoch": 6812} {"train_loss": -27.85413932800293, "global_step": 565428, "epoch": 6812} {"train_loss": -27.978229522705078, "global_step": 565429, "epoch": 6812} {"train_loss": -27.748321533203125, "global_step": 565430, "epoch": 6812} {"train_loss": -28.045490264892578, "global_step": 565431, "epoch": 6812} {"train_loss": -27.860578536987305, "global_step": 565432, "epoch": 6812} {"train_loss": -27.738821029663086, "global_step": 565433, "epoch": 6812} {"train_loss": -27.73219871520996, "global_step": 565434, "epoch": 6812} {"train_loss": -27.777729034423828, "global_step": 565435, "epoch": 6812} {"train_loss": -27.604068756103516, "global_step": 565436, "epoch": 6812} {"train_loss": -28.067060470581055, "global_step": 565437, "epoch": 6812} {"train_loss": -27.823591232299805, "global_step": 565438, "epoch": 6812} {"train_loss": -28.16800308227539, "global_step": 565439, "epoch": 6812} {"train_loss": -28.017789840698242, "global_step": 565440, "epoch": 6812} {"train_loss": -28.325483322143555, "global_step": 565441, "epoch": 6812} {"train_loss": -27.6737060546875, "global_step": 565442, "epoch": 6812} {"train_loss": -28.346349716186523, "global_step": 565443, "epoch": 6812} {"train_loss": -27.7667293548584, "global_step": 565444, "epoch": 6812} {"train_loss": -28.033166885375977, "global_step": 565445, "epoch": 6812} {"train_loss": -28.084735870361328, "global_step": 565446, "epoch": 6812} {"train_loss": -28.3355770111084, "global_step": 565447, "epoch": 6812} {"train_loss": -28.527973175048828, "global_step": 565448, "epoch": 6812} {"train_loss": -28.036291122436523, "global_step": 565449, "epoch": 6812} {"train_loss": -27.782819747924805, "global_step": 565450, "epoch": 6812} {"train_loss": -27.97589111328125, "global_step": 565451, "epoch": 6812} {"train_loss": -27.34052848815918, "global_step": 565452, "epoch": 6812} {"train_loss": -27.88528823852539, "global_step": 565453, "epoch": 6812} {"train_loss": -28.3132266998291, "global_step": 565454, "epoch": 6812} {"train_loss": -28.039213180541992, "global_step": 565455, "epoch": 6812} {"train_loss": -28.073749542236328, "global_step": 565456, "epoch": 6812} {"train_loss": -27.625089645385742, "global_step": 565457, "epoch": 6812} {"train_loss": -27.680578231811523, "global_step": 565458, "epoch": 6812} {"train_loss": -28.058887481689453, "global_step": 565459, "epoch": 6812} {"train_loss": -27.768421173095703, "global_step": 565460, "epoch": 6812} {"train_loss": -27.795133590698242, "global_step": 565461, "epoch": 6812} {"train_loss": -27.491806030273438, "global_step": 565462, "epoch": 6812} {"train_loss": -28.092710494995117, "global_step": 565463, "epoch": 6812} {"train_loss": -27.7463321685791, "global_step": 565464, "epoch": 6812} {"train_loss": -27.586029052734375, "global_step": 565465, "epoch": 6812} {"train_loss": -27.790027618408203, "global_step": 565466, "epoch": 6812} {"train_loss": -27.8516845703125, "global_step": 565467, "epoch": 6812} {"train_loss": -27.848844528198242, "global_step": 565468, "epoch": 6812} {"train_loss": -27.6749210357666, "global_step": 565469, "epoch": 6812} {"train_loss": -27.670333862304688, "global_step": 565470, "epoch": 6812} {"train_loss": -28.09754753112793, "global_step": 565471, "epoch": 6812} {"train_loss": -28.0148868560791, "global_step": 565472, "epoch": 6812} {"train_loss": -27.986291885375977, "global_step": 565473, "epoch": 6812} {"train_loss": -27.912860870361328, "global_step": 565474, "epoch": 6812} {"train_loss": -28.006031036376953, "global_step": 565475, "epoch": 6812} {"train_loss": -28.061750411987305, "global_step": 565476, "epoch": 6812} {"train_loss": -27.785863876342773, "global_step": 565477, "epoch": 6812} {"train_loss": -27.62209248830037, "global_step": 565478, "epoch": 6812, "val_loss": 6624841.5} {"train_loss": -26.424325942993164, "global_step": 565479, "epoch": 6813} {"train_loss": -24.914976119995117, "global_step": 565480, "epoch": 6813} {"train_loss": -25.82099723815918, "global_step": 565481, "epoch": 6813} {"train_loss": -27.20160484313965, "global_step": 565482, "epoch": 6813} {"train_loss": -25.968902587890625, "global_step": 565483, "epoch": 6813} {"train_loss": -27.252466201782227, "global_step": 565484, "epoch": 6813} {"train_loss": -26.753082275390625, "global_step": 565485, "epoch": 6813} {"train_loss": -26.979663848876953, "global_step": 565486, "epoch": 6813} {"train_loss": -27.052778244018555, "global_step": 565487, "epoch": 6813} {"train_loss": -27.27888298034668, "global_step": 565488, "epoch": 6813} {"train_loss": -26.836669921875, "global_step": 565489, "epoch": 6813} {"train_loss": -27.205785751342773, "global_step": 565490, "epoch": 6813} {"train_loss": -27.190155029296875, "global_step": 565491, "epoch": 6813} {"train_loss": -27.277606964111328, "global_step": 565492, "epoch": 6813} {"train_loss": -26.919025421142578, "global_step": 565493, "epoch": 6813} {"train_loss": -27.416227340698242, "global_step": 565494, "epoch": 6813} {"train_loss": -27.023340225219727, "global_step": 565495, "epoch": 6813} {"train_loss": -27.2523193359375, "global_step": 565496, "epoch": 6813} {"train_loss": -27.170007705688477, "global_step": 565497, "epoch": 6813} {"train_loss": -26.8707275390625, "global_step": 565498, "epoch": 6813} {"train_loss": -27.17042350769043, "global_step": 565499, "epoch": 6813} {"train_loss": -27.31438636779785, "global_step": 565500, "epoch": 6813} {"train_loss": -27.334680557250977, "global_step": 565501, "epoch": 6813} {"train_loss": -27.50644874572754, "global_step": 565502, "epoch": 6813} {"train_loss": -27.198450088500977, "global_step": 565503, "epoch": 6813} {"train_loss": -27.228540420532227, "global_step": 565504, "epoch": 6813} {"train_loss": -27.4392032623291, "global_step": 565505, "epoch": 6813} {"train_loss": -27.610071182250977, "global_step": 565506, "epoch": 6813} {"train_loss": -27.472949981689453, "global_step": 565507, "epoch": 6813} {"train_loss": -27.431501388549805, "global_step": 565508, "epoch": 6813} {"train_loss": -27.758153915405273, "global_step": 565509, "epoch": 6813} {"train_loss": -27.294357299804688, "global_step": 565510, "epoch": 6813} {"train_loss": -28.024463653564453, "global_step": 565511, "epoch": 6813} {"train_loss": -27.704248428344727, "global_step": 565512, "epoch": 6813} {"train_loss": -27.465576171875, "global_step": 565513, "epoch": 6813} {"train_loss": -27.606489181518555, "global_step": 565514, "epoch": 6813} {"train_loss": -27.4792537689209, "global_step": 565515, "epoch": 6813} {"train_loss": -27.597126007080078, "global_step": 565516, "epoch": 6813} {"train_loss": -27.789907455444336, "global_step": 565517, "epoch": 6813} {"train_loss": -27.829959869384766, "global_step": 565518, "epoch": 6813} {"train_loss": -27.84149169921875, "global_step": 565519, "epoch": 6813} {"train_loss": -27.871225357055664, "global_step": 565520, "epoch": 6813} {"train_loss": -28.044422149658203, "global_step": 565521, "epoch": 6813} {"train_loss": -27.645971298217773, "global_step": 565522, "epoch": 6813} {"train_loss": -27.770116806030273, "global_step": 565523, "epoch": 6813} {"train_loss": -27.879499435424805, "global_step": 565524, "epoch": 6813} {"train_loss": -27.951797485351562, "global_step": 565525, "epoch": 6813} {"train_loss": -27.90006446838379, "global_step": 565526, "epoch": 6813} {"train_loss": -27.8607234954834, "global_step": 565527, "epoch": 6813} {"train_loss": -27.774768829345703, "global_step": 565528, "epoch": 6813} {"train_loss": -28.116668701171875, "global_step": 565529, "epoch": 6813} {"train_loss": -27.840864181518555, "global_step": 565530, "epoch": 6813} {"train_loss": -28.044116973876953, "global_step": 565531, "epoch": 6813} {"train_loss": -27.7477970123291, "global_step": 565532, "epoch": 6813} {"train_loss": -27.998565673828125, "global_step": 565533, "epoch": 6813} {"train_loss": -28.14950942993164, "global_step": 565534, "epoch": 6813} {"train_loss": -28.121826171875, "global_step": 565535, "epoch": 6813} {"train_loss": -28.120298385620117, "global_step": 565536, "epoch": 6813} {"train_loss": -28.070148468017578, "global_step": 565537, "epoch": 6813} {"train_loss": -28.265974044799805, "global_step": 565538, "epoch": 6813} {"train_loss": -27.94768714904785, "global_step": 565539, "epoch": 6813} {"train_loss": -28.216806411743164, "global_step": 565540, "epoch": 6813} {"train_loss": -28.194265365600586, "global_step": 565541, "epoch": 6813} {"train_loss": -28.30088233947754, "global_step": 565542, "epoch": 6813} {"train_loss": -27.875213623046875, "global_step": 565543, "epoch": 6813} {"train_loss": -27.96668815612793, "global_step": 565544, "epoch": 6813} {"train_loss": -27.85976219177246, "global_step": 565545, "epoch": 6813} {"train_loss": -27.51792335510254, "global_step": 565546, "epoch": 6813} {"train_loss": -27.040817260742188, "global_step": 565547, "epoch": 6813} {"train_loss": -25.43916130065918, "global_step": 565548, "epoch": 6813} {"train_loss": -25.489248275756836, "global_step": 565549, "epoch": 6813} {"train_loss": -27.14361000061035, "global_step": 565550, "epoch": 6813} {"train_loss": -27.33977699279785, "global_step": 565551, "epoch": 6813} {"train_loss": -26.763574600219727, "global_step": 565552, "epoch": 6813} {"train_loss": -26.55962562561035, "global_step": 565553, "epoch": 6813} {"train_loss": -27.382080078125, "global_step": 565554, "epoch": 6813} {"train_loss": -27.23114013671875, "global_step": 565555, "epoch": 6813} {"train_loss": -26.80850601196289, "global_step": 565556, "epoch": 6813} {"train_loss": -27.137481689453125, "global_step": 565557, "epoch": 6813} {"train_loss": -27.278553009033203, "global_step": 565558, "epoch": 6813} {"train_loss": -27.188989639282227, "global_step": 565559, "epoch": 6813} {"train_loss": -27.800628662109375, "global_step": 565560, "epoch": 6813} {"train_loss": -27.389022045824902, "global_step": 565561, "epoch": 6813, "val_loss": 6611732.0} {"train_loss": -27.056324005126953, "global_step": 565562, "epoch": 6814} {"train_loss": -27.2996768951416, "global_step": 565563, "epoch": 6814} {"train_loss": -26.889789581298828, "global_step": 565564, "epoch": 6814} {"train_loss": -27.18292808532715, "global_step": 565565, "epoch": 6814} {"train_loss": -27.352497100830078, "global_step": 565566, "epoch": 6814} {"train_loss": -27.233917236328125, "global_step": 565567, "epoch": 6814} {"train_loss": -27.084848403930664, "global_step": 565568, "epoch": 6814} {"train_loss": -27.24318504333496, "global_step": 565569, "epoch": 6814} {"train_loss": -27.255102157592773, "global_step": 565570, "epoch": 6814} {"train_loss": -27.36077308654785, "global_step": 565571, "epoch": 6814} {"train_loss": -27.49550437927246, "global_step": 565572, "epoch": 6814} {"train_loss": -27.499731063842773, "global_step": 565573, "epoch": 6814} {"train_loss": -27.400146484375, "global_step": 565574, "epoch": 6814} {"train_loss": -27.336904525756836, "global_step": 565575, "epoch": 6814} {"train_loss": -27.6453800201416, "global_step": 565576, "epoch": 6814} {"train_loss": -27.45881462097168, "global_step": 565577, "epoch": 6814} {"train_loss": -27.645843505859375, "global_step": 565578, "epoch": 6814} {"train_loss": -27.6339111328125, "global_step": 565579, "epoch": 6814} {"train_loss": -27.728845596313477, "global_step": 565580, "epoch": 6814} {"train_loss": -27.38525390625, "global_step": 565581, "epoch": 6814} {"train_loss": -27.536413192749023, "global_step": 565582, "epoch": 6814} {"train_loss": -27.675745010375977, "global_step": 565583, "epoch": 6814} {"train_loss": -27.7435245513916, "global_step": 565584, "epoch": 6814} {"train_loss": -27.886581420898438, "global_step": 565585, "epoch": 6814} {"train_loss": -27.763690948486328, "global_step": 565586, "epoch": 6814} {"train_loss": -27.91375732421875, "global_step": 565587, "epoch": 6814} {"train_loss": -27.592243194580078, "global_step": 565588, "epoch": 6814} {"train_loss": -27.92915153503418, "global_step": 565589, "epoch": 6814} {"train_loss": -27.82288932800293, "global_step": 565590, "epoch": 6814} {"train_loss": -27.873249053955078, "global_step": 565591, "epoch": 6814} {"train_loss": -27.728031158447266, "global_step": 565592, "epoch": 6814} {"train_loss": -27.820234298706055, "global_step": 565593, "epoch": 6814} {"train_loss": -27.630035400390625, "global_step": 565594, "epoch": 6814} {"train_loss": -28.053701400756836, "global_step": 565595, "epoch": 6814} {"train_loss": -27.701330184936523, "global_step": 565596, "epoch": 6814} {"train_loss": -27.64393424987793, "global_step": 565597, "epoch": 6814} {"train_loss": -27.97127342224121, "global_step": 565598, "epoch": 6814} {"train_loss": -28.31104850769043, "global_step": 565599, "epoch": 6814} {"train_loss": -27.61787223815918, "global_step": 565600, "epoch": 6814} {"train_loss": -27.811811447143555, "global_step": 565601, "epoch": 6814} {"train_loss": -27.94211196899414, "global_step": 565602, "epoch": 6814} {"train_loss": -28.128711700439453, "global_step": 565603, "epoch": 6814} {"train_loss": -27.881338119506836, "global_step": 565604, "epoch": 6814} {"train_loss": -27.790830612182617, "global_step": 565605, "epoch": 6814} {"train_loss": -27.87021827697754, "global_step": 565606, "epoch": 6814} {"train_loss": -28.189605712890625, "global_step": 565607, "epoch": 6814} {"train_loss": -27.99995994567871, "global_step": 565608, "epoch": 6814} {"train_loss": -28.168853759765625, "global_step": 565609, "epoch": 6814} {"train_loss": -27.93629264831543, "global_step": 565610, "epoch": 6814} {"train_loss": -27.776342391967773, "global_step": 565611, "epoch": 6814} {"train_loss": -27.9674129486084, "global_step": 565612, "epoch": 6814} {"train_loss": -28.600019454956055, "global_step": 565613, "epoch": 6814} {"train_loss": -27.94825553894043, "global_step": 565614, "epoch": 6814} {"train_loss": -28.16666603088379, "global_step": 565615, "epoch": 6814} {"train_loss": -28.044031143188477, "global_step": 565616, "epoch": 6814} {"train_loss": -27.93206214904785, "global_step": 565617, "epoch": 6814} {"train_loss": -28.213422775268555, "global_step": 565618, "epoch": 6814} {"train_loss": -28.1160831451416, "global_step": 565619, "epoch": 6814} {"train_loss": -28.247119903564453, "global_step": 565620, "epoch": 6814} {"train_loss": -28.0223445892334, "global_step": 565621, "epoch": 6814} {"train_loss": -28.040674209594727, "global_step": 565622, "epoch": 6814} {"train_loss": -27.776777267456055, "global_step": 565623, "epoch": 6814} {"train_loss": -27.576398849487305, "global_step": 565624, "epoch": 6814} {"train_loss": -27.41779899597168, "global_step": 565625, "epoch": 6814} {"train_loss": -27.9240779876709, "global_step": 565626, "epoch": 6814} {"train_loss": -28.0069637298584, "global_step": 565627, "epoch": 6814} {"train_loss": -27.7890682220459, "global_step": 565628, "epoch": 6814} {"train_loss": -27.418867111206055, "global_step": 565629, "epoch": 6814} {"train_loss": -27.83371353149414, "global_step": 565630, "epoch": 6814} {"train_loss": -27.545032501220703, "global_step": 565631, "epoch": 6814} {"train_loss": -27.85062026977539, "global_step": 565632, "epoch": 6814} {"train_loss": -27.7518310546875, "global_step": 565633, "epoch": 6814} {"train_loss": -28.249195098876953, "global_step": 565634, "epoch": 6814} {"train_loss": -27.399124145507812, "global_step": 565635, "epoch": 6814} {"train_loss": -27.6484432220459, "global_step": 565636, "epoch": 6814} {"train_loss": -27.216053009033203, "global_step": 565637, "epoch": 6814} {"train_loss": -27.138044357299805, "global_step": 565638, "epoch": 6814} {"train_loss": -27.44538688659668, "global_step": 565639, "epoch": 6814} {"train_loss": -27.928537368774414, "global_step": 565640, "epoch": 6814} {"train_loss": -27.6131591796875, "global_step": 565641, "epoch": 6814} {"train_loss": -27.781009674072266, "global_step": 565642, "epoch": 6814} {"train_loss": -27.97031593322754, "global_step": 565643, "epoch": 6814} {"train_loss": -27.737427240394684, "global_step": 565644, "epoch": 6814, "val_loss": 6611500.0} {"train_loss": -27.267139434814453, "global_step": 565645, "epoch": 6815} {"train_loss": -26.631397247314453, "global_step": 565646, "epoch": 6815} {"train_loss": -27.060504913330078, "global_step": 565647, "epoch": 6815} {"train_loss": -26.70411491394043, "global_step": 565648, "epoch": 6815} {"train_loss": -27.364612579345703, "global_step": 565649, "epoch": 6815} {"train_loss": -26.991214752197266, "global_step": 565650, "epoch": 6815} {"train_loss": -26.88624382019043, "global_step": 565651, "epoch": 6815} {"train_loss": -27.340167999267578, "global_step": 565652, "epoch": 6815} {"train_loss": -27.487213134765625, "global_step": 565653, "epoch": 6815} {"train_loss": -27.04983901977539, "global_step": 565654, "epoch": 6815} {"train_loss": -27.44046974182129, "global_step": 565655, "epoch": 6815} {"train_loss": -27.29926109313965, "global_step": 565656, "epoch": 6815} {"train_loss": -27.808441162109375, "global_step": 565657, "epoch": 6815} {"train_loss": -27.4316463470459, "global_step": 565658, "epoch": 6815} {"train_loss": -27.3115234375, "global_step": 565659, "epoch": 6815} {"train_loss": -27.349628448486328, "global_step": 565660, "epoch": 6815} {"train_loss": -27.93137550354004, "global_step": 565661, "epoch": 6815} {"train_loss": -27.7734317779541, "global_step": 565662, "epoch": 6815} {"train_loss": -27.844995498657227, "global_step": 565663, "epoch": 6815} {"train_loss": -27.805206298828125, "global_step": 565664, "epoch": 6815} {"train_loss": -27.209949493408203, "global_step": 565665, "epoch": 6815} {"train_loss": -27.861417770385742, "global_step": 565666, "epoch": 6815} {"train_loss": -27.999563217163086, "global_step": 565667, "epoch": 6815} {"train_loss": -27.77168083190918, "global_step": 565668, "epoch": 6815} {"train_loss": -27.54486083984375, "global_step": 565669, "epoch": 6815} {"train_loss": -27.909046173095703, "global_step": 565670, "epoch": 6815} {"train_loss": -27.415796279907227, "global_step": 565671, "epoch": 6815} {"train_loss": -27.875593185424805, "global_step": 565672, "epoch": 6815} {"train_loss": -27.80877685546875, "global_step": 565673, "epoch": 6815} {"train_loss": -27.80759048461914, "global_step": 565674, "epoch": 6815} {"train_loss": -27.872907638549805, "global_step": 565675, "epoch": 6815} {"train_loss": -27.61282730102539, "global_step": 565676, "epoch": 6815} {"train_loss": -28.18135643005371, "global_step": 565677, "epoch": 6815} {"train_loss": -27.747888565063477, "global_step": 565678, "epoch": 6815} {"train_loss": -27.82415771484375, "global_step": 565679, "epoch": 6815} {"train_loss": -27.943052291870117, "global_step": 565680, "epoch": 6815} {"train_loss": -27.987646102905273, "global_step": 565681, "epoch": 6815} {"train_loss": -28.1444149017334, "global_step": 565682, "epoch": 6815} {"train_loss": -27.97239112854004, "global_step": 565683, "epoch": 6815} {"train_loss": -28.13327407836914, "global_step": 565684, "epoch": 6815} {"train_loss": -28.15656852722168, "global_step": 565685, "epoch": 6815} {"train_loss": -28.325613021850586, "global_step": 565686, "epoch": 6815} {"train_loss": -28.051666259765625, "global_step": 565687, "epoch": 6815} {"train_loss": -28.091461181640625, "global_step": 565688, "epoch": 6815} {"train_loss": -28.09260368347168, "global_step": 565689, "epoch": 6815} {"train_loss": -28.01173210144043, "global_step": 565690, "epoch": 6815} {"train_loss": -27.888214111328125, "global_step": 565691, "epoch": 6815} {"train_loss": -28.24775505065918, "global_step": 565692, "epoch": 6815} {"train_loss": -28.123579025268555, "global_step": 565693, "epoch": 6815} {"train_loss": -27.960538864135742, "global_step": 565694, "epoch": 6815} {"train_loss": -27.82282829284668, "global_step": 565695, "epoch": 6815} {"train_loss": -27.59712028503418, "global_step": 565696, "epoch": 6815} {"train_loss": -27.991397857666016, "global_step": 565697, "epoch": 6815} {"train_loss": -27.832300186157227, "global_step": 565698, "epoch": 6815} {"train_loss": -27.7349910736084, "global_step": 565699, "epoch": 6815} {"train_loss": -27.945804595947266, "global_step": 565700, "epoch": 6815} {"train_loss": -27.57857322692871, "global_step": 565701, "epoch": 6815} {"train_loss": -27.78870964050293, "global_step": 565702, "epoch": 6815} {"train_loss": -27.761266708374023, "global_step": 565703, "epoch": 6815} {"train_loss": -28.03485107421875, "global_step": 565704, "epoch": 6815} {"train_loss": -28.175275802612305, "global_step": 565705, "epoch": 6815} {"train_loss": -28.179365158081055, "global_step": 565706, "epoch": 6815} {"train_loss": -28.23641014099121, "global_step": 565707, "epoch": 6815} {"train_loss": -28.239444732666016, "global_step": 565708, "epoch": 6815} {"train_loss": -27.887882232666016, "global_step": 565709, "epoch": 6815} {"train_loss": -27.792448043823242, "global_step": 565710, "epoch": 6815} {"train_loss": -28.08396339416504, "global_step": 565711, "epoch": 6815} {"train_loss": -27.427078247070312, "global_step": 565712, "epoch": 6815} {"train_loss": -27.217443466186523, "global_step": 565713, "epoch": 6815} {"train_loss": -27.02292823791504, "global_step": 565714, "epoch": 6815} {"train_loss": -27.682376861572266, "global_step": 565715, "epoch": 6815} {"train_loss": -27.60028076171875, "global_step": 565716, "epoch": 6815} {"train_loss": -27.706562042236328, "global_step": 565717, "epoch": 6815} {"train_loss": -27.83772087097168, "global_step": 565718, "epoch": 6815} {"train_loss": -27.5938777923584, "global_step": 565719, "epoch": 6815} {"train_loss": -27.708837509155273, "global_step": 565720, "epoch": 6815} {"train_loss": -27.69556999206543, "global_step": 565721, "epoch": 6815} {"train_loss": -27.851551055908203, "global_step": 565722, "epoch": 6815} {"train_loss": -27.90386390686035, "global_step": 565723, "epoch": 6815} {"train_loss": -27.919706344604492, "global_step": 565724, "epoch": 6815} {"train_loss": -27.995574951171875, "global_step": 565725, "epoch": 6815} {"train_loss": -28.134552001953125, "global_step": 565726, "epoch": 6815} {"train_loss": -27.73939840477633, "global_step": 565727, "epoch": 6815, "val_loss": 6585703.0} {"train_loss": -27.168354034423828, "global_step": 565728, "epoch": 6816} {"train_loss": -27.277368545532227, "global_step": 565729, "epoch": 6816} {"train_loss": -27.237430572509766, "global_step": 565730, "epoch": 6816} {"train_loss": -27.570602416992188, "global_step": 565731, "epoch": 6816} {"train_loss": -26.86094093322754, "global_step": 565732, "epoch": 6816} {"train_loss": -27.55877685546875, "global_step": 565733, "epoch": 6816} {"train_loss": -26.6943359375, "global_step": 565734, "epoch": 6816} {"train_loss": -27.573705673217773, "global_step": 565735, "epoch": 6816} {"train_loss": -27.34694480895996, "global_step": 565736, "epoch": 6816} {"train_loss": -27.48647117614746, "global_step": 565737, "epoch": 6816} {"train_loss": -27.383838653564453, "global_step": 565738, "epoch": 6816} {"train_loss": -27.519983291625977, "global_step": 565739, "epoch": 6816} {"train_loss": -27.42486572265625, "global_step": 565740, "epoch": 6816} {"train_loss": -27.554285049438477, "global_step": 565741, "epoch": 6816} {"train_loss": -27.5009708404541, "global_step": 565742, "epoch": 6816} {"train_loss": -27.515125274658203, "global_step": 565743, "epoch": 6816} {"train_loss": -27.365903854370117, "global_step": 565744, "epoch": 6816} {"train_loss": -27.57740592956543, "global_step": 565745, "epoch": 6816} {"train_loss": -27.2558536529541, "global_step": 565746, "epoch": 6816} {"train_loss": -27.257410049438477, "global_step": 565747, "epoch": 6816} {"train_loss": -27.725584030151367, "global_step": 565748, "epoch": 6816} {"train_loss": -27.421045303344727, "global_step": 565749, "epoch": 6816} {"train_loss": -27.559396743774414, "global_step": 565750, "epoch": 6816} {"train_loss": -27.410907745361328, "global_step": 565751, "epoch": 6816} {"train_loss": -27.559377670288086, "global_step": 565752, "epoch": 6816} {"train_loss": -27.707584381103516, "global_step": 565753, "epoch": 6816} {"train_loss": -28.047409057617188, "global_step": 565754, "epoch": 6816} {"train_loss": -27.88870620727539, "global_step": 565755, "epoch": 6816} {"train_loss": -27.3939151763916, "global_step": 565756, "epoch": 6816} {"train_loss": -27.944183349609375, "global_step": 565757, "epoch": 6816} {"train_loss": -27.768741607666016, "global_step": 565758, "epoch": 6816} {"train_loss": -27.733646392822266, "global_step": 565759, "epoch": 6816} {"train_loss": -27.80946159362793, "global_step": 565760, "epoch": 6816} {"train_loss": -27.876693725585938, "global_step": 565761, "epoch": 6816} {"train_loss": -27.927839279174805, "global_step": 565762, "epoch": 6816} {"train_loss": -27.996597290039062, "global_step": 565763, "epoch": 6816} {"train_loss": -28.039289474487305, "global_step": 565764, "epoch": 6816} {"train_loss": -27.803070068359375, "global_step": 565765, "epoch": 6816} {"train_loss": -27.434186935424805, "global_step": 565766, "epoch": 6816} {"train_loss": -27.312286376953125, "global_step": 565767, "epoch": 6816} {"train_loss": -27.53070640563965, "global_step": 565768, "epoch": 6816} {"train_loss": -27.80576515197754, "global_step": 565769, "epoch": 6816} {"train_loss": -27.9796142578125, "global_step": 565770, "epoch": 6816} {"train_loss": -28.023609161376953, "global_step": 565771, "epoch": 6816} {"train_loss": -28.062042236328125, "global_step": 565772, "epoch": 6816} {"train_loss": -27.681650161743164, "global_step": 565773, "epoch": 6816} {"train_loss": -28.181415557861328, "global_step": 565774, "epoch": 6816} {"train_loss": -27.769071578979492, "global_step": 565775, "epoch": 6816} {"train_loss": -28.028778076171875, "global_step": 565776, "epoch": 6816} {"train_loss": -27.55414390563965, "global_step": 565777, "epoch": 6816} {"train_loss": -28.134841918945312, "global_step": 565778, "epoch": 6816} {"train_loss": -28.099599838256836, "global_step": 565779, "epoch": 6816} {"train_loss": -27.872095108032227, "global_step": 565780, "epoch": 6816} {"train_loss": -27.820209503173828, "global_step": 565781, "epoch": 6816} {"train_loss": -27.652667999267578, "global_step": 565782, "epoch": 6816} {"train_loss": -27.956069946289062, "global_step": 565783, "epoch": 6816} {"train_loss": -28.18556785583496, "global_step": 565784, "epoch": 6816} {"train_loss": -27.940982818603516, "global_step": 565785, "epoch": 6816} {"train_loss": -27.933368682861328, "global_step": 565786, "epoch": 6816} {"train_loss": -27.938800811767578, "global_step": 565787, "epoch": 6816} {"train_loss": -28.329116821289062, "global_step": 565788, "epoch": 6816} {"train_loss": -27.840805053710938, "global_step": 565789, "epoch": 6816} {"train_loss": -28.153966903686523, "global_step": 565790, "epoch": 6816} {"train_loss": -27.688247680664062, "global_step": 565791, "epoch": 6816} {"train_loss": -27.66853904724121, "global_step": 565792, "epoch": 6816} {"train_loss": -27.35175895690918, "global_step": 565793, "epoch": 6816} {"train_loss": -26.96441078186035, "global_step": 565794, "epoch": 6816} {"train_loss": -27.271961212158203, "global_step": 565795, "epoch": 6816} {"train_loss": -27.282764434814453, "global_step": 565796, "epoch": 6816} {"train_loss": -28.225360870361328, "global_step": 565797, "epoch": 6816} {"train_loss": -27.7451114654541, "global_step": 565798, "epoch": 6816} {"train_loss": -27.64027214050293, "global_step": 565799, "epoch": 6816} {"train_loss": -27.694311141967773, "global_step": 565800, "epoch": 6816} {"train_loss": -28.158273696899414, "global_step": 565801, "epoch": 6816} {"train_loss": -27.782608032226562, "global_step": 565802, "epoch": 6816} {"train_loss": -28.06556510925293, "global_step": 565803, "epoch": 6816} {"train_loss": -28.0677547454834, "global_step": 565804, "epoch": 6816} {"train_loss": -27.84034538269043, "global_step": 565805, "epoch": 6816} {"train_loss": -28.046768188476562, "global_step": 565806, "epoch": 6816} {"train_loss": -27.75452995300293, "global_step": 565807, "epoch": 6816} {"train_loss": -27.896066665649414, "global_step": 565808, "epoch": 6816} {"train_loss": -28.079864501953125, "global_step": 565809, "epoch": 6816} {"train_loss": -27.695383485541285, "global_step": 565810, "epoch": 6816, "val_loss": 6708985.0} {"train_loss": -27.07389259338379, "global_step": 565811, "epoch": 6817} {"train_loss": -27.424142837524414, "global_step": 565812, "epoch": 6817} {"train_loss": -26.859540939331055, "global_step": 565813, "epoch": 6817} {"train_loss": -27.40216636657715, "global_step": 565814, "epoch": 6817} {"train_loss": -26.859434127807617, "global_step": 565815, "epoch": 6817} {"train_loss": -27.29998779296875, "global_step": 565816, "epoch": 6817} {"train_loss": -27.335309982299805, "global_step": 565817, "epoch": 6817} {"train_loss": -26.871496200561523, "global_step": 565818, "epoch": 6817} {"train_loss": -27.593414306640625, "global_step": 565819, "epoch": 6817} {"train_loss": -27.22406578063965, "global_step": 565820, "epoch": 6817} {"train_loss": -27.544403076171875, "global_step": 565821, "epoch": 6817} {"train_loss": -27.447208404541016, "global_step": 565822, "epoch": 6817} {"train_loss": -27.52933692932129, "global_step": 565823, "epoch": 6817} {"train_loss": -27.464826583862305, "global_step": 565824, "epoch": 6817} {"train_loss": -27.447010040283203, "global_step": 565825, "epoch": 6817} {"train_loss": -27.381855010986328, "global_step": 565826, "epoch": 6817} {"train_loss": -27.23443031311035, "global_step": 565827, "epoch": 6817} {"train_loss": -27.417236328125, "global_step": 565828, "epoch": 6817} {"train_loss": -27.466474533081055, "global_step": 565829, "epoch": 6817} {"train_loss": -27.60385513305664, "global_step": 565830, "epoch": 6817} {"train_loss": -28.0058536529541, "global_step": 565831, "epoch": 6817} {"train_loss": -27.978796005249023, "global_step": 565832, "epoch": 6817} {"train_loss": -27.893299102783203, "global_step": 565833, "epoch": 6817} {"train_loss": -27.811878204345703, "global_step": 565834, "epoch": 6817} {"train_loss": -27.481800079345703, "global_step": 565835, "epoch": 6817} {"train_loss": -27.77203941345215, "global_step": 565836, "epoch": 6817} {"train_loss": -27.712020874023438, "global_step": 565837, "epoch": 6817} {"train_loss": -27.938312530517578, "global_step": 565838, "epoch": 6817} {"train_loss": -27.58381462097168, "global_step": 565839, "epoch": 6817} {"train_loss": -27.8098087310791, "global_step": 565840, "epoch": 6817} {"train_loss": -27.58636474609375, "global_step": 565841, "epoch": 6817} {"train_loss": -27.60420036315918, "global_step": 565842, "epoch": 6817} {"train_loss": -27.858915328979492, "global_step": 565843, "epoch": 6817} {"train_loss": -27.982397079467773, "global_step": 565844, "epoch": 6817} {"train_loss": -27.798017501831055, "global_step": 565845, "epoch": 6817} {"train_loss": -27.91229248046875, "global_step": 565846, "epoch": 6817} {"train_loss": -28.185855865478516, "global_step": 565847, "epoch": 6817} {"train_loss": -27.938596725463867, "global_step": 565848, "epoch": 6817} {"train_loss": -28.034198760986328, "global_step": 565849, "epoch": 6817} {"train_loss": -27.964956283569336, "global_step": 565850, "epoch": 6817} {"train_loss": -27.8884220123291, "global_step": 565851, "epoch": 6817} {"train_loss": -27.88532829284668, "global_step": 565852, "epoch": 6817} {"train_loss": -27.884275436401367, "global_step": 565853, "epoch": 6817} {"train_loss": -28.083311080932617, "global_step": 565854, "epoch": 6817} {"train_loss": -27.95462417602539, "global_step": 565855, "epoch": 6817} {"train_loss": -28.045236587524414, "global_step": 565856, "epoch": 6817} {"train_loss": -28.07437515258789, "global_step": 565857, "epoch": 6817} {"train_loss": -27.93783950805664, "global_step": 565858, "epoch": 6817} {"train_loss": -28.249372482299805, "global_step": 565859, "epoch": 6817} {"train_loss": -28.353534698486328, "global_step": 565860, "epoch": 6817} {"train_loss": -28.2769832611084, "global_step": 565861, "epoch": 6817} {"train_loss": -28.133825302124023, "global_step": 565862, "epoch": 6817} {"train_loss": -28.12017822265625, "global_step": 565863, "epoch": 6817} {"train_loss": -28.2325382232666, "global_step": 565864, "epoch": 6817} {"train_loss": -27.779315948486328, "global_step": 565865, "epoch": 6817} {"train_loss": -27.78375816345215, "global_step": 565866, "epoch": 6817} {"train_loss": -27.682758331298828, "global_step": 565867, "epoch": 6817} {"train_loss": -27.842609405517578, "global_step": 565868, "epoch": 6817} {"train_loss": -27.135730743408203, "global_step": 565869, "epoch": 6817} {"train_loss": -26.723922729492188, "global_step": 565870, "epoch": 6817} {"train_loss": -26.246129989624023, "global_step": 565871, "epoch": 6817} {"train_loss": -25.53070640563965, "global_step": 565872, "epoch": 6817} {"train_loss": -26.428054809570312, "global_step": 565873, "epoch": 6817} {"train_loss": -27.859027862548828, "global_step": 565874, "epoch": 6817} {"train_loss": -26.34454345703125, "global_step": 565875, "epoch": 6817} {"train_loss": -27.464588165283203, "global_step": 565876, "epoch": 6817} {"train_loss": -26.6943302154541, "global_step": 565877, "epoch": 6817} {"train_loss": -27.6117000579834, "global_step": 565878, "epoch": 6817} {"train_loss": -27.07476806640625, "global_step": 565879, "epoch": 6817} {"train_loss": -27.514728546142578, "global_step": 565880, "epoch": 6817} {"train_loss": -27.634790420532227, "global_step": 565881, "epoch": 6817} {"train_loss": -27.240924835205078, "global_step": 565882, "epoch": 6817} {"train_loss": -27.549732208251953, "global_step": 565883, "epoch": 6817} {"train_loss": -27.464859008789062, "global_step": 565884, "epoch": 6817} {"train_loss": -27.669958114624023, "global_step": 565885, "epoch": 6817} {"train_loss": -27.45038414001465, "global_step": 565886, "epoch": 6817} {"train_loss": -27.874387741088867, "global_step": 565887, "epoch": 6817} {"train_loss": -27.512414932250977, "global_step": 565888, "epoch": 6817} {"train_loss": -27.41078758239746, "global_step": 565889, "epoch": 6817} {"train_loss": -27.48036003112793, "global_step": 565890, "epoch": 6817} {"train_loss": -27.67083740234375, "global_step": 565891, "epoch": 6817} {"train_loss": -27.51041030883789, "global_step": 565892, "epoch": 6817} {"train_loss": -27.577731121017273, "global_step": 565893, "epoch": 6817, "val_loss": 6732905.0} {"train_loss": -27.47260093688965, "global_step": 565894, "epoch": 6818} {"train_loss": -27.771411895751953, "global_step": 565895, "epoch": 6818} {"train_loss": -27.179372787475586, "global_step": 565896, "epoch": 6818} {"train_loss": -27.69938087463379, "global_step": 565897, "epoch": 6818} {"train_loss": -27.399938583374023, "global_step": 565898, "epoch": 6818} {"train_loss": -27.582731246948242, "global_step": 565899, "epoch": 6818} {"train_loss": -27.489688873291016, "global_step": 565900, "epoch": 6818} {"train_loss": -27.1469783782959, "global_step": 565901, "epoch": 6818} {"train_loss": -26.59162712097168, "global_step": 565902, "epoch": 6818} {"train_loss": -26.44189453125, "global_step": 565903, "epoch": 6818} {"train_loss": -27.48390007019043, "global_step": 565904, "epoch": 6818} {"train_loss": -27.2042179107666, "global_step": 565905, "epoch": 6818} {"train_loss": -27.0678768157959, "global_step": 565906, "epoch": 6818} {"train_loss": -27.810089111328125, "global_step": 565907, "epoch": 6818} {"train_loss": -26.977691650390625, "global_step": 565908, "epoch": 6818} {"train_loss": -27.398895263671875, "global_step": 565909, "epoch": 6818} {"train_loss": -27.042829513549805, "global_step": 565910, "epoch": 6818} {"train_loss": -27.222326278686523, "global_step": 565911, "epoch": 6818} {"train_loss": -27.12810707092285, "global_step": 565912, "epoch": 6818} {"train_loss": -27.54741859436035, "global_step": 565913, "epoch": 6818} {"train_loss": -27.309324264526367, "global_step": 565914, "epoch": 6818} {"train_loss": -27.682767868041992, "global_step": 565915, "epoch": 6818} {"train_loss": -27.320898056030273, "global_step": 565916, "epoch": 6818} {"train_loss": -27.724023818969727, "global_step": 565917, "epoch": 6818} {"train_loss": -27.571279525756836, "global_step": 565918, "epoch": 6818} {"train_loss": -27.982349395751953, "global_step": 565919, "epoch": 6818} {"train_loss": -27.84260368347168, "global_step": 565920, "epoch": 6818} {"train_loss": -27.435348510742188, "global_step": 565921, "epoch": 6818} {"train_loss": -27.564956665039062, "global_step": 565922, "epoch": 6818} {"train_loss": -27.439701080322266, "global_step": 565923, "epoch": 6818} {"train_loss": -27.985870361328125, "global_step": 565924, "epoch": 6818} {"train_loss": -27.322906494140625, "global_step": 565925, "epoch": 6818} {"train_loss": -27.984607696533203, "global_step": 565926, "epoch": 6818} {"train_loss": -27.887609481811523, "global_step": 565927, "epoch": 6818} {"train_loss": -27.66383171081543, "global_step": 565928, "epoch": 6818} {"train_loss": -27.81410026550293, "global_step": 565929, "epoch": 6818} {"train_loss": -27.924535751342773, "global_step": 565930, "epoch": 6818} {"train_loss": -27.729450225830078, "global_step": 565931, "epoch": 6818} {"train_loss": -28.066186904907227, "global_step": 565932, "epoch": 6818} {"train_loss": -28.091650009155273, "global_step": 565933, "epoch": 6818} {"train_loss": -27.858020782470703, "global_step": 565934, "epoch": 6818} {"train_loss": -27.94879722595215, "global_step": 565935, "epoch": 6818} {"train_loss": -28.127599716186523, "global_step": 565936, "epoch": 6818} {"train_loss": -28.147735595703125, "global_step": 565937, "epoch": 6818} {"train_loss": -27.82818031311035, "global_step": 565938, "epoch": 6818} {"train_loss": -27.87953758239746, "global_step": 565939, "epoch": 6818} {"train_loss": -27.911319732666016, "global_step": 565940, "epoch": 6818} {"train_loss": -27.940195083618164, "global_step": 565941, "epoch": 6818} {"train_loss": -27.720853805541992, "global_step": 565942, "epoch": 6818} {"train_loss": -27.91701316833496, "global_step": 565943, "epoch": 6818} {"train_loss": -28.16965103149414, "global_step": 565944, "epoch": 6818} {"train_loss": -28.11781883239746, "global_step": 565945, "epoch": 6818} {"train_loss": -27.966455459594727, "global_step": 565946, "epoch": 6818} {"train_loss": -27.697406768798828, "global_step": 565947, "epoch": 6818} {"train_loss": -27.851673126220703, "global_step": 565948, "epoch": 6818} {"train_loss": -28.008825302124023, "global_step": 565949, "epoch": 6818} {"train_loss": -28.334875106811523, "global_step": 565950, "epoch": 6818} {"train_loss": -27.987701416015625, "global_step": 565951, "epoch": 6818} {"train_loss": -28.153940200805664, "global_step": 565952, "epoch": 6818} {"train_loss": -27.837995529174805, "global_step": 565953, "epoch": 6818} {"train_loss": -27.929641723632812, "global_step": 565954, "epoch": 6818} {"train_loss": -28.031585693359375, "global_step": 565955, "epoch": 6818} {"train_loss": -27.811981201171875, "global_step": 565956, "epoch": 6818} {"train_loss": -28.450824737548828, "global_step": 565957, "epoch": 6818} {"train_loss": -28.096277236938477, "global_step": 565958, "epoch": 6818} {"train_loss": -27.9365177154541, "global_step": 565959, "epoch": 6818} {"train_loss": -28.009479522705078, "global_step": 565960, "epoch": 6818} {"train_loss": -27.84468650817871, "global_step": 565961, "epoch": 6818} {"train_loss": -28.084381103515625, "global_step": 565962, "epoch": 6818} {"train_loss": -27.92622184753418, "global_step": 565963, "epoch": 6818} {"train_loss": -27.899503707885742, "global_step": 565964, "epoch": 6818} {"train_loss": -28.437118530273438, "global_step": 565965, "epoch": 6818} {"train_loss": -27.840784072875977, "global_step": 565966, "epoch": 6818} {"train_loss": -28.13848304748535, "global_step": 565967, "epoch": 6818} {"train_loss": -28.24277687072754, "global_step": 565968, "epoch": 6818} {"train_loss": -27.940885543823242, "global_step": 565969, "epoch": 6818} {"train_loss": -27.82111930847168, "global_step": 565970, "epoch": 6818} {"train_loss": -28.18023109436035, "global_step": 565971, "epoch": 6818} {"train_loss": -28.098485946655273, "global_step": 565972, "epoch": 6818} {"train_loss": -27.97315788269043, "global_step": 565973, "epoch": 6818} {"train_loss": -27.755918502807617, "global_step": 565974, "epoch": 6818} {"train_loss": -27.836713790893555, "global_step": 565975, "epoch": 6818} {"train_loss": -27.768551217504296, "global_step": 565976, "epoch": 6818, "val_loss": 6755449.0} {"train_loss": -26.769697189331055, "global_step": 565977, "epoch": 6819} {"train_loss": -27.40467643737793, "global_step": 565978, "epoch": 6819} {"train_loss": -26.89883804321289, "global_step": 565979, "epoch": 6819} {"train_loss": -27.263172149658203, "global_step": 565980, "epoch": 6819} {"train_loss": -26.88520622253418, "global_step": 565981, "epoch": 6819} {"train_loss": -26.670820236206055, "global_step": 565982, "epoch": 6819} {"train_loss": -27.367023468017578, "global_step": 565983, "epoch": 6819} {"train_loss": -27.4183292388916, "global_step": 565984, "epoch": 6819} {"train_loss": -27.256433486938477, "global_step": 565985, "epoch": 6819} {"train_loss": -26.481985092163086, "global_step": 565986, "epoch": 6819} {"train_loss": -27.165985107421875, "global_step": 565987, "epoch": 6819} {"train_loss": -27.57783317565918, "global_step": 565988, "epoch": 6819} {"train_loss": -27.081079483032227, "global_step": 565989, "epoch": 6819} {"train_loss": -26.655115127563477, "global_step": 565990, "epoch": 6819} {"train_loss": -27.001968383789062, "global_step": 565991, "epoch": 6819} {"train_loss": -27.209012985229492, "global_step": 565992, "epoch": 6819} {"train_loss": -27.143400192260742, "global_step": 565993, "epoch": 6819} {"train_loss": -27.43584632873535, "global_step": 565994, "epoch": 6819} {"train_loss": -27.834827423095703, "global_step": 565995, "epoch": 6819} {"train_loss": -27.68487548828125, "global_step": 565996, "epoch": 6819} {"train_loss": -27.459897994995117, "global_step": 565997, "epoch": 6819} {"train_loss": -27.567895889282227, "global_step": 565998, "epoch": 6819} {"train_loss": -27.659833908081055, "global_step": 565999, "epoch": 6819} {"train_loss": -27.45196533203125, "global_step": 566000, "epoch": 6819} {"train_loss": -27.532316207885742, "global_step": 566001, "epoch": 6819} {"train_loss": -27.318897247314453, "global_step": 566002, "epoch": 6819} {"train_loss": -27.467527389526367, "global_step": 566003, "epoch": 6819} {"train_loss": -27.85162353515625, "global_step": 566004, "epoch": 6819} {"train_loss": -27.672626495361328, "global_step": 566005, "epoch": 6819} {"train_loss": -27.69317054748535, "global_step": 566006, "epoch": 6819} {"train_loss": -27.3695011138916, "global_step": 566007, "epoch": 6819} {"train_loss": -27.79829216003418, "global_step": 566008, "epoch": 6819} {"train_loss": -27.586624145507812, "global_step": 566009, "epoch": 6819} {"train_loss": -27.50629997253418, "global_step": 566010, "epoch": 6819} {"train_loss": -27.83037757873535, "global_step": 566011, "epoch": 6819} {"train_loss": -27.877050399780273, "global_step": 566012, "epoch": 6819} {"train_loss": -27.877424240112305, "global_step": 566013, "epoch": 6819} {"train_loss": -27.7823543548584, "global_step": 566014, "epoch": 6819} {"train_loss": -27.68293571472168, "global_step": 566015, "epoch": 6819} {"train_loss": -27.79816246032715, "global_step": 566016, "epoch": 6819} {"train_loss": -28.105966567993164, "global_step": 566017, "epoch": 6819} {"train_loss": -27.923452377319336, "global_step": 566018, "epoch": 6819} {"train_loss": -28.016910552978516, "global_step": 566019, "epoch": 6819} {"train_loss": -27.53485107421875, "global_step": 566020, "epoch": 6819} {"train_loss": -28.02223014831543, "global_step": 566021, "epoch": 6819} {"train_loss": -27.945388793945312, "global_step": 566022, "epoch": 6819} {"train_loss": -27.962003707885742, "global_step": 566023, "epoch": 6819} {"train_loss": -27.921100616455078, "global_step": 566024, "epoch": 6819} {"train_loss": -27.959915161132812, "global_step": 566025, "epoch": 6819} {"train_loss": -27.818988800048828, "global_step": 566026, "epoch": 6819} {"train_loss": -27.956317901611328, "global_step": 566027, "epoch": 6819} {"train_loss": -27.98371696472168, "global_step": 566028, "epoch": 6819} {"train_loss": -27.95550537109375, "global_step": 566029, "epoch": 6819} {"train_loss": -27.956384658813477, "global_step": 566030, "epoch": 6819} {"train_loss": -28.042821884155273, "global_step": 566031, "epoch": 6819} {"train_loss": -27.996992111206055, "global_step": 566032, "epoch": 6819} {"train_loss": -28.318775177001953, "global_step": 566033, "epoch": 6819} {"train_loss": -27.91419792175293, "global_step": 566034, "epoch": 6819} {"train_loss": -27.883930206298828, "global_step": 566035, "epoch": 6819} {"train_loss": -28.12579917907715, "global_step": 566036, "epoch": 6819} {"train_loss": -27.97757339477539, "global_step": 566037, "epoch": 6819} {"train_loss": -27.807165145874023, "global_step": 566038, "epoch": 6819} {"train_loss": -28.18906021118164, "global_step": 566039, "epoch": 6819} {"train_loss": -27.959253311157227, "global_step": 566040, "epoch": 6819} {"train_loss": -27.811859130859375, "global_step": 566041, "epoch": 6819} {"train_loss": -28.354211807250977, "global_step": 566042, "epoch": 6819} {"train_loss": -27.922595977783203, "global_step": 566043, "epoch": 6819} {"train_loss": -27.782093048095703, "global_step": 566044, "epoch": 6819} {"train_loss": -28.144189834594727, "global_step": 566045, "epoch": 6819} {"train_loss": -27.827756881713867, "global_step": 566046, "epoch": 6819} {"train_loss": -27.74678611755371, "global_step": 566047, "epoch": 6819} {"train_loss": -27.610828399658203, "global_step": 566048, "epoch": 6819} {"train_loss": -27.104406356811523, "global_step": 566049, "epoch": 6819} {"train_loss": -26.692371368408203, "global_step": 566050, "epoch": 6819} {"train_loss": -26.661630630493164, "global_step": 566051, "epoch": 6819} {"train_loss": -27.695892333984375, "global_step": 566052, "epoch": 6819} {"train_loss": -27.402067184448242, "global_step": 566053, "epoch": 6819} {"train_loss": -27.600555419921875, "global_step": 566054, "epoch": 6819} {"train_loss": -27.786380767822266, "global_step": 566055, "epoch": 6819} {"train_loss": -27.881391525268555, "global_step": 566056, "epoch": 6819} {"train_loss": -27.761951446533203, "global_step": 566057, "epoch": 6819} {"train_loss": -27.771514892578125, "global_step": 566058, "epoch": 6819} {"train_loss": -27.632052593920605, "global_step": 566059, "epoch": 6819, "val_loss": 6727838.0} {"train_loss": -27.11140251159668, "global_step": 566060, "epoch": 6820} {"train_loss": -25.883466720581055, "global_step": 566061, "epoch": 6820} {"train_loss": -25.52379035949707, "global_step": 566062, "epoch": 6820} {"train_loss": -26.233795166015625, "global_step": 566063, "epoch": 6820} {"train_loss": -27.137958526611328, "global_step": 566064, "epoch": 6820} {"train_loss": -26.325469970703125, "global_step": 566065, "epoch": 6820} {"train_loss": -27.524484634399414, "global_step": 566066, "epoch": 6820} {"train_loss": -26.4927921295166, "global_step": 566067, "epoch": 6820} {"train_loss": -27.08064079284668, "global_step": 566068, "epoch": 6820} {"train_loss": -26.616764068603516, "global_step": 566069, "epoch": 6820} {"train_loss": -27.455387115478516, "global_step": 566070, "epoch": 6820} {"train_loss": -27.137969970703125, "global_step": 566071, "epoch": 6820} {"train_loss": -27.36624526977539, "global_step": 566072, "epoch": 6820} {"train_loss": -27.621381759643555, "global_step": 566073, "epoch": 6820} {"train_loss": -27.377552032470703, "global_step": 566074, "epoch": 6820} {"train_loss": -27.36474609375, "global_step": 566075, "epoch": 6820} {"train_loss": -27.454910278320312, "global_step": 566076, "epoch": 6820} {"train_loss": -27.200815200805664, "global_step": 566077, "epoch": 6820} {"train_loss": -27.618772506713867, "global_step": 566078, "epoch": 6820} {"train_loss": -27.613483428955078, "global_step": 566079, "epoch": 6820} {"train_loss": -27.68372917175293, "global_step": 566080, "epoch": 6820} {"train_loss": -27.43277359008789, "global_step": 566081, "epoch": 6820} {"train_loss": -27.734960556030273, "global_step": 566082, "epoch": 6820} {"train_loss": -27.927255630493164, "global_step": 566083, "epoch": 6820} {"train_loss": -27.468002319335938, "global_step": 566084, "epoch": 6820} {"train_loss": -27.78126335144043, "global_step": 566085, "epoch": 6820} {"train_loss": -27.889698028564453, "global_step": 566086, "epoch": 6820} {"train_loss": -27.5758113861084, "global_step": 566087, "epoch": 6820} {"train_loss": -27.912595748901367, "global_step": 566088, "epoch": 6820} {"train_loss": -27.81315040588379, "global_step": 566089, "epoch": 6820} {"train_loss": -27.8044376373291, "global_step": 566090, "epoch": 6820} {"train_loss": -27.93133544921875, "global_step": 566091, "epoch": 6820} {"train_loss": -27.730091094970703, "global_step": 566092, "epoch": 6820} {"train_loss": -27.589696884155273, "global_step": 566093, "epoch": 6820} {"train_loss": -27.966604232788086, "global_step": 566094, "epoch": 6820} {"train_loss": -27.738000869750977, "global_step": 566095, "epoch": 6820} {"train_loss": -27.67970085144043, "global_step": 566096, "epoch": 6820} {"train_loss": -27.822742462158203, "global_step": 566097, "epoch": 6820} {"train_loss": -27.9833984375, "global_step": 566098, "epoch": 6820} {"train_loss": -27.860891342163086, "global_step": 566099, "epoch": 6820} {"train_loss": -28.044981002807617, "global_step": 566100, "epoch": 6820} {"train_loss": -27.72820472717285, "global_step": 566101, "epoch": 6820} {"train_loss": -27.923200607299805, "global_step": 566102, "epoch": 6820} {"train_loss": -27.83475112915039, "global_step": 566103, "epoch": 6820} {"train_loss": -27.83567237854004, "global_step": 566104, "epoch": 6820} {"train_loss": -28.123212814331055, "global_step": 566105, "epoch": 6820} {"train_loss": -27.986225128173828, "global_step": 566106, "epoch": 6820} {"train_loss": -27.798131942749023, "global_step": 566107, "epoch": 6820} {"train_loss": -27.8300838470459, "global_step": 566108, "epoch": 6820} {"train_loss": -27.82682228088379, "global_step": 566109, "epoch": 6820} {"train_loss": -28.088403701782227, "global_step": 566110, "epoch": 6820} {"train_loss": -27.914541244506836, "global_step": 566111, "epoch": 6820} {"train_loss": -28.132923126220703, "global_step": 566112, "epoch": 6820} {"train_loss": -27.99763298034668, "global_step": 566113, "epoch": 6820} {"train_loss": -28.232025146484375, "global_step": 566114, "epoch": 6820} {"train_loss": -28.004873275756836, "global_step": 566115, "epoch": 6820} {"train_loss": -27.606271743774414, "global_step": 566116, "epoch": 6820} {"train_loss": -28.016712188720703, "global_step": 566117, "epoch": 6820} {"train_loss": -27.795440673828125, "global_step": 566118, "epoch": 6820} {"train_loss": -28.05645179748535, "global_step": 566119, "epoch": 6820} {"train_loss": -27.9942684173584, "global_step": 566120, "epoch": 6820} {"train_loss": -27.938037872314453, "global_step": 566121, "epoch": 6820} {"train_loss": -27.9669189453125, "global_step": 566122, "epoch": 6820} {"train_loss": -27.845138549804688, "global_step": 566123, "epoch": 6820} {"train_loss": -28.01324462890625, "global_step": 566124, "epoch": 6820} {"train_loss": -27.7739315032959, "global_step": 566125, "epoch": 6820} {"train_loss": -28.0401668548584, "global_step": 566126, "epoch": 6820} {"train_loss": -27.40437126159668, "global_step": 566127, "epoch": 6820} {"train_loss": -27.995880126953125, "global_step": 566128, "epoch": 6820} {"train_loss": -28.115461349487305, "global_step": 566129, "epoch": 6820} {"train_loss": -28.26523780822754, "global_step": 566130, "epoch": 6820} {"train_loss": -27.39322280883789, "global_step": 566131, "epoch": 6820} {"train_loss": -27.334836959838867, "global_step": 566132, "epoch": 6820} {"train_loss": -27.673547744750977, "global_step": 566133, "epoch": 6820} {"train_loss": -27.771757125854492, "global_step": 566134, "epoch": 6820} {"train_loss": -27.938873291015625, "global_step": 566135, "epoch": 6820} {"train_loss": -27.495080947875977, "global_step": 566136, "epoch": 6820} {"train_loss": -27.79975700378418, "global_step": 566137, "epoch": 6820} {"train_loss": -27.608158111572266, "global_step": 566138, "epoch": 6820} {"train_loss": -27.763458251953125, "global_step": 566139, "epoch": 6820} {"train_loss": -27.596439361572266, "global_step": 566140, "epoch": 6820} {"train_loss": -27.904239654541016, "global_step": 566141, "epoch": 6820} {"train_loss": -27.642803789621375, "global_step": 566142, "epoch": 6820, "val_loss": 6740854.0} {"train_loss": -26.310468673706055, "global_step": 566143, "epoch": 6821} {"train_loss": -26.09694480895996, "global_step": 566144, "epoch": 6821} {"train_loss": -25.336917877197266, "global_step": 566145, "epoch": 6821} {"train_loss": -26.468454360961914, "global_step": 566146, "epoch": 6821} {"train_loss": -26.91843605041504, "global_step": 566147, "epoch": 6821} {"train_loss": -26.049680709838867, "global_step": 566148, "epoch": 6821} {"train_loss": -27.138837814331055, "global_step": 566149, "epoch": 6821} {"train_loss": -27.168848037719727, "global_step": 566150, "epoch": 6821} {"train_loss": -26.360036849975586, "global_step": 566151, "epoch": 6821} {"train_loss": -27.100492477416992, "global_step": 566152, "epoch": 6821} {"train_loss": -26.821517944335938, "global_step": 566153, "epoch": 6821} {"train_loss": -27.01593589782715, "global_step": 566154, "epoch": 6821} {"train_loss": -26.900876998901367, "global_step": 566155, "epoch": 6821} {"train_loss": -27.11971092224121, "global_step": 566156, "epoch": 6821} {"train_loss": -26.822946548461914, "global_step": 566157, "epoch": 6821} {"train_loss": -27.3891658782959, "global_step": 566158, "epoch": 6821} {"train_loss": -27.14288902282715, "global_step": 566159, "epoch": 6821} {"train_loss": -26.93364906311035, "global_step": 566160, "epoch": 6821} {"train_loss": -26.66409683227539, "global_step": 566161, "epoch": 6821} {"train_loss": -27.6411190032959, "global_step": 566162, "epoch": 6821} {"train_loss": -27.021453857421875, "global_step": 566163, "epoch": 6821} {"train_loss": -27.454626083374023, "global_step": 566164, "epoch": 6821} {"train_loss": -27.207935333251953, "global_step": 566165, "epoch": 6821} {"train_loss": -27.349609375, "global_step": 566166, "epoch": 6821} {"train_loss": -27.599599838256836, "global_step": 566167, "epoch": 6821} {"train_loss": -27.143274307250977, "global_step": 566168, "epoch": 6821} {"train_loss": -27.475183486938477, "global_step": 566169, "epoch": 6821} {"train_loss": -27.66925621032715, "global_step": 566170, "epoch": 6821} {"train_loss": -27.4282283782959, "global_step": 566171, "epoch": 6821} {"train_loss": -27.680891036987305, "global_step": 566172, "epoch": 6821} {"train_loss": -27.499378204345703, "global_step": 566173, "epoch": 6821} {"train_loss": -27.85107421875, "global_step": 566174, "epoch": 6821} {"train_loss": -27.600601196289062, "global_step": 566175, "epoch": 6821} {"train_loss": -27.60126304626465, "global_step": 566176, "epoch": 6821} {"train_loss": -27.60334587097168, "global_step": 566177, "epoch": 6821} {"train_loss": -27.9034366607666, "global_step": 566178, "epoch": 6821} {"train_loss": -27.61029052734375, "global_step": 566179, "epoch": 6821} {"train_loss": -27.6905460357666, "global_step": 566180, "epoch": 6821} {"train_loss": -27.688385009765625, "global_step": 566181, "epoch": 6821} {"train_loss": -27.66708755493164, "global_step": 566182, "epoch": 6821} {"train_loss": -27.84877586364746, "global_step": 566183, "epoch": 6821} {"train_loss": -28.0441951751709, "global_step": 566184, "epoch": 6821} {"train_loss": -27.819965362548828, "global_step": 566185, "epoch": 6821} {"train_loss": -27.719629287719727, "global_step": 566186, "epoch": 6821} {"train_loss": -28.174436569213867, "global_step": 566187, "epoch": 6821} {"train_loss": -27.504209518432617, "global_step": 566188, "epoch": 6821} {"train_loss": -27.7460994720459, "global_step": 566189, "epoch": 6821} {"train_loss": -28.00383949279785, "global_step": 566190, "epoch": 6821} {"train_loss": -27.781347274780273, "global_step": 566191, "epoch": 6821} {"train_loss": -27.833276748657227, "global_step": 566192, "epoch": 6821} {"train_loss": -27.98040199279785, "global_step": 566193, "epoch": 6821} {"train_loss": -27.912830352783203, "global_step": 566194, "epoch": 6821} {"train_loss": -27.828399658203125, "global_step": 566195, "epoch": 6821} {"train_loss": -27.6939697265625, "global_step": 566196, "epoch": 6821} {"train_loss": -28.19730567932129, "global_step": 566197, "epoch": 6821} {"train_loss": -28.01450538635254, "global_step": 566198, "epoch": 6821} {"train_loss": -28.033788681030273, "global_step": 566199, "epoch": 6821} {"train_loss": -28.196292877197266, "global_step": 566200, "epoch": 6821} {"train_loss": -28.068761825561523, "global_step": 566201, "epoch": 6821} {"train_loss": -27.87807273864746, "global_step": 566202, "epoch": 6821} {"train_loss": -28.372167587280273, "global_step": 566203, "epoch": 6821} {"train_loss": -27.6881103515625, "global_step": 566204, "epoch": 6821} {"train_loss": -27.98646354675293, "global_step": 566205, "epoch": 6821} {"train_loss": -27.835163116455078, "global_step": 566206, "epoch": 6821} {"train_loss": -28.09103775024414, "global_step": 566207, "epoch": 6821} {"train_loss": -28.3111629486084, "global_step": 566208, "epoch": 6821} {"train_loss": -27.790119171142578, "global_step": 566209, "epoch": 6821} {"train_loss": -28.039228439331055, "global_step": 566210, "epoch": 6821} {"train_loss": -28.032331466674805, "global_step": 566211, "epoch": 6821} {"train_loss": -27.841995239257812, "global_step": 566212, "epoch": 6821} {"train_loss": -28.056732177734375, "global_step": 566213, "epoch": 6821} {"train_loss": -27.831226348876953, "global_step": 566214, "epoch": 6821} {"train_loss": -27.673070907592773, "global_step": 566215, "epoch": 6821} {"train_loss": -28.214588165283203, "global_step": 566216, "epoch": 6821} {"train_loss": -28.099990844726562, "global_step": 566217, "epoch": 6821} {"train_loss": -28.019256591796875, "global_step": 566218, "epoch": 6821} {"train_loss": -27.7653865814209, "global_step": 566219, "epoch": 6821} {"train_loss": -27.87284278869629, "global_step": 566220, "epoch": 6821} {"train_loss": -27.7978515625, "global_step": 566221, "epoch": 6821} {"train_loss": -27.736133575439453, "global_step": 566222, "epoch": 6821} {"train_loss": -27.6920223236084, "global_step": 566223, "epoch": 6821} {"train_loss": -27.45100212097168, "global_step": 566224, "epoch": 6821} {"train_loss": -27.556289098348962, "global_step": 566225, "epoch": 6821, "val_loss": 6588141.5} {"train_loss": -26.439346313476562, "global_step": 566226, "epoch": 6822} {"train_loss": -23.474355697631836, "global_step": 566227, "epoch": 6822} {"train_loss": -25.7731990814209, "global_step": 566228, "epoch": 6822} {"train_loss": -26.013986587524414, "global_step": 566229, "epoch": 6822} {"train_loss": -26.379154205322266, "global_step": 566230, "epoch": 6822} {"train_loss": -25.762327194213867, "global_step": 566231, "epoch": 6822} {"train_loss": -26.4008846282959, "global_step": 566232, "epoch": 6822} {"train_loss": -26.18660545349121, "global_step": 566233, "epoch": 6822} {"train_loss": -26.799291610717773, "global_step": 566234, "epoch": 6822} {"train_loss": -26.63042640686035, "global_step": 566235, "epoch": 6822} {"train_loss": -26.37847900390625, "global_step": 566236, "epoch": 6822} {"train_loss": -26.96268653869629, "global_step": 566237, "epoch": 6822} {"train_loss": -26.574447631835938, "global_step": 566238, "epoch": 6822} {"train_loss": -26.73358154296875, "global_step": 566239, "epoch": 6822} {"train_loss": -27.001483917236328, "global_step": 566240, "epoch": 6822} {"train_loss": -27.05256462097168, "global_step": 566241, "epoch": 6822} {"train_loss": -27.004682540893555, "global_step": 566242, "epoch": 6822} {"train_loss": -27.36700439453125, "global_step": 566243, "epoch": 6822} {"train_loss": -27.044443130493164, "global_step": 566244, "epoch": 6822} {"train_loss": -26.92138671875, "global_step": 566245, "epoch": 6822} {"train_loss": -27.051050186157227, "global_step": 566246, "epoch": 6822} {"train_loss": -27.301904678344727, "global_step": 566247, "epoch": 6822} {"train_loss": -27.28352165222168, "global_step": 566248, "epoch": 6822} {"train_loss": -27.193723678588867, "global_step": 566249, "epoch": 6822} {"train_loss": -27.452377319335938, "global_step": 566250, "epoch": 6822} {"train_loss": -27.58688735961914, "global_step": 566251, "epoch": 6822} {"train_loss": -27.40191650390625, "global_step": 566252, "epoch": 6822} {"train_loss": -27.3171443939209, "global_step": 566253, "epoch": 6822} {"train_loss": -27.467260360717773, "global_step": 566254, "epoch": 6822} {"train_loss": -27.470947265625, "global_step": 566255, "epoch": 6822} {"train_loss": -27.631885528564453, "global_step": 566256, "epoch": 6822} {"train_loss": -27.479780197143555, "global_step": 566257, "epoch": 6822} {"train_loss": -27.341638565063477, "global_step": 566258, "epoch": 6822} {"train_loss": -27.594518661499023, "global_step": 566259, "epoch": 6822} {"train_loss": -27.431344985961914, "global_step": 566260, "epoch": 6822} {"train_loss": -27.61738395690918, "global_step": 566261, "epoch": 6822} {"train_loss": -27.873016357421875, "global_step": 566262, "epoch": 6822} {"train_loss": -27.88331413269043, "global_step": 566263, "epoch": 6822} {"train_loss": -27.969846725463867, "global_step": 566264, "epoch": 6822} {"train_loss": -27.689849853515625, "global_step": 566265, "epoch": 6822} {"train_loss": -27.708541870117188, "global_step": 566266, "epoch": 6822} {"train_loss": -27.817249298095703, "global_step": 566267, "epoch": 6822} {"train_loss": -27.99458122253418, "global_step": 566268, "epoch": 6822} {"train_loss": -27.821186065673828, "global_step": 566269, "epoch": 6822} {"train_loss": -27.81903648376465, "global_step": 566270, "epoch": 6822} {"train_loss": -27.698196411132812, "global_step": 566271, "epoch": 6822} {"train_loss": -27.93987464904785, "global_step": 566272, "epoch": 6822} {"train_loss": -27.942296981811523, "global_step": 566273, "epoch": 6822} {"train_loss": -28.070465087890625, "global_step": 566274, "epoch": 6822} {"train_loss": -27.824949264526367, "global_step": 566275, "epoch": 6822} {"train_loss": -27.9444637298584, "global_step": 566276, "epoch": 6822} {"train_loss": -27.99505043029785, "global_step": 566277, "epoch": 6822} {"train_loss": -28.320037841796875, "global_step": 566278, "epoch": 6822} {"train_loss": -28.10377311706543, "global_step": 566279, "epoch": 6822} {"train_loss": -28.0643310546875, "global_step": 566280, "epoch": 6822} {"train_loss": -27.910566329956055, "global_step": 566281, "epoch": 6822} {"train_loss": -28.05193519592285, "global_step": 566282, "epoch": 6822} {"train_loss": -28.014007568359375, "global_step": 566283, "epoch": 6822} {"train_loss": -28.317214965820312, "global_step": 566284, "epoch": 6822} {"train_loss": -28.17250633239746, "global_step": 566285, "epoch": 6822} {"train_loss": -27.74028968811035, "global_step": 566286, "epoch": 6822} {"train_loss": -27.96445083618164, "global_step": 566287, "epoch": 6822} {"train_loss": -28.275745391845703, "global_step": 566288, "epoch": 6822} {"train_loss": -28.04813575744629, "global_step": 566289, "epoch": 6822} {"train_loss": -27.99836540222168, "global_step": 566290, "epoch": 6822} {"train_loss": -28.290420532226562, "global_step": 566291, "epoch": 6822} {"train_loss": -28.15007972717285, "global_step": 566292, "epoch": 6822} {"train_loss": -28.104597091674805, "global_step": 566293, "epoch": 6822} {"train_loss": -27.99679946899414, "global_step": 566294, "epoch": 6822} {"train_loss": -28.0113525390625, "global_step": 566295, "epoch": 6822} {"train_loss": -27.871826171875, "global_step": 566296, "epoch": 6822} {"train_loss": -27.918659210205078, "global_step": 566297, "epoch": 6822} {"train_loss": -28.276947021484375, "global_step": 566298, "epoch": 6822} {"train_loss": -27.792631149291992, "global_step": 566299, "epoch": 6822} {"train_loss": -27.544946670532227, "global_step": 566300, "epoch": 6822} {"train_loss": -27.961267471313477, "global_step": 566301, "epoch": 6822} {"train_loss": -27.873703002929688, "global_step": 566302, "epoch": 6822} {"train_loss": -27.881113052368164, "global_step": 566303, "epoch": 6822} {"train_loss": -28.15338134765625, "global_step": 566304, "epoch": 6822} {"train_loss": -27.95282554626465, "global_step": 566305, "epoch": 6822} {"train_loss": -27.737409591674805, "global_step": 566306, "epoch": 6822} {"train_loss": -27.518701553344727, "global_step": 566307, "epoch": 6822} {"train_loss": -27.484995899430242, "global_step": 566308, "epoch": 6822, "val_loss": 6591264.0} {"train_loss": -26.55511474609375, "global_step": 566309, "epoch": 6823} {"train_loss": -25.753705978393555, "global_step": 566310, "epoch": 6823} {"train_loss": -26.064960479736328, "global_step": 566311, "epoch": 6823} {"train_loss": -26.342981338500977, "global_step": 566312, "epoch": 6823} {"train_loss": -25.860563278198242, "global_step": 566313, "epoch": 6823} {"train_loss": -26.55987548828125, "global_step": 566314, "epoch": 6823} {"train_loss": -25.509809494018555, "global_step": 566315, "epoch": 6823} {"train_loss": -26.137786865234375, "global_step": 566316, "epoch": 6823} {"train_loss": -26.353137969970703, "global_step": 566317, "epoch": 6823} {"train_loss": -26.500904083251953, "global_step": 566318, "epoch": 6823} {"train_loss": -26.964853286743164, "global_step": 566319, "epoch": 6823} {"train_loss": -26.59490966796875, "global_step": 566320, "epoch": 6823} {"train_loss": -27.186969757080078, "global_step": 566321, "epoch": 6823} {"train_loss": -26.86848258972168, "global_step": 566322, "epoch": 6823} {"train_loss": -26.4876708984375, "global_step": 566323, "epoch": 6823} {"train_loss": -26.608245849609375, "global_step": 566324, "epoch": 6823} {"train_loss": -26.985443115234375, "global_step": 566325, "epoch": 6823} {"train_loss": -27.130624771118164, "global_step": 566326, "epoch": 6823} {"train_loss": -27.27691650390625, "global_step": 566327, "epoch": 6823} {"train_loss": -27.126239776611328, "global_step": 566328, "epoch": 6823} {"train_loss": -27.426176071166992, "global_step": 566329, "epoch": 6823} {"train_loss": -27.0244083404541, "global_step": 566330, "epoch": 6823} {"train_loss": -27.543912887573242, "global_step": 566331, "epoch": 6823} {"train_loss": -27.593515396118164, "global_step": 566332, "epoch": 6823} {"train_loss": -27.4537410736084, "global_step": 566333, "epoch": 6823} {"train_loss": -27.406147003173828, "global_step": 566334, "epoch": 6823} {"train_loss": -27.885868072509766, "global_step": 566335, "epoch": 6823} {"train_loss": -27.552515029907227, "global_step": 566336, "epoch": 6823} {"train_loss": -27.3868350982666, "global_step": 566337, "epoch": 6823} {"train_loss": -27.287403106689453, "global_step": 566338, "epoch": 6823} {"train_loss": -27.751678466796875, "global_step": 566339, "epoch": 6823} {"train_loss": -27.5233097076416, "global_step": 566340, "epoch": 6823} {"train_loss": -27.448104858398438, "global_step": 566341, "epoch": 6823} {"train_loss": -27.512744903564453, "global_step": 566342, "epoch": 6823} {"train_loss": -28.003549575805664, "global_step": 566343, "epoch": 6823} {"train_loss": -27.641157150268555, "global_step": 566344, "epoch": 6823} {"train_loss": -27.43507194519043, "global_step": 566345, "epoch": 6823} {"train_loss": -27.50239372253418, "global_step": 566346, "epoch": 6823} {"train_loss": -27.854883193969727, "global_step": 566347, "epoch": 6823} {"train_loss": -27.712064743041992, "global_step": 566348, "epoch": 6823} {"train_loss": -28.125574111938477, "global_step": 566349, "epoch": 6823} {"train_loss": -27.738086700439453, "global_step": 566350, "epoch": 6823} {"train_loss": -27.535022735595703, "global_step": 566351, "epoch": 6823} {"train_loss": -28.198713302612305, "global_step": 566352, "epoch": 6823} {"train_loss": -28.16348648071289, "global_step": 566353, "epoch": 6823} {"train_loss": -28.039081573486328, "global_step": 566354, "epoch": 6823} {"train_loss": -27.70216178894043, "global_step": 566355, "epoch": 6823} {"train_loss": -28.304502487182617, "global_step": 566356, "epoch": 6823} {"train_loss": -28.02045249938965, "global_step": 566357, "epoch": 6823} {"train_loss": -28.035802841186523, "global_step": 566358, "epoch": 6823} {"train_loss": -27.87338638305664, "global_step": 566359, "epoch": 6823} {"train_loss": -27.974872589111328, "global_step": 566360, "epoch": 6823} {"train_loss": -28.368024826049805, "global_step": 566361, "epoch": 6823} {"train_loss": -27.676557540893555, "global_step": 566362, "epoch": 6823} {"train_loss": -27.75518226623535, "global_step": 566363, "epoch": 6823} {"train_loss": -27.790802001953125, "global_step": 566364, "epoch": 6823} {"train_loss": -28.32171630859375, "global_step": 566365, "epoch": 6823} {"train_loss": -27.961950302124023, "global_step": 566366, "epoch": 6823} {"train_loss": -27.88435173034668, "global_step": 566367, "epoch": 6823} {"train_loss": -27.846952438354492, "global_step": 566368, "epoch": 6823} {"train_loss": -28.355146408081055, "global_step": 566369, "epoch": 6823} {"train_loss": -28.159393310546875, "global_step": 566370, "epoch": 6823} {"train_loss": -27.968515396118164, "global_step": 566371, "epoch": 6823} {"train_loss": -27.848119735717773, "global_step": 566372, "epoch": 6823} {"train_loss": -27.941137313842773, "global_step": 566373, "epoch": 6823} {"train_loss": -27.62155532836914, "global_step": 566374, "epoch": 6823} {"train_loss": -27.881549835205078, "global_step": 566375, "epoch": 6823} {"train_loss": -28.130674362182617, "global_step": 566376, "epoch": 6823} {"train_loss": -27.94366455078125, "global_step": 566377, "epoch": 6823} {"train_loss": -27.841562271118164, "global_step": 566378, "epoch": 6823} {"train_loss": -27.82521629333496, "global_step": 566379, "epoch": 6823} {"train_loss": -27.751544952392578, "global_step": 566380, "epoch": 6823} {"train_loss": -27.9522762298584, "global_step": 566381, "epoch": 6823} {"train_loss": -28.032093048095703, "global_step": 566382, "epoch": 6823} {"train_loss": -27.982934951782227, "global_step": 566383, "epoch": 6823} {"train_loss": -28.088003158569336, "global_step": 566384, "epoch": 6823} {"train_loss": -27.782163619995117, "global_step": 566385, "epoch": 6823} {"train_loss": -27.745681762695312, "global_step": 566386, "epoch": 6823} {"train_loss": -27.721540451049805, "global_step": 566387, "epoch": 6823} {"train_loss": -27.859649658203125, "global_step": 566388, "epoch": 6823} {"train_loss": -28.183622360229492, "global_step": 566389, "epoch": 6823} {"train_loss": -28.150638580322266, "global_step": 566390, "epoch": 6823} {"train_loss": -27.52703937852239, "global_step": 566391, "epoch": 6823, "val_loss": 6637213.0} {"train_loss": -27.265674591064453, "global_step": 566392, "epoch": 6824} {"train_loss": -27.095630645751953, "global_step": 566393, "epoch": 6824} {"train_loss": -26.747060775756836, "global_step": 566394, "epoch": 6824} {"train_loss": -26.56403160095215, "global_step": 566395, "epoch": 6824} {"train_loss": -26.80218505859375, "global_step": 566396, "epoch": 6824} {"train_loss": -27.077611923217773, "global_step": 566397, "epoch": 6824} {"train_loss": -27.544361114501953, "global_step": 566398, "epoch": 6824} {"train_loss": -27.3426456451416, "global_step": 566399, "epoch": 6824} {"train_loss": -27.5833740234375, "global_step": 566400, "epoch": 6824} {"train_loss": -27.6204833984375, "global_step": 566401, "epoch": 6824} {"train_loss": -27.249731063842773, "global_step": 566402, "epoch": 6824} {"train_loss": -27.20647621154785, "global_step": 566403, "epoch": 6824} {"train_loss": -27.34404945373535, "global_step": 566404, "epoch": 6824} {"train_loss": -27.326171875, "global_step": 566405, "epoch": 6824} {"train_loss": -27.6275634765625, "global_step": 566406, "epoch": 6824} {"train_loss": -27.870664596557617, "global_step": 566407, "epoch": 6824} {"train_loss": -27.7423095703125, "global_step": 566408, "epoch": 6824} {"train_loss": -27.701704025268555, "global_step": 566409, "epoch": 6824} {"train_loss": -27.54786491394043, "global_step": 566410, "epoch": 6824} {"train_loss": -27.81307029724121, "global_step": 566411, "epoch": 6824} {"train_loss": -27.57636070251465, "global_step": 566412, "epoch": 6824} {"train_loss": -27.443323135375977, "global_step": 566413, "epoch": 6824} {"train_loss": -27.494394302368164, "global_step": 566414, "epoch": 6824} {"train_loss": -27.616668701171875, "global_step": 566415, "epoch": 6824} {"train_loss": -27.2615909576416, "global_step": 566416, "epoch": 6824} {"train_loss": -27.815643310546875, "global_step": 566417, "epoch": 6824} {"train_loss": -27.719266891479492, "global_step": 566418, "epoch": 6824} {"train_loss": -27.66228675842285, "global_step": 566419, "epoch": 6824} {"train_loss": -27.76858901977539, "global_step": 566420, "epoch": 6824} {"train_loss": -27.579025268554688, "global_step": 566421, "epoch": 6824} {"train_loss": -27.805505752563477, "global_step": 566422, "epoch": 6824} {"train_loss": -27.378095626831055, "global_step": 566423, "epoch": 6824} {"train_loss": -27.8149471282959, "global_step": 566424, "epoch": 6824} {"train_loss": -28.295434951782227, "global_step": 566425, "epoch": 6824} {"train_loss": -28.1505184173584, "global_step": 566426, "epoch": 6824} {"train_loss": -27.703479766845703, "global_step": 566427, "epoch": 6824} {"train_loss": -27.666091918945312, "global_step": 566428, "epoch": 6824} {"train_loss": -27.611907958984375, "global_step": 566429, "epoch": 6824} {"train_loss": -27.868127822875977, "global_step": 566430, "epoch": 6824} {"train_loss": -27.912246704101562, "global_step": 566431, "epoch": 6824} {"train_loss": -28.228971481323242, "global_step": 566432, "epoch": 6824} {"train_loss": -27.6042423248291, "global_step": 566433, "epoch": 6824} {"train_loss": -27.655073165893555, "global_step": 566434, "epoch": 6824} {"train_loss": -27.9390869140625, "global_step": 566435, "epoch": 6824} {"train_loss": -28.14801597595215, "global_step": 566436, "epoch": 6824} {"train_loss": -27.964460372924805, "global_step": 566437, "epoch": 6824} {"train_loss": -27.643720626831055, "global_step": 566438, "epoch": 6824} {"train_loss": -27.7574405670166, "global_step": 566439, "epoch": 6824} {"train_loss": -27.976728439331055, "global_step": 566440, "epoch": 6824} {"train_loss": -27.890729904174805, "global_step": 566441, "epoch": 6824} {"train_loss": -27.811676025390625, "global_step": 566442, "epoch": 6824} {"train_loss": -27.70001792907715, "global_step": 566443, "epoch": 6824} {"train_loss": -27.987548828125, "global_step": 566444, "epoch": 6824} {"train_loss": -27.386444091796875, "global_step": 566445, "epoch": 6824} {"train_loss": -27.96296501159668, "global_step": 566446, "epoch": 6824} {"train_loss": -27.7631778717041, "global_step": 566447, "epoch": 6824} {"train_loss": -27.950281143188477, "global_step": 566448, "epoch": 6824} {"train_loss": -27.551910400390625, "global_step": 566449, "epoch": 6824} {"train_loss": -28.174625396728516, "global_step": 566450, "epoch": 6824} {"train_loss": -28.13345718383789, "global_step": 566451, "epoch": 6824} {"train_loss": -28.072370529174805, "global_step": 566452, "epoch": 6824} {"train_loss": -28.14767837524414, "global_step": 566453, "epoch": 6824} {"train_loss": -27.482587814331055, "global_step": 566454, "epoch": 6824} {"train_loss": -27.99110221862793, "global_step": 566455, "epoch": 6824} {"train_loss": -27.896015167236328, "global_step": 566456, "epoch": 6824} {"train_loss": -28.179956436157227, "global_step": 566457, "epoch": 6824} {"train_loss": -28.222925186157227, "global_step": 566458, "epoch": 6824} {"train_loss": -27.827808380126953, "global_step": 566459, "epoch": 6824} {"train_loss": -28.2375431060791, "global_step": 566460, "epoch": 6824} {"train_loss": -28.00054359436035, "global_step": 566461, "epoch": 6824} {"train_loss": -27.676721572875977, "global_step": 566462, "epoch": 6824} {"train_loss": -27.856536865234375, "global_step": 566463, "epoch": 6824} {"train_loss": -27.70240592956543, "global_step": 566464, "epoch": 6824} {"train_loss": -28.158950805664062, "global_step": 566465, "epoch": 6824} {"train_loss": -27.78133201599121, "global_step": 566466, "epoch": 6824} {"train_loss": -27.852508544921875, "global_step": 566467, "epoch": 6824} {"train_loss": -27.91116714477539, "global_step": 566468, "epoch": 6824} {"train_loss": -27.79914665222168, "global_step": 566469, "epoch": 6824} {"train_loss": -28.00648307800293, "global_step": 566470, "epoch": 6824} {"train_loss": -27.918500900268555, "global_step": 566471, "epoch": 6824} {"train_loss": -28.093408584594727, "global_step": 566472, "epoch": 6824} {"train_loss": -28.04093360900879, "global_step": 566473, "epoch": 6824} {"train_loss": -27.73647547342691, "global_step": 566474, "epoch": 6824, "val_loss": 6592633.5} {"train_loss": -26.770126342773438, "global_step": 566475, "epoch": 6825} {"train_loss": -26.007238388061523, "global_step": 566476, "epoch": 6825} {"train_loss": -26.509424209594727, "global_step": 566477, "epoch": 6825} {"train_loss": -27.06867027282715, "global_step": 566478, "epoch": 6825} {"train_loss": -26.07364273071289, "global_step": 566479, "epoch": 6825} {"train_loss": -27.371753692626953, "global_step": 566480, "epoch": 6825} {"train_loss": -26.78382682800293, "global_step": 566481, "epoch": 6825} {"train_loss": -27.0899600982666, "global_step": 566482, "epoch": 6825} {"train_loss": -26.829248428344727, "global_step": 566483, "epoch": 6825} {"train_loss": -27.482711791992188, "global_step": 566484, "epoch": 6825} {"train_loss": -27.368810653686523, "global_step": 566485, "epoch": 6825} {"train_loss": -26.707706451416016, "global_step": 566486, "epoch": 6825} {"train_loss": -27.17302894592285, "global_step": 566487, "epoch": 6825} {"train_loss": -27.13535499572754, "global_step": 566488, "epoch": 6825} {"train_loss": -27.540939331054688, "global_step": 566489, "epoch": 6825} {"train_loss": -27.274587631225586, "global_step": 566490, "epoch": 6825} {"train_loss": -27.499011993408203, "global_step": 566491, "epoch": 6825} {"train_loss": -27.23703956604004, "global_step": 566492, "epoch": 6825} {"train_loss": -27.710193634033203, "global_step": 566493, "epoch": 6825} {"train_loss": -27.429275512695312, "global_step": 566494, "epoch": 6825} {"train_loss": -27.001800537109375, "global_step": 566495, "epoch": 6825} {"train_loss": -27.46728515625, "global_step": 566496, "epoch": 6825} {"train_loss": -27.23288345336914, "global_step": 566497, "epoch": 6825} {"train_loss": -27.542804718017578, "global_step": 566498, "epoch": 6825} {"train_loss": -27.71576499938965, "global_step": 566499, "epoch": 6825} {"train_loss": -27.400705337524414, "global_step": 566500, "epoch": 6825} {"train_loss": -27.75919532775879, "global_step": 566501, "epoch": 6825} {"train_loss": -27.326684951782227, "global_step": 566502, "epoch": 6825} {"train_loss": -27.674253463745117, "global_step": 566503, "epoch": 6825} {"train_loss": -27.28070068359375, "global_step": 566504, "epoch": 6825} {"train_loss": -27.60477066040039, "global_step": 566505, "epoch": 6825} {"train_loss": -27.59423828125, "global_step": 566506, "epoch": 6825} {"train_loss": -27.331506729125977, "global_step": 566507, "epoch": 6825} {"train_loss": -27.361068725585938, "global_step": 566508, "epoch": 6825} {"train_loss": -27.7325439453125, "global_step": 566509, "epoch": 6825} {"train_loss": -27.693918228149414, "global_step": 566510, "epoch": 6825} {"train_loss": -27.619842529296875, "global_step": 566511, "epoch": 6825} {"train_loss": -27.858154296875, "global_step": 566512, "epoch": 6825} {"train_loss": -27.8260555267334, "global_step": 566513, "epoch": 6825} {"train_loss": -27.94415855407715, "global_step": 566514, "epoch": 6825} {"train_loss": -27.653776168823242, "global_step": 566515, "epoch": 6825} {"train_loss": -28.157880783081055, "global_step": 566516, "epoch": 6825} {"train_loss": -27.84234619140625, "global_step": 566517, "epoch": 6825} {"train_loss": -28.150421142578125, "global_step": 566518, "epoch": 6825} {"train_loss": -28.00836181640625, "global_step": 566519, "epoch": 6825} {"train_loss": -27.744367599487305, "global_step": 566520, "epoch": 6825} {"train_loss": -27.930341720581055, "global_step": 566521, "epoch": 6825} {"train_loss": -28.05866813659668, "global_step": 566522, "epoch": 6825} {"train_loss": -28.110965728759766, "global_step": 566523, "epoch": 6825} {"train_loss": -28.123249053955078, "global_step": 566524, "epoch": 6825} {"train_loss": -28.023473739624023, "global_step": 566525, "epoch": 6825} {"train_loss": -28.027175903320312, "global_step": 566526, "epoch": 6825} {"train_loss": -27.85068130493164, "global_step": 566527, "epoch": 6825} {"train_loss": -28.118396759033203, "global_step": 566528, "epoch": 6825} {"train_loss": -28.227264404296875, "global_step": 566529, "epoch": 6825} {"train_loss": -28.276700973510742, "global_step": 566530, "epoch": 6825} {"train_loss": -27.88360023498535, "global_step": 566531, "epoch": 6825} {"train_loss": -27.838239669799805, "global_step": 566532, "epoch": 6825} {"train_loss": -27.897754669189453, "global_step": 566533, "epoch": 6825} {"train_loss": -27.865467071533203, "global_step": 566534, "epoch": 6825} {"train_loss": -27.807266235351562, "global_step": 566535, "epoch": 6825} {"train_loss": -27.791580200195312, "global_step": 566536, "epoch": 6825} {"train_loss": -27.621234893798828, "global_step": 566537, "epoch": 6825} {"train_loss": -28.21817970275879, "global_step": 566538, "epoch": 6825} {"train_loss": -27.56003761291504, "global_step": 566539, "epoch": 6825} {"train_loss": -27.741153717041016, "global_step": 566540, "epoch": 6825} {"train_loss": -27.990741729736328, "global_step": 566541, "epoch": 6825} {"train_loss": -27.961383819580078, "global_step": 566542, "epoch": 6825} {"train_loss": -27.729578018188477, "global_step": 566543, "epoch": 6825} {"train_loss": -27.620075225830078, "global_step": 566544, "epoch": 6825} {"train_loss": -27.352319717407227, "global_step": 566545, "epoch": 6825} {"train_loss": -27.793628692626953, "global_step": 566546, "epoch": 6825} {"train_loss": -27.62598991394043, "global_step": 566547, "epoch": 6825} {"train_loss": -27.704076766967773, "global_step": 566548, "epoch": 6825} {"train_loss": -27.487680435180664, "global_step": 566549, "epoch": 6825} {"train_loss": -27.17633628845215, "global_step": 566550, "epoch": 6825} {"train_loss": -27.6055850982666, "global_step": 566551, "epoch": 6825} {"train_loss": -27.648096084594727, "global_step": 566552, "epoch": 6825} {"train_loss": -27.505355834960938, "global_step": 566553, "epoch": 6825} {"train_loss": -27.394147872924805, "global_step": 566554, "epoch": 6825} {"train_loss": -27.534992218017578, "global_step": 566555, "epoch": 6825} {"train_loss": -27.727521896362305, "global_step": 566556, "epoch": 6825} {"train_loss": -27.57595772341073, "global_step": 566557, "epoch": 6825, "val_loss": 6607150.0} {"train_loss": -26.928302764892578, "global_step": 566558, "epoch": 6826} {"train_loss": -27.009418487548828, "global_step": 566559, "epoch": 6826} {"train_loss": -27.343124389648438, "global_step": 566560, "epoch": 6826} {"train_loss": -27.406274795532227, "global_step": 566561, "epoch": 6826} {"train_loss": -26.966344833374023, "global_step": 566562, "epoch": 6826} {"train_loss": -27.0333251953125, "global_step": 566563, "epoch": 6826} {"train_loss": -27.368255615234375, "global_step": 566564, "epoch": 6826} {"train_loss": -27.478185653686523, "global_step": 566565, "epoch": 6826} {"train_loss": -27.17156410217285, "global_step": 566566, "epoch": 6826} {"train_loss": -27.0644588470459, "global_step": 566567, "epoch": 6826} {"train_loss": -27.70588493347168, "global_step": 566568, "epoch": 6826} {"train_loss": -27.3143367767334, "global_step": 566569, "epoch": 6826} {"train_loss": -27.792373657226562, "global_step": 566570, "epoch": 6826} {"train_loss": -28.090856552124023, "global_step": 566571, "epoch": 6826} {"train_loss": -27.492706298828125, "global_step": 566572, "epoch": 6826} {"train_loss": -27.244470596313477, "global_step": 566573, "epoch": 6826} {"train_loss": -27.47007179260254, "global_step": 566574, "epoch": 6826} {"train_loss": -27.61322021484375, "global_step": 566575, "epoch": 6826} {"train_loss": -27.342376708984375, "global_step": 566576, "epoch": 6826} {"train_loss": -27.72882652282715, "global_step": 566577, "epoch": 6826} {"train_loss": -27.325641632080078, "global_step": 566578, "epoch": 6826} {"train_loss": -27.829517364501953, "global_step": 566579, "epoch": 6826} {"train_loss": -27.161975860595703, "global_step": 566580, "epoch": 6826} {"train_loss": -27.820419311523438, "global_step": 566581, "epoch": 6826} {"train_loss": -27.34006118774414, "global_step": 566582, "epoch": 6826} {"train_loss": -27.816564559936523, "global_step": 566583, "epoch": 6826} {"train_loss": -27.894245147705078, "global_step": 566584, "epoch": 6826} {"train_loss": -28.041563034057617, "global_step": 566585, "epoch": 6826} {"train_loss": -27.7227840423584, "global_step": 566586, "epoch": 6826} {"train_loss": -27.94548988342285, "global_step": 566587, "epoch": 6826} {"train_loss": -27.381973266601562, "global_step": 566588, "epoch": 6826} {"train_loss": -27.74712562561035, "global_step": 566589, "epoch": 6826} {"train_loss": -28.19354820251465, "global_step": 566590, "epoch": 6826} {"train_loss": -27.869779586791992, "global_step": 566591, "epoch": 6826} {"train_loss": -27.971210479736328, "global_step": 566592, "epoch": 6826} {"train_loss": -28.152624130249023, "global_step": 566593, "epoch": 6826} {"train_loss": -28.0723819732666, "global_step": 566594, "epoch": 6826} {"train_loss": -28.011316299438477, "global_step": 566595, "epoch": 6826} {"train_loss": -27.665754318237305, "global_step": 566596, "epoch": 6826} {"train_loss": -27.998971939086914, "global_step": 566597, "epoch": 6826} {"train_loss": -27.78338623046875, "global_step": 566598, "epoch": 6826} {"train_loss": -27.69459342956543, "global_step": 566599, "epoch": 6826} {"train_loss": -28.105121612548828, "global_step": 566600, "epoch": 6826} {"train_loss": -27.832250595092773, "global_step": 566601, "epoch": 6826} {"train_loss": -28.30997085571289, "global_step": 566602, "epoch": 6826} {"train_loss": -27.843759536743164, "global_step": 566603, "epoch": 6826} {"train_loss": -28.42365074157715, "global_step": 566604, "epoch": 6826} {"train_loss": -27.95131492614746, "global_step": 566605, "epoch": 6826} {"train_loss": -28.392902374267578, "global_step": 566606, "epoch": 6826} {"train_loss": -27.9476261138916, "global_step": 566607, "epoch": 6826} {"train_loss": -28.035175323486328, "global_step": 566608, "epoch": 6826} {"train_loss": -27.91843032836914, "global_step": 566609, "epoch": 6826} {"train_loss": -28.113447189331055, "global_step": 566610, "epoch": 6826} {"train_loss": -27.89838981628418, "global_step": 566611, "epoch": 6826} {"train_loss": -28.251617431640625, "global_step": 566612, "epoch": 6826} {"train_loss": -28.152332305908203, "global_step": 566613, "epoch": 6826} {"train_loss": -28.01896095275879, "global_step": 566614, "epoch": 6826} {"train_loss": -27.646963119506836, "global_step": 566615, "epoch": 6826} {"train_loss": -28.03207778930664, "global_step": 566616, "epoch": 6826} {"train_loss": -27.945850372314453, "global_step": 566617, "epoch": 6826} {"train_loss": -27.917707443237305, "global_step": 566618, "epoch": 6826} {"train_loss": -27.933349609375, "global_step": 566619, "epoch": 6826} {"train_loss": -27.86504554748535, "global_step": 566620, "epoch": 6826} {"train_loss": -27.846664428710938, "global_step": 566621, "epoch": 6826} {"train_loss": -27.43946647644043, "global_step": 566622, "epoch": 6826} {"train_loss": -27.745004653930664, "global_step": 566623, "epoch": 6826} {"train_loss": -28.098962783813477, "global_step": 566624, "epoch": 6826} {"train_loss": -27.866987228393555, "global_step": 566625, "epoch": 6826} {"train_loss": -27.714353561401367, "global_step": 566626, "epoch": 6826} {"train_loss": -27.56019401550293, "global_step": 566627, "epoch": 6826} {"train_loss": -27.62347412109375, "global_step": 566628, "epoch": 6826} {"train_loss": -27.407941818237305, "global_step": 566629, "epoch": 6826} {"train_loss": -27.0761661529541, "global_step": 566630, "epoch": 6826} {"train_loss": -27.890140533447266, "global_step": 566631, "epoch": 6826} {"train_loss": -27.704397201538086, "global_step": 566632, "epoch": 6826} {"train_loss": -27.327829360961914, "global_step": 566633, "epoch": 6826} {"train_loss": -27.414255142211914, "global_step": 566634, "epoch": 6826} {"train_loss": -27.582202911376953, "global_step": 566635, "epoch": 6826} {"train_loss": -27.495038986206055, "global_step": 566636, "epoch": 6826} {"train_loss": -27.73064613342285, "global_step": 566637, "epoch": 6826} {"train_loss": -28.11073112487793, "global_step": 566638, "epoch": 6826} {"train_loss": -27.36557388305664, "global_step": 566639, "epoch": 6826} {"train_loss": -27.71837243689112, "global_step": 566640, "epoch": 6826, "val_loss": 6655377.0} {"train_loss": -27.490848541259766, "global_step": 566641, "epoch": 6827} {"train_loss": -27.305871963500977, "global_step": 566642, "epoch": 6827} {"train_loss": -27.401159286499023, "global_step": 566643, "epoch": 6827} {"train_loss": -27.463525772094727, "global_step": 566644, "epoch": 6827} {"train_loss": -27.223539352416992, "global_step": 566645, "epoch": 6827} {"train_loss": -27.61623191833496, "global_step": 566646, "epoch": 6827} {"train_loss": -27.10293960571289, "global_step": 566647, "epoch": 6827} {"train_loss": -26.578954696655273, "global_step": 566648, "epoch": 6827} {"train_loss": -27.33808708190918, "global_step": 566649, "epoch": 6827} {"train_loss": -26.984745025634766, "global_step": 566650, "epoch": 6827} {"train_loss": -27.25984001159668, "global_step": 566651, "epoch": 6827} {"train_loss": -27.396656036376953, "global_step": 566652, "epoch": 6827} {"train_loss": -27.183435440063477, "global_step": 566653, "epoch": 6827} {"train_loss": -27.346012115478516, "global_step": 566654, "epoch": 6827} {"train_loss": -27.091779708862305, "global_step": 566655, "epoch": 6827} {"train_loss": -27.5811710357666, "global_step": 566656, "epoch": 6827} {"train_loss": -27.814496994018555, "global_step": 566657, "epoch": 6827} {"train_loss": -27.342182159423828, "global_step": 566658, "epoch": 6827} {"train_loss": -27.264631271362305, "global_step": 566659, "epoch": 6827} {"train_loss": -27.484851837158203, "global_step": 566660, "epoch": 6827} {"train_loss": -27.522619247436523, "global_step": 566661, "epoch": 6827} {"train_loss": -27.28242301940918, "global_step": 566662, "epoch": 6827} {"train_loss": -27.493574142456055, "global_step": 566663, "epoch": 6827} {"train_loss": -27.495208740234375, "global_step": 566664, "epoch": 6827} {"train_loss": -27.91920280456543, "global_step": 566665, "epoch": 6827} {"train_loss": -27.710132598876953, "global_step": 566666, "epoch": 6827} {"train_loss": -27.879541397094727, "global_step": 566667, "epoch": 6827} {"train_loss": -28.077239990234375, "global_step": 566668, "epoch": 6827} {"train_loss": -27.589248657226562, "global_step": 566669, "epoch": 6827} {"train_loss": -27.510833740234375, "global_step": 566670, "epoch": 6827} {"train_loss": -27.70639991760254, "global_step": 566671, "epoch": 6827} {"train_loss": -28.0616397857666, "global_step": 566672, "epoch": 6827} {"train_loss": -27.6003360748291, "global_step": 566673, "epoch": 6827} {"train_loss": -27.832691192626953, "global_step": 566674, "epoch": 6827} {"train_loss": -27.639453887939453, "global_step": 566675, "epoch": 6827} {"train_loss": -27.79134178161621, "global_step": 566676, "epoch": 6827} {"train_loss": -28.078933715820312, "global_step": 566677, "epoch": 6827} {"train_loss": -28.0089111328125, "global_step": 566678, "epoch": 6827} {"train_loss": -28.11773109436035, "global_step": 566679, "epoch": 6827} {"train_loss": -27.79766273498535, "global_step": 566680, "epoch": 6827} {"train_loss": -27.93406105041504, "global_step": 566681, "epoch": 6827} {"train_loss": -28.297657012939453, "global_step": 566682, "epoch": 6827} {"train_loss": -27.78314208984375, "global_step": 566683, "epoch": 6827} {"train_loss": -27.891345977783203, "global_step": 566684, "epoch": 6827} {"train_loss": -28.13584327697754, "global_step": 566685, "epoch": 6827} {"train_loss": -27.69537353515625, "global_step": 566686, "epoch": 6827} {"train_loss": -27.990192413330078, "global_step": 566687, "epoch": 6827} {"train_loss": -27.935007095336914, "global_step": 566688, "epoch": 6827} {"train_loss": -27.93842887878418, "global_step": 566689, "epoch": 6827} {"train_loss": -27.96009635925293, "global_step": 566690, "epoch": 6827} {"train_loss": -28.142608642578125, "global_step": 566691, "epoch": 6827} {"train_loss": -27.751066207885742, "global_step": 566692, "epoch": 6827} {"train_loss": -27.96356773376465, "global_step": 566693, "epoch": 6827} {"train_loss": -27.8958797454834, "global_step": 566694, "epoch": 6827} {"train_loss": -27.885791778564453, "global_step": 566695, "epoch": 6827} {"train_loss": -28.100605010986328, "global_step": 566696, "epoch": 6827} {"train_loss": -28.155698776245117, "global_step": 566697, "epoch": 6827} {"train_loss": -28.207632064819336, "global_step": 566698, "epoch": 6827} {"train_loss": -28.198949813842773, "global_step": 566699, "epoch": 6827} {"train_loss": -28.138402938842773, "global_step": 566700, "epoch": 6827} {"train_loss": -28.17959976196289, "global_step": 566701, "epoch": 6827} {"train_loss": -28.11859703063965, "global_step": 566702, "epoch": 6827} {"train_loss": -27.749975204467773, "global_step": 566703, "epoch": 6827} {"train_loss": -27.880462646484375, "global_step": 566704, "epoch": 6827} {"train_loss": -28.146207809448242, "global_step": 566705, "epoch": 6827} {"train_loss": -27.792022705078125, "global_step": 566706, "epoch": 6827} {"train_loss": -27.752832412719727, "global_step": 566707, "epoch": 6827} {"train_loss": -27.487628936767578, "global_step": 566708, "epoch": 6827} {"train_loss": -27.819860458374023, "global_step": 566709, "epoch": 6827} {"train_loss": -27.41114616394043, "global_step": 566710, "epoch": 6827} {"train_loss": -27.839492797851562, "global_step": 566711, "epoch": 6827} {"train_loss": -27.90372657775879, "global_step": 566712, "epoch": 6827} {"train_loss": -27.699512481689453, "global_step": 566713, "epoch": 6827} {"train_loss": -27.896991729736328, "global_step": 566714, "epoch": 6827} {"train_loss": -27.81342887878418, "global_step": 566715, "epoch": 6827} {"train_loss": -27.587390899658203, "global_step": 566716, "epoch": 6827} {"train_loss": -28.323760986328125, "global_step": 566717, "epoch": 6827} {"train_loss": -27.987995147705078, "global_step": 566718, "epoch": 6827} {"train_loss": -27.57398796081543, "global_step": 566719, "epoch": 6827} {"train_loss": -26.991321563720703, "global_step": 566720, "epoch": 6827} {"train_loss": -25.27811050415039, "global_step": 566721, "epoch": 6827} {"train_loss": -24.678119659423828, "global_step": 566722, "epoch": 6827} {"train_loss": -27.62142293998994, "global_step": 566723, "epoch": 6827, "val_loss": 6483560.5} {"train_loss": -26.4803409576416, "global_step": 566724, "epoch": 6828} {"train_loss": -24.173093795776367, "global_step": 566725, "epoch": 6828} {"train_loss": -26.285375595092773, "global_step": 566726, "epoch": 6828} {"train_loss": -25.11318016052246, "global_step": 566727, "epoch": 6828} {"train_loss": -25.88661003112793, "global_step": 566728, "epoch": 6828} {"train_loss": -26.176441192626953, "global_step": 566729, "epoch": 6828} {"train_loss": -26.11700439453125, "global_step": 566730, "epoch": 6828} {"train_loss": -26.00226402282715, "global_step": 566731, "epoch": 6828} {"train_loss": -26.282018661499023, "global_step": 566732, "epoch": 6828} {"train_loss": -26.790647506713867, "global_step": 566733, "epoch": 6828} {"train_loss": -26.153217315673828, "global_step": 566734, "epoch": 6828} {"train_loss": -26.398691177368164, "global_step": 566735, "epoch": 6828} {"train_loss": -26.67909049987793, "global_step": 566736, "epoch": 6828} {"train_loss": -26.338308334350586, "global_step": 566737, "epoch": 6828} {"train_loss": -26.14396095275879, "global_step": 566738, "epoch": 6828} {"train_loss": -26.75604248046875, "global_step": 566739, "epoch": 6828} {"train_loss": -26.630483627319336, "global_step": 566740, "epoch": 6828} {"train_loss": -26.76460838317871, "global_step": 566741, "epoch": 6828} {"train_loss": -26.69189453125, "global_step": 566742, "epoch": 6828} {"train_loss": -27.030729293823242, "global_step": 566743, "epoch": 6828} {"train_loss": -27.05695915222168, "global_step": 566744, "epoch": 6828} {"train_loss": -27.288366317749023, "global_step": 566745, "epoch": 6828} {"train_loss": -26.713092803955078, "global_step": 566746, "epoch": 6828} {"train_loss": -27.032617568969727, "global_step": 566747, "epoch": 6828} {"train_loss": -26.984149932861328, "global_step": 566748, "epoch": 6828} {"train_loss": -27.357824325561523, "global_step": 566749, "epoch": 6828} {"train_loss": -27.110034942626953, "global_step": 566750, "epoch": 6828} {"train_loss": -27.273977279663086, "global_step": 566751, "epoch": 6828} {"train_loss": -27.452320098876953, "global_step": 566752, "epoch": 6828} {"train_loss": -27.420862197875977, "global_step": 566753, "epoch": 6828} {"train_loss": -27.32293701171875, "global_step": 566754, "epoch": 6828} {"train_loss": -26.99542808532715, "global_step": 566755, "epoch": 6828} {"train_loss": -27.509958267211914, "global_step": 566756, "epoch": 6828} {"train_loss": -27.26790428161621, "global_step": 566757, "epoch": 6828} {"train_loss": -27.469350814819336, "global_step": 566758, "epoch": 6828} {"train_loss": -27.413557052612305, "global_step": 566759, "epoch": 6828} {"train_loss": -27.73859977722168, "global_step": 566760, "epoch": 6828} {"train_loss": -27.468276977539062, "global_step": 566761, "epoch": 6828} {"train_loss": -27.568408966064453, "global_step": 566762, "epoch": 6828} {"train_loss": -27.237995147705078, "global_step": 566763, "epoch": 6828} {"train_loss": -27.554529190063477, "global_step": 566764, "epoch": 6828} {"train_loss": -27.62249755859375, "global_step": 566765, "epoch": 6828} {"train_loss": -27.942157745361328, "global_step": 566766, "epoch": 6828} {"train_loss": -27.866666793823242, "global_step": 566767, "epoch": 6828} {"train_loss": -27.97707176208496, "global_step": 566768, "epoch": 6828} {"train_loss": -27.851789474487305, "global_step": 566769, "epoch": 6828} {"train_loss": -27.603580474853516, "global_step": 566770, "epoch": 6828} {"train_loss": -27.995431900024414, "global_step": 566771, "epoch": 6828} {"train_loss": -27.666776657104492, "global_step": 566772, "epoch": 6828} {"train_loss": -27.685338973999023, "global_step": 566773, "epoch": 6828} {"train_loss": -27.737695693969727, "global_step": 566774, "epoch": 6828} {"train_loss": -28.02471923828125, "global_step": 566775, "epoch": 6828} {"train_loss": -28.04962158203125, "global_step": 566776, "epoch": 6828} {"train_loss": -27.880420684814453, "global_step": 566777, "epoch": 6828} {"train_loss": -28.063642501831055, "global_step": 566778, "epoch": 6828} {"train_loss": -27.6612548828125, "global_step": 566779, "epoch": 6828} {"train_loss": -27.825544357299805, "global_step": 566780, "epoch": 6828} {"train_loss": -28.112287521362305, "global_step": 566781, "epoch": 6828} {"train_loss": -28.063024520874023, "global_step": 566782, "epoch": 6828} {"train_loss": -27.837488174438477, "global_step": 566783, "epoch": 6828} {"train_loss": -27.94117546081543, "global_step": 566784, "epoch": 6828} {"train_loss": -27.9678955078125, "global_step": 566785, "epoch": 6828} {"train_loss": -28.305639266967773, "global_step": 566786, "epoch": 6828} {"train_loss": -28.178943634033203, "global_step": 566787, "epoch": 6828} {"train_loss": -27.6929931640625, "global_step": 566788, "epoch": 6828} {"train_loss": -28.21875, "global_step": 566789, "epoch": 6828} {"train_loss": -27.892271041870117, "global_step": 566790, "epoch": 6828} {"train_loss": -27.972183227539062, "global_step": 566791, "epoch": 6828} {"train_loss": -28.263996124267578, "global_step": 566792, "epoch": 6828} {"train_loss": -27.088937759399414, "global_step": 566793, "epoch": 6828} {"train_loss": -27.373559951782227, "global_step": 566794, "epoch": 6828} {"train_loss": -27.76228904724121, "global_step": 566795, "epoch": 6828} {"train_loss": -27.903470993041992, "global_step": 566796, "epoch": 6828} {"train_loss": -27.457691192626953, "global_step": 566797, "epoch": 6828} {"train_loss": -27.598968505859375, "global_step": 566798, "epoch": 6828} {"train_loss": -27.80596351623535, "global_step": 566799, "epoch": 6828} {"train_loss": -28.14352798461914, "global_step": 566800, "epoch": 6828} {"train_loss": -27.8187255859375, "global_step": 566801, "epoch": 6828} {"train_loss": -27.789936065673828, "global_step": 566802, "epoch": 6828} {"train_loss": -28.018888473510742, "global_step": 566803, "epoch": 6828} {"train_loss": -27.899015426635742, "global_step": 566804, "epoch": 6828} {"train_loss": -28.00282096862793, "global_step": 566805, "epoch": 6828} {"train_loss": -27.320064085075654, "global_step": 566806, "epoch": 6828, "val_loss": 6780390.0} {"train_loss": -27.83042335510254, "global_step": 566807, "epoch": 6829} {"train_loss": -27.672391891479492, "global_step": 566808, "epoch": 6829} {"train_loss": -27.436933517456055, "global_step": 566809, "epoch": 6829} {"train_loss": -27.330921173095703, "global_step": 566810, "epoch": 6829} {"train_loss": -27.18702507019043, "global_step": 566811, "epoch": 6829} {"train_loss": -27.3778076171875, "global_step": 566812, "epoch": 6829} {"train_loss": -27.33246421813965, "global_step": 566813, "epoch": 6829} {"train_loss": -27.608184814453125, "global_step": 566814, "epoch": 6829} {"train_loss": -27.54216957092285, "global_step": 566815, "epoch": 6829} {"train_loss": -27.48826026916504, "global_step": 566816, "epoch": 6829} {"train_loss": -27.58377456665039, "global_step": 566817, "epoch": 6829} {"train_loss": -27.601621627807617, "global_step": 566818, "epoch": 6829} {"train_loss": -27.048566818237305, "global_step": 566819, "epoch": 6829} {"train_loss": -27.408435821533203, "global_step": 566820, "epoch": 6829} {"train_loss": -27.818958282470703, "global_step": 566821, "epoch": 6829} {"train_loss": -27.8659610748291, "global_step": 566822, "epoch": 6829} {"train_loss": -27.883886337280273, "global_step": 566823, "epoch": 6829} {"train_loss": -28.095285415649414, "global_step": 566824, "epoch": 6829} {"train_loss": -27.920394897460938, "global_step": 566825, "epoch": 6829} {"train_loss": -27.774362564086914, "global_step": 566826, "epoch": 6829} {"train_loss": -28.1704044342041, "global_step": 566827, "epoch": 6829} {"train_loss": -27.792814254760742, "global_step": 566828, "epoch": 6829} {"train_loss": -27.909616470336914, "global_step": 566829, "epoch": 6829} {"train_loss": -27.924579620361328, "global_step": 566830, "epoch": 6829} {"train_loss": -27.80463981628418, "global_step": 566831, "epoch": 6829} {"train_loss": -27.90939712524414, "global_step": 566832, "epoch": 6829} {"train_loss": -28.06536865234375, "global_step": 566833, "epoch": 6829} {"train_loss": -27.791400909423828, "global_step": 566834, "epoch": 6829} {"train_loss": -28.01710319519043, "global_step": 566835, "epoch": 6829} {"train_loss": -27.7421817779541, "global_step": 566836, "epoch": 6829} {"train_loss": -28.137161254882812, "global_step": 566837, "epoch": 6829} {"train_loss": -27.64609146118164, "global_step": 566838, "epoch": 6829} {"train_loss": -27.91806411743164, "global_step": 566839, "epoch": 6829} {"train_loss": -28.04842185974121, "global_step": 566840, "epoch": 6829} {"train_loss": -28.050756454467773, "global_step": 566841, "epoch": 6829} {"train_loss": -27.9221248626709, "global_step": 566842, "epoch": 6829} {"train_loss": -27.83487892150879, "global_step": 566843, "epoch": 6829} {"train_loss": -28.04953956604004, "global_step": 566844, "epoch": 6829} {"train_loss": -28.00172233581543, "global_step": 566845, "epoch": 6829} {"train_loss": -28.04005241394043, "global_step": 566846, "epoch": 6829} {"train_loss": -27.6783390045166, "global_step": 566847, "epoch": 6829} {"train_loss": -27.901025772094727, "global_step": 566848, "epoch": 6829} {"train_loss": -27.9029541015625, "global_step": 566849, "epoch": 6829} {"train_loss": -28.243879318237305, "global_step": 566850, "epoch": 6829} {"train_loss": -27.778400421142578, "global_step": 566851, "epoch": 6829} {"train_loss": -27.962173461914062, "global_step": 566852, "epoch": 6829} {"train_loss": -27.909433364868164, "global_step": 566853, "epoch": 6829} {"train_loss": -28.292144775390625, "global_step": 566854, "epoch": 6829} {"train_loss": -27.63946533203125, "global_step": 566855, "epoch": 6829} {"train_loss": -28.00567054748535, "global_step": 566856, "epoch": 6829} {"train_loss": -28.0242919921875, "global_step": 566857, "epoch": 6829} {"train_loss": -27.721426010131836, "global_step": 566858, "epoch": 6829} {"train_loss": -27.703372955322266, "global_step": 566859, "epoch": 6829} {"train_loss": -27.758651733398438, "global_step": 566860, "epoch": 6829} {"train_loss": -27.754865646362305, "global_step": 566861, "epoch": 6829} {"train_loss": -27.676660537719727, "global_step": 566862, "epoch": 6829} {"train_loss": -27.726404190063477, "global_step": 566863, "epoch": 6829} {"train_loss": -27.975473403930664, "global_step": 566864, "epoch": 6829} {"train_loss": -27.940759658813477, "global_step": 566865, "epoch": 6829} {"train_loss": -28.17987632751465, "global_step": 566866, "epoch": 6829} {"train_loss": -27.579395294189453, "global_step": 566867, "epoch": 6829} {"train_loss": -27.915143966674805, "global_step": 566868, "epoch": 6829} {"train_loss": -27.800586700439453, "global_step": 566869, "epoch": 6829} {"train_loss": -28.071292877197266, "global_step": 566870, "epoch": 6829} {"train_loss": -28.147241592407227, "global_step": 566871, "epoch": 6829} {"train_loss": -28.1527156829834, "global_step": 566872, "epoch": 6829} {"train_loss": -27.608585357666016, "global_step": 566873, "epoch": 6829} {"train_loss": -27.65020751953125, "global_step": 566874, "epoch": 6829} {"train_loss": -27.581085205078125, "global_step": 566875, "epoch": 6829} {"train_loss": -27.6218204498291, "global_step": 566876, "epoch": 6829} {"train_loss": -28.095508575439453, "global_step": 566877, "epoch": 6829} {"train_loss": -27.84919548034668, "global_step": 566878, "epoch": 6829} {"train_loss": -27.85097312927246, "global_step": 566879, "epoch": 6829} {"train_loss": -27.71356201171875, "global_step": 566880, "epoch": 6829} {"train_loss": -28.056020736694336, "global_step": 566881, "epoch": 6829} {"train_loss": -27.919086456298828, "global_step": 566882, "epoch": 6829} {"train_loss": -28.002155303955078, "global_step": 566883, "epoch": 6829} {"train_loss": -27.831602096557617, "global_step": 566884, "epoch": 6829} {"train_loss": -27.704370498657227, "global_step": 566885, "epoch": 6829} {"train_loss": -28.418561935424805, "global_step": 566886, "epoch": 6829} {"train_loss": -27.78950309753418, "global_step": 566887, "epoch": 6829} {"train_loss": -27.852598190307617, "global_step": 566888, "epoch": 6829} {"train_loss": -27.816475328192652, "global_step": 566889, "epoch": 6829, "val_loss": 6817782.0} {"train_loss": -27.57427406311035, "global_step": 566890, "epoch": 6830} {"train_loss": -25.264251708984375, "global_step": 566891, "epoch": 6830} {"train_loss": -23.02752685546875, "global_step": 566892, "epoch": 6830} {"train_loss": -26.7835636138916, "global_step": 566893, "epoch": 6830} {"train_loss": -24.99251937866211, "global_step": 566894, "epoch": 6830} {"train_loss": -26.841754913330078, "global_step": 566895, "epoch": 6830} {"train_loss": -25.63492202758789, "global_step": 566896, "epoch": 6830} {"train_loss": -26.417438507080078, "global_step": 566897, "epoch": 6830} {"train_loss": -26.889541625976562, "global_step": 566898, "epoch": 6830} {"train_loss": -25.712543487548828, "global_step": 566899, "epoch": 6830} {"train_loss": -26.43194007873535, "global_step": 566900, "epoch": 6830} {"train_loss": -26.77667808532715, "global_step": 566901, "epoch": 6830} {"train_loss": -26.934436798095703, "global_step": 566902, "epoch": 6830} {"train_loss": -26.840087890625, "global_step": 566903, "epoch": 6830} {"train_loss": -26.945892333984375, "global_step": 566904, "epoch": 6830} {"train_loss": -27.058795928955078, "global_step": 566905, "epoch": 6830} {"train_loss": -27.117252349853516, "global_step": 566906, "epoch": 6830} {"train_loss": -26.98935317993164, "global_step": 566907, "epoch": 6830} {"train_loss": -27.00489616394043, "global_step": 566908, "epoch": 6830} {"train_loss": -27.15142822265625, "global_step": 566909, "epoch": 6830} {"train_loss": -26.83731460571289, "global_step": 566910, "epoch": 6830} {"train_loss": -26.88404655456543, "global_step": 566911, "epoch": 6830} {"train_loss": -27.076068878173828, "global_step": 566912, "epoch": 6830} {"train_loss": -27.172529220581055, "global_step": 566913, "epoch": 6830} {"train_loss": -27.244909286499023, "global_step": 566914, "epoch": 6830} {"train_loss": -27.430240631103516, "global_step": 566915, "epoch": 6830} {"train_loss": -27.09393310546875, "global_step": 566916, "epoch": 6830} {"train_loss": -27.270614624023438, "global_step": 566917, "epoch": 6830} {"train_loss": -27.329755783081055, "global_step": 566918, "epoch": 6830} {"train_loss": -27.377225875854492, "global_step": 566919, "epoch": 6830} {"train_loss": -27.559009552001953, "global_step": 566920, "epoch": 6830} {"train_loss": -27.522558212280273, "global_step": 566921, "epoch": 6830} {"train_loss": -27.47607421875, "global_step": 566922, "epoch": 6830} {"train_loss": -27.262460708618164, "global_step": 566923, "epoch": 6830} {"train_loss": -27.6357421875, "global_step": 566924, "epoch": 6830} {"train_loss": -27.496381759643555, "global_step": 566925, "epoch": 6830} {"train_loss": -27.724273681640625, "global_step": 566926, "epoch": 6830} {"train_loss": -27.45133399963379, "global_step": 566927, "epoch": 6830} {"train_loss": -27.669519424438477, "global_step": 566928, "epoch": 6830} {"train_loss": -27.81720542907715, "global_step": 566929, "epoch": 6830} {"train_loss": -27.745214462280273, "global_step": 566930, "epoch": 6830} {"train_loss": -27.352054595947266, "global_step": 566931, "epoch": 6830} {"train_loss": -27.542224884033203, "global_step": 566932, "epoch": 6830} {"train_loss": -27.55909538269043, "global_step": 566933, "epoch": 6830} {"train_loss": -27.60076904296875, "global_step": 566934, "epoch": 6830} {"train_loss": -27.359649658203125, "global_step": 566935, "epoch": 6830} {"train_loss": -27.887409210205078, "global_step": 566936, "epoch": 6830} {"train_loss": -27.668701171875, "global_step": 566937, "epoch": 6830} {"train_loss": -27.810476303100586, "global_step": 566938, "epoch": 6830} {"train_loss": -27.652881622314453, "global_step": 566939, "epoch": 6830} {"train_loss": -28.171066284179688, "global_step": 566940, "epoch": 6830} {"train_loss": -28.090539932250977, "global_step": 566941, "epoch": 6830} {"train_loss": -27.519733428955078, "global_step": 566942, "epoch": 6830} {"train_loss": -27.987516403198242, "global_step": 566943, "epoch": 6830} {"train_loss": -27.73236656188965, "global_step": 566944, "epoch": 6830} {"train_loss": -27.690160751342773, "global_step": 566945, "epoch": 6830} {"train_loss": -27.846200942993164, "global_step": 566946, "epoch": 6830} {"train_loss": -27.8881893157959, "global_step": 566947, "epoch": 6830} {"train_loss": -28.070520401000977, "global_step": 566948, "epoch": 6830} {"train_loss": -27.977741241455078, "global_step": 566949, "epoch": 6830} {"train_loss": -27.904438018798828, "global_step": 566950, "epoch": 6830} {"train_loss": -28.114599227905273, "global_step": 566951, "epoch": 6830} {"train_loss": -27.943845748901367, "global_step": 566952, "epoch": 6830} {"train_loss": -27.728382110595703, "global_step": 566953, "epoch": 6830} {"train_loss": -27.75776481628418, "global_step": 566954, "epoch": 6830} {"train_loss": -27.8319034576416, "global_step": 566955, "epoch": 6830} {"train_loss": -28.01918601989746, "global_step": 566956, "epoch": 6830} {"train_loss": -27.67042350769043, "global_step": 566957, "epoch": 6830} {"train_loss": -27.735464096069336, "global_step": 566958, "epoch": 6830} {"train_loss": -27.425296783447266, "global_step": 566959, "epoch": 6830} {"train_loss": -27.754201889038086, "global_step": 566960, "epoch": 6830} {"train_loss": -27.6949520111084, "global_step": 566961, "epoch": 6830} {"train_loss": -28.26702880859375, "global_step": 566962, "epoch": 6830} {"train_loss": -27.91037368774414, "global_step": 566963, "epoch": 6830} {"train_loss": -27.504608154296875, "global_step": 566964, "epoch": 6830} {"train_loss": -27.74717140197754, "global_step": 566965, "epoch": 6830} {"train_loss": -27.25189208984375, "global_step": 566966, "epoch": 6830} {"train_loss": -27.031110763549805, "global_step": 566967, "epoch": 6830} {"train_loss": -27.632123947143555, "global_step": 566968, "epoch": 6830} {"train_loss": -27.869354248046875, "global_step": 566969, "epoch": 6830} {"train_loss": -27.323522567749023, "global_step": 566970, "epoch": 6830} {"train_loss": -27.7327823638916, "global_step": 566971, "epoch": 6830} {"train_loss": -27.317880055990564, "global_step": 566972, "epoch": 6830, "val_loss": 6810621.0} {"train_loss": -26.800867080688477, "global_step": 566973, "epoch": 6831} {"train_loss": -27.181900024414062, "global_step": 566974, "epoch": 6831} {"train_loss": -27.55116844177246, "global_step": 566975, "epoch": 6831} {"train_loss": -27.450519561767578, "global_step": 566976, "epoch": 6831} {"train_loss": -27.2517032623291, "global_step": 566977, "epoch": 6831} {"train_loss": -27.23311424255371, "global_step": 566978, "epoch": 6831} {"train_loss": -27.48480224609375, "global_step": 566979, "epoch": 6831} {"train_loss": -27.409543991088867, "global_step": 566980, "epoch": 6831} {"train_loss": -27.503324508666992, "global_step": 566981, "epoch": 6831} {"train_loss": -27.337106704711914, "global_step": 566982, "epoch": 6831} {"train_loss": -27.47344970703125, "global_step": 566983, "epoch": 6831} {"train_loss": -27.514795303344727, "global_step": 566984, "epoch": 6831} {"train_loss": -27.804443359375, "global_step": 566985, "epoch": 6831} {"train_loss": -27.720264434814453, "global_step": 566986, "epoch": 6831} {"train_loss": -27.946813583374023, "global_step": 566987, "epoch": 6831} {"train_loss": -27.72938346862793, "global_step": 566988, "epoch": 6831} {"train_loss": -27.89753532409668, "global_step": 566989, "epoch": 6831} {"train_loss": -27.793292999267578, "global_step": 566990, "epoch": 6831} {"train_loss": -27.868392944335938, "global_step": 566991, "epoch": 6831} {"train_loss": -27.722335815429688, "global_step": 566992, "epoch": 6831} {"train_loss": -27.939706802368164, "global_step": 566993, "epoch": 6831} {"train_loss": -28.085067749023438, "global_step": 566994, "epoch": 6831} {"train_loss": -27.545059204101562, "global_step": 566995, "epoch": 6831} {"train_loss": -27.534244537353516, "global_step": 566996, "epoch": 6831} {"train_loss": -27.928619384765625, "global_step": 566997, "epoch": 6831} {"train_loss": -28.193897247314453, "global_step": 566998, "epoch": 6831} {"train_loss": -27.836652755737305, "global_step": 566999, "epoch": 6831} {"train_loss": -27.583932876586914, "global_step": 567000, "epoch": 6831} {"train_loss": -27.641010284423828, "global_step": 567001, "epoch": 6831} {"train_loss": -27.877853393554688, "global_step": 567002, "epoch": 6831} {"train_loss": -27.839202880859375, "global_step": 567003, "epoch": 6831} {"train_loss": -27.632278442382812, "global_step": 567004, "epoch": 6831} {"train_loss": -27.780536651611328, "global_step": 567005, "epoch": 6831} {"train_loss": -27.802066802978516, "global_step": 567006, "epoch": 6831} {"train_loss": -27.908212661743164, "global_step": 567007, "epoch": 6831} {"train_loss": -28.135528564453125, "global_step": 567008, "epoch": 6831} {"train_loss": -27.913288116455078, "global_step": 567009, "epoch": 6831} {"train_loss": -27.88960075378418, "global_step": 567010, "epoch": 6831} {"train_loss": -27.647336959838867, "global_step": 567011, "epoch": 6831} {"train_loss": -28.009098052978516, "global_step": 567012, "epoch": 6831} {"train_loss": -27.90236473083496, "global_step": 567013, "epoch": 6831} {"train_loss": -27.709064483642578, "global_step": 567014, "epoch": 6831} {"train_loss": -27.764738082885742, "global_step": 567015, "epoch": 6831} {"train_loss": -27.812149047851562, "global_step": 567016, "epoch": 6831} {"train_loss": -28.433942794799805, "global_step": 567017, "epoch": 6831} {"train_loss": -28.27680778503418, "global_step": 567018, "epoch": 6831} {"train_loss": -28.009906768798828, "global_step": 567019, "epoch": 6831} {"train_loss": -27.657957077026367, "global_step": 567020, "epoch": 6831} {"train_loss": -27.534955978393555, "global_step": 567021, "epoch": 6831} {"train_loss": -27.635242462158203, "global_step": 567022, "epoch": 6831} {"train_loss": -27.37652587890625, "global_step": 567023, "epoch": 6831} {"train_loss": -26.8421573638916, "global_step": 567024, "epoch": 6831} {"train_loss": -27.286670684814453, "global_step": 567025, "epoch": 6831} {"train_loss": -27.86978530883789, "global_step": 567026, "epoch": 6831} {"train_loss": -27.51563835144043, "global_step": 567027, "epoch": 6831} {"train_loss": -27.145751953125, "global_step": 567028, "epoch": 6831} {"train_loss": -27.192779541015625, "global_step": 567029, "epoch": 6831} {"train_loss": -27.458669662475586, "global_step": 567030, "epoch": 6831} {"train_loss": -27.51163673400879, "global_step": 567031, "epoch": 6831} {"train_loss": -27.499164581298828, "global_step": 567032, "epoch": 6831} {"train_loss": -27.423620223999023, "global_step": 567033, "epoch": 6831} {"train_loss": -27.71600341796875, "global_step": 567034, "epoch": 6831} {"train_loss": -27.518766403198242, "global_step": 567035, "epoch": 6831} {"train_loss": -27.38286781311035, "global_step": 567036, "epoch": 6831} {"train_loss": -27.78839683532715, "global_step": 567037, "epoch": 6831} {"train_loss": -27.520917892456055, "global_step": 567038, "epoch": 6831} {"train_loss": -27.7203311920166, "global_step": 567039, "epoch": 6831} {"train_loss": -27.74554443359375, "global_step": 567040, "epoch": 6831} {"train_loss": -27.503381729125977, "global_step": 567041, "epoch": 6831} {"train_loss": -27.587400436401367, "global_step": 567042, "epoch": 6831} {"train_loss": -27.522754669189453, "global_step": 567043, "epoch": 6831} {"train_loss": -27.538293838500977, "global_step": 567044, "epoch": 6831} {"train_loss": -27.319482803344727, "global_step": 567045, "epoch": 6831} {"train_loss": -28.180830001831055, "global_step": 567046, "epoch": 6831} {"train_loss": -27.798572540283203, "global_step": 567047, "epoch": 6831} {"train_loss": -27.522693634033203, "global_step": 567048, "epoch": 6831} {"train_loss": -27.804492950439453, "global_step": 567049, "epoch": 6831} {"train_loss": -27.74342155456543, "global_step": 567050, "epoch": 6831} {"train_loss": -27.8869571685791, "global_step": 567051, "epoch": 6831} {"train_loss": -27.42400550842285, "global_step": 567052, "epoch": 6831} {"train_loss": -27.976709365844727, "global_step": 567053, "epoch": 6831} {"train_loss": -28.053647994995117, "global_step": 567054, "epoch": 6831} {"train_loss": -27.639206897781555, "global_step": 567055, "epoch": 6831, "val_loss": 6820058.0} {"train_loss": -26.724645614624023, "global_step": 567056, "epoch": 6832} {"train_loss": -27.270627975463867, "global_step": 567057, "epoch": 6832} {"train_loss": -26.85956382751465, "global_step": 567058, "epoch": 6832} {"train_loss": -27.296289443969727, "global_step": 567059, "epoch": 6832} {"train_loss": -27.531293869018555, "global_step": 567060, "epoch": 6832} {"train_loss": -26.884328842163086, "global_step": 567061, "epoch": 6832} {"train_loss": -27.477832794189453, "global_step": 567062, "epoch": 6832} {"train_loss": -27.6075439453125, "global_step": 567063, "epoch": 6832} {"train_loss": -27.4349422454834, "global_step": 567064, "epoch": 6832} {"train_loss": -27.46124839782715, "global_step": 567065, "epoch": 6832} {"train_loss": -27.35053825378418, "global_step": 567066, "epoch": 6832} {"train_loss": -27.386621475219727, "global_step": 567067, "epoch": 6832} {"train_loss": -27.514816284179688, "global_step": 567068, "epoch": 6832} {"train_loss": -27.363784790039062, "global_step": 567069, "epoch": 6832} {"train_loss": -27.623279571533203, "global_step": 567070, "epoch": 6832} {"train_loss": -27.71954917907715, "global_step": 567071, "epoch": 6832} {"train_loss": -28.0253963470459, "global_step": 567072, "epoch": 6832} {"train_loss": -28.103565216064453, "global_step": 567073, "epoch": 6832} {"train_loss": -27.482229232788086, "global_step": 567074, "epoch": 6832} {"train_loss": -27.6719913482666, "global_step": 567075, "epoch": 6832} {"train_loss": -27.877166748046875, "global_step": 567076, "epoch": 6832} {"train_loss": -27.753250122070312, "global_step": 567077, "epoch": 6832} {"train_loss": -27.569477081298828, "global_step": 567078, "epoch": 6832} {"train_loss": -27.853107452392578, "global_step": 567079, "epoch": 6832} {"train_loss": -27.866315841674805, "global_step": 567080, "epoch": 6832} {"train_loss": -27.725351333618164, "global_step": 567081, "epoch": 6832} {"train_loss": -27.994665145874023, "global_step": 567082, "epoch": 6832} {"train_loss": -27.4001522064209, "global_step": 567083, "epoch": 6832} {"train_loss": -27.4869384765625, "global_step": 567084, "epoch": 6832} {"train_loss": -27.730077743530273, "global_step": 567085, "epoch": 6832} {"train_loss": -28.109243392944336, "global_step": 567086, "epoch": 6832} {"train_loss": -27.77728843688965, "global_step": 567087, "epoch": 6832} {"train_loss": -27.83643913269043, "global_step": 567088, "epoch": 6832} {"train_loss": -27.744230270385742, "global_step": 567089, "epoch": 6832} {"train_loss": -28.021472930908203, "global_step": 567090, "epoch": 6832} {"train_loss": -27.902597427368164, "global_step": 567091, "epoch": 6832} {"train_loss": -27.52546501159668, "global_step": 567092, "epoch": 6832} {"train_loss": -27.701587677001953, "global_step": 567093, "epoch": 6832} {"train_loss": -27.926345825195312, "global_step": 567094, "epoch": 6832} {"train_loss": -28.465368270874023, "global_step": 567095, "epoch": 6832} {"train_loss": -28.3013858795166, "global_step": 567096, "epoch": 6832} {"train_loss": -27.75638771057129, "global_step": 567097, "epoch": 6832} {"train_loss": -28.2642879486084, "global_step": 567098, "epoch": 6832} {"train_loss": -27.888690948486328, "global_step": 567099, "epoch": 6832} {"train_loss": -28.134002685546875, "global_step": 567100, "epoch": 6832} {"train_loss": -27.990819931030273, "global_step": 567101, "epoch": 6832} {"train_loss": -28.210235595703125, "global_step": 567102, "epoch": 6832} {"train_loss": -28.0638370513916, "global_step": 567103, "epoch": 6832} {"train_loss": -28.025724411010742, "global_step": 567104, "epoch": 6832} {"train_loss": -27.871335983276367, "global_step": 567105, "epoch": 6832} {"train_loss": -27.54107666015625, "global_step": 567106, "epoch": 6832} {"train_loss": -27.988513946533203, "global_step": 567107, "epoch": 6832} {"train_loss": -27.618976593017578, "global_step": 567108, "epoch": 6832} {"train_loss": -27.986448287963867, "global_step": 567109, "epoch": 6832} {"train_loss": -28.158178329467773, "global_step": 567110, "epoch": 6832} {"train_loss": -27.840009689331055, "global_step": 567111, "epoch": 6832} {"train_loss": -27.78900718688965, "global_step": 567112, "epoch": 6832} {"train_loss": -27.899444580078125, "global_step": 567113, "epoch": 6832} {"train_loss": -27.891357421875, "global_step": 567114, "epoch": 6832} {"train_loss": -28.263418197631836, "global_step": 567115, "epoch": 6832} {"train_loss": -27.8065128326416, "global_step": 567116, "epoch": 6832} {"train_loss": -28.03639793395996, "global_step": 567117, "epoch": 6832} {"train_loss": -27.715808868408203, "global_step": 567118, "epoch": 6832} {"train_loss": -27.58685874938965, "global_step": 567119, "epoch": 6832} {"train_loss": -27.4816951751709, "global_step": 567120, "epoch": 6832} {"train_loss": -27.371335983276367, "global_step": 567121, "epoch": 6832} {"train_loss": -27.841474533081055, "global_step": 567122, "epoch": 6832} {"train_loss": -28.203271865844727, "global_step": 567123, "epoch": 6832} {"train_loss": -27.86726951599121, "global_step": 567124, "epoch": 6832} {"train_loss": -28.024808883666992, "global_step": 567125, "epoch": 6832} {"train_loss": -27.466266632080078, "global_step": 567126, "epoch": 6832} {"train_loss": -28.209421157836914, "global_step": 567127, "epoch": 6832} {"train_loss": -28.15109634399414, "global_step": 567128, "epoch": 6832} {"train_loss": -27.925296783447266, "global_step": 567129, "epoch": 6832} {"train_loss": -27.846424102783203, "global_step": 567130, "epoch": 6832} {"train_loss": -27.702314376831055, "global_step": 567131, "epoch": 6832} {"train_loss": -27.63298988342285, "global_step": 567132, "epoch": 6832} {"train_loss": -28.08757972717285, "global_step": 567133, "epoch": 6832} {"train_loss": -27.894224166870117, "global_step": 567134, "epoch": 6832} {"train_loss": -27.9505672454834, "global_step": 567135, "epoch": 6832} {"train_loss": -27.566076278686523, "global_step": 567136, "epoch": 6832} {"train_loss": -27.764699935913086, "global_step": 567137, "epoch": 6832} {"train_loss": -27.76927403369582, "global_step": 567138, "epoch": 6832, "val_loss": 6817744.0} {"train_loss": -27.538223266601562, "global_step": 567139, "epoch": 6833} {"train_loss": -27.495466232299805, "global_step": 567140, "epoch": 6833} {"train_loss": -27.55607032775879, "global_step": 567141, "epoch": 6833} {"train_loss": -27.565235137939453, "global_step": 567142, "epoch": 6833} {"train_loss": -27.326200485229492, "global_step": 567143, "epoch": 6833} {"train_loss": -27.618432998657227, "global_step": 567144, "epoch": 6833} {"train_loss": -27.2448673248291, "global_step": 567145, "epoch": 6833} {"train_loss": -26.910802841186523, "global_step": 567146, "epoch": 6833} {"train_loss": -27.709827423095703, "global_step": 567147, "epoch": 6833} {"train_loss": -27.735443115234375, "global_step": 567148, "epoch": 6833} {"train_loss": -27.38507652282715, "global_step": 567149, "epoch": 6833} {"train_loss": -27.636734008789062, "global_step": 567150, "epoch": 6833} {"train_loss": -27.152822494506836, "global_step": 567151, "epoch": 6833} {"train_loss": -27.52616310119629, "global_step": 567152, "epoch": 6833} {"train_loss": -27.755050659179688, "global_step": 567153, "epoch": 6833} {"train_loss": -27.657684326171875, "global_step": 567154, "epoch": 6833} {"train_loss": -27.90374755859375, "global_step": 567155, "epoch": 6833} {"train_loss": -27.35377311706543, "global_step": 567156, "epoch": 6833} {"train_loss": -27.77162742614746, "global_step": 567157, "epoch": 6833} {"train_loss": -27.357763290405273, "global_step": 567158, "epoch": 6833} {"train_loss": -27.893659591674805, "global_step": 567159, "epoch": 6833} {"train_loss": -27.763959884643555, "global_step": 567160, "epoch": 6833} {"train_loss": -27.680816650390625, "global_step": 567161, "epoch": 6833} {"train_loss": -27.828611373901367, "global_step": 567162, "epoch": 6833} {"train_loss": -27.779993057250977, "global_step": 567163, "epoch": 6833} {"train_loss": -27.849658966064453, "global_step": 567164, "epoch": 6833} {"train_loss": -27.944171905517578, "global_step": 567165, "epoch": 6833} {"train_loss": -28.0921573638916, "global_step": 567166, "epoch": 6833} {"train_loss": -27.565494537353516, "global_step": 567167, "epoch": 6833} {"train_loss": -27.6510009765625, "global_step": 567168, "epoch": 6833} {"train_loss": -28.113218307495117, "global_step": 567169, "epoch": 6833} {"train_loss": -27.9399356842041, "global_step": 567170, "epoch": 6833} {"train_loss": -27.830114364624023, "global_step": 567171, "epoch": 6833} {"train_loss": -27.55372428894043, "global_step": 567172, "epoch": 6833} {"train_loss": -27.892181396484375, "global_step": 567173, "epoch": 6833} {"train_loss": -27.69114112854004, "global_step": 567174, "epoch": 6833} {"train_loss": -27.8753662109375, "global_step": 567175, "epoch": 6833} {"train_loss": -27.755390167236328, "global_step": 567176, "epoch": 6833} {"train_loss": -27.598941802978516, "global_step": 567177, "epoch": 6833} {"train_loss": -27.61432456970215, "global_step": 567178, "epoch": 6833} {"train_loss": -27.85218620300293, "global_step": 567179, "epoch": 6833} {"train_loss": -27.827131271362305, "global_step": 567180, "epoch": 6833} {"train_loss": -27.477191925048828, "global_step": 567181, "epoch": 6833} {"train_loss": -28.076709747314453, "global_step": 567182, "epoch": 6833} {"train_loss": -27.823495864868164, "global_step": 567183, "epoch": 6833} {"train_loss": -27.9107723236084, "global_step": 567184, "epoch": 6833} {"train_loss": -27.91688346862793, "global_step": 567185, "epoch": 6833} {"train_loss": -27.916501998901367, "global_step": 567186, "epoch": 6833} {"train_loss": -27.837888717651367, "global_step": 567187, "epoch": 6833} {"train_loss": -27.866947174072266, "global_step": 567188, "epoch": 6833} {"train_loss": -27.6149845123291, "global_step": 567189, "epoch": 6833} {"train_loss": -28.0078125, "global_step": 567190, "epoch": 6833} {"train_loss": -27.825702667236328, "global_step": 567191, "epoch": 6833} {"train_loss": -27.734968185424805, "global_step": 567192, "epoch": 6833} {"train_loss": -27.917865753173828, "global_step": 567193, "epoch": 6833} {"train_loss": -27.572919845581055, "global_step": 567194, "epoch": 6833} {"train_loss": -28.060205459594727, "global_step": 567195, "epoch": 6833} {"train_loss": -27.94025993347168, "global_step": 567196, "epoch": 6833} {"train_loss": -28.04792594909668, "global_step": 567197, "epoch": 6833} {"train_loss": -27.82905387878418, "global_step": 567198, "epoch": 6833} {"train_loss": -28.075708389282227, "global_step": 567199, "epoch": 6833} {"train_loss": -27.656137466430664, "global_step": 567200, "epoch": 6833} {"train_loss": -27.691614151000977, "global_step": 567201, "epoch": 6833} {"train_loss": -27.839094161987305, "global_step": 567202, "epoch": 6833} {"train_loss": -27.431060791015625, "global_step": 567203, "epoch": 6833} {"train_loss": -27.873523712158203, "global_step": 567204, "epoch": 6833} {"train_loss": -27.365076065063477, "global_step": 567205, "epoch": 6833} {"train_loss": -27.861316680908203, "global_step": 567206, "epoch": 6833} {"train_loss": -28.04237174987793, "global_step": 567207, "epoch": 6833} {"train_loss": -28.06393814086914, "global_step": 567208, "epoch": 6833} {"train_loss": -27.670740127563477, "global_step": 567209, "epoch": 6833} {"train_loss": -28.08759880065918, "global_step": 567210, "epoch": 6833} {"train_loss": -27.666112899780273, "global_step": 567211, "epoch": 6833} {"train_loss": -28.092939376831055, "global_step": 567212, "epoch": 6833} {"train_loss": -27.745996475219727, "global_step": 567213, "epoch": 6833} {"train_loss": -27.916736602783203, "global_step": 567214, "epoch": 6833} {"train_loss": -28.394689559936523, "global_step": 567215, "epoch": 6833} {"train_loss": -28.0740909576416, "global_step": 567216, "epoch": 6833} {"train_loss": -27.813024520874023, "global_step": 567217, "epoch": 6833} {"train_loss": -27.749914169311523, "global_step": 567218, "epoch": 6833} {"train_loss": -28.057092666625977, "global_step": 567219, "epoch": 6833} {"train_loss": -27.502878189086914, "global_step": 567220, "epoch": 6833} {"train_loss": -27.730935383992023, "global_step": 567221, "epoch": 6833, "val_loss": 6807908.0} {"train_loss": -22.804946899414062, "global_step": 567222, "epoch": 6834} {"train_loss": -25.455759048461914, "global_step": 567223, "epoch": 6834} {"train_loss": -25.920129776000977, "global_step": 567224, "epoch": 6834} {"train_loss": -24.76032257080078, "global_step": 567225, "epoch": 6834} {"train_loss": -25.748218536376953, "global_step": 567226, "epoch": 6834} {"train_loss": -24.6865291595459, "global_step": 567227, "epoch": 6834} {"train_loss": -25.545700073242188, "global_step": 567228, "epoch": 6834} {"train_loss": -26.542531967163086, "global_step": 567229, "epoch": 6834} {"train_loss": -25.540403366088867, "global_step": 567230, "epoch": 6834} {"train_loss": -26.15106201171875, "global_step": 567231, "epoch": 6834} {"train_loss": -26.78597068786621, "global_step": 567232, "epoch": 6834} {"train_loss": -26.37837028503418, "global_step": 567233, "epoch": 6834} {"train_loss": -26.282575607299805, "global_step": 567234, "epoch": 6834} {"train_loss": -26.400564193725586, "global_step": 567235, "epoch": 6834} {"train_loss": -26.723957061767578, "global_step": 567236, "epoch": 6834} {"train_loss": -26.851037979125977, "global_step": 567237, "epoch": 6834} {"train_loss": -26.742725372314453, "global_step": 567238, "epoch": 6834} {"train_loss": -26.876001358032227, "global_step": 567239, "epoch": 6834} {"train_loss": -26.869312286376953, "global_step": 567240, "epoch": 6834} {"train_loss": -26.495819091796875, "global_step": 567241, "epoch": 6834} {"train_loss": -26.991485595703125, "global_step": 567242, "epoch": 6834} {"train_loss": -26.667638778686523, "global_step": 567243, "epoch": 6834} {"train_loss": -27.10614585876465, "global_step": 567244, "epoch": 6834} {"train_loss": -27.033355712890625, "global_step": 567245, "epoch": 6834} {"train_loss": -27.22568702697754, "global_step": 567246, "epoch": 6834} {"train_loss": -27.046483993530273, "global_step": 567247, "epoch": 6834} {"train_loss": -27.39100456237793, "global_step": 567248, "epoch": 6834} {"train_loss": -26.997486114501953, "global_step": 567249, "epoch": 6834} {"train_loss": -27.39463233947754, "global_step": 567250, "epoch": 6834} {"train_loss": -27.51953125, "global_step": 567251, "epoch": 6834} {"train_loss": -27.23722267150879, "global_step": 567252, "epoch": 6834} {"train_loss": -27.408782958984375, "global_step": 567253, "epoch": 6834} {"train_loss": -27.5622501373291, "global_step": 567254, "epoch": 6834} {"train_loss": -27.38942527770996, "global_step": 567255, "epoch": 6834} {"train_loss": -27.815759658813477, "global_step": 567256, "epoch": 6834} {"train_loss": -27.672998428344727, "global_step": 567257, "epoch": 6834} {"train_loss": -27.6675968170166, "global_step": 567258, "epoch": 6834} {"train_loss": -27.579547882080078, "global_step": 567259, "epoch": 6834} {"train_loss": -27.591068267822266, "global_step": 567260, "epoch": 6834} {"train_loss": -27.317792892456055, "global_step": 567261, "epoch": 6834} {"train_loss": -27.703332901000977, "global_step": 567262, "epoch": 6834} {"train_loss": -27.33920669555664, "global_step": 567263, "epoch": 6834} {"train_loss": -27.45550537109375, "global_step": 567264, "epoch": 6834} {"train_loss": -27.621570587158203, "global_step": 567265, "epoch": 6834} {"train_loss": -27.696805953979492, "global_step": 567266, "epoch": 6834} {"train_loss": -27.480329513549805, "global_step": 567267, "epoch": 6834} {"train_loss": -27.640018463134766, "global_step": 567268, "epoch": 6834} {"train_loss": -27.760883331298828, "global_step": 567269, "epoch": 6834} {"train_loss": -27.817798614501953, "global_step": 567270, "epoch": 6834} {"train_loss": -27.742298126220703, "global_step": 567271, "epoch": 6834} {"train_loss": -27.48026466369629, "global_step": 567272, "epoch": 6834} {"train_loss": -27.187061309814453, "global_step": 567273, "epoch": 6834} {"train_loss": -27.58447265625, "global_step": 567274, "epoch": 6834} {"train_loss": -27.751712799072266, "global_step": 567275, "epoch": 6834} {"train_loss": -27.58222007751465, "global_step": 567276, "epoch": 6834} {"train_loss": -27.678632736206055, "global_step": 567277, "epoch": 6834} {"train_loss": -27.626575469970703, "global_step": 567278, "epoch": 6834} {"train_loss": -27.128320693969727, "global_step": 567279, "epoch": 6834} {"train_loss": -27.150592803955078, "global_step": 567280, "epoch": 6834} {"train_loss": -27.072423934936523, "global_step": 567281, "epoch": 6834} {"train_loss": -26.76483154296875, "global_step": 567282, "epoch": 6834} {"train_loss": -27.608291625976562, "global_step": 567283, "epoch": 6834} {"train_loss": -27.748571395874023, "global_step": 567284, "epoch": 6834} {"train_loss": -27.176441192626953, "global_step": 567285, "epoch": 6834} {"train_loss": -27.168243408203125, "global_step": 567286, "epoch": 6834} {"train_loss": -27.621051788330078, "global_step": 567287, "epoch": 6834} {"train_loss": -27.84950828552246, "global_step": 567288, "epoch": 6834} {"train_loss": -27.893817901611328, "global_step": 567289, "epoch": 6834} {"train_loss": -27.814178466796875, "global_step": 567290, "epoch": 6834} {"train_loss": -27.503137588500977, "global_step": 567291, "epoch": 6834} {"train_loss": -27.520090103149414, "global_step": 567292, "epoch": 6834} {"train_loss": -27.48419761657715, "global_step": 567293, "epoch": 6834} {"train_loss": -28.21079444885254, "global_step": 567294, "epoch": 6834} {"train_loss": -27.270160675048828, "global_step": 567295, "epoch": 6834} {"train_loss": -27.6513614654541, "global_step": 567296, "epoch": 6834} {"train_loss": -27.413511276245117, "global_step": 567297, "epoch": 6834} {"train_loss": -27.563262939453125, "global_step": 567298, "epoch": 6834} {"train_loss": -27.469160079956055, "global_step": 567299, "epoch": 6834} {"train_loss": -28.06007194519043, "global_step": 567300, "epoch": 6834} {"train_loss": -27.67254066467285, "global_step": 567301, "epoch": 6834} {"train_loss": -27.781085968017578, "global_step": 567302, "epoch": 6834} {"train_loss": -27.840240478515625, "global_step": 567303, "epoch": 6834} {"train_loss": -27.139601650008235, "global_step": 567304, "epoch": 6834, "val_loss": 6869817.0} {"train_loss": -27.26324462890625, "global_step": 567305, "epoch": 6835} {"train_loss": -27.62408447265625, "global_step": 567306, "epoch": 6835} {"train_loss": -27.110443115234375, "global_step": 567307, "epoch": 6835} {"train_loss": -27.275787353515625, "global_step": 567308, "epoch": 6835} {"train_loss": -27.047452926635742, "global_step": 567309, "epoch": 6835} {"train_loss": -27.456098556518555, "global_step": 567310, "epoch": 6835} {"train_loss": -27.520050048828125, "global_step": 567311, "epoch": 6835} {"train_loss": -26.900604248046875, "global_step": 567312, "epoch": 6835} {"train_loss": -27.176013946533203, "global_step": 567313, "epoch": 6835} {"train_loss": -27.83975601196289, "global_step": 567314, "epoch": 6835} {"train_loss": -27.193078994750977, "global_step": 567315, "epoch": 6835} {"train_loss": -27.4589900970459, "global_step": 567316, "epoch": 6835} {"train_loss": -27.709247589111328, "global_step": 567317, "epoch": 6835} {"train_loss": -27.6127872467041, "global_step": 567318, "epoch": 6835} {"train_loss": -27.46038246154785, "global_step": 567319, "epoch": 6835} {"train_loss": -27.595672607421875, "global_step": 567320, "epoch": 6835} {"train_loss": -27.649383544921875, "global_step": 567321, "epoch": 6835} {"train_loss": -28.09309196472168, "global_step": 567322, "epoch": 6835} {"train_loss": -27.492918014526367, "global_step": 567323, "epoch": 6835} {"train_loss": -27.35719871520996, "global_step": 567324, "epoch": 6835} {"train_loss": -27.698165893554688, "global_step": 567325, "epoch": 6835} {"train_loss": -27.703022003173828, "global_step": 567326, "epoch": 6835} {"train_loss": -27.766332626342773, "global_step": 567327, "epoch": 6835} {"train_loss": -28.035207748413086, "global_step": 567328, "epoch": 6835} {"train_loss": -27.369802474975586, "global_step": 567329, "epoch": 6835} {"train_loss": -27.8620662689209, "global_step": 567330, "epoch": 6835} {"train_loss": -27.8461971282959, "global_step": 567331, "epoch": 6835} {"train_loss": -27.8023624420166, "global_step": 567332, "epoch": 6835} {"train_loss": -28.19074058532715, "global_step": 567333, "epoch": 6835} {"train_loss": -28.199115753173828, "global_step": 567334, "epoch": 6835} {"train_loss": -28.074050903320312, "global_step": 567335, "epoch": 6835} {"train_loss": -27.8684139251709, "global_step": 567336, "epoch": 6835} {"train_loss": -27.986698150634766, "global_step": 567337, "epoch": 6835} {"train_loss": -28.033828735351562, "global_step": 567338, "epoch": 6835} {"train_loss": -27.632293701171875, "global_step": 567339, "epoch": 6835} {"train_loss": -27.425521850585938, "global_step": 567340, "epoch": 6835} {"train_loss": -27.70857048034668, "global_step": 567341, "epoch": 6835} {"train_loss": -28.16281509399414, "global_step": 567342, "epoch": 6835} {"train_loss": -27.90925407409668, "global_step": 567343, "epoch": 6835} {"train_loss": -27.58045768737793, "global_step": 567344, "epoch": 6835} {"train_loss": -28.060302734375, "global_step": 567345, "epoch": 6835} {"train_loss": -28.022031784057617, "global_step": 567346, "epoch": 6835} {"train_loss": -28.075794219970703, "global_step": 567347, "epoch": 6835} {"train_loss": -27.701330184936523, "global_step": 567348, "epoch": 6835} {"train_loss": -28.09043312072754, "global_step": 567349, "epoch": 6835} {"train_loss": -27.537738800048828, "global_step": 567350, "epoch": 6835} {"train_loss": -28.204334259033203, "global_step": 567351, "epoch": 6835} {"train_loss": -28.15467643737793, "global_step": 567352, "epoch": 6835} {"train_loss": -27.702722549438477, "global_step": 567353, "epoch": 6835} {"train_loss": -28.015329360961914, "global_step": 567354, "epoch": 6835} {"train_loss": -28.0092716217041, "global_step": 567355, "epoch": 6835} {"train_loss": -27.95589256286621, "global_step": 567356, "epoch": 6835} {"train_loss": -27.821157455444336, "global_step": 567357, "epoch": 6835} {"train_loss": -27.980676651000977, "global_step": 567358, "epoch": 6835} {"train_loss": -27.130033493041992, "global_step": 567359, "epoch": 6835} {"train_loss": -27.5098876953125, "global_step": 567360, "epoch": 6835} {"train_loss": -27.207992553710938, "global_step": 567361, "epoch": 6835} {"train_loss": -27.98312759399414, "global_step": 567362, "epoch": 6835} {"train_loss": -27.8950252532959, "global_step": 567363, "epoch": 6835} {"train_loss": -27.4160213470459, "global_step": 567364, "epoch": 6835} {"train_loss": -27.65456199645996, "global_step": 567365, "epoch": 6835} {"train_loss": -27.88587760925293, "global_step": 567366, "epoch": 6835} {"train_loss": -27.796966552734375, "global_step": 567367, "epoch": 6835} {"train_loss": -27.48187828063965, "global_step": 567368, "epoch": 6835} {"train_loss": -27.372608184814453, "global_step": 567369, "epoch": 6835} {"train_loss": -27.741601943969727, "global_step": 567370, "epoch": 6835} {"train_loss": -27.82610511779785, "global_step": 567371, "epoch": 6835} {"train_loss": -27.738500595092773, "global_step": 567372, "epoch": 6835} {"train_loss": -27.97369384765625, "global_step": 567373, "epoch": 6835} {"train_loss": -27.74525260925293, "global_step": 567374, "epoch": 6835} {"train_loss": -27.734975814819336, "global_step": 567375, "epoch": 6835} {"train_loss": -28.138525009155273, "global_step": 567376, "epoch": 6835} {"train_loss": -28.039142608642578, "global_step": 567377, "epoch": 6835} {"train_loss": -27.895965576171875, "global_step": 567378, "epoch": 6835} {"train_loss": -28.00819969177246, "global_step": 567379, "epoch": 6835} {"train_loss": -28.1187686920166, "global_step": 567380, "epoch": 6835} {"train_loss": -27.698949813842773, "global_step": 567381, "epoch": 6835} {"train_loss": -27.848743438720703, "global_step": 567382, "epoch": 6835} {"train_loss": -27.671497344970703, "global_step": 567383, "epoch": 6835} {"train_loss": -28.283447265625, "global_step": 567384, "epoch": 6835} {"train_loss": -27.823932647705078, "global_step": 567385, "epoch": 6835} {"train_loss": -27.888517379760742, "global_step": 567386, "epoch": 6835} {"train_loss": -27.74293469808188, "global_step": 567387, "epoch": 6835, "val_loss": 6836902.5} {"train_loss": -27.5842342376709, "global_step": 567388, "epoch": 6836} {"train_loss": -27.065673828125, "global_step": 567389, "epoch": 6836} {"train_loss": -27.51812744140625, "global_step": 567390, "epoch": 6836} {"train_loss": -27.8521785736084, "global_step": 567391, "epoch": 6836} {"train_loss": -27.496082305908203, "global_step": 567392, "epoch": 6836} {"train_loss": -27.602994918823242, "global_step": 567393, "epoch": 6836} {"train_loss": -27.64068603515625, "global_step": 567394, "epoch": 6836} {"train_loss": -27.894372940063477, "global_step": 567395, "epoch": 6836} {"train_loss": -27.5106143951416, "global_step": 567396, "epoch": 6836} {"train_loss": -27.826904296875, "global_step": 567397, "epoch": 6836} {"train_loss": -27.70265007019043, "global_step": 567398, "epoch": 6836} {"train_loss": -27.366500854492188, "global_step": 567399, "epoch": 6836} {"train_loss": -27.677377700805664, "global_step": 567400, "epoch": 6836} {"train_loss": -27.80030632019043, "global_step": 567401, "epoch": 6836} {"train_loss": -27.390430450439453, "global_step": 567402, "epoch": 6836} {"train_loss": -27.501956939697266, "global_step": 567403, "epoch": 6836} {"train_loss": -27.812992095947266, "global_step": 567404, "epoch": 6836} {"train_loss": -27.589649200439453, "global_step": 567405, "epoch": 6836} {"train_loss": -27.6994686126709, "global_step": 567406, "epoch": 6836} {"train_loss": -27.2385196685791, "global_step": 567407, "epoch": 6836} {"train_loss": -28.052921295166016, "global_step": 567408, "epoch": 6836} {"train_loss": -27.752225875854492, "global_step": 567409, "epoch": 6836} {"train_loss": -27.667072296142578, "global_step": 567410, "epoch": 6836} {"train_loss": -27.986356735229492, "global_step": 567411, "epoch": 6836} {"train_loss": -27.676700592041016, "global_step": 567412, "epoch": 6836} {"train_loss": -27.835357666015625, "global_step": 567413, "epoch": 6836} {"train_loss": -27.656579971313477, "global_step": 567414, "epoch": 6836} {"train_loss": -27.74249267578125, "global_step": 567415, "epoch": 6836} {"train_loss": -27.743640899658203, "global_step": 567416, "epoch": 6836} {"train_loss": -27.793394088745117, "global_step": 567417, "epoch": 6836} {"train_loss": -27.66485595703125, "global_step": 567418, "epoch": 6836} {"train_loss": -27.492963790893555, "global_step": 567419, "epoch": 6836} {"train_loss": -27.93829917907715, "global_step": 567420, "epoch": 6836} {"train_loss": -27.486953735351562, "global_step": 567421, "epoch": 6836} {"train_loss": -28.188398361206055, "global_step": 567422, "epoch": 6836} {"train_loss": -27.727102279663086, "global_step": 567423, "epoch": 6836} {"train_loss": -28.193256378173828, "global_step": 567424, "epoch": 6836} {"train_loss": -28.098602294921875, "global_step": 567425, "epoch": 6836} {"train_loss": -27.989242553710938, "global_step": 567426, "epoch": 6836} {"train_loss": -27.57828712463379, "global_step": 567427, "epoch": 6836} {"train_loss": -27.732166290283203, "global_step": 567428, "epoch": 6836} {"train_loss": -27.94869041442871, "global_step": 567429, "epoch": 6836} {"train_loss": -28.184741973876953, "global_step": 567430, "epoch": 6836} {"train_loss": -27.84136962890625, "global_step": 567431, "epoch": 6836} {"train_loss": -28.09114646911621, "global_step": 567432, "epoch": 6836} {"train_loss": -27.963943481445312, "global_step": 567433, "epoch": 6836} {"train_loss": -27.847402572631836, "global_step": 567434, "epoch": 6836} {"train_loss": -27.69068717956543, "global_step": 567435, "epoch": 6836} {"train_loss": -27.892486572265625, "global_step": 567436, "epoch": 6836} {"train_loss": -28.265501022338867, "global_step": 567437, "epoch": 6836} {"train_loss": -27.93082618713379, "global_step": 567438, "epoch": 6836} {"train_loss": -27.77326774597168, "global_step": 567439, "epoch": 6836} {"train_loss": -27.996671676635742, "global_step": 567440, "epoch": 6836} {"train_loss": -27.735437393188477, "global_step": 567441, "epoch": 6836} {"train_loss": -27.92963981628418, "global_step": 567442, "epoch": 6836} {"train_loss": -27.904733657836914, "global_step": 567443, "epoch": 6836} {"train_loss": -27.903656005859375, "global_step": 567444, "epoch": 6836} {"train_loss": -28.077112197875977, "global_step": 567445, "epoch": 6836} {"train_loss": -28.013248443603516, "global_step": 567446, "epoch": 6836} {"train_loss": -27.77543067932129, "global_step": 567447, "epoch": 6836} {"train_loss": -28.023792266845703, "global_step": 567448, "epoch": 6836} {"train_loss": -27.702314376831055, "global_step": 567449, "epoch": 6836} {"train_loss": -27.94659996032715, "global_step": 567450, "epoch": 6836} {"train_loss": -27.910505294799805, "global_step": 567451, "epoch": 6836} {"train_loss": -27.77225112915039, "global_step": 567452, "epoch": 6836} {"train_loss": -28.30982780456543, "global_step": 567453, "epoch": 6836} {"train_loss": -28.1793212890625, "global_step": 567454, "epoch": 6836} {"train_loss": -28.2640438079834, "global_step": 567455, "epoch": 6836} {"train_loss": -28.190656661987305, "global_step": 567456, "epoch": 6836} {"train_loss": -28.015356063842773, "global_step": 567457, "epoch": 6836} {"train_loss": -28.130146026611328, "global_step": 567458, "epoch": 6836} {"train_loss": -27.904926300048828, "global_step": 567459, "epoch": 6836} {"train_loss": -27.95488929748535, "global_step": 567460, "epoch": 6836} {"train_loss": -27.821020126342773, "global_step": 567461, "epoch": 6836} {"train_loss": -27.39876365661621, "global_step": 567462, "epoch": 6836} {"train_loss": -27.231143951416016, "global_step": 567463, "epoch": 6836} {"train_loss": -26.811054229736328, "global_step": 567464, "epoch": 6836} {"train_loss": -25.928436279296875, "global_step": 567465, "epoch": 6836} {"train_loss": -26.527475357055664, "global_step": 567466, "epoch": 6836} {"train_loss": -27.345733642578125, "global_step": 567467, "epoch": 6836} {"train_loss": -27.544818878173828, "global_step": 567468, "epoch": 6836} {"train_loss": -26.616727828979492, "global_step": 567469, "epoch": 6836} {"train_loss": -27.732992195221314, "global_step": 567470, "epoch": 6836, "val_loss": 6858627.0} {"train_loss": -26.364459991455078, "global_step": 567471, "epoch": 6837} {"train_loss": -26.96713638305664, "global_step": 567472, "epoch": 6837} {"train_loss": -27.32390785217285, "global_step": 567473, "epoch": 6837} {"train_loss": -26.585046768188477, "global_step": 567474, "epoch": 6837} {"train_loss": -26.92921257019043, "global_step": 567475, "epoch": 6837} {"train_loss": -26.347253799438477, "global_step": 567476, "epoch": 6837} {"train_loss": -27.20806312561035, "global_step": 567477, "epoch": 6837} {"train_loss": -26.448474884033203, "global_step": 567478, "epoch": 6837} {"train_loss": -27.476964950561523, "global_step": 567479, "epoch": 6837} {"train_loss": -26.92510986328125, "global_step": 567480, "epoch": 6837} {"train_loss": -27.422195434570312, "global_step": 567481, "epoch": 6837} {"train_loss": -27.07293128967285, "global_step": 567482, "epoch": 6837} {"train_loss": -26.722461700439453, "global_step": 567483, "epoch": 6837} {"train_loss": -27.158788681030273, "global_step": 567484, "epoch": 6837} {"train_loss": -27.197174072265625, "global_step": 567485, "epoch": 6837} {"train_loss": -27.072860717773438, "global_step": 567486, "epoch": 6837} {"train_loss": -27.37774658203125, "global_step": 567487, "epoch": 6837} {"train_loss": -27.526411056518555, "global_step": 567488, "epoch": 6837} {"train_loss": -27.364831924438477, "global_step": 567489, "epoch": 6837} {"train_loss": -26.99379539489746, "global_step": 567490, "epoch": 6837} {"train_loss": -27.634714126586914, "global_step": 567491, "epoch": 6837} {"train_loss": -27.181976318359375, "global_step": 567492, "epoch": 6837} {"train_loss": -27.283533096313477, "global_step": 567493, "epoch": 6837} {"train_loss": -27.32083511352539, "global_step": 567494, "epoch": 6837} {"train_loss": -27.651538848876953, "global_step": 567495, "epoch": 6837} {"train_loss": -27.763870239257812, "global_step": 567496, "epoch": 6837} {"train_loss": -27.401899337768555, "global_step": 567497, "epoch": 6837} {"train_loss": -27.82137107849121, "global_step": 567498, "epoch": 6837} {"train_loss": -27.62456703186035, "global_step": 567499, "epoch": 6837} {"train_loss": -27.504255294799805, "global_step": 567500, "epoch": 6837} {"train_loss": -27.631921768188477, "global_step": 567501, "epoch": 6837} {"train_loss": -27.82568359375, "global_step": 567502, "epoch": 6837} {"train_loss": -27.73356056213379, "global_step": 567503, "epoch": 6837} {"train_loss": -27.862470626831055, "global_step": 567504, "epoch": 6837} {"train_loss": -27.426624298095703, "global_step": 567505, "epoch": 6837} {"train_loss": -27.59272575378418, "global_step": 567506, "epoch": 6837} {"train_loss": -27.761428833007812, "global_step": 567507, "epoch": 6837} {"train_loss": -27.40394401550293, "global_step": 567508, "epoch": 6837} {"train_loss": -27.938886642456055, "global_step": 567509, "epoch": 6837} {"train_loss": -27.960844039916992, "global_step": 567510, "epoch": 6837} {"train_loss": -27.604907989501953, "global_step": 567511, "epoch": 6837} {"train_loss": -27.805938720703125, "global_step": 567512, "epoch": 6837} {"train_loss": -27.843713760375977, "global_step": 567513, "epoch": 6837} {"train_loss": -27.90717124938965, "global_step": 567514, "epoch": 6837} {"train_loss": -27.74171257019043, "global_step": 567515, "epoch": 6837} {"train_loss": -27.860971450805664, "global_step": 567516, "epoch": 6837} {"train_loss": -28.03555679321289, "global_step": 567517, "epoch": 6837} {"train_loss": -27.94087028503418, "global_step": 567518, "epoch": 6837} {"train_loss": -28.198822021484375, "global_step": 567519, "epoch": 6837} {"train_loss": -27.97041893005371, "global_step": 567520, "epoch": 6837} {"train_loss": -28.048429489135742, "global_step": 567521, "epoch": 6837} {"train_loss": -27.839033126831055, "global_step": 567522, "epoch": 6837} {"train_loss": -28.187702178955078, "global_step": 567523, "epoch": 6837} {"train_loss": -28.058948516845703, "global_step": 567524, "epoch": 6837} {"train_loss": -27.912616729736328, "global_step": 567525, "epoch": 6837} {"train_loss": -28.323062896728516, "global_step": 567526, "epoch": 6837} {"train_loss": -27.959842681884766, "global_step": 567527, "epoch": 6837} {"train_loss": -28.067413330078125, "global_step": 567528, "epoch": 6837} {"train_loss": -27.981428146362305, "global_step": 567529, "epoch": 6837} {"train_loss": -28.142908096313477, "global_step": 567530, "epoch": 6837} {"train_loss": -27.56378173828125, "global_step": 567531, "epoch": 6837} {"train_loss": -28.19758415222168, "global_step": 567532, "epoch": 6837} {"train_loss": -27.785343170166016, "global_step": 567533, "epoch": 6837} {"train_loss": -27.951169967651367, "global_step": 567534, "epoch": 6837} {"train_loss": -28.113754272460938, "global_step": 567535, "epoch": 6837} {"train_loss": -27.689558029174805, "global_step": 567536, "epoch": 6837} {"train_loss": -27.974353790283203, "global_step": 567537, "epoch": 6837} {"train_loss": -27.891149520874023, "global_step": 567538, "epoch": 6837} {"train_loss": -27.92658042907715, "global_step": 567539, "epoch": 6837} {"train_loss": -28.61433219909668, "global_step": 567540, "epoch": 6837} {"train_loss": -27.629369735717773, "global_step": 567541, "epoch": 6837} {"train_loss": -28.139860153198242, "global_step": 567542, "epoch": 6837} {"train_loss": -28.032705307006836, "global_step": 567543, "epoch": 6837} {"train_loss": -27.9894962310791, "global_step": 567544, "epoch": 6837} {"train_loss": -28.27695655822754, "global_step": 567545, "epoch": 6837} {"train_loss": -27.96189308166504, "global_step": 567546, "epoch": 6837} {"train_loss": -28.27886962890625, "global_step": 567547, "epoch": 6837} {"train_loss": -27.981000900268555, "global_step": 567548, "epoch": 6837} {"train_loss": -28.072839736938477, "global_step": 567549, "epoch": 6837} {"train_loss": -27.945234298706055, "global_step": 567550, "epoch": 6837} {"train_loss": -27.757715225219727, "global_step": 567551, "epoch": 6837} {"train_loss": -28.10861587524414, "global_step": 567552, "epoch": 6837} {"train_loss": -27.64273131037333, "global_step": 567553, "epoch": 6837, "val_loss": 6863146.0} {"train_loss": -27.771459579467773, "global_step": 567554, "epoch": 6838} {"train_loss": -27.875659942626953, "global_step": 567555, "epoch": 6838} {"train_loss": -28.005002975463867, "global_step": 567556, "epoch": 6838} {"train_loss": -27.868732452392578, "global_step": 567557, "epoch": 6838} {"train_loss": -27.86343765258789, "global_step": 567558, "epoch": 6838} {"train_loss": -27.299238204956055, "global_step": 567559, "epoch": 6838} {"train_loss": -27.744428634643555, "global_step": 567560, "epoch": 6838} {"train_loss": -27.913755416870117, "global_step": 567561, "epoch": 6838} {"train_loss": -27.0887508392334, "global_step": 567562, "epoch": 6838} {"train_loss": -27.351612091064453, "global_step": 567563, "epoch": 6838} {"train_loss": -27.81011390686035, "global_step": 567564, "epoch": 6838} {"train_loss": -27.546518325805664, "global_step": 567565, "epoch": 6838} {"train_loss": -27.43391990661621, "global_step": 567566, "epoch": 6838} {"train_loss": -28.060077667236328, "global_step": 567567, "epoch": 6838} {"train_loss": -27.403335571289062, "global_step": 567568, "epoch": 6838} {"train_loss": -28.189441680908203, "global_step": 567569, "epoch": 6838} {"train_loss": -27.335790634155273, "global_step": 567570, "epoch": 6838} {"train_loss": -27.80010986328125, "global_step": 567571, "epoch": 6838} {"train_loss": -27.26984977722168, "global_step": 567572, "epoch": 6838} {"train_loss": -27.97574806213379, "global_step": 567573, "epoch": 6838} {"train_loss": -28.066495895385742, "global_step": 567574, "epoch": 6838} {"train_loss": -27.565113067626953, "global_step": 567575, "epoch": 6838} {"train_loss": -27.73565673828125, "global_step": 567576, "epoch": 6838} {"train_loss": -27.630924224853516, "global_step": 567577, "epoch": 6838} {"train_loss": -27.714521408081055, "global_step": 567578, "epoch": 6838} {"train_loss": -27.7576847076416, "global_step": 567579, "epoch": 6838} {"train_loss": -27.988235473632812, "global_step": 567580, "epoch": 6838} {"train_loss": -27.501758575439453, "global_step": 567581, "epoch": 6838} {"train_loss": -27.698598861694336, "global_step": 567582, "epoch": 6838} {"train_loss": -27.609649658203125, "global_step": 567583, "epoch": 6838} {"train_loss": -27.4254093170166, "global_step": 567584, "epoch": 6838} {"train_loss": -27.555883407592773, "global_step": 567585, "epoch": 6838} {"train_loss": -28.30402183532715, "global_step": 567586, "epoch": 6838} {"train_loss": -28.039716720581055, "global_step": 567587, "epoch": 6838} {"train_loss": -27.69207763671875, "global_step": 567588, "epoch": 6838} {"train_loss": -27.84566307067871, "global_step": 567589, "epoch": 6838} {"train_loss": -27.96577262878418, "global_step": 567590, "epoch": 6838} {"train_loss": -27.9025936126709, "global_step": 567591, "epoch": 6838} {"train_loss": -28.159162521362305, "global_step": 567592, "epoch": 6838} {"train_loss": -27.99383544921875, "global_step": 567593, "epoch": 6838} {"train_loss": -27.94173240661621, "global_step": 567594, "epoch": 6838} {"train_loss": -28.286422729492188, "global_step": 567595, "epoch": 6838} {"train_loss": -28.26409912109375, "global_step": 567596, "epoch": 6838} {"train_loss": -27.785627365112305, "global_step": 567597, "epoch": 6838} {"train_loss": -27.651824951171875, "global_step": 567598, "epoch": 6838} {"train_loss": -27.689443588256836, "global_step": 567599, "epoch": 6838} {"train_loss": -28.155054092407227, "global_step": 567600, "epoch": 6838} {"train_loss": -27.9948787689209, "global_step": 567601, "epoch": 6838} {"train_loss": -27.94544792175293, "global_step": 567602, "epoch": 6838} {"train_loss": -27.821887969970703, "global_step": 567603, "epoch": 6838} {"train_loss": -28.03731346130371, "global_step": 567604, "epoch": 6838} {"train_loss": -27.83563804626465, "global_step": 567605, "epoch": 6838} {"train_loss": -27.846899032592773, "global_step": 567606, "epoch": 6838} {"train_loss": -27.77536392211914, "global_step": 567607, "epoch": 6838} {"train_loss": -27.77374839782715, "global_step": 567608, "epoch": 6838} {"train_loss": -28.029346466064453, "global_step": 567609, "epoch": 6838} {"train_loss": -27.83674430847168, "global_step": 567610, "epoch": 6838} {"train_loss": -27.501953125, "global_step": 567611, "epoch": 6838} {"train_loss": -27.744293212890625, "global_step": 567612, "epoch": 6838} {"train_loss": -27.860218048095703, "global_step": 567613, "epoch": 6838} {"train_loss": -28.248828887939453, "global_step": 567614, "epoch": 6838} {"train_loss": -27.934284210205078, "global_step": 567615, "epoch": 6838} {"train_loss": -27.776777267456055, "global_step": 567616, "epoch": 6838} {"train_loss": -27.8272762298584, "global_step": 567617, "epoch": 6838} {"train_loss": -27.8922119140625, "global_step": 567618, "epoch": 6838} {"train_loss": -27.579313278198242, "global_step": 567619, "epoch": 6838} {"train_loss": -28.1129093170166, "global_step": 567620, "epoch": 6838} {"train_loss": -27.78633689880371, "global_step": 567621, "epoch": 6838} {"train_loss": -27.99224281311035, "global_step": 567622, "epoch": 6838} {"train_loss": -27.857030868530273, "global_step": 567623, "epoch": 6838} {"train_loss": -28.14324951171875, "global_step": 567624, "epoch": 6838} {"train_loss": -27.557788848876953, "global_step": 567625, "epoch": 6838} {"train_loss": -27.681432723999023, "global_step": 567626, "epoch": 6838} {"train_loss": -27.653949737548828, "global_step": 567627, "epoch": 6838} {"train_loss": -27.996490478515625, "global_step": 567628, "epoch": 6838} {"train_loss": -27.75042724609375, "global_step": 567629, "epoch": 6838} {"train_loss": -27.598737716674805, "global_step": 567630, "epoch": 6838} {"train_loss": -27.198017120361328, "global_step": 567631, "epoch": 6838} {"train_loss": -27.978490829467773, "global_step": 567632, "epoch": 6838} {"train_loss": -27.71424674987793, "global_step": 567633, "epoch": 6838} {"train_loss": -28.110212326049805, "global_step": 567634, "epoch": 6838} {"train_loss": -27.595645904541016, "global_step": 567635, "epoch": 6838} {"train_loss": -27.798125025737715, "global_step": 567636, "epoch": 6838, "val_loss": 6870075.0} {"train_loss": -26.936908721923828, "global_step": 567637, "epoch": 6839} {"train_loss": -27.631494522094727, "global_step": 567638, "epoch": 6839} {"train_loss": -26.842548370361328, "global_step": 567639, "epoch": 6839} {"train_loss": -27.166717529296875, "global_step": 567640, "epoch": 6839} {"train_loss": -27.071949005126953, "global_step": 567641, "epoch": 6839} {"train_loss": -26.741931915283203, "global_step": 567642, "epoch": 6839} {"train_loss": -27.292667388916016, "global_step": 567643, "epoch": 6839} {"train_loss": -26.839269638061523, "global_step": 567644, "epoch": 6839} {"train_loss": -27.320035934448242, "global_step": 567645, "epoch": 6839} {"train_loss": -27.003021240234375, "global_step": 567646, "epoch": 6839} {"train_loss": -27.379240036010742, "global_step": 567647, "epoch": 6839} {"train_loss": -27.159534454345703, "global_step": 567648, "epoch": 6839} {"train_loss": -27.058801651000977, "global_step": 567649, "epoch": 6839} {"train_loss": -27.255605697631836, "global_step": 567650, "epoch": 6839} {"train_loss": -27.43474769592285, "global_step": 567651, "epoch": 6839} {"train_loss": -27.3074951171875, "global_step": 567652, "epoch": 6839} {"train_loss": -27.08554458618164, "global_step": 567653, "epoch": 6839} {"train_loss": -27.382604598999023, "global_step": 567654, "epoch": 6839} {"train_loss": -27.154205322265625, "global_step": 567655, "epoch": 6839} {"train_loss": -26.807348251342773, "global_step": 567656, "epoch": 6839} {"train_loss": -27.749231338500977, "global_step": 567657, "epoch": 6839} {"train_loss": -27.01239585876465, "global_step": 567658, "epoch": 6839} {"train_loss": -27.65630531311035, "global_step": 567659, "epoch": 6839} {"train_loss": -27.973188400268555, "global_step": 567660, "epoch": 6839} {"train_loss": -27.41224479675293, "global_step": 567661, "epoch": 6839} {"train_loss": -27.526098251342773, "global_step": 567662, "epoch": 6839} {"train_loss": -27.59712028503418, "global_step": 567663, "epoch": 6839} {"train_loss": -27.32325553894043, "global_step": 567664, "epoch": 6839} {"train_loss": -28.134252548217773, "global_step": 567665, "epoch": 6839} {"train_loss": -27.440454483032227, "global_step": 567666, "epoch": 6839} {"train_loss": -27.707624435424805, "global_step": 567667, "epoch": 6839} {"train_loss": -27.6986083984375, "global_step": 567668, "epoch": 6839} {"train_loss": -27.99818992614746, "global_step": 567669, "epoch": 6839} {"train_loss": -27.844018936157227, "global_step": 567670, "epoch": 6839} {"train_loss": -27.783430099487305, "global_step": 567671, "epoch": 6839} {"train_loss": -27.80853271484375, "global_step": 567672, "epoch": 6839} {"train_loss": -27.552377700805664, "global_step": 567673, "epoch": 6839} {"train_loss": -27.6232967376709, "global_step": 567674, "epoch": 6839} {"train_loss": -28.22800636291504, "global_step": 567675, "epoch": 6839} {"train_loss": -27.5463809967041, "global_step": 567676, "epoch": 6839} {"train_loss": -27.72234535217285, "global_step": 567677, "epoch": 6839} {"train_loss": -27.7901668548584, "global_step": 567678, "epoch": 6839} {"train_loss": -27.435836791992188, "global_step": 567679, "epoch": 6839} {"train_loss": -28.106475830078125, "global_step": 567680, "epoch": 6839} {"train_loss": -27.569976806640625, "global_step": 567681, "epoch": 6839} {"train_loss": -27.912012100219727, "global_step": 567682, "epoch": 6839} {"train_loss": -27.736921310424805, "global_step": 567683, "epoch": 6839} {"train_loss": -27.6761531829834, "global_step": 567684, "epoch": 6839} {"train_loss": -27.837162017822266, "global_step": 567685, "epoch": 6839} {"train_loss": -27.797119140625, "global_step": 567686, "epoch": 6839} {"train_loss": -27.51704216003418, "global_step": 567687, "epoch": 6839} {"train_loss": -27.663007736206055, "global_step": 567688, "epoch": 6839} {"train_loss": -27.760278701782227, "global_step": 567689, "epoch": 6839} {"train_loss": -28.144208908081055, "global_step": 567690, "epoch": 6839} {"train_loss": -27.70185661315918, "global_step": 567691, "epoch": 6839} {"train_loss": -28.06104850769043, "global_step": 567692, "epoch": 6839} {"train_loss": -27.897003173828125, "global_step": 567693, "epoch": 6839} {"train_loss": -28.13154411315918, "global_step": 567694, "epoch": 6839} {"train_loss": -27.903961181640625, "global_step": 567695, "epoch": 6839} {"train_loss": -27.868494033813477, "global_step": 567696, "epoch": 6839} {"train_loss": -28.169580459594727, "global_step": 567697, "epoch": 6839} {"train_loss": -28.17371940612793, "global_step": 567698, "epoch": 6839} {"train_loss": -28.065526962280273, "global_step": 567699, "epoch": 6839} {"train_loss": -27.627180099487305, "global_step": 567700, "epoch": 6839} {"train_loss": -27.675186157226562, "global_step": 567701, "epoch": 6839} {"train_loss": -28.044897079467773, "global_step": 567702, "epoch": 6839} {"train_loss": -27.86799430847168, "global_step": 567703, "epoch": 6839} {"train_loss": -28.106647491455078, "global_step": 567704, "epoch": 6839} {"train_loss": -27.732641220092773, "global_step": 567705, "epoch": 6839} {"train_loss": -27.83466911315918, "global_step": 567706, "epoch": 6839} {"train_loss": -27.828405380249023, "global_step": 567707, "epoch": 6839} {"train_loss": -27.64003562927246, "global_step": 567708, "epoch": 6839} {"train_loss": -27.86737060546875, "global_step": 567709, "epoch": 6839} {"train_loss": -28.078855514526367, "global_step": 567710, "epoch": 6839} {"train_loss": -28.22247886657715, "global_step": 567711, "epoch": 6839} {"train_loss": -27.81776237487793, "global_step": 567712, "epoch": 6839} {"train_loss": -27.644765853881836, "global_step": 567713, "epoch": 6839} {"train_loss": -27.99079704284668, "global_step": 567714, "epoch": 6839} {"train_loss": -28.12849235534668, "global_step": 567715, "epoch": 6839} {"train_loss": -27.9127140045166, "global_step": 567716, "epoch": 6839} {"train_loss": -27.892013549804688, "global_step": 567717, "epoch": 6839} {"train_loss": -27.64727210998535, "global_step": 567718, "epoch": 6839} {"train_loss": -27.6403986229954, "global_step": 567719, "epoch": 6839, "val_loss": 6822117.5} {"train_loss": -27.431018829345703, "global_step": 567720, "epoch": 6840} {"train_loss": -26.444055557250977, "global_step": 567721, "epoch": 6840} {"train_loss": -26.463748931884766, "global_step": 567722, "epoch": 6840} {"train_loss": -27.2716064453125, "global_step": 567723, "epoch": 6840} {"train_loss": -26.588470458984375, "global_step": 567724, "epoch": 6840} {"train_loss": -26.604755401611328, "global_step": 567725, "epoch": 6840} {"train_loss": -27.26226806640625, "global_step": 567726, "epoch": 6840} {"train_loss": -26.65156364440918, "global_step": 567727, "epoch": 6840} {"train_loss": -26.998443603515625, "global_step": 567728, "epoch": 6840} {"train_loss": -27.019153594970703, "global_step": 567729, "epoch": 6840} {"train_loss": -27.281085968017578, "global_step": 567730, "epoch": 6840} {"train_loss": -27.346588134765625, "global_step": 567731, "epoch": 6840} {"train_loss": -27.17068862915039, "global_step": 567732, "epoch": 6840} {"train_loss": -27.358856201171875, "global_step": 567733, "epoch": 6840} {"train_loss": -27.44832420349121, "global_step": 567734, "epoch": 6840} {"train_loss": -27.19410514831543, "global_step": 567735, "epoch": 6840} {"train_loss": -27.3193359375, "global_step": 567736, "epoch": 6840} {"train_loss": -27.54585075378418, "global_step": 567737, "epoch": 6840} {"train_loss": -27.38876724243164, "global_step": 567738, "epoch": 6840} {"train_loss": -27.29304313659668, "global_step": 567739, "epoch": 6840} {"train_loss": -27.2174015045166, "global_step": 567740, "epoch": 6840} {"train_loss": -27.46601676940918, "global_step": 567741, "epoch": 6840} {"train_loss": -27.429336547851562, "global_step": 567742, "epoch": 6840} {"train_loss": -27.585721969604492, "global_step": 567743, "epoch": 6840} {"train_loss": -27.447927474975586, "global_step": 567744, "epoch": 6840} {"train_loss": -27.2987060546875, "global_step": 567745, "epoch": 6840} {"train_loss": -27.5714111328125, "global_step": 567746, "epoch": 6840} {"train_loss": -27.523893356323242, "global_step": 567747, "epoch": 6840} {"train_loss": -27.460529327392578, "global_step": 567748, "epoch": 6840} {"train_loss": -27.291135787963867, "global_step": 567749, "epoch": 6840} {"train_loss": -27.5484619140625, "global_step": 567750, "epoch": 6840} {"train_loss": -27.44037437438965, "global_step": 567751, "epoch": 6840} {"train_loss": -28.34661293029785, "global_step": 567752, "epoch": 6840} {"train_loss": -27.836645126342773, "global_step": 567753, "epoch": 6840} {"train_loss": -27.632001876831055, "global_step": 567754, "epoch": 6840} {"train_loss": -27.87922477722168, "global_step": 567755, "epoch": 6840} {"train_loss": -27.663135528564453, "global_step": 567756, "epoch": 6840} {"train_loss": -27.62222671508789, "global_step": 567757, "epoch": 6840} {"train_loss": -27.93269157409668, "global_step": 567758, "epoch": 6840} {"train_loss": -27.832595825195312, "global_step": 567759, "epoch": 6840} {"train_loss": -28.13288688659668, "global_step": 567760, "epoch": 6840} {"train_loss": -27.576141357421875, "global_step": 567761, "epoch": 6840} {"train_loss": -27.874006271362305, "global_step": 567762, "epoch": 6840} {"train_loss": -27.846967697143555, "global_step": 567763, "epoch": 6840} {"train_loss": -27.521284103393555, "global_step": 567764, "epoch": 6840} {"train_loss": -28.10386085510254, "global_step": 567765, "epoch": 6840} {"train_loss": -27.807514190673828, "global_step": 567766, "epoch": 6840} {"train_loss": -27.96610450744629, "global_step": 567767, "epoch": 6840} {"train_loss": -27.429418563842773, "global_step": 567768, "epoch": 6840} {"train_loss": -28.126684188842773, "global_step": 567769, "epoch": 6840} {"train_loss": -28.181554794311523, "global_step": 567770, "epoch": 6840} {"train_loss": -27.965961456298828, "global_step": 567771, "epoch": 6840} {"train_loss": -27.807159423828125, "global_step": 567772, "epoch": 6840} {"train_loss": -27.998157501220703, "global_step": 567773, "epoch": 6840} {"train_loss": -27.992218017578125, "global_step": 567774, "epoch": 6840} {"train_loss": -27.889240264892578, "global_step": 567775, "epoch": 6840} {"train_loss": -28.13116455078125, "global_step": 567776, "epoch": 6840} {"train_loss": -28.126712799072266, "global_step": 567777, "epoch": 6840} {"train_loss": -28.21923828125, "global_step": 567778, "epoch": 6840} {"train_loss": -28.003305435180664, "global_step": 567779, "epoch": 6840} {"train_loss": -27.962148666381836, "global_step": 567780, "epoch": 6840} {"train_loss": -27.880664825439453, "global_step": 567781, "epoch": 6840} {"train_loss": -27.3105411529541, "global_step": 567782, "epoch": 6840} {"train_loss": -28.11920738220215, "global_step": 567783, "epoch": 6840} {"train_loss": -27.715478897094727, "global_step": 567784, "epoch": 6840} {"train_loss": -27.8944091796875, "global_step": 567785, "epoch": 6840} {"train_loss": -27.759246826171875, "global_step": 567786, "epoch": 6840} {"train_loss": -28.113540649414062, "global_step": 567787, "epoch": 6840} {"train_loss": -27.947168350219727, "global_step": 567788, "epoch": 6840} {"train_loss": -28.13503074645996, "global_step": 567789, "epoch": 6840} {"train_loss": -27.717199325561523, "global_step": 567790, "epoch": 6840} {"train_loss": -28.046772003173828, "global_step": 567791, "epoch": 6840} {"train_loss": -27.961347579956055, "global_step": 567792, "epoch": 6840} {"train_loss": -27.921863555908203, "global_step": 567793, "epoch": 6840} {"train_loss": -27.917882919311523, "global_step": 567794, "epoch": 6840} {"train_loss": -28.190404891967773, "global_step": 567795, "epoch": 6840} {"train_loss": -28.201858520507812, "global_step": 567796, "epoch": 6840} {"train_loss": -27.802017211914062, "global_step": 567797, "epoch": 6840} {"train_loss": -28.14680290222168, "global_step": 567798, "epoch": 6840} {"train_loss": -28.163190841674805, "global_step": 567799, "epoch": 6840} {"train_loss": -28.15447998046875, "global_step": 567800, "epoch": 6840} {"train_loss": -27.243738174438477, "global_step": 567801, "epoch": 6840} {"train_loss": -27.64250270429864, "global_step": 567802, "epoch": 6840, "val_loss": 6816543.0} {"train_loss": -26.51206398010254, "global_step": 567803, "epoch": 6841} {"train_loss": -26.21827507019043, "global_step": 567804, "epoch": 6841} {"train_loss": -26.46518325805664, "global_step": 567805, "epoch": 6841} {"train_loss": -26.946990966796875, "global_step": 567806, "epoch": 6841} {"train_loss": -27.3704776763916, "global_step": 567807, "epoch": 6841} {"train_loss": -27.285547256469727, "global_step": 567808, "epoch": 6841} {"train_loss": -27.4666805267334, "global_step": 567809, "epoch": 6841} {"train_loss": -27.307096481323242, "global_step": 567810, "epoch": 6841} {"train_loss": -26.9872989654541, "global_step": 567811, "epoch": 6841} {"train_loss": -27.325963973999023, "global_step": 567812, "epoch": 6841} {"train_loss": -27.17919921875, "global_step": 567813, "epoch": 6841} {"train_loss": -27.645648956298828, "global_step": 567814, "epoch": 6841} {"train_loss": -27.194232940673828, "global_step": 567815, "epoch": 6841} {"train_loss": -27.31329345703125, "global_step": 567816, "epoch": 6841} {"train_loss": -27.11561393737793, "global_step": 567817, "epoch": 6841} {"train_loss": -27.33330726623535, "global_step": 567818, "epoch": 6841} {"train_loss": -26.91036033630371, "global_step": 567819, "epoch": 6841} {"train_loss": -27.7351131439209, "global_step": 567820, "epoch": 6841} {"train_loss": -27.27978515625, "global_step": 567821, "epoch": 6841} {"train_loss": -27.656396865844727, "global_step": 567822, "epoch": 6841} {"train_loss": -27.36514663696289, "global_step": 567823, "epoch": 6841} {"train_loss": -27.298208236694336, "global_step": 567824, "epoch": 6841} {"train_loss": -27.777997970581055, "global_step": 567825, "epoch": 6841} {"train_loss": -27.603885650634766, "global_step": 567826, "epoch": 6841} {"train_loss": -27.815839767456055, "global_step": 567827, "epoch": 6841} {"train_loss": -27.594648361206055, "global_step": 567828, "epoch": 6841} {"train_loss": -27.897974014282227, "global_step": 567829, "epoch": 6841} {"train_loss": -27.96331214904785, "global_step": 567830, "epoch": 6841} {"train_loss": -27.727991104125977, "global_step": 567831, "epoch": 6841} {"train_loss": -27.497333526611328, "global_step": 567832, "epoch": 6841} {"train_loss": -27.320377349853516, "global_step": 567833, "epoch": 6841} {"train_loss": -27.611682891845703, "global_step": 567834, "epoch": 6841} {"train_loss": -27.85332679748535, "global_step": 567835, "epoch": 6841} {"train_loss": -27.67803382873535, "global_step": 567836, "epoch": 6841} {"train_loss": -27.300830841064453, "global_step": 567837, "epoch": 6841} {"train_loss": -27.660947799682617, "global_step": 567838, "epoch": 6841} {"train_loss": -27.610715866088867, "global_step": 567839, "epoch": 6841} {"train_loss": -27.395139694213867, "global_step": 567840, "epoch": 6841} {"train_loss": -27.80010986328125, "global_step": 567841, "epoch": 6841} {"train_loss": -27.746179580688477, "global_step": 567842, "epoch": 6841} {"train_loss": -27.658737182617188, "global_step": 567843, "epoch": 6841} {"train_loss": -28.021270751953125, "global_step": 567844, "epoch": 6841} {"train_loss": -28.036060333251953, "global_step": 567845, "epoch": 6841} {"train_loss": -27.95125389099121, "global_step": 567846, "epoch": 6841} {"train_loss": -27.60371208190918, "global_step": 567847, "epoch": 6841} {"train_loss": -27.730024337768555, "global_step": 567848, "epoch": 6841} {"train_loss": -28.069379806518555, "global_step": 567849, "epoch": 6841} {"train_loss": -27.608346939086914, "global_step": 567850, "epoch": 6841} {"train_loss": -27.971235275268555, "global_step": 567851, "epoch": 6841} {"train_loss": -27.8380126953125, "global_step": 567852, "epoch": 6841} {"train_loss": -27.931427001953125, "global_step": 567853, "epoch": 6841} {"train_loss": -28.249353408813477, "global_step": 567854, "epoch": 6841} {"train_loss": -27.9160213470459, "global_step": 567855, "epoch": 6841} {"train_loss": -28.08643913269043, "global_step": 567856, "epoch": 6841} {"train_loss": -27.98927116394043, "global_step": 567857, "epoch": 6841} {"train_loss": -27.554584503173828, "global_step": 567858, "epoch": 6841} {"train_loss": -27.7916316986084, "global_step": 567859, "epoch": 6841} {"train_loss": -28.0668888092041, "global_step": 567860, "epoch": 6841} {"train_loss": -27.748645782470703, "global_step": 567861, "epoch": 6841} {"train_loss": -27.786788940429688, "global_step": 567862, "epoch": 6841} {"train_loss": -27.77741813659668, "global_step": 567863, "epoch": 6841} {"train_loss": -27.78122329711914, "global_step": 567864, "epoch": 6841} {"train_loss": -27.56707763671875, "global_step": 567865, "epoch": 6841} {"train_loss": -27.6767578125, "global_step": 567866, "epoch": 6841} {"train_loss": -27.95757484436035, "global_step": 567867, "epoch": 6841} {"train_loss": -28.000980377197266, "global_step": 567868, "epoch": 6841} {"train_loss": -28.018827438354492, "global_step": 567869, "epoch": 6841} {"train_loss": -27.419824600219727, "global_step": 567870, "epoch": 6841} {"train_loss": -27.56377601623535, "global_step": 567871, "epoch": 6841} {"train_loss": -27.556625366210938, "global_step": 567872, "epoch": 6841} {"train_loss": -28.1680965423584, "global_step": 567873, "epoch": 6841} {"train_loss": -27.84882164001465, "global_step": 567874, "epoch": 6841} {"train_loss": -27.259679794311523, "global_step": 567875, "epoch": 6841} {"train_loss": -27.095136642456055, "global_step": 567876, "epoch": 6841} {"train_loss": -27.438323974609375, "global_step": 567877, "epoch": 6841} {"train_loss": -27.74615478515625, "global_step": 567878, "epoch": 6841} {"train_loss": -27.7590389251709, "global_step": 567879, "epoch": 6841} {"train_loss": -27.981678009033203, "global_step": 567880, "epoch": 6841} {"train_loss": -27.545257568359375, "global_step": 567881, "epoch": 6841} {"train_loss": -27.726791381835938, "global_step": 567882, "epoch": 6841} {"train_loss": -27.952295303344727, "global_step": 567883, "epoch": 6841} {"train_loss": -27.877450942993164, "global_step": 567884, "epoch": 6841} {"train_loss": -27.601902490638825, "global_step": 567885, "epoch": 6841, "val_loss": 6780048.0} {"train_loss": -27.014108657836914, "global_step": 567886, "epoch": 6842} {"train_loss": -27.383527755737305, "global_step": 567887, "epoch": 6842} {"train_loss": -27.538732528686523, "global_step": 567888, "epoch": 6842} {"train_loss": -27.266767501831055, "global_step": 567889, "epoch": 6842} {"train_loss": -27.158933639526367, "global_step": 567890, "epoch": 6842} {"train_loss": -27.508163452148438, "global_step": 567891, "epoch": 6842} {"train_loss": -27.5009765625, "global_step": 567892, "epoch": 6842} {"train_loss": -27.770736694335938, "global_step": 567893, "epoch": 6842} {"train_loss": -27.59139060974121, "global_step": 567894, "epoch": 6842} {"train_loss": -27.694929122924805, "global_step": 567895, "epoch": 6842} {"train_loss": -27.662931442260742, "global_step": 567896, "epoch": 6842} {"train_loss": -27.757482528686523, "global_step": 567897, "epoch": 6842} {"train_loss": -27.329975128173828, "global_step": 567898, "epoch": 6842} {"train_loss": -27.843643188476562, "global_step": 567899, "epoch": 6842} {"train_loss": -27.6922607421875, "global_step": 567900, "epoch": 6842} {"train_loss": -27.981311798095703, "global_step": 567901, "epoch": 6842} {"train_loss": -27.530241012573242, "global_step": 567902, "epoch": 6842} {"train_loss": -27.580001831054688, "global_step": 567903, "epoch": 6842} {"train_loss": -27.559309005737305, "global_step": 567904, "epoch": 6842} {"train_loss": -27.776153564453125, "global_step": 567905, "epoch": 6842} {"train_loss": -27.966161727905273, "global_step": 567906, "epoch": 6842} {"train_loss": -27.49537467956543, "global_step": 567907, "epoch": 6842} {"train_loss": -27.7243595123291, "global_step": 567908, "epoch": 6842} {"train_loss": -27.68428611755371, "global_step": 567909, "epoch": 6842} {"train_loss": -27.61492919921875, "global_step": 567910, "epoch": 6842} {"train_loss": -27.490503311157227, "global_step": 567911, "epoch": 6842} {"train_loss": -27.6439208984375, "global_step": 567912, "epoch": 6842} {"train_loss": -27.514150619506836, "global_step": 567913, "epoch": 6842} {"train_loss": -27.598791122436523, "global_step": 567914, "epoch": 6842} {"train_loss": -27.317249298095703, "global_step": 567915, "epoch": 6842} {"train_loss": -27.73031997680664, "global_step": 567916, "epoch": 6842} {"train_loss": -27.880325317382812, "global_step": 567917, "epoch": 6842} {"train_loss": -27.84027099609375, "global_step": 567918, "epoch": 6842} {"train_loss": -27.735321044921875, "global_step": 567919, "epoch": 6842} {"train_loss": -27.709928512573242, "global_step": 567920, "epoch": 6842} {"train_loss": -27.22991943359375, "global_step": 567921, "epoch": 6842} {"train_loss": -27.687362670898438, "global_step": 567922, "epoch": 6842} {"train_loss": -27.815576553344727, "global_step": 567923, "epoch": 6842} {"train_loss": -27.513721466064453, "global_step": 567924, "epoch": 6842} {"train_loss": -27.770395278930664, "global_step": 567925, "epoch": 6842} {"train_loss": -27.9207820892334, "global_step": 567926, "epoch": 6842} {"train_loss": -27.76960563659668, "global_step": 567927, "epoch": 6842} {"train_loss": -27.760343551635742, "global_step": 567928, "epoch": 6842} {"train_loss": -27.628360748291016, "global_step": 567929, "epoch": 6842} {"train_loss": -27.977405548095703, "global_step": 567930, "epoch": 6842} {"train_loss": -27.339269638061523, "global_step": 567931, "epoch": 6842} {"train_loss": -28.08698081970215, "global_step": 567932, "epoch": 6842} {"train_loss": -27.72861671447754, "global_step": 567933, "epoch": 6842} {"train_loss": -27.800201416015625, "global_step": 567934, "epoch": 6842} {"train_loss": -28.1763858795166, "global_step": 567935, "epoch": 6842} {"train_loss": -27.7380313873291, "global_step": 567936, "epoch": 6842} {"train_loss": -27.969858169555664, "global_step": 567937, "epoch": 6842} {"train_loss": -27.61639404296875, "global_step": 567938, "epoch": 6842} {"train_loss": -27.586292266845703, "global_step": 567939, "epoch": 6842} {"train_loss": -27.783674240112305, "global_step": 567940, "epoch": 6842} {"train_loss": -27.801931381225586, "global_step": 567941, "epoch": 6842} {"train_loss": -27.931726455688477, "global_step": 567942, "epoch": 6842} {"train_loss": -27.949310302734375, "global_step": 567943, "epoch": 6842} {"train_loss": -27.82074546813965, "global_step": 567944, "epoch": 6842} {"train_loss": -27.933841705322266, "global_step": 567945, "epoch": 6842} {"train_loss": -27.936477661132812, "global_step": 567946, "epoch": 6842} {"train_loss": -27.480499267578125, "global_step": 567947, "epoch": 6842} {"train_loss": -27.791624069213867, "global_step": 567948, "epoch": 6842} {"train_loss": -27.4488468170166, "global_step": 567949, "epoch": 6842} {"train_loss": -27.984888076782227, "global_step": 567950, "epoch": 6842} {"train_loss": -27.541040420532227, "global_step": 567951, "epoch": 6842} {"train_loss": -27.78211784362793, "global_step": 567952, "epoch": 6842} {"train_loss": -27.2047119140625, "global_step": 567953, "epoch": 6842} {"train_loss": -27.94215202331543, "global_step": 567954, "epoch": 6842} {"train_loss": -27.975278854370117, "global_step": 567955, "epoch": 6842} {"train_loss": -27.562408447265625, "global_step": 567956, "epoch": 6842} {"train_loss": -27.618688583374023, "global_step": 567957, "epoch": 6842} {"train_loss": -27.850683212280273, "global_step": 567958, "epoch": 6842} {"train_loss": -28.156055450439453, "global_step": 567959, "epoch": 6842} {"train_loss": -27.677188873291016, "global_step": 567960, "epoch": 6842} {"train_loss": -27.574569702148438, "global_step": 567961, "epoch": 6842} {"train_loss": -27.629724502563477, "global_step": 567962, "epoch": 6842} {"train_loss": -27.57730484008789, "global_step": 567963, "epoch": 6842} {"train_loss": -27.597333908081055, "global_step": 567964, "epoch": 6842} {"train_loss": -27.471166610717773, "global_step": 567965, "epoch": 6842} {"train_loss": -27.79871940612793, "global_step": 567966, "epoch": 6842} {"train_loss": -27.609495162963867, "global_step": 567967, "epoch": 6842} {"train_loss": -27.690919209675616, "global_step": 567968, "epoch": 6842, "val_loss": 6720563.0} {"train_loss": -26.984455108642578, "global_step": 567969, "epoch": 6843} {"train_loss": -26.32496452331543, "global_step": 567970, "epoch": 6843} {"train_loss": -27.48932456970215, "global_step": 567971, "epoch": 6843} {"train_loss": -27.22739028930664, "global_step": 567972, "epoch": 6843} {"train_loss": -27.08197593688965, "global_step": 567973, "epoch": 6843} {"train_loss": -26.906538009643555, "global_step": 567974, "epoch": 6843} {"train_loss": -27.868759155273438, "global_step": 567975, "epoch": 6843} {"train_loss": -27.091657638549805, "global_step": 567976, "epoch": 6843} {"train_loss": -27.64243507385254, "global_step": 567977, "epoch": 6843} {"train_loss": -26.855545043945312, "global_step": 567978, "epoch": 6843} {"train_loss": -27.322568893432617, "global_step": 567979, "epoch": 6843} {"train_loss": -27.56145668029785, "global_step": 567980, "epoch": 6843} {"train_loss": -27.726654052734375, "global_step": 567981, "epoch": 6843} {"train_loss": -27.83387565612793, "global_step": 567982, "epoch": 6843} {"train_loss": -28.030546188354492, "global_step": 567983, "epoch": 6843} {"train_loss": -27.758575439453125, "global_step": 567984, "epoch": 6843} {"train_loss": -27.890933990478516, "global_step": 567985, "epoch": 6843} {"train_loss": -27.64163589477539, "global_step": 567986, "epoch": 6843} {"train_loss": -27.573400497436523, "global_step": 567987, "epoch": 6843} {"train_loss": -28.021894454956055, "global_step": 567988, "epoch": 6843} {"train_loss": -27.547412872314453, "global_step": 567989, "epoch": 6843} {"train_loss": -27.924951553344727, "global_step": 567990, "epoch": 6843} {"train_loss": -27.673095703125, "global_step": 567991, "epoch": 6843} {"train_loss": -27.7750244140625, "global_step": 567992, "epoch": 6843} {"train_loss": -27.507816314697266, "global_step": 567993, "epoch": 6843} {"train_loss": -27.691425323486328, "global_step": 567994, "epoch": 6843} {"train_loss": -27.392974853515625, "global_step": 567995, "epoch": 6843} {"train_loss": -28.26948356628418, "global_step": 567996, "epoch": 6843} {"train_loss": -27.465307235717773, "global_step": 567997, "epoch": 6843} {"train_loss": -27.731769561767578, "global_step": 567998, "epoch": 6843} {"train_loss": -27.953556060791016, "global_step": 567999, "epoch": 6843} {"train_loss": -27.837732315063477, "global_step": 568000, "epoch": 6843} {"train_loss": -27.880725860595703, "global_step": 568001, "epoch": 6843} {"train_loss": -27.482587814331055, "global_step": 568002, "epoch": 6843} {"train_loss": -27.692523956298828, "global_step": 568003, "epoch": 6843} {"train_loss": -27.964990615844727, "global_step": 568004, "epoch": 6843} {"train_loss": -27.571430206298828, "global_step": 568005, "epoch": 6843} {"train_loss": -28.344741821289062, "global_step": 568006, "epoch": 6843} {"train_loss": -27.874460220336914, "global_step": 568007, "epoch": 6843} {"train_loss": -28.07594108581543, "global_step": 568008, "epoch": 6843} {"train_loss": -27.735427856445312, "global_step": 568009, "epoch": 6843} {"train_loss": -28.18145751953125, "global_step": 568010, "epoch": 6843} {"train_loss": -27.723194122314453, "global_step": 568011, "epoch": 6843} {"train_loss": -27.592870712280273, "global_step": 568012, "epoch": 6843} {"train_loss": -27.658161163330078, "global_step": 568013, "epoch": 6843} {"train_loss": -27.933042526245117, "global_step": 568014, "epoch": 6843} {"train_loss": -27.64753532409668, "global_step": 568015, "epoch": 6843} {"train_loss": -27.71302604675293, "global_step": 568016, "epoch": 6843} {"train_loss": -27.91998863220215, "global_step": 568017, "epoch": 6843} {"train_loss": -27.609119415283203, "global_step": 568018, "epoch": 6843} {"train_loss": -27.628204345703125, "global_step": 568019, "epoch": 6843} {"train_loss": -27.776716232299805, "global_step": 568020, "epoch": 6843} {"train_loss": -27.782758712768555, "global_step": 568021, "epoch": 6843} {"train_loss": -27.684812545776367, "global_step": 568022, "epoch": 6843} {"train_loss": -27.74842643737793, "global_step": 568023, "epoch": 6843} {"train_loss": -28.10065269470215, "global_step": 568024, "epoch": 6843} {"train_loss": -27.90913200378418, "global_step": 568025, "epoch": 6843} {"train_loss": -27.7961368560791, "global_step": 568026, "epoch": 6843} {"train_loss": -27.6329288482666, "global_step": 568027, "epoch": 6843} {"train_loss": -28.114572525024414, "global_step": 568028, "epoch": 6843} {"train_loss": -27.760786056518555, "global_step": 568029, "epoch": 6843} {"train_loss": -27.365802764892578, "global_step": 568030, "epoch": 6843} {"train_loss": -27.287311553955078, "global_step": 568031, "epoch": 6843} {"train_loss": -27.865453720092773, "global_step": 568032, "epoch": 6843} {"train_loss": -27.720449447631836, "global_step": 568033, "epoch": 6843} {"train_loss": -28.255558013916016, "global_step": 568034, "epoch": 6843} {"train_loss": -28.0936336517334, "global_step": 568035, "epoch": 6843} {"train_loss": -27.923629760742188, "global_step": 568036, "epoch": 6843} {"train_loss": -27.384033203125, "global_step": 568037, "epoch": 6843} {"train_loss": -28.038137435913086, "global_step": 568038, "epoch": 6843} {"train_loss": -28.398569107055664, "global_step": 568039, "epoch": 6843} {"train_loss": -27.835371017456055, "global_step": 568040, "epoch": 6843} {"train_loss": -27.7608699798584, "global_step": 568041, "epoch": 6843} {"train_loss": -27.628782272338867, "global_step": 568042, "epoch": 6843} {"train_loss": -28.04664421081543, "global_step": 568043, "epoch": 6843} {"train_loss": -27.957416534423828, "global_step": 568044, "epoch": 6843} {"train_loss": -27.603046417236328, "global_step": 568045, "epoch": 6843} {"train_loss": -28.015792846679688, "global_step": 568046, "epoch": 6843} {"train_loss": -27.564252853393555, "global_step": 568047, "epoch": 6843} {"train_loss": -27.65286636352539, "global_step": 568048, "epoch": 6843} {"train_loss": -27.529499053955078, "global_step": 568049, "epoch": 6843} {"train_loss": -27.69703483581543, "global_step": 568050, "epoch": 6843} {"train_loss": -27.718427543180535, "global_step": 568051, "epoch": 6843, "val_loss": 6746233.0} {"train_loss": -27.483610153198242, "global_step": 568052, "epoch": 6844} {"train_loss": -26.261396408081055, "global_step": 568053, "epoch": 6844} {"train_loss": -26.99014663696289, "global_step": 568054, "epoch": 6844} {"train_loss": -27.6207218170166, "global_step": 568055, "epoch": 6844} {"train_loss": -26.572040557861328, "global_step": 568056, "epoch": 6844} {"train_loss": -26.54111099243164, "global_step": 568057, "epoch": 6844} {"train_loss": -27.037031173706055, "global_step": 568058, "epoch": 6844} {"train_loss": -27.37640380859375, "global_step": 568059, "epoch": 6844} {"train_loss": -27.51584243774414, "global_step": 568060, "epoch": 6844} {"train_loss": -27.229150772094727, "global_step": 568061, "epoch": 6844} {"train_loss": -27.7186336517334, "global_step": 568062, "epoch": 6844} {"train_loss": -27.456619262695312, "global_step": 568063, "epoch": 6844} {"train_loss": -27.39984703063965, "global_step": 568064, "epoch": 6844} {"train_loss": -27.480213165283203, "global_step": 568065, "epoch": 6844} {"train_loss": -27.34872817993164, "global_step": 568066, "epoch": 6844} {"train_loss": -27.772220611572266, "global_step": 568067, "epoch": 6844} {"train_loss": -27.387073516845703, "global_step": 568068, "epoch": 6844} {"train_loss": -27.639923095703125, "global_step": 568069, "epoch": 6844} {"train_loss": -27.60498046875, "global_step": 568070, "epoch": 6844} {"train_loss": -27.685163497924805, "global_step": 568071, "epoch": 6844} {"train_loss": -27.345947265625, "global_step": 568072, "epoch": 6844} {"train_loss": -27.484943389892578, "global_step": 568073, "epoch": 6844} {"train_loss": -27.345041275024414, "global_step": 568074, "epoch": 6844} {"train_loss": -27.62485694885254, "global_step": 568075, "epoch": 6844} {"train_loss": -27.99513053894043, "global_step": 568076, "epoch": 6844} {"train_loss": -27.615924835205078, "global_step": 568077, "epoch": 6844} {"train_loss": -27.71719741821289, "global_step": 568078, "epoch": 6844} {"train_loss": -27.691869735717773, "global_step": 568079, "epoch": 6844} {"train_loss": -27.648773193359375, "global_step": 568080, "epoch": 6844} {"train_loss": -27.668283462524414, "global_step": 568081, "epoch": 6844} {"train_loss": -28.002323150634766, "global_step": 568082, "epoch": 6844} {"train_loss": -27.697772979736328, "global_step": 568083, "epoch": 6844} {"train_loss": -28.049392700195312, "global_step": 568084, "epoch": 6844} {"train_loss": -27.846296310424805, "global_step": 568085, "epoch": 6844} {"train_loss": -27.903614044189453, "global_step": 568086, "epoch": 6844} {"train_loss": -28.44988441467285, "global_step": 568087, "epoch": 6844} {"train_loss": -27.679529190063477, "global_step": 568088, "epoch": 6844} {"train_loss": -27.9628849029541, "global_step": 568089, "epoch": 6844} {"train_loss": -27.806299209594727, "global_step": 568090, "epoch": 6844} {"train_loss": -28.043027877807617, "global_step": 568091, "epoch": 6844} {"train_loss": -27.991437911987305, "global_step": 568092, "epoch": 6844} {"train_loss": -27.91680335998535, "global_step": 568093, "epoch": 6844} {"train_loss": -27.93558692932129, "global_step": 568094, "epoch": 6844} {"train_loss": -28.315793991088867, "global_step": 568095, "epoch": 6844} {"train_loss": -28.1365966796875, "global_step": 568096, "epoch": 6844} {"train_loss": -28.1221923828125, "global_step": 568097, "epoch": 6844} {"train_loss": -28.391530990600586, "global_step": 568098, "epoch": 6844} {"train_loss": -28.01682472229004, "global_step": 568099, "epoch": 6844} {"train_loss": -27.732309341430664, "global_step": 568100, "epoch": 6844} {"train_loss": -27.933731079101562, "global_step": 568101, "epoch": 6844} {"train_loss": -27.947052001953125, "global_step": 568102, "epoch": 6844} {"train_loss": -27.70302391052246, "global_step": 568103, "epoch": 6844} {"train_loss": -27.658273696899414, "global_step": 568104, "epoch": 6844} {"train_loss": -27.669086456298828, "global_step": 568105, "epoch": 6844} {"train_loss": -27.9954891204834, "global_step": 568106, "epoch": 6844} {"train_loss": -28.001554489135742, "global_step": 568107, "epoch": 6844} {"train_loss": -27.82248306274414, "global_step": 568108, "epoch": 6844} {"train_loss": -27.950674057006836, "global_step": 568109, "epoch": 6844} {"train_loss": -28.214574813842773, "global_step": 568110, "epoch": 6844} {"train_loss": -27.741718292236328, "global_step": 568111, "epoch": 6844} {"train_loss": -28.0974178314209, "global_step": 568112, "epoch": 6844} {"train_loss": -27.82730484008789, "global_step": 568113, "epoch": 6844} {"train_loss": -28.024173736572266, "global_step": 568114, "epoch": 6844} {"train_loss": -27.651763916015625, "global_step": 568115, "epoch": 6844} {"train_loss": -28.0025634765625, "global_step": 568116, "epoch": 6844} {"train_loss": -27.735010147094727, "global_step": 568117, "epoch": 6844} {"train_loss": -27.54998779296875, "global_step": 568118, "epoch": 6844} {"train_loss": -27.89020347595215, "global_step": 568119, "epoch": 6844} {"train_loss": -27.940954208374023, "global_step": 568120, "epoch": 6844} {"train_loss": -28.02839469909668, "global_step": 568121, "epoch": 6844} {"train_loss": -27.903228759765625, "global_step": 568122, "epoch": 6844} {"train_loss": -27.856164932250977, "global_step": 568123, "epoch": 6844} {"train_loss": -27.770523071289062, "global_step": 568124, "epoch": 6844} {"train_loss": -28.092737197875977, "global_step": 568125, "epoch": 6844} {"train_loss": -28.338043212890625, "global_step": 568126, "epoch": 6844} {"train_loss": -27.7609920501709, "global_step": 568127, "epoch": 6844} {"train_loss": -27.86197853088379, "global_step": 568128, "epoch": 6844} {"train_loss": -28.1274471282959, "global_step": 568129, "epoch": 6844} {"train_loss": -27.837141036987305, "global_step": 568130, "epoch": 6844} {"train_loss": -27.84095573425293, "global_step": 568131, "epoch": 6844} {"train_loss": -27.788671493530273, "global_step": 568132, "epoch": 6844} {"train_loss": -27.795499801635742, "global_step": 568133, "epoch": 6844} {"train_loss": -27.74163039333849, "global_step": 568134, "epoch": 6844, "val_loss": 6743368.5} {"train_loss": -27.301313400268555, "global_step": 568135, "epoch": 6845} {"train_loss": -26.67658805847168, "global_step": 568136, "epoch": 6845} {"train_loss": -26.665271759033203, "global_step": 568137, "epoch": 6845} {"train_loss": -27.004932403564453, "global_step": 568138, "epoch": 6845} {"train_loss": -26.81060218811035, "global_step": 568139, "epoch": 6845} {"train_loss": -26.2954044342041, "global_step": 568140, "epoch": 6845} {"train_loss": -27.125049591064453, "global_step": 568141, "epoch": 6845} {"train_loss": -25.882404327392578, "global_step": 568142, "epoch": 6845} {"train_loss": -26.800128936767578, "global_step": 568143, "epoch": 6845} {"train_loss": -26.777881622314453, "global_step": 568144, "epoch": 6845} {"train_loss": -26.899093627929688, "global_step": 568145, "epoch": 6845} {"train_loss": -26.409032821655273, "global_step": 568146, "epoch": 6845} {"train_loss": -26.74007225036621, "global_step": 568147, "epoch": 6845} {"train_loss": -26.778247833251953, "global_step": 568148, "epoch": 6845} {"train_loss": -27.41224479675293, "global_step": 568149, "epoch": 6845} {"train_loss": -26.777740478515625, "global_step": 568150, "epoch": 6845} {"train_loss": -27.037078857421875, "global_step": 568151, "epoch": 6845} {"train_loss": -26.977935791015625, "global_step": 568152, "epoch": 6845} {"train_loss": -27.28675651550293, "global_step": 568153, "epoch": 6845} {"train_loss": -26.928186416625977, "global_step": 568154, "epoch": 6845} {"train_loss": -27.356616973876953, "global_step": 568155, "epoch": 6845} {"train_loss": -26.934814453125, "global_step": 568156, "epoch": 6845} {"train_loss": -27.233304977416992, "global_step": 568157, "epoch": 6845} {"train_loss": -27.48785400390625, "global_step": 568158, "epoch": 6845} {"train_loss": -27.3167724609375, "global_step": 568159, "epoch": 6845} {"train_loss": -27.530811309814453, "global_step": 568160, "epoch": 6845} {"train_loss": -27.475000381469727, "global_step": 568161, "epoch": 6845} {"train_loss": -27.729999542236328, "global_step": 568162, "epoch": 6845} {"train_loss": -27.18241310119629, "global_step": 568163, "epoch": 6845} {"train_loss": -27.813505172729492, "global_step": 568164, "epoch": 6845} {"train_loss": -27.602209091186523, "global_step": 568165, "epoch": 6845} {"train_loss": -27.57752799987793, "global_step": 568166, "epoch": 6845} {"train_loss": -27.350345611572266, "global_step": 568167, "epoch": 6845} {"train_loss": -27.545578002929688, "global_step": 568168, "epoch": 6845} {"train_loss": -27.692296981811523, "global_step": 568169, "epoch": 6845} {"train_loss": -27.95673942565918, "global_step": 568170, "epoch": 6845} {"train_loss": -27.983606338500977, "global_step": 568171, "epoch": 6845} {"train_loss": -27.7419376373291, "global_step": 568172, "epoch": 6845} {"train_loss": -27.70841407775879, "global_step": 568173, "epoch": 6845} {"train_loss": -27.876422882080078, "global_step": 568174, "epoch": 6845} {"train_loss": -27.611112594604492, "global_step": 568175, "epoch": 6845} {"train_loss": -27.71352195739746, "global_step": 568176, "epoch": 6845} {"train_loss": -27.888574600219727, "global_step": 568177, "epoch": 6845} {"train_loss": -27.549238204956055, "global_step": 568178, "epoch": 6845} {"train_loss": -28.36322593688965, "global_step": 568179, "epoch": 6845} {"train_loss": -27.811279296875, "global_step": 568180, "epoch": 6845} {"train_loss": -27.4913330078125, "global_step": 568181, "epoch": 6845} {"train_loss": -28.07217788696289, "global_step": 568182, "epoch": 6845} {"train_loss": -27.80810546875, "global_step": 568183, "epoch": 6845} {"train_loss": -27.817062377929688, "global_step": 568184, "epoch": 6845} {"train_loss": -28.09248161315918, "global_step": 568185, "epoch": 6845} {"train_loss": -27.758380889892578, "global_step": 568186, "epoch": 6845} {"train_loss": -27.7670841217041, "global_step": 568187, "epoch": 6845} {"train_loss": -27.770471572875977, "global_step": 568188, "epoch": 6845} {"train_loss": -27.594009399414062, "global_step": 568189, "epoch": 6845} {"train_loss": -28.038843154907227, "global_step": 568190, "epoch": 6845} {"train_loss": -27.71967887878418, "global_step": 568191, "epoch": 6845} {"train_loss": -27.990955352783203, "global_step": 568192, "epoch": 6845} {"train_loss": -28.124963760375977, "global_step": 568193, "epoch": 6845} {"train_loss": -27.69048500061035, "global_step": 568194, "epoch": 6845} {"train_loss": -28.034536361694336, "global_step": 568195, "epoch": 6845} {"train_loss": -27.522491455078125, "global_step": 568196, "epoch": 6845} {"train_loss": -27.69109535217285, "global_step": 568197, "epoch": 6845} {"train_loss": -28.025754928588867, "global_step": 568198, "epoch": 6845} {"train_loss": -27.762434005737305, "global_step": 568199, "epoch": 6845} {"train_loss": -28.098255157470703, "global_step": 568200, "epoch": 6845} {"train_loss": -27.98609733581543, "global_step": 568201, "epoch": 6845} {"train_loss": -28.050352096557617, "global_step": 568202, "epoch": 6845} {"train_loss": -27.5772762298584, "global_step": 568203, "epoch": 6845} {"train_loss": -28.111820220947266, "global_step": 568204, "epoch": 6845} {"train_loss": -28.22588539123535, "global_step": 568205, "epoch": 6845} {"train_loss": -27.5001163482666, "global_step": 568206, "epoch": 6845} {"train_loss": -27.9866943359375, "global_step": 568207, "epoch": 6845} {"train_loss": -27.9453067779541, "global_step": 568208, "epoch": 6845} {"train_loss": -27.597064971923828, "global_step": 568209, "epoch": 6845} {"train_loss": -27.90125846862793, "global_step": 568210, "epoch": 6845} {"train_loss": -28.42104148864746, "global_step": 568211, "epoch": 6845} {"train_loss": -27.766077041625977, "global_step": 568212, "epoch": 6845} {"train_loss": -27.387781143188477, "global_step": 568213, "epoch": 6845} {"train_loss": -27.570816040039062, "global_step": 568214, "epoch": 6845} {"train_loss": -27.495840072631836, "global_step": 568215, "epoch": 6845} {"train_loss": -27.871145248413086, "global_step": 568216, "epoch": 6845} {"train_loss": -27.525170429643378, "global_step": 568217, "epoch": 6845, "val_loss": 6622469.0} {"train_loss": -25.956567764282227, "global_step": 568218, "epoch": 6846} {"train_loss": -26.445112228393555, "global_step": 568219, "epoch": 6846} {"train_loss": -26.343826293945312, "global_step": 568220, "epoch": 6846} {"train_loss": -27.237518310546875, "global_step": 568221, "epoch": 6846} {"train_loss": -26.518033981323242, "global_step": 568222, "epoch": 6846} {"train_loss": -27.047088623046875, "global_step": 568223, "epoch": 6846} {"train_loss": -26.616703033447266, "global_step": 568224, "epoch": 6846} {"train_loss": -26.70823097229004, "global_step": 568225, "epoch": 6846} {"train_loss": -27.166187286376953, "global_step": 568226, "epoch": 6846} {"train_loss": -26.92299461364746, "global_step": 568227, "epoch": 6846} {"train_loss": -26.96755027770996, "global_step": 568228, "epoch": 6846} {"train_loss": -27.02569007873535, "global_step": 568229, "epoch": 6846} {"train_loss": -27.557540893554688, "global_step": 568230, "epoch": 6846} {"train_loss": -26.864622116088867, "global_step": 568231, "epoch": 6846} {"train_loss": -27.41845703125, "global_step": 568232, "epoch": 6846} {"train_loss": -27.32147789001465, "global_step": 568233, "epoch": 6846} {"train_loss": -26.85507583618164, "global_step": 568234, "epoch": 6846} {"train_loss": -27.064374923706055, "global_step": 568235, "epoch": 6846} {"train_loss": -27.235462188720703, "global_step": 568236, "epoch": 6846} {"train_loss": -27.189350128173828, "global_step": 568237, "epoch": 6846} {"train_loss": -26.989395141601562, "global_step": 568238, "epoch": 6846} {"train_loss": -27.40913200378418, "global_step": 568239, "epoch": 6846} {"train_loss": -27.242786407470703, "global_step": 568240, "epoch": 6846} {"train_loss": -27.44712257385254, "global_step": 568241, "epoch": 6846} {"train_loss": -27.20576286315918, "global_step": 568242, "epoch": 6846} {"train_loss": -27.068525314331055, "global_step": 568243, "epoch": 6846} {"train_loss": -27.48042106628418, "global_step": 568244, "epoch": 6846} {"train_loss": -27.244348526000977, "global_step": 568245, "epoch": 6846} {"train_loss": -27.490222930908203, "global_step": 568246, "epoch": 6846} {"train_loss": -27.57059097290039, "global_step": 568247, "epoch": 6846} {"train_loss": -27.500629425048828, "global_step": 568248, "epoch": 6846} {"train_loss": -27.603546142578125, "global_step": 568249, "epoch": 6846} {"train_loss": -27.205322265625, "global_step": 568250, "epoch": 6846} {"train_loss": -27.267908096313477, "global_step": 568251, "epoch": 6846} {"train_loss": -27.569828033447266, "global_step": 568252, "epoch": 6846} {"train_loss": -27.427570343017578, "global_step": 568253, "epoch": 6846} {"train_loss": -27.381866455078125, "global_step": 568254, "epoch": 6846} {"train_loss": -27.824506759643555, "global_step": 568255, "epoch": 6846} {"train_loss": -27.565210342407227, "global_step": 568256, "epoch": 6846} {"train_loss": -27.577850341796875, "global_step": 568257, "epoch": 6846} {"train_loss": -27.845916748046875, "global_step": 568258, "epoch": 6846} {"train_loss": -27.82672691345215, "global_step": 568259, "epoch": 6846} {"train_loss": -27.93523597717285, "global_step": 568260, "epoch": 6846} {"train_loss": -27.886762619018555, "global_step": 568261, "epoch": 6846} {"train_loss": -27.9205265045166, "global_step": 568262, "epoch": 6846} {"train_loss": -27.464574813842773, "global_step": 568263, "epoch": 6846} {"train_loss": -27.42030906677246, "global_step": 568264, "epoch": 6846} {"train_loss": -28.2708683013916, "global_step": 568265, "epoch": 6846} {"train_loss": -28.025146484375, "global_step": 568266, "epoch": 6846} {"train_loss": -27.956073760986328, "global_step": 568267, "epoch": 6846} {"train_loss": -28.194974899291992, "global_step": 568268, "epoch": 6846} {"train_loss": -27.889057159423828, "global_step": 568269, "epoch": 6846} {"train_loss": -28.231672286987305, "global_step": 568270, "epoch": 6846} {"train_loss": -28.151315689086914, "global_step": 568271, "epoch": 6846} {"train_loss": -27.959436416625977, "global_step": 568272, "epoch": 6846} {"train_loss": -28.2277889251709, "global_step": 568273, "epoch": 6846} {"train_loss": -28.077777862548828, "global_step": 568274, "epoch": 6846} {"train_loss": -27.90754508972168, "global_step": 568275, "epoch": 6846} {"train_loss": -28.45707130432129, "global_step": 568276, "epoch": 6846} {"train_loss": -28.1197566986084, "global_step": 568277, "epoch": 6846} {"train_loss": -28.175125122070312, "global_step": 568278, "epoch": 6846} {"train_loss": -28.231245040893555, "global_step": 568279, "epoch": 6846} {"train_loss": -28.28281021118164, "global_step": 568280, "epoch": 6846} {"train_loss": -28.14752769470215, "global_step": 568281, "epoch": 6846} {"train_loss": -28.120990753173828, "global_step": 568282, "epoch": 6846} {"train_loss": -28.124073028564453, "global_step": 568283, "epoch": 6846} {"train_loss": -28.188093185424805, "global_step": 568284, "epoch": 6846} {"train_loss": -28.265974044799805, "global_step": 568285, "epoch": 6846} {"train_loss": -27.84346580505371, "global_step": 568286, "epoch": 6846} {"train_loss": -27.860193252563477, "global_step": 568287, "epoch": 6846} {"train_loss": -28.142047882080078, "global_step": 568288, "epoch": 6846} {"train_loss": -27.674657821655273, "global_step": 568289, "epoch": 6846} {"train_loss": -27.797626495361328, "global_step": 568290, "epoch": 6846} {"train_loss": -27.707250595092773, "global_step": 568291, "epoch": 6846} {"train_loss": -28.240320205688477, "global_step": 568292, "epoch": 6846} {"train_loss": -28.15472412109375, "global_step": 568293, "epoch": 6846} {"train_loss": -28.084014892578125, "global_step": 568294, "epoch": 6846} {"train_loss": -27.757287979125977, "global_step": 568295, "epoch": 6846} {"train_loss": -27.833927154541016, "global_step": 568296, "epoch": 6846} {"train_loss": -28.13801383972168, "global_step": 568297, "epoch": 6846} {"train_loss": -28.17512321472168, "global_step": 568298, "epoch": 6846} {"train_loss": -27.996124267578125, "global_step": 568299, "epoch": 6846} {"train_loss": -27.61059554226427, "global_step": 568300, "epoch": 6846, "val_loss": 6666838.0} {"train_loss": -27.682870864868164, "global_step": 568301, "epoch": 6847} {"train_loss": -27.852924346923828, "global_step": 568302, "epoch": 6847} {"train_loss": -27.221588134765625, "global_step": 568303, "epoch": 6847} {"train_loss": -27.381851196289062, "global_step": 568304, "epoch": 6847} {"train_loss": -27.28777503967285, "global_step": 568305, "epoch": 6847} {"train_loss": -27.08148765563965, "global_step": 568306, "epoch": 6847} {"train_loss": -27.049575805664062, "global_step": 568307, "epoch": 6847} {"train_loss": -27.546875, "global_step": 568308, "epoch": 6847} {"train_loss": -26.947158813476562, "global_step": 568309, "epoch": 6847} {"train_loss": -27.07122802734375, "global_step": 568310, "epoch": 6847} {"train_loss": -26.85898780822754, "global_step": 568311, "epoch": 6847} {"train_loss": -27.013097763061523, "global_step": 568312, "epoch": 6847} {"train_loss": -27.297882080078125, "global_step": 568313, "epoch": 6847} {"train_loss": -27.415929794311523, "global_step": 568314, "epoch": 6847} {"train_loss": -27.80195426940918, "global_step": 568315, "epoch": 6847} {"train_loss": -27.256122589111328, "global_step": 568316, "epoch": 6847} {"train_loss": -27.82136344909668, "global_step": 568317, "epoch": 6847} {"train_loss": -27.51856803894043, "global_step": 568318, "epoch": 6847} {"train_loss": -27.46234130859375, "global_step": 568319, "epoch": 6847} {"train_loss": -27.804031372070312, "global_step": 568320, "epoch": 6847} {"train_loss": -27.535795211791992, "global_step": 568321, "epoch": 6847} {"train_loss": -27.3389835357666, "global_step": 568322, "epoch": 6847} {"train_loss": -27.642675399780273, "global_step": 568323, "epoch": 6847} {"train_loss": -28.087814331054688, "global_step": 568324, "epoch": 6847} {"train_loss": -27.49773597717285, "global_step": 568325, "epoch": 6847} {"train_loss": -27.68890380859375, "global_step": 568326, "epoch": 6847} {"train_loss": -27.633960723876953, "global_step": 568327, "epoch": 6847} {"train_loss": -27.691267013549805, "global_step": 568328, "epoch": 6847} {"train_loss": -27.53165626525879, "global_step": 568329, "epoch": 6847} {"train_loss": -27.74408531188965, "global_step": 568330, "epoch": 6847} {"train_loss": -27.4593505859375, "global_step": 568331, "epoch": 6847} {"train_loss": -27.912464141845703, "global_step": 568332, "epoch": 6847} {"train_loss": -27.9757022857666, "global_step": 568333, "epoch": 6847} {"train_loss": -27.6282901763916, "global_step": 568334, "epoch": 6847} {"train_loss": -27.94904136657715, "global_step": 568335, "epoch": 6847} {"train_loss": -28.060510635375977, "global_step": 568336, "epoch": 6847} {"train_loss": -27.65313720703125, "global_step": 568337, "epoch": 6847} {"train_loss": -27.9625186920166, "global_step": 568338, "epoch": 6847} {"train_loss": -28.396747589111328, "global_step": 568339, "epoch": 6847} {"train_loss": -27.963064193725586, "global_step": 568340, "epoch": 6847} {"train_loss": -27.889972686767578, "global_step": 568341, "epoch": 6847} {"train_loss": -28.01499366760254, "global_step": 568342, "epoch": 6847} {"train_loss": -27.866281509399414, "global_step": 568343, "epoch": 6847} {"train_loss": -28.191938400268555, "global_step": 568344, "epoch": 6847} {"train_loss": -27.4567928314209, "global_step": 568345, "epoch": 6847} {"train_loss": -28.190839767456055, "global_step": 568346, "epoch": 6847} {"train_loss": -27.744421005249023, "global_step": 568347, "epoch": 6847} {"train_loss": -27.970062255859375, "global_step": 568348, "epoch": 6847} {"train_loss": -28.00459098815918, "global_step": 568349, "epoch": 6847} {"train_loss": -28.072912216186523, "global_step": 568350, "epoch": 6847} {"train_loss": -27.666584014892578, "global_step": 568351, "epoch": 6847} {"train_loss": -28.11181640625, "global_step": 568352, "epoch": 6847} {"train_loss": -27.751386642456055, "global_step": 568353, "epoch": 6847} {"train_loss": -27.325292587280273, "global_step": 568354, "epoch": 6847} {"train_loss": -28.210376739501953, "global_step": 568355, "epoch": 6847} {"train_loss": -27.988101959228516, "global_step": 568356, "epoch": 6847} {"train_loss": -28.135269165039062, "global_step": 568357, "epoch": 6847} {"train_loss": -27.694171905517578, "global_step": 568358, "epoch": 6847} {"train_loss": -27.47930335998535, "global_step": 568359, "epoch": 6847} {"train_loss": -27.84659194946289, "global_step": 568360, "epoch": 6847} {"train_loss": -28.179584503173828, "global_step": 568361, "epoch": 6847} {"train_loss": -27.534666061401367, "global_step": 568362, "epoch": 6847} {"train_loss": -27.6237735748291, "global_step": 568363, "epoch": 6847} {"train_loss": -27.74074363708496, "global_step": 568364, "epoch": 6847} {"train_loss": -27.8499755859375, "global_step": 568365, "epoch": 6847} {"train_loss": -28.0194091796875, "global_step": 568366, "epoch": 6847} {"train_loss": -27.9967098236084, "global_step": 568367, "epoch": 6847} {"train_loss": -28.1792049407959, "global_step": 568368, "epoch": 6847} {"train_loss": -27.71746826171875, "global_step": 568369, "epoch": 6847} {"train_loss": -27.6683406829834, "global_step": 568370, "epoch": 6847} {"train_loss": -27.960805892944336, "global_step": 568371, "epoch": 6847} {"train_loss": -27.9355525970459, "global_step": 568372, "epoch": 6847} {"train_loss": -28.215900421142578, "global_step": 568373, "epoch": 6847} {"train_loss": -27.929044723510742, "global_step": 568374, "epoch": 6847} {"train_loss": -27.6427059173584, "global_step": 568375, "epoch": 6847} {"train_loss": -27.93848991394043, "global_step": 568376, "epoch": 6847} {"train_loss": -28.1174259185791, "global_step": 568377, "epoch": 6847} {"train_loss": -28.21563148498535, "global_step": 568378, "epoch": 6847} {"train_loss": -28.07895278930664, "global_step": 568379, "epoch": 6847} {"train_loss": -27.957788467407227, "global_step": 568380, "epoch": 6847} {"train_loss": -28.058996200561523, "global_step": 568381, "epoch": 6847} {"train_loss": -28.053998947143555, "global_step": 568382, "epoch": 6847} {"train_loss": -27.730709788310957, "global_step": 568383, "epoch": 6847, "val_loss": 6652123.0} {"train_loss": -27.855253219604492, "global_step": 568384, "epoch": 6848} {"train_loss": -26.97760581970215, "global_step": 568385, "epoch": 6848} {"train_loss": -27.2869873046875, "global_step": 568386, "epoch": 6848} {"train_loss": -26.601491928100586, "global_step": 568387, "epoch": 6848} {"train_loss": -27.5145263671875, "global_step": 568388, "epoch": 6848} {"train_loss": -27.32505226135254, "global_step": 568389, "epoch": 6848} {"train_loss": -27.101776123046875, "global_step": 568390, "epoch": 6848} {"train_loss": -27.281421661376953, "global_step": 568391, "epoch": 6848} {"train_loss": -27.449750900268555, "global_step": 568392, "epoch": 6848} {"train_loss": -27.399877548217773, "global_step": 568393, "epoch": 6848} {"train_loss": -27.628116607666016, "global_step": 568394, "epoch": 6848} {"train_loss": -26.946094512939453, "global_step": 568395, "epoch": 6848} {"train_loss": -27.634077072143555, "global_step": 568396, "epoch": 6848} {"train_loss": -27.263996124267578, "global_step": 568397, "epoch": 6848} {"train_loss": -27.53607749938965, "global_step": 568398, "epoch": 6848} {"train_loss": -27.285573959350586, "global_step": 568399, "epoch": 6848} {"train_loss": -27.7270565032959, "global_step": 568400, "epoch": 6848} {"train_loss": -27.665063858032227, "global_step": 568401, "epoch": 6848} {"train_loss": -27.817602157592773, "global_step": 568402, "epoch": 6848} {"train_loss": -27.587360382080078, "global_step": 568403, "epoch": 6848} {"train_loss": -27.370548248291016, "global_step": 568404, "epoch": 6848} {"train_loss": -27.481271743774414, "global_step": 568405, "epoch": 6848} {"train_loss": -27.690881729125977, "global_step": 568406, "epoch": 6848} {"train_loss": -27.943225860595703, "global_step": 568407, "epoch": 6848} {"train_loss": -27.45992088317871, "global_step": 568408, "epoch": 6848} {"train_loss": -27.76215934753418, "global_step": 568409, "epoch": 6848} {"train_loss": -27.749494552612305, "global_step": 568410, "epoch": 6848} {"train_loss": -27.959226608276367, "global_step": 568411, "epoch": 6848} {"train_loss": -27.765914916992188, "global_step": 568412, "epoch": 6848} {"train_loss": -27.797216415405273, "global_step": 568413, "epoch": 6848} {"train_loss": -27.6855525970459, "global_step": 568414, "epoch": 6848} {"train_loss": -27.63592529296875, "global_step": 568415, "epoch": 6848} {"train_loss": -27.6697940826416, "global_step": 568416, "epoch": 6848} {"train_loss": -27.510473251342773, "global_step": 568417, "epoch": 6848} {"train_loss": -27.697006225585938, "global_step": 568418, "epoch": 6848} {"train_loss": -27.804372787475586, "global_step": 568419, "epoch": 6848} {"train_loss": -27.49993324279785, "global_step": 568420, "epoch": 6848} {"train_loss": -27.795034408569336, "global_step": 568421, "epoch": 6848} {"train_loss": -27.8631649017334, "global_step": 568422, "epoch": 6848} {"train_loss": -27.7218074798584, "global_step": 568423, "epoch": 6848} {"train_loss": -27.847686767578125, "global_step": 568424, "epoch": 6848} {"train_loss": -27.576648712158203, "global_step": 568425, "epoch": 6848} {"train_loss": -28.152545928955078, "global_step": 568426, "epoch": 6848} {"train_loss": -27.896738052368164, "global_step": 568427, "epoch": 6848} {"train_loss": -27.889734268188477, "global_step": 568428, "epoch": 6848} {"train_loss": -27.977783203125, "global_step": 568429, "epoch": 6848} {"train_loss": -28.2092227935791, "global_step": 568430, "epoch": 6848} {"train_loss": -28.067228317260742, "global_step": 568431, "epoch": 6848} {"train_loss": -27.852048873901367, "global_step": 568432, "epoch": 6848} {"train_loss": -28.10928726196289, "global_step": 568433, "epoch": 6848} {"train_loss": -28.028852462768555, "global_step": 568434, "epoch": 6848} {"train_loss": -27.893802642822266, "global_step": 568435, "epoch": 6848} {"train_loss": -27.863447189331055, "global_step": 568436, "epoch": 6848} {"train_loss": -28.085641860961914, "global_step": 568437, "epoch": 6848} {"train_loss": -28.347198486328125, "global_step": 568438, "epoch": 6848} {"train_loss": -28.154626846313477, "global_step": 568439, "epoch": 6848} {"train_loss": -28.024768829345703, "global_step": 568440, "epoch": 6848} {"train_loss": -28.029590606689453, "global_step": 568441, "epoch": 6848} {"train_loss": -27.792768478393555, "global_step": 568442, "epoch": 6848} {"train_loss": -28.376815795898438, "global_step": 568443, "epoch": 6848} {"train_loss": -28.381500244140625, "global_step": 568444, "epoch": 6848} {"train_loss": -28.197935104370117, "global_step": 568445, "epoch": 6848} {"train_loss": -27.992090225219727, "global_step": 568446, "epoch": 6848} {"train_loss": -27.824909210205078, "global_step": 568447, "epoch": 6848} {"train_loss": -28.110471725463867, "global_step": 568448, "epoch": 6848} {"train_loss": -27.692764282226562, "global_step": 568449, "epoch": 6848} {"train_loss": -27.506977081298828, "global_step": 568450, "epoch": 6848} {"train_loss": -26.979101181030273, "global_step": 568451, "epoch": 6848} {"train_loss": -26.58025550842285, "global_step": 568452, "epoch": 6848} {"train_loss": -26.90964126586914, "global_step": 568453, "epoch": 6848} {"train_loss": -26.774084091186523, "global_step": 568454, "epoch": 6848} {"train_loss": -27.392562866210938, "global_step": 568455, "epoch": 6848} {"train_loss": -27.618637084960938, "global_step": 568456, "epoch": 6848} {"train_loss": -27.517648696899414, "global_step": 568457, "epoch": 6848} {"train_loss": -27.2449893951416, "global_step": 568458, "epoch": 6848} {"train_loss": -27.363828659057617, "global_step": 568459, "epoch": 6848} {"train_loss": -28.16855812072754, "global_step": 568460, "epoch": 6848} {"train_loss": -27.420806884765625, "global_step": 568461, "epoch": 6848} {"train_loss": -27.794065475463867, "global_step": 568462, "epoch": 6848} {"train_loss": -27.45584487915039, "global_step": 568463, "epoch": 6848} {"train_loss": -27.963245391845703, "global_step": 568464, "epoch": 6848} {"train_loss": -27.152379989624023, "global_step": 568465, "epoch": 6848} {"train_loss": -27.668238099799098, "global_step": 568466, "epoch": 6848, "val_loss": 6658946.0} {"train_loss": -24.216588973999023, "global_step": 568467, "epoch": 6849} {"train_loss": -25.098196029663086, "global_step": 568468, "epoch": 6849} {"train_loss": -26.3289794921875, "global_step": 568469, "epoch": 6849} {"train_loss": -25.644392013549805, "global_step": 568470, "epoch": 6849} {"train_loss": -26.708831787109375, "global_step": 568471, "epoch": 6849} {"train_loss": -25.85993766784668, "global_step": 568472, "epoch": 6849} {"train_loss": -26.3193416595459, "global_step": 568473, "epoch": 6849} {"train_loss": -26.333740234375, "global_step": 568474, "epoch": 6849} {"train_loss": -26.49698829650879, "global_step": 568475, "epoch": 6849} {"train_loss": -26.5402889251709, "global_step": 568476, "epoch": 6849} {"train_loss": -26.553884506225586, "global_step": 568477, "epoch": 6849} {"train_loss": -26.396228790283203, "global_step": 568478, "epoch": 6849} {"train_loss": -26.9094181060791, "global_step": 568479, "epoch": 6849} {"train_loss": -26.85235595703125, "global_step": 568480, "epoch": 6849} {"train_loss": -26.866872787475586, "global_step": 568481, "epoch": 6849} {"train_loss": -27.268701553344727, "global_step": 568482, "epoch": 6849} {"train_loss": -26.934667587280273, "global_step": 568483, "epoch": 6849} {"train_loss": -26.95599937438965, "global_step": 568484, "epoch": 6849} {"train_loss": -27.044708251953125, "global_step": 568485, "epoch": 6849} {"train_loss": -27.4512882232666, "global_step": 568486, "epoch": 6849} {"train_loss": -27.389307022094727, "global_step": 568487, "epoch": 6849} {"train_loss": -26.904767990112305, "global_step": 568488, "epoch": 6849} {"train_loss": -27.54794692993164, "global_step": 568489, "epoch": 6849} {"train_loss": -27.491230010986328, "global_step": 568490, "epoch": 6849} {"train_loss": -27.05573081970215, "global_step": 568491, "epoch": 6849} {"train_loss": -27.029510498046875, "global_step": 568492, "epoch": 6849} {"train_loss": -27.519439697265625, "global_step": 568493, "epoch": 6849} {"train_loss": -27.503589630126953, "global_step": 568494, "epoch": 6849} {"train_loss": -27.581647872924805, "global_step": 568495, "epoch": 6849} {"train_loss": -27.855579376220703, "global_step": 568496, "epoch": 6849} {"train_loss": -27.536331176757812, "global_step": 568497, "epoch": 6849} {"train_loss": -27.57794189453125, "global_step": 568498, "epoch": 6849} {"train_loss": -27.63852310180664, "global_step": 568499, "epoch": 6849} {"train_loss": -27.978757858276367, "global_step": 568500, "epoch": 6849} {"train_loss": -27.41694450378418, "global_step": 568501, "epoch": 6849} {"train_loss": -27.653539657592773, "global_step": 568502, "epoch": 6849} {"train_loss": -27.414655685424805, "global_step": 568503, "epoch": 6849} {"train_loss": -28.054731369018555, "global_step": 568504, "epoch": 6849} {"train_loss": -27.99610710144043, "global_step": 568505, "epoch": 6849} {"train_loss": -27.8724422454834, "global_step": 568506, "epoch": 6849} {"train_loss": -27.803394317626953, "global_step": 568507, "epoch": 6849} {"train_loss": -27.557865142822266, "global_step": 568508, "epoch": 6849} {"train_loss": -27.71969985961914, "global_step": 568509, "epoch": 6849} {"train_loss": -28.15022087097168, "global_step": 568510, "epoch": 6849} {"train_loss": -27.41131591796875, "global_step": 568511, "epoch": 6849} {"train_loss": -27.9212589263916, "global_step": 568512, "epoch": 6849} {"train_loss": -27.579557418823242, "global_step": 568513, "epoch": 6849} {"train_loss": -27.9639892578125, "global_step": 568514, "epoch": 6849} {"train_loss": -27.606210708618164, "global_step": 568515, "epoch": 6849} {"train_loss": -27.85878562927246, "global_step": 568516, "epoch": 6849} {"train_loss": -27.7584228515625, "global_step": 568517, "epoch": 6849} {"train_loss": -28.001386642456055, "global_step": 568518, "epoch": 6849} {"train_loss": -27.825788497924805, "global_step": 568519, "epoch": 6849} {"train_loss": -28.039392471313477, "global_step": 568520, "epoch": 6849} {"train_loss": -27.851181030273438, "global_step": 568521, "epoch": 6849} {"train_loss": -27.76234245300293, "global_step": 568522, "epoch": 6849} {"train_loss": -27.993499755859375, "global_step": 568523, "epoch": 6849} {"train_loss": -27.788867950439453, "global_step": 568524, "epoch": 6849} {"train_loss": -28.161169052124023, "global_step": 568525, "epoch": 6849} {"train_loss": -27.913663864135742, "global_step": 568526, "epoch": 6849} {"train_loss": -27.87885093688965, "global_step": 568527, "epoch": 6849} {"train_loss": -28.03900146484375, "global_step": 568528, "epoch": 6849} {"train_loss": -28.218168258666992, "global_step": 568529, "epoch": 6849} {"train_loss": -27.843830108642578, "global_step": 568530, "epoch": 6849} {"train_loss": -28.000600814819336, "global_step": 568531, "epoch": 6849} {"train_loss": -27.838916778564453, "global_step": 568532, "epoch": 6849} {"train_loss": -27.814481735229492, "global_step": 568533, "epoch": 6849} {"train_loss": -27.61262321472168, "global_step": 568534, "epoch": 6849} {"train_loss": -27.846532821655273, "global_step": 568535, "epoch": 6849} {"train_loss": -27.90987205505371, "global_step": 568536, "epoch": 6849} {"train_loss": -27.996429443359375, "global_step": 568537, "epoch": 6849} {"train_loss": -27.5482234954834, "global_step": 568538, "epoch": 6849} {"train_loss": -27.40553092956543, "global_step": 568539, "epoch": 6849} {"train_loss": -27.24558448791504, "global_step": 568540, "epoch": 6849} {"train_loss": -27.674360275268555, "global_step": 568541, "epoch": 6849} {"train_loss": -27.97920036315918, "global_step": 568542, "epoch": 6849} {"train_loss": -27.55759620666504, "global_step": 568543, "epoch": 6849} {"train_loss": -27.449888229370117, "global_step": 568544, "epoch": 6849} {"train_loss": -27.895904541015625, "global_step": 568545, "epoch": 6849} {"train_loss": -27.54152488708496, "global_step": 568546, "epoch": 6849} {"train_loss": -27.715545654296875, "global_step": 568547, "epoch": 6849} {"train_loss": -27.661054611206055, "global_step": 568548, "epoch": 6849} {"train_loss": -27.418318507183027, "global_step": 568549, "epoch": 6849, "val_loss": 6685840.0} {"train_loss": -27.708057403564453, "global_step": 568550, "epoch": 6850} {"train_loss": -27.923221588134766, "global_step": 568551, "epoch": 6850} {"train_loss": -27.54840660095215, "global_step": 568552, "epoch": 6850} {"train_loss": -27.679187774658203, "global_step": 568553, "epoch": 6850} {"train_loss": -27.327863693237305, "global_step": 568554, "epoch": 6850} {"train_loss": -27.7816162109375, "global_step": 568555, "epoch": 6850} {"train_loss": -27.83510398864746, "global_step": 568556, "epoch": 6850} {"train_loss": -27.628061294555664, "global_step": 568557, "epoch": 6850} {"train_loss": -27.69829750061035, "global_step": 568558, "epoch": 6850} {"train_loss": -27.557458877563477, "global_step": 568559, "epoch": 6850} {"train_loss": -27.481674194335938, "global_step": 568560, "epoch": 6850} {"train_loss": -27.73590087890625, "global_step": 568561, "epoch": 6850} {"train_loss": -27.767587661743164, "global_step": 568562, "epoch": 6850} {"train_loss": -27.5164794921875, "global_step": 568563, "epoch": 6850} {"train_loss": -27.854516983032227, "global_step": 568564, "epoch": 6850} {"train_loss": -27.79096794128418, "global_step": 568565, "epoch": 6850} {"train_loss": -27.760700225830078, "global_step": 568566, "epoch": 6850} {"train_loss": -27.735431671142578, "global_step": 568567, "epoch": 6850} {"train_loss": -28.080957412719727, "global_step": 568568, "epoch": 6850} {"train_loss": -27.22136878967285, "global_step": 568569, "epoch": 6850} {"train_loss": -28.082672119140625, "global_step": 568570, "epoch": 6850} {"train_loss": -27.51141357421875, "global_step": 568571, "epoch": 6850} {"train_loss": -27.492887496948242, "global_step": 568572, "epoch": 6850} {"train_loss": -27.709806442260742, "global_step": 568573, "epoch": 6850} {"train_loss": -28.106367111206055, "global_step": 568574, "epoch": 6850} {"train_loss": -28.0562686920166, "global_step": 568575, "epoch": 6850} {"train_loss": -27.758508682250977, "global_step": 568576, "epoch": 6850} {"train_loss": -27.71811866760254, "global_step": 568577, "epoch": 6850} {"train_loss": -27.731664657592773, "global_step": 568578, "epoch": 6850} {"train_loss": -27.42486572265625, "global_step": 568579, "epoch": 6850} {"train_loss": -27.98196792602539, "global_step": 568580, "epoch": 6850} {"train_loss": -28.0418701171875, "global_step": 568581, "epoch": 6850} {"train_loss": -27.740325927734375, "global_step": 568582, "epoch": 6850} {"train_loss": -27.620819091796875, "global_step": 568583, "epoch": 6850} {"train_loss": -27.851301193237305, "global_step": 568584, "epoch": 6850} {"train_loss": -27.839893341064453, "global_step": 568585, "epoch": 6850} {"train_loss": -28.2242374420166, "global_step": 568586, "epoch": 6850} {"train_loss": -28.0255069732666, "global_step": 568587, "epoch": 6850} {"train_loss": -27.868818283081055, "global_step": 568588, "epoch": 6850} {"train_loss": -28.08201026916504, "global_step": 568589, "epoch": 6850} {"train_loss": -27.8590030670166, "global_step": 568590, "epoch": 6850} {"train_loss": -28.263830184936523, "global_step": 568591, "epoch": 6850} {"train_loss": -27.82355308532715, "global_step": 568592, "epoch": 6850} {"train_loss": -27.9818172454834, "global_step": 568593, "epoch": 6850} {"train_loss": -28.003103256225586, "global_step": 568594, "epoch": 6850} {"train_loss": -27.88334083557129, "global_step": 568595, "epoch": 6850} {"train_loss": -27.80588722229004, "global_step": 568596, "epoch": 6850} {"train_loss": -27.66912841796875, "global_step": 568597, "epoch": 6850} {"train_loss": -28.016498565673828, "global_step": 568598, "epoch": 6850} {"train_loss": -27.881277084350586, "global_step": 568599, "epoch": 6850} {"train_loss": -27.7707576751709, "global_step": 568600, "epoch": 6850} {"train_loss": -27.659204483032227, "global_step": 568601, "epoch": 6850} {"train_loss": -27.709457397460938, "global_step": 568602, "epoch": 6850} {"train_loss": -28.29339027404785, "global_step": 568603, "epoch": 6850} {"train_loss": -28.12375259399414, "global_step": 568604, "epoch": 6850} {"train_loss": -27.6541748046875, "global_step": 568605, "epoch": 6850} {"train_loss": -27.747467041015625, "global_step": 568606, "epoch": 6850} {"train_loss": -27.858230590820312, "global_step": 568607, "epoch": 6850} {"train_loss": -27.830305099487305, "global_step": 568608, "epoch": 6850} {"train_loss": -27.932144165039062, "global_step": 568609, "epoch": 6850} {"train_loss": -28.056127548217773, "global_step": 568610, "epoch": 6850} {"train_loss": -28.01340103149414, "global_step": 568611, "epoch": 6850} {"train_loss": -27.6920223236084, "global_step": 568612, "epoch": 6850} {"train_loss": -28.067453384399414, "global_step": 568613, "epoch": 6850} {"train_loss": -27.885461807250977, "global_step": 568614, "epoch": 6850} {"train_loss": -27.92496109008789, "global_step": 568615, "epoch": 6850} {"train_loss": -27.938573837280273, "global_step": 568616, "epoch": 6850} {"train_loss": -27.633054733276367, "global_step": 568617, "epoch": 6850} {"train_loss": -27.749908447265625, "global_step": 568618, "epoch": 6850} {"train_loss": -27.80439567565918, "global_step": 568619, "epoch": 6850} {"train_loss": -28.148345947265625, "global_step": 568620, "epoch": 6850} {"train_loss": -28.214111328125, "global_step": 568621, "epoch": 6850} {"train_loss": -28.210119247436523, "global_step": 568622, "epoch": 6850} {"train_loss": -27.97629165649414, "global_step": 568623, "epoch": 6850} {"train_loss": -28.040334701538086, "global_step": 568624, "epoch": 6850} {"train_loss": -27.988447189331055, "global_step": 568625, "epoch": 6850} {"train_loss": -27.6965274810791, "global_step": 568626, "epoch": 6850} {"train_loss": -27.511579513549805, "global_step": 568627, "epoch": 6850} {"train_loss": -27.64578628540039, "global_step": 568628, "epoch": 6850} {"train_loss": -27.32427978515625, "global_step": 568629, "epoch": 6850} {"train_loss": -28.151569366455078, "global_step": 568630, "epoch": 6850} {"train_loss": -27.713102340698242, "global_step": 568631, "epoch": 6850} {"train_loss": -27.836634923176593, "global_step": 568632, "epoch": 6850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8181818181818182, "val_loss": 6652827.0} {"train_loss": -26.345111846923828, "global_step": 568633, "epoch": 6851} {"train_loss": -24.284406661987305, "global_step": 568634, "epoch": 6851} {"train_loss": -26.04192543029785, "global_step": 568635, "epoch": 6851} {"train_loss": -25.020631790161133, "global_step": 568636, "epoch": 6851} {"train_loss": -26.666440963745117, "global_step": 568637, "epoch": 6851} {"train_loss": -25.7354679107666, "global_step": 568638, "epoch": 6851} {"train_loss": -26.438261032104492, "global_step": 568639, "epoch": 6851} {"train_loss": -26.118986129760742, "global_step": 568640, "epoch": 6851} {"train_loss": -26.682676315307617, "global_step": 568641, "epoch": 6851} {"train_loss": -26.5051326751709, "global_step": 568642, "epoch": 6851} {"train_loss": -26.766157150268555, "global_step": 568643, "epoch": 6851} {"train_loss": -26.364643096923828, "global_step": 568644, "epoch": 6851} {"train_loss": -26.77503776550293, "global_step": 568645, "epoch": 6851} {"train_loss": -26.9785213470459, "global_step": 568646, "epoch": 6851} {"train_loss": -27.091506958007812, "global_step": 568647, "epoch": 6851} {"train_loss": -26.75444984436035, "global_step": 568648, "epoch": 6851} {"train_loss": -27.15216636657715, "global_step": 568649, "epoch": 6851} {"train_loss": -27.189105987548828, "global_step": 568650, "epoch": 6851} {"train_loss": -26.848297119140625, "global_step": 568651, "epoch": 6851} {"train_loss": -27.021753311157227, "global_step": 568652, "epoch": 6851} {"train_loss": -27.008472442626953, "global_step": 568653, "epoch": 6851} {"train_loss": -27.413028717041016, "global_step": 568654, "epoch": 6851} {"train_loss": -26.997364044189453, "global_step": 568655, "epoch": 6851} {"train_loss": -27.094266891479492, "global_step": 568656, "epoch": 6851} {"train_loss": -27.160114288330078, "global_step": 568657, "epoch": 6851} {"train_loss": -27.34714698791504, "global_step": 568658, "epoch": 6851} {"train_loss": -27.310998916625977, "global_step": 568659, "epoch": 6851} {"train_loss": -27.51447105407715, "global_step": 568660, "epoch": 6851} {"train_loss": -27.48996925354004, "global_step": 568661, "epoch": 6851} {"train_loss": -27.808719635009766, "global_step": 568662, "epoch": 6851} {"train_loss": -27.728870391845703, "global_step": 568663, "epoch": 6851} {"train_loss": -27.281665802001953, "global_step": 568664, "epoch": 6851} {"train_loss": -27.242359161376953, "global_step": 568665, "epoch": 6851} {"train_loss": -27.466501235961914, "global_step": 568666, "epoch": 6851} {"train_loss": -27.574914932250977, "global_step": 568667, "epoch": 6851} {"train_loss": -27.43842887878418, "global_step": 568668, "epoch": 6851} {"train_loss": -27.447235107421875, "global_step": 568669, "epoch": 6851} {"train_loss": -27.78937339782715, "global_step": 568670, "epoch": 6851} {"train_loss": -27.28144645690918, "global_step": 568671, "epoch": 6851} {"train_loss": -27.31827163696289, "global_step": 568672, "epoch": 6851} {"train_loss": -27.735219955444336, "global_step": 568673, "epoch": 6851} {"train_loss": -27.503814697265625, "global_step": 568674, "epoch": 6851} {"train_loss": -27.733251571655273, "global_step": 568675, "epoch": 6851} {"train_loss": -27.79718589782715, "global_step": 568676, "epoch": 6851} {"train_loss": -27.77387809753418, "global_step": 568677, "epoch": 6851} {"train_loss": -27.849380493164062, "global_step": 568678, "epoch": 6851} {"train_loss": -27.86956214904785, "global_step": 568679, "epoch": 6851} {"train_loss": -27.982624053955078, "global_step": 568680, "epoch": 6851} {"train_loss": -27.896656036376953, "global_step": 568681, "epoch": 6851} {"train_loss": -27.728376388549805, "global_step": 568682, "epoch": 6851} {"train_loss": -27.623611450195312, "global_step": 568683, "epoch": 6851} {"train_loss": -27.55780601501465, "global_step": 568684, "epoch": 6851} {"train_loss": -27.9930419921875, "global_step": 568685, "epoch": 6851} {"train_loss": -27.882308959960938, "global_step": 568686, "epoch": 6851} {"train_loss": -28.07659339904785, "global_step": 568687, "epoch": 6851} {"train_loss": -28.047605514526367, "global_step": 568688, "epoch": 6851} {"train_loss": -27.94855308532715, "global_step": 568689, "epoch": 6851} {"train_loss": -28.0208740234375, "global_step": 568690, "epoch": 6851} {"train_loss": -27.895917892456055, "global_step": 568691, "epoch": 6851} {"train_loss": -28.074878692626953, "global_step": 568692, "epoch": 6851} {"train_loss": -27.835590362548828, "global_step": 568693, "epoch": 6851} {"train_loss": -28.02570152282715, "global_step": 568694, "epoch": 6851} {"train_loss": -27.76434898376465, "global_step": 568695, "epoch": 6851} {"train_loss": -28.149377822875977, "global_step": 568696, "epoch": 6851} {"train_loss": -28.155675888061523, "global_step": 568697, "epoch": 6851} {"train_loss": -28.565982818603516, "global_step": 568698, "epoch": 6851} {"train_loss": -28.175878524780273, "global_step": 568699, "epoch": 6851} {"train_loss": -27.987899780273438, "global_step": 568700, "epoch": 6851} {"train_loss": -28.10420036315918, "global_step": 568701, "epoch": 6851} {"train_loss": -28.219751358032227, "global_step": 568702, "epoch": 6851} {"train_loss": -28.24237632751465, "global_step": 568703, "epoch": 6851} {"train_loss": -28.144546508789062, "global_step": 568704, "epoch": 6851} {"train_loss": -28.0170955657959, "global_step": 568705, "epoch": 6851} {"train_loss": -27.823917388916016, "global_step": 568706, "epoch": 6851} {"train_loss": -28.303985595703125, "global_step": 568707, "epoch": 6851} {"train_loss": -28.027389526367188, "global_step": 568708, "epoch": 6851} {"train_loss": -27.83274269104004, "global_step": 568709, "epoch": 6851} {"train_loss": -27.662179946899414, "global_step": 568710, "epoch": 6851} {"train_loss": -27.284032821655273, "global_step": 568711, "epoch": 6851} {"train_loss": -26.16806983947754, "global_step": 568712, "epoch": 6851} {"train_loss": -25.059019088745117, "global_step": 568713, "epoch": 6851} {"train_loss": -24.796533584594727, "global_step": 568714, "epoch": 6851} {"train_loss": -27.340668368052288, "global_step": 568715, "epoch": 6851, "val_loss": 6676198.0} {"train_loss": -24.533279418945312, "global_step": 568716, "epoch": 6852} {"train_loss": -25.37824821472168, "global_step": 568717, "epoch": 6852} {"train_loss": -25.429222106933594, "global_step": 568718, "epoch": 6852} {"train_loss": -25.9729061126709, "global_step": 568719, "epoch": 6852} {"train_loss": -25.1629695892334, "global_step": 568720, "epoch": 6852} {"train_loss": -25.994184494018555, "global_step": 568721, "epoch": 6852} {"train_loss": -26.432205200195312, "global_step": 568722, "epoch": 6852} {"train_loss": -26.033994674682617, "global_step": 568723, "epoch": 6852} {"train_loss": -26.17352867126465, "global_step": 568724, "epoch": 6852} {"train_loss": -26.186628341674805, "global_step": 568725, "epoch": 6852} {"train_loss": -26.81882095336914, "global_step": 568726, "epoch": 6852} {"train_loss": -26.3640079498291, "global_step": 568727, "epoch": 6852} {"train_loss": -26.39143943786621, "global_step": 568728, "epoch": 6852} {"train_loss": -27.12652015686035, "global_step": 568729, "epoch": 6852} {"train_loss": -26.444021224975586, "global_step": 568730, "epoch": 6852} {"train_loss": -26.848468780517578, "global_step": 568731, "epoch": 6852} {"train_loss": -26.729761123657227, "global_step": 568732, "epoch": 6852} {"train_loss": -27.0743465423584, "global_step": 568733, "epoch": 6852} {"train_loss": -26.937414169311523, "global_step": 568734, "epoch": 6852} {"train_loss": -26.888477325439453, "global_step": 568735, "epoch": 6852} {"train_loss": -26.784137725830078, "global_step": 568736, "epoch": 6852} {"train_loss": -27.147750854492188, "global_step": 568737, "epoch": 6852} {"train_loss": -26.934309005737305, "global_step": 568738, "epoch": 6852} {"train_loss": -26.793256759643555, "global_step": 568739, "epoch": 6852} {"train_loss": -27.077957153320312, "global_step": 568740, "epoch": 6852} {"train_loss": -27.10837173461914, "global_step": 568741, "epoch": 6852} {"train_loss": -27.371265411376953, "global_step": 568742, "epoch": 6852} {"train_loss": -27.139896392822266, "global_step": 568743, "epoch": 6852} {"train_loss": -27.588674545288086, "global_step": 568744, "epoch": 6852} {"train_loss": -27.022729873657227, "global_step": 568745, "epoch": 6852} {"train_loss": -27.30756950378418, "global_step": 568746, "epoch": 6852} {"train_loss": -27.2779598236084, "global_step": 568747, "epoch": 6852} {"train_loss": -27.190134048461914, "global_step": 568748, "epoch": 6852} {"train_loss": -27.55680274963379, "global_step": 568749, "epoch": 6852} {"train_loss": -27.443073272705078, "global_step": 568750, "epoch": 6852} {"train_loss": -27.295862197875977, "global_step": 568751, "epoch": 6852} {"train_loss": -27.722583770751953, "global_step": 568752, "epoch": 6852} {"train_loss": -27.74527359008789, "global_step": 568753, "epoch": 6852} {"train_loss": -27.53748893737793, "global_step": 568754, "epoch": 6852} {"train_loss": -27.641448974609375, "global_step": 568755, "epoch": 6852} {"train_loss": -28.055280685424805, "global_step": 568756, "epoch": 6852} {"train_loss": -27.701459884643555, "global_step": 568757, "epoch": 6852} {"train_loss": -28.036054611206055, "global_step": 568758, "epoch": 6852} {"train_loss": -27.940759658813477, "global_step": 568759, "epoch": 6852} {"train_loss": -27.798490524291992, "global_step": 568760, "epoch": 6852} {"train_loss": -27.8901424407959, "global_step": 568761, "epoch": 6852} {"train_loss": -27.81247329711914, "global_step": 568762, "epoch": 6852} {"train_loss": -27.774383544921875, "global_step": 568763, "epoch": 6852} {"train_loss": -27.9053897857666, "global_step": 568764, "epoch": 6852} {"train_loss": -27.87664222717285, "global_step": 568765, "epoch": 6852} {"train_loss": -27.711252212524414, "global_step": 568766, "epoch": 6852} {"train_loss": -27.74269676208496, "global_step": 568767, "epoch": 6852} {"train_loss": -27.797992706298828, "global_step": 568768, "epoch": 6852} {"train_loss": -27.736652374267578, "global_step": 568769, "epoch": 6852} {"train_loss": -27.715009689331055, "global_step": 568770, "epoch": 6852} {"train_loss": -27.566049575805664, "global_step": 568771, "epoch": 6852} {"train_loss": -27.896650314331055, "global_step": 568772, "epoch": 6852} {"train_loss": -27.688552856445312, "global_step": 568773, "epoch": 6852} {"train_loss": -27.486907958984375, "global_step": 568774, "epoch": 6852} {"train_loss": -27.605321884155273, "global_step": 568775, "epoch": 6852} {"train_loss": -27.486143112182617, "global_step": 568776, "epoch": 6852} {"train_loss": -28.100126266479492, "global_step": 568777, "epoch": 6852} {"train_loss": -27.835371017456055, "global_step": 568778, "epoch": 6852} {"train_loss": -27.642587661743164, "global_step": 568779, "epoch": 6852} {"train_loss": -27.886869430541992, "global_step": 568780, "epoch": 6852} {"train_loss": -28.07568359375, "global_step": 568781, "epoch": 6852} {"train_loss": -27.780750274658203, "global_step": 568782, "epoch": 6852} {"train_loss": -28.21417236328125, "global_step": 568783, "epoch": 6852} {"train_loss": -28.13864517211914, "global_step": 568784, "epoch": 6852} {"train_loss": -27.987812042236328, "global_step": 568785, "epoch": 6852} {"train_loss": -27.85921287536621, "global_step": 568786, "epoch": 6852} {"train_loss": -28.003355026245117, "global_step": 568787, "epoch": 6852} {"train_loss": -27.81964683532715, "global_step": 568788, "epoch": 6852} {"train_loss": -27.799291610717773, "global_step": 568789, "epoch": 6852} {"train_loss": -28.02216148376465, "global_step": 568790, "epoch": 6852} {"train_loss": -27.804304122924805, "global_step": 568791, "epoch": 6852} {"train_loss": -27.800012588500977, "global_step": 568792, "epoch": 6852} {"train_loss": -27.650800704956055, "global_step": 568793, "epoch": 6852} {"train_loss": -27.69476318359375, "global_step": 568794, "epoch": 6852} {"train_loss": -28.140396118164062, "global_step": 568795, "epoch": 6852} {"train_loss": -27.845056533813477, "global_step": 568796, "epoch": 6852} {"train_loss": -27.70496940612793, "global_step": 568797, "epoch": 6852} {"train_loss": -27.296064606632093, "global_step": 568798, "epoch": 6852, "val_loss": 6609975.0} {"train_loss": -26.899072647094727, "global_step": 568799, "epoch": 6853} {"train_loss": -27.433399200439453, "global_step": 568800, "epoch": 6853} {"train_loss": -27.14862632751465, "global_step": 568801, "epoch": 6853} {"train_loss": -27.345483779907227, "global_step": 568802, "epoch": 6853} {"train_loss": -27.75931739807129, "global_step": 568803, "epoch": 6853} {"train_loss": -27.552234649658203, "global_step": 568804, "epoch": 6853} {"train_loss": -27.289907455444336, "global_step": 568805, "epoch": 6853} {"train_loss": -27.113943099975586, "global_step": 568806, "epoch": 6853} {"train_loss": -27.512638092041016, "global_step": 568807, "epoch": 6853} {"train_loss": -27.2157039642334, "global_step": 568808, "epoch": 6853} {"train_loss": -27.48126792907715, "global_step": 568809, "epoch": 6853} {"train_loss": -27.581640243530273, "global_step": 568810, "epoch": 6853} {"train_loss": -27.531909942626953, "global_step": 568811, "epoch": 6853} {"train_loss": -27.347492218017578, "global_step": 568812, "epoch": 6853} {"train_loss": -27.68311882019043, "global_step": 568813, "epoch": 6853} {"train_loss": -27.63035011291504, "global_step": 568814, "epoch": 6853} {"train_loss": -27.662961959838867, "global_step": 568815, "epoch": 6853} {"train_loss": -27.41925621032715, "global_step": 568816, "epoch": 6853} {"train_loss": -27.815902709960938, "global_step": 568817, "epoch": 6853} {"train_loss": -27.71407127380371, "global_step": 568818, "epoch": 6853} {"train_loss": -27.684192657470703, "global_step": 568819, "epoch": 6853} {"train_loss": -27.711252212524414, "global_step": 568820, "epoch": 6853} {"train_loss": -28.07511329650879, "global_step": 568821, "epoch": 6853} {"train_loss": -28.026458740234375, "global_step": 568822, "epoch": 6853} {"train_loss": -27.620380401611328, "global_step": 568823, "epoch": 6853} {"train_loss": -27.949634552001953, "global_step": 568824, "epoch": 6853} {"train_loss": -27.732202529907227, "global_step": 568825, "epoch": 6853} {"train_loss": -27.79508399963379, "global_step": 568826, "epoch": 6853} {"train_loss": -27.916852951049805, "global_step": 568827, "epoch": 6853} {"train_loss": -28.21323585510254, "global_step": 568828, "epoch": 6853} {"train_loss": -28.089508056640625, "global_step": 568829, "epoch": 6853} {"train_loss": -28.215139389038086, "global_step": 568830, "epoch": 6853} {"train_loss": -27.94239616394043, "global_step": 568831, "epoch": 6853} {"train_loss": -28.052778244018555, "global_step": 568832, "epoch": 6853} {"train_loss": -28.092313766479492, "global_step": 568833, "epoch": 6853} {"train_loss": -28.00715446472168, "global_step": 568834, "epoch": 6853} {"train_loss": -27.840539932250977, "global_step": 568835, "epoch": 6853} {"train_loss": -27.92396354675293, "global_step": 568836, "epoch": 6853} {"train_loss": -27.77325439453125, "global_step": 568837, "epoch": 6853} {"train_loss": -28.18674659729004, "global_step": 568838, "epoch": 6853} {"train_loss": -28.027692794799805, "global_step": 568839, "epoch": 6853} {"train_loss": -28.096487045288086, "global_step": 568840, "epoch": 6853} {"train_loss": -27.9739990234375, "global_step": 568841, "epoch": 6853} {"train_loss": -27.7861328125, "global_step": 568842, "epoch": 6853} {"train_loss": -27.910200119018555, "global_step": 568843, "epoch": 6853} {"train_loss": -28.416589736938477, "global_step": 568844, "epoch": 6853} {"train_loss": -27.820465087890625, "global_step": 568845, "epoch": 6853} {"train_loss": -27.94858741760254, "global_step": 568846, "epoch": 6853} {"train_loss": -27.8920955657959, "global_step": 568847, "epoch": 6853} {"train_loss": -27.53729820251465, "global_step": 568848, "epoch": 6853} {"train_loss": -27.245893478393555, "global_step": 568849, "epoch": 6853} {"train_loss": -27.762714385986328, "global_step": 568850, "epoch": 6853} {"train_loss": -27.886077880859375, "global_step": 568851, "epoch": 6853} {"train_loss": -28.092870712280273, "global_step": 568852, "epoch": 6853} {"train_loss": -27.995126724243164, "global_step": 568853, "epoch": 6853} {"train_loss": -27.89395523071289, "global_step": 568854, "epoch": 6853} {"train_loss": -28.163488388061523, "global_step": 568855, "epoch": 6853} {"train_loss": -27.9713134765625, "global_step": 568856, "epoch": 6853} {"train_loss": -28.094573974609375, "global_step": 568857, "epoch": 6853} {"train_loss": -27.92547035217285, "global_step": 568858, "epoch": 6853} {"train_loss": -27.568500518798828, "global_step": 568859, "epoch": 6853} {"train_loss": -28.04254150390625, "global_step": 568860, "epoch": 6853} {"train_loss": -28.005056381225586, "global_step": 568861, "epoch": 6853} {"train_loss": -27.83978271484375, "global_step": 568862, "epoch": 6853} {"train_loss": -27.855634689331055, "global_step": 568863, "epoch": 6853} {"train_loss": -27.93170738220215, "global_step": 568864, "epoch": 6853} {"train_loss": -27.93912696838379, "global_step": 568865, "epoch": 6853} {"train_loss": -28.25605583190918, "global_step": 568866, "epoch": 6853} {"train_loss": -27.96710205078125, "global_step": 568867, "epoch": 6853} {"train_loss": -27.805877685546875, "global_step": 568868, "epoch": 6853} {"train_loss": -27.921579360961914, "global_step": 568869, "epoch": 6853} {"train_loss": -27.8990421295166, "global_step": 568870, "epoch": 6853} {"train_loss": -28.033533096313477, "global_step": 568871, "epoch": 6853} {"train_loss": -28.167312622070312, "global_step": 568872, "epoch": 6853} {"train_loss": -27.94771385192871, "global_step": 568873, "epoch": 6853} {"train_loss": -28.362951278686523, "global_step": 568874, "epoch": 6853} {"train_loss": -27.9683895111084, "global_step": 568875, "epoch": 6853} {"train_loss": -28.019269943237305, "global_step": 568876, "epoch": 6853} {"train_loss": -27.754270553588867, "global_step": 568877, "epoch": 6853} {"train_loss": -27.541641235351562, "global_step": 568878, "epoch": 6853} {"train_loss": -27.892292022705078, "global_step": 568879, "epoch": 6853} {"train_loss": -28.07441520690918, "global_step": 568880, "epoch": 6853} {"train_loss": -27.826999066823937, "global_step": 568881, "epoch": 6853, "val_loss": 6677800.0} {"train_loss": -26.744098663330078, "global_step": 568882, "epoch": 6854} {"train_loss": -25.9193115234375, "global_step": 568883, "epoch": 6854} {"train_loss": -25.9882869720459, "global_step": 568884, "epoch": 6854} {"train_loss": -26.83371925354004, "global_step": 568885, "epoch": 6854} {"train_loss": -26.799274444580078, "global_step": 568886, "epoch": 6854} {"train_loss": -26.471302032470703, "global_step": 568887, "epoch": 6854} {"train_loss": -26.8701229095459, "global_step": 568888, "epoch": 6854} {"train_loss": -26.31727409362793, "global_step": 568889, "epoch": 6854} {"train_loss": -26.838668823242188, "global_step": 568890, "epoch": 6854} {"train_loss": -26.775959014892578, "global_step": 568891, "epoch": 6854} {"train_loss": -27.054214477539062, "global_step": 568892, "epoch": 6854} {"train_loss": -27.0406551361084, "global_step": 568893, "epoch": 6854} {"train_loss": -27.214731216430664, "global_step": 568894, "epoch": 6854} {"train_loss": -26.7580509185791, "global_step": 568895, "epoch": 6854} {"train_loss": -27.207382202148438, "global_step": 568896, "epoch": 6854} {"train_loss": -27.38026237487793, "global_step": 568897, "epoch": 6854} {"train_loss": -27.390356063842773, "global_step": 568898, "epoch": 6854} {"train_loss": -27.3902645111084, "global_step": 568899, "epoch": 6854} {"train_loss": -27.286462783813477, "global_step": 568900, "epoch": 6854} {"train_loss": -27.618406295776367, "global_step": 568901, "epoch": 6854} {"train_loss": -27.430206298828125, "global_step": 568902, "epoch": 6854} {"train_loss": -27.279876708984375, "global_step": 568903, "epoch": 6854} {"train_loss": -27.63895606994629, "global_step": 568904, "epoch": 6854} {"train_loss": -27.531213760375977, "global_step": 568905, "epoch": 6854} {"train_loss": -27.7233829498291, "global_step": 568906, "epoch": 6854} {"train_loss": -27.651763916015625, "global_step": 568907, "epoch": 6854} {"train_loss": -27.219701766967773, "global_step": 568908, "epoch": 6854} {"train_loss": -27.6734619140625, "global_step": 568909, "epoch": 6854} {"train_loss": -27.649946212768555, "global_step": 568910, "epoch": 6854} {"train_loss": -27.86549949645996, "global_step": 568911, "epoch": 6854} {"train_loss": -27.67645835876465, "global_step": 568912, "epoch": 6854} {"train_loss": -27.54891014099121, "global_step": 568913, "epoch": 6854} {"train_loss": -27.867456436157227, "global_step": 568914, "epoch": 6854} {"train_loss": -28.351062774658203, "global_step": 568915, "epoch": 6854} {"train_loss": -27.946409225463867, "global_step": 568916, "epoch": 6854} {"train_loss": -27.87074851989746, "global_step": 568917, "epoch": 6854} {"train_loss": -27.62799644470215, "global_step": 568918, "epoch": 6854} {"train_loss": -27.510034561157227, "global_step": 568919, "epoch": 6854} {"train_loss": -27.871198654174805, "global_step": 568920, "epoch": 6854} {"train_loss": -27.921268463134766, "global_step": 568921, "epoch": 6854} {"train_loss": -28.02199363708496, "global_step": 568922, "epoch": 6854} {"train_loss": -27.611066818237305, "global_step": 568923, "epoch": 6854} {"train_loss": -28.2427921295166, "global_step": 568924, "epoch": 6854} {"train_loss": -27.716217041015625, "global_step": 568925, "epoch": 6854} {"train_loss": -27.996091842651367, "global_step": 568926, "epoch": 6854} {"train_loss": -28.08626365661621, "global_step": 568927, "epoch": 6854} {"train_loss": -28.151660919189453, "global_step": 568928, "epoch": 6854} {"train_loss": -27.764801025390625, "global_step": 568929, "epoch": 6854} {"train_loss": -28.24879264831543, "global_step": 568930, "epoch": 6854} {"train_loss": -27.591760635375977, "global_step": 568931, "epoch": 6854} {"train_loss": -27.932601928710938, "global_step": 568932, "epoch": 6854} {"train_loss": -27.507471084594727, "global_step": 568933, "epoch": 6854} {"train_loss": -28.107303619384766, "global_step": 568934, "epoch": 6854} {"train_loss": -28.150043487548828, "global_step": 568935, "epoch": 6854} {"train_loss": -28.14957618713379, "global_step": 568936, "epoch": 6854} {"train_loss": -27.885679244995117, "global_step": 568937, "epoch": 6854} {"train_loss": -28.228483200073242, "global_step": 568938, "epoch": 6854} {"train_loss": -27.83856201171875, "global_step": 568939, "epoch": 6854} {"train_loss": -27.841825485229492, "global_step": 568940, "epoch": 6854} {"train_loss": -28.080469131469727, "global_step": 568941, "epoch": 6854} {"train_loss": -27.97071647644043, "global_step": 568942, "epoch": 6854} {"train_loss": -27.807584762573242, "global_step": 568943, "epoch": 6854} {"train_loss": -27.8461971282959, "global_step": 568944, "epoch": 6854} {"train_loss": -27.851709365844727, "global_step": 568945, "epoch": 6854} {"train_loss": -27.96870994567871, "global_step": 568946, "epoch": 6854} {"train_loss": -27.666614532470703, "global_step": 568947, "epoch": 6854} {"train_loss": -28.268964767456055, "global_step": 568948, "epoch": 6854} {"train_loss": -28.220794677734375, "global_step": 568949, "epoch": 6854} {"train_loss": -27.8548583984375, "global_step": 568950, "epoch": 6854} {"train_loss": -27.792434692382812, "global_step": 568951, "epoch": 6854} {"train_loss": -28.0695743560791, "global_step": 568952, "epoch": 6854} {"train_loss": -28.019208908081055, "global_step": 568953, "epoch": 6854} {"train_loss": -27.86867332458496, "global_step": 568954, "epoch": 6854} {"train_loss": -28.0638370513916, "global_step": 568955, "epoch": 6854} {"train_loss": -28.234943389892578, "global_step": 568956, "epoch": 6854} {"train_loss": -27.977163314819336, "global_step": 568957, "epoch": 6854} {"train_loss": -28.097558975219727, "global_step": 568958, "epoch": 6854} {"train_loss": -28.057092666625977, "global_step": 568959, "epoch": 6854} {"train_loss": -28.145843505859375, "global_step": 568960, "epoch": 6854} {"train_loss": -28.08028221130371, "global_step": 568961, "epoch": 6854} {"train_loss": -28.022302627563477, "global_step": 568962, "epoch": 6854} {"train_loss": -28.071043014526367, "global_step": 568963, "epoch": 6854} {"train_loss": -27.632959595645765, "global_step": 568964, "epoch": 6854, "val_loss": 6664606.0} {"train_loss": -24.511886596679688, "global_step": 568965, "epoch": 6855} {"train_loss": -22.190628051757812, "global_step": 568966, "epoch": 6855} {"train_loss": -23.16460418701172, "global_step": 568967, "epoch": 6855} {"train_loss": -24.440170288085938, "global_step": 568968, "epoch": 6855} {"train_loss": -25.104137420654297, "global_step": 568969, "epoch": 6855} {"train_loss": -26.08002281188965, "global_step": 568970, "epoch": 6855} {"train_loss": -25.316852569580078, "global_step": 568971, "epoch": 6855} {"train_loss": -25.923126220703125, "global_step": 568972, "epoch": 6855} {"train_loss": -26.123254776000977, "global_step": 568973, "epoch": 6855} {"train_loss": -25.761999130249023, "global_step": 568974, "epoch": 6855} {"train_loss": -26.647836685180664, "global_step": 568975, "epoch": 6855} {"train_loss": -26.3740177154541, "global_step": 568976, "epoch": 6855} {"train_loss": -26.532255172729492, "global_step": 568977, "epoch": 6855} {"train_loss": -26.791046142578125, "global_step": 568978, "epoch": 6855} {"train_loss": -26.6455135345459, "global_step": 568979, "epoch": 6855} {"train_loss": -26.726789474487305, "global_step": 568980, "epoch": 6855} {"train_loss": -26.35538673400879, "global_step": 568981, "epoch": 6855} {"train_loss": -26.7005615234375, "global_step": 568982, "epoch": 6855} {"train_loss": -27.21964454650879, "global_step": 568983, "epoch": 6855} {"train_loss": -26.762866973876953, "global_step": 568984, "epoch": 6855} {"train_loss": -26.626264572143555, "global_step": 568985, "epoch": 6855} {"train_loss": -27.07490348815918, "global_step": 568986, "epoch": 6855} {"train_loss": -26.580453872680664, "global_step": 568987, "epoch": 6855} {"train_loss": -26.96712303161621, "global_step": 568988, "epoch": 6855} {"train_loss": -26.938995361328125, "global_step": 568989, "epoch": 6855} {"train_loss": -26.660085678100586, "global_step": 568990, "epoch": 6855} {"train_loss": -27.289052963256836, "global_step": 568991, "epoch": 6855} {"train_loss": -27.14556312561035, "global_step": 568992, "epoch": 6855} {"train_loss": -26.775775909423828, "global_step": 568993, "epoch": 6855} {"train_loss": -27.20948600769043, "global_step": 568994, "epoch": 6855} {"train_loss": -27.514196395874023, "global_step": 568995, "epoch": 6855} {"train_loss": -27.12603759765625, "global_step": 568996, "epoch": 6855} {"train_loss": -27.39967155456543, "global_step": 568997, "epoch": 6855} {"train_loss": -27.380035400390625, "global_step": 568998, "epoch": 6855} {"train_loss": -27.2203369140625, "global_step": 568999, "epoch": 6855} {"train_loss": -27.587493896484375, "global_step": 569000, "epoch": 6855} {"train_loss": -27.492116928100586, "global_step": 569001, "epoch": 6855} {"train_loss": -27.063425064086914, "global_step": 569002, "epoch": 6855} {"train_loss": -27.901504516601562, "global_step": 569003, "epoch": 6855} {"train_loss": -27.672061920166016, "global_step": 569004, "epoch": 6855} {"train_loss": -27.563241958618164, "global_step": 569005, "epoch": 6855} {"train_loss": -27.521615982055664, "global_step": 569006, "epoch": 6855} {"train_loss": -27.510730743408203, "global_step": 569007, "epoch": 6855} {"train_loss": -27.58550453186035, "global_step": 569008, "epoch": 6855} {"train_loss": -27.955322265625, "global_step": 569009, "epoch": 6855} {"train_loss": -27.634387969970703, "global_step": 569010, "epoch": 6855} {"train_loss": -27.6508731842041, "global_step": 569011, "epoch": 6855} {"train_loss": -28.04376220703125, "global_step": 569012, "epoch": 6855} {"train_loss": -28.206384658813477, "global_step": 569013, "epoch": 6855} {"train_loss": -27.8546085357666, "global_step": 569014, "epoch": 6855} {"train_loss": -27.54570960998535, "global_step": 569015, "epoch": 6855} {"train_loss": -27.9476375579834, "global_step": 569016, "epoch": 6855} {"train_loss": -27.77960205078125, "global_step": 569017, "epoch": 6855} {"train_loss": -28.043970108032227, "global_step": 569018, "epoch": 6855} {"train_loss": -28.07490348815918, "global_step": 569019, "epoch": 6855} {"train_loss": -27.96906089782715, "global_step": 569020, "epoch": 6855} {"train_loss": -27.94199562072754, "global_step": 569021, "epoch": 6855} {"train_loss": -27.701114654541016, "global_step": 569022, "epoch": 6855} {"train_loss": -27.750654220581055, "global_step": 569023, "epoch": 6855} {"train_loss": -28.2205753326416, "global_step": 569024, "epoch": 6855} {"train_loss": -27.93352699279785, "global_step": 569025, "epoch": 6855} {"train_loss": -27.97966957092285, "global_step": 569026, "epoch": 6855} {"train_loss": -27.597808837890625, "global_step": 569027, "epoch": 6855} {"train_loss": -27.79962730407715, "global_step": 569028, "epoch": 6855} {"train_loss": -27.89291763305664, "global_step": 569029, "epoch": 6855} {"train_loss": -27.91416358947754, "global_step": 569030, "epoch": 6855} {"train_loss": -27.910001754760742, "global_step": 569031, "epoch": 6855} {"train_loss": -27.75123405456543, "global_step": 569032, "epoch": 6855} {"train_loss": -28.04022216796875, "global_step": 569033, "epoch": 6855} {"train_loss": -28.013471603393555, "global_step": 569034, "epoch": 6855} {"train_loss": -27.961084365844727, "global_step": 569035, "epoch": 6855} {"train_loss": -28.064916610717773, "global_step": 569036, "epoch": 6855} {"train_loss": -27.96644401550293, "global_step": 569037, "epoch": 6855} {"train_loss": -28.08021354675293, "global_step": 569038, "epoch": 6855} {"train_loss": -28.05109977722168, "global_step": 569039, "epoch": 6855} {"train_loss": -27.82440757751465, "global_step": 569040, "epoch": 6855} {"train_loss": -28.227401733398438, "global_step": 569041, "epoch": 6855} {"train_loss": -28.1949405670166, "global_step": 569042, "epoch": 6855} {"train_loss": -28.18951416015625, "global_step": 569043, "epoch": 6855} {"train_loss": -27.67095947265625, "global_step": 569044, "epoch": 6855} {"train_loss": -27.919031143188477, "global_step": 569045, "epoch": 6855} {"train_loss": -28.182661056518555, "global_step": 569046, "epoch": 6855} {"train_loss": -27.205600784485597, "global_step": 569047, "epoch": 6855, "val_loss": 6750731.0} {"train_loss": -27.478418350219727, "global_step": 569048, "epoch": 6856} {"train_loss": -27.4617919921875, "global_step": 569049, "epoch": 6856} {"train_loss": -27.747882843017578, "global_step": 569050, "epoch": 6856} {"train_loss": -27.590368270874023, "global_step": 569051, "epoch": 6856} {"train_loss": -27.437238693237305, "global_step": 569052, "epoch": 6856} {"train_loss": -28.068395614624023, "global_step": 569053, "epoch": 6856} {"train_loss": -27.736652374267578, "global_step": 569054, "epoch": 6856} {"train_loss": -27.9754581451416, "global_step": 569055, "epoch": 6856} {"train_loss": -28.086505889892578, "global_step": 569056, "epoch": 6856} {"train_loss": -27.897878646850586, "global_step": 569057, "epoch": 6856} {"train_loss": -27.495290756225586, "global_step": 569058, "epoch": 6856} {"train_loss": -27.67014503479004, "global_step": 569059, "epoch": 6856} {"train_loss": -27.74409294128418, "global_step": 569060, "epoch": 6856} {"train_loss": -27.78493309020996, "global_step": 569061, "epoch": 6856} {"train_loss": -27.996082305908203, "global_step": 569062, "epoch": 6856} {"train_loss": -27.88715171813965, "global_step": 569063, "epoch": 6856} {"train_loss": -27.100255966186523, "global_step": 569064, "epoch": 6856} {"train_loss": -27.638357162475586, "global_step": 569065, "epoch": 6856} {"train_loss": -27.4533634185791, "global_step": 569066, "epoch": 6856} {"train_loss": -27.77362632751465, "global_step": 569067, "epoch": 6856} {"train_loss": -27.748693466186523, "global_step": 569068, "epoch": 6856} {"train_loss": -27.610427856445312, "global_step": 569069, "epoch": 6856} {"train_loss": -27.903417587280273, "global_step": 569070, "epoch": 6856} {"train_loss": -27.880573272705078, "global_step": 569071, "epoch": 6856} {"train_loss": -28.094404220581055, "global_step": 569072, "epoch": 6856} {"train_loss": -27.72199821472168, "global_step": 569073, "epoch": 6856} {"train_loss": -27.783340454101562, "global_step": 569074, "epoch": 6856} {"train_loss": -27.99183464050293, "global_step": 569075, "epoch": 6856} {"train_loss": -27.779499053955078, "global_step": 569076, "epoch": 6856} {"train_loss": -27.596418380737305, "global_step": 569077, "epoch": 6856} {"train_loss": -28.308359146118164, "global_step": 569078, "epoch": 6856} {"train_loss": -27.804157257080078, "global_step": 569079, "epoch": 6856} {"train_loss": -27.66376304626465, "global_step": 569080, "epoch": 6856} {"train_loss": -27.921899795532227, "global_step": 569081, "epoch": 6856} {"train_loss": -27.869970321655273, "global_step": 569082, "epoch": 6856} {"train_loss": -27.767980575561523, "global_step": 569083, "epoch": 6856} {"train_loss": -28.13657569885254, "global_step": 569084, "epoch": 6856} {"train_loss": -27.577239990234375, "global_step": 569085, "epoch": 6856} {"train_loss": -27.69767189025879, "global_step": 569086, "epoch": 6856} {"train_loss": -27.346342086791992, "global_step": 569087, "epoch": 6856} {"train_loss": -27.651403427124023, "global_step": 569088, "epoch": 6856} {"train_loss": -27.72877311706543, "global_step": 569089, "epoch": 6856} {"train_loss": -27.43145179748535, "global_step": 569090, "epoch": 6856} {"train_loss": -27.613996505737305, "global_step": 569091, "epoch": 6856} {"train_loss": -27.749929428100586, "global_step": 569092, "epoch": 6856} {"train_loss": -27.650373458862305, "global_step": 569093, "epoch": 6856} {"train_loss": -27.70536231994629, "global_step": 569094, "epoch": 6856} {"train_loss": -27.411376953125, "global_step": 569095, "epoch": 6856} {"train_loss": -27.771102905273438, "global_step": 569096, "epoch": 6856} {"train_loss": -27.598804473876953, "global_step": 569097, "epoch": 6856} {"train_loss": -27.748350143432617, "global_step": 569098, "epoch": 6856} {"train_loss": -27.776260375976562, "global_step": 569099, "epoch": 6856} {"train_loss": -27.742740631103516, "global_step": 569100, "epoch": 6856} {"train_loss": -27.732364654541016, "global_step": 569101, "epoch": 6856} {"train_loss": -28.1131534576416, "global_step": 569102, "epoch": 6856} {"train_loss": -27.7109317779541, "global_step": 569103, "epoch": 6856} {"train_loss": -27.615461349487305, "global_step": 569104, "epoch": 6856} {"train_loss": -27.7287540435791, "global_step": 569105, "epoch": 6856} {"train_loss": -27.477514266967773, "global_step": 569106, "epoch": 6856} {"train_loss": -27.594196319580078, "global_step": 569107, "epoch": 6856} {"train_loss": -27.769989013671875, "global_step": 569108, "epoch": 6856} {"train_loss": -27.11882972717285, "global_step": 569109, "epoch": 6856} {"train_loss": -26.076093673706055, "global_step": 569110, "epoch": 6856} {"train_loss": -24.642332077026367, "global_step": 569111, "epoch": 6856} {"train_loss": -26.641510009765625, "global_step": 569112, "epoch": 6856} {"train_loss": -27.352354049682617, "global_step": 569113, "epoch": 6856} {"train_loss": -26.394428253173828, "global_step": 569114, "epoch": 6856} {"train_loss": -27.5322322845459, "global_step": 569115, "epoch": 6856} {"train_loss": -26.624771118164062, "global_step": 569116, "epoch": 6856} {"train_loss": -27.389678955078125, "global_step": 569117, "epoch": 6856} {"train_loss": -27.592655181884766, "global_step": 569118, "epoch": 6856} {"train_loss": -27.060211181640625, "global_step": 569119, "epoch": 6856} {"train_loss": -27.481664657592773, "global_step": 569120, "epoch": 6856} {"train_loss": -27.128828048706055, "global_step": 569121, "epoch": 6856} {"train_loss": -27.467056274414062, "global_step": 569122, "epoch": 6856} {"train_loss": -27.601581573486328, "global_step": 569123, "epoch": 6856} {"train_loss": -27.504779815673828, "global_step": 569124, "epoch": 6856} {"train_loss": -27.404815673828125, "global_step": 569125, "epoch": 6856} {"train_loss": -27.424701690673828, "global_step": 569126, "epoch": 6856} {"train_loss": -27.595813751220703, "global_step": 569127, "epoch": 6856} {"train_loss": -27.52571678161621, "global_step": 569128, "epoch": 6856} {"train_loss": -27.35808753967285, "global_step": 569129, "epoch": 6856} {"train_loss": -27.560474188931018, "global_step": 569130, "epoch": 6856, "val_loss": 6769794.0} {"train_loss": -27.43012809753418, "global_step": 569131, "epoch": 6857} {"train_loss": -27.67592430114746, "global_step": 569132, "epoch": 6857} {"train_loss": -27.8106632232666, "global_step": 569133, "epoch": 6857} {"train_loss": -26.994165420532227, "global_step": 569134, "epoch": 6857} {"train_loss": -27.481348037719727, "global_step": 569135, "epoch": 6857} {"train_loss": -27.52667808532715, "global_step": 569136, "epoch": 6857} {"train_loss": -27.332416534423828, "global_step": 569137, "epoch": 6857} {"train_loss": -27.43975830078125, "global_step": 569138, "epoch": 6857} {"train_loss": -27.974796295166016, "global_step": 569139, "epoch": 6857} {"train_loss": -27.513341903686523, "global_step": 569140, "epoch": 6857} {"train_loss": -27.260522842407227, "global_step": 569141, "epoch": 6857} {"train_loss": -27.930988311767578, "global_step": 569142, "epoch": 6857} {"train_loss": -27.22625160217285, "global_step": 569143, "epoch": 6857} {"train_loss": -27.763626098632812, "global_step": 569144, "epoch": 6857} {"train_loss": -27.972570419311523, "global_step": 569145, "epoch": 6857} {"train_loss": -27.91822624206543, "global_step": 569146, "epoch": 6857} {"train_loss": -27.38027000427246, "global_step": 569147, "epoch": 6857} {"train_loss": -27.828962326049805, "global_step": 569148, "epoch": 6857} {"train_loss": -27.82264518737793, "global_step": 569149, "epoch": 6857} {"train_loss": -28.016077041625977, "global_step": 569150, "epoch": 6857} {"train_loss": -27.527652740478516, "global_step": 569151, "epoch": 6857} {"train_loss": -27.898618698120117, "global_step": 569152, "epoch": 6857} {"train_loss": -27.59486198425293, "global_step": 569153, "epoch": 6857} {"train_loss": -27.84219741821289, "global_step": 569154, "epoch": 6857} {"train_loss": -28.01545524597168, "global_step": 569155, "epoch": 6857} {"train_loss": -27.870929718017578, "global_step": 569156, "epoch": 6857} {"train_loss": -28.14716148376465, "global_step": 569157, "epoch": 6857} {"train_loss": -27.542434692382812, "global_step": 569158, "epoch": 6857} {"train_loss": -28.00642204284668, "global_step": 569159, "epoch": 6857} {"train_loss": -27.989110946655273, "global_step": 569160, "epoch": 6857} {"train_loss": -27.496265411376953, "global_step": 569161, "epoch": 6857} {"train_loss": -27.885656356811523, "global_step": 569162, "epoch": 6857} {"train_loss": -28.02618408203125, "global_step": 569163, "epoch": 6857} {"train_loss": -27.986286163330078, "global_step": 569164, "epoch": 6857} {"train_loss": -28.084182739257812, "global_step": 569165, "epoch": 6857} {"train_loss": -27.785791397094727, "global_step": 569166, "epoch": 6857} {"train_loss": -27.62310218811035, "global_step": 569167, "epoch": 6857} {"train_loss": -27.40926170349121, "global_step": 569168, "epoch": 6857} {"train_loss": -27.335006713867188, "global_step": 569169, "epoch": 6857} {"train_loss": -27.47589111328125, "global_step": 569170, "epoch": 6857} {"train_loss": -28.19818687438965, "global_step": 569171, "epoch": 6857} {"train_loss": -27.761621475219727, "global_step": 569172, "epoch": 6857} {"train_loss": -27.45978355407715, "global_step": 569173, "epoch": 6857} {"train_loss": -27.685546875, "global_step": 569174, "epoch": 6857} {"train_loss": -27.366933822631836, "global_step": 569175, "epoch": 6857} {"train_loss": -27.935544967651367, "global_step": 569176, "epoch": 6857} {"train_loss": -28.2182559967041, "global_step": 569177, "epoch": 6857} {"train_loss": -27.588306427001953, "global_step": 569178, "epoch": 6857} {"train_loss": -27.915985107421875, "global_step": 569179, "epoch": 6857} {"train_loss": -28.037429809570312, "global_step": 569180, "epoch": 6857} {"train_loss": -27.956573486328125, "global_step": 569181, "epoch": 6857} {"train_loss": -27.702009201049805, "global_step": 569182, "epoch": 6857} {"train_loss": -28.264148712158203, "global_step": 569183, "epoch": 6857} {"train_loss": -27.180700302124023, "global_step": 569184, "epoch": 6857} {"train_loss": -28.06513786315918, "global_step": 569185, "epoch": 6857} {"train_loss": -27.939416885375977, "global_step": 569186, "epoch": 6857} {"train_loss": -27.76676368713379, "global_step": 569187, "epoch": 6857} {"train_loss": -28.019012451171875, "global_step": 569188, "epoch": 6857} {"train_loss": -27.833881378173828, "global_step": 569189, "epoch": 6857} {"train_loss": -27.97017478942871, "global_step": 569190, "epoch": 6857} {"train_loss": -28.08722496032715, "global_step": 569191, "epoch": 6857} {"train_loss": -27.929731369018555, "global_step": 569192, "epoch": 6857} {"train_loss": -27.793928146362305, "global_step": 569193, "epoch": 6857} {"train_loss": -28.22340965270996, "global_step": 569194, "epoch": 6857} {"train_loss": -28.091421127319336, "global_step": 569195, "epoch": 6857} {"train_loss": -27.944257736206055, "global_step": 569196, "epoch": 6857} {"train_loss": -28.09173011779785, "global_step": 569197, "epoch": 6857} {"train_loss": -28.08648681640625, "global_step": 569198, "epoch": 6857} {"train_loss": -27.58881950378418, "global_step": 569199, "epoch": 6857} {"train_loss": -28.174304962158203, "global_step": 569200, "epoch": 6857} {"train_loss": -28.162006378173828, "global_step": 569201, "epoch": 6857} {"train_loss": -27.8170166015625, "global_step": 569202, "epoch": 6857} {"train_loss": -28.463409423828125, "global_step": 569203, "epoch": 6857} {"train_loss": -27.97932243347168, "global_step": 569204, "epoch": 6857} {"train_loss": -27.979095458984375, "global_step": 569205, "epoch": 6857} {"train_loss": -27.9072208404541, "global_step": 569206, "epoch": 6857} {"train_loss": -27.976179122924805, "global_step": 569207, "epoch": 6857} {"train_loss": -27.711576461791992, "global_step": 569208, "epoch": 6857} {"train_loss": -27.97077751159668, "global_step": 569209, "epoch": 6857} {"train_loss": -27.887237548828125, "global_step": 569210, "epoch": 6857} {"train_loss": -27.586444854736328, "global_step": 569211, "epoch": 6857} {"train_loss": -27.884078979492188, "global_step": 569212, "epoch": 6857} {"train_loss": -27.797078282000072, "global_step": 569213, "epoch": 6857, "val_loss": 6717814.0} {"train_loss": -27.564016342163086, "global_step": 569214, "epoch": 6858} {"train_loss": -26.554895401000977, "global_step": 569215, "epoch": 6858} {"train_loss": -27.12972068786621, "global_step": 569216, "epoch": 6858} {"train_loss": -27.4500732421875, "global_step": 569217, "epoch": 6858} {"train_loss": -27.311193466186523, "global_step": 569218, "epoch": 6858} {"train_loss": -26.6291446685791, "global_step": 569219, "epoch": 6858} {"train_loss": -27.33905601501465, "global_step": 569220, "epoch": 6858} {"train_loss": -26.717090606689453, "global_step": 569221, "epoch": 6858} {"train_loss": -27.55908203125, "global_step": 569222, "epoch": 6858} {"train_loss": -27.612873077392578, "global_step": 569223, "epoch": 6858} {"train_loss": -26.553308486938477, "global_step": 569224, "epoch": 6858} {"train_loss": -27.252614974975586, "global_step": 569225, "epoch": 6858} {"train_loss": -26.915781021118164, "global_step": 569226, "epoch": 6858} {"train_loss": -27.542469024658203, "global_step": 569227, "epoch": 6858} {"train_loss": -27.137821197509766, "global_step": 569228, "epoch": 6858} {"train_loss": -27.251367568969727, "global_step": 569229, "epoch": 6858} {"train_loss": -27.432485580444336, "global_step": 569230, "epoch": 6858} {"train_loss": -27.51680564880371, "global_step": 569231, "epoch": 6858} {"train_loss": -27.406543731689453, "global_step": 569232, "epoch": 6858} {"train_loss": -27.06852149963379, "global_step": 569233, "epoch": 6858} {"train_loss": -27.336231231689453, "global_step": 569234, "epoch": 6858} {"train_loss": -27.472558975219727, "global_step": 569235, "epoch": 6858} {"train_loss": -27.751386642456055, "global_step": 569236, "epoch": 6858} {"train_loss": -27.439584732055664, "global_step": 569237, "epoch": 6858} {"train_loss": -27.215377807617188, "global_step": 569238, "epoch": 6858} {"train_loss": -27.82625389099121, "global_step": 569239, "epoch": 6858} {"train_loss": -27.746051788330078, "global_step": 569240, "epoch": 6858} {"train_loss": -27.4245662689209, "global_step": 569241, "epoch": 6858} {"train_loss": -27.760950088500977, "global_step": 569242, "epoch": 6858} {"train_loss": -27.789213180541992, "global_step": 569243, "epoch": 6858} {"train_loss": -27.575092315673828, "global_step": 569244, "epoch": 6858} {"train_loss": -27.635053634643555, "global_step": 569245, "epoch": 6858} {"train_loss": -27.682947158813477, "global_step": 569246, "epoch": 6858} {"train_loss": -27.743488311767578, "global_step": 569247, "epoch": 6858} {"train_loss": -27.886554718017578, "global_step": 569248, "epoch": 6858} {"train_loss": -27.679309844970703, "global_step": 569249, "epoch": 6858} {"train_loss": -27.972227096557617, "global_step": 569250, "epoch": 6858} {"train_loss": -28.11881446838379, "global_step": 569251, "epoch": 6858} {"train_loss": -27.929553985595703, "global_step": 569252, "epoch": 6858} {"train_loss": -27.949926376342773, "global_step": 569253, "epoch": 6858} {"train_loss": -28.14447593688965, "global_step": 569254, "epoch": 6858} {"train_loss": -27.708784103393555, "global_step": 569255, "epoch": 6858} {"train_loss": -28.064498901367188, "global_step": 569256, "epoch": 6858} {"train_loss": -28.220792770385742, "global_step": 569257, "epoch": 6858} {"train_loss": -27.77553367614746, "global_step": 569258, "epoch": 6858} {"train_loss": -28.34561538696289, "global_step": 569259, "epoch": 6858} {"train_loss": -27.964014053344727, "global_step": 569260, "epoch": 6858} {"train_loss": -28.071151733398438, "global_step": 569261, "epoch": 6858} {"train_loss": -28.14093017578125, "global_step": 569262, "epoch": 6858} {"train_loss": -28.071313858032227, "global_step": 569263, "epoch": 6858} {"train_loss": -28.092453002929688, "global_step": 569264, "epoch": 6858} {"train_loss": -27.98488426208496, "global_step": 569265, "epoch": 6858} {"train_loss": -27.92313575744629, "global_step": 569266, "epoch": 6858} {"train_loss": -27.717426300048828, "global_step": 569267, "epoch": 6858} {"train_loss": -27.684858322143555, "global_step": 569268, "epoch": 6858} {"train_loss": -27.5982723236084, "global_step": 569269, "epoch": 6858} {"train_loss": -27.63458824157715, "global_step": 569270, "epoch": 6858} {"train_loss": -28.15874671936035, "global_step": 569271, "epoch": 6858} {"train_loss": -28.027606964111328, "global_step": 569272, "epoch": 6858} {"train_loss": -28.089502334594727, "global_step": 569273, "epoch": 6858} {"train_loss": -28.298507690429688, "global_step": 569274, "epoch": 6858} {"train_loss": -27.744140625, "global_step": 569275, "epoch": 6858} {"train_loss": -28.19416618347168, "global_step": 569276, "epoch": 6858} {"train_loss": -27.832260131835938, "global_step": 569277, "epoch": 6858} {"train_loss": -28.231733322143555, "global_step": 569278, "epoch": 6858} {"train_loss": -27.996246337890625, "global_step": 569279, "epoch": 6858} {"train_loss": -28.152074813842773, "global_step": 569280, "epoch": 6858} {"train_loss": -27.75310707092285, "global_step": 569281, "epoch": 6858} {"train_loss": -28.248767852783203, "global_step": 569282, "epoch": 6858} {"train_loss": -28.22690773010254, "global_step": 569283, "epoch": 6858} {"train_loss": -28.0550594329834, "global_step": 569284, "epoch": 6858} {"train_loss": -28.186004638671875, "global_step": 569285, "epoch": 6858} {"train_loss": -28.007129669189453, "global_step": 569286, "epoch": 6858} {"train_loss": -28.0567626953125, "global_step": 569287, "epoch": 6858} {"train_loss": -28.0465087890625, "global_step": 569288, "epoch": 6858} {"train_loss": -28.382299423217773, "global_step": 569289, "epoch": 6858} {"train_loss": -27.995819091796875, "global_step": 569290, "epoch": 6858} {"train_loss": -28.22574234008789, "global_step": 569291, "epoch": 6858} {"train_loss": -27.61920166015625, "global_step": 569292, "epoch": 6858} {"train_loss": -27.795928955078125, "global_step": 569293, "epoch": 6858} {"train_loss": -28.13062858581543, "global_step": 569294, "epoch": 6858} {"train_loss": -27.912649154663086, "global_step": 569295, "epoch": 6858} {"train_loss": -27.739693055669946, "global_step": 569296, "epoch": 6858, "val_loss": 6698276.5} {"train_loss": -27.299758911132812, "global_step": 569297, "epoch": 6859} {"train_loss": -26.59083366394043, "global_step": 569298, "epoch": 6859} {"train_loss": -26.82877540588379, "global_step": 569299, "epoch": 6859} {"train_loss": -26.88054847717285, "global_step": 569300, "epoch": 6859} {"train_loss": -26.872711181640625, "global_step": 569301, "epoch": 6859} {"train_loss": -26.74462890625, "global_step": 569302, "epoch": 6859} {"train_loss": -27.454614639282227, "global_step": 569303, "epoch": 6859} {"train_loss": -26.807790756225586, "global_step": 569304, "epoch": 6859} {"train_loss": -26.590591430664062, "global_step": 569305, "epoch": 6859} {"train_loss": -28.157629013061523, "global_step": 569306, "epoch": 6859} {"train_loss": -26.659748077392578, "global_step": 569307, "epoch": 6859} {"train_loss": -27.285181045532227, "global_step": 569308, "epoch": 6859} {"train_loss": -27.2348690032959, "global_step": 569309, "epoch": 6859} {"train_loss": -27.493885040283203, "global_step": 569310, "epoch": 6859} {"train_loss": -27.214069366455078, "global_step": 569311, "epoch": 6859} {"train_loss": -27.053632736206055, "global_step": 569312, "epoch": 6859} {"train_loss": -27.4820556640625, "global_step": 569313, "epoch": 6859} {"train_loss": -27.775049209594727, "global_step": 569314, "epoch": 6859} {"train_loss": -27.482038497924805, "global_step": 569315, "epoch": 6859} {"train_loss": -27.708984375, "global_step": 569316, "epoch": 6859} {"train_loss": -27.56086540222168, "global_step": 569317, "epoch": 6859} {"train_loss": -27.708358764648438, "global_step": 569318, "epoch": 6859} {"train_loss": -27.3818359375, "global_step": 569319, "epoch": 6859} {"train_loss": -27.07172203063965, "global_step": 569320, "epoch": 6859} {"train_loss": -27.601919174194336, "global_step": 569321, "epoch": 6859} {"train_loss": -27.833484649658203, "global_step": 569322, "epoch": 6859} {"train_loss": -28.028095245361328, "global_step": 569323, "epoch": 6859} {"train_loss": -27.6785888671875, "global_step": 569324, "epoch": 6859} {"train_loss": -27.760473251342773, "global_step": 569325, "epoch": 6859} {"train_loss": -27.6231632232666, "global_step": 569326, "epoch": 6859} {"train_loss": -28.128747940063477, "global_step": 569327, "epoch": 6859} {"train_loss": -27.5429630279541, "global_step": 569328, "epoch": 6859} {"train_loss": -27.950891494750977, "global_step": 569329, "epoch": 6859} {"train_loss": -27.903528213500977, "global_step": 569330, "epoch": 6859} {"train_loss": -28.027502059936523, "global_step": 569331, "epoch": 6859} {"train_loss": -27.84734535217285, "global_step": 569332, "epoch": 6859} {"train_loss": -27.862043380737305, "global_step": 569333, "epoch": 6859} {"train_loss": -28.093576431274414, "global_step": 569334, "epoch": 6859} {"train_loss": -27.919464111328125, "global_step": 569335, "epoch": 6859} {"train_loss": -27.98638343811035, "global_step": 569336, "epoch": 6859} {"train_loss": -27.761062622070312, "global_step": 569337, "epoch": 6859} {"train_loss": -27.678064346313477, "global_step": 569338, "epoch": 6859} {"train_loss": -27.524744033813477, "global_step": 569339, "epoch": 6859} {"train_loss": -28.13651466369629, "global_step": 569340, "epoch": 6859} {"train_loss": -27.94943618774414, "global_step": 569341, "epoch": 6859} {"train_loss": -28.162078857421875, "global_step": 569342, "epoch": 6859} {"train_loss": -27.923114776611328, "global_step": 569343, "epoch": 6859} {"train_loss": -28.272891998291016, "global_step": 569344, "epoch": 6859} {"train_loss": -27.914228439331055, "global_step": 569345, "epoch": 6859} {"train_loss": -27.88580894470215, "global_step": 569346, "epoch": 6859} {"train_loss": -27.775360107421875, "global_step": 569347, "epoch": 6859} {"train_loss": -28.334705352783203, "global_step": 569348, "epoch": 6859} {"train_loss": -27.826154708862305, "global_step": 569349, "epoch": 6859} {"train_loss": -28.036972045898438, "global_step": 569350, "epoch": 6859} {"train_loss": -27.738866806030273, "global_step": 569351, "epoch": 6859} {"train_loss": -27.750518798828125, "global_step": 569352, "epoch": 6859} {"train_loss": -27.8717098236084, "global_step": 569353, "epoch": 6859} {"train_loss": -27.986135482788086, "global_step": 569354, "epoch": 6859} {"train_loss": -27.808517456054688, "global_step": 569355, "epoch": 6859} {"train_loss": -28.005849838256836, "global_step": 569356, "epoch": 6859} {"train_loss": -28.30571937561035, "global_step": 569357, "epoch": 6859} {"train_loss": -28.162094116210938, "global_step": 569358, "epoch": 6859} {"train_loss": -27.984405517578125, "global_step": 569359, "epoch": 6859} {"train_loss": -28.382801055908203, "global_step": 569360, "epoch": 6859} {"train_loss": -28.420949935913086, "global_step": 569361, "epoch": 6859} {"train_loss": -28.10019302368164, "global_step": 569362, "epoch": 6859} {"train_loss": -27.89312744140625, "global_step": 569363, "epoch": 6859} {"train_loss": -27.984968185424805, "global_step": 569364, "epoch": 6859} {"train_loss": -28.13935661315918, "global_step": 569365, "epoch": 6859} {"train_loss": -28.211627960205078, "global_step": 569366, "epoch": 6859} {"train_loss": -28.12116050720215, "global_step": 569367, "epoch": 6859} {"train_loss": -28.251190185546875, "global_step": 569368, "epoch": 6859} {"train_loss": -27.75724220275879, "global_step": 569369, "epoch": 6859} {"train_loss": -28.174802780151367, "global_step": 569370, "epoch": 6859} {"train_loss": -28.06769371032715, "global_step": 569371, "epoch": 6859} {"train_loss": -28.02605628967285, "global_step": 569372, "epoch": 6859} {"train_loss": -28.093687057495117, "global_step": 569373, "epoch": 6859} {"train_loss": -27.706390380859375, "global_step": 569374, "epoch": 6859} {"train_loss": -27.508132934570312, "global_step": 569375, "epoch": 6859} {"train_loss": -27.243032455444336, "global_step": 569376, "epoch": 6859} {"train_loss": -27.717182159423828, "global_step": 569377, "epoch": 6859} {"train_loss": -27.5621395111084, "global_step": 569378, "epoch": 6859} {"train_loss": -27.71512279740299, "global_step": 569379, "epoch": 6859, "val_loss": 6731225.0} {"train_loss": -27.110584259033203, "global_step": 569380, "epoch": 6860} {"train_loss": -27.006366729736328, "global_step": 569381, "epoch": 6860} {"train_loss": -26.80584144592285, "global_step": 569382, "epoch": 6860} {"train_loss": -27.29506492614746, "global_step": 569383, "epoch": 6860} {"train_loss": -26.99212074279785, "global_step": 569384, "epoch": 6860} {"train_loss": -26.86464500427246, "global_step": 569385, "epoch": 6860} {"train_loss": -26.905826568603516, "global_step": 569386, "epoch": 6860} {"train_loss": -26.973424911499023, "global_step": 569387, "epoch": 6860} {"train_loss": -27.470922470092773, "global_step": 569388, "epoch": 6860} {"train_loss": -27.084508895874023, "global_step": 569389, "epoch": 6860} {"train_loss": -27.556875228881836, "global_step": 569390, "epoch": 6860} {"train_loss": -27.596790313720703, "global_step": 569391, "epoch": 6860} {"train_loss": -27.564313888549805, "global_step": 569392, "epoch": 6860} {"train_loss": -27.27945899963379, "global_step": 569393, "epoch": 6860} {"train_loss": -27.2883243560791, "global_step": 569394, "epoch": 6860} {"train_loss": -27.261438369750977, "global_step": 569395, "epoch": 6860} {"train_loss": -27.780256271362305, "global_step": 569396, "epoch": 6860} {"train_loss": -27.365060806274414, "global_step": 569397, "epoch": 6860} {"train_loss": -27.70737648010254, "global_step": 569398, "epoch": 6860} {"train_loss": -27.245275497436523, "global_step": 569399, "epoch": 6860} {"train_loss": -27.698429107666016, "global_step": 569400, "epoch": 6860} {"train_loss": -27.524118423461914, "global_step": 569401, "epoch": 6860} {"train_loss": -27.655954360961914, "global_step": 569402, "epoch": 6860} {"train_loss": -27.491968154907227, "global_step": 569403, "epoch": 6860} {"train_loss": -27.836408615112305, "global_step": 569404, "epoch": 6860} {"train_loss": -27.7850284576416, "global_step": 569405, "epoch": 6860} {"train_loss": -27.50103187561035, "global_step": 569406, "epoch": 6860} {"train_loss": -27.882598876953125, "global_step": 569407, "epoch": 6860} {"train_loss": -27.401453018188477, "global_step": 569408, "epoch": 6860} {"train_loss": -27.488636016845703, "global_step": 569409, "epoch": 6860} {"train_loss": -27.513681411743164, "global_step": 569410, "epoch": 6860} {"train_loss": -27.260847091674805, "global_step": 569411, "epoch": 6860} {"train_loss": -27.590795516967773, "global_step": 569412, "epoch": 6860} {"train_loss": -27.675458908081055, "global_step": 569413, "epoch": 6860} {"train_loss": -28.007068634033203, "global_step": 569414, "epoch": 6860} {"train_loss": -27.6470890045166, "global_step": 569415, "epoch": 6860} {"train_loss": -27.499637603759766, "global_step": 569416, "epoch": 6860} {"train_loss": -27.696996688842773, "global_step": 569417, "epoch": 6860} {"train_loss": -28.018518447875977, "global_step": 569418, "epoch": 6860} {"train_loss": -27.94392967224121, "global_step": 569419, "epoch": 6860} {"train_loss": -27.968664169311523, "global_step": 569420, "epoch": 6860} {"train_loss": -27.69046401977539, "global_step": 569421, "epoch": 6860} {"train_loss": -27.391437530517578, "global_step": 569422, "epoch": 6860} {"train_loss": -28.06534194946289, "global_step": 569423, "epoch": 6860} {"train_loss": -27.77149772644043, "global_step": 569424, "epoch": 6860} {"train_loss": -27.128498077392578, "global_step": 569425, "epoch": 6860} {"train_loss": -27.761260986328125, "global_step": 569426, "epoch": 6860} {"train_loss": -27.35196304321289, "global_step": 569427, "epoch": 6860} {"train_loss": -27.87274742126465, "global_step": 569428, "epoch": 6860} {"train_loss": -27.47145652770996, "global_step": 569429, "epoch": 6860} {"train_loss": -27.490131378173828, "global_step": 569430, "epoch": 6860} {"train_loss": -27.5467586517334, "global_step": 569431, "epoch": 6860} {"train_loss": -27.437488555908203, "global_step": 569432, "epoch": 6860} {"train_loss": -28.097900390625, "global_step": 569433, "epoch": 6860} {"train_loss": -27.814111709594727, "global_step": 569434, "epoch": 6860} {"train_loss": -27.730093002319336, "global_step": 569435, "epoch": 6860} {"train_loss": -27.800413131713867, "global_step": 569436, "epoch": 6860} {"train_loss": -27.87360954284668, "global_step": 569437, "epoch": 6860} {"train_loss": -27.872350692749023, "global_step": 569438, "epoch": 6860} {"train_loss": -27.51202964782715, "global_step": 569439, "epoch": 6860} {"train_loss": -28.12733268737793, "global_step": 569440, "epoch": 6860} {"train_loss": -27.519580841064453, "global_step": 569441, "epoch": 6860} {"train_loss": -27.946765899658203, "global_step": 569442, "epoch": 6860} {"train_loss": -27.385175704956055, "global_step": 569443, "epoch": 6860} {"train_loss": -27.623462677001953, "global_step": 569444, "epoch": 6860} {"train_loss": -27.62786293029785, "global_step": 569445, "epoch": 6860} {"train_loss": -28.26006507873535, "global_step": 569446, "epoch": 6860} {"train_loss": -27.539182662963867, "global_step": 569447, "epoch": 6860} {"train_loss": -27.931884765625, "global_step": 569448, "epoch": 6860} {"train_loss": -27.977142333984375, "global_step": 569449, "epoch": 6860} {"train_loss": -27.86433219909668, "global_step": 569450, "epoch": 6860} {"train_loss": -27.908935546875, "global_step": 569451, "epoch": 6860} {"train_loss": -28.231760025024414, "global_step": 569452, "epoch": 6860} {"train_loss": -28.12424659729004, "global_step": 569453, "epoch": 6860} {"train_loss": -28.0432071685791, "global_step": 569454, "epoch": 6860} {"train_loss": -28.007709503173828, "global_step": 569455, "epoch": 6860} {"train_loss": -27.879098892211914, "global_step": 569456, "epoch": 6860} {"train_loss": -27.936756134033203, "global_step": 569457, "epoch": 6860} {"train_loss": -27.780210494995117, "global_step": 569458, "epoch": 6860} {"train_loss": -28.248828887939453, "global_step": 569459, "epoch": 6860} {"train_loss": -27.99226188659668, "global_step": 569460, "epoch": 6860} {"train_loss": -28.232358932495117, "global_step": 569461, "epoch": 6860} {"train_loss": -27.63059397777879, "global_step": 569462, "epoch": 6860, "val_loss": 6675578.0} {"train_loss": -27.426916122436523, "global_step": 569463, "epoch": 6861} {"train_loss": -27.127805709838867, "global_step": 569464, "epoch": 6861} {"train_loss": -27.58308982849121, "global_step": 569465, "epoch": 6861} {"train_loss": -26.879108428955078, "global_step": 569466, "epoch": 6861} {"train_loss": -26.930606842041016, "global_step": 569467, "epoch": 6861} {"train_loss": -26.872739791870117, "global_step": 569468, "epoch": 6861} {"train_loss": -27.626331329345703, "global_step": 569469, "epoch": 6861} {"train_loss": -27.144580841064453, "global_step": 569470, "epoch": 6861} {"train_loss": -27.566497802734375, "global_step": 569471, "epoch": 6861} {"train_loss": -27.191625595092773, "global_step": 569472, "epoch": 6861} {"train_loss": -27.507160186767578, "global_step": 569473, "epoch": 6861} {"train_loss": -27.251026153564453, "global_step": 569474, "epoch": 6861} {"train_loss": -27.207202911376953, "global_step": 569475, "epoch": 6861} {"train_loss": -27.775644302368164, "global_step": 569476, "epoch": 6861} {"train_loss": -27.468175888061523, "global_step": 569477, "epoch": 6861} {"train_loss": -27.067707061767578, "global_step": 569478, "epoch": 6861} {"train_loss": -27.45806312561035, "global_step": 569479, "epoch": 6861} {"train_loss": -27.64716911315918, "global_step": 569480, "epoch": 6861} {"train_loss": -27.398160934448242, "global_step": 569481, "epoch": 6861} {"train_loss": -27.53140640258789, "global_step": 569482, "epoch": 6861} {"train_loss": -27.31601905822754, "global_step": 569483, "epoch": 6861} {"train_loss": -27.8713321685791, "global_step": 569484, "epoch": 6861} {"train_loss": -27.9616641998291, "global_step": 569485, "epoch": 6861} {"train_loss": -27.85797119140625, "global_step": 569486, "epoch": 6861} {"train_loss": -28.0294246673584, "global_step": 569487, "epoch": 6861} {"train_loss": -27.875768661499023, "global_step": 569488, "epoch": 6861} {"train_loss": -27.90424919128418, "global_step": 569489, "epoch": 6861} {"train_loss": -27.724679946899414, "global_step": 569490, "epoch": 6861} {"train_loss": -27.927967071533203, "global_step": 569491, "epoch": 6861} {"train_loss": -27.983291625976562, "global_step": 569492, "epoch": 6861} {"train_loss": -28.058765411376953, "global_step": 569493, "epoch": 6861} {"train_loss": -28.204517364501953, "global_step": 569494, "epoch": 6861} {"train_loss": -28.196033477783203, "global_step": 569495, "epoch": 6861} {"train_loss": -28.0119686126709, "global_step": 569496, "epoch": 6861} {"train_loss": -27.727588653564453, "global_step": 569497, "epoch": 6861} {"train_loss": -28.136621475219727, "global_step": 569498, "epoch": 6861} {"train_loss": -27.605077743530273, "global_step": 569499, "epoch": 6861} {"train_loss": -27.81866455078125, "global_step": 569500, "epoch": 6861} {"train_loss": -27.9671573638916, "global_step": 569501, "epoch": 6861} {"train_loss": -28.117834091186523, "global_step": 569502, "epoch": 6861} {"train_loss": -27.688800811767578, "global_step": 569503, "epoch": 6861} {"train_loss": -28.10335350036621, "global_step": 569504, "epoch": 6861} {"train_loss": -27.84638023376465, "global_step": 569505, "epoch": 6861} {"train_loss": -27.683990478515625, "global_step": 569506, "epoch": 6861} {"train_loss": -28.167112350463867, "global_step": 569507, "epoch": 6861} {"train_loss": -28.102466583251953, "global_step": 569508, "epoch": 6861} {"train_loss": -28.088415145874023, "global_step": 569509, "epoch": 6861} {"train_loss": -28.033437728881836, "global_step": 569510, "epoch": 6861} {"train_loss": -28.395496368408203, "global_step": 569511, "epoch": 6861} {"train_loss": -28.11659812927246, "global_step": 569512, "epoch": 6861} {"train_loss": -28.180023193359375, "global_step": 569513, "epoch": 6861} {"train_loss": -28.1230525970459, "global_step": 569514, "epoch": 6861} {"train_loss": -27.911649703979492, "global_step": 569515, "epoch": 6861} {"train_loss": -27.670032501220703, "global_step": 569516, "epoch": 6861} {"train_loss": -28.09419059753418, "global_step": 569517, "epoch": 6861} {"train_loss": -28.140140533447266, "global_step": 569518, "epoch": 6861} {"train_loss": -28.064802169799805, "global_step": 569519, "epoch": 6861} {"train_loss": -28.03618812561035, "global_step": 569520, "epoch": 6861} {"train_loss": -27.769580841064453, "global_step": 569521, "epoch": 6861} {"train_loss": -27.986310958862305, "global_step": 569522, "epoch": 6861} {"train_loss": -27.959701538085938, "global_step": 569523, "epoch": 6861} {"train_loss": -27.489246368408203, "global_step": 569524, "epoch": 6861} {"train_loss": -28.074872970581055, "global_step": 569525, "epoch": 6861} {"train_loss": -28.1207332611084, "global_step": 569526, "epoch": 6861} {"train_loss": -28.167844772338867, "global_step": 569527, "epoch": 6861} {"train_loss": -28.079700469970703, "global_step": 569528, "epoch": 6861} {"train_loss": -27.97165870666504, "global_step": 569529, "epoch": 6861} {"train_loss": -28.139862060546875, "global_step": 569530, "epoch": 6861} {"train_loss": -28.156009674072266, "global_step": 569531, "epoch": 6861} {"train_loss": -28.2194766998291, "global_step": 569532, "epoch": 6861} {"train_loss": -27.66169548034668, "global_step": 569533, "epoch": 6861} {"train_loss": -28.026214599609375, "global_step": 569534, "epoch": 6861} {"train_loss": -27.99493408203125, "global_step": 569535, "epoch": 6861} {"train_loss": -27.968122482299805, "global_step": 569536, "epoch": 6861} {"train_loss": -27.834400177001953, "global_step": 569537, "epoch": 6861} {"train_loss": -27.459009170532227, "global_step": 569538, "epoch": 6861} {"train_loss": -27.80487632751465, "global_step": 569539, "epoch": 6861} {"train_loss": -28.251422882080078, "global_step": 569540, "epoch": 6861} {"train_loss": -27.901830673217773, "global_step": 569541, "epoch": 6861} {"train_loss": -27.8941650390625, "global_step": 569542, "epoch": 6861} {"train_loss": -27.1097469329834, "global_step": 569543, "epoch": 6861} {"train_loss": -27.4881649017334, "global_step": 569544, "epoch": 6861} {"train_loss": -27.77977959506483, "global_step": 569545, "epoch": 6861, "val_loss": 6745556.0} {"train_loss": -26.854007720947266, "global_step": 569546, "epoch": 6862} {"train_loss": -26.421255111694336, "global_step": 569547, "epoch": 6862} {"train_loss": -27.180410385131836, "global_step": 569548, "epoch": 6862} {"train_loss": -26.0694522857666, "global_step": 569549, "epoch": 6862} {"train_loss": -26.758459091186523, "global_step": 569550, "epoch": 6862} {"train_loss": -26.47943687438965, "global_step": 569551, "epoch": 6862} {"train_loss": -25.95444679260254, "global_step": 569552, "epoch": 6862} {"train_loss": -27.120197296142578, "global_step": 569553, "epoch": 6862} {"train_loss": -27.0022029876709, "global_step": 569554, "epoch": 6862} {"train_loss": -26.9907169342041, "global_step": 569555, "epoch": 6862} {"train_loss": -26.486780166625977, "global_step": 569556, "epoch": 6862} {"train_loss": -26.941486358642578, "global_step": 569557, "epoch": 6862} {"train_loss": -26.873920440673828, "global_step": 569558, "epoch": 6862} {"train_loss": -27.132492065429688, "global_step": 569559, "epoch": 6862} {"train_loss": -27.072629928588867, "global_step": 569560, "epoch": 6862} {"train_loss": -27.16815185546875, "global_step": 569561, "epoch": 6862} {"train_loss": -27.083662033081055, "global_step": 569562, "epoch": 6862} {"train_loss": -27.045812606811523, "global_step": 569563, "epoch": 6862} {"train_loss": -27.111326217651367, "global_step": 569564, "epoch": 6862} {"train_loss": -27.420135498046875, "global_step": 569565, "epoch": 6862} {"train_loss": -27.817365646362305, "global_step": 569566, "epoch": 6862} {"train_loss": -26.98162269592285, "global_step": 569567, "epoch": 6862} {"train_loss": -27.250720977783203, "global_step": 569568, "epoch": 6862} {"train_loss": -27.2778377532959, "global_step": 569569, "epoch": 6862} {"train_loss": -27.728849411010742, "global_step": 569570, "epoch": 6862} {"train_loss": -27.303592681884766, "global_step": 569571, "epoch": 6862} {"train_loss": -27.37314796447754, "global_step": 569572, "epoch": 6862} {"train_loss": -27.826749801635742, "global_step": 569573, "epoch": 6862} {"train_loss": -27.485260009765625, "global_step": 569574, "epoch": 6862} {"train_loss": -27.3621826171875, "global_step": 569575, "epoch": 6862} {"train_loss": -27.443708419799805, "global_step": 569576, "epoch": 6862} {"train_loss": -27.663532257080078, "global_step": 569577, "epoch": 6862} {"train_loss": -27.757429122924805, "global_step": 569578, "epoch": 6862} {"train_loss": -27.961225509643555, "global_step": 569579, "epoch": 6862} {"train_loss": -27.607105255126953, "global_step": 569580, "epoch": 6862} {"train_loss": -27.611204147338867, "global_step": 569581, "epoch": 6862} {"train_loss": -27.382104873657227, "global_step": 569582, "epoch": 6862} {"train_loss": -27.73065185546875, "global_step": 569583, "epoch": 6862} {"train_loss": -27.969228744506836, "global_step": 569584, "epoch": 6862} {"train_loss": -27.534399032592773, "global_step": 569585, "epoch": 6862} {"train_loss": -27.68438720703125, "global_step": 569586, "epoch": 6862} {"train_loss": -27.69211769104004, "global_step": 569587, "epoch": 6862} {"train_loss": -27.920475006103516, "global_step": 569588, "epoch": 6862} {"train_loss": -27.968708038330078, "global_step": 569589, "epoch": 6862} {"train_loss": -27.5142822265625, "global_step": 569590, "epoch": 6862} {"train_loss": -28.031721115112305, "global_step": 569591, "epoch": 6862} {"train_loss": -27.657373428344727, "global_step": 569592, "epoch": 6862} {"train_loss": -27.87550163269043, "global_step": 569593, "epoch": 6862} {"train_loss": -27.56912612915039, "global_step": 569594, "epoch": 6862} {"train_loss": -28.003238677978516, "global_step": 569595, "epoch": 6862} {"train_loss": -28.223968505859375, "global_step": 569596, "epoch": 6862} {"train_loss": -27.68977928161621, "global_step": 569597, "epoch": 6862} {"train_loss": -28.192182540893555, "global_step": 569598, "epoch": 6862} {"train_loss": -27.94780921936035, "global_step": 569599, "epoch": 6862} {"train_loss": -27.92146873474121, "global_step": 569600, "epoch": 6862} {"train_loss": -27.919769287109375, "global_step": 569601, "epoch": 6862} {"train_loss": -28.085285186767578, "global_step": 569602, "epoch": 6862} {"train_loss": -28.490325927734375, "global_step": 569603, "epoch": 6862} {"train_loss": -28.19439125061035, "global_step": 569604, "epoch": 6862} {"train_loss": -28.2816219329834, "global_step": 569605, "epoch": 6862} {"train_loss": -27.9736270904541, "global_step": 569606, "epoch": 6862} {"train_loss": -28.03468132019043, "global_step": 569607, "epoch": 6862} {"train_loss": -27.83633804321289, "global_step": 569608, "epoch": 6862} {"train_loss": -28.093387603759766, "global_step": 569609, "epoch": 6862} {"train_loss": -28.0255069732666, "global_step": 569610, "epoch": 6862} {"train_loss": -28.339563369750977, "global_step": 569611, "epoch": 6862} {"train_loss": -28.079395294189453, "global_step": 569612, "epoch": 6862} {"train_loss": -28.587589263916016, "global_step": 569613, "epoch": 6862} {"train_loss": -27.85715675354004, "global_step": 569614, "epoch": 6862} {"train_loss": -28.075937271118164, "global_step": 569615, "epoch": 6862} {"train_loss": -27.78608512878418, "global_step": 569616, "epoch": 6862} {"train_loss": -27.963109970092773, "global_step": 569617, "epoch": 6862} {"train_loss": -27.986658096313477, "global_step": 569618, "epoch": 6862} {"train_loss": -28.037321090698242, "global_step": 569619, "epoch": 6862} {"train_loss": -28.24751091003418, "global_step": 569620, "epoch": 6862} {"train_loss": -28.162628173828125, "global_step": 569621, "epoch": 6862} {"train_loss": -28.118438720703125, "global_step": 569622, "epoch": 6862} {"train_loss": -27.98418617248535, "global_step": 569623, "epoch": 6862} {"train_loss": -27.706724166870117, "global_step": 569624, "epoch": 6862} {"train_loss": -27.644811630249023, "global_step": 569625, "epoch": 6862} {"train_loss": -27.4288272857666, "global_step": 569626, "epoch": 6862} {"train_loss": -27.70209312438965, "global_step": 569627, "epoch": 6862} {"train_loss": -27.599091426435724, "global_step": 569628, "epoch": 6862, "val_loss": 6647286.0} {"train_loss": -22.792499542236328, "global_step": 569629, "epoch": 6863} {"train_loss": -24.657316207885742, "global_step": 569630, "epoch": 6863} {"train_loss": -22.280973434448242, "global_step": 569631, "epoch": 6863} {"train_loss": -24.879371643066406, "global_step": 569632, "epoch": 6863} {"train_loss": -24.138147354125977, "global_step": 569633, "epoch": 6863} {"train_loss": -25.669591903686523, "global_step": 569634, "epoch": 6863} {"train_loss": -25.491697311401367, "global_step": 569635, "epoch": 6863} {"train_loss": -24.810026168823242, "global_step": 569636, "epoch": 6863} {"train_loss": -26.0262393951416, "global_step": 569637, "epoch": 6863} {"train_loss": -25.382770538330078, "global_step": 569638, "epoch": 6863} {"train_loss": -25.992807388305664, "global_step": 569639, "epoch": 6863} {"train_loss": -25.88555335998535, "global_step": 569640, "epoch": 6863} {"train_loss": -26.229536056518555, "global_step": 569641, "epoch": 6863} {"train_loss": -25.909381866455078, "global_step": 569642, "epoch": 6863} {"train_loss": -25.951257705688477, "global_step": 569643, "epoch": 6863} {"train_loss": -26.02446937561035, "global_step": 569644, "epoch": 6863} {"train_loss": -26.40199089050293, "global_step": 569645, "epoch": 6863} {"train_loss": -26.2197208404541, "global_step": 569646, "epoch": 6863} {"train_loss": -26.30354118347168, "global_step": 569647, "epoch": 6863} {"train_loss": -26.365976333618164, "global_step": 569648, "epoch": 6863} {"train_loss": -26.462726593017578, "global_step": 569649, "epoch": 6863} {"train_loss": -26.86574363708496, "global_step": 569650, "epoch": 6863} {"train_loss": -26.799285888671875, "global_step": 569651, "epoch": 6863} {"train_loss": -26.3508358001709, "global_step": 569652, "epoch": 6863} {"train_loss": -26.656604766845703, "global_step": 569653, "epoch": 6863} {"train_loss": -26.8559513092041, "global_step": 569654, "epoch": 6863} {"train_loss": -26.797510147094727, "global_step": 569655, "epoch": 6863} {"train_loss": -27.02984046936035, "global_step": 569656, "epoch": 6863} {"train_loss": -27.063703536987305, "global_step": 569657, "epoch": 6863} {"train_loss": -26.874902725219727, "global_step": 569658, "epoch": 6863} {"train_loss": -27.096113204956055, "global_step": 569659, "epoch": 6863} {"train_loss": -26.986011505126953, "global_step": 569660, "epoch": 6863} {"train_loss": -27.502172470092773, "global_step": 569661, "epoch": 6863} {"train_loss": -27.142414093017578, "global_step": 569662, "epoch": 6863} {"train_loss": -26.825407028198242, "global_step": 569663, "epoch": 6863} {"train_loss": -27.304487228393555, "global_step": 569664, "epoch": 6863} {"train_loss": -27.247421264648438, "global_step": 569665, "epoch": 6863} {"train_loss": -27.295490264892578, "global_step": 569666, "epoch": 6863} {"train_loss": -27.37220573425293, "global_step": 569667, "epoch": 6863} {"train_loss": -27.55718994140625, "global_step": 569668, "epoch": 6863} {"train_loss": -27.48333168029785, "global_step": 569669, "epoch": 6863} {"train_loss": -27.615589141845703, "global_step": 569670, "epoch": 6863} {"train_loss": -27.582212448120117, "global_step": 569671, "epoch": 6863} {"train_loss": -27.64827537536621, "global_step": 569672, "epoch": 6863} {"train_loss": -27.557483673095703, "global_step": 569673, "epoch": 6863} {"train_loss": -27.488056182861328, "global_step": 569674, "epoch": 6863} {"train_loss": -27.661518096923828, "global_step": 569675, "epoch": 6863} {"train_loss": -27.82183265686035, "global_step": 569676, "epoch": 6863} {"train_loss": -27.766315460205078, "global_step": 569677, "epoch": 6863} {"train_loss": -27.928064346313477, "global_step": 569678, "epoch": 6863} {"train_loss": -27.4155216217041, "global_step": 569679, "epoch": 6863} {"train_loss": -27.866788864135742, "global_step": 569680, "epoch": 6863} {"train_loss": -27.722686767578125, "global_step": 569681, "epoch": 6863} {"train_loss": -27.935653686523438, "global_step": 569682, "epoch": 6863} {"train_loss": -27.46036720275879, "global_step": 569683, "epoch": 6863} {"train_loss": -27.8985652923584, "global_step": 569684, "epoch": 6863} {"train_loss": -27.771169662475586, "global_step": 569685, "epoch": 6863} {"train_loss": -27.7517032623291, "global_step": 569686, "epoch": 6863} {"train_loss": -28.308786392211914, "global_step": 569687, "epoch": 6863} {"train_loss": -28.074865341186523, "global_step": 569688, "epoch": 6863} {"train_loss": -27.440153121948242, "global_step": 569689, "epoch": 6863} {"train_loss": -28.019428253173828, "global_step": 569690, "epoch": 6863} {"train_loss": -27.989044189453125, "global_step": 569691, "epoch": 6863} {"train_loss": -27.894729614257812, "global_step": 569692, "epoch": 6863} {"train_loss": -28.187732696533203, "global_step": 569693, "epoch": 6863} {"train_loss": -28.243688583374023, "global_step": 569694, "epoch": 6863} {"train_loss": -27.69220542907715, "global_step": 569695, "epoch": 6863} {"train_loss": -27.750873565673828, "global_step": 569696, "epoch": 6863} {"train_loss": -27.651830673217773, "global_step": 569697, "epoch": 6863} {"train_loss": -27.434667587280273, "global_step": 569698, "epoch": 6863} {"train_loss": -27.61029052734375, "global_step": 569699, "epoch": 6863} {"train_loss": -27.086669921875, "global_step": 569700, "epoch": 6863} {"train_loss": -27.44194984436035, "global_step": 569701, "epoch": 6863} {"train_loss": -27.326629638671875, "global_step": 569702, "epoch": 6863} {"train_loss": -27.946130752563477, "global_step": 569703, "epoch": 6863} {"train_loss": -27.3426513671875, "global_step": 569704, "epoch": 6863} {"train_loss": -27.444860458374023, "global_step": 569705, "epoch": 6863} {"train_loss": -27.572711944580078, "global_step": 569706, "epoch": 6863} {"train_loss": -27.555877685546875, "global_step": 569707, "epoch": 6863} {"train_loss": -27.6361026763916, "global_step": 569708, "epoch": 6863} {"train_loss": -27.68796157836914, "global_step": 569709, "epoch": 6863} {"train_loss": -27.83904457092285, "global_step": 569710, "epoch": 6863} {"train_loss": -26.987296460622765, "global_step": 569711, "epoch": 6863, "val_loss": 6672369.0} {"train_loss": -26.810718536376953, "global_step": 569712, "epoch": 6864} {"train_loss": -26.879968643188477, "global_step": 569713, "epoch": 6864} {"train_loss": -26.791278839111328, "global_step": 569714, "epoch": 6864} {"train_loss": -26.62607765197754, "global_step": 569715, "epoch": 6864} {"train_loss": -25.35881233215332, "global_step": 569716, "epoch": 6864} {"train_loss": -26.76336669921875, "global_step": 569717, "epoch": 6864} {"train_loss": -26.810922622680664, "global_step": 569718, "epoch": 6864} {"train_loss": -26.624847412109375, "global_step": 569719, "epoch": 6864} {"train_loss": -26.614501953125, "global_step": 569720, "epoch": 6864} {"train_loss": -26.929330825805664, "global_step": 569721, "epoch": 6864} {"train_loss": -27.0745792388916, "global_step": 569722, "epoch": 6864} {"train_loss": -27.35584831237793, "global_step": 569723, "epoch": 6864} {"train_loss": -27.197675704956055, "global_step": 569724, "epoch": 6864} {"train_loss": -27.045734405517578, "global_step": 569725, "epoch": 6864} {"train_loss": -27.60610008239746, "global_step": 569726, "epoch": 6864} {"train_loss": -27.092275619506836, "global_step": 569727, "epoch": 6864} {"train_loss": -27.314416885375977, "global_step": 569728, "epoch": 6864} {"train_loss": -27.2568359375, "global_step": 569729, "epoch": 6864} {"train_loss": -27.32539939880371, "global_step": 569730, "epoch": 6864} {"train_loss": -27.3388671875, "global_step": 569731, "epoch": 6864} {"train_loss": -27.512054443359375, "global_step": 569732, "epoch": 6864} {"train_loss": -27.736560821533203, "global_step": 569733, "epoch": 6864} {"train_loss": -27.484907150268555, "global_step": 569734, "epoch": 6864} {"train_loss": -27.527759552001953, "global_step": 569735, "epoch": 6864} {"train_loss": -27.501880645751953, "global_step": 569736, "epoch": 6864} {"train_loss": -27.669788360595703, "global_step": 569737, "epoch": 6864} {"train_loss": -27.475360870361328, "global_step": 569738, "epoch": 6864} {"train_loss": -27.77775001525879, "global_step": 569739, "epoch": 6864} {"train_loss": -27.787763595581055, "global_step": 569740, "epoch": 6864} {"train_loss": -27.710874557495117, "global_step": 569741, "epoch": 6864} {"train_loss": -27.82470703125, "global_step": 569742, "epoch": 6864} {"train_loss": -27.8585262298584, "global_step": 569743, "epoch": 6864} {"train_loss": -27.4423885345459, "global_step": 569744, "epoch": 6864} {"train_loss": -27.40949821472168, "global_step": 569745, "epoch": 6864} {"train_loss": -27.581018447875977, "global_step": 569746, "epoch": 6864} {"train_loss": -27.640676498413086, "global_step": 569747, "epoch": 6864} {"train_loss": -27.988601684570312, "global_step": 569748, "epoch": 6864} {"train_loss": -27.490924835205078, "global_step": 569749, "epoch": 6864} {"train_loss": -27.713455200195312, "global_step": 569750, "epoch": 6864} {"train_loss": -27.862415313720703, "global_step": 569751, "epoch": 6864} {"train_loss": -28.015241622924805, "global_step": 569752, "epoch": 6864} {"train_loss": -27.885574340820312, "global_step": 569753, "epoch": 6864} {"train_loss": -27.888031005859375, "global_step": 569754, "epoch": 6864} {"train_loss": -27.887073516845703, "global_step": 569755, "epoch": 6864} {"train_loss": -27.725332260131836, "global_step": 569756, "epoch": 6864} {"train_loss": -28.39740562438965, "global_step": 569757, "epoch": 6864} {"train_loss": -28.067468643188477, "global_step": 569758, "epoch": 6864} {"train_loss": -27.762908935546875, "global_step": 569759, "epoch": 6864} {"train_loss": -27.8090877532959, "global_step": 569760, "epoch": 6864} {"train_loss": -27.470783233642578, "global_step": 569761, "epoch": 6864} {"train_loss": -27.79949378967285, "global_step": 569762, "epoch": 6864} {"train_loss": -27.7375545501709, "global_step": 569763, "epoch": 6864} {"train_loss": -28.119571685791016, "global_step": 569764, "epoch": 6864} {"train_loss": -27.973968505859375, "global_step": 569765, "epoch": 6864} {"train_loss": -27.998083114624023, "global_step": 569766, "epoch": 6864} {"train_loss": -27.880430221557617, "global_step": 569767, "epoch": 6864} {"train_loss": -27.671354293823242, "global_step": 569768, "epoch": 6864} {"train_loss": -27.93611717224121, "global_step": 569769, "epoch": 6864} {"train_loss": -28.183176040649414, "global_step": 569770, "epoch": 6864} {"train_loss": -27.819528579711914, "global_step": 569771, "epoch": 6864} {"train_loss": -28.275440216064453, "global_step": 569772, "epoch": 6864} {"train_loss": -28.517154693603516, "global_step": 569773, "epoch": 6864} {"train_loss": -27.821569442749023, "global_step": 569774, "epoch": 6864} {"train_loss": -28.03346061706543, "global_step": 569775, "epoch": 6864} {"train_loss": -28.253681182861328, "global_step": 569776, "epoch": 6864} {"train_loss": -28.0958251953125, "global_step": 569777, "epoch": 6864} {"train_loss": -28.128326416015625, "global_step": 569778, "epoch": 6864} {"train_loss": -27.649784088134766, "global_step": 569779, "epoch": 6864} {"train_loss": -28.005889892578125, "global_step": 569780, "epoch": 6864} {"train_loss": -28.045862197875977, "global_step": 569781, "epoch": 6864} {"train_loss": -28.046613693237305, "global_step": 569782, "epoch": 6864} {"train_loss": -27.683929443359375, "global_step": 569783, "epoch": 6864} {"train_loss": -28.34078025817871, "global_step": 569784, "epoch": 6864} {"train_loss": -27.88252067565918, "global_step": 569785, "epoch": 6864} {"train_loss": -27.9732666015625, "global_step": 569786, "epoch": 6864} {"train_loss": -28.134489059448242, "global_step": 569787, "epoch": 6864} {"train_loss": -28.243295669555664, "global_step": 569788, "epoch": 6864} {"train_loss": -28.129663467407227, "global_step": 569789, "epoch": 6864} {"train_loss": -27.9244327545166, "global_step": 569790, "epoch": 6864} {"train_loss": -28.33112144470215, "global_step": 569791, "epoch": 6864} {"train_loss": -27.79829216003418, "global_step": 569792, "epoch": 6864} {"train_loss": -27.93460464477539, "global_step": 569793, "epoch": 6864} {"train_loss": -27.661554382508058, "global_step": 569794, "epoch": 6864, "val_loss": 6724926.0} {"train_loss": -26.991703033447266, "global_step": 569795, "epoch": 6865} {"train_loss": -27.272790908813477, "global_step": 569796, "epoch": 6865} {"train_loss": -27.7428035736084, "global_step": 569797, "epoch": 6865} {"train_loss": -26.992691040039062, "global_step": 569798, "epoch": 6865} {"train_loss": -26.778715133666992, "global_step": 569799, "epoch": 6865} {"train_loss": -26.776906967163086, "global_step": 569800, "epoch": 6865} {"train_loss": -27.569808959960938, "global_step": 569801, "epoch": 6865} {"train_loss": -27.1140193939209, "global_step": 569802, "epoch": 6865} {"train_loss": -27.146692276000977, "global_step": 569803, "epoch": 6865} {"train_loss": -27.412694931030273, "global_step": 569804, "epoch": 6865} {"train_loss": -27.220998764038086, "global_step": 569805, "epoch": 6865} {"train_loss": -27.528507232666016, "global_step": 569806, "epoch": 6865} {"train_loss": -27.23573875427246, "global_step": 569807, "epoch": 6865} {"train_loss": -27.321979522705078, "global_step": 569808, "epoch": 6865} {"train_loss": -27.103469848632812, "global_step": 569809, "epoch": 6865} {"train_loss": -27.51297378540039, "global_step": 569810, "epoch": 6865} {"train_loss": -27.3885498046875, "global_step": 569811, "epoch": 6865} {"train_loss": -27.49582290649414, "global_step": 569812, "epoch": 6865} {"train_loss": -27.756351470947266, "global_step": 569813, "epoch": 6865} {"train_loss": -27.541889190673828, "global_step": 569814, "epoch": 6865} {"train_loss": -27.536375045776367, "global_step": 569815, "epoch": 6865} {"train_loss": -27.995655059814453, "global_step": 569816, "epoch": 6865} {"train_loss": -27.7237491607666, "global_step": 569817, "epoch": 6865} {"train_loss": -27.58741569519043, "global_step": 569818, "epoch": 6865} {"train_loss": -27.717453002929688, "global_step": 569819, "epoch": 6865} {"train_loss": -27.411762237548828, "global_step": 569820, "epoch": 6865} {"train_loss": -27.223108291625977, "global_step": 569821, "epoch": 6865} {"train_loss": -27.952152252197266, "global_step": 569822, "epoch": 6865} {"train_loss": -28.08524513244629, "global_step": 569823, "epoch": 6865} {"train_loss": -27.561481475830078, "global_step": 569824, "epoch": 6865} {"train_loss": -27.849950790405273, "global_step": 569825, "epoch": 6865} {"train_loss": -27.407520294189453, "global_step": 569826, "epoch": 6865} {"train_loss": -27.496728897094727, "global_step": 569827, "epoch": 6865} {"train_loss": -27.42182731628418, "global_step": 569828, "epoch": 6865} {"train_loss": -27.653364181518555, "global_step": 569829, "epoch": 6865} {"train_loss": -27.496564865112305, "global_step": 569830, "epoch": 6865} {"train_loss": -27.78656005859375, "global_step": 569831, "epoch": 6865} {"train_loss": -27.48321533203125, "global_step": 569832, "epoch": 6865} {"train_loss": -28.064359664916992, "global_step": 569833, "epoch": 6865} {"train_loss": -27.51387596130371, "global_step": 569834, "epoch": 6865} {"train_loss": -28.09160804748535, "global_step": 569835, "epoch": 6865} {"train_loss": -27.662229537963867, "global_step": 569836, "epoch": 6865} {"train_loss": -27.83038902282715, "global_step": 569837, "epoch": 6865} {"train_loss": -27.727888107299805, "global_step": 569838, "epoch": 6865} {"train_loss": -27.925750732421875, "global_step": 569839, "epoch": 6865} {"train_loss": -27.89208984375, "global_step": 569840, "epoch": 6865} {"train_loss": -28.120336532592773, "global_step": 569841, "epoch": 6865} {"train_loss": -28.150732040405273, "global_step": 569842, "epoch": 6865} {"train_loss": -27.90864372253418, "global_step": 569843, "epoch": 6865} {"train_loss": -28.07380485534668, "global_step": 569844, "epoch": 6865} {"train_loss": -27.728652954101562, "global_step": 569845, "epoch": 6865} {"train_loss": -28.046432495117188, "global_step": 569846, "epoch": 6865} {"train_loss": -27.925046920776367, "global_step": 569847, "epoch": 6865} {"train_loss": -28.114471435546875, "global_step": 569848, "epoch": 6865} {"train_loss": -27.814306259155273, "global_step": 569849, "epoch": 6865} {"train_loss": -28.15789794921875, "global_step": 569850, "epoch": 6865} {"train_loss": -28.01785659790039, "global_step": 569851, "epoch": 6865} {"train_loss": -27.8659725189209, "global_step": 569852, "epoch": 6865} {"train_loss": -27.894519805908203, "global_step": 569853, "epoch": 6865} {"train_loss": -27.692584991455078, "global_step": 569854, "epoch": 6865} {"train_loss": -27.45619010925293, "global_step": 569855, "epoch": 6865} {"train_loss": -27.313583374023438, "global_step": 569856, "epoch": 6865} {"train_loss": -26.925745010375977, "global_step": 569857, "epoch": 6865} {"train_loss": -27.519018173217773, "global_step": 569858, "epoch": 6865} {"train_loss": -28.015827178955078, "global_step": 569859, "epoch": 6865} {"train_loss": -28.27686882019043, "global_step": 569860, "epoch": 6865} {"train_loss": -27.406494140625, "global_step": 569861, "epoch": 6865} {"train_loss": -27.301563262939453, "global_step": 569862, "epoch": 6865} {"train_loss": -27.813230514526367, "global_step": 569863, "epoch": 6865} {"train_loss": -27.950159072875977, "global_step": 569864, "epoch": 6865} {"train_loss": -27.584716796875, "global_step": 569865, "epoch": 6865} {"train_loss": -28.087987899780273, "global_step": 569866, "epoch": 6865} {"train_loss": -27.675397872924805, "global_step": 569867, "epoch": 6865} {"train_loss": -27.828510284423828, "global_step": 569868, "epoch": 6865} {"train_loss": -27.550466537475586, "global_step": 569869, "epoch": 6865} {"train_loss": -27.51602554321289, "global_step": 569870, "epoch": 6865} {"train_loss": -27.633813858032227, "global_step": 569871, "epoch": 6865} {"train_loss": -28.20601463317871, "global_step": 569872, "epoch": 6865} {"train_loss": -27.716968536376953, "global_step": 569873, "epoch": 6865} {"train_loss": -27.800647735595703, "global_step": 569874, "epoch": 6865} {"train_loss": -27.634048461914062, "global_step": 569875, "epoch": 6865} {"train_loss": -28.168664932250977, "global_step": 569876, "epoch": 6865} {"train_loss": -27.632651018809124, "global_step": 569877, "epoch": 6865, "val_loss": 6804013.0} {"train_loss": -27.50188636779785, "global_step": 569878, "epoch": 6866} {"train_loss": -27.765308380126953, "global_step": 569879, "epoch": 6866} {"train_loss": -27.7034912109375, "global_step": 569880, "epoch": 6866} {"train_loss": -27.590200424194336, "global_step": 569881, "epoch": 6866} {"train_loss": -27.37407875061035, "global_step": 569882, "epoch": 6866} {"train_loss": -27.848058700561523, "global_step": 569883, "epoch": 6866} {"train_loss": -27.843597412109375, "global_step": 569884, "epoch": 6866} {"train_loss": -27.34002685546875, "global_step": 569885, "epoch": 6866} {"train_loss": -27.793371200561523, "global_step": 569886, "epoch": 6866} {"train_loss": -27.612537384033203, "global_step": 569887, "epoch": 6866} {"train_loss": -27.84083366394043, "global_step": 569888, "epoch": 6866} {"train_loss": -28.02581787109375, "global_step": 569889, "epoch": 6866} {"train_loss": -27.481122970581055, "global_step": 569890, "epoch": 6866} {"train_loss": -27.221887588500977, "global_step": 569891, "epoch": 6866} {"train_loss": -27.36439323425293, "global_step": 569892, "epoch": 6866} {"train_loss": -27.446592330932617, "global_step": 569893, "epoch": 6866} {"train_loss": -27.381540298461914, "global_step": 569894, "epoch": 6866} {"train_loss": -27.7694149017334, "global_step": 569895, "epoch": 6866} {"train_loss": -27.567249298095703, "global_step": 569896, "epoch": 6866} {"train_loss": -27.876575469970703, "global_step": 569897, "epoch": 6866} {"train_loss": -27.84735679626465, "global_step": 569898, "epoch": 6866} {"train_loss": -27.218061447143555, "global_step": 569899, "epoch": 6866} {"train_loss": -27.976362228393555, "global_step": 569900, "epoch": 6866} {"train_loss": -27.707807540893555, "global_step": 569901, "epoch": 6866} {"train_loss": -27.28938102722168, "global_step": 569902, "epoch": 6866} {"train_loss": -27.57566261291504, "global_step": 569903, "epoch": 6866} {"train_loss": -27.695077896118164, "global_step": 569904, "epoch": 6866} {"train_loss": -27.6868839263916, "global_step": 569905, "epoch": 6866} {"train_loss": -28.004560470581055, "global_step": 569906, "epoch": 6866} {"train_loss": -27.9730224609375, "global_step": 569907, "epoch": 6866} {"train_loss": -27.689666748046875, "global_step": 569908, "epoch": 6866} {"train_loss": -27.727615356445312, "global_step": 569909, "epoch": 6866} {"train_loss": -27.964181900024414, "global_step": 569910, "epoch": 6866} {"train_loss": -27.75347328186035, "global_step": 569911, "epoch": 6866} {"train_loss": -27.509567260742188, "global_step": 569912, "epoch": 6866} {"train_loss": -27.653711318969727, "global_step": 569913, "epoch": 6866} {"train_loss": -28.1448974609375, "global_step": 569914, "epoch": 6866} {"train_loss": -28.076757431030273, "global_step": 569915, "epoch": 6866} {"train_loss": -27.76422691345215, "global_step": 569916, "epoch": 6866} {"train_loss": -28.2222843170166, "global_step": 569917, "epoch": 6866} {"train_loss": -27.618566513061523, "global_step": 569918, "epoch": 6866} {"train_loss": -27.970739364624023, "global_step": 569919, "epoch": 6866} {"train_loss": -27.875974655151367, "global_step": 569920, "epoch": 6866} {"train_loss": -27.786285400390625, "global_step": 569921, "epoch": 6866} {"train_loss": -27.928525924682617, "global_step": 569922, "epoch": 6866} {"train_loss": -27.81464195251465, "global_step": 569923, "epoch": 6866} {"train_loss": -27.850391387939453, "global_step": 569924, "epoch": 6866} {"train_loss": -27.71711540222168, "global_step": 569925, "epoch": 6866} {"train_loss": -27.79949951171875, "global_step": 569926, "epoch": 6866} {"train_loss": -27.689428329467773, "global_step": 569927, "epoch": 6866} {"train_loss": -27.8255672454834, "global_step": 569928, "epoch": 6866} {"train_loss": -27.9381046295166, "global_step": 569929, "epoch": 6866} {"train_loss": -27.735858917236328, "global_step": 569930, "epoch": 6866} {"train_loss": -27.75123405456543, "global_step": 569931, "epoch": 6866} {"train_loss": -27.800067901611328, "global_step": 569932, "epoch": 6866} {"train_loss": -27.82306480407715, "global_step": 569933, "epoch": 6866} {"train_loss": -27.91657829284668, "global_step": 569934, "epoch": 6866} {"train_loss": -28.19390296936035, "global_step": 569935, "epoch": 6866} {"train_loss": -27.822683334350586, "global_step": 569936, "epoch": 6866} {"train_loss": -28.076169967651367, "global_step": 569937, "epoch": 6866} {"train_loss": -27.951141357421875, "global_step": 569938, "epoch": 6866} {"train_loss": -28.16864013671875, "global_step": 569939, "epoch": 6866} {"train_loss": -28.112167358398438, "global_step": 569940, "epoch": 6866} {"train_loss": -28.102079391479492, "global_step": 569941, "epoch": 6866} {"train_loss": -27.741037368774414, "global_step": 569942, "epoch": 6866} {"train_loss": -27.55084800720215, "global_step": 569943, "epoch": 6866} {"train_loss": -27.8151912689209, "global_step": 569944, "epoch": 6866} {"train_loss": -27.167394638061523, "global_step": 569945, "epoch": 6866} {"train_loss": -27.401504516601562, "global_step": 569946, "epoch": 6866} {"train_loss": -28.317350387573242, "global_step": 569947, "epoch": 6866} {"train_loss": -28.059162139892578, "global_step": 569948, "epoch": 6866} {"train_loss": -28.1629695892334, "global_step": 569949, "epoch": 6866} {"train_loss": -28.061756134033203, "global_step": 569950, "epoch": 6866} {"train_loss": -28.064411163330078, "global_step": 569951, "epoch": 6866} {"train_loss": -28.101160049438477, "global_step": 569952, "epoch": 6866} {"train_loss": -28.036441802978516, "global_step": 569953, "epoch": 6866} {"train_loss": -27.825586318969727, "global_step": 569954, "epoch": 6866} {"train_loss": -28.11557388305664, "global_step": 569955, "epoch": 6866} {"train_loss": -27.46657371520996, "global_step": 569956, "epoch": 6866} {"train_loss": -27.917448043823242, "global_step": 569957, "epoch": 6866} {"train_loss": -27.977659225463867, "global_step": 569958, "epoch": 6866} {"train_loss": -28.085098266601562, "global_step": 569959, "epoch": 6866} {"train_loss": -27.799316659031145, "global_step": 569960, "epoch": 6866, "val_loss": 6677886.0} {"train_loss": -27.62372398376465, "global_step": 569961, "epoch": 6867} {"train_loss": -27.624317169189453, "global_step": 569962, "epoch": 6867} {"train_loss": -27.266706466674805, "global_step": 569963, "epoch": 6867} {"train_loss": -27.540557861328125, "global_step": 569964, "epoch": 6867} {"train_loss": -27.834522247314453, "global_step": 569965, "epoch": 6867} {"train_loss": -27.448532104492188, "global_step": 569966, "epoch": 6867} {"train_loss": -27.7227840423584, "global_step": 569967, "epoch": 6867} {"train_loss": -27.514020919799805, "global_step": 569968, "epoch": 6867} {"train_loss": -27.183643341064453, "global_step": 569969, "epoch": 6867} {"train_loss": -27.540058135986328, "global_step": 569970, "epoch": 6867} {"train_loss": -27.863126754760742, "global_step": 569971, "epoch": 6867} {"train_loss": -27.9158992767334, "global_step": 569972, "epoch": 6867} {"train_loss": -28.105728149414062, "global_step": 569973, "epoch": 6867} {"train_loss": -27.750844955444336, "global_step": 569974, "epoch": 6867} {"train_loss": -27.831928253173828, "global_step": 569975, "epoch": 6867} {"train_loss": -27.73761558532715, "global_step": 569976, "epoch": 6867} {"train_loss": -27.4058780670166, "global_step": 569977, "epoch": 6867} {"train_loss": -27.58255958557129, "global_step": 569978, "epoch": 6867} {"train_loss": -27.666549682617188, "global_step": 569979, "epoch": 6867} {"train_loss": -27.631153106689453, "global_step": 569980, "epoch": 6867} {"train_loss": -27.710739135742188, "global_step": 569981, "epoch": 6867} {"train_loss": -27.986541748046875, "global_step": 569982, "epoch": 6867} {"train_loss": -27.660181045532227, "global_step": 569983, "epoch": 6867} {"train_loss": -27.610855102539062, "global_step": 569984, "epoch": 6867} {"train_loss": -27.673730850219727, "global_step": 569985, "epoch": 6867} {"train_loss": -27.510883331298828, "global_step": 569986, "epoch": 6867} {"train_loss": -27.96656608581543, "global_step": 569987, "epoch": 6867} {"train_loss": -27.4742488861084, "global_step": 569988, "epoch": 6867} {"train_loss": -27.901273727416992, "global_step": 569989, "epoch": 6867} {"train_loss": -28.065744400024414, "global_step": 569990, "epoch": 6867} {"train_loss": -27.734283447265625, "global_step": 569991, "epoch": 6867} {"train_loss": -27.898269653320312, "global_step": 569992, "epoch": 6867} {"train_loss": -27.891651153564453, "global_step": 569993, "epoch": 6867} {"train_loss": -27.595319747924805, "global_step": 569994, "epoch": 6867} {"train_loss": -27.974706649780273, "global_step": 569995, "epoch": 6867} {"train_loss": -27.468961715698242, "global_step": 569996, "epoch": 6867} {"train_loss": -28.111190795898438, "global_step": 569997, "epoch": 6867} {"train_loss": -27.84967041015625, "global_step": 569998, "epoch": 6867} {"train_loss": -27.915485382080078, "global_step": 569999, "epoch": 6867} {"train_loss": -28.09012222290039, "global_step": 570000, "epoch": 6867} {"train_loss": -28.206308364868164, "global_step": 570001, "epoch": 6867} {"train_loss": -27.88629150390625, "global_step": 570002, "epoch": 6867} {"train_loss": -28.24347496032715, "global_step": 570003, "epoch": 6867} {"train_loss": -27.788076400756836, "global_step": 570004, "epoch": 6867} {"train_loss": -27.86887550354004, "global_step": 570005, "epoch": 6867} {"train_loss": -27.51954460144043, "global_step": 570006, "epoch": 6867} {"train_loss": -27.9666690826416, "global_step": 570007, "epoch": 6867} {"train_loss": -27.61127281188965, "global_step": 570008, "epoch": 6867} {"train_loss": -28.0274658203125, "global_step": 570009, "epoch": 6867} {"train_loss": -27.891040802001953, "global_step": 570010, "epoch": 6867} {"train_loss": -28.151086807250977, "global_step": 570011, "epoch": 6867} {"train_loss": -28.188312530517578, "global_step": 570012, "epoch": 6867} {"train_loss": -27.726551055908203, "global_step": 570013, "epoch": 6867} {"train_loss": -27.98121452331543, "global_step": 570014, "epoch": 6867} {"train_loss": -27.546875, "global_step": 570015, "epoch": 6867} {"train_loss": -27.944204330444336, "global_step": 570016, "epoch": 6867} {"train_loss": -28.000904083251953, "global_step": 570017, "epoch": 6867} {"train_loss": -27.69970703125, "global_step": 570018, "epoch": 6867} {"train_loss": -28.764699935913086, "global_step": 570019, "epoch": 6867} {"train_loss": -27.6508846282959, "global_step": 570020, "epoch": 6867} {"train_loss": -27.610021591186523, "global_step": 570021, "epoch": 6867} {"train_loss": -27.610898971557617, "global_step": 570022, "epoch": 6867} {"train_loss": -27.509302139282227, "global_step": 570023, "epoch": 6867} {"train_loss": -27.771076202392578, "global_step": 570024, "epoch": 6867} {"train_loss": -28.112775802612305, "global_step": 570025, "epoch": 6867} {"train_loss": -27.902002334594727, "global_step": 570026, "epoch": 6867} {"train_loss": -27.712072372436523, "global_step": 570027, "epoch": 6867} {"train_loss": -27.68607521057129, "global_step": 570028, "epoch": 6867} {"train_loss": -27.666259765625, "global_step": 570029, "epoch": 6867} {"train_loss": -27.69416618347168, "global_step": 570030, "epoch": 6867} {"train_loss": -27.752307891845703, "global_step": 570031, "epoch": 6867} {"train_loss": -27.955713272094727, "global_step": 570032, "epoch": 6867} {"train_loss": -27.440845489501953, "global_step": 570033, "epoch": 6867} {"train_loss": -28.33109474182129, "global_step": 570034, "epoch": 6867} {"train_loss": -28.190793991088867, "global_step": 570035, "epoch": 6867} {"train_loss": -28.34266471862793, "global_step": 570036, "epoch": 6867} {"train_loss": -28.012557983398438, "global_step": 570037, "epoch": 6867} {"train_loss": -28.284347534179688, "global_step": 570038, "epoch": 6867} {"train_loss": -28.111835479736328, "global_step": 570039, "epoch": 6867} {"train_loss": -27.774194717407227, "global_step": 570040, "epoch": 6867} {"train_loss": -27.667343139648438, "global_step": 570041, "epoch": 6867} {"train_loss": -28.180713653564453, "global_step": 570042, "epoch": 6867} {"train_loss": -27.8279307262007, "global_step": 570043, "epoch": 6867, "val_loss": 6689331.0} {"train_loss": -27.512409210205078, "global_step": 570044, "epoch": 6868} {"train_loss": -27.411176681518555, "global_step": 570045, "epoch": 6868} {"train_loss": -26.91224479675293, "global_step": 570046, "epoch": 6868} {"train_loss": -27.51835060119629, "global_step": 570047, "epoch": 6868} {"train_loss": -27.17548179626465, "global_step": 570048, "epoch": 6868} {"train_loss": -26.879199981689453, "global_step": 570049, "epoch": 6868} {"train_loss": -27.16158103942871, "global_step": 570050, "epoch": 6868} {"train_loss": -27.524892807006836, "global_step": 570051, "epoch": 6868} {"train_loss": -27.3531436920166, "global_step": 570052, "epoch": 6868} {"train_loss": -27.868789672851562, "global_step": 570053, "epoch": 6868} {"train_loss": -27.542104721069336, "global_step": 570054, "epoch": 6868} {"train_loss": -27.555194854736328, "global_step": 570055, "epoch": 6868} {"train_loss": -27.74920082092285, "global_step": 570056, "epoch": 6868} {"train_loss": -27.61212730407715, "global_step": 570057, "epoch": 6868} {"train_loss": -27.489282608032227, "global_step": 570058, "epoch": 6868} {"train_loss": -27.3925838470459, "global_step": 570059, "epoch": 6868} {"train_loss": -27.73175048828125, "global_step": 570060, "epoch": 6868} {"train_loss": -27.59808349609375, "global_step": 570061, "epoch": 6868} {"train_loss": -27.715930938720703, "global_step": 570062, "epoch": 6868} {"train_loss": -27.255346298217773, "global_step": 570063, "epoch": 6868} {"train_loss": -27.741180419921875, "global_step": 570064, "epoch": 6868} {"train_loss": -27.963605880737305, "global_step": 570065, "epoch": 6868} {"train_loss": -28.167804718017578, "global_step": 570066, "epoch": 6868} {"train_loss": -27.714780807495117, "global_step": 570067, "epoch": 6868} {"train_loss": -27.67336082458496, "global_step": 570068, "epoch": 6868} {"train_loss": -27.95802879333496, "global_step": 570069, "epoch": 6868} {"train_loss": -27.72682762145996, "global_step": 570070, "epoch": 6868} {"train_loss": -27.82254409790039, "global_step": 570071, "epoch": 6868} {"train_loss": -27.889251708984375, "global_step": 570072, "epoch": 6868} {"train_loss": -27.939477920532227, "global_step": 570073, "epoch": 6868} {"train_loss": -27.571277618408203, "global_step": 570074, "epoch": 6868} {"train_loss": -27.922704696655273, "global_step": 570075, "epoch": 6868} {"train_loss": -28.056198120117188, "global_step": 570076, "epoch": 6868} {"train_loss": -27.7364501953125, "global_step": 570077, "epoch": 6868} {"train_loss": -27.844213485717773, "global_step": 570078, "epoch": 6868} {"train_loss": -27.816980361938477, "global_step": 570079, "epoch": 6868} {"train_loss": -27.870563507080078, "global_step": 570080, "epoch": 6868} {"train_loss": -28.2010498046875, "global_step": 570081, "epoch": 6868} {"train_loss": -27.757892608642578, "global_step": 570082, "epoch": 6868} {"train_loss": -27.996509552001953, "global_step": 570083, "epoch": 6868} {"train_loss": -28.403034210205078, "global_step": 570084, "epoch": 6868} {"train_loss": -28.066267013549805, "global_step": 570085, "epoch": 6868} {"train_loss": -27.792877197265625, "global_step": 570086, "epoch": 6868} {"train_loss": -28.2674617767334, "global_step": 570087, "epoch": 6868} {"train_loss": -28.033132553100586, "global_step": 570088, "epoch": 6868} {"train_loss": -27.9677791595459, "global_step": 570089, "epoch": 6868} {"train_loss": -28.08857536315918, "global_step": 570090, "epoch": 6868} {"train_loss": -27.875885009765625, "global_step": 570091, "epoch": 6868} {"train_loss": -27.537336349487305, "global_step": 570092, "epoch": 6868} {"train_loss": -28.139013290405273, "global_step": 570093, "epoch": 6868} {"train_loss": -27.869583129882812, "global_step": 570094, "epoch": 6868} {"train_loss": -28.12788200378418, "global_step": 570095, "epoch": 6868} {"train_loss": -27.999561309814453, "global_step": 570096, "epoch": 6868} {"train_loss": -28.27008056640625, "global_step": 570097, "epoch": 6868} {"train_loss": -27.559507369995117, "global_step": 570098, "epoch": 6868} {"train_loss": -27.864410400390625, "global_step": 570099, "epoch": 6868} {"train_loss": -27.88661003112793, "global_step": 570100, "epoch": 6868} {"train_loss": -28.015003204345703, "global_step": 570101, "epoch": 6868} {"train_loss": -28.0327205657959, "global_step": 570102, "epoch": 6868} {"train_loss": -27.602005004882812, "global_step": 570103, "epoch": 6868} {"train_loss": -27.96272850036621, "global_step": 570104, "epoch": 6868} {"train_loss": -27.77507972717285, "global_step": 570105, "epoch": 6868} {"train_loss": -28.0941162109375, "global_step": 570106, "epoch": 6868} {"train_loss": -27.72136878967285, "global_step": 570107, "epoch": 6868} {"train_loss": -27.605627059936523, "global_step": 570108, "epoch": 6868} {"train_loss": -27.56682777404785, "global_step": 570109, "epoch": 6868} {"train_loss": -27.29736328125, "global_step": 570110, "epoch": 6868} {"train_loss": -27.24146842956543, "global_step": 570111, "epoch": 6868} {"train_loss": -27.92578125, "global_step": 570112, "epoch": 6868} {"train_loss": -27.792224884033203, "global_step": 570113, "epoch": 6868} {"train_loss": -27.849660873413086, "global_step": 570114, "epoch": 6868} {"train_loss": -27.6878662109375, "global_step": 570115, "epoch": 6868} {"train_loss": -27.65005874633789, "global_step": 570116, "epoch": 6868} {"train_loss": -27.889612197875977, "global_step": 570117, "epoch": 6868} {"train_loss": -28.236774444580078, "global_step": 570118, "epoch": 6868} {"train_loss": -27.918045043945312, "global_step": 570119, "epoch": 6868} {"train_loss": -27.834985733032227, "global_step": 570120, "epoch": 6868} {"train_loss": -27.807388305664062, "global_step": 570121, "epoch": 6868} {"train_loss": -27.960241317749023, "global_step": 570122, "epoch": 6868} {"train_loss": -27.593524932861328, "global_step": 570123, "epoch": 6868} {"train_loss": -26.935791015625, "global_step": 570124, "epoch": 6868} {"train_loss": -26.33721351623535, "global_step": 570125, "epoch": 6868} {"train_loss": -27.737029477774378, "global_step": 570126, "epoch": 6868, "val_loss": 6673876.0} {"train_loss": -26.455183029174805, "global_step": 570127, "epoch": 6869} {"train_loss": -25.54047203063965, "global_step": 570128, "epoch": 6869} {"train_loss": -25.688079833984375, "global_step": 570129, "epoch": 6869} {"train_loss": -26.26055335998535, "global_step": 570130, "epoch": 6869} {"train_loss": -25.80523681640625, "global_step": 570131, "epoch": 6869} {"train_loss": -26.91605567932129, "global_step": 570132, "epoch": 6869} {"train_loss": -25.661767959594727, "global_step": 570133, "epoch": 6869} {"train_loss": -26.789194107055664, "global_step": 570134, "epoch": 6869} {"train_loss": -26.631244659423828, "global_step": 570135, "epoch": 6869} {"train_loss": -27.058948516845703, "global_step": 570136, "epoch": 6869} {"train_loss": -26.64828872680664, "global_step": 570137, "epoch": 6869} {"train_loss": -26.88427734375, "global_step": 570138, "epoch": 6869} {"train_loss": -26.741790771484375, "global_step": 570139, "epoch": 6869} {"train_loss": -27.344568252563477, "global_step": 570140, "epoch": 6869} {"train_loss": -27.032733917236328, "global_step": 570141, "epoch": 6869} {"train_loss": -26.726099014282227, "global_step": 570142, "epoch": 6869} {"train_loss": -27.5859375, "global_step": 570143, "epoch": 6869} {"train_loss": -26.71616554260254, "global_step": 570144, "epoch": 6869} {"train_loss": -27.389204025268555, "global_step": 570145, "epoch": 6869} {"train_loss": -26.94646644592285, "global_step": 570146, "epoch": 6869} {"train_loss": -27.226709365844727, "global_step": 570147, "epoch": 6869} {"train_loss": -27.25116539001465, "global_step": 570148, "epoch": 6869} {"train_loss": -26.718555450439453, "global_step": 570149, "epoch": 6869} {"train_loss": -27.4924259185791, "global_step": 570150, "epoch": 6869} {"train_loss": -27.061643600463867, "global_step": 570151, "epoch": 6869} {"train_loss": -27.549182891845703, "global_step": 570152, "epoch": 6869} {"train_loss": -27.74920082092285, "global_step": 570153, "epoch": 6869} {"train_loss": -27.645254135131836, "global_step": 570154, "epoch": 6869} {"train_loss": -27.143280029296875, "global_step": 570155, "epoch": 6869} {"train_loss": -27.567581176757812, "global_step": 570156, "epoch": 6869} {"train_loss": -27.3160343170166, "global_step": 570157, "epoch": 6869} {"train_loss": -27.5332088470459, "global_step": 570158, "epoch": 6869} {"train_loss": -27.6494197845459, "global_step": 570159, "epoch": 6869} {"train_loss": -27.799535751342773, "global_step": 570160, "epoch": 6869} {"train_loss": -27.628759384155273, "global_step": 570161, "epoch": 6869} {"train_loss": -27.7574462890625, "global_step": 570162, "epoch": 6869} {"train_loss": -27.73324966430664, "global_step": 570163, "epoch": 6869} {"train_loss": -27.902973175048828, "global_step": 570164, "epoch": 6869} {"train_loss": -27.9612979888916, "global_step": 570165, "epoch": 6869} {"train_loss": -27.86151695251465, "global_step": 570166, "epoch": 6869} {"train_loss": -27.827686309814453, "global_step": 570167, "epoch": 6869} {"train_loss": -27.2633113861084, "global_step": 570168, "epoch": 6869} {"train_loss": -27.669885635375977, "global_step": 570169, "epoch": 6869} {"train_loss": -27.64544677734375, "global_step": 570170, "epoch": 6869} {"train_loss": -27.91375732421875, "global_step": 570171, "epoch": 6869} {"train_loss": -27.80950355529785, "global_step": 570172, "epoch": 6869} {"train_loss": -27.72525405883789, "global_step": 570173, "epoch": 6869} {"train_loss": -27.59101676940918, "global_step": 570174, "epoch": 6869} {"train_loss": -27.896772384643555, "global_step": 570175, "epoch": 6869} {"train_loss": -28.01630210876465, "global_step": 570176, "epoch": 6869} {"train_loss": -28.048200607299805, "global_step": 570177, "epoch": 6869} {"train_loss": -28.199071884155273, "global_step": 570178, "epoch": 6869} {"train_loss": -27.751306533813477, "global_step": 570179, "epoch": 6869} {"train_loss": -27.90216636657715, "global_step": 570180, "epoch": 6869} {"train_loss": -27.856739044189453, "global_step": 570181, "epoch": 6869} {"train_loss": -27.843969345092773, "global_step": 570182, "epoch": 6869} {"train_loss": -27.88642692565918, "global_step": 570183, "epoch": 6869} {"train_loss": -28.022705078125, "global_step": 570184, "epoch": 6869} {"train_loss": -27.983945846557617, "global_step": 570185, "epoch": 6869} {"train_loss": -27.826154708862305, "global_step": 570186, "epoch": 6869} {"train_loss": -28.183008193969727, "global_step": 570187, "epoch": 6869} {"train_loss": -27.90968132019043, "global_step": 570188, "epoch": 6869} {"train_loss": -27.92669105529785, "global_step": 570189, "epoch": 6869} {"train_loss": -27.911426544189453, "global_step": 570190, "epoch": 6869} {"train_loss": -28.585866928100586, "global_step": 570191, "epoch": 6869} {"train_loss": -27.83160400390625, "global_step": 570192, "epoch": 6869} {"train_loss": -27.537952423095703, "global_step": 570193, "epoch": 6869} {"train_loss": -27.493520736694336, "global_step": 570194, "epoch": 6869} {"train_loss": -27.672727584838867, "global_step": 570195, "epoch": 6869} {"train_loss": -27.924427032470703, "global_step": 570196, "epoch": 6869} {"train_loss": -28.247161865234375, "global_step": 570197, "epoch": 6869} {"train_loss": -28.17096519470215, "global_step": 570198, "epoch": 6869} {"train_loss": -27.83698081970215, "global_step": 570199, "epoch": 6869} {"train_loss": -28.282312393188477, "global_step": 570200, "epoch": 6869} {"train_loss": -28.074499130249023, "global_step": 570201, "epoch": 6869} {"train_loss": -27.99248695373535, "global_step": 570202, "epoch": 6869} {"train_loss": -27.66627311706543, "global_step": 570203, "epoch": 6869} {"train_loss": -27.747156143188477, "global_step": 570204, "epoch": 6869} {"train_loss": -27.806629180908203, "global_step": 570205, "epoch": 6869} {"train_loss": -27.64324378967285, "global_step": 570206, "epoch": 6869} {"train_loss": -27.874713897705078, "global_step": 570207, "epoch": 6869} {"train_loss": -28.058822631835938, "global_step": 570208, "epoch": 6869} {"train_loss": -27.484298568174065, "global_step": 570209, "epoch": 6869, "val_loss": 6760065.0} {"train_loss": -26.949512481689453, "global_step": 570210, "epoch": 6870} {"train_loss": -26.883832931518555, "global_step": 570211, "epoch": 6870} {"train_loss": -27.022571563720703, "global_step": 570212, "epoch": 6870} {"train_loss": -26.558624267578125, "global_step": 570213, "epoch": 6870} {"train_loss": -27.618072509765625, "global_step": 570214, "epoch": 6870} {"train_loss": -27.147464752197266, "global_step": 570215, "epoch": 6870} {"train_loss": -26.977005004882812, "global_step": 570216, "epoch": 6870} {"train_loss": -26.91535758972168, "global_step": 570217, "epoch": 6870} {"train_loss": -27.430646896362305, "global_step": 570218, "epoch": 6870} {"train_loss": -27.587011337280273, "global_step": 570219, "epoch": 6870} {"train_loss": -27.401996612548828, "global_step": 570220, "epoch": 6870} {"train_loss": -27.683719635009766, "global_step": 570221, "epoch": 6870} {"train_loss": -27.2332706451416, "global_step": 570222, "epoch": 6870} {"train_loss": -27.312152862548828, "global_step": 570223, "epoch": 6870} {"train_loss": -27.380273818969727, "global_step": 570224, "epoch": 6870} {"train_loss": -27.347990036010742, "global_step": 570225, "epoch": 6870} {"train_loss": -27.12639808654785, "global_step": 570226, "epoch": 6870} {"train_loss": -27.657705307006836, "global_step": 570227, "epoch": 6870} {"train_loss": -27.05264663696289, "global_step": 570228, "epoch": 6870} {"train_loss": -27.4105224609375, "global_step": 570229, "epoch": 6870} {"train_loss": -27.992889404296875, "global_step": 570230, "epoch": 6870} {"train_loss": -27.6826229095459, "global_step": 570231, "epoch": 6870} {"train_loss": -27.606372833251953, "global_step": 570232, "epoch": 6870} {"train_loss": -27.37745475769043, "global_step": 570233, "epoch": 6870} {"train_loss": -28.01263427734375, "global_step": 570234, "epoch": 6870} {"train_loss": -27.62238121032715, "global_step": 570235, "epoch": 6870} {"train_loss": -27.732202529907227, "global_step": 570236, "epoch": 6870} {"train_loss": -27.68726921081543, "global_step": 570237, "epoch": 6870} {"train_loss": -27.797779083251953, "global_step": 570238, "epoch": 6870} {"train_loss": -28.119699478149414, "global_step": 570239, "epoch": 6870} {"train_loss": -27.667510986328125, "global_step": 570240, "epoch": 6870} {"train_loss": -28.019729614257812, "global_step": 570241, "epoch": 6870} {"train_loss": -27.95301628112793, "global_step": 570242, "epoch": 6870} {"train_loss": -27.638925552368164, "global_step": 570243, "epoch": 6870} {"train_loss": -27.645864486694336, "global_step": 570244, "epoch": 6870} {"train_loss": -27.950138092041016, "global_step": 570245, "epoch": 6870} {"train_loss": -27.71441650390625, "global_step": 570246, "epoch": 6870} {"train_loss": -27.971784591674805, "global_step": 570247, "epoch": 6870} {"train_loss": -27.7565860748291, "global_step": 570248, "epoch": 6870} {"train_loss": -27.951520919799805, "global_step": 570249, "epoch": 6870} {"train_loss": -27.897375106811523, "global_step": 570250, "epoch": 6870} {"train_loss": -27.580480575561523, "global_step": 570251, "epoch": 6870} {"train_loss": -27.807294845581055, "global_step": 570252, "epoch": 6870} {"train_loss": -27.69839859008789, "global_step": 570253, "epoch": 6870} {"train_loss": -28.076154708862305, "global_step": 570254, "epoch": 6870} {"train_loss": -27.997766494750977, "global_step": 570255, "epoch": 6870} {"train_loss": -27.62293815612793, "global_step": 570256, "epoch": 6870} {"train_loss": -27.629796981811523, "global_step": 570257, "epoch": 6870} {"train_loss": -28.021656036376953, "global_step": 570258, "epoch": 6870} {"train_loss": -27.732763290405273, "global_step": 570259, "epoch": 6870} {"train_loss": -27.94647216796875, "global_step": 570260, "epoch": 6870} {"train_loss": -27.91548728942871, "global_step": 570261, "epoch": 6870} {"train_loss": -27.67140769958496, "global_step": 570262, "epoch": 6870} {"train_loss": -27.662494659423828, "global_step": 570263, "epoch": 6870} {"train_loss": -27.8164119720459, "global_step": 570264, "epoch": 6870} {"train_loss": -27.93805503845215, "global_step": 570265, "epoch": 6870} {"train_loss": -27.964990615844727, "global_step": 570266, "epoch": 6870} {"train_loss": -27.615161895751953, "global_step": 570267, "epoch": 6870} {"train_loss": -27.8082218170166, "global_step": 570268, "epoch": 6870} {"train_loss": -28.0897159576416, "global_step": 570269, "epoch": 6870} {"train_loss": -27.714496612548828, "global_step": 570270, "epoch": 6870} {"train_loss": -28.107959747314453, "global_step": 570271, "epoch": 6870} {"train_loss": -27.66678237915039, "global_step": 570272, "epoch": 6870} {"train_loss": -27.537973403930664, "global_step": 570273, "epoch": 6870} {"train_loss": -27.831623077392578, "global_step": 570274, "epoch": 6870} {"train_loss": -27.961706161499023, "global_step": 570275, "epoch": 6870} {"train_loss": -27.88678550720215, "global_step": 570276, "epoch": 6870} {"train_loss": -28.018091201782227, "global_step": 570277, "epoch": 6870} {"train_loss": -27.980459213256836, "global_step": 570278, "epoch": 6870} {"train_loss": -28.15654945373535, "global_step": 570279, "epoch": 6870} {"train_loss": -27.659780502319336, "global_step": 570280, "epoch": 6870} {"train_loss": -27.87495231628418, "global_step": 570281, "epoch": 6870} {"train_loss": -27.726415634155273, "global_step": 570282, "epoch": 6870} {"train_loss": -27.565393447875977, "global_step": 570283, "epoch": 6870} {"train_loss": -27.8797664642334, "global_step": 570284, "epoch": 6870} {"train_loss": -27.810644149780273, "global_step": 570285, "epoch": 6870} {"train_loss": -27.925750732421875, "global_step": 570286, "epoch": 6870} {"train_loss": -28.198394775390625, "global_step": 570287, "epoch": 6870} {"train_loss": -27.7960205078125, "global_step": 570288, "epoch": 6870} {"train_loss": -27.829267501831055, "global_step": 570289, "epoch": 6870} {"train_loss": -27.941181182861328, "global_step": 570290, "epoch": 6870} {"train_loss": -28.00248146057129, "global_step": 570291, "epoch": 6870} {"train_loss": -27.69777242821383, "global_step": 570292, "epoch": 6870, "val_loss": 6501369.0} {"train_loss": -27.180883407592773, "global_step": 570293, "epoch": 6871} {"train_loss": -27.11956214904785, "global_step": 570294, "epoch": 6871} {"train_loss": -27.16719627380371, "global_step": 570295, "epoch": 6871} {"train_loss": -27.130868911743164, "global_step": 570296, "epoch": 6871} {"train_loss": -27.05682945251465, "global_step": 570297, "epoch": 6871} {"train_loss": -27.219953536987305, "global_step": 570298, "epoch": 6871} {"train_loss": -27.24293327331543, "global_step": 570299, "epoch": 6871} {"train_loss": -26.915998458862305, "global_step": 570300, "epoch": 6871} {"train_loss": -27.189411163330078, "global_step": 570301, "epoch": 6871} {"train_loss": -27.17083740234375, "global_step": 570302, "epoch": 6871} {"train_loss": -27.1644287109375, "global_step": 570303, "epoch": 6871} {"train_loss": -27.051923751831055, "global_step": 570304, "epoch": 6871} {"train_loss": -27.126754760742188, "global_step": 570305, "epoch": 6871} {"train_loss": -27.315954208374023, "global_step": 570306, "epoch": 6871} {"train_loss": -27.3884334564209, "global_step": 570307, "epoch": 6871} {"train_loss": -26.968061447143555, "global_step": 570308, "epoch": 6871} {"train_loss": -27.64459228515625, "global_step": 570309, "epoch": 6871} {"train_loss": -27.367197036743164, "global_step": 570310, "epoch": 6871} {"train_loss": -27.4815616607666, "global_step": 570311, "epoch": 6871} {"train_loss": -26.99358558654785, "global_step": 570312, "epoch": 6871} {"train_loss": -27.969165802001953, "global_step": 570313, "epoch": 6871} {"train_loss": -27.472448348999023, "global_step": 570314, "epoch": 6871} {"train_loss": -27.6402587890625, "global_step": 570315, "epoch": 6871} {"train_loss": -27.361867904663086, "global_step": 570316, "epoch": 6871} {"train_loss": -27.243921279907227, "global_step": 570317, "epoch": 6871} {"train_loss": -27.600574493408203, "global_step": 570318, "epoch": 6871} {"train_loss": -27.57632827758789, "global_step": 570319, "epoch": 6871} {"train_loss": -27.690631866455078, "global_step": 570320, "epoch": 6871} {"train_loss": -27.90140724182129, "global_step": 570321, "epoch": 6871} {"train_loss": -27.9788818359375, "global_step": 570322, "epoch": 6871} {"train_loss": -27.6629638671875, "global_step": 570323, "epoch": 6871} {"train_loss": -27.76749038696289, "global_step": 570324, "epoch": 6871} {"train_loss": -27.461475372314453, "global_step": 570325, "epoch": 6871} {"train_loss": -27.93023681640625, "global_step": 570326, "epoch": 6871} {"train_loss": -27.91548728942871, "global_step": 570327, "epoch": 6871} {"train_loss": -27.903884887695312, "global_step": 570328, "epoch": 6871} {"train_loss": -27.88389015197754, "global_step": 570329, "epoch": 6871} {"train_loss": -27.642866134643555, "global_step": 570330, "epoch": 6871} {"train_loss": -27.94331169128418, "global_step": 570331, "epoch": 6871} {"train_loss": -27.851490020751953, "global_step": 570332, "epoch": 6871} {"train_loss": -27.828567504882812, "global_step": 570333, "epoch": 6871} {"train_loss": -27.697961807250977, "global_step": 570334, "epoch": 6871} {"train_loss": -28.06831169128418, "global_step": 570335, "epoch": 6871} {"train_loss": -28.18198013305664, "global_step": 570336, "epoch": 6871} {"train_loss": -28.1116943359375, "global_step": 570337, "epoch": 6871} {"train_loss": -28.139923095703125, "global_step": 570338, "epoch": 6871} {"train_loss": -27.546875, "global_step": 570339, "epoch": 6871} {"train_loss": -27.804487228393555, "global_step": 570340, "epoch": 6871} {"train_loss": -27.912195205688477, "global_step": 570341, "epoch": 6871} {"train_loss": -28.038848876953125, "global_step": 570342, "epoch": 6871} {"train_loss": -28.23154067993164, "global_step": 570343, "epoch": 6871} {"train_loss": -28.020421981811523, "global_step": 570344, "epoch": 6871} {"train_loss": -27.8679256439209, "global_step": 570345, "epoch": 6871} {"train_loss": -27.955184936523438, "global_step": 570346, "epoch": 6871} {"train_loss": -27.934036254882812, "global_step": 570347, "epoch": 6871} {"train_loss": -28.23042106628418, "global_step": 570348, "epoch": 6871} {"train_loss": -27.931869506835938, "global_step": 570349, "epoch": 6871} {"train_loss": -27.68671989440918, "global_step": 570350, "epoch": 6871} {"train_loss": -27.6805477142334, "global_step": 570351, "epoch": 6871} {"train_loss": -27.715087890625, "global_step": 570352, "epoch": 6871} {"train_loss": -27.854719161987305, "global_step": 570353, "epoch": 6871} {"train_loss": -28.040725708007812, "global_step": 570354, "epoch": 6871} {"train_loss": -27.508747100830078, "global_step": 570355, "epoch": 6871} {"train_loss": -27.632715225219727, "global_step": 570356, "epoch": 6871} {"train_loss": -27.4561710357666, "global_step": 570357, "epoch": 6871} {"train_loss": -27.672616958618164, "global_step": 570358, "epoch": 6871} {"train_loss": -28.25531005859375, "global_step": 570359, "epoch": 6871} {"train_loss": -27.86761474609375, "global_step": 570360, "epoch": 6871} {"train_loss": -27.775711059570312, "global_step": 570361, "epoch": 6871} {"train_loss": -28.046857833862305, "global_step": 570362, "epoch": 6871} {"train_loss": -28.014745712280273, "global_step": 570363, "epoch": 6871} {"train_loss": -27.809051513671875, "global_step": 570364, "epoch": 6871} {"train_loss": -28.181171417236328, "global_step": 570365, "epoch": 6871} {"train_loss": -27.747434616088867, "global_step": 570366, "epoch": 6871} {"train_loss": -27.723859786987305, "global_step": 570367, "epoch": 6871} {"train_loss": -27.833654403686523, "global_step": 570368, "epoch": 6871} {"train_loss": -27.7196044921875, "global_step": 570369, "epoch": 6871} {"train_loss": -27.93536376953125, "global_step": 570370, "epoch": 6871} {"train_loss": -27.720767974853516, "global_step": 570371, "epoch": 6871} {"train_loss": -27.939422607421875, "global_step": 570372, "epoch": 6871} {"train_loss": -27.80403709411621, "global_step": 570373, "epoch": 6871} {"train_loss": -27.850255966186523, "global_step": 570374, "epoch": 6871} {"train_loss": -27.662537057715728, "global_step": 570375, "epoch": 6871, "val_loss": 6565572.0} {"train_loss": -26.865049362182617, "global_step": 570376, "epoch": 6872} {"train_loss": -25.99655532836914, "global_step": 570377, "epoch": 6872} {"train_loss": -27.28717041015625, "global_step": 570378, "epoch": 6872} {"train_loss": -26.949857711791992, "global_step": 570379, "epoch": 6872} {"train_loss": -26.7755184173584, "global_step": 570380, "epoch": 6872} {"train_loss": -26.932214736938477, "global_step": 570381, "epoch": 6872} {"train_loss": -27.08489418029785, "global_step": 570382, "epoch": 6872} {"train_loss": -26.924829483032227, "global_step": 570383, "epoch": 6872} {"train_loss": -26.99560546875, "global_step": 570384, "epoch": 6872} {"train_loss": -27.4299373626709, "global_step": 570385, "epoch": 6872} {"train_loss": -27.478595733642578, "global_step": 570386, "epoch": 6872} {"train_loss": -27.322174072265625, "global_step": 570387, "epoch": 6872} {"train_loss": -27.196868896484375, "global_step": 570388, "epoch": 6872} {"train_loss": -27.264020919799805, "global_step": 570389, "epoch": 6872} {"train_loss": -27.31916618347168, "global_step": 570390, "epoch": 6872} {"train_loss": -27.402084350585938, "global_step": 570391, "epoch": 6872} {"train_loss": -27.184040069580078, "global_step": 570392, "epoch": 6872} {"train_loss": -27.62415885925293, "global_step": 570393, "epoch": 6872} {"train_loss": -27.47905921936035, "global_step": 570394, "epoch": 6872} {"train_loss": -27.86769676208496, "global_step": 570395, "epoch": 6872} {"train_loss": -27.06937026977539, "global_step": 570396, "epoch": 6872} {"train_loss": -27.486347198486328, "global_step": 570397, "epoch": 6872} {"train_loss": -27.853879928588867, "global_step": 570398, "epoch": 6872} {"train_loss": -27.731412887573242, "global_step": 570399, "epoch": 6872} {"train_loss": -27.995441436767578, "global_step": 570400, "epoch": 6872} {"train_loss": -27.8129940032959, "global_step": 570401, "epoch": 6872} {"train_loss": -27.973285675048828, "global_step": 570402, "epoch": 6872} {"train_loss": -27.8883113861084, "global_step": 570403, "epoch": 6872} {"train_loss": -27.849597930908203, "global_step": 570404, "epoch": 6872} {"train_loss": -27.65106773376465, "global_step": 570405, "epoch": 6872} {"train_loss": -27.826431274414062, "global_step": 570406, "epoch": 6872} {"train_loss": -27.622365951538086, "global_step": 570407, "epoch": 6872} {"train_loss": -27.668842315673828, "global_step": 570408, "epoch": 6872} {"train_loss": -27.99159049987793, "global_step": 570409, "epoch": 6872} {"train_loss": -27.908710479736328, "global_step": 570410, "epoch": 6872} {"train_loss": -28.372119903564453, "global_step": 570411, "epoch": 6872} {"train_loss": -27.73944664001465, "global_step": 570412, "epoch": 6872} {"train_loss": -28.11336326599121, "global_step": 570413, "epoch": 6872} {"train_loss": -27.872785568237305, "global_step": 570414, "epoch": 6872} {"train_loss": -28.183063507080078, "global_step": 570415, "epoch": 6872} {"train_loss": -28.47865104675293, "global_step": 570416, "epoch": 6872} {"train_loss": -27.769367218017578, "global_step": 570417, "epoch": 6872} {"train_loss": -27.712692260742188, "global_step": 570418, "epoch": 6872} {"train_loss": -27.982990264892578, "global_step": 570419, "epoch": 6872} {"train_loss": -27.640899658203125, "global_step": 570420, "epoch": 6872} {"train_loss": -27.63130760192871, "global_step": 570421, "epoch": 6872} {"train_loss": -27.760211944580078, "global_step": 570422, "epoch": 6872} {"train_loss": -27.768035888671875, "global_step": 570423, "epoch": 6872} {"train_loss": -27.74517250061035, "global_step": 570424, "epoch": 6872} {"train_loss": -27.950912475585938, "global_step": 570425, "epoch": 6872} {"train_loss": -27.985321044921875, "global_step": 570426, "epoch": 6872} {"train_loss": -27.6563663482666, "global_step": 570427, "epoch": 6872} {"train_loss": -27.8583927154541, "global_step": 570428, "epoch": 6872} {"train_loss": -27.581226348876953, "global_step": 570429, "epoch": 6872} {"train_loss": -28.000669479370117, "global_step": 570430, "epoch": 6872} {"train_loss": -27.938720703125, "global_step": 570431, "epoch": 6872} {"train_loss": -28.089414596557617, "global_step": 570432, "epoch": 6872} {"train_loss": -27.848737716674805, "global_step": 570433, "epoch": 6872} {"train_loss": -27.56243324279785, "global_step": 570434, "epoch": 6872} {"train_loss": -28.13568115234375, "global_step": 570435, "epoch": 6872} {"train_loss": -27.69504165649414, "global_step": 570436, "epoch": 6872} {"train_loss": -27.529218673706055, "global_step": 570437, "epoch": 6872} {"train_loss": -27.88306999206543, "global_step": 570438, "epoch": 6872} {"train_loss": -27.94513511657715, "global_step": 570439, "epoch": 6872} {"train_loss": -27.762195587158203, "global_step": 570440, "epoch": 6872} {"train_loss": -27.937610626220703, "global_step": 570441, "epoch": 6872} {"train_loss": -27.759275436401367, "global_step": 570442, "epoch": 6872} {"train_loss": -27.88031005859375, "global_step": 570443, "epoch": 6872} {"train_loss": -28.004108428955078, "global_step": 570444, "epoch": 6872} {"train_loss": -28.001800537109375, "global_step": 570445, "epoch": 6872} {"train_loss": -27.80927085876465, "global_step": 570446, "epoch": 6872} {"train_loss": -27.47150993347168, "global_step": 570447, "epoch": 6872} {"train_loss": -27.54091453552246, "global_step": 570448, "epoch": 6872} {"train_loss": -27.87131118774414, "global_step": 570449, "epoch": 6872} {"train_loss": -28.03720474243164, "global_step": 570450, "epoch": 6872} {"train_loss": -27.5195255279541, "global_step": 570451, "epoch": 6872} {"train_loss": -27.5976619720459, "global_step": 570452, "epoch": 6872} {"train_loss": -27.863317489624023, "global_step": 570453, "epoch": 6872} {"train_loss": -27.52357292175293, "global_step": 570454, "epoch": 6872} {"train_loss": -27.386554718017578, "global_step": 570455, "epoch": 6872} {"train_loss": -27.845691680908203, "global_step": 570456, "epoch": 6872} {"train_loss": -27.964874267578125, "global_step": 570457, "epoch": 6872} {"train_loss": -27.663301261074572, "global_step": 570458, "epoch": 6872, "val_loss": 6554015.0} {"train_loss": -27.247770309448242, "global_step": 570459, "epoch": 6873} {"train_loss": -25.948139190673828, "global_step": 570460, "epoch": 6873} {"train_loss": -25.406335830688477, "global_step": 570461, "epoch": 6873} {"train_loss": -25.932037353515625, "global_step": 570462, "epoch": 6873} {"train_loss": -27.108728408813477, "global_step": 570463, "epoch": 6873} {"train_loss": -26.040302276611328, "global_step": 570464, "epoch": 6873} {"train_loss": -27.1634521484375, "global_step": 570465, "epoch": 6873} {"train_loss": -26.76800537109375, "global_step": 570466, "epoch": 6873} {"train_loss": -27.246984481811523, "global_step": 570467, "epoch": 6873} {"train_loss": -27.505508422851562, "global_step": 570468, "epoch": 6873} {"train_loss": -26.864606857299805, "global_step": 570469, "epoch": 6873} {"train_loss": -27.377552032470703, "global_step": 570470, "epoch": 6873} {"train_loss": -27.460010528564453, "global_step": 570471, "epoch": 6873} {"train_loss": -27.13569450378418, "global_step": 570472, "epoch": 6873} {"train_loss": -27.450626373291016, "global_step": 570473, "epoch": 6873} {"train_loss": -27.283979415893555, "global_step": 570474, "epoch": 6873} {"train_loss": -27.651321411132812, "global_step": 570475, "epoch": 6873} {"train_loss": -26.80352210998535, "global_step": 570476, "epoch": 6873} {"train_loss": -27.514501571655273, "global_step": 570477, "epoch": 6873} {"train_loss": -27.33974266052246, "global_step": 570478, "epoch": 6873} {"train_loss": -27.52130699157715, "global_step": 570479, "epoch": 6873} {"train_loss": -27.433908462524414, "global_step": 570480, "epoch": 6873} {"train_loss": -27.305728912353516, "global_step": 570481, "epoch": 6873} {"train_loss": -27.3934326171875, "global_step": 570482, "epoch": 6873} {"train_loss": -28.012357711791992, "global_step": 570483, "epoch": 6873} {"train_loss": -27.830163955688477, "global_step": 570484, "epoch": 6873} {"train_loss": -27.5576114654541, "global_step": 570485, "epoch": 6873} {"train_loss": -27.536352157592773, "global_step": 570486, "epoch": 6873} {"train_loss": -27.605926513671875, "global_step": 570487, "epoch": 6873} {"train_loss": -27.944583892822266, "global_step": 570488, "epoch": 6873} {"train_loss": -28.03775978088379, "global_step": 570489, "epoch": 6873} {"train_loss": -27.707855224609375, "global_step": 570490, "epoch": 6873} {"train_loss": -27.79030418395996, "global_step": 570491, "epoch": 6873} {"train_loss": -27.677173614501953, "global_step": 570492, "epoch": 6873} {"train_loss": -27.79951286315918, "global_step": 570493, "epoch": 6873} {"train_loss": -28.137914657592773, "global_step": 570494, "epoch": 6873} {"train_loss": -27.863439559936523, "global_step": 570495, "epoch": 6873} {"train_loss": -27.7155704498291, "global_step": 570496, "epoch": 6873} {"train_loss": -27.875635147094727, "global_step": 570497, "epoch": 6873} {"train_loss": -27.701080322265625, "global_step": 570498, "epoch": 6873} {"train_loss": -27.73740005493164, "global_step": 570499, "epoch": 6873} {"train_loss": -28.027713775634766, "global_step": 570500, "epoch": 6873} {"train_loss": -28.151355743408203, "global_step": 570501, "epoch": 6873} {"train_loss": -27.795013427734375, "global_step": 570502, "epoch": 6873} {"train_loss": -28.017658233642578, "global_step": 570503, "epoch": 6873} {"train_loss": -28.035430908203125, "global_step": 570504, "epoch": 6873} {"train_loss": -28.000961303710938, "global_step": 570505, "epoch": 6873} {"train_loss": -28.11993408203125, "global_step": 570506, "epoch": 6873} {"train_loss": -27.933019638061523, "global_step": 570507, "epoch": 6873} {"train_loss": -28.285619735717773, "global_step": 570508, "epoch": 6873} {"train_loss": -27.549524307250977, "global_step": 570509, "epoch": 6873} {"train_loss": -27.6109561920166, "global_step": 570510, "epoch": 6873} {"train_loss": -27.4005069732666, "global_step": 570511, "epoch": 6873} {"train_loss": -27.877614974975586, "global_step": 570512, "epoch": 6873} {"train_loss": -28.05588722229004, "global_step": 570513, "epoch": 6873} {"train_loss": -27.63852882385254, "global_step": 570514, "epoch": 6873} {"train_loss": -27.73249626159668, "global_step": 570515, "epoch": 6873} {"train_loss": -28.036483764648438, "global_step": 570516, "epoch": 6873} {"train_loss": -27.950437545776367, "global_step": 570517, "epoch": 6873} {"train_loss": -28.021432876586914, "global_step": 570518, "epoch": 6873} {"train_loss": -28.02487564086914, "global_step": 570519, "epoch": 6873} {"train_loss": -27.823068618774414, "global_step": 570520, "epoch": 6873} {"train_loss": -28.147781372070312, "global_step": 570521, "epoch": 6873} {"train_loss": -27.979883193969727, "global_step": 570522, "epoch": 6873} {"train_loss": -27.726160049438477, "global_step": 570523, "epoch": 6873} {"train_loss": -28.08430290222168, "global_step": 570524, "epoch": 6873} {"train_loss": -27.695117950439453, "global_step": 570525, "epoch": 6873} {"train_loss": -28.384368896484375, "global_step": 570526, "epoch": 6873} {"train_loss": -28.03989028930664, "global_step": 570527, "epoch": 6873} {"train_loss": -27.905460357666016, "global_step": 570528, "epoch": 6873} {"train_loss": -27.818201065063477, "global_step": 570529, "epoch": 6873} {"train_loss": -28.065717697143555, "global_step": 570530, "epoch": 6873} {"train_loss": -28.06756591796875, "global_step": 570531, "epoch": 6873} {"train_loss": -27.9211368560791, "global_step": 570532, "epoch": 6873} {"train_loss": -28.25848388671875, "global_step": 570533, "epoch": 6873} {"train_loss": -27.580060958862305, "global_step": 570534, "epoch": 6873} {"train_loss": -28.10576820373535, "global_step": 570535, "epoch": 6873} {"train_loss": -28.101516723632812, "global_step": 570536, "epoch": 6873} {"train_loss": -28.299596786499023, "global_step": 570537, "epoch": 6873} {"train_loss": -27.687198638916016, "global_step": 570538, "epoch": 6873} {"train_loss": -27.83904457092285, "global_step": 570539, "epoch": 6873} {"train_loss": -27.6558837890625, "global_step": 570540, "epoch": 6873} {"train_loss": -27.647943174982647, "global_step": 570541, "epoch": 6873, "val_loss": 6484404.0} {"train_loss": -27.987150192260742, "global_step": 570542, "epoch": 6874} {"train_loss": -27.0441951751709, "global_step": 570543, "epoch": 6874} {"train_loss": -24.902700424194336, "global_step": 570544, "epoch": 6874} {"train_loss": -24.716064453125, "global_step": 570545, "epoch": 6874} {"train_loss": -26.636205673217773, "global_step": 570546, "epoch": 6874} {"train_loss": -26.347936630249023, "global_step": 570547, "epoch": 6874} {"train_loss": -26.621042251586914, "global_step": 570548, "epoch": 6874} {"train_loss": -26.21375846862793, "global_step": 570549, "epoch": 6874} {"train_loss": -27.452606201171875, "global_step": 570550, "epoch": 6874} {"train_loss": -27.09250259399414, "global_step": 570551, "epoch": 6874} {"train_loss": -27.02400016784668, "global_step": 570552, "epoch": 6874} {"train_loss": -27.348651885986328, "global_step": 570553, "epoch": 6874} {"train_loss": -26.773969650268555, "global_step": 570554, "epoch": 6874} {"train_loss": -27.092849731445312, "global_step": 570555, "epoch": 6874} {"train_loss": -27.268354415893555, "global_step": 570556, "epoch": 6874} {"train_loss": -27.222137451171875, "global_step": 570557, "epoch": 6874} {"train_loss": -28.060882568359375, "global_step": 570558, "epoch": 6874} {"train_loss": -27.459623336791992, "global_step": 570559, "epoch": 6874} {"train_loss": -27.03423500061035, "global_step": 570560, "epoch": 6874} {"train_loss": -27.50461196899414, "global_step": 570561, "epoch": 6874} {"train_loss": -27.3482666015625, "global_step": 570562, "epoch": 6874} {"train_loss": -27.153533935546875, "global_step": 570563, "epoch": 6874} {"train_loss": -27.39466667175293, "global_step": 570564, "epoch": 6874} {"train_loss": -27.820087432861328, "global_step": 570565, "epoch": 6874} {"train_loss": -27.730859756469727, "global_step": 570566, "epoch": 6874} {"train_loss": -27.270395278930664, "global_step": 570567, "epoch": 6874} {"train_loss": -27.080780029296875, "global_step": 570568, "epoch": 6874} {"train_loss": -27.841917037963867, "global_step": 570569, "epoch": 6874} {"train_loss": -27.270456314086914, "global_step": 570570, "epoch": 6874} {"train_loss": -27.463092803955078, "global_step": 570571, "epoch": 6874} {"train_loss": -27.64987564086914, "global_step": 570572, "epoch": 6874} {"train_loss": -27.595075607299805, "global_step": 570573, "epoch": 6874} {"train_loss": -27.64484214782715, "global_step": 570574, "epoch": 6874} {"train_loss": -27.661380767822266, "global_step": 570575, "epoch": 6874} {"train_loss": -27.87861442565918, "global_step": 570576, "epoch": 6874} {"train_loss": -27.67490005493164, "global_step": 570577, "epoch": 6874} {"train_loss": -28.159332275390625, "global_step": 570578, "epoch": 6874} {"train_loss": -27.813297271728516, "global_step": 570579, "epoch": 6874} {"train_loss": -27.9157772064209, "global_step": 570580, "epoch": 6874} {"train_loss": -27.598907470703125, "global_step": 570581, "epoch": 6874} {"train_loss": -27.766820907592773, "global_step": 570582, "epoch": 6874} {"train_loss": -27.839200973510742, "global_step": 570583, "epoch": 6874} {"train_loss": -28.146560668945312, "global_step": 570584, "epoch": 6874} {"train_loss": -27.74961280822754, "global_step": 570585, "epoch": 6874} {"train_loss": -27.774703979492188, "global_step": 570586, "epoch": 6874} {"train_loss": -27.920522689819336, "global_step": 570587, "epoch": 6874} {"train_loss": -28.120336532592773, "global_step": 570588, "epoch": 6874} {"train_loss": -27.533369064331055, "global_step": 570589, "epoch": 6874} {"train_loss": -27.7479305267334, "global_step": 570590, "epoch": 6874} {"train_loss": -28.055835723876953, "global_step": 570591, "epoch": 6874} {"train_loss": -27.733367919921875, "global_step": 570592, "epoch": 6874} {"train_loss": -27.8270320892334, "global_step": 570593, "epoch": 6874} {"train_loss": -27.93198585510254, "global_step": 570594, "epoch": 6874} {"train_loss": -27.810428619384766, "global_step": 570595, "epoch": 6874} {"train_loss": -28.101354598999023, "global_step": 570596, "epoch": 6874} {"train_loss": -28.02105140686035, "global_step": 570597, "epoch": 6874} {"train_loss": -28.06536293029785, "global_step": 570598, "epoch": 6874} {"train_loss": -27.791217803955078, "global_step": 570599, "epoch": 6874} {"train_loss": -27.691740036010742, "global_step": 570600, "epoch": 6874} {"train_loss": -27.855335235595703, "global_step": 570601, "epoch": 6874} {"train_loss": -27.59027671813965, "global_step": 570602, "epoch": 6874} {"train_loss": -27.666406631469727, "global_step": 570603, "epoch": 6874} {"train_loss": -27.756732940673828, "global_step": 570604, "epoch": 6874} {"train_loss": -27.863601684570312, "global_step": 570605, "epoch": 6874} {"train_loss": -27.67691421508789, "global_step": 570606, "epoch": 6874} {"train_loss": -28.126577377319336, "global_step": 570607, "epoch": 6874} {"train_loss": -27.79107666015625, "global_step": 570608, "epoch": 6874} {"train_loss": -27.76002311706543, "global_step": 570609, "epoch": 6874} {"train_loss": -27.917428970336914, "global_step": 570610, "epoch": 6874} {"train_loss": -28.046533584594727, "global_step": 570611, "epoch": 6874} {"train_loss": -27.674396514892578, "global_step": 570612, "epoch": 6874} {"train_loss": -27.97320556640625, "global_step": 570613, "epoch": 6874} {"train_loss": -28.20682144165039, "global_step": 570614, "epoch": 6874} {"train_loss": -28.168338775634766, "global_step": 570615, "epoch": 6874} {"train_loss": -27.932636260986328, "global_step": 570616, "epoch": 6874} {"train_loss": -28.240432739257812, "global_step": 570617, "epoch": 6874} {"train_loss": -28.242441177368164, "global_step": 570618, "epoch": 6874} {"train_loss": -28.10711097717285, "global_step": 570619, "epoch": 6874} {"train_loss": -28.270193099975586, "global_step": 570620, "epoch": 6874} {"train_loss": -27.94415855407715, "global_step": 570621, "epoch": 6874} {"train_loss": -28.30057144165039, "global_step": 570622, "epoch": 6874} {"train_loss": -28.090808868408203, "global_step": 570623, "epoch": 6874} {"train_loss": -27.60476045723421, "global_step": 570624, "epoch": 6874, "val_loss": 6455935.0} {"train_loss": -27.31756591796875, "global_step": 570625, "epoch": 6875} {"train_loss": -27.496679306030273, "global_step": 570626, "epoch": 6875} {"train_loss": -27.544269561767578, "global_step": 570627, "epoch": 6875} {"train_loss": -27.815448760986328, "global_step": 570628, "epoch": 6875} {"train_loss": -27.751134872436523, "global_step": 570629, "epoch": 6875} {"train_loss": -27.55853843688965, "global_step": 570630, "epoch": 6875} {"train_loss": -27.908740997314453, "global_step": 570631, "epoch": 6875} {"train_loss": -28.0339298248291, "global_step": 570632, "epoch": 6875} {"train_loss": -27.74899673461914, "global_step": 570633, "epoch": 6875} {"train_loss": -27.63641357421875, "global_step": 570634, "epoch": 6875} {"train_loss": -27.929473876953125, "global_step": 570635, "epoch": 6875} {"train_loss": -27.415006637573242, "global_step": 570636, "epoch": 6875} {"train_loss": -27.745580673217773, "global_step": 570637, "epoch": 6875} {"train_loss": -27.815454483032227, "global_step": 570638, "epoch": 6875} {"train_loss": -27.375410079956055, "global_step": 570639, "epoch": 6875} {"train_loss": -27.215662002563477, "global_step": 570640, "epoch": 6875} {"train_loss": -27.301916122436523, "global_step": 570641, "epoch": 6875} {"train_loss": -27.984182357788086, "global_step": 570642, "epoch": 6875} {"train_loss": -27.522659301757812, "global_step": 570643, "epoch": 6875} {"train_loss": -27.423070907592773, "global_step": 570644, "epoch": 6875} {"train_loss": -27.432056427001953, "global_step": 570645, "epoch": 6875} {"train_loss": -27.8361759185791, "global_step": 570646, "epoch": 6875} {"train_loss": -27.721967697143555, "global_step": 570647, "epoch": 6875} {"train_loss": -27.622333526611328, "global_step": 570648, "epoch": 6875} {"train_loss": -27.753625869750977, "global_step": 570649, "epoch": 6875} {"train_loss": -27.642349243164062, "global_step": 570650, "epoch": 6875} {"train_loss": -27.642621994018555, "global_step": 570651, "epoch": 6875} {"train_loss": -27.4735164642334, "global_step": 570652, "epoch": 6875} {"train_loss": -27.86771011352539, "global_step": 570653, "epoch": 6875} {"train_loss": -27.64154624938965, "global_step": 570654, "epoch": 6875} {"train_loss": -27.405136108398438, "global_step": 570655, "epoch": 6875} {"train_loss": -27.88740348815918, "global_step": 570656, "epoch": 6875} {"train_loss": -27.763568878173828, "global_step": 570657, "epoch": 6875} {"train_loss": -27.00459098815918, "global_step": 570658, "epoch": 6875} {"train_loss": -27.49363136291504, "global_step": 570659, "epoch": 6875} {"train_loss": -27.81399917602539, "global_step": 570660, "epoch": 6875} {"train_loss": -27.499256134033203, "global_step": 570661, "epoch": 6875} {"train_loss": -28.128158569335938, "global_step": 570662, "epoch": 6875} {"train_loss": -27.76953125, "global_step": 570663, "epoch": 6875} {"train_loss": -27.79151725769043, "global_step": 570664, "epoch": 6875} {"train_loss": -27.85062599182129, "global_step": 570665, "epoch": 6875} {"train_loss": -27.975122451782227, "global_step": 570666, "epoch": 6875} {"train_loss": -28.127344131469727, "global_step": 570667, "epoch": 6875} {"train_loss": -27.946287155151367, "global_step": 570668, "epoch": 6875} {"train_loss": -28.1123046875, "global_step": 570669, "epoch": 6875} {"train_loss": -27.982275009155273, "global_step": 570670, "epoch": 6875} {"train_loss": -27.767822265625, "global_step": 570671, "epoch": 6875} {"train_loss": -27.96793556213379, "global_step": 570672, "epoch": 6875} {"train_loss": -27.849365234375, "global_step": 570673, "epoch": 6875} {"train_loss": -27.674819946289062, "global_step": 570674, "epoch": 6875} {"train_loss": -28.01459312438965, "global_step": 570675, "epoch": 6875} {"train_loss": -27.633163452148438, "global_step": 570676, "epoch": 6875} {"train_loss": -27.849506378173828, "global_step": 570677, "epoch": 6875} {"train_loss": -28.082141876220703, "global_step": 570678, "epoch": 6875} {"train_loss": -27.560138702392578, "global_step": 570679, "epoch": 6875} {"train_loss": -27.695632934570312, "global_step": 570680, "epoch": 6875} {"train_loss": -27.852436065673828, "global_step": 570681, "epoch": 6875} {"train_loss": -28.344959259033203, "global_step": 570682, "epoch": 6875} {"train_loss": -28.21291160583496, "global_step": 570683, "epoch": 6875} {"train_loss": -28.160690307617188, "global_step": 570684, "epoch": 6875} {"train_loss": -28.184415817260742, "global_step": 570685, "epoch": 6875} {"train_loss": -28.130102157592773, "global_step": 570686, "epoch": 6875} {"train_loss": -28.1127872467041, "global_step": 570687, "epoch": 6875} {"train_loss": -28.343259811401367, "global_step": 570688, "epoch": 6875} {"train_loss": -28.192041397094727, "global_step": 570689, "epoch": 6875} {"train_loss": -28.3342342376709, "global_step": 570690, "epoch": 6875} {"train_loss": -28.049854278564453, "global_step": 570691, "epoch": 6875} {"train_loss": -27.68806266784668, "global_step": 570692, "epoch": 6875} {"train_loss": -27.560626983642578, "global_step": 570693, "epoch": 6875} {"train_loss": -28.2589168548584, "global_step": 570694, "epoch": 6875} {"train_loss": -28.075653076171875, "global_step": 570695, "epoch": 6875} {"train_loss": -27.722156524658203, "global_step": 570696, "epoch": 6875} {"train_loss": -27.788122177124023, "global_step": 570697, "epoch": 6875} {"train_loss": -28.200244903564453, "global_step": 570698, "epoch": 6875} {"train_loss": -27.709875106811523, "global_step": 570699, "epoch": 6875} {"train_loss": -28.281274795532227, "global_step": 570700, "epoch": 6875} {"train_loss": -27.681915283203125, "global_step": 570701, "epoch": 6875} {"train_loss": -27.94632339477539, "global_step": 570702, "epoch": 6875} {"train_loss": -27.797775268554688, "global_step": 570703, "epoch": 6875} {"train_loss": -27.27607536315918, "global_step": 570704, "epoch": 6875} {"train_loss": -27.261932373046875, "global_step": 570705, "epoch": 6875} {"train_loss": -26.914220809936523, "global_step": 570706, "epoch": 6875} {"train_loss": -27.780362186661687, "global_step": 570707, "epoch": 6875, "val_loss": 6442715.5} {"train_loss": -27.257699966430664, "global_step": 570708, "epoch": 6876} {"train_loss": -26.759078979492188, "global_step": 570709, "epoch": 6876} {"train_loss": -27.138376235961914, "global_step": 570710, "epoch": 6876} {"train_loss": -27.336828231811523, "global_step": 570711, "epoch": 6876} {"train_loss": -26.47053337097168, "global_step": 570712, "epoch": 6876} {"train_loss": -26.271469116210938, "global_step": 570713, "epoch": 6876} {"train_loss": -26.72385025024414, "global_step": 570714, "epoch": 6876} {"train_loss": -27.250879287719727, "global_step": 570715, "epoch": 6876} {"train_loss": -27.101850509643555, "global_step": 570716, "epoch": 6876} {"train_loss": -27.2047119140625, "global_step": 570717, "epoch": 6876} {"train_loss": -27.40215492248535, "global_step": 570718, "epoch": 6876} {"train_loss": -27.067703247070312, "global_step": 570719, "epoch": 6876} {"train_loss": -27.609363555908203, "global_step": 570720, "epoch": 6876} {"train_loss": -27.265369415283203, "global_step": 570721, "epoch": 6876} {"train_loss": -27.63429832458496, "global_step": 570722, "epoch": 6876} {"train_loss": -27.546890258789062, "global_step": 570723, "epoch": 6876} {"train_loss": -27.24285888671875, "global_step": 570724, "epoch": 6876} {"train_loss": -27.725082397460938, "global_step": 570725, "epoch": 6876} {"train_loss": -27.651586532592773, "global_step": 570726, "epoch": 6876} {"train_loss": -27.65448570251465, "global_step": 570727, "epoch": 6876} {"train_loss": -27.480512619018555, "global_step": 570728, "epoch": 6876} {"train_loss": -26.993091583251953, "global_step": 570729, "epoch": 6876} {"train_loss": -27.840015411376953, "global_step": 570730, "epoch": 6876} {"train_loss": -27.67131996154785, "global_step": 570731, "epoch": 6876} {"train_loss": -28.057086944580078, "global_step": 570732, "epoch": 6876} {"train_loss": -27.9813289642334, "global_step": 570733, "epoch": 6876} {"train_loss": -28.058374404907227, "global_step": 570734, "epoch": 6876} {"train_loss": -27.74480628967285, "global_step": 570735, "epoch": 6876} {"train_loss": -27.978925704956055, "global_step": 570736, "epoch": 6876} {"train_loss": -27.868244171142578, "global_step": 570737, "epoch": 6876} {"train_loss": -27.821325302124023, "global_step": 570738, "epoch": 6876} {"train_loss": -28.127939224243164, "global_step": 570739, "epoch": 6876} {"train_loss": -27.79314613342285, "global_step": 570740, "epoch": 6876} {"train_loss": -27.871479034423828, "global_step": 570741, "epoch": 6876} {"train_loss": -27.719074249267578, "global_step": 570742, "epoch": 6876} {"train_loss": -27.969202041625977, "global_step": 570743, "epoch": 6876} {"train_loss": -28.353961944580078, "global_step": 570744, "epoch": 6876} {"train_loss": -27.930561065673828, "global_step": 570745, "epoch": 6876} {"train_loss": -27.970788955688477, "global_step": 570746, "epoch": 6876} {"train_loss": -28.010120391845703, "global_step": 570747, "epoch": 6876} {"train_loss": -28.197778701782227, "global_step": 570748, "epoch": 6876} {"train_loss": -27.917631149291992, "global_step": 570749, "epoch": 6876} {"train_loss": -28.3933162689209, "global_step": 570750, "epoch": 6876} {"train_loss": -27.942106246948242, "global_step": 570751, "epoch": 6876} {"train_loss": -27.985595703125, "global_step": 570752, "epoch": 6876} {"train_loss": -27.829980850219727, "global_step": 570753, "epoch": 6876} {"train_loss": -28.237232208251953, "global_step": 570754, "epoch": 6876} {"train_loss": -27.868478775024414, "global_step": 570755, "epoch": 6876} {"train_loss": -27.715106964111328, "global_step": 570756, "epoch": 6876} {"train_loss": -27.9996280670166, "global_step": 570757, "epoch": 6876} {"train_loss": -27.8474063873291, "global_step": 570758, "epoch": 6876} {"train_loss": -27.41058349609375, "global_step": 570759, "epoch": 6876} {"train_loss": -27.778976440429688, "global_step": 570760, "epoch": 6876} {"train_loss": -28.250213623046875, "global_step": 570761, "epoch": 6876} {"train_loss": -27.480764389038086, "global_step": 570762, "epoch": 6876} {"train_loss": -27.8236141204834, "global_step": 570763, "epoch": 6876} {"train_loss": -27.42584800720215, "global_step": 570764, "epoch": 6876} {"train_loss": -28.113555908203125, "global_step": 570765, "epoch": 6876} {"train_loss": -28.268835067749023, "global_step": 570766, "epoch": 6876} {"train_loss": -28.030628204345703, "global_step": 570767, "epoch": 6876} {"train_loss": -28.08083152770996, "global_step": 570768, "epoch": 6876} {"train_loss": -27.87578773498535, "global_step": 570769, "epoch": 6876} {"train_loss": -28.064056396484375, "global_step": 570770, "epoch": 6876} {"train_loss": -27.827978134155273, "global_step": 570771, "epoch": 6876} {"train_loss": -28.038373947143555, "global_step": 570772, "epoch": 6876} {"train_loss": -27.778852462768555, "global_step": 570773, "epoch": 6876} {"train_loss": -27.7164363861084, "global_step": 570774, "epoch": 6876} {"train_loss": -27.484699249267578, "global_step": 570775, "epoch": 6876} {"train_loss": -27.599597930908203, "global_step": 570776, "epoch": 6876} {"train_loss": -28.045886993408203, "global_step": 570777, "epoch": 6876} {"train_loss": -28.10320472717285, "global_step": 570778, "epoch": 6876} {"train_loss": -28.148040771484375, "global_step": 570779, "epoch": 6876} {"train_loss": -28.026819229125977, "global_step": 570780, "epoch": 6876} {"train_loss": -28.254064559936523, "global_step": 570781, "epoch": 6876} {"train_loss": -27.90687370300293, "global_step": 570782, "epoch": 6876} {"train_loss": -27.484394073486328, "global_step": 570783, "epoch": 6876} {"train_loss": -27.871612548828125, "global_step": 570784, "epoch": 6876} {"train_loss": -28.06123161315918, "global_step": 570785, "epoch": 6876} {"train_loss": -28.191864013671875, "global_step": 570786, "epoch": 6876} {"train_loss": -27.996652603149414, "global_step": 570787, "epoch": 6876} {"train_loss": -28.014734268188477, "global_step": 570788, "epoch": 6876} {"train_loss": -27.975666046142578, "global_step": 570789, "epoch": 6876} {"train_loss": -27.755989856030567, "global_step": 570790, "epoch": 6876, "val_loss": 6520088.0} {"train_loss": -28.111896514892578, "global_step": 570791, "epoch": 6877} {"train_loss": -27.840124130249023, "global_step": 570792, "epoch": 6877} {"train_loss": -27.676572799682617, "global_step": 570793, "epoch": 6877} {"train_loss": -27.660018920898438, "global_step": 570794, "epoch": 6877} {"train_loss": -27.540796279907227, "global_step": 570795, "epoch": 6877} {"train_loss": -27.92669677734375, "global_step": 570796, "epoch": 6877} {"train_loss": -27.8540096282959, "global_step": 570797, "epoch": 6877} {"train_loss": -27.55694007873535, "global_step": 570798, "epoch": 6877} {"train_loss": -27.768369674682617, "global_step": 570799, "epoch": 6877} {"train_loss": -27.6978816986084, "global_step": 570800, "epoch": 6877} {"train_loss": -27.375463485717773, "global_step": 570801, "epoch": 6877} {"train_loss": -27.510412216186523, "global_step": 570802, "epoch": 6877} {"train_loss": -27.868595123291016, "global_step": 570803, "epoch": 6877} {"train_loss": -27.810272216796875, "global_step": 570804, "epoch": 6877} {"train_loss": -28.015995025634766, "global_step": 570805, "epoch": 6877} {"train_loss": -27.661874771118164, "global_step": 570806, "epoch": 6877} {"train_loss": -28.318939208984375, "global_step": 570807, "epoch": 6877} {"train_loss": -28.170499801635742, "global_step": 570808, "epoch": 6877} {"train_loss": -27.754730224609375, "global_step": 570809, "epoch": 6877} {"train_loss": -27.92976951599121, "global_step": 570810, "epoch": 6877} {"train_loss": -27.85951805114746, "global_step": 570811, "epoch": 6877} {"train_loss": -27.477863311767578, "global_step": 570812, "epoch": 6877} {"train_loss": -27.863630294799805, "global_step": 570813, "epoch": 6877} {"train_loss": -27.82330894470215, "global_step": 570814, "epoch": 6877} {"train_loss": -27.385696411132812, "global_step": 570815, "epoch": 6877} {"train_loss": -27.76409339904785, "global_step": 570816, "epoch": 6877} {"train_loss": -27.529706954956055, "global_step": 570817, "epoch": 6877} {"train_loss": -28.074853897094727, "global_step": 570818, "epoch": 6877} {"train_loss": -27.891504287719727, "global_step": 570819, "epoch": 6877} {"train_loss": -27.55671501159668, "global_step": 570820, "epoch": 6877} {"train_loss": -27.984304428100586, "global_step": 570821, "epoch": 6877} {"train_loss": -27.952014923095703, "global_step": 570822, "epoch": 6877} {"train_loss": -27.918766021728516, "global_step": 570823, "epoch": 6877} {"train_loss": -27.6101016998291, "global_step": 570824, "epoch": 6877} {"train_loss": -27.986175537109375, "global_step": 570825, "epoch": 6877} {"train_loss": -28.031118392944336, "global_step": 570826, "epoch": 6877} {"train_loss": -27.84049415588379, "global_step": 570827, "epoch": 6877} {"train_loss": -27.947925567626953, "global_step": 570828, "epoch": 6877} {"train_loss": -27.44428825378418, "global_step": 570829, "epoch": 6877} {"train_loss": -27.611968994140625, "global_step": 570830, "epoch": 6877} {"train_loss": -27.729185104370117, "global_step": 570831, "epoch": 6877} {"train_loss": -27.83513832092285, "global_step": 570832, "epoch": 6877} {"train_loss": -27.61830711364746, "global_step": 570833, "epoch": 6877} {"train_loss": -27.91950035095215, "global_step": 570834, "epoch": 6877} {"train_loss": -27.75021743774414, "global_step": 570835, "epoch": 6877} {"train_loss": -28.022785186767578, "global_step": 570836, "epoch": 6877} {"train_loss": -27.930267333984375, "global_step": 570837, "epoch": 6877} {"train_loss": -28.04559326171875, "global_step": 570838, "epoch": 6877} {"train_loss": -27.68833351135254, "global_step": 570839, "epoch": 6877} {"train_loss": -27.992374420166016, "global_step": 570840, "epoch": 6877} {"train_loss": -27.78928565979004, "global_step": 570841, "epoch": 6877} {"train_loss": -27.813297271728516, "global_step": 570842, "epoch": 6877} {"train_loss": -27.65772819519043, "global_step": 570843, "epoch": 6877} {"train_loss": -28.05348777770996, "global_step": 570844, "epoch": 6877} {"train_loss": -28.1611328125, "global_step": 570845, "epoch": 6877} {"train_loss": -27.594038009643555, "global_step": 570846, "epoch": 6877} {"train_loss": -27.647985458374023, "global_step": 570847, "epoch": 6877} {"train_loss": -27.250173568725586, "global_step": 570848, "epoch": 6877} {"train_loss": -27.489309310913086, "global_step": 570849, "epoch": 6877} {"train_loss": -27.47810173034668, "global_step": 570850, "epoch": 6877} {"train_loss": -27.459760665893555, "global_step": 570851, "epoch": 6877} {"train_loss": -27.68776512145996, "global_step": 570852, "epoch": 6877} {"train_loss": -26.83326530456543, "global_step": 570853, "epoch": 6877} {"train_loss": -27.63949966430664, "global_step": 570854, "epoch": 6877} {"train_loss": -27.11916160583496, "global_step": 570855, "epoch": 6877} {"train_loss": -27.26140785217285, "global_step": 570856, "epoch": 6877} {"train_loss": -27.650741577148438, "global_step": 570857, "epoch": 6877} {"train_loss": -27.843353271484375, "global_step": 570858, "epoch": 6877} {"train_loss": -26.875812530517578, "global_step": 570859, "epoch": 6877} {"train_loss": -27.626249313354492, "global_step": 570860, "epoch": 6877} {"train_loss": -27.47942543029785, "global_step": 570861, "epoch": 6877} {"train_loss": -27.728620529174805, "global_step": 570862, "epoch": 6877} {"train_loss": -27.25815200805664, "global_step": 570863, "epoch": 6877} {"train_loss": -27.54056739807129, "global_step": 570864, "epoch": 6877} {"train_loss": -28.047840118408203, "global_step": 570865, "epoch": 6877} {"train_loss": -27.815933227539062, "global_step": 570866, "epoch": 6877} {"train_loss": -27.965112686157227, "global_step": 570867, "epoch": 6877} {"train_loss": -28.192371368408203, "global_step": 570868, "epoch": 6877} {"train_loss": -27.683349609375, "global_step": 570869, "epoch": 6877} {"train_loss": -27.93312644958496, "global_step": 570870, "epoch": 6877} {"train_loss": -27.59474754333496, "global_step": 570871, "epoch": 6877} {"train_loss": -27.890888214111328, "global_step": 570872, "epoch": 6877} {"train_loss": -27.746710329170686, "global_step": 570873, "epoch": 6877, "val_loss": 6481988.0} {"train_loss": -27.42144203186035, "global_step": 570874, "epoch": 6878} {"train_loss": -27.509912490844727, "global_step": 570875, "epoch": 6878} {"train_loss": -27.062915802001953, "global_step": 570876, "epoch": 6878} {"train_loss": -27.52215576171875, "global_step": 570877, "epoch": 6878} {"train_loss": -27.257787704467773, "global_step": 570878, "epoch": 6878} {"train_loss": -26.9488525390625, "global_step": 570879, "epoch": 6878} {"train_loss": -27.630603790283203, "global_step": 570880, "epoch": 6878} {"train_loss": -27.659326553344727, "global_step": 570881, "epoch": 6878} {"train_loss": -27.741369247436523, "global_step": 570882, "epoch": 6878} {"train_loss": -27.91353416442871, "global_step": 570883, "epoch": 6878} {"train_loss": -27.84293556213379, "global_step": 570884, "epoch": 6878} {"train_loss": -27.830554962158203, "global_step": 570885, "epoch": 6878} {"train_loss": -27.578588485717773, "global_step": 570886, "epoch": 6878} {"train_loss": -27.811182022094727, "global_step": 570887, "epoch": 6878} {"train_loss": -28.005115509033203, "global_step": 570888, "epoch": 6878} {"train_loss": -28.05353355407715, "global_step": 570889, "epoch": 6878} {"train_loss": -27.841455459594727, "global_step": 570890, "epoch": 6878} {"train_loss": -27.81598472595215, "global_step": 570891, "epoch": 6878} {"train_loss": -27.77644157409668, "global_step": 570892, "epoch": 6878} {"train_loss": -27.738325119018555, "global_step": 570893, "epoch": 6878} {"train_loss": -27.989904403686523, "global_step": 570894, "epoch": 6878} {"train_loss": -27.520526885986328, "global_step": 570895, "epoch": 6878} {"train_loss": -28.094085693359375, "global_step": 570896, "epoch": 6878} {"train_loss": -27.741186141967773, "global_step": 570897, "epoch": 6878} {"train_loss": -27.67266273498535, "global_step": 570898, "epoch": 6878} {"train_loss": -27.933984756469727, "global_step": 570899, "epoch": 6878} {"train_loss": -28.209314346313477, "global_step": 570900, "epoch": 6878} {"train_loss": -27.930139541625977, "global_step": 570901, "epoch": 6878} {"train_loss": -27.591527938842773, "global_step": 570902, "epoch": 6878} {"train_loss": -27.779163360595703, "global_step": 570903, "epoch": 6878} {"train_loss": -27.85394287109375, "global_step": 570904, "epoch": 6878} {"train_loss": -27.89154624938965, "global_step": 570905, "epoch": 6878} {"train_loss": -28.152353286743164, "global_step": 570906, "epoch": 6878} {"train_loss": -27.832494735717773, "global_step": 570907, "epoch": 6878} {"train_loss": -27.812055587768555, "global_step": 570908, "epoch": 6878} {"train_loss": -27.590734481811523, "global_step": 570909, "epoch": 6878} {"train_loss": -27.943103790283203, "global_step": 570910, "epoch": 6878} {"train_loss": -28.376239776611328, "global_step": 570911, "epoch": 6878} {"train_loss": -27.723669052124023, "global_step": 570912, "epoch": 6878} {"train_loss": -28.011423110961914, "global_step": 570913, "epoch": 6878} {"train_loss": -27.841848373413086, "global_step": 570914, "epoch": 6878} {"train_loss": -27.99005126953125, "global_step": 570915, "epoch": 6878} {"train_loss": -28.348203659057617, "global_step": 570916, "epoch": 6878} {"train_loss": -27.930419921875, "global_step": 570917, "epoch": 6878} {"train_loss": -28.34486198425293, "global_step": 570918, "epoch": 6878} {"train_loss": -28.0686092376709, "global_step": 570919, "epoch": 6878} {"train_loss": -28.107563018798828, "global_step": 570920, "epoch": 6878} {"train_loss": -27.613264083862305, "global_step": 570921, "epoch": 6878} {"train_loss": -27.377256393432617, "global_step": 570922, "epoch": 6878} {"train_loss": -26.95298194885254, "global_step": 570923, "epoch": 6878} {"train_loss": -27.264429092407227, "global_step": 570924, "epoch": 6878} {"train_loss": -27.695642471313477, "global_step": 570925, "epoch": 6878} {"train_loss": -27.798410415649414, "global_step": 570926, "epoch": 6878} {"train_loss": -26.786945343017578, "global_step": 570927, "epoch": 6878} {"train_loss": -26.777494430541992, "global_step": 570928, "epoch": 6878} {"train_loss": -27.61115837097168, "global_step": 570929, "epoch": 6878} {"train_loss": -27.228824615478516, "global_step": 570930, "epoch": 6878} {"train_loss": -28.018573760986328, "global_step": 570931, "epoch": 6878} {"train_loss": -27.351408004760742, "global_step": 570932, "epoch": 6878} {"train_loss": -27.721399307250977, "global_step": 570933, "epoch": 6878} {"train_loss": -27.348194122314453, "global_step": 570934, "epoch": 6878} {"train_loss": -27.382612228393555, "global_step": 570935, "epoch": 6878} {"train_loss": -27.783910751342773, "global_step": 570936, "epoch": 6878} {"train_loss": -27.628957748413086, "global_step": 570937, "epoch": 6878} {"train_loss": -27.379236221313477, "global_step": 570938, "epoch": 6878} {"train_loss": -27.95438003540039, "global_step": 570939, "epoch": 6878} {"train_loss": -27.640949249267578, "global_step": 570940, "epoch": 6878} {"train_loss": -27.463022232055664, "global_step": 570941, "epoch": 6878} {"train_loss": -27.963483810424805, "global_step": 570942, "epoch": 6878} {"train_loss": -27.505889892578125, "global_step": 570943, "epoch": 6878} {"train_loss": -27.739118576049805, "global_step": 570944, "epoch": 6878} {"train_loss": -27.740827560424805, "global_step": 570945, "epoch": 6878} {"train_loss": -27.6107234954834, "global_step": 570946, "epoch": 6878} {"train_loss": -27.8957462310791, "global_step": 570947, "epoch": 6878} {"train_loss": -28.038867950439453, "global_step": 570948, "epoch": 6878} {"train_loss": -27.7394962310791, "global_step": 570949, "epoch": 6878} {"train_loss": -27.78364372253418, "global_step": 570950, "epoch": 6878} {"train_loss": -27.69411277770996, "global_step": 570951, "epoch": 6878} {"train_loss": -28.04163932800293, "global_step": 570952, "epoch": 6878} {"train_loss": -28.0546932220459, "global_step": 570953, "epoch": 6878} {"train_loss": -28.384862899780273, "global_step": 570954, "epoch": 6878} {"train_loss": -27.882474899291992, "global_step": 570955, "epoch": 6878} {"train_loss": -27.73820973591632, "global_step": 570956, "epoch": 6878, "val_loss": 6517219.5} {"train_loss": -25.91077995300293, "global_step": 570957, "epoch": 6879} {"train_loss": -25.14305305480957, "global_step": 570958, "epoch": 6879} {"train_loss": -25.587474822998047, "global_step": 570959, "epoch": 6879} {"train_loss": -27.63213539123535, "global_step": 570960, "epoch": 6879} {"train_loss": -25.933435440063477, "global_step": 570961, "epoch": 6879} {"train_loss": -27.045820236206055, "global_step": 570962, "epoch": 6879} {"train_loss": -26.761911392211914, "global_step": 570963, "epoch": 6879} {"train_loss": -26.499958038330078, "global_step": 570964, "epoch": 6879} {"train_loss": -27.332311630249023, "global_step": 570965, "epoch": 6879} {"train_loss": -27.09271812438965, "global_step": 570966, "epoch": 6879} {"train_loss": -27.059614181518555, "global_step": 570967, "epoch": 6879} {"train_loss": -27.5472412109375, "global_step": 570968, "epoch": 6879} {"train_loss": -27.436538696289062, "global_step": 570969, "epoch": 6879} {"train_loss": -27.3503475189209, "global_step": 570970, "epoch": 6879} {"train_loss": -27.289838790893555, "global_step": 570971, "epoch": 6879} {"train_loss": -27.456802368164062, "global_step": 570972, "epoch": 6879} {"train_loss": -27.30051040649414, "global_step": 570973, "epoch": 6879} {"train_loss": -27.433063507080078, "global_step": 570974, "epoch": 6879} {"train_loss": -27.691076278686523, "global_step": 570975, "epoch": 6879} {"train_loss": -27.3131046295166, "global_step": 570976, "epoch": 6879} {"train_loss": -27.83649253845215, "global_step": 570977, "epoch": 6879} {"train_loss": -27.633161544799805, "global_step": 570978, "epoch": 6879} {"train_loss": -27.411880493164062, "global_step": 570979, "epoch": 6879} {"train_loss": -27.25937271118164, "global_step": 570980, "epoch": 6879} {"train_loss": -27.639429092407227, "global_step": 570981, "epoch": 6879} {"train_loss": -27.321325302124023, "global_step": 570982, "epoch": 6879} {"train_loss": -27.48805046081543, "global_step": 570983, "epoch": 6879} {"train_loss": -27.74647331237793, "global_step": 570984, "epoch": 6879} {"train_loss": -27.753864288330078, "global_step": 570985, "epoch": 6879} {"train_loss": -27.722803115844727, "global_step": 570986, "epoch": 6879} {"train_loss": -27.80805015563965, "global_step": 570987, "epoch": 6879} {"train_loss": -27.635828018188477, "global_step": 570988, "epoch": 6879} {"train_loss": -27.791898727416992, "global_step": 570989, "epoch": 6879} {"train_loss": -27.499128341674805, "global_step": 570990, "epoch": 6879} {"train_loss": -27.89723014831543, "global_step": 570991, "epoch": 6879} {"train_loss": -27.760419845581055, "global_step": 570992, "epoch": 6879} {"train_loss": -27.985794067382812, "global_step": 570993, "epoch": 6879} {"train_loss": -27.928665161132812, "global_step": 570994, "epoch": 6879} {"train_loss": -28.069013595581055, "global_step": 570995, "epoch": 6879} {"train_loss": -28.031957626342773, "global_step": 570996, "epoch": 6879} {"train_loss": -28.000762939453125, "global_step": 570997, "epoch": 6879} {"train_loss": -28.067102432250977, "global_step": 570998, "epoch": 6879} {"train_loss": -28.1539363861084, "global_step": 570999, "epoch": 6879} {"train_loss": -27.909650802612305, "global_step": 571000, "epoch": 6879} {"train_loss": -28.048078536987305, "global_step": 571001, "epoch": 6879} {"train_loss": -27.93934440612793, "global_step": 571002, "epoch": 6879} {"train_loss": -28.057376861572266, "global_step": 571003, "epoch": 6879} {"train_loss": -27.71392822265625, "global_step": 571004, "epoch": 6879} {"train_loss": -28.17043113708496, "global_step": 571005, "epoch": 6879} {"train_loss": -28.16338539123535, "global_step": 571006, "epoch": 6879} {"train_loss": -27.92561149597168, "global_step": 571007, "epoch": 6879} {"train_loss": -27.798248291015625, "global_step": 571008, "epoch": 6879} {"train_loss": -27.955280303955078, "global_step": 571009, "epoch": 6879} {"train_loss": -27.24395179748535, "global_step": 571010, "epoch": 6879} {"train_loss": -27.667800903320312, "global_step": 571011, "epoch": 6879} {"train_loss": -27.740039825439453, "global_step": 571012, "epoch": 6879} {"train_loss": -28.1369686126709, "global_step": 571013, "epoch": 6879} {"train_loss": -27.811752319335938, "global_step": 571014, "epoch": 6879} {"train_loss": -27.04910659790039, "global_step": 571015, "epoch": 6879} {"train_loss": -27.77422523498535, "global_step": 571016, "epoch": 6879} {"train_loss": -27.64253044128418, "global_step": 571017, "epoch": 6879} {"train_loss": -27.88148307800293, "global_step": 571018, "epoch": 6879} {"train_loss": -27.986679077148438, "global_step": 571019, "epoch": 6879} {"train_loss": -27.80159568786621, "global_step": 571020, "epoch": 6879} {"train_loss": -27.624021530151367, "global_step": 571021, "epoch": 6879} {"train_loss": -27.79132652282715, "global_step": 571022, "epoch": 6879} {"train_loss": -27.888898849487305, "global_step": 571023, "epoch": 6879} {"train_loss": -27.924219131469727, "global_step": 571024, "epoch": 6879} {"train_loss": -27.959035873413086, "global_step": 571025, "epoch": 6879} {"train_loss": -27.67136001586914, "global_step": 571026, "epoch": 6879} {"train_loss": -28.00860023498535, "global_step": 571027, "epoch": 6879} {"train_loss": -27.547931671142578, "global_step": 571028, "epoch": 6879} {"train_loss": -28.14200210571289, "global_step": 571029, "epoch": 6879} {"train_loss": -28.172643661499023, "global_step": 571030, "epoch": 6879} {"train_loss": -28.004907608032227, "global_step": 571031, "epoch": 6879} {"train_loss": -28.1435604095459, "global_step": 571032, "epoch": 6879} {"train_loss": -28.33216667175293, "global_step": 571033, "epoch": 6879} {"train_loss": -28.09125328063965, "global_step": 571034, "epoch": 6879} {"train_loss": -27.813505172729492, "global_step": 571035, "epoch": 6879} {"train_loss": -28.046167373657227, "global_step": 571036, "epoch": 6879} {"train_loss": -27.68839454650879, "global_step": 571037, "epoch": 6879} {"train_loss": -28.076019287109375, "global_step": 571038, "epoch": 6879} {"train_loss": -27.622558570769897, "global_step": 571039, "epoch": 6879, "val_loss": 6466119.0} {"train_loss": -26.935577392578125, "global_step": 571040, "epoch": 6880} {"train_loss": -24.612512588500977, "global_step": 571041, "epoch": 6880} {"train_loss": -20.81452178955078, "global_step": 571042, "epoch": 6880} {"train_loss": -22.82228660583496, "global_step": 571043, "epoch": 6880} {"train_loss": -27.213544845581055, "global_step": 571044, "epoch": 6880} {"train_loss": -24.561843872070312, "global_step": 571045, "epoch": 6880} {"train_loss": -26.926984786987305, "global_step": 571046, "epoch": 6880} {"train_loss": -25.805627822875977, "global_step": 571047, "epoch": 6880} {"train_loss": -27.1050968170166, "global_step": 571048, "epoch": 6880} {"train_loss": -26.955015182495117, "global_step": 571049, "epoch": 6880} {"train_loss": -26.373981475830078, "global_step": 571050, "epoch": 6880} {"train_loss": -26.989675521850586, "global_step": 571051, "epoch": 6880} {"train_loss": -27.143701553344727, "global_step": 571052, "epoch": 6880} {"train_loss": -26.54231071472168, "global_step": 571053, "epoch": 6880} {"train_loss": -26.474201202392578, "global_step": 571054, "epoch": 6880} {"train_loss": -27.172033309936523, "global_step": 571055, "epoch": 6880} {"train_loss": -26.888731002807617, "global_step": 571056, "epoch": 6880} {"train_loss": -26.879657745361328, "global_step": 571057, "epoch": 6880} {"train_loss": -26.95480728149414, "global_step": 571058, "epoch": 6880} {"train_loss": -27.226383209228516, "global_step": 571059, "epoch": 6880} {"train_loss": -27.012348175048828, "global_step": 571060, "epoch": 6880} {"train_loss": -27.1426944732666, "global_step": 571061, "epoch": 6880} {"train_loss": -27.36993980407715, "global_step": 571062, "epoch": 6880} {"train_loss": -27.260114669799805, "global_step": 571063, "epoch": 6880} {"train_loss": -27.331308364868164, "global_step": 571064, "epoch": 6880} {"train_loss": -27.17486572265625, "global_step": 571065, "epoch": 6880} {"train_loss": -26.923486709594727, "global_step": 571066, "epoch": 6880} {"train_loss": -26.99965476989746, "global_step": 571067, "epoch": 6880} {"train_loss": -27.6403751373291, "global_step": 571068, "epoch": 6880} {"train_loss": -27.53438377380371, "global_step": 571069, "epoch": 6880} {"train_loss": -27.34499168395996, "global_step": 571070, "epoch": 6880} {"train_loss": -27.5548152923584, "global_step": 571071, "epoch": 6880} {"train_loss": -27.144367218017578, "global_step": 571072, "epoch": 6880} {"train_loss": -27.60426139831543, "global_step": 571073, "epoch": 6880} {"train_loss": -27.310224533081055, "global_step": 571074, "epoch": 6880} {"train_loss": -27.90046501159668, "global_step": 571075, "epoch": 6880} {"train_loss": -27.790266036987305, "global_step": 571076, "epoch": 6880} {"train_loss": -27.6949462890625, "global_step": 571077, "epoch": 6880} {"train_loss": -27.61604118347168, "global_step": 571078, "epoch": 6880} {"train_loss": -27.68646240234375, "global_step": 571079, "epoch": 6880} {"train_loss": -27.77542495727539, "global_step": 571080, "epoch": 6880} {"train_loss": -27.742172241210938, "global_step": 571081, "epoch": 6880} {"train_loss": -27.496545791625977, "global_step": 571082, "epoch": 6880} {"train_loss": -27.463586807250977, "global_step": 571083, "epoch": 6880} {"train_loss": -27.759469985961914, "global_step": 571084, "epoch": 6880} {"train_loss": -27.64166259765625, "global_step": 571085, "epoch": 6880} {"train_loss": -27.66114616394043, "global_step": 571086, "epoch": 6880} {"train_loss": -27.700815200805664, "global_step": 571087, "epoch": 6880} {"train_loss": -27.6597900390625, "global_step": 571088, "epoch": 6880} {"train_loss": -27.908422470092773, "global_step": 571089, "epoch": 6880} {"train_loss": -27.721683502197266, "global_step": 571090, "epoch": 6880} {"train_loss": -27.7982234954834, "global_step": 571091, "epoch": 6880} {"train_loss": -27.863697052001953, "global_step": 571092, "epoch": 6880} {"train_loss": -27.87941551208496, "global_step": 571093, "epoch": 6880} {"train_loss": -27.652118682861328, "global_step": 571094, "epoch": 6880} {"train_loss": -27.84073829650879, "global_step": 571095, "epoch": 6880} {"train_loss": -27.8111572265625, "global_step": 571096, "epoch": 6880} {"train_loss": -27.941497802734375, "global_step": 571097, "epoch": 6880} {"train_loss": -28.187274932861328, "global_step": 571098, "epoch": 6880} {"train_loss": -28.130889892578125, "global_step": 571099, "epoch": 6880} {"train_loss": -27.729284286499023, "global_step": 571100, "epoch": 6880} {"train_loss": -27.83814811706543, "global_step": 571101, "epoch": 6880} {"train_loss": -27.881610870361328, "global_step": 571102, "epoch": 6880} {"train_loss": -27.982654571533203, "global_step": 571103, "epoch": 6880} {"train_loss": -28.051273345947266, "global_step": 571104, "epoch": 6880} {"train_loss": -27.543119430541992, "global_step": 571105, "epoch": 6880} {"train_loss": -27.93756675720215, "global_step": 571106, "epoch": 6880} {"train_loss": -27.182052612304688, "global_step": 571107, "epoch": 6880} {"train_loss": -27.2890625, "global_step": 571108, "epoch": 6880} {"train_loss": -27.36323356628418, "global_step": 571109, "epoch": 6880} {"train_loss": -27.943769454956055, "global_step": 571110, "epoch": 6880} {"train_loss": -27.76772117614746, "global_step": 571111, "epoch": 6880} {"train_loss": -27.535449981689453, "global_step": 571112, "epoch": 6880} {"train_loss": -27.36935806274414, "global_step": 571113, "epoch": 6880} {"train_loss": -27.784040451049805, "global_step": 571114, "epoch": 6880} {"train_loss": -27.190519332885742, "global_step": 571115, "epoch": 6880} {"train_loss": -27.641687393188477, "global_step": 571116, "epoch": 6880} {"train_loss": -27.77101707458496, "global_step": 571117, "epoch": 6880} {"train_loss": -27.388458251953125, "global_step": 571118, "epoch": 6880} {"train_loss": -27.75111198425293, "global_step": 571119, "epoch": 6880} {"train_loss": -27.956079483032227, "global_step": 571120, "epoch": 6880} {"train_loss": -27.777185440063477, "global_step": 571121, "epoch": 6880} {"train_loss": -27.228140336921417, "global_step": 571122, "epoch": 6880, "val_loss": 6449995.0} {"train_loss": -25.6895751953125, "global_step": 571123, "epoch": 6881} {"train_loss": -24.00140953063965, "global_step": 571124, "epoch": 6881} {"train_loss": -25.067306518554688, "global_step": 571125, "epoch": 6881} {"train_loss": -24.62036895751953, "global_step": 571126, "epoch": 6881} {"train_loss": -25.489978790283203, "global_step": 571127, "epoch": 6881} {"train_loss": -25.771244049072266, "global_step": 571128, "epoch": 6881} {"train_loss": -25.50480079650879, "global_step": 571129, "epoch": 6881} {"train_loss": -26.334049224853516, "global_step": 571130, "epoch": 6881} {"train_loss": -26.573028564453125, "global_step": 571131, "epoch": 6881} {"train_loss": -27.084009170532227, "global_step": 571132, "epoch": 6881} {"train_loss": -26.79340934753418, "global_step": 571133, "epoch": 6881} {"train_loss": -26.62445068359375, "global_step": 571134, "epoch": 6881} {"train_loss": -26.54029655456543, "global_step": 571135, "epoch": 6881} {"train_loss": -26.743825912475586, "global_step": 571136, "epoch": 6881} {"train_loss": -26.740747451782227, "global_step": 571137, "epoch": 6881} {"train_loss": -26.64826774597168, "global_step": 571138, "epoch": 6881} {"train_loss": -27.31607437133789, "global_step": 571139, "epoch": 6881} {"train_loss": -26.950239181518555, "global_step": 571140, "epoch": 6881} {"train_loss": -27.388681411743164, "global_step": 571141, "epoch": 6881} {"train_loss": -26.99854850769043, "global_step": 571142, "epoch": 6881} {"train_loss": -27.42451286315918, "global_step": 571143, "epoch": 6881} {"train_loss": -27.122589111328125, "global_step": 571144, "epoch": 6881} {"train_loss": -27.6416015625, "global_step": 571145, "epoch": 6881} {"train_loss": -27.42402458190918, "global_step": 571146, "epoch": 6881} {"train_loss": -27.505666732788086, "global_step": 571147, "epoch": 6881} {"train_loss": -27.26572036743164, "global_step": 571148, "epoch": 6881} {"train_loss": -27.701461791992188, "global_step": 571149, "epoch": 6881} {"train_loss": -27.363683700561523, "global_step": 571150, "epoch": 6881} {"train_loss": -27.482030868530273, "global_step": 571151, "epoch": 6881} {"train_loss": -27.300512313842773, "global_step": 571152, "epoch": 6881} {"train_loss": -27.885461807250977, "global_step": 571153, "epoch": 6881} {"train_loss": -27.734647750854492, "global_step": 571154, "epoch": 6881} {"train_loss": -27.447010040283203, "global_step": 571155, "epoch": 6881} {"train_loss": -27.64849853515625, "global_step": 571156, "epoch": 6881} {"train_loss": -27.629623413085938, "global_step": 571157, "epoch": 6881} {"train_loss": -27.58835792541504, "global_step": 571158, "epoch": 6881} {"train_loss": -27.689682006835938, "global_step": 571159, "epoch": 6881} {"train_loss": -27.627445220947266, "global_step": 571160, "epoch": 6881} {"train_loss": -27.7972469329834, "global_step": 571161, "epoch": 6881} {"train_loss": -27.607595443725586, "global_step": 571162, "epoch": 6881} {"train_loss": -27.58567237854004, "global_step": 571163, "epoch": 6881} {"train_loss": -27.92645835876465, "global_step": 571164, "epoch": 6881} {"train_loss": -27.872177124023438, "global_step": 571165, "epoch": 6881} {"train_loss": -28.20953369140625, "global_step": 571166, "epoch": 6881} {"train_loss": -27.68446159362793, "global_step": 571167, "epoch": 6881} {"train_loss": -27.839588165283203, "global_step": 571168, "epoch": 6881} {"train_loss": -27.96186637878418, "global_step": 571169, "epoch": 6881} {"train_loss": -27.993932723999023, "global_step": 571170, "epoch": 6881} {"train_loss": -27.751800537109375, "global_step": 571171, "epoch": 6881} {"train_loss": -27.948083877563477, "global_step": 571172, "epoch": 6881} {"train_loss": -28.336416244506836, "global_step": 571173, "epoch": 6881} {"train_loss": -28.1568660736084, "global_step": 571174, "epoch": 6881} {"train_loss": -27.547693252563477, "global_step": 571175, "epoch": 6881} {"train_loss": -27.4725399017334, "global_step": 571176, "epoch": 6881} {"train_loss": -27.74104118347168, "global_step": 571177, "epoch": 6881} {"train_loss": -28.20930290222168, "global_step": 571178, "epoch": 6881} {"train_loss": -27.956735610961914, "global_step": 571179, "epoch": 6881} {"train_loss": -27.500934600830078, "global_step": 571180, "epoch": 6881} {"train_loss": -27.751739501953125, "global_step": 571181, "epoch": 6881} {"train_loss": -27.712890625, "global_step": 571182, "epoch": 6881} {"train_loss": -27.946731567382812, "global_step": 571183, "epoch": 6881} {"train_loss": -27.877416610717773, "global_step": 571184, "epoch": 6881} {"train_loss": -27.564462661743164, "global_step": 571185, "epoch": 6881} {"train_loss": -27.990015029907227, "global_step": 571186, "epoch": 6881} {"train_loss": -28.064075469970703, "global_step": 571187, "epoch": 6881} {"train_loss": -27.823556900024414, "global_step": 571188, "epoch": 6881} {"train_loss": -27.627399444580078, "global_step": 571189, "epoch": 6881} {"train_loss": -27.443878173828125, "global_step": 571190, "epoch": 6881} {"train_loss": -26.9466609954834, "global_step": 571191, "epoch": 6881} {"train_loss": -27.444162368774414, "global_step": 571192, "epoch": 6881} {"train_loss": -27.444747924804688, "global_step": 571193, "epoch": 6881} {"train_loss": -26.3681583404541, "global_step": 571194, "epoch": 6881} {"train_loss": -27.228036880493164, "global_step": 571195, "epoch": 6881} {"train_loss": -27.248065948486328, "global_step": 571196, "epoch": 6881} {"train_loss": -26.757587432861328, "global_step": 571197, "epoch": 6881} {"train_loss": -27.1878662109375, "global_step": 571198, "epoch": 6881} {"train_loss": -26.944141387939453, "global_step": 571199, "epoch": 6881} {"train_loss": -27.16620445251465, "global_step": 571200, "epoch": 6881} {"train_loss": -27.48541831970215, "global_step": 571201, "epoch": 6881} {"train_loss": -27.738508224487305, "global_step": 571202, "epoch": 6881} {"train_loss": -27.890430450439453, "global_step": 571203, "epoch": 6881} {"train_loss": -27.54435157775879, "global_step": 571204, "epoch": 6881} {"train_loss": -27.2860703525773, "global_step": 571205, "epoch": 6881, "val_loss": 6381091.0} {"train_loss": -26.75349998474121, "global_step": 571206, "epoch": 6882} {"train_loss": -27.6490421295166, "global_step": 571207, "epoch": 6882} {"train_loss": -26.97477149963379, "global_step": 571208, "epoch": 6882} {"train_loss": -27.2514591217041, "global_step": 571209, "epoch": 6882} {"train_loss": -27.127532958984375, "global_step": 571210, "epoch": 6882} {"train_loss": -27.657703399658203, "global_step": 571211, "epoch": 6882} {"train_loss": -27.439783096313477, "global_step": 571212, "epoch": 6882} {"train_loss": -27.40858268737793, "global_step": 571213, "epoch": 6882} {"train_loss": -27.732635498046875, "global_step": 571214, "epoch": 6882} {"train_loss": -27.12994384765625, "global_step": 571215, "epoch": 6882} {"train_loss": -27.263355255126953, "global_step": 571216, "epoch": 6882} {"train_loss": -27.385211944580078, "global_step": 571217, "epoch": 6882} {"train_loss": -27.124927520751953, "global_step": 571218, "epoch": 6882} {"train_loss": -27.417804718017578, "global_step": 571219, "epoch": 6882} {"train_loss": -27.29363441467285, "global_step": 571220, "epoch": 6882} {"train_loss": -27.447179794311523, "global_step": 571221, "epoch": 6882} {"train_loss": -27.5778865814209, "global_step": 571222, "epoch": 6882} {"train_loss": -27.38665771484375, "global_step": 571223, "epoch": 6882} {"train_loss": -27.965686798095703, "global_step": 571224, "epoch": 6882} {"train_loss": -27.335432052612305, "global_step": 571225, "epoch": 6882} {"train_loss": -27.760400772094727, "global_step": 571226, "epoch": 6882} {"train_loss": -27.505395889282227, "global_step": 571227, "epoch": 6882} {"train_loss": -27.584543228149414, "global_step": 571228, "epoch": 6882} {"train_loss": -27.41326332092285, "global_step": 571229, "epoch": 6882} {"train_loss": -27.5281982421875, "global_step": 571230, "epoch": 6882} {"train_loss": -27.241910934448242, "global_step": 571231, "epoch": 6882} {"train_loss": -28.0788631439209, "global_step": 571232, "epoch": 6882} {"train_loss": -27.88368034362793, "global_step": 571233, "epoch": 6882} {"train_loss": -27.9134578704834, "global_step": 571234, "epoch": 6882} {"train_loss": -27.878644943237305, "global_step": 571235, "epoch": 6882} {"train_loss": -27.902196884155273, "global_step": 571236, "epoch": 6882} {"train_loss": -28.382232666015625, "global_step": 571237, "epoch": 6882} {"train_loss": -28.005252838134766, "global_step": 571238, "epoch": 6882} {"train_loss": -28.082273483276367, "global_step": 571239, "epoch": 6882} {"train_loss": -27.655319213867188, "global_step": 571240, "epoch": 6882} {"train_loss": -28.120222091674805, "global_step": 571241, "epoch": 6882} {"train_loss": -28.235748291015625, "global_step": 571242, "epoch": 6882} {"train_loss": -28.133106231689453, "global_step": 571243, "epoch": 6882} {"train_loss": -27.993743896484375, "global_step": 571244, "epoch": 6882} {"train_loss": -27.954614639282227, "global_step": 571245, "epoch": 6882} {"train_loss": -28.017194747924805, "global_step": 571246, "epoch": 6882} {"train_loss": -27.836618423461914, "global_step": 571247, "epoch": 6882} {"train_loss": -27.811277389526367, "global_step": 571248, "epoch": 6882} {"train_loss": -27.950286865234375, "global_step": 571249, "epoch": 6882} {"train_loss": -28.11724281311035, "global_step": 571250, "epoch": 6882} {"train_loss": -28.0067081451416, "global_step": 571251, "epoch": 6882} {"train_loss": -28.150501251220703, "global_step": 571252, "epoch": 6882} {"train_loss": -27.8327693939209, "global_step": 571253, "epoch": 6882} {"train_loss": -28.027450561523438, "global_step": 571254, "epoch": 6882} {"train_loss": -27.646696090698242, "global_step": 571255, "epoch": 6882} {"train_loss": -27.925125122070312, "global_step": 571256, "epoch": 6882} {"train_loss": -27.791812896728516, "global_step": 571257, "epoch": 6882} {"train_loss": -27.509916305541992, "global_step": 571258, "epoch": 6882} {"train_loss": -27.03681755065918, "global_step": 571259, "epoch": 6882} {"train_loss": -26.781721115112305, "global_step": 571260, "epoch": 6882} {"train_loss": -27.421483993530273, "global_step": 571261, "epoch": 6882} {"train_loss": -27.86124038696289, "global_step": 571262, "epoch": 6882} {"train_loss": -27.313018798828125, "global_step": 571263, "epoch": 6882} {"train_loss": -27.554962158203125, "global_step": 571264, "epoch": 6882} {"train_loss": -27.5599422454834, "global_step": 571265, "epoch": 6882} {"train_loss": -27.37314224243164, "global_step": 571266, "epoch": 6882} {"train_loss": -27.63736915588379, "global_step": 571267, "epoch": 6882} {"train_loss": -27.366418838500977, "global_step": 571268, "epoch": 6882} {"train_loss": -27.740747451782227, "global_step": 571269, "epoch": 6882} {"train_loss": -27.9379825592041, "global_step": 571270, "epoch": 6882} {"train_loss": -28.08642578125, "global_step": 571271, "epoch": 6882} {"train_loss": -27.42742347717285, "global_step": 571272, "epoch": 6882} {"train_loss": -27.777698516845703, "global_step": 571273, "epoch": 6882} {"train_loss": -28.119749069213867, "global_step": 571274, "epoch": 6882} {"train_loss": -27.81007194519043, "global_step": 571275, "epoch": 6882} {"train_loss": -27.93927001953125, "global_step": 571276, "epoch": 6882} {"train_loss": -28.00408935546875, "global_step": 571277, "epoch": 6882} {"train_loss": -27.52936363220215, "global_step": 571278, "epoch": 6882} {"train_loss": -27.836685180664062, "global_step": 571279, "epoch": 6882} {"train_loss": -27.8079833984375, "global_step": 571280, "epoch": 6882} {"train_loss": -28.091150283813477, "global_step": 571281, "epoch": 6882} {"train_loss": -27.500595092773438, "global_step": 571282, "epoch": 6882} {"train_loss": -27.512868881225586, "global_step": 571283, "epoch": 6882} {"train_loss": -27.8244686126709, "global_step": 571284, "epoch": 6882} {"train_loss": -27.49067497253418, "global_step": 571285, "epoch": 6882} {"train_loss": -27.543075561523438, "global_step": 571286, "epoch": 6882} {"train_loss": -27.92331886291504, "global_step": 571287, "epoch": 6882} {"train_loss": -27.676549819578607, "global_step": 571288, "epoch": 6882, "val_loss": 6394187.0} {"train_loss": -27.544620513916016, "global_step": 571289, "epoch": 6883} {"train_loss": -27.303058624267578, "global_step": 571290, "epoch": 6883} {"train_loss": -27.678466796875, "global_step": 571291, "epoch": 6883} {"train_loss": -27.80029296875, "global_step": 571292, "epoch": 6883} {"train_loss": -27.987634658813477, "global_step": 571293, "epoch": 6883} {"train_loss": -28.154932022094727, "global_step": 571294, "epoch": 6883} {"train_loss": -27.5515193939209, "global_step": 571295, "epoch": 6883} {"train_loss": -27.833112716674805, "global_step": 571296, "epoch": 6883} {"train_loss": -27.90705680847168, "global_step": 571297, "epoch": 6883} {"train_loss": -27.660608291625977, "global_step": 571298, "epoch": 6883} {"train_loss": -28.074176788330078, "global_step": 571299, "epoch": 6883} {"train_loss": -27.329381942749023, "global_step": 571300, "epoch": 6883} {"train_loss": -27.856170654296875, "global_step": 571301, "epoch": 6883} {"train_loss": -28.156095504760742, "global_step": 571302, "epoch": 6883} {"train_loss": -27.80975914001465, "global_step": 571303, "epoch": 6883} {"train_loss": -28.22498893737793, "global_step": 571304, "epoch": 6883} {"train_loss": -27.81609535217285, "global_step": 571305, "epoch": 6883} {"train_loss": -27.936437606811523, "global_step": 571306, "epoch": 6883} {"train_loss": -27.999372482299805, "global_step": 571307, "epoch": 6883} {"train_loss": -27.995635986328125, "global_step": 571308, "epoch": 6883} {"train_loss": -27.819910049438477, "global_step": 571309, "epoch": 6883} {"train_loss": -27.940540313720703, "global_step": 571310, "epoch": 6883} {"train_loss": -28.04201316833496, "global_step": 571311, "epoch": 6883} {"train_loss": -28.038776397705078, "global_step": 571312, "epoch": 6883} {"train_loss": -28.047780990600586, "global_step": 571313, "epoch": 6883} {"train_loss": -27.57850456237793, "global_step": 571314, "epoch": 6883} {"train_loss": -28.300369262695312, "global_step": 571315, "epoch": 6883} {"train_loss": -28.0833740234375, "global_step": 571316, "epoch": 6883} {"train_loss": -27.910573959350586, "global_step": 571317, "epoch": 6883} {"train_loss": -27.91334342956543, "global_step": 571318, "epoch": 6883} {"train_loss": -28.172931671142578, "global_step": 571319, "epoch": 6883} {"train_loss": -27.51346778869629, "global_step": 571320, "epoch": 6883} {"train_loss": -27.679121017456055, "global_step": 571321, "epoch": 6883} {"train_loss": -27.891759872436523, "global_step": 571322, "epoch": 6883} {"train_loss": -28.13336753845215, "global_step": 571323, "epoch": 6883} {"train_loss": -27.731204986572266, "global_step": 571324, "epoch": 6883} {"train_loss": -27.85797691345215, "global_step": 571325, "epoch": 6883} {"train_loss": -27.6732177734375, "global_step": 571326, "epoch": 6883} {"train_loss": -27.445236206054688, "global_step": 571327, "epoch": 6883} {"train_loss": -27.298877716064453, "global_step": 571328, "epoch": 6883} {"train_loss": -27.69168472290039, "global_step": 571329, "epoch": 6883} {"train_loss": -27.876264572143555, "global_step": 571330, "epoch": 6883} {"train_loss": -27.779434204101562, "global_step": 571331, "epoch": 6883} {"train_loss": -27.966541290283203, "global_step": 571332, "epoch": 6883} {"train_loss": -28.014570236206055, "global_step": 571333, "epoch": 6883} {"train_loss": -27.872730255126953, "global_step": 571334, "epoch": 6883} {"train_loss": -27.719898223876953, "global_step": 571335, "epoch": 6883} {"train_loss": -27.806127548217773, "global_step": 571336, "epoch": 6883} {"train_loss": -28.11529541015625, "global_step": 571337, "epoch": 6883} {"train_loss": -28.133142471313477, "global_step": 571338, "epoch": 6883} {"train_loss": -28.27294921875, "global_step": 571339, "epoch": 6883} {"train_loss": -27.9538516998291, "global_step": 571340, "epoch": 6883} {"train_loss": -27.553937911987305, "global_step": 571341, "epoch": 6883} {"train_loss": -28.195907592773438, "global_step": 571342, "epoch": 6883} {"train_loss": -27.88873863220215, "global_step": 571343, "epoch": 6883} {"train_loss": -27.74293327331543, "global_step": 571344, "epoch": 6883} {"train_loss": -28.40144157409668, "global_step": 571345, "epoch": 6883} {"train_loss": -27.89794921875, "global_step": 571346, "epoch": 6883} {"train_loss": -27.781253814697266, "global_step": 571347, "epoch": 6883} {"train_loss": -28.169843673706055, "global_step": 571348, "epoch": 6883} {"train_loss": -27.695831298828125, "global_step": 571349, "epoch": 6883} {"train_loss": -27.765430450439453, "global_step": 571350, "epoch": 6883} {"train_loss": -27.790607452392578, "global_step": 571351, "epoch": 6883} {"train_loss": -27.148481369018555, "global_step": 571352, "epoch": 6883} {"train_loss": -28.022354125976562, "global_step": 571353, "epoch": 6883} {"train_loss": -27.675796508789062, "global_step": 571354, "epoch": 6883} {"train_loss": -28.102054595947266, "global_step": 571355, "epoch": 6883} {"train_loss": -27.890827178955078, "global_step": 571356, "epoch": 6883} {"train_loss": -27.922882080078125, "global_step": 571357, "epoch": 6883} {"train_loss": -27.893268585205078, "global_step": 571358, "epoch": 6883} {"train_loss": -27.993579864501953, "global_step": 571359, "epoch": 6883} {"train_loss": -27.858245849609375, "global_step": 571360, "epoch": 6883} {"train_loss": -27.707117080688477, "global_step": 571361, "epoch": 6883} {"train_loss": -27.85849952697754, "global_step": 571362, "epoch": 6883} {"train_loss": -28.059589385986328, "global_step": 571363, "epoch": 6883} {"train_loss": -28.029132843017578, "global_step": 571364, "epoch": 6883} {"train_loss": -28.256458282470703, "global_step": 571365, "epoch": 6883} {"train_loss": -28.328353881835938, "global_step": 571366, "epoch": 6883} {"train_loss": -27.661230087280273, "global_step": 571367, "epoch": 6883} {"train_loss": -27.73308753967285, "global_step": 571368, "epoch": 6883} {"train_loss": -28.350000381469727, "global_step": 571369, "epoch": 6883} {"train_loss": -27.6292781829834, "global_step": 571370, "epoch": 6883} {"train_loss": -27.865375105156957, "global_step": 571371, "epoch": 6883, "val_loss": 6410846.5} {"train_loss": -27.63079833984375, "global_step": 571372, "epoch": 6884} {"train_loss": -26.48948097229004, "global_step": 571373, "epoch": 6884} {"train_loss": -25.83245277404785, "global_step": 571374, "epoch": 6884} {"train_loss": -25.170949935913086, "global_step": 571375, "epoch": 6884} {"train_loss": -26.171741485595703, "global_step": 571376, "epoch": 6884} {"train_loss": -27.023807525634766, "global_step": 571377, "epoch": 6884} {"train_loss": -26.98200035095215, "global_step": 571378, "epoch": 6884} {"train_loss": -27.035085678100586, "global_step": 571379, "epoch": 6884} {"train_loss": -27.271469116210938, "global_step": 571380, "epoch": 6884} {"train_loss": -27.047266006469727, "global_step": 571381, "epoch": 6884} {"train_loss": -27.4594783782959, "global_step": 571382, "epoch": 6884} {"train_loss": -27.385549545288086, "global_step": 571383, "epoch": 6884} {"train_loss": -27.2457218170166, "global_step": 571384, "epoch": 6884} {"train_loss": -27.4508056640625, "global_step": 571385, "epoch": 6884} {"train_loss": -27.503393173217773, "global_step": 571386, "epoch": 6884} {"train_loss": -27.489511489868164, "global_step": 571387, "epoch": 6884} {"train_loss": -27.40765953063965, "global_step": 571388, "epoch": 6884} {"train_loss": -27.607946395874023, "global_step": 571389, "epoch": 6884} {"train_loss": -27.688215255737305, "global_step": 571390, "epoch": 6884} {"train_loss": -27.69852066040039, "global_step": 571391, "epoch": 6884} {"train_loss": -27.495492935180664, "global_step": 571392, "epoch": 6884} {"train_loss": -27.498981475830078, "global_step": 571393, "epoch": 6884} {"train_loss": -27.362512588500977, "global_step": 571394, "epoch": 6884} {"train_loss": -27.622800827026367, "global_step": 571395, "epoch": 6884} {"train_loss": -27.686004638671875, "global_step": 571396, "epoch": 6884} {"train_loss": -27.814252853393555, "global_step": 571397, "epoch": 6884} {"train_loss": -27.942045211791992, "global_step": 571398, "epoch": 6884} {"train_loss": -27.698286056518555, "global_step": 571399, "epoch": 6884} {"train_loss": -27.339645385742188, "global_step": 571400, "epoch": 6884} {"train_loss": -27.995630264282227, "global_step": 571401, "epoch": 6884} {"train_loss": -28.016223907470703, "global_step": 571402, "epoch": 6884} {"train_loss": -27.74692153930664, "global_step": 571403, "epoch": 6884} {"train_loss": -27.550012588500977, "global_step": 571404, "epoch": 6884} {"train_loss": -27.825687408447266, "global_step": 571405, "epoch": 6884} {"train_loss": -28.1058406829834, "global_step": 571406, "epoch": 6884} {"train_loss": -27.8438720703125, "global_step": 571407, "epoch": 6884} {"train_loss": -27.65081214904785, "global_step": 571408, "epoch": 6884} {"train_loss": -27.945398330688477, "global_step": 571409, "epoch": 6884} {"train_loss": -28.154279708862305, "global_step": 571410, "epoch": 6884} {"train_loss": -28.31129264831543, "global_step": 571411, "epoch": 6884} {"train_loss": -27.967206954956055, "global_step": 571412, "epoch": 6884} {"train_loss": -27.7977294921875, "global_step": 571413, "epoch": 6884} {"train_loss": -28.380178451538086, "global_step": 571414, "epoch": 6884} {"train_loss": -28.300806045532227, "global_step": 571415, "epoch": 6884} {"train_loss": -28.405481338500977, "global_step": 571416, "epoch": 6884} {"train_loss": -28.018390655517578, "global_step": 571417, "epoch": 6884} {"train_loss": -27.943866729736328, "global_step": 571418, "epoch": 6884} {"train_loss": -28.3055419921875, "global_step": 571419, "epoch": 6884} {"train_loss": -28.11835289001465, "global_step": 571420, "epoch": 6884} {"train_loss": -27.857624053955078, "global_step": 571421, "epoch": 6884} {"train_loss": -27.77707862854004, "global_step": 571422, "epoch": 6884} {"train_loss": -28.40542984008789, "global_step": 571423, "epoch": 6884} {"train_loss": -28.1966552734375, "global_step": 571424, "epoch": 6884} {"train_loss": -27.76210594177246, "global_step": 571425, "epoch": 6884} {"train_loss": -28.42201805114746, "global_step": 571426, "epoch": 6884} {"train_loss": -27.705066680908203, "global_step": 571427, "epoch": 6884} {"train_loss": -28.100610733032227, "global_step": 571428, "epoch": 6884} {"train_loss": -27.564044952392578, "global_step": 571429, "epoch": 6884} {"train_loss": -28.242691040039062, "global_step": 571430, "epoch": 6884} {"train_loss": -27.786285400390625, "global_step": 571431, "epoch": 6884} {"train_loss": -27.882917404174805, "global_step": 571432, "epoch": 6884} {"train_loss": -27.925718307495117, "global_step": 571433, "epoch": 6884} {"train_loss": -27.851694107055664, "global_step": 571434, "epoch": 6884} {"train_loss": -27.729206085205078, "global_step": 571435, "epoch": 6884} {"train_loss": -27.9294490814209, "global_step": 571436, "epoch": 6884} {"train_loss": -28.063034057617188, "global_step": 571437, "epoch": 6884} {"train_loss": -27.783466339111328, "global_step": 571438, "epoch": 6884} {"train_loss": -28.007978439331055, "global_step": 571439, "epoch": 6884} {"train_loss": -28.146759033203125, "global_step": 571440, "epoch": 6884} {"train_loss": -28.112289428710938, "global_step": 571441, "epoch": 6884} {"train_loss": -28.268842697143555, "global_step": 571442, "epoch": 6884} {"train_loss": -28.170103073120117, "global_step": 571443, "epoch": 6884} {"train_loss": -27.7679386138916, "global_step": 571444, "epoch": 6884} {"train_loss": -27.8535213470459, "global_step": 571445, "epoch": 6884} {"train_loss": -27.83066749572754, "global_step": 571446, "epoch": 6884} {"train_loss": -28.526111602783203, "global_step": 571447, "epoch": 6884} {"train_loss": -27.9511661529541, "global_step": 571448, "epoch": 6884} {"train_loss": -28.017675399780273, "global_step": 571449, "epoch": 6884} {"train_loss": -27.97420310974121, "global_step": 571450, "epoch": 6884} {"train_loss": -27.986133575439453, "global_step": 571451, "epoch": 6884} {"train_loss": -27.988073348999023, "global_step": 571452, "epoch": 6884} {"train_loss": -28.343677520751953, "global_step": 571453, "epoch": 6884} {"train_loss": -27.72565446417016, "global_step": 571454, "epoch": 6884, "val_loss": 6414825.0} {"train_loss": -25.835819244384766, "global_step": 571455, "epoch": 6885} {"train_loss": -25.31821060180664, "global_step": 571456, "epoch": 6885} {"train_loss": -26.051116943359375, "global_step": 571457, "epoch": 6885} {"train_loss": -26.792505264282227, "global_step": 571458, "epoch": 6885} {"train_loss": -26.76154899597168, "global_step": 571459, "epoch": 6885} {"train_loss": -26.981481552124023, "global_step": 571460, "epoch": 6885} {"train_loss": -26.72760581970215, "global_step": 571461, "epoch": 6885} {"train_loss": -27.5199031829834, "global_step": 571462, "epoch": 6885} {"train_loss": -27.423492431640625, "global_step": 571463, "epoch": 6885} {"train_loss": -27.459259033203125, "global_step": 571464, "epoch": 6885} {"train_loss": -26.915449142456055, "global_step": 571465, "epoch": 6885} {"train_loss": -27.24749183654785, "global_step": 571466, "epoch": 6885} {"train_loss": -27.66366958618164, "global_step": 571467, "epoch": 6885} {"train_loss": -27.337879180908203, "global_step": 571468, "epoch": 6885} {"train_loss": -27.616790771484375, "global_step": 571469, "epoch": 6885} {"train_loss": -27.556955337524414, "global_step": 571470, "epoch": 6885} {"train_loss": -27.177785873413086, "global_step": 571471, "epoch": 6885} {"train_loss": -27.481138229370117, "global_step": 571472, "epoch": 6885} {"train_loss": -27.675668716430664, "global_step": 571473, "epoch": 6885} {"train_loss": -27.762136459350586, "global_step": 571474, "epoch": 6885} {"train_loss": -27.489532470703125, "global_step": 571475, "epoch": 6885} {"train_loss": -27.371597290039062, "global_step": 571476, "epoch": 6885} {"train_loss": -27.59220314025879, "global_step": 571477, "epoch": 6885} {"train_loss": -27.348615646362305, "global_step": 571478, "epoch": 6885} {"train_loss": -27.5751953125, "global_step": 571479, "epoch": 6885} {"train_loss": -27.423437118530273, "global_step": 571480, "epoch": 6885} {"train_loss": -27.363019943237305, "global_step": 571481, "epoch": 6885} {"train_loss": -27.345752716064453, "global_step": 571482, "epoch": 6885} {"train_loss": -27.443531036376953, "global_step": 571483, "epoch": 6885} {"train_loss": -27.667240142822266, "global_step": 571484, "epoch": 6885} {"train_loss": -27.753543853759766, "global_step": 571485, "epoch": 6885} {"train_loss": -27.507007598876953, "global_step": 571486, "epoch": 6885} {"train_loss": -27.28278160095215, "global_step": 571487, "epoch": 6885} {"train_loss": -27.61417579650879, "global_step": 571488, "epoch": 6885} {"train_loss": -27.25461196899414, "global_step": 571489, "epoch": 6885} {"train_loss": -27.8436222076416, "global_step": 571490, "epoch": 6885} {"train_loss": -27.996749877929688, "global_step": 571491, "epoch": 6885} {"train_loss": -27.558263778686523, "global_step": 571492, "epoch": 6885} {"train_loss": -27.629730224609375, "global_step": 571493, "epoch": 6885} {"train_loss": -28.149860382080078, "global_step": 571494, "epoch": 6885} {"train_loss": -27.84762954711914, "global_step": 571495, "epoch": 6885} {"train_loss": -27.79745864868164, "global_step": 571496, "epoch": 6885} {"train_loss": -27.718231201171875, "global_step": 571497, "epoch": 6885} {"train_loss": -27.607513427734375, "global_step": 571498, "epoch": 6885} {"train_loss": -27.87550163269043, "global_step": 571499, "epoch": 6885} {"train_loss": -27.762704849243164, "global_step": 571500, "epoch": 6885} {"train_loss": -27.650598526000977, "global_step": 571501, "epoch": 6885} {"train_loss": -27.903593063354492, "global_step": 571502, "epoch": 6885} {"train_loss": -27.933185577392578, "global_step": 571503, "epoch": 6885} {"train_loss": -27.729284286499023, "global_step": 571504, "epoch": 6885} {"train_loss": -27.9140682220459, "global_step": 571505, "epoch": 6885} {"train_loss": -28.25628089904785, "global_step": 571506, "epoch": 6885} {"train_loss": -27.836780548095703, "global_step": 571507, "epoch": 6885} {"train_loss": -27.913862228393555, "global_step": 571508, "epoch": 6885} {"train_loss": -27.60529899597168, "global_step": 571509, "epoch": 6885} {"train_loss": -28.049713134765625, "global_step": 571510, "epoch": 6885} {"train_loss": -27.872888565063477, "global_step": 571511, "epoch": 6885} {"train_loss": -27.80952262878418, "global_step": 571512, "epoch": 6885} {"train_loss": -28.04786491394043, "global_step": 571513, "epoch": 6885} {"train_loss": -28.080493927001953, "global_step": 571514, "epoch": 6885} {"train_loss": -28.339441299438477, "global_step": 571515, "epoch": 6885} {"train_loss": -27.84731101989746, "global_step": 571516, "epoch": 6885} {"train_loss": -27.61060905456543, "global_step": 571517, "epoch": 6885} {"train_loss": -28.350833892822266, "global_step": 571518, "epoch": 6885} {"train_loss": -27.861438751220703, "global_step": 571519, "epoch": 6885} {"train_loss": -27.71771812438965, "global_step": 571520, "epoch": 6885} {"train_loss": -27.616479873657227, "global_step": 571521, "epoch": 6885} {"train_loss": -28.1845760345459, "global_step": 571522, "epoch": 6885} {"train_loss": -27.853322982788086, "global_step": 571523, "epoch": 6885} {"train_loss": -27.701465606689453, "global_step": 571524, "epoch": 6885} {"train_loss": -27.955060958862305, "global_step": 571525, "epoch": 6885} {"train_loss": -28.164459228515625, "global_step": 571526, "epoch": 6885} {"train_loss": -27.965368270874023, "global_step": 571527, "epoch": 6885} {"train_loss": -27.845626831054688, "global_step": 571528, "epoch": 6885} {"train_loss": -27.726572036743164, "global_step": 571529, "epoch": 6885} {"train_loss": -27.673980712890625, "global_step": 571530, "epoch": 6885} {"train_loss": -27.957782745361328, "global_step": 571531, "epoch": 6885} {"train_loss": -27.894805908203125, "global_step": 571532, "epoch": 6885} {"train_loss": -28.456518173217773, "global_step": 571533, "epoch": 6885} {"train_loss": -27.958005905151367, "global_step": 571534, "epoch": 6885} {"train_loss": -27.932748794555664, "global_step": 571535, "epoch": 6885} {"train_loss": -27.736600875854492, "global_step": 571536, "epoch": 6885} {"train_loss": -27.622836239366645, "global_step": 571537, "epoch": 6885, "val_loss": 6393002.0} {"train_loss": -27.51436424255371, "global_step": 571538, "epoch": 6886} {"train_loss": -27.459930419921875, "global_step": 571539, "epoch": 6886} {"train_loss": -27.4456787109375, "global_step": 571540, "epoch": 6886} {"train_loss": -27.443342208862305, "global_step": 571541, "epoch": 6886} {"train_loss": -27.607177734375, "global_step": 571542, "epoch": 6886} {"train_loss": -27.05975341796875, "global_step": 571543, "epoch": 6886} {"train_loss": -26.72247886657715, "global_step": 571544, "epoch": 6886} {"train_loss": -26.6199951171875, "global_step": 571545, "epoch": 6886} {"train_loss": -27.152860641479492, "global_step": 571546, "epoch": 6886} {"train_loss": -27.12015724182129, "global_step": 571547, "epoch": 6886} {"train_loss": -27.4896183013916, "global_step": 571548, "epoch": 6886} {"train_loss": -27.533050537109375, "global_step": 571549, "epoch": 6886} {"train_loss": -27.628421783447266, "global_step": 571550, "epoch": 6886} {"train_loss": -27.438159942626953, "global_step": 571551, "epoch": 6886} {"train_loss": -27.502899169921875, "global_step": 571552, "epoch": 6886} {"train_loss": -27.780927658081055, "global_step": 571553, "epoch": 6886} {"train_loss": -27.63783836364746, "global_step": 571554, "epoch": 6886} {"train_loss": -27.257953643798828, "global_step": 571555, "epoch": 6886} {"train_loss": -27.310535430908203, "global_step": 571556, "epoch": 6886} {"train_loss": -27.81776237487793, "global_step": 571557, "epoch": 6886} {"train_loss": -27.71652603149414, "global_step": 571558, "epoch": 6886} {"train_loss": -27.49966812133789, "global_step": 571559, "epoch": 6886} {"train_loss": -27.373676300048828, "global_step": 571560, "epoch": 6886} {"train_loss": -27.472370147705078, "global_step": 571561, "epoch": 6886} {"train_loss": -27.939468383789062, "global_step": 571562, "epoch": 6886} {"train_loss": -27.798816680908203, "global_step": 571563, "epoch": 6886} {"train_loss": -27.4713077545166, "global_step": 571564, "epoch": 6886} {"train_loss": -27.525930404663086, "global_step": 571565, "epoch": 6886} {"train_loss": -27.424407958984375, "global_step": 571566, "epoch": 6886} {"train_loss": -27.49755859375, "global_step": 571567, "epoch": 6886} {"train_loss": -27.896926879882812, "global_step": 571568, "epoch": 6886} {"train_loss": -27.590362548828125, "global_step": 571569, "epoch": 6886} {"train_loss": -27.727741241455078, "global_step": 571570, "epoch": 6886} {"train_loss": -27.630664825439453, "global_step": 571571, "epoch": 6886} {"train_loss": -27.462018966674805, "global_step": 571572, "epoch": 6886} {"train_loss": -27.745763778686523, "global_step": 571573, "epoch": 6886} {"train_loss": -27.751977920532227, "global_step": 571574, "epoch": 6886} {"train_loss": -27.710987091064453, "global_step": 571575, "epoch": 6886} {"train_loss": -27.808780670166016, "global_step": 571576, "epoch": 6886} {"train_loss": -27.80146598815918, "global_step": 571577, "epoch": 6886} {"train_loss": -28.14521598815918, "global_step": 571578, "epoch": 6886} {"train_loss": -27.904211044311523, "global_step": 571579, "epoch": 6886} {"train_loss": -28.357980728149414, "global_step": 571580, "epoch": 6886} {"train_loss": -28.02187156677246, "global_step": 571581, "epoch": 6886} {"train_loss": -28.179065704345703, "global_step": 571582, "epoch": 6886} {"train_loss": -28.052021026611328, "global_step": 571583, "epoch": 6886} {"train_loss": -28.065282821655273, "global_step": 571584, "epoch": 6886} {"train_loss": -28.09427261352539, "global_step": 571585, "epoch": 6886} {"train_loss": -27.968708038330078, "global_step": 571586, "epoch": 6886} {"train_loss": -27.7567195892334, "global_step": 571587, "epoch": 6886} {"train_loss": -27.8764705657959, "global_step": 571588, "epoch": 6886} {"train_loss": -28.23317527770996, "global_step": 571589, "epoch": 6886} {"train_loss": -28.198078155517578, "global_step": 571590, "epoch": 6886} {"train_loss": -28.127777099609375, "global_step": 571591, "epoch": 6886} {"train_loss": -27.71148681640625, "global_step": 571592, "epoch": 6886} {"train_loss": -28.23951530456543, "global_step": 571593, "epoch": 6886} {"train_loss": -27.904632568359375, "global_step": 571594, "epoch": 6886} {"train_loss": -28.01563835144043, "global_step": 571595, "epoch": 6886} {"train_loss": -28.372961044311523, "global_step": 571596, "epoch": 6886} {"train_loss": -28.253950119018555, "global_step": 571597, "epoch": 6886} {"train_loss": -27.95096206665039, "global_step": 571598, "epoch": 6886} {"train_loss": -27.856027603149414, "global_step": 571599, "epoch": 6886} {"train_loss": -28.08477210998535, "global_step": 571600, "epoch": 6886} {"train_loss": -28.030237197875977, "global_step": 571601, "epoch": 6886} {"train_loss": -28.19732093811035, "global_step": 571602, "epoch": 6886} {"train_loss": -27.869037628173828, "global_step": 571603, "epoch": 6886} {"train_loss": -28.201751708984375, "global_step": 571604, "epoch": 6886} {"train_loss": -28.033863067626953, "global_step": 571605, "epoch": 6886} {"train_loss": -27.83246421813965, "global_step": 571606, "epoch": 6886} {"train_loss": -27.783430099487305, "global_step": 571607, "epoch": 6886} {"train_loss": -27.909076690673828, "global_step": 571608, "epoch": 6886} {"train_loss": -28.22391700744629, "global_step": 571609, "epoch": 6886} {"train_loss": -27.781782150268555, "global_step": 571610, "epoch": 6886} {"train_loss": -28.417123794555664, "global_step": 571611, "epoch": 6886} {"train_loss": -28.19972038269043, "global_step": 571612, "epoch": 6886} {"train_loss": -27.394994735717773, "global_step": 571613, "epoch": 6886} {"train_loss": -26.819616317749023, "global_step": 571614, "epoch": 6886} {"train_loss": -27.44301414489746, "global_step": 571615, "epoch": 6886} {"train_loss": -26.862058639526367, "global_step": 571616, "epoch": 6886} {"train_loss": -27.37693214416504, "global_step": 571617, "epoch": 6886} {"train_loss": -28.026029586791992, "global_step": 571618, "epoch": 6886} {"train_loss": -27.714391708374023, "global_step": 571619, "epoch": 6886} {"train_loss": -27.7176691308079, "global_step": 571620, "epoch": 6886, "val_loss": 6474768.0} {"train_loss": -26.263830184936523, "global_step": 571621, "epoch": 6887} {"train_loss": -27.07636070251465, "global_step": 571622, "epoch": 6887} {"train_loss": -27.396432876586914, "global_step": 571623, "epoch": 6887} {"train_loss": -26.849409103393555, "global_step": 571624, "epoch": 6887} {"train_loss": -26.661361694335938, "global_step": 571625, "epoch": 6887} {"train_loss": -27.2849178314209, "global_step": 571626, "epoch": 6887} {"train_loss": -27.533899307250977, "global_step": 571627, "epoch": 6887} {"train_loss": -27.25385856628418, "global_step": 571628, "epoch": 6887} {"train_loss": -27.712207794189453, "global_step": 571629, "epoch": 6887} {"train_loss": -27.704273223876953, "global_step": 571630, "epoch": 6887} {"train_loss": -27.5229434967041, "global_step": 571631, "epoch": 6887} {"train_loss": -27.345081329345703, "global_step": 571632, "epoch": 6887} {"train_loss": -27.421117782592773, "global_step": 571633, "epoch": 6887} {"train_loss": -27.37225341796875, "global_step": 571634, "epoch": 6887} {"train_loss": -27.895292282104492, "global_step": 571635, "epoch": 6887} {"train_loss": -27.73438835144043, "global_step": 571636, "epoch": 6887} {"train_loss": -27.52924919128418, "global_step": 571637, "epoch": 6887} {"train_loss": -27.829030990600586, "global_step": 571638, "epoch": 6887} {"train_loss": -27.77716636657715, "global_step": 571639, "epoch": 6887} {"train_loss": -27.80463218688965, "global_step": 571640, "epoch": 6887} {"train_loss": -27.95490074157715, "global_step": 571641, "epoch": 6887} {"train_loss": -27.5639591217041, "global_step": 571642, "epoch": 6887} {"train_loss": -27.46122169494629, "global_step": 571643, "epoch": 6887} {"train_loss": -27.945215225219727, "global_step": 571644, "epoch": 6887} {"train_loss": -27.733366012573242, "global_step": 571645, "epoch": 6887} {"train_loss": -28.029022216796875, "global_step": 571646, "epoch": 6887} {"train_loss": -27.627328872680664, "global_step": 571647, "epoch": 6887} {"train_loss": -27.728586196899414, "global_step": 571648, "epoch": 6887} {"train_loss": -27.71044921875, "global_step": 571649, "epoch": 6887} {"train_loss": -28.270511627197266, "global_step": 571650, "epoch": 6887} {"train_loss": -27.646127700805664, "global_step": 571651, "epoch": 6887} {"train_loss": -27.373031616210938, "global_step": 571652, "epoch": 6887} {"train_loss": -28.052616119384766, "global_step": 571653, "epoch": 6887} {"train_loss": -27.9221134185791, "global_step": 571654, "epoch": 6887} {"train_loss": -27.964452743530273, "global_step": 571655, "epoch": 6887} {"train_loss": -28.181806564331055, "global_step": 571656, "epoch": 6887} {"train_loss": -28.1220703125, "global_step": 571657, "epoch": 6887} {"train_loss": -28.0673828125, "global_step": 571658, "epoch": 6887} {"train_loss": -27.677204132080078, "global_step": 571659, "epoch": 6887} {"train_loss": -27.80622673034668, "global_step": 571660, "epoch": 6887} {"train_loss": -28.05118751525879, "global_step": 571661, "epoch": 6887} {"train_loss": -27.729598999023438, "global_step": 571662, "epoch": 6887} {"train_loss": -28.106664657592773, "global_step": 571663, "epoch": 6887} {"train_loss": -28.24530029296875, "global_step": 571664, "epoch": 6887} {"train_loss": -28.16470718383789, "global_step": 571665, "epoch": 6887} {"train_loss": -28.079999923706055, "global_step": 571666, "epoch": 6887} {"train_loss": -27.872013092041016, "global_step": 571667, "epoch": 6887} {"train_loss": -28.03460121154785, "global_step": 571668, "epoch": 6887} {"train_loss": -28.201282501220703, "global_step": 571669, "epoch": 6887} {"train_loss": -28.075681686401367, "global_step": 571670, "epoch": 6887} {"train_loss": -28.329259872436523, "global_step": 571671, "epoch": 6887} {"train_loss": -27.785032272338867, "global_step": 571672, "epoch": 6887} {"train_loss": -27.812891006469727, "global_step": 571673, "epoch": 6887} {"train_loss": -27.815778732299805, "global_step": 571674, "epoch": 6887} {"train_loss": -27.800601959228516, "global_step": 571675, "epoch": 6887} {"train_loss": -28.150793075561523, "global_step": 571676, "epoch": 6887} {"train_loss": -28.221654891967773, "global_step": 571677, "epoch": 6887} {"train_loss": -27.795902252197266, "global_step": 571678, "epoch": 6887} {"train_loss": -27.48940086364746, "global_step": 571679, "epoch": 6887} {"train_loss": -27.960229873657227, "global_step": 571680, "epoch": 6887} {"train_loss": -27.675216674804688, "global_step": 571681, "epoch": 6887} {"train_loss": -27.6165828704834, "global_step": 571682, "epoch": 6887} {"train_loss": -27.54815673828125, "global_step": 571683, "epoch": 6887} {"train_loss": -27.416336059570312, "global_step": 571684, "epoch": 6887} {"train_loss": -27.26954460144043, "global_step": 571685, "epoch": 6887} {"train_loss": -27.2911376953125, "global_step": 571686, "epoch": 6887} {"train_loss": -28.147851943969727, "global_step": 571687, "epoch": 6887} {"train_loss": -27.708118438720703, "global_step": 571688, "epoch": 6887} {"train_loss": -27.536224365234375, "global_step": 571689, "epoch": 6887} {"train_loss": -27.77387809753418, "global_step": 571690, "epoch": 6887} {"train_loss": -27.460296630859375, "global_step": 571691, "epoch": 6887} {"train_loss": -27.87244987487793, "global_step": 571692, "epoch": 6887} {"train_loss": -27.611515045166016, "global_step": 571693, "epoch": 6887} {"train_loss": -27.540435791015625, "global_step": 571694, "epoch": 6887} {"train_loss": -27.413776397705078, "global_step": 571695, "epoch": 6887} {"train_loss": -27.57661247253418, "global_step": 571696, "epoch": 6887} {"train_loss": -27.02850914001465, "global_step": 571697, "epoch": 6887} {"train_loss": -27.320648193359375, "global_step": 571698, "epoch": 6887} {"train_loss": -27.78862953186035, "global_step": 571699, "epoch": 6887} {"train_loss": -27.59395408630371, "global_step": 571700, "epoch": 6887} {"train_loss": -27.48963737487793, "global_step": 571701, "epoch": 6887} {"train_loss": -27.952184677124023, "global_step": 571702, "epoch": 6887} {"train_loss": -27.69875252964985, "global_step": 571703, "epoch": 6887, "val_loss": 6539769.0} {"train_loss": -26.314746856689453, "global_step": 571704, "epoch": 6888} {"train_loss": -25.225149154663086, "global_step": 571705, "epoch": 6888} {"train_loss": -27.031362533569336, "global_step": 571706, "epoch": 6888} {"train_loss": -26.848310470581055, "global_step": 571707, "epoch": 6888} {"train_loss": -26.98813247680664, "global_step": 571708, "epoch": 6888} {"train_loss": -27.356409072875977, "global_step": 571709, "epoch": 6888} {"train_loss": -27.026655197143555, "global_step": 571710, "epoch": 6888} {"train_loss": -27.23744010925293, "global_step": 571711, "epoch": 6888} {"train_loss": -27.240341186523438, "global_step": 571712, "epoch": 6888} {"train_loss": -26.751386642456055, "global_step": 571713, "epoch": 6888} {"train_loss": -27.54513931274414, "global_step": 571714, "epoch": 6888} {"train_loss": -27.099695205688477, "global_step": 571715, "epoch": 6888} {"train_loss": -27.286731719970703, "global_step": 571716, "epoch": 6888} {"train_loss": -27.168628692626953, "global_step": 571717, "epoch": 6888} {"train_loss": -27.426822662353516, "global_step": 571718, "epoch": 6888} {"train_loss": -27.71245765686035, "global_step": 571719, "epoch": 6888} {"train_loss": -27.627546310424805, "global_step": 571720, "epoch": 6888} {"train_loss": -27.244367599487305, "global_step": 571721, "epoch": 6888} {"train_loss": -27.25322914123535, "global_step": 571722, "epoch": 6888} {"train_loss": -27.780736923217773, "global_step": 571723, "epoch": 6888} {"train_loss": -27.457935333251953, "global_step": 571724, "epoch": 6888} {"train_loss": -27.612457275390625, "global_step": 571725, "epoch": 6888} {"train_loss": -27.555810928344727, "global_step": 571726, "epoch": 6888} {"train_loss": -27.594318389892578, "global_step": 571727, "epoch": 6888} {"train_loss": -27.681365966796875, "global_step": 571728, "epoch": 6888} {"train_loss": -27.382099151611328, "global_step": 571729, "epoch": 6888} {"train_loss": -27.695301055908203, "global_step": 571730, "epoch": 6888} {"train_loss": -27.61104393005371, "global_step": 571731, "epoch": 6888} {"train_loss": -28.033491134643555, "global_step": 571732, "epoch": 6888} {"train_loss": -27.503498077392578, "global_step": 571733, "epoch": 6888} {"train_loss": -28.024518966674805, "global_step": 571734, "epoch": 6888} {"train_loss": -27.914304733276367, "global_step": 571735, "epoch": 6888} {"train_loss": -27.52362060546875, "global_step": 571736, "epoch": 6888} {"train_loss": -28.184545516967773, "global_step": 571737, "epoch": 6888} {"train_loss": -28.01788330078125, "global_step": 571738, "epoch": 6888} {"train_loss": -28.12885856628418, "global_step": 571739, "epoch": 6888} {"train_loss": -28.17295265197754, "global_step": 571740, "epoch": 6888} {"train_loss": -27.691553115844727, "global_step": 571741, "epoch": 6888} {"train_loss": -27.71637535095215, "global_step": 571742, "epoch": 6888} {"train_loss": -27.82118034362793, "global_step": 571743, "epoch": 6888} {"train_loss": -27.945606231689453, "global_step": 571744, "epoch": 6888} {"train_loss": -27.983230590820312, "global_step": 571745, "epoch": 6888} {"train_loss": -28.154882431030273, "global_step": 571746, "epoch": 6888} {"train_loss": -28.14847183227539, "global_step": 571747, "epoch": 6888} {"train_loss": -27.92804527282715, "global_step": 571748, "epoch": 6888} {"train_loss": -28.118423461914062, "global_step": 571749, "epoch": 6888} {"train_loss": -28.210041046142578, "global_step": 571750, "epoch": 6888} {"train_loss": -28.038488388061523, "global_step": 571751, "epoch": 6888} {"train_loss": -27.77734375, "global_step": 571752, "epoch": 6888} {"train_loss": -27.8149471282959, "global_step": 571753, "epoch": 6888} {"train_loss": -27.92473793029785, "global_step": 571754, "epoch": 6888} {"train_loss": -27.78680992126465, "global_step": 571755, "epoch": 6888} {"train_loss": -28.454702377319336, "global_step": 571756, "epoch": 6888} {"train_loss": -28.25341796875, "global_step": 571757, "epoch": 6888} {"train_loss": -28.25142478942871, "global_step": 571758, "epoch": 6888} {"train_loss": -28.100177764892578, "global_step": 571759, "epoch": 6888} {"train_loss": -28.2723388671875, "global_step": 571760, "epoch": 6888} {"train_loss": -28.07599449157715, "global_step": 571761, "epoch": 6888} {"train_loss": -28.214014053344727, "global_step": 571762, "epoch": 6888} {"train_loss": -28.37922477722168, "global_step": 571763, "epoch": 6888} {"train_loss": -28.29572868347168, "global_step": 571764, "epoch": 6888} {"train_loss": -27.962158203125, "global_step": 571765, "epoch": 6888} {"train_loss": -27.89337158203125, "global_step": 571766, "epoch": 6888} {"train_loss": -27.616872787475586, "global_step": 571767, "epoch": 6888} {"train_loss": -27.640039443969727, "global_step": 571768, "epoch": 6888} {"train_loss": -28.218677520751953, "global_step": 571769, "epoch": 6888} {"train_loss": -28.064023971557617, "global_step": 571770, "epoch": 6888} {"train_loss": -28.20118522644043, "global_step": 571771, "epoch": 6888} {"train_loss": -27.656997680664062, "global_step": 571772, "epoch": 6888} {"train_loss": -27.805810928344727, "global_step": 571773, "epoch": 6888} {"train_loss": -27.906173706054688, "global_step": 571774, "epoch": 6888} {"train_loss": -27.61928367614746, "global_step": 571775, "epoch": 6888} {"train_loss": -27.742883682250977, "global_step": 571776, "epoch": 6888} {"train_loss": -27.9511775970459, "global_step": 571777, "epoch": 6888} {"train_loss": -28.249526977539062, "global_step": 571778, "epoch": 6888} {"train_loss": -27.85895347595215, "global_step": 571779, "epoch": 6888} {"train_loss": -27.55832862854004, "global_step": 571780, "epoch": 6888} {"train_loss": -28.520986557006836, "global_step": 571781, "epoch": 6888} {"train_loss": -28.15833854675293, "global_step": 571782, "epoch": 6888} {"train_loss": -27.6774959564209, "global_step": 571783, "epoch": 6888} {"train_loss": -28.09576988220215, "global_step": 571784, "epoch": 6888} {"train_loss": -27.985692977905273, "global_step": 571785, "epoch": 6888} {"train_loss": -27.725172548408967, "global_step": 571786, "epoch": 6888, "val_loss": 6413054.0} {"train_loss": -27.71706199645996, "global_step": 571787, "epoch": 6889} {"train_loss": -27.491880416870117, "global_step": 571788, "epoch": 6889} {"train_loss": -27.767745971679688, "global_step": 571789, "epoch": 6889} {"train_loss": -27.37141227722168, "global_step": 571790, "epoch": 6889} {"train_loss": -27.623493194580078, "global_step": 571791, "epoch": 6889} {"train_loss": -27.146957397460938, "global_step": 571792, "epoch": 6889} {"train_loss": -27.869897842407227, "global_step": 571793, "epoch": 6889} {"train_loss": -27.58418083190918, "global_step": 571794, "epoch": 6889} {"train_loss": -27.444171905517578, "global_step": 571795, "epoch": 6889} {"train_loss": -27.519338607788086, "global_step": 571796, "epoch": 6889} {"train_loss": -27.617630004882812, "global_step": 571797, "epoch": 6889} {"train_loss": -27.56890869140625, "global_step": 571798, "epoch": 6889} {"train_loss": -27.846277236938477, "global_step": 571799, "epoch": 6889} {"train_loss": -27.750375747680664, "global_step": 571800, "epoch": 6889} {"train_loss": -27.929615020751953, "global_step": 571801, "epoch": 6889} {"train_loss": -28.0139217376709, "global_step": 571802, "epoch": 6889} {"train_loss": -28.01283073425293, "global_step": 571803, "epoch": 6889} {"train_loss": -28.058368682861328, "global_step": 571804, "epoch": 6889} {"train_loss": -27.6911563873291, "global_step": 571805, "epoch": 6889} {"train_loss": -27.64993667602539, "global_step": 571806, "epoch": 6889} {"train_loss": -27.798078536987305, "global_step": 571807, "epoch": 6889} {"train_loss": -27.57732582092285, "global_step": 571808, "epoch": 6889} {"train_loss": -27.843643188476562, "global_step": 571809, "epoch": 6889} {"train_loss": -27.421802520751953, "global_step": 571810, "epoch": 6889} {"train_loss": -27.65069580078125, "global_step": 571811, "epoch": 6889} {"train_loss": -28.120080947875977, "global_step": 571812, "epoch": 6889} {"train_loss": -27.84186363220215, "global_step": 571813, "epoch": 6889} {"train_loss": -27.8795108795166, "global_step": 571814, "epoch": 6889} {"train_loss": -27.935338973999023, "global_step": 571815, "epoch": 6889} {"train_loss": -27.573322296142578, "global_step": 571816, "epoch": 6889} {"train_loss": -27.634357452392578, "global_step": 571817, "epoch": 6889} {"train_loss": -28.091230392456055, "global_step": 571818, "epoch": 6889} {"train_loss": -27.7470645904541, "global_step": 571819, "epoch": 6889} {"train_loss": -27.877460479736328, "global_step": 571820, "epoch": 6889} {"train_loss": -27.74497413635254, "global_step": 571821, "epoch": 6889} {"train_loss": -27.90955924987793, "global_step": 571822, "epoch": 6889} {"train_loss": -27.611669540405273, "global_step": 571823, "epoch": 6889} {"train_loss": -27.8548583984375, "global_step": 571824, "epoch": 6889} {"train_loss": -27.800155639648438, "global_step": 571825, "epoch": 6889} {"train_loss": -27.716522216796875, "global_step": 571826, "epoch": 6889} {"train_loss": -28.150543212890625, "global_step": 571827, "epoch": 6889} {"train_loss": -28.222152709960938, "global_step": 571828, "epoch": 6889} {"train_loss": -27.957839965820312, "global_step": 571829, "epoch": 6889} {"train_loss": -27.67677116394043, "global_step": 571830, "epoch": 6889} {"train_loss": -27.959918975830078, "global_step": 571831, "epoch": 6889} {"train_loss": -28.1163272857666, "global_step": 571832, "epoch": 6889} {"train_loss": -28.01443862915039, "global_step": 571833, "epoch": 6889} {"train_loss": -27.751379013061523, "global_step": 571834, "epoch": 6889} {"train_loss": -28.14884376525879, "global_step": 571835, "epoch": 6889} {"train_loss": -28.084613800048828, "global_step": 571836, "epoch": 6889} {"train_loss": -28.164525985717773, "global_step": 571837, "epoch": 6889} {"train_loss": -27.971960067749023, "global_step": 571838, "epoch": 6889} {"train_loss": -27.814416885375977, "global_step": 571839, "epoch": 6889} {"train_loss": -27.749420166015625, "global_step": 571840, "epoch": 6889} {"train_loss": -28.02984619140625, "global_step": 571841, "epoch": 6889} {"train_loss": -28.00892448425293, "global_step": 571842, "epoch": 6889} {"train_loss": -28.176227569580078, "global_step": 571843, "epoch": 6889} {"train_loss": -28.183197021484375, "global_step": 571844, "epoch": 6889} {"train_loss": -27.919843673706055, "global_step": 571845, "epoch": 6889} {"train_loss": -27.990081787109375, "global_step": 571846, "epoch": 6889} {"train_loss": -27.823486328125, "global_step": 571847, "epoch": 6889} {"train_loss": -28.09686279296875, "global_step": 571848, "epoch": 6889} {"train_loss": -27.955163955688477, "global_step": 571849, "epoch": 6889} {"train_loss": -27.070236206054688, "global_step": 571850, "epoch": 6889} {"train_loss": -27.293033599853516, "global_step": 571851, "epoch": 6889} {"train_loss": -27.519001007080078, "global_step": 571852, "epoch": 6889} {"train_loss": -28.281757354736328, "global_step": 571853, "epoch": 6889} {"train_loss": -27.63169288635254, "global_step": 571854, "epoch": 6889} {"train_loss": -27.194904327392578, "global_step": 571855, "epoch": 6889} {"train_loss": -27.726593017578125, "global_step": 571856, "epoch": 6889} {"train_loss": -27.908233642578125, "global_step": 571857, "epoch": 6889} {"train_loss": -27.286376953125, "global_step": 571858, "epoch": 6889} {"train_loss": -27.46625328063965, "global_step": 571859, "epoch": 6889} {"train_loss": -27.82110595703125, "global_step": 571860, "epoch": 6889} {"train_loss": -27.681201934814453, "global_step": 571861, "epoch": 6889} {"train_loss": -27.963525772094727, "global_step": 571862, "epoch": 6889} {"train_loss": -27.892934799194336, "global_step": 571863, "epoch": 6889} {"train_loss": -27.55475425720215, "global_step": 571864, "epoch": 6889} {"train_loss": -27.846872329711914, "global_step": 571865, "epoch": 6889} {"train_loss": -27.774784088134766, "global_step": 571866, "epoch": 6889} {"train_loss": -27.65058708190918, "global_step": 571867, "epoch": 6889} {"train_loss": -27.956039428710938, "global_step": 571868, "epoch": 6889} {"train_loss": -27.795933895800488, "global_step": 571869, "epoch": 6889, "val_loss": 6417301.5} {"train_loss": -27.361083984375, "global_step": 571870, "epoch": 6890} {"train_loss": -27.083606719970703, "global_step": 571871, "epoch": 6890} {"train_loss": -27.621850967407227, "global_step": 571872, "epoch": 6890} {"train_loss": -27.148136138916016, "global_step": 571873, "epoch": 6890} {"train_loss": -27.638425827026367, "global_step": 571874, "epoch": 6890} {"train_loss": -27.448450088500977, "global_step": 571875, "epoch": 6890} {"train_loss": -27.566070556640625, "global_step": 571876, "epoch": 6890} {"train_loss": -28.0093994140625, "global_step": 571877, "epoch": 6890} {"train_loss": -27.869892120361328, "global_step": 571878, "epoch": 6890} {"train_loss": -27.29684829711914, "global_step": 571879, "epoch": 6890} {"train_loss": -27.82205581665039, "global_step": 571880, "epoch": 6890} {"train_loss": -27.692630767822266, "global_step": 571881, "epoch": 6890} {"train_loss": -27.547170639038086, "global_step": 571882, "epoch": 6890} {"train_loss": -27.838163375854492, "global_step": 571883, "epoch": 6890} {"train_loss": -27.894062042236328, "global_step": 571884, "epoch": 6890} {"train_loss": -27.544172286987305, "global_step": 571885, "epoch": 6890} {"train_loss": -28.147302627563477, "global_step": 571886, "epoch": 6890} {"train_loss": -27.9614315032959, "global_step": 571887, "epoch": 6890} {"train_loss": -27.96628189086914, "global_step": 571888, "epoch": 6890} {"train_loss": -27.837934494018555, "global_step": 571889, "epoch": 6890} {"train_loss": -27.7059326171875, "global_step": 571890, "epoch": 6890} {"train_loss": -27.908044815063477, "global_step": 571891, "epoch": 6890} {"train_loss": -27.849027633666992, "global_step": 571892, "epoch": 6890} {"train_loss": -28.025659561157227, "global_step": 571893, "epoch": 6890} {"train_loss": -27.69527244567871, "global_step": 571894, "epoch": 6890} {"train_loss": -27.885583877563477, "global_step": 571895, "epoch": 6890} {"train_loss": -27.83649253845215, "global_step": 571896, "epoch": 6890} {"train_loss": -27.56475257873535, "global_step": 571897, "epoch": 6890} {"train_loss": -28.132558822631836, "global_step": 571898, "epoch": 6890} {"train_loss": -28.120731353759766, "global_step": 571899, "epoch": 6890} {"train_loss": -27.57793617248535, "global_step": 571900, "epoch": 6890} {"train_loss": -27.850610733032227, "global_step": 571901, "epoch": 6890} {"train_loss": -27.906476974487305, "global_step": 571902, "epoch": 6890} {"train_loss": -27.837238311767578, "global_step": 571903, "epoch": 6890} {"train_loss": -27.701339721679688, "global_step": 571904, "epoch": 6890} {"train_loss": -28.014312744140625, "global_step": 571905, "epoch": 6890} {"train_loss": -28.034711837768555, "global_step": 571906, "epoch": 6890} {"train_loss": -28.116287231445312, "global_step": 571907, "epoch": 6890} {"train_loss": -27.841602325439453, "global_step": 571908, "epoch": 6890} {"train_loss": -27.745532989501953, "global_step": 571909, "epoch": 6890} {"train_loss": -27.268085479736328, "global_step": 571910, "epoch": 6890} {"train_loss": -27.536334991455078, "global_step": 571911, "epoch": 6890} {"train_loss": -27.39374351501465, "global_step": 571912, "epoch": 6890} {"train_loss": -28.02765464782715, "global_step": 571913, "epoch": 6890} {"train_loss": -27.261798858642578, "global_step": 571914, "epoch": 6890} {"train_loss": -27.381103515625, "global_step": 571915, "epoch": 6890} {"train_loss": -27.450754165649414, "global_step": 571916, "epoch": 6890} {"train_loss": -27.736169815063477, "global_step": 571917, "epoch": 6890} {"train_loss": -27.69416618347168, "global_step": 571918, "epoch": 6890} {"train_loss": -28.084875106811523, "global_step": 571919, "epoch": 6890} {"train_loss": -27.484405517578125, "global_step": 571920, "epoch": 6890} {"train_loss": -27.81024169921875, "global_step": 571921, "epoch": 6890} {"train_loss": -27.16596794128418, "global_step": 571922, "epoch": 6890} {"train_loss": -27.639480590820312, "global_step": 571923, "epoch": 6890} {"train_loss": -27.399412155151367, "global_step": 571924, "epoch": 6890} {"train_loss": -27.530088424682617, "global_step": 571925, "epoch": 6890} {"train_loss": -27.843076705932617, "global_step": 571926, "epoch": 6890} {"train_loss": -27.46430015563965, "global_step": 571927, "epoch": 6890} {"train_loss": -27.486474990844727, "global_step": 571928, "epoch": 6890} {"train_loss": -27.852741241455078, "global_step": 571929, "epoch": 6890} {"train_loss": -27.64002799987793, "global_step": 571930, "epoch": 6890} {"train_loss": -27.69752311706543, "global_step": 571931, "epoch": 6890} {"train_loss": -27.575952529907227, "global_step": 571932, "epoch": 6890} {"train_loss": -27.458084106445312, "global_step": 571933, "epoch": 6890} {"train_loss": -27.8166561126709, "global_step": 571934, "epoch": 6890} {"train_loss": -27.722543716430664, "global_step": 571935, "epoch": 6890} {"train_loss": -27.87763023376465, "global_step": 571936, "epoch": 6890} {"train_loss": -27.826019287109375, "global_step": 571937, "epoch": 6890} {"train_loss": -27.485401153564453, "global_step": 571938, "epoch": 6890} {"train_loss": -27.612262725830078, "global_step": 571939, "epoch": 6890} {"train_loss": -27.737720489501953, "global_step": 571940, "epoch": 6890} {"train_loss": -27.849075317382812, "global_step": 571941, "epoch": 6890} {"train_loss": -27.91036033630371, "global_step": 571942, "epoch": 6890} {"train_loss": -28.122873306274414, "global_step": 571943, "epoch": 6890} {"train_loss": -27.895252227783203, "global_step": 571944, "epoch": 6890} {"train_loss": -27.7148380279541, "global_step": 571945, "epoch": 6890} {"train_loss": -27.908899307250977, "global_step": 571946, "epoch": 6890} {"train_loss": -27.9970645904541, "global_step": 571947, "epoch": 6890} {"train_loss": -27.54093360900879, "global_step": 571948, "epoch": 6890} {"train_loss": -28.4558162689209, "global_step": 571949, "epoch": 6890} {"train_loss": -27.639495849609375, "global_step": 571950, "epoch": 6890} {"train_loss": -28.031702041625977, "global_step": 571951, "epoch": 6890} {"train_loss": -27.718431197017072, "global_step": 571952, "epoch": 6890, "val_loss": 6435490.0} {"train_loss": -27.53657341003418, "global_step": 571953, "epoch": 6891} {"train_loss": -27.192922592163086, "global_step": 571954, "epoch": 6891} {"train_loss": -26.42474365234375, "global_step": 571955, "epoch": 6891} {"train_loss": -26.919469833374023, "global_step": 571956, "epoch": 6891} {"train_loss": -27.244165420532227, "global_step": 571957, "epoch": 6891} {"train_loss": -26.4156551361084, "global_step": 571958, "epoch": 6891} {"train_loss": -26.614776611328125, "global_step": 571959, "epoch": 6891} {"train_loss": -27.48394775390625, "global_step": 571960, "epoch": 6891} {"train_loss": -26.862445831298828, "global_step": 571961, "epoch": 6891} {"train_loss": -27.43584632873535, "global_step": 571962, "epoch": 6891} {"train_loss": -27.209537506103516, "global_step": 571963, "epoch": 6891} {"train_loss": -27.876148223876953, "global_step": 571964, "epoch": 6891} {"train_loss": -26.901981353759766, "global_step": 571965, "epoch": 6891} {"train_loss": -27.277679443359375, "global_step": 571966, "epoch": 6891} {"train_loss": -27.438058853149414, "global_step": 571967, "epoch": 6891} {"train_loss": -27.611242294311523, "global_step": 571968, "epoch": 6891} {"train_loss": -27.20838737487793, "global_step": 571969, "epoch": 6891} {"train_loss": -27.361047744750977, "global_step": 571970, "epoch": 6891} {"train_loss": -27.774738311767578, "global_step": 571971, "epoch": 6891} {"train_loss": -27.3382568359375, "global_step": 571972, "epoch": 6891} {"train_loss": -27.357946395874023, "global_step": 571973, "epoch": 6891} {"train_loss": -27.56422233581543, "global_step": 571974, "epoch": 6891} {"train_loss": -27.76923942565918, "global_step": 571975, "epoch": 6891} {"train_loss": -28.004438400268555, "global_step": 571976, "epoch": 6891} {"train_loss": -27.811573028564453, "global_step": 571977, "epoch": 6891} {"train_loss": -27.53873634338379, "global_step": 571978, "epoch": 6891} {"train_loss": -27.800989151000977, "global_step": 571979, "epoch": 6891} {"train_loss": -28.075794219970703, "global_step": 571980, "epoch": 6891} {"train_loss": -27.597360610961914, "global_step": 571981, "epoch": 6891} {"train_loss": -27.75921630859375, "global_step": 571982, "epoch": 6891} {"train_loss": -27.76787757873535, "global_step": 571983, "epoch": 6891} {"train_loss": -27.90610694885254, "global_step": 571984, "epoch": 6891} {"train_loss": -27.5284481048584, "global_step": 571985, "epoch": 6891} {"train_loss": -27.480661392211914, "global_step": 571986, "epoch": 6891} {"train_loss": -27.619611740112305, "global_step": 571987, "epoch": 6891} {"train_loss": -27.563003540039062, "global_step": 571988, "epoch": 6891} {"train_loss": -27.741718292236328, "global_step": 571989, "epoch": 6891} {"train_loss": -27.134069442749023, "global_step": 571990, "epoch": 6891} {"train_loss": -27.296613693237305, "global_step": 571991, "epoch": 6891} {"train_loss": -28.10407829284668, "global_step": 571992, "epoch": 6891} {"train_loss": -28.162817001342773, "global_step": 571993, "epoch": 6891} {"train_loss": -27.681150436401367, "global_step": 571994, "epoch": 6891} {"train_loss": -27.843204498291016, "global_step": 571995, "epoch": 6891} {"train_loss": -27.928476333618164, "global_step": 571996, "epoch": 6891} {"train_loss": -27.6718692779541, "global_step": 571997, "epoch": 6891} {"train_loss": -27.380746841430664, "global_step": 571998, "epoch": 6891} {"train_loss": -27.729385375976562, "global_step": 571999, "epoch": 6891} {"train_loss": -28.10163688659668, "global_step": 572000, "epoch": 6891} {"train_loss": -27.83253288269043, "global_step": 572001, "epoch": 6891} {"train_loss": -28.30580711364746, "global_step": 572002, "epoch": 6891} {"train_loss": -27.871658325195312, "global_step": 572003, "epoch": 6891} {"train_loss": -28.0487060546875, "global_step": 572004, "epoch": 6891} {"train_loss": -27.821182250976562, "global_step": 572005, "epoch": 6891} {"train_loss": -27.945850372314453, "global_step": 572006, "epoch": 6891} {"train_loss": -28.020221710205078, "global_step": 572007, "epoch": 6891} {"train_loss": -27.799972534179688, "global_step": 572008, "epoch": 6891} {"train_loss": -27.789947509765625, "global_step": 572009, "epoch": 6891} {"train_loss": -27.862913131713867, "global_step": 572010, "epoch": 6891} {"train_loss": -28.287519454956055, "global_step": 572011, "epoch": 6891} {"train_loss": -27.9173641204834, "global_step": 572012, "epoch": 6891} {"train_loss": -27.96156883239746, "global_step": 572013, "epoch": 6891} {"train_loss": -28.197797775268555, "global_step": 572014, "epoch": 6891} {"train_loss": -27.78850746154785, "global_step": 572015, "epoch": 6891} {"train_loss": -28.064462661743164, "global_step": 572016, "epoch": 6891} {"train_loss": -28.091480255126953, "global_step": 572017, "epoch": 6891} {"train_loss": -28.289859771728516, "global_step": 572018, "epoch": 6891} {"train_loss": -27.74991798400879, "global_step": 572019, "epoch": 6891} {"train_loss": -28.035619735717773, "global_step": 572020, "epoch": 6891} {"train_loss": -27.847000122070312, "global_step": 572021, "epoch": 6891} {"train_loss": -28.152769088745117, "global_step": 572022, "epoch": 6891} {"train_loss": -27.825321197509766, "global_step": 572023, "epoch": 6891} {"train_loss": -27.9735107421875, "global_step": 572024, "epoch": 6891} {"train_loss": -27.951635360717773, "global_step": 572025, "epoch": 6891} {"train_loss": -27.812454223632812, "global_step": 572026, "epoch": 6891} {"train_loss": -28.0595645904541, "global_step": 572027, "epoch": 6891} {"train_loss": -28.228845596313477, "global_step": 572028, "epoch": 6891} {"train_loss": -28.081029891967773, "global_step": 572029, "epoch": 6891} {"train_loss": -27.91560173034668, "global_step": 572030, "epoch": 6891} {"train_loss": -27.982685089111328, "global_step": 572031, "epoch": 6891} {"train_loss": -27.94477653503418, "global_step": 572032, "epoch": 6891} {"train_loss": -27.92780876159668, "global_step": 572033, "epoch": 6891} {"train_loss": -27.872095108032227, "global_step": 572034, "epoch": 6891} {"train_loss": -27.702974756079985, "global_step": 572035, "epoch": 6891, "val_loss": 6486459.0} {"train_loss": -27.39535903930664, "global_step": 572036, "epoch": 6892} {"train_loss": -27.175954818725586, "global_step": 572037, "epoch": 6892} {"train_loss": -27.531896591186523, "global_step": 572038, "epoch": 6892} {"train_loss": -27.620161056518555, "global_step": 572039, "epoch": 6892} {"train_loss": -27.422452926635742, "global_step": 572040, "epoch": 6892} {"train_loss": -27.279815673828125, "global_step": 572041, "epoch": 6892} {"train_loss": -27.468915939331055, "global_step": 572042, "epoch": 6892} {"train_loss": -26.984241485595703, "global_step": 572043, "epoch": 6892} {"train_loss": -27.652942657470703, "global_step": 572044, "epoch": 6892} {"train_loss": -27.537384033203125, "global_step": 572045, "epoch": 6892} {"train_loss": -27.379735946655273, "global_step": 572046, "epoch": 6892} {"train_loss": -27.7392578125, "global_step": 572047, "epoch": 6892} {"train_loss": -27.248798370361328, "global_step": 572048, "epoch": 6892} {"train_loss": -27.50396156311035, "global_step": 572049, "epoch": 6892} {"train_loss": -27.439477920532227, "global_step": 572050, "epoch": 6892} {"train_loss": -27.794208526611328, "global_step": 572051, "epoch": 6892} {"train_loss": -27.489343643188477, "global_step": 572052, "epoch": 6892} {"train_loss": -27.561908721923828, "global_step": 572053, "epoch": 6892} {"train_loss": -27.378705978393555, "global_step": 572054, "epoch": 6892} {"train_loss": -27.634140014648438, "global_step": 572055, "epoch": 6892} {"train_loss": -27.926055908203125, "global_step": 572056, "epoch": 6892} {"train_loss": -27.566492080688477, "global_step": 572057, "epoch": 6892} {"train_loss": -27.882186889648438, "global_step": 572058, "epoch": 6892} {"train_loss": -27.75845718383789, "global_step": 572059, "epoch": 6892} {"train_loss": -27.483245849609375, "global_step": 572060, "epoch": 6892} {"train_loss": -27.617908477783203, "global_step": 572061, "epoch": 6892} {"train_loss": -27.75811767578125, "global_step": 572062, "epoch": 6892} {"train_loss": -27.725982666015625, "global_step": 572063, "epoch": 6892} {"train_loss": -28.0410213470459, "global_step": 572064, "epoch": 6892} {"train_loss": -27.94028091430664, "global_step": 572065, "epoch": 6892} {"train_loss": -27.894073486328125, "global_step": 572066, "epoch": 6892} {"train_loss": -27.79315185546875, "global_step": 572067, "epoch": 6892} {"train_loss": -27.946334838867188, "global_step": 572068, "epoch": 6892} {"train_loss": -27.924625396728516, "global_step": 572069, "epoch": 6892} {"train_loss": -27.947269439697266, "global_step": 572070, "epoch": 6892} {"train_loss": -27.730457305908203, "global_step": 572071, "epoch": 6892} {"train_loss": -27.998260498046875, "global_step": 572072, "epoch": 6892} {"train_loss": -28.107105255126953, "global_step": 572073, "epoch": 6892} {"train_loss": -27.99017906188965, "global_step": 572074, "epoch": 6892} {"train_loss": -28.10503578186035, "global_step": 572075, "epoch": 6892} {"train_loss": -28.0056095123291, "global_step": 572076, "epoch": 6892} {"train_loss": -27.77933120727539, "global_step": 572077, "epoch": 6892} {"train_loss": -27.95574951171875, "global_step": 572078, "epoch": 6892} {"train_loss": -27.830535888671875, "global_step": 572079, "epoch": 6892} {"train_loss": -27.732807159423828, "global_step": 572080, "epoch": 6892} {"train_loss": -28.135990142822266, "global_step": 572081, "epoch": 6892} {"train_loss": -27.93448829650879, "global_step": 572082, "epoch": 6892} {"train_loss": -27.82474136352539, "global_step": 572083, "epoch": 6892} {"train_loss": -28.057607650756836, "global_step": 572084, "epoch": 6892} {"train_loss": -27.561033248901367, "global_step": 572085, "epoch": 6892} {"train_loss": -27.56925392150879, "global_step": 572086, "epoch": 6892} {"train_loss": -27.84232521057129, "global_step": 572087, "epoch": 6892} {"train_loss": -28.026554107666016, "global_step": 572088, "epoch": 6892} {"train_loss": -28.3100643157959, "global_step": 572089, "epoch": 6892} {"train_loss": -27.809894561767578, "global_step": 572090, "epoch": 6892} {"train_loss": -27.65287208557129, "global_step": 572091, "epoch": 6892} {"train_loss": -27.3043155670166, "global_step": 572092, "epoch": 6892} {"train_loss": -27.854063034057617, "global_step": 572093, "epoch": 6892} {"train_loss": -28.09647560119629, "global_step": 572094, "epoch": 6892} {"train_loss": -27.823932647705078, "global_step": 572095, "epoch": 6892} {"train_loss": -27.8975830078125, "global_step": 572096, "epoch": 6892} {"train_loss": -27.663354873657227, "global_step": 572097, "epoch": 6892} {"train_loss": -27.69477653503418, "global_step": 572098, "epoch": 6892} {"train_loss": -28.045557022094727, "global_step": 572099, "epoch": 6892} {"train_loss": -27.51727294921875, "global_step": 572100, "epoch": 6892} {"train_loss": -27.82230567932129, "global_step": 572101, "epoch": 6892} {"train_loss": -27.91471290588379, "global_step": 572102, "epoch": 6892} {"train_loss": -27.760496139526367, "global_step": 572103, "epoch": 6892} {"train_loss": -27.861621856689453, "global_step": 572104, "epoch": 6892} {"train_loss": -27.363758087158203, "global_step": 572105, "epoch": 6892} {"train_loss": -27.879302978515625, "global_step": 572106, "epoch": 6892} {"train_loss": -27.84075927734375, "global_step": 572107, "epoch": 6892} {"train_loss": -27.695556640625, "global_step": 572108, "epoch": 6892} {"train_loss": -27.721933364868164, "global_step": 572109, "epoch": 6892} {"train_loss": -27.76171875, "global_step": 572110, "epoch": 6892} {"train_loss": -27.368284225463867, "global_step": 572111, "epoch": 6892} {"train_loss": -27.656356811523438, "global_step": 572112, "epoch": 6892} {"train_loss": -27.758970260620117, "global_step": 572113, "epoch": 6892} {"train_loss": -27.98470115661621, "global_step": 572114, "epoch": 6892} {"train_loss": -27.317874908447266, "global_step": 572115, "epoch": 6892} {"train_loss": -27.905759811401367, "global_step": 572116, "epoch": 6892} {"train_loss": -28.00090980529785, "global_step": 572117, "epoch": 6892} {"train_loss": -27.730779624847045, "global_step": 572118, "epoch": 6892, "val_loss": 6531068.0} {"train_loss": -26.763153076171875, "global_step": 572119, "epoch": 6893} {"train_loss": -27.17877769470215, "global_step": 572120, "epoch": 6893} {"train_loss": -27.302997589111328, "global_step": 572121, "epoch": 6893} {"train_loss": -26.719924926757812, "global_step": 572122, "epoch": 6893} {"train_loss": -26.902145385742188, "global_step": 572123, "epoch": 6893} {"train_loss": -27.226144790649414, "global_step": 572124, "epoch": 6893} {"train_loss": -27.187122344970703, "global_step": 572125, "epoch": 6893} {"train_loss": -27.47941017150879, "global_step": 572126, "epoch": 6893} {"train_loss": -26.887537002563477, "global_step": 572127, "epoch": 6893} {"train_loss": -27.27382469177246, "global_step": 572128, "epoch": 6893} {"train_loss": -27.25986099243164, "global_step": 572129, "epoch": 6893} {"train_loss": -27.261066436767578, "global_step": 572130, "epoch": 6893} {"train_loss": -27.396203994750977, "global_step": 572131, "epoch": 6893} {"train_loss": -27.103515625, "global_step": 572132, "epoch": 6893} {"train_loss": -27.684635162353516, "global_step": 572133, "epoch": 6893} {"train_loss": -27.34705924987793, "global_step": 572134, "epoch": 6893} {"train_loss": -27.43971061706543, "global_step": 572135, "epoch": 6893} {"train_loss": -27.258825302124023, "global_step": 572136, "epoch": 6893} {"train_loss": -27.703205108642578, "global_step": 572137, "epoch": 6893} {"train_loss": -27.750120162963867, "global_step": 572138, "epoch": 6893} {"train_loss": -27.690237045288086, "global_step": 572139, "epoch": 6893} {"train_loss": -27.370853424072266, "global_step": 572140, "epoch": 6893} {"train_loss": -27.79221534729004, "global_step": 572141, "epoch": 6893} {"train_loss": -27.583532333374023, "global_step": 572142, "epoch": 6893} {"train_loss": -27.8728084564209, "global_step": 572143, "epoch": 6893} {"train_loss": -27.763818740844727, "global_step": 572144, "epoch": 6893} {"train_loss": -27.709766387939453, "global_step": 572145, "epoch": 6893} {"train_loss": -27.661151885986328, "global_step": 572146, "epoch": 6893} {"train_loss": -27.472171783447266, "global_step": 572147, "epoch": 6893} {"train_loss": -27.92877197265625, "global_step": 572148, "epoch": 6893} {"train_loss": -27.814956665039062, "global_step": 572149, "epoch": 6893} {"train_loss": -27.868896484375, "global_step": 572150, "epoch": 6893} {"train_loss": -27.42826271057129, "global_step": 572151, "epoch": 6893} {"train_loss": -27.700836181640625, "global_step": 572152, "epoch": 6893} {"train_loss": -27.581958770751953, "global_step": 572153, "epoch": 6893} {"train_loss": -28.094282150268555, "global_step": 572154, "epoch": 6893} {"train_loss": -27.721881866455078, "global_step": 572155, "epoch": 6893} {"train_loss": -27.878482818603516, "global_step": 572156, "epoch": 6893} {"train_loss": -28.078384399414062, "global_step": 572157, "epoch": 6893} {"train_loss": -27.807392120361328, "global_step": 572158, "epoch": 6893} {"train_loss": -28.1110897064209, "global_step": 572159, "epoch": 6893} {"train_loss": -28.264469146728516, "global_step": 572160, "epoch": 6893} {"train_loss": -27.750263214111328, "global_step": 572161, "epoch": 6893} {"train_loss": -27.796621322631836, "global_step": 572162, "epoch": 6893} {"train_loss": -28.36739158630371, "global_step": 572163, "epoch": 6893} {"train_loss": -28.064289093017578, "global_step": 572164, "epoch": 6893} {"train_loss": -27.804523468017578, "global_step": 572165, "epoch": 6893} {"train_loss": -28.200220108032227, "global_step": 572166, "epoch": 6893} {"train_loss": -28.408157348632812, "global_step": 572167, "epoch": 6893} {"train_loss": -27.912261962890625, "global_step": 572168, "epoch": 6893} {"train_loss": -28.254430770874023, "global_step": 572169, "epoch": 6893} {"train_loss": -27.992313385009766, "global_step": 572170, "epoch": 6893} {"train_loss": -28.074615478515625, "global_step": 572171, "epoch": 6893} {"train_loss": -28.148778915405273, "global_step": 572172, "epoch": 6893} {"train_loss": -27.743408203125, "global_step": 572173, "epoch": 6893} {"train_loss": -27.2409725189209, "global_step": 572174, "epoch": 6893} {"train_loss": -26.747039794921875, "global_step": 572175, "epoch": 6893} {"train_loss": -27.033817291259766, "global_step": 572176, "epoch": 6893} {"train_loss": -27.7871150970459, "global_step": 572177, "epoch": 6893} {"train_loss": -28.141162872314453, "global_step": 572178, "epoch": 6893} {"train_loss": -27.72273063659668, "global_step": 572179, "epoch": 6893} {"train_loss": -27.482481002807617, "global_step": 572180, "epoch": 6893} {"train_loss": -27.608972549438477, "global_step": 572181, "epoch": 6893} {"train_loss": -27.805225372314453, "global_step": 572182, "epoch": 6893} {"train_loss": -27.541406631469727, "global_step": 572183, "epoch": 6893} {"train_loss": -27.570585250854492, "global_step": 572184, "epoch": 6893} {"train_loss": -27.891681671142578, "global_step": 572185, "epoch": 6893} {"train_loss": -27.757282257080078, "global_step": 572186, "epoch": 6893} {"train_loss": -27.89399528503418, "global_step": 572187, "epoch": 6893} {"train_loss": -27.886859893798828, "global_step": 572188, "epoch": 6893} {"train_loss": -27.70965003967285, "global_step": 572189, "epoch": 6893} {"train_loss": -27.781286239624023, "global_step": 572190, "epoch": 6893} {"train_loss": -27.99066734313965, "global_step": 572191, "epoch": 6893} {"train_loss": -27.752134323120117, "global_step": 572192, "epoch": 6893} {"train_loss": -28.018680572509766, "global_step": 572193, "epoch": 6893} {"train_loss": -28.252212524414062, "global_step": 572194, "epoch": 6893} {"train_loss": -27.967029571533203, "global_step": 572195, "epoch": 6893} {"train_loss": -27.69325065612793, "global_step": 572196, "epoch": 6893} {"train_loss": -28.084875106811523, "global_step": 572197, "epoch": 6893} {"train_loss": -28.052734375, "global_step": 572198, "epoch": 6893} {"train_loss": -27.9853572845459, "global_step": 572199, "epoch": 6893} {"train_loss": -27.755542755126953, "global_step": 572200, "epoch": 6893} {"train_loss": -27.70434885139925, "global_step": 572201, "epoch": 6893, "val_loss": 6426612.5} {"train_loss": -27.459692001342773, "global_step": 572202, "epoch": 6894} {"train_loss": -27.155517578125, "global_step": 572203, "epoch": 6894} {"train_loss": -27.04363441467285, "global_step": 572204, "epoch": 6894} {"train_loss": -26.65860366821289, "global_step": 572205, "epoch": 6894} {"train_loss": -26.578420639038086, "global_step": 572206, "epoch": 6894} {"train_loss": -27.217884063720703, "global_step": 572207, "epoch": 6894} {"train_loss": -27.47346305847168, "global_step": 572208, "epoch": 6894} {"train_loss": -27.3940486907959, "global_step": 572209, "epoch": 6894} {"train_loss": -26.9544677734375, "global_step": 572210, "epoch": 6894} {"train_loss": -27.702377319335938, "global_step": 572211, "epoch": 6894} {"train_loss": -27.483091354370117, "global_step": 572212, "epoch": 6894} {"train_loss": -27.771238327026367, "global_step": 572213, "epoch": 6894} {"train_loss": -27.6451416015625, "global_step": 572214, "epoch": 6894} {"train_loss": -27.34876823425293, "global_step": 572215, "epoch": 6894} {"train_loss": -27.723068237304688, "global_step": 572216, "epoch": 6894} {"train_loss": -27.452667236328125, "global_step": 572217, "epoch": 6894} {"train_loss": -27.864133834838867, "global_step": 572218, "epoch": 6894} {"train_loss": -27.999786376953125, "global_step": 572219, "epoch": 6894} {"train_loss": -27.608808517456055, "global_step": 572220, "epoch": 6894} {"train_loss": -27.85638427734375, "global_step": 572221, "epoch": 6894} {"train_loss": -27.475513458251953, "global_step": 572222, "epoch": 6894} {"train_loss": -27.681737899780273, "global_step": 572223, "epoch": 6894} {"train_loss": -27.74114990234375, "global_step": 572224, "epoch": 6894} {"train_loss": -28.0538330078125, "global_step": 572225, "epoch": 6894} {"train_loss": -28.031543731689453, "global_step": 572226, "epoch": 6894} {"train_loss": -27.86515235900879, "global_step": 572227, "epoch": 6894} {"train_loss": -27.945966720581055, "global_step": 572228, "epoch": 6894} {"train_loss": -28.026386260986328, "global_step": 572229, "epoch": 6894} {"train_loss": -27.9505558013916, "global_step": 572230, "epoch": 6894} {"train_loss": -27.483301162719727, "global_step": 572231, "epoch": 6894} {"train_loss": -27.821874618530273, "global_step": 572232, "epoch": 6894} {"train_loss": -27.916868209838867, "global_step": 572233, "epoch": 6894} {"train_loss": -27.98674964904785, "global_step": 572234, "epoch": 6894} {"train_loss": -27.961973190307617, "global_step": 572235, "epoch": 6894} {"train_loss": -27.52081871032715, "global_step": 572236, "epoch": 6894} {"train_loss": -28.090595245361328, "global_step": 572237, "epoch": 6894} {"train_loss": -27.224096298217773, "global_step": 572238, "epoch": 6894} {"train_loss": -27.7853946685791, "global_step": 572239, "epoch": 6894} {"train_loss": -28.142126083374023, "global_step": 572240, "epoch": 6894} {"train_loss": -27.843830108642578, "global_step": 572241, "epoch": 6894} {"train_loss": -27.92626953125, "global_step": 572242, "epoch": 6894} {"train_loss": -27.9415340423584, "global_step": 572243, "epoch": 6894} {"train_loss": -28.16607093811035, "global_step": 572244, "epoch": 6894} {"train_loss": -28.0782413482666, "global_step": 572245, "epoch": 6894} {"train_loss": -28.022993087768555, "global_step": 572246, "epoch": 6894} {"train_loss": -28.284780502319336, "global_step": 572247, "epoch": 6894} {"train_loss": -28.454431533813477, "global_step": 572248, "epoch": 6894} {"train_loss": -28.30078125, "global_step": 572249, "epoch": 6894} {"train_loss": -28.01051139831543, "global_step": 572250, "epoch": 6894} {"train_loss": -28.277393341064453, "global_step": 572251, "epoch": 6894} {"train_loss": -27.6312255859375, "global_step": 572252, "epoch": 6894} {"train_loss": -28.291284561157227, "global_step": 572253, "epoch": 6894} {"train_loss": -27.462095260620117, "global_step": 572254, "epoch": 6894} {"train_loss": -27.12751579284668, "global_step": 572255, "epoch": 6894} {"train_loss": -27.333099365234375, "global_step": 572256, "epoch": 6894} {"train_loss": -27.886255264282227, "global_step": 572257, "epoch": 6894} {"train_loss": -27.595563888549805, "global_step": 572258, "epoch": 6894} {"train_loss": -27.417312622070312, "global_step": 572259, "epoch": 6894} {"train_loss": -27.76535987854004, "global_step": 572260, "epoch": 6894} {"train_loss": -28.105127334594727, "global_step": 572261, "epoch": 6894} {"train_loss": -27.720693588256836, "global_step": 572262, "epoch": 6894} {"train_loss": -27.87615394592285, "global_step": 572263, "epoch": 6894} {"train_loss": -28.104724884033203, "global_step": 572264, "epoch": 6894} {"train_loss": -27.863691329956055, "global_step": 572265, "epoch": 6894} {"train_loss": -28.64470863342285, "global_step": 572266, "epoch": 6894} {"train_loss": -28.125537872314453, "global_step": 572267, "epoch": 6894} {"train_loss": -27.63362693786621, "global_step": 572268, "epoch": 6894} {"train_loss": -27.851171493530273, "global_step": 572269, "epoch": 6894} {"train_loss": -27.727441787719727, "global_step": 572270, "epoch": 6894} {"train_loss": -27.92856216430664, "global_step": 572271, "epoch": 6894} {"train_loss": -28.034082412719727, "global_step": 572272, "epoch": 6894} {"train_loss": -27.827056884765625, "global_step": 572273, "epoch": 6894} {"train_loss": -27.944477081298828, "global_step": 572274, "epoch": 6894} {"train_loss": -28.117475509643555, "global_step": 572275, "epoch": 6894} {"train_loss": -27.425405502319336, "global_step": 572276, "epoch": 6894} {"train_loss": -27.44879722595215, "global_step": 572277, "epoch": 6894} {"train_loss": -28.22665786743164, "global_step": 572278, "epoch": 6894} {"train_loss": -27.916624069213867, "global_step": 572279, "epoch": 6894} {"train_loss": -27.58002281188965, "global_step": 572280, "epoch": 6894} {"train_loss": -27.754255294799805, "global_step": 572281, "epoch": 6894} {"train_loss": -27.839710235595703, "global_step": 572282, "epoch": 6894} {"train_loss": -27.89185905456543, "global_step": 572283, "epoch": 6894} {"train_loss": -27.76635643373053, "global_step": 572284, "epoch": 6894, "val_loss": 6430105.0} {"train_loss": -27.5767822265625, "global_step": 572285, "epoch": 6895} {"train_loss": -27.436559677124023, "global_step": 572286, "epoch": 6895} {"train_loss": -27.019256591796875, "global_step": 572287, "epoch": 6895} {"train_loss": -27.05230140686035, "global_step": 572288, "epoch": 6895} {"train_loss": -26.981735229492188, "global_step": 572289, "epoch": 6895} {"train_loss": -27.554410934448242, "global_step": 572290, "epoch": 6895} {"train_loss": -27.114532470703125, "global_step": 572291, "epoch": 6895} {"train_loss": -27.308074951171875, "global_step": 572292, "epoch": 6895} {"train_loss": -27.43442726135254, "global_step": 572293, "epoch": 6895} {"train_loss": -27.422510147094727, "global_step": 572294, "epoch": 6895} {"train_loss": -27.51641273498535, "global_step": 572295, "epoch": 6895} {"train_loss": -27.59407615661621, "global_step": 572296, "epoch": 6895} {"train_loss": -27.62094497680664, "global_step": 572297, "epoch": 6895} {"train_loss": -27.6867733001709, "global_step": 572298, "epoch": 6895} {"train_loss": -27.444229125976562, "global_step": 572299, "epoch": 6895} {"train_loss": -27.825918197631836, "global_step": 572300, "epoch": 6895} {"train_loss": -27.79355239868164, "global_step": 572301, "epoch": 6895} {"train_loss": -27.65097999572754, "global_step": 572302, "epoch": 6895} {"train_loss": -27.973709106445312, "global_step": 572303, "epoch": 6895} {"train_loss": -27.664920806884766, "global_step": 572304, "epoch": 6895} {"train_loss": -27.680866241455078, "global_step": 572305, "epoch": 6895} {"train_loss": -27.868240356445312, "global_step": 572306, "epoch": 6895} {"train_loss": -27.691614151000977, "global_step": 572307, "epoch": 6895} {"train_loss": -27.83979606628418, "global_step": 572308, "epoch": 6895} {"train_loss": -27.86669921875, "global_step": 572309, "epoch": 6895} {"train_loss": -27.968616485595703, "global_step": 572310, "epoch": 6895} {"train_loss": -27.9958438873291, "global_step": 572311, "epoch": 6895} {"train_loss": -27.89815330505371, "global_step": 572312, "epoch": 6895} {"train_loss": -27.958850860595703, "global_step": 572313, "epoch": 6895} {"train_loss": -27.837696075439453, "global_step": 572314, "epoch": 6895} {"train_loss": -28.145715713500977, "global_step": 572315, "epoch": 6895} {"train_loss": -28.012115478515625, "global_step": 572316, "epoch": 6895} {"train_loss": -27.980661392211914, "global_step": 572317, "epoch": 6895} {"train_loss": -27.576765060424805, "global_step": 572318, "epoch": 6895} {"train_loss": -27.850202560424805, "global_step": 572319, "epoch": 6895} {"train_loss": -27.52557945251465, "global_step": 572320, "epoch": 6895} {"train_loss": -27.98870277404785, "global_step": 572321, "epoch": 6895} {"train_loss": -27.916662216186523, "global_step": 572322, "epoch": 6895} {"train_loss": -28.175622940063477, "global_step": 572323, "epoch": 6895} {"train_loss": -28.02728271484375, "global_step": 572324, "epoch": 6895} {"train_loss": -28.2914981842041, "global_step": 572325, "epoch": 6895} {"train_loss": -27.93153190612793, "global_step": 572326, "epoch": 6895} {"train_loss": -27.732343673706055, "global_step": 572327, "epoch": 6895} {"train_loss": -27.572742462158203, "global_step": 572328, "epoch": 6895} {"train_loss": -27.553924560546875, "global_step": 572329, "epoch": 6895} {"train_loss": -28.20734977722168, "global_step": 572330, "epoch": 6895} {"train_loss": -28.30963134765625, "global_step": 572331, "epoch": 6895} {"train_loss": -28.224445343017578, "global_step": 572332, "epoch": 6895} {"train_loss": -27.99555015563965, "global_step": 572333, "epoch": 6895} {"train_loss": -27.704172134399414, "global_step": 572334, "epoch": 6895} {"train_loss": -28.05100440979004, "global_step": 572335, "epoch": 6895} {"train_loss": -28.29703712463379, "global_step": 572336, "epoch": 6895} {"train_loss": -28.1308650970459, "global_step": 572337, "epoch": 6895} {"train_loss": -27.839374542236328, "global_step": 572338, "epoch": 6895} {"train_loss": -27.969959259033203, "global_step": 572339, "epoch": 6895} {"train_loss": -28.205474853515625, "global_step": 572340, "epoch": 6895} {"train_loss": -27.94764518737793, "global_step": 572341, "epoch": 6895} {"train_loss": -27.723119735717773, "global_step": 572342, "epoch": 6895} {"train_loss": -28.26865005493164, "global_step": 572343, "epoch": 6895} {"train_loss": -27.827850341796875, "global_step": 572344, "epoch": 6895} {"train_loss": -27.909305572509766, "global_step": 572345, "epoch": 6895} {"train_loss": -27.90327262878418, "global_step": 572346, "epoch": 6895} {"train_loss": -27.415496826171875, "global_step": 572347, "epoch": 6895} {"train_loss": -27.562658309936523, "global_step": 572348, "epoch": 6895} {"train_loss": -27.17009925842285, "global_step": 572349, "epoch": 6895} {"train_loss": -26.36252212524414, "global_step": 572350, "epoch": 6895} {"train_loss": -26.643646240234375, "global_step": 572351, "epoch": 6895} {"train_loss": -27.88237953186035, "global_step": 572352, "epoch": 6895} {"train_loss": -26.49237060546875, "global_step": 572353, "epoch": 6895} {"train_loss": -27.285383224487305, "global_step": 572354, "epoch": 6895} {"train_loss": -26.607593536376953, "global_step": 572355, "epoch": 6895} {"train_loss": -27.122024536132812, "global_step": 572356, "epoch": 6895} {"train_loss": -26.38873863220215, "global_step": 572357, "epoch": 6895} {"train_loss": -27.125274658203125, "global_step": 572358, "epoch": 6895} {"train_loss": -26.27618980407715, "global_step": 572359, "epoch": 6895} {"train_loss": -27.517499923706055, "global_step": 572360, "epoch": 6895} {"train_loss": -27.160261154174805, "global_step": 572361, "epoch": 6895} {"train_loss": -26.7595157623291, "global_step": 572362, "epoch": 6895} {"train_loss": -27.199787139892578, "global_step": 572363, "epoch": 6895} {"train_loss": -27.76799964904785, "global_step": 572364, "epoch": 6895} {"train_loss": -27.00714111328125, "global_step": 572365, "epoch": 6895} {"train_loss": -27.229772567749023, "global_step": 572366, "epoch": 6895} {"train_loss": -27.59981031302946, "global_step": 572367, "epoch": 6895, "val_loss": 6368155.0} {"train_loss": -26.615636825561523, "global_step": 572368, "epoch": 6896} {"train_loss": -26.37017250061035, "global_step": 572369, "epoch": 6896} {"train_loss": -25.959293365478516, "global_step": 572370, "epoch": 6896} {"train_loss": -26.474166870117188, "global_step": 572371, "epoch": 6896} {"train_loss": -26.932296752929688, "global_step": 572372, "epoch": 6896} {"train_loss": -27.06751823425293, "global_step": 572373, "epoch": 6896} {"train_loss": -26.418493270874023, "global_step": 572374, "epoch": 6896} {"train_loss": -26.133136749267578, "global_step": 572375, "epoch": 6896} {"train_loss": -27.088626861572266, "global_step": 572376, "epoch": 6896} {"train_loss": -27.286792755126953, "global_step": 572377, "epoch": 6896} {"train_loss": -27.174991607666016, "global_step": 572378, "epoch": 6896} {"train_loss": -27.38191795349121, "global_step": 572379, "epoch": 6896} {"train_loss": -27.45563316345215, "global_step": 572380, "epoch": 6896} {"train_loss": -27.156585693359375, "global_step": 572381, "epoch": 6896} {"train_loss": -27.367694854736328, "global_step": 572382, "epoch": 6896} {"train_loss": -27.087255477905273, "global_step": 572383, "epoch": 6896} {"train_loss": -27.28546714782715, "global_step": 572384, "epoch": 6896} {"train_loss": -27.48832130432129, "global_step": 572385, "epoch": 6896} {"train_loss": -27.356143951416016, "global_step": 572386, "epoch": 6896} {"train_loss": -27.442922592163086, "global_step": 572387, "epoch": 6896} {"train_loss": -27.456867218017578, "global_step": 572388, "epoch": 6896} {"train_loss": -27.3991641998291, "global_step": 572389, "epoch": 6896} {"train_loss": -27.188013076782227, "global_step": 572390, "epoch": 6896} {"train_loss": -27.739974975585938, "global_step": 572391, "epoch": 6896} {"train_loss": -27.354352951049805, "global_step": 572392, "epoch": 6896} {"train_loss": -27.559432983398438, "global_step": 572393, "epoch": 6896} {"train_loss": -27.54343032836914, "global_step": 572394, "epoch": 6896} {"train_loss": -27.73834228515625, "global_step": 572395, "epoch": 6896} {"train_loss": -27.93475341796875, "global_step": 572396, "epoch": 6896} {"train_loss": -27.929243087768555, "global_step": 572397, "epoch": 6896} {"train_loss": -27.720197677612305, "global_step": 572398, "epoch": 6896} {"train_loss": -27.334304809570312, "global_step": 572399, "epoch": 6896} {"train_loss": -27.983184814453125, "global_step": 572400, "epoch": 6896} {"train_loss": -27.5855655670166, "global_step": 572401, "epoch": 6896} {"train_loss": -27.654220581054688, "global_step": 572402, "epoch": 6896} {"train_loss": -27.96262550354004, "global_step": 572403, "epoch": 6896} {"train_loss": -27.755563735961914, "global_step": 572404, "epoch": 6896} {"train_loss": -27.836933135986328, "global_step": 572405, "epoch": 6896} {"train_loss": -27.708410263061523, "global_step": 572406, "epoch": 6896} {"train_loss": -27.884119033813477, "global_step": 572407, "epoch": 6896} {"train_loss": -27.972944259643555, "global_step": 572408, "epoch": 6896} {"train_loss": -27.782596588134766, "global_step": 572409, "epoch": 6896} {"train_loss": -27.868698120117188, "global_step": 572410, "epoch": 6896} {"train_loss": -27.891027450561523, "global_step": 572411, "epoch": 6896} {"train_loss": -28.061553955078125, "global_step": 572412, "epoch": 6896} {"train_loss": -27.87021827697754, "global_step": 572413, "epoch": 6896} {"train_loss": -28.082082748413086, "global_step": 572414, "epoch": 6896} {"train_loss": -27.661014556884766, "global_step": 572415, "epoch": 6896} {"train_loss": -28.1832332611084, "global_step": 572416, "epoch": 6896} {"train_loss": -28.111806869506836, "global_step": 572417, "epoch": 6896} {"train_loss": -27.857410430908203, "global_step": 572418, "epoch": 6896} {"train_loss": -27.82570457458496, "global_step": 572419, "epoch": 6896} {"train_loss": -28.1347599029541, "global_step": 572420, "epoch": 6896} {"train_loss": -28.017004013061523, "global_step": 572421, "epoch": 6896} {"train_loss": -27.662511825561523, "global_step": 572422, "epoch": 6896} {"train_loss": -28.038619995117188, "global_step": 572423, "epoch": 6896} {"train_loss": -27.77475357055664, "global_step": 572424, "epoch": 6896} {"train_loss": -27.832019805908203, "global_step": 572425, "epoch": 6896} {"train_loss": -27.924856185913086, "global_step": 572426, "epoch": 6896} {"train_loss": -27.72433853149414, "global_step": 572427, "epoch": 6896} {"train_loss": -27.683069229125977, "global_step": 572428, "epoch": 6896} {"train_loss": -28.274444580078125, "global_step": 572429, "epoch": 6896} {"train_loss": -27.576969146728516, "global_step": 572430, "epoch": 6896} {"train_loss": -27.947650909423828, "global_step": 572431, "epoch": 6896} {"train_loss": -27.7866153717041, "global_step": 572432, "epoch": 6896} {"train_loss": -28.182220458984375, "global_step": 572433, "epoch": 6896} {"train_loss": -27.509872436523438, "global_step": 572434, "epoch": 6896} {"train_loss": -27.629236221313477, "global_step": 572435, "epoch": 6896} {"train_loss": -27.77202796936035, "global_step": 572436, "epoch": 6896} {"train_loss": -27.655237197875977, "global_step": 572437, "epoch": 6896} {"train_loss": -27.625959396362305, "global_step": 572438, "epoch": 6896} {"train_loss": -27.969547271728516, "global_step": 572439, "epoch": 6896} {"train_loss": -27.5502986907959, "global_step": 572440, "epoch": 6896} {"train_loss": -27.90972328186035, "global_step": 572441, "epoch": 6896} {"train_loss": -27.839324951171875, "global_step": 572442, "epoch": 6896} {"train_loss": -27.573904037475586, "global_step": 572443, "epoch": 6896} {"train_loss": -28.009998321533203, "global_step": 572444, "epoch": 6896} {"train_loss": -27.792261123657227, "global_step": 572445, "epoch": 6896} {"train_loss": -27.78968620300293, "global_step": 572446, "epoch": 6896} {"train_loss": -28.027374267578125, "global_step": 572447, "epoch": 6896} {"train_loss": -28.026845932006836, "global_step": 572448, "epoch": 6896} {"train_loss": -27.96759605407715, "global_step": 572449, "epoch": 6896} {"train_loss": -27.608913099909405, "global_step": 572450, "epoch": 6896, "val_loss": 6458115.5} {"train_loss": -27.641355514526367, "global_step": 572451, "epoch": 6897} {"train_loss": -27.453283309936523, "global_step": 572452, "epoch": 6897} {"train_loss": -27.03900718688965, "global_step": 572453, "epoch": 6897} {"train_loss": -27.725915908813477, "global_step": 572454, "epoch": 6897} {"train_loss": -26.964902877807617, "global_step": 572455, "epoch": 6897} {"train_loss": -27.34528923034668, "global_step": 572456, "epoch": 6897} {"train_loss": -27.124155044555664, "global_step": 572457, "epoch": 6897} {"train_loss": -27.5983829498291, "global_step": 572458, "epoch": 6897} {"train_loss": -27.537841796875, "global_step": 572459, "epoch": 6897} {"train_loss": -27.457687377929688, "global_step": 572460, "epoch": 6897} {"train_loss": -27.739179611206055, "global_step": 572461, "epoch": 6897} {"train_loss": -27.514745712280273, "global_step": 572462, "epoch": 6897} {"train_loss": -27.464147567749023, "global_step": 572463, "epoch": 6897} {"train_loss": -27.940702438354492, "global_step": 572464, "epoch": 6897} {"train_loss": -27.629901885986328, "global_step": 572465, "epoch": 6897} {"train_loss": -27.724889755249023, "global_step": 572466, "epoch": 6897} {"train_loss": -28.144535064697266, "global_step": 572467, "epoch": 6897} {"train_loss": -28.090087890625, "global_step": 572468, "epoch": 6897} {"train_loss": -27.48182487487793, "global_step": 572469, "epoch": 6897} {"train_loss": -27.684677124023438, "global_step": 572470, "epoch": 6897} {"train_loss": -27.70499038696289, "global_step": 572471, "epoch": 6897} {"train_loss": -27.695676803588867, "global_step": 572472, "epoch": 6897} {"train_loss": -28.5308895111084, "global_step": 572473, "epoch": 6897} {"train_loss": -27.572641372680664, "global_step": 572474, "epoch": 6897} {"train_loss": -27.593353271484375, "global_step": 572475, "epoch": 6897} {"train_loss": -27.90357780456543, "global_step": 572476, "epoch": 6897} {"train_loss": -27.6151180267334, "global_step": 572477, "epoch": 6897} {"train_loss": -28.11903190612793, "global_step": 572478, "epoch": 6897} {"train_loss": -27.31495475769043, "global_step": 572479, "epoch": 6897} {"train_loss": -27.894855499267578, "global_step": 572480, "epoch": 6897} {"train_loss": -27.529006958007812, "global_step": 572481, "epoch": 6897} {"train_loss": -27.811847686767578, "global_step": 572482, "epoch": 6897} {"train_loss": -27.768720626831055, "global_step": 572483, "epoch": 6897} {"train_loss": -28.07013511657715, "global_step": 572484, "epoch": 6897} {"train_loss": -27.964767456054688, "global_step": 572485, "epoch": 6897} {"train_loss": -28.04336929321289, "global_step": 572486, "epoch": 6897} {"train_loss": -27.776859283447266, "global_step": 572487, "epoch": 6897} {"train_loss": -27.7452392578125, "global_step": 572488, "epoch": 6897} {"train_loss": -27.8060302734375, "global_step": 572489, "epoch": 6897} {"train_loss": -27.728748321533203, "global_step": 572490, "epoch": 6897} {"train_loss": -27.78797721862793, "global_step": 572491, "epoch": 6897} {"train_loss": -28.011005401611328, "global_step": 572492, "epoch": 6897} {"train_loss": -28.163959503173828, "global_step": 572493, "epoch": 6897} {"train_loss": -28.10816764831543, "global_step": 572494, "epoch": 6897} {"train_loss": -27.883527755737305, "global_step": 572495, "epoch": 6897} {"train_loss": -27.410146713256836, "global_step": 572496, "epoch": 6897} {"train_loss": -27.899662017822266, "global_step": 572497, "epoch": 6897} {"train_loss": -28.113235473632812, "global_step": 572498, "epoch": 6897} {"train_loss": -27.96619987487793, "global_step": 572499, "epoch": 6897} {"train_loss": -27.772968292236328, "global_step": 572500, "epoch": 6897} {"train_loss": -27.53525733947754, "global_step": 572501, "epoch": 6897} {"train_loss": -27.869403839111328, "global_step": 572502, "epoch": 6897} {"train_loss": -27.705596923828125, "global_step": 572503, "epoch": 6897} {"train_loss": -28.157611846923828, "global_step": 572504, "epoch": 6897} {"train_loss": -27.541101455688477, "global_step": 572505, "epoch": 6897} {"train_loss": -27.909399032592773, "global_step": 572506, "epoch": 6897} {"train_loss": -27.9874210357666, "global_step": 572507, "epoch": 6897} {"train_loss": -27.70368766784668, "global_step": 572508, "epoch": 6897} {"train_loss": -27.852161407470703, "global_step": 572509, "epoch": 6897} {"train_loss": -27.515661239624023, "global_step": 572510, "epoch": 6897} {"train_loss": -27.951629638671875, "global_step": 572511, "epoch": 6897} {"train_loss": -27.861042022705078, "global_step": 572512, "epoch": 6897} {"train_loss": -27.685224533081055, "global_step": 572513, "epoch": 6897} {"train_loss": -27.732715606689453, "global_step": 572514, "epoch": 6897} {"train_loss": -27.65060806274414, "global_step": 572515, "epoch": 6897} {"train_loss": -27.754858016967773, "global_step": 572516, "epoch": 6897} {"train_loss": -27.90382194519043, "global_step": 572517, "epoch": 6897} {"train_loss": -28.086225509643555, "global_step": 572518, "epoch": 6897} {"train_loss": -27.300077438354492, "global_step": 572519, "epoch": 6897} {"train_loss": -27.512969970703125, "global_step": 572520, "epoch": 6897} {"train_loss": -27.6240291595459, "global_step": 572521, "epoch": 6897} {"train_loss": -26.951221466064453, "global_step": 572522, "epoch": 6897} {"train_loss": -27.075788497924805, "global_step": 572523, "epoch": 6897} {"train_loss": -27.809797286987305, "global_step": 572524, "epoch": 6897} {"train_loss": -27.305084228515625, "global_step": 572525, "epoch": 6897} {"train_loss": -27.436994552612305, "global_step": 572526, "epoch": 6897} {"train_loss": -27.56768226623535, "global_step": 572527, "epoch": 6897} {"train_loss": -27.515146255493164, "global_step": 572528, "epoch": 6897} {"train_loss": -27.6834774017334, "global_step": 572529, "epoch": 6897} {"train_loss": -27.799152374267578, "global_step": 572530, "epoch": 6897} {"train_loss": -27.6510009765625, "global_step": 572531, "epoch": 6897} {"train_loss": -27.721277236938477, "global_step": 572532, "epoch": 6897} {"train_loss": -27.70888804240399, "global_step": 572533, "epoch": 6897, "val_loss": 6453003.0} {"train_loss": -26.800830841064453, "global_step": 572534, "epoch": 6898} {"train_loss": -26.73023796081543, "global_step": 572535, "epoch": 6898} {"train_loss": -27.014087677001953, "global_step": 572536, "epoch": 6898} {"train_loss": -27.090991973876953, "global_step": 572537, "epoch": 6898} {"train_loss": -27.276044845581055, "global_step": 572538, "epoch": 6898} {"train_loss": -27.17643165588379, "global_step": 572539, "epoch": 6898} {"train_loss": -27.02273941040039, "global_step": 572540, "epoch": 6898} {"train_loss": -27.348148345947266, "global_step": 572541, "epoch": 6898} {"train_loss": -27.26324462890625, "global_step": 572542, "epoch": 6898} {"train_loss": -27.44464111328125, "global_step": 572543, "epoch": 6898} {"train_loss": -27.519189834594727, "global_step": 572544, "epoch": 6898} {"train_loss": -27.423192977905273, "global_step": 572545, "epoch": 6898} {"train_loss": -27.400409698486328, "global_step": 572546, "epoch": 6898} {"train_loss": -27.699262619018555, "global_step": 572547, "epoch": 6898} {"train_loss": -27.221277236938477, "global_step": 572548, "epoch": 6898} {"train_loss": -27.446752548217773, "global_step": 572549, "epoch": 6898} {"train_loss": -27.33921241760254, "global_step": 572550, "epoch": 6898} {"train_loss": -27.478851318359375, "global_step": 572551, "epoch": 6898} {"train_loss": -27.56597900390625, "global_step": 572552, "epoch": 6898} {"train_loss": -27.73874855041504, "global_step": 572553, "epoch": 6898} {"train_loss": -27.5792293548584, "global_step": 572554, "epoch": 6898} {"train_loss": -27.694128036499023, "global_step": 572555, "epoch": 6898} {"train_loss": -27.6983585357666, "global_step": 572556, "epoch": 6898} {"train_loss": -27.472858428955078, "global_step": 572557, "epoch": 6898} {"train_loss": -27.949237823486328, "global_step": 572558, "epoch": 6898} {"train_loss": -27.791162490844727, "global_step": 572559, "epoch": 6898} {"train_loss": -27.544076919555664, "global_step": 572560, "epoch": 6898} {"train_loss": -27.663623809814453, "global_step": 572561, "epoch": 6898} {"train_loss": -27.830642700195312, "global_step": 572562, "epoch": 6898} {"train_loss": -27.817188262939453, "global_step": 572563, "epoch": 6898} {"train_loss": -27.7226505279541, "global_step": 572564, "epoch": 6898} {"train_loss": -28.026655197143555, "global_step": 572565, "epoch": 6898} {"train_loss": -28.270322799682617, "global_step": 572566, "epoch": 6898} {"train_loss": -28.190717697143555, "global_step": 572567, "epoch": 6898} {"train_loss": -28.095001220703125, "global_step": 572568, "epoch": 6898} {"train_loss": -27.822397232055664, "global_step": 572569, "epoch": 6898} {"train_loss": -27.7493839263916, "global_step": 572570, "epoch": 6898} {"train_loss": -27.689680099487305, "global_step": 572571, "epoch": 6898} {"train_loss": -28.14344596862793, "global_step": 572572, "epoch": 6898} {"train_loss": -27.98026466369629, "global_step": 572573, "epoch": 6898} {"train_loss": -27.82710075378418, "global_step": 572574, "epoch": 6898} {"train_loss": -27.949472427368164, "global_step": 572575, "epoch": 6898} {"train_loss": -28.112258911132812, "global_step": 572576, "epoch": 6898} {"train_loss": -27.721155166625977, "global_step": 572577, "epoch": 6898} {"train_loss": -28.107135772705078, "global_step": 572578, "epoch": 6898} {"train_loss": -27.91658592224121, "global_step": 572579, "epoch": 6898} {"train_loss": -27.7579402923584, "global_step": 572580, "epoch": 6898} {"train_loss": -28.35084342956543, "global_step": 572581, "epoch": 6898} {"train_loss": -27.852294921875, "global_step": 572582, "epoch": 6898} {"train_loss": -28.363927841186523, "global_step": 572583, "epoch": 6898} {"train_loss": -27.618179321289062, "global_step": 572584, "epoch": 6898} {"train_loss": -27.682193756103516, "global_step": 572585, "epoch": 6898} {"train_loss": -27.85796546936035, "global_step": 572586, "epoch": 6898} {"train_loss": -27.64161491394043, "global_step": 572587, "epoch": 6898} {"train_loss": -27.908735275268555, "global_step": 572588, "epoch": 6898} {"train_loss": -27.879175186157227, "global_step": 572589, "epoch": 6898} {"train_loss": -27.779760360717773, "global_step": 572590, "epoch": 6898} {"train_loss": -27.667037963867188, "global_step": 572591, "epoch": 6898} {"train_loss": -27.971769332885742, "global_step": 572592, "epoch": 6898} {"train_loss": -27.978071212768555, "global_step": 572593, "epoch": 6898} {"train_loss": -28.305179595947266, "global_step": 572594, "epoch": 6898} {"train_loss": -27.939334869384766, "global_step": 572595, "epoch": 6898} {"train_loss": -27.700220108032227, "global_step": 572596, "epoch": 6898} {"train_loss": -27.88663101196289, "global_step": 572597, "epoch": 6898} {"train_loss": -27.55936050415039, "global_step": 572598, "epoch": 6898} {"train_loss": -27.933731079101562, "global_step": 572599, "epoch": 6898} {"train_loss": -28.10627555847168, "global_step": 572600, "epoch": 6898} {"train_loss": -28.160369873046875, "global_step": 572601, "epoch": 6898} {"train_loss": -28.136219024658203, "global_step": 572602, "epoch": 6898} {"train_loss": -27.831811904907227, "global_step": 572603, "epoch": 6898} {"train_loss": -28.041568756103516, "global_step": 572604, "epoch": 6898} {"train_loss": -27.836318969726562, "global_step": 572605, "epoch": 6898} {"train_loss": -27.883808135986328, "global_step": 572606, "epoch": 6898} {"train_loss": -27.98543357849121, "global_step": 572607, "epoch": 6898} {"train_loss": -27.772689819335938, "global_step": 572608, "epoch": 6898} {"train_loss": -27.223112106323242, "global_step": 572609, "epoch": 6898} {"train_loss": -27.400678634643555, "global_step": 572610, "epoch": 6898} {"train_loss": -27.43097496032715, "global_step": 572611, "epoch": 6898} {"train_loss": -27.89432144165039, "global_step": 572612, "epoch": 6898} {"train_loss": -27.675016403198242, "global_step": 572613, "epoch": 6898} {"train_loss": -27.817167282104492, "global_step": 572614, "epoch": 6898} {"train_loss": -28.26749038696289, "global_step": 572615, "epoch": 6898} {"train_loss": -27.731574368764118, "global_step": 572616, "epoch": 6898, "val_loss": 6461886.0} {"train_loss": -27.844614028930664, "global_step": 572617, "epoch": 6899} {"train_loss": -27.21946144104004, "global_step": 572618, "epoch": 6899} {"train_loss": -27.26064109802246, "global_step": 572619, "epoch": 6899} {"train_loss": -27.428274154663086, "global_step": 572620, "epoch": 6899} {"train_loss": -27.39448356628418, "global_step": 572621, "epoch": 6899} {"train_loss": -27.594669342041016, "global_step": 572622, "epoch": 6899} {"train_loss": -27.312774658203125, "global_step": 572623, "epoch": 6899} {"train_loss": -27.056406021118164, "global_step": 572624, "epoch": 6899} {"train_loss": -27.366113662719727, "global_step": 572625, "epoch": 6899} {"train_loss": -27.656158447265625, "global_step": 572626, "epoch": 6899} {"train_loss": -27.686681747436523, "global_step": 572627, "epoch": 6899} {"train_loss": -27.696786880493164, "global_step": 572628, "epoch": 6899} {"train_loss": -27.5190372467041, "global_step": 572629, "epoch": 6899} {"train_loss": -27.430444717407227, "global_step": 572630, "epoch": 6899} {"train_loss": -27.613052368164062, "global_step": 572631, "epoch": 6899} {"train_loss": -27.872512817382812, "global_step": 572632, "epoch": 6899} {"train_loss": -27.790372848510742, "global_step": 572633, "epoch": 6899} {"train_loss": -27.672712326049805, "global_step": 572634, "epoch": 6899} {"train_loss": -27.770587921142578, "global_step": 572635, "epoch": 6899} {"train_loss": -27.875762939453125, "global_step": 572636, "epoch": 6899} {"train_loss": -27.92868423461914, "global_step": 572637, "epoch": 6899} {"train_loss": -27.533239364624023, "global_step": 572638, "epoch": 6899} {"train_loss": -27.73526954650879, "global_step": 572639, "epoch": 6899} {"train_loss": -27.8438777923584, "global_step": 572640, "epoch": 6899} {"train_loss": -27.9683895111084, "global_step": 572641, "epoch": 6899} {"train_loss": -27.613996505737305, "global_step": 572642, "epoch": 6899} {"train_loss": -27.4212703704834, "global_step": 572643, "epoch": 6899} {"train_loss": -27.901365280151367, "global_step": 572644, "epoch": 6899} {"train_loss": -27.83514976501465, "global_step": 572645, "epoch": 6899} {"train_loss": -27.54294776916504, "global_step": 572646, "epoch": 6899} {"train_loss": -27.865503311157227, "global_step": 572647, "epoch": 6899} {"train_loss": -27.853351593017578, "global_step": 572648, "epoch": 6899} {"train_loss": -28.223119735717773, "global_step": 572649, "epoch": 6899} {"train_loss": -27.874975204467773, "global_step": 572650, "epoch": 6899} {"train_loss": -27.924030303955078, "global_step": 572651, "epoch": 6899} {"train_loss": -28.06867027282715, "global_step": 572652, "epoch": 6899} {"train_loss": -27.71278953552246, "global_step": 572653, "epoch": 6899} {"train_loss": -28.003692626953125, "global_step": 572654, "epoch": 6899} {"train_loss": -28.002838134765625, "global_step": 572655, "epoch": 6899} {"train_loss": -28.161298751831055, "global_step": 572656, "epoch": 6899} {"train_loss": -28.22527503967285, "global_step": 572657, "epoch": 6899} {"train_loss": -27.93354606628418, "global_step": 572658, "epoch": 6899} {"train_loss": -28.18204116821289, "global_step": 572659, "epoch": 6899} {"train_loss": -28.142911911010742, "global_step": 572660, "epoch": 6899} {"train_loss": -28.138172149658203, "global_step": 572661, "epoch": 6899} {"train_loss": -28.13614273071289, "global_step": 572662, "epoch": 6899} {"train_loss": -27.949100494384766, "global_step": 572663, "epoch": 6899} {"train_loss": -28.179889678955078, "global_step": 572664, "epoch": 6899} {"train_loss": -28.017364501953125, "global_step": 572665, "epoch": 6899} {"train_loss": -28.337207794189453, "global_step": 572666, "epoch": 6899} {"train_loss": -28.051528930664062, "global_step": 572667, "epoch": 6899} {"train_loss": -28.526779174804688, "global_step": 572668, "epoch": 6899} {"train_loss": -28.155454635620117, "global_step": 572669, "epoch": 6899} {"train_loss": -28.07354736328125, "global_step": 572670, "epoch": 6899} {"train_loss": -27.957685470581055, "global_step": 572671, "epoch": 6899} {"train_loss": -28.230133056640625, "global_step": 572672, "epoch": 6899} {"train_loss": -28.087976455688477, "global_step": 572673, "epoch": 6899} {"train_loss": -27.87632179260254, "global_step": 572674, "epoch": 6899} {"train_loss": -28.111371994018555, "global_step": 572675, "epoch": 6899} {"train_loss": -28.11262321472168, "global_step": 572676, "epoch": 6899} {"train_loss": -28.01654052734375, "global_step": 572677, "epoch": 6899} {"train_loss": -28.109439849853516, "global_step": 572678, "epoch": 6899} {"train_loss": -27.425893783569336, "global_step": 572679, "epoch": 6899} {"train_loss": -27.594776153564453, "global_step": 572680, "epoch": 6899} {"train_loss": -27.649099349975586, "global_step": 572681, "epoch": 6899} {"train_loss": -27.9948787689209, "global_step": 572682, "epoch": 6899} {"train_loss": -28.0054931640625, "global_step": 572683, "epoch": 6899} {"train_loss": -28.05366325378418, "global_step": 572684, "epoch": 6899} {"train_loss": -27.733734130859375, "global_step": 572685, "epoch": 6899} {"train_loss": -27.80328369140625, "global_step": 572686, "epoch": 6899} {"train_loss": -27.387678146362305, "global_step": 572687, "epoch": 6899} {"train_loss": -27.62558364868164, "global_step": 572688, "epoch": 6899} {"train_loss": -27.99871253967285, "global_step": 572689, "epoch": 6899} {"train_loss": -27.52423667907715, "global_step": 572690, "epoch": 6899} {"train_loss": -27.86359977722168, "global_step": 572691, "epoch": 6899} {"train_loss": -27.6656436920166, "global_step": 572692, "epoch": 6899} {"train_loss": -27.682544708251953, "global_step": 572693, "epoch": 6899} {"train_loss": -27.820804595947266, "global_step": 572694, "epoch": 6899} {"train_loss": -27.955570220947266, "global_step": 572695, "epoch": 6899} {"train_loss": -27.365497589111328, "global_step": 572696, "epoch": 6899} {"train_loss": -27.554595947265625, "global_step": 572697, "epoch": 6899} {"train_loss": -27.94182777404785, "global_step": 572698, "epoch": 6899} {"train_loss": -27.80861454699413, "global_step": 572699, "epoch": 6899, "val_loss": 6482103.0} {"train_loss": -26.998126983642578, "global_step": 572700, "epoch": 6900} {"train_loss": -26.3641357421875, "global_step": 572701, "epoch": 6900} {"train_loss": -27.27976417541504, "global_step": 572702, "epoch": 6900} {"train_loss": -26.142623901367188, "global_step": 572703, "epoch": 6900} {"train_loss": -26.106464385986328, "global_step": 572704, "epoch": 6900} {"train_loss": -26.425424575805664, "global_step": 572705, "epoch": 6900} {"train_loss": -26.306013107299805, "global_step": 572706, "epoch": 6900} {"train_loss": -26.342634201049805, "global_step": 572707, "epoch": 6900} {"train_loss": -26.923023223876953, "global_step": 572708, "epoch": 6900} {"train_loss": -26.799589157104492, "global_step": 572709, "epoch": 6900} {"train_loss": -26.81207847595215, "global_step": 572710, "epoch": 6900} {"train_loss": -27.101449966430664, "global_step": 572711, "epoch": 6900} {"train_loss": -26.89048194885254, "global_step": 572712, "epoch": 6900} {"train_loss": -27.332508087158203, "global_step": 572713, "epoch": 6900} {"train_loss": -27.2918643951416, "global_step": 572714, "epoch": 6900} {"train_loss": -26.769699096679688, "global_step": 572715, "epoch": 6900} {"train_loss": -27.423803329467773, "global_step": 572716, "epoch": 6900} {"train_loss": -27.31428337097168, "global_step": 572717, "epoch": 6900} {"train_loss": -27.027074813842773, "global_step": 572718, "epoch": 6900} {"train_loss": -27.284698486328125, "global_step": 572719, "epoch": 6900} {"train_loss": -27.419239044189453, "global_step": 572720, "epoch": 6900} {"train_loss": -27.26582145690918, "global_step": 572721, "epoch": 6900} {"train_loss": -27.675016403198242, "global_step": 572722, "epoch": 6900} {"train_loss": -27.509443283081055, "global_step": 572723, "epoch": 6900} {"train_loss": -27.44635581970215, "global_step": 572724, "epoch": 6900} {"train_loss": -27.390155792236328, "global_step": 572725, "epoch": 6900} {"train_loss": -27.27781105041504, "global_step": 572726, "epoch": 6900} {"train_loss": -27.57493019104004, "global_step": 572727, "epoch": 6900} {"train_loss": -27.78168296813965, "global_step": 572728, "epoch": 6900} {"train_loss": -27.81814956665039, "global_step": 572729, "epoch": 6900} {"train_loss": -27.705585479736328, "global_step": 572730, "epoch": 6900} {"train_loss": -27.640003204345703, "global_step": 572731, "epoch": 6900} {"train_loss": -27.78253173828125, "global_step": 572732, "epoch": 6900} {"train_loss": -27.764816284179688, "global_step": 572733, "epoch": 6900} {"train_loss": -27.830707550048828, "global_step": 572734, "epoch": 6900} {"train_loss": -27.714155197143555, "global_step": 572735, "epoch": 6900} {"train_loss": -28.16472816467285, "global_step": 572736, "epoch": 6900} {"train_loss": -27.9088077545166, "global_step": 572737, "epoch": 6900} {"train_loss": -27.534088134765625, "global_step": 572738, "epoch": 6900} {"train_loss": -27.917861938476562, "global_step": 572739, "epoch": 6900} {"train_loss": -27.618804931640625, "global_step": 572740, "epoch": 6900} {"train_loss": -28.0424747467041, "global_step": 572741, "epoch": 6900} {"train_loss": -28.103246688842773, "global_step": 572742, "epoch": 6900} {"train_loss": -27.949893951416016, "global_step": 572743, "epoch": 6900} {"train_loss": -28.03523063659668, "global_step": 572744, "epoch": 6900} {"train_loss": -28.08932876586914, "global_step": 572745, "epoch": 6900} {"train_loss": -27.627304077148438, "global_step": 572746, "epoch": 6900} {"train_loss": -28.026874542236328, "global_step": 572747, "epoch": 6900} {"train_loss": -28.247467041015625, "global_step": 572748, "epoch": 6900} {"train_loss": -28.100080490112305, "global_step": 572749, "epoch": 6900} {"train_loss": -28.144241333007812, "global_step": 572750, "epoch": 6900} {"train_loss": -27.7435302734375, "global_step": 572751, "epoch": 6900} {"train_loss": -28.025976181030273, "global_step": 572752, "epoch": 6900} {"train_loss": -28.136816024780273, "global_step": 572753, "epoch": 6900} {"train_loss": -28.12416648864746, "global_step": 572754, "epoch": 6900} {"train_loss": -27.692174911499023, "global_step": 572755, "epoch": 6900} {"train_loss": -27.937652587890625, "global_step": 572756, "epoch": 6900} {"train_loss": -27.939029693603516, "global_step": 572757, "epoch": 6900} {"train_loss": -28.045501708984375, "global_step": 572758, "epoch": 6900} {"train_loss": -28.27967643737793, "global_step": 572759, "epoch": 6900} {"train_loss": -27.73749351501465, "global_step": 572760, "epoch": 6900} {"train_loss": -28.093290328979492, "global_step": 572761, "epoch": 6900} {"train_loss": -27.7623348236084, "global_step": 572762, "epoch": 6900} {"train_loss": -27.365802764892578, "global_step": 572763, "epoch": 6900} {"train_loss": -28.050275802612305, "global_step": 572764, "epoch": 6900} {"train_loss": -28.21246337890625, "global_step": 572765, "epoch": 6900} {"train_loss": -27.8243465423584, "global_step": 572766, "epoch": 6900} {"train_loss": -27.717517852783203, "global_step": 572767, "epoch": 6900} {"train_loss": -28.304126739501953, "global_step": 572768, "epoch": 6900} {"train_loss": -28.103235244750977, "global_step": 572769, "epoch": 6900} {"train_loss": -27.605060577392578, "global_step": 572770, "epoch": 6900} {"train_loss": -27.815832138061523, "global_step": 572771, "epoch": 6900} {"train_loss": -27.828481674194336, "global_step": 572772, "epoch": 6900} {"train_loss": -27.716053009033203, "global_step": 572773, "epoch": 6900} {"train_loss": -27.887939453125, "global_step": 572774, "epoch": 6900} {"train_loss": -27.64571189880371, "global_step": 572775, "epoch": 6900} {"train_loss": -27.773595809936523, "global_step": 572776, "epoch": 6900} {"train_loss": -27.72598648071289, "global_step": 572777, "epoch": 6900} {"train_loss": -27.996612548828125, "global_step": 572778, "epoch": 6900} {"train_loss": -28.345502853393555, "global_step": 572779, "epoch": 6900} {"train_loss": -28.034439086914062, "global_step": 572780, "epoch": 6900} {"train_loss": -27.808124542236328, "global_step": 572781, "epoch": 6900} {"train_loss": -27.58219038722027, "global_step": 572782, "epoch": 6900, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8181818181818182, "val_loss": 6420186.0} {"train_loss": -27.49146842956543, "global_step": 572783, "epoch": 6901} {"train_loss": -27.513427734375, "global_step": 572784, "epoch": 6901} {"train_loss": -27.31003189086914, "global_step": 572785, "epoch": 6901} {"train_loss": -27.477930068969727, "global_step": 572786, "epoch": 6901} {"train_loss": -27.554880142211914, "global_step": 572787, "epoch": 6901} {"train_loss": -26.82944107055664, "global_step": 572788, "epoch": 6901} {"train_loss": -26.68351173400879, "global_step": 572789, "epoch": 6901} {"train_loss": -27.178014755249023, "global_step": 572790, "epoch": 6901} {"train_loss": -27.530149459838867, "global_step": 572791, "epoch": 6901} {"train_loss": -27.740842819213867, "global_step": 572792, "epoch": 6901} {"train_loss": -26.82781410217285, "global_step": 572793, "epoch": 6901} {"train_loss": -27.034015655517578, "global_step": 572794, "epoch": 6901} {"train_loss": -27.266714096069336, "global_step": 572795, "epoch": 6901} {"train_loss": -27.234228134155273, "global_step": 572796, "epoch": 6901} {"train_loss": -27.83465576171875, "global_step": 572797, "epoch": 6901} {"train_loss": -27.142969131469727, "global_step": 572798, "epoch": 6901} {"train_loss": -27.043119430541992, "global_step": 572799, "epoch": 6901} {"train_loss": -27.516128540039062, "global_step": 572800, "epoch": 6901} {"train_loss": -27.354211807250977, "global_step": 572801, "epoch": 6901} {"train_loss": -27.754779815673828, "global_step": 572802, "epoch": 6901} {"train_loss": -27.560388565063477, "global_step": 572803, "epoch": 6901} {"train_loss": -27.589981079101562, "global_step": 572804, "epoch": 6901} {"train_loss": -27.623016357421875, "global_step": 572805, "epoch": 6901} {"train_loss": -27.975860595703125, "global_step": 572806, "epoch": 6901} {"train_loss": -27.230224609375, "global_step": 572807, "epoch": 6901} {"train_loss": -27.714893341064453, "global_step": 572808, "epoch": 6901} {"train_loss": -27.389158248901367, "global_step": 572809, "epoch": 6901} {"train_loss": -27.96217155456543, "global_step": 572810, "epoch": 6901} {"train_loss": -27.409381866455078, "global_step": 572811, "epoch": 6901} {"train_loss": -27.890737533569336, "global_step": 572812, "epoch": 6901} {"train_loss": -27.918241500854492, "global_step": 572813, "epoch": 6901} {"train_loss": -28.16977310180664, "global_step": 572814, "epoch": 6901} {"train_loss": -27.396411895751953, "global_step": 572815, "epoch": 6901} {"train_loss": -27.69473648071289, "global_step": 572816, "epoch": 6901} {"train_loss": -27.507299423217773, "global_step": 572817, "epoch": 6901} {"train_loss": -27.454389572143555, "global_step": 572818, "epoch": 6901} {"train_loss": -27.357995986938477, "global_step": 572819, "epoch": 6901} {"train_loss": -27.808303833007812, "global_step": 572820, "epoch": 6901} {"train_loss": -27.85774040222168, "global_step": 572821, "epoch": 6901} {"train_loss": -27.92881202697754, "global_step": 572822, "epoch": 6901} {"train_loss": -27.92178726196289, "global_step": 572823, "epoch": 6901} {"train_loss": -27.7965030670166, "global_step": 572824, "epoch": 6901} {"train_loss": -28.25239372253418, "global_step": 572825, "epoch": 6901} {"train_loss": -27.793609619140625, "global_step": 572826, "epoch": 6901} {"train_loss": -27.74013328552246, "global_step": 572827, "epoch": 6901} {"train_loss": -28.134424209594727, "global_step": 572828, "epoch": 6901} {"train_loss": -27.665571212768555, "global_step": 572829, "epoch": 6901} {"train_loss": -27.98211669921875, "global_step": 572830, "epoch": 6901} {"train_loss": -27.507923126220703, "global_step": 572831, "epoch": 6901} {"train_loss": -27.388477325439453, "global_step": 572832, "epoch": 6901} {"train_loss": -27.217493057250977, "global_step": 572833, "epoch": 6901} {"train_loss": -27.910736083984375, "global_step": 572834, "epoch": 6901} {"train_loss": -26.987049102783203, "global_step": 572835, "epoch": 6901} {"train_loss": -26.514423370361328, "global_step": 572836, "epoch": 6901} {"train_loss": -27.750198364257812, "global_step": 572837, "epoch": 6901} {"train_loss": -27.794729232788086, "global_step": 572838, "epoch": 6901} {"train_loss": -27.231983184814453, "global_step": 572839, "epoch": 6901} {"train_loss": -27.45911979675293, "global_step": 572840, "epoch": 6901} {"train_loss": -27.475006103515625, "global_step": 572841, "epoch": 6901} {"train_loss": -27.485380172729492, "global_step": 572842, "epoch": 6901} {"train_loss": -27.492034912109375, "global_step": 572843, "epoch": 6901} {"train_loss": -27.62775230407715, "global_step": 572844, "epoch": 6901} {"train_loss": -28.055715560913086, "global_step": 572845, "epoch": 6901} {"train_loss": -27.635610580444336, "global_step": 572846, "epoch": 6901} {"train_loss": -28.013778686523438, "global_step": 572847, "epoch": 6901} {"train_loss": -27.48444175720215, "global_step": 572848, "epoch": 6901} {"train_loss": -27.633092880249023, "global_step": 572849, "epoch": 6901} {"train_loss": -27.714208602905273, "global_step": 572850, "epoch": 6901} {"train_loss": -28.253759384155273, "global_step": 572851, "epoch": 6901} {"train_loss": -27.95572280883789, "global_step": 572852, "epoch": 6901} {"train_loss": -27.884307861328125, "global_step": 572853, "epoch": 6901} {"train_loss": -27.870574951171875, "global_step": 572854, "epoch": 6901} {"train_loss": -27.796112060546875, "global_step": 572855, "epoch": 6901} {"train_loss": -27.80472183227539, "global_step": 572856, "epoch": 6901} {"train_loss": -27.65215492248535, "global_step": 572857, "epoch": 6901} {"train_loss": -27.964252471923828, "global_step": 572858, "epoch": 6901} {"train_loss": -28.081439971923828, "global_step": 572859, "epoch": 6901} {"train_loss": -27.837568283081055, "global_step": 572860, "epoch": 6901} {"train_loss": -27.375675201416016, "global_step": 572861, "epoch": 6901} {"train_loss": -27.746326446533203, "global_step": 572862, "epoch": 6901} {"train_loss": -27.649274826049805, "global_step": 572863, "epoch": 6901} {"train_loss": -27.721750259399414, "global_step": 572864, "epoch": 6901} {"train_loss": -27.59978446041245, "global_step": 572865, "epoch": 6901, "val_loss": 6482879.0} {"train_loss": -26.73114585876465, "global_step": 572866, "epoch": 6902} {"train_loss": -27.10708999633789, "global_step": 572867, "epoch": 6902} {"train_loss": -27.188642501831055, "global_step": 572868, "epoch": 6902} {"train_loss": -27.174238204956055, "global_step": 572869, "epoch": 6902} {"train_loss": -27.05927848815918, "global_step": 572870, "epoch": 6902} {"train_loss": -26.944128036499023, "global_step": 572871, "epoch": 6902} {"train_loss": -26.897388458251953, "global_step": 572872, "epoch": 6902} {"train_loss": -27.295703887939453, "global_step": 572873, "epoch": 6902} {"train_loss": -27.1533260345459, "global_step": 572874, "epoch": 6902} {"train_loss": -27.49469566345215, "global_step": 572875, "epoch": 6902} {"train_loss": -27.068002700805664, "global_step": 572876, "epoch": 6902} {"train_loss": -27.62993812561035, "global_step": 572877, "epoch": 6902} {"train_loss": -27.440771102905273, "global_step": 572878, "epoch": 6902} {"train_loss": -27.14008903503418, "global_step": 572879, "epoch": 6902} {"train_loss": -27.56744956970215, "global_step": 572880, "epoch": 6902} {"train_loss": -27.62351417541504, "global_step": 572881, "epoch": 6902} {"train_loss": -27.646955490112305, "global_step": 572882, "epoch": 6902} {"train_loss": -27.69620704650879, "global_step": 572883, "epoch": 6902} {"train_loss": -27.51084327697754, "global_step": 572884, "epoch": 6902} {"train_loss": -27.37803077697754, "global_step": 572885, "epoch": 6902} {"train_loss": -27.965612411499023, "global_step": 572886, "epoch": 6902} {"train_loss": -27.7325439453125, "global_step": 572887, "epoch": 6902} {"train_loss": -27.78473472595215, "global_step": 572888, "epoch": 6902} {"train_loss": -27.824054718017578, "global_step": 572889, "epoch": 6902} {"train_loss": -27.695825576782227, "global_step": 572890, "epoch": 6902} {"train_loss": -27.809701919555664, "global_step": 572891, "epoch": 6902} {"train_loss": -27.413305282592773, "global_step": 572892, "epoch": 6902} {"train_loss": -27.923004150390625, "global_step": 572893, "epoch": 6902} {"train_loss": -28.01789665222168, "global_step": 572894, "epoch": 6902} {"train_loss": -27.905969619750977, "global_step": 572895, "epoch": 6902} {"train_loss": -27.874027252197266, "global_step": 572896, "epoch": 6902} {"train_loss": -27.6761474609375, "global_step": 572897, "epoch": 6902} {"train_loss": -27.6651668548584, "global_step": 572898, "epoch": 6902} {"train_loss": -27.942800521850586, "global_step": 572899, "epoch": 6902} {"train_loss": -28.009119033813477, "global_step": 572900, "epoch": 6902} {"train_loss": -28.1137638092041, "global_step": 572901, "epoch": 6902} {"train_loss": -27.87691307067871, "global_step": 572902, "epoch": 6902} {"train_loss": -28.132949829101562, "global_step": 572903, "epoch": 6902} {"train_loss": -27.841028213500977, "global_step": 572904, "epoch": 6902} {"train_loss": -28.21964454650879, "global_step": 572905, "epoch": 6902} {"train_loss": -27.792875289916992, "global_step": 572906, "epoch": 6902} {"train_loss": -27.74562644958496, "global_step": 572907, "epoch": 6902} {"train_loss": -28.155380249023438, "global_step": 572908, "epoch": 6902} {"train_loss": -27.82986831665039, "global_step": 572909, "epoch": 6902} {"train_loss": -28.3960018157959, "global_step": 572910, "epoch": 6902} {"train_loss": -28.0324764251709, "global_step": 572911, "epoch": 6902} {"train_loss": -28.07387351989746, "global_step": 572912, "epoch": 6902} {"train_loss": -27.803699493408203, "global_step": 572913, "epoch": 6902} {"train_loss": -27.882776260375977, "global_step": 572914, "epoch": 6902} {"train_loss": -27.93706703186035, "global_step": 572915, "epoch": 6902} {"train_loss": -27.889291763305664, "global_step": 572916, "epoch": 6902} {"train_loss": -27.71024513244629, "global_step": 572917, "epoch": 6902} {"train_loss": -27.358219146728516, "global_step": 572918, "epoch": 6902} {"train_loss": -27.832605361938477, "global_step": 572919, "epoch": 6902} {"train_loss": -27.739898681640625, "global_step": 572920, "epoch": 6902} {"train_loss": -27.3194637298584, "global_step": 572921, "epoch": 6902} {"train_loss": -26.950098037719727, "global_step": 572922, "epoch": 6902} {"train_loss": -27.245763778686523, "global_step": 572923, "epoch": 6902} {"train_loss": -27.795654296875, "global_step": 572924, "epoch": 6902} {"train_loss": -28.0701961517334, "global_step": 572925, "epoch": 6902} {"train_loss": -27.38394546508789, "global_step": 572926, "epoch": 6902} {"train_loss": -27.6624698638916, "global_step": 572927, "epoch": 6902} {"train_loss": -27.872848510742188, "global_step": 572928, "epoch": 6902} {"train_loss": -27.9083309173584, "global_step": 572929, "epoch": 6902} {"train_loss": -27.8415584564209, "global_step": 572930, "epoch": 6902} {"train_loss": -27.69339942932129, "global_step": 572931, "epoch": 6902} {"train_loss": -27.737348556518555, "global_step": 572932, "epoch": 6902} {"train_loss": -28.090341567993164, "global_step": 572933, "epoch": 6902} {"train_loss": -27.174854278564453, "global_step": 572934, "epoch": 6902} {"train_loss": -27.703306198120117, "global_step": 572935, "epoch": 6902} {"train_loss": -27.666906356811523, "global_step": 572936, "epoch": 6902} {"train_loss": -27.79304313659668, "global_step": 572937, "epoch": 6902} {"train_loss": -27.604642868041992, "global_step": 572938, "epoch": 6902} {"train_loss": -27.91773796081543, "global_step": 572939, "epoch": 6902} {"train_loss": -27.6868896484375, "global_step": 572940, "epoch": 6902} {"train_loss": -27.922128677368164, "global_step": 572941, "epoch": 6902} {"train_loss": -27.70196533203125, "global_step": 572942, "epoch": 6902} {"train_loss": -27.98505973815918, "global_step": 572943, "epoch": 6902} {"train_loss": -27.820484161376953, "global_step": 572944, "epoch": 6902} {"train_loss": -27.848989486694336, "global_step": 572945, "epoch": 6902} {"train_loss": -28.031509399414062, "global_step": 572946, "epoch": 6902} {"train_loss": -27.989261627197266, "global_step": 572947, "epoch": 6902} {"train_loss": -27.690496996224645, "global_step": 572948, "epoch": 6902, "val_loss": 6469358.5} {"train_loss": -27.672040939331055, "global_step": 572949, "epoch": 6903} {"train_loss": -27.704004287719727, "global_step": 572950, "epoch": 6903} {"train_loss": -27.729135513305664, "global_step": 572951, "epoch": 6903} {"train_loss": -27.423690795898438, "global_step": 572952, "epoch": 6903} {"train_loss": -27.365070343017578, "global_step": 572953, "epoch": 6903} {"train_loss": -27.569665908813477, "global_step": 572954, "epoch": 6903} {"train_loss": -27.649978637695312, "global_step": 572955, "epoch": 6903} {"train_loss": -27.823944091796875, "global_step": 572956, "epoch": 6903} {"train_loss": -27.719085693359375, "global_step": 572957, "epoch": 6903} {"train_loss": -27.358469009399414, "global_step": 572958, "epoch": 6903} {"train_loss": -27.86856460571289, "global_step": 572959, "epoch": 6903} {"train_loss": -27.602664947509766, "global_step": 572960, "epoch": 6903} {"train_loss": -27.792463302612305, "global_step": 572961, "epoch": 6903} {"train_loss": -27.57693862915039, "global_step": 572962, "epoch": 6903} {"train_loss": -28.08466148376465, "global_step": 572963, "epoch": 6903} {"train_loss": -27.662755966186523, "global_step": 572964, "epoch": 6903} {"train_loss": -27.6575870513916, "global_step": 572965, "epoch": 6903} {"train_loss": -27.830219268798828, "global_step": 572966, "epoch": 6903} {"train_loss": -27.950153350830078, "global_step": 572967, "epoch": 6903} {"train_loss": -28.071613311767578, "global_step": 572968, "epoch": 6903} {"train_loss": -27.85980796813965, "global_step": 572969, "epoch": 6903} {"train_loss": -27.756139755249023, "global_step": 572970, "epoch": 6903} {"train_loss": -27.627538681030273, "global_step": 572971, "epoch": 6903} {"train_loss": -27.88202476501465, "global_step": 572972, "epoch": 6903} {"train_loss": -27.9637508392334, "global_step": 572973, "epoch": 6903} {"train_loss": -28.270994186401367, "global_step": 572974, "epoch": 6903} {"train_loss": -27.774023056030273, "global_step": 572975, "epoch": 6903} {"train_loss": -27.987104415893555, "global_step": 572976, "epoch": 6903} {"train_loss": -27.965524673461914, "global_step": 572977, "epoch": 6903} {"train_loss": -27.378314971923828, "global_step": 572978, "epoch": 6903} {"train_loss": -28.12848472595215, "global_step": 572979, "epoch": 6903} {"train_loss": -28.312885284423828, "global_step": 572980, "epoch": 6903} {"train_loss": -28.041339874267578, "global_step": 572981, "epoch": 6903} {"train_loss": -27.57130241394043, "global_step": 572982, "epoch": 6903} {"train_loss": -27.8892765045166, "global_step": 572983, "epoch": 6903} {"train_loss": -27.964004516601562, "global_step": 572984, "epoch": 6903} {"train_loss": -28.036212921142578, "global_step": 572985, "epoch": 6903} {"train_loss": -28.1353816986084, "global_step": 572986, "epoch": 6903} {"train_loss": -27.799779891967773, "global_step": 572987, "epoch": 6903} {"train_loss": -28.297285079956055, "global_step": 572988, "epoch": 6903} {"train_loss": -28.073896408081055, "global_step": 572989, "epoch": 6903} {"train_loss": -28.177152633666992, "global_step": 572990, "epoch": 6903} {"train_loss": -28.08924674987793, "global_step": 572991, "epoch": 6903} {"train_loss": -28.178457260131836, "global_step": 572992, "epoch": 6903} {"train_loss": -27.661026000976562, "global_step": 572993, "epoch": 6903} {"train_loss": -27.673330307006836, "global_step": 572994, "epoch": 6903} {"train_loss": -28.177276611328125, "global_step": 572995, "epoch": 6903} {"train_loss": -27.900060653686523, "global_step": 572996, "epoch": 6903} {"train_loss": -28.267887115478516, "global_step": 572997, "epoch": 6903} {"train_loss": -27.867216110229492, "global_step": 572998, "epoch": 6903} {"train_loss": -27.437177658081055, "global_step": 572999, "epoch": 6903} {"train_loss": -28.094879150390625, "global_step": 573000, "epoch": 6903} {"train_loss": -27.629291534423828, "global_step": 573001, "epoch": 6903} {"train_loss": -27.634870529174805, "global_step": 573002, "epoch": 6903} {"train_loss": -27.584360122680664, "global_step": 573003, "epoch": 6903} {"train_loss": -28.063922882080078, "global_step": 573004, "epoch": 6903} {"train_loss": -27.839279174804688, "global_step": 573005, "epoch": 6903} {"train_loss": -27.44264030456543, "global_step": 573006, "epoch": 6903} {"train_loss": -28.2677059173584, "global_step": 573007, "epoch": 6903} {"train_loss": -27.880172729492188, "global_step": 573008, "epoch": 6903} {"train_loss": -28.173681259155273, "global_step": 573009, "epoch": 6903} {"train_loss": -28.17682456970215, "global_step": 573010, "epoch": 6903} {"train_loss": -27.869892120361328, "global_step": 573011, "epoch": 6903} {"train_loss": -27.4913330078125, "global_step": 573012, "epoch": 6903} {"train_loss": -27.529943466186523, "global_step": 573013, "epoch": 6903} {"train_loss": -27.7501220703125, "global_step": 573014, "epoch": 6903} {"train_loss": -27.853595733642578, "global_step": 573015, "epoch": 6903} {"train_loss": -28.023651123046875, "global_step": 573016, "epoch": 6903} {"train_loss": -27.579345703125, "global_step": 573017, "epoch": 6903} {"train_loss": -27.91004753112793, "global_step": 573018, "epoch": 6903} {"train_loss": -27.82403564453125, "global_step": 573019, "epoch": 6903} {"train_loss": -27.689895629882812, "global_step": 573020, "epoch": 6903} {"train_loss": -27.45659828186035, "global_step": 573021, "epoch": 6903} {"train_loss": -27.91387939453125, "global_step": 573022, "epoch": 6903} {"train_loss": -28.259260177612305, "global_step": 573023, "epoch": 6903} {"train_loss": -27.947866439819336, "global_step": 573024, "epoch": 6903} {"train_loss": -28.016759872436523, "global_step": 573025, "epoch": 6903} {"train_loss": -28.288511276245117, "global_step": 573026, "epoch": 6903} {"train_loss": -28.122709274291992, "global_step": 573027, "epoch": 6903} {"train_loss": -28.093753814697266, "global_step": 573028, "epoch": 6903} {"train_loss": -28.04188346862793, "global_step": 573029, "epoch": 6903} {"train_loss": -27.74200439453125, "global_step": 573030, "epoch": 6903} {"train_loss": -27.865656680371387, "global_step": 573031, "epoch": 6903, "val_loss": 6504658.0} {"train_loss": -27.20216178894043, "global_step": 573032, "epoch": 6904} {"train_loss": -26.814374923706055, "global_step": 573033, "epoch": 6904} {"train_loss": -27.1414852142334, "global_step": 573034, "epoch": 6904} {"train_loss": -26.414941787719727, "global_step": 573035, "epoch": 6904} {"train_loss": -27.794164657592773, "global_step": 573036, "epoch": 6904} {"train_loss": -26.452499389648438, "global_step": 573037, "epoch": 6904} {"train_loss": -27.973615646362305, "global_step": 573038, "epoch": 6904} {"train_loss": -26.895673751831055, "global_step": 573039, "epoch": 6904} {"train_loss": -27.551733016967773, "global_step": 573040, "epoch": 6904} {"train_loss": -27.501550674438477, "global_step": 573041, "epoch": 6904} {"train_loss": -27.68007469177246, "global_step": 573042, "epoch": 6904} {"train_loss": -27.613683700561523, "global_step": 573043, "epoch": 6904} {"train_loss": -27.6552734375, "global_step": 573044, "epoch": 6904} {"train_loss": -27.392841339111328, "global_step": 573045, "epoch": 6904} {"train_loss": -27.65431022644043, "global_step": 573046, "epoch": 6904} {"train_loss": -27.65105628967285, "global_step": 573047, "epoch": 6904} {"train_loss": -27.6944637298584, "global_step": 573048, "epoch": 6904} {"train_loss": -27.667444229125977, "global_step": 573049, "epoch": 6904} {"train_loss": -27.8686466217041, "global_step": 573050, "epoch": 6904} {"train_loss": -27.721464157104492, "global_step": 573051, "epoch": 6904} {"train_loss": -27.803083419799805, "global_step": 573052, "epoch": 6904} {"train_loss": -27.301721572875977, "global_step": 573053, "epoch": 6904} {"train_loss": -27.712865829467773, "global_step": 573054, "epoch": 6904} {"train_loss": -27.537519454956055, "global_step": 573055, "epoch": 6904} {"train_loss": -27.609073638916016, "global_step": 573056, "epoch": 6904} {"train_loss": -27.568883895874023, "global_step": 573057, "epoch": 6904} {"train_loss": -28.114215850830078, "global_step": 573058, "epoch": 6904} {"train_loss": -27.75081443786621, "global_step": 573059, "epoch": 6904} {"train_loss": -27.71613121032715, "global_step": 573060, "epoch": 6904} {"train_loss": -28.05708122253418, "global_step": 573061, "epoch": 6904} {"train_loss": -27.6741886138916, "global_step": 573062, "epoch": 6904} {"train_loss": -27.508148193359375, "global_step": 573063, "epoch": 6904} {"train_loss": -28.024770736694336, "global_step": 573064, "epoch": 6904} {"train_loss": -27.859832763671875, "global_step": 573065, "epoch": 6904} {"train_loss": -27.658170700073242, "global_step": 573066, "epoch": 6904} {"train_loss": -28.04813575744629, "global_step": 573067, "epoch": 6904} {"train_loss": -27.995361328125, "global_step": 573068, "epoch": 6904} {"train_loss": -27.953882217407227, "global_step": 573069, "epoch": 6904} {"train_loss": -27.969776153564453, "global_step": 573070, "epoch": 6904} {"train_loss": -27.557703018188477, "global_step": 573071, "epoch": 6904} {"train_loss": -28.020532608032227, "global_step": 573072, "epoch": 6904} {"train_loss": -27.996732711791992, "global_step": 573073, "epoch": 6904} {"train_loss": -27.75599479675293, "global_step": 573074, "epoch": 6904} {"train_loss": -27.745107650756836, "global_step": 573075, "epoch": 6904} {"train_loss": -27.599273681640625, "global_step": 573076, "epoch": 6904} {"train_loss": -27.399145126342773, "global_step": 573077, "epoch": 6904} {"train_loss": -27.00310707092285, "global_step": 573078, "epoch": 6904} {"train_loss": -27.235137939453125, "global_step": 573079, "epoch": 6904} {"train_loss": -27.618793487548828, "global_step": 573080, "epoch": 6904} {"train_loss": -27.749237060546875, "global_step": 573081, "epoch": 6904} {"train_loss": -27.215696334838867, "global_step": 573082, "epoch": 6904} {"train_loss": -27.3548526763916, "global_step": 573083, "epoch": 6904} {"train_loss": -27.7434024810791, "global_step": 573084, "epoch": 6904} {"train_loss": -27.796823501586914, "global_step": 573085, "epoch": 6904} {"train_loss": -27.8763370513916, "global_step": 573086, "epoch": 6904} {"train_loss": -27.5921688079834, "global_step": 573087, "epoch": 6904} {"train_loss": -27.88355827331543, "global_step": 573088, "epoch": 6904} {"train_loss": -27.699365615844727, "global_step": 573089, "epoch": 6904} {"train_loss": -28.0661678314209, "global_step": 573090, "epoch": 6904} {"train_loss": -27.710172653198242, "global_step": 573091, "epoch": 6904} {"train_loss": -27.639745712280273, "global_step": 573092, "epoch": 6904} {"train_loss": -27.6037654876709, "global_step": 573093, "epoch": 6904} {"train_loss": -27.628263473510742, "global_step": 573094, "epoch": 6904} {"train_loss": -27.38006019592285, "global_step": 573095, "epoch": 6904} {"train_loss": -26.937744140625, "global_step": 573096, "epoch": 6904} {"train_loss": -27.832584381103516, "global_step": 573097, "epoch": 6904} {"train_loss": -27.677478790283203, "global_step": 573098, "epoch": 6904} {"train_loss": -27.39287757873535, "global_step": 573099, "epoch": 6904} {"train_loss": -27.318326950073242, "global_step": 573100, "epoch": 6904} {"train_loss": -27.43494987487793, "global_step": 573101, "epoch": 6904} {"train_loss": -27.899717330932617, "global_step": 573102, "epoch": 6904} {"train_loss": -27.388870239257812, "global_step": 573103, "epoch": 6904} {"train_loss": -27.934192657470703, "global_step": 573104, "epoch": 6904} {"train_loss": -27.449066162109375, "global_step": 573105, "epoch": 6904} {"train_loss": -27.75166130065918, "global_step": 573106, "epoch": 6904} {"train_loss": -27.71735954284668, "global_step": 573107, "epoch": 6904} {"train_loss": -27.655725479125977, "global_step": 573108, "epoch": 6904} {"train_loss": -28.046838760375977, "global_step": 573109, "epoch": 6904} {"train_loss": -27.349079132080078, "global_step": 573110, "epoch": 6904} {"train_loss": -27.718963623046875, "global_step": 573111, "epoch": 6904} {"train_loss": -27.452590942382812, "global_step": 573112, "epoch": 6904} {"train_loss": -28.011310577392578, "global_step": 573113, "epoch": 6904} {"train_loss": -27.607772873108644, "global_step": 573114, "epoch": 6904, "val_loss": 6471375.5} {"train_loss": -27.621490478515625, "global_step": 573115, "epoch": 6905} {"train_loss": -27.339130401611328, "global_step": 573116, "epoch": 6905} {"train_loss": -27.22216796875, "global_step": 573117, "epoch": 6905} {"train_loss": -27.357751846313477, "global_step": 573118, "epoch": 6905} {"train_loss": -26.9958438873291, "global_step": 573119, "epoch": 6905} {"train_loss": -27.62092399597168, "global_step": 573120, "epoch": 6905} {"train_loss": -27.53281593322754, "global_step": 573121, "epoch": 6905} {"train_loss": -27.532835006713867, "global_step": 573122, "epoch": 6905} {"train_loss": -27.744367599487305, "global_step": 573123, "epoch": 6905} {"train_loss": -27.57177734375, "global_step": 573124, "epoch": 6905} {"train_loss": -27.608633041381836, "global_step": 573125, "epoch": 6905} {"train_loss": -27.297765731811523, "global_step": 573126, "epoch": 6905} {"train_loss": -27.58571434020996, "global_step": 573127, "epoch": 6905} {"train_loss": -27.790937423706055, "global_step": 573128, "epoch": 6905} {"train_loss": -27.748205184936523, "global_step": 573129, "epoch": 6905} {"train_loss": -27.759521484375, "global_step": 573130, "epoch": 6905} {"train_loss": -27.560443878173828, "global_step": 573131, "epoch": 6905} {"train_loss": -27.640668869018555, "global_step": 573132, "epoch": 6905} {"train_loss": -27.52130126953125, "global_step": 573133, "epoch": 6905} {"train_loss": -27.781381607055664, "global_step": 573134, "epoch": 6905} {"train_loss": -27.768415451049805, "global_step": 573135, "epoch": 6905} {"train_loss": -27.7523193359375, "global_step": 573136, "epoch": 6905} {"train_loss": -27.74081802368164, "global_step": 573137, "epoch": 6905} {"train_loss": -27.659259796142578, "global_step": 573138, "epoch": 6905} {"train_loss": -27.731887817382812, "global_step": 573139, "epoch": 6905} {"train_loss": -27.859210968017578, "global_step": 573140, "epoch": 6905} {"train_loss": -27.86360740661621, "global_step": 573141, "epoch": 6905} {"train_loss": -27.821533203125, "global_step": 573142, "epoch": 6905} {"train_loss": -27.99812889099121, "global_step": 573143, "epoch": 6905} {"train_loss": -27.911056518554688, "global_step": 573144, "epoch": 6905} {"train_loss": -27.88529396057129, "global_step": 573145, "epoch": 6905} {"train_loss": -28.047327041625977, "global_step": 573146, "epoch": 6905} {"train_loss": -27.81449317932129, "global_step": 573147, "epoch": 6905} {"train_loss": -28.069700241088867, "global_step": 573148, "epoch": 6905} {"train_loss": -28.35401725769043, "global_step": 573149, "epoch": 6905} {"train_loss": -28.245609283447266, "global_step": 573150, "epoch": 6905} {"train_loss": -27.641149520874023, "global_step": 573151, "epoch": 6905} {"train_loss": -28.13275718688965, "global_step": 573152, "epoch": 6905} {"train_loss": -27.694543838500977, "global_step": 573153, "epoch": 6905} {"train_loss": -28.28315544128418, "global_step": 573154, "epoch": 6905} {"train_loss": -27.831220626831055, "global_step": 573155, "epoch": 6905} {"train_loss": -27.954986572265625, "global_step": 573156, "epoch": 6905} {"train_loss": -28.00079345703125, "global_step": 573157, "epoch": 6905} {"train_loss": -27.655126571655273, "global_step": 573158, "epoch": 6905} {"train_loss": -27.752700805664062, "global_step": 573159, "epoch": 6905} {"train_loss": -27.524946212768555, "global_step": 573160, "epoch": 6905} {"train_loss": -27.819568634033203, "global_step": 573161, "epoch": 6905} {"train_loss": -28.112167358398438, "global_step": 573162, "epoch": 6905} {"train_loss": -27.708740234375, "global_step": 573163, "epoch": 6905} {"train_loss": -27.82465934753418, "global_step": 573164, "epoch": 6905} {"train_loss": -28.046100616455078, "global_step": 573165, "epoch": 6905} {"train_loss": -27.94097328186035, "global_step": 573166, "epoch": 6905} {"train_loss": -27.800174713134766, "global_step": 573167, "epoch": 6905} {"train_loss": -28.09889793395996, "global_step": 573168, "epoch": 6905} {"train_loss": -27.83454704284668, "global_step": 573169, "epoch": 6905} {"train_loss": -28.087141036987305, "global_step": 573170, "epoch": 6905} {"train_loss": -27.934778213500977, "global_step": 573171, "epoch": 6905} {"train_loss": -27.762487411499023, "global_step": 573172, "epoch": 6905} {"train_loss": -27.86700439453125, "global_step": 573173, "epoch": 6905} {"train_loss": -27.913333892822266, "global_step": 573174, "epoch": 6905} {"train_loss": -27.98540687561035, "global_step": 573175, "epoch": 6905} {"train_loss": -27.741931915283203, "global_step": 573176, "epoch": 6905} {"train_loss": -28.208486557006836, "global_step": 573177, "epoch": 6905} {"train_loss": -28.647611618041992, "global_step": 573178, "epoch": 6905} {"train_loss": -28.0128173828125, "global_step": 573179, "epoch": 6905} {"train_loss": -27.81121253967285, "global_step": 573180, "epoch": 6905} {"train_loss": -28.0076847076416, "global_step": 573181, "epoch": 6905} {"train_loss": -27.6075439453125, "global_step": 573182, "epoch": 6905} {"train_loss": -28.026803970336914, "global_step": 573183, "epoch": 6905} {"train_loss": -27.7331485748291, "global_step": 573184, "epoch": 6905} {"train_loss": -27.947406768798828, "global_step": 573185, "epoch": 6905} {"train_loss": -27.902484893798828, "global_step": 573186, "epoch": 6905} {"train_loss": -27.80141258239746, "global_step": 573187, "epoch": 6905} {"train_loss": -28.040205001831055, "global_step": 573188, "epoch": 6905} {"train_loss": -28.076446533203125, "global_step": 573189, "epoch": 6905} {"train_loss": -27.888837814331055, "global_step": 573190, "epoch": 6905} {"train_loss": -27.67474365234375, "global_step": 573191, "epoch": 6905} {"train_loss": -27.90302848815918, "global_step": 573192, "epoch": 6905} {"train_loss": -28.001422882080078, "global_step": 573193, "epoch": 6905} {"train_loss": -28.107763290405273, "global_step": 573194, "epoch": 6905} {"train_loss": -28.46795654296875, "global_step": 573195, "epoch": 6905} {"train_loss": -28.1539249420166, "global_step": 573196, "epoch": 6905} {"train_loss": -27.83364957786468, "global_step": 573197, "epoch": 6905, "val_loss": 6463846.0} {"train_loss": -27.619848251342773, "global_step": 573198, "epoch": 6906} {"train_loss": -27.091785430908203, "global_step": 573199, "epoch": 6906} {"train_loss": -26.251554489135742, "global_step": 573200, "epoch": 6906} {"train_loss": -26.40700340270996, "global_step": 573201, "epoch": 6906} {"train_loss": -27.10578727722168, "global_step": 573202, "epoch": 6906} {"train_loss": -26.83209228515625, "global_step": 573203, "epoch": 6906} {"train_loss": -27.2645320892334, "global_step": 573204, "epoch": 6906} {"train_loss": -26.5809326171875, "global_step": 573205, "epoch": 6906} {"train_loss": -26.94752311706543, "global_step": 573206, "epoch": 6906} {"train_loss": -27.07804298400879, "global_step": 573207, "epoch": 6906} {"train_loss": -26.452926635742188, "global_step": 573208, "epoch": 6906} {"train_loss": -27.13691520690918, "global_step": 573209, "epoch": 6906} {"train_loss": -27.016372680664062, "global_step": 573210, "epoch": 6906} {"train_loss": -27.31500816345215, "global_step": 573211, "epoch": 6906} {"train_loss": -27.303552627563477, "global_step": 573212, "epoch": 6906} {"train_loss": -27.797870635986328, "global_step": 573213, "epoch": 6906} {"train_loss": -27.810022354125977, "global_step": 573214, "epoch": 6906} {"train_loss": -27.448455810546875, "global_step": 573215, "epoch": 6906} {"train_loss": -27.118640899658203, "global_step": 573216, "epoch": 6906} {"train_loss": -26.86664390563965, "global_step": 573217, "epoch": 6906} {"train_loss": -27.651296615600586, "global_step": 573218, "epoch": 6906} {"train_loss": -27.595041275024414, "global_step": 573219, "epoch": 6906} {"train_loss": -27.251623153686523, "global_step": 573220, "epoch": 6906} {"train_loss": -27.580068588256836, "global_step": 573221, "epoch": 6906} {"train_loss": -27.459192276000977, "global_step": 573222, "epoch": 6906} {"train_loss": -27.413806915283203, "global_step": 573223, "epoch": 6906} {"train_loss": -27.538604736328125, "global_step": 573224, "epoch": 6906} {"train_loss": -27.201330184936523, "global_step": 573225, "epoch": 6906} {"train_loss": -27.862319946289062, "global_step": 573226, "epoch": 6906} {"train_loss": -27.591787338256836, "global_step": 573227, "epoch": 6906} {"train_loss": -28.090133666992188, "global_step": 573228, "epoch": 6906} {"train_loss": -27.640790939331055, "global_step": 573229, "epoch": 6906} {"train_loss": -27.552322387695312, "global_step": 573230, "epoch": 6906} {"train_loss": -27.629730224609375, "global_step": 573231, "epoch": 6906} {"train_loss": -27.737150192260742, "global_step": 573232, "epoch": 6906} {"train_loss": -27.915332794189453, "global_step": 573233, "epoch": 6906} {"train_loss": -27.913928985595703, "global_step": 573234, "epoch": 6906} {"train_loss": -27.703662872314453, "global_step": 573235, "epoch": 6906} {"train_loss": -28.06418800354004, "global_step": 573236, "epoch": 6906} {"train_loss": -27.3548641204834, "global_step": 573237, "epoch": 6906} {"train_loss": -27.918745040893555, "global_step": 573238, "epoch": 6906} {"train_loss": -27.918745040893555, "global_step": 573239, "epoch": 6906} {"train_loss": -27.831649780273438, "global_step": 573240, "epoch": 6906} {"train_loss": -28.11555290222168, "global_step": 573241, "epoch": 6906} {"train_loss": -27.592741012573242, "global_step": 573242, "epoch": 6906} {"train_loss": -27.7539005279541, "global_step": 573243, "epoch": 6906} {"train_loss": -28.11165428161621, "global_step": 573244, "epoch": 6906} {"train_loss": -27.6092586517334, "global_step": 573245, "epoch": 6906} {"train_loss": -28.034162521362305, "global_step": 573246, "epoch": 6906} {"train_loss": -27.873510360717773, "global_step": 573247, "epoch": 6906} {"train_loss": -28.253860473632812, "global_step": 573248, "epoch": 6906} {"train_loss": -28.22625732421875, "global_step": 573249, "epoch": 6906} {"train_loss": -28.1977481842041, "global_step": 573250, "epoch": 6906} {"train_loss": -27.551727294921875, "global_step": 573251, "epoch": 6906} {"train_loss": -28.059133529663086, "global_step": 573252, "epoch": 6906} {"train_loss": -27.88699722290039, "global_step": 573253, "epoch": 6906} {"train_loss": -27.754138946533203, "global_step": 573254, "epoch": 6906} {"train_loss": -28.254491806030273, "global_step": 573255, "epoch": 6906} {"train_loss": -27.947772979736328, "global_step": 573256, "epoch": 6906} {"train_loss": -28.145004272460938, "global_step": 573257, "epoch": 6906} {"train_loss": -27.691513061523438, "global_step": 573258, "epoch": 6906} {"train_loss": -28.006322860717773, "global_step": 573259, "epoch": 6906} {"train_loss": -28.109180450439453, "global_step": 573260, "epoch": 6906} {"train_loss": -28.031936645507812, "global_step": 573261, "epoch": 6906} {"train_loss": -28.17595863342285, "global_step": 573262, "epoch": 6906} {"train_loss": -28.009069442749023, "global_step": 573263, "epoch": 6906} {"train_loss": -27.762205123901367, "global_step": 573264, "epoch": 6906} {"train_loss": -28.070205688476562, "global_step": 573265, "epoch": 6906} {"train_loss": -28.074811935424805, "global_step": 573266, "epoch": 6906} {"train_loss": -27.655933380126953, "global_step": 573267, "epoch": 6906} {"train_loss": -27.695037841796875, "global_step": 573268, "epoch": 6906} {"train_loss": -28.088083267211914, "global_step": 573269, "epoch": 6906} {"train_loss": -27.76806640625, "global_step": 573270, "epoch": 6906} {"train_loss": -28.43048667907715, "global_step": 573271, "epoch": 6906} {"train_loss": -27.6896915435791, "global_step": 573272, "epoch": 6906} {"train_loss": -27.81427001953125, "global_step": 573273, "epoch": 6906} {"train_loss": -27.870513916015625, "global_step": 573274, "epoch": 6906} {"train_loss": -27.879901885986328, "global_step": 573275, "epoch": 6906} {"train_loss": -28.145353317260742, "global_step": 573276, "epoch": 6906} {"train_loss": -27.75347900390625, "global_step": 573277, "epoch": 6906} {"train_loss": -27.797651290893555, "global_step": 573278, "epoch": 6906} {"train_loss": -27.694570541381836, "global_step": 573279, "epoch": 6906} {"train_loss": -27.657864834888873, "global_step": 573280, "epoch": 6906, "val_loss": 6543049.0} {"train_loss": -27.219343185424805, "global_step": 573281, "epoch": 6907} {"train_loss": -26.401840209960938, "global_step": 573282, "epoch": 6907} {"train_loss": -26.80499267578125, "global_step": 573283, "epoch": 6907} {"train_loss": -26.915241241455078, "global_step": 573284, "epoch": 6907} {"train_loss": -27.359045028686523, "global_step": 573285, "epoch": 6907} {"train_loss": -27.26997184753418, "global_step": 573286, "epoch": 6907} {"train_loss": -26.984479904174805, "global_step": 573287, "epoch": 6907} {"train_loss": -27.352399826049805, "global_step": 573288, "epoch": 6907} {"train_loss": -27.89983558654785, "global_step": 573289, "epoch": 6907} {"train_loss": -27.428955078125, "global_step": 573290, "epoch": 6907} {"train_loss": -27.116796493530273, "global_step": 573291, "epoch": 6907} {"train_loss": -27.284351348876953, "global_step": 573292, "epoch": 6907} {"train_loss": -27.298954010009766, "global_step": 573293, "epoch": 6907} {"train_loss": -27.32510757446289, "global_step": 573294, "epoch": 6907} {"train_loss": -27.53968620300293, "global_step": 573295, "epoch": 6907} {"train_loss": -27.451770782470703, "global_step": 573296, "epoch": 6907} {"train_loss": -27.980056762695312, "global_step": 573297, "epoch": 6907} {"train_loss": -27.546600341796875, "global_step": 573298, "epoch": 6907} {"train_loss": -27.835102081298828, "global_step": 573299, "epoch": 6907} {"train_loss": -27.84115982055664, "global_step": 573300, "epoch": 6907} {"train_loss": -27.45953941345215, "global_step": 573301, "epoch": 6907} {"train_loss": -27.64837074279785, "global_step": 573302, "epoch": 6907} {"train_loss": -27.896804809570312, "global_step": 573303, "epoch": 6907} {"train_loss": -28.163471221923828, "global_step": 573304, "epoch": 6907} {"train_loss": -27.918537139892578, "global_step": 573305, "epoch": 6907} {"train_loss": -27.497339248657227, "global_step": 573306, "epoch": 6907} {"train_loss": -28.198505401611328, "global_step": 573307, "epoch": 6907} {"train_loss": -28.02389907836914, "global_step": 573308, "epoch": 6907} {"train_loss": -27.8880615234375, "global_step": 573309, "epoch": 6907} {"train_loss": -27.5983829498291, "global_step": 573310, "epoch": 6907} {"train_loss": -27.907474517822266, "global_step": 573311, "epoch": 6907} {"train_loss": -28.018295288085938, "global_step": 573312, "epoch": 6907} {"train_loss": -28.1010684967041, "global_step": 573313, "epoch": 6907} {"train_loss": -28.125986099243164, "global_step": 573314, "epoch": 6907} {"train_loss": -28.10102653503418, "global_step": 573315, "epoch": 6907} {"train_loss": -28.13580894470215, "global_step": 573316, "epoch": 6907} {"train_loss": -27.61824607849121, "global_step": 573317, "epoch": 6907} {"train_loss": -28.098804473876953, "global_step": 573318, "epoch": 6907} {"train_loss": -27.998676300048828, "global_step": 573319, "epoch": 6907} {"train_loss": -27.7690486907959, "global_step": 573320, "epoch": 6907} {"train_loss": -27.881195068359375, "global_step": 573321, "epoch": 6907} {"train_loss": -28.109222412109375, "global_step": 573322, "epoch": 6907} {"train_loss": -27.622541427612305, "global_step": 573323, "epoch": 6907} {"train_loss": -27.818267822265625, "global_step": 573324, "epoch": 6907} {"train_loss": -28.085615158081055, "global_step": 573325, "epoch": 6907} {"train_loss": -27.9888916015625, "global_step": 573326, "epoch": 6907} {"train_loss": -27.6686954498291, "global_step": 573327, "epoch": 6907} {"train_loss": -27.607421875, "global_step": 573328, "epoch": 6907} {"train_loss": -27.94049644470215, "global_step": 573329, "epoch": 6907} {"train_loss": -27.919275283813477, "global_step": 573330, "epoch": 6907} {"train_loss": -28.20765495300293, "global_step": 573331, "epoch": 6907} {"train_loss": -28.293691635131836, "global_step": 573332, "epoch": 6907} {"train_loss": -28.15106201171875, "global_step": 573333, "epoch": 6907} {"train_loss": -28.479394912719727, "global_step": 573334, "epoch": 6907} {"train_loss": -28.073877334594727, "global_step": 573335, "epoch": 6907} {"train_loss": -27.67850112915039, "global_step": 573336, "epoch": 6907} {"train_loss": -27.603174209594727, "global_step": 573337, "epoch": 6907} {"train_loss": -27.966428756713867, "global_step": 573338, "epoch": 6907} {"train_loss": -28.193836212158203, "global_step": 573339, "epoch": 6907} {"train_loss": -27.851428985595703, "global_step": 573340, "epoch": 6907} {"train_loss": -27.841888427734375, "global_step": 573341, "epoch": 6907} {"train_loss": -27.732702255249023, "global_step": 573342, "epoch": 6907} {"train_loss": -27.896215438842773, "global_step": 573343, "epoch": 6907} {"train_loss": -28.356861114501953, "global_step": 573344, "epoch": 6907} {"train_loss": -27.78022575378418, "global_step": 573345, "epoch": 6907} {"train_loss": -28.122222900390625, "global_step": 573346, "epoch": 6907} {"train_loss": -28.090412139892578, "global_step": 573347, "epoch": 6907} {"train_loss": -28.174951553344727, "global_step": 573348, "epoch": 6907} {"train_loss": -28.035287857055664, "global_step": 573349, "epoch": 6907} {"train_loss": -27.834442138671875, "global_step": 573350, "epoch": 6907} {"train_loss": -27.991947174072266, "global_step": 573351, "epoch": 6907} {"train_loss": -27.97263526916504, "global_step": 573352, "epoch": 6907} {"train_loss": -27.795806884765625, "global_step": 573353, "epoch": 6907} {"train_loss": -27.789798736572266, "global_step": 573354, "epoch": 6907} {"train_loss": -27.873645782470703, "global_step": 573355, "epoch": 6907} {"train_loss": -27.93635368347168, "global_step": 573356, "epoch": 6907} {"train_loss": -27.880781173706055, "global_step": 573357, "epoch": 6907} {"train_loss": -27.866525650024414, "global_step": 573358, "epoch": 6907} {"train_loss": -27.870641708374023, "global_step": 573359, "epoch": 6907} {"train_loss": -28.112226486206055, "global_step": 573360, "epoch": 6907} {"train_loss": -28.2066593170166, "global_step": 573361, "epoch": 6907} {"train_loss": -27.98776626586914, "global_step": 573362, "epoch": 6907} {"train_loss": -27.805825198989318, "global_step": 573363, "epoch": 6907, "val_loss": 6524118.0} {"train_loss": -27.63985252380371, "global_step": 573364, "epoch": 6908} {"train_loss": -27.6218204498291, "global_step": 573365, "epoch": 6908} {"train_loss": -27.864425659179688, "global_step": 573366, "epoch": 6908} {"train_loss": -27.745962142944336, "global_step": 573367, "epoch": 6908} {"train_loss": -27.774250030517578, "global_step": 573368, "epoch": 6908} {"train_loss": -27.508230209350586, "global_step": 573369, "epoch": 6908} {"train_loss": -27.366552352905273, "global_step": 573370, "epoch": 6908} {"train_loss": -27.333860397338867, "global_step": 573371, "epoch": 6908} {"train_loss": -27.763946533203125, "global_step": 573372, "epoch": 6908} {"train_loss": -27.269617080688477, "global_step": 573373, "epoch": 6908} {"train_loss": -27.637256622314453, "global_step": 573374, "epoch": 6908} {"train_loss": -28.188852310180664, "global_step": 573375, "epoch": 6908} {"train_loss": -27.820526123046875, "global_step": 573376, "epoch": 6908} {"train_loss": -27.39383888244629, "global_step": 573377, "epoch": 6908} {"train_loss": -27.763437271118164, "global_step": 573378, "epoch": 6908} {"train_loss": -27.34610366821289, "global_step": 573379, "epoch": 6908} {"train_loss": -27.7006893157959, "global_step": 573380, "epoch": 6908} {"train_loss": -27.86480140686035, "global_step": 573381, "epoch": 6908} {"train_loss": -27.623432159423828, "global_step": 573382, "epoch": 6908} {"train_loss": -28.003583908081055, "global_step": 573383, "epoch": 6908} {"train_loss": -27.680139541625977, "global_step": 573384, "epoch": 6908} {"train_loss": -27.954797744750977, "global_step": 573385, "epoch": 6908} {"train_loss": -27.59406852722168, "global_step": 573386, "epoch": 6908} {"train_loss": -27.78114891052246, "global_step": 573387, "epoch": 6908} {"train_loss": -27.796003341674805, "global_step": 573388, "epoch": 6908} {"train_loss": -27.64926528930664, "global_step": 573389, "epoch": 6908} {"train_loss": -27.873350143432617, "global_step": 573390, "epoch": 6908} {"train_loss": -27.651798248291016, "global_step": 573391, "epoch": 6908} {"train_loss": -27.97113037109375, "global_step": 573392, "epoch": 6908} {"train_loss": -27.67933464050293, "global_step": 573393, "epoch": 6908} {"train_loss": -27.882978439331055, "global_step": 573394, "epoch": 6908} {"train_loss": -27.416187286376953, "global_step": 573395, "epoch": 6908} {"train_loss": -28.33893394470215, "global_step": 573396, "epoch": 6908} {"train_loss": -27.944629669189453, "global_step": 573397, "epoch": 6908} {"train_loss": -28.09711265563965, "global_step": 573398, "epoch": 6908} {"train_loss": -28.2095947265625, "global_step": 573399, "epoch": 6908} {"train_loss": -27.818906784057617, "global_step": 573400, "epoch": 6908} {"train_loss": -27.736921310424805, "global_step": 573401, "epoch": 6908} {"train_loss": -27.910446166992188, "global_step": 573402, "epoch": 6908} {"train_loss": -27.799026489257812, "global_step": 573403, "epoch": 6908} {"train_loss": -28.299915313720703, "global_step": 573404, "epoch": 6908} {"train_loss": -27.813858032226562, "global_step": 573405, "epoch": 6908} {"train_loss": -28.25979995727539, "global_step": 573406, "epoch": 6908} {"train_loss": -28.22846794128418, "global_step": 573407, "epoch": 6908} {"train_loss": -28.01438331604004, "global_step": 573408, "epoch": 6908} {"train_loss": -28.088769912719727, "global_step": 573409, "epoch": 6908} {"train_loss": -27.94965171813965, "global_step": 573410, "epoch": 6908} {"train_loss": -28.10041618347168, "global_step": 573411, "epoch": 6908} {"train_loss": -28.1669921875, "global_step": 573412, "epoch": 6908} {"train_loss": -27.916828155517578, "global_step": 573413, "epoch": 6908} {"train_loss": -27.9731388092041, "global_step": 573414, "epoch": 6908} {"train_loss": -28.12232780456543, "global_step": 573415, "epoch": 6908} {"train_loss": -27.72235107421875, "global_step": 573416, "epoch": 6908} {"train_loss": -27.9890079498291, "global_step": 573417, "epoch": 6908} {"train_loss": -27.89088249206543, "global_step": 573418, "epoch": 6908} {"train_loss": -28.071674346923828, "global_step": 573419, "epoch": 6908} {"train_loss": -27.88355827331543, "global_step": 573420, "epoch": 6908} {"train_loss": -28.012842178344727, "global_step": 573421, "epoch": 6908} {"train_loss": -28.1092586517334, "global_step": 573422, "epoch": 6908} {"train_loss": -27.8646183013916, "global_step": 573423, "epoch": 6908} {"train_loss": -28.0130672454834, "global_step": 573424, "epoch": 6908} {"train_loss": -27.832815170288086, "global_step": 573425, "epoch": 6908} {"train_loss": -28.249420166015625, "global_step": 573426, "epoch": 6908} {"train_loss": -27.839075088500977, "global_step": 573427, "epoch": 6908} {"train_loss": -27.64240074157715, "global_step": 573428, "epoch": 6908} {"train_loss": -27.333410263061523, "global_step": 573429, "epoch": 6908} {"train_loss": -27.631439208984375, "global_step": 573430, "epoch": 6908} {"train_loss": -28.175153732299805, "global_step": 573431, "epoch": 6908} {"train_loss": -27.846845626831055, "global_step": 573432, "epoch": 6908} {"train_loss": -27.532123565673828, "global_step": 573433, "epoch": 6908} {"train_loss": -27.608118057250977, "global_step": 573434, "epoch": 6908} {"train_loss": -27.745267868041992, "global_step": 573435, "epoch": 6908} {"train_loss": -28.065778732299805, "global_step": 573436, "epoch": 6908} {"train_loss": -27.991941452026367, "global_step": 573437, "epoch": 6908} {"train_loss": -27.66597557067871, "global_step": 573438, "epoch": 6908} {"train_loss": -27.828466415405273, "global_step": 573439, "epoch": 6908} {"train_loss": -28.09982681274414, "global_step": 573440, "epoch": 6908} {"train_loss": -28.168054580688477, "global_step": 573441, "epoch": 6908} {"train_loss": -28.34559440612793, "global_step": 573442, "epoch": 6908} {"train_loss": -28.1434383392334, "global_step": 573443, "epoch": 6908} {"train_loss": -27.694223403930664, "global_step": 573444, "epoch": 6908} {"train_loss": -27.74617576599121, "global_step": 573445, "epoch": 6908} {"train_loss": -27.858519979270106, "global_step": 573446, "epoch": 6908, "val_loss": 6421030.0} {"train_loss": -26.55231285095215, "global_step": 573447, "epoch": 6909} {"train_loss": -25.088438034057617, "global_step": 573448, "epoch": 6909} {"train_loss": -26.021930694580078, "global_step": 573449, "epoch": 6909} {"train_loss": -26.178070068359375, "global_step": 573450, "epoch": 6909} {"train_loss": -26.322845458984375, "global_step": 573451, "epoch": 6909} {"train_loss": -25.817712783813477, "global_step": 573452, "epoch": 6909} {"train_loss": -27.164464950561523, "global_step": 573453, "epoch": 6909} {"train_loss": -26.870864868164062, "global_step": 573454, "epoch": 6909} {"train_loss": -26.867218017578125, "global_step": 573455, "epoch": 6909} {"train_loss": -26.9800968170166, "global_step": 573456, "epoch": 6909} {"train_loss": -27.029333114624023, "global_step": 573457, "epoch": 6909} {"train_loss": -26.5850772857666, "global_step": 573458, "epoch": 6909} {"train_loss": -26.911096572875977, "global_step": 573459, "epoch": 6909} {"train_loss": -27.192651748657227, "global_step": 573460, "epoch": 6909} {"train_loss": -27.02252197265625, "global_step": 573461, "epoch": 6909} {"train_loss": -27.215845108032227, "global_step": 573462, "epoch": 6909} {"train_loss": -27.282941818237305, "global_step": 573463, "epoch": 6909} {"train_loss": -27.452301025390625, "global_step": 573464, "epoch": 6909} {"train_loss": -27.1582088470459, "global_step": 573465, "epoch": 6909} {"train_loss": -27.246139526367188, "global_step": 573466, "epoch": 6909} {"train_loss": -27.421152114868164, "global_step": 573467, "epoch": 6909} {"train_loss": -27.437971115112305, "global_step": 573468, "epoch": 6909} {"train_loss": -27.25270652770996, "global_step": 573469, "epoch": 6909} {"train_loss": -27.59931755065918, "global_step": 573470, "epoch": 6909} {"train_loss": -27.29121208190918, "global_step": 573471, "epoch": 6909} {"train_loss": -27.418378829956055, "global_step": 573472, "epoch": 6909} {"train_loss": -27.593488693237305, "global_step": 573473, "epoch": 6909} {"train_loss": -27.370141983032227, "global_step": 573474, "epoch": 6909} {"train_loss": -27.421035766601562, "global_step": 573475, "epoch": 6909} {"train_loss": -27.499540328979492, "global_step": 573476, "epoch": 6909} {"train_loss": -27.733905792236328, "global_step": 573477, "epoch": 6909} {"train_loss": -27.73384666442871, "global_step": 573478, "epoch": 6909} {"train_loss": -27.743408203125, "global_step": 573479, "epoch": 6909} {"train_loss": -27.522104263305664, "global_step": 573480, "epoch": 6909} {"train_loss": -27.801733016967773, "global_step": 573481, "epoch": 6909} {"train_loss": -27.69795799255371, "global_step": 573482, "epoch": 6909} {"train_loss": -27.84004020690918, "global_step": 573483, "epoch": 6909} {"train_loss": -28.36041831970215, "global_step": 573484, "epoch": 6909} {"train_loss": -27.95625877380371, "global_step": 573485, "epoch": 6909} {"train_loss": -27.680606842041016, "global_step": 573486, "epoch": 6909} {"train_loss": -27.754779815673828, "global_step": 573487, "epoch": 6909} {"train_loss": -27.789535522460938, "global_step": 573488, "epoch": 6909} {"train_loss": -27.991636276245117, "global_step": 573489, "epoch": 6909} {"train_loss": -28.275854110717773, "global_step": 573490, "epoch": 6909} {"train_loss": -28.138031005859375, "global_step": 573491, "epoch": 6909} {"train_loss": -27.55875015258789, "global_step": 573492, "epoch": 6909} {"train_loss": -27.966888427734375, "global_step": 573493, "epoch": 6909} {"train_loss": -27.86978530883789, "global_step": 573494, "epoch": 6909} {"train_loss": -27.814313888549805, "global_step": 573495, "epoch": 6909} {"train_loss": -27.831205368041992, "global_step": 573496, "epoch": 6909} {"train_loss": -27.80872917175293, "global_step": 573497, "epoch": 6909} {"train_loss": -28.18914794921875, "global_step": 573498, "epoch": 6909} {"train_loss": -27.763015747070312, "global_step": 573499, "epoch": 6909} {"train_loss": -27.680709838867188, "global_step": 573500, "epoch": 6909} {"train_loss": -28.04263687133789, "global_step": 573501, "epoch": 6909} {"train_loss": -27.784992218017578, "global_step": 573502, "epoch": 6909} {"train_loss": -28.08772850036621, "global_step": 573503, "epoch": 6909} {"train_loss": -28.372644424438477, "global_step": 573504, "epoch": 6909} {"train_loss": -28.0551815032959, "global_step": 573505, "epoch": 6909} {"train_loss": -28.066333770751953, "global_step": 573506, "epoch": 6909} {"train_loss": -27.749958038330078, "global_step": 573507, "epoch": 6909} {"train_loss": -28.361011505126953, "global_step": 573508, "epoch": 6909} {"train_loss": -28.16303062438965, "global_step": 573509, "epoch": 6909} {"train_loss": -27.867719650268555, "global_step": 573510, "epoch": 6909} {"train_loss": -27.809743881225586, "global_step": 573511, "epoch": 6909} {"train_loss": -28.23981285095215, "global_step": 573512, "epoch": 6909} {"train_loss": -28.076391220092773, "global_step": 573513, "epoch": 6909} {"train_loss": -28.235431671142578, "global_step": 573514, "epoch": 6909} {"train_loss": -27.932418823242188, "global_step": 573515, "epoch": 6909} {"train_loss": -28.204864501953125, "global_step": 573516, "epoch": 6909} {"train_loss": -28.12704849243164, "global_step": 573517, "epoch": 6909} {"train_loss": -27.924041748046875, "global_step": 573518, "epoch": 6909} {"train_loss": -27.797494888305664, "global_step": 573519, "epoch": 6909} {"train_loss": -27.386642456054688, "global_step": 573520, "epoch": 6909} {"train_loss": -27.250518798828125, "global_step": 573521, "epoch": 6909} {"train_loss": -26.410409927368164, "global_step": 573522, "epoch": 6909} {"train_loss": -27.015716552734375, "global_step": 573523, "epoch": 6909} {"train_loss": -27.864301681518555, "global_step": 573524, "epoch": 6909} {"train_loss": -27.399255752563477, "global_step": 573525, "epoch": 6909} {"train_loss": -27.18613052368164, "global_step": 573526, "epoch": 6909} {"train_loss": -27.287933349609375, "global_step": 573527, "epoch": 6909} {"train_loss": -26.873931884765625, "global_step": 573528, "epoch": 6909} {"train_loss": -27.502102334815337, "global_step": 573529, "epoch": 6909, "val_loss": 6513109.5} {"train_loss": -25.352863311767578, "global_step": 573530, "epoch": 6910} {"train_loss": -26.15848731994629, "global_step": 573531, "epoch": 6910} {"train_loss": -25.375532150268555, "global_step": 573532, "epoch": 6910} {"train_loss": -25.971189498901367, "global_step": 573533, "epoch": 6910} {"train_loss": -26.489591598510742, "global_step": 573534, "epoch": 6910} {"train_loss": -26.408552169799805, "global_step": 573535, "epoch": 6910} {"train_loss": -26.3927059173584, "global_step": 573536, "epoch": 6910} {"train_loss": -26.880422592163086, "global_step": 573537, "epoch": 6910} {"train_loss": -26.66046714782715, "global_step": 573538, "epoch": 6910} {"train_loss": -26.914813995361328, "global_step": 573539, "epoch": 6910} {"train_loss": -26.729694366455078, "global_step": 573540, "epoch": 6910} {"train_loss": -26.8572998046875, "global_step": 573541, "epoch": 6910} {"train_loss": -26.814977645874023, "global_step": 573542, "epoch": 6910} {"train_loss": -26.947797775268555, "global_step": 573543, "epoch": 6910} {"train_loss": -26.8416805267334, "global_step": 573544, "epoch": 6910} {"train_loss": -27.425247192382812, "global_step": 573545, "epoch": 6910} {"train_loss": -27.185138702392578, "global_step": 573546, "epoch": 6910} {"train_loss": -26.855915069580078, "global_step": 573547, "epoch": 6910} {"train_loss": -27.122900009155273, "global_step": 573548, "epoch": 6910} {"train_loss": -27.410058975219727, "global_step": 573549, "epoch": 6910} {"train_loss": -27.377883911132812, "global_step": 573550, "epoch": 6910} {"train_loss": -27.441205978393555, "global_step": 573551, "epoch": 6910} {"train_loss": -27.230640411376953, "global_step": 573552, "epoch": 6910} {"train_loss": -27.67225456237793, "global_step": 573553, "epoch": 6910} {"train_loss": -27.597341537475586, "global_step": 573554, "epoch": 6910} {"train_loss": -27.55958366394043, "global_step": 573555, "epoch": 6910} {"train_loss": -27.20015525817871, "global_step": 573556, "epoch": 6910} {"train_loss": -27.522626876831055, "global_step": 573557, "epoch": 6910} {"train_loss": -27.463171005249023, "global_step": 573558, "epoch": 6910} {"train_loss": -27.610687255859375, "global_step": 573559, "epoch": 6910} {"train_loss": -27.877668380737305, "global_step": 573560, "epoch": 6910} {"train_loss": -27.55047607421875, "global_step": 573561, "epoch": 6910} {"train_loss": -27.540685653686523, "global_step": 573562, "epoch": 6910} {"train_loss": -27.3848876953125, "global_step": 573563, "epoch": 6910} {"train_loss": -27.806066513061523, "global_step": 573564, "epoch": 6910} {"train_loss": -27.782135009765625, "global_step": 573565, "epoch": 6910} {"train_loss": -27.694610595703125, "global_step": 573566, "epoch": 6910} {"train_loss": -27.55501365661621, "global_step": 573567, "epoch": 6910} {"train_loss": -27.858301162719727, "global_step": 573568, "epoch": 6910} {"train_loss": -27.7446346282959, "global_step": 573569, "epoch": 6910} {"train_loss": -27.97039794921875, "global_step": 573570, "epoch": 6910} {"train_loss": -27.90308952331543, "global_step": 573571, "epoch": 6910} {"train_loss": -27.61212158203125, "global_step": 573572, "epoch": 6910} {"train_loss": -27.773773193359375, "global_step": 573573, "epoch": 6910} {"train_loss": -27.69019889831543, "global_step": 573574, "epoch": 6910} {"train_loss": -27.760181427001953, "global_step": 573575, "epoch": 6910} {"train_loss": -27.553430557250977, "global_step": 573576, "epoch": 6910} {"train_loss": -27.892072677612305, "global_step": 573577, "epoch": 6910} {"train_loss": -27.58673667907715, "global_step": 573578, "epoch": 6910} {"train_loss": -27.33890151977539, "global_step": 573579, "epoch": 6910} {"train_loss": -27.635950088500977, "global_step": 573580, "epoch": 6910} {"train_loss": -27.675024032592773, "global_step": 573581, "epoch": 6910} {"train_loss": -27.495161056518555, "global_step": 573582, "epoch": 6910} {"train_loss": -27.415189743041992, "global_step": 573583, "epoch": 6910} {"train_loss": -27.96870231628418, "global_step": 573584, "epoch": 6910} {"train_loss": -27.58062171936035, "global_step": 573585, "epoch": 6910} {"train_loss": -27.87529945373535, "global_step": 573586, "epoch": 6910} {"train_loss": -27.6220760345459, "global_step": 573587, "epoch": 6910} {"train_loss": -28.04816246032715, "global_step": 573588, "epoch": 6910} {"train_loss": -27.7281494140625, "global_step": 573589, "epoch": 6910} {"train_loss": -27.6616268157959, "global_step": 573590, "epoch": 6910} {"train_loss": -27.58823013305664, "global_step": 573591, "epoch": 6910} {"train_loss": -27.52016258239746, "global_step": 573592, "epoch": 6910} {"train_loss": -27.83162498474121, "global_step": 573593, "epoch": 6910} {"train_loss": -27.706342697143555, "global_step": 573594, "epoch": 6910} {"train_loss": -27.580839157104492, "global_step": 573595, "epoch": 6910} {"train_loss": -27.561166763305664, "global_step": 573596, "epoch": 6910} {"train_loss": -28.007238388061523, "global_step": 573597, "epoch": 6910} {"train_loss": -27.580322265625, "global_step": 573598, "epoch": 6910} {"train_loss": -27.653043746948242, "global_step": 573599, "epoch": 6910} {"train_loss": -27.540700912475586, "global_step": 573600, "epoch": 6910} {"train_loss": -27.5945987701416, "global_step": 573601, "epoch": 6910} {"train_loss": -27.58489418029785, "global_step": 573602, "epoch": 6910} {"train_loss": -27.523700714111328, "global_step": 573603, "epoch": 6910} {"train_loss": -27.828784942626953, "global_step": 573604, "epoch": 6910} {"train_loss": -27.281457901000977, "global_step": 573605, "epoch": 6910} {"train_loss": -27.65447425842285, "global_step": 573606, "epoch": 6910} {"train_loss": -27.640380859375, "global_step": 573607, "epoch": 6910} {"train_loss": -27.481403350830078, "global_step": 573608, "epoch": 6910} {"train_loss": -27.881336212158203, "global_step": 573609, "epoch": 6910} {"train_loss": -27.822555541992188, "global_step": 573610, "epoch": 6910} {"train_loss": -27.92510414123535, "global_step": 573611, "epoch": 6910} {"train_loss": -27.42114949513631, "global_step": 573612, "epoch": 6910, "val_loss": 6468857.5} {"train_loss": -26.963483810424805, "global_step": 573613, "epoch": 6911} {"train_loss": -26.482608795166016, "global_step": 573614, "epoch": 6911} {"train_loss": -27.156885147094727, "global_step": 573615, "epoch": 6911} {"train_loss": -27.315916061401367, "global_step": 573616, "epoch": 6911} {"train_loss": -27.221357345581055, "global_step": 573617, "epoch": 6911} {"train_loss": -27.046545028686523, "global_step": 573618, "epoch": 6911} {"train_loss": -27.158710479736328, "global_step": 573619, "epoch": 6911} {"train_loss": -27.129383087158203, "global_step": 573620, "epoch": 6911} {"train_loss": -27.523059844970703, "global_step": 573621, "epoch": 6911} {"train_loss": -27.550582885742188, "global_step": 573622, "epoch": 6911} {"train_loss": -27.49383544921875, "global_step": 573623, "epoch": 6911} {"train_loss": -27.22651481628418, "global_step": 573624, "epoch": 6911} {"train_loss": -27.454965591430664, "global_step": 573625, "epoch": 6911} {"train_loss": -27.541522979736328, "global_step": 573626, "epoch": 6911} {"train_loss": -27.43942642211914, "global_step": 573627, "epoch": 6911} {"train_loss": -27.389434814453125, "global_step": 573628, "epoch": 6911} {"train_loss": -27.9918155670166, "global_step": 573629, "epoch": 6911} {"train_loss": -27.519001007080078, "global_step": 573630, "epoch": 6911} {"train_loss": -27.892093658447266, "global_step": 573631, "epoch": 6911} {"train_loss": -27.727005004882812, "global_step": 573632, "epoch": 6911} {"train_loss": -27.558059692382812, "global_step": 573633, "epoch": 6911} {"train_loss": -27.99662208557129, "global_step": 573634, "epoch": 6911} {"train_loss": -28.102025985717773, "global_step": 573635, "epoch": 6911} {"train_loss": -27.994277954101562, "global_step": 573636, "epoch": 6911} {"train_loss": -28.122760772705078, "global_step": 573637, "epoch": 6911} {"train_loss": -27.54215431213379, "global_step": 573638, "epoch": 6911} {"train_loss": -27.954669952392578, "global_step": 573639, "epoch": 6911} {"train_loss": -28.018436431884766, "global_step": 573640, "epoch": 6911} {"train_loss": -27.555530548095703, "global_step": 573641, "epoch": 6911} {"train_loss": -27.6700382232666, "global_step": 573642, "epoch": 6911} {"train_loss": -28.114233016967773, "global_step": 573643, "epoch": 6911} {"train_loss": -27.74261474609375, "global_step": 573644, "epoch": 6911} {"train_loss": -27.8073787689209, "global_step": 573645, "epoch": 6911} {"train_loss": -27.645465850830078, "global_step": 573646, "epoch": 6911} {"train_loss": -28.009191513061523, "global_step": 573647, "epoch": 6911} {"train_loss": -28.004331588745117, "global_step": 573648, "epoch": 6911} {"train_loss": -28.009607315063477, "global_step": 573649, "epoch": 6911} {"train_loss": -27.91802978515625, "global_step": 573650, "epoch": 6911} {"train_loss": -27.830642700195312, "global_step": 573651, "epoch": 6911} {"train_loss": -27.92817497253418, "global_step": 573652, "epoch": 6911} {"train_loss": -27.951435089111328, "global_step": 573653, "epoch": 6911} {"train_loss": -28.06789207458496, "global_step": 573654, "epoch": 6911} {"train_loss": -27.96608543395996, "global_step": 573655, "epoch": 6911} {"train_loss": -27.900548934936523, "global_step": 573656, "epoch": 6911} {"train_loss": -27.53460121154785, "global_step": 573657, "epoch": 6911} {"train_loss": -27.60980796813965, "global_step": 573658, "epoch": 6911} {"train_loss": -28.003015518188477, "global_step": 573659, "epoch": 6911} {"train_loss": -27.793170928955078, "global_step": 573660, "epoch": 6911} {"train_loss": -27.964197158813477, "global_step": 573661, "epoch": 6911} {"train_loss": -27.386877059936523, "global_step": 573662, "epoch": 6911} {"train_loss": -27.64027214050293, "global_step": 573663, "epoch": 6911} {"train_loss": -28.03340721130371, "global_step": 573664, "epoch": 6911} {"train_loss": -28.198598861694336, "global_step": 573665, "epoch": 6911} {"train_loss": -28.024139404296875, "global_step": 573666, "epoch": 6911} {"train_loss": -28.14653968811035, "global_step": 573667, "epoch": 6911} {"train_loss": -27.85894203186035, "global_step": 573668, "epoch": 6911} {"train_loss": -28.01438331604004, "global_step": 573669, "epoch": 6911} {"train_loss": -28.384992599487305, "global_step": 573670, "epoch": 6911} {"train_loss": -27.989181518554688, "global_step": 573671, "epoch": 6911} {"train_loss": -27.762939453125, "global_step": 573672, "epoch": 6911} {"train_loss": -27.50275230407715, "global_step": 573673, "epoch": 6911} {"train_loss": -27.70356559753418, "global_step": 573674, "epoch": 6911} {"train_loss": -28.057632446289062, "global_step": 573675, "epoch": 6911} {"train_loss": -27.947834014892578, "global_step": 573676, "epoch": 6911} {"train_loss": -27.824787139892578, "global_step": 573677, "epoch": 6911} {"train_loss": -27.68277931213379, "global_step": 573678, "epoch": 6911} {"train_loss": -27.820653915405273, "global_step": 573679, "epoch": 6911} {"train_loss": -28.01287269592285, "global_step": 573680, "epoch": 6911} {"train_loss": -27.60941505432129, "global_step": 573681, "epoch": 6911} {"train_loss": -27.777875900268555, "global_step": 573682, "epoch": 6911} {"train_loss": -27.80108070373535, "global_step": 573683, "epoch": 6911} {"train_loss": -27.698278427124023, "global_step": 573684, "epoch": 6911} {"train_loss": -27.663497924804688, "global_step": 573685, "epoch": 6911} {"train_loss": -28.129871368408203, "global_step": 573686, "epoch": 6911} {"train_loss": -27.93916130065918, "global_step": 573687, "epoch": 6911} {"train_loss": -27.465940475463867, "global_step": 573688, "epoch": 6911} {"train_loss": -27.490863800048828, "global_step": 573689, "epoch": 6911} {"train_loss": -26.200780868530273, "global_step": 573690, "epoch": 6911} {"train_loss": -26.67194175720215, "global_step": 573691, "epoch": 6911} {"train_loss": -27.74359130859375, "global_step": 573692, "epoch": 6911} {"train_loss": -27.57097816467285, "global_step": 573693, "epoch": 6911} {"train_loss": -27.221820831298828, "global_step": 573694, "epoch": 6911} {"train_loss": -27.677229272313866, "global_step": 573695, "epoch": 6911, "val_loss": 6473661.0} {"train_loss": -26.802661895751953, "global_step": 573696, "epoch": 6912} {"train_loss": -26.220251083374023, "global_step": 573697, "epoch": 6912} {"train_loss": -27.323606491088867, "global_step": 573698, "epoch": 6912} {"train_loss": -26.4633846282959, "global_step": 573699, "epoch": 6912} {"train_loss": -26.86896324157715, "global_step": 573700, "epoch": 6912} {"train_loss": -26.813135147094727, "global_step": 573701, "epoch": 6912} {"train_loss": -27.207578659057617, "global_step": 573702, "epoch": 6912} {"train_loss": -26.787405014038086, "global_step": 573703, "epoch": 6912} {"train_loss": -27.070581436157227, "global_step": 573704, "epoch": 6912} {"train_loss": -27.34539794921875, "global_step": 573705, "epoch": 6912} {"train_loss": -27.082138061523438, "global_step": 573706, "epoch": 6912} {"train_loss": -27.768909454345703, "global_step": 573707, "epoch": 6912} {"train_loss": -27.2064208984375, "global_step": 573708, "epoch": 6912} {"train_loss": -27.333908081054688, "global_step": 573709, "epoch": 6912} {"train_loss": -27.530920028686523, "global_step": 573710, "epoch": 6912} {"train_loss": -27.28608512878418, "global_step": 573711, "epoch": 6912} {"train_loss": -27.277124404907227, "global_step": 573712, "epoch": 6912} {"train_loss": -27.56463050842285, "global_step": 573713, "epoch": 6912} {"train_loss": -27.497806549072266, "global_step": 573714, "epoch": 6912} {"train_loss": -27.47800636291504, "global_step": 573715, "epoch": 6912} {"train_loss": -27.361352920532227, "global_step": 573716, "epoch": 6912} {"train_loss": -27.338769912719727, "global_step": 573717, "epoch": 6912} {"train_loss": -27.535572052001953, "global_step": 573718, "epoch": 6912} {"train_loss": -27.674091339111328, "global_step": 573719, "epoch": 6912} {"train_loss": -27.992843627929688, "global_step": 573720, "epoch": 6912} {"train_loss": -27.683837890625, "global_step": 573721, "epoch": 6912} {"train_loss": -27.663742065429688, "global_step": 573722, "epoch": 6912} {"train_loss": -27.95600700378418, "global_step": 573723, "epoch": 6912} {"train_loss": -27.363805770874023, "global_step": 573724, "epoch": 6912} {"train_loss": -27.9040584564209, "global_step": 573725, "epoch": 6912} {"train_loss": -27.984155654907227, "global_step": 573726, "epoch": 6912} {"train_loss": -27.74346351623535, "global_step": 573727, "epoch": 6912} {"train_loss": -27.676931381225586, "global_step": 573728, "epoch": 6912} {"train_loss": -27.66082763671875, "global_step": 573729, "epoch": 6912} {"train_loss": -27.658960342407227, "global_step": 573730, "epoch": 6912} {"train_loss": -27.83677101135254, "global_step": 573731, "epoch": 6912} {"train_loss": -28.07927894592285, "global_step": 573732, "epoch": 6912} {"train_loss": -27.91733741760254, "global_step": 573733, "epoch": 6912} {"train_loss": -27.90410804748535, "global_step": 573734, "epoch": 6912} {"train_loss": -27.73713493347168, "global_step": 573735, "epoch": 6912} {"train_loss": -27.678007125854492, "global_step": 573736, "epoch": 6912} {"train_loss": -28.002119064331055, "global_step": 573737, "epoch": 6912} {"train_loss": -27.66693115234375, "global_step": 573738, "epoch": 6912} {"train_loss": -27.982181549072266, "global_step": 573739, "epoch": 6912} {"train_loss": -28.193756103515625, "global_step": 573740, "epoch": 6912} {"train_loss": -27.75, "global_step": 573741, "epoch": 6912} {"train_loss": -27.664386749267578, "global_step": 573742, "epoch": 6912} {"train_loss": -28.0541934967041, "global_step": 573743, "epoch": 6912} {"train_loss": -28.235137939453125, "global_step": 573744, "epoch": 6912} {"train_loss": -27.7415714263916, "global_step": 573745, "epoch": 6912} {"train_loss": -27.423328399658203, "global_step": 573746, "epoch": 6912} {"train_loss": -27.32322120666504, "global_step": 573747, "epoch": 6912} {"train_loss": -28.07512855529785, "global_step": 573748, "epoch": 6912} {"train_loss": -27.781476974487305, "global_step": 573749, "epoch": 6912} {"train_loss": -28.035654067993164, "global_step": 573750, "epoch": 6912} {"train_loss": -27.8150691986084, "global_step": 573751, "epoch": 6912} {"train_loss": -28.077253341674805, "global_step": 573752, "epoch": 6912} {"train_loss": -28.097631454467773, "global_step": 573753, "epoch": 6912} {"train_loss": -28.545032501220703, "global_step": 573754, "epoch": 6912} {"train_loss": -28.19135856628418, "global_step": 573755, "epoch": 6912} {"train_loss": -27.778100967407227, "global_step": 573756, "epoch": 6912} {"train_loss": -27.9471492767334, "global_step": 573757, "epoch": 6912} {"train_loss": -28.184738159179688, "global_step": 573758, "epoch": 6912} {"train_loss": -28.20099449157715, "global_step": 573759, "epoch": 6912} {"train_loss": -27.92412757873535, "global_step": 573760, "epoch": 6912} {"train_loss": -27.974472045898438, "global_step": 573761, "epoch": 6912} {"train_loss": -27.724401473999023, "global_step": 573762, "epoch": 6912} {"train_loss": -28.065771102905273, "global_step": 573763, "epoch": 6912} {"train_loss": -27.916961669921875, "global_step": 573764, "epoch": 6912} {"train_loss": -27.67095375061035, "global_step": 573765, "epoch": 6912} {"train_loss": -27.932180404663086, "global_step": 573766, "epoch": 6912} {"train_loss": -27.828622817993164, "global_step": 573767, "epoch": 6912} {"train_loss": -27.504077911376953, "global_step": 573768, "epoch": 6912} {"train_loss": -27.15618896484375, "global_step": 573769, "epoch": 6912} {"train_loss": -27.37916374206543, "global_step": 573770, "epoch": 6912} {"train_loss": -27.46308708190918, "global_step": 573771, "epoch": 6912} {"train_loss": -27.421091079711914, "global_step": 573772, "epoch": 6912} {"train_loss": -27.86347007751465, "global_step": 573773, "epoch": 6912} {"train_loss": -27.6936092376709, "global_step": 573774, "epoch": 6912} {"train_loss": -27.863574981689453, "global_step": 573775, "epoch": 6912} {"train_loss": -27.810705184936523, "global_step": 573776, "epoch": 6912} {"train_loss": -27.530765533447266, "global_step": 573777, "epoch": 6912} {"train_loss": -27.622485448078937, "global_step": 573778, "epoch": 6912, "val_loss": 6505284.0} {"train_loss": -26.62129020690918, "global_step": 573779, "epoch": 6913} {"train_loss": -26.145191192626953, "global_step": 573780, "epoch": 6913} {"train_loss": -26.421545028686523, "global_step": 573781, "epoch": 6913} {"train_loss": -26.9205265045166, "global_step": 573782, "epoch": 6913} {"train_loss": -26.4016170501709, "global_step": 573783, "epoch": 6913} {"train_loss": -26.671344757080078, "global_step": 573784, "epoch": 6913} {"train_loss": -26.584569931030273, "global_step": 573785, "epoch": 6913} {"train_loss": -26.936508178710938, "global_step": 573786, "epoch": 6913} {"train_loss": -26.7463436126709, "global_step": 573787, "epoch": 6913} {"train_loss": -26.585046768188477, "global_step": 573788, "epoch": 6913} {"train_loss": -26.747034072875977, "global_step": 573789, "epoch": 6913} {"train_loss": -27.22952651977539, "global_step": 573790, "epoch": 6913} {"train_loss": -26.772708892822266, "global_step": 573791, "epoch": 6913} {"train_loss": -26.80560302734375, "global_step": 573792, "epoch": 6913} {"train_loss": -26.762283325195312, "global_step": 573793, "epoch": 6913} {"train_loss": -26.9388484954834, "global_step": 573794, "epoch": 6913} {"train_loss": -27.19270133972168, "global_step": 573795, "epoch": 6913} {"train_loss": -27.157779693603516, "global_step": 573796, "epoch": 6913} {"train_loss": -27.182540893554688, "global_step": 573797, "epoch": 6913} {"train_loss": -27.29612159729004, "global_step": 573798, "epoch": 6913} {"train_loss": -27.42435646057129, "global_step": 573799, "epoch": 6913} {"train_loss": -27.568805694580078, "global_step": 573800, "epoch": 6913} {"train_loss": -27.13010025024414, "global_step": 573801, "epoch": 6913} {"train_loss": -27.3438720703125, "global_step": 573802, "epoch": 6913} {"train_loss": -27.27435874938965, "global_step": 573803, "epoch": 6913} {"train_loss": -27.30267333984375, "global_step": 573804, "epoch": 6913} {"train_loss": -27.325891494750977, "global_step": 573805, "epoch": 6913} {"train_loss": -27.243310928344727, "global_step": 573806, "epoch": 6913} {"train_loss": -27.3891544342041, "global_step": 573807, "epoch": 6913} {"train_loss": -27.7333927154541, "global_step": 573808, "epoch": 6913} {"train_loss": -27.621429443359375, "global_step": 573809, "epoch": 6913} {"train_loss": -27.328582763671875, "global_step": 573810, "epoch": 6913} {"train_loss": -27.608259201049805, "global_step": 573811, "epoch": 6913} {"train_loss": -27.499242782592773, "global_step": 573812, "epoch": 6913} {"train_loss": -27.7191162109375, "global_step": 573813, "epoch": 6913} {"train_loss": -27.742597579956055, "global_step": 573814, "epoch": 6913} {"train_loss": -27.93975830078125, "global_step": 573815, "epoch": 6913} {"train_loss": -27.913843154907227, "global_step": 573816, "epoch": 6913} {"train_loss": -28.005447387695312, "global_step": 573817, "epoch": 6913} {"train_loss": -27.98383140563965, "global_step": 573818, "epoch": 6913} {"train_loss": -27.578901290893555, "global_step": 573819, "epoch": 6913} {"train_loss": -27.89592933654785, "global_step": 573820, "epoch": 6913} {"train_loss": -27.7338924407959, "global_step": 573821, "epoch": 6913} {"train_loss": -27.814163208007812, "global_step": 573822, "epoch": 6913} {"train_loss": -27.869781494140625, "global_step": 573823, "epoch": 6913} {"train_loss": -28.013952255249023, "global_step": 573824, "epoch": 6913} {"train_loss": -27.74777603149414, "global_step": 573825, "epoch": 6913} {"train_loss": -27.569997787475586, "global_step": 573826, "epoch": 6913} {"train_loss": -28.107023239135742, "global_step": 573827, "epoch": 6913} {"train_loss": -27.914417266845703, "global_step": 573828, "epoch": 6913} {"train_loss": -27.989843368530273, "global_step": 573829, "epoch": 6913} {"train_loss": -27.62522315979004, "global_step": 573830, "epoch": 6913} {"train_loss": -27.770368576049805, "global_step": 573831, "epoch": 6913} {"train_loss": -28.33928871154785, "global_step": 573832, "epoch": 6913} {"train_loss": -27.885318756103516, "global_step": 573833, "epoch": 6913} {"train_loss": -27.9183349609375, "global_step": 573834, "epoch": 6913} {"train_loss": -27.557172775268555, "global_step": 573835, "epoch": 6913} {"train_loss": -27.57791519165039, "global_step": 573836, "epoch": 6913} {"train_loss": -28.01417350769043, "global_step": 573837, "epoch": 6913} {"train_loss": -28.183868408203125, "global_step": 573838, "epoch": 6913} {"train_loss": -27.92237663269043, "global_step": 573839, "epoch": 6913} {"train_loss": -27.5725040435791, "global_step": 573840, "epoch": 6913} {"train_loss": -27.904844284057617, "global_step": 573841, "epoch": 6913} {"train_loss": -28.354902267456055, "global_step": 573842, "epoch": 6913} {"train_loss": -27.8858642578125, "global_step": 573843, "epoch": 6913} {"train_loss": -28.021772384643555, "global_step": 573844, "epoch": 6913} {"train_loss": -28.47474479675293, "global_step": 573845, "epoch": 6913} {"train_loss": -27.59537124633789, "global_step": 573846, "epoch": 6913} {"train_loss": -28.118072509765625, "global_step": 573847, "epoch": 6913} {"train_loss": -28.11713218688965, "global_step": 573848, "epoch": 6913} {"train_loss": -27.92681312561035, "global_step": 573849, "epoch": 6913} {"train_loss": -28.090728759765625, "global_step": 573850, "epoch": 6913} {"train_loss": -27.900842666625977, "global_step": 573851, "epoch": 6913} {"train_loss": -28.11701774597168, "global_step": 573852, "epoch": 6913} {"train_loss": -27.897705078125, "global_step": 573853, "epoch": 6913} {"train_loss": -28.045507431030273, "global_step": 573854, "epoch": 6913} {"train_loss": -28.010278701782227, "global_step": 573855, "epoch": 6913} {"train_loss": -28.10877799987793, "global_step": 573856, "epoch": 6913} {"train_loss": -27.988317489624023, "global_step": 573857, "epoch": 6913} {"train_loss": -28.09596061706543, "global_step": 573858, "epoch": 6913} {"train_loss": -27.9419002532959, "global_step": 573859, "epoch": 6913} {"train_loss": -27.88331413269043, "global_step": 573860, "epoch": 6913} {"train_loss": -27.55697553703584, "global_step": 573861, "epoch": 6913, "val_loss": 6484571.0} {"train_loss": -25.59849739074707, "global_step": 573862, "epoch": 6914} {"train_loss": -21.07498550415039, "global_step": 573863, "epoch": 6914} {"train_loss": -19.620290756225586, "global_step": 573864, "epoch": 6914} {"train_loss": -25.258193969726562, "global_step": 573865, "epoch": 6914} {"train_loss": -24.767576217651367, "global_step": 573866, "epoch": 6914} {"train_loss": -25.34014892578125, "global_step": 573867, "epoch": 6914} {"train_loss": -24.835800170898438, "global_step": 573868, "epoch": 6914} {"train_loss": -25.741674423217773, "global_step": 573869, "epoch": 6914} {"train_loss": -25.464054107666016, "global_step": 573870, "epoch": 6914} {"train_loss": -25.146181106567383, "global_step": 573871, "epoch": 6914} {"train_loss": -26.191190719604492, "global_step": 573872, "epoch": 6914} {"train_loss": -26.100576400756836, "global_step": 573873, "epoch": 6914} {"train_loss": -25.916379928588867, "global_step": 573874, "epoch": 6914} {"train_loss": -26.2476806640625, "global_step": 573875, "epoch": 6914} {"train_loss": -26.682342529296875, "global_step": 573876, "epoch": 6914} {"train_loss": -26.78342628479004, "global_step": 573877, "epoch": 6914} {"train_loss": -26.350324630737305, "global_step": 573878, "epoch": 6914} {"train_loss": -26.287643432617188, "global_step": 573879, "epoch": 6914} {"train_loss": -26.06049919128418, "global_step": 573880, "epoch": 6914} {"train_loss": -26.770902633666992, "global_step": 573881, "epoch": 6914} {"train_loss": -26.77207374572754, "global_step": 573882, "epoch": 6914} {"train_loss": -26.35862159729004, "global_step": 573883, "epoch": 6914} {"train_loss": -26.760711669921875, "global_step": 573884, "epoch": 6914} {"train_loss": -27.236328125, "global_step": 573885, "epoch": 6914} {"train_loss": -26.748193740844727, "global_step": 573886, "epoch": 6914} {"train_loss": -26.764419555664062, "global_step": 573887, "epoch": 6914} {"train_loss": -27.113271713256836, "global_step": 573888, "epoch": 6914} {"train_loss": -27.138975143432617, "global_step": 573889, "epoch": 6914} {"train_loss": -27.065509796142578, "global_step": 573890, "epoch": 6914} {"train_loss": -27.246784210205078, "global_step": 573891, "epoch": 6914} {"train_loss": -27.379230499267578, "global_step": 573892, "epoch": 6914} {"train_loss": -27.407751083374023, "global_step": 573893, "epoch": 6914} {"train_loss": -27.09395408630371, "global_step": 573894, "epoch": 6914} {"train_loss": -27.2437801361084, "global_step": 573895, "epoch": 6914} {"train_loss": -27.370107650756836, "global_step": 573896, "epoch": 6914} {"train_loss": -27.163654327392578, "global_step": 573897, "epoch": 6914} {"train_loss": -27.054691314697266, "global_step": 573898, "epoch": 6914} {"train_loss": -27.465173721313477, "global_step": 573899, "epoch": 6914} {"train_loss": -27.578397750854492, "global_step": 573900, "epoch": 6914} {"train_loss": -27.413150787353516, "global_step": 573901, "epoch": 6914} {"train_loss": -27.392593383789062, "global_step": 573902, "epoch": 6914} {"train_loss": -27.36052894592285, "global_step": 573903, "epoch": 6914} {"train_loss": -27.764007568359375, "global_step": 573904, "epoch": 6914} {"train_loss": -27.878681182861328, "global_step": 573905, "epoch": 6914} {"train_loss": -27.822662353515625, "global_step": 573906, "epoch": 6914} {"train_loss": -27.774999618530273, "global_step": 573907, "epoch": 6914} {"train_loss": -27.659717559814453, "global_step": 573908, "epoch": 6914} {"train_loss": -27.75252342224121, "global_step": 573909, "epoch": 6914} {"train_loss": -27.887052536010742, "global_step": 573910, "epoch": 6914} {"train_loss": -27.737226486206055, "global_step": 573911, "epoch": 6914} {"train_loss": -27.9272518157959, "global_step": 573912, "epoch": 6914} {"train_loss": -27.62102699279785, "global_step": 573913, "epoch": 6914} {"train_loss": -27.820722579956055, "global_step": 573914, "epoch": 6914} {"train_loss": -27.86056900024414, "global_step": 573915, "epoch": 6914} {"train_loss": -27.54339027404785, "global_step": 573916, "epoch": 6914} {"train_loss": -27.550100326538086, "global_step": 573917, "epoch": 6914} {"train_loss": -27.64266014099121, "global_step": 573918, "epoch": 6914} {"train_loss": -27.651411056518555, "global_step": 573919, "epoch": 6914} {"train_loss": -27.843246459960938, "global_step": 573920, "epoch": 6914} {"train_loss": -28.091510772705078, "global_step": 573921, "epoch": 6914} {"train_loss": -27.918701171875, "global_step": 573922, "epoch": 6914} {"train_loss": -27.685840606689453, "global_step": 573923, "epoch": 6914} {"train_loss": -27.419178009033203, "global_step": 573924, "epoch": 6914} {"train_loss": -27.83563804626465, "global_step": 573925, "epoch": 6914} {"train_loss": -27.270673751831055, "global_step": 573926, "epoch": 6914} {"train_loss": -27.276519775390625, "global_step": 573927, "epoch": 6914} {"train_loss": -27.430322647094727, "global_step": 573928, "epoch": 6914} {"train_loss": -27.505233764648438, "global_step": 573929, "epoch": 6914} {"train_loss": -27.7355899810791, "global_step": 573930, "epoch": 6914} {"train_loss": -27.774396896362305, "global_step": 573931, "epoch": 6914} {"train_loss": -27.528488159179688, "global_step": 573932, "epoch": 6914} {"train_loss": -28.083160400390625, "global_step": 573933, "epoch": 6914} {"train_loss": -27.714208602905273, "global_step": 573934, "epoch": 6914} {"train_loss": -27.611631393432617, "global_step": 573935, "epoch": 6914} {"train_loss": -28.302433013916016, "global_step": 573936, "epoch": 6914} {"train_loss": -27.729145050048828, "global_step": 573937, "epoch": 6914} {"train_loss": -27.33542823791504, "global_step": 573938, "epoch": 6914} {"train_loss": -27.570545196533203, "global_step": 573939, "epoch": 6914} {"train_loss": -27.705778121948242, "global_step": 573940, "epoch": 6914} {"train_loss": -27.65475845336914, "global_step": 573941, "epoch": 6914} {"train_loss": -27.988616943359375, "global_step": 573942, "epoch": 6914} {"train_loss": -27.933643341064453, "global_step": 573943, "epoch": 6914} {"train_loss": -26.994220825562994, "global_step": 573944, "epoch": 6914, "val_loss": 6475902.5} {"train_loss": -27.03151512145996, "global_step": 573945, "epoch": 6915} {"train_loss": -26.36236572265625, "global_step": 573946, "epoch": 6915} {"train_loss": -26.787084579467773, "global_step": 573947, "epoch": 6915} {"train_loss": -26.44622230529785, "global_step": 573948, "epoch": 6915} {"train_loss": -27.603275299072266, "global_step": 573949, "epoch": 6915} {"train_loss": -26.727502822875977, "global_step": 573950, "epoch": 6915} {"train_loss": -27.359777450561523, "global_step": 573951, "epoch": 6915} {"train_loss": -26.9105167388916, "global_step": 573952, "epoch": 6915} {"train_loss": -27.154951095581055, "global_step": 573953, "epoch": 6915} {"train_loss": -26.92054557800293, "global_step": 573954, "epoch": 6915} {"train_loss": -27.646081924438477, "global_step": 573955, "epoch": 6915} {"train_loss": -26.91193962097168, "global_step": 573956, "epoch": 6915} {"train_loss": -27.6888370513916, "global_step": 573957, "epoch": 6915} {"train_loss": -27.573877334594727, "global_step": 573958, "epoch": 6915} {"train_loss": -27.13129997253418, "global_step": 573959, "epoch": 6915} {"train_loss": -27.37214469909668, "global_step": 573960, "epoch": 6915} {"train_loss": -27.18172264099121, "global_step": 573961, "epoch": 6915} {"train_loss": -27.457056045532227, "global_step": 573962, "epoch": 6915} {"train_loss": -27.394819259643555, "global_step": 573963, "epoch": 6915} {"train_loss": -27.16019630432129, "global_step": 573964, "epoch": 6915} {"train_loss": -27.66737174987793, "global_step": 573965, "epoch": 6915} {"train_loss": -27.934324264526367, "global_step": 573966, "epoch": 6915} {"train_loss": -27.701120376586914, "global_step": 573967, "epoch": 6915} {"train_loss": -27.62650489807129, "global_step": 573968, "epoch": 6915} {"train_loss": -28.09503746032715, "global_step": 573969, "epoch": 6915} {"train_loss": -27.70364761352539, "global_step": 573970, "epoch": 6915} {"train_loss": -27.600189208984375, "global_step": 573971, "epoch": 6915} {"train_loss": -27.570058822631836, "global_step": 573972, "epoch": 6915} {"train_loss": -27.696680068969727, "global_step": 573973, "epoch": 6915} {"train_loss": -27.74362564086914, "global_step": 573974, "epoch": 6915} {"train_loss": -27.953388214111328, "global_step": 573975, "epoch": 6915} {"train_loss": -27.869857788085938, "global_step": 573976, "epoch": 6915} {"train_loss": -27.863061904907227, "global_step": 573977, "epoch": 6915} {"train_loss": -27.77935791015625, "global_step": 573978, "epoch": 6915} {"train_loss": -28.021459579467773, "global_step": 573979, "epoch": 6915} {"train_loss": -27.434667587280273, "global_step": 573980, "epoch": 6915} {"train_loss": -27.848907470703125, "global_step": 573981, "epoch": 6915} {"train_loss": -27.81904411315918, "global_step": 573982, "epoch": 6915} {"train_loss": -27.8060302734375, "global_step": 573983, "epoch": 6915} {"train_loss": -28.27490234375, "global_step": 573984, "epoch": 6915} {"train_loss": -27.756113052368164, "global_step": 573985, "epoch": 6915} {"train_loss": -28.04974937438965, "global_step": 573986, "epoch": 6915} {"train_loss": -27.871057510375977, "global_step": 573987, "epoch": 6915} {"train_loss": -27.818622589111328, "global_step": 573988, "epoch": 6915} {"train_loss": -27.903364181518555, "global_step": 573989, "epoch": 6915} {"train_loss": -28.318140029907227, "global_step": 573990, "epoch": 6915} {"train_loss": -27.896081924438477, "global_step": 573991, "epoch": 6915} {"train_loss": -28.357345581054688, "global_step": 573992, "epoch": 6915} {"train_loss": -28.043292999267578, "global_step": 573993, "epoch": 6915} {"train_loss": -27.942792892456055, "global_step": 573994, "epoch": 6915} {"train_loss": -28.335668563842773, "global_step": 573995, "epoch": 6915} {"train_loss": -27.989856719970703, "global_step": 573996, "epoch": 6915} {"train_loss": -28.274768829345703, "global_step": 573997, "epoch": 6915} {"train_loss": -28.266693115234375, "global_step": 573998, "epoch": 6915} {"train_loss": -28.197656631469727, "global_step": 573999, "epoch": 6915} {"train_loss": -28.3848876953125, "global_step": 574000, "epoch": 6915} {"train_loss": -28.164947509765625, "global_step": 574001, "epoch": 6915} {"train_loss": -28.076765060424805, "global_step": 574002, "epoch": 6915} {"train_loss": -28.3065128326416, "global_step": 574003, "epoch": 6915} {"train_loss": -27.72010612487793, "global_step": 574004, "epoch": 6915} {"train_loss": -27.76784324645996, "global_step": 574005, "epoch": 6915} {"train_loss": -28.191883087158203, "global_step": 574006, "epoch": 6915} {"train_loss": -27.9615535736084, "global_step": 574007, "epoch": 6915} {"train_loss": -27.878997802734375, "global_step": 574008, "epoch": 6915} {"train_loss": -28.0468692779541, "global_step": 574009, "epoch": 6915} {"train_loss": -27.65077018737793, "global_step": 574010, "epoch": 6915} {"train_loss": -27.851369857788086, "global_step": 574011, "epoch": 6915} {"train_loss": -27.689355850219727, "global_step": 574012, "epoch": 6915} {"train_loss": -27.73042106628418, "global_step": 574013, "epoch": 6915} {"train_loss": -27.87459373474121, "global_step": 574014, "epoch": 6915} {"train_loss": -28.1444034576416, "global_step": 574015, "epoch": 6915} {"train_loss": -28.126127243041992, "global_step": 574016, "epoch": 6915} {"train_loss": -27.803180694580078, "global_step": 574017, "epoch": 6915} {"train_loss": -28.424488067626953, "global_step": 574018, "epoch": 6915} {"train_loss": -27.995391845703125, "global_step": 574019, "epoch": 6915} {"train_loss": -27.95566749572754, "global_step": 574020, "epoch": 6915} {"train_loss": -28.278501510620117, "global_step": 574021, "epoch": 6915} {"train_loss": -28.00717544555664, "global_step": 574022, "epoch": 6915} {"train_loss": -27.8680477142334, "global_step": 574023, "epoch": 6915} {"train_loss": -27.943103790283203, "global_step": 574024, "epoch": 6915} {"train_loss": -28.069732666015625, "global_step": 574025, "epoch": 6915} {"train_loss": -28.17612648010254, "global_step": 574026, "epoch": 6915} {"train_loss": -27.767548319805098, "global_step": 574027, "epoch": 6915, "val_loss": 6508622.5} {"train_loss": -26.718305587768555, "global_step": 574028, "epoch": 6916} {"train_loss": -26.920690536499023, "global_step": 574029, "epoch": 6916} {"train_loss": -26.84784507751465, "global_step": 574030, "epoch": 6916} {"train_loss": -27.25221061706543, "global_step": 574031, "epoch": 6916} {"train_loss": -26.68816566467285, "global_step": 574032, "epoch": 6916} {"train_loss": -27.596576690673828, "global_step": 574033, "epoch": 6916} {"train_loss": -27.668659210205078, "global_step": 574034, "epoch": 6916} {"train_loss": -27.707990646362305, "global_step": 574035, "epoch": 6916} {"train_loss": -27.43597984313965, "global_step": 574036, "epoch": 6916} {"train_loss": -27.769811630249023, "global_step": 574037, "epoch": 6916} {"train_loss": -28.0902156829834, "global_step": 574038, "epoch": 6916} {"train_loss": -27.5933780670166, "global_step": 574039, "epoch": 6916} {"train_loss": -27.638874053955078, "global_step": 574040, "epoch": 6916} {"train_loss": -27.34967613220215, "global_step": 574041, "epoch": 6916} {"train_loss": -27.410388946533203, "global_step": 574042, "epoch": 6916} {"train_loss": -27.7268123626709, "global_step": 574043, "epoch": 6916} {"train_loss": -27.724210739135742, "global_step": 574044, "epoch": 6916} {"train_loss": -27.61850357055664, "global_step": 574045, "epoch": 6916} {"train_loss": -28.072351455688477, "global_step": 574046, "epoch": 6916} {"train_loss": -28.062768936157227, "global_step": 574047, "epoch": 6916} {"train_loss": -27.60947036743164, "global_step": 574048, "epoch": 6916} {"train_loss": -28.032169342041016, "global_step": 574049, "epoch": 6916} {"train_loss": -27.738483428955078, "global_step": 574050, "epoch": 6916} {"train_loss": -27.53742790222168, "global_step": 574051, "epoch": 6916} {"train_loss": -27.539722442626953, "global_step": 574052, "epoch": 6916} {"train_loss": -27.35101318359375, "global_step": 574053, "epoch": 6916} {"train_loss": -27.865787506103516, "global_step": 574054, "epoch": 6916} {"train_loss": -27.73943519592285, "global_step": 574055, "epoch": 6916} {"train_loss": -27.86854362487793, "global_step": 574056, "epoch": 6916} {"train_loss": -28.195514678955078, "global_step": 574057, "epoch": 6916} {"train_loss": -27.880126953125, "global_step": 574058, "epoch": 6916} {"train_loss": -27.907394409179688, "global_step": 574059, "epoch": 6916} {"train_loss": -28.021854400634766, "global_step": 574060, "epoch": 6916} {"train_loss": -27.993881225585938, "global_step": 574061, "epoch": 6916} {"train_loss": -27.861417770385742, "global_step": 574062, "epoch": 6916} {"train_loss": -28.055776596069336, "global_step": 574063, "epoch": 6916} {"train_loss": -27.919113159179688, "global_step": 574064, "epoch": 6916} {"train_loss": -28.003427505493164, "global_step": 574065, "epoch": 6916} {"train_loss": -27.79741859436035, "global_step": 574066, "epoch": 6916} {"train_loss": -28.058624267578125, "global_step": 574067, "epoch": 6916} {"train_loss": -27.82645606994629, "global_step": 574068, "epoch": 6916} {"train_loss": -28.16913414001465, "global_step": 574069, "epoch": 6916} {"train_loss": -27.74347496032715, "global_step": 574070, "epoch": 6916} {"train_loss": -28.239423751831055, "global_step": 574071, "epoch": 6916} {"train_loss": -27.89923095703125, "global_step": 574072, "epoch": 6916} {"train_loss": -28.165861129760742, "global_step": 574073, "epoch": 6916} {"train_loss": -28.48841667175293, "global_step": 574074, "epoch": 6916} {"train_loss": -27.91615867614746, "global_step": 574075, "epoch": 6916} {"train_loss": -28.123315811157227, "global_step": 574076, "epoch": 6916} {"train_loss": -28.224872589111328, "global_step": 574077, "epoch": 6916} {"train_loss": -27.949146270751953, "global_step": 574078, "epoch": 6916} {"train_loss": -27.788049697875977, "global_step": 574079, "epoch": 6916} {"train_loss": -28.151586532592773, "global_step": 574080, "epoch": 6916} {"train_loss": -27.736713409423828, "global_step": 574081, "epoch": 6916} {"train_loss": -27.734241485595703, "global_step": 574082, "epoch": 6916} {"train_loss": -27.7265682220459, "global_step": 574083, "epoch": 6916} {"train_loss": -27.61979103088379, "global_step": 574084, "epoch": 6916} {"train_loss": -28.139575958251953, "global_step": 574085, "epoch": 6916} {"train_loss": -27.98455810546875, "global_step": 574086, "epoch": 6916} {"train_loss": -27.9499568939209, "global_step": 574087, "epoch": 6916} {"train_loss": -27.785409927368164, "global_step": 574088, "epoch": 6916} {"train_loss": -27.77863121032715, "global_step": 574089, "epoch": 6916} {"train_loss": -27.778974533081055, "global_step": 574090, "epoch": 6916} {"train_loss": -28.01377296447754, "global_step": 574091, "epoch": 6916} {"train_loss": -27.33379554748535, "global_step": 574092, "epoch": 6916} {"train_loss": -27.75473976135254, "global_step": 574093, "epoch": 6916} {"train_loss": -27.687009811401367, "global_step": 574094, "epoch": 6916} {"train_loss": -28.111242294311523, "global_step": 574095, "epoch": 6916} {"train_loss": -27.842300415039062, "global_step": 574096, "epoch": 6916} {"train_loss": -27.7957706451416, "global_step": 574097, "epoch": 6916} {"train_loss": -27.544248580932617, "global_step": 574098, "epoch": 6916} {"train_loss": -27.85515785217285, "global_step": 574099, "epoch": 6916} {"train_loss": -27.996484756469727, "global_step": 574100, "epoch": 6916} {"train_loss": -27.900135040283203, "global_step": 574101, "epoch": 6916} {"train_loss": -27.929834365844727, "global_step": 574102, "epoch": 6916} {"train_loss": -27.89613914489746, "global_step": 574103, "epoch": 6916} {"train_loss": -27.596179962158203, "global_step": 574104, "epoch": 6916} {"train_loss": -27.65496826171875, "global_step": 574105, "epoch": 6916} {"train_loss": -27.753122329711914, "global_step": 574106, "epoch": 6916} {"train_loss": -27.66474723815918, "global_step": 574107, "epoch": 6916} {"train_loss": -28.075454711914062, "global_step": 574108, "epoch": 6916} {"train_loss": -28.0111141204834, "global_step": 574109, "epoch": 6916} {"train_loss": -27.785686332059193, "global_step": 574110, "epoch": 6916, "val_loss": 6533764.5} {"train_loss": -27.2818603515625, "global_step": 574111, "epoch": 6917} {"train_loss": -27.235361099243164, "global_step": 574112, "epoch": 6917} {"train_loss": -27.427885055541992, "global_step": 574113, "epoch": 6917} {"train_loss": -27.376184463500977, "global_step": 574114, "epoch": 6917} {"train_loss": -27.969099044799805, "global_step": 574115, "epoch": 6917} {"train_loss": -27.501882553100586, "global_step": 574116, "epoch": 6917} {"train_loss": -27.65411376953125, "global_step": 574117, "epoch": 6917} {"train_loss": -27.69292640686035, "global_step": 574118, "epoch": 6917} {"train_loss": -27.623220443725586, "global_step": 574119, "epoch": 6917} {"train_loss": -27.322431564331055, "global_step": 574120, "epoch": 6917} {"train_loss": -27.65370750427246, "global_step": 574121, "epoch": 6917} {"train_loss": -27.998647689819336, "global_step": 574122, "epoch": 6917} {"train_loss": -27.849390029907227, "global_step": 574123, "epoch": 6917} {"train_loss": -27.560087203979492, "global_step": 574124, "epoch": 6917} {"train_loss": -27.483001708984375, "global_step": 574125, "epoch": 6917} {"train_loss": -27.841861724853516, "global_step": 574126, "epoch": 6917} {"train_loss": -28.066869735717773, "global_step": 574127, "epoch": 6917} {"train_loss": -27.60743522644043, "global_step": 574128, "epoch": 6917} {"train_loss": -27.664356231689453, "global_step": 574129, "epoch": 6917} {"train_loss": -27.87078285217285, "global_step": 574130, "epoch": 6917} {"train_loss": -27.810117721557617, "global_step": 574131, "epoch": 6917} {"train_loss": -27.71677589416504, "global_step": 574132, "epoch": 6917} {"train_loss": -27.8861141204834, "global_step": 574133, "epoch": 6917} {"train_loss": -27.753416061401367, "global_step": 574134, "epoch": 6917} {"train_loss": -27.819360733032227, "global_step": 574135, "epoch": 6917} {"train_loss": -27.7961368560791, "global_step": 574136, "epoch": 6917} {"train_loss": -27.61356544494629, "global_step": 574137, "epoch": 6917} {"train_loss": -27.700536727905273, "global_step": 574138, "epoch": 6917} {"train_loss": -27.752796173095703, "global_step": 574139, "epoch": 6917} {"train_loss": -28.08296775817871, "global_step": 574140, "epoch": 6917} {"train_loss": -28.176599502563477, "global_step": 574141, "epoch": 6917} {"train_loss": -28.11117935180664, "global_step": 574142, "epoch": 6917} {"train_loss": -27.82793617248535, "global_step": 574143, "epoch": 6917} {"train_loss": -27.977127075195312, "global_step": 574144, "epoch": 6917} {"train_loss": -27.93390464782715, "global_step": 574145, "epoch": 6917} {"train_loss": -28.11216163635254, "global_step": 574146, "epoch": 6917} {"train_loss": -28.289030075073242, "global_step": 574147, "epoch": 6917} {"train_loss": -28.314599990844727, "global_step": 574148, "epoch": 6917} {"train_loss": -28.26584815979004, "global_step": 574149, "epoch": 6917} {"train_loss": -27.9049015045166, "global_step": 574150, "epoch": 6917} {"train_loss": -27.964136123657227, "global_step": 574151, "epoch": 6917} {"train_loss": -27.60199546813965, "global_step": 574152, "epoch": 6917} {"train_loss": -27.71534538269043, "global_step": 574153, "epoch": 6917} {"train_loss": -27.918912887573242, "global_step": 574154, "epoch": 6917} {"train_loss": -28.146345138549805, "global_step": 574155, "epoch": 6917} {"train_loss": -28.225461959838867, "global_step": 574156, "epoch": 6917} {"train_loss": -27.670324325561523, "global_step": 574157, "epoch": 6917} {"train_loss": -27.889902114868164, "global_step": 574158, "epoch": 6917} {"train_loss": -27.60455322265625, "global_step": 574159, "epoch": 6917} {"train_loss": -28.2092227935791, "global_step": 574160, "epoch": 6917} {"train_loss": -28.281957626342773, "global_step": 574161, "epoch": 6917} {"train_loss": -28.19257164001465, "global_step": 574162, "epoch": 6917} {"train_loss": -27.674741744995117, "global_step": 574163, "epoch": 6917} {"train_loss": -27.72159767150879, "global_step": 574164, "epoch": 6917} {"train_loss": -27.750629425048828, "global_step": 574165, "epoch": 6917} {"train_loss": -27.735620498657227, "global_step": 574166, "epoch": 6917} {"train_loss": -28.220922470092773, "global_step": 574167, "epoch": 6917} {"train_loss": -27.9927978515625, "global_step": 574168, "epoch": 6917} {"train_loss": -28.29425621032715, "global_step": 574169, "epoch": 6917} {"train_loss": -28.13715934753418, "global_step": 574170, "epoch": 6917} {"train_loss": -28.192840576171875, "global_step": 574171, "epoch": 6917} {"train_loss": -28.33931541442871, "global_step": 574172, "epoch": 6917} {"train_loss": -28.363422393798828, "global_step": 574173, "epoch": 6917} {"train_loss": -28.320358276367188, "global_step": 574174, "epoch": 6917} {"train_loss": -28.2069034576416, "global_step": 574175, "epoch": 6917} {"train_loss": -27.633392333984375, "global_step": 574176, "epoch": 6917} {"train_loss": -27.942707061767578, "global_step": 574177, "epoch": 6917} {"train_loss": -27.733983993530273, "global_step": 574178, "epoch": 6917} {"train_loss": -28.379064559936523, "global_step": 574179, "epoch": 6917} {"train_loss": -28.33184814453125, "global_step": 574180, "epoch": 6917} {"train_loss": -28.04657554626465, "global_step": 574181, "epoch": 6917} {"train_loss": -27.918502807617188, "global_step": 574182, "epoch": 6917} {"train_loss": -28.076587677001953, "global_step": 574183, "epoch": 6917} {"train_loss": -27.501480102539062, "global_step": 574184, "epoch": 6917} {"train_loss": -27.17477798461914, "global_step": 574185, "epoch": 6917} {"train_loss": -26.00918960571289, "global_step": 574186, "epoch": 6917} {"train_loss": -26.434965133666992, "global_step": 574187, "epoch": 6917} {"train_loss": -27.552555084228516, "global_step": 574188, "epoch": 6917} {"train_loss": -26.720861434936523, "global_step": 574189, "epoch": 6917} {"train_loss": -27.5692195892334, "global_step": 574190, "epoch": 6917} {"train_loss": -27.670400619506836, "global_step": 574191, "epoch": 6917} {"train_loss": -27.714399337768555, "global_step": 574192, "epoch": 6917} {"train_loss": -27.77929142871535, "global_step": 574193, "epoch": 6917, "val_loss": 6534460.0} {"train_loss": -26.4173583984375, "global_step": 574194, "epoch": 6918} {"train_loss": -26.283720016479492, "global_step": 574195, "epoch": 6918} {"train_loss": -26.890783309936523, "global_step": 574196, "epoch": 6918} {"train_loss": -26.576995849609375, "global_step": 574197, "epoch": 6918} {"train_loss": -26.95941162109375, "global_step": 574198, "epoch": 6918} {"train_loss": -27.179716110229492, "global_step": 574199, "epoch": 6918} {"train_loss": -26.52880859375, "global_step": 574200, "epoch": 6918} {"train_loss": -26.399438858032227, "global_step": 574201, "epoch": 6918} {"train_loss": -27.517187118530273, "global_step": 574202, "epoch": 6918} {"train_loss": -27.03694725036621, "global_step": 574203, "epoch": 6918} {"train_loss": -26.848133087158203, "global_step": 574204, "epoch": 6918} {"train_loss": -27.044239044189453, "global_step": 574205, "epoch": 6918} {"train_loss": -26.9216251373291, "global_step": 574206, "epoch": 6918} {"train_loss": -27.106592178344727, "global_step": 574207, "epoch": 6918} {"train_loss": -27.4715576171875, "global_step": 574208, "epoch": 6918} {"train_loss": -26.72786521911621, "global_step": 574209, "epoch": 6918} {"train_loss": -27.232324600219727, "global_step": 574210, "epoch": 6918} {"train_loss": -27.335254669189453, "global_step": 574211, "epoch": 6918} {"train_loss": -26.968219757080078, "global_step": 574212, "epoch": 6918} {"train_loss": -27.54621696472168, "global_step": 574213, "epoch": 6918} {"train_loss": -27.2257137298584, "global_step": 574214, "epoch": 6918} {"train_loss": -27.504907608032227, "global_step": 574215, "epoch": 6918} {"train_loss": -27.458044052124023, "global_step": 574216, "epoch": 6918} {"train_loss": -27.663497924804688, "global_step": 574217, "epoch": 6918} {"train_loss": -27.6478271484375, "global_step": 574218, "epoch": 6918} {"train_loss": -27.234601974487305, "global_step": 574219, "epoch": 6918} {"train_loss": -27.62653923034668, "global_step": 574220, "epoch": 6918} {"train_loss": -27.611526489257812, "global_step": 574221, "epoch": 6918} {"train_loss": -27.57636070251465, "global_step": 574222, "epoch": 6918} {"train_loss": -27.57301902770996, "global_step": 574223, "epoch": 6918} {"train_loss": -27.56998634338379, "global_step": 574224, "epoch": 6918} {"train_loss": -27.968488693237305, "global_step": 574225, "epoch": 6918} {"train_loss": -27.615890502929688, "global_step": 574226, "epoch": 6918} {"train_loss": -27.706409454345703, "global_step": 574227, "epoch": 6918} {"train_loss": -27.911848068237305, "global_step": 574228, "epoch": 6918} {"train_loss": -27.693073272705078, "global_step": 574229, "epoch": 6918} {"train_loss": -27.89371109008789, "global_step": 574230, "epoch": 6918} {"train_loss": -27.603321075439453, "global_step": 574231, "epoch": 6918} {"train_loss": -28.09576416015625, "global_step": 574232, "epoch": 6918} {"train_loss": -27.81354331970215, "global_step": 574233, "epoch": 6918} {"train_loss": -27.79621696472168, "global_step": 574234, "epoch": 6918} {"train_loss": -28.36258316040039, "global_step": 574235, "epoch": 6918} {"train_loss": -27.69390869140625, "global_step": 574236, "epoch": 6918} {"train_loss": -27.971698760986328, "global_step": 574237, "epoch": 6918} {"train_loss": -28.11835289001465, "global_step": 574238, "epoch": 6918} {"train_loss": -28.012643814086914, "global_step": 574239, "epoch": 6918} {"train_loss": -27.822980880737305, "global_step": 574240, "epoch": 6918} {"train_loss": -27.526702880859375, "global_step": 574241, "epoch": 6918} {"train_loss": -28.180952072143555, "global_step": 574242, "epoch": 6918} {"train_loss": -27.8782901763916, "global_step": 574243, "epoch": 6918} {"train_loss": -27.6792049407959, "global_step": 574244, "epoch": 6918} {"train_loss": -27.76556968688965, "global_step": 574245, "epoch": 6918} {"train_loss": -28.055200576782227, "global_step": 574246, "epoch": 6918} {"train_loss": -28.0277042388916, "global_step": 574247, "epoch": 6918} {"train_loss": -27.350080490112305, "global_step": 574248, "epoch": 6918} {"train_loss": -27.809171676635742, "global_step": 574249, "epoch": 6918} {"train_loss": -27.820661544799805, "global_step": 574250, "epoch": 6918} {"train_loss": -27.512907028198242, "global_step": 574251, "epoch": 6918} {"train_loss": -27.813684463500977, "global_step": 574252, "epoch": 6918} {"train_loss": -28.123197555541992, "global_step": 574253, "epoch": 6918} {"train_loss": -27.738950729370117, "global_step": 574254, "epoch": 6918} {"train_loss": -28.31184196472168, "global_step": 574255, "epoch": 6918} {"train_loss": -27.725894927978516, "global_step": 574256, "epoch": 6918} {"train_loss": -28.23317527770996, "global_step": 574257, "epoch": 6918} {"train_loss": -27.812307357788086, "global_step": 574258, "epoch": 6918} {"train_loss": -27.868383407592773, "global_step": 574259, "epoch": 6918} {"train_loss": -27.61359977722168, "global_step": 574260, "epoch": 6918} {"train_loss": -28.12334632873535, "global_step": 574261, "epoch": 6918} {"train_loss": -27.96371841430664, "global_step": 574262, "epoch": 6918} {"train_loss": -27.865095138549805, "global_step": 574263, "epoch": 6918} {"train_loss": -27.970651626586914, "global_step": 574264, "epoch": 6918} {"train_loss": -28.0643310546875, "global_step": 574265, "epoch": 6918} {"train_loss": -28.1263427734375, "global_step": 574266, "epoch": 6918} {"train_loss": -27.645124435424805, "global_step": 574267, "epoch": 6918} {"train_loss": -27.833450317382812, "global_step": 574268, "epoch": 6918} {"train_loss": -28.246051788330078, "global_step": 574269, "epoch": 6918} {"train_loss": -27.993452072143555, "global_step": 574270, "epoch": 6918} {"train_loss": -28.001733779907227, "global_step": 574271, "epoch": 6918} {"train_loss": -28.106760025024414, "global_step": 574272, "epoch": 6918} {"train_loss": -28.110769271850586, "global_step": 574273, "epoch": 6918} {"train_loss": -28.117597579956055, "global_step": 574274, "epoch": 6918} {"train_loss": -27.86060905456543, "global_step": 574275, "epoch": 6918} {"train_loss": -27.61349896350539, "global_step": 574276, "epoch": 6918, "val_loss": 6543506.0} {"train_loss": -27.22650146484375, "global_step": 574277, "epoch": 6919} {"train_loss": -26.61978530883789, "global_step": 574278, "epoch": 6919} {"train_loss": -27.34473991394043, "global_step": 574279, "epoch": 6919} {"train_loss": -27.241811752319336, "global_step": 574280, "epoch": 6919} {"train_loss": -27.45947265625, "global_step": 574281, "epoch": 6919} {"train_loss": -27.37056541442871, "global_step": 574282, "epoch": 6919} {"train_loss": -27.22275161743164, "global_step": 574283, "epoch": 6919} {"train_loss": -27.991107940673828, "global_step": 574284, "epoch": 6919} {"train_loss": -27.046796798706055, "global_step": 574285, "epoch": 6919} {"train_loss": -27.537750244140625, "global_step": 574286, "epoch": 6919} {"train_loss": -27.316741943359375, "global_step": 574287, "epoch": 6919} {"train_loss": -27.37604331970215, "global_step": 574288, "epoch": 6919} {"train_loss": -27.13258171081543, "global_step": 574289, "epoch": 6919} {"train_loss": -27.9229793548584, "global_step": 574290, "epoch": 6919} {"train_loss": -27.383649826049805, "global_step": 574291, "epoch": 6919} {"train_loss": -27.52341079711914, "global_step": 574292, "epoch": 6919} {"train_loss": -27.48075294494629, "global_step": 574293, "epoch": 6919} {"train_loss": -28.041589736938477, "global_step": 574294, "epoch": 6919} {"train_loss": -27.48378562927246, "global_step": 574295, "epoch": 6919} {"train_loss": -27.63373374938965, "global_step": 574296, "epoch": 6919} {"train_loss": -27.503875732421875, "global_step": 574297, "epoch": 6919} {"train_loss": -27.610004425048828, "global_step": 574298, "epoch": 6919} {"train_loss": -27.94245719909668, "global_step": 574299, "epoch": 6919} {"train_loss": -27.668048858642578, "global_step": 574300, "epoch": 6919} {"train_loss": -28.170358657836914, "global_step": 574301, "epoch": 6919} {"train_loss": -27.768329620361328, "global_step": 574302, "epoch": 6919} {"train_loss": -27.645160675048828, "global_step": 574303, "epoch": 6919} {"train_loss": -27.811620712280273, "global_step": 574304, "epoch": 6919} {"train_loss": -27.801305770874023, "global_step": 574305, "epoch": 6919} {"train_loss": -27.692102432250977, "global_step": 574306, "epoch": 6919} {"train_loss": -27.977468490600586, "global_step": 574307, "epoch": 6919} {"train_loss": -27.717914581298828, "global_step": 574308, "epoch": 6919} {"train_loss": -27.655029296875, "global_step": 574309, "epoch": 6919} {"train_loss": -27.584369659423828, "global_step": 574310, "epoch": 6919} {"train_loss": -27.881864547729492, "global_step": 574311, "epoch": 6919} {"train_loss": -27.92144203186035, "global_step": 574312, "epoch": 6919} {"train_loss": -27.98341178894043, "global_step": 574313, "epoch": 6919} {"train_loss": -28.158727645874023, "global_step": 574314, "epoch": 6919} {"train_loss": -27.75349235534668, "global_step": 574315, "epoch": 6919} {"train_loss": -28.242095947265625, "global_step": 574316, "epoch": 6919} {"train_loss": -28.089920043945312, "global_step": 574317, "epoch": 6919} {"train_loss": -27.77809715270996, "global_step": 574318, "epoch": 6919} {"train_loss": -28.342365264892578, "global_step": 574319, "epoch": 6919} {"train_loss": -27.92001724243164, "global_step": 574320, "epoch": 6919} {"train_loss": -27.874237060546875, "global_step": 574321, "epoch": 6919} {"train_loss": -28.059310913085938, "global_step": 574322, "epoch": 6919} {"train_loss": -28.235309600830078, "global_step": 574323, "epoch": 6919} {"train_loss": -28.079153060913086, "global_step": 574324, "epoch": 6919} {"train_loss": -28.066614151000977, "global_step": 574325, "epoch": 6919} {"train_loss": -28.153356552124023, "global_step": 574326, "epoch": 6919} {"train_loss": -27.687158584594727, "global_step": 574327, "epoch": 6919} {"train_loss": -27.892139434814453, "global_step": 574328, "epoch": 6919} {"train_loss": -27.4256591796875, "global_step": 574329, "epoch": 6919} {"train_loss": -28.066329956054688, "global_step": 574330, "epoch": 6919} {"train_loss": -27.869277954101562, "global_step": 574331, "epoch": 6919} {"train_loss": -28.030698776245117, "global_step": 574332, "epoch": 6919} {"train_loss": -27.896825790405273, "global_step": 574333, "epoch": 6919} {"train_loss": -27.844470977783203, "global_step": 574334, "epoch": 6919} {"train_loss": -28.08936882019043, "global_step": 574335, "epoch": 6919} {"train_loss": -28.24030876159668, "global_step": 574336, "epoch": 6919} {"train_loss": -27.661239624023438, "global_step": 574337, "epoch": 6919} {"train_loss": -28.20639991760254, "global_step": 574338, "epoch": 6919} {"train_loss": -27.728595733642578, "global_step": 574339, "epoch": 6919} {"train_loss": -28.216718673706055, "global_step": 574340, "epoch": 6919} {"train_loss": -28.317218780517578, "global_step": 574341, "epoch": 6919} {"train_loss": -28.11785316467285, "global_step": 574342, "epoch": 6919} {"train_loss": -28.332868576049805, "global_step": 574343, "epoch": 6919} {"train_loss": -28.316543579101562, "global_step": 574344, "epoch": 6919} {"train_loss": -28.265796661376953, "global_step": 574345, "epoch": 6919} {"train_loss": -28.017780303955078, "global_step": 574346, "epoch": 6919} {"train_loss": -28.104084014892578, "global_step": 574347, "epoch": 6919} {"train_loss": -28.30445671081543, "global_step": 574348, "epoch": 6919} {"train_loss": -28.231237411499023, "global_step": 574349, "epoch": 6919} {"train_loss": -27.921655654907227, "global_step": 574350, "epoch": 6919} {"train_loss": -28.137710571289062, "global_step": 574351, "epoch": 6919} {"train_loss": -27.45606803894043, "global_step": 574352, "epoch": 6919} {"train_loss": -27.837142944335938, "global_step": 574353, "epoch": 6919} {"train_loss": -27.84109878540039, "global_step": 574354, "epoch": 6919} {"train_loss": -27.80087661743164, "global_step": 574355, "epoch": 6919} {"train_loss": -28.31512451171875, "global_step": 574356, "epoch": 6919} {"train_loss": -27.91242790222168, "global_step": 574357, "epoch": 6919} {"train_loss": -27.567834854125977, "global_step": 574358, "epoch": 6919} {"train_loss": -27.821870206350304, "global_step": 574359, "epoch": 6919, "val_loss": 6533724.5} {"train_loss": -26.148258209228516, "global_step": 574360, "epoch": 6920} {"train_loss": -25.70829200744629, "global_step": 574361, "epoch": 6920} {"train_loss": -26.173765182495117, "global_step": 574362, "epoch": 6920} {"train_loss": -27.299808502197266, "global_step": 574363, "epoch": 6920} {"train_loss": -26.6519775390625, "global_step": 574364, "epoch": 6920} {"train_loss": -27.163604736328125, "global_step": 574365, "epoch": 6920} {"train_loss": -26.688217163085938, "global_step": 574366, "epoch": 6920} {"train_loss": -26.737384796142578, "global_step": 574367, "epoch": 6920} {"train_loss": -26.949827194213867, "global_step": 574368, "epoch": 6920} {"train_loss": -27.045490264892578, "global_step": 574369, "epoch": 6920} {"train_loss": -27.035154342651367, "global_step": 574370, "epoch": 6920} {"train_loss": -27.50819206237793, "global_step": 574371, "epoch": 6920} {"train_loss": -27.39276695251465, "global_step": 574372, "epoch": 6920} {"train_loss": -27.277118682861328, "global_step": 574373, "epoch": 6920} {"train_loss": -27.438108444213867, "global_step": 574374, "epoch": 6920} {"train_loss": -27.206140518188477, "global_step": 574375, "epoch": 6920} {"train_loss": -27.40009880065918, "global_step": 574376, "epoch": 6920} {"train_loss": -27.286706924438477, "global_step": 574377, "epoch": 6920} {"train_loss": -27.161481857299805, "global_step": 574378, "epoch": 6920} {"train_loss": -27.4012451171875, "global_step": 574379, "epoch": 6920} {"train_loss": -27.637258529663086, "global_step": 574380, "epoch": 6920} {"train_loss": -27.231342315673828, "global_step": 574381, "epoch": 6920} {"train_loss": -27.53066062927246, "global_step": 574382, "epoch": 6920} {"train_loss": -27.613800048828125, "global_step": 574383, "epoch": 6920} {"train_loss": -27.557025909423828, "global_step": 574384, "epoch": 6920} {"train_loss": -27.64715576171875, "global_step": 574385, "epoch": 6920} {"train_loss": -27.532150268554688, "global_step": 574386, "epoch": 6920} {"train_loss": -27.717426300048828, "global_step": 574387, "epoch": 6920} {"train_loss": -27.845361709594727, "global_step": 574388, "epoch": 6920} {"train_loss": -27.717466354370117, "global_step": 574389, "epoch": 6920} {"train_loss": -27.57325553894043, "global_step": 574390, "epoch": 6920} {"train_loss": -27.972986221313477, "global_step": 574391, "epoch": 6920} {"train_loss": -27.950485229492188, "global_step": 574392, "epoch": 6920} {"train_loss": -27.744794845581055, "global_step": 574393, "epoch": 6920} {"train_loss": -27.6855411529541, "global_step": 574394, "epoch": 6920} {"train_loss": -27.750568389892578, "global_step": 574395, "epoch": 6920} {"train_loss": -27.85492515563965, "global_step": 574396, "epoch": 6920} {"train_loss": -27.55683708190918, "global_step": 574397, "epoch": 6920} {"train_loss": -27.647409439086914, "global_step": 574398, "epoch": 6920} {"train_loss": -27.93191909790039, "global_step": 574399, "epoch": 6920} {"train_loss": -27.878494262695312, "global_step": 574400, "epoch": 6920} {"train_loss": -27.9705753326416, "global_step": 574401, "epoch": 6920} {"train_loss": -27.766271591186523, "global_step": 574402, "epoch": 6920} {"train_loss": -27.653818130493164, "global_step": 574403, "epoch": 6920} {"train_loss": -27.59185791015625, "global_step": 574404, "epoch": 6920} {"train_loss": -27.9605770111084, "global_step": 574405, "epoch": 6920} {"train_loss": -28.148120880126953, "global_step": 574406, "epoch": 6920} {"train_loss": -27.878570556640625, "global_step": 574407, "epoch": 6920} {"train_loss": -28.068479537963867, "global_step": 574408, "epoch": 6920} {"train_loss": -27.73122215270996, "global_step": 574409, "epoch": 6920} {"train_loss": -28.102331161499023, "global_step": 574410, "epoch": 6920} {"train_loss": -27.95552635192871, "global_step": 574411, "epoch": 6920} {"train_loss": -27.78114128112793, "global_step": 574412, "epoch": 6920} {"train_loss": -27.89385986328125, "global_step": 574413, "epoch": 6920} {"train_loss": -28.059040069580078, "global_step": 574414, "epoch": 6920} {"train_loss": -28.03142738342285, "global_step": 574415, "epoch": 6920} {"train_loss": -28.11052894592285, "global_step": 574416, "epoch": 6920} {"train_loss": -28.052648544311523, "global_step": 574417, "epoch": 6920} {"train_loss": -27.977874755859375, "global_step": 574418, "epoch": 6920} {"train_loss": -27.950122833251953, "global_step": 574419, "epoch": 6920} {"train_loss": -28.08680534362793, "global_step": 574420, "epoch": 6920} {"train_loss": -27.785816192626953, "global_step": 574421, "epoch": 6920} {"train_loss": -27.97760581970215, "global_step": 574422, "epoch": 6920} {"train_loss": -28.384923934936523, "global_step": 574423, "epoch": 6920} {"train_loss": -27.985794067382812, "global_step": 574424, "epoch": 6920} {"train_loss": -27.755735397338867, "global_step": 574425, "epoch": 6920} {"train_loss": -27.17660903930664, "global_step": 574426, "epoch": 6920} {"train_loss": -27.371051788330078, "global_step": 574427, "epoch": 6920} {"train_loss": -27.785924911499023, "global_step": 574428, "epoch": 6920} {"train_loss": -27.813858032226562, "global_step": 574429, "epoch": 6920} {"train_loss": -27.64295768737793, "global_step": 574430, "epoch": 6920} {"train_loss": -27.696462631225586, "global_step": 574431, "epoch": 6920} {"train_loss": -27.781192779541016, "global_step": 574432, "epoch": 6920} {"train_loss": -28.376712799072266, "global_step": 574433, "epoch": 6920} {"train_loss": -27.972461700439453, "global_step": 574434, "epoch": 6920} {"train_loss": -27.781198501586914, "global_step": 574435, "epoch": 6920} {"train_loss": -27.77058982849121, "global_step": 574436, "epoch": 6920} {"train_loss": -27.575834274291992, "global_step": 574437, "epoch": 6920} {"train_loss": -27.98748207092285, "global_step": 574438, "epoch": 6920} {"train_loss": -28.072940826416016, "global_step": 574439, "epoch": 6920} {"train_loss": -27.762842178344727, "global_step": 574440, "epoch": 6920} {"train_loss": -28.113006591796875, "global_step": 574441, "epoch": 6920} {"train_loss": -27.625625863132708, "global_step": 574442, "epoch": 6920, "val_loss": 6487648.5} {"train_loss": -27.312997817993164, "global_step": 574443, "epoch": 6921} {"train_loss": -27.472631454467773, "global_step": 574444, "epoch": 6921} {"train_loss": -27.130239486694336, "global_step": 574445, "epoch": 6921} {"train_loss": -27.18329429626465, "global_step": 574446, "epoch": 6921} {"train_loss": -27.746795654296875, "global_step": 574447, "epoch": 6921} {"train_loss": -27.364521026611328, "global_step": 574448, "epoch": 6921} {"train_loss": -27.189697265625, "global_step": 574449, "epoch": 6921} {"train_loss": -27.146839141845703, "global_step": 574450, "epoch": 6921} {"train_loss": -27.200788497924805, "global_step": 574451, "epoch": 6921} {"train_loss": -27.595458984375, "global_step": 574452, "epoch": 6921} {"train_loss": -27.441858291625977, "global_step": 574453, "epoch": 6921} {"train_loss": -27.278833389282227, "global_step": 574454, "epoch": 6921} {"train_loss": -27.98801040649414, "global_step": 574455, "epoch": 6921} {"train_loss": -27.550373077392578, "global_step": 574456, "epoch": 6921} {"train_loss": -27.869140625, "global_step": 574457, "epoch": 6921} {"train_loss": -27.756555557250977, "global_step": 574458, "epoch": 6921} {"train_loss": -27.80238151550293, "global_step": 574459, "epoch": 6921} {"train_loss": -27.52454948425293, "global_step": 574460, "epoch": 6921} {"train_loss": -27.756412506103516, "global_step": 574461, "epoch": 6921} {"train_loss": -27.644927978515625, "global_step": 574462, "epoch": 6921} {"train_loss": -27.595563888549805, "global_step": 574463, "epoch": 6921} {"train_loss": -27.591724395751953, "global_step": 574464, "epoch": 6921} {"train_loss": -27.866291046142578, "global_step": 574465, "epoch": 6921} {"train_loss": -28.0338077545166, "global_step": 574466, "epoch": 6921} {"train_loss": -28.197967529296875, "global_step": 574467, "epoch": 6921} {"train_loss": -27.861881256103516, "global_step": 574468, "epoch": 6921} {"train_loss": -27.834857940673828, "global_step": 574469, "epoch": 6921} {"train_loss": -27.950353622436523, "global_step": 574470, "epoch": 6921} {"train_loss": -27.544937133789062, "global_step": 574471, "epoch": 6921} {"train_loss": -27.833572387695312, "global_step": 574472, "epoch": 6921} {"train_loss": -27.995197296142578, "global_step": 574473, "epoch": 6921} {"train_loss": -28.122211456298828, "global_step": 574474, "epoch": 6921} {"train_loss": -27.732221603393555, "global_step": 574475, "epoch": 6921} {"train_loss": -27.9023494720459, "global_step": 574476, "epoch": 6921} {"train_loss": -27.5609188079834, "global_step": 574477, "epoch": 6921} {"train_loss": -28.007251739501953, "global_step": 574478, "epoch": 6921} {"train_loss": -27.75312614440918, "global_step": 574479, "epoch": 6921} {"train_loss": -27.83538246154785, "global_step": 574480, "epoch": 6921} {"train_loss": -27.82038688659668, "global_step": 574481, "epoch": 6921} {"train_loss": -27.955066680908203, "global_step": 574482, "epoch": 6921} {"train_loss": -27.703649520874023, "global_step": 574483, "epoch": 6921} {"train_loss": -27.897235870361328, "global_step": 574484, "epoch": 6921} {"train_loss": -28.043033599853516, "global_step": 574485, "epoch": 6921} {"train_loss": -28.081151962280273, "global_step": 574486, "epoch": 6921} {"train_loss": -27.8847713470459, "global_step": 574487, "epoch": 6921} {"train_loss": -27.975128173828125, "global_step": 574488, "epoch": 6921} {"train_loss": -28.356008529663086, "global_step": 574489, "epoch": 6921} {"train_loss": -27.68214225769043, "global_step": 574490, "epoch": 6921} {"train_loss": -28.289031982421875, "global_step": 574491, "epoch": 6921} {"train_loss": -27.867658615112305, "global_step": 574492, "epoch": 6921} {"train_loss": -28.187835693359375, "global_step": 574493, "epoch": 6921} {"train_loss": -28.153945922851562, "global_step": 574494, "epoch": 6921} {"train_loss": -27.784534454345703, "global_step": 574495, "epoch": 6921} {"train_loss": -27.876962661743164, "global_step": 574496, "epoch": 6921} {"train_loss": -28.156240463256836, "global_step": 574497, "epoch": 6921} {"train_loss": -28.060453414916992, "global_step": 574498, "epoch": 6921} {"train_loss": -27.617584228515625, "global_step": 574499, "epoch": 6921} {"train_loss": -27.66769790649414, "global_step": 574500, "epoch": 6921} {"train_loss": -27.686994552612305, "global_step": 574501, "epoch": 6921} {"train_loss": -28.234601974487305, "global_step": 574502, "epoch": 6921} {"train_loss": -28.055362701416016, "global_step": 574503, "epoch": 6921} {"train_loss": -27.420154571533203, "global_step": 574504, "epoch": 6921} {"train_loss": -27.845258712768555, "global_step": 574505, "epoch": 6921} {"train_loss": -28.003265380859375, "global_step": 574506, "epoch": 6921} {"train_loss": -27.803211212158203, "global_step": 574507, "epoch": 6921} {"train_loss": -28.065174102783203, "global_step": 574508, "epoch": 6921} {"train_loss": -27.736515045166016, "global_step": 574509, "epoch": 6921} {"train_loss": -27.812885284423828, "global_step": 574510, "epoch": 6921} {"train_loss": -27.81130027770996, "global_step": 574511, "epoch": 6921} {"train_loss": -27.947345733642578, "global_step": 574512, "epoch": 6921} {"train_loss": -28.15293312072754, "global_step": 574513, "epoch": 6921} {"train_loss": -28.261890411376953, "global_step": 574514, "epoch": 6921} {"train_loss": -28.026477813720703, "global_step": 574515, "epoch": 6921} {"train_loss": -27.914419174194336, "global_step": 574516, "epoch": 6921} {"train_loss": -28.150226593017578, "global_step": 574517, "epoch": 6921} {"train_loss": -27.48895835876465, "global_step": 574518, "epoch": 6921} {"train_loss": -27.222482681274414, "global_step": 574519, "epoch": 6921} {"train_loss": -27.42775535583496, "global_step": 574520, "epoch": 6921} {"train_loss": -27.131946563720703, "global_step": 574521, "epoch": 6921} {"train_loss": -27.8013973236084, "global_step": 574522, "epoch": 6921} {"train_loss": -27.824512481689453, "global_step": 574523, "epoch": 6921} {"train_loss": -28.2047061920166, "global_step": 574524, "epoch": 6921} {"train_loss": -27.780561332243035, "global_step": 574525, "epoch": 6921, "val_loss": 6474063.0} {"train_loss": -27.6909122467041, "global_step": 574526, "epoch": 6922} {"train_loss": -26.825910568237305, "global_step": 574527, "epoch": 6922} {"train_loss": -27.763843536376953, "global_step": 574528, "epoch": 6922} {"train_loss": -27.230426788330078, "global_step": 574529, "epoch": 6922} {"train_loss": -27.0225887298584, "global_step": 574530, "epoch": 6922} {"train_loss": -27.152292251586914, "global_step": 574531, "epoch": 6922} {"train_loss": -27.400394439697266, "global_step": 574532, "epoch": 6922} {"train_loss": -27.56281852722168, "global_step": 574533, "epoch": 6922} {"train_loss": -26.907819747924805, "global_step": 574534, "epoch": 6922} {"train_loss": -27.29117774963379, "global_step": 574535, "epoch": 6922} {"train_loss": -27.599546432495117, "global_step": 574536, "epoch": 6922} {"train_loss": -27.262842178344727, "global_step": 574537, "epoch": 6922} {"train_loss": -26.8039493560791, "global_step": 574538, "epoch": 6922} {"train_loss": -27.522741317749023, "global_step": 574539, "epoch": 6922} {"train_loss": -27.356769561767578, "global_step": 574540, "epoch": 6922} {"train_loss": -27.638181686401367, "global_step": 574541, "epoch": 6922} {"train_loss": -27.649328231811523, "global_step": 574542, "epoch": 6922} {"train_loss": -27.047513961791992, "global_step": 574543, "epoch": 6922} {"train_loss": -27.713947296142578, "global_step": 574544, "epoch": 6922} {"train_loss": -27.350849151611328, "global_step": 574545, "epoch": 6922} {"train_loss": -27.506738662719727, "global_step": 574546, "epoch": 6922} {"train_loss": -27.56473159790039, "global_step": 574547, "epoch": 6922} {"train_loss": -27.459503173828125, "global_step": 574548, "epoch": 6922} {"train_loss": -27.653608322143555, "global_step": 574549, "epoch": 6922} {"train_loss": -27.617725372314453, "global_step": 574550, "epoch": 6922} {"train_loss": -27.836606979370117, "global_step": 574551, "epoch": 6922} {"train_loss": -27.50055503845215, "global_step": 574552, "epoch": 6922} {"train_loss": -28.100385665893555, "global_step": 574553, "epoch": 6922} {"train_loss": -27.55403709411621, "global_step": 574554, "epoch": 6922} {"train_loss": -27.875812530517578, "global_step": 574555, "epoch": 6922} {"train_loss": -27.74897575378418, "global_step": 574556, "epoch": 6922} {"train_loss": -28.03557777404785, "global_step": 574557, "epoch": 6922} {"train_loss": -28.087650299072266, "global_step": 574558, "epoch": 6922} {"train_loss": -27.908727645874023, "global_step": 574559, "epoch": 6922} {"train_loss": -27.446935653686523, "global_step": 574560, "epoch": 6922} {"train_loss": -27.866613388061523, "global_step": 574561, "epoch": 6922} {"train_loss": -27.977697372436523, "global_step": 574562, "epoch": 6922} {"train_loss": -27.686279296875, "global_step": 574563, "epoch": 6922} {"train_loss": -27.573856353759766, "global_step": 574564, "epoch": 6922} {"train_loss": -27.852685928344727, "global_step": 574565, "epoch": 6922} {"train_loss": -27.859485626220703, "global_step": 574566, "epoch": 6922} {"train_loss": -28.109241485595703, "global_step": 574567, "epoch": 6922} {"train_loss": -27.524505615234375, "global_step": 574568, "epoch": 6922} {"train_loss": -27.412328720092773, "global_step": 574569, "epoch": 6922} {"train_loss": -27.599822998046875, "global_step": 574570, "epoch": 6922} {"train_loss": -27.756982803344727, "global_step": 574571, "epoch": 6922} {"train_loss": -27.875417709350586, "global_step": 574572, "epoch": 6922} {"train_loss": -27.900808334350586, "global_step": 574573, "epoch": 6922} {"train_loss": -27.848663330078125, "global_step": 574574, "epoch": 6922} {"train_loss": -27.884063720703125, "global_step": 574575, "epoch": 6922} {"train_loss": -28.0382022857666, "global_step": 574576, "epoch": 6922} {"train_loss": -27.772216796875, "global_step": 574577, "epoch": 6922} {"train_loss": -28.031890869140625, "global_step": 574578, "epoch": 6922} {"train_loss": -28.297571182250977, "global_step": 574579, "epoch": 6922} {"train_loss": -27.719675064086914, "global_step": 574580, "epoch": 6922} {"train_loss": -28.203540802001953, "global_step": 574581, "epoch": 6922} {"train_loss": -27.9171199798584, "global_step": 574582, "epoch": 6922} {"train_loss": -28.088123321533203, "global_step": 574583, "epoch": 6922} {"train_loss": -28.191022872924805, "global_step": 574584, "epoch": 6922} {"train_loss": -27.96016502380371, "global_step": 574585, "epoch": 6922} {"train_loss": -28.390607833862305, "global_step": 574586, "epoch": 6922} {"train_loss": -28.336292266845703, "global_step": 574587, "epoch": 6922} {"train_loss": -27.729114532470703, "global_step": 574588, "epoch": 6922} {"train_loss": -27.91180992126465, "global_step": 574589, "epoch": 6922} {"train_loss": -27.912817001342773, "global_step": 574590, "epoch": 6922} {"train_loss": -27.856689453125, "global_step": 574591, "epoch": 6922} {"train_loss": -27.97001075744629, "global_step": 574592, "epoch": 6922} {"train_loss": -28.448139190673828, "global_step": 574593, "epoch": 6922} {"train_loss": -28.186187744140625, "global_step": 574594, "epoch": 6922} {"train_loss": -28.067584991455078, "global_step": 574595, "epoch": 6922} {"train_loss": -27.97871208190918, "global_step": 574596, "epoch": 6922} {"train_loss": -28.031024932861328, "global_step": 574597, "epoch": 6922} {"train_loss": -28.430654525756836, "global_step": 574598, "epoch": 6922} {"train_loss": -27.650421142578125, "global_step": 574599, "epoch": 6922} {"train_loss": -27.46461296081543, "global_step": 574600, "epoch": 6922} {"train_loss": -27.3946475982666, "global_step": 574601, "epoch": 6922} {"train_loss": -27.5462646484375, "global_step": 574602, "epoch": 6922} {"train_loss": -28.05573844909668, "global_step": 574603, "epoch": 6922} {"train_loss": -28.135915756225586, "global_step": 574604, "epoch": 6922} {"train_loss": -27.835973739624023, "global_step": 574605, "epoch": 6922} {"train_loss": -28.13590431213379, "global_step": 574606, "epoch": 6922} {"train_loss": -28.101499557495117, "global_step": 574607, "epoch": 6922} {"train_loss": -27.750642753509155, "global_step": 574608, "epoch": 6922, "val_loss": 6483320.0} {"train_loss": -27.68610954284668, "global_step": 574609, "epoch": 6923} {"train_loss": -27.26091957092285, "global_step": 574610, "epoch": 6923} {"train_loss": -27.1446475982666, "global_step": 574611, "epoch": 6923} {"train_loss": -27.621118545532227, "global_step": 574612, "epoch": 6923} {"train_loss": -27.715551376342773, "global_step": 574613, "epoch": 6923} {"train_loss": -28.019559860229492, "global_step": 574614, "epoch": 6923} {"train_loss": -27.566965103149414, "global_step": 574615, "epoch": 6923} {"train_loss": -27.448251724243164, "global_step": 574616, "epoch": 6923} {"train_loss": -27.88804054260254, "global_step": 574617, "epoch": 6923} {"train_loss": -27.860687255859375, "global_step": 574618, "epoch": 6923} {"train_loss": -27.729175567626953, "global_step": 574619, "epoch": 6923} {"train_loss": -27.6341609954834, "global_step": 574620, "epoch": 6923} {"train_loss": -27.500341415405273, "global_step": 574621, "epoch": 6923} {"train_loss": -27.719757080078125, "global_step": 574622, "epoch": 6923} {"train_loss": -28.002866744995117, "global_step": 574623, "epoch": 6923} {"train_loss": -27.562137603759766, "global_step": 574624, "epoch": 6923} {"train_loss": -27.849817276000977, "global_step": 574625, "epoch": 6923} {"train_loss": -27.925537109375, "global_step": 574626, "epoch": 6923} {"train_loss": -27.813955307006836, "global_step": 574627, "epoch": 6923} {"train_loss": -28.097692489624023, "global_step": 574628, "epoch": 6923} {"train_loss": -28.078479766845703, "global_step": 574629, "epoch": 6923} {"train_loss": -27.881498336791992, "global_step": 574630, "epoch": 6923} {"train_loss": -27.6158390045166, "global_step": 574631, "epoch": 6923} {"train_loss": -27.767847061157227, "global_step": 574632, "epoch": 6923} {"train_loss": -27.708227157592773, "global_step": 574633, "epoch": 6923} {"train_loss": -28.26568031311035, "global_step": 574634, "epoch": 6923} {"train_loss": -27.71527099609375, "global_step": 574635, "epoch": 6923} {"train_loss": -28.088956832885742, "global_step": 574636, "epoch": 6923} {"train_loss": -27.897430419921875, "global_step": 574637, "epoch": 6923} {"train_loss": -27.795019149780273, "global_step": 574638, "epoch": 6923} {"train_loss": -27.99186134338379, "global_step": 574639, "epoch": 6923} {"train_loss": -27.455106735229492, "global_step": 574640, "epoch": 6923} {"train_loss": -27.78497314453125, "global_step": 574641, "epoch": 6923} {"train_loss": -27.7279052734375, "global_step": 574642, "epoch": 6923} {"train_loss": -27.74637794494629, "global_step": 574643, "epoch": 6923} {"train_loss": -28.213470458984375, "global_step": 574644, "epoch": 6923} {"train_loss": -27.635055541992188, "global_step": 574645, "epoch": 6923} {"train_loss": -27.83391761779785, "global_step": 574646, "epoch": 6923} {"train_loss": -27.891759872436523, "global_step": 574647, "epoch": 6923} {"train_loss": -28.02618980407715, "global_step": 574648, "epoch": 6923} {"train_loss": -28.313566207885742, "global_step": 574649, "epoch": 6923} {"train_loss": -27.7618350982666, "global_step": 574650, "epoch": 6923} {"train_loss": -27.851078033447266, "global_step": 574651, "epoch": 6923} {"train_loss": -28.010318756103516, "global_step": 574652, "epoch": 6923} {"train_loss": -28.028738021850586, "global_step": 574653, "epoch": 6923} {"train_loss": -28.15228843688965, "global_step": 574654, "epoch": 6923} {"train_loss": -28.004474639892578, "global_step": 574655, "epoch": 6923} {"train_loss": -28.018512725830078, "global_step": 574656, "epoch": 6923} {"train_loss": -27.83371925354004, "global_step": 574657, "epoch": 6923} {"train_loss": -27.848031997680664, "global_step": 574658, "epoch": 6923} {"train_loss": -28.049341201782227, "global_step": 574659, "epoch": 6923} {"train_loss": -28.113754272460938, "global_step": 574660, "epoch": 6923} {"train_loss": -27.7885799407959, "global_step": 574661, "epoch": 6923} {"train_loss": -27.757781982421875, "global_step": 574662, "epoch": 6923} {"train_loss": -27.949695587158203, "global_step": 574663, "epoch": 6923} {"train_loss": -28.07708740234375, "global_step": 574664, "epoch": 6923} {"train_loss": -28.094907760620117, "global_step": 574665, "epoch": 6923} {"train_loss": -27.921680450439453, "global_step": 574666, "epoch": 6923} {"train_loss": -27.901447296142578, "global_step": 574667, "epoch": 6923} {"train_loss": -27.91265296936035, "global_step": 574668, "epoch": 6923} {"train_loss": -27.807743072509766, "global_step": 574669, "epoch": 6923} {"train_loss": -27.394556045532227, "global_step": 574670, "epoch": 6923} {"train_loss": -27.886737823486328, "global_step": 574671, "epoch": 6923} {"train_loss": -28.1490535736084, "global_step": 574672, "epoch": 6923} {"train_loss": -27.4831485748291, "global_step": 574673, "epoch": 6923} {"train_loss": -26.521703720092773, "global_step": 574674, "epoch": 6923} {"train_loss": -26.73172378540039, "global_step": 574675, "epoch": 6923} {"train_loss": -27.068729400634766, "global_step": 574676, "epoch": 6923} {"train_loss": -26.24698257446289, "global_step": 574677, "epoch": 6923} {"train_loss": -27.1660213470459, "global_step": 574678, "epoch": 6923} {"train_loss": -26.791425704956055, "global_step": 574679, "epoch": 6923} {"train_loss": -26.3920841217041, "global_step": 574680, "epoch": 6923} {"train_loss": -27.19162368774414, "global_step": 574681, "epoch": 6923} {"train_loss": -27.216367721557617, "global_step": 574682, "epoch": 6923} {"train_loss": -27.309171676635742, "global_step": 574683, "epoch": 6923} {"train_loss": -26.64088249206543, "global_step": 574684, "epoch": 6923} {"train_loss": -27.49030113220215, "global_step": 574685, "epoch": 6923} {"train_loss": -27.301639556884766, "global_step": 574686, "epoch": 6923} {"train_loss": -27.07613182067871, "global_step": 574687, "epoch": 6923} {"train_loss": -27.531171798706055, "global_step": 574688, "epoch": 6923} {"train_loss": -27.469446182250977, "global_step": 574689, "epoch": 6923} {"train_loss": -27.40629005432129, "global_step": 574690, "epoch": 6923} {"train_loss": -27.654615149440534, "global_step": 574691, "epoch": 6923, "val_loss": 6483227.0} {"train_loss": -27.17911148071289, "global_step": 574692, "epoch": 6924} {"train_loss": -26.82461929321289, "global_step": 574693, "epoch": 6924} {"train_loss": -26.753889083862305, "global_step": 574694, "epoch": 6924} {"train_loss": -27.1745662689209, "global_step": 574695, "epoch": 6924} {"train_loss": -27.005945205688477, "global_step": 574696, "epoch": 6924} {"train_loss": -27.137989044189453, "global_step": 574697, "epoch": 6924} {"train_loss": -27.069665908813477, "global_step": 574698, "epoch": 6924} {"train_loss": -27.323287963867188, "global_step": 574699, "epoch": 6924} {"train_loss": -27.249448776245117, "global_step": 574700, "epoch": 6924} {"train_loss": -27.33321189880371, "global_step": 574701, "epoch": 6924} {"train_loss": -27.392663955688477, "global_step": 574702, "epoch": 6924} {"train_loss": -27.700366973876953, "global_step": 574703, "epoch": 6924} {"train_loss": -27.812036514282227, "global_step": 574704, "epoch": 6924} {"train_loss": -27.517932891845703, "global_step": 574705, "epoch": 6924} {"train_loss": -27.535675048828125, "global_step": 574706, "epoch": 6924} {"train_loss": -27.491464614868164, "global_step": 574707, "epoch": 6924} {"train_loss": -27.744461059570312, "global_step": 574708, "epoch": 6924} {"train_loss": -27.648096084594727, "global_step": 574709, "epoch": 6924} {"train_loss": -27.485815048217773, "global_step": 574710, "epoch": 6924} {"train_loss": -27.693281173706055, "global_step": 574711, "epoch": 6924} {"train_loss": -27.694807052612305, "global_step": 574712, "epoch": 6924} {"train_loss": -27.401533126831055, "global_step": 574713, "epoch": 6924} {"train_loss": -27.329330444335938, "global_step": 574714, "epoch": 6924} {"train_loss": -27.635828018188477, "global_step": 574715, "epoch": 6924} {"train_loss": -27.8651065826416, "global_step": 574716, "epoch": 6924} {"train_loss": -27.765722274780273, "global_step": 574717, "epoch": 6924} {"train_loss": -27.729543685913086, "global_step": 574718, "epoch": 6924} {"train_loss": -27.745229721069336, "global_step": 574719, "epoch": 6924} {"train_loss": -27.60407066345215, "global_step": 574720, "epoch": 6924} {"train_loss": -27.93047523498535, "global_step": 574721, "epoch": 6924} {"train_loss": -27.85068130493164, "global_step": 574722, "epoch": 6924} {"train_loss": -27.8348331451416, "global_step": 574723, "epoch": 6924} {"train_loss": -27.77975845336914, "global_step": 574724, "epoch": 6924} {"train_loss": -27.763330459594727, "global_step": 574725, "epoch": 6924} {"train_loss": -28.058923721313477, "global_step": 574726, "epoch": 6924} {"train_loss": -27.581207275390625, "global_step": 574727, "epoch": 6924} {"train_loss": -28.279829025268555, "global_step": 574728, "epoch": 6924} {"train_loss": -28.21514892578125, "global_step": 574729, "epoch": 6924} {"train_loss": -28.0700626373291, "global_step": 574730, "epoch": 6924} {"train_loss": -27.78815269470215, "global_step": 574731, "epoch": 6924} {"train_loss": -28.05575942993164, "global_step": 574732, "epoch": 6924} {"train_loss": -27.85390281677246, "global_step": 574733, "epoch": 6924} {"train_loss": -27.950830459594727, "global_step": 574734, "epoch": 6924} {"train_loss": -27.9588623046875, "global_step": 574735, "epoch": 6924} {"train_loss": -28.363882064819336, "global_step": 574736, "epoch": 6924} {"train_loss": -28.256591796875, "global_step": 574737, "epoch": 6924} {"train_loss": -27.724695205688477, "global_step": 574738, "epoch": 6924} {"train_loss": -28.235754013061523, "global_step": 574739, "epoch": 6924} {"train_loss": -28.053674697875977, "global_step": 574740, "epoch": 6924} {"train_loss": -27.99452018737793, "global_step": 574741, "epoch": 6924} {"train_loss": -27.56583023071289, "global_step": 574742, "epoch": 6924} {"train_loss": -28.1473331451416, "global_step": 574743, "epoch": 6924} {"train_loss": -27.80132484436035, "global_step": 574744, "epoch": 6924} {"train_loss": -28.07387351989746, "global_step": 574745, "epoch": 6924} {"train_loss": -27.815704345703125, "global_step": 574746, "epoch": 6924} {"train_loss": -28.069183349609375, "global_step": 574747, "epoch": 6924} {"train_loss": -28.42523765563965, "global_step": 574748, "epoch": 6924} {"train_loss": -27.978134155273438, "global_step": 574749, "epoch": 6924} {"train_loss": -28.22334098815918, "global_step": 574750, "epoch": 6924} {"train_loss": -28.17359733581543, "global_step": 574751, "epoch": 6924} {"train_loss": -27.21588706970215, "global_step": 574752, "epoch": 6924} {"train_loss": -27.481918334960938, "global_step": 574753, "epoch": 6924} {"train_loss": -28.216665267944336, "global_step": 574754, "epoch": 6924} {"train_loss": -27.79213523864746, "global_step": 574755, "epoch": 6924} {"train_loss": -27.34309196472168, "global_step": 574756, "epoch": 6924} {"train_loss": -28.17152214050293, "global_step": 574757, "epoch": 6924} {"train_loss": -27.03508949279785, "global_step": 574758, "epoch": 6924} {"train_loss": -27.910245895385742, "global_step": 574759, "epoch": 6924} {"train_loss": -27.373090744018555, "global_step": 574760, "epoch": 6924} {"train_loss": -27.87738609313965, "global_step": 574761, "epoch": 6924} {"train_loss": -27.64422607421875, "global_step": 574762, "epoch": 6924} {"train_loss": -27.79697608947754, "global_step": 574763, "epoch": 6924} {"train_loss": -28.213834762573242, "global_step": 574764, "epoch": 6924} {"train_loss": -27.84954261779785, "global_step": 574765, "epoch": 6924} {"train_loss": -27.739057540893555, "global_step": 574766, "epoch": 6924} {"train_loss": -28.000925064086914, "global_step": 574767, "epoch": 6924} {"train_loss": -27.808761596679688, "global_step": 574768, "epoch": 6924} {"train_loss": -27.79326820373535, "global_step": 574769, "epoch": 6924} {"train_loss": -27.886133193969727, "global_step": 574770, "epoch": 6924} {"train_loss": -27.784326553344727, "global_step": 574771, "epoch": 6924} {"train_loss": -27.237247467041016, "global_step": 574772, "epoch": 6924} {"train_loss": -27.74709129333496, "global_step": 574773, "epoch": 6924} {"train_loss": -27.72583839692265, "global_step": 574774, "epoch": 6924, "val_loss": 6567005.0} {"train_loss": -26.51093101501465, "global_step": 574775, "epoch": 6925} {"train_loss": -26.144412994384766, "global_step": 574776, "epoch": 6925} {"train_loss": -26.759939193725586, "global_step": 574777, "epoch": 6925} {"train_loss": -27.25701332092285, "global_step": 574778, "epoch": 6925} {"train_loss": -26.1838321685791, "global_step": 574779, "epoch": 6925} {"train_loss": -27.02418327331543, "global_step": 574780, "epoch": 6925} {"train_loss": -27.0117244720459, "global_step": 574781, "epoch": 6925} {"train_loss": -27.16200065612793, "global_step": 574782, "epoch": 6925} {"train_loss": -27.096296310424805, "global_step": 574783, "epoch": 6925} {"train_loss": -27.41684341430664, "global_step": 574784, "epoch": 6925} {"train_loss": -27.49799919128418, "global_step": 574785, "epoch": 6925} {"train_loss": -27.494293212890625, "global_step": 574786, "epoch": 6925} {"train_loss": -27.099594116210938, "global_step": 574787, "epoch": 6925} {"train_loss": -27.507471084594727, "global_step": 574788, "epoch": 6925} {"train_loss": -27.0023136138916, "global_step": 574789, "epoch": 6925} {"train_loss": -28.022241592407227, "global_step": 574790, "epoch": 6925} {"train_loss": -27.129743576049805, "global_step": 574791, "epoch": 6925} {"train_loss": -27.425220489501953, "global_step": 574792, "epoch": 6925} {"train_loss": -27.6389217376709, "global_step": 574793, "epoch": 6925} {"train_loss": -27.26531982421875, "global_step": 574794, "epoch": 6925} {"train_loss": -27.789844512939453, "global_step": 574795, "epoch": 6925} {"train_loss": -27.046527862548828, "global_step": 574796, "epoch": 6925} {"train_loss": -27.331897735595703, "global_step": 574797, "epoch": 6925} {"train_loss": -27.30817222595215, "global_step": 574798, "epoch": 6925} {"train_loss": -27.66559410095215, "global_step": 574799, "epoch": 6925} {"train_loss": -27.505786895751953, "global_step": 574800, "epoch": 6925} {"train_loss": -27.57328224182129, "global_step": 574801, "epoch": 6925} {"train_loss": -27.621789932250977, "global_step": 574802, "epoch": 6925} {"train_loss": -27.84173011779785, "global_step": 574803, "epoch": 6925} {"train_loss": -27.780689239501953, "global_step": 574804, "epoch": 6925} {"train_loss": -27.8845272064209, "global_step": 574805, "epoch": 6925} {"train_loss": -28.087976455688477, "global_step": 574806, "epoch": 6925} {"train_loss": -27.67188835144043, "global_step": 574807, "epoch": 6925} {"train_loss": -27.797937393188477, "global_step": 574808, "epoch": 6925} {"train_loss": -27.48813247680664, "global_step": 574809, "epoch": 6925} {"train_loss": -27.79438591003418, "global_step": 574810, "epoch": 6925} {"train_loss": -28.109373092651367, "global_step": 574811, "epoch": 6925} {"train_loss": -27.866596221923828, "global_step": 574812, "epoch": 6925} {"train_loss": -28.38750648498535, "global_step": 574813, "epoch": 6925} {"train_loss": -28.087814331054688, "global_step": 574814, "epoch": 6925} {"train_loss": -27.91440773010254, "global_step": 574815, "epoch": 6925} {"train_loss": -28.121641159057617, "global_step": 574816, "epoch": 6925} {"train_loss": -27.705677032470703, "global_step": 574817, "epoch": 6925} {"train_loss": -28.209543228149414, "global_step": 574818, "epoch": 6925} {"train_loss": -27.940948486328125, "global_step": 574819, "epoch": 6925} {"train_loss": -27.996408462524414, "global_step": 574820, "epoch": 6925} {"train_loss": -27.924259185791016, "global_step": 574821, "epoch": 6925} {"train_loss": -28.281158447265625, "global_step": 574822, "epoch": 6925} {"train_loss": -28.050994873046875, "global_step": 574823, "epoch": 6925} {"train_loss": -28.360387802124023, "global_step": 574824, "epoch": 6925} {"train_loss": -28.02435874938965, "global_step": 574825, "epoch": 6925} {"train_loss": -27.85276222229004, "global_step": 574826, "epoch": 6925} {"train_loss": -28.185590744018555, "global_step": 574827, "epoch": 6925} {"train_loss": -28.277509689331055, "global_step": 574828, "epoch": 6925} {"train_loss": -28.08355712890625, "global_step": 574829, "epoch": 6925} {"train_loss": -27.894739151000977, "global_step": 574830, "epoch": 6925} {"train_loss": -27.862537384033203, "global_step": 574831, "epoch": 6925} {"train_loss": -28.0526065826416, "global_step": 574832, "epoch": 6925} {"train_loss": -28.009428024291992, "global_step": 574833, "epoch": 6925} {"train_loss": -27.717529296875, "global_step": 574834, "epoch": 6925} {"train_loss": -28.065832138061523, "global_step": 574835, "epoch": 6925} {"train_loss": -28.42618751525879, "global_step": 574836, "epoch": 6925} {"train_loss": -28.22861099243164, "global_step": 574837, "epoch": 6925} {"train_loss": -27.972244262695312, "global_step": 574838, "epoch": 6925} {"train_loss": -27.926959991455078, "global_step": 574839, "epoch": 6925} {"train_loss": -27.814422607421875, "global_step": 574840, "epoch": 6925} {"train_loss": -27.982467651367188, "global_step": 574841, "epoch": 6925} {"train_loss": -27.624265670776367, "global_step": 574842, "epoch": 6925} {"train_loss": -27.71439552307129, "global_step": 574843, "epoch": 6925} {"train_loss": -27.957433700561523, "global_step": 574844, "epoch": 6925} {"train_loss": -28.158193588256836, "global_step": 574845, "epoch": 6925} {"train_loss": -28.090682983398438, "global_step": 574846, "epoch": 6925} {"train_loss": -28.208276748657227, "global_step": 574847, "epoch": 6925} {"train_loss": -28.203344345092773, "global_step": 574848, "epoch": 6925} {"train_loss": -28.358001708984375, "global_step": 574849, "epoch": 6925} {"train_loss": -27.9804630279541, "global_step": 574850, "epoch": 6925} {"train_loss": -27.862863540649414, "global_step": 574851, "epoch": 6925} {"train_loss": -28.075223922729492, "global_step": 574852, "epoch": 6925} {"train_loss": -28.035505294799805, "global_step": 574853, "epoch": 6925} {"train_loss": -28.296466827392578, "global_step": 574854, "epoch": 6925} {"train_loss": -28.354333877563477, "global_step": 574855, "epoch": 6925} {"train_loss": -28.326557159423828, "global_step": 574856, "epoch": 6925} {"train_loss": -27.753038705113422, "global_step": 574857, "epoch": 6925, "val_loss": 6446699.0} {"train_loss": -27.17182731628418, "global_step": 574858, "epoch": 6926} {"train_loss": -27.095294952392578, "global_step": 574859, "epoch": 6926} {"train_loss": -27.115331649780273, "global_step": 574860, "epoch": 6926} {"train_loss": -25.97358512878418, "global_step": 574861, "epoch": 6926} {"train_loss": -26.54819679260254, "global_step": 574862, "epoch": 6926} {"train_loss": -26.787145614624023, "global_step": 574863, "epoch": 6926} {"train_loss": -26.408802032470703, "global_step": 574864, "epoch": 6926} {"train_loss": -27.0048828125, "global_step": 574865, "epoch": 6926} {"train_loss": -26.720661163330078, "global_step": 574866, "epoch": 6926} {"train_loss": -26.711872100830078, "global_step": 574867, "epoch": 6926} {"train_loss": -26.883426666259766, "global_step": 574868, "epoch": 6926} {"train_loss": -26.5401554107666, "global_step": 574869, "epoch": 6926} {"train_loss": -27.397993087768555, "global_step": 574870, "epoch": 6926} {"train_loss": -26.766630172729492, "global_step": 574871, "epoch": 6926} {"train_loss": -27.385818481445312, "global_step": 574872, "epoch": 6926} {"train_loss": -27.167694091796875, "global_step": 574873, "epoch": 6926} {"train_loss": -27.079559326171875, "global_step": 574874, "epoch": 6926} {"train_loss": -27.247821807861328, "global_step": 574875, "epoch": 6926} {"train_loss": -27.445112228393555, "global_step": 574876, "epoch": 6926} {"train_loss": -27.48306655883789, "global_step": 574877, "epoch": 6926} {"train_loss": -26.940460205078125, "global_step": 574878, "epoch": 6926} {"train_loss": -27.417652130126953, "global_step": 574879, "epoch": 6926} {"train_loss": -27.3676700592041, "global_step": 574880, "epoch": 6926} {"train_loss": -27.51399803161621, "global_step": 574881, "epoch": 6926} {"train_loss": -27.478540420532227, "global_step": 574882, "epoch": 6926} {"train_loss": -27.732135772705078, "global_step": 574883, "epoch": 6926} {"train_loss": -27.815893173217773, "global_step": 574884, "epoch": 6926} {"train_loss": -27.70682144165039, "global_step": 574885, "epoch": 6926} {"train_loss": -27.485279083251953, "global_step": 574886, "epoch": 6926} {"train_loss": -27.836902618408203, "global_step": 574887, "epoch": 6926} {"train_loss": -27.701766967773438, "global_step": 574888, "epoch": 6926} {"train_loss": -27.494464874267578, "global_step": 574889, "epoch": 6926} {"train_loss": -27.640241622924805, "global_step": 574890, "epoch": 6926} {"train_loss": -28.061904907226562, "global_step": 574891, "epoch": 6926} {"train_loss": -27.645538330078125, "global_step": 574892, "epoch": 6926} {"train_loss": -27.684131622314453, "global_step": 574893, "epoch": 6926} {"train_loss": -27.526235580444336, "global_step": 574894, "epoch": 6926} {"train_loss": -27.717756271362305, "global_step": 574895, "epoch": 6926} {"train_loss": -28.204442977905273, "global_step": 574896, "epoch": 6926} {"train_loss": -28.21306800842285, "global_step": 574897, "epoch": 6926} {"train_loss": -27.923791885375977, "global_step": 574898, "epoch": 6926} {"train_loss": -27.82550621032715, "global_step": 574899, "epoch": 6926} {"train_loss": -27.966028213500977, "global_step": 574900, "epoch": 6926} {"train_loss": -28.15838050842285, "global_step": 574901, "epoch": 6926} {"train_loss": -27.839324951171875, "global_step": 574902, "epoch": 6926} {"train_loss": -27.67475700378418, "global_step": 574903, "epoch": 6926} {"train_loss": -28.071409225463867, "global_step": 574904, "epoch": 6926} {"train_loss": -27.96246337890625, "global_step": 574905, "epoch": 6926} {"train_loss": -27.917682647705078, "global_step": 574906, "epoch": 6926} {"train_loss": -27.66840171813965, "global_step": 574907, "epoch": 6926} {"train_loss": -27.310199737548828, "global_step": 574908, "epoch": 6926} {"train_loss": -28.139591217041016, "global_step": 574909, "epoch": 6926} {"train_loss": -28.19207191467285, "global_step": 574910, "epoch": 6926} {"train_loss": -27.782562255859375, "global_step": 574911, "epoch": 6926} {"train_loss": -27.15679931640625, "global_step": 574912, "epoch": 6926} {"train_loss": -27.13307762145996, "global_step": 574913, "epoch": 6926} {"train_loss": -27.31019401550293, "global_step": 574914, "epoch": 6926} {"train_loss": -27.982685089111328, "global_step": 574915, "epoch": 6926} {"train_loss": -28.16860008239746, "global_step": 574916, "epoch": 6926} {"train_loss": -27.691314697265625, "global_step": 574917, "epoch": 6926} {"train_loss": -27.89735221862793, "global_step": 574918, "epoch": 6926} {"train_loss": -27.93218994140625, "global_step": 574919, "epoch": 6926} {"train_loss": -27.846363067626953, "global_step": 574920, "epoch": 6926} {"train_loss": -27.613773345947266, "global_step": 574921, "epoch": 6926} {"train_loss": -27.68744468688965, "global_step": 574922, "epoch": 6926} {"train_loss": -28.03187370300293, "global_step": 574923, "epoch": 6926} {"train_loss": -28.316747665405273, "global_step": 574924, "epoch": 6926} {"train_loss": -28.074377059936523, "global_step": 574925, "epoch": 6926} {"train_loss": -27.902698516845703, "global_step": 574926, "epoch": 6926} {"train_loss": -27.902973175048828, "global_step": 574927, "epoch": 6926} {"train_loss": -27.75575065612793, "global_step": 574928, "epoch": 6926} {"train_loss": -27.625959396362305, "global_step": 574929, "epoch": 6926} {"train_loss": -28.023351669311523, "global_step": 574930, "epoch": 6926} {"train_loss": -27.851428985595703, "global_step": 574931, "epoch": 6926} {"train_loss": -27.93696403503418, "global_step": 574932, "epoch": 6926} {"train_loss": -27.96531105041504, "global_step": 574933, "epoch": 6926} {"train_loss": -28.05620765686035, "global_step": 574934, "epoch": 6926} {"train_loss": -28.146625518798828, "global_step": 574935, "epoch": 6926} {"train_loss": -27.760318756103516, "global_step": 574936, "epoch": 6926} {"train_loss": -28.161243438720703, "global_step": 574937, "epoch": 6926} {"train_loss": -28.0039119720459, "global_step": 574938, "epoch": 6926} {"train_loss": -28.01535987854004, "global_step": 574939, "epoch": 6926} {"train_loss": -27.611792529921935, "global_step": 574940, "epoch": 6926, "val_loss": 6559877.0} {"train_loss": -27.4462947845459, "global_step": 574941, "epoch": 6927} {"train_loss": -27.360580444335938, "global_step": 574942, "epoch": 6927} {"train_loss": -27.10919761657715, "global_step": 574943, "epoch": 6927} {"train_loss": -27.898075103759766, "global_step": 574944, "epoch": 6927} {"train_loss": -27.593366622924805, "global_step": 574945, "epoch": 6927} {"train_loss": -27.360498428344727, "global_step": 574946, "epoch": 6927} {"train_loss": -27.858922958374023, "global_step": 574947, "epoch": 6927} {"train_loss": -27.7808837890625, "global_step": 574948, "epoch": 6927} {"train_loss": -27.5350284576416, "global_step": 574949, "epoch": 6927} {"train_loss": -27.724027633666992, "global_step": 574950, "epoch": 6927} {"train_loss": -27.78712272644043, "global_step": 574951, "epoch": 6927} {"train_loss": -27.322967529296875, "global_step": 574952, "epoch": 6927} {"train_loss": -27.434890747070312, "global_step": 574953, "epoch": 6927} {"train_loss": -27.52506446838379, "global_step": 574954, "epoch": 6927} {"train_loss": -27.9356746673584, "global_step": 574955, "epoch": 6927} {"train_loss": -27.250730514526367, "global_step": 574956, "epoch": 6927} {"train_loss": -27.65814208984375, "global_step": 574957, "epoch": 6927} {"train_loss": -28.04402732849121, "global_step": 574958, "epoch": 6927} {"train_loss": -27.36286735534668, "global_step": 574959, "epoch": 6927} {"train_loss": -27.63884925842285, "global_step": 574960, "epoch": 6927} {"train_loss": -27.808149337768555, "global_step": 574961, "epoch": 6927} {"train_loss": -27.848142623901367, "global_step": 574962, "epoch": 6927} {"train_loss": -27.605331420898438, "global_step": 574963, "epoch": 6927} {"train_loss": -27.71807289123535, "global_step": 574964, "epoch": 6927} {"train_loss": -27.788724899291992, "global_step": 574965, "epoch": 6927} {"train_loss": -27.877668380737305, "global_step": 574966, "epoch": 6927} {"train_loss": -28.051666259765625, "global_step": 574967, "epoch": 6927} {"train_loss": -27.694211959838867, "global_step": 574968, "epoch": 6927} {"train_loss": -27.489917755126953, "global_step": 574969, "epoch": 6927} {"train_loss": -27.70257568359375, "global_step": 574970, "epoch": 6927} {"train_loss": -28.073205947875977, "global_step": 574971, "epoch": 6927} {"train_loss": -27.791431427001953, "global_step": 574972, "epoch": 6927} {"train_loss": -28.222204208374023, "global_step": 574973, "epoch": 6927} {"train_loss": -27.531274795532227, "global_step": 574974, "epoch": 6927} {"train_loss": -27.743255615234375, "global_step": 574975, "epoch": 6927} {"train_loss": -28.01726722717285, "global_step": 574976, "epoch": 6927} {"train_loss": -27.97281837463379, "global_step": 574977, "epoch": 6927} {"train_loss": -28.0562686920166, "global_step": 574978, "epoch": 6927} {"train_loss": -27.6339168548584, "global_step": 574979, "epoch": 6927} {"train_loss": -27.95867919921875, "global_step": 574980, "epoch": 6927} {"train_loss": -27.606494903564453, "global_step": 574981, "epoch": 6927} {"train_loss": -27.852994918823242, "global_step": 574982, "epoch": 6927} {"train_loss": -28.1906795501709, "global_step": 574983, "epoch": 6927} {"train_loss": -27.94904136657715, "global_step": 574984, "epoch": 6927} {"train_loss": -28.233869552612305, "global_step": 574985, "epoch": 6927} {"train_loss": -28.270544052124023, "global_step": 574986, "epoch": 6927} {"train_loss": -28.217670440673828, "global_step": 574987, "epoch": 6927} {"train_loss": -27.877721786499023, "global_step": 574988, "epoch": 6927} {"train_loss": -27.73700523376465, "global_step": 574989, "epoch": 6927} {"train_loss": -27.452056884765625, "global_step": 574990, "epoch": 6927} {"train_loss": -26.84663200378418, "global_step": 574991, "epoch": 6927} {"train_loss": -26.18934440612793, "global_step": 574992, "epoch": 6927} {"train_loss": -25.974035263061523, "global_step": 574993, "epoch": 6927} {"train_loss": -27.775394439697266, "global_step": 574994, "epoch": 6927} {"train_loss": -27.579736709594727, "global_step": 574995, "epoch": 6927} {"train_loss": -27.54070472717285, "global_step": 574996, "epoch": 6927} {"train_loss": -27.988264083862305, "global_step": 574997, "epoch": 6927} {"train_loss": -27.000364303588867, "global_step": 574998, "epoch": 6927} {"train_loss": -27.87308120727539, "global_step": 574999, "epoch": 6927} {"train_loss": -27.52288246154785, "global_step": 575000, "epoch": 6927} {"train_loss": -27.8842830657959, "global_step": 575001, "epoch": 6927} {"train_loss": -27.415592193603516, "global_step": 575002, "epoch": 6927} {"train_loss": -27.522809982299805, "global_step": 575003, "epoch": 6927} {"train_loss": -27.724334716796875, "global_step": 575004, "epoch": 6927} {"train_loss": -27.840604782104492, "global_step": 575005, "epoch": 6927} {"train_loss": -27.559757232666016, "global_step": 575006, "epoch": 6927} {"train_loss": -27.643844604492188, "global_step": 575007, "epoch": 6927} {"train_loss": -27.810590744018555, "global_step": 575008, "epoch": 6927} {"train_loss": -27.62855339050293, "global_step": 575009, "epoch": 6927} {"train_loss": -28.047943115234375, "global_step": 575010, "epoch": 6927} {"train_loss": -27.622175216674805, "global_step": 575011, "epoch": 6927} {"train_loss": -27.993408203125, "global_step": 575012, "epoch": 6927} {"train_loss": -28.047245025634766, "global_step": 575013, "epoch": 6927} {"train_loss": -27.626245498657227, "global_step": 575014, "epoch": 6927} {"train_loss": -27.72523307800293, "global_step": 575015, "epoch": 6927} {"train_loss": -27.70551872253418, "global_step": 575016, "epoch": 6927} {"train_loss": -27.540796279907227, "global_step": 575017, "epoch": 6927} {"train_loss": -27.83188247680664, "global_step": 575018, "epoch": 6927} {"train_loss": -28.04591941833496, "global_step": 575019, "epoch": 6927} {"train_loss": -27.864362716674805, "global_step": 575020, "epoch": 6927} {"train_loss": -28.083332061767578, "global_step": 575021, "epoch": 6927} {"train_loss": -27.500289916992188, "global_step": 575022, "epoch": 6927} {"train_loss": -27.689279694155037, "global_step": 575023, "epoch": 6927, "val_loss": 6626582.5} {"train_loss": -27.567493438720703, "global_step": 575024, "epoch": 6928} {"train_loss": -26.81928062438965, "global_step": 575025, "epoch": 6928} {"train_loss": -27.3055477142334, "global_step": 575026, "epoch": 6928} {"train_loss": -27.104949951171875, "global_step": 575027, "epoch": 6928} {"train_loss": -27.138904571533203, "global_step": 575028, "epoch": 6928} {"train_loss": -27.45985221862793, "global_step": 575029, "epoch": 6928} {"train_loss": -27.52203941345215, "global_step": 575030, "epoch": 6928} {"train_loss": -27.332380294799805, "global_step": 575031, "epoch": 6928} {"train_loss": -27.495412826538086, "global_step": 575032, "epoch": 6928} {"train_loss": -27.207929611206055, "global_step": 575033, "epoch": 6928} {"train_loss": -27.57314109802246, "global_step": 575034, "epoch": 6928} {"train_loss": -27.48638916015625, "global_step": 575035, "epoch": 6928} {"train_loss": -27.58049964904785, "global_step": 575036, "epoch": 6928} {"train_loss": -27.399765014648438, "global_step": 575037, "epoch": 6928} {"train_loss": -27.233915328979492, "global_step": 575038, "epoch": 6928} {"train_loss": -27.891666412353516, "global_step": 575039, "epoch": 6928} {"train_loss": -27.70619010925293, "global_step": 575040, "epoch": 6928} {"train_loss": -27.46123695373535, "global_step": 575041, "epoch": 6928} {"train_loss": -27.72930908203125, "global_step": 575042, "epoch": 6928} {"train_loss": -27.5560302734375, "global_step": 575043, "epoch": 6928} {"train_loss": -27.6811580657959, "global_step": 575044, "epoch": 6928} {"train_loss": -27.703840255737305, "global_step": 575045, "epoch": 6928} {"train_loss": -27.642770767211914, "global_step": 575046, "epoch": 6928} {"train_loss": -27.769880294799805, "global_step": 575047, "epoch": 6928} {"train_loss": -27.673200607299805, "global_step": 575048, "epoch": 6928} {"train_loss": -27.38943862915039, "global_step": 575049, "epoch": 6928} {"train_loss": -27.5378475189209, "global_step": 575050, "epoch": 6928} {"train_loss": -27.88019371032715, "global_step": 575051, "epoch": 6928} {"train_loss": -27.963245391845703, "global_step": 575052, "epoch": 6928} {"train_loss": -27.570829391479492, "global_step": 575053, "epoch": 6928} {"train_loss": -27.756031036376953, "global_step": 575054, "epoch": 6928} {"train_loss": -28.35565757751465, "global_step": 575055, "epoch": 6928} {"train_loss": -27.795373916625977, "global_step": 575056, "epoch": 6928} {"train_loss": -27.959897994995117, "global_step": 575057, "epoch": 6928} {"train_loss": -27.895645141601562, "global_step": 575058, "epoch": 6928} {"train_loss": -28.105316162109375, "global_step": 575059, "epoch": 6928} {"train_loss": -27.88606071472168, "global_step": 575060, "epoch": 6928} {"train_loss": -27.797815322875977, "global_step": 575061, "epoch": 6928} {"train_loss": -27.683597564697266, "global_step": 575062, "epoch": 6928} {"train_loss": -27.50412368774414, "global_step": 575063, "epoch": 6928} {"train_loss": -28.365198135375977, "global_step": 575064, "epoch": 6928} {"train_loss": -28.0234432220459, "global_step": 575065, "epoch": 6928} {"train_loss": -27.9588623046875, "global_step": 575066, "epoch": 6928} {"train_loss": -28.1794376373291, "global_step": 575067, "epoch": 6928} {"train_loss": -27.992780685424805, "global_step": 575068, "epoch": 6928} {"train_loss": -27.626188278198242, "global_step": 575069, "epoch": 6928} {"train_loss": -28.055322647094727, "global_step": 575070, "epoch": 6928} {"train_loss": -27.961694717407227, "global_step": 575071, "epoch": 6928} {"train_loss": -27.81007194519043, "global_step": 575072, "epoch": 6928} {"train_loss": -27.84197425842285, "global_step": 575073, "epoch": 6928} {"train_loss": -27.740924835205078, "global_step": 575074, "epoch": 6928} {"train_loss": -27.52814292907715, "global_step": 575075, "epoch": 6928} {"train_loss": -28.0151424407959, "global_step": 575076, "epoch": 6928} {"train_loss": -27.914167404174805, "global_step": 575077, "epoch": 6928} {"train_loss": -28.17426872253418, "global_step": 575078, "epoch": 6928} {"train_loss": -28.24985122680664, "global_step": 575079, "epoch": 6928} {"train_loss": -27.926197052001953, "global_step": 575080, "epoch": 6928} {"train_loss": -27.91248893737793, "global_step": 575081, "epoch": 6928} {"train_loss": -28.02865982055664, "global_step": 575082, "epoch": 6928} {"train_loss": -28.08949851989746, "global_step": 575083, "epoch": 6928} {"train_loss": -28.26859474182129, "global_step": 575084, "epoch": 6928} {"train_loss": -28.2865047454834, "global_step": 575085, "epoch": 6928} {"train_loss": -27.922149658203125, "global_step": 575086, "epoch": 6928} {"train_loss": -28.400510787963867, "global_step": 575087, "epoch": 6928} {"train_loss": -28.008020401000977, "global_step": 575088, "epoch": 6928} {"train_loss": -28.10407829284668, "global_step": 575089, "epoch": 6928} {"train_loss": -28.1036319732666, "global_step": 575090, "epoch": 6928} {"train_loss": -27.668317794799805, "global_step": 575091, "epoch": 6928} {"train_loss": -27.873193740844727, "global_step": 575092, "epoch": 6928} {"train_loss": -28.027597427368164, "global_step": 575093, "epoch": 6928} {"train_loss": -27.928197860717773, "global_step": 575094, "epoch": 6928} {"train_loss": -27.9241886138916, "global_step": 575095, "epoch": 6928} {"train_loss": -27.927473068237305, "global_step": 575096, "epoch": 6928} {"train_loss": -28.257726669311523, "global_step": 575097, "epoch": 6928} {"train_loss": -27.91254997253418, "global_step": 575098, "epoch": 6928} {"train_loss": -27.732620239257812, "global_step": 575099, "epoch": 6928} {"train_loss": -28.195520401000977, "global_step": 575100, "epoch": 6928} {"train_loss": -28.575759887695312, "global_step": 575101, "epoch": 6928} {"train_loss": -27.471521377563477, "global_step": 575102, "epoch": 6928} {"train_loss": -27.791173934936523, "global_step": 575103, "epoch": 6928} {"train_loss": -27.831161499023438, "global_step": 575104, "epoch": 6928} {"train_loss": -27.8944091796875, "global_step": 575105, "epoch": 6928} {"train_loss": -27.8097926679864, "global_step": 575106, "epoch": 6928, "val_loss": 6562741.0} {"train_loss": -27.09329605102539, "global_step": 575107, "epoch": 6929} {"train_loss": -27.266279220581055, "global_step": 575108, "epoch": 6929} {"train_loss": -27.39338493347168, "global_step": 575109, "epoch": 6929} {"train_loss": -26.920425415039062, "global_step": 575110, "epoch": 6929} {"train_loss": -26.62664794921875, "global_step": 575111, "epoch": 6929} {"train_loss": -26.848388671875, "global_step": 575112, "epoch": 6929} {"train_loss": -27.22308921813965, "global_step": 575113, "epoch": 6929} {"train_loss": -26.78761100769043, "global_step": 575114, "epoch": 6929} {"train_loss": -27.11252784729004, "global_step": 575115, "epoch": 6929} {"train_loss": -27.360599517822266, "global_step": 575116, "epoch": 6929} {"train_loss": -26.795495986938477, "global_step": 575117, "epoch": 6929} {"train_loss": -27.3294734954834, "global_step": 575118, "epoch": 6929} {"train_loss": -27.66400146484375, "global_step": 575119, "epoch": 6929} {"train_loss": -27.111536026000977, "global_step": 575120, "epoch": 6929} {"train_loss": -27.1412353515625, "global_step": 575121, "epoch": 6929} {"train_loss": -27.31678581237793, "global_step": 575122, "epoch": 6929} {"train_loss": -27.506128311157227, "global_step": 575123, "epoch": 6929} {"train_loss": -27.73504638671875, "global_step": 575124, "epoch": 6929} {"train_loss": -27.44439125061035, "global_step": 575125, "epoch": 6929} {"train_loss": -27.5476016998291, "global_step": 575126, "epoch": 6929} {"train_loss": -27.898197174072266, "global_step": 575127, "epoch": 6929} {"train_loss": -27.880857467651367, "global_step": 575128, "epoch": 6929} {"train_loss": -27.676666259765625, "global_step": 575129, "epoch": 6929} {"train_loss": -27.764434814453125, "global_step": 575130, "epoch": 6929} {"train_loss": -27.547760009765625, "global_step": 575131, "epoch": 6929} {"train_loss": -27.8842830657959, "global_step": 575132, "epoch": 6929} {"train_loss": -27.737720489501953, "global_step": 575133, "epoch": 6929} {"train_loss": -28.347875595092773, "global_step": 575134, "epoch": 6929} {"train_loss": -27.806119918823242, "global_step": 575135, "epoch": 6929} {"train_loss": -27.61200523376465, "global_step": 575136, "epoch": 6929} {"train_loss": -27.699216842651367, "global_step": 575137, "epoch": 6929} {"train_loss": -27.636585235595703, "global_step": 575138, "epoch": 6929} {"train_loss": -27.51600456237793, "global_step": 575139, "epoch": 6929} {"train_loss": -27.62885093688965, "global_step": 575140, "epoch": 6929} {"train_loss": -27.901203155517578, "global_step": 575141, "epoch": 6929} {"train_loss": -28.147235870361328, "global_step": 575142, "epoch": 6929} {"train_loss": -27.854211807250977, "global_step": 575143, "epoch": 6929} {"train_loss": -28.03375244140625, "global_step": 575144, "epoch": 6929} {"train_loss": -27.7723388671875, "global_step": 575145, "epoch": 6929} {"train_loss": -28.18601417541504, "global_step": 575146, "epoch": 6929} {"train_loss": -28.078266143798828, "global_step": 575147, "epoch": 6929} {"train_loss": -28.040159225463867, "global_step": 575148, "epoch": 6929} {"train_loss": -27.824377059936523, "global_step": 575149, "epoch": 6929} {"train_loss": -27.9865665435791, "global_step": 575150, "epoch": 6929} {"train_loss": -28.047595977783203, "global_step": 575151, "epoch": 6929} {"train_loss": -28.14461326599121, "global_step": 575152, "epoch": 6929} {"train_loss": -27.74957847595215, "global_step": 575153, "epoch": 6929} {"train_loss": -27.972412109375, "global_step": 575154, "epoch": 6929} {"train_loss": -28.09058952331543, "global_step": 575155, "epoch": 6929} {"train_loss": -27.658523559570312, "global_step": 575156, "epoch": 6929} {"train_loss": -28.151105880737305, "global_step": 575157, "epoch": 6929} {"train_loss": -27.809864044189453, "global_step": 575158, "epoch": 6929} {"train_loss": -27.827726364135742, "global_step": 575159, "epoch": 6929} {"train_loss": -28.154926300048828, "global_step": 575160, "epoch": 6929} {"train_loss": -28.049848556518555, "global_step": 575161, "epoch": 6929} {"train_loss": -27.899250030517578, "global_step": 575162, "epoch": 6929} {"train_loss": -27.871417999267578, "global_step": 575163, "epoch": 6929} {"train_loss": -28.34479331970215, "global_step": 575164, "epoch": 6929} {"train_loss": -28.029706954956055, "global_step": 575165, "epoch": 6929} {"train_loss": -27.98542594909668, "global_step": 575166, "epoch": 6929} {"train_loss": -28.466657638549805, "global_step": 575167, "epoch": 6929} {"train_loss": -28.158288955688477, "global_step": 575168, "epoch": 6929} {"train_loss": -28.146728515625, "global_step": 575169, "epoch": 6929} {"train_loss": -27.836669921875, "global_step": 575170, "epoch": 6929} {"train_loss": -27.906213760375977, "global_step": 575171, "epoch": 6929} {"train_loss": -28.3060302734375, "global_step": 575172, "epoch": 6929} {"train_loss": -28.080825805664062, "global_step": 575173, "epoch": 6929} {"train_loss": -28.054351806640625, "global_step": 575174, "epoch": 6929} {"train_loss": -27.894250869750977, "global_step": 575175, "epoch": 6929} {"train_loss": -28.0153865814209, "global_step": 575176, "epoch": 6929} {"train_loss": -27.63803482055664, "global_step": 575177, "epoch": 6929} {"train_loss": -27.70975685119629, "global_step": 575178, "epoch": 6929} {"train_loss": -27.672332763671875, "global_step": 575179, "epoch": 6929} {"train_loss": -28.14573097229004, "global_step": 575180, "epoch": 6929} {"train_loss": -27.660663604736328, "global_step": 575181, "epoch": 6929} {"train_loss": -27.874114990234375, "global_step": 575182, "epoch": 6929} {"train_loss": -27.7320613861084, "global_step": 575183, "epoch": 6929} {"train_loss": -27.740034103393555, "global_step": 575184, "epoch": 6929} {"train_loss": -27.915197372436523, "global_step": 575185, "epoch": 6929} {"train_loss": -27.788095474243164, "global_step": 575186, "epoch": 6929} {"train_loss": -27.758533477783203, "global_step": 575187, "epoch": 6929} {"train_loss": -28.025012969970703, "global_step": 575188, "epoch": 6929} {"train_loss": -27.74277402119464, "global_step": 575189, "epoch": 6929, "val_loss": 6612017.5} {"train_loss": -26.81707191467285, "global_step": 575190, "epoch": 6930} {"train_loss": -26.80922508239746, "global_step": 575191, "epoch": 6930} {"train_loss": -26.772979736328125, "global_step": 575192, "epoch": 6930} {"train_loss": -27.229461669921875, "global_step": 575193, "epoch": 6930} {"train_loss": -27.201648712158203, "global_step": 575194, "epoch": 6930} {"train_loss": -27.361968994140625, "global_step": 575195, "epoch": 6930} {"train_loss": -27.30164909362793, "global_step": 575196, "epoch": 6930} {"train_loss": -27.114240646362305, "global_step": 575197, "epoch": 6930} {"train_loss": -27.541738510131836, "global_step": 575198, "epoch": 6930} {"train_loss": -27.098020553588867, "global_step": 575199, "epoch": 6930} {"train_loss": -27.00591468811035, "global_step": 575200, "epoch": 6930} {"train_loss": -27.20676612854004, "global_step": 575201, "epoch": 6930} {"train_loss": -27.485416412353516, "global_step": 575202, "epoch": 6930} {"train_loss": -27.123538970947266, "global_step": 575203, "epoch": 6930} {"train_loss": -27.22934341430664, "global_step": 575204, "epoch": 6930} {"train_loss": -27.414968490600586, "global_step": 575205, "epoch": 6930} {"train_loss": -27.4722843170166, "global_step": 575206, "epoch": 6930} {"train_loss": -27.479902267456055, "global_step": 575207, "epoch": 6930} {"train_loss": -27.556415557861328, "global_step": 575208, "epoch": 6930} {"train_loss": -27.408422470092773, "global_step": 575209, "epoch": 6930} {"train_loss": -27.034622192382812, "global_step": 575210, "epoch": 6930} {"train_loss": -27.379749298095703, "global_step": 575211, "epoch": 6930} {"train_loss": -27.291513442993164, "global_step": 575212, "epoch": 6930} {"train_loss": -27.432968139648438, "global_step": 575213, "epoch": 6930} {"train_loss": -27.470922470092773, "global_step": 575214, "epoch": 6930} {"train_loss": -27.37359619140625, "global_step": 575215, "epoch": 6930} {"train_loss": -27.383596420288086, "global_step": 575216, "epoch": 6930} {"train_loss": -27.579999923706055, "global_step": 575217, "epoch": 6930} {"train_loss": -27.719736099243164, "global_step": 575218, "epoch": 6930} {"train_loss": -27.49116325378418, "global_step": 575219, "epoch": 6930} {"train_loss": -27.126535415649414, "global_step": 575220, "epoch": 6930} {"train_loss": -27.7668514251709, "global_step": 575221, "epoch": 6930} {"train_loss": -27.843006134033203, "global_step": 575222, "epoch": 6930} {"train_loss": -27.522302627563477, "global_step": 575223, "epoch": 6930} {"train_loss": -27.90204429626465, "global_step": 575224, "epoch": 6930} {"train_loss": -27.50815200805664, "global_step": 575225, "epoch": 6930} {"train_loss": -27.8277645111084, "global_step": 575226, "epoch": 6930} {"train_loss": -27.6705379486084, "global_step": 575227, "epoch": 6930} {"train_loss": -27.71904945373535, "global_step": 575228, "epoch": 6930} {"train_loss": -27.685073852539062, "global_step": 575229, "epoch": 6930} {"train_loss": -27.6627254486084, "global_step": 575230, "epoch": 6930} {"train_loss": -27.587970733642578, "global_step": 575231, "epoch": 6930} {"train_loss": -27.512182235717773, "global_step": 575232, "epoch": 6930} {"train_loss": -27.92926025390625, "global_step": 575233, "epoch": 6930} {"train_loss": -28.31414222717285, "global_step": 575234, "epoch": 6930} {"train_loss": -27.550458908081055, "global_step": 575235, "epoch": 6930} {"train_loss": -28.0306453704834, "global_step": 575236, "epoch": 6930} {"train_loss": -27.542957305908203, "global_step": 575237, "epoch": 6930} {"train_loss": -28.362537384033203, "global_step": 575238, "epoch": 6930} {"train_loss": -27.89740562438965, "global_step": 575239, "epoch": 6930} {"train_loss": -28.04078483581543, "global_step": 575240, "epoch": 6930} {"train_loss": -28.1986083984375, "global_step": 575241, "epoch": 6930} {"train_loss": -27.97494888305664, "global_step": 575242, "epoch": 6930} {"train_loss": -28.194982528686523, "global_step": 575243, "epoch": 6930} {"train_loss": -27.79123306274414, "global_step": 575244, "epoch": 6930} {"train_loss": -28.17340660095215, "global_step": 575245, "epoch": 6930} {"train_loss": -28.010080337524414, "global_step": 575246, "epoch": 6930} {"train_loss": -28.544897079467773, "global_step": 575247, "epoch": 6930} {"train_loss": -28.1757869720459, "global_step": 575248, "epoch": 6930} {"train_loss": -28.070972442626953, "global_step": 575249, "epoch": 6930} {"train_loss": -28.246118545532227, "global_step": 575250, "epoch": 6930} {"train_loss": -27.834802627563477, "global_step": 575251, "epoch": 6930} {"train_loss": -28.137765884399414, "global_step": 575252, "epoch": 6930} {"train_loss": -28.376379013061523, "global_step": 575253, "epoch": 6930} {"train_loss": -28.168643951416016, "global_step": 575254, "epoch": 6930} {"train_loss": -27.91547966003418, "global_step": 575255, "epoch": 6930} {"train_loss": -27.991622924804688, "global_step": 575256, "epoch": 6930} {"train_loss": -27.75370216369629, "global_step": 575257, "epoch": 6930} {"train_loss": -27.981176376342773, "global_step": 575258, "epoch": 6930} {"train_loss": -27.906970977783203, "global_step": 575259, "epoch": 6930} {"train_loss": -28.1722354888916, "global_step": 575260, "epoch": 6930} {"train_loss": -28.092947006225586, "global_step": 575261, "epoch": 6930} {"train_loss": -27.957340240478516, "global_step": 575262, "epoch": 6930} {"train_loss": -27.909198760986328, "global_step": 575263, "epoch": 6930} {"train_loss": -27.97409439086914, "global_step": 575264, "epoch": 6930} {"train_loss": -27.952255249023438, "global_step": 575265, "epoch": 6930} {"train_loss": -27.934492111206055, "global_step": 575266, "epoch": 6930} {"train_loss": -27.90534782409668, "global_step": 575267, "epoch": 6930} {"train_loss": -27.097150802612305, "global_step": 575268, "epoch": 6930} {"train_loss": -26.982221603393555, "global_step": 575269, "epoch": 6930} {"train_loss": -27.446569442749023, "global_step": 575270, "epoch": 6930} {"train_loss": -27.888471603393555, "global_step": 575271, "epoch": 6930} {"train_loss": -27.66227264863899, "global_step": 575272, "epoch": 6930, "val_loss": 6595674.0} {"train_loss": -23.967458724975586, "global_step": 575273, "epoch": 6931} {"train_loss": -26.102371215820312, "global_step": 575274, "epoch": 6931} {"train_loss": -26.446680068969727, "global_step": 575275, "epoch": 6931} {"train_loss": -25.552427291870117, "global_step": 575276, "epoch": 6931} {"train_loss": -26.20252799987793, "global_step": 575277, "epoch": 6931} {"train_loss": -25.935749053955078, "global_step": 575278, "epoch": 6931} {"train_loss": -26.579679489135742, "global_step": 575279, "epoch": 6931} {"train_loss": -26.412565231323242, "global_step": 575280, "epoch": 6931} {"train_loss": -26.806594848632812, "global_step": 575281, "epoch": 6931} {"train_loss": -26.82696533203125, "global_step": 575282, "epoch": 6931} {"train_loss": -26.658735275268555, "global_step": 575283, "epoch": 6931} {"train_loss": -26.42317008972168, "global_step": 575284, "epoch": 6931} {"train_loss": -27.0316219329834, "global_step": 575285, "epoch": 6931} {"train_loss": -26.6002140045166, "global_step": 575286, "epoch": 6931} {"train_loss": -26.85426902770996, "global_step": 575287, "epoch": 6931} {"train_loss": -26.637128829956055, "global_step": 575288, "epoch": 6931} {"train_loss": -27.0151424407959, "global_step": 575289, "epoch": 6931} {"train_loss": -27.285919189453125, "global_step": 575290, "epoch": 6931} {"train_loss": -27.316944122314453, "global_step": 575291, "epoch": 6931} {"train_loss": -27.073883056640625, "global_step": 575292, "epoch": 6931} {"train_loss": -27.602462768554688, "global_step": 575293, "epoch": 6931} {"train_loss": -27.0363826751709, "global_step": 575294, "epoch": 6931} {"train_loss": -27.39680290222168, "global_step": 575295, "epoch": 6931} {"train_loss": -27.141260147094727, "global_step": 575296, "epoch": 6931} {"train_loss": -27.702417373657227, "global_step": 575297, "epoch": 6931} {"train_loss": -27.504724502563477, "global_step": 575298, "epoch": 6931} {"train_loss": -27.55517578125, "global_step": 575299, "epoch": 6931} {"train_loss": -27.5037784576416, "global_step": 575300, "epoch": 6931} {"train_loss": -27.427688598632812, "global_step": 575301, "epoch": 6931} {"train_loss": -27.595829010009766, "global_step": 575302, "epoch": 6931} {"train_loss": -27.78797721862793, "global_step": 575303, "epoch": 6931} {"train_loss": -27.551137924194336, "global_step": 575304, "epoch": 6931} {"train_loss": -27.381818771362305, "global_step": 575305, "epoch": 6931} {"train_loss": -27.70880699157715, "global_step": 575306, "epoch": 6931} {"train_loss": -27.72096061706543, "global_step": 575307, "epoch": 6931} {"train_loss": -27.546003341674805, "global_step": 575308, "epoch": 6931} {"train_loss": -27.414884567260742, "global_step": 575309, "epoch": 6931} {"train_loss": -27.62410545349121, "global_step": 575310, "epoch": 6931} {"train_loss": -27.63203239440918, "global_step": 575311, "epoch": 6931} {"train_loss": -27.789215087890625, "global_step": 575312, "epoch": 6931} {"train_loss": -28.143695831298828, "global_step": 575313, "epoch": 6931} {"train_loss": -27.814443588256836, "global_step": 575314, "epoch": 6931} {"train_loss": -27.677661895751953, "global_step": 575315, "epoch": 6931} {"train_loss": -28.025815963745117, "global_step": 575316, "epoch": 6931} {"train_loss": -28.008743286132812, "global_step": 575317, "epoch": 6931} {"train_loss": -27.80560302734375, "global_step": 575318, "epoch": 6931} {"train_loss": -28.191299438476562, "global_step": 575319, "epoch": 6931} {"train_loss": -27.871219635009766, "global_step": 575320, "epoch": 6931} {"train_loss": -27.498382568359375, "global_step": 575321, "epoch": 6931} {"train_loss": -28.10135841369629, "global_step": 575322, "epoch": 6931} {"train_loss": -27.947967529296875, "global_step": 575323, "epoch": 6931} {"train_loss": -28.161497116088867, "global_step": 575324, "epoch": 6931} {"train_loss": -28.34441566467285, "global_step": 575325, "epoch": 6931} {"train_loss": -28.0247859954834, "global_step": 575326, "epoch": 6931} {"train_loss": -27.957233428955078, "global_step": 575327, "epoch": 6931} {"train_loss": -27.917612075805664, "global_step": 575328, "epoch": 6931} {"train_loss": -28.007373809814453, "global_step": 575329, "epoch": 6931} {"train_loss": -28.24677848815918, "global_step": 575330, "epoch": 6931} {"train_loss": -28.365631103515625, "global_step": 575331, "epoch": 6931} {"train_loss": -28.11321449279785, "global_step": 575332, "epoch": 6931} {"train_loss": -28.276227951049805, "global_step": 575333, "epoch": 6931} {"train_loss": -28.313444137573242, "global_step": 575334, "epoch": 6931} {"train_loss": -27.989973068237305, "global_step": 575335, "epoch": 6931} {"train_loss": -28.02292823791504, "global_step": 575336, "epoch": 6931} {"train_loss": -27.569128036499023, "global_step": 575337, "epoch": 6931} {"train_loss": -27.13004493713379, "global_step": 575338, "epoch": 6931} {"train_loss": -27.704254150390625, "global_step": 575339, "epoch": 6931} {"train_loss": -27.65570640563965, "global_step": 575340, "epoch": 6931} {"train_loss": -27.9498348236084, "global_step": 575341, "epoch": 6931} {"train_loss": -28.13197898864746, "global_step": 575342, "epoch": 6931} {"train_loss": -28.257831573486328, "global_step": 575343, "epoch": 6931} {"train_loss": -27.973392486572266, "global_step": 575344, "epoch": 6931} {"train_loss": -27.6855525970459, "global_step": 575345, "epoch": 6931} {"train_loss": -27.5655460357666, "global_step": 575346, "epoch": 6931} {"train_loss": -27.950693130493164, "global_step": 575347, "epoch": 6931} {"train_loss": -27.62952995300293, "global_step": 575348, "epoch": 6931} {"train_loss": -27.6702880859375, "global_step": 575349, "epoch": 6931} {"train_loss": -28.04218101501465, "global_step": 575350, "epoch": 6931} {"train_loss": -27.8456974029541, "global_step": 575351, "epoch": 6931} {"train_loss": -27.823596954345703, "global_step": 575352, "epoch": 6931} {"train_loss": -27.965320587158203, "global_step": 575353, "epoch": 6931} {"train_loss": -27.630720138549805, "global_step": 575354, "epoch": 6931} {"train_loss": -27.488652838281837, "global_step": 575355, "epoch": 6931, "val_loss": 6491265.0} {"train_loss": -27.36762046813965, "global_step": 575356, "epoch": 6932} {"train_loss": -27.548084259033203, "global_step": 575357, "epoch": 6932} {"train_loss": -27.619918823242188, "global_step": 575358, "epoch": 6932} {"train_loss": -27.62396812438965, "global_step": 575359, "epoch": 6932} {"train_loss": -27.86017417907715, "global_step": 575360, "epoch": 6932} {"train_loss": -28.068689346313477, "global_step": 575361, "epoch": 6932} {"train_loss": -27.94873046875, "global_step": 575362, "epoch": 6932} {"train_loss": -27.83961296081543, "global_step": 575363, "epoch": 6932} {"train_loss": -27.61553955078125, "global_step": 575364, "epoch": 6932} {"train_loss": -28.122461318969727, "global_step": 575365, "epoch": 6932} {"train_loss": -27.986249923706055, "global_step": 575366, "epoch": 6932} {"train_loss": -27.656370162963867, "global_step": 575367, "epoch": 6932} {"train_loss": -27.6649112701416, "global_step": 575368, "epoch": 6932} {"train_loss": -27.912464141845703, "global_step": 575369, "epoch": 6932} {"train_loss": -28.041357040405273, "global_step": 575370, "epoch": 6932} {"train_loss": -27.696216583251953, "global_step": 575371, "epoch": 6932} {"train_loss": -27.844324111938477, "global_step": 575372, "epoch": 6932} {"train_loss": -27.876861572265625, "global_step": 575373, "epoch": 6932} {"train_loss": -28.273563385009766, "global_step": 575374, "epoch": 6932} {"train_loss": -27.679523468017578, "global_step": 575375, "epoch": 6932} {"train_loss": -27.6938533782959, "global_step": 575376, "epoch": 6932} {"train_loss": -28.04798698425293, "global_step": 575377, "epoch": 6932} {"train_loss": -27.808551788330078, "global_step": 575378, "epoch": 6932} {"train_loss": -27.691003799438477, "global_step": 575379, "epoch": 6932} {"train_loss": -27.567331314086914, "global_step": 575380, "epoch": 6932} {"train_loss": -28.293415069580078, "global_step": 575381, "epoch": 6932} {"train_loss": -27.976551055908203, "global_step": 575382, "epoch": 6932} {"train_loss": -27.9671630859375, "global_step": 575383, "epoch": 6932} {"train_loss": -28.1424560546875, "global_step": 575384, "epoch": 6932} {"train_loss": -27.750349044799805, "global_step": 575385, "epoch": 6932} {"train_loss": -28.390405654907227, "global_step": 575386, "epoch": 6932} {"train_loss": -28.404376983642578, "global_step": 575387, "epoch": 6932} {"train_loss": -28.1788330078125, "global_step": 575388, "epoch": 6932} {"train_loss": -27.763931274414062, "global_step": 575389, "epoch": 6932} {"train_loss": -27.81617546081543, "global_step": 575390, "epoch": 6932} {"train_loss": -27.726200103759766, "global_step": 575391, "epoch": 6932} {"train_loss": -27.649036407470703, "global_step": 575392, "epoch": 6932} {"train_loss": -27.777196884155273, "global_step": 575393, "epoch": 6932} {"train_loss": -27.791227340698242, "global_step": 575394, "epoch": 6932} {"train_loss": -28.123533248901367, "global_step": 575395, "epoch": 6932} {"train_loss": -27.536619186401367, "global_step": 575396, "epoch": 6932} {"train_loss": -27.77583122253418, "global_step": 575397, "epoch": 6932} {"train_loss": -28.043455123901367, "global_step": 575398, "epoch": 6932} {"train_loss": -27.827850341796875, "global_step": 575399, "epoch": 6932} {"train_loss": -28.083465576171875, "global_step": 575400, "epoch": 6932} {"train_loss": -27.99104881286621, "global_step": 575401, "epoch": 6932} {"train_loss": -27.868371963500977, "global_step": 575402, "epoch": 6932} {"train_loss": -27.864816665649414, "global_step": 575403, "epoch": 6932} {"train_loss": -27.8228702545166, "global_step": 575404, "epoch": 6932} {"train_loss": -28.022008895874023, "global_step": 575405, "epoch": 6932} {"train_loss": -27.99348258972168, "global_step": 575406, "epoch": 6932} {"train_loss": -27.948627471923828, "global_step": 575407, "epoch": 6932} {"train_loss": -28.271451950073242, "global_step": 575408, "epoch": 6932} {"train_loss": -27.77406120300293, "global_step": 575409, "epoch": 6932} {"train_loss": -28.050189971923828, "global_step": 575410, "epoch": 6932} {"train_loss": -28.157196044921875, "global_step": 575411, "epoch": 6932} {"train_loss": -27.63507652282715, "global_step": 575412, "epoch": 6932} {"train_loss": -27.94465446472168, "global_step": 575413, "epoch": 6932} {"train_loss": -27.61749839782715, "global_step": 575414, "epoch": 6932} {"train_loss": -27.64912986755371, "global_step": 575415, "epoch": 6932} {"train_loss": -27.84137535095215, "global_step": 575416, "epoch": 6932} {"train_loss": -28.04292106628418, "global_step": 575417, "epoch": 6932} {"train_loss": -28.021738052368164, "global_step": 575418, "epoch": 6932} {"train_loss": -28.4708194732666, "global_step": 575419, "epoch": 6932} {"train_loss": -27.841724395751953, "global_step": 575420, "epoch": 6932} {"train_loss": -27.185667037963867, "global_step": 575421, "epoch": 6932} {"train_loss": -27.28436851501465, "global_step": 575422, "epoch": 6932} {"train_loss": -28.429784774780273, "global_step": 575423, "epoch": 6932} {"train_loss": -27.937597274780273, "global_step": 575424, "epoch": 6932} {"train_loss": -27.8082218170166, "global_step": 575425, "epoch": 6932} {"train_loss": -28.12885093688965, "global_step": 575426, "epoch": 6932} {"train_loss": -27.752599716186523, "global_step": 575427, "epoch": 6932} {"train_loss": -27.719161987304688, "global_step": 575428, "epoch": 6932} {"train_loss": -27.660999298095703, "global_step": 575429, "epoch": 6932} {"train_loss": -27.937835693359375, "global_step": 575430, "epoch": 6932} {"train_loss": -27.86602210998535, "global_step": 575431, "epoch": 6932} {"train_loss": -28.198089599609375, "global_step": 575432, "epoch": 6932} {"train_loss": -28.06629753112793, "global_step": 575433, "epoch": 6932} {"train_loss": -28.056432723999023, "global_step": 575434, "epoch": 6932} {"train_loss": -27.87992286682129, "global_step": 575435, "epoch": 6932} {"train_loss": -28.064029693603516, "global_step": 575436, "epoch": 6932} {"train_loss": -27.872854232788086, "global_step": 575437, "epoch": 6932} {"train_loss": -27.884785824511425, "global_step": 575438, "epoch": 6932, "val_loss": 6513816.5} {"train_loss": -27.469573974609375, "global_step": 575439, "epoch": 6933} {"train_loss": -27.225988388061523, "global_step": 575440, "epoch": 6933} {"train_loss": -27.177719116210938, "global_step": 575441, "epoch": 6933} {"train_loss": -27.505340576171875, "global_step": 575442, "epoch": 6933} {"train_loss": -27.3989315032959, "global_step": 575443, "epoch": 6933} {"train_loss": -27.59540367126465, "global_step": 575444, "epoch": 6933} {"train_loss": -27.432647705078125, "global_step": 575445, "epoch": 6933} {"train_loss": -27.642383575439453, "global_step": 575446, "epoch": 6933} {"train_loss": -27.2064208984375, "global_step": 575447, "epoch": 6933} {"train_loss": -27.877552032470703, "global_step": 575448, "epoch": 6933} {"train_loss": -26.800268173217773, "global_step": 575449, "epoch": 6933} {"train_loss": -27.5318660736084, "global_step": 575450, "epoch": 6933} {"train_loss": -27.619836807250977, "global_step": 575451, "epoch": 6933} {"train_loss": -27.45831871032715, "global_step": 575452, "epoch": 6933} {"train_loss": -27.4077091217041, "global_step": 575453, "epoch": 6933} {"train_loss": -27.464487075805664, "global_step": 575454, "epoch": 6933} {"train_loss": -27.042789459228516, "global_step": 575455, "epoch": 6933} {"train_loss": -27.147632598876953, "global_step": 575456, "epoch": 6933} {"train_loss": -27.493518829345703, "global_step": 575457, "epoch": 6933} {"train_loss": -27.47812843322754, "global_step": 575458, "epoch": 6933} {"train_loss": -27.329925537109375, "global_step": 575459, "epoch": 6933} {"train_loss": -27.6617488861084, "global_step": 575460, "epoch": 6933} {"train_loss": -27.656295776367188, "global_step": 575461, "epoch": 6933} {"train_loss": -27.778295516967773, "global_step": 575462, "epoch": 6933} {"train_loss": -27.78107261657715, "global_step": 575463, "epoch": 6933} {"train_loss": -27.639652252197266, "global_step": 575464, "epoch": 6933} {"train_loss": -27.408771514892578, "global_step": 575465, "epoch": 6933} {"train_loss": -27.75201988220215, "global_step": 575466, "epoch": 6933} {"train_loss": -27.7216739654541, "global_step": 575467, "epoch": 6933} {"train_loss": -27.79178810119629, "global_step": 575468, "epoch": 6933} {"train_loss": -27.703760147094727, "global_step": 575469, "epoch": 6933} {"train_loss": -27.433820724487305, "global_step": 575470, "epoch": 6933} {"train_loss": -27.689102172851562, "global_step": 575471, "epoch": 6933} {"train_loss": -28.09089469909668, "global_step": 575472, "epoch": 6933} {"train_loss": -27.581689834594727, "global_step": 575473, "epoch": 6933} {"train_loss": -27.601743698120117, "global_step": 575474, "epoch": 6933} {"train_loss": -28.360828399658203, "global_step": 575475, "epoch": 6933} {"train_loss": -28.23145866394043, "global_step": 575476, "epoch": 6933} {"train_loss": -28.081323623657227, "global_step": 575477, "epoch": 6933} {"train_loss": -27.9915714263916, "global_step": 575478, "epoch": 6933} {"train_loss": -27.915267944335938, "global_step": 575479, "epoch": 6933} {"train_loss": -28.20306396484375, "global_step": 575480, "epoch": 6933} {"train_loss": -27.981409072875977, "global_step": 575481, "epoch": 6933} {"train_loss": -28.006887435913086, "global_step": 575482, "epoch": 6933} {"train_loss": -27.971113204956055, "global_step": 575483, "epoch": 6933} {"train_loss": -27.855783462524414, "global_step": 575484, "epoch": 6933} {"train_loss": -27.514698028564453, "global_step": 575485, "epoch": 6933} {"train_loss": -27.927066802978516, "global_step": 575486, "epoch": 6933} {"train_loss": -27.879011154174805, "global_step": 575487, "epoch": 6933} {"train_loss": -27.9823055267334, "global_step": 575488, "epoch": 6933} {"train_loss": -28.080398559570312, "global_step": 575489, "epoch": 6933} {"train_loss": -28.499109268188477, "global_step": 575490, "epoch": 6933} {"train_loss": -27.679975509643555, "global_step": 575491, "epoch": 6933} {"train_loss": -28.160810470581055, "global_step": 575492, "epoch": 6933} {"train_loss": -28.019071578979492, "global_step": 575493, "epoch": 6933} {"train_loss": -28.185956954956055, "global_step": 575494, "epoch": 6933} {"train_loss": -28.427534103393555, "global_step": 575495, "epoch": 6933} {"train_loss": -27.972410202026367, "global_step": 575496, "epoch": 6933} {"train_loss": -28.076765060424805, "global_step": 575497, "epoch": 6933} {"train_loss": -28.176380157470703, "global_step": 575498, "epoch": 6933} {"train_loss": -28.038043975830078, "global_step": 575499, "epoch": 6933} {"train_loss": -28.35542869567871, "global_step": 575500, "epoch": 6933} {"train_loss": -28.179035186767578, "global_step": 575501, "epoch": 6933} {"train_loss": -27.51272964477539, "global_step": 575502, "epoch": 6933} {"train_loss": -27.656274795532227, "global_step": 575503, "epoch": 6933} {"train_loss": -26.921201705932617, "global_step": 575504, "epoch": 6933} {"train_loss": -26.28352165222168, "global_step": 575505, "epoch": 6933} {"train_loss": -26.97681999206543, "global_step": 575506, "epoch": 6933} {"train_loss": -27.944955825805664, "global_step": 575507, "epoch": 6933} {"train_loss": -27.6817626953125, "global_step": 575508, "epoch": 6933} {"train_loss": -27.393268585205078, "global_step": 575509, "epoch": 6933} {"train_loss": -27.6085205078125, "global_step": 575510, "epoch": 6933} {"train_loss": -27.44378662109375, "global_step": 575511, "epoch": 6933} {"train_loss": -27.451862335205078, "global_step": 575512, "epoch": 6933} {"train_loss": -27.812519073486328, "global_step": 575513, "epoch": 6933} {"train_loss": -27.988489151000977, "global_step": 575514, "epoch": 6933} {"train_loss": -27.80616569519043, "global_step": 575515, "epoch": 6933} {"train_loss": -27.57769203186035, "global_step": 575516, "epoch": 6933} {"train_loss": -27.96219253540039, "global_step": 575517, "epoch": 6933} {"train_loss": -27.81585121154785, "global_step": 575518, "epoch": 6933} {"train_loss": -27.791900634765625, "global_step": 575519, "epoch": 6933} {"train_loss": -27.969736099243164, "global_step": 575520, "epoch": 6933} {"train_loss": -27.679928469370648, "global_step": 575521, "epoch": 6933, "val_loss": 6560603.0} {"train_loss": -27.691207885742188, "global_step": 575522, "epoch": 6934} {"train_loss": -27.320337295532227, "global_step": 575523, "epoch": 6934} {"train_loss": -27.215076446533203, "global_step": 575524, "epoch": 6934} {"train_loss": -27.16727066040039, "global_step": 575525, "epoch": 6934} {"train_loss": -27.124780654907227, "global_step": 575526, "epoch": 6934} {"train_loss": -27.42970085144043, "global_step": 575527, "epoch": 6934} {"train_loss": -27.570037841796875, "global_step": 575528, "epoch": 6934} {"train_loss": -27.332660675048828, "global_step": 575529, "epoch": 6934} {"train_loss": -27.78285026550293, "global_step": 575530, "epoch": 6934} {"train_loss": -27.694263458251953, "global_step": 575531, "epoch": 6934} {"train_loss": -27.70607566833496, "global_step": 575532, "epoch": 6934} {"train_loss": -27.405759811401367, "global_step": 575533, "epoch": 6934} {"train_loss": -27.508472442626953, "global_step": 575534, "epoch": 6934} {"train_loss": -27.747314453125, "global_step": 575535, "epoch": 6934} {"train_loss": -27.329343795776367, "global_step": 575536, "epoch": 6934} {"train_loss": -27.646881103515625, "global_step": 575537, "epoch": 6934} {"train_loss": -27.785064697265625, "global_step": 575538, "epoch": 6934} {"train_loss": -27.867996215820312, "global_step": 575539, "epoch": 6934} {"train_loss": -27.529462814331055, "global_step": 575540, "epoch": 6934} {"train_loss": -27.62465476989746, "global_step": 575541, "epoch": 6934} {"train_loss": -28.10078239440918, "global_step": 575542, "epoch": 6934} {"train_loss": -28.3081111907959, "global_step": 575543, "epoch": 6934} {"train_loss": -27.86903953552246, "global_step": 575544, "epoch": 6934} {"train_loss": -28.14657974243164, "global_step": 575545, "epoch": 6934} {"train_loss": -27.740148544311523, "global_step": 575546, "epoch": 6934} {"train_loss": -27.667932510375977, "global_step": 575547, "epoch": 6934} {"train_loss": -27.805078506469727, "global_step": 575548, "epoch": 6934} {"train_loss": -27.68674087524414, "global_step": 575549, "epoch": 6934} {"train_loss": -27.8691349029541, "global_step": 575550, "epoch": 6934} {"train_loss": -28.078125, "global_step": 575551, "epoch": 6934} {"train_loss": -28.048330307006836, "global_step": 575552, "epoch": 6934} {"train_loss": -27.734027862548828, "global_step": 575553, "epoch": 6934} {"train_loss": -28.360767364501953, "global_step": 575554, "epoch": 6934} {"train_loss": -28.279890060424805, "global_step": 575555, "epoch": 6934} {"train_loss": -27.843353271484375, "global_step": 575556, "epoch": 6934} {"train_loss": -27.82545280456543, "global_step": 575557, "epoch": 6934} {"train_loss": -27.866567611694336, "global_step": 575558, "epoch": 6934} {"train_loss": -28.001300811767578, "global_step": 575559, "epoch": 6934} {"train_loss": -27.63203239440918, "global_step": 575560, "epoch": 6934} {"train_loss": -27.995410919189453, "global_step": 575561, "epoch": 6934} {"train_loss": -27.626789093017578, "global_step": 575562, "epoch": 6934} {"train_loss": -27.86136817932129, "global_step": 575563, "epoch": 6934} {"train_loss": -28.254968643188477, "global_step": 575564, "epoch": 6934} {"train_loss": -28.229501724243164, "global_step": 575565, "epoch": 6934} {"train_loss": -27.97821044921875, "global_step": 575566, "epoch": 6934} {"train_loss": -28.15470314025879, "global_step": 575567, "epoch": 6934} {"train_loss": -28.1343936920166, "global_step": 575568, "epoch": 6934} {"train_loss": -28.00608253479004, "global_step": 575569, "epoch": 6934} {"train_loss": -27.933340072631836, "global_step": 575570, "epoch": 6934} {"train_loss": -28.064697265625, "global_step": 575571, "epoch": 6934} {"train_loss": -28.07879638671875, "global_step": 575572, "epoch": 6934} {"train_loss": -27.71809196472168, "global_step": 575573, "epoch": 6934} {"train_loss": -27.359527587890625, "global_step": 575574, "epoch": 6934} {"train_loss": -27.356870651245117, "global_step": 575575, "epoch": 6934} {"train_loss": -27.521360397338867, "global_step": 575576, "epoch": 6934} {"train_loss": -27.88931655883789, "global_step": 575577, "epoch": 6934} {"train_loss": -27.553333282470703, "global_step": 575578, "epoch": 6934} {"train_loss": -27.622236251831055, "global_step": 575579, "epoch": 6934} {"train_loss": -27.41584587097168, "global_step": 575580, "epoch": 6934} {"train_loss": -27.562103271484375, "global_step": 575581, "epoch": 6934} {"train_loss": -28.150848388671875, "global_step": 575582, "epoch": 6934} {"train_loss": -27.408231735229492, "global_step": 575583, "epoch": 6934} {"train_loss": -27.938688278198242, "global_step": 575584, "epoch": 6934} {"train_loss": -28.02046012878418, "global_step": 575585, "epoch": 6934} {"train_loss": -27.513748168945312, "global_step": 575586, "epoch": 6934} {"train_loss": -28.377798080444336, "global_step": 575587, "epoch": 6934} {"train_loss": -27.727039337158203, "global_step": 575588, "epoch": 6934} {"train_loss": -27.744123458862305, "global_step": 575589, "epoch": 6934} {"train_loss": -27.923389434814453, "global_step": 575590, "epoch": 6934} {"train_loss": -27.816009521484375, "global_step": 575591, "epoch": 6934} {"train_loss": -27.54612159729004, "global_step": 575592, "epoch": 6934} {"train_loss": -28.112714767456055, "global_step": 575593, "epoch": 6934} {"train_loss": -27.5042724609375, "global_step": 575594, "epoch": 6934} {"train_loss": -27.5076961517334, "global_step": 575595, "epoch": 6934} {"train_loss": -27.652027130126953, "global_step": 575596, "epoch": 6934} {"train_loss": -27.653064727783203, "global_step": 575597, "epoch": 6934} {"train_loss": -27.972631454467773, "global_step": 575598, "epoch": 6934} {"train_loss": -27.789474487304688, "global_step": 575599, "epoch": 6934} {"train_loss": -28.071949005126953, "global_step": 575600, "epoch": 6934} {"train_loss": -27.59067153930664, "global_step": 575601, "epoch": 6934} {"train_loss": -27.807357788085938, "global_step": 575602, "epoch": 6934} {"train_loss": -27.907800674438477, "global_step": 575603, "epoch": 6934} {"train_loss": -27.763160567685784, "global_step": 575604, "epoch": 6934, "val_loss": 6532728.5} {"train_loss": -27.399927139282227, "global_step": 575605, "epoch": 6935} {"train_loss": -27.459003448486328, "global_step": 575606, "epoch": 6935} {"train_loss": -27.40030860900879, "global_step": 575607, "epoch": 6935} {"train_loss": -26.500898361206055, "global_step": 575608, "epoch": 6935} {"train_loss": -26.575307846069336, "global_step": 575609, "epoch": 6935} {"train_loss": -27.10359001159668, "global_step": 575610, "epoch": 6935} {"train_loss": -27.50599479675293, "global_step": 575611, "epoch": 6935} {"train_loss": -27.081995010375977, "global_step": 575612, "epoch": 6935} {"train_loss": -27.390974044799805, "global_step": 575613, "epoch": 6935} {"train_loss": -27.5135440826416, "global_step": 575614, "epoch": 6935} {"train_loss": -27.28484535217285, "global_step": 575615, "epoch": 6935} {"train_loss": -27.380544662475586, "global_step": 575616, "epoch": 6935} {"train_loss": -27.746870040893555, "global_step": 575617, "epoch": 6935} {"train_loss": -27.13521385192871, "global_step": 575618, "epoch": 6935} {"train_loss": -27.11627769470215, "global_step": 575619, "epoch": 6935} {"train_loss": -27.60672950744629, "global_step": 575620, "epoch": 6935} {"train_loss": -27.488615036010742, "global_step": 575621, "epoch": 6935} {"train_loss": -26.96050453186035, "global_step": 575622, "epoch": 6935} {"train_loss": -27.558563232421875, "global_step": 575623, "epoch": 6935} {"train_loss": -27.323776245117188, "global_step": 575624, "epoch": 6935} {"train_loss": -27.464248657226562, "global_step": 575625, "epoch": 6935} {"train_loss": -27.804779052734375, "global_step": 575626, "epoch": 6935} {"train_loss": -27.55669593811035, "global_step": 575627, "epoch": 6935} {"train_loss": -27.827960968017578, "global_step": 575628, "epoch": 6935} {"train_loss": -27.49237060546875, "global_step": 575629, "epoch": 6935} {"train_loss": -27.459396362304688, "global_step": 575630, "epoch": 6935} {"train_loss": -27.802167892456055, "global_step": 575631, "epoch": 6935} {"train_loss": -27.57374382019043, "global_step": 575632, "epoch": 6935} {"train_loss": -27.508161544799805, "global_step": 575633, "epoch": 6935} {"train_loss": -27.929101943969727, "global_step": 575634, "epoch": 6935} {"train_loss": -27.577041625976562, "global_step": 575635, "epoch": 6935} {"train_loss": -27.726245880126953, "global_step": 575636, "epoch": 6935} {"train_loss": -27.786102294921875, "global_step": 575637, "epoch": 6935} {"train_loss": -27.840967178344727, "global_step": 575638, "epoch": 6935} {"train_loss": -27.9703426361084, "global_step": 575639, "epoch": 6935} {"train_loss": -27.78366470336914, "global_step": 575640, "epoch": 6935} {"train_loss": -27.908124923706055, "global_step": 575641, "epoch": 6935} {"train_loss": -27.566852569580078, "global_step": 575642, "epoch": 6935} {"train_loss": -27.96134376525879, "global_step": 575643, "epoch": 6935} {"train_loss": -27.540603637695312, "global_step": 575644, "epoch": 6935} {"train_loss": -27.8347110748291, "global_step": 575645, "epoch": 6935} {"train_loss": -27.740991592407227, "global_step": 575646, "epoch": 6935} {"train_loss": -27.88008689880371, "global_step": 575647, "epoch": 6935} {"train_loss": -27.94293785095215, "global_step": 575648, "epoch": 6935} {"train_loss": -28.13972282409668, "global_step": 575649, "epoch": 6935} {"train_loss": -28.138763427734375, "global_step": 575650, "epoch": 6935} {"train_loss": -27.84366226196289, "global_step": 575651, "epoch": 6935} {"train_loss": -27.908588409423828, "global_step": 575652, "epoch": 6935} {"train_loss": -28.078556060791016, "global_step": 575653, "epoch": 6935} {"train_loss": -28.183027267456055, "global_step": 575654, "epoch": 6935} {"train_loss": -28.239643096923828, "global_step": 575655, "epoch": 6935} {"train_loss": -27.877622604370117, "global_step": 575656, "epoch": 6935} {"train_loss": -27.683349609375, "global_step": 575657, "epoch": 6935} {"train_loss": -28.13852310180664, "global_step": 575658, "epoch": 6935} {"train_loss": -27.992572784423828, "global_step": 575659, "epoch": 6935} {"train_loss": -28.124008178710938, "global_step": 575660, "epoch": 6935} {"train_loss": -28.014606475830078, "global_step": 575661, "epoch": 6935} {"train_loss": -28.0730037689209, "global_step": 575662, "epoch": 6935} {"train_loss": -28.153409957885742, "global_step": 575663, "epoch": 6935} {"train_loss": -28.433780670166016, "global_step": 575664, "epoch": 6935} {"train_loss": -27.703123092651367, "global_step": 575665, "epoch": 6935} {"train_loss": -27.853544235229492, "global_step": 575666, "epoch": 6935} {"train_loss": -28.040624618530273, "global_step": 575667, "epoch": 6935} {"train_loss": -27.899023056030273, "global_step": 575668, "epoch": 6935} {"train_loss": -28.155553817749023, "global_step": 575669, "epoch": 6935} {"train_loss": -27.942230224609375, "global_step": 575670, "epoch": 6935} {"train_loss": -28.106037139892578, "global_step": 575671, "epoch": 6935} {"train_loss": -27.862768173217773, "global_step": 575672, "epoch": 6935} {"train_loss": -27.86224937438965, "global_step": 575673, "epoch": 6935} {"train_loss": -27.673837661743164, "global_step": 575674, "epoch": 6935} {"train_loss": -28.05246925354004, "global_step": 575675, "epoch": 6935} {"train_loss": -27.90767478942871, "global_step": 575676, "epoch": 6935} {"train_loss": -27.801782608032227, "global_step": 575677, "epoch": 6935} {"train_loss": -28.16450309753418, "global_step": 575678, "epoch": 6935} {"train_loss": -27.822132110595703, "global_step": 575679, "epoch": 6935} {"train_loss": -28.113637924194336, "global_step": 575680, "epoch": 6935} {"train_loss": -28.026153564453125, "global_step": 575681, "epoch": 6935} {"train_loss": -27.855749130249023, "global_step": 575682, "epoch": 6935} {"train_loss": -27.629541397094727, "global_step": 575683, "epoch": 6935} {"train_loss": -27.523365020751953, "global_step": 575684, "epoch": 6935} {"train_loss": -27.582731246948242, "global_step": 575685, "epoch": 6935} {"train_loss": -28.05201530456543, "global_step": 575686, "epoch": 6935} {"train_loss": -27.73807109694883, "global_step": 575687, "epoch": 6935, "val_loss": 6609210.0} {"train_loss": -27.609851837158203, "global_step": 575688, "epoch": 6936} {"train_loss": -27.13226318359375, "global_step": 575689, "epoch": 6936} {"train_loss": -27.031766891479492, "global_step": 575690, "epoch": 6936} {"train_loss": -27.433923721313477, "global_step": 575691, "epoch": 6936} {"train_loss": -26.9564208984375, "global_step": 575692, "epoch": 6936} {"train_loss": -27.2236385345459, "global_step": 575693, "epoch": 6936} {"train_loss": -26.81666374206543, "global_step": 575694, "epoch": 6936} {"train_loss": -27.50614356994629, "global_step": 575695, "epoch": 6936} {"train_loss": -27.328821182250977, "global_step": 575696, "epoch": 6936} {"train_loss": -27.561857223510742, "global_step": 575697, "epoch": 6936} {"train_loss": -27.505191802978516, "global_step": 575698, "epoch": 6936} {"train_loss": -27.44529151916504, "global_step": 575699, "epoch": 6936} {"train_loss": -27.778186798095703, "global_step": 575700, "epoch": 6936} {"train_loss": -27.52312660217285, "global_step": 575701, "epoch": 6936} {"train_loss": -27.761138916015625, "global_step": 575702, "epoch": 6936} {"train_loss": -27.662399291992188, "global_step": 575703, "epoch": 6936} {"train_loss": -27.534589767456055, "global_step": 575704, "epoch": 6936} {"train_loss": -27.729022979736328, "global_step": 575705, "epoch": 6936} {"train_loss": -27.883054733276367, "global_step": 575706, "epoch": 6936} {"train_loss": -27.757917404174805, "global_step": 575707, "epoch": 6936} {"train_loss": -27.884016036987305, "global_step": 575708, "epoch": 6936} {"train_loss": -27.89788818359375, "global_step": 575709, "epoch": 6936} {"train_loss": -27.52161979675293, "global_step": 575710, "epoch": 6936} {"train_loss": -28.17898941040039, "global_step": 575711, "epoch": 6936} {"train_loss": -27.840787887573242, "global_step": 575712, "epoch": 6936} {"train_loss": -27.866979598999023, "global_step": 575713, "epoch": 6936} {"train_loss": -27.675363540649414, "global_step": 575714, "epoch": 6936} {"train_loss": -27.8759708404541, "global_step": 575715, "epoch": 6936} {"train_loss": -28.187170028686523, "global_step": 575716, "epoch": 6936} {"train_loss": -28.16438102722168, "global_step": 575717, "epoch": 6936} {"train_loss": -28.128681182861328, "global_step": 575718, "epoch": 6936} {"train_loss": -27.964262008666992, "global_step": 575719, "epoch": 6936} {"train_loss": -28.103046417236328, "global_step": 575720, "epoch": 6936} {"train_loss": -28.212446212768555, "global_step": 575721, "epoch": 6936} {"train_loss": -28.038782119750977, "global_step": 575722, "epoch": 6936} {"train_loss": -28.105337142944336, "global_step": 575723, "epoch": 6936} {"train_loss": -27.486560821533203, "global_step": 575724, "epoch": 6936} {"train_loss": -28.452207565307617, "global_step": 575725, "epoch": 6936} {"train_loss": -27.777921676635742, "global_step": 575726, "epoch": 6936} {"train_loss": -28.039352416992188, "global_step": 575727, "epoch": 6936} {"train_loss": -28.373437881469727, "global_step": 575728, "epoch": 6936} {"train_loss": -28.167001724243164, "global_step": 575729, "epoch": 6936} {"train_loss": -28.170547485351562, "global_step": 575730, "epoch": 6936} {"train_loss": -28.015966415405273, "global_step": 575731, "epoch": 6936} {"train_loss": -28.305158615112305, "global_step": 575732, "epoch": 6936} {"train_loss": -28.17779541015625, "global_step": 575733, "epoch": 6936} {"train_loss": -28.074472427368164, "global_step": 575734, "epoch": 6936} {"train_loss": -28.056150436401367, "global_step": 575735, "epoch": 6936} {"train_loss": -27.78769874572754, "global_step": 575736, "epoch": 6936} {"train_loss": -28.30706787109375, "global_step": 575737, "epoch": 6936} {"train_loss": -28.49382972717285, "global_step": 575738, "epoch": 6936} {"train_loss": -28.021757125854492, "global_step": 575739, "epoch": 6936} {"train_loss": -27.673206329345703, "global_step": 575740, "epoch": 6936} {"train_loss": -27.83342933654785, "global_step": 575741, "epoch": 6936} {"train_loss": -28.19991111755371, "global_step": 575742, "epoch": 6936} {"train_loss": -27.956579208374023, "global_step": 575743, "epoch": 6936} {"train_loss": -27.66108512878418, "global_step": 575744, "epoch": 6936} {"train_loss": -27.651060104370117, "global_step": 575745, "epoch": 6936} {"train_loss": -27.773664474487305, "global_step": 575746, "epoch": 6936} {"train_loss": -27.90681266784668, "global_step": 575747, "epoch": 6936} {"train_loss": -27.92646598815918, "global_step": 575748, "epoch": 6936} {"train_loss": -27.5794677734375, "global_step": 575749, "epoch": 6936} {"train_loss": -27.414209365844727, "global_step": 575750, "epoch": 6936} {"train_loss": -28.055517196655273, "global_step": 575751, "epoch": 6936} {"train_loss": -27.717914581298828, "global_step": 575752, "epoch": 6936} {"train_loss": -27.450170516967773, "global_step": 575753, "epoch": 6936} {"train_loss": -27.698287963867188, "global_step": 575754, "epoch": 6936} {"train_loss": -27.540115356445312, "global_step": 575755, "epoch": 6936} {"train_loss": -27.40264892578125, "global_step": 575756, "epoch": 6936} {"train_loss": -27.64507484436035, "global_step": 575757, "epoch": 6936} {"train_loss": -27.452056884765625, "global_step": 575758, "epoch": 6936} {"train_loss": -27.48554039001465, "global_step": 575759, "epoch": 6936} {"train_loss": -27.46787452697754, "global_step": 575760, "epoch": 6936} {"train_loss": -27.51045036315918, "global_step": 575761, "epoch": 6936} {"train_loss": -27.945541381835938, "global_step": 575762, "epoch": 6936} {"train_loss": -27.326038360595703, "global_step": 575763, "epoch": 6936} {"train_loss": -27.04701042175293, "global_step": 575764, "epoch": 6936} {"train_loss": -26.884750366210938, "global_step": 575765, "epoch": 6936} {"train_loss": -27.58938980102539, "global_step": 575766, "epoch": 6936} {"train_loss": -27.67384147644043, "global_step": 575767, "epoch": 6936} {"train_loss": -27.56141471862793, "global_step": 575768, "epoch": 6936} {"train_loss": -27.500959396362305, "global_step": 575769, "epoch": 6936} {"train_loss": -27.749115013214478, "global_step": 575770, "epoch": 6936, "val_loss": 6546648.0} {"train_loss": -26.664533615112305, "global_step": 575771, "epoch": 6937} {"train_loss": -26.912567138671875, "global_step": 575772, "epoch": 6937} {"train_loss": -26.640966415405273, "global_step": 575773, "epoch": 6937} {"train_loss": -27.093748092651367, "global_step": 575774, "epoch": 6937} {"train_loss": -26.637170791625977, "global_step": 575775, "epoch": 6937} {"train_loss": -26.627273559570312, "global_step": 575776, "epoch": 6937} {"train_loss": -26.80409049987793, "global_step": 575777, "epoch": 6937} {"train_loss": -27.15803337097168, "global_step": 575778, "epoch": 6937} {"train_loss": -27.173084259033203, "global_step": 575779, "epoch": 6937} {"train_loss": -26.88459587097168, "global_step": 575780, "epoch": 6937} {"train_loss": -27.2635440826416, "global_step": 575781, "epoch": 6937} {"train_loss": -26.980798721313477, "global_step": 575782, "epoch": 6937} {"train_loss": -27.28053855895996, "global_step": 575783, "epoch": 6937} {"train_loss": -27.379880905151367, "global_step": 575784, "epoch": 6937} {"train_loss": -27.338796615600586, "global_step": 575785, "epoch": 6937} {"train_loss": -27.274810791015625, "global_step": 575786, "epoch": 6937} {"train_loss": -27.651281356811523, "global_step": 575787, "epoch": 6937} {"train_loss": -27.394580841064453, "global_step": 575788, "epoch": 6937} {"train_loss": -27.471893310546875, "global_step": 575789, "epoch": 6937} {"train_loss": -27.851078033447266, "global_step": 575790, "epoch": 6937} {"train_loss": -27.497915267944336, "global_step": 575791, "epoch": 6937} {"train_loss": -27.686384201049805, "global_step": 575792, "epoch": 6937} {"train_loss": -27.834918975830078, "global_step": 575793, "epoch": 6937} {"train_loss": -27.2654972076416, "global_step": 575794, "epoch": 6937} {"train_loss": -27.65619468688965, "global_step": 575795, "epoch": 6937} {"train_loss": -27.912403106689453, "global_step": 575796, "epoch": 6937} {"train_loss": -27.8581485748291, "global_step": 575797, "epoch": 6937} {"train_loss": -27.517383575439453, "global_step": 575798, "epoch": 6937} {"train_loss": -28.1697940826416, "global_step": 575799, "epoch": 6937} {"train_loss": -27.98301124572754, "global_step": 575800, "epoch": 6937} {"train_loss": -28.080671310424805, "global_step": 575801, "epoch": 6937} {"train_loss": -27.682897567749023, "global_step": 575802, "epoch": 6937} {"train_loss": -27.775964736938477, "global_step": 575803, "epoch": 6937} {"train_loss": -28.12101173400879, "global_step": 575804, "epoch": 6937} {"train_loss": -28.2218074798584, "global_step": 575805, "epoch": 6937} {"train_loss": -28.09907341003418, "global_step": 575806, "epoch": 6937} {"train_loss": -28.1041316986084, "global_step": 575807, "epoch": 6937} {"train_loss": -27.946619033813477, "global_step": 575808, "epoch": 6937} {"train_loss": -27.929174423217773, "global_step": 575809, "epoch": 6937} {"train_loss": -27.91377067565918, "global_step": 575810, "epoch": 6937} {"train_loss": -27.8782958984375, "global_step": 575811, "epoch": 6937} {"train_loss": -27.915327072143555, "global_step": 575812, "epoch": 6937} {"train_loss": -28.125141143798828, "global_step": 575813, "epoch": 6937} {"train_loss": -27.95526123046875, "global_step": 575814, "epoch": 6937} {"train_loss": -27.869312286376953, "global_step": 575815, "epoch": 6937} {"train_loss": -28.102680206298828, "global_step": 575816, "epoch": 6937} {"train_loss": -28.08902359008789, "global_step": 575817, "epoch": 6937} {"train_loss": -28.053686141967773, "global_step": 575818, "epoch": 6937} {"train_loss": -27.415042877197266, "global_step": 575819, "epoch": 6937} {"train_loss": -27.626874923706055, "global_step": 575820, "epoch": 6937} {"train_loss": -28.034103393554688, "global_step": 575821, "epoch": 6937} {"train_loss": -27.696264266967773, "global_step": 575822, "epoch": 6937} {"train_loss": -27.95269203186035, "global_step": 575823, "epoch": 6937} {"train_loss": -27.814682006835938, "global_step": 575824, "epoch": 6937} {"train_loss": -27.760971069335938, "global_step": 575825, "epoch": 6937} {"train_loss": -28.01141929626465, "global_step": 575826, "epoch": 6937} {"train_loss": -28.046131134033203, "global_step": 575827, "epoch": 6937} {"train_loss": -27.698505401611328, "global_step": 575828, "epoch": 6937} {"train_loss": -27.618350982666016, "global_step": 575829, "epoch": 6937} {"train_loss": -28.037384033203125, "global_step": 575830, "epoch": 6937} {"train_loss": -27.649234771728516, "global_step": 575831, "epoch": 6937} {"train_loss": -27.9077205657959, "global_step": 575832, "epoch": 6937} {"train_loss": -28.01443862915039, "global_step": 575833, "epoch": 6937} {"train_loss": -27.64495849609375, "global_step": 575834, "epoch": 6937} {"train_loss": -27.553470611572266, "global_step": 575835, "epoch": 6937} {"train_loss": -28.15521240234375, "global_step": 575836, "epoch": 6937} {"train_loss": -27.840301513671875, "global_step": 575837, "epoch": 6937} {"train_loss": -28.14332389831543, "global_step": 575838, "epoch": 6937} {"train_loss": -28.012420654296875, "global_step": 575839, "epoch": 6937} {"train_loss": -27.94672203063965, "global_step": 575840, "epoch": 6937} {"train_loss": -27.86683464050293, "global_step": 575841, "epoch": 6937} {"train_loss": -28.1778507232666, "global_step": 575842, "epoch": 6937} {"train_loss": -27.737741470336914, "global_step": 575843, "epoch": 6937} {"train_loss": -27.776044845581055, "global_step": 575844, "epoch": 6937} {"train_loss": -28.02906608581543, "global_step": 575845, "epoch": 6937} {"train_loss": -27.916540145874023, "global_step": 575846, "epoch": 6937} {"train_loss": -28.0042781829834, "global_step": 575847, "epoch": 6937} {"train_loss": -27.784088134765625, "global_step": 575848, "epoch": 6937} {"train_loss": -27.99420738220215, "global_step": 575849, "epoch": 6937} {"train_loss": -28.304426193237305, "global_step": 575850, "epoch": 6937} {"train_loss": -28.1181583404541, "global_step": 575851, "epoch": 6937} {"train_loss": -28.29294204711914, "global_step": 575852, "epoch": 6937} {"train_loss": -27.718900197959808, "global_step": 575853, "epoch": 6937, "val_loss": 6562390.0} {"train_loss": -27.61887550354004, "global_step": 575854, "epoch": 6938} {"train_loss": -26.867399215698242, "global_step": 575855, "epoch": 6938} {"train_loss": -26.15738296508789, "global_step": 575856, "epoch": 6938} {"train_loss": -26.414167404174805, "global_step": 575857, "epoch": 6938} {"train_loss": -27.260313034057617, "global_step": 575858, "epoch": 6938} {"train_loss": -27.360260009765625, "global_step": 575859, "epoch": 6938} {"train_loss": -27.055557250976562, "global_step": 575860, "epoch": 6938} {"train_loss": -27.17840003967285, "global_step": 575861, "epoch": 6938} {"train_loss": -27.35333824157715, "global_step": 575862, "epoch": 6938} {"train_loss": -27.380868911743164, "global_step": 575863, "epoch": 6938} {"train_loss": -27.52875328063965, "global_step": 575864, "epoch": 6938} {"train_loss": -27.59773063659668, "global_step": 575865, "epoch": 6938} {"train_loss": -27.414518356323242, "global_step": 575866, "epoch": 6938} {"train_loss": -27.386396408081055, "global_step": 575867, "epoch": 6938} {"train_loss": -27.938642501831055, "global_step": 575868, "epoch": 6938} {"train_loss": -27.54534339904785, "global_step": 575869, "epoch": 6938} {"train_loss": -27.30191993713379, "global_step": 575870, "epoch": 6938} {"train_loss": -27.479398727416992, "global_step": 575871, "epoch": 6938} {"train_loss": -27.796377182006836, "global_step": 575872, "epoch": 6938} {"train_loss": -27.667444229125977, "global_step": 575873, "epoch": 6938} {"train_loss": -27.749420166015625, "global_step": 575874, "epoch": 6938} {"train_loss": -27.720523834228516, "global_step": 575875, "epoch": 6938} {"train_loss": -27.57643699645996, "global_step": 575876, "epoch": 6938} {"train_loss": -27.96260643005371, "global_step": 575877, "epoch": 6938} {"train_loss": -27.93303871154785, "global_step": 575878, "epoch": 6938} {"train_loss": -27.921375274658203, "global_step": 575879, "epoch": 6938} {"train_loss": -28.0759334564209, "global_step": 575880, "epoch": 6938} {"train_loss": -27.5875244140625, "global_step": 575881, "epoch": 6938} {"train_loss": -27.81671714782715, "global_step": 575882, "epoch": 6938} {"train_loss": -27.733718872070312, "global_step": 575883, "epoch": 6938} {"train_loss": -27.950754165649414, "global_step": 575884, "epoch": 6938} {"train_loss": -27.954099655151367, "global_step": 575885, "epoch": 6938} {"train_loss": -27.978994369506836, "global_step": 575886, "epoch": 6938} {"train_loss": -28.145233154296875, "global_step": 575887, "epoch": 6938} {"train_loss": -28.158599853515625, "global_step": 575888, "epoch": 6938} {"train_loss": -28.134830474853516, "global_step": 575889, "epoch": 6938} {"train_loss": -27.807697296142578, "global_step": 575890, "epoch": 6938} {"train_loss": -27.931598663330078, "global_step": 575891, "epoch": 6938} {"train_loss": -27.942468643188477, "global_step": 575892, "epoch": 6938} {"train_loss": -27.884130477905273, "global_step": 575893, "epoch": 6938} {"train_loss": -27.96034049987793, "global_step": 575894, "epoch": 6938} {"train_loss": -27.67583656311035, "global_step": 575895, "epoch": 6938} {"train_loss": -27.999496459960938, "global_step": 575896, "epoch": 6938} {"train_loss": -27.6955509185791, "global_step": 575897, "epoch": 6938} {"train_loss": -28.129934310913086, "global_step": 575898, "epoch": 6938} {"train_loss": -27.7922306060791, "global_step": 575899, "epoch": 6938} {"train_loss": -28.1453857421875, "global_step": 575900, "epoch": 6938} {"train_loss": -28.108646392822266, "global_step": 575901, "epoch": 6938} {"train_loss": -28.332904815673828, "global_step": 575902, "epoch": 6938} {"train_loss": -28.261816024780273, "global_step": 575903, "epoch": 6938} {"train_loss": -28.232385635375977, "global_step": 575904, "epoch": 6938} {"train_loss": -28.085779190063477, "global_step": 575905, "epoch": 6938} {"train_loss": -27.8370361328125, "global_step": 575906, "epoch": 6938} {"train_loss": -27.808948516845703, "global_step": 575907, "epoch": 6938} {"train_loss": -27.991291046142578, "global_step": 575908, "epoch": 6938} {"train_loss": -28.026212692260742, "global_step": 575909, "epoch": 6938} {"train_loss": -27.672199249267578, "global_step": 575910, "epoch": 6938} {"train_loss": -27.618711471557617, "global_step": 575911, "epoch": 6938} {"train_loss": -28.249624252319336, "global_step": 575912, "epoch": 6938} {"train_loss": -28.075428009033203, "global_step": 575913, "epoch": 6938} {"train_loss": -27.72967529296875, "global_step": 575914, "epoch": 6938} {"train_loss": -27.559051513671875, "global_step": 575915, "epoch": 6938} {"train_loss": -27.71514892578125, "global_step": 575916, "epoch": 6938} {"train_loss": -27.92731285095215, "global_step": 575917, "epoch": 6938} {"train_loss": -27.97037124633789, "global_step": 575918, "epoch": 6938} {"train_loss": -28.20891761779785, "global_step": 575919, "epoch": 6938} {"train_loss": -28.076013565063477, "global_step": 575920, "epoch": 6938} {"train_loss": -27.772008895874023, "global_step": 575921, "epoch": 6938} {"train_loss": -27.98172378540039, "global_step": 575922, "epoch": 6938} {"train_loss": -27.795385360717773, "global_step": 575923, "epoch": 6938} {"train_loss": -27.933568954467773, "global_step": 575924, "epoch": 6938} {"train_loss": -28.043859481811523, "global_step": 575925, "epoch": 6938} {"train_loss": -28.136016845703125, "global_step": 575926, "epoch": 6938} {"train_loss": -27.72950553894043, "global_step": 575927, "epoch": 6938} {"train_loss": -28.267988204956055, "global_step": 575928, "epoch": 6938} {"train_loss": -28.01910972595215, "global_step": 575929, "epoch": 6938} {"train_loss": -27.952503204345703, "global_step": 575930, "epoch": 6938} {"train_loss": -27.866540908813477, "global_step": 575931, "epoch": 6938} {"train_loss": -28.19129753112793, "global_step": 575932, "epoch": 6938} {"train_loss": -27.887060165405273, "global_step": 575933, "epoch": 6938} {"train_loss": -28.086761474609375, "global_step": 575934, "epoch": 6938} {"train_loss": -28.484121322631836, "global_step": 575935, "epoch": 6938} {"train_loss": -27.793515124952936, "global_step": 575936, "epoch": 6938, "val_loss": 6587289.0} {"train_loss": -26.883909225463867, "global_step": 575937, "epoch": 6939} {"train_loss": -26.653736114501953, "global_step": 575938, "epoch": 6939} {"train_loss": -27.333311080932617, "global_step": 575939, "epoch": 6939} {"train_loss": -27.211669921875, "global_step": 575940, "epoch": 6939} {"train_loss": -26.9992733001709, "global_step": 575941, "epoch": 6939} {"train_loss": -27.45765495300293, "global_step": 575942, "epoch": 6939} {"train_loss": -26.968006134033203, "global_step": 575943, "epoch": 6939} {"train_loss": -27.517187118530273, "global_step": 575944, "epoch": 6939} {"train_loss": -26.922338485717773, "global_step": 575945, "epoch": 6939} {"train_loss": -27.07832145690918, "global_step": 575946, "epoch": 6939} {"train_loss": -27.42853355407715, "global_step": 575947, "epoch": 6939} {"train_loss": -27.504629135131836, "global_step": 575948, "epoch": 6939} {"train_loss": -27.59360122680664, "global_step": 575949, "epoch": 6939} {"train_loss": -27.280439376831055, "global_step": 575950, "epoch": 6939} {"train_loss": -27.844913482666016, "global_step": 575951, "epoch": 6939} {"train_loss": -27.37013053894043, "global_step": 575952, "epoch": 6939} {"train_loss": -27.56723976135254, "global_step": 575953, "epoch": 6939} {"train_loss": -27.713607788085938, "global_step": 575954, "epoch": 6939} {"train_loss": -27.313806533813477, "global_step": 575955, "epoch": 6939} {"train_loss": -27.4097843170166, "global_step": 575956, "epoch": 6939} {"train_loss": -27.768085479736328, "global_step": 575957, "epoch": 6939} {"train_loss": -27.603918075561523, "global_step": 575958, "epoch": 6939} {"train_loss": -27.53961753845215, "global_step": 575959, "epoch": 6939} {"train_loss": -27.89849853515625, "global_step": 575960, "epoch": 6939} {"train_loss": -27.654211044311523, "global_step": 575961, "epoch": 6939} {"train_loss": -27.64739418029785, "global_step": 575962, "epoch": 6939} {"train_loss": -27.60272216796875, "global_step": 575963, "epoch": 6939} {"train_loss": -27.75771141052246, "global_step": 575964, "epoch": 6939} {"train_loss": -28.070541381835938, "global_step": 575965, "epoch": 6939} {"train_loss": -27.667621612548828, "global_step": 575966, "epoch": 6939} {"train_loss": -27.864120483398438, "global_step": 575967, "epoch": 6939} {"train_loss": -27.673553466796875, "global_step": 575968, "epoch": 6939} {"train_loss": -27.89571189880371, "global_step": 575969, "epoch": 6939} {"train_loss": -27.905515670776367, "global_step": 575970, "epoch": 6939} {"train_loss": -28.00396156311035, "global_step": 575971, "epoch": 6939} {"train_loss": -28.000720977783203, "global_step": 575972, "epoch": 6939} {"train_loss": -27.570520401000977, "global_step": 575973, "epoch": 6939} {"train_loss": -27.637832641601562, "global_step": 575974, "epoch": 6939} {"train_loss": -28.12204933166504, "global_step": 575975, "epoch": 6939} {"train_loss": -27.754117965698242, "global_step": 575976, "epoch": 6939} {"train_loss": -28.096487045288086, "global_step": 575977, "epoch": 6939} {"train_loss": -27.864477157592773, "global_step": 575978, "epoch": 6939} {"train_loss": -27.736730575561523, "global_step": 575979, "epoch": 6939} {"train_loss": -28.100173950195312, "global_step": 575980, "epoch": 6939} {"train_loss": -27.67400550842285, "global_step": 575981, "epoch": 6939} {"train_loss": -27.85491371154785, "global_step": 575982, "epoch": 6939} {"train_loss": -27.87409782409668, "global_step": 575983, "epoch": 6939} {"train_loss": -28.079090118408203, "global_step": 575984, "epoch": 6939} {"train_loss": -27.875320434570312, "global_step": 575985, "epoch": 6939} {"train_loss": -27.1795654296875, "global_step": 575986, "epoch": 6939} {"train_loss": -28.162817001342773, "global_step": 575987, "epoch": 6939} {"train_loss": -27.614377975463867, "global_step": 575988, "epoch": 6939} {"train_loss": -28.127466201782227, "global_step": 575989, "epoch": 6939} {"train_loss": -27.59040641784668, "global_step": 575990, "epoch": 6939} {"train_loss": -28.065942764282227, "global_step": 575991, "epoch": 6939} {"train_loss": -27.689727783203125, "global_step": 575992, "epoch": 6939} {"train_loss": -27.220605850219727, "global_step": 575993, "epoch": 6939} {"train_loss": -27.090595245361328, "global_step": 575994, "epoch": 6939} {"train_loss": -27.880430221557617, "global_step": 575995, "epoch": 6939} {"train_loss": -27.788022994995117, "global_step": 575996, "epoch": 6939} {"train_loss": -27.81972312927246, "global_step": 575997, "epoch": 6939} {"train_loss": -27.831933975219727, "global_step": 575998, "epoch": 6939} {"train_loss": -27.69803237915039, "global_step": 575999, "epoch": 6939} {"train_loss": -27.855173110961914, "global_step": 576000, "epoch": 6939} {"train_loss": -27.758554458618164, "global_step": 576001, "epoch": 6939} {"train_loss": -27.918806076049805, "global_step": 576002, "epoch": 6939} {"train_loss": -28.238849639892578, "global_step": 576003, "epoch": 6939} {"train_loss": -27.685333251953125, "global_step": 576004, "epoch": 6939} {"train_loss": -28.076929092407227, "global_step": 576005, "epoch": 6939} {"train_loss": -27.648435592651367, "global_step": 576006, "epoch": 6939} {"train_loss": -28.267492294311523, "global_step": 576007, "epoch": 6939} {"train_loss": -27.317646026611328, "global_step": 576008, "epoch": 6939} {"train_loss": -27.928415298461914, "global_step": 576009, "epoch": 6939} {"train_loss": -28.319196701049805, "global_step": 576010, "epoch": 6939} {"train_loss": -27.784631729125977, "global_step": 576011, "epoch": 6939} {"train_loss": -27.404138565063477, "global_step": 576012, "epoch": 6939} {"train_loss": -27.898239135742188, "global_step": 576013, "epoch": 6939} {"train_loss": -27.910764694213867, "global_step": 576014, "epoch": 6939} {"train_loss": -28.13720703125, "global_step": 576015, "epoch": 6939} {"train_loss": -28.06680679321289, "global_step": 576016, "epoch": 6939} {"train_loss": -27.89625358581543, "global_step": 576017, "epoch": 6939} {"train_loss": -28.3170223236084, "global_step": 576018, "epoch": 6939} {"train_loss": -27.69061378111322, "global_step": 576019, "epoch": 6939, "val_loss": 6549152.0} {"train_loss": -27.619510650634766, "global_step": 576020, "epoch": 6940} {"train_loss": -27.5076847076416, "global_step": 576021, "epoch": 6940} {"train_loss": -27.583484649658203, "global_step": 576022, "epoch": 6940} {"train_loss": -27.768177032470703, "global_step": 576023, "epoch": 6940} {"train_loss": -27.807632446289062, "global_step": 576024, "epoch": 6940} {"train_loss": -27.792875289916992, "global_step": 576025, "epoch": 6940} {"train_loss": -27.760700225830078, "global_step": 576026, "epoch": 6940} {"train_loss": -27.587060928344727, "global_step": 576027, "epoch": 6940} {"train_loss": -27.809762954711914, "global_step": 576028, "epoch": 6940} {"train_loss": -28.0362491607666, "global_step": 576029, "epoch": 6940} {"train_loss": -27.914915084838867, "global_step": 576030, "epoch": 6940} {"train_loss": -27.4426212310791, "global_step": 576031, "epoch": 6940} {"train_loss": -27.570947647094727, "global_step": 576032, "epoch": 6940} {"train_loss": -27.47284507751465, "global_step": 576033, "epoch": 6940} {"train_loss": -27.843170166015625, "global_step": 576034, "epoch": 6940} {"train_loss": -27.96087646484375, "global_step": 576035, "epoch": 6940} {"train_loss": -27.7468318939209, "global_step": 576036, "epoch": 6940} {"train_loss": -27.6431827545166, "global_step": 576037, "epoch": 6940} {"train_loss": -27.98103141784668, "global_step": 576038, "epoch": 6940} {"train_loss": -27.75104331970215, "global_step": 576039, "epoch": 6940} {"train_loss": -28.157608032226562, "global_step": 576040, "epoch": 6940} {"train_loss": -27.761091232299805, "global_step": 576041, "epoch": 6940} {"train_loss": -27.73434829711914, "global_step": 576042, "epoch": 6940} {"train_loss": -28.37041664123535, "global_step": 576043, "epoch": 6940} {"train_loss": -28.074777603149414, "global_step": 576044, "epoch": 6940} {"train_loss": -27.698516845703125, "global_step": 576045, "epoch": 6940} {"train_loss": -27.975086212158203, "global_step": 576046, "epoch": 6940} {"train_loss": -27.952146530151367, "global_step": 576047, "epoch": 6940} {"train_loss": -27.914661407470703, "global_step": 576048, "epoch": 6940} {"train_loss": -28.2473201751709, "global_step": 576049, "epoch": 6940} {"train_loss": -28.4416446685791, "global_step": 576050, "epoch": 6940} {"train_loss": -28.353490829467773, "global_step": 576051, "epoch": 6940} {"train_loss": -28.04743003845215, "global_step": 576052, "epoch": 6940} {"train_loss": -27.49915885925293, "global_step": 576053, "epoch": 6940} {"train_loss": -27.885150909423828, "global_step": 576054, "epoch": 6940} {"train_loss": -27.45985984802246, "global_step": 576055, "epoch": 6940} {"train_loss": -27.837615966796875, "global_step": 576056, "epoch": 6940} {"train_loss": -28.036945343017578, "global_step": 576057, "epoch": 6940} {"train_loss": -27.66240882873535, "global_step": 576058, "epoch": 6940} {"train_loss": -27.728225708007812, "global_step": 576059, "epoch": 6940} {"train_loss": -27.903432846069336, "global_step": 576060, "epoch": 6940} {"train_loss": -27.987857818603516, "global_step": 576061, "epoch": 6940} {"train_loss": -28.026330947875977, "global_step": 576062, "epoch": 6940} {"train_loss": -27.815271377563477, "global_step": 576063, "epoch": 6940} {"train_loss": -27.564926147460938, "global_step": 576064, "epoch": 6940} {"train_loss": -27.98028564453125, "global_step": 576065, "epoch": 6940} {"train_loss": -28.076496124267578, "global_step": 576066, "epoch": 6940} {"train_loss": -27.594335556030273, "global_step": 576067, "epoch": 6940} {"train_loss": -27.90256118774414, "global_step": 576068, "epoch": 6940} {"train_loss": -27.732641220092773, "global_step": 576069, "epoch": 6940} {"train_loss": -28.179136276245117, "global_step": 576070, "epoch": 6940} {"train_loss": -27.635364532470703, "global_step": 576071, "epoch": 6940} {"train_loss": -28.059219360351562, "global_step": 576072, "epoch": 6940} {"train_loss": -27.754804611206055, "global_step": 576073, "epoch": 6940} {"train_loss": -27.692920684814453, "global_step": 576074, "epoch": 6940} {"train_loss": -27.943368911743164, "global_step": 576075, "epoch": 6940} {"train_loss": -27.451812744140625, "global_step": 576076, "epoch": 6940} {"train_loss": -27.412885665893555, "global_step": 576077, "epoch": 6940} {"train_loss": -27.784503936767578, "global_step": 576078, "epoch": 6940} {"train_loss": -27.644556045532227, "global_step": 576079, "epoch": 6940} {"train_loss": -27.123029708862305, "global_step": 576080, "epoch": 6940} {"train_loss": -27.416833877563477, "global_step": 576081, "epoch": 6940} {"train_loss": -27.355838775634766, "global_step": 576082, "epoch": 6940} {"train_loss": -27.1844425201416, "global_step": 576083, "epoch": 6940} {"train_loss": -27.41790199279785, "global_step": 576084, "epoch": 6940} {"train_loss": -27.86933708190918, "global_step": 576085, "epoch": 6940} {"train_loss": -26.995512008666992, "global_step": 576086, "epoch": 6940} {"train_loss": -27.610748291015625, "global_step": 576087, "epoch": 6940} {"train_loss": -27.333240509033203, "global_step": 576088, "epoch": 6940} {"train_loss": -27.44523048400879, "global_step": 576089, "epoch": 6940} {"train_loss": -27.37344741821289, "global_step": 576090, "epoch": 6940} {"train_loss": -27.531784057617188, "global_step": 576091, "epoch": 6940} {"train_loss": -27.533252716064453, "global_step": 576092, "epoch": 6940} {"train_loss": -27.5974063873291, "global_step": 576093, "epoch": 6940} {"train_loss": -27.45952796936035, "global_step": 576094, "epoch": 6940} {"train_loss": -27.82111167907715, "global_step": 576095, "epoch": 6940} {"train_loss": -27.814279556274414, "global_step": 576096, "epoch": 6940} {"train_loss": -27.5689697265625, "global_step": 576097, "epoch": 6940} {"train_loss": -27.821231842041016, "global_step": 576098, "epoch": 6940} {"train_loss": -27.584653854370117, "global_step": 576099, "epoch": 6940} {"train_loss": -27.35975456237793, "global_step": 576100, "epoch": 6940} {"train_loss": -27.87562370300293, "global_step": 576101, "epoch": 6940} {"train_loss": -27.74148499822042, "global_step": 576102, "epoch": 6940, "val_loss": 6474549.0} {"train_loss": -27.21738624572754, "global_step": 576103, "epoch": 6941} {"train_loss": -27.237531661987305, "global_step": 576104, "epoch": 6941} {"train_loss": -27.83628273010254, "global_step": 576105, "epoch": 6941} {"train_loss": -27.025781631469727, "global_step": 576106, "epoch": 6941} {"train_loss": -27.460256576538086, "global_step": 576107, "epoch": 6941} {"train_loss": -27.496103286743164, "global_step": 576108, "epoch": 6941} {"train_loss": -27.2844295501709, "global_step": 576109, "epoch": 6941} {"train_loss": -27.266157150268555, "global_step": 576110, "epoch": 6941} {"train_loss": -27.2109375, "global_step": 576111, "epoch": 6941} {"train_loss": -27.531600952148438, "global_step": 576112, "epoch": 6941} {"train_loss": -27.697513580322266, "global_step": 576113, "epoch": 6941} {"train_loss": -27.497785568237305, "global_step": 576114, "epoch": 6941} {"train_loss": -27.036209106445312, "global_step": 576115, "epoch": 6941} {"train_loss": -27.874298095703125, "global_step": 576116, "epoch": 6941} {"train_loss": -27.967437744140625, "global_step": 576117, "epoch": 6941} {"train_loss": -27.688648223876953, "global_step": 576118, "epoch": 6941} {"train_loss": -27.916351318359375, "global_step": 576119, "epoch": 6941} {"train_loss": -27.84761619567871, "global_step": 576120, "epoch": 6941} {"train_loss": -27.748310089111328, "global_step": 576121, "epoch": 6941} {"train_loss": -27.89449119567871, "global_step": 576122, "epoch": 6941} {"train_loss": -28.021503448486328, "global_step": 576123, "epoch": 6941} {"train_loss": -27.698654174804688, "global_step": 576124, "epoch": 6941} {"train_loss": -28.084060668945312, "global_step": 576125, "epoch": 6941} {"train_loss": -28.09522819519043, "global_step": 576126, "epoch": 6941} {"train_loss": -28.052793502807617, "global_step": 576127, "epoch": 6941} {"train_loss": -27.540283203125, "global_step": 576128, "epoch": 6941} {"train_loss": -27.976301193237305, "global_step": 576129, "epoch": 6941} {"train_loss": -27.857786178588867, "global_step": 576130, "epoch": 6941} {"train_loss": -27.781423568725586, "global_step": 576131, "epoch": 6941} {"train_loss": -27.62745475769043, "global_step": 576132, "epoch": 6941} {"train_loss": -27.8953800201416, "global_step": 576133, "epoch": 6941} {"train_loss": -27.72963523864746, "global_step": 576134, "epoch": 6941} {"train_loss": -27.939624786376953, "global_step": 576135, "epoch": 6941} {"train_loss": -28.115833282470703, "global_step": 576136, "epoch": 6941} {"train_loss": -27.66849708557129, "global_step": 576137, "epoch": 6941} {"train_loss": -28.044845581054688, "global_step": 576138, "epoch": 6941} {"train_loss": -27.882373809814453, "global_step": 576139, "epoch": 6941} {"train_loss": -27.44927406311035, "global_step": 576140, "epoch": 6941} {"train_loss": -27.74444580078125, "global_step": 576141, "epoch": 6941} {"train_loss": -27.771093368530273, "global_step": 576142, "epoch": 6941} {"train_loss": -27.644271850585938, "global_step": 576143, "epoch": 6941} {"train_loss": -27.6230411529541, "global_step": 576144, "epoch": 6941} {"train_loss": -27.71024513244629, "global_step": 576145, "epoch": 6941} {"train_loss": -27.533828735351562, "global_step": 576146, "epoch": 6941} {"train_loss": -27.79426383972168, "global_step": 576147, "epoch": 6941} {"train_loss": -27.761383056640625, "global_step": 576148, "epoch": 6941} {"train_loss": -27.96563148498535, "global_step": 576149, "epoch": 6941} {"train_loss": -27.3750057220459, "global_step": 576150, "epoch": 6941} {"train_loss": -27.67862892150879, "global_step": 576151, "epoch": 6941} {"train_loss": -27.21677017211914, "global_step": 576152, "epoch": 6941} {"train_loss": -27.905935287475586, "global_step": 576153, "epoch": 6941} {"train_loss": -27.814910888671875, "global_step": 576154, "epoch": 6941} {"train_loss": -27.432661056518555, "global_step": 576155, "epoch": 6941} {"train_loss": -28.255109786987305, "global_step": 576156, "epoch": 6941} {"train_loss": -27.468219757080078, "global_step": 576157, "epoch": 6941} {"train_loss": -27.51803970336914, "global_step": 576158, "epoch": 6941} {"train_loss": -27.74749183654785, "global_step": 576159, "epoch": 6941} {"train_loss": -27.587295532226562, "global_step": 576160, "epoch": 6941} {"train_loss": -27.16888999938965, "global_step": 576161, "epoch": 6941} {"train_loss": -27.762649536132812, "global_step": 576162, "epoch": 6941} {"train_loss": -27.981714248657227, "global_step": 576163, "epoch": 6941} {"train_loss": -27.591272354125977, "global_step": 576164, "epoch": 6941} {"train_loss": -27.811315536499023, "global_step": 576165, "epoch": 6941} {"train_loss": -28.0069637298584, "global_step": 576166, "epoch": 6941} {"train_loss": -27.97748374938965, "global_step": 576167, "epoch": 6941} {"train_loss": -27.806182861328125, "global_step": 576168, "epoch": 6941} {"train_loss": -28.097211837768555, "global_step": 576169, "epoch": 6941} {"train_loss": -27.766584396362305, "global_step": 576170, "epoch": 6941} {"train_loss": -27.79831314086914, "global_step": 576171, "epoch": 6941} {"train_loss": -27.703338623046875, "global_step": 576172, "epoch": 6941} {"train_loss": -27.884180068969727, "global_step": 576173, "epoch": 6941} {"train_loss": -28.29471206665039, "global_step": 576174, "epoch": 6941} {"train_loss": -28.275928497314453, "global_step": 576175, "epoch": 6941} {"train_loss": -27.817350387573242, "global_step": 576176, "epoch": 6941} {"train_loss": -27.87040138244629, "global_step": 576177, "epoch": 6941} {"train_loss": -27.969879150390625, "global_step": 576178, "epoch": 6941} {"train_loss": -28.024917602539062, "global_step": 576179, "epoch": 6941} {"train_loss": -27.981618881225586, "global_step": 576180, "epoch": 6941} {"train_loss": -27.735767364501953, "global_step": 576181, "epoch": 6941} {"train_loss": -27.99017906188965, "global_step": 576182, "epoch": 6941} {"train_loss": -28.098901748657227, "global_step": 576183, "epoch": 6941} {"train_loss": -27.79823875427246, "global_step": 576184, "epoch": 6941} {"train_loss": -27.73136600816106, "global_step": 576185, "epoch": 6941, "val_loss": 6593319.0} {"train_loss": -26.799819946289062, "global_step": 576186, "epoch": 6942} {"train_loss": -26.433975219726562, "global_step": 576187, "epoch": 6942} {"train_loss": -26.977039337158203, "global_step": 576188, "epoch": 6942} {"train_loss": -27.172550201416016, "global_step": 576189, "epoch": 6942} {"train_loss": -26.4097957611084, "global_step": 576190, "epoch": 6942} {"train_loss": -27.29998207092285, "global_step": 576191, "epoch": 6942} {"train_loss": -27.122278213500977, "global_step": 576192, "epoch": 6942} {"train_loss": -27.5581111907959, "global_step": 576193, "epoch": 6942} {"train_loss": -26.808212280273438, "global_step": 576194, "epoch": 6942} {"train_loss": -27.161840438842773, "global_step": 576195, "epoch": 6942} {"train_loss": -27.436758041381836, "global_step": 576196, "epoch": 6942} {"train_loss": -27.420984268188477, "global_step": 576197, "epoch": 6942} {"train_loss": -27.439855575561523, "global_step": 576198, "epoch": 6942} {"train_loss": -27.41876792907715, "global_step": 576199, "epoch": 6942} {"train_loss": -27.289886474609375, "global_step": 576200, "epoch": 6942} {"train_loss": -27.066781997680664, "global_step": 576201, "epoch": 6942} {"train_loss": -27.430587768554688, "global_step": 576202, "epoch": 6942} {"train_loss": -27.478683471679688, "global_step": 576203, "epoch": 6942} {"train_loss": -27.704065322875977, "global_step": 576204, "epoch": 6942} {"train_loss": -27.826690673828125, "global_step": 576205, "epoch": 6942} {"train_loss": -27.259815216064453, "global_step": 576206, "epoch": 6942} {"train_loss": -27.70999526977539, "global_step": 576207, "epoch": 6942} {"train_loss": -27.99959373474121, "global_step": 576208, "epoch": 6942} {"train_loss": -27.650854110717773, "global_step": 576209, "epoch": 6942} {"train_loss": -27.463886260986328, "global_step": 576210, "epoch": 6942} {"train_loss": -27.59217643737793, "global_step": 576211, "epoch": 6942} {"train_loss": -27.34138298034668, "global_step": 576212, "epoch": 6942} {"train_loss": -27.62762451171875, "global_step": 576213, "epoch": 6942} {"train_loss": -27.787567138671875, "global_step": 576214, "epoch": 6942} {"train_loss": -27.928857803344727, "global_step": 576215, "epoch": 6942} {"train_loss": -27.994375228881836, "global_step": 576216, "epoch": 6942} {"train_loss": -27.85798454284668, "global_step": 576217, "epoch": 6942} {"train_loss": -27.792627334594727, "global_step": 576218, "epoch": 6942} {"train_loss": -27.780170440673828, "global_step": 576219, "epoch": 6942} {"train_loss": -27.842687606811523, "global_step": 576220, "epoch": 6942} {"train_loss": -27.75831413269043, "global_step": 576221, "epoch": 6942} {"train_loss": -28.228673934936523, "global_step": 576222, "epoch": 6942} {"train_loss": -28.04450798034668, "global_step": 576223, "epoch": 6942} {"train_loss": -27.697635650634766, "global_step": 576224, "epoch": 6942} {"train_loss": -27.593351364135742, "global_step": 576225, "epoch": 6942} {"train_loss": -27.796878814697266, "global_step": 576226, "epoch": 6942} {"train_loss": -27.919097900390625, "global_step": 576227, "epoch": 6942} {"train_loss": -28.182531356811523, "global_step": 576228, "epoch": 6942} {"train_loss": -27.96393394470215, "global_step": 576229, "epoch": 6942} {"train_loss": -27.896081924438477, "global_step": 576230, "epoch": 6942} {"train_loss": -27.95966148376465, "global_step": 576231, "epoch": 6942} {"train_loss": -27.77532386779785, "global_step": 576232, "epoch": 6942} {"train_loss": -28.363239288330078, "global_step": 576233, "epoch": 6942} {"train_loss": -28.140111923217773, "global_step": 576234, "epoch": 6942} {"train_loss": -27.880863189697266, "global_step": 576235, "epoch": 6942} {"train_loss": -28.104263305664062, "global_step": 576236, "epoch": 6942} {"train_loss": -27.858762741088867, "global_step": 576237, "epoch": 6942} {"train_loss": -28.231786727905273, "global_step": 576238, "epoch": 6942} {"train_loss": -27.979379653930664, "global_step": 576239, "epoch": 6942} {"train_loss": -28.249908447265625, "global_step": 576240, "epoch": 6942} {"train_loss": -27.756067276000977, "global_step": 576241, "epoch": 6942} {"train_loss": -27.84235954284668, "global_step": 576242, "epoch": 6942} {"train_loss": -27.63306999206543, "global_step": 576243, "epoch": 6942} {"train_loss": -27.219409942626953, "global_step": 576244, "epoch": 6942} {"train_loss": -26.619831085205078, "global_step": 576245, "epoch": 6942} {"train_loss": -26.92058753967285, "global_step": 576246, "epoch": 6942} {"train_loss": -27.519495010375977, "global_step": 576247, "epoch": 6942} {"train_loss": -27.535816192626953, "global_step": 576248, "epoch": 6942} {"train_loss": -27.01595115661621, "global_step": 576249, "epoch": 6942} {"train_loss": -27.16440200805664, "global_step": 576250, "epoch": 6942} {"train_loss": -27.156885147094727, "global_step": 576251, "epoch": 6942} {"train_loss": -27.692712783813477, "global_step": 576252, "epoch": 6942} {"train_loss": -27.524566650390625, "global_step": 576253, "epoch": 6942} {"train_loss": -27.282567977905273, "global_step": 576254, "epoch": 6942} {"train_loss": -27.840198516845703, "global_step": 576255, "epoch": 6942} {"train_loss": -27.35909080505371, "global_step": 576256, "epoch": 6942} {"train_loss": -27.990177154541016, "global_step": 576257, "epoch": 6942} {"train_loss": -27.77589225769043, "global_step": 576258, "epoch": 6942} {"train_loss": -27.469879150390625, "global_step": 576259, "epoch": 6942} {"train_loss": -28.022680282592773, "global_step": 576260, "epoch": 6942} {"train_loss": -27.993085861206055, "global_step": 576261, "epoch": 6942} {"train_loss": -28.200214385986328, "global_step": 576262, "epoch": 6942} {"train_loss": -28.10031509399414, "global_step": 576263, "epoch": 6942} {"train_loss": -27.58347511291504, "global_step": 576264, "epoch": 6942} {"train_loss": -27.556949615478516, "global_step": 576265, "epoch": 6942} {"train_loss": -27.94671630859375, "global_step": 576266, "epoch": 6942} {"train_loss": -27.631549835205078, "global_step": 576267, "epoch": 6942} {"train_loss": -27.610083913228596, "global_step": 576268, "epoch": 6942, "val_loss": 6519181.0} {"train_loss": -26.694990158081055, "global_step": 576269, "epoch": 6943} {"train_loss": -27.50738525390625, "global_step": 576270, "epoch": 6943} {"train_loss": -27.30849266052246, "global_step": 576271, "epoch": 6943} {"train_loss": -26.67999839782715, "global_step": 576272, "epoch": 6943} {"train_loss": -26.375341415405273, "global_step": 576273, "epoch": 6943} {"train_loss": -27.078107833862305, "global_step": 576274, "epoch": 6943} {"train_loss": -26.5137939453125, "global_step": 576275, "epoch": 6943} {"train_loss": -27.291305541992188, "global_step": 576276, "epoch": 6943} {"train_loss": -27.1912784576416, "global_step": 576277, "epoch": 6943} {"train_loss": -27.162342071533203, "global_step": 576278, "epoch": 6943} {"train_loss": -27.414533615112305, "global_step": 576279, "epoch": 6943} {"train_loss": -26.879980087280273, "global_step": 576280, "epoch": 6943} {"train_loss": -27.363767623901367, "global_step": 576281, "epoch": 6943} {"train_loss": -27.068647384643555, "global_step": 576282, "epoch": 6943} {"train_loss": -27.726720809936523, "global_step": 576283, "epoch": 6943} {"train_loss": -27.50404167175293, "global_step": 576284, "epoch": 6943} {"train_loss": -27.61968421936035, "global_step": 576285, "epoch": 6943} {"train_loss": -27.751733779907227, "global_step": 576286, "epoch": 6943} {"train_loss": -27.824735641479492, "global_step": 576287, "epoch": 6943} {"train_loss": -27.7658748626709, "global_step": 576288, "epoch": 6943} {"train_loss": -27.74298667907715, "global_step": 576289, "epoch": 6943} {"train_loss": -27.75567054748535, "global_step": 576290, "epoch": 6943} {"train_loss": -27.845691680908203, "global_step": 576291, "epoch": 6943} {"train_loss": -27.625537872314453, "global_step": 576292, "epoch": 6943} {"train_loss": -27.61481285095215, "global_step": 576293, "epoch": 6943} {"train_loss": -27.786848068237305, "global_step": 576294, "epoch": 6943} {"train_loss": -27.884994506835938, "global_step": 576295, "epoch": 6943} {"train_loss": -27.5950927734375, "global_step": 576296, "epoch": 6943} {"train_loss": -27.776288986206055, "global_step": 576297, "epoch": 6943} {"train_loss": -27.5031681060791, "global_step": 576298, "epoch": 6943} {"train_loss": -27.683744430541992, "global_step": 576299, "epoch": 6943} {"train_loss": -27.92708396911621, "global_step": 576300, "epoch": 6943} {"train_loss": -28.03375244140625, "global_step": 576301, "epoch": 6943} {"train_loss": -27.84889030456543, "global_step": 576302, "epoch": 6943} {"train_loss": -27.82630729675293, "global_step": 576303, "epoch": 6943} {"train_loss": -27.4990234375, "global_step": 576304, "epoch": 6943} {"train_loss": -28.16505241394043, "global_step": 576305, "epoch": 6943} {"train_loss": -27.7761173248291, "global_step": 576306, "epoch": 6943} {"train_loss": -28.2752742767334, "global_step": 576307, "epoch": 6943} {"train_loss": -27.71843910217285, "global_step": 576308, "epoch": 6943} {"train_loss": -27.83951759338379, "global_step": 576309, "epoch": 6943} {"train_loss": -27.630353927612305, "global_step": 576310, "epoch": 6943} {"train_loss": -27.409107208251953, "global_step": 576311, "epoch": 6943} {"train_loss": -28.115446090698242, "global_step": 576312, "epoch": 6943} {"train_loss": -27.861295700073242, "global_step": 576313, "epoch": 6943} {"train_loss": -28.16375160217285, "global_step": 576314, "epoch": 6943} {"train_loss": -27.81109619140625, "global_step": 576315, "epoch": 6943} {"train_loss": -28.623188018798828, "global_step": 576316, "epoch": 6943} {"train_loss": -27.9845027923584, "global_step": 576317, "epoch": 6943} {"train_loss": -28.31647300720215, "global_step": 576318, "epoch": 6943} {"train_loss": -27.956571578979492, "global_step": 576319, "epoch": 6943} {"train_loss": -28.009296417236328, "global_step": 576320, "epoch": 6943} {"train_loss": -28.058374404907227, "global_step": 576321, "epoch": 6943} {"train_loss": -28.33498191833496, "global_step": 576322, "epoch": 6943} {"train_loss": -28.0747013092041, "global_step": 576323, "epoch": 6943} {"train_loss": -27.996124267578125, "global_step": 576324, "epoch": 6943} {"train_loss": -27.817859649658203, "global_step": 576325, "epoch": 6943} {"train_loss": -27.907846450805664, "global_step": 576326, "epoch": 6943} {"train_loss": -28.517484664916992, "global_step": 576327, "epoch": 6943} {"train_loss": -28.504749298095703, "global_step": 576328, "epoch": 6943} {"train_loss": -28.207300186157227, "global_step": 576329, "epoch": 6943} {"train_loss": -27.978857040405273, "global_step": 576330, "epoch": 6943} {"train_loss": -27.962417602539062, "global_step": 576331, "epoch": 6943} {"train_loss": -28.011335372924805, "global_step": 576332, "epoch": 6943} {"train_loss": -28.152692794799805, "global_step": 576333, "epoch": 6943} {"train_loss": -27.946598052978516, "global_step": 576334, "epoch": 6943} {"train_loss": -27.893354415893555, "global_step": 576335, "epoch": 6943} {"train_loss": -27.83935546875, "global_step": 576336, "epoch": 6943} {"train_loss": -27.294340133666992, "global_step": 576337, "epoch": 6943} {"train_loss": -27.396549224853516, "global_step": 576338, "epoch": 6943} {"train_loss": -28.03171157836914, "global_step": 576339, "epoch": 6943} {"train_loss": -28.374114990234375, "global_step": 576340, "epoch": 6943} {"train_loss": -27.698719024658203, "global_step": 576341, "epoch": 6943} {"train_loss": -27.5554256439209, "global_step": 576342, "epoch": 6943} {"train_loss": -27.688129425048828, "global_step": 576343, "epoch": 6943} {"train_loss": -27.106164932250977, "global_step": 576344, "epoch": 6943} {"train_loss": -27.228307723999023, "global_step": 576345, "epoch": 6943} {"train_loss": -26.66485595703125, "global_step": 576346, "epoch": 6943} {"train_loss": -26.576461791992188, "global_step": 576347, "epoch": 6943} {"train_loss": -27.643232345581055, "global_step": 576348, "epoch": 6943} {"train_loss": -27.751739501953125, "global_step": 576349, "epoch": 6943} {"train_loss": -27.410659790039062, "global_step": 576350, "epoch": 6943} {"train_loss": -27.69241422630218, "global_step": 576351, "epoch": 6943, "val_loss": 6561101.0} {"train_loss": -26.620502471923828, "global_step": 576352, "epoch": 6944} {"train_loss": -25.970947265625, "global_step": 576353, "epoch": 6944} {"train_loss": -26.098098754882812, "global_step": 576354, "epoch": 6944} {"train_loss": -26.312580108642578, "global_step": 576355, "epoch": 6944} {"train_loss": -26.4625186920166, "global_step": 576356, "epoch": 6944} {"train_loss": -25.657812118530273, "global_step": 576357, "epoch": 6944} {"train_loss": -27.149137496948242, "global_step": 576358, "epoch": 6944} {"train_loss": -26.396076202392578, "global_step": 576359, "epoch": 6944} {"train_loss": -27.25873374938965, "global_step": 576360, "epoch": 6944} {"train_loss": -27.040403366088867, "global_step": 576361, "epoch": 6944} {"train_loss": -27.22529411315918, "global_step": 576362, "epoch": 6944} {"train_loss": -26.993976593017578, "global_step": 576363, "epoch": 6944} {"train_loss": -26.822656631469727, "global_step": 576364, "epoch": 6944} {"train_loss": -26.859460830688477, "global_step": 576365, "epoch": 6944} {"train_loss": -27.069061279296875, "global_step": 576366, "epoch": 6944} {"train_loss": -26.751495361328125, "global_step": 576367, "epoch": 6944} {"train_loss": -26.616382598876953, "global_step": 576368, "epoch": 6944} {"train_loss": -27.150836944580078, "global_step": 576369, "epoch": 6944} {"train_loss": -27.2652645111084, "global_step": 576370, "epoch": 6944} {"train_loss": -27.264301300048828, "global_step": 576371, "epoch": 6944} {"train_loss": -27.26373863220215, "global_step": 576372, "epoch": 6944} {"train_loss": -27.01141929626465, "global_step": 576373, "epoch": 6944} {"train_loss": -27.135984420776367, "global_step": 576374, "epoch": 6944} {"train_loss": -27.304859161376953, "global_step": 576375, "epoch": 6944} {"train_loss": -27.610193252563477, "global_step": 576376, "epoch": 6944} {"train_loss": -27.448627471923828, "global_step": 576377, "epoch": 6944} {"train_loss": -27.459381103515625, "global_step": 576378, "epoch": 6944} {"train_loss": -27.424457550048828, "global_step": 576379, "epoch": 6944} {"train_loss": -27.38144302368164, "global_step": 576380, "epoch": 6944} {"train_loss": -27.678266525268555, "global_step": 576381, "epoch": 6944} {"train_loss": -27.69287109375, "global_step": 576382, "epoch": 6944} {"train_loss": -27.75245475769043, "global_step": 576383, "epoch": 6944} {"train_loss": -27.388748168945312, "global_step": 576384, "epoch": 6944} {"train_loss": -27.47649574279785, "global_step": 576385, "epoch": 6944} {"train_loss": -27.825458526611328, "global_step": 576386, "epoch": 6944} {"train_loss": -27.9205322265625, "global_step": 576387, "epoch": 6944} {"train_loss": -27.796741485595703, "global_step": 576388, "epoch": 6944} {"train_loss": -27.922266006469727, "global_step": 576389, "epoch": 6944} {"train_loss": -27.817596435546875, "global_step": 576390, "epoch": 6944} {"train_loss": -27.68427848815918, "global_step": 576391, "epoch": 6944} {"train_loss": -28.117223739624023, "global_step": 576392, "epoch": 6944} {"train_loss": -28.144025802612305, "global_step": 576393, "epoch": 6944} {"train_loss": -27.893762588500977, "global_step": 576394, "epoch": 6944} {"train_loss": -28.193029403686523, "global_step": 576395, "epoch": 6944} {"train_loss": -27.968061447143555, "global_step": 576396, "epoch": 6944} {"train_loss": -27.93145751953125, "global_step": 576397, "epoch": 6944} {"train_loss": -27.92948341369629, "global_step": 576398, "epoch": 6944} {"train_loss": -27.974262237548828, "global_step": 576399, "epoch": 6944} {"train_loss": -27.627033233642578, "global_step": 576400, "epoch": 6944} {"train_loss": -28.011001586914062, "global_step": 576401, "epoch": 6944} {"train_loss": -27.535480499267578, "global_step": 576402, "epoch": 6944} {"train_loss": -27.902318954467773, "global_step": 576403, "epoch": 6944} {"train_loss": -27.986099243164062, "global_step": 576404, "epoch": 6944} {"train_loss": -27.89851188659668, "global_step": 576405, "epoch": 6944} {"train_loss": -27.911314010620117, "global_step": 576406, "epoch": 6944} {"train_loss": -27.94610023498535, "global_step": 576407, "epoch": 6944} {"train_loss": -27.932538986206055, "global_step": 576408, "epoch": 6944} {"train_loss": -27.8261661529541, "global_step": 576409, "epoch": 6944} {"train_loss": -27.743871688842773, "global_step": 576410, "epoch": 6944} {"train_loss": -27.710351943969727, "global_step": 576411, "epoch": 6944} {"train_loss": -28.25832176208496, "global_step": 576412, "epoch": 6944} {"train_loss": -28.0454158782959, "global_step": 576413, "epoch": 6944} {"train_loss": -27.245508193969727, "global_step": 576414, "epoch": 6944} {"train_loss": -27.525232315063477, "global_step": 576415, "epoch": 6944} {"train_loss": -27.840375900268555, "global_step": 576416, "epoch": 6944} {"train_loss": -28.334314346313477, "global_step": 576417, "epoch": 6944} {"train_loss": -27.98190689086914, "global_step": 576418, "epoch": 6944} {"train_loss": -27.778562545776367, "global_step": 576419, "epoch": 6944} {"train_loss": -28.297025680541992, "global_step": 576420, "epoch": 6944} {"train_loss": -27.972583770751953, "global_step": 576421, "epoch": 6944} {"train_loss": -28.106870651245117, "global_step": 576422, "epoch": 6944} {"train_loss": -28.088626861572266, "global_step": 576423, "epoch": 6944} {"train_loss": -28.119882583618164, "global_step": 576424, "epoch": 6944} {"train_loss": -28.094165802001953, "global_step": 576425, "epoch": 6944} {"train_loss": -27.57002067565918, "global_step": 576426, "epoch": 6944} {"train_loss": -28.087182998657227, "global_step": 576427, "epoch": 6944} {"train_loss": -27.77093505859375, "global_step": 576428, "epoch": 6944} {"train_loss": -27.832599639892578, "global_step": 576429, "epoch": 6944} {"train_loss": -27.754560470581055, "global_step": 576430, "epoch": 6944} {"train_loss": -27.9327335357666, "global_step": 576431, "epoch": 6944} {"train_loss": -27.977079391479492, "global_step": 576432, "epoch": 6944} {"train_loss": -28.090702056884766, "global_step": 576433, "epoch": 6944} {"train_loss": -27.53861788094762, "global_step": 576434, "epoch": 6944, "val_loss": 6584021.0} {"train_loss": -27.467090606689453, "global_step": 576435, "epoch": 6945} {"train_loss": -26.37354850769043, "global_step": 576436, "epoch": 6945} {"train_loss": -26.826059341430664, "global_step": 576437, "epoch": 6945} {"train_loss": -26.99674415588379, "global_step": 576438, "epoch": 6945} {"train_loss": -27.100955963134766, "global_step": 576439, "epoch": 6945} {"train_loss": -27.1219482421875, "global_step": 576440, "epoch": 6945} {"train_loss": -26.646350860595703, "global_step": 576441, "epoch": 6945} {"train_loss": -27.184812545776367, "global_step": 576442, "epoch": 6945} {"train_loss": -26.89728355407715, "global_step": 576443, "epoch": 6945} {"train_loss": -27.208707809448242, "global_step": 576444, "epoch": 6945} {"train_loss": -26.913976669311523, "global_step": 576445, "epoch": 6945} {"train_loss": -27.091947555541992, "global_step": 576446, "epoch": 6945} {"train_loss": -26.9040584564209, "global_step": 576447, "epoch": 6945} {"train_loss": -27.391584396362305, "global_step": 576448, "epoch": 6945} {"train_loss": -27.351675033569336, "global_step": 576449, "epoch": 6945} {"train_loss": -27.498647689819336, "global_step": 576450, "epoch": 6945} {"train_loss": -27.652524948120117, "global_step": 576451, "epoch": 6945} {"train_loss": -27.953283309936523, "global_step": 576452, "epoch": 6945} {"train_loss": -27.031782150268555, "global_step": 576453, "epoch": 6945} {"train_loss": -27.390731811523438, "global_step": 576454, "epoch": 6945} {"train_loss": -27.367919921875, "global_step": 576455, "epoch": 6945} {"train_loss": -27.642932891845703, "global_step": 576456, "epoch": 6945} {"train_loss": -27.556350708007812, "global_step": 576457, "epoch": 6945} {"train_loss": -27.340063095092773, "global_step": 576458, "epoch": 6945} {"train_loss": -27.489521026611328, "global_step": 576459, "epoch": 6945} {"train_loss": -27.668720245361328, "global_step": 576460, "epoch": 6945} {"train_loss": -27.734180450439453, "global_step": 576461, "epoch": 6945} {"train_loss": -27.564788818359375, "global_step": 576462, "epoch": 6945} {"train_loss": -27.81342887878418, "global_step": 576463, "epoch": 6945} {"train_loss": -27.740375518798828, "global_step": 576464, "epoch": 6945} {"train_loss": -27.748184204101562, "global_step": 576465, "epoch": 6945} {"train_loss": -27.919479370117188, "global_step": 576466, "epoch": 6945} {"train_loss": -28.093679428100586, "global_step": 576467, "epoch": 6945} {"train_loss": -28.02374839782715, "global_step": 576468, "epoch": 6945} {"train_loss": -27.852848052978516, "global_step": 576469, "epoch": 6945} {"train_loss": -27.497159957885742, "global_step": 576470, "epoch": 6945} {"train_loss": -28.268701553344727, "global_step": 576471, "epoch": 6945} {"train_loss": -27.629669189453125, "global_step": 576472, "epoch": 6945} {"train_loss": -27.88525390625, "global_step": 576473, "epoch": 6945} {"train_loss": -28.240869522094727, "global_step": 576474, "epoch": 6945} {"train_loss": -28.010345458984375, "global_step": 576475, "epoch": 6945} {"train_loss": -27.662179946899414, "global_step": 576476, "epoch": 6945} {"train_loss": -28.005329132080078, "global_step": 576477, "epoch": 6945} {"train_loss": -27.85015869140625, "global_step": 576478, "epoch": 6945} {"train_loss": -27.441022872924805, "global_step": 576479, "epoch": 6945} {"train_loss": -27.801054000854492, "global_step": 576480, "epoch": 6945} {"train_loss": -27.865772247314453, "global_step": 576481, "epoch": 6945} {"train_loss": -27.607290267944336, "global_step": 576482, "epoch": 6945} {"train_loss": -27.88814353942871, "global_step": 576483, "epoch": 6945} {"train_loss": -27.863012313842773, "global_step": 576484, "epoch": 6945} {"train_loss": -28.14918327331543, "global_step": 576485, "epoch": 6945} {"train_loss": -28.048364639282227, "global_step": 576486, "epoch": 6945} {"train_loss": -28.317676544189453, "global_step": 576487, "epoch": 6945} {"train_loss": -28.02863883972168, "global_step": 576488, "epoch": 6945} {"train_loss": -28.100446701049805, "global_step": 576489, "epoch": 6945} {"train_loss": -27.69837760925293, "global_step": 576490, "epoch": 6945} {"train_loss": -28.127344131469727, "global_step": 576491, "epoch": 6945} {"train_loss": -28.16513442993164, "global_step": 576492, "epoch": 6945} {"train_loss": -28.0449275970459, "global_step": 576493, "epoch": 6945} {"train_loss": -27.612279891967773, "global_step": 576494, "epoch": 6945} {"train_loss": -27.25166130065918, "global_step": 576495, "epoch": 6945} {"train_loss": -27.8259334564209, "global_step": 576496, "epoch": 6945} {"train_loss": -28.073339462280273, "global_step": 576497, "epoch": 6945} {"train_loss": -27.446369171142578, "global_step": 576498, "epoch": 6945} {"train_loss": -27.718835830688477, "global_step": 576499, "epoch": 6945} {"train_loss": -27.74639892578125, "global_step": 576500, "epoch": 6945} {"train_loss": -28.040882110595703, "global_step": 576501, "epoch": 6945} {"train_loss": -27.793598175048828, "global_step": 576502, "epoch": 6945} {"train_loss": -28.12774085998535, "global_step": 576503, "epoch": 6945} {"train_loss": -27.772546768188477, "global_step": 576504, "epoch": 6945} {"train_loss": -27.689573287963867, "global_step": 576505, "epoch": 6945} {"train_loss": -28.222503662109375, "global_step": 576506, "epoch": 6945} {"train_loss": -27.961828231811523, "global_step": 576507, "epoch": 6945} {"train_loss": -27.907201766967773, "global_step": 576508, "epoch": 6945} {"train_loss": -27.460464477539062, "global_step": 576509, "epoch": 6945} {"train_loss": -27.671796798706055, "global_step": 576510, "epoch": 6945} {"train_loss": -28.07636833190918, "global_step": 576511, "epoch": 6945} {"train_loss": -27.929569244384766, "global_step": 576512, "epoch": 6945} {"train_loss": -27.714208602905273, "global_step": 576513, "epoch": 6945} {"train_loss": -27.889495849609375, "global_step": 576514, "epoch": 6945} {"train_loss": -27.888416290283203, "global_step": 576515, "epoch": 6945} {"train_loss": -28.006017684936523, "global_step": 576516, "epoch": 6945} {"train_loss": -27.67961134393531, "global_step": 576517, "epoch": 6945, "val_loss": 6656426.0} {"train_loss": -27.653745651245117, "global_step": 576518, "epoch": 6946} {"train_loss": -27.145971298217773, "global_step": 576519, "epoch": 6946} {"train_loss": -27.902069091796875, "global_step": 576520, "epoch": 6946} {"train_loss": -26.827640533447266, "global_step": 576521, "epoch": 6946} {"train_loss": -27.058612823486328, "global_step": 576522, "epoch": 6946} {"train_loss": -27.4658145904541, "global_step": 576523, "epoch": 6946} {"train_loss": -28.007675170898438, "global_step": 576524, "epoch": 6946} {"train_loss": -27.922998428344727, "global_step": 576525, "epoch": 6946} {"train_loss": -27.569671630859375, "global_step": 576526, "epoch": 6946} {"train_loss": -27.28059196472168, "global_step": 576527, "epoch": 6946} {"train_loss": -27.692441940307617, "global_step": 576528, "epoch": 6946} {"train_loss": -27.510330200195312, "global_step": 576529, "epoch": 6946} {"train_loss": -27.28728675842285, "global_step": 576530, "epoch": 6946} {"train_loss": -27.438268661499023, "global_step": 576531, "epoch": 6946} {"train_loss": -27.581268310546875, "global_step": 576532, "epoch": 6946} {"train_loss": -27.64947509765625, "global_step": 576533, "epoch": 6946} {"train_loss": -27.82090187072754, "global_step": 576534, "epoch": 6946} {"train_loss": -27.605371475219727, "global_step": 576535, "epoch": 6946} {"train_loss": -27.430469512939453, "global_step": 576536, "epoch": 6946} {"train_loss": -27.860990524291992, "global_step": 576537, "epoch": 6946} {"train_loss": -27.782270431518555, "global_step": 576538, "epoch": 6946} {"train_loss": -27.821863174438477, "global_step": 576539, "epoch": 6946} {"train_loss": -27.753515243530273, "global_step": 576540, "epoch": 6946} {"train_loss": -27.810256958007812, "global_step": 576541, "epoch": 6946} {"train_loss": -27.647485733032227, "global_step": 576542, "epoch": 6946} {"train_loss": -27.673730850219727, "global_step": 576543, "epoch": 6946} {"train_loss": -27.950092315673828, "global_step": 576544, "epoch": 6946} {"train_loss": -27.91082191467285, "global_step": 576545, "epoch": 6946} {"train_loss": -27.49883460998535, "global_step": 576546, "epoch": 6946} {"train_loss": -27.7956485748291, "global_step": 576547, "epoch": 6946} {"train_loss": -27.617109298706055, "global_step": 576548, "epoch": 6946} {"train_loss": -27.798526763916016, "global_step": 576549, "epoch": 6946} {"train_loss": -27.882694244384766, "global_step": 576550, "epoch": 6946} {"train_loss": -27.94501304626465, "global_step": 576551, "epoch": 6946} {"train_loss": -27.753515243530273, "global_step": 576552, "epoch": 6946} {"train_loss": -27.490753173828125, "global_step": 576553, "epoch": 6946} {"train_loss": -27.641141891479492, "global_step": 576554, "epoch": 6946} {"train_loss": -27.424182891845703, "global_step": 576555, "epoch": 6946} {"train_loss": -27.508283615112305, "global_step": 576556, "epoch": 6946} {"train_loss": -27.730695724487305, "global_step": 576557, "epoch": 6946} {"train_loss": -27.8691349029541, "global_step": 576558, "epoch": 6946} {"train_loss": -27.661787033081055, "global_step": 576559, "epoch": 6946} {"train_loss": -27.45245933532715, "global_step": 576560, "epoch": 6946} {"train_loss": -27.841419219970703, "global_step": 576561, "epoch": 6946} {"train_loss": -27.878332138061523, "global_step": 576562, "epoch": 6946} {"train_loss": -27.97480583190918, "global_step": 576563, "epoch": 6946} {"train_loss": -28.14801597595215, "global_step": 576564, "epoch": 6946} {"train_loss": -27.90021324157715, "global_step": 576565, "epoch": 6946} {"train_loss": -28.001901626586914, "global_step": 576566, "epoch": 6946} {"train_loss": -28.008468627929688, "global_step": 576567, "epoch": 6946} {"train_loss": -27.8029842376709, "global_step": 576568, "epoch": 6946} {"train_loss": -27.7737979888916, "global_step": 576569, "epoch": 6946} {"train_loss": -28.01297378540039, "global_step": 576570, "epoch": 6946} {"train_loss": -27.797821044921875, "global_step": 576571, "epoch": 6946} {"train_loss": -28.055593490600586, "global_step": 576572, "epoch": 6946} {"train_loss": -28.347064971923828, "global_step": 576573, "epoch": 6946} {"train_loss": -27.938034057617188, "global_step": 576574, "epoch": 6946} {"train_loss": -28.11957359313965, "global_step": 576575, "epoch": 6946} {"train_loss": -27.717721939086914, "global_step": 576576, "epoch": 6946} {"train_loss": -28.3077392578125, "global_step": 576577, "epoch": 6946} {"train_loss": -27.97223472595215, "global_step": 576578, "epoch": 6946} {"train_loss": -27.833404541015625, "global_step": 576579, "epoch": 6946} {"train_loss": -27.95944595336914, "global_step": 576580, "epoch": 6946} {"train_loss": -27.974157333374023, "global_step": 576581, "epoch": 6946} {"train_loss": -27.831022262573242, "global_step": 576582, "epoch": 6946} {"train_loss": -27.639169692993164, "global_step": 576583, "epoch": 6946} {"train_loss": -27.52583885192871, "global_step": 576584, "epoch": 6946} {"train_loss": -28.007251739501953, "global_step": 576585, "epoch": 6946} {"train_loss": -27.735334396362305, "global_step": 576586, "epoch": 6946} {"train_loss": -27.299100875854492, "global_step": 576587, "epoch": 6946} {"train_loss": -27.624387741088867, "global_step": 576588, "epoch": 6946} {"train_loss": -27.187808990478516, "global_step": 576589, "epoch": 6946} {"train_loss": -28.152191162109375, "global_step": 576590, "epoch": 6946} {"train_loss": -27.788516998291016, "global_step": 576591, "epoch": 6946} {"train_loss": -28.08345603942871, "global_step": 576592, "epoch": 6946} {"train_loss": -28.022003173828125, "global_step": 576593, "epoch": 6946} {"train_loss": -27.812488555908203, "global_step": 576594, "epoch": 6946} {"train_loss": -28.118289947509766, "global_step": 576595, "epoch": 6946} {"train_loss": -28.007028579711914, "global_step": 576596, "epoch": 6946} {"train_loss": -27.999679565429688, "global_step": 576597, "epoch": 6946} {"train_loss": -28.24903678894043, "global_step": 576598, "epoch": 6946} {"train_loss": -28.1506290435791, "global_step": 576599, "epoch": 6946} {"train_loss": -27.76299892563418, "global_step": 576600, "epoch": 6946, "val_loss": 6594215.0} {"train_loss": -27.059934616088867, "global_step": 576601, "epoch": 6947} {"train_loss": -27.18433952331543, "global_step": 576602, "epoch": 6947} {"train_loss": -27.493518829345703, "global_step": 576603, "epoch": 6947} {"train_loss": -27.38132667541504, "global_step": 576604, "epoch": 6947} {"train_loss": -27.28609275817871, "global_step": 576605, "epoch": 6947} {"train_loss": -26.86933708190918, "global_step": 576606, "epoch": 6947} {"train_loss": -27.914731979370117, "global_step": 576607, "epoch": 6947} {"train_loss": -27.733564376831055, "global_step": 576608, "epoch": 6947} {"train_loss": -27.654911041259766, "global_step": 576609, "epoch": 6947} {"train_loss": -27.36456871032715, "global_step": 576610, "epoch": 6947} {"train_loss": -27.30645751953125, "global_step": 576611, "epoch": 6947} {"train_loss": -27.496246337890625, "global_step": 576612, "epoch": 6947} {"train_loss": -27.6391658782959, "global_step": 576613, "epoch": 6947} {"train_loss": -27.697614669799805, "global_step": 576614, "epoch": 6947} {"train_loss": -28.015466690063477, "global_step": 576615, "epoch": 6947} {"train_loss": -27.599897384643555, "global_step": 576616, "epoch": 6947} {"train_loss": -27.271398544311523, "global_step": 576617, "epoch": 6947} {"train_loss": -27.81431007385254, "global_step": 576618, "epoch": 6947} {"train_loss": -26.86865234375, "global_step": 576619, "epoch": 6947} {"train_loss": -27.327184677124023, "global_step": 576620, "epoch": 6947} {"train_loss": -27.399030685424805, "global_step": 576621, "epoch": 6947} {"train_loss": -27.7019100189209, "global_step": 576622, "epoch": 6947} {"train_loss": -27.370542526245117, "global_step": 576623, "epoch": 6947} {"train_loss": -27.845443725585938, "global_step": 576624, "epoch": 6947} {"train_loss": -27.824888229370117, "global_step": 576625, "epoch": 6947} {"train_loss": -27.517194747924805, "global_step": 576626, "epoch": 6947} {"train_loss": -27.72303581237793, "global_step": 576627, "epoch": 6947} {"train_loss": -27.897031784057617, "global_step": 576628, "epoch": 6947} {"train_loss": -27.9490909576416, "global_step": 576629, "epoch": 6947} {"train_loss": -27.7027530670166, "global_step": 576630, "epoch": 6947} {"train_loss": -27.8568172454834, "global_step": 576631, "epoch": 6947} {"train_loss": -27.502918243408203, "global_step": 576632, "epoch": 6947} {"train_loss": -27.55116081237793, "global_step": 576633, "epoch": 6947} {"train_loss": -27.797204971313477, "global_step": 576634, "epoch": 6947} {"train_loss": -27.730438232421875, "global_step": 576635, "epoch": 6947} {"train_loss": -27.739856719970703, "global_step": 576636, "epoch": 6947} {"train_loss": -27.819507598876953, "global_step": 576637, "epoch": 6947} {"train_loss": -27.882186889648438, "global_step": 576638, "epoch": 6947} {"train_loss": -28.0217227935791, "global_step": 576639, "epoch": 6947} {"train_loss": -28.352880477905273, "global_step": 576640, "epoch": 6947} {"train_loss": -27.89226722717285, "global_step": 576641, "epoch": 6947} {"train_loss": -28.030332565307617, "global_step": 576642, "epoch": 6947} {"train_loss": -27.86579704284668, "global_step": 576643, "epoch": 6947} {"train_loss": -28.139978408813477, "global_step": 576644, "epoch": 6947} {"train_loss": -27.639184951782227, "global_step": 576645, "epoch": 6947} {"train_loss": -28.013525009155273, "global_step": 576646, "epoch": 6947} {"train_loss": -27.4478816986084, "global_step": 576647, "epoch": 6947} {"train_loss": -28.14845085144043, "global_step": 576648, "epoch": 6947} {"train_loss": -28.329309463500977, "global_step": 576649, "epoch": 6947} {"train_loss": -27.64520835876465, "global_step": 576650, "epoch": 6947} {"train_loss": -28.169870376586914, "global_step": 576651, "epoch": 6947} {"train_loss": -27.910669326782227, "global_step": 576652, "epoch": 6947} {"train_loss": -27.961658477783203, "global_step": 576653, "epoch": 6947} {"train_loss": -27.752180099487305, "global_step": 576654, "epoch": 6947} {"train_loss": -28.024072647094727, "global_step": 576655, "epoch": 6947} {"train_loss": -27.545475006103516, "global_step": 576656, "epoch": 6947} {"train_loss": -28.006574630737305, "global_step": 576657, "epoch": 6947} {"train_loss": -27.97593116760254, "global_step": 576658, "epoch": 6947} {"train_loss": -28.1198673248291, "global_step": 576659, "epoch": 6947} {"train_loss": -27.7777042388916, "global_step": 576660, "epoch": 6947} {"train_loss": -27.679792404174805, "global_step": 576661, "epoch": 6947} {"train_loss": -27.884265899658203, "global_step": 576662, "epoch": 6947} {"train_loss": -27.92167091369629, "global_step": 576663, "epoch": 6947} {"train_loss": -27.61648941040039, "global_step": 576664, "epoch": 6947} {"train_loss": -27.639739990234375, "global_step": 576665, "epoch": 6947} {"train_loss": -28.061725616455078, "global_step": 576666, "epoch": 6947} {"train_loss": -27.93031120300293, "global_step": 576667, "epoch": 6947} {"train_loss": -28.11561393737793, "global_step": 576668, "epoch": 6947} {"train_loss": -27.950647354125977, "global_step": 576669, "epoch": 6947} {"train_loss": -27.61767578125, "global_step": 576670, "epoch": 6947} {"train_loss": -28.41975212097168, "global_step": 576671, "epoch": 6947} {"train_loss": -27.572677612304688, "global_step": 576672, "epoch": 6947} {"train_loss": -27.951435089111328, "global_step": 576673, "epoch": 6947} {"train_loss": -27.844202041625977, "global_step": 576674, "epoch": 6947} {"train_loss": -27.80877113342285, "global_step": 576675, "epoch": 6947} {"train_loss": -27.927871704101562, "global_step": 576676, "epoch": 6947} {"train_loss": -27.940372467041016, "global_step": 576677, "epoch": 6947} {"train_loss": -28.039907455444336, "global_step": 576678, "epoch": 6947} {"train_loss": -27.86859130859375, "global_step": 576679, "epoch": 6947} {"train_loss": -27.6864013671875, "global_step": 576680, "epoch": 6947} {"train_loss": -27.961090087890625, "global_step": 576681, "epoch": 6947} {"train_loss": -27.90940284729004, "global_step": 576682, "epoch": 6947} {"train_loss": -27.75343550256936, "global_step": 576683, "epoch": 6947, "val_loss": 6649663.0} {"train_loss": -27.131916046142578, "global_step": 576684, "epoch": 6948} {"train_loss": -26.91178321838379, "global_step": 576685, "epoch": 6948} {"train_loss": -26.170923233032227, "global_step": 576686, "epoch": 6948} {"train_loss": -26.373044967651367, "global_step": 576687, "epoch": 6948} {"train_loss": -26.973682403564453, "global_step": 576688, "epoch": 6948} {"train_loss": -27.5836124420166, "global_step": 576689, "epoch": 6948} {"train_loss": -26.904706954956055, "global_step": 576690, "epoch": 6948} {"train_loss": -27.112096786499023, "global_step": 576691, "epoch": 6948} {"train_loss": -27.065006256103516, "global_step": 576692, "epoch": 6948} {"train_loss": -27.15966796875, "global_step": 576693, "epoch": 6948} {"train_loss": -26.791309356689453, "global_step": 576694, "epoch": 6948} {"train_loss": -27.258337020874023, "global_step": 576695, "epoch": 6948} {"train_loss": -27.043466567993164, "global_step": 576696, "epoch": 6948} {"train_loss": -27.473876953125, "global_step": 576697, "epoch": 6948} {"train_loss": -27.102319717407227, "global_step": 576698, "epoch": 6948} {"train_loss": -27.038373947143555, "global_step": 576699, "epoch": 6948} {"train_loss": -27.374608993530273, "global_step": 576700, "epoch": 6948} {"train_loss": -27.015277862548828, "global_step": 576701, "epoch": 6948} {"train_loss": -27.41981315612793, "global_step": 576702, "epoch": 6948} {"train_loss": -27.369211196899414, "global_step": 576703, "epoch": 6948} {"train_loss": -27.525318145751953, "global_step": 576704, "epoch": 6948} {"train_loss": -27.51325035095215, "global_step": 576705, "epoch": 6948} {"train_loss": -27.603429794311523, "global_step": 576706, "epoch": 6948} {"train_loss": -27.453643798828125, "global_step": 576707, "epoch": 6948} {"train_loss": -27.7806396484375, "global_step": 576708, "epoch": 6948} {"train_loss": -27.789670944213867, "global_step": 576709, "epoch": 6948} {"train_loss": -27.420654296875, "global_step": 576710, "epoch": 6948} {"train_loss": -27.918561935424805, "global_step": 576711, "epoch": 6948} {"train_loss": -27.642038345336914, "global_step": 576712, "epoch": 6948} {"train_loss": -27.782758712768555, "global_step": 576713, "epoch": 6948} {"train_loss": -27.915021896362305, "global_step": 576714, "epoch": 6948} {"train_loss": -27.432453155517578, "global_step": 576715, "epoch": 6948} {"train_loss": -27.53578758239746, "global_step": 576716, "epoch": 6948} {"train_loss": -27.85944175720215, "global_step": 576717, "epoch": 6948} {"train_loss": -27.767026901245117, "global_step": 576718, "epoch": 6948} {"train_loss": -27.96438980102539, "global_step": 576719, "epoch": 6948} {"train_loss": -27.633106231689453, "global_step": 576720, "epoch": 6948} {"train_loss": -27.739398956298828, "global_step": 576721, "epoch": 6948} {"train_loss": -27.72292137145996, "global_step": 576722, "epoch": 6948} {"train_loss": -28.053720474243164, "global_step": 576723, "epoch": 6948} {"train_loss": -27.801965713500977, "global_step": 576724, "epoch": 6948} {"train_loss": -28.032241821289062, "global_step": 576725, "epoch": 6948} {"train_loss": -27.93438720703125, "global_step": 576726, "epoch": 6948} {"train_loss": -27.64862060546875, "global_step": 576727, "epoch": 6948} {"train_loss": -28.093896865844727, "global_step": 576728, "epoch": 6948} {"train_loss": -27.66031837463379, "global_step": 576729, "epoch": 6948} {"train_loss": -28.166189193725586, "global_step": 576730, "epoch": 6948} {"train_loss": -27.795806884765625, "global_step": 576731, "epoch": 6948} {"train_loss": -28.3024959564209, "global_step": 576732, "epoch": 6948} {"train_loss": -28.008405685424805, "global_step": 576733, "epoch": 6948} {"train_loss": -28.44496726989746, "global_step": 576734, "epoch": 6948} {"train_loss": -28.08674430847168, "global_step": 576735, "epoch": 6948} {"train_loss": -28.071186065673828, "global_step": 576736, "epoch": 6948} {"train_loss": -27.805877685546875, "global_step": 576737, "epoch": 6948} {"train_loss": -27.760114669799805, "global_step": 576738, "epoch": 6948} {"train_loss": -28.442514419555664, "global_step": 576739, "epoch": 6948} {"train_loss": -28.304096221923828, "global_step": 576740, "epoch": 6948} {"train_loss": -28.17110252380371, "global_step": 576741, "epoch": 6948} {"train_loss": -27.924367904663086, "global_step": 576742, "epoch": 6948} {"train_loss": -27.655176162719727, "global_step": 576743, "epoch": 6948} {"train_loss": -27.975622177124023, "global_step": 576744, "epoch": 6948} {"train_loss": -27.555683135986328, "global_step": 576745, "epoch": 6948} {"train_loss": -26.508581161499023, "global_step": 576746, "epoch": 6948} {"train_loss": -25.06302261352539, "global_step": 576747, "epoch": 6948} {"train_loss": -25.900928497314453, "global_step": 576748, "epoch": 6948} {"train_loss": -27.712799072265625, "global_step": 576749, "epoch": 6948} {"train_loss": -26.35968017578125, "global_step": 576750, "epoch": 6948} {"train_loss": -27.5489501953125, "global_step": 576751, "epoch": 6948} {"train_loss": -26.883289337158203, "global_step": 576752, "epoch": 6948} {"train_loss": -27.723529815673828, "global_step": 576753, "epoch": 6948} {"train_loss": -27.019758224487305, "global_step": 576754, "epoch": 6948} {"train_loss": -26.846466064453125, "global_step": 576755, "epoch": 6948} {"train_loss": -27.40032958984375, "global_step": 576756, "epoch": 6948} {"train_loss": -27.175251007080078, "global_step": 576757, "epoch": 6948} {"train_loss": -27.688276290893555, "global_step": 576758, "epoch": 6948} {"train_loss": -27.40288734436035, "global_step": 576759, "epoch": 6948} {"train_loss": -26.85329246520996, "global_step": 576760, "epoch": 6948} {"train_loss": -27.081201553344727, "global_step": 576761, "epoch": 6948} {"train_loss": -26.888853073120117, "global_step": 576762, "epoch": 6948} {"train_loss": -27.394681930541992, "global_step": 576763, "epoch": 6948} {"train_loss": -27.205982208251953, "global_step": 576764, "epoch": 6948} {"train_loss": -26.9344539642334, "global_step": 576765, "epoch": 6948} {"train_loss": -27.454232250351502, "global_step": 576766, "epoch": 6948, "val_loss": 6562459.0} {"train_loss": -25.54958152770996, "global_step": 576767, "epoch": 6949} {"train_loss": -21.430614471435547, "global_step": 576768, "epoch": 6949} {"train_loss": -26.197668075561523, "global_step": 576769, "epoch": 6949} {"train_loss": -24.455249786376953, "global_step": 576770, "epoch": 6949} {"train_loss": -26.36991310119629, "global_step": 576771, "epoch": 6949} {"train_loss": -24.99092674255371, "global_step": 576772, "epoch": 6949} {"train_loss": -26.972501754760742, "global_step": 576773, "epoch": 6949} {"train_loss": -25.80889320373535, "global_step": 576774, "epoch": 6949} {"train_loss": -25.41559410095215, "global_step": 576775, "epoch": 6949} {"train_loss": -26.85576820373535, "global_step": 576776, "epoch": 6949} {"train_loss": -26.111230850219727, "global_step": 576777, "epoch": 6949} {"train_loss": -26.221805572509766, "global_step": 576778, "epoch": 6949} {"train_loss": -26.776514053344727, "global_step": 576779, "epoch": 6949} {"train_loss": -26.8973331451416, "global_step": 576780, "epoch": 6949} {"train_loss": -27.0017032623291, "global_step": 576781, "epoch": 6949} {"train_loss": -26.38850212097168, "global_step": 576782, "epoch": 6949} {"train_loss": -26.802343368530273, "global_step": 576783, "epoch": 6949} {"train_loss": -26.772520065307617, "global_step": 576784, "epoch": 6949} {"train_loss": -26.664203643798828, "global_step": 576785, "epoch": 6949} {"train_loss": -27.24713134765625, "global_step": 576786, "epoch": 6949} {"train_loss": -26.730594635009766, "global_step": 576787, "epoch": 6949} {"train_loss": -26.89496421813965, "global_step": 576788, "epoch": 6949} {"train_loss": -26.8125, "global_step": 576789, "epoch": 6949} {"train_loss": -26.506494522094727, "global_step": 576790, "epoch": 6949} {"train_loss": -26.896589279174805, "global_step": 576791, "epoch": 6949} {"train_loss": -27.25404167175293, "global_step": 576792, "epoch": 6949} {"train_loss": -26.8624324798584, "global_step": 576793, "epoch": 6949} {"train_loss": -26.9434871673584, "global_step": 576794, "epoch": 6949} {"train_loss": -27.172149658203125, "global_step": 576795, "epoch": 6949} {"train_loss": -27.393606185913086, "global_step": 576796, "epoch": 6949} {"train_loss": -26.987186431884766, "global_step": 576797, "epoch": 6949} {"train_loss": -27.5330753326416, "global_step": 576798, "epoch": 6949} {"train_loss": -27.39202880859375, "global_step": 576799, "epoch": 6949} {"train_loss": -27.62680435180664, "global_step": 576800, "epoch": 6949} {"train_loss": -27.374073028564453, "global_step": 576801, "epoch": 6949} {"train_loss": -26.871320724487305, "global_step": 576802, "epoch": 6949} {"train_loss": -27.619552612304688, "global_step": 576803, "epoch": 6949} {"train_loss": -27.430408477783203, "global_step": 576804, "epoch": 6949} {"train_loss": -27.7602481842041, "global_step": 576805, "epoch": 6949} {"train_loss": -27.9129695892334, "global_step": 576806, "epoch": 6949} {"train_loss": -27.75034523010254, "global_step": 576807, "epoch": 6949} {"train_loss": -27.4842586517334, "global_step": 576808, "epoch": 6949} {"train_loss": -27.724933624267578, "global_step": 576809, "epoch": 6949} {"train_loss": -27.662582397460938, "global_step": 576810, "epoch": 6949} {"train_loss": -27.592365264892578, "global_step": 576811, "epoch": 6949} {"train_loss": -27.691694259643555, "global_step": 576812, "epoch": 6949} {"train_loss": -28.03399085998535, "global_step": 576813, "epoch": 6949} {"train_loss": -27.558807373046875, "global_step": 576814, "epoch": 6949} {"train_loss": -27.361846923828125, "global_step": 576815, "epoch": 6949} {"train_loss": -27.840301513671875, "global_step": 576816, "epoch": 6949} {"train_loss": -27.94486427307129, "global_step": 576817, "epoch": 6949} {"train_loss": -27.680282592773438, "global_step": 576818, "epoch": 6949} {"train_loss": -27.5191593170166, "global_step": 576819, "epoch": 6949} {"train_loss": -28.283203125, "global_step": 576820, "epoch": 6949} {"train_loss": -27.41670799255371, "global_step": 576821, "epoch": 6949} {"train_loss": -27.8387508392334, "global_step": 576822, "epoch": 6949} {"train_loss": -27.580463409423828, "global_step": 576823, "epoch": 6949} {"train_loss": -28.04290771484375, "global_step": 576824, "epoch": 6949} {"train_loss": -28.091495513916016, "global_step": 576825, "epoch": 6949} {"train_loss": -27.789051055908203, "global_step": 576826, "epoch": 6949} {"train_loss": -27.879180908203125, "global_step": 576827, "epoch": 6949} {"train_loss": -27.80048942565918, "global_step": 576828, "epoch": 6949} {"train_loss": -27.431018829345703, "global_step": 576829, "epoch": 6949} {"train_loss": -27.27103042602539, "global_step": 576830, "epoch": 6949} {"train_loss": -26.992650985717773, "global_step": 576831, "epoch": 6949} {"train_loss": -27.785354614257812, "global_step": 576832, "epoch": 6949} {"train_loss": -27.897327423095703, "global_step": 576833, "epoch": 6949} {"train_loss": -27.794233322143555, "global_step": 576834, "epoch": 6949} {"train_loss": -27.391891479492188, "global_step": 576835, "epoch": 6949} {"train_loss": -27.796295166015625, "global_step": 576836, "epoch": 6949} {"train_loss": -27.99869155883789, "global_step": 576837, "epoch": 6949} {"train_loss": -27.987821578979492, "global_step": 576838, "epoch": 6949} {"train_loss": -27.890283584594727, "global_step": 576839, "epoch": 6949} {"train_loss": -27.977935791015625, "global_step": 576840, "epoch": 6949} {"train_loss": -27.942468643188477, "global_step": 576841, "epoch": 6949} {"train_loss": -27.965564727783203, "global_step": 576842, "epoch": 6949} {"train_loss": -27.4676513671875, "global_step": 576843, "epoch": 6949} {"train_loss": -27.897876739501953, "global_step": 576844, "epoch": 6949} {"train_loss": -27.652530670166016, "global_step": 576845, "epoch": 6949} {"train_loss": -27.34956169128418, "global_step": 576846, "epoch": 6949} {"train_loss": -28.079431533813477, "global_step": 576847, "epoch": 6949} {"train_loss": -28.06488609313965, "global_step": 576848, "epoch": 6949} {"train_loss": -27.217394380684357, "global_step": 576849, "epoch": 6949, "val_loss": 6614849.0} {"train_loss": -27.673559188842773, "global_step": 576850, "epoch": 6950} {"train_loss": -27.397205352783203, "global_step": 576851, "epoch": 6950} {"train_loss": -26.84624671936035, "global_step": 576852, "epoch": 6950} {"train_loss": -27.355560302734375, "global_step": 576853, "epoch": 6950} {"train_loss": -27.45173454284668, "global_step": 576854, "epoch": 6950} {"train_loss": -27.63679313659668, "global_step": 576855, "epoch": 6950} {"train_loss": -27.586151123046875, "global_step": 576856, "epoch": 6950} {"train_loss": -27.818042755126953, "global_step": 576857, "epoch": 6950} {"train_loss": -27.7271671295166, "global_step": 576858, "epoch": 6950} {"train_loss": -27.751264572143555, "global_step": 576859, "epoch": 6950} {"train_loss": -27.16796875, "global_step": 576860, "epoch": 6950} {"train_loss": -27.505401611328125, "global_step": 576861, "epoch": 6950} {"train_loss": -27.99103355407715, "global_step": 576862, "epoch": 6950} {"train_loss": -27.4843692779541, "global_step": 576863, "epoch": 6950} {"train_loss": -27.649127960205078, "global_step": 576864, "epoch": 6950} {"train_loss": -27.263717651367188, "global_step": 576865, "epoch": 6950} {"train_loss": -27.937244415283203, "global_step": 576866, "epoch": 6950} {"train_loss": -28.331287384033203, "global_step": 576867, "epoch": 6950} {"train_loss": -27.82142448425293, "global_step": 576868, "epoch": 6950} {"train_loss": -27.86517906188965, "global_step": 576869, "epoch": 6950} {"train_loss": -28.0611572265625, "global_step": 576870, "epoch": 6950} {"train_loss": -27.895099639892578, "global_step": 576871, "epoch": 6950} {"train_loss": -27.87447166442871, "global_step": 576872, "epoch": 6950} {"train_loss": -28.447423934936523, "global_step": 576873, "epoch": 6950} {"train_loss": -27.85346031188965, "global_step": 576874, "epoch": 6950} {"train_loss": -27.947269439697266, "global_step": 576875, "epoch": 6950} {"train_loss": -27.8392276763916, "global_step": 576876, "epoch": 6950} {"train_loss": -27.946949005126953, "global_step": 576877, "epoch": 6950} {"train_loss": -27.66824722290039, "global_step": 576878, "epoch": 6950} {"train_loss": -28.429550170898438, "global_step": 576879, "epoch": 6950} {"train_loss": -28.044178009033203, "global_step": 576880, "epoch": 6950} {"train_loss": -28.143157958984375, "global_step": 576881, "epoch": 6950} {"train_loss": -27.907873153686523, "global_step": 576882, "epoch": 6950} {"train_loss": -28.412403106689453, "global_step": 576883, "epoch": 6950} {"train_loss": -28.132781982421875, "global_step": 576884, "epoch": 6950} {"train_loss": -28.11020278930664, "global_step": 576885, "epoch": 6950} {"train_loss": -27.6935977935791, "global_step": 576886, "epoch": 6950} {"train_loss": -28.203588485717773, "global_step": 576887, "epoch": 6950} {"train_loss": -28.044050216674805, "global_step": 576888, "epoch": 6950} {"train_loss": -28.357242584228516, "global_step": 576889, "epoch": 6950} {"train_loss": -27.99574089050293, "global_step": 576890, "epoch": 6950} {"train_loss": -27.67923355102539, "global_step": 576891, "epoch": 6950} {"train_loss": -27.501317977905273, "global_step": 576892, "epoch": 6950} {"train_loss": -27.509504318237305, "global_step": 576893, "epoch": 6950} {"train_loss": -27.181659698486328, "global_step": 576894, "epoch": 6950} {"train_loss": -27.86638832092285, "global_step": 576895, "epoch": 6950} {"train_loss": -27.898069381713867, "global_step": 576896, "epoch": 6950} {"train_loss": -28.19354820251465, "global_step": 576897, "epoch": 6950} {"train_loss": -27.61334800720215, "global_step": 576898, "epoch": 6950} {"train_loss": -27.906827926635742, "global_step": 576899, "epoch": 6950} {"train_loss": -28.039655685424805, "global_step": 576900, "epoch": 6950} {"train_loss": -28.00152587890625, "global_step": 576901, "epoch": 6950} {"train_loss": -27.774921417236328, "global_step": 576902, "epoch": 6950} {"train_loss": -28.00910758972168, "global_step": 576903, "epoch": 6950} {"train_loss": -28.01560401916504, "global_step": 576904, "epoch": 6950} {"train_loss": -27.966039657592773, "global_step": 576905, "epoch": 6950} {"train_loss": -27.91876792907715, "global_step": 576906, "epoch": 6950} {"train_loss": -27.893218994140625, "global_step": 576907, "epoch": 6950} {"train_loss": -27.963363647460938, "global_step": 576908, "epoch": 6950} {"train_loss": -27.642847061157227, "global_step": 576909, "epoch": 6950} {"train_loss": -28.109027862548828, "global_step": 576910, "epoch": 6950} {"train_loss": -27.795475006103516, "global_step": 576911, "epoch": 6950} {"train_loss": -28.182233810424805, "global_step": 576912, "epoch": 6950} {"train_loss": -27.719745635986328, "global_step": 576913, "epoch": 6950} {"train_loss": -27.967304229736328, "global_step": 576914, "epoch": 6950} {"train_loss": -28.024417877197266, "global_step": 576915, "epoch": 6950} {"train_loss": -28.17842674255371, "global_step": 576916, "epoch": 6950} {"train_loss": -28.189044952392578, "global_step": 576917, "epoch": 6950} {"train_loss": -28.042205810546875, "global_step": 576918, "epoch": 6950} {"train_loss": -27.64069175720215, "global_step": 576919, "epoch": 6950} {"train_loss": -27.991840362548828, "global_step": 576920, "epoch": 6950} {"train_loss": -28.284900665283203, "global_step": 576921, "epoch": 6950} {"train_loss": -28.248016357421875, "global_step": 576922, "epoch": 6950} {"train_loss": -28.14630126953125, "global_step": 576923, "epoch": 6950} {"train_loss": -28.353179931640625, "global_step": 576924, "epoch": 6950} {"train_loss": -28.30924415588379, "global_step": 576925, "epoch": 6950} {"train_loss": -28.28443717956543, "global_step": 576926, "epoch": 6950} {"train_loss": -28.32440185546875, "global_step": 576927, "epoch": 6950} {"train_loss": -28.203277587890625, "global_step": 576928, "epoch": 6950} {"train_loss": -28.129194259643555, "global_step": 576929, "epoch": 6950} {"train_loss": -28.213287353515625, "global_step": 576930, "epoch": 6950} {"train_loss": -28.063257217407227, "global_step": 576931, "epoch": 6950} {"train_loss": -27.90187081945948, "global_step": 576932, "epoch": 6950, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6607090.0} {"train_loss": -27.98773193359375, "global_step": 576933, "epoch": 6951} {"train_loss": -27.195697784423828, "global_step": 576934, "epoch": 6951} {"train_loss": -27.546875, "global_step": 576935, "epoch": 6951} {"train_loss": -27.474578857421875, "global_step": 576936, "epoch": 6951} {"train_loss": -27.91448974609375, "global_step": 576937, "epoch": 6951} {"train_loss": -27.40180778503418, "global_step": 576938, "epoch": 6951} {"train_loss": -27.510766983032227, "global_step": 576939, "epoch": 6951} {"train_loss": -27.636640548706055, "global_step": 576940, "epoch": 6951} {"train_loss": -27.90717887878418, "global_step": 576941, "epoch": 6951} {"train_loss": -27.6583309173584, "global_step": 576942, "epoch": 6951} {"train_loss": -27.2418270111084, "global_step": 576943, "epoch": 6951} {"train_loss": -27.58994483947754, "global_step": 576944, "epoch": 6951} {"train_loss": -27.571060180664062, "global_step": 576945, "epoch": 6951} {"train_loss": -27.700815200805664, "global_step": 576946, "epoch": 6951} {"train_loss": -27.767866134643555, "global_step": 576947, "epoch": 6951} {"train_loss": -27.602384567260742, "global_step": 576948, "epoch": 6951} {"train_loss": -27.89023208618164, "global_step": 576949, "epoch": 6951} {"train_loss": -27.99757194519043, "global_step": 576950, "epoch": 6951} {"train_loss": -27.210575103759766, "global_step": 576951, "epoch": 6951} {"train_loss": -27.967084884643555, "global_step": 576952, "epoch": 6951} {"train_loss": -27.322660446166992, "global_step": 576953, "epoch": 6951} {"train_loss": -27.354551315307617, "global_step": 576954, "epoch": 6951} {"train_loss": -27.885990142822266, "global_step": 576955, "epoch": 6951} {"train_loss": -27.5307674407959, "global_step": 576956, "epoch": 6951} {"train_loss": -27.645429611206055, "global_step": 576957, "epoch": 6951} {"train_loss": -27.279998779296875, "global_step": 576958, "epoch": 6951} {"train_loss": -27.925199508666992, "global_step": 576959, "epoch": 6951} {"train_loss": -27.556562423706055, "global_step": 576960, "epoch": 6951} {"train_loss": -27.42926025390625, "global_step": 576961, "epoch": 6951} {"train_loss": -28.010700225830078, "global_step": 576962, "epoch": 6951} {"train_loss": -27.628332138061523, "global_step": 576963, "epoch": 6951} {"train_loss": -28.197925567626953, "global_step": 576964, "epoch": 6951} {"train_loss": -27.644546508789062, "global_step": 576965, "epoch": 6951} {"train_loss": -27.970417022705078, "global_step": 576966, "epoch": 6951} {"train_loss": -27.870145797729492, "global_step": 576967, "epoch": 6951} {"train_loss": -27.855792999267578, "global_step": 576968, "epoch": 6951} {"train_loss": -27.824567794799805, "global_step": 576969, "epoch": 6951} {"train_loss": -27.77569580078125, "global_step": 576970, "epoch": 6951} {"train_loss": -28.085081100463867, "global_step": 576971, "epoch": 6951} {"train_loss": -27.960647583007812, "global_step": 576972, "epoch": 6951} {"train_loss": -28.039350509643555, "global_step": 576973, "epoch": 6951} {"train_loss": -27.785364151000977, "global_step": 576974, "epoch": 6951} {"train_loss": -28.07516860961914, "global_step": 576975, "epoch": 6951} {"train_loss": -27.917810440063477, "global_step": 576976, "epoch": 6951} {"train_loss": -27.626379013061523, "global_step": 576977, "epoch": 6951} {"train_loss": -27.541166305541992, "global_step": 576978, "epoch": 6951} {"train_loss": -27.972875595092773, "global_step": 576979, "epoch": 6951} {"train_loss": -27.96965980529785, "global_step": 576980, "epoch": 6951} {"train_loss": -27.963836669921875, "global_step": 576981, "epoch": 6951} {"train_loss": -28.156492233276367, "global_step": 576982, "epoch": 6951} {"train_loss": -27.96923828125, "global_step": 576983, "epoch": 6951} {"train_loss": -27.80315589904785, "global_step": 576984, "epoch": 6951} {"train_loss": -28.057172775268555, "global_step": 576985, "epoch": 6951} {"train_loss": -28.0929012298584, "global_step": 576986, "epoch": 6951} {"train_loss": -28.0447998046875, "global_step": 576987, "epoch": 6951} {"train_loss": -28.130460739135742, "global_step": 576988, "epoch": 6951} {"train_loss": -27.93408203125, "global_step": 576989, "epoch": 6951} {"train_loss": -27.639514923095703, "global_step": 576990, "epoch": 6951} {"train_loss": -27.846654891967773, "global_step": 576991, "epoch": 6951} {"train_loss": -27.505908966064453, "global_step": 576992, "epoch": 6951} {"train_loss": -27.806318283081055, "global_step": 576993, "epoch": 6951} {"train_loss": -27.443273544311523, "global_step": 576994, "epoch": 6951} {"train_loss": -27.858367919921875, "global_step": 576995, "epoch": 6951} {"train_loss": -27.985456466674805, "global_step": 576996, "epoch": 6951} {"train_loss": -28.21234703063965, "global_step": 576997, "epoch": 6951} {"train_loss": -27.98126220703125, "global_step": 576998, "epoch": 6951} {"train_loss": -28.23792839050293, "global_step": 576999, "epoch": 6951} {"train_loss": -28.056127548217773, "global_step": 577000, "epoch": 6951} {"train_loss": -27.788955688476562, "global_step": 577001, "epoch": 6951} {"train_loss": -28.25652503967285, "global_step": 577002, "epoch": 6951} {"train_loss": -28.06080436706543, "global_step": 577003, "epoch": 6951} {"train_loss": -28.12677574157715, "global_step": 577004, "epoch": 6951} {"train_loss": -27.643598556518555, "global_step": 577005, "epoch": 6951} {"train_loss": -27.671560287475586, "global_step": 577006, "epoch": 6951} {"train_loss": -27.838720321655273, "global_step": 577007, "epoch": 6951} {"train_loss": -27.702985763549805, "global_step": 577008, "epoch": 6951} {"train_loss": -27.965728759765625, "global_step": 577009, "epoch": 6951} {"train_loss": -27.49216079711914, "global_step": 577010, "epoch": 6951} {"train_loss": -27.745336532592773, "global_step": 577011, "epoch": 6951} {"train_loss": -27.7911319732666, "global_step": 577012, "epoch": 6951} {"train_loss": -27.59699821472168, "global_step": 577013, "epoch": 6951} {"train_loss": -28.011838912963867, "global_step": 577014, "epoch": 6951} {"train_loss": -27.800790901643683, "global_step": 577015, "epoch": 6951, "val_loss": 6562705.5} {"train_loss": -22.329225540161133, "global_step": 577016, "epoch": 6952} {"train_loss": -25.29533576965332, "global_step": 577017, "epoch": 6952} {"train_loss": -23.45086669921875, "global_step": 577018, "epoch": 6952} {"train_loss": -26.06308364868164, "global_step": 577019, "epoch": 6952} {"train_loss": -25.301198959350586, "global_step": 577020, "epoch": 6952} {"train_loss": -25.608966827392578, "global_step": 577021, "epoch": 6952} {"train_loss": -26.182514190673828, "global_step": 577022, "epoch": 6952} {"train_loss": -25.741628646850586, "global_step": 577023, "epoch": 6952} {"train_loss": -26.05902671813965, "global_step": 577024, "epoch": 6952} {"train_loss": -25.935998916625977, "global_step": 577025, "epoch": 6952} {"train_loss": -26.43973159790039, "global_step": 577026, "epoch": 6952} {"train_loss": -26.142688751220703, "global_step": 577027, "epoch": 6952} {"train_loss": -26.317350387573242, "global_step": 577028, "epoch": 6952} {"train_loss": -26.027204513549805, "global_step": 577029, "epoch": 6952} {"train_loss": -26.7282657623291, "global_step": 577030, "epoch": 6952} {"train_loss": -26.290912628173828, "global_step": 577031, "epoch": 6952} {"train_loss": -26.443222045898438, "global_step": 577032, "epoch": 6952} {"train_loss": -26.492475509643555, "global_step": 577033, "epoch": 6952} {"train_loss": -26.852161407470703, "global_step": 577034, "epoch": 6952} {"train_loss": -26.452930450439453, "global_step": 577035, "epoch": 6952} {"train_loss": -26.703271865844727, "global_step": 577036, "epoch": 6952} {"train_loss": -26.84913444519043, "global_step": 577037, "epoch": 6952} {"train_loss": -26.651121139526367, "global_step": 577038, "epoch": 6952} {"train_loss": -26.74603271484375, "global_step": 577039, "epoch": 6952} {"train_loss": -26.88422966003418, "global_step": 577040, "epoch": 6952} {"train_loss": -27.006622314453125, "global_step": 577041, "epoch": 6952} {"train_loss": -26.971893310546875, "global_step": 577042, "epoch": 6952} {"train_loss": -27.197858810424805, "global_step": 577043, "epoch": 6952} {"train_loss": -27.011310577392578, "global_step": 577044, "epoch": 6952} {"train_loss": -27.036182403564453, "global_step": 577045, "epoch": 6952} {"train_loss": -27.235492706298828, "global_step": 577046, "epoch": 6952} {"train_loss": -26.917724609375, "global_step": 577047, "epoch": 6952} {"train_loss": -27.32317543029785, "global_step": 577048, "epoch": 6952} {"train_loss": -27.243412017822266, "global_step": 577049, "epoch": 6952} {"train_loss": -27.358020782470703, "global_step": 577050, "epoch": 6952} {"train_loss": -27.258665084838867, "global_step": 577051, "epoch": 6952} {"train_loss": -27.213560104370117, "global_step": 577052, "epoch": 6952} {"train_loss": -27.823715209960938, "global_step": 577053, "epoch": 6952} {"train_loss": -27.586719512939453, "global_step": 577054, "epoch": 6952} {"train_loss": -27.820749282836914, "global_step": 577055, "epoch": 6952} {"train_loss": -27.447675704956055, "global_step": 577056, "epoch": 6952} {"train_loss": -27.843647003173828, "global_step": 577057, "epoch": 6952} {"train_loss": -27.593189239501953, "global_step": 577058, "epoch": 6952} {"train_loss": -27.379819869995117, "global_step": 577059, "epoch": 6952} {"train_loss": -28.117162704467773, "global_step": 577060, "epoch": 6952} {"train_loss": -27.900821685791016, "global_step": 577061, "epoch": 6952} {"train_loss": -27.9588623046875, "global_step": 577062, "epoch": 6952} {"train_loss": -27.779356002807617, "global_step": 577063, "epoch": 6952} {"train_loss": -27.604475021362305, "global_step": 577064, "epoch": 6952} {"train_loss": -28.053369522094727, "global_step": 577065, "epoch": 6952} {"train_loss": -27.588369369506836, "global_step": 577066, "epoch": 6952} {"train_loss": -27.938053131103516, "global_step": 577067, "epoch": 6952} {"train_loss": -27.670303344726562, "global_step": 577068, "epoch": 6952} {"train_loss": -27.98224449157715, "global_step": 577069, "epoch": 6952} {"train_loss": -27.958606719970703, "global_step": 577070, "epoch": 6952} {"train_loss": -28.091022491455078, "global_step": 577071, "epoch": 6952} {"train_loss": -27.54047203063965, "global_step": 577072, "epoch": 6952} {"train_loss": -27.787490844726562, "global_step": 577073, "epoch": 6952} {"train_loss": -28.005878448486328, "global_step": 577074, "epoch": 6952} {"train_loss": -28.03496742248535, "global_step": 577075, "epoch": 6952} {"train_loss": -28.0758113861084, "global_step": 577076, "epoch": 6952} {"train_loss": -27.963714599609375, "global_step": 577077, "epoch": 6952} {"train_loss": -28.338214874267578, "global_step": 577078, "epoch": 6952} {"train_loss": -27.659748077392578, "global_step": 577079, "epoch": 6952} {"train_loss": -28.168659210205078, "global_step": 577080, "epoch": 6952} {"train_loss": -27.966083526611328, "global_step": 577081, "epoch": 6952} {"train_loss": -27.919849395751953, "global_step": 577082, "epoch": 6952} {"train_loss": -28.03849220275879, "global_step": 577083, "epoch": 6952} {"train_loss": -28.4259033203125, "global_step": 577084, "epoch": 6952} {"train_loss": -27.866865158081055, "global_step": 577085, "epoch": 6952} {"train_loss": -27.728757858276367, "global_step": 577086, "epoch": 6952} {"train_loss": -28.09028434753418, "global_step": 577087, "epoch": 6952} {"train_loss": -28.248666763305664, "global_step": 577088, "epoch": 6952} {"train_loss": -27.949499130249023, "global_step": 577089, "epoch": 6952} {"train_loss": -27.904739379882812, "global_step": 577090, "epoch": 6952} {"train_loss": -27.170812606811523, "global_step": 577091, "epoch": 6952} {"train_loss": -25.725605010986328, "global_step": 577092, "epoch": 6952} {"train_loss": -24.226388931274414, "global_step": 577093, "epoch": 6952} {"train_loss": -25.8026180267334, "global_step": 577094, "epoch": 6952} {"train_loss": -27.94229507446289, "global_step": 577095, "epoch": 6952} {"train_loss": -26.946760177612305, "global_step": 577096, "epoch": 6952} {"train_loss": -27.6058349609375, "global_step": 577097, "epoch": 6952} {"train_loss": -27.069930777492292, "global_step": 577098, "epoch": 6952, "val_loss": 6611654.0} {"train_loss": -26.744220733642578, "global_step": 577099, "epoch": 6953} {"train_loss": -26.184675216674805, "global_step": 577100, "epoch": 6953} {"train_loss": -27.00501823425293, "global_step": 577101, "epoch": 6953} {"train_loss": -27.36279296875, "global_step": 577102, "epoch": 6953} {"train_loss": -26.428442001342773, "global_step": 577103, "epoch": 6953} {"train_loss": -27.38978385925293, "global_step": 577104, "epoch": 6953} {"train_loss": -27.608976364135742, "global_step": 577105, "epoch": 6953} {"train_loss": -27.104398727416992, "global_step": 577106, "epoch": 6953} {"train_loss": -27.193368911743164, "global_step": 577107, "epoch": 6953} {"train_loss": -27.090728759765625, "global_step": 577108, "epoch": 6953} {"train_loss": -27.42374038696289, "global_step": 577109, "epoch": 6953} {"train_loss": -26.741559982299805, "global_step": 577110, "epoch": 6953} {"train_loss": -27.297138214111328, "global_step": 577111, "epoch": 6953} {"train_loss": -27.100759506225586, "global_step": 577112, "epoch": 6953} {"train_loss": -27.22662925720215, "global_step": 577113, "epoch": 6953} {"train_loss": -26.83282470703125, "global_step": 577114, "epoch": 6953} {"train_loss": -27.50118064880371, "global_step": 577115, "epoch": 6953} {"train_loss": -27.254180908203125, "global_step": 577116, "epoch": 6953} {"train_loss": -27.69439697265625, "global_step": 577117, "epoch": 6953} {"train_loss": -26.800954818725586, "global_step": 577118, "epoch": 6953} {"train_loss": -27.4992618560791, "global_step": 577119, "epoch": 6953} {"train_loss": -27.272418975830078, "global_step": 577120, "epoch": 6953} {"train_loss": -27.44536781311035, "global_step": 577121, "epoch": 6953} {"train_loss": -27.423004150390625, "global_step": 577122, "epoch": 6953} {"train_loss": -27.482040405273438, "global_step": 577123, "epoch": 6953} {"train_loss": -27.392139434814453, "global_step": 577124, "epoch": 6953} {"train_loss": -27.466903686523438, "global_step": 577125, "epoch": 6953} {"train_loss": -27.449071884155273, "global_step": 577126, "epoch": 6953} {"train_loss": -27.399641036987305, "global_step": 577127, "epoch": 6953} {"train_loss": -27.53196144104004, "global_step": 577128, "epoch": 6953} {"train_loss": -27.551977157592773, "global_step": 577129, "epoch": 6953} {"train_loss": -27.150848388671875, "global_step": 577130, "epoch": 6953} {"train_loss": -27.306079864501953, "global_step": 577131, "epoch": 6953} {"train_loss": -27.759418487548828, "global_step": 577132, "epoch": 6953} {"train_loss": -27.71923828125, "global_step": 577133, "epoch": 6953} {"train_loss": -27.906869888305664, "global_step": 577134, "epoch": 6953} {"train_loss": -27.617267608642578, "global_step": 577135, "epoch": 6953} {"train_loss": -27.72587013244629, "global_step": 577136, "epoch": 6953} {"train_loss": -27.757953643798828, "global_step": 577137, "epoch": 6953} {"train_loss": -27.9448299407959, "global_step": 577138, "epoch": 6953} {"train_loss": -27.6142520904541, "global_step": 577139, "epoch": 6953} {"train_loss": -27.713891983032227, "global_step": 577140, "epoch": 6953} {"train_loss": -27.633930206298828, "global_step": 577141, "epoch": 6953} {"train_loss": -28.0684871673584, "global_step": 577142, "epoch": 6953} {"train_loss": -28.043615341186523, "global_step": 577143, "epoch": 6953} {"train_loss": -28.158411026000977, "global_step": 577144, "epoch": 6953} {"train_loss": -27.848770141601562, "global_step": 577145, "epoch": 6953} {"train_loss": -27.837665557861328, "global_step": 577146, "epoch": 6953} {"train_loss": -27.624555587768555, "global_step": 577147, "epoch": 6953} {"train_loss": -27.85352897644043, "global_step": 577148, "epoch": 6953} {"train_loss": -28.040876388549805, "global_step": 577149, "epoch": 6953} {"train_loss": -27.875585556030273, "global_step": 577150, "epoch": 6953} {"train_loss": -28.1959171295166, "global_step": 577151, "epoch": 6953} {"train_loss": -28.02515983581543, "global_step": 577152, "epoch": 6953} {"train_loss": -28.668466567993164, "global_step": 577153, "epoch": 6953} {"train_loss": -28.0666446685791, "global_step": 577154, "epoch": 6953} {"train_loss": -27.90179443359375, "global_step": 577155, "epoch": 6953} {"train_loss": -28.07413101196289, "global_step": 577156, "epoch": 6953} {"train_loss": -28.029027938842773, "global_step": 577157, "epoch": 6953} {"train_loss": -27.795429229736328, "global_step": 577158, "epoch": 6953} {"train_loss": -27.794921875, "global_step": 577159, "epoch": 6953} {"train_loss": -28.10468864440918, "global_step": 577160, "epoch": 6953} {"train_loss": -28.021093368530273, "global_step": 577161, "epoch": 6953} {"train_loss": -27.807462692260742, "global_step": 577162, "epoch": 6953} {"train_loss": -27.690765380859375, "global_step": 577163, "epoch": 6953} {"train_loss": -28.446191787719727, "global_step": 577164, "epoch": 6953} {"train_loss": -28.105411529541016, "global_step": 577165, "epoch": 6953} {"train_loss": -28.276626586914062, "global_step": 577166, "epoch": 6953} {"train_loss": -28.240711212158203, "global_step": 577167, "epoch": 6953} {"train_loss": -28.23982048034668, "global_step": 577168, "epoch": 6953} {"train_loss": -27.932819366455078, "global_step": 577169, "epoch": 6953} {"train_loss": -28.171899795532227, "global_step": 577170, "epoch": 6953} {"train_loss": -28.211780548095703, "global_step": 577171, "epoch": 6953} {"train_loss": -28.18256187438965, "global_step": 577172, "epoch": 6953} {"train_loss": -27.9256534576416, "global_step": 577173, "epoch": 6953} {"train_loss": -28.20369529724121, "global_step": 577174, "epoch": 6953} {"train_loss": -27.914066314697266, "global_step": 577175, "epoch": 6953} {"train_loss": -28.25349235534668, "global_step": 577176, "epoch": 6953} {"train_loss": -27.93869972229004, "global_step": 577177, "epoch": 6953} {"train_loss": -28.165769577026367, "global_step": 577178, "epoch": 6953} {"train_loss": -27.8807315826416, "global_step": 577179, "epoch": 6953} {"train_loss": -28.42889404296875, "global_step": 577180, "epoch": 6953} {"train_loss": -27.691655055586114, "global_step": 577181, "epoch": 6953, "val_loss": 6590565.0} {"train_loss": -27.1729793548584, "global_step": 577182, "epoch": 6954} {"train_loss": -26.483301162719727, "global_step": 577183, "epoch": 6954} {"train_loss": -25.367713928222656, "global_step": 577184, "epoch": 6954} {"train_loss": -25.19184684753418, "global_step": 577185, "epoch": 6954} {"train_loss": -27.217206954956055, "global_step": 577186, "epoch": 6954} {"train_loss": -26.407394409179688, "global_step": 577187, "epoch": 6954} {"train_loss": -26.58042335510254, "global_step": 577188, "epoch": 6954} {"train_loss": -26.26668357849121, "global_step": 577189, "epoch": 6954} {"train_loss": -26.95114517211914, "global_step": 577190, "epoch": 6954} {"train_loss": -26.614044189453125, "global_step": 577191, "epoch": 6954} {"train_loss": -27.243688583374023, "global_step": 577192, "epoch": 6954} {"train_loss": -26.684545516967773, "global_step": 577193, "epoch": 6954} {"train_loss": -27.54233169555664, "global_step": 577194, "epoch": 6954} {"train_loss": -26.62592887878418, "global_step": 577195, "epoch": 6954} {"train_loss": -27.239118576049805, "global_step": 577196, "epoch": 6954} {"train_loss": -27.154651641845703, "global_step": 577197, "epoch": 6954} {"train_loss": -27.22272300720215, "global_step": 577198, "epoch": 6954} {"train_loss": -27.479766845703125, "global_step": 577199, "epoch": 6954} {"train_loss": -27.221094131469727, "global_step": 577200, "epoch": 6954} {"train_loss": -27.76724624633789, "global_step": 577201, "epoch": 6954} {"train_loss": -27.674072265625, "global_step": 577202, "epoch": 6954} {"train_loss": -27.8150577545166, "global_step": 577203, "epoch": 6954} {"train_loss": -27.517902374267578, "global_step": 577204, "epoch": 6954} {"train_loss": -27.565753936767578, "global_step": 577205, "epoch": 6954} {"train_loss": -27.677576065063477, "global_step": 577206, "epoch": 6954} {"train_loss": -27.692113876342773, "global_step": 577207, "epoch": 6954} {"train_loss": -27.48813247680664, "global_step": 577208, "epoch": 6954} {"train_loss": -27.455554962158203, "global_step": 577209, "epoch": 6954} {"train_loss": -27.49629020690918, "global_step": 577210, "epoch": 6954} {"train_loss": -27.757144927978516, "global_step": 577211, "epoch": 6954} {"train_loss": -27.596359252929688, "global_step": 577212, "epoch": 6954} {"train_loss": -27.7222843170166, "global_step": 577213, "epoch": 6954} {"train_loss": -28.022369384765625, "global_step": 577214, "epoch": 6954} {"train_loss": -27.91798973083496, "global_step": 577215, "epoch": 6954} {"train_loss": -27.57537841796875, "global_step": 577216, "epoch": 6954} {"train_loss": -27.684839248657227, "global_step": 577217, "epoch": 6954} {"train_loss": -28.118432998657227, "global_step": 577218, "epoch": 6954} {"train_loss": -27.772998809814453, "global_step": 577219, "epoch": 6954} {"train_loss": -27.943456649780273, "global_step": 577220, "epoch": 6954} {"train_loss": -27.898038864135742, "global_step": 577221, "epoch": 6954} {"train_loss": -27.91788101196289, "global_step": 577222, "epoch": 6954} {"train_loss": -27.996301651000977, "global_step": 577223, "epoch": 6954} {"train_loss": -27.981061935424805, "global_step": 577224, "epoch": 6954} {"train_loss": -27.641437530517578, "global_step": 577225, "epoch": 6954} {"train_loss": -28.245092391967773, "global_step": 577226, "epoch": 6954} {"train_loss": -27.844680786132812, "global_step": 577227, "epoch": 6954} {"train_loss": -27.790063858032227, "global_step": 577228, "epoch": 6954} {"train_loss": -28.109289169311523, "global_step": 577229, "epoch": 6954} {"train_loss": -28.090106964111328, "global_step": 577230, "epoch": 6954} {"train_loss": -27.841827392578125, "global_step": 577231, "epoch": 6954} {"train_loss": -28.31599998474121, "global_step": 577232, "epoch": 6954} {"train_loss": -27.956897735595703, "global_step": 577233, "epoch": 6954} {"train_loss": -27.959875106811523, "global_step": 577234, "epoch": 6954} {"train_loss": -28.119281768798828, "global_step": 577235, "epoch": 6954} {"train_loss": -28.03022575378418, "global_step": 577236, "epoch": 6954} {"train_loss": -28.06098747253418, "global_step": 577237, "epoch": 6954} {"train_loss": -27.984130859375, "global_step": 577238, "epoch": 6954} {"train_loss": -27.86536979675293, "global_step": 577239, "epoch": 6954} {"train_loss": -28.14723777770996, "global_step": 577240, "epoch": 6954} {"train_loss": -27.9854679107666, "global_step": 577241, "epoch": 6954} {"train_loss": -27.879959106445312, "global_step": 577242, "epoch": 6954} {"train_loss": -28.02896499633789, "global_step": 577243, "epoch": 6954} {"train_loss": -28.54097557067871, "global_step": 577244, "epoch": 6954} {"train_loss": -28.188297271728516, "global_step": 577245, "epoch": 6954} {"train_loss": -28.16115379333496, "global_step": 577246, "epoch": 6954} {"train_loss": -28.15777015686035, "global_step": 577247, "epoch": 6954} {"train_loss": -27.937780380249023, "global_step": 577248, "epoch": 6954} {"train_loss": -27.990589141845703, "global_step": 577249, "epoch": 6954} {"train_loss": -28.033355712890625, "global_step": 577250, "epoch": 6954} {"train_loss": -28.049274444580078, "global_step": 577251, "epoch": 6954} {"train_loss": -28.021982192993164, "global_step": 577252, "epoch": 6954} {"train_loss": -27.820556640625, "global_step": 577253, "epoch": 6954} {"train_loss": -28.20673179626465, "global_step": 577254, "epoch": 6954} {"train_loss": -28.0936222076416, "global_step": 577255, "epoch": 6954} {"train_loss": -27.894384384155273, "global_step": 577256, "epoch": 6954} {"train_loss": -28.207204818725586, "global_step": 577257, "epoch": 6954} {"train_loss": -28.457366943359375, "global_step": 577258, "epoch": 6954} {"train_loss": -28.10723304748535, "global_step": 577259, "epoch": 6954} {"train_loss": -27.93513298034668, "global_step": 577260, "epoch": 6954} {"train_loss": -27.82166862487793, "global_step": 577261, "epoch": 6954} {"train_loss": -27.737567901611328, "global_step": 577262, "epoch": 6954} {"train_loss": -27.79754638671875, "global_step": 577263, "epoch": 6954} {"train_loss": -27.66053765078625, "global_step": 577264, "epoch": 6954, "val_loss": 6609597.0} {"train_loss": -26.50356101989746, "global_step": 577265, "epoch": 6955} {"train_loss": -27.035232543945312, "global_step": 577266, "epoch": 6955} {"train_loss": -27.241397857666016, "global_step": 577267, "epoch": 6955} {"train_loss": -27.0260066986084, "global_step": 577268, "epoch": 6955} {"train_loss": -27.6704044342041, "global_step": 577269, "epoch": 6955} {"train_loss": -26.903242111206055, "global_step": 577270, "epoch": 6955} {"train_loss": -27.63178825378418, "global_step": 577271, "epoch": 6955} {"train_loss": -27.25215721130371, "global_step": 577272, "epoch": 6955} {"train_loss": -27.097492218017578, "global_step": 577273, "epoch": 6955} {"train_loss": -27.007770538330078, "global_step": 577274, "epoch": 6955} {"train_loss": -27.591352462768555, "global_step": 577275, "epoch": 6955} {"train_loss": -27.53020668029785, "global_step": 577276, "epoch": 6955} {"train_loss": -27.535009384155273, "global_step": 577277, "epoch": 6955} {"train_loss": -27.54658317565918, "global_step": 577278, "epoch": 6955} {"train_loss": -27.609891891479492, "global_step": 577279, "epoch": 6955} {"train_loss": -27.51418113708496, "global_step": 577280, "epoch": 6955} {"train_loss": -27.336156845092773, "global_step": 577281, "epoch": 6955} {"train_loss": -27.59393882751465, "global_step": 577282, "epoch": 6955} {"train_loss": -27.625396728515625, "global_step": 577283, "epoch": 6955} {"train_loss": -27.849294662475586, "global_step": 577284, "epoch": 6955} {"train_loss": -27.398548126220703, "global_step": 577285, "epoch": 6955} {"train_loss": -27.66570472717285, "global_step": 577286, "epoch": 6955} {"train_loss": -27.60438346862793, "global_step": 577287, "epoch": 6955} {"train_loss": -27.94599723815918, "global_step": 577288, "epoch": 6955} {"train_loss": -27.508880615234375, "global_step": 577289, "epoch": 6955} {"train_loss": -27.83619499206543, "global_step": 577290, "epoch": 6955} {"train_loss": -27.9066162109375, "global_step": 577291, "epoch": 6955} {"train_loss": -27.992029190063477, "global_step": 577292, "epoch": 6955} {"train_loss": -27.967443466186523, "global_step": 577293, "epoch": 6955} {"train_loss": -27.684412002563477, "global_step": 577294, "epoch": 6955} {"train_loss": -28.020612716674805, "global_step": 577295, "epoch": 6955} {"train_loss": -27.60883903503418, "global_step": 577296, "epoch": 6955} {"train_loss": -27.826887130737305, "global_step": 577297, "epoch": 6955} {"train_loss": -27.865774154663086, "global_step": 577298, "epoch": 6955} {"train_loss": -27.91048240661621, "global_step": 577299, "epoch": 6955} {"train_loss": -27.63148307800293, "global_step": 577300, "epoch": 6955} {"train_loss": -27.83220863342285, "global_step": 577301, "epoch": 6955} {"train_loss": -27.685949325561523, "global_step": 577302, "epoch": 6955} {"train_loss": -27.96649742126465, "global_step": 577303, "epoch": 6955} {"train_loss": -27.924169540405273, "global_step": 577304, "epoch": 6955} {"train_loss": -27.5037784576416, "global_step": 577305, "epoch": 6955} {"train_loss": -27.532424926757812, "global_step": 577306, "epoch": 6955} {"train_loss": -27.741437911987305, "global_step": 577307, "epoch": 6955} {"train_loss": -27.904272079467773, "global_step": 577308, "epoch": 6955} {"train_loss": -27.444894790649414, "global_step": 577309, "epoch": 6955} {"train_loss": -27.69520378112793, "global_step": 577310, "epoch": 6955} {"train_loss": -27.966949462890625, "global_step": 577311, "epoch": 6955} {"train_loss": -28.04542350769043, "global_step": 577312, "epoch": 6955} {"train_loss": -27.9461612701416, "global_step": 577313, "epoch": 6955} {"train_loss": -28.031103134155273, "global_step": 577314, "epoch": 6955} {"train_loss": -27.876544952392578, "global_step": 577315, "epoch": 6955} {"train_loss": -28.350921630859375, "global_step": 577316, "epoch": 6955} {"train_loss": -27.958648681640625, "global_step": 577317, "epoch": 6955} {"train_loss": -28.470829010009766, "global_step": 577318, "epoch": 6955} {"train_loss": -28.02392578125, "global_step": 577319, "epoch": 6955} {"train_loss": -28.3027286529541, "global_step": 577320, "epoch": 6955} {"train_loss": -28.443923950195312, "global_step": 577321, "epoch": 6955} {"train_loss": -28.246082305908203, "global_step": 577322, "epoch": 6955} {"train_loss": -28.152698516845703, "global_step": 577323, "epoch": 6955} {"train_loss": -27.915637969970703, "global_step": 577324, "epoch": 6955} {"train_loss": -28.095932006835938, "global_step": 577325, "epoch": 6955} {"train_loss": -28.162023544311523, "global_step": 577326, "epoch": 6955} {"train_loss": -28.184951782226562, "global_step": 577327, "epoch": 6955} {"train_loss": -28.0494384765625, "global_step": 577328, "epoch": 6955} {"train_loss": -27.765417098999023, "global_step": 577329, "epoch": 6955} {"train_loss": -28.130237579345703, "global_step": 577330, "epoch": 6955} {"train_loss": -27.824634552001953, "global_step": 577331, "epoch": 6955} {"train_loss": -27.802480697631836, "global_step": 577332, "epoch": 6955} {"train_loss": -28.174856185913086, "global_step": 577333, "epoch": 6955} {"train_loss": -28.05218505859375, "global_step": 577334, "epoch": 6955} {"train_loss": -28.11636734008789, "global_step": 577335, "epoch": 6955} {"train_loss": -27.9638614654541, "global_step": 577336, "epoch": 6955} {"train_loss": -28.18289566040039, "global_step": 577337, "epoch": 6955} {"train_loss": -28.2940616607666, "global_step": 577338, "epoch": 6955} {"train_loss": -27.44428825378418, "global_step": 577339, "epoch": 6955} {"train_loss": -28.08188819885254, "global_step": 577340, "epoch": 6955} {"train_loss": -27.909109115600586, "global_step": 577341, "epoch": 6955} {"train_loss": -28.18805503845215, "global_step": 577342, "epoch": 6955} {"train_loss": -27.591821670532227, "global_step": 577343, "epoch": 6955} {"train_loss": -28.11231803894043, "global_step": 577344, "epoch": 6955} {"train_loss": -28.31817626953125, "global_step": 577345, "epoch": 6955} {"train_loss": -28.007186889648438, "global_step": 577346, "epoch": 6955} {"train_loss": -27.799505670386626, "global_step": 577347, "epoch": 6955, "val_loss": 6669530.0} {"train_loss": -26.775238037109375, "global_step": 577348, "epoch": 6956} {"train_loss": -25.544677734375, "global_step": 577349, "epoch": 6956} {"train_loss": -26.253284454345703, "global_step": 577350, "epoch": 6956} {"train_loss": -25.829818725585938, "global_step": 577351, "epoch": 6956} {"train_loss": -26.744916915893555, "global_step": 577352, "epoch": 6956} {"train_loss": -26.819766998291016, "global_step": 577353, "epoch": 6956} {"train_loss": -27.210351943969727, "global_step": 577354, "epoch": 6956} {"train_loss": -26.877399444580078, "global_step": 577355, "epoch": 6956} {"train_loss": -27.2342472076416, "global_step": 577356, "epoch": 6956} {"train_loss": -26.951025009155273, "global_step": 577357, "epoch": 6956} {"train_loss": -26.65213394165039, "global_step": 577358, "epoch": 6956} {"train_loss": -27.404296875, "global_step": 577359, "epoch": 6956} {"train_loss": -27.092578887939453, "global_step": 577360, "epoch": 6956} {"train_loss": -27.47507095336914, "global_step": 577361, "epoch": 6956} {"train_loss": -27.27980613708496, "global_step": 577362, "epoch": 6956} {"train_loss": -27.003931045532227, "global_step": 577363, "epoch": 6956} {"train_loss": -27.408893585205078, "global_step": 577364, "epoch": 6956} {"train_loss": -27.497446060180664, "global_step": 577365, "epoch": 6956} {"train_loss": -27.315649032592773, "global_step": 577366, "epoch": 6956} {"train_loss": -27.36236572265625, "global_step": 577367, "epoch": 6956} {"train_loss": -27.72199821472168, "global_step": 577368, "epoch": 6956} {"train_loss": -27.744037628173828, "global_step": 577369, "epoch": 6956} {"train_loss": -27.7721004486084, "global_step": 577370, "epoch": 6956} {"train_loss": -27.4050350189209, "global_step": 577371, "epoch": 6956} {"train_loss": -27.396717071533203, "global_step": 577372, "epoch": 6956} {"train_loss": -27.68671989440918, "global_step": 577373, "epoch": 6956} {"train_loss": -27.8555908203125, "global_step": 577374, "epoch": 6956} {"train_loss": -27.356536865234375, "global_step": 577375, "epoch": 6956} {"train_loss": -27.517902374267578, "global_step": 577376, "epoch": 6956} {"train_loss": -27.36264991760254, "global_step": 577377, "epoch": 6956} {"train_loss": -27.610950469970703, "global_step": 577378, "epoch": 6956} {"train_loss": -27.8432674407959, "global_step": 577379, "epoch": 6956} {"train_loss": -27.830530166625977, "global_step": 577380, "epoch": 6956} {"train_loss": -27.671600341796875, "global_step": 577381, "epoch": 6956} {"train_loss": -28.077320098876953, "global_step": 577382, "epoch": 6956} {"train_loss": -27.89906120300293, "global_step": 577383, "epoch": 6956} {"train_loss": -28.05389976501465, "global_step": 577384, "epoch": 6956} {"train_loss": -28.155359268188477, "global_step": 577385, "epoch": 6956} {"train_loss": -27.937240600585938, "global_step": 577386, "epoch": 6956} {"train_loss": -28.415674209594727, "global_step": 577387, "epoch": 6956} {"train_loss": -27.9711971282959, "global_step": 577388, "epoch": 6956} {"train_loss": -28.179519653320312, "global_step": 577389, "epoch": 6956} {"train_loss": -27.720632553100586, "global_step": 577390, "epoch": 6956} {"train_loss": -28.0200138092041, "global_step": 577391, "epoch": 6956} {"train_loss": -28.227689743041992, "global_step": 577392, "epoch": 6956} {"train_loss": -27.97053337097168, "global_step": 577393, "epoch": 6956} {"train_loss": -27.90838623046875, "global_step": 577394, "epoch": 6956} {"train_loss": -28.107343673706055, "global_step": 577395, "epoch": 6956} {"train_loss": -28.057422637939453, "global_step": 577396, "epoch": 6956} {"train_loss": -28.20599365234375, "global_step": 577397, "epoch": 6956} {"train_loss": -27.89544105529785, "global_step": 577398, "epoch": 6956} {"train_loss": -28.05177116394043, "global_step": 577399, "epoch": 6956} {"train_loss": -28.28780174255371, "global_step": 577400, "epoch": 6956} {"train_loss": -28.386219024658203, "global_step": 577401, "epoch": 6956} {"train_loss": -28.025775909423828, "global_step": 577402, "epoch": 6956} {"train_loss": -27.85177993774414, "global_step": 577403, "epoch": 6956} {"train_loss": -27.654699325561523, "global_step": 577404, "epoch": 6956} {"train_loss": -27.717382431030273, "global_step": 577405, "epoch": 6956} {"train_loss": -28.026334762573242, "global_step": 577406, "epoch": 6956} {"train_loss": -27.960824966430664, "global_step": 577407, "epoch": 6956} {"train_loss": -27.96766471862793, "global_step": 577408, "epoch": 6956} {"train_loss": -28.05055046081543, "global_step": 577409, "epoch": 6956} {"train_loss": -28.00486183166504, "global_step": 577410, "epoch": 6956} {"train_loss": -28.05122184753418, "global_step": 577411, "epoch": 6956} {"train_loss": -27.62318229675293, "global_step": 577412, "epoch": 6956} {"train_loss": -27.569671630859375, "global_step": 577413, "epoch": 6956} {"train_loss": -27.588430404663086, "global_step": 577414, "epoch": 6956} {"train_loss": -27.669660568237305, "global_step": 577415, "epoch": 6956} {"train_loss": -28.224414825439453, "global_step": 577416, "epoch": 6956} {"train_loss": -27.521665573120117, "global_step": 577417, "epoch": 6956} {"train_loss": -27.865304946899414, "global_step": 577418, "epoch": 6956} {"train_loss": -27.994298934936523, "global_step": 577419, "epoch": 6956} {"train_loss": -27.1975040435791, "global_step": 577420, "epoch": 6956} {"train_loss": -27.728071212768555, "global_step": 577421, "epoch": 6956} {"train_loss": -27.550695419311523, "global_step": 577422, "epoch": 6956} {"train_loss": -27.3331241607666, "global_step": 577423, "epoch": 6956} {"train_loss": -27.590742111206055, "global_step": 577424, "epoch": 6956} {"train_loss": -28.072378158569336, "global_step": 577425, "epoch": 6956} {"train_loss": -27.60491371154785, "global_step": 577426, "epoch": 6956} {"train_loss": -27.445968627929688, "global_step": 577427, "epoch": 6956} {"train_loss": -27.579818725585938, "global_step": 577428, "epoch": 6956} {"train_loss": -27.947546005249023, "global_step": 577429, "epoch": 6956} {"train_loss": -27.610556774828808, "global_step": 577430, "epoch": 6956, "val_loss": 6619603.0} {"train_loss": -26.93955421447754, "global_step": 577431, "epoch": 6957} {"train_loss": -27.437463760375977, "global_step": 577432, "epoch": 6957} {"train_loss": -27.474750518798828, "global_step": 577433, "epoch": 6957} {"train_loss": -27.211889266967773, "global_step": 577434, "epoch": 6957} {"train_loss": -26.908618927001953, "global_step": 577435, "epoch": 6957} {"train_loss": -27.643878936767578, "global_step": 577436, "epoch": 6957} {"train_loss": -27.219533920288086, "global_step": 577437, "epoch": 6957} {"train_loss": -27.287200927734375, "global_step": 577438, "epoch": 6957} {"train_loss": -27.638593673706055, "global_step": 577439, "epoch": 6957} {"train_loss": -27.4151611328125, "global_step": 577440, "epoch": 6957} {"train_loss": -27.180591583251953, "global_step": 577441, "epoch": 6957} {"train_loss": -27.34879493713379, "global_step": 577442, "epoch": 6957} {"train_loss": -27.649961471557617, "global_step": 577443, "epoch": 6957} {"train_loss": -27.660888671875, "global_step": 577444, "epoch": 6957} {"train_loss": -27.544116973876953, "global_step": 577445, "epoch": 6957} {"train_loss": -27.486286163330078, "global_step": 577446, "epoch": 6957} {"train_loss": -27.36036491394043, "global_step": 577447, "epoch": 6957} {"train_loss": -28.058307647705078, "global_step": 577448, "epoch": 6957} {"train_loss": -27.93072509765625, "global_step": 577449, "epoch": 6957} {"train_loss": -27.6547794342041, "global_step": 577450, "epoch": 6957} {"train_loss": -27.992300033569336, "global_step": 577451, "epoch": 6957} {"train_loss": -27.73001480102539, "global_step": 577452, "epoch": 6957} {"train_loss": -27.938379287719727, "global_step": 577453, "epoch": 6957} {"train_loss": -27.693994522094727, "global_step": 577454, "epoch": 6957} {"train_loss": -27.746042251586914, "global_step": 577455, "epoch": 6957} {"train_loss": -27.914154052734375, "global_step": 577456, "epoch": 6957} {"train_loss": -27.871667861938477, "global_step": 577457, "epoch": 6957} {"train_loss": -27.90060806274414, "global_step": 577458, "epoch": 6957} {"train_loss": -27.929670333862305, "global_step": 577459, "epoch": 6957} {"train_loss": -28.20808219909668, "global_step": 577460, "epoch": 6957} {"train_loss": -27.74846839904785, "global_step": 577461, "epoch": 6957} {"train_loss": -27.920413970947266, "global_step": 577462, "epoch": 6957} {"train_loss": -28.0132999420166, "global_step": 577463, "epoch": 6957} {"train_loss": -28.177526473999023, "global_step": 577464, "epoch": 6957} {"train_loss": -27.78706169128418, "global_step": 577465, "epoch": 6957} {"train_loss": -27.998380661010742, "global_step": 577466, "epoch": 6957} {"train_loss": -27.918689727783203, "global_step": 577467, "epoch": 6957} {"train_loss": -28.434589385986328, "global_step": 577468, "epoch": 6957} {"train_loss": -28.130115509033203, "global_step": 577469, "epoch": 6957} {"train_loss": -28.262271881103516, "global_step": 577470, "epoch": 6957} {"train_loss": -28.209943771362305, "global_step": 577471, "epoch": 6957} {"train_loss": -27.820714950561523, "global_step": 577472, "epoch": 6957} {"train_loss": -28.077991485595703, "global_step": 577473, "epoch": 6957} {"train_loss": -28.013883590698242, "global_step": 577474, "epoch": 6957} {"train_loss": -28.2818546295166, "global_step": 577475, "epoch": 6957} {"train_loss": -27.97003173828125, "global_step": 577476, "epoch": 6957} {"train_loss": -28.104816436767578, "global_step": 577477, "epoch": 6957} {"train_loss": -28.154708862304688, "global_step": 577478, "epoch": 6957} {"train_loss": -27.882644653320312, "global_step": 577479, "epoch": 6957} {"train_loss": -27.983062744140625, "global_step": 577480, "epoch": 6957} {"train_loss": -27.330982208251953, "global_step": 577481, "epoch": 6957} {"train_loss": -27.716657638549805, "global_step": 577482, "epoch": 6957} {"train_loss": -27.40744400024414, "global_step": 577483, "epoch": 6957} {"train_loss": -27.79436683654785, "global_step": 577484, "epoch": 6957} {"train_loss": -27.837661743164062, "global_step": 577485, "epoch": 6957} {"train_loss": -27.814956665039062, "global_step": 577486, "epoch": 6957} {"train_loss": -27.654083251953125, "global_step": 577487, "epoch": 6957} {"train_loss": -27.88478660583496, "global_step": 577488, "epoch": 6957} {"train_loss": -27.558393478393555, "global_step": 577489, "epoch": 6957} {"train_loss": -28.123157501220703, "global_step": 577490, "epoch": 6957} {"train_loss": -27.759958267211914, "global_step": 577491, "epoch": 6957} {"train_loss": -28.055185317993164, "global_step": 577492, "epoch": 6957} {"train_loss": -28.1839542388916, "global_step": 577493, "epoch": 6957} {"train_loss": -27.6763916015625, "global_step": 577494, "epoch": 6957} {"train_loss": -28.353872299194336, "global_step": 577495, "epoch": 6957} {"train_loss": -27.918014526367188, "global_step": 577496, "epoch": 6957} {"train_loss": -28.33173179626465, "global_step": 577497, "epoch": 6957} {"train_loss": -28.044458389282227, "global_step": 577498, "epoch": 6957} {"train_loss": -28.312238693237305, "global_step": 577499, "epoch": 6957} {"train_loss": -27.76063346862793, "global_step": 577500, "epoch": 6957} {"train_loss": -28.185903549194336, "global_step": 577501, "epoch": 6957} {"train_loss": -28.222238540649414, "global_step": 577502, "epoch": 6957} {"train_loss": -27.924274444580078, "global_step": 577503, "epoch": 6957} {"train_loss": -28.07795524597168, "global_step": 577504, "epoch": 6957} {"train_loss": -28.005908966064453, "global_step": 577505, "epoch": 6957} {"train_loss": -27.960065841674805, "global_step": 577506, "epoch": 6957} {"train_loss": -28.289936065673828, "global_step": 577507, "epoch": 6957} {"train_loss": -27.794626235961914, "global_step": 577508, "epoch": 6957} {"train_loss": -27.969837188720703, "global_step": 577509, "epoch": 6957} {"train_loss": -28.12940788269043, "global_step": 577510, "epoch": 6957} {"train_loss": -28.00471305847168, "global_step": 577511, "epoch": 6957} {"train_loss": -28.11713981628418, "global_step": 577512, "epoch": 6957} {"train_loss": -27.840460352150792, "global_step": 577513, "epoch": 6957, "val_loss": 6601618.5} {"train_loss": -27.747568130493164, "global_step": 577514, "epoch": 6958} {"train_loss": -27.750715255737305, "global_step": 577515, "epoch": 6958} {"train_loss": -27.712661743164062, "global_step": 577516, "epoch": 6958} {"train_loss": -27.35907554626465, "global_step": 577517, "epoch": 6958} {"train_loss": -27.6636962890625, "global_step": 577518, "epoch": 6958} {"train_loss": -27.713361740112305, "global_step": 577519, "epoch": 6958} {"train_loss": -27.67917251586914, "global_step": 577520, "epoch": 6958} {"train_loss": -27.88727378845215, "global_step": 577521, "epoch": 6958} {"train_loss": -27.8026065826416, "global_step": 577522, "epoch": 6958} {"train_loss": -27.549741744995117, "global_step": 577523, "epoch": 6958} {"train_loss": -27.1799373626709, "global_step": 577524, "epoch": 6958} {"train_loss": -27.464435577392578, "global_step": 577525, "epoch": 6958} {"train_loss": -27.497394561767578, "global_step": 577526, "epoch": 6958} {"train_loss": -27.76604652404785, "global_step": 577527, "epoch": 6958} {"train_loss": -27.696706771850586, "global_step": 577528, "epoch": 6958} {"train_loss": -27.817157745361328, "global_step": 577529, "epoch": 6958} {"train_loss": -27.458454132080078, "global_step": 577530, "epoch": 6958} {"train_loss": -27.556283950805664, "global_step": 577531, "epoch": 6958} {"train_loss": -27.3878116607666, "global_step": 577532, "epoch": 6958} {"train_loss": -27.520938873291016, "global_step": 577533, "epoch": 6958} {"train_loss": -28.1204891204834, "global_step": 577534, "epoch": 6958} {"train_loss": -27.793659210205078, "global_step": 577535, "epoch": 6958} {"train_loss": -28.014617919921875, "global_step": 577536, "epoch": 6958} {"train_loss": -27.577802658081055, "global_step": 577537, "epoch": 6958} {"train_loss": -28.15166664123535, "global_step": 577538, "epoch": 6958} {"train_loss": -28.062780380249023, "global_step": 577539, "epoch": 6958} {"train_loss": -27.869476318359375, "global_step": 577540, "epoch": 6958} {"train_loss": -27.853479385375977, "global_step": 577541, "epoch": 6958} {"train_loss": -27.370407104492188, "global_step": 577542, "epoch": 6958} {"train_loss": -27.889020919799805, "global_step": 577543, "epoch": 6958} {"train_loss": -27.880048751831055, "global_step": 577544, "epoch": 6958} {"train_loss": -28.165922164916992, "global_step": 577545, "epoch": 6958} {"train_loss": -27.874908447265625, "global_step": 577546, "epoch": 6958} {"train_loss": -28.188888549804688, "global_step": 577547, "epoch": 6958} {"train_loss": -27.9047908782959, "global_step": 577548, "epoch": 6958} {"train_loss": -28.3311710357666, "global_step": 577549, "epoch": 6958} {"train_loss": -28.00086784362793, "global_step": 577550, "epoch": 6958} {"train_loss": -27.84754753112793, "global_step": 577551, "epoch": 6958} {"train_loss": -27.927480697631836, "global_step": 577552, "epoch": 6958} {"train_loss": -27.718774795532227, "global_step": 577553, "epoch": 6958} {"train_loss": -27.827686309814453, "global_step": 577554, "epoch": 6958} {"train_loss": -28.03485107421875, "global_step": 577555, "epoch": 6958} {"train_loss": -27.839277267456055, "global_step": 577556, "epoch": 6958} {"train_loss": -28.02033042907715, "global_step": 577557, "epoch": 6958} {"train_loss": -28.169042587280273, "global_step": 577558, "epoch": 6958} {"train_loss": -27.775781631469727, "global_step": 577559, "epoch": 6958} {"train_loss": -27.942703247070312, "global_step": 577560, "epoch": 6958} {"train_loss": -27.89468765258789, "global_step": 577561, "epoch": 6958} {"train_loss": -28.214080810546875, "global_step": 577562, "epoch": 6958} {"train_loss": -28.427839279174805, "global_step": 577563, "epoch": 6958} {"train_loss": -27.9842529296875, "global_step": 577564, "epoch": 6958} {"train_loss": -28.104475021362305, "global_step": 577565, "epoch": 6958} {"train_loss": -27.9747314453125, "global_step": 577566, "epoch": 6958} {"train_loss": -27.87677574157715, "global_step": 577567, "epoch": 6958} {"train_loss": -28.174392700195312, "global_step": 577568, "epoch": 6958} {"train_loss": -27.767908096313477, "global_step": 577569, "epoch": 6958} {"train_loss": -27.967395782470703, "global_step": 577570, "epoch": 6958} {"train_loss": -27.82024574279785, "global_step": 577571, "epoch": 6958} {"train_loss": -27.806665420532227, "global_step": 577572, "epoch": 6958} {"train_loss": -28.18794822692871, "global_step": 577573, "epoch": 6958} {"train_loss": -28.24838638305664, "global_step": 577574, "epoch": 6958} {"train_loss": -28.505172729492188, "global_step": 577575, "epoch": 6958} {"train_loss": -28.310083389282227, "global_step": 577576, "epoch": 6958} {"train_loss": -28.02473258972168, "global_step": 577577, "epoch": 6958} {"train_loss": -27.859827041625977, "global_step": 577578, "epoch": 6958} {"train_loss": -28.214574813842773, "global_step": 577579, "epoch": 6958} {"train_loss": -27.921894073486328, "global_step": 577580, "epoch": 6958} {"train_loss": -27.74561882019043, "global_step": 577581, "epoch": 6958} {"train_loss": -27.741342544555664, "global_step": 577582, "epoch": 6958} {"train_loss": -27.69647216796875, "global_step": 577583, "epoch": 6958} {"train_loss": -28.015974044799805, "global_step": 577584, "epoch": 6958} {"train_loss": -27.987180709838867, "global_step": 577585, "epoch": 6958} {"train_loss": -27.774433135986328, "global_step": 577586, "epoch": 6958} {"train_loss": -28.001407623291016, "global_step": 577587, "epoch": 6958} {"train_loss": -27.4534969329834, "global_step": 577588, "epoch": 6958} {"train_loss": -27.763940811157227, "global_step": 577589, "epoch": 6958} {"train_loss": -28.12122917175293, "global_step": 577590, "epoch": 6958} {"train_loss": -27.717870712280273, "global_step": 577591, "epoch": 6958} {"train_loss": -27.235797882080078, "global_step": 577592, "epoch": 6958} {"train_loss": -27.863758087158203, "global_step": 577593, "epoch": 6958} {"train_loss": -27.627197265625, "global_step": 577594, "epoch": 6958} {"train_loss": -27.354354858398438, "global_step": 577595, "epoch": 6958} {"train_loss": -27.852216490780016, "global_step": 577596, "epoch": 6958, "val_loss": 6564460.5} {"train_loss": -26.397607803344727, "global_step": 577597, "epoch": 6959} {"train_loss": -26.74277114868164, "global_step": 577598, "epoch": 6959} {"train_loss": -26.146148681640625, "global_step": 577599, "epoch": 6959} {"train_loss": -26.42095947265625, "global_step": 577600, "epoch": 6959} {"train_loss": -25.849567413330078, "global_step": 577601, "epoch": 6959} {"train_loss": -26.909658432006836, "global_step": 577602, "epoch": 6959} {"train_loss": -26.88129234313965, "global_step": 577603, "epoch": 6959} {"train_loss": -27.120288848876953, "global_step": 577604, "epoch": 6959} {"train_loss": -26.527210235595703, "global_step": 577605, "epoch": 6959} {"train_loss": -26.968536376953125, "global_step": 577606, "epoch": 6959} {"train_loss": -27.05289649963379, "global_step": 577607, "epoch": 6959} {"train_loss": -26.819684982299805, "global_step": 577608, "epoch": 6959} {"train_loss": -26.893564224243164, "global_step": 577609, "epoch": 6959} {"train_loss": -26.84499168395996, "global_step": 577610, "epoch": 6959} {"train_loss": -27.124052047729492, "global_step": 577611, "epoch": 6959} {"train_loss": -27.23384666442871, "global_step": 577612, "epoch": 6959} {"train_loss": -27.889028549194336, "global_step": 577613, "epoch": 6959} {"train_loss": -27.19904899597168, "global_step": 577614, "epoch": 6959} {"train_loss": -27.66754150390625, "global_step": 577615, "epoch": 6959} {"train_loss": -27.41817283630371, "global_step": 577616, "epoch": 6959} {"train_loss": -27.193151473999023, "global_step": 577617, "epoch": 6959} {"train_loss": -27.224201202392578, "global_step": 577618, "epoch": 6959} {"train_loss": -27.36834144592285, "global_step": 577619, "epoch": 6959} {"train_loss": -27.652210235595703, "global_step": 577620, "epoch": 6959} {"train_loss": -27.65093994140625, "global_step": 577621, "epoch": 6959} {"train_loss": -27.469396591186523, "global_step": 577622, "epoch": 6959} {"train_loss": -27.24285316467285, "global_step": 577623, "epoch": 6959} {"train_loss": -27.534442901611328, "global_step": 577624, "epoch": 6959} {"train_loss": -27.48518180847168, "global_step": 577625, "epoch": 6959} {"train_loss": -27.937551498413086, "global_step": 577626, "epoch": 6959} {"train_loss": -27.830326080322266, "global_step": 577627, "epoch": 6959} {"train_loss": -27.724700927734375, "global_step": 577628, "epoch": 6959} {"train_loss": -27.87843132019043, "global_step": 577629, "epoch": 6959} {"train_loss": -28.0950984954834, "global_step": 577630, "epoch": 6959} {"train_loss": -27.760168075561523, "global_step": 577631, "epoch": 6959} {"train_loss": -28.1624755859375, "global_step": 577632, "epoch": 6959} {"train_loss": -27.931549072265625, "global_step": 577633, "epoch": 6959} {"train_loss": -27.886188507080078, "global_step": 577634, "epoch": 6959} {"train_loss": -28.05527687072754, "global_step": 577635, "epoch": 6959} {"train_loss": -27.82673454284668, "global_step": 577636, "epoch": 6959} {"train_loss": -28.17022705078125, "global_step": 577637, "epoch": 6959} {"train_loss": -27.95699119567871, "global_step": 577638, "epoch": 6959} {"train_loss": -28.103742599487305, "global_step": 577639, "epoch": 6959} {"train_loss": -27.610458374023438, "global_step": 577640, "epoch": 6959} {"train_loss": -28.029403686523438, "global_step": 577641, "epoch": 6959} {"train_loss": -28.241003036499023, "global_step": 577642, "epoch": 6959} {"train_loss": -27.899600982666016, "global_step": 577643, "epoch": 6959} {"train_loss": -28.181867599487305, "global_step": 577644, "epoch": 6959} {"train_loss": -28.13772964477539, "global_step": 577645, "epoch": 6959} {"train_loss": -28.172626495361328, "global_step": 577646, "epoch": 6959} {"train_loss": -28.05743408203125, "global_step": 577647, "epoch": 6959} {"train_loss": -28.121509552001953, "global_step": 577648, "epoch": 6959} {"train_loss": -28.05299186706543, "global_step": 577649, "epoch": 6959} {"train_loss": -28.2183780670166, "global_step": 577650, "epoch": 6959} {"train_loss": -28.052770614624023, "global_step": 577651, "epoch": 6959} {"train_loss": -27.77009391784668, "global_step": 577652, "epoch": 6959} {"train_loss": -28.373218536376953, "global_step": 577653, "epoch": 6959} {"train_loss": -28.235076904296875, "global_step": 577654, "epoch": 6959} {"train_loss": -28.101642608642578, "global_step": 577655, "epoch": 6959} {"train_loss": -27.92374038696289, "global_step": 577656, "epoch": 6959} {"train_loss": -28.06400489807129, "global_step": 577657, "epoch": 6959} {"train_loss": -28.199832916259766, "global_step": 577658, "epoch": 6959} {"train_loss": -28.05854606628418, "global_step": 577659, "epoch": 6959} {"train_loss": -27.83234977722168, "global_step": 577660, "epoch": 6959} {"train_loss": -27.923681259155273, "global_step": 577661, "epoch": 6959} {"train_loss": -28.05609703063965, "global_step": 577662, "epoch": 6959} {"train_loss": -28.215229034423828, "global_step": 577663, "epoch": 6959} {"train_loss": -27.919401168823242, "global_step": 577664, "epoch": 6959} {"train_loss": -28.214096069335938, "global_step": 577665, "epoch": 6959} {"train_loss": -28.244550704956055, "global_step": 577666, "epoch": 6959} {"train_loss": -28.319787979125977, "global_step": 577667, "epoch": 6959} {"train_loss": -28.404821395874023, "global_step": 577668, "epoch": 6959} {"train_loss": -28.244232177734375, "global_step": 577669, "epoch": 6959} {"train_loss": -28.2733211517334, "global_step": 577670, "epoch": 6959} {"train_loss": -28.114927291870117, "global_step": 577671, "epoch": 6959} {"train_loss": -27.933216094970703, "global_step": 577672, "epoch": 6959} {"train_loss": -28.37060546875, "global_step": 577673, "epoch": 6959} {"train_loss": -28.315982818603516, "global_step": 577674, "epoch": 6959} {"train_loss": -27.4960994720459, "global_step": 577675, "epoch": 6959} {"train_loss": -27.473957061767578, "global_step": 577676, "epoch": 6959} {"train_loss": -27.63978385925293, "global_step": 577677, "epoch": 6959} {"train_loss": -27.87188148498535, "global_step": 577678, "epoch": 6959} {"train_loss": -27.6885888892484, "global_step": 577679, "epoch": 6959, "val_loss": 6542113.0} {"train_loss": -25.42466163635254, "global_step": 577680, "epoch": 6960} {"train_loss": -20.582324981689453, "global_step": 577681, "epoch": 6960} {"train_loss": -22.138845443725586, "global_step": 577682, "epoch": 6960} {"train_loss": -25.113412857055664, "global_step": 577683, "epoch": 6960} {"train_loss": -20.602909088134766, "global_step": 577684, "epoch": 6960} {"train_loss": -23.92935562133789, "global_step": 577685, "epoch": 6960} {"train_loss": -23.57137107849121, "global_step": 577686, "epoch": 6960} {"train_loss": -25.236318588256836, "global_step": 577687, "epoch": 6960} {"train_loss": -22.875782012939453, "global_step": 577688, "epoch": 6960} {"train_loss": -24.601776123046875, "global_step": 577689, "epoch": 6960} {"train_loss": -24.834945678710938, "global_step": 577690, "epoch": 6960} {"train_loss": -25.028539657592773, "global_step": 577691, "epoch": 6960} {"train_loss": -24.815826416015625, "global_step": 577692, "epoch": 6960} {"train_loss": -25.487686157226562, "global_step": 577693, "epoch": 6960} {"train_loss": -25.663232803344727, "global_step": 577694, "epoch": 6960} {"train_loss": -25.284832000732422, "global_step": 577695, "epoch": 6960} {"train_loss": -25.64177894592285, "global_step": 577696, "epoch": 6960} {"train_loss": -25.72283935546875, "global_step": 577697, "epoch": 6960} {"train_loss": -26.08878517150879, "global_step": 577698, "epoch": 6960} {"train_loss": -25.72373390197754, "global_step": 577699, "epoch": 6960} {"train_loss": -25.96966552734375, "global_step": 577700, "epoch": 6960} {"train_loss": -25.701004028320312, "global_step": 577701, "epoch": 6960} {"train_loss": -26.160749435424805, "global_step": 577702, "epoch": 6960} {"train_loss": -26.0181827545166, "global_step": 577703, "epoch": 6960} {"train_loss": -26.157119750976562, "global_step": 577704, "epoch": 6960} {"train_loss": -26.116226196289062, "global_step": 577705, "epoch": 6960} {"train_loss": -25.87403678894043, "global_step": 577706, "epoch": 6960} {"train_loss": -26.20490837097168, "global_step": 577707, "epoch": 6960} {"train_loss": -26.483572006225586, "global_step": 577708, "epoch": 6960} {"train_loss": -26.60809898376465, "global_step": 577709, "epoch": 6960} {"train_loss": -26.605457305908203, "global_step": 577710, "epoch": 6960} {"train_loss": -26.871606826782227, "global_step": 577711, "epoch": 6960} {"train_loss": -26.63800621032715, "global_step": 577712, "epoch": 6960} {"train_loss": -26.915693283081055, "global_step": 577713, "epoch": 6960} {"train_loss": -26.775501251220703, "global_step": 577714, "epoch": 6960} {"train_loss": -26.542255401611328, "global_step": 577715, "epoch": 6960} {"train_loss": -26.46173095703125, "global_step": 577716, "epoch": 6960} {"train_loss": -26.648242950439453, "global_step": 577717, "epoch": 6960} {"train_loss": -26.39253807067871, "global_step": 577718, "epoch": 6960} {"train_loss": -26.759906768798828, "global_step": 577719, "epoch": 6960} {"train_loss": -27.354429244995117, "global_step": 577720, "epoch": 6960} {"train_loss": -27.129873275756836, "global_step": 577721, "epoch": 6960} {"train_loss": -27.022506713867188, "global_step": 577722, "epoch": 6960} {"train_loss": -26.95011329650879, "global_step": 577723, "epoch": 6960} {"train_loss": -27.093536376953125, "global_step": 577724, "epoch": 6960} {"train_loss": -27.00507164001465, "global_step": 577725, "epoch": 6960} {"train_loss": -27.262540817260742, "global_step": 577726, "epoch": 6960} {"train_loss": -27.1738224029541, "global_step": 577727, "epoch": 6960} {"train_loss": -27.190351486206055, "global_step": 577728, "epoch": 6960} {"train_loss": -27.465051651000977, "global_step": 577729, "epoch": 6960} {"train_loss": -27.2941837310791, "global_step": 577730, "epoch": 6960} {"train_loss": -27.384260177612305, "global_step": 577731, "epoch": 6960} {"train_loss": -27.485315322875977, "global_step": 577732, "epoch": 6960} {"train_loss": -27.5115966796875, "global_step": 577733, "epoch": 6960} {"train_loss": -27.872339248657227, "global_step": 577734, "epoch": 6960} {"train_loss": -27.158283233642578, "global_step": 577735, "epoch": 6960} {"train_loss": -27.42127799987793, "global_step": 577736, "epoch": 6960} {"train_loss": -27.604129791259766, "global_step": 577737, "epoch": 6960} {"train_loss": -27.841873168945312, "global_step": 577738, "epoch": 6960} {"train_loss": -27.65461540222168, "global_step": 577739, "epoch": 6960} {"train_loss": -27.96954917907715, "global_step": 577740, "epoch": 6960} {"train_loss": -27.649580001831055, "global_step": 577741, "epoch": 6960} {"train_loss": -27.3472900390625, "global_step": 577742, "epoch": 6960} {"train_loss": -27.790603637695312, "global_step": 577743, "epoch": 6960} {"train_loss": -27.914443969726562, "global_step": 577744, "epoch": 6960} {"train_loss": -27.493473052978516, "global_step": 577745, "epoch": 6960} {"train_loss": -28.19414710998535, "global_step": 577746, "epoch": 6960} {"train_loss": -27.600723266601562, "global_step": 577747, "epoch": 6960} {"train_loss": -27.809778213500977, "global_step": 577748, "epoch": 6960} {"train_loss": -27.916967391967773, "global_step": 577749, "epoch": 6960} {"train_loss": -28.038232803344727, "global_step": 577750, "epoch": 6960} {"train_loss": -27.735828399658203, "global_step": 577751, "epoch": 6960} {"train_loss": -27.827472686767578, "global_step": 577752, "epoch": 6960} {"train_loss": -27.739694595336914, "global_step": 577753, "epoch": 6960} {"train_loss": -27.636926651000977, "global_step": 577754, "epoch": 6960} {"train_loss": -27.70794677734375, "global_step": 577755, "epoch": 6960} {"train_loss": -27.896270751953125, "global_step": 577756, "epoch": 6960} {"train_loss": -27.865468978881836, "global_step": 577757, "epoch": 6960} {"train_loss": -28.393945693969727, "global_step": 577758, "epoch": 6960} {"train_loss": -27.923171997070312, "global_step": 577759, "epoch": 6960} {"train_loss": -27.642215728759766, "global_step": 577760, "epoch": 6960} {"train_loss": -27.950824737548828, "global_step": 577761, "epoch": 6960} {"train_loss": -26.534461975097656, "global_step": 577762, "epoch": 6960, "val_loss": 6551992.5} {"train_loss": -27.647571563720703, "global_step": 577763, "epoch": 6961} {"train_loss": -27.54728126525879, "global_step": 577764, "epoch": 6961} {"train_loss": -28.186431884765625, "global_step": 577765, "epoch": 6961} {"train_loss": -27.613935470581055, "global_step": 577766, "epoch": 6961} {"train_loss": -27.973358154296875, "global_step": 577767, "epoch": 6961} {"train_loss": -27.798635482788086, "global_step": 577768, "epoch": 6961} {"train_loss": -27.58282470703125, "global_step": 577769, "epoch": 6961} {"train_loss": -27.804990768432617, "global_step": 577770, "epoch": 6961} {"train_loss": -27.61787223815918, "global_step": 577771, "epoch": 6961} {"train_loss": -27.822467803955078, "global_step": 577772, "epoch": 6961} {"train_loss": -27.942087173461914, "global_step": 577773, "epoch": 6961} {"train_loss": -27.76092529296875, "global_step": 577774, "epoch": 6961} {"train_loss": -27.971023559570312, "global_step": 577775, "epoch": 6961} {"train_loss": -28.022144317626953, "global_step": 577776, "epoch": 6961} {"train_loss": -27.588687896728516, "global_step": 577777, "epoch": 6961} {"train_loss": -28.06990623474121, "global_step": 577778, "epoch": 6961} {"train_loss": -27.65091323852539, "global_step": 577779, "epoch": 6961} {"train_loss": -27.871118545532227, "global_step": 577780, "epoch": 6961} {"train_loss": -27.88010597229004, "global_step": 577781, "epoch": 6961} {"train_loss": -27.593488693237305, "global_step": 577782, "epoch": 6961} {"train_loss": -28.0535831451416, "global_step": 577783, "epoch": 6961} {"train_loss": -27.83405876159668, "global_step": 577784, "epoch": 6961} {"train_loss": -28.01325035095215, "global_step": 577785, "epoch": 6961} {"train_loss": -27.9642333984375, "global_step": 577786, "epoch": 6961} {"train_loss": -28.071069717407227, "global_step": 577787, "epoch": 6961} {"train_loss": -27.714624404907227, "global_step": 577788, "epoch": 6961} {"train_loss": -27.915485382080078, "global_step": 577789, "epoch": 6961} {"train_loss": -27.944461822509766, "global_step": 577790, "epoch": 6961} {"train_loss": -27.858991622924805, "global_step": 577791, "epoch": 6961} {"train_loss": -27.742578506469727, "global_step": 577792, "epoch": 6961} {"train_loss": -27.695886611938477, "global_step": 577793, "epoch": 6961} {"train_loss": -27.9411563873291, "global_step": 577794, "epoch": 6961} {"train_loss": -28.004484176635742, "global_step": 577795, "epoch": 6961} {"train_loss": -27.9510498046875, "global_step": 577796, "epoch": 6961} {"train_loss": -27.813247680664062, "global_step": 577797, "epoch": 6961} {"train_loss": -27.837865829467773, "global_step": 577798, "epoch": 6961} {"train_loss": -28.378116607666016, "global_step": 577799, "epoch": 6961} {"train_loss": -27.66779899597168, "global_step": 577800, "epoch": 6961} {"train_loss": -28.132043838500977, "global_step": 577801, "epoch": 6961} {"train_loss": -28.058292388916016, "global_step": 577802, "epoch": 6961} {"train_loss": -27.99688148498535, "global_step": 577803, "epoch": 6961} {"train_loss": -28.214405059814453, "global_step": 577804, "epoch": 6961} {"train_loss": -28.267560958862305, "global_step": 577805, "epoch": 6961} {"train_loss": -28.217636108398438, "global_step": 577806, "epoch": 6961} {"train_loss": -27.81597900390625, "global_step": 577807, "epoch": 6961} {"train_loss": -28.029516220092773, "global_step": 577808, "epoch": 6961} {"train_loss": -28.14788246154785, "global_step": 577809, "epoch": 6961} {"train_loss": -27.956846237182617, "global_step": 577810, "epoch": 6961} {"train_loss": -28.194721221923828, "global_step": 577811, "epoch": 6961} {"train_loss": -27.549001693725586, "global_step": 577812, "epoch": 6961} {"train_loss": -27.951391220092773, "global_step": 577813, "epoch": 6961} {"train_loss": -27.682321548461914, "global_step": 577814, "epoch": 6961} {"train_loss": -28.111618041992188, "global_step": 577815, "epoch": 6961} {"train_loss": -28.08022117614746, "global_step": 577816, "epoch": 6961} {"train_loss": -27.654958724975586, "global_step": 577817, "epoch": 6961} {"train_loss": -27.790395736694336, "global_step": 577818, "epoch": 6961} {"train_loss": -28.02496337890625, "global_step": 577819, "epoch": 6961} {"train_loss": -28.34341812133789, "global_step": 577820, "epoch": 6961} {"train_loss": -27.99249267578125, "global_step": 577821, "epoch": 6961} {"train_loss": -27.993520736694336, "global_step": 577822, "epoch": 6961} {"train_loss": -27.441980361938477, "global_step": 577823, "epoch": 6961} {"train_loss": -27.804046630859375, "global_step": 577824, "epoch": 6961} {"train_loss": -27.934919357299805, "global_step": 577825, "epoch": 6961} {"train_loss": -27.770416259765625, "global_step": 577826, "epoch": 6961} {"train_loss": -26.991117477416992, "global_step": 577827, "epoch": 6961} {"train_loss": -27.513233184814453, "global_step": 577828, "epoch": 6961} {"train_loss": -27.199438095092773, "global_step": 577829, "epoch": 6961} {"train_loss": -26.760412216186523, "global_step": 577830, "epoch": 6961} {"train_loss": -27.560047149658203, "global_step": 577831, "epoch": 6961} {"train_loss": -27.25508689880371, "global_step": 577832, "epoch": 6961} {"train_loss": -27.63167381286621, "global_step": 577833, "epoch": 6961} {"train_loss": -27.266565322875977, "global_step": 577834, "epoch": 6961} {"train_loss": -27.36677360534668, "global_step": 577835, "epoch": 6961} {"train_loss": -27.64044761657715, "global_step": 577836, "epoch": 6961} {"train_loss": -27.471765518188477, "global_step": 577837, "epoch": 6961} {"train_loss": -27.332639694213867, "global_step": 577838, "epoch": 6961} {"train_loss": -27.87531089782715, "global_step": 577839, "epoch": 6961} {"train_loss": -27.965152740478516, "global_step": 577840, "epoch": 6961} {"train_loss": -27.468246459960938, "global_step": 577841, "epoch": 6961} {"train_loss": -27.759580612182617, "global_step": 577842, "epoch": 6961} {"train_loss": -27.8776912689209, "global_step": 577843, "epoch": 6961} {"train_loss": -28.28775978088379, "global_step": 577844, "epoch": 6961} {"train_loss": -27.829613880938794, "global_step": 577845, "epoch": 6961, "val_loss": 6615476.0} {"train_loss": -27.37196922302246, "global_step": 577846, "epoch": 6962} {"train_loss": -27.06534767150879, "global_step": 577847, "epoch": 6962} {"train_loss": -27.170658111572266, "global_step": 577848, "epoch": 6962} {"train_loss": -26.68845558166504, "global_step": 577849, "epoch": 6962} {"train_loss": -27.035064697265625, "global_step": 577850, "epoch": 6962} {"train_loss": -27.334394454956055, "global_step": 577851, "epoch": 6962} {"train_loss": -27.275924682617188, "global_step": 577852, "epoch": 6962} {"train_loss": -27.214609146118164, "global_step": 577853, "epoch": 6962} {"train_loss": -27.440587997436523, "global_step": 577854, "epoch": 6962} {"train_loss": -26.840620040893555, "global_step": 577855, "epoch": 6962} {"train_loss": -27.200244903564453, "global_step": 577856, "epoch": 6962} {"train_loss": -27.35389518737793, "global_step": 577857, "epoch": 6962} {"train_loss": -27.272552490234375, "global_step": 577858, "epoch": 6962} {"train_loss": -27.555011749267578, "global_step": 577859, "epoch": 6962} {"train_loss": -27.434186935424805, "global_step": 577860, "epoch": 6962} {"train_loss": -27.53983497619629, "global_step": 577861, "epoch": 6962} {"train_loss": -27.601926803588867, "global_step": 577862, "epoch": 6962} {"train_loss": -27.332305908203125, "global_step": 577863, "epoch": 6962} {"train_loss": -27.791486740112305, "global_step": 577864, "epoch": 6962} {"train_loss": -27.494863510131836, "global_step": 577865, "epoch": 6962} {"train_loss": -27.783100128173828, "global_step": 577866, "epoch": 6962} {"train_loss": -27.882068634033203, "global_step": 577867, "epoch": 6962} {"train_loss": -27.7027587890625, "global_step": 577868, "epoch": 6962} {"train_loss": -27.503341674804688, "global_step": 577869, "epoch": 6962} {"train_loss": -27.672616958618164, "global_step": 577870, "epoch": 6962} {"train_loss": -27.468175888061523, "global_step": 577871, "epoch": 6962} {"train_loss": -28.047870635986328, "global_step": 577872, "epoch": 6962} {"train_loss": -27.603361129760742, "global_step": 577873, "epoch": 6962} {"train_loss": -27.858320236206055, "global_step": 577874, "epoch": 6962} {"train_loss": -27.6732177734375, "global_step": 577875, "epoch": 6962} {"train_loss": -27.823057174682617, "global_step": 577876, "epoch": 6962} {"train_loss": -27.68768310546875, "global_step": 577877, "epoch": 6962} {"train_loss": -27.71070671081543, "global_step": 577878, "epoch": 6962} {"train_loss": -27.853656768798828, "global_step": 577879, "epoch": 6962} {"train_loss": -28.120864868164062, "global_step": 577880, "epoch": 6962} {"train_loss": -27.85812759399414, "global_step": 577881, "epoch": 6962} {"train_loss": -27.982803344726562, "global_step": 577882, "epoch": 6962} {"train_loss": -27.888452529907227, "global_step": 577883, "epoch": 6962} {"train_loss": -28.164899826049805, "global_step": 577884, "epoch": 6962} {"train_loss": -28.1248779296875, "global_step": 577885, "epoch": 6962} {"train_loss": -27.886920928955078, "global_step": 577886, "epoch": 6962} {"train_loss": -27.672056198120117, "global_step": 577887, "epoch": 6962} {"train_loss": -27.99627113342285, "global_step": 577888, "epoch": 6962} {"train_loss": -27.79843521118164, "global_step": 577889, "epoch": 6962} {"train_loss": -27.900522232055664, "global_step": 577890, "epoch": 6962} {"train_loss": -27.968704223632812, "global_step": 577891, "epoch": 6962} {"train_loss": -28.40913200378418, "global_step": 577892, "epoch": 6962} {"train_loss": -27.719648361206055, "global_step": 577893, "epoch": 6962} {"train_loss": -28.098785400390625, "global_step": 577894, "epoch": 6962} {"train_loss": -28.3441162109375, "global_step": 577895, "epoch": 6962} {"train_loss": -28.3242130279541, "global_step": 577896, "epoch": 6962} {"train_loss": -28.012088775634766, "global_step": 577897, "epoch": 6962} {"train_loss": -28.399534225463867, "global_step": 577898, "epoch": 6962} {"train_loss": -28.10184097290039, "global_step": 577899, "epoch": 6962} {"train_loss": -28.215612411499023, "global_step": 577900, "epoch": 6962} {"train_loss": -28.43625831604004, "global_step": 577901, "epoch": 6962} {"train_loss": -28.30267333984375, "global_step": 577902, "epoch": 6962} {"train_loss": -28.1560115814209, "global_step": 577903, "epoch": 6962} {"train_loss": -28.040327072143555, "global_step": 577904, "epoch": 6962} {"train_loss": -28.306045532226562, "global_step": 577905, "epoch": 6962} {"train_loss": -27.63483238220215, "global_step": 577906, "epoch": 6962} {"train_loss": -28.203907012939453, "global_step": 577907, "epoch": 6962} {"train_loss": -27.848438262939453, "global_step": 577908, "epoch": 6962} {"train_loss": -28.163497924804688, "global_step": 577909, "epoch": 6962} {"train_loss": -28.11024284362793, "global_step": 577910, "epoch": 6962} {"train_loss": -28.393482208251953, "global_step": 577911, "epoch": 6962} {"train_loss": -28.01267433166504, "global_step": 577912, "epoch": 6962} {"train_loss": -28.03944206237793, "global_step": 577913, "epoch": 6962} {"train_loss": -27.87188720703125, "global_step": 577914, "epoch": 6962} {"train_loss": -28.242145538330078, "global_step": 577915, "epoch": 6962} {"train_loss": -27.703527450561523, "global_step": 577916, "epoch": 6962} {"train_loss": -27.832006454467773, "global_step": 577917, "epoch": 6962} {"train_loss": -27.84500503540039, "global_step": 577918, "epoch": 6962} {"train_loss": -28.05036735534668, "global_step": 577919, "epoch": 6962} {"train_loss": -27.93603515625, "global_step": 577920, "epoch": 6962} {"train_loss": -27.8362979888916, "global_step": 577921, "epoch": 6962} {"train_loss": -27.889707565307617, "global_step": 577922, "epoch": 6962} {"train_loss": -28.005659103393555, "global_step": 577923, "epoch": 6962} {"train_loss": -27.839731216430664, "global_step": 577924, "epoch": 6962} {"train_loss": -28.188318252563477, "global_step": 577925, "epoch": 6962} {"train_loss": -27.831256866455078, "global_step": 577926, "epoch": 6962} {"train_loss": -27.531763076782227, "global_step": 577927, "epoch": 6962} {"train_loss": -27.79970460914704, "global_step": 577928, "epoch": 6962, "val_loss": 6579285.0} {"train_loss": -27.74563980102539, "global_step": 577929, "epoch": 6963} {"train_loss": -27.631921768188477, "global_step": 577930, "epoch": 6963} {"train_loss": -27.526508331298828, "global_step": 577931, "epoch": 6963} {"train_loss": -27.4835262298584, "global_step": 577932, "epoch": 6963} {"train_loss": -27.56218910217285, "global_step": 577933, "epoch": 6963} {"train_loss": -27.747421264648438, "global_step": 577934, "epoch": 6963} {"train_loss": -27.48615837097168, "global_step": 577935, "epoch": 6963} {"train_loss": -27.904264450073242, "global_step": 577936, "epoch": 6963} {"train_loss": -27.559234619140625, "global_step": 577937, "epoch": 6963} {"train_loss": -27.796194076538086, "global_step": 577938, "epoch": 6963} {"train_loss": -27.598020553588867, "global_step": 577939, "epoch": 6963} {"train_loss": -27.85991859436035, "global_step": 577940, "epoch": 6963} {"train_loss": -28.046491622924805, "global_step": 577941, "epoch": 6963} {"train_loss": -27.908447265625, "global_step": 577942, "epoch": 6963} {"train_loss": -28.00125503540039, "global_step": 577943, "epoch": 6963} {"train_loss": -27.51112937927246, "global_step": 577944, "epoch": 6963} {"train_loss": -27.70624351501465, "global_step": 577945, "epoch": 6963} {"train_loss": -27.816415786743164, "global_step": 577946, "epoch": 6963} {"train_loss": -28.331090927124023, "global_step": 577947, "epoch": 6963} {"train_loss": -28.1057071685791, "global_step": 577948, "epoch": 6963} {"train_loss": -27.874967575073242, "global_step": 577949, "epoch": 6963} {"train_loss": -27.58442497253418, "global_step": 577950, "epoch": 6963} {"train_loss": -28.02573585510254, "global_step": 577951, "epoch": 6963} {"train_loss": -27.998554229736328, "global_step": 577952, "epoch": 6963} {"train_loss": -28.23211097717285, "global_step": 577953, "epoch": 6963} {"train_loss": -27.828033447265625, "global_step": 577954, "epoch": 6963} {"train_loss": -27.9746150970459, "global_step": 577955, "epoch": 6963} {"train_loss": -27.93617820739746, "global_step": 577956, "epoch": 6963} {"train_loss": -27.8436279296875, "global_step": 577957, "epoch": 6963} {"train_loss": -27.754180908203125, "global_step": 577958, "epoch": 6963} {"train_loss": -27.729663848876953, "global_step": 577959, "epoch": 6963} {"train_loss": -28.020740509033203, "global_step": 577960, "epoch": 6963} {"train_loss": -27.928625106811523, "global_step": 577961, "epoch": 6963} {"train_loss": -27.8719425201416, "global_step": 577962, "epoch": 6963} {"train_loss": -28.182575225830078, "global_step": 577963, "epoch": 6963} {"train_loss": -27.93231773376465, "global_step": 577964, "epoch": 6963} {"train_loss": -27.890522003173828, "global_step": 577965, "epoch": 6963} {"train_loss": -28.125146865844727, "global_step": 577966, "epoch": 6963} {"train_loss": -28.1463565826416, "global_step": 577967, "epoch": 6963} {"train_loss": -28.244373321533203, "global_step": 577968, "epoch": 6963} {"train_loss": -28.0594482421875, "global_step": 577969, "epoch": 6963} {"train_loss": -28.224782943725586, "global_step": 577970, "epoch": 6963} {"train_loss": -28.208032608032227, "global_step": 577971, "epoch": 6963} {"train_loss": -28.449705123901367, "global_step": 577972, "epoch": 6963} {"train_loss": -28.329526901245117, "global_step": 577973, "epoch": 6963} {"train_loss": -28.058013916015625, "global_step": 577974, "epoch": 6963} {"train_loss": -28.298852920532227, "global_step": 577975, "epoch": 6963} {"train_loss": -28.28030776977539, "global_step": 577976, "epoch": 6963} {"train_loss": -28.055740356445312, "global_step": 577977, "epoch": 6963} {"train_loss": -28.230926513671875, "global_step": 577978, "epoch": 6963} {"train_loss": -28.06879997253418, "global_step": 577979, "epoch": 6963} {"train_loss": -28.117151260375977, "global_step": 577980, "epoch": 6963} {"train_loss": -28.014196395874023, "global_step": 577981, "epoch": 6963} {"train_loss": -28.53433609008789, "global_step": 577982, "epoch": 6963} {"train_loss": -28.082914352416992, "global_step": 577983, "epoch": 6963} {"train_loss": -28.207233428955078, "global_step": 577984, "epoch": 6963} {"train_loss": -27.933515548706055, "global_step": 577985, "epoch": 6963} {"train_loss": -27.79266929626465, "global_step": 577986, "epoch": 6963} {"train_loss": -28.16668701171875, "global_step": 577987, "epoch": 6963} {"train_loss": -28.354475021362305, "global_step": 577988, "epoch": 6963} {"train_loss": -27.164655685424805, "global_step": 577989, "epoch": 6963} {"train_loss": -27.303302764892578, "global_step": 577990, "epoch": 6963} {"train_loss": -27.261951446533203, "global_step": 577991, "epoch": 6963} {"train_loss": -27.653791427612305, "global_step": 577992, "epoch": 6963} {"train_loss": -27.8204402923584, "global_step": 577993, "epoch": 6963} {"train_loss": -27.597620010375977, "global_step": 577994, "epoch": 6963} {"train_loss": -27.71746253967285, "global_step": 577995, "epoch": 6963} {"train_loss": -28.0974063873291, "global_step": 577996, "epoch": 6963} {"train_loss": -27.408344268798828, "global_step": 577997, "epoch": 6963} {"train_loss": -27.976123809814453, "global_step": 577998, "epoch": 6963} {"train_loss": -28.036727905273438, "global_step": 577999, "epoch": 6963} {"train_loss": -27.859272003173828, "global_step": 578000, "epoch": 6963} {"train_loss": -27.792211532592773, "global_step": 578001, "epoch": 6963} {"train_loss": -27.508588790893555, "global_step": 578002, "epoch": 6963} {"train_loss": -27.804031372070312, "global_step": 578003, "epoch": 6963} {"train_loss": -27.611093521118164, "global_step": 578004, "epoch": 6963} {"train_loss": -27.66046714782715, "global_step": 578005, "epoch": 6963} {"train_loss": -27.937454223632812, "global_step": 578006, "epoch": 6963} {"train_loss": -27.53889274597168, "global_step": 578007, "epoch": 6963} {"train_loss": -27.353010177612305, "global_step": 578008, "epoch": 6963} {"train_loss": -28.01300048828125, "global_step": 578009, "epoch": 6963} {"train_loss": -27.843738555908203, "global_step": 578010, "epoch": 6963} {"train_loss": -27.867244559598255, "global_step": 578011, "epoch": 6963, "val_loss": 6457341.5} {"train_loss": -27.15966796875, "global_step": 578012, "epoch": 6964} {"train_loss": -25.083576202392578, "global_step": 578013, "epoch": 6964} {"train_loss": -26.353666305541992, "global_step": 578014, "epoch": 6964} {"train_loss": -27.131357192993164, "global_step": 578015, "epoch": 6964} {"train_loss": -26.479095458984375, "global_step": 578016, "epoch": 6964} {"train_loss": -27.333648681640625, "global_step": 578017, "epoch": 6964} {"train_loss": -26.86404800415039, "global_step": 578018, "epoch": 6964} {"train_loss": -26.970800399780273, "global_step": 578019, "epoch": 6964} {"train_loss": -27.006317138671875, "global_step": 578020, "epoch": 6964} {"train_loss": -27.129322052001953, "global_step": 578021, "epoch": 6964} {"train_loss": -27.191740036010742, "global_step": 578022, "epoch": 6964} {"train_loss": -26.92926597595215, "global_step": 578023, "epoch": 6964} {"train_loss": -26.419553756713867, "global_step": 578024, "epoch": 6964} {"train_loss": -27.315465927124023, "global_step": 578025, "epoch": 6964} {"train_loss": -26.773168563842773, "global_step": 578026, "epoch": 6964} {"train_loss": -27.011615753173828, "global_step": 578027, "epoch": 6964} {"train_loss": -27.420068740844727, "global_step": 578028, "epoch": 6964} {"train_loss": -27.208837509155273, "global_step": 578029, "epoch": 6964} {"train_loss": -27.30854606628418, "global_step": 578030, "epoch": 6964} {"train_loss": -27.6826229095459, "global_step": 578031, "epoch": 6964} {"train_loss": -27.24175453186035, "global_step": 578032, "epoch": 6964} {"train_loss": -27.249326705932617, "global_step": 578033, "epoch": 6964} {"train_loss": -27.368152618408203, "global_step": 578034, "epoch": 6964} {"train_loss": -27.6737003326416, "global_step": 578035, "epoch": 6964} {"train_loss": -27.496479034423828, "global_step": 578036, "epoch": 6964} {"train_loss": -27.724517822265625, "global_step": 578037, "epoch": 6964} {"train_loss": -27.524194717407227, "global_step": 578038, "epoch": 6964} {"train_loss": -27.555158615112305, "global_step": 578039, "epoch": 6964} {"train_loss": -27.9487247467041, "global_step": 578040, "epoch": 6964} {"train_loss": -27.478158950805664, "global_step": 578041, "epoch": 6964} {"train_loss": -27.817596435546875, "global_step": 578042, "epoch": 6964} {"train_loss": -27.454374313354492, "global_step": 578043, "epoch": 6964} {"train_loss": -27.638696670532227, "global_step": 578044, "epoch": 6964} {"train_loss": -27.874805450439453, "global_step": 578045, "epoch": 6964} {"train_loss": -27.628080368041992, "global_step": 578046, "epoch": 6964} {"train_loss": -27.860092163085938, "global_step": 578047, "epoch": 6964} {"train_loss": -27.91865348815918, "global_step": 578048, "epoch": 6964} {"train_loss": -28.003662109375, "global_step": 578049, "epoch": 6964} {"train_loss": -27.844654083251953, "global_step": 578050, "epoch": 6964} {"train_loss": -27.988311767578125, "global_step": 578051, "epoch": 6964} {"train_loss": -27.988788604736328, "global_step": 578052, "epoch": 6964} {"train_loss": -27.85822105407715, "global_step": 578053, "epoch": 6964} {"train_loss": -28.00186538696289, "global_step": 578054, "epoch": 6964} {"train_loss": -27.800626754760742, "global_step": 578055, "epoch": 6964} {"train_loss": -27.9699764251709, "global_step": 578056, "epoch": 6964} {"train_loss": -27.9654483795166, "global_step": 578057, "epoch": 6964} {"train_loss": -28.132604598999023, "global_step": 578058, "epoch": 6964} {"train_loss": -28.109695434570312, "global_step": 578059, "epoch": 6964} {"train_loss": -27.832660675048828, "global_step": 578060, "epoch": 6964} {"train_loss": -28.022008895874023, "global_step": 578061, "epoch": 6964} {"train_loss": -28.160776138305664, "global_step": 578062, "epoch": 6964} {"train_loss": -28.235015869140625, "global_step": 578063, "epoch": 6964} {"train_loss": -27.829191207885742, "global_step": 578064, "epoch": 6964} {"train_loss": -27.908544540405273, "global_step": 578065, "epoch": 6964} {"train_loss": -28.014989852905273, "global_step": 578066, "epoch": 6964} {"train_loss": -27.709054946899414, "global_step": 578067, "epoch": 6964} {"train_loss": -27.93952751159668, "global_step": 578068, "epoch": 6964} {"train_loss": -27.960676193237305, "global_step": 578069, "epoch": 6964} {"train_loss": -28.165449142456055, "global_step": 578070, "epoch": 6964} {"train_loss": -28.36712074279785, "global_step": 578071, "epoch": 6964} {"train_loss": -27.99820327758789, "global_step": 578072, "epoch": 6964} {"train_loss": -28.36602783203125, "global_step": 578073, "epoch": 6964} {"train_loss": -27.681507110595703, "global_step": 578074, "epoch": 6964} {"train_loss": -27.8158016204834, "global_step": 578075, "epoch": 6964} {"train_loss": -27.33670425415039, "global_step": 578076, "epoch": 6964} {"train_loss": -27.59356689453125, "global_step": 578077, "epoch": 6964} {"train_loss": -27.8380184173584, "global_step": 578078, "epoch": 6964} {"train_loss": -28.154993057250977, "global_step": 578079, "epoch": 6964} {"train_loss": -27.649946212768555, "global_step": 578080, "epoch": 6964} {"train_loss": -27.458820343017578, "global_step": 578081, "epoch": 6964} {"train_loss": -27.595544815063477, "global_step": 578082, "epoch": 6964} {"train_loss": -27.959516525268555, "global_step": 578083, "epoch": 6964} {"train_loss": -27.670379638671875, "global_step": 578084, "epoch": 6964} {"train_loss": -27.77640151977539, "global_step": 578085, "epoch": 6964} {"train_loss": -28.143817901611328, "global_step": 578086, "epoch": 6964} {"train_loss": -27.7423095703125, "global_step": 578087, "epoch": 6964} {"train_loss": -28.11203956604004, "global_step": 578088, "epoch": 6964} {"train_loss": -27.798940658569336, "global_step": 578089, "epoch": 6964} {"train_loss": -27.787811279296875, "global_step": 578090, "epoch": 6964} {"train_loss": -28.14371681213379, "global_step": 578091, "epoch": 6964} {"train_loss": -27.69703483581543, "global_step": 578092, "epoch": 6964} {"train_loss": -27.86932373046875, "global_step": 578093, "epoch": 6964} {"train_loss": -27.599251092198383, "global_step": 578094, "epoch": 6964, "val_loss": 6445159.0} {"train_loss": -27.19317626953125, "global_step": 578095, "epoch": 6965} {"train_loss": -26.257278442382812, "global_step": 578096, "epoch": 6965} {"train_loss": -27.2047061920166, "global_step": 578097, "epoch": 6965} {"train_loss": -27.5306396484375, "global_step": 578098, "epoch": 6965} {"train_loss": -26.65003776550293, "global_step": 578099, "epoch": 6965} {"train_loss": -26.943281173706055, "global_step": 578100, "epoch": 6965} {"train_loss": -27.452838897705078, "global_step": 578101, "epoch": 6965} {"train_loss": -27.38608741760254, "global_step": 578102, "epoch": 6965} {"train_loss": -27.393945693969727, "global_step": 578103, "epoch": 6965} {"train_loss": -27.338760375976562, "global_step": 578104, "epoch": 6965} {"train_loss": -27.26947021484375, "global_step": 578105, "epoch": 6965} {"train_loss": -27.29359245300293, "global_step": 578106, "epoch": 6965} {"train_loss": -27.411035537719727, "global_step": 578107, "epoch": 6965} {"train_loss": -27.304834365844727, "global_step": 578108, "epoch": 6965} {"train_loss": -27.508106231689453, "global_step": 578109, "epoch": 6965} {"train_loss": -27.112451553344727, "global_step": 578110, "epoch": 6965} {"train_loss": -27.37041664123535, "global_step": 578111, "epoch": 6965} {"train_loss": -27.552398681640625, "global_step": 578112, "epoch": 6965} {"train_loss": -27.954055786132812, "global_step": 578113, "epoch": 6965} {"train_loss": -27.67038917541504, "global_step": 578114, "epoch": 6965} {"train_loss": -27.954980850219727, "global_step": 578115, "epoch": 6965} {"train_loss": -27.746458053588867, "global_step": 578116, "epoch": 6965} {"train_loss": -27.590768814086914, "global_step": 578117, "epoch": 6965} {"train_loss": -27.842971801757812, "global_step": 578118, "epoch": 6965} {"train_loss": -27.82843589782715, "global_step": 578119, "epoch": 6965} {"train_loss": -27.900226593017578, "global_step": 578120, "epoch": 6965} {"train_loss": -28.052722930908203, "global_step": 578121, "epoch": 6965} {"train_loss": -27.828205108642578, "global_step": 578122, "epoch": 6965} {"train_loss": -27.98712158203125, "global_step": 578123, "epoch": 6965} {"train_loss": -27.67481803894043, "global_step": 578124, "epoch": 6965} {"train_loss": -27.76521110534668, "global_step": 578125, "epoch": 6965} {"train_loss": -27.954788208007812, "global_step": 578126, "epoch": 6965} {"train_loss": -27.77621841430664, "global_step": 578127, "epoch": 6965} {"train_loss": -27.5194149017334, "global_step": 578128, "epoch": 6965} {"train_loss": -28.066761016845703, "global_step": 578129, "epoch": 6965} {"train_loss": -28.04573631286621, "global_step": 578130, "epoch": 6965} {"train_loss": -27.934858322143555, "global_step": 578131, "epoch": 6965} {"train_loss": -28.08063316345215, "global_step": 578132, "epoch": 6965} {"train_loss": -28.21661376953125, "global_step": 578133, "epoch": 6965} {"train_loss": -27.841156005859375, "global_step": 578134, "epoch": 6965} {"train_loss": -28.076101303100586, "global_step": 578135, "epoch": 6965} {"train_loss": -28.003477096557617, "global_step": 578136, "epoch": 6965} {"train_loss": -27.931421279907227, "global_step": 578137, "epoch": 6965} {"train_loss": -27.774438858032227, "global_step": 578138, "epoch": 6965} {"train_loss": -28.157928466796875, "global_step": 578139, "epoch": 6965} {"train_loss": -27.682165145874023, "global_step": 578140, "epoch": 6965} {"train_loss": -27.652267456054688, "global_step": 578141, "epoch": 6965} {"train_loss": -28.39215087890625, "global_step": 578142, "epoch": 6965} {"train_loss": -28.1958065032959, "global_step": 578143, "epoch": 6965} {"train_loss": -27.79741859436035, "global_step": 578144, "epoch": 6965} {"train_loss": -27.855493545532227, "global_step": 578145, "epoch": 6965} {"train_loss": -27.834714889526367, "global_step": 578146, "epoch": 6965} {"train_loss": -27.5291748046875, "global_step": 578147, "epoch": 6965} {"train_loss": -27.96613121032715, "global_step": 578148, "epoch": 6965} {"train_loss": -27.71994400024414, "global_step": 578149, "epoch": 6965} {"train_loss": -27.603796005249023, "global_step": 578150, "epoch": 6965} {"train_loss": -28.1379337310791, "global_step": 578151, "epoch": 6965} {"train_loss": -27.997461318969727, "global_step": 578152, "epoch": 6965} {"train_loss": -28.080280303955078, "global_step": 578153, "epoch": 6965} {"train_loss": -27.870197296142578, "global_step": 578154, "epoch": 6965} {"train_loss": -27.782724380493164, "global_step": 578155, "epoch": 6965} {"train_loss": -27.9505615234375, "global_step": 578156, "epoch": 6965} {"train_loss": -28.356327056884766, "global_step": 578157, "epoch": 6965} {"train_loss": -27.92013931274414, "global_step": 578158, "epoch": 6965} {"train_loss": -28.145471572875977, "global_step": 578159, "epoch": 6965} {"train_loss": -27.908781051635742, "global_step": 578160, "epoch": 6965} {"train_loss": -28.121362686157227, "global_step": 578161, "epoch": 6965} {"train_loss": -27.7030086517334, "global_step": 578162, "epoch": 6965} {"train_loss": -28.193281173706055, "global_step": 578163, "epoch": 6965} {"train_loss": -28.05295181274414, "global_step": 578164, "epoch": 6965} {"train_loss": -28.407638549804688, "global_step": 578165, "epoch": 6965} {"train_loss": -28.134321212768555, "global_step": 578166, "epoch": 6965} {"train_loss": -28.020727157592773, "global_step": 578167, "epoch": 6965} {"train_loss": -28.242319107055664, "global_step": 578168, "epoch": 6965} {"train_loss": -27.71892738342285, "global_step": 578169, "epoch": 6965} {"train_loss": -28.102508544921875, "global_step": 578170, "epoch": 6965} {"train_loss": -28.115198135375977, "global_step": 578171, "epoch": 6965} {"train_loss": -27.96986198425293, "global_step": 578172, "epoch": 6965} {"train_loss": -28.152631759643555, "global_step": 578173, "epoch": 6965} {"train_loss": -28.036252975463867, "global_step": 578174, "epoch": 6965} {"train_loss": -28.088159561157227, "global_step": 578175, "epoch": 6965} {"train_loss": -28.277063369750977, "global_step": 578176, "epoch": 6965} {"train_loss": -27.788010424878223, "global_step": 578177, "epoch": 6965, "val_loss": 6435879.5} {"train_loss": -26.715856552124023, "global_step": 578178, "epoch": 6966} {"train_loss": -26.73335075378418, "global_step": 578179, "epoch": 6966} {"train_loss": -27.15677833557129, "global_step": 578180, "epoch": 6966} {"train_loss": -27.673242568969727, "global_step": 578181, "epoch": 6966} {"train_loss": -27.347354888916016, "global_step": 578182, "epoch": 6966} {"train_loss": -27.401575088500977, "global_step": 578183, "epoch": 6966} {"train_loss": -27.675262451171875, "global_step": 578184, "epoch": 6966} {"train_loss": -27.173206329345703, "global_step": 578185, "epoch": 6966} {"train_loss": -27.865842819213867, "global_step": 578186, "epoch": 6966} {"train_loss": -27.612445831298828, "global_step": 578187, "epoch": 6966} {"train_loss": -27.5152530670166, "global_step": 578188, "epoch": 6966} {"train_loss": -27.705244064331055, "global_step": 578189, "epoch": 6966} {"train_loss": -27.925140380859375, "global_step": 578190, "epoch": 6966} {"train_loss": -27.69931983947754, "global_step": 578191, "epoch": 6966} {"train_loss": -28.12188720703125, "global_step": 578192, "epoch": 6966} {"train_loss": -27.49017906188965, "global_step": 578193, "epoch": 6966} {"train_loss": -27.65473747253418, "global_step": 578194, "epoch": 6966} {"train_loss": -27.328641891479492, "global_step": 578195, "epoch": 6966} {"train_loss": -27.80225944519043, "global_step": 578196, "epoch": 6966} {"train_loss": -27.89162254333496, "global_step": 578197, "epoch": 6966} {"train_loss": -28.094839096069336, "global_step": 578198, "epoch": 6966} {"train_loss": -27.696243286132812, "global_step": 578199, "epoch": 6966} {"train_loss": -28.089710235595703, "global_step": 578200, "epoch": 6966} {"train_loss": -27.96721839904785, "global_step": 578201, "epoch": 6966} {"train_loss": -27.934778213500977, "global_step": 578202, "epoch": 6966} {"train_loss": -27.878448486328125, "global_step": 578203, "epoch": 6966} {"train_loss": -27.87995719909668, "global_step": 578204, "epoch": 6966} {"train_loss": -27.930368423461914, "global_step": 578205, "epoch": 6966} {"train_loss": -27.518346786499023, "global_step": 578206, "epoch": 6966} {"train_loss": -28.015287399291992, "global_step": 578207, "epoch": 6966} {"train_loss": -28.030324935913086, "global_step": 578208, "epoch": 6966} {"train_loss": -27.78786277770996, "global_step": 578209, "epoch": 6966} {"train_loss": -28.319211959838867, "global_step": 578210, "epoch": 6966} {"train_loss": -28.00473976135254, "global_step": 578211, "epoch": 6966} {"train_loss": -27.88313102722168, "global_step": 578212, "epoch": 6966} {"train_loss": -28.09259605407715, "global_step": 578213, "epoch": 6966} {"train_loss": -27.928991317749023, "global_step": 578214, "epoch": 6966} {"train_loss": -27.9160213470459, "global_step": 578215, "epoch": 6966} {"train_loss": -28.108854293823242, "global_step": 578216, "epoch": 6966} {"train_loss": -27.8587589263916, "global_step": 578217, "epoch": 6966} {"train_loss": -27.750532150268555, "global_step": 578218, "epoch": 6966} {"train_loss": -28.169530868530273, "global_step": 578219, "epoch": 6966} {"train_loss": -27.9674015045166, "global_step": 578220, "epoch": 6966} {"train_loss": -28.025848388671875, "global_step": 578221, "epoch": 6966} {"train_loss": -27.782506942749023, "global_step": 578222, "epoch": 6966} {"train_loss": -27.845630645751953, "global_step": 578223, "epoch": 6966} {"train_loss": -28.068090438842773, "global_step": 578224, "epoch": 6966} {"train_loss": -27.67780876159668, "global_step": 578225, "epoch": 6966} {"train_loss": -28.196582794189453, "global_step": 578226, "epoch": 6966} {"train_loss": -27.749048233032227, "global_step": 578227, "epoch": 6966} {"train_loss": -27.91805076599121, "global_step": 578228, "epoch": 6966} {"train_loss": -27.80340576171875, "global_step": 578229, "epoch": 6966} {"train_loss": -28.15888023376465, "global_step": 578230, "epoch": 6966} {"train_loss": -28.2259464263916, "global_step": 578231, "epoch": 6966} {"train_loss": -27.891559600830078, "global_step": 578232, "epoch": 6966} {"train_loss": -27.858091354370117, "global_step": 578233, "epoch": 6966} {"train_loss": -28.3388729095459, "global_step": 578234, "epoch": 6966} {"train_loss": -27.861785888671875, "global_step": 578235, "epoch": 6966} {"train_loss": -27.802282333374023, "global_step": 578236, "epoch": 6966} {"train_loss": -27.82686424255371, "global_step": 578237, "epoch": 6966} {"train_loss": -28.000370025634766, "global_step": 578238, "epoch": 6966} {"train_loss": -28.229785919189453, "global_step": 578239, "epoch": 6966} {"train_loss": -28.104108810424805, "global_step": 578240, "epoch": 6966} {"train_loss": -27.795734405517578, "global_step": 578241, "epoch": 6966} {"train_loss": -27.523569107055664, "global_step": 578242, "epoch": 6966} {"train_loss": -27.648120880126953, "global_step": 578243, "epoch": 6966} {"train_loss": -28.260650634765625, "global_step": 578244, "epoch": 6966} {"train_loss": -27.600061416625977, "global_step": 578245, "epoch": 6966} {"train_loss": -27.7127742767334, "global_step": 578246, "epoch": 6966} {"train_loss": -27.6854305267334, "global_step": 578247, "epoch": 6966} {"train_loss": -28.22066307067871, "global_step": 578248, "epoch": 6966} {"train_loss": -27.43214988708496, "global_step": 578249, "epoch": 6966} {"train_loss": -27.6540584564209, "global_step": 578250, "epoch": 6966} {"train_loss": -27.971349716186523, "global_step": 578251, "epoch": 6966} {"train_loss": -27.816816329956055, "global_step": 578252, "epoch": 6966} {"train_loss": -28.04860496520996, "global_step": 578253, "epoch": 6966} {"train_loss": -27.975921630859375, "global_step": 578254, "epoch": 6966} {"train_loss": -27.8897705078125, "global_step": 578255, "epoch": 6966} {"train_loss": -28.24094581604004, "global_step": 578256, "epoch": 6966} {"train_loss": -27.731000900268555, "global_step": 578257, "epoch": 6966} {"train_loss": -27.890762329101562, "global_step": 578258, "epoch": 6966} {"train_loss": -28.096393585205078, "global_step": 578259, "epoch": 6966} {"train_loss": -27.83125040904585, "global_step": 578260, "epoch": 6966, "val_loss": 6467258.0} {"train_loss": -27.5399112701416, "global_step": 578261, "epoch": 6967} {"train_loss": -27.441999435424805, "global_step": 578262, "epoch": 6967} {"train_loss": -27.56341552734375, "global_step": 578263, "epoch": 6967} {"train_loss": -27.809314727783203, "global_step": 578264, "epoch": 6967} {"train_loss": -27.768468856811523, "global_step": 578265, "epoch": 6967} {"train_loss": -27.78864860534668, "global_step": 578266, "epoch": 6967} {"train_loss": -27.607595443725586, "global_step": 578267, "epoch": 6967} {"train_loss": -27.819101333618164, "global_step": 578268, "epoch": 6967} {"train_loss": -27.630996704101562, "global_step": 578269, "epoch": 6967} {"train_loss": -27.830646514892578, "global_step": 578270, "epoch": 6967} {"train_loss": -28.047266006469727, "global_step": 578271, "epoch": 6967} {"train_loss": -27.728586196899414, "global_step": 578272, "epoch": 6967} {"train_loss": -27.981250762939453, "global_step": 578273, "epoch": 6967} {"train_loss": -27.840734481811523, "global_step": 578274, "epoch": 6967} {"train_loss": -27.689687728881836, "global_step": 578275, "epoch": 6967} {"train_loss": -27.6213436126709, "global_step": 578276, "epoch": 6967} {"train_loss": -28.15700340270996, "global_step": 578277, "epoch": 6967} {"train_loss": -27.576757431030273, "global_step": 578278, "epoch": 6967} {"train_loss": -27.688547134399414, "global_step": 578279, "epoch": 6967} {"train_loss": -27.75593376159668, "global_step": 578280, "epoch": 6967} {"train_loss": -27.972076416015625, "global_step": 578281, "epoch": 6967} {"train_loss": -28.08241081237793, "global_step": 578282, "epoch": 6967} {"train_loss": -27.856733322143555, "global_step": 578283, "epoch": 6967} {"train_loss": -28.219099044799805, "global_step": 578284, "epoch": 6967} {"train_loss": -27.867538452148438, "global_step": 578285, "epoch": 6967} {"train_loss": -27.738895416259766, "global_step": 578286, "epoch": 6967} {"train_loss": -27.567983627319336, "global_step": 578287, "epoch": 6967} {"train_loss": -28.07443618774414, "global_step": 578288, "epoch": 6967} {"train_loss": -27.443159103393555, "global_step": 578289, "epoch": 6967} {"train_loss": -26.801288604736328, "global_step": 578290, "epoch": 6967} {"train_loss": -26.7585391998291, "global_step": 578291, "epoch": 6967} {"train_loss": -27.4997501373291, "global_step": 578292, "epoch": 6967} {"train_loss": -27.52851676940918, "global_step": 578293, "epoch": 6967} {"train_loss": -26.80470848083496, "global_step": 578294, "epoch": 6967} {"train_loss": -26.881540298461914, "global_step": 578295, "epoch": 6967} {"train_loss": -26.650976181030273, "global_step": 578296, "epoch": 6967} {"train_loss": -27.42767906188965, "global_step": 578297, "epoch": 6967} {"train_loss": -27.416614532470703, "global_step": 578298, "epoch": 6967} {"train_loss": -27.28798484802246, "global_step": 578299, "epoch": 6967} {"train_loss": -27.5076847076416, "global_step": 578300, "epoch": 6967} {"train_loss": -27.319971084594727, "global_step": 578301, "epoch": 6967} {"train_loss": -27.468656539916992, "global_step": 578302, "epoch": 6967} {"train_loss": -27.763324737548828, "global_step": 578303, "epoch": 6967} {"train_loss": -27.747289657592773, "global_step": 578304, "epoch": 6967} {"train_loss": -28.289508819580078, "global_step": 578305, "epoch": 6967} {"train_loss": -27.458402633666992, "global_step": 578306, "epoch": 6967} {"train_loss": -27.954254150390625, "global_step": 578307, "epoch": 6967} {"train_loss": -27.65218162536621, "global_step": 578308, "epoch": 6967} {"train_loss": -28.006855010986328, "global_step": 578309, "epoch": 6967} {"train_loss": -27.8812255859375, "global_step": 578310, "epoch": 6967} {"train_loss": -28.059412002563477, "global_step": 578311, "epoch": 6967} {"train_loss": -27.942707061767578, "global_step": 578312, "epoch": 6967} {"train_loss": -27.77564811706543, "global_step": 578313, "epoch": 6967} {"train_loss": -27.74859046936035, "global_step": 578314, "epoch": 6967} {"train_loss": -27.916492462158203, "global_step": 578315, "epoch": 6967} {"train_loss": -28.075439453125, "global_step": 578316, "epoch": 6967} {"train_loss": -27.78828239440918, "global_step": 578317, "epoch": 6967} {"train_loss": -27.88233757019043, "global_step": 578318, "epoch": 6967} {"train_loss": -28.143798828125, "global_step": 578319, "epoch": 6967} {"train_loss": -27.7705020904541, "global_step": 578320, "epoch": 6967} {"train_loss": -28.23972511291504, "global_step": 578321, "epoch": 6967} {"train_loss": -28.327838897705078, "global_step": 578322, "epoch": 6967} {"train_loss": -27.55012321472168, "global_step": 578323, "epoch": 6967} {"train_loss": -28.08155632019043, "global_step": 578324, "epoch": 6967} {"train_loss": -27.881916046142578, "global_step": 578325, "epoch": 6967} {"train_loss": -27.776166915893555, "global_step": 578326, "epoch": 6967} {"train_loss": -28.300195693969727, "global_step": 578327, "epoch": 6967} {"train_loss": -27.88999366760254, "global_step": 578328, "epoch": 6967} {"train_loss": -27.921127319335938, "global_step": 578329, "epoch": 6967} {"train_loss": -28.12430191040039, "global_step": 578330, "epoch": 6967} {"train_loss": -28.0367374420166, "global_step": 578331, "epoch": 6967} {"train_loss": -27.96735191345215, "global_step": 578332, "epoch": 6967} {"train_loss": -28.194482803344727, "global_step": 578333, "epoch": 6967} {"train_loss": -28.076841354370117, "global_step": 578334, "epoch": 6967} {"train_loss": -27.892688751220703, "global_step": 578335, "epoch": 6967} {"train_loss": -27.683576583862305, "global_step": 578336, "epoch": 6967} {"train_loss": -28.196767807006836, "global_step": 578337, "epoch": 6967} {"train_loss": -27.658679962158203, "global_step": 578338, "epoch": 6967} {"train_loss": -27.90484619140625, "global_step": 578339, "epoch": 6967} {"train_loss": -27.94101333618164, "global_step": 578340, "epoch": 6967} {"train_loss": -28.4985408782959, "global_step": 578341, "epoch": 6967} {"train_loss": -28.110193252563477, "global_step": 578342, "epoch": 6967} {"train_loss": -27.768498501145697, "global_step": 578343, "epoch": 6967, "val_loss": 6428735.0} {"train_loss": -26.733081817626953, "global_step": 578344, "epoch": 6968} {"train_loss": -26.168119430541992, "global_step": 578345, "epoch": 6968} {"train_loss": -26.56500244140625, "global_step": 578346, "epoch": 6968} {"train_loss": -26.49191665649414, "global_step": 578347, "epoch": 6968} {"train_loss": -27.28093910217285, "global_step": 578348, "epoch": 6968} {"train_loss": -26.841262817382812, "global_step": 578349, "epoch": 6968} {"train_loss": -26.716161727905273, "global_step": 578350, "epoch": 6968} {"train_loss": -27.2882080078125, "global_step": 578351, "epoch": 6968} {"train_loss": -27.373193740844727, "global_step": 578352, "epoch": 6968} {"train_loss": -27.240509033203125, "global_step": 578353, "epoch": 6968} {"train_loss": -27.443695068359375, "global_step": 578354, "epoch": 6968} {"train_loss": -27.646581649780273, "global_step": 578355, "epoch": 6968} {"train_loss": -27.790695190429688, "global_step": 578356, "epoch": 6968} {"train_loss": -27.51692771911621, "global_step": 578357, "epoch": 6968} {"train_loss": -27.5513916015625, "global_step": 578358, "epoch": 6968} {"train_loss": -27.220291137695312, "global_step": 578359, "epoch": 6968} {"train_loss": -27.821136474609375, "global_step": 578360, "epoch": 6968} {"train_loss": -27.828031539916992, "global_step": 578361, "epoch": 6968} {"train_loss": -27.62664794921875, "global_step": 578362, "epoch": 6968} {"train_loss": -28.004343032836914, "global_step": 578363, "epoch": 6968} {"train_loss": -27.611661911010742, "global_step": 578364, "epoch": 6968} {"train_loss": -27.442340850830078, "global_step": 578365, "epoch": 6968} {"train_loss": -27.993839263916016, "global_step": 578366, "epoch": 6968} {"train_loss": -27.928247451782227, "global_step": 578367, "epoch": 6968} {"train_loss": -27.514822006225586, "global_step": 578368, "epoch": 6968} {"train_loss": -28.0533390045166, "global_step": 578369, "epoch": 6968} {"train_loss": -27.580114364624023, "global_step": 578370, "epoch": 6968} {"train_loss": -28.101545333862305, "global_step": 578371, "epoch": 6968} {"train_loss": -27.7337646484375, "global_step": 578372, "epoch": 6968} {"train_loss": -27.712635040283203, "global_step": 578373, "epoch": 6968} {"train_loss": -27.777265548706055, "global_step": 578374, "epoch": 6968} {"train_loss": -28.04315757751465, "global_step": 578375, "epoch": 6968} {"train_loss": -27.75469970703125, "global_step": 578376, "epoch": 6968} {"train_loss": -27.913862228393555, "global_step": 578377, "epoch": 6968} {"train_loss": -28.099090576171875, "global_step": 578378, "epoch": 6968} {"train_loss": -28.086517333984375, "global_step": 578379, "epoch": 6968} {"train_loss": -28.089086532592773, "global_step": 578380, "epoch": 6968} {"train_loss": -28.01716423034668, "global_step": 578381, "epoch": 6968} {"train_loss": -27.958520889282227, "global_step": 578382, "epoch": 6968} {"train_loss": -27.9754638671875, "global_step": 578383, "epoch": 6968} {"train_loss": -28.266803741455078, "global_step": 578384, "epoch": 6968} {"train_loss": -28.530942916870117, "global_step": 578385, "epoch": 6968} {"train_loss": -27.954605102539062, "global_step": 578386, "epoch": 6968} {"train_loss": -27.871021270751953, "global_step": 578387, "epoch": 6968} {"train_loss": -28.196369171142578, "global_step": 578388, "epoch": 6968} {"train_loss": -28.169403076171875, "global_step": 578389, "epoch": 6968} {"train_loss": -27.97454833984375, "global_step": 578390, "epoch": 6968} {"train_loss": -27.95831871032715, "global_step": 578391, "epoch": 6968} {"train_loss": -28.357343673706055, "global_step": 578392, "epoch": 6968} {"train_loss": -28.269250869750977, "global_step": 578393, "epoch": 6968} {"train_loss": -28.26593589782715, "global_step": 578394, "epoch": 6968} {"train_loss": -28.19533348083496, "global_step": 578395, "epoch": 6968} {"train_loss": -28.052331924438477, "global_step": 578396, "epoch": 6968} {"train_loss": -28.076435089111328, "global_step": 578397, "epoch": 6968} {"train_loss": -28.0194149017334, "global_step": 578398, "epoch": 6968} {"train_loss": -27.882282257080078, "global_step": 578399, "epoch": 6968} {"train_loss": -27.758970260620117, "global_step": 578400, "epoch": 6968} {"train_loss": -28.001317977905273, "global_step": 578401, "epoch": 6968} {"train_loss": -27.701313018798828, "global_step": 578402, "epoch": 6968} {"train_loss": -27.93134117126465, "global_step": 578403, "epoch": 6968} {"train_loss": -27.768280029296875, "global_step": 578404, "epoch": 6968} {"train_loss": -28.21021842956543, "global_step": 578405, "epoch": 6968} {"train_loss": -28.00618553161621, "global_step": 578406, "epoch": 6968} {"train_loss": -27.18008804321289, "global_step": 578407, "epoch": 6968} {"train_loss": -27.692840576171875, "global_step": 578408, "epoch": 6968} {"train_loss": -27.654577255249023, "global_step": 578409, "epoch": 6968} {"train_loss": -28.26802635192871, "global_step": 578410, "epoch": 6968} {"train_loss": -27.7365779876709, "global_step": 578411, "epoch": 6968} {"train_loss": -28.280323028564453, "global_step": 578412, "epoch": 6968} {"train_loss": -27.8769588470459, "global_step": 578413, "epoch": 6968} {"train_loss": -27.464588165283203, "global_step": 578414, "epoch": 6968} {"train_loss": -27.738927841186523, "global_step": 578415, "epoch": 6968} {"train_loss": -27.356109619140625, "global_step": 578416, "epoch": 6968} {"train_loss": -27.92291831970215, "global_step": 578417, "epoch": 6968} {"train_loss": -27.797657012939453, "global_step": 578418, "epoch": 6968} {"train_loss": -27.40309715270996, "global_step": 578419, "epoch": 6968} {"train_loss": -27.912799835205078, "global_step": 578420, "epoch": 6968} {"train_loss": -27.82734489440918, "global_step": 578421, "epoch": 6968} {"train_loss": -28.17587661743164, "global_step": 578422, "epoch": 6968} {"train_loss": -27.617752075195312, "global_step": 578423, "epoch": 6968} {"train_loss": -28.0018310546875, "global_step": 578424, "epoch": 6968} {"train_loss": -27.772964477539062, "global_step": 578425, "epoch": 6968} {"train_loss": -27.753930241228588, "global_step": 578426, "epoch": 6968, "val_loss": 6470319.0} {"train_loss": -26.88873863220215, "global_step": 578427, "epoch": 6969} {"train_loss": -25.750242233276367, "global_step": 578428, "epoch": 6969} {"train_loss": -24.552194595336914, "global_step": 578429, "epoch": 6969} {"train_loss": -26.950241088867188, "global_step": 578430, "epoch": 6969} {"train_loss": -27.22684097290039, "global_step": 578431, "epoch": 6969} {"train_loss": -26.48383140563965, "global_step": 578432, "epoch": 6969} {"train_loss": -26.522293090820312, "global_step": 578433, "epoch": 6969} {"train_loss": -26.96559715270996, "global_step": 578434, "epoch": 6969} {"train_loss": -26.79084587097168, "global_step": 578435, "epoch": 6969} {"train_loss": -27.472265243530273, "global_step": 578436, "epoch": 6969} {"train_loss": -27.038970947265625, "global_step": 578437, "epoch": 6969} {"train_loss": -26.66843032836914, "global_step": 578438, "epoch": 6969} {"train_loss": -27.377277374267578, "global_step": 578439, "epoch": 6969} {"train_loss": -27.62095069885254, "global_step": 578440, "epoch": 6969} {"train_loss": -26.881988525390625, "global_step": 578441, "epoch": 6969} {"train_loss": -27.58091163635254, "global_step": 578442, "epoch": 6969} {"train_loss": -26.845123291015625, "global_step": 578443, "epoch": 6969} {"train_loss": -27.28798484802246, "global_step": 578444, "epoch": 6969} {"train_loss": -27.335189819335938, "global_step": 578445, "epoch": 6969} {"train_loss": -27.741851806640625, "global_step": 578446, "epoch": 6969} {"train_loss": -27.447967529296875, "global_step": 578447, "epoch": 6969} {"train_loss": -27.624731063842773, "global_step": 578448, "epoch": 6969} {"train_loss": -27.971521377563477, "global_step": 578449, "epoch": 6969} {"train_loss": -27.647552490234375, "global_step": 578450, "epoch": 6969} {"train_loss": -27.528547286987305, "global_step": 578451, "epoch": 6969} {"train_loss": -27.738006591796875, "global_step": 578452, "epoch": 6969} {"train_loss": -27.562894821166992, "global_step": 578453, "epoch": 6969} {"train_loss": -27.702001571655273, "global_step": 578454, "epoch": 6969} {"train_loss": -27.635656356811523, "global_step": 578455, "epoch": 6969} {"train_loss": -27.559345245361328, "global_step": 578456, "epoch": 6969} {"train_loss": -27.740636825561523, "global_step": 578457, "epoch": 6969} {"train_loss": -27.386062622070312, "global_step": 578458, "epoch": 6969} {"train_loss": -27.831525802612305, "global_step": 578459, "epoch": 6969} {"train_loss": -27.5142765045166, "global_step": 578460, "epoch": 6969} {"train_loss": -27.781970977783203, "global_step": 578461, "epoch": 6969} {"train_loss": -27.38189697265625, "global_step": 578462, "epoch": 6969} {"train_loss": -27.887434005737305, "global_step": 578463, "epoch": 6969} {"train_loss": -27.69434928894043, "global_step": 578464, "epoch": 6969} {"train_loss": -27.981781005859375, "global_step": 578465, "epoch": 6969} {"train_loss": -28.110746383666992, "global_step": 578466, "epoch": 6969} {"train_loss": -27.727048873901367, "global_step": 578467, "epoch": 6969} {"train_loss": -27.649322509765625, "global_step": 578468, "epoch": 6969} {"train_loss": -27.9217472076416, "global_step": 578469, "epoch": 6969} {"train_loss": -27.716230392456055, "global_step": 578470, "epoch": 6969} {"train_loss": -27.978073120117188, "global_step": 578471, "epoch": 6969} {"train_loss": -27.73845863342285, "global_step": 578472, "epoch": 6969} {"train_loss": -27.78554344177246, "global_step": 578473, "epoch": 6969} {"train_loss": -28.464496612548828, "global_step": 578474, "epoch": 6969} {"train_loss": -27.897449493408203, "global_step": 578475, "epoch": 6969} {"train_loss": -27.844287872314453, "global_step": 578476, "epoch": 6969} {"train_loss": -28.361404418945312, "global_step": 578477, "epoch": 6969} {"train_loss": -27.7445011138916, "global_step": 578478, "epoch": 6969} {"train_loss": -27.946020126342773, "global_step": 578479, "epoch": 6969} {"train_loss": -28.10565185546875, "global_step": 578480, "epoch": 6969} {"train_loss": -28.26596450805664, "global_step": 578481, "epoch": 6969} {"train_loss": -27.894519805908203, "global_step": 578482, "epoch": 6969} {"train_loss": -28.2237606048584, "global_step": 578483, "epoch": 6969} {"train_loss": -27.634180068969727, "global_step": 578484, "epoch": 6969} {"train_loss": -27.968381881713867, "global_step": 578485, "epoch": 6969} {"train_loss": -28.066654205322266, "global_step": 578486, "epoch": 6969} {"train_loss": -28.18219566345215, "global_step": 578487, "epoch": 6969} {"train_loss": -27.974218368530273, "global_step": 578488, "epoch": 6969} {"train_loss": -27.866125106811523, "global_step": 578489, "epoch": 6969} {"train_loss": -28.068586349487305, "global_step": 578490, "epoch": 6969} {"train_loss": -27.695423126220703, "global_step": 578491, "epoch": 6969} {"train_loss": -27.877317428588867, "global_step": 578492, "epoch": 6969} {"train_loss": -27.778539657592773, "global_step": 578493, "epoch": 6969} {"train_loss": -27.729400634765625, "global_step": 578494, "epoch": 6969} {"train_loss": -27.917800903320312, "global_step": 578495, "epoch": 6969} {"train_loss": -28.0997314453125, "global_step": 578496, "epoch": 6969} {"train_loss": -27.916574478149414, "global_step": 578497, "epoch": 6969} {"train_loss": -28.289854049682617, "global_step": 578498, "epoch": 6969} {"train_loss": -28.4352970123291, "global_step": 578499, "epoch": 6969} {"train_loss": -27.6675968170166, "global_step": 578500, "epoch": 6969} {"train_loss": -27.90851402282715, "global_step": 578501, "epoch": 6969} {"train_loss": -27.96796989440918, "global_step": 578502, "epoch": 6969} {"train_loss": -28.02447509765625, "global_step": 578503, "epoch": 6969} {"train_loss": -28.11221694946289, "global_step": 578504, "epoch": 6969} {"train_loss": -28.118711471557617, "global_step": 578505, "epoch": 6969} {"train_loss": -28.09637451171875, "global_step": 578506, "epoch": 6969} {"train_loss": -27.873022079467773, "global_step": 578507, "epoch": 6969} {"train_loss": -28.014490127563477, "global_step": 578508, "epoch": 6969} {"train_loss": -27.651733444397706, "global_step": 578509, "epoch": 6969, "val_loss": 6475722.0} {"train_loss": -27.0953369140625, "global_step": 578510, "epoch": 6970} {"train_loss": -27.218311309814453, "global_step": 578511, "epoch": 6970} {"train_loss": -27.04998207092285, "global_step": 578512, "epoch": 6970} {"train_loss": -26.7000732421875, "global_step": 578513, "epoch": 6970} {"train_loss": -27.075376510620117, "global_step": 578514, "epoch": 6970} {"train_loss": -27.029321670532227, "global_step": 578515, "epoch": 6970} {"train_loss": -27.754140853881836, "global_step": 578516, "epoch": 6970} {"train_loss": -27.2877254486084, "global_step": 578517, "epoch": 6970} {"train_loss": -27.627172470092773, "global_step": 578518, "epoch": 6970} {"train_loss": -27.83734703063965, "global_step": 578519, "epoch": 6970} {"train_loss": -27.288227081298828, "global_step": 578520, "epoch": 6970} {"train_loss": -27.419111251831055, "global_step": 578521, "epoch": 6970} {"train_loss": -27.646976470947266, "global_step": 578522, "epoch": 6970} {"train_loss": -27.8790225982666, "global_step": 578523, "epoch": 6970} {"train_loss": -27.458084106445312, "global_step": 578524, "epoch": 6970} {"train_loss": -27.551513671875, "global_step": 578525, "epoch": 6970} {"train_loss": -27.922391891479492, "global_step": 578526, "epoch": 6970} {"train_loss": -27.7569580078125, "global_step": 578527, "epoch": 6970} {"train_loss": -27.78972816467285, "global_step": 578528, "epoch": 6970} {"train_loss": -27.50502586364746, "global_step": 578529, "epoch": 6970} {"train_loss": -28.15376091003418, "global_step": 578530, "epoch": 6970} {"train_loss": -27.667078018188477, "global_step": 578531, "epoch": 6970} {"train_loss": -27.79579734802246, "global_step": 578532, "epoch": 6970} {"train_loss": -27.51165771484375, "global_step": 578533, "epoch": 6970} {"train_loss": -27.4528865814209, "global_step": 578534, "epoch": 6970} {"train_loss": -27.940221786499023, "global_step": 578535, "epoch": 6970} {"train_loss": -27.848590850830078, "global_step": 578536, "epoch": 6970} {"train_loss": -28.061384201049805, "global_step": 578537, "epoch": 6970} {"train_loss": -27.720239639282227, "global_step": 578538, "epoch": 6970} {"train_loss": -27.791379928588867, "global_step": 578539, "epoch": 6970} {"train_loss": -27.949630737304688, "global_step": 578540, "epoch": 6970} {"train_loss": -28.036157608032227, "global_step": 578541, "epoch": 6970} {"train_loss": -28.181507110595703, "global_step": 578542, "epoch": 6970} {"train_loss": -27.821704864501953, "global_step": 578543, "epoch": 6970} {"train_loss": -27.683746337890625, "global_step": 578544, "epoch": 6970} {"train_loss": -27.86273193359375, "global_step": 578545, "epoch": 6970} {"train_loss": -27.737548828125, "global_step": 578546, "epoch": 6970} {"train_loss": -27.764326095581055, "global_step": 578547, "epoch": 6970} {"train_loss": -27.700641632080078, "global_step": 578548, "epoch": 6970} {"train_loss": -28.11812400817871, "global_step": 578549, "epoch": 6970} {"train_loss": -27.791702270507812, "global_step": 578550, "epoch": 6970} {"train_loss": -27.675464630126953, "global_step": 578551, "epoch": 6970} {"train_loss": -28.138137817382812, "global_step": 578552, "epoch": 6970} {"train_loss": -28.13001823425293, "global_step": 578553, "epoch": 6970} {"train_loss": -28.2474422454834, "global_step": 578554, "epoch": 6970} {"train_loss": -28.047504425048828, "global_step": 578555, "epoch": 6970} {"train_loss": -27.869115829467773, "global_step": 578556, "epoch": 6970} {"train_loss": -27.87921142578125, "global_step": 578557, "epoch": 6970} {"train_loss": -27.987897872924805, "global_step": 578558, "epoch": 6970} {"train_loss": -28.164260864257812, "global_step": 578559, "epoch": 6970} {"train_loss": -28.084060668945312, "global_step": 578560, "epoch": 6970} {"train_loss": -28.633573532104492, "global_step": 578561, "epoch": 6970} {"train_loss": -27.91122817993164, "global_step": 578562, "epoch": 6970} {"train_loss": -28.134878158569336, "global_step": 578563, "epoch": 6970} {"train_loss": -27.799030303955078, "global_step": 578564, "epoch": 6970} {"train_loss": -28.40699577331543, "global_step": 578565, "epoch": 6970} {"train_loss": -28.10857582092285, "global_step": 578566, "epoch": 6970} {"train_loss": -28.2136287689209, "global_step": 578567, "epoch": 6970} {"train_loss": -27.889606475830078, "global_step": 578568, "epoch": 6970} {"train_loss": -28.04624366760254, "global_step": 578569, "epoch": 6970} {"train_loss": -28.157516479492188, "global_step": 578570, "epoch": 6970} {"train_loss": -28.245580673217773, "global_step": 578571, "epoch": 6970} {"train_loss": -28.027542114257812, "global_step": 578572, "epoch": 6970} {"train_loss": -27.78826904296875, "global_step": 578573, "epoch": 6970} {"train_loss": -27.638803482055664, "global_step": 578574, "epoch": 6970} {"train_loss": -28.169294357299805, "global_step": 578575, "epoch": 6970} {"train_loss": -27.8179988861084, "global_step": 578576, "epoch": 6970} {"train_loss": -27.650854110717773, "global_step": 578577, "epoch": 6970} {"train_loss": -27.443195343017578, "global_step": 578578, "epoch": 6970} {"train_loss": -28.1875, "global_step": 578579, "epoch": 6970} {"train_loss": -27.868427276611328, "global_step": 578580, "epoch": 6970} {"train_loss": -28.242273330688477, "global_step": 578581, "epoch": 6970} {"train_loss": -27.657669067382812, "global_step": 578582, "epoch": 6970} {"train_loss": -27.554838180541992, "global_step": 578583, "epoch": 6970} {"train_loss": -27.733932495117188, "global_step": 578584, "epoch": 6970} {"train_loss": -27.498703002929688, "global_step": 578585, "epoch": 6970} {"train_loss": -28.078550338745117, "global_step": 578586, "epoch": 6970} {"train_loss": -27.779312133789062, "global_step": 578587, "epoch": 6970} {"train_loss": -27.802326202392578, "global_step": 578588, "epoch": 6970} {"train_loss": -28.026996612548828, "global_step": 578589, "epoch": 6970} {"train_loss": -27.607177734375, "global_step": 578590, "epoch": 6970} {"train_loss": -28.344390869140625, "global_step": 578591, "epoch": 6970} {"train_loss": -27.81357680171369, "global_step": 578592, "epoch": 6970, "val_loss": 6530516.0} {"train_loss": -26.4438533782959, "global_step": 578593, "epoch": 6971} {"train_loss": -26.63007926940918, "global_step": 578594, "epoch": 6971} {"train_loss": -26.922306060791016, "global_step": 578595, "epoch": 6971} {"train_loss": -27.253034591674805, "global_step": 578596, "epoch": 6971} {"train_loss": -26.623815536499023, "global_step": 578597, "epoch": 6971} {"train_loss": -27.084863662719727, "global_step": 578598, "epoch": 6971} {"train_loss": -27.04168701171875, "global_step": 578599, "epoch": 6971} {"train_loss": -27.082265853881836, "global_step": 578600, "epoch": 6971} {"train_loss": -27.69550895690918, "global_step": 578601, "epoch": 6971} {"train_loss": -26.85210609436035, "global_step": 578602, "epoch": 6971} {"train_loss": -27.6002254486084, "global_step": 578603, "epoch": 6971} {"train_loss": -27.446155548095703, "global_step": 578604, "epoch": 6971} {"train_loss": -27.021804809570312, "global_step": 578605, "epoch": 6971} {"train_loss": -27.4815731048584, "global_step": 578606, "epoch": 6971} {"train_loss": -27.782672882080078, "global_step": 578607, "epoch": 6971} {"train_loss": -27.435321807861328, "global_step": 578608, "epoch": 6971} {"train_loss": -27.2135009765625, "global_step": 578609, "epoch": 6971} {"train_loss": -27.475961685180664, "global_step": 578610, "epoch": 6971} {"train_loss": -27.2432918548584, "global_step": 578611, "epoch": 6971} {"train_loss": -27.499048233032227, "global_step": 578612, "epoch": 6971} {"train_loss": -27.59429359436035, "global_step": 578613, "epoch": 6971} {"train_loss": -27.575498580932617, "global_step": 578614, "epoch": 6971} {"train_loss": -27.515655517578125, "global_step": 578615, "epoch": 6971} {"train_loss": -27.596912384033203, "global_step": 578616, "epoch": 6971} {"train_loss": -27.496984481811523, "global_step": 578617, "epoch": 6971} {"train_loss": -27.72600746154785, "global_step": 578618, "epoch": 6971} {"train_loss": -27.85944938659668, "global_step": 578619, "epoch": 6971} {"train_loss": -27.69879722595215, "global_step": 578620, "epoch": 6971} {"train_loss": -27.9808292388916, "global_step": 578621, "epoch": 6971} {"train_loss": -27.68894386291504, "global_step": 578622, "epoch": 6971} {"train_loss": -27.89710807800293, "global_step": 578623, "epoch": 6971} {"train_loss": -28.0103702545166, "global_step": 578624, "epoch": 6971} {"train_loss": -27.82264518737793, "global_step": 578625, "epoch": 6971} {"train_loss": -27.57940673828125, "global_step": 578626, "epoch": 6971} {"train_loss": -27.940839767456055, "global_step": 578627, "epoch": 6971} {"train_loss": -28.0885066986084, "global_step": 578628, "epoch": 6971} {"train_loss": -28.14505386352539, "global_step": 578629, "epoch": 6971} {"train_loss": -28.012861251831055, "global_step": 578630, "epoch": 6971} {"train_loss": -27.987096786499023, "global_step": 578631, "epoch": 6971} {"train_loss": -27.84852409362793, "global_step": 578632, "epoch": 6971} {"train_loss": -27.681501388549805, "global_step": 578633, "epoch": 6971} {"train_loss": -27.416593551635742, "global_step": 578634, "epoch": 6971} {"train_loss": -27.762744903564453, "global_step": 578635, "epoch": 6971} {"train_loss": -28.166391372680664, "global_step": 578636, "epoch": 6971} {"train_loss": -28.164295196533203, "global_step": 578637, "epoch": 6971} {"train_loss": -27.986433029174805, "global_step": 578638, "epoch": 6971} {"train_loss": -27.66237449645996, "global_step": 578639, "epoch": 6971} {"train_loss": -28.365081787109375, "global_step": 578640, "epoch": 6971} {"train_loss": -28.13397216796875, "global_step": 578641, "epoch": 6971} {"train_loss": -28.105798721313477, "global_step": 578642, "epoch": 6971} {"train_loss": -27.706939697265625, "global_step": 578643, "epoch": 6971} {"train_loss": -28.046857833862305, "global_step": 578644, "epoch": 6971} {"train_loss": -27.921192169189453, "global_step": 578645, "epoch": 6971} {"train_loss": -27.912328720092773, "global_step": 578646, "epoch": 6971} {"train_loss": -27.50250816345215, "global_step": 578647, "epoch": 6971} {"train_loss": -27.582122802734375, "global_step": 578648, "epoch": 6971} {"train_loss": -27.852087020874023, "global_step": 578649, "epoch": 6971} {"train_loss": -27.912744522094727, "global_step": 578650, "epoch": 6971} {"train_loss": -28.04632568359375, "global_step": 578651, "epoch": 6971} {"train_loss": -28.23316764831543, "global_step": 578652, "epoch": 6971} {"train_loss": -28.158666610717773, "global_step": 578653, "epoch": 6971} {"train_loss": -28.06808853149414, "global_step": 578654, "epoch": 6971} {"train_loss": -28.071033477783203, "global_step": 578655, "epoch": 6971} {"train_loss": -27.96526527404785, "global_step": 578656, "epoch": 6971} {"train_loss": -28.077442169189453, "global_step": 578657, "epoch": 6971} {"train_loss": -27.84144401550293, "global_step": 578658, "epoch": 6971} {"train_loss": -27.115036010742188, "global_step": 578659, "epoch": 6971} {"train_loss": -27.6885929107666, "global_step": 578660, "epoch": 6971} {"train_loss": -28.1743106842041, "global_step": 578661, "epoch": 6971} {"train_loss": -27.535049438476562, "global_step": 578662, "epoch": 6971} {"train_loss": -28.1568603515625, "global_step": 578663, "epoch": 6971} {"train_loss": -28.161230087280273, "global_step": 578664, "epoch": 6971} {"train_loss": -28.079730987548828, "global_step": 578665, "epoch": 6971} {"train_loss": -27.96563148498535, "global_step": 578666, "epoch": 6971} {"train_loss": -27.980283737182617, "global_step": 578667, "epoch": 6971} {"train_loss": -28.009113311767578, "global_step": 578668, "epoch": 6971} {"train_loss": -27.371496200561523, "global_step": 578669, "epoch": 6971} {"train_loss": -27.949609756469727, "global_step": 578670, "epoch": 6971} {"train_loss": -27.962024688720703, "global_step": 578671, "epoch": 6971} {"train_loss": -27.80796241760254, "global_step": 578672, "epoch": 6971} {"train_loss": -27.70077896118164, "global_step": 578673, "epoch": 6971} {"train_loss": -27.2985897064209, "global_step": 578674, "epoch": 6971} {"train_loss": -27.693386399602314, "global_step": 578675, "epoch": 6971, "val_loss": 6543151.5} {"train_loss": -26.750036239624023, "global_step": 578676, "epoch": 6972} {"train_loss": -26.421567916870117, "global_step": 578677, "epoch": 6972} {"train_loss": -27.01470947265625, "global_step": 578678, "epoch": 6972} {"train_loss": -26.487934112548828, "global_step": 578679, "epoch": 6972} {"train_loss": -27.0365047454834, "global_step": 578680, "epoch": 6972} {"train_loss": -26.503774642944336, "global_step": 578681, "epoch": 6972} {"train_loss": -26.3673038482666, "global_step": 578682, "epoch": 6972} {"train_loss": -27.481103897094727, "global_step": 578683, "epoch": 6972} {"train_loss": -27.203489303588867, "global_step": 578684, "epoch": 6972} {"train_loss": -27.04047203063965, "global_step": 578685, "epoch": 6972} {"train_loss": -27.13214683532715, "global_step": 578686, "epoch": 6972} {"train_loss": -26.9963436126709, "global_step": 578687, "epoch": 6972} {"train_loss": -27.112218856811523, "global_step": 578688, "epoch": 6972} {"train_loss": -27.1873836517334, "global_step": 578689, "epoch": 6972} {"train_loss": -27.225635528564453, "global_step": 578690, "epoch": 6972} {"train_loss": -27.55095863342285, "global_step": 578691, "epoch": 6972} {"train_loss": -27.2032527923584, "global_step": 578692, "epoch": 6972} {"train_loss": -27.75275993347168, "global_step": 578693, "epoch": 6972} {"train_loss": -27.606781005859375, "global_step": 578694, "epoch": 6972} {"train_loss": -27.73177146911621, "global_step": 578695, "epoch": 6972} {"train_loss": -27.6617488861084, "global_step": 578696, "epoch": 6972} {"train_loss": -27.340784072875977, "global_step": 578697, "epoch": 6972} {"train_loss": -27.176206588745117, "global_step": 578698, "epoch": 6972} {"train_loss": -27.440000534057617, "global_step": 578699, "epoch": 6972} {"train_loss": -27.4840030670166, "global_step": 578700, "epoch": 6972} {"train_loss": -27.368810653686523, "global_step": 578701, "epoch": 6972} {"train_loss": -28.211471557617188, "global_step": 578702, "epoch": 6972} {"train_loss": -27.811059951782227, "global_step": 578703, "epoch": 6972} {"train_loss": -27.386987686157227, "global_step": 578704, "epoch": 6972} {"train_loss": -27.778303146362305, "global_step": 578705, "epoch": 6972} {"train_loss": -27.6065673828125, "global_step": 578706, "epoch": 6972} {"train_loss": -27.787933349609375, "global_step": 578707, "epoch": 6972} {"train_loss": -27.640111923217773, "global_step": 578708, "epoch": 6972} {"train_loss": -27.761417388916016, "global_step": 578709, "epoch": 6972} {"train_loss": -27.861133575439453, "global_step": 578710, "epoch": 6972} {"train_loss": -27.64762306213379, "global_step": 578711, "epoch": 6972} {"train_loss": -27.476232528686523, "global_step": 578712, "epoch": 6972} {"train_loss": -27.712890625, "global_step": 578713, "epoch": 6972} {"train_loss": -27.81648063659668, "global_step": 578714, "epoch": 6972} {"train_loss": -27.68598747253418, "global_step": 578715, "epoch": 6972} {"train_loss": -27.75375747680664, "global_step": 578716, "epoch": 6972} {"train_loss": -28.10792350769043, "global_step": 578717, "epoch": 6972} {"train_loss": -27.80950927734375, "global_step": 578718, "epoch": 6972} {"train_loss": -27.544950485229492, "global_step": 578719, "epoch": 6972} {"train_loss": -28.329151153564453, "global_step": 578720, "epoch": 6972} {"train_loss": -27.67437171936035, "global_step": 578721, "epoch": 6972} {"train_loss": -28.227340698242188, "global_step": 578722, "epoch": 6972} {"train_loss": -28.037092208862305, "global_step": 578723, "epoch": 6972} {"train_loss": -28.161718368530273, "global_step": 578724, "epoch": 6972} {"train_loss": -28.257471084594727, "global_step": 578725, "epoch": 6972} {"train_loss": -28.049360275268555, "global_step": 578726, "epoch": 6972} {"train_loss": -27.76446533203125, "global_step": 578727, "epoch": 6972} {"train_loss": -27.97555923461914, "global_step": 578728, "epoch": 6972} {"train_loss": -28.10774040222168, "global_step": 578729, "epoch": 6972} {"train_loss": -28.422719955444336, "global_step": 578730, "epoch": 6972} {"train_loss": -27.940998077392578, "global_step": 578731, "epoch": 6972} {"train_loss": -28.009723663330078, "global_step": 578732, "epoch": 6972} {"train_loss": -28.123987197875977, "global_step": 578733, "epoch": 6972} {"train_loss": -27.738422393798828, "global_step": 578734, "epoch": 6972} {"train_loss": -27.951202392578125, "global_step": 578735, "epoch": 6972} {"train_loss": -28.012495040893555, "global_step": 578736, "epoch": 6972} {"train_loss": -28.031158447265625, "global_step": 578737, "epoch": 6972} {"train_loss": -27.867630004882812, "global_step": 578738, "epoch": 6972} {"train_loss": -28.047712326049805, "global_step": 578739, "epoch": 6972} {"train_loss": -27.834753036499023, "global_step": 578740, "epoch": 6972} {"train_loss": -28.21360206604004, "global_step": 578741, "epoch": 6972} {"train_loss": -27.89129066467285, "global_step": 578742, "epoch": 6972} {"train_loss": -27.770044326782227, "global_step": 578743, "epoch": 6972} {"train_loss": -28.17536735534668, "global_step": 578744, "epoch": 6972} {"train_loss": -27.537872314453125, "global_step": 578745, "epoch": 6972} {"train_loss": -27.82636070251465, "global_step": 578746, "epoch": 6972} {"train_loss": -27.907129287719727, "global_step": 578747, "epoch": 6972} {"train_loss": -28.069440841674805, "global_step": 578748, "epoch": 6972} {"train_loss": -28.07183837890625, "global_step": 578749, "epoch": 6972} {"train_loss": -28.115921020507812, "global_step": 578750, "epoch": 6972} {"train_loss": -28.071746826171875, "global_step": 578751, "epoch": 6972} {"train_loss": -27.838464736938477, "global_step": 578752, "epoch": 6972} {"train_loss": -28.123260498046875, "global_step": 578753, "epoch": 6972} {"train_loss": -28.36079978942871, "global_step": 578754, "epoch": 6972} {"train_loss": -27.72205924987793, "global_step": 578755, "epoch": 6972} {"train_loss": -27.886449813842773, "global_step": 578756, "epoch": 6972} {"train_loss": -27.87359619140625, "global_step": 578757, "epoch": 6972} {"train_loss": -27.689301801015095, "global_step": 578758, "epoch": 6972, "val_loss": 6528395.0} {"train_loss": -23.19556999206543, "global_step": 578759, "epoch": 6973} {"train_loss": -26.90398597717285, "global_step": 578760, "epoch": 6973} {"train_loss": -22.670988082885742, "global_step": 578761, "epoch": 6973} {"train_loss": -24.93218421936035, "global_step": 578762, "epoch": 6973} {"train_loss": -24.909780502319336, "global_step": 578763, "epoch": 6973} {"train_loss": -26.060169219970703, "global_step": 578764, "epoch": 6973} {"train_loss": -26.1965389251709, "global_step": 578765, "epoch": 6973} {"train_loss": -25.639326095581055, "global_step": 578766, "epoch": 6973} {"train_loss": -25.888208389282227, "global_step": 578767, "epoch": 6973} {"train_loss": -26.0765323638916, "global_step": 578768, "epoch": 6973} {"train_loss": -26.66529655456543, "global_step": 578769, "epoch": 6973} {"train_loss": -26.27777671813965, "global_step": 578770, "epoch": 6973} {"train_loss": -26.384845733642578, "global_step": 578771, "epoch": 6973} {"train_loss": -25.967395782470703, "global_step": 578772, "epoch": 6973} {"train_loss": -26.661706924438477, "global_step": 578773, "epoch": 6973} {"train_loss": -26.44431495666504, "global_step": 578774, "epoch": 6973} {"train_loss": -26.40105628967285, "global_step": 578775, "epoch": 6973} {"train_loss": -26.727514266967773, "global_step": 578776, "epoch": 6973} {"train_loss": -26.680082321166992, "global_step": 578777, "epoch": 6973} {"train_loss": -26.67352867126465, "global_step": 578778, "epoch": 6973} {"train_loss": -27.302276611328125, "global_step": 578779, "epoch": 6973} {"train_loss": -26.611318588256836, "global_step": 578780, "epoch": 6973} {"train_loss": -26.543745040893555, "global_step": 578781, "epoch": 6973} {"train_loss": -26.886335372924805, "global_step": 578782, "epoch": 6973} {"train_loss": -26.920166015625, "global_step": 578783, "epoch": 6973} {"train_loss": -26.8458251953125, "global_step": 578784, "epoch": 6973} {"train_loss": -27.129364013671875, "global_step": 578785, "epoch": 6973} {"train_loss": -26.932708740234375, "global_step": 578786, "epoch": 6973} {"train_loss": -27.126874923706055, "global_step": 578787, "epoch": 6973} {"train_loss": -27.093215942382812, "global_step": 578788, "epoch": 6973} {"train_loss": -27.424280166625977, "global_step": 578789, "epoch": 6973} {"train_loss": -27.12360191345215, "global_step": 578790, "epoch": 6973} {"train_loss": -27.337787628173828, "global_step": 578791, "epoch": 6973} {"train_loss": -27.25144386291504, "global_step": 578792, "epoch": 6973} {"train_loss": -27.600934982299805, "global_step": 578793, "epoch": 6973} {"train_loss": -27.517560958862305, "global_step": 578794, "epoch": 6973} {"train_loss": -27.15960121154785, "global_step": 578795, "epoch": 6973} {"train_loss": -27.356220245361328, "global_step": 578796, "epoch": 6973} {"train_loss": -27.52793312072754, "global_step": 578797, "epoch": 6973} {"train_loss": -27.700164794921875, "global_step": 578798, "epoch": 6973} {"train_loss": -27.623083114624023, "global_step": 578799, "epoch": 6973} {"train_loss": -27.358518600463867, "global_step": 578800, "epoch": 6973} {"train_loss": -27.477935791015625, "global_step": 578801, "epoch": 6973} {"train_loss": -27.6995906829834, "global_step": 578802, "epoch": 6973} {"train_loss": -27.70420265197754, "global_step": 578803, "epoch": 6973} {"train_loss": -27.60426139831543, "global_step": 578804, "epoch": 6973} {"train_loss": -27.641752243041992, "global_step": 578805, "epoch": 6973} {"train_loss": -27.564077377319336, "global_step": 578806, "epoch": 6973} {"train_loss": -27.912450790405273, "global_step": 578807, "epoch": 6973} {"train_loss": -27.299680709838867, "global_step": 578808, "epoch": 6973} {"train_loss": -27.760862350463867, "global_step": 578809, "epoch": 6973} {"train_loss": -27.559650421142578, "global_step": 578810, "epoch": 6973} {"train_loss": -27.92671012878418, "global_step": 578811, "epoch": 6973} {"train_loss": -27.871234893798828, "global_step": 578812, "epoch": 6973} {"train_loss": -27.756946563720703, "global_step": 578813, "epoch": 6973} {"train_loss": -27.964401245117188, "global_step": 578814, "epoch": 6973} {"train_loss": -28.150531768798828, "global_step": 578815, "epoch": 6973} {"train_loss": -27.888952255249023, "global_step": 578816, "epoch": 6973} {"train_loss": -28.111310958862305, "global_step": 578817, "epoch": 6973} {"train_loss": -27.983783721923828, "global_step": 578818, "epoch": 6973} {"train_loss": -28.31573486328125, "global_step": 578819, "epoch": 6973} {"train_loss": -27.851688385009766, "global_step": 578820, "epoch": 6973} {"train_loss": -27.759618759155273, "global_step": 578821, "epoch": 6973} {"train_loss": -27.834985733032227, "global_step": 578822, "epoch": 6973} {"train_loss": -28.283056259155273, "global_step": 578823, "epoch": 6973} {"train_loss": -27.597036361694336, "global_step": 578824, "epoch": 6973} {"train_loss": -27.747528076171875, "global_step": 578825, "epoch": 6973} {"train_loss": -27.8325138092041, "global_step": 578826, "epoch": 6973} {"train_loss": -27.72235679626465, "global_step": 578827, "epoch": 6973} {"train_loss": -27.8275146484375, "global_step": 578828, "epoch": 6973} {"train_loss": -28.0833740234375, "global_step": 578829, "epoch": 6973} {"train_loss": -28.04300308227539, "global_step": 578830, "epoch": 6973} {"train_loss": -27.957983016967773, "global_step": 578831, "epoch": 6973} {"train_loss": -27.73075294494629, "global_step": 578832, "epoch": 6973} {"train_loss": -28.062210083007812, "global_step": 578833, "epoch": 6973} {"train_loss": -27.889530181884766, "global_step": 578834, "epoch": 6973} {"train_loss": -27.74749183654785, "global_step": 578835, "epoch": 6973} {"train_loss": -27.944812774658203, "global_step": 578836, "epoch": 6973} {"train_loss": -27.368759155273438, "global_step": 578837, "epoch": 6973} {"train_loss": -28.011335372924805, "global_step": 578838, "epoch": 6973} {"train_loss": -28.147464752197266, "global_step": 578839, "epoch": 6973} {"train_loss": -28.111042022705078, "global_step": 578840, "epoch": 6973} {"train_loss": -27.188450640942676, "global_step": 578841, "epoch": 6973, "val_loss": 6474728.0} {"train_loss": -26.715320587158203, "global_step": 578842, "epoch": 6974} {"train_loss": -26.777698516845703, "global_step": 578843, "epoch": 6974} {"train_loss": -26.73360252380371, "global_step": 578844, "epoch": 6974} {"train_loss": -27.29658317565918, "global_step": 578845, "epoch": 6974} {"train_loss": -27.424375534057617, "global_step": 578846, "epoch": 6974} {"train_loss": -27.047962188720703, "global_step": 578847, "epoch": 6974} {"train_loss": -27.68741798400879, "global_step": 578848, "epoch": 6974} {"train_loss": -27.476083755493164, "global_step": 578849, "epoch": 6974} {"train_loss": -27.628393173217773, "global_step": 578850, "epoch": 6974} {"train_loss": -27.727338790893555, "global_step": 578851, "epoch": 6974} {"train_loss": -27.5101375579834, "global_step": 578852, "epoch": 6974} {"train_loss": -27.808094024658203, "global_step": 578853, "epoch": 6974} {"train_loss": -27.797393798828125, "global_step": 578854, "epoch": 6974} {"train_loss": -27.394086837768555, "global_step": 578855, "epoch": 6974} {"train_loss": -28.04819679260254, "global_step": 578856, "epoch": 6974} {"train_loss": -27.60695457458496, "global_step": 578857, "epoch": 6974} {"train_loss": -27.367170333862305, "global_step": 578858, "epoch": 6974} {"train_loss": -27.554296493530273, "global_step": 578859, "epoch": 6974} {"train_loss": -27.453290939331055, "global_step": 578860, "epoch": 6974} {"train_loss": -28.20253562927246, "global_step": 578861, "epoch": 6974} {"train_loss": -27.569095611572266, "global_step": 578862, "epoch": 6974} {"train_loss": -27.7193660736084, "global_step": 578863, "epoch": 6974} {"train_loss": -27.614822387695312, "global_step": 578864, "epoch": 6974} {"train_loss": -27.951629638671875, "global_step": 578865, "epoch": 6974} {"train_loss": -27.720813751220703, "global_step": 578866, "epoch": 6974} {"train_loss": -27.866621017456055, "global_step": 578867, "epoch": 6974} {"train_loss": -27.970123291015625, "global_step": 578868, "epoch": 6974} {"train_loss": -27.5767879486084, "global_step": 578869, "epoch": 6974} {"train_loss": -28.1788272857666, "global_step": 578870, "epoch": 6974} {"train_loss": -27.81353759765625, "global_step": 578871, "epoch": 6974} {"train_loss": -27.617700576782227, "global_step": 578872, "epoch": 6974} {"train_loss": -27.892898559570312, "global_step": 578873, "epoch": 6974} {"train_loss": -28.000646591186523, "global_step": 578874, "epoch": 6974} {"train_loss": -27.629995346069336, "global_step": 578875, "epoch": 6974} {"train_loss": -27.825336456298828, "global_step": 578876, "epoch": 6974} {"train_loss": -27.649580001831055, "global_step": 578877, "epoch": 6974} {"train_loss": -27.85902214050293, "global_step": 578878, "epoch": 6974} {"train_loss": -27.71525001525879, "global_step": 578879, "epoch": 6974} {"train_loss": -27.952478408813477, "global_step": 578880, "epoch": 6974} {"train_loss": -28.266611099243164, "global_step": 578881, "epoch": 6974} {"train_loss": -28.040903091430664, "global_step": 578882, "epoch": 6974} {"train_loss": -27.726516723632812, "global_step": 578883, "epoch": 6974} {"train_loss": -27.97353172302246, "global_step": 578884, "epoch": 6974} {"train_loss": -27.966222763061523, "global_step": 578885, "epoch": 6974} {"train_loss": -27.77154541015625, "global_step": 578886, "epoch": 6974} {"train_loss": -27.947492599487305, "global_step": 578887, "epoch": 6974} {"train_loss": -27.692529678344727, "global_step": 578888, "epoch": 6974} {"train_loss": -27.332666397094727, "global_step": 578889, "epoch": 6974} {"train_loss": -27.006189346313477, "global_step": 578890, "epoch": 6974} {"train_loss": -27.17563819885254, "global_step": 578891, "epoch": 6974} {"train_loss": -28.06056022644043, "global_step": 578892, "epoch": 6974} {"train_loss": -27.67518424987793, "global_step": 578893, "epoch": 6974} {"train_loss": -27.799421310424805, "global_step": 578894, "epoch": 6974} {"train_loss": -27.986616134643555, "global_step": 578895, "epoch": 6974} {"train_loss": -27.916797637939453, "global_step": 578896, "epoch": 6974} {"train_loss": -27.975830078125, "global_step": 578897, "epoch": 6974} {"train_loss": -28.038288116455078, "global_step": 578898, "epoch": 6974} {"train_loss": -28.111948013305664, "global_step": 578899, "epoch": 6974} {"train_loss": -27.94675636291504, "global_step": 578900, "epoch": 6974} {"train_loss": -28.175703048706055, "global_step": 578901, "epoch": 6974} {"train_loss": -27.918691635131836, "global_step": 578902, "epoch": 6974} {"train_loss": -28.151514053344727, "global_step": 578903, "epoch": 6974} {"train_loss": -27.9746150970459, "global_step": 578904, "epoch": 6974} {"train_loss": -27.864288330078125, "global_step": 578905, "epoch": 6974} {"train_loss": -27.9134578704834, "global_step": 578906, "epoch": 6974} {"train_loss": -27.88666343688965, "global_step": 578907, "epoch": 6974} {"train_loss": -27.90260124206543, "global_step": 578908, "epoch": 6974} {"train_loss": -28.04314613342285, "global_step": 578909, "epoch": 6974} {"train_loss": -27.67848777770996, "global_step": 578910, "epoch": 6974} {"train_loss": -28.377023696899414, "global_step": 578911, "epoch": 6974} {"train_loss": -27.924360275268555, "global_step": 578912, "epoch": 6974} {"train_loss": -27.79120445251465, "global_step": 578913, "epoch": 6974} {"train_loss": -27.874372482299805, "global_step": 578914, "epoch": 6974} {"train_loss": -28.02762222290039, "global_step": 578915, "epoch": 6974} {"train_loss": -28.20979118347168, "global_step": 578916, "epoch": 6974} {"train_loss": -27.89080810546875, "global_step": 578917, "epoch": 6974} {"train_loss": -27.734573364257812, "global_step": 578918, "epoch": 6974} {"train_loss": -28.034626007080078, "global_step": 578919, "epoch": 6974} {"train_loss": -28.056066513061523, "global_step": 578920, "epoch": 6974} {"train_loss": -27.9060115814209, "global_step": 578921, "epoch": 6974} {"train_loss": -27.721384048461914, "global_step": 578922, "epoch": 6974} {"train_loss": -28.31842041015625, "global_step": 578923, "epoch": 6974} {"train_loss": -27.77361159726798, "global_step": 578924, "epoch": 6974, "val_loss": 6442332.0} {"train_loss": -27.70557975769043, "global_step": 578925, "epoch": 6975} {"train_loss": -27.7232666015625, "global_step": 578926, "epoch": 6975} {"train_loss": -27.70684242248535, "global_step": 578927, "epoch": 6975} {"train_loss": -27.722639083862305, "global_step": 578928, "epoch": 6975} {"train_loss": -27.49769401550293, "global_step": 578929, "epoch": 6975} {"train_loss": -27.426788330078125, "global_step": 578930, "epoch": 6975} {"train_loss": -26.613122940063477, "global_step": 578931, "epoch": 6975} {"train_loss": -25.900793075561523, "global_step": 578932, "epoch": 6975} {"train_loss": -26.33584976196289, "global_step": 578933, "epoch": 6975} {"train_loss": -26.83037757873535, "global_step": 578934, "epoch": 6975} {"train_loss": -27.06199073791504, "global_step": 578935, "epoch": 6975} {"train_loss": -27.0394344329834, "global_step": 578936, "epoch": 6975} {"train_loss": -26.851211547851562, "global_step": 578937, "epoch": 6975} {"train_loss": -26.79981803894043, "global_step": 578938, "epoch": 6975} {"train_loss": -27.977996826171875, "global_step": 578939, "epoch": 6975} {"train_loss": -27.109582901000977, "global_step": 578940, "epoch": 6975} {"train_loss": -27.64544105529785, "global_step": 578941, "epoch": 6975} {"train_loss": -27.717206954956055, "global_step": 578942, "epoch": 6975} {"train_loss": -27.762561798095703, "global_step": 578943, "epoch": 6975} {"train_loss": -27.421783447265625, "global_step": 578944, "epoch": 6975} {"train_loss": -27.383520126342773, "global_step": 578945, "epoch": 6975} {"train_loss": -27.367645263671875, "global_step": 578946, "epoch": 6975} {"train_loss": -27.44342613220215, "global_step": 578947, "epoch": 6975} {"train_loss": -27.4625186920166, "global_step": 578948, "epoch": 6975} {"train_loss": -27.200159072875977, "global_step": 578949, "epoch": 6975} {"train_loss": -27.605972290039062, "global_step": 578950, "epoch": 6975} {"train_loss": -27.478994369506836, "global_step": 578951, "epoch": 6975} {"train_loss": -27.494977951049805, "global_step": 578952, "epoch": 6975} {"train_loss": -27.665863037109375, "global_step": 578953, "epoch": 6975} {"train_loss": -27.6882266998291, "global_step": 578954, "epoch": 6975} {"train_loss": -27.466604232788086, "global_step": 578955, "epoch": 6975} {"train_loss": -27.762876510620117, "global_step": 578956, "epoch": 6975} {"train_loss": -27.8407039642334, "global_step": 578957, "epoch": 6975} {"train_loss": -27.730005264282227, "global_step": 578958, "epoch": 6975} {"train_loss": -27.219562530517578, "global_step": 578959, "epoch": 6975} {"train_loss": -28.112218856811523, "global_step": 578960, "epoch": 6975} {"train_loss": -28.01639747619629, "global_step": 578961, "epoch": 6975} {"train_loss": -27.602258682250977, "global_step": 578962, "epoch": 6975} {"train_loss": -28.033573150634766, "global_step": 578963, "epoch": 6975} {"train_loss": -27.643280029296875, "global_step": 578964, "epoch": 6975} {"train_loss": -28.0570068359375, "global_step": 578965, "epoch": 6975} {"train_loss": -27.912321090698242, "global_step": 578966, "epoch": 6975} {"train_loss": -27.816991806030273, "global_step": 578967, "epoch": 6975} {"train_loss": -27.756031036376953, "global_step": 578968, "epoch": 6975} {"train_loss": -27.798086166381836, "global_step": 578969, "epoch": 6975} {"train_loss": -27.9084415435791, "global_step": 578970, "epoch": 6975} {"train_loss": -28.1160888671875, "global_step": 578971, "epoch": 6975} {"train_loss": -27.810205459594727, "global_step": 578972, "epoch": 6975} {"train_loss": -27.784704208374023, "global_step": 578973, "epoch": 6975} {"train_loss": -27.975549697875977, "global_step": 578974, "epoch": 6975} {"train_loss": -28.026580810546875, "global_step": 578975, "epoch": 6975} {"train_loss": -28.295209884643555, "global_step": 578976, "epoch": 6975} {"train_loss": -27.825698852539062, "global_step": 578977, "epoch": 6975} {"train_loss": -27.96687126159668, "global_step": 578978, "epoch": 6975} {"train_loss": -28.24237632751465, "global_step": 578979, "epoch": 6975} {"train_loss": -28.1678466796875, "global_step": 578980, "epoch": 6975} {"train_loss": -27.834716796875, "global_step": 578981, "epoch": 6975} {"train_loss": -27.922042846679688, "global_step": 578982, "epoch": 6975} {"train_loss": -28.00977897644043, "global_step": 578983, "epoch": 6975} {"train_loss": -28.02205467224121, "global_step": 578984, "epoch": 6975} {"train_loss": -28.058759689331055, "global_step": 578985, "epoch": 6975} {"train_loss": -27.947248458862305, "global_step": 578986, "epoch": 6975} {"train_loss": -28.19940757751465, "global_step": 578987, "epoch": 6975} {"train_loss": -28.476943969726562, "global_step": 578988, "epoch": 6975} {"train_loss": -28.087615966796875, "global_step": 578989, "epoch": 6975} {"train_loss": -28.358800888061523, "global_step": 578990, "epoch": 6975} {"train_loss": -27.998184204101562, "global_step": 578991, "epoch": 6975} {"train_loss": -28.1013240814209, "global_step": 578992, "epoch": 6975} {"train_loss": -28.084970474243164, "global_step": 578993, "epoch": 6975} {"train_loss": -28.208372116088867, "global_step": 578994, "epoch": 6975} {"train_loss": -28.181058883666992, "global_step": 578995, "epoch": 6975} {"train_loss": -27.8448543548584, "global_step": 578996, "epoch": 6975} {"train_loss": -28.1524658203125, "global_step": 578997, "epoch": 6975} {"train_loss": -27.821889877319336, "global_step": 578998, "epoch": 6975} {"train_loss": -27.997634887695312, "global_step": 578999, "epoch": 6975} {"train_loss": -27.83856201171875, "global_step": 579000, "epoch": 6975} {"train_loss": -28.071496963500977, "global_step": 579001, "epoch": 6975} {"train_loss": -27.762516021728516, "global_step": 579002, "epoch": 6975} {"train_loss": -27.979307174682617, "global_step": 579003, "epoch": 6975} {"train_loss": -28.342086791992188, "global_step": 579004, "epoch": 6975} {"train_loss": -28.22260093688965, "global_step": 579005, "epoch": 6975} {"train_loss": -28.06477165222168, "global_step": 579006, "epoch": 6975} {"train_loss": -27.721825266458904, "global_step": 579007, "epoch": 6975, "val_loss": 6436038.0} {"train_loss": -27.707752227783203, "global_step": 579008, "epoch": 6976} {"train_loss": -27.376516342163086, "global_step": 579009, "epoch": 6976} {"train_loss": -26.901845932006836, "global_step": 579010, "epoch": 6976} {"train_loss": -27.088703155517578, "global_step": 579011, "epoch": 6976} {"train_loss": -26.951141357421875, "global_step": 579012, "epoch": 6976} {"train_loss": -27.43409538269043, "global_step": 579013, "epoch": 6976} {"train_loss": -27.3165340423584, "global_step": 579014, "epoch": 6976} {"train_loss": -27.413482666015625, "global_step": 579015, "epoch": 6976} {"train_loss": -27.783924102783203, "global_step": 579016, "epoch": 6976} {"train_loss": -27.606510162353516, "global_step": 579017, "epoch": 6976} {"train_loss": -27.260883331298828, "global_step": 579018, "epoch": 6976} {"train_loss": -27.02765464782715, "global_step": 579019, "epoch": 6976} {"train_loss": -27.388818740844727, "global_step": 579020, "epoch": 6976} {"train_loss": -27.716400146484375, "global_step": 579021, "epoch": 6976} {"train_loss": -27.368637084960938, "global_step": 579022, "epoch": 6976} {"train_loss": -27.4390926361084, "global_step": 579023, "epoch": 6976} {"train_loss": -27.868268966674805, "global_step": 579024, "epoch": 6976} {"train_loss": -27.68545913696289, "global_step": 579025, "epoch": 6976} {"train_loss": -27.35149574279785, "global_step": 579026, "epoch": 6976} {"train_loss": -27.368087768554688, "global_step": 579027, "epoch": 6976} {"train_loss": -27.6550350189209, "global_step": 579028, "epoch": 6976} {"train_loss": -27.790678024291992, "global_step": 579029, "epoch": 6976} {"train_loss": -27.802392959594727, "global_step": 579030, "epoch": 6976} {"train_loss": -27.90077018737793, "global_step": 579031, "epoch": 6976} {"train_loss": -27.661176681518555, "global_step": 579032, "epoch": 6976} {"train_loss": -27.6343936920166, "global_step": 579033, "epoch": 6976} {"train_loss": -27.665143966674805, "global_step": 579034, "epoch": 6976} {"train_loss": -28.012121200561523, "global_step": 579035, "epoch": 6976} {"train_loss": -27.959421157836914, "global_step": 579036, "epoch": 6976} {"train_loss": -27.859018325805664, "global_step": 579037, "epoch": 6976} {"train_loss": -28.182424545288086, "global_step": 579038, "epoch": 6976} {"train_loss": -27.973424911499023, "global_step": 579039, "epoch": 6976} {"train_loss": -27.961530685424805, "global_step": 579040, "epoch": 6976} {"train_loss": -27.529830932617188, "global_step": 579041, "epoch": 6976} {"train_loss": -27.972143173217773, "global_step": 579042, "epoch": 6976} {"train_loss": -28.10725975036621, "global_step": 579043, "epoch": 6976} {"train_loss": -28.252649307250977, "global_step": 579044, "epoch": 6976} {"train_loss": -27.921005249023438, "global_step": 579045, "epoch": 6976} {"train_loss": -28.201642990112305, "global_step": 579046, "epoch": 6976} {"train_loss": -27.975011825561523, "global_step": 579047, "epoch": 6976} {"train_loss": -27.8996639251709, "global_step": 579048, "epoch": 6976} {"train_loss": -28.409299850463867, "global_step": 579049, "epoch": 6976} {"train_loss": -28.147872924804688, "global_step": 579050, "epoch": 6976} {"train_loss": -27.774885177612305, "global_step": 579051, "epoch": 6976} {"train_loss": -28.427953720092773, "global_step": 579052, "epoch": 6976} {"train_loss": -28.193201065063477, "global_step": 579053, "epoch": 6976} {"train_loss": -28.070972442626953, "global_step": 579054, "epoch": 6976} {"train_loss": -28.155282974243164, "global_step": 579055, "epoch": 6976} {"train_loss": -28.030420303344727, "global_step": 579056, "epoch": 6976} {"train_loss": -27.838098526000977, "global_step": 579057, "epoch": 6976} {"train_loss": -28.14678382873535, "global_step": 579058, "epoch": 6976} {"train_loss": -28.408084869384766, "global_step": 579059, "epoch": 6976} {"train_loss": -28.3574275970459, "global_step": 579060, "epoch": 6976} {"train_loss": -27.989368438720703, "global_step": 579061, "epoch": 6976} {"train_loss": -28.06141471862793, "global_step": 579062, "epoch": 6976} {"train_loss": -27.875659942626953, "global_step": 579063, "epoch": 6976} {"train_loss": -28.31106948852539, "global_step": 579064, "epoch": 6976} {"train_loss": -28.01399040222168, "global_step": 579065, "epoch": 6976} {"train_loss": -27.780858993530273, "global_step": 579066, "epoch": 6976} {"train_loss": -28.05502700805664, "global_step": 579067, "epoch": 6976} {"train_loss": -28.093719482421875, "global_step": 579068, "epoch": 6976} {"train_loss": -28.090351104736328, "global_step": 579069, "epoch": 6976} {"train_loss": -28.077138900756836, "global_step": 579070, "epoch": 6976} {"train_loss": -28.216699600219727, "global_step": 579071, "epoch": 6976} {"train_loss": -28.519994735717773, "global_step": 579072, "epoch": 6976} {"train_loss": -27.924535751342773, "global_step": 579073, "epoch": 6976} {"train_loss": -28.266416549682617, "global_step": 579074, "epoch": 6976} {"train_loss": -28.013263702392578, "global_step": 579075, "epoch": 6976} {"train_loss": -27.396686553955078, "global_step": 579076, "epoch": 6976} {"train_loss": -27.43671989440918, "global_step": 579077, "epoch": 6976} {"train_loss": -27.623859405517578, "global_step": 579078, "epoch": 6976} {"train_loss": -28.055768966674805, "global_step": 579079, "epoch": 6976} {"train_loss": -28.30568504333496, "global_step": 579080, "epoch": 6976} {"train_loss": -27.695404052734375, "global_step": 579081, "epoch": 6976} {"train_loss": -27.6949405670166, "global_step": 579082, "epoch": 6976} {"train_loss": -27.799591064453125, "global_step": 579083, "epoch": 6976} {"train_loss": -28.127042770385742, "global_step": 579084, "epoch": 6976} {"train_loss": -27.68133544921875, "global_step": 579085, "epoch": 6976} {"train_loss": -27.918018341064453, "global_step": 579086, "epoch": 6976} {"train_loss": -27.442935943603516, "global_step": 579087, "epoch": 6976} {"train_loss": -27.565256118774414, "global_step": 579088, "epoch": 6976} {"train_loss": -28.082324981689453, "global_step": 579089, "epoch": 6976} {"train_loss": -27.813234007502178, "global_step": 579090, "epoch": 6976, "val_loss": 6461269.5} {"train_loss": -27.59429359436035, "global_step": 579091, "epoch": 6977} {"train_loss": -27.241174697875977, "global_step": 579092, "epoch": 6977} {"train_loss": -27.2055721282959, "global_step": 579093, "epoch": 6977} {"train_loss": -27.125568389892578, "global_step": 579094, "epoch": 6977} {"train_loss": -27.610980987548828, "global_step": 579095, "epoch": 6977} {"train_loss": -27.829132080078125, "global_step": 579096, "epoch": 6977} {"train_loss": -27.402881622314453, "global_step": 579097, "epoch": 6977} {"train_loss": -27.512304306030273, "global_step": 579098, "epoch": 6977} {"train_loss": -27.2985897064209, "global_step": 579099, "epoch": 6977} {"train_loss": -27.508527755737305, "global_step": 579100, "epoch": 6977} {"train_loss": -27.466482162475586, "global_step": 579101, "epoch": 6977} {"train_loss": -26.77796745300293, "global_step": 579102, "epoch": 6977} {"train_loss": -27.986974716186523, "global_step": 579103, "epoch": 6977} {"train_loss": -27.68146324157715, "global_step": 579104, "epoch": 6977} {"train_loss": -27.257566452026367, "global_step": 579105, "epoch": 6977} {"train_loss": -28.074811935424805, "global_step": 579106, "epoch": 6977} {"train_loss": -27.478967666625977, "global_step": 579107, "epoch": 6977} {"train_loss": -27.50824546813965, "global_step": 579108, "epoch": 6977} {"train_loss": -27.54263687133789, "global_step": 579109, "epoch": 6977} {"train_loss": -27.595565795898438, "global_step": 579110, "epoch": 6977} {"train_loss": -27.648284912109375, "global_step": 579111, "epoch": 6977} {"train_loss": -27.87457275390625, "global_step": 579112, "epoch": 6977} {"train_loss": -27.779895782470703, "global_step": 579113, "epoch": 6977} {"train_loss": -27.68580436706543, "global_step": 579114, "epoch": 6977} {"train_loss": -27.391565322875977, "global_step": 579115, "epoch": 6977} {"train_loss": -27.754352569580078, "global_step": 579116, "epoch": 6977} {"train_loss": -28.064533233642578, "global_step": 579117, "epoch": 6977} {"train_loss": -27.470062255859375, "global_step": 579118, "epoch": 6977} {"train_loss": -27.753042221069336, "global_step": 579119, "epoch": 6977} {"train_loss": -27.495868682861328, "global_step": 579120, "epoch": 6977} {"train_loss": -27.341815948486328, "global_step": 579121, "epoch": 6977} {"train_loss": -27.484830856323242, "global_step": 579122, "epoch": 6977} {"train_loss": -27.991291046142578, "global_step": 579123, "epoch": 6977} {"train_loss": -27.762006759643555, "global_step": 579124, "epoch": 6977} {"train_loss": -27.6981201171875, "global_step": 579125, "epoch": 6977} {"train_loss": -27.706226348876953, "global_step": 579126, "epoch": 6977} {"train_loss": -28.02032470703125, "global_step": 579127, "epoch": 6977} {"train_loss": -27.697895050048828, "global_step": 579128, "epoch": 6977} {"train_loss": -27.754409790039062, "global_step": 579129, "epoch": 6977} {"train_loss": -27.801904678344727, "global_step": 579130, "epoch": 6977} {"train_loss": -28.27947425842285, "global_step": 579131, "epoch": 6977} {"train_loss": -28.1043758392334, "global_step": 579132, "epoch": 6977} {"train_loss": -28.100589752197266, "global_step": 579133, "epoch": 6977} {"train_loss": -28.007978439331055, "global_step": 579134, "epoch": 6977} {"train_loss": -27.94024658203125, "global_step": 579135, "epoch": 6977} {"train_loss": -27.79436683654785, "global_step": 579136, "epoch": 6977} {"train_loss": -27.755157470703125, "global_step": 579137, "epoch": 6977} {"train_loss": -28.198013305664062, "global_step": 579138, "epoch": 6977} {"train_loss": -27.679723739624023, "global_step": 579139, "epoch": 6977} {"train_loss": -27.83037757873535, "global_step": 579140, "epoch": 6977} {"train_loss": -28.17303466796875, "global_step": 579141, "epoch": 6977} {"train_loss": -28.041671752929688, "global_step": 579142, "epoch": 6977} {"train_loss": -27.809743881225586, "global_step": 579143, "epoch": 6977} {"train_loss": -27.972166061401367, "global_step": 579144, "epoch": 6977} {"train_loss": -27.885894775390625, "global_step": 579145, "epoch": 6977} {"train_loss": -27.95745849609375, "global_step": 579146, "epoch": 6977} {"train_loss": -28.2346134185791, "global_step": 579147, "epoch": 6977} {"train_loss": -27.765295028686523, "global_step": 579148, "epoch": 6977} {"train_loss": -28.275766372680664, "global_step": 579149, "epoch": 6977} {"train_loss": -27.68938636779785, "global_step": 579150, "epoch": 6977} {"train_loss": -27.927265167236328, "global_step": 579151, "epoch": 6977} {"train_loss": -28.26239013671875, "global_step": 579152, "epoch": 6977} {"train_loss": -28.149749755859375, "global_step": 579153, "epoch": 6977} {"train_loss": -28.266637802124023, "global_step": 579154, "epoch": 6977} {"train_loss": -28.381439208984375, "global_step": 579155, "epoch": 6977} {"train_loss": -27.87354850769043, "global_step": 579156, "epoch": 6977} {"train_loss": -28.357105255126953, "global_step": 579157, "epoch": 6977} {"train_loss": -28.271656036376953, "global_step": 579158, "epoch": 6977} {"train_loss": -27.977558135986328, "global_step": 579159, "epoch": 6977} {"train_loss": -28.391260147094727, "global_step": 579160, "epoch": 6977} {"train_loss": -28.42205238342285, "global_step": 579161, "epoch": 6977} {"train_loss": -28.0015869140625, "global_step": 579162, "epoch": 6977} {"train_loss": -28.0843505859375, "global_step": 579163, "epoch": 6977} {"train_loss": -27.901737213134766, "global_step": 579164, "epoch": 6977} {"train_loss": -27.583698272705078, "global_step": 579165, "epoch": 6977} {"train_loss": -27.888395309448242, "global_step": 579166, "epoch": 6977} {"train_loss": -27.327850341796875, "global_step": 579167, "epoch": 6977} {"train_loss": -26.826810836791992, "global_step": 579168, "epoch": 6977} {"train_loss": -26.72723388671875, "global_step": 579169, "epoch": 6977} {"train_loss": -26.623401641845703, "global_step": 579170, "epoch": 6977} {"train_loss": -27.34125328063965, "global_step": 579171, "epoch": 6977} {"train_loss": -27.848989486694336, "global_step": 579172, "epoch": 6977} {"train_loss": -27.750719736857587, "global_step": 579173, "epoch": 6977, "val_loss": 6441605.0} {"train_loss": -24.994062423706055, "global_step": 579174, "epoch": 6978} {"train_loss": -26.875202178955078, "global_step": 579175, "epoch": 6978} {"train_loss": -26.084508895874023, "global_step": 579176, "epoch": 6978} {"train_loss": -26.338428497314453, "global_step": 579177, "epoch": 6978} {"train_loss": -26.26491355895996, "global_step": 579178, "epoch": 6978} {"train_loss": -26.405902862548828, "global_step": 579179, "epoch": 6978} {"train_loss": -26.475555419921875, "global_step": 579180, "epoch": 6978} {"train_loss": -27.085315704345703, "global_step": 579181, "epoch": 6978} {"train_loss": -26.9183292388916, "global_step": 579182, "epoch": 6978} {"train_loss": -26.917407989501953, "global_step": 579183, "epoch": 6978} {"train_loss": -26.882617950439453, "global_step": 579184, "epoch": 6978} {"train_loss": -26.566144943237305, "global_step": 579185, "epoch": 6978} {"train_loss": -26.90423011779785, "global_step": 579186, "epoch": 6978} {"train_loss": -26.9985408782959, "global_step": 579187, "epoch": 6978} {"train_loss": -27.345117568969727, "global_step": 579188, "epoch": 6978} {"train_loss": -27.037267684936523, "global_step": 579189, "epoch": 6978} {"train_loss": -27.04078483581543, "global_step": 579190, "epoch": 6978} {"train_loss": -27.458057403564453, "global_step": 579191, "epoch": 6978} {"train_loss": -27.3795166015625, "global_step": 579192, "epoch": 6978} {"train_loss": -27.0240535736084, "global_step": 579193, "epoch": 6978} {"train_loss": -27.04677391052246, "global_step": 579194, "epoch": 6978} {"train_loss": -27.288375854492188, "global_step": 579195, "epoch": 6978} {"train_loss": -27.257953643798828, "global_step": 579196, "epoch": 6978} {"train_loss": -27.827239990234375, "global_step": 579197, "epoch": 6978} {"train_loss": -27.192541122436523, "global_step": 579198, "epoch": 6978} {"train_loss": -27.527240753173828, "global_step": 579199, "epoch": 6978} {"train_loss": -27.292078018188477, "global_step": 579200, "epoch": 6978} {"train_loss": -27.5764217376709, "global_step": 579201, "epoch": 6978} {"train_loss": -27.384647369384766, "global_step": 579202, "epoch": 6978} {"train_loss": -27.66868019104004, "global_step": 579203, "epoch": 6978} {"train_loss": -27.681976318359375, "global_step": 579204, "epoch": 6978} {"train_loss": -27.734848022460938, "global_step": 579205, "epoch": 6978} {"train_loss": -27.64589500427246, "global_step": 579206, "epoch": 6978} {"train_loss": -27.401386260986328, "global_step": 579207, "epoch": 6978} {"train_loss": -27.17878532409668, "global_step": 579208, "epoch": 6978} {"train_loss": -27.738147735595703, "global_step": 579209, "epoch": 6978} {"train_loss": -27.895832061767578, "global_step": 579210, "epoch": 6978} {"train_loss": -27.70087242126465, "global_step": 579211, "epoch": 6978} {"train_loss": -27.649152755737305, "global_step": 579212, "epoch": 6978} {"train_loss": -27.713232040405273, "global_step": 579213, "epoch": 6978} {"train_loss": -27.466278076171875, "global_step": 579214, "epoch": 6978} {"train_loss": -27.954833984375, "global_step": 579215, "epoch": 6978} {"train_loss": -27.909595489501953, "global_step": 579216, "epoch": 6978} {"train_loss": -27.664968490600586, "global_step": 579217, "epoch": 6978} {"train_loss": -27.87200355529785, "global_step": 579218, "epoch": 6978} {"train_loss": -27.816267013549805, "global_step": 579219, "epoch": 6978} {"train_loss": -27.978118896484375, "global_step": 579220, "epoch": 6978} {"train_loss": -27.97844886779785, "global_step": 579221, "epoch": 6978} {"train_loss": -28.179479598999023, "global_step": 579222, "epoch": 6978} {"train_loss": -27.87649917602539, "global_step": 579223, "epoch": 6978} {"train_loss": -27.72434425354004, "global_step": 579224, "epoch": 6978} {"train_loss": -27.921844482421875, "global_step": 579225, "epoch": 6978} {"train_loss": -27.774450302124023, "global_step": 579226, "epoch": 6978} {"train_loss": -28.6920166015625, "global_step": 579227, "epoch": 6978} {"train_loss": -27.676538467407227, "global_step": 579228, "epoch": 6978} {"train_loss": -28.272619247436523, "global_step": 579229, "epoch": 6978} {"train_loss": -27.6966609954834, "global_step": 579230, "epoch": 6978} {"train_loss": -27.923315048217773, "global_step": 579231, "epoch": 6978} {"train_loss": -28.022369384765625, "global_step": 579232, "epoch": 6978} {"train_loss": -27.95075798034668, "global_step": 579233, "epoch": 6978} {"train_loss": -28.0129451751709, "global_step": 579234, "epoch": 6978} {"train_loss": -27.61591911315918, "global_step": 579235, "epoch": 6978} {"train_loss": -28.254301071166992, "global_step": 579236, "epoch": 6978} {"train_loss": -28.007261276245117, "global_step": 579237, "epoch": 6978} {"train_loss": -27.789045333862305, "global_step": 579238, "epoch": 6978} {"train_loss": -27.525379180908203, "global_step": 579239, "epoch": 6978} {"train_loss": -28.165624618530273, "global_step": 579240, "epoch": 6978} {"train_loss": -28.406143188476562, "global_step": 579241, "epoch": 6978} {"train_loss": -28.133808135986328, "global_step": 579242, "epoch": 6978} {"train_loss": -27.656085968017578, "global_step": 579243, "epoch": 6978} {"train_loss": -26.541961669921875, "global_step": 579244, "epoch": 6978} {"train_loss": -26.234134674072266, "global_step": 579245, "epoch": 6978} {"train_loss": -28.27797508239746, "global_step": 579246, "epoch": 6978} {"train_loss": -27.090600967407227, "global_step": 579247, "epoch": 6978} {"train_loss": -26.982574462890625, "global_step": 579248, "epoch": 6978} {"train_loss": -28.085065841674805, "global_step": 579249, "epoch": 6978} {"train_loss": -27.040414810180664, "global_step": 579250, "epoch": 6978} {"train_loss": -28.17205238342285, "global_step": 579251, "epoch": 6978} {"train_loss": -27.40321159362793, "global_step": 579252, "epoch": 6978} {"train_loss": -27.717914581298828, "global_step": 579253, "epoch": 6978} {"train_loss": -27.749937057495117, "global_step": 579254, "epoch": 6978} {"train_loss": -27.82773780822754, "global_step": 579255, "epoch": 6978} {"train_loss": -27.472659260393627, "global_step": 579256, "epoch": 6978, "val_loss": 6441977.5} {"train_loss": -27.085485458374023, "global_step": 579257, "epoch": 6979} {"train_loss": -25.74298095703125, "global_step": 579258, "epoch": 6979} {"train_loss": -27.210163116455078, "global_step": 579259, "epoch": 6979} {"train_loss": -26.581501007080078, "global_step": 579260, "epoch": 6979} {"train_loss": -27.233123779296875, "global_step": 579261, "epoch": 6979} {"train_loss": -26.97144889831543, "global_step": 579262, "epoch": 6979} {"train_loss": -27.390546798706055, "global_step": 579263, "epoch": 6979} {"train_loss": -27.077899932861328, "global_step": 579264, "epoch": 6979} {"train_loss": -26.406789779663086, "global_step": 579265, "epoch": 6979} {"train_loss": -26.974964141845703, "global_step": 579266, "epoch": 6979} {"train_loss": -27.474218368530273, "global_step": 579267, "epoch": 6979} {"train_loss": -27.1901912689209, "global_step": 579268, "epoch": 6979} {"train_loss": -26.47430992126465, "global_step": 579269, "epoch": 6979} {"train_loss": -27.512481689453125, "global_step": 579270, "epoch": 6979} {"train_loss": -27.42524528503418, "global_step": 579271, "epoch": 6979} {"train_loss": -27.325361251831055, "global_step": 579272, "epoch": 6979} {"train_loss": -26.717084884643555, "global_step": 579273, "epoch": 6979} {"train_loss": -26.77736473083496, "global_step": 579274, "epoch": 6979} {"train_loss": -27.085128784179688, "global_step": 579275, "epoch": 6979} {"train_loss": -26.744251251220703, "global_step": 579276, "epoch": 6979} {"train_loss": -27.412195205688477, "global_step": 579277, "epoch": 6979} {"train_loss": -27.932098388671875, "global_step": 579278, "epoch": 6979} {"train_loss": -27.6752872467041, "global_step": 579279, "epoch": 6979} {"train_loss": -27.466291427612305, "global_step": 579280, "epoch": 6979} {"train_loss": -27.270736694335938, "global_step": 579281, "epoch": 6979} {"train_loss": -27.40130043029785, "global_step": 579282, "epoch": 6979} {"train_loss": -27.66025161743164, "global_step": 579283, "epoch": 6979} {"train_loss": -27.74750328063965, "global_step": 579284, "epoch": 6979} {"train_loss": -27.3935489654541, "global_step": 579285, "epoch": 6979} {"train_loss": -27.873090744018555, "global_step": 579286, "epoch": 6979} {"train_loss": -27.861530303955078, "global_step": 579287, "epoch": 6979} {"train_loss": -27.374643325805664, "global_step": 579288, "epoch": 6979} {"train_loss": -27.10995864868164, "global_step": 579289, "epoch": 6979} {"train_loss": -27.553211212158203, "global_step": 579290, "epoch": 6979} {"train_loss": -27.3474178314209, "global_step": 579291, "epoch": 6979} {"train_loss": -27.319665908813477, "global_step": 579292, "epoch": 6979} {"train_loss": -27.750951766967773, "global_step": 579293, "epoch": 6979} {"train_loss": -27.922718048095703, "global_step": 579294, "epoch": 6979} {"train_loss": -28.09819984436035, "global_step": 579295, "epoch": 6979} {"train_loss": -27.76734733581543, "global_step": 579296, "epoch": 6979} {"train_loss": -28.0782527923584, "global_step": 579297, "epoch": 6979} {"train_loss": -27.80742835998535, "global_step": 579298, "epoch": 6979} {"train_loss": -27.715011596679688, "global_step": 579299, "epoch": 6979} {"train_loss": -27.8770694732666, "global_step": 579300, "epoch": 6979} {"train_loss": -27.739770889282227, "global_step": 579301, "epoch": 6979} {"train_loss": -27.67230796813965, "global_step": 579302, "epoch": 6979} {"train_loss": -27.877927780151367, "global_step": 579303, "epoch": 6979} {"train_loss": -27.53204345703125, "global_step": 579304, "epoch": 6979} {"train_loss": -27.705514907836914, "global_step": 579305, "epoch": 6979} {"train_loss": -28.139556884765625, "global_step": 579306, "epoch": 6979} {"train_loss": -27.79620933532715, "global_step": 579307, "epoch": 6979} {"train_loss": -27.361682891845703, "global_step": 579308, "epoch": 6979} {"train_loss": -28.126462936401367, "global_step": 579309, "epoch": 6979} {"train_loss": -27.91765785217285, "global_step": 579310, "epoch": 6979} {"train_loss": -28.147985458374023, "global_step": 579311, "epoch": 6979} {"train_loss": -28.0461368560791, "global_step": 579312, "epoch": 6979} {"train_loss": -27.925418853759766, "global_step": 579313, "epoch": 6979} {"train_loss": -27.73187255859375, "global_step": 579314, "epoch": 6979} {"train_loss": -28.163049697875977, "global_step": 579315, "epoch": 6979} {"train_loss": -27.86041259765625, "global_step": 579316, "epoch": 6979} {"train_loss": -27.83087158203125, "global_step": 579317, "epoch": 6979} {"train_loss": -28.501325607299805, "global_step": 579318, "epoch": 6979} {"train_loss": -27.895526885986328, "global_step": 579319, "epoch": 6979} {"train_loss": -28.025650024414062, "global_step": 579320, "epoch": 6979} {"train_loss": -28.2657470703125, "global_step": 579321, "epoch": 6979} {"train_loss": -27.853132247924805, "global_step": 579322, "epoch": 6979} {"train_loss": -27.985830307006836, "global_step": 579323, "epoch": 6979} {"train_loss": -28.208032608032227, "global_step": 579324, "epoch": 6979} {"train_loss": -27.8173885345459, "global_step": 579325, "epoch": 6979} {"train_loss": -28.089282989501953, "global_step": 579326, "epoch": 6979} {"train_loss": -28.148788452148438, "global_step": 579327, "epoch": 6979} {"train_loss": -28.146692276000977, "global_step": 579328, "epoch": 6979} {"train_loss": -27.97125816345215, "global_step": 579329, "epoch": 6979} {"train_loss": -28.07464599609375, "global_step": 579330, "epoch": 6979} {"train_loss": -28.24720573425293, "global_step": 579331, "epoch": 6979} {"train_loss": -27.832386016845703, "global_step": 579332, "epoch": 6979} {"train_loss": -27.95476722717285, "global_step": 579333, "epoch": 6979} {"train_loss": -27.50778579711914, "global_step": 579334, "epoch": 6979} {"train_loss": -28.00550651550293, "global_step": 579335, "epoch": 6979} {"train_loss": -27.969970703125, "global_step": 579336, "epoch": 6979} {"train_loss": -27.58455467224121, "global_step": 579337, "epoch": 6979} {"train_loss": -27.76908302307129, "global_step": 579338, "epoch": 6979} {"train_loss": -27.614729915756776, "global_step": 579339, "epoch": 6979, "val_loss": 6534943.0} {"train_loss": -27.5355224609375, "global_step": 579340, "epoch": 6980} {"train_loss": -26.868179321289062, "global_step": 579341, "epoch": 6980} {"train_loss": -27.596515655517578, "global_step": 579342, "epoch": 6980} {"train_loss": -27.2620849609375, "global_step": 579343, "epoch": 6980} {"train_loss": -26.56648826599121, "global_step": 579344, "epoch": 6980} {"train_loss": -27.172992706298828, "global_step": 579345, "epoch": 6980} {"train_loss": -27.02813720703125, "global_step": 579346, "epoch": 6980} {"train_loss": -27.32883644104004, "global_step": 579347, "epoch": 6980} {"train_loss": -27.241836547851562, "global_step": 579348, "epoch": 6980} {"train_loss": -27.426870346069336, "global_step": 579349, "epoch": 6980} {"train_loss": -27.735721588134766, "global_step": 579350, "epoch": 6980} {"train_loss": -27.450937271118164, "global_step": 579351, "epoch": 6980} {"train_loss": -27.450077056884766, "global_step": 579352, "epoch": 6980} {"train_loss": -27.768198013305664, "global_step": 579353, "epoch": 6980} {"train_loss": -27.66360855102539, "global_step": 579354, "epoch": 6980} {"train_loss": -27.48361587524414, "global_step": 579355, "epoch": 6980} {"train_loss": -27.85371971130371, "global_step": 579356, "epoch": 6980} {"train_loss": -27.568695068359375, "global_step": 579357, "epoch": 6980} {"train_loss": -27.40540885925293, "global_step": 579358, "epoch": 6980} {"train_loss": -27.553638458251953, "global_step": 579359, "epoch": 6980} {"train_loss": -27.837316513061523, "global_step": 579360, "epoch": 6980} {"train_loss": -27.901199340820312, "global_step": 579361, "epoch": 6980} {"train_loss": -27.934118270874023, "global_step": 579362, "epoch": 6980} {"train_loss": -27.77166175842285, "global_step": 579363, "epoch": 6980} {"train_loss": -27.855804443359375, "global_step": 579364, "epoch": 6980} {"train_loss": -27.84054946899414, "global_step": 579365, "epoch": 6980} {"train_loss": -27.843769073486328, "global_step": 579366, "epoch": 6980} {"train_loss": -28.060855865478516, "global_step": 579367, "epoch": 6980} {"train_loss": -27.29473304748535, "global_step": 579368, "epoch": 6980} {"train_loss": -27.627355575561523, "global_step": 579369, "epoch": 6980} {"train_loss": -27.99334144592285, "global_step": 579370, "epoch": 6980} {"train_loss": -27.907278060913086, "global_step": 579371, "epoch": 6980} {"train_loss": -27.7327823638916, "global_step": 579372, "epoch": 6980} {"train_loss": -27.52668571472168, "global_step": 579373, "epoch": 6980} {"train_loss": -28.050634384155273, "global_step": 579374, "epoch": 6980} {"train_loss": -27.913183212280273, "global_step": 579375, "epoch": 6980} {"train_loss": -27.964618682861328, "global_step": 579376, "epoch": 6980} {"train_loss": -27.895837783813477, "global_step": 579377, "epoch": 6980} {"train_loss": -28.0175724029541, "global_step": 579378, "epoch": 6980} {"train_loss": -27.887161254882812, "global_step": 579379, "epoch": 6980} {"train_loss": -28.302473068237305, "global_step": 579380, "epoch": 6980} {"train_loss": -28.022613525390625, "global_step": 579381, "epoch": 6980} {"train_loss": -28.040964126586914, "global_step": 579382, "epoch": 6980} {"train_loss": -28.028837203979492, "global_step": 579383, "epoch": 6980} {"train_loss": -28.119251251220703, "global_step": 579384, "epoch": 6980} {"train_loss": -28.416107177734375, "global_step": 579385, "epoch": 6980} {"train_loss": -27.861328125, "global_step": 579386, "epoch": 6980} {"train_loss": -27.729162216186523, "global_step": 579387, "epoch": 6980} {"train_loss": -27.940534591674805, "global_step": 579388, "epoch": 6980} {"train_loss": -28.127063751220703, "global_step": 579389, "epoch": 6980} {"train_loss": -28.1239070892334, "global_step": 579390, "epoch": 6980} {"train_loss": -28.33057975769043, "global_step": 579391, "epoch": 6980} {"train_loss": -27.911298751831055, "global_step": 579392, "epoch": 6980} {"train_loss": -27.54786491394043, "global_step": 579393, "epoch": 6980} {"train_loss": -27.628469467163086, "global_step": 579394, "epoch": 6980} {"train_loss": -27.906583786010742, "global_step": 579395, "epoch": 6980} {"train_loss": -28.161096572875977, "global_step": 579396, "epoch": 6980} {"train_loss": -27.305051803588867, "global_step": 579397, "epoch": 6980} {"train_loss": -26.884862899780273, "global_step": 579398, "epoch": 6980} {"train_loss": -27.752182006835938, "global_step": 579399, "epoch": 6980} {"train_loss": -28.026538848876953, "global_step": 579400, "epoch": 6980} {"train_loss": -27.469074249267578, "global_step": 579401, "epoch": 6980} {"train_loss": -27.8911075592041, "global_step": 579402, "epoch": 6980} {"train_loss": -27.97905921936035, "global_step": 579403, "epoch": 6980} {"train_loss": -27.72905921936035, "global_step": 579404, "epoch": 6980} {"train_loss": -27.769418716430664, "global_step": 579405, "epoch": 6980} {"train_loss": -27.81440544128418, "global_step": 579406, "epoch": 6980} {"train_loss": -28.08001708984375, "global_step": 579407, "epoch": 6980} {"train_loss": -27.992040634155273, "global_step": 579408, "epoch": 6980} {"train_loss": -28.24446678161621, "global_step": 579409, "epoch": 6980} {"train_loss": -27.671600341796875, "global_step": 579410, "epoch": 6980} {"train_loss": -27.8256893157959, "global_step": 579411, "epoch": 6980} {"train_loss": -27.472822189331055, "global_step": 579412, "epoch": 6980} {"train_loss": -27.75420570373535, "global_step": 579413, "epoch": 6980} {"train_loss": -27.820831298828125, "global_step": 579414, "epoch": 6980} {"train_loss": -28.182687759399414, "global_step": 579415, "epoch": 6980} {"train_loss": -27.953907012939453, "global_step": 579416, "epoch": 6980} {"train_loss": -27.97125816345215, "global_step": 579417, "epoch": 6980} {"train_loss": -28.106225967407227, "global_step": 579418, "epoch": 6980} {"train_loss": -27.657962799072266, "global_step": 579419, "epoch": 6980} {"train_loss": -27.84077262878418, "global_step": 579420, "epoch": 6980} {"train_loss": -28.0832462310791, "global_step": 579421, "epoch": 6980} {"train_loss": -27.752529971570855, "global_step": 579422, "epoch": 6980, "val_loss": 6487465.0} {"train_loss": -27.6755428314209, "global_step": 579423, "epoch": 6981} {"train_loss": -26.673233032226562, "global_step": 579424, "epoch": 6981} {"train_loss": -26.197107315063477, "global_step": 579425, "epoch": 6981} {"train_loss": -26.61433982849121, "global_step": 579426, "epoch": 6981} {"train_loss": -27.320545196533203, "global_step": 579427, "epoch": 6981} {"train_loss": -26.744352340698242, "global_step": 579428, "epoch": 6981} {"train_loss": -27.095050811767578, "global_step": 579429, "epoch": 6981} {"train_loss": -27.773168563842773, "global_step": 579430, "epoch": 6981} {"train_loss": -27.28214454650879, "global_step": 579431, "epoch": 6981} {"train_loss": -27.33278465270996, "global_step": 579432, "epoch": 6981} {"train_loss": -27.4964656829834, "global_step": 579433, "epoch": 6981} {"train_loss": -27.364822387695312, "global_step": 579434, "epoch": 6981} {"train_loss": -27.01100730895996, "global_step": 579435, "epoch": 6981} {"train_loss": -27.115924835205078, "global_step": 579436, "epoch": 6981} {"train_loss": -27.125354766845703, "global_step": 579437, "epoch": 6981} {"train_loss": -27.243696212768555, "global_step": 579438, "epoch": 6981} {"train_loss": -27.51820182800293, "global_step": 579439, "epoch": 6981} {"train_loss": -26.792938232421875, "global_step": 579440, "epoch": 6981} {"train_loss": -28.041791915893555, "global_step": 579441, "epoch": 6981} {"train_loss": -27.3074893951416, "global_step": 579442, "epoch": 6981} {"train_loss": -27.880115509033203, "global_step": 579443, "epoch": 6981} {"train_loss": -27.3690128326416, "global_step": 579444, "epoch": 6981} {"train_loss": -27.866485595703125, "global_step": 579445, "epoch": 6981} {"train_loss": -27.70599937438965, "global_step": 579446, "epoch": 6981} {"train_loss": -27.641454696655273, "global_step": 579447, "epoch": 6981} {"train_loss": -27.591114044189453, "global_step": 579448, "epoch": 6981} {"train_loss": -27.595935821533203, "global_step": 579449, "epoch": 6981} {"train_loss": -27.340524673461914, "global_step": 579450, "epoch": 6981} {"train_loss": -27.701190948486328, "global_step": 579451, "epoch": 6981} {"train_loss": -27.59673500061035, "global_step": 579452, "epoch": 6981} {"train_loss": -27.650522232055664, "global_step": 579453, "epoch": 6981} {"train_loss": -27.465473175048828, "global_step": 579454, "epoch": 6981} {"train_loss": -27.493322372436523, "global_step": 579455, "epoch": 6981} {"train_loss": -27.757709503173828, "global_step": 579456, "epoch": 6981} {"train_loss": -27.964282989501953, "global_step": 579457, "epoch": 6981} {"train_loss": -27.68548011779785, "global_step": 579458, "epoch": 6981} {"train_loss": -27.559940338134766, "global_step": 579459, "epoch": 6981} {"train_loss": -27.69246482849121, "global_step": 579460, "epoch": 6981} {"train_loss": -27.83394432067871, "global_step": 579461, "epoch": 6981} {"train_loss": -28.03480339050293, "global_step": 579462, "epoch": 6981} {"train_loss": -28.1478271484375, "global_step": 579463, "epoch": 6981} {"train_loss": -27.854019165039062, "global_step": 579464, "epoch": 6981} {"train_loss": -27.885229110717773, "global_step": 579465, "epoch": 6981} {"train_loss": -27.98248291015625, "global_step": 579466, "epoch": 6981} {"train_loss": -28.13812828063965, "global_step": 579467, "epoch": 6981} {"train_loss": -27.917896270751953, "global_step": 579468, "epoch": 6981} {"train_loss": -27.93556785583496, "global_step": 579469, "epoch": 6981} {"train_loss": -28.42754554748535, "global_step": 579470, "epoch": 6981} {"train_loss": -27.8720703125, "global_step": 579471, "epoch": 6981} {"train_loss": -28.118488311767578, "global_step": 579472, "epoch": 6981} {"train_loss": -27.85441017150879, "global_step": 579473, "epoch": 6981} {"train_loss": -28.052204132080078, "global_step": 579474, "epoch": 6981} {"train_loss": -27.992725372314453, "global_step": 579475, "epoch": 6981} {"train_loss": -28.424728393554688, "global_step": 579476, "epoch": 6981} {"train_loss": -28.01859474182129, "global_step": 579477, "epoch": 6981} {"train_loss": -28.101919174194336, "global_step": 579478, "epoch": 6981} {"train_loss": -28.19902992248535, "global_step": 579479, "epoch": 6981} {"train_loss": -28.305944442749023, "global_step": 579480, "epoch": 6981} {"train_loss": -28.20488929748535, "global_step": 579481, "epoch": 6981} {"train_loss": -28.116790771484375, "global_step": 579482, "epoch": 6981} {"train_loss": -27.893461227416992, "global_step": 579483, "epoch": 6981} {"train_loss": -27.92096519470215, "global_step": 579484, "epoch": 6981} {"train_loss": -28.309326171875, "global_step": 579485, "epoch": 6981} {"train_loss": -27.981525421142578, "global_step": 579486, "epoch": 6981} {"train_loss": -27.90752601623535, "global_step": 579487, "epoch": 6981} {"train_loss": -27.443286895751953, "global_step": 579488, "epoch": 6981} {"train_loss": -27.343626022338867, "global_step": 579489, "epoch": 6981} {"train_loss": -27.96878433227539, "global_step": 579490, "epoch": 6981} {"train_loss": -27.902292251586914, "global_step": 579491, "epoch": 6981} {"train_loss": -27.8746395111084, "global_step": 579492, "epoch": 6981} {"train_loss": -27.74114418029785, "global_step": 579493, "epoch": 6981} {"train_loss": -27.62006950378418, "global_step": 579494, "epoch": 6981} {"train_loss": -28.345285415649414, "global_step": 579495, "epoch": 6981} {"train_loss": -27.76749610900879, "global_step": 579496, "epoch": 6981} {"train_loss": -27.68511390686035, "global_step": 579497, "epoch": 6981} {"train_loss": -27.69595718383789, "global_step": 579498, "epoch": 6981} {"train_loss": -27.529417037963867, "global_step": 579499, "epoch": 6981} {"train_loss": -28.08725929260254, "global_step": 579500, "epoch": 6981} {"train_loss": -27.68488121032715, "global_step": 579501, "epoch": 6981} {"train_loss": -27.0804500579834, "global_step": 579502, "epoch": 6981} {"train_loss": -27.46573829650879, "global_step": 579503, "epoch": 6981} {"train_loss": -27.78590965270996, "global_step": 579504, "epoch": 6981} {"train_loss": -27.682788458215185, "global_step": 579505, "epoch": 6981, "val_loss": 6577325.5} {"train_loss": -26.84027671813965, "global_step": 579506, "epoch": 6982} {"train_loss": -26.459659576416016, "global_step": 579507, "epoch": 6982} {"train_loss": -26.628950119018555, "global_step": 579508, "epoch": 6982} {"train_loss": -27.152185440063477, "global_step": 579509, "epoch": 6982} {"train_loss": -26.70842933654785, "global_step": 579510, "epoch": 6982} {"train_loss": -27.479944229125977, "global_step": 579511, "epoch": 6982} {"train_loss": -27.204833984375, "global_step": 579512, "epoch": 6982} {"train_loss": -27.344970703125, "global_step": 579513, "epoch": 6982} {"train_loss": -27.632720947265625, "global_step": 579514, "epoch": 6982} {"train_loss": -27.41367530822754, "global_step": 579515, "epoch": 6982} {"train_loss": -27.214895248413086, "global_step": 579516, "epoch": 6982} {"train_loss": -27.515506744384766, "global_step": 579517, "epoch": 6982} {"train_loss": -26.720773696899414, "global_step": 579518, "epoch": 6982} {"train_loss": -27.24371337890625, "global_step": 579519, "epoch": 6982} {"train_loss": -27.473651885986328, "global_step": 579520, "epoch": 6982} {"train_loss": -27.28828239440918, "global_step": 579521, "epoch": 6982} {"train_loss": -27.721616744995117, "global_step": 579522, "epoch": 6982} {"train_loss": -27.540897369384766, "global_step": 579523, "epoch": 6982} {"train_loss": -27.59050941467285, "global_step": 579524, "epoch": 6982} {"train_loss": -27.490339279174805, "global_step": 579525, "epoch": 6982} {"train_loss": -27.591516494750977, "global_step": 579526, "epoch": 6982} {"train_loss": -27.865705490112305, "global_step": 579527, "epoch": 6982} {"train_loss": -27.643945693969727, "global_step": 579528, "epoch": 6982} {"train_loss": -27.745166778564453, "global_step": 579529, "epoch": 6982} {"train_loss": -27.582693099975586, "global_step": 579530, "epoch": 6982} {"train_loss": -27.459753036499023, "global_step": 579531, "epoch": 6982} {"train_loss": -27.9433650970459, "global_step": 579532, "epoch": 6982} {"train_loss": -27.68887710571289, "global_step": 579533, "epoch": 6982} {"train_loss": -27.700231552124023, "global_step": 579534, "epoch": 6982} {"train_loss": -28.02113151550293, "global_step": 579535, "epoch": 6982} {"train_loss": -27.488086700439453, "global_step": 579536, "epoch": 6982} {"train_loss": -27.786853790283203, "global_step": 579537, "epoch": 6982} {"train_loss": -28.08729362487793, "global_step": 579538, "epoch": 6982} {"train_loss": -28.153858184814453, "global_step": 579539, "epoch": 6982} {"train_loss": -27.81496238708496, "global_step": 579540, "epoch": 6982} {"train_loss": -27.79889488220215, "global_step": 579541, "epoch": 6982} {"train_loss": -27.99348258972168, "global_step": 579542, "epoch": 6982} {"train_loss": -27.896772384643555, "global_step": 579543, "epoch": 6982} {"train_loss": -27.98235511779785, "global_step": 579544, "epoch": 6982} {"train_loss": -28.192907333374023, "global_step": 579545, "epoch": 6982} {"train_loss": -28.046417236328125, "global_step": 579546, "epoch": 6982} {"train_loss": -28.13422966003418, "global_step": 579547, "epoch": 6982} {"train_loss": -27.700885772705078, "global_step": 579548, "epoch": 6982} {"train_loss": -27.64153480529785, "global_step": 579549, "epoch": 6982} {"train_loss": -27.772602081298828, "global_step": 579550, "epoch": 6982} {"train_loss": -27.908533096313477, "global_step": 579551, "epoch": 6982} {"train_loss": -27.85443687438965, "global_step": 579552, "epoch": 6982} {"train_loss": -27.790973663330078, "global_step": 579553, "epoch": 6982} {"train_loss": -28.27994155883789, "global_step": 579554, "epoch": 6982} {"train_loss": -27.920263290405273, "global_step": 579555, "epoch": 6982} {"train_loss": -27.841083526611328, "global_step": 579556, "epoch": 6982} {"train_loss": -27.950891494750977, "global_step": 579557, "epoch": 6982} {"train_loss": -27.952367782592773, "global_step": 579558, "epoch": 6982} {"train_loss": -28.060806274414062, "global_step": 579559, "epoch": 6982} {"train_loss": -28.204343795776367, "global_step": 579560, "epoch": 6982} {"train_loss": -28.080854415893555, "global_step": 579561, "epoch": 6982} {"train_loss": -27.660688400268555, "global_step": 579562, "epoch": 6982} {"train_loss": -28.022220611572266, "global_step": 579563, "epoch": 6982} {"train_loss": -28.06304359436035, "global_step": 579564, "epoch": 6982} {"train_loss": -28.1268367767334, "global_step": 579565, "epoch": 6982} {"train_loss": -27.70871353149414, "global_step": 579566, "epoch": 6982} {"train_loss": -28.085987091064453, "global_step": 579567, "epoch": 6982} {"train_loss": -28.019922256469727, "global_step": 579568, "epoch": 6982} {"train_loss": -27.902790069580078, "global_step": 579569, "epoch": 6982} {"train_loss": -27.86696434020996, "global_step": 579570, "epoch": 6982} {"train_loss": -28.252431869506836, "global_step": 579571, "epoch": 6982} {"train_loss": -28.21573829650879, "global_step": 579572, "epoch": 6982} {"train_loss": -28.451868057250977, "global_step": 579573, "epoch": 6982} {"train_loss": -28.033857345581055, "global_step": 579574, "epoch": 6982} {"train_loss": -28.01071548461914, "global_step": 579575, "epoch": 6982} {"train_loss": -28.0771484375, "global_step": 579576, "epoch": 6982} {"train_loss": -27.89478874206543, "global_step": 579577, "epoch": 6982} {"train_loss": -27.968677520751953, "global_step": 579578, "epoch": 6982} {"train_loss": -28.05280113220215, "global_step": 579579, "epoch": 6982} {"train_loss": -27.649505615234375, "global_step": 579580, "epoch": 6982} {"train_loss": -28.55768394470215, "global_step": 579581, "epoch": 6982} {"train_loss": -28.17344093322754, "global_step": 579582, "epoch": 6982} {"train_loss": -28.03742790222168, "global_step": 579583, "epoch": 6982} {"train_loss": -28.075159072875977, "global_step": 579584, "epoch": 6982} {"train_loss": -28.2440242767334, "global_step": 579585, "epoch": 6982} {"train_loss": -27.855533599853516, "global_step": 579586, "epoch": 6982} {"train_loss": -27.91790199279785, "global_step": 579587, "epoch": 6982} {"train_loss": -27.778562063194183, "global_step": 579588, "epoch": 6982, "val_loss": 6536272.0} {"train_loss": -27.343463897705078, "global_step": 579589, "epoch": 6983} {"train_loss": -27.017465591430664, "global_step": 579590, "epoch": 6983} {"train_loss": -25.3149471282959, "global_step": 579591, "epoch": 6983} {"train_loss": -25.210981369018555, "global_step": 579592, "epoch": 6983} {"train_loss": -27.683242797851562, "global_step": 579593, "epoch": 6983} {"train_loss": -26.061389923095703, "global_step": 579594, "epoch": 6983} {"train_loss": -26.92583656311035, "global_step": 579595, "epoch": 6983} {"train_loss": -27.075164794921875, "global_step": 579596, "epoch": 6983} {"train_loss": -26.9436092376709, "global_step": 579597, "epoch": 6983} {"train_loss": -26.353668212890625, "global_step": 579598, "epoch": 6983} {"train_loss": -27.559656143188477, "global_step": 579599, "epoch": 6983} {"train_loss": -26.9180908203125, "global_step": 579600, "epoch": 6983} {"train_loss": -26.604841232299805, "global_step": 579601, "epoch": 6983} {"train_loss": -27.949167251586914, "global_step": 579602, "epoch": 6983} {"train_loss": -26.559070587158203, "global_step": 579603, "epoch": 6983} {"train_loss": -27.637109756469727, "global_step": 579604, "epoch": 6983} {"train_loss": -27.300418853759766, "global_step": 579605, "epoch": 6983} {"train_loss": -27.25689125061035, "global_step": 579606, "epoch": 6983} {"train_loss": -26.727243423461914, "global_step": 579607, "epoch": 6983} {"train_loss": -27.616668701171875, "global_step": 579608, "epoch": 6983} {"train_loss": -27.222776412963867, "global_step": 579609, "epoch": 6983} {"train_loss": -26.96345329284668, "global_step": 579610, "epoch": 6983} {"train_loss": -27.008039474487305, "global_step": 579611, "epoch": 6983} {"train_loss": -26.91346549987793, "global_step": 579612, "epoch": 6983} {"train_loss": -27.502099990844727, "global_step": 579613, "epoch": 6983} {"train_loss": -26.648529052734375, "global_step": 579614, "epoch": 6983} {"train_loss": -27.121417999267578, "global_step": 579615, "epoch": 6983} {"train_loss": -27.431482315063477, "global_step": 579616, "epoch": 6983} {"train_loss": -27.55669593811035, "global_step": 579617, "epoch": 6983} {"train_loss": -27.250638961791992, "global_step": 579618, "epoch": 6983} {"train_loss": -27.29499626159668, "global_step": 579619, "epoch": 6983} {"train_loss": -27.742664337158203, "global_step": 579620, "epoch": 6983} {"train_loss": -27.471242904663086, "global_step": 579621, "epoch": 6983} {"train_loss": -27.60785484313965, "global_step": 579622, "epoch": 6983} {"train_loss": -27.772418975830078, "global_step": 579623, "epoch": 6983} {"train_loss": -27.674041748046875, "global_step": 579624, "epoch": 6983} {"train_loss": -27.75563621520996, "global_step": 579625, "epoch": 6983} {"train_loss": -28.0484619140625, "global_step": 579626, "epoch": 6983} {"train_loss": -27.940465927124023, "global_step": 579627, "epoch": 6983} {"train_loss": -27.635395050048828, "global_step": 579628, "epoch": 6983} {"train_loss": -27.76944351196289, "global_step": 579629, "epoch": 6983} {"train_loss": -27.675275802612305, "global_step": 579630, "epoch": 6983} {"train_loss": -27.42914390563965, "global_step": 579631, "epoch": 6983} {"train_loss": -27.54068946838379, "global_step": 579632, "epoch": 6983} {"train_loss": -27.784509658813477, "global_step": 579633, "epoch": 6983} {"train_loss": -27.9963436126709, "global_step": 579634, "epoch": 6983} {"train_loss": -27.869333267211914, "global_step": 579635, "epoch": 6983} {"train_loss": -27.825759887695312, "global_step": 579636, "epoch": 6983} {"train_loss": -27.562158584594727, "global_step": 579637, "epoch": 6983} {"train_loss": -27.774702072143555, "global_step": 579638, "epoch": 6983} {"train_loss": -27.906400680541992, "global_step": 579639, "epoch": 6983} {"train_loss": -27.70086669921875, "global_step": 579640, "epoch": 6983} {"train_loss": -27.91745376586914, "global_step": 579641, "epoch": 6983} {"train_loss": -27.924360275268555, "global_step": 579642, "epoch": 6983} {"train_loss": -27.93269157409668, "global_step": 579643, "epoch": 6983} {"train_loss": -28.110748291015625, "global_step": 579644, "epoch": 6983} {"train_loss": -28.102460861206055, "global_step": 579645, "epoch": 6983} {"train_loss": -27.973556518554688, "global_step": 579646, "epoch": 6983} {"train_loss": -27.8387393951416, "global_step": 579647, "epoch": 6983} {"train_loss": -27.817279815673828, "global_step": 579648, "epoch": 6983} {"train_loss": -27.924474716186523, "global_step": 579649, "epoch": 6983} {"train_loss": -27.63824462890625, "global_step": 579650, "epoch": 6983} {"train_loss": -28.12179946899414, "global_step": 579651, "epoch": 6983} {"train_loss": -28.057966232299805, "global_step": 579652, "epoch": 6983} {"train_loss": -28.19232177734375, "global_step": 579653, "epoch": 6983} {"train_loss": -27.781232833862305, "global_step": 579654, "epoch": 6983} {"train_loss": -27.832447052001953, "global_step": 579655, "epoch": 6983} {"train_loss": -28.292383193969727, "global_step": 579656, "epoch": 6983} {"train_loss": -27.985315322875977, "global_step": 579657, "epoch": 6983} {"train_loss": -27.668094635009766, "global_step": 579658, "epoch": 6983} {"train_loss": -27.950973510742188, "global_step": 579659, "epoch": 6983} {"train_loss": -27.869068145751953, "global_step": 579660, "epoch": 6983} {"train_loss": -28.02880859375, "global_step": 579661, "epoch": 6983} {"train_loss": -27.918310165405273, "global_step": 579662, "epoch": 6983} {"train_loss": -28.10507583618164, "global_step": 579663, "epoch": 6983} {"train_loss": -27.9676513671875, "global_step": 579664, "epoch": 6983} {"train_loss": -28.34549331665039, "global_step": 579665, "epoch": 6983} {"train_loss": -27.98858070373535, "global_step": 579666, "epoch": 6983} {"train_loss": -27.820209503173828, "global_step": 579667, "epoch": 6983} {"train_loss": -28.153614044189453, "global_step": 579668, "epoch": 6983} {"train_loss": -28.259424209594727, "global_step": 579669, "epoch": 6983} {"train_loss": -27.931671142578125, "global_step": 579670, "epoch": 6983} {"train_loss": -27.54810183881277, "global_step": 579671, "epoch": 6983, "val_loss": 6482635.0} {"train_loss": -27.367950439453125, "global_step": 579672, "epoch": 6984} {"train_loss": -27.037412643432617, "global_step": 579673, "epoch": 6984} {"train_loss": -27.80124282836914, "global_step": 579674, "epoch": 6984} {"train_loss": -26.945837020874023, "global_step": 579675, "epoch": 6984} {"train_loss": -26.95058250427246, "global_step": 579676, "epoch": 6984} {"train_loss": -27.394317626953125, "global_step": 579677, "epoch": 6984} {"train_loss": -27.512741088867188, "global_step": 579678, "epoch": 6984} {"train_loss": -27.264562606811523, "global_step": 579679, "epoch": 6984} {"train_loss": -26.937421798706055, "global_step": 579680, "epoch": 6984} {"train_loss": -27.293949127197266, "global_step": 579681, "epoch": 6984} {"train_loss": -27.79787254333496, "global_step": 579682, "epoch": 6984} {"train_loss": -27.360681533813477, "global_step": 579683, "epoch": 6984} {"train_loss": -27.702306747436523, "global_step": 579684, "epoch": 6984} {"train_loss": -27.736948013305664, "global_step": 579685, "epoch": 6984} {"train_loss": -28.12994384765625, "global_step": 579686, "epoch": 6984} {"train_loss": -27.54245376586914, "global_step": 579687, "epoch": 6984} {"train_loss": -27.614545822143555, "global_step": 579688, "epoch": 6984} {"train_loss": -27.919601440429688, "global_step": 579689, "epoch": 6984} {"train_loss": -27.439350128173828, "global_step": 579690, "epoch": 6984} {"train_loss": -27.845361709594727, "global_step": 579691, "epoch": 6984} {"train_loss": -27.75201416015625, "global_step": 579692, "epoch": 6984} {"train_loss": -28.106775283813477, "global_step": 579693, "epoch": 6984} {"train_loss": -27.45844841003418, "global_step": 579694, "epoch": 6984} {"train_loss": -27.509626388549805, "global_step": 579695, "epoch": 6984} {"train_loss": -27.5429630279541, "global_step": 579696, "epoch": 6984} {"train_loss": -27.766782760620117, "global_step": 579697, "epoch": 6984} {"train_loss": -28.073835372924805, "global_step": 579698, "epoch": 6984} {"train_loss": -28.05866050720215, "global_step": 579699, "epoch": 6984} {"train_loss": -27.4036922454834, "global_step": 579700, "epoch": 6984} {"train_loss": -27.90915870666504, "global_step": 579701, "epoch": 6984} {"train_loss": -27.9450740814209, "global_step": 579702, "epoch": 6984} {"train_loss": -27.72999382019043, "global_step": 579703, "epoch": 6984} {"train_loss": -27.903547286987305, "global_step": 579704, "epoch": 6984} {"train_loss": -28.151336669921875, "global_step": 579705, "epoch": 6984} {"train_loss": -27.90852165222168, "global_step": 579706, "epoch": 6984} {"train_loss": -28.169097900390625, "global_step": 579707, "epoch": 6984} {"train_loss": -27.9132137298584, "global_step": 579708, "epoch": 6984} {"train_loss": -27.920856475830078, "global_step": 579709, "epoch": 6984} {"train_loss": -27.93094253540039, "global_step": 579710, "epoch": 6984} {"train_loss": -28.040771484375, "global_step": 579711, "epoch": 6984} {"train_loss": -28.015949249267578, "global_step": 579712, "epoch": 6984} {"train_loss": -27.66571044921875, "global_step": 579713, "epoch": 6984} {"train_loss": -28.077234268188477, "global_step": 579714, "epoch": 6984} {"train_loss": -28.00615882873535, "global_step": 579715, "epoch": 6984} {"train_loss": -28.109113693237305, "global_step": 579716, "epoch": 6984} {"train_loss": -27.946094512939453, "global_step": 579717, "epoch": 6984} {"train_loss": -27.878503799438477, "global_step": 579718, "epoch": 6984} {"train_loss": -27.994617462158203, "global_step": 579719, "epoch": 6984} {"train_loss": -28.117889404296875, "global_step": 579720, "epoch": 6984} {"train_loss": -28.265451431274414, "global_step": 579721, "epoch": 6984} {"train_loss": -28.119314193725586, "global_step": 579722, "epoch": 6984} {"train_loss": -27.821752548217773, "global_step": 579723, "epoch": 6984} {"train_loss": -27.972675323486328, "global_step": 579724, "epoch": 6984} {"train_loss": -27.626562118530273, "global_step": 579725, "epoch": 6984} {"train_loss": -27.91182518005371, "global_step": 579726, "epoch": 6984} {"train_loss": -28.0600528717041, "global_step": 579727, "epoch": 6984} {"train_loss": -28.216033935546875, "global_step": 579728, "epoch": 6984} {"train_loss": -28.085098266601562, "global_step": 579729, "epoch": 6984} {"train_loss": -28.243432998657227, "global_step": 579730, "epoch": 6984} {"train_loss": -28.112051010131836, "global_step": 579731, "epoch": 6984} {"train_loss": -27.997297286987305, "global_step": 579732, "epoch": 6984} {"train_loss": -28.194677352905273, "global_step": 579733, "epoch": 6984} {"train_loss": -28.080312728881836, "global_step": 579734, "epoch": 6984} {"train_loss": -28.371702194213867, "global_step": 579735, "epoch": 6984} {"train_loss": -27.884580612182617, "global_step": 579736, "epoch": 6984} {"train_loss": -28.17852210998535, "global_step": 579737, "epoch": 6984} {"train_loss": -27.835865020751953, "global_step": 579738, "epoch": 6984} {"train_loss": -27.51835060119629, "global_step": 579739, "epoch": 6984} {"train_loss": -27.5788516998291, "global_step": 579740, "epoch": 6984} {"train_loss": -27.849042892456055, "global_step": 579741, "epoch": 6984} {"train_loss": -27.929059982299805, "global_step": 579742, "epoch": 6984} {"train_loss": -27.904279708862305, "global_step": 579743, "epoch": 6984} {"train_loss": -27.585193634033203, "global_step": 579744, "epoch": 6984} {"train_loss": -27.968671798706055, "global_step": 579745, "epoch": 6984} {"train_loss": -28.012975692749023, "global_step": 579746, "epoch": 6984} {"train_loss": -27.941207885742188, "global_step": 579747, "epoch": 6984} {"train_loss": -28.134057998657227, "global_step": 579748, "epoch": 6984} {"train_loss": -28.326574325561523, "global_step": 579749, "epoch": 6984} {"train_loss": -27.913070678710938, "global_step": 579750, "epoch": 6984} {"train_loss": -27.820098876953125, "global_step": 579751, "epoch": 6984} {"train_loss": -28.061832427978516, "global_step": 579752, "epoch": 6984} {"train_loss": -27.592405319213867, "global_step": 579753, "epoch": 6984} {"train_loss": -27.831960149558192, "global_step": 579754, "epoch": 6984, "val_loss": 6530843.5} {"train_loss": -27.593326568603516, "global_step": 579755, "epoch": 6985} {"train_loss": -26.6031494140625, "global_step": 579756, "epoch": 6985} {"train_loss": -26.105871200561523, "global_step": 579757, "epoch": 6985} {"train_loss": -26.7531681060791, "global_step": 579758, "epoch": 6985} {"train_loss": -27.263654708862305, "global_step": 579759, "epoch": 6985} {"train_loss": -27.433155059814453, "global_step": 579760, "epoch": 6985} {"train_loss": -26.870386123657227, "global_step": 579761, "epoch": 6985} {"train_loss": -27.33377456665039, "global_step": 579762, "epoch": 6985} {"train_loss": -27.617252349853516, "global_step": 579763, "epoch": 6985} {"train_loss": -27.646686553955078, "global_step": 579764, "epoch": 6985} {"train_loss": -26.67255210876465, "global_step": 579765, "epoch": 6985} {"train_loss": -27.709396362304688, "global_step": 579766, "epoch": 6985} {"train_loss": -27.112913131713867, "global_step": 579767, "epoch": 6985} {"train_loss": -27.17537498474121, "global_step": 579768, "epoch": 6985} {"train_loss": -27.190942764282227, "global_step": 579769, "epoch": 6985} {"train_loss": -27.422773361206055, "global_step": 579770, "epoch": 6985} {"train_loss": -26.92046546936035, "global_step": 579771, "epoch": 6985} {"train_loss": -27.467199325561523, "global_step": 579772, "epoch": 6985} {"train_loss": -27.45290184020996, "global_step": 579773, "epoch": 6985} {"train_loss": -27.674285888671875, "global_step": 579774, "epoch": 6985} {"train_loss": -27.369504928588867, "global_step": 579775, "epoch": 6985} {"train_loss": -27.40828514099121, "global_step": 579776, "epoch": 6985} {"train_loss": -27.48541259765625, "global_step": 579777, "epoch": 6985} {"train_loss": -27.797107696533203, "global_step": 579778, "epoch": 6985} {"train_loss": -27.374881744384766, "global_step": 579779, "epoch": 6985} {"train_loss": -27.708515167236328, "global_step": 579780, "epoch": 6985} {"train_loss": -27.55356216430664, "global_step": 579781, "epoch": 6985} {"train_loss": -27.42465591430664, "global_step": 579782, "epoch": 6985} {"train_loss": -27.65301513671875, "global_step": 579783, "epoch": 6985} {"train_loss": -27.405303955078125, "global_step": 579784, "epoch": 6985} {"train_loss": -27.660144805908203, "global_step": 579785, "epoch": 6985} {"train_loss": -27.536664962768555, "global_step": 579786, "epoch": 6985} {"train_loss": -27.71701431274414, "global_step": 579787, "epoch": 6985} {"train_loss": -27.94544792175293, "global_step": 579788, "epoch": 6985} {"train_loss": -27.76825523376465, "global_step": 579789, "epoch": 6985} {"train_loss": -27.710412979125977, "global_step": 579790, "epoch": 6985} {"train_loss": -28.033416748046875, "global_step": 579791, "epoch": 6985} {"train_loss": -27.823270797729492, "global_step": 579792, "epoch": 6985} {"train_loss": -27.984195709228516, "global_step": 579793, "epoch": 6985} {"train_loss": -27.519250869750977, "global_step": 579794, "epoch": 6985} {"train_loss": -27.835596084594727, "global_step": 579795, "epoch": 6985} {"train_loss": -27.925750732421875, "global_step": 579796, "epoch": 6985} {"train_loss": -28.071670532226562, "global_step": 579797, "epoch": 6985} {"train_loss": -28.034460067749023, "global_step": 579798, "epoch": 6985} {"train_loss": -28.11337661743164, "global_step": 579799, "epoch": 6985} {"train_loss": -27.937780380249023, "global_step": 579800, "epoch": 6985} {"train_loss": -27.945051193237305, "global_step": 579801, "epoch": 6985} {"train_loss": -28.10752296447754, "global_step": 579802, "epoch": 6985} {"train_loss": -27.990758895874023, "global_step": 579803, "epoch": 6985} {"train_loss": -28.029455184936523, "global_step": 579804, "epoch": 6985} {"train_loss": -28.152118682861328, "global_step": 579805, "epoch": 6985} {"train_loss": -27.64008903503418, "global_step": 579806, "epoch": 6985} {"train_loss": -28.103174209594727, "global_step": 579807, "epoch": 6985} {"train_loss": -28.213769912719727, "global_step": 579808, "epoch": 6985} {"train_loss": -28.002302169799805, "global_step": 579809, "epoch": 6985} {"train_loss": -27.85746192932129, "global_step": 579810, "epoch": 6985} {"train_loss": -27.865697860717773, "global_step": 579811, "epoch": 6985} {"train_loss": -27.7051944732666, "global_step": 579812, "epoch": 6985} {"train_loss": -27.781179428100586, "global_step": 579813, "epoch": 6985} {"train_loss": -27.79783058166504, "global_step": 579814, "epoch": 6985} {"train_loss": -28.34051513671875, "global_step": 579815, "epoch": 6985} {"train_loss": -27.947711944580078, "global_step": 579816, "epoch": 6985} {"train_loss": -28.23438835144043, "global_step": 579817, "epoch": 6985} {"train_loss": -27.699024200439453, "global_step": 579818, "epoch": 6985} {"train_loss": -28.1563663482666, "global_step": 579819, "epoch": 6985} {"train_loss": -27.866056442260742, "global_step": 579820, "epoch": 6985} {"train_loss": -28.069849014282227, "global_step": 579821, "epoch": 6985} {"train_loss": -28.29099464416504, "global_step": 579822, "epoch": 6985} {"train_loss": -28.384042739868164, "global_step": 579823, "epoch": 6985} {"train_loss": -28.142520904541016, "global_step": 579824, "epoch": 6985} {"train_loss": -28.114850997924805, "global_step": 579825, "epoch": 6985} {"train_loss": -28.103784561157227, "global_step": 579826, "epoch": 6985} {"train_loss": -28.02789306640625, "global_step": 579827, "epoch": 6985} {"train_loss": -27.805158615112305, "global_step": 579828, "epoch": 6985} {"train_loss": -27.5548038482666, "global_step": 579829, "epoch": 6985} {"train_loss": -27.528961181640625, "global_step": 579830, "epoch": 6985} {"train_loss": -28.028675079345703, "global_step": 579831, "epoch": 6985} {"train_loss": -27.904279708862305, "global_step": 579832, "epoch": 6985} {"train_loss": -28.264423370361328, "global_step": 579833, "epoch": 6985} {"train_loss": -27.96986198425293, "global_step": 579834, "epoch": 6985} {"train_loss": -27.950775146484375, "global_step": 579835, "epoch": 6985} {"train_loss": -28.0251522064209, "global_step": 579836, "epoch": 6985} {"train_loss": -27.72023449173893, "global_step": 579837, "epoch": 6985, "val_loss": 6507366.5} {"train_loss": -27.051666259765625, "global_step": 579838, "epoch": 6986} {"train_loss": -26.450519561767578, "global_step": 579839, "epoch": 6986} {"train_loss": -27.043670654296875, "global_step": 579840, "epoch": 6986} {"train_loss": -27.010297775268555, "global_step": 579841, "epoch": 6986} {"train_loss": -27.038293838500977, "global_step": 579842, "epoch": 6986} {"train_loss": -27.28958511352539, "global_step": 579843, "epoch": 6986} {"train_loss": -27.020832061767578, "global_step": 579844, "epoch": 6986} {"train_loss": -27.45944595336914, "global_step": 579845, "epoch": 6986} {"train_loss": -26.9976863861084, "global_step": 579846, "epoch": 6986} {"train_loss": -27.232751846313477, "global_step": 579847, "epoch": 6986} {"train_loss": -27.501684188842773, "global_step": 579848, "epoch": 6986} {"train_loss": -26.884366989135742, "global_step": 579849, "epoch": 6986} {"train_loss": -27.410480499267578, "global_step": 579850, "epoch": 6986} {"train_loss": -27.825857162475586, "global_step": 579851, "epoch": 6986} {"train_loss": -27.576786041259766, "global_step": 579852, "epoch": 6986} {"train_loss": -27.232467651367188, "global_step": 579853, "epoch": 6986} {"train_loss": -27.629791259765625, "global_step": 579854, "epoch": 6986} {"train_loss": -28.0502872467041, "global_step": 579855, "epoch": 6986} {"train_loss": -27.5909423828125, "global_step": 579856, "epoch": 6986} {"train_loss": -27.764692306518555, "global_step": 579857, "epoch": 6986} {"train_loss": -27.732147216796875, "global_step": 579858, "epoch": 6986} {"train_loss": -27.88581657409668, "global_step": 579859, "epoch": 6986} {"train_loss": -27.641748428344727, "global_step": 579860, "epoch": 6986} {"train_loss": -28.02168083190918, "global_step": 579861, "epoch": 6986} {"train_loss": -27.6562442779541, "global_step": 579862, "epoch": 6986} {"train_loss": -27.877378463745117, "global_step": 579863, "epoch": 6986} {"train_loss": -27.696496963500977, "global_step": 579864, "epoch": 6986} {"train_loss": -28.3043212890625, "global_step": 579865, "epoch": 6986} {"train_loss": -27.827625274658203, "global_step": 579866, "epoch": 6986} {"train_loss": -28.16921043395996, "global_step": 579867, "epoch": 6986} {"train_loss": -28.07784080505371, "global_step": 579868, "epoch": 6986} {"train_loss": -27.62677574157715, "global_step": 579869, "epoch": 6986} {"train_loss": -28.1375789642334, "global_step": 579870, "epoch": 6986} {"train_loss": -28.27280044555664, "global_step": 579871, "epoch": 6986} {"train_loss": -27.918792724609375, "global_step": 579872, "epoch": 6986} {"train_loss": -27.798547744750977, "global_step": 579873, "epoch": 6986} {"train_loss": -27.794330596923828, "global_step": 579874, "epoch": 6986} {"train_loss": -28.402753829956055, "global_step": 579875, "epoch": 6986} {"train_loss": -27.873193740844727, "global_step": 579876, "epoch": 6986} {"train_loss": -27.65915870666504, "global_step": 579877, "epoch": 6986} {"train_loss": -27.40473747253418, "global_step": 579878, "epoch": 6986} {"train_loss": -27.884836196899414, "global_step": 579879, "epoch": 6986} {"train_loss": -28.115497589111328, "global_step": 579880, "epoch": 6986} {"train_loss": -27.881601333618164, "global_step": 579881, "epoch": 6986} {"train_loss": -27.885061264038086, "global_step": 579882, "epoch": 6986} {"train_loss": -27.502180099487305, "global_step": 579883, "epoch": 6986} {"train_loss": -27.56220817565918, "global_step": 579884, "epoch": 6986} {"train_loss": -28.269775390625, "global_step": 579885, "epoch": 6986} {"train_loss": -27.93965721130371, "global_step": 579886, "epoch": 6986} {"train_loss": -27.580656051635742, "global_step": 579887, "epoch": 6986} {"train_loss": -28.106088638305664, "global_step": 579888, "epoch": 6986} {"train_loss": -27.896203994750977, "global_step": 579889, "epoch": 6986} {"train_loss": -27.664941787719727, "global_step": 579890, "epoch": 6986} {"train_loss": -27.97802734375, "global_step": 579891, "epoch": 6986} {"train_loss": -27.61565589904785, "global_step": 579892, "epoch": 6986} {"train_loss": -28.102575302124023, "global_step": 579893, "epoch": 6986} {"train_loss": -27.995502471923828, "global_step": 579894, "epoch": 6986} {"train_loss": -27.82840919494629, "global_step": 579895, "epoch": 6986} {"train_loss": -27.565515518188477, "global_step": 579896, "epoch": 6986} {"train_loss": -28.20521354675293, "global_step": 579897, "epoch": 6986} {"train_loss": -28.348737716674805, "global_step": 579898, "epoch": 6986} {"train_loss": -28.09285545349121, "global_step": 579899, "epoch": 6986} {"train_loss": -28.037073135375977, "global_step": 579900, "epoch": 6986} {"train_loss": -27.928150177001953, "global_step": 579901, "epoch": 6986} {"train_loss": -28.0166072845459, "global_step": 579902, "epoch": 6986} {"train_loss": -28.153827667236328, "global_step": 579903, "epoch": 6986} {"train_loss": -28.177215576171875, "global_step": 579904, "epoch": 6986} {"train_loss": -28.216323852539062, "global_step": 579905, "epoch": 6986} {"train_loss": -28.326251983642578, "global_step": 579906, "epoch": 6986} {"train_loss": -28.008193969726562, "global_step": 579907, "epoch": 6986} {"train_loss": -28.139453887939453, "global_step": 579908, "epoch": 6986} {"train_loss": -27.901636123657227, "global_step": 579909, "epoch": 6986} {"train_loss": -28.377851486206055, "global_step": 579910, "epoch": 6986} {"train_loss": -27.82925796508789, "global_step": 579911, "epoch": 6986} {"train_loss": -28.50434684753418, "global_step": 579912, "epoch": 6986} {"train_loss": -28.223337173461914, "global_step": 579913, "epoch": 6986} {"train_loss": -27.956918716430664, "global_step": 579914, "epoch": 6986} {"train_loss": -28.12236976623535, "global_step": 579915, "epoch": 6986} {"train_loss": -27.561969757080078, "global_step": 579916, "epoch": 6986} {"train_loss": -27.767303466796875, "global_step": 579917, "epoch": 6986} {"train_loss": -27.813505172729492, "global_step": 579918, "epoch": 6986} {"train_loss": -28.4671630859375, "global_step": 579919, "epoch": 6986} {"train_loss": -27.810790624963232, "global_step": 579920, "epoch": 6986, "val_loss": 6542277.5} {"train_loss": -27.912633895874023, "global_step": 579921, "epoch": 6987} {"train_loss": -27.871402740478516, "global_step": 579922, "epoch": 6987} {"train_loss": -27.715478897094727, "global_step": 579923, "epoch": 6987} {"train_loss": -27.567108154296875, "global_step": 579924, "epoch": 6987} {"train_loss": -27.564184188842773, "global_step": 579925, "epoch": 6987} {"train_loss": -27.7828369140625, "global_step": 579926, "epoch": 6987} {"train_loss": -27.433454513549805, "global_step": 579927, "epoch": 6987} {"train_loss": -27.35218620300293, "global_step": 579928, "epoch": 6987} {"train_loss": -27.371076583862305, "global_step": 579929, "epoch": 6987} {"train_loss": -26.9952392578125, "global_step": 579930, "epoch": 6987} {"train_loss": -27.58563804626465, "global_step": 579931, "epoch": 6987} {"train_loss": -27.708099365234375, "global_step": 579932, "epoch": 6987} {"train_loss": -27.331314086914062, "global_step": 579933, "epoch": 6987} {"train_loss": -27.390777587890625, "global_step": 579934, "epoch": 6987} {"train_loss": -27.60145378112793, "global_step": 579935, "epoch": 6987} {"train_loss": -27.291013717651367, "global_step": 579936, "epoch": 6987} {"train_loss": -27.809513092041016, "global_step": 579937, "epoch": 6987} {"train_loss": -27.397375106811523, "global_step": 579938, "epoch": 6987} {"train_loss": -27.837316513061523, "global_step": 579939, "epoch": 6987} {"train_loss": -27.645963668823242, "global_step": 579940, "epoch": 6987} {"train_loss": -27.464160919189453, "global_step": 579941, "epoch": 6987} {"train_loss": -27.6693172454834, "global_step": 579942, "epoch": 6987} {"train_loss": -27.61516761779785, "global_step": 579943, "epoch": 6987} {"train_loss": -28.156574249267578, "global_step": 579944, "epoch": 6987} {"train_loss": -27.896076202392578, "global_step": 579945, "epoch": 6987} {"train_loss": -27.571714401245117, "global_step": 579946, "epoch": 6987} {"train_loss": -27.853498458862305, "global_step": 579947, "epoch": 6987} {"train_loss": -28.12665367126465, "global_step": 579948, "epoch": 6987} {"train_loss": -28.22230339050293, "global_step": 579949, "epoch": 6987} {"train_loss": -27.756677627563477, "global_step": 579950, "epoch": 6987} {"train_loss": -27.748144149780273, "global_step": 579951, "epoch": 6987} {"train_loss": -28.2123966217041, "global_step": 579952, "epoch": 6987} {"train_loss": -28.146427154541016, "global_step": 579953, "epoch": 6987} {"train_loss": -27.681676864624023, "global_step": 579954, "epoch": 6987} {"train_loss": -28.293994903564453, "global_step": 579955, "epoch": 6987} {"train_loss": -27.82916259765625, "global_step": 579956, "epoch": 6987} {"train_loss": -27.909894943237305, "global_step": 579957, "epoch": 6987} {"train_loss": -27.78962516784668, "global_step": 579958, "epoch": 6987} {"train_loss": -28.17694664001465, "global_step": 579959, "epoch": 6987} {"train_loss": -27.731109619140625, "global_step": 579960, "epoch": 6987} {"train_loss": -28.18787956237793, "global_step": 579961, "epoch": 6987} {"train_loss": -27.656768798828125, "global_step": 579962, "epoch": 6987} {"train_loss": -27.88498306274414, "global_step": 579963, "epoch": 6987} {"train_loss": -28.11610984802246, "global_step": 579964, "epoch": 6987} {"train_loss": -27.862323760986328, "global_step": 579965, "epoch": 6987} {"train_loss": -28.26897621154785, "global_step": 579966, "epoch": 6987} {"train_loss": -28.23211669921875, "global_step": 579967, "epoch": 6987} {"train_loss": -28.482587814331055, "global_step": 579968, "epoch": 6987} {"train_loss": -28.094953536987305, "global_step": 579969, "epoch": 6987} {"train_loss": -27.85809326171875, "global_step": 579970, "epoch": 6987} {"train_loss": -27.98764419555664, "global_step": 579971, "epoch": 6987} {"train_loss": -28.107290267944336, "global_step": 579972, "epoch": 6987} {"train_loss": -28.398019790649414, "global_step": 579973, "epoch": 6987} {"train_loss": -27.544153213500977, "global_step": 579974, "epoch": 6987} {"train_loss": -28.035425186157227, "global_step": 579975, "epoch": 6987} {"train_loss": -27.849853515625, "global_step": 579976, "epoch": 6987} {"train_loss": -27.9571533203125, "global_step": 579977, "epoch": 6987} {"train_loss": -27.689167022705078, "global_step": 579978, "epoch": 6987} {"train_loss": -27.35894203186035, "global_step": 579979, "epoch": 6987} {"train_loss": -27.6302490234375, "global_step": 579980, "epoch": 6987} {"train_loss": -27.809823989868164, "global_step": 579981, "epoch": 6987} {"train_loss": -27.603235244750977, "global_step": 579982, "epoch": 6987} {"train_loss": -27.95387077331543, "global_step": 579983, "epoch": 6987} {"train_loss": -27.968236923217773, "global_step": 579984, "epoch": 6987} {"train_loss": -27.874242782592773, "global_step": 579985, "epoch": 6987} {"train_loss": -27.7165584564209, "global_step": 579986, "epoch": 6987} {"train_loss": -27.6427059173584, "global_step": 579987, "epoch": 6987} {"train_loss": -27.923206329345703, "global_step": 579988, "epoch": 6987} {"train_loss": -28.386754989624023, "global_step": 579989, "epoch": 6987} {"train_loss": -27.796628952026367, "global_step": 579990, "epoch": 6987} {"train_loss": -27.944116592407227, "global_step": 579991, "epoch": 6987} {"train_loss": -28.014490127563477, "global_step": 579992, "epoch": 6987} {"train_loss": -27.968963623046875, "global_step": 579993, "epoch": 6987} {"train_loss": -27.850492477416992, "global_step": 579994, "epoch": 6987} {"train_loss": -27.978412628173828, "global_step": 579995, "epoch": 6987} {"train_loss": -28.001317977905273, "global_step": 579996, "epoch": 6987} {"train_loss": -28.28214454650879, "global_step": 579997, "epoch": 6987} {"train_loss": -27.91048240661621, "global_step": 579998, "epoch": 6987} {"train_loss": -27.922510147094727, "global_step": 579999, "epoch": 6987} {"train_loss": -28.117034912109375, "global_step": 580000, "epoch": 6987} {"train_loss": -27.707752227783203, "global_step": 580001, "epoch": 6987} {"train_loss": -28.17450523376465, "global_step": 580002, "epoch": 6987} {"train_loss": -27.845375750438276, "global_step": 580003, "epoch": 6987, "val_loss": 6532247.5} {"train_loss": -27.721099853515625, "global_step": 580004, "epoch": 6988} {"train_loss": -28.0081844329834, "global_step": 580005, "epoch": 6988} {"train_loss": -27.16351890563965, "global_step": 580006, "epoch": 6988} {"train_loss": -27.267974853515625, "global_step": 580007, "epoch": 6988} {"train_loss": -27.33783531188965, "global_step": 580008, "epoch": 6988} {"train_loss": -27.5518798828125, "global_step": 580009, "epoch": 6988} {"train_loss": -27.187768936157227, "global_step": 580010, "epoch": 6988} {"train_loss": -27.01607322692871, "global_step": 580011, "epoch": 6988} {"train_loss": -26.891223907470703, "global_step": 580012, "epoch": 6988} {"train_loss": -27.468305587768555, "global_step": 580013, "epoch": 6988} {"train_loss": -26.415027618408203, "global_step": 580014, "epoch": 6988} {"train_loss": -26.59377098083496, "global_step": 580015, "epoch": 6988} {"train_loss": -27.57379150390625, "global_step": 580016, "epoch": 6988} {"train_loss": -27.128509521484375, "global_step": 580017, "epoch": 6988} {"train_loss": -27.374252319335938, "global_step": 580018, "epoch": 6988} {"train_loss": -27.084394454956055, "global_step": 580019, "epoch": 6988} {"train_loss": -27.378942489624023, "global_step": 580020, "epoch": 6988} {"train_loss": -27.644330978393555, "global_step": 580021, "epoch": 6988} {"train_loss": -27.304601669311523, "global_step": 580022, "epoch": 6988} {"train_loss": -27.760950088500977, "global_step": 580023, "epoch": 6988} {"train_loss": -27.330175399780273, "global_step": 580024, "epoch": 6988} {"train_loss": -27.530628204345703, "global_step": 580025, "epoch": 6988} {"train_loss": -27.75433349609375, "global_step": 580026, "epoch": 6988} {"train_loss": -27.853179931640625, "global_step": 580027, "epoch": 6988} {"train_loss": -27.8162784576416, "global_step": 580028, "epoch": 6988} {"train_loss": -27.7982234954834, "global_step": 580029, "epoch": 6988} {"train_loss": -27.698312759399414, "global_step": 580030, "epoch": 6988} {"train_loss": -27.501983642578125, "global_step": 580031, "epoch": 6988} {"train_loss": -27.6143741607666, "global_step": 580032, "epoch": 6988} {"train_loss": -27.840057373046875, "global_step": 580033, "epoch": 6988} {"train_loss": -27.962610244750977, "global_step": 580034, "epoch": 6988} {"train_loss": -27.956424713134766, "global_step": 580035, "epoch": 6988} {"train_loss": -27.687604904174805, "global_step": 580036, "epoch": 6988} {"train_loss": -27.937768936157227, "global_step": 580037, "epoch": 6988} {"train_loss": -27.602142333984375, "global_step": 580038, "epoch": 6988} {"train_loss": -27.87489891052246, "global_step": 580039, "epoch": 6988} {"train_loss": -27.542346954345703, "global_step": 580040, "epoch": 6988} {"train_loss": -28.280202865600586, "global_step": 580041, "epoch": 6988} {"train_loss": -27.511032104492188, "global_step": 580042, "epoch": 6988} {"train_loss": -27.744617462158203, "global_step": 580043, "epoch": 6988} {"train_loss": -28.00634765625, "global_step": 580044, "epoch": 6988} {"train_loss": -27.862035751342773, "global_step": 580045, "epoch": 6988} {"train_loss": -28.025182723999023, "global_step": 580046, "epoch": 6988} {"train_loss": -27.98953628540039, "global_step": 580047, "epoch": 6988} {"train_loss": -28.354345321655273, "global_step": 580048, "epoch": 6988} {"train_loss": -27.866241455078125, "global_step": 580049, "epoch": 6988} {"train_loss": -28.05196189880371, "global_step": 580050, "epoch": 6988} {"train_loss": -27.799509048461914, "global_step": 580051, "epoch": 6988} {"train_loss": -28.09712028503418, "global_step": 580052, "epoch": 6988} {"train_loss": -28.337629318237305, "global_step": 580053, "epoch": 6988} {"train_loss": -28.729053497314453, "global_step": 580054, "epoch": 6988} {"train_loss": -28.075885772705078, "global_step": 580055, "epoch": 6988} {"train_loss": -28.20590591430664, "global_step": 580056, "epoch": 6988} {"train_loss": -27.868423461914062, "global_step": 580057, "epoch": 6988} {"train_loss": -28.372243881225586, "global_step": 580058, "epoch": 6988} {"train_loss": -27.872940063476562, "global_step": 580059, "epoch": 6988} {"train_loss": -27.91107749938965, "global_step": 580060, "epoch": 6988} {"train_loss": -27.763334274291992, "global_step": 580061, "epoch": 6988} {"train_loss": -27.520416259765625, "global_step": 580062, "epoch": 6988} {"train_loss": -27.31715202331543, "global_step": 580063, "epoch": 6988} {"train_loss": -27.173664093017578, "global_step": 580064, "epoch": 6988} {"train_loss": -27.579431533813477, "global_step": 580065, "epoch": 6988} {"train_loss": -28.003772735595703, "global_step": 580066, "epoch": 6988} {"train_loss": -28.08284568786621, "global_step": 580067, "epoch": 6988} {"train_loss": -27.776575088500977, "global_step": 580068, "epoch": 6988} {"train_loss": -27.8143310546875, "global_step": 580069, "epoch": 6988} {"train_loss": -27.996484756469727, "global_step": 580070, "epoch": 6988} {"train_loss": -28.14885902404785, "global_step": 580071, "epoch": 6988} {"train_loss": -27.5187931060791, "global_step": 580072, "epoch": 6988} {"train_loss": -27.791915893554688, "global_step": 580073, "epoch": 6988} {"train_loss": -27.90591812133789, "global_step": 580074, "epoch": 6988} {"train_loss": -27.576581954956055, "global_step": 580075, "epoch": 6988} {"train_loss": -27.591388702392578, "global_step": 580076, "epoch": 6988} {"train_loss": -27.95990562438965, "global_step": 580077, "epoch": 6988} {"train_loss": -28.23822593688965, "global_step": 580078, "epoch": 6988} {"train_loss": -27.452468872070312, "global_step": 580079, "epoch": 6988} {"train_loss": -27.7985897064209, "global_step": 580080, "epoch": 6988} {"train_loss": -27.727706909179688, "global_step": 580081, "epoch": 6988} {"train_loss": -28.07089614868164, "global_step": 580082, "epoch": 6988} {"train_loss": -28.426687240600586, "global_step": 580083, "epoch": 6988} {"train_loss": -28.18292236328125, "global_step": 580084, "epoch": 6988} {"train_loss": -28.069217681884766, "global_step": 580085, "epoch": 6988} {"train_loss": -27.73468304829425, "global_step": 580086, "epoch": 6988, "val_loss": 6577211.0} {"train_loss": -25.367008209228516, "global_step": 580087, "epoch": 6989} {"train_loss": -26.859394073486328, "global_step": 580088, "epoch": 6989} {"train_loss": -25.712020874023438, "global_step": 580089, "epoch": 6989} {"train_loss": -26.33770179748535, "global_step": 580090, "epoch": 6989} {"train_loss": -26.87456703186035, "global_step": 580091, "epoch": 6989} {"train_loss": -26.672983169555664, "global_step": 580092, "epoch": 6989} {"train_loss": -26.803699493408203, "global_step": 580093, "epoch": 6989} {"train_loss": -26.807294845581055, "global_step": 580094, "epoch": 6989} {"train_loss": -27.055118560791016, "global_step": 580095, "epoch": 6989} {"train_loss": -26.87298583984375, "global_step": 580096, "epoch": 6989} {"train_loss": -26.832059860229492, "global_step": 580097, "epoch": 6989} {"train_loss": -27.19941520690918, "global_step": 580098, "epoch": 6989} {"train_loss": -26.955692291259766, "global_step": 580099, "epoch": 6989} {"train_loss": -27.348546981811523, "global_step": 580100, "epoch": 6989} {"train_loss": -27.251264572143555, "global_step": 580101, "epoch": 6989} {"train_loss": -27.5206356048584, "global_step": 580102, "epoch": 6989} {"train_loss": -27.175329208374023, "global_step": 580103, "epoch": 6989} {"train_loss": -27.426105499267578, "global_step": 580104, "epoch": 6989} {"train_loss": -27.495492935180664, "global_step": 580105, "epoch": 6989} {"train_loss": -27.375349044799805, "global_step": 580106, "epoch": 6989} {"train_loss": -27.34773063659668, "global_step": 580107, "epoch": 6989} {"train_loss": -27.559057235717773, "global_step": 580108, "epoch": 6989} {"train_loss": -27.4245662689209, "global_step": 580109, "epoch": 6989} {"train_loss": -27.613788604736328, "global_step": 580110, "epoch": 6989} {"train_loss": -27.622222900390625, "global_step": 580111, "epoch": 6989} {"train_loss": -27.619739532470703, "global_step": 580112, "epoch": 6989} {"train_loss": -27.852680206298828, "global_step": 580113, "epoch": 6989} {"train_loss": -27.716922760009766, "global_step": 580114, "epoch": 6989} {"train_loss": -27.575794219970703, "global_step": 580115, "epoch": 6989} {"train_loss": -27.85658836364746, "global_step": 580116, "epoch": 6989} {"train_loss": -27.496320724487305, "global_step": 580117, "epoch": 6989} {"train_loss": -27.660924911499023, "global_step": 580118, "epoch": 6989} {"train_loss": -27.2287540435791, "global_step": 580119, "epoch": 6989} {"train_loss": -27.746158599853516, "global_step": 580120, "epoch": 6989} {"train_loss": -27.153736114501953, "global_step": 580121, "epoch": 6989} {"train_loss": -27.796377182006836, "global_step": 580122, "epoch": 6989} {"train_loss": -27.681655883789062, "global_step": 580123, "epoch": 6989} {"train_loss": -27.666748046875, "global_step": 580124, "epoch": 6989} {"train_loss": -27.8967342376709, "global_step": 580125, "epoch": 6989} {"train_loss": -27.8516902923584, "global_step": 580126, "epoch": 6989} {"train_loss": -27.921600341796875, "global_step": 580127, "epoch": 6989} {"train_loss": -28.00446891784668, "global_step": 580128, "epoch": 6989} {"train_loss": -28.078201293945312, "global_step": 580129, "epoch": 6989} {"train_loss": -28.190067291259766, "global_step": 580130, "epoch": 6989} {"train_loss": -28.056501388549805, "global_step": 580131, "epoch": 6989} {"train_loss": -28.36444091796875, "global_step": 580132, "epoch": 6989} {"train_loss": -28.022480010986328, "global_step": 580133, "epoch": 6989} {"train_loss": -28.022741317749023, "global_step": 580134, "epoch": 6989} {"train_loss": -28.061567306518555, "global_step": 580135, "epoch": 6989} {"train_loss": -27.744384765625, "global_step": 580136, "epoch": 6989} {"train_loss": -27.8923282623291, "global_step": 580137, "epoch": 6989} {"train_loss": -27.99989891052246, "global_step": 580138, "epoch": 6989} {"train_loss": -27.564001083374023, "global_step": 580139, "epoch": 6989} {"train_loss": -27.554351806640625, "global_step": 580140, "epoch": 6989} {"train_loss": -27.773176193237305, "global_step": 580141, "epoch": 6989} {"train_loss": -28.2387752532959, "global_step": 580142, "epoch": 6989} {"train_loss": -28.16193962097168, "global_step": 580143, "epoch": 6989} {"train_loss": -27.994565963745117, "global_step": 580144, "epoch": 6989} {"train_loss": -28.014158248901367, "global_step": 580145, "epoch": 6989} {"train_loss": -27.988855361938477, "global_step": 580146, "epoch": 6989} {"train_loss": -28.269773483276367, "global_step": 580147, "epoch": 6989} {"train_loss": -28.049102783203125, "global_step": 580148, "epoch": 6989} {"train_loss": -28.040266036987305, "global_step": 580149, "epoch": 6989} {"train_loss": -27.99564552307129, "global_step": 580150, "epoch": 6989} {"train_loss": -27.95602798461914, "global_step": 580151, "epoch": 6989} {"train_loss": -28.34440040588379, "global_step": 580152, "epoch": 6989} {"train_loss": -28.27833366394043, "global_step": 580153, "epoch": 6989} {"train_loss": -28.3510799407959, "global_step": 580154, "epoch": 6989} {"train_loss": -27.922773361206055, "global_step": 580155, "epoch": 6989} {"train_loss": -28.620670318603516, "global_step": 580156, "epoch": 6989} {"train_loss": -28.15569496154785, "global_step": 580157, "epoch": 6989} {"train_loss": -28.481704711914062, "global_step": 580158, "epoch": 6989} {"train_loss": -28.39546775817871, "global_step": 580159, "epoch": 6989} {"train_loss": -27.849201202392578, "global_step": 580160, "epoch": 6989} {"train_loss": -28.24053382873535, "global_step": 580161, "epoch": 6989} {"train_loss": -27.90435218811035, "global_step": 580162, "epoch": 6989} {"train_loss": -27.765043258666992, "global_step": 580163, "epoch": 6989} {"train_loss": -27.892841339111328, "global_step": 580164, "epoch": 6989} {"train_loss": -28.074451446533203, "global_step": 580165, "epoch": 6989} {"train_loss": -27.919992446899414, "global_step": 580166, "epoch": 6989} {"train_loss": -27.7137393951416, "global_step": 580167, "epoch": 6989} {"train_loss": -27.769775390625, "global_step": 580168, "epoch": 6989} {"train_loss": -27.662023130669652, "global_step": 580169, "epoch": 6989, "val_loss": 6502358.0} {"train_loss": -27.79856300354004, "global_step": 580170, "epoch": 6990} {"train_loss": -27.097360610961914, "global_step": 580171, "epoch": 6990} {"train_loss": -27.45794677734375, "global_step": 580172, "epoch": 6990} {"train_loss": -27.36701011657715, "global_step": 580173, "epoch": 6990} {"train_loss": -27.771530151367188, "global_step": 580174, "epoch": 6990} {"train_loss": -27.583515167236328, "global_step": 580175, "epoch": 6990} {"train_loss": -27.392993927001953, "global_step": 580176, "epoch": 6990} {"train_loss": -27.408374786376953, "global_step": 580177, "epoch": 6990} {"train_loss": -27.803363800048828, "global_step": 580178, "epoch": 6990} {"train_loss": -27.569005966186523, "global_step": 580179, "epoch": 6990} {"train_loss": -27.859216690063477, "global_step": 580180, "epoch": 6990} {"train_loss": -27.43141746520996, "global_step": 580181, "epoch": 6990} {"train_loss": -27.35824966430664, "global_step": 580182, "epoch": 6990} {"train_loss": -27.30500602722168, "global_step": 580183, "epoch": 6990} {"train_loss": -27.626379013061523, "global_step": 580184, "epoch": 6990} {"train_loss": -27.832990646362305, "global_step": 580185, "epoch": 6990} {"train_loss": -27.347686767578125, "global_step": 580186, "epoch": 6990} {"train_loss": -27.522069931030273, "global_step": 580187, "epoch": 6990} {"train_loss": -27.48785972595215, "global_step": 580188, "epoch": 6990} {"train_loss": -27.8822021484375, "global_step": 580189, "epoch": 6990} {"train_loss": -27.920917510986328, "global_step": 580190, "epoch": 6990} {"train_loss": -27.95591163635254, "global_step": 580191, "epoch": 6990} {"train_loss": -27.551313400268555, "global_step": 580192, "epoch": 6990} {"train_loss": -27.757904052734375, "global_step": 580193, "epoch": 6990} {"train_loss": -27.971649169921875, "global_step": 580194, "epoch": 6990} {"train_loss": -27.79932975769043, "global_step": 580195, "epoch": 6990} {"train_loss": -27.74822998046875, "global_step": 580196, "epoch": 6990} {"train_loss": -27.723485946655273, "global_step": 580197, "epoch": 6990} {"train_loss": -27.9792537689209, "global_step": 580198, "epoch": 6990} {"train_loss": -27.6185359954834, "global_step": 580199, "epoch": 6990} {"train_loss": -27.90618324279785, "global_step": 580200, "epoch": 6990} {"train_loss": -27.718494415283203, "global_step": 580201, "epoch": 6990} {"train_loss": -27.81507682800293, "global_step": 580202, "epoch": 6990} {"train_loss": -27.960773468017578, "global_step": 580203, "epoch": 6990} {"train_loss": -27.988666534423828, "global_step": 580204, "epoch": 6990} {"train_loss": -28.006406784057617, "global_step": 580205, "epoch": 6990} {"train_loss": -27.86030387878418, "global_step": 580206, "epoch": 6990} {"train_loss": -28.033191680908203, "global_step": 580207, "epoch": 6990} {"train_loss": -28.224531173706055, "global_step": 580208, "epoch": 6990} {"train_loss": -28.15117835998535, "global_step": 580209, "epoch": 6990} {"train_loss": -28.252960205078125, "global_step": 580210, "epoch": 6990} {"train_loss": -27.627561569213867, "global_step": 580211, "epoch": 6990} {"train_loss": -27.860849380493164, "global_step": 580212, "epoch": 6990} {"train_loss": -28.127979278564453, "global_step": 580213, "epoch": 6990} {"train_loss": -28.22857093811035, "global_step": 580214, "epoch": 6990} {"train_loss": -27.959686279296875, "global_step": 580215, "epoch": 6990} {"train_loss": -28.094968795776367, "global_step": 580216, "epoch": 6990} {"train_loss": -28.31951332092285, "global_step": 580217, "epoch": 6990} {"train_loss": -27.643035888671875, "global_step": 580218, "epoch": 6990} {"train_loss": -27.82331657409668, "global_step": 580219, "epoch": 6990} {"train_loss": -27.110015869140625, "global_step": 580220, "epoch": 6990} {"train_loss": -27.453046798706055, "global_step": 580221, "epoch": 6990} {"train_loss": -27.970478057861328, "global_step": 580222, "epoch": 6990} {"train_loss": -28.04376792907715, "global_step": 580223, "epoch": 6990} {"train_loss": -27.14686393737793, "global_step": 580224, "epoch": 6990} {"train_loss": -27.462507247924805, "global_step": 580225, "epoch": 6990} {"train_loss": -27.435144424438477, "global_step": 580226, "epoch": 6990} {"train_loss": -27.59735107421875, "global_step": 580227, "epoch": 6990} {"train_loss": -27.673297882080078, "global_step": 580228, "epoch": 6990} {"train_loss": -27.174474716186523, "global_step": 580229, "epoch": 6990} {"train_loss": -27.35931968688965, "global_step": 580230, "epoch": 6990} {"train_loss": -27.657926559448242, "global_step": 580231, "epoch": 6990} {"train_loss": -27.5145320892334, "global_step": 580232, "epoch": 6990} {"train_loss": -27.703079223632812, "global_step": 580233, "epoch": 6990} {"train_loss": -27.650922775268555, "global_step": 580234, "epoch": 6990} {"train_loss": -27.721027374267578, "global_step": 580235, "epoch": 6990} {"train_loss": -27.912220001220703, "global_step": 580236, "epoch": 6990} {"train_loss": -27.287851333618164, "global_step": 580237, "epoch": 6990} {"train_loss": -27.882211685180664, "global_step": 580238, "epoch": 6990} {"train_loss": -27.504507064819336, "global_step": 580239, "epoch": 6990} {"train_loss": -27.79083251953125, "global_step": 580240, "epoch": 6990} {"train_loss": -27.554128646850586, "global_step": 580241, "epoch": 6990} {"train_loss": -27.908111572265625, "global_step": 580242, "epoch": 6990} {"train_loss": -27.482091903686523, "global_step": 580243, "epoch": 6990} {"train_loss": -27.412281036376953, "global_step": 580244, "epoch": 6990} {"train_loss": -27.292898178100586, "global_step": 580245, "epoch": 6990} {"train_loss": -27.71186637878418, "global_step": 580246, "epoch": 6990} {"train_loss": -27.854867935180664, "global_step": 580247, "epoch": 6990} {"train_loss": -27.899951934814453, "global_step": 580248, "epoch": 6990} {"train_loss": -27.501371383666992, "global_step": 580249, "epoch": 6990} {"train_loss": -27.878524780273438, "global_step": 580250, "epoch": 6990} {"train_loss": -27.455724716186523, "global_step": 580251, "epoch": 6990} {"train_loss": -27.70032673571483, "global_step": 580252, "epoch": 6990, "val_loss": 6538613.5} {"train_loss": -26.566442489624023, "global_step": 580253, "epoch": 6991} {"train_loss": -27.048063278198242, "global_step": 580254, "epoch": 6991} {"train_loss": -27.609357833862305, "global_step": 580255, "epoch": 6991} {"train_loss": -27.106054306030273, "global_step": 580256, "epoch": 6991} {"train_loss": -27.37061882019043, "global_step": 580257, "epoch": 6991} {"train_loss": -27.462738037109375, "global_step": 580258, "epoch": 6991} {"train_loss": -27.515302658081055, "global_step": 580259, "epoch": 6991} {"train_loss": -27.354337692260742, "global_step": 580260, "epoch": 6991} {"train_loss": -27.465137481689453, "global_step": 580261, "epoch": 6991} {"train_loss": -27.449453353881836, "global_step": 580262, "epoch": 6991} {"train_loss": -27.678760528564453, "global_step": 580263, "epoch": 6991} {"train_loss": -27.624670028686523, "global_step": 580264, "epoch": 6991} {"train_loss": -27.530866622924805, "global_step": 580265, "epoch": 6991} {"train_loss": -27.746612548828125, "global_step": 580266, "epoch": 6991} {"train_loss": -27.557464599609375, "global_step": 580267, "epoch": 6991} {"train_loss": -27.44059181213379, "global_step": 580268, "epoch": 6991} {"train_loss": -28.076465606689453, "global_step": 580269, "epoch": 6991} {"train_loss": -27.7978515625, "global_step": 580270, "epoch": 6991} {"train_loss": -27.718164443969727, "global_step": 580271, "epoch": 6991} {"train_loss": -28.161218643188477, "global_step": 580272, "epoch": 6991} {"train_loss": -27.8958683013916, "global_step": 580273, "epoch": 6991} {"train_loss": -27.76004409790039, "global_step": 580274, "epoch": 6991} {"train_loss": -27.970083236694336, "global_step": 580275, "epoch": 6991} {"train_loss": -27.9409236907959, "global_step": 580276, "epoch": 6991} {"train_loss": -27.58429527282715, "global_step": 580277, "epoch": 6991} {"train_loss": -27.81504249572754, "global_step": 580278, "epoch": 6991} {"train_loss": -27.624927520751953, "global_step": 580279, "epoch": 6991} {"train_loss": -27.977697372436523, "global_step": 580280, "epoch": 6991} {"train_loss": -27.82843017578125, "global_step": 580281, "epoch": 6991} {"train_loss": -27.983936309814453, "global_step": 580282, "epoch": 6991} {"train_loss": -28.0168514251709, "global_step": 580283, "epoch": 6991} {"train_loss": -27.612567901611328, "global_step": 580284, "epoch": 6991} {"train_loss": -28.2200870513916, "global_step": 580285, "epoch": 6991} {"train_loss": -27.90986442565918, "global_step": 580286, "epoch": 6991} {"train_loss": -27.88791275024414, "global_step": 580287, "epoch": 6991} {"train_loss": -27.975194931030273, "global_step": 580288, "epoch": 6991} {"train_loss": -27.805118560791016, "global_step": 580289, "epoch": 6991} {"train_loss": -28.634078979492188, "global_step": 580290, "epoch": 6991} {"train_loss": -28.078916549682617, "global_step": 580291, "epoch": 6991} {"train_loss": -27.674665451049805, "global_step": 580292, "epoch": 6991} {"train_loss": -27.791799545288086, "global_step": 580293, "epoch": 6991} {"train_loss": -28.2501220703125, "global_step": 580294, "epoch": 6991} {"train_loss": -27.7724552154541, "global_step": 580295, "epoch": 6991} {"train_loss": -27.701269149780273, "global_step": 580296, "epoch": 6991} {"train_loss": -28.000385284423828, "global_step": 580297, "epoch": 6991} {"train_loss": -28.25408363342285, "global_step": 580298, "epoch": 6991} {"train_loss": -27.334522247314453, "global_step": 580299, "epoch": 6991} {"train_loss": -27.691205978393555, "global_step": 580300, "epoch": 6991} {"train_loss": -28.270721435546875, "global_step": 580301, "epoch": 6991} {"train_loss": -28.12871742248535, "global_step": 580302, "epoch": 6991} {"train_loss": -28.274658203125, "global_step": 580303, "epoch": 6991} {"train_loss": -28.112960815429688, "global_step": 580304, "epoch": 6991} {"train_loss": -27.95954704284668, "global_step": 580305, "epoch": 6991} {"train_loss": -28.059961318969727, "global_step": 580306, "epoch": 6991} {"train_loss": -27.69447898864746, "global_step": 580307, "epoch": 6991} {"train_loss": -27.97857666015625, "global_step": 580308, "epoch": 6991} {"train_loss": -27.9982967376709, "global_step": 580309, "epoch": 6991} {"train_loss": -27.44966697692871, "global_step": 580310, "epoch": 6991} {"train_loss": -27.181119918823242, "global_step": 580311, "epoch": 6991} {"train_loss": -26.633575439453125, "global_step": 580312, "epoch": 6991} {"train_loss": -26.751251220703125, "global_step": 580313, "epoch": 6991} {"train_loss": -27.63373374938965, "global_step": 580314, "epoch": 6991} {"train_loss": -28.23737144470215, "global_step": 580315, "epoch": 6991} {"train_loss": -27.717212677001953, "global_step": 580316, "epoch": 6991} {"train_loss": -28.402429580688477, "global_step": 580317, "epoch": 6991} {"train_loss": -27.710224151611328, "global_step": 580318, "epoch": 6991} {"train_loss": -28.32795524597168, "global_step": 580319, "epoch": 6991} {"train_loss": -27.724273681640625, "global_step": 580320, "epoch": 6991} {"train_loss": -27.357080459594727, "global_step": 580321, "epoch": 6991} {"train_loss": -28.295429229736328, "global_step": 580322, "epoch": 6991} {"train_loss": -27.729406356811523, "global_step": 580323, "epoch": 6991} {"train_loss": -27.9296875, "global_step": 580324, "epoch": 6991} {"train_loss": -28.06278419494629, "global_step": 580325, "epoch": 6991} {"train_loss": -28.137847900390625, "global_step": 580326, "epoch": 6991} {"train_loss": -27.762924194335938, "global_step": 580327, "epoch": 6991} {"train_loss": -27.91486167907715, "global_step": 580328, "epoch": 6991} {"train_loss": -27.892377853393555, "global_step": 580329, "epoch": 6991} {"train_loss": -27.84937858581543, "global_step": 580330, "epoch": 6991} {"train_loss": -28.127471923828125, "global_step": 580331, "epoch": 6991} {"train_loss": -28.163925170898438, "global_step": 580332, "epoch": 6991} {"train_loss": -27.82215690612793, "global_step": 580333, "epoch": 6991} {"train_loss": -28.086353302001953, "global_step": 580334, "epoch": 6991} {"train_loss": -27.781944343842657, "global_step": 580335, "epoch": 6991, "val_loss": 6516030.5} {"train_loss": -27.774906158447266, "global_step": 580336, "epoch": 6992} {"train_loss": -27.60175895690918, "global_step": 580337, "epoch": 6992} {"train_loss": -27.926084518432617, "global_step": 580338, "epoch": 6992} {"train_loss": -27.140024185180664, "global_step": 580339, "epoch": 6992} {"train_loss": -27.853940963745117, "global_step": 580340, "epoch": 6992} {"train_loss": -27.803022384643555, "global_step": 580341, "epoch": 6992} {"train_loss": -27.3819522857666, "global_step": 580342, "epoch": 6992} {"train_loss": -27.4656982421875, "global_step": 580343, "epoch": 6992} {"train_loss": -27.38941764831543, "global_step": 580344, "epoch": 6992} {"train_loss": -27.711261749267578, "global_step": 580345, "epoch": 6992} {"train_loss": -27.926061630249023, "global_step": 580346, "epoch": 6992} {"train_loss": -27.4337215423584, "global_step": 580347, "epoch": 6992} {"train_loss": -27.504846572875977, "global_step": 580348, "epoch": 6992} {"train_loss": -27.66620445251465, "global_step": 580349, "epoch": 6992} {"train_loss": -27.687942504882812, "global_step": 580350, "epoch": 6992} {"train_loss": -28.060697555541992, "global_step": 580351, "epoch": 6992} {"train_loss": -27.822589874267578, "global_step": 580352, "epoch": 6992} {"train_loss": -28.112104415893555, "global_step": 580353, "epoch": 6992} {"train_loss": -27.335844039916992, "global_step": 580354, "epoch": 6992} {"train_loss": -27.264972686767578, "global_step": 580355, "epoch": 6992} {"train_loss": -27.785236358642578, "global_step": 580356, "epoch": 6992} {"train_loss": -27.738637924194336, "global_step": 580357, "epoch": 6992} {"train_loss": -27.80852699279785, "global_step": 580358, "epoch": 6992} {"train_loss": -27.61114501953125, "global_step": 580359, "epoch": 6992} {"train_loss": -27.71723747253418, "global_step": 580360, "epoch": 6992} {"train_loss": -27.946176528930664, "global_step": 580361, "epoch": 6992} {"train_loss": -27.773054122924805, "global_step": 580362, "epoch": 6992} {"train_loss": -28.2263126373291, "global_step": 580363, "epoch": 6992} {"train_loss": -27.86895179748535, "global_step": 580364, "epoch": 6992} {"train_loss": -27.82508659362793, "global_step": 580365, "epoch": 6992} {"train_loss": -27.766620635986328, "global_step": 580366, "epoch": 6992} {"train_loss": -27.8206787109375, "global_step": 580367, "epoch": 6992} {"train_loss": -28.07940673828125, "global_step": 580368, "epoch": 6992} {"train_loss": -28.180749893188477, "global_step": 580369, "epoch": 6992} {"train_loss": -27.79205322265625, "global_step": 580370, "epoch": 6992} {"train_loss": -27.53313636779785, "global_step": 580371, "epoch": 6992} {"train_loss": -27.53765296936035, "global_step": 580372, "epoch": 6992} {"train_loss": -27.670007705688477, "global_step": 580373, "epoch": 6992} {"train_loss": -28.36248207092285, "global_step": 580374, "epoch": 6992} {"train_loss": -28.027130126953125, "global_step": 580375, "epoch": 6992} {"train_loss": -28.240610122680664, "global_step": 580376, "epoch": 6992} {"train_loss": -27.986988067626953, "global_step": 580377, "epoch": 6992} {"train_loss": -28.129566192626953, "global_step": 580378, "epoch": 6992} {"train_loss": -27.945409774780273, "global_step": 580379, "epoch": 6992} {"train_loss": -28.105350494384766, "global_step": 580380, "epoch": 6992} {"train_loss": -28.081628799438477, "global_step": 580381, "epoch": 6992} {"train_loss": -27.855453491210938, "global_step": 580382, "epoch": 6992} {"train_loss": -28.034149169921875, "global_step": 580383, "epoch": 6992} {"train_loss": -27.911069869995117, "global_step": 580384, "epoch": 6992} {"train_loss": -27.880512237548828, "global_step": 580385, "epoch": 6992} {"train_loss": -28.161096572875977, "global_step": 580386, "epoch": 6992} {"train_loss": -27.917211532592773, "global_step": 580387, "epoch": 6992} {"train_loss": -27.66204833984375, "global_step": 580388, "epoch": 6992} {"train_loss": -28.229230880737305, "global_step": 580389, "epoch": 6992} {"train_loss": -27.94611930847168, "global_step": 580390, "epoch": 6992} {"train_loss": -27.620849609375, "global_step": 580391, "epoch": 6992} {"train_loss": -27.634510040283203, "global_step": 580392, "epoch": 6992} {"train_loss": -27.532489776611328, "global_step": 580393, "epoch": 6992} {"train_loss": -27.852399826049805, "global_step": 580394, "epoch": 6992} {"train_loss": -27.37746238708496, "global_step": 580395, "epoch": 6992} {"train_loss": -27.296039581298828, "global_step": 580396, "epoch": 6992} {"train_loss": -27.510013580322266, "global_step": 580397, "epoch": 6992} {"train_loss": -27.796491622924805, "global_step": 580398, "epoch": 6992} {"train_loss": -27.376691818237305, "global_step": 580399, "epoch": 6992} {"train_loss": -27.554401397705078, "global_step": 580400, "epoch": 6992} {"train_loss": -27.74251365661621, "global_step": 580401, "epoch": 6992} {"train_loss": -27.624530792236328, "global_step": 580402, "epoch": 6992} {"train_loss": -28.107831954956055, "global_step": 580403, "epoch": 6992} {"train_loss": -27.76152992248535, "global_step": 580404, "epoch": 6992} {"train_loss": -27.831632614135742, "global_step": 580405, "epoch": 6992} {"train_loss": -27.891571044921875, "global_step": 580406, "epoch": 6992} {"train_loss": -27.771169662475586, "global_step": 580407, "epoch": 6992} {"train_loss": -27.66532325744629, "global_step": 580408, "epoch": 6992} {"train_loss": -28.128498077392578, "global_step": 580409, "epoch": 6992} {"train_loss": -27.968475341796875, "global_step": 580410, "epoch": 6992} {"train_loss": -27.890018463134766, "global_step": 580411, "epoch": 6992} {"train_loss": -27.80097007751465, "global_step": 580412, "epoch": 6992} {"train_loss": -27.681411743164062, "global_step": 580413, "epoch": 6992} {"train_loss": -27.8488712310791, "global_step": 580414, "epoch": 6992} {"train_loss": -27.832433700561523, "global_step": 580415, "epoch": 6992} {"train_loss": -28.22353172302246, "global_step": 580416, "epoch": 6992} {"train_loss": -28.223392486572266, "global_step": 580417, "epoch": 6992} {"train_loss": -27.801566204392767, "global_step": 580418, "epoch": 6992, "val_loss": 6400819.5} {"train_loss": -25.678735733032227, "global_step": 580419, "epoch": 6993} {"train_loss": -25.573383331298828, "global_step": 580420, "epoch": 6993} {"train_loss": -27.1259822845459, "global_step": 580421, "epoch": 6993} {"train_loss": -25.960500717163086, "global_step": 580422, "epoch": 6993} {"train_loss": -26.550561904907227, "global_step": 580423, "epoch": 6993} {"train_loss": -26.944839477539062, "global_step": 580424, "epoch": 6993} {"train_loss": -25.84869384765625, "global_step": 580425, "epoch": 6993} {"train_loss": -26.64385986328125, "global_step": 580426, "epoch": 6993} {"train_loss": -26.897632598876953, "global_step": 580427, "epoch": 6993} {"train_loss": -26.646146774291992, "global_step": 580428, "epoch": 6993} {"train_loss": -27.01002311706543, "global_step": 580429, "epoch": 6993} {"train_loss": -27.18744468688965, "global_step": 580430, "epoch": 6993} {"train_loss": -26.828266143798828, "global_step": 580431, "epoch": 6993} {"train_loss": -27.050628662109375, "global_step": 580432, "epoch": 6993} {"train_loss": -27.01849937438965, "global_step": 580433, "epoch": 6993} {"train_loss": -27.220121383666992, "global_step": 580434, "epoch": 6993} {"train_loss": -27.253324508666992, "global_step": 580435, "epoch": 6993} {"train_loss": -27.752838134765625, "global_step": 580436, "epoch": 6993} {"train_loss": -27.274526596069336, "global_step": 580437, "epoch": 6993} {"train_loss": -27.390838623046875, "global_step": 580438, "epoch": 6993} {"train_loss": -27.737531661987305, "global_step": 580439, "epoch": 6993} {"train_loss": -27.202077865600586, "global_step": 580440, "epoch": 6993} {"train_loss": -27.290449142456055, "global_step": 580441, "epoch": 6993} {"train_loss": -27.4220027923584, "global_step": 580442, "epoch": 6993} {"train_loss": -27.395864486694336, "global_step": 580443, "epoch": 6993} {"train_loss": -27.601337432861328, "global_step": 580444, "epoch": 6993} {"train_loss": -27.35707664489746, "global_step": 580445, "epoch": 6993} {"train_loss": -27.4118595123291, "global_step": 580446, "epoch": 6993} {"train_loss": -27.44805335998535, "global_step": 580447, "epoch": 6993} {"train_loss": -27.7746639251709, "global_step": 580448, "epoch": 6993} {"train_loss": -27.447961807250977, "global_step": 580449, "epoch": 6993} {"train_loss": -27.733732223510742, "global_step": 580450, "epoch": 6993} {"train_loss": -27.952802658081055, "global_step": 580451, "epoch": 6993} {"train_loss": -27.2392635345459, "global_step": 580452, "epoch": 6993} {"train_loss": -27.950057983398438, "global_step": 580453, "epoch": 6993} {"train_loss": -27.72150993347168, "global_step": 580454, "epoch": 6993} {"train_loss": -27.600561141967773, "global_step": 580455, "epoch": 6993} {"train_loss": -27.636987686157227, "global_step": 580456, "epoch": 6993} {"train_loss": -27.66815757751465, "global_step": 580457, "epoch": 6993} {"train_loss": -27.647607803344727, "global_step": 580458, "epoch": 6993} {"train_loss": -27.578901290893555, "global_step": 580459, "epoch": 6993} {"train_loss": -27.6708984375, "global_step": 580460, "epoch": 6993} {"train_loss": -28.01117515563965, "global_step": 580461, "epoch": 6993} {"train_loss": -27.803131103515625, "global_step": 580462, "epoch": 6993} {"train_loss": -27.74344253540039, "global_step": 580463, "epoch": 6993} {"train_loss": -28.208271026611328, "global_step": 580464, "epoch": 6993} {"train_loss": -27.991891860961914, "global_step": 580465, "epoch": 6993} {"train_loss": -27.741735458374023, "global_step": 580466, "epoch": 6993} {"train_loss": -27.759693145751953, "global_step": 580467, "epoch": 6993} {"train_loss": -28.20210075378418, "global_step": 580468, "epoch": 6993} {"train_loss": -27.820425033569336, "global_step": 580469, "epoch": 6993} {"train_loss": -28.37336540222168, "global_step": 580470, "epoch": 6993} {"train_loss": -27.8708438873291, "global_step": 580471, "epoch": 6993} {"train_loss": -28.311548233032227, "global_step": 580472, "epoch": 6993} {"train_loss": -28.2648983001709, "global_step": 580473, "epoch": 6993} {"train_loss": -27.9948787689209, "global_step": 580474, "epoch": 6993} {"train_loss": -27.854461669921875, "global_step": 580475, "epoch": 6993} {"train_loss": -27.99677085876465, "global_step": 580476, "epoch": 6993} {"train_loss": -27.811399459838867, "global_step": 580477, "epoch": 6993} {"train_loss": -27.92702293395996, "global_step": 580478, "epoch": 6993} {"train_loss": -27.687829971313477, "global_step": 580479, "epoch": 6993} {"train_loss": -27.89109230041504, "global_step": 580480, "epoch": 6993} {"train_loss": -28.0328426361084, "global_step": 580481, "epoch": 6993} {"train_loss": -28.35908317565918, "global_step": 580482, "epoch": 6993} {"train_loss": -27.993513107299805, "global_step": 580483, "epoch": 6993} {"train_loss": -28.101856231689453, "global_step": 580484, "epoch": 6993} {"train_loss": -27.638158798217773, "global_step": 580485, "epoch": 6993} {"train_loss": -27.7668514251709, "global_step": 580486, "epoch": 6993} {"train_loss": -27.8869686126709, "global_step": 580487, "epoch": 6993} {"train_loss": -28.05095863342285, "global_step": 580488, "epoch": 6993} {"train_loss": -28.086179733276367, "global_step": 580489, "epoch": 6993} {"train_loss": -28.155263900756836, "global_step": 580490, "epoch": 6993} {"train_loss": -28.12244987487793, "global_step": 580491, "epoch": 6993} {"train_loss": -28.078052520751953, "global_step": 580492, "epoch": 6993} {"train_loss": -28.27570152282715, "global_step": 580493, "epoch": 6993} {"train_loss": -28.088586807250977, "global_step": 580494, "epoch": 6993} {"train_loss": -27.745941162109375, "global_step": 580495, "epoch": 6993} {"train_loss": -27.908926010131836, "global_step": 580496, "epoch": 6993} {"train_loss": -27.885650634765625, "global_step": 580497, "epoch": 6993} {"train_loss": -28.122480392456055, "global_step": 580498, "epoch": 6993} {"train_loss": -27.87109375, "global_step": 580499, "epoch": 6993} {"train_loss": -27.913040161132812, "global_step": 580500, "epoch": 6993} {"train_loss": -27.58672160412892, "global_step": 580501, "epoch": 6993, "val_loss": 6475803.0} {"train_loss": -27.07014274597168, "global_step": 580502, "epoch": 6994} {"train_loss": -26.7623291015625, "global_step": 580503, "epoch": 6994} {"train_loss": -26.967870712280273, "global_step": 580504, "epoch": 6994} {"train_loss": -27.443716049194336, "global_step": 580505, "epoch": 6994} {"train_loss": -26.80350112915039, "global_step": 580506, "epoch": 6994} {"train_loss": -26.620731353759766, "global_step": 580507, "epoch": 6994} {"train_loss": -27.55276870727539, "global_step": 580508, "epoch": 6994} {"train_loss": -27.147790908813477, "global_step": 580509, "epoch": 6994} {"train_loss": -27.195068359375, "global_step": 580510, "epoch": 6994} {"train_loss": -27.473052978515625, "global_step": 580511, "epoch": 6994} {"train_loss": -27.530597686767578, "global_step": 580512, "epoch": 6994} {"train_loss": -27.48823356628418, "global_step": 580513, "epoch": 6994} {"train_loss": -27.051685333251953, "global_step": 580514, "epoch": 6994} {"train_loss": -27.445037841796875, "global_step": 580515, "epoch": 6994} {"train_loss": -27.607248306274414, "global_step": 580516, "epoch": 6994} {"train_loss": -27.477741241455078, "global_step": 580517, "epoch": 6994} {"train_loss": -28.06963539123535, "global_step": 580518, "epoch": 6994} {"train_loss": -27.240833282470703, "global_step": 580519, "epoch": 6994} {"train_loss": -27.937469482421875, "global_step": 580520, "epoch": 6994} {"train_loss": -27.511646270751953, "global_step": 580521, "epoch": 6994} {"train_loss": -27.449756622314453, "global_step": 580522, "epoch": 6994} {"train_loss": -27.654224395751953, "global_step": 580523, "epoch": 6994} {"train_loss": -27.64754295349121, "global_step": 580524, "epoch": 6994} {"train_loss": -28.062009811401367, "global_step": 580525, "epoch": 6994} {"train_loss": -27.870746612548828, "global_step": 580526, "epoch": 6994} {"train_loss": -27.88728141784668, "global_step": 580527, "epoch": 6994} {"train_loss": -27.82990837097168, "global_step": 580528, "epoch": 6994} {"train_loss": -28.21945571899414, "global_step": 580529, "epoch": 6994} {"train_loss": -27.81678581237793, "global_step": 580530, "epoch": 6994} {"train_loss": -27.839696884155273, "global_step": 580531, "epoch": 6994} {"train_loss": -27.926044464111328, "global_step": 580532, "epoch": 6994} {"train_loss": -27.8855037689209, "global_step": 580533, "epoch": 6994} {"train_loss": -27.889938354492188, "global_step": 580534, "epoch": 6994} {"train_loss": -27.58148765563965, "global_step": 580535, "epoch": 6994} {"train_loss": -27.981781005859375, "global_step": 580536, "epoch": 6994} {"train_loss": -28.287750244140625, "global_step": 580537, "epoch": 6994} {"train_loss": -28.11614418029785, "global_step": 580538, "epoch": 6994} {"train_loss": -27.800048828125, "global_step": 580539, "epoch": 6994} {"train_loss": -27.867237091064453, "global_step": 580540, "epoch": 6994} {"train_loss": -28.29841423034668, "global_step": 580541, "epoch": 6994} {"train_loss": -28.443525314331055, "global_step": 580542, "epoch": 6994} {"train_loss": -28.252912521362305, "global_step": 580543, "epoch": 6994} {"train_loss": -28.314910888671875, "global_step": 580544, "epoch": 6994} {"train_loss": -28.12005615234375, "global_step": 580545, "epoch": 6994} {"train_loss": -28.113351821899414, "global_step": 580546, "epoch": 6994} {"train_loss": -27.848276138305664, "global_step": 580547, "epoch": 6994} {"train_loss": -28.239892959594727, "global_step": 580548, "epoch": 6994} {"train_loss": -28.067575454711914, "global_step": 580549, "epoch": 6994} {"train_loss": -28.06696128845215, "global_step": 580550, "epoch": 6994} {"train_loss": -28.228742599487305, "global_step": 580551, "epoch": 6994} {"train_loss": -28.099761962890625, "global_step": 580552, "epoch": 6994} {"train_loss": -27.71492576599121, "global_step": 580553, "epoch": 6994} {"train_loss": -28.17157554626465, "global_step": 580554, "epoch": 6994} {"train_loss": -28.24454689025879, "global_step": 580555, "epoch": 6994} {"train_loss": -27.879947662353516, "global_step": 580556, "epoch": 6994} {"train_loss": -28.094812393188477, "global_step": 580557, "epoch": 6994} {"train_loss": -27.722768783569336, "global_step": 580558, "epoch": 6994} {"train_loss": -27.244705200195312, "global_step": 580559, "epoch": 6994} {"train_loss": -27.459735870361328, "global_step": 580560, "epoch": 6994} {"train_loss": -27.64393424987793, "global_step": 580561, "epoch": 6994} {"train_loss": -27.546920776367188, "global_step": 580562, "epoch": 6994} {"train_loss": -27.925256729125977, "global_step": 580563, "epoch": 6994} {"train_loss": -27.595457077026367, "global_step": 580564, "epoch": 6994} {"train_loss": -27.842763900756836, "global_step": 580565, "epoch": 6994} {"train_loss": -27.47869300842285, "global_step": 580566, "epoch": 6994} {"train_loss": -27.294708251953125, "global_step": 580567, "epoch": 6994} {"train_loss": -27.66690444946289, "global_step": 580568, "epoch": 6994} {"train_loss": -27.564741134643555, "global_step": 580569, "epoch": 6994} {"train_loss": -27.587324142456055, "global_step": 580570, "epoch": 6994} {"train_loss": -28.11917495727539, "global_step": 580571, "epoch": 6994} {"train_loss": -27.9281063079834, "global_step": 580572, "epoch": 6994} {"train_loss": -27.897815704345703, "global_step": 580573, "epoch": 6994} {"train_loss": -28.116840362548828, "global_step": 580574, "epoch": 6994} {"train_loss": -28.039602279663086, "global_step": 580575, "epoch": 6994} {"train_loss": -27.875593185424805, "global_step": 580576, "epoch": 6994} {"train_loss": -27.890756607055664, "global_step": 580577, "epoch": 6994} {"train_loss": -27.8873348236084, "global_step": 580578, "epoch": 6994} {"train_loss": -27.770627975463867, "global_step": 580579, "epoch": 6994} {"train_loss": -27.780424118041992, "global_step": 580580, "epoch": 6994} {"train_loss": -28.07135009765625, "global_step": 580581, "epoch": 6994} {"train_loss": -28.038145065307617, "global_step": 580582, "epoch": 6994} {"train_loss": -28.112720489501953, "global_step": 580583, "epoch": 6994} {"train_loss": -27.746037402784967, "global_step": 580584, "epoch": 6994, "val_loss": 6440901.0} {"train_loss": -27.985727310180664, "global_step": 580585, "epoch": 6995} {"train_loss": -27.345901489257812, "global_step": 580586, "epoch": 6995} {"train_loss": -27.85943603515625, "global_step": 580587, "epoch": 6995} {"train_loss": -27.687803268432617, "global_step": 580588, "epoch": 6995} {"train_loss": -27.453351974487305, "global_step": 580589, "epoch": 6995} {"train_loss": -27.32928466796875, "global_step": 580590, "epoch": 6995} {"train_loss": -27.8026065826416, "global_step": 580591, "epoch": 6995} {"train_loss": -27.37079429626465, "global_step": 580592, "epoch": 6995} {"train_loss": -27.23451042175293, "global_step": 580593, "epoch": 6995} {"train_loss": -27.66843032836914, "global_step": 580594, "epoch": 6995} {"train_loss": -27.759733200073242, "global_step": 580595, "epoch": 6995} {"train_loss": -27.358381271362305, "global_step": 580596, "epoch": 6995} {"train_loss": -26.835058212280273, "global_step": 580597, "epoch": 6995} {"train_loss": -27.62981605529785, "global_step": 580598, "epoch": 6995} {"train_loss": -27.446584701538086, "global_step": 580599, "epoch": 6995} {"train_loss": -27.836328506469727, "global_step": 580600, "epoch": 6995} {"train_loss": -27.8604679107666, "global_step": 580601, "epoch": 6995} {"train_loss": -27.5425968170166, "global_step": 580602, "epoch": 6995} {"train_loss": -27.118322372436523, "global_step": 580603, "epoch": 6995} {"train_loss": -27.560712814331055, "global_step": 580604, "epoch": 6995} {"train_loss": -27.821619033813477, "global_step": 580605, "epoch": 6995} {"train_loss": -27.530242919921875, "global_step": 580606, "epoch": 6995} {"train_loss": -27.323928833007812, "global_step": 580607, "epoch": 6995} {"train_loss": -27.47013282775879, "global_step": 580608, "epoch": 6995} {"train_loss": -27.594257354736328, "global_step": 580609, "epoch": 6995} {"train_loss": -28.0994930267334, "global_step": 580610, "epoch": 6995} {"train_loss": -27.6522274017334, "global_step": 580611, "epoch": 6995} {"train_loss": -27.912439346313477, "global_step": 580612, "epoch": 6995} {"train_loss": -28.043004989624023, "global_step": 580613, "epoch": 6995} {"train_loss": -27.66961669921875, "global_step": 580614, "epoch": 6995} {"train_loss": -27.509668350219727, "global_step": 580615, "epoch": 6995} {"train_loss": -27.767972946166992, "global_step": 580616, "epoch": 6995} {"train_loss": -28.010656356811523, "global_step": 580617, "epoch": 6995} {"train_loss": -28.029111862182617, "global_step": 580618, "epoch": 6995} {"train_loss": -28.058948516845703, "global_step": 580619, "epoch": 6995} {"train_loss": -27.99003028869629, "global_step": 580620, "epoch": 6995} {"train_loss": -27.616724014282227, "global_step": 580621, "epoch": 6995} {"train_loss": -27.871109008789062, "global_step": 580622, "epoch": 6995} {"train_loss": -27.941940307617188, "global_step": 580623, "epoch": 6995} {"train_loss": -28.1997013092041, "global_step": 580624, "epoch": 6995} {"train_loss": -27.928319931030273, "global_step": 580625, "epoch": 6995} {"train_loss": -28.463682174682617, "global_step": 580626, "epoch": 6995} {"train_loss": -28.247528076171875, "global_step": 580627, "epoch": 6995} {"train_loss": -28.059553146362305, "global_step": 580628, "epoch": 6995} {"train_loss": -28.03291893005371, "global_step": 580629, "epoch": 6995} {"train_loss": -27.86036491394043, "global_step": 580630, "epoch": 6995} {"train_loss": -27.790205001831055, "global_step": 580631, "epoch": 6995} {"train_loss": -27.81354331970215, "global_step": 580632, "epoch": 6995} {"train_loss": -27.890920639038086, "global_step": 580633, "epoch": 6995} {"train_loss": -27.091156005859375, "global_step": 580634, "epoch": 6995} {"train_loss": -26.411392211914062, "global_step": 580635, "epoch": 6995} {"train_loss": -26.172210693359375, "global_step": 580636, "epoch": 6995} {"train_loss": -27.255414962768555, "global_step": 580637, "epoch": 6995} {"train_loss": -26.8258113861084, "global_step": 580638, "epoch": 6995} {"train_loss": -26.733570098876953, "global_step": 580639, "epoch": 6995} {"train_loss": -26.55255126953125, "global_step": 580640, "epoch": 6995} {"train_loss": -27.180017471313477, "global_step": 580641, "epoch": 6995} {"train_loss": -27.428333282470703, "global_step": 580642, "epoch": 6995} {"train_loss": -27.8110408782959, "global_step": 580643, "epoch": 6995} {"train_loss": -27.443359375, "global_step": 580644, "epoch": 6995} {"train_loss": -27.690509796142578, "global_step": 580645, "epoch": 6995} {"train_loss": -27.430057525634766, "global_step": 580646, "epoch": 6995} {"train_loss": -27.558149337768555, "global_step": 580647, "epoch": 6995} {"train_loss": -27.83234977722168, "global_step": 580648, "epoch": 6995} {"train_loss": -27.94707679748535, "global_step": 580649, "epoch": 6995} {"train_loss": -27.530475616455078, "global_step": 580650, "epoch": 6995} {"train_loss": -27.356525421142578, "global_step": 580651, "epoch": 6995} {"train_loss": -27.408954620361328, "global_step": 580652, "epoch": 6995} {"train_loss": -28.149572372436523, "global_step": 580653, "epoch": 6995} {"train_loss": -27.465377807617188, "global_step": 580654, "epoch": 6995} {"train_loss": -27.728574752807617, "global_step": 580655, "epoch": 6995} {"train_loss": -27.439420700073242, "global_step": 580656, "epoch": 6995} {"train_loss": -27.92486572265625, "global_step": 580657, "epoch": 6995} {"train_loss": -27.86065673828125, "global_step": 580658, "epoch": 6995} {"train_loss": -28.128589630126953, "global_step": 580659, "epoch": 6995} {"train_loss": -28.101682662963867, "global_step": 580660, "epoch": 6995} {"train_loss": -27.561878204345703, "global_step": 580661, "epoch": 6995} {"train_loss": -27.99776268005371, "global_step": 580662, "epoch": 6995} {"train_loss": -27.94695472717285, "global_step": 580663, "epoch": 6995} {"train_loss": -28.248502731323242, "global_step": 580664, "epoch": 6995} {"train_loss": -27.729902267456055, "global_step": 580665, "epoch": 6995} {"train_loss": -27.622114181518555, "global_step": 580666, "epoch": 6995} {"train_loss": -27.638378832713666, "global_step": 580667, "epoch": 6995, "val_loss": 6423837.5} {"train_loss": -27.340473175048828, "global_step": 580668, "epoch": 6996} {"train_loss": -27.650888442993164, "global_step": 580669, "epoch": 6996} {"train_loss": -26.935993194580078, "global_step": 580670, "epoch": 6996} {"train_loss": -27.569849014282227, "global_step": 580671, "epoch": 6996} {"train_loss": -27.1575870513916, "global_step": 580672, "epoch": 6996} {"train_loss": -27.564420700073242, "global_step": 580673, "epoch": 6996} {"train_loss": -27.454334259033203, "global_step": 580674, "epoch": 6996} {"train_loss": -27.290327072143555, "global_step": 580675, "epoch": 6996} {"train_loss": -27.359094619750977, "global_step": 580676, "epoch": 6996} {"train_loss": -27.418811798095703, "global_step": 580677, "epoch": 6996} {"train_loss": -27.45305824279785, "global_step": 580678, "epoch": 6996} {"train_loss": -27.52081871032715, "global_step": 580679, "epoch": 6996} {"train_loss": -27.559473037719727, "global_step": 580680, "epoch": 6996} {"train_loss": -27.717010498046875, "global_step": 580681, "epoch": 6996} {"train_loss": -28.094165802001953, "global_step": 580682, "epoch": 6996} {"train_loss": -27.33039665222168, "global_step": 580683, "epoch": 6996} {"train_loss": -27.722808837890625, "global_step": 580684, "epoch": 6996} {"train_loss": -27.981794357299805, "global_step": 580685, "epoch": 6996} {"train_loss": -27.88494873046875, "global_step": 580686, "epoch": 6996} {"train_loss": -27.937604904174805, "global_step": 580687, "epoch": 6996} {"train_loss": -28.07660484313965, "global_step": 580688, "epoch": 6996} {"train_loss": -27.565128326416016, "global_step": 580689, "epoch": 6996} {"train_loss": -27.880237579345703, "global_step": 580690, "epoch": 6996} {"train_loss": -28.04860496520996, "global_step": 580691, "epoch": 6996} {"train_loss": -27.95081901550293, "global_step": 580692, "epoch": 6996} {"train_loss": -27.987951278686523, "global_step": 580693, "epoch": 6996} {"train_loss": -27.830183029174805, "global_step": 580694, "epoch": 6996} {"train_loss": -27.922718048095703, "global_step": 580695, "epoch": 6996} {"train_loss": -27.84814453125, "global_step": 580696, "epoch": 6996} {"train_loss": -27.724821090698242, "global_step": 580697, "epoch": 6996} {"train_loss": -28.098865509033203, "global_step": 580698, "epoch": 6996} {"train_loss": -28.12325096130371, "global_step": 580699, "epoch": 6996} {"train_loss": -28.3253173828125, "global_step": 580700, "epoch": 6996} {"train_loss": -27.981489181518555, "global_step": 580701, "epoch": 6996} {"train_loss": -28.192350387573242, "global_step": 580702, "epoch": 6996} {"train_loss": -27.465686798095703, "global_step": 580703, "epoch": 6996} {"train_loss": -27.96253776550293, "global_step": 580704, "epoch": 6996} {"train_loss": -28.123193740844727, "global_step": 580705, "epoch": 6996} {"train_loss": -27.551477432250977, "global_step": 580706, "epoch": 6996} {"train_loss": -27.931259155273438, "global_step": 580707, "epoch": 6996} {"train_loss": -27.988672256469727, "global_step": 580708, "epoch": 6996} {"train_loss": -28.232446670532227, "global_step": 580709, "epoch": 6996} {"train_loss": -27.874731063842773, "global_step": 580710, "epoch": 6996} {"train_loss": -27.819263458251953, "global_step": 580711, "epoch": 6996} {"train_loss": -28.554746627807617, "global_step": 580712, "epoch": 6996} {"train_loss": -28.237457275390625, "global_step": 580713, "epoch": 6996} {"train_loss": -28.041242599487305, "global_step": 580714, "epoch": 6996} {"train_loss": -28.15093994140625, "global_step": 580715, "epoch": 6996} {"train_loss": -27.84024429321289, "global_step": 580716, "epoch": 6996} {"train_loss": -27.916095733642578, "global_step": 580717, "epoch": 6996} {"train_loss": -28.102481842041016, "global_step": 580718, "epoch": 6996} {"train_loss": -28.4377498626709, "global_step": 580719, "epoch": 6996} {"train_loss": -27.8494873046875, "global_step": 580720, "epoch": 6996} {"train_loss": -28.431751251220703, "global_step": 580721, "epoch": 6996} {"train_loss": -28.14297866821289, "global_step": 580722, "epoch": 6996} {"train_loss": -28.076282501220703, "global_step": 580723, "epoch": 6996} {"train_loss": -28.217010498046875, "global_step": 580724, "epoch": 6996} {"train_loss": -28.13617515563965, "global_step": 580725, "epoch": 6996} {"train_loss": -27.68928337097168, "global_step": 580726, "epoch": 6996} {"train_loss": -28.14741325378418, "global_step": 580727, "epoch": 6996} {"train_loss": -28.346765518188477, "global_step": 580728, "epoch": 6996} {"train_loss": -28.002439498901367, "global_step": 580729, "epoch": 6996} {"train_loss": -28.013111114501953, "global_step": 580730, "epoch": 6996} {"train_loss": -27.75368309020996, "global_step": 580731, "epoch": 6996} {"train_loss": -27.9136905670166, "global_step": 580732, "epoch": 6996} {"train_loss": -27.61924171447754, "global_step": 580733, "epoch": 6996} {"train_loss": -27.715198516845703, "global_step": 580734, "epoch": 6996} {"train_loss": -27.660053253173828, "global_step": 580735, "epoch": 6996} {"train_loss": -26.776142120361328, "global_step": 580736, "epoch": 6996} {"train_loss": -27.39930534362793, "global_step": 580737, "epoch": 6996} {"train_loss": -27.717451095581055, "global_step": 580738, "epoch": 6996} {"train_loss": -27.367877960205078, "global_step": 580739, "epoch": 6996} {"train_loss": -26.92341423034668, "global_step": 580740, "epoch": 6996} {"train_loss": -27.53594398498535, "global_step": 580741, "epoch": 6996} {"train_loss": -27.441802978515625, "global_step": 580742, "epoch": 6996} {"train_loss": -27.415191650390625, "global_step": 580743, "epoch": 6996} {"train_loss": -28.048566818237305, "global_step": 580744, "epoch": 6996} {"train_loss": -27.32135009765625, "global_step": 580745, "epoch": 6996} {"train_loss": -27.500568389892578, "global_step": 580746, "epoch": 6996} {"train_loss": -27.4428768157959, "global_step": 580747, "epoch": 6996} {"train_loss": -27.848730087280273, "global_step": 580748, "epoch": 6996} {"train_loss": -27.77252769470215, "global_step": 580749, "epoch": 6996} {"train_loss": -27.81202219767743, "global_step": 580750, "epoch": 6996, "val_loss": 6532964.0} {"train_loss": -27.27064323425293, "global_step": 580751, "epoch": 6997} {"train_loss": -26.514265060424805, "global_step": 580752, "epoch": 6997} {"train_loss": -27.192371368408203, "global_step": 580753, "epoch": 6997} {"train_loss": -27.489973068237305, "global_step": 580754, "epoch": 6997} {"train_loss": -27.392135620117188, "global_step": 580755, "epoch": 6997} {"train_loss": -27.3204345703125, "global_step": 580756, "epoch": 6997} {"train_loss": -27.554410934448242, "global_step": 580757, "epoch": 6997} {"train_loss": -27.574804306030273, "global_step": 580758, "epoch": 6997} {"train_loss": -27.591100692749023, "global_step": 580759, "epoch": 6997} {"train_loss": -27.763158798217773, "global_step": 580760, "epoch": 6997} {"train_loss": -27.495620727539062, "global_step": 580761, "epoch": 6997} {"train_loss": -27.696033477783203, "global_step": 580762, "epoch": 6997} {"train_loss": -27.850500106811523, "global_step": 580763, "epoch": 6997} {"train_loss": -27.628726959228516, "global_step": 580764, "epoch": 6997} {"train_loss": -27.623151779174805, "global_step": 580765, "epoch": 6997} {"train_loss": -27.962156295776367, "global_step": 580766, "epoch": 6997} {"train_loss": -27.671741485595703, "global_step": 580767, "epoch": 6997} {"train_loss": -27.643390655517578, "global_step": 580768, "epoch": 6997} {"train_loss": -27.821191787719727, "global_step": 580769, "epoch": 6997} {"train_loss": -27.55807876586914, "global_step": 580770, "epoch": 6997} {"train_loss": -27.58070182800293, "global_step": 580771, "epoch": 6997} {"train_loss": -28.04599952697754, "global_step": 580772, "epoch": 6997} {"train_loss": -27.723249435424805, "global_step": 580773, "epoch": 6997} {"train_loss": -27.7625789642334, "global_step": 580774, "epoch": 6997} {"train_loss": -27.921039581298828, "global_step": 580775, "epoch": 6997} {"train_loss": -28.10951805114746, "global_step": 580776, "epoch": 6997} {"train_loss": -27.725513458251953, "global_step": 580777, "epoch": 6997} {"train_loss": -27.739988327026367, "global_step": 580778, "epoch": 6997} {"train_loss": -28.014570236206055, "global_step": 580779, "epoch": 6997} {"train_loss": -28.02069091796875, "global_step": 580780, "epoch": 6997} {"train_loss": -27.965362548828125, "global_step": 580781, "epoch": 6997} {"train_loss": -28.232696533203125, "global_step": 580782, "epoch": 6997} {"train_loss": -28.212249755859375, "global_step": 580783, "epoch": 6997} {"train_loss": -27.812549591064453, "global_step": 580784, "epoch": 6997} {"train_loss": -28.35099220275879, "global_step": 580785, "epoch": 6997} {"train_loss": -28.06671714782715, "global_step": 580786, "epoch": 6997} {"train_loss": -28.185317993164062, "global_step": 580787, "epoch": 6997} {"train_loss": -28.105085372924805, "global_step": 580788, "epoch": 6997} {"train_loss": -27.964380264282227, "global_step": 580789, "epoch": 6997} {"train_loss": -27.859027862548828, "global_step": 580790, "epoch": 6997} {"train_loss": -28.091489791870117, "global_step": 580791, "epoch": 6997} {"train_loss": -27.820178985595703, "global_step": 580792, "epoch": 6997} {"train_loss": -28.157068252563477, "global_step": 580793, "epoch": 6997} {"train_loss": -28.271337509155273, "global_step": 580794, "epoch": 6997} {"train_loss": -28.216999053955078, "global_step": 580795, "epoch": 6997} {"train_loss": -28.064809799194336, "global_step": 580796, "epoch": 6997} {"train_loss": -28.02650260925293, "global_step": 580797, "epoch": 6997} {"train_loss": -28.1586856842041, "global_step": 580798, "epoch": 6997} {"train_loss": -27.7246150970459, "global_step": 580799, "epoch": 6997} {"train_loss": -28.167463302612305, "global_step": 580800, "epoch": 6997} {"train_loss": -28.13037109375, "global_step": 580801, "epoch": 6997} {"train_loss": -28.152257919311523, "global_step": 580802, "epoch": 6997} {"train_loss": -28.110992431640625, "global_step": 580803, "epoch": 6997} {"train_loss": -28.193603515625, "global_step": 580804, "epoch": 6997} {"train_loss": -27.711456298828125, "global_step": 580805, "epoch": 6997} {"train_loss": -28.181791305541992, "global_step": 580806, "epoch": 6997} {"train_loss": -27.48883628845215, "global_step": 580807, "epoch": 6997} {"train_loss": -27.2401180267334, "global_step": 580808, "epoch": 6997} {"train_loss": -26.977584838867188, "global_step": 580809, "epoch": 6997} {"train_loss": -27.971118927001953, "global_step": 580810, "epoch": 6997} {"train_loss": -27.4927921295166, "global_step": 580811, "epoch": 6997} {"train_loss": -26.996570587158203, "global_step": 580812, "epoch": 6997} {"train_loss": -27.410675048828125, "global_step": 580813, "epoch": 6997} {"train_loss": -28.153417587280273, "global_step": 580814, "epoch": 6997} {"train_loss": -27.65380859375, "global_step": 580815, "epoch": 6997} {"train_loss": -27.184865951538086, "global_step": 580816, "epoch": 6997} {"train_loss": -27.715940475463867, "global_step": 580817, "epoch": 6997} {"train_loss": -27.391605377197266, "global_step": 580818, "epoch": 6997} {"train_loss": -27.758163452148438, "global_step": 580819, "epoch": 6997} {"train_loss": -27.6356258392334, "global_step": 580820, "epoch": 6997} {"train_loss": -27.6358585357666, "global_step": 580821, "epoch": 6997} {"train_loss": -27.86495018005371, "global_step": 580822, "epoch": 6997} {"train_loss": -28.152036666870117, "global_step": 580823, "epoch": 6997} {"train_loss": -27.91169548034668, "global_step": 580824, "epoch": 6997} {"train_loss": -27.770160675048828, "global_step": 580825, "epoch": 6997} {"train_loss": -27.826904296875, "global_step": 580826, "epoch": 6997} {"train_loss": -27.740741729736328, "global_step": 580827, "epoch": 6997} {"train_loss": -27.79157829284668, "global_step": 580828, "epoch": 6997} {"train_loss": -28.057159423828125, "global_step": 580829, "epoch": 6997} {"train_loss": -28.00269889831543, "global_step": 580830, "epoch": 6997} {"train_loss": -27.5762939453125, "global_step": 580831, "epoch": 6997} {"train_loss": -28.076801300048828, "global_step": 580832, "epoch": 6997} {"train_loss": -27.795298082282745, "global_step": 580833, "epoch": 6997, "val_loss": 6486364.5} {"train_loss": -27.262165069580078, "global_step": 580834, "epoch": 6998} {"train_loss": -27.470468521118164, "global_step": 580835, "epoch": 6998} {"train_loss": -27.538959503173828, "global_step": 580836, "epoch": 6998} {"train_loss": -27.622228622436523, "global_step": 580837, "epoch": 6998} {"train_loss": -27.69318199157715, "global_step": 580838, "epoch": 6998} {"train_loss": -27.605331420898438, "global_step": 580839, "epoch": 6998} {"train_loss": -27.93556022644043, "global_step": 580840, "epoch": 6998} {"train_loss": -27.4329891204834, "global_step": 580841, "epoch": 6998} {"train_loss": -26.91668701171875, "global_step": 580842, "epoch": 6998} {"train_loss": -27.977819442749023, "global_step": 580843, "epoch": 6998} {"train_loss": -27.46626091003418, "global_step": 580844, "epoch": 6998} {"train_loss": -26.74690055847168, "global_step": 580845, "epoch": 6998} {"train_loss": -27.575885772705078, "global_step": 580846, "epoch": 6998} {"train_loss": -26.808258056640625, "global_step": 580847, "epoch": 6998} {"train_loss": -27.298065185546875, "global_step": 580848, "epoch": 6998} {"train_loss": -27.064441680908203, "global_step": 580849, "epoch": 6998} {"train_loss": -27.335866928100586, "global_step": 580850, "epoch": 6998} {"train_loss": -27.080801010131836, "global_step": 580851, "epoch": 6998} {"train_loss": -27.549640655517578, "global_step": 580852, "epoch": 6998} {"train_loss": -27.63614845275879, "global_step": 580853, "epoch": 6998} {"train_loss": -27.011030197143555, "global_step": 580854, "epoch": 6998} {"train_loss": -27.214569091796875, "global_step": 580855, "epoch": 6998} {"train_loss": -27.793325424194336, "global_step": 580856, "epoch": 6998} {"train_loss": -27.110004425048828, "global_step": 580857, "epoch": 6998} {"train_loss": -27.583398818969727, "global_step": 580858, "epoch": 6998} {"train_loss": -27.702722549438477, "global_step": 580859, "epoch": 6998} {"train_loss": -27.59205436706543, "global_step": 580860, "epoch": 6998} {"train_loss": -27.696334838867188, "global_step": 580861, "epoch": 6998} {"train_loss": -27.66448402404785, "global_step": 580862, "epoch": 6998} {"train_loss": -27.8078670501709, "global_step": 580863, "epoch": 6998} {"train_loss": -27.74932861328125, "global_step": 580864, "epoch": 6998} {"train_loss": -27.44184684753418, "global_step": 580865, "epoch": 6998} {"train_loss": -27.747665405273438, "global_step": 580866, "epoch": 6998} {"train_loss": -27.619901657104492, "global_step": 580867, "epoch": 6998} {"train_loss": -27.741369247436523, "global_step": 580868, "epoch": 6998} {"train_loss": -28.0748291015625, "global_step": 580869, "epoch": 6998} {"train_loss": -27.762378692626953, "global_step": 580870, "epoch": 6998} {"train_loss": -27.514917373657227, "global_step": 580871, "epoch": 6998} {"train_loss": -28.09148597717285, "global_step": 580872, "epoch": 6998} {"train_loss": -27.802160263061523, "global_step": 580873, "epoch": 6998} {"train_loss": -27.73333168029785, "global_step": 580874, "epoch": 6998} {"train_loss": -27.666906356811523, "global_step": 580875, "epoch": 6998} {"train_loss": -27.786474227905273, "global_step": 580876, "epoch": 6998} {"train_loss": -27.708459854125977, "global_step": 580877, "epoch": 6998} {"train_loss": -27.879058837890625, "global_step": 580878, "epoch": 6998} {"train_loss": -27.645389556884766, "global_step": 580879, "epoch": 6998} {"train_loss": -28.022138595581055, "global_step": 580880, "epoch": 6998} {"train_loss": -27.52248191833496, "global_step": 580881, "epoch": 6998} {"train_loss": -27.725011825561523, "global_step": 580882, "epoch": 6998} {"train_loss": -27.750280380249023, "global_step": 580883, "epoch": 6998} {"train_loss": -27.940826416015625, "global_step": 580884, "epoch": 6998} {"train_loss": -27.96211051940918, "global_step": 580885, "epoch": 6998} {"train_loss": -27.936365127563477, "global_step": 580886, "epoch": 6998} {"train_loss": -28.342809677124023, "global_step": 580887, "epoch": 6998} {"train_loss": -27.932687759399414, "global_step": 580888, "epoch": 6998} {"train_loss": -27.9693546295166, "global_step": 580889, "epoch": 6998} {"train_loss": -28.223852157592773, "global_step": 580890, "epoch": 6998} {"train_loss": -27.975866317749023, "global_step": 580891, "epoch": 6998} {"train_loss": -28.310810089111328, "global_step": 580892, "epoch": 6998} {"train_loss": -28.095380783081055, "global_step": 580893, "epoch": 6998} {"train_loss": -27.765832901000977, "global_step": 580894, "epoch": 6998} {"train_loss": -28.1173038482666, "global_step": 580895, "epoch": 6998} {"train_loss": -28.06298828125, "global_step": 580896, "epoch": 6998} {"train_loss": -28.057493209838867, "global_step": 580897, "epoch": 6998} {"train_loss": -27.97870445251465, "global_step": 580898, "epoch": 6998} {"train_loss": -27.903064727783203, "global_step": 580899, "epoch": 6998} {"train_loss": -28.16742515563965, "global_step": 580900, "epoch": 6998} {"train_loss": -28.193607330322266, "global_step": 580901, "epoch": 6998} {"train_loss": -27.99872398376465, "global_step": 580902, "epoch": 6998} {"train_loss": -28.049213409423828, "global_step": 580903, "epoch": 6998} {"train_loss": -28.180835723876953, "global_step": 580904, "epoch": 6998} {"train_loss": -28.249286651611328, "global_step": 580905, "epoch": 6998} {"train_loss": -28.101791381835938, "global_step": 580906, "epoch": 6998} {"train_loss": -27.984296798706055, "global_step": 580907, "epoch": 6998} {"train_loss": -27.946027755737305, "global_step": 580908, "epoch": 6998} {"train_loss": -27.199481964111328, "global_step": 580909, "epoch": 6998} {"train_loss": -27.265384674072266, "global_step": 580910, "epoch": 6998} {"train_loss": -27.525390625, "global_step": 580911, "epoch": 6998} {"train_loss": -27.415821075439453, "global_step": 580912, "epoch": 6998} {"train_loss": -27.998016357421875, "global_step": 580913, "epoch": 6998} {"train_loss": -27.69525718688965, "global_step": 580914, "epoch": 6998} {"train_loss": -27.929035186767578, "global_step": 580915, "epoch": 6998} {"train_loss": -27.701286178037346, "global_step": 580916, "epoch": 6998, "val_loss": 6412250.0} {"train_loss": -27.4578857421875, "global_step": 580917, "epoch": 6999} {"train_loss": -27.26983642578125, "global_step": 580918, "epoch": 6999} {"train_loss": -27.454620361328125, "global_step": 580919, "epoch": 6999} {"train_loss": -27.28816032409668, "global_step": 580920, "epoch": 6999} {"train_loss": -26.325292587280273, "global_step": 580921, "epoch": 6999} {"train_loss": -26.47490882873535, "global_step": 580922, "epoch": 6999} {"train_loss": -28.105886459350586, "global_step": 580923, "epoch": 6999} {"train_loss": -27.14649772644043, "global_step": 580924, "epoch": 6999} {"train_loss": -27.07447624206543, "global_step": 580925, "epoch": 6999} {"train_loss": -27.568639755249023, "global_step": 580926, "epoch": 6999} {"train_loss": -27.44569206237793, "global_step": 580927, "epoch": 6999} {"train_loss": -27.582509994506836, "global_step": 580928, "epoch": 6999} {"train_loss": -27.499832153320312, "global_step": 580929, "epoch": 6999} {"train_loss": -27.23589515686035, "global_step": 580930, "epoch": 6999} {"train_loss": -27.16046142578125, "global_step": 580931, "epoch": 6999} {"train_loss": -27.67010498046875, "global_step": 580932, "epoch": 6999} {"train_loss": -27.76639175415039, "global_step": 580933, "epoch": 6999} {"train_loss": -27.279403686523438, "global_step": 580934, "epoch": 6999} {"train_loss": -27.215545654296875, "global_step": 580935, "epoch": 6999} {"train_loss": -27.639053344726562, "global_step": 580936, "epoch": 6999} {"train_loss": -27.5948486328125, "global_step": 580937, "epoch": 6999} {"train_loss": -27.86628532409668, "global_step": 580938, "epoch": 6999} {"train_loss": -27.863250732421875, "global_step": 580939, "epoch": 6999} {"train_loss": -27.71710777282715, "global_step": 580940, "epoch": 6999} {"train_loss": -27.8825626373291, "global_step": 580941, "epoch": 6999} {"train_loss": -27.670551300048828, "global_step": 580942, "epoch": 6999} {"train_loss": -27.62006187438965, "global_step": 580943, "epoch": 6999} {"train_loss": -27.330480575561523, "global_step": 580944, "epoch": 6999} {"train_loss": -28.22701072692871, "global_step": 580945, "epoch": 6999} {"train_loss": -27.585813522338867, "global_step": 580946, "epoch": 6999} {"train_loss": -27.94464111328125, "global_step": 580947, "epoch": 6999} {"train_loss": -28.07840347290039, "global_step": 580948, "epoch": 6999} {"train_loss": -27.591596603393555, "global_step": 580949, "epoch": 6999} {"train_loss": -27.673986434936523, "global_step": 580950, "epoch": 6999} {"train_loss": -27.73377799987793, "global_step": 580951, "epoch": 6999} {"train_loss": -27.717880249023438, "global_step": 580952, "epoch": 6999} {"train_loss": -27.91684913635254, "global_step": 580953, "epoch": 6999} {"train_loss": -27.78812026977539, "global_step": 580954, "epoch": 6999} {"train_loss": -27.85800552368164, "global_step": 580955, "epoch": 6999} {"train_loss": -28.296817779541016, "global_step": 580956, "epoch": 6999} {"train_loss": -27.773517608642578, "global_step": 580957, "epoch": 6999} {"train_loss": -27.664587020874023, "global_step": 580958, "epoch": 6999} {"train_loss": -27.808704376220703, "global_step": 580959, "epoch": 6999} {"train_loss": -28.00006103515625, "global_step": 580960, "epoch": 6999} {"train_loss": -27.9013614654541, "global_step": 580961, "epoch": 6999} {"train_loss": -27.963144302368164, "global_step": 580962, "epoch": 6999} {"train_loss": -27.87163734436035, "global_step": 580963, "epoch": 6999} {"train_loss": -28.450387954711914, "global_step": 580964, "epoch": 6999} {"train_loss": -27.84539794921875, "global_step": 580965, "epoch": 6999} {"train_loss": -28.24712562561035, "global_step": 580966, "epoch": 6999} {"train_loss": -27.9267520904541, "global_step": 580967, "epoch": 6999} {"train_loss": -28.260513305664062, "global_step": 580968, "epoch": 6999} {"train_loss": -28.29136085510254, "global_step": 580969, "epoch": 6999} {"train_loss": -28.329120635986328, "global_step": 580970, "epoch": 6999} {"train_loss": -28.095571517944336, "global_step": 580971, "epoch": 6999} {"train_loss": -27.891193389892578, "global_step": 580972, "epoch": 6999} {"train_loss": -28.115585327148438, "global_step": 580973, "epoch": 6999} {"train_loss": -28.213470458984375, "global_step": 580974, "epoch": 6999} {"train_loss": -28.237401962280273, "global_step": 580975, "epoch": 6999} {"train_loss": -28.255828857421875, "global_step": 580976, "epoch": 6999} {"train_loss": -27.889448165893555, "global_step": 580977, "epoch": 6999} {"train_loss": -28.29542350769043, "global_step": 580978, "epoch": 6999} {"train_loss": -27.6441707611084, "global_step": 580979, "epoch": 6999} {"train_loss": -27.623035430908203, "global_step": 580980, "epoch": 6999} {"train_loss": -28.23029136657715, "global_step": 580981, "epoch": 6999} {"train_loss": -27.88465690612793, "global_step": 580982, "epoch": 6999} {"train_loss": -27.911823272705078, "global_step": 580983, "epoch": 6999} {"train_loss": -28.045896530151367, "global_step": 580984, "epoch": 6999} {"train_loss": -27.936634063720703, "global_step": 580985, "epoch": 6999} {"train_loss": -28.28312110900879, "global_step": 580986, "epoch": 6999} {"train_loss": -28.084585189819336, "global_step": 580987, "epoch": 6999} {"train_loss": -27.73291015625, "global_step": 580988, "epoch": 6999} {"train_loss": -28.072296142578125, "global_step": 580989, "epoch": 6999} {"train_loss": -28.304214477539062, "global_step": 580990, "epoch": 6999} {"train_loss": -27.823760986328125, "global_step": 580991, "epoch": 6999} {"train_loss": -28.14539909362793, "global_step": 580992, "epoch": 6999} {"train_loss": -27.89876365661621, "global_step": 580993, "epoch": 6999} {"train_loss": -28.33306884765625, "global_step": 580994, "epoch": 6999} {"train_loss": -28.152490615844727, "global_step": 580995, "epoch": 6999} {"train_loss": -28.33631706237793, "global_step": 580996, "epoch": 6999} {"train_loss": -28.221881866455078, "global_step": 580997, "epoch": 6999} {"train_loss": -28.265491485595703, "global_step": 580998, "epoch": 6999} {"train_loss": -27.817715357585126, "global_step": 580999, "epoch": 6999, "val_loss": 6432823.0} {"train_loss": -27.893903732299805, "global_step": 581000, "epoch": 7000} {"train_loss": -27.646228790283203, "global_step": 581001, "epoch": 7000} {"train_loss": -27.31821632385254, "global_step": 581002, "epoch": 7000} {"train_loss": -27.729766845703125, "global_step": 581003, "epoch": 7000} {"train_loss": -28.31839942932129, "global_step": 581004, "epoch": 7000} {"train_loss": -27.528003692626953, "global_step": 581005, "epoch": 7000} {"train_loss": -27.336591720581055, "global_step": 581006, "epoch": 7000} {"train_loss": -27.282209396362305, "global_step": 581007, "epoch": 7000} {"train_loss": -27.274526596069336, "global_step": 581008, "epoch": 7000} {"train_loss": -27.488813400268555, "global_step": 581009, "epoch": 7000} {"train_loss": -27.558027267456055, "global_step": 581010, "epoch": 7000} {"train_loss": -27.836109161376953, "global_step": 581011, "epoch": 7000} {"train_loss": -27.47018814086914, "global_step": 581012, "epoch": 7000} {"train_loss": -27.98652458190918, "global_step": 581013, "epoch": 7000} {"train_loss": -27.37436294555664, "global_step": 581014, "epoch": 7000} {"train_loss": -27.456378936767578, "global_step": 581015, "epoch": 7000} {"train_loss": -27.592849731445312, "global_step": 581016, "epoch": 7000} {"train_loss": -27.7858829498291, "global_step": 581017, "epoch": 7000} {"train_loss": -27.708463668823242, "global_step": 581018, "epoch": 7000} {"train_loss": -27.539764404296875, "global_step": 581019, "epoch": 7000} {"train_loss": -27.538442611694336, "global_step": 581020, "epoch": 7000} {"train_loss": -27.488168716430664, "global_step": 581021, "epoch": 7000} {"train_loss": -28.042266845703125, "global_step": 581022, "epoch": 7000} {"train_loss": -27.50648307800293, "global_step": 581023, "epoch": 7000} {"train_loss": -28.099292755126953, "global_step": 581024, "epoch": 7000} {"train_loss": -27.510175704956055, "global_step": 581025, "epoch": 7000} {"train_loss": -27.69672966003418, "global_step": 581026, "epoch": 7000} {"train_loss": -27.882612228393555, "global_step": 581027, "epoch": 7000} {"train_loss": -27.832157135009766, "global_step": 581028, "epoch": 7000} {"train_loss": -27.819995880126953, "global_step": 581029, "epoch": 7000} {"train_loss": -27.658832550048828, "global_step": 581030, "epoch": 7000} {"train_loss": -28.10983657836914, "global_step": 581031, "epoch": 7000} {"train_loss": -27.930927276611328, "global_step": 581032, "epoch": 7000} {"train_loss": -27.9586238861084, "global_step": 581033, "epoch": 7000} {"train_loss": -27.866683959960938, "global_step": 581034, "epoch": 7000} {"train_loss": -28.16266441345215, "global_step": 581035, "epoch": 7000} {"train_loss": -28.10694694519043, "global_step": 581036, "epoch": 7000} {"train_loss": -27.8886661529541, "global_step": 581037, "epoch": 7000} {"train_loss": -27.744287490844727, "global_step": 581038, "epoch": 7000} {"train_loss": -28.052356719970703, "global_step": 581039, "epoch": 7000} {"train_loss": -27.831592559814453, "global_step": 581040, "epoch": 7000} {"train_loss": -28.034255981445312, "global_step": 581041, "epoch": 7000} {"train_loss": -27.917200088500977, "global_step": 581042, "epoch": 7000} {"train_loss": -27.638931274414062, "global_step": 581043, "epoch": 7000} {"train_loss": -28.26993751525879, "global_step": 581044, "epoch": 7000} {"train_loss": -28.075424194335938, "global_step": 581045, "epoch": 7000} {"train_loss": -28.061969757080078, "global_step": 581046, "epoch": 7000} {"train_loss": -27.68216896057129, "global_step": 581047, "epoch": 7000} {"train_loss": -27.81890296936035, "global_step": 581048, "epoch": 7000} {"train_loss": -27.537506103515625, "global_step": 581049, "epoch": 7000} {"train_loss": -27.905105590820312, "global_step": 581050, "epoch": 7000} {"train_loss": -28.358991622924805, "global_step": 581051, "epoch": 7000} {"train_loss": -28.08892822265625, "global_step": 581052, "epoch": 7000} {"train_loss": -27.9592342376709, "global_step": 581053, "epoch": 7000} {"train_loss": -27.91035270690918, "global_step": 581054, "epoch": 7000} {"train_loss": -28.213125228881836, "global_step": 581055, "epoch": 7000} {"train_loss": -28.3710880279541, "global_step": 581056, "epoch": 7000} {"train_loss": -28.016712188720703, "global_step": 581057, "epoch": 7000} {"train_loss": -27.75665855407715, "global_step": 581058, "epoch": 7000} {"train_loss": -27.82233238220215, "global_step": 581059, "epoch": 7000} {"train_loss": -28.31431007385254, "global_step": 581060, "epoch": 7000} {"train_loss": -28.234149932861328, "global_step": 581061, "epoch": 7000} {"train_loss": -27.989694595336914, "global_step": 581062, "epoch": 7000} {"train_loss": -28.282562255859375, "global_step": 581063, "epoch": 7000} {"train_loss": -28.1816349029541, "global_step": 581064, "epoch": 7000} {"train_loss": -27.369964599609375, "global_step": 581065, "epoch": 7000} {"train_loss": -27.62762451171875, "global_step": 581066, "epoch": 7000} {"train_loss": -26.980091094970703, "global_step": 581067, "epoch": 7000} {"train_loss": -26.845264434814453, "global_step": 581068, "epoch": 7000} {"train_loss": -27.639434814453125, "global_step": 581069, "epoch": 7000} {"train_loss": -27.71870231628418, "global_step": 581070, "epoch": 7000} {"train_loss": -27.034521102905273, "global_step": 581071, "epoch": 7000} {"train_loss": -27.028188705444336, "global_step": 581072, "epoch": 7000} {"train_loss": -27.662214279174805, "global_step": 581073, "epoch": 7000} {"train_loss": -26.904539108276367, "global_step": 581074, "epoch": 7000} {"train_loss": -28.01922035217285, "global_step": 581075, "epoch": 7000} {"train_loss": -27.38385581970215, "global_step": 581076, "epoch": 7000} {"train_loss": -27.631458282470703, "global_step": 581077, "epoch": 7000} {"train_loss": -27.734777450561523, "global_step": 581078, "epoch": 7000} {"train_loss": -27.821149826049805, "global_step": 581079, "epoch": 7000} {"train_loss": -27.815204620361328, "global_step": 581080, "epoch": 7000} {"train_loss": -27.874990463256836, "global_step": 581081, "epoch": 7000} {"train_loss": -27.744881135871612, "global_step": 581082, "epoch": 7000, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8181818181818182, "val_loss": 6491181.5} {"train_loss": -26.54463005065918, "global_step": 581083, "epoch": 7001} {"train_loss": -26.762189865112305, "global_step": 581084, "epoch": 7001} {"train_loss": -27.168365478515625, "global_step": 581085, "epoch": 7001} {"train_loss": -26.554706573486328, "global_step": 581086, "epoch": 7001} {"train_loss": -27.303730010986328, "global_step": 581087, "epoch": 7001} {"train_loss": -26.626392364501953, "global_step": 581088, "epoch": 7001} {"train_loss": -27.273889541625977, "global_step": 581089, "epoch": 7001} {"train_loss": -26.959997177124023, "global_step": 581090, "epoch": 7001} {"train_loss": -27.458173751831055, "global_step": 581091, "epoch": 7001} {"train_loss": -27.4200382232666, "global_step": 581092, "epoch": 7001} {"train_loss": -27.697607040405273, "global_step": 581093, "epoch": 7001} {"train_loss": -27.768598556518555, "global_step": 581094, "epoch": 7001} {"train_loss": -27.67170524597168, "global_step": 581095, "epoch": 7001} {"train_loss": -27.689233779907227, "global_step": 581096, "epoch": 7001} {"train_loss": -27.476593017578125, "global_step": 581097, "epoch": 7001} {"train_loss": -27.63880729675293, "global_step": 581098, "epoch": 7001} {"train_loss": -27.698007583618164, "global_step": 581099, "epoch": 7001} {"train_loss": -27.618432998657227, "global_step": 581100, "epoch": 7001} {"train_loss": -27.757720947265625, "global_step": 581101, "epoch": 7001} {"train_loss": -27.81525993347168, "global_step": 581102, "epoch": 7001} {"train_loss": -27.745656967163086, "global_step": 581103, "epoch": 7001} {"train_loss": -28.01429557800293, "global_step": 581104, "epoch": 7001} {"train_loss": -27.536291122436523, "global_step": 581105, "epoch": 7001} {"train_loss": -28.057214736938477, "global_step": 581106, "epoch": 7001} {"train_loss": -27.69121742248535, "global_step": 581107, "epoch": 7001} {"train_loss": -27.778974533081055, "global_step": 581108, "epoch": 7001} {"train_loss": -27.854150772094727, "global_step": 581109, "epoch": 7001} {"train_loss": -27.73689842224121, "global_step": 581110, "epoch": 7001} {"train_loss": -28.276565551757812, "global_step": 581111, "epoch": 7001} {"train_loss": -27.763574600219727, "global_step": 581112, "epoch": 7001} {"train_loss": -27.832849502563477, "global_step": 581113, "epoch": 7001} {"train_loss": -27.8698787689209, "global_step": 581114, "epoch": 7001} {"train_loss": -28.266082763671875, "global_step": 581115, "epoch": 7001} {"train_loss": -28.128986358642578, "global_step": 581116, "epoch": 7001} {"train_loss": -27.890356063842773, "global_step": 581117, "epoch": 7001} {"train_loss": -28.10530662536621, "global_step": 581118, "epoch": 7001} {"train_loss": -28.127531051635742, "global_step": 581119, "epoch": 7001} {"train_loss": -27.859968185424805, "global_step": 581120, "epoch": 7001} {"train_loss": -27.839162826538086, "global_step": 581121, "epoch": 7001} {"train_loss": -27.955204010009766, "global_step": 581122, "epoch": 7001} {"train_loss": -27.972944259643555, "global_step": 581123, "epoch": 7001} {"train_loss": -28.142841339111328, "global_step": 581124, "epoch": 7001} {"train_loss": -27.58461570739746, "global_step": 581125, "epoch": 7001} {"train_loss": -27.869171142578125, "global_step": 581126, "epoch": 7001} {"train_loss": -28.008840560913086, "global_step": 581127, "epoch": 7001} {"train_loss": -28.359527587890625, "global_step": 581128, "epoch": 7001} {"train_loss": -28.02643394470215, "global_step": 581129, "epoch": 7001} {"train_loss": -27.788589477539062, "global_step": 581130, "epoch": 7001} {"train_loss": -28.677398681640625, "global_step": 581131, "epoch": 7001} {"train_loss": -28.200366973876953, "global_step": 581132, "epoch": 7001} {"train_loss": -28.258092880249023, "global_step": 581133, "epoch": 7001} {"train_loss": -28.012842178344727, "global_step": 581134, "epoch": 7001} {"train_loss": -28.15280532836914, "global_step": 581135, "epoch": 7001} {"train_loss": -27.877599716186523, "global_step": 581136, "epoch": 7001} {"train_loss": -28.35162925720215, "global_step": 581137, "epoch": 7001} {"train_loss": -27.74830436706543, "global_step": 581138, "epoch": 7001} {"train_loss": -27.996000289916992, "global_step": 581139, "epoch": 7001} {"train_loss": -28.0978946685791, "global_step": 581140, "epoch": 7001} {"train_loss": -28.19233512878418, "global_step": 581141, "epoch": 7001} {"train_loss": -28.461462020874023, "global_step": 581142, "epoch": 7001} {"train_loss": -28.3604679107666, "global_step": 581143, "epoch": 7001} {"train_loss": -28.056859970092773, "global_step": 581144, "epoch": 7001} {"train_loss": -27.7625732421875, "global_step": 581145, "epoch": 7001} {"train_loss": -27.443933486938477, "global_step": 581146, "epoch": 7001} {"train_loss": -27.408430099487305, "global_step": 581147, "epoch": 7001} {"train_loss": -26.436279296875, "global_step": 581148, "epoch": 7001} {"train_loss": -25.430967330932617, "global_step": 581149, "epoch": 7001} {"train_loss": -26.79618263244629, "global_step": 581150, "epoch": 7001} {"train_loss": -27.65046501159668, "global_step": 581151, "epoch": 7001} {"train_loss": -26.342477798461914, "global_step": 581152, "epoch": 7001} {"train_loss": -26.63286781311035, "global_step": 581153, "epoch": 7001} {"train_loss": -27.602558135986328, "global_step": 581154, "epoch": 7001} {"train_loss": -27.2684383392334, "global_step": 581155, "epoch": 7001} {"train_loss": -27.72254753112793, "global_step": 581156, "epoch": 7001} {"train_loss": -27.289602279663086, "global_step": 581157, "epoch": 7001} {"train_loss": -27.498273849487305, "global_step": 581158, "epoch": 7001} {"train_loss": -27.421512603759766, "global_step": 581159, "epoch": 7001} {"train_loss": -27.25738525390625, "global_step": 581160, "epoch": 7001} {"train_loss": -27.796751022338867, "global_step": 581161, "epoch": 7001} {"train_loss": -27.366662979125977, "global_step": 581162, "epoch": 7001} {"train_loss": -27.657262802124023, "global_step": 581163, "epoch": 7001} {"train_loss": -27.65630531311035, "global_step": 581164, "epoch": 7001} {"train_loss": -27.673251278429145, "global_step": 581165, "epoch": 7001, "val_loss": 6376446.0} {"train_loss": -27.665735244750977, "global_step": 581166, "epoch": 7002} {"train_loss": -27.27005386352539, "global_step": 581167, "epoch": 7002} {"train_loss": -27.465728759765625, "global_step": 581168, "epoch": 7002} {"train_loss": -27.410741806030273, "global_step": 581169, "epoch": 7002} {"train_loss": -27.507837295532227, "global_step": 581170, "epoch": 7002} {"train_loss": -27.072402954101562, "global_step": 581171, "epoch": 7002} {"train_loss": -27.555133819580078, "global_step": 581172, "epoch": 7002} {"train_loss": -27.28169059753418, "global_step": 581173, "epoch": 7002} {"train_loss": -27.525487899780273, "global_step": 581174, "epoch": 7002} {"train_loss": -27.66925621032715, "global_step": 581175, "epoch": 7002} {"train_loss": -27.4832763671875, "global_step": 581176, "epoch": 7002} {"train_loss": -27.599096298217773, "global_step": 581177, "epoch": 7002} {"train_loss": -27.56976318359375, "global_step": 581178, "epoch": 7002} {"train_loss": -28.119733810424805, "global_step": 581179, "epoch": 7002} {"train_loss": -27.8489990234375, "global_step": 581180, "epoch": 7002} {"train_loss": -27.738117218017578, "global_step": 581181, "epoch": 7002} {"train_loss": -27.909276962280273, "global_step": 581182, "epoch": 7002} {"train_loss": -27.929548263549805, "global_step": 581183, "epoch": 7002} {"train_loss": -27.990976333618164, "global_step": 581184, "epoch": 7002} {"train_loss": -28.067981719970703, "global_step": 581185, "epoch": 7002} {"train_loss": -27.587879180908203, "global_step": 581186, "epoch": 7002} {"train_loss": -27.79144859313965, "global_step": 581187, "epoch": 7002} {"train_loss": -27.75856590270996, "global_step": 581188, "epoch": 7002} {"train_loss": -28.164854049682617, "global_step": 581189, "epoch": 7002} {"train_loss": -27.765729904174805, "global_step": 581190, "epoch": 7002} {"train_loss": -27.926746368408203, "global_step": 581191, "epoch": 7002} {"train_loss": -28.086576461791992, "global_step": 581192, "epoch": 7002} {"train_loss": -28.38071632385254, "global_step": 581193, "epoch": 7002} {"train_loss": -27.49654197692871, "global_step": 581194, "epoch": 7002} {"train_loss": -28.120641708374023, "global_step": 581195, "epoch": 7002} {"train_loss": -27.935041427612305, "global_step": 581196, "epoch": 7002} {"train_loss": -27.8819580078125, "global_step": 581197, "epoch": 7002} {"train_loss": -28.270185470581055, "global_step": 581198, "epoch": 7002} {"train_loss": -27.969343185424805, "global_step": 581199, "epoch": 7002} {"train_loss": -28.380115509033203, "global_step": 581200, "epoch": 7002} {"train_loss": -27.741193771362305, "global_step": 581201, "epoch": 7002} {"train_loss": -27.851810455322266, "global_step": 581202, "epoch": 7002} {"train_loss": -27.533605575561523, "global_step": 581203, "epoch": 7002} {"train_loss": -27.798383712768555, "global_step": 581204, "epoch": 7002} {"train_loss": -28.28388023376465, "global_step": 581205, "epoch": 7002} {"train_loss": -28.128320693969727, "global_step": 581206, "epoch": 7002} {"train_loss": -28.09906005859375, "global_step": 581207, "epoch": 7002} {"train_loss": -27.816070556640625, "global_step": 581208, "epoch": 7002} {"train_loss": -27.801843643188477, "global_step": 581209, "epoch": 7002} {"train_loss": -28.0966739654541, "global_step": 581210, "epoch": 7002} {"train_loss": -27.740964889526367, "global_step": 581211, "epoch": 7002} {"train_loss": -27.603368759155273, "global_step": 581212, "epoch": 7002} {"train_loss": -28.245153427124023, "global_step": 581213, "epoch": 7002} {"train_loss": -27.765039443969727, "global_step": 581214, "epoch": 7002} {"train_loss": -28.25191307067871, "global_step": 581215, "epoch": 7002} {"train_loss": -28.060468673706055, "global_step": 581216, "epoch": 7002} {"train_loss": -27.88823890686035, "global_step": 581217, "epoch": 7002} {"train_loss": -28.11732292175293, "global_step": 581218, "epoch": 7002} {"train_loss": -27.781564712524414, "global_step": 581219, "epoch": 7002} {"train_loss": -27.93450355529785, "global_step": 581220, "epoch": 7002} {"train_loss": -27.896570205688477, "global_step": 581221, "epoch": 7002} {"train_loss": -27.934980392456055, "global_step": 581222, "epoch": 7002} {"train_loss": -28.337833404541016, "global_step": 581223, "epoch": 7002} {"train_loss": -28.13457679748535, "global_step": 581224, "epoch": 7002} {"train_loss": -27.905988693237305, "global_step": 581225, "epoch": 7002} {"train_loss": -27.8731689453125, "global_step": 581226, "epoch": 7002} {"train_loss": -28.3632755279541, "global_step": 581227, "epoch": 7002} {"train_loss": -27.959150314331055, "global_step": 581228, "epoch": 7002} {"train_loss": -27.976715087890625, "global_step": 581229, "epoch": 7002} {"train_loss": -28.00868034362793, "global_step": 581230, "epoch": 7002} {"train_loss": -28.129064559936523, "global_step": 581231, "epoch": 7002} {"train_loss": -28.250598907470703, "global_step": 581232, "epoch": 7002} {"train_loss": -28.397287368774414, "global_step": 581233, "epoch": 7002} {"train_loss": -28.24045753479004, "global_step": 581234, "epoch": 7002} {"train_loss": -28.05755615234375, "global_step": 581235, "epoch": 7002} {"train_loss": -27.89019775390625, "global_step": 581236, "epoch": 7002} {"train_loss": -28.351200103759766, "global_step": 581237, "epoch": 7002} {"train_loss": -28.2977352142334, "global_step": 581238, "epoch": 7002} {"train_loss": -27.971708297729492, "global_step": 581239, "epoch": 7002} {"train_loss": -27.617481231689453, "global_step": 581240, "epoch": 7002} {"train_loss": -27.863134384155273, "global_step": 581241, "epoch": 7002} {"train_loss": -27.803064346313477, "global_step": 581242, "epoch": 7002} {"train_loss": -27.858154296875, "global_step": 581243, "epoch": 7002} {"train_loss": -27.865896224975586, "global_step": 581244, "epoch": 7002} {"train_loss": -27.956567764282227, "global_step": 581245, "epoch": 7002} {"train_loss": -28.110336303710938, "global_step": 581246, "epoch": 7002} {"train_loss": -27.731281280517578, "global_step": 581247, "epoch": 7002} {"train_loss": -27.882016400256788, "global_step": 581248, "epoch": 7002, "val_loss": 6554323.0} {"train_loss": -26.255573272705078, "global_step": 581249, "epoch": 7003} {"train_loss": -25.561445236206055, "global_step": 581250, "epoch": 7003} {"train_loss": -26.575641632080078, "global_step": 581251, "epoch": 7003} {"train_loss": -26.02543067932129, "global_step": 581252, "epoch": 7003} {"train_loss": -26.185434341430664, "global_step": 581253, "epoch": 7003} {"train_loss": -26.451629638671875, "global_step": 581254, "epoch": 7003} {"train_loss": -26.725797653198242, "global_step": 581255, "epoch": 7003} {"train_loss": -26.692474365234375, "global_step": 581256, "epoch": 7003} {"train_loss": -26.632863998413086, "global_step": 581257, "epoch": 7003} {"train_loss": -26.873233795166016, "global_step": 581258, "epoch": 7003} {"train_loss": -26.9872989654541, "global_step": 581259, "epoch": 7003} {"train_loss": -27.102502822875977, "global_step": 581260, "epoch": 7003} {"train_loss": -27.2533016204834, "global_step": 581261, "epoch": 7003} {"train_loss": -27.304473876953125, "global_step": 581262, "epoch": 7003} {"train_loss": -27.220428466796875, "global_step": 581263, "epoch": 7003} {"train_loss": -27.24826431274414, "global_step": 581264, "epoch": 7003} {"train_loss": -27.285919189453125, "global_step": 581265, "epoch": 7003} {"train_loss": -27.417713165283203, "global_step": 581266, "epoch": 7003} {"train_loss": -27.51385498046875, "global_step": 581267, "epoch": 7003} {"train_loss": -27.44527244567871, "global_step": 581268, "epoch": 7003} {"train_loss": -27.736474990844727, "global_step": 581269, "epoch": 7003} {"train_loss": -27.622161865234375, "global_step": 581270, "epoch": 7003} {"train_loss": -27.61163902282715, "global_step": 581271, "epoch": 7003} {"train_loss": -27.739059448242188, "global_step": 581272, "epoch": 7003} {"train_loss": -27.552549362182617, "global_step": 581273, "epoch": 7003} {"train_loss": -27.520288467407227, "global_step": 581274, "epoch": 7003} {"train_loss": -28.152978897094727, "global_step": 581275, "epoch": 7003} {"train_loss": -27.375898361206055, "global_step": 581276, "epoch": 7003} {"train_loss": -27.62748146057129, "global_step": 581277, "epoch": 7003} {"train_loss": -27.75115394592285, "global_step": 581278, "epoch": 7003} {"train_loss": -27.808135986328125, "global_step": 581279, "epoch": 7003} {"train_loss": -27.51398277282715, "global_step": 581280, "epoch": 7003} {"train_loss": -27.434778213500977, "global_step": 581281, "epoch": 7003} {"train_loss": -27.689138412475586, "global_step": 581282, "epoch": 7003} {"train_loss": -27.832931518554688, "global_step": 581283, "epoch": 7003} {"train_loss": -27.7518253326416, "global_step": 581284, "epoch": 7003} {"train_loss": -27.962848663330078, "global_step": 581285, "epoch": 7003} {"train_loss": -27.687393188476562, "global_step": 581286, "epoch": 7003} {"train_loss": -28.132368087768555, "global_step": 581287, "epoch": 7003} {"train_loss": -27.979623794555664, "global_step": 581288, "epoch": 7003} {"train_loss": -27.668668746948242, "global_step": 581289, "epoch": 7003} {"train_loss": -27.998382568359375, "global_step": 581290, "epoch": 7003} {"train_loss": -27.91541862487793, "global_step": 581291, "epoch": 7003} {"train_loss": -28.157148361206055, "global_step": 581292, "epoch": 7003} {"train_loss": -28.064685821533203, "global_step": 581293, "epoch": 7003} {"train_loss": -27.805078506469727, "global_step": 581294, "epoch": 7003} {"train_loss": -27.9788761138916, "global_step": 581295, "epoch": 7003} {"train_loss": -27.95230484008789, "global_step": 581296, "epoch": 7003} {"train_loss": -28.13836097717285, "global_step": 581297, "epoch": 7003} {"train_loss": -27.874774932861328, "global_step": 581298, "epoch": 7003} {"train_loss": -27.62774658203125, "global_step": 581299, "epoch": 7003} {"train_loss": -28.104536056518555, "global_step": 581300, "epoch": 7003} {"train_loss": -28.064987182617188, "global_step": 581301, "epoch": 7003} {"train_loss": -28.190244674682617, "global_step": 581302, "epoch": 7003} {"train_loss": -28.127105712890625, "global_step": 581303, "epoch": 7003} {"train_loss": -28.528076171875, "global_step": 581304, "epoch": 7003} {"train_loss": -27.886188507080078, "global_step": 581305, "epoch": 7003} {"train_loss": -28.132587432861328, "global_step": 581306, "epoch": 7003} {"train_loss": -28.44537925720215, "global_step": 581307, "epoch": 7003} {"train_loss": -27.89019203186035, "global_step": 581308, "epoch": 7003} {"train_loss": -28.323993682861328, "global_step": 581309, "epoch": 7003} {"train_loss": -27.97102165222168, "global_step": 581310, "epoch": 7003} {"train_loss": -28.061553955078125, "global_step": 581311, "epoch": 7003} {"train_loss": -28.004133224487305, "global_step": 581312, "epoch": 7003} {"train_loss": -27.7541561126709, "global_step": 581313, "epoch": 7003} {"train_loss": -27.573490142822266, "global_step": 581314, "epoch": 7003} {"train_loss": -27.91655921936035, "global_step": 581315, "epoch": 7003} {"train_loss": -28.038354873657227, "global_step": 581316, "epoch": 7003} {"train_loss": -28.098440170288086, "global_step": 581317, "epoch": 7003} {"train_loss": -28.4154109954834, "global_step": 581318, "epoch": 7003} {"train_loss": -28.01983642578125, "global_step": 581319, "epoch": 7003} {"train_loss": -27.822919845581055, "global_step": 581320, "epoch": 7003} {"train_loss": -27.50336265563965, "global_step": 581321, "epoch": 7003} {"train_loss": -27.62885093688965, "global_step": 581322, "epoch": 7003} {"train_loss": -27.06977653503418, "global_step": 581323, "epoch": 7003} {"train_loss": -27.41843605041504, "global_step": 581324, "epoch": 7003} {"train_loss": -27.66547966003418, "global_step": 581325, "epoch": 7003} {"train_loss": -27.838623046875, "global_step": 581326, "epoch": 7003} {"train_loss": -27.53263282775879, "global_step": 581327, "epoch": 7003} {"train_loss": -27.744384765625, "global_step": 581328, "epoch": 7003} {"train_loss": -27.59468650817871, "global_step": 581329, "epoch": 7003} {"train_loss": -27.517892837524414, "global_step": 581330, "epoch": 7003} {"train_loss": -27.603383305561113, "global_step": 581331, "epoch": 7003, "val_loss": 6595017.0} {"train_loss": -27.37255859375, "global_step": 581332, "epoch": 7004} {"train_loss": -26.746292114257812, "global_step": 581333, "epoch": 7004} {"train_loss": -26.357135772705078, "global_step": 581334, "epoch": 7004} {"train_loss": -26.898969650268555, "global_step": 581335, "epoch": 7004} {"train_loss": -27.081357955932617, "global_step": 581336, "epoch": 7004} {"train_loss": -27.085752487182617, "global_step": 581337, "epoch": 7004} {"train_loss": -26.946592330932617, "global_step": 581338, "epoch": 7004} {"train_loss": -26.931432723999023, "global_step": 581339, "epoch": 7004} {"train_loss": -27.521936416625977, "global_step": 581340, "epoch": 7004} {"train_loss": -27.26030921936035, "global_step": 581341, "epoch": 7004} {"train_loss": -27.037403106689453, "global_step": 581342, "epoch": 7004} {"train_loss": -27.352453231811523, "global_step": 581343, "epoch": 7004} {"train_loss": -27.09364128112793, "global_step": 581344, "epoch": 7004} {"train_loss": -27.431684494018555, "global_step": 581345, "epoch": 7004} {"train_loss": -27.2703857421875, "global_step": 581346, "epoch": 7004} {"train_loss": -27.030935287475586, "global_step": 581347, "epoch": 7004} {"train_loss": -27.28289222717285, "global_step": 581348, "epoch": 7004} {"train_loss": -27.488759994506836, "global_step": 581349, "epoch": 7004} {"train_loss": -27.6092529296875, "global_step": 581350, "epoch": 7004} {"train_loss": -27.38077163696289, "global_step": 581351, "epoch": 7004} {"train_loss": -27.58685874938965, "global_step": 581352, "epoch": 7004} {"train_loss": -27.30112075805664, "global_step": 581353, "epoch": 7004} {"train_loss": -27.45612907409668, "global_step": 581354, "epoch": 7004} {"train_loss": -27.467487335205078, "global_step": 581355, "epoch": 7004} {"train_loss": -27.540945053100586, "global_step": 581356, "epoch": 7004} {"train_loss": -27.538297653198242, "global_step": 581357, "epoch": 7004} {"train_loss": -27.609893798828125, "global_step": 581358, "epoch": 7004} {"train_loss": -27.72073745727539, "global_step": 581359, "epoch": 7004} {"train_loss": -27.685810089111328, "global_step": 581360, "epoch": 7004} {"train_loss": -27.607440948486328, "global_step": 581361, "epoch": 7004} {"train_loss": -27.804540634155273, "global_step": 581362, "epoch": 7004} {"train_loss": -27.880762100219727, "global_step": 581363, "epoch": 7004} {"train_loss": -27.874710083007812, "global_step": 581364, "epoch": 7004} {"train_loss": -27.659910202026367, "global_step": 581365, "epoch": 7004} {"train_loss": -27.6578426361084, "global_step": 581366, "epoch": 7004} {"train_loss": -27.76905632019043, "global_step": 581367, "epoch": 7004} {"train_loss": -27.72307777404785, "global_step": 581368, "epoch": 7004} {"train_loss": -28.177783966064453, "global_step": 581369, "epoch": 7004} {"train_loss": -27.781164169311523, "global_step": 581370, "epoch": 7004} {"train_loss": -27.81973648071289, "global_step": 581371, "epoch": 7004} {"train_loss": -28.313100814819336, "global_step": 581372, "epoch": 7004} {"train_loss": -27.711767196655273, "global_step": 581373, "epoch": 7004} {"train_loss": -27.971603393554688, "global_step": 581374, "epoch": 7004} {"train_loss": -27.788293838500977, "global_step": 581375, "epoch": 7004} {"train_loss": -28.17279624938965, "global_step": 581376, "epoch": 7004} {"train_loss": -27.85639762878418, "global_step": 581377, "epoch": 7004} {"train_loss": -27.9570369720459, "global_step": 581378, "epoch": 7004} {"train_loss": -27.945606231689453, "global_step": 581379, "epoch": 7004} {"train_loss": -27.809850692749023, "global_step": 581380, "epoch": 7004} {"train_loss": -27.947301864624023, "global_step": 581381, "epoch": 7004} {"train_loss": -28.01210594177246, "global_step": 581382, "epoch": 7004} {"train_loss": -27.991321563720703, "global_step": 581383, "epoch": 7004} {"train_loss": -28.281982421875, "global_step": 581384, "epoch": 7004} {"train_loss": -27.851367950439453, "global_step": 581385, "epoch": 7004} {"train_loss": -27.56739616394043, "global_step": 581386, "epoch": 7004} {"train_loss": -27.848154067993164, "global_step": 581387, "epoch": 7004} {"train_loss": -28.258512496948242, "global_step": 581388, "epoch": 7004} {"train_loss": -28.271804809570312, "global_step": 581389, "epoch": 7004} {"train_loss": -28.067174911499023, "global_step": 581390, "epoch": 7004} {"train_loss": -28.069974899291992, "global_step": 581391, "epoch": 7004} {"train_loss": -27.836807250976562, "global_step": 581392, "epoch": 7004} {"train_loss": -27.858600616455078, "global_step": 581393, "epoch": 7004} {"train_loss": -27.440658569335938, "global_step": 581394, "epoch": 7004} {"train_loss": -27.817096710205078, "global_step": 581395, "epoch": 7004} {"train_loss": -28.033838272094727, "global_step": 581396, "epoch": 7004} {"train_loss": -27.58994483947754, "global_step": 581397, "epoch": 7004} {"train_loss": -27.5416202545166, "global_step": 581398, "epoch": 7004} {"train_loss": -27.867446899414062, "global_step": 581399, "epoch": 7004} {"train_loss": -28.221899032592773, "global_step": 581400, "epoch": 7004} {"train_loss": -27.9937686920166, "global_step": 581401, "epoch": 7004} {"train_loss": -27.888254165649414, "global_step": 581402, "epoch": 7004} {"train_loss": -28.282739639282227, "global_step": 581403, "epoch": 7004} {"train_loss": -27.75716209411621, "global_step": 581404, "epoch": 7004} {"train_loss": -28.184284210205078, "global_step": 581405, "epoch": 7004} {"train_loss": -27.919769287109375, "global_step": 581406, "epoch": 7004} {"train_loss": -27.77358055114746, "global_step": 581407, "epoch": 7004} {"train_loss": -28.18251609802246, "global_step": 581408, "epoch": 7004} {"train_loss": -28.118194580078125, "global_step": 581409, "epoch": 7004} {"train_loss": -28.221948623657227, "global_step": 581410, "epoch": 7004} {"train_loss": -28.031005859375, "global_step": 581411, "epoch": 7004} {"train_loss": -28.003995895385742, "global_step": 581412, "epoch": 7004} {"train_loss": -27.97265625, "global_step": 581413, "epoch": 7004} {"train_loss": -27.696065466087983, "global_step": 581414, "epoch": 7004, "val_loss": 6550933.5} {"train_loss": -27.781925201416016, "global_step": 581415, "epoch": 7005} {"train_loss": -27.30624771118164, "global_step": 581416, "epoch": 7005} {"train_loss": -27.536157608032227, "global_step": 581417, "epoch": 7005} {"train_loss": -26.844318389892578, "global_step": 581418, "epoch": 7005} {"train_loss": -27.075439453125, "global_step": 581419, "epoch": 7005} {"train_loss": -27.210012435913086, "global_step": 581420, "epoch": 7005} {"train_loss": -27.84026527404785, "global_step": 581421, "epoch": 7005} {"train_loss": -27.491535186767578, "global_step": 581422, "epoch": 7005} {"train_loss": -27.571481704711914, "global_step": 581423, "epoch": 7005} {"train_loss": -27.898941040039062, "global_step": 581424, "epoch": 7005} {"train_loss": -27.692142486572266, "global_step": 581425, "epoch": 7005} {"train_loss": -27.8348388671875, "global_step": 581426, "epoch": 7005} {"train_loss": -27.717578887939453, "global_step": 581427, "epoch": 7005} {"train_loss": -27.648818969726562, "global_step": 581428, "epoch": 7005} {"train_loss": -27.83991813659668, "global_step": 581429, "epoch": 7005} {"train_loss": -27.60725975036621, "global_step": 581430, "epoch": 7005} {"train_loss": -27.334436416625977, "global_step": 581431, "epoch": 7005} {"train_loss": -27.620929718017578, "global_step": 581432, "epoch": 7005} {"train_loss": -27.635196685791016, "global_step": 581433, "epoch": 7005} {"train_loss": -27.59449577331543, "global_step": 581434, "epoch": 7005} {"train_loss": -27.84061050415039, "global_step": 581435, "epoch": 7005} {"train_loss": -27.694915771484375, "global_step": 581436, "epoch": 7005} {"train_loss": -27.779407501220703, "global_step": 581437, "epoch": 7005} {"train_loss": -27.809051513671875, "global_step": 581438, "epoch": 7005} {"train_loss": -27.804534912109375, "global_step": 581439, "epoch": 7005} {"train_loss": -27.991653442382812, "global_step": 581440, "epoch": 7005} {"train_loss": -27.86789894104004, "global_step": 581441, "epoch": 7005} {"train_loss": -27.782093048095703, "global_step": 581442, "epoch": 7005} {"train_loss": -27.938146591186523, "global_step": 581443, "epoch": 7005} {"train_loss": -27.7802677154541, "global_step": 581444, "epoch": 7005} {"train_loss": -28.06504249572754, "global_step": 581445, "epoch": 7005} {"train_loss": -27.8007755279541, "global_step": 581446, "epoch": 7005} {"train_loss": -27.868127822875977, "global_step": 581447, "epoch": 7005} {"train_loss": -28.1448917388916, "global_step": 581448, "epoch": 7005} {"train_loss": -27.794891357421875, "global_step": 581449, "epoch": 7005} {"train_loss": -28.100378036499023, "global_step": 581450, "epoch": 7005} {"train_loss": -28.350082397460938, "global_step": 581451, "epoch": 7005} {"train_loss": -27.937580108642578, "global_step": 581452, "epoch": 7005} {"train_loss": -28.04928970336914, "global_step": 581453, "epoch": 7005} {"train_loss": -28.187788009643555, "global_step": 581454, "epoch": 7005} {"train_loss": -27.79400062561035, "global_step": 581455, "epoch": 7005} {"train_loss": -27.957731246948242, "global_step": 581456, "epoch": 7005} {"train_loss": -27.88534927368164, "global_step": 581457, "epoch": 7005} {"train_loss": -27.77201271057129, "global_step": 581458, "epoch": 7005} {"train_loss": -27.886682510375977, "global_step": 581459, "epoch": 7005} {"train_loss": -28.34946060180664, "global_step": 581460, "epoch": 7005} {"train_loss": -28.65353775024414, "global_step": 581461, "epoch": 7005} {"train_loss": -27.9857234954834, "global_step": 581462, "epoch": 7005} {"train_loss": -27.974945068359375, "global_step": 581463, "epoch": 7005} {"train_loss": -28.13508415222168, "global_step": 581464, "epoch": 7005} {"train_loss": -28.27994155883789, "global_step": 581465, "epoch": 7005} {"train_loss": -28.14228630065918, "global_step": 581466, "epoch": 7005} {"train_loss": -28.154455184936523, "global_step": 581467, "epoch": 7005} {"train_loss": -28.213775634765625, "global_step": 581468, "epoch": 7005} {"train_loss": -27.900434494018555, "global_step": 581469, "epoch": 7005} {"train_loss": -27.897321701049805, "global_step": 581470, "epoch": 7005} {"train_loss": -28.195240020751953, "global_step": 581471, "epoch": 7005} {"train_loss": -27.965600967407227, "global_step": 581472, "epoch": 7005} {"train_loss": -28.19989013671875, "global_step": 581473, "epoch": 7005} {"train_loss": -28.016447067260742, "global_step": 581474, "epoch": 7005} {"train_loss": -27.819379806518555, "global_step": 581475, "epoch": 7005} {"train_loss": -27.228656768798828, "global_step": 581476, "epoch": 7005} {"train_loss": -26.711877822875977, "global_step": 581477, "epoch": 7005} {"train_loss": -27.793622970581055, "global_step": 581478, "epoch": 7005} {"train_loss": -27.689977645874023, "global_step": 581479, "epoch": 7005} {"train_loss": -27.408771514892578, "global_step": 581480, "epoch": 7005} {"train_loss": -27.658292770385742, "global_step": 581481, "epoch": 7005} {"train_loss": -28.205053329467773, "global_step": 581482, "epoch": 7005} {"train_loss": -27.759998321533203, "global_step": 581483, "epoch": 7005} {"train_loss": -27.767337799072266, "global_step": 581484, "epoch": 7005} {"train_loss": -28.141321182250977, "global_step": 581485, "epoch": 7005} {"train_loss": -27.687570571899414, "global_step": 581486, "epoch": 7005} {"train_loss": -27.51783561706543, "global_step": 581487, "epoch": 7005} {"train_loss": -27.403961181640625, "global_step": 581488, "epoch": 7005} {"train_loss": -28.140872955322266, "global_step": 581489, "epoch": 7005} {"train_loss": -27.7989501953125, "global_step": 581490, "epoch": 7005} {"train_loss": -27.927453994750977, "global_step": 581491, "epoch": 7005} {"train_loss": -27.88563346862793, "global_step": 581492, "epoch": 7005} {"train_loss": -28.290271759033203, "global_step": 581493, "epoch": 7005} {"train_loss": -27.783185958862305, "global_step": 581494, "epoch": 7005} {"train_loss": -28.30134391784668, "global_step": 581495, "epoch": 7005} {"train_loss": -28.00796890258789, "global_step": 581496, "epoch": 7005} {"train_loss": -27.837436423244245, "global_step": 581497, "epoch": 7005, "val_loss": 6502898.0} {"train_loss": -27.304431915283203, "global_step": 581498, "epoch": 7006} {"train_loss": -27.183303833007812, "global_step": 581499, "epoch": 7006} {"train_loss": -27.356800079345703, "global_step": 581500, "epoch": 7006} {"train_loss": -27.533283233642578, "global_step": 581501, "epoch": 7006} {"train_loss": -27.761274337768555, "global_step": 581502, "epoch": 7006} {"train_loss": -27.545621871948242, "global_step": 581503, "epoch": 7006} {"train_loss": -27.993566513061523, "global_step": 581504, "epoch": 7006} {"train_loss": -27.297826766967773, "global_step": 581505, "epoch": 7006} {"train_loss": -27.3421688079834, "global_step": 581506, "epoch": 7006} {"train_loss": -27.738330841064453, "global_step": 581507, "epoch": 7006} {"train_loss": -27.707794189453125, "global_step": 581508, "epoch": 7006} {"train_loss": -27.436941146850586, "global_step": 581509, "epoch": 7006} {"train_loss": -27.81571388244629, "global_step": 581510, "epoch": 7006} {"train_loss": -27.7440128326416, "global_step": 581511, "epoch": 7006} {"train_loss": -27.574472427368164, "global_step": 581512, "epoch": 7006} {"train_loss": -27.59453773498535, "global_step": 581513, "epoch": 7006} {"train_loss": -27.79107093811035, "global_step": 581514, "epoch": 7006} {"train_loss": -27.908857345581055, "global_step": 581515, "epoch": 7006} {"train_loss": -28.140777587890625, "global_step": 581516, "epoch": 7006} {"train_loss": -27.578622817993164, "global_step": 581517, "epoch": 7006} {"train_loss": -27.06339454650879, "global_step": 581518, "epoch": 7006} {"train_loss": -27.460468292236328, "global_step": 581519, "epoch": 7006} {"train_loss": -28.097318649291992, "global_step": 581520, "epoch": 7006} {"train_loss": -27.70160484313965, "global_step": 581521, "epoch": 7006} {"train_loss": -27.695392608642578, "global_step": 581522, "epoch": 7006} {"train_loss": -27.909759521484375, "global_step": 581523, "epoch": 7006} {"train_loss": -28.157690048217773, "global_step": 581524, "epoch": 7006} {"train_loss": -27.829517364501953, "global_step": 581525, "epoch": 7006} {"train_loss": -27.897876739501953, "global_step": 581526, "epoch": 7006} {"train_loss": -28.08555030822754, "global_step": 581527, "epoch": 7006} {"train_loss": -28.26995277404785, "global_step": 581528, "epoch": 7006} {"train_loss": -27.92268180847168, "global_step": 581529, "epoch": 7006} {"train_loss": -27.903644561767578, "global_step": 581530, "epoch": 7006} {"train_loss": -28.088415145874023, "global_step": 581531, "epoch": 7006} {"train_loss": -27.773221969604492, "global_step": 581532, "epoch": 7006} {"train_loss": -28.127384185791016, "global_step": 581533, "epoch": 7006} {"train_loss": -28.09844398498535, "global_step": 581534, "epoch": 7006} {"train_loss": -28.277280807495117, "global_step": 581535, "epoch": 7006} {"train_loss": -28.039295196533203, "global_step": 581536, "epoch": 7006} {"train_loss": -27.776514053344727, "global_step": 581537, "epoch": 7006} {"train_loss": -28.322967529296875, "global_step": 581538, "epoch": 7006} {"train_loss": -27.926679611206055, "global_step": 581539, "epoch": 7006} {"train_loss": -27.586511611938477, "global_step": 581540, "epoch": 7006} {"train_loss": -27.6817684173584, "global_step": 581541, "epoch": 7006} {"train_loss": -27.66745948791504, "global_step": 581542, "epoch": 7006} {"train_loss": -27.503021240234375, "global_step": 581543, "epoch": 7006} {"train_loss": -27.68145179748535, "global_step": 581544, "epoch": 7006} {"train_loss": -27.476438522338867, "global_step": 581545, "epoch": 7006} {"train_loss": -27.753137588500977, "global_step": 581546, "epoch": 7006} {"train_loss": -27.560590744018555, "global_step": 581547, "epoch": 7006} {"train_loss": -27.584125518798828, "global_step": 581548, "epoch": 7006} {"train_loss": -27.5672607421875, "global_step": 581549, "epoch": 7006} {"train_loss": -27.579853057861328, "global_step": 581550, "epoch": 7006} {"train_loss": -27.99761390686035, "global_step": 581551, "epoch": 7006} {"train_loss": -27.607421875, "global_step": 581552, "epoch": 7006} {"train_loss": -27.968725204467773, "global_step": 581553, "epoch": 7006} {"train_loss": -27.94464111328125, "global_step": 581554, "epoch": 7006} {"train_loss": -27.88043212890625, "global_step": 581555, "epoch": 7006} {"train_loss": -27.83945083618164, "global_step": 581556, "epoch": 7006} {"train_loss": -27.327829360961914, "global_step": 581557, "epoch": 7006} {"train_loss": -27.80902671813965, "global_step": 581558, "epoch": 7006} {"train_loss": -27.67156982421875, "global_step": 581559, "epoch": 7006} {"train_loss": -27.875452041625977, "global_step": 581560, "epoch": 7006} {"train_loss": -27.82588005065918, "global_step": 581561, "epoch": 7006} {"train_loss": -28.008657455444336, "global_step": 581562, "epoch": 7006} {"train_loss": -27.73299217224121, "global_step": 581563, "epoch": 7006} {"train_loss": -28.109710693359375, "global_step": 581564, "epoch": 7006} {"train_loss": -27.91411781311035, "global_step": 581565, "epoch": 7006} {"train_loss": -27.619537353515625, "global_step": 581566, "epoch": 7006} {"train_loss": -27.820648193359375, "global_step": 581567, "epoch": 7006} {"train_loss": -28.3044490814209, "global_step": 581568, "epoch": 7006} {"train_loss": -27.859174728393555, "global_step": 581569, "epoch": 7006} {"train_loss": -27.989179611206055, "global_step": 581570, "epoch": 7006} {"train_loss": -27.96954345703125, "global_step": 581571, "epoch": 7006} {"train_loss": -27.862768173217773, "global_step": 581572, "epoch": 7006} {"train_loss": -27.74798583984375, "global_step": 581573, "epoch": 7006} {"train_loss": -28.2385311126709, "global_step": 581574, "epoch": 7006} {"train_loss": -27.990442276000977, "global_step": 581575, "epoch": 7006} {"train_loss": -28.173974990844727, "global_step": 581576, "epoch": 7006} {"train_loss": -28.363006591796875, "global_step": 581577, "epoch": 7006} {"train_loss": -28.091787338256836, "global_step": 581578, "epoch": 7006} {"train_loss": -27.84173583984375, "global_step": 581579, "epoch": 7006} {"train_loss": -27.81171146071101, "global_step": 581580, "epoch": 7006, "val_loss": 6606187.0} {"train_loss": -27.78175926208496, "global_step": 581581, "epoch": 7007} {"train_loss": -27.374460220336914, "global_step": 581582, "epoch": 7007} {"train_loss": -27.779483795166016, "global_step": 581583, "epoch": 7007} {"train_loss": -27.39056396484375, "global_step": 581584, "epoch": 7007} {"train_loss": -26.592493057250977, "global_step": 581585, "epoch": 7007} {"train_loss": -27.032514572143555, "global_step": 581586, "epoch": 7007} {"train_loss": -27.366046905517578, "global_step": 581587, "epoch": 7007} {"train_loss": -26.82366943359375, "global_step": 581588, "epoch": 7007} {"train_loss": -26.56841468811035, "global_step": 581589, "epoch": 7007} {"train_loss": -27.64581298828125, "global_step": 581590, "epoch": 7007} {"train_loss": -26.589832305908203, "global_step": 581591, "epoch": 7007} {"train_loss": -27.497161865234375, "global_step": 581592, "epoch": 7007} {"train_loss": -26.794721603393555, "global_step": 581593, "epoch": 7007} {"train_loss": -27.086591720581055, "global_step": 581594, "epoch": 7007} {"train_loss": -26.89153480529785, "global_step": 581595, "epoch": 7007} {"train_loss": -27.2895450592041, "global_step": 581596, "epoch": 7007} {"train_loss": -27.164060592651367, "global_step": 581597, "epoch": 7007} {"train_loss": -27.314664840698242, "global_step": 581598, "epoch": 7007} {"train_loss": -27.318037033081055, "global_step": 581599, "epoch": 7007} {"train_loss": -28.058629989624023, "global_step": 581600, "epoch": 7007} {"train_loss": -27.24456214904785, "global_step": 581601, "epoch": 7007} {"train_loss": -27.3187313079834, "global_step": 581602, "epoch": 7007} {"train_loss": -28.172576904296875, "global_step": 581603, "epoch": 7007} {"train_loss": -27.453704833984375, "global_step": 581604, "epoch": 7007} {"train_loss": -27.407636642456055, "global_step": 581605, "epoch": 7007} {"train_loss": -27.85288429260254, "global_step": 581606, "epoch": 7007} {"train_loss": -27.582733154296875, "global_step": 581607, "epoch": 7007} {"train_loss": -27.456653594970703, "global_step": 581608, "epoch": 7007} {"train_loss": -27.74177360534668, "global_step": 581609, "epoch": 7007} {"train_loss": -28.063770294189453, "global_step": 581610, "epoch": 7007} {"train_loss": -27.629825592041016, "global_step": 581611, "epoch": 7007} {"train_loss": -27.90809440612793, "global_step": 581612, "epoch": 7007} {"train_loss": -27.495763778686523, "global_step": 581613, "epoch": 7007} {"train_loss": -27.769704818725586, "global_step": 581614, "epoch": 7007} {"train_loss": -27.82461929321289, "global_step": 581615, "epoch": 7007} {"train_loss": -28.050840377807617, "global_step": 581616, "epoch": 7007} {"train_loss": -27.886625289916992, "global_step": 581617, "epoch": 7007} {"train_loss": -27.91241455078125, "global_step": 581618, "epoch": 7007} {"train_loss": -27.9681339263916, "global_step": 581619, "epoch": 7007} {"train_loss": -27.792774200439453, "global_step": 581620, "epoch": 7007} {"train_loss": -27.87557029724121, "global_step": 581621, "epoch": 7007} {"train_loss": -27.750396728515625, "global_step": 581622, "epoch": 7007} {"train_loss": -28.108917236328125, "global_step": 581623, "epoch": 7007} {"train_loss": -28.208646774291992, "global_step": 581624, "epoch": 7007} {"train_loss": -27.919010162353516, "global_step": 581625, "epoch": 7007} {"train_loss": -27.978483200073242, "global_step": 581626, "epoch": 7007} {"train_loss": -28.074207305908203, "global_step": 581627, "epoch": 7007} {"train_loss": -28.12640380859375, "global_step": 581628, "epoch": 7007} {"train_loss": -28.054203033447266, "global_step": 581629, "epoch": 7007} {"train_loss": -27.937326431274414, "global_step": 581630, "epoch": 7007} {"train_loss": -28.275787353515625, "global_step": 581631, "epoch": 7007} {"train_loss": -28.119897842407227, "global_step": 581632, "epoch": 7007} {"train_loss": -27.817462921142578, "global_step": 581633, "epoch": 7007} {"train_loss": -28.030582427978516, "global_step": 581634, "epoch": 7007} {"train_loss": -27.9254207611084, "global_step": 581635, "epoch": 7007} {"train_loss": -28.00264549255371, "global_step": 581636, "epoch": 7007} {"train_loss": -28.200916290283203, "global_step": 581637, "epoch": 7007} {"train_loss": -27.868947982788086, "global_step": 581638, "epoch": 7007} {"train_loss": -27.636463165283203, "global_step": 581639, "epoch": 7007} {"train_loss": -28.044570922851562, "global_step": 581640, "epoch": 7007} {"train_loss": -28.13813591003418, "global_step": 581641, "epoch": 7007} {"train_loss": -28.194555282592773, "global_step": 581642, "epoch": 7007} {"train_loss": -27.818811416625977, "global_step": 581643, "epoch": 7007} {"train_loss": -27.55942153930664, "global_step": 581644, "epoch": 7007} {"train_loss": -27.99302101135254, "global_step": 581645, "epoch": 7007} {"train_loss": -28.20172691345215, "global_step": 581646, "epoch": 7007} {"train_loss": -27.95466423034668, "global_step": 581647, "epoch": 7007} {"train_loss": -28.251996994018555, "global_step": 581648, "epoch": 7007} {"train_loss": -28.423675537109375, "global_step": 581649, "epoch": 7007} {"train_loss": -28.00144386291504, "global_step": 581650, "epoch": 7007} {"train_loss": -28.0484619140625, "global_step": 581651, "epoch": 7007} {"train_loss": -28.067325592041016, "global_step": 581652, "epoch": 7007} {"train_loss": -27.667211532592773, "global_step": 581653, "epoch": 7007} {"train_loss": -28.164844512939453, "global_step": 581654, "epoch": 7007} {"train_loss": -27.93568229675293, "global_step": 581655, "epoch": 7007} {"train_loss": -27.62310218811035, "global_step": 581656, "epoch": 7007} {"train_loss": -27.820068359375, "global_step": 581657, "epoch": 7007} {"train_loss": -27.50446891784668, "global_step": 581658, "epoch": 7007} {"train_loss": -28.055225372314453, "global_step": 581659, "epoch": 7007} {"train_loss": -28.21221351623535, "global_step": 581660, "epoch": 7007} {"train_loss": -28.13616371154785, "global_step": 581661, "epoch": 7007} {"train_loss": -27.241230010986328, "global_step": 581662, "epoch": 7007} {"train_loss": -27.73532830663474, "global_step": 581663, "epoch": 7007, "val_loss": 6612455.0} {"train_loss": -27.40872573852539, "global_step": 581664, "epoch": 7008} {"train_loss": -27.47958755493164, "global_step": 581665, "epoch": 7008} {"train_loss": -26.82000160217285, "global_step": 581666, "epoch": 7008} {"train_loss": -26.37628746032715, "global_step": 581667, "epoch": 7008} {"train_loss": -25.86910057067871, "global_step": 581668, "epoch": 7008} {"train_loss": -26.69887351989746, "global_step": 581669, "epoch": 7008} {"train_loss": -26.766468048095703, "global_step": 581670, "epoch": 7008} {"train_loss": -27.015954971313477, "global_step": 581671, "epoch": 7008} {"train_loss": -26.723119735717773, "global_step": 581672, "epoch": 7008} {"train_loss": -26.66071128845215, "global_step": 581673, "epoch": 7008} {"train_loss": -27.122900009155273, "global_step": 581674, "epoch": 7008} {"train_loss": -27.341093063354492, "global_step": 581675, "epoch": 7008} {"train_loss": -27.402027130126953, "global_step": 581676, "epoch": 7008} {"train_loss": -27.47199058532715, "global_step": 581677, "epoch": 7008} {"train_loss": -27.2828426361084, "global_step": 581678, "epoch": 7008} {"train_loss": -27.719818115234375, "global_step": 581679, "epoch": 7008} {"train_loss": -27.181310653686523, "global_step": 581680, "epoch": 7008} {"train_loss": -27.381778717041016, "global_step": 581681, "epoch": 7008} {"train_loss": -27.416540145874023, "global_step": 581682, "epoch": 7008} {"train_loss": -27.947738647460938, "global_step": 581683, "epoch": 7008} {"train_loss": -27.742101669311523, "global_step": 581684, "epoch": 7008} {"train_loss": -28.02802085876465, "global_step": 581685, "epoch": 7008} {"train_loss": -27.75923728942871, "global_step": 581686, "epoch": 7008} {"train_loss": -27.96884536743164, "global_step": 581687, "epoch": 7008} {"train_loss": -27.429365158081055, "global_step": 581688, "epoch": 7008} {"train_loss": -27.625757217407227, "global_step": 581689, "epoch": 7008} {"train_loss": -27.737234115600586, "global_step": 581690, "epoch": 7008} {"train_loss": -27.535083770751953, "global_step": 581691, "epoch": 7008} {"train_loss": -27.39544677734375, "global_step": 581692, "epoch": 7008} {"train_loss": -28.085983276367188, "global_step": 581693, "epoch": 7008} {"train_loss": -28.255701065063477, "global_step": 581694, "epoch": 7008} {"train_loss": -27.780790328979492, "global_step": 581695, "epoch": 7008} {"train_loss": -27.85261344909668, "global_step": 581696, "epoch": 7008} {"train_loss": -27.684011459350586, "global_step": 581697, "epoch": 7008} {"train_loss": -27.790639877319336, "global_step": 581698, "epoch": 7008} {"train_loss": -28.02851676940918, "global_step": 581699, "epoch": 7008} {"train_loss": -27.88142204284668, "global_step": 581700, "epoch": 7008} {"train_loss": -27.92459487915039, "global_step": 581701, "epoch": 7008} {"train_loss": -28.111194610595703, "global_step": 581702, "epoch": 7008} {"train_loss": -28.049762725830078, "global_step": 581703, "epoch": 7008} {"train_loss": -28.16305923461914, "global_step": 581704, "epoch": 7008} {"train_loss": -27.869230270385742, "global_step": 581705, "epoch": 7008} {"train_loss": -28.06135368347168, "global_step": 581706, "epoch": 7008} {"train_loss": -28.04972267150879, "global_step": 581707, "epoch": 7008} {"train_loss": -27.588266372680664, "global_step": 581708, "epoch": 7008} {"train_loss": -28.039901733398438, "global_step": 581709, "epoch": 7008} {"train_loss": -27.69179344177246, "global_step": 581710, "epoch": 7008} {"train_loss": -27.981403350830078, "global_step": 581711, "epoch": 7008} {"train_loss": -27.864105224609375, "global_step": 581712, "epoch": 7008} {"train_loss": -28.11980628967285, "global_step": 581713, "epoch": 7008} {"train_loss": -28.354801177978516, "global_step": 581714, "epoch": 7008} {"train_loss": -27.95647621154785, "global_step": 581715, "epoch": 7008} {"train_loss": -28.225107192993164, "global_step": 581716, "epoch": 7008} {"train_loss": -27.7666072845459, "global_step": 581717, "epoch": 7008} {"train_loss": -27.4943904876709, "global_step": 581718, "epoch": 7008} {"train_loss": -27.852277755737305, "global_step": 581719, "epoch": 7008} {"train_loss": -28.154071807861328, "global_step": 581720, "epoch": 7008} {"train_loss": -28.021360397338867, "global_step": 581721, "epoch": 7008} {"train_loss": -27.787866592407227, "global_step": 581722, "epoch": 7008} {"train_loss": -27.37093162536621, "global_step": 581723, "epoch": 7008} {"train_loss": -27.462778091430664, "global_step": 581724, "epoch": 7008} {"train_loss": -27.40308952331543, "global_step": 581725, "epoch": 7008} {"train_loss": -27.460254669189453, "global_step": 581726, "epoch": 7008} {"train_loss": -28.243900299072266, "global_step": 581727, "epoch": 7008} {"train_loss": -27.439783096313477, "global_step": 581728, "epoch": 7008} {"train_loss": -27.45209312438965, "global_step": 581729, "epoch": 7008} {"train_loss": -27.53729248046875, "global_step": 581730, "epoch": 7008} {"train_loss": -27.97769546508789, "global_step": 581731, "epoch": 7008} {"train_loss": -27.905567169189453, "global_step": 581732, "epoch": 7008} {"train_loss": -27.589929580688477, "global_step": 581733, "epoch": 7008} {"train_loss": -27.632299423217773, "global_step": 581734, "epoch": 7008} {"train_loss": -27.95197868347168, "global_step": 581735, "epoch": 7008} {"train_loss": -27.620187759399414, "global_step": 581736, "epoch": 7008} {"train_loss": -27.519372940063477, "global_step": 581737, "epoch": 7008} {"train_loss": -27.9073429107666, "global_step": 581738, "epoch": 7008} {"train_loss": -27.918212890625, "global_step": 581739, "epoch": 7008} {"train_loss": -27.718713760375977, "global_step": 581740, "epoch": 7008} {"train_loss": -28.3044490814209, "global_step": 581741, "epoch": 7008} {"train_loss": -27.665943145751953, "global_step": 581742, "epoch": 7008} {"train_loss": -27.690195083618164, "global_step": 581743, "epoch": 7008} {"train_loss": -28.116926193237305, "global_step": 581744, "epoch": 7008} {"train_loss": -27.921554565429688, "global_step": 581745, "epoch": 7008} {"train_loss": -27.657062323696643, "global_step": 581746, "epoch": 7008, "val_loss": 6608143.0} {"train_loss": -27.478418350219727, "global_step": 581747, "epoch": 7009} {"train_loss": -27.876087188720703, "global_step": 581748, "epoch": 7009} {"train_loss": -27.0899658203125, "global_step": 581749, "epoch": 7009} {"train_loss": -27.624048233032227, "global_step": 581750, "epoch": 7009} {"train_loss": -28.11124038696289, "global_step": 581751, "epoch": 7009} {"train_loss": -27.86566162109375, "global_step": 581752, "epoch": 7009} {"train_loss": -27.673791885375977, "global_step": 581753, "epoch": 7009} {"train_loss": -27.424158096313477, "global_step": 581754, "epoch": 7009} {"train_loss": -27.724145889282227, "global_step": 581755, "epoch": 7009} {"train_loss": -28.039655685424805, "global_step": 581756, "epoch": 7009} {"train_loss": -27.5233211517334, "global_step": 581757, "epoch": 7009} {"train_loss": -28.029325485229492, "global_step": 581758, "epoch": 7009} {"train_loss": -27.675556182861328, "global_step": 581759, "epoch": 7009} {"train_loss": -27.30402183532715, "global_step": 581760, "epoch": 7009} {"train_loss": -27.643163681030273, "global_step": 581761, "epoch": 7009} {"train_loss": -28.042707443237305, "global_step": 581762, "epoch": 7009} {"train_loss": -28.22603416442871, "global_step": 581763, "epoch": 7009} {"train_loss": -28.11627769470215, "global_step": 581764, "epoch": 7009} {"train_loss": -27.919681549072266, "global_step": 581765, "epoch": 7009} {"train_loss": -28.02012062072754, "global_step": 581766, "epoch": 7009} {"train_loss": -27.71257972717285, "global_step": 581767, "epoch": 7009} {"train_loss": -27.9902286529541, "global_step": 581768, "epoch": 7009} {"train_loss": -28.069324493408203, "global_step": 581769, "epoch": 7009} {"train_loss": -27.645261764526367, "global_step": 581770, "epoch": 7009} {"train_loss": -28.448841094970703, "global_step": 581771, "epoch": 7009} {"train_loss": -27.943546295166016, "global_step": 581772, "epoch": 7009} {"train_loss": -28.312917709350586, "global_step": 581773, "epoch": 7009} {"train_loss": -27.9273681640625, "global_step": 581774, "epoch": 7009} {"train_loss": -27.95856285095215, "global_step": 581775, "epoch": 7009} {"train_loss": -27.9274845123291, "global_step": 581776, "epoch": 7009} {"train_loss": -28.144886016845703, "global_step": 581777, "epoch": 7009} {"train_loss": -28.227100372314453, "global_step": 581778, "epoch": 7009} {"train_loss": -28.13702964782715, "global_step": 581779, "epoch": 7009} {"train_loss": -28.126447677612305, "global_step": 581780, "epoch": 7009} {"train_loss": -28.35711097717285, "global_step": 581781, "epoch": 7009} {"train_loss": -27.800024032592773, "global_step": 581782, "epoch": 7009} {"train_loss": -27.992664337158203, "global_step": 581783, "epoch": 7009} {"train_loss": -28.196481704711914, "global_step": 581784, "epoch": 7009} {"train_loss": -28.11639404296875, "global_step": 581785, "epoch": 7009} {"train_loss": -27.848596572875977, "global_step": 581786, "epoch": 7009} {"train_loss": -28.226987838745117, "global_step": 581787, "epoch": 7009} {"train_loss": -27.87109375, "global_step": 581788, "epoch": 7009} {"train_loss": -28.08845329284668, "global_step": 581789, "epoch": 7009} {"train_loss": -28.0585880279541, "global_step": 581790, "epoch": 7009} {"train_loss": -27.736112594604492, "global_step": 581791, "epoch": 7009} {"train_loss": -27.54776382446289, "global_step": 581792, "epoch": 7009} {"train_loss": -26.98590660095215, "global_step": 581793, "epoch": 7009} {"train_loss": -27.4578857421875, "global_step": 581794, "epoch": 7009} {"train_loss": -27.734731674194336, "global_step": 581795, "epoch": 7009} {"train_loss": -26.933393478393555, "global_step": 581796, "epoch": 7009} {"train_loss": -27.544660568237305, "global_step": 581797, "epoch": 7009} {"train_loss": -27.857086181640625, "global_step": 581798, "epoch": 7009} {"train_loss": -28.017688751220703, "global_step": 581799, "epoch": 7009} {"train_loss": -27.627668380737305, "global_step": 581800, "epoch": 7009} {"train_loss": -27.815702438354492, "global_step": 581801, "epoch": 7009} {"train_loss": -28.10584831237793, "global_step": 581802, "epoch": 7009} {"train_loss": -27.5090389251709, "global_step": 581803, "epoch": 7009} {"train_loss": -27.81544303894043, "global_step": 581804, "epoch": 7009} {"train_loss": -27.732385635375977, "global_step": 581805, "epoch": 7009} {"train_loss": -27.982202529907227, "global_step": 581806, "epoch": 7009} {"train_loss": -27.817138671875, "global_step": 581807, "epoch": 7009} {"train_loss": -27.968780517578125, "global_step": 581808, "epoch": 7009} {"train_loss": -27.740564346313477, "global_step": 581809, "epoch": 7009} {"train_loss": -28.066085815429688, "global_step": 581810, "epoch": 7009} {"train_loss": -27.538070678710938, "global_step": 581811, "epoch": 7009} {"train_loss": -27.922260284423828, "global_step": 581812, "epoch": 7009} {"train_loss": -27.681625366210938, "global_step": 581813, "epoch": 7009} {"train_loss": -27.57122802734375, "global_step": 581814, "epoch": 7009} {"train_loss": -28.16704750061035, "global_step": 581815, "epoch": 7009} {"train_loss": -27.80594825744629, "global_step": 581816, "epoch": 7009} {"train_loss": -27.892541885375977, "global_step": 581817, "epoch": 7009} {"train_loss": -27.94350242614746, "global_step": 581818, "epoch": 7009} {"train_loss": -27.661840438842773, "global_step": 581819, "epoch": 7009} {"train_loss": -27.591299057006836, "global_step": 581820, "epoch": 7009} {"train_loss": -27.896142959594727, "global_step": 581821, "epoch": 7009} {"train_loss": -27.98720359802246, "global_step": 581822, "epoch": 7009} {"train_loss": -27.657733917236328, "global_step": 581823, "epoch": 7009} {"train_loss": -27.990232467651367, "global_step": 581824, "epoch": 7009} {"train_loss": -27.806537628173828, "global_step": 581825, "epoch": 7009} {"train_loss": -28.298681259155273, "global_step": 581826, "epoch": 7009} {"train_loss": -27.90669059753418, "global_step": 581827, "epoch": 7009} {"train_loss": -28.04474449157715, "global_step": 581828, "epoch": 7009} {"train_loss": -27.848246470991388, "global_step": 581829, "epoch": 7009, "val_loss": 6688911.0} {"train_loss": -26.222827911376953, "global_step": 581830, "epoch": 7010} {"train_loss": -26.77985191345215, "global_step": 581831, "epoch": 7010} {"train_loss": -27.08572769165039, "global_step": 581832, "epoch": 7010} {"train_loss": -26.41160011291504, "global_step": 581833, "epoch": 7010} {"train_loss": -26.989370346069336, "global_step": 581834, "epoch": 7010} {"train_loss": -27.423694610595703, "global_step": 581835, "epoch": 7010} {"train_loss": -27.490320205688477, "global_step": 581836, "epoch": 7010} {"train_loss": -27.086790084838867, "global_step": 581837, "epoch": 7010} {"train_loss": -27.727996826171875, "global_step": 581838, "epoch": 7010} {"train_loss": -27.30063247680664, "global_step": 581839, "epoch": 7010} {"train_loss": -27.3797607421875, "global_step": 581840, "epoch": 7010} {"train_loss": -27.34356117248535, "global_step": 581841, "epoch": 7010} {"train_loss": -27.194067001342773, "global_step": 581842, "epoch": 7010} {"train_loss": -27.713361740112305, "global_step": 581843, "epoch": 7010} {"train_loss": -27.31424331665039, "global_step": 581844, "epoch": 7010} {"train_loss": -27.47174644470215, "global_step": 581845, "epoch": 7010} {"train_loss": -27.263916015625, "global_step": 581846, "epoch": 7010} {"train_loss": -27.940296173095703, "global_step": 581847, "epoch": 7010} {"train_loss": -27.49445915222168, "global_step": 581848, "epoch": 7010} {"train_loss": -27.6263484954834, "global_step": 581849, "epoch": 7010} {"train_loss": -27.724756240844727, "global_step": 581850, "epoch": 7010} {"train_loss": -27.6340274810791, "global_step": 581851, "epoch": 7010} {"train_loss": -27.349689483642578, "global_step": 581852, "epoch": 7010} {"train_loss": -27.93450355529785, "global_step": 581853, "epoch": 7010} {"train_loss": -27.28968620300293, "global_step": 581854, "epoch": 7010} {"train_loss": -27.730316162109375, "global_step": 581855, "epoch": 7010} {"train_loss": -27.584646224975586, "global_step": 581856, "epoch": 7010} {"train_loss": -27.708845138549805, "global_step": 581857, "epoch": 7010} {"train_loss": -27.675384521484375, "global_step": 581858, "epoch": 7010} {"train_loss": -27.7126522064209, "global_step": 581859, "epoch": 7010} {"train_loss": -27.690290451049805, "global_step": 581860, "epoch": 7010} {"train_loss": -27.82611083984375, "global_step": 581861, "epoch": 7010} {"train_loss": -27.568607330322266, "global_step": 581862, "epoch": 7010} {"train_loss": -27.749414443969727, "global_step": 581863, "epoch": 7010} {"train_loss": -27.8245792388916, "global_step": 581864, "epoch": 7010} {"train_loss": -27.474897384643555, "global_step": 581865, "epoch": 7010} {"train_loss": -28.166126251220703, "global_step": 581866, "epoch": 7010} {"train_loss": -28.151636123657227, "global_step": 581867, "epoch": 7010} {"train_loss": -28.070465087890625, "global_step": 581868, "epoch": 7010} {"train_loss": -27.874414443969727, "global_step": 581869, "epoch": 7010} {"train_loss": -28.364398956298828, "global_step": 581870, "epoch": 7010} {"train_loss": -27.85572624206543, "global_step": 581871, "epoch": 7010} {"train_loss": -27.95185661315918, "global_step": 581872, "epoch": 7010} {"train_loss": -27.669950485229492, "global_step": 581873, "epoch": 7010} {"train_loss": -28.2298583984375, "global_step": 581874, "epoch": 7010} {"train_loss": -28.321533203125, "global_step": 581875, "epoch": 7010} {"train_loss": -28.17569923400879, "global_step": 581876, "epoch": 7010} {"train_loss": -28.391748428344727, "global_step": 581877, "epoch": 7010} {"train_loss": -27.885610580444336, "global_step": 581878, "epoch": 7010} {"train_loss": -28.11134910583496, "global_step": 581879, "epoch": 7010} {"train_loss": -27.763647079467773, "global_step": 581880, "epoch": 7010} {"train_loss": -28.06440544128418, "global_step": 581881, "epoch": 7010} {"train_loss": -28.059553146362305, "global_step": 581882, "epoch": 7010} {"train_loss": -27.947315216064453, "global_step": 581883, "epoch": 7010} {"train_loss": -28.153329849243164, "global_step": 581884, "epoch": 7010} {"train_loss": -28.517959594726562, "global_step": 581885, "epoch": 7010} {"train_loss": -27.92841148376465, "global_step": 581886, "epoch": 7010} {"train_loss": -27.819965362548828, "global_step": 581887, "epoch": 7010} {"train_loss": -27.87171745300293, "global_step": 581888, "epoch": 7010} {"train_loss": -27.84662437438965, "global_step": 581889, "epoch": 7010} {"train_loss": -28.089746475219727, "global_step": 581890, "epoch": 7010} {"train_loss": -28.245166778564453, "global_step": 581891, "epoch": 7010} {"train_loss": -28.005630493164062, "global_step": 581892, "epoch": 7010} {"train_loss": -28.054800033569336, "global_step": 581893, "epoch": 7010} {"train_loss": -28.06939697265625, "global_step": 581894, "epoch": 7010} {"train_loss": -28.402008056640625, "global_step": 581895, "epoch": 7010} {"train_loss": -28.132373809814453, "global_step": 581896, "epoch": 7010} {"train_loss": -27.70197868347168, "global_step": 581897, "epoch": 7010} {"train_loss": -28.171289443969727, "global_step": 581898, "epoch": 7010} {"train_loss": -27.96805191040039, "global_step": 581899, "epoch": 7010} {"train_loss": -28.0565185546875, "global_step": 581900, "epoch": 7010} {"train_loss": -28.16451072692871, "global_step": 581901, "epoch": 7010} {"train_loss": -27.877103805541992, "global_step": 581902, "epoch": 7010} {"train_loss": -28.038681030273438, "global_step": 581903, "epoch": 7010} {"train_loss": -28.143024444580078, "global_step": 581904, "epoch": 7010} {"train_loss": -27.73151969909668, "global_step": 581905, "epoch": 7010} {"train_loss": -27.95460319519043, "global_step": 581906, "epoch": 7010} {"train_loss": -28.123077392578125, "global_step": 581907, "epoch": 7010} {"train_loss": -28.416065216064453, "global_step": 581908, "epoch": 7010} {"train_loss": -27.900333404541016, "global_step": 581909, "epoch": 7010} {"train_loss": -28.00177001953125, "global_step": 581910, "epoch": 7010} {"train_loss": -27.82742691040039, "global_step": 581911, "epoch": 7010} {"train_loss": -27.79181011613593, "global_step": 581912, "epoch": 7010, "val_loss": 6576432.5} {"train_loss": -27.4024715423584, "global_step": 581913, "epoch": 7011} {"train_loss": -26.822586059570312, "global_step": 581914, "epoch": 7011} {"train_loss": -26.99016761779785, "global_step": 581915, "epoch": 7011} {"train_loss": -27.3026123046875, "global_step": 581916, "epoch": 7011} {"train_loss": -27.207944869995117, "global_step": 581917, "epoch": 7011} {"train_loss": -27.174243927001953, "global_step": 581918, "epoch": 7011} {"train_loss": -27.233957290649414, "global_step": 581919, "epoch": 7011} {"train_loss": -27.081424713134766, "global_step": 581920, "epoch": 7011} {"train_loss": -27.903717041015625, "global_step": 581921, "epoch": 7011} {"train_loss": -26.60004997253418, "global_step": 581922, "epoch": 7011} {"train_loss": -26.78676414489746, "global_step": 581923, "epoch": 7011} {"train_loss": -26.417236328125, "global_step": 581924, "epoch": 7011} {"train_loss": -27.654773712158203, "global_step": 581925, "epoch": 7011} {"train_loss": -26.897993087768555, "global_step": 581926, "epoch": 7011} {"train_loss": -27.566614151000977, "global_step": 581927, "epoch": 7011} {"train_loss": -26.4959716796875, "global_step": 581928, "epoch": 7011} {"train_loss": -27.094696044921875, "global_step": 581929, "epoch": 7011} {"train_loss": -27.547119140625, "global_step": 581930, "epoch": 7011} {"train_loss": -27.612741470336914, "global_step": 581931, "epoch": 7011} {"train_loss": -27.566354751586914, "global_step": 581932, "epoch": 7011} {"train_loss": -27.116992950439453, "global_step": 581933, "epoch": 7011} {"train_loss": -27.250873565673828, "global_step": 581934, "epoch": 7011} {"train_loss": -27.57575035095215, "global_step": 581935, "epoch": 7011} {"train_loss": -27.245849609375, "global_step": 581936, "epoch": 7011} {"train_loss": -27.784042358398438, "global_step": 581937, "epoch": 7011} {"train_loss": -27.311017990112305, "global_step": 581938, "epoch": 7011} {"train_loss": -27.901865005493164, "global_step": 581939, "epoch": 7011} {"train_loss": -27.771970748901367, "global_step": 581940, "epoch": 7011} {"train_loss": -28.203277587890625, "global_step": 581941, "epoch": 7011} {"train_loss": -27.78838539123535, "global_step": 581942, "epoch": 7011} {"train_loss": -27.71101188659668, "global_step": 581943, "epoch": 7011} {"train_loss": -27.95528221130371, "global_step": 581944, "epoch": 7011} {"train_loss": -27.48958396911621, "global_step": 581945, "epoch": 7011} {"train_loss": -27.971418380737305, "global_step": 581946, "epoch": 7011} {"train_loss": -27.87002944946289, "global_step": 581947, "epoch": 7011} {"train_loss": -27.84136390686035, "global_step": 581948, "epoch": 7011} {"train_loss": -27.8380126953125, "global_step": 581949, "epoch": 7011} {"train_loss": -27.913827896118164, "global_step": 581950, "epoch": 7011} {"train_loss": -27.850976943969727, "global_step": 581951, "epoch": 7011} {"train_loss": -28.11570167541504, "global_step": 581952, "epoch": 7011} {"train_loss": -28.2947998046875, "global_step": 581953, "epoch": 7011} {"train_loss": -28.15711784362793, "global_step": 581954, "epoch": 7011} {"train_loss": -28.055896759033203, "global_step": 581955, "epoch": 7011} {"train_loss": -27.713247299194336, "global_step": 581956, "epoch": 7011} {"train_loss": -28.063745498657227, "global_step": 581957, "epoch": 7011} {"train_loss": -28.599740982055664, "global_step": 581958, "epoch": 7011} {"train_loss": -27.812946319580078, "global_step": 581959, "epoch": 7011} {"train_loss": -27.991079330444336, "global_step": 581960, "epoch": 7011} {"train_loss": -27.993122100830078, "global_step": 581961, "epoch": 7011} {"train_loss": -27.964319229125977, "global_step": 581962, "epoch": 7011} {"train_loss": -28.129941940307617, "global_step": 581963, "epoch": 7011} {"train_loss": -28.379566192626953, "global_step": 581964, "epoch": 7011} {"train_loss": -27.709253311157227, "global_step": 581965, "epoch": 7011} {"train_loss": -28.02313232421875, "global_step": 581966, "epoch": 7011} {"train_loss": -28.050384521484375, "global_step": 581967, "epoch": 7011} {"train_loss": -28.017780303955078, "global_step": 581968, "epoch": 7011} {"train_loss": -28.077245712280273, "global_step": 581969, "epoch": 7011} {"train_loss": -28.428817749023438, "global_step": 581970, "epoch": 7011} {"train_loss": -28.0516414642334, "global_step": 581971, "epoch": 7011} {"train_loss": -27.817243576049805, "global_step": 581972, "epoch": 7011} {"train_loss": -28.130615234375, "global_step": 581973, "epoch": 7011} {"train_loss": -28.331296920776367, "global_step": 581974, "epoch": 7011} {"train_loss": -28.18387222290039, "global_step": 581975, "epoch": 7011} {"train_loss": -27.79762077331543, "global_step": 581976, "epoch": 7011} {"train_loss": -27.71107292175293, "global_step": 581977, "epoch": 7011} {"train_loss": -27.023447036743164, "global_step": 581978, "epoch": 7011} {"train_loss": -27.661420822143555, "global_step": 581979, "epoch": 7011} {"train_loss": -28.0352783203125, "global_step": 581980, "epoch": 7011} {"train_loss": -27.93931007385254, "global_step": 581981, "epoch": 7011} {"train_loss": -27.992786407470703, "global_step": 581982, "epoch": 7011} {"train_loss": -27.87470817565918, "global_step": 581983, "epoch": 7011} {"train_loss": -27.229333877563477, "global_step": 581984, "epoch": 7011} {"train_loss": -27.77994155883789, "global_step": 581985, "epoch": 7011} {"train_loss": -28.016876220703125, "global_step": 581986, "epoch": 7011} {"train_loss": -27.94317626953125, "global_step": 581987, "epoch": 7011} {"train_loss": -28.1575984954834, "global_step": 581988, "epoch": 7011} {"train_loss": -27.971059799194336, "global_step": 581989, "epoch": 7011} {"train_loss": -27.639230728149414, "global_step": 581990, "epoch": 7011} {"train_loss": -27.535114288330078, "global_step": 581991, "epoch": 7011} {"train_loss": -27.599157333374023, "global_step": 581992, "epoch": 7011} {"train_loss": -27.992053985595703, "global_step": 581993, "epoch": 7011} {"train_loss": -27.66521644592285, "global_step": 581994, "epoch": 7011} {"train_loss": -27.688193194837456, "global_step": 581995, "epoch": 7011, "val_loss": 6617345.0} {"train_loss": -26.739643096923828, "global_step": 581996, "epoch": 7012} {"train_loss": -26.997228622436523, "global_step": 581997, "epoch": 7012} {"train_loss": -27.344160079956055, "global_step": 581998, "epoch": 7012} {"train_loss": -27.245214462280273, "global_step": 581999, "epoch": 7012} {"train_loss": -27.597227096557617, "global_step": 582000, "epoch": 7012} {"train_loss": -27.3570499420166, "global_step": 582001, "epoch": 7012} {"train_loss": -27.122846603393555, "global_step": 582002, "epoch": 7012} {"train_loss": -28.05470848083496, "global_step": 582003, "epoch": 7012} {"train_loss": -27.382612228393555, "global_step": 582004, "epoch": 7012} {"train_loss": -28.1590576171875, "global_step": 582005, "epoch": 7012} {"train_loss": -27.586780548095703, "global_step": 582006, "epoch": 7012} {"train_loss": -27.515268325805664, "global_step": 582007, "epoch": 7012} {"train_loss": -28.326034545898438, "global_step": 582008, "epoch": 7012} {"train_loss": -27.889652252197266, "global_step": 582009, "epoch": 7012} {"train_loss": -28.214813232421875, "global_step": 582010, "epoch": 7012} {"train_loss": -27.520132064819336, "global_step": 582011, "epoch": 7012} {"train_loss": -27.84981346130371, "global_step": 582012, "epoch": 7012} {"train_loss": -27.77692985534668, "global_step": 582013, "epoch": 7012} {"train_loss": -27.801868438720703, "global_step": 582014, "epoch": 7012} {"train_loss": -27.69761085510254, "global_step": 582015, "epoch": 7012} {"train_loss": -27.806859970092773, "global_step": 582016, "epoch": 7012} {"train_loss": -27.836044311523438, "global_step": 582017, "epoch": 7012} {"train_loss": -27.967435836791992, "global_step": 582018, "epoch": 7012} {"train_loss": -27.57402992248535, "global_step": 582019, "epoch": 7012} {"train_loss": -27.5285701751709, "global_step": 582020, "epoch": 7012} {"train_loss": -27.848119735717773, "global_step": 582021, "epoch": 7012} {"train_loss": -27.547834396362305, "global_step": 582022, "epoch": 7012} {"train_loss": -28.08614158630371, "global_step": 582023, "epoch": 7012} {"train_loss": -28.08406639099121, "global_step": 582024, "epoch": 7012} {"train_loss": -28.067819595336914, "global_step": 582025, "epoch": 7012} {"train_loss": -27.955947875976562, "global_step": 582026, "epoch": 7012} {"train_loss": -27.937255859375, "global_step": 582027, "epoch": 7012} {"train_loss": -28.330921173095703, "global_step": 582028, "epoch": 7012} {"train_loss": -28.5787296295166, "global_step": 582029, "epoch": 7012} {"train_loss": -28.146345138549805, "global_step": 582030, "epoch": 7012} {"train_loss": -28.18995475769043, "global_step": 582031, "epoch": 7012} {"train_loss": -28.17282485961914, "global_step": 582032, "epoch": 7012} {"train_loss": -28.02191734313965, "global_step": 582033, "epoch": 7012} {"train_loss": -28.18218421936035, "global_step": 582034, "epoch": 7012} {"train_loss": -27.910207748413086, "global_step": 582035, "epoch": 7012} {"train_loss": -28.39507484436035, "global_step": 582036, "epoch": 7012} {"train_loss": -28.1881103515625, "global_step": 582037, "epoch": 7012} {"train_loss": -28.051740646362305, "global_step": 582038, "epoch": 7012} {"train_loss": -28.13944435119629, "global_step": 582039, "epoch": 7012} {"train_loss": -28.304975509643555, "global_step": 582040, "epoch": 7012} {"train_loss": -28.3035831451416, "global_step": 582041, "epoch": 7012} {"train_loss": -28.4879093170166, "global_step": 582042, "epoch": 7012} {"train_loss": -28.073566436767578, "global_step": 582043, "epoch": 7012} {"train_loss": -27.864957809448242, "global_step": 582044, "epoch": 7012} {"train_loss": -27.652448654174805, "global_step": 582045, "epoch": 7012} {"train_loss": -27.988983154296875, "global_step": 582046, "epoch": 7012} {"train_loss": -27.984777450561523, "global_step": 582047, "epoch": 7012} {"train_loss": -27.938169479370117, "global_step": 582048, "epoch": 7012} {"train_loss": -27.655303955078125, "global_step": 582049, "epoch": 7012} {"train_loss": -27.80440330505371, "global_step": 582050, "epoch": 7012} {"train_loss": -27.85194969177246, "global_step": 582051, "epoch": 7012} {"train_loss": -27.996225357055664, "global_step": 582052, "epoch": 7012} {"train_loss": -28.2808837890625, "global_step": 582053, "epoch": 7012} {"train_loss": -28.120847702026367, "global_step": 582054, "epoch": 7012} {"train_loss": -27.774490356445312, "global_step": 582055, "epoch": 7012} {"train_loss": -28.155221939086914, "global_step": 582056, "epoch": 7012} {"train_loss": -27.997817993164062, "global_step": 582057, "epoch": 7012} {"train_loss": -28.079410552978516, "global_step": 582058, "epoch": 7012} {"train_loss": -27.839025497436523, "global_step": 582059, "epoch": 7012} {"train_loss": -27.830102920532227, "global_step": 582060, "epoch": 7012} {"train_loss": -27.920881271362305, "global_step": 582061, "epoch": 7012} {"train_loss": -28.242755889892578, "global_step": 582062, "epoch": 7012} {"train_loss": -27.92310905456543, "global_step": 582063, "epoch": 7012} {"train_loss": -28.090768814086914, "global_step": 582064, "epoch": 7012} {"train_loss": -28.06182861328125, "global_step": 582065, "epoch": 7012} {"train_loss": -28.22090721130371, "global_step": 582066, "epoch": 7012} {"train_loss": -28.03188133239746, "global_step": 582067, "epoch": 7012} {"train_loss": -28.26778221130371, "global_step": 582068, "epoch": 7012} {"train_loss": -28.28767204284668, "global_step": 582069, "epoch": 7012} {"train_loss": -28.205249786376953, "global_step": 582070, "epoch": 7012} {"train_loss": -28.169958114624023, "global_step": 582071, "epoch": 7012} {"train_loss": -28.31436538696289, "global_step": 582072, "epoch": 7012} {"train_loss": -28.21771240234375, "global_step": 582073, "epoch": 7012} {"train_loss": -28.01498794555664, "global_step": 582074, "epoch": 7012} {"train_loss": -27.855640411376953, "global_step": 582075, "epoch": 7012} {"train_loss": -28.12223243713379, "global_step": 582076, "epoch": 7012} {"train_loss": -27.825048446655273, "global_step": 582077, "epoch": 7012} {"train_loss": -27.92749464655497, "global_step": 582078, "epoch": 7012, "val_loss": 6539186.0} {"train_loss": -25.6695556640625, "global_step": 582079, "epoch": 7013} {"train_loss": -23.250858306884766, "global_step": 582080, "epoch": 7013} {"train_loss": -21.809141159057617, "global_step": 582081, "epoch": 7013} {"train_loss": -26.739126205444336, "global_step": 582082, "epoch": 7013} {"train_loss": -24.45555877685547, "global_step": 582083, "epoch": 7013} {"train_loss": -26.378217697143555, "global_step": 582084, "epoch": 7013} {"train_loss": -25.105558395385742, "global_step": 582085, "epoch": 7013} {"train_loss": -26.999303817749023, "global_step": 582086, "epoch": 7013} {"train_loss": -26.41693115234375, "global_step": 582087, "epoch": 7013} {"train_loss": -26.587125778198242, "global_step": 582088, "epoch": 7013} {"train_loss": -26.653608322143555, "global_step": 582089, "epoch": 7013} {"train_loss": -26.57590103149414, "global_step": 582090, "epoch": 7013} {"train_loss": -26.526519775390625, "global_step": 582091, "epoch": 7013} {"train_loss": -26.59307861328125, "global_step": 582092, "epoch": 7013} {"train_loss": -27.314794540405273, "global_step": 582093, "epoch": 7013} {"train_loss": -25.99704933166504, "global_step": 582094, "epoch": 7013} {"train_loss": -26.777713775634766, "global_step": 582095, "epoch": 7013} {"train_loss": -26.834766387939453, "global_step": 582096, "epoch": 7013} {"train_loss": -27.1960391998291, "global_step": 582097, "epoch": 7013} {"train_loss": -26.862524032592773, "global_step": 582098, "epoch": 7013} {"train_loss": -27.40043067932129, "global_step": 582099, "epoch": 7013} {"train_loss": -27.040876388549805, "global_step": 582100, "epoch": 7013} {"train_loss": -27.149200439453125, "global_step": 582101, "epoch": 7013} {"train_loss": -27.12530517578125, "global_step": 582102, "epoch": 7013} {"train_loss": -27.05048179626465, "global_step": 582103, "epoch": 7013} {"train_loss": -27.642261505126953, "global_step": 582104, "epoch": 7013} {"train_loss": -27.009445190429688, "global_step": 582105, "epoch": 7013} {"train_loss": -27.188602447509766, "global_step": 582106, "epoch": 7013} {"train_loss": -27.533905029296875, "global_step": 582107, "epoch": 7013} {"train_loss": -27.41204261779785, "global_step": 582108, "epoch": 7013} {"train_loss": -27.179418563842773, "global_step": 582109, "epoch": 7013} {"train_loss": -27.180688858032227, "global_step": 582110, "epoch": 7013} {"train_loss": -27.290796279907227, "global_step": 582111, "epoch": 7013} {"train_loss": -27.31715202331543, "global_step": 582112, "epoch": 7013} {"train_loss": -27.431116104125977, "global_step": 582113, "epoch": 7013} {"train_loss": -27.371423721313477, "global_step": 582114, "epoch": 7013} {"train_loss": -27.2669620513916, "global_step": 582115, "epoch": 7013} {"train_loss": -27.64823341369629, "global_step": 582116, "epoch": 7013} {"train_loss": -27.5925350189209, "global_step": 582117, "epoch": 7013} {"train_loss": -27.33186149597168, "global_step": 582118, "epoch": 7013} {"train_loss": -27.77888298034668, "global_step": 582119, "epoch": 7013} {"train_loss": -27.66144371032715, "global_step": 582120, "epoch": 7013} {"train_loss": -27.511768341064453, "global_step": 582121, "epoch": 7013} {"train_loss": -27.9600772857666, "global_step": 582122, "epoch": 7013} {"train_loss": -27.84025001525879, "global_step": 582123, "epoch": 7013} {"train_loss": -27.544424057006836, "global_step": 582124, "epoch": 7013} {"train_loss": -27.405517578125, "global_step": 582125, "epoch": 7013} {"train_loss": -27.588293075561523, "global_step": 582126, "epoch": 7013} {"train_loss": -27.565479278564453, "global_step": 582127, "epoch": 7013} {"train_loss": -28.20123863220215, "global_step": 582128, "epoch": 7013} {"train_loss": -28.038110733032227, "global_step": 582129, "epoch": 7013} {"train_loss": -27.944202423095703, "global_step": 582130, "epoch": 7013} {"train_loss": -27.72774314880371, "global_step": 582131, "epoch": 7013} {"train_loss": -27.789600372314453, "global_step": 582132, "epoch": 7013} {"train_loss": -27.873254776000977, "global_step": 582133, "epoch": 7013} {"train_loss": -27.810169219970703, "global_step": 582134, "epoch": 7013} {"train_loss": -27.9771785736084, "global_step": 582135, "epoch": 7013} {"train_loss": -27.734037399291992, "global_step": 582136, "epoch": 7013} {"train_loss": -27.713403701782227, "global_step": 582137, "epoch": 7013} {"train_loss": -28.22614860534668, "global_step": 582138, "epoch": 7013} {"train_loss": -27.638254165649414, "global_step": 582139, "epoch": 7013} {"train_loss": -27.89837646484375, "global_step": 582140, "epoch": 7013} {"train_loss": -27.817590713500977, "global_step": 582141, "epoch": 7013} {"train_loss": -28.23001480102539, "global_step": 582142, "epoch": 7013} {"train_loss": -28.023548126220703, "global_step": 582143, "epoch": 7013} {"train_loss": -27.9960994720459, "global_step": 582144, "epoch": 7013} {"train_loss": -27.783615112304688, "global_step": 582145, "epoch": 7013} {"train_loss": -28.17767333984375, "global_step": 582146, "epoch": 7013} {"train_loss": -28.145111083984375, "global_step": 582147, "epoch": 7013} {"train_loss": -27.7705078125, "global_step": 582148, "epoch": 7013} {"train_loss": -28.160924911499023, "global_step": 582149, "epoch": 7013} {"train_loss": -27.780838012695312, "global_step": 582150, "epoch": 7013} {"train_loss": -27.754575729370117, "global_step": 582151, "epoch": 7013} {"train_loss": -27.949743270874023, "global_step": 582152, "epoch": 7013} {"train_loss": -27.85358238220215, "global_step": 582153, "epoch": 7013} {"train_loss": -27.821430206298828, "global_step": 582154, "epoch": 7013} {"train_loss": -28.064624786376953, "global_step": 582155, "epoch": 7013} {"train_loss": -28.205413818359375, "global_step": 582156, "epoch": 7013} {"train_loss": -27.9117431640625, "global_step": 582157, "epoch": 7013} {"train_loss": -27.902494430541992, "global_step": 582158, "epoch": 7013} {"train_loss": -27.756567001342773, "global_step": 582159, "epoch": 7013} {"train_loss": -27.401681900024414, "global_step": 582160, "epoch": 7013} {"train_loss": -27.300548070884613, "global_step": 582161, "epoch": 7013, "val_loss": 6591901.0} {"train_loss": -27.2996768951416, "global_step": 582162, "epoch": 7014} {"train_loss": -26.42030143737793, "global_step": 582163, "epoch": 7014} {"train_loss": -26.255796432495117, "global_step": 582164, "epoch": 7014} {"train_loss": -26.736127853393555, "global_step": 582165, "epoch": 7014} {"train_loss": -26.786605834960938, "global_step": 582166, "epoch": 7014} {"train_loss": -26.4519100189209, "global_step": 582167, "epoch": 7014} {"train_loss": -26.972370147705078, "global_step": 582168, "epoch": 7014} {"train_loss": -26.71649742126465, "global_step": 582169, "epoch": 7014} {"train_loss": -26.94404411315918, "global_step": 582170, "epoch": 7014} {"train_loss": -26.961400985717773, "global_step": 582171, "epoch": 7014} {"train_loss": -27.800811767578125, "global_step": 582172, "epoch": 7014} {"train_loss": -27.2329044342041, "global_step": 582173, "epoch": 7014} {"train_loss": -27.593210220336914, "global_step": 582174, "epoch": 7014} {"train_loss": -27.189096450805664, "global_step": 582175, "epoch": 7014} {"train_loss": -27.287799835205078, "global_step": 582176, "epoch": 7014} {"train_loss": -27.16851806640625, "global_step": 582177, "epoch": 7014} {"train_loss": -27.161075592041016, "global_step": 582178, "epoch": 7014} {"train_loss": -27.349851608276367, "global_step": 582179, "epoch": 7014} {"train_loss": -27.453384399414062, "global_step": 582180, "epoch": 7014} {"train_loss": -27.721393585205078, "global_step": 582181, "epoch": 7014} {"train_loss": -27.538055419921875, "global_step": 582182, "epoch": 7014} {"train_loss": -27.56458854675293, "global_step": 582183, "epoch": 7014} {"train_loss": -27.35346794128418, "global_step": 582184, "epoch": 7014} {"train_loss": -27.61565589904785, "global_step": 582185, "epoch": 7014} {"train_loss": -27.66887855529785, "global_step": 582186, "epoch": 7014} {"train_loss": -27.06290626525879, "global_step": 582187, "epoch": 7014} {"train_loss": -27.665441513061523, "global_step": 582188, "epoch": 7014} {"train_loss": -27.489999771118164, "global_step": 582189, "epoch": 7014} {"train_loss": -27.71099281311035, "global_step": 582190, "epoch": 7014} {"train_loss": -27.982812881469727, "global_step": 582191, "epoch": 7014} {"train_loss": -27.76519203186035, "global_step": 582192, "epoch": 7014} {"train_loss": -27.916532516479492, "global_step": 582193, "epoch": 7014} {"train_loss": -27.61359977722168, "global_step": 582194, "epoch": 7014} {"train_loss": -27.9720458984375, "global_step": 582195, "epoch": 7014} {"train_loss": -27.560821533203125, "global_step": 582196, "epoch": 7014} {"train_loss": -28.191137313842773, "global_step": 582197, "epoch": 7014} {"train_loss": -27.977493286132812, "global_step": 582198, "epoch": 7014} {"train_loss": -28.042688369750977, "global_step": 582199, "epoch": 7014} {"train_loss": -27.913070678710938, "global_step": 582200, "epoch": 7014} {"train_loss": -28.19496726989746, "global_step": 582201, "epoch": 7014} {"train_loss": -27.883865356445312, "global_step": 582202, "epoch": 7014} {"train_loss": -28.15240478515625, "global_step": 582203, "epoch": 7014} {"train_loss": -28.18071937561035, "global_step": 582204, "epoch": 7014} {"train_loss": -27.704381942749023, "global_step": 582205, "epoch": 7014} {"train_loss": -28.219970703125, "global_step": 582206, "epoch": 7014} {"train_loss": -27.971145629882812, "global_step": 582207, "epoch": 7014} {"train_loss": -28.1718692779541, "global_step": 582208, "epoch": 7014} {"train_loss": -27.84507179260254, "global_step": 582209, "epoch": 7014} {"train_loss": -27.730716705322266, "global_step": 582210, "epoch": 7014} {"train_loss": -28.009357452392578, "global_step": 582211, "epoch": 7014} {"train_loss": -28.397085189819336, "global_step": 582212, "epoch": 7014} {"train_loss": -28.10139274597168, "global_step": 582213, "epoch": 7014} {"train_loss": -28.19451332092285, "global_step": 582214, "epoch": 7014} {"train_loss": -28.157882690429688, "global_step": 582215, "epoch": 7014} {"train_loss": -28.052997589111328, "global_step": 582216, "epoch": 7014} {"train_loss": -27.90911293029785, "global_step": 582217, "epoch": 7014} {"train_loss": -27.963266372680664, "global_step": 582218, "epoch": 7014} {"train_loss": -27.943313598632812, "global_step": 582219, "epoch": 7014} {"train_loss": -28.178049087524414, "global_step": 582220, "epoch": 7014} {"train_loss": -28.258398056030273, "global_step": 582221, "epoch": 7014} {"train_loss": -28.130361557006836, "global_step": 582222, "epoch": 7014} {"train_loss": -28.14214515686035, "global_step": 582223, "epoch": 7014} {"train_loss": -27.59662437438965, "global_step": 582224, "epoch": 7014} {"train_loss": -28.17085075378418, "global_step": 582225, "epoch": 7014} {"train_loss": -28.464221954345703, "global_step": 582226, "epoch": 7014} {"train_loss": -27.990341186523438, "global_step": 582227, "epoch": 7014} {"train_loss": -27.7455997467041, "global_step": 582228, "epoch": 7014} {"train_loss": -27.538482666015625, "global_step": 582229, "epoch": 7014} {"train_loss": -27.586328506469727, "global_step": 582230, "epoch": 7014} {"train_loss": -28.0394344329834, "global_step": 582231, "epoch": 7014} {"train_loss": -27.93861198425293, "global_step": 582232, "epoch": 7014} {"train_loss": -28.178878784179688, "global_step": 582233, "epoch": 7014} {"train_loss": -28.099475860595703, "global_step": 582234, "epoch": 7014} {"train_loss": -27.76704978942871, "global_step": 582235, "epoch": 7014} {"train_loss": -28.056421279907227, "global_step": 582236, "epoch": 7014} {"train_loss": -27.991012573242188, "global_step": 582237, "epoch": 7014} {"train_loss": -27.872953414916992, "global_step": 582238, "epoch": 7014} {"train_loss": -27.91269302368164, "global_step": 582239, "epoch": 7014} {"train_loss": -27.92548942565918, "global_step": 582240, "epoch": 7014} {"train_loss": -28.05323600769043, "global_step": 582241, "epoch": 7014} {"train_loss": -27.597314834594727, "global_step": 582242, "epoch": 7014} {"train_loss": -27.9908504486084, "global_step": 582243, "epoch": 7014} {"train_loss": -27.711974500173547, "global_step": 582244, "epoch": 7014, "val_loss": 6507149.0} {"train_loss": -27.438405990600586, "global_step": 582245, "epoch": 7015} {"train_loss": -27.066864013671875, "global_step": 582246, "epoch": 7015} {"train_loss": -26.85138511657715, "global_step": 582247, "epoch": 7015} {"train_loss": -27.051183700561523, "global_step": 582248, "epoch": 7015} {"train_loss": -27.393436431884766, "global_step": 582249, "epoch": 7015} {"train_loss": -27.2147274017334, "global_step": 582250, "epoch": 7015} {"train_loss": -27.05433464050293, "global_step": 582251, "epoch": 7015} {"train_loss": -27.509967803955078, "global_step": 582252, "epoch": 7015} {"train_loss": -27.47455406188965, "global_step": 582253, "epoch": 7015} {"train_loss": -27.689075469970703, "global_step": 582254, "epoch": 7015} {"train_loss": -27.58099365234375, "global_step": 582255, "epoch": 7015} {"train_loss": -27.59902000427246, "global_step": 582256, "epoch": 7015} {"train_loss": -27.596731185913086, "global_step": 582257, "epoch": 7015} {"train_loss": -27.60407829284668, "global_step": 582258, "epoch": 7015} {"train_loss": -27.353778839111328, "global_step": 582259, "epoch": 7015} {"train_loss": -27.584802627563477, "global_step": 582260, "epoch": 7015} {"train_loss": -27.686559677124023, "global_step": 582261, "epoch": 7015} {"train_loss": -27.81415367126465, "global_step": 582262, "epoch": 7015} {"train_loss": -28.17976951599121, "global_step": 582263, "epoch": 7015} {"train_loss": -27.401899337768555, "global_step": 582264, "epoch": 7015} {"train_loss": -27.992069244384766, "global_step": 582265, "epoch": 7015} {"train_loss": -27.63031578063965, "global_step": 582266, "epoch": 7015} {"train_loss": -28.104455947875977, "global_step": 582267, "epoch": 7015} {"train_loss": -27.78607177734375, "global_step": 582268, "epoch": 7015} {"train_loss": -28.026275634765625, "global_step": 582269, "epoch": 7015} {"train_loss": -27.81393814086914, "global_step": 582270, "epoch": 7015} {"train_loss": -27.79242515563965, "global_step": 582271, "epoch": 7015} {"train_loss": -27.638288497924805, "global_step": 582272, "epoch": 7015} {"train_loss": -27.835290908813477, "global_step": 582273, "epoch": 7015} {"train_loss": -27.83636474609375, "global_step": 582274, "epoch": 7015} {"train_loss": -27.75371742248535, "global_step": 582275, "epoch": 7015} {"train_loss": -27.85706901550293, "global_step": 582276, "epoch": 7015} {"train_loss": -27.995254516601562, "global_step": 582277, "epoch": 7015} {"train_loss": -28.049091339111328, "global_step": 582278, "epoch": 7015} {"train_loss": -27.87314224243164, "global_step": 582279, "epoch": 7015} {"train_loss": -28.178579330444336, "global_step": 582280, "epoch": 7015} {"train_loss": -28.1440486907959, "global_step": 582281, "epoch": 7015} {"train_loss": -27.874847412109375, "global_step": 582282, "epoch": 7015} {"train_loss": -28.24210548400879, "global_step": 582283, "epoch": 7015} {"train_loss": -27.858373641967773, "global_step": 582284, "epoch": 7015} {"train_loss": -28.284528732299805, "global_step": 582285, "epoch": 7015} {"train_loss": -28.08408546447754, "global_step": 582286, "epoch": 7015} {"train_loss": -27.84137535095215, "global_step": 582287, "epoch": 7015} {"train_loss": -27.97882080078125, "global_step": 582288, "epoch": 7015} {"train_loss": -27.744367599487305, "global_step": 582289, "epoch": 7015} {"train_loss": -27.959089279174805, "global_step": 582290, "epoch": 7015} {"train_loss": -28.349313735961914, "global_step": 582291, "epoch": 7015} {"train_loss": -28.319005966186523, "global_step": 582292, "epoch": 7015} {"train_loss": -27.99212074279785, "global_step": 582293, "epoch": 7015} {"train_loss": -27.92925453186035, "global_step": 582294, "epoch": 7015} {"train_loss": -28.148075103759766, "global_step": 582295, "epoch": 7015} {"train_loss": -27.941816329956055, "global_step": 582296, "epoch": 7015} {"train_loss": -27.8583927154541, "global_step": 582297, "epoch": 7015} {"train_loss": -28.234853744506836, "global_step": 582298, "epoch": 7015} {"train_loss": -28.080673217773438, "global_step": 582299, "epoch": 7015} {"train_loss": -28.1455135345459, "global_step": 582300, "epoch": 7015} {"train_loss": -28.031234741210938, "global_step": 582301, "epoch": 7015} {"train_loss": -28.342710494995117, "global_step": 582302, "epoch": 7015} {"train_loss": -27.934537887573242, "global_step": 582303, "epoch": 7015} {"train_loss": -27.612146377563477, "global_step": 582304, "epoch": 7015} {"train_loss": -27.0438232421875, "global_step": 582305, "epoch": 7015} {"train_loss": -25.69943618774414, "global_step": 582306, "epoch": 7015} {"train_loss": -24.07657241821289, "global_step": 582307, "epoch": 7015} {"train_loss": -24.958547592163086, "global_step": 582308, "epoch": 7015} {"train_loss": -25.887939453125, "global_step": 582309, "epoch": 7015} {"train_loss": -26.647003173828125, "global_step": 582310, "epoch": 7015} {"train_loss": -27.584165573120117, "global_step": 582311, "epoch": 7015} {"train_loss": -26.43293571472168, "global_step": 582312, "epoch": 7015} {"train_loss": -26.376447677612305, "global_step": 582313, "epoch": 7015} {"train_loss": -27.564916610717773, "global_step": 582314, "epoch": 7015} {"train_loss": -26.48272705078125, "global_step": 582315, "epoch": 7015} {"train_loss": -27.6229305267334, "global_step": 582316, "epoch": 7015} {"train_loss": -27.033111572265625, "global_step": 582317, "epoch": 7015} {"train_loss": -27.417709350585938, "global_step": 582318, "epoch": 7015} {"train_loss": -27.11835289001465, "global_step": 582319, "epoch": 7015} {"train_loss": -27.255203247070312, "global_step": 582320, "epoch": 7015} {"train_loss": -27.08346939086914, "global_step": 582321, "epoch": 7015} {"train_loss": -27.077163696289062, "global_step": 582322, "epoch": 7015} {"train_loss": -26.864871978759766, "global_step": 582323, "epoch": 7015} {"train_loss": -27.17122459411621, "global_step": 582324, "epoch": 7015} {"train_loss": -27.391260147094727, "global_step": 582325, "epoch": 7015} {"train_loss": -27.23848533630371, "global_step": 582326, "epoch": 7015} {"train_loss": -27.52598939459008, "global_step": 582327, "epoch": 7015, "val_loss": 6556955.0} {"train_loss": -27.03644371032715, "global_step": 582328, "epoch": 7016} {"train_loss": -27.25299072265625, "global_step": 582329, "epoch": 7016} {"train_loss": -26.959692001342773, "global_step": 582330, "epoch": 7016} {"train_loss": -27.195383071899414, "global_step": 582331, "epoch": 7016} {"train_loss": -26.796051025390625, "global_step": 582332, "epoch": 7016} {"train_loss": -27.3446044921875, "global_step": 582333, "epoch": 7016} {"train_loss": -27.16265869140625, "global_step": 582334, "epoch": 7016} {"train_loss": -26.97662925720215, "global_step": 582335, "epoch": 7016} {"train_loss": -27.40998649597168, "global_step": 582336, "epoch": 7016} {"train_loss": -27.15127944946289, "global_step": 582337, "epoch": 7016} {"train_loss": -27.61195945739746, "global_step": 582338, "epoch": 7016} {"train_loss": -27.3420467376709, "global_step": 582339, "epoch": 7016} {"train_loss": -27.216562271118164, "global_step": 582340, "epoch": 7016} {"train_loss": -27.68461036682129, "global_step": 582341, "epoch": 7016} {"train_loss": -27.458057403564453, "global_step": 582342, "epoch": 7016} {"train_loss": -27.67154884338379, "global_step": 582343, "epoch": 7016} {"train_loss": -27.687063217163086, "global_step": 582344, "epoch": 7016} {"train_loss": -27.682600021362305, "global_step": 582345, "epoch": 7016} {"train_loss": -27.525190353393555, "global_step": 582346, "epoch": 7016} {"train_loss": -27.885343551635742, "global_step": 582347, "epoch": 7016} {"train_loss": -27.757938385009766, "global_step": 582348, "epoch": 7016} {"train_loss": -27.84046745300293, "global_step": 582349, "epoch": 7016} {"train_loss": -27.8399658203125, "global_step": 582350, "epoch": 7016} {"train_loss": -27.59259033203125, "global_step": 582351, "epoch": 7016} {"train_loss": -27.74476432800293, "global_step": 582352, "epoch": 7016} {"train_loss": -28.1380615234375, "global_step": 582353, "epoch": 7016} {"train_loss": -27.849958419799805, "global_step": 582354, "epoch": 7016} {"train_loss": -27.996692657470703, "global_step": 582355, "epoch": 7016} {"train_loss": -28.260522842407227, "global_step": 582356, "epoch": 7016} {"train_loss": -27.875732421875, "global_step": 582357, "epoch": 7016} {"train_loss": -27.85599708557129, "global_step": 582358, "epoch": 7016} {"train_loss": -27.8460750579834, "global_step": 582359, "epoch": 7016} {"train_loss": -28.299646377563477, "global_step": 582360, "epoch": 7016} {"train_loss": -28.0133056640625, "global_step": 582361, "epoch": 7016} {"train_loss": -28.330957412719727, "global_step": 582362, "epoch": 7016} {"train_loss": -28.194265365600586, "global_step": 582363, "epoch": 7016} {"train_loss": -27.90413475036621, "global_step": 582364, "epoch": 7016} {"train_loss": -28.142017364501953, "global_step": 582365, "epoch": 7016} {"train_loss": -27.760242462158203, "global_step": 582366, "epoch": 7016} {"train_loss": -28.196619033813477, "global_step": 582367, "epoch": 7016} {"train_loss": -28.064939498901367, "global_step": 582368, "epoch": 7016} {"train_loss": -28.203027725219727, "global_step": 582369, "epoch": 7016} {"train_loss": -27.70517921447754, "global_step": 582370, "epoch": 7016} {"train_loss": -28.061304092407227, "global_step": 582371, "epoch": 7016} {"train_loss": -28.09088706970215, "global_step": 582372, "epoch": 7016} {"train_loss": -28.11777687072754, "global_step": 582373, "epoch": 7016} {"train_loss": -28.036941528320312, "global_step": 582374, "epoch": 7016} {"train_loss": -28.1361083984375, "global_step": 582375, "epoch": 7016} {"train_loss": -27.84357261657715, "global_step": 582376, "epoch": 7016} {"train_loss": -28.213850021362305, "global_step": 582377, "epoch": 7016} {"train_loss": -28.21192741394043, "global_step": 582378, "epoch": 7016} {"train_loss": -27.447784423828125, "global_step": 582379, "epoch": 7016} {"train_loss": -27.636890411376953, "global_step": 582380, "epoch": 7016} {"train_loss": -27.539697647094727, "global_step": 582381, "epoch": 7016} {"train_loss": -27.846572875976562, "global_step": 582382, "epoch": 7016} {"train_loss": -28.00347328186035, "global_step": 582383, "epoch": 7016} {"train_loss": -27.376554489135742, "global_step": 582384, "epoch": 7016} {"train_loss": -27.87485122680664, "global_step": 582385, "epoch": 7016} {"train_loss": -27.707975387573242, "global_step": 582386, "epoch": 7016} {"train_loss": -27.576740264892578, "global_step": 582387, "epoch": 7016} {"train_loss": -28.146503448486328, "global_step": 582388, "epoch": 7016} {"train_loss": -27.583038330078125, "global_step": 582389, "epoch": 7016} {"train_loss": -27.547393798828125, "global_step": 582390, "epoch": 7016} {"train_loss": -27.35456657409668, "global_step": 582391, "epoch": 7016} {"train_loss": -28.0589599609375, "global_step": 582392, "epoch": 7016} {"train_loss": -28.0609188079834, "global_step": 582393, "epoch": 7016} {"train_loss": -27.6644229888916, "global_step": 582394, "epoch": 7016} {"train_loss": -27.181615829467773, "global_step": 582395, "epoch": 7016} {"train_loss": -27.828092575073242, "global_step": 582396, "epoch": 7016} {"train_loss": -27.861255645751953, "global_step": 582397, "epoch": 7016} {"train_loss": -27.506793975830078, "global_step": 582398, "epoch": 7016} {"train_loss": -27.301990509033203, "global_step": 582399, "epoch": 7016} {"train_loss": -27.74652671813965, "global_step": 582400, "epoch": 7016} {"train_loss": -28.19341468811035, "global_step": 582401, "epoch": 7016} {"train_loss": -27.842941284179688, "global_step": 582402, "epoch": 7016} {"train_loss": -27.79523277282715, "global_step": 582403, "epoch": 7016} {"train_loss": -28.284128189086914, "global_step": 582404, "epoch": 7016} {"train_loss": -28.11750602722168, "global_step": 582405, "epoch": 7016} {"train_loss": -27.716232299804688, "global_step": 582406, "epoch": 7016} {"train_loss": -28.02655029296875, "global_step": 582407, "epoch": 7016} {"train_loss": -28.05655288696289, "global_step": 582408, "epoch": 7016} {"train_loss": -27.91251564025879, "global_step": 582409, "epoch": 7016} {"train_loss": -27.756950470338385, "global_step": 582410, "epoch": 7016, "val_loss": 6554566.0} {"train_loss": -27.7567081451416, "global_step": 582411, "epoch": 7017} {"train_loss": -27.242080688476562, "global_step": 582412, "epoch": 7017} {"train_loss": -27.37957763671875, "global_step": 582413, "epoch": 7017} {"train_loss": -27.44960594177246, "global_step": 582414, "epoch": 7017} {"train_loss": -27.763690948486328, "global_step": 582415, "epoch": 7017} {"train_loss": -27.295516967773438, "global_step": 582416, "epoch": 7017} {"train_loss": -27.491743087768555, "global_step": 582417, "epoch": 7017} {"train_loss": -27.640867233276367, "global_step": 582418, "epoch": 7017} {"train_loss": -27.39813232421875, "global_step": 582419, "epoch": 7017} {"train_loss": -28.0522403717041, "global_step": 582420, "epoch": 7017} {"train_loss": -27.328779220581055, "global_step": 582421, "epoch": 7017} {"train_loss": -27.70888328552246, "global_step": 582422, "epoch": 7017} {"train_loss": -27.445098876953125, "global_step": 582423, "epoch": 7017} {"train_loss": -27.69939613342285, "global_step": 582424, "epoch": 7017} {"train_loss": -27.4959659576416, "global_step": 582425, "epoch": 7017} {"train_loss": -27.31781578063965, "global_step": 582426, "epoch": 7017} {"train_loss": -27.87544822692871, "global_step": 582427, "epoch": 7017} {"train_loss": -27.5718936920166, "global_step": 582428, "epoch": 7017} {"train_loss": -27.779041290283203, "global_step": 582429, "epoch": 7017} {"train_loss": -28.054533004760742, "global_step": 582430, "epoch": 7017} {"train_loss": -27.633024215698242, "global_step": 582431, "epoch": 7017} {"train_loss": -28.060596466064453, "global_step": 582432, "epoch": 7017} {"train_loss": -27.926679611206055, "global_step": 582433, "epoch": 7017} {"train_loss": -27.611164093017578, "global_step": 582434, "epoch": 7017} {"train_loss": -28.1557674407959, "global_step": 582435, "epoch": 7017} {"train_loss": -27.700857162475586, "global_step": 582436, "epoch": 7017} {"train_loss": -27.657873153686523, "global_step": 582437, "epoch": 7017} {"train_loss": -27.936582565307617, "global_step": 582438, "epoch": 7017} {"train_loss": -27.93501091003418, "global_step": 582439, "epoch": 7017} {"train_loss": -28.065149307250977, "global_step": 582440, "epoch": 7017} {"train_loss": -27.947240829467773, "global_step": 582441, "epoch": 7017} {"train_loss": -27.682722091674805, "global_step": 582442, "epoch": 7017} {"train_loss": -27.7515926361084, "global_step": 582443, "epoch": 7017} {"train_loss": -28.050872802734375, "global_step": 582444, "epoch": 7017} {"train_loss": -27.936574935913086, "global_step": 582445, "epoch": 7017} {"train_loss": -27.982633590698242, "global_step": 582446, "epoch": 7017} {"train_loss": -27.480487823486328, "global_step": 582447, "epoch": 7017} {"train_loss": -28.087549209594727, "global_step": 582448, "epoch": 7017} {"train_loss": -27.935468673706055, "global_step": 582449, "epoch": 7017} {"train_loss": -27.943593978881836, "global_step": 582450, "epoch": 7017} {"train_loss": -27.993793487548828, "global_step": 582451, "epoch": 7017} {"train_loss": -27.793073654174805, "global_step": 582452, "epoch": 7017} {"train_loss": -28.00409507751465, "global_step": 582453, "epoch": 7017} {"train_loss": -27.9921932220459, "global_step": 582454, "epoch": 7017} {"train_loss": -27.814313888549805, "global_step": 582455, "epoch": 7017} {"train_loss": -27.86941909790039, "global_step": 582456, "epoch": 7017} {"train_loss": -27.72919273376465, "global_step": 582457, "epoch": 7017} {"train_loss": -28.118982315063477, "global_step": 582458, "epoch": 7017} {"train_loss": -27.183584213256836, "global_step": 582459, "epoch": 7017} {"train_loss": -27.734716415405273, "global_step": 582460, "epoch": 7017} {"train_loss": -28.2003173828125, "global_step": 582461, "epoch": 7017} {"train_loss": -28.095706939697266, "global_step": 582462, "epoch": 7017} {"train_loss": -28.264678955078125, "global_step": 582463, "epoch": 7017} {"train_loss": -27.692432403564453, "global_step": 582464, "epoch": 7017} {"train_loss": -27.8928279876709, "global_step": 582465, "epoch": 7017} {"train_loss": -27.84964942932129, "global_step": 582466, "epoch": 7017} {"train_loss": -28.007080078125, "global_step": 582467, "epoch": 7017} {"train_loss": -27.930856704711914, "global_step": 582468, "epoch": 7017} {"train_loss": -28.17905616760254, "global_step": 582469, "epoch": 7017} {"train_loss": -28.01209831237793, "global_step": 582470, "epoch": 7017} {"train_loss": -28.402084350585938, "global_step": 582471, "epoch": 7017} {"train_loss": -28.133193969726562, "global_step": 582472, "epoch": 7017} {"train_loss": -27.963409423828125, "global_step": 582473, "epoch": 7017} {"train_loss": -28.237171173095703, "global_step": 582474, "epoch": 7017} {"train_loss": -28.2688045501709, "global_step": 582475, "epoch": 7017} {"train_loss": -28.348114013671875, "global_step": 582476, "epoch": 7017} {"train_loss": -28.15204429626465, "global_step": 582477, "epoch": 7017} {"train_loss": -28.163700103759766, "global_step": 582478, "epoch": 7017} {"train_loss": -27.84505271911621, "global_step": 582479, "epoch": 7017} {"train_loss": -28.04266929626465, "global_step": 582480, "epoch": 7017} {"train_loss": -27.953256607055664, "global_step": 582481, "epoch": 7017} {"train_loss": -28.3500919342041, "global_step": 582482, "epoch": 7017} {"train_loss": -28.14246940612793, "global_step": 582483, "epoch": 7017} {"train_loss": -28.013540267944336, "global_step": 582484, "epoch": 7017} {"train_loss": -28.03712272644043, "global_step": 582485, "epoch": 7017} {"train_loss": -28.236982345581055, "global_step": 582486, "epoch": 7017} {"train_loss": -27.941070556640625, "global_step": 582487, "epoch": 7017} {"train_loss": -28.149717330932617, "global_step": 582488, "epoch": 7017} {"train_loss": -28.335168838500977, "global_step": 582489, "epoch": 7017} {"train_loss": -28.08921241760254, "global_step": 582490, "epoch": 7017} {"train_loss": -28.05472755432129, "global_step": 582491, "epoch": 7017} {"train_loss": -28.242359161376953, "global_step": 582492, "epoch": 7017} {"train_loss": -27.882609195019825, "global_step": 582493, "epoch": 7017, "val_loss": 6556373.0} {"train_loss": -27.341028213500977, "global_step": 582494, "epoch": 7018} {"train_loss": -26.49881362915039, "global_step": 582495, "epoch": 7018} {"train_loss": -25.675954818725586, "global_step": 582496, "epoch": 7018} {"train_loss": -26.15821647644043, "global_step": 582497, "epoch": 7018} {"train_loss": -25.588430404663086, "global_step": 582498, "epoch": 7018} {"train_loss": -26.165359497070312, "global_step": 582499, "epoch": 7018} {"train_loss": -26.710296630859375, "global_step": 582500, "epoch": 7018} {"train_loss": -27.284748077392578, "global_step": 582501, "epoch": 7018} {"train_loss": -26.952688217163086, "global_step": 582502, "epoch": 7018} {"train_loss": -26.933856964111328, "global_step": 582503, "epoch": 7018} {"train_loss": -26.82122230529785, "global_step": 582504, "epoch": 7018} {"train_loss": -27.056533813476562, "global_step": 582505, "epoch": 7018} {"train_loss": -26.89594841003418, "global_step": 582506, "epoch": 7018} {"train_loss": -27.093311309814453, "global_step": 582507, "epoch": 7018} {"train_loss": -27.417545318603516, "global_step": 582508, "epoch": 7018} {"train_loss": -27.254241943359375, "global_step": 582509, "epoch": 7018} {"train_loss": -27.089635848999023, "global_step": 582510, "epoch": 7018} {"train_loss": -27.387720108032227, "global_step": 582511, "epoch": 7018} {"train_loss": -27.060850143432617, "global_step": 582512, "epoch": 7018} {"train_loss": -27.486127853393555, "global_step": 582513, "epoch": 7018} {"train_loss": -27.3510684967041, "global_step": 582514, "epoch": 7018} {"train_loss": -27.19354820251465, "global_step": 582515, "epoch": 7018} {"train_loss": -27.678998947143555, "global_step": 582516, "epoch": 7018} {"train_loss": -27.554670333862305, "global_step": 582517, "epoch": 7018} {"train_loss": -27.386442184448242, "global_step": 582518, "epoch": 7018} {"train_loss": -27.086706161499023, "global_step": 582519, "epoch": 7018} {"train_loss": -27.454620361328125, "global_step": 582520, "epoch": 7018} {"train_loss": -27.477005004882812, "global_step": 582521, "epoch": 7018} {"train_loss": -27.419818878173828, "global_step": 582522, "epoch": 7018} {"train_loss": -27.324462890625, "global_step": 582523, "epoch": 7018} {"train_loss": -27.646276473999023, "global_step": 582524, "epoch": 7018} {"train_loss": -27.484174728393555, "global_step": 582525, "epoch": 7018} {"train_loss": -27.832868576049805, "global_step": 582526, "epoch": 7018} {"train_loss": -27.653579711914062, "global_step": 582527, "epoch": 7018} {"train_loss": -27.64973258972168, "global_step": 582528, "epoch": 7018} {"train_loss": -27.72614097595215, "global_step": 582529, "epoch": 7018} {"train_loss": -27.93524169921875, "global_step": 582530, "epoch": 7018} {"train_loss": -28.029010772705078, "global_step": 582531, "epoch": 7018} {"train_loss": -27.8314266204834, "global_step": 582532, "epoch": 7018} {"train_loss": -27.994873046875, "global_step": 582533, "epoch": 7018} {"train_loss": -27.972097396850586, "global_step": 582534, "epoch": 7018} {"train_loss": -27.6268367767334, "global_step": 582535, "epoch": 7018} {"train_loss": -27.923294067382812, "global_step": 582536, "epoch": 7018} {"train_loss": -28.098371505737305, "global_step": 582537, "epoch": 7018} {"train_loss": -27.855987548828125, "global_step": 582538, "epoch": 7018} {"train_loss": -27.89350700378418, "global_step": 582539, "epoch": 7018} {"train_loss": -27.899871826171875, "global_step": 582540, "epoch": 7018} {"train_loss": -27.874103546142578, "global_step": 582541, "epoch": 7018} {"train_loss": -28.12843132019043, "global_step": 582542, "epoch": 7018} {"train_loss": -27.977609634399414, "global_step": 582543, "epoch": 7018} {"train_loss": -27.911645889282227, "global_step": 582544, "epoch": 7018} {"train_loss": -27.850860595703125, "global_step": 582545, "epoch": 7018} {"train_loss": -28.08928871154785, "global_step": 582546, "epoch": 7018} {"train_loss": -28.4940128326416, "global_step": 582547, "epoch": 7018} {"train_loss": -28.456146240234375, "global_step": 582548, "epoch": 7018} {"train_loss": -28.08326530456543, "global_step": 582549, "epoch": 7018} {"train_loss": -28.04901123046875, "global_step": 582550, "epoch": 7018} {"train_loss": -28.022741317749023, "global_step": 582551, "epoch": 7018} {"train_loss": -28.21693992614746, "global_step": 582552, "epoch": 7018} {"train_loss": -28.1851749420166, "global_step": 582553, "epoch": 7018} {"train_loss": -27.86529541015625, "global_step": 582554, "epoch": 7018} {"train_loss": -28.356876373291016, "global_step": 582555, "epoch": 7018} {"train_loss": -28.056869506835938, "global_step": 582556, "epoch": 7018} {"train_loss": -28.316730499267578, "global_step": 582557, "epoch": 7018} {"train_loss": -27.880170822143555, "global_step": 582558, "epoch": 7018} {"train_loss": -28.213788986206055, "global_step": 582559, "epoch": 7018} {"train_loss": -28.336597442626953, "global_step": 582560, "epoch": 7018} {"train_loss": -28.17365837097168, "global_step": 582561, "epoch": 7018} {"train_loss": -27.887359619140625, "global_step": 582562, "epoch": 7018} {"train_loss": -27.872182846069336, "global_step": 582563, "epoch": 7018} {"train_loss": -27.916168212890625, "global_step": 582564, "epoch": 7018} {"train_loss": -27.911535263061523, "global_step": 582565, "epoch": 7018} {"train_loss": -27.753894805908203, "global_step": 582566, "epoch": 7018} {"train_loss": -27.4399471282959, "global_step": 582567, "epoch": 7018} {"train_loss": -26.50331687927246, "global_step": 582568, "epoch": 7018} {"train_loss": -26.58572769165039, "global_step": 582569, "epoch": 7018} {"train_loss": -27.596771240234375, "global_step": 582570, "epoch": 7018} {"train_loss": -28.28961181640625, "global_step": 582571, "epoch": 7018} {"train_loss": -27.376663208007812, "global_step": 582572, "epoch": 7018} {"train_loss": -27.6951904296875, "global_step": 582573, "epoch": 7018} {"train_loss": -27.861692428588867, "global_step": 582574, "epoch": 7018} {"train_loss": -27.756500244140625, "global_step": 582575, "epoch": 7018} {"train_loss": -27.57204602712608, "global_step": 582576, "epoch": 7018, "val_loss": 6545433.5} {"train_loss": -26.914508819580078, "global_step": 582577, "epoch": 7019} {"train_loss": -26.65380859375, "global_step": 582578, "epoch": 7019} {"train_loss": -25.914350509643555, "global_step": 582579, "epoch": 7019} {"train_loss": -26.2005558013916, "global_step": 582580, "epoch": 7019} {"train_loss": -26.46368980407715, "global_step": 582581, "epoch": 7019} {"train_loss": -27.248706817626953, "global_step": 582582, "epoch": 7019} {"train_loss": -27.119958877563477, "global_step": 582583, "epoch": 7019} {"train_loss": -26.728158950805664, "global_step": 582584, "epoch": 7019} {"train_loss": -27.13245964050293, "global_step": 582585, "epoch": 7019} {"train_loss": -26.576496124267578, "global_step": 582586, "epoch": 7019} {"train_loss": -27.18707847595215, "global_step": 582587, "epoch": 7019} {"train_loss": -27.455890655517578, "global_step": 582588, "epoch": 7019} {"train_loss": -26.998151779174805, "global_step": 582589, "epoch": 7019} {"train_loss": -26.7713680267334, "global_step": 582590, "epoch": 7019} {"train_loss": -27.3475341796875, "global_step": 582591, "epoch": 7019} {"train_loss": -27.674396514892578, "global_step": 582592, "epoch": 7019} {"train_loss": -27.455015182495117, "global_step": 582593, "epoch": 7019} {"train_loss": -27.208044052124023, "global_step": 582594, "epoch": 7019} {"train_loss": -27.48908042907715, "global_step": 582595, "epoch": 7019} {"train_loss": -27.443470001220703, "global_step": 582596, "epoch": 7019} {"train_loss": -27.57830810546875, "global_step": 582597, "epoch": 7019} {"train_loss": -27.34809684753418, "global_step": 582598, "epoch": 7019} {"train_loss": -27.750762939453125, "global_step": 582599, "epoch": 7019} {"train_loss": -27.378652572631836, "global_step": 582600, "epoch": 7019} {"train_loss": -27.833280563354492, "global_step": 582601, "epoch": 7019} {"train_loss": -27.51019859313965, "global_step": 582602, "epoch": 7019} {"train_loss": -27.961034774780273, "global_step": 582603, "epoch": 7019} {"train_loss": -27.216968536376953, "global_step": 582604, "epoch": 7019} {"train_loss": -27.957937240600586, "global_step": 582605, "epoch": 7019} {"train_loss": -27.44089698791504, "global_step": 582606, "epoch": 7019} {"train_loss": -27.712955474853516, "global_step": 582607, "epoch": 7019} {"train_loss": -27.600543975830078, "global_step": 582608, "epoch": 7019} {"train_loss": -27.453580856323242, "global_step": 582609, "epoch": 7019} {"train_loss": -27.609455108642578, "global_step": 582610, "epoch": 7019} {"train_loss": -27.64615821838379, "global_step": 582611, "epoch": 7019} {"train_loss": -27.565845489501953, "global_step": 582612, "epoch": 7019} {"train_loss": -28.02548599243164, "global_step": 582613, "epoch": 7019} {"train_loss": -27.867767333984375, "global_step": 582614, "epoch": 7019} {"train_loss": -27.802112579345703, "global_step": 582615, "epoch": 7019} {"train_loss": -27.768848419189453, "global_step": 582616, "epoch": 7019} {"train_loss": -28.197711944580078, "global_step": 582617, "epoch": 7019} {"train_loss": -28.079755783081055, "global_step": 582618, "epoch": 7019} {"train_loss": -27.777204513549805, "global_step": 582619, "epoch": 7019} {"train_loss": -28.03995132446289, "global_step": 582620, "epoch": 7019} {"train_loss": -28.29937744140625, "global_step": 582621, "epoch": 7019} {"train_loss": -27.883655548095703, "global_step": 582622, "epoch": 7019} {"train_loss": -27.956388473510742, "global_step": 582623, "epoch": 7019} {"train_loss": -27.977771759033203, "global_step": 582624, "epoch": 7019} {"train_loss": -28.173059463500977, "global_step": 582625, "epoch": 7019} {"train_loss": -27.939722061157227, "global_step": 582626, "epoch": 7019} {"train_loss": -28.10828971862793, "global_step": 582627, "epoch": 7019} {"train_loss": -28.289615631103516, "global_step": 582628, "epoch": 7019} {"train_loss": -28.075275421142578, "global_step": 582629, "epoch": 7019} {"train_loss": -28.078298568725586, "global_step": 582630, "epoch": 7019} {"train_loss": -27.958683013916016, "global_step": 582631, "epoch": 7019} {"train_loss": -28.128751754760742, "global_step": 582632, "epoch": 7019} {"train_loss": -28.319808959960938, "global_step": 582633, "epoch": 7019} {"train_loss": -28.086410522460938, "global_step": 582634, "epoch": 7019} {"train_loss": -28.245697021484375, "global_step": 582635, "epoch": 7019} {"train_loss": -28.256732940673828, "global_step": 582636, "epoch": 7019} {"train_loss": -28.16251564025879, "global_step": 582637, "epoch": 7019} {"train_loss": -27.892419815063477, "global_step": 582638, "epoch": 7019} {"train_loss": -28.406721115112305, "global_step": 582639, "epoch": 7019} {"train_loss": -28.2717342376709, "global_step": 582640, "epoch": 7019} {"train_loss": -28.247791290283203, "global_step": 582641, "epoch": 7019} {"train_loss": -28.315052032470703, "global_step": 582642, "epoch": 7019} {"train_loss": -28.056049346923828, "global_step": 582643, "epoch": 7019} {"train_loss": -27.825321197509766, "global_step": 582644, "epoch": 7019} {"train_loss": -27.181934356689453, "global_step": 582645, "epoch": 7019} {"train_loss": -26.662296295166016, "global_step": 582646, "epoch": 7019} {"train_loss": -26.655065536499023, "global_step": 582647, "epoch": 7019} {"train_loss": -28.08846092224121, "global_step": 582648, "epoch": 7019} {"train_loss": -27.41094970703125, "global_step": 582649, "epoch": 7019} {"train_loss": -27.87867546081543, "global_step": 582650, "epoch": 7019} {"train_loss": -27.232580184936523, "global_step": 582651, "epoch": 7019} {"train_loss": -28.153003692626953, "global_step": 582652, "epoch": 7019} {"train_loss": -27.654294967651367, "global_step": 582653, "epoch": 7019} {"train_loss": -28.239404678344727, "global_step": 582654, "epoch": 7019} {"train_loss": -27.248645782470703, "global_step": 582655, "epoch": 7019} {"train_loss": -27.830068588256836, "global_step": 582656, "epoch": 7019} {"train_loss": -27.917266845703125, "global_step": 582657, "epoch": 7019} {"train_loss": -27.80129051208496, "global_step": 582658, "epoch": 7019} {"train_loss": -27.626762619937757, "global_step": 582659, "epoch": 7019, "val_loss": 6426837.0} {"train_loss": -25.283979415893555, "global_step": 582660, "epoch": 7020} {"train_loss": -26.110273361206055, "global_step": 582661, "epoch": 7020} {"train_loss": -26.11903953552246, "global_step": 582662, "epoch": 7020} {"train_loss": -26.2658748626709, "global_step": 582663, "epoch": 7020} {"train_loss": -26.626148223876953, "global_step": 582664, "epoch": 7020} {"train_loss": -25.614974975585938, "global_step": 582665, "epoch": 7020} {"train_loss": -26.1358642578125, "global_step": 582666, "epoch": 7020} {"train_loss": -26.908788681030273, "global_step": 582667, "epoch": 7020} {"train_loss": -26.46235466003418, "global_step": 582668, "epoch": 7020} {"train_loss": -26.902978897094727, "global_step": 582669, "epoch": 7020} {"train_loss": -27.294469833374023, "global_step": 582670, "epoch": 7020} {"train_loss": -26.91688346862793, "global_step": 582671, "epoch": 7020} {"train_loss": -27.07551383972168, "global_step": 582672, "epoch": 7020} {"train_loss": -27.282102584838867, "global_step": 582673, "epoch": 7020} {"train_loss": -26.88166618347168, "global_step": 582674, "epoch": 7020} {"train_loss": -26.896961212158203, "global_step": 582675, "epoch": 7020} {"train_loss": -27.1926326751709, "global_step": 582676, "epoch": 7020} {"train_loss": -26.862136840820312, "global_step": 582677, "epoch": 7020} {"train_loss": -27.049535751342773, "global_step": 582678, "epoch": 7020} {"train_loss": -27.111093521118164, "global_step": 582679, "epoch": 7020} {"train_loss": -27.352813720703125, "global_step": 582680, "epoch": 7020} {"train_loss": -27.687744140625, "global_step": 582681, "epoch": 7020} {"train_loss": -27.3253116607666, "global_step": 582682, "epoch": 7020} {"train_loss": -27.049945831298828, "global_step": 582683, "epoch": 7020} {"train_loss": -27.294879913330078, "global_step": 582684, "epoch": 7020} {"train_loss": -27.68367576599121, "global_step": 582685, "epoch": 7020} {"train_loss": -27.42963981628418, "global_step": 582686, "epoch": 7020} {"train_loss": -27.592100143432617, "global_step": 582687, "epoch": 7020} {"train_loss": -27.33565330505371, "global_step": 582688, "epoch": 7020} {"train_loss": -27.464197158813477, "global_step": 582689, "epoch": 7020} {"train_loss": -27.646270751953125, "global_step": 582690, "epoch": 7020} {"train_loss": -27.53792381286621, "global_step": 582691, "epoch": 7020} {"train_loss": -27.79111099243164, "global_step": 582692, "epoch": 7020} {"train_loss": -27.736286163330078, "global_step": 582693, "epoch": 7020} {"train_loss": -27.6538028717041, "global_step": 582694, "epoch": 7020} {"train_loss": -27.6685791015625, "global_step": 582695, "epoch": 7020} {"train_loss": -27.517780303955078, "global_step": 582696, "epoch": 7020} {"train_loss": -27.68622398376465, "global_step": 582697, "epoch": 7020} {"train_loss": -27.818479537963867, "global_step": 582698, "epoch": 7020} {"train_loss": -27.931476593017578, "global_step": 582699, "epoch": 7020} {"train_loss": -27.72104263305664, "global_step": 582700, "epoch": 7020} {"train_loss": -27.659238815307617, "global_step": 582701, "epoch": 7020} {"train_loss": -28.000579833984375, "global_step": 582702, "epoch": 7020} {"train_loss": -28.07777214050293, "global_step": 582703, "epoch": 7020} {"train_loss": -27.75544548034668, "global_step": 582704, "epoch": 7020} {"train_loss": -27.95961570739746, "global_step": 582705, "epoch": 7020} {"train_loss": -27.73090171813965, "global_step": 582706, "epoch": 7020} {"train_loss": -27.74789810180664, "global_step": 582707, "epoch": 7020} {"train_loss": -28.03242301940918, "global_step": 582708, "epoch": 7020} {"train_loss": -28.11995506286621, "global_step": 582709, "epoch": 7020} {"train_loss": -28.181690216064453, "global_step": 582710, "epoch": 7020} {"train_loss": -27.637372970581055, "global_step": 582711, "epoch": 7020} {"train_loss": -28.11146354675293, "global_step": 582712, "epoch": 7020} {"train_loss": -28.1107120513916, "global_step": 582713, "epoch": 7020} {"train_loss": -27.893705368041992, "global_step": 582714, "epoch": 7020} {"train_loss": -27.722639083862305, "global_step": 582715, "epoch": 7020} {"train_loss": -28.066009521484375, "global_step": 582716, "epoch": 7020} {"train_loss": -27.917089462280273, "global_step": 582717, "epoch": 7020} {"train_loss": -28.38996696472168, "global_step": 582718, "epoch": 7020} {"train_loss": -27.87859535217285, "global_step": 582719, "epoch": 7020} {"train_loss": -28.327604293823242, "global_step": 582720, "epoch": 7020} {"train_loss": -27.896595001220703, "global_step": 582721, "epoch": 7020} {"train_loss": -28.153120040893555, "global_step": 582722, "epoch": 7020} {"train_loss": -27.72600746154785, "global_step": 582723, "epoch": 7020} {"train_loss": -28.272912979125977, "global_step": 582724, "epoch": 7020} {"train_loss": -28.1101131439209, "global_step": 582725, "epoch": 7020} {"train_loss": -27.810810089111328, "global_step": 582726, "epoch": 7020} {"train_loss": -28.007843017578125, "global_step": 582727, "epoch": 7020} {"train_loss": -27.79426383972168, "global_step": 582728, "epoch": 7020} {"train_loss": -27.968006134033203, "global_step": 582729, "epoch": 7020} {"train_loss": -28.057178497314453, "global_step": 582730, "epoch": 7020} {"train_loss": -27.84055519104004, "global_step": 582731, "epoch": 7020} {"train_loss": -27.947973251342773, "global_step": 582732, "epoch": 7020} {"train_loss": -28.119489669799805, "global_step": 582733, "epoch": 7020} {"train_loss": -28.103290557861328, "global_step": 582734, "epoch": 7020} {"train_loss": -28.41998291015625, "global_step": 582735, "epoch": 7020} {"train_loss": -27.74614906311035, "global_step": 582736, "epoch": 7020} {"train_loss": -27.92996597290039, "global_step": 582737, "epoch": 7020} {"train_loss": -28.16082763671875, "global_step": 582738, "epoch": 7020} {"train_loss": -27.90900993347168, "global_step": 582739, "epoch": 7020} {"train_loss": -27.993391036987305, "global_step": 582740, "epoch": 7020} {"train_loss": -28.37727165222168, "global_step": 582741, "epoch": 7020} {"train_loss": -27.55106167620923, "global_step": 582742, "epoch": 7020, "val_loss": 6697295.0} {"train_loss": -27.338581085205078, "global_step": 582743, "epoch": 7021} {"train_loss": -26.343366622924805, "global_step": 582744, "epoch": 7021} {"train_loss": -27.392749786376953, "global_step": 582745, "epoch": 7021} {"train_loss": -27.933958053588867, "global_step": 582746, "epoch": 7021} {"train_loss": -27.144479751586914, "global_step": 582747, "epoch": 7021} {"train_loss": -27.592512130737305, "global_step": 582748, "epoch": 7021} {"train_loss": -27.597549438476562, "global_step": 582749, "epoch": 7021} {"train_loss": -27.68365478515625, "global_step": 582750, "epoch": 7021} {"train_loss": -27.134531021118164, "global_step": 582751, "epoch": 7021} {"train_loss": -27.288244247436523, "global_step": 582752, "epoch": 7021} {"train_loss": -27.35774040222168, "global_step": 582753, "epoch": 7021} {"train_loss": -27.6921443939209, "global_step": 582754, "epoch": 7021} {"train_loss": -27.579069137573242, "global_step": 582755, "epoch": 7021} {"train_loss": -27.72336769104004, "global_step": 582756, "epoch": 7021} {"train_loss": -27.42303466796875, "global_step": 582757, "epoch": 7021} {"train_loss": -27.71442985534668, "global_step": 582758, "epoch": 7021} {"train_loss": -27.679737091064453, "global_step": 582759, "epoch": 7021} {"train_loss": -27.808673858642578, "global_step": 582760, "epoch": 7021} {"train_loss": -27.518301010131836, "global_step": 582761, "epoch": 7021} {"train_loss": -28.0026798248291, "global_step": 582762, "epoch": 7021} {"train_loss": -28.09633445739746, "global_step": 582763, "epoch": 7021} {"train_loss": -27.84248924255371, "global_step": 582764, "epoch": 7021} {"train_loss": -28.26059341430664, "global_step": 582765, "epoch": 7021} {"train_loss": -27.772186279296875, "global_step": 582766, "epoch": 7021} {"train_loss": -27.878143310546875, "global_step": 582767, "epoch": 7021} {"train_loss": -27.798490524291992, "global_step": 582768, "epoch": 7021} {"train_loss": -27.737411499023438, "global_step": 582769, "epoch": 7021} {"train_loss": -27.542593002319336, "global_step": 582770, "epoch": 7021} {"train_loss": -27.39349365234375, "global_step": 582771, "epoch": 7021} {"train_loss": -27.68195152282715, "global_step": 582772, "epoch": 7021} {"train_loss": -27.615827560424805, "global_step": 582773, "epoch": 7021} {"train_loss": -27.5692195892334, "global_step": 582774, "epoch": 7021} {"train_loss": -27.679296493530273, "global_step": 582775, "epoch": 7021} {"train_loss": -27.415790557861328, "global_step": 582776, "epoch": 7021} {"train_loss": -28.137176513671875, "global_step": 582777, "epoch": 7021} {"train_loss": -27.691410064697266, "global_step": 582778, "epoch": 7021} {"train_loss": -27.844221115112305, "global_step": 582779, "epoch": 7021} {"train_loss": -27.246374130249023, "global_step": 582780, "epoch": 7021} {"train_loss": -27.43866539001465, "global_step": 582781, "epoch": 7021} {"train_loss": -27.86380958557129, "global_step": 582782, "epoch": 7021} {"train_loss": -27.710163116455078, "global_step": 582783, "epoch": 7021} {"train_loss": -28.027236938476562, "global_step": 582784, "epoch": 7021} {"train_loss": -28.094650268554688, "global_step": 582785, "epoch": 7021} {"train_loss": -27.89776039123535, "global_step": 582786, "epoch": 7021} {"train_loss": -27.764768600463867, "global_step": 582787, "epoch": 7021} {"train_loss": -27.712940216064453, "global_step": 582788, "epoch": 7021} {"train_loss": -27.873035430908203, "global_step": 582789, "epoch": 7021} {"train_loss": -28.199390411376953, "global_step": 582790, "epoch": 7021} {"train_loss": -27.948522567749023, "global_step": 582791, "epoch": 7021} {"train_loss": -28.31941032409668, "global_step": 582792, "epoch": 7021} {"train_loss": -28.060033798217773, "global_step": 582793, "epoch": 7021} {"train_loss": -28.115869522094727, "global_step": 582794, "epoch": 7021} {"train_loss": -27.862028121948242, "global_step": 582795, "epoch": 7021} {"train_loss": -27.902851104736328, "global_step": 582796, "epoch": 7021} {"train_loss": -28.061574935913086, "global_step": 582797, "epoch": 7021} {"train_loss": -28.131555557250977, "global_step": 582798, "epoch": 7021} {"train_loss": -28.201948165893555, "global_step": 582799, "epoch": 7021} {"train_loss": -28.2376766204834, "global_step": 582800, "epoch": 7021} {"train_loss": -28.1867618560791, "global_step": 582801, "epoch": 7021} {"train_loss": -28.593704223632812, "global_step": 582802, "epoch": 7021} {"train_loss": -28.272510528564453, "global_step": 582803, "epoch": 7021} {"train_loss": -28.10126304626465, "global_step": 582804, "epoch": 7021} {"train_loss": -27.725919723510742, "global_step": 582805, "epoch": 7021} {"train_loss": -27.813581466674805, "global_step": 582806, "epoch": 7021} {"train_loss": -28.052820205688477, "global_step": 582807, "epoch": 7021} {"train_loss": -28.6617488861084, "global_step": 582808, "epoch": 7021} {"train_loss": -27.93086814880371, "global_step": 582809, "epoch": 7021} {"train_loss": -27.606760025024414, "global_step": 582810, "epoch": 7021} {"train_loss": -28.119489669799805, "global_step": 582811, "epoch": 7021} {"train_loss": -27.87353515625, "global_step": 582812, "epoch": 7021} {"train_loss": -28.15570640563965, "global_step": 582813, "epoch": 7021} {"train_loss": -27.775808334350586, "global_step": 582814, "epoch": 7021} {"train_loss": -27.77088737487793, "global_step": 582815, "epoch": 7021} {"train_loss": -28.037994384765625, "global_step": 582816, "epoch": 7021} {"train_loss": -27.80389404296875, "global_step": 582817, "epoch": 7021} {"train_loss": -27.59820556640625, "global_step": 582818, "epoch": 7021} {"train_loss": -28.140213012695312, "global_step": 582819, "epoch": 7021} {"train_loss": -28.1295166015625, "global_step": 582820, "epoch": 7021} {"train_loss": -27.94878578186035, "global_step": 582821, "epoch": 7021} {"train_loss": -27.88325309753418, "global_step": 582822, "epoch": 7021} {"train_loss": -28.094776153564453, "global_step": 582823, "epoch": 7021} {"train_loss": -28.170881271362305, "global_step": 582824, "epoch": 7021} {"train_loss": -27.826792567609303, "global_step": 582825, "epoch": 7021, "val_loss": 6774549.0} {"train_loss": -27.732458114624023, "global_step": 582826, "epoch": 7022} {"train_loss": -27.40178871154785, "global_step": 582827, "epoch": 7022} {"train_loss": -27.659048080444336, "global_step": 582828, "epoch": 7022} {"train_loss": -28.359149932861328, "global_step": 582829, "epoch": 7022} {"train_loss": -27.482568740844727, "global_step": 582830, "epoch": 7022} {"train_loss": -27.411630630493164, "global_step": 582831, "epoch": 7022} {"train_loss": -27.680633544921875, "global_step": 582832, "epoch": 7022} {"train_loss": -28.028797149658203, "global_step": 582833, "epoch": 7022} {"train_loss": -27.026779174804688, "global_step": 582834, "epoch": 7022} {"train_loss": -27.548681259155273, "global_step": 582835, "epoch": 7022} {"train_loss": -27.97247314453125, "global_step": 582836, "epoch": 7022} {"train_loss": -27.60501480102539, "global_step": 582837, "epoch": 7022} {"train_loss": -27.823217391967773, "global_step": 582838, "epoch": 7022} {"train_loss": -27.86664390563965, "global_step": 582839, "epoch": 7022} {"train_loss": -27.57260513305664, "global_step": 582840, "epoch": 7022} {"train_loss": -28.304712295532227, "global_step": 582841, "epoch": 7022} {"train_loss": -28.074798583984375, "global_step": 582842, "epoch": 7022} {"train_loss": -27.786014556884766, "global_step": 582843, "epoch": 7022} {"train_loss": -28.094404220581055, "global_step": 582844, "epoch": 7022} {"train_loss": -27.96590232849121, "global_step": 582845, "epoch": 7022} {"train_loss": -28.098539352416992, "global_step": 582846, "epoch": 7022} {"train_loss": -27.93408203125, "global_step": 582847, "epoch": 7022} {"train_loss": -28.08453941345215, "global_step": 582848, "epoch": 7022} {"train_loss": -28.105228424072266, "global_step": 582849, "epoch": 7022} {"train_loss": -27.613386154174805, "global_step": 582850, "epoch": 7022} {"train_loss": -27.987890243530273, "global_step": 582851, "epoch": 7022} {"train_loss": -28.086591720581055, "global_step": 582852, "epoch": 7022} {"train_loss": -28.254011154174805, "global_step": 582853, "epoch": 7022} {"train_loss": -28.042516708374023, "global_step": 582854, "epoch": 7022} {"train_loss": -28.118091583251953, "global_step": 582855, "epoch": 7022} {"train_loss": -27.55747413635254, "global_step": 582856, "epoch": 7022} {"train_loss": -28.081073760986328, "global_step": 582857, "epoch": 7022} {"train_loss": -27.83694839477539, "global_step": 582858, "epoch": 7022} {"train_loss": -28.284210205078125, "global_step": 582859, "epoch": 7022} {"train_loss": -28.221078872680664, "global_step": 582860, "epoch": 7022} {"train_loss": -27.808551788330078, "global_step": 582861, "epoch": 7022} {"train_loss": -27.311630249023438, "global_step": 582862, "epoch": 7022} {"train_loss": -27.030776977539062, "global_step": 582863, "epoch": 7022} {"train_loss": -27.64753532409668, "global_step": 582864, "epoch": 7022} {"train_loss": -27.444568634033203, "global_step": 582865, "epoch": 7022} {"train_loss": -27.635086059570312, "global_step": 582866, "epoch": 7022} {"train_loss": -27.40811538696289, "global_step": 582867, "epoch": 7022} {"train_loss": -27.338953018188477, "global_step": 582868, "epoch": 7022} {"train_loss": -27.60818862915039, "global_step": 582869, "epoch": 7022} {"train_loss": -27.40265464782715, "global_step": 582870, "epoch": 7022} {"train_loss": -27.578418731689453, "global_step": 582871, "epoch": 7022} {"train_loss": -27.794727325439453, "global_step": 582872, "epoch": 7022} {"train_loss": -27.50229835510254, "global_step": 582873, "epoch": 7022} {"train_loss": -28.27779197692871, "global_step": 582874, "epoch": 7022} {"train_loss": -27.44257926940918, "global_step": 582875, "epoch": 7022} {"train_loss": -27.69562339782715, "global_step": 582876, "epoch": 7022} {"train_loss": -27.70892906188965, "global_step": 582877, "epoch": 7022} {"train_loss": -27.801374435424805, "global_step": 582878, "epoch": 7022} {"train_loss": -27.92885398864746, "global_step": 582879, "epoch": 7022} {"train_loss": -27.916366577148438, "global_step": 582880, "epoch": 7022} {"train_loss": -27.667089462280273, "global_step": 582881, "epoch": 7022} {"train_loss": -28.2608699798584, "global_step": 582882, "epoch": 7022} {"train_loss": -28.28517723083496, "global_step": 582883, "epoch": 7022} {"train_loss": -27.796218872070312, "global_step": 582884, "epoch": 7022} {"train_loss": -27.691495895385742, "global_step": 582885, "epoch": 7022} {"train_loss": -28.162023544311523, "global_step": 582886, "epoch": 7022} {"train_loss": -27.9049072265625, "global_step": 582887, "epoch": 7022} {"train_loss": -27.685773849487305, "global_step": 582888, "epoch": 7022} {"train_loss": -28.025360107421875, "global_step": 582889, "epoch": 7022} {"train_loss": -27.917648315429688, "global_step": 582890, "epoch": 7022} {"train_loss": -27.947473526000977, "global_step": 582891, "epoch": 7022} {"train_loss": -27.610462188720703, "global_step": 582892, "epoch": 7022} {"train_loss": -27.846729278564453, "global_step": 582893, "epoch": 7022} {"train_loss": -28.07770347595215, "global_step": 582894, "epoch": 7022} {"train_loss": -28.188720703125, "global_step": 582895, "epoch": 7022} {"train_loss": -27.640457153320312, "global_step": 582896, "epoch": 7022} {"train_loss": -28.041242599487305, "global_step": 582897, "epoch": 7022} {"train_loss": -28.00469970703125, "global_step": 582898, "epoch": 7022} {"train_loss": -28.05327796936035, "global_step": 582899, "epoch": 7022} {"train_loss": -28.38128662109375, "global_step": 582900, "epoch": 7022} {"train_loss": -28.13687515258789, "global_step": 582901, "epoch": 7022} {"train_loss": -28.729230880737305, "global_step": 582902, "epoch": 7022} {"train_loss": -27.951934814453125, "global_step": 582903, "epoch": 7022} {"train_loss": -28.042943954467773, "global_step": 582904, "epoch": 7022} {"train_loss": -27.806171417236328, "global_step": 582905, "epoch": 7022} {"train_loss": -27.679229736328125, "global_step": 582906, "epoch": 7022} {"train_loss": -27.950366973876953, "global_step": 582907, "epoch": 7022} {"train_loss": -27.848246999533778, "global_step": 582908, "epoch": 7022, "val_loss": 6807219.5} {"train_loss": -27.57329750061035, "global_step": 582909, "epoch": 7023} {"train_loss": -27.213520050048828, "global_step": 582910, "epoch": 7023} {"train_loss": -27.52070426940918, "global_step": 582911, "epoch": 7023} {"train_loss": -27.6180362701416, "global_step": 582912, "epoch": 7023} {"train_loss": -27.391525268554688, "global_step": 582913, "epoch": 7023} {"train_loss": -27.40511131286621, "global_step": 582914, "epoch": 7023} {"train_loss": -27.2614803314209, "global_step": 582915, "epoch": 7023} {"train_loss": -27.717206954956055, "global_step": 582916, "epoch": 7023} {"train_loss": -27.848133087158203, "global_step": 582917, "epoch": 7023} {"train_loss": -27.951955795288086, "global_step": 582918, "epoch": 7023} {"train_loss": -27.558130264282227, "global_step": 582919, "epoch": 7023} {"train_loss": -28.061603546142578, "global_step": 582920, "epoch": 7023} {"train_loss": -27.806659698486328, "global_step": 582921, "epoch": 7023} {"train_loss": -27.7111759185791, "global_step": 582922, "epoch": 7023} {"train_loss": -27.780012130737305, "global_step": 582923, "epoch": 7023} {"train_loss": -27.730777740478516, "global_step": 582924, "epoch": 7023} {"train_loss": -27.571807861328125, "global_step": 582925, "epoch": 7023} {"train_loss": -27.754140853881836, "global_step": 582926, "epoch": 7023} {"train_loss": -27.9467830657959, "global_step": 582927, "epoch": 7023} {"train_loss": -27.872465133666992, "global_step": 582928, "epoch": 7023} {"train_loss": -27.831390380859375, "global_step": 582929, "epoch": 7023} {"train_loss": -27.99627113342285, "global_step": 582930, "epoch": 7023} {"train_loss": -28.023794174194336, "global_step": 582931, "epoch": 7023} {"train_loss": -27.635116577148438, "global_step": 582932, "epoch": 7023} {"train_loss": -27.8990478515625, "global_step": 582933, "epoch": 7023} {"train_loss": -27.8448543548584, "global_step": 582934, "epoch": 7023} {"train_loss": -27.95855140686035, "global_step": 582935, "epoch": 7023} {"train_loss": -27.78730583190918, "global_step": 582936, "epoch": 7023} {"train_loss": -27.529123306274414, "global_step": 582937, "epoch": 7023} {"train_loss": -27.36395263671875, "global_step": 582938, "epoch": 7023} {"train_loss": -27.6916561126709, "global_step": 582939, "epoch": 7023} {"train_loss": -28.114124298095703, "global_step": 582940, "epoch": 7023} {"train_loss": -27.458831787109375, "global_step": 582941, "epoch": 7023} {"train_loss": -27.142515182495117, "global_step": 582942, "epoch": 7023} {"train_loss": -27.994586944580078, "global_step": 582943, "epoch": 7023} {"train_loss": -28.079111099243164, "global_step": 582944, "epoch": 7023} {"train_loss": -27.554859161376953, "global_step": 582945, "epoch": 7023} {"train_loss": -27.885908126831055, "global_step": 582946, "epoch": 7023} {"train_loss": -27.96430778503418, "global_step": 582947, "epoch": 7023} {"train_loss": -27.490650177001953, "global_step": 582948, "epoch": 7023} {"train_loss": -27.901121139526367, "global_step": 582949, "epoch": 7023} {"train_loss": -28.244245529174805, "global_step": 582950, "epoch": 7023} {"train_loss": -27.511249542236328, "global_step": 582951, "epoch": 7023} {"train_loss": -27.94331932067871, "global_step": 582952, "epoch": 7023} {"train_loss": -27.596338272094727, "global_step": 582953, "epoch": 7023} {"train_loss": -28.142364501953125, "global_step": 582954, "epoch": 7023} {"train_loss": -28.009449005126953, "global_step": 582955, "epoch": 7023} {"train_loss": -27.496938705444336, "global_step": 582956, "epoch": 7023} {"train_loss": -28.267744064331055, "global_step": 582957, "epoch": 7023} {"train_loss": -27.858545303344727, "global_step": 582958, "epoch": 7023} {"train_loss": -27.8176212310791, "global_step": 582959, "epoch": 7023} {"train_loss": -27.614233016967773, "global_step": 582960, "epoch": 7023} {"train_loss": -27.907642364501953, "global_step": 582961, "epoch": 7023} {"train_loss": -27.980321884155273, "global_step": 582962, "epoch": 7023} {"train_loss": -27.82632827758789, "global_step": 582963, "epoch": 7023} {"train_loss": -27.817855834960938, "global_step": 582964, "epoch": 7023} {"train_loss": -28.014394760131836, "global_step": 582965, "epoch": 7023} {"train_loss": -28.07598304748535, "global_step": 582966, "epoch": 7023} {"train_loss": -27.90936279296875, "global_step": 582967, "epoch": 7023} {"train_loss": -27.655914306640625, "global_step": 582968, "epoch": 7023} {"train_loss": -27.960168838500977, "global_step": 582969, "epoch": 7023} {"train_loss": -28.048120498657227, "global_step": 582970, "epoch": 7023} {"train_loss": -28.20513916015625, "global_step": 582971, "epoch": 7023} {"train_loss": -27.923095703125, "global_step": 582972, "epoch": 7023} {"train_loss": -27.862333297729492, "global_step": 582973, "epoch": 7023} {"train_loss": -28.12752342224121, "global_step": 582974, "epoch": 7023} {"train_loss": -27.914798736572266, "global_step": 582975, "epoch": 7023} {"train_loss": -27.918432235717773, "global_step": 582976, "epoch": 7023} {"train_loss": -27.79816246032715, "global_step": 582977, "epoch": 7023} {"train_loss": -28.176101684570312, "global_step": 582978, "epoch": 7023} {"train_loss": -28.01373863220215, "global_step": 582979, "epoch": 7023} {"train_loss": -27.96584129333496, "global_step": 582980, "epoch": 7023} {"train_loss": -28.099720001220703, "global_step": 582981, "epoch": 7023} {"train_loss": -28.020160675048828, "global_step": 582982, "epoch": 7023} {"train_loss": -28.038898468017578, "global_step": 582983, "epoch": 7023} {"train_loss": -27.838830947875977, "global_step": 582984, "epoch": 7023} {"train_loss": -28.134811401367188, "global_step": 582985, "epoch": 7023} {"train_loss": -27.56215476989746, "global_step": 582986, "epoch": 7023} {"train_loss": -28.00202751159668, "global_step": 582987, "epoch": 7023} {"train_loss": -28.198699951171875, "global_step": 582988, "epoch": 7023} {"train_loss": -27.83053970336914, "global_step": 582989, "epoch": 7023} {"train_loss": -28.03255271911621, "global_step": 582990, "epoch": 7023} {"train_loss": -27.835462639130743, "global_step": 582991, "epoch": 7023, "val_loss": 6703170.0} {"train_loss": -27.365522384643555, "global_step": 582992, "epoch": 7024} {"train_loss": -27.6623477935791, "global_step": 582993, "epoch": 7024} {"train_loss": -27.905120849609375, "global_step": 582994, "epoch": 7024} {"train_loss": -27.858606338500977, "global_step": 582995, "epoch": 7024} {"train_loss": -27.54828453063965, "global_step": 582996, "epoch": 7024} {"train_loss": -27.728208541870117, "global_step": 582997, "epoch": 7024} {"train_loss": -27.658309936523438, "global_step": 582998, "epoch": 7024} {"train_loss": -27.65297508239746, "global_step": 582999, "epoch": 7024} {"train_loss": -27.52385902404785, "global_step": 583000, "epoch": 7024} {"train_loss": -27.92262077331543, "global_step": 583001, "epoch": 7024} {"train_loss": -27.774194717407227, "global_step": 583002, "epoch": 7024} {"train_loss": -27.786685943603516, "global_step": 583003, "epoch": 7024} {"train_loss": -27.967199325561523, "global_step": 583004, "epoch": 7024} {"train_loss": -28.046369552612305, "global_step": 583005, "epoch": 7024} {"train_loss": -27.87745475769043, "global_step": 583006, "epoch": 7024} {"train_loss": -27.854318618774414, "global_step": 583007, "epoch": 7024} {"train_loss": -27.8122501373291, "global_step": 583008, "epoch": 7024} {"train_loss": -27.904144287109375, "global_step": 583009, "epoch": 7024} {"train_loss": -27.6391658782959, "global_step": 583010, "epoch": 7024} {"train_loss": -28.08890724182129, "global_step": 583011, "epoch": 7024} {"train_loss": -27.92876625061035, "global_step": 583012, "epoch": 7024} {"train_loss": -27.9215087890625, "global_step": 583013, "epoch": 7024} {"train_loss": -27.656381607055664, "global_step": 583014, "epoch": 7024} {"train_loss": -27.989343643188477, "global_step": 583015, "epoch": 7024} {"train_loss": -28.148725509643555, "global_step": 583016, "epoch": 7024} {"train_loss": -28.000654220581055, "global_step": 583017, "epoch": 7024} {"train_loss": -28.122055053710938, "global_step": 583018, "epoch": 7024} {"train_loss": -28.20282554626465, "global_step": 583019, "epoch": 7024} {"train_loss": -28.134552001953125, "global_step": 583020, "epoch": 7024} {"train_loss": -27.481245040893555, "global_step": 583021, "epoch": 7024} {"train_loss": -27.840845108032227, "global_step": 583022, "epoch": 7024} {"train_loss": -28.0361270904541, "global_step": 583023, "epoch": 7024} {"train_loss": -27.912872314453125, "global_step": 583024, "epoch": 7024} {"train_loss": -28.043851852416992, "global_step": 583025, "epoch": 7024} {"train_loss": -28.109603881835938, "global_step": 583026, "epoch": 7024} {"train_loss": -27.83368492126465, "global_step": 583027, "epoch": 7024} {"train_loss": -28.0104923248291, "global_step": 583028, "epoch": 7024} {"train_loss": -28.010385513305664, "global_step": 583029, "epoch": 7024} {"train_loss": -28.179227828979492, "global_step": 583030, "epoch": 7024} {"train_loss": -28.0967960357666, "global_step": 583031, "epoch": 7024} {"train_loss": -27.86518669128418, "global_step": 583032, "epoch": 7024} {"train_loss": -27.50465202331543, "global_step": 583033, "epoch": 7024} {"train_loss": -27.924213409423828, "global_step": 583034, "epoch": 7024} {"train_loss": -28.008270263671875, "global_step": 583035, "epoch": 7024} {"train_loss": -28.1357479095459, "global_step": 583036, "epoch": 7024} {"train_loss": -27.955488204956055, "global_step": 583037, "epoch": 7024} {"train_loss": -27.501020431518555, "global_step": 583038, "epoch": 7024} {"train_loss": -27.752878189086914, "global_step": 583039, "epoch": 7024} {"train_loss": -27.8144474029541, "global_step": 583040, "epoch": 7024} {"train_loss": -27.941389083862305, "global_step": 583041, "epoch": 7024} {"train_loss": -28.08151626586914, "global_step": 583042, "epoch": 7024} {"train_loss": -28.210744857788086, "global_step": 583043, "epoch": 7024} {"train_loss": -28.227008819580078, "global_step": 583044, "epoch": 7024} {"train_loss": -28.285802841186523, "global_step": 583045, "epoch": 7024} {"train_loss": -28.229597091674805, "global_step": 583046, "epoch": 7024} {"train_loss": -28.23736572265625, "global_step": 583047, "epoch": 7024} {"train_loss": -27.980276107788086, "global_step": 583048, "epoch": 7024} {"train_loss": -28.016193389892578, "global_step": 583049, "epoch": 7024} {"train_loss": -28.144506454467773, "global_step": 583050, "epoch": 7024} {"train_loss": -27.8785457611084, "global_step": 583051, "epoch": 7024} {"train_loss": -28.021732330322266, "global_step": 583052, "epoch": 7024} {"train_loss": -28.391162872314453, "global_step": 583053, "epoch": 7024} {"train_loss": -28.037424087524414, "global_step": 583054, "epoch": 7024} {"train_loss": -27.94325065612793, "global_step": 583055, "epoch": 7024} {"train_loss": -27.56458854675293, "global_step": 583056, "epoch": 7024} {"train_loss": -27.30966567993164, "global_step": 583057, "epoch": 7024} {"train_loss": -26.7165584564209, "global_step": 583058, "epoch": 7024} {"train_loss": -27.4500732421875, "global_step": 583059, "epoch": 7024} {"train_loss": -28.033750534057617, "global_step": 583060, "epoch": 7024} {"train_loss": -27.368988037109375, "global_step": 583061, "epoch": 7024} {"train_loss": -27.94758415222168, "global_step": 583062, "epoch": 7024} {"train_loss": -27.73878288269043, "global_step": 583063, "epoch": 7024} {"train_loss": -27.569250106811523, "global_step": 583064, "epoch": 7024} {"train_loss": -27.659570693969727, "global_step": 583065, "epoch": 7024} {"train_loss": -27.55120277404785, "global_step": 583066, "epoch": 7024} {"train_loss": -27.687177658081055, "global_step": 583067, "epoch": 7024} {"train_loss": -27.472848892211914, "global_step": 583068, "epoch": 7024} {"train_loss": -27.510150909423828, "global_step": 583069, "epoch": 7024} {"train_loss": -27.364728927612305, "global_step": 583070, "epoch": 7024} {"train_loss": -27.70589256286621, "global_step": 583071, "epoch": 7024} {"train_loss": -27.7050838470459, "global_step": 583072, "epoch": 7024} {"train_loss": -27.652746200561523, "global_step": 583073, "epoch": 7024} {"train_loss": -27.846303710018297, "global_step": 583074, "epoch": 7024, "val_loss": 6760727.0} {"train_loss": -27.24036979675293, "global_step": 583075, "epoch": 7025} {"train_loss": -27.28086280822754, "global_step": 583076, "epoch": 7025} {"train_loss": -26.78689956665039, "global_step": 583077, "epoch": 7025} {"train_loss": -27.295209884643555, "global_step": 583078, "epoch": 7025} {"train_loss": -26.864093780517578, "global_step": 583079, "epoch": 7025} {"train_loss": -27.878620147705078, "global_step": 583080, "epoch": 7025} {"train_loss": -27.085697174072266, "global_step": 583081, "epoch": 7025} {"train_loss": -26.9508113861084, "global_step": 583082, "epoch": 7025} {"train_loss": -27.146102905273438, "global_step": 583083, "epoch": 7025} {"train_loss": -27.286279678344727, "global_step": 583084, "epoch": 7025} {"train_loss": -27.083271026611328, "global_step": 583085, "epoch": 7025} {"train_loss": -27.875904083251953, "global_step": 583086, "epoch": 7025} {"train_loss": -27.420934677124023, "global_step": 583087, "epoch": 7025} {"train_loss": -27.28582191467285, "global_step": 583088, "epoch": 7025} {"train_loss": -27.510711669921875, "global_step": 583089, "epoch": 7025} {"train_loss": -27.625478744506836, "global_step": 583090, "epoch": 7025} {"train_loss": -27.591150283813477, "global_step": 583091, "epoch": 7025} {"train_loss": -27.526941299438477, "global_step": 583092, "epoch": 7025} {"train_loss": -27.1459903717041, "global_step": 583093, "epoch": 7025} {"train_loss": -27.4665584564209, "global_step": 583094, "epoch": 7025} {"train_loss": -27.4090518951416, "global_step": 583095, "epoch": 7025} {"train_loss": -27.67421531677246, "global_step": 583096, "epoch": 7025} {"train_loss": -27.992074966430664, "global_step": 583097, "epoch": 7025} {"train_loss": -27.62784194946289, "global_step": 583098, "epoch": 7025} {"train_loss": -28.144437789916992, "global_step": 583099, "epoch": 7025} {"train_loss": -27.96990394592285, "global_step": 583100, "epoch": 7025} {"train_loss": -28.100067138671875, "global_step": 583101, "epoch": 7025} {"train_loss": -27.722137451171875, "global_step": 583102, "epoch": 7025} {"train_loss": -28.01812171936035, "global_step": 583103, "epoch": 7025} {"train_loss": -27.973119735717773, "global_step": 583104, "epoch": 7025} {"train_loss": -27.90509033203125, "global_step": 583105, "epoch": 7025} {"train_loss": -27.87544822692871, "global_step": 583106, "epoch": 7025} {"train_loss": -27.437482833862305, "global_step": 583107, "epoch": 7025} {"train_loss": -28.134674072265625, "global_step": 583108, "epoch": 7025} {"train_loss": -28.187488555908203, "global_step": 583109, "epoch": 7025} {"train_loss": -27.693836212158203, "global_step": 583110, "epoch": 7025} {"train_loss": -27.92376136779785, "global_step": 583111, "epoch": 7025} {"train_loss": -27.528547286987305, "global_step": 583112, "epoch": 7025} {"train_loss": -27.874670028686523, "global_step": 583113, "epoch": 7025} {"train_loss": -28.068180084228516, "global_step": 583114, "epoch": 7025} {"train_loss": -28.406387329101562, "global_step": 583115, "epoch": 7025} {"train_loss": -27.798873901367188, "global_step": 583116, "epoch": 7025} {"train_loss": -27.767578125, "global_step": 583117, "epoch": 7025} {"train_loss": -28.115345001220703, "global_step": 583118, "epoch": 7025} {"train_loss": -28.201831817626953, "global_step": 583119, "epoch": 7025} {"train_loss": -28.27986717224121, "global_step": 583120, "epoch": 7025} {"train_loss": -28.028244018554688, "global_step": 583121, "epoch": 7025} {"train_loss": -28.082677841186523, "global_step": 583122, "epoch": 7025} {"train_loss": -28.284271240234375, "global_step": 583123, "epoch": 7025} {"train_loss": -28.158803939819336, "global_step": 583124, "epoch": 7025} {"train_loss": -28.330175399780273, "global_step": 583125, "epoch": 7025} {"train_loss": -27.986806869506836, "global_step": 583126, "epoch": 7025} {"train_loss": -28.370025634765625, "global_step": 583127, "epoch": 7025} {"train_loss": -27.864553451538086, "global_step": 583128, "epoch": 7025} {"train_loss": -28.279041290283203, "global_step": 583129, "epoch": 7025} {"train_loss": -28.421445846557617, "global_step": 583130, "epoch": 7025} {"train_loss": -28.291101455688477, "global_step": 583131, "epoch": 7025} {"train_loss": -27.739294052124023, "global_step": 583132, "epoch": 7025} {"train_loss": -27.66446304321289, "global_step": 583133, "epoch": 7025} {"train_loss": -27.575326919555664, "global_step": 583134, "epoch": 7025} {"train_loss": -28.08552360534668, "global_step": 583135, "epoch": 7025} {"train_loss": -27.939777374267578, "global_step": 583136, "epoch": 7025} {"train_loss": -27.913740158081055, "global_step": 583137, "epoch": 7025} {"train_loss": -28.60215187072754, "global_step": 583138, "epoch": 7025} {"train_loss": -27.995859146118164, "global_step": 583139, "epoch": 7025} {"train_loss": -28.093719482421875, "global_step": 583140, "epoch": 7025} {"train_loss": -27.839984893798828, "global_step": 583141, "epoch": 7025} {"train_loss": -28.06914710998535, "global_step": 583142, "epoch": 7025} {"train_loss": -28.174474716186523, "global_step": 583143, "epoch": 7025} {"train_loss": -28.054401397705078, "global_step": 583144, "epoch": 7025} {"train_loss": -28.056949615478516, "global_step": 583145, "epoch": 7025} {"train_loss": -27.793899536132812, "global_step": 583146, "epoch": 7025} {"train_loss": -28.170103073120117, "global_step": 583147, "epoch": 7025} {"train_loss": -28.208032608032227, "global_step": 583148, "epoch": 7025} {"train_loss": -27.841657638549805, "global_step": 583149, "epoch": 7025} {"train_loss": -28.162811279296875, "global_step": 583150, "epoch": 7025} {"train_loss": -28.055408477783203, "global_step": 583151, "epoch": 7025} {"train_loss": -27.981332778930664, "global_step": 583152, "epoch": 7025} {"train_loss": -27.923254013061523, "global_step": 583153, "epoch": 7025} {"train_loss": -28.014352798461914, "global_step": 583154, "epoch": 7025} {"train_loss": -27.622150421142578, "global_step": 583155, "epoch": 7025} {"train_loss": -28.008710861206055, "global_step": 583156, "epoch": 7025} {"train_loss": -27.828366911554912, "global_step": 583157, "epoch": 7025, "val_loss": 6693752.0} {"train_loss": -27.995656967163086, "global_step": 583158, "epoch": 7026} {"train_loss": -27.60304832458496, "global_step": 583159, "epoch": 7026} {"train_loss": -27.323307037353516, "global_step": 583160, "epoch": 7026} {"train_loss": -27.344968795776367, "global_step": 583161, "epoch": 7026} {"train_loss": -27.755720138549805, "global_step": 583162, "epoch": 7026} {"train_loss": -27.188934326171875, "global_step": 583163, "epoch": 7026} {"train_loss": -27.605850219726562, "global_step": 583164, "epoch": 7026} {"train_loss": -27.732257843017578, "global_step": 583165, "epoch": 7026} {"train_loss": -27.735036849975586, "global_step": 583166, "epoch": 7026} {"train_loss": -27.86240577697754, "global_step": 583167, "epoch": 7026} {"train_loss": -27.380035400390625, "global_step": 583168, "epoch": 7026} {"train_loss": -27.73262596130371, "global_step": 583169, "epoch": 7026} {"train_loss": -27.91988182067871, "global_step": 583170, "epoch": 7026} {"train_loss": -28.043806076049805, "global_step": 583171, "epoch": 7026} {"train_loss": -27.850677490234375, "global_step": 583172, "epoch": 7026} {"train_loss": -27.884845733642578, "global_step": 583173, "epoch": 7026} {"train_loss": -27.773685455322266, "global_step": 583174, "epoch": 7026} {"train_loss": -28.013586044311523, "global_step": 583175, "epoch": 7026} {"train_loss": -27.860143661499023, "global_step": 583176, "epoch": 7026} {"train_loss": -27.777759552001953, "global_step": 583177, "epoch": 7026} {"train_loss": -27.96832275390625, "global_step": 583178, "epoch": 7026} {"train_loss": -28.0502986907959, "global_step": 583179, "epoch": 7026} {"train_loss": -27.76128578186035, "global_step": 583180, "epoch": 7026} {"train_loss": -27.856826782226562, "global_step": 583181, "epoch": 7026} {"train_loss": -27.84793472290039, "global_step": 583182, "epoch": 7026} {"train_loss": -27.692890167236328, "global_step": 583183, "epoch": 7026} {"train_loss": -27.586896896362305, "global_step": 583184, "epoch": 7026} {"train_loss": -27.87627601623535, "global_step": 583185, "epoch": 7026} {"train_loss": -27.942670822143555, "global_step": 583186, "epoch": 7026} {"train_loss": -27.669403076171875, "global_step": 583187, "epoch": 7026} {"train_loss": -27.50813865661621, "global_step": 583188, "epoch": 7026} {"train_loss": -28.25478172302246, "global_step": 583189, "epoch": 7026} {"train_loss": -27.867902755737305, "global_step": 583190, "epoch": 7026} {"train_loss": -27.97649574279785, "global_step": 583191, "epoch": 7026} {"train_loss": -28.270254135131836, "global_step": 583192, "epoch": 7026} {"train_loss": -28.03949546813965, "global_step": 583193, "epoch": 7026} {"train_loss": -28.191308975219727, "global_step": 583194, "epoch": 7026} {"train_loss": -28.023473739624023, "global_step": 583195, "epoch": 7026} {"train_loss": -28.015960693359375, "global_step": 583196, "epoch": 7026} {"train_loss": -27.736974716186523, "global_step": 583197, "epoch": 7026} {"train_loss": -27.76435661315918, "global_step": 583198, "epoch": 7026} {"train_loss": -28.00223159790039, "global_step": 583199, "epoch": 7026} {"train_loss": -28.21526527404785, "global_step": 583200, "epoch": 7026} {"train_loss": -27.764118194580078, "global_step": 583201, "epoch": 7026} {"train_loss": -28.234228134155273, "global_step": 583202, "epoch": 7026} {"train_loss": -27.96051597595215, "global_step": 583203, "epoch": 7026} {"train_loss": -27.974695205688477, "global_step": 583204, "epoch": 7026} {"train_loss": -28.01555824279785, "global_step": 583205, "epoch": 7026} {"train_loss": -28.17673110961914, "global_step": 583206, "epoch": 7026} {"train_loss": -27.840219497680664, "global_step": 583207, "epoch": 7026} {"train_loss": -28.270544052124023, "global_step": 583208, "epoch": 7026} {"train_loss": -28.313196182250977, "global_step": 583209, "epoch": 7026} {"train_loss": -28.013639450073242, "global_step": 583210, "epoch": 7026} {"train_loss": -27.9043025970459, "global_step": 583211, "epoch": 7026} {"train_loss": -28.01070213317871, "global_step": 583212, "epoch": 7026} {"train_loss": -28.065399169921875, "global_step": 583213, "epoch": 7026} {"train_loss": -28.068708419799805, "global_step": 583214, "epoch": 7026} {"train_loss": -28.52155876159668, "global_step": 583215, "epoch": 7026} {"train_loss": -28.197324752807617, "global_step": 583216, "epoch": 7026} {"train_loss": -27.98530387878418, "global_step": 583217, "epoch": 7026} {"train_loss": -27.972305297851562, "global_step": 583218, "epoch": 7026} {"train_loss": -28.000173568725586, "global_step": 583219, "epoch": 7026} {"train_loss": -28.024932861328125, "global_step": 583220, "epoch": 7026} {"train_loss": -27.753040313720703, "global_step": 583221, "epoch": 7026} {"train_loss": -27.796995162963867, "global_step": 583222, "epoch": 7026} {"train_loss": -28.337787628173828, "global_step": 583223, "epoch": 7026} {"train_loss": -27.823856353759766, "global_step": 583224, "epoch": 7026} {"train_loss": -27.892658233642578, "global_step": 583225, "epoch": 7026} {"train_loss": -28.157861709594727, "global_step": 583226, "epoch": 7026} {"train_loss": -27.673948287963867, "global_step": 583227, "epoch": 7026} {"train_loss": -27.5926456451416, "global_step": 583228, "epoch": 7026} {"train_loss": -27.62965965270996, "global_step": 583229, "epoch": 7026} {"train_loss": -27.966114044189453, "global_step": 583230, "epoch": 7026} {"train_loss": -27.650619506835938, "global_step": 583231, "epoch": 7026} {"train_loss": -28.2171573638916, "global_step": 583232, "epoch": 7026} {"train_loss": -27.627965927124023, "global_step": 583233, "epoch": 7026} {"train_loss": -28.103927612304688, "global_step": 583234, "epoch": 7026} {"train_loss": -27.622732162475586, "global_step": 583235, "epoch": 7026} {"train_loss": -28.210193634033203, "global_step": 583236, "epoch": 7026} {"train_loss": -27.96245765686035, "global_step": 583237, "epoch": 7026} {"train_loss": -27.998075485229492, "global_step": 583238, "epoch": 7026} {"train_loss": -27.97700309753418, "global_step": 583239, "epoch": 7026} {"train_loss": -27.89589339566518, "global_step": 583240, "epoch": 7026, "val_loss": 6742514.5} {"train_loss": -27.694456100463867, "global_step": 583241, "epoch": 7027} {"train_loss": -27.527135848999023, "global_step": 583242, "epoch": 7027} {"train_loss": -27.314014434814453, "global_step": 583243, "epoch": 7027} {"train_loss": -27.51308250427246, "global_step": 583244, "epoch": 7027} {"train_loss": -27.499059677124023, "global_step": 583245, "epoch": 7027} {"train_loss": -27.810806274414062, "global_step": 583246, "epoch": 7027} {"train_loss": -27.582263946533203, "global_step": 583247, "epoch": 7027} {"train_loss": -27.447437286376953, "global_step": 583248, "epoch": 7027} {"train_loss": -27.552021026611328, "global_step": 583249, "epoch": 7027} {"train_loss": -27.84116554260254, "global_step": 583250, "epoch": 7027} {"train_loss": -27.48138999938965, "global_step": 583251, "epoch": 7027} {"train_loss": -27.66828727722168, "global_step": 583252, "epoch": 7027} {"train_loss": -27.901493072509766, "global_step": 583253, "epoch": 7027} {"train_loss": -27.93300437927246, "global_step": 583254, "epoch": 7027} {"train_loss": -27.620502471923828, "global_step": 583255, "epoch": 7027} {"train_loss": -27.64680290222168, "global_step": 583256, "epoch": 7027} {"train_loss": -27.374555587768555, "global_step": 583257, "epoch": 7027} {"train_loss": -27.968420028686523, "global_step": 583258, "epoch": 7027} {"train_loss": -27.560285568237305, "global_step": 583259, "epoch": 7027} {"train_loss": -27.552688598632812, "global_step": 583260, "epoch": 7027} {"train_loss": -28.102981567382812, "global_step": 583261, "epoch": 7027} {"train_loss": -28.036090850830078, "global_step": 583262, "epoch": 7027} {"train_loss": -27.986907958984375, "global_step": 583263, "epoch": 7027} {"train_loss": -27.65155601501465, "global_step": 583264, "epoch": 7027} {"train_loss": -27.77510643005371, "global_step": 583265, "epoch": 7027} {"train_loss": -27.758747100830078, "global_step": 583266, "epoch": 7027} {"train_loss": -28.045501708984375, "global_step": 583267, "epoch": 7027} {"train_loss": -27.654281616210938, "global_step": 583268, "epoch": 7027} {"train_loss": -27.869354248046875, "global_step": 583269, "epoch": 7027} {"train_loss": -28.006628036499023, "global_step": 583270, "epoch": 7027} {"train_loss": -27.91107177734375, "global_step": 583271, "epoch": 7027} {"train_loss": -27.805444717407227, "global_step": 583272, "epoch": 7027} {"train_loss": -27.710437774658203, "global_step": 583273, "epoch": 7027} {"train_loss": -27.820096969604492, "global_step": 583274, "epoch": 7027} {"train_loss": -28.08466148376465, "global_step": 583275, "epoch": 7027} {"train_loss": -28.362262725830078, "global_step": 583276, "epoch": 7027} {"train_loss": -27.92987632751465, "global_step": 583277, "epoch": 7027} {"train_loss": -28.208227157592773, "global_step": 583278, "epoch": 7027} {"train_loss": -28.35780143737793, "global_step": 583279, "epoch": 7027} {"train_loss": -28.212759017944336, "global_step": 583280, "epoch": 7027} {"train_loss": -28.152624130249023, "global_step": 583281, "epoch": 7027} {"train_loss": -28.40871238708496, "global_step": 583282, "epoch": 7027} {"train_loss": -28.093847274780273, "global_step": 583283, "epoch": 7027} {"train_loss": -28.290424346923828, "global_step": 583284, "epoch": 7027} {"train_loss": -28.11466407775879, "global_step": 583285, "epoch": 7027} {"train_loss": -28.128406524658203, "global_step": 583286, "epoch": 7027} {"train_loss": -27.665451049804688, "global_step": 583287, "epoch": 7027} {"train_loss": -27.883214950561523, "global_step": 583288, "epoch": 7027} {"train_loss": -27.999937057495117, "global_step": 583289, "epoch": 7027} {"train_loss": -27.880338668823242, "global_step": 583290, "epoch": 7027} {"train_loss": -27.9342041015625, "global_step": 583291, "epoch": 7027} {"train_loss": -27.779621124267578, "global_step": 583292, "epoch": 7027} {"train_loss": -28.368122100830078, "global_step": 583293, "epoch": 7027} {"train_loss": -28.025415420532227, "global_step": 583294, "epoch": 7027} {"train_loss": -27.964277267456055, "global_step": 583295, "epoch": 7027} {"train_loss": -27.91556739807129, "global_step": 583296, "epoch": 7027} {"train_loss": -28.23542594909668, "global_step": 583297, "epoch": 7027} {"train_loss": -28.216684341430664, "global_step": 583298, "epoch": 7027} {"train_loss": -28.056257247924805, "global_step": 583299, "epoch": 7027} {"train_loss": -28.356916427612305, "global_step": 583300, "epoch": 7027} {"train_loss": -28.281909942626953, "global_step": 583301, "epoch": 7027} {"train_loss": -27.977636337280273, "global_step": 583302, "epoch": 7027} {"train_loss": -28.0295467376709, "global_step": 583303, "epoch": 7027} {"train_loss": -28.0279598236084, "global_step": 583304, "epoch": 7027} {"train_loss": -28.04914665222168, "global_step": 583305, "epoch": 7027} {"train_loss": -27.894367218017578, "global_step": 583306, "epoch": 7027} {"train_loss": -28.21364402770996, "global_step": 583307, "epoch": 7027} {"train_loss": -28.175302505493164, "global_step": 583308, "epoch": 7027} {"train_loss": -28.022451400756836, "global_step": 583309, "epoch": 7027} {"train_loss": -28.00662612915039, "global_step": 583310, "epoch": 7027} {"train_loss": -28.018442153930664, "global_step": 583311, "epoch": 7027} {"train_loss": -28.32464027404785, "global_step": 583312, "epoch": 7027} {"train_loss": -28.160358428955078, "global_step": 583313, "epoch": 7027} {"train_loss": -27.604333877563477, "global_step": 583314, "epoch": 7027} {"train_loss": -27.732690811157227, "global_step": 583315, "epoch": 7027} {"train_loss": -27.455188751220703, "global_step": 583316, "epoch": 7027} {"train_loss": -27.860137939453125, "global_step": 583317, "epoch": 7027} {"train_loss": -27.640295028686523, "global_step": 583318, "epoch": 7027} {"train_loss": -27.351593017578125, "global_step": 583319, "epoch": 7027} {"train_loss": -28.018529891967773, "global_step": 583320, "epoch": 7027} {"train_loss": -28.004714965820312, "global_step": 583321, "epoch": 7027} {"train_loss": -28.2075252532959, "global_step": 583322, "epoch": 7027} {"train_loss": -27.914469546582325, "global_step": 583323, "epoch": 7027, "val_loss": 6696818.0} {"train_loss": -27.58506202697754, "global_step": 583324, "epoch": 7028} {"train_loss": -27.168554306030273, "global_step": 583325, "epoch": 7028} {"train_loss": -27.566694259643555, "global_step": 583326, "epoch": 7028} {"train_loss": -27.159164428710938, "global_step": 583327, "epoch": 7028} {"train_loss": -27.258270263671875, "global_step": 583328, "epoch": 7028} {"train_loss": -27.331558227539062, "global_step": 583329, "epoch": 7028} {"train_loss": -26.783456802368164, "global_step": 583330, "epoch": 7028} {"train_loss": -27.210458755493164, "global_step": 583331, "epoch": 7028} {"train_loss": -26.994901657104492, "global_step": 583332, "epoch": 7028} {"train_loss": -27.795703887939453, "global_step": 583333, "epoch": 7028} {"train_loss": -27.215972900390625, "global_step": 583334, "epoch": 7028} {"train_loss": -27.532958984375, "global_step": 583335, "epoch": 7028} {"train_loss": -27.39803123474121, "global_step": 583336, "epoch": 7028} {"train_loss": -27.216665267944336, "global_step": 583337, "epoch": 7028} {"train_loss": -27.721393585205078, "global_step": 583338, "epoch": 7028} {"train_loss": -27.375085830688477, "global_step": 583339, "epoch": 7028} {"train_loss": -26.737401962280273, "global_step": 583340, "epoch": 7028} {"train_loss": -27.782180786132812, "global_step": 583341, "epoch": 7028} {"train_loss": -27.067901611328125, "global_step": 583342, "epoch": 7028} {"train_loss": -27.477558135986328, "global_step": 583343, "epoch": 7028} {"train_loss": -27.670852661132812, "global_step": 583344, "epoch": 7028} {"train_loss": -27.187009811401367, "global_step": 583345, "epoch": 7028} {"train_loss": -27.195566177368164, "global_step": 583346, "epoch": 7028} {"train_loss": -27.8356876373291, "global_step": 583347, "epoch": 7028} {"train_loss": -27.28449058532715, "global_step": 583348, "epoch": 7028} {"train_loss": -27.870344161987305, "global_step": 583349, "epoch": 7028} {"train_loss": -27.12224769592285, "global_step": 583350, "epoch": 7028} {"train_loss": -27.787067413330078, "global_step": 583351, "epoch": 7028} {"train_loss": -27.99592399597168, "global_step": 583352, "epoch": 7028} {"train_loss": -27.500085830688477, "global_step": 583353, "epoch": 7028} {"train_loss": -27.815107345581055, "global_step": 583354, "epoch": 7028} {"train_loss": -27.560373306274414, "global_step": 583355, "epoch": 7028} {"train_loss": -27.7243595123291, "global_step": 583356, "epoch": 7028} {"train_loss": -27.451730728149414, "global_step": 583357, "epoch": 7028} {"train_loss": -27.835529327392578, "global_step": 583358, "epoch": 7028} {"train_loss": -27.623584747314453, "global_step": 583359, "epoch": 7028} {"train_loss": -27.32122230529785, "global_step": 583360, "epoch": 7028} {"train_loss": -27.9927921295166, "global_step": 583361, "epoch": 7028} {"train_loss": -27.793781280517578, "global_step": 583362, "epoch": 7028} {"train_loss": -27.677509307861328, "global_step": 583363, "epoch": 7028} {"train_loss": -27.673307418823242, "global_step": 583364, "epoch": 7028} {"train_loss": -28.114990234375, "global_step": 583365, "epoch": 7028} {"train_loss": -27.838897705078125, "global_step": 583366, "epoch": 7028} {"train_loss": -27.96734619140625, "global_step": 583367, "epoch": 7028} {"train_loss": -27.952072143554688, "global_step": 583368, "epoch": 7028} {"train_loss": -27.763391494750977, "global_step": 583369, "epoch": 7028} {"train_loss": -27.791364669799805, "global_step": 583370, "epoch": 7028} {"train_loss": -28.039459228515625, "global_step": 583371, "epoch": 7028} {"train_loss": -28.049718856811523, "global_step": 583372, "epoch": 7028} {"train_loss": -28.0648136138916, "global_step": 583373, "epoch": 7028} {"train_loss": -27.696762084960938, "global_step": 583374, "epoch": 7028} {"train_loss": -28.04976463317871, "global_step": 583375, "epoch": 7028} {"train_loss": -27.855161666870117, "global_step": 583376, "epoch": 7028} {"train_loss": -27.86696434020996, "global_step": 583377, "epoch": 7028} {"train_loss": -28.48179054260254, "global_step": 583378, "epoch": 7028} {"train_loss": -27.664691925048828, "global_step": 583379, "epoch": 7028} {"train_loss": -28.356494903564453, "global_step": 583380, "epoch": 7028} {"train_loss": -27.522069931030273, "global_step": 583381, "epoch": 7028} {"train_loss": -28.00067710876465, "global_step": 583382, "epoch": 7028} {"train_loss": -27.97490882873535, "global_step": 583383, "epoch": 7028} {"train_loss": -28.132801055908203, "global_step": 583384, "epoch": 7028} {"train_loss": -27.961057662963867, "global_step": 583385, "epoch": 7028} {"train_loss": -28.26776695251465, "global_step": 583386, "epoch": 7028} {"train_loss": -27.921649932861328, "global_step": 583387, "epoch": 7028} {"train_loss": -28.356840133666992, "global_step": 583388, "epoch": 7028} {"train_loss": -27.65400505065918, "global_step": 583389, "epoch": 7028} {"train_loss": -27.889297485351562, "global_step": 583390, "epoch": 7028} {"train_loss": -27.772552490234375, "global_step": 583391, "epoch": 7028} {"train_loss": -27.916101455688477, "global_step": 583392, "epoch": 7028} {"train_loss": -27.798755645751953, "global_step": 583393, "epoch": 7028} {"train_loss": -28.09097671508789, "global_step": 583394, "epoch": 7028} {"train_loss": -28.209182739257812, "global_step": 583395, "epoch": 7028} {"train_loss": -27.88994789123535, "global_step": 583396, "epoch": 7028} {"train_loss": -27.850622177124023, "global_step": 583397, "epoch": 7028} {"train_loss": -27.5490779876709, "global_step": 583398, "epoch": 7028} {"train_loss": -28.126495361328125, "global_step": 583399, "epoch": 7028} {"train_loss": -27.898889541625977, "global_step": 583400, "epoch": 7028} {"train_loss": -27.786483764648438, "global_step": 583401, "epoch": 7028} {"train_loss": -28.07208824157715, "global_step": 583402, "epoch": 7028} {"train_loss": -28.076623916625977, "global_step": 583403, "epoch": 7028} {"train_loss": -27.838693618774414, "global_step": 583404, "epoch": 7028} {"train_loss": -28.00322914123535, "global_step": 583405, "epoch": 7028} {"train_loss": -27.715736779821924, "global_step": 583406, "epoch": 7028, "val_loss": 6686416.0} {"train_loss": -27.757938385009766, "global_step": 583407, "epoch": 7029} {"train_loss": -27.189136505126953, "global_step": 583408, "epoch": 7029} {"train_loss": -26.79054069519043, "global_step": 583409, "epoch": 7029} {"train_loss": -27.174991607666016, "global_step": 583410, "epoch": 7029} {"train_loss": -27.234527587890625, "global_step": 583411, "epoch": 7029} {"train_loss": -27.727283477783203, "global_step": 583412, "epoch": 7029} {"train_loss": -27.102630615234375, "global_step": 583413, "epoch": 7029} {"train_loss": -27.274341583251953, "global_step": 583414, "epoch": 7029} {"train_loss": -27.235870361328125, "global_step": 583415, "epoch": 7029} {"train_loss": -27.456266403198242, "global_step": 583416, "epoch": 7029} {"train_loss": -27.738996505737305, "global_step": 583417, "epoch": 7029} {"train_loss": -27.495691299438477, "global_step": 583418, "epoch": 7029} {"train_loss": -27.65576171875, "global_step": 583419, "epoch": 7029} {"train_loss": -27.515756607055664, "global_step": 583420, "epoch": 7029} {"train_loss": -27.813684463500977, "global_step": 583421, "epoch": 7029} {"train_loss": -27.739459991455078, "global_step": 583422, "epoch": 7029} {"train_loss": -27.84107780456543, "global_step": 583423, "epoch": 7029} {"train_loss": -27.661890029907227, "global_step": 583424, "epoch": 7029} {"train_loss": -27.36212158203125, "global_step": 583425, "epoch": 7029} {"train_loss": -28.093830108642578, "global_step": 583426, "epoch": 7029} {"train_loss": -27.74604606628418, "global_step": 583427, "epoch": 7029} {"train_loss": -28.21845054626465, "global_step": 583428, "epoch": 7029} {"train_loss": -27.868301391601562, "global_step": 583429, "epoch": 7029} {"train_loss": -28.155059814453125, "global_step": 583430, "epoch": 7029} {"train_loss": -27.852262496948242, "global_step": 583431, "epoch": 7029} {"train_loss": -27.9169921875, "global_step": 583432, "epoch": 7029} {"train_loss": -27.976184844970703, "global_step": 583433, "epoch": 7029} {"train_loss": -27.856552124023438, "global_step": 583434, "epoch": 7029} {"train_loss": -27.977781295776367, "global_step": 583435, "epoch": 7029} {"train_loss": -27.865888595581055, "global_step": 583436, "epoch": 7029} {"train_loss": -27.76458740234375, "global_step": 583437, "epoch": 7029} {"train_loss": -27.795034408569336, "global_step": 583438, "epoch": 7029} {"train_loss": -27.947219848632812, "global_step": 583439, "epoch": 7029} {"train_loss": -27.9654483795166, "global_step": 583440, "epoch": 7029} {"train_loss": -28.255374908447266, "global_step": 583441, "epoch": 7029} {"train_loss": -27.97676658630371, "global_step": 583442, "epoch": 7029} {"train_loss": -28.11536979675293, "global_step": 583443, "epoch": 7029} {"train_loss": -28.027271270751953, "global_step": 583444, "epoch": 7029} {"train_loss": -27.62981605529785, "global_step": 583445, "epoch": 7029} {"train_loss": -27.938474655151367, "global_step": 583446, "epoch": 7029} {"train_loss": -28.089948654174805, "global_step": 583447, "epoch": 7029} {"train_loss": -28.1402645111084, "global_step": 583448, "epoch": 7029} {"train_loss": -28.004901885986328, "global_step": 583449, "epoch": 7029} {"train_loss": -27.261917114257812, "global_step": 583450, "epoch": 7029} {"train_loss": -27.306655883789062, "global_step": 583451, "epoch": 7029} {"train_loss": -27.809967041015625, "global_step": 583452, "epoch": 7029} {"train_loss": -27.951974868774414, "global_step": 583453, "epoch": 7029} {"train_loss": -27.82953453063965, "global_step": 583454, "epoch": 7029} {"train_loss": -27.9414119720459, "global_step": 583455, "epoch": 7029} {"train_loss": -28.393829345703125, "global_step": 583456, "epoch": 7029} {"train_loss": -28.350027084350586, "global_step": 583457, "epoch": 7029} {"train_loss": -27.63054847717285, "global_step": 583458, "epoch": 7029} {"train_loss": -27.879308700561523, "global_step": 583459, "epoch": 7029} {"train_loss": -27.8101863861084, "global_step": 583460, "epoch": 7029} {"train_loss": -27.7236270904541, "global_step": 583461, "epoch": 7029} {"train_loss": -27.819442749023438, "global_step": 583462, "epoch": 7029} {"train_loss": -27.858173370361328, "global_step": 583463, "epoch": 7029} {"train_loss": -27.6219425201416, "global_step": 583464, "epoch": 7029} {"train_loss": -27.733240127563477, "global_step": 583465, "epoch": 7029} {"train_loss": -28.306777954101562, "global_step": 583466, "epoch": 7029} {"train_loss": -28.13225746154785, "global_step": 583467, "epoch": 7029} {"train_loss": -27.539794921875, "global_step": 583468, "epoch": 7029} {"train_loss": -27.812108993530273, "global_step": 583469, "epoch": 7029} {"train_loss": -28.17412757873535, "global_step": 583470, "epoch": 7029} {"train_loss": -27.897947311401367, "global_step": 583471, "epoch": 7029} {"train_loss": -27.817468643188477, "global_step": 583472, "epoch": 7029} {"train_loss": -28.013769149780273, "global_step": 583473, "epoch": 7029} {"train_loss": -27.64082145690918, "global_step": 583474, "epoch": 7029} {"train_loss": -27.875354766845703, "global_step": 583475, "epoch": 7029} {"train_loss": -27.888498306274414, "global_step": 583476, "epoch": 7029} {"train_loss": -28.250110626220703, "global_step": 583477, "epoch": 7029} {"train_loss": -27.714330673217773, "global_step": 583478, "epoch": 7029} {"train_loss": -27.772598266601562, "global_step": 583479, "epoch": 7029} {"train_loss": -27.791370391845703, "global_step": 583480, "epoch": 7029} {"train_loss": -28.189844131469727, "global_step": 583481, "epoch": 7029} {"train_loss": -27.819799423217773, "global_step": 583482, "epoch": 7029} {"train_loss": -27.853261947631836, "global_step": 583483, "epoch": 7029} {"train_loss": -28.215805053710938, "global_step": 583484, "epoch": 7029} {"train_loss": -27.895109176635742, "global_step": 583485, "epoch": 7029} {"train_loss": -28.06634521484375, "global_step": 583486, "epoch": 7029} {"train_loss": -27.8710994720459, "global_step": 583487, "epoch": 7029} {"train_loss": -27.95865821838379, "global_step": 583488, "epoch": 7029} {"train_loss": -27.822219297110315, "global_step": 583489, "epoch": 7029, "val_loss": 6690555.0} {"train_loss": -27.905527114868164, "global_step": 583490, "epoch": 7030} {"train_loss": -27.729116439819336, "global_step": 583491, "epoch": 7030} {"train_loss": -27.667190551757812, "global_step": 583492, "epoch": 7030} {"train_loss": -27.358478546142578, "global_step": 583493, "epoch": 7030} {"train_loss": -26.76912498474121, "global_step": 583494, "epoch": 7030} {"train_loss": -27.39044761657715, "global_step": 583495, "epoch": 7030} {"train_loss": -27.392786026000977, "global_step": 583496, "epoch": 7030} {"train_loss": -27.703643798828125, "global_step": 583497, "epoch": 7030} {"train_loss": -28.008228302001953, "global_step": 583498, "epoch": 7030} {"train_loss": -27.61032485961914, "global_step": 583499, "epoch": 7030} {"train_loss": -28.018463134765625, "global_step": 583500, "epoch": 7030} {"train_loss": -27.4493465423584, "global_step": 583501, "epoch": 7030} {"train_loss": -27.460315704345703, "global_step": 583502, "epoch": 7030} {"train_loss": -27.837629318237305, "global_step": 583503, "epoch": 7030} {"train_loss": -27.54220962524414, "global_step": 583504, "epoch": 7030} {"train_loss": -27.8447208404541, "global_step": 583505, "epoch": 7030} {"train_loss": -28.033069610595703, "global_step": 583506, "epoch": 7030} {"train_loss": -27.380903244018555, "global_step": 583507, "epoch": 7030} {"train_loss": -28.213438034057617, "global_step": 583508, "epoch": 7030} {"train_loss": -27.837488174438477, "global_step": 583509, "epoch": 7030} {"train_loss": -28.13176918029785, "global_step": 583510, "epoch": 7030} {"train_loss": -27.762537002563477, "global_step": 583511, "epoch": 7030} {"train_loss": -28.015722274780273, "global_step": 583512, "epoch": 7030} {"train_loss": -27.523242950439453, "global_step": 583513, "epoch": 7030} {"train_loss": -28.229345321655273, "global_step": 583514, "epoch": 7030} {"train_loss": -27.7855224609375, "global_step": 583515, "epoch": 7030} {"train_loss": -27.810216903686523, "global_step": 583516, "epoch": 7030} {"train_loss": -28.139493942260742, "global_step": 583517, "epoch": 7030} {"train_loss": -28.177169799804688, "global_step": 583518, "epoch": 7030} {"train_loss": -27.6877384185791, "global_step": 583519, "epoch": 7030} {"train_loss": -27.914365768432617, "global_step": 583520, "epoch": 7030} {"train_loss": -27.790924072265625, "global_step": 583521, "epoch": 7030} {"train_loss": -27.6170654296875, "global_step": 583522, "epoch": 7030} {"train_loss": -27.392871856689453, "global_step": 583523, "epoch": 7030} {"train_loss": -27.245899200439453, "global_step": 583524, "epoch": 7030} {"train_loss": -27.6119384765625, "global_step": 583525, "epoch": 7030} {"train_loss": -27.909109115600586, "global_step": 583526, "epoch": 7030} {"train_loss": -27.6594181060791, "global_step": 583527, "epoch": 7030} {"train_loss": -27.675201416015625, "global_step": 583528, "epoch": 7030} {"train_loss": -27.563858032226562, "global_step": 583529, "epoch": 7030} {"train_loss": -27.480640411376953, "global_step": 583530, "epoch": 7030} {"train_loss": -27.920642852783203, "global_step": 583531, "epoch": 7030} {"train_loss": -27.459217071533203, "global_step": 583532, "epoch": 7030} {"train_loss": -27.625173568725586, "global_step": 583533, "epoch": 7030} {"train_loss": -27.6046199798584, "global_step": 583534, "epoch": 7030} {"train_loss": -28.063230514526367, "global_step": 583535, "epoch": 7030} {"train_loss": -27.53460693359375, "global_step": 583536, "epoch": 7030} {"train_loss": -27.813867568969727, "global_step": 583537, "epoch": 7030} {"train_loss": -28.377660751342773, "global_step": 583538, "epoch": 7030} {"train_loss": -27.464466094970703, "global_step": 583539, "epoch": 7030} {"train_loss": -27.561573028564453, "global_step": 583540, "epoch": 7030} {"train_loss": -27.973215103149414, "global_step": 583541, "epoch": 7030} {"train_loss": -28.35672378540039, "global_step": 583542, "epoch": 7030} {"train_loss": -27.918725967407227, "global_step": 583543, "epoch": 7030} {"train_loss": -27.9736270904541, "global_step": 583544, "epoch": 7030} {"train_loss": -28.07545280456543, "global_step": 583545, "epoch": 7030} {"train_loss": -28.03400993347168, "global_step": 583546, "epoch": 7030} {"train_loss": -28.3090763092041, "global_step": 583547, "epoch": 7030} {"train_loss": -28.277084350585938, "global_step": 583548, "epoch": 7030} {"train_loss": -28.51373863220215, "global_step": 583549, "epoch": 7030} {"train_loss": -27.93548583984375, "global_step": 583550, "epoch": 7030} {"train_loss": -28.009235382080078, "global_step": 583551, "epoch": 7030} {"train_loss": -28.197912216186523, "global_step": 583552, "epoch": 7030} {"train_loss": -27.7606143951416, "global_step": 583553, "epoch": 7030} {"train_loss": -27.769922256469727, "global_step": 583554, "epoch": 7030} {"train_loss": -28.050756454467773, "global_step": 583555, "epoch": 7030} {"train_loss": -27.744916915893555, "global_step": 583556, "epoch": 7030} {"train_loss": -27.842453002929688, "global_step": 583557, "epoch": 7030} {"train_loss": -28.086362838745117, "global_step": 583558, "epoch": 7030} {"train_loss": -28.273242950439453, "global_step": 583559, "epoch": 7030} {"train_loss": -27.834028244018555, "global_step": 583560, "epoch": 7030} {"train_loss": -27.858596801757812, "global_step": 583561, "epoch": 7030} {"train_loss": -28.188058853149414, "global_step": 583562, "epoch": 7030} {"train_loss": -27.753347396850586, "global_step": 583563, "epoch": 7030} {"train_loss": -27.928699493408203, "global_step": 583564, "epoch": 7030} {"train_loss": -28.08451271057129, "global_step": 583565, "epoch": 7030} {"train_loss": -28.043447494506836, "global_step": 583566, "epoch": 7030} {"train_loss": -28.089460372924805, "global_step": 583567, "epoch": 7030} {"train_loss": -27.736051559448242, "global_step": 583568, "epoch": 7030} {"train_loss": -27.918561935424805, "global_step": 583569, "epoch": 7030} {"train_loss": -28.091262817382812, "global_step": 583570, "epoch": 7030} {"train_loss": -27.903900146484375, "global_step": 583571, "epoch": 7030} {"train_loss": -27.843460427709374, "global_step": 583572, "epoch": 7030, "val_loss": 6729969.5} {"train_loss": -27.382001876831055, "global_step": 583573, "epoch": 7031} {"train_loss": -27.483966827392578, "global_step": 583574, "epoch": 7031} {"train_loss": -27.792203903198242, "global_step": 583575, "epoch": 7031} {"train_loss": -27.770557403564453, "global_step": 583576, "epoch": 7031} {"train_loss": -27.724897384643555, "global_step": 583577, "epoch": 7031} {"train_loss": -27.580554962158203, "global_step": 583578, "epoch": 7031} {"train_loss": -27.490478515625, "global_step": 583579, "epoch": 7031} {"train_loss": -27.716726303100586, "global_step": 583580, "epoch": 7031} {"train_loss": -27.383447647094727, "global_step": 583581, "epoch": 7031} {"train_loss": -26.790082931518555, "global_step": 583582, "epoch": 7031} {"train_loss": -26.498937606811523, "global_step": 583583, "epoch": 7031} {"train_loss": -27.90935707092285, "global_step": 583584, "epoch": 7031} {"train_loss": -27.430917739868164, "global_step": 583585, "epoch": 7031} {"train_loss": -26.398996353149414, "global_step": 583586, "epoch": 7031} {"train_loss": -27.829364776611328, "global_step": 583587, "epoch": 7031} {"train_loss": -27.13252067565918, "global_step": 583588, "epoch": 7031} {"train_loss": -27.2508602142334, "global_step": 583589, "epoch": 7031} {"train_loss": -27.13775634765625, "global_step": 583590, "epoch": 7031} {"train_loss": -27.96700096130371, "global_step": 583591, "epoch": 7031} {"train_loss": -27.338367462158203, "global_step": 583592, "epoch": 7031} {"train_loss": -27.762725830078125, "global_step": 583593, "epoch": 7031} {"train_loss": -27.623464584350586, "global_step": 583594, "epoch": 7031} {"train_loss": -27.732263565063477, "global_step": 583595, "epoch": 7031} {"train_loss": -27.780160903930664, "global_step": 583596, "epoch": 7031} {"train_loss": -27.834264755249023, "global_step": 583597, "epoch": 7031} {"train_loss": -27.467702865600586, "global_step": 583598, "epoch": 7031} {"train_loss": -27.762418746948242, "global_step": 583599, "epoch": 7031} {"train_loss": -27.51861572265625, "global_step": 583600, "epoch": 7031} {"train_loss": -27.722064971923828, "global_step": 583601, "epoch": 7031} {"train_loss": -27.79145622253418, "global_step": 583602, "epoch": 7031} {"train_loss": -27.6492919921875, "global_step": 583603, "epoch": 7031} {"train_loss": -27.95672035217285, "global_step": 583604, "epoch": 7031} {"train_loss": -27.91767692565918, "global_step": 583605, "epoch": 7031} {"train_loss": -27.841333389282227, "global_step": 583606, "epoch": 7031} {"train_loss": -27.992563247680664, "global_step": 583607, "epoch": 7031} {"train_loss": -28.266508102416992, "global_step": 583608, "epoch": 7031} {"train_loss": -27.916162490844727, "global_step": 583609, "epoch": 7031} {"train_loss": -28.29078483581543, "global_step": 583610, "epoch": 7031} {"train_loss": -27.933032989501953, "global_step": 583611, "epoch": 7031} {"train_loss": -28.01179313659668, "global_step": 583612, "epoch": 7031} {"train_loss": -27.797409057617188, "global_step": 583613, "epoch": 7031} {"train_loss": -27.862506866455078, "global_step": 583614, "epoch": 7031} {"train_loss": -28.05012321472168, "global_step": 583615, "epoch": 7031} {"train_loss": -28.03082847595215, "global_step": 583616, "epoch": 7031} {"train_loss": -27.754724502563477, "global_step": 583617, "epoch": 7031} {"train_loss": -28.11930274963379, "global_step": 583618, "epoch": 7031} {"train_loss": -27.971960067749023, "global_step": 583619, "epoch": 7031} {"train_loss": -27.90509033203125, "global_step": 583620, "epoch": 7031} {"train_loss": -27.635284423828125, "global_step": 583621, "epoch": 7031} {"train_loss": -27.7943058013916, "global_step": 583622, "epoch": 7031} {"train_loss": -28.34366798400879, "global_step": 583623, "epoch": 7031} {"train_loss": -27.985937118530273, "global_step": 583624, "epoch": 7031} {"train_loss": -27.814123153686523, "global_step": 583625, "epoch": 7031} {"train_loss": -27.796497344970703, "global_step": 583626, "epoch": 7031} {"train_loss": -27.3126220703125, "global_step": 583627, "epoch": 7031} {"train_loss": -27.37601661682129, "global_step": 583628, "epoch": 7031} {"train_loss": -27.645986557006836, "global_step": 583629, "epoch": 7031} {"train_loss": -28.271839141845703, "global_step": 583630, "epoch": 7031} {"train_loss": -27.883214950561523, "global_step": 583631, "epoch": 7031} {"train_loss": -27.72159194946289, "global_step": 583632, "epoch": 7031} {"train_loss": -27.676000595092773, "global_step": 583633, "epoch": 7031} {"train_loss": -28.048786163330078, "global_step": 583634, "epoch": 7031} {"train_loss": -27.52008056640625, "global_step": 583635, "epoch": 7031} {"train_loss": -27.382781982421875, "global_step": 583636, "epoch": 7031} {"train_loss": -27.822956085205078, "global_step": 583637, "epoch": 7031} {"train_loss": -27.846515655517578, "global_step": 583638, "epoch": 7031} {"train_loss": -27.855504989624023, "global_step": 583639, "epoch": 7031} {"train_loss": -27.904590606689453, "global_step": 583640, "epoch": 7031} {"train_loss": -27.877246856689453, "global_step": 583641, "epoch": 7031} {"train_loss": -27.81926918029785, "global_step": 583642, "epoch": 7031} {"train_loss": -27.95343017578125, "global_step": 583643, "epoch": 7031} {"train_loss": -27.8443660736084, "global_step": 583644, "epoch": 7031} {"train_loss": -27.780344009399414, "global_step": 583645, "epoch": 7031} {"train_loss": -28.089313507080078, "global_step": 583646, "epoch": 7031} {"train_loss": -28.155929565429688, "global_step": 583647, "epoch": 7031} {"train_loss": -28.118330001831055, "global_step": 583648, "epoch": 7031} {"train_loss": -27.802881240844727, "global_step": 583649, "epoch": 7031} {"train_loss": -27.92513084411621, "global_step": 583650, "epoch": 7031} {"train_loss": -27.770654678344727, "global_step": 583651, "epoch": 7031} {"train_loss": -27.873580932617188, "global_step": 583652, "epoch": 7031} {"train_loss": -27.677343368530273, "global_step": 583653, "epoch": 7031} {"train_loss": -27.703094482421875, "global_step": 583654, "epoch": 7031} {"train_loss": -27.746841614504895, "global_step": 583655, "epoch": 7031, "val_loss": 6736010.5} {"train_loss": -26.827285766601562, "global_step": 583656, "epoch": 7032} {"train_loss": -26.59098243713379, "global_step": 583657, "epoch": 7032} {"train_loss": -26.80909538269043, "global_step": 583658, "epoch": 7032} {"train_loss": -25.8204288482666, "global_step": 583659, "epoch": 7032} {"train_loss": -26.881759643554688, "global_step": 583660, "epoch": 7032} {"train_loss": -26.702661514282227, "global_step": 583661, "epoch": 7032} {"train_loss": -26.538421630859375, "global_step": 583662, "epoch": 7032} {"train_loss": -27.387744903564453, "global_step": 583663, "epoch": 7032} {"train_loss": -26.747114181518555, "global_step": 583664, "epoch": 7032} {"train_loss": -26.85929298400879, "global_step": 583665, "epoch": 7032} {"train_loss": -27.229598999023438, "global_step": 583666, "epoch": 7032} {"train_loss": -27.08815574645996, "global_step": 583667, "epoch": 7032} {"train_loss": -27.432828903198242, "global_step": 583668, "epoch": 7032} {"train_loss": -26.986679077148438, "global_step": 583669, "epoch": 7032} {"train_loss": -27.564939498901367, "global_step": 583670, "epoch": 7032} {"train_loss": -27.309072494506836, "global_step": 583671, "epoch": 7032} {"train_loss": -27.488529205322266, "global_step": 583672, "epoch": 7032} {"train_loss": -27.539209365844727, "global_step": 583673, "epoch": 7032} {"train_loss": -27.588525772094727, "global_step": 583674, "epoch": 7032} {"train_loss": -26.954904556274414, "global_step": 583675, "epoch": 7032} {"train_loss": -27.488006591796875, "global_step": 583676, "epoch": 7032} {"train_loss": -27.179147720336914, "global_step": 583677, "epoch": 7032} {"train_loss": -27.419891357421875, "global_step": 583678, "epoch": 7032} {"train_loss": -27.5648136138916, "global_step": 583679, "epoch": 7032} {"train_loss": -27.791828155517578, "global_step": 583680, "epoch": 7032} {"train_loss": -27.9882755279541, "global_step": 583681, "epoch": 7032} {"train_loss": -27.6262149810791, "global_step": 583682, "epoch": 7032} {"train_loss": -27.93987464904785, "global_step": 583683, "epoch": 7032} {"train_loss": -27.570404052734375, "global_step": 583684, "epoch": 7032} {"train_loss": -27.8098087310791, "global_step": 583685, "epoch": 7032} {"train_loss": -27.597843170166016, "global_step": 583686, "epoch": 7032} {"train_loss": -27.577157974243164, "global_step": 583687, "epoch": 7032} {"train_loss": -27.7095947265625, "global_step": 583688, "epoch": 7032} {"train_loss": -27.94523048400879, "global_step": 583689, "epoch": 7032} {"train_loss": -28.1459903717041, "global_step": 583690, "epoch": 7032} {"train_loss": -27.91716957092285, "global_step": 583691, "epoch": 7032} {"train_loss": -27.865955352783203, "global_step": 583692, "epoch": 7032} {"train_loss": -27.864643096923828, "global_step": 583693, "epoch": 7032} {"train_loss": -28.27096939086914, "global_step": 583694, "epoch": 7032} {"train_loss": -28.025175094604492, "global_step": 583695, "epoch": 7032} {"train_loss": -27.826032638549805, "global_step": 583696, "epoch": 7032} {"train_loss": -28.1203670501709, "global_step": 583697, "epoch": 7032} {"train_loss": -28.273151397705078, "global_step": 583698, "epoch": 7032} {"train_loss": -28.452621459960938, "global_step": 583699, "epoch": 7032} {"train_loss": -27.725738525390625, "global_step": 583700, "epoch": 7032} {"train_loss": -28.238351821899414, "global_step": 583701, "epoch": 7032} {"train_loss": -27.833200454711914, "global_step": 583702, "epoch": 7032} {"train_loss": -27.7205810546875, "global_step": 583703, "epoch": 7032} {"train_loss": -27.713220596313477, "global_step": 583704, "epoch": 7032} {"train_loss": -28.1538143157959, "global_step": 583705, "epoch": 7032} {"train_loss": -27.715906143188477, "global_step": 583706, "epoch": 7032} {"train_loss": -27.596765518188477, "global_step": 583707, "epoch": 7032} {"train_loss": -27.96653175354004, "global_step": 583708, "epoch": 7032} {"train_loss": -27.6429386138916, "global_step": 583709, "epoch": 7032} {"train_loss": -27.96413230895996, "global_step": 583710, "epoch": 7032} {"train_loss": -28.017745971679688, "global_step": 583711, "epoch": 7032} {"train_loss": -27.698974609375, "global_step": 583712, "epoch": 7032} {"train_loss": -27.701635360717773, "global_step": 583713, "epoch": 7032} {"train_loss": -27.972827911376953, "global_step": 583714, "epoch": 7032} {"train_loss": -28.101842880249023, "global_step": 583715, "epoch": 7032} {"train_loss": -27.95525550842285, "global_step": 583716, "epoch": 7032} {"train_loss": -28.037158966064453, "global_step": 583717, "epoch": 7032} {"train_loss": -27.843969345092773, "global_step": 583718, "epoch": 7032} {"train_loss": -27.590381622314453, "global_step": 583719, "epoch": 7032} {"train_loss": -27.80513572692871, "global_step": 583720, "epoch": 7032} {"train_loss": -28.15456199645996, "global_step": 583721, "epoch": 7032} {"train_loss": -28.09913444519043, "global_step": 583722, "epoch": 7032} {"train_loss": -27.755308151245117, "global_step": 583723, "epoch": 7032} {"train_loss": -28.030200958251953, "global_step": 583724, "epoch": 7032} {"train_loss": -28.14576530456543, "global_step": 583725, "epoch": 7032} {"train_loss": -28.404199600219727, "global_step": 583726, "epoch": 7032} {"train_loss": -27.948163986206055, "global_step": 583727, "epoch": 7032} {"train_loss": -28.177515029907227, "global_step": 583728, "epoch": 7032} {"train_loss": -28.337549209594727, "global_step": 583729, "epoch": 7032} {"train_loss": -28.0329532623291, "global_step": 583730, "epoch": 7032} {"train_loss": -28.31022071838379, "global_step": 583731, "epoch": 7032} {"train_loss": -28.008268356323242, "global_step": 583732, "epoch": 7032} {"train_loss": -28.079788208007812, "global_step": 583733, "epoch": 7032} {"train_loss": -28.253177642822266, "global_step": 583734, "epoch": 7032} {"train_loss": -27.8753662109375, "global_step": 583735, "epoch": 7032} {"train_loss": -28.16963005065918, "global_step": 583736, "epoch": 7032} {"train_loss": -28.478260040283203, "global_step": 583737, "epoch": 7032} {"train_loss": -27.698727940938557, "global_step": 583738, "epoch": 7032, "val_loss": 6706495.0} {"train_loss": -27.103483200073242, "global_step": 583739, "epoch": 7033} {"train_loss": -27.237653732299805, "global_step": 583740, "epoch": 7033} {"train_loss": -27.664173126220703, "global_step": 583741, "epoch": 7033} {"train_loss": -27.568891525268555, "global_step": 583742, "epoch": 7033} {"train_loss": -26.8223819732666, "global_step": 583743, "epoch": 7033} {"train_loss": -25.257028579711914, "global_step": 583744, "epoch": 7033} {"train_loss": -27.212482452392578, "global_step": 583745, "epoch": 7033} {"train_loss": -27.102331161499023, "global_step": 583746, "epoch": 7033} {"train_loss": -26.62342643737793, "global_step": 583747, "epoch": 7033} {"train_loss": -27.221784591674805, "global_step": 583748, "epoch": 7033} {"train_loss": -26.454809188842773, "global_step": 583749, "epoch": 7033} {"train_loss": -27.135175704956055, "global_step": 583750, "epoch": 7033} {"train_loss": -27.065942764282227, "global_step": 583751, "epoch": 7033} {"train_loss": -27.0572452545166, "global_step": 583752, "epoch": 7033} {"train_loss": -27.027008056640625, "global_step": 583753, "epoch": 7033} {"train_loss": -27.330198287963867, "global_step": 583754, "epoch": 7033} {"train_loss": -27.33536148071289, "global_step": 583755, "epoch": 7033} {"train_loss": -27.06951332092285, "global_step": 583756, "epoch": 7033} {"train_loss": -27.664493560791016, "global_step": 583757, "epoch": 7033} {"train_loss": -27.152389526367188, "global_step": 583758, "epoch": 7033} {"train_loss": -27.711105346679688, "global_step": 583759, "epoch": 7033} {"train_loss": -27.201099395751953, "global_step": 583760, "epoch": 7033} {"train_loss": -27.09760856628418, "global_step": 583761, "epoch": 7033} {"train_loss": -27.3182373046875, "global_step": 583762, "epoch": 7033} {"train_loss": -27.737279891967773, "global_step": 583763, "epoch": 7033} {"train_loss": -27.215137481689453, "global_step": 583764, "epoch": 7033} {"train_loss": -27.61822509765625, "global_step": 583765, "epoch": 7033} {"train_loss": -27.896167755126953, "global_step": 583766, "epoch": 7033} {"train_loss": -27.7309513092041, "global_step": 583767, "epoch": 7033} {"train_loss": -27.764368057250977, "global_step": 583768, "epoch": 7033} {"train_loss": -27.95050048828125, "global_step": 583769, "epoch": 7033} {"train_loss": -27.89750099182129, "global_step": 583770, "epoch": 7033} {"train_loss": -27.767658233642578, "global_step": 583771, "epoch": 7033} {"train_loss": -27.78895378112793, "global_step": 583772, "epoch": 7033} {"train_loss": -28.011188507080078, "global_step": 583773, "epoch": 7033} {"train_loss": -28.010868072509766, "global_step": 583774, "epoch": 7033} {"train_loss": -27.850194931030273, "global_step": 583775, "epoch": 7033} {"train_loss": -28.01458740234375, "global_step": 583776, "epoch": 7033} {"train_loss": -27.745532989501953, "global_step": 583777, "epoch": 7033} {"train_loss": -27.684833526611328, "global_step": 583778, "epoch": 7033} {"train_loss": -27.766925811767578, "global_step": 583779, "epoch": 7033} {"train_loss": -28.129596710205078, "global_step": 583780, "epoch": 7033} {"train_loss": -28.006513595581055, "global_step": 583781, "epoch": 7033} {"train_loss": -28.08721923828125, "global_step": 583782, "epoch": 7033} {"train_loss": -28.08062171936035, "global_step": 583783, "epoch": 7033} {"train_loss": -28.21759033203125, "global_step": 583784, "epoch": 7033} {"train_loss": -27.806812286376953, "global_step": 583785, "epoch": 7033} {"train_loss": -27.904699325561523, "global_step": 583786, "epoch": 7033} {"train_loss": -27.97429847717285, "global_step": 583787, "epoch": 7033} {"train_loss": -27.982614517211914, "global_step": 583788, "epoch": 7033} {"train_loss": -27.86848258972168, "global_step": 583789, "epoch": 7033} {"train_loss": -27.740758895874023, "global_step": 583790, "epoch": 7033} {"train_loss": -27.939619064331055, "global_step": 583791, "epoch": 7033} {"train_loss": -28.121976852416992, "global_step": 583792, "epoch": 7033} {"train_loss": -27.927820205688477, "global_step": 583793, "epoch": 7033} {"train_loss": -27.75349235534668, "global_step": 583794, "epoch": 7033} {"train_loss": -27.75982093811035, "global_step": 583795, "epoch": 7033} {"train_loss": -28.132963180541992, "global_step": 583796, "epoch": 7033} {"train_loss": -28.003345489501953, "global_step": 583797, "epoch": 7033} {"train_loss": -27.7831974029541, "global_step": 583798, "epoch": 7033} {"train_loss": -27.857282638549805, "global_step": 583799, "epoch": 7033} {"train_loss": -27.99146842956543, "global_step": 583800, "epoch": 7033} {"train_loss": -27.49421501159668, "global_step": 583801, "epoch": 7033} {"train_loss": -27.49117088317871, "global_step": 583802, "epoch": 7033} {"train_loss": -28.12864112854004, "global_step": 583803, "epoch": 7033} {"train_loss": -27.831140518188477, "global_step": 583804, "epoch": 7033} {"train_loss": -27.85318946838379, "global_step": 583805, "epoch": 7033} {"train_loss": -27.85650062561035, "global_step": 583806, "epoch": 7033} {"train_loss": -27.858585357666016, "global_step": 583807, "epoch": 7033} {"train_loss": -28.197717666625977, "global_step": 583808, "epoch": 7033} {"train_loss": -27.38205337524414, "global_step": 583809, "epoch": 7033} {"train_loss": -27.967737197875977, "global_step": 583810, "epoch": 7033} {"train_loss": -27.951242446899414, "global_step": 583811, "epoch": 7033} {"train_loss": -27.24116325378418, "global_step": 583812, "epoch": 7033} {"train_loss": -28.018537521362305, "global_step": 583813, "epoch": 7033} {"train_loss": -27.789142608642578, "global_step": 583814, "epoch": 7033} {"train_loss": -28.196685791015625, "global_step": 583815, "epoch": 7033} {"train_loss": -27.53118896484375, "global_step": 583816, "epoch": 7033} {"train_loss": -27.473928451538086, "global_step": 583817, "epoch": 7033} {"train_loss": -27.951929092407227, "global_step": 583818, "epoch": 7033} {"train_loss": -28.253528594970703, "global_step": 583819, "epoch": 7033} {"train_loss": -27.948505401611328, "global_step": 583820, "epoch": 7033} {"train_loss": -27.649611576493964, "global_step": 583821, "epoch": 7033, "val_loss": 6652023.0} {"train_loss": -27.7763614654541, "global_step": 583822, "epoch": 7034} {"train_loss": -27.277551651000977, "global_step": 583823, "epoch": 7034} {"train_loss": -27.99826431274414, "global_step": 583824, "epoch": 7034} {"train_loss": -27.491790771484375, "global_step": 583825, "epoch": 7034} {"train_loss": -27.508544921875, "global_step": 583826, "epoch": 7034} {"train_loss": -27.202619552612305, "global_step": 583827, "epoch": 7034} {"train_loss": -27.820941925048828, "global_step": 583828, "epoch": 7034} {"train_loss": -27.747455596923828, "global_step": 583829, "epoch": 7034} {"train_loss": -27.430143356323242, "global_step": 583830, "epoch": 7034} {"train_loss": -27.370580673217773, "global_step": 583831, "epoch": 7034} {"train_loss": -27.259933471679688, "global_step": 583832, "epoch": 7034} {"train_loss": -27.532470703125, "global_step": 583833, "epoch": 7034} {"train_loss": -27.357812881469727, "global_step": 583834, "epoch": 7034} {"train_loss": -27.557905197143555, "global_step": 583835, "epoch": 7034} {"train_loss": -27.71664810180664, "global_step": 583836, "epoch": 7034} {"train_loss": -27.5128116607666, "global_step": 583837, "epoch": 7034} {"train_loss": -27.59805679321289, "global_step": 583838, "epoch": 7034} {"train_loss": -27.800201416015625, "global_step": 583839, "epoch": 7034} {"train_loss": -27.634618759155273, "global_step": 583840, "epoch": 7034} {"train_loss": -27.91627311706543, "global_step": 583841, "epoch": 7034} {"train_loss": -27.457813262939453, "global_step": 583842, "epoch": 7034} {"train_loss": -27.6653995513916, "global_step": 583843, "epoch": 7034} {"train_loss": -27.602558135986328, "global_step": 583844, "epoch": 7034} {"train_loss": -27.996417999267578, "global_step": 583845, "epoch": 7034} {"train_loss": -27.76875877380371, "global_step": 583846, "epoch": 7034} {"train_loss": -27.983667373657227, "global_step": 583847, "epoch": 7034} {"train_loss": -28.131261825561523, "global_step": 583848, "epoch": 7034} {"train_loss": -27.550851821899414, "global_step": 583849, "epoch": 7034} {"train_loss": -28.003080368041992, "global_step": 583850, "epoch": 7034} {"train_loss": -27.818510055541992, "global_step": 583851, "epoch": 7034} {"train_loss": -28.067977905273438, "global_step": 583852, "epoch": 7034} {"train_loss": -28.15284538269043, "global_step": 583853, "epoch": 7034} {"train_loss": -28.032215118408203, "global_step": 583854, "epoch": 7034} {"train_loss": -27.957406997680664, "global_step": 583855, "epoch": 7034} {"train_loss": -27.610952377319336, "global_step": 583856, "epoch": 7034} {"train_loss": -28.130674362182617, "global_step": 583857, "epoch": 7034} {"train_loss": -28.145933151245117, "global_step": 583858, "epoch": 7034} {"train_loss": -28.1046142578125, "global_step": 583859, "epoch": 7034} {"train_loss": -27.805566787719727, "global_step": 583860, "epoch": 7034} {"train_loss": -28.260602951049805, "global_step": 583861, "epoch": 7034} {"train_loss": -27.950159072875977, "global_step": 583862, "epoch": 7034} {"train_loss": -28.137847900390625, "global_step": 583863, "epoch": 7034} {"train_loss": -28.019973754882812, "global_step": 583864, "epoch": 7034} {"train_loss": -28.161453247070312, "global_step": 583865, "epoch": 7034} {"train_loss": -28.231016159057617, "global_step": 583866, "epoch": 7034} {"train_loss": -28.53814125061035, "global_step": 583867, "epoch": 7034} {"train_loss": -28.079206466674805, "global_step": 583868, "epoch": 7034} {"train_loss": -28.386255264282227, "global_step": 583869, "epoch": 7034} {"train_loss": -27.761693954467773, "global_step": 583870, "epoch": 7034} {"train_loss": -28.009077072143555, "global_step": 583871, "epoch": 7034} {"train_loss": -27.4697322845459, "global_step": 583872, "epoch": 7034} {"train_loss": -27.896574020385742, "global_step": 583873, "epoch": 7034} {"train_loss": -27.706912994384766, "global_step": 583874, "epoch": 7034} {"train_loss": -28.54481315612793, "global_step": 583875, "epoch": 7034} {"train_loss": -27.68366813659668, "global_step": 583876, "epoch": 7034} {"train_loss": -27.892181396484375, "global_step": 583877, "epoch": 7034} {"train_loss": -27.7835750579834, "global_step": 583878, "epoch": 7034} {"train_loss": -27.7861270904541, "global_step": 583879, "epoch": 7034} {"train_loss": -28.0433406829834, "global_step": 583880, "epoch": 7034} {"train_loss": -28.235681533813477, "global_step": 583881, "epoch": 7034} {"train_loss": -27.79584312438965, "global_step": 583882, "epoch": 7034} {"train_loss": -27.851837158203125, "global_step": 583883, "epoch": 7034} {"train_loss": -27.89434242248535, "global_step": 583884, "epoch": 7034} {"train_loss": -27.944570541381836, "global_step": 583885, "epoch": 7034} {"train_loss": -28.11591148376465, "global_step": 583886, "epoch": 7034} {"train_loss": -28.07282066345215, "global_step": 583887, "epoch": 7034} {"train_loss": -27.448774337768555, "global_step": 583888, "epoch": 7034} {"train_loss": -27.781253814697266, "global_step": 583889, "epoch": 7034} {"train_loss": -27.97320556640625, "global_step": 583890, "epoch": 7034} {"train_loss": -27.835119247436523, "global_step": 583891, "epoch": 7034} {"train_loss": -27.9229736328125, "global_step": 583892, "epoch": 7034} {"train_loss": -27.668729782104492, "global_step": 583893, "epoch": 7034} {"train_loss": -27.75787353515625, "global_step": 583894, "epoch": 7034} {"train_loss": -27.7740478515625, "global_step": 583895, "epoch": 7034} {"train_loss": -26.983625411987305, "global_step": 583896, "epoch": 7034} {"train_loss": -27.331714630126953, "global_step": 583897, "epoch": 7034} {"train_loss": -27.881765365600586, "global_step": 583898, "epoch": 7034} {"train_loss": -27.700565338134766, "global_step": 583899, "epoch": 7034} {"train_loss": -27.792591094970703, "global_step": 583900, "epoch": 7034} {"train_loss": -27.477447509765625, "global_step": 583901, "epoch": 7034} {"train_loss": -27.572818756103516, "global_step": 583902, "epoch": 7034} {"train_loss": -28.039236068725586, "global_step": 583903, "epoch": 7034} {"train_loss": -27.81595326618976, "global_step": 583904, "epoch": 7034, "val_loss": 6721543.0} {"train_loss": -27.625659942626953, "global_step": 583905, "epoch": 7035} {"train_loss": -27.7818660736084, "global_step": 583906, "epoch": 7035} {"train_loss": -27.61246681213379, "global_step": 583907, "epoch": 7035} {"train_loss": -27.536230087280273, "global_step": 583908, "epoch": 7035} {"train_loss": -27.346206665039062, "global_step": 583909, "epoch": 7035} {"train_loss": -27.36995506286621, "global_step": 583910, "epoch": 7035} {"train_loss": -27.563337326049805, "global_step": 583911, "epoch": 7035} {"train_loss": -27.3983154296875, "global_step": 583912, "epoch": 7035} {"train_loss": -27.823400497436523, "global_step": 583913, "epoch": 7035} {"train_loss": -27.390533447265625, "global_step": 583914, "epoch": 7035} {"train_loss": -27.576007843017578, "global_step": 583915, "epoch": 7035} {"train_loss": -27.49953269958496, "global_step": 583916, "epoch": 7035} {"train_loss": -27.584228515625, "global_step": 583917, "epoch": 7035} {"train_loss": -27.657114028930664, "global_step": 583918, "epoch": 7035} {"train_loss": -27.896753311157227, "global_step": 583919, "epoch": 7035} {"train_loss": -27.800317764282227, "global_step": 583920, "epoch": 7035} {"train_loss": -27.75190544128418, "global_step": 583921, "epoch": 7035} {"train_loss": -28.19525146484375, "global_step": 583922, "epoch": 7035} {"train_loss": -27.8794002532959, "global_step": 583923, "epoch": 7035} {"train_loss": -28.15288734436035, "global_step": 583924, "epoch": 7035} {"train_loss": -27.815998077392578, "global_step": 583925, "epoch": 7035} {"train_loss": -27.919483184814453, "global_step": 583926, "epoch": 7035} {"train_loss": -28.295385360717773, "global_step": 583927, "epoch": 7035} {"train_loss": -27.795652389526367, "global_step": 583928, "epoch": 7035} {"train_loss": -27.913610458374023, "global_step": 583929, "epoch": 7035} {"train_loss": -27.839292526245117, "global_step": 583930, "epoch": 7035} {"train_loss": -28.16583824157715, "global_step": 583931, "epoch": 7035} {"train_loss": -28.042749404907227, "global_step": 583932, "epoch": 7035} {"train_loss": -28.210769653320312, "global_step": 583933, "epoch": 7035} {"train_loss": -27.8825626373291, "global_step": 583934, "epoch": 7035} {"train_loss": -28.14520263671875, "global_step": 583935, "epoch": 7035} {"train_loss": -27.957162857055664, "global_step": 583936, "epoch": 7035} {"train_loss": -27.989667892456055, "global_step": 583937, "epoch": 7035} {"train_loss": -28.082611083984375, "global_step": 583938, "epoch": 7035} {"train_loss": -28.02850341796875, "global_step": 583939, "epoch": 7035} {"train_loss": -27.76148796081543, "global_step": 583940, "epoch": 7035} {"train_loss": -28.00473976135254, "global_step": 583941, "epoch": 7035} {"train_loss": -28.227008819580078, "global_step": 583942, "epoch": 7035} {"train_loss": -28.116989135742188, "global_step": 583943, "epoch": 7035} {"train_loss": -27.87107276916504, "global_step": 583944, "epoch": 7035} {"train_loss": -28.316938400268555, "global_step": 583945, "epoch": 7035} {"train_loss": -28.194990158081055, "global_step": 583946, "epoch": 7035} {"train_loss": -28.06219482421875, "global_step": 583947, "epoch": 7035} {"train_loss": -28.0965518951416, "global_step": 583948, "epoch": 7035} {"train_loss": -27.921323776245117, "global_step": 583949, "epoch": 7035} {"train_loss": -27.94205093383789, "global_step": 583950, "epoch": 7035} {"train_loss": -27.850299835205078, "global_step": 583951, "epoch": 7035} {"train_loss": -27.93830680847168, "global_step": 583952, "epoch": 7035} {"train_loss": -27.646926879882812, "global_step": 583953, "epoch": 7035} {"train_loss": -27.97694969177246, "global_step": 583954, "epoch": 7035} {"train_loss": -27.917795181274414, "global_step": 583955, "epoch": 7035} {"train_loss": -27.87562370300293, "global_step": 583956, "epoch": 7035} {"train_loss": -28.021392822265625, "global_step": 583957, "epoch": 7035} {"train_loss": -27.370878219604492, "global_step": 583958, "epoch": 7035} {"train_loss": -26.899805068969727, "global_step": 583959, "epoch": 7035} {"train_loss": -26.86024284362793, "global_step": 583960, "epoch": 7035} {"train_loss": -27.707929611206055, "global_step": 583961, "epoch": 7035} {"train_loss": -27.843582153320312, "global_step": 583962, "epoch": 7035} {"train_loss": -27.665319442749023, "global_step": 583963, "epoch": 7035} {"train_loss": -27.767515182495117, "global_step": 583964, "epoch": 7035} {"train_loss": -27.663528442382812, "global_step": 583965, "epoch": 7035} {"train_loss": -27.162586212158203, "global_step": 583966, "epoch": 7035} {"train_loss": -27.534109115600586, "global_step": 583967, "epoch": 7035} {"train_loss": -27.750818252563477, "global_step": 583968, "epoch": 7035} {"train_loss": -27.380369186401367, "global_step": 583969, "epoch": 7035} {"train_loss": -27.471786499023438, "global_step": 583970, "epoch": 7035} {"train_loss": -27.615034103393555, "global_step": 583971, "epoch": 7035} {"train_loss": -27.999988555908203, "global_step": 583972, "epoch": 7035} {"train_loss": -28.225244522094727, "global_step": 583973, "epoch": 7035} {"train_loss": -27.747949600219727, "global_step": 583974, "epoch": 7035} {"train_loss": -27.916296005249023, "global_step": 583975, "epoch": 7035} {"train_loss": -27.975942611694336, "global_step": 583976, "epoch": 7035} {"train_loss": -27.67124366760254, "global_step": 583977, "epoch": 7035} {"train_loss": -27.804533004760742, "global_step": 583978, "epoch": 7035} {"train_loss": -27.998218536376953, "global_step": 583979, "epoch": 7035} {"train_loss": -27.623321533203125, "global_step": 583980, "epoch": 7035} {"train_loss": -27.8260498046875, "global_step": 583981, "epoch": 7035} {"train_loss": -27.777118682861328, "global_step": 583982, "epoch": 7035} {"train_loss": -27.836780548095703, "global_step": 583983, "epoch": 7035} {"train_loss": -27.861112594604492, "global_step": 583984, "epoch": 7035} {"train_loss": -27.652639389038086, "global_step": 583985, "epoch": 7035} {"train_loss": -28.11128044128418, "global_step": 583986, "epoch": 7035} {"train_loss": -27.78722703313253, "global_step": 583987, "epoch": 7035, "val_loss": 6726297.0} {"train_loss": -27.638507843017578, "global_step": 583988, "epoch": 7036} {"train_loss": -27.726896286010742, "global_step": 583989, "epoch": 7036} {"train_loss": -27.361814498901367, "global_step": 583990, "epoch": 7036} {"train_loss": -27.342681884765625, "global_step": 583991, "epoch": 7036} {"train_loss": -27.529653549194336, "global_step": 583992, "epoch": 7036} {"train_loss": -27.61106300354004, "global_step": 583993, "epoch": 7036} {"train_loss": -28.00090980529785, "global_step": 583994, "epoch": 7036} {"train_loss": -27.421072006225586, "global_step": 583995, "epoch": 7036} {"train_loss": -27.563159942626953, "global_step": 583996, "epoch": 7036} {"train_loss": -27.562702178955078, "global_step": 583997, "epoch": 7036} {"train_loss": -27.779260635375977, "global_step": 583998, "epoch": 7036} {"train_loss": -27.704282760620117, "global_step": 583999, "epoch": 7036} {"train_loss": -27.74806022644043, "global_step": 584000, "epoch": 7036} {"train_loss": -27.54909324645996, "global_step": 584001, "epoch": 7036} {"train_loss": -27.753366470336914, "global_step": 584002, "epoch": 7036} {"train_loss": -27.64033317565918, "global_step": 584003, "epoch": 7036} {"train_loss": -27.661869049072266, "global_step": 584004, "epoch": 7036} {"train_loss": -27.60658073425293, "global_step": 584005, "epoch": 7036} {"train_loss": -27.5394229888916, "global_step": 584006, "epoch": 7036} {"train_loss": -27.913711547851562, "global_step": 584007, "epoch": 7036} {"train_loss": -27.907196044921875, "global_step": 584008, "epoch": 7036} {"train_loss": -27.402185440063477, "global_step": 584009, "epoch": 7036} {"train_loss": -27.718738555908203, "global_step": 584010, "epoch": 7036} {"train_loss": -27.77587890625, "global_step": 584011, "epoch": 7036} {"train_loss": -27.312519073486328, "global_step": 584012, "epoch": 7036} {"train_loss": -27.90121841430664, "global_step": 584013, "epoch": 7036} {"train_loss": -27.193017959594727, "global_step": 584014, "epoch": 7036} {"train_loss": -27.32583999633789, "global_step": 584015, "epoch": 7036} {"train_loss": -27.994779586791992, "global_step": 584016, "epoch": 7036} {"train_loss": -27.406476974487305, "global_step": 584017, "epoch": 7036} {"train_loss": -27.59051513671875, "global_step": 584018, "epoch": 7036} {"train_loss": -27.628589630126953, "global_step": 584019, "epoch": 7036} {"train_loss": -27.672632217407227, "global_step": 584020, "epoch": 7036} {"train_loss": -27.4122314453125, "global_step": 584021, "epoch": 7036} {"train_loss": -27.516498565673828, "global_step": 584022, "epoch": 7036} {"train_loss": -27.963336944580078, "global_step": 584023, "epoch": 7036} {"train_loss": -27.476526260375977, "global_step": 584024, "epoch": 7036} {"train_loss": -27.96573829650879, "global_step": 584025, "epoch": 7036} {"train_loss": -27.466766357421875, "global_step": 584026, "epoch": 7036} {"train_loss": -27.862146377563477, "global_step": 584027, "epoch": 7036} {"train_loss": -27.550458908081055, "global_step": 584028, "epoch": 7036} {"train_loss": -27.62465476989746, "global_step": 584029, "epoch": 7036} {"train_loss": -27.804859161376953, "global_step": 584030, "epoch": 7036} {"train_loss": -27.8697452545166, "global_step": 584031, "epoch": 7036} {"train_loss": -27.85698890686035, "global_step": 584032, "epoch": 7036} {"train_loss": -27.93024253845215, "global_step": 584033, "epoch": 7036} {"train_loss": -27.736297607421875, "global_step": 584034, "epoch": 7036} {"train_loss": -27.925321578979492, "global_step": 584035, "epoch": 7036} {"train_loss": -28.1512393951416, "global_step": 584036, "epoch": 7036} {"train_loss": -27.83669090270996, "global_step": 584037, "epoch": 7036} {"train_loss": -28.19817543029785, "global_step": 584038, "epoch": 7036} {"train_loss": -27.72968864440918, "global_step": 584039, "epoch": 7036} {"train_loss": -28.284442901611328, "global_step": 584040, "epoch": 7036} {"train_loss": -28.0860595703125, "global_step": 584041, "epoch": 7036} {"train_loss": -28.584339141845703, "global_step": 584042, "epoch": 7036} {"train_loss": -27.90262794494629, "global_step": 584043, "epoch": 7036} {"train_loss": -28.215686798095703, "global_step": 584044, "epoch": 7036} {"train_loss": -28.19504737854004, "global_step": 584045, "epoch": 7036} {"train_loss": -27.9816837310791, "global_step": 584046, "epoch": 7036} {"train_loss": -27.84895133972168, "global_step": 584047, "epoch": 7036} {"train_loss": -28.082319259643555, "global_step": 584048, "epoch": 7036} {"train_loss": -28.334552764892578, "global_step": 584049, "epoch": 7036} {"train_loss": -28.424503326416016, "global_step": 584050, "epoch": 7036} {"train_loss": -28.30756950378418, "global_step": 584051, "epoch": 7036} {"train_loss": -28.292972564697266, "global_step": 584052, "epoch": 7036} {"train_loss": -28.14443016052246, "global_step": 584053, "epoch": 7036} {"train_loss": -27.3427791595459, "global_step": 584054, "epoch": 7036} {"train_loss": -28.16581153869629, "global_step": 584055, "epoch": 7036} {"train_loss": -27.824676513671875, "global_step": 584056, "epoch": 7036} {"train_loss": -28.061609268188477, "global_step": 584057, "epoch": 7036} {"train_loss": -28.330381393432617, "global_step": 584058, "epoch": 7036} {"train_loss": -28.019514083862305, "global_step": 584059, "epoch": 7036} {"train_loss": -28.40003776550293, "global_step": 584060, "epoch": 7036} {"train_loss": -28.037992477416992, "global_step": 584061, "epoch": 7036} {"train_loss": -27.347675323486328, "global_step": 584062, "epoch": 7036} {"train_loss": -27.11917495727539, "global_step": 584063, "epoch": 7036} {"train_loss": -27.049942016601562, "global_step": 584064, "epoch": 7036} {"train_loss": -26.793659210205078, "global_step": 584065, "epoch": 7036} {"train_loss": -27.254541397094727, "global_step": 584066, "epoch": 7036} {"train_loss": -27.851552963256836, "global_step": 584067, "epoch": 7036} {"train_loss": -27.825082778930664, "global_step": 584068, "epoch": 7036} {"train_loss": -27.18207359313965, "global_step": 584069, "epoch": 7036} {"train_loss": -27.755023634577373, "global_step": 584070, "epoch": 7036, "val_loss": 6789345.0} {"train_loss": -26.99478530883789, "global_step": 584071, "epoch": 7037} {"train_loss": -26.160017013549805, "global_step": 584072, "epoch": 7037} {"train_loss": -26.62556266784668, "global_step": 584073, "epoch": 7037} {"train_loss": -26.570829391479492, "global_step": 584074, "epoch": 7037} {"train_loss": -26.397470474243164, "global_step": 584075, "epoch": 7037} {"train_loss": -26.675146102905273, "global_step": 584076, "epoch": 7037} {"train_loss": -26.934661865234375, "global_step": 584077, "epoch": 7037} {"train_loss": -26.789642333984375, "global_step": 584078, "epoch": 7037} {"train_loss": -25.677473068237305, "global_step": 584079, "epoch": 7037} {"train_loss": -26.6153507232666, "global_step": 584080, "epoch": 7037} {"train_loss": -26.7573184967041, "global_step": 584081, "epoch": 7037} {"train_loss": -26.705297470092773, "global_step": 584082, "epoch": 7037} {"train_loss": -27.757266998291016, "global_step": 584083, "epoch": 7037} {"train_loss": -26.68184471130371, "global_step": 584084, "epoch": 7037} {"train_loss": -27.271535873413086, "global_step": 584085, "epoch": 7037} {"train_loss": -27.03754234313965, "global_step": 584086, "epoch": 7037} {"train_loss": -27.084836959838867, "global_step": 584087, "epoch": 7037} {"train_loss": -27.10529136657715, "global_step": 584088, "epoch": 7037} {"train_loss": -27.487415313720703, "global_step": 584089, "epoch": 7037} {"train_loss": -27.58935546875, "global_step": 584090, "epoch": 7037} {"train_loss": -27.19282341003418, "global_step": 584091, "epoch": 7037} {"train_loss": -27.246814727783203, "global_step": 584092, "epoch": 7037} {"train_loss": -27.661911010742188, "global_step": 584093, "epoch": 7037} {"train_loss": -27.399816513061523, "global_step": 584094, "epoch": 7037} {"train_loss": -27.38714599609375, "global_step": 584095, "epoch": 7037} {"train_loss": -27.32177734375, "global_step": 584096, "epoch": 7037} {"train_loss": -27.45782470703125, "global_step": 584097, "epoch": 7037} {"train_loss": -27.458112716674805, "global_step": 584098, "epoch": 7037} {"train_loss": -27.275680541992188, "global_step": 584099, "epoch": 7037} {"train_loss": -27.575952529907227, "global_step": 584100, "epoch": 7037} {"train_loss": -27.711669921875, "global_step": 584101, "epoch": 7037} {"train_loss": -27.671741485595703, "global_step": 584102, "epoch": 7037} {"train_loss": -27.503637313842773, "global_step": 584103, "epoch": 7037} {"train_loss": -27.632307052612305, "global_step": 584104, "epoch": 7037} {"train_loss": -27.67081642150879, "global_step": 584105, "epoch": 7037} {"train_loss": -27.8465633392334, "global_step": 584106, "epoch": 7037} {"train_loss": -27.871007919311523, "global_step": 584107, "epoch": 7037} {"train_loss": -28.070905685424805, "global_step": 584108, "epoch": 7037} {"train_loss": -27.7875919342041, "global_step": 584109, "epoch": 7037} {"train_loss": -27.941791534423828, "global_step": 584110, "epoch": 7037} {"train_loss": -28.113025665283203, "global_step": 584111, "epoch": 7037} {"train_loss": -27.7823543548584, "global_step": 584112, "epoch": 7037} {"train_loss": -27.774402618408203, "global_step": 584113, "epoch": 7037} {"train_loss": -28.090055465698242, "global_step": 584114, "epoch": 7037} {"train_loss": -27.616113662719727, "global_step": 584115, "epoch": 7037} {"train_loss": -28.202001571655273, "global_step": 584116, "epoch": 7037} {"train_loss": -27.86528968811035, "global_step": 584117, "epoch": 7037} {"train_loss": -28.293012619018555, "global_step": 584118, "epoch": 7037} {"train_loss": -28.194517135620117, "global_step": 584119, "epoch": 7037} {"train_loss": -27.9395751953125, "global_step": 584120, "epoch": 7037} {"train_loss": -28.28974723815918, "global_step": 584121, "epoch": 7037} {"train_loss": -28.352869033813477, "global_step": 584122, "epoch": 7037} {"train_loss": -28.046655654907227, "global_step": 584123, "epoch": 7037} {"train_loss": -27.88286781311035, "global_step": 584124, "epoch": 7037} {"train_loss": -27.991718292236328, "global_step": 584125, "epoch": 7037} {"train_loss": -28.367877960205078, "global_step": 584126, "epoch": 7037} {"train_loss": -27.970901489257812, "global_step": 584127, "epoch": 7037} {"train_loss": -27.830764770507812, "global_step": 584128, "epoch": 7037} {"train_loss": -28.0007381439209, "global_step": 584129, "epoch": 7037} {"train_loss": -28.052785873413086, "global_step": 584130, "epoch": 7037} {"train_loss": -28.2269287109375, "global_step": 584131, "epoch": 7037} {"train_loss": -28.117528915405273, "global_step": 584132, "epoch": 7037} {"train_loss": -27.73700523376465, "global_step": 584133, "epoch": 7037} {"train_loss": -27.575103759765625, "global_step": 584134, "epoch": 7037} {"train_loss": -28.1900634765625, "global_step": 584135, "epoch": 7037} {"train_loss": -27.95846939086914, "global_step": 584136, "epoch": 7037} {"train_loss": -28.240991592407227, "global_step": 584137, "epoch": 7037} {"train_loss": -27.935651779174805, "global_step": 584138, "epoch": 7037} {"train_loss": -28.091968536376953, "global_step": 584139, "epoch": 7037} {"train_loss": -28.079666137695312, "global_step": 584140, "epoch": 7037} {"train_loss": -27.931711196899414, "global_step": 584141, "epoch": 7037} {"train_loss": -28.10056495666504, "global_step": 584142, "epoch": 7037} {"train_loss": -28.2463436126709, "global_step": 584143, "epoch": 7037} {"train_loss": -28.0748291015625, "global_step": 584144, "epoch": 7037} {"train_loss": -27.959638595581055, "global_step": 584145, "epoch": 7037} {"train_loss": -27.886825561523438, "global_step": 584146, "epoch": 7037} {"train_loss": -27.802337646484375, "global_step": 584147, "epoch": 7037} {"train_loss": -28.22126579284668, "global_step": 584148, "epoch": 7037} {"train_loss": -27.821746826171875, "global_step": 584149, "epoch": 7037} {"train_loss": -27.86097526550293, "global_step": 584150, "epoch": 7037} {"train_loss": -27.897871017456055, "global_step": 584151, "epoch": 7037} {"train_loss": -28.098779678344727, "global_step": 584152, "epoch": 7037} {"train_loss": -27.625024657651604, "global_step": 584153, "epoch": 7037, "val_loss": 6757702.0} {"train_loss": -27.60922622680664, "global_step": 584154, "epoch": 7038} {"train_loss": -27.097003936767578, "global_step": 584155, "epoch": 7038} {"train_loss": -27.095251083374023, "global_step": 584156, "epoch": 7038} {"train_loss": -27.5804500579834, "global_step": 584157, "epoch": 7038} {"train_loss": -27.467945098876953, "global_step": 584158, "epoch": 7038} {"train_loss": -27.392059326171875, "global_step": 584159, "epoch": 7038} {"train_loss": -27.266210556030273, "global_step": 584160, "epoch": 7038} {"train_loss": -27.766864776611328, "global_step": 584161, "epoch": 7038} {"train_loss": -27.588363647460938, "global_step": 584162, "epoch": 7038} {"train_loss": -27.363733291625977, "global_step": 584163, "epoch": 7038} {"train_loss": -27.599512100219727, "global_step": 584164, "epoch": 7038} {"train_loss": -27.942041397094727, "global_step": 584165, "epoch": 7038} {"train_loss": -27.71758460998535, "global_step": 584166, "epoch": 7038} {"train_loss": -27.490924835205078, "global_step": 584167, "epoch": 7038} {"train_loss": -27.880828857421875, "global_step": 584168, "epoch": 7038} {"train_loss": -27.86835289001465, "global_step": 584169, "epoch": 7038} {"train_loss": -27.787982940673828, "global_step": 584170, "epoch": 7038} {"train_loss": -27.808582305908203, "global_step": 584171, "epoch": 7038} {"train_loss": -28.270986557006836, "global_step": 584172, "epoch": 7038} {"train_loss": -27.866239547729492, "global_step": 584173, "epoch": 7038} {"train_loss": -28.063215255737305, "global_step": 584174, "epoch": 7038} {"train_loss": -27.743194580078125, "global_step": 584175, "epoch": 7038} {"train_loss": -27.978897094726562, "global_step": 584176, "epoch": 7038} {"train_loss": -27.782703399658203, "global_step": 584177, "epoch": 7038} {"train_loss": -28.113452911376953, "global_step": 584178, "epoch": 7038} {"train_loss": -27.765363693237305, "global_step": 584179, "epoch": 7038} {"train_loss": -27.69697380065918, "global_step": 584180, "epoch": 7038} {"train_loss": -28.046024322509766, "global_step": 584181, "epoch": 7038} {"train_loss": -27.98089599609375, "global_step": 584182, "epoch": 7038} {"train_loss": -28.022119522094727, "global_step": 584183, "epoch": 7038} {"train_loss": -28.011686325073242, "global_step": 584184, "epoch": 7038} {"train_loss": -28.196821212768555, "global_step": 584185, "epoch": 7038} {"train_loss": -27.690229415893555, "global_step": 584186, "epoch": 7038} {"train_loss": -28.15553855895996, "global_step": 584187, "epoch": 7038} {"train_loss": -28.201383590698242, "global_step": 584188, "epoch": 7038} {"train_loss": -28.035017013549805, "global_step": 584189, "epoch": 7038} {"train_loss": -28.110462188720703, "global_step": 584190, "epoch": 7038} {"train_loss": -27.90935707092285, "global_step": 584191, "epoch": 7038} {"train_loss": -28.16411781311035, "global_step": 584192, "epoch": 7038} {"train_loss": -27.857959747314453, "global_step": 584193, "epoch": 7038} {"train_loss": -28.42206382751465, "global_step": 584194, "epoch": 7038} {"train_loss": -28.088470458984375, "global_step": 584195, "epoch": 7038} {"train_loss": -28.271757125854492, "global_step": 584196, "epoch": 7038} {"train_loss": -28.09882926940918, "global_step": 584197, "epoch": 7038} {"train_loss": -27.80649757385254, "global_step": 584198, "epoch": 7038} {"train_loss": -27.719329833984375, "global_step": 584199, "epoch": 7038} {"train_loss": -27.84816551208496, "global_step": 584200, "epoch": 7038} {"train_loss": -27.671350479125977, "global_step": 584201, "epoch": 7038} {"train_loss": -27.996353149414062, "global_step": 584202, "epoch": 7038} {"train_loss": -27.505170822143555, "global_step": 584203, "epoch": 7038} {"train_loss": -28.011932373046875, "global_step": 584204, "epoch": 7038} {"train_loss": -27.7779598236084, "global_step": 584205, "epoch": 7038} {"train_loss": -27.779077529907227, "global_step": 584206, "epoch": 7038} {"train_loss": -27.948774337768555, "global_step": 584207, "epoch": 7038} {"train_loss": -27.54836082458496, "global_step": 584208, "epoch": 7038} {"train_loss": -27.76704216003418, "global_step": 584209, "epoch": 7038} {"train_loss": -27.828516006469727, "global_step": 584210, "epoch": 7038} {"train_loss": -27.7224178314209, "global_step": 584211, "epoch": 7038} {"train_loss": -27.32184410095215, "global_step": 584212, "epoch": 7038} {"train_loss": -28.010351181030273, "global_step": 584213, "epoch": 7038} {"train_loss": -27.267431259155273, "global_step": 584214, "epoch": 7038} {"train_loss": -28.0836124420166, "global_step": 584215, "epoch": 7038} {"train_loss": -27.93181800842285, "global_step": 584216, "epoch": 7038} {"train_loss": -28.07380485534668, "global_step": 584217, "epoch": 7038} {"train_loss": -27.94034194946289, "global_step": 584218, "epoch": 7038} {"train_loss": -28.328357696533203, "global_step": 584219, "epoch": 7038} {"train_loss": -28.0909481048584, "global_step": 584220, "epoch": 7038} {"train_loss": -27.63544273376465, "global_step": 584221, "epoch": 7038} {"train_loss": -28.1635684967041, "global_step": 584222, "epoch": 7038} {"train_loss": -27.8966121673584, "global_step": 584223, "epoch": 7038} {"train_loss": -27.826459884643555, "global_step": 584224, "epoch": 7038} {"train_loss": -28.314071655273438, "global_step": 584225, "epoch": 7038} {"train_loss": -27.64434242248535, "global_step": 584226, "epoch": 7038} {"train_loss": -27.864944458007812, "global_step": 584227, "epoch": 7038} {"train_loss": -27.79384422302246, "global_step": 584228, "epoch": 7038} {"train_loss": -28.051782608032227, "global_step": 584229, "epoch": 7038} {"train_loss": -28.0747127532959, "global_step": 584230, "epoch": 7038} {"train_loss": -28.079986572265625, "global_step": 584231, "epoch": 7038} {"train_loss": -27.65003776550293, "global_step": 584232, "epoch": 7038} {"train_loss": -27.967193603515625, "global_step": 584233, "epoch": 7038} {"train_loss": -28.2934513092041, "global_step": 584234, "epoch": 7038} {"train_loss": -28.128253936767578, "global_step": 584235, "epoch": 7038} {"train_loss": -27.847028502498766, "global_step": 584236, "epoch": 7038, "val_loss": 6636323.0} {"train_loss": -27.395116806030273, "global_step": 584237, "epoch": 7039} {"train_loss": -27.1098575592041, "global_step": 584238, "epoch": 7039} {"train_loss": -27.65032958984375, "global_step": 584239, "epoch": 7039} {"train_loss": -26.936996459960938, "global_step": 584240, "epoch": 7039} {"train_loss": -27.32490348815918, "global_step": 584241, "epoch": 7039} {"train_loss": -27.020278930664062, "global_step": 584242, "epoch": 7039} {"train_loss": -27.314239501953125, "global_step": 584243, "epoch": 7039} {"train_loss": -27.43255615234375, "global_step": 584244, "epoch": 7039} {"train_loss": -27.48063087463379, "global_step": 584245, "epoch": 7039} {"train_loss": -27.082538604736328, "global_step": 584246, "epoch": 7039} {"train_loss": -27.015384674072266, "global_step": 584247, "epoch": 7039} {"train_loss": -27.480422973632812, "global_step": 584248, "epoch": 7039} {"train_loss": -27.553131103515625, "global_step": 584249, "epoch": 7039} {"train_loss": -27.573883056640625, "global_step": 584250, "epoch": 7039} {"train_loss": -27.635717391967773, "global_step": 584251, "epoch": 7039} {"train_loss": -27.503644943237305, "global_step": 584252, "epoch": 7039} {"train_loss": -27.54386329650879, "global_step": 584253, "epoch": 7039} {"train_loss": -27.692548751831055, "global_step": 584254, "epoch": 7039} {"train_loss": -27.608783721923828, "global_step": 584255, "epoch": 7039} {"train_loss": -27.209735870361328, "global_step": 584256, "epoch": 7039} {"train_loss": -27.795673370361328, "global_step": 584257, "epoch": 7039} {"train_loss": -27.336627960205078, "global_step": 584258, "epoch": 7039} {"train_loss": -27.44278907775879, "global_step": 584259, "epoch": 7039} {"train_loss": -27.60572624206543, "global_step": 584260, "epoch": 7039} {"train_loss": -27.867887496948242, "global_step": 584261, "epoch": 7039} {"train_loss": -28.064655303955078, "global_step": 584262, "epoch": 7039} {"train_loss": -27.800617218017578, "global_step": 584263, "epoch": 7039} {"train_loss": -27.8704891204834, "global_step": 584264, "epoch": 7039} {"train_loss": -28.212265014648438, "global_step": 584265, "epoch": 7039} {"train_loss": -27.809650421142578, "global_step": 584266, "epoch": 7039} {"train_loss": -27.910308837890625, "global_step": 584267, "epoch": 7039} {"train_loss": -28.0393009185791, "global_step": 584268, "epoch": 7039} {"train_loss": -28.208953857421875, "global_step": 584269, "epoch": 7039} {"train_loss": -28.10440444946289, "global_step": 584270, "epoch": 7039} {"train_loss": -27.9814395904541, "global_step": 584271, "epoch": 7039} {"train_loss": -28.123754501342773, "global_step": 584272, "epoch": 7039} {"train_loss": -28.28289794921875, "global_step": 584273, "epoch": 7039} {"train_loss": -27.78254508972168, "global_step": 584274, "epoch": 7039} {"train_loss": -28.085586547851562, "global_step": 584275, "epoch": 7039} {"train_loss": -27.896392822265625, "global_step": 584276, "epoch": 7039} {"train_loss": -28.591156005859375, "global_step": 584277, "epoch": 7039} {"train_loss": -28.066247940063477, "global_step": 584278, "epoch": 7039} {"train_loss": -27.857227325439453, "global_step": 584279, "epoch": 7039} {"train_loss": -28.441389083862305, "global_step": 584280, "epoch": 7039} {"train_loss": -28.227705001831055, "global_step": 584281, "epoch": 7039} {"train_loss": -28.388952255249023, "global_step": 584282, "epoch": 7039} {"train_loss": -28.061731338500977, "global_step": 584283, "epoch": 7039} {"train_loss": -28.472829818725586, "global_step": 584284, "epoch": 7039} {"train_loss": -28.433074951171875, "global_step": 584285, "epoch": 7039} {"train_loss": -28.30551528930664, "global_step": 584286, "epoch": 7039} {"train_loss": -28.106000900268555, "global_step": 584287, "epoch": 7039} {"train_loss": -28.247907638549805, "global_step": 584288, "epoch": 7039} {"train_loss": -28.085601806640625, "global_step": 584289, "epoch": 7039} {"train_loss": -28.017261505126953, "global_step": 584290, "epoch": 7039} {"train_loss": -28.015445709228516, "global_step": 584291, "epoch": 7039} {"train_loss": -27.59065055847168, "global_step": 584292, "epoch": 7039} {"train_loss": -27.8731689453125, "global_step": 584293, "epoch": 7039} {"train_loss": -27.825307846069336, "global_step": 584294, "epoch": 7039} {"train_loss": -27.20745849609375, "global_step": 584295, "epoch": 7039} {"train_loss": -27.695541381835938, "global_step": 584296, "epoch": 7039} {"train_loss": -27.512197494506836, "global_step": 584297, "epoch": 7039} {"train_loss": -27.64609718322754, "global_step": 584298, "epoch": 7039} {"train_loss": -27.20310401916504, "global_step": 584299, "epoch": 7039} {"train_loss": -27.726318359375, "global_step": 584300, "epoch": 7039} {"train_loss": -27.910120010375977, "global_step": 584301, "epoch": 7039} {"train_loss": -27.995899200439453, "global_step": 584302, "epoch": 7039} {"train_loss": -27.701467514038086, "global_step": 584303, "epoch": 7039} {"train_loss": -27.860105514526367, "global_step": 584304, "epoch": 7039} {"train_loss": -27.6628475189209, "global_step": 584305, "epoch": 7039} {"train_loss": -27.664335250854492, "global_step": 584306, "epoch": 7039} {"train_loss": -27.6368465423584, "global_step": 584307, "epoch": 7039} {"train_loss": -27.29949378967285, "global_step": 584308, "epoch": 7039} {"train_loss": -28.098630905151367, "global_step": 584309, "epoch": 7039} {"train_loss": -27.928897857666016, "global_step": 584310, "epoch": 7039} {"train_loss": -27.852039337158203, "global_step": 584311, "epoch": 7039} {"train_loss": -27.94597816467285, "global_step": 584312, "epoch": 7039} {"train_loss": -27.511962890625, "global_step": 584313, "epoch": 7039} {"train_loss": -27.68426513671875, "global_step": 584314, "epoch": 7039} {"train_loss": -28.29372215270996, "global_step": 584315, "epoch": 7039} {"train_loss": -27.869543075561523, "global_step": 584316, "epoch": 7039} {"train_loss": -27.859106063842773, "global_step": 584317, "epoch": 7039} {"train_loss": -28.033435821533203, "global_step": 584318, "epoch": 7039} {"train_loss": -27.806667235960443, "global_step": 584319, "epoch": 7039, "val_loss": 6622494.0} {"train_loss": -27.45098876953125, "global_step": 584320, "epoch": 7040} {"train_loss": -27.98243522644043, "global_step": 584321, "epoch": 7040} {"train_loss": -27.910741806030273, "global_step": 584322, "epoch": 7040} {"train_loss": -27.897663116455078, "global_step": 584323, "epoch": 7040} {"train_loss": -28.183408737182617, "global_step": 584324, "epoch": 7040} {"train_loss": -28.0195255279541, "global_step": 584325, "epoch": 7040} {"train_loss": -27.781885147094727, "global_step": 584326, "epoch": 7040} {"train_loss": -27.749317169189453, "global_step": 584327, "epoch": 7040} {"train_loss": -27.811798095703125, "global_step": 584328, "epoch": 7040} {"train_loss": -28.086889266967773, "global_step": 584329, "epoch": 7040} {"train_loss": -28.06805992126465, "global_step": 584330, "epoch": 7040} {"train_loss": -28.11582374572754, "global_step": 584331, "epoch": 7040} {"train_loss": -28.241016387939453, "global_step": 584332, "epoch": 7040} {"train_loss": -27.992963790893555, "global_step": 584333, "epoch": 7040} {"train_loss": -27.286041259765625, "global_step": 584334, "epoch": 7040} {"train_loss": -28.16554832458496, "global_step": 584335, "epoch": 7040} {"train_loss": -28.072607040405273, "global_step": 584336, "epoch": 7040} {"train_loss": -27.810016632080078, "global_step": 584337, "epoch": 7040} {"train_loss": -27.84037208557129, "global_step": 584338, "epoch": 7040} {"train_loss": -28.3194580078125, "global_step": 584339, "epoch": 7040} {"train_loss": -28.147586822509766, "global_step": 584340, "epoch": 7040} {"train_loss": -28.09779167175293, "global_step": 584341, "epoch": 7040} {"train_loss": -27.871686935424805, "global_step": 584342, "epoch": 7040} {"train_loss": -27.739896774291992, "global_step": 584343, "epoch": 7040} {"train_loss": -27.837080001831055, "global_step": 584344, "epoch": 7040} {"train_loss": -28.04021644592285, "global_step": 584345, "epoch": 7040} {"train_loss": -28.179636001586914, "global_step": 584346, "epoch": 7040} {"train_loss": -27.882410049438477, "global_step": 584347, "epoch": 7040} {"train_loss": -28.347003936767578, "global_step": 584348, "epoch": 7040} {"train_loss": -27.8975887298584, "global_step": 584349, "epoch": 7040} {"train_loss": -27.625600814819336, "global_step": 584350, "epoch": 7040} {"train_loss": -28.006811141967773, "global_step": 584351, "epoch": 7040} {"train_loss": -27.66855239868164, "global_step": 584352, "epoch": 7040} {"train_loss": -28.267566680908203, "global_step": 584353, "epoch": 7040} {"train_loss": -28.40315055847168, "global_step": 584354, "epoch": 7040} {"train_loss": -27.8197021484375, "global_step": 584355, "epoch": 7040} {"train_loss": -27.625720977783203, "global_step": 584356, "epoch": 7040} {"train_loss": -27.862436294555664, "global_step": 584357, "epoch": 7040} {"train_loss": -27.83131217956543, "global_step": 584358, "epoch": 7040} {"train_loss": -27.995101928710938, "global_step": 584359, "epoch": 7040} {"train_loss": -28.192243576049805, "global_step": 584360, "epoch": 7040} {"train_loss": -27.955951690673828, "global_step": 584361, "epoch": 7040} {"train_loss": -28.200347900390625, "global_step": 584362, "epoch": 7040} {"train_loss": -28.10957145690918, "global_step": 584363, "epoch": 7040} {"train_loss": -27.93079948425293, "global_step": 584364, "epoch": 7040} {"train_loss": -27.64912223815918, "global_step": 584365, "epoch": 7040} {"train_loss": -27.816482543945312, "global_step": 584366, "epoch": 7040} {"train_loss": -28.020193099975586, "global_step": 584367, "epoch": 7040} {"train_loss": -28.2274112701416, "global_step": 584368, "epoch": 7040} {"train_loss": -27.690887451171875, "global_step": 584369, "epoch": 7040} {"train_loss": -28.360034942626953, "global_step": 584370, "epoch": 7040} {"train_loss": -27.69915771484375, "global_step": 584371, "epoch": 7040} {"train_loss": -27.502832412719727, "global_step": 584372, "epoch": 7040} {"train_loss": -27.722015380859375, "global_step": 584373, "epoch": 7040} {"train_loss": -28.460723876953125, "global_step": 584374, "epoch": 7040} {"train_loss": -28.044830322265625, "global_step": 584375, "epoch": 7040} {"train_loss": -28.0181941986084, "global_step": 584376, "epoch": 7040} {"train_loss": -27.983076095581055, "global_step": 584377, "epoch": 7040} {"train_loss": -27.605085372924805, "global_step": 584378, "epoch": 7040} {"train_loss": -27.55999755859375, "global_step": 584379, "epoch": 7040} {"train_loss": -27.831634521484375, "global_step": 584380, "epoch": 7040} {"train_loss": -28.102094650268555, "global_step": 584381, "epoch": 7040} {"train_loss": -28.181161880493164, "global_step": 584382, "epoch": 7040} {"train_loss": -28.041196823120117, "global_step": 584383, "epoch": 7040} {"train_loss": -28.0727596282959, "global_step": 584384, "epoch": 7040} {"train_loss": -28.127660751342773, "global_step": 584385, "epoch": 7040} {"train_loss": -27.972583770751953, "global_step": 584386, "epoch": 7040} {"train_loss": -28.370849609375, "global_step": 584387, "epoch": 7040} {"train_loss": -28.133359909057617, "global_step": 584388, "epoch": 7040} {"train_loss": -27.9334774017334, "global_step": 584389, "epoch": 7040} {"train_loss": -28.202863693237305, "global_step": 584390, "epoch": 7040} {"train_loss": -27.77482032775879, "global_step": 584391, "epoch": 7040} {"train_loss": -28.075668334960938, "global_step": 584392, "epoch": 7040} {"train_loss": -27.8573055267334, "global_step": 584393, "epoch": 7040} {"train_loss": -27.990036010742188, "global_step": 584394, "epoch": 7040} {"train_loss": -27.667972564697266, "global_step": 584395, "epoch": 7040} {"train_loss": -27.975238800048828, "global_step": 584396, "epoch": 7040} {"train_loss": -28.084585189819336, "global_step": 584397, "epoch": 7040} {"train_loss": -27.713476181030273, "global_step": 584398, "epoch": 7040} {"train_loss": -27.769001007080078, "global_step": 584399, "epoch": 7040} {"train_loss": -28.273351669311523, "global_step": 584400, "epoch": 7040} {"train_loss": -27.894088745117188, "global_step": 584401, "epoch": 7040} {"train_loss": -27.944812843598516, "global_step": 584402, "epoch": 7040, "val_loss": 6733222.0} {"train_loss": -27.408618927001953, "global_step": 584403, "epoch": 7041} {"train_loss": -27.189367294311523, "global_step": 584404, "epoch": 7041} {"train_loss": -27.0339298248291, "global_step": 584405, "epoch": 7041} {"train_loss": -27.366870880126953, "global_step": 584406, "epoch": 7041} {"train_loss": -27.340961456298828, "global_step": 584407, "epoch": 7041} {"train_loss": -26.98895835876465, "global_step": 584408, "epoch": 7041} {"train_loss": -27.414798736572266, "global_step": 584409, "epoch": 7041} {"train_loss": -27.874963760375977, "global_step": 584410, "epoch": 7041} {"train_loss": -26.89344596862793, "global_step": 584411, "epoch": 7041} {"train_loss": -27.391096115112305, "global_step": 584412, "epoch": 7041} {"train_loss": -27.114505767822266, "global_step": 584413, "epoch": 7041} {"train_loss": -27.3320255279541, "global_step": 584414, "epoch": 7041} {"train_loss": -27.52298927307129, "global_step": 584415, "epoch": 7041} {"train_loss": -27.279462814331055, "global_step": 584416, "epoch": 7041} {"train_loss": -27.410125732421875, "global_step": 584417, "epoch": 7041} {"train_loss": -27.39347267150879, "global_step": 584418, "epoch": 7041} {"train_loss": -26.962478637695312, "global_step": 584419, "epoch": 7041} {"train_loss": -27.36355972290039, "global_step": 584420, "epoch": 7041} {"train_loss": -27.704275131225586, "global_step": 584421, "epoch": 7041} {"train_loss": -27.493518829345703, "global_step": 584422, "epoch": 7041} {"train_loss": -27.682300567626953, "global_step": 584423, "epoch": 7041} {"train_loss": -27.625436782836914, "global_step": 584424, "epoch": 7041} {"train_loss": -27.53279685974121, "global_step": 584425, "epoch": 7041} {"train_loss": -27.788808822631836, "global_step": 584426, "epoch": 7041} {"train_loss": -27.386159896850586, "global_step": 584427, "epoch": 7041} {"train_loss": -27.646106719970703, "global_step": 584428, "epoch": 7041} {"train_loss": -27.76167106628418, "global_step": 584429, "epoch": 7041} {"train_loss": -27.658117294311523, "global_step": 584430, "epoch": 7041} {"train_loss": -27.973331451416016, "global_step": 584431, "epoch": 7041} {"train_loss": -27.687543869018555, "global_step": 584432, "epoch": 7041} {"train_loss": -27.607126235961914, "global_step": 584433, "epoch": 7041} {"train_loss": -27.923187255859375, "global_step": 584434, "epoch": 7041} {"train_loss": -27.706098556518555, "global_step": 584435, "epoch": 7041} {"train_loss": -27.67498779296875, "global_step": 584436, "epoch": 7041} {"train_loss": -27.592273712158203, "global_step": 584437, "epoch": 7041} {"train_loss": -27.802404403686523, "global_step": 584438, "epoch": 7041} {"train_loss": -27.68006706237793, "global_step": 584439, "epoch": 7041} {"train_loss": -27.92034339904785, "global_step": 584440, "epoch": 7041} {"train_loss": -27.952838897705078, "global_step": 584441, "epoch": 7041} {"train_loss": -27.8241024017334, "global_step": 584442, "epoch": 7041} {"train_loss": -28.236160278320312, "global_step": 584443, "epoch": 7041} {"train_loss": -28.264739990234375, "global_step": 584444, "epoch": 7041} {"train_loss": -28.088354110717773, "global_step": 584445, "epoch": 7041} {"train_loss": -27.517309188842773, "global_step": 584446, "epoch": 7041} {"train_loss": -28.302490234375, "global_step": 584447, "epoch": 7041} {"train_loss": -28.2473201751709, "global_step": 584448, "epoch": 7041} {"train_loss": -28.127735137939453, "global_step": 584449, "epoch": 7041} {"train_loss": -27.964811325073242, "global_step": 584450, "epoch": 7041} {"train_loss": -27.995569229125977, "global_step": 584451, "epoch": 7041} {"train_loss": -28.366947174072266, "global_step": 584452, "epoch": 7041} {"train_loss": -28.132709503173828, "global_step": 584453, "epoch": 7041} {"train_loss": -28.022872924804688, "global_step": 584454, "epoch": 7041} {"train_loss": -27.930099487304688, "global_step": 584455, "epoch": 7041} {"train_loss": -27.865644454956055, "global_step": 584456, "epoch": 7041} {"train_loss": -28.2005672454834, "global_step": 584457, "epoch": 7041} {"train_loss": -28.095388412475586, "global_step": 584458, "epoch": 7041} {"train_loss": -28.358938217163086, "global_step": 584459, "epoch": 7041} {"train_loss": -27.953323364257812, "global_step": 584460, "epoch": 7041} {"train_loss": -28.01478385925293, "global_step": 584461, "epoch": 7041} {"train_loss": -28.248151779174805, "global_step": 584462, "epoch": 7041} {"train_loss": -28.16485595703125, "global_step": 584463, "epoch": 7041} {"train_loss": -28.329431533813477, "global_step": 584464, "epoch": 7041} {"train_loss": -28.155517578125, "global_step": 584465, "epoch": 7041} {"train_loss": -28.221906661987305, "global_step": 584466, "epoch": 7041} {"train_loss": -27.897130966186523, "global_step": 584467, "epoch": 7041} {"train_loss": -27.138427734375, "global_step": 584468, "epoch": 7041} {"train_loss": -26.9786319732666, "global_step": 584469, "epoch": 7041} {"train_loss": -26.87605094909668, "global_step": 584470, "epoch": 7041} {"train_loss": -26.733789443969727, "global_step": 584471, "epoch": 7041} {"train_loss": -28.0872859954834, "global_step": 584472, "epoch": 7041} {"train_loss": -27.422382354736328, "global_step": 584473, "epoch": 7041} {"train_loss": -27.349822998046875, "global_step": 584474, "epoch": 7041} {"train_loss": -26.82877540588379, "global_step": 584475, "epoch": 7041} {"train_loss": -27.30682373046875, "global_step": 584476, "epoch": 7041} {"train_loss": -27.4080753326416, "global_step": 584477, "epoch": 7041} {"train_loss": -27.651386260986328, "global_step": 584478, "epoch": 7041} {"train_loss": -27.01044273376465, "global_step": 584479, "epoch": 7041} {"train_loss": -27.888214111328125, "global_step": 584480, "epoch": 7041} {"train_loss": -27.601099014282227, "global_step": 584481, "epoch": 7041} {"train_loss": -27.47234535217285, "global_step": 584482, "epoch": 7041} {"train_loss": -27.690637588500977, "global_step": 584483, "epoch": 7041} {"train_loss": -27.94339370727539, "global_step": 584484, "epoch": 7041} {"train_loss": -27.666533228862715, "global_step": 584485, "epoch": 7041, "val_loss": 6751360.5} {"train_loss": -27.079029083251953, "global_step": 584486, "epoch": 7042} {"train_loss": -26.514001846313477, "global_step": 584487, "epoch": 7042} {"train_loss": -27.25448989868164, "global_step": 584488, "epoch": 7042} {"train_loss": -26.76604652404785, "global_step": 584489, "epoch": 7042} {"train_loss": -27.216064453125, "global_step": 584490, "epoch": 7042} {"train_loss": -26.978784561157227, "global_step": 584491, "epoch": 7042} {"train_loss": -27.018911361694336, "global_step": 584492, "epoch": 7042} {"train_loss": -27.471899032592773, "global_step": 584493, "epoch": 7042} {"train_loss": -27.515356063842773, "global_step": 584494, "epoch": 7042} {"train_loss": -27.495630264282227, "global_step": 584495, "epoch": 7042} {"train_loss": -27.205957412719727, "global_step": 584496, "epoch": 7042} {"train_loss": -27.25406265258789, "global_step": 584497, "epoch": 7042} {"train_loss": -27.184690475463867, "global_step": 584498, "epoch": 7042} {"train_loss": -27.712167739868164, "global_step": 584499, "epoch": 7042} {"train_loss": -27.60648536682129, "global_step": 584500, "epoch": 7042} {"train_loss": -27.305774688720703, "global_step": 584501, "epoch": 7042} {"train_loss": -27.351581573486328, "global_step": 584502, "epoch": 7042} {"train_loss": -27.895023345947266, "global_step": 584503, "epoch": 7042} {"train_loss": -27.282968521118164, "global_step": 584504, "epoch": 7042} {"train_loss": -27.65494155883789, "global_step": 584505, "epoch": 7042} {"train_loss": -27.985403060913086, "global_step": 584506, "epoch": 7042} {"train_loss": -27.756235122680664, "global_step": 584507, "epoch": 7042} {"train_loss": -27.450605392456055, "global_step": 584508, "epoch": 7042} {"train_loss": -27.714365005493164, "global_step": 584509, "epoch": 7042} {"train_loss": -27.739627838134766, "global_step": 584510, "epoch": 7042} {"train_loss": -28.056432723999023, "global_step": 584511, "epoch": 7042} {"train_loss": -28.01661491394043, "global_step": 584512, "epoch": 7042} {"train_loss": -28.01828384399414, "global_step": 584513, "epoch": 7042} {"train_loss": -27.81884765625, "global_step": 584514, "epoch": 7042} {"train_loss": -27.908658981323242, "global_step": 584515, "epoch": 7042} {"train_loss": -27.588764190673828, "global_step": 584516, "epoch": 7042} {"train_loss": -28.019556045532227, "global_step": 584517, "epoch": 7042} {"train_loss": -27.5972900390625, "global_step": 584518, "epoch": 7042} {"train_loss": -28.091251373291016, "global_step": 584519, "epoch": 7042} {"train_loss": -28.096715927124023, "global_step": 584520, "epoch": 7042} {"train_loss": -28.15359878540039, "global_step": 584521, "epoch": 7042} {"train_loss": -28.48142433166504, "global_step": 584522, "epoch": 7042} {"train_loss": -28.186548233032227, "global_step": 584523, "epoch": 7042} {"train_loss": -28.491018295288086, "global_step": 584524, "epoch": 7042} {"train_loss": -27.95191764831543, "global_step": 584525, "epoch": 7042} {"train_loss": -28.04827308654785, "global_step": 584526, "epoch": 7042} {"train_loss": -28.0119571685791, "global_step": 584527, "epoch": 7042} {"train_loss": -28.07474136352539, "global_step": 584528, "epoch": 7042} {"train_loss": -28.187475204467773, "global_step": 584529, "epoch": 7042} {"train_loss": -28.114124298095703, "global_step": 584530, "epoch": 7042} {"train_loss": -28.02459716796875, "global_step": 584531, "epoch": 7042} {"train_loss": -28.14997673034668, "global_step": 584532, "epoch": 7042} {"train_loss": -27.596485137939453, "global_step": 584533, "epoch": 7042} {"train_loss": -28.078657150268555, "global_step": 584534, "epoch": 7042} {"train_loss": -27.930145263671875, "global_step": 584535, "epoch": 7042} {"train_loss": -27.73379898071289, "global_step": 584536, "epoch": 7042} {"train_loss": -27.89716148376465, "global_step": 584537, "epoch": 7042} {"train_loss": -28.05425453186035, "global_step": 584538, "epoch": 7042} {"train_loss": -27.995336532592773, "global_step": 584539, "epoch": 7042} {"train_loss": -27.690332412719727, "global_step": 584540, "epoch": 7042} {"train_loss": -27.772876739501953, "global_step": 584541, "epoch": 7042} {"train_loss": -28.081796646118164, "global_step": 584542, "epoch": 7042} {"train_loss": -28.061420440673828, "global_step": 584543, "epoch": 7042} {"train_loss": -28.332666397094727, "global_step": 584544, "epoch": 7042} {"train_loss": -28.10565185546875, "global_step": 584545, "epoch": 7042} {"train_loss": -27.952224731445312, "global_step": 584546, "epoch": 7042} {"train_loss": -27.914203643798828, "global_step": 584547, "epoch": 7042} {"train_loss": -27.77322769165039, "global_step": 584548, "epoch": 7042} {"train_loss": -28.37529945373535, "global_step": 584549, "epoch": 7042} {"train_loss": -27.9475040435791, "global_step": 584550, "epoch": 7042} {"train_loss": -27.854272842407227, "global_step": 584551, "epoch": 7042} {"train_loss": -27.6937198638916, "global_step": 584552, "epoch": 7042} {"train_loss": -27.8452091217041, "global_step": 584553, "epoch": 7042} {"train_loss": -28.041662216186523, "global_step": 584554, "epoch": 7042} {"train_loss": -27.979578018188477, "global_step": 584555, "epoch": 7042} {"train_loss": -27.420801162719727, "global_step": 584556, "epoch": 7042} {"train_loss": -27.948780059814453, "global_step": 584557, "epoch": 7042} {"train_loss": -27.997238159179688, "global_step": 584558, "epoch": 7042} {"train_loss": -27.90341567993164, "global_step": 584559, "epoch": 7042} {"train_loss": -28.28578758239746, "global_step": 584560, "epoch": 7042} {"train_loss": -27.96868896484375, "global_step": 584561, "epoch": 7042} {"train_loss": -27.789905548095703, "global_step": 584562, "epoch": 7042} {"train_loss": -28.044050216674805, "global_step": 584563, "epoch": 7042} {"train_loss": -27.69283103942871, "global_step": 584564, "epoch": 7042} {"train_loss": -28.137304306030273, "global_step": 584565, "epoch": 7042} {"train_loss": -27.67377281188965, "global_step": 584566, "epoch": 7042} {"train_loss": -28.161848068237305, "global_step": 584567, "epoch": 7042} {"train_loss": -27.812389626560442, "global_step": 584568, "epoch": 7042, "val_loss": 6679051.5} {"train_loss": -27.076648712158203, "global_step": 584569, "epoch": 7043} {"train_loss": -27.123788833618164, "global_step": 584570, "epoch": 7043} {"train_loss": -27.449460983276367, "global_step": 584571, "epoch": 7043} {"train_loss": -27.63991355895996, "global_step": 584572, "epoch": 7043} {"train_loss": -27.212244033813477, "global_step": 584573, "epoch": 7043} {"train_loss": -27.035120010375977, "global_step": 584574, "epoch": 7043} {"train_loss": -27.12591552734375, "global_step": 584575, "epoch": 7043} {"train_loss": -27.345136642456055, "global_step": 584576, "epoch": 7043} {"train_loss": -27.51470947265625, "global_step": 584577, "epoch": 7043} {"train_loss": -27.538818359375, "global_step": 584578, "epoch": 7043} {"train_loss": -27.660221099853516, "global_step": 584579, "epoch": 7043} {"train_loss": -27.736316680908203, "global_step": 584580, "epoch": 7043} {"train_loss": -27.4134578704834, "global_step": 584581, "epoch": 7043} {"train_loss": -27.867572784423828, "global_step": 584582, "epoch": 7043} {"train_loss": -27.604772567749023, "global_step": 584583, "epoch": 7043} {"train_loss": -27.0235652923584, "global_step": 584584, "epoch": 7043} {"train_loss": -27.503070831298828, "global_step": 584585, "epoch": 7043} {"train_loss": -27.63555908203125, "global_step": 584586, "epoch": 7043} {"train_loss": -27.1783390045166, "global_step": 584587, "epoch": 7043} {"train_loss": -27.861713409423828, "global_step": 584588, "epoch": 7043} {"train_loss": -27.726734161376953, "global_step": 584589, "epoch": 7043} {"train_loss": -27.337095260620117, "global_step": 584590, "epoch": 7043} {"train_loss": -27.205127716064453, "global_step": 584591, "epoch": 7043} {"train_loss": -27.63947868347168, "global_step": 584592, "epoch": 7043} {"train_loss": -27.90155601501465, "global_step": 584593, "epoch": 7043} {"train_loss": -27.404285430908203, "global_step": 584594, "epoch": 7043} {"train_loss": -28.026782989501953, "global_step": 584595, "epoch": 7043} {"train_loss": -27.670215606689453, "global_step": 584596, "epoch": 7043} {"train_loss": -27.50248146057129, "global_step": 584597, "epoch": 7043} {"train_loss": -27.552799224853516, "global_step": 584598, "epoch": 7043} {"train_loss": -27.76297950744629, "global_step": 584599, "epoch": 7043} {"train_loss": -27.890607833862305, "global_step": 584600, "epoch": 7043} {"train_loss": -28.03413963317871, "global_step": 584601, "epoch": 7043} {"train_loss": -28.099088668823242, "global_step": 584602, "epoch": 7043} {"train_loss": -28.066303253173828, "global_step": 584603, "epoch": 7043} {"train_loss": -27.922332763671875, "global_step": 584604, "epoch": 7043} {"train_loss": -27.79375648498535, "global_step": 584605, "epoch": 7043} {"train_loss": -28.174245834350586, "global_step": 584606, "epoch": 7043} {"train_loss": -28.235212326049805, "global_step": 584607, "epoch": 7043} {"train_loss": -27.84722900390625, "global_step": 584608, "epoch": 7043} {"train_loss": -27.85206413269043, "global_step": 584609, "epoch": 7043} {"train_loss": -28.130084991455078, "global_step": 584610, "epoch": 7043} {"train_loss": -28.12299919128418, "global_step": 584611, "epoch": 7043} {"train_loss": -28.268613815307617, "global_step": 584612, "epoch": 7043} {"train_loss": -28.23029899597168, "global_step": 584613, "epoch": 7043} {"train_loss": -28.07699966430664, "global_step": 584614, "epoch": 7043} {"train_loss": -28.04578971862793, "global_step": 584615, "epoch": 7043} {"train_loss": -28.29559898376465, "global_step": 584616, "epoch": 7043} {"train_loss": -28.028675079345703, "global_step": 584617, "epoch": 7043} {"train_loss": -28.051593780517578, "global_step": 584618, "epoch": 7043} {"train_loss": -27.980518341064453, "global_step": 584619, "epoch": 7043} {"train_loss": -27.762069702148438, "global_step": 584620, "epoch": 7043} {"train_loss": -28.05436134338379, "global_step": 584621, "epoch": 7043} {"train_loss": -28.00649070739746, "global_step": 584622, "epoch": 7043} {"train_loss": -28.10004997253418, "global_step": 584623, "epoch": 7043} {"train_loss": -28.201404571533203, "global_step": 584624, "epoch": 7043} {"train_loss": -28.12306022644043, "global_step": 584625, "epoch": 7043} {"train_loss": -27.983495712280273, "global_step": 584626, "epoch": 7043} {"train_loss": -27.918243408203125, "global_step": 584627, "epoch": 7043} {"train_loss": -28.469146728515625, "global_step": 584628, "epoch": 7043} {"train_loss": -28.378183364868164, "global_step": 584629, "epoch": 7043} {"train_loss": -28.161706924438477, "global_step": 584630, "epoch": 7043} {"train_loss": -27.486087799072266, "global_step": 584631, "epoch": 7043} {"train_loss": -27.413755416870117, "global_step": 584632, "epoch": 7043} {"train_loss": -27.776355743408203, "global_step": 584633, "epoch": 7043} {"train_loss": -27.760059356689453, "global_step": 584634, "epoch": 7043} {"train_loss": -27.939289093017578, "global_step": 584635, "epoch": 7043} {"train_loss": -28.02569580078125, "global_step": 584636, "epoch": 7043} {"train_loss": -28.2830810546875, "global_step": 584637, "epoch": 7043} {"train_loss": -27.9444522857666, "global_step": 584638, "epoch": 7043} {"train_loss": -27.761859893798828, "global_step": 584639, "epoch": 7043} {"train_loss": -27.79859733581543, "global_step": 584640, "epoch": 7043} {"train_loss": -27.97662353515625, "global_step": 584641, "epoch": 7043} {"train_loss": -27.417078018188477, "global_step": 584642, "epoch": 7043} {"train_loss": -27.65713882446289, "global_step": 584643, "epoch": 7043} {"train_loss": -27.986921310424805, "global_step": 584644, "epoch": 7043} {"train_loss": -28.133880615234375, "global_step": 584645, "epoch": 7043} {"train_loss": -27.837661743164062, "global_step": 584646, "epoch": 7043} {"train_loss": -27.62660026550293, "global_step": 584647, "epoch": 7043} {"train_loss": -27.306568145751953, "global_step": 584648, "epoch": 7043} {"train_loss": -27.90231704711914, "global_step": 584649, "epoch": 7043} {"train_loss": -27.947118759155273, "global_step": 584650, "epoch": 7043} {"train_loss": -27.771001494074444, "global_step": 584651, "epoch": 7043, "val_loss": 6655296.0} {"train_loss": -26.787073135375977, "global_step": 584652, "epoch": 7044} {"train_loss": -27.537342071533203, "global_step": 584653, "epoch": 7044} {"train_loss": -27.103723526000977, "global_step": 584654, "epoch": 7044} {"train_loss": -27.252044677734375, "global_step": 584655, "epoch": 7044} {"train_loss": -26.603382110595703, "global_step": 584656, "epoch": 7044} {"train_loss": -27.069583892822266, "global_step": 584657, "epoch": 7044} {"train_loss": -26.73175621032715, "global_step": 584658, "epoch": 7044} {"train_loss": -27.397268295288086, "global_step": 584659, "epoch": 7044} {"train_loss": -27.6588191986084, "global_step": 584660, "epoch": 7044} {"train_loss": -27.60003662109375, "global_step": 584661, "epoch": 7044} {"train_loss": -27.618499755859375, "global_step": 584662, "epoch": 7044} {"train_loss": -27.353321075439453, "global_step": 584663, "epoch": 7044} {"train_loss": -27.659704208374023, "global_step": 584664, "epoch": 7044} {"train_loss": -27.573163986206055, "global_step": 584665, "epoch": 7044} {"train_loss": -27.598114013671875, "global_step": 584666, "epoch": 7044} {"train_loss": -27.570363998413086, "global_step": 584667, "epoch": 7044} {"train_loss": -27.38727378845215, "global_step": 584668, "epoch": 7044} {"train_loss": -27.901769638061523, "global_step": 584669, "epoch": 7044} {"train_loss": -27.4311580657959, "global_step": 584670, "epoch": 7044} {"train_loss": -27.795068740844727, "global_step": 584671, "epoch": 7044} {"train_loss": -27.63177490234375, "global_step": 584672, "epoch": 7044} {"train_loss": -27.703510284423828, "global_step": 584673, "epoch": 7044} {"train_loss": -27.556676864624023, "global_step": 584674, "epoch": 7044} {"train_loss": -27.790937423706055, "global_step": 584675, "epoch": 7044} {"train_loss": -27.909210205078125, "global_step": 584676, "epoch": 7044} {"train_loss": -27.741418838500977, "global_step": 584677, "epoch": 7044} {"train_loss": -27.65583610534668, "global_step": 584678, "epoch": 7044} {"train_loss": -27.749637603759766, "global_step": 584679, "epoch": 7044} {"train_loss": -27.513269424438477, "global_step": 584680, "epoch": 7044} {"train_loss": -27.826129913330078, "global_step": 584681, "epoch": 7044} {"train_loss": -27.71246337890625, "global_step": 584682, "epoch": 7044} {"train_loss": -27.718610763549805, "global_step": 584683, "epoch": 7044} {"train_loss": -27.796142578125, "global_step": 584684, "epoch": 7044} {"train_loss": -27.77581214904785, "global_step": 584685, "epoch": 7044} {"train_loss": -28.122058868408203, "global_step": 584686, "epoch": 7044} {"train_loss": -28.23992919921875, "global_step": 584687, "epoch": 7044} {"train_loss": -27.962194442749023, "global_step": 584688, "epoch": 7044} {"train_loss": -27.88276481628418, "global_step": 584689, "epoch": 7044} {"train_loss": -27.71796226501465, "global_step": 584690, "epoch": 7044} {"train_loss": -28.097000122070312, "global_step": 584691, "epoch": 7044} {"train_loss": -28.448291778564453, "global_step": 584692, "epoch": 7044} {"train_loss": -27.859634399414062, "global_step": 584693, "epoch": 7044} {"train_loss": -28.036558151245117, "global_step": 584694, "epoch": 7044} {"train_loss": -27.93267822265625, "global_step": 584695, "epoch": 7044} {"train_loss": -28.048572540283203, "global_step": 584696, "epoch": 7044} {"train_loss": -28.2166690826416, "global_step": 584697, "epoch": 7044} {"train_loss": -27.896137237548828, "global_step": 584698, "epoch": 7044} {"train_loss": -28.222604751586914, "global_step": 584699, "epoch": 7044} {"train_loss": -28.466796875, "global_step": 584700, "epoch": 7044} {"train_loss": -28.324466705322266, "global_step": 584701, "epoch": 7044} {"train_loss": -27.83026695251465, "global_step": 584702, "epoch": 7044} {"train_loss": -28.129547119140625, "global_step": 584703, "epoch": 7044} {"train_loss": -28.039295196533203, "global_step": 584704, "epoch": 7044} {"train_loss": -27.941137313842773, "global_step": 584705, "epoch": 7044} {"train_loss": -28.19052505493164, "global_step": 584706, "epoch": 7044} {"train_loss": -28.13020133972168, "global_step": 584707, "epoch": 7044} {"train_loss": -28.151227951049805, "global_step": 584708, "epoch": 7044} {"train_loss": -28.030181884765625, "global_step": 584709, "epoch": 7044} {"train_loss": -27.732465744018555, "global_step": 584710, "epoch": 7044} {"train_loss": -27.914091110229492, "global_step": 584711, "epoch": 7044} {"train_loss": -27.790014266967773, "global_step": 584712, "epoch": 7044} {"train_loss": -28.218032836914062, "global_step": 584713, "epoch": 7044} {"train_loss": -27.716909408569336, "global_step": 584714, "epoch": 7044} {"train_loss": -27.70051383972168, "global_step": 584715, "epoch": 7044} {"train_loss": -28.13522720336914, "global_step": 584716, "epoch": 7044} {"train_loss": -28.128576278686523, "global_step": 584717, "epoch": 7044} {"train_loss": -28.013620376586914, "global_step": 584718, "epoch": 7044} {"train_loss": -28.117460250854492, "global_step": 584719, "epoch": 7044} {"train_loss": -27.992101669311523, "global_step": 584720, "epoch": 7044} {"train_loss": -28.411970138549805, "global_step": 584721, "epoch": 7044} {"train_loss": -27.88142204284668, "global_step": 584722, "epoch": 7044} {"train_loss": -27.8994197845459, "global_step": 584723, "epoch": 7044} {"train_loss": -28.152490615844727, "global_step": 584724, "epoch": 7044} {"train_loss": -27.665983200073242, "global_step": 584725, "epoch": 7044} {"train_loss": -27.9760684967041, "global_step": 584726, "epoch": 7044} {"train_loss": -27.802570343017578, "global_step": 584727, "epoch": 7044} {"train_loss": -28.324462890625, "global_step": 584728, "epoch": 7044} {"train_loss": -27.84844398498535, "global_step": 584729, "epoch": 7044} {"train_loss": -27.86580467224121, "global_step": 584730, "epoch": 7044} {"train_loss": -27.67376708984375, "global_step": 584731, "epoch": 7044} {"train_loss": -27.643436431884766, "global_step": 584732, "epoch": 7044} {"train_loss": -27.917896270751953, "global_step": 584733, "epoch": 7044} {"train_loss": -27.79397270478398, "global_step": 584734, "epoch": 7044, "val_loss": 6784487.0} {"train_loss": -27.060285568237305, "global_step": 584735, "epoch": 7045} {"train_loss": -25.098390579223633, "global_step": 584736, "epoch": 7045} {"train_loss": -25.761709213256836, "global_step": 584737, "epoch": 7045} {"train_loss": -26.56241226196289, "global_step": 584738, "epoch": 7045} {"train_loss": -26.511062622070312, "global_step": 584739, "epoch": 7045} {"train_loss": -26.976728439331055, "global_step": 584740, "epoch": 7045} {"train_loss": -26.265966415405273, "global_step": 584741, "epoch": 7045} {"train_loss": -27.54730224609375, "global_step": 584742, "epoch": 7045} {"train_loss": -27.317975997924805, "global_step": 584743, "epoch": 7045} {"train_loss": -27.009580612182617, "global_step": 584744, "epoch": 7045} {"train_loss": -27.09124183654785, "global_step": 584745, "epoch": 7045} {"train_loss": -26.934326171875, "global_step": 584746, "epoch": 7045} {"train_loss": -27.177230834960938, "global_step": 584747, "epoch": 7045} {"train_loss": -27.597156524658203, "global_step": 584748, "epoch": 7045} {"train_loss": -27.42341423034668, "global_step": 584749, "epoch": 7045} {"train_loss": -27.151229858398438, "global_step": 584750, "epoch": 7045} {"train_loss": -27.240467071533203, "global_step": 584751, "epoch": 7045} {"train_loss": -27.537921905517578, "global_step": 584752, "epoch": 7045} {"train_loss": -27.260618209838867, "global_step": 584753, "epoch": 7045} {"train_loss": -27.525182723999023, "global_step": 584754, "epoch": 7045} {"train_loss": -27.465469360351562, "global_step": 584755, "epoch": 7045} {"train_loss": -27.56158447265625, "global_step": 584756, "epoch": 7045} {"train_loss": -27.662826538085938, "global_step": 584757, "epoch": 7045} {"train_loss": -27.526731491088867, "global_step": 584758, "epoch": 7045} {"train_loss": -27.50115394592285, "global_step": 584759, "epoch": 7045} {"train_loss": -28.026611328125, "global_step": 584760, "epoch": 7045} {"train_loss": -27.433042526245117, "global_step": 584761, "epoch": 7045} {"train_loss": -27.670454025268555, "global_step": 584762, "epoch": 7045} {"train_loss": -27.798559188842773, "global_step": 584763, "epoch": 7045} {"train_loss": -27.924047470092773, "global_step": 584764, "epoch": 7045} {"train_loss": -27.666324615478516, "global_step": 584765, "epoch": 7045} {"train_loss": -27.9644775390625, "global_step": 584766, "epoch": 7045} {"train_loss": -27.762876510620117, "global_step": 584767, "epoch": 7045} {"train_loss": -27.660938262939453, "global_step": 584768, "epoch": 7045} {"train_loss": -27.9389591217041, "global_step": 584769, "epoch": 7045} {"train_loss": -27.79485511779785, "global_step": 584770, "epoch": 7045} {"train_loss": -28.089399337768555, "global_step": 584771, "epoch": 7045} {"train_loss": -27.795888900756836, "global_step": 584772, "epoch": 7045} {"train_loss": -28.051959991455078, "global_step": 584773, "epoch": 7045} {"train_loss": -28.139541625976562, "global_step": 584774, "epoch": 7045} {"train_loss": -27.750308990478516, "global_step": 584775, "epoch": 7045} {"train_loss": -27.83550453186035, "global_step": 584776, "epoch": 7045} {"train_loss": -27.93549156188965, "global_step": 584777, "epoch": 7045} {"train_loss": -28.184396743774414, "global_step": 584778, "epoch": 7045} {"train_loss": -27.762939453125, "global_step": 584779, "epoch": 7045} {"train_loss": -28.38091468811035, "global_step": 584780, "epoch": 7045} {"train_loss": -27.6805477142334, "global_step": 584781, "epoch": 7045} {"train_loss": -28.19716453552246, "global_step": 584782, "epoch": 7045} {"train_loss": -28.02724266052246, "global_step": 584783, "epoch": 7045} {"train_loss": -27.868579864501953, "global_step": 584784, "epoch": 7045} {"train_loss": -27.534351348876953, "global_step": 584785, "epoch": 7045} {"train_loss": -27.6966552734375, "global_step": 584786, "epoch": 7045} {"train_loss": -27.837268829345703, "global_step": 584787, "epoch": 7045} {"train_loss": -27.822528839111328, "global_step": 584788, "epoch": 7045} {"train_loss": -27.847213745117188, "global_step": 584789, "epoch": 7045} {"train_loss": -27.874582290649414, "global_step": 584790, "epoch": 7045} {"train_loss": -27.752674102783203, "global_step": 584791, "epoch": 7045} {"train_loss": -28.192646026611328, "global_step": 584792, "epoch": 7045} {"train_loss": -27.9300594329834, "global_step": 584793, "epoch": 7045} {"train_loss": -27.84803581237793, "global_step": 584794, "epoch": 7045} {"train_loss": -27.8172607421875, "global_step": 584795, "epoch": 7045} {"train_loss": -28.096158981323242, "global_step": 584796, "epoch": 7045} {"train_loss": -27.719745635986328, "global_step": 584797, "epoch": 7045} {"train_loss": -28.140531539916992, "global_step": 584798, "epoch": 7045} {"train_loss": -28.17652702331543, "global_step": 584799, "epoch": 7045} {"train_loss": -27.768970489501953, "global_step": 584800, "epoch": 7045} {"train_loss": -28.114761352539062, "global_step": 584801, "epoch": 7045} {"train_loss": -28.327077865600586, "global_step": 584802, "epoch": 7045} {"train_loss": -28.10049819946289, "global_step": 584803, "epoch": 7045} {"train_loss": -28.292844772338867, "global_step": 584804, "epoch": 7045} {"train_loss": -28.304325103759766, "global_step": 584805, "epoch": 7045} {"train_loss": -28.052770614624023, "global_step": 584806, "epoch": 7045} {"train_loss": -28.238256454467773, "global_step": 584807, "epoch": 7045} {"train_loss": -27.69645118713379, "global_step": 584808, "epoch": 7045} {"train_loss": -27.925016403198242, "global_step": 584809, "epoch": 7045} {"train_loss": -28.440998077392578, "global_step": 584810, "epoch": 7045} {"train_loss": -28.074237823486328, "global_step": 584811, "epoch": 7045} {"train_loss": -27.610395431518555, "global_step": 584812, "epoch": 7045} {"train_loss": -27.766340255737305, "global_step": 584813, "epoch": 7045} {"train_loss": -27.708316802978516, "global_step": 584814, "epoch": 7045} {"train_loss": -28.02105712890625, "global_step": 584815, "epoch": 7045} {"train_loss": -27.638080596923828, "global_step": 584816, "epoch": 7045} {"train_loss": -27.676012682627483, "global_step": 584817, "epoch": 7045, "val_loss": 6695716.5} {"train_loss": -27.309280395507812, "global_step": 584818, "epoch": 7046} {"train_loss": -25.88006019592285, "global_step": 584819, "epoch": 7046} {"train_loss": -27.02268409729004, "global_step": 584820, "epoch": 7046} {"train_loss": -27.126157760620117, "global_step": 584821, "epoch": 7046} {"train_loss": -26.875112533569336, "global_step": 584822, "epoch": 7046} {"train_loss": -26.910730361938477, "global_step": 584823, "epoch": 7046} {"train_loss": -27.515033721923828, "global_step": 584824, "epoch": 7046} {"train_loss": -26.88926124572754, "global_step": 584825, "epoch": 7046} {"train_loss": -26.877904891967773, "global_step": 584826, "epoch": 7046} {"train_loss": -27.483251571655273, "global_step": 584827, "epoch": 7046} {"train_loss": -27.17698097229004, "global_step": 584828, "epoch": 7046} {"train_loss": -27.7902889251709, "global_step": 584829, "epoch": 7046} {"train_loss": -27.26907730102539, "global_step": 584830, "epoch": 7046} {"train_loss": -27.32477378845215, "global_step": 584831, "epoch": 7046} {"train_loss": -27.060443878173828, "global_step": 584832, "epoch": 7046} {"train_loss": -27.113666534423828, "global_step": 584833, "epoch": 7046} {"train_loss": -27.492767333984375, "global_step": 584834, "epoch": 7046} {"train_loss": -27.970001220703125, "global_step": 584835, "epoch": 7046} {"train_loss": -27.519861221313477, "global_step": 584836, "epoch": 7046} {"train_loss": -27.48097801208496, "global_step": 584837, "epoch": 7046} {"train_loss": -27.118900299072266, "global_step": 584838, "epoch": 7046} {"train_loss": -27.677305221557617, "global_step": 584839, "epoch": 7046} {"train_loss": -27.50812339782715, "global_step": 584840, "epoch": 7046} {"train_loss": -27.495468139648438, "global_step": 584841, "epoch": 7046} {"train_loss": -27.817581176757812, "global_step": 584842, "epoch": 7046} {"train_loss": -27.886993408203125, "global_step": 584843, "epoch": 7046} {"train_loss": -27.43800163269043, "global_step": 584844, "epoch": 7046} {"train_loss": -27.40947914123535, "global_step": 584845, "epoch": 7046} {"train_loss": -27.386184692382812, "global_step": 584846, "epoch": 7046} {"train_loss": -27.731138229370117, "global_step": 584847, "epoch": 7046} {"train_loss": -27.755264282226562, "global_step": 584848, "epoch": 7046} {"train_loss": -27.47353172302246, "global_step": 584849, "epoch": 7046} {"train_loss": -27.266592025756836, "global_step": 584850, "epoch": 7046} {"train_loss": -27.57264518737793, "global_step": 584851, "epoch": 7046} {"train_loss": -27.745161056518555, "global_step": 584852, "epoch": 7046} {"train_loss": -27.54459571838379, "global_step": 584853, "epoch": 7046} {"train_loss": -27.713186264038086, "global_step": 584854, "epoch": 7046} {"train_loss": -27.963361740112305, "global_step": 584855, "epoch": 7046} {"train_loss": -27.88245964050293, "global_step": 584856, "epoch": 7046} {"train_loss": -27.676334381103516, "global_step": 584857, "epoch": 7046} {"train_loss": -27.651655197143555, "global_step": 584858, "epoch": 7046} {"train_loss": -28.090539932250977, "global_step": 584859, "epoch": 7046} {"train_loss": -27.621301651000977, "global_step": 584860, "epoch": 7046} {"train_loss": -27.652063369750977, "global_step": 584861, "epoch": 7046} {"train_loss": -27.70706558227539, "global_step": 584862, "epoch": 7046} {"train_loss": -27.607587814331055, "global_step": 584863, "epoch": 7046} {"train_loss": -28.143539428710938, "global_step": 584864, "epoch": 7046} {"train_loss": -27.55183982849121, "global_step": 584865, "epoch": 7046} {"train_loss": -28.002973556518555, "global_step": 584866, "epoch": 7046} {"train_loss": -28.065814971923828, "global_step": 584867, "epoch": 7046} {"train_loss": -28.3707218170166, "global_step": 584868, "epoch": 7046} {"train_loss": -27.80732536315918, "global_step": 584869, "epoch": 7046} {"train_loss": -28.06288719177246, "global_step": 584870, "epoch": 7046} {"train_loss": -28.004560470581055, "global_step": 584871, "epoch": 7046} {"train_loss": -27.938749313354492, "global_step": 584872, "epoch": 7046} {"train_loss": -28.157703399658203, "global_step": 584873, "epoch": 7046} {"train_loss": -27.718042373657227, "global_step": 584874, "epoch": 7046} {"train_loss": -27.885009765625, "global_step": 584875, "epoch": 7046} {"train_loss": -27.846960067749023, "global_step": 584876, "epoch": 7046} {"train_loss": -27.28046989440918, "global_step": 584877, "epoch": 7046} {"train_loss": -26.275121688842773, "global_step": 584878, "epoch": 7046} {"train_loss": -25.041330337524414, "global_step": 584879, "epoch": 7046} {"train_loss": -25.604475021362305, "global_step": 584880, "epoch": 7046} {"train_loss": -25.98004150390625, "global_step": 584881, "epoch": 7046} {"train_loss": -26.235029220581055, "global_step": 584882, "epoch": 7046} {"train_loss": -28.14631462097168, "global_step": 584883, "epoch": 7046} {"train_loss": -26.8260440826416, "global_step": 584884, "epoch": 7046} {"train_loss": -27.411680221557617, "global_step": 584885, "epoch": 7046} {"train_loss": -27.460233688354492, "global_step": 584886, "epoch": 7046} {"train_loss": -26.978422164916992, "global_step": 584887, "epoch": 7046} {"train_loss": -27.11903190612793, "global_step": 584888, "epoch": 7046} {"train_loss": -27.47938346862793, "global_step": 584889, "epoch": 7046} {"train_loss": -27.18194580078125, "global_step": 584890, "epoch": 7046} {"train_loss": -27.38319206237793, "global_step": 584891, "epoch": 7046} {"train_loss": -27.459735870361328, "global_step": 584892, "epoch": 7046} {"train_loss": -27.71146011352539, "global_step": 584893, "epoch": 7046} {"train_loss": -27.672199249267578, "global_step": 584894, "epoch": 7046} {"train_loss": -27.849828720092773, "global_step": 584895, "epoch": 7046} {"train_loss": -27.627811431884766, "global_step": 584896, "epoch": 7046} {"train_loss": -27.591190338134766, "global_step": 584897, "epoch": 7046} {"train_loss": -27.86836814880371, "global_step": 584898, "epoch": 7046} {"train_loss": -27.704044342041016, "global_step": 584899, "epoch": 7046} {"train_loss": -27.434377095785486, "global_step": 584900, "epoch": 7046, "val_loss": 6638175.0} {"train_loss": -27.2116641998291, "global_step": 584901, "epoch": 7047} {"train_loss": -27.33156394958496, "global_step": 584902, "epoch": 7047} {"train_loss": -27.14592933654785, "global_step": 584903, "epoch": 7047} {"train_loss": -27.347797393798828, "global_step": 584904, "epoch": 7047} {"train_loss": -27.18008804321289, "global_step": 584905, "epoch": 7047} {"train_loss": -27.4500732421875, "global_step": 584906, "epoch": 7047} {"train_loss": -27.59797477722168, "global_step": 584907, "epoch": 7047} {"train_loss": -27.45966911315918, "global_step": 584908, "epoch": 7047} {"train_loss": -27.613279342651367, "global_step": 584909, "epoch": 7047} {"train_loss": -27.67335319519043, "global_step": 584910, "epoch": 7047} {"train_loss": -27.29733657836914, "global_step": 584911, "epoch": 7047} {"train_loss": -27.6374454498291, "global_step": 584912, "epoch": 7047} {"train_loss": -27.548175811767578, "global_step": 584913, "epoch": 7047} {"train_loss": -27.4768009185791, "global_step": 584914, "epoch": 7047} {"train_loss": -27.801990509033203, "global_step": 584915, "epoch": 7047} {"train_loss": -27.21602439880371, "global_step": 584916, "epoch": 7047} {"train_loss": -27.709003448486328, "global_step": 584917, "epoch": 7047} {"train_loss": -27.4184627532959, "global_step": 584918, "epoch": 7047} {"train_loss": -27.365692138671875, "global_step": 584919, "epoch": 7047} {"train_loss": -27.61699867248535, "global_step": 584920, "epoch": 7047} {"train_loss": -27.66636085510254, "global_step": 584921, "epoch": 7047} {"train_loss": -27.3790340423584, "global_step": 584922, "epoch": 7047} {"train_loss": -28.003803253173828, "global_step": 584923, "epoch": 7047} {"train_loss": -27.9144287109375, "global_step": 584924, "epoch": 7047} {"train_loss": -27.739011764526367, "global_step": 584925, "epoch": 7047} {"train_loss": -27.8002872467041, "global_step": 584926, "epoch": 7047} {"train_loss": -27.534570693969727, "global_step": 584927, "epoch": 7047} {"train_loss": -27.78681755065918, "global_step": 584928, "epoch": 7047} {"train_loss": -27.77927589416504, "global_step": 584929, "epoch": 7047} {"train_loss": -28.184162139892578, "global_step": 584930, "epoch": 7047} {"train_loss": -28.04277992248535, "global_step": 584931, "epoch": 7047} {"train_loss": -27.884357452392578, "global_step": 584932, "epoch": 7047} {"train_loss": -27.917158126831055, "global_step": 584933, "epoch": 7047} {"train_loss": -27.8435115814209, "global_step": 584934, "epoch": 7047} {"train_loss": -27.900278091430664, "global_step": 584935, "epoch": 7047} {"train_loss": -27.760517120361328, "global_step": 584936, "epoch": 7047} {"train_loss": -28.297595977783203, "global_step": 584937, "epoch": 7047} {"train_loss": -27.945363998413086, "global_step": 584938, "epoch": 7047} {"train_loss": -27.66853141784668, "global_step": 584939, "epoch": 7047} {"train_loss": -27.79862403869629, "global_step": 584940, "epoch": 7047} {"train_loss": -28.158544540405273, "global_step": 584941, "epoch": 7047} {"train_loss": -27.984512329101562, "global_step": 584942, "epoch": 7047} {"train_loss": -27.758930206298828, "global_step": 584943, "epoch": 7047} {"train_loss": -28.028650283813477, "global_step": 584944, "epoch": 7047} {"train_loss": -27.890649795532227, "global_step": 584945, "epoch": 7047} {"train_loss": -28.441482543945312, "global_step": 584946, "epoch": 7047} {"train_loss": -28.2349910736084, "global_step": 584947, "epoch": 7047} {"train_loss": -27.8859806060791, "global_step": 584948, "epoch": 7047} {"train_loss": -27.8555850982666, "global_step": 584949, "epoch": 7047} {"train_loss": -27.937835693359375, "global_step": 584950, "epoch": 7047} {"train_loss": -27.913415908813477, "global_step": 584951, "epoch": 7047} {"train_loss": -27.924991607666016, "global_step": 584952, "epoch": 7047} {"train_loss": -27.89027214050293, "global_step": 584953, "epoch": 7047} {"train_loss": -28.203378677368164, "global_step": 584954, "epoch": 7047} {"train_loss": -27.6735897064209, "global_step": 584955, "epoch": 7047} {"train_loss": -28.243408203125, "global_step": 584956, "epoch": 7047} {"train_loss": -28.00562858581543, "global_step": 584957, "epoch": 7047} {"train_loss": -28.089130401611328, "global_step": 584958, "epoch": 7047} {"train_loss": -27.67038917541504, "global_step": 584959, "epoch": 7047} {"train_loss": -27.557004928588867, "global_step": 584960, "epoch": 7047} {"train_loss": -27.981821060180664, "global_step": 584961, "epoch": 7047} {"train_loss": -28.33173942565918, "global_step": 584962, "epoch": 7047} {"train_loss": -27.8944034576416, "global_step": 584963, "epoch": 7047} {"train_loss": -28.036550521850586, "global_step": 584964, "epoch": 7047} {"train_loss": -27.929601669311523, "global_step": 584965, "epoch": 7047} {"train_loss": -27.87885856628418, "global_step": 584966, "epoch": 7047} {"train_loss": -27.955835342407227, "global_step": 584967, "epoch": 7047} {"train_loss": -27.167438507080078, "global_step": 584968, "epoch": 7047} {"train_loss": -27.2806396484375, "global_step": 584969, "epoch": 7047} {"train_loss": -27.499897003173828, "global_step": 584970, "epoch": 7047} {"train_loss": -27.95844078063965, "global_step": 584971, "epoch": 7047} {"train_loss": -28.183637619018555, "global_step": 584972, "epoch": 7047} {"train_loss": -28.20237159729004, "global_step": 584973, "epoch": 7047} {"train_loss": -27.877044677734375, "global_step": 584974, "epoch": 7047} {"train_loss": -28.148212432861328, "global_step": 584975, "epoch": 7047} {"train_loss": -27.994094848632812, "global_step": 584976, "epoch": 7047} {"train_loss": -28.126935958862305, "global_step": 584977, "epoch": 7047} {"train_loss": -28.115591049194336, "global_step": 584978, "epoch": 7047} {"train_loss": -27.64814567565918, "global_step": 584979, "epoch": 7047} {"train_loss": -28.037994384765625, "global_step": 584980, "epoch": 7047} {"train_loss": -28.190458297729492, "global_step": 584981, "epoch": 7047} {"train_loss": -28.392114639282227, "global_step": 584982, "epoch": 7047} {"train_loss": -27.80982327748494, "global_step": 584983, "epoch": 7047, "val_loss": 6691356.0} {"train_loss": -27.690515518188477, "global_step": 584984, "epoch": 7048} {"train_loss": -27.748701095581055, "global_step": 584985, "epoch": 7048} {"train_loss": -27.3082275390625, "global_step": 584986, "epoch": 7048} {"train_loss": -27.548633575439453, "global_step": 584987, "epoch": 7048} {"train_loss": -27.568023681640625, "global_step": 584988, "epoch": 7048} {"train_loss": -27.425857543945312, "global_step": 584989, "epoch": 7048} {"train_loss": -27.287317276000977, "global_step": 584990, "epoch": 7048} {"train_loss": -27.42066764831543, "global_step": 584991, "epoch": 7048} {"train_loss": -27.265546798706055, "global_step": 584992, "epoch": 7048} {"train_loss": -27.950286865234375, "global_step": 584993, "epoch": 7048} {"train_loss": -27.774383544921875, "global_step": 584994, "epoch": 7048} {"train_loss": -27.639636993408203, "global_step": 584995, "epoch": 7048} {"train_loss": -27.480422973632812, "global_step": 584996, "epoch": 7048} {"train_loss": -28.038074493408203, "global_step": 584997, "epoch": 7048} {"train_loss": -27.794538497924805, "global_step": 584998, "epoch": 7048} {"train_loss": -27.76999855041504, "global_step": 584999, "epoch": 7048} {"train_loss": -28.263965606689453, "global_step": 585000, "epoch": 7048} {"train_loss": -27.952320098876953, "global_step": 585001, "epoch": 7048} {"train_loss": -28.183761596679688, "global_step": 585002, "epoch": 7048} {"train_loss": -27.8528995513916, "global_step": 585003, "epoch": 7048} {"train_loss": -27.9591007232666, "global_step": 585004, "epoch": 7048} {"train_loss": -27.69292640686035, "global_step": 585005, "epoch": 7048} {"train_loss": -28.316938400268555, "global_step": 585006, "epoch": 7048} {"train_loss": -28.06503677368164, "global_step": 585007, "epoch": 7048} {"train_loss": -27.929533004760742, "global_step": 585008, "epoch": 7048} {"train_loss": -28.002614974975586, "global_step": 585009, "epoch": 7048} {"train_loss": -27.745756149291992, "global_step": 585010, "epoch": 7048} {"train_loss": -28.156888961791992, "global_step": 585011, "epoch": 7048} {"train_loss": -27.93073081970215, "global_step": 585012, "epoch": 7048} {"train_loss": -27.98296546936035, "global_step": 585013, "epoch": 7048} {"train_loss": -28.093229293823242, "global_step": 585014, "epoch": 7048} {"train_loss": -27.932397842407227, "global_step": 585015, "epoch": 7048} {"train_loss": -27.86285400390625, "global_step": 585016, "epoch": 7048} {"train_loss": -28.1346435546875, "global_step": 585017, "epoch": 7048} {"train_loss": -28.009443283081055, "global_step": 585018, "epoch": 7048} {"train_loss": -28.139978408813477, "global_step": 585019, "epoch": 7048} {"train_loss": -28.16766357421875, "global_step": 585020, "epoch": 7048} {"train_loss": -27.911054611206055, "global_step": 585021, "epoch": 7048} {"train_loss": -27.964706420898438, "global_step": 585022, "epoch": 7048} {"train_loss": -28.07252311706543, "global_step": 585023, "epoch": 7048} {"train_loss": -27.937116622924805, "global_step": 585024, "epoch": 7048} {"train_loss": -28.46563148498535, "global_step": 585025, "epoch": 7048} {"train_loss": -28.171253204345703, "global_step": 585026, "epoch": 7048} {"train_loss": -28.139667510986328, "global_step": 585027, "epoch": 7048} {"train_loss": -28.125244140625, "global_step": 585028, "epoch": 7048} {"train_loss": -28.1347599029541, "global_step": 585029, "epoch": 7048} {"train_loss": -28.0677547454834, "global_step": 585030, "epoch": 7048} {"train_loss": -28.350055694580078, "global_step": 585031, "epoch": 7048} {"train_loss": -28.012969970703125, "global_step": 585032, "epoch": 7048} {"train_loss": -28.01859474182129, "global_step": 585033, "epoch": 7048} {"train_loss": -28.007871627807617, "global_step": 585034, "epoch": 7048} {"train_loss": -27.908483505249023, "global_step": 585035, "epoch": 7048} {"train_loss": -27.950973510742188, "global_step": 585036, "epoch": 7048} {"train_loss": -28.281665802001953, "global_step": 585037, "epoch": 7048} {"train_loss": -28.0345516204834, "global_step": 585038, "epoch": 7048} {"train_loss": -28.27057456970215, "global_step": 585039, "epoch": 7048} {"train_loss": -28.0960636138916, "global_step": 585040, "epoch": 7048} {"train_loss": -28.144006729125977, "global_step": 585041, "epoch": 7048} {"train_loss": -28.43592643737793, "global_step": 585042, "epoch": 7048} {"train_loss": -28.029254913330078, "global_step": 585043, "epoch": 7048} {"train_loss": -27.95163345336914, "global_step": 585044, "epoch": 7048} {"train_loss": -28.052398681640625, "global_step": 585045, "epoch": 7048} {"train_loss": -27.933048248291016, "global_step": 585046, "epoch": 7048} {"train_loss": -28.139867782592773, "global_step": 585047, "epoch": 7048} {"train_loss": -28.003131866455078, "global_step": 585048, "epoch": 7048} {"train_loss": -27.78265953063965, "global_step": 585049, "epoch": 7048} {"train_loss": -28.072961807250977, "global_step": 585050, "epoch": 7048} {"train_loss": -28.258752822875977, "global_step": 585051, "epoch": 7048} {"train_loss": -27.911645889282227, "global_step": 585052, "epoch": 7048} {"train_loss": -28.0836238861084, "global_step": 585053, "epoch": 7048} {"train_loss": -27.980005264282227, "global_step": 585054, "epoch": 7048} {"train_loss": -28.120275497436523, "global_step": 585055, "epoch": 7048} {"train_loss": -28.13819694519043, "global_step": 585056, "epoch": 7048} {"train_loss": -28.023090362548828, "global_step": 585057, "epoch": 7048} {"train_loss": -27.469074249267578, "global_step": 585058, "epoch": 7048} {"train_loss": -27.668928146362305, "global_step": 585059, "epoch": 7048} {"train_loss": -27.50034523010254, "global_step": 585060, "epoch": 7048} {"train_loss": -26.7795467376709, "global_step": 585061, "epoch": 7048} {"train_loss": -26.096967697143555, "global_step": 585062, "epoch": 7048} {"train_loss": -26.503173828125, "global_step": 585063, "epoch": 7048} {"train_loss": -27.20844841003418, "global_step": 585064, "epoch": 7048} {"train_loss": -27.74289894104004, "global_step": 585065, "epoch": 7048} {"train_loss": -27.882735447711255, "global_step": 585066, "epoch": 7048, "val_loss": 6697663.0} {"train_loss": -26.51938819885254, "global_step": 585067, "epoch": 7049} {"train_loss": -26.881372451782227, "global_step": 585068, "epoch": 7049} {"train_loss": -26.549835205078125, "global_step": 585069, "epoch": 7049} {"train_loss": -26.69544792175293, "global_step": 585070, "epoch": 7049} {"train_loss": -26.93658447265625, "global_step": 585071, "epoch": 7049} {"train_loss": -26.948755264282227, "global_step": 585072, "epoch": 7049} {"train_loss": -26.983484268188477, "global_step": 585073, "epoch": 7049} {"train_loss": -27.092041015625, "global_step": 585074, "epoch": 7049} {"train_loss": -26.995935440063477, "global_step": 585075, "epoch": 7049} {"train_loss": -27.271284103393555, "global_step": 585076, "epoch": 7049} {"train_loss": -27.094654083251953, "global_step": 585077, "epoch": 7049} {"train_loss": -26.983184814453125, "global_step": 585078, "epoch": 7049} {"train_loss": -26.979883193969727, "global_step": 585079, "epoch": 7049} {"train_loss": -27.47524070739746, "global_step": 585080, "epoch": 7049} {"train_loss": -27.16485023498535, "global_step": 585081, "epoch": 7049} {"train_loss": -27.41749382019043, "global_step": 585082, "epoch": 7049} {"train_loss": -27.49036979675293, "global_step": 585083, "epoch": 7049} {"train_loss": -27.553247451782227, "global_step": 585084, "epoch": 7049} {"train_loss": -27.785200119018555, "global_step": 585085, "epoch": 7049} {"train_loss": -27.8185977935791, "global_step": 585086, "epoch": 7049} {"train_loss": -27.32572364807129, "global_step": 585087, "epoch": 7049} {"train_loss": -27.606891632080078, "global_step": 585088, "epoch": 7049} {"train_loss": -27.501760482788086, "global_step": 585089, "epoch": 7049} {"train_loss": -27.82490348815918, "global_step": 585090, "epoch": 7049} {"train_loss": -27.474609375, "global_step": 585091, "epoch": 7049} {"train_loss": -27.46150779724121, "global_step": 585092, "epoch": 7049} {"train_loss": -27.71176528930664, "global_step": 585093, "epoch": 7049} {"train_loss": -27.75998878479004, "global_step": 585094, "epoch": 7049} {"train_loss": -27.6817684173584, "global_step": 585095, "epoch": 7049} {"train_loss": -27.91071891784668, "global_step": 585096, "epoch": 7049} {"train_loss": -27.869482040405273, "global_step": 585097, "epoch": 7049} {"train_loss": -27.993488311767578, "global_step": 585098, "epoch": 7049} {"train_loss": -27.79389762878418, "global_step": 585099, "epoch": 7049} {"train_loss": -27.869482040405273, "global_step": 585100, "epoch": 7049} {"train_loss": -27.700448989868164, "global_step": 585101, "epoch": 7049} {"train_loss": -27.859968185424805, "global_step": 585102, "epoch": 7049} {"train_loss": -27.737823486328125, "global_step": 585103, "epoch": 7049} {"train_loss": -28.05425453186035, "global_step": 585104, "epoch": 7049} {"train_loss": -28.08845329284668, "global_step": 585105, "epoch": 7049} {"train_loss": -28.215198516845703, "global_step": 585106, "epoch": 7049} {"train_loss": -28.443450927734375, "global_step": 585107, "epoch": 7049} {"train_loss": -27.8320255279541, "global_step": 585108, "epoch": 7049} {"train_loss": -27.945953369140625, "global_step": 585109, "epoch": 7049} {"train_loss": -27.824909210205078, "global_step": 585110, "epoch": 7049} {"train_loss": -28.16990089416504, "global_step": 585111, "epoch": 7049} {"train_loss": -28.25068473815918, "global_step": 585112, "epoch": 7049} {"train_loss": -27.944318771362305, "global_step": 585113, "epoch": 7049} {"train_loss": -28.187397003173828, "global_step": 585114, "epoch": 7049} {"train_loss": -27.944015502929688, "global_step": 585115, "epoch": 7049} {"train_loss": -28.442731857299805, "global_step": 585116, "epoch": 7049} {"train_loss": -28.044668197631836, "global_step": 585117, "epoch": 7049} {"train_loss": -28.27239418029785, "global_step": 585118, "epoch": 7049} {"train_loss": -27.967443466186523, "global_step": 585119, "epoch": 7049} {"train_loss": -27.681440353393555, "global_step": 585120, "epoch": 7049} {"train_loss": -28.071521759033203, "global_step": 585121, "epoch": 7049} {"train_loss": -27.424558639526367, "global_step": 585122, "epoch": 7049} {"train_loss": -26.937788009643555, "global_step": 585123, "epoch": 7049} {"train_loss": -27.63665771484375, "global_step": 585124, "epoch": 7049} {"train_loss": -27.7069149017334, "global_step": 585125, "epoch": 7049} {"train_loss": -27.476423263549805, "global_step": 585126, "epoch": 7049} {"train_loss": -27.791797637939453, "global_step": 585127, "epoch": 7049} {"train_loss": -28.007373809814453, "global_step": 585128, "epoch": 7049} {"train_loss": -27.860980987548828, "global_step": 585129, "epoch": 7049} {"train_loss": -27.951324462890625, "global_step": 585130, "epoch": 7049} {"train_loss": -27.697219848632812, "global_step": 585131, "epoch": 7049} {"train_loss": -28.336301803588867, "global_step": 585132, "epoch": 7049} {"train_loss": -27.65900230407715, "global_step": 585133, "epoch": 7049} {"train_loss": -27.94281578063965, "global_step": 585134, "epoch": 7049} {"train_loss": -27.395416259765625, "global_step": 585135, "epoch": 7049} {"train_loss": -27.541553497314453, "global_step": 585136, "epoch": 7049} {"train_loss": -27.870203018188477, "global_step": 585137, "epoch": 7049} {"train_loss": -27.91379737854004, "global_step": 585138, "epoch": 7049} {"train_loss": -28.084491729736328, "global_step": 585139, "epoch": 7049} {"train_loss": -28.188003540039062, "global_step": 585140, "epoch": 7049} {"train_loss": -27.62470817565918, "global_step": 585141, "epoch": 7049} {"train_loss": -27.78932762145996, "global_step": 585142, "epoch": 7049} {"train_loss": -28.244863510131836, "global_step": 585143, "epoch": 7049} {"train_loss": -28.142194747924805, "global_step": 585144, "epoch": 7049} {"train_loss": -28.413105010986328, "global_step": 585145, "epoch": 7049} {"train_loss": -28.110107421875, "global_step": 585146, "epoch": 7049} {"train_loss": -27.61098289489746, "global_step": 585147, "epoch": 7049} {"train_loss": -27.93202018737793, "global_step": 585148, "epoch": 7049} {"train_loss": -27.67542282931776, "global_step": 585149, "epoch": 7049, "val_loss": 6576014.0} {"train_loss": -27.533050537109375, "global_step": 585150, "epoch": 7050} {"train_loss": -26.993961334228516, "global_step": 585151, "epoch": 7050} {"train_loss": -27.56353759765625, "global_step": 585152, "epoch": 7050} {"train_loss": -27.29231071472168, "global_step": 585153, "epoch": 7050} {"train_loss": -27.635452270507812, "global_step": 585154, "epoch": 7050} {"train_loss": -27.19317626953125, "global_step": 585155, "epoch": 7050} {"train_loss": -27.059528350830078, "global_step": 585156, "epoch": 7050} {"train_loss": -27.2698974609375, "global_step": 585157, "epoch": 7050} {"train_loss": -27.750329971313477, "global_step": 585158, "epoch": 7050} {"train_loss": -27.309329986572266, "global_step": 585159, "epoch": 7050} {"train_loss": -27.61202049255371, "global_step": 585160, "epoch": 7050} {"train_loss": -27.563467025756836, "global_step": 585161, "epoch": 7050} {"train_loss": -27.4880428314209, "global_step": 585162, "epoch": 7050} {"train_loss": -27.620031356811523, "global_step": 585163, "epoch": 7050} {"train_loss": -27.71625328063965, "global_step": 585164, "epoch": 7050} {"train_loss": -27.834320068359375, "global_step": 585165, "epoch": 7050} {"train_loss": -27.817214965820312, "global_step": 585166, "epoch": 7050} {"train_loss": -27.697113037109375, "global_step": 585167, "epoch": 7050} {"train_loss": -27.617246627807617, "global_step": 585168, "epoch": 7050} {"train_loss": -27.697622299194336, "global_step": 585169, "epoch": 7050} {"train_loss": -27.600671768188477, "global_step": 585170, "epoch": 7050} {"train_loss": -27.661279678344727, "global_step": 585171, "epoch": 7050} {"train_loss": -27.453205108642578, "global_step": 585172, "epoch": 7050} {"train_loss": -27.673364639282227, "global_step": 585173, "epoch": 7050} {"train_loss": -27.636579513549805, "global_step": 585174, "epoch": 7050} {"train_loss": -27.952280044555664, "global_step": 585175, "epoch": 7050} {"train_loss": -28.155832290649414, "global_step": 585176, "epoch": 7050} {"train_loss": -28.175430297851562, "global_step": 585177, "epoch": 7050} {"train_loss": -27.945470809936523, "global_step": 585178, "epoch": 7050} {"train_loss": -27.825424194335938, "global_step": 585179, "epoch": 7050} {"train_loss": -27.611515045166016, "global_step": 585180, "epoch": 7050} {"train_loss": -28.13210105895996, "global_step": 585181, "epoch": 7050} {"train_loss": -28.29253578186035, "global_step": 585182, "epoch": 7050} {"train_loss": -27.868139266967773, "global_step": 585183, "epoch": 7050} {"train_loss": -28.05527114868164, "global_step": 585184, "epoch": 7050} {"train_loss": -28.2994384765625, "global_step": 585185, "epoch": 7050} {"train_loss": -28.400436401367188, "global_step": 585186, "epoch": 7050} {"train_loss": -28.16060447692871, "global_step": 585187, "epoch": 7050} {"train_loss": -28.227920532226562, "global_step": 585188, "epoch": 7050} {"train_loss": -28.403339385986328, "global_step": 585189, "epoch": 7050} {"train_loss": -28.33391761779785, "global_step": 585190, "epoch": 7050} {"train_loss": -28.26247215270996, "global_step": 585191, "epoch": 7050} {"train_loss": -27.73451042175293, "global_step": 585192, "epoch": 7050} {"train_loss": -28.2352352142334, "global_step": 585193, "epoch": 7050} {"train_loss": -27.839324951171875, "global_step": 585194, "epoch": 7050} {"train_loss": -27.763568878173828, "global_step": 585195, "epoch": 7050} {"train_loss": -27.246734619140625, "global_step": 585196, "epoch": 7050} {"train_loss": -27.321943283081055, "global_step": 585197, "epoch": 7050} {"train_loss": -27.629499435424805, "global_step": 585198, "epoch": 7050} {"train_loss": -28.090356826782227, "global_step": 585199, "epoch": 7050} {"train_loss": -27.74072265625, "global_step": 585200, "epoch": 7050} {"train_loss": -27.52351951599121, "global_step": 585201, "epoch": 7050} {"train_loss": -27.703567504882812, "global_step": 585202, "epoch": 7050} {"train_loss": -27.932010650634766, "global_step": 585203, "epoch": 7050} {"train_loss": -27.730777740478516, "global_step": 585204, "epoch": 7050} {"train_loss": -27.808340072631836, "global_step": 585205, "epoch": 7050} {"train_loss": -28.062841415405273, "global_step": 585206, "epoch": 7050} {"train_loss": -27.77052116394043, "global_step": 585207, "epoch": 7050} {"train_loss": -27.74233055114746, "global_step": 585208, "epoch": 7050} {"train_loss": -27.812549591064453, "global_step": 585209, "epoch": 7050} {"train_loss": -27.827890396118164, "global_step": 585210, "epoch": 7050} {"train_loss": -27.939544677734375, "global_step": 585211, "epoch": 7050} {"train_loss": -27.87135887145996, "global_step": 585212, "epoch": 7050} {"train_loss": -28.00314712524414, "global_step": 585213, "epoch": 7050} {"train_loss": -27.52018165588379, "global_step": 585214, "epoch": 7050} {"train_loss": -27.771345138549805, "global_step": 585215, "epoch": 7050} {"train_loss": -27.71588134765625, "global_step": 585216, "epoch": 7050} {"train_loss": -27.92500114440918, "global_step": 585217, "epoch": 7050} {"train_loss": -28.135162353515625, "global_step": 585218, "epoch": 7050} {"train_loss": -28.18861198425293, "global_step": 585219, "epoch": 7050} {"train_loss": -28.072172164916992, "global_step": 585220, "epoch": 7050} {"train_loss": -28.544713973999023, "global_step": 585221, "epoch": 7050} {"train_loss": -28.054229736328125, "global_step": 585222, "epoch": 7050} {"train_loss": -28.02277946472168, "global_step": 585223, "epoch": 7050} {"train_loss": -27.924976348876953, "global_step": 585224, "epoch": 7050} {"train_loss": -27.97467041015625, "global_step": 585225, "epoch": 7050} {"train_loss": -28.166120529174805, "global_step": 585226, "epoch": 7050} {"train_loss": -28.26661491394043, "global_step": 585227, "epoch": 7050} {"train_loss": -28.122516632080078, "global_step": 585228, "epoch": 7050} {"train_loss": -28.240741729736328, "global_step": 585229, "epoch": 7050} {"train_loss": -28.511032104492188, "global_step": 585230, "epoch": 7050} {"train_loss": -28.509389877319336, "global_step": 585231, "epoch": 7050} {"train_loss": -27.85818706650332, "global_step": 585232, "epoch": 7050, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9090909090909091, "val_loss": 6593809.0} {"train_loss": -27.666458129882812, "global_step": 585233, "epoch": 7051} {"train_loss": -27.24664306640625, "global_step": 585234, "epoch": 7051} {"train_loss": -27.571828842163086, "global_step": 585235, "epoch": 7051} {"train_loss": -27.19768714904785, "global_step": 585236, "epoch": 7051} {"train_loss": -27.17789077758789, "global_step": 585237, "epoch": 7051} {"train_loss": -27.40412712097168, "global_step": 585238, "epoch": 7051} {"train_loss": -27.290021896362305, "global_step": 585239, "epoch": 7051} {"train_loss": -27.25925064086914, "global_step": 585240, "epoch": 7051} {"train_loss": -26.853321075439453, "global_step": 585241, "epoch": 7051} {"train_loss": -27.156402587890625, "global_step": 585242, "epoch": 7051} {"train_loss": -27.55950355529785, "global_step": 585243, "epoch": 7051} {"train_loss": -28.09259033203125, "global_step": 585244, "epoch": 7051} {"train_loss": -27.48573112487793, "global_step": 585245, "epoch": 7051} {"train_loss": -28.151636123657227, "global_step": 585246, "epoch": 7051} {"train_loss": -27.451745986938477, "global_step": 585247, "epoch": 7051} {"train_loss": -27.589908599853516, "global_step": 585248, "epoch": 7051} {"train_loss": -27.5155029296875, "global_step": 585249, "epoch": 7051} {"train_loss": -27.75408935546875, "global_step": 585250, "epoch": 7051} {"train_loss": -27.78303337097168, "global_step": 585251, "epoch": 7051} {"train_loss": -27.8145809173584, "global_step": 585252, "epoch": 7051} {"train_loss": -28.1147403717041, "global_step": 585253, "epoch": 7051} {"train_loss": -28.056867599487305, "global_step": 585254, "epoch": 7051} {"train_loss": -27.894620895385742, "global_step": 585255, "epoch": 7051} {"train_loss": -27.900861740112305, "global_step": 585256, "epoch": 7051} {"train_loss": -28.255624771118164, "global_step": 585257, "epoch": 7051} {"train_loss": -28.026214599609375, "global_step": 585258, "epoch": 7051} {"train_loss": -28.039447784423828, "global_step": 585259, "epoch": 7051} {"train_loss": -28.008024215698242, "global_step": 585260, "epoch": 7051} {"train_loss": -28.241443634033203, "global_step": 585261, "epoch": 7051} {"train_loss": -27.84406089782715, "global_step": 585262, "epoch": 7051} {"train_loss": -27.962228775024414, "global_step": 585263, "epoch": 7051} {"train_loss": -27.92470359802246, "global_step": 585264, "epoch": 7051} {"train_loss": -27.729450225830078, "global_step": 585265, "epoch": 7051} {"train_loss": -28.1672420501709, "global_step": 585266, "epoch": 7051} {"train_loss": -28.079626083374023, "global_step": 585267, "epoch": 7051} {"train_loss": -28.56251335144043, "global_step": 585268, "epoch": 7051} {"train_loss": -28.2794246673584, "global_step": 585269, "epoch": 7051} {"train_loss": -28.04498291015625, "global_step": 585270, "epoch": 7051} {"train_loss": -27.943185806274414, "global_step": 585271, "epoch": 7051} {"train_loss": -27.779123306274414, "global_step": 585272, "epoch": 7051} {"train_loss": -28.347131729125977, "global_step": 585273, "epoch": 7051} {"train_loss": -28.115015029907227, "global_step": 585274, "epoch": 7051} {"train_loss": -28.429468154907227, "global_step": 585275, "epoch": 7051} {"train_loss": -27.896390914916992, "global_step": 585276, "epoch": 7051} {"train_loss": -27.82541275024414, "global_step": 585277, "epoch": 7051} {"train_loss": -27.918638229370117, "global_step": 585278, "epoch": 7051} {"train_loss": -28.5050048828125, "global_step": 585279, "epoch": 7051} {"train_loss": -28.043725967407227, "global_step": 585280, "epoch": 7051} {"train_loss": -27.54339599609375, "global_step": 585281, "epoch": 7051} {"train_loss": -28.05763053894043, "global_step": 585282, "epoch": 7051} {"train_loss": -27.789905548095703, "global_step": 585283, "epoch": 7051} {"train_loss": -27.795654296875, "global_step": 585284, "epoch": 7051} {"train_loss": -27.950305938720703, "global_step": 585285, "epoch": 7051} {"train_loss": -28.22233009338379, "global_step": 585286, "epoch": 7051} {"train_loss": -28.020267486572266, "global_step": 585287, "epoch": 7051} {"train_loss": -28.327713012695312, "global_step": 585288, "epoch": 7051} {"train_loss": -28.1354923248291, "global_step": 585289, "epoch": 7051} {"train_loss": -27.967792510986328, "global_step": 585290, "epoch": 7051} {"train_loss": -27.968732833862305, "global_step": 585291, "epoch": 7051} {"train_loss": -27.9616756439209, "global_step": 585292, "epoch": 7051} {"train_loss": -28.033023834228516, "global_step": 585293, "epoch": 7051} {"train_loss": -28.366912841796875, "global_step": 585294, "epoch": 7051} {"train_loss": -27.916461944580078, "global_step": 585295, "epoch": 7051} {"train_loss": -27.843154907226562, "global_step": 585296, "epoch": 7051} {"train_loss": -27.962860107421875, "global_step": 585297, "epoch": 7051} {"train_loss": -28.16768455505371, "global_step": 585298, "epoch": 7051} {"train_loss": -28.0234375, "global_step": 585299, "epoch": 7051} {"train_loss": -28.38132667541504, "global_step": 585300, "epoch": 7051} {"train_loss": -27.848957061767578, "global_step": 585301, "epoch": 7051} {"train_loss": -27.87575340270996, "global_step": 585302, "epoch": 7051} {"train_loss": -27.80350685119629, "global_step": 585303, "epoch": 7051} {"train_loss": -28.19272232055664, "global_step": 585304, "epoch": 7051} {"train_loss": -27.9905948638916, "global_step": 585305, "epoch": 7051} {"train_loss": -27.553985595703125, "global_step": 585306, "epoch": 7051} {"train_loss": -27.036407470703125, "global_step": 585307, "epoch": 7051} {"train_loss": -26.697446823120117, "global_step": 585308, "epoch": 7051} {"train_loss": -27.453161239624023, "global_step": 585309, "epoch": 7051} {"train_loss": -27.975202560424805, "global_step": 585310, "epoch": 7051} {"train_loss": -26.558673858642578, "global_step": 585311, "epoch": 7051} {"train_loss": -26.425806045532227, "global_step": 585312, "epoch": 7051} {"train_loss": -27.623611450195312, "global_step": 585313, "epoch": 7051} {"train_loss": -27.2994384765625, "global_step": 585314, "epoch": 7051} {"train_loss": -27.80485805833196, "global_step": 585315, "epoch": 7051, "val_loss": 6599592.0} {"train_loss": -26.267648696899414, "global_step": 585316, "epoch": 7052} {"train_loss": -27.423925399780273, "global_step": 585317, "epoch": 7052} {"train_loss": -26.499197006225586, "global_step": 585318, "epoch": 7052} {"train_loss": -27.387365341186523, "global_step": 585319, "epoch": 7052} {"train_loss": -26.61849021911621, "global_step": 585320, "epoch": 7052} {"train_loss": -26.641504287719727, "global_step": 585321, "epoch": 7052} {"train_loss": -27.432355880737305, "global_step": 585322, "epoch": 7052} {"train_loss": -27.179920196533203, "global_step": 585323, "epoch": 7052} {"train_loss": -26.977691650390625, "global_step": 585324, "epoch": 7052} {"train_loss": -27.419570922851562, "global_step": 585325, "epoch": 7052} {"train_loss": -27.554224014282227, "global_step": 585326, "epoch": 7052} {"train_loss": -27.447479248046875, "global_step": 585327, "epoch": 7052} {"train_loss": -27.254169464111328, "global_step": 585328, "epoch": 7052} {"train_loss": -27.182952880859375, "global_step": 585329, "epoch": 7052} {"train_loss": -27.364704132080078, "global_step": 585330, "epoch": 7052} {"train_loss": -27.071125030517578, "global_step": 585331, "epoch": 7052} {"train_loss": -27.415802001953125, "global_step": 585332, "epoch": 7052} {"train_loss": -26.901203155517578, "global_step": 585333, "epoch": 7052} {"train_loss": -27.54352378845215, "global_step": 585334, "epoch": 7052} {"train_loss": -27.647302627563477, "global_step": 585335, "epoch": 7052} {"train_loss": -27.537580490112305, "global_step": 585336, "epoch": 7052} {"train_loss": -28.003381729125977, "global_step": 585337, "epoch": 7052} {"train_loss": -27.58770179748535, "global_step": 585338, "epoch": 7052} {"train_loss": -27.775114059448242, "global_step": 585339, "epoch": 7052} {"train_loss": -27.748798370361328, "global_step": 585340, "epoch": 7052} {"train_loss": -27.908384323120117, "global_step": 585341, "epoch": 7052} {"train_loss": -27.44207763671875, "global_step": 585342, "epoch": 7052} {"train_loss": -27.73841667175293, "global_step": 585343, "epoch": 7052} {"train_loss": -27.83735466003418, "global_step": 585344, "epoch": 7052} {"train_loss": -28.1777286529541, "global_step": 585345, "epoch": 7052} {"train_loss": -27.984689712524414, "global_step": 585346, "epoch": 7052} {"train_loss": -27.900522232055664, "global_step": 585347, "epoch": 7052} {"train_loss": -28.07960319519043, "global_step": 585348, "epoch": 7052} {"train_loss": -27.77400779724121, "global_step": 585349, "epoch": 7052} {"train_loss": -27.702375411987305, "global_step": 585350, "epoch": 7052} {"train_loss": -27.859228134155273, "global_step": 585351, "epoch": 7052} {"train_loss": -27.822553634643555, "global_step": 585352, "epoch": 7052} {"train_loss": -28.206708908081055, "global_step": 585353, "epoch": 7052} {"train_loss": -27.729827880859375, "global_step": 585354, "epoch": 7052} {"train_loss": -28.03742027282715, "global_step": 585355, "epoch": 7052} {"train_loss": -28.184656143188477, "global_step": 585356, "epoch": 7052} {"train_loss": -27.978490829467773, "global_step": 585357, "epoch": 7052} {"train_loss": -28.12531852722168, "global_step": 585358, "epoch": 7052} {"train_loss": -28.388259887695312, "global_step": 585359, "epoch": 7052} {"train_loss": -28.078474044799805, "global_step": 585360, "epoch": 7052} {"train_loss": -27.895612716674805, "global_step": 585361, "epoch": 7052} {"train_loss": -27.64959144592285, "global_step": 585362, "epoch": 7052} {"train_loss": -27.8459529876709, "global_step": 585363, "epoch": 7052} {"train_loss": -28.052291870117188, "global_step": 585364, "epoch": 7052} {"train_loss": -27.7174129486084, "global_step": 585365, "epoch": 7052} {"train_loss": -28.15838623046875, "global_step": 585366, "epoch": 7052} {"train_loss": -27.70700454711914, "global_step": 585367, "epoch": 7052} {"train_loss": -28.039541244506836, "global_step": 585368, "epoch": 7052} {"train_loss": -28.137359619140625, "global_step": 585369, "epoch": 7052} {"train_loss": -28.004047393798828, "global_step": 585370, "epoch": 7052} {"train_loss": -28.075016021728516, "global_step": 585371, "epoch": 7052} {"train_loss": -28.125158309936523, "global_step": 585372, "epoch": 7052} {"train_loss": -28.10515785217285, "global_step": 585373, "epoch": 7052} {"train_loss": -27.943897247314453, "global_step": 585374, "epoch": 7052} {"train_loss": -28.192829132080078, "global_step": 585375, "epoch": 7052} {"train_loss": -28.411645889282227, "global_step": 585376, "epoch": 7052} {"train_loss": -28.168842315673828, "global_step": 585377, "epoch": 7052} {"train_loss": -27.74716567993164, "global_step": 585378, "epoch": 7052} {"train_loss": -28.334308624267578, "global_step": 585379, "epoch": 7052} {"train_loss": -28.337085723876953, "global_step": 585380, "epoch": 7052} {"train_loss": -28.551166534423828, "global_step": 585381, "epoch": 7052} {"train_loss": -28.285297393798828, "global_step": 585382, "epoch": 7052} {"train_loss": -28.239591598510742, "global_step": 585383, "epoch": 7052} {"train_loss": -28.30549430847168, "global_step": 585384, "epoch": 7052} {"train_loss": -28.009061813354492, "global_step": 585385, "epoch": 7052} {"train_loss": -28.043684005737305, "global_step": 585386, "epoch": 7052} {"train_loss": -28.383392333984375, "global_step": 585387, "epoch": 7052} {"train_loss": -27.750104904174805, "global_step": 585388, "epoch": 7052} {"train_loss": -27.778226852416992, "global_step": 585389, "epoch": 7052} {"train_loss": -27.843469619750977, "global_step": 585390, "epoch": 7052} {"train_loss": -27.9814510345459, "global_step": 585391, "epoch": 7052} {"train_loss": -27.822412490844727, "global_step": 585392, "epoch": 7052} {"train_loss": -27.415054321289062, "global_step": 585393, "epoch": 7052} {"train_loss": -26.64190101623535, "global_step": 585394, "epoch": 7052} {"train_loss": -26.872119903564453, "global_step": 585395, "epoch": 7052} {"train_loss": -26.845361709594727, "global_step": 585396, "epoch": 7052} {"train_loss": -27.03285026550293, "global_step": 585397, "epoch": 7052} {"train_loss": -27.724495255803486, "global_step": 585398, "epoch": 7052, "val_loss": 6592968.0} {"train_loss": -25.349430084228516, "global_step": 585399, "epoch": 7053} {"train_loss": -26.377145767211914, "global_step": 585400, "epoch": 7053} {"train_loss": -25.665441513061523, "global_step": 585401, "epoch": 7053} {"train_loss": -25.21140480041504, "global_step": 585402, "epoch": 7053} {"train_loss": -26.2209415435791, "global_step": 585403, "epoch": 7053} {"train_loss": -26.56743812561035, "global_step": 585404, "epoch": 7053} {"train_loss": -26.388341903686523, "global_step": 585405, "epoch": 7053} {"train_loss": -26.98847007751465, "global_step": 585406, "epoch": 7053} {"train_loss": -26.495344161987305, "global_step": 585407, "epoch": 7053} {"train_loss": -26.619876861572266, "global_step": 585408, "epoch": 7053} {"train_loss": -26.893362045288086, "global_step": 585409, "epoch": 7053} {"train_loss": -26.471637725830078, "global_step": 585410, "epoch": 7053} {"train_loss": -26.861173629760742, "global_step": 585411, "epoch": 7053} {"train_loss": -26.891698837280273, "global_step": 585412, "epoch": 7053} {"train_loss": -26.552108764648438, "global_step": 585413, "epoch": 7053} {"train_loss": -26.987350463867188, "global_step": 585414, "epoch": 7053} {"train_loss": -27.063932418823242, "global_step": 585415, "epoch": 7053} {"train_loss": -26.8630313873291, "global_step": 585416, "epoch": 7053} {"train_loss": -26.80781364440918, "global_step": 585417, "epoch": 7053} {"train_loss": -27.3455867767334, "global_step": 585418, "epoch": 7053} {"train_loss": -27.054182052612305, "global_step": 585419, "epoch": 7053} {"train_loss": -26.93366813659668, "global_step": 585420, "epoch": 7053} {"train_loss": -27.309406280517578, "global_step": 585421, "epoch": 7053} {"train_loss": -27.268848419189453, "global_step": 585422, "epoch": 7053} {"train_loss": -27.322067260742188, "global_step": 585423, "epoch": 7053} {"train_loss": -27.328195571899414, "global_step": 585424, "epoch": 7053} {"train_loss": -27.255817413330078, "global_step": 585425, "epoch": 7053} {"train_loss": -27.4272518157959, "global_step": 585426, "epoch": 7053} {"train_loss": -27.262897491455078, "global_step": 585427, "epoch": 7053} {"train_loss": -27.671247482299805, "global_step": 585428, "epoch": 7053} {"train_loss": -27.29193687438965, "global_step": 585429, "epoch": 7053} {"train_loss": -27.56800651550293, "global_step": 585430, "epoch": 7053} {"train_loss": -27.3326358795166, "global_step": 585431, "epoch": 7053} {"train_loss": -27.717193603515625, "global_step": 585432, "epoch": 7053} {"train_loss": -27.973901748657227, "global_step": 585433, "epoch": 7053} {"train_loss": -27.958389282226562, "global_step": 585434, "epoch": 7053} {"train_loss": -27.489362716674805, "global_step": 585435, "epoch": 7053} {"train_loss": -27.62900733947754, "global_step": 585436, "epoch": 7053} {"train_loss": -27.817716598510742, "global_step": 585437, "epoch": 7053} {"train_loss": -27.87543296813965, "global_step": 585438, "epoch": 7053} {"train_loss": -27.627683639526367, "global_step": 585439, "epoch": 7053} {"train_loss": -28.0697021484375, "global_step": 585440, "epoch": 7053} {"train_loss": -27.895294189453125, "global_step": 585441, "epoch": 7053} {"train_loss": -28.021411895751953, "global_step": 585442, "epoch": 7053} {"train_loss": -27.72279930114746, "global_step": 585443, "epoch": 7053} {"train_loss": -28.03940200805664, "global_step": 585444, "epoch": 7053} {"train_loss": -27.7393798828125, "global_step": 585445, "epoch": 7053} {"train_loss": -27.801061630249023, "global_step": 585446, "epoch": 7053} {"train_loss": -27.828134536743164, "global_step": 585447, "epoch": 7053} {"train_loss": -28.311960220336914, "global_step": 585448, "epoch": 7053} {"train_loss": -28.127546310424805, "global_step": 585449, "epoch": 7053} {"train_loss": -27.99066734313965, "global_step": 585450, "epoch": 7053} {"train_loss": -27.845239639282227, "global_step": 585451, "epoch": 7053} {"train_loss": -28.3837947845459, "global_step": 585452, "epoch": 7053} {"train_loss": -28.417999267578125, "global_step": 585453, "epoch": 7053} {"train_loss": -28.069177627563477, "global_step": 585454, "epoch": 7053} {"train_loss": -28.170629501342773, "global_step": 585455, "epoch": 7053} {"train_loss": -28.0720157623291, "global_step": 585456, "epoch": 7053} {"train_loss": -28.02294921875, "global_step": 585457, "epoch": 7053} {"train_loss": -28.07075309753418, "global_step": 585458, "epoch": 7053} {"train_loss": -27.979461669921875, "global_step": 585459, "epoch": 7053} {"train_loss": -28.279367446899414, "global_step": 585460, "epoch": 7053} {"train_loss": -27.884368896484375, "global_step": 585461, "epoch": 7053} {"train_loss": -28.152210235595703, "global_step": 585462, "epoch": 7053} {"train_loss": -28.15974235534668, "global_step": 585463, "epoch": 7053} {"train_loss": -27.88465690612793, "global_step": 585464, "epoch": 7053} {"train_loss": -27.903778076171875, "global_step": 585465, "epoch": 7053} {"train_loss": -28.118350982666016, "global_step": 585466, "epoch": 7053} {"train_loss": -27.937597274780273, "global_step": 585467, "epoch": 7053} {"train_loss": -28.05836296081543, "global_step": 585468, "epoch": 7053} {"train_loss": -28.32279396057129, "global_step": 585469, "epoch": 7053} {"train_loss": -28.08088493347168, "global_step": 585470, "epoch": 7053} {"train_loss": -28.1469783782959, "global_step": 585471, "epoch": 7053} {"train_loss": -28.337568283081055, "global_step": 585472, "epoch": 7053} {"train_loss": -27.92820167541504, "global_step": 585473, "epoch": 7053} {"train_loss": -28.478300094604492, "global_step": 585474, "epoch": 7053} {"train_loss": -28.353254318237305, "global_step": 585475, "epoch": 7053} {"train_loss": -28.195636749267578, "global_step": 585476, "epoch": 7053} {"train_loss": -28.16633415222168, "global_step": 585477, "epoch": 7053} {"train_loss": -28.0789794921875, "global_step": 585478, "epoch": 7053} {"train_loss": -27.900129318237305, "global_step": 585479, "epoch": 7053} {"train_loss": -27.79694175720215, "global_step": 585480, "epoch": 7053} {"train_loss": -27.532808993236127, "global_step": 585481, "epoch": 7053, "val_loss": 6556159.0} {"train_loss": -27.542621612548828, "global_step": 585482, "epoch": 7054} {"train_loss": -26.951887130737305, "global_step": 585483, "epoch": 7054} {"train_loss": -27.610868453979492, "global_step": 585484, "epoch": 7054} {"train_loss": -27.123754501342773, "global_step": 585485, "epoch": 7054} {"train_loss": -26.72649574279785, "global_step": 585486, "epoch": 7054} {"train_loss": -27.503286361694336, "global_step": 585487, "epoch": 7054} {"train_loss": -27.395587921142578, "global_step": 585488, "epoch": 7054} {"train_loss": -27.11456871032715, "global_step": 585489, "epoch": 7054} {"train_loss": -27.160327911376953, "global_step": 585490, "epoch": 7054} {"train_loss": -27.383121490478516, "global_step": 585491, "epoch": 7054} {"train_loss": -27.11005210876465, "global_step": 585492, "epoch": 7054} {"train_loss": -27.1029052734375, "global_step": 585493, "epoch": 7054} {"train_loss": -27.498926162719727, "global_step": 585494, "epoch": 7054} {"train_loss": -27.280654907226562, "global_step": 585495, "epoch": 7054} {"train_loss": -27.59784507751465, "global_step": 585496, "epoch": 7054} {"train_loss": -27.59303092956543, "global_step": 585497, "epoch": 7054} {"train_loss": -27.3670597076416, "global_step": 585498, "epoch": 7054} {"train_loss": -27.89472007751465, "global_step": 585499, "epoch": 7054} {"train_loss": -27.529438018798828, "global_step": 585500, "epoch": 7054} {"train_loss": -27.630056381225586, "global_step": 585501, "epoch": 7054} {"train_loss": -27.72487449645996, "global_step": 585502, "epoch": 7054} {"train_loss": -27.8568172454834, "global_step": 585503, "epoch": 7054} {"train_loss": -27.90693473815918, "global_step": 585504, "epoch": 7054} {"train_loss": -27.617284774780273, "global_step": 585505, "epoch": 7054} {"train_loss": -27.534290313720703, "global_step": 585506, "epoch": 7054} {"train_loss": -27.60369300842285, "global_step": 585507, "epoch": 7054} {"train_loss": -27.72991943359375, "global_step": 585508, "epoch": 7054} {"train_loss": -27.770660400390625, "global_step": 585509, "epoch": 7054} {"train_loss": -28.147022247314453, "global_step": 585510, "epoch": 7054} {"train_loss": -27.80865478515625, "global_step": 585511, "epoch": 7054} {"train_loss": -27.66912841796875, "global_step": 585512, "epoch": 7054} {"train_loss": -28.0069637298584, "global_step": 585513, "epoch": 7054} {"train_loss": -27.9014949798584, "global_step": 585514, "epoch": 7054} {"train_loss": -28.14306640625, "global_step": 585515, "epoch": 7054} {"train_loss": -28.021106719970703, "global_step": 585516, "epoch": 7054} {"train_loss": -27.835912704467773, "global_step": 585517, "epoch": 7054} {"train_loss": -27.796661376953125, "global_step": 585518, "epoch": 7054} {"train_loss": -28.28704833984375, "global_step": 585519, "epoch": 7054} {"train_loss": -28.01582908630371, "global_step": 585520, "epoch": 7054} {"train_loss": -28.121784210205078, "global_step": 585521, "epoch": 7054} {"train_loss": -28.283628463745117, "global_step": 585522, "epoch": 7054} {"train_loss": -28.3161563873291, "global_step": 585523, "epoch": 7054} {"train_loss": -27.906824111938477, "global_step": 585524, "epoch": 7054} {"train_loss": -27.98882484436035, "global_step": 585525, "epoch": 7054} {"train_loss": -28.28827476501465, "global_step": 585526, "epoch": 7054} {"train_loss": -27.94032096862793, "global_step": 585527, "epoch": 7054} {"train_loss": -28.089696884155273, "global_step": 585528, "epoch": 7054} {"train_loss": -27.892541885375977, "global_step": 585529, "epoch": 7054} {"train_loss": -28.190114974975586, "global_step": 585530, "epoch": 7054} {"train_loss": -27.962326049804688, "global_step": 585531, "epoch": 7054} {"train_loss": -28.395612716674805, "global_step": 585532, "epoch": 7054} {"train_loss": -28.10030174255371, "global_step": 585533, "epoch": 7054} {"train_loss": -28.118377685546875, "global_step": 585534, "epoch": 7054} {"train_loss": -28.30266761779785, "global_step": 585535, "epoch": 7054} {"train_loss": -28.257476806640625, "global_step": 585536, "epoch": 7054} {"train_loss": -27.807056427001953, "global_step": 585537, "epoch": 7054} {"train_loss": -27.358280181884766, "global_step": 585538, "epoch": 7054} {"train_loss": -26.8415470123291, "global_step": 585539, "epoch": 7054} {"train_loss": -27.137619018554688, "global_step": 585540, "epoch": 7054} {"train_loss": -28.267749786376953, "global_step": 585541, "epoch": 7054} {"train_loss": -27.445194244384766, "global_step": 585542, "epoch": 7054} {"train_loss": -27.223922729492188, "global_step": 585543, "epoch": 7054} {"train_loss": -26.81209373474121, "global_step": 585544, "epoch": 7054} {"train_loss": -27.123611450195312, "global_step": 585545, "epoch": 7054} {"train_loss": -27.78773307800293, "global_step": 585546, "epoch": 7054} {"train_loss": -27.61214256286621, "global_step": 585547, "epoch": 7054} {"train_loss": -27.144397735595703, "global_step": 585548, "epoch": 7054} {"train_loss": -27.33854103088379, "global_step": 585549, "epoch": 7054} {"train_loss": -27.56987953186035, "global_step": 585550, "epoch": 7054} {"train_loss": -27.5449161529541, "global_step": 585551, "epoch": 7054} {"train_loss": -27.68495750427246, "global_step": 585552, "epoch": 7054} {"train_loss": -27.412336349487305, "global_step": 585553, "epoch": 7054} {"train_loss": -27.498865127563477, "global_step": 585554, "epoch": 7054} {"train_loss": -27.94122886657715, "global_step": 585555, "epoch": 7054} {"train_loss": -27.68292808532715, "global_step": 585556, "epoch": 7054} {"train_loss": -28.05316734313965, "global_step": 585557, "epoch": 7054} {"train_loss": -27.897748947143555, "global_step": 585558, "epoch": 7054} {"train_loss": -27.93427085876465, "global_step": 585559, "epoch": 7054} {"train_loss": -27.727283477783203, "global_step": 585560, "epoch": 7054} {"train_loss": -27.702627182006836, "global_step": 585561, "epoch": 7054} {"train_loss": -27.582019805908203, "global_step": 585562, "epoch": 7054} {"train_loss": -27.91822624206543, "global_step": 585563, "epoch": 7054} {"train_loss": -27.693693344851575, "global_step": 585564, "epoch": 7054, "val_loss": 6509249.0} {"train_loss": -27.315357208251953, "global_step": 585565, "epoch": 7055} {"train_loss": -26.271841049194336, "global_step": 585566, "epoch": 7055} {"train_loss": -26.848834991455078, "global_step": 585567, "epoch": 7055} {"train_loss": -27.45111083984375, "global_step": 585568, "epoch": 7055} {"train_loss": -27.034717559814453, "global_step": 585569, "epoch": 7055} {"train_loss": -26.070737838745117, "global_step": 585570, "epoch": 7055} {"train_loss": -27.336294174194336, "global_step": 585571, "epoch": 7055} {"train_loss": -27.439868927001953, "global_step": 585572, "epoch": 7055} {"train_loss": -27.750085830688477, "global_step": 585573, "epoch": 7055} {"train_loss": -27.3089542388916, "global_step": 585574, "epoch": 7055} {"train_loss": -27.33233642578125, "global_step": 585575, "epoch": 7055} {"train_loss": -27.339399337768555, "global_step": 585576, "epoch": 7055} {"train_loss": -27.257476806640625, "global_step": 585577, "epoch": 7055} {"train_loss": -27.448034286499023, "global_step": 585578, "epoch": 7055} {"train_loss": -27.323627471923828, "global_step": 585579, "epoch": 7055} {"train_loss": -27.868192672729492, "global_step": 585580, "epoch": 7055} {"train_loss": -27.54996681213379, "global_step": 585581, "epoch": 7055} {"train_loss": -27.9405574798584, "global_step": 585582, "epoch": 7055} {"train_loss": -27.661670684814453, "global_step": 585583, "epoch": 7055} {"train_loss": -27.602148056030273, "global_step": 585584, "epoch": 7055} {"train_loss": -27.778066635131836, "global_step": 585585, "epoch": 7055} {"train_loss": -27.978546142578125, "global_step": 585586, "epoch": 7055} {"train_loss": -27.844812393188477, "global_step": 585587, "epoch": 7055} {"train_loss": -27.664098739624023, "global_step": 585588, "epoch": 7055} {"train_loss": -27.845346450805664, "global_step": 585589, "epoch": 7055} {"train_loss": -27.656402587890625, "global_step": 585590, "epoch": 7055} {"train_loss": -27.57062339782715, "global_step": 585591, "epoch": 7055} {"train_loss": -28.036518096923828, "global_step": 585592, "epoch": 7055} {"train_loss": -27.716339111328125, "global_step": 585593, "epoch": 7055} {"train_loss": -27.881467819213867, "global_step": 585594, "epoch": 7055} {"train_loss": -27.876943588256836, "global_step": 585595, "epoch": 7055} {"train_loss": -27.83685874938965, "global_step": 585596, "epoch": 7055} {"train_loss": -27.897430419921875, "global_step": 585597, "epoch": 7055} {"train_loss": -28.1678409576416, "global_step": 585598, "epoch": 7055} {"train_loss": -27.988037109375, "global_step": 585599, "epoch": 7055} {"train_loss": -27.83890724182129, "global_step": 585600, "epoch": 7055} {"train_loss": -28.265823364257812, "global_step": 585601, "epoch": 7055} {"train_loss": -27.775989532470703, "global_step": 585602, "epoch": 7055} {"train_loss": -28.081680297851562, "global_step": 585603, "epoch": 7055} {"train_loss": -27.990848541259766, "global_step": 585604, "epoch": 7055} {"train_loss": -27.544015884399414, "global_step": 585605, "epoch": 7055} {"train_loss": -27.988815307617188, "global_step": 585606, "epoch": 7055} {"train_loss": -27.920917510986328, "global_step": 585607, "epoch": 7055} {"train_loss": -27.674970626831055, "global_step": 585608, "epoch": 7055} {"train_loss": -28.047683715820312, "global_step": 585609, "epoch": 7055} {"train_loss": -27.75018310546875, "global_step": 585610, "epoch": 7055} {"train_loss": -27.751630783081055, "global_step": 585611, "epoch": 7055} {"train_loss": -27.5707950592041, "global_step": 585612, "epoch": 7055} {"train_loss": -27.766101837158203, "global_step": 585613, "epoch": 7055} {"train_loss": -28.040369033813477, "global_step": 585614, "epoch": 7055} {"train_loss": -28.021543502807617, "global_step": 585615, "epoch": 7055} {"train_loss": -27.9920597076416, "global_step": 585616, "epoch": 7055} {"train_loss": -28.113534927368164, "global_step": 585617, "epoch": 7055} {"train_loss": -28.2087345123291, "global_step": 585618, "epoch": 7055} {"train_loss": -28.06770133972168, "global_step": 585619, "epoch": 7055} {"train_loss": -28.394824981689453, "global_step": 585620, "epoch": 7055} {"train_loss": -27.936832427978516, "global_step": 585621, "epoch": 7055} {"train_loss": -28.263540267944336, "global_step": 585622, "epoch": 7055} {"train_loss": -27.91107749938965, "global_step": 585623, "epoch": 7055} {"train_loss": -28.222671508789062, "global_step": 585624, "epoch": 7055} {"train_loss": -28.4073486328125, "global_step": 585625, "epoch": 7055} {"train_loss": -28.422195434570312, "global_step": 585626, "epoch": 7055} {"train_loss": -27.905813217163086, "global_step": 585627, "epoch": 7055} {"train_loss": -27.9936466217041, "global_step": 585628, "epoch": 7055} {"train_loss": -28.122068405151367, "global_step": 585629, "epoch": 7055} {"train_loss": -27.81976890563965, "global_step": 585630, "epoch": 7055} {"train_loss": -27.9114933013916, "global_step": 585631, "epoch": 7055} {"train_loss": -27.81612205505371, "global_step": 585632, "epoch": 7055} {"train_loss": -28.022327423095703, "global_step": 585633, "epoch": 7055} {"train_loss": -27.723514556884766, "global_step": 585634, "epoch": 7055} {"train_loss": -28.087148666381836, "global_step": 585635, "epoch": 7055} {"train_loss": -28.14872169494629, "global_step": 585636, "epoch": 7055} {"train_loss": -27.6943302154541, "global_step": 585637, "epoch": 7055} {"train_loss": -27.97906494140625, "global_step": 585638, "epoch": 7055} {"train_loss": -28.4470157623291, "global_step": 585639, "epoch": 7055} {"train_loss": -28.0220947265625, "global_step": 585640, "epoch": 7055} {"train_loss": -28.324539184570312, "global_step": 585641, "epoch": 7055} {"train_loss": -28.23305320739746, "global_step": 585642, "epoch": 7055} {"train_loss": -28.184101104736328, "global_step": 585643, "epoch": 7055} {"train_loss": -28.389493942260742, "global_step": 585644, "epoch": 7055} {"train_loss": -28.339353561401367, "global_step": 585645, "epoch": 7055} {"train_loss": -27.999540328979492, "global_step": 585646, "epoch": 7055} {"train_loss": -27.81842493723674, "global_step": 585647, "epoch": 7055, "val_loss": 6503830.0} {"train_loss": -25.97743034362793, "global_step": 585648, "epoch": 7056} {"train_loss": -24.17995262145996, "global_step": 585649, "epoch": 7056} {"train_loss": -26.817996978759766, "global_step": 585650, "epoch": 7056} {"train_loss": -27.086957931518555, "global_step": 585651, "epoch": 7056} {"train_loss": -26.06646728515625, "global_step": 585652, "epoch": 7056} {"train_loss": -26.972436904907227, "global_step": 585653, "epoch": 7056} {"train_loss": -26.411970138549805, "global_step": 585654, "epoch": 7056} {"train_loss": -26.944299697875977, "global_step": 585655, "epoch": 7056} {"train_loss": -27.263904571533203, "global_step": 585656, "epoch": 7056} {"train_loss": -27.06142234802246, "global_step": 585657, "epoch": 7056} {"train_loss": -27.076269149780273, "global_step": 585658, "epoch": 7056} {"train_loss": -27.29570960998535, "global_step": 585659, "epoch": 7056} {"train_loss": -27.0139102935791, "global_step": 585660, "epoch": 7056} {"train_loss": -27.27974510192871, "global_step": 585661, "epoch": 7056} {"train_loss": -27.261484146118164, "global_step": 585662, "epoch": 7056} {"train_loss": -27.215656280517578, "global_step": 585663, "epoch": 7056} {"train_loss": -27.473072052001953, "global_step": 585664, "epoch": 7056} {"train_loss": -27.57861328125, "global_step": 585665, "epoch": 7056} {"train_loss": -27.460363388061523, "global_step": 585666, "epoch": 7056} {"train_loss": -27.446008682250977, "global_step": 585667, "epoch": 7056} {"train_loss": -27.5628719329834, "global_step": 585668, "epoch": 7056} {"train_loss": -27.671125411987305, "global_step": 585669, "epoch": 7056} {"train_loss": -27.448938369750977, "global_step": 585670, "epoch": 7056} {"train_loss": -27.466175079345703, "global_step": 585671, "epoch": 7056} {"train_loss": -27.54876708984375, "global_step": 585672, "epoch": 7056} {"train_loss": -27.48589515686035, "global_step": 585673, "epoch": 7056} {"train_loss": -27.379138946533203, "global_step": 585674, "epoch": 7056} {"train_loss": -27.609683990478516, "global_step": 585675, "epoch": 7056} {"train_loss": -27.573942184448242, "global_step": 585676, "epoch": 7056} {"train_loss": -27.516077041625977, "global_step": 585677, "epoch": 7056} {"train_loss": -28.171842575073242, "global_step": 585678, "epoch": 7056} {"train_loss": -27.499164581298828, "global_step": 585679, "epoch": 7056} {"train_loss": -28.034320831298828, "global_step": 585680, "epoch": 7056} {"train_loss": -27.928226470947266, "global_step": 585681, "epoch": 7056} {"train_loss": -27.450332641601562, "global_step": 585682, "epoch": 7056} {"train_loss": -27.749649047851562, "global_step": 585683, "epoch": 7056} {"train_loss": -27.810327529907227, "global_step": 585684, "epoch": 7056} {"train_loss": -27.66641616821289, "global_step": 585685, "epoch": 7056} {"train_loss": -27.782379150390625, "global_step": 585686, "epoch": 7056} {"train_loss": -27.832691192626953, "global_step": 585687, "epoch": 7056} {"train_loss": -27.707660675048828, "global_step": 585688, "epoch": 7056} {"train_loss": -27.734663009643555, "global_step": 585689, "epoch": 7056} {"train_loss": -27.77039909362793, "global_step": 585690, "epoch": 7056} {"train_loss": -27.750940322875977, "global_step": 585691, "epoch": 7056} {"train_loss": -28.075536727905273, "global_step": 585692, "epoch": 7056} {"train_loss": -28.056320190429688, "global_step": 585693, "epoch": 7056} {"train_loss": -28.075855255126953, "global_step": 585694, "epoch": 7056} {"train_loss": -27.864429473876953, "global_step": 585695, "epoch": 7056} {"train_loss": -27.8222713470459, "global_step": 585696, "epoch": 7056} {"train_loss": -28.64106559753418, "global_step": 585697, "epoch": 7056} {"train_loss": -27.977827072143555, "global_step": 585698, "epoch": 7056} {"train_loss": -27.9534854888916, "global_step": 585699, "epoch": 7056} {"train_loss": -28.401187896728516, "global_step": 585700, "epoch": 7056} {"train_loss": -27.938404083251953, "global_step": 585701, "epoch": 7056} {"train_loss": -28.241989135742188, "global_step": 585702, "epoch": 7056} {"train_loss": -28.402851104736328, "global_step": 585703, "epoch": 7056} {"train_loss": -28.052167892456055, "global_step": 585704, "epoch": 7056} {"train_loss": -27.802764892578125, "global_step": 585705, "epoch": 7056} {"train_loss": -27.828815460205078, "global_step": 585706, "epoch": 7056} {"train_loss": -27.88286781311035, "global_step": 585707, "epoch": 7056} {"train_loss": -28.06281852722168, "global_step": 585708, "epoch": 7056} {"train_loss": -28.497882843017578, "global_step": 585709, "epoch": 7056} {"train_loss": -27.97792625427246, "global_step": 585710, "epoch": 7056} {"train_loss": -28.090375900268555, "global_step": 585711, "epoch": 7056} {"train_loss": -28.4464168548584, "global_step": 585712, "epoch": 7056} {"train_loss": -28.291229248046875, "global_step": 585713, "epoch": 7056} {"train_loss": -28.11383628845215, "global_step": 585714, "epoch": 7056} {"train_loss": -27.920835494995117, "global_step": 585715, "epoch": 7056} {"train_loss": -27.994443893432617, "global_step": 585716, "epoch": 7056} {"train_loss": -28.188156127929688, "global_step": 585717, "epoch": 7056} {"train_loss": -27.758039474487305, "global_step": 585718, "epoch": 7056} {"train_loss": -27.986413955688477, "global_step": 585719, "epoch": 7056} {"train_loss": -27.753131866455078, "global_step": 585720, "epoch": 7056} {"train_loss": -28.073461532592773, "global_step": 585721, "epoch": 7056} {"train_loss": -27.80160903930664, "global_step": 585722, "epoch": 7056} {"train_loss": -27.010334014892578, "global_step": 585723, "epoch": 7056} {"train_loss": -26.943700790405273, "global_step": 585724, "epoch": 7056} {"train_loss": -26.831151962280273, "global_step": 585725, "epoch": 7056} {"train_loss": -27.100027084350586, "global_step": 585726, "epoch": 7056} {"train_loss": -27.33401870727539, "global_step": 585727, "epoch": 7056} {"train_loss": -27.347904205322266, "global_step": 585728, "epoch": 7056} {"train_loss": -27.318511962890625, "global_step": 585729, "epoch": 7056} {"train_loss": -27.592507098094526, "global_step": 585730, "epoch": 7056, "val_loss": 6524130.5} {"train_loss": -26.339406967163086, "global_step": 585731, "epoch": 7057} {"train_loss": -26.659805297851562, "global_step": 585732, "epoch": 7057} {"train_loss": -26.466901779174805, "global_step": 585733, "epoch": 7057} {"train_loss": -26.236907958984375, "global_step": 585734, "epoch": 7057} {"train_loss": -26.698413848876953, "global_step": 585735, "epoch": 7057} {"train_loss": -26.26470375061035, "global_step": 585736, "epoch": 7057} {"train_loss": -25.32581329345703, "global_step": 585737, "epoch": 7057} {"train_loss": -27.047718048095703, "global_step": 585738, "epoch": 7057} {"train_loss": -26.809019088745117, "global_step": 585739, "epoch": 7057} {"train_loss": -26.8841552734375, "global_step": 585740, "epoch": 7057} {"train_loss": -26.15228271484375, "global_step": 585741, "epoch": 7057} {"train_loss": -26.587177276611328, "global_step": 585742, "epoch": 7057} {"train_loss": -27.065439224243164, "global_step": 585743, "epoch": 7057} {"train_loss": -27.13092613220215, "global_step": 585744, "epoch": 7057} {"train_loss": -26.95516014099121, "global_step": 585745, "epoch": 7057} {"train_loss": -27.14749526977539, "global_step": 585746, "epoch": 7057} {"train_loss": -27.01312828063965, "global_step": 585747, "epoch": 7057} {"train_loss": -27.444482803344727, "global_step": 585748, "epoch": 7057} {"train_loss": -26.950271606445312, "global_step": 585749, "epoch": 7057} {"train_loss": -27.264514923095703, "global_step": 585750, "epoch": 7057} {"train_loss": -27.420886993408203, "global_step": 585751, "epoch": 7057} {"train_loss": -27.01032829284668, "global_step": 585752, "epoch": 7057} {"train_loss": -27.670734405517578, "global_step": 585753, "epoch": 7057} {"train_loss": -27.247541427612305, "global_step": 585754, "epoch": 7057} {"train_loss": -27.067182540893555, "global_step": 585755, "epoch": 7057} {"train_loss": -27.508405685424805, "global_step": 585756, "epoch": 7057} {"train_loss": -27.68910026550293, "global_step": 585757, "epoch": 7057} {"train_loss": -27.61614990234375, "global_step": 585758, "epoch": 7057} {"train_loss": -27.455005645751953, "global_step": 585759, "epoch": 7057} {"train_loss": -27.7407283782959, "global_step": 585760, "epoch": 7057} {"train_loss": -27.90797233581543, "global_step": 585761, "epoch": 7057} {"train_loss": -27.536230087280273, "global_step": 585762, "epoch": 7057} {"train_loss": -27.409561157226562, "global_step": 585763, "epoch": 7057} {"train_loss": -27.671613693237305, "global_step": 585764, "epoch": 7057} {"train_loss": -27.76484489440918, "global_step": 585765, "epoch": 7057} {"train_loss": -28.08233070373535, "global_step": 585766, "epoch": 7057} {"train_loss": -28.018781661987305, "global_step": 585767, "epoch": 7057} {"train_loss": -28.052717208862305, "global_step": 585768, "epoch": 7057} {"train_loss": -27.827680587768555, "global_step": 585769, "epoch": 7057} {"train_loss": -27.768787384033203, "global_step": 585770, "epoch": 7057} {"train_loss": -28.05311393737793, "global_step": 585771, "epoch": 7057} {"train_loss": -28.017669677734375, "global_step": 585772, "epoch": 7057} {"train_loss": -28.278980255126953, "global_step": 585773, "epoch": 7057} {"train_loss": -27.93349266052246, "global_step": 585774, "epoch": 7057} {"train_loss": -28.22926139831543, "global_step": 585775, "epoch": 7057} {"train_loss": -27.517820358276367, "global_step": 585776, "epoch": 7057} {"train_loss": -28.0748233795166, "global_step": 585777, "epoch": 7057} {"train_loss": -28.297574996948242, "global_step": 585778, "epoch": 7057} {"train_loss": -27.99004554748535, "global_step": 585779, "epoch": 7057} {"train_loss": -27.80095863342285, "global_step": 585780, "epoch": 7057} {"train_loss": -27.923925399780273, "global_step": 585781, "epoch": 7057} {"train_loss": -27.733163833618164, "global_step": 585782, "epoch": 7057} {"train_loss": -27.96600914001465, "global_step": 585783, "epoch": 7057} {"train_loss": -28.0604248046875, "global_step": 585784, "epoch": 7057} {"train_loss": -28.06084632873535, "global_step": 585785, "epoch": 7057} {"train_loss": -28.13458824157715, "global_step": 585786, "epoch": 7057} {"train_loss": -28.064733505249023, "global_step": 585787, "epoch": 7057} {"train_loss": -28.204736709594727, "global_step": 585788, "epoch": 7057} {"train_loss": -28.082006454467773, "global_step": 585789, "epoch": 7057} {"train_loss": -28.095434188842773, "global_step": 585790, "epoch": 7057} {"train_loss": -28.655073165893555, "global_step": 585791, "epoch": 7057} {"train_loss": -28.068323135375977, "global_step": 585792, "epoch": 7057} {"train_loss": -27.958011627197266, "global_step": 585793, "epoch": 7057} {"train_loss": -28.001073837280273, "global_step": 585794, "epoch": 7057} {"train_loss": -28.414447784423828, "global_step": 585795, "epoch": 7057} {"train_loss": -28.082809448242188, "global_step": 585796, "epoch": 7057} {"train_loss": -28.043161392211914, "global_step": 585797, "epoch": 7057} {"train_loss": -28.127328872680664, "global_step": 585798, "epoch": 7057} {"train_loss": -28.209671020507812, "global_step": 585799, "epoch": 7057} {"train_loss": -28.1184024810791, "global_step": 585800, "epoch": 7057} {"train_loss": -28.258642196655273, "global_step": 585801, "epoch": 7057} {"train_loss": -28.02119255065918, "global_step": 585802, "epoch": 7057} {"train_loss": -28.254323959350586, "global_step": 585803, "epoch": 7057} {"train_loss": -28.367441177368164, "global_step": 585804, "epoch": 7057} {"train_loss": -28.174962997436523, "global_step": 585805, "epoch": 7057} {"train_loss": -28.092578887939453, "global_step": 585806, "epoch": 7057} {"train_loss": -28.14217185974121, "global_step": 585807, "epoch": 7057} {"train_loss": -27.880142211914062, "global_step": 585808, "epoch": 7057} {"train_loss": -27.7707576751709, "global_step": 585809, "epoch": 7057} {"train_loss": -27.907440185546875, "global_step": 585810, "epoch": 7057} {"train_loss": -28.243478775024414, "global_step": 585811, "epoch": 7057} {"train_loss": -27.6674861907959, "global_step": 585812, "epoch": 7057} {"train_loss": -27.644243631018213, "global_step": 585813, "epoch": 7057, "val_loss": 6599577.5} {"train_loss": -26.810327529907227, "global_step": 585814, "epoch": 7058} {"train_loss": -26.895673751831055, "global_step": 585815, "epoch": 7058} {"train_loss": -26.548925399780273, "global_step": 585816, "epoch": 7058} {"train_loss": -26.383869171142578, "global_step": 585817, "epoch": 7058} {"train_loss": -26.427902221679688, "global_step": 585818, "epoch": 7058} {"train_loss": -26.539932250976562, "global_step": 585819, "epoch": 7058} {"train_loss": -27.104928970336914, "global_step": 585820, "epoch": 7058} {"train_loss": -26.899337768554688, "global_step": 585821, "epoch": 7058} {"train_loss": -26.7194881439209, "global_step": 585822, "epoch": 7058} {"train_loss": -26.932783126831055, "global_step": 585823, "epoch": 7058} {"train_loss": -27.174787521362305, "global_step": 585824, "epoch": 7058} {"train_loss": -27.3349666595459, "global_step": 585825, "epoch": 7058} {"train_loss": -27.045141220092773, "global_step": 585826, "epoch": 7058} {"train_loss": -27.01235008239746, "global_step": 585827, "epoch": 7058} {"train_loss": -27.1055965423584, "global_step": 585828, "epoch": 7058} {"train_loss": -27.03138542175293, "global_step": 585829, "epoch": 7058} {"train_loss": -27.414840698242188, "global_step": 585830, "epoch": 7058} {"train_loss": -27.326465606689453, "global_step": 585831, "epoch": 7058} {"train_loss": -27.638996124267578, "global_step": 585832, "epoch": 7058} {"train_loss": -27.54302406311035, "global_step": 585833, "epoch": 7058} {"train_loss": -27.733945846557617, "global_step": 585834, "epoch": 7058} {"train_loss": -27.485013961791992, "global_step": 585835, "epoch": 7058} {"train_loss": -27.538904190063477, "global_step": 585836, "epoch": 7058} {"train_loss": -27.813800811767578, "global_step": 585837, "epoch": 7058} {"train_loss": -27.625812530517578, "global_step": 585838, "epoch": 7058} {"train_loss": -27.492816925048828, "global_step": 585839, "epoch": 7058} {"train_loss": -27.663532257080078, "global_step": 585840, "epoch": 7058} {"train_loss": -27.718168258666992, "global_step": 585841, "epoch": 7058} {"train_loss": -27.995681762695312, "global_step": 585842, "epoch": 7058} {"train_loss": -27.66145896911621, "global_step": 585843, "epoch": 7058} {"train_loss": -28.166900634765625, "global_step": 585844, "epoch": 7058} {"train_loss": -27.94582176208496, "global_step": 585845, "epoch": 7058} {"train_loss": -28.08323097229004, "global_step": 585846, "epoch": 7058} {"train_loss": -27.5870304107666, "global_step": 585847, "epoch": 7058} {"train_loss": -27.865896224975586, "global_step": 585848, "epoch": 7058} {"train_loss": -28.14865493774414, "global_step": 585849, "epoch": 7058} {"train_loss": -27.93140983581543, "global_step": 585850, "epoch": 7058} {"train_loss": -27.73996353149414, "global_step": 585851, "epoch": 7058} {"train_loss": -27.856159210205078, "global_step": 585852, "epoch": 7058} {"train_loss": -27.912433624267578, "global_step": 585853, "epoch": 7058} {"train_loss": -27.806076049804688, "global_step": 585854, "epoch": 7058} {"train_loss": -27.876068115234375, "global_step": 585855, "epoch": 7058} {"train_loss": -27.980817794799805, "global_step": 585856, "epoch": 7058} {"train_loss": -27.699390411376953, "global_step": 585857, "epoch": 7058} {"train_loss": -28.270496368408203, "global_step": 585858, "epoch": 7058} {"train_loss": -27.6103515625, "global_step": 585859, "epoch": 7058} {"train_loss": -28.203779220581055, "global_step": 585860, "epoch": 7058} {"train_loss": -27.551513671875, "global_step": 585861, "epoch": 7058} {"train_loss": -27.93647575378418, "global_step": 585862, "epoch": 7058} {"train_loss": -28.224084854125977, "global_step": 585863, "epoch": 7058} {"train_loss": -27.604984283447266, "global_step": 585864, "epoch": 7058} {"train_loss": -27.82891845703125, "global_step": 585865, "epoch": 7058} {"train_loss": -28.199594497680664, "global_step": 585866, "epoch": 7058} {"train_loss": -27.997879028320312, "global_step": 585867, "epoch": 7058} {"train_loss": -28.06617546081543, "global_step": 585868, "epoch": 7058} {"train_loss": -27.827016830444336, "global_step": 585869, "epoch": 7058} {"train_loss": -28.079736709594727, "global_step": 585870, "epoch": 7058} {"train_loss": -27.92498207092285, "global_step": 585871, "epoch": 7058} {"train_loss": -27.853504180908203, "global_step": 585872, "epoch": 7058} {"train_loss": -27.986291885375977, "global_step": 585873, "epoch": 7058} {"train_loss": -27.80517578125, "global_step": 585874, "epoch": 7058} {"train_loss": -28.395620346069336, "global_step": 585875, "epoch": 7058} {"train_loss": -28.11435890197754, "global_step": 585876, "epoch": 7058} {"train_loss": -27.697315216064453, "global_step": 585877, "epoch": 7058} {"train_loss": -28.159927368164062, "global_step": 585878, "epoch": 7058} {"train_loss": -28.13937759399414, "global_step": 585879, "epoch": 7058} {"train_loss": -27.568592071533203, "global_step": 585880, "epoch": 7058} {"train_loss": -27.834705352783203, "global_step": 585881, "epoch": 7058} {"train_loss": -28.27813148498535, "global_step": 585882, "epoch": 7058} {"train_loss": -28.079425811767578, "global_step": 585883, "epoch": 7058} {"train_loss": -27.852514266967773, "global_step": 585884, "epoch": 7058} {"train_loss": -28.13616371154785, "global_step": 585885, "epoch": 7058} {"train_loss": -27.461084365844727, "global_step": 585886, "epoch": 7058} {"train_loss": -28.03057289123535, "global_step": 585887, "epoch": 7058} {"train_loss": -28.164636611938477, "global_step": 585888, "epoch": 7058} {"train_loss": -27.822574615478516, "global_step": 585889, "epoch": 7058} {"train_loss": -27.83782386779785, "global_step": 585890, "epoch": 7058} {"train_loss": -28.143407821655273, "global_step": 585891, "epoch": 7058} {"train_loss": -28.16143226623535, "global_step": 585892, "epoch": 7058} {"train_loss": -28.14924430847168, "global_step": 585893, "epoch": 7058} {"train_loss": -27.93855857849121, "global_step": 585894, "epoch": 7058} {"train_loss": -28.37055778503418, "global_step": 585895, "epoch": 7058} {"train_loss": -27.695016562220562, "global_step": 585896, "epoch": 7058, "val_loss": 6563865.0} {"train_loss": -27.114246368408203, "global_step": 585897, "epoch": 7059} {"train_loss": -27.299062728881836, "global_step": 585898, "epoch": 7059} {"train_loss": -27.4626522064209, "global_step": 585899, "epoch": 7059} {"train_loss": -27.7835636138916, "global_step": 585900, "epoch": 7059} {"train_loss": -27.091571807861328, "global_step": 585901, "epoch": 7059} {"train_loss": -27.37276268005371, "global_step": 585902, "epoch": 7059} {"train_loss": -27.18634033203125, "global_step": 585903, "epoch": 7059} {"train_loss": -27.5269718170166, "global_step": 585904, "epoch": 7059} {"train_loss": -27.155487060546875, "global_step": 585905, "epoch": 7059} {"train_loss": -27.252283096313477, "global_step": 585906, "epoch": 7059} {"train_loss": -27.302295684814453, "global_step": 585907, "epoch": 7059} {"train_loss": -27.694650650024414, "global_step": 585908, "epoch": 7059} {"train_loss": -27.37135124206543, "global_step": 585909, "epoch": 7059} {"train_loss": -27.59665298461914, "global_step": 585910, "epoch": 7059} {"train_loss": -26.72736167907715, "global_step": 585911, "epoch": 7059} {"train_loss": -27.54351806640625, "global_step": 585912, "epoch": 7059} {"train_loss": -27.7725887298584, "global_step": 585913, "epoch": 7059} {"train_loss": -27.5465087890625, "global_step": 585914, "epoch": 7059} {"train_loss": -27.667926788330078, "global_step": 585915, "epoch": 7059} {"train_loss": -27.45588493347168, "global_step": 585916, "epoch": 7059} {"train_loss": -27.74952507019043, "global_step": 585917, "epoch": 7059} {"train_loss": -27.782629013061523, "global_step": 585918, "epoch": 7059} {"train_loss": -27.791467666625977, "global_step": 585919, "epoch": 7059} {"train_loss": -27.856435775756836, "global_step": 585920, "epoch": 7059} {"train_loss": -27.84954261779785, "global_step": 585921, "epoch": 7059} {"train_loss": -27.641834259033203, "global_step": 585922, "epoch": 7059} {"train_loss": -28.078596115112305, "global_step": 585923, "epoch": 7059} {"train_loss": -27.768369674682617, "global_step": 585924, "epoch": 7059} {"train_loss": -27.825925827026367, "global_step": 585925, "epoch": 7059} {"train_loss": -27.722232818603516, "global_step": 585926, "epoch": 7059} {"train_loss": -27.94012451171875, "global_step": 585927, "epoch": 7059} {"train_loss": -28.038557052612305, "global_step": 585928, "epoch": 7059} {"train_loss": -27.958898544311523, "global_step": 585929, "epoch": 7059} {"train_loss": -27.400482177734375, "global_step": 585930, "epoch": 7059} {"train_loss": -27.9666748046875, "global_step": 585931, "epoch": 7059} {"train_loss": -27.985614776611328, "global_step": 585932, "epoch": 7059} {"train_loss": -27.973859786987305, "global_step": 585933, "epoch": 7059} {"train_loss": -28.1291561126709, "global_step": 585934, "epoch": 7059} {"train_loss": -27.844812393188477, "global_step": 585935, "epoch": 7059} {"train_loss": -28.316303253173828, "global_step": 585936, "epoch": 7059} {"train_loss": -28.173828125, "global_step": 585937, "epoch": 7059} {"train_loss": -28.08199119567871, "global_step": 585938, "epoch": 7059} {"train_loss": -27.87041664123535, "global_step": 585939, "epoch": 7059} {"train_loss": -28.3455810546875, "global_step": 585940, "epoch": 7059} {"train_loss": -27.842390060424805, "global_step": 585941, "epoch": 7059} {"train_loss": -27.81501579284668, "global_step": 585942, "epoch": 7059} {"train_loss": -27.856830596923828, "global_step": 585943, "epoch": 7059} {"train_loss": -27.822956085205078, "global_step": 585944, "epoch": 7059} {"train_loss": -28.239933013916016, "global_step": 585945, "epoch": 7059} {"train_loss": -28.37639808654785, "global_step": 585946, "epoch": 7059} {"train_loss": -28.21748161315918, "global_step": 585947, "epoch": 7059} {"train_loss": -28.1909236907959, "global_step": 585948, "epoch": 7059} {"train_loss": -28.111616134643555, "global_step": 585949, "epoch": 7059} {"train_loss": -28.44952392578125, "global_step": 585950, "epoch": 7059} {"train_loss": -27.86859130859375, "global_step": 585951, "epoch": 7059} {"train_loss": -28.05262565612793, "global_step": 585952, "epoch": 7059} {"train_loss": -28.183155059814453, "global_step": 585953, "epoch": 7059} {"train_loss": -28.052295684814453, "global_step": 585954, "epoch": 7059} {"train_loss": -27.90015983581543, "global_step": 585955, "epoch": 7059} {"train_loss": -27.903614044189453, "global_step": 585956, "epoch": 7059} {"train_loss": -28.237720489501953, "global_step": 585957, "epoch": 7059} {"train_loss": -28.039005279541016, "global_step": 585958, "epoch": 7059} {"train_loss": -27.880685806274414, "global_step": 585959, "epoch": 7059} {"train_loss": -27.78737449645996, "global_step": 585960, "epoch": 7059} {"train_loss": -28.051137924194336, "global_step": 585961, "epoch": 7059} {"train_loss": -27.835174560546875, "global_step": 585962, "epoch": 7059} {"train_loss": -27.9859676361084, "global_step": 585963, "epoch": 7059} {"train_loss": -27.6286563873291, "global_step": 585964, "epoch": 7059} {"train_loss": -27.133045196533203, "global_step": 585965, "epoch": 7059} {"train_loss": -26.37531089782715, "global_step": 585966, "epoch": 7059} {"train_loss": -26.202789306640625, "global_step": 585967, "epoch": 7059} {"train_loss": -27.38174819946289, "global_step": 585968, "epoch": 7059} {"train_loss": -27.440134048461914, "global_step": 585969, "epoch": 7059} {"train_loss": -27.353778839111328, "global_step": 585970, "epoch": 7059} {"train_loss": -27.737829208374023, "global_step": 585971, "epoch": 7059} {"train_loss": -27.371536254882812, "global_step": 585972, "epoch": 7059} {"train_loss": -27.75797462463379, "global_step": 585973, "epoch": 7059} {"train_loss": -27.720182418823242, "global_step": 585974, "epoch": 7059} {"train_loss": -27.90164566040039, "global_step": 585975, "epoch": 7059} {"train_loss": -27.716821670532227, "global_step": 585976, "epoch": 7059} {"train_loss": -28.1711368560791, "global_step": 585977, "epoch": 7059} {"train_loss": -27.666595458984375, "global_step": 585978, "epoch": 7059} {"train_loss": -27.75712284409856, "global_step": 585979, "epoch": 7059, "val_loss": 6472260.0} {"train_loss": -26.403919219970703, "global_step": 585980, "epoch": 7060} {"train_loss": -26.714984893798828, "global_step": 585981, "epoch": 7060} {"train_loss": -26.58392333984375, "global_step": 585982, "epoch": 7060} {"train_loss": -27.08693504333496, "global_step": 585983, "epoch": 7060} {"train_loss": -27.161544799804688, "global_step": 585984, "epoch": 7060} {"train_loss": -27.01433753967285, "global_step": 585985, "epoch": 7060} {"train_loss": -27.385486602783203, "global_step": 585986, "epoch": 7060} {"train_loss": -27.291479110717773, "global_step": 585987, "epoch": 7060} {"train_loss": -27.041284561157227, "global_step": 585988, "epoch": 7060} {"train_loss": -27.40167808532715, "global_step": 585989, "epoch": 7060} {"train_loss": -27.410755157470703, "global_step": 585990, "epoch": 7060} {"train_loss": -27.416284561157227, "global_step": 585991, "epoch": 7060} {"train_loss": -27.411279678344727, "global_step": 585992, "epoch": 7060} {"train_loss": -27.739490509033203, "global_step": 585993, "epoch": 7060} {"train_loss": -27.36395263671875, "global_step": 585994, "epoch": 7060} {"train_loss": -27.27276039123535, "global_step": 585995, "epoch": 7060} {"train_loss": -27.61492347717285, "global_step": 585996, "epoch": 7060} {"train_loss": -28.0538330078125, "global_step": 585997, "epoch": 7060} {"train_loss": -27.29731559753418, "global_step": 585998, "epoch": 7060} {"train_loss": -27.592763900756836, "global_step": 585999, "epoch": 7060} {"train_loss": -27.903650283813477, "global_step": 586000, "epoch": 7060} {"train_loss": -27.825855255126953, "global_step": 586001, "epoch": 7060} {"train_loss": -28.118459701538086, "global_step": 586002, "epoch": 7060} {"train_loss": -27.758502960205078, "global_step": 586003, "epoch": 7060} {"train_loss": -27.64359474182129, "global_step": 586004, "epoch": 7060} {"train_loss": -27.80609130859375, "global_step": 586005, "epoch": 7060} {"train_loss": -27.863073348999023, "global_step": 586006, "epoch": 7060} {"train_loss": -27.724023818969727, "global_step": 586007, "epoch": 7060} {"train_loss": -28.00847816467285, "global_step": 586008, "epoch": 7060} {"train_loss": -27.996368408203125, "global_step": 586009, "epoch": 7060} {"train_loss": -28.042362213134766, "global_step": 586010, "epoch": 7060} {"train_loss": -28.031579971313477, "global_step": 586011, "epoch": 7060} {"train_loss": -27.792097091674805, "global_step": 586012, "epoch": 7060} {"train_loss": -27.79462242126465, "global_step": 586013, "epoch": 7060} {"train_loss": -28.013595581054688, "global_step": 586014, "epoch": 7060} {"train_loss": -27.955930709838867, "global_step": 586015, "epoch": 7060} {"train_loss": -27.99338722229004, "global_step": 586016, "epoch": 7060} {"train_loss": -27.888965606689453, "global_step": 586017, "epoch": 7060} {"train_loss": -28.28182029724121, "global_step": 586018, "epoch": 7060} {"train_loss": -28.155195236206055, "global_step": 586019, "epoch": 7060} {"train_loss": -28.3214111328125, "global_step": 586020, "epoch": 7060} {"train_loss": -27.784814834594727, "global_step": 586021, "epoch": 7060} {"train_loss": -28.462665557861328, "global_step": 586022, "epoch": 7060} {"train_loss": -27.9256591796875, "global_step": 586023, "epoch": 7060} {"train_loss": -27.882917404174805, "global_step": 586024, "epoch": 7060} {"train_loss": -27.85114860534668, "global_step": 586025, "epoch": 7060} {"train_loss": -28.042245864868164, "global_step": 586026, "epoch": 7060} {"train_loss": -28.121387481689453, "global_step": 586027, "epoch": 7060} {"train_loss": -27.90364646911621, "global_step": 586028, "epoch": 7060} {"train_loss": -28.154401779174805, "global_step": 586029, "epoch": 7060} {"train_loss": -28.36231803894043, "global_step": 586030, "epoch": 7060} {"train_loss": -28.006601333618164, "global_step": 586031, "epoch": 7060} {"train_loss": -28.421539306640625, "global_step": 586032, "epoch": 7060} {"train_loss": -28.585607528686523, "global_step": 586033, "epoch": 7060} {"train_loss": -28.124134063720703, "global_step": 586034, "epoch": 7060} {"train_loss": -27.942102432250977, "global_step": 586035, "epoch": 7060} {"train_loss": -27.985395431518555, "global_step": 586036, "epoch": 7060} {"train_loss": -27.87763023376465, "global_step": 586037, "epoch": 7060} {"train_loss": -28.149341583251953, "global_step": 586038, "epoch": 7060} {"train_loss": -27.92853355407715, "global_step": 586039, "epoch": 7060} {"train_loss": -28.11627769470215, "global_step": 586040, "epoch": 7060} {"train_loss": -28.208484649658203, "global_step": 586041, "epoch": 7060} {"train_loss": -28.025684356689453, "global_step": 586042, "epoch": 7060} {"train_loss": -27.987842559814453, "global_step": 586043, "epoch": 7060} {"train_loss": -28.03399658203125, "global_step": 586044, "epoch": 7060} {"train_loss": -27.610559463500977, "global_step": 586045, "epoch": 7060} {"train_loss": -27.450647354125977, "global_step": 586046, "epoch": 7060} {"train_loss": -27.450143814086914, "global_step": 586047, "epoch": 7060} {"train_loss": -28.0456485748291, "global_step": 586048, "epoch": 7060} {"train_loss": -28.1549015045166, "global_step": 586049, "epoch": 7060} {"train_loss": -27.740392684936523, "global_step": 586050, "epoch": 7060} {"train_loss": -27.727994918823242, "global_step": 586051, "epoch": 7060} {"train_loss": -27.708698272705078, "global_step": 586052, "epoch": 7060} {"train_loss": -27.3230037689209, "global_step": 586053, "epoch": 7060} {"train_loss": -26.664859771728516, "global_step": 586054, "epoch": 7060} {"train_loss": -26.374881744384766, "global_step": 586055, "epoch": 7060} {"train_loss": -27.086278915405273, "global_step": 586056, "epoch": 7060} {"train_loss": -27.959211349487305, "global_step": 586057, "epoch": 7060} {"train_loss": -27.0096492767334, "global_step": 586058, "epoch": 7060} {"train_loss": -27.67426872253418, "global_step": 586059, "epoch": 7060} {"train_loss": -27.2165584564209, "global_step": 586060, "epoch": 7060} {"train_loss": -27.246484756469727, "global_step": 586061, "epoch": 7060} {"train_loss": -27.72559154464538, "global_step": 586062, "epoch": 7060, "val_loss": 6599770.0} {"train_loss": -27.232938766479492, "global_step": 586063, "epoch": 7061} {"train_loss": -27.137588500976562, "global_step": 586064, "epoch": 7061} {"train_loss": -27.034650802612305, "global_step": 586065, "epoch": 7061} {"train_loss": -27.87285804748535, "global_step": 586066, "epoch": 7061} {"train_loss": -27.00186538696289, "global_step": 586067, "epoch": 7061} {"train_loss": -27.688138961791992, "global_step": 586068, "epoch": 7061} {"train_loss": -27.0445556640625, "global_step": 586069, "epoch": 7061} {"train_loss": -27.87198257446289, "global_step": 586070, "epoch": 7061} {"train_loss": -27.748600006103516, "global_step": 586071, "epoch": 7061} {"train_loss": -27.511646270751953, "global_step": 586072, "epoch": 7061} {"train_loss": -27.360157012939453, "global_step": 586073, "epoch": 7061} {"train_loss": -27.37471580505371, "global_step": 586074, "epoch": 7061} {"train_loss": -27.238693237304688, "global_step": 586075, "epoch": 7061} {"train_loss": -27.81422996520996, "global_step": 586076, "epoch": 7061} {"train_loss": -27.719919204711914, "global_step": 586077, "epoch": 7061} {"train_loss": -27.515033721923828, "global_step": 586078, "epoch": 7061} {"train_loss": -27.71685218811035, "global_step": 586079, "epoch": 7061} {"train_loss": -27.81365394592285, "global_step": 586080, "epoch": 7061} {"train_loss": -27.9443416595459, "global_step": 586081, "epoch": 7061} {"train_loss": -27.675018310546875, "global_step": 586082, "epoch": 7061} {"train_loss": -27.69463539123535, "global_step": 586083, "epoch": 7061} {"train_loss": -27.793989181518555, "global_step": 586084, "epoch": 7061} {"train_loss": -28.136066436767578, "global_step": 586085, "epoch": 7061} {"train_loss": -27.598600387573242, "global_step": 586086, "epoch": 7061} {"train_loss": -27.989765167236328, "global_step": 586087, "epoch": 7061} {"train_loss": -27.769073486328125, "global_step": 586088, "epoch": 7061} {"train_loss": -27.86838150024414, "global_step": 586089, "epoch": 7061} {"train_loss": -28.0865478515625, "global_step": 586090, "epoch": 7061} {"train_loss": -27.95643424987793, "global_step": 586091, "epoch": 7061} {"train_loss": -28.597412109375, "global_step": 586092, "epoch": 7061} {"train_loss": -28.016149520874023, "global_step": 586093, "epoch": 7061} {"train_loss": -28.3768367767334, "global_step": 586094, "epoch": 7061} {"train_loss": -27.947179794311523, "global_step": 586095, "epoch": 7061} {"train_loss": -27.91768455505371, "global_step": 586096, "epoch": 7061} {"train_loss": -28.116168975830078, "global_step": 586097, "epoch": 7061} {"train_loss": -27.933252334594727, "global_step": 586098, "epoch": 7061} {"train_loss": -28.255720138549805, "global_step": 586099, "epoch": 7061} {"train_loss": -27.984731674194336, "global_step": 586100, "epoch": 7061} {"train_loss": -28.200292587280273, "global_step": 586101, "epoch": 7061} {"train_loss": -27.779401779174805, "global_step": 586102, "epoch": 7061} {"train_loss": -28.186376571655273, "global_step": 586103, "epoch": 7061} {"train_loss": -27.97261619567871, "global_step": 586104, "epoch": 7061} {"train_loss": -28.020450592041016, "global_step": 586105, "epoch": 7061} {"train_loss": -28.2065486907959, "global_step": 586106, "epoch": 7061} {"train_loss": -28.113428115844727, "global_step": 586107, "epoch": 7061} {"train_loss": -28.0056095123291, "global_step": 586108, "epoch": 7061} {"train_loss": -28.42637062072754, "global_step": 586109, "epoch": 7061} {"train_loss": -28.4741153717041, "global_step": 586110, "epoch": 7061} {"train_loss": -27.9469051361084, "global_step": 586111, "epoch": 7061} {"train_loss": -27.592147827148438, "global_step": 586112, "epoch": 7061} {"train_loss": -28.045026779174805, "global_step": 586113, "epoch": 7061} {"train_loss": -27.88899803161621, "global_step": 586114, "epoch": 7061} {"train_loss": -28.284154891967773, "global_step": 586115, "epoch": 7061} {"train_loss": -28.274255752563477, "global_step": 586116, "epoch": 7061} {"train_loss": -27.737661361694336, "global_step": 586117, "epoch": 7061} {"train_loss": -28.408340454101562, "global_step": 586118, "epoch": 7061} {"train_loss": -28.2867488861084, "global_step": 586119, "epoch": 7061} {"train_loss": -27.780115127563477, "global_step": 586120, "epoch": 7061} {"train_loss": -27.801374435424805, "global_step": 586121, "epoch": 7061} {"train_loss": -27.845800399780273, "global_step": 586122, "epoch": 7061} {"train_loss": -28.101669311523438, "global_step": 586123, "epoch": 7061} {"train_loss": -28.243408203125, "global_step": 586124, "epoch": 7061} {"train_loss": -28.026981353759766, "global_step": 586125, "epoch": 7061} {"train_loss": -28.050128936767578, "global_step": 586126, "epoch": 7061} {"train_loss": -28.08637046813965, "global_step": 586127, "epoch": 7061} {"train_loss": -28.069128036499023, "global_step": 586128, "epoch": 7061} {"train_loss": -27.91839027404785, "global_step": 586129, "epoch": 7061} {"train_loss": -27.85700035095215, "global_step": 586130, "epoch": 7061} {"train_loss": -27.539016723632812, "global_step": 586131, "epoch": 7061} {"train_loss": -28.010700225830078, "global_step": 586132, "epoch": 7061} {"train_loss": -27.884113311767578, "global_step": 586133, "epoch": 7061} {"train_loss": -27.837112426757812, "global_step": 586134, "epoch": 7061} {"train_loss": -27.87046241760254, "global_step": 586135, "epoch": 7061} {"train_loss": -28.0015811920166, "global_step": 586136, "epoch": 7061} {"train_loss": -27.9136905670166, "global_step": 586137, "epoch": 7061} {"train_loss": -28.011571884155273, "global_step": 586138, "epoch": 7061} {"train_loss": -28.035802841186523, "global_step": 586139, "epoch": 7061} {"train_loss": -28.092626571655273, "global_step": 586140, "epoch": 7061} {"train_loss": -28.341405868530273, "global_step": 586141, "epoch": 7061} {"train_loss": -28.262897491455078, "global_step": 586142, "epoch": 7061} {"train_loss": -28.194120407104492, "global_step": 586143, "epoch": 7061} {"train_loss": -27.886682510375977, "global_step": 586144, "epoch": 7061} {"train_loss": -27.90228305954531, "global_step": 586145, "epoch": 7061, "val_loss": 6479419.0} {"train_loss": -25.86311149597168, "global_step": 586146, "epoch": 7062} {"train_loss": -25.18906593322754, "global_step": 586147, "epoch": 7062} {"train_loss": -26.693561553955078, "global_step": 586148, "epoch": 7062} {"train_loss": -26.944936752319336, "global_step": 586149, "epoch": 7062} {"train_loss": -26.998083114624023, "global_step": 586150, "epoch": 7062} {"train_loss": -27.21809959411621, "global_step": 586151, "epoch": 7062} {"train_loss": -26.610401153564453, "global_step": 586152, "epoch": 7062} {"train_loss": -27.76527214050293, "global_step": 586153, "epoch": 7062} {"train_loss": -26.46820640563965, "global_step": 586154, "epoch": 7062} {"train_loss": -26.87897300720215, "global_step": 586155, "epoch": 7062} {"train_loss": -26.97883415222168, "global_step": 586156, "epoch": 7062} {"train_loss": -26.784971237182617, "global_step": 586157, "epoch": 7062} {"train_loss": -27.564868927001953, "global_step": 586158, "epoch": 7062} {"train_loss": -27.452072143554688, "global_step": 586159, "epoch": 7062} {"train_loss": -27.539159774780273, "global_step": 586160, "epoch": 7062} {"train_loss": -27.416391372680664, "global_step": 586161, "epoch": 7062} {"train_loss": -27.320199966430664, "global_step": 586162, "epoch": 7062} {"train_loss": -27.592309951782227, "global_step": 586163, "epoch": 7062} {"train_loss": -27.672388076782227, "global_step": 586164, "epoch": 7062} {"train_loss": -27.735092163085938, "global_step": 586165, "epoch": 7062} {"train_loss": -27.390247344970703, "global_step": 586166, "epoch": 7062} {"train_loss": -27.805540084838867, "global_step": 586167, "epoch": 7062} {"train_loss": -27.744464874267578, "global_step": 586168, "epoch": 7062} {"train_loss": -27.96417808532715, "global_step": 586169, "epoch": 7062} {"train_loss": -27.649555206298828, "global_step": 586170, "epoch": 7062} {"train_loss": -27.755773544311523, "global_step": 586171, "epoch": 7062} {"train_loss": -27.621912002563477, "global_step": 586172, "epoch": 7062} {"train_loss": -27.64545249938965, "global_step": 586173, "epoch": 7062} {"train_loss": -27.6624813079834, "global_step": 586174, "epoch": 7062} {"train_loss": -27.703073501586914, "global_step": 586175, "epoch": 7062} {"train_loss": -27.699743270874023, "global_step": 586176, "epoch": 7062} {"train_loss": -27.770751953125, "global_step": 586177, "epoch": 7062} {"train_loss": -28.184284210205078, "global_step": 586178, "epoch": 7062} {"train_loss": -27.9300537109375, "global_step": 586179, "epoch": 7062} {"train_loss": -27.882801055908203, "global_step": 586180, "epoch": 7062} {"train_loss": -27.68732261657715, "global_step": 586181, "epoch": 7062} {"train_loss": -27.73431968688965, "global_step": 586182, "epoch": 7062} {"train_loss": -27.445661544799805, "global_step": 586183, "epoch": 7062} {"train_loss": -28.204259872436523, "global_step": 586184, "epoch": 7062} {"train_loss": -27.72116470336914, "global_step": 586185, "epoch": 7062} {"train_loss": -27.839574813842773, "global_step": 586186, "epoch": 7062} {"train_loss": -28.064044952392578, "global_step": 586187, "epoch": 7062} {"train_loss": -28.13642692565918, "global_step": 586188, "epoch": 7062} {"train_loss": -28.18743896484375, "global_step": 586189, "epoch": 7062} {"train_loss": -27.72528076171875, "global_step": 586190, "epoch": 7062} {"train_loss": -27.979358673095703, "global_step": 586191, "epoch": 7062} {"train_loss": -28.090635299682617, "global_step": 586192, "epoch": 7062} {"train_loss": -27.89177894592285, "global_step": 586193, "epoch": 7062} {"train_loss": -27.537860870361328, "global_step": 586194, "epoch": 7062} {"train_loss": -27.51738929748535, "global_step": 586195, "epoch": 7062} {"train_loss": -28.273651123046875, "global_step": 586196, "epoch": 7062} {"train_loss": -27.873884201049805, "global_step": 586197, "epoch": 7062} {"train_loss": -28.302154541015625, "global_step": 586198, "epoch": 7062} {"train_loss": -28.011205673217773, "global_step": 586199, "epoch": 7062} {"train_loss": -28.231002807617188, "global_step": 586200, "epoch": 7062} {"train_loss": -28.247629165649414, "global_step": 586201, "epoch": 7062} {"train_loss": -27.7519588470459, "global_step": 586202, "epoch": 7062} {"train_loss": -28.054800033569336, "global_step": 586203, "epoch": 7062} {"train_loss": -27.83500099182129, "global_step": 586204, "epoch": 7062} {"train_loss": -27.786130905151367, "global_step": 586205, "epoch": 7062} {"train_loss": -27.64924430847168, "global_step": 586206, "epoch": 7062} {"train_loss": -27.400304794311523, "global_step": 586207, "epoch": 7062} {"train_loss": -28.067800521850586, "global_step": 586208, "epoch": 7062} {"train_loss": -28.07769203186035, "global_step": 586209, "epoch": 7062} {"train_loss": -27.739103317260742, "global_step": 586210, "epoch": 7062} {"train_loss": -27.817617416381836, "global_step": 586211, "epoch": 7062} {"train_loss": -27.8364200592041, "global_step": 586212, "epoch": 7062} {"train_loss": -27.593097686767578, "global_step": 586213, "epoch": 7062} {"train_loss": -27.8439998626709, "global_step": 586214, "epoch": 7062} {"train_loss": -27.765369415283203, "global_step": 586215, "epoch": 7062} {"train_loss": -28.331466674804688, "global_step": 586216, "epoch": 7062} {"train_loss": -27.965280532836914, "global_step": 586217, "epoch": 7062} {"train_loss": -27.514123916625977, "global_step": 586218, "epoch": 7062} {"train_loss": -27.781064987182617, "global_step": 586219, "epoch": 7062} {"train_loss": -27.54578971862793, "global_step": 586220, "epoch": 7062} {"train_loss": -27.482812881469727, "global_step": 586221, "epoch": 7062} {"train_loss": -27.7725772857666, "global_step": 586222, "epoch": 7062} {"train_loss": -27.775671005249023, "global_step": 586223, "epoch": 7062} {"train_loss": -28.003156661987305, "global_step": 586224, "epoch": 7062} {"train_loss": -27.568695068359375, "global_step": 586225, "epoch": 7062} {"train_loss": -28.135923385620117, "global_step": 586226, "epoch": 7062} {"train_loss": -27.6621036529541, "global_step": 586227, "epoch": 7062} {"train_loss": -27.634183056383247, "global_step": 586228, "epoch": 7062, "val_loss": 6531198.5} {"train_loss": -27.585947036743164, "global_step": 586229, "epoch": 7063} {"train_loss": -27.096837997436523, "global_step": 586230, "epoch": 7063} {"train_loss": -26.765731811523438, "global_step": 586231, "epoch": 7063} {"train_loss": -27.511281967163086, "global_step": 586232, "epoch": 7063} {"train_loss": -27.710371017456055, "global_step": 586233, "epoch": 7063} {"train_loss": -27.4168643951416, "global_step": 586234, "epoch": 7063} {"train_loss": -27.135986328125, "global_step": 586235, "epoch": 7063} {"train_loss": -27.561431884765625, "global_step": 586236, "epoch": 7063} {"train_loss": -27.093753814697266, "global_step": 586237, "epoch": 7063} {"train_loss": -26.962268829345703, "global_step": 586238, "epoch": 7063} {"train_loss": -27.225717544555664, "global_step": 586239, "epoch": 7063} {"train_loss": -27.55938148498535, "global_step": 586240, "epoch": 7063} {"train_loss": -27.3013916015625, "global_step": 586241, "epoch": 7063} {"train_loss": -27.746505737304688, "global_step": 586242, "epoch": 7063} {"train_loss": -27.436660766601562, "global_step": 586243, "epoch": 7063} {"train_loss": -27.585790634155273, "global_step": 586244, "epoch": 7063} {"train_loss": -27.226943969726562, "global_step": 586245, "epoch": 7063} {"train_loss": -27.56206703186035, "global_step": 586246, "epoch": 7063} {"train_loss": -27.842010498046875, "global_step": 586247, "epoch": 7063} {"train_loss": -27.818954467773438, "global_step": 586248, "epoch": 7063} {"train_loss": -27.78898048400879, "global_step": 586249, "epoch": 7063} {"train_loss": -27.841693878173828, "global_step": 586250, "epoch": 7063} {"train_loss": -27.829574584960938, "global_step": 586251, "epoch": 7063} {"train_loss": -27.478687286376953, "global_step": 586252, "epoch": 7063} {"train_loss": -28.127050399780273, "global_step": 586253, "epoch": 7063} {"train_loss": -27.4029541015625, "global_step": 586254, "epoch": 7063} {"train_loss": -27.752660751342773, "global_step": 586255, "epoch": 7063} {"train_loss": -27.9266357421875, "global_step": 586256, "epoch": 7063} {"train_loss": -27.68892478942871, "global_step": 586257, "epoch": 7063} {"train_loss": -27.282257080078125, "global_step": 586258, "epoch": 7063} {"train_loss": -27.849821090698242, "global_step": 586259, "epoch": 7063} {"train_loss": -27.623626708984375, "global_step": 586260, "epoch": 7063} {"train_loss": -27.755661010742188, "global_step": 586261, "epoch": 7063} {"train_loss": -27.689197540283203, "global_step": 586262, "epoch": 7063} {"train_loss": -27.9531192779541, "global_step": 586263, "epoch": 7063} {"train_loss": -27.937170028686523, "global_step": 586264, "epoch": 7063} {"train_loss": -27.639617919921875, "global_step": 586265, "epoch": 7063} {"train_loss": -28.0762996673584, "global_step": 586266, "epoch": 7063} {"train_loss": -27.922590255737305, "global_step": 586267, "epoch": 7063} {"train_loss": -27.772705078125, "global_step": 586268, "epoch": 7063} {"train_loss": -27.824176788330078, "global_step": 586269, "epoch": 7063} {"train_loss": -27.946002960205078, "global_step": 586270, "epoch": 7063} {"train_loss": -27.882986068725586, "global_step": 586271, "epoch": 7063} {"train_loss": -28.086200714111328, "global_step": 586272, "epoch": 7063} {"train_loss": -27.912137985229492, "global_step": 586273, "epoch": 7063} {"train_loss": -28.007415771484375, "global_step": 586274, "epoch": 7063} {"train_loss": -27.53718376159668, "global_step": 586275, "epoch": 7063} {"train_loss": -28.175321578979492, "global_step": 586276, "epoch": 7063} {"train_loss": -27.967252731323242, "global_step": 586277, "epoch": 7063} {"train_loss": -27.93793296813965, "global_step": 586278, "epoch": 7063} {"train_loss": -28.00215721130371, "global_step": 586279, "epoch": 7063} {"train_loss": -28.052326202392578, "global_step": 586280, "epoch": 7063} {"train_loss": -28.394927978515625, "global_step": 586281, "epoch": 7063} {"train_loss": -28.411741256713867, "global_step": 586282, "epoch": 7063} {"train_loss": -28.089263916015625, "global_step": 586283, "epoch": 7063} {"train_loss": -28.190942764282227, "global_step": 586284, "epoch": 7063} {"train_loss": -28.010034561157227, "global_step": 586285, "epoch": 7063} {"train_loss": -28.168659210205078, "global_step": 586286, "epoch": 7063} {"train_loss": -28.150760650634766, "global_step": 586287, "epoch": 7063} {"train_loss": -28.034040451049805, "global_step": 586288, "epoch": 7063} {"train_loss": -27.884153366088867, "global_step": 586289, "epoch": 7063} {"train_loss": -27.5006046295166, "global_step": 586290, "epoch": 7063} {"train_loss": -27.827259063720703, "global_step": 586291, "epoch": 7063} {"train_loss": -27.946317672729492, "global_step": 586292, "epoch": 7063} {"train_loss": -27.95623779296875, "global_step": 586293, "epoch": 7063} {"train_loss": -28.029088973999023, "global_step": 586294, "epoch": 7063} {"train_loss": -27.391605377197266, "global_step": 586295, "epoch": 7063} {"train_loss": -27.66767692565918, "global_step": 586296, "epoch": 7063} {"train_loss": -28.234283447265625, "global_step": 586297, "epoch": 7063} {"train_loss": -27.874723434448242, "global_step": 586298, "epoch": 7063} {"train_loss": -28.095434188842773, "global_step": 586299, "epoch": 7063} {"train_loss": -27.921186447143555, "global_step": 586300, "epoch": 7063} {"train_loss": -27.45166015625, "global_step": 586301, "epoch": 7063} {"train_loss": -28.0963191986084, "global_step": 586302, "epoch": 7063} {"train_loss": -28.094970703125, "global_step": 586303, "epoch": 7063} {"train_loss": -27.857807159423828, "global_step": 586304, "epoch": 7063} {"train_loss": -28.132184982299805, "global_step": 586305, "epoch": 7063} {"train_loss": -27.655841827392578, "global_step": 586306, "epoch": 7063} {"train_loss": -27.838424682617188, "global_step": 586307, "epoch": 7063} {"train_loss": -28.10805320739746, "global_step": 586308, "epoch": 7063} {"train_loss": -27.82553482055664, "global_step": 586309, "epoch": 7063} {"train_loss": -27.97344970703125, "global_step": 586310, "epoch": 7063} {"train_loss": -27.780145254479834, "global_step": 586311, "epoch": 7063, "val_loss": 6510363.5} {"train_loss": -26.885833740234375, "global_step": 586312, "epoch": 7064} {"train_loss": -26.150339126586914, "global_step": 586313, "epoch": 7064} {"train_loss": -26.562726974487305, "global_step": 586314, "epoch": 7064} {"train_loss": -26.19330406188965, "global_step": 586315, "epoch": 7064} {"train_loss": -27.075275421142578, "global_step": 586316, "epoch": 7064} {"train_loss": -26.504552841186523, "global_step": 586317, "epoch": 7064} {"train_loss": -26.97708511352539, "global_step": 586318, "epoch": 7064} {"train_loss": -26.745264053344727, "global_step": 586319, "epoch": 7064} {"train_loss": -26.81402015686035, "global_step": 586320, "epoch": 7064} {"train_loss": -26.95830726623535, "global_step": 586321, "epoch": 7064} {"train_loss": -27.090784072875977, "global_step": 586322, "epoch": 7064} {"train_loss": -26.861774444580078, "global_step": 586323, "epoch": 7064} {"train_loss": -27.295881271362305, "global_step": 586324, "epoch": 7064} {"train_loss": -27.326984405517578, "global_step": 586325, "epoch": 7064} {"train_loss": -27.242223739624023, "global_step": 586326, "epoch": 7064} {"train_loss": -27.185260772705078, "global_step": 586327, "epoch": 7064} {"train_loss": -27.506885528564453, "global_step": 586328, "epoch": 7064} {"train_loss": -27.58201026916504, "global_step": 586329, "epoch": 7064} {"train_loss": -27.727344512939453, "global_step": 586330, "epoch": 7064} {"train_loss": -27.723892211914062, "global_step": 586331, "epoch": 7064} {"train_loss": -27.691919326782227, "global_step": 586332, "epoch": 7064} {"train_loss": -27.359472274780273, "global_step": 586333, "epoch": 7064} {"train_loss": -27.72881507873535, "global_step": 586334, "epoch": 7064} {"train_loss": -27.69099235534668, "global_step": 586335, "epoch": 7064} {"train_loss": -27.820520401000977, "global_step": 586336, "epoch": 7064} {"train_loss": -27.777587890625, "global_step": 586337, "epoch": 7064} {"train_loss": -27.55092430114746, "global_step": 586338, "epoch": 7064} {"train_loss": -27.52247428894043, "global_step": 586339, "epoch": 7064} {"train_loss": -27.8159236907959, "global_step": 586340, "epoch": 7064} {"train_loss": -28.071496963500977, "global_step": 586341, "epoch": 7064} {"train_loss": -27.927947998046875, "global_step": 586342, "epoch": 7064} {"train_loss": -27.92292594909668, "global_step": 586343, "epoch": 7064} {"train_loss": -27.7626895904541, "global_step": 586344, "epoch": 7064} {"train_loss": -27.822296142578125, "global_step": 586345, "epoch": 7064} {"train_loss": -27.940317153930664, "global_step": 586346, "epoch": 7064} {"train_loss": -27.9342041015625, "global_step": 586347, "epoch": 7064} {"train_loss": -27.602619171142578, "global_step": 586348, "epoch": 7064} {"train_loss": -27.908536911010742, "global_step": 586349, "epoch": 7064} {"train_loss": -27.719451904296875, "global_step": 586350, "epoch": 7064} {"train_loss": -27.819793701171875, "global_step": 586351, "epoch": 7064} {"train_loss": -27.76401138305664, "global_step": 586352, "epoch": 7064} {"train_loss": -27.872268676757812, "global_step": 586353, "epoch": 7064} {"train_loss": -28.00152587890625, "global_step": 586354, "epoch": 7064} {"train_loss": -28.207700729370117, "global_step": 586355, "epoch": 7064} {"train_loss": -27.84205436706543, "global_step": 586356, "epoch": 7064} {"train_loss": -28.061359405517578, "global_step": 586357, "epoch": 7064} {"train_loss": -28.426727294921875, "global_step": 586358, "epoch": 7064} {"train_loss": -28.1386661529541, "global_step": 586359, "epoch": 7064} {"train_loss": -28.044387817382812, "global_step": 586360, "epoch": 7064} {"train_loss": -28.338281631469727, "global_step": 586361, "epoch": 7064} {"train_loss": -27.838937759399414, "global_step": 586362, "epoch": 7064} {"train_loss": -27.965656280517578, "global_step": 586363, "epoch": 7064} {"train_loss": -28.221343994140625, "global_step": 586364, "epoch": 7064} {"train_loss": -28.029218673706055, "global_step": 586365, "epoch": 7064} {"train_loss": -28.042205810546875, "global_step": 586366, "epoch": 7064} {"train_loss": -28.429113388061523, "global_step": 586367, "epoch": 7064} {"train_loss": -28.31013298034668, "global_step": 586368, "epoch": 7064} {"train_loss": -28.2658748626709, "global_step": 586369, "epoch": 7064} {"train_loss": -28.247343063354492, "global_step": 586370, "epoch": 7064} {"train_loss": -28.56439208984375, "global_step": 586371, "epoch": 7064} {"train_loss": -28.311620712280273, "global_step": 586372, "epoch": 7064} {"train_loss": -28.146591186523438, "global_step": 586373, "epoch": 7064} {"train_loss": -28.39728355407715, "global_step": 586374, "epoch": 7064} {"train_loss": -28.01641273498535, "global_step": 586375, "epoch": 7064} {"train_loss": -28.12977409362793, "global_step": 586376, "epoch": 7064} {"train_loss": -28.20703125, "global_step": 586377, "epoch": 7064} {"train_loss": -27.875202178955078, "global_step": 586378, "epoch": 7064} {"train_loss": -27.662931442260742, "global_step": 586379, "epoch": 7064} {"train_loss": -27.121244430541992, "global_step": 586380, "epoch": 7064} {"train_loss": -26.513303756713867, "global_step": 586381, "epoch": 7064} {"train_loss": -25.668689727783203, "global_step": 586382, "epoch": 7064} {"train_loss": -25.747055053710938, "global_step": 586383, "epoch": 7064} {"train_loss": -27.271764755249023, "global_step": 586384, "epoch": 7064} {"train_loss": -26.7291259765625, "global_step": 586385, "epoch": 7064} {"train_loss": -27.621479034423828, "global_step": 586386, "epoch": 7064} {"train_loss": -26.7009220123291, "global_step": 586387, "epoch": 7064} {"train_loss": -28.2652645111084, "global_step": 586388, "epoch": 7064} {"train_loss": -27.411218643188477, "global_step": 586389, "epoch": 7064} {"train_loss": -27.644575119018555, "global_step": 586390, "epoch": 7064} {"train_loss": -27.517866134643555, "global_step": 586391, "epoch": 7064} {"train_loss": -27.029645919799805, "global_step": 586392, "epoch": 7064} {"train_loss": -27.22482681274414, "global_step": 586393, "epoch": 7064} {"train_loss": -27.58256061967597, "global_step": 586394, "epoch": 7064, "val_loss": 6567032.0} {"train_loss": -27.134389877319336, "global_step": 586395, "epoch": 7065} {"train_loss": -27.75095558166504, "global_step": 586396, "epoch": 7065} {"train_loss": -27.331623077392578, "global_step": 586397, "epoch": 7065} {"train_loss": -27.138751983642578, "global_step": 586398, "epoch": 7065} {"train_loss": -26.90021324157715, "global_step": 586399, "epoch": 7065} {"train_loss": -27.24305534362793, "global_step": 586400, "epoch": 7065} {"train_loss": -26.327062606811523, "global_step": 586401, "epoch": 7065} {"train_loss": -27.79510498046875, "global_step": 586402, "epoch": 7065} {"train_loss": -27.071533203125, "global_step": 586403, "epoch": 7065} {"train_loss": -28.112287521362305, "global_step": 586404, "epoch": 7065} {"train_loss": -27.172407150268555, "global_step": 586405, "epoch": 7065} {"train_loss": -27.231327056884766, "global_step": 586406, "epoch": 7065} {"train_loss": -27.20014762878418, "global_step": 586407, "epoch": 7065} {"train_loss": -27.216766357421875, "global_step": 586408, "epoch": 7065} {"train_loss": -27.466327667236328, "global_step": 586409, "epoch": 7065} {"train_loss": -26.92970085144043, "global_step": 586410, "epoch": 7065} {"train_loss": -27.369495391845703, "global_step": 586411, "epoch": 7065} {"train_loss": -27.543394088745117, "global_step": 586412, "epoch": 7065} {"train_loss": -27.510812759399414, "global_step": 586413, "epoch": 7065} {"train_loss": -27.833356857299805, "global_step": 586414, "epoch": 7065} {"train_loss": -27.74675941467285, "global_step": 586415, "epoch": 7065} {"train_loss": -27.58884620666504, "global_step": 586416, "epoch": 7065} {"train_loss": -27.31598472595215, "global_step": 586417, "epoch": 7065} {"train_loss": -27.7304630279541, "global_step": 586418, "epoch": 7065} {"train_loss": -27.52882194519043, "global_step": 586419, "epoch": 7065} {"train_loss": -27.53949546813965, "global_step": 586420, "epoch": 7065} {"train_loss": -27.880842208862305, "global_step": 586421, "epoch": 7065} {"train_loss": -27.627145767211914, "global_step": 586422, "epoch": 7065} {"train_loss": -28.276092529296875, "global_step": 586423, "epoch": 7065} {"train_loss": -27.513147354125977, "global_step": 586424, "epoch": 7065} {"train_loss": -27.8964900970459, "global_step": 586425, "epoch": 7065} {"train_loss": -27.598295211791992, "global_step": 586426, "epoch": 7065} {"train_loss": -28.262548446655273, "global_step": 586427, "epoch": 7065} {"train_loss": -28.25772476196289, "global_step": 586428, "epoch": 7065} {"train_loss": -27.93497657775879, "global_step": 586429, "epoch": 7065} {"train_loss": -27.882299423217773, "global_step": 586430, "epoch": 7065} {"train_loss": -28.054059982299805, "global_step": 586431, "epoch": 7065} {"train_loss": -27.950963973999023, "global_step": 586432, "epoch": 7065} {"train_loss": -27.80848503112793, "global_step": 586433, "epoch": 7065} {"train_loss": -27.719160079956055, "global_step": 586434, "epoch": 7065} {"train_loss": -28.038644790649414, "global_step": 586435, "epoch": 7065} {"train_loss": -27.75092887878418, "global_step": 586436, "epoch": 7065} {"train_loss": -27.55817985534668, "global_step": 586437, "epoch": 7065} {"train_loss": -28.339223861694336, "global_step": 586438, "epoch": 7065} {"train_loss": -27.55350685119629, "global_step": 586439, "epoch": 7065} {"train_loss": -27.876596450805664, "global_step": 586440, "epoch": 7065} {"train_loss": -28.1973876953125, "global_step": 586441, "epoch": 7065} {"train_loss": -27.854711532592773, "global_step": 586442, "epoch": 7065} {"train_loss": -27.918903350830078, "global_step": 586443, "epoch": 7065} {"train_loss": -27.4980411529541, "global_step": 586444, "epoch": 7065} {"train_loss": -28.05124282836914, "global_step": 586445, "epoch": 7065} {"train_loss": -27.853498458862305, "global_step": 586446, "epoch": 7065} {"train_loss": -27.85285758972168, "global_step": 586447, "epoch": 7065} {"train_loss": -28.104642868041992, "global_step": 586448, "epoch": 7065} {"train_loss": -27.776874542236328, "global_step": 586449, "epoch": 7065} {"train_loss": -27.987585067749023, "global_step": 586450, "epoch": 7065} {"train_loss": -28.108051300048828, "global_step": 586451, "epoch": 7065} {"train_loss": -27.95087242126465, "global_step": 586452, "epoch": 7065} {"train_loss": -27.834569931030273, "global_step": 586453, "epoch": 7065} {"train_loss": -27.798192977905273, "global_step": 586454, "epoch": 7065} {"train_loss": -27.919626235961914, "global_step": 586455, "epoch": 7065} {"train_loss": -28.05454444885254, "global_step": 586456, "epoch": 7065} {"train_loss": -27.7370662689209, "global_step": 586457, "epoch": 7065} {"train_loss": -28.006250381469727, "global_step": 586458, "epoch": 7065} {"train_loss": -27.56355094909668, "global_step": 586459, "epoch": 7065} {"train_loss": -28.305997848510742, "global_step": 586460, "epoch": 7065} {"train_loss": -28.010778427124023, "global_step": 586461, "epoch": 7065} {"train_loss": -27.235153198242188, "global_step": 586462, "epoch": 7065} {"train_loss": -27.675168991088867, "global_step": 586463, "epoch": 7065} {"train_loss": -28.063207626342773, "global_step": 586464, "epoch": 7065} {"train_loss": -27.879865646362305, "global_step": 586465, "epoch": 7065} {"train_loss": -27.743127822875977, "global_step": 586466, "epoch": 7065} {"train_loss": -27.848876953125, "global_step": 586467, "epoch": 7065} {"train_loss": -27.798465728759766, "global_step": 586468, "epoch": 7065} {"train_loss": -27.729816436767578, "global_step": 586469, "epoch": 7065} {"train_loss": -27.58268165588379, "global_step": 586470, "epoch": 7065} {"train_loss": -28.311796188354492, "global_step": 586471, "epoch": 7065} {"train_loss": -27.55454444885254, "global_step": 586472, "epoch": 7065} {"train_loss": -28.404926300048828, "global_step": 586473, "epoch": 7065} {"train_loss": -27.98836326599121, "global_step": 586474, "epoch": 7065} {"train_loss": -28.0787353515625, "global_step": 586475, "epoch": 7065} {"train_loss": -27.700769424438477, "global_step": 586476, "epoch": 7065} {"train_loss": -27.73020236463432, "global_step": 586477, "epoch": 7065, "val_loss": 6545953.0} {"train_loss": -27.818647384643555, "global_step": 586478, "epoch": 7066} {"train_loss": -27.44478416442871, "global_step": 586479, "epoch": 7066} {"train_loss": -27.556188583374023, "global_step": 586480, "epoch": 7066} {"train_loss": -27.26374626159668, "global_step": 586481, "epoch": 7066} {"train_loss": -27.457244873046875, "global_step": 586482, "epoch": 7066} {"train_loss": -27.318592071533203, "global_step": 586483, "epoch": 7066} {"train_loss": -27.29154396057129, "global_step": 586484, "epoch": 7066} {"train_loss": -27.489660263061523, "global_step": 586485, "epoch": 7066} {"train_loss": -27.73834228515625, "global_step": 586486, "epoch": 7066} {"train_loss": -27.351367950439453, "global_step": 586487, "epoch": 7066} {"train_loss": -27.61370277404785, "global_step": 586488, "epoch": 7066} {"train_loss": -27.808273315429688, "global_step": 586489, "epoch": 7066} {"train_loss": -27.8475341796875, "global_step": 586490, "epoch": 7066} {"train_loss": -27.88629150390625, "global_step": 586491, "epoch": 7066} {"train_loss": -28.029428482055664, "global_step": 586492, "epoch": 7066} {"train_loss": -27.646015167236328, "global_step": 586493, "epoch": 7066} {"train_loss": -27.69659423828125, "global_step": 586494, "epoch": 7066} {"train_loss": -27.674396514892578, "global_step": 586495, "epoch": 7066} {"train_loss": -27.9716796875, "global_step": 586496, "epoch": 7066} {"train_loss": -27.45704460144043, "global_step": 586497, "epoch": 7066} {"train_loss": -27.72454261779785, "global_step": 586498, "epoch": 7066} {"train_loss": -27.961257934570312, "global_step": 586499, "epoch": 7066} {"train_loss": -27.66632080078125, "global_step": 586500, "epoch": 7066} {"train_loss": -27.78204917907715, "global_step": 586501, "epoch": 7066} {"train_loss": -27.599225997924805, "global_step": 586502, "epoch": 7066} {"train_loss": -28.163572311401367, "global_step": 586503, "epoch": 7066} {"train_loss": -27.886526107788086, "global_step": 586504, "epoch": 7066} {"train_loss": -27.72463035583496, "global_step": 586505, "epoch": 7066} {"train_loss": -27.9105281829834, "global_step": 586506, "epoch": 7066} {"train_loss": -27.674482345581055, "global_step": 586507, "epoch": 7066} {"train_loss": -28.413532257080078, "global_step": 586508, "epoch": 7066} {"train_loss": -28.117597579956055, "global_step": 586509, "epoch": 7066} {"train_loss": -27.759784698486328, "global_step": 586510, "epoch": 7066} {"train_loss": -27.836273193359375, "global_step": 586511, "epoch": 7066} {"train_loss": -28.034589767456055, "global_step": 586512, "epoch": 7066} {"train_loss": -28.30263328552246, "global_step": 586513, "epoch": 7066} {"train_loss": -28.044010162353516, "global_step": 586514, "epoch": 7066} {"train_loss": -28.02943992614746, "global_step": 586515, "epoch": 7066} {"train_loss": -27.884794235229492, "global_step": 586516, "epoch": 7066} {"train_loss": -28.269519805908203, "global_step": 586517, "epoch": 7066} {"train_loss": -28.014768600463867, "global_step": 586518, "epoch": 7066} {"train_loss": -27.92323875427246, "global_step": 586519, "epoch": 7066} {"train_loss": -28.07484245300293, "global_step": 586520, "epoch": 7066} {"train_loss": -27.750080108642578, "global_step": 586521, "epoch": 7066} {"train_loss": -27.749027252197266, "global_step": 586522, "epoch": 7066} {"train_loss": -28.154220581054688, "global_step": 586523, "epoch": 7066} {"train_loss": -27.7934513092041, "global_step": 586524, "epoch": 7066} {"train_loss": -27.67669105529785, "global_step": 586525, "epoch": 7066} {"train_loss": -28.103967666625977, "global_step": 586526, "epoch": 7066} {"train_loss": -28.328760147094727, "global_step": 586527, "epoch": 7066} {"train_loss": -27.902118682861328, "global_step": 586528, "epoch": 7066} {"train_loss": -28.187225341796875, "global_step": 586529, "epoch": 7066} {"train_loss": -27.6824893951416, "global_step": 586530, "epoch": 7066} {"train_loss": -27.657806396484375, "global_step": 586531, "epoch": 7066} {"train_loss": -27.975879669189453, "global_step": 586532, "epoch": 7066} {"train_loss": -28.2793025970459, "global_step": 586533, "epoch": 7066} {"train_loss": -27.733173370361328, "global_step": 586534, "epoch": 7066} {"train_loss": -28.176523208618164, "global_step": 586535, "epoch": 7066} {"train_loss": -27.778091430664062, "global_step": 586536, "epoch": 7066} {"train_loss": -28.088001251220703, "global_step": 586537, "epoch": 7066} {"train_loss": -27.998037338256836, "global_step": 586538, "epoch": 7066} {"train_loss": -28.201032638549805, "global_step": 586539, "epoch": 7066} {"train_loss": -28.033262252807617, "global_step": 586540, "epoch": 7066} {"train_loss": -28.037139892578125, "global_step": 586541, "epoch": 7066} {"train_loss": -27.9444522857666, "global_step": 586542, "epoch": 7066} {"train_loss": -28.29570960998535, "global_step": 586543, "epoch": 7066} {"train_loss": -27.877431869506836, "global_step": 586544, "epoch": 7066} {"train_loss": -27.52738380432129, "global_step": 586545, "epoch": 7066} {"train_loss": -27.469797134399414, "global_step": 586546, "epoch": 7066} {"train_loss": -27.92267417907715, "global_step": 586547, "epoch": 7066} {"train_loss": -27.73089599609375, "global_step": 586548, "epoch": 7066} {"train_loss": -27.427366256713867, "global_step": 586549, "epoch": 7066} {"train_loss": -28.13861656188965, "global_step": 586550, "epoch": 7066} {"train_loss": -27.7072696685791, "global_step": 586551, "epoch": 7066} {"train_loss": -27.772659301757812, "global_step": 586552, "epoch": 7066} {"train_loss": -27.643238067626953, "global_step": 586553, "epoch": 7066} {"train_loss": -27.79652214050293, "global_step": 586554, "epoch": 7066} {"train_loss": -27.970319747924805, "global_step": 586555, "epoch": 7066} {"train_loss": -27.965652465820312, "global_step": 586556, "epoch": 7066} {"train_loss": -27.836706161499023, "global_step": 586557, "epoch": 7066} {"train_loss": -27.879074096679688, "global_step": 586558, "epoch": 7066} {"train_loss": -27.81396484375, "global_step": 586559, "epoch": 7066} {"train_loss": -27.84426659273814, "global_step": 586560, "epoch": 7066, "val_loss": 6490523.0} {"train_loss": -26.44087028503418, "global_step": 586561, "epoch": 7067} {"train_loss": -23.415985107421875, "global_step": 586562, "epoch": 7067} {"train_loss": -25.091413497924805, "global_step": 586563, "epoch": 7067} {"train_loss": -26.858631134033203, "global_step": 586564, "epoch": 7067} {"train_loss": -24.5162353515625, "global_step": 586565, "epoch": 7067} {"train_loss": -27.138708114624023, "global_step": 586566, "epoch": 7067} {"train_loss": -25.672407150268555, "global_step": 586567, "epoch": 7067} {"train_loss": -27.197223663330078, "global_step": 586568, "epoch": 7067} {"train_loss": -26.361371994018555, "global_step": 586569, "epoch": 7067} {"train_loss": -26.473011016845703, "global_step": 586570, "epoch": 7067} {"train_loss": -26.6762638092041, "global_step": 586571, "epoch": 7067} {"train_loss": -27.109479904174805, "global_step": 586572, "epoch": 7067} {"train_loss": -26.475513458251953, "global_step": 586573, "epoch": 7067} {"train_loss": -26.96038246154785, "global_step": 586574, "epoch": 7067} {"train_loss": -26.939422607421875, "global_step": 586575, "epoch": 7067} {"train_loss": -27.18037223815918, "global_step": 586576, "epoch": 7067} {"train_loss": -27.039697647094727, "global_step": 586577, "epoch": 7067} {"train_loss": -26.930204391479492, "global_step": 586578, "epoch": 7067} {"train_loss": -26.794885635375977, "global_step": 586579, "epoch": 7067} {"train_loss": -26.915817260742188, "global_step": 586580, "epoch": 7067} {"train_loss": -27.36234474182129, "global_step": 586581, "epoch": 7067} {"train_loss": -26.865270614624023, "global_step": 586582, "epoch": 7067} {"train_loss": -27.65919303894043, "global_step": 586583, "epoch": 7067} {"train_loss": -27.127395629882812, "global_step": 586584, "epoch": 7067} {"train_loss": -27.372522354125977, "global_step": 586585, "epoch": 7067} {"train_loss": -27.431604385375977, "global_step": 586586, "epoch": 7067} {"train_loss": -27.468957901000977, "global_step": 586587, "epoch": 7067} {"train_loss": -27.137826919555664, "global_step": 586588, "epoch": 7067} {"train_loss": -27.552820205688477, "global_step": 586589, "epoch": 7067} {"train_loss": -27.39008903503418, "global_step": 586590, "epoch": 7067} {"train_loss": -27.503976821899414, "global_step": 586591, "epoch": 7067} {"train_loss": -27.45057487487793, "global_step": 586592, "epoch": 7067} {"train_loss": -27.467071533203125, "global_step": 586593, "epoch": 7067} {"train_loss": -27.730224609375, "global_step": 586594, "epoch": 7067} {"train_loss": -27.704025268554688, "global_step": 586595, "epoch": 7067} {"train_loss": -27.670385360717773, "global_step": 586596, "epoch": 7067} {"train_loss": -27.93678092956543, "global_step": 586597, "epoch": 7067} {"train_loss": -27.921308517456055, "global_step": 586598, "epoch": 7067} {"train_loss": -27.819303512573242, "global_step": 586599, "epoch": 7067} {"train_loss": -28.032440185546875, "global_step": 586600, "epoch": 7067} {"train_loss": -27.54892921447754, "global_step": 586601, "epoch": 7067} {"train_loss": -27.926599502563477, "global_step": 586602, "epoch": 7067} {"train_loss": -28.16489028930664, "global_step": 586603, "epoch": 7067} {"train_loss": -27.544416427612305, "global_step": 586604, "epoch": 7067} {"train_loss": -27.68543815612793, "global_step": 586605, "epoch": 7067} {"train_loss": -27.970657348632812, "global_step": 586606, "epoch": 7067} {"train_loss": -27.96445655822754, "global_step": 586607, "epoch": 7067} {"train_loss": -27.813934326171875, "global_step": 586608, "epoch": 7067} {"train_loss": -28.022947311401367, "global_step": 586609, "epoch": 7067} {"train_loss": -28.045801162719727, "global_step": 586610, "epoch": 7067} {"train_loss": -27.951343536376953, "global_step": 586611, "epoch": 7067} {"train_loss": -28.4031982421875, "global_step": 586612, "epoch": 7067} {"train_loss": -27.805089950561523, "global_step": 586613, "epoch": 7067} {"train_loss": -27.78626823425293, "global_step": 586614, "epoch": 7067} {"train_loss": -28.05987548828125, "global_step": 586615, "epoch": 7067} {"train_loss": -27.872034072875977, "global_step": 586616, "epoch": 7067} {"train_loss": -28.22950553894043, "global_step": 586617, "epoch": 7067} {"train_loss": -27.620563507080078, "global_step": 586618, "epoch": 7067} {"train_loss": -28.24968910217285, "global_step": 586619, "epoch": 7067} {"train_loss": -28.02699089050293, "global_step": 586620, "epoch": 7067} {"train_loss": -28.033483505249023, "global_step": 586621, "epoch": 7067} {"train_loss": -28.243839263916016, "global_step": 586622, "epoch": 7067} {"train_loss": -28.2582950592041, "global_step": 586623, "epoch": 7067} {"train_loss": -28.057111740112305, "global_step": 586624, "epoch": 7067} {"train_loss": -27.714054107666016, "global_step": 586625, "epoch": 7067} {"train_loss": -27.8459529876709, "global_step": 586626, "epoch": 7067} {"train_loss": -27.07468605041504, "global_step": 586627, "epoch": 7067} {"train_loss": -25.812225341796875, "global_step": 586628, "epoch": 7067} {"train_loss": -25.518728256225586, "global_step": 586629, "epoch": 7067} {"train_loss": -27.000598907470703, "global_step": 586630, "epoch": 7067} {"train_loss": -27.108673095703125, "global_step": 586631, "epoch": 7067} {"train_loss": -27.035390853881836, "global_step": 586632, "epoch": 7067} {"train_loss": -26.89093589782715, "global_step": 586633, "epoch": 7067} {"train_loss": -27.1397762298584, "global_step": 586634, "epoch": 7067} {"train_loss": -27.45368003845215, "global_step": 586635, "epoch": 7067} {"train_loss": -27.53895378112793, "global_step": 586636, "epoch": 7067} {"train_loss": -27.10255241394043, "global_step": 586637, "epoch": 7067} {"train_loss": -27.68840980529785, "global_step": 586638, "epoch": 7067} {"train_loss": -27.547399520874023, "global_step": 586639, "epoch": 7067} {"train_loss": -27.806427001953125, "global_step": 586640, "epoch": 7067} {"train_loss": -27.556238174438477, "global_step": 586641, "epoch": 7067} {"train_loss": -27.441125869750977, "global_step": 586642, "epoch": 7067} {"train_loss": -27.302465323942254, "global_step": 586643, "epoch": 7067, "val_loss": 6507126.0} {"train_loss": -26.817493438720703, "global_step": 586644, "epoch": 7068} {"train_loss": -26.640913009643555, "global_step": 586645, "epoch": 7068} {"train_loss": -27.250898361206055, "global_step": 586646, "epoch": 7068} {"train_loss": -27.465280532836914, "global_step": 586647, "epoch": 7068} {"train_loss": -27.23321533203125, "global_step": 586648, "epoch": 7068} {"train_loss": -27.057941436767578, "global_step": 586649, "epoch": 7068} {"train_loss": -27.350311279296875, "global_step": 586650, "epoch": 7068} {"train_loss": -27.5010986328125, "global_step": 586651, "epoch": 7068} {"train_loss": -27.476459503173828, "global_step": 586652, "epoch": 7068} {"train_loss": -27.579702377319336, "global_step": 586653, "epoch": 7068} {"train_loss": -27.33591651916504, "global_step": 586654, "epoch": 7068} {"train_loss": -27.689212799072266, "global_step": 586655, "epoch": 7068} {"train_loss": -27.496692657470703, "global_step": 586656, "epoch": 7068} {"train_loss": -27.327070236206055, "global_step": 586657, "epoch": 7068} {"train_loss": -28.11573600769043, "global_step": 586658, "epoch": 7068} {"train_loss": -27.851062774658203, "global_step": 586659, "epoch": 7068} {"train_loss": -27.63437271118164, "global_step": 586660, "epoch": 7068} {"train_loss": -27.777881622314453, "global_step": 586661, "epoch": 7068} {"train_loss": -27.66713523864746, "global_step": 586662, "epoch": 7068} {"train_loss": -27.56467056274414, "global_step": 586663, "epoch": 7068} {"train_loss": -28.138708114624023, "global_step": 586664, "epoch": 7068} {"train_loss": -27.858076095581055, "global_step": 586665, "epoch": 7068} {"train_loss": -27.831165313720703, "global_step": 586666, "epoch": 7068} {"train_loss": -27.765592575073242, "global_step": 586667, "epoch": 7068} {"train_loss": -27.640060424804688, "global_step": 586668, "epoch": 7068} {"train_loss": -27.898839950561523, "global_step": 586669, "epoch": 7068} {"train_loss": -28.01397705078125, "global_step": 586670, "epoch": 7068} {"train_loss": -27.8400821685791, "global_step": 586671, "epoch": 7068} {"train_loss": -27.7205867767334, "global_step": 586672, "epoch": 7068} {"train_loss": -27.638458251953125, "global_step": 586673, "epoch": 7068} {"train_loss": -27.918487548828125, "global_step": 586674, "epoch": 7068} {"train_loss": -27.874277114868164, "global_step": 586675, "epoch": 7068} {"train_loss": -28.126230239868164, "global_step": 586676, "epoch": 7068} {"train_loss": -28.210540771484375, "global_step": 586677, "epoch": 7068} {"train_loss": -27.838605880737305, "global_step": 586678, "epoch": 7068} {"train_loss": -28.074359893798828, "global_step": 586679, "epoch": 7068} {"train_loss": -28.06184196472168, "global_step": 586680, "epoch": 7068} {"train_loss": -28.131093978881836, "global_step": 586681, "epoch": 7068} {"train_loss": -27.743793487548828, "global_step": 586682, "epoch": 7068} {"train_loss": -28.40361976623535, "global_step": 586683, "epoch": 7068} {"train_loss": -27.99700927734375, "global_step": 586684, "epoch": 7068} {"train_loss": -28.2752685546875, "global_step": 586685, "epoch": 7068} {"train_loss": -28.29140281677246, "global_step": 586686, "epoch": 7068} {"train_loss": -28.261688232421875, "global_step": 586687, "epoch": 7068} {"train_loss": -28.279098510742188, "global_step": 586688, "epoch": 7068} {"train_loss": -27.903888702392578, "global_step": 586689, "epoch": 7068} {"train_loss": -28.197641372680664, "global_step": 586690, "epoch": 7068} {"train_loss": -27.99531364440918, "global_step": 586691, "epoch": 7068} {"train_loss": -28.36801528930664, "global_step": 586692, "epoch": 7068} {"train_loss": -27.93855094909668, "global_step": 586693, "epoch": 7068} {"train_loss": -28.138202667236328, "global_step": 586694, "epoch": 7068} {"train_loss": -28.3669376373291, "global_step": 586695, "epoch": 7068} {"train_loss": -28.404285430908203, "global_step": 586696, "epoch": 7068} {"train_loss": -28.375656127929688, "global_step": 586697, "epoch": 7068} {"train_loss": -28.14858055114746, "global_step": 586698, "epoch": 7068} {"train_loss": -28.088001251220703, "global_step": 586699, "epoch": 7068} {"train_loss": -28.319488525390625, "global_step": 586700, "epoch": 7068} {"train_loss": -28.117185592651367, "global_step": 586701, "epoch": 7068} {"train_loss": -27.74061393737793, "global_step": 586702, "epoch": 7068} {"train_loss": -27.938867568969727, "global_step": 586703, "epoch": 7068} {"train_loss": -28.040891647338867, "global_step": 586704, "epoch": 7068} {"train_loss": -28.085468292236328, "global_step": 586705, "epoch": 7068} {"train_loss": -27.833845138549805, "global_step": 586706, "epoch": 7068} {"train_loss": -27.992645263671875, "global_step": 586707, "epoch": 7068} {"train_loss": -27.990222930908203, "global_step": 586708, "epoch": 7068} {"train_loss": -27.83509635925293, "global_step": 586709, "epoch": 7068} {"train_loss": -27.95745277404785, "global_step": 586710, "epoch": 7068} {"train_loss": -28.177017211914062, "global_step": 586711, "epoch": 7068} {"train_loss": -28.29801368713379, "global_step": 586712, "epoch": 7068} {"train_loss": -27.888952255249023, "global_step": 586713, "epoch": 7068} {"train_loss": -28.1163330078125, "global_step": 586714, "epoch": 7068} {"train_loss": -27.583845138549805, "global_step": 586715, "epoch": 7068} {"train_loss": -28.199743270874023, "global_step": 586716, "epoch": 7068} {"train_loss": -28.091949462890625, "global_step": 586717, "epoch": 7068} {"train_loss": -27.727880477905273, "global_step": 586718, "epoch": 7068} {"train_loss": -28.0462646484375, "global_step": 586719, "epoch": 7068} {"train_loss": -28.046430587768555, "global_step": 586720, "epoch": 7068} {"train_loss": -28.02373695373535, "global_step": 586721, "epoch": 7068} {"train_loss": -28.395538330078125, "global_step": 586722, "epoch": 7068} {"train_loss": -27.96921730041504, "global_step": 586723, "epoch": 7068} {"train_loss": -27.983388900756836, "global_step": 586724, "epoch": 7068} {"train_loss": -27.71344566345215, "global_step": 586725, "epoch": 7068} {"train_loss": -27.906464427350514, "global_step": 586726, "epoch": 7068, "val_loss": 6536406.0} {"train_loss": -27.77945327758789, "global_step": 586727, "epoch": 7069} {"train_loss": -26.12872886657715, "global_step": 586728, "epoch": 7069} {"train_loss": -26.903125762939453, "global_step": 586729, "epoch": 7069} {"train_loss": -27.634862899780273, "global_step": 586730, "epoch": 7069} {"train_loss": -27.105255126953125, "global_step": 586731, "epoch": 7069} {"train_loss": -27.09820556640625, "global_step": 586732, "epoch": 7069} {"train_loss": -27.846723556518555, "global_step": 586733, "epoch": 7069} {"train_loss": -27.41425895690918, "global_step": 586734, "epoch": 7069} {"train_loss": -27.637868881225586, "global_step": 586735, "epoch": 7069} {"train_loss": -27.167160034179688, "global_step": 586736, "epoch": 7069} {"train_loss": -27.310773849487305, "global_step": 586737, "epoch": 7069} {"train_loss": -27.57936668395996, "global_step": 586738, "epoch": 7069} {"train_loss": -27.842370986938477, "global_step": 586739, "epoch": 7069} {"train_loss": -27.97748374938965, "global_step": 586740, "epoch": 7069} {"train_loss": -27.851028442382812, "global_step": 586741, "epoch": 7069} {"train_loss": -27.541534423828125, "global_step": 586742, "epoch": 7069} {"train_loss": -27.85881996154785, "global_step": 586743, "epoch": 7069} {"train_loss": -28.156478881835938, "global_step": 586744, "epoch": 7069} {"train_loss": -27.658597946166992, "global_step": 586745, "epoch": 7069} {"train_loss": -27.96967887878418, "global_step": 586746, "epoch": 7069} {"train_loss": -27.788183212280273, "global_step": 586747, "epoch": 7069} {"train_loss": -27.8808650970459, "global_step": 586748, "epoch": 7069} {"train_loss": -28.033401489257812, "global_step": 586749, "epoch": 7069} {"train_loss": -27.897216796875, "global_step": 586750, "epoch": 7069} {"train_loss": -27.631153106689453, "global_step": 586751, "epoch": 7069} {"train_loss": -27.67292594909668, "global_step": 586752, "epoch": 7069} {"train_loss": -27.78004264831543, "global_step": 586753, "epoch": 7069} {"train_loss": -27.711200714111328, "global_step": 586754, "epoch": 7069} {"train_loss": -28.023401260375977, "global_step": 586755, "epoch": 7069} {"train_loss": -28.33417320251465, "global_step": 586756, "epoch": 7069} {"train_loss": -27.66861343383789, "global_step": 586757, "epoch": 7069} {"train_loss": -27.9127140045166, "global_step": 586758, "epoch": 7069} {"train_loss": -27.64410972595215, "global_step": 586759, "epoch": 7069} {"train_loss": -27.832080841064453, "global_step": 586760, "epoch": 7069} {"train_loss": -27.87214469909668, "global_step": 586761, "epoch": 7069} {"train_loss": -28.020933151245117, "global_step": 586762, "epoch": 7069} {"train_loss": -27.857742309570312, "global_step": 586763, "epoch": 7069} {"train_loss": -28.091718673706055, "global_step": 586764, "epoch": 7069} {"train_loss": -28.22816276550293, "global_step": 586765, "epoch": 7069} {"train_loss": -28.21673583984375, "global_step": 586766, "epoch": 7069} {"train_loss": -28.00884437561035, "global_step": 586767, "epoch": 7069} {"train_loss": -28.193017959594727, "global_step": 586768, "epoch": 7069} {"train_loss": -28.35536766052246, "global_step": 586769, "epoch": 7069} {"train_loss": -27.685596466064453, "global_step": 586770, "epoch": 7069} {"train_loss": -27.89613151550293, "global_step": 586771, "epoch": 7069} {"train_loss": -28.018041610717773, "global_step": 586772, "epoch": 7069} {"train_loss": -27.984262466430664, "global_step": 586773, "epoch": 7069} {"train_loss": -27.891010284423828, "global_step": 586774, "epoch": 7069} {"train_loss": -28.2471866607666, "global_step": 586775, "epoch": 7069} {"train_loss": -27.90242576599121, "global_step": 586776, "epoch": 7069} {"train_loss": -27.76778221130371, "global_step": 586777, "epoch": 7069} {"train_loss": -27.78358268737793, "global_step": 586778, "epoch": 7069} {"train_loss": -27.744298934936523, "global_step": 586779, "epoch": 7069} {"train_loss": -28.168766021728516, "global_step": 586780, "epoch": 7069} {"train_loss": -28.00465202331543, "global_step": 586781, "epoch": 7069} {"train_loss": -28.40839958190918, "global_step": 586782, "epoch": 7069} {"train_loss": -28.053205490112305, "global_step": 586783, "epoch": 7069} {"train_loss": -27.8905029296875, "global_step": 586784, "epoch": 7069} {"train_loss": -27.59210777282715, "global_step": 586785, "epoch": 7069} {"train_loss": -27.7456111907959, "global_step": 586786, "epoch": 7069} {"train_loss": -27.985097885131836, "global_step": 586787, "epoch": 7069} {"train_loss": -28.292810440063477, "global_step": 586788, "epoch": 7069} {"train_loss": -27.96211051940918, "global_step": 586789, "epoch": 7069} {"train_loss": -27.891845703125, "global_step": 586790, "epoch": 7069} {"train_loss": -27.75119972229004, "global_step": 586791, "epoch": 7069} {"train_loss": -28.227294921875, "global_step": 586792, "epoch": 7069} {"train_loss": -28.005477905273438, "global_step": 586793, "epoch": 7069} {"train_loss": -28.045734405517578, "global_step": 586794, "epoch": 7069} {"train_loss": -27.990116119384766, "global_step": 586795, "epoch": 7069} {"train_loss": -28.1058349609375, "global_step": 586796, "epoch": 7069} {"train_loss": -27.90677261352539, "global_step": 586797, "epoch": 7069} {"train_loss": -28.19618797302246, "global_step": 586798, "epoch": 7069} {"train_loss": -28.569305419921875, "global_step": 586799, "epoch": 7069} {"train_loss": -27.903949737548828, "global_step": 586800, "epoch": 7069} {"train_loss": -28.111377716064453, "global_step": 586801, "epoch": 7069} {"train_loss": -28.291473388671875, "global_step": 586802, "epoch": 7069} {"train_loss": -28.048025131225586, "global_step": 586803, "epoch": 7069} {"train_loss": -28.10999870300293, "global_step": 586804, "epoch": 7069} {"train_loss": -28.058340072631836, "global_step": 586805, "epoch": 7069} {"train_loss": -27.980737686157227, "global_step": 586806, "epoch": 7069} {"train_loss": -27.570255279541016, "global_step": 586807, "epoch": 7069} {"train_loss": -26.74820327758789, "global_step": 586808, "epoch": 7069} {"train_loss": -27.81554814993617, "global_step": 586809, "epoch": 7069, "val_loss": 6534113.0} {"train_loss": -25.070560455322266, "global_step": 586810, "epoch": 7070} {"train_loss": -24.472532272338867, "global_step": 586811, "epoch": 7070} {"train_loss": -24.888525009155273, "global_step": 586812, "epoch": 7070} {"train_loss": -24.72922134399414, "global_step": 586813, "epoch": 7070} {"train_loss": -24.565113067626953, "global_step": 586814, "epoch": 7070} {"train_loss": -25.40488052368164, "global_step": 586815, "epoch": 7070} {"train_loss": -25.47822380065918, "global_step": 586816, "epoch": 7070} {"train_loss": -26.19902992248535, "global_step": 586817, "epoch": 7070} {"train_loss": -25.69685173034668, "global_step": 586818, "epoch": 7070} {"train_loss": -25.609235763549805, "global_step": 586819, "epoch": 7070} {"train_loss": -25.405776977539062, "global_step": 586820, "epoch": 7070} {"train_loss": -25.868600845336914, "global_step": 586821, "epoch": 7070} {"train_loss": -25.855365753173828, "global_step": 586822, "epoch": 7070} {"train_loss": -26.32606315612793, "global_step": 586823, "epoch": 7070} {"train_loss": -26.274511337280273, "global_step": 586824, "epoch": 7070} {"train_loss": -26.814294815063477, "global_step": 586825, "epoch": 7070} {"train_loss": -26.735523223876953, "global_step": 586826, "epoch": 7070} {"train_loss": -26.501977920532227, "global_step": 586827, "epoch": 7070} {"train_loss": -26.600255966186523, "global_step": 586828, "epoch": 7070} {"train_loss": -26.60150146484375, "global_step": 586829, "epoch": 7070} {"train_loss": -27.051422119140625, "global_step": 586830, "epoch": 7070} {"train_loss": -26.640838623046875, "global_step": 586831, "epoch": 7070} {"train_loss": -26.625045776367188, "global_step": 586832, "epoch": 7070} {"train_loss": -26.827539443969727, "global_step": 586833, "epoch": 7070} {"train_loss": -26.918012619018555, "global_step": 586834, "epoch": 7070} {"train_loss": -26.962018966674805, "global_step": 586835, "epoch": 7070} {"train_loss": -26.986562728881836, "global_step": 586836, "epoch": 7070} {"train_loss": -26.963043212890625, "global_step": 586837, "epoch": 7070} {"train_loss": -27.103368759155273, "global_step": 586838, "epoch": 7070} {"train_loss": -27.365110397338867, "global_step": 586839, "epoch": 7070} {"train_loss": -27.358448028564453, "global_step": 586840, "epoch": 7070} {"train_loss": -27.320554733276367, "global_step": 586841, "epoch": 7070} {"train_loss": -27.053617477416992, "global_step": 586842, "epoch": 7070} {"train_loss": -27.3999080657959, "global_step": 586843, "epoch": 7070} {"train_loss": -27.2866153717041, "global_step": 586844, "epoch": 7070} {"train_loss": -27.11282730102539, "global_step": 586845, "epoch": 7070} {"train_loss": -27.348005294799805, "global_step": 586846, "epoch": 7070} {"train_loss": -27.393346786499023, "global_step": 586847, "epoch": 7070} {"train_loss": -27.43720054626465, "global_step": 586848, "epoch": 7070} {"train_loss": -27.470991134643555, "global_step": 586849, "epoch": 7070} {"train_loss": -27.230194091796875, "global_step": 586850, "epoch": 7070} {"train_loss": -27.65867042541504, "global_step": 586851, "epoch": 7070} {"train_loss": -27.5118465423584, "global_step": 586852, "epoch": 7070} {"train_loss": -27.52910804748535, "global_step": 586853, "epoch": 7070} {"train_loss": -27.438520431518555, "global_step": 586854, "epoch": 7070} {"train_loss": -27.549779891967773, "global_step": 586855, "epoch": 7070} {"train_loss": -27.31317138671875, "global_step": 586856, "epoch": 7070} {"train_loss": -27.607391357421875, "global_step": 586857, "epoch": 7070} {"train_loss": -27.7845516204834, "global_step": 586858, "epoch": 7070} {"train_loss": -27.34211540222168, "global_step": 586859, "epoch": 7070} {"train_loss": -27.45660972595215, "global_step": 586860, "epoch": 7070} {"train_loss": -27.941160202026367, "global_step": 586861, "epoch": 7070} {"train_loss": -27.643766403198242, "global_step": 586862, "epoch": 7070} {"train_loss": -27.577259063720703, "global_step": 586863, "epoch": 7070} {"train_loss": -27.844486236572266, "global_step": 586864, "epoch": 7070} {"train_loss": -27.539661407470703, "global_step": 586865, "epoch": 7070} {"train_loss": -28.155685424804688, "global_step": 586866, "epoch": 7070} {"train_loss": -27.5684757232666, "global_step": 586867, "epoch": 7070} {"train_loss": -28.0971622467041, "global_step": 586868, "epoch": 7070} {"train_loss": -27.43499183654785, "global_step": 586869, "epoch": 7070} {"train_loss": -28.106603622436523, "global_step": 586870, "epoch": 7070} {"train_loss": -27.734113693237305, "global_step": 586871, "epoch": 7070} {"train_loss": -28.067609786987305, "global_step": 586872, "epoch": 7070} {"train_loss": -27.674970626831055, "global_step": 586873, "epoch": 7070} {"train_loss": -27.787200927734375, "global_step": 586874, "epoch": 7070} {"train_loss": -28.034204483032227, "global_step": 586875, "epoch": 7070} {"train_loss": -28.03500747680664, "global_step": 586876, "epoch": 7070} {"train_loss": -28.070343017578125, "global_step": 586877, "epoch": 7070} {"train_loss": -27.88571548461914, "global_step": 586878, "epoch": 7070} {"train_loss": -28.253503799438477, "global_step": 586879, "epoch": 7070} {"train_loss": -27.815214157104492, "global_step": 586880, "epoch": 7070} {"train_loss": -27.904993057250977, "global_step": 586881, "epoch": 7070} {"train_loss": -27.75674819946289, "global_step": 586882, "epoch": 7070} {"train_loss": -27.913742065429688, "global_step": 586883, "epoch": 7070} {"train_loss": -28.01822280883789, "global_step": 586884, "epoch": 7070} {"train_loss": -28.38397216796875, "global_step": 586885, "epoch": 7070} {"train_loss": -27.940942764282227, "global_step": 586886, "epoch": 7070} {"train_loss": -27.964521408081055, "global_step": 586887, "epoch": 7070} {"train_loss": -27.978729248046875, "global_step": 586888, "epoch": 7070} {"train_loss": -28.0357608795166, "global_step": 586889, "epoch": 7070} {"train_loss": -27.83258628845215, "global_step": 586890, "epoch": 7070} {"train_loss": -27.86459732055664, "global_step": 586891, "epoch": 7070} {"train_loss": -27.141138904065972, "global_step": 586892, "epoch": 7070, "val_loss": 6481594.0} {"train_loss": -27.704450607299805, "global_step": 586893, "epoch": 7071} {"train_loss": -27.608749389648438, "global_step": 586894, "epoch": 7071} {"train_loss": -27.801488876342773, "global_step": 586895, "epoch": 7071} {"train_loss": -27.521299362182617, "global_step": 586896, "epoch": 7071} {"train_loss": -27.703937530517578, "global_step": 586897, "epoch": 7071} {"train_loss": -27.797107696533203, "global_step": 586898, "epoch": 7071} {"train_loss": -27.99176597595215, "global_step": 586899, "epoch": 7071} {"train_loss": -28.170185089111328, "global_step": 586900, "epoch": 7071} {"train_loss": -27.5601749420166, "global_step": 586901, "epoch": 7071} {"train_loss": -27.769567489624023, "global_step": 586902, "epoch": 7071} {"train_loss": -27.890684127807617, "global_step": 586903, "epoch": 7071} {"train_loss": -27.97214126586914, "global_step": 586904, "epoch": 7071} {"train_loss": -27.70293617248535, "global_step": 586905, "epoch": 7071} {"train_loss": -27.408954620361328, "global_step": 586906, "epoch": 7071} {"train_loss": -27.68402099609375, "global_step": 586907, "epoch": 7071} {"train_loss": -28.1829891204834, "global_step": 586908, "epoch": 7071} {"train_loss": -27.649429321289062, "global_step": 586909, "epoch": 7071} {"train_loss": -27.963489532470703, "global_step": 586910, "epoch": 7071} {"train_loss": -27.6993465423584, "global_step": 586911, "epoch": 7071} {"train_loss": -27.810470581054688, "global_step": 586912, "epoch": 7071} {"train_loss": -28.00897216796875, "global_step": 586913, "epoch": 7071} {"train_loss": -27.81351661682129, "global_step": 586914, "epoch": 7071} {"train_loss": -27.926467895507812, "global_step": 586915, "epoch": 7071} {"train_loss": -28.091480255126953, "global_step": 586916, "epoch": 7071} {"train_loss": -28.172992706298828, "global_step": 586917, "epoch": 7071} {"train_loss": -28.08970069885254, "global_step": 586918, "epoch": 7071} {"train_loss": -27.96186637878418, "global_step": 586919, "epoch": 7071} {"train_loss": -27.80647087097168, "global_step": 586920, "epoch": 7071} {"train_loss": -28.225629806518555, "global_step": 586921, "epoch": 7071} {"train_loss": -27.804309844970703, "global_step": 586922, "epoch": 7071} {"train_loss": -28.254840850830078, "global_step": 586923, "epoch": 7071} {"train_loss": -28.03081703186035, "global_step": 586924, "epoch": 7071} {"train_loss": -28.220478057861328, "global_step": 586925, "epoch": 7071} {"train_loss": -28.162750244140625, "global_step": 586926, "epoch": 7071} {"train_loss": -28.131948471069336, "global_step": 586927, "epoch": 7071} {"train_loss": -28.247907638549805, "global_step": 586928, "epoch": 7071} {"train_loss": -28.003620147705078, "global_step": 586929, "epoch": 7071} {"train_loss": -28.140287399291992, "global_step": 586930, "epoch": 7071} {"train_loss": -27.8383731842041, "global_step": 586931, "epoch": 7071} {"train_loss": -28.2923583984375, "global_step": 586932, "epoch": 7071} {"train_loss": -27.91290283203125, "global_step": 586933, "epoch": 7071} {"train_loss": -28.112821578979492, "global_step": 586934, "epoch": 7071} {"train_loss": -27.975244522094727, "global_step": 586935, "epoch": 7071} {"train_loss": -28.278839111328125, "global_step": 586936, "epoch": 7071} {"train_loss": -28.053592681884766, "global_step": 586937, "epoch": 7071} {"train_loss": -28.163482666015625, "global_step": 586938, "epoch": 7071} {"train_loss": -28.095706939697266, "global_step": 586939, "epoch": 7071} {"train_loss": -28.171218872070312, "global_step": 586940, "epoch": 7071} {"train_loss": -28.429059982299805, "global_step": 586941, "epoch": 7071} {"train_loss": -28.137964248657227, "global_step": 586942, "epoch": 7071} {"train_loss": -28.225860595703125, "global_step": 586943, "epoch": 7071} {"train_loss": -27.774627685546875, "global_step": 586944, "epoch": 7071} {"train_loss": -27.85546875, "global_step": 586945, "epoch": 7071} {"train_loss": -27.924955368041992, "global_step": 586946, "epoch": 7071} {"train_loss": -28.370275497436523, "global_step": 586947, "epoch": 7071} {"train_loss": -27.8659610748291, "global_step": 586948, "epoch": 7071} {"train_loss": -28.285192489624023, "global_step": 586949, "epoch": 7071} {"train_loss": -28.43985366821289, "global_step": 586950, "epoch": 7071} {"train_loss": -28.1862850189209, "global_step": 586951, "epoch": 7071} {"train_loss": -28.164703369140625, "global_step": 586952, "epoch": 7071} {"train_loss": -28.11701011657715, "global_step": 586953, "epoch": 7071} {"train_loss": -27.894805908203125, "global_step": 586954, "epoch": 7071} {"train_loss": -27.41114616394043, "global_step": 586955, "epoch": 7071} {"train_loss": -27.06805419921875, "global_step": 586956, "epoch": 7071} {"train_loss": -26.52310562133789, "global_step": 586957, "epoch": 7071} {"train_loss": -26.021039962768555, "global_step": 586958, "epoch": 7071} {"train_loss": -26.46438980102539, "global_step": 586959, "epoch": 7071} {"train_loss": -27.60906410217285, "global_step": 586960, "epoch": 7071} {"train_loss": -26.762359619140625, "global_step": 586961, "epoch": 7071} {"train_loss": -27.284378051757812, "global_step": 586962, "epoch": 7071} {"train_loss": -27.69268798828125, "global_step": 586963, "epoch": 7071} {"train_loss": -27.14545249938965, "global_step": 586964, "epoch": 7071} {"train_loss": -27.393896102905273, "global_step": 586965, "epoch": 7071} {"train_loss": -27.378314971923828, "global_step": 586966, "epoch": 7071} {"train_loss": -28.02241325378418, "global_step": 586967, "epoch": 7071} {"train_loss": -27.7010498046875, "global_step": 586968, "epoch": 7071} {"train_loss": -27.709989547729492, "global_step": 586969, "epoch": 7071} {"train_loss": -27.504199981689453, "global_step": 586970, "epoch": 7071} {"train_loss": -27.4339599609375, "global_step": 586971, "epoch": 7071} {"train_loss": -27.35247802734375, "global_step": 586972, "epoch": 7071} {"train_loss": -27.53790855407715, "global_step": 586973, "epoch": 7071} {"train_loss": -27.820209503173828, "global_step": 586974, "epoch": 7071} {"train_loss": -27.809406602239033, "global_step": 586975, "epoch": 7071, "val_loss": 6532818.5} {"train_loss": -27.858976364135742, "global_step": 586976, "epoch": 7072} {"train_loss": -27.404022216796875, "global_step": 586977, "epoch": 7072} {"train_loss": -27.3768310546875, "global_step": 586978, "epoch": 7072} {"train_loss": -27.436124801635742, "global_step": 586979, "epoch": 7072} {"train_loss": -27.344120025634766, "global_step": 586980, "epoch": 7072} {"train_loss": -27.434362411499023, "global_step": 586981, "epoch": 7072} {"train_loss": -27.397296905517578, "global_step": 586982, "epoch": 7072} {"train_loss": -27.795881271362305, "global_step": 586983, "epoch": 7072} {"train_loss": -27.544599533081055, "global_step": 586984, "epoch": 7072} {"train_loss": -27.6406307220459, "global_step": 586985, "epoch": 7072} {"train_loss": -27.69767189025879, "global_step": 586986, "epoch": 7072} {"train_loss": -27.49810791015625, "global_step": 586987, "epoch": 7072} {"train_loss": -28.1071834564209, "global_step": 586988, "epoch": 7072} {"train_loss": -27.674381256103516, "global_step": 586989, "epoch": 7072} {"train_loss": -27.933063507080078, "global_step": 586990, "epoch": 7072} {"train_loss": -27.78016471862793, "global_step": 586991, "epoch": 7072} {"train_loss": -27.5587158203125, "global_step": 586992, "epoch": 7072} {"train_loss": -28.085041046142578, "global_step": 586993, "epoch": 7072} {"train_loss": -27.65736961364746, "global_step": 586994, "epoch": 7072} {"train_loss": -28.04749870300293, "global_step": 586995, "epoch": 7072} {"train_loss": -27.8554744720459, "global_step": 586996, "epoch": 7072} {"train_loss": -27.941974639892578, "global_step": 586997, "epoch": 7072} {"train_loss": -27.910568237304688, "global_step": 586998, "epoch": 7072} {"train_loss": -27.440412521362305, "global_step": 586999, "epoch": 7072} {"train_loss": -27.939233779907227, "global_step": 587000, "epoch": 7072} {"train_loss": -28.221759796142578, "global_step": 587001, "epoch": 7072} {"train_loss": -27.70745277404785, "global_step": 587002, "epoch": 7072} {"train_loss": -27.75239372253418, "global_step": 587003, "epoch": 7072} {"train_loss": -28.2016544342041, "global_step": 587004, "epoch": 7072} {"train_loss": -27.494644165039062, "global_step": 587005, "epoch": 7072} {"train_loss": -28.15863037109375, "global_step": 587006, "epoch": 7072} {"train_loss": -27.988544464111328, "global_step": 587007, "epoch": 7072} {"train_loss": -28.329914093017578, "global_step": 587008, "epoch": 7072} {"train_loss": -27.91046142578125, "global_step": 587009, "epoch": 7072} {"train_loss": -27.71979331970215, "global_step": 587010, "epoch": 7072} {"train_loss": -28.056161880493164, "global_step": 587011, "epoch": 7072} {"train_loss": -28.23982048034668, "global_step": 587012, "epoch": 7072} {"train_loss": -28.270666122436523, "global_step": 587013, "epoch": 7072} {"train_loss": -28.08286476135254, "global_step": 587014, "epoch": 7072} {"train_loss": -27.925296783447266, "global_step": 587015, "epoch": 7072} {"train_loss": -28.334569931030273, "global_step": 587016, "epoch": 7072} {"train_loss": -28.08870506286621, "global_step": 587017, "epoch": 7072} {"train_loss": -27.607282638549805, "global_step": 587018, "epoch": 7072} {"train_loss": -27.85736656188965, "global_step": 587019, "epoch": 7072} {"train_loss": -27.65065574645996, "global_step": 587020, "epoch": 7072} {"train_loss": -28.059110641479492, "global_step": 587021, "epoch": 7072} {"train_loss": -27.980310440063477, "global_step": 587022, "epoch": 7072} {"train_loss": -27.1809024810791, "global_step": 587023, "epoch": 7072} {"train_loss": -26.545703887939453, "global_step": 587024, "epoch": 7072} {"train_loss": -27.570398330688477, "global_step": 587025, "epoch": 7072} {"train_loss": -28.296884536743164, "global_step": 587026, "epoch": 7072} {"train_loss": -27.53249168395996, "global_step": 587027, "epoch": 7072} {"train_loss": -27.90688133239746, "global_step": 587028, "epoch": 7072} {"train_loss": -28.05014419555664, "global_step": 587029, "epoch": 7072} {"train_loss": -27.900983810424805, "global_step": 587030, "epoch": 7072} {"train_loss": -27.418720245361328, "global_step": 587031, "epoch": 7072} {"train_loss": -27.15838623046875, "global_step": 587032, "epoch": 7072} {"train_loss": -27.930585861206055, "global_step": 587033, "epoch": 7072} {"train_loss": -27.448949813842773, "global_step": 587034, "epoch": 7072} {"train_loss": -27.85927391052246, "global_step": 587035, "epoch": 7072} {"train_loss": -27.53412437438965, "global_step": 587036, "epoch": 7072} {"train_loss": -27.72966957092285, "global_step": 587037, "epoch": 7072} {"train_loss": -27.67280387878418, "global_step": 587038, "epoch": 7072} {"train_loss": -27.8388671875, "global_step": 587039, "epoch": 7072} {"train_loss": -27.817747116088867, "global_step": 587040, "epoch": 7072} {"train_loss": -27.879419326782227, "global_step": 587041, "epoch": 7072} {"train_loss": -27.9129638671875, "global_step": 587042, "epoch": 7072} {"train_loss": -27.6018009185791, "global_step": 587043, "epoch": 7072} {"train_loss": -28.053205490112305, "global_step": 587044, "epoch": 7072} {"train_loss": -27.767261505126953, "global_step": 587045, "epoch": 7072} {"train_loss": -27.910572052001953, "global_step": 587046, "epoch": 7072} {"train_loss": -27.6884765625, "global_step": 587047, "epoch": 7072} {"train_loss": -27.840225219726562, "global_step": 587048, "epoch": 7072} {"train_loss": -27.70075035095215, "global_step": 587049, "epoch": 7072} {"train_loss": -27.896289825439453, "global_step": 587050, "epoch": 7072} {"train_loss": -27.997480392456055, "global_step": 587051, "epoch": 7072} {"train_loss": -27.65736198425293, "global_step": 587052, "epoch": 7072} {"train_loss": -28.377796173095703, "global_step": 587053, "epoch": 7072} {"train_loss": -27.802881240844727, "global_step": 587054, "epoch": 7072} {"train_loss": -27.563589096069336, "global_step": 587055, "epoch": 7072} {"train_loss": -27.96375846862793, "global_step": 587056, "epoch": 7072} {"train_loss": -27.9505672454834, "global_step": 587057, "epoch": 7072} {"train_loss": -27.80414232001247, "global_step": 587058, "epoch": 7072, "val_loss": 6561076.0} {"train_loss": -26.447092056274414, "global_step": 587059, "epoch": 7073} {"train_loss": -27.193830490112305, "global_step": 587060, "epoch": 7073} {"train_loss": -27.85796546936035, "global_step": 587061, "epoch": 7073} {"train_loss": -26.684040069580078, "global_step": 587062, "epoch": 7073} {"train_loss": -26.669260025024414, "global_step": 587063, "epoch": 7073} {"train_loss": -26.699737548828125, "global_step": 587064, "epoch": 7073} {"train_loss": -26.79317283630371, "global_step": 587065, "epoch": 7073} {"train_loss": -27.265674591064453, "global_step": 587066, "epoch": 7073} {"train_loss": -27.0124454498291, "global_step": 587067, "epoch": 7073} {"train_loss": -27.441089630126953, "global_step": 587068, "epoch": 7073} {"train_loss": -27.719573974609375, "global_step": 587069, "epoch": 7073} {"train_loss": -27.010400772094727, "global_step": 587070, "epoch": 7073} {"train_loss": -27.1107120513916, "global_step": 587071, "epoch": 7073} {"train_loss": -27.474842071533203, "global_step": 587072, "epoch": 7073} {"train_loss": -27.410165786743164, "global_step": 587073, "epoch": 7073} {"train_loss": -26.80438232421875, "global_step": 587074, "epoch": 7073} {"train_loss": -27.413665771484375, "global_step": 587075, "epoch": 7073} {"train_loss": -27.57333755493164, "global_step": 587076, "epoch": 7073} {"train_loss": -27.42917251586914, "global_step": 587077, "epoch": 7073} {"train_loss": -27.687030792236328, "global_step": 587078, "epoch": 7073} {"train_loss": -27.66570472717285, "global_step": 587079, "epoch": 7073} {"train_loss": -27.605514526367188, "global_step": 587080, "epoch": 7073} {"train_loss": -27.560781478881836, "global_step": 587081, "epoch": 7073} {"train_loss": -27.540973663330078, "global_step": 587082, "epoch": 7073} {"train_loss": -27.467737197875977, "global_step": 587083, "epoch": 7073} {"train_loss": -27.672321319580078, "global_step": 587084, "epoch": 7073} {"train_loss": -27.849206924438477, "global_step": 587085, "epoch": 7073} {"train_loss": -27.37679100036621, "global_step": 587086, "epoch": 7073} {"train_loss": -27.769062042236328, "global_step": 587087, "epoch": 7073} {"train_loss": -27.67877769470215, "global_step": 587088, "epoch": 7073} {"train_loss": -28.038375854492188, "global_step": 587089, "epoch": 7073} {"train_loss": -27.655059814453125, "global_step": 587090, "epoch": 7073} {"train_loss": -27.728260040283203, "global_step": 587091, "epoch": 7073} {"train_loss": -27.915084838867188, "global_step": 587092, "epoch": 7073} {"train_loss": -27.77597999572754, "global_step": 587093, "epoch": 7073} {"train_loss": -27.969482421875, "global_step": 587094, "epoch": 7073} {"train_loss": -27.794448852539062, "global_step": 587095, "epoch": 7073} {"train_loss": -27.631637573242188, "global_step": 587096, "epoch": 7073} {"train_loss": -27.994672775268555, "global_step": 587097, "epoch": 7073} {"train_loss": -27.586273193359375, "global_step": 587098, "epoch": 7073} {"train_loss": -28.352270126342773, "global_step": 587099, "epoch": 7073} {"train_loss": -28.105710983276367, "global_step": 587100, "epoch": 7073} {"train_loss": -27.58804702758789, "global_step": 587101, "epoch": 7073} {"train_loss": -27.8916015625, "global_step": 587102, "epoch": 7073} {"train_loss": -28.140649795532227, "global_step": 587103, "epoch": 7073} {"train_loss": -27.694629669189453, "global_step": 587104, "epoch": 7073} {"train_loss": -28.20992088317871, "global_step": 587105, "epoch": 7073} {"train_loss": -28.044031143188477, "global_step": 587106, "epoch": 7073} {"train_loss": -27.692163467407227, "global_step": 587107, "epoch": 7073} {"train_loss": -27.943078994750977, "global_step": 587108, "epoch": 7073} {"train_loss": -28.151010513305664, "global_step": 587109, "epoch": 7073} {"train_loss": -28.253467559814453, "global_step": 587110, "epoch": 7073} {"train_loss": -27.908599853515625, "global_step": 587111, "epoch": 7073} {"train_loss": -28.05216407775879, "global_step": 587112, "epoch": 7073} {"train_loss": -27.770727157592773, "global_step": 587113, "epoch": 7073} {"train_loss": -27.887592315673828, "global_step": 587114, "epoch": 7073} {"train_loss": -27.811567306518555, "global_step": 587115, "epoch": 7073} {"train_loss": -27.65167808532715, "global_step": 587116, "epoch": 7073} {"train_loss": -28.29396629333496, "global_step": 587117, "epoch": 7073} {"train_loss": -27.92510414123535, "global_step": 587118, "epoch": 7073} {"train_loss": -28.137632369995117, "global_step": 587119, "epoch": 7073} {"train_loss": -28.08375358581543, "global_step": 587120, "epoch": 7073} {"train_loss": -28.04665184020996, "global_step": 587121, "epoch": 7073} {"train_loss": -27.9016056060791, "global_step": 587122, "epoch": 7073} {"train_loss": -27.893905639648438, "global_step": 587123, "epoch": 7073} {"train_loss": -28.35072135925293, "global_step": 587124, "epoch": 7073} {"train_loss": -28.30975914001465, "global_step": 587125, "epoch": 7073} {"train_loss": -27.981542587280273, "global_step": 587126, "epoch": 7073} {"train_loss": -28.39592933654785, "global_step": 587127, "epoch": 7073} {"train_loss": -28.066547393798828, "global_step": 587128, "epoch": 7073} {"train_loss": -27.947385787963867, "global_step": 587129, "epoch": 7073} {"train_loss": -28.369245529174805, "global_step": 587130, "epoch": 7073} {"train_loss": -28.35896110534668, "global_step": 587131, "epoch": 7073} {"train_loss": -28.2186222076416, "global_step": 587132, "epoch": 7073} {"train_loss": -27.80396842956543, "global_step": 587133, "epoch": 7073} {"train_loss": -28.117719650268555, "global_step": 587134, "epoch": 7073} {"train_loss": -27.89371109008789, "global_step": 587135, "epoch": 7073} {"train_loss": -28.106555938720703, "global_step": 587136, "epoch": 7073} {"train_loss": -28.28045082092285, "global_step": 587137, "epoch": 7073} {"train_loss": -28.264368057250977, "global_step": 587138, "epoch": 7073} {"train_loss": -28.275924682617188, "global_step": 587139, "epoch": 7073} {"train_loss": -28.208898544311523, "global_step": 587140, "epoch": 7073} {"train_loss": -27.765429324414356, "global_step": 587141, "epoch": 7073, "val_loss": 6628646.0} {"train_loss": -27.77076530456543, "global_step": 587142, "epoch": 7074} {"train_loss": -27.55604362487793, "global_step": 587143, "epoch": 7074} {"train_loss": -27.574539184570312, "global_step": 587144, "epoch": 7074} {"train_loss": -27.271703720092773, "global_step": 587145, "epoch": 7074} {"train_loss": -27.578754425048828, "global_step": 587146, "epoch": 7074} {"train_loss": -27.38612174987793, "global_step": 587147, "epoch": 7074} {"train_loss": -27.73126220703125, "global_step": 587148, "epoch": 7074} {"train_loss": -27.612110137939453, "global_step": 587149, "epoch": 7074} {"train_loss": -27.356306076049805, "global_step": 587150, "epoch": 7074} {"train_loss": -27.340147018432617, "global_step": 587151, "epoch": 7074} {"train_loss": -27.69577980041504, "global_step": 587152, "epoch": 7074} {"train_loss": -27.548547744750977, "global_step": 587153, "epoch": 7074} {"train_loss": -27.63054847717285, "global_step": 587154, "epoch": 7074} {"train_loss": -27.46320915222168, "global_step": 587155, "epoch": 7074} {"train_loss": -27.202499389648438, "global_step": 587156, "epoch": 7074} {"train_loss": -27.9218692779541, "global_step": 587157, "epoch": 7074} {"train_loss": -27.782155990600586, "global_step": 587158, "epoch": 7074} {"train_loss": -27.395605087280273, "global_step": 587159, "epoch": 7074} {"train_loss": -27.39048194885254, "global_step": 587160, "epoch": 7074} {"train_loss": -27.58782386779785, "global_step": 587161, "epoch": 7074} {"train_loss": -27.507007598876953, "global_step": 587162, "epoch": 7074} {"train_loss": -28.059417724609375, "global_step": 587163, "epoch": 7074} {"train_loss": -27.592985153198242, "global_step": 587164, "epoch": 7074} {"train_loss": -27.46253776550293, "global_step": 587165, "epoch": 7074} {"train_loss": -27.874441146850586, "global_step": 587166, "epoch": 7074} {"train_loss": -27.4696102142334, "global_step": 587167, "epoch": 7074} {"train_loss": -27.616804122924805, "global_step": 587168, "epoch": 7074} {"train_loss": -27.980060577392578, "global_step": 587169, "epoch": 7074} {"train_loss": -27.69086265563965, "global_step": 587170, "epoch": 7074} {"train_loss": -27.994150161743164, "global_step": 587171, "epoch": 7074} {"train_loss": -27.93027114868164, "global_step": 587172, "epoch": 7074} {"train_loss": -27.9055118560791, "global_step": 587173, "epoch": 7074} {"train_loss": -28.224994659423828, "global_step": 587174, "epoch": 7074} {"train_loss": -28.074024200439453, "global_step": 587175, "epoch": 7074} {"train_loss": -27.70265007019043, "global_step": 587176, "epoch": 7074} {"train_loss": -28.463062286376953, "global_step": 587177, "epoch": 7074} {"train_loss": -27.541868209838867, "global_step": 587178, "epoch": 7074} {"train_loss": -27.666873931884766, "global_step": 587179, "epoch": 7074} {"train_loss": -27.803266525268555, "global_step": 587180, "epoch": 7074} {"train_loss": -27.758543014526367, "global_step": 587181, "epoch": 7074} {"train_loss": -27.850147247314453, "global_step": 587182, "epoch": 7074} {"train_loss": -28.29962730407715, "global_step": 587183, "epoch": 7074} {"train_loss": -28.121912002563477, "global_step": 587184, "epoch": 7074} {"train_loss": -28.009662628173828, "global_step": 587185, "epoch": 7074} {"train_loss": -28.274206161499023, "global_step": 587186, "epoch": 7074} {"train_loss": -28.20768165588379, "global_step": 587187, "epoch": 7074} {"train_loss": -27.963159561157227, "global_step": 587188, "epoch": 7074} {"train_loss": -28.21640968322754, "global_step": 587189, "epoch": 7074} {"train_loss": -28.132665634155273, "global_step": 587190, "epoch": 7074} {"train_loss": -27.806564331054688, "global_step": 587191, "epoch": 7074} {"train_loss": -28.402067184448242, "global_step": 587192, "epoch": 7074} {"train_loss": -27.968799591064453, "global_step": 587193, "epoch": 7074} {"train_loss": -28.02507972717285, "global_step": 587194, "epoch": 7074} {"train_loss": -27.93084144592285, "global_step": 587195, "epoch": 7074} {"train_loss": -27.962554931640625, "global_step": 587196, "epoch": 7074} {"train_loss": -28.07958984375, "global_step": 587197, "epoch": 7074} {"train_loss": -28.36305046081543, "global_step": 587198, "epoch": 7074} {"train_loss": -28.128835678100586, "global_step": 587199, "epoch": 7074} {"train_loss": -28.2271671295166, "global_step": 587200, "epoch": 7074} {"train_loss": -27.824201583862305, "global_step": 587201, "epoch": 7074} {"train_loss": -27.893207550048828, "global_step": 587202, "epoch": 7074} {"train_loss": -27.61374282836914, "global_step": 587203, "epoch": 7074} {"train_loss": -27.9058780670166, "global_step": 587204, "epoch": 7074} {"train_loss": -27.825841903686523, "global_step": 587205, "epoch": 7074} {"train_loss": -27.87742042541504, "global_step": 587206, "epoch": 7074} {"train_loss": -27.897741317749023, "global_step": 587207, "epoch": 7074} {"train_loss": -28.0024471282959, "global_step": 587208, "epoch": 7074} {"train_loss": -28.169605255126953, "global_step": 587209, "epoch": 7074} {"train_loss": -28.245620727539062, "global_step": 587210, "epoch": 7074} {"train_loss": -28.16480827331543, "global_step": 587211, "epoch": 7074} {"train_loss": -28.17974281311035, "global_step": 587212, "epoch": 7074} {"train_loss": -27.848180770874023, "global_step": 587213, "epoch": 7074} {"train_loss": -28.513803482055664, "global_step": 587214, "epoch": 7074} {"train_loss": -28.32207679748535, "global_step": 587215, "epoch": 7074} {"train_loss": -28.076282501220703, "global_step": 587216, "epoch": 7074} {"train_loss": -28.024871826171875, "global_step": 587217, "epoch": 7074} {"train_loss": -28.031171798706055, "global_step": 587218, "epoch": 7074} {"train_loss": -28.110275268554688, "global_step": 587219, "epoch": 7074} {"train_loss": -28.09474754333496, "global_step": 587220, "epoch": 7074} {"train_loss": -27.853290557861328, "global_step": 587221, "epoch": 7074} {"train_loss": -28.27849769592285, "global_step": 587222, "epoch": 7074} {"train_loss": -28.26181411743164, "global_step": 587223, "epoch": 7074} {"train_loss": -27.88919248925634, "global_step": 587224, "epoch": 7074, "val_loss": 6606903.0} {"train_loss": -27.547901153564453, "global_step": 587225, "epoch": 7075} {"train_loss": -27.509672164916992, "global_step": 587226, "epoch": 7075} {"train_loss": -27.811920166015625, "global_step": 587227, "epoch": 7075} {"train_loss": -27.412626266479492, "global_step": 587228, "epoch": 7075} {"train_loss": -27.3214054107666, "global_step": 587229, "epoch": 7075} {"train_loss": -27.211532592773438, "global_step": 587230, "epoch": 7075} {"train_loss": -27.0976505279541, "global_step": 587231, "epoch": 7075} {"train_loss": -27.681509017944336, "global_step": 587232, "epoch": 7075} {"train_loss": -27.513233184814453, "global_step": 587233, "epoch": 7075} {"train_loss": -27.6341552734375, "global_step": 587234, "epoch": 7075} {"train_loss": -27.51068115234375, "global_step": 587235, "epoch": 7075} {"train_loss": -27.705366134643555, "global_step": 587236, "epoch": 7075} {"train_loss": -26.68340492248535, "global_step": 587237, "epoch": 7075} {"train_loss": -27.617523193359375, "global_step": 587238, "epoch": 7075} {"train_loss": -27.453893661499023, "global_step": 587239, "epoch": 7075} {"train_loss": -27.44978904724121, "global_step": 587240, "epoch": 7075} {"train_loss": -27.71710205078125, "global_step": 587241, "epoch": 7075} {"train_loss": -27.413192749023438, "global_step": 587242, "epoch": 7075} {"train_loss": -27.8989315032959, "global_step": 587243, "epoch": 7075} {"train_loss": -27.76331901550293, "global_step": 587244, "epoch": 7075} {"train_loss": -27.91572380065918, "global_step": 587245, "epoch": 7075} {"train_loss": -27.47987174987793, "global_step": 587246, "epoch": 7075} {"train_loss": -27.99321937561035, "global_step": 587247, "epoch": 7075} {"train_loss": -27.387420654296875, "global_step": 587248, "epoch": 7075} {"train_loss": -27.787322998046875, "global_step": 587249, "epoch": 7075} {"train_loss": -27.26362419128418, "global_step": 587250, "epoch": 7075} {"train_loss": -27.373586654663086, "global_step": 587251, "epoch": 7075} {"train_loss": -27.90838050842285, "global_step": 587252, "epoch": 7075} {"train_loss": -27.689748764038086, "global_step": 587253, "epoch": 7075} {"train_loss": -27.600635528564453, "global_step": 587254, "epoch": 7075} {"train_loss": -27.937564849853516, "global_step": 587255, "epoch": 7075} {"train_loss": -27.74053382873535, "global_step": 587256, "epoch": 7075} {"train_loss": -27.947574615478516, "global_step": 587257, "epoch": 7075} {"train_loss": -27.84274673461914, "global_step": 587258, "epoch": 7075} {"train_loss": -27.58160972595215, "global_step": 587259, "epoch": 7075} {"train_loss": -27.5333251953125, "global_step": 587260, "epoch": 7075} {"train_loss": -27.823486328125, "global_step": 587261, "epoch": 7075} {"train_loss": -27.487730026245117, "global_step": 587262, "epoch": 7075} {"train_loss": -27.828495025634766, "global_step": 587263, "epoch": 7075} {"train_loss": -27.68345069885254, "global_step": 587264, "epoch": 7075} {"train_loss": -27.810638427734375, "global_step": 587265, "epoch": 7075} {"train_loss": -27.68800926208496, "global_step": 587266, "epoch": 7075} {"train_loss": -27.901763916015625, "global_step": 587267, "epoch": 7075} {"train_loss": -28.034286499023438, "global_step": 587268, "epoch": 7075} {"train_loss": -27.732507705688477, "global_step": 587269, "epoch": 7075} {"train_loss": -27.754886627197266, "global_step": 587270, "epoch": 7075} {"train_loss": -27.93912124633789, "global_step": 587271, "epoch": 7075} {"train_loss": -28.094614028930664, "global_step": 587272, "epoch": 7075} {"train_loss": -28.060245513916016, "global_step": 587273, "epoch": 7075} {"train_loss": -27.6887149810791, "global_step": 587274, "epoch": 7075} {"train_loss": -27.54093360900879, "global_step": 587275, "epoch": 7075} {"train_loss": -27.808837890625, "global_step": 587276, "epoch": 7075} {"train_loss": -28.175622940063477, "global_step": 587277, "epoch": 7075} {"train_loss": -28.13553237915039, "global_step": 587278, "epoch": 7075} {"train_loss": -28.036407470703125, "global_step": 587279, "epoch": 7075} {"train_loss": -28.104673385620117, "global_step": 587280, "epoch": 7075} {"train_loss": -27.980878829956055, "global_step": 587281, "epoch": 7075} {"train_loss": -27.895389556884766, "global_step": 587282, "epoch": 7075} {"train_loss": -27.92408561706543, "global_step": 587283, "epoch": 7075} {"train_loss": -28.25848960876465, "global_step": 587284, "epoch": 7075} {"train_loss": -28.225433349609375, "global_step": 587285, "epoch": 7075} {"train_loss": -27.72490882873535, "global_step": 587286, "epoch": 7075} {"train_loss": -27.8601016998291, "global_step": 587287, "epoch": 7075} {"train_loss": -28.376361846923828, "global_step": 587288, "epoch": 7075} {"train_loss": -27.811649322509766, "global_step": 587289, "epoch": 7075} {"train_loss": -27.702320098876953, "global_step": 587290, "epoch": 7075} {"train_loss": -27.798059463500977, "global_step": 587291, "epoch": 7075} {"train_loss": -27.738779067993164, "global_step": 587292, "epoch": 7075} {"train_loss": -28.29676628112793, "global_step": 587293, "epoch": 7075} {"train_loss": -27.69717788696289, "global_step": 587294, "epoch": 7075} {"train_loss": -27.933990478515625, "global_step": 587295, "epoch": 7075} {"train_loss": -27.84095573425293, "global_step": 587296, "epoch": 7075} {"train_loss": -28.145374298095703, "global_step": 587297, "epoch": 7075} {"train_loss": -28.167531967163086, "global_step": 587298, "epoch": 7075} {"train_loss": -27.718036651611328, "global_step": 587299, "epoch": 7075} {"train_loss": -28.08644676208496, "global_step": 587300, "epoch": 7075} {"train_loss": -27.849609375, "global_step": 587301, "epoch": 7075} {"train_loss": -27.731287002563477, "global_step": 587302, "epoch": 7075} {"train_loss": -27.5605525970459, "global_step": 587303, "epoch": 7075} {"train_loss": -28.09201431274414, "global_step": 587304, "epoch": 7075} {"train_loss": -28.333337783813477, "global_step": 587305, "epoch": 7075} {"train_loss": -27.82940101623535, "global_step": 587306, "epoch": 7075} {"train_loss": -27.7669712204531, "global_step": 587307, "epoch": 7075, "val_loss": 6507561.0} {"train_loss": -27.36842155456543, "global_step": 587308, "epoch": 7076} {"train_loss": -27.219348907470703, "global_step": 587309, "epoch": 7076} {"train_loss": -26.97492027282715, "global_step": 587310, "epoch": 7076} {"train_loss": -27.17425537109375, "global_step": 587311, "epoch": 7076} {"train_loss": -26.643402099609375, "global_step": 587312, "epoch": 7076} {"train_loss": -27.54315185546875, "global_step": 587313, "epoch": 7076} {"train_loss": -27.099267959594727, "global_step": 587314, "epoch": 7076} {"train_loss": -27.231718063354492, "global_step": 587315, "epoch": 7076} {"train_loss": -27.38760757446289, "global_step": 587316, "epoch": 7076} {"train_loss": -27.528457641601562, "global_step": 587317, "epoch": 7076} {"train_loss": -27.192716598510742, "global_step": 587318, "epoch": 7076} {"train_loss": -27.29951286315918, "global_step": 587319, "epoch": 7076} {"train_loss": -27.633466720581055, "global_step": 587320, "epoch": 7076} {"train_loss": -27.722076416015625, "global_step": 587321, "epoch": 7076} {"train_loss": -27.612943649291992, "global_step": 587322, "epoch": 7076} {"train_loss": -27.631671905517578, "global_step": 587323, "epoch": 7076} {"train_loss": -27.43743324279785, "global_step": 587324, "epoch": 7076} {"train_loss": -27.450485229492188, "global_step": 587325, "epoch": 7076} {"train_loss": -27.70357322692871, "global_step": 587326, "epoch": 7076} {"train_loss": -27.607099533081055, "global_step": 587327, "epoch": 7076} {"train_loss": -27.875141143798828, "global_step": 587328, "epoch": 7076} {"train_loss": -27.46137046813965, "global_step": 587329, "epoch": 7076} {"train_loss": -27.688796997070312, "global_step": 587330, "epoch": 7076} {"train_loss": -27.547895431518555, "global_step": 587331, "epoch": 7076} {"train_loss": -27.63209342956543, "global_step": 587332, "epoch": 7076} {"train_loss": -27.57553482055664, "global_step": 587333, "epoch": 7076} {"train_loss": -27.691869735717773, "global_step": 587334, "epoch": 7076} {"train_loss": -27.577917098999023, "global_step": 587335, "epoch": 7076} {"train_loss": -27.821165084838867, "global_step": 587336, "epoch": 7076} {"train_loss": -27.88813591003418, "global_step": 587337, "epoch": 7076} {"train_loss": -27.88788414001465, "global_step": 587338, "epoch": 7076} {"train_loss": -27.500598907470703, "global_step": 587339, "epoch": 7076} {"train_loss": -28.229846954345703, "global_step": 587340, "epoch": 7076} {"train_loss": -27.784442901611328, "global_step": 587341, "epoch": 7076} {"train_loss": -28.011117935180664, "global_step": 587342, "epoch": 7076} {"train_loss": -28.061248779296875, "global_step": 587343, "epoch": 7076} {"train_loss": -28.048126220703125, "global_step": 587344, "epoch": 7076} {"train_loss": -27.846338272094727, "global_step": 587345, "epoch": 7076} {"train_loss": -28.122791290283203, "global_step": 587346, "epoch": 7076} {"train_loss": -27.677793502807617, "global_step": 587347, "epoch": 7076} {"train_loss": -27.935400009155273, "global_step": 587348, "epoch": 7076} {"train_loss": -28.43037223815918, "global_step": 587349, "epoch": 7076} {"train_loss": -28.06367301940918, "global_step": 587350, "epoch": 7076} {"train_loss": -28.010700225830078, "global_step": 587351, "epoch": 7076} {"train_loss": -27.778915405273438, "global_step": 587352, "epoch": 7076} {"train_loss": -27.919025421142578, "global_step": 587353, "epoch": 7076} {"train_loss": -28.150339126586914, "global_step": 587354, "epoch": 7076} {"train_loss": -27.81326675415039, "global_step": 587355, "epoch": 7076} {"train_loss": -28.059133529663086, "global_step": 587356, "epoch": 7076} {"train_loss": -27.9124813079834, "global_step": 587357, "epoch": 7076} {"train_loss": -27.97394371032715, "global_step": 587358, "epoch": 7076} {"train_loss": -28.390256881713867, "global_step": 587359, "epoch": 7076} {"train_loss": -28.380102157592773, "global_step": 587360, "epoch": 7076} {"train_loss": -28.005701065063477, "global_step": 587361, "epoch": 7076} {"train_loss": -28.00461196899414, "global_step": 587362, "epoch": 7076} {"train_loss": -27.86299705505371, "global_step": 587363, "epoch": 7076} {"train_loss": -27.64422035217285, "global_step": 587364, "epoch": 7076} {"train_loss": -28.314664840698242, "global_step": 587365, "epoch": 7076} {"train_loss": -27.643543243408203, "global_step": 587366, "epoch": 7076} {"train_loss": -27.866317749023438, "global_step": 587367, "epoch": 7076} {"train_loss": -27.487873077392578, "global_step": 587368, "epoch": 7076} {"train_loss": -27.945819854736328, "global_step": 587369, "epoch": 7076} {"train_loss": -28.112646102905273, "global_step": 587370, "epoch": 7076} {"train_loss": -27.748859405517578, "global_step": 587371, "epoch": 7076} {"train_loss": -27.79865074157715, "global_step": 587372, "epoch": 7076} {"train_loss": -28.267704010009766, "global_step": 587373, "epoch": 7076} {"train_loss": -27.581073760986328, "global_step": 587374, "epoch": 7076} {"train_loss": -27.874963760375977, "global_step": 587375, "epoch": 7076} {"train_loss": -28.219247817993164, "global_step": 587376, "epoch": 7076} {"train_loss": -27.843902587890625, "global_step": 587377, "epoch": 7076} {"train_loss": -27.709259033203125, "global_step": 587378, "epoch": 7076} {"train_loss": -28.32236099243164, "global_step": 587379, "epoch": 7076} {"train_loss": -27.819196701049805, "global_step": 587380, "epoch": 7076} {"train_loss": -27.865758895874023, "global_step": 587381, "epoch": 7076} {"train_loss": -28.373462677001953, "global_step": 587382, "epoch": 7076} {"train_loss": -28.156091690063477, "global_step": 587383, "epoch": 7076} {"train_loss": -28.247480392456055, "global_step": 587384, "epoch": 7076} {"train_loss": -27.915754318237305, "global_step": 587385, "epoch": 7076} {"train_loss": -28.021747589111328, "global_step": 587386, "epoch": 7076} {"train_loss": -28.1488037109375, "global_step": 587387, "epoch": 7076} {"train_loss": -28.234210968017578, "global_step": 587388, "epoch": 7076} {"train_loss": -28.259876251220703, "global_step": 587389, "epoch": 7076} {"train_loss": -27.789556893957666, "global_step": 587390, "epoch": 7076, "val_loss": 6557852.5} {"train_loss": -27.683557510375977, "global_step": 587391, "epoch": 7077} {"train_loss": -27.21396255493164, "global_step": 587392, "epoch": 7077} {"train_loss": -27.440061569213867, "global_step": 587393, "epoch": 7077} {"train_loss": -27.46454429626465, "global_step": 587394, "epoch": 7077} {"train_loss": -27.78242301940918, "global_step": 587395, "epoch": 7077} {"train_loss": -27.828887939453125, "global_step": 587396, "epoch": 7077} {"train_loss": -27.5762939453125, "global_step": 587397, "epoch": 7077} {"train_loss": -27.310285568237305, "global_step": 587398, "epoch": 7077} {"train_loss": -27.217208862304688, "global_step": 587399, "epoch": 7077} {"train_loss": -27.65582275390625, "global_step": 587400, "epoch": 7077} {"train_loss": -27.66031265258789, "global_step": 587401, "epoch": 7077} {"train_loss": -27.7176456451416, "global_step": 587402, "epoch": 7077} {"train_loss": -27.60702896118164, "global_step": 587403, "epoch": 7077} {"train_loss": -27.709003448486328, "global_step": 587404, "epoch": 7077} {"train_loss": -28.0670108795166, "global_step": 587405, "epoch": 7077} {"train_loss": -27.76399803161621, "global_step": 587406, "epoch": 7077} {"train_loss": -27.34437370300293, "global_step": 587407, "epoch": 7077} {"train_loss": -27.33466911315918, "global_step": 587408, "epoch": 7077} {"train_loss": -27.70404052734375, "global_step": 587409, "epoch": 7077} {"train_loss": -27.26126480102539, "global_step": 587410, "epoch": 7077} {"train_loss": -27.44362449645996, "global_step": 587411, "epoch": 7077} {"train_loss": -27.5438175201416, "global_step": 587412, "epoch": 7077} {"train_loss": -27.224958419799805, "global_step": 587413, "epoch": 7077} {"train_loss": -27.383909225463867, "global_step": 587414, "epoch": 7077} {"train_loss": -27.623737335205078, "global_step": 587415, "epoch": 7077} {"train_loss": -27.764123916625977, "global_step": 587416, "epoch": 7077} {"train_loss": -27.659046173095703, "global_step": 587417, "epoch": 7077} {"train_loss": -27.726642608642578, "global_step": 587418, "epoch": 7077} {"train_loss": -27.709457397460938, "global_step": 587419, "epoch": 7077} {"train_loss": -27.780323028564453, "global_step": 587420, "epoch": 7077} {"train_loss": -27.72478675842285, "global_step": 587421, "epoch": 7077} {"train_loss": -27.761072158813477, "global_step": 587422, "epoch": 7077} {"train_loss": -27.644577026367188, "global_step": 587423, "epoch": 7077} {"train_loss": -27.83723258972168, "global_step": 587424, "epoch": 7077} {"train_loss": -27.535297393798828, "global_step": 587425, "epoch": 7077} {"train_loss": -27.878732681274414, "global_step": 587426, "epoch": 7077} {"train_loss": -27.807546615600586, "global_step": 587427, "epoch": 7077} {"train_loss": -27.907331466674805, "global_step": 587428, "epoch": 7077} {"train_loss": -27.985509872436523, "global_step": 587429, "epoch": 7077} {"train_loss": -27.801366806030273, "global_step": 587430, "epoch": 7077} {"train_loss": -27.64825439453125, "global_step": 587431, "epoch": 7077} {"train_loss": -28.20352554321289, "global_step": 587432, "epoch": 7077} {"train_loss": -28.063486099243164, "global_step": 587433, "epoch": 7077} {"train_loss": -28.27247428894043, "global_step": 587434, "epoch": 7077} {"train_loss": -27.927295684814453, "global_step": 587435, "epoch": 7077} {"train_loss": -27.6719913482666, "global_step": 587436, "epoch": 7077} {"train_loss": -28.104450225830078, "global_step": 587437, "epoch": 7077} {"train_loss": -28.033945083618164, "global_step": 587438, "epoch": 7077} {"train_loss": -27.883947372436523, "global_step": 587439, "epoch": 7077} {"train_loss": -27.698352813720703, "global_step": 587440, "epoch": 7077} {"train_loss": -27.9152889251709, "global_step": 587441, "epoch": 7077} {"train_loss": -27.836645126342773, "global_step": 587442, "epoch": 7077} {"train_loss": -28.128442764282227, "global_step": 587443, "epoch": 7077} {"train_loss": -28.2384033203125, "global_step": 587444, "epoch": 7077} {"train_loss": -28.17431640625, "global_step": 587445, "epoch": 7077} {"train_loss": -28.176959991455078, "global_step": 587446, "epoch": 7077} {"train_loss": -28.202234268188477, "global_step": 587447, "epoch": 7077} {"train_loss": -28.02766990661621, "global_step": 587448, "epoch": 7077} {"train_loss": -27.89557456970215, "global_step": 587449, "epoch": 7077} {"train_loss": -28.40401268005371, "global_step": 587450, "epoch": 7077} {"train_loss": -27.925216674804688, "global_step": 587451, "epoch": 7077} {"train_loss": -28.072317123413086, "global_step": 587452, "epoch": 7077} {"train_loss": -28.386579513549805, "global_step": 587453, "epoch": 7077} {"train_loss": -28.217493057250977, "global_step": 587454, "epoch": 7077} {"train_loss": -27.889646530151367, "global_step": 587455, "epoch": 7077} {"train_loss": -27.89544677734375, "global_step": 587456, "epoch": 7077} {"train_loss": -27.878156661987305, "global_step": 587457, "epoch": 7077} {"train_loss": -27.93121337890625, "global_step": 587458, "epoch": 7077} {"train_loss": -28.190820693969727, "global_step": 587459, "epoch": 7077} {"train_loss": -28.381086349487305, "global_step": 587460, "epoch": 7077} {"train_loss": -27.535064697265625, "global_step": 587461, "epoch": 7077} {"train_loss": -28.137939453125, "global_step": 587462, "epoch": 7077} {"train_loss": -28.10272789001465, "global_step": 587463, "epoch": 7077} {"train_loss": -27.690326690673828, "global_step": 587464, "epoch": 7077} {"train_loss": -28.015899658203125, "global_step": 587465, "epoch": 7077} {"train_loss": -27.8193302154541, "global_step": 587466, "epoch": 7077} {"train_loss": -28.29031753540039, "global_step": 587467, "epoch": 7077} {"train_loss": -28.44830322265625, "global_step": 587468, "epoch": 7077} {"train_loss": -27.550329208374023, "global_step": 587469, "epoch": 7077} {"train_loss": -28.335407257080078, "global_step": 587470, "epoch": 7077} {"train_loss": -28.26822280883789, "global_step": 587471, "epoch": 7077} {"train_loss": -27.960371017456055, "global_step": 587472, "epoch": 7077} {"train_loss": -27.853612899780273, "global_step": 587473, "epoch": 7077, "val_loss": 6555130.0} {"train_loss": -27.948461532592773, "global_step": 587474, "epoch": 7078} {"train_loss": -27.784387588500977, "global_step": 587475, "epoch": 7078} {"train_loss": -27.42719841003418, "global_step": 587476, "epoch": 7078} {"train_loss": -27.967716217041016, "global_step": 587477, "epoch": 7078} {"train_loss": -27.81113624572754, "global_step": 587478, "epoch": 7078} {"train_loss": -27.6716251373291, "global_step": 587479, "epoch": 7078} {"train_loss": -28.078271865844727, "global_step": 587480, "epoch": 7078} {"train_loss": -27.35788917541504, "global_step": 587481, "epoch": 7078} {"train_loss": -27.93191909790039, "global_step": 587482, "epoch": 7078} {"train_loss": -27.34827995300293, "global_step": 587483, "epoch": 7078} {"train_loss": -26.943262100219727, "global_step": 587484, "epoch": 7078} {"train_loss": -27.121753692626953, "global_step": 587485, "epoch": 7078} {"train_loss": -27.350614547729492, "global_step": 587486, "epoch": 7078} {"train_loss": -27.172285079956055, "global_step": 587487, "epoch": 7078} {"train_loss": -28.217041015625, "global_step": 587488, "epoch": 7078} {"train_loss": -27.610239028930664, "global_step": 587489, "epoch": 7078} {"train_loss": -27.774438858032227, "global_step": 587490, "epoch": 7078} {"train_loss": -27.398101806640625, "global_step": 587491, "epoch": 7078} {"train_loss": -27.743213653564453, "global_step": 587492, "epoch": 7078} {"train_loss": -27.79973793029785, "global_step": 587493, "epoch": 7078} {"train_loss": -27.84877586364746, "global_step": 587494, "epoch": 7078} {"train_loss": -27.54667091369629, "global_step": 587495, "epoch": 7078} {"train_loss": -27.48948097229004, "global_step": 587496, "epoch": 7078} {"train_loss": -27.841291427612305, "global_step": 587497, "epoch": 7078} {"train_loss": -27.65814208984375, "global_step": 587498, "epoch": 7078} {"train_loss": -28.070941925048828, "global_step": 587499, "epoch": 7078} {"train_loss": -27.616947174072266, "global_step": 587500, "epoch": 7078} {"train_loss": -28.021909713745117, "global_step": 587501, "epoch": 7078} {"train_loss": -27.96009635925293, "global_step": 587502, "epoch": 7078} {"train_loss": -27.757959365844727, "global_step": 587503, "epoch": 7078} {"train_loss": -27.68068504333496, "global_step": 587504, "epoch": 7078} {"train_loss": -27.9151668548584, "global_step": 587505, "epoch": 7078} {"train_loss": -27.96381187438965, "global_step": 587506, "epoch": 7078} {"train_loss": -28.416278839111328, "global_step": 587507, "epoch": 7078} {"train_loss": -27.791296005249023, "global_step": 587508, "epoch": 7078} {"train_loss": -28.104999542236328, "global_step": 587509, "epoch": 7078} {"train_loss": -27.772436141967773, "global_step": 587510, "epoch": 7078} {"train_loss": -28.329782485961914, "global_step": 587511, "epoch": 7078} {"train_loss": -27.555917739868164, "global_step": 587512, "epoch": 7078} {"train_loss": -27.93684196472168, "global_step": 587513, "epoch": 7078} {"train_loss": -27.95014762878418, "global_step": 587514, "epoch": 7078} {"train_loss": -27.968708038330078, "global_step": 587515, "epoch": 7078} {"train_loss": -27.93096351623535, "global_step": 587516, "epoch": 7078} {"train_loss": -27.738433837890625, "global_step": 587517, "epoch": 7078} {"train_loss": -27.825185775756836, "global_step": 587518, "epoch": 7078} {"train_loss": -27.8775577545166, "global_step": 587519, "epoch": 7078} {"train_loss": -27.797626495361328, "global_step": 587520, "epoch": 7078} {"train_loss": -28.266223907470703, "global_step": 587521, "epoch": 7078} {"train_loss": -28.268295288085938, "global_step": 587522, "epoch": 7078} {"train_loss": -28.223535537719727, "global_step": 587523, "epoch": 7078} {"train_loss": -27.984344482421875, "global_step": 587524, "epoch": 7078} {"train_loss": -28.46219825744629, "global_step": 587525, "epoch": 7078} {"train_loss": -28.237043380737305, "global_step": 587526, "epoch": 7078} {"train_loss": -28.47723960876465, "global_step": 587527, "epoch": 7078} {"train_loss": -28.00624656677246, "global_step": 587528, "epoch": 7078} {"train_loss": -28.343902587890625, "global_step": 587529, "epoch": 7078} {"train_loss": -28.114316940307617, "global_step": 587530, "epoch": 7078} {"train_loss": -28.047204971313477, "global_step": 587531, "epoch": 7078} {"train_loss": -28.2036075592041, "global_step": 587532, "epoch": 7078} {"train_loss": -28.148818969726562, "global_step": 587533, "epoch": 7078} {"train_loss": -28.185285568237305, "global_step": 587534, "epoch": 7078} {"train_loss": -28.551406860351562, "global_step": 587535, "epoch": 7078} {"train_loss": -28.0540714263916, "global_step": 587536, "epoch": 7078} {"train_loss": -28.28370475769043, "global_step": 587537, "epoch": 7078} {"train_loss": -28.173492431640625, "global_step": 587538, "epoch": 7078} {"train_loss": -28.42051124572754, "global_step": 587539, "epoch": 7078} {"train_loss": -28.50552749633789, "global_step": 587540, "epoch": 7078} {"train_loss": -28.10614013671875, "global_step": 587541, "epoch": 7078} {"train_loss": -28.226293563842773, "global_step": 587542, "epoch": 7078} {"train_loss": -28.369176864624023, "global_step": 587543, "epoch": 7078} {"train_loss": -28.443897247314453, "global_step": 587544, "epoch": 7078} {"train_loss": -28.107023239135742, "global_step": 587545, "epoch": 7078} {"train_loss": -27.826597213745117, "global_step": 587546, "epoch": 7078} {"train_loss": -28.006723403930664, "global_step": 587547, "epoch": 7078} {"train_loss": -27.892108917236328, "global_step": 587548, "epoch": 7078} {"train_loss": -27.86624526977539, "global_step": 587549, "epoch": 7078} {"train_loss": -27.94317054748535, "global_step": 587550, "epoch": 7078} {"train_loss": -28.02534294128418, "global_step": 587551, "epoch": 7078} {"train_loss": -27.57657241821289, "global_step": 587552, "epoch": 7078} {"train_loss": -27.0083065032959, "global_step": 587553, "epoch": 7078} {"train_loss": -25.927152633666992, "global_step": 587554, "epoch": 7078} {"train_loss": -26.0674991607666, "global_step": 587555, "epoch": 7078} {"train_loss": -27.854748553540333, "global_step": 587556, "epoch": 7078, "val_loss": 6509782.0} {"train_loss": -25.68889808654785, "global_step": 587557, "epoch": 7079} {"train_loss": -19.804336547851562, "global_step": 587558, "epoch": 7079} {"train_loss": -25.965307235717773, "global_step": 587559, "epoch": 7079} {"train_loss": -24.269498825073242, "global_step": 587560, "epoch": 7079} {"train_loss": -25.569311141967773, "global_step": 587561, "epoch": 7079} {"train_loss": -25.413272857666016, "global_step": 587562, "epoch": 7079} {"train_loss": -25.69551658630371, "global_step": 587563, "epoch": 7079} {"train_loss": -25.712610244750977, "global_step": 587564, "epoch": 7079} {"train_loss": -26.001943588256836, "global_step": 587565, "epoch": 7079} {"train_loss": -26.124134063720703, "global_step": 587566, "epoch": 7079} {"train_loss": -26.568201065063477, "global_step": 587567, "epoch": 7079} {"train_loss": -25.71994972229004, "global_step": 587568, "epoch": 7079} {"train_loss": -26.461639404296875, "global_step": 587569, "epoch": 7079} {"train_loss": -26.429901123046875, "global_step": 587570, "epoch": 7079} {"train_loss": -26.309741973876953, "global_step": 587571, "epoch": 7079} {"train_loss": -26.58475112915039, "global_step": 587572, "epoch": 7079} {"train_loss": -26.426481246948242, "global_step": 587573, "epoch": 7079} {"train_loss": -26.44719886779785, "global_step": 587574, "epoch": 7079} {"train_loss": -26.774005889892578, "global_step": 587575, "epoch": 7079} {"train_loss": -26.939350128173828, "global_step": 587576, "epoch": 7079} {"train_loss": -26.87526512145996, "global_step": 587577, "epoch": 7079} {"train_loss": -26.98492431640625, "global_step": 587578, "epoch": 7079} {"train_loss": -26.938556671142578, "global_step": 587579, "epoch": 7079} {"train_loss": -27.083173751831055, "global_step": 587580, "epoch": 7079} {"train_loss": -27.0482177734375, "global_step": 587581, "epoch": 7079} {"train_loss": -26.765249252319336, "global_step": 587582, "epoch": 7079} {"train_loss": -27.31682777404785, "global_step": 587583, "epoch": 7079} {"train_loss": -26.997350692749023, "global_step": 587584, "epoch": 7079} {"train_loss": -26.992477416992188, "global_step": 587585, "epoch": 7079} {"train_loss": -27.304492950439453, "global_step": 587586, "epoch": 7079} {"train_loss": -27.599828720092773, "global_step": 587587, "epoch": 7079} {"train_loss": -27.019479751586914, "global_step": 587588, "epoch": 7079} {"train_loss": -27.344161987304688, "global_step": 587589, "epoch": 7079} {"train_loss": -27.283239364624023, "global_step": 587590, "epoch": 7079} {"train_loss": -27.077966690063477, "global_step": 587591, "epoch": 7079} {"train_loss": -27.32122230529785, "global_step": 587592, "epoch": 7079} {"train_loss": -27.479022979736328, "global_step": 587593, "epoch": 7079} {"train_loss": -27.954105377197266, "global_step": 587594, "epoch": 7079} {"train_loss": -27.50299072265625, "global_step": 587595, "epoch": 7079} {"train_loss": -27.653318405151367, "global_step": 587596, "epoch": 7079} {"train_loss": -27.544464111328125, "global_step": 587597, "epoch": 7079} {"train_loss": -27.358610153198242, "global_step": 587598, "epoch": 7079} {"train_loss": -27.386987686157227, "global_step": 587599, "epoch": 7079} {"train_loss": -27.844379425048828, "global_step": 587600, "epoch": 7079} {"train_loss": -27.80437660217285, "global_step": 587601, "epoch": 7079} {"train_loss": -27.789281845092773, "global_step": 587602, "epoch": 7079} {"train_loss": -27.583402633666992, "global_step": 587603, "epoch": 7079} {"train_loss": -27.83637809753418, "global_step": 587604, "epoch": 7079} {"train_loss": -28.099584579467773, "global_step": 587605, "epoch": 7079} {"train_loss": -27.8477725982666, "global_step": 587606, "epoch": 7079} {"train_loss": -27.548826217651367, "global_step": 587607, "epoch": 7079} {"train_loss": -27.895435333251953, "global_step": 587608, "epoch": 7079} {"train_loss": -27.700946807861328, "global_step": 587609, "epoch": 7079} {"train_loss": -27.9876766204834, "global_step": 587610, "epoch": 7079} {"train_loss": -28.264896392822266, "global_step": 587611, "epoch": 7079} {"train_loss": -27.64668083190918, "global_step": 587612, "epoch": 7079} {"train_loss": -27.638004302978516, "global_step": 587613, "epoch": 7079} {"train_loss": -27.777353286743164, "global_step": 587614, "epoch": 7079} {"train_loss": -27.793264389038086, "global_step": 587615, "epoch": 7079} {"train_loss": -27.65862464904785, "global_step": 587616, "epoch": 7079} {"train_loss": -27.322568893432617, "global_step": 587617, "epoch": 7079} {"train_loss": -28.101369857788086, "global_step": 587618, "epoch": 7079} {"train_loss": -27.61576271057129, "global_step": 587619, "epoch": 7079} {"train_loss": -27.703550338745117, "global_step": 587620, "epoch": 7079} {"train_loss": -27.65289878845215, "global_step": 587621, "epoch": 7079} {"train_loss": -27.85915184020996, "global_step": 587622, "epoch": 7079} {"train_loss": -28.167264938354492, "global_step": 587623, "epoch": 7079} {"train_loss": -27.7243595123291, "global_step": 587624, "epoch": 7079} {"train_loss": -28.213165283203125, "global_step": 587625, "epoch": 7079} {"train_loss": -27.827001571655273, "global_step": 587626, "epoch": 7079} {"train_loss": -27.863052368164062, "global_step": 587627, "epoch": 7079} {"train_loss": -27.565170288085938, "global_step": 587628, "epoch": 7079} {"train_loss": -28.045440673828125, "global_step": 587629, "epoch": 7079} {"train_loss": -28.014331817626953, "global_step": 587630, "epoch": 7079} {"train_loss": -27.740833282470703, "global_step": 587631, "epoch": 7079} {"train_loss": -28.16240882873535, "global_step": 587632, "epoch": 7079} {"train_loss": -28.014362335205078, "global_step": 587633, "epoch": 7079} {"train_loss": -28.489398956298828, "global_step": 587634, "epoch": 7079} {"train_loss": -27.942153930664062, "global_step": 587635, "epoch": 7079} {"train_loss": -27.859827041625977, "global_step": 587636, "epoch": 7079} {"train_loss": -27.816137313842773, "global_step": 587637, "epoch": 7079} {"train_loss": -28.108625411987305, "global_step": 587638, "epoch": 7079} {"train_loss": -27.184731196208173, "global_step": 587639, "epoch": 7079, "val_loss": 6601655.0} {"train_loss": -27.699193954467773, "global_step": 587640, "epoch": 7080} {"train_loss": -26.96040916442871, "global_step": 587641, "epoch": 7080} {"train_loss": -27.69268798828125, "global_step": 587642, "epoch": 7080} {"train_loss": -27.762088775634766, "global_step": 587643, "epoch": 7080} {"train_loss": -27.510480880737305, "global_step": 587644, "epoch": 7080} {"train_loss": -27.679487228393555, "global_step": 587645, "epoch": 7080} {"train_loss": -27.746362686157227, "global_step": 587646, "epoch": 7080} {"train_loss": -27.57280921936035, "global_step": 587647, "epoch": 7080} {"train_loss": -27.457782745361328, "global_step": 587648, "epoch": 7080} {"train_loss": -27.641881942749023, "global_step": 587649, "epoch": 7080} {"train_loss": -27.516437530517578, "global_step": 587650, "epoch": 7080} {"train_loss": -27.824430465698242, "global_step": 587651, "epoch": 7080} {"train_loss": -27.767913818359375, "global_step": 587652, "epoch": 7080} {"train_loss": -27.976612091064453, "global_step": 587653, "epoch": 7080} {"train_loss": -27.81060791015625, "global_step": 587654, "epoch": 7080} {"train_loss": -27.792633056640625, "global_step": 587655, "epoch": 7080} {"train_loss": -28.005910873413086, "global_step": 587656, "epoch": 7080} {"train_loss": -28.004819869995117, "global_step": 587657, "epoch": 7080} {"train_loss": -27.729597091674805, "global_step": 587658, "epoch": 7080} {"train_loss": -27.726165771484375, "global_step": 587659, "epoch": 7080} {"train_loss": -27.959781646728516, "global_step": 587660, "epoch": 7080} {"train_loss": -28.197046279907227, "global_step": 587661, "epoch": 7080} {"train_loss": -27.674468994140625, "global_step": 587662, "epoch": 7080} {"train_loss": -27.558074951171875, "global_step": 587663, "epoch": 7080} {"train_loss": -27.97635841369629, "global_step": 587664, "epoch": 7080} {"train_loss": -27.69111442565918, "global_step": 587665, "epoch": 7080} {"train_loss": -27.886417388916016, "global_step": 587666, "epoch": 7080} {"train_loss": -27.75050163269043, "global_step": 587667, "epoch": 7080} {"train_loss": -28.01812171936035, "global_step": 587668, "epoch": 7080} {"train_loss": -27.847198486328125, "global_step": 587669, "epoch": 7080} {"train_loss": -27.958515167236328, "global_step": 587670, "epoch": 7080} {"train_loss": -28.000396728515625, "global_step": 587671, "epoch": 7080} {"train_loss": -28.02373695373535, "global_step": 587672, "epoch": 7080} {"train_loss": -27.6640567779541, "global_step": 587673, "epoch": 7080} {"train_loss": -27.908246994018555, "global_step": 587674, "epoch": 7080} {"train_loss": -27.96649742126465, "global_step": 587675, "epoch": 7080} {"train_loss": -27.629499435424805, "global_step": 587676, "epoch": 7080} {"train_loss": -28.4481143951416, "global_step": 587677, "epoch": 7080} {"train_loss": -27.82277488708496, "global_step": 587678, "epoch": 7080} {"train_loss": -27.7041072845459, "global_step": 587679, "epoch": 7080} {"train_loss": -28.35369300842285, "global_step": 587680, "epoch": 7080} {"train_loss": -28.19660758972168, "global_step": 587681, "epoch": 7080} {"train_loss": -27.981168746948242, "global_step": 587682, "epoch": 7080} {"train_loss": -27.893259048461914, "global_step": 587683, "epoch": 7080} {"train_loss": -28.034605026245117, "global_step": 587684, "epoch": 7080} {"train_loss": -27.994754791259766, "global_step": 587685, "epoch": 7080} {"train_loss": -27.884180068969727, "global_step": 587686, "epoch": 7080} {"train_loss": -28.392059326171875, "global_step": 587687, "epoch": 7080} {"train_loss": -28.251224517822266, "global_step": 587688, "epoch": 7080} {"train_loss": -27.964019775390625, "global_step": 587689, "epoch": 7080} {"train_loss": -28.1759033203125, "global_step": 587690, "epoch": 7080} {"train_loss": -28.30047607421875, "global_step": 587691, "epoch": 7080} {"train_loss": -28.254932403564453, "global_step": 587692, "epoch": 7080} {"train_loss": -27.870548248291016, "global_step": 587693, "epoch": 7080} {"train_loss": -27.99683952331543, "global_step": 587694, "epoch": 7080} {"train_loss": -28.00095558166504, "global_step": 587695, "epoch": 7080} {"train_loss": -27.91416358947754, "global_step": 587696, "epoch": 7080} {"train_loss": -28.009262084960938, "global_step": 587697, "epoch": 7080} {"train_loss": -28.192981719970703, "global_step": 587698, "epoch": 7080} {"train_loss": -27.93450927734375, "global_step": 587699, "epoch": 7080} {"train_loss": -28.074081420898438, "global_step": 587700, "epoch": 7080} {"train_loss": -28.016510009765625, "global_step": 587701, "epoch": 7080} {"train_loss": -28.015277862548828, "global_step": 587702, "epoch": 7080} {"train_loss": -27.838821411132812, "global_step": 587703, "epoch": 7080} {"train_loss": -27.891407012939453, "global_step": 587704, "epoch": 7080} {"train_loss": -28.196569442749023, "global_step": 587705, "epoch": 7080} {"train_loss": -27.583154678344727, "global_step": 587706, "epoch": 7080} {"train_loss": -27.3004093170166, "global_step": 587707, "epoch": 7080} {"train_loss": -27.13325309753418, "global_step": 587708, "epoch": 7080} {"train_loss": -27.2176456451416, "global_step": 587709, "epoch": 7080} {"train_loss": -27.55499267578125, "global_step": 587710, "epoch": 7080} {"train_loss": -28.041776657104492, "global_step": 587711, "epoch": 7080} {"train_loss": -27.8382625579834, "global_step": 587712, "epoch": 7080} {"train_loss": -27.937177658081055, "global_step": 587713, "epoch": 7080} {"train_loss": -27.77813148498535, "global_step": 587714, "epoch": 7080} {"train_loss": -28.18104362487793, "global_step": 587715, "epoch": 7080} {"train_loss": -27.60317039489746, "global_step": 587716, "epoch": 7080} {"train_loss": -27.931432723999023, "global_step": 587717, "epoch": 7080} {"train_loss": -27.6937255859375, "global_step": 587718, "epoch": 7080} {"train_loss": -28.305078506469727, "global_step": 587719, "epoch": 7080} {"train_loss": -28.028356552124023, "global_step": 587720, "epoch": 7080} {"train_loss": -27.539478302001953, "global_step": 587721, "epoch": 7080} {"train_loss": -27.857860565185547, "global_step": 587722, "epoch": 7080, "val_loss": 6531364.0} {"train_loss": -26.96956443786621, "global_step": 587723, "epoch": 7081} {"train_loss": -27.643280029296875, "global_step": 587724, "epoch": 7081} {"train_loss": -27.038726806640625, "global_step": 587725, "epoch": 7081} {"train_loss": -27.294164657592773, "global_step": 587726, "epoch": 7081} {"train_loss": -27.427453994750977, "global_step": 587727, "epoch": 7081} {"train_loss": -26.635419845581055, "global_step": 587728, "epoch": 7081} {"train_loss": -27.561838150024414, "global_step": 587729, "epoch": 7081} {"train_loss": -27.047016143798828, "global_step": 587730, "epoch": 7081} {"train_loss": -27.363256454467773, "global_step": 587731, "epoch": 7081} {"train_loss": -27.375045776367188, "global_step": 587732, "epoch": 7081} {"train_loss": -27.770837783813477, "global_step": 587733, "epoch": 7081} {"train_loss": -27.080427169799805, "global_step": 587734, "epoch": 7081} {"train_loss": -27.158491134643555, "global_step": 587735, "epoch": 7081} {"train_loss": -27.28985595703125, "global_step": 587736, "epoch": 7081} {"train_loss": -27.6543025970459, "global_step": 587737, "epoch": 7081} {"train_loss": -27.499792098999023, "global_step": 587738, "epoch": 7081} {"train_loss": -27.123737335205078, "global_step": 587739, "epoch": 7081} {"train_loss": -27.68186378479004, "global_step": 587740, "epoch": 7081} {"train_loss": -27.852340698242188, "global_step": 587741, "epoch": 7081} {"train_loss": -27.467056274414062, "global_step": 587742, "epoch": 7081} {"train_loss": -27.78301429748535, "global_step": 587743, "epoch": 7081} {"train_loss": -27.690847396850586, "global_step": 587744, "epoch": 7081} {"train_loss": -27.81204605102539, "global_step": 587745, "epoch": 7081} {"train_loss": -27.640600204467773, "global_step": 587746, "epoch": 7081} {"train_loss": -27.930194854736328, "global_step": 587747, "epoch": 7081} {"train_loss": -27.95161247253418, "global_step": 587748, "epoch": 7081} {"train_loss": -27.895360946655273, "global_step": 587749, "epoch": 7081} {"train_loss": -27.754255294799805, "global_step": 587750, "epoch": 7081} {"train_loss": -28.099180221557617, "global_step": 587751, "epoch": 7081} {"train_loss": -27.880207061767578, "global_step": 587752, "epoch": 7081} {"train_loss": -27.6219539642334, "global_step": 587753, "epoch": 7081} {"train_loss": -28.16084861755371, "global_step": 587754, "epoch": 7081} {"train_loss": -27.5297794342041, "global_step": 587755, "epoch": 7081} {"train_loss": -28.188385009765625, "global_step": 587756, "epoch": 7081} {"train_loss": -27.942541122436523, "global_step": 587757, "epoch": 7081} {"train_loss": -28.007659912109375, "global_step": 587758, "epoch": 7081} {"train_loss": -27.934341430664062, "global_step": 587759, "epoch": 7081} {"train_loss": -28.010635375976562, "global_step": 587760, "epoch": 7081} {"train_loss": -28.201704025268555, "global_step": 587761, "epoch": 7081} {"train_loss": -28.07391929626465, "global_step": 587762, "epoch": 7081} {"train_loss": -28.039945602416992, "global_step": 587763, "epoch": 7081} {"train_loss": -27.809844970703125, "global_step": 587764, "epoch": 7081} {"train_loss": -27.395864486694336, "global_step": 587765, "epoch": 7081} {"train_loss": -27.587909698486328, "global_step": 587766, "epoch": 7081} {"train_loss": -27.933820724487305, "global_step": 587767, "epoch": 7081} {"train_loss": -27.923053741455078, "global_step": 587768, "epoch": 7081} {"train_loss": -28.2589111328125, "global_step": 587769, "epoch": 7081} {"train_loss": -27.529163360595703, "global_step": 587770, "epoch": 7081} {"train_loss": -27.7623348236084, "global_step": 587771, "epoch": 7081} {"train_loss": -27.8385066986084, "global_step": 587772, "epoch": 7081} {"train_loss": -27.783796310424805, "global_step": 587773, "epoch": 7081} {"train_loss": -28.063833236694336, "global_step": 587774, "epoch": 7081} {"train_loss": -28.06074333190918, "global_step": 587775, "epoch": 7081} {"train_loss": -28.200387954711914, "global_step": 587776, "epoch": 7081} {"train_loss": -28.29999351501465, "global_step": 587777, "epoch": 7081} {"train_loss": -28.134540557861328, "global_step": 587778, "epoch": 7081} {"train_loss": -28.23109245300293, "global_step": 587779, "epoch": 7081} {"train_loss": -28.175024032592773, "global_step": 587780, "epoch": 7081} {"train_loss": -27.84583854675293, "global_step": 587781, "epoch": 7081} {"train_loss": -28.22602653503418, "global_step": 587782, "epoch": 7081} {"train_loss": -28.044620513916016, "global_step": 587783, "epoch": 7081} {"train_loss": -27.85065269470215, "global_step": 587784, "epoch": 7081} {"train_loss": -28.22332763671875, "global_step": 587785, "epoch": 7081} {"train_loss": -28.311071395874023, "global_step": 587786, "epoch": 7081} {"train_loss": -27.609638214111328, "global_step": 587787, "epoch": 7081} {"train_loss": -27.822385787963867, "global_step": 587788, "epoch": 7081} {"train_loss": -27.78960609436035, "global_step": 587789, "epoch": 7081} {"train_loss": -27.849090576171875, "global_step": 587790, "epoch": 7081} {"train_loss": -28.378042221069336, "global_step": 587791, "epoch": 7081} {"train_loss": -28.014907836914062, "global_step": 587792, "epoch": 7081} {"train_loss": -28.056543350219727, "global_step": 587793, "epoch": 7081} {"train_loss": -28.059274673461914, "global_step": 587794, "epoch": 7081} {"train_loss": -28.133544921875, "global_step": 587795, "epoch": 7081} {"train_loss": -27.797765731811523, "global_step": 587796, "epoch": 7081} {"train_loss": -28.26724624633789, "global_step": 587797, "epoch": 7081} {"train_loss": -28.117053985595703, "global_step": 587798, "epoch": 7081} {"train_loss": -28.259037017822266, "global_step": 587799, "epoch": 7081} {"train_loss": -27.963428497314453, "global_step": 587800, "epoch": 7081} {"train_loss": -27.888736724853516, "global_step": 587801, "epoch": 7081} {"train_loss": -27.76149559020996, "global_step": 587802, "epoch": 7081} {"train_loss": -28.133438110351562, "global_step": 587803, "epoch": 7081} {"train_loss": -28.26482582092285, "global_step": 587804, "epoch": 7081} {"train_loss": -27.82357854728239, "global_step": 587805, "epoch": 7081, "val_loss": 6597770.0} {"train_loss": -26.854902267456055, "global_step": 587806, "epoch": 7082} {"train_loss": -26.565900802612305, "global_step": 587807, "epoch": 7082} {"train_loss": -27.600351333618164, "global_step": 587808, "epoch": 7082} {"train_loss": -26.9467830657959, "global_step": 587809, "epoch": 7082} {"train_loss": -26.759679794311523, "global_step": 587810, "epoch": 7082} {"train_loss": -27.19777488708496, "global_step": 587811, "epoch": 7082} {"train_loss": -26.70025634765625, "global_step": 587812, "epoch": 7082} {"train_loss": -27.322851181030273, "global_step": 587813, "epoch": 7082} {"train_loss": -27.264867782592773, "global_step": 587814, "epoch": 7082} {"train_loss": -27.138660430908203, "global_step": 587815, "epoch": 7082} {"train_loss": -27.635034561157227, "global_step": 587816, "epoch": 7082} {"train_loss": -27.353153228759766, "global_step": 587817, "epoch": 7082} {"train_loss": -27.84189796447754, "global_step": 587818, "epoch": 7082} {"train_loss": -27.450321197509766, "global_step": 587819, "epoch": 7082} {"train_loss": -27.564489364624023, "global_step": 587820, "epoch": 7082} {"train_loss": -27.763763427734375, "global_step": 587821, "epoch": 7082} {"train_loss": -27.856735229492188, "global_step": 587822, "epoch": 7082} {"train_loss": -27.57452964782715, "global_step": 587823, "epoch": 7082} {"train_loss": -27.857431411743164, "global_step": 587824, "epoch": 7082} {"train_loss": -27.483367919921875, "global_step": 587825, "epoch": 7082} {"train_loss": -27.79572868347168, "global_step": 587826, "epoch": 7082} {"train_loss": -27.87506675720215, "global_step": 587827, "epoch": 7082} {"train_loss": -27.612756729125977, "global_step": 587828, "epoch": 7082} {"train_loss": -27.263858795166016, "global_step": 587829, "epoch": 7082} {"train_loss": -28.00455665588379, "global_step": 587830, "epoch": 7082} {"train_loss": -27.915842056274414, "global_step": 587831, "epoch": 7082} {"train_loss": -27.960254669189453, "global_step": 587832, "epoch": 7082} {"train_loss": -27.935932159423828, "global_step": 587833, "epoch": 7082} {"train_loss": -27.7235050201416, "global_step": 587834, "epoch": 7082} {"train_loss": -27.493398666381836, "global_step": 587835, "epoch": 7082} {"train_loss": -28.308218002319336, "global_step": 587836, "epoch": 7082} {"train_loss": -27.763132095336914, "global_step": 587837, "epoch": 7082} {"train_loss": -28.249969482421875, "global_step": 587838, "epoch": 7082} {"train_loss": -28.141876220703125, "global_step": 587839, "epoch": 7082} {"train_loss": -28.077041625976562, "global_step": 587840, "epoch": 7082} {"train_loss": -28.101654052734375, "global_step": 587841, "epoch": 7082} {"train_loss": -28.245609283447266, "global_step": 587842, "epoch": 7082} {"train_loss": -27.924707412719727, "global_step": 587843, "epoch": 7082} {"train_loss": -28.532135009765625, "global_step": 587844, "epoch": 7082} {"train_loss": -28.38624382019043, "global_step": 587845, "epoch": 7082} {"train_loss": -28.1599178314209, "global_step": 587846, "epoch": 7082} {"train_loss": -28.144800186157227, "global_step": 587847, "epoch": 7082} {"train_loss": -28.216711044311523, "global_step": 587848, "epoch": 7082} {"train_loss": -28.202442169189453, "global_step": 587849, "epoch": 7082} {"train_loss": -27.840696334838867, "global_step": 587850, "epoch": 7082} {"train_loss": -27.734167098999023, "global_step": 587851, "epoch": 7082} {"train_loss": -27.6260929107666, "global_step": 587852, "epoch": 7082} {"train_loss": -28.23489761352539, "global_step": 587853, "epoch": 7082} {"train_loss": -28.154874801635742, "global_step": 587854, "epoch": 7082} {"train_loss": -28.083698272705078, "global_step": 587855, "epoch": 7082} {"train_loss": -27.642541885375977, "global_step": 587856, "epoch": 7082} {"train_loss": -27.9406795501709, "global_step": 587857, "epoch": 7082} {"train_loss": -27.515859603881836, "global_step": 587858, "epoch": 7082} {"train_loss": -26.513456344604492, "global_step": 587859, "epoch": 7082} {"train_loss": -25.882543563842773, "global_step": 587860, "epoch": 7082} {"train_loss": -25.59602928161621, "global_step": 587861, "epoch": 7082} {"train_loss": -27.933216094970703, "global_step": 587862, "epoch": 7082} {"train_loss": -26.77312660217285, "global_step": 587863, "epoch": 7082} {"train_loss": -27.187061309814453, "global_step": 587864, "epoch": 7082} {"train_loss": -28.08978843688965, "global_step": 587865, "epoch": 7082} {"train_loss": -27.017805099487305, "global_step": 587866, "epoch": 7082} {"train_loss": -27.411518096923828, "global_step": 587867, "epoch": 7082} {"train_loss": -27.572402954101562, "global_step": 587868, "epoch": 7082} {"train_loss": -27.56028175354004, "global_step": 587869, "epoch": 7082} {"train_loss": -27.1668643951416, "global_step": 587870, "epoch": 7082} {"train_loss": -27.622074127197266, "global_step": 587871, "epoch": 7082} {"train_loss": -27.311115264892578, "global_step": 587872, "epoch": 7082} {"train_loss": -27.629032135009766, "global_step": 587873, "epoch": 7082} {"train_loss": -27.392078399658203, "global_step": 587874, "epoch": 7082} {"train_loss": -27.596914291381836, "global_step": 587875, "epoch": 7082} {"train_loss": -28.14414405822754, "global_step": 587876, "epoch": 7082} {"train_loss": -27.762344360351562, "global_step": 587877, "epoch": 7082} {"train_loss": -27.415449142456055, "global_step": 587878, "epoch": 7082} {"train_loss": -28.085134506225586, "global_step": 587879, "epoch": 7082} {"train_loss": -27.38462257385254, "global_step": 587880, "epoch": 7082} {"train_loss": -27.693511962890625, "global_step": 587881, "epoch": 7082} {"train_loss": -27.842060089111328, "global_step": 587882, "epoch": 7082} {"train_loss": -27.247251510620117, "global_step": 587883, "epoch": 7082} {"train_loss": -27.63982582092285, "global_step": 587884, "epoch": 7082} {"train_loss": -27.900705337524414, "global_step": 587885, "epoch": 7082} {"train_loss": -27.833515167236328, "global_step": 587886, "epoch": 7082} {"train_loss": -27.537179946899414, "global_step": 587887, "epoch": 7082} {"train_loss": -27.617817821272883, "global_step": 587888, "epoch": 7082, "val_loss": 6579416.0} {"train_loss": -27.413928985595703, "global_step": 587889, "epoch": 7083} {"train_loss": -27.534635543823242, "global_step": 587890, "epoch": 7083} {"train_loss": -27.627944946289062, "global_step": 587891, "epoch": 7083} {"train_loss": -27.271482467651367, "global_step": 587892, "epoch": 7083} {"train_loss": -27.0345458984375, "global_step": 587893, "epoch": 7083} {"train_loss": -27.415374755859375, "global_step": 587894, "epoch": 7083} {"train_loss": -27.546222686767578, "global_step": 587895, "epoch": 7083} {"train_loss": -27.696699142456055, "global_step": 587896, "epoch": 7083} {"train_loss": -27.47406005859375, "global_step": 587897, "epoch": 7083} {"train_loss": -28.062650680541992, "global_step": 587898, "epoch": 7083} {"train_loss": -27.633764266967773, "global_step": 587899, "epoch": 7083} {"train_loss": -27.75628089904785, "global_step": 587900, "epoch": 7083} {"train_loss": -27.945560455322266, "global_step": 587901, "epoch": 7083} {"train_loss": -27.496023178100586, "global_step": 587902, "epoch": 7083} {"train_loss": -27.80586051940918, "global_step": 587903, "epoch": 7083} {"train_loss": -27.899999618530273, "global_step": 587904, "epoch": 7083} {"train_loss": -27.562427520751953, "global_step": 587905, "epoch": 7083} {"train_loss": -27.9840087890625, "global_step": 587906, "epoch": 7083} {"train_loss": -27.677457809448242, "global_step": 587907, "epoch": 7083} {"train_loss": -28.045047760009766, "global_step": 587908, "epoch": 7083} {"train_loss": -27.63114356994629, "global_step": 587909, "epoch": 7083} {"train_loss": -28.0693359375, "global_step": 587910, "epoch": 7083} {"train_loss": -27.70075035095215, "global_step": 587911, "epoch": 7083} {"train_loss": -28.032398223876953, "global_step": 587912, "epoch": 7083} {"train_loss": -27.828855514526367, "global_step": 587913, "epoch": 7083} {"train_loss": -28.058115005493164, "global_step": 587914, "epoch": 7083} {"train_loss": -27.81131362915039, "global_step": 587915, "epoch": 7083} {"train_loss": -27.78759765625, "global_step": 587916, "epoch": 7083} {"train_loss": -27.99674415588379, "global_step": 587917, "epoch": 7083} {"train_loss": -27.7252254486084, "global_step": 587918, "epoch": 7083} {"train_loss": -28.241668701171875, "global_step": 587919, "epoch": 7083} {"train_loss": -27.90825843811035, "global_step": 587920, "epoch": 7083} {"train_loss": -27.6038875579834, "global_step": 587921, "epoch": 7083} {"train_loss": -27.892187118530273, "global_step": 587922, "epoch": 7083} {"train_loss": -27.796722412109375, "global_step": 587923, "epoch": 7083} {"train_loss": -27.741474151611328, "global_step": 587924, "epoch": 7083} {"train_loss": -27.709115982055664, "global_step": 587925, "epoch": 7083} {"train_loss": -27.7587890625, "global_step": 587926, "epoch": 7083} {"train_loss": -28.011463165283203, "global_step": 587927, "epoch": 7083} {"train_loss": -28.299457550048828, "global_step": 587928, "epoch": 7083} {"train_loss": -28.357900619506836, "global_step": 587929, "epoch": 7083} {"train_loss": -28.217208862304688, "global_step": 587930, "epoch": 7083} {"train_loss": -28.015634536743164, "global_step": 587931, "epoch": 7083} {"train_loss": -28.098302841186523, "global_step": 587932, "epoch": 7083} {"train_loss": -28.067890167236328, "global_step": 587933, "epoch": 7083} {"train_loss": -27.854400634765625, "global_step": 587934, "epoch": 7083} {"train_loss": -27.872241973876953, "global_step": 587935, "epoch": 7083} {"train_loss": -27.9256649017334, "global_step": 587936, "epoch": 7083} {"train_loss": -27.99420738220215, "global_step": 587937, "epoch": 7083} {"train_loss": -27.684040069580078, "global_step": 587938, "epoch": 7083} {"train_loss": -28.22389030456543, "global_step": 587939, "epoch": 7083} {"train_loss": -28.126394271850586, "global_step": 587940, "epoch": 7083} {"train_loss": -27.911237716674805, "global_step": 587941, "epoch": 7083} {"train_loss": -27.333709716796875, "global_step": 587942, "epoch": 7083} {"train_loss": -27.93408203125, "global_step": 587943, "epoch": 7083} {"train_loss": -28.111310958862305, "global_step": 587944, "epoch": 7083} {"train_loss": -28.048925399780273, "global_step": 587945, "epoch": 7083} {"train_loss": -27.564044952392578, "global_step": 587946, "epoch": 7083} {"train_loss": -28.099756240844727, "global_step": 587947, "epoch": 7083} {"train_loss": -28.219104766845703, "global_step": 587948, "epoch": 7083} {"train_loss": -28.026535034179688, "global_step": 587949, "epoch": 7083} {"train_loss": -28.276025772094727, "global_step": 587950, "epoch": 7083} {"train_loss": -28.113759994506836, "global_step": 587951, "epoch": 7083} {"train_loss": -27.795368194580078, "global_step": 587952, "epoch": 7083} {"train_loss": -28.186511993408203, "global_step": 587953, "epoch": 7083} {"train_loss": -27.878698348999023, "global_step": 587954, "epoch": 7083} {"train_loss": -28.11577796936035, "global_step": 587955, "epoch": 7083} {"train_loss": -28.31171226501465, "global_step": 587956, "epoch": 7083} {"train_loss": -27.92766761779785, "global_step": 587957, "epoch": 7083} {"train_loss": -28.3124942779541, "global_step": 587958, "epoch": 7083} {"train_loss": -27.787445068359375, "global_step": 587959, "epoch": 7083} {"train_loss": -28.210983276367188, "global_step": 587960, "epoch": 7083} {"train_loss": -28.382312774658203, "global_step": 587961, "epoch": 7083} {"train_loss": -28.424121856689453, "global_step": 587962, "epoch": 7083} {"train_loss": -28.015888214111328, "global_step": 587963, "epoch": 7083} {"train_loss": -28.557666778564453, "global_step": 587964, "epoch": 7083} {"train_loss": -28.1361141204834, "global_step": 587965, "epoch": 7083} {"train_loss": -28.093433380126953, "global_step": 587966, "epoch": 7083} {"train_loss": -27.95596694946289, "global_step": 587967, "epoch": 7083} {"train_loss": -28.041410446166992, "global_step": 587968, "epoch": 7083} {"train_loss": -27.936315536499023, "global_step": 587969, "epoch": 7083} {"train_loss": -27.994421005249023, "global_step": 587970, "epoch": 7083} {"train_loss": -27.917013926678393, "global_step": 587971, "epoch": 7083, "val_loss": 6578624.5} {"train_loss": -27.3948974609375, "global_step": 587972, "epoch": 7084} {"train_loss": -26.233871459960938, "global_step": 587973, "epoch": 7084} {"train_loss": -26.5151309967041, "global_step": 587974, "epoch": 7084} {"train_loss": -27.402099609375, "global_step": 587975, "epoch": 7084} {"train_loss": -26.12476921081543, "global_step": 587976, "epoch": 7084} {"train_loss": -27.575336456298828, "global_step": 587977, "epoch": 7084} {"train_loss": -27.4233455657959, "global_step": 587978, "epoch": 7084} {"train_loss": -27.18001365661621, "global_step": 587979, "epoch": 7084} {"train_loss": -27.49500846862793, "global_step": 587980, "epoch": 7084} {"train_loss": -27.111923217773438, "global_step": 587981, "epoch": 7084} {"train_loss": -27.423887252807617, "global_step": 587982, "epoch": 7084} {"train_loss": -27.492446899414062, "global_step": 587983, "epoch": 7084} {"train_loss": -27.56037712097168, "global_step": 587984, "epoch": 7084} {"train_loss": -27.04827308654785, "global_step": 587985, "epoch": 7084} {"train_loss": -27.610647201538086, "global_step": 587986, "epoch": 7084} {"train_loss": -27.435272216796875, "global_step": 587987, "epoch": 7084} {"train_loss": -27.679845809936523, "global_step": 587988, "epoch": 7084} {"train_loss": -27.6453800201416, "global_step": 587989, "epoch": 7084} {"train_loss": -27.75164222717285, "global_step": 587990, "epoch": 7084} {"train_loss": -27.707447052001953, "global_step": 587991, "epoch": 7084} {"train_loss": -27.664581298828125, "global_step": 587992, "epoch": 7084} {"train_loss": -27.593061447143555, "global_step": 587993, "epoch": 7084} {"train_loss": -27.372480392456055, "global_step": 587994, "epoch": 7084} {"train_loss": -27.856042861938477, "global_step": 587995, "epoch": 7084} {"train_loss": -27.47509765625, "global_step": 587996, "epoch": 7084} {"train_loss": -27.59329605102539, "global_step": 587997, "epoch": 7084} {"train_loss": -27.639692306518555, "global_step": 587998, "epoch": 7084} {"train_loss": -27.8632869720459, "global_step": 587999, "epoch": 7084} {"train_loss": -27.760950088500977, "global_step": 588000, "epoch": 7084} {"train_loss": -27.572473526000977, "global_step": 588001, "epoch": 7084} {"train_loss": -28.057147979736328, "global_step": 588002, "epoch": 7084} {"train_loss": -27.785018920898438, "global_step": 588003, "epoch": 7084} {"train_loss": -27.854007720947266, "global_step": 588004, "epoch": 7084} {"train_loss": -27.993932723999023, "global_step": 588005, "epoch": 7084} {"train_loss": -27.784381866455078, "global_step": 588006, "epoch": 7084} {"train_loss": -28.055540084838867, "global_step": 588007, "epoch": 7084} {"train_loss": -27.78157615661621, "global_step": 588008, "epoch": 7084} {"train_loss": -27.724353790283203, "global_step": 588009, "epoch": 7084} {"train_loss": -28.002777099609375, "global_step": 588010, "epoch": 7084} {"train_loss": -27.634252548217773, "global_step": 588011, "epoch": 7084} {"train_loss": -28.109472274780273, "global_step": 588012, "epoch": 7084} {"train_loss": -28.101547241210938, "global_step": 588013, "epoch": 7084} {"train_loss": -27.732318878173828, "global_step": 588014, "epoch": 7084} {"train_loss": -28.21083641052246, "global_step": 588015, "epoch": 7084} {"train_loss": -28.023672103881836, "global_step": 588016, "epoch": 7084} {"train_loss": -28.136981964111328, "global_step": 588017, "epoch": 7084} {"train_loss": -28.187702178955078, "global_step": 588018, "epoch": 7084} {"train_loss": -27.96823501586914, "global_step": 588019, "epoch": 7084} {"train_loss": -28.30948829650879, "global_step": 588020, "epoch": 7084} {"train_loss": -28.2561092376709, "global_step": 588021, "epoch": 7084} {"train_loss": -28.447132110595703, "global_step": 588022, "epoch": 7084} {"train_loss": -27.749252319335938, "global_step": 588023, "epoch": 7084} {"train_loss": -28.001489639282227, "global_step": 588024, "epoch": 7084} {"train_loss": -28.331817626953125, "global_step": 588025, "epoch": 7084} {"train_loss": -27.871740341186523, "global_step": 588026, "epoch": 7084} {"train_loss": -28.213857650756836, "global_step": 588027, "epoch": 7084} {"train_loss": -28.165481567382812, "global_step": 588028, "epoch": 7084} {"train_loss": -27.866758346557617, "global_step": 588029, "epoch": 7084} {"train_loss": -28.406965255737305, "global_step": 588030, "epoch": 7084} {"train_loss": -28.337793350219727, "global_step": 588031, "epoch": 7084} {"train_loss": -27.896493911743164, "global_step": 588032, "epoch": 7084} {"train_loss": -27.9532470703125, "global_step": 588033, "epoch": 7084} {"train_loss": -27.8089599609375, "global_step": 588034, "epoch": 7084} {"train_loss": -28.15692138671875, "global_step": 588035, "epoch": 7084} {"train_loss": -28.519739151000977, "global_step": 588036, "epoch": 7084} {"train_loss": -27.81488037109375, "global_step": 588037, "epoch": 7084} {"train_loss": -28.32698631286621, "global_step": 588038, "epoch": 7084} {"train_loss": -28.19504165649414, "global_step": 588039, "epoch": 7084} {"train_loss": -28.05074119567871, "global_step": 588040, "epoch": 7084} {"train_loss": -28.04428482055664, "global_step": 588041, "epoch": 7084} {"train_loss": -27.827985763549805, "global_step": 588042, "epoch": 7084} {"train_loss": -27.91908836364746, "global_step": 588043, "epoch": 7084} {"train_loss": -28.1181583404541, "global_step": 588044, "epoch": 7084} {"train_loss": -27.986066818237305, "global_step": 588045, "epoch": 7084} {"train_loss": -28.377897262573242, "global_step": 588046, "epoch": 7084} {"train_loss": -28.078582763671875, "global_step": 588047, "epoch": 7084} {"train_loss": -28.043563842773438, "global_step": 588048, "epoch": 7084} {"train_loss": -28.274112701416016, "global_step": 588049, "epoch": 7084} {"train_loss": -27.9916934967041, "global_step": 588050, "epoch": 7084} {"train_loss": -28.129562377929688, "global_step": 588051, "epoch": 7084} {"train_loss": -28.001117706298828, "global_step": 588052, "epoch": 7084} {"train_loss": -28.00419044494629, "global_step": 588053, "epoch": 7084} {"train_loss": -27.81279816684953, "global_step": 588054, "epoch": 7084, "val_loss": 6601873.0} {"train_loss": -27.21221351623535, "global_step": 588055, "epoch": 7085} {"train_loss": -26.526288986206055, "global_step": 588056, "epoch": 7085} {"train_loss": -26.58233070373535, "global_step": 588057, "epoch": 7085} {"train_loss": -26.3160400390625, "global_step": 588058, "epoch": 7085} {"train_loss": -24.8964786529541, "global_step": 588059, "epoch": 7085} {"train_loss": -25.161325454711914, "global_step": 588060, "epoch": 7085} {"train_loss": -26.750030517578125, "global_step": 588061, "epoch": 7085} {"train_loss": -26.905237197875977, "global_step": 588062, "epoch": 7085} {"train_loss": -26.24485206604004, "global_step": 588063, "epoch": 7085} {"train_loss": -27.381994247436523, "global_step": 588064, "epoch": 7085} {"train_loss": -26.696826934814453, "global_step": 588065, "epoch": 7085} {"train_loss": -27.328866958618164, "global_step": 588066, "epoch": 7085} {"train_loss": -26.92180824279785, "global_step": 588067, "epoch": 7085} {"train_loss": -27.103506088256836, "global_step": 588068, "epoch": 7085} {"train_loss": -27.4174861907959, "global_step": 588069, "epoch": 7085} {"train_loss": -27.25630760192871, "global_step": 588070, "epoch": 7085} {"train_loss": -27.674585342407227, "global_step": 588071, "epoch": 7085} {"train_loss": -27.571256637573242, "global_step": 588072, "epoch": 7085} {"train_loss": -27.092172622680664, "global_step": 588073, "epoch": 7085} {"train_loss": -27.52143669128418, "global_step": 588074, "epoch": 7085} {"train_loss": -27.448776245117188, "global_step": 588075, "epoch": 7085} {"train_loss": -27.487979888916016, "global_step": 588076, "epoch": 7085} {"train_loss": -27.77292823791504, "global_step": 588077, "epoch": 7085} {"train_loss": -27.690458297729492, "global_step": 588078, "epoch": 7085} {"train_loss": -27.7408390045166, "global_step": 588079, "epoch": 7085} {"train_loss": -27.644384384155273, "global_step": 588080, "epoch": 7085} {"train_loss": -28.105005264282227, "global_step": 588081, "epoch": 7085} {"train_loss": -27.690176010131836, "global_step": 588082, "epoch": 7085} {"train_loss": -27.829071044921875, "global_step": 588083, "epoch": 7085} {"train_loss": -27.621923446655273, "global_step": 588084, "epoch": 7085} {"train_loss": -28.151264190673828, "global_step": 588085, "epoch": 7085} {"train_loss": -27.789398193359375, "global_step": 588086, "epoch": 7085} {"train_loss": -27.876026153564453, "global_step": 588087, "epoch": 7085} {"train_loss": -27.999441146850586, "global_step": 588088, "epoch": 7085} {"train_loss": -27.91352653503418, "global_step": 588089, "epoch": 7085} {"train_loss": -27.730743408203125, "global_step": 588090, "epoch": 7085} {"train_loss": -28.081451416015625, "global_step": 588091, "epoch": 7085} {"train_loss": -27.911718368530273, "global_step": 588092, "epoch": 7085} {"train_loss": -28.405282974243164, "global_step": 588093, "epoch": 7085} {"train_loss": -28.256973266601562, "global_step": 588094, "epoch": 7085} {"train_loss": -28.104583740234375, "global_step": 588095, "epoch": 7085} {"train_loss": -27.828811645507812, "global_step": 588096, "epoch": 7085} {"train_loss": -27.947111129760742, "global_step": 588097, "epoch": 7085} {"train_loss": -27.6759033203125, "global_step": 588098, "epoch": 7085} {"train_loss": -28.351337432861328, "global_step": 588099, "epoch": 7085} {"train_loss": -28.023061752319336, "global_step": 588100, "epoch": 7085} {"train_loss": -28.520313262939453, "global_step": 588101, "epoch": 7085} {"train_loss": -27.987014770507812, "global_step": 588102, "epoch": 7085} {"train_loss": -27.63168716430664, "global_step": 588103, "epoch": 7085} {"train_loss": -28.04497718811035, "global_step": 588104, "epoch": 7085} {"train_loss": -28.097808837890625, "global_step": 588105, "epoch": 7085} {"train_loss": -28.213666915893555, "global_step": 588106, "epoch": 7085} {"train_loss": -27.631078720092773, "global_step": 588107, "epoch": 7085} {"train_loss": -27.57303810119629, "global_step": 588108, "epoch": 7085} {"train_loss": -27.671478271484375, "global_step": 588109, "epoch": 7085} {"train_loss": -27.587696075439453, "global_step": 588110, "epoch": 7085} {"train_loss": -27.69563865661621, "global_step": 588111, "epoch": 7085} {"train_loss": -27.7822265625, "global_step": 588112, "epoch": 7085} {"train_loss": -27.766448974609375, "global_step": 588113, "epoch": 7085} {"train_loss": -27.765472412109375, "global_step": 588114, "epoch": 7085} {"train_loss": -28.005111694335938, "global_step": 588115, "epoch": 7085} {"train_loss": -27.984167098999023, "global_step": 588116, "epoch": 7085} {"train_loss": -28.070642471313477, "global_step": 588117, "epoch": 7085} {"train_loss": -28.17042350769043, "global_step": 588118, "epoch": 7085} {"train_loss": -28.270614624023438, "global_step": 588119, "epoch": 7085} {"train_loss": -28.214035034179688, "global_step": 588120, "epoch": 7085} {"train_loss": -28.3389949798584, "global_step": 588121, "epoch": 7085} {"train_loss": -28.196374893188477, "global_step": 588122, "epoch": 7085} {"train_loss": -28.208959579467773, "global_step": 588123, "epoch": 7085} {"train_loss": -28.067367553710938, "global_step": 588124, "epoch": 7085} {"train_loss": -27.853513717651367, "global_step": 588125, "epoch": 7085} {"train_loss": -28.183019638061523, "global_step": 588126, "epoch": 7085} {"train_loss": -28.257831573486328, "global_step": 588127, "epoch": 7085} {"train_loss": -27.836673736572266, "global_step": 588128, "epoch": 7085} {"train_loss": -28.143030166625977, "global_step": 588129, "epoch": 7085} {"train_loss": -28.155820846557617, "global_step": 588130, "epoch": 7085} {"train_loss": -28.210622787475586, "global_step": 588131, "epoch": 7085} {"train_loss": -28.300607681274414, "global_step": 588132, "epoch": 7085} {"train_loss": -28.068439483642578, "global_step": 588133, "epoch": 7085} {"train_loss": -28.187393188476562, "global_step": 588134, "epoch": 7085} {"train_loss": -27.940290451049805, "global_step": 588135, "epoch": 7085} {"train_loss": -28.326358795166016, "global_step": 588136, "epoch": 7085} {"train_loss": -27.69361532739846, "global_step": 588137, "epoch": 7085, "val_loss": 6656488.0} {"train_loss": -27.63080406188965, "global_step": 588138, "epoch": 7086} {"train_loss": -26.875951766967773, "global_step": 588139, "epoch": 7086} {"train_loss": -26.62917137145996, "global_step": 588140, "epoch": 7086} {"train_loss": -27.226240158081055, "global_step": 588141, "epoch": 7086} {"train_loss": -27.651020050048828, "global_step": 588142, "epoch": 7086} {"train_loss": -27.31525230407715, "global_step": 588143, "epoch": 7086} {"train_loss": -27.45366859436035, "global_step": 588144, "epoch": 7086} {"train_loss": -27.76267433166504, "global_step": 588145, "epoch": 7086} {"train_loss": -27.762664794921875, "global_step": 588146, "epoch": 7086} {"train_loss": -27.45231056213379, "global_step": 588147, "epoch": 7086} {"train_loss": -27.736103057861328, "global_step": 588148, "epoch": 7086} {"train_loss": -27.75433921813965, "global_step": 588149, "epoch": 7086} {"train_loss": -27.528852462768555, "global_step": 588150, "epoch": 7086} {"train_loss": -27.643207550048828, "global_step": 588151, "epoch": 7086} {"train_loss": -27.6538028717041, "global_step": 588152, "epoch": 7086} {"train_loss": -27.913305282592773, "global_step": 588153, "epoch": 7086} {"train_loss": -27.862762451171875, "global_step": 588154, "epoch": 7086} {"train_loss": -27.427438735961914, "global_step": 588155, "epoch": 7086} {"train_loss": -27.91876220703125, "global_step": 588156, "epoch": 7086} {"train_loss": -27.704160690307617, "global_step": 588157, "epoch": 7086} {"train_loss": -28.137231826782227, "global_step": 588158, "epoch": 7086} {"train_loss": -27.704483032226562, "global_step": 588159, "epoch": 7086} {"train_loss": -27.77425193786621, "global_step": 588160, "epoch": 7086} {"train_loss": -28.459381103515625, "global_step": 588161, "epoch": 7086} {"train_loss": -27.880231857299805, "global_step": 588162, "epoch": 7086} {"train_loss": -28.108320236206055, "global_step": 588163, "epoch": 7086} {"train_loss": -27.8872013092041, "global_step": 588164, "epoch": 7086} {"train_loss": -27.767398834228516, "global_step": 588165, "epoch": 7086} {"train_loss": -27.751428604125977, "global_step": 588166, "epoch": 7086} {"train_loss": -27.920120239257812, "global_step": 588167, "epoch": 7086} {"train_loss": -28.06492042541504, "global_step": 588168, "epoch": 7086} {"train_loss": -27.907978057861328, "global_step": 588169, "epoch": 7086} {"train_loss": -27.934497833251953, "global_step": 588170, "epoch": 7086} {"train_loss": -28.001333236694336, "global_step": 588171, "epoch": 7086} {"train_loss": -27.9440975189209, "global_step": 588172, "epoch": 7086} {"train_loss": -28.3076229095459, "global_step": 588173, "epoch": 7086} {"train_loss": -28.151594161987305, "global_step": 588174, "epoch": 7086} {"train_loss": -27.781005859375, "global_step": 588175, "epoch": 7086} {"train_loss": -27.937744140625, "global_step": 588176, "epoch": 7086} {"train_loss": -27.95454216003418, "global_step": 588177, "epoch": 7086} {"train_loss": -28.391189575195312, "global_step": 588178, "epoch": 7086} {"train_loss": -27.953168869018555, "global_step": 588179, "epoch": 7086} {"train_loss": -28.238178253173828, "global_step": 588180, "epoch": 7086} {"train_loss": -28.00540542602539, "global_step": 588181, "epoch": 7086} {"train_loss": -28.1899356842041, "global_step": 588182, "epoch": 7086} {"train_loss": -28.025419235229492, "global_step": 588183, "epoch": 7086} {"train_loss": -28.27131462097168, "global_step": 588184, "epoch": 7086} {"train_loss": -28.20941162109375, "global_step": 588185, "epoch": 7086} {"train_loss": -28.073596954345703, "global_step": 588186, "epoch": 7086} {"train_loss": -28.423675537109375, "global_step": 588187, "epoch": 7086} {"train_loss": -28.30984878540039, "global_step": 588188, "epoch": 7086} {"train_loss": -28.16839599609375, "global_step": 588189, "epoch": 7086} {"train_loss": -27.780139923095703, "global_step": 588190, "epoch": 7086} {"train_loss": -28.228687286376953, "global_step": 588191, "epoch": 7086} {"train_loss": -28.242963790893555, "global_step": 588192, "epoch": 7086} {"train_loss": -28.427350997924805, "global_step": 588193, "epoch": 7086} {"train_loss": -28.238758087158203, "global_step": 588194, "epoch": 7086} {"train_loss": -28.253559112548828, "global_step": 588195, "epoch": 7086} {"train_loss": -28.138580322265625, "global_step": 588196, "epoch": 7086} {"train_loss": -28.16963005065918, "global_step": 588197, "epoch": 7086} {"train_loss": -28.20953369140625, "global_step": 588198, "epoch": 7086} {"train_loss": -28.097064971923828, "global_step": 588199, "epoch": 7086} {"train_loss": -28.04636573791504, "global_step": 588200, "epoch": 7086} {"train_loss": -27.870746612548828, "global_step": 588201, "epoch": 7086} {"train_loss": -27.5578670501709, "global_step": 588202, "epoch": 7086} {"train_loss": -26.450519561767578, "global_step": 588203, "epoch": 7086} {"train_loss": -26.707672119140625, "global_step": 588204, "epoch": 7086} {"train_loss": -27.63567543029785, "global_step": 588205, "epoch": 7086} {"train_loss": -27.6397762298584, "global_step": 588206, "epoch": 7086} {"train_loss": -26.923070907592773, "global_step": 588207, "epoch": 7086} {"train_loss": -27.786865234375, "global_step": 588208, "epoch": 7086} {"train_loss": -27.37400245666504, "global_step": 588209, "epoch": 7086} {"train_loss": -28.056299209594727, "global_step": 588210, "epoch": 7086} {"train_loss": -27.413965225219727, "global_step": 588211, "epoch": 7086} {"train_loss": -27.71466636657715, "global_step": 588212, "epoch": 7086} {"train_loss": -27.378210067749023, "global_step": 588213, "epoch": 7086} {"train_loss": -27.94129753112793, "global_step": 588214, "epoch": 7086} {"train_loss": -27.468826293945312, "global_step": 588215, "epoch": 7086} {"train_loss": -27.280282974243164, "global_step": 588216, "epoch": 7086} {"train_loss": -27.390426635742188, "global_step": 588217, "epoch": 7086} {"train_loss": -26.93372917175293, "global_step": 588218, "epoch": 7086} {"train_loss": -27.909509658813477, "global_step": 588219, "epoch": 7086} {"train_loss": -27.80886964912874, "global_step": 588220, "epoch": 7086, "val_loss": 6705452.0} {"train_loss": -26.359882354736328, "global_step": 588221, "epoch": 7087} {"train_loss": -26.849576950073242, "global_step": 588222, "epoch": 7087} {"train_loss": -26.75211524963379, "global_step": 588223, "epoch": 7087} {"train_loss": -27.00008201599121, "global_step": 588224, "epoch": 7087} {"train_loss": -27.19624137878418, "global_step": 588225, "epoch": 7087} {"train_loss": -27.2817325592041, "global_step": 588226, "epoch": 7087} {"train_loss": -27.42999839782715, "global_step": 588227, "epoch": 7087} {"train_loss": -27.405792236328125, "global_step": 588228, "epoch": 7087} {"train_loss": -27.575788497924805, "global_step": 588229, "epoch": 7087} {"train_loss": -27.28533935546875, "global_step": 588230, "epoch": 7087} {"train_loss": -27.63370132446289, "global_step": 588231, "epoch": 7087} {"train_loss": -27.70832633972168, "global_step": 588232, "epoch": 7087} {"train_loss": -27.51116371154785, "global_step": 588233, "epoch": 7087} {"train_loss": -27.716398239135742, "global_step": 588234, "epoch": 7087} {"train_loss": -27.37116813659668, "global_step": 588235, "epoch": 7087} {"train_loss": -27.881946563720703, "global_step": 588236, "epoch": 7087} {"train_loss": -27.441909790039062, "global_step": 588237, "epoch": 7087} {"train_loss": -27.562957763671875, "global_step": 588238, "epoch": 7087} {"train_loss": -27.810522079467773, "global_step": 588239, "epoch": 7087} {"train_loss": -27.827905654907227, "global_step": 588240, "epoch": 7087} {"train_loss": -27.658344268798828, "global_step": 588241, "epoch": 7087} {"train_loss": -27.644895553588867, "global_step": 588242, "epoch": 7087} {"train_loss": -27.481977462768555, "global_step": 588243, "epoch": 7087} {"train_loss": -27.799039840698242, "global_step": 588244, "epoch": 7087} {"train_loss": -28.01038932800293, "global_step": 588245, "epoch": 7087} {"train_loss": -27.667383193969727, "global_step": 588246, "epoch": 7087} {"train_loss": -27.5782470703125, "global_step": 588247, "epoch": 7087} {"train_loss": -27.946949005126953, "global_step": 588248, "epoch": 7087} {"train_loss": -27.725793838500977, "global_step": 588249, "epoch": 7087} {"train_loss": -28.065454483032227, "global_step": 588250, "epoch": 7087} {"train_loss": -27.925607681274414, "global_step": 588251, "epoch": 7087} {"train_loss": -28.219839096069336, "global_step": 588252, "epoch": 7087} {"train_loss": -27.948163986206055, "global_step": 588253, "epoch": 7087} {"train_loss": -27.746505737304688, "global_step": 588254, "epoch": 7087} {"train_loss": -28.1487979888916, "global_step": 588255, "epoch": 7087} {"train_loss": -27.889394760131836, "global_step": 588256, "epoch": 7087} {"train_loss": -27.916034698486328, "global_step": 588257, "epoch": 7087} {"train_loss": -27.863605499267578, "global_step": 588258, "epoch": 7087} {"train_loss": -27.762121200561523, "global_step": 588259, "epoch": 7087} {"train_loss": -28.051849365234375, "global_step": 588260, "epoch": 7087} {"train_loss": -28.187061309814453, "global_step": 588261, "epoch": 7087} {"train_loss": -28.34968376159668, "global_step": 588262, "epoch": 7087} {"train_loss": -27.9800968170166, "global_step": 588263, "epoch": 7087} {"train_loss": -28.118066787719727, "global_step": 588264, "epoch": 7087} {"train_loss": -28.192230224609375, "global_step": 588265, "epoch": 7087} {"train_loss": -28.09474754333496, "global_step": 588266, "epoch": 7087} {"train_loss": -28.62666130065918, "global_step": 588267, "epoch": 7087} {"train_loss": -28.19571876525879, "global_step": 588268, "epoch": 7087} {"train_loss": -28.25701332092285, "global_step": 588269, "epoch": 7087} {"train_loss": -28.248981475830078, "global_step": 588270, "epoch": 7087} {"train_loss": -28.456586837768555, "global_step": 588271, "epoch": 7087} {"train_loss": -28.036771774291992, "global_step": 588272, "epoch": 7087} {"train_loss": -28.366037368774414, "global_step": 588273, "epoch": 7087} {"train_loss": -27.991491317749023, "global_step": 588274, "epoch": 7087} {"train_loss": -28.09796142578125, "global_step": 588275, "epoch": 7087} {"train_loss": -28.4301815032959, "global_step": 588276, "epoch": 7087} {"train_loss": -27.779529571533203, "global_step": 588277, "epoch": 7087} {"train_loss": -28.376163482666016, "global_step": 588278, "epoch": 7087} {"train_loss": -28.177343368530273, "global_step": 588279, "epoch": 7087} {"train_loss": -28.01874351501465, "global_step": 588280, "epoch": 7087} {"train_loss": -27.965808868408203, "global_step": 588281, "epoch": 7087} {"train_loss": -28.420385360717773, "global_step": 588282, "epoch": 7087} {"train_loss": -28.022430419921875, "global_step": 588283, "epoch": 7087} {"train_loss": -28.18885612487793, "global_step": 588284, "epoch": 7087} {"train_loss": -27.98688316345215, "global_step": 588285, "epoch": 7087} {"train_loss": -28.245214462280273, "global_step": 588286, "epoch": 7087} {"train_loss": -28.188587188720703, "global_step": 588287, "epoch": 7087} {"train_loss": -27.87278175354004, "global_step": 588288, "epoch": 7087} {"train_loss": -27.950475692749023, "global_step": 588289, "epoch": 7087} {"train_loss": -28.11500358581543, "global_step": 588290, "epoch": 7087} {"train_loss": -28.067590713500977, "global_step": 588291, "epoch": 7087} {"train_loss": -28.360761642456055, "global_step": 588292, "epoch": 7087} {"train_loss": -28.24679946899414, "global_step": 588293, "epoch": 7087} {"train_loss": -28.133041381835938, "global_step": 588294, "epoch": 7087} {"train_loss": -28.024005889892578, "global_step": 588295, "epoch": 7087} {"train_loss": -28.240121841430664, "global_step": 588296, "epoch": 7087} {"train_loss": -28.09267234802246, "global_step": 588297, "epoch": 7087} {"train_loss": -27.844070434570312, "global_step": 588298, "epoch": 7087} {"train_loss": -27.81195068359375, "global_step": 588299, "epoch": 7087} {"train_loss": -28.06385612487793, "global_step": 588300, "epoch": 7087} {"train_loss": -27.540271759033203, "global_step": 588301, "epoch": 7087} {"train_loss": -27.69036865234375, "global_step": 588302, "epoch": 7087} {"train_loss": -27.88266142879624, "global_step": 588303, "epoch": 7087, "val_loss": 6719113.0} {"train_loss": -27.3792667388916, "global_step": 588304, "epoch": 7088} {"train_loss": -27.22735595703125, "global_step": 588305, "epoch": 7088} {"train_loss": -27.563007354736328, "global_step": 588306, "epoch": 7088} {"train_loss": -27.35394859313965, "global_step": 588307, "epoch": 7088} {"train_loss": -26.859586715698242, "global_step": 588308, "epoch": 7088} {"train_loss": -27.40888786315918, "global_step": 588309, "epoch": 7088} {"train_loss": -27.029489517211914, "global_step": 588310, "epoch": 7088} {"train_loss": -27.48689079284668, "global_step": 588311, "epoch": 7088} {"train_loss": -27.59354019165039, "global_step": 588312, "epoch": 7088} {"train_loss": -27.41704750061035, "global_step": 588313, "epoch": 7088} {"train_loss": -27.842214584350586, "global_step": 588314, "epoch": 7088} {"train_loss": -27.737686157226562, "global_step": 588315, "epoch": 7088} {"train_loss": -27.7344913482666, "global_step": 588316, "epoch": 7088} {"train_loss": -27.67708396911621, "global_step": 588317, "epoch": 7088} {"train_loss": -27.699628829956055, "global_step": 588318, "epoch": 7088} {"train_loss": -27.490446090698242, "global_step": 588319, "epoch": 7088} {"train_loss": -27.692480087280273, "global_step": 588320, "epoch": 7088} {"train_loss": -27.677881240844727, "global_step": 588321, "epoch": 7088} {"train_loss": -27.9998722076416, "global_step": 588322, "epoch": 7088} {"train_loss": -27.841510772705078, "global_step": 588323, "epoch": 7088} {"train_loss": -27.875436782836914, "global_step": 588324, "epoch": 7088} {"train_loss": -27.839508056640625, "global_step": 588325, "epoch": 7088} {"train_loss": -27.912206649780273, "global_step": 588326, "epoch": 7088} {"train_loss": -28.205350875854492, "global_step": 588327, "epoch": 7088} {"train_loss": -27.830463409423828, "global_step": 588328, "epoch": 7088} {"train_loss": -27.80830192565918, "global_step": 588329, "epoch": 7088} {"train_loss": -28.204975128173828, "global_step": 588330, "epoch": 7088} {"train_loss": -28.04546546936035, "global_step": 588331, "epoch": 7088} {"train_loss": -28.266942977905273, "global_step": 588332, "epoch": 7088} {"train_loss": -28.133337020874023, "global_step": 588333, "epoch": 7088} {"train_loss": -28.325586318969727, "global_step": 588334, "epoch": 7088} {"train_loss": -28.4587459564209, "global_step": 588335, "epoch": 7088} {"train_loss": -28.638166427612305, "global_step": 588336, "epoch": 7088} {"train_loss": -28.065174102783203, "global_step": 588337, "epoch": 7088} {"train_loss": -28.04120445251465, "global_step": 588338, "epoch": 7088} {"train_loss": -28.269445419311523, "global_step": 588339, "epoch": 7088} {"train_loss": -27.87542724609375, "global_step": 588340, "epoch": 7088} {"train_loss": -27.690412521362305, "global_step": 588341, "epoch": 7088} {"train_loss": -28.0126895904541, "global_step": 588342, "epoch": 7088} {"train_loss": -28.064685821533203, "global_step": 588343, "epoch": 7088} {"train_loss": -27.808271408081055, "global_step": 588344, "epoch": 7088} {"train_loss": -27.771381378173828, "global_step": 588345, "epoch": 7088} {"train_loss": -27.60982322692871, "global_step": 588346, "epoch": 7088} {"train_loss": -27.83841896057129, "global_step": 588347, "epoch": 7088} {"train_loss": -27.907224655151367, "global_step": 588348, "epoch": 7088} {"train_loss": -28.257904052734375, "global_step": 588349, "epoch": 7088} {"train_loss": -28.001846313476562, "global_step": 588350, "epoch": 7088} {"train_loss": -28.145421981811523, "global_step": 588351, "epoch": 7088} {"train_loss": -28.081451416015625, "global_step": 588352, "epoch": 7088} {"train_loss": -27.662885665893555, "global_step": 588353, "epoch": 7088} {"train_loss": -28.03847312927246, "global_step": 588354, "epoch": 7088} {"train_loss": -28.119375228881836, "global_step": 588355, "epoch": 7088} {"train_loss": -27.96219253540039, "global_step": 588356, "epoch": 7088} {"train_loss": -27.92011070251465, "global_step": 588357, "epoch": 7088} {"train_loss": -28.226659774780273, "global_step": 588358, "epoch": 7088} {"train_loss": -27.669631958007812, "global_step": 588359, "epoch": 7088} {"train_loss": -27.92561149597168, "global_step": 588360, "epoch": 7088} {"train_loss": -28.09625244140625, "global_step": 588361, "epoch": 7088} {"train_loss": -28.282358169555664, "global_step": 588362, "epoch": 7088} {"train_loss": -27.97019386291504, "global_step": 588363, "epoch": 7088} {"train_loss": -28.160449981689453, "global_step": 588364, "epoch": 7088} {"train_loss": -28.319345474243164, "global_step": 588365, "epoch": 7088} {"train_loss": -27.71553611755371, "global_step": 588366, "epoch": 7088} {"train_loss": -28.119932174682617, "global_step": 588367, "epoch": 7088} {"train_loss": -27.951658248901367, "global_step": 588368, "epoch": 7088} {"train_loss": -27.98600196838379, "global_step": 588369, "epoch": 7088} {"train_loss": -28.0650691986084, "global_step": 588370, "epoch": 7088} {"train_loss": -28.253387451171875, "global_step": 588371, "epoch": 7088} {"train_loss": -28.21514320373535, "global_step": 588372, "epoch": 7088} {"train_loss": -28.160383224487305, "global_step": 588373, "epoch": 7088} {"train_loss": -27.859607696533203, "global_step": 588374, "epoch": 7088} {"train_loss": -27.8942813873291, "global_step": 588375, "epoch": 7088} {"train_loss": -27.862201690673828, "global_step": 588376, "epoch": 7088} {"train_loss": -27.80402946472168, "global_step": 588377, "epoch": 7088} {"train_loss": -27.806324005126953, "global_step": 588378, "epoch": 7088} {"train_loss": -27.8240909576416, "global_step": 588379, "epoch": 7088} {"train_loss": -27.998403549194336, "global_step": 588380, "epoch": 7088} {"train_loss": -28.435110092163086, "global_step": 588381, "epoch": 7088} {"train_loss": -28.177509307861328, "global_step": 588382, "epoch": 7088} {"train_loss": -27.98726463317871, "global_step": 588383, "epoch": 7088} {"train_loss": -28.230566024780273, "global_step": 588384, "epoch": 7088} {"train_loss": -28.455825805664062, "global_step": 588385, "epoch": 7088} {"train_loss": -27.902644651481904, "global_step": 588386, "epoch": 7088, "val_loss": 6660601.0} {"train_loss": -28.122228622436523, "global_step": 588387, "epoch": 7089} {"train_loss": -27.66385269165039, "global_step": 588388, "epoch": 7089} {"train_loss": -27.52857780456543, "global_step": 588389, "epoch": 7089} {"train_loss": -27.699628829956055, "global_step": 588390, "epoch": 7089} {"train_loss": -27.773263931274414, "global_step": 588391, "epoch": 7089} {"train_loss": -27.76887321472168, "global_step": 588392, "epoch": 7089} {"train_loss": -27.751615524291992, "global_step": 588393, "epoch": 7089} {"train_loss": -27.957006454467773, "global_step": 588394, "epoch": 7089} {"train_loss": -27.51722526550293, "global_step": 588395, "epoch": 7089} {"train_loss": -27.38570213317871, "global_step": 588396, "epoch": 7089} {"train_loss": -27.015836715698242, "global_step": 588397, "epoch": 7089} {"train_loss": -27.54451560974121, "global_step": 588398, "epoch": 7089} {"train_loss": -27.46774673461914, "global_step": 588399, "epoch": 7089} {"train_loss": -26.737279891967773, "global_step": 588400, "epoch": 7089} {"train_loss": -27.71435546875, "global_step": 588401, "epoch": 7089} {"train_loss": -27.14710807800293, "global_step": 588402, "epoch": 7089} {"train_loss": -27.581562042236328, "global_step": 588403, "epoch": 7089} {"train_loss": -27.82729148864746, "global_step": 588404, "epoch": 7089} {"train_loss": -27.65581703186035, "global_step": 588405, "epoch": 7089} {"train_loss": -27.40852165222168, "global_step": 588406, "epoch": 7089} {"train_loss": -27.488895416259766, "global_step": 588407, "epoch": 7089} {"train_loss": -27.832935333251953, "global_step": 588408, "epoch": 7089} {"train_loss": -27.79024314880371, "global_step": 588409, "epoch": 7089} {"train_loss": -27.336761474609375, "global_step": 588410, "epoch": 7089} {"train_loss": -27.578672409057617, "global_step": 588411, "epoch": 7089} {"train_loss": -27.62312126159668, "global_step": 588412, "epoch": 7089} {"train_loss": -27.520801544189453, "global_step": 588413, "epoch": 7089} {"train_loss": -27.191757202148438, "global_step": 588414, "epoch": 7089} {"train_loss": -27.668935775756836, "global_step": 588415, "epoch": 7089} {"train_loss": -27.938608169555664, "global_step": 588416, "epoch": 7089} {"train_loss": -27.87662124633789, "global_step": 588417, "epoch": 7089} {"train_loss": -28.28285026550293, "global_step": 588418, "epoch": 7089} {"train_loss": -27.705053329467773, "global_step": 588419, "epoch": 7089} {"train_loss": -27.70688819885254, "global_step": 588420, "epoch": 7089} {"train_loss": -27.416778564453125, "global_step": 588421, "epoch": 7089} {"train_loss": -27.84718132019043, "global_step": 588422, "epoch": 7089} {"train_loss": -27.713348388671875, "global_step": 588423, "epoch": 7089} {"train_loss": -27.995044708251953, "global_step": 588424, "epoch": 7089} {"train_loss": -28.143146514892578, "global_step": 588425, "epoch": 7089} {"train_loss": -27.69388198852539, "global_step": 588426, "epoch": 7089} {"train_loss": -27.84041404724121, "global_step": 588427, "epoch": 7089} {"train_loss": -27.956602096557617, "global_step": 588428, "epoch": 7089} {"train_loss": -27.617115020751953, "global_step": 588429, "epoch": 7089} {"train_loss": -27.484235763549805, "global_step": 588430, "epoch": 7089} {"train_loss": -27.393722534179688, "global_step": 588431, "epoch": 7089} {"train_loss": -27.791229248046875, "global_step": 588432, "epoch": 7089} {"train_loss": -27.97321891784668, "global_step": 588433, "epoch": 7089} {"train_loss": -27.784666061401367, "global_step": 588434, "epoch": 7089} {"train_loss": -27.74005699157715, "global_step": 588435, "epoch": 7089} {"train_loss": -27.53875160217285, "global_step": 588436, "epoch": 7089} {"train_loss": -28.082263946533203, "global_step": 588437, "epoch": 7089} {"train_loss": -28.057861328125, "global_step": 588438, "epoch": 7089} {"train_loss": -27.61091423034668, "global_step": 588439, "epoch": 7089} {"train_loss": -27.949548721313477, "global_step": 588440, "epoch": 7089} {"train_loss": -27.69049072265625, "global_step": 588441, "epoch": 7089} {"train_loss": -27.99827003479004, "global_step": 588442, "epoch": 7089} {"train_loss": -28.128442764282227, "global_step": 588443, "epoch": 7089} {"train_loss": -28.308454513549805, "global_step": 588444, "epoch": 7089} {"train_loss": -27.909530639648438, "global_step": 588445, "epoch": 7089} {"train_loss": -27.884729385375977, "global_step": 588446, "epoch": 7089} {"train_loss": -28.023420333862305, "global_step": 588447, "epoch": 7089} {"train_loss": -27.882949829101562, "global_step": 588448, "epoch": 7089} {"train_loss": -27.837369918823242, "global_step": 588449, "epoch": 7089} {"train_loss": -28.18440818786621, "global_step": 588450, "epoch": 7089} {"train_loss": -27.686553955078125, "global_step": 588451, "epoch": 7089} {"train_loss": -27.7785587310791, "global_step": 588452, "epoch": 7089} {"train_loss": -27.680530548095703, "global_step": 588453, "epoch": 7089} {"train_loss": -27.828022003173828, "global_step": 588454, "epoch": 7089} {"train_loss": -28.148542404174805, "global_step": 588455, "epoch": 7089} {"train_loss": -27.810800552368164, "global_step": 588456, "epoch": 7089} {"train_loss": -27.51167106628418, "global_step": 588457, "epoch": 7089} {"train_loss": -28.554122924804688, "global_step": 588458, "epoch": 7089} {"train_loss": -27.86083984375, "global_step": 588459, "epoch": 7089} {"train_loss": -28.0093936920166, "global_step": 588460, "epoch": 7089} {"train_loss": -28.151397705078125, "global_step": 588461, "epoch": 7089} {"train_loss": -28.000890731811523, "global_step": 588462, "epoch": 7089} {"train_loss": -27.9984188079834, "global_step": 588463, "epoch": 7089} {"train_loss": -28.226654052734375, "global_step": 588464, "epoch": 7089} {"train_loss": -27.94904899597168, "global_step": 588465, "epoch": 7089} {"train_loss": -28.49442481994629, "global_step": 588466, "epoch": 7089} {"train_loss": -27.939252853393555, "global_step": 588467, "epoch": 7089} {"train_loss": -28.114368438720703, "global_step": 588468, "epoch": 7089} {"train_loss": -27.79364891511848, "global_step": 588469, "epoch": 7089, "val_loss": 6661064.0} {"train_loss": -27.303735733032227, "global_step": 588470, "epoch": 7090} {"train_loss": -27.24298095703125, "global_step": 588471, "epoch": 7090} {"train_loss": -27.52860450744629, "global_step": 588472, "epoch": 7090} {"train_loss": -27.637195587158203, "global_step": 588473, "epoch": 7090} {"train_loss": -27.73126220703125, "global_step": 588474, "epoch": 7090} {"train_loss": -27.46967124938965, "global_step": 588475, "epoch": 7090} {"train_loss": -27.422382354736328, "global_step": 588476, "epoch": 7090} {"train_loss": -27.49382972717285, "global_step": 588477, "epoch": 7090} {"train_loss": -27.89715576171875, "global_step": 588478, "epoch": 7090} {"train_loss": -27.880340576171875, "global_step": 588479, "epoch": 7090} {"train_loss": -27.768224716186523, "global_step": 588480, "epoch": 7090} {"train_loss": -27.771900177001953, "global_step": 588481, "epoch": 7090} {"train_loss": -27.924072265625, "global_step": 588482, "epoch": 7090} {"train_loss": -28.011493682861328, "global_step": 588483, "epoch": 7090} {"train_loss": -27.701313018798828, "global_step": 588484, "epoch": 7090} {"train_loss": -27.87286376953125, "global_step": 588485, "epoch": 7090} {"train_loss": -27.71697998046875, "global_step": 588486, "epoch": 7090} {"train_loss": -27.623310089111328, "global_step": 588487, "epoch": 7090} {"train_loss": -27.925384521484375, "global_step": 588488, "epoch": 7090} {"train_loss": -27.869516372680664, "global_step": 588489, "epoch": 7090} {"train_loss": -28.073820114135742, "global_step": 588490, "epoch": 7090} {"train_loss": -27.95599365234375, "global_step": 588491, "epoch": 7090} {"train_loss": -28.021387100219727, "global_step": 588492, "epoch": 7090} {"train_loss": -28.15579605102539, "global_step": 588493, "epoch": 7090} {"train_loss": -28.0518798828125, "global_step": 588494, "epoch": 7090} {"train_loss": -28.464706420898438, "global_step": 588495, "epoch": 7090} {"train_loss": -27.743688583374023, "global_step": 588496, "epoch": 7090} {"train_loss": -28.14507484436035, "global_step": 588497, "epoch": 7090} {"train_loss": -27.847524642944336, "global_step": 588498, "epoch": 7090} {"train_loss": -28.1706600189209, "global_step": 588499, "epoch": 7090} {"train_loss": -27.90512466430664, "global_step": 588500, "epoch": 7090} {"train_loss": -27.754104614257812, "global_step": 588501, "epoch": 7090} {"train_loss": -27.717809677124023, "global_step": 588502, "epoch": 7090} {"train_loss": -27.711034774780273, "global_step": 588503, "epoch": 7090} {"train_loss": -27.59867286682129, "global_step": 588504, "epoch": 7090} {"train_loss": -28.017520904541016, "global_step": 588505, "epoch": 7090} {"train_loss": -28.0993595123291, "global_step": 588506, "epoch": 7090} {"train_loss": -28.22601318359375, "global_step": 588507, "epoch": 7090} {"train_loss": -28.137807846069336, "global_step": 588508, "epoch": 7090} {"train_loss": -27.77129554748535, "global_step": 588509, "epoch": 7090} {"train_loss": -27.82476234436035, "global_step": 588510, "epoch": 7090} {"train_loss": -27.752283096313477, "global_step": 588511, "epoch": 7090} {"train_loss": -28.17593765258789, "global_step": 588512, "epoch": 7090} {"train_loss": -27.52985954284668, "global_step": 588513, "epoch": 7090} {"train_loss": -27.96891212463379, "global_step": 588514, "epoch": 7090} {"train_loss": -28.19439125061035, "global_step": 588515, "epoch": 7090} {"train_loss": -28.174118041992188, "global_step": 588516, "epoch": 7090} {"train_loss": -28.015750885009766, "global_step": 588517, "epoch": 7090} {"train_loss": -27.772541046142578, "global_step": 588518, "epoch": 7090} {"train_loss": -28.027868270874023, "global_step": 588519, "epoch": 7090} {"train_loss": -28.222333908081055, "global_step": 588520, "epoch": 7090} {"train_loss": -27.98798942565918, "global_step": 588521, "epoch": 7090} {"train_loss": -27.875946044921875, "global_step": 588522, "epoch": 7090} {"train_loss": -27.82000732421875, "global_step": 588523, "epoch": 7090} {"train_loss": -28.00098991394043, "global_step": 588524, "epoch": 7090} {"train_loss": -28.160175323486328, "global_step": 588525, "epoch": 7090} {"train_loss": -27.839557647705078, "global_step": 588526, "epoch": 7090} {"train_loss": -27.840280532836914, "global_step": 588527, "epoch": 7090} {"train_loss": -27.820127487182617, "global_step": 588528, "epoch": 7090} {"train_loss": -27.42048454284668, "global_step": 588529, "epoch": 7090} {"train_loss": -27.585723876953125, "global_step": 588530, "epoch": 7090} {"train_loss": -27.673254013061523, "global_step": 588531, "epoch": 7090} {"train_loss": -28.2520809173584, "global_step": 588532, "epoch": 7090} {"train_loss": -27.930267333984375, "global_step": 588533, "epoch": 7090} {"train_loss": -27.99179458618164, "global_step": 588534, "epoch": 7090} {"train_loss": -28.126691818237305, "global_step": 588535, "epoch": 7090} {"train_loss": -27.66718101501465, "global_step": 588536, "epoch": 7090} {"train_loss": -27.888126373291016, "global_step": 588537, "epoch": 7090} {"train_loss": -27.92424964904785, "global_step": 588538, "epoch": 7090} {"train_loss": -28.07148551940918, "global_step": 588539, "epoch": 7090} {"train_loss": -28.04949378967285, "global_step": 588540, "epoch": 7090} {"train_loss": -28.204492568969727, "global_step": 588541, "epoch": 7090} {"train_loss": -28.249963760375977, "global_step": 588542, "epoch": 7090} {"train_loss": -28.355443954467773, "global_step": 588543, "epoch": 7090} {"train_loss": -28.048648834228516, "global_step": 588544, "epoch": 7090} {"train_loss": -28.12421226501465, "global_step": 588545, "epoch": 7090} {"train_loss": -27.980810165405273, "global_step": 588546, "epoch": 7090} {"train_loss": -27.738229751586914, "global_step": 588547, "epoch": 7090} {"train_loss": -27.690921783447266, "global_step": 588548, "epoch": 7090} {"train_loss": -27.941823959350586, "global_step": 588549, "epoch": 7090} {"train_loss": -28.254364013671875, "global_step": 588550, "epoch": 7090} {"train_loss": -28.050994873046875, "global_step": 588551, "epoch": 7090} {"train_loss": -27.90094722609922, "global_step": 588552, "epoch": 7090, "val_loss": 6623597.0} {"train_loss": -27.156879425048828, "global_step": 588553, "epoch": 7091} {"train_loss": -27.591968536376953, "global_step": 588554, "epoch": 7091} {"train_loss": -26.9631404876709, "global_step": 588555, "epoch": 7091} {"train_loss": -27.145404815673828, "global_step": 588556, "epoch": 7091} {"train_loss": -27.35175895690918, "global_step": 588557, "epoch": 7091} {"train_loss": -27.52984046936035, "global_step": 588558, "epoch": 7091} {"train_loss": -27.488788604736328, "global_step": 588559, "epoch": 7091} {"train_loss": -27.17661476135254, "global_step": 588560, "epoch": 7091} {"train_loss": -27.03620719909668, "global_step": 588561, "epoch": 7091} {"train_loss": -27.772077560424805, "global_step": 588562, "epoch": 7091} {"train_loss": -27.5195369720459, "global_step": 588563, "epoch": 7091} {"train_loss": -27.767871856689453, "global_step": 588564, "epoch": 7091} {"train_loss": -27.638517379760742, "global_step": 588565, "epoch": 7091} {"train_loss": -27.471481323242188, "global_step": 588566, "epoch": 7091} {"train_loss": -27.72590446472168, "global_step": 588567, "epoch": 7091} {"train_loss": -27.62117576599121, "global_step": 588568, "epoch": 7091} {"train_loss": -27.77255630493164, "global_step": 588569, "epoch": 7091} {"train_loss": -27.571081161499023, "global_step": 588570, "epoch": 7091} {"train_loss": -27.355976104736328, "global_step": 588571, "epoch": 7091} {"train_loss": -27.81211280822754, "global_step": 588572, "epoch": 7091} {"train_loss": -28.25002098083496, "global_step": 588573, "epoch": 7091} {"train_loss": -27.82508659362793, "global_step": 588574, "epoch": 7091} {"train_loss": -27.917709350585938, "global_step": 588575, "epoch": 7091} {"train_loss": -28.353254318237305, "global_step": 588576, "epoch": 7091} {"train_loss": -27.7302188873291, "global_step": 588577, "epoch": 7091} {"train_loss": -28.1491756439209, "global_step": 588578, "epoch": 7091} {"train_loss": -27.863388061523438, "global_step": 588579, "epoch": 7091} {"train_loss": -27.9987850189209, "global_step": 588580, "epoch": 7091} {"train_loss": -27.752389907836914, "global_step": 588581, "epoch": 7091} {"train_loss": -27.98416519165039, "global_step": 588582, "epoch": 7091} {"train_loss": -27.939926147460938, "global_step": 588583, "epoch": 7091} {"train_loss": -27.931640625, "global_step": 588584, "epoch": 7091} {"train_loss": -27.71626091003418, "global_step": 588585, "epoch": 7091} {"train_loss": -28.35994529724121, "global_step": 588586, "epoch": 7091} {"train_loss": -28.2135009765625, "global_step": 588587, "epoch": 7091} {"train_loss": -27.91248893737793, "global_step": 588588, "epoch": 7091} {"train_loss": -28.122425079345703, "global_step": 588589, "epoch": 7091} {"train_loss": -27.877241134643555, "global_step": 588590, "epoch": 7091} {"train_loss": -27.994943618774414, "global_step": 588591, "epoch": 7091} {"train_loss": -27.878101348876953, "global_step": 588592, "epoch": 7091} {"train_loss": -27.991491317749023, "global_step": 588593, "epoch": 7091} {"train_loss": -28.030426025390625, "global_step": 588594, "epoch": 7091} {"train_loss": -27.820180892944336, "global_step": 588595, "epoch": 7091} {"train_loss": -28.167362213134766, "global_step": 588596, "epoch": 7091} {"train_loss": -28.174894332885742, "global_step": 588597, "epoch": 7091} {"train_loss": -27.65300941467285, "global_step": 588598, "epoch": 7091} {"train_loss": -27.848026275634766, "global_step": 588599, "epoch": 7091} {"train_loss": -28.185062408447266, "global_step": 588600, "epoch": 7091} {"train_loss": -27.84925651550293, "global_step": 588601, "epoch": 7091} {"train_loss": -28.226947784423828, "global_step": 588602, "epoch": 7091} {"train_loss": -27.9681339263916, "global_step": 588603, "epoch": 7091} {"train_loss": -28.25642204284668, "global_step": 588604, "epoch": 7091} {"train_loss": -28.06263542175293, "global_step": 588605, "epoch": 7091} {"train_loss": -28.219079971313477, "global_step": 588606, "epoch": 7091} {"train_loss": -28.58011245727539, "global_step": 588607, "epoch": 7091} {"train_loss": -28.039648056030273, "global_step": 588608, "epoch": 7091} {"train_loss": -28.112791061401367, "global_step": 588609, "epoch": 7091} {"train_loss": -27.480976104736328, "global_step": 588610, "epoch": 7091} {"train_loss": -27.330163955688477, "global_step": 588611, "epoch": 7091} {"train_loss": -27.580121994018555, "global_step": 588612, "epoch": 7091} {"train_loss": -28.029409408569336, "global_step": 588613, "epoch": 7091} {"train_loss": -27.925342559814453, "global_step": 588614, "epoch": 7091} {"train_loss": -28.29225730895996, "global_step": 588615, "epoch": 7091} {"train_loss": -27.715972900390625, "global_step": 588616, "epoch": 7091} {"train_loss": -28.218399047851562, "global_step": 588617, "epoch": 7091} {"train_loss": -28.14617919921875, "global_step": 588618, "epoch": 7091} {"train_loss": -27.788671493530273, "global_step": 588619, "epoch": 7091} {"train_loss": -28.2028751373291, "global_step": 588620, "epoch": 7091} {"train_loss": -27.98974609375, "global_step": 588621, "epoch": 7091} {"train_loss": -28.24354362487793, "global_step": 588622, "epoch": 7091} {"train_loss": -28.1087589263916, "global_step": 588623, "epoch": 7091} {"train_loss": -28.22998046875, "global_step": 588624, "epoch": 7091} {"train_loss": -27.658597946166992, "global_step": 588625, "epoch": 7091} {"train_loss": -27.8497314453125, "global_step": 588626, "epoch": 7091} {"train_loss": -27.570653915405273, "global_step": 588627, "epoch": 7091} {"train_loss": -27.848005294799805, "global_step": 588628, "epoch": 7091} {"train_loss": -27.45037269592285, "global_step": 588629, "epoch": 7091} {"train_loss": -27.364965438842773, "global_step": 588630, "epoch": 7091} {"train_loss": -27.82415771484375, "global_step": 588631, "epoch": 7091} {"train_loss": -27.806427001953125, "global_step": 588632, "epoch": 7091} {"train_loss": -27.451284408569336, "global_step": 588633, "epoch": 7091} {"train_loss": -27.425024032592773, "global_step": 588634, "epoch": 7091} {"train_loss": -27.826229440160546, "global_step": 588635, "epoch": 7091, "val_loss": 6589956.0} {"train_loss": -26.033117294311523, "global_step": 588636, "epoch": 7092} {"train_loss": -25.625192642211914, "global_step": 588637, "epoch": 7092} {"train_loss": -25.597179412841797, "global_step": 588638, "epoch": 7092} {"train_loss": -26.704858779907227, "global_step": 588639, "epoch": 7092} {"train_loss": -25.480627059936523, "global_step": 588640, "epoch": 7092} {"train_loss": -27.094573974609375, "global_step": 588641, "epoch": 7092} {"train_loss": -25.79697608947754, "global_step": 588642, "epoch": 7092} {"train_loss": -27.167837142944336, "global_step": 588643, "epoch": 7092} {"train_loss": -26.538076400756836, "global_step": 588644, "epoch": 7092} {"train_loss": -27.036970138549805, "global_step": 588645, "epoch": 7092} {"train_loss": -26.716222763061523, "global_step": 588646, "epoch": 7092} {"train_loss": -27.090539932250977, "global_step": 588647, "epoch": 7092} {"train_loss": -26.734952926635742, "global_step": 588648, "epoch": 7092} {"train_loss": -27.327747344970703, "global_step": 588649, "epoch": 7092} {"train_loss": -27.18035888671875, "global_step": 588650, "epoch": 7092} {"train_loss": -27.140920639038086, "global_step": 588651, "epoch": 7092} {"train_loss": -27.3382568359375, "global_step": 588652, "epoch": 7092} {"train_loss": -27.168426513671875, "global_step": 588653, "epoch": 7092} {"train_loss": -27.307907104492188, "global_step": 588654, "epoch": 7092} {"train_loss": -27.225177764892578, "global_step": 588655, "epoch": 7092} {"train_loss": -26.899885177612305, "global_step": 588656, "epoch": 7092} {"train_loss": -27.260879516601562, "global_step": 588657, "epoch": 7092} {"train_loss": -27.213178634643555, "global_step": 588658, "epoch": 7092} {"train_loss": -27.016769409179688, "global_step": 588659, "epoch": 7092} {"train_loss": -27.66718101501465, "global_step": 588660, "epoch": 7092} {"train_loss": -27.443851470947266, "global_step": 588661, "epoch": 7092} {"train_loss": -27.37959861755371, "global_step": 588662, "epoch": 7092} {"train_loss": -27.350671768188477, "global_step": 588663, "epoch": 7092} {"train_loss": -27.600736618041992, "global_step": 588664, "epoch": 7092} {"train_loss": -27.243793487548828, "global_step": 588665, "epoch": 7092} {"train_loss": -27.60859489440918, "global_step": 588666, "epoch": 7092} {"train_loss": -27.534320831298828, "global_step": 588667, "epoch": 7092} {"train_loss": -27.729782104492188, "global_step": 588668, "epoch": 7092} {"train_loss": -27.864398956298828, "global_step": 588669, "epoch": 7092} {"train_loss": -27.778121948242188, "global_step": 588670, "epoch": 7092} {"train_loss": -27.54945182800293, "global_step": 588671, "epoch": 7092} {"train_loss": -27.68792152404785, "global_step": 588672, "epoch": 7092} {"train_loss": -27.63361930847168, "global_step": 588673, "epoch": 7092} {"train_loss": -27.799102783203125, "global_step": 588674, "epoch": 7092} {"train_loss": -28.10361099243164, "global_step": 588675, "epoch": 7092} {"train_loss": -27.43902587890625, "global_step": 588676, "epoch": 7092} {"train_loss": -27.387420654296875, "global_step": 588677, "epoch": 7092} {"train_loss": -27.46211814880371, "global_step": 588678, "epoch": 7092} {"train_loss": -27.974105834960938, "global_step": 588679, "epoch": 7092} {"train_loss": -27.709854125976562, "global_step": 588680, "epoch": 7092} {"train_loss": -28.0679931640625, "global_step": 588681, "epoch": 7092} {"train_loss": -27.867971420288086, "global_step": 588682, "epoch": 7092} {"train_loss": -27.958227157592773, "global_step": 588683, "epoch": 7092} {"train_loss": -27.951190948486328, "global_step": 588684, "epoch": 7092} {"train_loss": -27.769811630249023, "global_step": 588685, "epoch": 7092} {"train_loss": -27.932077407836914, "global_step": 588686, "epoch": 7092} {"train_loss": -27.803823471069336, "global_step": 588687, "epoch": 7092} {"train_loss": -27.978290557861328, "global_step": 588688, "epoch": 7092} {"train_loss": -27.788787841796875, "global_step": 588689, "epoch": 7092} {"train_loss": -28.050006866455078, "global_step": 588690, "epoch": 7092} {"train_loss": -27.914594650268555, "global_step": 588691, "epoch": 7092} {"train_loss": -28.041967391967773, "global_step": 588692, "epoch": 7092} {"train_loss": -27.622106552124023, "global_step": 588693, "epoch": 7092} {"train_loss": -28.211633682250977, "global_step": 588694, "epoch": 7092} {"train_loss": -28.204803466796875, "global_step": 588695, "epoch": 7092} {"train_loss": -27.79593276977539, "global_step": 588696, "epoch": 7092} {"train_loss": -27.808801651000977, "global_step": 588697, "epoch": 7092} {"train_loss": -28.0990047454834, "global_step": 588698, "epoch": 7092} {"train_loss": -28.035200119018555, "global_step": 588699, "epoch": 7092} {"train_loss": -27.313695907592773, "global_step": 588700, "epoch": 7092} {"train_loss": -27.471969604492188, "global_step": 588701, "epoch": 7092} {"train_loss": -27.800235748291016, "global_step": 588702, "epoch": 7092} {"train_loss": -28.02596092224121, "global_step": 588703, "epoch": 7092} {"train_loss": -28.21297264099121, "global_step": 588704, "epoch": 7092} {"train_loss": -27.940704345703125, "global_step": 588705, "epoch": 7092} {"train_loss": -27.91682243347168, "global_step": 588706, "epoch": 7092} {"train_loss": -27.807544708251953, "global_step": 588707, "epoch": 7092} {"train_loss": -27.782617568969727, "global_step": 588708, "epoch": 7092} {"train_loss": -27.916244506835938, "global_step": 588709, "epoch": 7092} {"train_loss": -27.8054141998291, "global_step": 588710, "epoch": 7092} {"train_loss": -28.0308837890625, "global_step": 588711, "epoch": 7092} {"train_loss": -28.179019927978516, "global_step": 588712, "epoch": 7092} {"train_loss": -27.993289947509766, "global_step": 588713, "epoch": 7092} {"train_loss": -28.213403701782227, "global_step": 588714, "epoch": 7092} {"train_loss": -27.6280460357666, "global_step": 588715, "epoch": 7092} {"train_loss": -28.106616973876953, "global_step": 588716, "epoch": 7092} {"train_loss": -28.29859733581543, "global_step": 588717, "epoch": 7092} {"train_loss": -27.515501137239387, "global_step": 588718, "epoch": 7092, "val_loss": 6665561.0} {"train_loss": -26.429855346679688, "global_step": 588719, "epoch": 7093} {"train_loss": -27.507184982299805, "global_step": 588720, "epoch": 7093} {"train_loss": -27.036396026611328, "global_step": 588721, "epoch": 7093} {"train_loss": -27.664947509765625, "global_step": 588722, "epoch": 7093} {"train_loss": -27.223310470581055, "global_step": 588723, "epoch": 7093} {"train_loss": -27.1384220123291, "global_step": 588724, "epoch": 7093} {"train_loss": -27.340017318725586, "global_step": 588725, "epoch": 7093} {"train_loss": -27.5430908203125, "global_step": 588726, "epoch": 7093} {"train_loss": -27.6461238861084, "global_step": 588727, "epoch": 7093} {"train_loss": -27.759307861328125, "global_step": 588728, "epoch": 7093} {"train_loss": -27.644811630249023, "global_step": 588729, "epoch": 7093} {"train_loss": -27.488025665283203, "global_step": 588730, "epoch": 7093} {"train_loss": -27.338138580322266, "global_step": 588731, "epoch": 7093} {"train_loss": -27.710309982299805, "global_step": 588732, "epoch": 7093} {"train_loss": -27.384363174438477, "global_step": 588733, "epoch": 7093} {"train_loss": -27.593408584594727, "global_step": 588734, "epoch": 7093} {"train_loss": -27.77712059020996, "global_step": 588735, "epoch": 7093} {"train_loss": -27.724323272705078, "global_step": 588736, "epoch": 7093} {"train_loss": -27.934070587158203, "global_step": 588737, "epoch": 7093} {"train_loss": -27.480066299438477, "global_step": 588738, "epoch": 7093} {"train_loss": -28.104206085205078, "global_step": 588739, "epoch": 7093} {"train_loss": -27.56947135925293, "global_step": 588740, "epoch": 7093} {"train_loss": -28.145343780517578, "global_step": 588741, "epoch": 7093} {"train_loss": -27.893308639526367, "global_step": 588742, "epoch": 7093} {"train_loss": -28.11992835998535, "global_step": 588743, "epoch": 7093} {"train_loss": -28.034290313720703, "global_step": 588744, "epoch": 7093} {"train_loss": -27.734027862548828, "global_step": 588745, "epoch": 7093} {"train_loss": -28.107847213745117, "global_step": 588746, "epoch": 7093} {"train_loss": -27.93402099609375, "global_step": 588747, "epoch": 7093} {"train_loss": -28.083295822143555, "global_step": 588748, "epoch": 7093} {"train_loss": -28.050891876220703, "global_step": 588749, "epoch": 7093} {"train_loss": -28.15740966796875, "global_step": 588750, "epoch": 7093} {"train_loss": -28.088459014892578, "global_step": 588751, "epoch": 7093} {"train_loss": -27.898237228393555, "global_step": 588752, "epoch": 7093} {"train_loss": -28.142160415649414, "global_step": 588753, "epoch": 7093} {"train_loss": -28.248966217041016, "global_step": 588754, "epoch": 7093} {"train_loss": -28.273252487182617, "global_step": 588755, "epoch": 7093} {"train_loss": -28.373823165893555, "global_step": 588756, "epoch": 7093} {"train_loss": -27.84897232055664, "global_step": 588757, "epoch": 7093} {"train_loss": -28.053852081298828, "global_step": 588758, "epoch": 7093} {"train_loss": -28.37994384765625, "global_step": 588759, "epoch": 7093} {"train_loss": -28.42637062072754, "global_step": 588760, "epoch": 7093} {"train_loss": -28.160802841186523, "global_step": 588761, "epoch": 7093} {"train_loss": -28.3521785736084, "global_step": 588762, "epoch": 7093} {"train_loss": -28.124740600585938, "global_step": 588763, "epoch": 7093} {"train_loss": -28.31385612487793, "global_step": 588764, "epoch": 7093} {"train_loss": -28.358488082885742, "global_step": 588765, "epoch": 7093} {"train_loss": -28.137149810791016, "global_step": 588766, "epoch": 7093} {"train_loss": -28.229734420776367, "global_step": 588767, "epoch": 7093} {"train_loss": -28.089757919311523, "global_step": 588768, "epoch": 7093} {"train_loss": -28.40775489807129, "global_step": 588769, "epoch": 7093} {"train_loss": -28.06363296508789, "global_step": 588770, "epoch": 7093} {"train_loss": -28.044641494750977, "global_step": 588771, "epoch": 7093} {"train_loss": -27.832386016845703, "global_step": 588772, "epoch": 7093} {"train_loss": -27.754602432250977, "global_step": 588773, "epoch": 7093} {"train_loss": -27.790807723999023, "global_step": 588774, "epoch": 7093} {"train_loss": -28.13618278503418, "global_step": 588775, "epoch": 7093} {"train_loss": -27.983911514282227, "global_step": 588776, "epoch": 7093} {"train_loss": -28.181385040283203, "global_step": 588777, "epoch": 7093} {"train_loss": -28.178272247314453, "global_step": 588778, "epoch": 7093} {"train_loss": -27.71640968322754, "global_step": 588779, "epoch": 7093} {"train_loss": -27.975080490112305, "global_step": 588780, "epoch": 7093} {"train_loss": -27.278961181640625, "global_step": 588781, "epoch": 7093} {"train_loss": -28.129261016845703, "global_step": 588782, "epoch": 7093} {"train_loss": -27.88299560546875, "global_step": 588783, "epoch": 7093} {"train_loss": -28.139907836914062, "global_step": 588784, "epoch": 7093} {"train_loss": -28.21856117248535, "global_step": 588785, "epoch": 7093} {"train_loss": -28.079870223999023, "global_step": 588786, "epoch": 7093} {"train_loss": -27.803619384765625, "global_step": 588787, "epoch": 7093} {"train_loss": -27.80348014831543, "global_step": 588788, "epoch": 7093} {"train_loss": -28.1882381439209, "global_step": 588789, "epoch": 7093} {"train_loss": -28.116262435913086, "global_step": 588790, "epoch": 7093} {"train_loss": -28.075109481811523, "global_step": 588791, "epoch": 7093} {"train_loss": -28.209049224853516, "global_step": 588792, "epoch": 7093} {"train_loss": -28.233800888061523, "global_step": 588793, "epoch": 7093} {"train_loss": -27.841455459594727, "global_step": 588794, "epoch": 7093} {"train_loss": -27.971704483032227, "global_step": 588795, "epoch": 7093} {"train_loss": -28.011693954467773, "global_step": 588796, "epoch": 7093} {"train_loss": -28.007375717163086, "global_step": 588797, "epoch": 7093} {"train_loss": -27.69008445739746, "global_step": 588798, "epoch": 7093} {"train_loss": -27.0747127532959, "global_step": 588799, "epoch": 7093} {"train_loss": -27.82337760925293, "global_step": 588800, "epoch": 7093} {"train_loss": -27.904297932084784, "global_step": 588801, "epoch": 7093, "val_loss": 6602597.0} {"train_loss": -27.201608657836914, "global_step": 588802, "epoch": 7094} {"train_loss": -27.1513614654541, "global_step": 588803, "epoch": 7094} {"train_loss": -26.941808700561523, "global_step": 588804, "epoch": 7094} {"train_loss": -27.265722274780273, "global_step": 588805, "epoch": 7094} {"train_loss": -26.9000244140625, "global_step": 588806, "epoch": 7094} {"train_loss": -27.572284698486328, "global_step": 588807, "epoch": 7094} {"train_loss": -26.923065185546875, "global_step": 588808, "epoch": 7094} {"train_loss": -27.53339195251465, "global_step": 588809, "epoch": 7094} {"train_loss": -27.865478515625, "global_step": 588810, "epoch": 7094} {"train_loss": -27.744354248046875, "global_step": 588811, "epoch": 7094} {"train_loss": -27.56586265563965, "global_step": 588812, "epoch": 7094} {"train_loss": -27.734405517578125, "global_step": 588813, "epoch": 7094} {"train_loss": -27.6237850189209, "global_step": 588814, "epoch": 7094} {"train_loss": -27.784162521362305, "global_step": 588815, "epoch": 7094} {"train_loss": -27.837116241455078, "global_step": 588816, "epoch": 7094} {"train_loss": -27.766626358032227, "global_step": 588817, "epoch": 7094} {"train_loss": -27.58444595336914, "global_step": 588818, "epoch": 7094} {"train_loss": -27.795440673828125, "global_step": 588819, "epoch": 7094} {"train_loss": -27.667570114135742, "global_step": 588820, "epoch": 7094} {"train_loss": -27.638233184814453, "global_step": 588821, "epoch": 7094} {"train_loss": -27.858911514282227, "global_step": 588822, "epoch": 7094} {"train_loss": -27.476163864135742, "global_step": 588823, "epoch": 7094} {"train_loss": -27.958967208862305, "global_step": 588824, "epoch": 7094} {"train_loss": -27.650634765625, "global_step": 588825, "epoch": 7094} {"train_loss": -28.089557647705078, "global_step": 588826, "epoch": 7094} {"train_loss": -27.740034103393555, "global_step": 588827, "epoch": 7094} {"train_loss": -27.639179229736328, "global_step": 588828, "epoch": 7094} {"train_loss": -27.64208984375, "global_step": 588829, "epoch": 7094} {"train_loss": -28.00198745727539, "global_step": 588830, "epoch": 7094} {"train_loss": -27.9021053314209, "global_step": 588831, "epoch": 7094} {"train_loss": -27.82413101196289, "global_step": 588832, "epoch": 7094} {"train_loss": -27.67487144470215, "global_step": 588833, "epoch": 7094} {"train_loss": -28.00501823425293, "global_step": 588834, "epoch": 7094} {"train_loss": -28.12103271484375, "global_step": 588835, "epoch": 7094} {"train_loss": -27.705671310424805, "global_step": 588836, "epoch": 7094} {"train_loss": -27.834653854370117, "global_step": 588837, "epoch": 7094} {"train_loss": -28.022705078125, "global_step": 588838, "epoch": 7094} {"train_loss": -28.189680099487305, "global_step": 588839, "epoch": 7094} {"train_loss": -27.687292098999023, "global_step": 588840, "epoch": 7094} {"train_loss": -28.05706787109375, "global_step": 588841, "epoch": 7094} {"train_loss": -28.099416732788086, "global_step": 588842, "epoch": 7094} {"train_loss": -28.259262084960938, "global_step": 588843, "epoch": 7094} {"train_loss": -28.017532348632812, "global_step": 588844, "epoch": 7094} {"train_loss": -28.245258331298828, "global_step": 588845, "epoch": 7094} {"train_loss": -28.12481689453125, "global_step": 588846, "epoch": 7094} {"train_loss": -28.113168716430664, "global_step": 588847, "epoch": 7094} {"train_loss": -27.997541427612305, "global_step": 588848, "epoch": 7094} {"train_loss": -28.11646842956543, "global_step": 588849, "epoch": 7094} {"train_loss": -28.01495933532715, "global_step": 588850, "epoch": 7094} {"train_loss": -27.90217399597168, "global_step": 588851, "epoch": 7094} {"train_loss": -28.535308837890625, "global_step": 588852, "epoch": 7094} {"train_loss": -28.316869735717773, "global_step": 588853, "epoch": 7094} {"train_loss": -28.285940170288086, "global_step": 588854, "epoch": 7094} {"train_loss": -28.1212100982666, "global_step": 588855, "epoch": 7094} {"train_loss": -28.183807373046875, "global_step": 588856, "epoch": 7094} {"train_loss": -27.9650936126709, "global_step": 588857, "epoch": 7094} {"train_loss": -27.92730712890625, "global_step": 588858, "epoch": 7094} {"train_loss": -27.8970947265625, "global_step": 588859, "epoch": 7094} {"train_loss": -28.115589141845703, "global_step": 588860, "epoch": 7094} {"train_loss": -28.14761734008789, "global_step": 588861, "epoch": 7094} {"train_loss": -27.98477554321289, "global_step": 588862, "epoch": 7094} {"train_loss": -27.377761840820312, "global_step": 588863, "epoch": 7094} {"train_loss": -27.934131622314453, "global_step": 588864, "epoch": 7094} {"train_loss": -26.98697853088379, "global_step": 588865, "epoch": 7094} {"train_loss": -26.9764347076416, "global_step": 588866, "epoch": 7094} {"train_loss": -27.634662628173828, "global_step": 588867, "epoch": 7094} {"train_loss": -27.986974716186523, "global_step": 588868, "epoch": 7094} {"train_loss": -27.49139404296875, "global_step": 588869, "epoch": 7094} {"train_loss": -27.650409698486328, "global_step": 588870, "epoch": 7094} {"train_loss": -26.814239501953125, "global_step": 588871, "epoch": 7094} {"train_loss": -27.73988914489746, "global_step": 588872, "epoch": 7094} {"train_loss": -28.274255752563477, "global_step": 588873, "epoch": 7094} {"train_loss": -27.779523849487305, "global_step": 588874, "epoch": 7094} {"train_loss": -27.372394561767578, "global_step": 588875, "epoch": 7094} {"train_loss": -27.84112548828125, "global_step": 588876, "epoch": 7094} {"train_loss": -27.966711044311523, "global_step": 588877, "epoch": 7094} {"train_loss": -27.566150665283203, "global_step": 588878, "epoch": 7094} {"train_loss": -27.937458038330078, "global_step": 588879, "epoch": 7094} {"train_loss": -27.629682540893555, "global_step": 588880, "epoch": 7094} {"train_loss": -27.834991455078125, "global_step": 588881, "epoch": 7094} {"train_loss": -28.170562744140625, "global_step": 588882, "epoch": 7094} {"train_loss": -28.004011154174805, "global_step": 588883, "epoch": 7094} {"train_loss": -27.794979761882, "global_step": 588884, "epoch": 7094, "val_loss": 6559877.0} {"train_loss": -26.374481201171875, "global_step": 588885, "epoch": 7095} {"train_loss": -26.9282169342041, "global_step": 588886, "epoch": 7095} {"train_loss": -26.49542808532715, "global_step": 588887, "epoch": 7095} {"train_loss": -25.971418380737305, "global_step": 588888, "epoch": 7095} {"train_loss": -27.40729331970215, "global_step": 588889, "epoch": 7095} {"train_loss": -26.501379013061523, "global_step": 588890, "epoch": 7095} {"train_loss": -27.240707397460938, "global_step": 588891, "epoch": 7095} {"train_loss": -26.911157608032227, "global_step": 588892, "epoch": 7095} {"train_loss": -26.85991859436035, "global_step": 588893, "epoch": 7095} {"train_loss": -27.24492835998535, "global_step": 588894, "epoch": 7095} {"train_loss": -27.18397331237793, "global_step": 588895, "epoch": 7095} {"train_loss": -26.9274959564209, "global_step": 588896, "epoch": 7095} {"train_loss": -27.156757354736328, "global_step": 588897, "epoch": 7095} {"train_loss": -26.93575096130371, "global_step": 588898, "epoch": 7095} {"train_loss": -27.466760635375977, "global_step": 588899, "epoch": 7095} {"train_loss": -27.438812255859375, "global_step": 588900, "epoch": 7095} {"train_loss": -27.2591552734375, "global_step": 588901, "epoch": 7095} {"train_loss": -27.233129501342773, "global_step": 588902, "epoch": 7095} {"train_loss": -27.664098739624023, "global_step": 588903, "epoch": 7095} {"train_loss": -27.246061325073242, "global_step": 588904, "epoch": 7095} {"train_loss": -27.742124557495117, "global_step": 588905, "epoch": 7095} {"train_loss": -27.34498405456543, "global_step": 588906, "epoch": 7095} {"train_loss": -27.49216079711914, "global_step": 588907, "epoch": 7095} {"train_loss": -27.591772079467773, "global_step": 588908, "epoch": 7095} {"train_loss": -27.503095626831055, "global_step": 588909, "epoch": 7095} {"train_loss": -27.660425186157227, "global_step": 588910, "epoch": 7095} {"train_loss": -28.018173217773438, "global_step": 588911, "epoch": 7095} {"train_loss": -27.60519790649414, "global_step": 588912, "epoch": 7095} {"train_loss": -27.422651290893555, "global_step": 588913, "epoch": 7095} {"train_loss": -27.976593017578125, "global_step": 588914, "epoch": 7095} {"train_loss": -27.851972579956055, "global_step": 588915, "epoch": 7095} {"train_loss": -27.4880313873291, "global_step": 588916, "epoch": 7095} {"train_loss": -27.7152099609375, "global_step": 588917, "epoch": 7095} {"train_loss": -27.719009399414062, "global_step": 588918, "epoch": 7095} {"train_loss": -27.665695190429688, "global_step": 588919, "epoch": 7095} {"train_loss": -27.75372314453125, "global_step": 588920, "epoch": 7095} {"train_loss": -27.835824966430664, "global_step": 588921, "epoch": 7095} {"train_loss": -27.955320358276367, "global_step": 588922, "epoch": 7095} {"train_loss": -28.166669845581055, "global_step": 588923, "epoch": 7095} {"train_loss": -28.239582061767578, "global_step": 588924, "epoch": 7095} {"train_loss": -28.053089141845703, "global_step": 588925, "epoch": 7095} {"train_loss": -28.016904830932617, "global_step": 588926, "epoch": 7095} {"train_loss": -28.13547134399414, "global_step": 588927, "epoch": 7095} {"train_loss": -27.98158836364746, "global_step": 588928, "epoch": 7095} {"train_loss": -28.398534774780273, "global_step": 588929, "epoch": 7095} {"train_loss": -27.976285934448242, "global_step": 588930, "epoch": 7095} {"train_loss": -27.9375057220459, "global_step": 588931, "epoch": 7095} {"train_loss": -27.712081909179688, "global_step": 588932, "epoch": 7095} {"train_loss": -28.198949813842773, "global_step": 588933, "epoch": 7095} {"train_loss": -28.23493766784668, "global_step": 588934, "epoch": 7095} {"train_loss": -28.249216079711914, "global_step": 588935, "epoch": 7095} {"train_loss": -28.206588745117188, "global_step": 588936, "epoch": 7095} {"train_loss": -28.039215087890625, "global_step": 588937, "epoch": 7095} {"train_loss": -28.187620162963867, "global_step": 588938, "epoch": 7095} {"train_loss": -27.53066062927246, "global_step": 588939, "epoch": 7095} {"train_loss": -27.944732666015625, "global_step": 588940, "epoch": 7095} {"train_loss": -27.398889541625977, "global_step": 588941, "epoch": 7095} {"train_loss": -27.54481315612793, "global_step": 588942, "epoch": 7095} {"train_loss": -27.753454208374023, "global_step": 588943, "epoch": 7095} {"train_loss": -28.115957260131836, "global_step": 588944, "epoch": 7095} {"train_loss": -27.978046417236328, "global_step": 588945, "epoch": 7095} {"train_loss": -27.83928871154785, "global_step": 588946, "epoch": 7095} {"train_loss": -28.072839736938477, "global_step": 588947, "epoch": 7095} {"train_loss": -27.657068252563477, "global_step": 588948, "epoch": 7095} {"train_loss": -27.974384307861328, "global_step": 588949, "epoch": 7095} {"train_loss": -28.025049209594727, "global_step": 588950, "epoch": 7095} {"train_loss": -28.035818099975586, "global_step": 588951, "epoch": 7095} {"train_loss": -27.93732261657715, "global_step": 588952, "epoch": 7095} {"train_loss": -27.971332550048828, "global_step": 588953, "epoch": 7095} {"train_loss": -27.62273597717285, "global_step": 588954, "epoch": 7095} {"train_loss": -27.687164306640625, "global_step": 588955, "epoch": 7095} {"train_loss": -28.18227195739746, "global_step": 588956, "epoch": 7095} {"train_loss": -28.083478927612305, "global_step": 588957, "epoch": 7095} {"train_loss": -27.68238639831543, "global_step": 588958, "epoch": 7095} {"train_loss": -27.700498580932617, "global_step": 588959, "epoch": 7095} {"train_loss": -28.310556411743164, "global_step": 588960, "epoch": 7095} {"train_loss": -27.73674964904785, "global_step": 588961, "epoch": 7095} {"train_loss": -27.758695602416992, "global_step": 588962, "epoch": 7095} {"train_loss": -28.101232528686523, "global_step": 588963, "epoch": 7095} {"train_loss": -28.177032470703125, "global_step": 588964, "epoch": 7095} {"train_loss": -27.76116371154785, "global_step": 588965, "epoch": 7095} {"train_loss": -27.804487228393555, "global_step": 588966, "epoch": 7095} {"train_loss": -27.698494853743586, "global_step": 588967, "epoch": 7095, "val_loss": 6568135.5} {"train_loss": -27.205045700073242, "global_step": 588968, "epoch": 7096} {"train_loss": -27.906347274780273, "global_step": 588969, "epoch": 7096} {"train_loss": -27.639511108398438, "global_step": 588970, "epoch": 7096} {"train_loss": -27.461811065673828, "global_step": 588971, "epoch": 7096} {"train_loss": -28.1282958984375, "global_step": 588972, "epoch": 7096} {"train_loss": -27.51081657409668, "global_step": 588973, "epoch": 7096} {"train_loss": -27.757568359375, "global_step": 588974, "epoch": 7096} {"train_loss": -27.582275390625, "global_step": 588975, "epoch": 7096} {"train_loss": -27.46394920349121, "global_step": 588976, "epoch": 7096} {"train_loss": -27.434356689453125, "global_step": 588977, "epoch": 7096} {"train_loss": -28.126306533813477, "global_step": 588978, "epoch": 7096} {"train_loss": -27.744802474975586, "global_step": 588979, "epoch": 7096} {"train_loss": -27.605194091796875, "global_step": 588980, "epoch": 7096} {"train_loss": -27.840124130249023, "global_step": 588981, "epoch": 7096} {"train_loss": -27.94732093811035, "global_step": 588982, "epoch": 7096} {"train_loss": -27.953231811523438, "global_step": 588983, "epoch": 7096} {"train_loss": -27.448301315307617, "global_step": 588984, "epoch": 7096} {"train_loss": -28.14858055114746, "global_step": 588985, "epoch": 7096} {"train_loss": -27.959936141967773, "global_step": 588986, "epoch": 7096} {"train_loss": -27.9549560546875, "global_step": 588987, "epoch": 7096} {"train_loss": -27.99786376953125, "global_step": 588988, "epoch": 7096} {"train_loss": -27.99879264831543, "global_step": 588989, "epoch": 7096} {"train_loss": -28.07465934753418, "global_step": 588990, "epoch": 7096} {"train_loss": -27.75739097595215, "global_step": 588991, "epoch": 7096} {"train_loss": -27.397043228149414, "global_step": 588992, "epoch": 7096} {"train_loss": -27.350324630737305, "global_step": 588993, "epoch": 7096} {"train_loss": -28.18232536315918, "global_step": 588994, "epoch": 7096} {"train_loss": -28.059301376342773, "global_step": 588995, "epoch": 7096} {"train_loss": -28.368459701538086, "global_step": 588996, "epoch": 7096} {"train_loss": -28.065534591674805, "global_step": 588997, "epoch": 7096} {"train_loss": -27.971662521362305, "global_step": 588998, "epoch": 7096} {"train_loss": -28.076385498046875, "global_step": 588999, "epoch": 7096} {"train_loss": -27.93027114868164, "global_step": 589000, "epoch": 7096} {"train_loss": -28.207746505737305, "global_step": 589001, "epoch": 7096} {"train_loss": -28.17844581604004, "global_step": 589002, "epoch": 7096} {"train_loss": -28.386808395385742, "global_step": 589003, "epoch": 7096} {"train_loss": -27.87969398498535, "global_step": 589004, "epoch": 7096} {"train_loss": -28.352304458618164, "global_step": 589005, "epoch": 7096} {"train_loss": -28.112186431884766, "global_step": 589006, "epoch": 7096} {"train_loss": -28.399240493774414, "global_step": 589007, "epoch": 7096} {"train_loss": -27.837879180908203, "global_step": 589008, "epoch": 7096} {"train_loss": -28.277896881103516, "global_step": 589009, "epoch": 7096} {"train_loss": -28.180463790893555, "global_step": 589010, "epoch": 7096} {"train_loss": -27.795011520385742, "global_step": 589011, "epoch": 7096} {"train_loss": -28.036895751953125, "global_step": 589012, "epoch": 7096} {"train_loss": -27.76138687133789, "global_step": 589013, "epoch": 7096} {"train_loss": -28.266681671142578, "global_step": 589014, "epoch": 7096} {"train_loss": -28.2330322265625, "global_step": 589015, "epoch": 7096} {"train_loss": -27.708093643188477, "global_step": 589016, "epoch": 7096} {"train_loss": -28.032642364501953, "global_step": 589017, "epoch": 7096} {"train_loss": -28.22895622253418, "global_step": 589018, "epoch": 7096} {"train_loss": -27.9705753326416, "global_step": 589019, "epoch": 7096} {"train_loss": -27.549589157104492, "global_step": 589020, "epoch": 7096} {"train_loss": -27.85536003112793, "global_step": 589021, "epoch": 7096} {"train_loss": -27.662460327148438, "global_step": 589022, "epoch": 7096} {"train_loss": -27.40565299987793, "global_step": 589023, "epoch": 7096} {"train_loss": -27.397537231445312, "global_step": 589024, "epoch": 7096} {"train_loss": -27.224721908569336, "global_step": 589025, "epoch": 7096} {"train_loss": -27.26788330078125, "global_step": 589026, "epoch": 7096} {"train_loss": -27.5937442779541, "global_step": 589027, "epoch": 7096} {"train_loss": -28.006336212158203, "global_step": 589028, "epoch": 7096} {"train_loss": -27.563440322875977, "global_step": 589029, "epoch": 7096} {"train_loss": -27.577173233032227, "global_step": 589030, "epoch": 7096} {"train_loss": -27.824859619140625, "global_step": 589031, "epoch": 7096} {"train_loss": -27.63760757446289, "global_step": 589032, "epoch": 7096} {"train_loss": -28.196502685546875, "global_step": 589033, "epoch": 7096} {"train_loss": -27.77461051940918, "global_step": 589034, "epoch": 7096} {"train_loss": -27.69594383239746, "global_step": 589035, "epoch": 7096} {"train_loss": -27.82516860961914, "global_step": 589036, "epoch": 7096} {"train_loss": -27.956335067749023, "global_step": 589037, "epoch": 7096} {"train_loss": -27.603626251220703, "global_step": 589038, "epoch": 7096} {"train_loss": -28.06776237487793, "global_step": 589039, "epoch": 7096} {"train_loss": -27.649824142456055, "global_step": 589040, "epoch": 7096} {"train_loss": -28.05720329284668, "global_step": 589041, "epoch": 7096} {"train_loss": -28.1148681640625, "global_step": 589042, "epoch": 7096} {"train_loss": -28.06159019470215, "global_step": 589043, "epoch": 7096} {"train_loss": -27.96711540222168, "global_step": 589044, "epoch": 7096} {"train_loss": -27.659265518188477, "global_step": 589045, "epoch": 7096} {"train_loss": -28.088336944580078, "global_step": 589046, "epoch": 7096} {"train_loss": -28.28852653503418, "global_step": 589047, "epoch": 7096} {"train_loss": -27.891149520874023, "global_step": 589048, "epoch": 7096} {"train_loss": -27.984085083007812, "global_step": 589049, "epoch": 7096} {"train_loss": -27.847570901893707, "global_step": 589050, "epoch": 7096, "val_loss": 6498163.0} {"train_loss": -27.204015731811523, "global_step": 589051, "epoch": 7097} {"train_loss": -27.957849502563477, "global_step": 589052, "epoch": 7097} {"train_loss": -27.334766387939453, "global_step": 589053, "epoch": 7097} {"train_loss": -27.606595993041992, "global_step": 589054, "epoch": 7097} {"train_loss": -27.366413116455078, "global_step": 589055, "epoch": 7097} {"train_loss": -27.428207397460938, "global_step": 589056, "epoch": 7097} {"train_loss": -27.35089111328125, "global_step": 589057, "epoch": 7097} {"train_loss": -27.445158004760742, "global_step": 589058, "epoch": 7097} {"train_loss": -27.50043296813965, "global_step": 589059, "epoch": 7097} {"train_loss": -28.009052276611328, "global_step": 589060, "epoch": 7097} {"train_loss": -27.635986328125, "global_step": 589061, "epoch": 7097} {"train_loss": -27.655881881713867, "global_step": 589062, "epoch": 7097} {"train_loss": -27.864145278930664, "global_step": 589063, "epoch": 7097} {"train_loss": -27.569501876831055, "global_step": 589064, "epoch": 7097} {"train_loss": -27.697708129882812, "global_step": 589065, "epoch": 7097} {"train_loss": -27.98969841003418, "global_step": 589066, "epoch": 7097} {"train_loss": -28.035215377807617, "global_step": 589067, "epoch": 7097} {"train_loss": -27.577762603759766, "global_step": 589068, "epoch": 7097} {"train_loss": -27.823034286499023, "global_step": 589069, "epoch": 7097} {"train_loss": -27.67792320251465, "global_step": 589070, "epoch": 7097} {"train_loss": -27.895965576171875, "global_step": 589071, "epoch": 7097} {"train_loss": -28.213003158569336, "global_step": 589072, "epoch": 7097} {"train_loss": -27.86468505859375, "global_step": 589073, "epoch": 7097} {"train_loss": -28.01616859436035, "global_step": 589074, "epoch": 7097} {"train_loss": -27.839496612548828, "global_step": 589075, "epoch": 7097} {"train_loss": -28.021970748901367, "global_step": 589076, "epoch": 7097} {"train_loss": -27.900110244750977, "global_step": 589077, "epoch": 7097} {"train_loss": -27.53944206237793, "global_step": 589078, "epoch": 7097} {"train_loss": -28.044530868530273, "global_step": 589079, "epoch": 7097} {"train_loss": -27.63739013671875, "global_step": 589080, "epoch": 7097} {"train_loss": -27.962491989135742, "global_step": 589081, "epoch": 7097} {"train_loss": -28.30063819885254, "global_step": 589082, "epoch": 7097} {"train_loss": -27.862567901611328, "global_step": 589083, "epoch": 7097} {"train_loss": -27.951370239257812, "global_step": 589084, "epoch": 7097} {"train_loss": -27.657093048095703, "global_step": 589085, "epoch": 7097} {"train_loss": -28.420568466186523, "global_step": 589086, "epoch": 7097} {"train_loss": -28.068267822265625, "global_step": 589087, "epoch": 7097} {"train_loss": -27.785593032836914, "global_step": 589088, "epoch": 7097} {"train_loss": -28.186172485351562, "global_step": 589089, "epoch": 7097} {"train_loss": -27.93617057800293, "global_step": 589090, "epoch": 7097} {"train_loss": -28.31781005859375, "global_step": 589091, "epoch": 7097} {"train_loss": -27.623523712158203, "global_step": 589092, "epoch": 7097} {"train_loss": -28.239145278930664, "global_step": 589093, "epoch": 7097} {"train_loss": -28.194860458374023, "global_step": 589094, "epoch": 7097} {"train_loss": -27.437824249267578, "global_step": 589095, "epoch": 7097} {"train_loss": -27.781463623046875, "global_step": 589096, "epoch": 7097} {"train_loss": -28.23074722290039, "global_step": 589097, "epoch": 7097} {"train_loss": -27.96625328063965, "global_step": 589098, "epoch": 7097} {"train_loss": -27.529590606689453, "global_step": 589099, "epoch": 7097} {"train_loss": -27.77996253967285, "global_step": 589100, "epoch": 7097} {"train_loss": -28.087549209594727, "global_step": 589101, "epoch": 7097} {"train_loss": -28.398595809936523, "global_step": 589102, "epoch": 7097} {"train_loss": -28.026269912719727, "global_step": 589103, "epoch": 7097} {"train_loss": -28.1317138671875, "global_step": 589104, "epoch": 7097} {"train_loss": -27.866479873657227, "global_step": 589105, "epoch": 7097} {"train_loss": -27.52544593811035, "global_step": 589106, "epoch": 7097} {"train_loss": -27.682687759399414, "global_step": 589107, "epoch": 7097} {"train_loss": -27.82053565979004, "global_step": 589108, "epoch": 7097} {"train_loss": -28.15730857849121, "global_step": 589109, "epoch": 7097} {"train_loss": -27.961694717407227, "global_step": 589110, "epoch": 7097} {"train_loss": -28.024988174438477, "global_step": 589111, "epoch": 7097} {"train_loss": -27.565235137939453, "global_step": 589112, "epoch": 7097} {"train_loss": -27.701465606689453, "global_step": 589113, "epoch": 7097} {"train_loss": -28.1466007232666, "global_step": 589114, "epoch": 7097} {"train_loss": -27.70453453063965, "global_step": 589115, "epoch": 7097} {"train_loss": -27.768238067626953, "global_step": 589116, "epoch": 7097} {"train_loss": -28.189777374267578, "global_step": 589117, "epoch": 7097} {"train_loss": -27.832197189331055, "global_step": 589118, "epoch": 7097} {"train_loss": -27.701160430908203, "global_step": 589119, "epoch": 7097} {"train_loss": -27.80720329284668, "global_step": 589120, "epoch": 7097} {"train_loss": -28.228193283081055, "global_step": 589121, "epoch": 7097} {"train_loss": -28.267520904541016, "global_step": 589122, "epoch": 7097} {"train_loss": -27.51310157775879, "global_step": 589123, "epoch": 7097} {"train_loss": -27.907819747924805, "global_step": 589124, "epoch": 7097} {"train_loss": -28.27886962890625, "global_step": 589125, "epoch": 7097} {"train_loss": -27.807825088500977, "global_step": 589126, "epoch": 7097} {"train_loss": -28.10955810546875, "global_step": 589127, "epoch": 7097} {"train_loss": -28.185138702392578, "global_step": 589128, "epoch": 7097} {"train_loss": -28.294574737548828, "global_step": 589129, "epoch": 7097} {"train_loss": -27.82819175720215, "global_step": 589130, "epoch": 7097} {"train_loss": -27.740955352783203, "global_step": 589131, "epoch": 7097} {"train_loss": -27.445173263549805, "global_step": 589132, "epoch": 7097} {"train_loss": -27.87611340901938, "global_step": 589133, "epoch": 7097, "val_loss": 6535826.0} {"train_loss": -27.006256103515625, "global_step": 589134, "epoch": 7098} {"train_loss": -26.9365234375, "global_step": 589135, "epoch": 7098} {"train_loss": -26.651519775390625, "global_step": 589136, "epoch": 7098} {"train_loss": -27.545581817626953, "global_step": 589137, "epoch": 7098} {"train_loss": -27.146703720092773, "global_step": 589138, "epoch": 7098} {"train_loss": -27.198522567749023, "global_step": 589139, "epoch": 7098} {"train_loss": -27.413782119750977, "global_step": 589140, "epoch": 7098} {"train_loss": -27.489959716796875, "global_step": 589141, "epoch": 7098} {"train_loss": -27.35031509399414, "global_step": 589142, "epoch": 7098} {"train_loss": -27.40065574645996, "global_step": 589143, "epoch": 7098} {"train_loss": -27.46140480041504, "global_step": 589144, "epoch": 7098} {"train_loss": -27.81049156188965, "global_step": 589145, "epoch": 7098} {"train_loss": -27.587263107299805, "global_step": 589146, "epoch": 7098} {"train_loss": -27.770666122436523, "global_step": 589147, "epoch": 7098} {"train_loss": -27.48931884765625, "global_step": 589148, "epoch": 7098} {"train_loss": -27.79202651977539, "global_step": 589149, "epoch": 7098} {"train_loss": -27.6639461517334, "global_step": 589150, "epoch": 7098} {"train_loss": -27.51611328125, "global_step": 589151, "epoch": 7098} {"train_loss": -27.831817626953125, "global_step": 589152, "epoch": 7098} {"train_loss": -27.8045711517334, "global_step": 589153, "epoch": 7098} {"train_loss": -27.62858009338379, "global_step": 589154, "epoch": 7098} {"train_loss": -27.79078483581543, "global_step": 589155, "epoch": 7098} {"train_loss": -27.865869522094727, "global_step": 589156, "epoch": 7098} {"train_loss": -27.80218505859375, "global_step": 589157, "epoch": 7098} {"train_loss": -28.264326095581055, "global_step": 589158, "epoch": 7098} {"train_loss": -27.965076446533203, "global_step": 589159, "epoch": 7098} {"train_loss": -27.557336807250977, "global_step": 589160, "epoch": 7098} {"train_loss": -27.838293075561523, "global_step": 589161, "epoch": 7098} {"train_loss": -28.071054458618164, "global_step": 589162, "epoch": 7098} {"train_loss": -28.103824615478516, "global_step": 589163, "epoch": 7098} {"train_loss": -28.200916290283203, "global_step": 589164, "epoch": 7098} {"train_loss": -28.24812889099121, "global_step": 589165, "epoch": 7098} {"train_loss": -27.919055938720703, "global_step": 589166, "epoch": 7098} {"train_loss": -27.892486572265625, "global_step": 589167, "epoch": 7098} {"train_loss": -28.068073272705078, "global_step": 589168, "epoch": 7098} {"train_loss": -28.081165313720703, "global_step": 589169, "epoch": 7098} {"train_loss": -28.09937858581543, "global_step": 589170, "epoch": 7098} {"train_loss": -27.924856185913086, "global_step": 589171, "epoch": 7098} {"train_loss": -27.93505859375, "global_step": 589172, "epoch": 7098} {"train_loss": -28.346729278564453, "global_step": 589173, "epoch": 7098} {"train_loss": -28.038328170776367, "global_step": 589174, "epoch": 7098} {"train_loss": -28.186933517456055, "global_step": 589175, "epoch": 7098} {"train_loss": -27.71744155883789, "global_step": 589176, "epoch": 7098} {"train_loss": -27.16132164001465, "global_step": 589177, "epoch": 7098} {"train_loss": -27.15801429748535, "global_step": 589178, "epoch": 7098} {"train_loss": -27.52613639831543, "global_step": 589179, "epoch": 7098} {"train_loss": -28.280414581298828, "global_step": 589180, "epoch": 7098} {"train_loss": -27.574878692626953, "global_step": 589181, "epoch": 7098} {"train_loss": -27.48919677734375, "global_step": 589182, "epoch": 7098} {"train_loss": -27.99928855895996, "global_step": 589183, "epoch": 7098} {"train_loss": -27.91168785095215, "global_step": 589184, "epoch": 7098} {"train_loss": -27.809690475463867, "global_step": 589185, "epoch": 7098} {"train_loss": -27.92390251159668, "global_step": 589186, "epoch": 7098} {"train_loss": -27.72041893005371, "global_step": 589187, "epoch": 7098} {"train_loss": -27.618961334228516, "global_step": 589188, "epoch": 7098} {"train_loss": -27.690448760986328, "global_step": 589189, "epoch": 7098} {"train_loss": -27.908203125, "global_step": 589190, "epoch": 7098} {"train_loss": -27.800140380859375, "global_step": 589191, "epoch": 7098} {"train_loss": -28.3994140625, "global_step": 589192, "epoch": 7098} {"train_loss": -27.7301025390625, "global_step": 589193, "epoch": 7098} {"train_loss": -27.588754653930664, "global_step": 589194, "epoch": 7098} {"train_loss": -27.732954025268555, "global_step": 589195, "epoch": 7098} {"train_loss": -27.680164337158203, "global_step": 589196, "epoch": 7098} {"train_loss": -27.04104995727539, "global_step": 589197, "epoch": 7098} {"train_loss": -27.693166732788086, "global_step": 589198, "epoch": 7098} {"train_loss": -27.75776481628418, "global_step": 589199, "epoch": 7098} {"train_loss": -27.676193237304688, "global_step": 589200, "epoch": 7098} {"train_loss": -27.762006759643555, "global_step": 589201, "epoch": 7098} {"train_loss": -27.98370361328125, "global_step": 589202, "epoch": 7098} {"train_loss": -27.8708438873291, "global_step": 589203, "epoch": 7098} {"train_loss": -28.14995765686035, "global_step": 589204, "epoch": 7098} {"train_loss": -27.90802001953125, "global_step": 589205, "epoch": 7098} {"train_loss": -27.80059814453125, "global_step": 589206, "epoch": 7098} {"train_loss": -27.75263786315918, "global_step": 589207, "epoch": 7098} {"train_loss": -28.345203399658203, "global_step": 589208, "epoch": 7098} {"train_loss": -28.537912368774414, "global_step": 589209, "epoch": 7098} {"train_loss": -28.346176147460938, "global_step": 589210, "epoch": 7098} {"train_loss": -28.1062068939209, "global_step": 589211, "epoch": 7098} {"train_loss": -27.67567253112793, "global_step": 589212, "epoch": 7098} {"train_loss": -28.15585708618164, "global_step": 589213, "epoch": 7098} {"train_loss": -28.1254940032959, "global_step": 589214, "epoch": 7098} {"train_loss": -27.961933135986328, "global_step": 589215, "epoch": 7098} {"train_loss": -27.7650920224477, "global_step": 589216, "epoch": 7098, "val_loss": 6557633.0} {"train_loss": -27.971715927124023, "global_step": 589217, "epoch": 7099} {"train_loss": -27.59100341796875, "global_step": 589218, "epoch": 7099} {"train_loss": -27.736316680908203, "global_step": 589219, "epoch": 7099} {"train_loss": -27.325687408447266, "global_step": 589220, "epoch": 7099} {"train_loss": -27.3060359954834, "global_step": 589221, "epoch": 7099} {"train_loss": -27.171655654907227, "global_step": 589222, "epoch": 7099} {"train_loss": -27.6025447845459, "global_step": 589223, "epoch": 7099} {"train_loss": -27.199750900268555, "global_step": 589224, "epoch": 7099} {"train_loss": -27.650190353393555, "global_step": 589225, "epoch": 7099} {"train_loss": -27.7746524810791, "global_step": 589226, "epoch": 7099} {"train_loss": -27.149993896484375, "global_step": 589227, "epoch": 7099} {"train_loss": -27.711149215698242, "global_step": 589228, "epoch": 7099} {"train_loss": -27.9434814453125, "global_step": 589229, "epoch": 7099} {"train_loss": -27.801380157470703, "global_step": 589230, "epoch": 7099} {"train_loss": -27.65740966796875, "global_step": 589231, "epoch": 7099} {"train_loss": -27.953693389892578, "global_step": 589232, "epoch": 7099} {"train_loss": -27.898273468017578, "global_step": 589233, "epoch": 7099} {"train_loss": -27.55470085144043, "global_step": 589234, "epoch": 7099} {"train_loss": -27.55328369140625, "global_step": 589235, "epoch": 7099} {"train_loss": -27.513458251953125, "global_step": 589236, "epoch": 7099} {"train_loss": -27.678674697875977, "global_step": 589237, "epoch": 7099} {"train_loss": -27.448822021484375, "global_step": 589238, "epoch": 7099} {"train_loss": -27.964786529541016, "global_step": 589239, "epoch": 7099} {"train_loss": -27.96170425415039, "global_step": 589240, "epoch": 7099} {"train_loss": -27.827939987182617, "global_step": 589241, "epoch": 7099} {"train_loss": -27.851423263549805, "global_step": 589242, "epoch": 7099} {"train_loss": -28.000568389892578, "global_step": 589243, "epoch": 7099} {"train_loss": -27.87564468383789, "global_step": 589244, "epoch": 7099} {"train_loss": -27.96540641784668, "global_step": 589245, "epoch": 7099} {"train_loss": -27.88018226623535, "global_step": 589246, "epoch": 7099} {"train_loss": -27.96877098083496, "global_step": 589247, "epoch": 7099} {"train_loss": -28.064712524414062, "global_step": 589248, "epoch": 7099} {"train_loss": -27.535276412963867, "global_step": 589249, "epoch": 7099} {"train_loss": -28.039770126342773, "global_step": 589250, "epoch": 7099} {"train_loss": -27.687671661376953, "global_step": 589251, "epoch": 7099} {"train_loss": -27.82728385925293, "global_step": 589252, "epoch": 7099} {"train_loss": -28.21168327331543, "global_step": 589253, "epoch": 7099} {"train_loss": -28.059558868408203, "global_step": 589254, "epoch": 7099} {"train_loss": -28.09800148010254, "global_step": 589255, "epoch": 7099} {"train_loss": -27.99004554748535, "global_step": 589256, "epoch": 7099} {"train_loss": -28.061017990112305, "global_step": 589257, "epoch": 7099} {"train_loss": -28.01445960998535, "global_step": 589258, "epoch": 7099} {"train_loss": -28.190916061401367, "global_step": 589259, "epoch": 7099} {"train_loss": -28.17310905456543, "global_step": 589260, "epoch": 7099} {"train_loss": -28.188705444335938, "global_step": 589261, "epoch": 7099} {"train_loss": -28.08021354675293, "global_step": 589262, "epoch": 7099} {"train_loss": -28.16212272644043, "global_step": 589263, "epoch": 7099} {"train_loss": -28.130460739135742, "global_step": 589264, "epoch": 7099} {"train_loss": -28.357656478881836, "global_step": 589265, "epoch": 7099} {"train_loss": -28.091474533081055, "global_step": 589266, "epoch": 7099} {"train_loss": -28.599445343017578, "global_step": 589267, "epoch": 7099} {"train_loss": -27.990095138549805, "global_step": 589268, "epoch": 7099} {"train_loss": -28.246784210205078, "global_step": 589269, "epoch": 7099} {"train_loss": -28.30006217956543, "global_step": 589270, "epoch": 7099} {"train_loss": -27.866064071655273, "global_step": 589271, "epoch": 7099} {"train_loss": -27.628787994384766, "global_step": 589272, "epoch": 7099} {"train_loss": -27.47890281677246, "global_step": 589273, "epoch": 7099} {"train_loss": -27.698944091796875, "global_step": 589274, "epoch": 7099} {"train_loss": -27.77241325378418, "global_step": 589275, "epoch": 7099} {"train_loss": -28.11722755432129, "global_step": 589276, "epoch": 7099} {"train_loss": -27.485822677612305, "global_step": 589277, "epoch": 7099} {"train_loss": -28.169347763061523, "global_step": 589278, "epoch": 7099} {"train_loss": -28.008634567260742, "global_step": 589279, "epoch": 7099} {"train_loss": -28.162092208862305, "global_step": 589280, "epoch": 7099} {"train_loss": -28.094562530517578, "global_step": 589281, "epoch": 7099} {"train_loss": -28.04990005493164, "global_step": 589282, "epoch": 7099} {"train_loss": -27.83235740661621, "global_step": 589283, "epoch": 7099} {"train_loss": -27.9044246673584, "global_step": 589284, "epoch": 7099} {"train_loss": -27.834447860717773, "global_step": 589285, "epoch": 7099} {"train_loss": -28.20255470275879, "global_step": 589286, "epoch": 7099} {"train_loss": -27.925537109375, "global_step": 589287, "epoch": 7099} {"train_loss": -28.22260093688965, "global_step": 589288, "epoch": 7099} {"train_loss": -28.032678604125977, "global_step": 589289, "epoch": 7099} {"train_loss": -27.801349639892578, "global_step": 589290, "epoch": 7099} {"train_loss": -27.487060546875, "global_step": 589291, "epoch": 7099} {"train_loss": -27.835498809814453, "global_step": 589292, "epoch": 7099} {"train_loss": -27.585926055908203, "global_step": 589293, "epoch": 7099} {"train_loss": -28.020099639892578, "global_step": 589294, "epoch": 7099} {"train_loss": -27.86029052734375, "global_step": 589295, "epoch": 7099} {"train_loss": -28.127256393432617, "global_step": 589296, "epoch": 7099} {"train_loss": -28.004674911499023, "global_step": 589297, "epoch": 7099} {"train_loss": -27.504377365112305, "global_step": 589298, "epoch": 7099} {"train_loss": -27.860013846891473, "global_step": 589299, "epoch": 7099, "val_loss": 6525069.5} {"train_loss": -27.66562271118164, "global_step": 589300, "epoch": 7100} {"train_loss": -26.926111221313477, "global_step": 589301, "epoch": 7100} {"train_loss": -26.869873046875, "global_step": 589302, "epoch": 7100} {"train_loss": -27.19624900817871, "global_step": 589303, "epoch": 7100} {"train_loss": -27.216108322143555, "global_step": 589304, "epoch": 7100} {"train_loss": -26.748197555541992, "global_step": 589305, "epoch": 7100} {"train_loss": -27.02143669128418, "global_step": 589306, "epoch": 7100} {"train_loss": -26.653095245361328, "global_step": 589307, "epoch": 7100} {"train_loss": -27.653059005737305, "global_step": 589308, "epoch": 7100} {"train_loss": -27.506256103515625, "global_step": 589309, "epoch": 7100} {"train_loss": -26.6844425201416, "global_step": 589310, "epoch": 7100} {"train_loss": -27.606002807617188, "global_step": 589311, "epoch": 7100} {"train_loss": -27.088598251342773, "global_step": 589312, "epoch": 7100} {"train_loss": -27.270116806030273, "global_step": 589313, "epoch": 7100} {"train_loss": -27.91874122619629, "global_step": 589314, "epoch": 7100} {"train_loss": -27.08212661743164, "global_step": 589315, "epoch": 7100} {"train_loss": -27.624425888061523, "global_step": 589316, "epoch": 7100} {"train_loss": -27.53212547302246, "global_step": 589317, "epoch": 7100} {"train_loss": -27.35499382019043, "global_step": 589318, "epoch": 7100} {"train_loss": -27.8230037689209, "global_step": 589319, "epoch": 7100} {"train_loss": -27.91596794128418, "global_step": 589320, "epoch": 7100} {"train_loss": -27.990304946899414, "global_step": 589321, "epoch": 7100} {"train_loss": -27.410917282104492, "global_step": 589322, "epoch": 7100} {"train_loss": -27.659366607666016, "global_step": 589323, "epoch": 7100} {"train_loss": -28.027029037475586, "global_step": 589324, "epoch": 7100} {"train_loss": -27.647296905517578, "global_step": 589325, "epoch": 7100} {"train_loss": -28.204315185546875, "global_step": 589326, "epoch": 7100} {"train_loss": -28.10881996154785, "global_step": 589327, "epoch": 7100} {"train_loss": -28.07484245300293, "global_step": 589328, "epoch": 7100} {"train_loss": -28.035215377807617, "global_step": 589329, "epoch": 7100} {"train_loss": -27.912078857421875, "global_step": 589330, "epoch": 7100} {"train_loss": -27.832965850830078, "global_step": 589331, "epoch": 7100} {"train_loss": -28.158395767211914, "global_step": 589332, "epoch": 7100} {"train_loss": -27.949298858642578, "global_step": 589333, "epoch": 7100} {"train_loss": -28.08839988708496, "global_step": 589334, "epoch": 7100} {"train_loss": -28.17559242248535, "global_step": 589335, "epoch": 7100} {"train_loss": -28.044260025024414, "global_step": 589336, "epoch": 7100} {"train_loss": -27.62162208557129, "global_step": 589337, "epoch": 7100} {"train_loss": -28.056589126586914, "global_step": 589338, "epoch": 7100} {"train_loss": -28.149866104125977, "global_step": 589339, "epoch": 7100} {"train_loss": -28.34149169921875, "global_step": 589340, "epoch": 7100} {"train_loss": -28.292356491088867, "global_step": 589341, "epoch": 7100} {"train_loss": -27.901437759399414, "global_step": 589342, "epoch": 7100} {"train_loss": -27.928436279296875, "global_step": 589343, "epoch": 7100} {"train_loss": -28.04912757873535, "global_step": 589344, "epoch": 7100} {"train_loss": -28.057043075561523, "global_step": 589345, "epoch": 7100} {"train_loss": -27.772418975830078, "global_step": 589346, "epoch": 7100} {"train_loss": -28.186017990112305, "global_step": 589347, "epoch": 7100} {"train_loss": -27.71135902404785, "global_step": 589348, "epoch": 7100} {"train_loss": -27.64703369140625, "global_step": 589349, "epoch": 7100} {"train_loss": -27.979949951171875, "global_step": 589350, "epoch": 7100} {"train_loss": -27.942346572875977, "global_step": 589351, "epoch": 7100} {"train_loss": -27.926544189453125, "global_step": 589352, "epoch": 7100} {"train_loss": -28.25187110900879, "global_step": 589353, "epoch": 7100} {"train_loss": -27.91737937927246, "global_step": 589354, "epoch": 7100} {"train_loss": -28.03508949279785, "global_step": 589355, "epoch": 7100} {"train_loss": -27.84661865234375, "global_step": 589356, "epoch": 7100} {"train_loss": -27.252124786376953, "global_step": 589357, "epoch": 7100} {"train_loss": -27.882108688354492, "global_step": 589358, "epoch": 7100} {"train_loss": -27.50251579284668, "global_step": 589359, "epoch": 7100} {"train_loss": -28.270627975463867, "global_step": 589360, "epoch": 7100} {"train_loss": -28.129079818725586, "global_step": 589361, "epoch": 7100} {"train_loss": -28.011245727539062, "global_step": 589362, "epoch": 7100} {"train_loss": -27.81833267211914, "global_step": 589363, "epoch": 7100} {"train_loss": -28.480932235717773, "global_step": 589364, "epoch": 7100} {"train_loss": -27.922903060913086, "global_step": 589365, "epoch": 7100} {"train_loss": -27.8514347076416, "global_step": 589366, "epoch": 7100} {"train_loss": -27.990310668945312, "global_step": 589367, "epoch": 7100} {"train_loss": -27.905445098876953, "global_step": 589368, "epoch": 7100} {"train_loss": -28.215774536132812, "global_step": 589369, "epoch": 7100} {"train_loss": -28.248676300048828, "global_step": 589370, "epoch": 7100} {"train_loss": -27.78083610534668, "global_step": 589371, "epoch": 7100} {"train_loss": -28.10357093811035, "global_step": 589372, "epoch": 7100} {"train_loss": -28.272993087768555, "global_step": 589373, "epoch": 7100} {"train_loss": -27.885244369506836, "global_step": 589374, "epoch": 7100} {"train_loss": -27.98370361328125, "global_step": 589375, "epoch": 7100} {"train_loss": -27.92487144470215, "global_step": 589376, "epoch": 7100} {"train_loss": -27.434417724609375, "global_step": 589377, "epoch": 7100} {"train_loss": -27.53460121154785, "global_step": 589378, "epoch": 7100} {"train_loss": -27.738204956054688, "global_step": 589379, "epoch": 7100} {"train_loss": -27.87983512878418, "global_step": 589380, "epoch": 7100} {"train_loss": -28.0244197845459, "global_step": 589381, "epoch": 7100} {"train_loss": -27.786287859261755, "global_step": 589382, "epoch": 7100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6570266.0} {"train_loss": -26.746295928955078, "global_step": 589383, "epoch": 7101} {"train_loss": -26.97610855102539, "global_step": 589384, "epoch": 7101} {"train_loss": -26.573942184448242, "global_step": 589385, "epoch": 7101} {"train_loss": -26.886188507080078, "global_step": 589386, "epoch": 7101} {"train_loss": -26.855712890625, "global_step": 589387, "epoch": 7101} {"train_loss": -26.747333526611328, "global_step": 589388, "epoch": 7101} {"train_loss": -27.112613677978516, "global_step": 589389, "epoch": 7101} {"train_loss": -27.116504669189453, "global_step": 589390, "epoch": 7101} {"train_loss": -27.03506851196289, "global_step": 589391, "epoch": 7101} {"train_loss": -27.640045166015625, "global_step": 589392, "epoch": 7101} {"train_loss": -27.316221237182617, "global_step": 589393, "epoch": 7101} {"train_loss": -27.05194664001465, "global_step": 589394, "epoch": 7101} {"train_loss": -27.68572998046875, "global_step": 589395, "epoch": 7101} {"train_loss": -27.715707778930664, "global_step": 589396, "epoch": 7101} {"train_loss": -27.324811935424805, "global_step": 589397, "epoch": 7101} {"train_loss": -27.562854766845703, "global_step": 589398, "epoch": 7101} {"train_loss": -27.891422271728516, "global_step": 589399, "epoch": 7101} {"train_loss": -27.52998161315918, "global_step": 589400, "epoch": 7101} {"train_loss": -27.373937606811523, "global_step": 589401, "epoch": 7101} {"train_loss": -27.839141845703125, "global_step": 589402, "epoch": 7101} {"train_loss": -27.67426872253418, "global_step": 589403, "epoch": 7101} {"train_loss": -27.712177276611328, "global_step": 589404, "epoch": 7101} {"train_loss": -27.77790641784668, "global_step": 589405, "epoch": 7101} {"train_loss": -27.571908950805664, "global_step": 589406, "epoch": 7101} {"train_loss": -27.647979736328125, "global_step": 589407, "epoch": 7101} {"train_loss": -28.040098190307617, "global_step": 589408, "epoch": 7101} {"train_loss": -28.24566078186035, "global_step": 589409, "epoch": 7101} {"train_loss": -28.118350982666016, "global_step": 589410, "epoch": 7101} {"train_loss": -27.989654541015625, "global_step": 589411, "epoch": 7101} {"train_loss": -27.947284698486328, "global_step": 589412, "epoch": 7101} {"train_loss": -27.785425186157227, "global_step": 589413, "epoch": 7101} {"train_loss": -28.220666885375977, "global_step": 589414, "epoch": 7101} {"train_loss": -28.205209732055664, "global_step": 589415, "epoch": 7101} {"train_loss": -28.07303237915039, "global_step": 589416, "epoch": 7101} {"train_loss": -27.9456729888916, "global_step": 589417, "epoch": 7101} {"train_loss": -28.097082138061523, "global_step": 589418, "epoch": 7101} {"train_loss": -28.157785415649414, "global_step": 589419, "epoch": 7101} {"train_loss": -27.927160263061523, "global_step": 589420, "epoch": 7101} {"train_loss": -28.030811309814453, "global_step": 589421, "epoch": 7101} {"train_loss": -28.1490535736084, "global_step": 589422, "epoch": 7101} {"train_loss": -28.359525680541992, "global_step": 589423, "epoch": 7101} {"train_loss": -28.2275447845459, "global_step": 589424, "epoch": 7101} {"train_loss": -28.375776290893555, "global_step": 589425, "epoch": 7101} {"train_loss": -28.26984214782715, "global_step": 589426, "epoch": 7101} {"train_loss": -28.261859893798828, "global_step": 589427, "epoch": 7101} {"train_loss": -27.835737228393555, "global_step": 589428, "epoch": 7101} {"train_loss": -27.742170333862305, "global_step": 589429, "epoch": 7101} {"train_loss": -28.097736358642578, "global_step": 589430, "epoch": 7101} {"train_loss": -28.515243530273438, "global_step": 589431, "epoch": 7101} {"train_loss": -27.906396865844727, "global_step": 589432, "epoch": 7101} {"train_loss": -27.98366355895996, "global_step": 589433, "epoch": 7101} {"train_loss": -28.147974014282227, "global_step": 589434, "epoch": 7101} {"train_loss": -27.74344253540039, "global_step": 589435, "epoch": 7101} {"train_loss": -27.968494415283203, "global_step": 589436, "epoch": 7101} {"train_loss": -27.799579620361328, "global_step": 589437, "epoch": 7101} {"train_loss": -27.930572509765625, "global_step": 589438, "epoch": 7101} {"train_loss": -27.7969970703125, "global_step": 589439, "epoch": 7101} {"train_loss": -27.688879013061523, "global_step": 589440, "epoch": 7101} {"train_loss": -27.60536003112793, "global_step": 589441, "epoch": 7101} {"train_loss": -27.552087783813477, "global_step": 589442, "epoch": 7101} {"train_loss": -27.874649047851562, "global_step": 589443, "epoch": 7101} {"train_loss": -27.5371150970459, "global_step": 589444, "epoch": 7101} {"train_loss": -27.8887939453125, "global_step": 589445, "epoch": 7101} {"train_loss": -27.878721237182617, "global_step": 589446, "epoch": 7101} {"train_loss": -28.108800888061523, "global_step": 589447, "epoch": 7101} {"train_loss": -28.304767608642578, "global_step": 589448, "epoch": 7101} {"train_loss": -27.56560707092285, "global_step": 589449, "epoch": 7101} {"train_loss": -28.24114990234375, "global_step": 589450, "epoch": 7101} {"train_loss": -27.991159439086914, "global_step": 589451, "epoch": 7101} {"train_loss": -27.9626522064209, "global_step": 589452, "epoch": 7101} {"train_loss": -27.56473159790039, "global_step": 589453, "epoch": 7101} {"train_loss": -28.138723373413086, "global_step": 589454, "epoch": 7101} {"train_loss": -28.007156372070312, "global_step": 589455, "epoch": 7101} {"train_loss": -28.218698501586914, "global_step": 589456, "epoch": 7101} {"train_loss": -28.40093421936035, "global_step": 589457, "epoch": 7101} {"train_loss": -27.643991470336914, "global_step": 589458, "epoch": 7101} {"train_loss": -28.06402015686035, "global_step": 589459, "epoch": 7101} {"train_loss": -28.062488555908203, "global_step": 589460, "epoch": 7101} {"train_loss": -28.1320858001709, "global_step": 589461, "epoch": 7101} {"train_loss": -28.02850914001465, "global_step": 589462, "epoch": 7101} {"train_loss": -28.148639678955078, "global_step": 589463, "epoch": 7101} {"train_loss": -28.31768798828125, "global_step": 589464, "epoch": 7101} {"train_loss": -27.802600883575806, "global_step": 589465, "epoch": 7101, "val_loss": 6574112.5} {"train_loss": -25.504663467407227, "global_step": 589466, "epoch": 7102} {"train_loss": -24.083532333374023, "global_step": 589467, "epoch": 7102} {"train_loss": -23.558149337768555, "global_step": 589468, "epoch": 7102} {"train_loss": -26.271087646484375, "global_step": 589469, "epoch": 7102} {"train_loss": -25.63169288635254, "global_step": 589470, "epoch": 7102} {"train_loss": -26.455408096313477, "global_step": 589471, "epoch": 7102} {"train_loss": -25.59064483642578, "global_step": 589472, "epoch": 7102} {"train_loss": -26.464025497436523, "global_step": 589473, "epoch": 7102} {"train_loss": -25.788053512573242, "global_step": 589474, "epoch": 7102} {"train_loss": -26.2814884185791, "global_step": 589475, "epoch": 7102} {"train_loss": -26.15673828125, "global_step": 589476, "epoch": 7102} {"train_loss": -26.829797744750977, "global_step": 589477, "epoch": 7102} {"train_loss": -26.575220108032227, "global_step": 589478, "epoch": 7102} {"train_loss": -27.479095458984375, "global_step": 589479, "epoch": 7102} {"train_loss": -26.475452423095703, "global_step": 589480, "epoch": 7102} {"train_loss": -26.878921508789062, "global_step": 589481, "epoch": 7102} {"train_loss": -27.113142013549805, "global_step": 589482, "epoch": 7102} {"train_loss": -27.232471466064453, "global_step": 589483, "epoch": 7102} {"train_loss": -27.085098266601562, "global_step": 589484, "epoch": 7102} {"train_loss": -27.274765014648438, "global_step": 589485, "epoch": 7102} {"train_loss": -27.217212677001953, "global_step": 589486, "epoch": 7102} {"train_loss": -27.515695571899414, "global_step": 589487, "epoch": 7102} {"train_loss": -27.16986656188965, "global_step": 589488, "epoch": 7102} {"train_loss": -26.986576080322266, "global_step": 589489, "epoch": 7102} {"train_loss": -27.435165405273438, "global_step": 589490, "epoch": 7102} {"train_loss": -27.412954330444336, "global_step": 589491, "epoch": 7102} {"train_loss": -27.39539909362793, "global_step": 589492, "epoch": 7102} {"train_loss": -27.768310546875, "global_step": 589493, "epoch": 7102} {"train_loss": -27.108861923217773, "global_step": 589494, "epoch": 7102} {"train_loss": -27.45781898498535, "global_step": 589495, "epoch": 7102} {"train_loss": -27.276947021484375, "global_step": 589496, "epoch": 7102} {"train_loss": -27.39333152770996, "global_step": 589497, "epoch": 7102} {"train_loss": -27.52557945251465, "global_step": 589498, "epoch": 7102} {"train_loss": -27.572553634643555, "global_step": 589499, "epoch": 7102} {"train_loss": -27.683212280273438, "global_step": 589500, "epoch": 7102} {"train_loss": -27.647464752197266, "global_step": 589501, "epoch": 7102} {"train_loss": -27.546619415283203, "global_step": 589502, "epoch": 7102} {"train_loss": -27.680206298828125, "global_step": 589503, "epoch": 7102} {"train_loss": -28.021060943603516, "global_step": 589504, "epoch": 7102} {"train_loss": -27.841827392578125, "global_step": 589505, "epoch": 7102} {"train_loss": -27.544958114624023, "global_step": 589506, "epoch": 7102} {"train_loss": -27.6392822265625, "global_step": 589507, "epoch": 7102} {"train_loss": -27.871747970581055, "global_step": 589508, "epoch": 7102} {"train_loss": -27.73945426940918, "global_step": 589509, "epoch": 7102} {"train_loss": -27.839969635009766, "global_step": 589510, "epoch": 7102} {"train_loss": -28.023542404174805, "global_step": 589511, "epoch": 7102} {"train_loss": -27.62845230102539, "global_step": 589512, "epoch": 7102} {"train_loss": -27.646936416625977, "global_step": 589513, "epoch": 7102} {"train_loss": -27.724058151245117, "global_step": 589514, "epoch": 7102} {"train_loss": -27.93505859375, "global_step": 589515, "epoch": 7102} {"train_loss": -27.950653076171875, "global_step": 589516, "epoch": 7102} {"train_loss": -28.093774795532227, "global_step": 589517, "epoch": 7102} {"train_loss": -27.717987060546875, "global_step": 589518, "epoch": 7102} {"train_loss": -28.346195220947266, "global_step": 589519, "epoch": 7102} {"train_loss": -27.77617835998535, "global_step": 589520, "epoch": 7102} {"train_loss": -27.938312530517578, "global_step": 589521, "epoch": 7102} {"train_loss": -28.395483016967773, "global_step": 589522, "epoch": 7102} {"train_loss": -27.882246017456055, "global_step": 589523, "epoch": 7102} {"train_loss": -28.18109703063965, "global_step": 589524, "epoch": 7102} {"train_loss": -28.10798454284668, "global_step": 589525, "epoch": 7102} {"train_loss": -27.642608642578125, "global_step": 589526, "epoch": 7102} {"train_loss": -27.65167236328125, "global_step": 589527, "epoch": 7102} {"train_loss": -27.72190284729004, "global_step": 589528, "epoch": 7102} {"train_loss": -27.746051788330078, "global_step": 589529, "epoch": 7102} {"train_loss": -27.35886573791504, "global_step": 589530, "epoch": 7102} {"train_loss": -27.850147247314453, "global_step": 589531, "epoch": 7102} {"train_loss": -27.972553253173828, "global_step": 589532, "epoch": 7102} {"train_loss": -27.414289474487305, "global_step": 589533, "epoch": 7102} {"train_loss": -28.232030868530273, "global_step": 589534, "epoch": 7102} {"train_loss": -27.427215576171875, "global_step": 589535, "epoch": 7102} {"train_loss": -27.6595516204834, "global_step": 589536, "epoch": 7102} {"train_loss": -27.70849609375, "global_step": 589537, "epoch": 7102} {"train_loss": -27.56485366821289, "global_step": 589538, "epoch": 7102} {"train_loss": -28.04058265686035, "global_step": 589539, "epoch": 7102} {"train_loss": -27.807037353515625, "global_step": 589540, "epoch": 7102} {"train_loss": -28.014923095703125, "global_step": 589541, "epoch": 7102} {"train_loss": -27.861297607421875, "global_step": 589542, "epoch": 7102} {"train_loss": -28.180496215820312, "global_step": 589543, "epoch": 7102} {"train_loss": -27.7490234375, "global_step": 589544, "epoch": 7102} {"train_loss": -27.751514434814453, "global_step": 589545, "epoch": 7102} {"train_loss": -28.040063858032227, "global_step": 589546, "epoch": 7102} {"train_loss": -27.63315200805664, "global_step": 589547, "epoch": 7102} {"train_loss": -27.35633597316512, "global_step": 589548, "epoch": 7102, "val_loss": 6542654.0} {"train_loss": -27.78301429748535, "global_step": 589549, "epoch": 7103} {"train_loss": -27.61427879333496, "global_step": 589550, "epoch": 7103} {"train_loss": -27.437427520751953, "global_step": 589551, "epoch": 7103} {"train_loss": -27.490503311157227, "global_step": 589552, "epoch": 7103} {"train_loss": -27.827539443969727, "global_step": 589553, "epoch": 7103} {"train_loss": -27.846948623657227, "global_step": 589554, "epoch": 7103} {"train_loss": -27.466262817382812, "global_step": 589555, "epoch": 7103} {"train_loss": -27.92243003845215, "global_step": 589556, "epoch": 7103} {"train_loss": -27.348876953125, "global_step": 589557, "epoch": 7103} {"train_loss": -27.149616241455078, "global_step": 589558, "epoch": 7103} {"train_loss": -27.485010147094727, "global_step": 589559, "epoch": 7103} {"train_loss": -27.93023681640625, "global_step": 589560, "epoch": 7103} {"train_loss": -27.69428825378418, "global_step": 589561, "epoch": 7103} {"train_loss": -27.613849639892578, "global_step": 589562, "epoch": 7103} {"train_loss": -27.778949737548828, "global_step": 589563, "epoch": 7103} {"train_loss": -27.60249137878418, "global_step": 589564, "epoch": 7103} {"train_loss": -27.498584747314453, "global_step": 589565, "epoch": 7103} {"train_loss": -27.864959716796875, "global_step": 589566, "epoch": 7103} {"train_loss": -27.36280632019043, "global_step": 589567, "epoch": 7103} {"train_loss": -27.889862060546875, "global_step": 589568, "epoch": 7103} {"train_loss": -27.946958541870117, "global_step": 589569, "epoch": 7103} {"train_loss": -28.13716697692871, "global_step": 589570, "epoch": 7103} {"train_loss": -27.6236629486084, "global_step": 589571, "epoch": 7103} {"train_loss": -27.932876586914062, "global_step": 589572, "epoch": 7103} {"train_loss": -28.14234733581543, "global_step": 589573, "epoch": 7103} {"train_loss": -27.806198120117188, "global_step": 589574, "epoch": 7103} {"train_loss": -27.566370010375977, "global_step": 589575, "epoch": 7103} {"train_loss": -27.8181209564209, "global_step": 589576, "epoch": 7103} {"train_loss": -28.416959762573242, "global_step": 589577, "epoch": 7103} {"train_loss": -28.24395179748535, "global_step": 589578, "epoch": 7103} {"train_loss": -28.134571075439453, "global_step": 589579, "epoch": 7103} {"train_loss": -28.210866928100586, "global_step": 589580, "epoch": 7103} {"train_loss": -28.227298736572266, "global_step": 589581, "epoch": 7103} {"train_loss": -27.878692626953125, "global_step": 589582, "epoch": 7103} {"train_loss": -28.03775978088379, "global_step": 589583, "epoch": 7103} {"train_loss": -28.195297241210938, "global_step": 589584, "epoch": 7103} {"train_loss": -28.17734718322754, "global_step": 589585, "epoch": 7103} {"train_loss": -28.075260162353516, "global_step": 589586, "epoch": 7103} {"train_loss": -28.24234962463379, "global_step": 589587, "epoch": 7103} {"train_loss": -28.02621841430664, "global_step": 589588, "epoch": 7103} {"train_loss": -27.8842716217041, "global_step": 589589, "epoch": 7103} {"train_loss": -28.5284366607666, "global_step": 589590, "epoch": 7103} {"train_loss": -28.39960289001465, "global_step": 589591, "epoch": 7103} {"train_loss": -28.17868423461914, "global_step": 589592, "epoch": 7103} {"train_loss": -28.09738540649414, "global_step": 589593, "epoch": 7103} {"train_loss": -28.38577651977539, "global_step": 589594, "epoch": 7103} {"train_loss": -28.31689453125, "global_step": 589595, "epoch": 7103} {"train_loss": -28.232324600219727, "global_step": 589596, "epoch": 7103} {"train_loss": -27.937244415283203, "global_step": 589597, "epoch": 7103} {"train_loss": -28.29505729675293, "global_step": 589598, "epoch": 7103} {"train_loss": -27.768869400024414, "global_step": 589599, "epoch": 7103} {"train_loss": -27.46697998046875, "global_step": 589600, "epoch": 7103} {"train_loss": -27.5938663482666, "global_step": 589601, "epoch": 7103} {"train_loss": -27.28712272644043, "global_step": 589602, "epoch": 7103} {"train_loss": -26.188079833984375, "global_step": 589603, "epoch": 7103} {"train_loss": -26.1157283782959, "global_step": 589604, "epoch": 7103} {"train_loss": -27.456756591796875, "global_step": 589605, "epoch": 7103} {"train_loss": -27.520994186401367, "global_step": 589606, "epoch": 7103} {"train_loss": -27.541763305664062, "global_step": 589607, "epoch": 7103} {"train_loss": -27.70417594909668, "global_step": 589608, "epoch": 7103} {"train_loss": -27.6047420501709, "global_step": 589609, "epoch": 7103} {"train_loss": -27.607269287109375, "global_step": 589610, "epoch": 7103} {"train_loss": -28.04877281188965, "global_step": 589611, "epoch": 7103} {"train_loss": -27.531330108642578, "global_step": 589612, "epoch": 7103} {"train_loss": -27.623950958251953, "global_step": 589613, "epoch": 7103} {"train_loss": -27.846466064453125, "global_step": 589614, "epoch": 7103} {"train_loss": -27.84539222717285, "global_step": 589615, "epoch": 7103} {"train_loss": -27.7049617767334, "global_step": 589616, "epoch": 7103} {"train_loss": -27.665985107421875, "global_step": 589617, "epoch": 7103} {"train_loss": -27.991403579711914, "global_step": 589618, "epoch": 7103} {"train_loss": -27.532123565673828, "global_step": 589619, "epoch": 7103} {"train_loss": -27.891357421875, "global_step": 589620, "epoch": 7103} {"train_loss": -27.8004207611084, "global_step": 589621, "epoch": 7103} {"train_loss": -27.885955810546875, "global_step": 589622, "epoch": 7103} {"train_loss": -27.49798583984375, "global_step": 589623, "epoch": 7103} {"train_loss": -28.13922691345215, "global_step": 589624, "epoch": 7103} {"train_loss": -27.608795166015625, "global_step": 589625, "epoch": 7103} {"train_loss": -27.790998458862305, "global_step": 589626, "epoch": 7103} {"train_loss": -28.024763107299805, "global_step": 589627, "epoch": 7103} {"train_loss": -27.627099990844727, "global_step": 589628, "epoch": 7103} {"train_loss": -27.319793701171875, "global_step": 589629, "epoch": 7103} {"train_loss": -27.519927978515625, "global_step": 589630, "epoch": 7103} {"train_loss": -27.76625787206443, "global_step": 589631, "epoch": 7103, "val_loss": 6540786.0} {"train_loss": -25.503599166870117, "global_step": 589632, "epoch": 7104} {"train_loss": -26.614042282104492, "global_step": 589633, "epoch": 7104} {"train_loss": -26.383670806884766, "global_step": 589634, "epoch": 7104} {"train_loss": -26.429548263549805, "global_step": 589635, "epoch": 7104} {"train_loss": -27.06903076171875, "global_step": 589636, "epoch": 7104} {"train_loss": -26.416996002197266, "global_step": 589637, "epoch": 7104} {"train_loss": -26.596271514892578, "global_step": 589638, "epoch": 7104} {"train_loss": -26.295347213745117, "global_step": 589639, "epoch": 7104} {"train_loss": -26.960119247436523, "global_step": 589640, "epoch": 7104} {"train_loss": -26.044967651367188, "global_step": 589641, "epoch": 7104} {"train_loss": -26.950225830078125, "global_step": 589642, "epoch": 7104} {"train_loss": -27.04343605041504, "global_step": 589643, "epoch": 7104} {"train_loss": -26.85866355895996, "global_step": 589644, "epoch": 7104} {"train_loss": -26.830230712890625, "global_step": 589645, "epoch": 7104} {"train_loss": -27.406747817993164, "global_step": 589646, "epoch": 7104} {"train_loss": -27.367002487182617, "global_step": 589647, "epoch": 7104} {"train_loss": -26.825010299682617, "global_step": 589648, "epoch": 7104} {"train_loss": -27.48712158203125, "global_step": 589649, "epoch": 7104} {"train_loss": -27.239593505859375, "global_step": 589650, "epoch": 7104} {"train_loss": -27.25282096862793, "global_step": 589651, "epoch": 7104} {"train_loss": -27.247922897338867, "global_step": 589652, "epoch": 7104} {"train_loss": -27.443628311157227, "global_step": 589653, "epoch": 7104} {"train_loss": -27.37188720703125, "global_step": 589654, "epoch": 7104} {"train_loss": -27.35518455505371, "global_step": 589655, "epoch": 7104} {"train_loss": -27.586441040039062, "global_step": 589656, "epoch": 7104} {"train_loss": -27.44220542907715, "global_step": 589657, "epoch": 7104} {"train_loss": -27.566747665405273, "global_step": 589658, "epoch": 7104} {"train_loss": -27.844552993774414, "global_step": 589659, "epoch": 7104} {"train_loss": -27.585779190063477, "global_step": 589660, "epoch": 7104} {"train_loss": -27.733976364135742, "global_step": 589661, "epoch": 7104} {"train_loss": -27.804609298706055, "global_step": 589662, "epoch": 7104} {"train_loss": -28.005847930908203, "global_step": 589663, "epoch": 7104} {"train_loss": -28.360107421875, "global_step": 589664, "epoch": 7104} {"train_loss": -27.435895919799805, "global_step": 589665, "epoch": 7104} {"train_loss": -28.07500648498535, "global_step": 589666, "epoch": 7104} {"train_loss": -28.044687271118164, "global_step": 589667, "epoch": 7104} {"train_loss": -28.160663604736328, "global_step": 589668, "epoch": 7104} {"train_loss": -27.644662857055664, "global_step": 589669, "epoch": 7104} {"train_loss": -27.756855010986328, "global_step": 589670, "epoch": 7104} {"train_loss": -27.91826820373535, "global_step": 589671, "epoch": 7104} {"train_loss": -28.23151206970215, "global_step": 589672, "epoch": 7104} {"train_loss": -27.852798461914062, "global_step": 589673, "epoch": 7104} {"train_loss": -27.67291831970215, "global_step": 589674, "epoch": 7104} {"train_loss": -28.196197509765625, "global_step": 589675, "epoch": 7104} {"train_loss": -28.106298446655273, "global_step": 589676, "epoch": 7104} {"train_loss": -28.192907333374023, "global_step": 589677, "epoch": 7104} {"train_loss": -28.073102951049805, "global_step": 589678, "epoch": 7104} {"train_loss": -27.968027114868164, "global_step": 589679, "epoch": 7104} {"train_loss": -27.86067771911621, "global_step": 589680, "epoch": 7104} {"train_loss": -28.059112548828125, "global_step": 589681, "epoch": 7104} {"train_loss": -28.045995712280273, "global_step": 589682, "epoch": 7104} {"train_loss": -27.980310440063477, "global_step": 589683, "epoch": 7104} {"train_loss": -28.14784049987793, "global_step": 589684, "epoch": 7104} {"train_loss": -27.976917266845703, "global_step": 589685, "epoch": 7104} {"train_loss": -28.184890747070312, "global_step": 589686, "epoch": 7104} {"train_loss": -27.84919548034668, "global_step": 589687, "epoch": 7104} {"train_loss": -28.040130615234375, "global_step": 589688, "epoch": 7104} {"train_loss": -28.206762313842773, "global_step": 589689, "epoch": 7104} {"train_loss": -27.984073638916016, "global_step": 589690, "epoch": 7104} {"train_loss": -28.383758544921875, "global_step": 589691, "epoch": 7104} {"train_loss": -28.39349937438965, "global_step": 589692, "epoch": 7104} {"train_loss": -28.093994140625, "global_step": 589693, "epoch": 7104} {"train_loss": -28.364728927612305, "global_step": 589694, "epoch": 7104} {"train_loss": -28.091238021850586, "global_step": 589695, "epoch": 7104} {"train_loss": -27.96219253540039, "global_step": 589696, "epoch": 7104} {"train_loss": -28.34290885925293, "global_step": 589697, "epoch": 7104} {"train_loss": -28.13448143005371, "global_step": 589698, "epoch": 7104} {"train_loss": -27.959287643432617, "global_step": 589699, "epoch": 7104} {"train_loss": -28.522253036499023, "global_step": 589700, "epoch": 7104} {"train_loss": -27.98725700378418, "global_step": 589701, "epoch": 7104} {"train_loss": -28.02337074279785, "global_step": 589702, "epoch": 7104} {"train_loss": -27.806049346923828, "global_step": 589703, "epoch": 7104} {"train_loss": -27.990087509155273, "global_step": 589704, "epoch": 7104} {"train_loss": -27.981159210205078, "global_step": 589705, "epoch": 7104} {"train_loss": -27.910261154174805, "global_step": 589706, "epoch": 7104} {"train_loss": -27.648828506469727, "global_step": 589707, "epoch": 7104} {"train_loss": -27.503738403320312, "global_step": 589708, "epoch": 7104} {"train_loss": -27.65497398376465, "global_step": 589709, "epoch": 7104} {"train_loss": -27.60685157775879, "global_step": 589710, "epoch": 7104} {"train_loss": -27.389911651611328, "global_step": 589711, "epoch": 7104} {"train_loss": -27.69330406188965, "global_step": 589712, "epoch": 7104} {"train_loss": -27.62734031677246, "global_step": 589713, "epoch": 7104} {"train_loss": -27.625018200242376, "global_step": 589714, "epoch": 7104, "val_loss": 6516008.0} {"train_loss": -25.5214786529541, "global_step": 589715, "epoch": 7105} {"train_loss": -26.815587997436523, "global_step": 589716, "epoch": 7105} {"train_loss": -26.841039657592773, "global_step": 589717, "epoch": 7105} {"train_loss": -25.715444564819336, "global_step": 589718, "epoch": 7105} {"train_loss": -27.326431274414062, "global_step": 589719, "epoch": 7105} {"train_loss": -26.594436645507812, "global_step": 589720, "epoch": 7105} {"train_loss": -27.062179565429688, "global_step": 589721, "epoch": 7105} {"train_loss": -26.949003219604492, "global_step": 589722, "epoch": 7105} {"train_loss": -26.965641021728516, "global_step": 589723, "epoch": 7105} {"train_loss": -27.860427856445312, "global_step": 589724, "epoch": 7105} {"train_loss": -27.478515625, "global_step": 589725, "epoch": 7105} {"train_loss": -27.533447265625, "global_step": 589726, "epoch": 7105} {"train_loss": -27.408472061157227, "global_step": 589727, "epoch": 7105} {"train_loss": -27.257455825805664, "global_step": 589728, "epoch": 7105} {"train_loss": -27.597837448120117, "global_step": 589729, "epoch": 7105} {"train_loss": -27.31854248046875, "global_step": 589730, "epoch": 7105} {"train_loss": -27.540176391601562, "global_step": 589731, "epoch": 7105} {"train_loss": -27.37115478515625, "global_step": 589732, "epoch": 7105} {"train_loss": -27.59962272644043, "global_step": 589733, "epoch": 7105} {"train_loss": -27.525785446166992, "global_step": 589734, "epoch": 7105} {"train_loss": -27.303009033203125, "global_step": 589735, "epoch": 7105} {"train_loss": -27.359893798828125, "global_step": 589736, "epoch": 7105} {"train_loss": -27.69879150390625, "global_step": 589737, "epoch": 7105} {"train_loss": -27.78706169128418, "global_step": 589738, "epoch": 7105} {"train_loss": -27.723758697509766, "global_step": 589739, "epoch": 7105} {"train_loss": -27.566150665283203, "global_step": 589740, "epoch": 7105} {"train_loss": -27.30842399597168, "global_step": 589741, "epoch": 7105} {"train_loss": -27.594879150390625, "global_step": 589742, "epoch": 7105} {"train_loss": -27.855981826782227, "global_step": 589743, "epoch": 7105} {"train_loss": -27.303552627563477, "global_step": 589744, "epoch": 7105} {"train_loss": -27.760656356811523, "global_step": 589745, "epoch": 7105} {"train_loss": -27.833621978759766, "global_step": 589746, "epoch": 7105} {"train_loss": -27.9378604888916, "global_step": 589747, "epoch": 7105} {"train_loss": -27.455841064453125, "global_step": 589748, "epoch": 7105} {"train_loss": -27.83149528503418, "global_step": 589749, "epoch": 7105} {"train_loss": -27.834014892578125, "global_step": 589750, "epoch": 7105} {"train_loss": -27.99004554748535, "global_step": 589751, "epoch": 7105} {"train_loss": -28.22108268737793, "global_step": 589752, "epoch": 7105} {"train_loss": -28.008176803588867, "global_step": 589753, "epoch": 7105} {"train_loss": -27.7315616607666, "global_step": 589754, "epoch": 7105} {"train_loss": -27.74793815612793, "global_step": 589755, "epoch": 7105} {"train_loss": -27.9957218170166, "global_step": 589756, "epoch": 7105} {"train_loss": -28.08515739440918, "global_step": 589757, "epoch": 7105} {"train_loss": -28.239328384399414, "global_step": 589758, "epoch": 7105} {"train_loss": -28.047046661376953, "global_step": 589759, "epoch": 7105} {"train_loss": -27.941364288330078, "global_step": 589760, "epoch": 7105} {"train_loss": -28.245880126953125, "global_step": 589761, "epoch": 7105} {"train_loss": -27.840518951416016, "global_step": 589762, "epoch": 7105} {"train_loss": -28.093677520751953, "global_step": 589763, "epoch": 7105} {"train_loss": -28.12285804748535, "global_step": 589764, "epoch": 7105} {"train_loss": -28.00892448425293, "global_step": 589765, "epoch": 7105} {"train_loss": -27.64032554626465, "global_step": 589766, "epoch": 7105} {"train_loss": -27.986408233642578, "global_step": 589767, "epoch": 7105} {"train_loss": -27.998743057250977, "global_step": 589768, "epoch": 7105} {"train_loss": -28.22150993347168, "global_step": 589769, "epoch": 7105} {"train_loss": -27.619482040405273, "global_step": 589770, "epoch": 7105} {"train_loss": -27.917652130126953, "global_step": 589771, "epoch": 7105} {"train_loss": -28.091028213500977, "global_step": 589772, "epoch": 7105} {"train_loss": -28.05327796936035, "global_step": 589773, "epoch": 7105} {"train_loss": -27.918115615844727, "global_step": 589774, "epoch": 7105} {"train_loss": -27.447309494018555, "global_step": 589775, "epoch": 7105} {"train_loss": -27.753646850585938, "global_step": 589776, "epoch": 7105} {"train_loss": -27.636213302612305, "global_step": 589777, "epoch": 7105} {"train_loss": -28.061246871948242, "global_step": 589778, "epoch": 7105} {"train_loss": -28.06500816345215, "global_step": 589779, "epoch": 7105} {"train_loss": -27.873106002807617, "global_step": 589780, "epoch": 7105} {"train_loss": -28.101593017578125, "global_step": 589781, "epoch": 7105} {"train_loss": -27.945449829101562, "global_step": 589782, "epoch": 7105} {"train_loss": -28.2425594329834, "global_step": 589783, "epoch": 7105} {"train_loss": -28.192001342773438, "global_step": 589784, "epoch": 7105} {"train_loss": -28.1834774017334, "global_step": 589785, "epoch": 7105} {"train_loss": -27.928604125976562, "global_step": 589786, "epoch": 7105} {"train_loss": -27.759647369384766, "global_step": 589787, "epoch": 7105} {"train_loss": -28.142072677612305, "global_step": 589788, "epoch": 7105} {"train_loss": -27.781003952026367, "global_step": 589789, "epoch": 7105} {"train_loss": -28.110868453979492, "global_step": 589790, "epoch": 7105} {"train_loss": -27.900060653686523, "global_step": 589791, "epoch": 7105} {"train_loss": -28.22547721862793, "global_step": 589792, "epoch": 7105} {"train_loss": -27.93946647644043, "global_step": 589793, "epoch": 7105} {"train_loss": -28.3228702545166, "global_step": 589794, "epoch": 7105} {"train_loss": -28.11029624938965, "global_step": 589795, "epoch": 7105} {"train_loss": -28.229938507080078, "global_step": 589796, "epoch": 7105} {"train_loss": -27.702484475560937, "global_step": 589797, "epoch": 7105, "val_loss": 6620578.0} {"train_loss": -25.906599044799805, "global_step": 589798, "epoch": 7106} {"train_loss": -26.81744384765625, "global_step": 589799, "epoch": 7106} {"train_loss": -27.692550659179688, "global_step": 589800, "epoch": 7106} {"train_loss": -26.475940704345703, "global_step": 589801, "epoch": 7106} {"train_loss": -26.48410987854004, "global_step": 589802, "epoch": 7106} {"train_loss": -27.0809326171875, "global_step": 589803, "epoch": 7106} {"train_loss": -26.77414321899414, "global_step": 589804, "epoch": 7106} {"train_loss": -27.33584976196289, "global_step": 589805, "epoch": 7106} {"train_loss": -27.160886764526367, "global_step": 589806, "epoch": 7106} {"train_loss": -26.826934814453125, "global_step": 589807, "epoch": 7106} {"train_loss": -27.6173152923584, "global_step": 589808, "epoch": 7106} {"train_loss": -27.425153732299805, "global_step": 589809, "epoch": 7106} {"train_loss": -27.518823623657227, "global_step": 589810, "epoch": 7106} {"train_loss": -27.33082389831543, "global_step": 589811, "epoch": 7106} {"train_loss": -27.490478515625, "global_step": 589812, "epoch": 7106} {"train_loss": -27.222412109375, "global_step": 589813, "epoch": 7106} {"train_loss": -27.326251983642578, "global_step": 589814, "epoch": 7106} {"train_loss": -27.293506622314453, "global_step": 589815, "epoch": 7106} {"train_loss": -27.13018798828125, "global_step": 589816, "epoch": 7106} {"train_loss": -27.605484008789062, "global_step": 589817, "epoch": 7106} {"train_loss": -27.248870849609375, "global_step": 589818, "epoch": 7106} {"train_loss": -27.055212020874023, "global_step": 589819, "epoch": 7106} {"train_loss": -27.419294357299805, "global_step": 589820, "epoch": 7106} {"train_loss": -27.41410255432129, "global_step": 589821, "epoch": 7106} {"train_loss": -27.807464599609375, "global_step": 589822, "epoch": 7106} {"train_loss": -27.554636001586914, "global_step": 589823, "epoch": 7106} {"train_loss": -27.281030654907227, "global_step": 589824, "epoch": 7106} {"train_loss": -27.925817489624023, "global_step": 589825, "epoch": 7106} {"train_loss": -27.664844512939453, "global_step": 589826, "epoch": 7106} {"train_loss": -27.718128204345703, "global_step": 589827, "epoch": 7106} {"train_loss": -27.81692886352539, "global_step": 589828, "epoch": 7106} {"train_loss": -27.62882423400879, "global_step": 589829, "epoch": 7106} {"train_loss": -28.034027099609375, "global_step": 589830, "epoch": 7106} {"train_loss": -27.76871109008789, "global_step": 589831, "epoch": 7106} {"train_loss": -27.965408325195312, "global_step": 589832, "epoch": 7106} {"train_loss": -27.852466583251953, "global_step": 589833, "epoch": 7106} {"train_loss": -27.79799461364746, "global_step": 589834, "epoch": 7106} {"train_loss": -27.86992835998535, "global_step": 589835, "epoch": 7106} {"train_loss": -28.07879638671875, "global_step": 589836, "epoch": 7106} {"train_loss": -28.287017822265625, "global_step": 589837, "epoch": 7106} {"train_loss": -28.116409301757812, "global_step": 589838, "epoch": 7106} {"train_loss": -27.668607711791992, "global_step": 589839, "epoch": 7106} {"train_loss": -28.15386390686035, "global_step": 589840, "epoch": 7106} {"train_loss": -27.816537857055664, "global_step": 589841, "epoch": 7106} {"train_loss": -28.061996459960938, "global_step": 589842, "epoch": 7106} {"train_loss": -27.718366622924805, "global_step": 589843, "epoch": 7106} {"train_loss": -28.286535263061523, "global_step": 589844, "epoch": 7106} {"train_loss": -28.001264572143555, "global_step": 589845, "epoch": 7106} {"train_loss": -28.07318687438965, "global_step": 589846, "epoch": 7106} {"train_loss": -28.065353393554688, "global_step": 589847, "epoch": 7106} {"train_loss": -28.1264705657959, "global_step": 589848, "epoch": 7106} {"train_loss": -28.036733627319336, "global_step": 589849, "epoch": 7106} {"train_loss": -28.07806968688965, "global_step": 589850, "epoch": 7106} {"train_loss": -28.38685417175293, "global_step": 589851, "epoch": 7106} {"train_loss": -28.16737174987793, "global_step": 589852, "epoch": 7106} {"train_loss": -28.240442276000977, "global_step": 589853, "epoch": 7106} {"train_loss": -28.220258712768555, "global_step": 589854, "epoch": 7106} {"train_loss": -27.828336715698242, "global_step": 589855, "epoch": 7106} {"train_loss": -28.025333404541016, "global_step": 589856, "epoch": 7106} {"train_loss": -27.998044967651367, "global_step": 589857, "epoch": 7106} {"train_loss": -27.916858673095703, "global_step": 589858, "epoch": 7106} {"train_loss": -28.239709854125977, "global_step": 589859, "epoch": 7106} {"train_loss": -28.050058364868164, "global_step": 589860, "epoch": 7106} {"train_loss": -28.113086700439453, "global_step": 589861, "epoch": 7106} {"train_loss": -28.285877227783203, "global_step": 589862, "epoch": 7106} {"train_loss": -28.470001220703125, "global_step": 589863, "epoch": 7106} {"train_loss": -28.254810333251953, "global_step": 589864, "epoch": 7106} {"train_loss": -28.334680557250977, "global_step": 589865, "epoch": 7106} {"train_loss": -28.310016632080078, "global_step": 589866, "epoch": 7106} {"train_loss": -28.15462303161621, "global_step": 589867, "epoch": 7106} {"train_loss": -28.289365768432617, "global_step": 589868, "epoch": 7106} {"train_loss": -27.77919578552246, "global_step": 589869, "epoch": 7106} {"train_loss": -27.506696701049805, "global_step": 589870, "epoch": 7106} {"train_loss": -28.038339614868164, "global_step": 589871, "epoch": 7106} {"train_loss": -28.151403427124023, "global_step": 589872, "epoch": 7106} {"train_loss": -27.95136833190918, "global_step": 589873, "epoch": 7106} {"train_loss": -27.82321548461914, "global_step": 589874, "epoch": 7106} {"train_loss": -27.988143920898438, "global_step": 589875, "epoch": 7106} {"train_loss": -28.291385650634766, "global_step": 589876, "epoch": 7106} {"train_loss": -28.111896514892578, "global_step": 589877, "epoch": 7106} {"train_loss": -28.316909790039062, "global_step": 589878, "epoch": 7106} {"train_loss": -27.919696807861328, "global_step": 589879, "epoch": 7106} {"train_loss": -27.77101833849068, "global_step": 589880, "epoch": 7106, "val_loss": 6598272.5} {"train_loss": -27.05116844177246, "global_step": 589881, "epoch": 7107} {"train_loss": -25.337539672851562, "global_step": 589882, "epoch": 7107} {"train_loss": -27.104230880737305, "global_step": 589883, "epoch": 7107} {"train_loss": -26.249616622924805, "global_step": 589884, "epoch": 7107} {"train_loss": -26.824132919311523, "global_step": 589885, "epoch": 7107} {"train_loss": -26.265363693237305, "global_step": 589886, "epoch": 7107} {"train_loss": -27.371435165405273, "global_step": 589887, "epoch": 7107} {"train_loss": -26.629444122314453, "global_step": 589888, "epoch": 7107} {"train_loss": -26.878896713256836, "global_step": 589889, "epoch": 7107} {"train_loss": -27.116321563720703, "global_step": 589890, "epoch": 7107} {"train_loss": -27.08292579650879, "global_step": 589891, "epoch": 7107} {"train_loss": -27.458532333374023, "global_step": 589892, "epoch": 7107} {"train_loss": -27.36862564086914, "global_step": 589893, "epoch": 7107} {"train_loss": -27.278717041015625, "global_step": 589894, "epoch": 7107} {"train_loss": -26.879552841186523, "global_step": 589895, "epoch": 7107} {"train_loss": -27.536584854125977, "global_step": 589896, "epoch": 7107} {"train_loss": -27.64532470703125, "global_step": 589897, "epoch": 7107} {"train_loss": -27.226043701171875, "global_step": 589898, "epoch": 7107} {"train_loss": -27.389631271362305, "global_step": 589899, "epoch": 7107} {"train_loss": -27.50982666015625, "global_step": 589900, "epoch": 7107} {"train_loss": -27.11041259765625, "global_step": 589901, "epoch": 7107} {"train_loss": -27.70596694946289, "global_step": 589902, "epoch": 7107} {"train_loss": -27.62734031677246, "global_step": 589903, "epoch": 7107} {"train_loss": -27.28046989440918, "global_step": 589904, "epoch": 7107} {"train_loss": -27.278852462768555, "global_step": 589905, "epoch": 7107} {"train_loss": -27.78692054748535, "global_step": 589906, "epoch": 7107} {"train_loss": -27.857666015625, "global_step": 589907, "epoch": 7107} {"train_loss": -27.428258895874023, "global_step": 589908, "epoch": 7107} {"train_loss": -27.720483779907227, "global_step": 589909, "epoch": 7107} {"train_loss": -27.539779663085938, "global_step": 589910, "epoch": 7107} {"train_loss": -27.548419952392578, "global_step": 589911, "epoch": 7107} {"train_loss": -27.812902450561523, "global_step": 589912, "epoch": 7107} {"train_loss": -27.62955093383789, "global_step": 589913, "epoch": 7107} {"train_loss": -27.63157081604004, "global_step": 589914, "epoch": 7107} {"train_loss": -27.757190704345703, "global_step": 589915, "epoch": 7107} {"train_loss": -28.075347900390625, "global_step": 589916, "epoch": 7107} {"train_loss": -27.883102416992188, "global_step": 589917, "epoch": 7107} {"train_loss": -27.727563858032227, "global_step": 589918, "epoch": 7107} {"train_loss": -27.94797706604004, "global_step": 589919, "epoch": 7107} {"train_loss": -27.985193252563477, "global_step": 589920, "epoch": 7107} {"train_loss": -27.99909782409668, "global_step": 589921, "epoch": 7107} {"train_loss": -28.079008102416992, "global_step": 589922, "epoch": 7107} {"train_loss": -28.111602783203125, "global_step": 589923, "epoch": 7107} {"train_loss": -28.093591690063477, "global_step": 589924, "epoch": 7107} {"train_loss": -27.617807388305664, "global_step": 589925, "epoch": 7107} {"train_loss": -27.991804122924805, "global_step": 589926, "epoch": 7107} {"train_loss": -28.06556510925293, "global_step": 589927, "epoch": 7107} {"train_loss": -28.29511833190918, "global_step": 589928, "epoch": 7107} {"train_loss": -28.282779693603516, "global_step": 589929, "epoch": 7107} {"train_loss": -27.99072265625, "global_step": 589930, "epoch": 7107} {"train_loss": -27.9405574798584, "global_step": 589931, "epoch": 7107} {"train_loss": -28.236038208007812, "global_step": 589932, "epoch": 7107} {"train_loss": -28.12334632873535, "global_step": 589933, "epoch": 7107} {"train_loss": -28.0744571685791, "global_step": 589934, "epoch": 7107} {"train_loss": -28.227436065673828, "global_step": 589935, "epoch": 7107} {"train_loss": -28.31873893737793, "global_step": 589936, "epoch": 7107} {"train_loss": -28.107135772705078, "global_step": 589937, "epoch": 7107} {"train_loss": -27.96906089782715, "global_step": 589938, "epoch": 7107} {"train_loss": -27.812429428100586, "global_step": 589939, "epoch": 7107} {"train_loss": -27.774877548217773, "global_step": 589940, "epoch": 7107} {"train_loss": -28.00714683532715, "global_step": 589941, "epoch": 7107} {"train_loss": -27.7966365814209, "global_step": 589942, "epoch": 7107} {"train_loss": -28.027740478515625, "global_step": 589943, "epoch": 7107} {"train_loss": -28.13477897644043, "global_step": 589944, "epoch": 7107} {"train_loss": -28.158390045166016, "global_step": 589945, "epoch": 7107} {"train_loss": -28.27317237854004, "global_step": 589946, "epoch": 7107} {"train_loss": -28.26360511779785, "global_step": 589947, "epoch": 7107} {"train_loss": -28.20781898498535, "global_step": 589948, "epoch": 7107} {"train_loss": -27.944854736328125, "global_step": 589949, "epoch": 7107} {"train_loss": -28.021894454956055, "global_step": 589950, "epoch": 7107} {"train_loss": -27.864933013916016, "global_step": 589951, "epoch": 7107} {"train_loss": -28.125213623046875, "global_step": 589952, "epoch": 7107} {"train_loss": -28.0167179107666, "global_step": 589953, "epoch": 7107} {"train_loss": -27.636066436767578, "global_step": 589954, "epoch": 7107} {"train_loss": -27.49774169921875, "global_step": 589955, "epoch": 7107} {"train_loss": -27.5919246673584, "global_step": 589956, "epoch": 7107} {"train_loss": -27.967260360717773, "global_step": 589957, "epoch": 7107} {"train_loss": -27.82525062561035, "global_step": 589958, "epoch": 7107} {"train_loss": -27.363819122314453, "global_step": 589959, "epoch": 7107} {"train_loss": -27.966140747070312, "global_step": 589960, "epoch": 7107} {"train_loss": -28.244892120361328, "global_step": 589961, "epoch": 7107} {"train_loss": -27.349241256713867, "global_step": 589962, "epoch": 7107} {"train_loss": -27.676796350134424, "global_step": 589963, "epoch": 7107, "val_loss": 6519571.0} {"train_loss": -27.35107421875, "global_step": 589964, "epoch": 7108} {"train_loss": -27.602087020874023, "global_step": 589965, "epoch": 7108} {"train_loss": -27.85404396057129, "global_step": 589966, "epoch": 7108} {"train_loss": -27.590356826782227, "global_step": 589967, "epoch": 7108} {"train_loss": -27.26629066467285, "global_step": 589968, "epoch": 7108} {"train_loss": -27.87470817565918, "global_step": 589969, "epoch": 7108} {"train_loss": -27.51324462890625, "global_step": 589970, "epoch": 7108} {"train_loss": -27.72223472595215, "global_step": 589971, "epoch": 7108} {"train_loss": -27.290624618530273, "global_step": 589972, "epoch": 7108} {"train_loss": -27.664777755737305, "global_step": 589973, "epoch": 7108} {"train_loss": -27.821674346923828, "global_step": 589974, "epoch": 7108} {"train_loss": -27.76258659362793, "global_step": 589975, "epoch": 7108} {"train_loss": -27.246246337890625, "global_step": 589976, "epoch": 7108} {"train_loss": -27.24651527404785, "global_step": 589977, "epoch": 7108} {"train_loss": -27.4449520111084, "global_step": 589978, "epoch": 7108} {"train_loss": -28.03949546813965, "global_step": 589979, "epoch": 7108} {"train_loss": -27.3635311126709, "global_step": 589980, "epoch": 7108} {"train_loss": -27.873762130737305, "global_step": 589981, "epoch": 7108} {"train_loss": -27.81450843811035, "global_step": 589982, "epoch": 7108} {"train_loss": -27.656171798706055, "global_step": 589983, "epoch": 7108} {"train_loss": -27.835052490234375, "global_step": 589984, "epoch": 7108} {"train_loss": -27.70442008972168, "global_step": 589985, "epoch": 7108} {"train_loss": -27.943084716796875, "global_step": 589986, "epoch": 7108} {"train_loss": -27.73548698425293, "global_step": 589987, "epoch": 7108} {"train_loss": -27.67437171936035, "global_step": 589988, "epoch": 7108} {"train_loss": -27.958118438720703, "global_step": 589989, "epoch": 7108} {"train_loss": -27.84528160095215, "global_step": 589990, "epoch": 7108} {"train_loss": -27.666730880737305, "global_step": 589991, "epoch": 7108} {"train_loss": -27.672876358032227, "global_step": 589992, "epoch": 7108} {"train_loss": -27.936033248901367, "global_step": 589993, "epoch": 7108} {"train_loss": -27.767200469970703, "global_step": 589994, "epoch": 7108} {"train_loss": -28.36690330505371, "global_step": 589995, "epoch": 7108} {"train_loss": -27.687849044799805, "global_step": 589996, "epoch": 7108} {"train_loss": -28.155609130859375, "global_step": 589997, "epoch": 7108} {"train_loss": -27.989288330078125, "global_step": 589998, "epoch": 7108} {"train_loss": -27.8724308013916, "global_step": 589999, "epoch": 7108} {"train_loss": -27.500791549682617, "global_step": 590000, "epoch": 7108} {"train_loss": -27.665496826171875, "global_step": 590001, "epoch": 7108} {"train_loss": -28.187763214111328, "global_step": 590002, "epoch": 7108} {"train_loss": -27.95127296447754, "global_step": 590003, "epoch": 7108} {"train_loss": -27.43756103515625, "global_step": 590004, "epoch": 7108} {"train_loss": -28.4863338470459, "global_step": 590005, "epoch": 7108} {"train_loss": -27.671056747436523, "global_step": 590006, "epoch": 7108} {"train_loss": -27.732318878173828, "global_step": 590007, "epoch": 7108} {"train_loss": -28.137725830078125, "global_step": 590008, "epoch": 7108} {"train_loss": -28.112558364868164, "global_step": 590009, "epoch": 7108} {"train_loss": -28.39850425720215, "global_step": 590010, "epoch": 7108} {"train_loss": -28.391101837158203, "global_step": 590011, "epoch": 7108} {"train_loss": -28.093414306640625, "global_step": 590012, "epoch": 7108} {"train_loss": -28.08391761779785, "global_step": 590013, "epoch": 7108} {"train_loss": -28.1665096282959, "global_step": 590014, "epoch": 7108} {"train_loss": -28.035688400268555, "global_step": 590015, "epoch": 7108} {"train_loss": -28.441791534423828, "global_step": 590016, "epoch": 7108} {"train_loss": -27.940204620361328, "global_step": 590017, "epoch": 7108} {"train_loss": -28.316547393798828, "global_step": 590018, "epoch": 7108} {"train_loss": -28.05364990234375, "global_step": 590019, "epoch": 7108} {"train_loss": -28.350696563720703, "global_step": 590020, "epoch": 7108} {"train_loss": -28.769596099853516, "global_step": 590021, "epoch": 7108} {"train_loss": -28.3765869140625, "global_step": 590022, "epoch": 7108} {"train_loss": -28.09575843811035, "global_step": 590023, "epoch": 7108} {"train_loss": -28.4683780670166, "global_step": 590024, "epoch": 7108} {"train_loss": -28.403711318969727, "global_step": 590025, "epoch": 7108} {"train_loss": -28.35986328125, "global_step": 590026, "epoch": 7108} {"train_loss": -27.741376876831055, "global_step": 590027, "epoch": 7108} {"train_loss": -27.694263458251953, "global_step": 590028, "epoch": 7108} {"train_loss": -28.144393920898438, "global_step": 590029, "epoch": 7108} {"train_loss": -27.559412002563477, "global_step": 590030, "epoch": 7108} {"train_loss": -27.89056968688965, "global_step": 590031, "epoch": 7108} {"train_loss": -27.940155029296875, "global_step": 590032, "epoch": 7108} {"train_loss": -27.704633712768555, "global_step": 590033, "epoch": 7108} {"train_loss": -27.239959716796875, "global_step": 590034, "epoch": 7108} {"train_loss": -26.53948974609375, "global_step": 590035, "epoch": 7108} {"train_loss": -25.456623077392578, "global_step": 590036, "epoch": 7108} {"train_loss": -27.338611602783203, "global_step": 590037, "epoch": 7108} {"train_loss": -27.244369506835938, "global_step": 590038, "epoch": 7108} {"train_loss": -26.676162719726562, "global_step": 590039, "epoch": 7108} {"train_loss": -27.618026733398438, "global_step": 590040, "epoch": 7108} {"train_loss": -26.801105499267578, "global_step": 590041, "epoch": 7108} {"train_loss": -27.153467178344727, "global_step": 590042, "epoch": 7108} {"train_loss": -27.738513946533203, "global_step": 590043, "epoch": 7108} {"train_loss": -27.34478759765625, "global_step": 590044, "epoch": 7108} {"train_loss": -26.909503936767578, "global_step": 590045, "epoch": 7108} {"train_loss": -27.79477022929364, "global_step": 590046, "epoch": 7108, "val_loss": 6443037.0} {"train_loss": -23.687070846557617, "global_step": 590047, "epoch": 7109} {"train_loss": -25.548507690429688, "global_step": 590048, "epoch": 7109} {"train_loss": -25.07972526550293, "global_step": 590049, "epoch": 7109} {"train_loss": -25.90471839904785, "global_step": 590050, "epoch": 7109} {"train_loss": -24.905012130737305, "global_step": 590051, "epoch": 7109} {"train_loss": -26.121946334838867, "global_step": 590052, "epoch": 7109} {"train_loss": -26.24419593811035, "global_step": 590053, "epoch": 7109} {"train_loss": -26.09165382385254, "global_step": 590054, "epoch": 7109} {"train_loss": -26.132566452026367, "global_step": 590055, "epoch": 7109} {"train_loss": -26.871854782104492, "global_step": 590056, "epoch": 7109} {"train_loss": -26.221105575561523, "global_step": 590057, "epoch": 7109} {"train_loss": -26.391559600830078, "global_step": 590058, "epoch": 7109} {"train_loss": -26.562274932861328, "global_step": 590059, "epoch": 7109} {"train_loss": -26.923450469970703, "global_step": 590060, "epoch": 7109} {"train_loss": -26.432723999023438, "global_step": 590061, "epoch": 7109} {"train_loss": -26.306791305541992, "global_step": 590062, "epoch": 7109} {"train_loss": -27.046878814697266, "global_step": 590063, "epoch": 7109} {"train_loss": -27.068445205688477, "global_step": 590064, "epoch": 7109} {"train_loss": -27.114089965820312, "global_step": 590065, "epoch": 7109} {"train_loss": -26.500211715698242, "global_step": 590066, "epoch": 7109} {"train_loss": -26.88181495666504, "global_step": 590067, "epoch": 7109} {"train_loss": -27.189258575439453, "global_step": 590068, "epoch": 7109} {"train_loss": -27.03403663635254, "global_step": 590069, "epoch": 7109} {"train_loss": -27.250707626342773, "global_step": 590070, "epoch": 7109} {"train_loss": -27.004987716674805, "global_step": 590071, "epoch": 7109} {"train_loss": -27.153793334960938, "global_step": 590072, "epoch": 7109} {"train_loss": -27.239492416381836, "global_step": 590073, "epoch": 7109} {"train_loss": -27.096715927124023, "global_step": 590074, "epoch": 7109} {"train_loss": -27.755285263061523, "global_step": 590075, "epoch": 7109} {"train_loss": -27.2316837310791, "global_step": 590076, "epoch": 7109} {"train_loss": -27.492578506469727, "global_step": 590077, "epoch": 7109} {"train_loss": -27.463642120361328, "global_step": 590078, "epoch": 7109} {"train_loss": -27.515888214111328, "global_step": 590079, "epoch": 7109} {"train_loss": -27.612171173095703, "global_step": 590080, "epoch": 7109} {"train_loss": -27.19806480407715, "global_step": 590081, "epoch": 7109} {"train_loss": -27.493711471557617, "global_step": 590082, "epoch": 7109} {"train_loss": -27.41357421875, "global_step": 590083, "epoch": 7109} {"train_loss": -27.5238037109375, "global_step": 590084, "epoch": 7109} {"train_loss": -27.48371696472168, "global_step": 590085, "epoch": 7109} {"train_loss": -27.377338409423828, "global_step": 590086, "epoch": 7109} {"train_loss": -27.302961349487305, "global_step": 590087, "epoch": 7109} {"train_loss": -27.77842140197754, "global_step": 590088, "epoch": 7109} {"train_loss": -27.613605499267578, "global_step": 590089, "epoch": 7109} {"train_loss": -27.72344398498535, "global_step": 590090, "epoch": 7109} {"train_loss": -27.95399284362793, "global_step": 590091, "epoch": 7109} {"train_loss": -27.88624382019043, "global_step": 590092, "epoch": 7109} {"train_loss": -28.181486129760742, "global_step": 590093, "epoch": 7109} {"train_loss": -27.90937614440918, "global_step": 590094, "epoch": 7109} {"train_loss": -27.93499755859375, "global_step": 590095, "epoch": 7109} {"train_loss": -27.95926856994629, "global_step": 590096, "epoch": 7109} {"train_loss": -28.03937339782715, "global_step": 590097, "epoch": 7109} {"train_loss": -28.129852294921875, "global_step": 590098, "epoch": 7109} {"train_loss": -27.374439239501953, "global_step": 590099, "epoch": 7109} {"train_loss": -27.990076065063477, "global_step": 590100, "epoch": 7109} {"train_loss": -27.825199127197266, "global_step": 590101, "epoch": 7109} {"train_loss": -27.989715576171875, "global_step": 590102, "epoch": 7109} {"train_loss": -28.052160263061523, "global_step": 590103, "epoch": 7109} {"train_loss": -28.208036422729492, "global_step": 590104, "epoch": 7109} {"train_loss": -27.961353302001953, "global_step": 590105, "epoch": 7109} {"train_loss": -28.08914566040039, "global_step": 590106, "epoch": 7109} {"train_loss": -27.865619659423828, "global_step": 590107, "epoch": 7109} {"train_loss": -28.299976348876953, "global_step": 590108, "epoch": 7109} {"train_loss": -27.663496017456055, "global_step": 590109, "epoch": 7109} {"train_loss": -27.926910400390625, "global_step": 590110, "epoch": 7109} {"train_loss": -28.190160751342773, "global_step": 590111, "epoch": 7109} {"train_loss": -28.2786865234375, "global_step": 590112, "epoch": 7109} {"train_loss": -28.324848175048828, "global_step": 590113, "epoch": 7109} {"train_loss": -28.078693389892578, "global_step": 590114, "epoch": 7109} {"train_loss": -28.1614933013916, "global_step": 590115, "epoch": 7109} {"train_loss": -28.239990234375, "global_step": 590116, "epoch": 7109} {"train_loss": -28.182037353515625, "global_step": 590117, "epoch": 7109} {"train_loss": -28.084136962890625, "global_step": 590118, "epoch": 7109} {"train_loss": -28.12542152404785, "global_step": 590119, "epoch": 7109} {"train_loss": -28.23699378967285, "global_step": 590120, "epoch": 7109} {"train_loss": -28.359861373901367, "global_step": 590121, "epoch": 7109} {"train_loss": -27.933324813842773, "global_step": 590122, "epoch": 7109} {"train_loss": -27.959716796875, "global_step": 590123, "epoch": 7109} {"train_loss": -27.722009658813477, "global_step": 590124, "epoch": 7109} {"train_loss": -27.542770385742188, "global_step": 590125, "epoch": 7109} {"train_loss": -27.339740753173828, "global_step": 590126, "epoch": 7109} {"train_loss": -27.39063835144043, "global_step": 590127, "epoch": 7109} {"train_loss": -27.47894287109375, "global_step": 590128, "epoch": 7109} {"train_loss": -27.34535382741905, "global_step": 590129, "epoch": 7109, "val_loss": 6539575.0} {"train_loss": -27.237451553344727, "global_step": 590130, "epoch": 7110} {"train_loss": -26.368717193603516, "global_step": 590131, "epoch": 7110} {"train_loss": -26.1007137298584, "global_step": 590132, "epoch": 7110} {"train_loss": -27.335651397705078, "global_step": 590133, "epoch": 7110} {"train_loss": -27.050872802734375, "global_step": 590134, "epoch": 7110} {"train_loss": -26.573749542236328, "global_step": 590135, "epoch": 7110} {"train_loss": -26.981977462768555, "global_step": 590136, "epoch": 7110} {"train_loss": -26.9561710357666, "global_step": 590137, "epoch": 7110} {"train_loss": -27.537321090698242, "global_step": 590138, "epoch": 7110} {"train_loss": -27.170303344726562, "global_step": 590139, "epoch": 7110} {"train_loss": -27.147933959960938, "global_step": 590140, "epoch": 7110} {"train_loss": -27.51285743713379, "global_step": 590141, "epoch": 7110} {"train_loss": -27.392072677612305, "global_step": 590142, "epoch": 7110} {"train_loss": -27.439451217651367, "global_step": 590143, "epoch": 7110} {"train_loss": -27.587890625, "global_step": 590144, "epoch": 7110} {"train_loss": -27.45220375061035, "global_step": 590145, "epoch": 7110} {"train_loss": -27.57465171813965, "global_step": 590146, "epoch": 7110} {"train_loss": -27.620893478393555, "global_step": 590147, "epoch": 7110} {"train_loss": -27.852872848510742, "global_step": 590148, "epoch": 7110} {"train_loss": -27.656585693359375, "global_step": 590149, "epoch": 7110} {"train_loss": -27.441791534423828, "global_step": 590150, "epoch": 7110} {"train_loss": -27.778345108032227, "global_step": 590151, "epoch": 7110} {"train_loss": -27.521032333374023, "global_step": 590152, "epoch": 7110} {"train_loss": -26.92531394958496, "global_step": 590153, "epoch": 7110} {"train_loss": -27.807294845581055, "global_step": 590154, "epoch": 7110} {"train_loss": -27.744403839111328, "global_step": 590155, "epoch": 7110} {"train_loss": -27.631616592407227, "global_step": 590156, "epoch": 7110} {"train_loss": -27.34156608581543, "global_step": 590157, "epoch": 7110} {"train_loss": -27.583059310913086, "global_step": 590158, "epoch": 7110} {"train_loss": -27.833887100219727, "global_step": 590159, "epoch": 7110} {"train_loss": -27.580503463745117, "global_step": 590160, "epoch": 7110} {"train_loss": -27.441791534423828, "global_step": 590161, "epoch": 7110} {"train_loss": -27.762720108032227, "global_step": 590162, "epoch": 7110} {"train_loss": -27.65956687927246, "global_step": 590163, "epoch": 7110} {"train_loss": -27.73308753967285, "global_step": 590164, "epoch": 7110} {"train_loss": -27.541278839111328, "global_step": 590165, "epoch": 7110} {"train_loss": -27.867639541625977, "global_step": 590166, "epoch": 7110} {"train_loss": -27.88983726501465, "global_step": 590167, "epoch": 7110} {"train_loss": -27.834274291992188, "global_step": 590168, "epoch": 7110} {"train_loss": -28.1119441986084, "global_step": 590169, "epoch": 7110} {"train_loss": -27.669458389282227, "global_step": 590170, "epoch": 7110} {"train_loss": -27.715513229370117, "global_step": 590171, "epoch": 7110} {"train_loss": -28.042083740234375, "global_step": 590172, "epoch": 7110} {"train_loss": -27.889068603515625, "global_step": 590173, "epoch": 7110} {"train_loss": -27.8104248046875, "global_step": 590174, "epoch": 7110} {"train_loss": -27.889211654663086, "global_step": 590175, "epoch": 7110} {"train_loss": -28.29852867126465, "global_step": 590176, "epoch": 7110} {"train_loss": -28.0201473236084, "global_step": 590177, "epoch": 7110} {"train_loss": -28.14792823791504, "global_step": 590178, "epoch": 7110} {"train_loss": -28.208539962768555, "global_step": 590179, "epoch": 7110} {"train_loss": -28.128910064697266, "global_step": 590180, "epoch": 7110} {"train_loss": -28.201826095581055, "global_step": 590181, "epoch": 7110} {"train_loss": -28.110700607299805, "global_step": 590182, "epoch": 7110} {"train_loss": -28.293378829956055, "global_step": 590183, "epoch": 7110} {"train_loss": -28.417917251586914, "global_step": 590184, "epoch": 7110} {"train_loss": -28.07663345336914, "global_step": 590185, "epoch": 7110} {"train_loss": -28.066394805908203, "global_step": 590186, "epoch": 7110} {"train_loss": -27.94829750061035, "global_step": 590187, "epoch": 7110} {"train_loss": -28.20599365234375, "global_step": 590188, "epoch": 7110} {"train_loss": -28.198461532592773, "global_step": 590189, "epoch": 7110} {"train_loss": -28.046247482299805, "global_step": 590190, "epoch": 7110} {"train_loss": -28.121057510375977, "global_step": 590191, "epoch": 7110} {"train_loss": -27.84561538696289, "global_step": 590192, "epoch": 7110} {"train_loss": -27.777578353881836, "global_step": 590193, "epoch": 7110} {"train_loss": -27.8646240234375, "global_step": 590194, "epoch": 7110} {"train_loss": -28.408405303955078, "global_step": 590195, "epoch": 7110} {"train_loss": -28.284658432006836, "global_step": 590196, "epoch": 7110} {"train_loss": -28.0205020904541, "global_step": 590197, "epoch": 7110} {"train_loss": -28.30023765563965, "global_step": 590198, "epoch": 7110} {"train_loss": -28.088598251342773, "global_step": 590199, "epoch": 7110} {"train_loss": -28.143522262573242, "global_step": 590200, "epoch": 7110} {"train_loss": -28.111591339111328, "global_step": 590201, "epoch": 7110} {"train_loss": -27.977163314819336, "global_step": 590202, "epoch": 7110} {"train_loss": -28.43474769592285, "global_step": 590203, "epoch": 7110} {"train_loss": -28.50813102722168, "global_step": 590204, "epoch": 7110} {"train_loss": -28.417295455932617, "global_step": 590205, "epoch": 7110} {"train_loss": -28.448444366455078, "global_step": 590206, "epoch": 7110} {"train_loss": -28.684494018554688, "global_step": 590207, "epoch": 7110} {"train_loss": -28.384565353393555, "global_step": 590208, "epoch": 7110} {"train_loss": -28.74622917175293, "global_step": 590209, "epoch": 7110} {"train_loss": -28.37042808532715, "global_step": 590210, "epoch": 7110} {"train_loss": -28.313650131225586, "global_step": 590211, "epoch": 7110} {"train_loss": -27.801075556192053, "global_step": 590212, "epoch": 7110, "val_loss": 6582258.5} {"train_loss": -27.824676513671875, "global_step": 590213, "epoch": 7111} {"train_loss": -28.003049850463867, "global_step": 590214, "epoch": 7111} {"train_loss": -27.5072078704834, "global_step": 590215, "epoch": 7111} {"train_loss": -27.940298080444336, "global_step": 590216, "epoch": 7111} {"train_loss": -27.25394630432129, "global_step": 590217, "epoch": 7111} {"train_loss": -27.45306968688965, "global_step": 590218, "epoch": 7111} {"train_loss": -27.706623077392578, "global_step": 590219, "epoch": 7111} {"train_loss": -27.733564376831055, "global_step": 590220, "epoch": 7111} {"train_loss": -27.58124351501465, "global_step": 590221, "epoch": 7111} {"train_loss": -27.664594650268555, "global_step": 590222, "epoch": 7111} {"train_loss": -27.463171005249023, "global_step": 590223, "epoch": 7111} {"train_loss": -27.814558029174805, "global_step": 590224, "epoch": 7111} {"train_loss": -27.97772216796875, "global_step": 590225, "epoch": 7111} {"train_loss": -27.683889389038086, "global_step": 590226, "epoch": 7111} {"train_loss": -27.480728149414062, "global_step": 590227, "epoch": 7111} {"train_loss": -28.085590362548828, "global_step": 590228, "epoch": 7111} {"train_loss": -27.909521102905273, "global_step": 590229, "epoch": 7111} {"train_loss": -27.88704490661621, "global_step": 590230, "epoch": 7111} {"train_loss": -27.839963912963867, "global_step": 590231, "epoch": 7111} {"train_loss": -27.21600914001465, "global_step": 590232, "epoch": 7111} {"train_loss": -27.35481071472168, "global_step": 590233, "epoch": 7111} {"train_loss": -27.786808013916016, "global_step": 590234, "epoch": 7111} {"train_loss": -27.925281524658203, "global_step": 590235, "epoch": 7111} {"train_loss": -27.72321128845215, "global_step": 590236, "epoch": 7111} {"train_loss": -27.43157958984375, "global_step": 590237, "epoch": 7111} {"train_loss": -28.31235122680664, "global_step": 590238, "epoch": 7111} {"train_loss": -27.807947158813477, "global_step": 590239, "epoch": 7111} {"train_loss": -27.78980827331543, "global_step": 590240, "epoch": 7111} {"train_loss": -27.793338775634766, "global_step": 590241, "epoch": 7111} {"train_loss": -27.878637313842773, "global_step": 590242, "epoch": 7111} {"train_loss": -27.933889389038086, "global_step": 590243, "epoch": 7111} {"train_loss": -28.27842140197754, "global_step": 590244, "epoch": 7111} {"train_loss": -27.419294357299805, "global_step": 590245, "epoch": 7111} {"train_loss": -27.533859252929688, "global_step": 590246, "epoch": 7111} {"train_loss": -28.1524600982666, "global_step": 590247, "epoch": 7111} {"train_loss": -27.885305404663086, "global_step": 590248, "epoch": 7111} {"train_loss": -27.44904136657715, "global_step": 590249, "epoch": 7111} {"train_loss": -27.75418472290039, "global_step": 590250, "epoch": 7111} {"train_loss": -27.736608505249023, "global_step": 590251, "epoch": 7111} {"train_loss": -28.136804580688477, "global_step": 590252, "epoch": 7111} {"train_loss": -27.8115234375, "global_step": 590253, "epoch": 7111} {"train_loss": -27.653675079345703, "global_step": 590254, "epoch": 7111} {"train_loss": -27.423694610595703, "global_step": 590255, "epoch": 7111} {"train_loss": -27.946996688842773, "global_step": 590256, "epoch": 7111} {"train_loss": -27.717008590698242, "global_step": 590257, "epoch": 7111} {"train_loss": -27.856786727905273, "global_step": 590258, "epoch": 7111} {"train_loss": -27.895267486572266, "global_step": 590259, "epoch": 7111} {"train_loss": -28.2230224609375, "global_step": 590260, "epoch": 7111} {"train_loss": -27.98492431640625, "global_step": 590261, "epoch": 7111} {"train_loss": -27.92633056640625, "global_step": 590262, "epoch": 7111} {"train_loss": -27.65186882019043, "global_step": 590263, "epoch": 7111} {"train_loss": -27.85370445251465, "global_step": 590264, "epoch": 7111} {"train_loss": -28.087182998657227, "global_step": 590265, "epoch": 7111} {"train_loss": -28.04622459411621, "global_step": 590266, "epoch": 7111} {"train_loss": -28.040006637573242, "global_step": 590267, "epoch": 7111} {"train_loss": -28.233001708984375, "global_step": 590268, "epoch": 7111} {"train_loss": -28.063459396362305, "global_step": 590269, "epoch": 7111} {"train_loss": -28.13764762878418, "global_step": 590270, "epoch": 7111} {"train_loss": -28.09100341796875, "global_step": 590271, "epoch": 7111} {"train_loss": -28.34235954284668, "global_step": 590272, "epoch": 7111} {"train_loss": -28.39588737487793, "global_step": 590273, "epoch": 7111} {"train_loss": -28.00969886779785, "global_step": 590274, "epoch": 7111} {"train_loss": -28.297119140625, "global_step": 590275, "epoch": 7111} {"train_loss": -28.2729434967041, "global_step": 590276, "epoch": 7111} {"train_loss": -28.243112564086914, "global_step": 590277, "epoch": 7111} {"train_loss": -28.167896270751953, "global_step": 590278, "epoch": 7111} {"train_loss": -28.167341232299805, "global_step": 590279, "epoch": 7111} {"train_loss": -28.19339942932129, "global_step": 590280, "epoch": 7111} {"train_loss": -28.165510177612305, "global_step": 590281, "epoch": 7111} {"train_loss": -28.059314727783203, "global_step": 590282, "epoch": 7111} {"train_loss": -28.531757354736328, "global_step": 590283, "epoch": 7111} {"train_loss": -28.09468650817871, "global_step": 590284, "epoch": 7111} {"train_loss": -28.11331558227539, "global_step": 590285, "epoch": 7111} {"train_loss": -28.354124069213867, "global_step": 590286, "epoch": 7111} {"train_loss": -28.209287643432617, "global_step": 590287, "epoch": 7111} {"train_loss": -28.384902954101562, "global_step": 590288, "epoch": 7111} {"train_loss": -27.868549346923828, "global_step": 590289, "epoch": 7111} {"train_loss": -28.1190242767334, "global_step": 590290, "epoch": 7111} {"train_loss": -28.110803604125977, "global_step": 590291, "epoch": 7111} {"train_loss": -28.592243194580078, "global_step": 590292, "epoch": 7111} {"train_loss": -27.782453536987305, "global_step": 590293, "epoch": 7111} {"train_loss": -27.591114044189453, "global_step": 590294, "epoch": 7111} {"train_loss": -27.908454504357763, "global_step": 590295, "epoch": 7111, "val_loss": 6583425.5} {"train_loss": -26.386545181274414, "global_step": 590296, "epoch": 7112} {"train_loss": -26.316177368164062, "global_step": 590297, "epoch": 7112} {"train_loss": -27.24342155456543, "global_step": 590298, "epoch": 7112} {"train_loss": -27.395437240600586, "global_step": 590299, "epoch": 7112} {"train_loss": -26.68096351623535, "global_step": 590300, "epoch": 7112} {"train_loss": -27.71377944946289, "global_step": 590301, "epoch": 7112} {"train_loss": -27.467639923095703, "global_step": 590302, "epoch": 7112} {"train_loss": -27.579498291015625, "global_step": 590303, "epoch": 7112} {"train_loss": -27.498458862304688, "global_step": 590304, "epoch": 7112} {"train_loss": -27.764026641845703, "global_step": 590305, "epoch": 7112} {"train_loss": -27.512470245361328, "global_step": 590306, "epoch": 7112} {"train_loss": -28.162826538085938, "global_step": 590307, "epoch": 7112} {"train_loss": -27.43507194519043, "global_step": 590308, "epoch": 7112} {"train_loss": -27.970428466796875, "global_step": 590309, "epoch": 7112} {"train_loss": -27.860990524291992, "global_step": 590310, "epoch": 7112} {"train_loss": -27.922632217407227, "global_step": 590311, "epoch": 7112} {"train_loss": -27.682775497436523, "global_step": 590312, "epoch": 7112} {"train_loss": -27.78749656677246, "global_step": 590313, "epoch": 7112} {"train_loss": -27.788007736206055, "global_step": 590314, "epoch": 7112} {"train_loss": -27.348066329956055, "global_step": 590315, "epoch": 7112} {"train_loss": -27.5869197845459, "global_step": 590316, "epoch": 7112} {"train_loss": -27.789081573486328, "global_step": 590317, "epoch": 7112} {"train_loss": -28.093429565429688, "global_step": 590318, "epoch": 7112} {"train_loss": -28.010791778564453, "global_step": 590319, "epoch": 7112} {"train_loss": -27.940717697143555, "global_step": 590320, "epoch": 7112} {"train_loss": -27.59161949157715, "global_step": 590321, "epoch": 7112} {"train_loss": -27.270557403564453, "global_step": 590322, "epoch": 7112} {"train_loss": -28.01971435546875, "global_step": 590323, "epoch": 7112} {"train_loss": -27.938358306884766, "global_step": 590324, "epoch": 7112} {"train_loss": -27.634084701538086, "global_step": 590325, "epoch": 7112} {"train_loss": -27.841047286987305, "global_step": 590326, "epoch": 7112} {"train_loss": -28.089691162109375, "global_step": 590327, "epoch": 7112} {"train_loss": -27.43328285217285, "global_step": 590328, "epoch": 7112} {"train_loss": -27.908720016479492, "global_step": 590329, "epoch": 7112} {"train_loss": -27.687345504760742, "global_step": 590330, "epoch": 7112} {"train_loss": -27.95167350769043, "global_step": 590331, "epoch": 7112} {"train_loss": -28.160871505737305, "global_step": 590332, "epoch": 7112} {"train_loss": -27.710895538330078, "global_step": 590333, "epoch": 7112} {"train_loss": -28.068572998046875, "global_step": 590334, "epoch": 7112} {"train_loss": -27.432260513305664, "global_step": 590335, "epoch": 7112} {"train_loss": -27.896936416625977, "global_step": 590336, "epoch": 7112} {"train_loss": -27.629125595092773, "global_step": 590337, "epoch": 7112} {"train_loss": -27.935379028320312, "global_step": 590338, "epoch": 7112} {"train_loss": -28.092803955078125, "global_step": 590339, "epoch": 7112} {"train_loss": -27.998382568359375, "global_step": 590340, "epoch": 7112} {"train_loss": -27.78733253479004, "global_step": 590341, "epoch": 7112} {"train_loss": -28.17987632751465, "global_step": 590342, "epoch": 7112} {"train_loss": -28.0373477935791, "global_step": 590343, "epoch": 7112} {"train_loss": -27.863508224487305, "global_step": 590344, "epoch": 7112} {"train_loss": -28.01885414123535, "global_step": 590345, "epoch": 7112} {"train_loss": -28.209869384765625, "global_step": 590346, "epoch": 7112} {"train_loss": -28.08845329284668, "global_step": 590347, "epoch": 7112} {"train_loss": -27.75067710876465, "global_step": 590348, "epoch": 7112} {"train_loss": -27.85572624206543, "global_step": 590349, "epoch": 7112} {"train_loss": -27.861923217773438, "global_step": 590350, "epoch": 7112} {"train_loss": -28.25062370300293, "global_step": 590351, "epoch": 7112} {"train_loss": -27.502532958984375, "global_step": 590352, "epoch": 7112} {"train_loss": -27.678335189819336, "global_step": 590353, "epoch": 7112} {"train_loss": -27.649219512939453, "global_step": 590354, "epoch": 7112} {"train_loss": -27.744186401367188, "global_step": 590355, "epoch": 7112} {"train_loss": -27.94614601135254, "global_step": 590356, "epoch": 7112} {"train_loss": -28.1782169342041, "global_step": 590357, "epoch": 7112} {"train_loss": -27.98187828063965, "global_step": 590358, "epoch": 7112} {"train_loss": -27.955154418945312, "global_step": 590359, "epoch": 7112} {"train_loss": -27.874425888061523, "global_step": 590360, "epoch": 7112} {"train_loss": -28.027179718017578, "global_step": 590361, "epoch": 7112} {"train_loss": -27.86781120300293, "global_step": 590362, "epoch": 7112} {"train_loss": -28.012165069580078, "global_step": 590363, "epoch": 7112} {"train_loss": -27.80072021484375, "global_step": 590364, "epoch": 7112} {"train_loss": -27.995590209960938, "global_step": 590365, "epoch": 7112} {"train_loss": -27.719751358032227, "global_step": 590366, "epoch": 7112} {"train_loss": -28.504812240600586, "global_step": 590367, "epoch": 7112} {"train_loss": -28.221582412719727, "global_step": 590368, "epoch": 7112} {"train_loss": -28.298995971679688, "global_step": 590369, "epoch": 7112} {"train_loss": -27.918405532836914, "global_step": 590370, "epoch": 7112} {"train_loss": -28.008337020874023, "global_step": 590371, "epoch": 7112} {"train_loss": -27.79623794555664, "global_step": 590372, "epoch": 7112} {"train_loss": -26.890527725219727, "global_step": 590373, "epoch": 7112} {"train_loss": -26.788742065429688, "global_step": 590374, "epoch": 7112} {"train_loss": -27.80657386779785, "global_step": 590375, "epoch": 7112} {"train_loss": -28.2123966217041, "global_step": 590376, "epoch": 7112} {"train_loss": -27.444171905517578, "global_step": 590377, "epoch": 7112} {"train_loss": -27.753800725362385, "global_step": 590378, "epoch": 7112, "val_loss": 6568791.5} {"train_loss": -27.577198028564453, "global_step": 590379, "epoch": 7113} {"train_loss": -27.671045303344727, "global_step": 590380, "epoch": 7113} {"train_loss": -27.133493423461914, "global_step": 590381, "epoch": 7113} {"train_loss": -27.156225204467773, "global_step": 590382, "epoch": 7113} {"train_loss": -27.645246505737305, "global_step": 590383, "epoch": 7113} {"train_loss": -27.64491081237793, "global_step": 590384, "epoch": 7113} {"train_loss": -27.305255889892578, "global_step": 590385, "epoch": 7113} {"train_loss": -27.718158721923828, "global_step": 590386, "epoch": 7113} {"train_loss": -27.50381851196289, "global_step": 590387, "epoch": 7113} {"train_loss": -27.294178009033203, "global_step": 590388, "epoch": 7113} {"train_loss": -27.96253776550293, "global_step": 590389, "epoch": 7113} {"train_loss": -27.73291015625, "global_step": 590390, "epoch": 7113} {"train_loss": -27.48602867126465, "global_step": 590391, "epoch": 7113} {"train_loss": -27.52035903930664, "global_step": 590392, "epoch": 7113} {"train_loss": -27.396564483642578, "global_step": 590393, "epoch": 7113} {"train_loss": -27.698888778686523, "global_step": 590394, "epoch": 7113} {"train_loss": -27.276554107666016, "global_step": 590395, "epoch": 7113} {"train_loss": -27.770917892456055, "global_step": 590396, "epoch": 7113} {"train_loss": -27.574079513549805, "global_step": 590397, "epoch": 7113} {"train_loss": -27.786762237548828, "global_step": 590398, "epoch": 7113} {"train_loss": -27.734006881713867, "global_step": 590399, "epoch": 7113} {"train_loss": -27.599454879760742, "global_step": 590400, "epoch": 7113} {"train_loss": -27.627567291259766, "global_step": 590401, "epoch": 7113} {"train_loss": -28.11456871032715, "global_step": 590402, "epoch": 7113} {"train_loss": -27.43292236328125, "global_step": 590403, "epoch": 7113} {"train_loss": -27.92041015625, "global_step": 590404, "epoch": 7113} {"train_loss": -27.99114418029785, "global_step": 590405, "epoch": 7113} {"train_loss": -27.706893920898438, "global_step": 590406, "epoch": 7113} {"train_loss": -27.825336456298828, "global_step": 590407, "epoch": 7113} {"train_loss": -27.9977970123291, "global_step": 590408, "epoch": 7113} {"train_loss": -27.668317794799805, "global_step": 590409, "epoch": 7113} {"train_loss": -27.49286460876465, "global_step": 590410, "epoch": 7113} {"train_loss": -27.567813873291016, "global_step": 590411, "epoch": 7113} {"train_loss": -27.937376022338867, "global_step": 590412, "epoch": 7113} {"train_loss": -27.815631866455078, "global_step": 590413, "epoch": 7113} {"train_loss": -27.77277946472168, "global_step": 590414, "epoch": 7113} {"train_loss": -27.64297866821289, "global_step": 590415, "epoch": 7113} {"train_loss": -28.017440795898438, "global_step": 590416, "epoch": 7113} {"train_loss": -27.64375114440918, "global_step": 590417, "epoch": 7113} {"train_loss": -28.031763076782227, "global_step": 590418, "epoch": 7113} {"train_loss": -28.02570915222168, "global_step": 590419, "epoch": 7113} {"train_loss": -27.94423484802246, "global_step": 590420, "epoch": 7113} {"train_loss": -28.132394790649414, "global_step": 590421, "epoch": 7113} {"train_loss": -27.973539352416992, "global_step": 590422, "epoch": 7113} {"train_loss": -28.10116958618164, "global_step": 590423, "epoch": 7113} {"train_loss": -27.95929527282715, "global_step": 590424, "epoch": 7113} {"train_loss": -27.89277458190918, "global_step": 590425, "epoch": 7113} {"train_loss": -27.725849151611328, "global_step": 590426, "epoch": 7113} {"train_loss": -28.18561363220215, "global_step": 590427, "epoch": 7113} {"train_loss": -27.701257705688477, "global_step": 590428, "epoch": 7113} {"train_loss": -27.99655532836914, "global_step": 590429, "epoch": 7113} {"train_loss": -27.67689323425293, "global_step": 590430, "epoch": 7113} {"train_loss": -28.247827529907227, "global_step": 590431, "epoch": 7113} {"train_loss": -27.987897872924805, "global_step": 590432, "epoch": 7113} {"train_loss": -28.443347930908203, "global_step": 590433, "epoch": 7113} {"train_loss": -27.65797996520996, "global_step": 590434, "epoch": 7113} {"train_loss": -28.503665924072266, "global_step": 590435, "epoch": 7113} {"train_loss": -27.773040771484375, "global_step": 590436, "epoch": 7113} {"train_loss": -27.748350143432617, "global_step": 590437, "epoch": 7113} {"train_loss": -28.021238327026367, "global_step": 590438, "epoch": 7113} {"train_loss": -27.793136596679688, "global_step": 590439, "epoch": 7113} {"train_loss": -28.214263916015625, "global_step": 590440, "epoch": 7113} {"train_loss": -27.93706703186035, "global_step": 590441, "epoch": 7113} {"train_loss": -27.88385009765625, "global_step": 590442, "epoch": 7113} {"train_loss": -27.780176162719727, "global_step": 590443, "epoch": 7113} {"train_loss": -27.77039909362793, "global_step": 590444, "epoch": 7113} {"train_loss": -27.572101593017578, "global_step": 590445, "epoch": 7113} {"train_loss": -27.95110511779785, "global_step": 590446, "epoch": 7113} {"train_loss": -28.044321060180664, "global_step": 590447, "epoch": 7113} {"train_loss": -27.6968994140625, "global_step": 590448, "epoch": 7113} {"train_loss": -28.12533950805664, "global_step": 590449, "epoch": 7113} {"train_loss": -28.057968139648438, "global_step": 590450, "epoch": 7113} {"train_loss": -27.847394943237305, "global_step": 590451, "epoch": 7113} {"train_loss": -27.828153610229492, "global_step": 590452, "epoch": 7113} {"train_loss": -27.99526023864746, "global_step": 590453, "epoch": 7113} {"train_loss": -28.325153350830078, "global_step": 590454, "epoch": 7113} {"train_loss": -27.964176177978516, "global_step": 590455, "epoch": 7113} {"train_loss": -27.963592529296875, "global_step": 590456, "epoch": 7113} {"train_loss": -27.65203285217285, "global_step": 590457, "epoch": 7113} {"train_loss": -28.263031005859375, "global_step": 590458, "epoch": 7113} {"train_loss": -27.912778854370117, "global_step": 590459, "epoch": 7113} {"train_loss": -28.1109676361084, "global_step": 590460, "epoch": 7113} {"train_loss": -27.82472176149667, "global_step": 590461, "epoch": 7113, "val_loss": 6563799.0} {"train_loss": -26.966434478759766, "global_step": 590462, "epoch": 7114} {"train_loss": -26.647571563720703, "global_step": 590463, "epoch": 7114} {"train_loss": -27.074148178100586, "global_step": 590464, "epoch": 7114} {"train_loss": -27.688444137573242, "global_step": 590465, "epoch": 7114} {"train_loss": -26.948034286499023, "global_step": 590466, "epoch": 7114} {"train_loss": -27.60312843322754, "global_step": 590467, "epoch": 7114} {"train_loss": -26.807336807250977, "global_step": 590468, "epoch": 7114} {"train_loss": -27.103836059570312, "global_step": 590469, "epoch": 7114} {"train_loss": -27.54902458190918, "global_step": 590470, "epoch": 7114} {"train_loss": -26.484054565429688, "global_step": 590471, "epoch": 7114} {"train_loss": -27.032550811767578, "global_step": 590472, "epoch": 7114} {"train_loss": -27.424779891967773, "global_step": 590473, "epoch": 7114} {"train_loss": -26.963109970092773, "global_step": 590474, "epoch": 7114} {"train_loss": -27.028417587280273, "global_step": 590475, "epoch": 7114} {"train_loss": -27.01175880432129, "global_step": 590476, "epoch": 7114} {"train_loss": -27.832763671875, "global_step": 590477, "epoch": 7114} {"train_loss": -27.144392013549805, "global_step": 590478, "epoch": 7114} {"train_loss": -27.58349609375, "global_step": 590479, "epoch": 7114} {"train_loss": -27.136322021484375, "global_step": 590480, "epoch": 7114} {"train_loss": -27.58444595336914, "global_step": 590481, "epoch": 7114} {"train_loss": -27.34071922302246, "global_step": 590482, "epoch": 7114} {"train_loss": -27.158172607421875, "global_step": 590483, "epoch": 7114} {"train_loss": -27.283477783203125, "global_step": 590484, "epoch": 7114} {"train_loss": -27.474714279174805, "global_step": 590485, "epoch": 7114} {"train_loss": -27.423736572265625, "global_step": 590486, "epoch": 7114} {"train_loss": -27.615930557250977, "global_step": 590487, "epoch": 7114} {"train_loss": -27.3759822845459, "global_step": 590488, "epoch": 7114} {"train_loss": -27.591955184936523, "global_step": 590489, "epoch": 7114} {"train_loss": -27.615161895751953, "global_step": 590490, "epoch": 7114} {"train_loss": -27.332244873046875, "global_step": 590491, "epoch": 7114} {"train_loss": -27.570398330688477, "global_step": 590492, "epoch": 7114} {"train_loss": -28.075775146484375, "global_step": 590493, "epoch": 7114} {"train_loss": -27.525043487548828, "global_step": 590494, "epoch": 7114} {"train_loss": -27.819671630859375, "global_step": 590495, "epoch": 7114} {"train_loss": -27.72236442565918, "global_step": 590496, "epoch": 7114} {"train_loss": -27.909561157226562, "global_step": 590497, "epoch": 7114} {"train_loss": -27.84028434753418, "global_step": 590498, "epoch": 7114} {"train_loss": -27.8336238861084, "global_step": 590499, "epoch": 7114} {"train_loss": -27.9381160736084, "global_step": 590500, "epoch": 7114} {"train_loss": -28.241302490234375, "global_step": 590501, "epoch": 7114} {"train_loss": -28.10576820373535, "global_step": 590502, "epoch": 7114} {"train_loss": -28.21782875061035, "global_step": 590503, "epoch": 7114} {"train_loss": -28.0623836517334, "global_step": 590504, "epoch": 7114} {"train_loss": -27.560626983642578, "global_step": 590505, "epoch": 7114} {"train_loss": -27.993871688842773, "global_step": 590506, "epoch": 7114} {"train_loss": -28.070159912109375, "global_step": 590507, "epoch": 7114} {"train_loss": -28.12457275390625, "global_step": 590508, "epoch": 7114} {"train_loss": -27.964508056640625, "global_step": 590509, "epoch": 7114} {"train_loss": -28.020227432250977, "global_step": 590510, "epoch": 7114} {"train_loss": -27.887134552001953, "global_step": 590511, "epoch": 7114} {"train_loss": -28.03431510925293, "global_step": 590512, "epoch": 7114} {"train_loss": -27.8834285736084, "global_step": 590513, "epoch": 7114} {"train_loss": -28.017812728881836, "global_step": 590514, "epoch": 7114} {"train_loss": -27.9771671295166, "global_step": 590515, "epoch": 7114} {"train_loss": -28.411182403564453, "global_step": 590516, "epoch": 7114} {"train_loss": -27.948104858398438, "global_step": 590517, "epoch": 7114} {"train_loss": -28.309192657470703, "global_step": 590518, "epoch": 7114} {"train_loss": -28.302997589111328, "global_step": 590519, "epoch": 7114} {"train_loss": -28.451934814453125, "global_step": 590520, "epoch": 7114} {"train_loss": -28.1717529296875, "global_step": 590521, "epoch": 7114} {"train_loss": -28.0570068359375, "global_step": 590522, "epoch": 7114} {"train_loss": -28.100690841674805, "global_step": 590523, "epoch": 7114} {"train_loss": -28.15070915222168, "global_step": 590524, "epoch": 7114} {"train_loss": -28.03399085998535, "global_step": 590525, "epoch": 7114} {"train_loss": -28.055856704711914, "global_step": 590526, "epoch": 7114} {"train_loss": -28.241849899291992, "global_step": 590527, "epoch": 7114} {"train_loss": -28.15557861328125, "global_step": 590528, "epoch": 7114} {"train_loss": -28.156442642211914, "global_step": 590529, "epoch": 7114} {"train_loss": -27.742462158203125, "global_step": 590530, "epoch": 7114} {"train_loss": -26.917572021484375, "global_step": 590531, "epoch": 7114} {"train_loss": -27.27249526977539, "global_step": 590532, "epoch": 7114} {"train_loss": -27.912372589111328, "global_step": 590533, "epoch": 7114} {"train_loss": -28.070514678955078, "global_step": 590534, "epoch": 7114} {"train_loss": -27.439498901367188, "global_step": 590535, "epoch": 7114} {"train_loss": -27.866840362548828, "global_step": 590536, "epoch": 7114} {"train_loss": -28.233978271484375, "global_step": 590537, "epoch": 7114} {"train_loss": -28.0511531829834, "global_step": 590538, "epoch": 7114} {"train_loss": -28.10272216796875, "global_step": 590539, "epoch": 7114} {"train_loss": -27.9696102142334, "global_step": 590540, "epoch": 7114} {"train_loss": -27.785863876342773, "global_step": 590541, "epoch": 7114} {"train_loss": -27.632795333862305, "global_step": 590542, "epoch": 7114} {"train_loss": -28.0499267578125, "global_step": 590543, "epoch": 7114} {"train_loss": -27.71509694478598, "global_step": 590544, "epoch": 7114, "val_loss": 6570193.0} {"train_loss": -27.19422721862793, "global_step": 590545, "epoch": 7115} {"train_loss": -26.63701820373535, "global_step": 590546, "epoch": 7115} {"train_loss": -27.56711196899414, "global_step": 590547, "epoch": 7115} {"train_loss": -27.263776779174805, "global_step": 590548, "epoch": 7115} {"train_loss": -27.087488174438477, "global_step": 590549, "epoch": 7115} {"train_loss": -27.570043563842773, "global_step": 590550, "epoch": 7115} {"train_loss": -27.49600601196289, "global_step": 590551, "epoch": 7115} {"train_loss": -27.63397216796875, "global_step": 590552, "epoch": 7115} {"train_loss": -27.650121688842773, "global_step": 590553, "epoch": 7115} {"train_loss": -27.61616325378418, "global_step": 590554, "epoch": 7115} {"train_loss": -27.642065048217773, "global_step": 590555, "epoch": 7115} {"train_loss": -27.875885009765625, "global_step": 590556, "epoch": 7115} {"train_loss": -27.870758056640625, "global_step": 590557, "epoch": 7115} {"train_loss": -27.812936782836914, "global_step": 590558, "epoch": 7115} {"train_loss": -27.651355743408203, "global_step": 590559, "epoch": 7115} {"train_loss": -27.614850997924805, "global_step": 590560, "epoch": 7115} {"train_loss": -27.712646484375, "global_step": 590561, "epoch": 7115} {"train_loss": -27.8291072845459, "global_step": 590562, "epoch": 7115} {"train_loss": -28.261093139648438, "global_step": 590563, "epoch": 7115} {"train_loss": -27.77923011779785, "global_step": 590564, "epoch": 7115} {"train_loss": -27.9520206451416, "global_step": 590565, "epoch": 7115} {"train_loss": -28.06243324279785, "global_step": 590566, "epoch": 7115} {"train_loss": -27.98361587524414, "global_step": 590567, "epoch": 7115} {"train_loss": -27.97614860534668, "global_step": 590568, "epoch": 7115} {"train_loss": -27.729772567749023, "global_step": 590569, "epoch": 7115} {"train_loss": -27.79070472717285, "global_step": 590570, "epoch": 7115} {"train_loss": -27.939023971557617, "global_step": 590571, "epoch": 7115} {"train_loss": -28.006275177001953, "global_step": 590572, "epoch": 7115} {"train_loss": -28.237823486328125, "global_step": 590573, "epoch": 7115} {"train_loss": -28.07179069519043, "global_step": 590574, "epoch": 7115} {"train_loss": -28.272756576538086, "global_step": 590575, "epoch": 7115} {"train_loss": -27.82038688659668, "global_step": 590576, "epoch": 7115} {"train_loss": -28.011444091796875, "global_step": 590577, "epoch": 7115} {"train_loss": -28.087493896484375, "global_step": 590578, "epoch": 7115} {"train_loss": -27.946130752563477, "global_step": 590579, "epoch": 7115} {"train_loss": -28.34638023376465, "global_step": 590580, "epoch": 7115} {"train_loss": -28.138916015625, "global_step": 590581, "epoch": 7115} {"train_loss": -27.9266300201416, "global_step": 590582, "epoch": 7115} {"train_loss": -27.965198516845703, "global_step": 590583, "epoch": 7115} {"train_loss": -28.04401969909668, "global_step": 590584, "epoch": 7115} {"train_loss": -28.022729873657227, "global_step": 590585, "epoch": 7115} {"train_loss": -28.40279197692871, "global_step": 590586, "epoch": 7115} {"train_loss": -27.97671890258789, "global_step": 590587, "epoch": 7115} {"train_loss": -28.160810470581055, "global_step": 590588, "epoch": 7115} {"train_loss": -27.991104125976562, "global_step": 590589, "epoch": 7115} {"train_loss": -28.04792594909668, "global_step": 590590, "epoch": 7115} {"train_loss": -28.687387466430664, "global_step": 590591, "epoch": 7115} {"train_loss": -27.872684478759766, "global_step": 590592, "epoch": 7115} {"train_loss": -28.19048500061035, "global_step": 590593, "epoch": 7115} {"train_loss": -28.374332427978516, "global_step": 590594, "epoch": 7115} {"train_loss": -27.667089462280273, "global_step": 590595, "epoch": 7115} {"train_loss": -28.354450225830078, "global_step": 590596, "epoch": 7115} {"train_loss": -28.166555404663086, "global_step": 590597, "epoch": 7115} {"train_loss": -28.344236373901367, "global_step": 590598, "epoch": 7115} {"train_loss": -27.73917007446289, "global_step": 590599, "epoch": 7115} {"train_loss": -28.07185173034668, "global_step": 590600, "epoch": 7115} {"train_loss": -28.023544311523438, "global_step": 590601, "epoch": 7115} {"train_loss": -28.384939193725586, "global_step": 590602, "epoch": 7115} {"train_loss": -28.161209106445312, "global_step": 590603, "epoch": 7115} {"train_loss": -27.827016830444336, "global_step": 590604, "epoch": 7115} {"train_loss": -27.45428466796875, "global_step": 590605, "epoch": 7115} {"train_loss": -28.276391983032227, "global_step": 590606, "epoch": 7115} {"train_loss": -28.299331665039062, "global_step": 590607, "epoch": 7115} {"train_loss": -27.832799911499023, "global_step": 590608, "epoch": 7115} {"train_loss": -28.090045928955078, "global_step": 590609, "epoch": 7115} {"train_loss": -27.685209274291992, "global_step": 590610, "epoch": 7115} {"train_loss": -27.89700698852539, "global_step": 590611, "epoch": 7115} {"train_loss": -27.48919105529785, "global_step": 590612, "epoch": 7115} {"train_loss": -27.549406051635742, "global_step": 590613, "epoch": 7115} {"train_loss": -27.834699630737305, "global_step": 590614, "epoch": 7115} {"train_loss": -27.5364990234375, "global_step": 590615, "epoch": 7115} {"train_loss": -27.39093589782715, "global_step": 590616, "epoch": 7115} {"train_loss": -27.747039794921875, "global_step": 590617, "epoch": 7115} {"train_loss": -27.95600700378418, "global_step": 590618, "epoch": 7115} {"train_loss": -27.83799171447754, "global_step": 590619, "epoch": 7115} {"train_loss": -27.876708984375, "global_step": 590620, "epoch": 7115} {"train_loss": -27.819982528686523, "global_step": 590621, "epoch": 7115} {"train_loss": -28.009687423706055, "global_step": 590622, "epoch": 7115} {"train_loss": -27.53040885925293, "global_step": 590623, "epoch": 7115} {"train_loss": -27.456302642822266, "global_step": 590624, "epoch": 7115} {"train_loss": -27.850574493408203, "global_step": 590625, "epoch": 7115} {"train_loss": -27.266921997070312, "global_step": 590626, "epoch": 7115} {"train_loss": -27.85107755086508, "global_step": 590627, "epoch": 7115, "val_loss": 6528483.5} {"train_loss": -27.79266357421875, "global_step": 590628, "epoch": 7116} {"train_loss": -27.417652130126953, "global_step": 590629, "epoch": 7116} {"train_loss": -27.327163696289062, "global_step": 590630, "epoch": 7116} {"train_loss": -27.530353546142578, "global_step": 590631, "epoch": 7116} {"train_loss": -27.35841178894043, "global_step": 590632, "epoch": 7116} {"train_loss": -27.465076446533203, "global_step": 590633, "epoch": 7116} {"train_loss": -27.54412269592285, "global_step": 590634, "epoch": 7116} {"train_loss": -27.33053970336914, "global_step": 590635, "epoch": 7116} {"train_loss": -27.38807487487793, "global_step": 590636, "epoch": 7116} {"train_loss": -27.608469009399414, "global_step": 590637, "epoch": 7116} {"train_loss": -27.56927490234375, "global_step": 590638, "epoch": 7116} {"train_loss": -27.437671661376953, "global_step": 590639, "epoch": 7116} {"train_loss": -27.408002853393555, "global_step": 590640, "epoch": 7116} {"train_loss": -27.820022583007812, "global_step": 590641, "epoch": 7116} {"train_loss": -27.471277236938477, "global_step": 590642, "epoch": 7116} {"train_loss": -27.785131454467773, "global_step": 590643, "epoch": 7116} {"train_loss": -27.720703125, "global_step": 590644, "epoch": 7116} {"train_loss": -27.742727279663086, "global_step": 590645, "epoch": 7116} {"train_loss": -28.041213989257812, "global_step": 590646, "epoch": 7116} {"train_loss": -27.77385902404785, "global_step": 590647, "epoch": 7116} {"train_loss": -27.889087677001953, "global_step": 590648, "epoch": 7116} {"train_loss": -27.792652130126953, "global_step": 590649, "epoch": 7116} {"train_loss": -27.647571563720703, "global_step": 590650, "epoch": 7116} {"train_loss": -28.02449607849121, "global_step": 590651, "epoch": 7116} {"train_loss": -28.049158096313477, "global_step": 590652, "epoch": 7116} {"train_loss": -27.774198532104492, "global_step": 590653, "epoch": 7116} {"train_loss": -28.408004760742188, "global_step": 590654, "epoch": 7116} {"train_loss": -27.679651260375977, "global_step": 590655, "epoch": 7116} {"train_loss": -28.22379493713379, "global_step": 590656, "epoch": 7116} {"train_loss": -28.277490615844727, "global_step": 590657, "epoch": 7116} {"train_loss": -27.918561935424805, "global_step": 590658, "epoch": 7116} {"train_loss": -27.905689239501953, "global_step": 590659, "epoch": 7116} {"train_loss": -27.934223175048828, "global_step": 590660, "epoch": 7116} {"train_loss": -27.825031280517578, "global_step": 590661, "epoch": 7116} {"train_loss": -27.61590576171875, "global_step": 590662, "epoch": 7116} {"train_loss": -28.201566696166992, "global_step": 590663, "epoch": 7116} {"train_loss": -27.752470016479492, "global_step": 590664, "epoch": 7116} {"train_loss": -27.72773551940918, "global_step": 590665, "epoch": 7116} {"train_loss": -27.812225341796875, "global_step": 590666, "epoch": 7116} {"train_loss": -28.336883544921875, "global_step": 590667, "epoch": 7116} {"train_loss": -27.911828994750977, "global_step": 590668, "epoch": 7116} {"train_loss": -28.183027267456055, "global_step": 590669, "epoch": 7116} {"train_loss": -28.20235252380371, "global_step": 590670, "epoch": 7116} {"train_loss": -27.686065673828125, "global_step": 590671, "epoch": 7116} {"train_loss": -28.018817901611328, "global_step": 590672, "epoch": 7116} {"train_loss": -27.84368324279785, "global_step": 590673, "epoch": 7116} {"train_loss": -27.948923110961914, "global_step": 590674, "epoch": 7116} {"train_loss": -28.085041046142578, "global_step": 590675, "epoch": 7116} {"train_loss": -27.994495391845703, "global_step": 590676, "epoch": 7116} {"train_loss": -28.251739501953125, "global_step": 590677, "epoch": 7116} {"train_loss": -28.076879501342773, "global_step": 590678, "epoch": 7116} {"train_loss": -28.2598876953125, "global_step": 590679, "epoch": 7116} {"train_loss": -28.2082462310791, "global_step": 590680, "epoch": 7116} {"train_loss": -28.384475708007812, "global_step": 590681, "epoch": 7116} {"train_loss": -28.05735206604004, "global_step": 590682, "epoch": 7116} {"train_loss": -27.916563034057617, "global_step": 590683, "epoch": 7116} {"train_loss": -28.24566078186035, "global_step": 590684, "epoch": 7116} {"train_loss": -28.245145797729492, "global_step": 590685, "epoch": 7116} {"train_loss": -27.571645736694336, "global_step": 590686, "epoch": 7116} {"train_loss": -27.83314323425293, "global_step": 590687, "epoch": 7116} {"train_loss": -28.202362060546875, "global_step": 590688, "epoch": 7116} {"train_loss": -28.13886070251465, "global_step": 590689, "epoch": 7116} {"train_loss": -28.01905632019043, "global_step": 590690, "epoch": 7116} {"train_loss": -28.029571533203125, "global_step": 590691, "epoch": 7116} {"train_loss": -27.974273681640625, "global_step": 590692, "epoch": 7116} {"train_loss": -28.3078556060791, "global_step": 590693, "epoch": 7116} {"train_loss": -27.9085693359375, "global_step": 590694, "epoch": 7116} {"train_loss": -27.474231719970703, "global_step": 590695, "epoch": 7116} {"train_loss": -28.10690689086914, "global_step": 590696, "epoch": 7116} {"train_loss": -28.0197696685791, "global_step": 590697, "epoch": 7116} {"train_loss": -27.99664306640625, "global_step": 590698, "epoch": 7116} {"train_loss": -27.61821937561035, "global_step": 590699, "epoch": 7116} {"train_loss": -27.517780303955078, "global_step": 590700, "epoch": 7116} {"train_loss": -27.814924240112305, "global_step": 590701, "epoch": 7116} {"train_loss": -27.85357666015625, "global_step": 590702, "epoch": 7116} {"train_loss": -28.320484161376953, "global_step": 590703, "epoch": 7116} {"train_loss": -28.051427841186523, "global_step": 590704, "epoch": 7116} {"train_loss": -27.81404685974121, "global_step": 590705, "epoch": 7116} {"train_loss": -28.19563102722168, "global_step": 590706, "epoch": 7116} {"train_loss": -27.875308990478516, "global_step": 590707, "epoch": 7116} {"train_loss": -27.792821884155273, "global_step": 590708, "epoch": 7116} {"train_loss": -27.655868530273438, "global_step": 590709, "epoch": 7116} {"train_loss": -27.878866839121624, "global_step": 590710, "epoch": 7116, "val_loss": 6599168.0} {"train_loss": -27.435577392578125, "global_step": 590711, "epoch": 7117} {"train_loss": -27.32712173461914, "global_step": 590712, "epoch": 7117} {"train_loss": -26.52984046936035, "global_step": 590713, "epoch": 7117} {"train_loss": -27.063520431518555, "global_step": 590714, "epoch": 7117} {"train_loss": -26.97808265686035, "global_step": 590715, "epoch": 7117} {"train_loss": -26.58196449279785, "global_step": 590716, "epoch": 7117} {"train_loss": -27.129072189331055, "global_step": 590717, "epoch": 7117} {"train_loss": -27.09705924987793, "global_step": 590718, "epoch": 7117} {"train_loss": -27.21685218811035, "global_step": 590719, "epoch": 7117} {"train_loss": -27.5565242767334, "global_step": 590720, "epoch": 7117} {"train_loss": -27.349597930908203, "global_step": 590721, "epoch": 7117} {"train_loss": -27.22492790222168, "global_step": 590722, "epoch": 7117} {"train_loss": -27.412906646728516, "global_step": 590723, "epoch": 7117} {"train_loss": -27.577070236206055, "global_step": 590724, "epoch": 7117} {"train_loss": -27.211896896362305, "global_step": 590725, "epoch": 7117} {"train_loss": -27.89261817932129, "global_step": 590726, "epoch": 7117} {"train_loss": -27.377431869506836, "global_step": 590727, "epoch": 7117} {"train_loss": -27.735586166381836, "global_step": 590728, "epoch": 7117} {"train_loss": -27.518972396850586, "global_step": 590729, "epoch": 7117} {"train_loss": -28.195343017578125, "global_step": 590730, "epoch": 7117} {"train_loss": -27.94999122619629, "global_step": 590731, "epoch": 7117} {"train_loss": -27.580102920532227, "global_step": 590732, "epoch": 7117} {"train_loss": -27.83637046813965, "global_step": 590733, "epoch": 7117} {"train_loss": -28.004108428955078, "global_step": 590734, "epoch": 7117} {"train_loss": -27.6395320892334, "global_step": 590735, "epoch": 7117} {"train_loss": -27.909223556518555, "global_step": 590736, "epoch": 7117} {"train_loss": -28.32159423828125, "global_step": 590737, "epoch": 7117} {"train_loss": -28.081897735595703, "global_step": 590738, "epoch": 7117} {"train_loss": -27.914854049682617, "global_step": 590739, "epoch": 7117} {"train_loss": -27.94254493713379, "global_step": 590740, "epoch": 7117} {"train_loss": -28.073272705078125, "global_step": 590741, "epoch": 7117} {"train_loss": -27.852025985717773, "global_step": 590742, "epoch": 7117} {"train_loss": -28.147668838500977, "global_step": 590743, "epoch": 7117} {"train_loss": -27.72572898864746, "global_step": 590744, "epoch": 7117} {"train_loss": -27.904199600219727, "global_step": 590745, "epoch": 7117} {"train_loss": -27.777795791625977, "global_step": 590746, "epoch": 7117} {"train_loss": -27.971704483032227, "global_step": 590747, "epoch": 7117} {"train_loss": -28.078405380249023, "global_step": 590748, "epoch": 7117} {"train_loss": -28.287311553955078, "global_step": 590749, "epoch": 7117} {"train_loss": -28.32979393005371, "global_step": 590750, "epoch": 7117} {"train_loss": -28.352569580078125, "global_step": 590751, "epoch": 7117} {"train_loss": -27.863584518432617, "global_step": 590752, "epoch": 7117} {"train_loss": -28.27521324157715, "global_step": 590753, "epoch": 7117} {"train_loss": -28.1129093170166, "global_step": 590754, "epoch": 7117} {"train_loss": -28.349882125854492, "global_step": 590755, "epoch": 7117} {"train_loss": -28.232324600219727, "global_step": 590756, "epoch": 7117} {"train_loss": -28.10999870300293, "global_step": 590757, "epoch": 7117} {"train_loss": -27.950428009033203, "global_step": 590758, "epoch": 7117} {"train_loss": -28.13114356994629, "global_step": 590759, "epoch": 7117} {"train_loss": -28.248580932617188, "global_step": 590760, "epoch": 7117} {"train_loss": -28.518402099609375, "global_step": 590761, "epoch": 7117} {"train_loss": -28.002958297729492, "global_step": 590762, "epoch": 7117} {"train_loss": -28.421411514282227, "global_step": 590763, "epoch": 7117} {"train_loss": -27.87636375427246, "global_step": 590764, "epoch": 7117} {"train_loss": -28.197925567626953, "global_step": 590765, "epoch": 7117} {"train_loss": -28.204547882080078, "global_step": 590766, "epoch": 7117} {"train_loss": -28.177621841430664, "global_step": 590767, "epoch": 7117} {"train_loss": -28.001739501953125, "global_step": 590768, "epoch": 7117} {"train_loss": -28.08827018737793, "global_step": 590769, "epoch": 7117} {"train_loss": -28.184263229370117, "global_step": 590770, "epoch": 7117} {"train_loss": -28.55314064025879, "global_step": 590771, "epoch": 7117} {"train_loss": -27.89283561706543, "global_step": 590772, "epoch": 7117} {"train_loss": -27.86052894592285, "global_step": 590773, "epoch": 7117} {"train_loss": -27.95342445373535, "global_step": 590774, "epoch": 7117} {"train_loss": -28.161914825439453, "global_step": 590775, "epoch": 7117} {"train_loss": -28.237634658813477, "global_step": 590776, "epoch": 7117} {"train_loss": -27.64173698425293, "global_step": 590777, "epoch": 7117} {"train_loss": -27.63349723815918, "global_step": 590778, "epoch": 7117} {"train_loss": -27.690977096557617, "global_step": 590779, "epoch": 7117} {"train_loss": -27.20709800720215, "global_step": 590780, "epoch": 7117} {"train_loss": -27.179218292236328, "global_step": 590781, "epoch": 7117} {"train_loss": -26.477691650390625, "global_step": 590782, "epoch": 7117} {"train_loss": -27.065109252929688, "global_step": 590783, "epoch": 7117} {"train_loss": -27.999927520751953, "global_step": 590784, "epoch": 7117} {"train_loss": -27.028043746948242, "global_step": 590785, "epoch": 7117} {"train_loss": -27.318729400634766, "global_step": 590786, "epoch": 7117} {"train_loss": -27.663904190063477, "global_step": 590787, "epoch": 7117} {"train_loss": -27.200719833374023, "global_step": 590788, "epoch": 7117} {"train_loss": -27.72719383239746, "global_step": 590789, "epoch": 7117} {"train_loss": -27.58978843688965, "global_step": 590790, "epoch": 7117} {"train_loss": -27.943679809570312, "global_step": 590791, "epoch": 7117} {"train_loss": -27.64089012145996, "global_step": 590792, "epoch": 7117} {"train_loss": -27.78662784990058, "global_step": 590793, "epoch": 7117, "val_loss": 6551507.0} {"train_loss": -27.583938598632812, "global_step": 590794, "epoch": 7118} {"train_loss": -27.378759384155273, "global_step": 590795, "epoch": 7118} {"train_loss": -27.743000030517578, "global_step": 590796, "epoch": 7118} {"train_loss": -27.306081771850586, "global_step": 590797, "epoch": 7118} {"train_loss": -28.101179122924805, "global_step": 590798, "epoch": 7118} {"train_loss": -27.405582427978516, "global_step": 590799, "epoch": 7118} {"train_loss": -27.55560302734375, "global_step": 590800, "epoch": 7118} {"train_loss": -27.939563751220703, "global_step": 590801, "epoch": 7118} {"train_loss": -27.511829376220703, "global_step": 590802, "epoch": 7118} {"train_loss": -27.87647819519043, "global_step": 590803, "epoch": 7118} {"train_loss": -27.71571159362793, "global_step": 590804, "epoch": 7118} {"train_loss": -27.945165634155273, "global_step": 590805, "epoch": 7118} {"train_loss": -27.476049423217773, "global_step": 590806, "epoch": 7118} {"train_loss": -27.70218849182129, "global_step": 590807, "epoch": 7118} {"train_loss": -27.652347564697266, "global_step": 590808, "epoch": 7118} {"train_loss": -27.4018611907959, "global_step": 590809, "epoch": 7118} {"train_loss": -27.763853073120117, "global_step": 590810, "epoch": 7118} {"train_loss": -27.891666412353516, "global_step": 590811, "epoch": 7118} {"train_loss": -28.113012313842773, "global_step": 590812, "epoch": 7118} {"train_loss": -27.94069480895996, "global_step": 590813, "epoch": 7118} {"train_loss": -27.528974533081055, "global_step": 590814, "epoch": 7118} {"train_loss": -27.47174644470215, "global_step": 590815, "epoch": 7118} {"train_loss": -27.32086753845215, "global_step": 590816, "epoch": 7118} {"train_loss": -27.051513671875, "global_step": 590817, "epoch": 7118} {"train_loss": -27.25015640258789, "global_step": 590818, "epoch": 7118} {"train_loss": -28.092578887939453, "global_step": 590819, "epoch": 7118} {"train_loss": -27.696287155151367, "global_step": 590820, "epoch": 7118} {"train_loss": -27.7148380279541, "global_step": 590821, "epoch": 7118} {"train_loss": -27.922250747680664, "global_step": 590822, "epoch": 7118} {"train_loss": -27.75516128540039, "global_step": 590823, "epoch": 7118} {"train_loss": -28.079303741455078, "global_step": 590824, "epoch": 7118} {"train_loss": -27.980615615844727, "global_step": 590825, "epoch": 7118} {"train_loss": -28.09503173828125, "global_step": 590826, "epoch": 7118} {"train_loss": -27.82368278503418, "global_step": 590827, "epoch": 7118} {"train_loss": -28.263898849487305, "global_step": 590828, "epoch": 7118} {"train_loss": -27.877099990844727, "global_step": 590829, "epoch": 7118} {"train_loss": -28.356958389282227, "global_step": 590830, "epoch": 7118} {"train_loss": -27.807865142822266, "global_step": 590831, "epoch": 7118} {"train_loss": -28.166248321533203, "global_step": 590832, "epoch": 7118} {"train_loss": -28.102842330932617, "global_step": 590833, "epoch": 7118} {"train_loss": -28.1673526763916, "global_step": 590834, "epoch": 7118} {"train_loss": -27.99905776977539, "global_step": 590835, "epoch": 7118} {"train_loss": -28.24004554748535, "global_step": 590836, "epoch": 7118} {"train_loss": -27.87147331237793, "global_step": 590837, "epoch": 7118} {"train_loss": -28.03434181213379, "global_step": 590838, "epoch": 7118} {"train_loss": -28.0649356842041, "global_step": 590839, "epoch": 7118} {"train_loss": -28.21708106994629, "global_step": 590840, "epoch": 7118} {"train_loss": -28.094968795776367, "global_step": 590841, "epoch": 7118} {"train_loss": -28.280454635620117, "global_step": 590842, "epoch": 7118} {"train_loss": -27.986555099487305, "global_step": 590843, "epoch": 7118} {"train_loss": -28.228017807006836, "global_step": 590844, "epoch": 7118} {"train_loss": -27.998748779296875, "global_step": 590845, "epoch": 7118} {"train_loss": -28.082584381103516, "global_step": 590846, "epoch": 7118} {"train_loss": -27.989103317260742, "global_step": 590847, "epoch": 7118} {"train_loss": -27.888916015625, "global_step": 590848, "epoch": 7118} {"train_loss": -27.8532657623291, "global_step": 590849, "epoch": 7118} {"train_loss": -28.10454750061035, "global_step": 590850, "epoch": 7118} {"train_loss": -27.96034049987793, "global_step": 590851, "epoch": 7118} {"train_loss": -28.159210205078125, "global_step": 590852, "epoch": 7118} {"train_loss": -28.18169593811035, "global_step": 590853, "epoch": 7118} {"train_loss": -28.299482345581055, "global_step": 590854, "epoch": 7118} {"train_loss": -28.6473331451416, "global_step": 590855, "epoch": 7118} {"train_loss": -28.41309928894043, "global_step": 590856, "epoch": 7118} {"train_loss": -28.135435104370117, "global_step": 590857, "epoch": 7118} {"train_loss": -28.265247344970703, "global_step": 590858, "epoch": 7118} {"train_loss": -28.65986442565918, "global_step": 590859, "epoch": 7118} {"train_loss": -27.761991500854492, "global_step": 590860, "epoch": 7118} {"train_loss": -28.281940460205078, "global_step": 590861, "epoch": 7118} {"train_loss": -27.610021591186523, "global_step": 590862, "epoch": 7118} {"train_loss": -28.187103271484375, "global_step": 590863, "epoch": 7118} {"train_loss": -27.96500587463379, "global_step": 590864, "epoch": 7118} {"train_loss": -27.942594528198242, "global_step": 590865, "epoch": 7118} {"train_loss": -27.41120719909668, "global_step": 590866, "epoch": 7118} {"train_loss": -27.590518951416016, "global_step": 590867, "epoch": 7118} {"train_loss": -27.393945693969727, "global_step": 590868, "epoch": 7118} {"train_loss": -28.198461532592773, "global_step": 590869, "epoch": 7118} {"train_loss": -28.13019371032715, "global_step": 590870, "epoch": 7118} {"train_loss": -27.539905548095703, "global_step": 590871, "epoch": 7118} {"train_loss": -27.9520320892334, "global_step": 590872, "epoch": 7118} {"train_loss": -27.99152946472168, "global_step": 590873, "epoch": 7118} {"train_loss": -27.744131088256836, "global_step": 590874, "epoch": 7118} {"train_loss": -27.718114852905273, "global_step": 590875, "epoch": 7118} {"train_loss": -27.88786042454731, "global_step": 590876, "epoch": 7118, "val_loss": 6517417.0} {"train_loss": -27.291004180908203, "global_step": 590877, "epoch": 7119} {"train_loss": -26.859506607055664, "global_step": 590878, "epoch": 7119} {"train_loss": -27.382959365844727, "global_step": 590879, "epoch": 7119} {"train_loss": -27.315231323242188, "global_step": 590880, "epoch": 7119} {"train_loss": -26.76862144470215, "global_step": 590881, "epoch": 7119} {"train_loss": -26.970569610595703, "global_step": 590882, "epoch": 7119} {"train_loss": -27.27862548828125, "global_step": 590883, "epoch": 7119} {"train_loss": -27.182453155517578, "global_step": 590884, "epoch": 7119} {"train_loss": -27.336896896362305, "global_step": 590885, "epoch": 7119} {"train_loss": -27.475461959838867, "global_step": 590886, "epoch": 7119} {"train_loss": -27.351041793823242, "global_step": 590887, "epoch": 7119} {"train_loss": -27.67806053161621, "global_step": 590888, "epoch": 7119} {"train_loss": -27.332447052001953, "global_step": 590889, "epoch": 7119} {"train_loss": -27.14826011657715, "global_step": 590890, "epoch": 7119} {"train_loss": -27.25263786315918, "global_step": 590891, "epoch": 7119} {"train_loss": -27.465469360351562, "global_step": 590892, "epoch": 7119} {"train_loss": -27.444782257080078, "global_step": 590893, "epoch": 7119} {"train_loss": -27.756540298461914, "global_step": 590894, "epoch": 7119} {"train_loss": -27.73896598815918, "global_step": 590895, "epoch": 7119} {"train_loss": -27.889911651611328, "global_step": 590896, "epoch": 7119} {"train_loss": -27.528112411499023, "global_step": 590897, "epoch": 7119} {"train_loss": -27.733423233032227, "global_step": 590898, "epoch": 7119} {"train_loss": -27.705366134643555, "global_step": 590899, "epoch": 7119} {"train_loss": -27.6812686920166, "global_step": 590900, "epoch": 7119} {"train_loss": -27.817529678344727, "global_step": 590901, "epoch": 7119} {"train_loss": -27.850385665893555, "global_step": 590902, "epoch": 7119} {"train_loss": -27.569684982299805, "global_step": 590903, "epoch": 7119} {"train_loss": -27.668195724487305, "global_step": 590904, "epoch": 7119} {"train_loss": -27.75326919555664, "global_step": 590905, "epoch": 7119} {"train_loss": -28.012893676757812, "global_step": 590906, "epoch": 7119} {"train_loss": -27.649885177612305, "global_step": 590907, "epoch": 7119} {"train_loss": -27.781599044799805, "global_step": 590908, "epoch": 7119} {"train_loss": -27.761825561523438, "global_step": 590909, "epoch": 7119} {"train_loss": -27.941816329956055, "global_step": 590910, "epoch": 7119} {"train_loss": -27.8583927154541, "global_step": 590911, "epoch": 7119} {"train_loss": -27.67670249938965, "global_step": 590912, "epoch": 7119} {"train_loss": -28.011810302734375, "global_step": 590913, "epoch": 7119} {"train_loss": -27.92371940612793, "global_step": 590914, "epoch": 7119} {"train_loss": -28.04078483581543, "global_step": 590915, "epoch": 7119} {"train_loss": -28.07222557067871, "global_step": 590916, "epoch": 7119} {"train_loss": -28.277820587158203, "global_step": 590917, "epoch": 7119} {"train_loss": -28.025226593017578, "global_step": 590918, "epoch": 7119} {"train_loss": -28.08198356628418, "global_step": 590919, "epoch": 7119} {"train_loss": -28.072568893432617, "global_step": 590920, "epoch": 7119} {"train_loss": -28.444852828979492, "global_step": 590921, "epoch": 7119} {"train_loss": -28.216602325439453, "global_step": 590922, "epoch": 7119} {"train_loss": -28.12491798400879, "global_step": 590923, "epoch": 7119} {"train_loss": -28.121305465698242, "global_step": 590924, "epoch": 7119} {"train_loss": -27.761770248413086, "global_step": 590925, "epoch": 7119} {"train_loss": -28.081592559814453, "global_step": 590926, "epoch": 7119} {"train_loss": -27.91131591796875, "global_step": 590927, "epoch": 7119} {"train_loss": -28.13299560546875, "global_step": 590928, "epoch": 7119} {"train_loss": -28.248046875, "global_step": 590929, "epoch": 7119} {"train_loss": -28.62758445739746, "global_step": 590930, "epoch": 7119} {"train_loss": -27.70111083984375, "global_step": 590931, "epoch": 7119} {"train_loss": -27.9315185546875, "global_step": 590932, "epoch": 7119} {"train_loss": -27.573699951171875, "global_step": 590933, "epoch": 7119} {"train_loss": -27.47393226623535, "global_step": 590934, "epoch": 7119} {"train_loss": -27.331684112548828, "global_step": 590935, "epoch": 7119} {"train_loss": -27.579381942749023, "global_step": 590936, "epoch": 7119} {"train_loss": -28.2012939453125, "global_step": 590937, "epoch": 7119} {"train_loss": -27.633819580078125, "global_step": 590938, "epoch": 7119} {"train_loss": -27.88605308532715, "global_step": 590939, "epoch": 7119} {"train_loss": -27.956750869750977, "global_step": 590940, "epoch": 7119} {"train_loss": -27.762048721313477, "global_step": 590941, "epoch": 7119} {"train_loss": -28.22772216796875, "global_step": 590942, "epoch": 7119} {"train_loss": -28.066274642944336, "global_step": 590943, "epoch": 7119} {"train_loss": -28.033649444580078, "global_step": 590944, "epoch": 7119} {"train_loss": -27.946521759033203, "global_step": 590945, "epoch": 7119} {"train_loss": -27.964155197143555, "global_step": 590946, "epoch": 7119} {"train_loss": -27.885700225830078, "global_step": 590947, "epoch": 7119} {"train_loss": -28.117029190063477, "global_step": 590948, "epoch": 7119} {"train_loss": -28.347381591796875, "global_step": 590949, "epoch": 7119} {"train_loss": -27.87495231628418, "global_step": 590950, "epoch": 7119} {"train_loss": -28.199853897094727, "global_step": 590951, "epoch": 7119} {"train_loss": -28.017017364501953, "global_step": 590952, "epoch": 7119} {"train_loss": -28.047977447509766, "global_step": 590953, "epoch": 7119} {"train_loss": -27.807239532470703, "global_step": 590954, "epoch": 7119} {"train_loss": -28.201414108276367, "global_step": 590955, "epoch": 7119} {"train_loss": -28.13567543029785, "global_step": 590956, "epoch": 7119} {"train_loss": -27.7606258392334, "global_step": 590957, "epoch": 7119} {"train_loss": -27.966703414916992, "global_step": 590958, "epoch": 7119} {"train_loss": -27.8002757566521, "global_step": 590959, "epoch": 7119, "val_loss": 6512174.0} {"train_loss": -25.845294952392578, "global_step": 590960, "epoch": 7120} {"train_loss": -25.67682456970215, "global_step": 590961, "epoch": 7120} {"train_loss": -26.793264389038086, "global_step": 590962, "epoch": 7120} {"train_loss": -26.861082077026367, "global_step": 590963, "epoch": 7120} {"train_loss": -26.5179443359375, "global_step": 590964, "epoch": 7120} {"train_loss": -26.879270553588867, "global_step": 590965, "epoch": 7120} {"train_loss": -27.241641998291016, "global_step": 590966, "epoch": 7120} {"train_loss": -26.419260025024414, "global_step": 590967, "epoch": 7120} {"train_loss": -27.161752700805664, "global_step": 590968, "epoch": 7120} {"train_loss": -27.363208770751953, "global_step": 590969, "epoch": 7120} {"train_loss": -26.934375762939453, "global_step": 590970, "epoch": 7120} {"train_loss": -27.10916519165039, "global_step": 590971, "epoch": 7120} {"train_loss": -27.0378360748291, "global_step": 590972, "epoch": 7120} {"train_loss": -27.454309463500977, "global_step": 590973, "epoch": 7120} {"train_loss": -26.811872482299805, "global_step": 590974, "epoch": 7120} {"train_loss": -27.4647216796875, "global_step": 590975, "epoch": 7120} {"train_loss": -27.507963180541992, "global_step": 590976, "epoch": 7120} {"train_loss": -27.289554595947266, "global_step": 590977, "epoch": 7120} {"train_loss": -27.537290573120117, "global_step": 590978, "epoch": 7120} {"train_loss": -27.9489803314209, "global_step": 590979, "epoch": 7120} {"train_loss": -27.702136993408203, "global_step": 590980, "epoch": 7120} {"train_loss": -27.51592445373535, "global_step": 590981, "epoch": 7120} {"train_loss": -27.863065719604492, "global_step": 590982, "epoch": 7120} {"train_loss": -27.87875747680664, "global_step": 590983, "epoch": 7120} {"train_loss": -27.93690299987793, "global_step": 590984, "epoch": 7120} {"train_loss": -27.68132972717285, "global_step": 590985, "epoch": 7120} {"train_loss": -27.944904327392578, "global_step": 590986, "epoch": 7120} {"train_loss": -27.6411190032959, "global_step": 590987, "epoch": 7120} {"train_loss": -27.55757713317871, "global_step": 590988, "epoch": 7120} {"train_loss": -27.662397384643555, "global_step": 590989, "epoch": 7120} {"train_loss": -27.812957763671875, "global_step": 590990, "epoch": 7120} {"train_loss": -27.375675201416016, "global_step": 590991, "epoch": 7120} {"train_loss": -27.50089454650879, "global_step": 590992, "epoch": 7120} {"train_loss": -27.77884292602539, "global_step": 590993, "epoch": 7120} {"train_loss": -27.710315704345703, "global_step": 590994, "epoch": 7120} {"train_loss": -28.084609985351562, "global_step": 590995, "epoch": 7120} {"train_loss": -27.912378311157227, "global_step": 590996, "epoch": 7120} {"train_loss": -27.809064865112305, "global_step": 590997, "epoch": 7120} {"train_loss": -27.797016143798828, "global_step": 590998, "epoch": 7120} {"train_loss": -27.87530517578125, "global_step": 590999, "epoch": 7120} {"train_loss": -28.13014030456543, "global_step": 591000, "epoch": 7120} {"train_loss": -27.84650230407715, "global_step": 591001, "epoch": 7120} {"train_loss": -28.254135131835938, "global_step": 591002, "epoch": 7120} {"train_loss": -28.048532485961914, "global_step": 591003, "epoch": 7120} {"train_loss": -27.788938522338867, "global_step": 591004, "epoch": 7120} {"train_loss": -27.79073143005371, "global_step": 591005, "epoch": 7120} {"train_loss": -27.88092041015625, "global_step": 591006, "epoch": 7120} {"train_loss": -28.119482040405273, "global_step": 591007, "epoch": 7120} {"train_loss": -27.825428009033203, "global_step": 591008, "epoch": 7120} {"train_loss": -27.74708366394043, "global_step": 591009, "epoch": 7120} {"train_loss": -27.722681045532227, "global_step": 591010, "epoch": 7120} {"train_loss": -28.165380477905273, "global_step": 591011, "epoch": 7120} {"train_loss": -27.860198974609375, "global_step": 591012, "epoch": 7120} {"train_loss": -27.917255401611328, "global_step": 591013, "epoch": 7120} {"train_loss": -27.504541397094727, "global_step": 591014, "epoch": 7120} {"train_loss": -28.061725616455078, "global_step": 591015, "epoch": 7120} {"train_loss": -27.73028564453125, "global_step": 591016, "epoch": 7120} {"train_loss": -28.098556518554688, "global_step": 591017, "epoch": 7120} {"train_loss": -27.17002296447754, "global_step": 591018, "epoch": 7120} {"train_loss": -26.1429500579834, "global_step": 591019, "epoch": 7120} {"train_loss": -26.4666805267334, "global_step": 591020, "epoch": 7120} {"train_loss": -27.47930908203125, "global_step": 591021, "epoch": 7120} {"train_loss": -27.037261962890625, "global_step": 591022, "epoch": 7120} {"train_loss": -26.783552169799805, "global_step": 591023, "epoch": 7120} {"train_loss": -27.438810348510742, "global_step": 591024, "epoch": 7120} {"train_loss": -27.375782012939453, "global_step": 591025, "epoch": 7120} {"train_loss": -27.873960494995117, "global_step": 591026, "epoch": 7120} {"train_loss": -26.662662506103516, "global_step": 591027, "epoch": 7120} {"train_loss": -27.260602951049805, "global_step": 591028, "epoch": 7120} {"train_loss": -27.191930770874023, "global_step": 591029, "epoch": 7120} {"train_loss": -27.34541130065918, "global_step": 591030, "epoch": 7120} {"train_loss": -27.555438995361328, "global_step": 591031, "epoch": 7120} {"train_loss": -27.68653678894043, "global_step": 591032, "epoch": 7120} {"train_loss": -27.297571182250977, "global_step": 591033, "epoch": 7120} {"train_loss": -27.36749267578125, "global_step": 591034, "epoch": 7120} {"train_loss": -27.359907150268555, "global_step": 591035, "epoch": 7120} {"train_loss": -27.7673282623291, "global_step": 591036, "epoch": 7120} {"train_loss": -27.635990142822266, "global_step": 591037, "epoch": 7120} {"train_loss": -27.829639434814453, "global_step": 591038, "epoch": 7120} {"train_loss": -27.81341552734375, "global_step": 591039, "epoch": 7120} {"train_loss": -27.585132598876953, "global_step": 591040, "epoch": 7120} {"train_loss": -27.693283081054688, "global_step": 591041, "epoch": 7120} {"train_loss": -27.474090277430523, "global_step": 591042, "epoch": 7120, "val_loss": 6586085.0} {"train_loss": -27.448347091674805, "global_step": 591043, "epoch": 7121} {"train_loss": -27.338882446289062, "global_step": 591044, "epoch": 7121} {"train_loss": -27.52705192565918, "global_step": 591045, "epoch": 7121} {"train_loss": -27.468494415283203, "global_step": 591046, "epoch": 7121} {"train_loss": -27.393964767456055, "global_step": 591047, "epoch": 7121} {"train_loss": -27.88315200805664, "global_step": 591048, "epoch": 7121} {"train_loss": -27.32074546813965, "global_step": 591049, "epoch": 7121} {"train_loss": -27.561878204345703, "global_step": 591050, "epoch": 7121} {"train_loss": -27.650434494018555, "global_step": 591051, "epoch": 7121} {"train_loss": -27.810468673706055, "global_step": 591052, "epoch": 7121} {"train_loss": -27.635339736938477, "global_step": 591053, "epoch": 7121} {"train_loss": -27.4317684173584, "global_step": 591054, "epoch": 7121} {"train_loss": -27.809743881225586, "global_step": 591055, "epoch": 7121} {"train_loss": -27.764423370361328, "global_step": 591056, "epoch": 7121} {"train_loss": -27.93317985534668, "global_step": 591057, "epoch": 7121} {"train_loss": -27.942474365234375, "global_step": 591058, "epoch": 7121} {"train_loss": -27.480382919311523, "global_step": 591059, "epoch": 7121} {"train_loss": -28.18121910095215, "global_step": 591060, "epoch": 7121} {"train_loss": -27.507177352905273, "global_step": 591061, "epoch": 7121} {"train_loss": -27.54315185546875, "global_step": 591062, "epoch": 7121} {"train_loss": -28.111230850219727, "global_step": 591063, "epoch": 7121} {"train_loss": -27.861618041992188, "global_step": 591064, "epoch": 7121} {"train_loss": -28.038787841796875, "global_step": 591065, "epoch": 7121} {"train_loss": -28.16401481628418, "global_step": 591066, "epoch": 7121} {"train_loss": -27.79547691345215, "global_step": 591067, "epoch": 7121} {"train_loss": -27.886642456054688, "global_step": 591068, "epoch": 7121} {"train_loss": -28.012174606323242, "global_step": 591069, "epoch": 7121} {"train_loss": -28.196176528930664, "global_step": 591070, "epoch": 7121} {"train_loss": -28.197647094726562, "global_step": 591071, "epoch": 7121} {"train_loss": -27.842687606811523, "global_step": 591072, "epoch": 7121} {"train_loss": -28.1629581451416, "global_step": 591073, "epoch": 7121} {"train_loss": -28.0429744720459, "global_step": 591074, "epoch": 7121} {"train_loss": -27.87652015686035, "global_step": 591075, "epoch": 7121} {"train_loss": -27.963796615600586, "global_step": 591076, "epoch": 7121} {"train_loss": -27.947050094604492, "global_step": 591077, "epoch": 7121} {"train_loss": -28.018310546875, "global_step": 591078, "epoch": 7121} {"train_loss": -27.839141845703125, "global_step": 591079, "epoch": 7121} {"train_loss": -28.128498077392578, "global_step": 591080, "epoch": 7121} {"train_loss": -27.88690757751465, "global_step": 591081, "epoch": 7121} {"train_loss": -27.63355827331543, "global_step": 591082, "epoch": 7121} {"train_loss": -27.69577407836914, "global_step": 591083, "epoch": 7121} {"train_loss": -28.075056076049805, "global_step": 591084, "epoch": 7121} {"train_loss": -27.817047119140625, "global_step": 591085, "epoch": 7121} {"train_loss": -27.830419540405273, "global_step": 591086, "epoch": 7121} {"train_loss": -27.767175674438477, "global_step": 591087, "epoch": 7121} {"train_loss": -28.036880493164062, "global_step": 591088, "epoch": 7121} {"train_loss": -28.402576446533203, "global_step": 591089, "epoch": 7121} {"train_loss": -28.038190841674805, "global_step": 591090, "epoch": 7121} {"train_loss": -27.937849044799805, "global_step": 591091, "epoch": 7121} {"train_loss": -28.233325958251953, "global_step": 591092, "epoch": 7121} {"train_loss": -27.725004196166992, "global_step": 591093, "epoch": 7121} {"train_loss": -28.092132568359375, "global_step": 591094, "epoch": 7121} {"train_loss": -27.90476417541504, "global_step": 591095, "epoch": 7121} {"train_loss": -27.864423751831055, "global_step": 591096, "epoch": 7121} {"train_loss": -28.20345115661621, "global_step": 591097, "epoch": 7121} {"train_loss": -28.1750545501709, "global_step": 591098, "epoch": 7121} {"train_loss": -27.91727638244629, "global_step": 591099, "epoch": 7121} {"train_loss": -28.0324764251709, "global_step": 591100, "epoch": 7121} {"train_loss": -28.103473663330078, "global_step": 591101, "epoch": 7121} {"train_loss": -27.79377555847168, "global_step": 591102, "epoch": 7121} {"train_loss": -27.621469497680664, "global_step": 591103, "epoch": 7121} {"train_loss": -28.04429054260254, "global_step": 591104, "epoch": 7121} {"train_loss": -28.183734893798828, "global_step": 591105, "epoch": 7121} {"train_loss": -28.006322860717773, "global_step": 591106, "epoch": 7121} {"train_loss": -27.9602108001709, "global_step": 591107, "epoch": 7121} {"train_loss": -28.009735107421875, "global_step": 591108, "epoch": 7121} {"train_loss": -28.41908073425293, "global_step": 591109, "epoch": 7121} {"train_loss": -27.900678634643555, "global_step": 591110, "epoch": 7121} {"train_loss": -28.419889450073242, "global_step": 591111, "epoch": 7121} {"train_loss": -28.1475830078125, "global_step": 591112, "epoch": 7121} {"train_loss": -28.321903228759766, "global_step": 591113, "epoch": 7121} {"train_loss": -27.96571159362793, "global_step": 591114, "epoch": 7121} {"train_loss": -28.356216430664062, "global_step": 591115, "epoch": 7121} {"train_loss": -28.091632843017578, "global_step": 591116, "epoch": 7121} {"train_loss": -28.26856803894043, "global_step": 591117, "epoch": 7121} {"train_loss": -27.770374298095703, "global_step": 591118, "epoch": 7121} {"train_loss": -27.0793399810791, "global_step": 591119, "epoch": 7121} {"train_loss": -27.423919677734375, "global_step": 591120, "epoch": 7121} {"train_loss": -27.968244552612305, "global_step": 591121, "epoch": 7121} {"train_loss": -27.79678726196289, "global_step": 591122, "epoch": 7121} {"train_loss": -28.12386131286621, "global_step": 591123, "epoch": 7121} {"train_loss": -27.861148834228516, "global_step": 591124, "epoch": 7121} {"train_loss": -27.881942128560627, "global_step": 591125, "epoch": 7121, "val_loss": 6609497.5} {"train_loss": -26.04620361328125, "global_step": 591126, "epoch": 7122} {"train_loss": -27.27008628845215, "global_step": 591127, "epoch": 7122} {"train_loss": -27.32026481628418, "global_step": 591128, "epoch": 7122} {"train_loss": -25.82695960998535, "global_step": 591129, "epoch": 7122} {"train_loss": -27.57809829711914, "global_step": 591130, "epoch": 7122} {"train_loss": -26.692371368408203, "global_step": 591131, "epoch": 7122} {"train_loss": -27.797155380249023, "global_step": 591132, "epoch": 7122} {"train_loss": -26.701629638671875, "global_step": 591133, "epoch": 7122} {"train_loss": -27.31514549255371, "global_step": 591134, "epoch": 7122} {"train_loss": -26.90004539489746, "global_step": 591135, "epoch": 7122} {"train_loss": -27.345136642456055, "global_step": 591136, "epoch": 7122} {"train_loss": -27.375812530517578, "global_step": 591137, "epoch": 7122} {"train_loss": -27.409320831298828, "global_step": 591138, "epoch": 7122} {"train_loss": -27.376005172729492, "global_step": 591139, "epoch": 7122} {"train_loss": -27.51604652404785, "global_step": 591140, "epoch": 7122} {"train_loss": -27.33574867248535, "global_step": 591141, "epoch": 7122} {"train_loss": -27.370162963867188, "global_step": 591142, "epoch": 7122} {"train_loss": -27.81511878967285, "global_step": 591143, "epoch": 7122} {"train_loss": -27.80902099609375, "global_step": 591144, "epoch": 7122} {"train_loss": -27.55356788635254, "global_step": 591145, "epoch": 7122} {"train_loss": -27.441553115844727, "global_step": 591146, "epoch": 7122} {"train_loss": -27.5456485748291, "global_step": 591147, "epoch": 7122} {"train_loss": -27.47637939453125, "global_step": 591148, "epoch": 7122} {"train_loss": -27.7462215423584, "global_step": 591149, "epoch": 7122} {"train_loss": -27.8784122467041, "global_step": 591150, "epoch": 7122} {"train_loss": -27.589258193969727, "global_step": 591151, "epoch": 7122} {"train_loss": -27.70944595336914, "global_step": 591152, "epoch": 7122} {"train_loss": -28.132604598999023, "global_step": 591153, "epoch": 7122} {"train_loss": -28.205106735229492, "global_step": 591154, "epoch": 7122} {"train_loss": -27.85053825378418, "global_step": 591155, "epoch": 7122} {"train_loss": -27.553516387939453, "global_step": 591156, "epoch": 7122} {"train_loss": -28.217269897460938, "global_step": 591157, "epoch": 7122} {"train_loss": -27.9705753326416, "global_step": 591158, "epoch": 7122} {"train_loss": -28.034971237182617, "global_step": 591159, "epoch": 7122} {"train_loss": -27.933822631835938, "global_step": 591160, "epoch": 7122} {"train_loss": -28.09954833984375, "global_step": 591161, "epoch": 7122} {"train_loss": -28.114898681640625, "global_step": 591162, "epoch": 7122} {"train_loss": -28.181127548217773, "global_step": 591163, "epoch": 7122} {"train_loss": -28.04011344909668, "global_step": 591164, "epoch": 7122} {"train_loss": -27.618322372436523, "global_step": 591165, "epoch": 7122} {"train_loss": -28.020978927612305, "global_step": 591166, "epoch": 7122} {"train_loss": -28.17877769470215, "global_step": 591167, "epoch": 7122} {"train_loss": -28.084461212158203, "global_step": 591168, "epoch": 7122} {"train_loss": -28.238386154174805, "global_step": 591169, "epoch": 7122} {"train_loss": -28.265644073486328, "global_step": 591170, "epoch": 7122} {"train_loss": -27.55421257019043, "global_step": 591171, "epoch": 7122} {"train_loss": -27.95723533630371, "global_step": 591172, "epoch": 7122} {"train_loss": -28.053577423095703, "global_step": 591173, "epoch": 7122} {"train_loss": -28.2670841217041, "global_step": 591174, "epoch": 7122} {"train_loss": -28.101612091064453, "global_step": 591175, "epoch": 7122} {"train_loss": -28.411636352539062, "global_step": 591176, "epoch": 7122} {"train_loss": -27.938745498657227, "global_step": 591177, "epoch": 7122} {"train_loss": -27.737628936767578, "global_step": 591178, "epoch": 7122} {"train_loss": -27.845840454101562, "global_step": 591179, "epoch": 7122} {"train_loss": -28.140485763549805, "global_step": 591180, "epoch": 7122} {"train_loss": -27.805822372436523, "global_step": 591181, "epoch": 7122} {"train_loss": -27.9318904876709, "global_step": 591182, "epoch": 7122} {"train_loss": -28.146991729736328, "global_step": 591183, "epoch": 7122} {"train_loss": -28.076465606689453, "global_step": 591184, "epoch": 7122} {"train_loss": -27.909149169921875, "global_step": 591185, "epoch": 7122} {"train_loss": -27.746305465698242, "global_step": 591186, "epoch": 7122} {"train_loss": -27.962736129760742, "global_step": 591187, "epoch": 7122} {"train_loss": -28.131393432617188, "global_step": 591188, "epoch": 7122} {"train_loss": -27.929889678955078, "global_step": 591189, "epoch": 7122} {"train_loss": -28.085391998291016, "global_step": 591190, "epoch": 7122} {"train_loss": -27.711780548095703, "global_step": 591191, "epoch": 7122} {"train_loss": -28.06494140625, "global_step": 591192, "epoch": 7122} {"train_loss": -27.767053604125977, "global_step": 591193, "epoch": 7122} {"train_loss": -27.670026779174805, "global_step": 591194, "epoch": 7122} {"train_loss": -28.012094497680664, "global_step": 591195, "epoch": 7122} {"train_loss": -28.0211124420166, "global_step": 591196, "epoch": 7122} {"train_loss": -28.06154441833496, "global_step": 591197, "epoch": 7122} {"train_loss": -27.850494384765625, "global_step": 591198, "epoch": 7122} {"train_loss": -28.211347579956055, "global_step": 591199, "epoch": 7122} {"train_loss": -27.967065811157227, "global_step": 591200, "epoch": 7122} {"train_loss": -27.914304733276367, "global_step": 591201, "epoch": 7122} {"train_loss": -28.175189971923828, "global_step": 591202, "epoch": 7122} {"train_loss": -28.093530654907227, "global_step": 591203, "epoch": 7122} {"train_loss": -28.277145385742188, "global_step": 591204, "epoch": 7122} {"train_loss": -28.36040687561035, "global_step": 591205, "epoch": 7122} {"train_loss": -28.041513442993164, "global_step": 591206, "epoch": 7122} {"train_loss": -27.78521728515625, "global_step": 591207, "epoch": 7122} {"train_loss": -27.79374984373529, "global_step": 591208, "epoch": 7122, "val_loss": 6498127.5} {"train_loss": -26.867584228515625, "global_step": 591209, "epoch": 7123} {"train_loss": -26.8411808013916, "global_step": 591210, "epoch": 7123} {"train_loss": -27.573575973510742, "global_step": 591211, "epoch": 7123} {"train_loss": -26.674047470092773, "global_step": 591212, "epoch": 7123} {"train_loss": -26.879690170288086, "global_step": 591213, "epoch": 7123} {"train_loss": -26.6492977142334, "global_step": 591214, "epoch": 7123} {"train_loss": -27.33841896057129, "global_step": 591215, "epoch": 7123} {"train_loss": -27.54085350036621, "global_step": 591216, "epoch": 7123} {"train_loss": -27.249616622924805, "global_step": 591217, "epoch": 7123} {"train_loss": -27.446308135986328, "global_step": 591218, "epoch": 7123} {"train_loss": -27.080713272094727, "global_step": 591219, "epoch": 7123} {"train_loss": -27.755624771118164, "global_step": 591220, "epoch": 7123} {"train_loss": -27.291234970092773, "global_step": 591221, "epoch": 7123} {"train_loss": -27.568090438842773, "global_step": 591222, "epoch": 7123} {"train_loss": -27.67571449279785, "global_step": 591223, "epoch": 7123} {"train_loss": -27.201007843017578, "global_step": 591224, "epoch": 7123} {"train_loss": -27.547321319580078, "global_step": 591225, "epoch": 7123} {"train_loss": -27.386798858642578, "global_step": 591226, "epoch": 7123} {"train_loss": -28.044092178344727, "global_step": 591227, "epoch": 7123} {"train_loss": -27.513402938842773, "global_step": 591228, "epoch": 7123} {"train_loss": -27.5687198638916, "global_step": 591229, "epoch": 7123} {"train_loss": -27.5958309173584, "global_step": 591230, "epoch": 7123} {"train_loss": -27.35334587097168, "global_step": 591231, "epoch": 7123} {"train_loss": -27.74342918395996, "global_step": 591232, "epoch": 7123} {"train_loss": -28.21866226196289, "global_step": 591233, "epoch": 7123} {"train_loss": -27.86109733581543, "global_step": 591234, "epoch": 7123} {"train_loss": -28.04947280883789, "global_step": 591235, "epoch": 7123} {"train_loss": -27.29840087890625, "global_step": 591236, "epoch": 7123} {"train_loss": -27.720434188842773, "global_step": 591237, "epoch": 7123} {"train_loss": -27.806974411010742, "global_step": 591238, "epoch": 7123} {"train_loss": -27.596521377563477, "global_step": 591239, "epoch": 7123} {"train_loss": -27.995691299438477, "global_step": 591240, "epoch": 7123} {"train_loss": -27.907758712768555, "global_step": 591241, "epoch": 7123} {"train_loss": -28.13788414001465, "global_step": 591242, "epoch": 7123} {"train_loss": -28.217416763305664, "global_step": 591243, "epoch": 7123} {"train_loss": -28.250274658203125, "global_step": 591244, "epoch": 7123} {"train_loss": -28.19927978515625, "global_step": 591245, "epoch": 7123} {"train_loss": -28.035568237304688, "global_step": 591246, "epoch": 7123} {"train_loss": -27.923995971679688, "global_step": 591247, "epoch": 7123} {"train_loss": -28.1693058013916, "global_step": 591248, "epoch": 7123} {"train_loss": -28.06574058532715, "global_step": 591249, "epoch": 7123} {"train_loss": -27.755390167236328, "global_step": 591250, "epoch": 7123} {"train_loss": -27.91151237487793, "global_step": 591251, "epoch": 7123} {"train_loss": -28.004779815673828, "global_step": 591252, "epoch": 7123} {"train_loss": -28.13557243347168, "global_step": 591253, "epoch": 7123} {"train_loss": -28.55921745300293, "global_step": 591254, "epoch": 7123} {"train_loss": -27.982318878173828, "global_step": 591255, "epoch": 7123} {"train_loss": -28.225900650024414, "global_step": 591256, "epoch": 7123} {"train_loss": -28.33380699157715, "global_step": 591257, "epoch": 7123} {"train_loss": -28.045129776000977, "global_step": 591258, "epoch": 7123} {"train_loss": -28.351343154907227, "global_step": 591259, "epoch": 7123} {"train_loss": -28.280622482299805, "global_step": 591260, "epoch": 7123} {"train_loss": -28.139326095581055, "global_step": 591261, "epoch": 7123} {"train_loss": -28.20918083190918, "global_step": 591262, "epoch": 7123} {"train_loss": -28.292028427124023, "global_step": 591263, "epoch": 7123} {"train_loss": -28.424213409423828, "global_step": 591264, "epoch": 7123} {"train_loss": -28.645660400390625, "global_step": 591265, "epoch": 7123} {"train_loss": -28.035297393798828, "global_step": 591266, "epoch": 7123} {"train_loss": -28.223297119140625, "global_step": 591267, "epoch": 7123} {"train_loss": -27.975507736206055, "global_step": 591268, "epoch": 7123} {"train_loss": -28.31839370727539, "global_step": 591269, "epoch": 7123} {"train_loss": -28.149658203125, "global_step": 591270, "epoch": 7123} {"train_loss": -28.357498168945312, "global_step": 591271, "epoch": 7123} {"train_loss": -28.014373779296875, "global_step": 591272, "epoch": 7123} {"train_loss": -28.078662872314453, "global_step": 591273, "epoch": 7123} {"train_loss": -27.351476669311523, "global_step": 591274, "epoch": 7123} {"train_loss": -26.716846466064453, "global_step": 591275, "epoch": 7123} {"train_loss": -26.75238609313965, "global_step": 591276, "epoch": 7123} {"train_loss": -26.780588150024414, "global_step": 591277, "epoch": 7123} {"train_loss": -27.83564567565918, "global_step": 591278, "epoch": 7123} {"train_loss": -27.4497127532959, "global_step": 591279, "epoch": 7123} {"train_loss": -26.95199966430664, "global_step": 591280, "epoch": 7123} {"train_loss": -26.59524917602539, "global_step": 591281, "epoch": 7123} {"train_loss": -27.362375259399414, "global_step": 591282, "epoch": 7123} {"train_loss": -27.918943405151367, "global_step": 591283, "epoch": 7123} {"train_loss": -26.757553100585938, "global_step": 591284, "epoch": 7123} {"train_loss": -27.014362335205078, "global_step": 591285, "epoch": 7123} {"train_loss": -27.94367027282715, "global_step": 591286, "epoch": 7123} {"train_loss": -27.705564498901367, "global_step": 591287, "epoch": 7123} {"train_loss": -27.350812911987305, "global_step": 591288, "epoch": 7123} {"train_loss": -27.685138702392578, "global_step": 591289, "epoch": 7123} {"train_loss": -27.497180938720703, "global_step": 591290, "epoch": 7123} {"train_loss": -27.690863666764226, "global_step": 591291, "epoch": 7123, "val_loss": 6656207.0} {"train_loss": -27.13953971862793, "global_step": 591292, "epoch": 7124} {"train_loss": -26.633121490478516, "global_step": 591293, "epoch": 7124} {"train_loss": -26.777114868164062, "global_step": 591294, "epoch": 7124} {"train_loss": -26.765771865844727, "global_step": 591295, "epoch": 7124} {"train_loss": -26.384679794311523, "global_step": 591296, "epoch": 7124} {"train_loss": -26.635574340820312, "global_step": 591297, "epoch": 7124} {"train_loss": -27.1474609375, "global_step": 591298, "epoch": 7124} {"train_loss": -27.09120750427246, "global_step": 591299, "epoch": 7124} {"train_loss": -26.586145401000977, "global_step": 591300, "epoch": 7124} {"train_loss": -27.191299438476562, "global_step": 591301, "epoch": 7124} {"train_loss": -26.94179344177246, "global_step": 591302, "epoch": 7124} {"train_loss": -27.013671875, "global_step": 591303, "epoch": 7124} {"train_loss": -27.295562744140625, "global_step": 591304, "epoch": 7124} {"train_loss": -27.095556259155273, "global_step": 591305, "epoch": 7124} {"train_loss": -27.39969825744629, "global_step": 591306, "epoch": 7124} {"train_loss": -27.022998809814453, "global_step": 591307, "epoch": 7124} {"train_loss": -27.611310958862305, "global_step": 591308, "epoch": 7124} {"train_loss": -27.196455001831055, "global_step": 591309, "epoch": 7124} {"train_loss": -27.351226806640625, "global_step": 591310, "epoch": 7124} {"train_loss": -27.702707290649414, "global_step": 591311, "epoch": 7124} {"train_loss": -27.574331283569336, "global_step": 591312, "epoch": 7124} {"train_loss": -27.54890251159668, "global_step": 591313, "epoch": 7124} {"train_loss": -27.37993812561035, "global_step": 591314, "epoch": 7124} {"train_loss": -27.229398727416992, "global_step": 591315, "epoch": 7124} {"train_loss": -27.732013702392578, "global_step": 591316, "epoch": 7124} {"train_loss": -27.620885848999023, "global_step": 591317, "epoch": 7124} {"train_loss": -27.42327880859375, "global_step": 591318, "epoch": 7124} {"train_loss": -27.790546417236328, "global_step": 591319, "epoch": 7124} {"train_loss": -27.9722957611084, "global_step": 591320, "epoch": 7124} {"train_loss": -28.064062118530273, "global_step": 591321, "epoch": 7124} {"train_loss": -28.092145919799805, "global_step": 591322, "epoch": 7124} {"train_loss": -27.772842407226562, "global_step": 591323, "epoch": 7124} {"train_loss": -27.80647850036621, "global_step": 591324, "epoch": 7124} {"train_loss": -27.8695125579834, "global_step": 591325, "epoch": 7124} {"train_loss": -27.81521987915039, "global_step": 591326, "epoch": 7124} {"train_loss": -27.807687759399414, "global_step": 591327, "epoch": 7124} {"train_loss": -27.812885284423828, "global_step": 591328, "epoch": 7124} {"train_loss": -28.183561325073242, "global_step": 591329, "epoch": 7124} {"train_loss": -28.26028823852539, "global_step": 591330, "epoch": 7124} {"train_loss": -28.177947998046875, "global_step": 591331, "epoch": 7124} {"train_loss": -27.96998405456543, "global_step": 591332, "epoch": 7124} {"train_loss": -27.91012954711914, "global_step": 591333, "epoch": 7124} {"train_loss": -27.83673095703125, "global_step": 591334, "epoch": 7124} {"train_loss": -28.192371368408203, "global_step": 591335, "epoch": 7124} {"train_loss": -28.010961532592773, "global_step": 591336, "epoch": 7124} {"train_loss": -27.841938018798828, "global_step": 591337, "epoch": 7124} {"train_loss": -28.059356689453125, "global_step": 591338, "epoch": 7124} {"train_loss": -28.012624740600586, "global_step": 591339, "epoch": 7124} {"train_loss": -27.84821891784668, "global_step": 591340, "epoch": 7124} {"train_loss": -28.244770050048828, "global_step": 591341, "epoch": 7124} {"train_loss": -28.301223754882812, "global_step": 591342, "epoch": 7124} {"train_loss": -28.389738082885742, "global_step": 591343, "epoch": 7124} {"train_loss": -28.106891632080078, "global_step": 591344, "epoch": 7124} {"train_loss": -28.305883407592773, "global_step": 591345, "epoch": 7124} {"train_loss": -28.066434860229492, "global_step": 591346, "epoch": 7124} {"train_loss": -28.602548599243164, "global_step": 591347, "epoch": 7124} {"train_loss": -27.76654052734375, "global_step": 591348, "epoch": 7124} {"train_loss": -28.308578491210938, "global_step": 591349, "epoch": 7124} {"train_loss": -27.88212013244629, "global_step": 591350, "epoch": 7124} {"train_loss": -28.28378677368164, "global_step": 591351, "epoch": 7124} {"train_loss": -28.478519439697266, "global_step": 591352, "epoch": 7124} {"train_loss": -28.218353271484375, "global_step": 591353, "epoch": 7124} {"train_loss": -28.377029418945312, "global_step": 591354, "epoch": 7124} {"train_loss": -27.856063842773438, "global_step": 591355, "epoch": 7124} {"train_loss": -28.288557052612305, "global_step": 591356, "epoch": 7124} {"train_loss": -28.28607177734375, "global_step": 591357, "epoch": 7124} {"train_loss": -28.242292404174805, "global_step": 591358, "epoch": 7124} {"train_loss": -27.807498931884766, "global_step": 591359, "epoch": 7124} {"train_loss": -27.208890914916992, "global_step": 591360, "epoch": 7124} {"train_loss": -26.6213321685791, "global_step": 591361, "epoch": 7124} {"train_loss": -26.842605590820312, "global_step": 591362, "epoch": 7124} {"train_loss": -27.626855850219727, "global_step": 591363, "epoch": 7124} {"train_loss": -27.590978622436523, "global_step": 591364, "epoch": 7124} {"train_loss": -27.31654167175293, "global_step": 591365, "epoch": 7124} {"train_loss": -27.690099716186523, "global_step": 591366, "epoch": 7124} {"train_loss": -27.621631622314453, "global_step": 591367, "epoch": 7124} {"train_loss": -27.156204223632812, "global_step": 591368, "epoch": 7124} {"train_loss": -27.922170639038086, "global_step": 591369, "epoch": 7124} {"train_loss": -27.49039077758789, "global_step": 591370, "epoch": 7124} {"train_loss": -27.02369499206543, "global_step": 591371, "epoch": 7124} {"train_loss": -27.714574813842773, "global_step": 591372, "epoch": 7124} {"train_loss": -27.509458541870117, "global_step": 591373, "epoch": 7124} {"train_loss": -27.6853703648211, "global_step": 591374, "epoch": 7124, "val_loss": 6645184.0} {"train_loss": -26.8398494720459, "global_step": 591375, "epoch": 7125} {"train_loss": -27.37005615234375, "global_step": 591376, "epoch": 7125} {"train_loss": -26.671283721923828, "global_step": 591377, "epoch": 7125} {"train_loss": -27.366323471069336, "global_step": 591378, "epoch": 7125} {"train_loss": -26.978757858276367, "global_step": 591379, "epoch": 7125} {"train_loss": -27.09010124206543, "global_step": 591380, "epoch": 7125} {"train_loss": -27.416650772094727, "global_step": 591381, "epoch": 7125} {"train_loss": -26.979949951171875, "global_step": 591382, "epoch": 7125} {"train_loss": -26.90045166015625, "global_step": 591383, "epoch": 7125} {"train_loss": -27.36669921875, "global_step": 591384, "epoch": 7125} {"train_loss": -26.834808349609375, "global_step": 591385, "epoch": 7125} {"train_loss": -27.24186134338379, "global_step": 591386, "epoch": 7125} {"train_loss": -27.145553588867188, "global_step": 591387, "epoch": 7125} {"train_loss": -27.3215274810791, "global_step": 591388, "epoch": 7125} {"train_loss": -26.912145614624023, "global_step": 591389, "epoch": 7125} {"train_loss": -27.151697158813477, "global_step": 591390, "epoch": 7125} {"train_loss": -27.718286514282227, "global_step": 591391, "epoch": 7125} {"train_loss": -27.40278434753418, "global_step": 591392, "epoch": 7125} {"train_loss": -27.734033584594727, "global_step": 591393, "epoch": 7125} {"train_loss": -27.4506893157959, "global_step": 591394, "epoch": 7125} {"train_loss": -27.4793701171875, "global_step": 591395, "epoch": 7125} {"train_loss": -27.47006607055664, "global_step": 591396, "epoch": 7125} {"train_loss": -27.74720573425293, "global_step": 591397, "epoch": 7125} {"train_loss": -27.323606491088867, "global_step": 591398, "epoch": 7125} {"train_loss": -27.473886489868164, "global_step": 591399, "epoch": 7125} {"train_loss": -27.737226486206055, "global_step": 591400, "epoch": 7125} {"train_loss": -27.51844596862793, "global_step": 591401, "epoch": 7125} {"train_loss": -27.79318618774414, "global_step": 591402, "epoch": 7125} {"train_loss": -27.80698585510254, "global_step": 591403, "epoch": 7125} {"train_loss": -27.49652099609375, "global_step": 591404, "epoch": 7125} {"train_loss": -27.81123924255371, "global_step": 591405, "epoch": 7125} {"train_loss": -27.715503692626953, "global_step": 591406, "epoch": 7125} {"train_loss": -27.55328369140625, "global_step": 591407, "epoch": 7125} {"train_loss": -27.645877838134766, "global_step": 591408, "epoch": 7125} {"train_loss": -27.82899284362793, "global_step": 591409, "epoch": 7125} {"train_loss": -27.808095932006836, "global_step": 591410, "epoch": 7125} {"train_loss": -27.944091796875, "global_step": 591411, "epoch": 7125} {"train_loss": -27.78020668029785, "global_step": 591412, "epoch": 7125} {"train_loss": -27.84346580505371, "global_step": 591413, "epoch": 7125} {"train_loss": -27.626325607299805, "global_step": 591414, "epoch": 7125} {"train_loss": -28.05722999572754, "global_step": 591415, "epoch": 7125} {"train_loss": -27.612045288085938, "global_step": 591416, "epoch": 7125} {"train_loss": -28.012989044189453, "global_step": 591417, "epoch": 7125} {"train_loss": -28.274341583251953, "global_step": 591418, "epoch": 7125} {"train_loss": -27.9659366607666, "global_step": 591419, "epoch": 7125} {"train_loss": -27.798192977905273, "global_step": 591420, "epoch": 7125} {"train_loss": -27.918176651000977, "global_step": 591421, "epoch": 7125} {"train_loss": -28.254810333251953, "global_step": 591422, "epoch": 7125} {"train_loss": -28.462644577026367, "global_step": 591423, "epoch": 7125} {"train_loss": -28.48649024963379, "global_step": 591424, "epoch": 7125} {"train_loss": -28.025541305541992, "global_step": 591425, "epoch": 7125} {"train_loss": -28.237279891967773, "global_step": 591426, "epoch": 7125} {"train_loss": -28.13032341003418, "global_step": 591427, "epoch": 7125} {"train_loss": -27.98211669921875, "global_step": 591428, "epoch": 7125} {"train_loss": -28.226781845092773, "global_step": 591429, "epoch": 7125} {"train_loss": -28.450536727905273, "global_step": 591430, "epoch": 7125} {"train_loss": -27.99325942993164, "global_step": 591431, "epoch": 7125} {"train_loss": -28.190597534179688, "global_step": 591432, "epoch": 7125} {"train_loss": -28.1545467376709, "global_step": 591433, "epoch": 7125} {"train_loss": -28.165206909179688, "global_step": 591434, "epoch": 7125} {"train_loss": -28.03790283203125, "global_step": 591435, "epoch": 7125} {"train_loss": -28.201078414916992, "global_step": 591436, "epoch": 7125} {"train_loss": -28.284875869750977, "global_step": 591437, "epoch": 7125} {"train_loss": -28.126062393188477, "global_step": 591438, "epoch": 7125} {"train_loss": -28.04884147644043, "global_step": 591439, "epoch": 7125} {"train_loss": -28.024887084960938, "global_step": 591440, "epoch": 7125} {"train_loss": -28.178680419921875, "global_step": 591441, "epoch": 7125} {"train_loss": -28.363697052001953, "global_step": 591442, "epoch": 7125} {"train_loss": -28.196212768554688, "global_step": 591443, "epoch": 7125} {"train_loss": -28.096044540405273, "global_step": 591444, "epoch": 7125} {"train_loss": -28.163854598999023, "global_step": 591445, "epoch": 7125} {"train_loss": -28.34681510925293, "global_step": 591446, "epoch": 7125} {"train_loss": -28.363773345947266, "global_step": 591447, "epoch": 7125} {"train_loss": -27.92868423461914, "global_step": 591448, "epoch": 7125} {"train_loss": -28.54825782775879, "global_step": 591449, "epoch": 7125} {"train_loss": -28.44757080078125, "global_step": 591450, "epoch": 7125} {"train_loss": -28.169797897338867, "global_step": 591451, "epoch": 7125} {"train_loss": -27.988874435424805, "global_step": 591452, "epoch": 7125} {"train_loss": -27.460432052612305, "global_step": 591453, "epoch": 7125} {"train_loss": -26.779890060424805, "global_step": 591454, "epoch": 7125} {"train_loss": -26.96363639831543, "global_step": 591455, "epoch": 7125} {"train_loss": -27.033857345581055, "global_step": 591456, "epoch": 7125} {"train_loss": -27.748132567807854, "global_step": 591457, "epoch": 7125, "val_loss": 6600318.0} {"train_loss": -24.96771812438965, "global_step": 591458, "epoch": 7126} {"train_loss": -26.132139205932617, "global_step": 591459, "epoch": 7126} {"train_loss": -26.917646408081055, "global_step": 591460, "epoch": 7126} {"train_loss": -25.976974487304688, "global_step": 591461, "epoch": 7126} {"train_loss": -25.761255264282227, "global_step": 591462, "epoch": 7126} {"train_loss": -26.856260299682617, "global_step": 591463, "epoch": 7126} {"train_loss": -26.4088191986084, "global_step": 591464, "epoch": 7126} {"train_loss": -27.020313262939453, "global_step": 591465, "epoch": 7126} {"train_loss": -26.696826934814453, "global_step": 591466, "epoch": 7126} {"train_loss": -26.908828735351562, "global_step": 591467, "epoch": 7126} {"train_loss": -27.08674430847168, "global_step": 591468, "epoch": 7126} {"train_loss": -26.680448532104492, "global_step": 591469, "epoch": 7126} {"train_loss": -27.0108699798584, "global_step": 591470, "epoch": 7126} {"train_loss": -27.519454956054688, "global_step": 591471, "epoch": 7126} {"train_loss": -27.29090690612793, "global_step": 591472, "epoch": 7126} {"train_loss": -27.1030216217041, "global_step": 591473, "epoch": 7126} {"train_loss": -26.91192626953125, "global_step": 591474, "epoch": 7126} {"train_loss": -27.001922607421875, "global_step": 591475, "epoch": 7126} {"train_loss": -26.85650062561035, "global_step": 591476, "epoch": 7126} {"train_loss": -27.25309181213379, "global_step": 591477, "epoch": 7126} {"train_loss": -27.465789794921875, "global_step": 591478, "epoch": 7126} {"train_loss": -27.245758056640625, "global_step": 591479, "epoch": 7126} {"train_loss": -27.437637329101562, "global_step": 591480, "epoch": 7126} {"train_loss": -27.33489990234375, "global_step": 591481, "epoch": 7126} {"train_loss": -27.2698917388916, "global_step": 591482, "epoch": 7126} {"train_loss": -27.436132431030273, "global_step": 591483, "epoch": 7126} {"train_loss": -27.402801513671875, "global_step": 591484, "epoch": 7126} {"train_loss": -27.206357955932617, "global_step": 591485, "epoch": 7126} {"train_loss": -27.314319610595703, "global_step": 591486, "epoch": 7126} {"train_loss": -27.489561080932617, "global_step": 591487, "epoch": 7126} {"train_loss": -27.491758346557617, "global_step": 591488, "epoch": 7126} {"train_loss": -27.270069122314453, "global_step": 591489, "epoch": 7126} {"train_loss": -28.023923873901367, "global_step": 591490, "epoch": 7126} {"train_loss": -27.321989059448242, "global_step": 591491, "epoch": 7126} {"train_loss": -27.4481201171875, "global_step": 591492, "epoch": 7126} {"train_loss": -27.72369384765625, "global_step": 591493, "epoch": 7126} {"train_loss": -27.297815322875977, "global_step": 591494, "epoch": 7126} {"train_loss": -27.8229923248291, "global_step": 591495, "epoch": 7126} {"train_loss": -27.65411949157715, "global_step": 591496, "epoch": 7126} {"train_loss": -27.670639038085938, "global_step": 591497, "epoch": 7126} {"train_loss": -27.627145767211914, "global_step": 591498, "epoch": 7126} {"train_loss": -27.493396759033203, "global_step": 591499, "epoch": 7126} {"train_loss": -27.970075607299805, "global_step": 591500, "epoch": 7126} {"train_loss": -27.94390869140625, "global_step": 591501, "epoch": 7126} {"train_loss": -27.946752548217773, "global_step": 591502, "epoch": 7126} {"train_loss": -27.916980743408203, "global_step": 591503, "epoch": 7126} {"train_loss": -27.880542755126953, "global_step": 591504, "epoch": 7126} {"train_loss": -28.177682876586914, "global_step": 591505, "epoch": 7126} {"train_loss": -28.157032012939453, "global_step": 591506, "epoch": 7126} {"train_loss": -27.7752628326416, "global_step": 591507, "epoch": 7126} {"train_loss": -27.99859046936035, "global_step": 591508, "epoch": 7126} {"train_loss": -27.77699089050293, "global_step": 591509, "epoch": 7126} {"train_loss": -27.795795440673828, "global_step": 591510, "epoch": 7126} {"train_loss": -27.87334632873535, "global_step": 591511, "epoch": 7126} {"train_loss": -28.030797958374023, "global_step": 591512, "epoch": 7126} {"train_loss": -28.392547607421875, "global_step": 591513, "epoch": 7126} {"train_loss": -28.221540451049805, "global_step": 591514, "epoch": 7126} {"train_loss": -28.244049072265625, "global_step": 591515, "epoch": 7126} {"train_loss": -28.022001266479492, "global_step": 591516, "epoch": 7126} {"train_loss": -28.119733810424805, "global_step": 591517, "epoch": 7126} {"train_loss": -28.252456665039062, "global_step": 591518, "epoch": 7126} {"train_loss": -28.18440818786621, "global_step": 591519, "epoch": 7126} {"train_loss": -27.842422485351562, "global_step": 591520, "epoch": 7126} {"train_loss": -28.180932998657227, "global_step": 591521, "epoch": 7126} {"train_loss": -28.253950119018555, "global_step": 591522, "epoch": 7126} {"train_loss": -28.31984519958496, "global_step": 591523, "epoch": 7126} {"train_loss": -28.096826553344727, "global_step": 591524, "epoch": 7126} {"train_loss": -28.01047134399414, "global_step": 591525, "epoch": 7126} {"train_loss": -28.19120216369629, "global_step": 591526, "epoch": 7126} {"train_loss": -28.03077507019043, "global_step": 591527, "epoch": 7126} {"train_loss": -28.129804611206055, "global_step": 591528, "epoch": 7126} {"train_loss": -28.09100914001465, "global_step": 591529, "epoch": 7126} {"train_loss": -27.70623779296875, "global_step": 591530, "epoch": 7126} {"train_loss": -28.026498794555664, "global_step": 591531, "epoch": 7126} {"train_loss": -28.469013214111328, "global_step": 591532, "epoch": 7126} {"train_loss": -27.956235885620117, "global_step": 591533, "epoch": 7126} {"train_loss": -28.223419189453125, "global_step": 591534, "epoch": 7126} {"train_loss": -27.95318031311035, "global_step": 591535, "epoch": 7126} {"train_loss": -27.762731552124023, "global_step": 591536, "epoch": 7126} {"train_loss": -28.197223663330078, "global_step": 591537, "epoch": 7126} {"train_loss": -27.973114013671875, "global_step": 591538, "epoch": 7126} {"train_loss": -28.11471939086914, "global_step": 591539, "epoch": 7126} {"train_loss": -27.573855710316852, "global_step": 591540, "epoch": 7126, "val_loss": 6678000.5} {"train_loss": -27.153913497924805, "global_step": 591541, "epoch": 7127} {"train_loss": -26.967456817626953, "global_step": 591542, "epoch": 7127} {"train_loss": -27.350086212158203, "global_step": 591543, "epoch": 7127} {"train_loss": -27.800949096679688, "global_step": 591544, "epoch": 7127} {"train_loss": -27.804859161376953, "global_step": 591545, "epoch": 7127} {"train_loss": -27.564208984375, "global_step": 591546, "epoch": 7127} {"train_loss": -27.61383628845215, "global_step": 591547, "epoch": 7127} {"train_loss": -27.71748161315918, "global_step": 591548, "epoch": 7127} {"train_loss": -27.406095504760742, "global_step": 591549, "epoch": 7127} {"train_loss": -27.430402755737305, "global_step": 591550, "epoch": 7127} {"train_loss": -27.58975601196289, "global_step": 591551, "epoch": 7127} {"train_loss": -27.48779296875, "global_step": 591552, "epoch": 7127} {"train_loss": -27.671655654907227, "global_step": 591553, "epoch": 7127} {"train_loss": -27.47930335998535, "global_step": 591554, "epoch": 7127} {"train_loss": -27.161291122436523, "global_step": 591555, "epoch": 7127} {"train_loss": -28.148334503173828, "global_step": 591556, "epoch": 7127} {"train_loss": -27.7557315826416, "global_step": 591557, "epoch": 7127} {"train_loss": -27.804487228393555, "global_step": 591558, "epoch": 7127} {"train_loss": -27.89316177368164, "global_step": 591559, "epoch": 7127} {"train_loss": -28.095855712890625, "global_step": 591560, "epoch": 7127} {"train_loss": -28.163862228393555, "global_step": 591561, "epoch": 7127} {"train_loss": -27.90882682800293, "global_step": 591562, "epoch": 7127} {"train_loss": -28.14959144592285, "global_step": 591563, "epoch": 7127} {"train_loss": -28.327375411987305, "global_step": 591564, "epoch": 7127} {"train_loss": -27.7899227142334, "global_step": 591565, "epoch": 7127} {"train_loss": -27.8359432220459, "global_step": 591566, "epoch": 7127} {"train_loss": -27.91773796081543, "global_step": 591567, "epoch": 7127} {"train_loss": -27.846765518188477, "global_step": 591568, "epoch": 7127} {"train_loss": -28.08013916015625, "global_step": 591569, "epoch": 7127} {"train_loss": -28.276960372924805, "global_step": 591570, "epoch": 7127} {"train_loss": -27.943456649780273, "global_step": 591571, "epoch": 7127} {"train_loss": -27.417236328125, "global_step": 591572, "epoch": 7127} {"train_loss": -27.858509063720703, "global_step": 591573, "epoch": 7127} {"train_loss": -28.055200576782227, "global_step": 591574, "epoch": 7127} {"train_loss": -27.806310653686523, "global_step": 591575, "epoch": 7127} {"train_loss": -28.295129776000977, "global_step": 591576, "epoch": 7127} {"train_loss": -27.744108200073242, "global_step": 591577, "epoch": 7127} {"train_loss": -27.817142486572266, "global_step": 591578, "epoch": 7127} {"train_loss": -28.474103927612305, "global_step": 591579, "epoch": 7127} {"train_loss": -28.18088722229004, "global_step": 591580, "epoch": 7127} {"train_loss": -28.120336532592773, "global_step": 591581, "epoch": 7127} {"train_loss": -28.393247604370117, "global_step": 591582, "epoch": 7127} {"train_loss": -28.119766235351562, "global_step": 591583, "epoch": 7127} {"train_loss": -27.96023941040039, "global_step": 591584, "epoch": 7127} {"train_loss": -28.253131866455078, "global_step": 591585, "epoch": 7127} {"train_loss": -28.113637924194336, "global_step": 591586, "epoch": 7127} {"train_loss": -28.072513580322266, "global_step": 591587, "epoch": 7127} {"train_loss": -28.30231285095215, "global_step": 591588, "epoch": 7127} {"train_loss": -28.209217071533203, "global_step": 591589, "epoch": 7127} {"train_loss": -28.300724029541016, "global_step": 591590, "epoch": 7127} {"train_loss": -27.8955078125, "global_step": 591591, "epoch": 7127} {"train_loss": -27.965595245361328, "global_step": 591592, "epoch": 7127} {"train_loss": -28.37318229675293, "global_step": 591593, "epoch": 7127} {"train_loss": -28.081281661987305, "global_step": 591594, "epoch": 7127} {"train_loss": -28.029943466186523, "global_step": 591595, "epoch": 7127} {"train_loss": -28.2703857421875, "global_step": 591596, "epoch": 7127} {"train_loss": -28.10736083984375, "global_step": 591597, "epoch": 7127} {"train_loss": -28.0681209564209, "global_step": 591598, "epoch": 7127} {"train_loss": -27.796157836914062, "global_step": 591599, "epoch": 7127} {"train_loss": -27.840620040893555, "global_step": 591600, "epoch": 7127} {"train_loss": -28.061649322509766, "global_step": 591601, "epoch": 7127} {"train_loss": -27.651336669921875, "global_step": 591602, "epoch": 7127} {"train_loss": -27.858041763305664, "global_step": 591603, "epoch": 7127} {"train_loss": -28.11899757385254, "global_step": 591604, "epoch": 7127} {"train_loss": -27.5767879486084, "global_step": 591605, "epoch": 7127} {"train_loss": -27.188495635986328, "global_step": 591606, "epoch": 7127} {"train_loss": -28.227014541625977, "global_step": 591607, "epoch": 7127} {"train_loss": -27.564157485961914, "global_step": 591608, "epoch": 7127} {"train_loss": -27.486682891845703, "global_step": 591609, "epoch": 7127} {"train_loss": -27.6728572845459, "global_step": 591610, "epoch": 7127} {"train_loss": -27.9567928314209, "global_step": 591611, "epoch": 7127} {"train_loss": -27.4022159576416, "global_step": 591612, "epoch": 7127} {"train_loss": -27.794763565063477, "global_step": 591613, "epoch": 7127} {"train_loss": -27.647321701049805, "global_step": 591614, "epoch": 7127} {"train_loss": -27.8749942779541, "global_step": 591615, "epoch": 7127} {"train_loss": -27.67671012878418, "global_step": 591616, "epoch": 7127} {"train_loss": -27.762372970581055, "global_step": 591617, "epoch": 7127} {"train_loss": -27.97322654724121, "global_step": 591618, "epoch": 7127} {"train_loss": -27.50844383239746, "global_step": 591619, "epoch": 7127} {"train_loss": -28.090717315673828, "global_step": 591620, "epoch": 7127} {"train_loss": -27.862869262695312, "global_step": 591621, "epoch": 7127} {"train_loss": -28.31806755065918, "global_step": 591622, "epoch": 7127} {"train_loss": -27.868229417915803, "global_step": 591623, "epoch": 7127, "val_loss": 6689198.0} {"train_loss": -27.547616958618164, "global_step": 591624, "epoch": 7128} {"train_loss": -26.307113647460938, "global_step": 591625, "epoch": 7128} {"train_loss": -27.131732940673828, "global_step": 591626, "epoch": 7128} {"train_loss": -27.15549659729004, "global_step": 591627, "epoch": 7128} {"train_loss": -27.909805297851562, "global_step": 591628, "epoch": 7128} {"train_loss": -27.064558029174805, "global_step": 591629, "epoch": 7128} {"train_loss": -27.014062881469727, "global_step": 591630, "epoch": 7128} {"train_loss": -27.755767822265625, "global_step": 591631, "epoch": 7128} {"train_loss": -27.19184684753418, "global_step": 591632, "epoch": 7128} {"train_loss": -27.620222091674805, "global_step": 591633, "epoch": 7128} {"train_loss": -27.194522857666016, "global_step": 591634, "epoch": 7128} {"train_loss": -27.608617782592773, "global_step": 591635, "epoch": 7128} {"train_loss": -27.3609561920166, "global_step": 591636, "epoch": 7128} {"train_loss": -27.46014404296875, "global_step": 591637, "epoch": 7128} {"train_loss": -27.72962760925293, "global_step": 591638, "epoch": 7128} {"train_loss": -27.478097915649414, "global_step": 591639, "epoch": 7128} {"train_loss": -27.1519718170166, "global_step": 591640, "epoch": 7128} {"train_loss": -27.880512237548828, "global_step": 591641, "epoch": 7128} {"train_loss": -27.47340202331543, "global_step": 591642, "epoch": 7128} {"train_loss": -27.95792579650879, "global_step": 591643, "epoch": 7128} {"train_loss": -27.5661563873291, "global_step": 591644, "epoch": 7128} {"train_loss": -27.702497482299805, "global_step": 591645, "epoch": 7128} {"train_loss": -27.437314987182617, "global_step": 591646, "epoch": 7128} {"train_loss": -28.000381469726562, "global_step": 591647, "epoch": 7128} {"train_loss": -27.512853622436523, "global_step": 591648, "epoch": 7128} {"train_loss": -27.971561431884766, "global_step": 591649, "epoch": 7128} {"train_loss": -27.99191665649414, "global_step": 591650, "epoch": 7128} {"train_loss": -27.81634521484375, "global_step": 591651, "epoch": 7128} {"train_loss": -27.94891357421875, "global_step": 591652, "epoch": 7128} {"train_loss": -28.07801628112793, "global_step": 591653, "epoch": 7128} {"train_loss": -27.923437118530273, "global_step": 591654, "epoch": 7128} {"train_loss": -27.977930068969727, "global_step": 591655, "epoch": 7128} {"train_loss": -28.135522842407227, "global_step": 591656, "epoch": 7128} {"train_loss": -27.948881149291992, "global_step": 591657, "epoch": 7128} {"train_loss": -28.054889678955078, "global_step": 591658, "epoch": 7128} {"train_loss": -27.88653564453125, "global_step": 591659, "epoch": 7128} {"train_loss": -27.964582443237305, "global_step": 591660, "epoch": 7128} {"train_loss": -28.37848472595215, "global_step": 591661, "epoch": 7128} {"train_loss": -28.056421279907227, "global_step": 591662, "epoch": 7128} {"train_loss": -28.044408798217773, "global_step": 591663, "epoch": 7128} {"train_loss": -27.77646255493164, "global_step": 591664, "epoch": 7128} {"train_loss": -28.090131759643555, "global_step": 591665, "epoch": 7128} {"train_loss": -27.777891159057617, "global_step": 591666, "epoch": 7128} {"train_loss": -28.011627197265625, "global_step": 591667, "epoch": 7128} {"train_loss": -27.8603458404541, "global_step": 591668, "epoch": 7128} {"train_loss": -27.888940811157227, "global_step": 591669, "epoch": 7128} {"train_loss": -28.320154190063477, "global_step": 591670, "epoch": 7128} {"train_loss": -28.84783935546875, "global_step": 591671, "epoch": 7128} {"train_loss": -27.894210815429688, "global_step": 591672, "epoch": 7128} {"train_loss": -28.0034122467041, "global_step": 591673, "epoch": 7128} {"train_loss": -28.25799560546875, "global_step": 591674, "epoch": 7128} {"train_loss": -28.291946411132812, "global_step": 591675, "epoch": 7128} {"train_loss": -28.103857040405273, "global_step": 591676, "epoch": 7128} {"train_loss": -28.46882438659668, "global_step": 591677, "epoch": 7128} {"train_loss": -28.24025535583496, "global_step": 591678, "epoch": 7128} {"train_loss": -28.38800048828125, "global_step": 591679, "epoch": 7128} {"train_loss": -28.308441162109375, "global_step": 591680, "epoch": 7128} {"train_loss": -28.382984161376953, "global_step": 591681, "epoch": 7128} {"train_loss": -28.41718864440918, "global_step": 591682, "epoch": 7128} {"train_loss": -27.87625503540039, "global_step": 591683, "epoch": 7128} {"train_loss": -28.117359161376953, "global_step": 591684, "epoch": 7128} {"train_loss": -28.275617599487305, "global_step": 591685, "epoch": 7128} {"train_loss": -28.26478385925293, "global_step": 591686, "epoch": 7128} {"train_loss": -28.283140182495117, "global_step": 591687, "epoch": 7128} {"train_loss": -27.916852951049805, "global_step": 591688, "epoch": 7128} {"train_loss": -28.313756942749023, "global_step": 591689, "epoch": 7128} {"train_loss": -28.624359130859375, "global_step": 591690, "epoch": 7128} {"train_loss": -28.225011825561523, "global_step": 591691, "epoch": 7128} {"train_loss": -28.295392990112305, "global_step": 591692, "epoch": 7128} {"train_loss": -28.238447189331055, "global_step": 591693, "epoch": 7128} {"train_loss": -28.301502227783203, "global_step": 591694, "epoch": 7128} {"train_loss": -28.39460563659668, "global_step": 591695, "epoch": 7128} {"train_loss": -28.27585220336914, "global_step": 591696, "epoch": 7128} {"train_loss": -28.031591415405273, "global_step": 591697, "epoch": 7128} {"train_loss": -27.84722900390625, "global_step": 591698, "epoch": 7128} {"train_loss": -27.943002700805664, "global_step": 591699, "epoch": 7128} {"train_loss": -27.721677780151367, "global_step": 591700, "epoch": 7128} {"train_loss": -27.939245223999023, "global_step": 591701, "epoch": 7128} {"train_loss": -27.664011001586914, "global_step": 591702, "epoch": 7128} {"train_loss": -27.82813835144043, "global_step": 591703, "epoch": 7128} {"train_loss": -27.7213077545166, "global_step": 591704, "epoch": 7128} {"train_loss": -27.999677658081055, "global_step": 591705, "epoch": 7128} {"train_loss": -27.905021299798804, "global_step": 591706, "epoch": 7128, "val_loss": 6566374.0} {"train_loss": -26.97591209411621, "global_step": 591707, "epoch": 7129} {"train_loss": -26.758264541625977, "global_step": 591708, "epoch": 7129} {"train_loss": -27.525503158569336, "global_step": 591709, "epoch": 7129} {"train_loss": -26.909116744995117, "global_step": 591710, "epoch": 7129} {"train_loss": -27.247547149658203, "global_step": 591711, "epoch": 7129} {"train_loss": -28.03717041015625, "global_step": 591712, "epoch": 7129} {"train_loss": -27.455921173095703, "global_step": 591713, "epoch": 7129} {"train_loss": -27.729522705078125, "global_step": 591714, "epoch": 7129} {"train_loss": -27.33167839050293, "global_step": 591715, "epoch": 7129} {"train_loss": -27.413288116455078, "global_step": 591716, "epoch": 7129} {"train_loss": -27.251544952392578, "global_step": 591717, "epoch": 7129} {"train_loss": -27.706998825073242, "global_step": 591718, "epoch": 7129} {"train_loss": -27.37698745727539, "global_step": 591719, "epoch": 7129} {"train_loss": -28.079345703125, "global_step": 591720, "epoch": 7129} {"train_loss": -27.860681533813477, "global_step": 591721, "epoch": 7129} {"train_loss": -27.88274574279785, "global_step": 591722, "epoch": 7129} {"train_loss": -28.26441764831543, "global_step": 591723, "epoch": 7129} {"train_loss": -27.595972061157227, "global_step": 591724, "epoch": 7129} {"train_loss": -28.23797607421875, "global_step": 591725, "epoch": 7129} {"train_loss": -27.69464111328125, "global_step": 591726, "epoch": 7129} {"train_loss": -28.114002227783203, "global_step": 591727, "epoch": 7129} {"train_loss": -27.991437911987305, "global_step": 591728, "epoch": 7129} {"train_loss": -27.670312881469727, "global_step": 591729, "epoch": 7129} {"train_loss": -28.1005916595459, "global_step": 591730, "epoch": 7129} {"train_loss": -28.020736694335938, "global_step": 591731, "epoch": 7129} {"train_loss": -27.910980224609375, "global_step": 591732, "epoch": 7129} {"train_loss": -28.178380966186523, "global_step": 591733, "epoch": 7129} {"train_loss": -27.811420440673828, "global_step": 591734, "epoch": 7129} {"train_loss": -27.948047637939453, "global_step": 591735, "epoch": 7129} {"train_loss": -27.885969161987305, "global_step": 591736, "epoch": 7129} {"train_loss": -27.7331485748291, "global_step": 591737, "epoch": 7129} {"train_loss": -28.15461540222168, "global_step": 591738, "epoch": 7129} {"train_loss": -27.981327056884766, "global_step": 591739, "epoch": 7129} {"train_loss": -28.359827041625977, "global_step": 591740, "epoch": 7129} {"train_loss": -28.044050216674805, "global_step": 591741, "epoch": 7129} {"train_loss": -28.23027992248535, "global_step": 591742, "epoch": 7129} {"train_loss": -27.97003746032715, "global_step": 591743, "epoch": 7129} {"train_loss": -28.370014190673828, "global_step": 591744, "epoch": 7129} {"train_loss": -28.01569175720215, "global_step": 591745, "epoch": 7129} {"train_loss": -28.24114418029785, "global_step": 591746, "epoch": 7129} {"train_loss": -28.3120174407959, "global_step": 591747, "epoch": 7129} {"train_loss": -27.77827262878418, "global_step": 591748, "epoch": 7129} {"train_loss": -28.383380889892578, "global_step": 591749, "epoch": 7129} {"train_loss": -28.24135398864746, "global_step": 591750, "epoch": 7129} {"train_loss": -28.19489860534668, "global_step": 591751, "epoch": 7129} {"train_loss": -28.218839645385742, "global_step": 591752, "epoch": 7129} {"train_loss": -28.228290557861328, "global_step": 591753, "epoch": 7129} {"train_loss": -28.447935104370117, "global_step": 591754, "epoch": 7129} {"train_loss": -28.226367950439453, "global_step": 591755, "epoch": 7129} {"train_loss": -28.238378524780273, "global_step": 591756, "epoch": 7129} {"train_loss": -28.285795211791992, "global_step": 591757, "epoch": 7129} {"train_loss": -28.05097007751465, "global_step": 591758, "epoch": 7129} {"train_loss": -28.065326690673828, "global_step": 591759, "epoch": 7129} {"train_loss": -27.9056339263916, "global_step": 591760, "epoch": 7129} {"train_loss": -28.031391143798828, "global_step": 591761, "epoch": 7129} {"train_loss": -27.847326278686523, "global_step": 591762, "epoch": 7129} {"train_loss": -28.402013778686523, "global_step": 591763, "epoch": 7129} {"train_loss": -28.338348388671875, "global_step": 591764, "epoch": 7129} {"train_loss": -28.20660400390625, "global_step": 591765, "epoch": 7129} {"train_loss": -28.192777633666992, "global_step": 591766, "epoch": 7129} {"train_loss": -28.313444137573242, "global_step": 591767, "epoch": 7129} {"train_loss": -28.128192901611328, "global_step": 591768, "epoch": 7129} {"train_loss": -27.97808265686035, "global_step": 591769, "epoch": 7129} {"train_loss": -27.572797775268555, "global_step": 591770, "epoch": 7129} {"train_loss": -27.629180908203125, "global_step": 591771, "epoch": 7129} {"train_loss": -26.6290225982666, "global_step": 591772, "epoch": 7129} {"train_loss": -23.737567901611328, "global_step": 591773, "epoch": 7129} {"train_loss": -22.217008590698242, "global_step": 591774, "epoch": 7129} {"train_loss": -25.6289005279541, "global_step": 591775, "epoch": 7129} {"train_loss": -26.796735763549805, "global_step": 591776, "epoch": 7129} {"train_loss": -26.166601181030273, "global_step": 591777, "epoch": 7129} {"train_loss": -26.025110244750977, "global_step": 591778, "epoch": 7129} {"train_loss": -27.09528923034668, "global_step": 591779, "epoch": 7129} {"train_loss": -26.45366859436035, "global_step": 591780, "epoch": 7129} {"train_loss": -26.97556495666504, "global_step": 591781, "epoch": 7129} {"train_loss": -27.123981475830078, "global_step": 591782, "epoch": 7129} {"train_loss": -26.786558151245117, "global_step": 591783, "epoch": 7129} {"train_loss": -26.99629020690918, "global_step": 591784, "epoch": 7129} {"train_loss": -27.413970947265625, "global_step": 591785, "epoch": 7129} {"train_loss": -27.166370391845703, "global_step": 591786, "epoch": 7129} {"train_loss": -26.88160514831543, "global_step": 591787, "epoch": 7129} {"train_loss": -27.258649826049805, "global_step": 591788, "epoch": 7129} {"train_loss": -27.59280799957643, "global_step": 591789, "epoch": 7129, "val_loss": 6640762.5} {"train_loss": -27.02144432067871, "global_step": 591790, "epoch": 7130} {"train_loss": -26.368711471557617, "global_step": 591791, "epoch": 7130} {"train_loss": -27.067235946655273, "global_step": 591792, "epoch": 7130} {"train_loss": -27.156341552734375, "global_step": 591793, "epoch": 7130} {"train_loss": -26.557086944580078, "global_step": 591794, "epoch": 7130} {"train_loss": -27.002063751220703, "global_step": 591795, "epoch": 7130} {"train_loss": -26.888595581054688, "global_step": 591796, "epoch": 7130} {"train_loss": -26.728967666625977, "global_step": 591797, "epoch": 7130} {"train_loss": -27.035364151000977, "global_step": 591798, "epoch": 7130} {"train_loss": -26.961761474609375, "global_step": 591799, "epoch": 7130} {"train_loss": -26.917566299438477, "global_step": 591800, "epoch": 7130} {"train_loss": -26.91448974609375, "global_step": 591801, "epoch": 7130} {"train_loss": -26.938629150390625, "global_step": 591802, "epoch": 7130} {"train_loss": -27.605009078979492, "global_step": 591803, "epoch": 7130} {"train_loss": -27.1995849609375, "global_step": 591804, "epoch": 7130} {"train_loss": -27.1956729888916, "global_step": 591805, "epoch": 7130} {"train_loss": -27.326623916625977, "global_step": 591806, "epoch": 7130} {"train_loss": -27.6463565826416, "global_step": 591807, "epoch": 7130} {"train_loss": -27.63079833984375, "global_step": 591808, "epoch": 7130} {"train_loss": -27.763568878173828, "global_step": 591809, "epoch": 7130} {"train_loss": -27.42848014831543, "global_step": 591810, "epoch": 7130} {"train_loss": -27.81324577331543, "global_step": 591811, "epoch": 7130} {"train_loss": -27.647680282592773, "global_step": 591812, "epoch": 7130} {"train_loss": -27.411563873291016, "global_step": 591813, "epoch": 7130} {"train_loss": -27.793872833251953, "global_step": 591814, "epoch": 7130} {"train_loss": -27.7243595123291, "global_step": 591815, "epoch": 7130} {"train_loss": -27.916610717773438, "global_step": 591816, "epoch": 7130} {"train_loss": -27.852956771850586, "global_step": 591817, "epoch": 7130} {"train_loss": -27.6722412109375, "global_step": 591818, "epoch": 7130} {"train_loss": -27.49700355529785, "global_step": 591819, "epoch": 7130} {"train_loss": -28.08461570739746, "global_step": 591820, "epoch": 7130} {"train_loss": -27.68975830078125, "global_step": 591821, "epoch": 7130} {"train_loss": -28.26141357421875, "global_step": 591822, "epoch": 7130} {"train_loss": -28.058340072631836, "global_step": 591823, "epoch": 7130} {"train_loss": -27.88465690612793, "global_step": 591824, "epoch": 7130} {"train_loss": -27.650415420532227, "global_step": 591825, "epoch": 7130} {"train_loss": -27.980121612548828, "global_step": 591826, "epoch": 7130} {"train_loss": -27.970129013061523, "global_step": 591827, "epoch": 7130} {"train_loss": -27.94733238220215, "global_step": 591828, "epoch": 7130} {"train_loss": -27.983123779296875, "global_step": 591829, "epoch": 7130} {"train_loss": -27.797199249267578, "global_step": 591830, "epoch": 7130} {"train_loss": -28.107715606689453, "global_step": 591831, "epoch": 7130} {"train_loss": -28.006610870361328, "global_step": 591832, "epoch": 7130} {"train_loss": -27.82895851135254, "global_step": 591833, "epoch": 7130} {"train_loss": -27.99502944946289, "global_step": 591834, "epoch": 7130} {"train_loss": -28.264698028564453, "global_step": 591835, "epoch": 7130} {"train_loss": -27.404993057250977, "global_step": 591836, "epoch": 7130} {"train_loss": -28.095294952392578, "global_step": 591837, "epoch": 7130} {"train_loss": -27.640302658081055, "global_step": 591838, "epoch": 7130} {"train_loss": -27.973072052001953, "global_step": 591839, "epoch": 7130} {"train_loss": -27.731542587280273, "global_step": 591840, "epoch": 7130} {"train_loss": -27.9138126373291, "global_step": 591841, "epoch": 7130} {"train_loss": -27.785192489624023, "global_step": 591842, "epoch": 7130} {"train_loss": -27.505523681640625, "global_step": 591843, "epoch": 7130} {"train_loss": -27.805994033813477, "global_step": 591844, "epoch": 7130} {"train_loss": -27.82887077331543, "global_step": 591845, "epoch": 7130} {"train_loss": -27.72767448425293, "global_step": 591846, "epoch": 7130} {"train_loss": -27.84242057800293, "global_step": 591847, "epoch": 7130} {"train_loss": -27.73383140563965, "global_step": 591848, "epoch": 7130} {"train_loss": -27.472965240478516, "global_step": 591849, "epoch": 7130} {"train_loss": -28.195526123046875, "global_step": 591850, "epoch": 7130} {"train_loss": -27.679304122924805, "global_step": 591851, "epoch": 7130} {"train_loss": -27.798145294189453, "global_step": 591852, "epoch": 7130} {"train_loss": -28.23280143737793, "global_step": 591853, "epoch": 7130} {"train_loss": -27.71687126159668, "global_step": 591854, "epoch": 7130} {"train_loss": -27.24942970275879, "global_step": 591855, "epoch": 7130} {"train_loss": -27.427221298217773, "global_step": 591856, "epoch": 7130} {"train_loss": -27.65557861328125, "global_step": 591857, "epoch": 7130} {"train_loss": -27.039838790893555, "global_step": 591858, "epoch": 7130} {"train_loss": -27.82892417907715, "global_step": 591859, "epoch": 7130} {"train_loss": -27.6015682220459, "global_step": 591860, "epoch": 7130} {"train_loss": -27.393354415893555, "global_step": 591861, "epoch": 7130} {"train_loss": -27.658344268798828, "global_step": 591862, "epoch": 7130} {"train_loss": -27.490875244140625, "global_step": 591863, "epoch": 7130} {"train_loss": -27.65940284729004, "global_step": 591864, "epoch": 7130} {"train_loss": -27.81585121154785, "global_step": 591865, "epoch": 7130} {"train_loss": -27.744720458984375, "global_step": 591866, "epoch": 7130} {"train_loss": -27.841144561767578, "global_step": 591867, "epoch": 7130} {"train_loss": -28.041059494018555, "global_step": 591868, "epoch": 7130} {"train_loss": -27.62788200378418, "global_step": 591869, "epoch": 7130} {"train_loss": -27.669452667236328, "global_step": 591870, "epoch": 7130} {"train_loss": -27.871173858642578, "global_step": 591871, "epoch": 7130} {"train_loss": -27.60642033312694, "global_step": 591872, "epoch": 7130, "val_loss": 6545240.0} {"train_loss": -27.595666885375977, "global_step": 591873, "epoch": 7131} {"train_loss": -27.30936622619629, "global_step": 591874, "epoch": 7131} {"train_loss": -27.5902099609375, "global_step": 591875, "epoch": 7131} {"train_loss": -27.42933464050293, "global_step": 591876, "epoch": 7131} {"train_loss": -27.722381591796875, "global_step": 591877, "epoch": 7131} {"train_loss": -27.912240982055664, "global_step": 591878, "epoch": 7131} {"train_loss": -27.717315673828125, "global_step": 591879, "epoch": 7131} {"train_loss": -27.759033203125, "global_step": 591880, "epoch": 7131} {"train_loss": -27.81731605529785, "global_step": 591881, "epoch": 7131} {"train_loss": -27.79627799987793, "global_step": 591882, "epoch": 7131} {"train_loss": -27.937274932861328, "global_step": 591883, "epoch": 7131} {"train_loss": -27.727249145507812, "global_step": 591884, "epoch": 7131} {"train_loss": -27.868061065673828, "global_step": 591885, "epoch": 7131} {"train_loss": -27.720611572265625, "global_step": 591886, "epoch": 7131} {"train_loss": -27.9730281829834, "global_step": 591887, "epoch": 7131} {"train_loss": -28.46225357055664, "global_step": 591888, "epoch": 7131} {"train_loss": -27.571460723876953, "global_step": 591889, "epoch": 7131} {"train_loss": -28.197134017944336, "global_step": 591890, "epoch": 7131} {"train_loss": -27.789737701416016, "global_step": 591891, "epoch": 7131} {"train_loss": -28.04807472229004, "global_step": 591892, "epoch": 7131} {"train_loss": -27.855833053588867, "global_step": 591893, "epoch": 7131} {"train_loss": -27.75823402404785, "global_step": 591894, "epoch": 7131} {"train_loss": -28.19635009765625, "global_step": 591895, "epoch": 7131} {"train_loss": -27.890869140625, "global_step": 591896, "epoch": 7131} {"train_loss": -28.141082763671875, "global_step": 591897, "epoch": 7131} {"train_loss": -28.052968978881836, "global_step": 591898, "epoch": 7131} {"train_loss": -28.303476333618164, "global_step": 591899, "epoch": 7131} {"train_loss": -28.440540313720703, "global_step": 591900, "epoch": 7131} {"train_loss": -28.082956314086914, "global_step": 591901, "epoch": 7131} {"train_loss": -28.2042236328125, "global_step": 591902, "epoch": 7131} {"train_loss": -28.166257858276367, "global_step": 591903, "epoch": 7131} {"train_loss": -27.696701049804688, "global_step": 591904, "epoch": 7131} {"train_loss": -28.27411460876465, "global_step": 591905, "epoch": 7131} {"train_loss": -28.109333038330078, "global_step": 591906, "epoch": 7131} {"train_loss": -28.03800392150879, "global_step": 591907, "epoch": 7131} {"train_loss": -28.176483154296875, "global_step": 591908, "epoch": 7131} {"train_loss": -27.768817901611328, "global_step": 591909, "epoch": 7131} {"train_loss": -28.336688995361328, "global_step": 591910, "epoch": 7131} {"train_loss": -28.16937828063965, "global_step": 591911, "epoch": 7131} {"train_loss": -28.055078506469727, "global_step": 591912, "epoch": 7131} {"train_loss": -27.826181411743164, "global_step": 591913, "epoch": 7131} {"train_loss": -28.2194766998291, "global_step": 591914, "epoch": 7131} {"train_loss": -28.060293197631836, "global_step": 591915, "epoch": 7131} {"train_loss": -28.052734375, "global_step": 591916, "epoch": 7131} {"train_loss": -27.67424964904785, "global_step": 591917, "epoch": 7131} {"train_loss": -27.960834503173828, "global_step": 591918, "epoch": 7131} {"train_loss": -28.058324813842773, "global_step": 591919, "epoch": 7131} {"train_loss": -27.637739181518555, "global_step": 591920, "epoch": 7131} {"train_loss": -27.47681999206543, "global_step": 591921, "epoch": 7131} {"train_loss": -27.329059600830078, "global_step": 591922, "epoch": 7131} {"train_loss": -26.60384178161621, "global_step": 591923, "epoch": 7131} {"train_loss": -27.347814559936523, "global_step": 591924, "epoch": 7131} {"train_loss": -27.346359252929688, "global_step": 591925, "epoch": 7131} {"train_loss": -27.7299861907959, "global_step": 591926, "epoch": 7131} {"train_loss": -27.578815460205078, "global_step": 591927, "epoch": 7131} {"train_loss": -27.916669845581055, "global_step": 591928, "epoch": 7131} {"train_loss": -27.89043617248535, "global_step": 591929, "epoch": 7131} {"train_loss": -27.829986572265625, "global_step": 591930, "epoch": 7131} {"train_loss": -27.58526039123535, "global_step": 591931, "epoch": 7131} {"train_loss": -27.7272891998291, "global_step": 591932, "epoch": 7131} {"train_loss": -27.660078048706055, "global_step": 591933, "epoch": 7131} {"train_loss": -27.79402732849121, "global_step": 591934, "epoch": 7131} {"train_loss": -28.1915340423584, "global_step": 591935, "epoch": 7131} {"train_loss": -27.80537223815918, "global_step": 591936, "epoch": 7131} {"train_loss": -27.98444175720215, "global_step": 591937, "epoch": 7131} {"train_loss": -27.777082443237305, "global_step": 591938, "epoch": 7131} {"train_loss": -28.346723556518555, "global_step": 591939, "epoch": 7131} {"train_loss": -28.166833877563477, "global_step": 591940, "epoch": 7131} {"train_loss": -28.22185707092285, "global_step": 591941, "epoch": 7131} {"train_loss": -27.90275001525879, "global_step": 591942, "epoch": 7131} {"train_loss": -27.98908042907715, "global_step": 591943, "epoch": 7131} {"train_loss": -27.857208251953125, "global_step": 591944, "epoch": 7131} {"train_loss": -28.011205673217773, "global_step": 591945, "epoch": 7131} {"train_loss": -28.2486629486084, "global_step": 591946, "epoch": 7131} {"train_loss": -28.034727096557617, "global_step": 591947, "epoch": 7131} {"train_loss": -27.769819259643555, "global_step": 591948, "epoch": 7131} {"train_loss": -28.10758399963379, "global_step": 591949, "epoch": 7131} {"train_loss": -27.994186401367188, "global_step": 591950, "epoch": 7131} {"train_loss": -28.045602798461914, "global_step": 591951, "epoch": 7131} {"train_loss": -28.3869686126709, "global_step": 591952, "epoch": 7131} {"train_loss": -28.312747955322266, "global_step": 591953, "epoch": 7131} {"train_loss": -28.123891830444336, "global_step": 591954, "epoch": 7131} {"train_loss": -27.91751491592591, "global_step": 591955, "epoch": 7131, "val_loss": 6451086.0} {"train_loss": -27.150938034057617, "global_step": 591956, "epoch": 7132} {"train_loss": -27.288843154907227, "global_step": 591957, "epoch": 7132} {"train_loss": -27.123310089111328, "global_step": 591958, "epoch": 7132} {"train_loss": -27.547107696533203, "global_step": 591959, "epoch": 7132} {"train_loss": -27.097150802612305, "global_step": 591960, "epoch": 7132} {"train_loss": -27.681528091430664, "global_step": 591961, "epoch": 7132} {"train_loss": -27.63360595703125, "global_step": 591962, "epoch": 7132} {"train_loss": -26.826398849487305, "global_step": 591963, "epoch": 7132} {"train_loss": -27.059650421142578, "global_step": 591964, "epoch": 7132} {"train_loss": -27.169652938842773, "global_step": 591965, "epoch": 7132} {"train_loss": -27.497913360595703, "global_step": 591966, "epoch": 7132} {"train_loss": -27.53261375427246, "global_step": 591967, "epoch": 7132} {"train_loss": -27.273529052734375, "global_step": 591968, "epoch": 7132} {"train_loss": -27.422632217407227, "global_step": 591969, "epoch": 7132} {"train_loss": -27.441110610961914, "global_step": 591970, "epoch": 7132} {"train_loss": -27.671483993530273, "global_step": 591971, "epoch": 7132} {"train_loss": -27.658605575561523, "global_step": 591972, "epoch": 7132} {"train_loss": -27.881397247314453, "global_step": 591973, "epoch": 7132} {"train_loss": -28.01887321472168, "global_step": 591974, "epoch": 7132} {"train_loss": -27.58430290222168, "global_step": 591975, "epoch": 7132} {"train_loss": -27.81605339050293, "global_step": 591976, "epoch": 7132} {"train_loss": -27.81879234313965, "global_step": 591977, "epoch": 7132} {"train_loss": -27.6263370513916, "global_step": 591978, "epoch": 7132} {"train_loss": -27.88408851623535, "global_step": 591979, "epoch": 7132} {"train_loss": -27.696813583374023, "global_step": 591980, "epoch": 7132} {"train_loss": -27.652191162109375, "global_step": 591981, "epoch": 7132} {"train_loss": -28.306745529174805, "global_step": 591982, "epoch": 7132} {"train_loss": -27.706436157226562, "global_step": 591983, "epoch": 7132} {"train_loss": -27.99833106994629, "global_step": 591984, "epoch": 7132} {"train_loss": -27.85800552368164, "global_step": 591985, "epoch": 7132} {"train_loss": -27.96196937561035, "global_step": 591986, "epoch": 7132} {"train_loss": -28.055450439453125, "global_step": 591987, "epoch": 7132} {"train_loss": -27.726367950439453, "global_step": 591988, "epoch": 7132} {"train_loss": -28.334272384643555, "global_step": 591989, "epoch": 7132} {"train_loss": -27.57002067565918, "global_step": 591990, "epoch": 7132} {"train_loss": -27.78461265563965, "global_step": 591991, "epoch": 7132} {"train_loss": -27.913379669189453, "global_step": 591992, "epoch": 7132} {"train_loss": -27.976682662963867, "global_step": 591993, "epoch": 7132} {"train_loss": -27.8840389251709, "global_step": 591994, "epoch": 7132} {"train_loss": -28.04302978515625, "global_step": 591995, "epoch": 7132} {"train_loss": -28.444049835205078, "global_step": 591996, "epoch": 7132} {"train_loss": -28.32631492614746, "global_step": 591997, "epoch": 7132} {"train_loss": -27.87872886657715, "global_step": 591998, "epoch": 7132} {"train_loss": -28.047536849975586, "global_step": 591999, "epoch": 7132} {"train_loss": -28.273941040039062, "global_step": 592000, "epoch": 7132} {"train_loss": -28.2298583984375, "global_step": 592001, "epoch": 7132} {"train_loss": -27.798572540283203, "global_step": 592002, "epoch": 7132} {"train_loss": -27.811567306518555, "global_step": 592003, "epoch": 7132} {"train_loss": -28.16241455078125, "global_step": 592004, "epoch": 7132} {"train_loss": -28.372411727905273, "global_step": 592005, "epoch": 7132} {"train_loss": -28.568561553955078, "global_step": 592006, "epoch": 7132} {"train_loss": -28.092727661132812, "global_step": 592007, "epoch": 7132} {"train_loss": -28.070158004760742, "global_step": 592008, "epoch": 7132} {"train_loss": -28.35877799987793, "global_step": 592009, "epoch": 7132} {"train_loss": -28.396942138671875, "global_step": 592010, "epoch": 7132} {"train_loss": -28.311939239501953, "global_step": 592011, "epoch": 7132} {"train_loss": -28.434585571289062, "global_step": 592012, "epoch": 7132} {"train_loss": -28.06134605407715, "global_step": 592013, "epoch": 7132} {"train_loss": -27.967885971069336, "global_step": 592014, "epoch": 7132} {"train_loss": -27.768415451049805, "global_step": 592015, "epoch": 7132} {"train_loss": -27.78474235534668, "global_step": 592016, "epoch": 7132} {"train_loss": -27.509937286376953, "global_step": 592017, "epoch": 7132} {"train_loss": -28.259002685546875, "global_step": 592018, "epoch": 7132} {"train_loss": -28.65753173828125, "global_step": 592019, "epoch": 7132} {"train_loss": -28.013792037963867, "global_step": 592020, "epoch": 7132} {"train_loss": -27.96973991394043, "global_step": 592021, "epoch": 7132} {"train_loss": -28.016233444213867, "global_step": 592022, "epoch": 7132} {"train_loss": -27.54733657836914, "global_step": 592023, "epoch": 7132} {"train_loss": -27.419416427612305, "global_step": 592024, "epoch": 7132} {"train_loss": -27.61433219909668, "global_step": 592025, "epoch": 7132} {"train_loss": -27.917591094970703, "global_step": 592026, "epoch": 7132} {"train_loss": -28.047876358032227, "global_step": 592027, "epoch": 7132} {"train_loss": -28.205297470092773, "global_step": 592028, "epoch": 7132} {"train_loss": -28.03627586364746, "global_step": 592029, "epoch": 7132} {"train_loss": -28.25552749633789, "global_step": 592030, "epoch": 7132} {"train_loss": -28.06568717956543, "global_step": 592031, "epoch": 7132} {"train_loss": -28.1680908203125, "global_step": 592032, "epoch": 7132} {"train_loss": -28.158294677734375, "global_step": 592033, "epoch": 7132} {"train_loss": -28.01453971862793, "global_step": 592034, "epoch": 7132} {"train_loss": -27.867996215820312, "global_step": 592035, "epoch": 7132} {"train_loss": -27.91929054260254, "global_step": 592036, "epoch": 7132} {"train_loss": -28.186925888061523, "global_step": 592037, "epoch": 7132} {"train_loss": -27.871830492134553, "global_step": 592038, "epoch": 7132, "val_loss": 6554439.0} {"train_loss": -27.588825225830078, "global_step": 592039, "epoch": 7133} {"train_loss": -28.219552993774414, "global_step": 592040, "epoch": 7133} {"train_loss": -27.515522003173828, "global_step": 592041, "epoch": 7133} {"train_loss": -26.697988510131836, "global_step": 592042, "epoch": 7133} {"train_loss": -27.196012496948242, "global_step": 592043, "epoch": 7133} {"train_loss": -27.610736846923828, "global_step": 592044, "epoch": 7133} {"train_loss": -27.34893798828125, "global_step": 592045, "epoch": 7133} {"train_loss": -27.66831398010254, "global_step": 592046, "epoch": 7133} {"train_loss": -27.243383407592773, "global_step": 592047, "epoch": 7133} {"train_loss": -27.742267608642578, "global_step": 592048, "epoch": 7133} {"train_loss": -27.424535751342773, "global_step": 592049, "epoch": 7133} {"train_loss": -27.19331169128418, "global_step": 592050, "epoch": 7133} {"train_loss": -27.56325340270996, "global_step": 592051, "epoch": 7133} {"train_loss": -27.829343795776367, "global_step": 592052, "epoch": 7133} {"train_loss": -27.501373291015625, "global_step": 592053, "epoch": 7133} {"train_loss": -27.75967788696289, "global_step": 592054, "epoch": 7133} {"train_loss": -27.731122970581055, "global_step": 592055, "epoch": 7133} {"train_loss": -27.476348876953125, "global_step": 592056, "epoch": 7133} {"train_loss": -27.992145538330078, "global_step": 592057, "epoch": 7133} {"train_loss": -27.490747451782227, "global_step": 592058, "epoch": 7133} {"train_loss": -27.777149200439453, "global_step": 592059, "epoch": 7133} {"train_loss": -28.172033309936523, "global_step": 592060, "epoch": 7133} {"train_loss": -27.719379425048828, "global_step": 592061, "epoch": 7133} {"train_loss": -27.791370391845703, "global_step": 592062, "epoch": 7133} {"train_loss": -27.7962646484375, "global_step": 592063, "epoch": 7133} {"train_loss": -27.964126586914062, "global_step": 592064, "epoch": 7133} {"train_loss": -27.96732521057129, "global_step": 592065, "epoch": 7133} {"train_loss": -27.989730834960938, "global_step": 592066, "epoch": 7133} {"train_loss": -27.9945068359375, "global_step": 592067, "epoch": 7133} {"train_loss": -27.9643497467041, "global_step": 592068, "epoch": 7133} {"train_loss": -27.8039493560791, "global_step": 592069, "epoch": 7133} {"train_loss": -27.556241989135742, "global_step": 592070, "epoch": 7133} {"train_loss": -27.64316177368164, "global_step": 592071, "epoch": 7133} {"train_loss": -28.021432876586914, "global_step": 592072, "epoch": 7133} {"train_loss": -27.874902725219727, "global_step": 592073, "epoch": 7133} {"train_loss": -27.944141387939453, "global_step": 592074, "epoch": 7133} {"train_loss": -27.590686798095703, "global_step": 592075, "epoch": 7133} {"train_loss": -27.542627334594727, "global_step": 592076, "epoch": 7133} {"train_loss": -28.221891403198242, "global_step": 592077, "epoch": 7133} {"train_loss": -28.068876266479492, "global_step": 592078, "epoch": 7133} {"train_loss": -28.347375869750977, "global_step": 592079, "epoch": 7133} {"train_loss": -28.235279083251953, "global_step": 592080, "epoch": 7133} {"train_loss": -28.013906478881836, "global_step": 592081, "epoch": 7133} {"train_loss": -28.26361656188965, "global_step": 592082, "epoch": 7133} {"train_loss": -28.15047264099121, "global_step": 592083, "epoch": 7133} {"train_loss": -28.040430068969727, "global_step": 592084, "epoch": 7133} {"train_loss": -28.02425193786621, "global_step": 592085, "epoch": 7133} {"train_loss": -28.058263778686523, "global_step": 592086, "epoch": 7133} {"train_loss": -28.0050106048584, "global_step": 592087, "epoch": 7133} {"train_loss": -28.03955078125, "global_step": 592088, "epoch": 7133} {"train_loss": -28.140579223632812, "global_step": 592089, "epoch": 7133} {"train_loss": -28.415969848632812, "global_step": 592090, "epoch": 7133} {"train_loss": -28.22336196899414, "global_step": 592091, "epoch": 7133} {"train_loss": -27.861648559570312, "global_step": 592092, "epoch": 7133} {"train_loss": -28.075214385986328, "global_step": 592093, "epoch": 7133} {"train_loss": -27.988937377929688, "global_step": 592094, "epoch": 7133} {"train_loss": -27.544727325439453, "global_step": 592095, "epoch": 7133} {"train_loss": -26.721237182617188, "global_step": 592096, "epoch": 7133} {"train_loss": -26.171833038330078, "global_step": 592097, "epoch": 7133} {"train_loss": -27.653003692626953, "global_step": 592098, "epoch": 7133} {"train_loss": -27.465139389038086, "global_step": 592099, "epoch": 7133} {"train_loss": -27.25848960876465, "global_step": 592100, "epoch": 7133} {"train_loss": -28.07404899597168, "global_step": 592101, "epoch": 7133} {"train_loss": -27.28767204284668, "global_step": 592102, "epoch": 7133} {"train_loss": -27.743078231811523, "global_step": 592103, "epoch": 7133} {"train_loss": -27.9088134765625, "global_step": 592104, "epoch": 7133} {"train_loss": -27.74755859375, "global_step": 592105, "epoch": 7133} {"train_loss": -27.65962028503418, "global_step": 592106, "epoch": 7133} {"train_loss": -27.696924209594727, "global_step": 592107, "epoch": 7133} {"train_loss": -27.999256134033203, "global_step": 592108, "epoch": 7133} {"train_loss": -27.708423614501953, "global_step": 592109, "epoch": 7133} {"train_loss": -27.8494873046875, "global_step": 592110, "epoch": 7133} {"train_loss": -28.22187614440918, "global_step": 592111, "epoch": 7133} {"train_loss": -27.98789405822754, "global_step": 592112, "epoch": 7133} {"train_loss": -27.832788467407227, "global_step": 592113, "epoch": 7133} {"train_loss": -28.222858428955078, "global_step": 592114, "epoch": 7133} {"train_loss": -28.49395751953125, "global_step": 592115, "epoch": 7133} {"train_loss": -27.8264102935791, "global_step": 592116, "epoch": 7133} {"train_loss": -27.811023712158203, "global_step": 592117, "epoch": 7133} {"train_loss": -27.657865524291992, "global_step": 592118, "epoch": 7133} {"train_loss": -27.706226348876953, "global_step": 592119, "epoch": 7133} {"train_loss": -27.74875831604004, "global_step": 592120, "epoch": 7133} {"train_loss": -27.764903907316278, "global_step": 592121, "epoch": 7133, "val_loss": 6584150.0} {"train_loss": -26.481962203979492, "global_step": 592122, "epoch": 7134} {"train_loss": -25.91359519958496, "global_step": 592123, "epoch": 7134} {"train_loss": -25.229948043823242, "global_step": 592124, "epoch": 7134} {"train_loss": -26.67352867126465, "global_step": 592125, "epoch": 7134} {"train_loss": -25.963476181030273, "global_step": 592126, "epoch": 7134} {"train_loss": -25.884504318237305, "global_step": 592127, "epoch": 7134} {"train_loss": -26.53822898864746, "global_step": 592128, "epoch": 7134} {"train_loss": -26.246301651000977, "global_step": 592129, "epoch": 7134} {"train_loss": -26.729467391967773, "global_step": 592130, "epoch": 7134} {"train_loss": -26.796222686767578, "global_step": 592131, "epoch": 7134} {"train_loss": -26.771814346313477, "global_step": 592132, "epoch": 7134} {"train_loss": -26.1424503326416, "global_step": 592133, "epoch": 7134} {"train_loss": -26.671369552612305, "global_step": 592134, "epoch": 7134} {"train_loss": -26.537378311157227, "global_step": 592135, "epoch": 7134} {"train_loss": -27.27780532836914, "global_step": 592136, "epoch": 7134} {"train_loss": -26.9576358795166, "global_step": 592137, "epoch": 7134} {"train_loss": -27.267438888549805, "global_step": 592138, "epoch": 7134} {"train_loss": -27.20802116394043, "global_step": 592139, "epoch": 7134} {"train_loss": -27.213064193725586, "global_step": 592140, "epoch": 7134} {"train_loss": -26.872156143188477, "global_step": 592141, "epoch": 7134} {"train_loss": -27.378265380859375, "global_step": 592142, "epoch": 7134} {"train_loss": -27.603803634643555, "global_step": 592143, "epoch": 7134} {"train_loss": -27.340545654296875, "global_step": 592144, "epoch": 7134} {"train_loss": -27.594192504882812, "global_step": 592145, "epoch": 7134} {"train_loss": -27.09228515625, "global_step": 592146, "epoch": 7134} {"train_loss": -27.431859970092773, "global_step": 592147, "epoch": 7134} {"train_loss": -27.740676879882812, "global_step": 592148, "epoch": 7134} {"train_loss": -27.902753829956055, "global_step": 592149, "epoch": 7134} {"train_loss": -27.70965003967285, "global_step": 592150, "epoch": 7134} {"train_loss": -27.64752197265625, "global_step": 592151, "epoch": 7134} {"train_loss": -27.33283042907715, "global_step": 592152, "epoch": 7134} {"train_loss": -27.80509376525879, "global_step": 592153, "epoch": 7134} {"train_loss": -27.56320571899414, "global_step": 592154, "epoch": 7134} {"train_loss": -27.626123428344727, "global_step": 592155, "epoch": 7134} {"train_loss": -27.657514572143555, "global_step": 592156, "epoch": 7134} {"train_loss": -28.145261764526367, "global_step": 592157, "epoch": 7134} {"train_loss": -27.906112670898438, "global_step": 592158, "epoch": 7134} {"train_loss": -27.799894332885742, "global_step": 592159, "epoch": 7134} {"train_loss": -27.819665908813477, "global_step": 592160, "epoch": 7134} {"train_loss": -27.807830810546875, "global_step": 592161, "epoch": 7134} {"train_loss": -28.13164710998535, "global_step": 592162, "epoch": 7134} {"train_loss": -27.73681640625, "global_step": 592163, "epoch": 7134} {"train_loss": -27.83914566040039, "global_step": 592164, "epoch": 7134} {"train_loss": -27.94085693359375, "global_step": 592165, "epoch": 7134} {"train_loss": -27.759191513061523, "global_step": 592166, "epoch": 7134} {"train_loss": -27.929662704467773, "global_step": 592167, "epoch": 7134} {"train_loss": -27.879621505737305, "global_step": 592168, "epoch": 7134} {"train_loss": -28.127771377563477, "global_step": 592169, "epoch": 7134} {"train_loss": -27.871938705444336, "global_step": 592170, "epoch": 7134} {"train_loss": -28.289813995361328, "global_step": 592171, "epoch": 7134} {"train_loss": -28.132770538330078, "global_step": 592172, "epoch": 7134} {"train_loss": -27.77286148071289, "global_step": 592173, "epoch": 7134} {"train_loss": -28.147602081298828, "global_step": 592174, "epoch": 7134} {"train_loss": -28.32952880859375, "global_step": 592175, "epoch": 7134} {"train_loss": -28.075397491455078, "global_step": 592176, "epoch": 7134} {"train_loss": -28.10294532775879, "global_step": 592177, "epoch": 7134} {"train_loss": -27.899763107299805, "global_step": 592178, "epoch": 7134} {"train_loss": -27.961084365844727, "global_step": 592179, "epoch": 7134} {"train_loss": -28.613040924072266, "global_step": 592180, "epoch": 7134} {"train_loss": -28.051910400390625, "global_step": 592181, "epoch": 7134} {"train_loss": -28.537519454956055, "global_step": 592182, "epoch": 7134} {"train_loss": -28.289587020874023, "global_step": 592183, "epoch": 7134} {"train_loss": -27.91950798034668, "global_step": 592184, "epoch": 7134} {"train_loss": -28.4339656829834, "global_step": 592185, "epoch": 7134} {"train_loss": -28.379087448120117, "global_step": 592186, "epoch": 7134} {"train_loss": -28.518415451049805, "global_step": 592187, "epoch": 7134} {"train_loss": -28.287961959838867, "global_step": 592188, "epoch": 7134} {"train_loss": -28.231779098510742, "global_step": 592189, "epoch": 7134} {"train_loss": -28.0667781829834, "global_step": 592190, "epoch": 7134} {"train_loss": -28.428302764892578, "global_step": 592191, "epoch": 7134} {"train_loss": -28.119232177734375, "global_step": 592192, "epoch": 7134} {"train_loss": -28.090993881225586, "global_step": 592193, "epoch": 7134} {"train_loss": -28.104511260986328, "global_step": 592194, "epoch": 7134} {"train_loss": -27.9510555267334, "global_step": 592195, "epoch": 7134} {"train_loss": -28.13123893737793, "global_step": 592196, "epoch": 7134} {"train_loss": -28.090564727783203, "global_step": 592197, "epoch": 7134} {"train_loss": -28.063688278198242, "global_step": 592198, "epoch": 7134} {"train_loss": -28.122821807861328, "global_step": 592199, "epoch": 7134} {"train_loss": -28.203266143798828, "global_step": 592200, "epoch": 7134} {"train_loss": -27.7340030670166, "global_step": 592201, "epoch": 7134} {"train_loss": -27.06753921508789, "global_step": 592202, "epoch": 7134} {"train_loss": -26.841413497924805, "global_step": 592203, "epoch": 7134} {"train_loss": -27.551381582237152, "global_step": 592204, "epoch": 7134, "val_loss": 6518250.0} {"train_loss": -19.902143478393555, "global_step": 592205, "epoch": 7135} {"train_loss": -24.21845817565918, "global_step": 592206, "epoch": 7135} {"train_loss": -26.17569351196289, "global_step": 592207, "epoch": 7135} {"train_loss": -24.73285484313965, "global_step": 592208, "epoch": 7135} {"train_loss": -26.378583908081055, "global_step": 592209, "epoch": 7135} {"train_loss": -24.83051872253418, "global_step": 592210, "epoch": 7135} {"train_loss": -25.897748947143555, "global_step": 592211, "epoch": 7135} {"train_loss": -26.26544189453125, "global_step": 592212, "epoch": 7135} {"train_loss": -25.727697372436523, "global_step": 592213, "epoch": 7135} {"train_loss": -26.9960994720459, "global_step": 592214, "epoch": 7135} {"train_loss": -26.684778213500977, "global_step": 592215, "epoch": 7135} {"train_loss": -26.2110538482666, "global_step": 592216, "epoch": 7135} {"train_loss": -27.102548599243164, "global_step": 592217, "epoch": 7135} {"train_loss": -26.610925674438477, "global_step": 592218, "epoch": 7135} {"train_loss": -26.994647979736328, "global_step": 592219, "epoch": 7135} {"train_loss": -26.674930572509766, "global_step": 592220, "epoch": 7135} {"train_loss": -27.408838272094727, "global_step": 592221, "epoch": 7135} {"train_loss": -26.765615463256836, "global_step": 592222, "epoch": 7135} {"train_loss": -27.411136627197266, "global_step": 592223, "epoch": 7135} {"train_loss": -27.24163818359375, "global_step": 592224, "epoch": 7135} {"train_loss": -27.08662223815918, "global_step": 592225, "epoch": 7135} {"train_loss": -27.207645416259766, "global_step": 592226, "epoch": 7135} {"train_loss": -27.311437606811523, "global_step": 592227, "epoch": 7135} {"train_loss": -27.282440185546875, "global_step": 592228, "epoch": 7135} {"train_loss": -27.4018611907959, "global_step": 592229, "epoch": 7135} {"train_loss": -27.204198837280273, "global_step": 592230, "epoch": 7135} {"train_loss": -27.134021759033203, "global_step": 592231, "epoch": 7135} {"train_loss": -27.55598258972168, "global_step": 592232, "epoch": 7135} {"train_loss": -27.04413414001465, "global_step": 592233, "epoch": 7135} {"train_loss": -27.185791015625, "global_step": 592234, "epoch": 7135} {"train_loss": -27.559589385986328, "global_step": 592235, "epoch": 7135} {"train_loss": -27.90264892578125, "global_step": 592236, "epoch": 7135} {"train_loss": -27.322357177734375, "global_step": 592237, "epoch": 7135} {"train_loss": -27.5674991607666, "global_step": 592238, "epoch": 7135} {"train_loss": -27.630939483642578, "global_step": 592239, "epoch": 7135} {"train_loss": -27.293201446533203, "global_step": 592240, "epoch": 7135} {"train_loss": -28.105878829956055, "global_step": 592241, "epoch": 7135} {"train_loss": -27.594327926635742, "global_step": 592242, "epoch": 7135} {"train_loss": -27.72003173828125, "global_step": 592243, "epoch": 7135} {"train_loss": -27.645282745361328, "global_step": 592244, "epoch": 7135} {"train_loss": -27.242761611938477, "global_step": 592245, "epoch": 7135} {"train_loss": -27.9240665435791, "global_step": 592246, "epoch": 7135} {"train_loss": -28.093854904174805, "global_step": 592247, "epoch": 7135} {"train_loss": -27.558012008666992, "global_step": 592248, "epoch": 7135} {"train_loss": -27.789188385009766, "global_step": 592249, "epoch": 7135} {"train_loss": -27.534778594970703, "global_step": 592250, "epoch": 7135} {"train_loss": -27.674915313720703, "global_step": 592251, "epoch": 7135} {"train_loss": -27.754261016845703, "global_step": 592252, "epoch": 7135} {"train_loss": -27.962005615234375, "global_step": 592253, "epoch": 7135} {"train_loss": -28.057477951049805, "global_step": 592254, "epoch": 7135} {"train_loss": -27.993799209594727, "global_step": 592255, "epoch": 7135} {"train_loss": -27.828943252563477, "global_step": 592256, "epoch": 7135} {"train_loss": -27.86808204650879, "global_step": 592257, "epoch": 7135} {"train_loss": -28.14985466003418, "global_step": 592258, "epoch": 7135} {"train_loss": -27.700956344604492, "global_step": 592259, "epoch": 7135} {"train_loss": -28.104848861694336, "global_step": 592260, "epoch": 7135} {"train_loss": -27.757801055908203, "global_step": 592261, "epoch": 7135} {"train_loss": -27.741254806518555, "global_step": 592262, "epoch": 7135} {"train_loss": -28.1533260345459, "global_step": 592263, "epoch": 7135} {"train_loss": -27.84909439086914, "global_step": 592264, "epoch": 7135} {"train_loss": -27.9821720123291, "global_step": 592265, "epoch": 7135} {"train_loss": -28.008136749267578, "global_step": 592266, "epoch": 7135} {"train_loss": -27.890045166015625, "global_step": 592267, "epoch": 7135} {"train_loss": -27.980854034423828, "global_step": 592268, "epoch": 7135} {"train_loss": -28.213104248046875, "global_step": 592269, "epoch": 7135} {"train_loss": -28.14447593688965, "global_step": 592270, "epoch": 7135} {"train_loss": -27.56201171875, "global_step": 592271, "epoch": 7135} {"train_loss": -27.7725830078125, "global_step": 592272, "epoch": 7135} {"train_loss": -28.179166793823242, "global_step": 592273, "epoch": 7135} {"train_loss": -27.4284725189209, "global_step": 592274, "epoch": 7135} {"train_loss": -28.110681533813477, "global_step": 592275, "epoch": 7135} {"train_loss": -27.612354278564453, "global_step": 592276, "epoch": 7135} {"train_loss": -27.931055068969727, "global_step": 592277, "epoch": 7135} {"train_loss": -27.39790916442871, "global_step": 592278, "epoch": 7135} {"train_loss": -27.767715454101562, "global_step": 592279, "epoch": 7135} {"train_loss": -27.823108673095703, "global_step": 592280, "epoch": 7135} {"train_loss": -27.932392120361328, "global_step": 592281, "epoch": 7135} {"train_loss": -28.213117599487305, "global_step": 592282, "epoch": 7135} {"train_loss": -28.061954498291016, "global_step": 592283, "epoch": 7135} {"train_loss": -27.71925163269043, "global_step": 592284, "epoch": 7135} {"train_loss": -28.18995475769043, "global_step": 592285, "epoch": 7135} {"train_loss": -27.89395523071289, "global_step": 592286, "epoch": 7135} {"train_loss": -27.31970318254218, "global_step": 592287, "epoch": 7135, "val_loss": 6528632.0} {"train_loss": -28.171371459960938, "global_step": 592288, "epoch": 7136} {"train_loss": -27.722314834594727, "global_step": 592289, "epoch": 7136} {"train_loss": -27.95166015625, "global_step": 592290, "epoch": 7136} {"train_loss": -27.86494255065918, "global_step": 592291, "epoch": 7136} {"train_loss": -27.733142852783203, "global_step": 592292, "epoch": 7136} {"train_loss": -27.6486873626709, "global_step": 592293, "epoch": 7136} {"train_loss": -27.762939453125, "global_step": 592294, "epoch": 7136} {"train_loss": -28.255218505859375, "global_step": 592295, "epoch": 7136} {"train_loss": -27.72197914123535, "global_step": 592296, "epoch": 7136} {"train_loss": -28.012460708618164, "global_step": 592297, "epoch": 7136} {"train_loss": -27.6773681640625, "global_step": 592298, "epoch": 7136} {"train_loss": -27.935277938842773, "global_step": 592299, "epoch": 7136} {"train_loss": -27.917118072509766, "global_step": 592300, "epoch": 7136} {"train_loss": -28.137861251831055, "global_step": 592301, "epoch": 7136} {"train_loss": -28.147130966186523, "global_step": 592302, "epoch": 7136} {"train_loss": -28.041980743408203, "global_step": 592303, "epoch": 7136} {"train_loss": -27.672565460205078, "global_step": 592304, "epoch": 7136} {"train_loss": -28.213485717773438, "global_step": 592305, "epoch": 7136} {"train_loss": -27.879810333251953, "global_step": 592306, "epoch": 7136} {"train_loss": -28.417020797729492, "global_step": 592307, "epoch": 7136} {"train_loss": -28.198978424072266, "global_step": 592308, "epoch": 7136} {"train_loss": -28.2803897857666, "global_step": 592309, "epoch": 7136} {"train_loss": -28.212926864624023, "global_step": 592310, "epoch": 7136} {"train_loss": -27.84584617614746, "global_step": 592311, "epoch": 7136} {"train_loss": -28.199548721313477, "global_step": 592312, "epoch": 7136} {"train_loss": -27.922582626342773, "global_step": 592313, "epoch": 7136} {"train_loss": -28.219263076782227, "global_step": 592314, "epoch": 7136} {"train_loss": -28.121448516845703, "global_step": 592315, "epoch": 7136} {"train_loss": -28.50872230529785, "global_step": 592316, "epoch": 7136} {"train_loss": -28.309839248657227, "global_step": 592317, "epoch": 7136} {"train_loss": -28.339447021484375, "global_step": 592318, "epoch": 7136} {"train_loss": -28.077939987182617, "global_step": 592319, "epoch": 7136} {"train_loss": -28.2536678314209, "global_step": 592320, "epoch": 7136} {"train_loss": -28.234785079956055, "global_step": 592321, "epoch": 7136} {"train_loss": -27.75567054748535, "global_step": 592322, "epoch": 7136} {"train_loss": -27.674152374267578, "global_step": 592323, "epoch": 7136} {"train_loss": -28.207300186157227, "global_step": 592324, "epoch": 7136} {"train_loss": -27.963489532470703, "global_step": 592325, "epoch": 7136} {"train_loss": -28.046186447143555, "global_step": 592326, "epoch": 7136} {"train_loss": -27.864871978759766, "global_step": 592327, "epoch": 7136} {"train_loss": -27.993240356445312, "global_step": 592328, "epoch": 7136} {"train_loss": -27.635061264038086, "global_step": 592329, "epoch": 7136} {"train_loss": -27.96790885925293, "global_step": 592330, "epoch": 7136} {"train_loss": -28.173490524291992, "global_step": 592331, "epoch": 7136} {"train_loss": -27.907007217407227, "global_step": 592332, "epoch": 7136} {"train_loss": -27.850711822509766, "global_step": 592333, "epoch": 7136} {"train_loss": -27.911407470703125, "global_step": 592334, "epoch": 7136} {"train_loss": -28.371789932250977, "global_step": 592335, "epoch": 7136} {"train_loss": -27.61590003967285, "global_step": 592336, "epoch": 7136} {"train_loss": -27.817840576171875, "global_step": 592337, "epoch": 7136} {"train_loss": -27.825849533081055, "global_step": 592338, "epoch": 7136} {"train_loss": -27.74348258972168, "global_step": 592339, "epoch": 7136} {"train_loss": -27.87922477722168, "global_step": 592340, "epoch": 7136} {"train_loss": -27.906879425048828, "global_step": 592341, "epoch": 7136} {"train_loss": -27.873693466186523, "global_step": 592342, "epoch": 7136} {"train_loss": -28.10956382751465, "global_step": 592343, "epoch": 7136} {"train_loss": -28.13787841796875, "global_step": 592344, "epoch": 7136} {"train_loss": -28.196155548095703, "global_step": 592345, "epoch": 7136} {"train_loss": -27.99846839904785, "global_step": 592346, "epoch": 7136} {"train_loss": -28.220550537109375, "global_step": 592347, "epoch": 7136} {"train_loss": -28.80409812927246, "global_step": 592348, "epoch": 7136} {"train_loss": -28.00390625, "global_step": 592349, "epoch": 7136} {"train_loss": -27.8555850982666, "global_step": 592350, "epoch": 7136} {"train_loss": -28.04987144470215, "global_step": 592351, "epoch": 7136} {"train_loss": -27.988895416259766, "global_step": 592352, "epoch": 7136} {"train_loss": -28.087024688720703, "global_step": 592353, "epoch": 7136} {"train_loss": -27.539960861206055, "global_step": 592354, "epoch": 7136} {"train_loss": -28.045984268188477, "global_step": 592355, "epoch": 7136} {"train_loss": -28.05978775024414, "global_step": 592356, "epoch": 7136} {"train_loss": -28.090375900268555, "global_step": 592357, "epoch": 7136} {"train_loss": -28.455673217773438, "global_step": 592358, "epoch": 7136} {"train_loss": -28.0439395904541, "global_step": 592359, "epoch": 7136} {"train_loss": -28.161243438720703, "global_step": 592360, "epoch": 7136} {"train_loss": -28.40582847595215, "global_step": 592361, "epoch": 7136} {"train_loss": -28.25591468811035, "global_step": 592362, "epoch": 7136} {"train_loss": -27.92445182800293, "global_step": 592363, "epoch": 7136} {"train_loss": -28.54952049255371, "global_step": 592364, "epoch": 7136} {"train_loss": -28.24289894104004, "global_step": 592365, "epoch": 7136} {"train_loss": -28.039941787719727, "global_step": 592366, "epoch": 7136} {"train_loss": -27.95551872253418, "global_step": 592367, "epoch": 7136} {"train_loss": -28.096527099609375, "global_step": 592368, "epoch": 7136} {"train_loss": -27.952198028564453, "global_step": 592369, "epoch": 7136} {"train_loss": -28.034829105239318, "global_step": 592370, "epoch": 7136, "val_loss": 6541694.0} {"train_loss": -26.41607093811035, "global_step": 592371, "epoch": 7137} {"train_loss": -25.89810562133789, "global_step": 592372, "epoch": 7137} {"train_loss": -27.614551544189453, "global_step": 592373, "epoch": 7137} {"train_loss": -27.43256187438965, "global_step": 592374, "epoch": 7137} {"train_loss": -26.92939567565918, "global_step": 592375, "epoch": 7137} {"train_loss": -27.058948516845703, "global_step": 592376, "epoch": 7137} {"train_loss": -27.71436882019043, "global_step": 592377, "epoch": 7137} {"train_loss": -27.291900634765625, "global_step": 592378, "epoch": 7137} {"train_loss": -27.512144088745117, "global_step": 592379, "epoch": 7137} {"train_loss": -27.26630973815918, "global_step": 592380, "epoch": 7137} {"train_loss": -27.17960548400879, "global_step": 592381, "epoch": 7137} {"train_loss": -27.01533317565918, "global_step": 592382, "epoch": 7137} {"train_loss": -27.641250610351562, "global_step": 592383, "epoch": 7137} {"train_loss": -27.4125919342041, "global_step": 592384, "epoch": 7137} {"train_loss": -27.390439987182617, "global_step": 592385, "epoch": 7137} {"train_loss": -27.1451473236084, "global_step": 592386, "epoch": 7137} {"train_loss": -27.8124942779541, "global_step": 592387, "epoch": 7137} {"train_loss": -27.455310821533203, "global_step": 592388, "epoch": 7137} {"train_loss": -27.5694637298584, "global_step": 592389, "epoch": 7137} {"train_loss": -27.679853439331055, "global_step": 592390, "epoch": 7137} {"train_loss": -27.5052547454834, "global_step": 592391, "epoch": 7137} {"train_loss": -27.869415283203125, "global_step": 592392, "epoch": 7137} {"train_loss": -27.81282615661621, "global_step": 592393, "epoch": 7137} {"train_loss": -27.661548614501953, "global_step": 592394, "epoch": 7137} {"train_loss": -27.73285484313965, "global_step": 592395, "epoch": 7137} {"train_loss": -27.548248291015625, "global_step": 592396, "epoch": 7137} {"train_loss": -27.620630264282227, "global_step": 592397, "epoch": 7137} {"train_loss": -27.766357421875, "global_step": 592398, "epoch": 7137} {"train_loss": -27.534225463867188, "global_step": 592399, "epoch": 7137} {"train_loss": -27.96927833557129, "global_step": 592400, "epoch": 7137} {"train_loss": -27.721323013305664, "global_step": 592401, "epoch": 7137} {"train_loss": -27.794666290283203, "global_step": 592402, "epoch": 7137} {"train_loss": -28.176782608032227, "global_step": 592403, "epoch": 7137} {"train_loss": -27.75649070739746, "global_step": 592404, "epoch": 7137} {"train_loss": -27.616607666015625, "global_step": 592405, "epoch": 7137} {"train_loss": -27.811269760131836, "global_step": 592406, "epoch": 7137} {"train_loss": -27.659101486206055, "global_step": 592407, "epoch": 7137} {"train_loss": -27.68691062927246, "global_step": 592408, "epoch": 7137} {"train_loss": -27.823226928710938, "global_step": 592409, "epoch": 7137} {"train_loss": -27.798856735229492, "global_step": 592410, "epoch": 7137} {"train_loss": -27.960494995117188, "global_step": 592411, "epoch": 7137} {"train_loss": -27.90576171875, "global_step": 592412, "epoch": 7137} {"train_loss": -27.986236572265625, "global_step": 592413, "epoch": 7137} {"train_loss": -28.3118896484375, "global_step": 592414, "epoch": 7137} {"train_loss": -27.600711822509766, "global_step": 592415, "epoch": 7137} {"train_loss": -27.459430694580078, "global_step": 592416, "epoch": 7137} {"train_loss": -28.156635284423828, "global_step": 592417, "epoch": 7137} {"train_loss": -28.391569137573242, "global_step": 592418, "epoch": 7137} {"train_loss": -27.885040283203125, "global_step": 592419, "epoch": 7137} {"train_loss": -28.1229248046875, "global_step": 592420, "epoch": 7137} {"train_loss": -28.035253524780273, "global_step": 592421, "epoch": 7137} {"train_loss": -28.138671875, "global_step": 592422, "epoch": 7137} {"train_loss": -28.076318740844727, "global_step": 592423, "epoch": 7137} {"train_loss": -27.912988662719727, "global_step": 592424, "epoch": 7137} {"train_loss": -27.807172775268555, "global_step": 592425, "epoch": 7137} {"train_loss": -27.690479278564453, "global_step": 592426, "epoch": 7137} {"train_loss": -28.1242618560791, "global_step": 592427, "epoch": 7137} {"train_loss": -27.897918701171875, "global_step": 592428, "epoch": 7137} {"train_loss": -28.3326416015625, "global_step": 592429, "epoch": 7137} {"train_loss": -27.85053062438965, "global_step": 592430, "epoch": 7137} {"train_loss": -27.790124893188477, "global_step": 592431, "epoch": 7137} {"train_loss": -27.8785457611084, "global_step": 592432, "epoch": 7137} {"train_loss": -28.262771606445312, "global_step": 592433, "epoch": 7137} {"train_loss": -27.977781295776367, "global_step": 592434, "epoch": 7137} {"train_loss": -28.020986557006836, "global_step": 592435, "epoch": 7137} {"train_loss": -28.62078857421875, "global_step": 592436, "epoch": 7137} {"train_loss": -28.072219848632812, "global_step": 592437, "epoch": 7137} {"train_loss": -27.524749755859375, "global_step": 592438, "epoch": 7137} {"train_loss": -28.398603439331055, "global_step": 592439, "epoch": 7137} {"train_loss": -28.078500747680664, "global_step": 592440, "epoch": 7137} {"train_loss": -28.286020278930664, "global_step": 592441, "epoch": 7137} {"train_loss": -28.393054962158203, "global_step": 592442, "epoch": 7137} {"train_loss": -28.321359634399414, "global_step": 592443, "epoch": 7137} {"train_loss": -28.0805721282959, "global_step": 592444, "epoch": 7137} {"train_loss": -28.166290283203125, "global_step": 592445, "epoch": 7137} {"train_loss": -28.076007843017578, "global_step": 592446, "epoch": 7137} {"train_loss": -27.83449363708496, "global_step": 592447, "epoch": 7137} {"train_loss": -28.05026626586914, "global_step": 592448, "epoch": 7137} {"train_loss": -28.188745498657227, "global_step": 592449, "epoch": 7137} {"train_loss": -27.786319732666016, "global_step": 592450, "epoch": 7137} {"train_loss": -28.004926681518555, "global_step": 592451, "epoch": 7137} {"train_loss": -28.17683219909668, "global_step": 592452, "epoch": 7137} {"train_loss": -27.794564396502025, "global_step": 592453, "epoch": 7137, "val_loss": 6454384.0} {"train_loss": -25.824644088745117, "global_step": 592454, "epoch": 7138} {"train_loss": -27.03070640563965, "global_step": 592455, "epoch": 7138} {"train_loss": -27.25978660583496, "global_step": 592456, "epoch": 7138} {"train_loss": -26.725976943969727, "global_step": 592457, "epoch": 7138} {"train_loss": -26.67354393005371, "global_step": 592458, "epoch": 7138} {"train_loss": -26.61834716796875, "global_step": 592459, "epoch": 7138} {"train_loss": -26.825958251953125, "global_step": 592460, "epoch": 7138} {"train_loss": -27.411563873291016, "global_step": 592461, "epoch": 7138} {"train_loss": -27.575210571289062, "global_step": 592462, "epoch": 7138} {"train_loss": -27.303058624267578, "global_step": 592463, "epoch": 7138} {"train_loss": -27.42079734802246, "global_step": 592464, "epoch": 7138} {"train_loss": -27.27137565612793, "global_step": 592465, "epoch": 7138} {"train_loss": -27.429075241088867, "global_step": 592466, "epoch": 7138} {"train_loss": -27.6908016204834, "global_step": 592467, "epoch": 7138} {"train_loss": -27.68875503540039, "global_step": 592468, "epoch": 7138} {"train_loss": -27.330047607421875, "global_step": 592469, "epoch": 7138} {"train_loss": -27.969724655151367, "global_step": 592470, "epoch": 7138} {"train_loss": -27.7369441986084, "global_step": 592471, "epoch": 7138} {"train_loss": -27.552936553955078, "global_step": 592472, "epoch": 7138} {"train_loss": -27.698339462280273, "global_step": 592473, "epoch": 7138} {"train_loss": -27.9222354888916, "global_step": 592474, "epoch": 7138} {"train_loss": -27.73819351196289, "global_step": 592475, "epoch": 7138} {"train_loss": -27.47443199157715, "global_step": 592476, "epoch": 7138} {"train_loss": -27.70000648498535, "global_step": 592477, "epoch": 7138} {"train_loss": -28.124435424804688, "global_step": 592478, "epoch": 7138} {"train_loss": -27.990863800048828, "global_step": 592479, "epoch": 7138} {"train_loss": -27.7657413482666, "global_step": 592480, "epoch": 7138} {"train_loss": -27.849462509155273, "global_step": 592481, "epoch": 7138} {"train_loss": -27.895612716674805, "global_step": 592482, "epoch": 7138} {"train_loss": -27.830175399780273, "global_step": 592483, "epoch": 7138} {"train_loss": -27.5440673828125, "global_step": 592484, "epoch": 7138} {"train_loss": -27.911802291870117, "global_step": 592485, "epoch": 7138} {"train_loss": -28.00998306274414, "global_step": 592486, "epoch": 7138} {"train_loss": -27.703964233398438, "global_step": 592487, "epoch": 7138} {"train_loss": -28.111181259155273, "global_step": 592488, "epoch": 7138} {"train_loss": -27.74640464782715, "global_step": 592489, "epoch": 7138} {"train_loss": -27.94471549987793, "global_step": 592490, "epoch": 7138} {"train_loss": -27.961822509765625, "global_step": 592491, "epoch": 7138} {"train_loss": -28.010862350463867, "global_step": 592492, "epoch": 7138} {"train_loss": -28.245559692382812, "global_step": 592493, "epoch": 7138} {"train_loss": -28.128385543823242, "global_step": 592494, "epoch": 7138} {"train_loss": -27.759124755859375, "global_step": 592495, "epoch": 7138} {"train_loss": -27.904539108276367, "global_step": 592496, "epoch": 7138} {"train_loss": -27.805877685546875, "global_step": 592497, "epoch": 7138} {"train_loss": -27.68556022644043, "global_step": 592498, "epoch": 7138} {"train_loss": -28.056095123291016, "global_step": 592499, "epoch": 7138} {"train_loss": -27.8105525970459, "global_step": 592500, "epoch": 7138} {"train_loss": -28.389062881469727, "global_step": 592501, "epoch": 7138} {"train_loss": -27.94575309753418, "global_step": 592502, "epoch": 7138} {"train_loss": -27.7176570892334, "global_step": 592503, "epoch": 7138} {"train_loss": -28.088022232055664, "global_step": 592504, "epoch": 7138} {"train_loss": -27.817487716674805, "global_step": 592505, "epoch": 7138} {"train_loss": -27.86881446838379, "global_step": 592506, "epoch": 7138} {"train_loss": -28.05975914001465, "global_step": 592507, "epoch": 7138} {"train_loss": -27.992765426635742, "global_step": 592508, "epoch": 7138} {"train_loss": -27.90656089782715, "global_step": 592509, "epoch": 7138} {"train_loss": -28.320112228393555, "global_step": 592510, "epoch": 7138} {"train_loss": -28.486011505126953, "global_step": 592511, "epoch": 7138} {"train_loss": -28.070316314697266, "global_step": 592512, "epoch": 7138} {"train_loss": -28.156042098999023, "global_step": 592513, "epoch": 7138} {"train_loss": -28.052536010742188, "global_step": 592514, "epoch": 7138} {"train_loss": -28.124845504760742, "global_step": 592515, "epoch": 7138} {"train_loss": -28.345609664916992, "global_step": 592516, "epoch": 7138} {"train_loss": -28.347326278686523, "global_step": 592517, "epoch": 7138} {"train_loss": -28.3520565032959, "global_step": 592518, "epoch": 7138} {"train_loss": -28.050439834594727, "global_step": 592519, "epoch": 7138} {"train_loss": -28.21579933166504, "global_step": 592520, "epoch": 7138} {"train_loss": -28.37180519104004, "global_step": 592521, "epoch": 7138} {"train_loss": -28.1112117767334, "global_step": 592522, "epoch": 7138} {"train_loss": -27.9666690826416, "global_step": 592523, "epoch": 7138} {"train_loss": -27.714452743530273, "global_step": 592524, "epoch": 7138} {"train_loss": -27.71650505065918, "global_step": 592525, "epoch": 7138} {"train_loss": -27.89548683166504, "global_step": 592526, "epoch": 7138} {"train_loss": -28.21831703186035, "global_step": 592527, "epoch": 7138} {"train_loss": -27.65242576599121, "global_step": 592528, "epoch": 7138} {"train_loss": -28.165267944335938, "global_step": 592529, "epoch": 7138} {"train_loss": -27.99448013305664, "global_step": 592530, "epoch": 7138} {"train_loss": -28.140460968017578, "global_step": 592531, "epoch": 7138} {"train_loss": -27.745380401611328, "global_step": 592532, "epoch": 7138} {"train_loss": -28.17423439025879, "global_step": 592533, "epoch": 7138} {"train_loss": -28.018207550048828, "global_step": 592534, "epoch": 7138} {"train_loss": -27.8520450592041, "global_step": 592535, "epoch": 7138} {"train_loss": -27.823361155498457, "global_step": 592536, "epoch": 7138, "val_loss": 6498828.0} {"train_loss": -26.202173233032227, "global_step": 592537, "epoch": 7139} {"train_loss": -24.381290435791016, "global_step": 592538, "epoch": 7139} {"train_loss": -25.840009689331055, "global_step": 592539, "epoch": 7139} {"train_loss": -27.254453659057617, "global_step": 592540, "epoch": 7139} {"train_loss": -26.64851188659668, "global_step": 592541, "epoch": 7139} {"train_loss": -26.423627853393555, "global_step": 592542, "epoch": 7139} {"train_loss": -27.542226791381836, "global_step": 592543, "epoch": 7139} {"train_loss": -26.5053653717041, "global_step": 592544, "epoch": 7139} {"train_loss": -27.542510986328125, "global_step": 592545, "epoch": 7139} {"train_loss": -26.751453399658203, "global_step": 592546, "epoch": 7139} {"train_loss": -27.48494529724121, "global_step": 592547, "epoch": 7139} {"train_loss": -27.494831085205078, "global_step": 592548, "epoch": 7139} {"train_loss": -27.13409423828125, "global_step": 592549, "epoch": 7139} {"train_loss": -27.4931583404541, "global_step": 592550, "epoch": 7139} {"train_loss": -27.44455337524414, "global_step": 592551, "epoch": 7139} {"train_loss": -27.672042846679688, "global_step": 592552, "epoch": 7139} {"train_loss": -27.15109634399414, "global_step": 592553, "epoch": 7139} {"train_loss": -27.63068962097168, "global_step": 592554, "epoch": 7139} {"train_loss": -27.488662719726562, "global_step": 592555, "epoch": 7139} {"train_loss": -27.600141525268555, "global_step": 592556, "epoch": 7139} {"train_loss": -27.626672744750977, "global_step": 592557, "epoch": 7139} {"train_loss": -27.365636825561523, "global_step": 592558, "epoch": 7139} {"train_loss": -27.536930084228516, "global_step": 592559, "epoch": 7139} {"train_loss": -27.607421875, "global_step": 592560, "epoch": 7139} {"train_loss": -27.6506290435791, "global_step": 592561, "epoch": 7139} {"train_loss": -27.765737533569336, "global_step": 592562, "epoch": 7139} {"train_loss": -27.351587295532227, "global_step": 592563, "epoch": 7139} {"train_loss": -28.040624618530273, "global_step": 592564, "epoch": 7139} {"train_loss": -27.79083251953125, "global_step": 592565, "epoch": 7139} {"train_loss": -28.144214630126953, "global_step": 592566, "epoch": 7139} {"train_loss": -27.274311065673828, "global_step": 592567, "epoch": 7139} {"train_loss": -27.968053817749023, "global_step": 592568, "epoch": 7139} {"train_loss": -27.928064346313477, "global_step": 592569, "epoch": 7139} {"train_loss": -27.984485626220703, "global_step": 592570, "epoch": 7139} {"train_loss": -27.86269187927246, "global_step": 592571, "epoch": 7139} {"train_loss": -27.52752113342285, "global_step": 592572, "epoch": 7139} {"train_loss": -28.1856632232666, "global_step": 592573, "epoch": 7139} {"train_loss": -27.814916610717773, "global_step": 592574, "epoch": 7139} {"train_loss": -27.91861343383789, "global_step": 592575, "epoch": 7139} {"train_loss": -28.03864097595215, "global_step": 592576, "epoch": 7139} {"train_loss": -28.00762367248535, "global_step": 592577, "epoch": 7139} {"train_loss": -28.079130172729492, "global_step": 592578, "epoch": 7139} {"train_loss": -28.096837997436523, "global_step": 592579, "epoch": 7139} {"train_loss": -28.064672470092773, "global_step": 592580, "epoch": 7139} {"train_loss": -27.7541561126709, "global_step": 592581, "epoch": 7139} {"train_loss": -28.30218505859375, "global_step": 592582, "epoch": 7139} {"train_loss": -28.07010269165039, "global_step": 592583, "epoch": 7139} {"train_loss": -28.22049331665039, "global_step": 592584, "epoch": 7139} {"train_loss": -27.924774169921875, "global_step": 592585, "epoch": 7139} {"train_loss": -28.00564956665039, "global_step": 592586, "epoch": 7139} {"train_loss": -27.97586441040039, "global_step": 592587, "epoch": 7139} {"train_loss": -28.317670822143555, "global_step": 592588, "epoch": 7139} {"train_loss": -28.304895401000977, "global_step": 592589, "epoch": 7139} {"train_loss": -28.186466217041016, "global_step": 592590, "epoch": 7139} {"train_loss": -28.416126251220703, "global_step": 592591, "epoch": 7139} {"train_loss": -28.09943962097168, "global_step": 592592, "epoch": 7139} {"train_loss": -28.076025009155273, "global_step": 592593, "epoch": 7139} {"train_loss": -27.58450698852539, "global_step": 592594, "epoch": 7139} {"train_loss": -28.46051025390625, "global_step": 592595, "epoch": 7139} {"train_loss": -28.556360244750977, "global_step": 592596, "epoch": 7139} {"train_loss": -28.263845443725586, "global_step": 592597, "epoch": 7139} {"train_loss": -27.865478515625, "global_step": 592598, "epoch": 7139} {"train_loss": -27.898298263549805, "global_step": 592599, "epoch": 7139} {"train_loss": -27.87237548828125, "global_step": 592600, "epoch": 7139} {"train_loss": -28.047719955444336, "global_step": 592601, "epoch": 7139} {"train_loss": -27.67865562438965, "global_step": 592602, "epoch": 7139} {"train_loss": -28.017236709594727, "global_step": 592603, "epoch": 7139} {"train_loss": -28.209569931030273, "global_step": 592604, "epoch": 7139} {"train_loss": -27.758604049682617, "global_step": 592605, "epoch": 7139} {"train_loss": -28.071645736694336, "global_step": 592606, "epoch": 7139} {"train_loss": -27.972997665405273, "global_step": 592607, "epoch": 7139} {"train_loss": -27.688846588134766, "global_step": 592608, "epoch": 7139} {"train_loss": -28.181570053100586, "global_step": 592609, "epoch": 7139} {"train_loss": -27.373706817626953, "global_step": 592610, "epoch": 7139} {"train_loss": -27.345285415649414, "global_step": 592611, "epoch": 7139} {"train_loss": -27.856067657470703, "global_step": 592612, "epoch": 7139} {"train_loss": -27.84467887878418, "global_step": 592613, "epoch": 7139} {"train_loss": -27.911609649658203, "global_step": 592614, "epoch": 7139} {"train_loss": -28.080759048461914, "global_step": 592615, "epoch": 7139} {"train_loss": -27.75386619567871, "global_step": 592616, "epoch": 7139} {"train_loss": -28.21735191345215, "global_step": 592617, "epoch": 7139} {"train_loss": -27.759906768798828, "global_step": 592618, "epoch": 7139} {"train_loss": -27.703560932573065, "global_step": 592619, "epoch": 7139, "val_loss": 6543020.0} {"train_loss": -27.172210693359375, "global_step": 592620, "epoch": 7140} {"train_loss": -27.499591827392578, "global_step": 592621, "epoch": 7140} {"train_loss": -26.583057403564453, "global_step": 592622, "epoch": 7140} {"train_loss": -28.12821388244629, "global_step": 592623, "epoch": 7140} {"train_loss": -27.320804595947266, "global_step": 592624, "epoch": 7140} {"train_loss": -27.285581588745117, "global_step": 592625, "epoch": 7140} {"train_loss": -28.062170028686523, "global_step": 592626, "epoch": 7140} {"train_loss": -27.05621910095215, "global_step": 592627, "epoch": 7140} {"train_loss": -27.65152359008789, "global_step": 592628, "epoch": 7140} {"train_loss": -27.44416618347168, "global_step": 592629, "epoch": 7140} {"train_loss": -27.63251304626465, "global_step": 592630, "epoch": 7140} {"train_loss": -27.477466583251953, "global_step": 592631, "epoch": 7140} {"train_loss": -27.4150447845459, "global_step": 592632, "epoch": 7140} {"train_loss": -27.78193473815918, "global_step": 592633, "epoch": 7140} {"train_loss": -27.733097076416016, "global_step": 592634, "epoch": 7140} {"train_loss": -27.888381958007812, "global_step": 592635, "epoch": 7140} {"train_loss": -27.763330459594727, "global_step": 592636, "epoch": 7140} {"train_loss": -28.148822784423828, "global_step": 592637, "epoch": 7140} {"train_loss": -27.766931533813477, "global_step": 592638, "epoch": 7140} {"train_loss": -27.389602661132812, "global_step": 592639, "epoch": 7140} {"train_loss": -27.50775146484375, "global_step": 592640, "epoch": 7140} {"train_loss": -27.73040771484375, "global_step": 592641, "epoch": 7140} {"train_loss": -27.676401138305664, "global_step": 592642, "epoch": 7140} {"train_loss": -27.70025634765625, "global_step": 592643, "epoch": 7140} {"train_loss": -28.3494873046875, "global_step": 592644, "epoch": 7140} {"train_loss": -27.945581436157227, "global_step": 592645, "epoch": 7140} {"train_loss": -27.828367233276367, "global_step": 592646, "epoch": 7140} {"train_loss": -28.363311767578125, "global_step": 592647, "epoch": 7140} {"train_loss": -27.979480743408203, "global_step": 592648, "epoch": 7140} {"train_loss": -27.941070556640625, "global_step": 592649, "epoch": 7140} {"train_loss": -28.267187118530273, "global_step": 592650, "epoch": 7140} {"train_loss": -28.148639678955078, "global_step": 592651, "epoch": 7140} {"train_loss": -28.252532958984375, "global_step": 592652, "epoch": 7140} {"train_loss": -27.872106552124023, "global_step": 592653, "epoch": 7140} {"train_loss": -28.238317489624023, "global_step": 592654, "epoch": 7140} {"train_loss": -28.21435546875, "global_step": 592655, "epoch": 7140} {"train_loss": -28.295751571655273, "global_step": 592656, "epoch": 7140} {"train_loss": -28.054248809814453, "global_step": 592657, "epoch": 7140} {"train_loss": -28.088733673095703, "global_step": 592658, "epoch": 7140} {"train_loss": -28.288959503173828, "global_step": 592659, "epoch": 7140} {"train_loss": -27.99590492248535, "global_step": 592660, "epoch": 7140} {"train_loss": -28.129596710205078, "global_step": 592661, "epoch": 7140} {"train_loss": -28.01322364807129, "global_step": 592662, "epoch": 7140} {"train_loss": -28.019287109375, "global_step": 592663, "epoch": 7140} {"train_loss": -27.993234634399414, "global_step": 592664, "epoch": 7140} {"train_loss": -28.01056480407715, "global_step": 592665, "epoch": 7140} {"train_loss": -27.901601791381836, "global_step": 592666, "epoch": 7140} {"train_loss": -27.882848739624023, "global_step": 592667, "epoch": 7140} {"train_loss": -28.310211181640625, "global_step": 592668, "epoch": 7140} {"train_loss": -28.029926300048828, "global_step": 592669, "epoch": 7140} {"train_loss": -28.527074813842773, "global_step": 592670, "epoch": 7140} {"train_loss": -27.955530166625977, "global_step": 592671, "epoch": 7140} {"train_loss": -27.839319229125977, "global_step": 592672, "epoch": 7140} {"train_loss": -27.982763290405273, "global_step": 592673, "epoch": 7140} {"train_loss": -28.5031795501709, "global_step": 592674, "epoch": 7140} {"train_loss": -28.079065322875977, "global_step": 592675, "epoch": 7140} {"train_loss": -27.61983299255371, "global_step": 592676, "epoch": 7140} {"train_loss": -28.406177520751953, "global_step": 592677, "epoch": 7140} {"train_loss": -28.25899314880371, "global_step": 592678, "epoch": 7140} {"train_loss": -27.602985382080078, "global_step": 592679, "epoch": 7140} {"train_loss": -28.30413818359375, "global_step": 592680, "epoch": 7140} {"train_loss": -27.95721435546875, "global_step": 592681, "epoch": 7140} {"train_loss": -28.151655197143555, "global_step": 592682, "epoch": 7140} {"train_loss": -28.05067253112793, "global_step": 592683, "epoch": 7140} {"train_loss": -28.04191017150879, "global_step": 592684, "epoch": 7140} {"train_loss": -28.524885177612305, "global_step": 592685, "epoch": 7140} {"train_loss": -28.3157958984375, "global_step": 592686, "epoch": 7140} {"train_loss": -27.632007598876953, "global_step": 592687, "epoch": 7140} {"train_loss": -27.754608154296875, "global_step": 592688, "epoch": 7140} {"train_loss": -27.2979679107666, "global_step": 592689, "epoch": 7140} {"train_loss": -27.32049560546875, "global_step": 592690, "epoch": 7140} {"train_loss": -27.785791397094727, "global_step": 592691, "epoch": 7140} {"train_loss": -27.52424430847168, "global_step": 592692, "epoch": 7140} {"train_loss": -27.93597412109375, "global_step": 592693, "epoch": 7140} {"train_loss": -27.786865234375, "global_step": 592694, "epoch": 7140} {"train_loss": -27.47414207458496, "global_step": 592695, "epoch": 7140} {"train_loss": -27.656787872314453, "global_step": 592696, "epoch": 7140} {"train_loss": -27.603439331054688, "global_step": 592697, "epoch": 7140} {"train_loss": -27.919172286987305, "global_step": 592698, "epoch": 7140} {"train_loss": -28.072885513305664, "global_step": 592699, "epoch": 7140} {"train_loss": -27.62312126159668, "global_step": 592700, "epoch": 7140} {"train_loss": -27.746479034423828, "global_step": 592701, "epoch": 7140} {"train_loss": -27.86551776564265, "global_step": 592702, "epoch": 7140, "val_loss": 6597375.0} {"train_loss": -27.269948959350586, "global_step": 592703, "epoch": 7141} {"train_loss": -27.3310604095459, "global_step": 592704, "epoch": 7141} {"train_loss": -27.825641632080078, "global_step": 592705, "epoch": 7141} {"train_loss": -27.29290771484375, "global_step": 592706, "epoch": 7141} {"train_loss": -27.021427154541016, "global_step": 592707, "epoch": 7141} {"train_loss": -27.453815460205078, "global_step": 592708, "epoch": 7141} {"train_loss": -26.977313995361328, "global_step": 592709, "epoch": 7141} {"train_loss": -27.307348251342773, "global_step": 592710, "epoch": 7141} {"train_loss": -27.379058837890625, "global_step": 592711, "epoch": 7141} {"train_loss": -27.447797775268555, "global_step": 592712, "epoch": 7141} {"train_loss": -27.905227661132812, "global_step": 592713, "epoch": 7141} {"train_loss": -27.376392364501953, "global_step": 592714, "epoch": 7141} {"train_loss": -27.647083282470703, "global_step": 592715, "epoch": 7141} {"train_loss": -27.84830665588379, "global_step": 592716, "epoch": 7141} {"train_loss": -27.43252944946289, "global_step": 592717, "epoch": 7141} {"train_loss": -27.511808395385742, "global_step": 592718, "epoch": 7141} {"train_loss": -27.782743453979492, "global_step": 592719, "epoch": 7141} {"train_loss": -27.633819580078125, "global_step": 592720, "epoch": 7141} {"train_loss": -27.78458023071289, "global_step": 592721, "epoch": 7141} {"train_loss": -27.516897201538086, "global_step": 592722, "epoch": 7141} {"train_loss": -28.02724266052246, "global_step": 592723, "epoch": 7141} {"train_loss": -27.688413619995117, "global_step": 592724, "epoch": 7141} {"train_loss": -27.491018295288086, "global_step": 592725, "epoch": 7141} {"train_loss": -27.8284969329834, "global_step": 592726, "epoch": 7141} {"train_loss": -27.697010040283203, "global_step": 592727, "epoch": 7141} {"train_loss": -27.850662231445312, "global_step": 592728, "epoch": 7141} {"train_loss": -27.992374420166016, "global_step": 592729, "epoch": 7141} {"train_loss": -27.89375114440918, "global_step": 592730, "epoch": 7141} {"train_loss": -27.7509708404541, "global_step": 592731, "epoch": 7141} {"train_loss": -28.194257736206055, "global_step": 592732, "epoch": 7141} {"train_loss": -28.224485397338867, "global_step": 592733, "epoch": 7141} {"train_loss": -28.046262741088867, "global_step": 592734, "epoch": 7141} {"train_loss": -27.92169189453125, "global_step": 592735, "epoch": 7141} {"train_loss": -27.78376579284668, "global_step": 592736, "epoch": 7141} {"train_loss": -28.038257598876953, "global_step": 592737, "epoch": 7141} {"train_loss": -28.207120895385742, "global_step": 592738, "epoch": 7141} {"train_loss": -28.0834903717041, "global_step": 592739, "epoch": 7141} {"train_loss": -27.96076774597168, "global_step": 592740, "epoch": 7141} {"train_loss": -28.193288803100586, "global_step": 592741, "epoch": 7141} {"train_loss": -27.975629806518555, "global_step": 592742, "epoch": 7141} {"train_loss": -28.007770538330078, "global_step": 592743, "epoch": 7141} {"train_loss": -28.25006103515625, "global_step": 592744, "epoch": 7141} {"train_loss": -28.63714599609375, "global_step": 592745, "epoch": 7141} {"train_loss": -28.05518913269043, "global_step": 592746, "epoch": 7141} {"train_loss": -28.093372344970703, "global_step": 592747, "epoch": 7141} {"train_loss": -27.943958282470703, "global_step": 592748, "epoch": 7141} {"train_loss": -28.572834014892578, "global_step": 592749, "epoch": 7141} {"train_loss": -27.9466609954834, "global_step": 592750, "epoch": 7141} {"train_loss": -28.281415939331055, "global_step": 592751, "epoch": 7141} {"train_loss": -28.007034301757812, "global_step": 592752, "epoch": 7141} {"train_loss": -28.125280380249023, "global_step": 592753, "epoch": 7141} {"train_loss": -27.950998306274414, "global_step": 592754, "epoch": 7141} {"train_loss": -28.580982208251953, "global_step": 592755, "epoch": 7141} {"train_loss": -27.85601234436035, "global_step": 592756, "epoch": 7141} {"train_loss": -28.249591827392578, "global_step": 592757, "epoch": 7141} {"train_loss": -28.123092651367188, "global_step": 592758, "epoch": 7141} {"train_loss": -27.8771915435791, "global_step": 592759, "epoch": 7141} {"train_loss": -27.69169044494629, "global_step": 592760, "epoch": 7141} {"train_loss": -27.734817504882812, "global_step": 592761, "epoch": 7141} {"train_loss": -26.991987228393555, "global_step": 592762, "epoch": 7141} {"train_loss": -27.568805694580078, "global_step": 592763, "epoch": 7141} {"train_loss": -27.8388729095459, "global_step": 592764, "epoch": 7141} {"train_loss": -27.591251373291016, "global_step": 592765, "epoch": 7141} {"train_loss": -27.268476486206055, "global_step": 592766, "epoch": 7141} {"train_loss": -27.918304443359375, "global_step": 592767, "epoch": 7141} {"train_loss": -27.46620750427246, "global_step": 592768, "epoch": 7141} {"train_loss": -28.067407608032227, "global_step": 592769, "epoch": 7141} {"train_loss": -27.6129207611084, "global_step": 592770, "epoch": 7141} {"train_loss": -27.545785903930664, "global_step": 592771, "epoch": 7141} {"train_loss": -27.81048011779785, "global_step": 592772, "epoch": 7141} {"train_loss": -28.039838790893555, "global_step": 592773, "epoch": 7141} {"train_loss": -28.014362335205078, "global_step": 592774, "epoch": 7141} {"train_loss": -27.6343994140625, "global_step": 592775, "epoch": 7141} {"train_loss": -27.852087020874023, "global_step": 592776, "epoch": 7141} {"train_loss": -28.037097930908203, "global_step": 592777, "epoch": 7141} {"train_loss": -27.47974967956543, "global_step": 592778, "epoch": 7141} {"train_loss": -27.344181060791016, "global_step": 592779, "epoch": 7141} {"train_loss": -27.84218406677246, "global_step": 592780, "epoch": 7141} {"train_loss": -27.895523071289062, "global_step": 592781, "epoch": 7141} {"train_loss": -27.54975700378418, "global_step": 592782, "epoch": 7141} {"train_loss": -28.196338653564453, "global_step": 592783, "epoch": 7141} {"train_loss": -28.132673263549805, "global_step": 592784, "epoch": 7141} {"train_loss": -27.8027177374047, "global_step": 592785, "epoch": 7141, "val_loss": 6595096.0} {"train_loss": -27.699254989624023, "global_step": 592786, "epoch": 7142} {"train_loss": -27.796905517578125, "global_step": 592787, "epoch": 7142} {"train_loss": -27.984827041625977, "global_step": 592788, "epoch": 7142} {"train_loss": -27.615381240844727, "global_step": 592789, "epoch": 7142} {"train_loss": -28.04339027404785, "global_step": 592790, "epoch": 7142} {"train_loss": -27.398883819580078, "global_step": 592791, "epoch": 7142} {"train_loss": -27.6485652923584, "global_step": 592792, "epoch": 7142} {"train_loss": -27.328826904296875, "global_step": 592793, "epoch": 7142} {"train_loss": -27.60676383972168, "global_step": 592794, "epoch": 7142} {"train_loss": -27.008604049682617, "global_step": 592795, "epoch": 7142} {"train_loss": -27.601520538330078, "global_step": 592796, "epoch": 7142} {"train_loss": -27.45216178894043, "global_step": 592797, "epoch": 7142} {"train_loss": -27.845579147338867, "global_step": 592798, "epoch": 7142} {"train_loss": -27.888586044311523, "global_step": 592799, "epoch": 7142} {"train_loss": -27.714441299438477, "global_step": 592800, "epoch": 7142} {"train_loss": -27.528156280517578, "global_step": 592801, "epoch": 7142} {"train_loss": -27.97627067565918, "global_step": 592802, "epoch": 7142} {"train_loss": -27.954864501953125, "global_step": 592803, "epoch": 7142} {"train_loss": -27.7004451751709, "global_step": 592804, "epoch": 7142} {"train_loss": -28.00641441345215, "global_step": 592805, "epoch": 7142} {"train_loss": -27.321613311767578, "global_step": 592806, "epoch": 7142} {"train_loss": -27.96188735961914, "global_step": 592807, "epoch": 7142} {"train_loss": -28.08139991760254, "global_step": 592808, "epoch": 7142} {"train_loss": -27.697986602783203, "global_step": 592809, "epoch": 7142} {"train_loss": -28.1029109954834, "global_step": 592810, "epoch": 7142} {"train_loss": -28.091123580932617, "global_step": 592811, "epoch": 7142} {"train_loss": -28.16352653503418, "global_step": 592812, "epoch": 7142} {"train_loss": -27.700345993041992, "global_step": 592813, "epoch": 7142} {"train_loss": -28.078216552734375, "global_step": 592814, "epoch": 7142} {"train_loss": -28.109045028686523, "global_step": 592815, "epoch": 7142} {"train_loss": -27.940473556518555, "global_step": 592816, "epoch": 7142} {"train_loss": -27.920740127563477, "global_step": 592817, "epoch": 7142} {"train_loss": -28.219457626342773, "global_step": 592818, "epoch": 7142} {"train_loss": -27.72223472595215, "global_step": 592819, "epoch": 7142} {"train_loss": -27.83550453186035, "global_step": 592820, "epoch": 7142} {"train_loss": -27.639623641967773, "global_step": 592821, "epoch": 7142} {"train_loss": -28.044666290283203, "global_step": 592822, "epoch": 7142} {"train_loss": -28.133893966674805, "global_step": 592823, "epoch": 7142} {"train_loss": -28.12548828125, "global_step": 592824, "epoch": 7142} {"train_loss": -27.95631217956543, "global_step": 592825, "epoch": 7142} {"train_loss": -28.30817222595215, "global_step": 592826, "epoch": 7142} {"train_loss": -27.965499877929688, "global_step": 592827, "epoch": 7142} {"train_loss": -27.886966705322266, "global_step": 592828, "epoch": 7142} {"train_loss": -28.200971603393555, "global_step": 592829, "epoch": 7142} {"train_loss": -28.155170440673828, "global_step": 592830, "epoch": 7142} {"train_loss": -28.136335372924805, "global_step": 592831, "epoch": 7142} {"train_loss": -27.972187042236328, "global_step": 592832, "epoch": 7142} {"train_loss": -27.688329696655273, "global_step": 592833, "epoch": 7142} {"train_loss": -28.17600440979004, "global_step": 592834, "epoch": 7142} {"train_loss": -28.227609634399414, "global_step": 592835, "epoch": 7142} {"train_loss": -28.27577018737793, "global_step": 592836, "epoch": 7142} {"train_loss": -27.597883224487305, "global_step": 592837, "epoch": 7142} {"train_loss": -27.730127334594727, "global_step": 592838, "epoch": 7142} {"train_loss": -28.232580184936523, "global_step": 592839, "epoch": 7142} {"train_loss": -27.62888526916504, "global_step": 592840, "epoch": 7142} {"train_loss": -27.726566314697266, "global_step": 592841, "epoch": 7142} {"train_loss": -28.112287521362305, "global_step": 592842, "epoch": 7142} {"train_loss": -28.39410972595215, "global_step": 592843, "epoch": 7142} {"train_loss": -28.1873779296875, "global_step": 592844, "epoch": 7142} {"train_loss": -27.9354305267334, "global_step": 592845, "epoch": 7142} {"train_loss": -28.172199249267578, "global_step": 592846, "epoch": 7142} {"train_loss": -27.54958152770996, "global_step": 592847, "epoch": 7142} {"train_loss": -27.774856567382812, "global_step": 592848, "epoch": 7142} {"train_loss": -28.260778427124023, "global_step": 592849, "epoch": 7142} {"train_loss": -27.305768966674805, "global_step": 592850, "epoch": 7142} {"train_loss": -27.295684814453125, "global_step": 592851, "epoch": 7142} {"train_loss": -27.573827743530273, "global_step": 592852, "epoch": 7142} {"train_loss": -27.255111694335938, "global_step": 592853, "epoch": 7142} {"train_loss": -27.6044979095459, "global_step": 592854, "epoch": 7142} {"train_loss": -27.502765655517578, "global_step": 592855, "epoch": 7142} {"train_loss": -27.614593505859375, "global_step": 592856, "epoch": 7142} {"train_loss": -27.895587921142578, "global_step": 592857, "epoch": 7142} {"train_loss": -28.010435104370117, "global_step": 592858, "epoch": 7142} {"train_loss": -27.779333114624023, "global_step": 592859, "epoch": 7142} {"train_loss": -27.86969566345215, "global_step": 592860, "epoch": 7142} {"train_loss": -27.702802658081055, "global_step": 592861, "epoch": 7142} {"train_loss": -27.652551651000977, "global_step": 592862, "epoch": 7142} {"train_loss": -28.036243438720703, "global_step": 592863, "epoch": 7142} {"train_loss": -27.660688400268555, "global_step": 592864, "epoch": 7142} {"train_loss": -27.595083236694336, "global_step": 592865, "epoch": 7142} {"train_loss": -28.217432022094727, "global_step": 592866, "epoch": 7142} {"train_loss": -28.06597900390625, "global_step": 592867, "epoch": 7142} {"train_loss": -27.84355754162892, "global_step": 592868, "epoch": 7142, "val_loss": 6578594.0} {"train_loss": -27.243661880493164, "global_step": 592869, "epoch": 7143} {"train_loss": -26.573556900024414, "global_step": 592870, "epoch": 7143} {"train_loss": -27.518268585205078, "global_step": 592871, "epoch": 7143} {"train_loss": -26.750768661499023, "global_step": 592872, "epoch": 7143} {"train_loss": -27.496021270751953, "global_step": 592873, "epoch": 7143} {"train_loss": -26.880674362182617, "global_step": 592874, "epoch": 7143} {"train_loss": -27.572004318237305, "global_step": 592875, "epoch": 7143} {"train_loss": -27.396717071533203, "global_step": 592876, "epoch": 7143} {"train_loss": -27.734609603881836, "global_step": 592877, "epoch": 7143} {"train_loss": -27.379064559936523, "global_step": 592878, "epoch": 7143} {"train_loss": -27.6370849609375, "global_step": 592879, "epoch": 7143} {"train_loss": -27.74563980102539, "global_step": 592880, "epoch": 7143} {"train_loss": -27.480588912963867, "global_step": 592881, "epoch": 7143} {"train_loss": -27.7634220123291, "global_step": 592882, "epoch": 7143} {"train_loss": -27.493330001831055, "global_step": 592883, "epoch": 7143} {"train_loss": -27.38993263244629, "global_step": 592884, "epoch": 7143} {"train_loss": -27.90425682067871, "global_step": 592885, "epoch": 7143} {"train_loss": -27.414081573486328, "global_step": 592886, "epoch": 7143} {"train_loss": -27.398258209228516, "global_step": 592887, "epoch": 7143} {"train_loss": -27.635461807250977, "global_step": 592888, "epoch": 7143} {"train_loss": -27.381820678710938, "global_step": 592889, "epoch": 7143} {"train_loss": -27.673315048217773, "global_step": 592890, "epoch": 7143} {"train_loss": -27.507843017578125, "global_step": 592891, "epoch": 7143} {"train_loss": -27.6886043548584, "global_step": 592892, "epoch": 7143} {"train_loss": -27.6954402923584, "global_step": 592893, "epoch": 7143} {"train_loss": -27.83808708190918, "global_step": 592894, "epoch": 7143} {"train_loss": -27.686283111572266, "global_step": 592895, "epoch": 7143} {"train_loss": -28.055707931518555, "global_step": 592896, "epoch": 7143} {"train_loss": -27.999744415283203, "global_step": 592897, "epoch": 7143} {"train_loss": -27.651199340820312, "global_step": 592898, "epoch": 7143} {"train_loss": -27.708831787109375, "global_step": 592899, "epoch": 7143} {"train_loss": -27.763397216796875, "global_step": 592900, "epoch": 7143} {"train_loss": -27.7884578704834, "global_step": 592901, "epoch": 7143} {"train_loss": -28.058063507080078, "global_step": 592902, "epoch": 7143} {"train_loss": -28.182031631469727, "global_step": 592903, "epoch": 7143} {"train_loss": -28.153051376342773, "global_step": 592904, "epoch": 7143} {"train_loss": -28.122465133666992, "global_step": 592905, "epoch": 7143} {"train_loss": -27.9642391204834, "global_step": 592906, "epoch": 7143} {"train_loss": -28.3657169342041, "global_step": 592907, "epoch": 7143} {"train_loss": -28.2257022857666, "global_step": 592908, "epoch": 7143} {"train_loss": -27.71475601196289, "global_step": 592909, "epoch": 7143} {"train_loss": -28.012502670288086, "global_step": 592910, "epoch": 7143} {"train_loss": -28.08204460144043, "global_step": 592911, "epoch": 7143} {"train_loss": -28.187274932861328, "global_step": 592912, "epoch": 7143} {"train_loss": -28.05666160583496, "global_step": 592913, "epoch": 7143} {"train_loss": -28.232099533081055, "global_step": 592914, "epoch": 7143} {"train_loss": -28.41828727722168, "global_step": 592915, "epoch": 7143} {"train_loss": -27.682525634765625, "global_step": 592916, "epoch": 7143} {"train_loss": -28.294849395751953, "global_step": 592917, "epoch": 7143} {"train_loss": -28.3654842376709, "global_step": 592918, "epoch": 7143} {"train_loss": -27.88861083984375, "global_step": 592919, "epoch": 7143} {"train_loss": -28.18247413635254, "global_step": 592920, "epoch": 7143} {"train_loss": -27.844284057617188, "global_step": 592921, "epoch": 7143} {"train_loss": -27.897916793823242, "global_step": 592922, "epoch": 7143} {"train_loss": -27.494964599609375, "global_step": 592923, "epoch": 7143} {"train_loss": -27.336822509765625, "global_step": 592924, "epoch": 7143} {"train_loss": -27.202863693237305, "global_step": 592925, "epoch": 7143} {"train_loss": -26.823652267456055, "global_step": 592926, "epoch": 7143} {"train_loss": -27.235681533813477, "global_step": 592927, "epoch": 7143} {"train_loss": -28.0948429107666, "global_step": 592928, "epoch": 7143} {"train_loss": -27.737516403198242, "global_step": 592929, "epoch": 7143} {"train_loss": -27.69882583618164, "global_step": 592930, "epoch": 7143} {"train_loss": -27.808536529541016, "global_step": 592931, "epoch": 7143} {"train_loss": -27.777923583984375, "global_step": 592932, "epoch": 7143} {"train_loss": -28.130645751953125, "global_step": 592933, "epoch": 7143} {"train_loss": -27.557403564453125, "global_step": 592934, "epoch": 7143} {"train_loss": -27.77984046936035, "global_step": 592935, "epoch": 7143} {"train_loss": -27.85149574279785, "global_step": 592936, "epoch": 7143} {"train_loss": -27.823871612548828, "global_step": 592937, "epoch": 7143} {"train_loss": -28.0607852935791, "global_step": 592938, "epoch": 7143} {"train_loss": -27.703638076782227, "global_step": 592939, "epoch": 7143} {"train_loss": -27.869129180908203, "global_step": 592940, "epoch": 7143} {"train_loss": -27.786148071289062, "global_step": 592941, "epoch": 7143} {"train_loss": -28.25710105895996, "global_step": 592942, "epoch": 7143} {"train_loss": -27.97198486328125, "global_step": 592943, "epoch": 7143} {"train_loss": -28.218637466430664, "global_step": 592944, "epoch": 7143} {"train_loss": -27.903257369995117, "global_step": 592945, "epoch": 7143} {"train_loss": -28.210493087768555, "global_step": 592946, "epoch": 7143} {"train_loss": -28.059173583984375, "global_step": 592947, "epoch": 7143} {"train_loss": -27.984149932861328, "global_step": 592948, "epoch": 7143} {"train_loss": -28.158008575439453, "global_step": 592949, "epoch": 7143} {"train_loss": -27.693740844726562, "global_step": 592950, "epoch": 7143} {"train_loss": -27.761943886078985, "global_step": 592951, "epoch": 7143, "val_loss": 6554056.0} {"train_loss": -27.858966827392578, "global_step": 592952, "epoch": 7144} {"train_loss": -27.603870391845703, "global_step": 592953, "epoch": 7144} {"train_loss": -28.081119537353516, "global_step": 592954, "epoch": 7144} {"train_loss": -28.009296417236328, "global_step": 592955, "epoch": 7144} {"train_loss": -27.80573081970215, "global_step": 592956, "epoch": 7144} {"train_loss": -27.9685001373291, "global_step": 592957, "epoch": 7144} {"train_loss": -27.991857528686523, "global_step": 592958, "epoch": 7144} {"train_loss": -27.7277889251709, "global_step": 592959, "epoch": 7144} {"train_loss": -27.589635848999023, "global_step": 592960, "epoch": 7144} {"train_loss": -27.968046188354492, "global_step": 592961, "epoch": 7144} {"train_loss": -27.965173721313477, "global_step": 592962, "epoch": 7144} {"train_loss": -27.836149215698242, "global_step": 592963, "epoch": 7144} {"train_loss": -28.014328002929688, "global_step": 592964, "epoch": 7144} {"train_loss": -27.806196212768555, "global_step": 592965, "epoch": 7144} {"train_loss": -27.866016387939453, "global_step": 592966, "epoch": 7144} {"train_loss": -28.129003524780273, "global_step": 592967, "epoch": 7144} {"train_loss": -28.102142333984375, "global_step": 592968, "epoch": 7144} {"train_loss": -27.94696044921875, "global_step": 592969, "epoch": 7144} {"train_loss": -28.485517501831055, "global_step": 592970, "epoch": 7144} {"train_loss": -27.958295822143555, "global_step": 592971, "epoch": 7144} {"train_loss": -28.290058135986328, "global_step": 592972, "epoch": 7144} {"train_loss": -28.076635360717773, "global_step": 592973, "epoch": 7144} {"train_loss": -27.90974235534668, "global_step": 592974, "epoch": 7144} {"train_loss": -28.334150314331055, "global_step": 592975, "epoch": 7144} {"train_loss": -28.007465362548828, "global_step": 592976, "epoch": 7144} {"train_loss": -28.046396255493164, "global_step": 592977, "epoch": 7144} {"train_loss": -28.124359130859375, "global_step": 592978, "epoch": 7144} {"train_loss": -27.971485137939453, "global_step": 592979, "epoch": 7144} {"train_loss": -28.293598175048828, "global_step": 592980, "epoch": 7144} {"train_loss": -28.16840934753418, "global_step": 592981, "epoch": 7144} {"train_loss": -27.815107345581055, "global_step": 592982, "epoch": 7144} {"train_loss": -28.456750869750977, "global_step": 592983, "epoch": 7144} {"train_loss": -28.021459579467773, "global_step": 592984, "epoch": 7144} {"train_loss": -28.085235595703125, "global_step": 592985, "epoch": 7144} {"train_loss": -28.314228057861328, "global_step": 592986, "epoch": 7144} {"train_loss": -27.84662437438965, "global_step": 592987, "epoch": 7144} {"train_loss": -28.00412368774414, "global_step": 592988, "epoch": 7144} {"train_loss": -27.965173721313477, "global_step": 592989, "epoch": 7144} {"train_loss": -27.790149688720703, "global_step": 592990, "epoch": 7144} {"train_loss": -28.35235023498535, "global_step": 592991, "epoch": 7144} {"train_loss": -28.164899826049805, "global_step": 592992, "epoch": 7144} {"train_loss": -27.64645767211914, "global_step": 592993, "epoch": 7144} {"train_loss": -28.26222038269043, "global_step": 592994, "epoch": 7144} {"train_loss": -27.850019454956055, "global_step": 592995, "epoch": 7144} {"train_loss": -27.62432289123535, "global_step": 592996, "epoch": 7144} {"train_loss": -28.159149169921875, "global_step": 592997, "epoch": 7144} {"train_loss": -27.61821937561035, "global_step": 592998, "epoch": 7144} {"train_loss": -27.9244384765625, "global_step": 592999, "epoch": 7144} {"train_loss": -28.193506240844727, "global_step": 593000, "epoch": 7144} {"train_loss": -27.46510124206543, "global_step": 593001, "epoch": 7144} {"train_loss": -27.376678466796875, "global_step": 593002, "epoch": 7144} {"train_loss": -27.4960880279541, "global_step": 593003, "epoch": 7144} {"train_loss": -27.592670440673828, "global_step": 593004, "epoch": 7144} {"train_loss": -28.192611694335938, "global_step": 593005, "epoch": 7144} {"train_loss": -27.491003036499023, "global_step": 593006, "epoch": 7144} {"train_loss": -27.66693687438965, "global_step": 593007, "epoch": 7144} {"train_loss": -27.59604835510254, "global_step": 593008, "epoch": 7144} {"train_loss": -28.22462272644043, "global_step": 593009, "epoch": 7144} {"train_loss": -28.02133560180664, "global_step": 593010, "epoch": 7144} {"train_loss": -28.000696182250977, "global_step": 593011, "epoch": 7144} {"train_loss": -28.060089111328125, "global_step": 593012, "epoch": 7144} {"train_loss": -28.127582550048828, "global_step": 593013, "epoch": 7144} {"train_loss": -28.323150634765625, "global_step": 593014, "epoch": 7144} {"train_loss": -27.540128707885742, "global_step": 593015, "epoch": 7144} {"train_loss": -28.167999267578125, "global_step": 593016, "epoch": 7144} {"train_loss": -27.855667114257812, "global_step": 593017, "epoch": 7144} {"train_loss": -27.862747192382812, "global_step": 593018, "epoch": 7144} {"train_loss": -28.2639217376709, "global_step": 593019, "epoch": 7144} {"train_loss": -27.978185653686523, "global_step": 593020, "epoch": 7144} {"train_loss": -27.721363067626953, "global_step": 593021, "epoch": 7144} {"train_loss": -27.995763778686523, "global_step": 593022, "epoch": 7144} {"train_loss": -28.178964614868164, "global_step": 593023, "epoch": 7144} {"train_loss": -28.23935317993164, "global_step": 593024, "epoch": 7144} {"train_loss": -27.698270797729492, "global_step": 593025, "epoch": 7144} {"train_loss": -28.02010154724121, "global_step": 593026, "epoch": 7144} {"train_loss": -28.088550567626953, "global_step": 593027, "epoch": 7144} {"train_loss": -28.074085235595703, "global_step": 593028, "epoch": 7144} {"train_loss": -27.738134384155273, "global_step": 593029, "epoch": 7144} {"train_loss": -28.069751739501953, "global_step": 593030, "epoch": 7144} {"train_loss": -28.353336334228516, "global_step": 593031, "epoch": 7144} {"train_loss": -28.25420570373535, "global_step": 593032, "epoch": 7144} {"train_loss": -28.07781982421875, "global_step": 593033, "epoch": 7144} {"train_loss": -27.98445568314518, "global_step": 593034, "epoch": 7144, "val_loss": 6613787.0} {"train_loss": -28.052392959594727, "global_step": 593035, "epoch": 7145} {"train_loss": -27.13911247253418, "global_step": 593036, "epoch": 7145} {"train_loss": -27.30763816833496, "global_step": 593037, "epoch": 7145} {"train_loss": -27.238697052001953, "global_step": 593038, "epoch": 7145} {"train_loss": -27.577177047729492, "global_step": 593039, "epoch": 7145} {"train_loss": -27.418094635009766, "global_step": 593040, "epoch": 7145} {"train_loss": -27.766132354736328, "global_step": 593041, "epoch": 7145} {"train_loss": -27.38593864440918, "global_step": 593042, "epoch": 7145} {"train_loss": -27.836318969726562, "global_step": 593043, "epoch": 7145} {"train_loss": -27.484619140625, "global_step": 593044, "epoch": 7145} {"train_loss": -27.515356063842773, "global_step": 593045, "epoch": 7145} {"train_loss": -27.6047306060791, "global_step": 593046, "epoch": 7145} {"train_loss": -27.5650577545166, "global_step": 593047, "epoch": 7145} {"train_loss": -27.648740768432617, "global_step": 593048, "epoch": 7145} {"train_loss": -27.76971435546875, "global_step": 593049, "epoch": 7145} {"train_loss": -27.55543327331543, "global_step": 593050, "epoch": 7145} {"train_loss": -27.827966690063477, "global_step": 593051, "epoch": 7145} {"train_loss": -27.762662887573242, "global_step": 593052, "epoch": 7145} {"train_loss": -27.703418731689453, "global_step": 593053, "epoch": 7145} {"train_loss": -27.821455001831055, "global_step": 593054, "epoch": 7145} {"train_loss": -28.083526611328125, "global_step": 593055, "epoch": 7145} {"train_loss": -27.597211837768555, "global_step": 593056, "epoch": 7145} {"train_loss": -27.8079833984375, "global_step": 593057, "epoch": 7145} {"train_loss": -27.86748695373535, "global_step": 593058, "epoch": 7145} {"train_loss": -27.797231674194336, "global_step": 593059, "epoch": 7145} {"train_loss": -28.2889347076416, "global_step": 593060, "epoch": 7145} {"train_loss": -27.58791160583496, "global_step": 593061, "epoch": 7145} {"train_loss": -27.63508415222168, "global_step": 593062, "epoch": 7145} {"train_loss": -28.433080673217773, "global_step": 593063, "epoch": 7145} {"train_loss": -27.84174156188965, "global_step": 593064, "epoch": 7145} {"train_loss": -27.85564613342285, "global_step": 593065, "epoch": 7145} {"train_loss": -27.958322525024414, "global_step": 593066, "epoch": 7145} {"train_loss": -27.628198623657227, "global_step": 593067, "epoch": 7145} {"train_loss": -27.983993530273438, "global_step": 593068, "epoch": 7145} {"train_loss": -27.714635848999023, "global_step": 593069, "epoch": 7145} {"train_loss": -28.041767120361328, "global_step": 593070, "epoch": 7145} {"train_loss": -27.73048210144043, "global_step": 593071, "epoch": 7145} {"train_loss": -27.962081909179688, "global_step": 593072, "epoch": 7145} {"train_loss": -28.062589645385742, "global_step": 593073, "epoch": 7145} {"train_loss": -27.768903732299805, "global_step": 593074, "epoch": 7145} {"train_loss": -27.90106201171875, "global_step": 593075, "epoch": 7145} {"train_loss": -28.152267456054688, "global_step": 593076, "epoch": 7145} {"train_loss": -27.945545196533203, "global_step": 593077, "epoch": 7145} {"train_loss": -28.1093807220459, "global_step": 593078, "epoch": 7145} {"train_loss": -27.945425033569336, "global_step": 593079, "epoch": 7145} {"train_loss": -28.08574867248535, "global_step": 593080, "epoch": 7145} {"train_loss": -27.79195213317871, "global_step": 593081, "epoch": 7145} {"train_loss": -28.03919792175293, "global_step": 593082, "epoch": 7145} {"train_loss": -27.645883560180664, "global_step": 593083, "epoch": 7145} {"train_loss": -27.731082916259766, "global_step": 593084, "epoch": 7145} {"train_loss": -27.5694637298584, "global_step": 593085, "epoch": 7145} {"train_loss": -28.024890899658203, "global_step": 593086, "epoch": 7145} {"train_loss": -27.967121124267578, "global_step": 593087, "epoch": 7145} {"train_loss": -28.12396812438965, "global_step": 593088, "epoch": 7145} {"train_loss": -28.086950302124023, "global_step": 593089, "epoch": 7145} {"train_loss": -27.784423828125, "global_step": 593090, "epoch": 7145} {"train_loss": -28.42817497253418, "global_step": 593091, "epoch": 7145} {"train_loss": -27.989160537719727, "global_step": 593092, "epoch": 7145} {"train_loss": -27.791915893554688, "global_step": 593093, "epoch": 7145} {"train_loss": -28.130674362182617, "global_step": 593094, "epoch": 7145} {"train_loss": -27.875036239624023, "global_step": 593095, "epoch": 7145} {"train_loss": -28.07476234436035, "global_step": 593096, "epoch": 7145} {"train_loss": -28.1057186126709, "global_step": 593097, "epoch": 7145} {"train_loss": -27.873727798461914, "global_step": 593098, "epoch": 7145} {"train_loss": -27.78046989440918, "global_step": 593099, "epoch": 7145} {"train_loss": -28.0040283203125, "global_step": 593100, "epoch": 7145} {"train_loss": -27.8563232421875, "global_step": 593101, "epoch": 7145} {"train_loss": -27.83233642578125, "global_step": 593102, "epoch": 7145} {"train_loss": -27.707916259765625, "global_step": 593103, "epoch": 7145} {"train_loss": -27.8226318359375, "global_step": 593104, "epoch": 7145} {"train_loss": -28.453128814697266, "global_step": 593105, "epoch": 7145} {"train_loss": -27.999658584594727, "global_step": 593106, "epoch": 7145} {"train_loss": -27.81902503967285, "global_step": 593107, "epoch": 7145} {"train_loss": -28.033910751342773, "global_step": 593108, "epoch": 7145} {"train_loss": -27.965585708618164, "global_step": 593109, "epoch": 7145} {"train_loss": -27.88136100769043, "global_step": 593110, "epoch": 7145} {"train_loss": -27.991708755493164, "global_step": 593111, "epoch": 7145} {"train_loss": -28.137205123901367, "global_step": 593112, "epoch": 7145} {"train_loss": -27.96962547302246, "global_step": 593113, "epoch": 7145} {"train_loss": -27.925464630126953, "global_step": 593114, "epoch": 7145} {"train_loss": -27.88685417175293, "global_step": 593115, "epoch": 7145} {"train_loss": -28.1645565032959, "global_step": 593116, "epoch": 7145} {"train_loss": -27.853124572570067, "global_step": 593117, "epoch": 7145, "val_loss": 6540314.5} {"train_loss": -27.629911422729492, "global_step": 593118, "epoch": 7146} {"train_loss": -26.9599552154541, "global_step": 593119, "epoch": 7146} {"train_loss": -27.359113693237305, "global_step": 593120, "epoch": 7146} {"train_loss": -27.875598907470703, "global_step": 593121, "epoch": 7146} {"train_loss": -27.82889747619629, "global_step": 593122, "epoch": 7146} {"train_loss": -27.244110107421875, "global_step": 593123, "epoch": 7146} {"train_loss": -27.44264030456543, "global_step": 593124, "epoch": 7146} {"train_loss": -27.557525634765625, "global_step": 593125, "epoch": 7146} {"train_loss": -27.642581939697266, "global_step": 593126, "epoch": 7146} {"train_loss": -27.799823760986328, "global_step": 593127, "epoch": 7146} {"train_loss": -27.794464111328125, "global_step": 593128, "epoch": 7146} {"train_loss": -27.64619255065918, "global_step": 593129, "epoch": 7146} {"train_loss": -27.647735595703125, "global_step": 593130, "epoch": 7146} {"train_loss": -27.5164737701416, "global_step": 593131, "epoch": 7146} {"train_loss": -27.79129981994629, "global_step": 593132, "epoch": 7146} {"train_loss": -28.245914459228516, "global_step": 593133, "epoch": 7146} {"train_loss": -27.600854873657227, "global_step": 593134, "epoch": 7146} {"train_loss": -27.751209259033203, "global_step": 593135, "epoch": 7146} {"train_loss": -27.35773277282715, "global_step": 593136, "epoch": 7146} {"train_loss": -27.77533531188965, "global_step": 593137, "epoch": 7146} {"train_loss": -27.81805419921875, "global_step": 593138, "epoch": 7146} {"train_loss": -27.680692672729492, "global_step": 593139, "epoch": 7146} {"train_loss": -28.32843017578125, "global_step": 593140, "epoch": 7146} {"train_loss": -27.276092529296875, "global_step": 593141, "epoch": 7146} {"train_loss": -27.2150936126709, "global_step": 593142, "epoch": 7146} {"train_loss": -27.865955352783203, "global_step": 593143, "epoch": 7146} {"train_loss": -27.586851119995117, "global_step": 593144, "epoch": 7146} {"train_loss": -27.850330352783203, "global_step": 593145, "epoch": 7146} {"train_loss": -27.9073429107666, "global_step": 593146, "epoch": 7146} {"train_loss": -27.478683471679688, "global_step": 593147, "epoch": 7146} {"train_loss": -27.536487579345703, "global_step": 593148, "epoch": 7146} {"train_loss": -28.17498779296875, "global_step": 593149, "epoch": 7146} {"train_loss": -27.714162826538086, "global_step": 593150, "epoch": 7146} {"train_loss": -27.701019287109375, "global_step": 593151, "epoch": 7146} {"train_loss": -27.8936710357666, "global_step": 593152, "epoch": 7146} {"train_loss": -27.932178497314453, "global_step": 593153, "epoch": 7146} {"train_loss": -27.8581600189209, "global_step": 593154, "epoch": 7146} {"train_loss": -28.4447078704834, "global_step": 593155, "epoch": 7146} {"train_loss": -27.907785415649414, "global_step": 593156, "epoch": 7146} {"train_loss": -28.147052764892578, "global_step": 593157, "epoch": 7146} {"train_loss": -27.94707679748535, "global_step": 593158, "epoch": 7146} {"train_loss": -28.018075942993164, "global_step": 593159, "epoch": 7146} {"train_loss": -28.151844024658203, "global_step": 593160, "epoch": 7146} {"train_loss": -28.515186309814453, "global_step": 593161, "epoch": 7146} {"train_loss": -28.5632266998291, "global_step": 593162, "epoch": 7146} {"train_loss": -28.23040199279785, "global_step": 593163, "epoch": 7146} {"train_loss": -28.300037384033203, "global_step": 593164, "epoch": 7146} {"train_loss": -28.329025268554688, "global_step": 593165, "epoch": 7146} {"train_loss": -28.3603515625, "global_step": 593166, "epoch": 7146} {"train_loss": -28.372068405151367, "global_step": 593167, "epoch": 7146} {"train_loss": -28.20490837097168, "global_step": 593168, "epoch": 7146} {"train_loss": -27.77337646484375, "global_step": 593169, "epoch": 7146} {"train_loss": -28.145605087280273, "global_step": 593170, "epoch": 7146} {"train_loss": -28.286590576171875, "global_step": 593171, "epoch": 7146} {"train_loss": -28.11140251159668, "global_step": 593172, "epoch": 7146} {"train_loss": -27.858732223510742, "global_step": 593173, "epoch": 7146} {"train_loss": -27.998456954956055, "global_step": 593174, "epoch": 7146} {"train_loss": -28.01102638244629, "global_step": 593175, "epoch": 7146} {"train_loss": -27.5896053314209, "global_step": 593176, "epoch": 7146} {"train_loss": -27.716299057006836, "global_step": 593177, "epoch": 7146} {"train_loss": -27.89875602722168, "global_step": 593178, "epoch": 7146} {"train_loss": -28.028860092163086, "global_step": 593179, "epoch": 7146} {"train_loss": -28.017993927001953, "global_step": 593180, "epoch": 7146} {"train_loss": -28.0947208404541, "global_step": 593181, "epoch": 7146} {"train_loss": -27.897146224975586, "global_step": 593182, "epoch": 7146} {"train_loss": -28.205408096313477, "global_step": 593183, "epoch": 7146} {"train_loss": -28.20745849609375, "global_step": 593184, "epoch": 7146} {"train_loss": -28.132465362548828, "global_step": 593185, "epoch": 7146} {"train_loss": -28.094623565673828, "global_step": 593186, "epoch": 7146} {"train_loss": -28.13429069519043, "global_step": 593187, "epoch": 7146} {"train_loss": -27.943134307861328, "global_step": 593188, "epoch": 7146} {"train_loss": -28.011737823486328, "global_step": 593189, "epoch": 7146} {"train_loss": -27.838220596313477, "global_step": 593190, "epoch": 7146} {"train_loss": -28.020389556884766, "global_step": 593191, "epoch": 7146} {"train_loss": -27.8304500579834, "global_step": 593192, "epoch": 7146} {"train_loss": -28.10405921936035, "global_step": 593193, "epoch": 7146} {"train_loss": -27.854223251342773, "global_step": 593194, "epoch": 7146} {"train_loss": -28.20802879333496, "global_step": 593195, "epoch": 7146} {"train_loss": -28.021032333374023, "global_step": 593196, "epoch": 7146} {"train_loss": -27.971364974975586, "global_step": 593197, "epoch": 7146} {"train_loss": -28.259618759155273, "global_step": 593198, "epoch": 7146} {"train_loss": -28.336633682250977, "global_step": 593199, "epoch": 7146} {"train_loss": -27.910233279308642, "global_step": 593200, "epoch": 7146, "val_loss": 6609829.5} {"train_loss": -27.05988121032715, "global_step": 593201, "epoch": 7147} {"train_loss": -27.097211837768555, "global_step": 593202, "epoch": 7147} {"train_loss": -27.440479278564453, "global_step": 593203, "epoch": 7147} {"train_loss": -27.479394912719727, "global_step": 593204, "epoch": 7147} {"train_loss": -27.957731246948242, "global_step": 593205, "epoch": 7147} {"train_loss": -27.700122833251953, "global_step": 593206, "epoch": 7147} {"train_loss": -27.596847534179688, "global_step": 593207, "epoch": 7147} {"train_loss": -27.825937271118164, "global_step": 593208, "epoch": 7147} {"train_loss": -27.641443252563477, "global_step": 593209, "epoch": 7147} {"train_loss": -27.651798248291016, "global_step": 593210, "epoch": 7147} {"train_loss": -27.58100700378418, "global_step": 593211, "epoch": 7147} {"train_loss": -27.71014976501465, "global_step": 593212, "epoch": 7147} {"train_loss": -27.619138717651367, "global_step": 593213, "epoch": 7147} {"train_loss": -27.8272705078125, "global_step": 593214, "epoch": 7147} {"train_loss": -28.093992233276367, "global_step": 593215, "epoch": 7147} {"train_loss": -27.862157821655273, "global_step": 593216, "epoch": 7147} {"train_loss": -27.692352294921875, "global_step": 593217, "epoch": 7147} {"train_loss": -27.84030532836914, "global_step": 593218, "epoch": 7147} {"train_loss": -27.97065544128418, "global_step": 593219, "epoch": 7147} {"train_loss": -28.04155921936035, "global_step": 593220, "epoch": 7147} {"train_loss": -27.9122371673584, "global_step": 593221, "epoch": 7147} {"train_loss": -27.982412338256836, "global_step": 593222, "epoch": 7147} {"train_loss": -28.142087936401367, "global_step": 593223, "epoch": 7147} {"train_loss": -28.224918365478516, "global_step": 593224, "epoch": 7147} {"train_loss": -27.685895919799805, "global_step": 593225, "epoch": 7147} {"train_loss": -27.807294845581055, "global_step": 593226, "epoch": 7147} {"train_loss": -28.2303524017334, "global_step": 593227, "epoch": 7147} {"train_loss": -27.87554931640625, "global_step": 593228, "epoch": 7147} {"train_loss": -28.03570556640625, "global_step": 593229, "epoch": 7147} {"train_loss": -28.007089614868164, "global_step": 593230, "epoch": 7147} {"train_loss": -28.2604923248291, "global_step": 593231, "epoch": 7147} {"train_loss": -28.19468116760254, "global_step": 593232, "epoch": 7147} {"train_loss": -27.73382568359375, "global_step": 593233, "epoch": 7147} {"train_loss": -27.807373046875, "global_step": 593234, "epoch": 7147} {"train_loss": -28.156774520874023, "global_step": 593235, "epoch": 7147} {"train_loss": -28.25312614440918, "global_step": 593236, "epoch": 7147} {"train_loss": -28.100000381469727, "global_step": 593237, "epoch": 7147} {"train_loss": -27.59427833557129, "global_step": 593238, "epoch": 7147} {"train_loss": -27.802648544311523, "global_step": 593239, "epoch": 7147} {"train_loss": -28.327808380126953, "global_step": 593240, "epoch": 7147} {"train_loss": -28.15654945373535, "global_step": 593241, "epoch": 7147} {"train_loss": -28.21591567993164, "global_step": 593242, "epoch": 7147} {"train_loss": -28.489154815673828, "global_step": 593243, "epoch": 7147} {"train_loss": -27.58466148376465, "global_step": 593244, "epoch": 7147} {"train_loss": -28.218164443969727, "global_step": 593245, "epoch": 7147} {"train_loss": -28.243406295776367, "global_step": 593246, "epoch": 7147} {"train_loss": -28.234445571899414, "global_step": 593247, "epoch": 7147} {"train_loss": -27.957324981689453, "global_step": 593248, "epoch": 7147} {"train_loss": -27.817340850830078, "global_step": 593249, "epoch": 7147} {"train_loss": -28.158491134643555, "global_step": 593250, "epoch": 7147} {"train_loss": -27.6397705078125, "global_step": 593251, "epoch": 7147} {"train_loss": -27.859649658203125, "global_step": 593252, "epoch": 7147} {"train_loss": -27.642995834350586, "global_step": 593253, "epoch": 7147} {"train_loss": -27.719818115234375, "global_step": 593254, "epoch": 7147} {"train_loss": -28.568506240844727, "global_step": 593255, "epoch": 7147} {"train_loss": -28.24595069885254, "global_step": 593256, "epoch": 7147} {"train_loss": -28.247314453125, "global_step": 593257, "epoch": 7147} {"train_loss": -27.73712158203125, "global_step": 593258, "epoch": 7147} {"train_loss": -28.200239181518555, "global_step": 593259, "epoch": 7147} {"train_loss": -27.822235107421875, "global_step": 593260, "epoch": 7147} {"train_loss": -28.053150177001953, "global_step": 593261, "epoch": 7147} {"train_loss": -28.18460464477539, "global_step": 593262, "epoch": 7147} {"train_loss": -28.4554443359375, "global_step": 593263, "epoch": 7147} {"train_loss": -28.1599178314209, "global_step": 593264, "epoch": 7147} {"train_loss": -28.16180992126465, "global_step": 593265, "epoch": 7147} {"train_loss": -27.834747314453125, "global_step": 593266, "epoch": 7147} {"train_loss": -27.80616569519043, "global_step": 593267, "epoch": 7147} {"train_loss": -27.5524845123291, "global_step": 593268, "epoch": 7147} {"train_loss": -27.65681266784668, "global_step": 593269, "epoch": 7147} {"train_loss": -27.81611442565918, "global_step": 593270, "epoch": 7147} {"train_loss": -27.842395782470703, "global_step": 593271, "epoch": 7147} {"train_loss": -27.765981674194336, "global_step": 593272, "epoch": 7147} {"train_loss": -28.055932998657227, "global_step": 593273, "epoch": 7147} {"train_loss": -28.09905433654785, "global_step": 593274, "epoch": 7147} {"train_loss": -28.001249313354492, "global_step": 593275, "epoch": 7147} {"train_loss": -27.98602867126465, "global_step": 593276, "epoch": 7147} {"train_loss": -27.85430908203125, "global_step": 593277, "epoch": 7147} {"train_loss": -28.384124755859375, "global_step": 593278, "epoch": 7147} {"train_loss": -27.811126708984375, "global_step": 593279, "epoch": 7147} {"train_loss": -28.0928897857666, "global_step": 593280, "epoch": 7147} {"train_loss": -28.159875869750977, "global_step": 593281, "epoch": 7147} {"train_loss": -27.926532745361328, "global_step": 593282, "epoch": 7147} {"train_loss": -27.91262927687312, "global_step": 593283, "epoch": 7147, "val_loss": 6680106.0} {"train_loss": -27.14752769470215, "global_step": 593284, "epoch": 7148} {"train_loss": -27.311742782592773, "global_step": 593285, "epoch": 7148} {"train_loss": -27.432621002197266, "global_step": 593286, "epoch": 7148} {"train_loss": -27.372547149658203, "global_step": 593287, "epoch": 7148} {"train_loss": -27.507116317749023, "global_step": 593288, "epoch": 7148} {"train_loss": -26.835142135620117, "global_step": 593289, "epoch": 7148} {"train_loss": -27.120824813842773, "global_step": 593290, "epoch": 7148} {"train_loss": -27.473752975463867, "global_step": 593291, "epoch": 7148} {"train_loss": -27.179126739501953, "global_step": 593292, "epoch": 7148} {"train_loss": -27.568225860595703, "global_step": 593293, "epoch": 7148} {"train_loss": -27.5418643951416, "global_step": 593294, "epoch": 7148} {"train_loss": -27.39688491821289, "global_step": 593295, "epoch": 7148} {"train_loss": -27.30763816833496, "global_step": 593296, "epoch": 7148} {"train_loss": -27.031843185424805, "global_step": 593297, "epoch": 7148} {"train_loss": -27.710607528686523, "global_step": 593298, "epoch": 7148} {"train_loss": -27.054218292236328, "global_step": 593299, "epoch": 7148} {"train_loss": -27.346593856811523, "global_step": 593300, "epoch": 7148} {"train_loss": -27.38335609436035, "global_step": 593301, "epoch": 7148} {"train_loss": -27.284467697143555, "global_step": 593302, "epoch": 7148} {"train_loss": -27.562774658203125, "global_step": 593303, "epoch": 7148} {"train_loss": -27.280298233032227, "global_step": 593304, "epoch": 7148} {"train_loss": -27.50575065612793, "global_step": 593305, "epoch": 7148} {"train_loss": -27.652624130249023, "global_step": 593306, "epoch": 7148} {"train_loss": -27.249921798706055, "global_step": 593307, "epoch": 7148} {"train_loss": -27.612884521484375, "global_step": 593308, "epoch": 7148} {"train_loss": -27.334503173828125, "global_step": 593309, "epoch": 7148} {"train_loss": -27.961612701416016, "global_step": 593310, "epoch": 7148} {"train_loss": -27.896728515625, "global_step": 593311, "epoch": 7148} {"train_loss": -27.93836784362793, "global_step": 593312, "epoch": 7148} {"train_loss": -27.646697998046875, "global_step": 593313, "epoch": 7148} {"train_loss": -27.888275146484375, "global_step": 593314, "epoch": 7148} {"train_loss": -27.632272720336914, "global_step": 593315, "epoch": 7148} {"train_loss": -28.102771759033203, "global_step": 593316, "epoch": 7148} {"train_loss": -28.00323486328125, "global_step": 593317, "epoch": 7148} {"train_loss": -27.96628189086914, "global_step": 593318, "epoch": 7148} {"train_loss": -27.794158935546875, "global_step": 593319, "epoch": 7148} {"train_loss": -27.874942779541016, "global_step": 593320, "epoch": 7148} {"train_loss": -27.724939346313477, "global_step": 593321, "epoch": 7148} {"train_loss": -27.810415267944336, "global_step": 593322, "epoch": 7148} {"train_loss": -27.93873405456543, "global_step": 593323, "epoch": 7148} {"train_loss": -28.11686134338379, "global_step": 593324, "epoch": 7148} {"train_loss": -28.1790714263916, "global_step": 593325, "epoch": 7148} {"train_loss": -28.013830184936523, "global_step": 593326, "epoch": 7148} {"train_loss": -28.142826080322266, "global_step": 593327, "epoch": 7148} {"train_loss": -28.102991104125977, "global_step": 593328, "epoch": 7148} {"train_loss": -27.71518325805664, "global_step": 593329, "epoch": 7148} {"train_loss": -28.040945053100586, "global_step": 593330, "epoch": 7148} {"train_loss": -28.15220069885254, "global_step": 593331, "epoch": 7148} {"train_loss": -28.24140739440918, "global_step": 593332, "epoch": 7148} {"train_loss": -27.9881591796875, "global_step": 593333, "epoch": 7148} {"train_loss": -28.437170028686523, "global_step": 593334, "epoch": 7148} {"train_loss": -28.20379066467285, "global_step": 593335, "epoch": 7148} {"train_loss": -28.210067749023438, "global_step": 593336, "epoch": 7148} {"train_loss": -28.304489135742188, "global_step": 593337, "epoch": 7148} {"train_loss": -28.126636505126953, "global_step": 593338, "epoch": 7148} {"train_loss": -28.42169761657715, "global_step": 593339, "epoch": 7148} {"train_loss": -27.801944732666016, "global_step": 593340, "epoch": 7148} {"train_loss": -27.77666664123535, "global_step": 593341, "epoch": 7148} {"train_loss": -28.252683639526367, "global_step": 593342, "epoch": 7148} {"train_loss": -28.611785888671875, "global_step": 593343, "epoch": 7148} {"train_loss": -27.9338436126709, "global_step": 593344, "epoch": 7148} {"train_loss": -28.27400779724121, "global_step": 593345, "epoch": 7148} {"train_loss": -28.220733642578125, "global_step": 593346, "epoch": 7148} {"train_loss": -28.315698623657227, "global_step": 593347, "epoch": 7148} {"train_loss": -27.940088272094727, "global_step": 593348, "epoch": 7148} {"train_loss": -27.893232345581055, "global_step": 593349, "epoch": 7148} {"train_loss": -28.64116859436035, "global_step": 593350, "epoch": 7148} {"train_loss": -27.779132843017578, "global_step": 593351, "epoch": 7148} {"train_loss": -27.817672729492188, "global_step": 593352, "epoch": 7148} {"train_loss": -27.874393463134766, "global_step": 593353, "epoch": 7148} {"train_loss": -28.0155029296875, "global_step": 593354, "epoch": 7148} {"train_loss": -28.16582679748535, "global_step": 593355, "epoch": 7148} {"train_loss": -27.164875030517578, "global_step": 593356, "epoch": 7148} {"train_loss": -27.1585750579834, "global_step": 593357, "epoch": 7148} {"train_loss": -27.310565948486328, "global_step": 593358, "epoch": 7148} {"train_loss": -27.696081161499023, "global_step": 593359, "epoch": 7148} {"train_loss": -27.711523056030273, "global_step": 593360, "epoch": 7148} {"train_loss": -27.7417049407959, "global_step": 593361, "epoch": 7148} {"train_loss": -27.719934463500977, "global_step": 593362, "epoch": 7148} {"train_loss": -27.446765899658203, "global_step": 593363, "epoch": 7148} {"train_loss": -27.902816772460938, "global_step": 593364, "epoch": 7148} {"train_loss": -27.801259994506836, "global_step": 593365, "epoch": 7148} {"train_loss": -27.763869848596045, "global_step": 593366, "epoch": 7148, "val_loss": 6532835.0} {"train_loss": -26.79154396057129, "global_step": 593367, "epoch": 7149} {"train_loss": -26.576337814331055, "global_step": 593368, "epoch": 7149} {"train_loss": -27.213178634643555, "global_step": 593369, "epoch": 7149} {"train_loss": -27.045434951782227, "global_step": 593370, "epoch": 7149} {"train_loss": -27.232839584350586, "global_step": 593371, "epoch": 7149} {"train_loss": -27.320404052734375, "global_step": 593372, "epoch": 7149} {"train_loss": -26.77485466003418, "global_step": 593373, "epoch": 7149} {"train_loss": -27.235187530517578, "global_step": 593374, "epoch": 7149} {"train_loss": -27.19125747680664, "global_step": 593375, "epoch": 7149} {"train_loss": -27.345706939697266, "global_step": 593376, "epoch": 7149} {"train_loss": -27.722341537475586, "global_step": 593377, "epoch": 7149} {"train_loss": -27.49332618713379, "global_step": 593378, "epoch": 7149} {"train_loss": -27.803903579711914, "global_step": 593379, "epoch": 7149} {"train_loss": -27.183740615844727, "global_step": 593380, "epoch": 7149} {"train_loss": -27.6197566986084, "global_step": 593381, "epoch": 7149} {"train_loss": -27.420507431030273, "global_step": 593382, "epoch": 7149} {"train_loss": -27.651962280273438, "global_step": 593383, "epoch": 7149} {"train_loss": -27.689481735229492, "global_step": 593384, "epoch": 7149} {"train_loss": -27.75702476501465, "global_step": 593385, "epoch": 7149} {"train_loss": -27.615808486938477, "global_step": 593386, "epoch": 7149} {"train_loss": -27.486576080322266, "global_step": 593387, "epoch": 7149} {"train_loss": -27.76251792907715, "global_step": 593388, "epoch": 7149} {"train_loss": -27.362289428710938, "global_step": 593389, "epoch": 7149} {"train_loss": -27.98733901977539, "global_step": 593390, "epoch": 7149} {"train_loss": -27.726593017578125, "global_step": 593391, "epoch": 7149} {"train_loss": -27.892704010009766, "global_step": 593392, "epoch": 7149} {"train_loss": -27.43427085876465, "global_step": 593393, "epoch": 7149} {"train_loss": -28.17633628845215, "global_step": 593394, "epoch": 7149} {"train_loss": -27.394086837768555, "global_step": 593395, "epoch": 7149} {"train_loss": -28.06214714050293, "global_step": 593396, "epoch": 7149} {"train_loss": -27.690176010131836, "global_step": 593397, "epoch": 7149} {"train_loss": -27.820459365844727, "global_step": 593398, "epoch": 7149} {"train_loss": -28.00965690612793, "global_step": 593399, "epoch": 7149} {"train_loss": -27.7890682220459, "global_step": 593400, "epoch": 7149} {"train_loss": -27.90662956237793, "global_step": 593401, "epoch": 7149} {"train_loss": -27.95792579650879, "global_step": 593402, "epoch": 7149} {"train_loss": -27.724105834960938, "global_step": 593403, "epoch": 7149} {"train_loss": -27.601612091064453, "global_step": 593404, "epoch": 7149} {"train_loss": -27.8779239654541, "global_step": 593405, "epoch": 7149} {"train_loss": -27.85699462890625, "global_step": 593406, "epoch": 7149} {"train_loss": -27.853870391845703, "global_step": 593407, "epoch": 7149} {"train_loss": -28.102481842041016, "global_step": 593408, "epoch": 7149} {"train_loss": -27.805822372436523, "global_step": 593409, "epoch": 7149} {"train_loss": -28.144269943237305, "global_step": 593410, "epoch": 7149} {"train_loss": -27.988550186157227, "global_step": 593411, "epoch": 7149} {"train_loss": -27.97088050842285, "global_step": 593412, "epoch": 7149} {"train_loss": -27.930633544921875, "global_step": 593413, "epoch": 7149} {"train_loss": -27.697309494018555, "global_step": 593414, "epoch": 7149} {"train_loss": -28.20575523376465, "global_step": 593415, "epoch": 7149} {"train_loss": -28.06585693359375, "global_step": 593416, "epoch": 7149} {"train_loss": -27.974939346313477, "global_step": 593417, "epoch": 7149} {"train_loss": -28.496871948242188, "global_step": 593418, "epoch": 7149} {"train_loss": -27.992111206054688, "global_step": 593419, "epoch": 7149} {"train_loss": -28.358474731445312, "global_step": 593420, "epoch": 7149} {"train_loss": -28.4287109375, "global_step": 593421, "epoch": 7149} {"train_loss": -28.449548721313477, "global_step": 593422, "epoch": 7149} {"train_loss": -28.2122859954834, "global_step": 593423, "epoch": 7149} {"train_loss": -28.356399536132812, "global_step": 593424, "epoch": 7149} {"train_loss": -28.047134399414062, "global_step": 593425, "epoch": 7149} {"train_loss": -27.944433212280273, "global_step": 593426, "epoch": 7149} {"train_loss": -27.94147300720215, "global_step": 593427, "epoch": 7149} {"train_loss": -28.1694278717041, "global_step": 593428, "epoch": 7149} {"train_loss": -28.216272354125977, "global_step": 593429, "epoch": 7149} {"train_loss": -28.462743759155273, "global_step": 593430, "epoch": 7149} {"train_loss": -28.130666732788086, "global_step": 593431, "epoch": 7149} {"train_loss": -28.19471549987793, "global_step": 593432, "epoch": 7149} {"train_loss": -27.9691162109375, "global_step": 593433, "epoch": 7149} {"train_loss": -28.47134780883789, "global_step": 593434, "epoch": 7149} {"train_loss": -27.97870445251465, "global_step": 593435, "epoch": 7149} {"train_loss": -28.10153579711914, "global_step": 593436, "epoch": 7149} {"train_loss": -27.914093017578125, "global_step": 593437, "epoch": 7149} {"train_loss": -27.43291664123535, "global_step": 593438, "epoch": 7149} {"train_loss": -27.097875595092773, "global_step": 593439, "epoch": 7149} {"train_loss": -26.146982192993164, "global_step": 593440, "epoch": 7149} {"train_loss": -25.81744956970215, "global_step": 593441, "epoch": 7149} {"train_loss": -26.546951293945312, "global_step": 593442, "epoch": 7149} {"train_loss": -26.961889266967773, "global_step": 593443, "epoch": 7149} {"train_loss": -27.32269287109375, "global_step": 593444, "epoch": 7149} {"train_loss": -27.76030921936035, "global_step": 593445, "epoch": 7149} {"train_loss": -27.231786727905273, "global_step": 593446, "epoch": 7149} {"train_loss": -27.932865142822266, "global_step": 593447, "epoch": 7149} {"train_loss": -27.696470260620117, "global_step": 593448, "epoch": 7149} {"train_loss": -27.694642928709467, "global_step": 593449, "epoch": 7149, "val_loss": 6635604.0} {"train_loss": -26.84470558166504, "global_step": 593450, "epoch": 7150} {"train_loss": -27.304296493530273, "global_step": 593451, "epoch": 7150} {"train_loss": -26.417760848999023, "global_step": 593452, "epoch": 7150} {"train_loss": -27.244604110717773, "global_step": 593453, "epoch": 7150} {"train_loss": -26.91015625, "global_step": 593454, "epoch": 7150} {"train_loss": -27.272851943969727, "global_step": 593455, "epoch": 7150} {"train_loss": -27.493854522705078, "global_step": 593456, "epoch": 7150} {"train_loss": -27.10443115234375, "global_step": 593457, "epoch": 7150} {"train_loss": -27.265003204345703, "global_step": 593458, "epoch": 7150} {"train_loss": -27.595169067382812, "global_step": 593459, "epoch": 7150} {"train_loss": -27.414203643798828, "global_step": 593460, "epoch": 7150} {"train_loss": -27.094970703125, "global_step": 593461, "epoch": 7150} {"train_loss": -27.38919448852539, "global_step": 593462, "epoch": 7150} {"train_loss": -27.760908126831055, "global_step": 593463, "epoch": 7150} {"train_loss": -27.459857940673828, "global_step": 593464, "epoch": 7150} {"train_loss": -27.274433135986328, "global_step": 593465, "epoch": 7150} {"train_loss": -27.343402862548828, "global_step": 593466, "epoch": 7150} {"train_loss": -27.447290420532227, "global_step": 593467, "epoch": 7150} {"train_loss": -27.687673568725586, "global_step": 593468, "epoch": 7150} {"train_loss": -27.436359405517578, "global_step": 593469, "epoch": 7150} {"train_loss": -27.5378360748291, "global_step": 593470, "epoch": 7150} {"train_loss": -27.531274795532227, "global_step": 593471, "epoch": 7150} {"train_loss": -27.971576690673828, "global_step": 593472, "epoch": 7150} {"train_loss": -27.624486923217773, "global_step": 593473, "epoch": 7150} {"train_loss": -27.483448028564453, "global_step": 593474, "epoch": 7150} {"train_loss": -27.909454345703125, "global_step": 593475, "epoch": 7150} {"train_loss": -27.37629508972168, "global_step": 593476, "epoch": 7150} {"train_loss": -27.633991241455078, "global_step": 593477, "epoch": 7150} {"train_loss": -28.193500518798828, "global_step": 593478, "epoch": 7150} {"train_loss": -27.654376983642578, "global_step": 593479, "epoch": 7150} {"train_loss": -28.252843856811523, "global_step": 593480, "epoch": 7150} {"train_loss": -27.772186279296875, "global_step": 593481, "epoch": 7150} {"train_loss": -27.873151779174805, "global_step": 593482, "epoch": 7150} {"train_loss": -27.845172882080078, "global_step": 593483, "epoch": 7150} {"train_loss": -27.656723022460938, "global_step": 593484, "epoch": 7150} {"train_loss": -27.832258224487305, "global_step": 593485, "epoch": 7150} {"train_loss": -27.653125762939453, "global_step": 593486, "epoch": 7150} {"train_loss": -28.184301376342773, "global_step": 593487, "epoch": 7150} {"train_loss": -28.272123336791992, "global_step": 593488, "epoch": 7150} {"train_loss": -27.836172103881836, "global_step": 593489, "epoch": 7150} {"train_loss": -27.717254638671875, "global_step": 593490, "epoch": 7150} {"train_loss": -27.808576583862305, "global_step": 593491, "epoch": 7150} {"train_loss": -27.895599365234375, "global_step": 593492, "epoch": 7150} {"train_loss": -27.994916915893555, "global_step": 593493, "epoch": 7150} {"train_loss": -27.726911544799805, "global_step": 593494, "epoch": 7150} {"train_loss": -27.90180778503418, "global_step": 593495, "epoch": 7150} {"train_loss": -28.04615592956543, "global_step": 593496, "epoch": 7150} {"train_loss": -28.05838966369629, "global_step": 593497, "epoch": 7150} {"train_loss": -28.310827255249023, "global_step": 593498, "epoch": 7150} {"train_loss": -28.55496597290039, "global_step": 593499, "epoch": 7150} {"train_loss": -28.368982315063477, "global_step": 593500, "epoch": 7150} {"train_loss": -28.2628116607666, "global_step": 593501, "epoch": 7150} {"train_loss": -28.303815841674805, "global_step": 593502, "epoch": 7150} {"train_loss": -28.071395874023438, "global_step": 593503, "epoch": 7150} {"train_loss": -28.0283260345459, "global_step": 593504, "epoch": 7150} {"train_loss": -28.226871490478516, "global_step": 593505, "epoch": 7150} {"train_loss": -28.141366958618164, "global_step": 593506, "epoch": 7150} {"train_loss": -28.21949577331543, "global_step": 593507, "epoch": 7150} {"train_loss": -27.870929718017578, "global_step": 593508, "epoch": 7150} {"train_loss": -28.448654174804688, "global_step": 593509, "epoch": 7150} {"train_loss": -27.992420196533203, "global_step": 593510, "epoch": 7150} {"train_loss": -28.134885787963867, "global_step": 593511, "epoch": 7150} {"train_loss": -28.278594970703125, "global_step": 593512, "epoch": 7150} {"train_loss": -28.32379150390625, "global_step": 593513, "epoch": 7150} {"train_loss": -28.319013595581055, "global_step": 593514, "epoch": 7150} {"train_loss": -28.090351104736328, "global_step": 593515, "epoch": 7150} {"train_loss": -28.280004501342773, "global_step": 593516, "epoch": 7150} {"train_loss": -28.19536781311035, "global_step": 593517, "epoch": 7150} {"train_loss": -27.84040641784668, "global_step": 593518, "epoch": 7150} {"train_loss": -27.742780685424805, "global_step": 593519, "epoch": 7150} {"train_loss": -27.900747299194336, "global_step": 593520, "epoch": 7150} {"train_loss": -28.364002227783203, "global_step": 593521, "epoch": 7150} {"train_loss": -28.424585342407227, "global_step": 593522, "epoch": 7150} {"train_loss": -28.080886840820312, "global_step": 593523, "epoch": 7150} {"train_loss": -27.714200973510742, "global_step": 593524, "epoch": 7150} {"train_loss": -28.11469078063965, "global_step": 593525, "epoch": 7150} {"train_loss": -28.513654708862305, "global_step": 593526, "epoch": 7150} {"train_loss": -27.553190231323242, "global_step": 593527, "epoch": 7150} {"train_loss": -27.86325454711914, "global_step": 593528, "epoch": 7150} {"train_loss": -27.809385299682617, "global_step": 593529, "epoch": 7150} {"train_loss": -28.556055068969727, "global_step": 593530, "epoch": 7150} {"train_loss": -27.859176635742188, "global_step": 593531, "epoch": 7150} {"train_loss": -27.834361386586384, "global_step": 593532, "epoch": 7150, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6597078.0} {"train_loss": -27.216022491455078, "global_step": 593533, "epoch": 7151} {"train_loss": -26.78461265563965, "global_step": 593534, "epoch": 7151} {"train_loss": -27.175695419311523, "global_step": 593535, "epoch": 7151} {"train_loss": -27.17925453186035, "global_step": 593536, "epoch": 7151} {"train_loss": -27.463525772094727, "global_step": 593537, "epoch": 7151} {"train_loss": -27.73491859436035, "global_step": 593538, "epoch": 7151} {"train_loss": -27.286191940307617, "global_step": 593539, "epoch": 7151} {"train_loss": -27.81296730041504, "global_step": 593540, "epoch": 7151} {"train_loss": -27.751312255859375, "global_step": 593541, "epoch": 7151} {"train_loss": -27.63514518737793, "global_step": 593542, "epoch": 7151} {"train_loss": -27.695240020751953, "global_step": 593543, "epoch": 7151} {"train_loss": -27.883508682250977, "global_step": 593544, "epoch": 7151} {"train_loss": -27.507184982299805, "global_step": 593545, "epoch": 7151} {"train_loss": -27.301422119140625, "global_step": 593546, "epoch": 7151} {"train_loss": -27.8913631439209, "global_step": 593547, "epoch": 7151} {"train_loss": -27.69569206237793, "global_step": 593548, "epoch": 7151} {"train_loss": -27.952728271484375, "global_step": 593549, "epoch": 7151} {"train_loss": -27.537017822265625, "global_step": 593550, "epoch": 7151} {"train_loss": -27.33536720275879, "global_step": 593551, "epoch": 7151} {"train_loss": -27.741804122924805, "global_step": 593552, "epoch": 7151} {"train_loss": -27.64703941345215, "global_step": 593553, "epoch": 7151} {"train_loss": -27.662893295288086, "global_step": 593554, "epoch": 7151} {"train_loss": -27.825632095336914, "global_step": 593555, "epoch": 7151} {"train_loss": -28.011266708374023, "global_step": 593556, "epoch": 7151} {"train_loss": -28.100509643554688, "global_step": 593557, "epoch": 7151} {"train_loss": -27.712804794311523, "global_step": 593558, "epoch": 7151} {"train_loss": -27.92220115661621, "global_step": 593559, "epoch": 7151} {"train_loss": -27.77106285095215, "global_step": 593560, "epoch": 7151} {"train_loss": -28.057373046875, "global_step": 593561, "epoch": 7151} {"train_loss": -28.18534278869629, "global_step": 593562, "epoch": 7151} {"train_loss": -27.660114288330078, "global_step": 593563, "epoch": 7151} {"train_loss": -28.1616268157959, "global_step": 593564, "epoch": 7151} {"train_loss": -28.12003517150879, "global_step": 593565, "epoch": 7151} {"train_loss": -27.77935218811035, "global_step": 593566, "epoch": 7151} {"train_loss": -27.9525089263916, "global_step": 593567, "epoch": 7151} {"train_loss": -28.174610137939453, "global_step": 593568, "epoch": 7151} {"train_loss": -27.971357345581055, "global_step": 593569, "epoch": 7151} {"train_loss": -28.03631019592285, "global_step": 593570, "epoch": 7151} {"train_loss": -27.896947860717773, "global_step": 593571, "epoch": 7151} {"train_loss": -28.211477279663086, "global_step": 593572, "epoch": 7151} {"train_loss": -28.403778076171875, "global_step": 593573, "epoch": 7151} {"train_loss": -28.154647827148438, "global_step": 593574, "epoch": 7151} {"train_loss": -28.2077579498291, "global_step": 593575, "epoch": 7151} {"train_loss": -28.111724853515625, "global_step": 593576, "epoch": 7151} {"train_loss": -28.191450119018555, "global_step": 593577, "epoch": 7151} {"train_loss": -28.2037410736084, "global_step": 593578, "epoch": 7151} {"train_loss": -28.2742919921875, "global_step": 593579, "epoch": 7151} {"train_loss": -27.732955932617188, "global_step": 593580, "epoch": 7151} {"train_loss": -27.836292266845703, "global_step": 593581, "epoch": 7151} {"train_loss": -27.42084312438965, "global_step": 593582, "epoch": 7151} {"train_loss": -28.135656356811523, "global_step": 593583, "epoch": 7151} {"train_loss": -28.41315269470215, "global_step": 593584, "epoch": 7151} {"train_loss": -28.179609298706055, "global_step": 593585, "epoch": 7151} {"train_loss": -27.84848403930664, "global_step": 593586, "epoch": 7151} {"train_loss": -27.955982208251953, "global_step": 593587, "epoch": 7151} {"train_loss": -27.736658096313477, "global_step": 593588, "epoch": 7151} {"train_loss": -28.292633056640625, "global_step": 593589, "epoch": 7151} {"train_loss": -28.02322769165039, "global_step": 593590, "epoch": 7151} {"train_loss": -28.00986099243164, "global_step": 593591, "epoch": 7151} {"train_loss": -28.15838623046875, "global_step": 593592, "epoch": 7151} {"train_loss": -27.597570419311523, "global_step": 593593, "epoch": 7151} {"train_loss": -28.094268798828125, "global_step": 593594, "epoch": 7151} {"train_loss": -27.583698272705078, "global_step": 593595, "epoch": 7151} {"train_loss": -28.024261474609375, "global_step": 593596, "epoch": 7151} {"train_loss": -28.011676788330078, "global_step": 593597, "epoch": 7151} {"train_loss": -28.27680015563965, "global_step": 593598, "epoch": 7151} {"train_loss": -28.137165069580078, "global_step": 593599, "epoch": 7151} {"train_loss": -28.214130401611328, "global_step": 593600, "epoch": 7151} {"train_loss": -28.510950088500977, "global_step": 593601, "epoch": 7151} {"train_loss": -27.762939453125, "global_step": 593602, "epoch": 7151} {"train_loss": -28.005680084228516, "global_step": 593603, "epoch": 7151} {"train_loss": -28.155792236328125, "global_step": 593604, "epoch": 7151} {"train_loss": -28.04831314086914, "global_step": 593605, "epoch": 7151} {"train_loss": -28.260700225830078, "global_step": 593606, "epoch": 7151} {"train_loss": -27.84490394592285, "global_step": 593607, "epoch": 7151} {"train_loss": -28.405075073242188, "global_step": 593608, "epoch": 7151} {"train_loss": -27.970279693603516, "global_step": 593609, "epoch": 7151} {"train_loss": -28.24704360961914, "global_step": 593610, "epoch": 7151} {"train_loss": -28.085718154907227, "global_step": 593611, "epoch": 7151} {"train_loss": -27.78533935546875, "global_step": 593612, "epoch": 7151} {"train_loss": -28.235553741455078, "global_step": 593613, "epoch": 7151} {"train_loss": -27.782302856445312, "global_step": 593614, "epoch": 7151} {"train_loss": -27.893057214208397, "global_step": 593615, "epoch": 7151, "val_loss": 6623721.5} {"train_loss": -27.376651763916016, "global_step": 593616, "epoch": 7152} {"train_loss": -25.7329044342041, "global_step": 593617, "epoch": 7152} {"train_loss": -27.34295082092285, "global_step": 593618, "epoch": 7152} {"train_loss": -26.991392135620117, "global_step": 593619, "epoch": 7152} {"train_loss": -27.26777458190918, "global_step": 593620, "epoch": 7152} {"train_loss": -27.13752555847168, "global_step": 593621, "epoch": 7152} {"train_loss": -27.4429988861084, "global_step": 593622, "epoch": 7152} {"train_loss": -27.452245712280273, "global_step": 593623, "epoch": 7152} {"train_loss": -27.531919479370117, "global_step": 593624, "epoch": 7152} {"train_loss": -27.821699142456055, "global_step": 593625, "epoch": 7152} {"train_loss": -27.666601181030273, "global_step": 593626, "epoch": 7152} {"train_loss": -28.021408081054688, "global_step": 593627, "epoch": 7152} {"train_loss": -27.538888931274414, "global_step": 593628, "epoch": 7152} {"train_loss": -27.890335083007812, "global_step": 593629, "epoch": 7152} {"train_loss": -27.740930557250977, "global_step": 593630, "epoch": 7152} {"train_loss": -27.700550079345703, "global_step": 593631, "epoch": 7152} {"train_loss": -27.28767204284668, "global_step": 593632, "epoch": 7152} {"train_loss": -27.985212326049805, "global_step": 593633, "epoch": 7152} {"train_loss": -27.669668197631836, "global_step": 593634, "epoch": 7152} {"train_loss": -27.602506637573242, "global_step": 593635, "epoch": 7152} {"train_loss": -28.17963981628418, "global_step": 593636, "epoch": 7152} {"train_loss": -27.972625732421875, "global_step": 593637, "epoch": 7152} {"train_loss": -27.91958999633789, "global_step": 593638, "epoch": 7152} {"train_loss": -28.30279541015625, "global_step": 593639, "epoch": 7152} {"train_loss": -27.877899169921875, "global_step": 593640, "epoch": 7152} {"train_loss": -28.159683227539062, "global_step": 593641, "epoch": 7152} {"train_loss": -27.894107818603516, "global_step": 593642, "epoch": 7152} {"train_loss": -28.093473434448242, "global_step": 593643, "epoch": 7152} {"train_loss": -28.133880615234375, "global_step": 593644, "epoch": 7152} {"train_loss": -28.071104049682617, "global_step": 593645, "epoch": 7152} {"train_loss": -28.152135848999023, "global_step": 593646, "epoch": 7152} {"train_loss": -27.818740844726562, "global_step": 593647, "epoch": 7152} {"train_loss": -28.03837013244629, "global_step": 593648, "epoch": 7152} {"train_loss": -28.134748458862305, "global_step": 593649, "epoch": 7152} {"train_loss": -28.073102951049805, "global_step": 593650, "epoch": 7152} {"train_loss": -28.162378311157227, "global_step": 593651, "epoch": 7152} {"train_loss": -28.36380958557129, "global_step": 593652, "epoch": 7152} {"train_loss": -28.144445419311523, "global_step": 593653, "epoch": 7152} {"train_loss": -27.94318199157715, "global_step": 593654, "epoch": 7152} {"train_loss": -28.24030876159668, "global_step": 593655, "epoch": 7152} {"train_loss": -27.982486724853516, "global_step": 593656, "epoch": 7152} {"train_loss": -27.584537506103516, "global_step": 593657, "epoch": 7152} {"train_loss": -27.416173934936523, "global_step": 593658, "epoch": 7152} {"train_loss": -28.029956817626953, "global_step": 593659, "epoch": 7152} {"train_loss": -27.560392379760742, "global_step": 593660, "epoch": 7152} {"train_loss": -27.759119033813477, "global_step": 593661, "epoch": 7152} {"train_loss": -28.06049156188965, "global_step": 593662, "epoch": 7152} {"train_loss": -27.675418853759766, "global_step": 593663, "epoch": 7152} {"train_loss": -28.12872886657715, "global_step": 593664, "epoch": 7152} {"train_loss": -27.772510528564453, "global_step": 593665, "epoch": 7152} {"train_loss": -27.064558029174805, "global_step": 593666, "epoch": 7152} {"train_loss": -26.808446884155273, "global_step": 593667, "epoch": 7152} {"train_loss": -27.523462295532227, "global_step": 593668, "epoch": 7152} {"train_loss": -27.868879318237305, "global_step": 593669, "epoch": 7152} {"train_loss": -27.315357208251953, "global_step": 593670, "epoch": 7152} {"train_loss": -27.7139949798584, "global_step": 593671, "epoch": 7152} {"train_loss": -27.861358642578125, "global_step": 593672, "epoch": 7152} {"train_loss": -27.505918502807617, "global_step": 593673, "epoch": 7152} {"train_loss": -28.141538619995117, "global_step": 593674, "epoch": 7152} {"train_loss": -27.907012939453125, "global_step": 593675, "epoch": 7152} {"train_loss": -27.52631187438965, "global_step": 593676, "epoch": 7152} {"train_loss": -27.673879623413086, "global_step": 593677, "epoch": 7152} {"train_loss": -27.667362213134766, "global_step": 593678, "epoch": 7152} {"train_loss": -27.509326934814453, "global_step": 593679, "epoch": 7152} {"train_loss": -27.7711238861084, "global_step": 593680, "epoch": 7152} {"train_loss": -28.059629440307617, "global_step": 593681, "epoch": 7152} {"train_loss": -27.987796783447266, "global_step": 593682, "epoch": 7152} {"train_loss": -27.902851104736328, "global_step": 593683, "epoch": 7152} {"train_loss": -28.095285415649414, "global_step": 593684, "epoch": 7152} {"train_loss": -28.11224365234375, "global_step": 593685, "epoch": 7152} {"train_loss": -28.05276870727539, "global_step": 593686, "epoch": 7152} {"train_loss": -28.19684410095215, "global_step": 593687, "epoch": 7152} {"train_loss": -28.120603561401367, "global_step": 593688, "epoch": 7152} {"train_loss": -27.891523361206055, "global_step": 593689, "epoch": 7152} {"train_loss": -27.902780532836914, "global_step": 593690, "epoch": 7152} {"train_loss": -28.248876571655273, "global_step": 593691, "epoch": 7152} {"train_loss": -27.926578521728516, "global_step": 593692, "epoch": 7152} {"train_loss": -28.16573143005371, "global_step": 593693, "epoch": 7152} {"train_loss": -28.215925216674805, "global_step": 593694, "epoch": 7152} {"train_loss": -28.236652374267578, "global_step": 593695, "epoch": 7152} {"train_loss": -28.086181640625, "global_step": 593696, "epoch": 7152} {"train_loss": -27.888782501220703, "global_step": 593697, "epoch": 7152} {"train_loss": -27.808052729411298, "global_step": 593698, "epoch": 7152, "val_loss": 6572675.0} {"train_loss": -27.377588272094727, "global_step": 593699, "epoch": 7153} {"train_loss": -27.894865036010742, "global_step": 593700, "epoch": 7153} {"train_loss": -27.60959243774414, "global_step": 593701, "epoch": 7153} {"train_loss": -27.633386611938477, "global_step": 593702, "epoch": 7153} {"train_loss": -27.568256378173828, "global_step": 593703, "epoch": 7153} {"train_loss": -27.553394317626953, "global_step": 593704, "epoch": 7153} {"train_loss": -27.72391128540039, "global_step": 593705, "epoch": 7153} {"train_loss": -26.957990646362305, "global_step": 593706, "epoch": 7153} {"train_loss": -27.5109920501709, "global_step": 593707, "epoch": 7153} {"train_loss": -27.444183349609375, "global_step": 593708, "epoch": 7153} {"train_loss": -27.0672607421875, "global_step": 593709, "epoch": 7153} {"train_loss": -27.583099365234375, "global_step": 593710, "epoch": 7153} {"train_loss": -27.76483154296875, "global_step": 593711, "epoch": 7153} {"train_loss": -27.35422134399414, "global_step": 593712, "epoch": 7153} {"train_loss": -27.856565475463867, "global_step": 593713, "epoch": 7153} {"train_loss": -28.01877784729004, "global_step": 593714, "epoch": 7153} {"train_loss": -27.759429931640625, "global_step": 593715, "epoch": 7153} {"train_loss": -27.67388343811035, "global_step": 593716, "epoch": 7153} {"train_loss": -27.902240753173828, "global_step": 593717, "epoch": 7153} {"train_loss": -27.70796012878418, "global_step": 593718, "epoch": 7153} {"train_loss": -27.77240562438965, "global_step": 593719, "epoch": 7153} {"train_loss": -27.75656509399414, "global_step": 593720, "epoch": 7153} {"train_loss": -28.065824508666992, "global_step": 593721, "epoch": 7153} {"train_loss": -27.985858917236328, "global_step": 593722, "epoch": 7153} {"train_loss": -27.84134864807129, "global_step": 593723, "epoch": 7153} {"train_loss": -28.090576171875, "global_step": 593724, "epoch": 7153} {"train_loss": -27.837329864501953, "global_step": 593725, "epoch": 7153} {"train_loss": -27.492034912109375, "global_step": 593726, "epoch": 7153} {"train_loss": -27.498218536376953, "global_step": 593727, "epoch": 7153} {"train_loss": -27.6270694732666, "global_step": 593728, "epoch": 7153} {"train_loss": -27.917194366455078, "global_step": 593729, "epoch": 7153} {"train_loss": -27.958627700805664, "global_step": 593730, "epoch": 7153} {"train_loss": -27.46002769470215, "global_step": 593731, "epoch": 7153} {"train_loss": -27.6124324798584, "global_step": 593732, "epoch": 7153} {"train_loss": -27.590164184570312, "global_step": 593733, "epoch": 7153} {"train_loss": -27.450519561767578, "global_step": 593734, "epoch": 7153} {"train_loss": -27.58595085144043, "global_step": 593735, "epoch": 7153} {"train_loss": -27.29140281677246, "global_step": 593736, "epoch": 7153} {"train_loss": -28.00269889831543, "global_step": 593737, "epoch": 7153} {"train_loss": -27.81098747253418, "global_step": 593738, "epoch": 7153} {"train_loss": -28.193042755126953, "global_step": 593739, "epoch": 7153} {"train_loss": -27.81805419921875, "global_step": 593740, "epoch": 7153} {"train_loss": -27.79269790649414, "global_step": 593741, "epoch": 7153} {"train_loss": -28.06195068359375, "global_step": 593742, "epoch": 7153} {"train_loss": -27.956823348999023, "global_step": 593743, "epoch": 7153} {"train_loss": -28.1124324798584, "global_step": 593744, "epoch": 7153} {"train_loss": -28.12726402282715, "global_step": 593745, "epoch": 7153} {"train_loss": -27.722105026245117, "global_step": 593746, "epoch": 7153} {"train_loss": -27.889556884765625, "global_step": 593747, "epoch": 7153} {"train_loss": -28.0643310546875, "global_step": 593748, "epoch": 7153} {"train_loss": -27.89288330078125, "global_step": 593749, "epoch": 7153} {"train_loss": -28.322528839111328, "global_step": 593750, "epoch": 7153} {"train_loss": -27.971698760986328, "global_step": 593751, "epoch": 7153} {"train_loss": -28.113901138305664, "global_step": 593752, "epoch": 7153} {"train_loss": -27.5960750579834, "global_step": 593753, "epoch": 7153} {"train_loss": -27.94581413269043, "global_step": 593754, "epoch": 7153} {"train_loss": -28.164398193359375, "global_step": 593755, "epoch": 7153} {"train_loss": -28.008710861206055, "global_step": 593756, "epoch": 7153} {"train_loss": -28.000152587890625, "global_step": 593757, "epoch": 7153} {"train_loss": -27.89580726623535, "global_step": 593758, "epoch": 7153} {"train_loss": -27.851423263549805, "global_step": 593759, "epoch": 7153} {"train_loss": -28.192859649658203, "global_step": 593760, "epoch": 7153} {"train_loss": -27.888410568237305, "global_step": 593761, "epoch": 7153} {"train_loss": -27.905527114868164, "global_step": 593762, "epoch": 7153} {"train_loss": -28.386005401611328, "global_step": 593763, "epoch": 7153} {"train_loss": -28.335351943969727, "global_step": 593764, "epoch": 7153} {"train_loss": -28.188583374023438, "global_step": 593765, "epoch": 7153} {"train_loss": -28.15411949157715, "global_step": 593766, "epoch": 7153} {"train_loss": -28.10442543029785, "global_step": 593767, "epoch": 7153} {"train_loss": -28.282520294189453, "global_step": 593768, "epoch": 7153} {"train_loss": -28.122655868530273, "global_step": 593769, "epoch": 7153} {"train_loss": -28.218122482299805, "global_step": 593770, "epoch": 7153} {"train_loss": -28.194238662719727, "global_step": 593771, "epoch": 7153} {"train_loss": -28.131086349487305, "global_step": 593772, "epoch": 7153} {"train_loss": -28.04949378967285, "global_step": 593773, "epoch": 7153} {"train_loss": -28.556005477905273, "global_step": 593774, "epoch": 7153} {"train_loss": -28.092365264892578, "global_step": 593775, "epoch": 7153} {"train_loss": -28.02969741821289, "global_step": 593776, "epoch": 7153} {"train_loss": -28.490753173828125, "global_step": 593777, "epoch": 7153} {"train_loss": -28.14470863342285, "global_step": 593778, "epoch": 7153} {"train_loss": -28.152921676635742, "global_step": 593779, "epoch": 7153} {"train_loss": -28.27583122253418, "global_step": 593780, "epoch": 7153} {"train_loss": -27.893106391630976, "global_step": 593781, "epoch": 7153, "val_loss": 6581212.0} {"train_loss": -26.278079986572266, "global_step": 593782, "epoch": 7154} {"train_loss": -25.346765518188477, "global_step": 593783, "epoch": 7154} {"train_loss": -26.934553146362305, "global_step": 593784, "epoch": 7154} {"train_loss": -27.536298751831055, "global_step": 593785, "epoch": 7154} {"train_loss": -26.8667049407959, "global_step": 593786, "epoch": 7154} {"train_loss": -27.89044761657715, "global_step": 593787, "epoch": 7154} {"train_loss": -27.019330978393555, "global_step": 593788, "epoch": 7154} {"train_loss": -27.29046630859375, "global_step": 593789, "epoch": 7154} {"train_loss": -27.7977352142334, "global_step": 593790, "epoch": 7154} {"train_loss": -27.553892135620117, "global_step": 593791, "epoch": 7154} {"train_loss": -27.672351837158203, "global_step": 593792, "epoch": 7154} {"train_loss": -27.36467933654785, "global_step": 593793, "epoch": 7154} {"train_loss": -27.535938262939453, "global_step": 593794, "epoch": 7154} {"train_loss": -27.25640296936035, "global_step": 593795, "epoch": 7154} {"train_loss": -27.43242835998535, "global_step": 593796, "epoch": 7154} {"train_loss": -27.17437171936035, "global_step": 593797, "epoch": 7154} {"train_loss": -27.924482345581055, "global_step": 593798, "epoch": 7154} {"train_loss": -27.691360473632812, "global_step": 593799, "epoch": 7154} {"train_loss": -27.957685470581055, "global_step": 593800, "epoch": 7154} {"train_loss": -27.68179702758789, "global_step": 593801, "epoch": 7154} {"train_loss": -27.830732345581055, "global_step": 593802, "epoch": 7154} {"train_loss": -27.586917877197266, "global_step": 593803, "epoch": 7154} {"train_loss": -28.138959884643555, "global_step": 593804, "epoch": 7154} {"train_loss": -27.878202438354492, "global_step": 593805, "epoch": 7154} {"train_loss": -28.157806396484375, "global_step": 593806, "epoch": 7154} {"train_loss": -27.673425674438477, "global_step": 593807, "epoch": 7154} {"train_loss": -28.04886817932129, "global_step": 593808, "epoch": 7154} {"train_loss": -27.843414306640625, "global_step": 593809, "epoch": 7154} {"train_loss": -27.986454010009766, "global_step": 593810, "epoch": 7154} {"train_loss": -27.69270133972168, "global_step": 593811, "epoch": 7154} {"train_loss": -28.002683639526367, "global_step": 593812, "epoch": 7154} {"train_loss": -27.782302856445312, "global_step": 593813, "epoch": 7154} {"train_loss": -27.969715118408203, "global_step": 593814, "epoch": 7154} {"train_loss": -27.77389907836914, "global_step": 593815, "epoch": 7154} {"train_loss": -28.0878849029541, "global_step": 593816, "epoch": 7154} {"train_loss": -28.23273277282715, "global_step": 593817, "epoch": 7154} {"train_loss": -27.793859481811523, "global_step": 593818, "epoch": 7154} {"train_loss": -28.048114776611328, "global_step": 593819, "epoch": 7154} {"train_loss": -27.80179786682129, "global_step": 593820, "epoch": 7154} {"train_loss": -28.13233757019043, "global_step": 593821, "epoch": 7154} {"train_loss": -27.645919799804688, "global_step": 593822, "epoch": 7154} {"train_loss": -27.852697372436523, "global_step": 593823, "epoch": 7154} {"train_loss": -28.1605224609375, "global_step": 593824, "epoch": 7154} {"train_loss": -28.129541397094727, "global_step": 593825, "epoch": 7154} {"train_loss": -28.0018310546875, "global_step": 593826, "epoch": 7154} {"train_loss": -28.56915855407715, "global_step": 593827, "epoch": 7154} {"train_loss": -27.553308486938477, "global_step": 593828, "epoch": 7154} {"train_loss": -27.76813316345215, "global_step": 593829, "epoch": 7154} {"train_loss": -27.767805099487305, "global_step": 593830, "epoch": 7154} {"train_loss": -28.622058868408203, "global_step": 593831, "epoch": 7154} {"train_loss": -28.095056533813477, "global_step": 593832, "epoch": 7154} {"train_loss": -28.115951538085938, "global_step": 593833, "epoch": 7154} {"train_loss": -28.030981063842773, "global_step": 593834, "epoch": 7154} {"train_loss": -28.192127227783203, "global_step": 593835, "epoch": 7154} {"train_loss": -28.098169326782227, "global_step": 593836, "epoch": 7154} {"train_loss": -27.760894775390625, "global_step": 593837, "epoch": 7154} {"train_loss": -27.65956687927246, "global_step": 593838, "epoch": 7154} {"train_loss": -27.8989315032959, "global_step": 593839, "epoch": 7154} {"train_loss": -28.149763107299805, "global_step": 593840, "epoch": 7154} {"train_loss": -28.42559814453125, "global_step": 593841, "epoch": 7154} {"train_loss": -27.767078399658203, "global_step": 593842, "epoch": 7154} {"train_loss": -28.017780303955078, "global_step": 593843, "epoch": 7154} {"train_loss": -27.97903823852539, "global_step": 593844, "epoch": 7154} {"train_loss": -28.207305908203125, "global_step": 593845, "epoch": 7154} {"train_loss": -27.781173706054688, "global_step": 593846, "epoch": 7154} {"train_loss": -28.351226806640625, "global_step": 593847, "epoch": 7154} {"train_loss": -27.796875, "global_step": 593848, "epoch": 7154} {"train_loss": -28.07440185546875, "global_step": 593849, "epoch": 7154} {"train_loss": -28.134435653686523, "global_step": 593850, "epoch": 7154} {"train_loss": -27.953962326049805, "global_step": 593851, "epoch": 7154} {"train_loss": -27.9397029876709, "global_step": 593852, "epoch": 7154} {"train_loss": -28.2263126373291, "global_step": 593853, "epoch": 7154} {"train_loss": -28.233875274658203, "global_step": 593854, "epoch": 7154} {"train_loss": -28.420703887939453, "global_step": 593855, "epoch": 7154} {"train_loss": -28.22394371032715, "global_step": 593856, "epoch": 7154} {"train_loss": -28.360626220703125, "global_step": 593857, "epoch": 7154} {"train_loss": -28.06989097595215, "global_step": 593858, "epoch": 7154} {"train_loss": -28.032819747924805, "global_step": 593859, "epoch": 7154} {"train_loss": -27.980749130249023, "global_step": 593860, "epoch": 7154} {"train_loss": -27.958332061767578, "global_step": 593861, "epoch": 7154} {"train_loss": -28.224714279174805, "global_step": 593862, "epoch": 7154} {"train_loss": -28.154321670532227, "global_step": 593863, "epoch": 7154} {"train_loss": -27.855159299919404, "global_step": 593864, "epoch": 7154, "val_loss": 6615724.0} {"train_loss": -26.728302001953125, "global_step": 593865, "epoch": 7155} {"train_loss": -26.4528865814209, "global_step": 593866, "epoch": 7155} {"train_loss": -26.123260498046875, "global_step": 593867, "epoch": 7155} {"train_loss": -26.64800453186035, "global_step": 593868, "epoch": 7155} {"train_loss": -27.088342666625977, "global_step": 593869, "epoch": 7155} {"train_loss": -26.354963302612305, "global_step": 593870, "epoch": 7155} {"train_loss": -26.792463302612305, "global_step": 593871, "epoch": 7155} {"train_loss": -27.119983673095703, "global_step": 593872, "epoch": 7155} {"train_loss": -26.833816528320312, "global_step": 593873, "epoch": 7155} {"train_loss": -26.8719425201416, "global_step": 593874, "epoch": 7155} {"train_loss": -27.121042251586914, "global_step": 593875, "epoch": 7155} {"train_loss": -27.110065460205078, "global_step": 593876, "epoch": 7155} {"train_loss": -27.052234649658203, "global_step": 593877, "epoch": 7155} {"train_loss": -27.136402130126953, "global_step": 593878, "epoch": 7155} {"train_loss": -27.3955020904541, "global_step": 593879, "epoch": 7155} {"train_loss": -27.036951065063477, "global_step": 593880, "epoch": 7155} {"train_loss": -26.737335205078125, "global_step": 593881, "epoch": 7155} {"train_loss": -27.292539596557617, "global_step": 593882, "epoch": 7155} {"train_loss": -27.551645278930664, "global_step": 593883, "epoch": 7155} {"train_loss": -27.287952423095703, "global_step": 593884, "epoch": 7155} {"train_loss": -27.209075927734375, "global_step": 593885, "epoch": 7155} {"train_loss": -27.4663028717041, "global_step": 593886, "epoch": 7155} {"train_loss": -27.147192001342773, "global_step": 593887, "epoch": 7155} {"train_loss": -27.532453536987305, "global_step": 593888, "epoch": 7155} {"train_loss": -27.527820587158203, "global_step": 593889, "epoch": 7155} {"train_loss": -27.97930908203125, "global_step": 593890, "epoch": 7155} {"train_loss": -27.584386825561523, "global_step": 593891, "epoch": 7155} {"train_loss": -27.617477416992188, "global_step": 593892, "epoch": 7155} {"train_loss": -28.049610137939453, "global_step": 593893, "epoch": 7155} {"train_loss": -27.737350463867188, "global_step": 593894, "epoch": 7155} {"train_loss": -27.72186851501465, "global_step": 593895, "epoch": 7155} {"train_loss": -27.566869735717773, "global_step": 593896, "epoch": 7155} {"train_loss": -27.567956924438477, "global_step": 593897, "epoch": 7155} {"train_loss": -27.655872344970703, "global_step": 593898, "epoch": 7155} {"train_loss": -28.039047241210938, "global_step": 593899, "epoch": 7155} {"train_loss": -28.142919540405273, "global_step": 593900, "epoch": 7155} {"train_loss": -27.407611846923828, "global_step": 593901, "epoch": 7155} {"train_loss": -27.842243194580078, "global_step": 593902, "epoch": 7155} {"train_loss": -28.196014404296875, "global_step": 593903, "epoch": 7155} {"train_loss": -28.07389259338379, "global_step": 593904, "epoch": 7155} {"train_loss": -27.8121280670166, "global_step": 593905, "epoch": 7155} {"train_loss": -27.625391006469727, "global_step": 593906, "epoch": 7155} {"train_loss": -27.859281539916992, "global_step": 593907, "epoch": 7155} {"train_loss": -27.727453231811523, "global_step": 593908, "epoch": 7155} {"train_loss": -28.151525497436523, "global_step": 593909, "epoch": 7155} {"train_loss": -27.94539451599121, "global_step": 593910, "epoch": 7155} {"train_loss": -27.69793128967285, "global_step": 593911, "epoch": 7155} {"train_loss": -28.239606857299805, "global_step": 593912, "epoch": 7155} {"train_loss": -28.20160484313965, "global_step": 593913, "epoch": 7155} {"train_loss": -28.06357192993164, "global_step": 593914, "epoch": 7155} {"train_loss": -28.01313591003418, "global_step": 593915, "epoch": 7155} {"train_loss": -28.08473014831543, "global_step": 593916, "epoch": 7155} {"train_loss": -27.907306671142578, "global_step": 593917, "epoch": 7155} {"train_loss": -28.061115264892578, "global_step": 593918, "epoch": 7155} {"train_loss": -28.147130966186523, "global_step": 593919, "epoch": 7155} {"train_loss": -28.177906036376953, "global_step": 593920, "epoch": 7155} {"train_loss": -27.97673988342285, "global_step": 593921, "epoch": 7155} {"train_loss": -27.994543075561523, "global_step": 593922, "epoch": 7155} {"train_loss": -28.04218101501465, "global_step": 593923, "epoch": 7155} {"train_loss": -28.177356719970703, "global_step": 593924, "epoch": 7155} {"train_loss": -28.005756378173828, "global_step": 593925, "epoch": 7155} {"train_loss": -28.070005416870117, "global_step": 593926, "epoch": 7155} {"train_loss": -27.9219913482666, "global_step": 593927, "epoch": 7155} {"train_loss": -28.179702758789062, "global_step": 593928, "epoch": 7155} {"train_loss": -27.777099609375, "global_step": 593929, "epoch": 7155} {"train_loss": -28.179983139038086, "global_step": 593930, "epoch": 7155} {"train_loss": -27.616125106811523, "global_step": 593931, "epoch": 7155} {"train_loss": -28.502822875976562, "global_step": 593932, "epoch": 7155} {"train_loss": -28.32472038269043, "global_step": 593933, "epoch": 7155} {"train_loss": -28.028905868530273, "global_step": 593934, "epoch": 7155} {"train_loss": -27.850427627563477, "global_step": 593935, "epoch": 7155} {"train_loss": -27.906585693359375, "global_step": 593936, "epoch": 7155} {"train_loss": -28.112497329711914, "global_step": 593937, "epoch": 7155} {"train_loss": -28.16224479675293, "global_step": 593938, "epoch": 7155} {"train_loss": -28.24850845336914, "global_step": 593939, "epoch": 7155} {"train_loss": -27.96038246154785, "global_step": 593940, "epoch": 7155} {"train_loss": -27.598133087158203, "global_step": 593941, "epoch": 7155} {"train_loss": -28.158777236938477, "global_step": 593942, "epoch": 7155} {"train_loss": -28.15681266784668, "global_step": 593943, "epoch": 7155} {"train_loss": -27.970800399780273, "global_step": 593944, "epoch": 7155} {"train_loss": -28.291433334350586, "global_step": 593945, "epoch": 7155} {"train_loss": -27.7327880859375, "global_step": 593946, "epoch": 7155} {"train_loss": -27.680830231632093, "global_step": 593947, "epoch": 7155, "val_loss": 6537789.0} {"train_loss": -27.3254337310791, "global_step": 593948, "epoch": 7156} {"train_loss": -26.351552963256836, "global_step": 593949, "epoch": 7156} {"train_loss": -26.732467651367188, "global_step": 593950, "epoch": 7156} {"train_loss": -27.6488037109375, "global_step": 593951, "epoch": 7156} {"train_loss": -27.308759689331055, "global_step": 593952, "epoch": 7156} {"train_loss": -27.4547176361084, "global_step": 593953, "epoch": 7156} {"train_loss": -27.453723907470703, "global_step": 593954, "epoch": 7156} {"train_loss": -27.542236328125, "global_step": 593955, "epoch": 7156} {"train_loss": -27.380218505859375, "global_step": 593956, "epoch": 7156} {"train_loss": -27.273990631103516, "global_step": 593957, "epoch": 7156} {"train_loss": -27.439605712890625, "global_step": 593958, "epoch": 7156} {"train_loss": -27.579299926757812, "global_step": 593959, "epoch": 7156} {"train_loss": -27.12898826599121, "global_step": 593960, "epoch": 7156} {"train_loss": -27.711639404296875, "global_step": 593961, "epoch": 7156} {"train_loss": -27.83833122253418, "global_step": 593962, "epoch": 7156} {"train_loss": -27.56477165222168, "global_step": 593963, "epoch": 7156} {"train_loss": -27.862165451049805, "global_step": 593964, "epoch": 7156} {"train_loss": -27.74875259399414, "global_step": 593965, "epoch": 7156} {"train_loss": -27.521747589111328, "global_step": 593966, "epoch": 7156} {"train_loss": -27.820480346679688, "global_step": 593967, "epoch": 7156} {"train_loss": -27.104761123657227, "global_step": 593968, "epoch": 7156} {"train_loss": -27.674123764038086, "global_step": 593969, "epoch": 7156} {"train_loss": -27.434228897094727, "global_step": 593970, "epoch": 7156} {"train_loss": -27.538015365600586, "global_step": 593971, "epoch": 7156} {"train_loss": -27.838653564453125, "global_step": 593972, "epoch": 7156} {"train_loss": -27.797529220581055, "global_step": 593973, "epoch": 7156} {"train_loss": -27.916961669921875, "global_step": 593974, "epoch": 7156} {"train_loss": -27.943374633789062, "global_step": 593975, "epoch": 7156} {"train_loss": -27.913375854492188, "global_step": 593976, "epoch": 7156} {"train_loss": -27.881412506103516, "global_step": 593977, "epoch": 7156} {"train_loss": -27.87489128112793, "global_step": 593978, "epoch": 7156} {"train_loss": -28.119159698486328, "global_step": 593979, "epoch": 7156} {"train_loss": -27.511564254760742, "global_step": 593980, "epoch": 7156} {"train_loss": -28.131122589111328, "global_step": 593981, "epoch": 7156} {"train_loss": -27.840356826782227, "global_step": 593982, "epoch": 7156} {"train_loss": -27.8218936920166, "global_step": 593983, "epoch": 7156} {"train_loss": -28.139448165893555, "global_step": 593984, "epoch": 7156} {"train_loss": -28.27619743347168, "global_step": 593985, "epoch": 7156} {"train_loss": -27.59295082092285, "global_step": 593986, "epoch": 7156} {"train_loss": -27.550323486328125, "global_step": 593987, "epoch": 7156} {"train_loss": -27.74365234375, "global_step": 593988, "epoch": 7156} {"train_loss": -27.805908203125, "global_step": 593989, "epoch": 7156} {"train_loss": -28.01321792602539, "global_step": 593990, "epoch": 7156} {"train_loss": -28.553680419921875, "global_step": 593991, "epoch": 7156} {"train_loss": -28.307554244995117, "global_step": 593992, "epoch": 7156} {"train_loss": -28.1955509185791, "global_step": 593993, "epoch": 7156} {"train_loss": -27.894805908203125, "global_step": 593994, "epoch": 7156} {"train_loss": -28.241708755493164, "global_step": 593995, "epoch": 7156} {"train_loss": -28.324689865112305, "global_step": 593996, "epoch": 7156} {"train_loss": -27.71245765686035, "global_step": 593997, "epoch": 7156} {"train_loss": -27.96136474609375, "global_step": 593998, "epoch": 7156} {"train_loss": -27.605268478393555, "global_step": 593999, "epoch": 7156} {"train_loss": -27.347553253173828, "global_step": 594000, "epoch": 7156} {"train_loss": -27.181798934936523, "global_step": 594001, "epoch": 7156} {"train_loss": -27.048786163330078, "global_step": 594002, "epoch": 7156} {"train_loss": -27.82525062561035, "global_step": 594003, "epoch": 7156} {"train_loss": -28.04233741760254, "global_step": 594004, "epoch": 7156} {"train_loss": -27.98870849609375, "global_step": 594005, "epoch": 7156} {"train_loss": -28.4384765625, "global_step": 594006, "epoch": 7156} {"train_loss": -27.950855255126953, "global_step": 594007, "epoch": 7156} {"train_loss": -28.32940101623535, "global_step": 594008, "epoch": 7156} {"train_loss": -27.783857345581055, "global_step": 594009, "epoch": 7156} {"train_loss": -27.896589279174805, "global_step": 594010, "epoch": 7156} {"train_loss": -27.995908737182617, "global_step": 594011, "epoch": 7156} {"train_loss": -27.94021987915039, "global_step": 594012, "epoch": 7156} {"train_loss": -28.0806827545166, "global_step": 594013, "epoch": 7156} {"train_loss": -28.35988426208496, "global_step": 594014, "epoch": 7156} {"train_loss": -28.127851486206055, "global_step": 594015, "epoch": 7156} {"train_loss": -28.289121627807617, "global_step": 594016, "epoch": 7156} {"train_loss": -28.12922477722168, "global_step": 594017, "epoch": 7156} {"train_loss": -27.924707412719727, "global_step": 594018, "epoch": 7156} {"train_loss": -28.0095157623291, "global_step": 594019, "epoch": 7156} {"train_loss": -27.601581573486328, "global_step": 594020, "epoch": 7156} {"train_loss": -28.010107040405273, "global_step": 594021, "epoch": 7156} {"train_loss": -27.664587020874023, "global_step": 594022, "epoch": 7156} {"train_loss": -28.051166534423828, "global_step": 594023, "epoch": 7156} {"train_loss": -28.234180450439453, "global_step": 594024, "epoch": 7156} {"train_loss": -27.943078994750977, "global_step": 594025, "epoch": 7156} {"train_loss": -27.769315719604492, "global_step": 594026, "epoch": 7156} {"train_loss": -27.99553871154785, "global_step": 594027, "epoch": 7156} {"train_loss": -27.558441162109375, "global_step": 594028, "epoch": 7156} {"train_loss": -27.752933502197266, "global_step": 594029, "epoch": 7156} {"train_loss": -27.791621495442218, "global_step": 594030, "epoch": 7156, "val_loss": 6555593.0} {"train_loss": -26.464202880859375, "global_step": 594031, "epoch": 7157} {"train_loss": -25.032949447631836, "global_step": 594032, "epoch": 7157} {"train_loss": -26.133901596069336, "global_step": 594033, "epoch": 7157} {"train_loss": -27.181720733642578, "global_step": 594034, "epoch": 7157} {"train_loss": -26.86887550354004, "global_step": 594035, "epoch": 7157} {"train_loss": -25.865478515625, "global_step": 594036, "epoch": 7157} {"train_loss": -26.716489791870117, "global_step": 594037, "epoch": 7157} {"train_loss": -26.9443302154541, "global_step": 594038, "epoch": 7157} {"train_loss": -27.02350425720215, "global_step": 594039, "epoch": 7157} {"train_loss": -27.38002586364746, "global_step": 594040, "epoch": 7157} {"train_loss": -27.207294464111328, "global_step": 594041, "epoch": 7157} {"train_loss": -27.22324562072754, "global_step": 594042, "epoch": 7157} {"train_loss": -27.26999855041504, "global_step": 594043, "epoch": 7157} {"train_loss": -27.190717697143555, "global_step": 594044, "epoch": 7157} {"train_loss": -27.39082145690918, "global_step": 594045, "epoch": 7157} {"train_loss": -27.072179794311523, "global_step": 594046, "epoch": 7157} {"train_loss": -27.030065536499023, "global_step": 594047, "epoch": 7157} {"train_loss": -27.54969596862793, "global_step": 594048, "epoch": 7157} {"train_loss": -27.263111114501953, "global_step": 594049, "epoch": 7157} {"train_loss": -27.447433471679688, "global_step": 594050, "epoch": 7157} {"train_loss": -27.452457427978516, "global_step": 594051, "epoch": 7157} {"train_loss": -27.77032470703125, "global_step": 594052, "epoch": 7157} {"train_loss": -27.28858757019043, "global_step": 594053, "epoch": 7157} {"train_loss": -27.49004554748535, "global_step": 594054, "epoch": 7157} {"train_loss": -27.476016998291016, "global_step": 594055, "epoch": 7157} {"train_loss": -27.75459098815918, "global_step": 594056, "epoch": 7157} {"train_loss": -27.514514923095703, "global_step": 594057, "epoch": 7157} {"train_loss": -27.595178604125977, "global_step": 594058, "epoch": 7157} {"train_loss": -27.607013702392578, "global_step": 594059, "epoch": 7157} {"train_loss": -27.790287017822266, "global_step": 594060, "epoch": 7157} {"train_loss": -27.727773666381836, "global_step": 594061, "epoch": 7157} {"train_loss": -27.6219482421875, "global_step": 594062, "epoch": 7157} {"train_loss": -27.75465965270996, "global_step": 594063, "epoch": 7157} {"train_loss": -27.986114501953125, "global_step": 594064, "epoch": 7157} {"train_loss": -27.960229873657227, "global_step": 594065, "epoch": 7157} {"train_loss": -27.661787033081055, "global_step": 594066, "epoch": 7157} {"train_loss": -27.795379638671875, "global_step": 594067, "epoch": 7157} {"train_loss": -28.063583374023438, "global_step": 594068, "epoch": 7157} {"train_loss": -27.6758975982666, "global_step": 594069, "epoch": 7157} {"train_loss": -27.9542293548584, "global_step": 594070, "epoch": 7157} {"train_loss": -28.03801918029785, "global_step": 594071, "epoch": 7157} {"train_loss": -28.288244247436523, "global_step": 594072, "epoch": 7157} {"train_loss": -28.071842193603516, "global_step": 594073, "epoch": 7157} {"train_loss": -27.96453285217285, "global_step": 594074, "epoch": 7157} {"train_loss": -28.029388427734375, "global_step": 594075, "epoch": 7157} {"train_loss": -27.97625732421875, "global_step": 594076, "epoch": 7157} {"train_loss": -28.1021671295166, "global_step": 594077, "epoch": 7157} {"train_loss": -28.315847396850586, "global_step": 594078, "epoch": 7157} {"train_loss": -28.02227783203125, "global_step": 594079, "epoch": 7157} {"train_loss": -28.254968643188477, "global_step": 594080, "epoch": 7157} {"train_loss": -27.86342430114746, "global_step": 594081, "epoch": 7157} {"train_loss": -28.17416763305664, "global_step": 594082, "epoch": 7157} {"train_loss": -28.152999877929688, "global_step": 594083, "epoch": 7157} {"train_loss": -28.256696701049805, "global_step": 594084, "epoch": 7157} {"train_loss": -27.735031127929688, "global_step": 594085, "epoch": 7157} {"train_loss": -27.899444580078125, "global_step": 594086, "epoch": 7157} {"train_loss": -28.243661880493164, "global_step": 594087, "epoch": 7157} {"train_loss": -28.037216186523438, "global_step": 594088, "epoch": 7157} {"train_loss": -28.308279037475586, "global_step": 594089, "epoch": 7157} {"train_loss": -28.2009220123291, "global_step": 594090, "epoch": 7157} {"train_loss": -28.106220245361328, "global_step": 594091, "epoch": 7157} {"train_loss": -28.232833862304688, "global_step": 594092, "epoch": 7157} {"train_loss": -28.20002555847168, "global_step": 594093, "epoch": 7157} {"train_loss": -28.41777992248535, "global_step": 594094, "epoch": 7157} {"train_loss": -28.37298011779785, "global_step": 594095, "epoch": 7157} {"train_loss": -28.167327880859375, "global_step": 594096, "epoch": 7157} {"train_loss": -27.962970733642578, "global_step": 594097, "epoch": 7157} {"train_loss": -28.26202392578125, "global_step": 594098, "epoch": 7157} {"train_loss": -28.181257247924805, "global_step": 594099, "epoch": 7157} {"train_loss": -28.3646297454834, "global_step": 594100, "epoch": 7157} {"train_loss": -28.46878433227539, "global_step": 594101, "epoch": 7157} {"train_loss": -28.267242431640625, "global_step": 594102, "epoch": 7157} {"train_loss": -28.29719352722168, "global_step": 594103, "epoch": 7157} {"train_loss": -27.541852951049805, "global_step": 594104, "epoch": 7157} {"train_loss": -27.96820068359375, "global_step": 594105, "epoch": 7157} {"train_loss": -27.785236358642578, "global_step": 594106, "epoch": 7157} {"train_loss": -27.63557243347168, "global_step": 594107, "epoch": 7157} {"train_loss": -27.983612060546875, "global_step": 594108, "epoch": 7157} {"train_loss": -27.979455947875977, "global_step": 594109, "epoch": 7157} {"train_loss": -28.3963565826416, "global_step": 594110, "epoch": 7157} {"train_loss": -27.695037841796875, "global_step": 594111, "epoch": 7157} {"train_loss": -27.82440185546875, "global_step": 594112, "epoch": 7157} {"train_loss": -27.725080926734282, "global_step": 594113, "epoch": 7157, "val_loss": 6583514.0} {"train_loss": -27.479822158813477, "global_step": 594114, "epoch": 7158} {"train_loss": -26.302398681640625, "global_step": 594115, "epoch": 7158} {"train_loss": -26.84564781188965, "global_step": 594116, "epoch": 7158} {"train_loss": -26.586851119995117, "global_step": 594117, "epoch": 7158} {"train_loss": -26.20981216430664, "global_step": 594118, "epoch": 7158} {"train_loss": -27.418867111206055, "global_step": 594119, "epoch": 7158} {"train_loss": -26.532581329345703, "global_step": 594120, "epoch": 7158} {"train_loss": -26.81597900390625, "global_step": 594121, "epoch": 7158} {"train_loss": -27.248971939086914, "global_step": 594122, "epoch": 7158} {"train_loss": -27.476776123046875, "global_step": 594123, "epoch": 7158} {"train_loss": -26.720417022705078, "global_step": 594124, "epoch": 7158} {"train_loss": -26.88929557800293, "global_step": 594125, "epoch": 7158} {"train_loss": -27.83363914489746, "global_step": 594126, "epoch": 7158} {"train_loss": -26.96424674987793, "global_step": 594127, "epoch": 7158} {"train_loss": -27.2647647857666, "global_step": 594128, "epoch": 7158} {"train_loss": -27.154510498046875, "global_step": 594129, "epoch": 7158} {"train_loss": -27.312707901000977, "global_step": 594130, "epoch": 7158} {"train_loss": -27.423614501953125, "global_step": 594131, "epoch": 7158} {"train_loss": -27.01924705505371, "global_step": 594132, "epoch": 7158} {"train_loss": -27.5001220703125, "global_step": 594133, "epoch": 7158} {"train_loss": -27.522192001342773, "global_step": 594134, "epoch": 7158} {"train_loss": -27.48940086364746, "global_step": 594135, "epoch": 7158} {"train_loss": -27.206226348876953, "global_step": 594136, "epoch": 7158} {"train_loss": -27.656946182250977, "global_step": 594137, "epoch": 7158} {"train_loss": -27.763280868530273, "global_step": 594138, "epoch": 7158} {"train_loss": -27.542028427124023, "global_step": 594139, "epoch": 7158} {"train_loss": -27.820556640625, "global_step": 594140, "epoch": 7158} {"train_loss": -27.673566818237305, "global_step": 594141, "epoch": 7158} {"train_loss": -28.034093856811523, "global_step": 594142, "epoch": 7158} {"train_loss": -27.421091079711914, "global_step": 594143, "epoch": 7158} {"train_loss": -27.845645904541016, "global_step": 594144, "epoch": 7158} {"train_loss": -27.998443603515625, "global_step": 594145, "epoch": 7158} {"train_loss": -27.7937068939209, "global_step": 594146, "epoch": 7158} {"train_loss": -27.840978622436523, "global_step": 594147, "epoch": 7158} {"train_loss": -27.662073135375977, "global_step": 594148, "epoch": 7158} {"train_loss": -28.1164493560791, "global_step": 594149, "epoch": 7158} {"train_loss": -27.799823760986328, "global_step": 594150, "epoch": 7158} {"train_loss": -28.188709259033203, "global_step": 594151, "epoch": 7158} {"train_loss": -27.774633407592773, "global_step": 594152, "epoch": 7158} {"train_loss": -27.46539878845215, "global_step": 594153, "epoch": 7158} {"train_loss": -27.994985580444336, "global_step": 594154, "epoch": 7158} {"train_loss": -28.1529541015625, "global_step": 594155, "epoch": 7158} {"train_loss": -27.9904842376709, "global_step": 594156, "epoch": 7158} {"train_loss": -27.70535659790039, "global_step": 594157, "epoch": 7158} {"train_loss": -28.134984970092773, "global_step": 594158, "epoch": 7158} {"train_loss": -28.086170196533203, "global_step": 594159, "epoch": 7158} {"train_loss": -28.17408561706543, "global_step": 594160, "epoch": 7158} {"train_loss": -28.345060348510742, "global_step": 594161, "epoch": 7158} {"train_loss": -28.14771842956543, "global_step": 594162, "epoch": 7158} {"train_loss": -28.109882354736328, "global_step": 594163, "epoch": 7158} {"train_loss": -28.370471954345703, "global_step": 594164, "epoch": 7158} {"train_loss": -28.354639053344727, "global_step": 594165, "epoch": 7158} {"train_loss": -28.3161563873291, "global_step": 594166, "epoch": 7158} {"train_loss": -28.150985717773438, "global_step": 594167, "epoch": 7158} {"train_loss": -28.383543014526367, "global_step": 594168, "epoch": 7158} {"train_loss": -28.138641357421875, "global_step": 594169, "epoch": 7158} {"train_loss": -28.75331687927246, "global_step": 594170, "epoch": 7158} {"train_loss": -28.048856735229492, "global_step": 594171, "epoch": 7158} {"train_loss": -28.188810348510742, "global_step": 594172, "epoch": 7158} {"train_loss": -28.323749542236328, "global_step": 594173, "epoch": 7158} {"train_loss": -28.0339412689209, "global_step": 594174, "epoch": 7158} {"train_loss": -27.06296157836914, "global_step": 594175, "epoch": 7158} {"train_loss": -25.684955596923828, "global_step": 594176, "epoch": 7158} {"train_loss": -25.029577255249023, "global_step": 594177, "epoch": 7158} {"train_loss": -27.76409339904785, "global_step": 594178, "epoch": 7158} {"train_loss": -26.79898452758789, "global_step": 594179, "epoch": 7158} {"train_loss": -27.382129669189453, "global_step": 594180, "epoch": 7158} {"train_loss": -27.095975875854492, "global_step": 594181, "epoch": 7158} {"train_loss": -27.77485466003418, "global_step": 594182, "epoch": 7158} {"train_loss": -27.333703994750977, "global_step": 594183, "epoch": 7158} {"train_loss": -27.728742599487305, "global_step": 594184, "epoch": 7158} {"train_loss": -27.67171287536621, "global_step": 594185, "epoch": 7158} {"train_loss": -27.412572860717773, "global_step": 594186, "epoch": 7158} {"train_loss": -27.247238159179688, "global_step": 594187, "epoch": 7158} {"train_loss": -27.678571701049805, "global_step": 594188, "epoch": 7158} {"train_loss": -27.5781307220459, "global_step": 594189, "epoch": 7158} {"train_loss": -27.781545639038086, "global_step": 594190, "epoch": 7158} {"train_loss": -27.432653427124023, "global_step": 594191, "epoch": 7158} {"train_loss": -27.56601333618164, "global_step": 594192, "epoch": 7158} {"train_loss": -27.074298858642578, "global_step": 594193, "epoch": 7158} {"train_loss": -27.68015480041504, "global_step": 594194, "epoch": 7158} {"train_loss": -27.8520565032959, "global_step": 594195, "epoch": 7158} {"train_loss": -27.545158639011614, "global_step": 594196, "epoch": 7158, "val_loss": 6586478.0} {"train_loss": -27.256488800048828, "global_step": 594197, "epoch": 7159} {"train_loss": -26.97900390625, "global_step": 594198, "epoch": 7159} {"train_loss": -27.37175941467285, "global_step": 594199, "epoch": 7159} {"train_loss": -27.342395782470703, "global_step": 594200, "epoch": 7159} {"train_loss": -27.125732421875, "global_step": 594201, "epoch": 7159} {"train_loss": -27.030048370361328, "global_step": 594202, "epoch": 7159} {"train_loss": -27.541629791259766, "global_step": 594203, "epoch": 7159} {"train_loss": -26.685407638549805, "global_step": 594204, "epoch": 7159} {"train_loss": -27.589078903198242, "global_step": 594205, "epoch": 7159} {"train_loss": -27.168155670166016, "global_step": 594206, "epoch": 7159} {"train_loss": -27.592609405517578, "global_step": 594207, "epoch": 7159} {"train_loss": -27.61376953125, "global_step": 594208, "epoch": 7159} {"train_loss": -26.83831214904785, "global_step": 594209, "epoch": 7159} {"train_loss": -27.306623458862305, "global_step": 594210, "epoch": 7159} {"train_loss": -27.624059677124023, "global_step": 594211, "epoch": 7159} {"train_loss": -27.622350692749023, "global_step": 594212, "epoch": 7159} {"train_loss": -27.4826602935791, "global_step": 594213, "epoch": 7159} {"train_loss": -27.85177993774414, "global_step": 594214, "epoch": 7159} {"train_loss": -27.75330924987793, "global_step": 594215, "epoch": 7159} {"train_loss": -27.895822525024414, "global_step": 594216, "epoch": 7159} {"train_loss": -27.764789581298828, "global_step": 594217, "epoch": 7159} {"train_loss": -27.719770431518555, "global_step": 594218, "epoch": 7159} {"train_loss": -27.743154525756836, "global_step": 594219, "epoch": 7159} {"train_loss": -27.750354766845703, "global_step": 594220, "epoch": 7159} {"train_loss": -27.53073501586914, "global_step": 594221, "epoch": 7159} {"train_loss": -27.706424713134766, "global_step": 594222, "epoch": 7159} {"train_loss": -27.70292091369629, "global_step": 594223, "epoch": 7159} {"train_loss": -28.030017852783203, "global_step": 594224, "epoch": 7159} {"train_loss": -27.797321319580078, "global_step": 594225, "epoch": 7159} {"train_loss": -27.883991241455078, "global_step": 594226, "epoch": 7159} {"train_loss": -27.767745971679688, "global_step": 594227, "epoch": 7159} {"train_loss": -28.042455673217773, "global_step": 594228, "epoch": 7159} {"train_loss": -28.153247833251953, "global_step": 594229, "epoch": 7159} {"train_loss": -27.716394424438477, "global_step": 594230, "epoch": 7159} {"train_loss": -28.010156631469727, "global_step": 594231, "epoch": 7159} {"train_loss": -28.09377098083496, "global_step": 594232, "epoch": 7159} {"train_loss": -28.051034927368164, "global_step": 594233, "epoch": 7159} {"train_loss": -28.078489303588867, "global_step": 594234, "epoch": 7159} {"train_loss": -28.200580596923828, "global_step": 594235, "epoch": 7159} {"train_loss": -28.054555892944336, "global_step": 594236, "epoch": 7159} {"train_loss": -27.897062301635742, "global_step": 594237, "epoch": 7159} {"train_loss": -27.95916748046875, "global_step": 594238, "epoch": 7159} {"train_loss": -28.212491989135742, "global_step": 594239, "epoch": 7159} {"train_loss": -28.16016960144043, "global_step": 594240, "epoch": 7159} {"train_loss": -28.011474609375, "global_step": 594241, "epoch": 7159} {"train_loss": -28.190465927124023, "global_step": 594242, "epoch": 7159} {"train_loss": -28.15703773498535, "global_step": 594243, "epoch": 7159} {"train_loss": -28.21443748474121, "global_step": 594244, "epoch": 7159} {"train_loss": -27.952743530273438, "global_step": 594245, "epoch": 7159} {"train_loss": -28.207067489624023, "global_step": 594246, "epoch": 7159} {"train_loss": -28.042749404907227, "global_step": 594247, "epoch": 7159} {"train_loss": -28.244678497314453, "global_step": 594248, "epoch": 7159} {"train_loss": -28.12420082092285, "global_step": 594249, "epoch": 7159} {"train_loss": -28.269697189331055, "global_step": 594250, "epoch": 7159} {"train_loss": -28.3031005859375, "global_step": 594251, "epoch": 7159} {"train_loss": -27.833728790283203, "global_step": 594252, "epoch": 7159} {"train_loss": -27.929960250854492, "global_step": 594253, "epoch": 7159} {"train_loss": -28.181039810180664, "global_step": 594254, "epoch": 7159} {"train_loss": -28.34467887878418, "global_step": 594255, "epoch": 7159} {"train_loss": -28.51006507873535, "global_step": 594256, "epoch": 7159} {"train_loss": -27.9940185546875, "global_step": 594257, "epoch": 7159} {"train_loss": -28.5330810546875, "global_step": 594258, "epoch": 7159} {"train_loss": -28.427419662475586, "global_step": 594259, "epoch": 7159} {"train_loss": -28.27814292907715, "global_step": 594260, "epoch": 7159} {"train_loss": -27.956750869750977, "global_step": 594261, "epoch": 7159} {"train_loss": -28.365802764892578, "global_step": 594262, "epoch": 7159} {"train_loss": -27.90765380859375, "global_step": 594263, "epoch": 7159} {"train_loss": -27.779279708862305, "global_step": 594264, "epoch": 7159} {"train_loss": -27.510339736938477, "global_step": 594265, "epoch": 7159} {"train_loss": -26.21998405456543, "global_step": 594266, "epoch": 7159} {"train_loss": -26.050338745117188, "global_step": 594267, "epoch": 7159} {"train_loss": -26.880895614624023, "global_step": 594268, "epoch": 7159} {"train_loss": -27.871265411376953, "global_step": 594269, "epoch": 7159} {"train_loss": -27.414093017578125, "global_step": 594270, "epoch": 7159} {"train_loss": -27.780759811401367, "global_step": 594271, "epoch": 7159} {"train_loss": -27.38775062561035, "global_step": 594272, "epoch": 7159} {"train_loss": -26.944807052612305, "global_step": 594273, "epoch": 7159} {"train_loss": -26.923599243164062, "global_step": 594274, "epoch": 7159} {"train_loss": -27.449674606323242, "global_step": 594275, "epoch": 7159} {"train_loss": -27.704944610595703, "global_step": 594276, "epoch": 7159} {"train_loss": -27.33411979675293, "global_step": 594277, "epoch": 7159} {"train_loss": -26.9802188873291, "global_step": 594278, "epoch": 7159} {"train_loss": -27.740224263754236, "global_step": 594279, "epoch": 7159, "val_loss": 6561202.5} {"train_loss": -26.49920654296875, "global_step": 594280, "epoch": 7160} {"train_loss": -26.248249053955078, "global_step": 594281, "epoch": 7160} {"train_loss": -26.442285537719727, "global_step": 594282, "epoch": 7160} {"train_loss": -27.063474655151367, "global_step": 594283, "epoch": 7160} {"train_loss": -26.529016494750977, "global_step": 594284, "epoch": 7160} {"train_loss": -26.51462173461914, "global_step": 594285, "epoch": 7160} {"train_loss": -26.32557487487793, "global_step": 594286, "epoch": 7160} {"train_loss": -26.96548843383789, "global_step": 594287, "epoch": 7160} {"train_loss": -26.737573623657227, "global_step": 594288, "epoch": 7160} {"train_loss": -27.108800888061523, "global_step": 594289, "epoch": 7160} {"train_loss": -26.94662857055664, "global_step": 594290, "epoch": 7160} {"train_loss": -26.785175323486328, "global_step": 594291, "epoch": 7160} {"train_loss": -27.116506576538086, "global_step": 594292, "epoch": 7160} {"train_loss": -27.187353134155273, "global_step": 594293, "epoch": 7160} {"train_loss": -26.97879981994629, "global_step": 594294, "epoch": 7160} {"train_loss": -27.034452438354492, "global_step": 594295, "epoch": 7160} {"train_loss": -27.3287353515625, "global_step": 594296, "epoch": 7160} {"train_loss": -27.203739166259766, "global_step": 594297, "epoch": 7160} {"train_loss": -27.227741241455078, "global_step": 594298, "epoch": 7160} {"train_loss": -27.48956298828125, "global_step": 594299, "epoch": 7160} {"train_loss": -27.504236221313477, "global_step": 594300, "epoch": 7160} {"train_loss": -27.48969841003418, "global_step": 594301, "epoch": 7160} {"train_loss": -27.37322998046875, "global_step": 594302, "epoch": 7160} {"train_loss": -27.509963989257812, "global_step": 594303, "epoch": 7160} {"train_loss": -27.40869140625, "global_step": 594304, "epoch": 7160} {"train_loss": -27.291217803955078, "global_step": 594305, "epoch": 7160} {"train_loss": -27.79743003845215, "global_step": 594306, "epoch": 7160} {"train_loss": -27.74676513671875, "global_step": 594307, "epoch": 7160} {"train_loss": -27.908185958862305, "global_step": 594308, "epoch": 7160} {"train_loss": -27.944660186767578, "global_step": 594309, "epoch": 7160} {"train_loss": -27.83820152282715, "global_step": 594310, "epoch": 7160} {"train_loss": -27.56806755065918, "global_step": 594311, "epoch": 7160} {"train_loss": -27.666772842407227, "global_step": 594312, "epoch": 7160} {"train_loss": -27.861448287963867, "global_step": 594313, "epoch": 7160} {"train_loss": -27.8171443939209, "global_step": 594314, "epoch": 7160} {"train_loss": -28.081640243530273, "global_step": 594315, "epoch": 7160} {"train_loss": -27.925729751586914, "global_step": 594316, "epoch": 7160} {"train_loss": -28.059141159057617, "global_step": 594317, "epoch": 7160} {"train_loss": -27.658451080322266, "global_step": 594318, "epoch": 7160} {"train_loss": -27.925363540649414, "global_step": 594319, "epoch": 7160} {"train_loss": -27.86665153503418, "global_step": 594320, "epoch": 7160} {"train_loss": -28.526269912719727, "global_step": 594321, "epoch": 7160} {"train_loss": -27.838117599487305, "global_step": 594322, "epoch": 7160} {"train_loss": -28.016767501831055, "global_step": 594323, "epoch": 7160} {"train_loss": -27.83124351501465, "global_step": 594324, "epoch": 7160} {"train_loss": -27.981470108032227, "global_step": 594325, "epoch": 7160} {"train_loss": -28.100910186767578, "global_step": 594326, "epoch": 7160} {"train_loss": -28.362096786499023, "global_step": 594327, "epoch": 7160} {"train_loss": -28.110654830932617, "global_step": 594328, "epoch": 7160} {"train_loss": -28.05228042602539, "global_step": 594329, "epoch": 7160} {"train_loss": -28.02788734436035, "global_step": 594330, "epoch": 7160} {"train_loss": -27.979475021362305, "global_step": 594331, "epoch": 7160} {"train_loss": -27.889936447143555, "global_step": 594332, "epoch": 7160} {"train_loss": -28.11048698425293, "global_step": 594333, "epoch": 7160} {"train_loss": -27.961545944213867, "global_step": 594334, "epoch": 7160} {"train_loss": -28.018091201782227, "global_step": 594335, "epoch": 7160} {"train_loss": -28.378286361694336, "global_step": 594336, "epoch": 7160} {"train_loss": -27.72919273376465, "global_step": 594337, "epoch": 7160} {"train_loss": -28.127521514892578, "global_step": 594338, "epoch": 7160} {"train_loss": -28.21625328063965, "global_step": 594339, "epoch": 7160} {"train_loss": -28.277206420898438, "global_step": 594340, "epoch": 7160} {"train_loss": -28.24384880065918, "global_step": 594341, "epoch": 7160} {"train_loss": -28.263214111328125, "global_step": 594342, "epoch": 7160} {"train_loss": -28.205154418945312, "global_step": 594343, "epoch": 7160} {"train_loss": -28.136383056640625, "global_step": 594344, "epoch": 7160} {"train_loss": -27.99139404296875, "global_step": 594345, "epoch": 7160} {"train_loss": -28.777463912963867, "global_step": 594346, "epoch": 7160} {"train_loss": -27.945053100585938, "global_step": 594347, "epoch": 7160} {"train_loss": -28.220914840698242, "global_step": 594348, "epoch": 7160} {"train_loss": -28.000883102416992, "global_step": 594349, "epoch": 7160} {"train_loss": -28.24440574645996, "global_step": 594350, "epoch": 7160} {"train_loss": -28.076709747314453, "global_step": 594351, "epoch": 7160} {"train_loss": -27.884571075439453, "global_step": 594352, "epoch": 7160} {"train_loss": -27.941335678100586, "global_step": 594353, "epoch": 7160} {"train_loss": -27.936603546142578, "global_step": 594354, "epoch": 7160} {"train_loss": -28.030134201049805, "global_step": 594355, "epoch": 7160} {"train_loss": -28.287601470947266, "global_step": 594356, "epoch": 7160} {"train_loss": -27.50274085998535, "global_step": 594357, "epoch": 7160} {"train_loss": -27.603961944580078, "global_step": 594358, "epoch": 7160} {"train_loss": -27.64947509765625, "global_step": 594359, "epoch": 7160} {"train_loss": -27.964094161987305, "global_step": 594360, "epoch": 7160} {"train_loss": -27.85980224609375, "global_step": 594361, "epoch": 7160} {"train_loss": -27.678225459822688, "global_step": 594362, "epoch": 7160, "val_loss": 6610534.0} {"train_loss": -27.516141891479492, "global_step": 594363, "epoch": 7161} {"train_loss": -26.5288028717041, "global_step": 594364, "epoch": 7161} {"train_loss": -26.898944854736328, "global_step": 594365, "epoch": 7161} {"train_loss": -27.28232765197754, "global_step": 594366, "epoch": 7161} {"train_loss": -27.0341854095459, "global_step": 594367, "epoch": 7161} {"train_loss": -27.039098739624023, "global_step": 594368, "epoch": 7161} {"train_loss": -26.82815933227539, "global_step": 594369, "epoch": 7161} {"train_loss": -27.1241512298584, "global_step": 594370, "epoch": 7161} {"train_loss": -27.3891544342041, "global_step": 594371, "epoch": 7161} {"train_loss": -27.208845138549805, "global_step": 594372, "epoch": 7161} {"train_loss": -26.776123046875, "global_step": 594373, "epoch": 7161} {"train_loss": -27.14615249633789, "global_step": 594374, "epoch": 7161} {"train_loss": -27.01700210571289, "global_step": 594375, "epoch": 7161} {"train_loss": -26.965167999267578, "global_step": 594376, "epoch": 7161} {"train_loss": -26.938827514648438, "global_step": 594377, "epoch": 7161} {"train_loss": -27.865278244018555, "global_step": 594378, "epoch": 7161} {"train_loss": -26.96455192565918, "global_step": 594379, "epoch": 7161} {"train_loss": -24.73891830444336, "global_step": 594380, "epoch": 7161} {"train_loss": -27.31056785583496, "global_step": 594381, "epoch": 7161} {"train_loss": -27.092517852783203, "global_step": 594382, "epoch": 7161} {"train_loss": -27.58795738220215, "global_step": 594383, "epoch": 7161} {"train_loss": -27.080102920532227, "global_step": 594384, "epoch": 7161} {"train_loss": -27.14387321472168, "global_step": 594385, "epoch": 7161} {"train_loss": -27.282516479492188, "global_step": 594386, "epoch": 7161} {"train_loss": -27.524335861206055, "global_step": 594387, "epoch": 7161} {"train_loss": -27.617773056030273, "global_step": 594388, "epoch": 7161} {"train_loss": -27.34589958190918, "global_step": 594389, "epoch": 7161} {"train_loss": -27.5295467376709, "global_step": 594390, "epoch": 7161} {"train_loss": -27.33160400390625, "global_step": 594391, "epoch": 7161} {"train_loss": -27.73435401916504, "global_step": 594392, "epoch": 7161} {"train_loss": -27.566099166870117, "global_step": 594393, "epoch": 7161} {"train_loss": -27.37119483947754, "global_step": 594394, "epoch": 7161} {"train_loss": -27.585248947143555, "global_step": 594395, "epoch": 7161} {"train_loss": -27.3587646484375, "global_step": 594396, "epoch": 7161} {"train_loss": -28.066390991210938, "global_step": 594397, "epoch": 7161} {"train_loss": -27.920068740844727, "global_step": 594398, "epoch": 7161} {"train_loss": -27.37908935546875, "global_step": 594399, "epoch": 7161} {"train_loss": -27.66845703125, "global_step": 594400, "epoch": 7161} {"train_loss": -27.526105880737305, "global_step": 594401, "epoch": 7161} {"train_loss": -28.08253288269043, "global_step": 594402, "epoch": 7161} {"train_loss": -27.69745445251465, "global_step": 594403, "epoch": 7161} {"train_loss": -27.76861000061035, "global_step": 594404, "epoch": 7161} {"train_loss": -28.2969970703125, "global_step": 594405, "epoch": 7161} {"train_loss": -27.957849502563477, "global_step": 594406, "epoch": 7161} {"train_loss": -27.63169288635254, "global_step": 594407, "epoch": 7161} {"train_loss": -28.075098037719727, "global_step": 594408, "epoch": 7161} {"train_loss": -27.839242935180664, "global_step": 594409, "epoch": 7161} {"train_loss": -27.84970474243164, "global_step": 594410, "epoch": 7161} {"train_loss": -28.100332260131836, "global_step": 594411, "epoch": 7161} {"train_loss": -28.183210372924805, "global_step": 594412, "epoch": 7161} {"train_loss": -27.803945541381836, "global_step": 594413, "epoch": 7161} {"train_loss": -27.872333526611328, "global_step": 594414, "epoch": 7161} {"train_loss": -28.184675216674805, "global_step": 594415, "epoch": 7161} {"train_loss": -28.095874786376953, "global_step": 594416, "epoch": 7161} {"train_loss": -28.01373291015625, "global_step": 594417, "epoch": 7161} {"train_loss": -28.416181564331055, "global_step": 594418, "epoch": 7161} {"train_loss": -27.97859764099121, "global_step": 594419, "epoch": 7161} {"train_loss": -28.204877853393555, "global_step": 594420, "epoch": 7161} {"train_loss": -28.078641891479492, "global_step": 594421, "epoch": 7161} {"train_loss": -28.06011962890625, "global_step": 594422, "epoch": 7161} {"train_loss": -28.059131622314453, "global_step": 594423, "epoch": 7161} {"train_loss": -28.398761749267578, "global_step": 594424, "epoch": 7161} {"train_loss": -27.992589950561523, "global_step": 594425, "epoch": 7161} {"train_loss": -28.352094650268555, "global_step": 594426, "epoch": 7161} {"train_loss": -28.31182861328125, "global_step": 594427, "epoch": 7161} {"train_loss": -28.361215591430664, "global_step": 594428, "epoch": 7161} {"train_loss": -28.043256759643555, "global_step": 594429, "epoch": 7161} {"train_loss": -28.20657730102539, "global_step": 594430, "epoch": 7161} {"train_loss": -28.17561912536621, "global_step": 594431, "epoch": 7161} {"train_loss": -28.236021041870117, "global_step": 594432, "epoch": 7161} {"train_loss": -28.31794548034668, "global_step": 594433, "epoch": 7161} {"train_loss": -28.214649200439453, "global_step": 594434, "epoch": 7161} {"train_loss": -27.566919326782227, "global_step": 594435, "epoch": 7161} {"train_loss": -28.29266929626465, "global_step": 594436, "epoch": 7161} {"train_loss": -28.41033363342285, "global_step": 594437, "epoch": 7161} {"train_loss": -27.886127471923828, "global_step": 594438, "epoch": 7161} {"train_loss": -28.252532958984375, "global_step": 594439, "epoch": 7161} {"train_loss": -28.05745506286621, "global_step": 594440, "epoch": 7161} {"train_loss": -27.619531631469727, "global_step": 594441, "epoch": 7161} {"train_loss": -27.98475456237793, "global_step": 594442, "epoch": 7161} {"train_loss": -27.838287353515625, "global_step": 594443, "epoch": 7161} {"train_loss": -28.112430572509766, "global_step": 594444, "epoch": 7161} {"train_loss": -27.67136718566159, "global_step": 594445, "epoch": 7161, "val_loss": 6563313.0} {"train_loss": -25.03839683532715, "global_step": 594446, "epoch": 7162} {"train_loss": -20.113676071166992, "global_step": 594447, "epoch": 7162} {"train_loss": -22.1776065826416, "global_step": 594448, "epoch": 7162} {"train_loss": -24.853708267211914, "global_step": 594449, "epoch": 7162} {"train_loss": -24.526580810546875, "global_step": 594450, "epoch": 7162} {"train_loss": -25.071401596069336, "global_step": 594451, "epoch": 7162} {"train_loss": -26.25126075744629, "global_step": 594452, "epoch": 7162} {"train_loss": -24.0884952545166, "global_step": 594453, "epoch": 7162} {"train_loss": -25.5404109954834, "global_step": 594454, "epoch": 7162} {"train_loss": -26.19007682800293, "global_step": 594455, "epoch": 7162} {"train_loss": -24.909433364868164, "global_step": 594456, "epoch": 7162} {"train_loss": -26.50788688659668, "global_step": 594457, "epoch": 7162} {"train_loss": -26.49909782409668, "global_step": 594458, "epoch": 7162} {"train_loss": -26.205747604370117, "global_step": 594459, "epoch": 7162} {"train_loss": -26.344741821289062, "global_step": 594460, "epoch": 7162} {"train_loss": -26.243518829345703, "global_step": 594461, "epoch": 7162} {"train_loss": -26.526031494140625, "global_step": 594462, "epoch": 7162} {"train_loss": -26.92095947265625, "global_step": 594463, "epoch": 7162} {"train_loss": -26.24030876159668, "global_step": 594464, "epoch": 7162} {"train_loss": -26.781400680541992, "global_step": 594465, "epoch": 7162} {"train_loss": -26.994260787963867, "global_step": 594466, "epoch": 7162} {"train_loss": -26.7857666015625, "global_step": 594467, "epoch": 7162} {"train_loss": -26.906057357788086, "global_step": 594468, "epoch": 7162} {"train_loss": -27.00908851623535, "global_step": 594469, "epoch": 7162} {"train_loss": -27.253009796142578, "global_step": 594470, "epoch": 7162} {"train_loss": -27.140380859375, "global_step": 594471, "epoch": 7162} {"train_loss": -26.927000045776367, "global_step": 594472, "epoch": 7162} {"train_loss": -26.775487899780273, "global_step": 594473, "epoch": 7162} {"train_loss": -26.844160079956055, "global_step": 594474, "epoch": 7162} {"train_loss": -27.486379623413086, "global_step": 594475, "epoch": 7162} {"train_loss": -27.17268180847168, "global_step": 594476, "epoch": 7162} {"train_loss": -27.1356201171875, "global_step": 594477, "epoch": 7162} {"train_loss": -27.408451080322266, "global_step": 594478, "epoch": 7162} {"train_loss": -27.460851669311523, "global_step": 594479, "epoch": 7162} {"train_loss": -27.021270751953125, "global_step": 594480, "epoch": 7162} {"train_loss": -27.2552490234375, "global_step": 594481, "epoch": 7162} {"train_loss": -27.40155029296875, "global_step": 594482, "epoch": 7162} {"train_loss": -27.474578857421875, "global_step": 594483, "epoch": 7162} {"train_loss": -27.013097763061523, "global_step": 594484, "epoch": 7162} {"train_loss": -27.5172176361084, "global_step": 594485, "epoch": 7162} {"train_loss": -27.195728302001953, "global_step": 594486, "epoch": 7162} {"train_loss": -27.623376846313477, "global_step": 594487, "epoch": 7162} {"train_loss": -27.58619499206543, "global_step": 594488, "epoch": 7162} {"train_loss": -27.574268341064453, "global_step": 594489, "epoch": 7162} {"train_loss": -27.71320152282715, "global_step": 594490, "epoch": 7162} {"train_loss": -27.4847412109375, "global_step": 594491, "epoch": 7162} {"train_loss": -27.67644691467285, "global_step": 594492, "epoch": 7162} {"train_loss": -27.70183753967285, "global_step": 594493, "epoch": 7162} {"train_loss": -27.633726119995117, "global_step": 594494, "epoch": 7162} {"train_loss": -28.03291130065918, "global_step": 594495, "epoch": 7162} {"train_loss": -27.89373779296875, "global_step": 594496, "epoch": 7162} {"train_loss": -27.81268882751465, "global_step": 594497, "epoch": 7162} {"train_loss": -27.56159782409668, "global_step": 594498, "epoch": 7162} {"train_loss": -27.86073112487793, "global_step": 594499, "epoch": 7162} {"train_loss": -27.863759994506836, "global_step": 594500, "epoch": 7162} {"train_loss": -27.853872299194336, "global_step": 594501, "epoch": 7162} {"train_loss": -27.6795711517334, "global_step": 594502, "epoch": 7162} {"train_loss": -28.00324821472168, "global_step": 594503, "epoch": 7162} {"train_loss": -27.682880401611328, "global_step": 594504, "epoch": 7162} {"train_loss": -27.96176528930664, "global_step": 594505, "epoch": 7162} {"train_loss": -27.986730575561523, "global_step": 594506, "epoch": 7162} {"train_loss": -28.327865600585938, "global_step": 594507, "epoch": 7162} {"train_loss": -28.156808853149414, "global_step": 594508, "epoch": 7162} {"train_loss": -27.759668350219727, "global_step": 594509, "epoch": 7162} {"train_loss": -28.080646514892578, "global_step": 594510, "epoch": 7162} {"train_loss": -28.12943458557129, "global_step": 594511, "epoch": 7162} {"train_loss": -28.1511287689209, "global_step": 594512, "epoch": 7162} {"train_loss": -28.46242332458496, "global_step": 594513, "epoch": 7162} {"train_loss": -27.8627986907959, "global_step": 594514, "epoch": 7162} {"train_loss": -27.91379165649414, "global_step": 594515, "epoch": 7162} {"train_loss": -28.149524688720703, "global_step": 594516, "epoch": 7162} {"train_loss": -28.171966552734375, "global_step": 594517, "epoch": 7162} {"train_loss": -27.916772842407227, "global_step": 594518, "epoch": 7162} {"train_loss": -28.22784423828125, "global_step": 594519, "epoch": 7162} {"train_loss": -27.683557510375977, "global_step": 594520, "epoch": 7162} {"train_loss": -27.90007972717285, "global_step": 594521, "epoch": 7162} {"train_loss": -28.119665145874023, "global_step": 594522, "epoch": 7162} {"train_loss": -28.00127601623535, "global_step": 594523, "epoch": 7162} {"train_loss": -27.926959991455078, "global_step": 594524, "epoch": 7162} {"train_loss": -28.03409194946289, "global_step": 594525, "epoch": 7162} {"train_loss": -27.92010498046875, "global_step": 594526, "epoch": 7162} {"train_loss": -28.338794708251953, "global_step": 594527, "epoch": 7162} {"train_loss": -27.09486044458596, "global_step": 594528, "epoch": 7162, "val_loss": 6509245.0} {"train_loss": -27.18060302734375, "global_step": 594529, "epoch": 7163} {"train_loss": -27.220861434936523, "global_step": 594530, "epoch": 7163} {"train_loss": -27.734094619750977, "global_step": 594531, "epoch": 7163} {"train_loss": -27.394824981689453, "global_step": 594532, "epoch": 7163} {"train_loss": -27.226974487304688, "global_step": 594533, "epoch": 7163} {"train_loss": -27.615503311157227, "global_step": 594534, "epoch": 7163} {"train_loss": -27.2537784576416, "global_step": 594535, "epoch": 7163} {"train_loss": -27.021717071533203, "global_step": 594536, "epoch": 7163} {"train_loss": -27.58814811706543, "global_step": 594537, "epoch": 7163} {"train_loss": -27.310937881469727, "global_step": 594538, "epoch": 7163} {"train_loss": -27.40863609313965, "global_step": 594539, "epoch": 7163} {"train_loss": -27.5211181640625, "global_step": 594540, "epoch": 7163} {"train_loss": -27.687597274780273, "global_step": 594541, "epoch": 7163} {"train_loss": -27.483417510986328, "global_step": 594542, "epoch": 7163} {"train_loss": -27.9743595123291, "global_step": 594543, "epoch": 7163} {"train_loss": -27.414831161499023, "global_step": 594544, "epoch": 7163} {"train_loss": -27.67096519470215, "global_step": 594545, "epoch": 7163} {"train_loss": -27.28822135925293, "global_step": 594546, "epoch": 7163} {"train_loss": -27.944578170776367, "global_step": 594547, "epoch": 7163} {"train_loss": -27.424453735351562, "global_step": 594548, "epoch": 7163} {"train_loss": -28.009794235229492, "global_step": 594549, "epoch": 7163} {"train_loss": -27.738000869750977, "global_step": 594550, "epoch": 7163} {"train_loss": -27.7254695892334, "global_step": 594551, "epoch": 7163} {"train_loss": -27.683164596557617, "global_step": 594552, "epoch": 7163} {"train_loss": -27.590381622314453, "global_step": 594553, "epoch": 7163} {"train_loss": -27.96404457092285, "global_step": 594554, "epoch": 7163} {"train_loss": -27.864673614501953, "global_step": 594555, "epoch": 7163} {"train_loss": -27.7176456451416, "global_step": 594556, "epoch": 7163} {"train_loss": -27.909460067749023, "global_step": 594557, "epoch": 7163} {"train_loss": -27.72098731994629, "global_step": 594558, "epoch": 7163} {"train_loss": -27.909799575805664, "global_step": 594559, "epoch": 7163} {"train_loss": -27.48792839050293, "global_step": 594560, "epoch": 7163} {"train_loss": -28.088703155517578, "global_step": 594561, "epoch": 7163} {"train_loss": -27.627614974975586, "global_step": 594562, "epoch": 7163} {"train_loss": -28.501667022705078, "global_step": 594563, "epoch": 7163} {"train_loss": -28.204076766967773, "global_step": 594564, "epoch": 7163} {"train_loss": -28.016260147094727, "global_step": 594565, "epoch": 7163} {"train_loss": -27.907760620117188, "global_step": 594566, "epoch": 7163} {"train_loss": -28.247079849243164, "global_step": 594567, "epoch": 7163} {"train_loss": -28.045841217041016, "global_step": 594568, "epoch": 7163} {"train_loss": -28.191801071166992, "global_step": 594569, "epoch": 7163} {"train_loss": -27.702285766601562, "global_step": 594570, "epoch": 7163} {"train_loss": -27.85556983947754, "global_step": 594571, "epoch": 7163} {"train_loss": -28.151609420776367, "global_step": 594572, "epoch": 7163} {"train_loss": -28.201873779296875, "global_step": 594573, "epoch": 7163} {"train_loss": -28.09549331665039, "global_step": 594574, "epoch": 7163} {"train_loss": -28.472562789916992, "global_step": 594575, "epoch": 7163} {"train_loss": -28.065906524658203, "global_step": 594576, "epoch": 7163} {"train_loss": -28.0395450592041, "global_step": 594577, "epoch": 7163} {"train_loss": -27.949682235717773, "global_step": 594578, "epoch": 7163} {"train_loss": -27.93610954284668, "global_step": 594579, "epoch": 7163} {"train_loss": -28.16353416442871, "global_step": 594580, "epoch": 7163} {"train_loss": -28.288007736206055, "global_step": 594581, "epoch": 7163} {"train_loss": -28.185291290283203, "global_step": 594582, "epoch": 7163} {"train_loss": -28.408233642578125, "global_step": 594583, "epoch": 7163} {"train_loss": -28.43804359436035, "global_step": 594584, "epoch": 7163} {"train_loss": -28.3228759765625, "global_step": 594585, "epoch": 7163} {"train_loss": -28.1798038482666, "global_step": 594586, "epoch": 7163} {"train_loss": -28.293615341186523, "global_step": 594587, "epoch": 7163} {"train_loss": -28.235986709594727, "global_step": 594588, "epoch": 7163} {"train_loss": -27.854633331298828, "global_step": 594589, "epoch": 7163} {"train_loss": -27.81243324279785, "global_step": 594590, "epoch": 7163} {"train_loss": -28.251401901245117, "global_step": 594591, "epoch": 7163} {"train_loss": -28.356748580932617, "global_step": 594592, "epoch": 7163} {"train_loss": -28.20615577697754, "global_step": 594593, "epoch": 7163} {"train_loss": -28.04448890686035, "global_step": 594594, "epoch": 7163} {"train_loss": -28.057788848876953, "global_step": 594595, "epoch": 7163} {"train_loss": -28.0596981048584, "global_step": 594596, "epoch": 7163} {"train_loss": -27.378881454467773, "global_step": 594597, "epoch": 7163} {"train_loss": -27.41983413696289, "global_step": 594598, "epoch": 7163} {"train_loss": -27.588092803955078, "global_step": 594599, "epoch": 7163} {"train_loss": -28.252029418945312, "global_step": 594600, "epoch": 7163} {"train_loss": -27.847919464111328, "global_step": 594601, "epoch": 7163} {"train_loss": -27.522785186767578, "global_step": 594602, "epoch": 7163} {"train_loss": -27.620573043823242, "global_step": 594603, "epoch": 7163} {"train_loss": -28.010831832885742, "global_step": 594604, "epoch": 7163} {"train_loss": -27.979238510131836, "global_step": 594605, "epoch": 7163} {"train_loss": -28.008398056030273, "global_step": 594606, "epoch": 7163} {"train_loss": -28.356109619140625, "global_step": 594607, "epoch": 7163} {"train_loss": -28.361120223999023, "global_step": 594608, "epoch": 7163} {"train_loss": -28.229068756103516, "global_step": 594609, "epoch": 7163} {"train_loss": -27.99541664123535, "global_step": 594610, "epoch": 7163} {"train_loss": -27.86937948020108, "global_step": 594611, "epoch": 7163, "val_loss": 6630948.5} {"train_loss": -26.92905044555664, "global_step": 594612, "epoch": 7164} {"train_loss": -27.008955001831055, "global_step": 594613, "epoch": 7164} {"train_loss": -27.434125900268555, "global_step": 594614, "epoch": 7164} {"train_loss": -27.049646377563477, "global_step": 594615, "epoch": 7164} {"train_loss": -27.08308219909668, "global_step": 594616, "epoch": 7164} {"train_loss": -27.481908798217773, "global_step": 594617, "epoch": 7164} {"train_loss": -27.119415283203125, "global_step": 594618, "epoch": 7164} {"train_loss": -27.298181533813477, "global_step": 594619, "epoch": 7164} {"train_loss": -26.893156051635742, "global_step": 594620, "epoch": 7164} {"train_loss": -27.4876651763916, "global_step": 594621, "epoch": 7164} {"train_loss": -27.20436668395996, "global_step": 594622, "epoch": 7164} {"train_loss": -27.6104679107666, "global_step": 594623, "epoch": 7164} {"train_loss": -27.297903060913086, "global_step": 594624, "epoch": 7164} {"train_loss": -27.640226364135742, "global_step": 594625, "epoch": 7164} {"train_loss": -27.449298858642578, "global_step": 594626, "epoch": 7164} {"train_loss": -27.45667839050293, "global_step": 594627, "epoch": 7164} {"train_loss": -27.906513214111328, "global_step": 594628, "epoch": 7164} {"train_loss": -27.8204288482666, "global_step": 594629, "epoch": 7164} {"train_loss": -27.606687545776367, "global_step": 594630, "epoch": 7164} {"train_loss": -28.076919555664062, "global_step": 594631, "epoch": 7164} {"train_loss": -27.6572208404541, "global_step": 594632, "epoch": 7164} {"train_loss": -27.725982666015625, "global_step": 594633, "epoch": 7164} {"train_loss": -27.77326774597168, "global_step": 594634, "epoch": 7164} {"train_loss": -27.568517684936523, "global_step": 594635, "epoch": 7164} {"train_loss": -27.837366104125977, "global_step": 594636, "epoch": 7164} {"train_loss": -27.772113800048828, "global_step": 594637, "epoch": 7164} {"train_loss": -27.980737686157227, "global_step": 594638, "epoch": 7164} {"train_loss": -27.9189510345459, "global_step": 594639, "epoch": 7164} {"train_loss": -28.220458984375, "global_step": 594640, "epoch": 7164} {"train_loss": -28.14890480041504, "global_step": 594641, "epoch": 7164} {"train_loss": -27.9437255859375, "global_step": 594642, "epoch": 7164} {"train_loss": -28.104700088500977, "global_step": 594643, "epoch": 7164} {"train_loss": -27.995956420898438, "global_step": 594644, "epoch": 7164} {"train_loss": -28.0025691986084, "global_step": 594645, "epoch": 7164} {"train_loss": -28.07663345336914, "global_step": 594646, "epoch": 7164} {"train_loss": -28.097959518432617, "global_step": 594647, "epoch": 7164} {"train_loss": -28.394241333007812, "global_step": 594648, "epoch": 7164} {"train_loss": -28.279727935791016, "global_step": 594649, "epoch": 7164} {"train_loss": -28.323776245117188, "global_step": 594650, "epoch": 7164} {"train_loss": -28.339141845703125, "global_step": 594651, "epoch": 7164} {"train_loss": -28.35772132873535, "global_step": 594652, "epoch": 7164} {"train_loss": -28.158193588256836, "global_step": 594653, "epoch": 7164} {"train_loss": -28.154590606689453, "global_step": 594654, "epoch": 7164} {"train_loss": -27.85341453552246, "global_step": 594655, "epoch": 7164} {"train_loss": -28.281198501586914, "global_step": 594656, "epoch": 7164} {"train_loss": -28.289525985717773, "global_step": 594657, "epoch": 7164} {"train_loss": -28.24800682067871, "global_step": 594658, "epoch": 7164} {"train_loss": -28.012250900268555, "global_step": 594659, "epoch": 7164} {"train_loss": -28.2474422454834, "global_step": 594660, "epoch": 7164} {"train_loss": -28.14703941345215, "global_step": 594661, "epoch": 7164} {"train_loss": -27.921823501586914, "global_step": 594662, "epoch": 7164} {"train_loss": -27.95013427734375, "global_step": 594663, "epoch": 7164} {"train_loss": -27.954578399658203, "global_step": 594664, "epoch": 7164} {"train_loss": -27.44480323791504, "global_step": 594665, "epoch": 7164} {"train_loss": -27.675979614257812, "global_step": 594666, "epoch": 7164} {"train_loss": -27.710697174072266, "global_step": 594667, "epoch": 7164} {"train_loss": -27.96247673034668, "global_step": 594668, "epoch": 7164} {"train_loss": -27.877960205078125, "global_step": 594669, "epoch": 7164} {"train_loss": -27.71095848083496, "global_step": 594670, "epoch": 7164} {"train_loss": -27.88446617126465, "global_step": 594671, "epoch": 7164} {"train_loss": -27.85096549987793, "global_step": 594672, "epoch": 7164} {"train_loss": -28.02507972717285, "global_step": 594673, "epoch": 7164} {"train_loss": -28.581396102905273, "global_step": 594674, "epoch": 7164} {"train_loss": -27.741931915283203, "global_step": 594675, "epoch": 7164} {"train_loss": -27.963642120361328, "global_step": 594676, "epoch": 7164} {"train_loss": -28.375226974487305, "global_step": 594677, "epoch": 7164} {"train_loss": -28.05240821838379, "global_step": 594678, "epoch": 7164} {"train_loss": -27.844268798828125, "global_step": 594679, "epoch": 7164} {"train_loss": -28.0760555267334, "global_step": 594680, "epoch": 7164} {"train_loss": -27.987524032592773, "global_step": 594681, "epoch": 7164} {"train_loss": -28.125837326049805, "global_step": 594682, "epoch": 7164} {"train_loss": -27.882211685180664, "global_step": 594683, "epoch": 7164} {"train_loss": -28.21036720275879, "global_step": 594684, "epoch": 7164} {"train_loss": -27.931293487548828, "global_step": 594685, "epoch": 7164} {"train_loss": -27.731672286987305, "global_step": 594686, "epoch": 7164} {"train_loss": -27.763891220092773, "global_step": 594687, "epoch": 7164} {"train_loss": -27.975311279296875, "global_step": 594688, "epoch": 7164} {"train_loss": -27.965808868408203, "global_step": 594689, "epoch": 7164} {"train_loss": -27.822097778320312, "global_step": 594690, "epoch": 7164} {"train_loss": -27.70123863220215, "global_step": 594691, "epoch": 7164} {"train_loss": -27.877765655517578, "global_step": 594692, "epoch": 7164} {"train_loss": -27.700977325439453, "global_step": 594693, "epoch": 7164} {"train_loss": -27.84096892483263, "global_step": 594694, "epoch": 7164, "val_loss": 6566200.0} {"train_loss": -27.136877059936523, "global_step": 594695, "epoch": 7165} {"train_loss": -27.324934005737305, "global_step": 594696, "epoch": 7165} {"train_loss": -27.296878814697266, "global_step": 594697, "epoch": 7165} {"train_loss": -26.38349723815918, "global_step": 594698, "epoch": 7165} {"train_loss": -26.185758590698242, "global_step": 594699, "epoch": 7165} {"train_loss": -26.942365646362305, "global_step": 594700, "epoch": 7165} {"train_loss": -27.29437828063965, "global_step": 594701, "epoch": 7165} {"train_loss": -27.0668888092041, "global_step": 594702, "epoch": 7165} {"train_loss": -27.2005672454834, "global_step": 594703, "epoch": 7165} {"train_loss": -27.20477867126465, "global_step": 594704, "epoch": 7165} {"train_loss": -27.295454025268555, "global_step": 594705, "epoch": 7165} {"train_loss": -27.389631271362305, "global_step": 594706, "epoch": 7165} {"train_loss": -27.167505264282227, "global_step": 594707, "epoch": 7165} {"train_loss": -27.185993194580078, "global_step": 594708, "epoch": 7165} {"train_loss": -27.2567138671875, "global_step": 594709, "epoch": 7165} {"train_loss": -27.953460693359375, "global_step": 594710, "epoch": 7165} {"train_loss": -27.383270263671875, "global_step": 594711, "epoch": 7165} {"train_loss": -27.756275177001953, "global_step": 594712, "epoch": 7165} {"train_loss": -27.688064575195312, "global_step": 594713, "epoch": 7165} {"train_loss": -28.0125675201416, "global_step": 594714, "epoch": 7165} {"train_loss": -27.4045467376709, "global_step": 594715, "epoch": 7165} {"train_loss": -27.920246124267578, "global_step": 594716, "epoch": 7165} {"train_loss": -28.0091495513916, "global_step": 594717, "epoch": 7165} {"train_loss": -27.4766845703125, "global_step": 594718, "epoch": 7165} {"train_loss": -27.292709350585938, "global_step": 594719, "epoch": 7165} {"train_loss": -27.501617431640625, "global_step": 594720, "epoch": 7165} {"train_loss": -27.792510986328125, "global_step": 594721, "epoch": 7165} {"train_loss": -27.940597534179688, "global_step": 594722, "epoch": 7165} {"train_loss": -27.763273239135742, "global_step": 594723, "epoch": 7165} {"train_loss": -27.933658599853516, "global_step": 594724, "epoch": 7165} {"train_loss": -28.1236629486084, "global_step": 594725, "epoch": 7165} {"train_loss": -28.064163208007812, "global_step": 594726, "epoch": 7165} {"train_loss": -27.560073852539062, "global_step": 594727, "epoch": 7165} {"train_loss": -27.70478630065918, "global_step": 594728, "epoch": 7165} {"train_loss": -28.27923011779785, "global_step": 594729, "epoch": 7165} {"train_loss": -28.043394088745117, "global_step": 594730, "epoch": 7165} {"train_loss": -28.226743698120117, "global_step": 594731, "epoch": 7165} {"train_loss": -28.04789161682129, "global_step": 594732, "epoch": 7165} {"train_loss": -28.175512313842773, "global_step": 594733, "epoch": 7165} {"train_loss": -28.14652442932129, "global_step": 594734, "epoch": 7165} {"train_loss": -28.320556640625, "global_step": 594735, "epoch": 7165} {"train_loss": -27.9304256439209, "global_step": 594736, "epoch": 7165} {"train_loss": -28.23105812072754, "global_step": 594737, "epoch": 7165} {"train_loss": -27.974933624267578, "global_step": 594738, "epoch": 7165} {"train_loss": -28.299280166625977, "global_step": 594739, "epoch": 7165} {"train_loss": -27.996923446655273, "global_step": 594740, "epoch": 7165} {"train_loss": -28.20246696472168, "global_step": 594741, "epoch": 7165} {"train_loss": -28.36423110961914, "global_step": 594742, "epoch": 7165} {"train_loss": -28.518096923828125, "global_step": 594743, "epoch": 7165} {"train_loss": -28.59340476989746, "global_step": 594744, "epoch": 7165} {"train_loss": -28.3424072265625, "global_step": 594745, "epoch": 7165} {"train_loss": -27.979116439819336, "global_step": 594746, "epoch": 7165} {"train_loss": -27.989093780517578, "global_step": 594747, "epoch": 7165} {"train_loss": -28.785619735717773, "global_step": 594748, "epoch": 7165} {"train_loss": -28.486480712890625, "global_step": 594749, "epoch": 7165} {"train_loss": -27.909067153930664, "global_step": 594750, "epoch": 7165} {"train_loss": -28.436294555664062, "global_step": 594751, "epoch": 7165} {"train_loss": -28.403730392456055, "global_step": 594752, "epoch": 7165} {"train_loss": -28.00861930847168, "global_step": 594753, "epoch": 7165} {"train_loss": -28.17695426940918, "global_step": 594754, "epoch": 7165} {"train_loss": -28.085763931274414, "global_step": 594755, "epoch": 7165} {"train_loss": -28.383193969726562, "global_step": 594756, "epoch": 7165} {"train_loss": -28.232685089111328, "global_step": 594757, "epoch": 7165} {"train_loss": -28.058740615844727, "global_step": 594758, "epoch": 7165} {"train_loss": -27.954145431518555, "global_step": 594759, "epoch": 7165} {"train_loss": -28.119749069213867, "global_step": 594760, "epoch": 7165} {"train_loss": -28.04425621032715, "global_step": 594761, "epoch": 7165} {"train_loss": -27.98528480529785, "global_step": 594762, "epoch": 7165} {"train_loss": -28.534942626953125, "global_step": 594763, "epoch": 7165} {"train_loss": -28.143234252929688, "global_step": 594764, "epoch": 7165} {"train_loss": -28.294635772705078, "global_step": 594765, "epoch": 7165} {"train_loss": -28.233671188354492, "global_step": 594766, "epoch": 7165} {"train_loss": -28.276935577392578, "global_step": 594767, "epoch": 7165} {"train_loss": -28.057464599609375, "global_step": 594768, "epoch": 7165} {"train_loss": -28.110746383666992, "global_step": 594769, "epoch": 7165} {"train_loss": -27.6666259765625, "global_step": 594770, "epoch": 7165} {"train_loss": -27.279645919799805, "global_step": 594771, "epoch": 7165} {"train_loss": -27.396793365478516, "global_step": 594772, "epoch": 7165} {"train_loss": -27.3497371673584, "global_step": 594773, "epoch": 7165} {"train_loss": -26.920581817626953, "global_step": 594774, "epoch": 7165} {"train_loss": -27.735776901245117, "global_step": 594775, "epoch": 7165} {"train_loss": -27.120269775390625, "global_step": 594776, "epoch": 7165} {"train_loss": -27.833374414099268, "global_step": 594777, "epoch": 7165, "val_loss": 6581244.0} {"train_loss": -24.86484146118164, "global_step": 594778, "epoch": 7166} {"train_loss": -21.979230880737305, "global_step": 594779, "epoch": 7166} {"train_loss": -26.028289794921875, "global_step": 594780, "epoch": 7166} {"train_loss": -25.114110946655273, "global_step": 594781, "epoch": 7166} {"train_loss": -25.477006912231445, "global_step": 594782, "epoch": 7166} {"train_loss": -27.05263328552246, "global_step": 594783, "epoch": 7166} {"train_loss": -24.82987403869629, "global_step": 594784, "epoch": 7166} {"train_loss": -26.19683837890625, "global_step": 594785, "epoch": 7166} {"train_loss": -26.893386840820312, "global_step": 594786, "epoch": 7166} {"train_loss": -26.521894454956055, "global_step": 594787, "epoch": 7166} {"train_loss": -26.47112464904785, "global_step": 594788, "epoch": 7166} {"train_loss": -27.025684356689453, "global_step": 594789, "epoch": 7166} {"train_loss": -26.809473037719727, "global_step": 594790, "epoch": 7166} {"train_loss": -26.699262619018555, "global_step": 594791, "epoch": 7166} {"train_loss": -26.654373168945312, "global_step": 594792, "epoch": 7166} {"train_loss": -26.97784996032715, "global_step": 594793, "epoch": 7166} {"train_loss": -27.20029067993164, "global_step": 594794, "epoch": 7166} {"train_loss": -27.3525390625, "global_step": 594795, "epoch": 7166} {"train_loss": -27.279815673828125, "global_step": 594796, "epoch": 7166} {"train_loss": -27.1240291595459, "global_step": 594797, "epoch": 7166} {"train_loss": -27.0794677734375, "global_step": 594798, "epoch": 7166} {"train_loss": -27.266799926757812, "global_step": 594799, "epoch": 7166} {"train_loss": -27.41965675354004, "global_step": 594800, "epoch": 7166} {"train_loss": -27.381067276000977, "global_step": 594801, "epoch": 7166} {"train_loss": -27.24309730529785, "global_step": 594802, "epoch": 7166} {"train_loss": -27.3173885345459, "global_step": 594803, "epoch": 7166} {"train_loss": -27.419233322143555, "global_step": 594804, "epoch": 7166} {"train_loss": -26.7165584564209, "global_step": 594805, "epoch": 7166} {"train_loss": -27.30006217956543, "global_step": 594806, "epoch": 7166} {"train_loss": -27.615659713745117, "global_step": 594807, "epoch": 7166} {"train_loss": -27.3969669342041, "global_step": 594808, "epoch": 7166} {"train_loss": -27.7774715423584, "global_step": 594809, "epoch": 7166} {"train_loss": -27.6568546295166, "global_step": 594810, "epoch": 7166} {"train_loss": -27.7578125, "global_step": 594811, "epoch": 7166} {"train_loss": -27.362878799438477, "global_step": 594812, "epoch": 7166} {"train_loss": -27.938703536987305, "global_step": 594813, "epoch": 7166} {"train_loss": -27.623517990112305, "global_step": 594814, "epoch": 7166} {"train_loss": -27.61115074157715, "global_step": 594815, "epoch": 7166} {"train_loss": -27.879560470581055, "global_step": 594816, "epoch": 7166} {"train_loss": -27.952306747436523, "global_step": 594817, "epoch": 7166} {"train_loss": -27.698205947875977, "global_step": 594818, "epoch": 7166} {"train_loss": -27.998584747314453, "global_step": 594819, "epoch": 7166} {"train_loss": -27.88655662536621, "global_step": 594820, "epoch": 7166} {"train_loss": -27.768421173095703, "global_step": 594821, "epoch": 7166} {"train_loss": -27.9515438079834, "global_step": 594822, "epoch": 7166} {"train_loss": -27.60530662536621, "global_step": 594823, "epoch": 7166} {"train_loss": -27.819171905517578, "global_step": 594824, "epoch": 7166} {"train_loss": -27.989599227905273, "global_step": 594825, "epoch": 7166} {"train_loss": -27.852392196655273, "global_step": 594826, "epoch": 7166} {"train_loss": -27.848388671875, "global_step": 594827, "epoch": 7166} {"train_loss": -27.73044776916504, "global_step": 594828, "epoch": 7166} {"train_loss": -28.141326904296875, "global_step": 594829, "epoch": 7166} {"train_loss": -27.80816078186035, "global_step": 594830, "epoch": 7166} {"train_loss": -27.462491989135742, "global_step": 594831, "epoch": 7166} {"train_loss": -27.388843536376953, "global_step": 594832, "epoch": 7166} {"train_loss": -27.386615753173828, "global_step": 594833, "epoch": 7166} {"train_loss": -27.542102813720703, "global_step": 594834, "epoch": 7166} {"train_loss": -27.4395751953125, "global_step": 594835, "epoch": 7166} {"train_loss": -27.54786491394043, "global_step": 594836, "epoch": 7166} {"train_loss": -27.137537002563477, "global_step": 594837, "epoch": 7166} {"train_loss": -27.794677734375, "global_step": 594838, "epoch": 7166} {"train_loss": -27.559911727905273, "global_step": 594839, "epoch": 7166} {"train_loss": -27.724218368530273, "global_step": 594840, "epoch": 7166} {"train_loss": -27.95533561706543, "global_step": 594841, "epoch": 7166} {"train_loss": -27.984851837158203, "global_step": 594842, "epoch": 7166} {"train_loss": -28.023303985595703, "global_step": 594843, "epoch": 7166} {"train_loss": -27.346485137939453, "global_step": 594844, "epoch": 7166} {"train_loss": -27.5881290435791, "global_step": 594845, "epoch": 7166} {"train_loss": -27.8902587890625, "global_step": 594846, "epoch": 7166} {"train_loss": -27.777881622314453, "global_step": 594847, "epoch": 7166} {"train_loss": -27.850080490112305, "global_step": 594848, "epoch": 7166} {"train_loss": -27.699859619140625, "global_step": 594849, "epoch": 7166} {"train_loss": -27.911279678344727, "global_step": 594850, "epoch": 7166} {"train_loss": -27.905405044555664, "global_step": 594851, "epoch": 7166} {"train_loss": -27.91932487487793, "global_step": 594852, "epoch": 7166} {"train_loss": -28.4046630859375, "global_step": 594853, "epoch": 7166} {"train_loss": -28.223840713500977, "global_step": 594854, "epoch": 7166} {"train_loss": -27.732141494750977, "global_step": 594855, "epoch": 7166} {"train_loss": -27.982736587524414, "global_step": 594856, "epoch": 7166} {"train_loss": -28.164411544799805, "global_step": 594857, "epoch": 7166} {"train_loss": -27.98491859436035, "global_step": 594858, "epoch": 7166} {"train_loss": -27.972333908081055, "global_step": 594859, "epoch": 7166} {"train_loss": -27.34683091956449, "global_step": 594860, "epoch": 7166, "val_loss": 6654094.0} {"train_loss": -28.14639663696289, "global_step": 594861, "epoch": 7167} {"train_loss": -27.605228424072266, "global_step": 594862, "epoch": 7167} {"train_loss": -26.975011825561523, "global_step": 594863, "epoch": 7167} {"train_loss": -27.178598403930664, "global_step": 594864, "epoch": 7167} {"train_loss": -27.562759399414062, "global_step": 594865, "epoch": 7167} {"train_loss": -27.227493286132812, "global_step": 594866, "epoch": 7167} {"train_loss": -28.197589874267578, "global_step": 594867, "epoch": 7167} {"train_loss": -27.556201934814453, "global_step": 594868, "epoch": 7167} {"train_loss": -27.951902389526367, "global_step": 594869, "epoch": 7167} {"train_loss": -27.6474609375, "global_step": 594870, "epoch": 7167} {"train_loss": -28.076223373413086, "global_step": 594871, "epoch": 7167} {"train_loss": -27.685678482055664, "global_step": 594872, "epoch": 7167} {"train_loss": -27.876300811767578, "global_step": 594873, "epoch": 7167} {"train_loss": -27.624042510986328, "global_step": 594874, "epoch": 7167} {"train_loss": -27.617956161499023, "global_step": 594875, "epoch": 7167} {"train_loss": -27.83230972290039, "global_step": 594876, "epoch": 7167} {"train_loss": -27.659948348999023, "global_step": 594877, "epoch": 7167} {"train_loss": -27.814443588256836, "global_step": 594878, "epoch": 7167} {"train_loss": -27.84865379333496, "global_step": 594879, "epoch": 7167} {"train_loss": -27.766103744506836, "global_step": 594880, "epoch": 7167} {"train_loss": -27.908090591430664, "global_step": 594881, "epoch": 7167} {"train_loss": -28.068700790405273, "global_step": 594882, "epoch": 7167} {"train_loss": -27.50860023498535, "global_step": 594883, "epoch": 7167} {"train_loss": -27.899587631225586, "global_step": 594884, "epoch": 7167} {"train_loss": -27.84273338317871, "global_step": 594885, "epoch": 7167} {"train_loss": -28.16094970703125, "global_step": 594886, "epoch": 7167} {"train_loss": -27.46906089782715, "global_step": 594887, "epoch": 7167} {"train_loss": -27.70773696899414, "global_step": 594888, "epoch": 7167} {"train_loss": -27.922460556030273, "global_step": 594889, "epoch": 7167} {"train_loss": -28.0461368560791, "global_step": 594890, "epoch": 7167} {"train_loss": -27.921079635620117, "global_step": 594891, "epoch": 7167} {"train_loss": -27.91072654724121, "global_step": 594892, "epoch": 7167} {"train_loss": -28.092681884765625, "global_step": 594893, "epoch": 7167} {"train_loss": -27.9721622467041, "global_step": 594894, "epoch": 7167} {"train_loss": -27.499780654907227, "global_step": 594895, "epoch": 7167} {"train_loss": -27.581403732299805, "global_step": 594896, "epoch": 7167} {"train_loss": -27.75410270690918, "global_step": 594897, "epoch": 7167} {"train_loss": -27.968896865844727, "global_step": 594898, "epoch": 7167} {"train_loss": -27.796070098876953, "global_step": 594899, "epoch": 7167} {"train_loss": -27.778076171875, "global_step": 594900, "epoch": 7167} {"train_loss": -28.03546714782715, "global_step": 594901, "epoch": 7167} {"train_loss": -27.857471466064453, "global_step": 594902, "epoch": 7167} {"train_loss": -27.812223434448242, "global_step": 594903, "epoch": 7167} {"train_loss": -28.244464874267578, "global_step": 594904, "epoch": 7167} {"train_loss": -27.918195724487305, "global_step": 594905, "epoch": 7167} {"train_loss": -28.276748657226562, "global_step": 594906, "epoch": 7167} {"train_loss": -27.97783851623535, "global_step": 594907, "epoch": 7167} {"train_loss": -28.0014591217041, "global_step": 594908, "epoch": 7167} {"train_loss": -28.180261611938477, "global_step": 594909, "epoch": 7167} {"train_loss": -28.298934936523438, "global_step": 594910, "epoch": 7167} {"train_loss": -28.01569938659668, "global_step": 594911, "epoch": 7167} {"train_loss": -28.075244903564453, "global_step": 594912, "epoch": 7167} {"train_loss": -28.1832332611084, "global_step": 594913, "epoch": 7167} {"train_loss": -28.254199981689453, "global_step": 594914, "epoch": 7167} {"train_loss": -27.88091468811035, "global_step": 594915, "epoch": 7167} {"train_loss": -27.93329429626465, "global_step": 594916, "epoch": 7167} {"train_loss": -28.056180953979492, "global_step": 594917, "epoch": 7167} {"train_loss": -28.30427360534668, "global_step": 594918, "epoch": 7167} {"train_loss": -28.287878036499023, "global_step": 594919, "epoch": 7167} {"train_loss": -28.421384811401367, "global_step": 594920, "epoch": 7167} {"train_loss": -28.385604858398438, "global_step": 594921, "epoch": 7167} {"train_loss": -28.123945236206055, "global_step": 594922, "epoch": 7167} {"train_loss": -28.272863388061523, "global_step": 594923, "epoch": 7167} {"train_loss": -28.2786865234375, "global_step": 594924, "epoch": 7167} {"train_loss": -28.295801162719727, "global_step": 594925, "epoch": 7167} {"train_loss": -28.215728759765625, "global_step": 594926, "epoch": 7167} {"train_loss": -28.1408634185791, "global_step": 594927, "epoch": 7167} {"train_loss": -28.438398361206055, "global_step": 594928, "epoch": 7167} {"train_loss": -28.014678955078125, "global_step": 594929, "epoch": 7167} {"train_loss": -28.006784439086914, "global_step": 594930, "epoch": 7167} {"train_loss": -28.272109985351562, "global_step": 594931, "epoch": 7167} {"train_loss": -28.206090927124023, "global_step": 594932, "epoch": 7167} {"train_loss": -28.09087562561035, "global_step": 594933, "epoch": 7167} {"train_loss": -28.309375762939453, "global_step": 594934, "epoch": 7167} {"train_loss": -28.097898483276367, "global_step": 594935, "epoch": 7167} {"train_loss": -27.9370059967041, "global_step": 594936, "epoch": 7167} {"train_loss": -28.239057540893555, "global_step": 594937, "epoch": 7167} {"train_loss": -27.739734649658203, "global_step": 594938, "epoch": 7167} {"train_loss": -28.386322021484375, "global_step": 594939, "epoch": 7167} {"train_loss": -28.030378341674805, "global_step": 594940, "epoch": 7167} {"train_loss": -28.113086700439453, "global_step": 594941, "epoch": 7167} {"train_loss": -27.75477409362793, "global_step": 594942, "epoch": 7167} {"train_loss": -27.946779963481855, "global_step": 594943, "epoch": 7167, "val_loss": 6668690.5} {"train_loss": -26.242223739624023, "global_step": 594944, "epoch": 7168} {"train_loss": -25.200700759887695, "global_step": 594945, "epoch": 7168} {"train_loss": -26.625852584838867, "global_step": 594946, "epoch": 7168} {"train_loss": -27.376157760620117, "global_step": 594947, "epoch": 7168} {"train_loss": -25.904829025268555, "global_step": 594948, "epoch": 7168} {"train_loss": -25.486896514892578, "global_step": 594949, "epoch": 7168} {"train_loss": -26.725357055664062, "global_step": 594950, "epoch": 7168} {"train_loss": -26.24416160583496, "global_step": 594951, "epoch": 7168} {"train_loss": -26.665754318237305, "global_step": 594952, "epoch": 7168} {"train_loss": -25.99871826171875, "global_step": 594953, "epoch": 7168} {"train_loss": -26.78696632385254, "global_step": 594954, "epoch": 7168} {"train_loss": -26.8439998626709, "global_step": 594955, "epoch": 7168} {"train_loss": -27.134063720703125, "global_step": 594956, "epoch": 7168} {"train_loss": -27.40323257446289, "global_step": 594957, "epoch": 7168} {"train_loss": -27.23004150390625, "global_step": 594958, "epoch": 7168} {"train_loss": -27.4174861907959, "global_step": 594959, "epoch": 7168} {"train_loss": -27.046924591064453, "global_step": 594960, "epoch": 7168} {"train_loss": -27.66434097290039, "global_step": 594961, "epoch": 7168} {"train_loss": -27.19046401977539, "global_step": 594962, "epoch": 7168} {"train_loss": -27.112958908081055, "global_step": 594963, "epoch": 7168} {"train_loss": -27.435327529907227, "global_step": 594964, "epoch": 7168} {"train_loss": -27.265085220336914, "global_step": 594965, "epoch": 7168} {"train_loss": -27.58089256286621, "global_step": 594966, "epoch": 7168} {"train_loss": -26.95694351196289, "global_step": 594967, "epoch": 7168} {"train_loss": -27.926929473876953, "global_step": 594968, "epoch": 7168} {"train_loss": -27.955297470092773, "global_step": 594969, "epoch": 7168} {"train_loss": -27.47962760925293, "global_step": 594970, "epoch": 7168} {"train_loss": -27.325082778930664, "global_step": 594971, "epoch": 7168} {"train_loss": -27.722272872924805, "global_step": 594972, "epoch": 7168} {"train_loss": -27.7451171875, "global_step": 594973, "epoch": 7168} {"train_loss": -27.7818603515625, "global_step": 594974, "epoch": 7168} {"train_loss": -27.894208908081055, "global_step": 594975, "epoch": 7168} {"train_loss": -27.80291748046875, "global_step": 594976, "epoch": 7168} {"train_loss": -28.078155517578125, "global_step": 594977, "epoch": 7168} {"train_loss": -27.873519897460938, "global_step": 594978, "epoch": 7168} {"train_loss": -27.84078025817871, "global_step": 594979, "epoch": 7168} {"train_loss": -28.020185470581055, "global_step": 594980, "epoch": 7168} {"train_loss": -28.060169219970703, "global_step": 594981, "epoch": 7168} {"train_loss": -28.169214248657227, "global_step": 594982, "epoch": 7168} {"train_loss": -27.877105712890625, "global_step": 594983, "epoch": 7168} {"train_loss": -27.952579498291016, "global_step": 594984, "epoch": 7168} {"train_loss": -28.016082763671875, "global_step": 594985, "epoch": 7168} {"train_loss": -28.309497833251953, "global_step": 594986, "epoch": 7168} {"train_loss": -28.172382354736328, "global_step": 594987, "epoch": 7168} {"train_loss": -28.022912979125977, "global_step": 594988, "epoch": 7168} {"train_loss": -27.987314224243164, "global_step": 594989, "epoch": 7168} {"train_loss": -28.179718017578125, "global_step": 594990, "epoch": 7168} {"train_loss": -28.370269775390625, "global_step": 594991, "epoch": 7168} {"train_loss": -27.93588638305664, "global_step": 594992, "epoch": 7168} {"train_loss": -28.317935943603516, "global_step": 594993, "epoch": 7168} {"train_loss": -28.3062744140625, "global_step": 594994, "epoch": 7168} {"train_loss": -28.491058349609375, "global_step": 594995, "epoch": 7168} {"train_loss": -28.127445220947266, "global_step": 594996, "epoch": 7168} {"train_loss": -28.2795467376709, "global_step": 594997, "epoch": 7168} {"train_loss": -28.64420509338379, "global_step": 594998, "epoch": 7168} {"train_loss": -28.39208984375, "global_step": 594999, "epoch": 7168} {"train_loss": -27.8203182220459, "global_step": 595000, "epoch": 7168} {"train_loss": -28.417678833007812, "global_step": 595001, "epoch": 7168} {"train_loss": -28.03079605102539, "global_step": 595002, "epoch": 7168} {"train_loss": -28.200571060180664, "global_step": 595003, "epoch": 7168} {"train_loss": -27.95753288269043, "global_step": 595004, "epoch": 7168} {"train_loss": -28.180273056030273, "global_step": 595005, "epoch": 7168} {"train_loss": -28.709884643554688, "global_step": 595006, "epoch": 7168} {"train_loss": -28.211172103881836, "global_step": 595007, "epoch": 7168} {"train_loss": -28.025531768798828, "global_step": 595008, "epoch": 7168} {"train_loss": -28.372344970703125, "global_step": 595009, "epoch": 7168} {"train_loss": -27.904571533203125, "global_step": 595010, "epoch": 7168} {"train_loss": -28.24481201171875, "global_step": 595011, "epoch": 7168} {"train_loss": -28.1584529876709, "global_step": 595012, "epoch": 7168} {"train_loss": -28.562097549438477, "global_step": 595013, "epoch": 7168} {"train_loss": -28.24945068359375, "global_step": 595014, "epoch": 7168} {"train_loss": -28.356689453125, "global_step": 595015, "epoch": 7168} {"train_loss": -28.36417579650879, "global_step": 595016, "epoch": 7168} {"train_loss": -28.113616943359375, "global_step": 595017, "epoch": 7168} {"train_loss": -27.97027015686035, "global_step": 595018, "epoch": 7168} {"train_loss": -28.01025390625, "global_step": 595019, "epoch": 7168} {"train_loss": -28.127111434936523, "global_step": 595020, "epoch": 7168} {"train_loss": -27.67352867126465, "global_step": 595021, "epoch": 7168} {"train_loss": -28.101959228515625, "global_step": 595022, "epoch": 7168} {"train_loss": -28.28997230529785, "global_step": 595023, "epoch": 7168} {"train_loss": -27.97002601623535, "global_step": 595024, "epoch": 7168} {"train_loss": -28.04779052734375, "global_step": 595025, "epoch": 7168} {"train_loss": -27.720874809357056, "global_step": 595026, "epoch": 7168, "val_loss": 6700996.5} {"train_loss": -27.42085075378418, "global_step": 595027, "epoch": 7169} {"train_loss": -26.645822525024414, "global_step": 595028, "epoch": 7169} {"train_loss": -27.055511474609375, "global_step": 595029, "epoch": 7169} {"train_loss": -27.06232261657715, "global_step": 595030, "epoch": 7169} {"train_loss": -27.089130401611328, "global_step": 595031, "epoch": 7169} {"train_loss": -27.639245986938477, "global_step": 595032, "epoch": 7169} {"train_loss": -27.92400550842285, "global_step": 595033, "epoch": 7169} {"train_loss": -27.295751571655273, "global_step": 595034, "epoch": 7169} {"train_loss": -27.68890953063965, "global_step": 595035, "epoch": 7169} {"train_loss": -27.639053344726562, "global_step": 595036, "epoch": 7169} {"train_loss": -27.37505531311035, "global_step": 595037, "epoch": 7169} {"train_loss": -27.681182861328125, "global_step": 595038, "epoch": 7169} {"train_loss": -27.730066299438477, "global_step": 595039, "epoch": 7169} {"train_loss": -27.575281143188477, "global_step": 595040, "epoch": 7169} {"train_loss": -27.849760055541992, "global_step": 595041, "epoch": 7169} {"train_loss": -27.556333541870117, "global_step": 595042, "epoch": 7169} {"train_loss": -27.869983673095703, "global_step": 595043, "epoch": 7169} {"train_loss": -27.57099723815918, "global_step": 595044, "epoch": 7169} {"train_loss": -27.781705856323242, "global_step": 595045, "epoch": 7169} {"train_loss": -27.570730209350586, "global_step": 595046, "epoch": 7169} {"train_loss": -27.624114990234375, "global_step": 595047, "epoch": 7169} {"train_loss": -27.608535766601562, "global_step": 595048, "epoch": 7169} {"train_loss": -27.5228271484375, "global_step": 595049, "epoch": 7169} {"train_loss": -27.5101318359375, "global_step": 595050, "epoch": 7169} {"train_loss": -27.801603317260742, "global_step": 595051, "epoch": 7169} {"train_loss": -27.41753578186035, "global_step": 595052, "epoch": 7169} {"train_loss": -27.611555099487305, "global_step": 595053, "epoch": 7169} {"train_loss": -27.8687744140625, "global_step": 595054, "epoch": 7169} {"train_loss": -27.884382247924805, "global_step": 595055, "epoch": 7169} {"train_loss": -27.80243492126465, "global_step": 595056, "epoch": 7169} {"train_loss": -28.17246437072754, "global_step": 595057, "epoch": 7169} {"train_loss": -28.028095245361328, "global_step": 595058, "epoch": 7169} {"train_loss": -27.636991500854492, "global_step": 595059, "epoch": 7169} {"train_loss": -28.013463973999023, "global_step": 595060, "epoch": 7169} {"train_loss": -28.076679229736328, "global_step": 595061, "epoch": 7169} {"train_loss": -28.125171661376953, "global_step": 595062, "epoch": 7169} {"train_loss": -27.97260856628418, "global_step": 595063, "epoch": 7169} {"train_loss": -28.150354385375977, "global_step": 595064, "epoch": 7169} {"train_loss": -27.74053382873535, "global_step": 595065, "epoch": 7169} {"train_loss": -28.342065811157227, "global_step": 595066, "epoch": 7169} {"train_loss": -27.9583683013916, "global_step": 595067, "epoch": 7169} {"train_loss": -27.95138931274414, "global_step": 595068, "epoch": 7169} {"train_loss": -28.306921005249023, "global_step": 595069, "epoch": 7169} {"train_loss": -27.583219528198242, "global_step": 595070, "epoch": 7169} {"train_loss": -28.275531768798828, "global_step": 595071, "epoch": 7169} {"train_loss": -28.051950454711914, "global_step": 595072, "epoch": 7169} {"train_loss": -27.96319580078125, "global_step": 595073, "epoch": 7169} {"train_loss": -28.046972274780273, "global_step": 595074, "epoch": 7169} {"train_loss": -28.49674415588379, "global_step": 595075, "epoch": 7169} {"train_loss": -28.412317276000977, "global_step": 595076, "epoch": 7169} {"train_loss": -28.417102813720703, "global_step": 595077, "epoch": 7169} {"train_loss": -28.291608810424805, "global_step": 595078, "epoch": 7169} {"train_loss": -28.15810203552246, "global_step": 595079, "epoch": 7169} {"train_loss": -28.310760498046875, "global_step": 595080, "epoch": 7169} {"train_loss": -27.99588394165039, "global_step": 595081, "epoch": 7169} {"train_loss": -28.016254425048828, "global_step": 595082, "epoch": 7169} {"train_loss": -28.01236343383789, "global_step": 595083, "epoch": 7169} {"train_loss": -28.203893661499023, "global_step": 595084, "epoch": 7169} {"train_loss": -28.091033935546875, "global_step": 595085, "epoch": 7169} {"train_loss": -27.913877487182617, "global_step": 595086, "epoch": 7169} {"train_loss": -27.8265438079834, "global_step": 595087, "epoch": 7169} {"train_loss": -27.152746200561523, "global_step": 595088, "epoch": 7169} {"train_loss": -28.033361434936523, "global_step": 595089, "epoch": 7169} {"train_loss": -28.214557647705078, "global_step": 595090, "epoch": 7169} {"train_loss": -28.11639976501465, "global_step": 595091, "epoch": 7169} {"train_loss": -27.701684951782227, "global_step": 595092, "epoch": 7169} {"train_loss": -28.16242027282715, "global_step": 595093, "epoch": 7169} {"train_loss": -27.795434951782227, "global_step": 595094, "epoch": 7169} {"train_loss": -28.057025909423828, "global_step": 595095, "epoch": 7169} {"train_loss": -27.82635498046875, "global_step": 595096, "epoch": 7169} {"train_loss": -28.260986328125, "global_step": 595097, "epoch": 7169} {"train_loss": -28.013031005859375, "global_step": 595098, "epoch": 7169} {"train_loss": -28.038482666015625, "global_step": 595099, "epoch": 7169} {"train_loss": -28.173063278198242, "global_step": 595100, "epoch": 7169} {"train_loss": -28.035663604736328, "global_step": 595101, "epoch": 7169} {"train_loss": -28.07404899597168, "global_step": 595102, "epoch": 7169} {"train_loss": -28.201374053955078, "global_step": 595103, "epoch": 7169} {"train_loss": -28.132232666015625, "global_step": 595104, "epoch": 7169} {"train_loss": -28.257726669311523, "global_step": 595105, "epoch": 7169} {"train_loss": -27.93487548828125, "global_step": 595106, "epoch": 7169} {"train_loss": -28.142337799072266, "global_step": 595107, "epoch": 7169} {"train_loss": -27.967248916625977, "global_step": 595108, "epoch": 7169} {"train_loss": -27.860193114682854, "global_step": 595109, "epoch": 7169, "val_loss": 6651879.0} {"train_loss": -25.64181900024414, "global_step": 595110, "epoch": 7170} {"train_loss": -26.445770263671875, "global_step": 595111, "epoch": 7170} {"train_loss": -26.902429580688477, "global_step": 595112, "epoch": 7170} {"train_loss": -26.832672119140625, "global_step": 595113, "epoch": 7170} {"train_loss": -27.350940704345703, "global_step": 595114, "epoch": 7170} {"train_loss": -27.811689376831055, "global_step": 595115, "epoch": 7170} {"train_loss": -27.282373428344727, "global_step": 595116, "epoch": 7170} {"train_loss": -27.28558349609375, "global_step": 595117, "epoch": 7170} {"train_loss": -27.375181198120117, "global_step": 595118, "epoch": 7170} {"train_loss": -27.53580093383789, "global_step": 595119, "epoch": 7170} {"train_loss": -26.980777740478516, "global_step": 595120, "epoch": 7170} {"train_loss": -27.2762451171875, "global_step": 595121, "epoch": 7170} {"train_loss": -27.43499183654785, "global_step": 595122, "epoch": 7170} {"train_loss": -26.896560668945312, "global_step": 595123, "epoch": 7170} {"train_loss": -27.745771408081055, "global_step": 595124, "epoch": 7170} {"train_loss": -27.19379997253418, "global_step": 595125, "epoch": 7170} {"train_loss": -27.39325523376465, "global_step": 595126, "epoch": 7170} {"train_loss": -27.655405044555664, "global_step": 595127, "epoch": 7170} {"train_loss": -27.645740509033203, "global_step": 595128, "epoch": 7170} {"train_loss": -27.662878036499023, "global_step": 595129, "epoch": 7170} {"train_loss": -27.153167724609375, "global_step": 595130, "epoch": 7170} {"train_loss": -27.795612335205078, "global_step": 595131, "epoch": 7170} {"train_loss": -27.43018913269043, "global_step": 595132, "epoch": 7170} {"train_loss": -27.72000503540039, "global_step": 595133, "epoch": 7170} {"train_loss": -27.264850616455078, "global_step": 595134, "epoch": 7170} {"train_loss": -27.8161563873291, "global_step": 595135, "epoch": 7170} {"train_loss": -27.756458282470703, "global_step": 595136, "epoch": 7170} {"train_loss": -27.85016441345215, "global_step": 595137, "epoch": 7170} {"train_loss": -27.994354248046875, "global_step": 595138, "epoch": 7170} {"train_loss": -28.1226863861084, "global_step": 595139, "epoch": 7170} {"train_loss": -28.066247940063477, "global_step": 595140, "epoch": 7170} {"train_loss": -27.576276779174805, "global_step": 595141, "epoch": 7170} {"train_loss": -28.0812931060791, "global_step": 595142, "epoch": 7170} {"train_loss": -27.60177993774414, "global_step": 595143, "epoch": 7170} {"train_loss": -28.222700119018555, "global_step": 595144, "epoch": 7170} {"train_loss": -27.963342666625977, "global_step": 595145, "epoch": 7170} {"train_loss": -27.594640731811523, "global_step": 595146, "epoch": 7170} {"train_loss": -27.924396514892578, "global_step": 595147, "epoch": 7170} {"train_loss": -28.142200469970703, "global_step": 595148, "epoch": 7170} {"train_loss": -27.437101364135742, "global_step": 595149, "epoch": 7170} {"train_loss": -27.81741714477539, "global_step": 595150, "epoch": 7170} {"train_loss": -28.14619255065918, "global_step": 595151, "epoch": 7170} {"train_loss": -28.300891876220703, "global_step": 595152, "epoch": 7170} {"train_loss": -27.991458892822266, "global_step": 595153, "epoch": 7170} {"train_loss": -27.8049373626709, "global_step": 595154, "epoch": 7170} {"train_loss": -27.3212890625, "global_step": 595155, "epoch": 7170} {"train_loss": -27.96734619140625, "global_step": 595156, "epoch": 7170} {"train_loss": -27.746137619018555, "global_step": 595157, "epoch": 7170} {"train_loss": -27.97747802734375, "global_step": 595158, "epoch": 7170} {"train_loss": -28.160755157470703, "global_step": 595159, "epoch": 7170} {"train_loss": -27.77692985534668, "global_step": 595160, "epoch": 7170} {"train_loss": -28.262659072875977, "global_step": 595161, "epoch": 7170} {"train_loss": -27.67340087890625, "global_step": 595162, "epoch": 7170} {"train_loss": -28.25519371032715, "global_step": 595163, "epoch": 7170} {"train_loss": -27.903982162475586, "global_step": 595164, "epoch": 7170} {"train_loss": -28.381696701049805, "global_step": 595165, "epoch": 7170} {"train_loss": -27.83765983581543, "global_step": 595166, "epoch": 7170} {"train_loss": -27.68366813659668, "global_step": 595167, "epoch": 7170} {"train_loss": -28.133142471313477, "global_step": 595168, "epoch": 7170} {"train_loss": -28.215351104736328, "global_step": 595169, "epoch": 7170} {"train_loss": -27.572092056274414, "global_step": 595170, "epoch": 7170} {"train_loss": -27.873376846313477, "global_step": 595171, "epoch": 7170} {"train_loss": -28.200897216796875, "global_step": 595172, "epoch": 7170} {"train_loss": -28.17877769470215, "global_step": 595173, "epoch": 7170} {"train_loss": -28.097339630126953, "global_step": 595174, "epoch": 7170} {"train_loss": -27.64789390563965, "global_step": 595175, "epoch": 7170} {"train_loss": -27.956418991088867, "global_step": 595176, "epoch": 7170} {"train_loss": -27.937292098999023, "global_step": 595177, "epoch": 7170} {"train_loss": -28.119726181030273, "global_step": 595178, "epoch": 7170} {"train_loss": -27.977643966674805, "global_step": 595179, "epoch": 7170} {"train_loss": -27.932687759399414, "global_step": 595180, "epoch": 7170} {"train_loss": -28.0677433013916, "global_step": 595181, "epoch": 7170} {"train_loss": -27.648269653320312, "global_step": 595182, "epoch": 7170} {"train_loss": -27.86149024963379, "global_step": 595183, "epoch": 7170} {"train_loss": -27.982624053955078, "global_step": 595184, "epoch": 7170} {"train_loss": -28.097396850585938, "global_step": 595185, "epoch": 7170} {"train_loss": -28.041976928710938, "global_step": 595186, "epoch": 7170} {"train_loss": -27.69049072265625, "global_step": 595187, "epoch": 7170} {"train_loss": -27.9427433013916, "global_step": 595188, "epoch": 7170} {"train_loss": -28.493534088134766, "global_step": 595189, "epoch": 7170} {"train_loss": -27.905303955078125, "global_step": 595190, "epoch": 7170} {"train_loss": -27.820178985595703, "global_step": 595191, "epoch": 7170} {"train_loss": -27.742383612207618, "global_step": 595192, "epoch": 7170, "val_loss": 6634981.5} {"train_loss": -27.691162109375, "global_step": 595193, "epoch": 7171} {"train_loss": -27.64597511291504, "global_step": 595194, "epoch": 7171} {"train_loss": -27.70145034790039, "global_step": 595195, "epoch": 7171} {"train_loss": -27.898529052734375, "global_step": 595196, "epoch": 7171} {"train_loss": -27.285470962524414, "global_step": 595197, "epoch": 7171} {"train_loss": -27.509708404541016, "global_step": 595198, "epoch": 7171} {"train_loss": -27.893264770507812, "global_step": 595199, "epoch": 7171} {"train_loss": -27.46168327331543, "global_step": 595200, "epoch": 7171} {"train_loss": -27.16214942932129, "global_step": 595201, "epoch": 7171} {"train_loss": -27.329212188720703, "global_step": 595202, "epoch": 7171} {"train_loss": -27.786121368408203, "global_step": 595203, "epoch": 7171} {"train_loss": -27.552743911743164, "global_step": 595204, "epoch": 7171} {"train_loss": -26.764585494995117, "global_step": 595205, "epoch": 7171} {"train_loss": -27.674280166625977, "global_step": 595206, "epoch": 7171} {"train_loss": -27.82474136352539, "global_step": 595207, "epoch": 7171} {"train_loss": -27.512487411499023, "global_step": 595208, "epoch": 7171} {"train_loss": -27.983945846557617, "global_step": 595209, "epoch": 7171} {"train_loss": -27.691186904907227, "global_step": 595210, "epoch": 7171} {"train_loss": -27.388031005859375, "global_step": 595211, "epoch": 7171} {"train_loss": -27.749765396118164, "global_step": 595212, "epoch": 7171} {"train_loss": -27.83257484436035, "global_step": 595213, "epoch": 7171} {"train_loss": -27.5828800201416, "global_step": 595214, "epoch": 7171} {"train_loss": -27.707172393798828, "global_step": 595215, "epoch": 7171} {"train_loss": -27.745534896850586, "global_step": 595216, "epoch": 7171} {"train_loss": -27.8889217376709, "global_step": 595217, "epoch": 7171} {"train_loss": -27.64984130859375, "global_step": 595218, "epoch": 7171} {"train_loss": -28.12908363342285, "global_step": 595219, "epoch": 7171} {"train_loss": -27.701889038085938, "global_step": 595220, "epoch": 7171} {"train_loss": -27.931554794311523, "global_step": 595221, "epoch": 7171} {"train_loss": -27.818029403686523, "global_step": 595222, "epoch": 7171} {"train_loss": -28.1295108795166, "global_step": 595223, "epoch": 7171} {"train_loss": -27.733295440673828, "global_step": 595224, "epoch": 7171} {"train_loss": -27.909839630126953, "global_step": 595225, "epoch": 7171} {"train_loss": -28.183637619018555, "global_step": 595226, "epoch": 7171} {"train_loss": -27.8690185546875, "global_step": 595227, "epoch": 7171} {"train_loss": -27.879867553710938, "global_step": 595228, "epoch": 7171} {"train_loss": -27.740436553955078, "global_step": 595229, "epoch": 7171} {"train_loss": -28.0092716217041, "global_step": 595230, "epoch": 7171} {"train_loss": -27.738407135009766, "global_step": 595231, "epoch": 7171} {"train_loss": -28.20767593383789, "global_step": 595232, "epoch": 7171} {"train_loss": -28.423065185546875, "global_step": 595233, "epoch": 7171} {"train_loss": -28.278547286987305, "global_step": 595234, "epoch": 7171} {"train_loss": -28.2086124420166, "global_step": 595235, "epoch": 7171} {"train_loss": -28.23554801940918, "global_step": 595236, "epoch": 7171} {"train_loss": -28.197092056274414, "global_step": 595237, "epoch": 7171} {"train_loss": -28.2086124420166, "global_step": 595238, "epoch": 7171} {"train_loss": -28.255844116210938, "global_step": 595239, "epoch": 7171} {"train_loss": -28.130884170532227, "global_step": 595240, "epoch": 7171} {"train_loss": -28.224430084228516, "global_step": 595241, "epoch": 7171} {"train_loss": -28.413965225219727, "global_step": 595242, "epoch": 7171} {"train_loss": -28.349903106689453, "global_step": 595243, "epoch": 7171} {"train_loss": -28.132104873657227, "global_step": 595244, "epoch": 7171} {"train_loss": -28.050418853759766, "global_step": 595245, "epoch": 7171} {"train_loss": -27.9840145111084, "global_step": 595246, "epoch": 7171} {"train_loss": -27.888797760009766, "global_step": 595247, "epoch": 7171} {"train_loss": -28.1102237701416, "global_step": 595248, "epoch": 7171} {"train_loss": -27.93074607849121, "global_step": 595249, "epoch": 7171} {"train_loss": -27.65231704711914, "global_step": 595250, "epoch": 7171} {"train_loss": -27.914655685424805, "global_step": 595251, "epoch": 7171} {"train_loss": -28.036008834838867, "global_step": 595252, "epoch": 7171} {"train_loss": -27.857471466064453, "global_step": 595253, "epoch": 7171} {"train_loss": -28.00777244567871, "global_step": 595254, "epoch": 7171} {"train_loss": -27.460926055908203, "global_step": 595255, "epoch": 7171} {"train_loss": -27.57175636291504, "global_step": 595256, "epoch": 7171} {"train_loss": -28.06390953063965, "global_step": 595257, "epoch": 7171} {"train_loss": -27.627655029296875, "global_step": 595258, "epoch": 7171} {"train_loss": -28.1131649017334, "global_step": 595259, "epoch": 7171} {"train_loss": -27.159107208251953, "global_step": 595260, "epoch": 7171} {"train_loss": -27.423551559448242, "global_step": 595261, "epoch": 7171} {"train_loss": -27.794702529907227, "global_step": 595262, "epoch": 7171} {"train_loss": -27.700048446655273, "global_step": 595263, "epoch": 7171} {"train_loss": -27.892297744750977, "global_step": 595264, "epoch": 7171} {"train_loss": -27.46889305114746, "global_step": 595265, "epoch": 7171} {"train_loss": -27.651060104370117, "global_step": 595266, "epoch": 7171} {"train_loss": -27.93177604675293, "global_step": 595267, "epoch": 7171} {"train_loss": -27.871850967407227, "global_step": 595268, "epoch": 7171} {"train_loss": -27.85200309753418, "global_step": 595269, "epoch": 7171} {"train_loss": -27.969587326049805, "global_step": 595270, "epoch": 7171} {"train_loss": -28.08418083190918, "global_step": 595271, "epoch": 7171} {"train_loss": -28.193191528320312, "global_step": 595272, "epoch": 7171} {"train_loss": -27.750619888305664, "global_step": 595273, "epoch": 7171} {"train_loss": -28.18202018737793, "global_step": 595274, "epoch": 7171} {"train_loss": -27.84352856371776, "global_step": 595275, "epoch": 7171, "val_loss": 6553013.0} {"train_loss": -26.626861572265625, "global_step": 595276, "epoch": 7172} {"train_loss": -26.915302276611328, "global_step": 595277, "epoch": 7172} {"train_loss": -27.786672592163086, "global_step": 595278, "epoch": 7172} {"train_loss": -27.44977378845215, "global_step": 595279, "epoch": 7172} {"train_loss": -27.77353286743164, "global_step": 595280, "epoch": 7172} {"train_loss": -27.251758575439453, "global_step": 595281, "epoch": 7172} {"train_loss": -27.4096622467041, "global_step": 595282, "epoch": 7172} {"train_loss": -27.39613151550293, "global_step": 595283, "epoch": 7172} {"train_loss": -27.7232723236084, "global_step": 595284, "epoch": 7172} {"train_loss": -27.49213218688965, "global_step": 595285, "epoch": 7172} {"train_loss": -27.690351486206055, "global_step": 595286, "epoch": 7172} {"train_loss": -27.774686813354492, "global_step": 595287, "epoch": 7172} {"train_loss": -27.335668563842773, "global_step": 595288, "epoch": 7172} {"train_loss": -27.58538246154785, "global_step": 595289, "epoch": 7172} {"train_loss": -27.516773223876953, "global_step": 595290, "epoch": 7172} {"train_loss": -27.672956466674805, "global_step": 595291, "epoch": 7172} {"train_loss": -27.5122127532959, "global_step": 595292, "epoch": 7172} {"train_loss": -27.783777236938477, "global_step": 595293, "epoch": 7172} {"train_loss": -27.5296688079834, "global_step": 595294, "epoch": 7172} {"train_loss": -28.048364639282227, "global_step": 595295, "epoch": 7172} {"train_loss": -27.748279571533203, "global_step": 595296, "epoch": 7172} {"train_loss": -27.820926666259766, "global_step": 595297, "epoch": 7172} {"train_loss": -27.99509620666504, "global_step": 595298, "epoch": 7172} {"train_loss": -28.07246208190918, "global_step": 595299, "epoch": 7172} {"train_loss": -27.87042808532715, "global_step": 595300, "epoch": 7172} {"train_loss": -28.080493927001953, "global_step": 595301, "epoch": 7172} {"train_loss": -28.129301071166992, "global_step": 595302, "epoch": 7172} {"train_loss": -28.258197784423828, "global_step": 595303, "epoch": 7172} {"train_loss": -27.88250160217285, "global_step": 595304, "epoch": 7172} {"train_loss": -28.139419555664062, "global_step": 595305, "epoch": 7172} {"train_loss": -27.770837783813477, "global_step": 595306, "epoch": 7172} {"train_loss": -28.07794761657715, "global_step": 595307, "epoch": 7172} {"train_loss": -27.829059600830078, "global_step": 595308, "epoch": 7172} {"train_loss": -27.919111251831055, "global_step": 595309, "epoch": 7172} {"train_loss": -28.080610275268555, "global_step": 595310, "epoch": 7172} {"train_loss": -28.177967071533203, "global_step": 595311, "epoch": 7172} {"train_loss": -28.02048683166504, "global_step": 595312, "epoch": 7172} {"train_loss": -28.058948516845703, "global_step": 595313, "epoch": 7172} {"train_loss": -28.157501220703125, "global_step": 595314, "epoch": 7172} {"train_loss": -28.40436363220215, "global_step": 595315, "epoch": 7172} {"train_loss": -27.854528427124023, "global_step": 595316, "epoch": 7172} {"train_loss": -27.92574119567871, "global_step": 595317, "epoch": 7172} {"train_loss": -28.1662654876709, "global_step": 595318, "epoch": 7172} {"train_loss": -27.6965274810791, "global_step": 595319, "epoch": 7172} {"train_loss": -27.923315048217773, "global_step": 595320, "epoch": 7172} {"train_loss": -27.6651554107666, "global_step": 595321, "epoch": 7172} {"train_loss": -28.33698844909668, "global_step": 595322, "epoch": 7172} {"train_loss": -27.9471435546875, "global_step": 595323, "epoch": 7172} {"train_loss": -27.889493942260742, "global_step": 595324, "epoch": 7172} {"train_loss": -27.657495498657227, "global_step": 595325, "epoch": 7172} {"train_loss": -27.96747398376465, "global_step": 595326, "epoch": 7172} {"train_loss": -28.652267456054688, "global_step": 595327, "epoch": 7172} {"train_loss": -28.113855361938477, "global_step": 595328, "epoch": 7172} {"train_loss": -28.04987144470215, "global_step": 595329, "epoch": 7172} {"train_loss": -28.001052856445312, "global_step": 595330, "epoch": 7172} {"train_loss": -28.343006134033203, "global_step": 595331, "epoch": 7172} {"train_loss": -28.071313858032227, "global_step": 595332, "epoch": 7172} {"train_loss": -28.196426391601562, "global_step": 595333, "epoch": 7172} {"train_loss": -28.314367294311523, "global_step": 595334, "epoch": 7172} {"train_loss": -28.35273551940918, "global_step": 595335, "epoch": 7172} {"train_loss": -28.391605377197266, "global_step": 595336, "epoch": 7172} {"train_loss": -27.82855224609375, "global_step": 595337, "epoch": 7172} {"train_loss": -28.149816513061523, "global_step": 595338, "epoch": 7172} {"train_loss": -28.185766220092773, "global_step": 595339, "epoch": 7172} {"train_loss": -28.28778648376465, "global_step": 595340, "epoch": 7172} {"train_loss": -28.39826774597168, "global_step": 595341, "epoch": 7172} {"train_loss": -28.073400497436523, "global_step": 595342, "epoch": 7172} {"train_loss": -28.09163475036621, "global_step": 595343, "epoch": 7172} {"train_loss": -28.102466583251953, "global_step": 595344, "epoch": 7172} {"train_loss": -28.142959594726562, "global_step": 595345, "epoch": 7172} {"train_loss": -28.21734619140625, "global_step": 595346, "epoch": 7172} {"train_loss": -28.418066024780273, "global_step": 595347, "epoch": 7172} {"train_loss": -28.121124267578125, "global_step": 595348, "epoch": 7172} {"train_loss": -28.119306564331055, "global_step": 595349, "epoch": 7172} {"train_loss": -28.074371337890625, "global_step": 595350, "epoch": 7172} {"train_loss": -27.99667739868164, "global_step": 595351, "epoch": 7172} {"train_loss": -28.222671508789062, "global_step": 595352, "epoch": 7172} {"train_loss": -28.316762924194336, "global_step": 595353, "epoch": 7172} {"train_loss": -28.095273971557617, "global_step": 595354, "epoch": 7172} {"train_loss": -28.256622314453125, "global_step": 595355, "epoch": 7172} {"train_loss": -28.765729904174805, "global_step": 595356, "epoch": 7172} {"train_loss": -28.19940757751465, "global_step": 595357, "epoch": 7172} {"train_loss": -27.959444873304253, "global_step": 595358, "epoch": 7172, "val_loss": 6652190.5} {"train_loss": -28.018613815307617, "global_step": 595359, "epoch": 7173} {"train_loss": -27.077362060546875, "global_step": 595360, "epoch": 7173} {"train_loss": -27.120105743408203, "global_step": 595361, "epoch": 7173} {"train_loss": -27.164255142211914, "global_step": 595362, "epoch": 7173} {"train_loss": -27.273834228515625, "global_step": 595363, "epoch": 7173} {"train_loss": -27.771249771118164, "global_step": 595364, "epoch": 7173} {"train_loss": -27.6787052154541, "global_step": 595365, "epoch": 7173} {"train_loss": -27.2149600982666, "global_step": 595366, "epoch": 7173} {"train_loss": -26.978052139282227, "global_step": 595367, "epoch": 7173} {"train_loss": -27.184894561767578, "global_step": 595368, "epoch": 7173} {"train_loss": -28.002334594726562, "global_step": 595369, "epoch": 7173} {"train_loss": -27.247228622436523, "global_step": 595370, "epoch": 7173} {"train_loss": -27.693317413330078, "global_step": 595371, "epoch": 7173} {"train_loss": -27.480825424194336, "global_step": 595372, "epoch": 7173} {"train_loss": -27.42519187927246, "global_step": 595373, "epoch": 7173} {"train_loss": -27.503936767578125, "global_step": 595374, "epoch": 7173} {"train_loss": -27.747583389282227, "global_step": 595375, "epoch": 7173} {"train_loss": -27.39947509765625, "global_step": 595376, "epoch": 7173} {"train_loss": -28.012165069580078, "global_step": 595377, "epoch": 7173} {"train_loss": -27.912424087524414, "global_step": 595378, "epoch": 7173} {"train_loss": -27.925321578979492, "global_step": 595379, "epoch": 7173} {"train_loss": -27.651611328125, "global_step": 595380, "epoch": 7173} {"train_loss": -27.798416137695312, "global_step": 595381, "epoch": 7173} {"train_loss": -27.779382705688477, "global_step": 595382, "epoch": 7173} {"train_loss": -27.980207443237305, "global_step": 595383, "epoch": 7173} {"train_loss": -27.495344161987305, "global_step": 595384, "epoch": 7173} {"train_loss": -27.883056640625, "global_step": 595385, "epoch": 7173} {"train_loss": -27.884382247924805, "global_step": 595386, "epoch": 7173} {"train_loss": -27.969030380249023, "global_step": 595387, "epoch": 7173} {"train_loss": -27.706457138061523, "global_step": 595388, "epoch": 7173} {"train_loss": -27.7706356048584, "global_step": 595389, "epoch": 7173} {"train_loss": -27.872182846069336, "global_step": 595390, "epoch": 7173} {"train_loss": -28.202777862548828, "global_step": 595391, "epoch": 7173} {"train_loss": -27.94942283630371, "global_step": 595392, "epoch": 7173} {"train_loss": -27.825122833251953, "global_step": 595393, "epoch": 7173} {"train_loss": -28.241256713867188, "global_step": 595394, "epoch": 7173} {"train_loss": -28.230377197265625, "global_step": 595395, "epoch": 7173} {"train_loss": -27.8201904296875, "global_step": 595396, "epoch": 7173} {"train_loss": -27.820280075073242, "global_step": 595397, "epoch": 7173} {"train_loss": -27.981796264648438, "global_step": 595398, "epoch": 7173} {"train_loss": -28.22161865234375, "global_step": 595399, "epoch": 7173} {"train_loss": -28.198129653930664, "global_step": 595400, "epoch": 7173} {"train_loss": -28.225513458251953, "global_step": 595401, "epoch": 7173} {"train_loss": -28.156736373901367, "global_step": 595402, "epoch": 7173} {"train_loss": -28.05198097229004, "global_step": 595403, "epoch": 7173} {"train_loss": -27.849475860595703, "global_step": 595404, "epoch": 7173} {"train_loss": -28.039997100830078, "global_step": 595405, "epoch": 7173} {"train_loss": -28.04032325744629, "global_step": 595406, "epoch": 7173} {"train_loss": -27.964590072631836, "global_step": 595407, "epoch": 7173} {"train_loss": -28.313343048095703, "global_step": 595408, "epoch": 7173} {"train_loss": -28.334692001342773, "global_step": 595409, "epoch": 7173} {"train_loss": -28.175039291381836, "global_step": 595410, "epoch": 7173} {"train_loss": -28.3685245513916, "global_step": 595411, "epoch": 7173} {"train_loss": -28.269214630126953, "global_step": 595412, "epoch": 7173} {"train_loss": -28.284765243530273, "global_step": 595413, "epoch": 7173} {"train_loss": -28.32295036315918, "global_step": 595414, "epoch": 7173} {"train_loss": -28.122283935546875, "global_step": 595415, "epoch": 7173} {"train_loss": -28.20208740234375, "global_step": 595416, "epoch": 7173} {"train_loss": -28.460254669189453, "global_step": 595417, "epoch": 7173} {"train_loss": -28.209976196289062, "global_step": 595418, "epoch": 7173} {"train_loss": -28.403818130493164, "global_step": 595419, "epoch": 7173} {"train_loss": -28.14789390563965, "global_step": 595420, "epoch": 7173} {"train_loss": -28.069936752319336, "global_step": 595421, "epoch": 7173} {"train_loss": -28.221105575561523, "global_step": 595422, "epoch": 7173} {"train_loss": -27.957412719726562, "global_step": 595423, "epoch": 7173} {"train_loss": -28.428726196289062, "global_step": 595424, "epoch": 7173} {"train_loss": -28.37881851196289, "global_step": 595425, "epoch": 7173} {"train_loss": -27.870391845703125, "global_step": 595426, "epoch": 7173} {"train_loss": -28.149423599243164, "global_step": 595427, "epoch": 7173} {"train_loss": -28.129247665405273, "global_step": 595428, "epoch": 7173} {"train_loss": -27.79031753540039, "global_step": 595429, "epoch": 7173} {"train_loss": -28.05926513671875, "global_step": 595430, "epoch": 7173} {"train_loss": -27.775745391845703, "global_step": 595431, "epoch": 7173} {"train_loss": -27.89849853515625, "global_step": 595432, "epoch": 7173} {"train_loss": -27.514352798461914, "global_step": 595433, "epoch": 7173} {"train_loss": -27.242324829101562, "global_step": 595434, "epoch": 7173} {"train_loss": -27.61431312561035, "global_step": 595435, "epoch": 7173} {"train_loss": -27.372650146484375, "global_step": 595436, "epoch": 7173} {"train_loss": -27.18855094909668, "global_step": 595437, "epoch": 7173} {"train_loss": -28.13791847229004, "global_step": 595438, "epoch": 7173} {"train_loss": -27.641407012939453, "global_step": 595439, "epoch": 7173} {"train_loss": -27.676496505737305, "global_step": 595440, "epoch": 7173} {"train_loss": -27.86477771437312, "global_step": 595441, "epoch": 7173, "val_loss": 6626459.0} {"train_loss": -26.429553985595703, "global_step": 595442, "epoch": 7174} {"train_loss": -25.934202194213867, "global_step": 595443, "epoch": 7174} {"train_loss": -25.982196807861328, "global_step": 595444, "epoch": 7174} {"train_loss": -27.621551513671875, "global_step": 595445, "epoch": 7174} {"train_loss": -26.937667846679688, "global_step": 595446, "epoch": 7174} {"train_loss": -26.706159591674805, "global_step": 595447, "epoch": 7174} {"train_loss": -27.25704002380371, "global_step": 595448, "epoch": 7174} {"train_loss": -27.331464767456055, "global_step": 595449, "epoch": 7174} {"train_loss": -26.785200119018555, "global_step": 595450, "epoch": 7174} {"train_loss": -27.321237564086914, "global_step": 595451, "epoch": 7174} {"train_loss": -27.1173038482666, "global_step": 595452, "epoch": 7174} {"train_loss": -27.3430233001709, "global_step": 595453, "epoch": 7174} {"train_loss": -27.432926177978516, "global_step": 595454, "epoch": 7174} {"train_loss": -27.60114097595215, "global_step": 595455, "epoch": 7174} {"train_loss": -27.632904052734375, "global_step": 595456, "epoch": 7174} {"train_loss": -27.557132720947266, "global_step": 595457, "epoch": 7174} {"train_loss": -27.63530921936035, "global_step": 595458, "epoch": 7174} {"train_loss": -27.3210391998291, "global_step": 595459, "epoch": 7174} {"train_loss": -27.596826553344727, "global_step": 595460, "epoch": 7174} {"train_loss": -27.646997451782227, "global_step": 595461, "epoch": 7174} {"train_loss": -28.0155086517334, "global_step": 595462, "epoch": 7174} {"train_loss": -27.685657501220703, "global_step": 595463, "epoch": 7174} {"train_loss": -28.120258331298828, "global_step": 595464, "epoch": 7174} {"train_loss": -27.7751522064209, "global_step": 595465, "epoch": 7174} {"train_loss": -27.409826278686523, "global_step": 595466, "epoch": 7174} {"train_loss": -27.871997833251953, "global_step": 595467, "epoch": 7174} {"train_loss": -28.124311447143555, "global_step": 595468, "epoch": 7174} {"train_loss": -28.006256103515625, "global_step": 595469, "epoch": 7174} {"train_loss": -27.92511558532715, "global_step": 595470, "epoch": 7174} {"train_loss": -28.09515380859375, "global_step": 595471, "epoch": 7174} {"train_loss": -27.874780654907227, "global_step": 595472, "epoch": 7174} {"train_loss": -27.90968132019043, "global_step": 595473, "epoch": 7174} {"train_loss": -27.988080978393555, "global_step": 595474, "epoch": 7174} {"train_loss": -28.169382095336914, "global_step": 595475, "epoch": 7174} {"train_loss": -27.943750381469727, "global_step": 595476, "epoch": 7174} {"train_loss": -28.26067543029785, "global_step": 595477, "epoch": 7174} {"train_loss": -27.887784957885742, "global_step": 595478, "epoch": 7174} {"train_loss": -28.218433380126953, "global_step": 595479, "epoch": 7174} {"train_loss": -28.221914291381836, "global_step": 595480, "epoch": 7174} {"train_loss": -28.130542755126953, "global_step": 595481, "epoch": 7174} {"train_loss": -27.744062423706055, "global_step": 595482, "epoch": 7174} {"train_loss": -28.213871002197266, "global_step": 595483, "epoch": 7174} {"train_loss": -28.051773071289062, "global_step": 595484, "epoch": 7174} {"train_loss": -28.386005401611328, "global_step": 595485, "epoch": 7174} {"train_loss": -27.896320343017578, "global_step": 595486, "epoch": 7174} {"train_loss": -28.191083908081055, "global_step": 595487, "epoch": 7174} {"train_loss": -28.353185653686523, "global_step": 595488, "epoch": 7174} {"train_loss": -28.397321701049805, "global_step": 595489, "epoch": 7174} {"train_loss": -27.945911407470703, "global_step": 595490, "epoch": 7174} {"train_loss": -28.18757438659668, "global_step": 595491, "epoch": 7174} {"train_loss": -28.236230850219727, "global_step": 595492, "epoch": 7174} {"train_loss": -28.357629776000977, "global_step": 595493, "epoch": 7174} {"train_loss": -28.0662899017334, "global_step": 595494, "epoch": 7174} {"train_loss": -28.2791748046875, "global_step": 595495, "epoch": 7174} {"train_loss": -28.11847496032715, "global_step": 595496, "epoch": 7174} {"train_loss": -28.0594482421875, "global_step": 595497, "epoch": 7174} {"train_loss": -28.35505485534668, "global_step": 595498, "epoch": 7174} {"train_loss": -27.77121353149414, "global_step": 595499, "epoch": 7174} {"train_loss": -28.012231826782227, "global_step": 595500, "epoch": 7174} {"train_loss": -28.535139083862305, "global_step": 595501, "epoch": 7174} {"train_loss": -28.223373413085938, "global_step": 595502, "epoch": 7174} {"train_loss": -28.062597274780273, "global_step": 595503, "epoch": 7174} {"train_loss": -28.290063858032227, "global_step": 595504, "epoch": 7174} {"train_loss": -28.219940185546875, "global_step": 595505, "epoch": 7174} {"train_loss": -27.953540802001953, "global_step": 595506, "epoch": 7174} {"train_loss": -28.272851943969727, "global_step": 595507, "epoch": 7174} {"train_loss": -28.034626007080078, "global_step": 595508, "epoch": 7174} {"train_loss": -28.286767959594727, "global_step": 595509, "epoch": 7174} {"train_loss": -28.15662956237793, "global_step": 595510, "epoch": 7174} {"train_loss": -28.252826690673828, "global_step": 595511, "epoch": 7174} {"train_loss": -28.089588165283203, "global_step": 595512, "epoch": 7174} {"train_loss": -28.074254989624023, "global_step": 595513, "epoch": 7174} {"train_loss": -27.948659896850586, "global_step": 595514, "epoch": 7174} {"train_loss": -27.93782615661621, "global_step": 595515, "epoch": 7174} {"train_loss": -28.428863525390625, "global_step": 595516, "epoch": 7174} {"train_loss": -28.350194931030273, "global_step": 595517, "epoch": 7174} {"train_loss": -28.129316329956055, "global_step": 595518, "epoch": 7174} {"train_loss": -28.410730361938477, "global_step": 595519, "epoch": 7174} {"train_loss": -28.092334747314453, "global_step": 595520, "epoch": 7174} {"train_loss": -28.30079460144043, "global_step": 595521, "epoch": 7174} {"train_loss": -28.16315269470215, "global_step": 595522, "epoch": 7174} {"train_loss": -27.814361572265625, "global_step": 595523, "epoch": 7174} {"train_loss": -27.868111644882752, "global_step": 595524, "epoch": 7174, "val_loss": 6593215.0} {"train_loss": -27.77161979675293, "global_step": 595525, "epoch": 7175} {"train_loss": -27.480030059814453, "global_step": 595526, "epoch": 7175} {"train_loss": -27.631732940673828, "global_step": 595527, "epoch": 7175} {"train_loss": -27.274219512939453, "global_step": 595528, "epoch": 7175} {"train_loss": -27.249603271484375, "global_step": 595529, "epoch": 7175} {"train_loss": -27.794437408447266, "global_step": 595530, "epoch": 7175} {"train_loss": -27.890857696533203, "global_step": 595531, "epoch": 7175} {"train_loss": -27.69312858581543, "global_step": 595532, "epoch": 7175} {"train_loss": -27.55341911315918, "global_step": 595533, "epoch": 7175} {"train_loss": -27.640256881713867, "global_step": 595534, "epoch": 7175} {"train_loss": -27.67180824279785, "global_step": 595535, "epoch": 7175} {"train_loss": -27.894500732421875, "global_step": 595536, "epoch": 7175} {"train_loss": -28.110136032104492, "global_step": 595537, "epoch": 7175} {"train_loss": -27.71778678894043, "global_step": 595538, "epoch": 7175} {"train_loss": -27.737207412719727, "global_step": 595539, "epoch": 7175} {"train_loss": -27.50153923034668, "global_step": 595540, "epoch": 7175} {"train_loss": -27.70130729675293, "global_step": 595541, "epoch": 7175} {"train_loss": -27.858840942382812, "global_step": 595542, "epoch": 7175} {"train_loss": -27.901214599609375, "global_step": 595543, "epoch": 7175} {"train_loss": -27.567426681518555, "global_step": 595544, "epoch": 7175} {"train_loss": -28.203073501586914, "global_step": 595545, "epoch": 7175} {"train_loss": -27.47639274597168, "global_step": 595546, "epoch": 7175} {"train_loss": -27.78644371032715, "global_step": 595547, "epoch": 7175} {"train_loss": -27.877710342407227, "global_step": 595548, "epoch": 7175} {"train_loss": -28.050495147705078, "global_step": 595549, "epoch": 7175} {"train_loss": -27.37934684753418, "global_step": 595550, "epoch": 7175} {"train_loss": -28.212072372436523, "global_step": 595551, "epoch": 7175} {"train_loss": -27.93304443359375, "global_step": 595552, "epoch": 7175} {"train_loss": -28.007017135620117, "global_step": 595553, "epoch": 7175} {"train_loss": -27.565998077392578, "global_step": 595554, "epoch": 7175} {"train_loss": -27.627344131469727, "global_step": 595555, "epoch": 7175} {"train_loss": -27.803125381469727, "global_step": 595556, "epoch": 7175} {"train_loss": -27.9414119720459, "global_step": 595557, "epoch": 7175} {"train_loss": -27.596872329711914, "global_step": 595558, "epoch": 7175} {"train_loss": -27.91509437561035, "global_step": 595559, "epoch": 7175} {"train_loss": -27.67420768737793, "global_step": 595560, "epoch": 7175} {"train_loss": -27.913938522338867, "global_step": 595561, "epoch": 7175} {"train_loss": -28.054309844970703, "global_step": 595562, "epoch": 7175} {"train_loss": -27.881433486938477, "global_step": 595563, "epoch": 7175} {"train_loss": -27.86865234375, "global_step": 595564, "epoch": 7175} {"train_loss": -28.28986930847168, "global_step": 595565, "epoch": 7175} {"train_loss": -27.721893310546875, "global_step": 595566, "epoch": 7175} {"train_loss": -27.88545799255371, "global_step": 595567, "epoch": 7175} {"train_loss": -28.187976837158203, "global_step": 595568, "epoch": 7175} {"train_loss": -27.8980655670166, "global_step": 595569, "epoch": 7175} {"train_loss": -28.087690353393555, "global_step": 595570, "epoch": 7175} {"train_loss": -27.866254806518555, "global_step": 595571, "epoch": 7175} {"train_loss": -28.033288955688477, "global_step": 595572, "epoch": 7175} {"train_loss": -27.598703384399414, "global_step": 595573, "epoch": 7175} {"train_loss": -27.55109977722168, "global_step": 595574, "epoch": 7175} {"train_loss": -27.948450088500977, "global_step": 595575, "epoch": 7175} {"train_loss": -27.80350112915039, "global_step": 595576, "epoch": 7175} {"train_loss": -27.462270736694336, "global_step": 595577, "epoch": 7175} {"train_loss": -28.17939567565918, "global_step": 595578, "epoch": 7175} {"train_loss": -27.853132247924805, "global_step": 595579, "epoch": 7175} {"train_loss": -27.29541015625, "global_step": 595580, "epoch": 7175} {"train_loss": -27.75653076171875, "global_step": 595581, "epoch": 7175} {"train_loss": -27.877578735351562, "global_step": 595582, "epoch": 7175} {"train_loss": -28.022138595581055, "global_step": 595583, "epoch": 7175} {"train_loss": -27.960798263549805, "global_step": 595584, "epoch": 7175} {"train_loss": -27.726581573486328, "global_step": 595585, "epoch": 7175} {"train_loss": -28.255029678344727, "global_step": 595586, "epoch": 7175} {"train_loss": -28.387969970703125, "global_step": 595587, "epoch": 7175} {"train_loss": -28.062580108642578, "global_step": 595588, "epoch": 7175} {"train_loss": -28.183002471923828, "global_step": 595589, "epoch": 7175} {"train_loss": -27.7823543548584, "global_step": 595590, "epoch": 7175} {"train_loss": -27.976715087890625, "global_step": 595591, "epoch": 7175} {"train_loss": -28.07706069946289, "global_step": 595592, "epoch": 7175} {"train_loss": -28.065282821655273, "global_step": 595593, "epoch": 7175} {"train_loss": -27.8489990234375, "global_step": 595594, "epoch": 7175} {"train_loss": -27.96363639831543, "global_step": 595595, "epoch": 7175} {"train_loss": -28.01520347595215, "global_step": 595596, "epoch": 7175} {"train_loss": -28.191162109375, "global_step": 595597, "epoch": 7175} {"train_loss": -28.054828643798828, "global_step": 595598, "epoch": 7175} {"train_loss": -27.425695419311523, "global_step": 595599, "epoch": 7175} {"train_loss": -27.662952423095703, "global_step": 595600, "epoch": 7175} {"train_loss": -28.1859188079834, "global_step": 595601, "epoch": 7175} {"train_loss": -28.112598419189453, "global_step": 595602, "epoch": 7175} {"train_loss": -28.12163734436035, "global_step": 595603, "epoch": 7175} {"train_loss": -28.051822662353516, "global_step": 595604, "epoch": 7175} {"train_loss": -28.697538375854492, "global_step": 595605, "epoch": 7175} {"train_loss": -28.129480361938477, "global_step": 595606, "epoch": 7175} {"train_loss": -27.84985443482916, "global_step": 595607, "epoch": 7175, "val_loss": 6548059.0} {"train_loss": -27.2770938873291, "global_step": 595608, "epoch": 7176} {"train_loss": -25.825414657592773, "global_step": 595609, "epoch": 7176} {"train_loss": -27.45170021057129, "global_step": 595610, "epoch": 7176} {"train_loss": -27.3704833984375, "global_step": 595611, "epoch": 7176} {"train_loss": -27.119007110595703, "global_step": 595612, "epoch": 7176} {"train_loss": -27.729171752929688, "global_step": 595613, "epoch": 7176} {"train_loss": -27.29096794128418, "global_step": 595614, "epoch": 7176} {"train_loss": -27.51239013671875, "global_step": 595615, "epoch": 7176} {"train_loss": -26.88190269470215, "global_step": 595616, "epoch": 7176} {"train_loss": -27.121967315673828, "global_step": 595617, "epoch": 7176} {"train_loss": -27.5166072845459, "global_step": 595618, "epoch": 7176} {"train_loss": -27.709369659423828, "global_step": 595619, "epoch": 7176} {"train_loss": -27.098175048828125, "global_step": 595620, "epoch": 7176} {"train_loss": -27.56698989868164, "global_step": 595621, "epoch": 7176} {"train_loss": -27.455265045166016, "global_step": 595622, "epoch": 7176} {"train_loss": -27.76270866394043, "global_step": 595623, "epoch": 7176} {"train_loss": -27.264368057250977, "global_step": 595624, "epoch": 7176} {"train_loss": -27.9245548248291, "global_step": 595625, "epoch": 7176} {"train_loss": -27.82667350769043, "global_step": 595626, "epoch": 7176} {"train_loss": -27.954816818237305, "global_step": 595627, "epoch": 7176} {"train_loss": -28.121694564819336, "global_step": 595628, "epoch": 7176} {"train_loss": -28.0371150970459, "global_step": 595629, "epoch": 7176} {"train_loss": -28.004064559936523, "global_step": 595630, "epoch": 7176} {"train_loss": -27.68417739868164, "global_step": 595631, "epoch": 7176} {"train_loss": -28.016132354736328, "global_step": 595632, "epoch": 7176} {"train_loss": -27.91155433654785, "global_step": 595633, "epoch": 7176} {"train_loss": -28.08076286315918, "global_step": 595634, "epoch": 7176} {"train_loss": -27.879474639892578, "global_step": 595635, "epoch": 7176} {"train_loss": -27.998090744018555, "global_step": 595636, "epoch": 7176} {"train_loss": -27.810443878173828, "global_step": 595637, "epoch": 7176} {"train_loss": -27.756546020507812, "global_step": 595638, "epoch": 7176} {"train_loss": -27.848066329956055, "global_step": 595639, "epoch": 7176} {"train_loss": -28.055252075195312, "global_step": 595640, "epoch": 7176} {"train_loss": -27.73750114440918, "global_step": 595641, "epoch": 7176} {"train_loss": -27.562362670898438, "global_step": 595642, "epoch": 7176} {"train_loss": -27.658044815063477, "global_step": 595643, "epoch": 7176} {"train_loss": -28.104822158813477, "global_step": 595644, "epoch": 7176} {"train_loss": -28.108783721923828, "global_step": 595645, "epoch": 7176} {"train_loss": -28.140705108642578, "global_step": 595646, "epoch": 7176} {"train_loss": -28.012134552001953, "global_step": 595647, "epoch": 7176} {"train_loss": -28.046722412109375, "global_step": 595648, "epoch": 7176} {"train_loss": -28.10084342956543, "global_step": 595649, "epoch": 7176} {"train_loss": -27.88532066345215, "global_step": 595650, "epoch": 7176} {"train_loss": -27.84372329711914, "global_step": 595651, "epoch": 7176} {"train_loss": -28.379257202148438, "global_step": 595652, "epoch": 7176} {"train_loss": -28.190799713134766, "global_step": 595653, "epoch": 7176} {"train_loss": -28.146955490112305, "global_step": 595654, "epoch": 7176} {"train_loss": -28.561986923217773, "global_step": 595655, "epoch": 7176} {"train_loss": -28.4158992767334, "global_step": 595656, "epoch": 7176} {"train_loss": -27.89912986755371, "global_step": 595657, "epoch": 7176} {"train_loss": -28.1397705078125, "global_step": 595658, "epoch": 7176} {"train_loss": -28.383947372436523, "global_step": 595659, "epoch": 7176} {"train_loss": -28.2142333984375, "global_step": 595660, "epoch": 7176} {"train_loss": -28.242944717407227, "global_step": 595661, "epoch": 7176} {"train_loss": -28.307485580444336, "global_step": 595662, "epoch": 7176} {"train_loss": -28.460708618164062, "global_step": 595663, "epoch": 7176} {"train_loss": -28.325897216796875, "global_step": 595664, "epoch": 7176} {"train_loss": -28.14545249938965, "global_step": 595665, "epoch": 7176} {"train_loss": -28.191864013671875, "global_step": 595666, "epoch": 7176} {"train_loss": -27.85584831237793, "global_step": 595667, "epoch": 7176} {"train_loss": -27.904050827026367, "global_step": 595668, "epoch": 7176} {"train_loss": -28.100784301757812, "global_step": 595669, "epoch": 7176} {"train_loss": -27.83762550354004, "global_step": 595670, "epoch": 7176} {"train_loss": -28.325292587280273, "global_step": 595671, "epoch": 7176} {"train_loss": -28.38214111328125, "global_step": 595672, "epoch": 7176} {"train_loss": -27.950063705444336, "global_step": 595673, "epoch": 7176} {"train_loss": -28.075307846069336, "global_step": 595674, "epoch": 7176} {"train_loss": -27.39373779296875, "global_step": 595675, "epoch": 7176} {"train_loss": -27.560510635375977, "global_step": 595676, "epoch": 7176} {"train_loss": -27.41376304626465, "global_step": 595677, "epoch": 7176} {"train_loss": -28.035037994384766, "global_step": 595678, "epoch": 7176} {"train_loss": -28.387414932250977, "global_step": 595679, "epoch": 7176} {"train_loss": -28.214252471923828, "global_step": 595680, "epoch": 7176} {"train_loss": -28.095056533813477, "global_step": 595681, "epoch": 7176} {"train_loss": -27.53946304321289, "global_step": 595682, "epoch": 7176} {"train_loss": -27.842060089111328, "global_step": 595683, "epoch": 7176} {"train_loss": -27.9648380279541, "global_step": 595684, "epoch": 7176} {"train_loss": -27.7360782623291, "global_step": 595685, "epoch": 7176} {"train_loss": -27.96370506286621, "global_step": 595686, "epoch": 7176} {"train_loss": -27.96809959411621, "global_step": 595687, "epoch": 7176} {"train_loss": -28.0257625579834, "global_step": 595688, "epoch": 7176} {"train_loss": -27.841079711914062, "global_step": 595689, "epoch": 7176} {"train_loss": -27.868725627301686, "global_step": 595690, "epoch": 7176, "val_loss": 6545202.0} {"train_loss": -26.47688102722168, "global_step": 595691, "epoch": 7177} {"train_loss": -25.10862159729004, "global_step": 595692, "epoch": 7177} {"train_loss": -27.003625869750977, "global_step": 595693, "epoch": 7177} {"train_loss": -27.021081924438477, "global_step": 595694, "epoch": 7177} {"train_loss": -26.202844619750977, "global_step": 595695, "epoch": 7177} {"train_loss": -27.131671905517578, "global_step": 595696, "epoch": 7177} {"train_loss": -27.130826950073242, "global_step": 595697, "epoch": 7177} {"train_loss": -27.663488388061523, "global_step": 595698, "epoch": 7177} {"train_loss": -27.048114776611328, "global_step": 595699, "epoch": 7177} {"train_loss": -27.285242080688477, "global_step": 595700, "epoch": 7177} {"train_loss": -26.740375518798828, "global_step": 595701, "epoch": 7177} {"train_loss": -27.237152099609375, "global_step": 595702, "epoch": 7177} {"train_loss": -27.244626998901367, "global_step": 595703, "epoch": 7177} {"train_loss": -27.616933822631836, "global_step": 595704, "epoch": 7177} {"train_loss": -27.4046573638916, "global_step": 595705, "epoch": 7177} {"train_loss": -27.648242950439453, "global_step": 595706, "epoch": 7177} {"train_loss": -27.1588134765625, "global_step": 595707, "epoch": 7177} {"train_loss": -27.562406539916992, "global_step": 595708, "epoch": 7177} {"train_loss": -27.302839279174805, "global_step": 595709, "epoch": 7177} {"train_loss": -27.65091323852539, "global_step": 595710, "epoch": 7177} {"train_loss": -27.370161056518555, "global_step": 595711, "epoch": 7177} {"train_loss": -27.9267578125, "global_step": 595712, "epoch": 7177} {"train_loss": -27.882221221923828, "global_step": 595713, "epoch": 7177} {"train_loss": -27.7601375579834, "global_step": 595714, "epoch": 7177} {"train_loss": -27.843698501586914, "global_step": 595715, "epoch": 7177} {"train_loss": -27.778589248657227, "global_step": 595716, "epoch": 7177} {"train_loss": -27.78485679626465, "global_step": 595717, "epoch": 7177} {"train_loss": -27.673294067382812, "global_step": 595718, "epoch": 7177} {"train_loss": -27.810749053955078, "global_step": 595719, "epoch": 7177} {"train_loss": -27.58933448791504, "global_step": 595720, "epoch": 7177} {"train_loss": -27.891393661499023, "global_step": 595721, "epoch": 7177} {"train_loss": -27.75813102722168, "global_step": 595722, "epoch": 7177} {"train_loss": -27.8676700592041, "global_step": 595723, "epoch": 7177} {"train_loss": -28.22519874572754, "global_step": 595724, "epoch": 7177} {"train_loss": -27.8512020111084, "global_step": 595725, "epoch": 7177} {"train_loss": -27.85438346862793, "global_step": 595726, "epoch": 7177} {"train_loss": -28.144149780273438, "global_step": 595727, "epoch": 7177} {"train_loss": -28.132720947265625, "global_step": 595728, "epoch": 7177} {"train_loss": -28.02345085144043, "global_step": 595729, "epoch": 7177} {"train_loss": -27.901208877563477, "global_step": 595730, "epoch": 7177} {"train_loss": -27.800094604492188, "global_step": 595731, "epoch": 7177} {"train_loss": -27.4250545501709, "global_step": 595732, "epoch": 7177} {"train_loss": -28.083642959594727, "global_step": 595733, "epoch": 7177} {"train_loss": -28.013885498046875, "global_step": 595734, "epoch": 7177} {"train_loss": -28.119400024414062, "global_step": 595735, "epoch": 7177} {"train_loss": -28.11622428894043, "global_step": 595736, "epoch": 7177} {"train_loss": -27.621490478515625, "global_step": 595737, "epoch": 7177} {"train_loss": -28.071557998657227, "global_step": 595738, "epoch": 7177} {"train_loss": -28.430606842041016, "global_step": 595739, "epoch": 7177} {"train_loss": -28.187360763549805, "global_step": 595740, "epoch": 7177} {"train_loss": -27.662633895874023, "global_step": 595741, "epoch": 7177} {"train_loss": -28.2524471282959, "global_step": 595742, "epoch": 7177} {"train_loss": -27.933740615844727, "global_step": 595743, "epoch": 7177} {"train_loss": -27.97983741760254, "global_step": 595744, "epoch": 7177} {"train_loss": -28.48716163635254, "global_step": 595745, "epoch": 7177} {"train_loss": -27.939924240112305, "global_step": 595746, "epoch": 7177} {"train_loss": -28.01186180114746, "global_step": 595747, "epoch": 7177} {"train_loss": -27.878162384033203, "global_step": 595748, "epoch": 7177} {"train_loss": -28.289936065673828, "global_step": 595749, "epoch": 7177} {"train_loss": -28.230030059814453, "global_step": 595750, "epoch": 7177} {"train_loss": -28.233793258666992, "global_step": 595751, "epoch": 7177} {"train_loss": -28.323049545288086, "global_step": 595752, "epoch": 7177} {"train_loss": -28.3388729095459, "global_step": 595753, "epoch": 7177} {"train_loss": -28.28559684753418, "global_step": 595754, "epoch": 7177} {"train_loss": -28.34819984436035, "global_step": 595755, "epoch": 7177} {"train_loss": -28.1433162689209, "global_step": 595756, "epoch": 7177} {"train_loss": -27.904144287109375, "global_step": 595757, "epoch": 7177} {"train_loss": -28.46482276916504, "global_step": 595758, "epoch": 7177} {"train_loss": -28.53407096862793, "global_step": 595759, "epoch": 7177} {"train_loss": -28.02182960510254, "global_step": 595760, "epoch": 7177} {"train_loss": -28.447202682495117, "global_step": 595761, "epoch": 7177} {"train_loss": -28.267322540283203, "global_step": 595762, "epoch": 7177} {"train_loss": -28.067712783813477, "global_step": 595763, "epoch": 7177} {"train_loss": -28.304853439331055, "global_step": 595764, "epoch": 7177} {"train_loss": -28.2274227142334, "global_step": 595765, "epoch": 7177} {"train_loss": -27.842191696166992, "global_step": 595766, "epoch": 7177} {"train_loss": -28.125629425048828, "global_step": 595767, "epoch": 7177} {"train_loss": -27.731786727905273, "global_step": 595768, "epoch": 7177} {"train_loss": -28.050830841064453, "global_step": 595769, "epoch": 7177} {"train_loss": -27.954299926757812, "global_step": 595770, "epoch": 7177} {"train_loss": -27.838367462158203, "global_step": 595771, "epoch": 7177} {"train_loss": -28.227811813354492, "global_step": 595772, "epoch": 7177} {"train_loss": -27.79477487127465, "global_step": 595773, "epoch": 7177, "val_loss": 6596160.5} {"train_loss": -27.291791915893555, "global_step": 595774, "epoch": 7178} {"train_loss": -27.253019332885742, "global_step": 595775, "epoch": 7178} {"train_loss": -27.326528549194336, "global_step": 595776, "epoch": 7178} {"train_loss": -27.9968204498291, "global_step": 595777, "epoch": 7178} {"train_loss": -27.609302520751953, "global_step": 595778, "epoch": 7178} {"train_loss": -27.275266647338867, "global_step": 595779, "epoch": 7178} {"train_loss": -27.481353759765625, "global_step": 595780, "epoch": 7178} {"train_loss": -27.52897071838379, "global_step": 595781, "epoch": 7178} {"train_loss": -27.40230369567871, "global_step": 595782, "epoch": 7178} {"train_loss": -27.2794132232666, "global_step": 595783, "epoch": 7178} {"train_loss": -27.920761108398438, "global_step": 595784, "epoch": 7178} {"train_loss": -27.80118179321289, "global_step": 595785, "epoch": 7178} {"train_loss": -27.779159545898438, "global_step": 595786, "epoch": 7178} {"train_loss": -27.816404342651367, "global_step": 595787, "epoch": 7178} {"train_loss": -27.627471923828125, "global_step": 595788, "epoch": 7178} {"train_loss": -27.821765899658203, "global_step": 595789, "epoch": 7178} {"train_loss": -27.63856315612793, "global_step": 595790, "epoch": 7178} {"train_loss": -27.887054443359375, "global_step": 595791, "epoch": 7178} {"train_loss": -27.78204345703125, "global_step": 595792, "epoch": 7178} {"train_loss": -27.84966468811035, "global_step": 595793, "epoch": 7178} {"train_loss": -28.00872230529785, "global_step": 595794, "epoch": 7178} {"train_loss": -27.95741844177246, "global_step": 595795, "epoch": 7178} {"train_loss": -27.857776641845703, "global_step": 595796, "epoch": 7178} {"train_loss": -27.570764541625977, "global_step": 595797, "epoch": 7178} {"train_loss": -28.431827545166016, "global_step": 595798, "epoch": 7178} {"train_loss": -28.10951042175293, "global_step": 595799, "epoch": 7178} {"train_loss": -27.96864891052246, "global_step": 595800, "epoch": 7178} {"train_loss": -27.99262046813965, "global_step": 595801, "epoch": 7178} {"train_loss": -27.705341339111328, "global_step": 595802, "epoch": 7178} {"train_loss": -27.716480255126953, "global_step": 595803, "epoch": 7178} {"train_loss": -27.671436309814453, "global_step": 595804, "epoch": 7178} {"train_loss": -27.910919189453125, "global_step": 595805, "epoch": 7178} {"train_loss": -28.298593521118164, "global_step": 595806, "epoch": 7178} {"train_loss": -27.804244995117188, "global_step": 595807, "epoch": 7178} {"train_loss": -27.90513038635254, "global_step": 595808, "epoch": 7178} {"train_loss": -28.046384811401367, "global_step": 595809, "epoch": 7178} {"train_loss": -27.8074951171875, "global_step": 595810, "epoch": 7178} {"train_loss": -28.258169174194336, "global_step": 595811, "epoch": 7178} {"train_loss": -28.099384307861328, "global_step": 595812, "epoch": 7178} {"train_loss": -28.1013126373291, "global_step": 595813, "epoch": 7178} {"train_loss": -28.08062171936035, "global_step": 595814, "epoch": 7178} {"train_loss": -28.453474044799805, "global_step": 595815, "epoch": 7178} {"train_loss": -28.575275421142578, "global_step": 595816, "epoch": 7178} {"train_loss": -28.322601318359375, "global_step": 595817, "epoch": 7178} {"train_loss": -28.055017471313477, "global_step": 595818, "epoch": 7178} {"train_loss": -28.23780632019043, "global_step": 595819, "epoch": 7178} {"train_loss": -28.40423011779785, "global_step": 595820, "epoch": 7178} {"train_loss": -28.098682403564453, "global_step": 595821, "epoch": 7178} {"train_loss": -28.3233585357666, "global_step": 595822, "epoch": 7178} {"train_loss": -28.438995361328125, "global_step": 595823, "epoch": 7178} {"train_loss": -28.037282943725586, "global_step": 595824, "epoch": 7178} {"train_loss": -28.024372100830078, "global_step": 595825, "epoch": 7178} {"train_loss": -28.065185546875, "global_step": 595826, "epoch": 7178} {"train_loss": -27.80214500427246, "global_step": 595827, "epoch": 7178} {"train_loss": -28.295745849609375, "global_step": 595828, "epoch": 7178} {"train_loss": -28.222919464111328, "global_step": 595829, "epoch": 7178} {"train_loss": -28.094852447509766, "global_step": 595830, "epoch": 7178} {"train_loss": -28.212949752807617, "global_step": 595831, "epoch": 7178} {"train_loss": -27.873865127563477, "global_step": 595832, "epoch": 7178} {"train_loss": -28.285863876342773, "global_step": 595833, "epoch": 7178} {"train_loss": -28.153715133666992, "global_step": 595834, "epoch": 7178} {"train_loss": -28.3071231842041, "global_step": 595835, "epoch": 7178} {"train_loss": -28.196699142456055, "global_step": 595836, "epoch": 7178} {"train_loss": -27.66962242126465, "global_step": 595837, "epoch": 7178} {"train_loss": -28.240575790405273, "global_step": 595838, "epoch": 7178} {"train_loss": -28.148351669311523, "global_step": 595839, "epoch": 7178} {"train_loss": -28.17181968688965, "global_step": 595840, "epoch": 7178} {"train_loss": -28.080307006835938, "global_step": 595841, "epoch": 7178} {"train_loss": -27.879682540893555, "global_step": 595842, "epoch": 7178} {"train_loss": -28.190937042236328, "global_step": 595843, "epoch": 7178} {"train_loss": -28.717382431030273, "global_step": 595844, "epoch": 7178} {"train_loss": -28.465627670288086, "global_step": 595845, "epoch": 7178} {"train_loss": -28.16851806640625, "global_step": 595846, "epoch": 7178} {"train_loss": -28.408361434936523, "global_step": 595847, "epoch": 7178} {"train_loss": -28.211917877197266, "global_step": 595848, "epoch": 7178} {"train_loss": -27.927133560180664, "global_step": 595849, "epoch": 7178} {"train_loss": -28.022565841674805, "global_step": 595850, "epoch": 7178} {"train_loss": -27.5620059967041, "global_step": 595851, "epoch": 7178} {"train_loss": -27.96953773498535, "global_step": 595852, "epoch": 7178} {"train_loss": -27.883371353149414, "global_step": 595853, "epoch": 7178} {"train_loss": -27.351154327392578, "global_step": 595854, "epoch": 7178} {"train_loss": -28.024322509765625, "global_step": 595855, "epoch": 7178} {"train_loss": -27.978232326277766, "global_step": 595856, "epoch": 7178, "val_loss": 6553640.0} {"train_loss": -27.569761276245117, "global_step": 595857, "epoch": 7179} {"train_loss": -27.57598876953125, "global_step": 595858, "epoch": 7179} {"train_loss": -27.477216720581055, "global_step": 595859, "epoch": 7179} {"train_loss": -26.64545249938965, "global_step": 595860, "epoch": 7179} {"train_loss": -26.701309204101562, "global_step": 595861, "epoch": 7179} {"train_loss": -26.668521881103516, "global_step": 595862, "epoch": 7179} {"train_loss": -26.705810546875, "global_step": 595863, "epoch": 7179} {"train_loss": -27.892866134643555, "global_step": 595864, "epoch": 7179} {"train_loss": -27.414051055908203, "global_step": 595865, "epoch": 7179} {"train_loss": -27.4603271484375, "global_step": 595866, "epoch": 7179} {"train_loss": -27.5047607421875, "global_step": 595867, "epoch": 7179} {"train_loss": -27.426916122436523, "global_step": 595868, "epoch": 7179} {"train_loss": -27.516632080078125, "global_step": 595869, "epoch": 7179} {"train_loss": -27.5454044342041, "global_step": 595870, "epoch": 7179} {"train_loss": -27.738479614257812, "global_step": 595871, "epoch": 7179} {"train_loss": -27.660144805908203, "global_step": 595872, "epoch": 7179} {"train_loss": -27.491357803344727, "global_step": 595873, "epoch": 7179} {"train_loss": -27.6090087890625, "global_step": 595874, "epoch": 7179} {"train_loss": -27.421064376831055, "global_step": 595875, "epoch": 7179} {"train_loss": -27.6975040435791, "global_step": 595876, "epoch": 7179} {"train_loss": -27.88205337524414, "global_step": 595877, "epoch": 7179} {"train_loss": -27.38724708557129, "global_step": 595878, "epoch": 7179} {"train_loss": -27.814847946166992, "global_step": 595879, "epoch": 7179} {"train_loss": -27.7445068359375, "global_step": 595880, "epoch": 7179} {"train_loss": -27.920867919921875, "global_step": 595881, "epoch": 7179} {"train_loss": -27.264074325561523, "global_step": 595882, "epoch": 7179} {"train_loss": -27.6215877532959, "global_step": 595883, "epoch": 7179} {"train_loss": -27.83064079284668, "global_step": 595884, "epoch": 7179} {"train_loss": -27.848255157470703, "global_step": 595885, "epoch": 7179} {"train_loss": -27.86527442932129, "global_step": 595886, "epoch": 7179} {"train_loss": -27.524280548095703, "global_step": 595887, "epoch": 7179} {"train_loss": -27.734149932861328, "global_step": 595888, "epoch": 7179} {"train_loss": -27.714136123657227, "global_step": 595889, "epoch": 7179} {"train_loss": -27.931976318359375, "global_step": 595890, "epoch": 7179} {"train_loss": -27.82606315612793, "global_step": 595891, "epoch": 7179} {"train_loss": -27.87489128112793, "global_step": 595892, "epoch": 7179} {"train_loss": -28.37324333190918, "global_step": 595893, "epoch": 7179} {"train_loss": -28.094568252563477, "global_step": 595894, "epoch": 7179} {"train_loss": -28.019933700561523, "global_step": 595895, "epoch": 7179} {"train_loss": -27.982080459594727, "global_step": 595896, "epoch": 7179} {"train_loss": -28.245412826538086, "global_step": 595897, "epoch": 7179} {"train_loss": -28.236597061157227, "global_step": 595898, "epoch": 7179} {"train_loss": -28.34950065612793, "global_step": 595899, "epoch": 7179} {"train_loss": -27.8961181640625, "global_step": 595900, "epoch": 7179} {"train_loss": -28.350488662719727, "global_step": 595901, "epoch": 7179} {"train_loss": -28.052265167236328, "global_step": 595902, "epoch": 7179} {"train_loss": -28.0001220703125, "global_step": 595903, "epoch": 7179} {"train_loss": -27.888141632080078, "global_step": 595904, "epoch": 7179} {"train_loss": -27.741607666015625, "global_step": 595905, "epoch": 7179} {"train_loss": -28.16560935974121, "global_step": 595906, "epoch": 7179} {"train_loss": -28.14214515686035, "global_step": 595907, "epoch": 7179} {"train_loss": -27.818653106689453, "global_step": 595908, "epoch": 7179} {"train_loss": -27.6304874420166, "global_step": 595909, "epoch": 7179} {"train_loss": -27.826416015625, "global_step": 595910, "epoch": 7179} {"train_loss": -27.851459503173828, "global_step": 595911, "epoch": 7179} {"train_loss": -28.27857780456543, "global_step": 595912, "epoch": 7179} {"train_loss": -28.004255294799805, "global_step": 595913, "epoch": 7179} {"train_loss": -27.8111629486084, "global_step": 595914, "epoch": 7179} {"train_loss": -27.956335067749023, "global_step": 595915, "epoch": 7179} {"train_loss": -28.050695419311523, "global_step": 595916, "epoch": 7179} {"train_loss": -27.69929313659668, "global_step": 595917, "epoch": 7179} {"train_loss": -27.65960121154785, "global_step": 595918, "epoch": 7179} {"train_loss": -27.26861572265625, "global_step": 595919, "epoch": 7179} {"train_loss": -27.545135498046875, "global_step": 595920, "epoch": 7179} {"train_loss": -27.941959381103516, "global_step": 595921, "epoch": 7179} {"train_loss": -27.92327308654785, "global_step": 595922, "epoch": 7179} {"train_loss": -28.137481689453125, "global_step": 595923, "epoch": 7179} {"train_loss": -28.13836669921875, "global_step": 595924, "epoch": 7179} {"train_loss": -28.016382217407227, "global_step": 595925, "epoch": 7179} {"train_loss": -27.763671875, "global_step": 595926, "epoch": 7179} {"train_loss": -27.861902236938477, "global_step": 595927, "epoch": 7179} {"train_loss": -28.33355140686035, "global_step": 595928, "epoch": 7179} {"train_loss": -27.865467071533203, "global_step": 595929, "epoch": 7179} {"train_loss": -28.13909912109375, "global_step": 595930, "epoch": 7179} {"train_loss": -28.400238037109375, "global_step": 595931, "epoch": 7179} {"train_loss": -27.857751846313477, "global_step": 595932, "epoch": 7179} {"train_loss": -27.7631778717041, "global_step": 595933, "epoch": 7179} {"train_loss": -27.921491622924805, "global_step": 595934, "epoch": 7179} {"train_loss": -28.155414581298828, "global_step": 595935, "epoch": 7179} {"train_loss": -28.016220092773438, "global_step": 595936, "epoch": 7179} {"train_loss": -28.004093170166016, "global_step": 595937, "epoch": 7179} {"train_loss": -28.170658111572266, "global_step": 595938, "epoch": 7179} {"train_loss": -27.78508719478745, "global_step": 595939, "epoch": 7179, "val_loss": 6605719.0} {"train_loss": -26.42225456237793, "global_step": 595940, "epoch": 7180} {"train_loss": -26.983139038085938, "global_step": 595941, "epoch": 7180} {"train_loss": -26.890966415405273, "global_step": 595942, "epoch": 7180} {"train_loss": -25.418210983276367, "global_step": 595943, "epoch": 7180} {"train_loss": -27.339643478393555, "global_step": 595944, "epoch": 7180} {"train_loss": -26.544118881225586, "global_step": 595945, "epoch": 7180} {"train_loss": -26.953937530517578, "global_step": 595946, "epoch": 7180} {"train_loss": -27.038366317749023, "global_step": 595947, "epoch": 7180} {"train_loss": -27.31178092956543, "global_step": 595948, "epoch": 7180} {"train_loss": -27.349714279174805, "global_step": 595949, "epoch": 7180} {"train_loss": -27.307462692260742, "global_step": 595950, "epoch": 7180} {"train_loss": -27.326635360717773, "global_step": 595951, "epoch": 7180} {"train_loss": -27.4599666595459, "global_step": 595952, "epoch": 7180} {"train_loss": -27.196949005126953, "global_step": 595953, "epoch": 7180} {"train_loss": -27.356779098510742, "global_step": 595954, "epoch": 7180} {"train_loss": -27.209814071655273, "global_step": 595955, "epoch": 7180} {"train_loss": -27.411975860595703, "global_step": 595956, "epoch": 7180} {"train_loss": -27.355512619018555, "global_step": 595957, "epoch": 7180} {"train_loss": -27.530221939086914, "global_step": 595958, "epoch": 7180} {"train_loss": -27.5023250579834, "global_step": 595959, "epoch": 7180} {"train_loss": -28.03765869140625, "global_step": 595960, "epoch": 7180} {"train_loss": -27.662137985229492, "global_step": 595961, "epoch": 7180} {"train_loss": -27.77887535095215, "global_step": 595962, "epoch": 7180} {"train_loss": -27.62354850769043, "global_step": 595963, "epoch": 7180} {"train_loss": -28.28740882873535, "global_step": 595964, "epoch": 7180} {"train_loss": -27.675567626953125, "global_step": 595965, "epoch": 7180} {"train_loss": -27.806188583374023, "global_step": 595966, "epoch": 7180} {"train_loss": -27.814950942993164, "global_step": 595967, "epoch": 7180} {"train_loss": -28.229969024658203, "global_step": 595968, "epoch": 7180} {"train_loss": -27.773542404174805, "global_step": 595969, "epoch": 7180} {"train_loss": -27.861852645874023, "global_step": 595970, "epoch": 7180} {"train_loss": -28.128437042236328, "global_step": 595971, "epoch": 7180} {"train_loss": -27.805307388305664, "global_step": 595972, "epoch": 7180} {"train_loss": -27.89314842224121, "global_step": 595973, "epoch": 7180} {"train_loss": -27.783767700195312, "global_step": 595974, "epoch": 7180} {"train_loss": -27.959745407104492, "global_step": 595975, "epoch": 7180} {"train_loss": -27.809152603149414, "global_step": 595976, "epoch": 7180} {"train_loss": -27.645410537719727, "global_step": 595977, "epoch": 7180} {"train_loss": -28.124387741088867, "global_step": 595978, "epoch": 7180} {"train_loss": -28.09071922302246, "global_step": 595979, "epoch": 7180} {"train_loss": -28.17864418029785, "global_step": 595980, "epoch": 7180} {"train_loss": -27.933704376220703, "global_step": 595981, "epoch": 7180} {"train_loss": -28.13031578063965, "global_step": 595982, "epoch": 7180} {"train_loss": -28.197179794311523, "global_step": 595983, "epoch": 7180} {"train_loss": -28.137073516845703, "global_step": 595984, "epoch": 7180} {"train_loss": -28.222410202026367, "global_step": 595985, "epoch": 7180} {"train_loss": -27.980426788330078, "global_step": 595986, "epoch": 7180} {"train_loss": -27.95533561706543, "global_step": 595987, "epoch": 7180} {"train_loss": -27.912988662719727, "global_step": 595988, "epoch": 7180} {"train_loss": -28.118661880493164, "global_step": 595989, "epoch": 7180} {"train_loss": -28.398706436157227, "global_step": 595990, "epoch": 7180} {"train_loss": -27.82672119140625, "global_step": 595991, "epoch": 7180} {"train_loss": -28.369855880737305, "global_step": 595992, "epoch": 7180} {"train_loss": -28.10064697265625, "global_step": 595993, "epoch": 7180} {"train_loss": -27.838581085205078, "global_step": 595994, "epoch": 7180} {"train_loss": -27.975183486938477, "global_step": 595995, "epoch": 7180} {"train_loss": -28.319427490234375, "global_step": 595996, "epoch": 7180} {"train_loss": -28.06046485900879, "global_step": 595997, "epoch": 7180} {"train_loss": -27.69060707092285, "global_step": 595998, "epoch": 7180} {"train_loss": -28.2029972076416, "global_step": 595999, "epoch": 7180} {"train_loss": -28.629230499267578, "global_step": 596000, "epoch": 7180} {"train_loss": -28.54005241394043, "global_step": 596001, "epoch": 7180} {"train_loss": -28.22776222229004, "global_step": 596002, "epoch": 7180} {"train_loss": -28.0136661529541, "global_step": 596003, "epoch": 7180} {"train_loss": -28.043853759765625, "global_step": 596004, "epoch": 7180} {"train_loss": -27.845930099487305, "global_step": 596005, "epoch": 7180} {"train_loss": -28.129053115844727, "global_step": 596006, "epoch": 7180} {"train_loss": -27.845813751220703, "global_step": 596007, "epoch": 7180} {"train_loss": -28.110136032104492, "global_step": 596008, "epoch": 7180} {"train_loss": -28.082965850830078, "global_step": 596009, "epoch": 7180} {"train_loss": -28.270645141601562, "global_step": 596010, "epoch": 7180} {"train_loss": -28.30682373046875, "global_step": 596011, "epoch": 7180} {"train_loss": -28.01144790649414, "global_step": 596012, "epoch": 7180} {"train_loss": -28.409046173095703, "global_step": 596013, "epoch": 7180} {"train_loss": -28.337299346923828, "global_step": 596014, "epoch": 7180} {"train_loss": -27.84437370300293, "global_step": 596015, "epoch": 7180} {"train_loss": -28.1785831451416, "global_step": 596016, "epoch": 7180} {"train_loss": -28.285058975219727, "global_step": 596017, "epoch": 7180} {"train_loss": -28.06012535095215, "global_step": 596018, "epoch": 7180} {"train_loss": -28.50520133972168, "global_step": 596019, "epoch": 7180} {"train_loss": -28.346755981445312, "global_step": 596020, "epoch": 7180} {"train_loss": -28.364944458007812, "global_step": 596021, "epoch": 7180} {"train_loss": -27.835525190973858, "global_step": 596022, "epoch": 7180, "val_loss": 6657452.0} {"train_loss": -26.470487594604492, "global_step": 596023, "epoch": 7181} {"train_loss": -26.96044921875, "global_step": 596024, "epoch": 7181} {"train_loss": -27.630939483642578, "global_step": 596025, "epoch": 7181} {"train_loss": -26.980459213256836, "global_step": 596026, "epoch": 7181} {"train_loss": -27.315946578979492, "global_step": 596027, "epoch": 7181} {"train_loss": -27.28175163269043, "global_step": 596028, "epoch": 7181} {"train_loss": -27.489093780517578, "global_step": 596029, "epoch": 7181} {"train_loss": -27.4942684173584, "global_step": 596030, "epoch": 7181} {"train_loss": -27.46026611328125, "global_step": 596031, "epoch": 7181} {"train_loss": -27.651647567749023, "global_step": 596032, "epoch": 7181} {"train_loss": -27.662006378173828, "global_step": 596033, "epoch": 7181} {"train_loss": -27.89835548400879, "global_step": 596034, "epoch": 7181} {"train_loss": -27.574371337890625, "global_step": 596035, "epoch": 7181} {"train_loss": -27.1868896484375, "global_step": 596036, "epoch": 7181} {"train_loss": -27.5781307220459, "global_step": 596037, "epoch": 7181} {"train_loss": -27.760974884033203, "global_step": 596038, "epoch": 7181} {"train_loss": -27.838199615478516, "global_step": 596039, "epoch": 7181} {"train_loss": -27.93120765686035, "global_step": 596040, "epoch": 7181} {"train_loss": -28.224695205688477, "global_step": 596041, "epoch": 7181} {"train_loss": -28.22796630859375, "global_step": 596042, "epoch": 7181} {"train_loss": -28.06073570251465, "global_step": 596043, "epoch": 7181} {"train_loss": -27.627857208251953, "global_step": 596044, "epoch": 7181} {"train_loss": -27.650623321533203, "global_step": 596045, "epoch": 7181} {"train_loss": -27.754138946533203, "global_step": 596046, "epoch": 7181} {"train_loss": -27.81562614440918, "global_step": 596047, "epoch": 7181} {"train_loss": -27.852020263671875, "global_step": 596048, "epoch": 7181} {"train_loss": -27.607797622680664, "global_step": 596049, "epoch": 7181} {"train_loss": -28.006702423095703, "global_step": 596050, "epoch": 7181} {"train_loss": -28.11370277404785, "global_step": 596051, "epoch": 7181} {"train_loss": -27.943761825561523, "global_step": 596052, "epoch": 7181} {"train_loss": -27.664072036743164, "global_step": 596053, "epoch": 7181} {"train_loss": -27.52631950378418, "global_step": 596054, "epoch": 7181} {"train_loss": -28.04733657836914, "global_step": 596055, "epoch": 7181} {"train_loss": -27.69947624206543, "global_step": 596056, "epoch": 7181} {"train_loss": -28.03497886657715, "global_step": 596057, "epoch": 7181} {"train_loss": -27.48652458190918, "global_step": 596058, "epoch": 7181} {"train_loss": -28.051136016845703, "global_step": 596059, "epoch": 7181} {"train_loss": -28.14362907409668, "global_step": 596060, "epoch": 7181} {"train_loss": -28.533191680908203, "global_step": 596061, "epoch": 7181} {"train_loss": -28.334768295288086, "global_step": 596062, "epoch": 7181} {"train_loss": -28.074344635009766, "global_step": 596063, "epoch": 7181} {"train_loss": -27.757673263549805, "global_step": 596064, "epoch": 7181} {"train_loss": -27.904081344604492, "global_step": 596065, "epoch": 7181} {"train_loss": -28.023944854736328, "global_step": 596066, "epoch": 7181} {"train_loss": -27.779951095581055, "global_step": 596067, "epoch": 7181} {"train_loss": -28.108762741088867, "global_step": 596068, "epoch": 7181} {"train_loss": -28.243362426757812, "global_step": 596069, "epoch": 7181} {"train_loss": -28.353961944580078, "global_step": 596070, "epoch": 7181} {"train_loss": -27.851675033569336, "global_step": 596071, "epoch": 7181} {"train_loss": -28.209701538085938, "global_step": 596072, "epoch": 7181} {"train_loss": -27.898237228393555, "global_step": 596073, "epoch": 7181} {"train_loss": -28.500207901000977, "global_step": 596074, "epoch": 7181} {"train_loss": -28.045129776000977, "global_step": 596075, "epoch": 7181} {"train_loss": -28.48337173461914, "global_step": 596076, "epoch": 7181} {"train_loss": -27.901472091674805, "global_step": 596077, "epoch": 7181} {"train_loss": -28.282764434814453, "global_step": 596078, "epoch": 7181} {"train_loss": -28.194883346557617, "global_step": 596079, "epoch": 7181} {"train_loss": -28.21417808532715, "global_step": 596080, "epoch": 7181} {"train_loss": -28.1585693359375, "global_step": 596081, "epoch": 7181} {"train_loss": -27.723291397094727, "global_step": 596082, "epoch": 7181} {"train_loss": -28.26702880859375, "global_step": 596083, "epoch": 7181} {"train_loss": -28.22210693359375, "global_step": 596084, "epoch": 7181} {"train_loss": -27.856733322143555, "global_step": 596085, "epoch": 7181} {"train_loss": -28.061237335205078, "global_step": 596086, "epoch": 7181} {"train_loss": -27.7654972076416, "global_step": 596087, "epoch": 7181} {"train_loss": -28.424753189086914, "global_step": 596088, "epoch": 7181} {"train_loss": -28.103790283203125, "global_step": 596089, "epoch": 7181} {"train_loss": -27.976491928100586, "global_step": 596090, "epoch": 7181} {"train_loss": -27.715314865112305, "global_step": 596091, "epoch": 7181} {"train_loss": -27.820093154907227, "global_step": 596092, "epoch": 7181} {"train_loss": -28.297992706298828, "global_step": 596093, "epoch": 7181} {"train_loss": -27.88629150390625, "global_step": 596094, "epoch": 7181} {"train_loss": -27.758594512939453, "global_step": 596095, "epoch": 7181} {"train_loss": -27.90020751953125, "global_step": 596096, "epoch": 7181} {"train_loss": -27.922025680541992, "global_step": 596097, "epoch": 7181} {"train_loss": -28.03436851501465, "global_step": 596098, "epoch": 7181} {"train_loss": -28.06843376159668, "global_step": 596099, "epoch": 7181} {"train_loss": -28.025434494018555, "global_step": 596100, "epoch": 7181} {"train_loss": -27.999082565307617, "global_step": 596101, "epoch": 7181} {"train_loss": -28.10426139831543, "global_step": 596102, "epoch": 7181} {"train_loss": -28.049604415893555, "global_step": 596103, "epoch": 7181} {"train_loss": -28.356449127197266, "global_step": 596104, "epoch": 7181} {"train_loss": -27.895652426294532, "global_step": 596105, "epoch": 7181, "val_loss": 6478809.0} {"train_loss": -27.7934627532959, "global_step": 596106, "epoch": 7182} {"train_loss": -27.805688858032227, "global_step": 596107, "epoch": 7182} {"train_loss": -27.025360107421875, "global_step": 596108, "epoch": 7182} {"train_loss": -27.39337158203125, "global_step": 596109, "epoch": 7182} {"train_loss": -27.481006622314453, "global_step": 596110, "epoch": 7182} {"train_loss": -26.754318237304688, "global_step": 596111, "epoch": 7182} {"train_loss": -26.805389404296875, "global_step": 596112, "epoch": 7182} {"train_loss": -27.2264404296875, "global_step": 596113, "epoch": 7182} {"train_loss": -27.681615829467773, "global_step": 596114, "epoch": 7182} {"train_loss": -27.47537612915039, "global_step": 596115, "epoch": 7182} {"train_loss": -26.974145889282227, "global_step": 596116, "epoch": 7182} {"train_loss": -27.695331573486328, "global_step": 596117, "epoch": 7182} {"train_loss": -26.741870880126953, "global_step": 596118, "epoch": 7182} {"train_loss": -27.807300567626953, "global_step": 596119, "epoch": 7182} {"train_loss": -27.53769302368164, "global_step": 596120, "epoch": 7182} {"train_loss": -27.703657150268555, "global_step": 596121, "epoch": 7182} {"train_loss": -27.675668716430664, "global_step": 596122, "epoch": 7182} {"train_loss": -27.759384155273438, "global_step": 596123, "epoch": 7182} {"train_loss": -27.707563400268555, "global_step": 596124, "epoch": 7182} {"train_loss": -28.42604637145996, "global_step": 596125, "epoch": 7182} {"train_loss": -27.7260799407959, "global_step": 596126, "epoch": 7182} {"train_loss": -27.578638076782227, "global_step": 596127, "epoch": 7182} {"train_loss": -27.804706573486328, "global_step": 596128, "epoch": 7182} {"train_loss": -27.787738800048828, "global_step": 596129, "epoch": 7182} {"train_loss": -27.963788986206055, "global_step": 596130, "epoch": 7182} {"train_loss": -28.002674102783203, "global_step": 596131, "epoch": 7182} {"train_loss": -28.21815299987793, "global_step": 596132, "epoch": 7182} {"train_loss": -27.465503692626953, "global_step": 596133, "epoch": 7182} {"train_loss": -27.79563331604004, "global_step": 596134, "epoch": 7182} {"train_loss": -27.916107177734375, "global_step": 596135, "epoch": 7182} {"train_loss": -28.219104766845703, "global_step": 596136, "epoch": 7182} {"train_loss": -27.8883113861084, "global_step": 596137, "epoch": 7182} {"train_loss": -28.361608505249023, "global_step": 596138, "epoch": 7182} {"train_loss": -28.169055938720703, "global_step": 596139, "epoch": 7182} {"train_loss": -28.305545806884766, "global_step": 596140, "epoch": 7182} {"train_loss": -27.747028350830078, "global_step": 596141, "epoch": 7182} {"train_loss": -28.17915153503418, "global_step": 596142, "epoch": 7182} {"train_loss": -27.854001998901367, "global_step": 596143, "epoch": 7182} {"train_loss": -27.97540283203125, "global_step": 596144, "epoch": 7182} {"train_loss": -28.38503074645996, "global_step": 596145, "epoch": 7182} {"train_loss": -28.0407772064209, "global_step": 596146, "epoch": 7182} {"train_loss": -28.512897491455078, "global_step": 596147, "epoch": 7182} {"train_loss": -28.381378173828125, "global_step": 596148, "epoch": 7182} {"train_loss": -28.03127098083496, "global_step": 596149, "epoch": 7182} {"train_loss": -28.36128044128418, "global_step": 596150, "epoch": 7182} {"train_loss": -27.908262252807617, "global_step": 596151, "epoch": 7182} {"train_loss": -28.104528427124023, "global_step": 596152, "epoch": 7182} {"train_loss": -28.34228515625, "global_step": 596153, "epoch": 7182} {"train_loss": -28.06488037109375, "global_step": 596154, "epoch": 7182} {"train_loss": -28.066190719604492, "global_step": 596155, "epoch": 7182} {"train_loss": -27.572498321533203, "global_step": 596156, "epoch": 7182} {"train_loss": -28.19620704650879, "global_step": 596157, "epoch": 7182} {"train_loss": -27.868051528930664, "global_step": 596158, "epoch": 7182} {"train_loss": -27.89784812927246, "global_step": 596159, "epoch": 7182} {"train_loss": -27.86762046813965, "global_step": 596160, "epoch": 7182} {"train_loss": -28.376102447509766, "global_step": 596161, "epoch": 7182} {"train_loss": -27.588972091674805, "global_step": 596162, "epoch": 7182} {"train_loss": -28.4816837310791, "global_step": 596163, "epoch": 7182} {"train_loss": -28.520872116088867, "global_step": 596164, "epoch": 7182} {"train_loss": -28.19074058532715, "global_step": 596165, "epoch": 7182} {"train_loss": -28.301441192626953, "global_step": 596166, "epoch": 7182} {"train_loss": -28.3892822265625, "global_step": 596167, "epoch": 7182} {"train_loss": -28.27613639831543, "global_step": 596168, "epoch": 7182} {"train_loss": -27.781591415405273, "global_step": 596169, "epoch": 7182} {"train_loss": -28.168537139892578, "global_step": 596170, "epoch": 7182} {"train_loss": -27.709339141845703, "global_step": 596171, "epoch": 7182} {"train_loss": -27.961095809936523, "global_step": 596172, "epoch": 7182} {"train_loss": -27.976842880249023, "global_step": 596173, "epoch": 7182} {"train_loss": -28.075605392456055, "global_step": 596174, "epoch": 7182} {"train_loss": -27.981821060180664, "global_step": 596175, "epoch": 7182} {"train_loss": -28.194305419921875, "global_step": 596176, "epoch": 7182} {"train_loss": -28.10464859008789, "global_step": 596177, "epoch": 7182} {"train_loss": -27.868223190307617, "global_step": 596178, "epoch": 7182} {"train_loss": -28.43110466003418, "global_step": 596179, "epoch": 7182} {"train_loss": -27.998937606811523, "global_step": 596180, "epoch": 7182} {"train_loss": -28.30653190612793, "global_step": 596181, "epoch": 7182} {"train_loss": -28.0688533782959, "global_step": 596182, "epoch": 7182} {"train_loss": -27.924152374267578, "global_step": 596183, "epoch": 7182} {"train_loss": -28.203601837158203, "global_step": 596184, "epoch": 7182} {"train_loss": -28.1743221282959, "global_step": 596185, "epoch": 7182} {"train_loss": -28.464553833007812, "global_step": 596186, "epoch": 7182} {"train_loss": -28.03742790222168, "global_step": 596187, "epoch": 7182} {"train_loss": -27.93374298279544, "global_step": 596188, "epoch": 7182, "val_loss": 6577406.0} {"train_loss": -26.428686141967773, "global_step": 596189, "epoch": 7183} {"train_loss": -27.025390625, "global_step": 596190, "epoch": 7183} {"train_loss": -26.70033073425293, "global_step": 596191, "epoch": 7183} {"train_loss": -27.475488662719727, "global_step": 596192, "epoch": 7183} {"train_loss": -27.426633834838867, "global_step": 596193, "epoch": 7183} {"train_loss": -26.951242446899414, "global_step": 596194, "epoch": 7183} {"train_loss": -26.87430763244629, "global_step": 596195, "epoch": 7183} {"train_loss": -27.16285514831543, "global_step": 596196, "epoch": 7183} {"train_loss": -27.979764938354492, "global_step": 596197, "epoch": 7183} {"train_loss": -27.783649444580078, "global_step": 596198, "epoch": 7183} {"train_loss": -27.66341209411621, "global_step": 596199, "epoch": 7183} {"train_loss": -27.550458908081055, "global_step": 596200, "epoch": 7183} {"train_loss": -27.693281173706055, "global_step": 596201, "epoch": 7183} {"train_loss": -27.998586654663086, "global_step": 596202, "epoch": 7183} {"train_loss": -27.50343132019043, "global_step": 596203, "epoch": 7183} {"train_loss": -27.652210235595703, "global_step": 596204, "epoch": 7183} {"train_loss": -27.51055335998535, "global_step": 596205, "epoch": 7183} {"train_loss": -27.89103126525879, "global_step": 596206, "epoch": 7183} {"train_loss": -27.744449615478516, "global_step": 596207, "epoch": 7183} {"train_loss": -27.79913902282715, "global_step": 596208, "epoch": 7183} {"train_loss": -27.991138458251953, "global_step": 596209, "epoch": 7183} {"train_loss": -27.908491134643555, "global_step": 596210, "epoch": 7183} {"train_loss": -27.881366729736328, "global_step": 596211, "epoch": 7183} {"train_loss": -28.03175163269043, "global_step": 596212, "epoch": 7183} {"train_loss": -28.088855743408203, "global_step": 596213, "epoch": 7183} {"train_loss": -28.03500747680664, "global_step": 596214, "epoch": 7183} {"train_loss": -27.729663848876953, "global_step": 596215, "epoch": 7183} {"train_loss": -27.928434371948242, "global_step": 596216, "epoch": 7183} {"train_loss": -27.717863082885742, "global_step": 596217, "epoch": 7183} {"train_loss": -27.751325607299805, "global_step": 596218, "epoch": 7183} {"train_loss": -27.9953556060791, "global_step": 596219, "epoch": 7183} {"train_loss": -27.728641510009766, "global_step": 596220, "epoch": 7183} {"train_loss": -28.095855712890625, "global_step": 596221, "epoch": 7183} {"train_loss": -28.3251895904541, "global_step": 596222, "epoch": 7183} {"train_loss": -27.819040298461914, "global_step": 596223, "epoch": 7183} {"train_loss": -27.683780670166016, "global_step": 596224, "epoch": 7183} {"train_loss": -28.277362823486328, "global_step": 596225, "epoch": 7183} {"train_loss": -28.364227294921875, "global_step": 596226, "epoch": 7183} {"train_loss": -28.095813751220703, "global_step": 596227, "epoch": 7183} {"train_loss": -27.884540557861328, "global_step": 596228, "epoch": 7183} {"train_loss": -27.916425704956055, "global_step": 596229, "epoch": 7183} {"train_loss": -27.88495445251465, "global_step": 596230, "epoch": 7183} {"train_loss": -28.107397079467773, "global_step": 596231, "epoch": 7183} {"train_loss": -27.7049503326416, "global_step": 596232, "epoch": 7183} {"train_loss": -28.050329208374023, "global_step": 596233, "epoch": 7183} {"train_loss": -28.19927978515625, "global_step": 596234, "epoch": 7183} {"train_loss": -27.809101104736328, "global_step": 596235, "epoch": 7183} {"train_loss": -28.20438003540039, "global_step": 596236, "epoch": 7183} {"train_loss": -28.205915451049805, "global_step": 596237, "epoch": 7183} {"train_loss": -28.22768211364746, "global_step": 596238, "epoch": 7183} {"train_loss": -28.063058853149414, "global_step": 596239, "epoch": 7183} {"train_loss": -28.178924560546875, "global_step": 596240, "epoch": 7183} {"train_loss": -28.206491470336914, "global_step": 596241, "epoch": 7183} {"train_loss": -28.001394271850586, "global_step": 596242, "epoch": 7183} {"train_loss": -28.019439697265625, "global_step": 596243, "epoch": 7183} {"train_loss": -28.287799835205078, "global_step": 596244, "epoch": 7183} {"train_loss": -28.171789169311523, "global_step": 596245, "epoch": 7183} {"train_loss": -28.062137603759766, "global_step": 596246, "epoch": 7183} {"train_loss": -28.234420776367188, "global_step": 596247, "epoch": 7183} {"train_loss": -28.473108291625977, "global_step": 596248, "epoch": 7183} {"train_loss": -28.134790420532227, "global_step": 596249, "epoch": 7183} {"train_loss": -28.21248435974121, "global_step": 596250, "epoch": 7183} {"train_loss": -28.280975341796875, "global_step": 596251, "epoch": 7183} {"train_loss": -28.15595054626465, "global_step": 596252, "epoch": 7183} {"train_loss": -28.374250411987305, "global_step": 596253, "epoch": 7183} {"train_loss": -28.365570068359375, "global_step": 596254, "epoch": 7183} {"train_loss": -27.978296279907227, "global_step": 596255, "epoch": 7183} {"train_loss": -27.7562313079834, "global_step": 596256, "epoch": 7183} {"train_loss": -28.555444717407227, "global_step": 596257, "epoch": 7183} {"train_loss": -28.137643814086914, "global_step": 596258, "epoch": 7183} {"train_loss": -28.21088218688965, "global_step": 596259, "epoch": 7183} {"train_loss": -27.883047103881836, "global_step": 596260, "epoch": 7183} {"train_loss": -28.120676040649414, "global_step": 596261, "epoch": 7183} {"train_loss": -28.259199142456055, "global_step": 596262, "epoch": 7183} {"train_loss": -27.35687828063965, "global_step": 596263, "epoch": 7183} {"train_loss": -27.912317276000977, "global_step": 596264, "epoch": 7183} {"train_loss": -27.600988388061523, "global_step": 596265, "epoch": 7183} {"train_loss": -27.993616104125977, "global_step": 596266, "epoch": 7183} {"train_loss": -27.91607093811035, "global_step": 596267, "epoch": 7183} {"train_loss": -28.487287521362305, "global_step": 596268, "epoch": 7183} {"train_loss": -28.049514770507812, "global_step": 596269, "epoch": 7183} {"train_loss": -28.16571617126465, "global_step": 596270, "epoch": 7183} {"train_loss": -27.919185247765967, "global_step": 596271, "epoch": 7183, "val_loss": 6517140.0} {"train_loss": -26.606109619140625, "global_step": 596272, "epoch": 7184} {"train_loss": -25.413366317749023, "global_step": 596273, "epoch": 7184} {"train_loss": -26.034250259399414, "global_step": 596274, "epoch": 7184} {"train_loss": -26.86814308166504, "global_step": 596275, "epoch": 7184} {"train_loss": -26.130746841430664, "global_step": 596276, "epoch": 7184} {"train_loss": -26.98891258239746, "global_step": 596277, "epoch": 7184} {"train_loss": -27.041614532470703, "global_step": 596278, "epoch": 7184} {"train_loss": -27.3955020904541, "global_step": 596279, "epoch": 7184} {"train_loss": -26.81146240234375, "global_step": 596280, "epoch": 7184} {"train_loss": -27.428491592407227, "global_step": 596281, "epoch": 7184} {"train_loss": -27.1966495513916, "global_step": 596282, "epoch": 7184} {"train_loss": -27.43818473815918, "global_step": 596283, "epoch": 7184} {"train_loss": -27.67450523376465, "global_step": 596284, "epoch": 7184} {"train_loss": -27.310327529907227, "global_step": 596285, "epoch": 7184} {"train_loss": -27.352035522460938, "global_step": 596286, "epoch": 7184} {"train_loss": -27.770599365234375, "global_step": 596287, "epoch": 7184} {"train_loss": -27.18597984313965, "global_step": 596288, "epoch": 7184} {"train_loss": -27.772897720336914, "global_step": 596289, "epoch": 7184} {"train_loss": -27.470014572143555, "global_step": 596290, "epoch": 7184} {"train_loss": -27.96857261657715, "global_step": 596291, "epoch": 7184} {"train_loss": -27.665679931640625, "global_step": 596292, "epoch": 7184} {"train_loss": -27.506742477416992, "global_step": 596293, "epoch": 7184} {"train_loss": -27.586700439453125, "global_step": 596294, "epoch": 7184} {"train_loss": -27.647586822509766, "global_step": 596295, "epoch": 7184} {"train_loss": -27.437469482421875, "global_step": 596296, "epoch": 7184} {"train_loss": -28.202075958251953, "global_step": 596297, "epoch": 7184} {"train_loss": -27.7441349029541, "global_step": 596298, "epoch": 7184} {"train_loss": -27.8314266204834, "global_step": 596299, "epoch": 7184} {"train_loss": -27.744953155517578, "global_step": 596300, "epoch": 7184} {"train_loss": -27.73272132873535, "global_step": 596301, "epoch": 7184} {"train_loss": -27.9348201751709, "global_step": 596302, "epoch": 7184} {"train_loss": -27.832843780517578, "global_step": 596303, "epoch": 7184} {"train_loss": -28.05352210998535, "global_step": 596304, "epoch": 7184} {"train_loss": -28.09100341796875, "global_step": 596305, "epoch": 7184} {"train_loss": -28.24599266052246, "global_step": 596306, "epoch": 7184} {"train_loss": -27.937952041625977, "global_step": 596307, "epoch": 7184} {"train_loss": -27.936471939086914, "global_step": 596308, "epoch": 7184} {"train_loss": -28.14646339416504, "global_step": 596309, "epoch": 7184} {"train_loss": -28.464406967163086, "global_step": 596310, "epoch": 7184} {"train_loss": -27.8587589263916, "global_step": 596311, "epoch": 7184} {"train_loss": -28.059341430664062, "global_step": 596312, "epoch": 7184} {"train_loss": -28.04973793029785, "global_step": 596313, "epoch": 7184} {"train_loss": -27.909896850585938, "global_step": 596314, "epoch": 7184} {"train_loss": -27.908863067626953, "global_step": 596315, "epoch": 7184} {"train_loss": -28.21430015563965, "global_step": 596316, "epoch": 7184} {"train_loss": -28.383716583251953, "global_step": 596317, "epoch": 7184} {"train_loss": -28.351520538330078, "global_step": 596318, "epoch": 7184} {"train_loss": -28.337385177612305, "global_step": 596319, "epoch": 7184} {"train_loss": -28.3150577545166, "global_step": 596320, "epoch": 7184} {"train_loss": -28.165557861328125, "global_step": 596321, "epoch": 7184} {"train_loss": -28.212461471557617, "global_step": 596322, "epoch": 7184} {"train_loss": -27.455265045166016, "global_step": 596323, "epoch": 7184} {"train_loss": -27.867090225219727, "global_step": 596324, "epoch": 7184} {"train_loss": -27.81922721862793, "global_step": 596325, "epoch": 7184} {"train_loss": -27.90850830078125, "global_step": 596326, "epoch": 7184} {"train_loss": -27.656070709228516, "global_step": 596327, "epoch": 7184} {"train_loss": -27.714862823486328, "global_step": 596328, "epoch": 7184} {"train_loss": -27.824243545532227, "global_step": 596329, "epoch": 7184} {"train_loss": -28.108495712280273, "global_step": 596330, "epoch": 7184} {"train_loss": -27.747528076171875, "global_step": 596331, "epoch": 7184} {"train_loss": -27.984155654907227, "global_step": 596332, "epoch": 7184} {"train_loss": -27.80219078063965, "global_step": 596333, "epoch": 7184} {"train_loss": -27.530933380126953, "global_step": 596334, "epoch": 7184} {"train_loss": -27.76776695251465, "global_step": 596335, "epoch": 7184} {"train_loss": -28.09942626953125, "global_step": 596336, "epoch": 7184} {"train_loss": -27.80356216430664, "global_step": 596337, "epoch": 7184} {"train_loss": -27.3080997467041, "global_step": 596338, "epoch": 7184} {"train_loss": -27.638172149658203, "global_step": 596339, "epoch": 7184} {"train_loss": -27.504074096679688, "global_step": 596340, "epoch": 7184} {"train_loss": -27.709827423095703, "global_step": 596341, "epoch": 7184} {"train_loss": -28.22810173034668, "global_step": 596342, "epoch": 7184} {"train_loss": -27.787006378173828, "global_step": 596343, "epoch": 7184} {"train_loss": -27.622583389282227, "global_step": 596344, "epoch": 7184} {"train_loss": -27.865076065063477, "global_step": 596345, "epoch": 7184} {"train_loss": -27.989715576171875, "global_step": 596346, "epoch": 7184} {"train_loss": -27.91863441467285, "global_step": 596347, "epoch": 7184} {"train_loss": -27.83111572265625, "global_step": 596348, "epoch": 7184} {"train_loss": -27.859750747680664, "global_step": 596349, "epoch": 7184} {"train_loss": -27.958099365234375, "global_step": 596350, "epoch": 7184} {"train_loss": -27.816558837890625, "global_step": 596351, "epoch": 7184} {"train_loss": -28.30426597595215, "global_step": 596352, "epoch": 7184} {"train_loss": -27.824026107788086, "global_step": 596353, "epoch": 7184} {"train_loss": -27.728770681174403, "global_step": 596354, "epoch": 7184, "val_loss": 6603008.0} {"train_loss": -27.44073486328125, "global_step": 596355, "epoch": 7185} {"train_loss": -28.07096290588379, "global_step": 596356, "epoch": 7185} {"train_loss": -27.861698150634766, "global_step": 596357, "epoch": 7185} {"train_loss": -27.55401039123535, "global_step": 596358, "epoch": 7185} {"train_loss": -27.658660888671875, "global_step": 596359, "epoch": 7185} {"train_loss": -27.481998443603516, "global_step": 596360, "epoch": 7185} {"train_loss": -27.78788185119629, "global_step": 596361, "epoch": 7185} {"train_loss": -27.954893112182617, "global_step": 596362, "epoch": 7185} {"train_loss": -27.95985984802246, "global_step": 596363, "epoch": 7185} {"train_loss": -27.664159774780273, "global_step": 596364, "epoch": 7185} {"train_loss": -27.807538986206055, "global_step": 596365, "epoch": 7185} {"train_loss": -27.69672203063965, "global_step": 596366, "epoch": 7185} {"train_loss": -28.010595321655273, "global_step": 596367, "epoch": 7185} {"train_loss": -27.487537384033203, "global_step": 596368, "epoch": 7185} {"train_loss": -27.759174346923828, "global_step": 596369, "epoch": 7185} {"train_loss": -27.992141723632812, "global_step": 596370, "epoch": 7185} {"train_loss": -27.877105712890625, "global_step": 596371, "epoch": 7185} {"train_loss": -27.983844757080078, "global_step": 596372, "epoch": 7185} {"train_loss": -27.833450317382812, "global_step": 596373, "epoch": 7185} {"train_loss": -28.015033721923828, "global_step": 596374, "epoch": 7185} {"train_loss": -27.92279624938965, "global_step": 596375, "epoch": 7185} {"train_loss": -28.383996963500977, "global_step": 596376, "epoch": 7185} {"train_loss": -28.50538444519043, "global_step": 596377, "epoch": 7185} {"train_loss": -28.11689567565918, "global_step": 596378, "epoch": 7185} {"train_loss": -27.817846298217773, "global_step": 596379, "epoch": 7185} {"train_loss": -28.23284912109375, "global_step": 596380, "epoch": 7185} {"train_loss": -28.149490356445312, "global_step": 596381, "epoch": 7185} {"train_loss": -28.0972900390625, "global_step": 596382, "epoch": 7185} {"train_loss": -28.354413986206055, "global_step": 596383, "epoch": 7185} {"train_loss": -27.910070419311523, "global_step": 596384, "epoch": 7185} {"train_loss": -28.046186447143555, "global_step": 596385, "epoch": 7185} {"train_loss": -28.3682918548584, "global_step": 596386, "epoch": 7185} {"train_loss": -27.85491943359375, "global_step": 596387, "epoch": 7185} {"train_loss": -27.943191528320312, "global_step": 596388, "epoch": 7185} {"train_loss": -28.095325469970703, "global_step": 596389, "epoch": 7185} {"train_loss": -28.363128662109375, "global_step": 596390, "epoch": 7185} {"train_loss": -28.322858810424805, "global_step": 596391, "epoch": 7185} {"train_loss": -28.201139450073242, "global_step": 596392, "epoch": 7185} {"train_loss": -28.401777267456055, "global_step": 596393, "epoch": 7185} {"train_loss": -28.4200439453125, "global_step": 596394, "epoch": 7185} {"train_loss": -28.08112144470215, "global_step": 596395, "epoch": 7185} {"train_loss": -28.15960121154785, "global_step": 596396, "epoch": 7185} {"train_loss": -27.828033447265625, "global_step": 596397, "epoch": 7185} {"train_loss": -27.69862937927246, "global_step": 596398, "epoch": 7185} {"train_loss": -27.234601974487305, "global_step": 596399, "epoch": 7185} {"train_loss": -26.629379272460938, "global_step": 596400, "epoch": 7185} {"train_loss": -26.288793563842773, "global_step": 596401, "epoch": 7185} {"train_loss": -27.18226432800293, "global_step": 596402, "epoch": 7185} {"train_loss": -27.83406639099121, "global_step": 596403, "epoch": 7185} {"train_loss": -28.123579025268555, "global_step": 596404, "epoch": 7185} {"train_loss": -27.32747459411621, "global_step": 596405, "epoch": 7185} {"train_loss": -28.074071884155273, "global_step": 596406, "epoch": 7185} {"train_loss": -27.926740646362305, "global_step": 596407, "epoch": 7185} {"train_loss": -28.159860610961914, "global_step": 596408, "epoch": 7185} {"train_loss": -28.189626693725586, "global_step": 596409, "epoch": 7185} {"train_loss": -28.100854873657227, "global_step": 596410, "epoch": 7185} {"train_loss": -28.181501388549805, "global_step": 596411, "epoch": 7185} {"train_loss": -28.053882598876953, "global_step": 596412, "epoch": 7185} {"train_loss": -27.977802276611328, "global_step": 596413, "epoch": 7185} {"train_loss": -28.124597549438477, "global_step": 596414, "epoch": 7185} {"train_loss": -28.17620849609375, "global_step": 596415, "epoch": 7185} {"train_loss": -27.8725643157959, "global_step": 596416, "epoch": 7185} {"train_loss": -27.865461349487305, "global_step": 596417, "epoch": 7185} {"train_loss": -28.377660751342773, "global_step": 596418, "epoch": 7185} {"train_loss": -28.07625389099121, "global_step": 596419, "epoch": 7185} {"train_loss": -27.73328971862793, "global_step": 596420, "epoch": 7185} {"train_loss": -27.85019302368164, "global_step": 596421, "epoch": 7185} {"train_loss": -28.33340835571289, "global_step": 596422, "epoch": 7185} {"train_loss": -27.82562828063965, "global_step": 596423, "epoch": 7185} {"train_loss": -28.113483428955078, "global_step": 596424, "epoch": 7185} {"train_loss": -27.918323516845703, "global_step": 596425, "epoch": 7185} {"train_loss": -28.228199005126953, "global_step": 596426, "epoch": 7185} {"train_loss": -28.333423614501953, "global_step": 596427, "epoch": 7185} {"train_loss": -28.05950355529785, "global_step": 596428, "epoch": 7185} {"train_loss": -27.88494300842285, "global_step": 596429, "epoch": 7185} {"train_loss": -28.0540771484375, "global_step": 596430, "epoch": 7185} {"train_loss": -28.24395179748535, "global_step": 596431, "epoch": 7185} {"train_loss": -28.098058700561523, "global_step": 596432, "epoch": 7185} {"train_loss": -27.25921058654785, "global_step": 596433, "epoch": 7185} {"train_loss": -27.50653076171875, "global_step": 596434, "epoch": 7185} {"train_loss": -28.308155059814453, "global_step": 596435, "epoch": 7185} {"train_loss": -27.46038246154785, "global_step": 596436, "epoch": 7185} {"train_loss": -27.93868425668004, "global_step": 596437, "epoch": 7185, "val_loss": 6595717.5} {"train_loss": -27.2385311126709, "global_step": 596438, "epoch": 7186} {"train_loss": -27.024036407470703, "global_step": 596439, "epoch": 7186} {"train_loss": -27.888174057006836, "global_step": 596440, "epoch": 7186} {"train_loss": -26.63640785217285, "global_step": 596441, "epoch": 7186} {"train_loss": -27.305622100830078, "global_step": 596442, "epoch": 7186} {"train_loss": -27.313405990600586, "global_step": 596443, "epoch": 7186} {"train_loss": -27.182104110717773, "global_step": 596444, "epoch": 7186} {"train_loss": -27.198535919189453, "global_step": 596445, "epoch": 7186} {"train_loss": -27.024585723876953, "global_step": 596446, "epoch": 7186} {"train_loss": -27.542865753173828, "global_step": 596447, "epoch": 7186} {"train_loss": -27.39776039123535, "global_step": 596448, "epoch": 7186} {"train_loss": -27.422216415405273, "global_step": 596449, "epoch": 7186} {"train_loss": -27.187192916870117, "global_step": 596450, "epoch": 7186} {"train_loss": -27.521066665649414, "global_step": 596451, "epoch": 7186} {"train_loss": -26.695531845092773, "global_step": 596452, "epoch": 7186} {"train_loss": -27.41790771484375, "global_step": 596453, "epoch": 7186} {"train_loss": -26.857709884643555, "global_step": 596454, "epoch": 7186} {"train_loss": -27.134733200073242, "global_step": 596455, "epoch": 7186} {"train_loss": -27.584095001220703, "global_step": 596456, "epoch": 7186} {"train_loss": -27.276992797851562, "global_step": 596457, "epoch": 7186} {"train_loss": -27.887237548828125, "global_step": 596458, "epoch": 7186} {"train_loss": -27.657697677612305, "global_step": 596459, "epoch": 7186} {"train_loss": -27.752399444580078, "global_step": 596460, "epoch": 7186} {"train_loss": -27.505908966064453, "global_step": 596461, "epoch": 7186} {"train_loss": -27.73995018005371, "global_step": 596462, "epoch": 7186} {"train_loss": -27.50440788269043, "global_step": 596463, "epoch": 7186} {"train_loss": -27.35877799987793, "global_step": 596464, "epoch": 7186} {"train_loss": -27.34148597717285, "global_step": 596465, "epoch": 7186} {"train_loss": -27.65846824645996, "global_step": 596466, "epoch": 7186} {"train_loss": -27.63567543029785, "global_step": 596467, "epoch": 7186} {"train_loss": -27.215396881103516, "global_step": 596468, "epoch": 7186} {"train_loss": -27.94106101989746, "global_step": 596469, "epoch": 7186} {"train_loss": -27.830036163330078, "global_step": 596470, "epoch": 7186} {"train_loss": -27.501855850219727, "global_step": 596471, "epoch": 7186} {"train_loss": -28.00960350036621, "global_step": 596472, "epoch": 7186} {"train_loss": -27.8607120513916, "global_step": 596473, "epoch": 7186} {"train_loss": -27.272247314453125, "global_step": 596474, "epoch": 7186} {"train_loss": -27.677520751953125, "global_step": 596475, "epoch": 7186} {"train_loss": -27.985462188720703, "global_step": 596476, "epoch": 7186} {"train_loss": -28.11148452758789, "global_step": 596477, "epoch": 7186} {"train_loss": -28.0011043548584, "global_step": 596478, "epoch": 7186} {"train_loss": -27.673236846923828, "global_step": 596479, "epoch": 7186} {"train_loss": -28.16729736328125, "global_step": 596480, "epoch": 7186} {"train_loss": -27.7631893157959, "global_step": 596481, "epoch": 7186} {"train_loss": -28.131772994995117, "global_step": 596482, "epoch": 7186} {"train_loss": -27.683744430541992, "global_step": 596483, "epoch": 7186} {"train_loss": -27.98611831665039, "global_step": 596484, "epoch": 7186} {"train_loss": -27.845905303955078, "global_step": 596485, "epoch": 7186} {"train_loss": -27.83588981628418, "global_step": 596486, "epoch": 7186} {"train_loss": -27.97870445251465, "global_step": 596487, "epoch": 7186} {"train_loss": -28.44536781311035, "global_step": 596488, "epoch": 7186} {"train_loss": -28.063207626342773, "global_step": 596489, "epoch": 7186} {"train_loss": -28.10043716430664, "global_step": 596490, "epoch": 7186} {"train_loss": -28.316059112548828, "global_step": 596491, "epoch": 7186} {"train_loss": -28.156356811523438, "global_step": 596492, "epoch": 7186} {"train_loss": -28.179502487182617, "global_step": 596493, "epoch": 7186} {"train_loss": -28.07099723815918, "global_step": 596494, "epoch": 7186} {"train_loss": -28.040082931518555, "global_step": 596495, "epoch": 7186} {"train_loss": -28.205371856689453, "global_step": 596496, "epoch": 7186} {"train_loss": -27.984241485595703, "global_step": 596497, "epoch": 7186} {"train_loss": -28.009265899658203, "global_step": 596498, "epoch": 7186} {"train_loss": -28.40763282775879, "global_step": 596499, "epoch": 7186} {"train_loss": -28.211395263671875, "global_step": 596500, "epoch": 7186} {"train_loss": -28.03989028930664, "global_step": 596501, "epoch": 7186} {"train_loss": -28.304737091064453, "global_step": 596502, "epoch": 7186} {"train_loss": -27.97134780883789, "global_step": 596503, "epoch": 7186} {"train_loss": -28.139554977416992, "global_step": 596504, "epoch": 7186} {"train_loss": -28.049182891845703, "global_step": 596505, "epoch": 7186} {"train_loss": -28.108224868774414, "global_step": 596506, "epoch": 7186} {"train_loss": -28.54669761657715, "global_step": 596507, "epoch": 7186} {"train_loss": -28.507726669311523, "global_step": 596508, "epoch": 7186} {"train_loss": -28.045801162719727, "global_step": 596509, "epoch": 7186} {"train_loss": -27.691314697265625, "global_step": 596510, "epoch": 7186} {"train_loss": -28.01112174987793, "global_step": 596511, "epoch": 7186} {"train_loss": -28.147314071655273, "global_step": 596512, "epoch": 7186} {"train_loss": -28.676624298095703, "global_step": 596513, "epoch": 7186} {"train_loss": -28.366113662719727, "global_step": 596514, "epoch": 7186} {"train_loss": -28.512466430664062, "global_step": 596515, "epoch": 7186} {"train_loss": -28.197280883789062, "global_step": 596516, "epoch": 7186} {"train_loss": -27.714563369750977, "global_step": 596517, "epoch": 7186} {"train_loss": -28.201725006103516, "global_step": 596518, "epoch": 7186} {"train_loss": -27.83395767211914, "global_step": 596519, "epoch": 7186} {"train_loss": -27.784194394766565, "global_step": 596520, "epoch": 7186, "val_loss": 6603696.0} {"train_loss": -26.085418701171875, "global_step": 596521, "epoch": 7187} {"train_loss": -24.500823974609375, "global_step": 596522, "epoch": 7187} {"train_loss": -24.418010711669922, "global_step": 596523, "epoch": 7187} {"train_loss": -25.092092514038086, "global_step": 596524, "epoch": 7187} {"train_loss": -26.16090965270996, "global_step": 596525, "epoch": 7187} {"train_loss": -26.658187866210938, "global_step": 596526, "epoch": 7187} {"train_loss": -26.56671142578125, "global_step": 596527, "epoch": 7187} {"train_loss": -25.9354248046875, "global_step": 596528, "epoch": 7187} {"train_loss": -26.85173988342285, "global_step": 596529, "epoch": 7187} {"train_loss": -26.35798454284668, "global_step": 596530, "epoch": 7187} {"train_loss": -26.403669357299805, "global_step": 596531, "epoch": 7187} {"train_loss": -26.530004501342773, "global_step": 596532, "epoch": 7187} {"train_loss": -26.689468383789062, "global_step": 596533, "epoch": 7187} {"train_loss": -27.331029891967773, "global_step": 596534, "epoch": 7187} {"train_loss": -26.455957412719727, "global_step": 596535, "epoch": 7187} {"train_loss": -26.45184326171875, "global_step": 596536, "epoch": 7187} {"train_loss": -27.143720626831055, "global_step": 596537, "epoch": 7187} {"train_loss": -27.10993766784668, "global_step": 596538, "epoch": 7187} {"train_loss": -26.92457389831543, "global_step": 596539, "epoch": 7187} {"train_loss": -27.36823081970215, "global_step": 596540, "epoch": 7187} {"train_loss": -27.57379150390625, "global_step": 596541, "epoch": 7187} {"train_loss": -27.284866333007812, "global_step": 596542, "epoch": 7187} {"train_loss": -27.096471786499023, "global_step": 596543, "epoch": 7187} {"train_loss": -27.2955322265625, "global_step": 596544, "epoch": 7187} {"train_loss": -26.970773696899414, "global_step": 596545, "epoch": 7187} {"train_loss": -27.75140953063965, "global_step": 596546, "epoch": 7187} {"train_loss": -27.54266929626465, "global_step": 596547, "epoch": 7187} {"train_loss": -27.50507164001465, "global_step": 596548, "epoch": 7187} {"train_loss": -27.437036514282227, "global_step": 596549, "epoch": 7187} {"train_loss": -27.3886775970459, "global_step": 596550, "epoch": 7187} {"train_loss": -27.61025047302246, "global_step": 596551, "epoch": 7187} {"train_loss": -27.571752548217773, "global_step": 596552, "epoch": 7187} {"train_loss": -27.5070743560791, "global_step": 596553, "epoch": 7187} {"train_loss": -27.3295841217041, "global_step": 596554, "epoch": 7187} {"train_loss": -27.2689151763916, "global_step": 596555, "epoch": 7187} {"train_loss": -27.927738189697266, "global_step": 596556, "epoch": 7187} {"train_loss": -27.68336296081543, "global_step": 596557, "epoch": 7187} {"train_loss": -27.58100700378418, "global_step": 596558, "epoch": 7187} {"train_loss": -27.9858341217041, "global_step": 596559, "epoch": 7187} {"train_loss": -28.031339645385742, "global_step": 596560, "epoch": 7187} {"train_loss": -27.995107650756836, "global_step": 596561, "epoch": 7187} {"train_loss": -28.1220760345459, "global_step": 596562, "epoch": 7187} {"train_loss": -27.84636878967285, "global_step": 596563, "epoch": 7187} {"train_loss": -28.244613647460938, "global_step": 596564, "epoch": 7187} {"train_loss": -28.096601486206055, "global_step": 596565, "epoch": 7187} {"train_loss": -28.05405044555664, "global_step": 596566, "epoch": 7187} {"train_loss": -28.086149215698242, "global_step": 596567, "epoch": 7187} {"train_loss": -27.68861198425293, "global_step": 596568, "epoch": 7187} {"train_loss": -27.7918758392334, "global_step": 596569, "epoch": 7187} {"train_loss": -28.394704818725586, "global_step": 596570, "epoch": 7187} {"train_loss": -27.711111068725586, "global_step": 596571, "epoch": 7187} {"train_loss": -27.722455978393555, "global_step": 596572, "epoch": 7187} {"train_loss": -28.079465866088867, "global_step": 596573, "epoch": 7187} {"train_loss": -28.430511474609375, "global_step": 596574, "epoch": 7187} {"train_loss": -27.917804718017578, "global_step": 596575, "epoch": 7187} {"train_loss": -27.697052001953125, "global_step": 596576, "epoch": 7187} {"train_loss": -27.844406127929688, "global_step": 596577, "epoch": 7187} {"train_loss": -27.99078369140625, "global_step": 596578, "epoch": 7187} {"train_loss": -27.879972457885742, "global_step": 596579, "epoch": 7187} {"train_loss": -28.204395294189453, "global_step": 596580, "epoch": 7187} {"train_loss": -27.8438777923584, "global_step": 596581, "epoch": 7187} {"train_loss": -28.063955307006836, "global_step": 596582, "epoch": 7187} {"train_loss": -28.306562423706055, "global_step": 596583, "epoch": 7187} {"train_loss": -28.144311904907227, "global_step": 596584, "epoch": 7187} {"train_loss": -28.1889591217041, "global_step": 596585, "epoch": 7187} {"train_loss": -28.123472213745117, "global_step": 596586, "epoch": 7187} {"train_loss": -27.99249267578125, "global_step": 596587, "epoch": 7187} {"train_loss": -27.822162628173828, "global_step": 596588, "epoch": 7187} {"train_loss": -28.315387725830078, "global_step": 596589, "epoch": 7187} {"train_loss": -27.93645668029785, "global_step": 596590, "epoch": 7187} {"train_loss": -28.564990997314453, "global_step": 596591, "epoch": 7187} {"train_loss": -28.279987335205078, "global_step": 596592, "epoch": 7187} {"train_loss": -28.3503475189209, "global_step": 596593, "epoch": 7187} {"train_loss": -28.05695152282715, "global_step": 596594, "epoch": 7187} {"train_loss": -28.2797794342041, "global_step": 596595, "epoch": 7187} {"train_loss": -28.3889217376709, "global_step": 596596, "epoch": 7187} {"train_loss": -28.267492294311523, "global_step": 596597, "epoch": 7187} {"train_loss": -28.25079917907715, "global_step": 596598, "epoch": 7187} {"train_loss": -28.19117546081543, "global_step": 596599, "epoch": 7187} {"train_loss": -28.174604415893555, "global_step": 596600, "epoch": 7187} {"train_loss": -28.548538208007812, "global_step": 596601, "epoch": 7187} {"train_loss": -27.94498062133789, "global_step": 596602, "epoch": 7187} {"train_loss": -27.538090556500904, "global_step": 596603, "epoch": 7187, "val_loss": 6520867.5} {"train_loss": -27.954730987548828, "global_step": 596604, "epoch": 7188} {"train_loss": -27.74481201171875, "global_step": 596605, "epoch": 7188} {"train_loss": -27.61161231994629, "global_step": 596606, "epoch": 7188} {"train_loss": -28.08790397644043, "global_step": 596607, "epoch": 7188} {"train_loss": -27.241989135742188, "global_step": 596608, "epoch": 7188} {"train_loss": -28.23247718811035, "global_step": 596609, "epoch": 7188} {"train_loss": -27.499807357788086, "global_step": 596610, "epoch": 7188} {"train_loss": -27.588153839111328, "global_step": 596611, "epoch": 7188} {"train_loss": -27.646936416625977, "global_step": 596612, "epoch": 7188} {"train_loss": -27.720075607299805, "global_step": 596613, "epoch": 7188} {"train_loss": -27.479419708251953, "global_step": 596614, "epoch": 7188} {"train_loss": -27.7954158782959, "global_step": 596615, "epoch": 7188} {"train_loss": -27.847360610961914, "global_step": 596616, "epoch": 7188} {"train_loss": -27.916894912719727, "global_step": 596617, "epoch": 7188} {"train_loss": -27.651691436767578, "global_step": 596618, "epoch": 7188} {"train_loss": -27.605932235717773, "global_step": 596619, "epoch": 7188} {"train_loss": -27.802637100219727, "global_step": 596620, "epoch": 7188} {"train_loss": -27.687719345092773, "global_step": 596621, "epoch": 7188} {"train_loss": -28.05889320373535, "global_step": 596622, "epoch": 7188} {"train_loss": -27.86469841003418, "global_step": 596623, "epoch": 7188} {"train_loss": -27.975860595703125, "global_step": 596624, "epoch": 7188} {"train_loss": -28.096952438354492, "global_step": 596625, "epoch": 7188} {"train_loss": -28.016157150268555, "global_step": 596626, "epoch": 7188} {"train_loss": -28.03116226196289, "global_step": 596627, "epoch": 7188} {"train_loss": -27.729358673095703, "global_step": 596628, "epoch": 7188} {"train_loss": -27.996265411376953, "global_step": 596629, "epoch": 7188} {"train_loss": -28.34516716003418, "global_step": 596630, "epoch": 7188} {"train_loss": -27.82708168029785, "global_step": 596631, "epoch": 7188} {"train_loss": -28.040185928344727, "global_step": 596632, "epoch": 7188} {"train_loss": -27.92884635925293, "global_step": 596633, "epoch": 7188} {"train_loss": -28.388391494750977, "global_step": 596634, "epoch": 7188} {"train_loss": -28.033191680908203, "global_step": 596635, "epoch": 7188} {"train_loss": -28.241247177124023, "global_step": 596636, "epoch": 7188} {"train_loss": -27.865955352783203, "global_step": 596637, "epoch": 7188} {"train_loss": -28.26444435119629, "global_step": 596638, "epoch": 7188} {"train_loss": -27.871021270751953, "global_step": 596639, "epoch": 7188} {"train_loss": -27.79026222229004, "global_step": 596640, "epoch": 7188} {"train_loss": -27.957059860229492, "global_step": 596641, "epoch": 7188} {"train_loss": -28.214599609375, "global_step": 596642, "epoch": 7188} {"train_loss": -27.9331111907959, "global_step": 596643, "epoch": 7188} {"train_loss": -28.047338485717773, "global_step": 596644, "epoch": 7188} {"train_loss": -27.85917091369629, "global_step": 596645, "epoch": 7188} {"train_loss": -28.183881759643555, "global_step": 596646, "epoch": 7188} {"train_loss": -27.982318878173828, "global_step": 596647, "epoch": 7188} {"train_loss": -28.10573387145996, "global_step": 596648, "epoch": 7188} {"train_loss": -27.865158081054688, "global_step": 596649, "epoch": 7188} {"train_loss": -28.201324462890625, "global_step": 596650, "epoch": 7188} {"train_loss": -27.94679069519043, "global_step": 596651, "epoch": 7188} {"train_loss": -28.028106689453125, "global_step": 596652, "epoch": 7188} {"train_loss": -27.832275390625, "global_step": 596653, "epoch": 7188} {"train_loss": -28.155792236328125, "global_step": 596654, "epoch": 7188} {"train_loss": -27.995527267456055, "global_step": 596655, "epoch": 7188} {"train_loss": -28.049192428588867, "global_step": 596656, "epoch": 7188} {"train_loss": -28.012033462524414, "global_step": 596657, "epoch": 7188} {"train_loss": -27.765975952148438, "global_step": 596658, "epoch": 7188} {"train_loss": -27.670333862304688, "global_step": 596659, "epoch": 7188} {"train_loss": -28.056238174438477, "global_step": 596660, "epoch": 7188} {"train_loss": -28.116601943969727, "global_step": 596661, "epoch": 7188} {"train_loss": -27.780811309814453, "global_step": 596662, "epoch": 7188} {"train_loss": -28.345258712768555, "global_step": 596663, "epoch": 7188} {"train_loss": -27.972064971923828, "global_step": 596664, "epoch": 7188} {"train_loss": -27.879901885986328, "global_step": 596665, "epoch": 7188} {"train_loss": -28.050933837890625, "global_step": 596666, "epoch": 7188} {"train_loss": -28.20611000061035, "global_step": 596667, "epoch": 7188} {"train_loss": -28.2811279296875, "global_step": 596668, "epoch": 7188} {"train_loss": -27.688161849975586, "global_step": 596669, "epoch": 7188} {"train_loss": -28.203857421875, "global_step": 596670, "epoch": 7188} {"train_loss": -27.90399169921875, "global_step": 596671, "epoch": 7188} {"train_loss": -27.71101188659668, "global_step": 596672, "epoch": 7188} {"train_loss": -27.934057235717773, "global_step": 596673, "epoch": 7188} {"train_loss": -28.34119987487793, "global_step": 596674, "epoch": 7188} {"train_loss": -28.2548770904541, "global_step": 596675, "epoch": 7188} {"train_loss": -27.709447860717773, "global_step": 596676, "epoch": 7188} {"train_loss": -28.052722930908203, "global_step": 596677, "epoch": 7188} {"train_loss": -27.873205184936523, "global_step": 596678, "epoch": 7188} {"train_loss": -28.278549194335938, "global_step": 596679, "epoch": 7188} {"train_loss": -27.98713493347168, "global_step": 596680, "epoch": 7188} {"train_loss": -27.615406036376953, "global_step": 596681, "epoch": 7188} {"train_loss": -27.89006996154785, "global_step": 596682, "epoch": 7188} {"train_loss": -28.1859130859375, "global_step": 596683, "epoch": 7188} {"train_loss": -28.137083053588867, "global_step": 596684, "epoch": 7188} {"train_loss": -28.04910659790039, "global_step": 596685, "epoch": 7188} {"train_loss": -27.96127087236887, "global_step": 596686, "epoch": 7188, "val_loss": 6592417.0} {"train_loss": -26.556659698486328, "global_step": 596687, "epoch": 7189} {"train_loss": -25.523122787475586, "global_step": 596688, "epoch": 7189} {"train_loss": -25.77024269104004, "global_step": 596689, "epoch": 7189} {"train_loss": -26.3831729888916, "global_step": 596690, "epoch": 7189} {"train_loss": -26.78759765625, "global_step": 596691, "epoch": 7189} {"train_loss": -26.80030632019043, "global_step": 596692, "epoch": 7189} {"train_loss": -26.0858211517334, "global_step": 596693, "epoch": 7189} {"train_loss": -27.20476722717285, "global_step": 596694, "epoch": 7189} {"train_loss": -26.500720977783203, "global_step": 596695, "epoch": 7189} {"train_loss": -27.576261520385742, "global_step": 596696, "epoch": 7189} {"train_loss": -27.062265396118164, "global_step": 596697, "epoch": 7189} {"train_loss": -27.479990005493164, "global_step": 596698, "epoch": 7189} {"train_loss": -27.145429611206055, "global_step": 596699, "epoch": 7189} {"train_loss": -27.160322189331055, "global_step": 596700, "epoch": 7189} {"train_loss": -27.559173583984375, "global_step": 596701, "epoch": 7189} {"train_loss": -27.67581558227539, "global_step": 596702, "epoch": 7189} {"train_loss": -27.51923942565918, "global_step": 596703, "epoch": 7189} {"train_loss": -27.210498809814453, "global_step": 596704, "epoch": 7189} {"train_loss": -27.639745712280273, "global_step": 596705, "epoch": 7189} {"train_loss": -27.331314086914062, "global_step": 596706, "epoch": 7189} {"train_loss": -27.081445693969727, "global_step": 596707, "epoch": 7189} {"train_loss": -27.446577072143555, "global_step": 596708, "epoch": 7189} {"train_loss": -27.595678329467773, "global_step": 596709, "epoch": 7189} {"train_loss": -27.79610252380371, "global_step": 596710, "epoch": 7189} {"train_loss": -27.417333602905273, "global_step": 596711, "epoch": 7189} {"train_loss": -27.436304092407227, "global_step": 596712, "epoch": 7189} {"train_loss": -27.74896812438965, "global_step": 596713, "epoch": 7189} {"train_loss": -27.371992111206055, "global_step": 596714, "epoch": 7189} {"train_loss": -27.533857345581055, "global_step": 596715, "epoch": 7189} {"train_loss": -27.775104522705078, "global_step": 596716, "epoch": 7189} {"train_loss": -27.828779220581055, "global_step": 596717, "epoch": 7189} {"train_loss": -27.777952194213867, "global_step": 596718, "epoch": 7189} {"train_loss": -28.08051109313965, "global_step": 596719, "epoch": 7189} {"train_loss": -27.715368270874023, "global_step": 596720, "epoch": 7189} {"train_loss": -27.906951904296875, "global_step": 596721, "epoch": 7189} {"train_loss": -28.01434898376465, "global_step": 596722, "epoch": 7189} {"train_loss": -27.96516227722168, "global_step": 596723, "epoch": 7189} {"train_loss": -27.916534423828125, "global_step": 596724, "epoch": 7189} {"train_loss": -27.695697784423828, "global_step": 596725, "epoch": 7189} {"train_loss": -28.233015060424805, "global_step": 596726, "epoch": 7189} {"train_loss": -27.75214958190918, "global_step": 596727, "epoch": 7189} {"train_loss": -27.99365234375, "global_step": 596728, "epoch": 7189} {"train_loss": -28.2655086517334, "global_step": 596729, "epoch": 7189} {"train_loss": -28.182971954345703, "global_step": 596730, "epoch": 7189} {"train_loss": -27.912525177001953, "global_step": 596731, "epoch": 7189} {"train_loss": -28.06949806213379, "global_step": 596732, "epoch": 7189} {"train_loss": -28.520872116088867, "global_step": 596733, "epoch": 7189} {"train_loss": -28.137624740600586, "global_step": 596734, "epoch": 7189} {"train_loss": -28.005884170532227, "global_step": 596735, "epoch": 7189} {"train_loss": -27.992359161376953, "global_step": 596736, "epoch": 7189} {"train_loss": -27.813779830932617, "global_step": 596737, "epoch": 7189} {"train_loss": -28.198511123657227, "global_step": 596738, "epoch": 7189} {"train_loss": -28.051965713500977, "global_step": 596739, "epoch": 7189} {"train_loss": -28.334171295166016, "global_step": 596740, "epoch": 7189} {"train_loss": -27.692914962768555, "global_step": 596741, "epoch": 7189} {"train_loss": -28.219446182250977, "global_step": 596742, "epoch": 7189} {"train_loss": -28.232080459594727, "global_step": 596743, "epoch": 7189} {"train_loss": -28.356794357299805, "global_step": 596744, "epoch": 7189} {"train_loss": -27.946582794189453, "global_step": 596745, "epoch": 7189} {"train_loss": -28.10114097595215, "global_step": 596746, "epoch": 7189} {"train_loss": -28.37424659729004, "global_step": 596747, "epoch": 7189} {"train_loss": -28.26938819885254, "global_step": 596748, "epoch": 7189} {"train_loss": -27.880573272705078, "global_step": 596749, "epoch": 7189} {"train_loss": -28.524662017822266, "global_step": 596750, "epoch": 7189} {"train_loss": -27.940271377563477, "global_step": 596751, "epoch": 7189} {"train_loss": -28.138254165649414, "global_step": 596752, "epoch": 7189} {"train_loss": -27.91476821899414, "global_step": 596753, "epoch": 7189} {"train_loss": -28.33169937133789, "global_step": 596754, "epoch": 7189} {"train_loss": -28.605066299438477, "global_step": 596755, "epoch": 7189} {"train_loss": -27.999052047729492, "global_step": 596756, "epoch": 7189} {"train_loss": -28.53922462463379, "global_step": 596757, "epoch": 7189} {"train_loss": -27.9729061126709, "global_step": 596758, "epoch": 7189} {"train_loss": -27.97511100769043, "global_step": 596759, "epoch": 7189} {"train_loss": -27.9312801361084, "global_step": 596760, "epoch": 7189} {"train_loss": -28.0362606048584, "global_step": 596761, "epoch": 7189} {"train_loss": -28.0565242767334, "global_step": 596762, "epoch": 7189} {"train_loss": -27.518402099609375, "global_step": 596763, "epoch": 7189} {"train_loss": -27.6804141998291, "global_step": 596764, "epoch": 7189} {"train_loss": -28.00149917602539, "global_step": 596765, "epoch": 7189} {"train_loss": -27.991687774658203, "global_step": 596766, "epoch": 7189} {"train_loss": -28.119409561157227, "global_step": 596767, "epoch": 7189} {"train_loss": -28.135101318359375, "global_step": 596768, "epoch": 7189} {"train_loss": -27.72823949607022, "global_step": 596769, "epoch": 7189, "val_loss": 6567610.0} {"train_loss": -27.513568878173828, "global_step": 596770, "epoch": 7190} {"train_loss": -26.912677764892578, "global_step": 596771, "epoch": 7190} {"train_loss": -26.82996940612793, "global_step": 596772, "epoch": 7190} {"train_loss": -27.301197052001953, "global_step": 596773, "epoch": 7190} {"train_loss": -27.636341094970703, "global_step": 596774, "epoch": 7190} {"train_loss": -27.379962921142578, "global_step": 596775, "epoch": 7190} {"train_loss": -27.55657386779785, "global_step": 596776, "epoch": 7190} {"train_loss": -27.482946395874023, "global_step": 596777, "epoch": 7190} {"train_loss": -27.43988037109375, "global_step": 596778, "epoch": 7190} {"train_loss": -27.464426040649414, "global_step": 596779, "epoch": 7190} {"train_loss": -27.7828369140625, "global_step": 596780, "epoch": 7190} {"train_loss": -26.957813262939453, "global_step": 596781, "epoch": 7190} {"train_loss": -27.365034103393555, "global_step": 596782, "epoch": 7190} {"train_loss": -27.477493286132812, "global_step": 596783, "epoch": 7190} {"train_loss": -27.66192626953125, "global_step": 596784, "epoch": 7190} {"train_loss": -27.54499626159668, "global_step": 596785, "epoch": 7190} {"train_loss": -27.420307159423828, "global_step": 596786, "epoch": 7190} {"train_loss": -27.852209091186523, "global_step": 596787, "epoch": 7190} {"train_loss": -27.43255043029785, "global_step": 596788, "epoch": 7190} {"train_loss": -27.56324577331543, "global_step": 596789, "epoch": 7190} {"train_loss": -27.79324722290039, "global_step": 596790, "epoch": 7190} {"train_loss": -27.915287017822266, "global_step": 596791, "epoch": 7190} {"train_loss": -27.722705841064453, "global_step": 596792, "epoch": 7190} {"train_loss": -27.612232208251953, "global_step": 596793, "epoch": 7190} {"train_loss": -28.00564956665039, "global_step": 596794, "epoch": 7190} {"train_loss": -27.667821884155273, "global_step": 596795, "epoch": 7190} {"train_loss": -27.876317977905273, "global_step": 596796, "epoch": 7190} {"train_loss": -27.774763107299805, "global_step": 596797, "epoch": 7190} {"train_loss": -27.747812271118164, "global_step": 596798, "epoch": 7190} {"train_loss": -28.048933029174805, "global_step": 596799, "epoch": 7190} {"train_loss": -28.1396484375, "global_step": 596800, "epoch": 7190} {"train_loss": -27.80637550354004, "global_step": 596801, "epoch": 7190} {"train_loss": -27.95448112487793, "global_step": 596802, "epoch": 7190} {"train_loss": -27.861371994018555, "global_step": 596803, "epoch": 7190} {"train_loss": -27.898099899291992, "global_step": 596804, "epoch": 7190} {"train_loss": -27.99468994140625, "global_step": 596805, "epoch": 7190} {"train_loss": -27.805816650390625, "global_step": 596806, "epoch": 7190} {"train_loss": -27.774566650390625, "global_step": 596807, "epoch": 7190} {"train_loss": -28.014928817749023, "global_step": 596808, "epoch": 7190} {"train_loss": -27.979949951171875, "global_step": 596809, "epoch": 7190} {"train_loss": -27.9428653717041, "global_step": 596810, "epoch": 7190} {"train_loss": -27.749475479125977, "global_step": 596811, "epoch": 7190} {"train_loss": -27.70975685119629, "global_step": 596812, "epoch": 7190} {"train_loss": -27.92829704284668, "global_step": 596813, "epoch": 7190} {"train_loss": -28.06253433227539, "global_step": 596814, "epoch": 7190} {"train_loss": -27.692672729492188, "global_step": 596815, "epoch": 7190} {"train_loss": -28.071069717407227, "global_step": 596816, "epoch": 7190} {"train_loss": -28.02789306640625, "global_step": 596817, "epoch": 7190} {"train_loss": -28.04669189453125, "global_step": 596818, "epoch": 7190} {"train_loss": -28.270566940307617, "global_step": 596819, "epoch": 7190} {"train_loss": -27.812768936157227, "global_step": 596820, "epoch": 7190} {"train_loss": -27.701690673828125, "global_step": 596821, "epoch": 7190} {"train_loss": -28.085651397705078, "global_step": 596822, "epoch": 7190} {"train_loss": -28.348560333251953, "global_step": 596823, "epoch": 7190} {"train_loss": -27.842864990234375, "global_step": 596824, "epoch": 7190} {"train_loss": -27.934864044189453, "global_step": 596825, "epoch": 7190} {"train_loss": -28.48960304260254, "global_step": 596826, "epoch": 7190} {"train_loss": -28.019617080688477, "global_step": 596827, "epoch": 7190} {"train_loss": -27.821191787719727, "global_step": 596828, "epoch": 7190} {"train_loss": -28.32402992248535, "global_step": 596829, "epoch": 7190} {"train_loss": -28.320493698120117, "global_step": 596830, "epoch": 7190} {"train_loss": -28.474546432495117, "global_step": 596831, "epoch": 7190} {"train_loss": -28.07390785217285, "global_step": 596832, "epoch": 7190} {"train_loss": -27.788330078125, "global_step": 596833, "epoch": 7190} {"train_loss": -27.93073844909668, "global_step": 596834, "epoch": 7190} {"train_loss": -27.715717315673828, "global_step": 596835, "epoch": 7190} {"train_loss": -28.272729873657227, "global_step": 596836, "epoch": 7190} {"train_loss": -28.05598258972168, "global_step": 596837, "epoch": 7190} {"train_loss": -28.461225509643555, "global_step": 596838, "epoch": 7190} {"train_loss": -28.21717643737793, "global_step": 596839, "epoch": 7190} {"train_loss": -27.79060935974121, "global_step": 596840, "epoch": 7190} {"train_loss": -28.05061912536621, "global_step": 596841, "epoch": 7190} {"train_loss": -27.890310287475586, "global_step": 596842, "epoch": 7190} {"train_loss": -28.339859008789062, "global_step": 596843, "epoch": 7190} {"train_loss": -27.71337890625, "global_step": 596844, "epoch": 7190} {"train_loss": -27.912565231323242, "global_step": 596845, "epoch": 7190} {"train_loss": -28.07172966003418, "global_step": 596846, "epoch": 7190} {"train_loss": -28.124555587768555, "global_step": 596847, "epoch": 7190} {"train_loss": -27.779829025268555, "global_step": 596848, "epoch": 7190} {"train_loss": -27.990772247314453, "global_step": 596849, "epoch": 7190} {"train_loss": -28.03302574157715, "global_step": 596850, "epoch": 7190} {"train_loss": -28.016345977783203, "global_step": 596851, "epoch": 7190} {"train_loss": -27.8391136261354, "global_step": 596852, "epoch": 7190, "val_loss": 6588406.0} {"train_loss": -27.760150909423828, "global_step": 596853, "epoch": 7191} {"train_loss": -27.28165054321289, "global_step": 596854, "epoch": 7191} {"train_loss": -26.86775779724121, "global_step": 596855, "epoch": 7191} {"train_loss": -27.95016860961914, "global_step": 596856, "epoch": 7191} {"train_loss": -27.67439079284668, "global_step": 596857, "epoch": 7191} {"train_loss": -27.320636749267578, "global_step": 596858, "epoch": 7191} {"train_loss": -27.56440544128418, "global_step": 596859, "epoch": 7191} {"train_loss": -27.36785316467285, "global_step": 596860, "epoch": 7191} {"train_loss": -27.467966079711914, "global_step": 596861, "epoch": 7191} {"train_loss": -27.010547637939453, "global_step": 596862, "epoch": 7191} {"train_loss": -27.157032012939453, "global_step": 596863, "epoch": 7191} {"train_loss": -27.500720977783203, "global_step": 596864, "epoch": 7191} {"train_loss": -27.258737564086914, "global_step": 596865, "epoch": 7191} {"train_loss": -27.610218048095703, "global_step": 596866, "epoch": 7191} {"train_loss": -27.635541915893555, "global_step": 596867, "epoch": 7191} {"train_loss": -27.768814086914062, "global_step": 596868, "epoch": 7191} {"train_loss": -27.786970138549805, "global_step": 596869, "epoch": 7191} {"train_loss": -27.87214469909668, "global_step": 596870, "epoch": 7191} {"train_loss": -27.44949722290039, "global_step": 596871, "epoch": 7191} {"train_loss": -27.962894439697266, "global_step": 596872, "epoch": 7191} {"train_loss": -27.798017501831055, "global_step": 596873, "epoch": 7191} {"train_loss": -28.225889205932617, "global_step": 596874, "epoch": 7191} {"train_loss": -27.907262802124023, "global_step": 596875, "epoch": 7191} {"train_loss": -27.720136642456055, "global_step": 596876, "epoch": 7191} {"train_loss": -28.035003662109375, "global_step": 596877, "epoch": 7191} {"train_loss": -27.848684310913086, "global_step": 596878, "epoch": 7191} {"train_loss": -28.084577560424805, "global_step": 596879, "epoch": 7191} {"train_loss": -27.877044677734375, "global_step": 596880, "epoch": 7191} {"train_loss": -27.73392677307129, "global_step": 596881, "epoch": 7191} {"train_loss": -28.1341552734375, "global_step": 596882, "epoch": 7191} {"train_loss": -28.0526123046875, "global_step": 596883, "epoch": 7191} {"train_loss": -27.937604904174805, "global_step": 596884, "epoch": 7191} {"train_loss": -27.972015380859375, "global_step": 596885, "epoch": 7191} {"train_loss": -28.362918853759766, "global_step": 596886, "epoch": 7191} {"train_loss": -28.2064151763916, "global_step": 596887, "epoch": 7191} {"train_loss": -28.09979820251465, "global_step": 596888, "epoch": 7191} {"train_loss": -28.250614166259766, "global_step": 596889, "epoch": 7191} {"train_loss": -28.371143341064453, "global_step": 596890, "epoch": 7191} {"train_loss": -28.219837188720703, "global_step": 596891, "epoch": 7191} {"train_loss": -28.337955474853516, "global_step": 596892, "epoch": 7191} {"train_loss": -28.189748764038086, "global_step": 596893, "epoch": 7191} {"train_loss": -28.022424697875977, "global_step": 596894, "epoch": 7191} {"train_loss": -28.072052001953125, "global_step": 596895, "epoch": 7191} {"train_loss": -28.318286895751953, "global_step": 596896, "epoch": 7191} {"train_loss": -28.304548263549805, "global_step": 596897, "epoch": 7191} {"train_loss": -28.431543350219727, "global_step": 596898, "epoch": 7191} {"train_loss": -28.075363159179688, "global_step": 596899, "epoch": 7191} {"train_loss": -28.215749740600586, "global_step": 596900, "epoch": 7191} {"train_loss": -28.314359664916992, "global_step": 596901, "epoch": 7191} {"train_loss": -27.845956802368164, "global_step": 596902, "epoch": 7191} {"train_loss": -28.434524536132812, "global_step": 596903, "epoch": 7191} {"train_loss": -28.417646408081055, "global_step": 596904, "epoch": 7191} {"train_loss": -28.19582176208496, "global_step": 596905, "epoch": 7191} {"train_loss": -27.93659019470215, "global_step": 596906, "epoch": 7191} {"train_loss": -28.31281089782715, "global_step": 596907, "epoch": 7191} {"train_loss": -28.12042808532715, "global_step": 596908, "epoch": 7191} {"train_loss": -28.3781681060791, "global_step": 596909, "epoch": 7191} {"train_loss": -28.088397979736328, "global_step": 596910, "epoch": 7191} {"train_loss": -27.6926326751709, "global_step": 596911, "epoch": 7191} {"train_loss": -27.8143367767334, "global_step": 596912, "epoch": 7191} {"train_loss": -27.96944236755371, "global_step": 596913, "epoch": 7191} {"train_loss": -28.269216537475586, "global_step": 596914, "epoch": 7191} {"train_loss": -27.964147567749023, "global_step": 596915, "epoch": 7191} {"train_loss": -28.280364990234375, "global_step": 596916, "epoch": 7191} {"train_loss": -27.948469161987305, "global_step": 596917, "epoch": 7191} {"train_loss": -27.569061279296875, "global_step": 596918, "epoch": 7191} {"train_loss": -27.86639976501465, "global_step": 596919, "epoch": 7191} {"train_loss": -27.84357261657715, "global_step": 596920, "epoch": 7191} {"train_loss": -27.28619956970215, "global_step": 596921, "epoch": 7191} {"train_loss": -27.689289093017578, "global_step": 596922, "epoch": 7191} {"train_loss": -27.972137451171875, "global_step": 596923, "epoch": 7191} {"train_loss": -28.32295036315918, "global_step": 596924, "epoch": 7191} {"train_loss": -28.197385787963867, "global_step": 596925, "epoch": 7191} {"train_loss": -28.359058380126953, "global_step": 596926, "epoch": 7191} {"train_loss": -27.646366119384766, "global_step": 596927, "epoch": 7191} {"train_loss": -27.931665420532227, "global_step": 596928, "epoch": 7191} {"train_loss": -28.2860107421875, "global_step": 596929, "epoch": 7191} {"train_loss": -28.1406192779541, "global_step": 596930, "epoch": 7191} {"train_loss": -28.187833786010742, "global_step": 596931, "epoch": 7191} {"train_loss": -28.223419189453125, "global_step": 596932, "epoch": 7191} {"train_loss": -28.148345947265625, "global_step": 596933, "epoch": 7191} {"train_loss": -27.911273956298828, "global_step": 596934, "epoch": 7191} {"train_loss": -27.924061625836842, "global_step": 596935, "epoch": 7191, "val_loss": 6595652.5} {"train_loss": -27.032501220703125, "global_step": 596936, "epoch": 7192} {"train_loss": -26.812946319580078, "global_step": 596937, "epoch": 7192} {"train_loss": -27.078022003173828, "global_step": 596938, "epoch": 7192} {"train_loss": -25.590269088745117, "global_step": 596939, "epoch": 7192} {"train_loss": -26.872777938842773, "global_step": 596940, "epoch": 7192} {"train_loss": -26.92626953125, "global_step": 596941, "epoch": 7192} {"train_loss": -27.039072036743164, "global_step": 596942, "epoch": 7192} {"train_loss": -27.35965347290039, "global_step": 596943, "epoch": 7192} {"train_loss": -27.63979148864746, "global_step": 596944, "epoch": 7192} {"train_loss": -27.7707576751709, "global_step": 596945, "epoch": 7192} {"train_loss": -27.422046661376953, "global_step": 596946, "epoch": 7192} {"train_loss": -27.326807022094727, "global_step": 596947, "epoch": 7192} {"train_loss": -27.437768936157227, "global_step": 596948, "epoch": 7192} {"train_loss": -27.785663604736328, "global_step": 596949, "epoch": 7192} {"train_loss": -27.7467041015625, "global_step": 596950, "epoch": 7192} {"train_loss": -28.09521484375, "global_step": 596951, "epoch": 7192} {"train_loss": -27.517850875854492, "global_step": 596952, "epoch": 7192} {"train_loss": -27.899261474609375, "global_step": 596953, "epoch": 7192} {"train_loss": -27.65797996520996, "global_step": 596954, "epoch": 7192} {"train_loss": -27.67994499206543, "global_step": 596955, "epoch": 7192} {"train_loss": -28.065305709838867, "global_step": 596956, "epoch": 7192} {"train_loss": -27.7764949798584, "global_step": 596957, "epoch": 7192} {"train_loss": -27.934722900390625, "global_step": 596958, "epoch": 7192} {"train_loss": -28.07100486755371, "global_step": 596959, "epoch": 7192} {"train_loss": -27.72698402404785, "global_step": 596960, "epoch": 7192} {"train_loss": -27.466480255126953, "global_step": 596961, "epoch": 7192} {"train_loss": -28.022348403930664, "global_step": 596962, "epoch": 7192} {"train_loss": -27.853479385375977, "global_step": 596963, "epoch": 7192} {"train_loss": -27.82346534729004, "global_step": 596964, "epoch": 7192} {"train_loss": -27.855213165283203, "global_step": 596965, "epoch": 7192} {"train_loss": -27.969369888305664, "global_step": 596966, "epoch": 7192} {"train_loss": -27.920215606689453, "global_step": 596967, "epoch": 7192} {"train_loss": -28.08016014099121, "global_step": 596968, "epoch": 7192} {"train_loss": -28.226795196533203, "global_step": 596969, "epoch": 7192} {"train_loss": -28.18558120727539, "global_step": 596970, "epoch": 7192} {"train_loss": -28.4605655670166, "global_step": 596971, "epoch": 7192} {"train_loss": -28.375553131103516, "global_step": 596972, "epoch": 7192} {"train_loss": -28.27142906188965, "global_step": 596973, "epoch": 7192} {"train_loss": -28.591943740844727, "global_step": 596974, "epoch": 7192} {"train_loss": -28.1312313079834, "global_step": 596975, "epoch": 7192} {"train_loss": -28.152143478393555, "global_step": 596976, "epoch": 7192} {"train_loss": -28.473276138305664, "global_step": 596977, "epoch": 7192} {"train_loss": -28.293731689453125, "global_step": 596978, "epoch": 7192} {"train_loss": -28.243621826171875, "global_step": 596979, "epoch": 7192} {"train_loss": -28.2866153717041, "global_step": 596980, "epoch": 7192} {"train_loss": -28.342275619506836, "global_step": 596981, "epoch": 7192} {"train_loss": -28.118284225463867, "global_step": 596982, "epoch": 7192} {"train_loss": -28.033340454101562, "global_step": 596983, "epoch": 7192} {"train_loss": -28.05194664001465, "global_step": 596984, "epoch": 7192} {"train_loss": -28.206253051757812, "global_step": 596985, "epoch": 7192} {"train_loss": -27.898700714111328, "global_step": 596986, "epoch": 7192} {"train_loss": -27.233591079711914, "global_step": 596987, "epoch": 7192} {"train_loss": -26.12479019165039, "global_step": 596988, "epoch": 7192} {"train_loss": -25.13558006286621, "global_step": 596989, "epoch": 7192} {"train_loss": -23.805320739746094, "global_step": 596990, "epoch": 7192} {"train_loss": -22.99981689453125, "global_step": 596991, "epoch": 7192} {"train_loss": -27.467670440673828, "global_step": 596992, "epoch": 7192} {"train_loss": -25.4923038482666, "global_step": 596993, "epoch": 7192} {"train_loss": -27.631311416625977, "global_step": 596994, "epoch": 7192} {"train_loss": -26.267847061157227, "global_step": 596995, "epoch": 7192} {"train_loss": -27.06097984313965, "global_step": 596996, "epoch": 7192} {"train_loss": -26.9633846282959, "global_step": 596997, "epoch": 7192} {"train_loss": -26.910322189331055, "global_step": 596998, "epoch": 7192} {"train_loss": -27.166797637939453, "global_step": 596999, "epoch": 7192} {"train_loss": -27.446136474609375, "global_step": 597000, "epoch": 7192} {"train_loss": -27.280893325805664, "global_step": 597001, "epoch": 7192} {"train_loss": -27.310819625854492, "global_step": 597002, "epoch": 7192} {"train_loss": -27.384845733642578, "global_step": 597003, "epoch": 7192} {"train_loss": -27.367279052734375, "global_step": 597004, "epoch": 7192} {"train_loss": -27.367401123046875, "global_step": 597005, "epoch": 7192} {"train_loss": -27.160791397094727, "global_step": 597006, "epoch": 7192} {"train_loss": -27.246057510375977, "global_step": 597007, "epoch": 7192} {"train_loss": -27.679834365844727, "global_step": 597008, "epoch": 7192} {"train_loss": -27.299835205078125, "global_step": 597009, "epoch": 7192} {"train_loss": -27.524221420288086, "global_step": 597010, "epoch": 7192} {"train_loss": -27.388031005859375, "global_step": 597011, "epoch": 7192} {"train_loss": -27.476896286010742, "global_step": 597012, "epoch": 7192} {"train_loss": -27.566633224487305, "global_step": 597013, "epoch": 7192} {"train_loss": -27.204687118530273, "global_step": 597014, "epoch": 7192} {"train_loss": -27.447607040405273, "global_step": 597015, "epoch": 7192} {"train_loss": -27.917774200439453, "global_step": 597016, "epoch": 7192} {"train_loss": -27.516080856323242, "global_step": 597017, "epoch": 7192} {"train_loss": -27.466116824782038, "global_step": 597018, "epoch": 7192, "val_loss": 6720540.0} {"train_loss": -27.34906578063965, "global_step": 597019, "epoch": 7193} {"train_loss": -27.406003952026367, "global_step": 597020, "epoch": 7193} {"train_loss": -27.619131088256836, "global_step": 597021, "epoch": 7193} {"train_loss": -27.6044979095459, "global_step": 597022, "epoch": 7193} {"train_loss": -27.452239990234375, "global_step": 597023, "epoch": 7193} {"train_loss": -27.755191802978516, "global_step": 597024, "epoch": 7193} {"train_loss": -27.750843048095703, "global_step": 597025, "epoch": 7193} {"train_loss": -27.615280151367188, "global_step": 597026, "epoch": 7193} {"train_loss": -27.48455810546875, "global_step": 597027, "epoch": 7193} {"train_loss": -27.451461791992188, "global_step": 597028, "epoch": 7193} {"train_loss": -27.76506996154785, "global_step": 597029, "epoch": 7193} {"train_loss": -27.892797470092773, "global_step": 597030, "epoch": 7193} {"train_loss": -28.24146842956543, "global_step": 597031, "epoch": 7193} {"train_loss": -27.752105712890625, "global_step": 597032, "epoch": 7193} {"train_loss": -27.966333389282227, "global_step": 597033, "epoch": 7193} {"train_loss": -28.10695457458496, "global_step": 597034, "epoch": 7193} {"train_loss": -27.9482364654541, "global_step": 597035, "epoch": 7193} {"train_loss": -27.98552894592285, "global_step": 597036, "epoch": 7193} {"train_loss": -27.84494400024414, "global_step": 597037, "epoch": 7193} {"train_loss": -27.9606876373291, "global_step": 597038, "epoch": 7193} {"train_loss": -27.56268310546875, "global_step": 597039, "epoch": 7193} {"train_loss": -28.22150993347168, "global_step": 597040, "epoch": 7193} {"train_loss": -28.036325454711914, "global_step": 597041, "epoch": 7193} {"train_loss": -28.2635440826416, "global_step": 597042, "epoch": 7193} {"train_loss": -27.981525421142578, "global_step": 597043, "epoch": 7193} {"train_loss": -27.97079849243164, "global_step": 597044, "epoch": 7193} {"train_loss": -27.89935302734375, "global_step": 597045, "epoch": 7193} {"train_loss": -28.0715274810791, "global_step": 597046, "epoch": 7193} {"train_loss": -27.99921989440918, "global_step": 597047, "epoch": 7193} {"train_loss": -27.980976104736328, "global_step": 597048, "epoch": 7193} {"train_loss": -27.688535690307617, "global_step": 597049, "epoch": 7193} {"train_loss": -28.005329132080078, "global_step": 597050, "epoch": 7193} {"train_loss": -28.044387817382812, "global_step": 597051, "epoch": 7193} {"train_loss": -27.733320236206055, "global_step": 597052, "epoch": 7193} {"train_loss": -27.077533721923828, "global_step": 597053, "epoch": 7193} {"train_loss": -27.226285934448242, "global_step": 597054, "epoch": 7193} {"train_loss": -27.48004722595215, "global_step": 597055, "epoch": 7193} {"train_loss": -27.80979347229004, "global_step": 597056, "epoch": 7193} {"train_loss": -27.6569881439209, "global_step": 597057, "epoch": 7193} {"train_loss": -27.75042724609375, "global_step": 597058, "epoch": 7193} {"train_loss": -27.413990020751953, "global_step": 597059, "epoch": 7193} {"train_loss": -27.67575454711914, "global_step": 597060, "epoch": 7193} {"train_loss": -27.262720108032227, "global_step": 597061, "epoch": 7193} {"train_loss": -28.448801040649414, "global_step": 597062, "epoch": 7193} {"train_loss": -27.219058990478516, "global_step": 597063, "epoch": 7193} {"train_loss": -27.89226722717285, "global_step": 597064, "epoch": 7193} {"train_loss": -27.622028350830078, "global_step": 597065, "epoch": 7193} {"train_loss": -27.927490234375, "global_step": 597066, "epoch": 7193} {"train_loss": -27.56340980529785, "global_step": 597067, "epoch": 7193} {"train_loss": -27.612812042236328, "global_step": 597068, "epoch": 7193} {"train_loss": -27.771535873413086, "global_step": 597069, "epoch": 7193} {"train_loss": -27.991851806640625, "global_step": 597070, "epoch": 7193} {"train_loss": -27.679462432861328, "global_step": 597071, "epoch": 7193} {"train_loss": -27.9858455657959, "global_step": 597072, "epoch": 7193} {"train_loss": -27.95501708984375, "global_step": 597073, "epoch": 7193} {"train_loss": -27.779630661010742, "global_step": 597074, "epoch": 7193} {"train_loss": -27.90589714050293, "global_step": 597075, "epoch": 7193} {"train_loss": -28.097091674804688, "global_step": 597076, "epoch": 7193} {"train_loss": -28.15656852722168, "global_step": 597077, "epoch": 7193} {"train_loss": -28.179914474487305, "global_step": 597078, "epoch": 7193} {"train_loss": -28.028539657592773, "global_step": 597079, "epoch": 7193} {"train_loss": -27.7071533203125, "global_step": 597080, "epoch": 7193} {"train_loss": -28.186445236206055, "global_step": 597081, "epoch": 7193} {"train_loss": -28.075550079345703, "global_step": 597082, "epoch": 7193} {"train_loss": -28.17786979675293, "global_step": 597083, "epoch": 7193} {"train_loss": -27.8214054107666, "global_step": 597084, "epoch": 7193} {"train_loss": -28.2431583404541, "global_step": 597085, "epoch": 7193} {"train_loss": -28.028173446655273, "global_step": 597086, "epoch": 7193} {"train_loss": -28.558746337890625, "global_step": 597087, "epoch": 7193} {"train_loss": -28.036508560180664, "global_step": 597088, "epoch": 7193} {"train_loss": -28.0145206451416, "global_step": 597089, "epoch": 7193} {"train_loss": -28.165639877319336, "global_step": 597090, "epoch": 7193} {"train_loss": -28.278669357299805, "global_step": 597091, "epoch": 7193} {"train_loss": -27.9873046875, "global_step": 597092, "epoch": 7193} {"train_loss": -27.6619815826416, "global_step": 597093, "epoch": 7193} {"train_loss": -28.35664176940918, "global_step": 597094, "epoch": 7193} {"train_loss": -28.19540786743164, "global_step": 597095, "epoch": 7193} {"train_loss": -27.917938232421875, "global_step": 597096, "epoch": 7193} {"train_loss": -28.282123565673828, "global_step": 597097, "epoch": 7193} {"train_loss": -28.020002365112305, "global_step": 597098, "epoch": 7193} {"train_loss": -28.286773681640625, "global_step": 597099, "epoch": 7193} {"train_loss": -28.096708297729492, "global_step": 597100, "epoch": 7193} {"train_loss": -27.87988062939012, "global_step": 597101, "epoch": 7193, "val_loss": 6682925.0} {"train_loss": -27.90919303894043, "global_step": 597102, "epoch": 7194} {"train_loss": -27.930540084838867, "global_step": 597103, "epoch": 7194} {"train_loss": -27.993091583251953, "global_step": 597104, "epoch": 7194} {"train_loss": -27.931791305541992, "global_step": 597105, "epoch": 7194} {"train_loss": -27.607025146484375, "global_step": 597106, "epoch": 7194} {"train_loss": -27.76922607421875, "global_step": 597107, "epoch": 7194} {"train_loss": -27.943552017211914, "global_step": 597108, "epoch": 7194} {"train_loss": -27.986103057861328, "global_step": 597109, "epoch": 7194} {"train_loss": -27.84742546081543, "global_step": 597110, "epoch": 7194} {"train_loss": -28.03618812561035, "global_step": 597111, "epoch": 7194} {"train_loss": -28.120380401611328, "global_step": 597112, "epoch": 7194} {"train_loss": -27.933273315429688, "global_step": 597113, "epoch": 7194} {"train_loss": -28.253873825073242, "global_step": 597114, "epoch": 7194} {"train_loss": -27.749481201171875, "global_step": 597115, "epoch": 7194} {"train_loss": -27.58955192565918, "global_step": 597116, "epoch": 7194} {"train_loss": -27.857770919799805, "global_step": 597117, "epoch": 7194} {"train_loss": -27.585973739624023, "global_step": 597118, "epoch": 7194} {"train_loss": -28.089441299438477, "global_step": 597119, "epoch": 7194} {"train_loss": -28.051443099975586, "global_step": 597120, "epoch": 7194} {"train_loss": -28.17462158203125, "global_step": 597121, "epoch": 7194} {"train_loss": -27.51509666442871, "global_step": 597122, "epoch": 7194} {"train_loss": -27.529727935791016, "global_step": 597123, "epoch": 7194} {"train_loss": -27.641559600830078, "global_step": 597124, "epoch": 7194} {"train_loss": -28.039825439453125, "global_step": 597125, "epoch": 7194} {"train_loss": -27.856836318969727, "global_step": 597126, "epoch": 7194} {"train_loss": -28.02936363220215, "global_step": 597127, "epoch": 7194} {"train_loss": -27.51597023010254, "global_step": 597128, "epoch": 7194} {"train_loss": -27.7099609375, "global_step": 597129, "epoch": 7194} {"train_loss": -28.034040451049805, "global_step": 597130, "epoch": 7194} {"train_loss": -27.901472091674805, "global_step": 597131, "epoch": 7194} {"train_loss": -27.845701217651367, "global_step": 597132, "epoch": 7194} {"train_loss": -27.945966720581055, "global_step": 597133, "epoch": 7194} {"train_loss": -27.67280387878418, "global_step": 597134, "epoch": 7194} {"train_loss": -27.879581451416016, "global_step": 597135, "epoch": 7194} {"train_loss": -28.122480392456055, "global_step": 597136, "epoch": 7194} {"train_loss": -27.468366622924805, "global_step": 597137, "epoch": 7194} {"train_loss": -27.950397491455078, "global_step": 597138, "epoch": 7194} {"train_loss": -28.099618911743164, "global_step": 597139, "epoch": 7194} {"train_loss": -27.31208610534668, "global_step": 597140, "epoch": 7194} {"train_loss": -28.136920928955078, "global_step": 597141, "epoch": 7194} {"train_loss": -27.845142364501953, "global_step": 597142, "epoch": 7194} {"train_loss": -27.692825317382812, "global_step": 597143, "epoch": 7194} {"train_loss": -28.20256996154785, "global_step": 597144, "epoch": 7194} {"train_loss": -27.982681274414062, "global_step": 597145, "epoch": 7194} {"train_loss": -28.04164695739746, "global_step": 597146, "epoch": 7194} {"train_loss": -27.969213485717773, "global_step": 597147, "epoch": 7194} {"train_loss": -27.995893478393555, "global_step": 597148, "epoch": 7194} {"train_loss": -27.751102447509766, "global_step": 597149, "epoch": 7194} {"train_loss": -27.64878273010254, "global_step": 597150, "epoch": 7194} {"train_loss": -27.96671485900879, "global_step": 597151, "epoch": 7194} {"train_loss": -27.668432235717773, "global_step": 597152, "epoch": 7194} {"train_loss": -28.006149291992188, "global_step": 597153, "epoch": 7194} {"train_loss": -27.977649688720703, "global_step": 597154, "epoch": 7194} {"train_loss": -27.994861602783203, "global_step": 597155, "epoch": 7194} {"train_loss": -27.580896377563477, "global_step": 597156, "epoch": 7194} {"train_loss": -28.008955001831055, "global_step": 597157, "epoch": 7194} {"train_loss": -28.159109115600586, "global_step": 597158, "epoch": 7194} {"train_loss": -28.062414169311523, "global_step": 597159, "epoch": 7194} {"train_loss": -28.012527465820312, "global_step": 597160, "epoch": 7194} {"train_loss": -28.010116577148438, "global_step": 597161, "epoch": 7194} {"train_loss": -28.196813583374023, "global_step": 597162, "epoch": 7194} {"train_loss": -27.60113525390625, "global_step": 597163, "epoch": 7194} {"train_loss": -28.442853927612305, "global_step": 597164, "epoch": 7194} {"train_loss": -27.826889038085938, "global_step": 597165, "epoch": 7194} {"train_loss": -27.887205123901367, "global_step": 597166, "epoch": 7194} {"train_loss": -27.778335571289062, "global_step": 597167, "epoch": 7194} {"train_loss": -27.781845092773438, "global_step": 597168, "epoch": 7194} {"train_loss": -28.192092895507812, "global_step": 597169, "epoch": 7194} {"train_loss": -28.260061264038086, "global_step": 597170, "epoch": 7194} {"train_loss": -27.85672950744629, "global_step": 597171, "epoch": 7194} {"train_loss": -27.52019691467285, "global_step": 597172, "epoch": 7194} {"train_loss": -27.5944881439209, "global_step": 597173, "epoch": 7194} {"train_loss": -28.09493064880371, "global_step": 597174, "epoch": 7194} {"train_loss": -27.7974910736084, "global_step": 597175, "epoch": 7194} {"train_loss": -28.195199966430664, "global_step": 597176, "epoch": 7194} {"train_loss": -27.369918823242188, "global_step": 597177, "epoch": 7194} {"train_loss": -28.110992431640625, "global_step": 597178, "epoch": 7194} {"train_loss": -28.312665939331055, "global_step": 597179, "epoch": 7194} {"train_loss": -28.308263778686523, "global_step": 597180, "epoch": 7194} {"train_loss": -27.9958553314209, "global_step": 597181, "epoch": 7194} {"train_loss": -28.170841217041016, "global_step": 597182, "epoch": 7194} {"train_loss": -28.121063232421875, "global_step": 597183, "epoch": 7194} {"train_loss": -27.915085390389685, "global_step": 597184, "epoch": 7194, "val_loss": 6754780.5} {"train_loss": -26.92227554321289, "global_step": 597185, "epoch": 7195} {"train_loss": -27.13956642150879, "global_step": 597186, "epoch": 7195} {"train_loss": -26.992746353149414, "global_step": 597187, "epoch": 7195} {"train_loss": -27.0909423828125, "global_step": 597188, "epoch": 7195} {"train_loss": -27.332733154296875, "global_step": 597189, "epoch": 7195} {"train_loss": -27.60358238220215, "global_step": 597190, "epoch": 7195} {"train_loss": -27.427988052368164, "global_step": 597191, "epoch": 7195} {"train_loss": -27.25355339050293, "global_step": 597192, "epoch": 7195} {"train_loss": -27.536691665649414, "global_step": 597193, "epoch": 7195} {"train_loss": -27.397424697875977, "global_step": 597194, "epoch": 7195} {"train_loss": -27.640960693359375, "global_step": 597195, "epoch": 7195} {"train_loss": -27.408002853393555, "global_step": 597196, "epoch": 7195} {"train_loss": -27.647785186767578, "global_step": 597197, "epoch": 7195} {"train_loss": -28.063068389892578, "global_step": 597198, "epoch": 7195} {"train_loss": -27.956674575805664, "global_step": 597199, "epoch": 7195} {"train_loss": -27.898462295532227, "global_step": 597200, "epoch": 7195} {"train_loss": -27.79420280456543, "global_step": 597201, "epoch": 7195} {"train_loss": -27.497495651245117, "global_step": 597202, "epoch": 7195} {"train_loss": -27.937732696533203, "global_step": 597203, "epoch": 7195} {"train_loss": -27.96791648864746, "global_step": 597204, "epoch": 7195} {"train_loss": -27.57441520690918, "global_step": 597205, "epoch": 7195} {"train_loss": -27.89908790588379, "global_step": 597206, "epoch": 7195} {"train_loss": -28.131153106689453, "global_step": 597207, "epoch": 7195} {"train_loss": -27.643131256103516, "global_step": 597208, "epoch": 7195} {"train_loss": -27.546422958374023, "global_step": 597209, "epoch": 7195} {"train_loss": -27.966724395751953, "global_step": 597210, "epoch": 7195} {"train_loss": -28.319110870361328, "global_step": 597211, "epoch": 7195} {"train_loss": -28.200286865234375, "global_step": 597212, "epoch": 7195} {"train_loss": -27.667179107666016, "global_step": 597213, "epoch": 7195} {"train_loss": -28.067251205444336, "global_step": 597214, "epoch": 7195} {"train_loss": -27.998620986938477, "global_step": 597215, "epoch": 7195} {"train_loss": -27.8671875, "global_step": 597216, "epoch": 7195} {"train_loss": -27.805517196655273, "global_step": 597217, "epoch": 7195} {"train_loss": -27.795989990234375, "global_step": 597218, "epoch": 7195} {"train_loss": -28.140716552734375, "global_step": 597219, "epoch": 7195} {"train_loss": -27.939062118530273, "global_step": 597220, "epoch": 7195} {"train_loss": -28.022480010986328, "global_step": 597221, "epoch": 7195} {"train_loss": -28.110815048217773, "global_step": 597222, "epoch": 7195} {"train_loss": -28.268091201782227, "global_step": 597223, "epoch": 7195} {"train_loss": -27.86976432800293, "global_step": 597224, "epoch": 7195} {"train_loss": -28.117536544799805, "global_step": 597225, "epoch": 7195} {"train_loss": -28.092361450195312, "global_step": 597226, "epoch": 7195} {"train_loss": -28.160688400268555, "global_step": 597227, "epoch": 7195} {"train_loss": -28.155073165893555, "global_step": 597228, "epoch": 7195} {"train_loss": -27.80670738220215, "global_step": 597229, "epoch": 7195} {"train_loss": -28.14786148071289, "global_step": 597230, "epoch": 7195} {"train_loss": -27.85774040222168, "global_step": 597231, "epoch": 7195} {"train_loss": -28.228607177734375, "global_step": 597232, "epoch": 7195} {"train_loss": -28.138904571533203, "global_step": 597233, "epoch": 7195} {"train_loss": -28.10212516784668, "global_step": 597234, "epoch": 7195} {"train_loss": -27.910919189453125, "global_step": 597235, "epoch": 7195} {"train_loss": -28.459115982055664, "global_step": 597236, "epoch": 7195} {"train_loss": -27.767568588256836, "global_step": 597237, "epoch": 7195} {"train_loss": -28.092636108398438, "global_step": 597238, "epoch": 7195} {"train_loss": -27.877531051635742, "global_step": 597239, "epoch": 7195} {"train_loss": -28.399030685424805, "global_step": 597240, "epoch": 7195} {"train_loss": -28.122175216674805, "global_step": 597241, "epoch": 7195} {"train_loss": -28.091632843017578, "global_step": 597242, "epoch": 7195} {"train_loss": -28.637353897094727, "global_step": 597243, "epoch": 7195} {"train_loss": -28.118255615234375, "global_step": 597244, "epoch": 7195} {"train_loss": -28.241239547729492, "global_step": 597245, "epoch": 7195} {"train_loss": -27.94919204711914, "global_step": 597246, "epoch": 7195} {"train_loss": -28.039342880249023, "global_step": 597247, "epoch": 7195} {"train_loss": -28.00697898864746, "global_step": 597248, "epoch": 7195} {"train_loss": -28.488000869750977, "global_step": 597249, "epoch": 7195} {"train_loss": -27.96255874633789, "global_step": 597250, "epoch": 7195} {"train_loss": -28.1162166595459, "global_step": 597251, "epoch": 7195} {"train_loss": -27.790109634399414, "global_step": 597252, "epoch": 7195} {"train_loss": -28.27982521057129, "global_step": 597253, "epoch": 7195} {"train_loss": -28.063573837280273, "global_step": 597254, "epoch": 7195} {"train_loss": -28.06580924987793, "global_step": 597255, "epoch": 7195} {"train_loss": -28.067541122436523, "global_step": 597256, "epoch": 7195} {"train_loss": -28.14777183532715, "global_step": 597257, "epoch": 7195} {"train_loss": -28.095916748046875, "global_step": 597258, "epoch": 7195} {"train_loss": -28.29127311706543, "global_step": 597259, "epoch": 7195} {"train_loss": -28.23903465270996, "global_step": 597260, "epoch": 7195} {"train_loss": -27.88526725769043, "global_step": 597261, "epoch": 7195} {"train_loss": -27.81915855407715, "global_step": 597262, "epoch": 7195} {"train_loss": -27.874755859375, "global_step": 597263, "epoch": 7195} {"train_loss": -27.7384033203125, "global_step": 597264, "epoch": 7195} {"train_loss": -27.516721725463867, "global_step": 597265, "epoch": 7195} {"train_loss": -27.001646041870117, "global_step": 597266, "epoch": 7195} {"train_loss": -27.894974214484893, "global_step": 597267, "epoch": 7195, "val_loss": 6635951.5} {"train_loss": -27.454843521118164, "global_step": 597268, "epoch": 7196} {"train_loss": -27.150684356689453, "global_step": 597269, "epoch": 7196} {"train_loss": -27.264829635620117, "global_step": 597270, "epoch": 7196} {"train_loss": -26.9266357421875, "global_step": 597271, "epoch": 7196} {"train_loss": -27.688180923461914, "global_step": 597272, "epoch": 7196} {"train_loss": -27.28879165649414, "global_step": 597273, "epoch": 7196} {"train_loss": -27.574689865112305, "global_step": 597274, "epoch": 7196} {"train_loss": -27.407705307006836, "global_step": 597275, "epoch": 7196} {"train_loss": -27.321210861206055, "global_step": 597276, "epoch": 7196} {"train_loss": -27.407190322875977, "global_step": 597277, "epoch": 7196} {"train_loss": -27.468229293823242, "global_step": 597278, "epoch": 7196} {"train_loss": -27.55280876159668, "global_step": 597279, "epoch": 7196} {"train_loss": -27.188995361328125, "global_step": 597280, "epoch": 7196} {"train_loss": -28.08963966369629, "global_step": 597281, "epoch": 7196} {"train_loss": -27.476308822631836, "global_step": 597282, "epoch": 7196} {"train_loss": -27.630817413330078, "global_step": 597283, "epoch": 7196} {"train_loss": -27.62175941467285, "global_step": 597284, "epoch": 7196} {"train_loss": -27.454389572143555, "global_step": 597285, "epoch": 7196} {"train_loss": -27.44422721862793, "global_step": 597286, "epoch": 7196} {"train_loss": -27.506427764892578, "global_step": 597287, "epoch": 7196} {"train_loss": -27.729175567626953, "global_step": 597288, "epoch": 7196} {"train_loss": -27.832626342773438, "global_step": 597289, "epoch": 7196} {"train_loss": -27.718341827392578, "global_step": 597290, "epoch": 7196} {"train_loss": -27.854156494140625, "global_step": 597291, "epoch": 7196} {"train_loss": -27.98995018005371, "global_step": 597292, "epoch": 7196} {"train_loss": -27.927078247070312, "global_step": 597293, "epoch": 7196} {"train_loss": -27.925048828125, "global_step": 597294, "epoch": 7196} {"train_loss": -27.786975860595703, "global_step": 597295, "epoch": 7196} {"train_loss": -27.933813095092773, "global_step": 597296, "epoch": 7196} {"train_loss": -27.924787521362305, "global_step": 597297, "epoch": 7196} {"train_loss": -28.06064796447754, "global_step": 597298, "epoch": 7196} {"train_loss": -27.7883358001709, "global_step": 597299, "epoch": 7196} {"train_loss": -27.6888484954834, "global_step": 597300, "epoch": 7196} {"train_loss": -27.93548011779785, "global_step": 597301, "epoch": 7196} {"train_loss": -28.2375545501709, "global_step": 597302, "epoch": 7196} {"train_loss": -27.532018661499023, "global_step": 597303, "epoch": 7196} {"train_loss": -28.068578720092773, "global_step": 597304, "epoch": 7196} {"train_loss": -27.93633460998535, "global_step": 597305, "epoch": 7196} {"train_loss": -27.88026237487793, "global_step": 597306, "epoch": 7196} {"train_loss": -28.0297908782959, "global_step": 597307, "epoch": 7196} {"train_loss": -28.2139835357666, "global_step": 597308, "epoch": 7196} {"train_loss": -28.333850860595703, "global_step": 597309, "epoch": 7196} {"train_loss": -28.561391830444336, "global_step": 597310, "epoch": 7196} {"train_loss": -28.332605361938477, "global_step": 597311, "epoch": 7196} {"train_loss": -28.642810821533203, "global_step": 597312, "epoch": 7196} {"train_loss": -28.411359786987305, "global_step": 597313, "epoch": 7196} {"train_loss": -28.238676071166992, "global_step": 597314, "epoch": 7196} {"train_loss": -28.22810935974121, "global_step": 597315, "epoch": 7196} {"train_loss": -27.82330894470215, "global_step": 597316, "epoch": 7196} {"train_loss": -28.194189071655273, "global_step": 597317, "epoch": 7196} {"train_loss": -27.72287940979004, "global_step": 597318, "epoch": 7196} {"train_loss": -27.485212326049805, "global_step": 597319, "epoch": 7196} {"train_loss": -27.223037719726562, "global_step": 597320, "epoch": 7196} {"train_loss": -26.794164657592773, "global_step": 597321, "epoch": 7196} {"train_loss": -27.29707145690918, "global_step": 597322, "epoch": 7196} {"train_loss": -27.37565040588379, "global_step": 597323, "epoch": 7196} {"train_loss": -28.051776885986328, "global_step": 597324, "epoch": 7196} {"train_loss": -28.278030395507812, "global_step": 597325, "epoch": 7196} {"train_loss": -27.987573623657227, "global_step": 597326, "epoch": 7196} {"train_loss": -27.79628562927246, "global_step": 597327, "epoch": 7196} {"train_loss": -27.80741310119629, "global_step": 597328, "epoch": 7196} {"train_loss": -28.010412216186523, "global_step": 597329, "epoch": 7196} {"train_loss": -28.024457931518555, "global_step": 597330, "epoch": 7196} {"train_loss": -27.63164710998535, "global_step": 597331, "epoch": 7196} {"train_loss": -27.9906063079834, "global_step": 597332, "epoch": 7196} {"train_loss": -27.966053009033203, "global_step": 597333, "epoch": 7196} {"train_loss": -28.354251861572266, "global_step": 597334, "epoch": 7196} {"train_loss": -27.89021110534668, "global_step": 597335, "epoch": 7196} {"train_loss": -27.879608154296875, "global_step": 597336, "epoch": 7196} {"train_loss": -28.29473304748535, "global_step": 597337, "epoch": 7196} {"train_loss": -28.339771270751953, "global_step": 597338, "epoch": 7196} {"train_loss": -28.197265625, "global_step": 597339, "epoch": 7196} {"train_loss": -28.1220760345459, "global_step": 597340, "epoch": 7196} {"train_loss": -27.88508415222168, "global_step": 597341, "epoch": 7196} {"train_loss": -28.299108505249023, "global_step": 597342, "epoch": 7196} {"train_loss": -28.050806045532227, "global_step": 597343, "epoch": 7196} {"train_loss": -27.99306297302246, "global_step": 597344, "epoch": 7196} {"train_loss": -27.97431755065918, "global_step": 597345, "epoch": 7196} {"train_loss": -28.13092613220215, "global_step": 597346, "epoch": 7196} {"train_loss": -28.015262603759766, "global_step": 597347, "epoch": 7196} {"train_loss": -28.270893096923828, "global_step": 597348, "epoch": 7196} {"train_loss": -28.0870361328125, "global_step": 597349, "epoch": 7196} {"train_loss": -27.85123399941318, "global_step": 597350, "epoch": 7196, "val_loss": 6628498.0} {"train_loss": -27.453779220581055, "global_step": 597351, "epoch": 7197} {"train_loss": -27.313068389892578, "global_step": 597352, "epoch": 7197} {"train_loss": -26.93587303161621, "global_step": 597353, "epoch": 7197} {"train_loss": -27.171436309814453, "global_step": 597354, "epoch": 7197} {"train_loss": -26.703033447265625, "global_step": 597355, "epoch": 7197} {"train_loss": -27.196142196655273, "global_step": 597356, "epoch": 7197} {"train_loss": -27.483509063720703, "global_step": 597357, "epoch": 7197} {"train_loss": -27.553991317749023, "global_step": 597358, "epoch": 7197} {"train_loss": -27.382434844970703, "global_step": 597359, "epoch": 7197} {"train_loss": -27.612218856811523, "global_step": 597360, "epoch": 7197} {"train_loss": -27.698123931884766, "global_step": 597361, "epoch": 7197} {"train_loss": -27.38313102722168, "global_step": 597362, "epoch": 7197} {"train_loss": -27.588043212890625, "global_step": 597363, "epoch": 7197} {"train_loss": -27.5718994140625, "global_step": 597364, "epoch": 7197} {"train_loss": -27.216772079467773, "global_step": 597365, "epoch": 7197} {"train_loss": -28.0686092376709, "global_step": 597366, "epoch": 7197} {"train_loss": -27.599674224853516, "global_step": 597367, "epoch": 7197} {"train_loss": -27.844955444335938, "global_step": 597368, "epoch": 7197} {"train_loss": -27.924957275390625, "global_step": 597369, "epoch": 7197} {"train_loss": -28.11463737487793, "global_step": 597370, "epoch": 7197} {"train_loss": -27.650678634643555, "global_step": 597371, "epoch": 7197} {"train_loss": -28.0214900970459, "global_step": 597372, "epoch": 7197} {"train_loss": -27.9086856842041, "global_step": 597373, "epoch": 7197} {"train_loss": -28.239776611328125, "global_step": 597374, "epoch": 7197} {"train_loss": -28.141332626342773, "global_step": 597375, "epoch": 7197} {"train_loss": -27.829730987548828, "global_step": 597376, "epoch": 7197} {"train_loss": -27.94378089904785, "global_step": 597377, "epoch": 7197} {"train_loss": -27.871566772460938, "global_step": 597378, "epoch": 7197} {"train_loss": -27.865697860717773, "global_step": 597379, "epoch": 7197} {"train_loss": -28.241132736206055, "global_step": 597380, "epoch": 7197} {"train_loss": -28.339704513549805, "global_step": 597381, "epoch": 7197} {"train_loss": -27.891416549682617, "global_step": 597382, "epoch": 7197} {"train_loss": -28.072406768798828, "global_step": 597383, "epoch": 7197} {"train_loss": -28.052001953125, "global_step": 597384, "epoch": 7197} {"train_loss": -27.799245834350586, "global_step": 597385, "epoch": 7197} {"train_loss": -28.312976837158203, "global_step": 597386, "epoch": 7197} {"train_loss": -28.3588924407959, "global_step": 597387, "epoch": 7197} {"train_loss": -28.490896224975586, "global_step": 597388, "epoch": 7197} {"train_loss": -28.636449813842773, "global_step": 597389, "epoch": 7197} {"train_loss": -27.972412109375, "global_step": 597390, "epoch": 7197} {"train_loss": -27.68324089050293, "global_step": 597391, "epoch": 7197} {"train_loss": -28.311267852783203, "global_step": 597392, "epoch": 7197} {"train_loss": -28.129852294921875, "global_step": 597393, "epoch": 7197} {"train_loss": -28.340167999267578, "global_step": 597394, "epoch": 7197} {"train_loss": -27.96030044555664, "global_step": 597395, "epoch": 7197} {"train_loss": -28.374597549438477, "global_step": 597396, "epoch": 7197} {"train_loss": -28.420225143432617, "global_step": 597397, "epoch": 7197} {"train_loss": -27.996170043945312, "global_step": 597398, "epoch": 7197} {"train_loss": -28.02570915222168, "global_step": 597399, "epoch": 7197} {"train_loss": -28.59881591796875, "global_step": 597400, "epoch": 7197} {"train_loss": -28.3996524810791, "global_step": 597401, "epoch": 7197} {"train_loss": -27.998239517211914, "global_step": 597402, "epoch": 7197} {"train_loss": -28.388751983642578, "global_step": 597403, "epoch": 7197} {"train_loss": -28.239439010620117, "global_step": 597404, "epoch": 7197} {"train_loss": -28.271814346313477, "global_step": 597405, "epoch": 7197} {"train_loss": -28.28809928894043, "global_step": 597406, "epoch": 7197} {"train_loss": -28.226964950561523, "global_step": 597407, "epoch": 7197} {"train_loss": -28.274723052978516, "global_step": 597408, "epoch": 7197} {"train_loss": -27.932392120361328, "global_step": 597409, "epoch": 7197} {"train_loss": -27.34547233581543, "global_step": 597410, "epoch": 7197} {"train_loss": -26.827713012695312, "global_step": 597411, "epoch": 7197} {"train_loss": -26.8194522857666, "global_step": 597412, "epoch": 7197} {"train_loss": -27.621122360229492, "global_step": 597413, "epoch": 7197} {"train_loss": -27.86209487915039, "global_step": 597414, "epoch": 7197} {"train_loss": -27.294296264648438, "global_step": 597415, "epoch": 7197} {"train_loss": -27.06642723083496, "global_step": 597416, "epoch": 7197} {"train_loss": -27.359134674072266, "global_step": 597417, "epoch": 7197} {"train_loss": -27.537084579467773, "global_step": 597418, "epoch": 7197} {"train_loss": -27.400415420532227, "global_step": 597419, "epoch": 7197} {"train_loss": -28.06168556213379, "global_step": 597420, "epoch": 7197} {"train_loss": -27.81048011779785, "global_step": 597421, "epoch": 7197} {"train_loss": -28.1729736328125, "global_step": 597422, "epoch": 7197} {"train_loss": -27.758359909057617, "global_step": 597423, "epoch": 7197} {"train_loss": -27.55099868774414, "global_step": 597424, "epoch": 7197} {"train_loss": -27.755048751831055, "global_step": 597425, "epoch": 7197} {"train_loss": -27.935413360595703, "global_step": 597426, "epoch": 7197} {"train_loss": -28.039520263671875, "global_step": 597427, "epoch": 7197} {"train_loss": -27.9676456451416, "global_step": 597428, "epoch": 7197} {"train_loss": -28.28999137878418, "global_step": 597429, "epoch": 7197} {"train_loss": -28.105182647705078, "global_step": 597430, "epoch": 7197} {"train_loss": -28.5336971282959, "global_step": 597431, "epoch": 7197} {"train_loss": -27.979455947875977, "global_step": 597432, "epoch": 7197} {"train_loss": -27.859454924801746, "global_step": 597433, "epoch": 7197, "val_loss": 6597350.5} {"train_loss": -27.25189781188965, "global_step": 597434, "epoch": 7198} {"train_loss": -27.55165672302246, "global_step": 597435, "epoch": 7198} {"train_loss": -27.28024673461914, "global_step": 597436, "epoch": 7198} {"train_loss": -27.0531005859375, "global_step": 597437, "epoch": 7198} {"train_loss": -27.494321823120117, "global_step": 597438, "epoch": 7198} {"train_loss": -27.43560218811035, "global_step": 597439, "epoch": 7198} {"train_loss": -27.766143798828125, "global_step": 597440, "epoch": 7198} {"train_loss": -27.664403915405273, "global_step": 597441, "epoch": 7198} {"train_loss": -28.01011085510254, "global_step": 597442, "epoch": 7198} {"train_loss": -27.56122398376465, "global_step": 597443, "epoch": 7198} {"train_loss": -27.83607292175293, "global_step": 597444, "epoch": 7198} {"train_loss": -27.680524826049805, "global_step": 597445, "epoch": 7198} {"train_loss": -27.933454513549805, "global_step": 597446, "epoch": 7198} {"train_loss": -27.57356071472168, "global_step": 597447, "epoch": 7198} {"train_loss": -27.27618408203125, "global_step": 597448, "epoch": 7198} {"train_loss": -27.661609649658203, "global_step": 597449, "epoch": 7198} {"train_loss": -27.52858543395996, "global_step": 597450, "epoch": 7198} {"train_loss": -27.837514877319336, "global_step": 597451, "epoch": 7198} {"train_loss": -27.71845817565918, "global_step": 597452, "epoch": 7198} {"train_loss": -27.733652114868164, "global_step": 597453, "epoch": 7198} {"train_loss": -28.248083114624023, "global_step": 597454, "epoch": 7198} {"train_loss": -28.32842445373535, "global_step": 597455, "epoch": 7198} {"train_loss": -27.937747955322266, "global_step": 597456, "epoch": 7198} {"train_loss": -28.19171142578125, "global_step": 597457, "epoch": 7198} {"train_loss": -28.01202964782715, "global_step": 597458, "epoch": 7198} {"train_loss": -28.079294204711914, "global_step": 597459, "epoch": 7198} {"train_loss": -28.079198837280273, "global_step": 597460, "epoch": 7198} {"train_loss": -28.3779296875, "global_step": 597461, "epoch": 7198} {"train_loss": -28.452001571655273, "global_step": 597462, "epoch": 7198} {"train_loss": -28.242307662963867, "global_step": 597463, "epoch": 7198} {"train_loss": -28.3891544342041, "global_step": 597464, "epoch": 7198} {"train_loss": -27.998493194580078, "global_step": 597465, "epoch": 7198} {"train_loss": -28.103626251220703, "global_step": 597466, "epoch": 7198} {"train_loss": -27.943601608276367, "global_step": 597467, "epoch": 7198} {"train_loss": -27.79526710510254, "global_step": 597468, "epoch": 7198} {"train_loss": -28.0087947845459, "global_step": 597469, "epoch": 7198} {"train_loss": -28.294721603393555, "global_step": 597470, "epoch": 7198} {"train_loss": -27.81320571899414, "global_step": 597471, "epoch": 7198} {"train_loss": -27.977325439453125, "global_step": 597472, "epoch": 7198} {"train_loss": -28.381744384765625, "global_step": 597473, "epoch": 7198} {"train_loss": -28.193578720092773, "global_step": 597474, "epoch": 7198} {"train_loss": -28.341089248657227, "global_step": 597475, "epoch": 7198} {"train_loss": -28.124860763549805, "global_step": 597476, "epoch": 7198} {"train_loss": -28.19447135925293, "global_step": 597477, "epoch": 7198} {"train_loss": -27.7429256439209, "global_step": 597478, "epoch": 7198} {"train_loss": -27.77362632751465, "global_step": 597479, "epoch": 7198} {"train_loss": -28.189176559448242, "global_step": 597480, "epoch": 7198} {"train_loss": -28.017377853393555, "global_step": 597481, "epoch": 7198} {"train_loss": -27.70224952697754, "global_step": 597482, "epoch": 7198} {"train_loss": -27.45576286315918, "global_step": 597483, "epoch": 7198} {"train_loss": -28.1490478515625, "global_step": 597484, "epoch": 7198} {"train_loss": -27.692249298095703, "global_step": 597485, "epoch": 7198} {"train_loss": -27.870664596557617, "global_step": 597486, "epoch": 7198} {"train_loss": -27.669727325439453, "global_step": 597487, "epoch": 7198} {"train_loss": -27.64377784729004, "global_step": 597488, "epoch": 7198} {"train_loss": -28.373815536499023, "global_step": 597489, "epoch": 7198} {"train_loss": -27.82533073425293, "global_step": 597490, "epoch": 7198} {"train_loss": -27.467615127563477, "global_step": 597491, "epoch": 7198} {"train_loss": -27.836816787719727, "global_step": 597492, "epoch": 7198} {"train_loss": -27.86004066467285, "global_step": 597493, "epoch": 7198} {"train_loss": -27.666248321533203, "global_step": 597494, "epoch": 7198} {"train_loss": -27.903308868408203, "global_step": 597495, "epoch": 7198} {"train_loss": -27.864404678344727, "global_step": 597496, "epoch": 7198} {"train_loss": -28.021514892578125, "global_step": 597497, "epoch": 7198} {"train_loss": -28.177927017211914, "global_step": 597498, "epoch": 7198} {"train_loss": -27.778039932250977, "global_step": 597499, "epoch": 7198} {"train_loss": -27.92630386352539, "global_step": 597500, "epoch": 7198} {"train_loss": -28.186670303344727, "global_step": 597501, "epoch": 7198} {"train_loss": -28.23122215270996, "global_step": 597502, "epoch": 7198} {"train_loss": -28.008716583251953, "global_step": 597503, "epoch": 7198} {"train_loss": -28.124731063842773, "global_step": 597504, "epoch": 7198} {"train_loss": -27.789630889892578, "global_step": 597505, "epoch": 7198} {"train_loss": -28.198328018188477, "global_step": 597506, "epoch": 7198} {"train_loss": -28.168750762939453, "global_step": 597507, "epoch": 7198} {"train_loss": -28.337223052978516, "global_step": 597508, "epoch": 7198} {"train_loss": -27.7539005279541, "global_step": 597509, "epoch": 7198} {"train_loss": -28.030603408813477, "global_step": 597510, "epoch": 7198} {"train_loss": -28.235586166381836, "global_step": 597511, "epoch": 7198} {"train_loss": -27.64069938659668, "global_step": 597512, "epoch": 7198} {"train_loss": -28.060972213745117, "global_step": 597513, "epoch": 7198} {"train_loss": -27.939762115478516, "global_step": 597514, "epoch": 7198} {"train_loss": -27.89664077758789, "global_step": 597515, "epoch": 7198} {"train_loss": -27.921146806464137, "global_step": 597516, "epoch": 7198, "val_loss": 6541047.0} {"train_loss": -27.886499404907227, "global_step": 597517, "epoch": 7199} {"train_loss": -27.578388214111328, "global_step": 597518, "epoch": 7199} {"train_loss": -27.66094970703125, "global_step": 597519, "epoch": 7199} {"train_loss": -27.497594833374023, "global_step": 597520, "epoch": 7199} {"train_loss": -27.97307777404785, "global_step": 597521, "epoch": 7199} {"train_loss": -27.678205490112305, "global_step": 597522, "epoch": 7199} {"train_loss": -27.524280548095703, "global_step": 597523, "epoch": 7199} {"train_loss": -27.706579208374023, "global_step": 597524, "epoch": 7199} {"train_loss": -27.793684005737305, "global_step": 597525, "epoch": 7199} {"train_loss": -27.560184478759766, "global_step": 597526, "epoch": 7199} {"train_loss": -27.8829402923584, "global_step": 597527, "epoch": 7199} {"train_loss": -27.820514678955078, "global_step": 597528, "epoch": 7199} {"train_loss": -27.910755157470703, "global_step": 597529, "epoch": 7199} {"train_loss": -27.887479782104492, "global_step": 597530, "epoch": 7199} {"train_loss": -27.847265243530273, "global_step": 597531, "epoch": 7199} {"train_loss": -28.005664825439453, "global_step": 597532, "epoch": 7199} {"train_loss": -28.115005493164062, "global_step": 597533, "epoch": 7199} {"train_loss": -27.68867301940918, "global_step": 597534, "epoch": 7199} {"train_loss": -27.985599517822266, "global_step": 597535, "epoch": 7199} {"train_loss": -28.208209991455078, "global_step": 597536, "epoch": 7199} {"train_loss": -28.0648136138916, "global_step": 597537, "epoch": 7199} {"train_loss": -28.229413986206055, "global_step": 597538, "epoch": 7199} {"train_loss": -27.783599853515625, "global_step": 597539, "epoch": 7199} {"train_loss": -28.009626388549805, "global_step": 597540, "epoch": 7199} {"train_loss": -28.084152221679688, "global_step": 597541, "epoch": 7199} {"train_loss": -27.914081573486328, "global_step": 597542, "epoch": 7199} {"train_loss": -27.97028923034668, "global_step": 597543, "epoch": 7199} {"train_loss": -28.029102325439453, "global_step": 597544, "epoch": 7199} {"train_loss": -28.079687118530273, "global_step": 597545, "epoch": 7199} {"train_loss": -28.14572525024414, "global_step": 597546, "epoch": 7199} {"train_loss": -27.995136260986328, "global_step": 597547, "epoch": 7199} {"train_loss": -27.86100196838379, "global_step": 597548, "epoch": 7199} {"train_loss": -27.96860694885254, "global_step": 597549, "epoch": 7199} {"train_loss": -28.239866256713867, "global_step": 597550, "epoch": 7199} {"train_loss": -27.760705947875977, "global_step": 597551, "epoch": 7199} {"train_loss": -27.93906021118164, "global_step": 597552, "epoch": 7199} {"train_loss": -28.32570457458496, "global_step": 597553, "epoch": 7199} {"train_loss": -27.84649658203125, "global_step": 597554, "epoch": 7199} {"train_loss": -28.3272705078125, "global_step": 597555, "epoch": 7199} {"train_loss": -27.905988693237305, "global_step": 597556, "epoch": 7199} {"train_loss": -27.992712020874023, "global_step": 597557, "epoch": 7199} {"train_loss": -28.42609977722168, "global_step": 597558, "epoch": 7199} {"train_loss": -28.004669189453125, "global_step": 597559, "epoch": 7199} {"train_loss": -27.717519760131836, "global_step": 597560, "epoch": 7199} {"train_loss": -28.26095962524414, "global_step": 597561, "epoch": 7199} {"train_loss": -28.403141021728516, "global_step": 597562, "epoch": 7199} {"train_loss": -28.33698844909668, "global_step": 597563, "epoch": 7199} {"train_loss": -28.115570068359375, "global_step": 597564, "epoch": 7199} {"train_loss": -28.2191162109375, "global_step": 597565, "epoch": 7199} {"train_loss": -28.369482040405273, "global_step": 597566, "epoch": 7199} {"train_loss": -27.952438354492188, "global_step": 597567, "epoch": 7199} {"train_loss": -28.078027725219727, "global_step": 597568, "epoch": 7199} {"train_loss": -27.920093536376953, "global_step": 597569, "epoch": 7199} {"train_loss": -27.600692749023438, "global_step": 597570, "epoch": 7199} {"train_loss": -27.8259220123291, "global_step": 597571, "epoch": 7199} {"train_loss": -28.025243759155273, "global_step": 597572, "epoch": 7199} {"train_loss": -27.980131149291992, "global_step": 597573, "epoch": 7199} {"train_loss": -27.93671989440918, "global_step": 597574, "epoch": 7199} {"train_loss": -28.201902389526367, "global_step": 597575, "epoch": 7199} {"train_loss": -27.830102920532227, "global_step": 597576, "epoch": 7199} {"train_loss": -28.162954330444336, "global_step": 597577, "epoch": 7199} {"train_loss": -27.955575942993164, "global_step": 597578, "epoch": 7199} {"train_loss": -27.992170333862305, "global_step": 597579, "epoch": 7199} {"train_loss": -28.052326202392578, "global_step": 597580, "epoch": 7199} {"train_loss": -28.016021728515625, "global_step": 597581, "epoch": 7199} {"train_loss": -27.761688232421875, "global_step": 597582, "epoch": 7199} {"train_loss": -28.148578643798828, "global_step": 597583, "epoch": 7199} {"train_loss": -28.5351505279541, "global_step": 597584, "epoch": 7199} {"train_loss": -28.10883903503418, "global_step": 597585, "epoch": 7199} {"train_loss": -27.96481704711914, "global_step": 597586, "epoch": 7199} {"train_loss": -28.664936065673828, "global_step": 597587, "epoch": 7199} {"train_loss": -27.97543716430664, "global_step": 597588, "epoch": 7199} {"train_loss": -27.93265151977539, "global_step": 597589, "epoch": 7199} {"train_loss": -27.929296493530273, "global_step": 597590, "epoch": 7199} {"train_loss": -28.401880264282227, "global_step": 597591, "epoch": 7199} {"train_loss": -28.02569580078125, "global_step": 597592, "epoch": 7199} {"train_loss": -27.691511154174805, "global_step": 597593, "epoch": 7199} {"train_loss": -27.734811782836914, "global_step": 597594, "epoch": 7199} {"train_loss": -27.137235641479492, "global_step": 597595, "epoch": 7199} {"train_loss": -28.23369789123535, "global_step": 597596, "epoch": 7199} {"train_loss": -27.75641441345215, "global_step": 597597, "epoch": 7199} {"train_loss": -27.647796630859375, "global_step": 597598, "epoch": 7199} {"train_loss": -27.9830219084958, "global_step": 597599, "epoch": 7199, "val_loss": 6607496.0} {"train_loss": -27.492786407470703, "global_step": 597600, "epoch": 7200} {"train_loss": -27.587512969970703, "global_step": 597601, "epoch": 7200} {"train_loss": -27.624265670776367, "global_step": 597602, "epoch": 7200} {"train_loss": -27.954153060913086, "global_step": 597603, "epoch": 7200} {"train_loss": -27.832828521728516, "global_step": 597604, "epoch": 7200} {"train_loss": -27.532262802124023, "global_step": 597605, "epoch": 7200} {"train_loss": -27.957691192626953, "global_step": 597606, "epoch": 7200} {"train_loss": -27.1458683013916, "global_step": 597607, "epoch": 7200} {"train_loss": -27.50973892211914, "global_step": 597608, "epoch": 7200} {"train_loss": -27.754980087280273, "global_step": 597609, "epoch": 7200} {"train_loss": -27.6677188873291, "global_step": 597610, "epoch": 7200} {"train_loss": -27.777984619140625, "global_step": 597611, "epoch": 7200} {"train_loss": -28.005765914916992, "global_step": 597612, "epoch": 7200} {"train_loss": -27.749526977539062, "global_step": 597613, "epoch": 7200} {"train_loss": -27.958683013916016, "global_step": 597614, "epoch": 7200} {"train_loss": -27.8388729095459, "global_step": 597615, "epoch": 7200} {"train_loss": -27.786834716796875, "global_step": 597616, "epoch": 7200} {"train_loss": -28.057727813720703, "global_step": 597617, "epoch": 7200} {"train_loss": -27.957494735717773, "global_step": 597618, "epoch": 7200} {"train_loss": -27.889795303344727, "global_step": 597619, "epoch": 7200} {"train_loss": -28.113367080688477, "global_step": 597620, "epoch": 7200} {"train_loss": -28.170408248901367, "global_step": 597621, "epoch": 7200} {"train_loss": -27.912145614624023, "global_step": 597622, "epoch": 7200} {"train_loss": -28.17081069946289, "global_step": 597623, "epoch": 7200} {"train_loss": -27.958532333374023, "global_step": 597624, "epoch": 7200} {"train_loss": -28.211490631103516, "global_step": 597625, "epoch": 7200} {"train_loss": -27.91925048828125, "global_step": 597626, "epoch": 7200} {"train_loss": -27.808069229125977, "global_step": 597627, "epoch": 7200} {"train_loss": -27.794849395751953, "global_step": 597628, "epoch": 7200} {"train_loss": -28.111499786376953, "global_step": 597629, "epoch": 7200} {"train_loss": -27.800283432006836, "global_step": 597630, "epoch": 7200} {"train_loss": -27.903858184814453, "global_step": 597631, "epoch": 7200} {"train_loss": -27.976179122924805, "global_step": 597632, "epoch": 7200} {"train_loss": -28.085214614868164, "global_step": 597633, "epoch": 7200} {"train_loss": -27.65283203125, "global_step": 597634, "epoch": 7200} {"train_loss": -27.886667251586914, "global_step": 597635, "epoch": 7200} {"train_loss": -28.074934005737305, "global_step": 597636, "epoch": 7200} {"train_loss": -28.480192184448242, "global_step": 597637, "epoch": 7200} {"train_loss": -28.30610466003418, "global_step": 597638, "epoch": 7200} {"train_loss": -28.006208419799805, "global_step": 597639, "epoch": 7200} {"train_loss": -28.33343505859375, "global_step": 597640, "epoch": 7200} {"train_loss": -28.219898223876953, "global_step": 597641, "epoch": 7200} {"train_loss": -28.16008949279785, "global_step": 597642, "epoch": 7200} {"train_loss": -27.9163761138916, "global_step": 597643, "epoch": 7200} {"train_loss": -28.0947322845459, "global_step": 597644, "epoch": 7200} {"train_loss": -28.20684814453125, "global_step": 597645, "epoch": 7200} {"train_loss": -28.221710205078125, "global_step": 597646, "epoch": 7200} {"train_loss": -28.155500411987305, "global_step": 597647, "epoch": 7200} {"train_loss": -28.34649658203125, "global_step": 597648, "epoch": 7200} {"train_loss": -27.92218589782715, "global_step": 597649, "epoch": 7200} {"train_loss": -27.732370376586914, "global_step": 597650, "epoch": 7200} {"train_loss": -28.066791534423828, "global_step": 597651, "epoch": 7200} {"train_loss": -27.906946182250977, "global_step": 597652, "epoch": 7200} {"train_loss": -27.8417911529541, "global_step": 597653, "epoch": 7200} {"train_loss": -28.09943199157715, "global_step": 597654, "epoch": 7200} {"train_loss": -28.031702041625977, "global_step": 597655, "epoch": 7200} {"train_loss": -28.0023250579834, "global_step": 597656, "epoch": 7200} {"train_loss": -27.900665283203125, "global_step": 597657, "epoch": 7200} {"train_loss": -28.65009117126465, "global_step": 597658, "epoch": 7200} {"train_loss": -27.66192626953125, "global_step": 597659, "epoch": 7200} {"train_loss": -28.266149520874023, "global_step": 597660, "epoch": 7200} {"train_loss": -28.092060089111328, "global_step": 597661, "epoch": 7200} {"train_loss": -28.421125411987305, "global_step": 597662, "epoch": 7200} {"train_loss": -28.041223526000977, "global_step": 597663, "epoch": 7200} {"train_loss": -27.97943115234375, "global_step": 597664, "epoch": 7200} {"train_loss": -27.501020431518555, "global_step": 597665, "epoch": 7200} {"train_loss": -28.131622314453125, "global_step": 597666, "epoch": 7200} {"train_loss": -27.971288681030273, "global_step": 597667, "epoch": 7200} {"train_loss": -28.20599365234375, "global_step": 597668, "epoch": 7200} {"train_loss": -27.909133911132812, "global_step": 597669, "epoch": 7200} {"train_loss": -28.319055557250977, "global_step": 597670, "epoch": 7200} {"train_loss": -28.39103126525879, "global_step": 597671, "epoch": 7200} {"train_loss": -27.914749145507812, "global_step": 597672, "epoch": 7200} {"train_loss": -28.358991622924805, "global_step": 597673, "epoch": 7200} {"train_loss": -28.43890953063965, "global_step": 597674, "epoch": 7200} {"train_loss": -27.845901489257812, "global_step": 597675, "epoch": 7200} {"train_loss": -28.237518310546875, "global_step": 597676, "epoch": 7200} {"train_loss": -28.08051872253418, "global_step": 597677, "epoch": 7200} {"train_loss": -27.88923454284668, "global_step": 597678, "epoch": 7200} {"train_loss": -28.1874942779541, "global_step": 597679, "epoch": 7200} {"train_loss": -28.1510066986084, "global_step": 597680, "epoch": 7200} {"train_loss": -27.971023559570312, "global_step": 597681, "epoch": 7200} {"train_loss": -27.9785058814359, "global_step": 597682, "epoch": 7200, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6556879.0} {"train_loss": -27.441253662109375, "global_step": 597683, "epoch": 7201} {"train_loss": -26.873889923095703, "global_step": 597684, "epoch": 7201} {"train_loss": -27.6612491607666, "global_step": 597685, "epoch": 7201} {"train_loss": -27.871536254882812, "global_step": 597686, "epoch": 7201} {"train_loss": -27.385766983032227, "global_step": 597687, "epoch": 7201} {"train_loss": -27.314090728759766, "global_step": 597688, "epoch": 7201} {"train_loss": -27.369421005249023, "global_step": 597689, "epoch": 7201} {"train_loss": -27.521631240844727, "global_step": 597690, "epoch": 7201} {"train_loss": -27.295166015625, "global_step": 597691, "epoch": 7201} {"train_loss": -27.701770782470703, "global_step": 597692, "epoch": 7201} {"train_loss": -27.721790313720703, "global_step": 597693, "epoch": 7201} {"train_loss": -27.866621017456055, "global_step": 597694, "epoch": 7201} {"train_loss": -27.644201278686523, "global_step": 597695, "epoch": 7201} {"train_loss": -27.817626953125, "global_step": 597696, "epoch": 7201} {"train_loss": -27.540283203125, "global_step": 597697, "epoch": 7201} {"train_loss": -27.751840591430664, "global_step": 597698, "epoch": 7201} {"train_loss": -28.023679733276367, "global_step": 597699, "epoch": 7201} {"train_loss": -27.742507934570312, "global_step": 597700, "epoch": 7201} {"train_loss": -27.857635498046875, "global_step": 597701, "epoch": 7201} {"train_loss": -28.07990074157715, "global_step": 597702, "epoch": 7201} {"train_loss": -27.967863082885742, "global_step": 597703, "epoch": 7201} {"train_loss": -28.17618179321289, "global_step": 597704, "epoch": 7201} {"train_loss": -28.08481788635254, "global_step": 597705, "epoch": 7201} {"train_loss": -27.83233642578125, "global_step": 597706, "epoch": 7201} {"train_loss": -27.75146484375, "global_step": 597707, "epoch": 7201} {"train_loss": -28.191816329956055, "global_step": 597708, "epoch": 7201} {"train_loss": -28.366735458374023, "global_step": 597709, "epoch": 7201} {"train_loss": -27.88347816467285, "global_step": 597710, "epoch": 7201} {"train_loss": -28.097787857055664, "global_step": 597711, "epoch": 7201} {"train_loss": -28.315641403198242, "global_step": 597712, "epoch": 7201} {"train_loss": -28.0472469329834, "global_step": 597713, "epoch": 7201} {"train_loss": -27.841053009033203, "global_step": 597714, "epoch": 7201} {"train_loss": -28.061477661132812, "global_step": 597715, "epoch": 7201} {"train_loss": -28.27849769592285, "global_step": 597716, "epoch": 7201} {"train_loss": -27.95612907409668, "global_step": 597717, "epoch": 7201} {"train_loss": -27.98785972595215, "global_step": 597718, "epoch": 7201} {"train_loss": -28.14946937561035, "global_step": 597719, "epoch": 7201} {"train_loss": -28.268964767456055, "global_step": 597720, "epoch": 7201} {"train_loss": -28.0955867767334, "global_step": 597721, "epoch": 7201} {"train_loss": -27.8311767578125, "global_step": 597722, "epoch": 7201} {"train_loss": -27.540180206298828, "global_step": 597723, "epoch": 7201} {"train_loss": -28.350324630737305, "global_step": 597724, "epoch": 7201} {"train_loss": -27.84586524963379, "global_step": 597725, "epoch": 7201} {"train_loss": -27.617712020874023, "global_step": 597726, "epoch": 7201} {"train_loss": -27.987594604492188, "global_step": 597727, "epoch": 7201} {"train_loss": -27.82295799255371, "global_step": 597728, "epoch": 7201} {"train_loss": -27.7806453704834, "global_step": 597729, "epoch": 7201} {"train_loss": -28.029254913330078, "global_step": 597730, "epoch": 7201} {"train_loss": -27.902191162109375, "global_step": 597731, "epoch": 7201} {"train_loss": -27.651288986206055, "global_step": 597732, "epoch": 7201} {"train_loss": -28.06062889099121, "global_step": 597733, "epoch": 7201} {"train_loss": -27.90789794921875, "global_step": 597734, "epoch": 7201} {"train_loss": -27.91560173034668, "global_step": 597735, "epoch": 7201} {"train_loss": -28.257410049438477, "global_step": 597736, "epoch": 7201} {"train_loss": -28.09246826171875, "global_step": 597737, "epoch": 7201} {"train_loss": -27.743581771850586, "global_step": 597738, "epoch": 7201} {"train_loss": -27.934406280517578, "global_step": 597739, "epoch": 7201} {"train_loss": -27.968358993530273, "global_step": 597740, "epoch": 7201} {"train_loss": -27.744054794311523, "global_step": 597741, "epoch": 7201} {"train_loss": -27.599048614501953, "global_step": 597742, "epoch": 7201} {"train_loss": -28.28643798828125, "global_step": 597743, "epoch": 7201} {"train_loss": -27.9837589263916, "global_step": 597744, "epoch": 7201} {"train_loss": -27.628854751586914, "global_step": 597745, "epoch": 7201} {"train_loss": -27.719562530517578, "global_step": 597746, "epoch": 7201} {"train_loss": -27.786380767822266, "global_step": 597747, "epoch": 7201} {"train_loss": -28.414541244506836, "global_step": 597748, "epoch": 7201} {"train_loss": -27.92435073852539, "global_step": 597749, "epoch": 7201} {"train_loss": -28.001300811767578, "global_step": 597750, "epoch": 7201} {"train_loss": -27.600086212158203, "global_step": 597751, "epoch": 7201} {"train_loss": -27.825292587280273, "global_step": 597752, "epoch": 7201} {"train_loss": -27.78363037109375, "global_step": 597753, "epoch": 7201} {"train_loss": -28.043691635131836, "global_step": 597754, "epoch": 7201} {"train_loss": -27.944971084594727, "global_step": 597755, "epoch": 7201} {"train_loss": -27.90974235534668, "global_step": 597756, "epoch": 7201} {"train_loss": -27.899866104125977, "global_step": 597757, "epoch": 7201} {"train_loss": -28.01325035095215, "global_step": 597758, "epoch": 7201} {"train_loss": -28.570114135742188, "global_step": 597759, "epoch": 7201} {"train_loss": -28.36722755432129, "global_step": 597760, "epoch": 7201} {"train_loss": -27.921072006225586, "global_step": 597761, "epoch": 7201} {"train_loss": -28.31135368347168, "global_step": 597762, "epoch": 7201} {"train_loss": -28.196918487548828, "global_step": 597763, "epoch": 7201} {"train_loss": -28.200193405151367, "global_step": 597764, "epoch": 7201} {"train_loss": -27.916477846812054, "global_step": 597765, "epoch": 7201, "val_loss": 6638091.5} {"train_loss": -27.181238174438477, "global_step": 597766, "epoch": 7202} {"train_loss": -27.428543090820312, "global_step": 597767, "epoch": 7202} {"train_loss": -27.382465362548828, "global_step": 597768, "epoch": 7202} {"train_loss": -27.830322265625, "global_step": 597769, "epoch": 7202} {"train_loss": -27.98469352722168, "global_step": 597770, "epoch": 7202} {"train_loss": -27.65960121154785, "global_step": 597771, "epoch": 7202} {"train_loss": -27.80206298828125, "global_step": 597772, "epoch": 7202} {"train_loss": -27.961334228515625, "global_step": 597773, "epoch": 7202} {"train_loss": -27.75434684753418, "global_step": 597774, "epoch": 7202} {"train_loss": -28.06325340270996, "global_step": 597775, "epoch": 7202} {"train_loss": -27.82802391052246, "global_step": 597776, "epoch": 7202} {"train_loss": -27.92512321472168, "global_step": 597777, "epoch": 7202} {"train_loss": -28.105823516845703, "global_step": 597778, "epoch": 7202} {"train_loss": -28.124801635742188, "global_step": 597779, "epoch": 7202} {"train_loss": -27.92236328125, "global_step": 597780, "epoch": 7202} {"train_loss": -27.930694580078125, "global_step": 597781, "epoch": 7202} {"train_loss": -28.185699462890625, "global_step": 597782, "epoch": 7202} {"train_loss": -28.3719539642334, "global_step": 597783, "epoch": 7202} {"train_loss": -27.698383331298828, "global_step": 597784, "epoch": 7202} {"train_loss": -28.216215133666992, "global_step": 597785, "epoch": 7202} {"train_loss": -28.126373291015625, "global_step": 597786, "epoch": 7202} {"train_loss": -27.89396095275879, "global_step": 597787, "epoch": 7202} {"train_loss": -27.920175552368164, "global_step": 597788, "epoch": 7202} {"train_loss": -27.35723876953125, "global_step": 597789, "epoch": 7202} {"train_loss": -27.924463272094727, "global_step": 597790, "epoch": 7202} {"train_loss": -27.270109176635742, "global_step": 597791, "epoch": 7202} {"train_loss": -28.07508659362793, "global_step": 597792, "epoch": 7202} {"train_loss": -27.808629989624023, "global_step": 597793, "epoch": 7202} {"train_loss": -27.98084831237793, "global_step": 597794, "epoch": 7202} {"train_loss": -27.727344512939453, "global_step": 597795, "epoch": 7202} {"train_loss": -27.823978424072266, "global_step": 597796, "epoch": 7202} {"train_loss": -28.08609390258789, "global_step": 597797, "epoch": 7202} {"train_loss": -27.61859130859375, "global_step": 597798, "epoch": 7202} {"train_loss": -27.55521583557129, "global_step": 597799, "epoch": 7202} {"train_loss": -27.837865829467773, "global_step": 597800, "epoch": 7202} {"train_loss": -27.6483211517334, "global_step": 597801, "epoch": 7202} {"train_loss": -27.95234489440918, "global_step": 597802, "epoch": 7202} {"train_loss": -27.535913467407227, "global_step": 597803, "epoch": 7202} {"train_loss": -28.083850860595703, "global_step": 597804, "epoch": 7202} {"train_loss": -27.624948501586914, "global_step": 597805, "epoch": 7202} {"train_loss": -27.82990074157715, "global_step": 597806, "epoch": 7202} {"train_loss": -27.99246597290039, "global_step": 597807, "epoch": 7202} {"train_loss": -28.09381103515625, "global_step": 597808, "epoch": 7202} {"train_loss": -27.493698120117188, "global_step": 597809, "epoch": 7202} {"train_loss": -27.80010414123535, "global_step": 597810, "epoch": 7202} {"train_loss": -27.921899795532227, "global_step": 597811, "epoch": 7202} {"train_loss": -27.9602108001709, "global_step": 597812, "epoch": 7202} {"train_loss": -27.88123893737793, "global_step": 597813, "epoch": 7202} {"train_loss": -27.977075576782227, "global_step": 597814, "epoch": 7202} {"train_loss": -27.7502498626709, "global_step": 597815, "epoch": 7202} {"train_loss": -27.874704360961914, "global_step": 597816, "epoch": 7202} {"train_loss": -27.636932373046875, "global_step": 597817, "epoch": 7202} {"train_loss": -27.986059188842773, "global_step": 597818, "epoch": 7202} {"train_loss": -28.507959365844727, "global_step": 597819, "epoch": 7202} {"train_loss": -28.2556209564209, "global_step": 597820, "epoch": 7202} {"train_loss": -27.78188133239746, "global_step": 597821, "epoch": 7202} {"train_loss": -28.26761817932129, "global_step": 597822, "epoch": 7202} {"train_loss": -27.880369186401367, "global_step": 597823, "epoch": 7202} {"train_loss": -27.86481285095215, "global_step": 597824, "epoch": 7202} {"train_loss": -28.172849655151367, "global_step": 597825, "epoch": 7202} {"train_loss": -27.516681671142578, "global_step": 597826, "epoch": 7202} {"train_loss": -27.8992919921875, "global_step": 597827, "epoch": 7202} {"train_loss": -27.849430084228516, "global_step": 597828, "epoch": 7202} {"train_loss": -28.04963493347168, "global_step": 597829, "epoch": 7202} {"train_loss": -27.698389053344727, "global_step": 597830, "epoch": 7202} {"train_loss": -28.11689567565918, "global_step": 597831, "epoch": 7202} {"train_loss": -28.270156860351562, "global_step": 597832, "epoch": 7202} {"train_loss": -28.105337142944336, "global_step": 597833, "epoch": 7202} {"train_loss": -27.86602783203125, "global_step": 597834, "epoch": 7202} {"train_loss": -27.991901397705078, "global_step": 597835, "epoch": 7202} {"train_loss": -27.938528060913086, "global_step": 597836, "epoch": 7202} {"train_loss": -28.115076065063477, "global_step": 597837, "epoch": 7202} {"train_loss": -27.928119659423828, "global_step": 597838, "epoch": 7202} {"train_loss": -27.89764976501465, "global_step": 597839, "epoch": 7202} {"train_loss": -28.01340675354004, "global_step": 597840, "epoch": 7202} {"train_loss": -27.61795997619629, "global_step": 597841, "epoch": 7202} {"train_loss": -27.93305778503418, "global_step": 597842, "epoch": 7202} {"train_loss": -27.732099533081055, "global_step": 597843, "epoch": 7202} {"train_loss": -27.897079467773438, "global_step": 597844, "epoch": 7202} {"train_loss": -27.84992790222168, "global_step": 597845, "epoch": 7202} {"train_loss": -28.084699630737305, "global_step": 597846, "epoch": 7202} {"train_loss": -28.47991943359375, "global_step": 597847, "epoch": 7202} {"train_loss": -27.89983466734369, "global_step": 597848, "epoch": 7202, "val_loss": 6578255.0} {"train_loss": -24.635841369628906, "global_step": 597849, "epoch": 7203} {"train_loss": -25.295040130615234, "global_step": 597850, "epoch": 7203} {"train_loss": -26.786954879760742, "global_step": 597851, "epoch": 7203} {"train_loss": -25.857498168945312, "global_step": 597852, "epoch": 7203} {"train_loss": -26.811498641967773, "global_step": 597853, "epoch": 7203} {"train_loss": -26.161962509155273, "global_step": 597854, "epoch": 7203} {"train_loss": -26.6507568359375, "global_step": 597855, "epoch": 7203} {"train_loss": -26.357465744018555, "global_step": 597856, "epoch": 7203} {"train_loss": -26.95539665222168, "global_step": 597857, "epoch": 7203} {"train_loss": -26.623138427734375, "global_step": 597858, "epoch": 7203} {"train_loss": -26.856908798217773, "global_step": 597859, "epoch": 7203} {"train_loss": -27.081052780151367, "global_step": 597860, "epoch": 7203} {"train_loss": -27.195287704467773, "global_step": 597861, "epoch": 7203} {"train_loss": -27.12835693359375, "global_step": 597862, "epoch": 7203} {"train_loss": -26.96235466003418, "global_step": 597863, "epoch": 7203} {"train_loss": -27.20730972290039, "global_step": 597864, "epoch": 7203} {"train_loss": -27.220861434936523, "global_step": 597865, "epoch": 7203} {"train_loss": -27.117706298828125, "global_step": 597866, "epoch": 7203} {"train_loss": -27.58546257019043, "global_step": 597867, "epoch": 7203} {"train_loss": -27.646652221679688, "global_step": 597868, "epoch": 7203} {"train_loss": -26.98331069946289, "global_step": 597869, "epoch": 7203} {"train_loss": -27.449697494506836, "global_step": 597870, "epoch": 7203} {"train_loss": -27.53727149963379, "global_step": 597871, "epoch": 7203} {"train_loss": -27.364444732666016, "global_step": 597872, "epoch": 7203} {"train_loss": -27.215112686157227, "global_step": 597873, "epoch": 7203} {"train_loss": -27.47113609313965, "global_step": 597874, "epoch": 7203} {"train_loss": -27.610183715820312, "global_step": 597875, "epoch": 7203} {"train_loss": -27.344348907470703, "global_step": 597876, "epoch": 7203} {"train_loss": -27.51125144958496, "global_step": 597877, "epoch": 7203} {"train_loss": -27.6954402923584, "global_step": 597878, "epoch": 7203} {"train_loss": -27.539031982421875, "global_step": 597879, "epoch": 7203} {"train_loss": -27.872955322265625, "global_step": 597880, "epoch": 7203} {"train_loss": -27.683618545532227, "global_step": 597881, "epoch": 7203} {"train_loss": -27.471729278564453, "global_step": 597882, "epoch": 7203} {"train_loss": -27.6774959564209, "global_step": 597883, "epoch": 7203} {"train_loss": -27.68824577331543, "global_step": 597884, "epoch": 7203} {"train_loss": -28.162057876586914, "global_step": 597885, "epoch": 7203} {"train_loss": -27.674779891967773, "global_step": 597886, "epoch": 7203} {"train_loss": -27.605182647705078, "global_step": 597887, "epoch": 7203} {"train_loss": -27.905029296875, "global_step": 597888, "epoch": 7203} {"train_loss": -27.991840362548828, "global_step": 597889, "epoch": 7203} {"train_loss": -27.769073486328125, "global_step": 597890, "epoch": 7203} {"train_loss": -27.823596954345703, "global_step": 597891, "epoch": 7203} {"train_loss": -27.94172477722168, "global_step": 597892, "epoch": 7203} {"train_loss": -27.89664077758789, "global_step": 597893, "epoch": 7203} {"train_loss": -27.980865478515625, "global_step": 597894, "epoch": 7203} {"train_loss": -28.074573516845703, "global_step": 597895, "epoch": 7203} {"train_loss": -28.257434844970703, "global_step": 597896, "epoch": 7203} {"train_loss": -28.38495445251465, "global_step": 597897, "epoch": 7203} {"train_loss": -28.112884521484375, "global_step": 597898, "epoch": 7203} {"train_loss": -27.82899284362793, "global_step": 597899, "epoch": 7203} {"train_loss": -27.67982292175293, "global_step": 597900, "epoch": 7203} {"train_loss": -28.041105270385742, "global_step": 597901, "epoch": 7203} {"train_loss": -27.961822509765625, "global_step": 597902, "epoch": 7203} {"train_loss": -28.050048828125, "global_step": 597903, "epoch": 7203} {"train_loss": -27.9785213470459, "global_step": 597904, "epoch": 7203} {"train_loss": -28.466550827026367, "global_step": 597905, "epoch": 7203} {"train_loss": -28.017892837524414, "global_step": 597906, "epoch": 7203} {"train_loss": -28.15155601501465, "global_step": 597907, "epoch": 7203} {"train_loss": -27.899433135986328, "global_step": 597908, "epoch": 7203} {"train_loss": -28.30755043029785, "global_step": 597909, "epoch": 7203} {"train_loss": -28.115842819213867, "global_step": 597910, "epoch": 7203} {"train_loss": -28.044189453125, "global_step": 597911, "epoch": 7203} {"train_loss": -27.622594833374023, "global_step": 597912, "epoch": 7203} {"train_loss": -27.949872970581055, "global_step": 597913, "epoch": 7203} {"train_loss": -27.64361000061035, "global_step": 597914, "epoch": 7203} {"train_loss": -27.885009765625, "global_step": 597915, "epoch": 7203} {"train_loss": -27.683088302612305, "global_step": 597916, "epoch": 7203} {"train_loss": -27.768224716186523, "global_step": 597917, "epoch": 7203} {"train_loss": -28.121931076049805, "global_step": 597918, "epoch": 7203} {"train_loss": -27.84108543395996, "global_step": 597919, "epoch": 7203} {"train_loss": -27.712921142578125, "global_step": 597920, "epoch": 7203} {"train_loss": -28.127832412719727, "global_step": 597921, "epoch": 7203} {"train_loss": -27.92047691345215, "global_step": 597922, "epoch": 7203} {"train_loss": -28.124319076538086, "global_step": 597923, "epoch": 7203} {"train_loss": -28.400373458862305, "global_step": 597924, "epoch": 7203} {"train_loss": -27.93292808532715, "global_step": 597925, "epoch": 7203} {"train_loss": -27.798614501953125, "global_step": 597926, "epoch": 7203} {"train_loss": -28.010486602783203, "global_step": 597927, "epoch": 7203} {"train_loss": -28.514911651611328, "global_step": 597928, "epoch": 7203} {"train_loss": -28.133502960205078, "global_step": 597929, "epoch": 7203} {"train_loss": -27.99860191345215, "global_step": 597930, "epoch": 7203} {"train_loss": -27.571958403989495, "global_step": 597931, "epoch": 7203, "val_loss": 6479312.0} {"train_loss": -28.001184463500977, "global_step": 597932, "epoch": 7204} {"train_loss": -27.272693634033203, "global_step": 597933, "epoch": 7204} {"train_loss": -27.3616886138916, "global_step": 597934, "epoch": 7204} {"train_loss": -27.305273056030273, "global_step": 597935, "epoch": 7204} {"train_loss": -27.373273849487305, "global_step": 597936, "epoch": 7204} {"train_loss": -27.664005279541016, "global_step": 597937, "epoch": 7204} {"train_loss": -27.30620765686035, "global_step": 597938, "epoch": 7204} {"train_loss": -27.487363815307617, "global_step": 597939, "epoch": 7204} {"train_loss": -27.64678955078125, "global_step": 597940, "epoch": 7204} {"train_loss": -27.419885635375977, "global_step": 597941, "epoch": 7204} {"train_loss": -27.446725845336914, "global_step": 597942, "epoch": 7204} {"train_loss": -27.702945709228516, "global_step": 597943, "epoch": 7204} {"train_loss": -27.369953155517578, "global_step": 597944, "epoch": 7204} {"train_loss": -27.874942779541016, "global_step": 597945, "epoch": 7204} {"train_loss": -27.6024112701416, "global_step": 597946, "epoch": 7204} {"train_loss": -27.87613296508789, "global_step": 597947, "epoch": 7204} {"train_loss": -27.856765747070312, "global_step": 597948, "epoch": 7204} {"train_loss": -27.857421875, "global_step": 597949, "epoch": 7204} {"train_loss": -27.535633087158203, "global_step": 597950, "epoch": 7204} {"train_loss": -28.05161476135254, "global_step": 597951, "epoch": 7204} {"train_loss": -28.065237045288086, "global_step": 597952, "epoch": 7204} {"train_loss": -27.494489669799805, "global_step": 597953, "epoch": 7204} {"train_loss": -27.81623649597168, "global_step": 597954, "epoch": 7204} {"train_loss": -27.766965866088867, "global_step": 597955, "epoch": 7204} {"train_loss": -27.745681762695312, "global_step": 597956, "epoch": 7204} {"train_loss": -27.858875274658203, "global_step": 597957, "epoch": 7204} {"train_loss": -28.141510009765625, "global_step": 597958, "epoch": 7204} {"train_loss": -28.075037002563477, "global_step": 597959, "epoch": 7204} {"train_loss": -28.04456901550293, "global_step": 597960, "epoch": 7204} {"train_loss": -28.0897159576416, "global_step": 597961, "epoch": 7204} {"train_loss": -28.072797775268555, "global_step": 597962, "epoch": 7204} {"train_loss": -27.876678466796875, "global_step": 597963, "epoch": 7204} {"train_loss": -28.007801055908203, "global_step": 597964, "epoch": 7204} {"train_loss": -27.95973014831543, "global_step": 597965, "epoch": 7204} {"train_loss": -27.704864501953125, "global_step": 597966, "epoch": 7204} {"train_loss": -28.065433502197266, "global_step": 597967, "epoch": 7204} {"train_loss": -28.212839126586914, "global_step": 597968, "epoch": 7204} {"train_loss": -28.309797286987305, "global_step": 597969, "epoch": 7204} {"train_loss": -28.05389404296875, "global_step": 597970, "epoch": 7204} {"train_loss": -28.202762603759766, "global_step": 597971, "epoch": 7204} {"train_loss": -28.146514892578125, "global_step": 597972, "epoch": 7204} {"train_loss": -28.4525203704834, "global_step": 597973, "epoch": 7204} {"train_loss": -28.36832618713379, "global_step": 597974, "epoch": 7204} {"train_loss": -28.14021110534668, "global_step": 597975, "epoch": 7204} {"train_loss": -28.3759708404541, "global_step": 597976, "epoch": 7204} {"train_loss": -28.172149658203125, "global_step": 597977, "epoch": 7204} {"train_loss": -28.459577560424805, "global_step": 597978, "epoch": 7204} {"train_loss": -28.272497177124023, "global_step": 597979, "epoch": 7204} {"train_loss": -28.5897216796875, "global_step": 597980, "epoch": 7204} {"train_loss": -28.327768325805664, "global_step": 597981, "epoch": 7204} {"train_loss": -28.441242218017578, "global_step": 597982, "epoch": 7204} {"train_loss": -28.490575790405273, "global_step": 597983, "epoch": 7204} {"train_loss": -28.281782150268555, "global_step": 597984, "epoch": 7204} {"train_loss": -27.648218154907227, "global_step": 597985, "epoch": 7204} {"train_loss": -28.196182250976562, "global_step": 597986, "epoch": 7204} {"train_loss": -28.224796295166016, "global_step": 597987, "epoch": 7204} {"train_loss": -27.83442497253418, "global_step": 597988, "epoch": 7204} {"train_loss": -26.825763702392578, "global_step": 597989, "epoch": 7204} {"train_loss": -26.454431533813477, "global_step": 597990, "epoch": 7204} {"train_loss": -26.116613388061523, "global_step": 597991, "epoch": 7204} {"train_loss": -24.96384048461914, "global_step": 597992, "epoch": 7204} {"train_loss": -25.16098403930664, "global_step": 597993, "epoch": 7204} {"train_loss": -27.371795654296875, "global_step": 597994, "epoch": 7204} {"train_loss": -27.39845848083496, "global_step": 597995, "epoch": 7204} {"train_loss": -27.14149284362793, "global_step": 597996, "epoch": 7204} {"train_loss": -27.27703285217285, "global_step": 597997, "epoch": 7204} {"train_loss": -27.605792999267578, "global_step": 597998, "epoch": 7204} {"train_loss": -27.400732040405273, "global_step": 597999, "epoch": 7204} {"train_loss": -27.437301635742188, "global_step": 598000, "epoch": 7204} {"train_loss": -27.400999069213867, "global_step": 598001, "epoch": 7204} {"train_loss": -27.523807525634766, "global_step": 598002, "epoch": 7204} {"train_loss": -27.446557998657227, "global_step": 598003, "epoch": 7204} {"train_loss": -27.393259048461914, "global_step": 598004, "epoch": 7204} {"train_loss": -27.5073184967041, "global_step": 598005, "epoch": 7204} {"train_loss": -27.667377471923828, "global_step": 598006, "epoch": 7204} {"train_loss": -27.471637725830078, "global_step": 598007, "epoch": 7204} {"train_loss": -27.636249542236328, "global_step": 598008, "epoch": 7204} {"train_loss": -27.729963302612305, "global_step": 598009, "epoch": 7204} {"train_loss": -27.9320068359375, "global_step": 598010, "epoch": 7204} {"train_loss": -28.043792724609375, "global_step": 598011, "epoch": 7204} {"train_loss": -27.82313346862793, "global_step": 598012, "epoch": 7204} {"train_loss": -28.0772647857666, "global_step": 598013, "epoch": 7204} {"train_loss": -27.729639444006494, "global_step": 598014, "epoch": 7204, "val_loss": 6599258.5} {"train_loss": -27.128015518188477, "global_step": 598015, "epoch": 7205} {"train_loss": -27.420713424682617, "global_step": 598016, "epoch": 7205} {"train_loss": -27.292184829711914, "global_step": 598017, "epoch": 7205} {"train_loss": -27.32444190979004, "global_step": 598018, "epoch": 7205} {"train_loss": -27.9638614654541, "global_step": 598019, "epoch": 7205} {"train_loss": -28.123361587524414, "global_step": 598020, "epoch": 7205} {"train_loss": -27.491437911987305, "global_step": 598021, "epoch": 7205} {"train_loss": -28.05293083190918, "global_step": 598022, "epoch": 7205} {"train_loss": -27.541412353515625, "global_step": 598023, "epoch": 7205} {"train_loss": -27.8343448638916, "global_step": 598024, "epoch": 7205} {"train_loss": -27.950170516967773, "global_step": 598025, "epoch": 7205} {"train_loss": -27.1451473236084, "global_step": 598026, "epoch": 7205} {"train_loss": -27.87758445739746, "global_step": 598027, "epoch": 7205} {"train_loss": -27.496938705444336, "global_step": 598028, "epoch": 7205} {"train_loss": -27.96826171875, "global_step": 598029, "epoch": 7205} {"train_loss": -27.53071403503418, "global_step": 598030, "epoch": 7205} {"train_loss": -27.65300941467285, "global_step": 598031, "epoch": 7205} {"train_loss": -27.886768341064453, "global_step": 598032, "epoch": 7205} {"train_loss": -28.28339195251465, "global_step": 598033, "epoch": 7205} {"train_loss": -27.895322799682617, "global_step": 598034, "epoch": 7205} {"train_loss": -28.065414428710938, "global_step": 598035, "epoch": 7205} {"train_loss": -27.8909969329834, "global_step": 598036, "epoch": 7205} {"train_loss": -27.95526123046875, "global_step": 598037, "epoch": 7205} {"train_loss": -27.84699821472168, "global_step": 598038, "epoch": 7205} {"train_loss": -28.105289459228516, "global_step": 598039, "epoch": 7205} {"train_loss": -28.058536529541016, "global_step": 598040, "epoch": 7205} {"train_loss": -28.233312606811523, "global_step": 598041, "epoch": 7205} {"train_loss": -28.123544692993164, "global_step": 598042, "epoch": 7205} {"train_loss": -28.44159507751465, "global_step": 598043, "epoch": 7205} {"train_loss": -27.905670166015625, "global_step": 598044, "epoch": 7205} {"train_loss": -28.08220863342285, "global_step": 598045, "epoch": 7205} {"train_loss": -27.99232292175293, "global_step": 598046, "epoch": 7205} {"train_loss": -27.928823471069336, "global_step": 598047, "epoch": 7205} {"train_loss": -27.644683837890625, "global_step": 598048, "epoch": 7205} {"train_loss": -27.988739013671875, "global_step": 598049, "epoch": 7205} {"train_loss": -28.228219985961914, "global_step": 598050, "epoch": 7205} {"train_loss": -28.035558700561523, "global_step": 598051, "epoch": 7205} {"train_loss": -28.379119873046875, "global_step": 598052, "epoch": 7205} {"train_loss": -27.997283935546875, "global_step": 598053, "epoch": 7205} {"train_loss": -28.14190673828125, "global_step": 598054, "epoch": 7205} {"train_loss": -28.201831817626953, "global_step": 598055, "epoch": 7205} {"train_loss": -28.24399185180664, "global_step": 598056, "epoch": 7205} {"train_loss": -27.933218002319336, "global_step": 598057, "epoch": 7205} {"train_loss": -28.258544921875, "global_step": 598058, "epoch": 7205} {"train_loss": -28.16179847717285, "global_step": 598059, "epoch": 7205} {"train_loss": -28.290979385375977, "global_step": 598060, "epoch": 7205} {"train_loss": -27.50897216796875, "global_step": 598061, "epoch": 7205} {"train_loss": -28.187789916992188, "global_step": 598062, "epoch": 7205} {"train_loss": -27.971338272094727, "global_step": 598063, "epoch": 7205} {"train_loss": -28.18451499938965, "global_step": 598064, "epoch": 7205} {"train_loss": -27.642332077026367, "global_step": 598065, "epoch": 7205} {"train_loss": -28.14630699157715, "global_step": 598066, "epoch": 7205} {"train_loss": -28.168354034423828, "global_step": 598067, "epoch": 7205} {"train_loss": -27.975860595703125, "global_step": 598068, "epoch": 7205} {"train_loss": -28.31796646118164, "global_step": 598069, "epoch": 7205} {"train_loss": -28.09842300415039, "global_step": 598070, "epoch": 7205} {"train_loss": -28.27145767211914, "global_step": 598071, "epoch": 7205} {"train_loss": -28.14832878112793, "global_step": 598072, "epoch": 7205} {"train_loss": -27.9959659576416, "global_step": 598073, "epoch": 7205} {"train_loss": -28.06507682800293, "global_step": 598074, "epoch": 7205} {"train_loss": -28.000761032104492, "global_step": 598075, "epoch": 7205} {"train_loss": -28.269216537475586, "global_step": 598076, "epoch": 7205} {"train_loss": -28.291767120361328, "global_step": 598077, "epoch": 7205} {"train_loss": -28.29853630065918, "global_step": 598078, "epoch": 7205} {"train_loss": -27.801864624023438, "global_step": 598079, "epoch": 7205} {"train_loss": -27.71827507019043, "global_step": 598080, "epoch": 7205} {"train_loss": -28.18599510192871, "global_step": 598081, "epoch": 7205} {"train_loss": -27.764984130859375, "global_step": 598082, "epoch": 7205} {"train_loss": -28.081012725830078, "global_step": 598083, "epoch": 7205} {"train_loss": -28.084793090820312, "global_step": 598084, "epoch": 7205} {"train_loss": -28.374195098876953, "global_step": 598085, "epoch": 7205} {"train_loss": -27.71070671081543, "global_step": 598086, "epoch": 7205} {"train_loss": -27.954919815063477, "global_step": 598087, "epoch": 7205} {"train_loss": -27.329498291015625, "global_step": 598088, "epoch": 7205} {"train_loss": -27.035367965698242, "global_step": 598089, "epoch": 7205} {"train_loss": -27.321552276611328, "global_step": 598090, "epoch": 7205} {"train_loss": -28.003904342651367, "global_step": 598091, "epoch": 7205} {"train_loss": -27.8265380859375, "global_step": 598092, "epoch": 7205} {"train_loss": -27.928739547729492, "global_step": 598093, "epoch": 7205} {"train_loss": -28.03205680847168, "global_step": 598094, "epoch": 7205} {"train_loss": -27.838327407836914, "global_step": 598095, "epoch": 7205} {"train_loss": -27.484006881713867, "global_step": 598096, "epoch": 7205} {"train_loss": -27.90973513959402, "global_step": 598097, "epoch": 7205, "val_loss": 6584365.0} {"train_loss": -27.530750274658203, "global_step": 598098, "epoch": 7206} {"train_loss": -27.37653923034668, "global_step": 598099, "epoch": 7206} {"train_loss": -27.710830688476562, "global_step": 598100, "epoch": 7206} {"train_loss": -27.403079986572266, "global_step": 598101, "epoch": 7206} {"train_loss": -27.613386154174805, "global_step": 598102, "epoch": 7206} {"train_loss": -27.44356346130371, "global_step": 598103, "epoch": 7206} {"train_loss": -27.05521011352539, "global_step": 598104, "epoch": 7206} {"train_loss": -27.872678756713867, "global_step": 598105, "epoch": 7206} {"train_loss": -27.539037704467773, "global_step": 598106, "epoch": 7206} {"train_loss": -27.81511878967285, "global_step": 598107, "epoch": 7206} {"train_loss": -27.527692794799805, "global_step": 598108, "epoch": 7206} {"train_loss": -27.63569450378418, "global_step": 598109, "epoch": 7206} {"train_loss": -27.638538360595703, "global_step": 598110, "epoch": 7206} {"train_loss": -27.725921630859375, "global_step": 598111, "epoch": 7206} {"train_loss": -27.860641479492188, "global_step": 598112, "epoch": 7206} {"train_loss": -27.448566436767578, "global_step": 598113, "epoch": 7206} {"train_loss": -27.65157127380371, "global_step": 598114, "epoch": 7206} {"train_loss": -28.027191162109375, "global_step": 598115, "epoch": 7206} {"train_loss": -28.18781089782715, "global_step": 598116, "epoch": 7206} {"train_loss": -27.711084365844727, "global_step": 598117, "epoch": 7206} {"train_loss": -27.806659698486328, "global_step": 598118, "epoch": 7206} {"train_loss": -27.886327743530273, "global_step": 598119, "epoch": 7206} {"train_loss": -28.119327545166016, "global_step": 598120, "epoch": 7206} {"train_loss": -27.76374626159668, "global_step": 598121, "epoch": 7206} {"train_loss": -28.157880783081055, "global_step": 598122, "epoch": 7206} {"train_loss": -28.2614688873291, "global_step": 598123, "epoch": 7206} {"train_loss": -27.943084716796875, "global_step": 598124, "epoch": 7206} {"train_loss": -28.16410255432129, "global_step": 598125, "epoch": 7206} {"train_loss": -27.588857650756836, "global_step": 598126, "epoch": 7206} {"train_loss": -27.8981990814209, "global_step": 598127, "epoch": 7206} {"train_loss": -28.15570068359375, "global_step": 598128, "epoch": 7206} {"train_loss": -28.152204513549805, "global_step": 598129, "epoch": 7206} {"train_loss": -28.08966064453125, "global_step": 598130, "epoch": 7206} {"train_loss": -28.66814613342285, "global_step": 598131, "epoch": 7206} {"train_loss": -28.444345474243164, "global_step": 598132, "epoch": 7206} {"train_loss": -28.07098388671875, "global_step": 598133, "epoch": 7206} {"train_loss": -28.3853702545166, "global_step": 598134, "epoch": 7206} {"train_loss": -27.96236228942871, "global_step": 598135, "epoch": 7206} {"train_loss": -27.886310577392578, "global_step": 598136, "epoch": 7206} {"train_loss": -28.010107040405273, "global_step": 598137, "epoch": 7206} {"train_loss": -28.1508846282959, "global_step": 598138, "epoch": 7206} {"train_loss": -27.82581901550293, "global_step": 598139, "epoch": 7206} {"train_loss": -28.2160587310791, "global_step": 598140, "epoch": 7206} {"train_loss": -28.02750587463379, "global_step": 598141, "epoch": 7206} {"train_loss": -28.39581298828125, "global_step": 598142, "epoch": 7206} {"train_loss": -28.0731201171875, "global_step": 598143, "epoch": 7206} {"train_loss": -28.283491134643555, "global_step": 598144, "epoch": 7206} {"train_loss": -28.0648193359375, "global_step": 598145, "epoch": 7206} {"train_loss": -28.057321548461914, "global_step": 598146, "epoch": 7206} {"train_loss": -27.796194076538086, "global_step": 598147, "epoch": 7206} {"train_loss": -28.166635513305664, "global_step": 598148, "epoch": 7206} {"train_loss": -28.1765079498291, "global_step": 598149, "epoch": 7206} {"train_loss": -28.20631980895996, "global_step": 598150, "epoch": 7206} {"train_loss": -28.069055557250977, "global_step": 598151, "epoch": 7206} {"train_loss": -28.40974998474121, "global_step": 598152, "epoch": 7206} {"train_loss": -28.093420028686523, "global_step": 598153, "epoch": 7206} {"train_loss": -27.66895866394043, "global_step": 598154, "epoch": 7206} {"train_loss": -27.115127563476562, "global_step": 598155, "epoch": 7206} {"train_loss": -26.799367904663086, "global_step": 598156, "epoch": 7206} {"train_loss": -26.55914306640625, "global_step": 598157, "epoch": 7206} {"train_loss": -26.879419326782227, "global_step": 598158, "epoch": 7206} {"train_loss": -27.71478843688965, "global_step": 598159, "epoch": 7206} {"train_loss": -27.587717056274414, "global_step": 598160, "epoch": 7206} {"train_loss": -27.118207931518555, "global_step": 598161, "epoch": 7206} {"train_loss": -27.15478515625, "global_step": 598162, "epoch": 7206} {"train_loss": -27.180734634399414, "global_step": 598163, "epoch": 7206} {"train_loss": -27.399824142456055, "global_step": 598164, "epoch": 7206} {"train_loss": -27.044605255126953, "global_step": 598165, "epoch": 7206} {"train_loss": -27.877710342407227, "global_step": 598166, "epoch": 7206} {"train_loss": -27.538715362548828, "global_step": 598167, "epoch": 7206} {"train_loss": -27.055118560791016, "global_step": 598168, "epoch": 7206} {"train_loss": -27.271032333374023, "global_step": 598169, "epoch": 7206} {"train_loss": -27.54534339904785, "global_step": 598170, "epoch": 7206} {"train_loss": -27.2418212890625, "global_step": 598171, "epoch": 7206} {"train_loss": -27.46016502380371, "global_step": 598172, "epoch": 7206} {"train_loss": -27.496509552001953, "global_step": 598173, "epoch": 7206} {"train_loss": -27.08563232421875, "global_step": 598174, "epoch": 7206} {"train_loss": -27.32670021057129, "global_step": 598175, "epoch": 7206} {"train_loss": -27.517560958862305, "global_step": 598176, "epoch": 7206} {"train_loss": -27.6269588470459, "global_step": 598177, "epoch": 7206} {"train_loss": -27.722187042236328, "global_step": 598178, "epoch": 7206} {"train_loss": -27.726354598999023, "global_step": 598179, "epoch": 7206} {"train_loss": -27.765179875385332, "global_step": 598180, "epoch": 7206, "val_loss": 6575709.5} {"train_loss": -26.96381187438965, "global_step": 598181, "epoch": 7207} {"train_loss": -27.238224029541016, "global_step": 598182, "epoch": 7207} {"train_loss": -27.36444664001465, "global_step": 598183, "epoch": 7207} {"train_loss": -27.296253204345703, "global_step": 598184, "epoch": 7207} {"train_loss": -27.181737899780273, "global_step": 598185, "epoch": 7207} {"train_loss": -27.790624618530273, "global_step": 598186, "epoch": 7207} {"train_loss": -26.02849769592285, "global_step": 598187, "epoch": 7207} {"train_loss": -27.305133819580078, "global_step": 598188, "epoch": 7207} {"train_loss": -27.60398292541504, "global_step": 598189, "epoch": 7207} {"train_loss": -27.526586532592773, "global_step": 598190, "epoch": 7207} {"train_loss": -27.881372451782227, "global_step": 598191, "epoch": 7207} {"train_loss": -27.67657470703125, "global_step": 598192, "epoch": 7207} {"train_loss": -27.477148056030273, "global_step": 598193, "epoch": 7207} {"train_loss": -27.66278648376465, "global_step": 598194, "epoch": 7207} {"train_loss": -27.927942276000977, "global_step": 598195, "epoch": 7207} {"train_loss": -28.068069458007812, "global_step": 598196, "epoch": 7207} {"train_loss": -27.567224502563477, "global_step": 598197, "epoch": 7207} {"train_loss": -27.669971466064453, "global_step": 598198, "epoch": 7207} {"train_loss": -27.468786239624023, "global_step": 598199, "epoch": 7207} {"train_loss": -27.813751220703125, "global_step": 598200, "epoch": 7207} {"train_loss": -27.47686767578125, "global_step": 598201, "epoch": 7207} {"train_loss": -27.928388595581055, "global_step": 598202, "epoch": 7207} {"train_loss": -27.896581649780273, "global_step": 598203, "epoch": 7207} {"train_loss": -27.575611114501953, "global_step": 598204, "epoch": 7207} {"train_loss": -27.85613441467285, "global_step": 598205, "epoch": 7207} {"train_loss": -27.735437393188477, "global_step": 598206, "epoch": 7207} {"train_loss": -27.90667152404785, "global_step": 598207, "epoch": 7207} {"train_loss": -27.908905029296875, "global_step": 598208, "epoch": 7207} {"train_loss": -27.873403549194336, "global_step": 598209, "epoch": 7207} {"train_loss": -28.120397567749023, "global_step": 598210, "epoch": 7207} {"train_loss": -28.009571075439453, "global_step": 598211, "epoch": 7207} {"train_loss": -27.92054557800293, "global_step": 598212, "epoch": 7207} {"train_loss": -27.91871452331543, "global_step": 598213, "epoch": 7207} {"train_loss": -28.118366241455078, "global_step": 598214, "epoch": 7207} {"train_loss": -28.104421615600586, "global_step": 598215, "epoch": 7207} {"train_loss": -27.822235107421875, "global_step": 598216, "epoch": 7207} {"train_loss": -27.850534439086914, "global_step": 598217, "epoch": 7207} {"train_loss": -28.274072647094727, "global_step": 598218, "epoch": 7207} {"train_loss": -27.86737060546875, "global_step": 598219, "epoch": 7207} {"train_loss": -27.63271141052246, "global_step": 598220, "epoch": 7207} {"train_loss": -28.13715171813965, "global_step": 598221, "epoch": 7207} {"train_loss": -27.898157119750977, "global_step": 598222, "epoch": 7207} {"train_loss": -27.76858901977539, "global_step": 598223, "epoch": 7207} {"train_loss": -28.137189865112305, "global_step": 598224, "epoch": 7207} {"train_loss": -28.1500244140625, "global_step": 598225, "epoch": 7207} {"train_loss": -27.890039443969727, "global_step": 598226, "epoch": 7207} {"train_loss": -28.034515380859375, "global_step": 598227, "epoch": 7207} {"train_loss": -27.918231964111328, "global_step": 598228, "epoch": 7207} {"train_loss": -27.91510581970215, "global_step": 598229, "epoch": 7207} {"train_loss": -28.368749618530273, "global_step": 598230, "epoch": 7207} {"train_loss": -28.0614070892334, "global_step": 598231, "epoch": 7207} {"train_loss": -28.02022361755371, "global_step": 598232, "epoch": 7207} {"train_loss": -28.40494155883789, "global_step": 598233, "epoch": 7207} {"train_loss": -28.077444076538086, "global_step": 598234, "epoch": 7207} {"train_loss": -27.941028594970703, "global_step": 598235, "epoch": 7207} {"train_loss": -27.649404525756836, "global_step": 598236, "epoch": 7207} {"train_loss": -28.012104034423828, "global_step": 598237, "epoch": 7207} {"train_loss": -28.1310977935791, "global_step": 598238, "epoch": 7207} {"train_loss": -28.33454704284668, "global_step": 598239, "epoch": 7207} {"train_loss": -28.278152465820312, "global_step": 598240, "epoch": 7207} {"train_loss": -27.937353134155273, "global_step": 598241, "epoch": 7207} {"train_loss": -28.329740524291992, "global_step": 598242, "epoch": 7207} {"train_loss": -28.13294792175293, "global_step": 598243, "epoch": 7207} {"train_loss": -28.2381649017334, "global_step": 598244, "epoch": 7207} {"train_loss": -28.3150634765625, "global_step": 598245, "epoch": 7207} {"train_loss": -28.143707275390625, "global_step": 598246, "epoch": 7207} {"train_loss": -28.001758575439453, "global_step": 598247, "epoch": 7207} {"train_loss": -28.086170196533203, "global_step": 598248, "epoch": 7207} {"train_loss": -28.112470626831055, "global_step": 598249, "epoch": 7207} {"train_loss": -28.169219970703125, "global_step": 598250, "epoch": 7207} {"train_loss": -27.84332847595215, "global_step": 598251, "epoch": 7207} {"train_loss": -27.90449333190918, "global_step": 598252, "epoch": 7207} {"train_loss": -28.04312515258789, "global_step": 598253, "epoch": 7207} {"train_loss": -27.992212295532227, "global_step": 598254, "epoch": 7207} {"train_loss": -28.375720977783203, "global_step": 598255, "epoch": 7207} {"train_loss": -28.11347770690918, "global_step": 598256, "epoch": 7207} {"train_loss": -27.826780319213867, "global_step": 598257, "epoch": 7207} {"train_loss": -28.161890029907227, "global_step": 598258, "epoch": 7207} {"train_loss": -28.28963279724121, "global_step": 598259, "epoch": 7207} {"train_loss": -28.04874610900879, "global_step": 598260, "epoch": 7207} {"train_loss": -28.233417510986328, "global_step": 598261, "epoch": 7207} {"train_loss": -28.094959259033203, "global_step": 598262, "epoch": 7207} {"train_loss": -27.903179582343043, "global_step": 598263, "epoch": 7207, "val_loss": 6571207.0} {"train_loss": -26.742399215698242, "global_step": 598264, "epoch": 7208} {"train_loss": -26.7150936126709, "global_step": 598265, "epoch": 7208} {"train_loss": -27.488407135009766, "global_step": 598266, "epoch": 7208} {"train_loss": -27.29099464416504, "global_step": 598267, "epoch": 7208} {"train_loss": -26.936208724975586, "global_step": 598268, "epoch": 7208} {"train_loss": -26.52680015563965, "global_step": 598269, "epoch": 7208} {"train_loss": -27.637617111206055, "global_step": 598270, "epoch": 7208} {"train_loss": -27.65875244140625, "global_step": 598271, "epoch": 7208} {"train_loss": -27.220083236694336, "global_step": 598272, "epoch": 7208} {"train_loss": -26.9939022064209, "global_step": 598273, "epoch": 7208} {"train_loss": -27.02907371520996, "global_step": 598274, "epoch": 7208} {"train_loss": -27.00931739807129, "global_step": 598275, "epoch": 7208} {"train_loss": -27.623605728149414, "global_step": 598276, "epoch": 7208} {"train_loss": -26.98394775390625, "global_step": 598277, "epoch": 7208} {"train_loss": -27.499853134155273, "global_step": 598278, "epoch": 7208} {"train_loss": -27.413827896118164, "global_step": 598279, "epoch": 7208} {"train_loss": -27.50965690612793, "global_step": 598280, "epoch": 7208} {"train_loss": -27.61848258972168, "global_step": 598281, "epoch": 7208} {"train_loss": -27.29493522644043, "global_step": 598282, "epoch": 7208} {"train_loss": -27.54742431640625, "global_step": 598283, "epoch": 7208} {"train_loss": -27.4216251373291, "global_step": 598284, "epoch": 7208} {"train_loss": -27.8464412689209, "global_step": 598285, "epoch": 7208} {"train_loss": -27.507287979125977, "global_step": 598286, "epoch": 7208} {"train_loss": -27.457523345947266, "global_step": 598287, "epoch": 7208} {"train_loss": -27.5801944732666, "global_step": 598288, "epoch": 7208} {"train_loss": -27.86371421813965, "global_step": 598289, "epoch": 7208} {"train_loss": -27.608768463134766, "global_step": 598290, "epoch": 7208} {"train_loss": -27.954565048217773, "global_step": 598291, "epoch": 7208} {"train_loss": -28.104833602905273, "global_step": 598292, "epoch": 7208} {"train_loss": -27.706113815307617, "global_step": 598293, "epoch": 7208} {"train_loss": -27.74323844909668, "global_step": 598294, "epoch": 7208} {"train_loss": -27.915679931640625, "global_step": 598295, "epoch": 7208} {"train_loss": -27.801504135131836, "global_step": 598296, "epoch": 7208} {"train_loss": -28.010541915893555, "global_step": 598297, "epoch": 7208} {"train_loss": -28.2257137298584, "global_step": 598298, "epoch": 7208} {"train_loss": -27.86506462097168, "global_step": 598299, "epoch": 7208} {"train_loss": -28.060688018798828, "global_step": 598300, "epoch": 7208} {"train_loss": -28.096115112304688, "global_step": 598301, "epoch": 7208} {"train_loss": -27.663923263549805, "global_step": 598302, "epoch": 7208} {"train_loss": -28.180057525634766, "global_step": 598303, "epoch": 7208} {"train_loss": -28.138601303100586, "global_step": 598304, "epoch": 7208} {"train_loss": -28.15496826171875, "global_step": 598305, "epoch": 7208} {"train_loss": -27.71539878845215, "global_step": 598306, "epoch": 7208} {"train_loss": -27.91023826599121, "global_step": 598307, "epoch": 7208} {"train_loss": -27.963666915893555, "global_step": 598308, "epoch": 7208} {"train_loss": -27.880401611328125, "global_step": 598309, "epoch": 7208} {"train_loss": -28.03032875061035, "global_step": 598310, "epoch": 7208} {"train_loss": -28.06440544128418, "global_step": 598311, "epoch": 7208} {"train_loss": -28.55832862854004, "global_step": 598312, "epoch": 7208} {"train_loss": -28.063962936401367, "global_step": 598313, "epoch": 7208} {"train_loss": -27.829349517822266, "global_step": 598314, "epoch": 7208} {"train_loss": -28.1756649017334, "global_step": 598315, "epoch": 7208} {"train_loss": -28.13028907775879, "global_step": 598316, "epoch": 7208} {"train_loss": -28.620447158813477, "global_step": 598317, "epoch": 7208} {"train_loss": -28.23046875, "global_step": 598318, "epoch": 7208} {"train_loss": -28.261035919189453, "global_step": 598319, "epoch": 7208} {"train_loss": -28.28629493713379, "global_step": 598320, "epoch": 7208} {"train_loss": -28.5931339263916, "global_step": 598321, "epoch": 7208} {"train_loss": -28.3233699798584, "global_step": 598322, "epoch": 7208} {"train_loss": -28.05559730529785, "global_step": 598323, "epoch": 7208} {"train_loss": -28.17291259765625, "global_step": 598324, "epoch": 7208} {"train_loss": -28.339452743530273, "global_step": 598325, "epoch": 7208} {"train_loss": -28.449125289916992, "global_step": 598326, "epoch": 7208} {"train_loss": -28.20655632019043, "global_step": 598327, "epoch": 7208} {"train_loss": -27.925397872924805, "global_step": 598328, "epoch": 7208} {"train_loss": -28.493192672729492, "global_step": 598329, "epoch": 7208} {"train_loss": -27.999486923217773, "global_step": 598330, "epoch": 7208} {"train_loss": -28.0915584564209, "global_step": 598331, "epoch": 7208} {"train_loss": -27.980749130249023, "global_step": 598332, "epoch": 7208} {"train_loss": -27.455305099487305, "global_step": 598333, "epoch": 7208} {"train_loss": -27.40509033203125, "global_step": 598334, "epoch": 7208} {"train_loss": -28.270938873291016, "global_step": 598335, "epoch": 7208} {"train_loss": -27.930524826049805, "global_step": 598336, "epoch": 7208} {"train_loss": -27.72810173034668, "global_step": 598337, "epoch": 7208} {"train_loss": -27.382749557495117, "global_step": 598338, "epoch": 7208} {"train_loss": -27.3165340423584, "global_step": 598339, "epoch": 7208} {"train_loss": -27.91531753540039, "global_step": 598340, "epoch": 7208} {"train_loss": -27.888883590698242, "global_step": 598341, "epoch": 7208} {"train_loss": -27.659503936767578, "global_step": 598342, "epoch": 7208} {"train_loss": -27.95389747619629, "global_step": 598343, "epoch": 7208} {"train_loss": -27.90107536315918, "global_step": 598344, "epoch": 7208} {"train_loss": -27.883747100830078, "global_step": 598345, "epoch": 7208} {"train_loss": -27.793370786919652, "global_step": 598346, "epoch": 7208, "val_loss": 6635410.0} {"train_loss": -27.202350616455078, "global_step": 598347, "epoch": 7209} {"train_loss": -27.615575790405273, "global_step": 598348, "epoch": 7209} {"train_loss": -27.07586669921875, "global_step": 598349, "epoch": 7209} {"train_loss": -27.28285789489746, "global_step": 598350, "epoch": 7209} {"train_loss": -27.478490829467773, "global_step": 598351, "epoch": 7209} {"train_loss": -27.253149032592773, "global_step": 598352, "epoch": 7209} {"train_loss": -27.44673728942871, "global_step": 598353, "epoch": 7209} {"train_loss": -26.9229736328125, "global_step": 598354, "epoch": 7209} {"train_loss": -27.126392364501953, "global_step": 598355, "epoch": 7209} {"train_loss": -27.0610294342041, "global_step": 598356, "epoch": 7209} {"train_loss": -27.66581153869629, "global_step": 598357, "epoch": 7209} {"train_loss": -27.769351959228516, "global_step": 598358, "epoch": 7209} {"train_loss": -27.057880401611328, "global_step": 598359, "epoch": 7209} {"train_loss": -27.6932373046875, "global_step": 598360, "epoch": 7209} {"train_loss": -27.652868270874023, "global_step": 598361, "epoch": 7209} {"train_loss": -27.9302978515625, "global_step": 598362, "epoch": 7209} {"train_loss": -27.34351921081543, "global_step": 598363, "epoch": 7209} {"train_loss": -27.7167911529541, "global_step": 598364, "epoch": 7209} {"train_loss": -27.70472526550293, "global_step": 598365, "epoch": 7209} {"train_loss": -27.734302520751953, "global_step": 598366, "epoch": 7209} {"train_loss": -27.758670806884766, "global_step": 598367, "epoch": 7209} {"train_loss": -27.5723819732666, "global_step": 598368, "epoch": 7209} {"train_loss": -27.707204818725586, "global_step": 598369, "epoch": 7209} {"train_loss": -27.893102645874023, "global_step": 598370, "epoch": 7209} {"train_loss": -27.68379020690918, "global_step": 598371, "epoch": 7209} {"train_loss": -27.987146377563477, "global_step": 598372, "epoch": 7209} {"train_loss": -27.756811141967773, "global_step": 598373, "epoch": 7209} {"train_loss": -27.947467803955078, "global_step": 598374, "epoch": 7209} {"train_loss": -28.051122665405273, "global_step": 598375, "epoch": 7209} {"train_loss": -27.788894653320312, "global_step": 598376, "epoch": 7209} {"train_loss": -27.979482650756836, "global_step": 598377, "epoch": 7209} {"train_loss": -28.179183959960938, "global_step": 598378, "epoch": 7209} {"train_loss": -27.654767990112305, "global_step": 598379, "epoch": 7209} {"train_loss": -27.69392204284668, "global_step": 598380, "epoch": 7209} {"train_loss": -28.106908798217773, "global_step": 598381, "epoch": 7209} {"train_loss": -27.898040771484375, "global_step": 598382, "epoch": 7209} {"train_loss": -27.86065673828125, "global_step": 598383, "epoch": 7209} {"train_loss": -27.879077911376953, "global_step": 598384, "epoch": 7209} {"train_loss": -27.693384170532227, "global_step": 598385, "epoch": 7209} {"train_loss": -28.639862060546875, "global_step": 598386, "epoch": 7209} {"train_loss": -28.049055099487305, "global_step": 598387, "epoch": 7209} {"train_loss": -28.000885009765625, "global_step": 598388, "epoch": 7209} {"train_loss": -28.28998374938965, "global_step": 598389, "epoch": 7209} {"train_loss": -28.16916847229004, "global_step": 598390, "epoch": 7209} {"train_loss": -27.968908309936523, "global_step": 598391, "epoch": 7209} {"train_loss": -28.266498565673828, "global_step": 598392, "epoch": 7209} {"train_loss": -28.19061279296875, "global_step": 598393, "epoch": 7209} {"train_loss": -27.964080810546875, "global_step": 598394, "epoch": 7209} {"train_loss": -28.010679244995117, "global_step": 598395, "epoch": 7209} {"train_loss": -28.159582138061523, "global_step": 598396, "epoch": 7209} {"train_loss": -28.101591110229492, "global_step": 598397, "epoch": 7209} {"train_loss": -28.054534912109375, "global_step": 598398, "epoch": 7209} {"train_loss": -28.050573348999023, "global_step": 598399, "epoch": 7209} {"train_loss": -28.35686683654785, "global_step": 598400, "epoch": 7209} {"train_loss": -27.79029655456543, "global_step": 598401, "epoch": 7209} {"train_loss": -28.065017700195312, "global_step": 598402, "epoch": 7209} {"train_loss": -28.315265655517578, "global_step": 598403, "epoch": 7209} {"train_loss": -28.301321029663086, "global_step": 598404, "epoch": 7209} {"train_loss": -27.889646530151367, "global_step": 598405, "epoch": 7209} {"train_loss": -27.894851684570312, "global_step": 598406, "epoch": 7209} {"train_loss": -27.999540328979492, "global_step": 598407, "epoch": 7209} {"train_loss": -28.14235496520996, "global_step": 598408, "epoch": 7209} {"train_loss": -28.171600341796875, "global_step": 598409, "epoch": 7209} {"train_loss": -27.83740234375, "global_step": 598410, "epoch": 7209} {"train_loss": -28.226551055908203, "global_step": 598411, "epoch": 7209} {"train_loss": -28.010007858276367, "global_step": 598412, "epoch": 7209} {"train_loss": -28.195608139038086, "global_step": 598413, "epoch": 7209} {"train_loss": -28.078277587890625, "global_step": 598414, "epoch": 7209} {"train_loss": -28.343677520751953, "global_step": 598415, "epoch": 7209} {"train_loss": -28.10529136657715, "global_step": 598416, "epoch": 7209} {"train_loss": -28.2431583404541, "global_step": 598417, "epoch": 7209} {"train_loss": -27.941944122314453, "global_step": 598418, "epoch": 7209} {"train_loss": -28.11785316467285, "global_step": 598419, "epoch": 7209} {"train_loss": -28.09406089782715, "global_step": 598420, "epoch": 7209} {"train_loss": -27.821548461914062, "global_step": 598421, "epoch": 7209} {"train_loss": -27.88591957092285, "global_step": 598422, "epoch": 7209} {"train_loss": -27.755765914916992, "global_step": 598423, "epoch": 7209} {"train_loss": -27.81036376953125, "global_step": 598424, "epoch": 7209} {"train_loss": -28.1721134185791, "global_step": 598425, "epoch": 7209} {"train_loss": -27.9046630859375, "global_step": 598426, "epoch": 7209} {"train_loss": -27.9655818939209, "global_step": 598427, "epoch": 7209} {"train_loss": -28.168701171875, "global_step": 598428, "epoch": 7209} {"train_loss": -27.871967430574347, "global_step": 598429, "epoch": 7209, "val_loss": 6643764.0} {"train_loss": -27.008512496948242, "global_step": 598430, "epoch": 7210} {"train_loss": -26.89361572265625, "global_step": 598431, "epoch": 7210} {"train_loss": -26.96648597717285, "global_step": 598432, "epoch": 7210} {"train_loss": -27.342544555664062, "global_step": 598433, "epoch": 7210} {"train_loss": -26.63446044921875, "global_step": 598434, "epoch": 7210} {"train_loss": -26.63150978088379, "global_step": 598435, "epoch": 7210} {"train_loss": -26.476428985595703, "global_step": 598436, "epoch": 7210} {"train_loss": -27.60260581970215, "global_step": 598437, "epoch": 7210} {"train_loss": -26.591032028198242, "global_step": 598438, "epoch": 7210} {"train_loss": -27.425872802734375, "global_step": 598439, "epoch": 7210} {"train_loss": -27.0156192779541, "global_step": 598440, "epoch": 7210} {"train_loss": -27.614582061767578, "global_step": 598441, "epoch": 7210} {"train_loss": -27.44893455505371, "global_step": 598442, "epoch": 7210} {"train_loss": -27.487152099609375, "global_step": 598443, "epoch": 7210} {"train_loss": -27.45172691345215, "global_step": 598444, "epoch": 7210} {"train_loss": -27.344511032104492, "global_step": 598445, "epoch": 7210} {"train_loss": -27.58735466003418, "global_step": 598446, "epoch": 7210} {"train_loss": -27.575504302978516, "global_step": 598447, "epoch": 7210} {"train_loss": -27.027692794799805, "global_step": 598448, "epoch": 7210} {"train_loss": -27.426666259765625, "global_step": 598449, "epoch": 7210} {"train_loss": -27.833539962768555, "global_step": 598450, "epoch": 7210} {"train_loss": -27.995223999023438, "global_step": 598451, "epoch": 7210} {"train_loss": -27.501941680908203, "global_step": 598452, "epoch": 7210} {"train_loss": -28.03216552734375, "global_step": 598453, "epoch": 7210} {"train_loss": -27.8833065032959, "global_step": 598454, "epoch": 7210} {"train_loss": -27.349573135375977, "global_step": 598455, "epoch": 7210} {"train_loss": -27.724063873291016, "global_step": 598456, "epoch": 7210} {"train_loss": -28.20521354675293, "global_step": 598457, "epoch": 7210} {"train_loss": -27.78436279296875, "global_step": 598458, "epoch": 7210} {"train_loss": -27.932844161987305, "global_step": 598459, "epoch": 7210} {"train_loss": -27.84330177307129, "global_step": 598460, "epoch": 7210} {"train_loss": -28.034204483032227, "global_step": 598461, "epoch": 7210} {"train_loss": -27.877899169921875, "global_step": 598462, "epoch": 7210} {"train_loss": -28.09002113342285, "global_step": 598463, "epoch": 7210} {"train_loss": -28.154279708862305, "global_step": 598464, "epoch": 7210} {"train_loss": -27.986526489257812, "global_step": 598465, "epoch": 7210} {"train_loss": -28.050683975219727, "global_step": 598466, "epoch": 7210} {"train_loss": -28.0161190032959, "global_step": 598467, "epoch": 7210} {"train_loss": -28.615894317626953, "global_step": 598468, "epoch": 7210} {"train_loss": -28.295612335205078, "global_step": 598469, "epoch": 7210} {"train_loss": -27.772748947143555, "global_step": 598470, "epoch": 7210} {"train_loss": -28.289447784423828, "global_step": 598471, "epoch": 7210} {"train_loss": -28.423643112182617, "global_step": 598472, "epoch": 7210} {"train_loss": -28.498947143554688, "global_step": 598473, "epoch": 7210} {"train_loss": -28.07831382751465, "global_step": 598474, "epoch": 7210} {"train_loss": -28.187183380126953, "global_step": 598475, "epoch": 7210} {"train_loss": -28.282033920288086, "global_step": 598476, "epoch": 7210} {"train_loss": -28.332172393798828, "global_step": 598477, "epoch": 7210} {"train_loss": -28.832990646362305, "global_step": 598478, "epoch": 7210} {"train_loss": -28.505346298217773, "global_step": 598479, "epoch": 7210} {"train_loss": -28.219274520874023, "global_step": 598480, "epoch": 7210} {"train_loss": -27.95890235900879, "global_step": 598481, "epoch": 7210} {"train_loss": -27.981735229492188, "global_step": 598482, "epoch": 7210} {"train_loss": -27.99554443359375, "global_step": 598483, "epoch": 7210} {"train_loss": -27.63758659362793, "global_step": 598484, "epoch": 7210} {"train_loss": -27.780658721923828, "global_step": 598485, "epoch": 7210} {"train_loss": -28.16343116760254, "global_step": 598486, "epoch": 7210} {"train_loss": -27.972736358642578, "global_step": 598487, "epoch": 7210} {"train_loss": -28.46876335144043, "global_step": 598488, "epoch": 7210} {"train_loss": -28.365564346313477, "global_step": 598489, "epoch": 7210} {"train_loss": -28.013818740844727, "global_step": 598490, "epoch": 7210} {"train_loss": -28.51019287109375, "global_step": 598491, "epoch": 7210} {"train_loss": -27.908496856689453, "global_step": 598492, "epoch": 7210} {"train_loss": -27.925662994384766, "global_step": 598493, "epoch": 7210} {"train_loss": -27.806272506713867, "global_step": 598494, "epoch": 7210} {"train_loss": -28.017972946166992, "global_step": 598495, "epoch": 7210} {"train_loss": -28.019758224487305, "global_step": 598496, "epoch": 7210} {"train_loss": -28.573200225830078, "global_step": 598497, "epoch": 7210} {"train_loss": -27.97147560119629, "global_step": 598498, "epoch": 7210} {"train_loss": -28.359195709228516, "global_step": 598499, "epoch": 7210} {"train_loss": -27.838348388671875, "global_step": 598500, "epoch": 7210} {"train_loss": -28.1175537109375, "global_step": 598501, "epoch": 7210} {"train_loss": -28.006864547729492, "global_step": 598502, "epoch": 7210} {"train_loss": -28.19072914123535, "global_step": 598503, "epoch": 7210} {"train_loss": -28.408248901367188, "global_step": 598504, "epoch": 7210} {"train_loss": -28.18010902404785, "global_step": 598505, "epoch": 7210} {"train_loss": -28.167896270751953, "global_step": 598506, "epoch": 7210} {"train_loss": -28.094257354736328, "global_step": 598507, "epoch": 7210} {"train_loss": -27.896955490112305, "global_step": 598508, "epoch": 7210} {"train_loss": -27.925861358642578, "global_step": 598509, "epoch": 7210} {"train_loss": -28.25431251525879, "global_step": 598510, "epoch": 7210} {"train_loss": -28.3091983795166, "global_step": 598511, "epoch": 7210} {"train_loss": -27.867252051112164, "global_step": 598512, "epoch": 7210, "val_loss": 6512460.0} {"train_loss": -27.572385787963867, "global_step": 598513, "epoch": 7211} {"train_loss": -27.01569938659668, "global_step": 598514, "epoch": 7211} {"train_loss": -27.366926193237305, "global_step": 598515, "epoch": 7211} {"train_loss": -27.90604591369629, "global_step": 598516, "epoch": 7211} {"train_loss": -27.582250595092773, "global_step": 598517, "epoch": 7211} {"train_loss": -27.99249267578125, "global_step": 598518, "epoch": 7211} {"train_loss": -27.554697036743164, "global_step": 598519, "epoch": 7211} {"train_loss": -27.303510665893555, "global_step": 598520, "epoch": 7211} {"train_loss": -27.51772117614746, "global_step": 598521, "epoch": 7211} {"train_loss": -27.627973556518555, "global_step": 598522, "epoch": 7211} {"train_loss": -27.921283721923828, "global_step": 598523, "epoch": 7211} {"train_loss": -27.653839111328125, "global_step": 598524, "epoch": 7211} {"train_loss": -27.570932388305664, "global_step": 598525, "epoch": 7211} {"train_loss": -28.055830001831055, "global_step": 598526, "epoch": 7211} {"train_loss": -27.453134536743164, "global_step": 598527, "epoch": 7211} {"train_loss": -28.00404930114746, "global_step": 598528, "epoch": 7211} {"train_loss": -27.563501358032227, "global_step": 598529, "epoch": 7211} {"train_loss": -28.022491455078125, "global_step": 598530, "epoch": 7211} {"train_loss": -27.87298583984375, "global_step": 598531, "epoch": 7211} {"train_loss": -27.916767120361328, "global_step": 598532, "epoch": 7211} {"train_loss": -27.854650497436523, "global_step": 598533, "epoch": 7211} {"train_loss": -27.85597038269043, "global_step": 598534, "epoch": 7211} {"train_loss": -28.120508193969727, "global_step": 598535, "epoch": 7211} {"train_loss": -27.931583404541016, "global_step": 598536, "epoch": 7211} {"train_loss": -27.79300880432129, "global_step": 598537, "epoch": 7211} {"train_loss": -28.31174659729004, "global_step": 598538, "epoch": 7211} {"train_loss": -28.1654109954834, "global_step": 598539, "epoch": 7211} {"train_loss": -27.912073135375977, "global_step": 598540, "epoch": 7211} {"train_loss": -27.840656280517578, "global_step": 598541, "epoch": 7211} {"train_loss": -27.77781105041504, "global_step": 598542, "epoch": 7211} {"train_loss": -27.874780654907227, "global_step": 598543, "epoch": 7211} {"train_loss": -28.0434627532959, "global_step": 598544, "epoch": 7211} {"train_loss": -27.991018295288086, "global_step": 598545, "epoch": 7211} {"train_loss": -28.40673828125, "global_step": 598546, "epoch": 7211} {"train_loss": -28.038427352905273, "global_step": 598547, "epoch": 7211} {"train_loss": -27.94439697265625, "global_step": 598548, "epoch": 7211} {"train_loss": -27.83098793029785, "global_step": 598549, "epoch": 7211} {"train_loss": -28.29560661315918, "global_step": 598550, "epoch": 7211} {"train_loss": -27.977380752563477, "global_step": 598551, "epoch": 7211} {"train_loss": -28.167951583862305, "global_step": 598552, "epoch": 7211} {"train_loss": -27.86895751953125, "global_step": 598553, "epoch": 7211} {"train_loss": -28.20450782775879, "global_step": 598554, "epoch": 7211} {"train_loss": -28.011322021484375, "global_step": 598555, "epoch": 7211} {"train_loss": -27.689367294311523, "global_step": 598556, "epoch": 7211} {"train_loss": -27.965652465820312, "global_step": 598557, "epoch": 7211} {"train_loss": -27.935270309448242, "global_step": 598558, "epoch": 7211} {"train_loss": -27.795080184936523, "global_step": 598559, "epoch": 7211} {"train_loss": -27.912702560424805, "global_step": 598560, "epoch": 7211} {"train_loss": -28.430280685424805, "global_step": 598561, "epoch": 7211} {"train_loss": -28.119794845581055, "global_step": 598562, "epoch": 7211} {"train_loss": -28.171850204467773, "global_step": 598563, "epoch": 7211} {"train_loss": -28.114990234375, "global_step": 598564, "epoch": 7211} {"train_loss": -27.9530086517334, "global_step": 598565, "epoch": 7211} {"train_loss": -27.983993530273438, "global_step": 598566, "epoch": 7211} {"train_loss": -28.07880210876465, "global_step": 598567, "epoch": 7211} {"train_loss": -27.573989868164062, "global_step": 598568, "epoch": 7211} {"train_loss": -27.484268188476562, "global_step": 598569, "epoch": 7211} {"train_loss": -27.928253173828125, "global_step": 598570, "epoch": 7211} {"train_loss": -28.242359161376953, "global_step": 598571, "epoch": 7211} {"train_loss": -28.031309127807617, "global_step": 598572, "epoch": 7211} {"train_loss": -27.815881729125977, "global_step": 598573, "epoch": 7211} {"train_loss": -28.018951416015625, "global_step": 598574, "epoch": 7211} {"train_loss": -28.122711181640625, "global_step": 598575, "epoch": 7211} {"train_loss": -28.10605239868164, "global_step": 598576, "epoch": 7211} {"train_loss": -27.946563720703125, "global_step": 598577, "epoch": 7211} {"train_loss": -27.98531150817871, "global_step": 598578, "epoch": 7211} {"train_loss": -27.915821075439453, "global_step": 598579, "epoch": 7211} {"train_loss": -28.038427352905273, "global_step": 598580, "epoch": 7211} {"train_loss": -28.01178550720215, "global_step": 598581, "epoch": 7211} {"train_loss": -28.556684494018555, "global_step": 598582, "epoch": 7211} {"train_loss": -28.109582901000977, "global_step": 598583, "epoch": 7211} {"train_loss": -28.334308624267578, "global_step": 598584, "epoch": 7211} {"train_loss": -28.0443172454834, "global_step": 598585, "epoch": 7211} {"train_loss": -28.057538986206055, "global_step": 598586, "epoch": 7211} {"train_loss": -27.93732261657715, "global_step": 598587, "epoch": 7211} {"train_loss": -28.115726470947266, "global_step": 598588, "epoch": 7211} {"train_loss": -27.947900772094727, "global_step": 598589, "epoch": 7211} {"train_loss": -27.972272872924805, "global_step": 598590, "epoch": 7211} {"train_loss": -28.08961296081543, "global_step": 598591, "epoch": 7211} {"train_loss": -28.20111656188965, "global_step": 598592, "epoch": 7211} {"train_loss": -28.123931884765625, "global_step": 598593, "epoch": 7211} {"train_loss": -28.120874404907227, "global_step": 598594, "epoch": 7211} {"train_loss": -27.950852911156343, "global_step": 598595, "epoch": 7211, "val_loss": 6552716.0} {"train_loss": -26.997577667236328, "global_step": 598596, "epoch": 7212} {"train_loss": -27.420209884643555, "global_step": 598597, "epoch": 7212} {"train_loss": -27.21729850769043, "global_step": 598598, "epoch": 7212} {"train_loss": -26.701078414916992, "global_step": 598599, "epoch": 7212} {"train_loss": -27.738880157470703, "global_step": 598600, "epoch": 7212} {"train_loss": -27.449325561523438, "global_step": 598601, "epoch": 7212} {"train_loss": -27.503873825073242, "global_step": 598602, "epoch": 7212} {"train_loss": -26.93560791015625, "global_step": 598603, "epoch": 7212} {"train_loss": -27.326284408569336, "global_step": 598604, "epoch": 7212} {"train_loss": -27.53857421875, "global_step": 598605, "epoch": 7212} {"train_loss": -27.399036407470703, "global_step": 598606, "epoch": 7212} {"train_loss": -27.634246826171875, "global_step": 598607, "epoch": 7212} {"train_loss": -27.447988510131836, "global_step": 598608, "epoch": 7212} {"train_loss": -27.94569206237793, "global_step": 598609, "epoch": 7212} {"train_loss": -27.524551391601562, "global_step": 598610, "epoch": 7212} {"train_loss": -28.064477920532227, "global_step": 598611, "epoch": 7212} {"train_loss": -27.66827392578125, "global_step": 598612, "epoch": 7212} {"train_loss": -27.965116500854492, "global_step": 598613, "epoch": 7212} {"train_loss": -28.0922794342041, "global_step": 598614, "epoch": 7212} {"train_loss": -27.8649959564209, "global_step": 598615, "epoch": 7212} {"train_loss": -27.723907470703125, "global_step": 598616, "epoch": 7212} {"train_loss": -28.099172592163086, "global_step": 598617, "epoch": 7212} {"train_loss": -27.778894424438477, "global_step": 598618, "epoch": 7212} {"train_loss": -27.845203399658203, "global_step": 598619, "epoch": 7212} {"train_loss": -27.914392471313477, "global_step": 598620, "epoch": 7212} {"train_loss": -27.88067054748535, "global_step": 598621, "epoch": 7212} {"train_loss": -28.343454360961914, "global_step": 598622, "epoch": 7212} {"train_loss": -27.481000900268555, "global_step": 598623, "epoch": 7212} {"train_loss": -28.06316566467285, "global_step": 598624, "epoch": 7212} {"train_loss": -28.05350112915039, "global_step": 598625, "epoch": 7212} {"train_loss": -28.014942169189453, "global_step": 598626, "epoch": 7212} {"train_loss": -27.33831787109375, "global_step": 598627, "epoch": 7212} {"train_loss": -28.33121681213379, "global_step": 598628, "epoch": 7212} {"train_loss": -28.065689086914062, "global_step": 598629, "epoch": 7212} {"train_loss": -28.189096450805664, "global_step": 598630, "epoch": 7212} {"train_loss": -28.4842472076416, "global_step": 598631, "epoch": 7212} {"train_loss": -27.895139694213867, "global_step": 598632, "epoch": 7212} {"train_loss": -28.049713134765625, "global_step": 598633, "epoch": 7212} {"train_loss": -27.994016647338867, "global_step": 598634, "epoch": 7212} {"train_loss": -28.131256103515625, "global_step": 598635, "epoch": 7212} {"train_loss": -27.897741317749023, "global_step": 598636, "epoch": 7212} {"train_loss": -28.049463272094727, "global_step": 598637, "epoch": 7212} {"train_loss": -28.322214126586914, "global_step": 598638, "epoch": 7212} {"train_loss": -28.422277450561523, "global_step": 598639, "epoch": 7212} {"train_loss": -28.324438095092773, "global_step": 598640, "epoch": 7212} {"train_loss": -28.27664566040039, "global_step": 598641, "epoch": 7212} {"train_loss": -28.138158798217773, "global_step": 598642, "epoch": 7212} {"train_loss": -28.501989364624023, "global_step": 598643, "epoch": 7212} {"train_loss": -28.103723526000977, "global_step": 598644, "epoch": 7212} {"train_loss": -28.338430404663086, "global_step": 598645, "epoch": 7212} {"train_loss": -28.171100616455078, "global_step": 598646, "epoch": 7212} {"train_loss": -28.17254066467285, "global_step": 598647, "epoch": 7212} {"train_loss": -27.95524024963379, "global_step": 598648, "epoch": 7212} {"train_loss": -27.988691329956055, "global_step": 598649, "epoch": 7212} {"train_loss": -28.155038833618164, "global_step": 598650, "epoch": 7212} {"train_loss": -27.961505889892578, "global_step": 598651, "epoch": 7212} {"train_loss": -28.31904411315918, "global_step": 598652, "epoch": 7212} {"train_loss": -27.875137329101562, "global_step": 598653, "epoch": 7212} {"train_loss": -27.8509521484375, "global_step": 598654, "epoch": 7212} {"train_loss": -28.00446128845215, "global_step": 598655, "epoch": 7212} {"train_loss": -28.036727905273438, "global_step": 598656, "epoch": 7212} {"train_loss": -28.03651237487793, "global_step": 598657, "epoch": 7212} {"train_loss": -28.267669677734375, "global_step": 598658, "epoch": 7212} {"train_loss": -27.855207443237305, "global_step": 598659, "epoch": 7212} {"train_loss": -28.234943389892578, "global_step": 598660, "epoch": 7212} {"train_loss": -28.238412857055664, "global_step": 598661, "epoch": 7212} {"train_loss": -27.914670944213867, "global_step": 598662, "epoch": 7212} {"train_loss": -27.877038955688477, "global_step": 598663, "epoch": 7212} {"train_loss": -28.03862953186035, "global_step": 598664, "epoch": 7212} {"train_loss": -27.661344528198242, "global_step": 598665, "epoch": 7212} {"train_loss": -28.032865524291992, "global_step": 598666, "epoch": 7212} {"train_loss": -28.19672966003418, "global_step": 598667, "epoch": 7212} {"train_loss": -27.903961181640625, "global_step": 598668, "epoch": 7212} {"train_loss": -27.488433837890625, "global_step": 598669, "epoch": 7212} {"train_loss": -27.138553619384766, "global_step": 598670, "epoch": 7212} {"train_loss": -27.459671020507812, "global_step": 598671, "epoch": 7212} {"train_loss": -27.834640502929688, "global_step": 598672, "epoch": 7212} {"train_loss": -28.116012573242188, "global_step": 598673, "epoch": 7212} {"train_loss": -28.186498641967773, "global_step": 598674, "epoch": 7212} {"train_loss": -28.121307373046875, "global_step": 598675, "epoch": 7212} {"train_loss": -28.219635009765625, "global_step": 598676, "epoch": 7212} {"train_loss": -28.042871475219727, "global_step": 598677, "epoch": 7212} {"train_loss": -27.893944981586504, "global_step": 598678, "epoch": 7212, "val_loss": 6563892.5} {"train_loss": -27.47493553161621, "global_step": 598679, "epoch": 7213} {"train_loss": -27.31013298034668, "global_step": 598680, "epoch": 7213} {"train_loss": -27.350982666015625, "global_step": 598681, "epoch": 7213} {"train_loss": -27.34966468811035, "global_step": 598682, "epoch": 7213} {"train_loss": -26.760595321655273, "global_step": 598683, "epoch": 7213} {"train_loss": -26.89230728149414, "global_step": 598684, "epoch": 7213} {"train_loss": -26.60401725769043, "global_step": 598685, "epoch": 7213} {"train_loss": -27.55401611328125, "global_step": 598686, "epoch": 7213} {"train_loss": -27.057052612304688, "global_step": 598687, "epoch": 7213} {"train_loss": -27.284521102905273, "global_step": 598688, "epoch": 7213} {"train_loss": -26.979711532592773, "global_step": 598689, "epoch": 7213} {"train_loss": -27.273813247680664, "global_step": 598690, "epoch": 7213} {"train_loss": -27.508926391601562, "global_step": 598691, "epoch": 7213} {"train_loss": -27.120925903320312, "global_step": 598692, "epoch": 7213} {"train_loss": -27.27773094177246, "global_step": 598693, "epoch": 7213} {"train_loss": -27.27252769470215, "global_step": 598694, "epoch": 7213} {"train_loss": -27.26778221130371, "global_step": 598695, "epoch": 7213} {"train_loss": -27.317663192749023, "global_step": 598696, "epoch": 7213} {"train_loss": -27.383914947509766, "global_step": 598697, "epoch": 7213} {"train_loss": -27.559967041015625, "global_step": 598698, "epoch": 7213} {"train_loss": -27.467437744140625, "global_step": 598699, "epoch": 7213} {"train_loss": -27.402692794799805, "global_step": 598700, "epoch": 7213} {"train_loss": -27.317901611328125, "global_step": 598701, "epoch": 7213} {"train_loss": -27.736764907836914, "global_step": 598702, "epoch": 7213} {"train_loss": -27.50763511657715, "global_step": 598703, "epoch": 7213} {"train_loss": -27.840290069580078, "global_step": 598704, "epoch": 7213} {"train_loss": -27.740331649780273, "global_step": 598705, "epoch": 7213} {"train_loss": -27.9923152923584, "global_step": 598706, "epoch": 7213} {"train_loss": -27.82794761657715, "global_step": 598707, "epoch": 7213} {"train_loss": -27.678272247314453, "global_step": 598708, "epoch": 7213} {"train_loss": -28.149097442626953, "global_step": 598709, "epoch": 7213} {"train_loss": -27.973047256469727, "global_step": 598710, "epoch": 7213} {"train_loss": -27.65679359436035, "global_step": 598711, "epoch": 7213} {"train_loss": -28.0899658203125, "global_step": 598712, "epoch": 7213} {"train_loss": -27.681884765625, "global_step": 598713, "epoch": 7213} {"train_loss": -28.248584747314453, "global_step": 598714, "epoch": 7213} {"train_loss": -28.445240020751953, "global_step": 598715, "epoch": 7213} {"train_loss": -27.97187614440918, "global_step": 598716, "epoch": 7213} {"train_loss": -28.405231475830078, "global_step": 598717, "epoch": 7213} {"train_loss": -27.76971435546875, "global_step": 598718, "epoch": 7213} {"train_loss": -27.95871353149414, "global_step": 598719, "epoch": 7213} {"train_loss": -27.883691787719727, "global_step": 598720, "epoch": 7213} {"train_loss": -28.18515396118164, "global_step": 598721, "epoch": 7213} {"train_loss": -27.52838134765625, "global_step": 598722, "epoch": 7213} {"train_loss": -27.98469352722168, "global_step": 598723, "epoch": 7213} {"train_loss": -27.779861450195312, "global_step": 598724, "epoch": 7213} {"train_loss": -27.615314483642578, "global_step": 598725, "epoch": 7213} {"train_loss": -28.040998458862305, "global_step": 598726, "epoch": 7213} {"train_loss": -27.75385093688965, "global_step": 598727, "epoch": 7213} {"train_loss": -27.76337242126465, "global_step": 598728, "epoch": 7213} {"train_loss": -27.926925659179688, "global_step": 598729, "epoch": 7213} {"train_loss": -27.8695011138916, "global_step": 598730, "epoch": 7213} {"train_loss": -27.9400634765625, "global_step": 598731, "epoch": 7213} {"train_loss": -27.83066177368164, "global_step": 598732, "epoch": 7213} {"train_loss": -28.123334884643555, "global_step": 598733, "epoch": 7213} {"train_loss": -28.097517013549805, "global_step": 598734, "epoch": 7213} {"train_loss": -28.2907657623291, "global_step": 598735, "epoch": 7213} {"train_loss": -28.214879989624023, "global_step": 598736, "epoch": 7213} {"train_loss": -28.02973747253418, "global_step": 598737, "epoch": 7213} {"train_loss": -28.26315689086914, "global_step": 598738, "epoch": 7213} {"train_loss": -27.885358810424805, "global_step": 598739, "epoch": 7213} {"train_loss": -27.695932388305664, "global_step": 598740, "epoch": 7213} {"train_loss": -28.007299423217773, "global_step": 598741, "epoch": 7213} {"train_loss": -27.909915924072266, "global_step": 598742, "epoch": 7213} {"train_loss": -28.0532169342041, "global_step": 598743, "epoch": 7213} {"train_loss": -28.1429500579834, "global_step": 598744, "epoch": 7213} {"train_loss": -27.86701011657715, "global_step": 598745, "epoch": 7213} {"train_loss": -27.930286407470703, "global_step": 598746, "epoch": 7213} {"train_loss": -28.03352928161621, "global_step": 598747, "epoch": 7213} {"train_loss": -28.166534423828125, "global_step": 598748, "epoch": 7213} {"train_loss": -28.397247314453125, "global_step": 598749, "epoch": 7213} {"train_loss": -28.630659103393555, "global_step": 598750, "epoch": 7213} {"train_loss": -28.08526039123535, "global_step": 598751, "epoch": 7213} {"train_loss": -28.291580200195312, "global_step": 598752, "epoch": 7213} {"train_loss": -28.24787712097168, "global_step": 598753, "epoch": 7213} {"train_loss": -28.23046875, "global_step": 598754, "epoch": 7213} {"train_loss": -28.565271377563477, "global_step": 598755, "epoch": 7213} {"train_loss": -28.331701278686523, "global_step": 598756, "epoch": 7213} {"train_loss": -28.41997718811035, "global_step": 598757, "epoch": 7213} {"train_loss": -28.220111846923828, "global_step": 598758, "epoch": 7213} {"train_loss": -28.192626953125, "global_step": 598759, "epoch": 7213} {"train_loss": -27.98661231994629, "global_step": 598760, "epoch": 7213} {"train_loss": -27.81019355590085, "global_step": 598761, "epoch": 7213, "val_loss": 6584978.0} {"train_loss": -27.61856460571289, "global_step": 598762, "epoch": 7214} {"train_loss": -25.630481719970703, "global_step": 598763, "epoch": 7214} {"train_loss": -23.242237091064453, "global_step": 598764, "epoch": 7214} {"train_loss": -23.77865982055664, "global_step": 598765, "epoch": 7214} {"train_loss": -26.340124130249023, "global_step": 598766, "epoch": 7214} {"train_loss": -26.3907470703125, "global_step": 598767, "epoch": 7214} {"train_loss": -27.12226676940918, "global_step": 598768, "epoch": 7214} {"train_loss": -25.110258102416992, "global_step": 598769, "epoch": 7214} {"train_loss": -27.137866973876953, "global_step": 598770, "epoch": 7214} {"train_loss": -26.676483154296875, "global_step": 598771, "epoch": 7214} {"train_loss": -26.992034912109375, "global_step": 598772, "epoch": 7214} {"train_loss": -27.021442413330078, "global_step": 598773, "epoch": 7214} {"train_loss": -26.812091827392578, "global_step": 598774, "epoch": 7214} {"train_loss": -27.385223388671875, "global_step": 598775, "epoch": 7214} {"train_loss": -26.762914657592773, "global_step": 598776, "epoch": 7214} {"train_loss": -27.6431941986084, "global_step": 598777, "epoch": 7214} {"train_loss": -27.2840576171875, "global_step": 598778, "epoch": 7214} {"train_loss": -27.011396408081055, "global_step": 598779, "epoch": 7214} {"train_loss": -27.614139556884766, "global_step": 598780, "epoch": 7214} {"train_loss": -27.252859115600586, "global_step": 598781, "epoch": 7214} {"train_loss": -27.49738121032715, "global_step": 598782, "epoch": 7214} {"train_loss": -27.563901901245117, "global_step": 598783, "epoch": 7214} {"train_loss": -27.44373893737793, "global_step": 598784, "epoch": 7214} {"train_loss": -27.723907470703125, "global_step": 598785, "epoch": 7214} {"train_loss": -27.385766983032227, "global_step": 598786, "epoch": 7214} {"train_loss": -27.535058975219727, "global_step": 598787, "epoch": 7214} {"train_loss": -27.6231632232666, "global_step": 598788, "epoch": 7214} {"train_loss": -28.0103702545166, "global_step": 598789, "epoch": 7214} {"train_loss": -27.9261531829834, "global_step": 598790, "epoch": 7214} {"train_loss": -27.45094108581543, "global_step": 598791, "epoch": 7214} {"train_loss": -27.961231231689453, "global_step": 598792, "epoch": 7214} {"train_loss": -27.6824951171875, "global_step": 598793, "epoch": 7214} {"train_loss": -27.371789932250977, "global_step": 598794, "epoch": 7214} {"train_loss": -27.483434677124023, "global_step": 598795, "epoch": 7214} {"train_loss": -27.56715202331543, "global_step": 598796, "epoch": 7214} {"train_loss": -27.66756248474121, "global_step": 598797, "epoch": 7214} {"train_loss": -28.02033805847168, "global_step": 598798, "epoch": 7214} {"train_loss": -27.783935546875, "global_step": 598799, "epoch": 7214} {"train_loss": -27.860645294189453, "global_step": 598800, "epoch": 7214} {"train_loss": -27.697254180908203, "global_step": 598801, "epoch": 7214} {"train_loss": -27.71609878540039, "global_step": 598802, "epoch": 7214} {"train_loss": -27.87208366394043, "global_step": 598803, "epoch": 7214} {"train_loss": -27.6833553314209, "global_step": 598804, "epoch": 7214} {"train_loss": -28.322904586791992, "global_step": 598805, "epoch": 7214} {"train_loss": -27.949979782104492, "global_step": 598806, "epoch": 7214} {"train_loss": -28.51734733581543, "global_step": 598807, "epoch": 7214} {"train_loss": -27.961034774780273, "global_step": 598808, "epoch": 7214} {"train_loss": -28.009851455688477, "global_step": 598809, "epoch": 7214} {"train_loss": -28.14149284362793, "global_step": 598810, "epoch": 7214} {"train_loss": -27.835098266601562, "global_step": 598811, "epoch": 7214} {"train_loss": -27.908939361572266, "global_step": 598812, "epoch": 7214} {"train_loss": -28.322559356689453, "global_step": 598813, "epoch": 7214} {"train_loss": -28.49969482421875, "global_step": 598814, "epoch": 7214} {"train_loss": -27.824522018432617, "global_step": 598815, "epoch": 7214} {"train_loss": -28.120885848999023, "global_step": 598816, "epoch": 7214} {"train_loss": -28.165197372436523, "global_step": 598817, "epoch": 7214} {"train_loss": -27.987140655517578, "global_step": 598818, "epoch": 7214} {"train_loss": -28.125635147094727, "global_step": 598819, "epoch": 7214} {"train_loss": -28.024728775024414, "global_step": 598820, "epoch": 7214} {"train_loss": -28.324054718017578, "global_step": 598821, "epoch": 7214} {"train_loss": -27.9947566986084, "global_step": 598822, "epoch": 7214} {"train_loss": -27.793079376220703, "global_step": 598823, "epoch": 7214} {"train_loss": -27.955991744995117, "global_step": 598824, "epoch": 7214} {"train_loss": -27.972675323486328, "global_step": 598825, "epoch": 7214} {"train_loss": -27.848554611206055, "global_step": 598826, "epoch": 7214} {"train_loss": -27.797714233398438, "global_step": 598827, "epoch": 7214} {"train_loss": -28.058881759643555, "global_step": 598828, "epoch": 7214} {"train_loss": -28.230670928955078, "global_step": 598829, "epoch": 7214} {"train_loss": -28.1276798248291, "global_step": 598830, "epoch": 7214} {"train_loss": -28.470626831054688, "global_step": 598831, "epoch": 7214} {"train_loss": -27.89259147644043, "global_step": 598832, "epoch": 7214} {"train_loss": -27.871191024780273, "global_step": 598833, "epoch": 7214} {"train_loss": -27.919591903686523, "global_step": 598834, "epoch": 7214} {"train_loss": -28.0994873046875, "global_step": 598835, "epoch": 7214} {"train_loss": -28.223087310791016, "global_step": 598836, "epoch": 7214} {"train_loss": -28.1795711517334, "global_step": 598837, "epoch": 7214} {"train_loss": -28.092004776000977, "global_step": 598838, "epoch": 7214} {"train_loss": -28.40606117248535, "global_step": 598839, "epoch": 7214} {"train_loss": -28.072357177734375, "global_step": 598840, "epoch": 7214} {"train_loss": -28.374181747436523, "global_step": 598841, "epoch": 7214} {"train_loss": -28.40616798400879, "global_step": 598842, "epoch": 7214} {"train_loss": -28.128509521484375, "global_step": 598843, "epoch": 7214} {"train_loss": -27.59304515424981, "global_step": 598844, "epoch": 7214, "val_loss": 6573551.0} {"train_loss": -27.43609619140625, "global_step": 598845, "epoch": 7215} {"train_loss": -27.66761589050293, "global_step": 598846, "epoch": 7215} {"train_loss": -27.467742919921875, "global_step": 598847, "epoch": 7215} {"train_loss": -27.74973487854004, "global_step": 598848, "epoch": 7215} {"train_loss": -27.839269638061523, "global_step": 598849, "epoch": 7215} {"train_loss": -27.91251564025879, "global_step": 598850, "epoch": 7215} {"train_loss": -27.531396865844727, "global_step": 598851, "epoch": 7215} {"train_loss": -27.83614158630371, "global_step": 598852, "epoch": 7215} {"train_loss": -27.802066802978516, "global_step": 598853, "epoch": 7215} {"train_loss": -27.509124755859375, "global_step": 598854, "epoch": 7215} {"train_loss": -27.714279174804688, "global_step": 598855, "epoch": 7215} {"train_loss": -27.881500244140625, "global_step": 598856, "epoch": 7215} {"train_loss": -27.666732788085938, "global_step": 598857, "epoch": 7215} {"train_loss": -27.790307998657227, "global_step": 598858, "epoch": 7215} {"train_loss": -27.70355224609375, "global_step": 598859, "epoch": 7215} {"train_loss": -27.807880401611328, "global_step": 598860, "epoch": 7215} {"train_loss": -27.712717056274414, "global_step": 598861, "epoch": 7215} {"train_loss": -27.7435302734375, "global_step": 598862, "epoch": 7215} {"train_loss": -27.80965232849121, "global_step": 598863, "epoch": 7215} {"train_loss": -27.93515968322754, "global_step": 598864, "epoch": 7215} {"train_loss": -27.606565475463867, "global_step": 598865, "epoch": 7215} {"train_loss": -27.412378311157227, "global_step": 598866, "epoch": 7215} {"train_loss": -27.974119186401367, "global_step": 598867, "epoch": 7215} {"train_loss": -27.948104858398438, "global_step": 598868, "epoch": 7215} {"train_loss": -27.568103790283203, "global_step": 598869, "epoch": 7215} {"train_loss": -28.23648452758789, "global_step": 598870, "epoch": 7215} {"train_loss": -27.829944610595703, "global_step": 598871, "epoch": 7215} {"train_loss": -27.653091430664062, "global_step": 598872, "epoch": 7215} {"train_loss": -27.716665267944336, "global_step": 598873, "epoch": 7215} {"train_loss": -27.7305850982666, "global_step": 598874, "epoch": 7215} {"train_loss": -27.699865341186523, "global_step": 598875, "epoch": 7215} {"train_loss": -28.10797119140625, "global_step": 598876, "epoch": 7215} {"train_loss": -28.10626220703125, "global_step": 598877, "epoch": 7215} {"train_loss": -27.586545944213867, "global_step": 598878, "epoch": 7215} {"train_loss": -28.1501407623291, "global_step": 598879, "epoch": 7215} {"train_loss": -28.110105514526367, "global_step": 598880, "epoch": 7215} {"train_loss": -27.907928466796875, "global_step": 598881, "epoch": 7215} {"train_loss": -27.89756202697754, "global_step": 598882, "epoch": 7215} {"train_loss": -27.71661376953125, "global_step": 598883, "epoch": 7215} {"train_loss": -27.91644859313965, "global_step": 598884, "epoch": 7215} {"train_loss": -28.418258666992188, "global_step": 598885, "epoch": 7215} {"train_loss": -28.321130752563477, "global_step": 598886, "epoch": 7215} {"train_loss": -28.361236572265625, "global_step": 598887, "epoch": 7215} {"train_loss": -28.190113067626953, "global_step": 598888, "epoch": 7215} {"train_loss": -28.3795166015625, "global_step": 598889, "epoch": 7215} {"train_loss": -28.285226821899414, "global_step": 598890, "epoch": 7215} {"train_loss": -28.298898696899414, "global_step": 598891, "epoch": 7215} {"train_loss": -28.38770866394043, "global_step": 598892, "epoch": 7215} {"train_loss": -28.57832908630371, "global_step": 598893, "epoch": 7215} {"train_loss": -28.40485954284668, "global_step": 598894, "epoch": 7215} {"train_loss": -28.486669540405273, "global_step": 598895, "epoch": 7215} {"train_loss": -27.944482803344727, "global_step": 598896, "epoch": 7215} {"train_loss": -28.763898849487305, "global_step": 598897, "epoch": 7215} {"train_loss": -28.115192413330078, "global_step": 598898, "epoch": 7215} {"train_loss": -28.302900314331055, "global_step": 598899, "epoch": 7215} {"train_loss": -28.188617706298828, "global_step": 598900, "epoch": 7215} {"train_loss": -28.405176162719727, "global_step": 598901, "epoch": 7215} {"train_loss": -28.195545196533203, "global_step": 598902, "epoch": 7215} {"train_loss": -28.04135513305664, "global_step": 598903, "epoch": 7215} {"train_loss": -28.087141036987305, "global_step": 598904, "epoch": 7215} {"train_loss": -28.469770431518555, "global_step": 598905, "epoch": 7215} {"train_loss": -28.200239181518555, "global_step": 598906, "epoch": 7215} {"train_loss": -28.16812515258789, "global_step": 598907, "epoch": 7215} {"train_loss": -27.60955810546875, "global_step": 598908, "epoch": 7215} {"train_loss": -27.880212783813477, "global_step": 598909, "epoch": 7215} {"train_loss": -28.097492218017578, "global_step": 598910, "epoch": 7215} {"train_loss": -28.097400665283203, "global_step": 598911, "epoch": 7215} {"train_loss": -28.17241859436035, "global_step": 598912, "epoch": 7215} {"train_loss": -27.7106990814209, "global_step": 598913, "epoch": 7215} {"train_loss": -27.888227462768555, "global_step": 598914, "epoch": 7215} {"train_loss": -27.842126846313477, "global_step": 598915, "epoch": 7215} {"train_loss": -28.10019302368164, "global_step": 598916, "epoch": 7215} {"train_loss": -28.046289443969727, "global_step": 598917, "epoch": 7215} {"train_loss": -28.2333927154541, "global_step": 598918, "epoch": 7215} {"train_loss": -27.954792022705078, "global_step": 598919, "epoch": 7215} {"train_loss": -27.818191528320312, "global_step": 598920, "epoch": 7215} {"train_loss": -28.090295791625977, "global_step": 598921, "epoch": 7215} {"train_loss": -27.735742568969727, "global_step": 598922, "epoch": 7215} {"train_loss": -27.92720603942871, "global_step": 598923, "epoch": 7215} {"train_loss": -27.964941024780273, "global_step": 598924, "epoch": 7215} {"train_loss": -28.166488647460938, "global_step": 598925, "epoch": 7215} {"train_loss": -28.040496826171875, "global_step": 598926, "epoch": 7215} {"train_loss": -27.939807064561958, "global_step": 598927, "epoch": 7215, "val_loss": 6588049.0} {"train_loss": -26.370508193969727, "global_step": 598928, "epoch": 7216} {"train_loss": -27.137908935546875, "global_step": 598929, "epoch": 7216} {"train_loss": -27.144229888916016, "global_step": 598930, "epoch": 7216} {"train_loss": -25.72513771057129, "global_step": 598931, "epoch": 7216} {"train_loss": -27.023160934448242, "global_step": 598932, "epoch": 7216} {"train_loss": -26.206695556640625, "global_step": 598933, "epoch": 7216} {"train_loss": -27.349323272705078, "global_step": 598934, "epoch": 7216} {"train_loss": -26.307065963745117, "global_step": 598935, "epoch": 7216} {"train_loss": -27.539194107055664, "global_step": 598936, "epoch": 7216} {"train_loss": -27.2861270904541, "global_step": 598937, "epoch": 7216} {"train_loss": -26.772008895874023, "global_step": 598938, "epoch": 7216} {"train_loss": -27.510343551635742, "global_step": 598939, "epoch": 7216} {"train_loss": -27.288782119750977, "global_step": 598940, "epoch": 7216} {"train_loss": -26.8936710357666, "global_step": 598941, "epoch": 7216} {"train_loss": -27.365793228149414, "global_step": 598942, "epoch": 7216} {"train_loss": -27.55564308166504, "global_step": 598943, "epoch": 7216} {"train_loss": -27.4744930267334, "global_step": 598944, "epoch": 7216} {"train_loss": -27.402780532836914, "global_step": 598945, "epoch": 7216} {"train_loss": -27.63824462890625, "global_step": 598946, "epoch": 7216} {"train_loss": -27.446374893188477, "global_step": 598947, "epoch": 7216} {"train_loss": -28.085010528564453, "global_step": 598948, "epoch": 7216} {"train_loss": -27.701017379760742, "global_step": 598949, "epoch": 7216} {"train_loss": -27.5096492767334, "global_step": 598950, "epoch": 7216} {"train_loss": -27.7200984954834, "global_step": 598951, "epoch": 7216} {"train_loss": -27.5880069732666, "global_step": 598952, "epoch": 7216} {"train_loss": -27.745580673217773, "global_step": 598953, "epoch": 7216} {"train_loss": -27.849409103393555, "global_step": 598954, "epoch": 7216} {"train_loss": -27.86330223083496, "global_step": 598955, "epoch": 7216} {"train_loss": -27.966352462768555, "global_step": 598956, "epoch": 7216} {"train_loss": -28.042036056518555, "global_step": 598957, "epoch": 7216} {"train_loss": -28.056537628173828, "global_step": 598958, "epoch": 7216} {"train_loss": -27.8260555267334, "global_step": 598959, "epoch": 7216} {"train_loss": -27.88396644592285, "global_step": 598960, "epoch": 7216} {"train_loss": -27.84128761291504, "global_step": 598961, "epoch": 7216} {"train_loss": -28.05011558532715, "global_step": 598962, "epoch": 7216} {"train_loss": -28.103809356689453, "global_step": 598963, "epoch": 7216} {"train_loss": -27.835601806640625, "global_step": 598964, "epoch": 7216} {"train_loss": -28.108509063720703, "global_step": 598965, "epoch": 7216} {"train_loss": -27.70220375061035, "global_step": 598966, "epoch": 7216} {"train_loss": -27.922592163085938, "global_step": 598967, "epoch": 7216} {"train_loss": -27.963964462280273, "global_step": 598968, "epoch": 7216} {"train_loss": -27.548175811767578, "global_step": 598969, "epoch": 7216} {"train_loss": -28.0764217376709, "global_step": 598970, "epoch": 7216} {"train_loss": -28.12114906311035, "global_step": 598971, "epoch": 7216} {"train_loss": -28.43520164489746, "global_step": 598972, "epoch": 7216} {"train_loss": -27.95783805847168, "global_step": 598973, "epoch": 7216} {"train_loss": -28.132558822631836, "global_step": 598974, "epoch": 7216} {"train_loss": -27.746917724609375, "global_step": 598975, "epoch": 7216} {"train_loss": -28.28218650817871, "global_step": 598976, "epoch": 7216} {"train_loss": -28.096332550048828, "global_step": 598977, "epoch": 7216} {"train_loss": -28.4608211517334, "global_step": 598978, "epoch": 7216} {"train_loss": -28.471485137939453, "global_step": 598979, "epoch": 7216} {"train_loss": -28.29665184020996, "global_step": 598980, "epoch": 7216} {"train_loss": -27.88043212890625, "global_step": 598981, "epoch": 7216} {"train_loss": -27.761144638061523, "global_step": 598982, "epoch": 7216} {"train_loss": -27.591283798217773, "global_step": 598983, "epoch": 7216} {"train_loss": -27.312244415283203, "global_step": 598984, "epoch": 7216} {"train_loss": -27.393985748291016, "global_step": 598985, "epoch": 7216} {"train_loss": -28.000385284423828, "global_step": 598986, "epoch": 7216} {"train_loss": -27.9481201171875, "global_step": 598987, "epoch": 7216} {"train_loss": -28.080625534057617, "global_step": 598988, "epoch": 7216} {"train_loss": -27.822492599487305, "global_step": 598989, "epoch": 7216} {"train_loss": -28.038633346557617, "global_step": 598990, "epoch": 7216} {"train_loss": -28.1298828125, "global_step": 598991, "epoch": 7216} {"train_loss": -28.050281524658203, "global_step": 598992, "epoch": 7216} {"train_loss": -28.092060089111328, "global_step": 598993, "epoch": 7216} {"train_loss": -28.3292179107666, "global_step": 598994, "epoch": 7216} {"train_loss": -27.952117919921875, "global_step": 598995, "epoch": 7216} {"train_loss": -27.771825790405273, "global_step": 598996, "epoch": 7216} {"train_loss": -27.71345329284668, "global_step": 598997, "epoch": 7216} {"train_loss": -28.037073135375977, "global_step": 598998, "epoch": 7216} {"train_loss": -28.03944206237793, "global_step": 598999, "epoch": 7216} {"train_loss": -27.415822982788086, "global_step": 599000, "epoch": 7216} {"train_loss": -28.027429580688477, "global_step": 599001, "epoch": 7216} {"train_loss": -27.77326011657715, "global_step": 599002, "epoch": 7216} {"train_loss": -27.7418270111084, "global_step": 599003, "epoch": 7216} {"train_loss": -27.52585792541504, "global_step": 599004, "epoch": 7216} {"train_loss": -28.119129180908203, "global_step": 599005, "epoch": 7216} {"train_loss": -27.37981605529785, "global_step": 599006, "epoch": 7216} {"train_loss": -27.983505249023438, "global_step": 599007, "epoch": 7216} {"train_loss": -28.0147705078125, "global_step": 599008, "epoch": 7216} {"train_loss": -27.61225700378418, "global_step": 599009, "epoch": 7216} {"train_loss": -27.715716097728315, "global_step": 599010, "epoch": 7216, "val_loss": 6550292.0} {"train_loss": -27.457599639892578, "global_step": 599011, "epoch": 7217} {"train_loss": -27.56012535095215, "global_step": 599012, "epoch": 7217} {"train_loss": -27.260278701782227, "global_step": 599013, "epoch": 7217} {"train_loss": -26.906530380249023, "global_step": 599014, "epoch": 7217} {"train_loss": -27.308975219726562, "global_step": 599015, "epoch": 7217} {"train_loss": -27.433704376220703, "global_step": 599016, "epoch": 7217} {"train_loss": -27.7034912109375, "global_step": 599017, "epoch": 7217} {"train_loss": -26.989490509033203, "global_step": 599018, "epoch": 7217} {"train_loss": -27.530670166015625, "global_step": 599019, "epoch": 7217} {"train_loss": -27.399337768554688, "global_step": 599020, "epoch": 7217} {"train_loss": -27.179412841796875, "global_step": 599021, "epoch": 7217} {"train_loss": -27.509244918823242, "global_step": 599022, "epoch": 7217} {"train_loss": -27.40035057067871, "global_step": 599023, "epoch": 7217} {"train_loss": -27.631973266601562, "global_step": 599024, "epoch": 7217} {"train_loss": -27.549625396728516, "global_step": 599025, "epoch": 7217} {"train_loss": -27.671689987182617, "global_step": 599026, "epoch": 7217} {"train_loss": -27.91652488708496, "global_step": 599027, "epoch": 7217} {"train_loss": -27.84759521484375, "global_step": 599028, "epoch": 7217} {"train_loss": -27.76825523376465, "global_step": 599029, "epoch": 7217} {"train_loss": -27.45318603515625, "global_step": 599030, "epoch": 7217} {"train_loss": -27.502552032470703, "global_step": 599031, "epoch": 7217} {"train_loss": -27.891324996948242, "global_step": 599032, "epoch": 7217} {"train_loss": -27.778034210205078, "global_step": 599033, "epoch": 7217} {"train_loss": -27.829919815063477, "global_step": 599034, "epoch": 7217} {"train_loss": -27.85383415222168, "global_step": 599035, "epoch": 7217} {"train_loss": -27.964624404907227, "global_step": 599036, "epoch": 7217} {"train_loss": -27.81797218322754, "global_step": 599037, "epoch": 7217} {"train_loss": -27.548192977905273, "global_step": 599038, "epoch": 7217} {"train_loss": -27.702346801757812, "global_step": 599039, "epoch": 7217} {"train_loss": -28.077497482299805, "global_step": 599040, "epoch": 7217} {"train_loss": -27.954641342163086, "global_step": 599041, "epoch": 7217} {"train_loss": -28.028335571289062, "global_step": 599042, "epoch": 7217} {"train_loss": -28.0562686920166, "global_step": 599043, "epoch": 7217} {"train_loss": -28.2254638671875, "global_step": 599044, "epoch": 7217} {"train_loss": -27.843021392822266, "global_step": 599045, "epoch": 7217} {"train_loss": -28.021146774291992, "global_step": 599046, "epoch": 7217} {"train_loss": -27.722766876220703, "global_step": 599047, "epoch": 7217} {"train_loss": -28.235944747924805, "global_step": 599048, "epoch": 7217} {"train_loss": -28.414875030517578, "global_step": 599049, "epoch": 7217} {"train_loss": -28.205163955688477, "global_step": 599050, "epoch": 7217} {"train_loss": -28.078140258789062, "global_step": 599051, "epoch": 7217} {"train_loss": -28.34669303894043, "global_step": 599052, "epoch": 7217} {"train_loss": -28.468231201171875, "global_step": 599053, "epoch": 7217} {"train_loss": -28.312543869018555, "global_step": 599054, "epoch": 7217} {"train_loss": -28.328765869140625, "global_step": 599055, "epoch": 7217} {"train_loss": -28.062000274658203, "global_step": 599056, "epoch": 7217} {"train_loss": -28.51487159729004, "global_step": 599057, "epoch": 7217} {"train_loss": -28.02239418029785, "global_step": 599058, "epoch": 7217} {"train_loss": -28.399738311767578, "global_step": 599059, "epoch": 7217} {"train_loss": -28.04922866821289, "global_step": 599060, "epoch": 7217} {"train_loss": -28.376270294189453, "global_step": 599061, "epoch": 7217} {"train_loss": -28.240772247314453, "global_step": 599062, "epoch": 7217} {"train_loss": -28.396106719970703, "global_step": 599063, "epoch": 7217} {"train_loss": -28.351476669311523, "global_step": 599064, "epoch": 7217} {"train_loss": -28.21858024597168, "global_step": 599065, "epoch": 7217} {"train_loss": -28.163564682006836, "global_step": 599066, "epoch": 7217} {"train_loss": -28.007556915283203, "global_step": 599067, "epoch": 7217} {"train_loss": -28.306182861328125, "global_step": 599068, "epoch": 7217} {"train_loss": -28.408658981323242, "global_step": 599069, "epoch": 7217} {"train_loss": -28.272998809814453, "global_step": 599070, "epoch": 7217} {"train_loss": -27.85708999633789, "global_step": 599071, "epoch": 7217} {"train_loss": -27.84612464904785, "global_step": 599072, "epoch": 7217} {"train_loss": -27.58350944519043, "global_step": 599073, "epoch": 7217} {"train_loss": -28.23396873474121, "global_step": 599074, "epoch": 7217} {"train_loss": -28.326602935791016, "global_step": 599075, "epoch": 7217} {"train_loss": -27.973352432250977, "global_step": 599076, "epoch": 7217} {"train_loss": -27.949228286743164, "global_step": 599077, "epoch": 7217} {"train_loss": -27.74732780456543, "global_step": 599078, "epoch": 7217} {"train_loss": -27.88331413269043, "global_step": 599079, "epoch": 7217} {"train_loss": -27.754423141479492, "global_step": 599080, "epoch": 7217} {"train_loss": -27.645404815673828, "global_step": 599081, "epoch": 7217} {"train_loss": -28.006994247436523, "global_step": 599082, "epoch": 7217} {"train_loss": -28.036121368408203, "global_step": 599083, "epoch": 7217} {"train_loss": -28.23647117614746, "global_step": 599084, "epoch": 7217} {"train_loss": -27.954833984375, "global_step": 599085, "epoch": 7217} {"train_loss": -28.126617431640625, "global_step": 599086, "epoch": 7217} {"train_loss": -28.088220596313477, "global_step": 599087, "epoch": 7217} {"train_loss": -28.173755645751953, "global_step": 599088, "epoch": 7217} {"train_loss": -27.773054122924805, "global_step": 599089, "epoch": 7217} {"train_loss": -28.354459762573242, "global_step": 599090, "epoch": 7217} {"train_loss": -28.106571197509766, "global_step": 599091, "epoch": 7217} {"train_loss": -27.917011260986328, "global_step": 599092, "epoch": 7217} {"train_loss": -27.904523389885224, "global_step": 599093, "epoch": 7217, "val_loss": 6549154.5} {"train_loss": -28.007177352905273, "global_step": 599094, "epoch": 7218} {"train_loss": -27.815277099609375, "global_step": 599095, "epoch": 7218} {"train_loss": -27.761184692382812, "global_step": 599096, "epoch": 7218} {"train_loss": -27.632587432861328, "global_step": 599097, "epoch": 7218} {"train_loss": -28.066389083862305, "global_step": 599098, "epoch": 7218} {"train_loss": -27.89784812927246, "global_step": 599099, "epoch": 7218} {"train_loss": -28.011962890625, "global_step": 599100, "epoch": 7218} {"train_loss": -28.20503044128418, "global_step": 599101, "epoch": 7218} {"train_loss": -27.9296875, "global_step": 599102, "epoch": 7218} {"train_loss": -27.697921752929688, "global_step": 599103, "epoch": 7218} {"train_loss": -28.162500381469727, "global_step": 599104, "epoch": 7218} {"train_loss": -28.272918701171875, "global_step": 599105, "epoch": 7218} {"train_loss": -28.54734230041504, "global_step": 599106, "epoch": 7218} {"train_loss": -27.880844116210938, "global_step": 599107, "epoch": 7218} {"train_loss": -27.61199951171875, "global_step": 599108, "epoch": 7218} {"train_loss": -28.43206214904785, "global_step": 599109, "epoch": 7218} {"train_loss": -28.1594295501709, "global_step": 599110, "epoch": 7218} {"train_loss": -27.858312606811523, "global_step": 599111, "epoch": 7218} {"train_loss": -28.03675651550293, "global_step": 599112, "epoch": 7218} {"train_loss": -27.641035079956055, "global_step": 599113, "epoch": 7218} {"train_loss": -28.1005859375, "global_step": 599114, "epoch": 7218} {"train_loss": -27.917997360229492, "global_step": 599115, "epoch": 7218} {"train_loss": -27.727025985717773, "global_step": 599116, "epoch": 7218} {"train_loss": -27.8767032623291, "global_step": 599117, "epoch": 7218} {"train_loss": -27.86802101135254, "global_step": 599118, "epoch": 7218} {"train_loss": -27.833999633789062, "global_step": 599119, "epoch": 7218} {"train_loss": -27.723814010620117, "global_step": 599120, "epoch": 7218} {"train_loss": -27.918012619018555, "global_step": 599121, "epoch": 7218} {"train_loss": -27.65045166015625, "global_step": 599122, "epoch": 7218} {"train_loss": -27.373579025268555, "global_step": 599123, "epoch": 7218} {"train_loss": -28.130151748657227, "global_step": 599124, "epoch": 7218} {"train_loss": -27.54200553894043, "global_step": 599125, "epoch": 7218} {"train_loss": -27.742919921875, "global_step": 599126, "epoch": 7218} {"train_loss": -27.960351943969727, "global_step": 599127, "epoch": 7218} {"train_loss": -27.75958824157715, "global_step": 599128, "epoch": 7218} {"train_loss": -27.991443634033203, "global_step": 599129, "epoch": 7218} {"train_loss": -27.841537475585938, "global_step": 599130, "epoch": 7218} {"train_loss": -27.494281768798828, "global_step": 599131, "epoch": 7218} {"train_loss": -28.192113876342773, "global_step": 599132, "epoch": 7218} {"train_loss": -27.98435401916504, "global_step": 599133, "epoch": 7218} {"train_loss": -27.84222984313965, "global_step": 599134, "epoch": 7218} {"train_loss": -27.66511344909668, "global_step": 599135, "epoch": 7218} {"train_loss": -27.93107032775879, "global_step": 599136, "epoch": 7218} {"train_loss": -27.69898796081543, "global_step": 599137, "epoch": 7218} {"train_loss": -27.95781898498535, "global_step": 599138, "epoch": 7218} {"train_loss": -27.806310653686523, "global_step": 599139, "epoch": 7218} {"train_loss": -27.9990234375, "global_step": 599140, "epoch": 7218} {"train_loss": -28.192554473876953, "global_step": 599141, "epoch": 7218} {"train_loss": -28.0931396484375, "global_step": 599142, "epoch": 7218} {"train_loss": -28.166065216064453, "global_step": 599143, "epoch": 7218} {"train_loss": -28.077600479125977, "global_step": 599144, "epoch": 7218} {"train_loss": -27.816232681274414, "global_step": 599145, "epoch": 7218} {"train_loss": -28.10249900817871, "global_step": 599146, "epoch": 7218} {"train_loss": -28.282012939453125, "global_step": 599147, "epoch": 7218} {"train_loss": -27.803197860717773, "global_step": 599148, "epoch": 7218} {"train_loss": -27.73980140686035, "global_step": 599149, "epoch": 7218} {"train_loss": -28.263395309448242, "global_step": 599150, "epoch": 7218} {"train_loss": -28.338092803955078, "global_step": 599151, "epoch": 7218} {"train_loss": -28.15205955505371, "global_step": 599152, "epoch": 7218} {"train_loss": -28.129486083984375, "global_step": 599153, "epoch": 7218} {"train_loss": -28.16376304626465, "global_step": 599154, "epoch": 7218} {"train_loss": -27.78521728515625, "global_step": 599155, "epoch": 7218} {"train_loss": -28.18231773376465, "global_step": 599156, "epoch": 7218} {"train_loss": -28.18059730529785, "global_step": 599157, "epoch": 7218} {"train_loss": -27.990400314331055, "global_step": 599158, "epoch": 7218} {"train_loss": -28.336151123046875, "global_step": 599159, "epoch": 7218} {"train_loss": -28.17231559753418, "global_step": 599160, "epoch": 7218} {"train_loss": -28.21380615234375, "global_step": 599161, "epoch": 7218} {"train_loss": -27.92401123046875, "global_step": 599162, "epoch": 7218} {"train_loss": -28.136137008666992, "global_step": 599163, "epoch": 7218} {"train_loss": -28.20796012878418, "global_step": 599164, "epoch": 7218} {"train_loss": -27.717477798461914, "global_step": 599165, "epoch": 7218} {"train_loss": -28.025211334228516, "global_step": 599166, "epoch": 7218} {"train_loss": -27.734012603759766, "global_step": 599167, "epoch": 7218} {"train_loss": -28.003347396850586, "global_step": 599168, "epoch": 7218} {"train_loss": -27.938806533813477, "global_step": 599169, "epoch": 7218} {"train_loss": -28.329818725585938, "global_step": 599170, "epoch": 7218} {"train_loss": -28.444955825805664, "global_step": 599171, "epoch": 7218} {"train_loss": -27.839649200439453, "global_step": 599172, "epoch": 7218} {"train_loss": -28.16887855529785, "global_step": 599173, "epoch": 7218} {"train_loss": -27.79905128479004, "global_step": 599174, "epoch": 7218} {"train_loss": -27.826053619384766, "global_step": 599175, "epoch": 7218} {"train_loss": -27.990053199859986, "global_step": 599176, "epoch": 7218, "val_loss": 6659308.5} {"train_loss": -24.79121208190918, "global_step": 599177, "epoch": 7219} {"train_loss": -25.593090057373047, "global_step": 599178, "epoch": 7219} {"train_loss": -26.776891708374023, "global_step": 599179, "epoch": 7219} {"train_loss": -25.01381492614746, "global_step": 599180, "epoch": 7219} {"train_loss": -26.235387802124023, "global_step": 599181, "epoch": 7219} {"train_loss": -26.028472900390625, "global_step": 599182, "epoch": 7219} {"train_loss": -26.39507484436035, "global_step": 599183, "epoch": 7219} {"train_loss": -26.60199546813965, "global_step": 599184, "epoch": 7219} {"train_loss": -26.627084732055664, "global_step": 599185, "epoch": 7219} {"train_loss": -26.63883399963379, "global_step": 599186, "epoch": 7219} {"train_loss": -27.172922134399414, "global_step": 599187, "epoch": 7219} {"train_loss": -26.734350204467773, "global_step": 599188, "epoch": 7219} {"train_loss": -27.202184677124023, "global_step": 599189, "epoch": 7219} {"train_loss": -27.233306884765625, "global_step": 599190, "epoch": 7219} {"train_loss": -26.854894638061523, "global_step": 599191, "epoch": 7219} {"train_loss": -27.4434757232666, "global_step": 599192, "epoch": 7219} {"train_loss": -26.932783126831055, "global_step": 599193, "epoch": 7219} {"train_loss": -27.154560089111328, "global_step": 599194, "epoch": 7219} {"train_loss": -27.140790939331055, "global_step": 599195, "epoch": 7219} {"train_loss": -27.360654830932617, "global_step": 599196, "epoch": 7219} {"train_loss": -27.025243759155273, "global_step": 599197, "epoch": 7219} {"train_loss": -27.455646514892578, "global_step": 599198, "epoch": 7219} {"train_loss": -27.278242111206055, "global_step": 599199, "epoch": 7219} {"train_loss": -27.36329460144043, "global_step": 599200, "epoch": 7219} {"train_loss": -27.698379516601562, "global_step": 599201, "epoch": 7219} {"train_loss": -27.71441650390625, "global_step": 599202, "epoch": 7219} {"train_loss": -27.717321395874023, "global_step": 599203, "epoch": 7219} {"train_loss": -27.424072265625, "global_step": 599204, "epoch": 7219} {"train_loss": -27.56499671936035, "global_step": 599205, "epoch": 7219} {"train_loss": -27.299047470092773, "global_step": 599206, "epoch": 7219} {"train_loss": -27.477933883666992, "global_step": 599207, "epoch": 7219} {"train_loss": -27.82071876525879, "global_step": 599208, "epoch": 7219} {"train_loss": -27.437732696533203, "global_step": 599209, "epoch": 7219} {"train_loss": -27.67081642150879, "global_step": 599210, "epoch": 7219} {"train_loss": -27.64210319519043, "global_step": 599211, "epoch": 7219} {"train_loss": -27.913930892944336, "global_step": 599212, "epoch": 7219} {"train_loss": -28.04035758972168, "global_step": 599213, "epoch": 7219} {"train_loss": -28.16070556640625, "global_step": 599214, "epoch": 7219} {"train_loss": -27.634735107421875, "global_step": 599215, "epoch": 7219} {"train_loss": -27.81463050842285, "global_step": 599216, "epoch": 7219} {"train_loss": -27.8507137298584, "global_step": 599217, "epoch": 7219} {"train_loss": -27.524595260620117, "global_step": 599218, "epoch": 7219} {"train_loss": -28.167200088500977, "global_step": 599219, "epoch": 7219} {"train_loss": -27.862695693969727, "global_step": 599220, "epoch": 7219} {"train_loss": -28.329153060913086, "global_step": 599221, "epoch": 7219} {"train_loss": -28.330398559570312, "global_step": 599222, "epoch": 7219} {"train_loss": -27.85554313659668, "global_step": 599223, "epoch": 7219} {"train_loss": -28.350854873657227, "global_step": 599224, "epoch": 7219} {"train_loss": -28.269140243530273, "global_step": 599225, "epoch": 7219} {"train_loss": -27.8692684173584, "global_step": 599226, "epoch": 7219} {"train_loss": -28.152149200439453, "global_step": 599227, "epoch": 7219} {"train_loss": -28.149616241455078, "global_step": 599228, "epoch": 7219} {"train_loss": -28.049707412719727, "global_step": 599229, "epoch": 7219} {"train_loss": -28.060361862182617, "global_step": 599230, "epoch": 7219} {"train_loss": -27.575559616088867, "global_step": 599231, "epoch": 7219} {"train_loss": -28.62579345703125, "global_step": 599232, "epoch": 7219} {"train_loss": -28.035181045532227, "global_step": 599233, "epoch": 7219} {"train_loss": -28.523542404174805, "global_step": 599234, "epoch": 7219} {"train_loss": -28.38323974609375, "global_step": 599235, "epoch": 7219} {"train_loss": -28.61625099182129, "global_step": 599236, "epoch": 7219} {"train_loss": -28.294401168823242, "global_step": 599237, "epoch": 7219} {"train_loss": -28.309125900268555, "global_step": 599238, "epoch": 7219} {"train_loss": -28.295820236206055, "global_step": 599239, "epoch": 7219} {"train_loss": -28.547916412353516, "global_step": 599240, "epoch": 7219} {"train_loss": -28.193822860717773, "global_step": 599241, "epoch": 7219} {"train_loss": -28.00189781188965, "global_step": 599242, "epoch": 7219} {"train_loss": -28.10853385925293, "global_step": 599243, "epoch": 7219} {"train_loss": -27.440994262695312, "global_step": 599244, "epoch": 7219} {"train_loss": -27.141714096069336, "global_step": 599245, "epoch": 7219} {"train_loss": -26.7061824798584, "global_step": 599246, "epoch": 7219} {"train_loss": -27.915653228759766, "global_step": 599247, "epoch": 7219} {"train_loss": -28.239099502563477, "global_step": 599248, "epoch": 7219} {"train_loss": -27.92510414123535, "global_step": 599249, "epoch": 7219} {"train_loss": -28.136154174804688, "global_step": 599250, "epoch": 7219} {"train_loss": -27.617948532104492, "global_step": 599251, "epoch": 7219} {"train_loss": -27.658905029296875, "global_step": 599252, "epoch": 7219} {"train_loss": -27.801794052124023, "global_step": 599253, "epoch": 7219} {"train_loss": -27.71382713317871, "global_step": 599254, "epoch": 7219} {"train_loss": -27.738805770874023, "global_step": 599255, "epoch": 7219} {"train_loss": -27.621091842651367, "global_step": 599256, "epoch": 7219} {"train_loss": -27.384033203125, "global_step": 599257, "epoch": 7219} {"train_loss": -27.974878311157227, "global_step": 599258, "epoch": 7219} {"train_loss": -27.52078398738999, "global_step": 599259, "epoch": 7219, "val_loss": 6621861.0} {"train_loss": -26.00661277770996, "global_step": 599260, "epoch": 7220} {"train_loss": -23.818937301635742, "global_step": 599261, "epoch": 7220} {"train_loss": -26.16595458984375, "global_step": 599262, "epoch": 7220} {"train_loss": -25.69266700744629, "global_step": 599263, "epoch": 7220} {"train_loss": -26.683679580688477, "global_step": 599264, "epoch": 7220} {"train_loss": -26.44630241394043, "global_step": 599265, "epoch": 7220} {"train_loss": -26.814985275268555, "global_step": 599266, "epoch": 7220} {"train_loss": -26.206464767456055, "global_step": 599267, "epoch": 7220} {"train_loss": -27.03857421875, "global_step": 599268, "epoch": 7220} {"train_loss": -26.915307998657227, "global_step": 599269, "epoch": 7220} {"train_loss": -26.65382194519043, "global_step": 599270, "epoch": 7220} {"train_loss": -26.72967529296875, "global_step": 599271, "epoch": 7220} {"train_loss": -26.883636474609375, "global_step": 599272, "epoch": 7220} {"train_loss": -27.39068603515625, "global_step": 599273, "epoch": 7220} {"train_loss": -27.12856101989746, "global_step": 599274, "epoch": 7220} {"train_loss": -27.41962242126465, "global_step": 599275, "epoch": 7220} {"train_loss": -27.479339599609375, "global_step": 599276, "epoch": 7220} {"train_loss": -27.350341796875, "global_step": 599277, "epoch": 7220} {"train_loss": -27.30600929260254, "global_step": 599278, "epoch": 7220} {"train_loss": -27.616804122924805, "global_step": 599279, "epoch": 7220} {"train_loss": -27.7315731048584, "global_step": 599280, "epoch": 7220} {"train_loss": -27.155248641967773, "global_step": 599281, "epoch": 7220} {"train_loss": -27.6099796295166, "global_step": 599282, "epoch": 7220} {"train_loss": -27.687910079956055, "global_step": 599283, "epoch": 7220} {"train_loss": -27.678485870361328, "global_step": 599284, "epoch": 7220} {"train_loss": -27.18873405456543, "global_step": 599285, "epoch": 7220} {"train_loss": -27.572879791259766, "global_step": 599286, "epoch": 7220} {"train_loss": -27.7578125, "global_step": 599287, "epoch": 7220} {"train_loss": -28.051244735717773, "global_step": 599288, "epoch": 7220} {"train_loss": -27.454748153686523, "global_step": 599289, "epoch": 7220} {"train_loss": -27.791202545166016, "global_step": 599290, "epoch": 7220} {"train_loss": -27.945011138916016, "global_step": 599291, "epoch": 7220} {"train_loss": -27.999286651611328, "global_step": 599292, "epoch": 7220} {"train_loss": -27.60886573791504, "global_step": 599293, "epoch": 7220} {"train_loss": -27.896411895751953, "global_step": 599294, "epoch": 7220} {"train_loss": -27.904937744140625, "global_step": 599295, "epoch": 7220} {"train_loss": -27.737051010131836, "global_step": 599296, "epoch": 7220} {"train_loss": -28.047443389892578, "global_step": 599297, "epoch": 7220} {"train_loss": -28.234821319580078, "global_step": 599298, "epoch": 7220} {"train_loss": -28.379606246948242, "global_step": 599299, "epoch": 7220} {"train_loss": -28.123920440673828, "global_step": 599300, "epoch": 7220} {"train_loss": -27.726850509643555, "global_step": 599301, "epoch": 7220} {"train_loss": -28.067731857299805, "global_step": 599302, "epoch": 7220} {"train_loss": -27.740234375, "global_step": 599303, "epoch": 7220} {"train_loss": -28.184375762939453, "global_step": 599304, "epoch": 7220} {"train_loss": -28.00587272644043, "global_step": 599305, "epoch": 7220} {"train_loss": -27.795087814331055, "global_step": 599306, "epoch": 7220} {"train_loss": -28.35772705078125, "global_step": 599307, "epoch": 7220} {"train_loss": -28.358978271484375, "global_step": 599308, "epoch": 7220} {"train_loss": -27.936262130737305, "global_step": 599309, "epoch": 7220} {"train_loss": -28.123458862304688, "global_step": 599310, "epoch": 7220} {"train_loss": -28.50348472595215, "global_step": 599311, "epoch": 7220} {"train_loss": -28.095752716064453, "global_step": 599312, "epoch": 7220} {"train_loss": -28.152807235717773, "global_step": 599313, "epoch": 7220} {"train_loss": -28.24198341369629, "global_step": 599314, "epoch": 7220} {"train_loss": -27.903827667236328, "global_step": 599315, "epoch": 7220} {"train_loss": -27.56524658203125, "global_step": 599316, "epoch": 7220} {"train_loss": -27.823078155517578, "global_step": 599317, "epoch": 7220} {"train_loss": -27.57863426208496, "global_step": 599318, "epoch": 7220} {"train_loss": -27.870569229125977, "global_step": 599319, "epoch": 7220} {"train_loss": -27.960315704345703, "global_step": 599320, "epoch": 7220} {"train_loss": -27.813034057617188, "global_step": 599321, "epoch": 7220} {"train_loss": -27.59646987915039, "global_step": 599322, "epoch": 7220} {"train_loss": -27.574249267578125, "global_step": 599323, "epoch": 7220} {"train_loss": -27.614704132080078, "global_step": 599324, "epoch": 7220} {"train_loss": -27.95918083190918, "global_step": 599325, "epoch": 7220} {"train_loss": -28.1663761138916, "global_step": 599326, "epoch": 7220} {"train_loss": -27.803546905517578, "global_step": 599327, "epoch": 7220} {"train_loss": -28.220067977905273, "global_step": 599328, "epoch": 7220} {"train_loss": -27.739561080932617, "global_step": 599329, "epoch": 7220} {"train_loss": -28.0073184967041, "global_step": 599330, "epoch": 7220} {"train_loss": -27.773374557495117, "global_step": 599331, "epoch": 7220} {"train_loss": -27.96710777282715, "global_step": 599332, "epoch": 7220} {"train_loss": -27.874786376953125, "global_step": 599333, "epoch": 7220} {"train_loss": -28.123411178588867, "global_step": 599334, "epoch": 7220} {"train_loss": -27.89495849609375, "global_step": 599335, "epoch": 7220} {"train_loss": -28.24818229675293, "global_step": 599336, "epoch": 7220} {"train_loss": -28.011199951171875, "global_step": 599337, "epoch": 7220} {"train_loss": -28.107654571533203, "global_step": 599338, "epoch": 7220} {"train_loss": -27.91694450378418, "global_step": 599339, "epoch": 7220} {"train_loss": -27.975244522094727, "global_step": 599340, "epoch": 7220} {"train_loss": -28.16462516784668, "global_step": 599341, "epoch": 7220} {"train_loss": -27.616565865206432, "global_step": 599342, "epoch": 7220, "val_loss": 6558053.0} {"train_loss": -27.205137252807617, "global_step": 599343, "epoch": 7221} {"train_loss": -27.652708053588867, "global_step": 599344, "epoch": 7221} {"train_loss": -27.794523239135742, "global_step": 599345, "epoch": 7221} {"train_loss": -27.675363540649414, "global_step": 599346, "epoch": 7221} {"train_loss": -27.496414184570312, "global_step": 599347, "epoch": 7221} {"train_loss": -27.675657272338867, "global_step": 599348, "epoch": 7221} {"train_loss": -27.768890380859375, "global_step": 599349, "epoch": 7221} {"train_loss": -28.170639038085938, "global_step": 599350, "epoch": 7221} {"train_loss": -27.814685821533203, "global_step": 599351, "epoch": 7221} {"train_loss": -27.722681045532227, "global_step": 599352, "epoch": 7221} {"train_loss": -27.7528076171875, "global_step": 599353, "epoch": 7221} {"train_loss": -27.59364891052246, "global_step": 599354, "epoch": 7221} {"train_loss": -27.7206974029541, "global_step": 599355, "epoch": 7221} {"train_loss": -27.982019424438477, "global_step": 599356, "epoch": 7221} {"train_loss": -27.822681427001953, "global_step": 599357, "epoch": 7221} {"train_loss": -27.649524688720703, "global_step": 599358, "epoch": 7221} {"train_loss": -27.792139053344727, "global_step": 599359, "epoch": 7221} {"train_loss": -27.568586349487305, "global_step": 599360, "epoch": 7221} {"train_loss": -28.11964225769043, "global_step": 599361, "epoch": 7221} {"train_loss": -27.912763595581055, "global_step": 599362, "epoch": 7221} {"train_loss": -27.84107780456543, "global_step": 599363, "epoch": 7221} {"train_loss": -27.92172622680664, "global_step": 599364, "epoch": 7221} {"train_loss": -28.159870147705078, "global_step": 599365, "epoch": 7221} {"train_loss": -27.9813232421875, "global_step": 599366, "epoch": 7221} {"train_loss": -27.920270919799805, "global_step": 599367, "epoch": 7221} {"train_loss": -28.105457305908203, "global_step": 599368, "epoch": 7221} {"train_loss": -28.313093185424805, "global_step": 599369, "epoch": 7221} {"train_loss": -28.112548828125, "global_step": 599370, "epoch": 7221} {"train_loss": -27.97247314453125, "global_step": 599371, "epoch": 7221} {"train_loss": -28.001434326171875, "global_step": 599372, "epoch": 7221} {"train_loss": -27.94330406188965, "global_step": 599373, "epoch": 7221} {"train_loss": -27.834320068359375, "global_step": 599374, "epoch": 7221} {"train_loss": -27.660425186157227, "global_step": 599375, "epoch": 7221} {"train_loss": -27.673187255859375, "global_step": 599376, "epoch": 7221} {"train_loss": -27.825672149658203, "global_step": 599377, "epoch": 7221} {"train_loss": -27.906265258789062, "global_step": 599378, "epoch": 7221} {"train_loss": -27.888086318969727, "global_step": 599379, "epoch": 7221} {"train_loss": -27.405933380126953, "global_step": 599380, "epoch": 7221} {"train_loss": -27.443084716796875, "global_step": 599381, "epoch": 7221} {"train_loss": -28.165756225585938, "global_step": 599382, "epoch": 7221} {"train_loss": -27.437808990478516, "global_step": 599383, "epoch": 7221} {"train_loss": -27.914081573486328, "global_step": 599384, "epoch": 7221} {"train_loss": -27.908964157104492, "global_step": 599385, "epoch": 7221} {"train_loss": -27.831838607788086, "global_step": 599386, "epoch": 7221} {"train_loss": -28.033100128173828, "global_step": 599387, "epoch": 7221} {"train_loss": -27.604389190673828, "global_step": 599388, "epoch": 7221} {"train_loss": -28.086313247680664, "global_step": 599389, "epoch": 7221} {"train_loss": -28.049596786499023, "global_step": 599390, "epoch": 7221} {"train_loss": -27.775299072265625, "global_step": 599391, "epoch": 7221} {"train_loss": -27.695127487182617, "global_step": 599392, "epoch": 7221} {"train_loss": -27.32635498046875, "global_step": 599393, "epoch": 7221} {"train_loss": -27.501209259033203, "global_step": 599394, "epoch": 7221} {"train_loss": -28.056726455688477, "global_step": 599395, "epoch": 7221} {"train_loss": -28.2731876373291, "global_step": 599396, "epoch": 7221} {"train_loss": -27.892236709594727, "global_step": 599397, "epoch": 7221} {"train_loss": -28.0256404876709, "global_step": 599398, "epoch": 7221} {"train_loss": -27.933218002319336, "global_step": 599399, "epoch": 7221} {"train_loss": -27.944257736206055, "global_step": 599400, "epoch": 7221} {"train_loss": -27.758893966674805, "global_step": 599401, "epoch": 7221} {"train_loss": -27.883533477783203, "global_step": 599402, "epoch": 7221} {"train_loss": -27.842580795288086, "global_step": 599403, "epoch": 7221} {"train_loss": -27.86419105529785, "global_step": 599404, "epoch": 7221} {"train_loss": -27.937152862548828, "global_step": 599405, "epoch": 7221} {"train_loss": -28.01773452758789, "global_step": 599406, "epoch": 7221} {"train_loss": -28.069849014282227, "global_step": 599407, "epoch": 7221} {"train_loss": -27.92852210998535, "global_step": 599408, "epoch": 7221} {"train_loss": -28.125202178955078, "global_step": 599409, "epoch": 7221} {"train_loss": -28.3388614654541, "global_step": 599410, "epoch": 7221} {"train_loss": -28.424610137939453, "global_step": 599411, "epoch": 7221} {"train_loss": -28.03986930847168, "global_step": 599412, "epoch": 7221} {"train_loss": -28.0168514251709, "global_step": 599413, "epoch": 7221} {"train_loss": -28.234766006469727, "global_step": 599414, "epoch": 7221} {"train_loss": -28.364667892456055, "global_step": 599415, "epoch": 7221} {"train_loss": -27.913991928100586, "global_step": 599416, "epoch": 7221} {"train_loss": -28.449508666992188, "global_step": 599417, "epoch": 7221} {"train_loss": -28.33330726623535, "global_step": 599418, "epoch": 7221} {"train_loss": -28.127033233642578, "global_step": 599419, "epoch": 7221} {"train_loss": -28.617612838745117, "global_step": 599420, "epoch": 7221} {"train_loss": -28.17262840270996, "global_step": 599421, "epoch": 7221} {"train_loss": -28.3795223236084, "global_step": 599422, "epoch": 7221} {"train_loss": -27.988107681274414, "global_step": 599423, "epoch": 7221} {"train_loss": -28.484424591064453, "global_step": 599424, "epoch": 7221} {"train_loss": -27.926077348640167, "global_step": 599425, "epoch": 7221, "val_loss": 6520267.0} {"train_loss": -27.5798397064209, "global_step": 599426, "epoch": 7222} {"train_loss": -26.723825454711914, "global_step": 599427, "epoch": 7222} {"train_loss": -26.469884872436523, "global_step": 599428, "epoch": 7222} {"train_loss": -26.809904098510742, "global_step": 599429, "epoch": 7222} {"train_loss": -27.563995361328125, "global_step": 599430, "epoch": 7222} {"train_loss": -26.48553466796875, "global_step": 599431, "epoch": 7222} {"train_loss": -27.033832550048828, "global_step": 599432, "epoch": 7222} {"train_loss": -27.59051513671875, "global_step": 599433, "epoch": 7222} {"train_loss": -26.949466705322266, "global_step": 599434, "epoch": 7222} {"train_loss": -27.7470645904541, "global_step": 599435, "epoch": 7222} {"train_loss": -27.940637588500977, "global_step": 599436, "epoch": 7222} {"train_loss": -27.661386489868164, "global_step": 599437, "epoch": 7222} {"train_loss": -27.35831069946289, "global_step": 599438, "epoch": 7222} {"train_loss": -27.632110595703125, "global_step": 599439, "epoch": 7222} {"train_loss": -27.931751251220703, "global_step": 599440, "epoch": 7222} {"train_loss": -27.902490615844727, "global_step": 599441, "epoch": 7222} {"train_loss": -27.328277587890625, "global_step": 599442, "epoch": 7222} {"train_loss": -27.493234634399414, "global_step": 599443, "epoch": 7222} {"train_loss": -27.470849990844727, "global_step": 599444, "epoch": 7222} {"train_loss": -27.8475284576416, "global_step": 599445, "epoch": 7222} {"train_loss": -27.572790145874023, "global_step": 599446, "epoch": 7222} {"train_loss": -27.75678062438965, "global_step": 599447, "epoch": 7222} {"train_loss": -28.027856826782227, "global_step": 599448, "epoch": 7222} {"train_loss": -27.620929718017578, "global_step": 599449, "epoch": 7222} {"train_loss": -27.934045791625977, "global_step": 599450, "epoch": 7222} {"train_loss": -27.275136947631836, "global_step": 599451, "epoch": 7222} {"train_loss": -28.146467208862305, "global_step": 599452, "epoch": 7222} {"train_loss": -27.57179832458496, "global_step": 599453, "epoch": 7222} {"train_loss": -28.030902862548828, "global_step": 599454, "epoch": 7222} {"train_loss": -27.72262954711914, "global_step": 599455, "epoch": 7222} {"train_loss": -28.012113571166992, "global_step": 599456, "epoch": 7222} {"train_loss": -26.957883834838867, "global_step": 599457, "epoch": 7222} {"train_loss": -28.29884910583496, "global_step": 599458, "epoch": 7222} {"train_loss": -27.769428253173828, "global_step": 599459, "epoch": 7222} {"train_loss": -28.052734375, "global_step": 599460, "epoch": 7222} {"train_loss": -27.949371337890625, "global_step": 599461, "epoch": 7222} {"train_loss": -27.912464141845703, "global_step": 599462, "epoch": 7222} {"train_loss": -27.691938400268555, "global_step": 599463, "epoch": 7222} {"train_loss": -28.244522094726562, "global_step": 599464, "epoch": 7222} {"train_loss": -27.503326416015625, "global_step": 599465, "epoch": 7222} {"train_loss": -27.915327072143555, "global_step": 599466, "epoch": 7222} {"train_loss": -27.932905197143555, "global_step": 599467, "epoch": 7222} {"train_loss": -28.013940811157227, "global_step": 599468, "epoch": 7222} {"train_loss": -28.019763946533203, "global_step": 599469, "epoch": 7222} {"train_loss": -28.22654151916504, "global_step": 599470, "epoch": 7222} {"train_loss": -27.669492721557617, "global_step": 599471, "epoch": 7222} {"train_loss": -28.12824058532715, "global_step": 599472, "epoch": 7222} {"train_loss": -28.14466667175293, "global_step": 599473, "epoch": 7222} {"train_loss": -28.2128963470459, "global_step": 599474, "epoch": 7222} {"train_loss": -28.00977897644043, "global_step": 599475, "epoch": 7222} {"train_loss": -28.106237411499023, "global_step": 599476, "epoch": 7222} {"train_loss": -28.09771728515625, "global_step": 599477, "epoch": 7222} {"train_loss": -28.329858779907227, "global_step": 599478, "epoch": 7222} {"train_loss": -28.56683349609375, "global_step": 599479, "epoch": 7222} {"train_loss": -28.18198585510254, "global_step": 599480, "epoch": 7222} {"train_loss": -28.535425186157227, "global_step": 599481, "epoch": 7222} {"train_loss": -28.170324325561523, "global_step": 599482, "epoch": 7222} {"train_loss": -27.877166748046875, "global_step": 599483, "epoch": 7222} {"train_loss": -28.26508140563965, "global_step": 599484, "epoch": 7222} {"train_loss": -27.96307945251465, "global_step": 599485, "epoch": 7222} {"train_loss": -28.220630645751953, "global_step": 599486, "epoch": 7222} {"train_loss": -28.018299102783203, "global_step": 599487, "epoch": 7222} {"train_loss": -28.42084312438965, "global_step": 599488, "epoch": 7222} {"train_loss": -27.842004776000977, "global_step": 599489, "epoch": 7222} {"train_loss": -28.193531036376953, "global_step": 599490, "epoch": 7222} {"train_loss": -28.131214141845703, "global_step": 599491, "epoch": 7222} {"train_loss": -28.341577529907227, "global_step": 599492, "epoch": 7222} {"train_loss": -28.456655502319336, "global_step": 599493, "epoch": 7222} {"train_loss": -28.405170440673828, "global_step": 599494, "epoch": 7222} {"train_loss": -28.132917404174805, "global_step": 599495, "epoch": 7222} {"train_loss": -27.91261100769043, "global_step": 599496, "epoch": 7222} {"train_loss": -27.915983200073242, "global_step": 599497, "epoch": 7222} {"train_loss": -27.75953483581543, "global_step": 599498, "epoch": 7222} {"train_loss": -27.856348037719727, "global_step": 599499, "epoch": 7222} {"train_loss": -28.095373153686523, "global_step": 599500, "epoch": 7222} {"train_loss": -28.24616050720215, "global_step": 599501, "epoch": 7222} {"train_loss": -27.794342041015625, "global_step": 599502, "epoch": 7222} {"train_loss": -27.779205322265625, "global_step": 599503, "epoch": 7222} {"train_loss": -27.750146865844727, "global_step": 599504, "epoch": 7222} {"train_loss": -27.94990348815918, "global_step": 599505, "epoch": 7222} {"train_loss": -27.7799129486084, "global_step": 599506, "epoch": 7222} {"train_loss": -28.0498104095459, "global_step": 599507, "epoch": 7222} {"train_loss": -27.8576167233019, "global_step": 599508, "epoch": 7222, "val_loss": 6537761.0} {"train_loss": -27.44883155822754, "global_step": 599509, "epoch": 7223} {"train_loss": -26.66680908203125, "global_step": 599510, "epoch": 7223} {"train_loss": -27.0755672454834, "global_step": 599511, "epoch": 7223} {"train_loss": -27.95669937133789, "global_step": 599512, "epoch": 7223} {"train_loss": -26.741743087768555, "global_step": 599513, "epoch": 7223} {"train_loss": -27.559717178344727, "global_step": 599514, "epoch": 7223} {"train_loss": -27.396825790405273, "global_step": 599515, "epoch": 7223} {"train_loss": -27.541669845581055, "global_step": 599516, "epoch": 7223} {"train_loss": -27.20037841796875, "global_step": 599517, "epoch": 7223} {"train_loss": -27.4610652923584, "global_step": 599518, "epoch": 7223} {"train_loss": -27.448230743408203, "global_step": 599519, "epoch": 7223} {"train_loss": -27.654279708862305, "global_step": 599520, "epoch": 7223} {"train_loss": -27.471282958984375, "global_step": 599521, "epoch": 7223} {"train_loss": -27.102502822875977, "global_step": 599522, "epoch": 7223} {"train_loss": -27.56005859375, "global_step": 599523, "epoch": 7223} {"train_loss": -27.416854858398438, "global_step": 599524, "epoch": 7223} {"train_loss": -27.547122955322266, "global_step": 599525, "epoch": 7223} {"train_loss": -27.254453659057617, "global_step": 599526, "epoch": 7223} {"train_loss": -27.757909774780273, "global_step": 599527, "epoch": 7223} {"train_loss": -28.177255630493164, "global_step": 599528, "epoch": 7223} {"train_loss": -27.514307022094727, "global_step": 599529, "epoch": 7223} {"train_loss": -27.495092391967773, "global_step": 599530, "epoch": 7223} {"train_loss": -27.93622398376465, "global_step": 599531, "epoch": 7223} {"train_loss": -28.00213050842285, "global_step": 599532, "epoch": 7223} {"train_loss": -27.783222198486328, "global_step": 599533, "epoch": 7223} {"train_loss": -27.782873153686523, "global_step": 599534, "epoch": 7223} {"train_loss": -27.481760025024414, "global_step": 599535, "epoch": 7223} {"train_loss": -27.49981117248535, "global_step": 599536, "epoch": 7223} {"train_loss": -27.727828979492188, "global_step": 599537, "epoch": 7223} {"train_loss": -27.828922271728516, "global_step": 599538, "epoch": 7223} {"train_loss": -27.882080078125, "global_step": 599539, "epoch": 7223} {"train_loss": -27.868154525756836, "global_step": 599540, "epoch": 7223} {"train_loss": -27.988269805908203, "global_step": 599541, "epoch": 7223} {"train_loss": -27.62946891784668, "global_step": 599542, "epoch": 7223} {"train_loss": -27.93158531188965, "global_step": 599543, "epoch": 7223} {"train_loss": -28.105863571166992, "global_step": 599544, "epoch": 7223} {"train_loss": -28.33734703063965, "global_step": 599545, "epoch": 7223} {"train_loss": -28.191614151000977, "global_step": 599546, "epoch": 7223} {"train_loss": -28.019775390625, "global_step": 599547, "epoch": 7223} {"train_loss": -27.9478702545166, "global_step": 599548, "epoch": 7223} {"train_loss": -27.927417755126953, "global_step": 599549, "epoch": 7223} {"train_loss": -27.919126510620117, "global_step": 599550, "epoch": 7223} {"train_loss": -27.908369064331055, "global_step": 599551, "epoch": 7223} {"train_loss": -28.51617431640625, "global_step": 599552, "epoch": 7223} {"train_loss": -27.939794540405273, "global_step": 599553, "epoch": 7223} {"train_loss": -27.776947021484375, "global_step": 599554, "epoch": 7223} {"train_loss": -27.629236221313477, "global_step": 599555, "epoch": 7223} {"train_loss": -27.630163192749023, "global_step": 599556, "epoch": 7223} {"train_loss": -27.88496208190918, "global_step": 599557, "epoch": 7223} {"train_loss": -28.048847198486328, "global_step": 599558, "epoch": 7223} {"train_loss": -27.681167602539062, "global_step": 599559, "epoch": 7223} {"train_loss": -27.878149032592773, "global_step": 599560, "epoch": 7223} {"train_loss": -27.967451095581055, "global_step": 599561, "epoch": 7223} {"train_loss": -28.057043075561523, "global_step": 599562, "epoch": 7223} {"train_loss": -27.895278930664062, "global_step": 599563, "epoch": 7223} {"train_loss": -27.689661026000977, "global_step": 599564, "epoch": 7223} {"train_loss": -27.88480567932129, "global_step": 599565, "epoch": 7223} {"train_loss": -27.406147003173828, "global_step": 599566, "epoch": 7223} {"train_loss": -27.974817276000977, "global_step": 599567, "epoch": 7223} {"train_loss": -27.599567413330078, "global_step": 599568, "epoch": 7223} {"train_loss": -28.098867416381836, "global_step": 599569, "epoch": 7223} {"train_loss": -27.77423667907715, "global_step": 599570, "epoch": 7223} {"train_loss": -27.98292350769043, "global_step": 599571, "epoch": 7223} {"train_loss": -27.961313247680664, "global_step": 599572, "epoch": 7223} {"train_loss": -28.339752197265625, "global_step": 599573, "epoch": 7223} {"train_loss": -27.90911293029785, "global_step": 599574, "epoch": 7223} {"train_loss": -28.6275634765625, "global_step": 599575, "epoch": 7223} {"train_loss": -28.011816024780273, "global_step": 599576, "epoch": 7223} {"train_loss": -28.309375762939453, "global_step": 599577, "epoch": 7223} {"train_loss": -28.225650787353516, "global_step": 599578, "epoch": 7223} {"train_loss": -27.64133071899414, "global_step": 599579, "epoch": 7223} {"train_loss": -28.329883575439453, "global_step": 599580, "epoch": 7223} {"train_loss": -27.92923355102539, "global_step": 599581, "epoch": 7223} {"train_loss": -28.200244903564453, "global_step": 599582, "epoch": 7223} {"train_loss": -28.073644638061523, "global_step": 599583, "epoch": 7223} {"train_loss": -27.678647994995117, "global_step": 599584, "epoch": 7223} {"train_loss": -27.72947120666504, "global_step": 599585, "epoch": 7223} {"train_loss": -28.362646102905273, "global_step": 599586, "epoch": 7223} {"train_loss": -28.168033599853516, "global_step": 599587, "epoch": 7223} {"train_loss": -28.088788986206055, "global_step": 599588, "epoch": 7223} {"train_loss": -28.18379020690918, "global_step": 599589, "epoch": 7223} {"train_loss": -28.219324111938477, "global_step": 599590, "epoch": 7223} {"train_loss": -27.820281844541253, "global_step": 599591, "epoch": 7223, "val_loss": 6577402.0} {"train_loss": -27.528610229492188, "global_step": 599592, "epoch": 7224} {"train_loss": -27.55824089050293, "global_step": 599593, "epoch": 7224} {"train_loss": -27.5723819732666, "global_step": 599594, "epoch": 7224} {"train_loss": -27.718067169189453, "global_step": 599595, "epoch": 7224} {"train_loss": -27.4672908782959, "global_step": 599596, "epoch": 7224} {"train_loss": -27.325260162353516, "global_step": 599597, "epoch": 7224} {"train_loss": -27.118078231811523, "global_step": 599598, "epoch": 7224} {"train_loss": -27.21286964416504, "global_step": 599599, "epoch": 7224} {"train_loss": -27.466108322143555, "global_step": 599600, "epoch": 7224} {"train_loss": -26.934417724609375, "global_step": 599601, "epoch": 7224} {"train_loss": -27.374114990234375, "global_step": 599602, "epoch": 7224} {"train_loss": -27.826547622680664, "global_step": 599603, "epoch": 7224} {"train_loss": -27.86870765686035, "global_step": 599604, "epoch": 7224} {"train_loss": -27.566696166992188, "global_step": 599605, "epoch": 7224} {"train_loss": -27.65532875061035, "global_step": 599606, "epoch": 7224} {"train_loss": -27.779401779174805, "global_step": 599607, "epoch": 7224} {"train_loss": -27.806446075439453, "global_step": 599608, "epoch": 7224} {"train_loss": -27.669137954711914, "global_step": 599609, "epoch": 7224} {"train_loss": -27.658987045288086, "global_step": 599610, "epoch": 7224} {"train_loss": -28.00187110900879, "global_step": 599611, "epoch": 7224} {"train_loss": -27.68524169921875, "global_step": 599612, "epoch": 7224} {"train_loss": -27.987274169921875, "global_step": 599613, "epoch": 7224} {"train_loss": -27.974517822265625, "global_step": 599614, "epoch": 7224} {"train_loss": -27.914411544799805, "global_step": 599615, "epoch": 7224} {"train_loss": -28.085004806518555, "global_step": 599616, "epoch": 7224} {"train_loss": -27.821258544921875, "global_step": 599617, "epoch": 7224} {"train_loss": -27.90216636657715, "global_step": 599618, "epoch": 7224} {"train_loss": -27.956159591674805, "global_step": 599619, "epoch": 7224} {"train_loss": -27.945911407470703, "global_step": 599620, "epoch": 7224} {"train_loss": -28.13954734802246, "global_step": 599621, "epoch": 7224} {"train_loss": -27.944013595581055, "global_step": 599622, "epoch": 7224} {"train_loss": -27.987533569335938, "global_step": 599623, "epoch": 7224} {"train_loss": -27.88791847229004, "global_step": 599624, "epoch": 7224} {"train_loss": -28.154327392578125, "global_step": 599625, "epoch": 7224} {"train_loss": -28.119308471679688, "global_step": 599626, "epoch": 7224} {"train_loss": -28.01067543029785, "global_step": 599627, "epoch": 7224} {"train_loss": -28.057825088500977, "global_step": 599628, "epoch": 7224} {"train_loss": -28.2921085357666, "global_step": 599629, "epoch": 7224} {"train_loss": -28.053302764892578, "global_step": 599630, "epoch": 7224} {"train_loss": -28.375219345092773, "global_step": 599631, "epoch": 7224} {"train_loss": -28.087116241455078, "global_step": 599632, "epoch": 7224} {"train_loss": -28.12763023376465, "global_step": 599633, "epoch": 7224} {"train_loss": -28.158039093017578, "global_step": 599634, "epoch": 7224} {"train_loss": -28.371570587158203, "global_step": 599635, "epoch": 7224} {"train_loss": -28.240163803100586, "global_step": 599636, "epoch": 7224} {"train_loss": -28.375768661499023, "global_step": 599637, "epoch": 7224} {"train_loss": -28.178924560546875, "global_step": 599638, "epoch": 7224} {"train_loss": -27.96563148498535, "global_step": 599639, "epoch": 7224} {"train_loss": -28.160634994506836, "global_step": 599640, "epoch": 7224} {"train_loss": -28.3571720123291, "global_step": 599641, "epoch": 7224} {"train_loss": -28.2831974029541, "global_step": 599642, "epoch": 7224} {"train_loss": -27.87506675720215, "global_step": 599643, "epoch": 7224} {"train_loss": -28.438608169555664, "global_step": 599644, "epoch": 7224} {"train_loss": -28.191064834594727, "global_step": 599645, "epoch": 7224} {"train_loss": -28.320371627807617, "global_step": 599646, "epoch": 7224} {"train_loss": -28.622434616088867, "global_step": 599647, "epoch": 7224} {"train_loss": -28.1052188873291, "global_step": 599648, "epoch": 7224} {"train_loss": -28.194711685180664, "global_step": 599649, "epoch": 7224} {"train_loss": -27.792455673217773, "global_step": 599650, "epoch": 7224} {"train_loss": -28.150964736938477, "global_step": 599651, "epoch": 7224} {"train_loss": -28.06587791442871, "global_step": 599652, "epoch": 7224} {"train_loss": -28.165876388549805, "global_step": 599653, "epoch": 7224} {"train_loss": -28.204126358032227, "global_step": 599654, "epoch": 7224} {"train_loss": -27.8677921295166, "global_step": 599655, "epoch": 7224} {"train_loss": -27.85553550720215, "global_step": 599656, "epoch": 7224} {"train_loss": -27.59576416015625, "global_step": 599657, "epoch": 7224} {"train_loss": -27.580896377563477, "global_step": 599658, "epoch": 7224} {"train_loss": -27.453704833984375, "global_step": 599659, "epoch": 7224} {"train_loss": -28.166879653930664, "global_step": 599660, "epoch": 7224} {"train_loss": -28.150938034057617, "global_step": 599661, "epoch": 7224} {"train_loss": -27.841461181640625, "global_step": 599662, "epoch": 7224} {"train_loss": -27.35654067993164, "global_step": 599663, "epoch": 7224} {"train_loss": -27.328720092773438, "global_step": 599664, "epoch": 7224} {"train_loss": -27.44365882873535, "global_step": 599665, "epoch": 7224} {"train_loss": -28.234899520874023, "global_step": 599666, "epoch": 7224} {"train_loss": -27.426349639892578, "global_step": 599667, "epoch": 7224} {"train_loss": -28.09181022644043, "global_step": 599668, "epoch": 7224} {"train_loss": -27.736188888549805, "global_step": 599669, "epoch": 7224} {"train_loss": -28.33112144470215, "global_step": 599670, "epoch": 7224} {"train_loss": -27.811588287353516, "global_step": 599671, "epoch": 7224} {"train_loss": -28.045740127563477, "global_step": 599672, "epoch": 7224} {"train_loss": -27.902088165283203, "global_step": 599673, "epoch": 7224} {"train_loss": -27.899388140942676, "global_step": 599674, "epoch": 7224, "val_loss": 6567073.0} {"train_loss": -27.4163875579834, "global_step": 599675, "epoch": 7225} {"train_loss": -27.758804321289062, "global_step": 599676, "epoch": 7225} {"train_loss": -27.524988174438477, "global_step": 599677, "epoch": 7225} {"train_loss": -26.93519401550293, "global_step": 599678, "epoch": 7225} {"train_loss": -27.155302047729492, "global_step": 599679, "epoch": 7225} {"train_loss": -27.15604019165039, "global_step": 599680, "epoch": 7225} {"train_loss": -27.3977108001709, "global_step": 599681, "epoch": 7225} {"train_loss": -27.728839874267578, "global_step": 599682, "epoch": 7225} {"train_loss": -27.631072998046875, "global_step": 599683, "epoch": 7225} {"train_loss": -27.68265724182129, "global_step": 599684, "epoch": 7225} {"train_loss": -27.405975341796875, "global_step": 599685, "epoch": 7225} {"train_loss": -27.531513214111328, "global_step": 599686, "epoch": 7225} {"train_loss": -27.782886505126953, "global_step": 599687, "epoch": 7225} {"train_loss": -27.505176544189453, "global_step": 599688, "epoch": 7225} {"train_loss": -27.990076065063477, "global_step": 599689, "epoch": 7225} {"train_loss": -27.987104415893555, "global_step": 599690, "epoch": 7225} {"train_loss": -28.1793212890625, "global_step": 599691, "epoch": 7225} {"train_loss": -27.46356773376465, "global_step": 599692, "epoch": 7225} {"train_loss": -27.94135093688965, "global_step": 599693, "epoch": 7225} {"train_loss": -27.63319206237793, "global_step": 599694, "epoch": 7225} {"train_loss": -27.814416885375977, "global_step": 599695, "epoch": 7225} {"train_loss": -27.77962303161621, "global_step": 599696, "epoch": 7225} {"train_loss": -27.847442626953125, "global_step": 599697, "epoch": 7225} {"train_loss": -27.7307071685791, "global_step": 599698, "epoch": 7225} {"train_loss": -28.195898056030273, "global_step": 599699, "epoch": 7225} {"train_loss": -28.072223663330078, "global_step": 599700, "epoch": 7225} {"train_loss": -28.440885543823242, "global_step": 599701, "epoch": 7225} {"train_loss": -27.96480369567871, "global_step": 599702, "epoch": 7225} {"train_loss": -27.782705307006836, "global_step": 599703, "epoch": 7225} {"train_loss": -27.821462631225586, "global_step": 599704, "epoch": 7225} {"train_loss": -27.965238571166992, "global_step": 599705, "epoch": 7225} {"train_loss": -28.317041397094727, "global_step": 599706, "epoch": 7225} {"train_loss": -28.237852096557617, "global_step": 599707, "epoch": 7225} {"train_loss": -27.78741455078125, "global_step": 599708, "epoch": 7225} {"train_loss": -28.252338409423828, "global_step": 599709, "epoch": 7225} {"train_loss": -28.17897605895996, "global_step": 599710, "epoch": 7225} {"train_loss": -28.49239158630371, "global_step": 599711, "epoch": 7225} {"train_loss": -28.16770362854004, "global_step": 599712, "epoch": 7225} {"train_loss": -27.976642608642578, "global_step": 599713, "epoch": 7225} {"train_loss": -28.12592887878418, "global_step": 599714, "epoch": 7225} {"train_loss": -28.1256046295166, "global_step": 599715, "epoch": 7225} {"train_loss": -28.275409698486328, "global_step": 599716, "epoch": 7225} {"train_loss": -28.503854751586914, "global_step": 599717, "epoch": 7225} {"train_loss": -28.2169246673584, "global_step": 599718, "epoch": 7225} {"train_loss": -27.93288230895996, "global_step": 599719, "epoch": 7225} {"train_loss": -28.3653621673584, "global_step": 599720, "epoch": 7225} {"train_loss": -28.172956466674805, "global_step": 599721, "epoch": 7225} {"train_loss": -28.075536727905273, "global_step": 599722, "epoch": 7225} {"train_loss": -28.01416015625, "global_step": 599723, "epoch": 7225} {"train_loss": -28.499561309814453, "global_step": 599724, "epoch": 7225} {"train_loss": -28.34868812561035, "global_step": 599725, "epoch": 7225} {"train_loss": -28.0825138092041, "global_step": 599726, "epoch": 7225} {"train_loss": -27.612226486206055, "global_step": 599727, "epoch": 7225} {"train_loss": -28.0335693359375, "global_step": 599728, "epoch": 7225} {"train_loss": -28.01581382751465, "global_step": 599729, "epoch": 7225} {"train_loss": -27.874258041381836, "global_step": 599730, "epoch": 7225} {"train_loss": -27.91522789001465, "global_step": 599731, "epoch": 7225} {"train_loss": -27.41389274597168, "global_step": 599732, "epoch": 7225} {"train_loss": -28.2227725982666, "global_step": 599733, "epoch": 7225} {"train_loss": -28.175817489624023, "global_step": 599734, "epoch": 7225} {"train_loss": -28.334707260131836, "global_step": 599735, "epoch": 7225} {"train_loss": -28.368249893188477, "global_step": 599736, "epoch": 7225} {"train_loss": -27.996204376220703, "global_step": 599737, "epoch": 7225} {"train_loss": -28.366994857788086, "global_step": 599738, "epoch": 7225} {"train_loss": -27.74921226501465, "global_step": 599739, "epoch": 7225} {"train_loss": -28.132688522338867, "global_step": 599740, "epoch": 7225} {"train_loss": -28.0366153717041, "global_step": 599741, "epoch": 7225} {"train_loss": -28.1759033203125, "global_step": 599742, "epoch": 7225} {"train_loss": -28.091907501220703, "global_step": 599743, "epoch": 7225} {"train_loss": -27.969648361206055, "global_step": 599744, "epoch": 7225} {"train_loss": -28.43592643737793, "global_step": 599745, "epoch": 7225} {"train_loss": -28.1221923828125, "global_step": 599746, "epoch": 7225} {"train_loss": -28.659027099609375, "global_step": 599747, "epoch": 7225} {"train_loss": -28.4759464263916, "global_step": 599748, "epoch": 7225} {"train_loss": -28.132497787475586, "global_step": 599749, "epoch": 7225} {"train_loss": -28.10218620300293, "global_step": 599750, "epoch": 7225} {"train_loss": -27.90046501159668, "global_step": 599751, "epoch": 7225} {"train_loss": -27.909765243530273, "global_step": 599752, "epoch": 7225} {"train_loss": -28.121856689453125, "global_step": 599753, "epoch": 7225} {"train_loss": -27.797239303588867, "global_step": 599754, "epoch": 7225} {"train_loss": -28.05274772644043, "global_step": 599755, "epoch": 7225} {"train_loss": -27.971363067626953, "global_step": 599756, "epoch": 7225} {"train_loss": -27.978430782455995, "global_step": 599757, "epoch": 7225, "val_loss": 6583905.5} {"train_loss": -27.5518798828125, "global_step": 599758, "epoch": 7226} {"train_loss": -26.35175895690918, "global_step": 599759, "epoch": 7226} {"train_loss": -26.0767822265625, "global_step": 599760, "epoch": 7226} {"train_loss": -26.85016441345215, "global_step": 599761, "epoch": 7226} {"train_loss": -27.638671875, "global_step": 599762, "epoch": 7226} {"train_loss": -26.216867446899414, "global_step": 599763, "epoch": 7226} {"train_loss": -27.301794052124023, "global_step": 599764, "epoch": 7226} {"train_loss": -27.027984619140625, "global_step": 599765, "epoch": 7226} {"train_loss": -26.78803825378418, "global_step": 599766, "epoch": 7226} {"train_loss": -27.326339721679688, "global_step": 599767, "epoch": 7226} {"train_loss": -26.773849487304688, "global_step": 599768, "epoch": 7226} {"train_loss": -27.655929565429688, "global_step": 599769, "epoch": 7226} {"train_loss": -26.9302978515625, "global_step": 599770, "epoch": 7226} {"train_loss": -27.663110733032227, "global_step": 599771, "epoch": 7226} {"train_loss": -27.66043472290039, "global_step": 599772, "epoch": 7226} {"train_loss": -27.110986709594727, "global_step": 599773, "epoch": 7226} {"train_loss": -27.737201690673828, "global_step": 599774, "epoch": 7226} {"train_loss": -27.063459396362305, "global_step": 599775, "epoch": 7226} {"train_loss": -27.646137237548828, "global_step": 599776, "epoch": 7226} {"train_loss": -28.162647247314453, "global_step": 599777, "epoch": 7226} {"train_loss": -27.125715255737305, "global_step": 599778, "epoch": 7226} {"train_loss": -27.828271865844727, "global_step": 599779, "epoch": 7226} {"train_loss": -27.436492919921875, "global_step": 599780, "epoch": 7226} {"train_loss": -27.627912521362305, "global_step": 599781, "epoch": 7226} {"train_loss": -27.477935791015625, "global_step": 599782, "epoch": 7226} {"train_loss": -27.481689453125, "global_step": 599783, "epoch": 7226} {"train_loss": -27.733312606811523, "global_step": 599784, "epoch": 7226} {"train_loss": -27.669677734375, "global_step": 599785, "epoch": 7226} {"train_loss": -27.75518798828125, "global_step": 599786, "epoch": 7226} {"train_loss": -27.975305557250977, "global_step": 599787, "epoch": 7226} {"train_loss": -27.8345890045166, "global_step": 599788, "epoch": 7226} {"train_loss": -27.899768829345703, "global_step": 599789, "epoch": 7226} {"train_loss": -27.922657012939453, "global_step": 599790, "epoch": 7226} {"train_loss": -27.359350204467773, "global_step": 599791, "epoch": 7226} {"train_loss": -27.76470375061035, "global_step": 599792, "epoch": 7226} {"train_loss": -28.26080894470215, "global_step": 599793, "epoch": 7226} {"train_loss": -27.772741317749023, "global_step": 599794, "epoch": 7226} {"train_loss": -27.788236618041992, "global_step": 599795, "epoch": 7226} {"train_loss": -28.040237426757812, "global_step": 599796, "epoch": 7226} {"train_loss": -27.93882179260254, "global_step": 599797, "epoch": 7226} {"train_loss": -27.694091796875, "global_step": 599798, "epoch": 7226} {"train_loss": -27.648029327392578, "global_step": 599799, "epoch": 7226} {"train_loss": -27.8743896484375, "global_step": 599800, "epoch": 7226} {"train_loss": -27.39932632446289, "global_step": 599801, "epoch": 7226} {"train_loss": -27.43121337890625, "global_step": 599802, "epoch": 7226} {"train_loss": -27.27155876159668, "global_step": 599803, "epoch": 7226} {"train_loss": -27.279733657836914, "global_step": 599804, "epoch": 7226} {"train_loss": -28.16288185119629, "global_step": 599805, "epoch": 7226} {"train_loss": -27.9317684173584, "global_step": 599806, "epoch": 7226} {"train_loss": -28.05872917175293, "global_step": 599807, "epoch": 7226} {"train_loss": -27.74313735961914, "global_step": 599808, "epoch": 7226} {"train_loss": -28.103235244750977, "global_step": 599809, "epoch": 7226} {"train_loss": -27.52558708190918, "global_step": 599810, "epoch": 7226} {"train_loss": -27.610671997070312, "global_step": 599811, "epoch": 7226} {"train_loss": -28.072921752929688, "global_step": 599812, "epoch": 7226} {"train_loss": -27.950735092163086, "global_step": 599813, "epoch": 7226} {"train_loss": -28.2025146484375, "global_step": 599814, "epoch": 7226} {"train_loss": -28.243915557861328, "global_step": 599815, "epoch": 7226} {"train_loss": -27.763187408447266, "global_step": 599816, "epoch": 7226} {"train_loss": -28.12677001953125, "global_step": 599817, "epoch": 7226} {"train_loss": -28.349212646484375, "global_step": 599818, "epoch": 7226} {"train_loss": -28.286401748657227, "global_step": 599819, "epoch": 7226} {"train_loss": -28.152597427368164, "global_step": 599820, "epoch": 7226} {"train_loss": -28.35096549987793, "global_step": 599821, "epoch": 7226} {"train_loss": -28.353490829467773, "global_step": 599822, "epoch": 7226} {"train_loss": -28.2177677154541, "global_step": 599823, "epoch": 7226} {"train_loss": -28.334197998046875, "global_step": 599824, "epoch": 7226} {"train_loss": -28.45175552368164, "global_step": 599825, "epoch": 7226} {"train_loss": -28.167993545532227, "global_step": 599826, "epoch": 7226} {"train_loss": -27.88047218322754, "global_step": 599827, "epoch": 7226} {"train_loss": -27.822559356689453, "global_step": 599828, "epoch": 7226} {"train_loss": -28.30201530456543, "global_step": 599829, "epoch": 7226} {"train_loss": -28.09136390686035, "global_step": 599830, "epoch": 7226} {"train_loss": -28.267593383789062, "global_step": 599831, "epoch": 7226} {"train_loss": -27.907943725585938, "global_step": 599832, "epoch": 7226} {"train_loss": -28.335805892944336, "global_step": 599833, "epoch": 7226} {"train_loss": -27.82744789123535, "global_step": 599834, "epoch": 7226} {"train_loss": -28.080530166625977, "global_step": 599835, "epoch": 7226} {"train_loss": -28.225645065307617, "global_step": 599836, "epoch": 7226} {"train_loss": -28.129587173461914, "global_step": 599837, "epoch": 7226} {"train_loss": -28.322036743164062, "global_step": 599838, "epoch": 7226} {"train_loss": -27.647724151611328, "global_step": 599839, "epoch": 7226} {"train_loss": -27.73292293318783, "global_step": 599840, "epoch": 7226, "val_loss": 6604157.5} {"train_loss": -27.820343017578125, "global_step": 599841, "epoch": 7227} {"train_loss": -27.3323917388916, "global_step": 599842, "epoch": 7227} {"train_loss": -27.440326690673828, "global_step": 599843, "epoch": 7227} {"train_loss": -27.479536056518555, "global_step": 599844, "epoch": 7227} {"train_loss": -27.711776733398438, "global_step": 599845, "epoch": 7227} {"train_loss": -27.424896240234375, "global_step": 599846, "epoch": 7227} {"train_loss": -27.439359664916992, "global_step": 599847, "epoch": 7227} {"train_loss": -27.619840621948242, "global_step": 599848, "epoch": 7227} {"train_loss": -27.216094970703125, "global_step": 599849, "epoch": 7227} {"train_loss": -27.80096435546875, "global_step": 599850, "epoch": 7227} {"train_loss": -28.0821590423584, "global_step": 599851, "epoch": 7227} {"train_loss": -28.071044921875, "global_step": 599852, "epoch": 7227} {"train_loss": -27.8748779296875, "global_step": 599853, "epoch": 7227} {"train_loss": -27.960891723632812, "global_step": 599854, "epoch": 7227} {"train_loss": -27.84393882751465, "global_step": 599855, "epoch": 7227} {"train_loss": -27.96699333190918, "global_step": 599856, "epoch": 7227} {"train_loss": -27.98029136657715, "global_step": 599857, "epoch": 7227} {"train_loss": -27.907140731811523, "global_step": 599858, "epoch": 7227} {"train_loss": -27.752344131469727, "global_step": 599859, "epoch": 7227} {"train_loss": -27.742467880249023, "global_step": 599860, "epoch": 7227} {"train_loss": -27.81489372253418, "global_step": 599861, "epoch": 7227} {"train_loss": -27.986509323120117, "global_step": 599862, "epoch": 7227} {"train_loss": -27.97153091430664, "global_step": 599863, "epoch": 7227} {"train_loss": -28.198623657226562, "global_step": 599864, "epoch": 7227} {"train_loss": -27.998533248901367, "global_step": 599865, "epoch": 7227} {"train_loss": -28.03400993347168, "global_step": 599866, "epoch": 7227} {"train_loss": -27.640949249267578, "global_step": 599867, "epoch": 7227} {"train_loss": -28.154905319213867, "global_step": 599868, "epoch": 7227} {"train_loss": -27.923858642578125, "global_step": 599869, "epoch": 7227} {"train_loss": -28.20218849182129, "global_step": 599870, "epoch": 7227} {"train_loss": -27.845977783203125, "global_step": 599871, "epoch": 7227} {"train_loss": -27.878793716430664, "global_step": 599872, "epoch": 7227} {"train_loss": -28.157861709594727, "global_step": 599873, "epoch": 7227} {"train_loss": -28.394580841064453, "global_step": 599874, "epoch": 7227} {"train_loss": -28.167810440063477, "global_step": 599875, "epoch": 7227} {"train_loss": -28.091527938842773, "global_step": 599876, "epoch": 7227} {"train_loss": -28.56976890563965, "global_step": 599877, "epoch": 7227} {"train_loss": -28.268817901611328, "global_step": 599878, "epoch": 7227} {"train_loss": -28.34954261779785, "global_step": 599879, "epoch": 7227} {"train_loss": -28.21125602722168, "global_step": 599880, "epoch": 7227} {"train_loss": -28.38226318359375, "global_step": 599881, "epoch": 7227} {"train_loss": -27.889636993408203, "global_step": 599882, "epoch": 7227} {"train_loss": -28.013019561767578, "global_step": 599883, "epoch": 7227} {"train_loss": -27.926233291625977, "global_step": 599884, "epoch": 7227} {"train_loss": -27.855188369750977, "global_step": 599885, "epoch": 7227} {"train_loss": -27.741806030273438, "global_step": 599886, "epoch": 7227} {"train_loss": -28.0240478515625, "global_step": 599887, "epoch": 7227} {"train_loss": -28.10088539123535, "global_step": 599888, "epoch": 7227} {"train_loss": -27.890432357788086, "global_step": 599889, "epoch": 7227} {"train_loss": -28.063657760620117, "global_step": 599890, "epoch": 7227} {"train_loss": -28.068832397460938, "global_step": 599891, "epoch": 7227} {"train_loss": -28.232664108276367, "global_step": 599892, "epoch": 7227} {"train_loss": -28.370441436767578, "global_step": 599893, "epoch": 7227} {"train_loss": -28.058502197265625, "global_step": 599894, "epoch": 7227} {"train_loss": -28.363773345947266, "global_step": 599895, "epoch": 7227} {"train_loss": -28.2703800201416, "global_step": 599896, "epoch": 7227} {"train_loss": -28.401609420776367, "global_step": 599897, "epoch": 7227} {"train_loss": -28.037555694580078, "global_step": 599898, "epoch": 7227} {"train_loss": -28.3791446685791, "global_step": 599899, "epoch": 7227} {"train_loss": -28.235736846923828, "global_step": 599900, "epoch": 7227} {"train_loss": -28.268951416015625, "global_step": 599901, "epoch": 7227} {"train_loss": -28.356592178344727, "global_step": 599902, "epoch": 7227} {"train_loss": -28.11814308166504, "global_step": 599903, "epoch": 7227} {"train_loss": -28.27839469909668, "global_step": 599904, "epoch": 7227} {"train_loss": -28.32377052307129, "global_step": 599905, "epoch": 7227} {"train_loss": -27.969131469726562, "global_step": 599906, "epoch": 7227} {"train_loss": -28.201574325561523, "global_step": 599907, "epoch": 7227} {"train_loss": -28.177417755126953, "global_step": 599908, "epoch": 7227} {"train_loss": -28.420480728149414, "global_step": 599909, "epoch": 7227} {"train_loss": -28.33913230895996, "global_step": 599910, "epoch": 7227} {"train_loss": -28.2210693359375, "global_step": 599911, "epoch": 7227} {"train_loss": -27.802143096923828, "global_step": 599912, "epoch": 7227} {"train_loss": -28.08949089050293, "global_step": 599913, "epoch": 7227} {"train_loss": -27.947595596313477, "global_step": 599914, "epoch": 7227} {"train_loss": -27.581222534179688, "global_step": 599915, "epoch": 7227} {"train_loss": -27.019269943237305, "global_step": 599916, "epoch": 7227} {"train_loss": -27.526914596557617, "global_step": 599917, "epoch": 7227} {"train_loss": -27.396793365478516, "global_step": 599918, "epoch": 7227} {"train_loss": -28.082263946533203, "global_step": 599919, "epoch": 7227} {"train_loss": -27.98737144470215, "global_step": 599920, "epoch": 7227} {"train_loss": -27.739755630493164, "global_step": 599921, "epoch": 7227} {"train_loss": -27.7700138092041, "global_step": 599922, "epoch": 7227} {"train_loss": -28.00164158372994, "global_step": 599923, "epoch": 7227, "val_loss": 6537730.0} {"train_loss": -26.97047996520996, "global_step": 599924, "epoch": 7228} {"train_loss": -27.1420841217041, "global_step": 599925, "epoch": 7228} {"train_loss": -27.877582550048828, "global_step": 599926, "epoch": 7228} {"train_loss": -27.280149459838867, "global_step": 599927, "epoch": 7228} {"train_loss": -27.282201766967773, "global_step": 599928, "epoch": 7228} {"train_loss": -27.71209716796875, "global_step": 599929, "epoch": 7228} {"train_loss": -26.988849639892578, "global_step": 599930, "epoch": 7228} {"train_loss": -27.186431884765625, "global_step": 599931, "epoch": 7228} {"train_loss": -27.575536727905273, "global_step": 599932, "epoch": 7228} {"train_loss": -27.312183380126953, "global_step": 599933, "epoch": 7228} {"train_loss": -27.818151473999023, "global_step": 599934, "epoch": 7228} {"train_loss": -27.548803329467773, "global_step": 599935, "epoch": 7228} {"train_loss": -27.835126876831055, "global_step": 599936, "epoch": 7228} {"train_loss": -27.371875762939453, "global_step": 599937, "epoch": 7228} {"train_loss": -27.64600944519043, "global_step": 599938, "epoch": 7228} {"train_loss": -27.958139419555664, "global_step": 599939, "epoch": 7228} {"train_loss": -27.905364990234375, "global_step": 599940, "epoch": 7228} {"train_loss": -27.446313858032227, "global_step": 599941, "epoch": 7228} {"train_loss": -27.674665451049805, "global_step": 599942, "epoch": 7228} {"train_loss": -28.377363204956055, "global_step": 599943, "epoch": 7228} {"train_loss": -27.953351974487305, "global_step": 599944, "epoch": 7228} {"train_loss": -27.83219337463379, "global_step": 599945, "epoch": 7228} {"train_loss": -27.954395294189453, "global_step": 599946, "epoch": 7228} {"train_loss": -27.84144401550293, "global_step": 599947, "epoch": 7228} {"train_loss": -28.079456329345703, "global_step": 599948, "epoch": 7228} {"train_loss": -27.851682662963867, "global_step": 599949, "epoch": 7228} {"train_loss": -27.839040756225586, "global_step": 599950, "epoch": 7228} {"train_loss": -27.66167640686035, "global_step": 599951, "epoch": 7228} {"train_loss": -27.594165802001953, "global_step": 599952, "epoch": 7228} {"train_loss": -27.9317569732666, "global_step": 599953, "epoch": 7228} {"train_loss": -28.088544845581055, "global_step": 599954, "epoch": 7228} {"train_loss": -28.211767196655273, "global_step": 599955, "epoch": 7228} {"train_loss": -28.01936149597168, "global_step": 599956, "epoch": 7228} {"train_loss": -27.919767379760742, "global_step": 599957, "epoch": 7228} {"train_loss": -28.311908721923828, "global_step": 599958, "epoch": 7228} {"train_loss": -28.02908706665039, "global_step": 599959, "epoch": 7228} {"train_loss": -28.308658599853516, "global_step": 599960, "epoch": 7228} {"train_loss": -28.125497817993164, "global_step": 599961, "epoch": 7228} {"train_loss": -28.244504928588867, "global_step": 599962, "epoch": 7228} {"train_loss": -28.314422607421875, "global_step": 599963, "epoch": 7228} {"train_loss": -28.057449340820312, "global_step": 599964, "epoch": 7228} {"train_loss": -28.3256778717041, "global_step": 599965, "epoch": 7228} {"train_loss": -28.369359970092773, "global_step": 599966, "epoch": 7228} {"train_loss": -28.126676559448242, "global_step": 599967, "epoch": 7228} {"train_loss": -27.962377548217773, "global_step": 599968, "epoch": 7228} {"train_loss": -28.0858154296875, "global_step": 599969, "epoch": 7228} {"train_loss": -28.146636962890625, "global_step": 599970, "epoch": 7228} {"train_loss": -28.364938735961914, "global_step": 599971, "epoch": 7228} {"train_loss": -28.449750900268555, "global_step": 599972, "epoch": 7228} {"train_loss": -28.19806480407715, "global_step": 599973, "epoch": 7228} {"train_loss": -28.334829330444336, "global_step": 599974, "epoch": 7228} {"train_loss": -28.381763458251953, "global_step": 599975, "epoch": 7228} {"train_loss": -28.43552589416504, "global_step": 599976, "epoch": 7228} {"train_loss": -28.314701080322266, "global_step": 599977, "epoch": 7228} {"train_loss": -27.9729061126709, "global_step": 599978, "epoch": 7228} {"train_loss": -28.35384178161621, "global_step": 599979, "epoch": 7228} {"train_loss": -27.9820556640625, "global_step": 599980, "epoch": 7228} {"train_loss": -27.84027671813965, "global_step": 599981, "epoch": 7228} {"train_loss": -28.33896255493164, "global_step": 599982, "epoch": 7228} {"train_loss": -28.144006729125977, "global_step": 599983, "epoch": 7228} {"train_loss": -28.31396484375, "global_step": 599984, "epoch": 7228} {"train_loss": -27.952503204345703, "global_step": 599985, "epoch": 7228} {"train_loss": -28.3013858795166, "global_step": 599986, "epoch": 7228} {"train_loss": -27.83077049255371, "global_step": 599987, "epoch": 7228} {"train_loss": -28.282262802124023, "global_step": 599988, "epoch": 7228} {"train_loss": -28.375028610229492, "global_step": 599989, "epoch": 7228} {"train_loss": -27.6597957611084, "global_step": 599990, "epoch": 7228} {"train_loss": -28.064111709594727, "global_step": 599991, "epoch": 7228} {"train_loss": -28.300683975219727, "global_step": 599992, "epoch": 7228} {"train_loss": -27.807409286499023, "global_step": 599993, "epoch": 7228} {"train_loss": -28.352041244506836, "global_step": 599994, "epoch": 7228} {"train_loss": -28.053070068359375, "global_step": 599995, "epoch": 7228} {"train_loss": -28.20157241821289, "global_step": 599996, "epoch": 7228} {"train_loss": -28.017566680908203, "global_step": 599997, "epoch": 7228} {"train_loss": -28.107641220092773, "global_step": 599998, "epoch": 7228} {"train_loss": -28.268390655517578, "global_step": 599999, "epoch": 7228} {"train_loss": -27.947280883789062, "global_step": 600000, "epoch": 7228} {"train_loss": -28.022367477416992, "global_step": 600001, "epoch": 7228} {"train_loss": -28.35190200805664, "global_step": 600002, "epoch": 7228} {"train_loss": -27.8712158203125, "global_step": 600003, "epoch": 7228} {"train_loss": -27.921085357666016, "global_step": 600004, "epoch": 7228} {"train_loss": -28.4476375579834, "global_step": 600005, "epoch": 7228} {"train_loss": -27.964814565267908, "global_step": 600006, "epoch": 7228, "val_loss": 6565156.0} {"train_loss": -16.05146026611328, "global_step": 600007, "epoch": 7229} {"train_loss": -11.181879997253418, "global_step": 600008, "epoch": 7229} {"train_loss": -23.646839141845703, "global_step": 600009, "epoch": 7229} {"train_loss": -19.346736907958984, "global_step": 600010, "epoch": 7229} {"train_loss": -22.728961944580078, "global_step": 600011, "epoch": 7229} {"train_loss": -23.796985626220703, "global_step": 600012, "epoch": 7229} {"train_loss": -21.314695358276367, "global_step": 600013, "epoch": 7229} {"train_loss": -24.569143295288086, "global_step": 600014, "epoch": 7229} {"train_loss": -25.581741333007812, "global_step": 600015, "epoch": 7229} {"train_loss": -23.75055503845215, "global_step": 600016, "epoch": 7229} {"train_loss": -23.9173641204834, "global_step": 600017, "epoch": 7229} {"train_loss": -25.020654678344727, "global_step": 600018, "epoch": 7229} {"train_loss": -25.134366989135742, "global_step": 600019, "epoch": 7229} {"train_loss": -25.803821563720703, "global_step": 600020, "epoch": 7229} {"train_loss": -25.127222061157227, "global_step": 600021, "epoch": 7229} {"train_loss": -24.97540855407715, "global_step": 600022, "epoch": 7229} {"train_loss": -24.958974838256836, "global_step": 600023, "epoch": 7229} {"train_loss": -25.659626007080078, "global_step": 600024, "epoch": 7229} {"train_loss": -26.130590438842773, "global_step": 600025, "epoch": 7229} {"train_loss": -25.6881160736084, "global_step": 600026, "epoch": 7229} {"train_loss": -25.708398818969727, "global_step": 600027, "epoch": 7229} {"train_loss": -25.954389572143555, "global_step": 600028, "epoch": 7229} {"train_loss": -26.037927627563477, "global_step": 600029, "epoch": 7229} {"train_loss": -25.677148818969727, "global_step": 600030, "epoch": 7229} {"train_loss": -25.79054832458496, "global_step": 600031, "epoch": 7229} {"train_loss": -26.28238868713379, "global_step": 600032, "epoch": 7229} {"train_loss": -26.381071090698242, "global_step": 600033, "epoch": 7229} {"train_loss": -26.612680435180664, "global_step": 600034, "epoch": 7229} {"train_loss": -26.611434936523438, "global_step": 600035, "epoch": 7229} {"train_loss": -26.2946720123291, "global_step": 600036, "epoch": 7229} {"train_loss": -26.61383056640625, "global_step": 600037, "epoch": 7229} {"train_loss": -26.611835479736328, "global_step": 600038, "epoch": 7229} {"train_loss": -26.547021865844727, "global_step": 600039, "epoch": 7229} {"train_loss": -26.391454696655273, "global_step": 600040, "epoch": 7229} {"train_loss": -26.344318389892578, "global_step": 600041, "epoch": 7229} {"train_loss": -26.777591705322266, "global_step": 600042, "epoch": 7229} {"train_loss": -26.951507568359375, "global_step": 600043, "epoch": 7229} {"train_loss": -26.3731689453125, "global_step": 600044, "epoch": 7229} {"train_loss": -27.09368896484375, "global_step": 600045, "epoch": 7229} {"train_loss": -26.637907028198242, "global_step": 600046, "epoch": 7229} {"train_loss": -27.0674991607666, "global_step": 600047, "epoch": 7229} {"train_loss": -27.0880126953125, "global_step": 600048, "epoch": 7229} {"train_loss": -27.01980972290039, "global_step": 600049, "epoch": 7229} {"train_loss": -27.297887802124023, "global_step": 600050, "epoch": 7229} {"train_loss": -26.662439346313477, "global_step": 600051, "epoch": 7229} {"train_loss": -27.135419845581055, "global_step": 600052, "epoch": 7229} {"train_loss": -27.211591720581055, "global_step": 600053, "epoch": 7229} {"train_loss": -27.250354766845703, "global_step": 600054, "epoch": 7229} {"train_loss": -26.96619987487793, "global_step": 600055, "epoch": 7229} {"train_loss": -27.263275146484375, "global_step": 600056, "epoch": 7229} {"train_loss": -27.406614303588867, "global_step": 600057, "epoch": 7229} {"train_loss": -27.38831901550293, "global_step": 600058, "epoch": 7229} {"train_loss": -27.64594841003418, "global_step": 600059, "epoch": 7229} {"train_loss": -27.399688720703125, "global_step": 600060, "epoch": 7229} {"train_loss": -27.47113037109375, "global_step": 600061, "epoch": 7229} {"train_loss": -27.810596466064453, "global_step": 600062, "epoch": 7229} {"train_loss": -27.346914291381836, "global_step": 600063, "epoch": 7229} {"train_loss": -27.748929977416992, "global_step": 600064, "epoch": 7229} {"train_loss": -27.57623863220215, "global_step": 600065, "epoch": 7229} {"train_loss": -27.52949333190918, "global_step": 600066, "epoch": 7229} {"train_loss": -27.30291175842285, "global_step": 600067, "epoch": 7229} {"train_loss": -27.510028839111328, "global_step": 600068, "epoch": 7229} {"train_loss": -27.750226974487305, "global_step": 600069, "epoch": 7229} {"train_loss": -27.3817138671875, "global_step": 600070, "epoch": 7229} {"train_loss": -27.99390983581543, "global_step": 600071, "epoch": 7229} {"train_loss": -28.090234756469727, "global_step": 600072, "epoch": 7229} {"train_loss": -27.952972412109375, "global_step": 600073, "epoch": 7229} {"train_loss": -27.262014389038086, "global_step": 600074, "epoch": 7229} {"train_loss": -27.67542839050293, "global_step": 600075, "epoch": 7229} {"train_loss": -27.95197105407715, "global_step": 600076, "epoch": 7229} {"train_loss": -27.87417984008789, "global_step": 600077, "epoch": 7229} {"train_loss": -27.918298721313477, "global_step": 600078, "epoch": 7229} {"train_loss": -27.83881950378418, "global_step": 600079, "epoch": 7229} {"train_loss": -28.352018356323242, "global_step": 600080, "epoch": 7229} {"train_loss": -27.783716201782227, "global_step": 600081, "epoch": 7229} {"train_loss": -27.92888832092285, "global_step": 600082, "epoch": 7229} {"train_loss": -27.772958755493164, "global_step": 600083, "epoch": 7229} {"train_loss": -27.246234893798828, "global_step": 600084, "epoch": 7229} {"train_loss": -27.267683029174805, "global_step": 600085, "epoch": 7229} {"train_loss": -27.406164169311523, "global_step": 600086, "epoch": 7229} {"train_loss": -27.69537353515625, "global_step": 600087, "epoch": 7229} {"train_loss": -27.4484920501709, "global_step": 600088, "epoch": 7229} {"train_loss": -26.22665987819074, "global_step": 600089, "epoch": 7229, "val_loss": 6541640.0} {"train_loss": -27.206592559814453, "global_step": 600090, "epoch": 7230} {"train_loss": -25.018339157104492, "global_step": 600091, "epoch": 7230} {"train_loss": -26.864337921142578, "global_step": 600092, "epoch": 7230} {"train_loss": -27.189855575561523, "global_step": 600093, "epoch": 7230} {"train_loss": -26.7047119140625, "global_step": 600094, "epoch": 7230} {"train_loss": -27.041608810424805, "global_step": 600095, "epoch": 7230} {"train_loss": -27.057147979736328, "global_step": 600096, "epoch": 7230} {"train_loss": -27.731658935546875, "global_step": 600097, "epoch": 7230} {"train_loss": -26.69718360900879, "global_step": 600098, "epoch": 7230} {"train_loss": -27.563201904296875, "global_step": 600099, "epoch": 7230} {"train_loss": -27.046146392822266, "global_step": 600100, "epoch": 7230} {"train_loss": -27.682233810424805, "global_step": 600101, "epoch": 7230} {"train_loss": -27.1200008392334, "global_step": 600102, "epoch": 7230} {"train_loss": -27.500635147094727, "global_step": 600103, "epoch": 7230} {"train_loss": -27.40935707092285, "global_step": 600104, "epoch": 7230} {"train_loss": -27.796283721923828, "global_step": 600105, "epoch": 7230} {"train_loss": -27.388952255249023, "global_step": 600106, "epoch": 7230} {"train_loss": -27.349943161010742, "global_step": 600107, "epoch": 7230} {"train_loss": -27.501728057861328, "global_step": 600108, "epoch": 7230} {"train_loss": -27.178754806518555, "global_step": 600109, "epoch": 7230} {"train_loss": -27.19146728515625, "global_step": 600110, "epoch": 7230} {"train_loss": -27.17300796508789, "global_step": 600111, "epoch": 7230} {"train_loss": -27.151037216186523, "global_step": 600112, "epoch": 7230} {"train_loss": -27.737945556640625, "global_step": 600113, "epoch": 7230} {"train_loss": -27.55523681640625, "global_step": 600114, "epoch": 7230} {"train_loss": -27.571430206298828, "global_step": 600115, "epoch": 7230} {"train_loss": -27.547948837280273, "global_step": 600116, "epoch": 7230} {"train_loss": -27.53069496154785, "global_step": 600117, "epoch": 7230} {"train_loss": -27.44095802307129, "global_step": 600118, "epoch": 7230} {"train_loss": -27.1397647857666, "global_step": 600119, "epoch": 7230} {"train_loss": -27.192068099975586, "global_step": 600120, "epoch": 7230} {"train_loss": -28.037139892578125, "global_step": 600121, "epoch": 7230} {"train_loss": -27.492246627807617, "global_step": 600122, "epoch": 7230} {"train_loss": -27.9765625, "global_step": 600123, "epoch": 7230} {"train_loss": -27.662641525268555, "global_step": 600124, "epoch": 7230} {"train_loss": -27.970966339111328, "global_step": 600125, "epoch": 7230} {"train_loss": -27.8080997467041, "global_step": 600126, "epoch": 7230} {"train_loss": -27.6458683013916, "global_step": 600127, "epoch": 7230} {"train_loss": -27.749149322509766, "global_step": 600128, "epoch": 7230} {"train_loss": -27.54538345336914, "global_step": 600129, "epoch": 7230} {"train_loss": -27.722394943237305, "global_step": 600130, "epoch": 7230} {"train_loss": -27.83011245727539, "global_step": 600131, "epoch": 7230} {"train_loss": -28.082406997680664, "global_step": 600132, "epoch": 7230} {"train_loss": -27.4089412689209, "global_step": 600133, "epoch": 7230} {"train_loss": -27.940509796142578, "global_step": 600134, "epoch": 7230} {"train_loss": -27.836511611938477, "global_step": 600135, "epoch": 7230} {"train_loss": -28.1037654876709, "global_step": 600136, "epoch": 7230} {"train_loss": -27.99220085144043, "global_step": 600137, "epoch": 7230} {"train_loss": -27.7608585357666, "global_step": 600138, "epoch": 7230} {"train_loss": -28.277990341186523, "global_step": 600139, "epoch": 7230} {"train_loss": -27.84943199157715, "global_step": 600140, "epoch": 7230} {"train_loss": -27.760761260986328, "global_step": 600141, "epoch": 7230} {"train_loss": -28.04359245300293, "global_step": 600142, "epoch": 7230} {"train_loss": -27.98150634765625, "global_step": 600143, "epoch": 7230} {"train_loss": -27.9831600189209, "global_step": 600144, "epoch": 7230} {"train_loss": -28.058298110961914, "global_step": 600145, "epoch": 7230} {"train_loss": -28.226505279541016, "global_step": 600146, "epoch": 7230} {"train_loss": -28.117834091186523, "global_step": 600147, "epoch": 7230} {"train_loss": -28.217023849487305, "global_step": 600148, "epoch": 7230} {"train_loss": -28.156461715698242, "global_step": 600149, "epoch": 7230} {"train_loss": -27.80829429626465, "global_step": 600150, "epoch": 7230} {"train_loss": -28.1009578704834, "global_step": 600151, "epoch": 7230} {"train_loss": -28.073965072631836, "global_step": 600152, "epoch": 7230} {"train_loss": -28.23365592956543, "global_step": 600153, "epoch": 7230} {"train_loss": -28.074140548706055, "global_step": 600154, "epoch": 7230} {"train_loss": -27.881927490234375, "global_step": 600155, "epoch": 7230} {"train_loss": -28.016098022460938, "global_step": 600156, "epoch": 7230} {"train_loss": -27.904083251953125, "global_step": 600157, "epoch": 7230} {"train_loss": -28.018024444580078, "global_step": 600158, "epoch": 7230} {"train_loss": -28.382238388061523, "global_step": 600159, "epoch": 7230} {"train_loss": -27.787033081054688, "global_step": 600160, "epoch": 7230} {"train_loss": -28.03759765625, "global_step": 600161, "epoch": 7230} {"train_loss": -28.109699249267578, "global_step": 600162, "epoch": 7230} {"train_loss": -27.98029136657715, "global_step": 600163, "epoch": 7230} {"train_loss": -28.1501407623291, "global_step": 600164, "epoch": 7230} {"train_loss": -27.972455978393555, "global_step": 600165, "epoch": 7230} {"train_loss": -27.89228630065918, "global_step": 600166, "epoch": 7230} {"train_loss": -27.710071563720703, "global_step": 600167, "epoch": 7230} {"train_loss": -27.948938369750977, "global_step": 600168, "epoch": 7230} {"train_loss": -28.095020294189453, "global_step": 600169, "epoch": 7230} {"train_loss": -28.110876083374023, "global_step": 600170, "epoch": 7230} {"train_loss": -28.510751724243164, "global_step": 600171, "epoch": 7230} {"train_loss": -27.703306404941053, "global_step": 600172, "epoch": 7230, "val_loss": 6506999.0} {"train_loss": -25.97614097595215, "global_step": 600173, "epoch": 7231} {"train_loss": -26.177661895751953, "global_step": 600174, "epoch": 7231} {"train_loss": -26.801435470581055, "global_step": 600175, "epoch": 7231} {"train_loss": -26.15974235534668, "global_step": 600176, "epoch": 7231} {"train_loss": -27.13604164123535, "global_step": 600177, "epoch": 7231} {"train_loss": -26.8288516998291, "global_step": 600178, "epoch": 7231} {"train_loss": -26.926183700561523, "global_step": 600179, "epoch": 7231} {"train_loss": -27.31007194519043, "global_step": 600180, "epoch": 7231} {"train_loss": -27.049482345581055, "global_step": 600181, "epoch": 7231} {"train_loss": -27.18787956237793, "global_step": 600182, "epoch": 7231} {"train_loss": -27.34083366394043, "global_step": 600183, "epoch": 7231} {"train_loss": -27.1238956451416, "global_step": 600184, "epoch": 7231} {"train_loss": -27.42365074157715, "global_step": 600185, "epoch": 7231} {"train_loss": -27.546680450439453, "global_step": 600186, "epoch": 7231} {"train_loss": -27.52800941467285, "global_step": 600187, "epoch": 7231} {"train_loss": -27.659381866455078, "global_step": 600188, "epoch": 7231} {"train_loss": -27.316333770751953, "global_step": 600189, "epoch": 7231} {"train_loss": -27.4833984375, "global_step": 600190, "epoch": 7231} {"train_loss": -27.25038719177246, "global_step": 600191, "epoch": 7231} {"train_loss": -27.85907554626465, "global_step": 600192, "epoch": 7231} {"train_loss": -27.108627319335938, "global_step": 600193, "epoch": 7231} {"train_loss": -27.769323348999023, "global_step": 600194, "epoch": 7231} {"train_loss": -27.82708168029785, "global_step": 600195, "epoch": 7231} {"train_loss": -27.600461959838867, "global_step": 600196, "epoch": 7231} {"train_loss": -27.86890983581543, "global_step": 600197, "epoch": 7231} {"train_loss": -27.75360107421875, "global_step": 600198, "epoch": 7231} {"train_loss": -27.7895450592041, "global_step": 600199, "epoch": 7231} {"train_loss": -27.807851791381836, "global_step": 600200, "epoch": 7231} {"train_loss": -27.855133056640625, "global_step": 600201, "epoch": 7231} {"train_loss": -27.822996139526367, "global_step": 600202, "epoch": 7231} {"train_loss": -27.904516220092773, "global_step": 600203, "epoch": 7231} {"train_loss": -28.234045028686523, "global_step": 600204, "epoch": 7231} {"train_loss": -28.057004928588867, "global_step": 600205, "epoch": 7231} {"train_loss": -27.96660804748535, "global_step": 600206, "epoch": 7231} {"train_loss": -27.920515060424805, "global_step": 600207, "epoch": 7231} {"train_loss": -27.816999435424805, "global_step": 600208, "epoch": 7231} {"train_loss": -28.307035446166992, "global_step": 600209, "epoch": 7231} {"train_loss": -27.863065719604492, "global_step": 600210, "epoch": 7231} {"train_loss": -28.091413497924805, "global_step": 600211, "epoch": 7231} {"train_loss": -27.924341201782227, "global_step": 600212, "epoch": 7231} {"train_loss": -27.98032569885254, "global_step": 600213, "epoch": 7231} {"train_loss": -28.18220329284668, "global_step": 600214, "epoch": 7231} {"train_loss": -28.120126724243164, "global_step": 600215, "epoch": 7231} {"train_loss": -28.205646514892578, "global_step": 600216, "epoch": 7231} {"train_loss": -28.14692497253418, "global_step": 600217, "epoch": 7231} {"train_loss": -28.190290451049805, "global_step": 600218, "epoch": 7231} {"train_loss": -28.054014205932617, "global_step": 600219, "epoch": 7231} {"train_loss": -28.15150260925293, "global_step": 600220, "epoch": 7231} {"train_loss": -28.1818790435791, "global_step": 600221, "epoch": 7231} {"train_loss": -27.8349609375, "global_step": 600222, "epoch": 7231} {"train_loss": -28.16805076599121, "global_step": 600223, "epoch": 7231} {"train_loss": -28.300016403198242, "global_step": 600224, "epoch": 7231} {"train_loss": -28.126867294311523, "global_step": 600225, "epoch": 7231} {"train_loss": -28.278671264648438, "global_step": 600226, "epoch": 7231} {"train_loss": -28.290802001953125, "global_step": 600227, "epoch": 7231} {"train_loss": -28.27937126159668, "global_step": 600228, "epoch": 7231} {"train_loss": -28.3795108795166, "global_step": 600229, "epoch": 7231} {"train_loss": -28.425382614135742, "global_step": 600230, "epoch": 7231} {"train_loss": -28.056482315063477, "global_step": 600231, "epoch": 7231} {"train_loss": -28.405378341674805, "global_step": 600232, "epoch": 7231} {"train_loss": -28.1019229888916, "global_step": 600233, "epoch": 7231} {"train_loss": -28.302778244018555, "global_step": 600234, "epoch": 7231} {"train_loss": -28.42812156677246, "global_step": 600235, "epoch": 7231} {"train_loss": -28.33034324645996, "global_step": 600236, "epoch": 7231} {"train_loss": -28.50119972229004, "global_step": 600237, "epoch": 7231} {"train_loss": -27.9134464263916, "global_step": 600238, "epoch": 7231} {"train_loss": -27.991613388061523, "global_step": 600239, "epoch": 7231} {"train_loss": -27.934741973876953, "global_step": 600240, "epoch": 7231} {"train_loss": -28.010807037353516, "global_step": 600241, "epoch": 7231} {"train_loss": -28.1374454498291, "global_step": 600242, "epoch": 7231} {"train_loss": -28.124128341674805, "global_step": 600243, "epoch": 7231} {"train_loss": -27.924182891845703, "global_step": 600244, "epoch": 7231} {"train_loss": -28.223739624023438, "global_step": 600245, "epoch": 7231} {"train_loss": -28.317657470703125, "global_step": 600246, "epoch": 7231} {"train_loss": -27.598419189453125, "global_step": 600247, "epoch": 7231} {"train_loss": -27.660694122314453, "global_step": 600248, "epoch": 7231} {"train_loss": -28.133264541625977, "global_step": 600249, "epoch": 7231} {"train_loss": -28.013660430908203, "global_step": 600250, "epoch": 7231} {"train_loss": -27.90155601501465, "global_step": 600251, "epoch": 7231} {"train_loss": -27.859827041625977, "global_step": 600252, "epoch": 7231} {"train_loss": -27.9261474609375, "global_step": 600253, "epoch": 7231} {"train_loss": -28.037067413330078, "global_step": 600254, "epoch": 7231} {"train_loss": -27.798076307917217, "global_step": 600255, "epoch": 7231, "val_loss": 6570350.0} {"train_loss": -26.52229118347168, "global_step": 600256, "epoch": 7232} {"train_loss": -26.5096492767334, "global_step": 600257, "epoch": 7232} {"train_loss": -26.69182777404785, "global_step": 600258, "epoch": 7232} {"train_loss": -26.585729598999023, "global_step": 600259, "epoch": 7232} {"train_loss": -27.458545684814453, "global_step": 600260, "epoch": 7232} {"train_loss": -27.16265296936035, "global_step": 600261, "epoch": 7232} {"train_loss": -27.179813385009766, "global_step": 600262, "epoch": 7232} {"train_loss": -27.164642333984375, "global_step": 600263, "epoch": 7232} {"train_loss": -27.7779541015625, "global_step": 600264, "epoch": 7232} {"train_loss": -27.147342681884766, "global_step": 600265, "epoch": 7232} {"train_loss": -27.727039337158203, "global_step": 600266, "epoch": 7232} {"train_loss": -26.855920791625977, "global_step": 600267, "epoch": 7232} {"train_loss": -27.398635864257812, "global_step": 600268, "epoch": 7232} {"train_loss": -27.75934410095215, "global_step": 600269, "epoch": 7232} {"train_loss": -27.245075225830078, "global_step": 600270, "epoch": 7232} {"train_loss": -27.728185653686523, "global_step": 600271, "epoch": 7232} {"train_loss": -27.860748291015625, "global_step": 600272, "epoch": 7232} {"train_loss": -27.317209243774414, "global_step": 600273, "epoch": 7232} {"train_loss": -27.288898468017578, "global_step": 600274, "epoch": 7232} {"train_loss": -27.691919326782227, "global_step": 600275, "epoch": 7232} {"train_loss": -27.164997100830078, "global_step": 600276, "epoch": 7232} {"train_loss": -27.526235580444336, "global_step": 600277, "epoch": 7232} {"train_loss": -28.030725479125977, "global_step": 600278, "epoch": 7232} {"train_loss": -27.7042236328125, "global_step": 600279, "epoch": 7232} {"train_loss": -28.00178337097168, "global_step": 600280, "epoch": 7232} {"train_loss": -27.937116622924805, "global_step": 600281, "epoch": 7232} {"train_loss": -28.091415405273438, "global_step": 600282, "epoch": 7232} {"train_loss": -27.837631225585938, "global_step": 600283, "epoch": 7232} {"train_loss": -27.912633895874023, "global_step": 600284, "epoch": 7232} {"train_loss": -28.0537166595459, "global_step": 600285, "epoch": 7232} {"train_loss": -27.775297164916992, "global_step": 600286, "epoch": 7232} {"train_loss": -27.95907974243164, "global_step": 600287, "epoch": 7232} {"train_loss": -27.870588302612305, "global_step": 600288, "epoch": 7232} {"train_loss": -27.994897842407227, "global_step": 600289, "epoch": 7232} {"train_loss": -27.88996696472168, "global_step": 600290, "epoch": 7232} {"train_loss": -27.854278564453125, "global_step": 600291, "epoch": 7232} {"train_loss": -27.92671775817871, "global_step": 600292, "epoch": 7232} {"train_loss": -28.057783126831055, "global_step": 600293, "epoch": 7232} {"train_loss": -27.914960861206055, "global_step": 600294, "epoch": 7232} {"train_loss": -28.372343063354492, "global_step": 600295, "epoch": 7232} {"train_loss": -27.856245040893555, "global_step": 600296, "epoch": 7232} {"train_loss": -28.01187515258789, "global_step": 600297, "epoch": 7232} {"train_loss": -27.712289810180664, "global_step": 600298, "epoch": 7232} {"train_loss": -28.130050659179688, "global_step": 600299, "epoch": 7232} {"train_loss": -28.238691329956055, "global_step": 600300, "epoch": 7232} {"train_loss": -27.6749210357666, "global_step": 600301, "epoch": 7232} {"train_loss": -27.980627059936523, "global_step": 600302, "epoch": 7232} {"train_loss": -28.06134605407715, "global_step": 600303, "epoch": 7232} {"train_loss": -28.081037521362305, "global_step": 600304, "epoch": 7232} {"train_loss": -28.377126693725586, "global_step": 600305, "epoch": 7232} {"train_loss": -28.089323043823242, "global_step": 600306, "epoch": 7232} {"train_loss": -28.031423568725586, "global_step": 600307, "epoch": 7232} {"train_loss": -27.914722442626953, "global_step": 600308, "epoch": 7232} {"train_loss": -28.411962509155273, "global_step": 600309, "epoch": 7232} {"train_loss": -28.262022018432617, "global_step": 600310, "epoch": 7232} {"train_loss": -28.2431697845459, "global_step": 600311, "epoch": 7232} {"train_loss": -28.03318214416504, "global_step": 600312, "epoch": 7232} {"train_loss": -27.879901885986328, "global_step": 600313, "epoch": 7232} {"train_loss": -27.547910690307617, "global_step": 600314, "epoch": 7232} {"train_loss": -27.44337272644043, "global_step": 600315, "epoch": 7232} {"train_loss": -28.32157325744629, "global_step": 600316, "epoch": 7232} {"train_loss": -27.372583389282227, "global_step": 600317, "epoch": 7232} {"train_loss": -27.308095932006836, "global_step": 600318, "epoch": 7232} {"train_loss": -27.70542335510254, "global_step": 600319, "epoch": 7232} {"train_loss": -27.87897300720215, "global_step": 600320, "epoch": 7232} {"train_loss": -27.44806480407715, "global_step": 600321, "epoch": 7232} {"train_loss": -27.821517944335938, "global_step": 600322, "epoch": 7232} {"train_loss": -27.864715576171875, "global_step": 600323, "epoch": 7232} {"train_loss": -27.412128448486328, "global_step": 600324, "epoch": 7232} {"train_loss": -28.198328018188477, "global_step": 600325, "epoch": 7232} {"train_loss": -27.534671783447266, "global_step": 600326, "epoch": 7232} {"train_loss": -28.049362182617188, "global_step": 600327, "epoch": 7232} {"train_loss": -27.703723907470703, "global_step": 600328, "epoch": 7232} {"train_loss": -28.036529541015625, "global_step": 600329, "epoch": 7232} {"train_loss": -28.19110679626465, "global_step": 600330, "epoch": 7232} {"train_loss": -27.797576904296875, "global_step": 600331, "epoch": 7232} {"train_loss": -27.7376651763916, "global_step": 600332, "epoch": 7232} {"train_loss": -28.074819564819336, "global_step": 600333, "epoch": 7232} {"train_loss": -28.172809600830078, "global_step": 600334, "epoch": 7232} {"train_loss": -28.231184005737305, "global_step": 600335, "epoch": 7232} {"train_loss": -28.11580467224121, "global_step": 600336, "epoch": 7232} {"train_loss": -27.780221939086914, "global_step": 600337, "epoch": 7232} {"train_loss": -27.77080163610987, "global_step": 600338, "epoch": 7232, "val_loss": 6480719.0} {"train_loss": -26.058242797851562, "global_step": 600339, "epoch": 7233} {"train_loss": -27.23858070373535, "global_step": 600340, "epoch": 7233} {"train_loss": -27.00544548034668, "global_step": 600341, "epoch": 7233} {"train_loss": -26.811216354370117, "global_step": 600342, "epoch": 7233} {"train_loss": -26.91739273071289, "global_step": 600343, "epoch": 7233} {"train_loss": -27.06202507019043, "global_step": 600344, "epoch": 7233} {"train_loss": -26.893585205078125, "global_step": 600345, "epoch": 7233} {"train_loss": -27.35590934753418, "global_step": 600346, "epoch": 7233} {"train_loss": -27.638507843017578, "global_step": 600347, "epoch": 7233} {"train_loss": -27.288114547729492, "global_step": 600348, "epoch": 7233} {"train_loss": -27.355070114135742, "global_step": 600349, "epoch": 7233} {"train_loss": -26.938861846923828, "global_step": 600350, "epoch": 7233} {"train_loss": -27.320104598999023, "global_step": 600351, "epoch": 7233} {"train_loss": -26.927265167236328, "global_step": 600352, "epoch": 7233} {"train_loss": -27.21241569519043, "global_step": 600353, "epoch": 7233} {"train_loss": -27.2089786529541, "global_step": 600354, "epoch": 7233} {"train_loss": -27.351947784423828, "global_step": 600355, "epoch": 7233} {"train_loss": -27.55916404724121, "global_step": 600356, "epoch": 7233} {"train_loss": -27.397445678710938, "global_step": 600357, "epoch": 7233} {"train_loss": -27.504880905151367, "global_step": 600358, "epoch": 7233} {"train_loss": -27.816394805908203, "global_step": 600359, "epoch": 7233} {"train_loss": -27.643781661987305, "global_step": 600360, "epoch": 7233} {"train_loss": -27.857318878173828, "global_step": 600361, "epoch": 7233} {"train_loss": -27.818098068237305, "global_step": 600362, "epoch": 7233} {"train_loss": -27.597034454345703, "global_step": 600363, "epoch": 7233} {"train_loss": -27.932592391967773, "global_step": 600364, "epoch": 7233} {"train_loss": -27.861997604370117, "global_step": 600365, "epoch": 7233} {"train_loss": -27.730634689331055, "global_step": 600366, "epoch": 7233} {"train_loss": -27.874303817749023, "global_step": 600367, "epoch": 7233} {"train_loss": -27.523761749267578, "global_step": 600368, "epoch": 7233} {"train_loss": -28.15962028503418, "global_step": 600369, "epoch": 7233} {"train_loss": -27.940216064453125, "global_step": 600370, "epoch": 7233} {"train_loss": -27.983152389526367, "global_step": 600371, "epoch": 7233} {"train_loss": -28.07387351989746, "global_step": 600372, "epoch": 7233} {"train_loss": -27.868743896484375, "global_step": 600373, "epoch": 7233} {"train_loss": -28.065176010131836, "global_step": 600374, "epoch": 7233} {"train_loss": -27.9909725189209, "global_step": 600375, "epoch": 7233} {"train_loss": -28.121381759643555, "global_step": 600376, "epoch": 7233} {"train_loss": -28.069812774658203, "global_step": 600377, "epoch": 7233} {"train_loss": -28.020709991455078, "global_step": 600378, "epoch": 7233} {"train_loss": -28.165180206298828, "global_step": 600379, "epoch": 7233} {"train_loss": -27.97412109375, "global_step": 600380, "epoch": 7233} {"train_loss": -28.25306510925293, "global_step": 600381, "epoch": 7233} {"train_loss": -28.1462345123291, "global_step": 600382, "epoch": 7233} {"train_loss": -28.233983993530273, "global_step": 600383, "epoch": 7233} {"train_loss": -28.43257713317871, "global_step": 600384, "epoch": 7233} {"train_loss": -28.62989616394043, "global_step": 600385, "epoch": 7233} {"train_loss": -28.180784225463867, "global_step": 600386, "epoch": 7233} {"train_loss": -27.84685707092285, "global_step": 600387, "epoch": 7233} {"train_loss": -28.118972778320312, "global_step": 600388, "epoch": 7233} {"train_loss": -27.8166446685791, "global_step": 600389, "epoch": 7233} {"train_loss": -28.275806427001953, "global_step": 600390, "epoch": 7233} {"train_loss": -27.709747314453125, "global_step": 600391, "epoch": 7233} {"train_loss": -27.968564987182617, "global_step": 600392, "epoch": 7233} {"train_loss": -28.083044052124023, "global_step": 600393, "epoch": 7233} {"train_loss": -28.068817138671875, "global_step": 600394, "epoch": 7233} {"train_loss": -27.791248321533203, "global_step": 600395, "epoch": 7233} {"train_loss": -28.39361000061035, "global_step": 600396, "epoch": 7233} {"train_loss": -27.907520294189453, "global_step": 600397, "epoch": 7233} {"train_loss": -27.93141746520996, "global_step": 600398, "epoch": 7233} {"train_loss": -28.066089630126953, "global_step": 600399, "epoch": 7233} {"train_loss": -27.8790340423584, "global_step": 600400, "epoch": 7233} {"train_loss": -27.68417739868164, "global_step": 600401, "epoch": 7233} {"train_loss": -28.034164428710938, "global_step": 600402, "epoch": 7233} {"train_loss": -28.083784103393555, "global_step": 600403, "epoch": 7233} {"train_loss": -27.413068771362305, "global_step": 600404, "epoch": 7233} {"train_loss": -27.882843017578125, "global_step": 600405, "epoch": 7233} {"train_loss": -27.871109008789062, "global_step": 600406, "epoch": 7233} {"train_loss": -27.727842330932617, "global_step": 600407, "epoch": 7233} {"train_loss": -27.760297775268555, "global_step": 600408, "epoch": 7233} {"train_loss": -28.113157272338867, "global_step": 600409, "epoch": 7233} {"train_loss": -27.90081787109375, "global_step": 600410, "epoch": 7233} {"train_loss": -27.651294708251953, "global_step": 600411, "epoch": 7233} {"train_loss": -27.858936309814453, "global_step": 600412, "epoch": 7233} {"train_loss": -28.003570556640625, "global_step": 600413, "epoch": 7233} {"train_loss": -27.976043701171875, "global_step": 600414, "epoch": 7233} {"train_loss": -28.128332138061523, "global_step": 600415, "epoch": 7233} {"train_loss": -28.057117462158203, "global_step": 600416, "epoch": 7233} {"train_loss": -28.194486618041992, "global_step": 600417, "epoch": 7233} {"train_loss": -27.726667404174805, "global_step": 600418, "epoch": 7233} {"train_loss": -27.859411239624023, "global_step": 600419, "epoch": 7233} {"train_loss": -28.26875114440918, "global_step": 600420, "epoch": 7233} {"train_loss": -27.772684901593678, "global_step": 600421, "epoch": 7233, "val_loss": 6536640.0} {"train_loss": -27.588842391967773, "global_step": 600422, "epoch": 7234} {"train_loss": -27.8404483795166, "global_step": 600423, "epoch": 7234} {"train_loss": -27.690824508666992, "global_step": 600424, "epoch": 7234} {"train_loss": -27.8768310546875, "global_step": 600425, "epoch": 7234} {"train_loss": -27.821109771728516, "global_step": 600426, "epoch": 7234} {"train_loss": -27.478240966796875, "global_step": 600427, "epoch": 7234} {"train_loss": -27.634653091430664, "global_step": 600428, "epoch": 7234} {"train_loss": -27.79034996032715, "global_step": 600429, "epoch": 7234} {"train_loss": -28.256195068359375, "global_step": 600430, "epoch": 7234} {"train_loss": -27.793109893798828, "global_step": 600431, "epoch": 7234} {"train_loss": -27.795734405517578, "global_step": 600432, "epoch": 7234} {"train_loss": -27.85003662109375, "global_step": 600433, "epoch": 7234} {"train_loss": -28.38471031188965, "global_step": 600434, "epoch": 7234} {"train_loss": -28.086013793945312, "global_step": 600435, "epoch": 7234} {"train_loss": -28.31007194519043, "global_step": 600436, "epoch": 7234} {"train_loss": -27.953826904296875, "global_step": 600437, "epoch": 7234} {"train_loss": -28.08719253540039, "global_step": 600438, "epoch": 7234} {"train_loss": -27.984649658203125, "global_step": 600439, "epoch": 7234} {"train_loss": -28.0239200592041, "global_step": 600440, "epoch": 7234} {"train_loss": -28.176176071166992, "global_step": 600441, "epoch": 7234} {"train_loss": -28.036487579345703, "global_step": 600442, "epoch": 7234} {"train_loss": -27.767358779907227, "global_step": 600443, "epoch": 7234} {"train_loss": -28.065824508666992, "global_step": 600444, "epoch": 7234} {"train_loss": -28.009321212768555, "global_step": 600445, "epoch": 7234} {"train_loss": -27.86724853515625, "global_step": 600446, "epoch": 7234} {"train_loss": -28.031095504760742, "global_step": 600447, "epoch": 7234} {"train_loss": -28.18433952331543, "global_step": 600448, "epoch": 7234} {"train_loss": -27.89682388305664, "global_step": 600449, "epoch": 7234} {"train_loss": -28.330846786499023, "global_step": 600450, "epoch": 7234} {"train_loss": -27.73682975769043, "global_step": 600451, "epoch": 7234} {"train_loss": -27.918792724609375, "global_step": 600452, "epoch": 7234} {"train_loss": -28.065332412719727, "global_step": 600453, "epoch": 7234} {"train_loss": -28.08009147644043, "global_step": 600454, "epoch": 7234} {"train_loss": -28.109296798706055, "global_step": 600455, "epoch": 7234} {"train_loss": -28.285083770751953, "global_step": 600456, "epoch": 7234} {"train_loss": -28.16034507751465, "global_step": 600457, "epoch": 7234} {"train_loss": -28.093137741088867, "global_step": 600458, "epoch": 7234} {"train_loss": -28.359174728393555, "global_step": 600459, "epoch": 7234} {"train_loss": -28.094043731689453, "global_step": 600460, "epoch": 7234} {"train_loss": -28.010465621948242, "global_step": 600461, "epoch": 7234} {"train_loss": -27.803613662719727, "global_step": 600462, "epoch": 7234} {"train_loss": -28.529373168945312, "global_step": 600463, "epoch": 7234} {"train_loss": -28.318525314331055, "global_step": 600464, "epoch": 7234} {"train_loss": -28.630462646484375, "global_step": 600465, "epoch": 7234} {"train_loss": -28.339078903198242, "global_step": 600466, "epoch": 7234} {"train_loss": -28.085784912109375, "global_step": 600467, "epoch": 7234} {"train_loss": -28.411325454711914, "global_step": 600468, "epoch": 7234} {"train_loss": -27.892736434936523, "global_step": 600469, "epoch": 7234} {"train_loss": -27.958166122436523, "global_step": 600470, "epoch": 7234} {"train_loss": -27.768056869506836, "global_step": 600471, "epoch": 7234} {"train_loss": -28.246732711791992, "global_step": 600472, "epoch": 7234} {"train_loss": -27.674036026000977, "global_step": 600473, "epoch": 7234} {"train_loss": -28.188486099243164, "global_step": 600474, "epoch": 7234} {"train_loss": -28.132232666015625, "global_step": 600475, "epoch": 7234} {"train_loss": -27.32590675354004, "global_step": 600476, "epoch": 7234} {"train_loss": -27.631275177001953, "global_step": 600477, "epoch": 7234} {"train_loss": -27.0363712310791, "global_step": 600478, "epoch": 7234} {"train_loss": -27.47234535217285, "global_step": 600479, "epoch": 7234} {"train_loss": -27.776275634765625, "global_step": 600480, "epoch": 7234} {"train_loss": -27.637237548828125, "global_step": 600481, "epoch": 7234} {"train_loss": -27.719039916992188, "global_step": 600482, "epoch": 7234} {"train_loss": -27.8438720703125, "global_step": 600483, "epoch": 7234} {"train_loss": -27.435779571533203, "global_step": 600484, "epoch": 7234} {"train_loss": -28.076889038085938, "global_step": 600485, "epoch": 7234} {"train_loss": -28.05354118347168, "global_step": 600486, "epoch": 7234} {"train_loss": -28.049091339111328, "global_step": 600487, "epoch": 7234} {"train_loss": -28.248212814331055, "global_step": 600488, "epoch": 7234} {"train_loss": -27.714981079101562, "global_step": 600489, "epoch": 7234} {"train_loss": -27.610448837280273, "global_step": 600490, "epoch": 7234} {"train_loss": -27.997175216674805, "global_step": 600491, "epoch": 7234} {"train_loss": -27.779272079467773, "global_step": 600492, "epoch": 7234} {"train_loss": -27.777875900268555, "global_step": 600493, "epoch": 7234} {"train_loss": -27.986825942993164, "global_step": 600494, "epoch": 7234} {"train_loss": -27.343271255493164, "global_step": 600495, "epoch": 7234} {"train_loss": -27.503217697143555, "global_step": 600496, "epoch": 7234} {"train_loss": -27.51361656188965, "global_step": 600497, "epoch": 7234} {"train_loss": -27.770105361938477, "global_step": 600498, "epoch": 7234} {"train_loss": -27.573286056518555, "global_step": 600499, "epoch": 7234} {"train_loss": -27.43121337890625, "global_step": 600500, "epoch": 7234} {"train_loss": -27.512136459350586, "global_step": 600501, "epoch": 7234} {"train_loss": -28.339746475219727, "global_step": 600502, "epoch": 7234} {"train_loss": -27.903005599975586, "global_step": 600503, "epoch": 7234} {"train_loss": -27.93277542849621, "global_step": 600504, "epoch": 7234, "val_loss": 6604324.0} {"train_loss": -25.904760360717773, "global_step": 600505, "epoch": 7235} {"train_loss": -26.960554122924805, "global_step": 600506, "epoch": 7235} {"train_loss": -26.702884674072266, "global_step": 600507, "epoch": 7235} {"train_loss": -27.3123779296875, "global_step": 600508, "epoch": 7235} {"train_loss": -27.38306999206543, "global_step": 600509, "epoch": 7235} {"train_loss": -26.8594913482666, "global_step": 600510, "epoch": 7235} {"train_loss": -27.255170822143555, "global_step": 600511, "epoch": 7235} {"train_loss": -26.97781753540039, "global_step": 600512, "epoch": 7235} {"train_loss": -27.115009307861328, "global_step": 600513, "epoch": 7235} {"train_loss": -27.22773551940918, "global_step": 600514, "epoch": 7235} {"train_loss": -27.340574264526367, "global_step": 600515, "epoch": 7235} {"train_loss": -27.469085693359375, "global_step": 600516, "epoch": 7235} {"train_loss": -27.419225692749023, "global_step": 600517, "epoch": 7235} {"train_loss": -27.317935943603516, "global_step": 600518, "epoch": 7235} {"train_loss": -27.1402587890625, "global_step": 600519, "epoch": 7235} {"train_loss": -27.330495834350586, "global_step": 600520, "epoch": 7235} {"train_loss": -27.17359733581543, "global_step": 600521, "epoch": 7235} {"train_loss": -27.401426315307617, "global_step": 600522, "epoch": 7235} {"train_loss": -27.660724639892578, "global_step": 600523, "epoch": 7235} {"train_loss": -27.515857696533203, "global_step": 600524, "epoch": 7235} {"train_loss": -27.66950035095215, "global_step": 600525, "epoch": 7235} {"train_loss": -27.53533935546875, "global_step": 600526, "epoch": 7235} {"train_loss": -27.662586212158203, "global_step": 600527, "epoch": 7235} {"train_loss": -27.416522979736328, "global_step": 600528, "epoch": 7235} {"train_loss": -27.58260154724121, "global_step": 600529, "epoch": 7235} {"train_loss": -27.947736740112305, "global_step": 600530, "epoch": 7235} {"train_loss": -27.949071884155273, "global_step": 600531, "epoch": 7235} {"train_loss": -27.886550903320312, "global_step": 600532, "epoch": 7235} {"train_loss": -28.068832397460938, "global_step": 600533, "epoch": 7235} {"train_loss": -28.263355255126953, "global_step": 600534, "epoch": 7235} {"train_loss": -27.920576095581055, "global_step": 600535, "epoch": 7235} {"train_loss": -27.807096481323242, "global_step": 600536, "epoch": 7235} {"train_loss": -28.3247127532959, "global_step": 600537, "epoch": 7235} {"train_loss": -27.912185668945312, "global_step": 600538, "epoch": 7235} {"train_loss": -28.110010147094727, "global_step": 600539, "epoch": 7235} {"train_loss": -28.16205406188965, "global_step": 600540, "epoch": 7235} {"train_loss": -28.27939796447754, "global_step": 600541, "epoch": 7235} {"train_loss": -27.74881935119629, "global_step": 600542, "epoch": 7235} {"train_loss": -27.920856475830078, "global_step": 600543, "epoch": 7235} {"train_loss": -28.056686401367188, "global_step": 600544, "epoch": 7235} {"train_loss": -28.00172233581543, "global_step": 600545, "epoch": 7235} {"train_loss": -27.880496978759766, "global_step": 600546, "epoch": 7235} {"train_loss": -28.27675437927246, "global_step": 600547, "epoch": 7235} {"train_loss": -27.943037033081055, "global_step": 600548, "epoch": 7235} {"train_loss": -27.869131088256836, "global_step": 600549, "epoch": 7235} {"train_loss": -28.352148056030273, "global_step": 600550, "epoch": 7235} {"train_loss": -27.934675216674805, "global_step": 600551, "epoch": 7235} {"train_loss": -28.131290435791016, "global_step": 600552, "epoch": 7235} {"train_loss": -28.091955184936523, "global_step": 600553, "epoch": 7235} {"train_loss": -27.989770889282227, "global_step": 600554, "epoch": 7235} {"train_loss": -28.232410430908203, "global_step": 600555, "epoch": 7235} {"train_loss": -28.12232780456543, "global_step": 600556, "epoch": 7235} {"train_loss": -28.160058975219727, "global_step": 600557, "epoch": 7235} {"train_loss": -27.965423583984375, "global_step": 600558, "epoch": 7235} {"train_loss": -28.049182891845703, "global_step": 600559, "epoch": 7235} {"train_loss": -28.38990592956543, "global_step": 600560, "epoch": 7235} {"train_loss": -27.816816329956055, "global_step": 600561, "epoch": 7235} {"train_loss": -28.40913200378418, "global_step": 600562, "epoch": 7235} {"train_loss": -28.052148818969727, "global_step": 600563, "epoch": 7235} {"train_loss": -28.123188018798828, "global_step": 600564, "epoch": 7235} {"train_loss": -28.31397819519043, "global_step": 600565, "epoch": 7235} {"train_loss": -28.243854522705078, "global_step": 600566, "epoch": 7235} {"train_loss": -28.31073570251465, "global_step": 600567, "epoch": 7235} {"train_loss": -28.354999542236328, "global_step": 600568, "epoch": 7235} {"train_loss": -28.656726837158203, "global_step": 600569, "epoch": 7235} {"train_loss": -28.10874366760254, "global_step": 600570, "epoch": 7235} {"train_loss": -28.13165855407715, "global_step": 600571, "epoch": 7235} {"train_loss": -27.935388565063477, "global_step": 600572, "epoch": 7235} {"train_loss": -28.214941024780273, "global_step": 600573, "epoch": 7235} {"train_loss": -28.2445125579834, "global_step": 600574, "epoch": 7235} {"train_loss": -28.29974365234375, "global_step": 600575, "epoch": 7235} {"train_loss": -27.8492431640625, "global_step": 600576, "epoch": 7235} {"train_loss": -28.169036865234375, "global_step": 600577, "epoch": 7235} {"train_loss": -28.296222686767578, "global_step": 600578, "epoch": 7235} {"train_loss": -27.755146026611328, "global_step": 600579, "epoch": 7235} {"train_loss": -28.347394943237305, "global_step": 600580, "epoch": 7235} {"train_loss": -27.949121475219727, "global_step": 600581, "epoch": 7235} {"train_loss": -27.977298736572266, "global_step": 600582, "epoch": 7235} {"train_loss": -28.198974609375, "global_step": 600583, "epoch": 7235} {"train_loss": -27.995346069335938, "global_step": 600584, "epoch": 7235} {"train_loss": -27.841169357299805, "global_step": 600585, "epoch": 7235} {"train_loss": -28.452428817749023, "global_step": 600586, "epoch": 7235} {"train_loss": -27.856128692626953, "global_step": 600587, "epoch": 7235, "val_loss": 6571902.5} {"train_loss": -28.09197425842285, "global_step": 600588, "epoch": 7236} {"train_loss": -28.1019344329834, "global_step": 600589, "epoch": 7236} {"train_loss": -27.71547508239746, "global_step": 600590, "epoch": 7236} {"train_loss": -27.960163116455078, "global_step": 600591, "epoch": 7236} {"train_loss": -28.2058162689209, "global_step": 600592, "epoch": 7236} {"train_loss": -27.584997177124023, "global_step": 600593, "epoch": 7236} {"train_loss": -27.488147735595703, "global_step": 600594, "epoch": 7236} {"train_loss": -28.137304306030273, "global_step": 600595, "epoch": 7236} {"train_loss": -28.158472061157227, "global_step": 600596, "epoch": 7236} {"train_loss": -28.289447784423828, "global_step": 600597, "epoch": 7236} {"train_loss": -28.08827781677246, "global_step": 600598, "epoch": 7236} {"train_loss": -27.77800941467285, "global_step": 600599, "epoch": 7236} {"train_loss": -27.504425048828125, "global_step": 600600, "epoch": 7236} {"train_loss": -27.75459098815918, "global_step": 600601, "epoch": 7236} {"train_loss": -28.27765464782715, "global_step": 600602, "epoch": 7236} {"train_loss": -27.99025535583496, "global_step": 600603, "epoch": 7236} {"train_loss": -28.213520050048828, "global_step": 600604, "epoch": 7236} {"train_loss": -27.69369888305664, "global_step": 600605, "epoch": 7236} {"train_loss": -27.9685115814209, "global_step": 600606, "epoch": 7236} {"train_loss": -28.241437911987305, "global_step": 600607, "epoch": 7236} {"train_loss": -27.455488204956055, "global_step": 600608, "epoch": 7236} {"train_loss": -27.914457321166992, "global_step": 600609, "epoch": 7236} {"train_loss": -27.8328914642334, "global_step": 600610, "epoch": 7236} {"train_loss": -27.98195457458496, "global_step": 600611, "epoch": 7236} {"train_loss": -27.206546783447266, "global_step": 600612, "epoch": 7236} {"train_loss": -27.185962677001953, "global_step": 600613, "epoch": 7236} {"train_loss": -26.61738395690918, "global_step": 600614, "epoch": 7236} {"train_loss": -26.71504020690918, "global_step": 600615, "epoch": 7236} {"train_loss": -27.414535522460938, "global_step": 600616, "epoch": 7236} {"train_loss": -27.19887351989746, "global_step": 600617, "epoch": 7236} {"train_loss": -27.49500846862793, "global_step": 600618, "epoch": 7236} {"train_loss": -27.912586212158203, "global_step": 600619, "epoch": 7236} {"train_loss": -27.474872589111328, "global_step": 600620, "epoch": 7236} {"train_loss": -27.38941764831543, "global_step": 600621, "epoch": 7236} {"train_loss": -28.2817440032959, "global_step": 600622, "epoch": 7236} {"train_loss": -27.579578399658203, "global_step": 600623, "epoch": 7236} {"train_loss": -27.909841537475586, "global_step": 600624, "epoch": 7236} {"train_loss": -28.268041610717773, "global_step": 600625, "epoch": 7236} {"train_loss": -27.842992782592773, "global_step": 600626, "epoch": 7236} {"train_loss": -28.066864013671875, "global_step": 600627, "epoch": 7236} {"train_loss": -27.637298583984375, "global_step": 600628, "epoch": 7236} {"train_loss": -28.08797264099121, "global_step": 600629, "epoch": 7236} {"train_loss": -27.76210594177246, "global_step": 600630, "epoch": 7236} {"train_loss": -28.150802612304688, "global_step": 600631, "epoch": 7236} {"train_loss": -27.650787353515625, "global_step": 600632, "epoch": 7236} {"train_loss": -28.35810661315918, "global_step": 600633, "epoch": 7236} {"train_loss": -27.891103744506836, "global_step": 600634, "epoch": 7236} {"train_loss": -28.091230392456055, "global_step": 600635, "epoch": 7236} {"train_loss": -27.864459991455078, "global_step": 600636, "epoch": 7236} {"train_loss": -28.03864097595215, "global_step": 600637, "epoch": 7236} {"train_loss": -27.8223934173584, "global_step": 600638, "epoch": 7236} {"train_loss": -28.358478546142578, "global_step": 600639, "epoch": 7236} {"train_loss": -28.107208251953125, "global_step": 600640, "epoch": 7236} {"train_loss": -28.219562530517578, "global_step": 600641, "epoch": 7236} {"train_loss": -27.8817081451416, "global_step": 600642, "epoch": 7236} {"train_loss": -28.03407859802246, "global_step": 600643, "epoch": 7236} {"train_loss": -28.082494735717773, "global_step": 600644, "epoch": 7236} {"train_loss": -27.87753677368164, "global_step": 600645, "epoch": 7236} {"train_loss": -28.155658721923828, "global_step": 600646, "epoch": 7236} {"train_loss": -27.98895835876465, "global_step": 600647, "epoch": 7236} {"train_loss": -28.397201538085938, "global_step": 600648, "epoch": 7236} {"train_loss": -28.331409454345703, "global_step": 600649, "epoch": 7236} {"train_loss": -28.164459228515625, "global_step": 600650, "epoch": 7236} {"train_loss": -28.345870971679688, "global_step": 600651, "epoch": 7236} {"train_loss": -28.538610458374023, "global_step": 600652, "epoch": 7236} {"train_loss": -28.042072296142578, "global_step": 600653, "epoch": 7236} {"train_loss": -28.178455352783203, "global_step": 600654, "epoch": 7236} {"train_loss": -28.33290672302246, "global_step": 600655, "epoch": 7236} {"train_loss": -28.14015007019043, "global_step": 600656, "epoch": 7236} {"train_loss": -28.109088897705078, "global_step": 600657, "epoch": 7236} {"train_loss": -28.17632484436035, "global_step": 600658, "epoch": 7236} {"train_loss": -28.55752944946289, "global_step": 600659, "epoch": 7236} {"train_loss": -28.373682022094727, "global_step": 600660, "epoch": 7236} {"train_loss": -28.6653995513916, "global_step": 600661, "epoch": 7236} {"train_loss": -28.372589111328125, "global_step": 600662, "epoch": 7236} {"train_loss": -28.26296043395996, "global_step": 600663, "epoch": 7236} {"train_loss": -28.295169830322266, "global_step": 600664, "epoch": 7236} {"train_loss": -28.749052047729492, "global_step": 600665, "epoch": 7236} {"train_loss": -27.9609317779541, "global_step": 600666, "epoch": 7236} {"train_loss": -28.425891876220703, "global_step": 600667, "epoch": 7236} {"train_loss": -28.219812393188477, "global_step": 600668, "epoch": 7236} {"train_loss": -28.33513832092285, "global_step": 600669, "epoch": 7236} {"train_loss": -27.97604510295822, "global_step": 600670, "epoch": 7236, "val_loss": 6608370.0} {"train_loss": -27.29877281188965, "global_step": 600671, "epoch": 7237} {"train_loss": -26.064504623413086, "global_step": 600672, "epoch": 7237} {"train_loss": -23.8363037109375, "global_step": 600673, "epoch": 7237} {"train_loss": -26.339643478393555, "global_step": 600674, "epoch": 7237} {"train_loss": -27.169782638549805, "global_step": 600675, "epoch": 7237} {"train_loss": -24.375110626220703, "global_step": 600676, "epoch": 7237} {"train_loss": -25.49287986755371, "global_step": 600677, "epoch": 7237} {"train_loss": -25.57710838317871, "global_step": 600678, "epoch": 7237} {"train_loss": -27.028547286987305, "global_step": 600679, "epoch": 7237} {"train_loss": -25.03868293762207, "global_step": 600680, "epoch": 7237} {"train_loss": -26.783361434936523, "global_step": 600681, "epoch": 7237} {"train_loss": -26.495447158813477, "global_step": 600682, "epoch": 7237} {"train_loss": -26.2242374420166, "global_step": 600683, "epoch": 7237} {"train_loss": -26.9294376373291, "global_step": 600684, "epoch": 7237} {"train_loss": -26.555505752563477, "global_step": 600685, "epoch": 7237} {"train_loss": -27.259485244750977, "global_step": 600686, "epoch": 7237} {"train_loss": -26.6743221282959, "global_step": 600687, "epoch": 7237} {"train_loss": -26.735580444335938, "global_step": 600688, "epoch": 7237} {"train_loss": -26.93770408630371, "global_step": 600689, "epoch": 7237} {"train_loss": -27.17359733581543, "global_step": 600690, "epoch": 7237} {"train_loss": -27.015172958374023, "global_step": 600691, "epoch": 7237} {"train_loss": -27.139667510986328, "global_step": 600692, "epoch": 7237} {"train_loss": -27.40752601623535, "global_step": 600693, "epoch": 7237} {"train_loss": -27.841520309448242, "global_step": 600694, "epoch": 7237} {"train_loss": -27.220874786376953, "global_step": 600695, "epoch": 7237} {"train_loss": -27.261205673217773, "global_step": 600696, "epoch": 7237} {"train_loss": -26.945178985595703, "global_step": 600697, "epoch": 7237} {"train_loss": -26.923629760742188, "global_step": 600698, "epoch": 7237} {"train_loss": -27.727869033813477, "global_step": 600699, "epoch": 7237} {"train_loss": -27.646976470947266, "global_step": 600700, "epoch": 7237} {"train_loss": -27.787643432617188, "global_step": 600701, "epoch": 7237} {"train_loss": -27.49323081970215, "global_step": 600702, "epoch": 7237} {"train_loss": -27.92048454284668, "global_step": 600703, "epoch": 7237} {"train_loss": -27.668203353881836, "global_step": 600704, "epoch": 7237} {"train_loss": -27.502365112304688, "global_step": 600705, "epoch": 7237} {"train_loss": -27.495763778686523, "global_step": 600706, "epoch": 7237} {"train_loss": -27.567838668823242, "global_step": 600707, "epoch": 7237} {"train_loss": -27.570520401000977, "global_step": 600708, "epoch": 7237} {"train_loss": -27.79363441467285, "global_step": 600709, "epoch": 7237} {"train_loss": -27.751428604125977, "global_step": 600710, "epoch": 7237} {"train_loss": -27.892333984375, "global_step": 600711, "epoch": 7237} {"train_loss": -28.02479362487793, "global_step": 600712, "epoch": 7237} {"train_loss": -27.802494049072266, "global_step": 600713, "epoch": 7237} {"train_loss": -27.690656661987305, "global_step": 600714, "epoch": 7237} {"train_loss": -27.863204956054688, "global_step": 600715, "epoch": 7237} {"train_loss": -27.681644439697266, "global_step": 600716, "epoch": 7237} {"train_loss": -27.9956111907959, "global_step": 600717, "epoch": 7237} {"train_loss": -27.9510555267334, "global_step": 600718, "epoch": 7237} {"train_loss": -28.027257919311523, "global_step": 600719, "epoch": 7237} {"train_loss": -27.898700714111328, "global_step": 600720, "epoch": 7237} {"train_loss": -28.221044540405273, "global_step": 600721, "epoch": 7237} {"train_loss": -28.537519454956055, "global_step": 600722, "epoch": 7237} {"train_loss": -27.961999893188477, "global_step": 600723, "epoch": 7237} {"train_loss": -28.159912109375, "global_step": 600724, "epoch": 7237} {"train_loss": -27.885730743408203, "global_step": 600725, "epoch": 7237} {"train_loss": -28.325607299804688, "global_step": 600726, "epoch": 7237} {"train_loss": -28.11164665222168, "global_step": 600727, "epoch": 7237} {"train_loss": -27.925077438354492, "global_step": 600728, "epoch": 7237} {"train_loss": -28.240467071533203, "global_step": 600729, "epoch": 7237} {"train_loss": -27.867298126220703, "global_step": 600730, "epoch": 7237} {"train_loss": -27.99924659729004, "global_step": 600731, "epoch": 7237} {"train_loss": -27.931806564331055, "global_step": 600732, "epoch": 7237} {"train_loss": -28.085891723632812, "global_step": 600733, "epoch": 7237} {"train_loss": -28.364395141601562, "global_step": 600734, "epoch": 7237} {"train_loss": -28.213769912719727, "global_step": 600735, "epoch": 7237} {"train_loss": -27.814069747924805, "global_step": 600736, "epoch": 7237} {"train_loss": -28.127490997314453, "global_step": 600737, "epoch": 7237} {"train_loss": -28.431055068969727, "global_step": 600738, "epoch": 7237} {"train_loss": -28.143095016479492, "global_step": 600739, "epoch": 7237} {"train_loss": -28.341283798217773, "global_step": 600740, "epoch": 7237} {"train_loss": -28.448087692260742, "global_step": 600741, "epoch": 7237} {"train_loss": -28.640363693237305, "global_step": 600742, "epoch": 7237} {"train_loss": -28.200897216796875, "global_step": 600743, "epoch": 7237} {"train_loss": -28.341215133666992, "global_step": 600744, "epoch": 7237} {"train_loss": -28.436731338500977, "global_step": 600745, "epoch": 7237} {"train_loss": -28.189014434814453, "global_step": 600746, "epoch": 7237} {"train_loss": -28.268278121948242, "global_step": 600747, "epoch": 7237} {"train_loss": -27.968799591064453, "global_step": 600748, "epoch": 7237} {"train_loss": -28.30097007751465, "global_step": 600749, "epoch": 7237} {"train_loss": -27.906513214111328, "global_step": 600750, "epoch": 7237} {"train_loss": -28.322065353393555, "global_step": 600751, "epoch": 7237} {"train_loss": -28.058629989624023, "global_step": 600752, "epoch": 7237} {"train_loss": -27.522645054093328, "global_step": 600753, "epoch": 7237, "val_loss": 6510240.0} {"train_loss": -28.098072052001953, "global_step": 600754, "epoch": 7238} {"train_loss": -27.776275634765625, "global_step": 600755, "epoch": 7238} {"train_loss": -27.969526290893555, "global_step": 600756, "epoch": 7238} {"train_loss": -27.510650634765625, "global_step": 600757, "epoch": 7238} {"train_loss": -27.7371768951416, "global_step": 600758, "epoch": 7238} {"train_loss": -28.00494956970215, "global_step": 600759, "epoch": 7238} {"train_loss": -27.435306549072266, "global_step": 600760, "epoch": 7238} {"train_loss": -27.4611759185791, "global_step": 600761, "epoch": 7238} {"train_loss": -27.251489639282227, "global_step": 600762, "epoch": 7238} {"train_loss": -27.7974796295166, "global_step": 600763, "epoch": 7238} {"train_loss": -27.921222686767578, "global_step": 600764, "epoch": 7238} {"train_loss": -27.951385498046875, "global_step": 600765, "epoch": 7238} {"train_loss": -27.795148849487305, "global_step": 600766, "epoch": 7238} {"train_loss": -27.843250274658203, "global_step": 600767, "epoch": 7238} {"train_loss": -27.925058364868164, "global_step": 600768, "epoch": 7238} {"train_loss": -27.81403923034668, "global_step": 600769, "epoch": 7238} {"train_loss": -27.832128524780273, "global_step": 600770, "epoch": 7238} {"train_loss": -28.174213409423828, "global_step": 600771, "epoch": 7238} {"train_loss": -27.64912986755371, "global_step": 600772, "epoch": 7238} {"train_loss": -27.985876083374023, "global_step": 600773, "epoch": 7238} {"train_loss": -28.094228744506836, "global_step": 600774, "epoch": 7238} {"train_loss": -27.853805541992188, "global_step": 600775, "epoch": 7238} {"train_loss": -28.301788330078125, "global_step": 600776, "epoch": 7238} {"train_loss": -28.02166748046875, "global_step": 600777, "epoch": 7238} {"train_loss": -28.075977325439453, "global_step": 600778, "epoch": 7238} {"train_loss": -27.9898624420166, "global_step": 600779, "epoch": 7238} {"train_loss": -28.0802059173584, "global_step": 600780, "epoch": 7238} {"train_loss": -27.701642990112305, "global_step": 600781, "epoch": 7238} {"train_loss": -28.021448135375977, "global_step": 600782, "epoch": 7238} {"train_loss": -27.700815200805664, "global_step": 600783, "epoch": 7238} {"train_loss": -27.818201065063477, "global_step": 600784, "epoch": 7238} {"train_loss": -28.27402687072754, "global_step": 600785, "epoch": 7238} {"train_loss": -27.362340927124023, "global_step": 600786, "epoch": 7238} {"train_loss": -28.19854164123535, "global_step": 600787, "epoch": 7238} {"train_loss": -27.843366622924805, "global_step": 600788, "epoch": 7238} {"train_loss": -28.056720733642578, "global_step": 600789, "epoch": 7238} {"train_loss": -28.04802894592285, "global_step": 600790, "epoch": 7238} {"train_loss": -27.832782745361328, "global_step": 600791, "epoch": 7238} {"train_loss": -28.261350631713867, "global_step": 600792, "epoch": 7238} {"train_loss": -27.89838981628418, "global_step": 600793, "epoch": 7238} {"train_loss": -28.0970458984375, "global_step": 600794, "epoch": 7238} {"train_loss": -28.12470054626465, "global_step": 600795, "epoch": 7238} {"train_loss": -28.214704513549805, "global_step": 600796, "epoch": 7238} {"train_loss": -28.175992965698242, "global_step": 600797, "epoch": 7238} {"train_loss": -27.991809844970703, "global_step": 600798, "epoch": 7238} {"train_loss": -28.134130477905273, "global_step": 600799, "epoch": 7238} {"train_loss": -28.167306900024414, "global_step": 600800, "epoch": 7238} {"train_loss": -28.66261863708496, "global_step": 600801, "epoch": 7238} {"train_loss": -28.486303329467773, "global_step": 600802, "epoch": 7238} {"train_loss": -27.948633193969727, "global_step": 600803, "epoch": 7238} {"train_loss": -28.326797485351562, "global_step": 600804, "epoch": 7238} {"train_loss": -28.007123947143555, "global_step": 600805, "epoch": 7238} {"train_loss": -28.37074089050293, "global_step": 600806, "epoch": 7238} {"train_loss": -28.413806915283203, "global_step": 600807, "epoch": 7238} {"train_loss": -28.318836212158203, "global_step": 600808, "epoch": 7238} {"train_loss": -28.4279727935791, "global_step": 600809, "epoch": 7238} {"train_loss": -28.304479598999023, "global_step": 600810, "epoch": 7238} {"train_loss": -27.810705184936523, "global_step": 600811, "epoch": 7238} {"train_loss": -28.13457679748535, "global_step": 600812, "epoch": 7238} {"train_loss": -28.423559188842773, "global_step": 600813, "epoch": 7238} {"train_loss": -28.2385311126709, "global_step": 600814, "epoch": 7238} {"train_loss": -28.197736740112305, "global_step": 600815, "epoch": 7238} {"train_loss": -27.886341094970703, "global_step": 600816, "epoch": 7238} {"train_loss": -28.075836181640625, "global_step": 600817, "epoch": 7238} {"train_loss": -28.437885284423828, "global_step": 600818, "epoch": 7238} {"train_loss": -27.995380401611328, "global_step": 600819, "epoch": 7238} {"train_loss": -27.988422393798828, "global_step": 600820, "epoch": 7238} {"train_loss": -27.95953941345215, "global_step": 600821, "epoch": 7238} {"train_loss": -27.781225204467773, "global_step": 600822, "epoch": 7238} {"train_loss": -28.33796501159668, "global_step": 600823, "epoch": 7238} {"train_loss": -28.016021728515625, "global_step": 600824, "epoch": 7238} {"train_loss": -27.929065704345703, "global_step": 600825, "epoch": 7238} {"train_loss": -28.237323760986328, "global_step": 600826, "epoch": 7238} {"train_loss": -27.870512008666992, "global_step": 600827, "epoch": 7238} {"train_loss": -27.680105209350586, "global_step": 600828, "epoch": 7238} {"train_loss": -28.251434326171875, "global_step": 600829, "epoch": 7238} {"train_loss": -28.0001163482666, "global_step": 600830, "epoch": 7238} {"train_loss": -27.853214263916016, "global_step": 600831, "epoch": 7238} {"train_loss": -28.08123207092285, "global_step": 600832, "epoch": 7238} {"train_loss": -28.305713653564453, "global_step": 600833, "epoch": 7238} {"train_loss": -27.950519561767578, "global_step": 600834, "epoch": 7238} {"train_loss": -27.990467071533203, "global_step": 600835, "epoch": 7238} {"train_loss": -28.0270274058882, "global_step": 600836, "epoch": 7238, "val_loss": 6540065.0} {"train_loss": -25.92637062072754, "global_step": 600837, "epoch": 7239} {"train_loss": -25.934309005737305, "global_step": 600838, "epoch": 7239} {"train_loss": -26.130584716796875, "global_step": 600839, "epoch": 7239} {"train_loss": -24.732358932495117, "global_step": 600840, "epoch": 7239} {"train_loss": -26.439498901367188, "global_step": 600841, "epoch": 7239} {"train_loss": -27.075225830078125, "global_step": 600842, "epoch": 7239} {"train_loss": -26.26380729675293, "global_step": 600843, "epoch": 7239} {"train_loss": -27.195302963256836, "global_step": 600844, "epoch": 7239} {"train_loss": -26.295913696289062, "global_step": 600845, "epoch": 7239} {"train_loss": -27.298147201538086, "global_step": 600846, "epoch": 7239} {"train_loss": -27.235462188720703, "global_step": 600847, "epoch": 7239} {"train_loss": -27.10578727722168, "global_step": 600848, "epoch": 7239} {"train_loss": -27.358007431030273, "global_step": 600849, "epoch": 7239} {"train_loss": -27.246692657470703, "global_step": 600850, "epoch": 7239} {"train_loss": -27.16644287109375, "global_step": 600851, "epoch": 7239} {"train_loss": -27.378620147705078, "global_step": 600852, "epoch": 7239} {"train_loss": -27.748266220092773, "global_step": 600853, "epoch": 7239} {"train_loss": -27.765287399291992, "global_step": 600854, "epoch": 7239} {"train_loss": -27.54572868347168, "global_step": 600855, "epoch": 7239} {"train_loss": -27.59673500061035, "global_step": 600856, "epoch": 7239} {"train_loss": -27.75896644592285, "global_step": 600857, "epoch": 7239} {"train_loss": -27.83607292175293, "global_step": 600858, "epoch": 7239} {"train_loss": -27.75726318359375, "global_step": 600859, "epoch": 7239} {"train_loss": -27.82608985900879, "global_step": 600860, "epoch": 7239} {"train_loss": -27.780481338500977, "global_step": 600861, "epoch": 7239} {"train_loss": -27.713220596313477, "global_step": 600862, "epoch": 7239} {"train_loss": -27.791818618774414, "global_step": 600863, "epoch": 7239} {"train_loss": -27.67620849609375, "global_step": 600864, "epoch": 7239} {"train_loss": -27.724140167236328, "global_step": 600865, "epoch": 7239} {"train_loss": -27.931182861328125, "global_step": 600866, "epoch": 7239} {"train_loss": -27.940942764282227, "global_step": 600867, "epoch": 7239} {"train_loss": -27.736181259155273, "global_step": 600868, "epoch": 7239} {"train_loss": -27.705280303955078, "global_step": 600869, "epoch": 7239} {"train_loss": -27.938955307006836, "global_step": 600870, "epoch": 7239} {"train_loss": -28.222379684448242, "global_step": 600871, "epoch": 7239} {"train_loss": -27.73097801208496, "global_step": 600872, "epoch": 7239} {"train_loss": -28.273908615112305, "global_step": 600873, "epoch": 7239} {"train_loss": -28.080686569213867, "global_step": 600874, "epoch": 7239} {"train_loss": -27.946060180664062, "global_step": 600875, "epoch": 7239} {"train_loss": -28.028900146484375, "global_step": 600876, "epoch": 7239} {"train_loss": -28.113971710205078, "global_step": 600877, "epoch": 7239} {"train_loss": -28.37003517150879, "global_step": 600878, "epoch": 7239} {"train_loss": -28.479995727539062, "global_step": 600879, "epoch": 7239} {"train_loss": -28.05438232421875, "global_step": 600880, "epoch": 7239} {"train_loss": -28.15699577331543, "global_step": 600881, "epoch": 7239} {"train_loss": -28.084150314331055, "global_step": 600882, "epoch": 7239} {"train_loss": -28.006128311157227, "global_step": 600883, "epoch": 7239} {"train_loss": -27.711929321289062, "global_step": 600884, "epoch": 7239} {"train_loss": -27.844995498657227, "global_step": 600885, "epoch": 7239} {"train_loss": -28.162168502807617, "global_step": 600886, "epoch": 7239} {"train_loss": -28.37858009338379, "global_step": 600887, "epoch": 7239} {"train_loss": -27.758316040039062, "global_step": 600888, "epoch": 7239} {"train_loss": -27.812971115112305, "global_step": 600889, "epoch": 7239} {"train_loss": -27.589521408081055, "global_step": 600890, "epoch": 7239} {"train_loss": -27.932966232299805, "global_step": 600891, "epoch": 7239} {"train_loss": -27.401403427124023, "global_step": 600892, "epoch": 7239} {"train_loss": -27.9920654296875, "global_step": 600893, "epoch": 7239} {"train_loss": -28.0128116607666, "global_step": 600894, "epoch": 7239} {"train_loss": -27.472614288330078, "global_step": 600895, "epoch": 7239} {"train_loss": -27.69697380065918, "global_step": 600896, "epoch": 7239} {"train_loss": -27.771162033081055, "global_step": 600897, "epoch": 7239} {"train_loss": -27.653766632080078, "global_step": 600898, "epoch": 7239} {"train_loss": -28.045780181884766, "global_step": 600899, "epoch": 7239} {"train_loss": -27.821203231811523, "global_step": 600900, "epoch": 7239} {"train_loss": -27.869159698486328, "global_step": 600901, "epoch": 7239} {"train_loss": -27.81660270690918, "global_step": 600902, "epoch": 7239} {"train_loss": -27.87872886657715, "global_step": 600903, "epoch": 7239} {"train_loss": -27.812896728515625, "global_step": 600904, "epoch": 7239} {"train_loss": -27.502954483032227, "global_step": 600905, "epoch": 7239} {"train_loss": -27.69434928894043, "global_step": 600906, "epoch": 7239} {"train_loss": -27.810083389282227, "global_step": 600907, "epoch": 7239} {"train_loss": -28.094440460205078, "global_step": 600908, "epoch": 7239} {"train_loss": -27.905187606811523, "global_step": 600909, "epoch": 7239} {"train_loss": -28.229263305664062, "global_step": 600910, "epoch": 7239} {"train_loss": -27.96807861328125, "global_step": 600911, "epoch": 7239} {"train_loss": -27.96461296081543, "global_step": 600912, "epoch": 7239} {"train_loss": -27.875141143798828, "global_step": 600913, "epoch": 7239} {"train_loss": -28.083677291870117, "global_step": 600914, "epoch": 7239} {"train_loss": -28.11067008972168, "global_step": 600915, "epoch": 7239} {"train_loss": -28.090612411499023, "global_step": 600916, "epoch": 7239} {"train_loss": -28.12841796875, "global_step": 600917, "epoch": 7239} {"train_loss": -28.32447624206543, "global_step": 600918, "epoch": 7239} {"train_loss": -27.666544282292744, "global_step": 600919, "epoch": 7239, "val_loss": 6581721.0} {"train_loss": -27.474042892456055, "global_step": 600920, "epoch": 7240} {"train_loss": -27.488431930541992, "global_step": 600921, "epoch": 7240} {"train_loss": -27.390583038330078, "global_step": 600922, "epoch": 7240} {"train_loss": -27.656600952148438, "global_step": 600923, "epoch": 7240} {"train_loss": -27.703678131103516, "global_step": 600924, "epoch": 7240} {"train_loss": -27.8464298248291, "global_step": 600925, "epoch": 7240} {"train_loss": -27.4499568939209, "global_step": 600926, "epoch": 7240} {"train_loss": -27.765689849853516, "global_step": 600927, "epoch": 7240} {"train_loss": -27.85609245300293, "global_step": 600928, "epoch": 7240} {"train_loss": -28.03046989440918, "global_step": 600929, "epoch": 7240} {"train_loss": -27.730600357055664, "global_step": 600930, "epoch": 7240} {"train_loss": -27.57672119140625, "global_step": 600931, "epoch": 7240} {"train_loss": -27.700159072875977, "global_step": 600932, "epoch": 7240} {"train_loss": -28.000701904296875, "global_step": 600933, "epoch": 7240} {"train_loss": -28.20706558227539, "global_step": 600934, "epoch": 7240} {"train_loss": -27.907394409179688, "global_step": 600935, "epoch": 7240} {"train_loss": -27.833189010620117, "global_step": 600936, "epoch": 7240} {"train_loss": -27.75238609313965, "global_step": 600937, "epoch": 7240} {"train_loss": -27.867401123046875, "global_step": 600938, "epoch": 7240} {"train_loss": -27.952524185180664, "global_step": 600939, "epoch": 7240} {"train_loss": -28.06769371032715, "global_step": 600940, "epoch": 7240} {"train_loss": -28.188465118408203, "global_step": 600941, "epoch": 7240} {"train_loss": -27.88803482055664, "global_step": 600942, "epoch": 7240} {"train_loss": -28.130109786987305, "global_step": 600943, "epoch": 7240} {"train_loss": -28.595901489257812, "global_step": 600944, "epoch": 7240} {"train_loss": -28.151580810546875, "global_step": 600945, "epoch": 7240} {"train_loss": -28.236846923828125, "global_step": 600946, "epoch": 7240} {"train_loss": -28.2119197845459, "global_step": 600947, "epoch": 7240} {"train_loss": -28.447065353393555, "global_step": 600948, "epoch": 7240} {"train_loss": -28.082672119140625, "global_step": 600949, "epoch": 7240} {"train_loss": -28.803546905517578, "global_step": 600950, "epoch": 7240} {"train_loss": -28.123584747314453, "global_step": 600951, "epoch": 7240} {"train_loss": -28.122610092163086, "global_step": 600952, "epoch": 7240} {"train_loss": -28.05170249938965, "global_step": 600953, "epoch": 7240} {"train_loss": -28.00676918029785, "global_step": 600954, "epoch": 7240} {"train_loss": -28.200681686401367, "global_step": 600955, "epoch": 7240} {"train_loss": -27.956897735595703, "global_step": 600956, "epoch": 7240} {"train_loss": -28.08169937133789, "global_step": 600957, "epoch": 7240} {"train_loss": -28.137113571166992, "global_step": 600958, "epoch": 7240} {"train_loss": -28.501087188720703, "global_step": 600959, "epoch": 7240} {"train_loss": -28.182666778564453, "global_step": 600960, "epoch": 7240} {"train_loss": -27.652158737182617, "global_step": 600961, "epoch": 7240} {"train_loss": -27.819486618041992, "global_step": 600962, "epoch": 7240} {"train_loss": -27.787023544311523, "global_step": 600963, "epoch": 7240} {"train_loss": -28.154953002929688, "global_step": 600964, "epoch": 7240} {"train_loss": -28.206064224243164, "global_step": 600965, "epoch": 7240} {"train_loss": -28.08929443359375, "global_step": 600966, "epoch": 7240} {"train_loss": -28.16607093811035, "global_step": 600967, "epoch": 7240} {"train_loss": -28.18454360961914, "global_step": 600968, "epoch": 7240} {"train_loss": -27.794824600219727, "global_step": 600969, "epoch": 7240} {"train_loss": -27.971160888671875, "global_step": 600970, "epoch": 7240} {"train_loss": -28.30841636657715, "global_step": 600971, "epoch": 7240} {"train_loss": -28.390182495117188, "global_step": 600972, "epoch": 7240} {"train_loss": -28.074310302734375, "global_step": 600973, "epoch": 7240} {"train_loss": -28.036579132080078, "global_step": 600974, "epoch": 7240} {"train_loss": -28.568042755126953, "global_step": 600975, "epoch": 7240} {"train_loss": -28.262845993041992, "global_step": 600976, "epoch": 7240} {"train_loss": -28.014144897460938, "global_step": 600977, "epoch": 7240} {"train_loss": -27.7674617767334, "global_step": 600978, "epoch": 7240} {"train_loss": -27.6845703125, "global_step": 600979, "epoch": 7240} {"train_loss": -27.937219619750977, "global_step": 600980, "epoch": 7240} {"train_loss": -28.08941650390625, "global_step": 600981, "epoch": 7240} {"train_loss": -28.167394638061523, "global_step": 600982, "epoch": 7240} {"train_loss": -27.5814208984375, "global_step": 600983, "epoch": 7240} {"train_loss": -27.543537139892578, "global_step": 600984, "epoch": 7240} {"train_loss": -27.652551651000977, "global_step": 600985, "epoch": 7240} {"train_loss": -28.114978790283203, "global_step": 600986, "epoch": 7240} {"train_loss": -27.9760684967041, "global_step": 600987, "epoch": 7240} {"train_loss": -28.18265724182129, "global_step": 600988, "epoch": 7240} {"train_loss": -28.012704849243164, "global_step": 600989, "epoch": 7240} {"train_loss": -27.7127685546875, "global_step": 600990, "epoch": 7240} {"train_loss": -28.082426071166992, "global_step": 600991, "epoch": 7240} {"train_loss": -28.30364418029785, "global_step": 600992, "epoch": 7240} {"train_loss": -28.24163818359375, "global_step": 600993, "epoch": 7240} {"train_loss": -28.1773681640625, "global_step": 600994, "epoch": 7240} {"train_loss": -28.13155174255371, "global_step": 600995, "epoch": 7240} {"train_loss": -28.013050079345703, "global_step": 600996, "epoch": 7240} {"train_loss": -28.394561767578125, "global_step": 600997, "epoch": 7240} {"train_loss": -28.158823013305664, "global_step": 600998, "epoch": 7240} {"train_loss": -28.17771339416504, "global_step": 600999, "epoch": 7240} {"train_loss": -28.0288028717041, "global_step": 601000, "epoch": 7240} {"train_loss": -28.165069580078125, "global_step": 601001, "epoch": 7240} {"train_loss": -28.012711352612598, "global_step": 601002, "epoch": 7240, "val_loss": 6503137.0} {"train_loss": -27.7102108001709, "global_step": 601003, "epoch": 7241} {"train_loss": -27.9034423828125, "global_step": 601004, "epoch": 7241} {"train_loss": -28.04193115234375, "global_step": 601005, "epoch": 7241} {"train_loss": -27.9254093170166, "global_step": 601006, "epoch": 7241} {"train_loss": -27.932931900024414, "global_step": 601007, "epoch": 7241} {"train_loss": -27.629724502563477, "global_step": 601008, "epoch": 7241} {"train_loss": -27.845483779907227, "global_step": 601009, "epoch": 7241} {"train_loss": -27.884632110595703, "global_step": 601010, "epoch": 7241} {"train_loss": -27.712371826171875, "global_step": 601011, "epoch": 7241} {"train_loss": -27.9259033203125, "global_step": 601012, "epoch": 7241} {"train_loss": -27.709197998046875, "global_step": 601013, "epoch": 7241} {"train_loss": -28.120868682861328, "global_step": 601014, "epoch": 7241} {"train_loss": -27.998682022094727, "global_step": 601015, "epoch": 7241} {"train_loss": -27.97256851196289, "global_step": 601016, "epoch": 7241} {"train_loss": -27.9394474029541, "global_step": 601017, "epoch": 7241} {"train_loss": -27.675445556640625, "global_step": 601018, "epoch": 7241} {"train_loss": -28.093952178955078, "global_step": 601019, "epoch": 7241} {"train_loss": -28.2199764251709, "global_step": 601020, "epoch": 7241} {"train_loss": -27.908369064331055, "global_step": 601021, "epoch": 7241} {"train_loss": -27.903961181640625, "global_step": 601022, "epoch": 7241} {"train_loss": -28.080183029174805, "global_step": 601023, "epoch": 7241} {"train_loss": -28.192174911499023, "global_step": 601024, "epoch": 7241} {"train_loss": -28.020292282104492, "global_step": 601025, "epoch": 7241} {"train_loss": -27.607196807861328, "global_step": 601026, "epoch": 7241} {"train_loss": -28.16046142578125, "global_step": 601027, "epoch": 7241} {"train_loss": -28.07459831237793, "global_step": 601028, "epoch": 7241} {"train_loss": -28.1707820892334, "global_step": 601029, "epoch": 7241} {"train_loss": -27.777210235595703, "global_step": 601030, "epoch": 7241} {"train_loss": -28.22381591796875, "global_step": 601031, "epoch": 7241} {"train_loss": -28.383508682250977, "global_step": 601032, "epoch": 7241} {"train_loss": -28.321863174438477, "global_step": 601033, "epoch": 7241} {"train_loss": -27.930206298828125, "global_step": 601034, "epoch": 7241} {"train_loss": -27.73101806640625, "global_step": 601035, "epoch": 7241} {"train_loss": -27.69687271118164, "global_step": 601036, "epoch": 7241} {"train_loss": -27.69631004333496, "global_step": 601037, "epoch": 7241} {"train_loss": -28.007612228393555, "global_step": 601038, "epoch": 7241} {"train_loss": -27.7692928314209, "global_step": 601039, "epoch": 7241} {"train_loss": -28.106550216674805, "global_step": 601040, "epoch": 7241} {"train_loss": -28.118864059448242, "global_step": 601041, "epoch": 7241} {"train_loss": -27.724668502807617, "global_step": 601042, "epoch": 7241} {"train_loss": -28.07990837097168, "global_step": 601043, "epoch": 7241} {"train_loss": -28.143695831298828, "global_step": 601044, "epoch": 7241} {"train_loss": -27.994953155517578, "global_step": 601045, "epoch": 7241} {"train_loss": -27.66688346862793, "global_step": 601046, "epoch": 7241} {"train_loss": -28.0246639251709, "global_step": 601047, "epoch": 7241} {"train_loss": -27.635522842407227, "global_step": 601048, "epoch": 7241} {"train_loss": -28.19813346862793, "global_step": 601049, "epoch": 7241} {"train_loss": -27.854040145874023, "global_step": 601050, "epoch": 7241} {"train_loss": -27.742345809936523, "global_step": 601051, "epoch": 7241} {"train_loss": -27.96408462524414, "global_step": 601052, "epoch": 7241} {"train_loss": -28.126855850219727, "global_step": 601053, "epoch": 7241} {"train_loss": -28.081130981445312, "global_step": 601054, "epoch": 7241} {"train_loss": -27.6701717376709, "global_step": 601055, "epoch": 7241} {"train_loss": -28.209259033203125, "global_step": 601056, "epoch": 7241} {"train_loss": -28.101858139038086, "global_step": 601057, "epoch": 7241} {"train_loss": -27.493871688842773, "global_step": 601058, "epoch": 7241} {"train_loss": -27.962345123291016, "global_step": 601059, "epoch": 7241} {"train_loss": -27.610639572143555, "global_step": 601060, "epoch": 7241} {"train_loss": -28.122900009155273, "global_step": 601061, "epoch": 7241} {"train_loss": -27.97686195373535, "global_step": 601062, "epoch": 7241} {"train_loss": -27.861896514892578, "global_step": 601063, "epoch": 7241} {"train_loss": -27.92392349243164, "global_step": 601064, "epoch": 7241} {"train_loss": -27.73590660095215, "global_step": 601065, "epoch": 7241} {"train_loss": -27.883886337280273, "global_step": 601066, "epoch": 7241} {"train_loss": -27.987878799438477, "global_step": 601067, "epoch": 7241} {"train_loss": -28.151220321655273, "global_step": 601068, "epoch": 7241} {"train_loss": -27.83222770690918, "global_step": 601069, "epoch": 7241} {"train_loss": -28.050893783569336, "global_step": 601070, "epoch": 7241} {"train_loss": -28.040771484375, "global_step": 601071, "epoch": 7241} {"train_loss": -27.81363296508789, "global_step": 601072, "epoch": 7241} {"train_loss": -27.758441925048828, "global_step": 601073, "epoch": 7241} {"train_loss": -28.090723037719727, "global_step": 601074, "epoch": 7241} {"train_loss": -27.94099235534668, "global_step": 601075, "epoch": 7241} {"train_loss": -27.885177612304688, "global_step": 601076, "epoch": 7241} {"train_loss": -28.091339111328125, "global_step": 601077, "epoch": 7241} {"train_loss": -27.9981689453125, "global_step": 601078, "epoch": 7241} {"train_loss": -27.990493774414062, "global_step": 601079, "epoch": 7241} {"train_loss": -28.1014404296875, "global_step": 601080, "epoch": 7241} {"train_loss": -28.244089126586914, "global_step": 601081, "epoch": 7241} {"train_loss": -28.004087448120117, "global_step": 601082, "epoch": 7241} {"train_loss": -28.318754196166992, "global_step": 601083, "epoch": 7241} {"train_loss": -28.133899688720703, "global_step": 601084, "epoch": 7241} {"train_loss": -27.976094762962983, "global_step": 601085, "epoch": 7241, "val_loss": 6523554.0} {"train_loss": -27.90752601623535, "global_step": 601086, "epoch": 7242} {"train_loss": -28.228403091430664, "global_step": 601087, "epoch": 7242} {"train_loss": -28.18458366394043, "global_step": 601088, "epoch": 7242} {"train_loss": -27.913928985595703, "global_step": 601089, "epoch": 7242} {"train_loss": -28.289794921875, "global_step": 601090, "epoch": 7242} {"train_loss": -28.072296142578125, "global_step": 601091, "epoch": 7242} {"train_loss": -28.02947998046875, "global_step": 601092, "epoch": 7242} {"train_loss": -27.872058868408203, "global_step": 601093, "epoch": 7242} {"train_loss": -27.803380966186523, "global_step": 601094, "epoch": 7242} {"train_loss": -28.053634643554688, "global_step": 601095, "epoch": 7242} {"train_loss": -28.101118087768555, "global_step": 601096, "epoch": 7242} {"train_loss": -27.804426193237305, "global_step": 601097, "epoch": 7242} {"train_loss": -27.955488204956055, "global_step": 601098, "epoch": 7242} {"train_loss": -27.901447296142578, "global_step": 601099, "epoch": 7242} {"train_loss": -27.91314697265625, "global_step": 601100, "epoch": 7242} {"train_loss": -28.0032901763916, "global_step": 601101, "epoch": 7242} {"train_loss": -27.967426300048828, "global_step": 601102, "epoch": 7242} {"train_loss": -28.127756118774414, "global_step": 601103, "epoch": 7242} {"train_loss": -27.928125381469727, "global_step": 601104, "epoch": 7242} {"train_loss": -27.8623046875, "global_step": 601105, "epoch": 7242} {"train_loss": -28.05832862854004, "global_step": 601106, "epoch": 7242} {"train_loss": -28.147907257080078, "global_step": 601107, "epoch": 7242} {"train_loss": -27.82608985900879, "global_step": 601108, "epoch": 7242} {"train_loss": -28.114072799682617, "global_step": 601109, "epoch": 7242} {"train_loss": -28.306976318359375, "global_step": 601110, "epoch": 7242} {"train_loss": -27.916732788085938, "global_step": 601111, "epoch": 7242} {"train_loss": -28.1787052154541, "global_step": 601112, "epoch": 7242} {"train_loss": -27.738630294799805, "global_step": 601113, "epoch": 7242} {"train_loss": -28.038190841674805, "global_step": 601114, "epoch": 7242} {"train_loss": -27.818115234375, "global_step": 601115, "epoch": 7242} {"train_loss": -28.08631706237793, "global_step": 601116, "epoch": 7242} {"train_loss": -27.998693466186523, "global_step": 601117, "epoch": 7242} {"train_loss": -27.780689239501953, "global_step": 601118, "epoch": 7242} {"train_loss": -28.581235885620117, "global_step": 601119, "epoch": 7242} {"train_loss": -27.970233917236328, "global_step": 601120, "epoch": 7242} {"train_loss": -28.22401237487793, "global_step": 601121, "epoch": 7242} {"train_loss": -28.2125301361084, "global_step": 601122, "epoch": 7242} {"train_loss": -27.711349487304688, "global_step": 601123, "epoch": 7242} {"train_loss": -28.185291290283203, "global_step": 601124, "epoch": 7242} {"train_loss": -27.904829025268555, "global_step": 601125, "epoch": 7242} {"train_loss": -27.99224281311035, "global_step": 601126, "epoch": 7242} {"train_loss": -28.352008819580078, "global_step": 601127, "epoch": 7242} {"train_loss": -28.236347198486328, "global_step": 601128, "epoch": 7242} {"train_loss": -27.974252700805664, "global_step": 601129, "epoch": 7242} {"train_loss": -28.054935455322266, "global_step": 601130, "epoch": 7242} {"train_loss": -28.06770133972168, "global_step": 601131, "epoch": 7242} {"train_loss": -27.807798385620117, "global_step": 601132, "epoch": 7242} {"train_loss": -27.892301559448242, "global_step": 601133, "epoch": 7242} {"train_loss": -27.780603408813477, "global_step": 601134, "epoch": 7242} {"train_loss": -28.04538917541504, "global_step": 601135, "epoch": 7242} {"train_loss": -28.204669952392578, "global_step": 601136, "epoch": 7242} {"train_loss": -27.79790687561035, "global_step": 601137, "epoch": 7242} {"train_loss": -27.586088180541992, "global_step": 601138, "epoch": 7242} {"train_loss": -28.5650577545166, "global_step": 601139, "epoch": 7242} {"train_loss": -27.791763305664062, "global_step": 601140, "epoch": 7242} {"train_loss": -28.167621612548828, "global_step": 601141, "epoch": 7242} {"train_loss": -27.95830726623535, "global_step": 601142, "epoch": 7242} {"train_loss": -27.934436798095703, "global_step": 601143, "epoch": 7242} {"train_loss": -27.84244155883789, "global_step": 601144, "epoch": 7242} {"train_loss": -27.915735244750977, "global_step": 601145, "epoch": 7242} {"train_loss": -28.4422664642334, "global_step": 601146, "epoch": 7242} {"train_loss": -27.76974868774414, "global_step": 601147, "epoch": 7242} {"train_loss": -27.85994529724121, "global_step": 601148, "epoch": 7242} {"train_loss": -27.78741455078125, "global_step": 601149, "epoch": 7242} {"train_loss": -28.053754806518555, "global_step": 601150, "epoch": 7242} {"train_loss": -27.893991470336914, "global_step": 601151, "epoch": 7242} {"train_loss": -28.268238067626953, "global_step": 601152, "epoch": 7242} {"train_loss": -27.87446403503418, "global_step": 601153, "epoch": 7242} {"train_loss": -27.687971115112305, "global_step": 601154, "epoch": 7242} {"train_loss": -27.9002742767334, "global_step": 601155, "epoch": 7242} {"train_loss": -27.4129581451416, "global_step": 601156, "epoch": 7242} {"train_loss": -28.20503044128418, "global_step": 601157, "epoch": 7242} {"train_loss": -28.17996597290039, "global_step": 601158, "epoch": 7242} {"train_loss": -27.616291046142578, "global_step": 601159, "epoch": 7242} {"train_loss": -28.056766510009766, "global_step": 601160, "epoch": 7242} {"train_loss": -28.128446578979492, "global_step": 601161, "epoch": 7242} {"train_loss": -27.914051055908203, "global_step": 601162, "epoch": 7242} {"train_loss": -27.79250144958496, "global_step": 601163, "epoch": 7242} {"train_loss": -28.104785919189453, "global_step": 601164, "epoch": 7242} {"train_loss": -27.857568740844727, "global_step": 601165, "epoch": 7242} {"train_loss": -28.00006675720215, "global_step": 601166, "epoch": 7242} {"train_loss": -28.208698272705078, "global_step": 601167, "epoch": 7242} {"train_loss": -27.999636960316852, "global_step": 601168, "epoch": 7242, "val_loss": 6515637.5} {"train_loss": -27.69105339050293, "global_step": 601169, "epoch": 7243} {"train_loss": -27.786041259765625, "global_step": 601170, "epoch": 7243} {"train_loss": -27.742115020751953, "global_step": 601171, "epoch": 7243} {"train_loss": -27.41651725769043, "global_step": 601172, "epoch": 7243} {"train_loss": -27.841999053955078, "global_step": 601173, "epoch": 7243} {"train_loss": -27.889646530151367, "global_step": 601174, "epoch": 7243} {"train_loss": -27.76897621154785, "global_step": 601175, "epoch": 7243} {"train_loss": -27.463764190673828, "global_step": 601176, "epoch": 7243} {"train_loss": -27.577930450439453, "global_step": 601177, "epoch": 7243} {"train_loss": -28.033140182495117, "global_step": 601178, "epoch": 7243} {"train_loss": -28.25514030456543, "global_step": 601179, "epoch": 7243} {"train_loss": -27.937891006469727, "global_step": 601180, "epoch": 7243} {"train_loss": -28.089956283569336, "global_step": 601181, "epoch": 7243} {"train_loss": -28.138227462768555, "global_step": 601182, "epoch": 7243} {"train_loss": -27.93927001953125, "global_step": 601183, "epoch": 7243} {"train_loss": -28.22072410583496, "global_step": 601184, "epoch": 7243} {"train_loss": -28.04950523376465, "global_step": 601185, "epoch": 7243} {"train_loss": -27.811126708984375, "global_step": 601186, "epoch": 7243} {"train_loss": -27.945005416870117, "global_step": 601187, "epoch": 7243} {"train_loss": -27.830982208251953, "global_step": 601188, "epoch": 7243} {"train_loss": -27.8438663482666, "global_step": 601189, "epoch": 7243} {"train_loss": -27.998626708984375, "global_step": 601190, "epoch": 7243} {"train_loss": -28.125263214111328, "global_step": 601191, "epoch": 7243} {"train_loss": -27.725278854370117, "global_step": 601192, "epoch": 7243} {"train_loss": -27.7248477935791, "global_step": 601193, "epoch": 7243} {"train_loss": -28.265050888061523, "global_step": 601194, "epoch": 7243} {"train_loss": -28.055789947509766, "global_step": 601195, "epoch": 7243} {"train_loss": -28.2187442779541, "global_step": 601196, "epoch": 7243} {"train_loss": -28.03053092956543, "global_step": 601197, "epoch": 7243} {"train_loss": -27.75494384765625, "global_step": 601198, "epoch": 7243} {"train_loss": -28.1365909576416, "global_step": 601199, "epoch": 7243} {"train_loss": -28.312841415405273, "global_step": 601200, "epoch": 7243} {"train_loss": -27.78156089782715, "global_step": 601201, "epoch": 7243} {"train_loss": -27.71502685546875, "global_step": 601202, "epoch": 7243} {"train_loss": -27.924230575561523, "global_step": 601203, "epoch": 7243} {"train_loss": -27.755359649658203, "global_step": 601204, "epoch": 7243} {"train_loss": -27.60870361328125, "global_step": 601205, "epoch": 7243} {"train_loss": -28.15886878967285, "global_step": 601206, "epoch": 7243} {"train_loss": -27.709497451782227, "global_step": 601207, "epoch": 7243} {"train_loss": -27.75164222717285, "global_step": 601208, "epoch": 7243} {"train_loss": -27.89794921875, "global_step": 601209, "epoch": 7243} {"train_loss": -27.9932804107666, "global_step": 601210, "epoch": 7243} {"train_loss": -27.539840698242188, "global_step": 601211, "epoch": 7243} {"train_loss": -28.122119903564453, "global_step": 601212, "epoch": 7243} {"train_loss": -28.1583251953125, "global_step": 601213, "epoch": 7243} {"train_loss": -27.600854873657227, "global_step": 601214, "epoch": 7243} {"train_loss": -27.904569625854492, "global_step": 601215, "epoch": 7243} {"train_loss": -27.754474639892578, "global_step": 601216, "epoch": 7243} {"train_loss": -28.21058464050293, "global_step": 601217, "epoch": 7243} {"train_loss": -28.068206787109375, "global_step": 601218, "epoch": 7243} {"train_loss": -28.034717559814453, "global_step": 601219, "epoch": 7243} {"train_loss": -28.3833065032959, "global_step": 601220, "epoch": 7243} {"train_loss": -28.09211540222168, "global_step": 601221, "epoch": 7243} {"train_loss": -28.300861358642578, "global_step": 601222, "epoch": 7243} {"train_loss": -28.09930992126465, "global_step": 601223, "epoch": 7243} {"train_loss": -28.264570236206055, "global_step": 601224, "epoch": 7243} {"train_loss": -28.27561378479004, "global_step": 601225, "epoch": 7243} {"train_loss": -28.167993545532227, "global_step": 601226, "epoch": 7243} {"train_loss": -28.13154411315918, "global_step": 601227, "epoch": 7243} {"train_loss": -27.983068466186523, "global_step": 601228, "epoch": 7243} {"train_loss": -28.280736923217773, "global_step": 601229, "epoch": 7243} {"train_loss": -27.93983268737793, "global_step": 601230, "epoch": 7243} {"train_loss": -28.195798873901367, "global_step": 601231, "epoch": 7243} {"train_loss": -28.093961715698242, "global_step": 601232, "epoch": 7243} {"train_loss": -27.987152099609375, "global_step": 601233, "epoch": 7243} {"train_loss": -27.94060707092285, "global_step": 601234, "epoch": 7243} {"train_loss": -28.133960723876953, "global_step": 601235, "epoch": 7243} {"train_loss": -28.224023818969727, "global_step": 601236, "epoch": 7243} {"train_loss": -28.353076934814453, "global_step": 601237, "epoch": 7243} {"train_loss": -28.06568717956543, "global_step": 601238, "epoch": 7243} {"train_loss": -27.860395431518555, "global_step": 601239, "epoch": 7243} {"train_loss": -28.008996963500977, "global_step": 601240, "epoch": 7243} {"train_loss": -28.370969772338867, "global_step": 601241, "epoch": 7243} {"train_loss": -28.15638542175293, "global_step": 601242, "epoch": 7243} {"train_loss": -28.321060180664062, "global_step": 601243, "epoch": 7243} {"train_loss": -28.442087173461914, "global_step": 601244, "epoch": 7243} {"train_loss": -27.841772079467773, "global_step": 601245, "epoch": 7243} {"train_loss": -28.326343536376953, "global_step": 601246, "epoch": 7243} {"train_loss": -28.523496627807617, "global_step": 601247, "epoch": 7243} {"train_loss": -28.407175064086914, "global_step": 601248, "epoch": 7243} {"train_loss": -27.6423282623291, "global_step": 601249, "epoch": 7243} {"train_loss": -28.190473556518555, "global_step": 601250, "epoch": 7243} {"train_loss": -28.007770699190807, "global_step": 601251, "epoch": 7243, "val_loss": 6537927.5} {"train_loss": -27.382043838500977, "global_step": 601252, "epoch": 7244} {"train_loss": -26.669483184814453, "global_step": 601253, "epoch": 7244} {"train_loss": -25.813379287719727, "global_step": 601254, "epoch": 7244} {"train_loss": -25.23665428161621, "global_step": 601255, "epoch": 7244} {"train_loss": -25.3358097076416, "global_step": 601256, "epoch": 7244} {"train_loss": -27.52560806274414, "global_step": 601257, "epoch": 7244} {"train_loss": -24.920860290527344, "global_step": 601258, "epoch": 7244} {"train_loss": -27.108503341674805, "global_step": 601259, "epoch": 7244} {"train_loss": -25.68277359008789, "global_step": 601260, "epoch": 7244} {"train_loss": -27.172666549682617, "global_step": 601261, "epoch": 7244} {"train_loss": -25.944995880126953, "global_step": 601262, "epoch": 7244} {"train_loss": -27.045124053955078, "global_step": 601263, "epoch": 7244} {"train_loss": -26.68573570251465, "global_step": 601264, "epoch": 7244} {"train_loss": -26.994338989257812, "global_step": 601265, "epoch": 7244} {"train_loss": -26.96616554260254, "global_step": 601266, "epoch": 7244} {"train_loss": -27.439191818237305, "global_step": 601267, "epoch": 7244} {"train_loss": -27.539875030517578, "global_step": 601268, "epoch": 7244} {"train_loss": -26.91328239440918, "global_step": 601269, "epoch": 7244} {"train_loss": -27.455862045288086, "global_step": 601270, "epoch": 7244} {"train_loss": -27.37849998474121, "global_step": 601271, "epoch": 7244} {"train_loss": -27.284713745117188, "global_step": 601272, "epoch": 7244} {"train_loss": -27.436429977416992, "global_step": 601273, "epoch": 7244} {"train_loss": -27.48978042602539, "global_step": 601274, "epoch": 7244} {"train_loss": -27.505491256713867, "global_step": 601275, "epoch": 7244} {"train_loss": -27.3251953125, "global_step": 601276, "epoch": 7244} {"train_loss": -27.639877319335938, "global_step": 601277, "epoch": 7244} {"train_loss": -27.22352409362793, "global_step": 601278, "epoch": 7244} {"train_loss": -27.303625106811523, "global_step": 601279, "epoch": 7244} {"train_loss": -27.557987213134766, "global_step": 601280, "epoch": 7244} {"train_loss": -27.09571647644043, "global_step": 601281, "epoch": 7244} {"train_loss": -27.769947052001953, "global_step": 601282, "epoch": 7244} {"train_loss": -27.593875885009766, "global_step": 601283, "epoch": 7244} {"train_loss": -27.658857345581055, "global_step": 601284, "epoch": 7244} {"train_loss": -27.7658748626709, "global_step": 601285, "epoch": 7244} {"train_loss": -27.647947311401367, "global_step": 601286, "epoch": 7244} {"train_loss": -27.655414581298828, "global_step": 601287, "epoch": 7244} {"train_loss": -27.703842163085938, "global_step": 601288, "epoch": 7244} {"train_loss": -27.82819175720215, "global_step": 601289, "epoch": 7244} {"train_loss": -27.883596420288086, "global_step": 601290, "epoch": 7244} {"train_loss": -27.59754753112793, "global_step": 601291, "epoch": 7244} {"train_loss": -27.930479049682617, "global_step": 601292, "epoch": 7244} {"train_loss": -27.565631866455078, "global_step": 601293, "epoch": 7244} {"train_loss": -28.037811279296875, "global_step": 601294, "epoch": 7244} {"train_loss": -28.01539421081543, "global_step": 601295, "epoch": 7244} {"train_loss": -27.77735710144043, "global_step": 601296, "epoch": 7244} {"train_loss": -27.97938346862793, "global_step": 601297, "epoch": 7244} {"train_loss": -28.182220458984375, "global_step": 601298, "epoch": 7244} {"train_loss": -28.18807029724121, "global_step": 601299, "epoch": 7244} {"train_loss": -27.930770874023438, "global_step": 601300, "epoch": 7244} {"train_loss": -28.177520751953125, "global_step": 601301, "epoch": 7244} {"train_loss": -28.155813217163086, "global_step": 601302, "epoch": 7244} {"train_loss": -27.778793334960938, "global_step": 601303, "epoch": 7244} {"train_loss": -27.803434371948242, "global_step": 601304, "epoch": 7244} {"train_loss": -27.959426879882812, "global_step": 601305, "epoch": 7244} {"train_loss": -28.230518341064453, "global_step": 601306, "epoch": 7244} {"train_loss": -27.954669952392578, "global_step": 601307, "epoch": 7244} {"train_loss": -27.741607666015625, "global_step": 601308, "epoch": 7244} {"train_loss": -28.019712448120117, "global_step": 601309, "epoch": 7244} {"train_loss": -27.79922866821289, "global_step": 601310, "epoch": 7244} {"train_loss": -27.982755661010742, "global_step": 601311, "epoch": 7244} {"train_loss": -28.256696701049805, "global_step": 601312, "epoch": 7244} {"train_loss": -28.213354110717773, "global_step": 601313, "epoch": 7244} {"train_loss": -28.22831153869629, "global_step": 601314, "epoch": 7244} {"train_loss": -28.074481964111328, "global_step": 601315, "epoch": 7244} {"train_loss": -28.1087646484375, "global_step": 601316, "epoch": 7244} {"train_loss": -27.843124389648438, "global_step": 601317, "epoch": 7244} {"train_loss": -28.055130004882812, "global_step": 601318, "epoch": 7244} {"train_loss": -28.502399444580078, "global_step": 601319, "epoch": 7244} {"train_loss": -28.201257705688477, "global_step": 601320, "epoch": 7244} {"train_loss": -28.342529296875, "global_step": 601321, "epoch": 7244} {"train_loss": -28.118396759033203, "global_step": 601322, "epoch": 7244} {"train_loss": -27.922719955444336, "global_step": 601323, "epoch": 7244} {"train_loss": -28.576623916625977, "global_step": 601324, "epoch": 7244} {"train_loss": -28.28338050842285, "global_step": 601325, "epoch": 7244} {"train_loss": -28.731687545776367, "global_step": 601326, "epoch": 7244} {"train_loss": -27.9123477935791, "global_step": 601327, "epoch": 7244} {"train_loss": -28.107406616210938, "global_step": 601328, "epoch": 7244} {"train_loss": -28.106714248657227, "global_step": 601329, "epoch": 7244} {"train_loss": -28.2933349609375, "global_step": 601330, "epoch": 7244} {"train_loss": -28.104902267456055, "global_step": 601331, "epoch": 7244} {"train_loss": -28.597822189331055, "global_step": 601332, "epoch": 7244} {"train_loss": -28.180585861206055, "global_step": 601333, "epoch": 7244} {"train_loss": -27.600429787693255, "global_step": 601334, "epoch": 7244, "val_loss": 6492348.5} {"train_loss": -27.111133575439453, "global_step": 601335, "epoch": 7245} {"train_loss": -26.406147003173828, "global_step": 601336, "epoch": 7245} {"train_loss": -25.400226593017578, "global_step": 601337, "epoch": 7245} {"train_loss": -25.195833206176758, "global_step": 601338, "epoch": 7245} {"train_loss": -26.676013946533203, "global_step": 601339, "epoch": 7245} {"train_loss": -26.835556030273438, "global_step": 601340, "epoch": 7245} {"train_loss": -26.115198135375977, "global_step": 601341, "epoch": 7245} {"train_loss": -26.993375778198242, "global_step": 601342, "epoch": 7245} {"train_loss": -26.482946395874023, "global_step": 601343, "epoch": 7245} {"train_loss": -26.802261352539062, "global_step": 601344, "epoch": 7245} {"train_loss": -27.37212562561035, "global_step": 601345, "epoch": 7245} {"train_loss": -27.209197998046875, "global_step": 601346, "epoch": 7245} {"train_loss": -26.873138427734375, "global_step": 601347, "epoch": 7245} {"train_loss": -27.355255126953125, "global_step": 601348, "epoch": 7245} {"train_loss": -26.817834854125977, "global_step": 601349, "epoch": 7245} {"train_loss": -27.4160099029541, "global_step": 601350, "epoch": 7245} {"train_loss": -27.118860244750977, "global_step": 601351, "epoch": 7245} {"train_loss": -27.68535804748535, "global_step": 601352, "epoch": 7245} {"train_loss": -27.192914962768555, "global_step": 601353, "epoch": 7245} {"train_loss": -27.118167877197266, "global_step": 601354, "epoch": 7245} {"train_loss": -27.593168258666992, "global_step": 601355, "epoch": 7245} {"train_loss": -27.47222900390625, "global_step": 601356, "epoch": 7245} {"train_loss": -27.38129997253418, "global_step": 601357, "epoch": 7245} {"train_loss": -27.298986434936523, "global_step": 601358, "epoch": 7245} {"train_loss": -27.92030143737793, "global_step": 601359, "epoch": 7245} {"train_loss": -27.557086944580078, "global_step": 601360, "epoch": 7245} {"train_loss": -27.7094783782959, "global_step": 601361, "epoch": 7245} {"train_loss": -27.7432918548584, "global_step": 601362, "epoch": 7245} {"train_loss": -27.669342041015625, "global_step": 601363, "epoch": 7245} {"train_loss": -27.582111358642578, "global_step": 601364, "epoch": 7245} {"train_loss": -27.73484230041504, "global_step": 601365, "epoch": 7245} {"train_loss": -27.96732521057129, "global_step": 601366, "epoch": 7245} {"train_loss": -27.39007568359375, "global_step": 601367, "epoch": 7245} {"train_loss": -28.005645751953125, "global_step": 601368, "epoch": 7245} {"train_loss": -27.95855712890625, "global_step": 601369, "epoch": 7245} {"train_loss": -27.760025024414062, "global_step": 601370, "epoch": 7245} {"train_loss": -28.025592803955078, "global_step": 601371, "epoch": 7245} {"train_loss": -27.82415771484375, "global_step": 601372, "epoch": 7245} {"train_loss": -27.87395668029785, "global_step": 601373, "epoch": 7245} {"train_loss": -27.782245635986328, "global_step": 601374, "epoch": 7245} {"train_loss": -27.76580238342285, "global_step": 601375, "epoch": 7245} {"train_loss": -27.99725914001465, "global_step": 601376, "epoch": 7245} {"train_loss": -27.852020263671875, "global_step": 601377, "epoch": 7245} {"train_loss": -27.941864013671875, "global_step": 601378, "epoch": 7245} {"train_loss": -27.88178062438965, "global_step": 601379, "epoch": 7245} {"train_loss": -28.170312881469727, "global_step": 601380, "epoch": 7245} {"train_loss": -27.923877716064453, "global_step": 601381, "epoch": 7245} {"train_loss": -27.983877182006836, "global_step": 601382, "epoch": 7245} {"train_loss": -28.152801513671875, "global_step": 601383, "epoch": 7245} {"train_loss": -28.386520385742188, "global_step": 601384, "epoch": 7245} {"train_loss": -27.95347023010254, "global_step": 601385, "epoch": 7245} {"train_loss": -27.85691261291504, "global_step": 601386, "epoch": 7245} {"train_loss": -28.13007926940918, "global_step": 601387, "epoch": 7245} {"train_loss": -27.771167755126953, "global_step": 601388, "epoch": 7245} {"train_loss": -28.17890739440918, "global_step": 601389, "epoch": 7245} {"train_loss": -28.25189208984375, "global_step": 601390, "epoch": 7245} {"train_loss": -27.742389678955078, "global_step": 601391, "epoch": 7245} {"train_loss": -28.34528923034668, "global_step": 601392, "epoch": 7245} {"train_loss": -27.973180770874023, "global_step": 601393, "epoch": 7245} {"train_loss": -28.135732650756836, "global_step": 601394, "epoch": 7245} {"train_loss": -28.00922966003418, "global_step": 601395, "epoch": 7245} {"train_loss": -27.79071044921875, "global_step": 601396, "epoch": 7245} {"train_loss": -28.389850616455078, "global_step": 601397, "epoch": 7245} {"train_loss": -28.191415786743164, "global_step": 601398, "epoch": 7245} {"train_loss": -28.235559463500977, "global_step": 601399, "epoch": 7245} {"train_loss": -27.98383140563965, "global_step": 601400, "epoch": 7245} {"train_loss": -28.26873779296875, "global_step": 601401, "epoch": 7245} {"train_loss": -28.143386840820312, "global_step": 601402, "epoch": 7245} {"train_loss": -28.38149070739746, "global_step": 601403, "epoch": 7245} {"train_loss": -28.289335250854492, "global_step": 601404, "epoch": 7245} {"train_loss": -28.16303825378418, "global_step": 601405, "epoch": 7245} {"train_loss": -28.2628173828125, "global_step": 601406, "epoch": 7245} {"train_loss": -28.14381217956543, "global_step": 601407, "epoch": 7245} {"train_loss": -28.27813720703125, "global_step": 601408, "epoch": 7245} {"train_loss": -28.364423751831055, "global_step": 601409, "epoch": 7245} {"train_loss": -28.01479148864746, "global_step": 601410, "epoch": 7245} {"train_loss": -28.27508544921875, "global_step": 601411, "epoch": 7245} {"train_loss": -28.11677360534668, "global_step": 601412, "epoch": 7245} {"train_loss": -28.394460678100586, "global_step": 601413, "epoch": 7245} {"train_loss": -28.10111427307129, "global_step": 601414, "epoch": 7245} {"train_loss": -28.096288681030273, "global_step": 601415, "epoch": 7245} {"train_loss": -28.258466720581055, "global_step": 601416, "epoch": 7245} {"train_loss": -27.70749248366758, "global_step": 601417, "epoch": 7245, "val_loss": 6535294.5} {"train_loss": -27.683425903320312, "global_step": 601418, "epoch": 7246} {"train_loss": -27.224105834960938, "global_step": 601419, "epoch": 7246} {"train_loss": -26.6763973236084, "global_step": 601420, "epoch": 7246} {"train_loss": -27.512109756469727, "global_step": 601421, "epoch": 7246} {"train_loss": -27.58466911315918, "global_step": 601422, "epoch": 7246} {"train_loss": -27.17725944519043, "global_step": 601423, "epoch": 7246} {"train_loss": -27.382862091064453, "global_step": 601424, "epoch": 7246} {"train_loss": -26.9483642578125, "global_step": 601425, "epoch": 7246} {"train_loss": -27.913013458251953, "global_step": 601426, "epoch": 7246} {"train_loss": -27.517337799072266, "global_step": 601427, "epoch": 7246} {"train_loss": -27.45914077758789, "global_step": 601428, "epoch": 7246} {"train_loss": -27.650903701782227, "global_step": 601429, "epoch": 7246} {"train_loss": -27.61272621154785, "global_step": 601430, "epoch": 7246} {"train_loss": -27.71735954284668, "global_step": 601431, "epoch": 7246} {"train_loss": -27.58342933654785, "global_step": 601432, "epoch": 7246} {"train_loss": -27.98252296447754, "global_step": 601433, "epoch": 7246} {"train_loss": -27.831058502197266, "global_step": 601434, "epoch": 7246} {"train_loss": -27.96734619140625, "global_step": 601435, "epoch": 7246} {"train_loss": -27.832544326782227, "global_step": 601436, "epoch": 7246} {"train_loss": -28.18739128112793, "global_step": 601437, "epoch": 7246} {"train_loss": -27.768280029296875, "global_step": 601438, "epoch": 7246} {"train_loss": -27.960046768188477, "global_step": 601439, "epoch": 7246} {"train_loss": -28.017780303955078, "global_step": 601440, "epoch": 7246} {"train_loss": -27.833831787109375, "global_step": 601441, "epoch": 7246} {"train_loss": -28.03803062438965, "global_step": 601442, "epoch": 7246} {"train_loss": -27.674396514892578, "global_step": 601443, "epoch": 7246} {"train_loss": -27.863988876342773, "global_step": 601444, "epoch": 7246} {"train_loss": -28.01542091369629, "global_step": 601445, "epoch": 7246} {"train_loss": -27.92877769470215, "global_step": 601446, "epoch": 7246} {"train_loss": -28.152790069580078, "global_step": 601447, "epoch": 7246} {"train_loss": -28.16059684753418, "global_step": 601448, "epoch": 7246} {"train_loss": -28.2559757232666, "global_step": 601449, "epoch": 7246} {"train_loss": -27.975757598876953, "global_step": 601450, "epoch": 7246} {"train_loss": -27.91963768005371, "global_step": 601451, "epoch": 7246} {"train_loss": -27.84444236755371, "global_step": 601452, "epoch": 7246} {"train_loss": -27.943435668945312, "global_step": 601453, "epoch": 7246} {"train_loss": -28.378286361694336, "global_step": 601454, "epoch": 7246} {"train_loss": -28.088598251342773, "global_step": 601455, "epoch": 7246} {"train_loss": -27.8632869720459, "global_step": 601456, "epoch": 7246} {"train_loss": -28.209827423095703, "global_step": 601457, "epoch": 7246} {"train_loss": -28.0501651763916, "global_step": 601458, "epoch": 7246} {"train_loss": -28.351959228515625, "global_step": 601459, "epoch": 7246} {"train_loss": -27.924535751342773, "global_step": 601460, "epoch": 7246} {"train_loss": -28.46466636657715, "global_step": 601461, "epoch": 7246} {"train_loss": -28.479461669921875, "global_step": 601462, "epoch": 7246} {"train_loss": -27.52808952331543, "global_step": 601463, "epoch": 7246} {"train_loss": -27.3447208404541, "global_step": 601464, "epoch": 7246} {"train_loss": -27.79303550720215, "global_step": 601465, "epoch": 7246} {"train_loss": -28.079986572265625, "global_step": 601466, "epoch": 7246} {"train_loss": -28.1778507232666, "global_step": 601467, "epoch": 7246} {"train_loss": -27.65647315979004, "global_step": 601468, "epoch": 7246} {"train_loss": -28.112319946289062, "global_step": 601469, "epoch": 7246} {"train_loss": -28.449432373046875, "global_step": 601470, "epoch": 7246} {"train_loss": -28.2098331451416, "global_step": 601471, "epoch": 7246} {"train_loss": -28.108478546142578, "global_step": 601472, "epoch": 7246} {"train_loss": -28.174970626831055, "global_step": 601473, "epoch": 7246} {"train_loss": -27.960739135742188, "global_step": 601474, "epoch": 7246} {"train_loss": -27.872400283813477, "global_step": 601475, "epoch": 7246} {"train_loss": -28.20595359802246, "global_step": 601476, "epoch": 7246} {"train_loss": -28.098291397094727, "global_step": 601477, "epoch": 7246} {"train_loss": -27.99134635925293, "global_step": 601478, "epoch": 7246} {"train_loss": -28.364582061767578, "global_step": 601479, "epoch": 7246} {"train_loss": -27.67026138305664, "global_step": 601480, "epoch": 7246} {"train_loss": -28.18900489807129, "global_step": 601481, "epoch": 7246} {"train_loss": -27.84343910217285, "global_step": 601482, "epoch": 7246} {"train_loss": -28.388019561767578, "global_step": 601483, "epoch": 7246} {"train_loss": -27.884206771850586, "global_step": 601484, "epoch": 7246} {"train_loss": -28.094284057617188, "global_step": 601485, "epoch": 7246} {"train_loss": -28.41065788269043, "global_step": 601486, "epoch": 7246} {"train_loss": -28.251916885375977, "global_step": 601487, "epoch": 7246} {"train_loss": -27.97476577758789, "global_step": 601488, "epoch": 7246} {"train_loss": -27.860477447509766, "global_step": 601489, "epoch": 7246} {"train_loss": -28.06671714782715, "global_step": 601490, "epoch": 7246} {"train_loss": -28.08497428894043, "global_step": 601491, "epoch": 7246} {"train_loss": -28.604780197143555, "global_step": 601492, "epoch": 7246} {"train_loss": -28.31599235534668, "global_step": 601493, "epoch": 7246} {"train_loss": -28.374835968017578, "global_step": 601494, "epoch": 7246} {"train_loss": -28.198776245117188, "global_step": 601495, "epoch": 7246} {"train_loss": -27.99518394470215, "global_step": 601496, "epoch": 7246} {"train_loss": -28.375675201416016, "global_step": 601497, "epoch": 7246} {"train_loss": -28.522180557250977, "global_step": 601498, "epoch": 7246} {"train_loss": -28.389719009399414, "global_step": 601499, "epoch": 7246} {"train_loss": -27.973981673458972, "global_step": 601500, "epoch": 7246, "val_loss": 6450799.0} {"train_loss": -26.888898849487305, "global_step": 601501, "epoch": 7247} {"train_loss": -26.034597396850586, "global_step": 601502, "epoch": 7247} {"train_loss": -26.828948974609375, "global_step": 601503, "epoch": 7247} {"train_loss": -26.233047485351562, "global_step": 601504, "epoch": 7247} {"train_loss": -26.858030319213867, "global_step": 601505, "epoch": 7247} {"train_loss": -27.044281005859375, "global_step": 601506, "epoch": 7247} {"train_loss": -26.97687339782715, "global_step": 601507, "epoch": 7247} {"train_loss": -27.035520553588867, "global_step": 601508, "epoch": 7247} {"train_loss": -27.155729293823242, "global_step": 601509, "epoch": 7247} {"train_loss": -26.85445213317871, "global_step": 601510, "epoch": 7247} {"train_loss": -27.230255126953125, "global_step": 601511, "epoch": 7247} {"train_loss": -27.56201171875, "global_step": 601512, "epoch": 7247} {"train_loss": -27.097904205322266, "global_step": 601513, "epoch": 7247} {"train_loss": -26.938451766967773, "global_step": 601514, "epoch": 7247} {"train_loss": -26.860456466674805, "global_step": 601515, "epoch": 7247} {"train_loss": -27.198902130126953, "global_step": 601516, "epoch": 7247} {"train_loss": -26.5683650970459, "global_step": 601517, "epoch": 7247} {"train_loss": -27.21026039123535, "global_step": 601518, "epoch": 7247} {"train_loss": -27.159351348876953, "global_step": 601519, "epoch": 7247} {"train_loss": -27.42123794555664, "global_step": 601520, "epoch": 7247} {"train_loss": -27.069198608398438, "global_step": 601521, "epoch": 7247} {"train_loss": -27.302038192749023, "global_step": 601522, "epoch": 7247} {"train_loss": -27.102807998657227, "global_step": 601523, "epoch": 7247} {"train_loss": -27.48882484436035, "global_step": 601524, "epoch": 7247} {"train_loss": -27.71487808227539, "global_step": 601525, "epoch": 7247} {"train_loss": -27.671018600463867, "global_step": 601526, "epoch": 7247} {"train_loss": -27.529203414916992, "global_step": 601527, "epoch": 7247} {"train_loss": -27.60249137878418, "global_step": 601528, "epoch": 7247} {"train_loss": -27.674365997314453, "global_step": 601529, "epoch": 7247} {"train_loss": -27.648818969726562, "global_step": 601530, "epoch": 7247} {"train_loss": -27.56743812561035, "global_step": 601531, "epoch": 7247} {"train_loss": -27.66330337524414, "global_step": 601532, "epoch": 7247} {"train_loss": -27.771093368530273, "global_step": 601533, "epoch": 7247} {"train_loss": -27.795074462890625, "global_step": 601534, "epoch": 7247} {"train_loss": -27.601491928100586, "global_step": 601535, "epoch": 7247} {"train_loss": -27.4929141998291, "global_step": 601536, "epoch": 7247} {"train_loss": -27.664112091064453, "global_step": 601537, "epoch": 7247} {"train_loss": -27.638580322265625, "global_step": 601538, "epoch": 7247} {"train_loss": -27.5268497467041, "global_step": 601539, "epoch": 7247} {"train_loss": -27.989316940307617, "global_step": 601540, "epoch": 7247} {"train_loss": -27.911060333251953, "global_step": 601541, "epoch": 7247} {"train_loss": -28.105249404907227, "global_step": 601542, "epoch": 7247} {"train_loss": -28.247344970703125, "global_step": 601543, "epoch": 7247} {"train_loss": -28.251279830932617, "global_step": 601544, "epoch": 7247} {"train_loss": -28.113422393798828, "global_step": 601545, "epoch": 7247} {"train_loss": -28.162500381469727, "global_step": 601546, "epoch": 7247} {"train_loss": -28.399261474609375, "global_step": 601547, "epoch": 7247} {"train_loss": -28.171064376831055, "global_step": 601548, "epoch": 7247} {"train_loss": -28.112567901611328, "global_step": 601549, "epoch": 7247} {"train_loss": -27.996870040893555, "global_step": 601550, "epoch": 7247} {"train_loss": -28.002038955688477, "global_step": 601551, "epoch": 7247} {"train_loss": -27.8851261138916, "global_step": 601552, "epoch": 7247} {"train_loss": -28.292499542236328, "global_step": 601553, "epoch": 7247} {"train_loss": -28.308908462524414, "global_step": 601554, "epoch": 7247} {"train_loss": -27.9337158203125, "global_step": 601555, "epoch": 7247} {"train_loss": -28.175012588500977, "global_step": 601556, "epoch": 7247} {"train_loss": -28.368146896362305, "global_step": 601557, "epoch": 7247} {"train_loss": -28.379901885986328, "global_step": 601558, "epoch": 7247} {"train_loss": -28.2688045501709, "global_step": 601559, "epoch": 7247} {"train_loss": -28.06184959411621, "global_step": 601560, "epoch": 7247} {"train_loss": -28.1780948638916, "global_step": 601561, "epoch": 7247} {"train_loss": -28.203399658203125, "global_step": 601562, "epoch": 7247} {"train_loss": -28.48822021484375, "global_step": 601563, "epoch": 7247} {"train_loss": -28.407697677612305, "global_step": 601564, "epoch": 7247} {"train_loss": -27.69243812561035, "global_step": 601565, "epoch": 7247} {"train_loss": -28.377395629882812, "global_step": 601566, "epoch": 7247} {"train_loss": -28.193212509155273, "global_step": 601567, "epoch": 7247} {"train_loss": -28.158700942993164, "global_step": 601568, "epoch": 7247} {"train_loss": -27.924152374267578, "global_step": 601569, "epoch": 7247} {"train_loss": -27.83162498474121, "global_step": 601570, "epoch": 7247} {"train_loss": -27.571935653686523, "global_step": 601571, "epoch": 7247} {"train_loss": -28.36256217956543, "global_step": 601572, "epoch": 7247} {"train_loss": -27.569604873657227, "global_step": 601573, "epoch": 7247} {"train_loss": -28.29694175720215, "global_step": 601574, "epoch": 7247} {"train_loss": -27.891393661499023, "global_step": 601575, "epoch": 7247} {"train_loss": -27.94843864440918, "global_step": 601576, "epoch": 7247} {"train_loss": -28.064123153686523, "global_step": 601577, "epoch": 7247} {"train_loss": -28.611047744750977, "global_step": 601578, "epoch": 7247} {"train_loss": -28.47560691833496, "global_step": 601579, "epoch": 7247} {"train_loss": -27.895532608032227, "global_step": 601580, "epoch": 7247} {"train_loss": -28.521774291992188, "global_step": 601581, "epoch": 7247} {"train_loss": -28.0646915435791, "global_step": 601582, "epoch": 7247} {"train_loss": -27.724579133183124, "global_step": 601583, "epoch": 7247, "val_loss": 6833003.0} {"train_loss": -26.22711181640625, "global_step": 601584, "epoch": 7248} {"train_loss": -26.080219268798828, "global_step": 601585, "epoch": 7248} {"train_loss": -26.615081787109375, "global_step": 601586, "epoch": 7248} {"train_loss": -26.712570190429688, "global_step": 601587, "epoch": 7248} {"train_loss": -26.440631866455078, "global_step": 601588, "epoch": 7248} {"train_loss": -26.53287696838379, "global_step": 601589, "epoch": 7248} {"train_loss": -26.829877853393555, "global_step": 601590, "epoch": 7248} {"train_loss": -26.59765625, "global_step": 601591, "epoch": 7248} {"train_loss": -27.0358829498291, "global_step": 601592, "epoch": 7248} {"train_loss": -26.775177001953125, "global_step": 601593, "epoch": 7248} {"train_loss": -27.56201171875, "global_step": 601594, "epoch": 7248} {"train_loss": -27.234638214111328, "global_step": 601595, "epoch": 7248} {"train_loss": -27.33017921447754, "global_step": 601596, "epoch": 7248} {"train_loss": -27.352508544921875, "global_step": 601597, "epoch": 7248} {"train_loss": -27.121496200561523, "global_step": 601598, "epoch": 7248} {"train_loss": -27.69951820373535, "global_step": 601599, "epoch": 7248} {"train_loss": -27.591596603393555, "global_step": 601600, "epoch": 7248} {"train_loss": -27.4427433013916, "global_step": 601601, "epoch": 7248} {"train_loss": -27.663068771362305, "global_step": 601602, "epoch": 7248} {"train_loss": -27.37760353088379, "global_step": 601603, "epoch": 7248} {"train_loss": -27.480600357055664, "global_step": 601604, "epoch": 7248} {"train_loss": -27.747207641601562, "global_step": 601605, "epoch": 7248} {"train_loss": -27.487882614135742, "global_step": 601606, "epoch": 7248} {"train_loss": -27.713851928710938, "global_step": 601607, "epoch": 7248} {"train_loss": -27.587804794311523, "global_step": 601608, "epoch": 7248} {"train_loss": -27.8859920501709, "global_step": 601609, "epoch": 7248} {"train_loss": -27.825180053710938, "global_step": 601610, "epoch": 7248} {"train_loss": -27.947656631469727, "global_step": 601611, "epoch": 7248} {"train_loss": -27.90096092224121, "global_step": 601612, "epoch": 7248} {"train_loss": -27.590490341186523, "global_step": 601613, "epoch": 7248} {"train_loss": -27.780054092407227, "global_step": 601614, "epoch": 7248} {"train_loss": -27.969100952148438, "global_step": 601615, "epoch": 7248} {"train_loss": -27.92909812927246, "global_step": 601616, "epoch": 7248} {"train_loss": -27.902694702148438, "global_step": 601617, "epoch": 7248} {"train_loss": -27.802839279174805, "global_step": 601618, "epoch": 7248} {"train_loss": -27.877832412719727, "global_step": 601619, "epoch": 7248} {"train_loss": -28.121952056884766, "global_step": 601620, "epoch": 7248} {"train_loss": -27.504932403564453, "global_step": 601621, "epoch": 7248} {"train_loss": -28.047733306884766, "global_step": 601622, "epoch": 7248} {"train_loss": -28.390716552734375, "global_step": 601623, "epoch": 7248} {"train_loss": -28.011966705322266, "global_step": 601624, "epoch": 7248} {"train_loss": -28.0286865234375, "global_step": 601625, "epoch": 7248} {"train_loss": -27.976398468017578, "global_step": 601626, "epoch": 7248} {"train_loss": -28.181264877319336, "global_step": 601627, "epoch": 7248} {"train_loss": -27.7225399017334, "global_step": 601628, "epoch": 7248} {"train_loss": -28.168012619018555, "global_step": 601629, "epoch": 7248} {"train_loss": -28.37381935119629, "global_step": 601630, "epoch": 7248} {"train_loss": -27.77303123474121, "global_step": 601631, "epoch": 7248} {"train_loss": -27.9928035736084, "global_step": 601632, "epoch": 7248} {"train_loss": -28.38083267211914, "global_step": 601633, "epoch": 7248} {"train_loss": -28.05759048461914, "global_step": 601634, "epoch": 7248} {"train_loss": -28.41314125061035, "global_step": 601635, "epoch": 7248} {"train_loss": -28.018911361694336, "global_step": 601636, "epoch": 7248} {"train_loss": -28.026010513305664, "global_step": 601637, "epoch": 7248} {"train_loss": -28.027923583984375, "global_step": 601638, "epoch": 7248} {"train_loss": -28.3603515625, "global_step": 601639, "epoch": 7248} {"train_loss": -28.383108139038086, "global_step": 601640, "epoch": 7248} {"train_loss": -28.363019943237305, "global_step": 601641, "epoch": 7248} {"train_loss": -28.5683536529541, "global_step": 601642, "epoch": 7248} {"train_loss": -28.129507064819336, "global_step": 601643, "epoch": 7248} {"train_loss": -28.474491119384766, "global_step": 601644, "epoch": 7248} {"train_loss": -28.129608154296875, "global_step": 601645, "epoch": 7248} {"train_loss": -28.17506217956543, "global_step": 601646, "epoch": 7248} {"train_loss": -28.31854248046875, "global_step": 601647, "epoch": 7248} {"train_loss": -28.355146408081055, "global_step": 601648, "epoch": 7248} {"train_loss": -28.224212646484375, "global_step": 601649, "epoch": 7248} {"train_loss": -28.338659286499023, "global_step": 601650, "epoch": 7248} {"train_loss": -27.987760543823242, "global_step": 601651, "epoch": 7248} {"train_loss": -28.058752059936523, "global_step": 601652, "epoch": 7248} {"train_loss": -28.062713623046875, "global_step": 601653, "epoch": 7248} {"train_loss": -27.959430694580078, "global_step": 601654, "epoch": 7248} {"train_loss": -28.163660049438477, "global_step": 601655, "epoch": 7248} {"train_loss": -28.238784790039062, "global_step": 601656, "epoch": 7248} {"train_loss": -28.43657875061035, "global_step": 601657, "epoch": 7248} {"train_loss": -27.993396759033203, "global_step": 601658, "epoch": 7248} {"train_loss": -28.052038192749023, "global_step": 601659, "epoch": 7248} {"train_loss": -27.475698471069336, "global_step": 601660, "epoch": 7248} {"train_loss": -27.774694442749023, "global_step": 601661, "epoch": 7248} {"train_loss": -27.065488815307617, "global_step": 601662, "epoch": 7248} {"train_loss": -26.7746524810791, "global_step": 601663, "epoch": 7248} {"train_loss": -27.65926170349121, "global_step": 601664, "epoch": 7248} {"train_loss": -28.210508346557617, "global_step": 601665, "epoch": 7248} {"train_loss": -27.734487119927465, "global_step": 601666, "epoch": 7248, "val_loss": 6584328.5} {"train_loss": -26.717321395874023, "global_step": 601667, "epoch": 7249} {"train_loss": -27.23484230041504, "global_step": 601668, "epoch": 7249} {"train_loss": -26.702795028686523, "global_step": 601669, "epoch": 7249} {"train_loss": -27.280960083007812, "global_step": 601670, "epoch": 7249} {"train_loss": -26.420059204101562, "global_step": 601671, "epoch": 7249} {"train_loss": -27.14994239807129, "global_step": 601672, "epoch": 7249} {"train_loss": -26.54291343688965, "global_step": 601673, "epoch": 7249} {"train_loss": -27.41383171081543, "global_step": 601674, "epoch": 7249} {"train_loss": -27.24439811706543, "global_step": 601675, "epoch": 7249} {"train_loss": -26.898183822631836, "global_step": 601676, "epoch": 7249} {"train_loss": -27.518686294555664, "global_step": 601677, "epoch": 7249} {"train_loss": -27.00031852722168, "global_step": 601678, "epoch": 7249} {"train_loss": -27.5041446685791, "global_step": 601679, "epoch": 7249} {"train_loss": -26.95338249206543, "global_step": 601680, "epoch": 7249} {"train_loss": -27.272024154663086, "global_step": 601681, "epoch": 7249} {"train_loss": -27.9776554107666, "global_step": 601682, "epoch": 7249} {"train_loss": -27.581024169921875, "global_step": 601683, "epoch": 7249} {"train_loss": -27.806283950805664, "global_step": 601684, "epoch": 7249} {"train_loss": -27.857135772705078, "global_step": 601685, "epoch": 7249} {"train_loss": -27.295621871948242, "global_step": 601686, "epoch": 7249} {"train_loss": -27.821868896484375, "global_step": 601687, "epoch": 7249} {"train_loss": -27.730194091796875, "global_step": 601688, "epoch": 7249} {"train_loss": -27.69227409362793, "global_step": 601689, "epoch": 7249} {"train_loss": -28.0126953125, "global_step": 601690, "epoch": 7249} {"train_loss": -27.839574813842773, "global_step": 601691, "epoch": 7249} {"train_loss": -27.599592208862305, "global_step": 601692, "epoch": 7249} {"train_loss": -27.747507095336914, "global_step": 601693, "epoch": 7249} {"train_loss": -27.909137725830078, "global_step": 601694, "epoch": 7249} {"train_loss": -28.074512481689453, "global_step": 601695, "epoch": 7249} {"train_loss": -27.78092384338379, "global_step": 601696, "epoch": 7249} {"train_loss": -27.844701766967773, "global_step": 601697, "epoch": 7249} {"train_loss": -27.764062881469727, "global_step": 601698, "epoch": 7249} {"train_loss": -27.91497230529785, "global_step": 601699, "epoch": 7249} {"train_loss": -28.101953506469727, "global_step": 601700, "epoch": 7249} {"train_loss": -27.851913452148438, "global_step": 601701, "epoch": 7249} {"train_loss": -28.092315673828125, "global_step": 601702, "epoch": 7249} {"train_loss": -28.245319366455078, "global_step": 601703, "epoch": 7249} {"train_loss": -27.7602481842041, "global_step": 601704, "epoch": 7249} {"train_loss": -28.1176815032959, "global_step": 601705, "epoch": 7249} {"train_loss": -27.427764892578125, "global_step": 601706, "epoch": 7249} {"train_loss": -28.09946060180664, "global_step": 601707, "epoch": 7249} {"train_loss": -27.86154556274414, "global_step": 601708, "epoch": 7249} {"train_loss": -28.001312255859375, "global_step": 601709, "epoch": 7249} {"train_loss": -27.833759307861328, "global_step": 601710, "epoch": 7249} {"train_loss": -28.16107177734375, "global_step": 601711, "epoch": 7249} {"train_loss": -27.989395141601562, "global_step": 601712, "epoch": 7249} {"train_loss": -27.750965118408203, "global_step": 601713, "epoch": 7249} {"train_loss": -27.918609619140625, "global_step": 601714, "epoch": 7249} {"train_loss": -28.339685440063477, "global_step": 601715, "epoch": 7249} {"train_loss": -28.033437728881836, "global_step": 601716, "epoch": 7249} {"train_loss": -28.38172721862793, "global_step": 601717, "epoch": 7249} {"train_loss": -28.1427059173584, "global_step": 601718, "epoch": 7249} {"train_loss": -28.130842208862305, "global_step": 601719, "epoch": 7249} {"train_loss": -28.281518936157227, "global_step": 601720, "epoch": 7249} {"train_loss": -27.93463706970215, "global_step": 601721, "epoch": 7249} {"train_loss": -27.85052490234375, "global_step": 601722, "epoch": 7249} {"train_loss": -27.77515983581543, "global_step": 601723, "epoch": 7249} {"train_loss": -28.206302642822266, "global_step": 601724, "epoch": 7249} {"train_loss": -28.06623649597168, "global_step": 601725, "epoch": 7249} {"train_loss": -28.173078536987305, "global_step": 601726, "epoch": 7249} {"train_loss": -27.961328506469727, "global_step": 601727, "epoch": 7249} {"train_loss": -27.738067626953125, "global_step": 601728, "epoch": 7249} {"train_loss": -27.88722801208496, "global_step": 601729, "epoch": 7249} {"train_loss": -28.16109275817871, "global_step": 601730, "epoch": 7249} {"train_loss": -28.0885009765625, "global_step": 601731, "epoch": 7249} {"train_loss": -27.932453155517578, "global_step": 601732, "epoch": 7249} {"train_loss": -28.203283309936523, "global_step": 601733, "epoch": 7249} {"train_loss": -28.463056564331055, "global_step": 601734, "epoch": 7249} {"train_loss": -27.919233322143555, "global_step": 601735, "epoch": 7249} {"train_loss": -28.1157283782959, "global_step": 601736, "epoch": 7249} {"train_loss": -28.076467514038086, "global_step": 601737, "epoch": 7249} {"train_loss": -28.252201080322266, "global_step": 601738, "epoch": 7249} {"train_loss": -28.015012741088867, "global_step": 601739, "epoch": 7249} {"train_loss": -27.819416046142578, "global_step": 601740, "epoch": 7249} {"train_loss": -28.2601375579834, "global_step": 601741, "epoch": 7249} {"train_loss": -28.307037353515625, "global_step": 601742, "epoch": 7249} {"train_loss": -27.909738540649414, "global_step": 601743, "epoch": 7249} {"train_loss": -27.987060546875, "global_step": 601744, "epoch": 7249} {"train_loss": -27.7811222076416, "global_step": 601745, "epoch": 7249} {"train_loss": -28.671064376831055, "global_step": 601746, "epoch": 7249} {"train_loss": -28.132404327392578, "global_step": 601747, "epoch": 7249} {"train_loss": -28.11199951171875, "global_step": 601748, "epoch": 7249} {"train_loss": -27.805396045546935, "global_step": 601749, "epoch": 7249, "val_loss": 6588236.5} {"train_loss": -28.01171875, "global_step": 601750, "epoch": 7250} {"train_loss": -28.10003089904785, "global_step": 601751, "epoch": 7250} {"train_loss": -27.965911865234375, "global_step": 601752, "epoch": 7250} {"train_loss": -28.43233299255371, "global_step": 601753, "epoch": 7250} {"train_loss": -27.648813247680664, "global_step": 601754, "epoch": 7250} {"train_loss": -27.8299503326416, "global_step": 601755, "epoch": 7250} {"train_loss": -27.691858291625977, "global_step": 601756, "epoch": 7250} {"train_loss": -27.910253524780273, "global_step": 601757, "epoch": 7250} {"train_loss": -27.938154220581055, "global_step": 601758, "epoch": 7250} {"train_loss": -27.94795036315918, "global_step": 601759, "epoch": 7250} {"train_loss": -27.814558029174805, "global_step": 601760, "epoch": 7250} {"train_loss": -27.81732177734375, "global_step": 601761, "epoch": 7250} {"train_loss": -28.00507164001465, "global_step": 601762, "epoch": 7250} {"train_loss": -27.972869873046875, "global_step": 601763, "epoch": 7250} {"train_loss": -27.8880615234375, "global_step": 601764, "epoch": 7250} {"train_loss": -27.597503662109375, "global_step": 601765, "epoch": 7250} {"train_loss": -28.052001953125, "global_step": 601766, "epoch": 7250} {"train_loss": -27.567480087280273, "global_step": 601767, "epoch": 7250} {"train_loss": -28.46235466003418, "global_step": 601768, "epoch": 7250} {"train_loss": -28.153730392456055, "global_step": 601769, "epoch": 7250} {"train_loss": -28.175153732299805, "global_step": 601770, "epoch": 7250} {"train_loss": -28.254779815673828, "global_step": 601771, "epoch": 7250} {"train_loss": -28.028223037719727, "global_step": 601772, "epoch": 7250} {"train_loss": -28.074817657470703, "global_step": 601773, "epoch": 7250} {"train_loss": -28.192182540893555, "global_step": 601774, "epoch": 7250} {"train_loss": -27.785245895385742, "global_step": 601775, "epoch": 7250} {"train_loss": -28.115453720092773, "global_step": 601776, "epoch": 7250} {"train_loss": -27.78086280822754, "global_step": 601777, "epoch": 7250} {"train_loss": -28.04245376586914, "global_step": 601778, "epoch": 7250} {"train_loss": -28.270933151245117, "global_step": 601779, "epoch": 7250} {"train_loss": -28.138715744018555, "global_step": 601780, "epoch": 7250} {"train_loss": -28.287841796875, "global_step": 601781, "epoch": 7250} {"train_loss": -28.111988067626953, "global_step": 601782, "epoch": 7250} {"train_loss": -28.09722900390625, "global_step": 601783, "epoch": 7250} {"train_loss": -28.286279678344727, "global_step": 601784, "epoch": 7250} {"train_loss": -28.12839698791504, "global_step": 601785, "epoch": 7250} {"train_loss": -28.086523056030273, "global_step": 601786, "epoch": 7250} {"train_loss": -27.959741592407227, "global_step": 601787, "epoch": 7250} {"train_loss": -28.149763107299805, "global_step": 601788, "epoch": 7250} {"train_loss": -28.186216354370117, "global_step": 601789, "epoch": 7250} {"train_loss": -28.3029727935791, "global_step": 601790, "epoch": 7250} {"train_loss": -28.221715927124023, "global_step": 601791, "epoch": 7250} {"train_loss": -28.028583526611328, "global_step": 601792, "epoch": 7250} {"train_loss": -28.32988929748535, "global_step": 601793, "epoch": 7250} {"train_loss": -28.124069213867188, "global_step": 601794, "epoch": 7250} {"train_loss": -27.91742515563965, "global_step": 601795, "epoch": 7250} {"train_loss": -28.562978744506836, "global_step": 601796, "epoch": 7250} {"train_loss": -28.061695098876953, "global_step": 601797, "epoch": 7250} {"train_loss": -28.07441520690918, "global_step": 601798, "epoch": 7250} {"train_loss": -27.829090118408203, "global_step": 601799, "epoch": 7250} {"train_loss": -28.526798248291016, "global_step": 601800, "epoch": 7250} {"train_loss": -28.370441436767578, "global_step": 601801, "epoch": 7250} {"train_loss": -28.06903648376465, "global_step": 601802, "epoch": 7250} {"train_loss": -28.009626388549805, "global_step": 601803, "epoch": 7250} {"train_loss": -27.759897232055664, "global_step": 601804, "epoch": 7250} {"train_loss": -28.113819122314453, "global_step": 601805, "epoch": 7250} {"train_loss": -28.026769638061523, "global_step": 601806, "epoch": 7250} {"train_loss": -27.78287696838379, "global_step": 601807, "epoch": 7250} {"train_loss": -28.262048721313477, "global_step": 601808, "epoch": 7250} {"train_loss": -28.1475772857666, "global_step": 601809, "epoch": 7250} {"train_loss": -28.206872940063477, "global_step": 601810, "epoch": 7250} {"train_loss": -28.2473201751709, "global_step": 601811, "epoch": 7250} {"train_loss": -28.092016220092773, "global_step": 601812, "epoch": 7250} {"train_loss": -28.360641479492188, "global_step": 601813, "epoch": 7250} {"train_loss": -27.873926162719727, "global_step": 601814, "epoch": 7250} {"train_loss": -28.065235137939453, "global_step": 601815, "epoch": 7250} {"train_loss": -28.33681297302246, "global_step": 601816, "epoch": 7250} {"train_loss": -28.195423126220703, "global_step": 601817, "epoch": 7250} {"train_loss": -28.37494468688965, "global_step": 601818, "epoch": 7250} {"train_loss": -28.0097599029541, "global_step": 601819, "epoch": 7250} {"train_loss": -28.389862060546875, "global_step": 601820, "epoch": 7250} {"train_loss": -28.3301944732666, "global_step": 601821, "epoch": 7250} {"train_loss": -28.354429244995117, "global_step": 601822, "epoch": 7250} {"train_loss": -28.22052574157715, "global_step": 601823, "epoch": 7250} {"train_loss": -28.257429122924805, "global_step": 601824, "epoch": 7250} {"train_loss": -28.081195831298828, "global_step": 601825, "epoch": 7250} {"train_loss": -28.112842559814453, "global_step": 601826, "epoch": 7250} {"train_loss": -28.126989364624023, "global_step": 601827, "epoch": 7250} {"train_loss": -27.886518478393555, "global_step": 601828, "epoch": 7250} {"train_loss": -28.389801025390625, "global_step": 601829, "epoch": 7250} {"train_loss": -27.9678897857666, "global_step": 601830, "epoch": 7250} {"train_loss": -27.9478759765625, "global_step": 601831, "epoch": 7250} {"train_loss": -28.099136605320208, "global_step": 601832, "epoch": 7250, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.8636363636363636, "val_loss": 6612152.0} {"train_loss": -27.437774658203125, "global_step": 601833, "epoch": 7251} {"train_loss": -26.71591567993164, "global_step": 601834, "epoch": 7251} {"train_loss": -25.12175941467285, "global_step": 601835, "epoch": 7251} {"train_loss": -25.263906478881836, "global_step": 601836, "epoch": 7251} {"train_loss": -26.74256706237793, "global_step": 601837, "epoch": 7251} {"train_loss": -26.85883903503418, "global_step": 601838, "epoch": 7251} {"train_loss": -27.23093032836914, "global_step": 601839, "epoch": 7251} {"train_loss": -26.722858428955078, "global_step": 601840, "epoch": 7251} {"train_loss": -27.285709381103516, "global_step": 601841, "epoch": 7251} {"train_loss": -27.341598510742188, "global_step": 601842, "epoch": 7251} {"train_loss": -27.3760929107666, "global_step": 601843, "epoch": 7251} {"train_loss": -27.5225772857666, "global_step": 601844, "epoch": 7251} {"train_loss": -27.59465980529785, "global_step": 601845, "epoch": 7251} {"train_loss": -27.505590438842773, "global_step": 601846, "epoch": 7251} {"train_loss": -27.52174186706543, "global_step": 601847, "epoch": 7251} {"train_loss": -27.439767837524414, "global_step": 601848, "epoch": 7251} {"train_loss": -27.54347038269043, "global_step": 601849, "epoch": 7251} {"train_loss": -27.74395751953125, "global_step": 601850, "epoch": 7251} {"train_loss": -27.55707359313965, "global_step": 601851, "epoch": 7251} {"train_loss": -27.81125259399414, "global_step": 601852, "epoch": 7251} {"train_loss": -27.831750869750977, "global_step": 601853, "epoch": 7251} {"train_loss": -27.878986358642578, "global_step": 601854, "epoch": 7251} {"train_loss": -27.781213760375977, "global_step": 601855, "epoch": 7251} {"train_loss": -28.054983139038086, "global_step": 601856, "epoch": 7251} {"train_loss": -27.640838623046875, "global_step": 601857, "epoch": 7251} {"train_loss": -27.71187400817871, "global_step": 601858, "epoch": 7251} {"train_loss": -28.03546714782715, "global_step": 601859, "epoch": 7251} {"train_loss": -27.94391441345215, "global_step": 601860, "epoch": 7251} {"train_loss": -27.47553825378418, "global_step": 601861, "epoch": 7251} {"train_loss": -27.83662986755371, "global_step": 601862, "epoch": 7251} {"train_loss": -28.110742568969727, "global_step": 601863, "epoch": 7251} {"train_loss": -28.089704513549805, "global_step": 601864, "epoch": 7251} {"train_loss": -27.619556427001953, "global_step": 601865, "epoch": 7251} {"train_loss": -27.829816818237305, "global_step": 601866, "epoch": 7251} {"train_loss": -28.14773941040039, "global_step": 601867, "epoch": 7251} {"train_loss": -28.117923736572266, "global_step": 601868, "epoch": 7251} {"train_loss": -28.169065475463867, "global_step": 601869, "epoch": 7251} {"train_loss": -28.191986083984375, "global_step": 601870, "epoch": 7251} {"train_loss": -27.617816925048828, "global_step": 601871, "epoch": 7251} {"train_loss": -28.193496704101562, "global_step": 601872, "epoch": 7251} {"train_loss": -28.102209091186523, "global_step": 601873, "epoch": 7251} {"train_loss": -27.847885131835938, "global_step": 601874, "epoch": 7251} {"train_loss": -28.079160690307617, "global_step": 601875, "epoch": 7251} {"train_loss": -28.207324981689453, "global_step": 601876, "epoch": 7251} {"train_loss": -27.979238510131836, "global_step": 601877, "epoch": 7251} {"train_loss": -28.32587242126465, "global_step": 601878, "epoch": 7251} {"train_loss": -27.770709991455078, "global_step": 601879, "epoch": 7251} {"train_loss": -28.626331329345703, "global_step": 601880, "epoch": 7251} {"train_loss": -28.48626136779785, "global_step": 601881, "epoch": 7251} {"train_loss": -28.158374786376953, "global_step": 601882, "epoch": 7251} {"train_loss": -28.34050941467285, "global_step": 601883, "epoch": 7251} {"train_loss": -28.224735260009766, "global_step": 601884, "epoch": 7251} {"train_loss": -27.996862411499023, "global_step": 601885, "epoch": 7251} {"train_loss": -28.224323272705078, "global_step": 601886, "epoch": 7251} {"train_loss": -28.380878448486328, "global_step": 601887, "epoch": 7251} {"train_loss": -28.406774520874023, "global_step": 601888, "epoch": 7251} {"train_loss": -28.3031005859375, "global_step": 601889, "epoch": 7251} {"train_loss": -27.84236717224121, "global_step": 601890, "epoch": 7251} {"train_loss": -28.088764190673828, "global_step": 601891, "epoch": 7251} {"train_loss": -27.735212326049805, "global_step": 601892, "epoch": 7251} {"train_loss": -28.219385147094727, "global_step": 601893, "epoch": 7251} {"train_loss": -28.450708389282227, "global_step": 601894, "epoch": 7251} {"train_loss": -27.78462028503418, "global_step": 601895, "epoch": 7251} {"train_loss": -27.884977340698242, "global_step": 601896, "epoch": 7251} {"train_loss": -28.198810577392578, "global_step": 601897, "epoch": 7251} {"train_loss": -27.932178497314453, "global_step": 601898, "epoch": 7251} {"train_loss": -28.0810546875, "global_step": 601899, "epoch": 7251} {"train_loss": -27.939105987548828, "global_step": 601900, "epoch": 7251} {"train_loss": -27.997419357299805, "global_step": 601901, "epoch": 7251} {"train_loss": -27.927778244018555, "global_step": 601902, "epoch": 7251} {"train_loss": -28.056798934936523, "global_step": 601903, "epoch": 7251} {"train_loss": -28.15175437927246, "global_step": 601904, "epoch": 7251} {"train_loss": -27.782270431518555, "global_step": 601905, "epoch": 7251} {"train_loss": -27.870929718017578, "global_step": 601906, "epoch": 7251} {"train_loss": -27.903827667236328, "global_step": 601907, "epoch": 7251} {"train_loss": -27.4256534576416, "global_step": 601908, "epoch": 7251} {"train_loss": -28.477161407470703, "global_step": 601909, "epoch": 7251} {"train_loss": -28.1530818939209, "global_step": 601910, "epoch": 7251} {"train_loss": -28.075946807861328, "global_step": 601911, "epoch": 7251} {"train_loss": -27.757171630859375, "global_step": 601912, "epoch": 7251} {"train_loss": -28.321781158447266, "global_step": 601913, "epoch": 7251} {"train_loss": -28.1444034576416, "global_step": 601914, "epoch": 7251} {"train_loss": -27.82534192556358, "global_step": 601915, "epoch": 7251, "val_loss": 6611546.0} {"train_loss": -27.248981475830078, "global_step": 601916, "epoch": 7252} {"train_loss": -27.39885902404785, "global_step": 601917, "epoch": 7252} {"train_loss": -27.662790298461914, "global_step": 601918, "epoch": 7252} {"train_loss": -27.698455810546875, "global_step": 601919, "epoch": 7252} {"train_loss": -27.767118453979492, "global_step": 601920, "epoch": 7252} {"train_loss": -27.5328369140625, "global_step": 601921, "epoch": 7252} {"train_loss": -27.459951400756836, "global_step": 601922, "epoch": 7252} {"train_loss": -27.630023956298828, "global_step": 601923, "epoch": 7252} {"train_loss": -27.816791534423828, "global_step": 601924, "epoch": 7252} {"train_loss": -28.00751304626465, "global_step": 601925, "epoch": 7252} {"train_loss": -27.53644371032715, "global_step": 601926, "epoch": 7252} {"train_loss": -27.900415420532227, "global_step": 601927, "epoch": 7252} {"train_loss": -27.376861572265625, "global_step": 601928, "epoch": 7252} {"train_loss": -27.82071304321289, "global_step": 601929, "epoch": 7252} {"train_loss": -27.866119384765625, "global_step": 601930, "epoch": 7252} {"train_loss": -27.695220947265625, "global_step": 601931, "epoch": 7252} {"train_loss": -27.699569702148438, "global_step": 601932, "epoch": 7252} {"train_loss": -27.659423828125, "global_step": 601933, "epoch": 7252} {"train_loss": -27.90170669555664, "global_step": 601934, "epoch": 7252} {"train_loss": -27.686410903930664, "global_step": 601935, "epoch": 7252} {"train_loss": -27.933446884155273, "global_step": 601936, "epoch": 7252} {"train_loss": -27.893173217773438, "global_step": 601937, "epoch": 7252} {"train_loss": -27.484607696533203, "global_step": 601938, "epoch": 7252} {"train_loss": -28.228397369384766, "global_step": 601939, "epoch": 7252} {"train_loss": -28.323444366455078, "global_step": 601940, "epoch": 7252} {"train_loss": -27.895429611206055, "global_step": 601941, "epoch": 7252} {"train_loss": -28.005598068237305, "global_step": 601942, "epoch": 7252} {"train_loss": -27.583114624023438, "global_step": 601943, "epoch": 7252} {"train_loss": -28.277143478393555, "global_step": 601944, "epoch": 7252} {"train_loss": -28.173154830932617, "global_step": 601945, "epoch": 7252} {"train_loss": -27.92714500427246, "global_step": 601946, "epoch": 7252} {"train_loss": -27.931976318359375, "global_step": 601947, "epoch": 7252} {"train_loss": -27.918720245361328, "global_step": 601948, "epoch": 7252} {"train_loss": -28.392114639282227, "global_step": 601949, "epoch": 7252} {"train_loss": -28.126428604125977, "global_step": 601950, "epoch": 7252} {"train_loss": -28.013031005859375, "global_step": 601951, "epoch": 7252} {"train_loss": -28.092493057250977, "global_step": 601952, "epoch": 7252} {"train_loss": -28.281070709228516, "global_step": 601953, "epoch": 7252} {"train_loss": -28.197010040283203, "global_step": 601954, "epoch": 7252} {"train_loss": -28.201303482055664, "global_step": 601955, "epoch": 7252} {"train_loss": -27.839994430541992, "global_step": 601956, "epoch": 7252} {"train_loss": -28.179258346557617, "global_step": 601957, "epoch": 7252} {"train_loss": -28.256799697875977, "global_step": 601958, "epoch": 7252} {"train_loss": -28.11701774597168, "global_step": 601959, "epoch": 7252} {"train_loss": -28.105148315429688, "global_step": 601960, "epoch": 7252} {"train_loss": -28.0754337310791, "global_step": 601961, "epoch": 7252} {"train_loss": -27.894916534423828, "global_step": 601962, "epoch": 7252} {"train_loss": -28.13701820373535, "global_step": 601963, "epoch": 7252} {"train_loss": -27.938339233398438, "global_step": 601964, "epoch": 7252} {"train_loss": -28.1272029876709, "global_step": 601965, "epoch": 7252} {"train_loss": -28.186552047729492, "global_step": 601966, "epoch": 7252} {"train_loss": -27.755081176757812, "global_step": 601967, "epoch": 7252} {"train_loss": -28.152551651000977, "global_step": 601968, "epoch": 7252} {"train_loss": -28.10454750061035, "global_step": 601969, "epoch": 7252} {"train_loss": -28.125585556030273, "global_step": 601970, "epoch": 7252} {"train_loss": -27.73353385925293, "global_step": 601971, "epoch": 7252} {"train_loss": -28.0231990814209, "global_step": 601972, "epoch": 7252} {"train_loss": -28.01958656311035, "global_step": 601973, "epoch": 7252} {"train_loss": -28.060842514038086, "global_step": 601974, "epoch": 7252} {"train_loss": -28.055850982666016, "global_step": 601975, "epoch": 7252} {"train_loss": -27.99533462524414, "global_step": 601976, "epoch": 7252} {"train_loss": -27.567646026611328, "global_step": 601977, "epoch": 7252} {"train_loss": -27.894458770751953, "global_step": 601978, "epoch": 7252} {"train_loss": -27.54443359375, "global_step": 601979, "epoch": 7252} {"train_loss": -27.83424186706543, "global_step": 601980, "epoch": 7252} {"train_loss": -28.070470809936523, "global_step": 601981, "epoch": 7252} {"train_loss": -28.05548667907715, "global_step": 601982, "epoch": 7252} {"train_loss": -28.078174591064453, "global_step": 601983, "epoch": 7252} {"train_loss": -28.445556640625, "global_step": 601984, "epoch": 7252} {"train_loss": -28.1287841796875, "global_step": 601985, "epoch": 7252} {"train_loss": -28.12565040588379, "global_step": 601986, "epoch": 7252} {"train_loss": -28.15738868713379, "global_step": 601987, "epoch": 7252} {"train_loss": -28.16546630859375, "global_step": 601988, "epoch": 7252} {"train_loss": -28.378326416015625, "global_step": 601989, "epoch": 7252} {"train_loss": -27.938032150268555, "global_step": 601990, "epoch": 7252} {"train_loss": -28.123889923095703, "global_step": 601991, "epoch": 7252} {"train_loss": -28.020299911499023, "global_step": 601992, "epoch": 7252} {"train_loss": -28.326675415039062, "global_step": 601993, "epoch": 7252} {"train_loss": -28.447492599487305, "global_step": 601994, "epoch": 7252} {"train_loss": -28.033100128173828, "global_step": 601995, "epoch": 7252} {"train_loss": -28.12849235534668, "global_step": 601996, "epoch": 7252} {"train_loss": -28.340612411499023, "global_step": 601997, "epoch": 7252} {"train_loss": -27.96392408623753, "global_step": 601998, "epoch": 7252, "val_loss": 6531338.0} {"train_loss": -27.217939376831055, "global_step": 601999, "epoch": 7253} {"train_loss": -27.431812286376953, "global_step": 602000, "epoch": 7253} {"train_loss": -27.694290161132812, "global_step": 602001, "epoch": 7253} {"train_loss": -27.68940544128418, "global_step": 602002, "epoch": 7253} {"train_loss": -27.386489868164062, "global_step": 602003, "epoch": 7253} {"train_loss": -27.77205467224121, "global_step": 602004, "epoch": 7253} {"train_loss": -27.171926498413086, "global_step": 602005, "epoch": 7253} {"train_loss": -28.242767333984375, "global_step": 602006, "epoch": 7253} {"train_loss": -27.26508140563965, "global_step": 602007, "epoch": 7253} {"train_loss": -28.2147216796875, "global_step": 602008, "epoch": 7253} {"train_loss": -27.63556480407715, "global_step": 602009, "epoch": 7253} {"train_loss": -27.99471092224121, "global_step": 602010, "epoch": 7253} {"train_loss": -27.876981735229492, "global_step": 602011, "epoch": 7253} {"train_loss": -27.84284782409668, "global_step": 602012, "epoch": 7253} {"train_loss": -27.758838653564453, "global_step": 602013, "epoch": 7253} {"train_loss": -27.9614200592041, "global_step": 602014, "epoch": 7253} {"train_loss": -27.71563148498535, "global_step": 602015, "epoch": 7253} {"train_loss": -28.030078887939453, "global_step": 602016, "epoch": 7253} {"train_loss": -27.895593643188477, "global_step": 602017, "epoch": 7253} {"train_loss": -28.13663673400879, "global_step": 602018, "epoch": 7253} {"train_loss": -27.8432559967041, "global_step": 602019, "epoch": 7253} {"train_loss": -27.826953887939453, "global_step": 602020, "epoch": 7253} {"train_loss": -28.274585723876953, "global_step": 602021, "epoch": 7253} {"train_loss": -28.061767578125, "global_step": 602022, "epoch": 7253} {"train_loss": -27.902395248413086, "global_step": 602023, "epoch": 7253} {"train_loss": -28.011566162109375, "global_step": 602024, "epoch": 7253} {"train_loss": -27.860105514526367, "global_step": 602025, "epoch": 7253} {"train_loss": -27.97052574157715, "global_step": 602026, "epoch": 7253} {"train_loss": -28.1411190032959, "global_step": 602027, "epoch": 7253} {"train_loss": -28.166101455688477, "global_step": 602028, "epoch": 7253} {"train_loss": -28.036575317382812, "global_step": 602029, "epoch": 7253} {"train_loss": -28.26214027404785, "global_step": 602030, "epoch": 7253} {"train_loss": -27.64892578125, "global_step": 602031, "epoch": 7253} {"train_loss": -27.944135665893555, "global_step": 602032, "epoch": 7253} {"train_loss": -28.16529655456543, "global_step": 602033, "epoch": 7253} {"train_loss": -28.20516014099121, "global_step": 602034, "epoch": 7253} {"train_loss": -27.765960693359375, "global_step": 602035, "epoch": 7253} {"train_loss": -28.31794548034668, "global_step": 602036, "epoch": 7253} {"train_loss": -28.136798858642578, "global_step": 602037, "epoch": 7253} {"train_loss": -27.999601364135742, "global_step": 602038, "epoch": 7253} {"train_loss": -27.907007217407227, "global_step": 602039, "epoch": 7253} {"train_loss": -27.903894424438477, "global_step": 602040, "epoch": 7253} {"train_loss": -28.39116859436035, "global_step": 602041, "epoch": 7253} {"train_loss": -27.54975700378418, "global_step": 602042, "epoch": 7253} {"train_loss": -27.938024520874023, "global_step": 602043, "epoch": 7253} {"train_loss": -28.343069076538086, "global_step": 602044, "epoch": 7253} {"train_loss": -27.92682456970215, "global_step": 602045, "epoch": 7253} {"train_loss": -27.879056930541992, "global_step": 602046, "epoch": 7253} {"train_loss": -27.96002197265625, "global_step": 602047, "epoch": 7253} {"train_loss": -28.189905166625977, "global_step": 602048, "epoch": 7253} {"train_loss": -28.071969985961914, "global_step": 602049, "epoch": 7253} {"train_loss": -28.23960304260254, "global_step": 602050, "epoch": 7253} {"train_loss": -28.121109008789062, "global_step": 602051, "epoch": 7253} {"train_loss": -28.1915340423584, "global_step": 602052, "epoch": 7253} {"train_loss": -28.048925399780273, "global_step": 602053, "epoch": 7253} {"train_loss": -28.269617080688477, "global_step": 602054, "epoch": 7253} {"train_loss": -28.308258056640625, "global_step": 602055, "epoch": 7253} {"train_loss": -28.181257247924805, "global_step": 602056, "epoch": 7253} {"train_loss": -27.93317985534668, "global_step": 602057, "epoch": 7253} {"train_loss": -28.382369995117188, "global_step": 602058, "epoch": 7253} {"train_loss": -27.89238929748535, "global_step": 602059, "epoch": 7253} {"train_loss": -28.438318252563477, "global_step": 602060, "epoch": 7253} {"train_loss": -27.8848934173584, "global_step": 602061, "epoch": 7253} {"train_loss": -27.962574005126953, "global_step": 602062, "epoch": 7253} {"train_loss": -28.174161911010742, "global_step": 602063, "epoch": 7253} {"train_loss": -28.299184799194336, "global_step": 602064, "epoch": 7253} {"train_loss": -28.130817413330078, "global_step": 602065, "epoch": 7253} {"train_loss": -28.107526779174805, "global_step": 602066, "epoch": 7253} {"train_loss": -28.028091430664062, "global_step": 602067, "epoch": 7253} {"train_loss": -28.02227783203125, "global_step": 602068, "epoch": 7253} {"train_loss": -28.15370750427246, "global_step": 602069, "epoch": 7253} {"train_loss": -28.376678466796875, "global_step": 602070, "epoch": 7253} {"train_loss": -28.302051544189453, "global_step": 602071, "epoch": 7253} {"train_loss": -28.599628448486328, "global_step": 602072, "epoch": 7253} {"train_loss": -28.037328720092773, "global_step": 602073, "epoch": 7253} {"train_loss": -28.188581466674805, "global_step": 602074, "epoch": 7253} {"train_loss": -28.066192626953125, "global_step": 602075, "epoch": 7253} {"train_loss": -28.118122100830078, "global_step": 602076, "epoch": 7253} {"train_loss": -28.018030166625977, "global_step": 602077, "epoch": 7253} {"train_loss": -27.747669219970703, "global_step": 602078, "epoch": 7253} {"train_loss": -28.73200798034668, "global_step": 602079, "epoch": 7253} {"train_loss": -27.962125778198242, "global_step": 602080, "epoch": 7253} {"train_loss": -27.997579183923193, "global_step": 602081, "epoch": 7253, "val_loss": 6654237.0} {"train_loss": -26.808820724487305, "global_step": 602082, "epoch": 7254} {"train_loss": -25.755659103393555, "global_step": 602083, "epoch": 7254} {"train_loss": -25.03135108947754, "global_step": 602084, "epoch": 7254} {"train_loss": -26.427021026611328, "global_step": 602085, "epoch": 7254} {"train_loss": -26.411222457885742, "global_step": 602086, "epoch": 7254} {"train_loss": -26.106475830078125, "global_step": 602087, "epoch": 7254} {"train_loss": -27.364004135131836, "global_step": 602088, "epoch": 7254} {"train_loss": -27.035694122314453, "global_step": 602089, "epoch": 7254} {"train_loss": -27.08722496032715, "global_step": 602090, "epoch": 7254} {"train_loss": -27.456684112548828, "global_step": 602091, "epoch": 7254} {"train_loss": -26.757892608642578, "global_step": 602092, "epoch": 7254} {"train_loss": -27.00275230407715, "global_step": 602093, "epoch": 7254} {"train_loss": -27.17506980895996, "global_step": 602094, "epoch": 7254} {"train_loss": -27.591522216796875, "global_step": 602095, "epoch": 7254} {"train_loss": -27.225988388061523, "global_step": 602096, "epoch": 7254} {"train_loss": -27.339359283447266, "global_step": 602097, "epoch": 7254} {"train_loss": -27.567304611206055, "global_step": 602098, "epoch": 7254} {"train_loss": -27.59098243713379, "global_step": 602099, "epoch": 7254} {"train_loss": -27.566059112548828, "global_step": 602100, "epoch": 7254} {"train_loss": -27.378583908081055, "global_step": 602101, "epoch": 7254} {"train_loss": -27.620553970336914, "global_step": 602102, "epoch": 7254} {"train_loss": -27.33367347717285, "global_step": 602103, "epoch": 7254} {"train_loss": -27.910322189331055, "global_step": 602104, "epoch": 7254} {"train_loss": -27.715972900390625, "global_step": 602105, "epoch": 7254} {"train_loss": -27.944412231445312, "global_step": 602106, "epoch": 7254} {"train_loss": -27.820890426635742, "global_step": 602107, "epoch": 7254} {"train_loss": -27.79340171813965, "global_step": 602108, "epoch": 7254} {"train_loss": -28.18513298034668, "global_step": 602109, "epoch": 7254} {"train_loss": -27.78841209411621, "global_step": 602110, "epoch": 7254} {"train_loss": -27.4725399017334, "global_step": 602111, "epoch": 7254} {"train_loss": -28.0269775390625, "global_step": 602112, "epoch": 7254} {"train_loss": -27.772390365600586, "global_step": 602113, "epoch": 7254} {"train_loss": -27.633514404296875, "global_step": 602114, "epoch": 7254} {"train_loss": -27.9560604095459, "global_step": 602115, "epoch": 7254} {"train_loss": -27.684789657592773, "global_step": 602116, "epoch": 7254} {"train_loss": -27.960712432861328, "global_step": 602117, "epoch": 7254} {"train_loss": -27.998920440673828, "global_step": 602118, "epoch": 7254} {"train_loss": -27.990568161010742, "global_step": 602119, "epoch": 7254} {"train_loss": -27.9354305267334, "global_step": 602120, "epoch": 7254} {"train_loss": -28.120615005493164, "global_step": 602121, "epoch": 7254} {"train_loss": -28.030292510986328, "global_step": 602122, "epoch": 7254} {"train_loss": -28.21034049987793, "global_step": 602123, "epoch": 7254} {"train_loss": -27.930505752563477, "global_step": 602124, "epoch": 7254} {"train_loss": -28.0031681060791, "global_step": 602125, "epoch": 7254} {"train_loss": -27.97206687927246, "global_step": 602126, "epoch": 7254} {"train_loss": -28.09058952331543, "global_step": 602127, "epoch": 7254} {"train_loss": -28.106311798095703, "global_step": 602128, "epoch": 7254} {"train_loss": -28.04957389831543, "global_step": 602129, "epoch": 7254} {"train_loss": -27.917236328125, "global_step": 602130, "epoch": 7254} {"train_loss": -27.798675537109375, "global_step": 602131, "epoch": 7254} {"train_loss": -28.050939559936523, "global_step": 602132, "epoch": 7254} {"train_loss": -28.047327041625977, "global_step": 602133, "epoch": 7254} {"train_loss": -28.225671768188477, "global_step": 602134, "epoch": 7254} {"train_loss": -28.205066680908203, "global_step": 602135, "epoch": 7254} {"train_loss": -28.350061416625977, "global_step": 602136, "epoch": 7254} {"train_loss": -28.211965560913086, "global_step": 602137, "epoch": 7254} {"train_loss": -27.8315486907959, "global_step": 602138, "epoch": 7254} {"train_loss": -28.072662353515625, "global_step": 602139, "epoch": 7254} {"train_loss": -27.98590660095215, "global_step": 602140, "epoch": 7254} {"train_loss": -28.472517013549805, "global_step": 602141, "epoch": 7254} {"train_loss": -28.06842041015625, "global_step": 602142, "epoch": 7254} {"train_loss": -28.583866119384766, "global_step": 602143, "epoch": 7254} {"train_loss": -28.117401123046875, "global_step": 602144, "epoch": 7254} {"train_loss": -28.111204147338867, "global_step": 602145, "epoch": 7254} {"train_loss": -28.193933486938477, "global_step": 602146, "epoch": 7254} {"train_loss": -28.44058609008789, "global_step": 602147, "epoch": 7254} {"train_loss": -27.92864418029785, "global_step": 602148, "epoch": 7254} {"train_loss": -28.415302276611328, "global_step": 602149, "epoch": 7254} {"train_loss": -28.05555534362793, "global_step": 602150, "epoch": 7254} {"train_loss": -28.71442985534668, "global_step": 602151, "epoch": 7254} {"train_loss": -28.080902099609375, "global_step": 602152, "epoch": 7254} {"train_loss": -28.14332389831543, "global_step": 602153, "epoch": 7254} {"train_loss": -28.3624267578125, "global_step": 602154, "epoch": 7254} {"train_loss": -28.248096466064453, "global_step": 602155, "epoch": 7254} {"train_loss": -28.255081176757812, "global_step": 602156, "epoch": 7254} {"train_loss": -27.850311279296875, "global_step": 602157, "epoch": 7254} {"train_loss": -28.457244873046875, "global_step": 602158, "epoch": 7254} {"train_loss": -28.035947799682617, "global_step": 602159, "epoch": 7254} {"train_loss": -28.641254425048828, "global_step": 602160, "epoch": 7254} {"train_loss": -28.222000122070312, "global_step": 602161, "epoch": 7254} {"train_loss": -28.335535049438477, "global_step": 602162, "epoch": 7254} {"train_loss": -28.124725341796875, "global_step": 602163, "epoch": 7254} {"train_loss": -27.763778089040734, "global_step": 602164, "epoch": 7254, "val_loss": 6518048.5} {"train_loss": -25.40779685974121, "global_step": 602165, "epoch": 7255} {"train_loss": -26.090484619140625, "global_step": 602166, "epoch": 7255} {"train_loss": -26.988967895507812, "global_step": 602167, "epoch": 7255} {"train_loss": -25.652257919311523, "global_step": 602168, "epoch": 7255} {"train_loss": -26.803449630737305, "global_step": 602169, "epoch": 7255} {"train_loss": -26.55816650390625, "global_step": 602170, "epoch": 7255} {"train_loss": -27.09920310974121, "global_step": 602171, "epoch": 7255} {"train_loss": -26.309829711914062, "global_step": 602172, "epoch": 7255} {"train_loss": -27.15632438659668, "global_step": 602173, "epoch": 7255} {"train_loss": -27.173696517944336, "global_step": 602174, "epoch": 7255} {"train_loss": -26.88469886779785, "global_step": 602175, "epoch": 7255} {"train_loss": -27.376195907592773, "global_step": 602176, "epoch": 7255} {"train_loss": -27.525522232055664, "global_step": 602177, "epoch": 7255} {"train_loss": -27.233219146728516, "global_step": 602178, "epoch": 7255} {"train_loss": -27.457693099975586, "global_step": 602179, "epoch": 7255} {"train_loss": -27.64838981628418, "global_step": 602180, "epoch": 7255} {"train_loss": -27.4126033782959, "global_step": 602181, "epoch": 7255} {"train_loss": -27.687152862548828, "global_step": 602182, "epoch": 7255} {"train_loss": -26.804428100585938, "global_step": 602183, "epoch": 7255} {"train_loss": -27.360380172729492, "global_step": 602184, "epoch": 7255} {"train_loss": -27.541706085205078, "global_step": 602185, "epoch": 7255} {"train_loss": -27.598926544189453, "global_step": 602186, "epoch": 7255} {"train_loss": -27.28839111328125, "global_step": 602187, "epoch": 7255} {"train_loss": -26.970600128173828, "global_step": 602188, "epoch": 7255} {"train_loss": -27.5907039642334, "global_step": 602189, "epoch": 7255} {"train_loss": -27.44367027282715, "global_step": 602190, "epoch": 7255} {"train_loss": -27.363611221313477, "global_step": 602191, "epoch": 7255} {"train_loss": -27.391881942749023, "global_step": 602192, "epoch": 7255} {"train_loss": -27.7657470703125, "global_step": 602193, "epoch": 7255} {"train_loss": -27.37763786315918, "global_step": 602194, "epoch": 7255} {"train_loss": -27.8759765625, "global_step": 602195, "epoch": 7255} {"train_loss": -27.820419311523438, "global_step": 602196, "epoch": 7255} {"train_loss": -27.665212631225586, "global_step": 602197, "epoch": 7255} {"train_loss": -27.714750289916992, "global_step": 602198, "epoch": 7255} {"train_loss": -27.530019760131836, "global_step": 602199, "epoch": 7255} {"train_loss": -27.79448890686035, "global_step": 602200, "epoch": 7255} {"train_loss": -27.628376007080078, "global_step": 602201, "epoch": 7255} {"train_loss": -28.206735610961914, "global_step": 602202, "epoch": 7255} {"train_loss": -27.600494384765625, "global_step": 602203, "epoch": 7255} {"train_loss": -27.588184356689453, "global_step": 602204, "epoch": 7255} {"train_loss": -27.911203384399414, "global_step": 602205, "epoch": 7255} {"train_loss": -28.07374382019043, "global_step": 602206, "epoch": 7255} {"train_loss": -28.06623649597168, "global_step": 602207, "epoch": 7255} {"train_loss": -27.907873153686523, "global_step": 602208, "epoch": 7255} {"train_loss": -27.77247428894043, "global_step": 602209, "epoch": 7255} {"train_loss": -27.7442569732666, "global_step": 602210, "epoch": 7255} {"train_loss": -27.95865821838379, "global_step": 602211, "epoch": 7255} {"train_loss": -27.94451332092285, "global_step": 602212, "epoch": 7255} {"train_loss": -27.710235595703125, "global_step": 602213, "epoch": 7255} {"train_loss": -28.048181533813477, "global_step": 602214, "epoch": 7255} {"train_loss": -28.324811935424805, "global_step": 602215, "epoch": 7255} {"train_loss": -27.972415924072266, "global_step": 602216, "epoch": 7255} {"train_loss": -27.694580078125, "global_step": 602217, "epoch": 7255} {"train_loss": -28.33562660217285, "global_step": 602218, "epoch": 7255} {"train_loss": -27.800867080688477, "global_step": 602219, "epoch": 7255} {"train_loss": -27.86677360534668, "global_step": 602220, "epoch": 7255} {"train_loss": -27.65986442565918, "global_step": 602221, "epoch": 7255} {"train_loss": -27.9721622467041, "global_step": 602222, "epoch": 7255} {"train_loss": -28.084457397460938, "global_step": 602223, "epoch": 7255} {"train_loss": -28.41035270690918, "global_step": 602224, "epoch": 7255} {"train_loss": -28.440673828125, "global_step": 602225, "epoch": 7255} {"train_loss": -27.714277267456055, "global_step": 602226, "epoch": 7255} {"train_loss": -27.9631404876709, "global_step": 602227, "epoch": 7255} {"train_loss": -27.773462295532227, "global_step": 602228, "epoch": 7255} {"train_loss": -28.137903213500977, "global_step": 602229, "epoch": 7255} {"train_loss": -28.18131446838379, "global_step": 602230, "epoch": 7255} {"train_loss": -28.518156051635742, "global_step": 602231, "epoch": 7255} {"train_loss": -28.21173667907715, "global_step": 602232, "epoch": 7255} {"train_loss": -28.279937744140625, "global_step": 602233, "epoch": 7255} {"train_loss": -28.266820907592773, "global_step": 602234, "epoch": 7255} {"train_loss": -27.912790298461914, "global_step": 602235, "epoch": 7255} {"train_loss": -28.191335678100586, "global_step": 602236, "epoch": 7255} {"train_loss": -28.294662475585938, "global_step": 602237, "epoch": 7255} {"train_loss": -27.838659286499023, "global_step": 602238, "epoch": 7255} {"train_loss": -27.631437301635742, "global_step": 602239, "epoch": 7255} {"train_loss": -28.17933464050293, "global_step": 602240, "epoch": 7255} {"train_loss": -27.865446090698242, "global_step": 602241, "epoch": 7255} {"train_loss": -28.061033248901367, "global_step": 602242, "epoch": 7255} {"train_loss": -27.86806297302246, "global_step": 602243, "epoch": 7255} {"train_loss": -27.939008712768555, "global_step": 602244, "epoch": 7255} {"train_loss": -27.8276309967041, "global_step": 602245, "epoch": 7255} {"train_loss": -27.5596981048584, "global_step": 602246, "epoch": 7255} {"train_loss": -27.624450499752918, "global_step": 602247, "epoch": 7255, "val_loss": 6553815.0} {"train_loss": -26.234130859375, "global_step": 602248, "epoch": 7256} {"train_loss": -26.717350006103516, "global_step": 602249, "epoch": 7256} {"train_loss": -27.267629623413086, "global_step": 602250, "epoch": 7256} {"train_loss": -27.198898315429688, "global_step": 602251, "epoch": 7256} {"train_loss": -26.912567138671875, "global_step": 602252, "epoch": 7256} {"train_loss": -27.218427658081055, "global_step": 602253, "epoch": 7256} {"train_loss": -27.240575790405273, "global_step": 602254, "epoch": 7256} {"train_loss": -27.793079376220703, "global_step": 602255, "epoch": 7256} {"train_loss": -27.137311935424805, "global_step": 602256, "epoch": 7256} {"train_loss": -27.565143585205078, "global_step": 602257, "epoch": 7256} {"train_loss": -27.3854923248291, "global_step": 602258, "epoch": 7256} {"train_loss": -28.0041446685791, "global_step": 602259, "epoch": 7256} {"train_loss": -27.32869529724121, "global_step": 602260, "epoch": 7256} {"train_loss": -27.19140625, "global_step": 602261, "epoch": 7256} {"train_loss": -27.733322143554688, "global_step": 602262, "epoch": 7256} {"train_loss": -27.319543838500977, "global_step": 602263, "epoch": 7256} {"train_loss": -27.746606826782227, "global_step": 602264, "epoch": 7256} {"train_loss": -27.955968856811523, "global_step": 602265, "epoch": 7256} {"train_loss": -27.908620834350586, "global_step": 602266, "epoch": 7256} {"train_loss": -27.372739791870117, "global_step": 602267, "epoch": 7256} {"train_loss": -28.064146041870117, "global_step": 602268, "epoch": 7256} {"train_loss": -27.4768009185791, "global_step": 602269, "epoch": 7256} {"train_loss": -27.931310653686523, "global_step": 602270, "epoch": 7256} {"train_loss": -28.0587215423584, "global_step": 602271, "epoch": 7256} {"train_loss": -27.814817428588867, "global_step": 602272, "epoch": 7256} {"train_loss": -27.967451095581055, "global_step": 602273, "epoch": 7256} {"train_loss": -27.81036949157715, "global_step": 602274, "epoch": 7256} {"train_loss": -27.7409725189209, "global_step": 602275, "epoch": 7256} {"train_loss": -27.960779190063477, "global_step": 602276, "epoch": 7256} {"train_loss": -27.86165428161621, "global_step": 602277, "epoch": 7256} {"train_loss": -27.87628173828125, "global_step": 602278, "epoch": 7256} {"train_loss": -27.955224990844727, "global_step": 602279, "epoch": 7256} {"train_loss": -28.152860641479492, "global_step": 602280, "epoch": 7256} {"train_loss": -27.719287872314453, "global_step": 602281, "epoch": 7256} {"train_loss": -28.2469482421875, "global_step": 602282, "epoch": 7256} {"train_loss": -28.088125228881836, "global_step": 602283, "epoch": 7256} {"train_loss": -28.20136833190918, "global_step": 602284, "epoch": 7256} {"train_loss": -28.067401885986328, "global_step": 602285, "epoch": 7256} {"train_loss": -28.42286491394043, "global_step": 602286, "epoch": 7256} {"train_loss": -28.1575927734375, "global_step": 602287, "epoch": 7256} {"train_loss": -28.65018081665039, "global_step": 602288, "epoch": 7256} {"train_loss": -28.293317794799805, "global_step": 602289, "epoch": 7256} {"train_loss": -28.23758316040039, "global_step": 602290, "epoch": 7256} {"train_loss": -28.227313995361328, "global_step": 602291, "epoch": 7256} {"train_loss": -27.87751579284668, "global_step": 602292, "epoch": 7256} {"train_loss": -28.009618759155273, "global_step": 602293, "epoch": 7256} {"train_loss": -28.298084259033203, "global_step": 602294, "epoch": 7256} {"train_loss": -28.169336318969727, "global_step": 602295, "epoch": 7256} {"train_loss": -28.02191734313965, "global_step": 602296, "epoch": 7256} {"train_loss": -28.371137619018555, "global_step": 602297, "epoch": 7256} {"train_loss": -28.5159854888916, "global_step": 602298, "epoch": 7256} {"train_loss": -28.279016494750977, "global_step": 602299, "epoch": 7256} {"train_loss": -27.5929012298584, "global_step": 602300, "epoch": 7256} {"train_loss": -28.171630859375, "global_step": 602301, "epoch": 7256} {"train_loss": -28.123559951782227, "global_step": 602302, "epoch": 7256} {"train_loss": -28.0321102142334, "global_step": 602303, "epoch": 7256} {"train_loss": -27.865753173828125, "global_step": 602304, "epoch": 7256} {"train_loss": -27.96413230895996, "global_step": 602305, "epoch": 7256} {"train_loss": -28.511478424072266, "global_step": 602306, "epoch": 7256} {"train_loss": -27.955846786499023, "global_step": 602307, "epoch": 7256} {"train_loss": -27.943450927734375, "global_step": 602308, "epoch": 7256} {"train_loss": -28.06439208984375, "global_step": 602309, "epoch": 7256} {"train_loss": -27.905424118041992, "global_step": 602310, "epoch": 7256} {"train_loss": -27.969181060791016, "global_step": 602311, "epoch": 7256} {"train_loss": -28.084997177124023, "global_step": 602312, "epoch": 7256} {"train_loss": -27.93509292602539, "global_step": 602313, "epoch": 7256} {"train_loss": -28.3798770904541, "global_step": 602314, "epoch": 7256} {"train_loss": -28.14857292175293, "global_step": 602315, "epoch": 7256} {"train_loss": -28.02127456665039, "global_step": 602316, "epoch": 7256} {"train_loss": -27.953353881835938, "global_step": 602317, "epoch": 7256} {"train_loss": -27.904199600219727, "global_step": 602318, "epoch": 7256} {"train_loss": -28.186975479125977, "global_step": 602319, "epoch": 7256} {"train_loss": -28.198074340820312, "global_step": 602320, "epoch": 7256} {"train_loss": -27.85918617248535, "global_step": 602321, "epoch": 7256} {"train_loss": -27.791202545166016, "global_step": 602322, "epoch": 7256} {"train_loss": -27.892988204956055, "global_step": 602323, "epoch": 7256} {"train_loss": -28.1822566986084, "global_step": 602324, "epoch": 7256} {"train_loss": -28.32588005065918, "global_step": 602325, "epoch": 7256} {"train_loss": -28.0184268951416, "global_step": 602326, "epoch": 7256} {"train_loss": -27.996061325073242, "global_step": 602327, "epoch": 7256} {"train_loss": -28.226160049438477, "global_step": 602328, "epoch": 7256} {"train_loss": -28.26798439025879, "global_step": 602329, "epoch": 7256} {"train_loss": -27.88752686833761, "global_step": 602330, "epoch": 7256, "val_loss": 6479802.0} {"train_loss": -27.96992301940918, "global_step": 602331, "epoch": 7257} {"train_loss": -27.457977294921875, "global_step": 602332, "epoch": 7257} {"train_loss": -26.997961044311523, "global_step": 602333, "epoch": 7257} {"train_loss": -27.57352066040039, "global_step": 602334, "epoch": 7257} {"train_loss": -27.54041862487793, "global_step": 602335, "epoch": 7257} {"train_loss": -27.588748931884766, "global_step": 602336, "epoch": 7257} {"train_loss": -27.139333724975586, "global_step": 602337, "epoch": 7257} {"train_loss": -27.611799240112305, "global_step": 602338, "epoch": 7257} {"train_loss": -27.396448135375977, "global_step": 602339, "epoch": 7257} {"train_loss": -27.61748695373535, "global_step": 602340, "epoch": 7257} {"train_loss": -27.52777099609375, "global_step": 602341, "epoch": 7257} {"train_loss": -27.791879653930664, "global_step": 602342, "epoch": 7257} {"train_loss": -27.707990646362305, "global_step": 602343, "epoch": 7257} {"train_loss": -27.810810089111328, "global_step": 602344, "epoch": 7257} {"train_loss": -27.645715713500977, "global_step": 602345, "epoch": 7257} {"train_loss": -27.709299087524414, "global_step": 602346, "epoch": 7257} {"train_loss": -27.73760986328125, "global_step": 602347, "epoch": 7257} {"train_loss": -27.73433494567871, "global_step": 602348, "epoch": 7257} {"train_loss": -27.4853572845459, "global_step": 602349, "epoch": 7257} {"train_loss": -27.726293563842773, "global_step": 602350, "epoch": 7257} {"train_loss": -27.884246826171875, "global_step": 602351, "epoch": 7257} {"train_loss": -27.77503776550293, "global_step": 602352, "epoch": 7257} {"train_loss": -28.066659927368164, "global_step": 602353, "epoch": 7257} {"train_loss": -27.7296142578125, "global_step": 602354, "epoch": 7257} {"train_loss": -28.005599975585938, "global_step": 602355, "epoch": 7257} {"train_loss": -28.302770614624023, "global_step": 602356, "epoch": 7257} {"train_loss": -28.016433715820312, "global_step": 602357, "epoch": 7257} {"train_loss": -27.913721084594727, "global_step": 602358, "epoch": 7257} {"train_loss": -27.96713638305664, "global_step": 602359, "epoch": 7257} {"train_loss": -28.066869735717773, "global_step": 602360, "epoch": 7257} {"train_loss": -27.858083724975586, "global_step": 602361, "epoch": 7257} {"train_loss": -28.070348739624023, "global_step": 602362, "epoch": 7257} {"train_loss": -28.042646408081055, "global_step": 602363, "epoch": 7257} {"train_loss": -27.899250030517578, "global_step": 602364, "epoch": 7257} {"train_loss": -28.425886154174805, "global_step": 602365, "epoch": 7257} {"train_loss": -28.088117599487305, "global_step": 602366, "epoch": 7257} {"train_loss": -28.123825073242188, "global_step": 602367, "epoch": 7257} {"train_loss": -28.09980583190918, "global_step": 602368, "epoch": 7257} {"train_loss": -28.23797035217285, "global_step": 602369, "epoch": 7257} {"train_loss": -27.928693771362305, "global_step": 602370, "epoch": 7257} {"train_loss": -28.183319091796875, "global_step": 602371, "epoch": 7257} {"train_loss": -27.754892349243164, "global_step": 602372, "epoch": 7257} {"train_loss": -28.071216583251953, "global_step": 602373, "epoch": 7257} {"train_loss": -28.70159912109375, "global_step": 602374, "epoch": 7257} {"train_loss": -28.340116500854492, "global_step": 602375, "epoch": 7257} {"train_loss": -28.289770126342773, "global_step": 602376, "epoch": 7257} {"train_loss": -27.6131649017334, "global_step": 602377, "epoch": 7257} {"train_loss": -27.517507553100586, "global_step": 602378, "epoch": 7257} {"train_loss": -27.270105361938477, "global_step": 602379, "epoch": 7257} {"train_loss": -28.024999618530273, "global_step": 602380, "epoch": 7257} {"train_loss": -28.170095443725586, "global_step": 602381, "epoch": 7257} {"train_loss": -28.101367950439453, "global_step": 602382, "epoch": 7257} {"train_loss": -28.217920303344727, "global_step": 602383, "epoch": 7257} {"train_loss": -27.83344078063965, "global_step": 602384, "epoch": 7257} {"train_loss": -27.666807174682617, "global_step": 602385, "epoch": 7257} {"train_loss": -28.09366226196289, "global_step": 602386, "epoch": 7257} {"train_loss": -28.192392349243164, "global_step": 602387, "epoch": 7257} {"train_loss": -28.01751708984375, "global_step": 602388, "epoch": 7257} {"train_loss": -28.374853134155273, "global_step": 602389, "epoch": 7257} {"train_loss": -28.22841453552246, "global_step": 602390, "epoch": 7257} {"train_loss": -27.956052780151367, "global_step": 602391, "epoch": 7257} {"train_loss": -28.441730499267578, "global_step": 602392, "epoch": 7257} {"train_loss": -28.396703720092773, "global_step": 602393, "epoch": 7257} {"train_loss": -28.235849380493164, "global_step": 602394, "epoch": 7257} {"train_loss": -27.893768310546875, "global_step": 602395, "epoch": 7257} {"train_loss": -28.22907829284668, "global_step": 602396, "epoch": 7257} {"train_loss": -28.14021110534668, "global_step": 602397, "epoch": 7257} {"train_loss": -27.910491943359375, "global_step": 602398, "epoch": 7257} {"train_loss": -28.44072914123535, "global_step": 602399, "epoch": 7257} {"train_loss": -28.345081329345703, "global_step": 602400, "epoch": 7257} {"train_loss": -28.248884201049805, "global_step": 602401, "epoch": 7257} {"train_loss": -28.045652389526367, "global_step": 602402, "epoch": 7257} {"train_loss": -27.6286678314209, "global_step": 602403, "epoch": 7257} {"train_loss": -28.09930419921875, "global_step": 602404, "epoch": 7257} {"train_loss": -28.269367218017578, "global_step": 602405, "epoch": 7257} {"train_loss": -28.245105743408203, "global_step": 602406, "epoch": 7257} {"train_loss": -27.94717788696289, "global_step": 602407, "epoch": 7257} {"train_loss": -28.049890518188477, "global_step": 602408, "epoch": 7257} {"train_loss": -28.292051315307617, "global_step": 602409, "epoch": 7257} {"train_loss": -28.256505966186523, "global_step": 602410, "epoch": 7257} {"train_loss": -28.320348739624023, "global_step": 602411, "epoch": 7257} {"train_loss": -28.462472915649414, "global_step": 602412, "epoch": 7257} {"train_loss": -27.968530471066394, "global_step": 602413, "epoch": 7257, "val_loss": 6554192.0} {"train_loss": -27.121610641479492, "global_step": 602414, "epoch": 7258} {"train_loss": -27.13912010192871, "global_step": 602415, "epoch": 7258} {"train_loss": -26.92624282836914, "global_step": 602416, "epoch": 7258} {"train_loss": -27.475751876831055, "global_step": 602417, "epoch": 7258} {"train_loss": -27.492406845092773, "global_step": 602418, "epoch": 7258} {"train_loss": -27.44270896911621, "global_step": 602419, "epoch": 7258} {"train_loss": -27.743988037109375, "global_step": 602420, "epoch": 7258} {"train_loss": -27.70380210876465, "global_step": 602421, "epoch": 7258} {"train_loss": -27.400976181030273, "global_step": 602422, "epoch": 7258} {"train_loss": -27.360488891601562, "global_step": 602423, "epoch": 7258} {"train_loss": -27.581043243408203, "global_step": 602424, "epoch": 7258} {"train_loss": -27.755313873291016, "global_step": 602425, "epoch": 7258} {"train_loss": -27.5983829498291, "global_step": 602426, "epoch": 7258} {"train_loss": -27.63995933532715, "global_step": 602427, "epoch": 7258} {"train_loss": -28.249755859375, "global_step": 602428, "epoch": 7258} {"train_loss": -27.791767120361328, "global_step": 602429, "epoch": 7258} {"train_loss": -27.9426326751709, "global_step": 602430, "epoch": 7258} {"train_loss": -27.954565048217773, "global_step": 602431, "epoch": 7258} {"train_loss": -28.225168228149414, "global_step": 602432, "epoch": 7258} {"train_loss": -28.080490112304688, "global_step": 602433, "epoch": 7258} {"train_loss": -27.919973373413086, "global_step": 602434, "epoch": 7258} {"train_loss": -27.951095581054688, "global_step": 602435, "epoch": 7258} {"train_loss": -27.79534912109375, "global_step": 602436, "epoch": 7258} {"train_loss": -27.517465591430664, "global_step": 602437, "epoch": 7258} {"train_loss": -27.4578800201416, "global_step": 602438, "epoch": 7258} {"train_loss": -27.620325088500977, "global_step": 602439, "epoch": 7258} {"train_loss": -27.933979034423828, "global_step": 602440, "epoch": 7258} {"train_loss": -27.654773712158203, "global_step": 602441, "epoch": 7258} {"train_loss": -27.7524471282959, "global_step": 602442, "epoch": 7258} {"train_loss": -27.98797035217285, "global_step": 602443, "epoch": 7258} {"train_loss": -28.158248901367188, "global_step": 602444, "epoch": 7258} {"train_loss": -28.507116317749023, "global_step": 602445, "epoch": 7258} {"train_loss": -28.055280685424805, "global_step": 602446, "epoch": 7258} {"train_loss": -27.950780868530273, "global_step": 602447, "epoch": 7258} {"train_loss": -27.750349044799805, "global_step": 602448, "epoch": 7258} {"train_loss": -28.089014053344727, "global_step": 602449, "epoch": 7258} {"train_loss": -28.112939834594727, "global_step": 602450, "epoch": 7258} {"train_loss": -27.75607681274414, "global_step": 602451, "epoch": 7258} {"train_loss": -28.412694931030273, "global_step": 602452, "epoch": 7258} {"train_loss": -28.384521484375, "global_step": 602453, "epoch": 7258} {"train_loss": -28.124841690063477, "global_step": 602454, "epoch": 7258} {"train_loss": -28.32191276550293, "global_step": 602455, "epoch": 7258} {"train_loss": -28.767236709594727, "global_step": 602456, "epoch": 7258} {"train_loss": -27.946002960205078, "global_step": 602457, "epoch": 7258} {"train_loss": -27.9137020111084, "global_step": 602458, "epoch": 7258} {"train_loss": -28.294544219970703, "global_step": 602459, "epoch": 7258} {"train_loss": -28.483652114868164, "global_step": 602460, "epoch": 7258} {"train_loss": -28.113096237182617, "global_step": 602461, "epoch": 7258} {"train_loss": -28.5537109375, "global_step": 602462, "epoch": 7258} {"train_loss": -28.168073654174805, "global_step": 602463, "epoch": 7258} {"train_loss": -28.234928131103516, "global_step": 602464, "epoch": 7258} {"train_loss": -28.194005966186523, "global_step": 602465, "epoch": 7258} {"train_loss": -27.962772369384766, "global_step": 602466, "epoch": 7258} {"train_loss": -28.24641227722168, "global_step": 602467, "epoch": 7258} {"train_loss": -28.23573875427246, "global_step": 602468, "epoch": 7258} {"train_loss": -28.12994956970215, "global_step": 602469, "epoch": 7258} {"train_loss": -28.546218872070312, "global_step": 602470, "epoch": 7258} {"train_loss": -28.548389434814453, "global_step": 602471, "epoch": 7258} {"train_loss": -28.3507137298584, "global_step": 602472, "epoch": 7258} {"train_loss": -28.03018569946289, "global_step": 602473, "epoch": 7258} {"train_loss": -27.988943099975586, "global_step": 602474, "epoch": 7258} {"train_loss": -28.3118896484375, "global_step": 602475, "epoch": 7258} {"train_loss": -28.067108154296875, "global_step": 602476, "epoch": 7258} {"train_loss": -27.904748916625977, "global_step": 602477, "epoch": 7258} {"train_loss": -27.71817970275879, "global_step": 602478, "epoch": 7258} {"train_loss": -26.69972801208496, "global_step": 602479, "epoch": 7258} {"train_loss": -25.048368453979492, "global_step": 602480, "epoch": 7258} {"train_loss": -24.273069381713867, "global_step": 602481, "epoch": 7258} {"train_loss": -25.89324378967285, "global_step": 602482, "epoch": 7258} {"train_loss": -26.5233211517334, "global_step": 602483, "epoch": 7258} {"train_loss": -24.738325119018555, "global_step": 602484, "epoch": 7258} {"train_loss": -26.7165584564209, "global_step": 602485, "epoch": 7258} {"train_loss": -26.480213165283203, "global_step": 602486, "epoch": 7258} {"train_loss": -26.87198829650879, "global_step": 602487, "epoch": 7258} {"train_loss": -26.8505916595459, "global_step": 602488, "epoch": 7258} {"train_loss": -26.7968692779541, "global_step": 602489, "epoch": 7258} {"train_loss": -26.190814971923828, "global_step": 602490, "epoch": 7258} {"train_loss": -27.05796241760254, "global_step": 602491, "epoch": 7258} {"train_loss": -26.705297470092773, "global_step": 602492, "epoch": 7258} {"train_loss": -26.627607345581055, "global_step": 602493, "epoch": 7258} {"train_loss": -27.352527618408203, "global_step": 602494, "epoch": 7258} {"train_loss": -26.629056930541992, "global_step": 602495, "epoch": 7258} {"train_loss": -27.59587356843144, "global_step": 602496, "epoch": 7258, "val_loss": 6604260.0} {"train_loss": -27.322921752929688, "global_step": 602497, "epoch": 7259} {"train_loss": -26.79422950744629, "global_step": 602498, "epoch": 7259} {"train_loss": -26.758224487304688, "global_step": 602499, "epoch": 7259} {"train_loss": -27.145360946655273, "global_step": 602500, "epoch": 7259} {"train_loss": -26.84450340270996, "global_step": 602501, "epoch": 7259} {"train_loss": -26.614212036132812, "global_step": 602502, "epoch": 7259} {"train_loss": -27.1873722076416, "global_step": 602503, "epoch": 7259} {"train_loss": -26.832082748413086, "global_step": 602504, "epoch": 7259} {"train_loss": -27.167139053344727, "global_step": 602505, "epoch": 7259} {"train_loss": -26.825551986694336, "global_step": 602506, "epoch": 7259} {"train_loss": -27.126611709594727, "global_step": 602507, "epoch": 7259} {"train_loss": -27.040189743041992, "global_step": 602508, "epoch": 7259} {"train_loss": -27.36859703063965, "global_step": 602509, "epoch": 7259} {"train_loss": -27.325971603393555, "global_step": 602510, "epoch": 7259} {"train_loss": -27.094757080078125, "global_step": 602511, "epoch": 7259} {"train_loss": -27.211872100830078, "global_step": 602512, "epoch": 7259} {"train_loss": -27.6949462890625, "global_step": 602513, "epoch": 7259} {"train_loss": -27.00446128845215, "global_step": 602514, "epoch": 7259} {"train_loss": -27.541202545166016, "global_step": 602515, "epoch": 7259} {"train_loss": -27.5057430267334, "global_step": 602516, "epoch": 7259} {"train_loss": -27.33855628967285, "global_step": 602517, "epoch": 7259} {"train_loss": -27.45908546447754, "global_step": 602518, "epoch": 7259} {"train_loss": -27.4080810546875, "global_step": 602519, "epoch": 7259} {"train_loss": -27.572580337524414, "global_step": 602520, "epoch": 7259} {"train_loss": -27.49506950378418, "global_step": 602521, "epoch": 7259} {"train_loss": -28.00446891784668, "global_step": 602522, "epoch": 7259} {"train_loss": -27.570547103881836, "global_step": 602523, "epoch": 7259} {"train_loss": -27.395099639892578, "global_step": 602524, "epoch": 7259} {"train_loss": -27.9423828125, "global_step": 602525, "epoch": 7259} {"train_loss": -27.629423141479492, "global_step": 602526, "epoch": 7259} {"train_loss": -27.88336181640625, "global_step": 602527, "epoch": 7259} {"train_loss": -27.713367462158203, "global_step": 602528, "epoch": 7259} {"train_loss": -27.87188720703125, "global_step": 602529, "epoch": 7259} {"train_loss": -27.690631866455078, "global_step": 602530, "epoch": 7259} {"train_loss": -27.89326286315918, "global_step": 602531, "epoch": 7259} {"train_loss": -28.149093627929688, "global_step": 602532, "epoch": 7259} {"train_loss": -27.79355812072754, "global_step": 602533, "epoch": 7259} {"train_loss": -28.112747192382812, "global_step": 602534, "epoch": 7259} {"train_loss": -28.05182456970215, "global_step": 602535, "epoch": 7259} {"train_loss": -28.0522518157959, "global_step": 602536, "epoch": 7259} {"train_loss": -28.004169464111328, "global_step": 602537, "epoch": 7259} {"train_loss": -28.576812744140625, "global_step": 602538, "epoch": 7259} {"train_loss": -28.37299919128418, "global_step": 602539, "epoch": 7259} {"train_loss": -28.052783966064453, "global_step": 602540, "epoch": 7259} {"train_loss": -27.95465660095215, "global_step": 602541, "epoch": 7259} {"train_loss": -28.0417537689209, "global_step": 602542, "epoch": 7259} {"train_loss": -28.221899032592773, "global_step": 602543, "epoch": 7259} {"train_loss": -28.111377716064453, "global_step": 602544, "epoch": 7259} {"train_loss": -28.21586036682129, "global_step": 602545, "epoch": 7259} {"train_loss": -28.066272735595703, "global_step": 602546, "epoch": 7259} {"train_loss": -27.995092391967773, "global_step": 602547, "epoch": 7259} {"train_loss": -28.1575927734375, "global_step": 602548, "epoch": 7259} {"train_loss": -28.249134063720703, "global_step": 602549, "epoch": 7259} {"train_loss": -27.913244247436523, "global_step": 602550, "epoch": 7259} {"train_loss": -28.113128662109375, "global_step": 602551, "epoch": 7259} {"train_loss": -28.25837516784668, "global_step": 602552, "epoch": 7259} {"train_loss": -28.31722068786621, "global_step": 602553, "epoch": 7259} {"train_loss": -28.291616439819336, "global_step": 602554, "epoch": 7259} {"train_loss": -28.1989688873291, "global_step": 602555, "epoch": 7259} {"train_loss": -28.31788444519043, "global_step": 602556, "epoch": 7259} {"train_loss": -28.3709716796875, "global_step": 602557, "epoch": 7259} {"train_loss": -28.611907958984375, "global_step": 602558, "epoch": 7259} {"train_loss": -28.20099449157715, "global_step": 602559, "epoch": 7259} {"train_loss": -28.033288955688477, "global_step": 602560, "epoch": 7259} {"train_loss": -28.15801429748535, "global_step": 602561, "epoch": 7259} {"train_loss": -28.094934463500977, "global_step": 602562, "epoch": 7259} {"train_loss": -27.6260929107666, "global_step": 602563, "epoch": 7259} {"train_loss": -28.053970336914062, "global_step": 602564, "epoch": 7259} {"train_loss": -28.370147705078125, "global_step": 602565, "epoch": 7259} {"train_loss": -28.077905654907227, "global_step": 602566, "epoch": 7259} {"train_loss": -27.682889938354492, "global_step": 602567, "epoch": 7259} {"train_loss": -27.731592178344727, "global_step": 602568, "epoch": 7259} {"train_loss": -28.414688110351562, "global_step": 602569, "epoch": 7259} {"train_loss": -27.872358322143555, "global_step": 602570, "epoch": 7259} {"train_loss": -27.855329513549805, "global_step": 602571, "epoch": 7259} {"train_loss": -28.19733238220215, "global_step": 602572, "epoch": 7259} {"train_loss": -28.247577667236328, "global_step": 602573, "epoch": 7259} {"train_loss": -28.372745513916016, "global_step": 602574, "epoch": 7259} {"train_loss": -28.119924545288086, "global_step": 602575, "epoch": 7259} {"train_loss": -28.1634464263916, "global_step": 602576, "epoch": 7259} {"train_loss": -28.226606369018555, "global_step": 602577, "epoch": 7259} {"train_loss": -28.518115997314453, "global_step": 602578, "epoch": 7259} {"train_loss": -27.81135053519743, "global_step": 602579, "epoch": 7259, "val_loss": 6602901.5} {"train_loss": -26.834375381469727, "global_step": 602580, "epoch": 7260} {"train_loss": -26.389184951782227, "global_step": 602581, "epoch": 7260} {"train_loss": -27.573637008666992, "global_step": 602582, "epoch": 7260} {"train_loss": -27.461669921875, "global_step": 602583, "epoch": 7260} {"train_loss": -27.35581398010254, "global_step": 602584, "epoch": 7260} {"train_loss": -27.25665855407715, "global_step": 602585, "epoch": 7260} {"train_loss": -27.30999755859375, "global_step": 602586, "epoch": 7260} {"train_loss": -27.065122604370117, "global_step": 602587, "epoch": 7260} {"train_loss": -27.157922744750977, "global_step": 602588, "epoch": 7260} {"train_loss": -27.451440811157227, "global_step": 602589, "epoch": 7260} {"train_loss": -27.345691680908203, "global_step": 602590, "epoch": 7260} {"train_loss": -27.405858993530273, "global_step": 602591, "epoch": 7260} {"train_loss": -27.2861270904541, "global_step": 602592, "epoch": 7260} {"train_loss": -27.546859741210938, "global_step": 602593, "epoch": 7260} {"train_loss": -27.970081329345703, "global_step": 602594, "epoch": 7260} {"train_loss": -27.44147300720215, "global_step": 602595, "epoch": 7260} {"train_loss": -27.62418556213379, "global_step": 602596, "epoch": 7260} {"train_loss": -27.762365341186523, "global_step": 602597, "epoch": 7260} {"train_loss": -27.59210777282715, "global_step": 602598, "epoch": 7260} {"train_loss": -27.428876876831055, "global_step": 602599, "epoch": 7260} {"train_loss": -27.813215255737305, "global_step": 602600, "epoch": 7260} {"train_loss": -27.911090850830078, "global_step": 602601, "epoch": 7260} {"train_loss": -27.588354110717773, "global_step": 602602, "epoch": 7260} {"train_loss": -27.824811935424805, "global_step": 602603, "epoch": 7260} {"train_loss": -28.13808250427246, "global_step": 602604, "epoch": 7260} {"train_loss": -27.946048736572266, "global_step": 602605, "epoch": 7260} {"train_loss": -27.74802589416504, "global_step": 602606, "epoch": 7260} {"train_loss": -27.849613189697266, "global_step": 602607, "epoch": 7260} {"train_loss": -27.7570743560791, "global_step": 602608, "epoch": 7260} {"train_loss": -27.957372665405273, "global_step": 602609, "epoch": 7260} {"train_loss": -27.896377563476562, "global_step": 602610, "epoch": 7260} {"train_loss": -28.050403594970703, "global_step": 602611, "epoch": 7260} {"train_loss": -27.81292152404785, "global_step": 602612, "epoch": 7260} {"train_loss": -28.103515625, "global_step": 602613, "epoch": 7260} {"train_loss": -28.254413604736328, "global_step": 602614, "epoch": 7260} {"train_loss": -28.28680992126465, "global_step": 602615, "epoch": 7260} {"train_loss": -28.11570167541504, "global_step": 602616, "epoch": 7260} {"train_loss": -28.08616065979004, "global_step": 602617, "epoch": 7260} {"train_loss": -27.990161895751953, "global_step": 602618, "epoch": 7260} {"train_loss": -28.160993576049805, "global_step": 602619, "epoch": 7260} {"train_loss": -28.443317413330078, "global_step": 602620, "epoch": 7260} {"train_loss": -28.15166664123535, "global_step": 602621, "epoch": 7260} {"train_loss": -27.672107696533203, "global_step": 602622, "epoch": 7260} {"train_loss": -27.78667640686035, "global_step": 602623, "epoch": 7260} {"train_loss": -28.320722579956055, "global_step": 602624, "epoch": 7260} {"train_loss": -28.274927139282227, "global_step": 602625, "epoch": 7260} {"train_loss": -28.088895797729492, "global_step": 602626, "epoch": 7260} {"train_loss": -28.17804527282715, "global_step": 602627, "epoch": 7260} {"train_loss": -27.926593780517578, "global_step": 602628, "epoch": 7260} {"train_loss": -28.23651695251465, "global_step": 602629, "epoch": 7260} {"train_loss": -28.14620018005371, "global_step": 602630, "epoch": 7260} {"train_loss": -27.972503662109375, "global_step": 602631, "epoch": 7260} {"train_loss": -28.166040420532227, "global_step": 602632, "epoch": 7260} {"train_loss": -28.03700065612793, "global_step": 602633, "epoch": 7260} {"train_loss": -28.183828353881836, "global_step": 602634, "epoch": 7260} {"train_loss": -28.09343910217285, "global_step": 602635, "epoch": 7260} {"train_loss": -28.54056167602539, "global_step": 602636, "epoch": 7260} {"train_loss": -28.261869430541992, "global_step": 602637, "epoch": 7260} {"train_loss": -28.282501220703125, "global_step": 602638, "epoch": 7260} {"train_loss": -28.4744930267334, "global_step": 602639, "epoch": 7260} {"train_loss": -28.364042282104492, "global_step": 602640, "epoch": 7260} {"train_loss": -28.372739791870117, "global_step": 602641, "epoch": 7260} {"train_loss": -28.217884063720703, "global_step": 602642, "epoch": 7260} {"train_loss": -27.995315551757812, "global_step": 602643, "epoch": 7260} {"train_loss": -28.2303409576416, "global_step": 602644, "epoch": 7260} {"train_loss": -28.046493530273438, "global_step": 602645, "epoch": 7260} {"train_loss": -27.79310417175293, "global_step": 602646, "epoch": 7260} {"train_loss": -28.158288955688477, "global_step": 602647, "epoch": 7260} {"train_loss": -28.192279815673828, "global_step": 602648, "epoch": 7260} {"train_loss": -28.140771865844727, "global_step": 602649, "epoch": 7260} {"train_loss": -28.23874855041504, "global_step": 602650, "epoch": 7260} {"train_loss": -28.30136489868164, "global_step": 602651, "epoch": 7260} {"train_loss": -27.91462516784668, "global_step": 602652, "epoch": 7260} {"train_loss": -28.2421817779541, "global_step": 602653, "epoch": 7260} {"train_loss": -28.33880615234375, "global_step": 602654, "epoch": 7260} {"train_loss": -28.32173728942871, "global_step": 602655, "epoch": 7260} {"train_loss": -28.04306983947754, "global_step": 602656, "epoch": 7260} {"train_loss": -28.192768096923828, "global_step": 602657, "epoch": 7260} {"train_loss": -28.0871639251709, "global_step": 602658, "epoch": 7260} {"train_loss": -28.318927764892578, "global_step": 602659, "epoch": 7260} {"train_loss": -28.254840850830078, "global_step": 602660, "epoch": 7260} {"train_loss": -27.857816696166992, "global_step": 602661, "epoch": 7260} {"train_loss": -27.913464626633978, "global_step": 602662, "epoch": 7260, "val_loss": 6704589.5} {"train_loss": -27.249013900756836, "global_step": 602663, "epoch": 7261} {"train_loss": -27.092832565307617, "global_step": 602664, "epoch": 7261} {"train_loss": -26.58392333984375, "global_step": 602665, "epoch": 7261} {"train_loss": -27.817190170288086, "global_step": 602666, "epoch": 7261} {"train_loss": -26.728656768798828, "global_step": 602667, "epoch": 7261} {"train_loss": -27.224334716796875, "global_step": 602668, "epoch": 7261} {"train_loss": -27.356481552124023, "global_step": 602669, "epoch": 7261} {"train_loss": -27.584426879882812, "global_step": 602670, "epoch": 7261} {"train_loss": -27.481739044189453, "global_step": 602671, "epoch": 7261} {"train_loss": -27.531042098999023, "global_step": 602672, "epoch": 7261} {"train_loss": -27.547626495361328, "global_step": 602673, "epoch": 7261} {"train_loss": -27.63934898376465, "global_step": 602674, "epoch": 7261} {"train_loss": -27.495893478393555, "global_step": 602675, "epoch": 7261} {"train_loss": -27.746936798095703, "global_step": 602676, "epoch": 7261} {"train_loss": -27.49395179748535, "global_step": 602677, "epoch": 7261} {"train_loss": -27.5069637298584, "global_step": 602678, "epoch": 7261} {"train_loss": -27.800199508666992, "global_step": 602679, "epoch": 7261} {"train_loss": -27.437597274780273, "global_step": 602680, "epoch": 7261} {"train_loss": -27.5552921295166, "global_step": 602681, "epoch": 7261} {"train_loss": -28.157306671142578, "global_step": 602682, "epoch": 7261} {"train_loss": -27.754486083984375, "global_step": 602683, "epoch": 7261} {"train_loss": -27.557493209838867, "global_step": 602684, "epoch": 7261} {"train_loss": -27.706785202026367, "global_step": 602685, "epoch": 7261} {"train_loss": -28.108417510986328, "global_step": 602686, "epoch": 7261} {"train_loss": -27.666528701782227, "global_step": 602687, "epoch": 7261} {"train_loss": -27.811132431030273, "global_step": 602688, "epoch": 7261} {"train_loss": -27.694446563720703, "global_step": 602689, "epoch": 7261} {"train_loss": -27.863391876220703, "global_step": 602690, "epoch": 7261} {"train_loss": -28.0021915435791, "global_step": 602691, "epoch": 7261} {"train_loss": -27.951404571533203, "global_step": 602692, "epoch": 7261} {"train_loss": -27.591205596923828, "global_step": 602693, "epoch": 7261} {"train_loss": -27.985158920288086, "global_step": 602694, "epoch": 7261} {"train_loss": -27.986310958862305, "global_step": 602695, "epoch": 7261} {"train_loss": -27.74783706665039, "global_step": 602696, "epoch": 7261} {"train_loss": -28.02385902404785, "global_step": 602697, "epoch": 7261} {"train_loss": -28.163135528564453, "global_step": 602698, "epoch": 7261} {"train_loss": -28.068084716796875, "global_step": 602699, "epoch": 7261} {"train_loss": -27.87030601501465, "global_step": 602700, "epoch": 7261} {"train_loss": -28.21125602722168, "global_step": 602701, "epoch": 7261} {"train_loss": -27.946216583251953, "global_step": 602702, "epoch": 7261} {"train_loss": -28.24078941345215, "global_step": 602703, "epoch": 7261} {"train_loss": -28.02479362487793, "global_step": 602704, "epoch": 7261} {"train_loss": -27.900915145874023, "global_step": 602705, "epoch": 7261} {"train_loss": -27.97690773010254, "global_step": 602706, "epoch": 7261} {"train_loss": -28.090198516845703, "global_step": 602707, "epoch": 7261} {"train_loss": -27.887659072875977, "global_step": 602708, "epoch": 7261} {"train_loss": -28.232458114624023, "global_step": 602709, "epoch": 7261} {"train_loss": -28.04096794128418, "global_step": 602710, "epoch": 7261} {"train_loss": -28.159292221069336, "global_step": 602711, "epoch": 7261} {"train_loss": -28.264081954956055, "global_step": 602712, "epoch": 7261} {"train_loss": -28.258132934570312, "global_step": 602713, "epoch": 7261} {"train_loss": -28.3018741607666, "global_step": 602714, "epoch": 7261} {"train_loss": -28.325403213500977, "global_step": 602715, "epoch": 7261} {"train_loss": -28.28373146057129, "global_step": 602716, "epoch": 7261} {"train_loss": -28.29123306274414, "global_step": 602717, "epoch": 7261} {"train_loss": -28.476606369018555, "global_step": 602718, "epoch": 7261} {"train_loss": -28.4658203125, "global_step": 602719, "epoch": 7261} {"train_loss": -28.53672218322754, "global_step": 602720, "epoch": 7261} {"train_loss": -28.392913818359375, "global_step": 602721, "epoch": 7261} {"train_loss": -28.094940185546875, "global_step": 602722, "epoch": 7261} {"train_loss": -28.18562126159668, "global_step": 602723, "epoch": 7261} {"train_loss": -28.27615737915039, "global_step": 602724, "epoch": 7261} {"train_loss": -28.300378799438477, "global_step": 602725, "epoch": 7261} {"train_loss": -28.42365837097168, "global_step": 602726, "epoch": 7261} {"train_loss": -28.323068618774414, "global_step": 602727, "epoch": 7261} {"train_loss": -27.965198516845703, "global_step": 602728, "epoch": 7261} {"train_loss": -28.121469497680664, "global_step": 602729, "epoch": 7261} {"train_loss": -28.06931495666504, "global_step": 602730, "epoch": 7261} {"train_loss": -27.984434127807617, "global_step": 602731, "epoch": 7261} {"train_loss": -28.180755615234375, "global_step": 602732, "epoch": 7261} {"train_loss": -27.991064071655273, "global_step": 602733, "epoch": 7261} {"train_loss": -27.826337814331055, "global_step": 602734, "epoch": 7261} {"train_loss": -28.06757164001465, "global_step": 602735, "epoch": 7261} {"train_loss": -28.067001342773438, "global_step": 602736, "epoch": 7261} {"train_loss": -27.70887565612793, "global_step": 602737, "epoch": 7261} {"train_loss": -27.55422019958496, "global_step": 602738, "epoch": 7261} {"train_loss": -27.886701583862305, "global_step": 602739, "epoch": 7261} {"train_loss": -27.654592514038086, "global_step": 602740, "epoch": 7261} {"train_loss": -28.3997859954834, "global_step": 602741, "epoch": 7261} {"train_loss": -27.819150924682617, "global_step": 602742, "epoch": 7261} {"train_loss": -28.199094772338867, "global_step": 602743, "epoch": 7261} {"train_loss": -27.3519229888916, "global_step": 602744, "epoch": 7261} {"train_loss": -27.873870458947607, "global_step": 602745, "epoch": 7261, "val_loss": 6639552.0} {"train_loss": -27.57366943359375, "global_step": 602746, "epoch": 7262} {"train_loss": -26.32697868347168, "global_step": 602747, "epoch": 7262} {"train_loss": -27.161548614501953, "global_step": 602748, "epoch": 7262} {"train_loss": -28.02263832092285, "global_step": 602749, "epoch": 7262} {"train_loss": -27.1079044342041, "global_step": 602750, "epoch": 7262} {"train_loss": -27.420032501220703, "global_step": 602751, "epoch": 7262} {"train_loss": -27.7771053314209, "global_step": 602752, "epoch": 7262} {"train_loss": -27.5883846282959, "global_step": 602753, "epoch": 7262} {"train_loss": -27.747644424438477, "global_step": 602754, "epoch": 7262} {"train_loss": -28.055524826049805, "global_step": 602755, "epoch": 7262} {"train_loss": -27.111087799072266, "global_step": 602756, "epoch": 7262} {"train_loss": -27.7152156829834, "global_step": 602757, "epoch": 7262} {"train_loss": -27.88408851623535, "global_step": 602758, "epoch": 7262} {"train_loss": -27.561264038085938, "global_step": 602759, "epoch": 7262} {"train_loss": -27.9869441986084, "global_step": 602760, "epoch": 7262} {"train_loss": -27.37823486328125, "global_step": 602761, "epoch": 7262} {"train_loss": -27.668378829956055, "global_step": 602762, "epoch": 7262} {"train_loss": -28.333776473999023, "global_step": 602763, "epoch": 7262} {"train_loss": -27.832555770874023, "global_step": 602764, "epoch": 7262} {"train_loss": -27.904653549194336, "global_step": 602765, "epoch": 7262} {"train_loss": -27.851667404174805, "global_step": 602766, "epoch": 7262} {"train_loss": -27.874887466430664, "global_step": 602767, "epoch": 7262} {"train_loss": -27.49250602722168, "global_step": 602768, "epoch": 7262} {"train_loss": -28.235929489135742, "global_step": 602769, "epoch": 7262} {"train_loss": -28.192365646362305, "global_step": 602770, "epoch": 7262} {"train_loss": -28.134552001953125, "global_step": 602771, "epoch": 7262} {"train_loss": -28.126373291015625, "global_step": 602772, "epoch": 7262} {"train_loss": -27.825586318969727, "global_step": 602773, "epoch": 7262} {"train_loss": -28.168439865112305, "global_step": 602774, "epoch": 7262} {"train_loss": -27.922163009643555, "global_step": 602775, "epoch": 7262} {"train_loss": -27.92683219909668, "global_step": 602776, "epoch": 7262} {"train_loss": -28.199350357055664, "global_step": 602777, "epoch": 7262} {"train_loss": -28.31873893737793, "global_step": 602778, "epoch": 7262} {"train_loss": -27.86345863342285, "global_step": 602779, "epoch": 7262} {"train_loss": -27.97385597229004, "global_step": 602780, "epoch": 7262} {"train_loss": -27.8852481842041, "global_step": 602781, "epoch": 7262} {"train_loss": -28.117023468017578, "global_step": 602782, "epoch": 7262} {"train_loss": -28.190113067626953, "global_step": 602783, "epoch": 7262} {"train_loss": -28.330474853515625, "global_step": 602784, "epoch": 7262} {"train_loss": -27.852157592773438, "global_step": 602785, "epoch": 7262} {"train_loss": -28.281116485595703, "global_step": 602786, "epoch": 7262} {"train_loss": -27.6907958984375, "global_step": 602787, "epoch": 7262} {"train_loss": -27.842077255249023, "global_step": 602788, "epoch": 7262} {"train_loss": -28.00608253479004, "global_step": 602789, "epoch": 7262} {"train_loss": -28.141937255859375, "global_step": 602790, "epoch": 7262} {"train_loss": -28.22711753845215, "global_step": 602791, "epoch": 7262} {"train_loss": -28.04194450378418, "global_step": 602792, "epoch": 7262} {"train_loss": -28.095657348632812, "global_step": 602793, "epoch": 7262} {"train_loss": -28.47699546813965, "global_step": 602794, "epoch": 7262} {"train_loss": -28.238386154174805, "global_step": 602795, "epoch": 7262} {"train_loss": -28.443796157836914, "global_step": 602796, "epoch": 7262} {"train_loss": -28.19392204284668, "global_step": 602797, "epoch": 7262} {"train_loss": -27.870147705078125, "global_step": 602798, "epoch": 7262} {"train_loss": -28.28252601623535, "global_step": 602799, "epoch": 7262} {"train_loss": -28.01930046081543, "global_step": 602800, "epoch": 7262} {"train_loss": -28.115161895751953, "global_step": 602801, "epoch": 7262} {"train_loss": -28.301755905151367, "global_step": 602802, "epoch": 7262} {"train_loss": -27.953479766845703, "global_step": 602803, "epoch": 7262} {"train_loss": -28.318567276000977, "global_step": 602804, "epoch": 7262} {"train_loss": -28.531024932861328, "global_step": 602805, "epoch": 7262} {"train_loss": -28.506994247436523, "global_step": 602806, "epoch": 7262} {"train_loss": -28.279287338256836, "global_step": 602807, "epoch": 7262} {"train_loss": -28.15034294128418, "global_step": 602808, "epoch": 7262} {"train_loss": -28.271564483642578, "global_step": 602809, "epoch": 7262} {"train_loss": -28.3195858001709, "global_step": 602810, "epoch": 7262} {"train_loss": -28.437957763671875, "global_step": 602811, "epoch": 7262} {"train_loss": -28.378955841064453, "global_step": 602812, "epoch": 7262} {"train_loss": -28.163700103759766, "global_step": 602813, "epoch": 7262} {"train_loss": -27.939197540283203, "global_step": 602814, "epoch": 7262} {"train_loss": -28.669538497924805, "global_step": 602815, "epoch": 7262} {"train_loss": -27.8872127532959, "global_step": 602816, "epoch": 7262} {"train_loss": -28.137165069580078, "global_step": 602817, "epoch": 7262} {"train_loss": -28.193817138671875, "global_step": 602818, "epoch": 7262} {"train_loss": -28.39447593688965, "global_step": 602819, "epoch": 7262} {"train_loss": -28.0278263092041, "global_step": 602820, "epoch": 7262} {"train_loss": -28.22987174987793, "global_step": 602821, "epoch": 7262} {"train_loss": -28.236785888671875, "global_step": 602822, "epoch": 7262} {"train_loss": -28.125207901000977, "global_step": 602823, "epoch": 7262} {"train_loss": -28.130395889282227, "global_step": 602824, "epoch": 7262} {"train_loss": -28.424732208251953, "global_step": 602825, "epoch": 7262} {"train_loss": -28.360279083251953, "global_step": 602826, "epoch": 7262} {"train_loss": -27.66887855529785, "global_step": 602827, "epoch": 7262} {"train_loss": -27.9986944773111, "global_step": 602828, "epoch": 7262, "val_loss": 6711215.0} {"train_loss": -27.640460968017578, "global_step": 602829, "epoch": 7263} {"train_loss": -25.53659439086914, "global_step": 602830, "epoch": 7263} {"train_loss": -26.616724014282227, "global_step": 602831, "epoch": 7263} {"train_loss": -27.613666534423828, "global_step": 602832, "epoch": 7263} {"train_loss": -26.668561935424805, "global_step": 602833, "epoch": 7263} {"train_loss": -27.677215576171875, "global_step": 602834, "epoch": 7263} {"train_loss": -27.0845947265625, "global_step": 602835, "epoch": 7263} {"train_loss": -27.551137924194336, "global_step": 602836, "epoch": 7263} {"train_loss": -27.77796745300293, "global_step": 602837, "epoch": 7263} {"train_loss": -27.446537017822266, "global_step": 602838, "epoch": 7263} {"train_loss": -27.62776756286621, "global_step": 602839, "epoch": 7263} {"train_loss": -27.995075225830078, "global_step": 602840, "epoch": 7263} {"train_loss": -27.447057723999023, "global_step": 602841, "epoch": 7263} {"train_loss": -27.809289932250977, "global_step": 602842, "epoch": 7263} {"train_loss": -27.702199935913086, "global_step": 602843, "epoch": 7263} {"train_loss": -27.0965633392334, "global_step": 602844, "epoch": 7263} {"train_loss": -27.808319091796875, "global_step": 602845, "epoch": 7263} {"train_loss": -27.40964126586914, "global_step": 602846, "epoch": 7263} {"train_loss": -27.78272819519043, "global_step": 602847, "epoch": 7263} {"train_loss": -27.95458984375, "global_step": 602848, "epoch": 7263} {"train_loss": -28.0892391204834, "global_step": 602849, "epoch": 7263} {"train_loss": -28.02971839904785, "global_step": 602850, "epoch": 7263} {"train_loss": -27.9641170501709, "global_step": 602851, "epoch": 7263} {"train_loss": -27.994647979736328, "global_step": 602852, "epoch": 7263} {"train_loss": -27.78251075744629, "global_step": 602853, "epoch": 7263} {"train_loss": -27.909372329711914, "global_step": 602854, "epoch": 7263} {"train_loss": -28.2384090423584, "global_step": 602855, "epoch": 7263} {"train_loss": -27.872018814086914, "global_step": 602856, "epoch": 7263} {"train_loss": -28.04981803894043, "global_step": 602857, "epoch": 7263} {"train_loss": -28.122272491455078, "global_step": 602858, "epoch": 7263} {"train_loss": -27.50288963317871, "global_step": 602859, "epoch": 7263} {"train_loss": -28.202173233032227, "global_step": 602860, "epoch": 7263} {"train_loss": -28.0106143951416, "global_step": 602861, "epoch": 7263} {"train_loss": -28.102890014648438, "global_step": 602862, "epoch": 7263} {"train_loss": -28.115949630737305, "global_step": 602863, "epoch": 7263} {"train_loss": -28.220556259155273, "global_step": 602864, "epoch": 7263} {"train_loss": -27.788257598876953, "global_step": 602865, "epoch": 7263} {"train_loss": -27.9743595123291, "global_step": 602866, "epoch": 7263} {"train_loss": -28.298904418945312, "global_step": 602867, "epoch": 7263} {"train_loss": -28.2917423248291, "global_step": 602868, "epoch": 7263} {"train_loss": -28.2075138092041, "global_step": 602869, "epoch": 7263} {"train_loss": -28.015899658203125, "global_step": 602870, "epoch": 7263} {"train_loss": -28.052038192749023, "global_step": 602871, "epoch": 7263} {"train_loss": -27.931396484375, "global_step": 602872, "epoch": 7263} {"train_loss": -28.227924346923828, "global_step": 602873, "epoch": 7263} {"train_loss": -27.840158462524414, "global_step": 602874, "epoch": 7263} {"train_loss": -28.194684982299805, "global_step": 602875, "epoch": 7263} {"train_loss": -28.040918350219727, "global_step": 602876, "epoch": 7263} {"train_loss": -28.452499389648438, "global_step": 602877, "epoch": 7263} {"train_loss": -28.241046905517578, "global_step": 602878, "epoch": 7263} {"train_loss": -27.771240234375, "global_step": 602879, "epoch": 7263} {"train_loss": -28.33204460144043, "global_step": 602880, "epoch": 7263} {"train_loss": -28.0258731842041, "global_step": 602881, "epoch": 7263} {"train_loss": -28.227115631103516, "global_step": 602882, "epoch": 7263} {"train_loss": -28.39063835144043, "global_step": 602883, "epoch": 7263} {"train_loss": -28.156131744384766, "global_step": 602884, "epoch": 7263} {"train_loss": -28.056737899780273, "global_step": 602885, "epoch": 7263} {"train_loss": -28.28032875061035, "global_step": 602886, "epoch": 7263} {"train_loss": -27.87835121154785, "global_step": 602887, "epoch": 7263} {"train_loss": -28.302413940429688, "global_step": 602888, "epoch": 7263} {"train_loss": -28.283477783203125, "global_step": 602889, "epoch": 7263} {"train_loss": -28.116357803344727, "global_step": 602890, "epoch": 7263} {"train_loss": -27.940099716186523, "global_step": 602891, "epoch": 7263} {"train_loss": -28.233600616455078, "global_step": 602892, "epoch": 7263} {"train_loss": -27.856842041015625, "global_step": 602893, "epoch": 7263} {"train_loss": -28.418371200561523, "global_step": 602894, "epoch": 7263} {"train_loss": -28.204608917236328, "global_step": 602895, "epoch": 7263} {"train_loss": -27.790170669555664, "global_step": 602896, "epoch": 7263} {"train_loss": -28.23740005493164, "global_step": 602897, "epoch": 7263} {"train_loss": -27.828580856323242, "global_step": 602898, "epoch": 7263} {"train_loss": -27.891687393188477, "global_step": 602899, "epoch": 7263} {"train_loss": -28.03241539001465, "global_step": 602900, "epoch": 7263} {"train_loss": -27.886693954467773, "global_step": 602901, "epoch": 7263} {"train_loss": -28.62603759765625, "global_step": 602902, "epoch": 7263} {"train_loss": -28.0467529296875, "global_step": 602903, "epoch": 7263} {"train_loss": -27.301305770874023, "global_step": 602904, "epoch": 7263} {"train_loss": -27.978759765625, "global_step": 602905, "epoch": 7263} {"train_loss": -28.050119400024414, "global_step": 602906, "epoch": 7263} {"train_loss": -27.760953903198242, "global_step": 602907, "epoch": 7263} {"train_loss": -27.764997482299805, "global_step": 602908, "epoch": 7263} {"train_loss": -27.252904891967773, "global_step": 602909, "epoch": 7263} {"train_loss": -28.059600830078125, "global_step": 602910, "epoch": 7263} {"train_loss": -27.897441358451385, "global_step": 602911, "epoch": 7263, "val_loss": 6679424.0} {"train_loss": -27.867130279541016, "global_step": 602912, "epoch": 7264} {"train_loss": -28.052265167236328, "global_step": 602913, "epoch": 7264} {"train_loss": -27.548261642456055, "global_step": 602914, "epoch": 7264} {"train_loss": -27.202356338500977, "global_step": 602915, "epoch": 7264} {"train_loss": -27.41329002380371, "global_step": 602916, "epoch": 7264} {"train_loss": -27.458847045898438, "global_step": 602917, "epoch": 7264} {"train_loss": -27.98676872253418, "global_step": 602918, "epoch": 7264} {"train_loss": -27.46497917175293, "global_step": 602919, "epoch": 7264} {"train_loss": -27.711212158203125, "global_step": 602920, "epoch": 7264} {"train_loss": -27.922962188720703, "global_step": 602921, "epoch": 7264} {"train_loss": -27.645822525024414, "global_step": 602922, "epoch": 7264} {"train_loss": -27.393033981323242, "global_step": 602923, "epoch": 7264} {"train_loss": -27.05204200744629, "global_step": 602924, "epoch": 7264} {"train_loss": -27.643268585205078, "global_step": 602925, "epoch": 7264} {"train_loss": -27.623586654663086, "global_step": 602926, "epoch": 7264} {"train_loss": -27.876712799072266, "global_step": 602927, "epoch": 7264} {"train_loss": -27.535663604736328, "global_step": 602928, "epoch": 7264} {"train_loss": -27.727371215820312, "global_step": 602929, "epoch": 7264} {"train_loss": -28.133285522460938, "global_step": 602930, "epoch": 7264} {"train_loss": -27.772327423095703, "global_step": 602931, "epoch": 7264} {"train_loss": -27.884061813354492, "global_step": 602932, "epoch": 7264} {"train_loss": -27.657196044921875, "global_step": 602933, "epoch": 7264} {"train_loss": -27.475934982299805, "global_step": 602934, "epoch": 7264} {"train_loss": -27.94919204711914, "global_step": 602935, "epoch": 7264} {"train_loss": -28.0059814453125, "global_step": 602936, "epoch": 7264} {"train_loss": -28.16888999938965, "global_step": 602937, "epoch": 7264} {"train_loss": -28.01576805114746, "global_step": 602938, "epoch": 7264} {"train_loss": -27.755521774291992, "global_step": 602939, "epoch": 7264} {"train_loss": -28.385665893554688, "global_step": 602940, "epoch": 7264} {"train_loss": -27.840864181518555, "global_step": 602941, "epoch": 7264} {"train_loss": -28.35009765625, "global_step": 602942, "epoch": 7264} {"train_loss": -28.081266403198242, "global_step": 602943, "epoch": 7264} {"train_loss": -28.15836524963379, "global_step": 602944, "epoch": 7264} {"train_loss": -27.98126792907715, "global_step": 602945, "epoch": 7264} {"train_loss": -28.20892906188965, "global_step": 602946, "epoch": 7264} {"train_loss": -27.932470321655273, "global_step": 602947, "epoch": 7264} {"train_loss": -28.128950119018555, "global_step": 602948, "epoch": 7264} {"train_loss": -28.177722930908203, "global_step": 602949, "epoch": 7264} {"train_loss": -28.247907638549805, "global_step": 602950, "epoch": 7264} {"train_loss": -28.102493286132812, "global_step": 602951, "epoch": 7264} {"train_loss": -27.868314743041992, "global_step": 602952, "epoch": 7264} {"train_loss": -27.992786407470703, "global_step": 602953, "epoch": 7264} {"train_loss": -28.14080238342285, "global_step": 602954, "epoch": 7264} {"train_loss": -27.92695426940918, "global_step": 602955, "epoch": 7264} {"train_loss": -28.18857192993164, "global_step": 602956, "epoch": 7264} {"train_loss": -28.148046493530273, "global_step": 602957, "epoch": 7264} {"train_loss": -28.12114906311035, "global_step": 602958, "epoch": 7264} {"train_loss": -27.68340492248535, "global_step": 602959, "epoch": 7264} {"train_loss": -27.869245529174805, "global_step": 602960, "epoch": 7264} {"train_loss": -28.50665283203125, "global_step": 602961, "epoch": 7264} {"train_loss": -27.644323348999023, "global_step": 602962, "epoch": 7264} {"train_loss": -28.312030792236328, "global_step": 602963, "epoch": 7264} {"train_loss": -28.104660034179688, "global_step": 602964, "epoch": 7264} {"train_loss": -27.6641788482666, "global_step": 602965, "epoch": 7264} {"train_loss": -28.346424102783203, "global_step": 602966, "epoch": 7264} {"train_loss": -28.34120750427246, "global_step": 602967, "epoch": 7264} {"train_loss": -28.190832138061523, "global_step": 602968, "epoch": 7264} {"train_loss": -27.871612548828125, "global_step": 602969, "epoch": 7264} {"train_loss": -28.009077072143555, "global_step": 602970, "epoch": 7264} {"train_loss": -28.05402183532715, "global_step": 602971, "epoch": 7264} {"train_loss": -28.295324325561523, "global_step": 602972, "epoch": 7264} {"train_loss": -27.593463897705078, "global_step": 602973, "epoch": 7264} {"train_loss": -28.322553634643555, "global_step": 602974, "epoch": 7264} {"train_loss": -27.740650177001953, "global_step": 602975, "epoch": 7264} {"train_loss": -27.857757568359375, "global_step": 602976, "epoch": 7264} {"train_loss": -27.64692497253418, "global_step": 602977, "epoch": 7264} {"train_loss": -27.671804428100586, "global_step": 602978, "epoch": 7264} {"train_loss": -27.877399444580078, "global_step": 602979, "epoch": 7264} {"train_loss": -27.91826820373535, "global_step": 602980, "epoch": 7264} {"train_loss": -28.324506759643555, "global_step": 602981, "epoch": 7264} {"train_loss": -27.861616134643555, "global_step": 602982, "epoch": 7264} {"train_loss": -27.94533348083496, "global_step": 602983, "epoch": 7264} {"train_loss": -28.0506591796875, "global_step": 602984, "epoch": 7264} {"train_loss": -27.755908966064453, "global_step": 602985, "epoch": 7264} {"train_loss": -28.080005645751953, "global_step": 602986, "epoch": 7264} {"train_loss": -27.96869468688965, "global_step": 602987, "epoch": 7264} {"train_loss": -27.822895050048828, "global_step": 602988, "epoch": 7264} {"train_loss": -28.227325439453125, "global_step": 602989, "epoch": 7264} {"train_loss": -28.38254737854004, "global_step": 602990, "epoch": 7264} {"train_loss": -27.950489044189453, "global_step": 602991, "epoch": 7264} {"train_loss": -28.2767276763916, "global_step": 602992, "epoch": 7264} {"train_loss": -28.198444366455078, "global_step": 602993, "epoch": 7264} {"train_loss": -27.94105196573648, "global_step": 602994, "epoch": 7264, "val_loss": 6730450.0} {"train_loss": -26.98884391784668, "global_step": 602995, "epoch": 7265} {"train_loss": -27.810407638549805, "global_step": 602996, "epoch": 7265} {"train_loss": -27.57352638244629, "global_step": 602997, "epoch": 7265} {"train_loss": -27.8603458404541, "global_step": 602998, "epoch": 7265} {"train_loss": -27.694183349609375, "global_step": 602999, "epoch": 7265} {"train_loss": -28.01289176940918, "global_step": 603000, "epoch": 7265} {"train_loss": -27.731876373291016, "global_step": 603001, "epoch": 7265} {"train_loss": -28.065114974975586, "global_step": 603002, "epoch": 7265} {"train_loss": -28.060596466064453, "global_step": 603003, "epoch": 7265} {"train_loss": -27.8759822845459, "global_step": 603004, "epoch": 7265} {"train_loss": -27.71146011352539, "global_step": 603005, "epoch": 7265} {"train_loss": -27.967605590820312, "global_step": 603006, "epoch": 7265} {"train_loss": -27.664697647094727, "global_step": 603007, "epoch": 7265} {"train_loss": -27.780126571655273, "global_step": 603008, "epoch": 7265} {"train_loss": -28.02094078063965, "global_step": 603009, "epoch": 7265} {"train_loss": -27.934579849243164, "global_step": 603010, "epoch": 7265} {"train_loss": -27.865751266479492, "global_step": 603011, "epoch": 7265} {"train_loss": -27.943586349487305, "global_step": 603012, "epoch": 7265} {"train_loss": -27.70343589782715, "global_step": 603013, "epoch": 7265} {"train_loss": -27.56549644470215, "global_step": 603014, "epoch": 7265} {"train_loss": -28.291690826416016, "global_step": 603015, "epoch": 7265} {"train_loss": -27.678640365600586, "global_step": 603016, "epoch": 7265} {"train_loss": -27.888504028320312, "global_step": 603017, "epoch": 7265} {"train_loss": -27.67118263244629, "global_step": 603018, "epoch": 7265} {"train_loss": -28.018640518188477, "global_step": 603019, "epoch": 7265} {"train_loss": -27.9208984375, "global_step": 603020, "epoch": 7265} {"train_loss": -28.073505401611328, "global_step": 603021, "epoch": 7265} {"train_loss": -27.8218936920166, "global_step": 603022, "epoch": 7265} {"train_loss": -27.799936294555664, "global_step": 603023, "epoch": 7265} {"train_loss": -27.839460372924805, "global_step": 603024, "epoch": 7265} {"train_loss": -27.962326049804688, "global_step": 603025, "epoch": 7265} {"train_loss": -27.70680046081543, "global_step": 603026, "epoch": 7265} {"train_loss": -28.18458366394043, "global_step": 603027, "epoch": 7265} {"train_loss": -27.706165313720703, "global_step": 603028, "epoch": 7265} {"train_loss": -27.828205108642578, "global_step": 603029, "epoch": 7265} {"train_loss": -27.938507080078125, "global_step": 603030, "epoch": 7265} {"train_loss": -27.888635635375977, "global_step": 603031, "epoch": 7265} {"train_loss": -27.723806381225586, "global_step": 603032, "epoch": 7265} {"train_loss": -28.023101806640625, "global_step": 603033, "epoch": 7265} {"train_loss": -27.875110626220703, "global_step": 603034, "epoch": 7265} {"train_loss": -28.18161392211914, "global_step": 603035, "epoch": 7265} {"train_loss": -28.084165573120117, "global_step": 603036, "epoch": 7265} {"train_loss": -27.997482299804688, "global_step": 603037, "epoch": 7265} {"train_loss": -28.441513061523438, "global_step": 603038, "epoch": 7265} {"train_loss": -27.74959373474121, "global_step": 603039, "epoch": 7265} {"train_loss": -27.99371910095215, "global_step": 603040, "epoch": 7265} {"train_loss": -27.77593421936035, "global_step": 603041, "epoch": 7265} {"train_loss": -27.36069679260254, "global_step": 603042, "epoch": 7265} {"train_loss": -27.760330200195312, "global_step": 603043, "epoch": 7265} {"train_loss": -27.885284423828125, "global_step": 603044, "epoch": 7265} {"train_loss": -27.74875831604004, "global_step": 603045, "epoch": 7265} {"train_loss": -27.11032485961914, "global_step": 603046, "epoch": 7265} {"train_loss": -27.74604606628418, "global_step": 603047, "epoch": 7265} {"train_loss": -28.126846313476562, "global_step": 603048, "epoch": 7265} {"train_loss": -27.648569107055664, "global_step": 603049, "epoch": 7265} {"train_loss": -27.356069564819336, "global_step": 603050, "epoch": 7265} {"train_loss": -27.1058406829834, "global_step": 603051, "epoch": 7265} {"train_loss": -27.802169799804688, "global_step": 603052, "epoch": 7265} {"train_loss": -27.64228630065918, "global_step": 603053, "epoch": 7265} {"train_loss": -28.01803970336914, "global_step": 603054, "epoch": 7265} {"train_loss": -28.064443588256836, "global_step": 603055, "epoch": 7265} {"train_loss": -27.955951690673828, "global_step": 603056, "epoch": 7265} {"train_loss": -28.042987823486328, "global_step": 603057, "epoch": 7265} {"train_loss": -27.766611099243164, "global_step": 603058, "epoch": 7265} {"train_loss": -28.235748291015625, "global_step": 603059, "epoch": 7265} {"train_loss": -27.8336124420166, "global_step": 603060, "epoch": 7265} {"train_loss": -27.755590438842773, "global_step": 603061, "epoch": 7265} {"train_loss": -28.24761962890625, "global_step": 603062, "epoch": 7265} {"train_loss": -27.93448829650879, "global_step": 603063, "epoch": 7265} {"train_loss": -28.055566787719727, "global_step": 603064, "epoch": 7265} {"train_loss": -27.889196395874023, "global_step": 603065, "epoch": 7265} {"train_loss": -28.081653594970703, "global_step": 603066, "epoch": 7265} {"train_loss": -28.0161190032959, "global_step": 603067, "epoch": 7265} {"train_loss": -28.205554962158203, "global_step": 603068, "epoch": 7265} {"train_loss": -28.10016441345215, "global_step": 603069, "epoch": 7265} {"train_loss": -27.87067985534668, "global_step": 603070, "epoch": 7265} {"train_loss": -28.0190486907959, "global_step": 603071, "epoch": 7265} {"train_loss": -27.844562530517578, "global_step": 603072, "epoch": 7265} {"train_loss": -27.707666397094727, "global_step": 603073, "epoch": 7265} {"train_loss": -28.373016357421875, "global_step": 603074, "epoch": 7265} {"train_loss": -28.244596481323242, "global_step": 603075, "epoch": 7265} {"train_loss": -28.35076332092285, "global_step": 603076, "epoch": 7265} {"train_loss": -27.8825660613646, "global_step": 603077, "epoch": 7265, "val_loss": 6683811.5} {"train_loss": -27.182371139526367, "global_step": 603078, "epoch": 7266} {"train_loss": -27.9383487701416, "global_step": 603079, "epoch": 7266} {"train_loss": -27.746679306030273, "global_step": 603080, "epoch": 7266} {"train_loss": -27.329914093017578, "global_step": 603081, "epoch": 7266} {"train_loss": -27.55091667175293, "global_step": 603082, "epoch": 7266} {"train_loss": -28.065387725830078, "global_step": 603083, "epoch": 7266} {"train_loss": -27.295398712158203, "global_step": 603084, "epoch": 7266} {"train_loss": -27.69703483581543, "global_step": 603085, "epoch": 7266} {"train_loss": -27.913436889648438, "global_step": 603086, "epoch": 7266} {"train_loss": -27.935880661010742, "global_step": 603087, "epoch": 7266} {"train_loss": -27.96567726135254, "global_step": 603088, "epoch": 7266} {"train_loss": -27.654010772705078, "global_step": 603089, "epoch": 7266} {"train_loss": -28.095327377319336, "global_step": 603090, "epoch": 7266} {"train_loss": -27.8356876373291, "global_step": 603091, "epoch": 7266} {"train_loss": -28.141645431518555, "global_step": 603092, "epoch": 7266} {"train_loss": -28.28285789489746, "global_step": 603093, "epoch": 7266} {"train_loss": -27.91937828063965, "global_step": 603094, "epoch": 7266} {"train_loss": -28.120868682861328, "global_step": 603095, "epoch": 7266} {"train_loss": -27.883344650268555, "global_step": 603096, "epoch": 7266} {"train_loss": -27.9464054107666, "global_step": 603097, "epoch": 7266} {"train_loss": -28.08989906311035, "global_step": 603098, "epoch": 7266} {"train_loss": -28.260482788085938, "global_step": 603099, "epoch": 7266} {"train_loss": -27.79507827758789, "global_step": 603100, "epoch": 7266} {"train_loss": -28.23187828063965, "global_step": 603101, "epoch": 7266} {"train_loss": -27.80147361755371, "global_step": 603102, "epoch": 7266} {"train_loss": -27.86048698425293, "global_step": 603103, "epoch": 7266} {"train_loss": -28.091171264648438, "global_step": 603104, "epoch": 7266} {"train_loss": -28.049640655517578, "global_step": 603105, "epoch": 7266} {"train_loss": -27.99102210998535, "global_step": 603106, "epoch": 7266} {"train_loss": -27.8680477142334, "global_step": 603107, "epoch": 7266} {"train_loss": -28.221588134765625, "global_step": 603108, "epoch": 7266} {"train_loss": -28.212677001953125, "global_step": 603109, "epoch": 7266} {"train_loss": -28.1345157623291, "global_step": 603110, "epoch": 7266} {"train_loss": -27.862974166870117, "global_step": 603111, "epoch": 7266} {"train_loss": -28.10902214050293, "global_step": 603112, "epoch": 7266} {"train_loss": -27.8024959564209, "global_step": 603113, "epoch": 7266} {"train_loss": -27.901296615600586, "global_step": 603114, "epoch": 7266} {"train_loss": -28.39118766784668, "global_step": 603115, "epoch": 7266} {"train_loss": -28.289886474609375, "global_step": 603116, "epoch": 7266} {"train_loss": -28.301191329956055, "global_step": 603117, "epoch": 7266} {"train_loss": -28.470794677734375, "global_step": 603118, "epoch": 7266} {"train_loss": -28.07936668395996, "global_step": 603119, "epoch": 7266} {"train_loss": -28.1695499420166, "global_step": 603120, "epoch": 7266} {"train_loss": -28.4610652923584, "global_step": 603121, "epoch": 7266} {"train_loss": -28.047595977783203, "global_step": 603122, "epoch": 7266} {"train_loss": -28.01858901977539, "global_step": 603123, "epoch": 7266} {"train_loss": -28.05121421813965, "global_step": 603124, "epoch": 7266} {"train_loss": -27.975421905517578, "global_step": 603125, "epoch": 7266} {"train_loss": -28.243322372436523, "global_step": 603126, "epoch": 7266} {"train_loss": -28.088897705078125, "global_step": 603127, "epoch": 7266} {"train_loss": -28.020172119140625, "global_step": 603128, "epoch": 7266} {"train_loss": -28.40500259399414, "global_step": 603129, "epoch": 7266} {"train_loss": -27.88457679748535, "global_step": 603130, "epoch": 7266} {"train_loss": -28.316986083984375, "global_step": 603131, "epoch": 7266} {"train_loss": -27.651920318603516, "global_step": 603132, "epoch": 7266} {"train_loss": -27.994054794311523, "global_step": 603133, "epoch": 7266} {"train_loss": -28.14375114440918, "global_step": 603134, "epoch": 7266} {"train_loss": -27.77836036682129, "global_step": 603135, "epoch": 7266} {"train_loss": -27.34498405456543, "global_step": 603136, "epoch": 7266} {"train_loss": -28.024457931518555, "global_step": 603137, "epoch": 7266} {"train_loss": -27.602680206298828, "global_step": 603138, "epoch": 7266} {"train_loss": -27.49159812927246, "global_step": 603139, "epoch": 7266} {"train_loss": -27.99526023864746, "global_step": 603140, "epoch": 7266} {"train_loss": -28.0786190032959, "global_step": 603141, "epoch": 7266} {"train_loss": -27.887908935546875, "global_step": 603142, "epoch": 7266} {"train_loss": -28.398298263549805, "global_step": 603143, "epoch": 7266} {"train_loss": -27.80543327331543, "global_step": 603144, "epoch": 7266} {"train_loss": -27.878992080688477, "global_step": 603145, "epoch": 7266} {"train_loss": -27.9573974609375, "global_step": 603146, "epoch": 7266} {"train_loss": -27.901123046875, "global_step": 603147, "epoch": 7266} {"train_loss": -27.735227584838867, "global_step": 603148, "epoch": 7266} {"train_loss": -27.326353073120117, "global_step": 603149, "epoch": 7266} {"train_loss": -28.111038208007812, "global_step": 603150, "epoch": 7266} {"train_loss": -28.097244262695312, "global_step": 603151, "epoch": 7266} {"train_loss": -28.28472328186035, "global_step": 603152, "epoch": 7266} {"train_loss": -27.897119522094727, "global_step": 603153, "epoch": 7266} {"train_loss": -27.868579864501953, "global_step": 603154, "epoch": 7266} {"train_loss": -28.21282386779785, "global_step": 603155, "epoch": 7266} {"train_loss": -27.80097007751465, "global_step": 603156, "epoch": 7266} {"train_loss": -28.042516708374023, "global_step": 603157, "epoch": 7266} {"train_loss": -28.068069458007812, "global_step": 603158, "epoch": 7266} {"train_loss": -27.926355361938477, "global_step": 603159, "epoch": 7266} {"train_loss": -27.965336834091737, "global_step": 603160, "epoch": 7266, "val_loss": 6725997.0} {"train_loss": -27.48811912536621, "global_step": 603161, "epoch": 7267} {"train_loss": -27.436002731323242, "global_step": 603162, "epoch": 7267} {"train_loss": -27.26589012145996, "global_step": 603163, "epoch": 7267} {"train_loss": -27.703832626342773, "global_step": 603164, "epoch": 7267} {"train_loss": -28.191654205322266, "global_step": 603165, "epoch": 7267} {"train_loss": -27.815881729125977, "global_step": 603166, "epoch": 7267} {"train_loss": -27.678171157836914, "global_step": 603167, "epoch": 7267} {"train_loss": -27.890827178955078, "global_step": 603168, "epoch": 7267} {"train_loss": -28.155981063842773, "global_step": 603169, "epoch": 7267} {"train_loss": -28.074472427368164, "global_step": 603170, "epoch": 7267} {"train_loss": -27.918426513671875, "global_step": 603171, "epoch": 7267} {"train_loss": -28.054702758789062, "global_step": 603172, "epoch": 7267} {"train_loss": -28.210355758666992, "global_step": 603173, "epoch": 7267} {"train_loss": -27.781558990478516, "global_step": 603174, "epoch": 7267} {"train_loss": -27.968530654907227, "global_step": 603175, "epoch": 7267} {"train_loss": -27.814130783081055, "global_step": 603176, "epoch": 7267} {"train_loss": -27.935606002807617, "global_step": 603177, "epoch": 7267} {"train_loss": -28.11061668395996, "global_step": 603178, "epoch": 7267} {"train_loss": -27.939544677734375, "global_step": 603179, "epoch": 7267} {"train_loss": -28.14702796936035, "global_step": 603180, "epoch": 7267} {"train_loss": -28.347797393798828, "global_step": 603181, "epoch": 7267} {"train_loss": -28.157394409179688, "global_step": 603182, "epoch": 7267} {"train_loss": -27.615005493164062, "global_step": 603183, "epoch": 7267} {"train_loss": -27.989721298217773, "global_step": 603184, "epoch": 7267} {"train_loss": -27.918365478515625, "global_step": 603185, "epoch": 7267} {"train_loss": -28.11086082458496, "global_step": 603186, "epoch": 7267} {"train_loss": -27.993200302124023, "global_step": 603187, "epoch": 7267} {"train_loss": -28.40736198425293, "global_step": 603188, "epoch": 7267} {"train_loss": -28.161508560180664, "global_step": 603189, "epoch": 7267} {"train_loss": -28.00972557067871, "global_step": 603190, "epoch": 7267} {"train_loss": -28.344263076782227, "global_step": 603191, "epoch": 7267} {"train_loss": -28.232446670532227, "global_step": 603192, "epoch": 7267} {"train_loss": -28.04681968688965, "global_step": 603193, "epoch": 7267} {"train_loss": -28.067358016967773, "global_step": 603194, "epoch": 7267} {"train_loss": -27.79408073425293, "global_step": 603195, "epoch": 7267} {"train_loss": -27.918521881103516, "global_step": 603196, "epoch": 7267} {"train_loss": -28.0218448638916, "global_step": 603197, "epoch": 7267} {"train_loss": -27.29774284362793, "global_step": 603198, "epoch": 7267} {"train_loss": -27.34808921813965, "global_step": 603199, "epoch": 7267} {"train_loss": -27.549299240112305, "global_step": 603200, "epoch": 7267} {"train_loss": -27.908411026000977, "global_step": 603201, "epoch": 7267} {"train_loss": -27.870275497436523, "global_step": 603202, "epoch": 7267} {"train_loss": -27.741239547729492, "global_step": 603203, "epoch": 7267} {"train_loss": -27.883380889892578, "global_step": 603204, "epoch": 7267} {"train_loss": -27.739850997924805, "global_step": 603205, "epoch": 7267} {"train_loss": -27.579740524291992, "global_step": 603206, "epoch": 7267} {"train_loss": -27.6106014251709, "global_step": 603207, "epoch": 7267} {"train_loss": -28.14985466003418, "global_step": 603208, "epoch": 7267} {"train_loss": -27.757694244384766, "global_step": 603209, "epoch": 7267} {"train_loss": -27.975982666015625, "global_step": 603210, "epoch": 7267} {"train_loss": -28.018667221069336, "global_step": 603211, "epoch": 7267} {"train_loss": -27.794864654541016, "global_step": 603212, "epoch": 7267} {"train_loss": -28.155241012573242, "global_step": 603213, "epoch": 7267} {"train_loss": -28.09027671813965, "global_step": 603214, "epoch": 7267} {"train_loss": -27.815204620361328, "global_step": 603215, "epoch": 7267} {"train_loss": -27.84248161315918, "global_step": 603216, "epoch": 7267} {"train_loss": -28.097705841064453, "global_step": 603217, "epoch": 7267} {"train_loss": -28.2740478515625, "global_step": 603218, "epoch": 7267} {"train_loss": -28.269140243530273, "global_step": 603219, "epoch": 7267} {"train_loss": -28.32452964782715, "global_step": 603220, "epoch": 7267} {"train_loss": -28.04193115234375, "global_step": 603221, "epoch": 7267} {"train_loss": -28.19508171081543, "global_step": 603222, "epoch": 7267} {"train_loss": -28.027572631835938, "global_step": 603223, "epoch": 7267} {"train_loss": -28.424957275390625, "global_step": 603224, "epoch": 7267} {"train_loss": -28.263427734375, "global_step": 603225, "epoch": 7267} {"train_loss": -28.05866050720215, "global_step": 603226, "epoch": 7267} {"train_loss": -27.876432418823242, "global_step": 603227, "epoch": 7267} {"train_loss": -28.001785278320312, "global_step": 603228, "epoch": 7267} {"train_loss": -27.85755729675293, "global_step": 603229, "epoch": 7267} {"train_loss": -28.101964950561523, "global_step": 603230, "epoch": 7267} {"train_loss": -28.1970157623291, "global_step": 603231, "epoch": 7267} {"train_loss": -28.03277015686035, "global_step": 603232, "epoch": 7267} {"train_loss": -28.072912216186523, "global_step": 603233, "epoch": 7267} {"train_loss": -27.88541603088379, "global_step": 603234, "epoch": 7267} {"train_loss": -28.349166870117188, "global_step": 603235, "epoch": 7267} {"train_loss": -28.045902252197266, "global_step": 603236, "epoch": 7267} {"train_loss": -27.9869441986084, "global_step": 603237, "epoch": 7267} {"train_loss": -27.973468780517578, "global_step": 603238, "epoch": 7267} {"train_loss": -27.91505241394043, "global_step": 603239, "epoch": 7267} {"train_loss": -28.2622013092041, "global_step": 603240, "epoch": 7267} {"train_loss": -28.278827667236328, "global_step": 603241, "epoch": 7267} {"train_loss": -28.14035415649414, "global_step": 603242, "epoch": 7267} {"train_loss": -27.96240622738758, "global_step": 603243, "epoch": 7267, "val_loss": 6771246.0} {"train_loss": -26.053876876831055, "global_step": 603244, "epoch": 7268} {"train_loss": -25.225961685180664, "global_step": 603245, "epoch": 7268} {"train_loss": -26.8110408782959, "global_step": 603246, "epoch": 7268} {"train_loss": -25.136615753173828, "global_step": 603247, "epoch": 7268} {"train_loss": -26.39971923828125, "global_step": 603248, "epoch": 7268} {"train_loss": -25.981632232666016, "global_step": 603249, "epoch": 7268} {"train_loss": -26.71185874938965, "global_step": 603250, "epoch": 7268} {"train_loss": -25.862768173217773, "global_step": 603251, "epoch": 7268} {"train_loss": -27.163190841674805, "global_step": 603252, "epoch": 7268} {"train_loss": -26.00457191467285, "global_step": 603253, "epoch": 7268} {"train_loss": -26.750104904174805, "global_step": 603254, "epoch": 7268} {"train_loss": -26.074331283569336, "global_step": 603255, "epoch": 7268} {"train_loss": -26.197927474975586, "global_step": 603256, "epoch": 7268} {"train_loss": -26.581008911132812, "global_step": 603257, "epoch": 7268} {"train_loss": -26.97608757019043, "global_step": 603258, "epoch": 7268} {"train_loss": -27.013385772705078, "global_step": 603259, "epoch": 7268} {"train_loss": -26.044809341430664, "global_step": 603260, "epoch": 7268} {"train_loss": -27.09027099609375, "global_step": 603261, "epoch": 7268} {"train_loss": -26.861780166625977, "global_step": 603262, "epoch": 7268} {"train_loss": -26.522247314453125, "global_step": 603263, "epoch": 7268} {"train_loss": -26.706701278686523, "global_step": 603264, "epoch": 7268} {"train_loss": -27.085174560546875, "global_step": 603265, "epoch": 7268} {"train_loss": -26.87090492248535, "global_step": 603266, "epoch": 7268} {"train_loss": -27.00933837890625, "global_step": 603267, "epoch": 7268} {"train_loss": -27.122055053710938, "global_step": 603268, "epoch": 7268} {"train_loss": -27.318628311157227, "global_step": 603269, "epoch": 7268} {"train_loss": -27.407257080078125, "global_step": 603270, "epoch": 7268} {"train_loss": -27.18570327758789, "global_step": 603271, "epoch": 7268} {"train_loss": -27.43839454650879, "global_step": 603272, "epoch": 7268} {"train_loss": -27.416723251342773, "global_step": 603273, "epoch": 7268} {"train_loss": -27.648971557617188, "global_step": 603274, "epoch": 7268} {"train_loss": -27.835241317749023, "global_step": 603275, "epoch": 7268} {"train_loss": -27.566740036010742, "global_step": 603276, "epoch": 7268} {"train_loss": -27.372159957885742, "global_step": 603277, "epoch": 7268} {"train_loss": -27.497217178344727, "global_step": 603278, "epoch": 7268} {"train_loss": -27.97450065612793, "global_step": 603279, "epoch": 7268} {"train_loss": -27.45789909362793, "global_step": 603280, "epoch": 7268} {"train_loss": -27.941238403320312, "global_step": 603281, "epoch": 7268} {"train_loss": -27.4243106842041, "global_step": 603282, "epoch": 7268} {"train_loss": -27.68204116821289, "global_step": 603283, "epoch": 7268} {"train_loss": -27.9279727935791, "global_step": 603284, "epoch": 7268} {"train_loss": -27.70619010925293, "global_step": 603285, "epoch": 7268} {"train_loss": -28.19439125061035, "global_step": 603286, "epoch": 7268} {"train_loss": -27.964139938354492, "global_step": 603287, "epoch": 7268} {"train_loss": -27.865482330322266, "global_step": 603288, "epoch": 7268} {"train_loss": -27.85199546813965, "global_step": 603289, "epoch": 7268} {"train_loss": -27.953388214111328, "global_step": 603290, "epoch": 7268} {"train_loss": -27.997058868408203, "global_step": 603291, "epoch": 7268} {"train_loss": -28.193317413330078, "global_step": 603292, "epoch": 7268} {"train_loss": -27.968549728393555, "global_step": 603293, "epoch": 7268} {"train_loss": -28.181228637695312, "global_step": 603294, "epoch": 7268} {"train_loss": -27.887121200561523, "global_step": 603295, "epoch": 7268} {"train_loss": -28.053659439086914, "global_step": 603296, "epoch": 7268} {"train_loss": -28.02960777282715, "global_step": 603297, "epoch": 7268} {"train_loss": -27.933795928955078, "global_step": 603298, "epoch": 7268} {"train_loss": -28.0782470703125, "global_step": 603299, "epoch": 7268} {"train_loss": -28.066699981689453, "global_step": 603300, "epoch": 7268} {"train_loss": -28.31268882751465, "global_step": 603301, "epoch": 7268} {"train_loss": -28.333404541015625, "global_step": 603302, "epoch": 7268} {"train_loss": -28.481489181518555, "global_step": 603303, "epoch": 7268} {"train_loss": -28.1855525970459, "global_step": 603304, "epoch": 7268} {"train_loss": -27.996185302734375, "global_step": 603305, "epoch": 7268} {"train_loss": -28.18610954284668, "global_step": 603306, "epoch": 7268} {"train_loss": -28.1457462310791, "global_step": 603307, "epoch": 7268} {"train_loss": -28.104217529296875, "global_step": 603308, "epoch": 7268} {"train_loss": -28.1088809967041, "global_step": 603309, "epoch": 7268} {"train_loss": -27.949447631835938, "global_step": 603310, "epoch": 7268} {"train_loss": -28.199567794799805, "global_step": 603311, "epoch": 7268} {"train_loss": -28.190021514892578, "global_step": 603312, "epoch": 7268} {"train_loss": -28.164575576782227, "global_step": 603313, "epoch": 7268} {"train_loss": -28.41448974609375, "global_step": 603314, "epoch": 7268} {"train_loss": -28.740570068359375, "global_step": 603315, "epoch": 7268} {"train_loss": -28.67685317993164, "global_step": 603316, "epoch": 7268} {"train_loss": -28.326215744018555, "global_step": 603317, "epoch": 7268} {"train_loss": -28.794580459594727, "global_step": 603318, "epoch": 7268} {"train_loss": -28.33881187438965, "global_step": 603319, "epoch": 7268} {"train_loss": -28.133996963500977, "global_step": 603320, "epoch": 7268} {"train_loss": -28.345123291015625, "global_step": 603321, "epoch": 7268} {"train_loss": -28.06943702697754, "global_step": 603322, "epoch": 7268} {"train_loss": -28.47019386291504, "global_step": 603323, "epoch": 7268} {"train_loss": -28.00504493713379, "global_step": 603324, "epoch": 7268} {"train_loss": -28.041763305664062, "global_step": 603325, "epoch": 7268} {"train_loss": -27.52784138415233, "global_step": 603326, "epoch": 7268, "val_loss": 6796726.0} {"train_loss": -26.908843994140625, "global_step": 603327, "epoch": 7269} {"train_loss": -26.603713989257812, "global_step": 603328, "epoch": 7269} {"train_loss": -27.1794490814209, "global_step": 603329, "epoch": 7269} {"train_loss": -27.40771484375, "global_step": 603330, "epoch": 7269} {"train_loss": -27.4168643951416, "global_step": 603331, "epoch": 7269} {"train_loss": -27.222387313842773, "global_step": 603332, "epoch": 7269} {"train_loss": -27.653284072875977, "global_step": 603333, "epoch": 7269} {"train_loss": -27.419885635375977, "global_step": 603334, "epoch": 7269} {"train_loss": -27.43537712097168, "global_step": 603335, "epoch": 7269} {"train_loss": -27.497852325439453, "global_step": 603336, "epoch": 7269} {"train_loss": -27.669973373413086, "global_step": 603337, "epoch": 7269} {"train_loss": -27.474557876586914, "global_step": 603338, "epoch": 7269} {"train_loss": -27.870275497436523, "global_step": 603339, "epoch": 7269} {"train_loss": -27.477222442626953, "global_step": 603340, "epoch": 7269} {"train_loss": -27.944204330444336, "global_step": 603341, "epoch": 7269} {"train_loss": -28.005659103393555, "global_step": 603342, "epoch": 7269} {"train_loss": -27.304967880249023, "global_step": 603343, "epoch": 7269} {"train_loss": -27.806625366210938, "global_step": 603344, "epoch": 7269} {"train_loss": -27.51521110534668, "global_step": 603345, "epoch": 7269} {"train_loss": -27.35587501525879, "global_step": 603346, "epoch": 7269} {"train_loss": -27.928390502929688, "global_step": 603347, "epoch": 7269} {"train_loss": -27.29833984375, "global_step": 603348, "epoch": 7269} {"train_loss": -27.603506088256836, "global_step": 603349, "epoch": 7269} {"train_loss": -27.960941314697266, "global_step": 603350, "epoch": 7269} {"train_loss": -27.527969360351562, "global_step": 603351, "epoch": 7269} {"train_loss": -27.983198165893555, "global_step": 603352, "epoch": 7269} {"train_loss": -27.69563865661621, "global_step": 603353, "epoch": 7269} {"train_loss": -27.86355972290039, "global_step": 603354, "epoch": 7269} {"train_loss": -27.706958770751953, "global_step": 603355, "epoch": 7269} {"train_loss": -27.896879196166992, "global_step": 603356, "epoch": 7269} {"train_loss": -28.055099487304688, "global_step": 603357, "epoch": 7269} {"train_loss": -27.50620460510254, "global_step": 603358, "epoch": 7269} {"train_loss": -28.105634689331055, "global_step": 603359, "epoch": 7269} {"train_loss": -27.308917999267578, "global_step": 603360, "epoch": 7269} {"train_loss": -27.77255630493164, "global_step": 603361, "epoch": 7269} {"train_loss": -27.720401763916016, "global_step": 603362, "epoch": 7269} {"train_loss": -28.0909366607666, "global_step": 603363, "epoch": 7269} {"train_loss": -27.948286056518555, "global_step": 603364, "epoch": 7269} {"train_loss": -28.01995849609375, "global_step": 603365, "epoch": 7269} {"train_loss": -28.159643173217773, "global_step": 603366, "epoch": 7269} {"train_loss": -27.83353042602539, "global_step": 603367, "epoch": 7269} {"train_loss": -27.675003051757812, "global_step": 603368, "epoch": 7269} {"train_loss": -28.131376266479492, "global_step": 603369, "epoch": 7269} {"train_loss": -28.12917137145996, "global_step": 603370, "epoch": 7269} {"train_loss": -28.44732666015625, "global_step": 603371, "epoch": 7269} {"train_loss": -28.2585506439209, "global_step": 603372, "epoch": 7269} {"train_loss": -28.00802993774414, "global_step": 603373, "epoch": 7269} {"train_loss": -27.932851791381836, "global_step": 603374, "epoch": 7269} {"train_loss": -28.10406494140625, "global_step": 603375, "epoch": 7269} {"train_loss": -28.221155166625977, "global_step": 603376, "epoch": 7269} {"train_loss": -27.922992706298828, "global_step": 603377, "epoch": 7269} {"train_loss": -28.127304077148438, "global_step": 603378, "epoch": 7269} {"train_loss": -28.249256134033203, "global_step": 603379, "epoch": 7269} {"train_loss": -28.195819854736328, "global_step": 603380, "epoch": 7269} {"train_loss": -27.847412109375, "global_step": 603381, "epoch": 7269} {"train_loss": -28.565458297729492, "global_step": 603382, "epoch": 7269} {"train_loss": -28.54194450378418, "global_step": 603383, "epoch": 7269} {"train_loss": -27.81267738342285, "global_step": 603384, "epoch": 7269} {"train_loss": -28.18360710144043, "global_step": 603385, "epoch": 7269} {"train_loss": -28.25008201599121, "global_step": 603386, "epoch": 7269} {"train_loss": -28.434799194335938, "global_step": 603387, "epoch": 7269} {"train_loss": -28.290058135986328, "global_step": 603388, "epoch": 7269} {"train_loss": -28.311803817749023, "global_step": 603389, "epoch": 7269} {"train_loss": -28.2922306060791, "global_step": 603390, "epoch": 7269} {"train_loss": -28.269495010375977, "global_step": 603391, "epoch": 7269} {"train_loss": -28.520116806030273, "global_step": 603392, "epoch": 7269} {"train_loss": -27.898574829101562, "global_step": 603393, "epoch": 7269} {"train_loss": -28.424222946166992, "global_step": 603394, "epoch": 7269} {"train_loss": -28.476404190063477, "global_step": 603395, "epoch": 7269} {"train_loss": -28.132795333862305, "global_step": 603396, "epoch": 7269} {"train_loss": -28.479841232299805, "global_step": 603397, "epoch": 7269} {"train_loss": -28.06255531311035, "global_step": 603398, "epoch": 7269} {"train_loss": -28.09730339050293, "global_step": 603399, "epoch": 7269} {"train_loss": -28.00918960571289, "global_step": 603400, "epoch": 7269} {"train_loss": -28.38996696472168, "global_step": 603401, "epoch": 7269} {"train_loss": -27.784122467041016, "global_step": 603402, "epoch": 7269} {"train_loss": -27.887744903564453, "global_step": 603403, "epoch": 7269} {"train_loss": -27.736896514892578, "global_step": 603404, "epoch": 7269} {"train_loss": -27.976511001586914, "global_step": 603405, "epoch": 7269} {"train_loss": -27.959070205688477, "global_step": 603406, "epoch": 7269} {"train_loss": -27.6608943939209, "global_step": 603407, "epoch": 7269} {"train_loss": -28.450347900390625, "global_step": 603408, "epoch": 7269} {"train_loss": -27.887700322162676, "global_step": 603409, "epoch": 7269, "val_loss": 6831088.5} {"train_loss": -27.84687614440918, "global_step": 603410, "epoch": 7270} {"train_loss": -27.625158309936523, "global_step": 603411, "epoch": 7270} {"train_loss": -26.923572540283203, "global_step": 603412, "epoch": 7270} {"train_loss": -26.18528175354004, "global_step": 603413, "epoch": 7270} {"train_loss": -26.995330810546875, "global_step": 603414, "epoch": 7270} {"train_loss": -27.728971481323242, "global_step": 603415, "epoch": 7270} {"train_loss": -26.85809326171875, "global_step": 603416, "epoch": 7270} {"train_loss": -27.066709518432617, "global_step": 603417, "epoch": 7270} {"train_loss": -27.95730972290039, "global_step": 603418, "epoch": 7270} {"train_loss": -27.491230010986328, "global_step": 603419, "epoch": 7270} {"train_loss": -27.351850509643555, "global_step": 603420, "epoch": 7270} {"train_loss": -27.207080841064453, "global_step": 603421, "epoch": 7270} {"train_loss": -27.22321891784668, "global_step": 603422, "epoch": 7270} {"train_loss": -28.051511764526367, "global_step": 603423, "epoch": 7270} {"train_loss": -27.436843872070312, "global_step": 603424, "epoch": 7270} {"train_loss": -27.622608184814453, "global_step": 603425, "epoch": 7270} {"train_loss": -27.19672966003418, "global_step": 603426, "epoch": 7270} {"train_loss": -27.62183952331543, "global_step": 603427, "epoch": 7270} {"train_loss": -27.592248916625977, "global_step": 603428, "epoch": 7270} {"train_loss": -27.5224609375, "global_step": 603429, "epoch": 7270} {"train_loss": -27.54499626159668, "global_step": 603430, "epoch": 7270} {"train_loss": -27.968236923217773, "global_step": 603431, "epoch": 7270} {"train_loss": -27.7705135345459, "global_step": 603432, "epoch": 7270} {"train_loss": -27.881052017211914, "global_step": 603433, "epoch": 7270} {"train_loss": -27.782983779907227, "global_step": 603434, "epoch": 7270} {"train_loss": -28.014373779296875, "global_step": 603435, "epoch": 7270} {"train_loss": -27.885726928710938, "global_step": 603436, "epoch": 7270} {"train_loss": -27.857404708862305, "global_step": 603437, "epoch": 7270} {"train_loss": -28.06272315979004, "global_step": 603438, "epoch": 7270} {"train_loss": -27.58455467224121, "global_step": 603439, "epoch": 7270} {"train_loss": -27.908971786499023, "global_step": 603440, "epoch": 7270} {"train_loss": -27.875900268554688, "global_step": 603441, "epoch": 7270} {"train_loss": -27.39667320251465, "global_step": 603442, "epoch": 7270} {"train_loss": -27.80356216430664, "global_step": 603443, "epoch": 7270} {"train_loss": -27.77349853515625, "global_step": 603444, "epoch": 7270} {"train_loss": -28.08370018005371, "global_step": 603445, "epoch": 7270} {"train_loss": -28.13681411743164, "global_step": 603446, "epoch": 7270} {"train_loss": -27.311803817749023, "global_step": 603447, "epoch": 7270} {"train_loss": -27.897428512573242, "global_step": 603448, "epoch": 7270} {"train_loss": -27.9647274017334, "global_step": 603449, "epoch": 7270} {"train_loss": -27.99489402770996, "global_step": 603450, "epoch": 7270} {"train_loss": -27.9929141998291, "global_step": 603451, "epoch": 7270} {"train_loss": -27.896427154541016, "global_step": 603452, "epoch": 7270} {"train_loss": -27.9901065826416, "global_step": 603453, "epoch": 7270} {"train_loss": -28.117919921875, "global_step": 603454, "epoch": 7270} {"train_loss": -28.18816566467285, "global_step": 603455, "epoch": 7270} {"train_loss": -28.0918025970459, "global_step": 603456, "epoch": 7270} {"train_loss": -28.625356674194336, "global_step": 603457, "epoch": 7270} {"train_loss": -28.169660568237305, "global_step": 603458, "epoch": 7270} {"train_loss": -27.89499855041504, "global_step": 603459, "epoch": 7270} {"train_loss": -27.602048873901367, "global_step": 603460, "epoch": 7270} {"train_loss": -28.171335220336914, "global_step": 603461, "epoch": 7270} {"train_loss": -28.232776641845703, "global_step": 603462, "epoch": 7270} {"train_loss": -28.11153221130371, "global_step": 603463, "epoch": 7270} {"train_loss": -28.550052642822266, "global_step": 603464, "epoch": 7270} {"train_loss": -28.243932723999023, "global_step": 603465, "epoch": 7270} {"train_loss": -28.050817489624023, "global_step": 603466, "epoch": 7270} {"train_loss": -28.25127601623535, "global_step": 603467, "epoch": 7270} {"train_loss": -28.176313400268555, "global_step": 603468, "epoch": 7270} {"train_loss": -28.264881134033203, "global_step": 603469, "epoch": 7270} {"train_loss": -28.026172637939453, "global_step": 603470, "epoch": 7270} {"train_loss": -28.42042350769043, "global_step": 603471, "epoch": 7270} {"train_loss": -27.966678619384766, "global_step": 603472, "epoch": 7270} {"train_loss": -28.228376388549805, "global_step": 603473, "epoch": 7270} {"train_loss": -28.29195213317871, "global_step": 603474, "epoch": 7270} {"train_loss": -28.25664710998535, "global_step": 603475, "epoch": 7270} {"train_loss": -28.61067771911621, "global_step": 603476, "epoch": 7270} {"train_loss": -28.478498458862305, "global_step": 603477, "epoch": 7270} {"train_loss": -27.9932918548584, "global_step": 603478, "epoch": 7270} {"train_loss": -28.40130615234375, "global_step": 603479, "epoch": 7270} {"train_loss": -28.453317642211914, "global_step": 603480, "epoch": 7270} {"train_loss": -28.33582878112793, "global_step": 603481, "epoch": 7270} {"train_loss": -28.294870376586914, "global_step": 603482, "epoch": 7270} {"train_loss": -28.47458267211914, "global_step": 603483, "epoch": 7270} {"train_loss": -28.422290802001953, "global_step": 603484, "epoch": 7270} {"train_loss": -28.01399040222168, "global_step": 603485, "epoch": 7270} {"train_loss": -28.425832748413086, "global_step": 603486, "epoch": 7270} {"train_loss": -28.047744750976562, "global_step": 603487, "epoch": 7270} {"train_loss": -27.606830596923828, "global_step": 603488, "epoch": 7270} {"train_loss": -28.151193618774414, "global_step": 603489, "epoch": 7270} {"train_loss": -27.748233795166016, "global_step": 603490, "epoch": 7270} {"train_loss": -27.529071807861328, "global_step": 603491, "epoch": 7270} {"train_loss": -27.86511276428958, "global_step": 603492, "epoch": 7270, "val_loss": 6786976.0} {"train_loss": -16.39434242248535, "global_step": 603493, "epoch": 7271} {"train_loss": -20.74867057800293, "global_step": 603494, "epoch": 7271} {"train_loss": -24.927366256713867, "global_step": 603495, "epoch": 7271} {"train_loss": -23.20499038696289, "global_step": 603496, "epoch": 7271} {"train_loss": -24.708330154418945, "global_step": 603497, "epoch": 7271} {"train_loss": -25.688507080078125, "global_step": 603498, "epoch": 7271} {"train_loss": -24.849679946899414, "global_step": 603499, "epoch": 7271} {"train_loss": -26.144092559814453, "global_step": 603500, "epoch": 7271} {"train_loss": -25.247560501098633, "global_step": 603501, "epoch": 7271} {"train_loss": -25.106287002563477, "global_step": 603502, "epoch": 7271} {"train_loss": -25.81064224243164, "global_step": 603503, "epoch": 7271} {"train_loss": -25.606231689453125, "global_step": 603504, "epoch": 7271} {"train_loss": -26.00017738342285, "global_step": 603505, "epoch": 7271} {"train_loss": -26.277942657470703, "global_step": 603506, "epoch": 7271} {"train_loss": -25.7559814453125, "global_step": 603507, "epoch": 7271} {"train_loss": -25.89588737487793, "global_step": 603508, "epoch": 7271} {"train_loss": -26.5343017578125, "global_step": 603509, "epoch": 7271} {"train_loss": -26.567075729370117, "global_step": 603510, "epoch": 7271} {"train_loss": -26.273712158203125, "global_step": 603511, "epoch": 7271} {"train_loss": -26.297216415405273, "global_step": 603512, "epoch": 7271} {"train_loss": -26.291141510009766, "global_step": 603513, "epoch": 7271} {"train_loss": -26.460363388061523, "global_step": 603514, "epoch": 7271} {"train_loss": -26.931936264038086, "global_step": 603515, "epoch": 7271} {"train_loss": -26.578338623046875, "global_step": 603516, "epoch": 7271} {"train_loss": -26.67408561706543, "global_step": 603517, "epoch": 7271} {"train_loss": -26.711669921875, "global_step": 603518, "epoch": 7271} {"train_loss": -26.95882225036621, "global_step": 603519, "epoch": 7271} {"train_loss": -26.921762466430664, "global_step": 603520, "epoch": 7271} {"train_loss": -26.741003036499023, "global_step": 603521, "epoch": 7271} {"train_loss": -26.98313331604004, "global_step": 603522, "epoch": 7271} {"train_loss": -27.184661865234375, "global_step": 603523, "epoch": 7271} {"train_loss": -27.028858184814453, "global_step": 603524, "epoch": 7271} {"train_loss": -27.361419677734375, "global_step": 603525, "epoch": 7271} {"train_loss": -26.89251708984375, "global_step": 603526, "epoch": 7271} {"train_loss": -27.00910758972168, "global_step": 603527, "epoch": 7271} {"train_loss": -27.32015037536621, "global_step": 603528, "epoch": 7271} {"train_loss": -26.806955337524414, "global_step": 603529, "epoch": 7271} {"train_loss": -27.05954933166504, "global_step": 603530, "epoch": 7271} {"train_loss": -27.260522842407227, "global_step": 603531, "epoch": 7271} {"train_loss": -27.6510066986084, "global_step": 603532, "epoch": 7271} {"train_loss": -27.19097900390625, "global_step": 603533, "epoch": 7271} {"train_loss": -27.243762969970703, "global_step": 603534, "epoch": 7271} {"train_loss": -27.434558868408203, "global_step": 603535, "epoch": 7271} {"train_loss": -27.7158145904541, "global_step": 603536, "epoch": 7271} {"train_loss": -27.72832679748535, "global_step": 603537, "epoch": 7271} {"train_loss": -27.32733154296875, "global_step": 603538, "epoch": 7271} {"train_loss": -27.57877540588379, "global_step": 603539, "epoch": 7271} {"train_loss": -27.610843658447266, "global_step": 603540, "epoch": 7271} {"train_loss": -28.13065528869629, "global_step": 603541, "epoch": 7271} {"train_loss": -27.623733520507812, "global_step": 603542, "epoch": 7271} {"train_loss": -27.593765258789062, "global_step": 603543, "epoch": 7271} {"train_loss": -27.9222412109375, "global_step": 603544, "epoch": 7271} {"train_loss": -27.864221572875977, "global_step": 603545, "epoch": 7271} {"train_loss": -27.49958610534668, "global_step": 603546, "epoch": 7271} {"train_loss": -28.025135040283203, "global_step": 603547, "epoch": 7271} {"train_loss": -28.076745986938477, "global_step": 603548, "epoch": 7271} {"train_loss": -27.498449325561523, "global_step": 603549, "epoch": 7271} {"train_loss": -27.68317985534668, "global_step": 603550, "epoch": 7271} {"train_loss": -28.008642196655273, "global_step": 603551, "epoch": 7271} {"train_loss": -27.62415885925293, "global_step": 603552, "epoch": 7271} {"train_loss": -28.110401153564453, "global_step": 603553, "epoch": 7271} {"train_loss": -27.959989547729492, "global_step": 603554, "epoch": 7271} {"train_loss": -27.754873275756836, "global_step": 603555, "epoch": 7271} {"train_loss": -28.13134765625, "global_step": 603556, "epoch": 7271} {"train_loss": -28.185440063476562, "global_step": 603557, "epoch": 7271} {"train_loss": -27.9538516998291, "global_step": 603558, "epoch": 7271} {"train_loss": -28.023962020874023, "global_step": 603559, "epoch": 7271} {"train_loss": -27.723188400268555, "global_step": 603560, "epoch": 7271} {"train_loss": -27.8308162689209, "global_step": 603561, "epoch": 7271} {"train_loss": -28.0064697265625, "global_step": 603562, "epoch": 7271} {"train_loss": -28.165395736694336, "global_step": 603563, "epoch": 7271} {"train_loss": -27.992822647094727, "global_step": 603564, "epoch": 7271} {"train_loss": -28.125951766967773, "global_step": 603565, "epoch": 7271} {"train_loss": -28.222705841064453, "global_step": 603566, "epoch": 7271} {"train_loss": -28.29218864440918, "global_step": 603567, "epoch": 7271} {"train_loss": -28.279890060424805, "global_step": 603568, "epoch": 7271} {"train_loss": -28.600330352783203, "global_step": 603569, "epoch": 7271} {"train_loss": -28.17132568359375, "global_step": 603570, "epoch": 7271} {"train_loss": -28.40935707092285, "global_step": 603571, "epoch": 7271} {"train_loss": -27.8106689453125, "global_step": 603572, "epoch": 7271} {"train_loss": -27.887792587280273, "global_step": 603573, "epoch": 7271} {"train_loss": -28.252790451049805, "global_step": 603574, "epoch": 7271} {"train_loss": -26.927415181355304, "global_step": 603575, "epoch": 7271, "val_loss": 6801397.5} {"train_loss": -27.504316329956055, "global_step": 603576, "epoch": 7272} {"train_loss": -27.622360229492188, "global_step": 603577, "epoch": 7272} {"train_loss": -27.51857566833496, "global_step": 603578, "epoch": 7272} {"train_loss": -28.067380905151367, "global_step": 603579, "epoch": 7272} {"train_loss": -27.93580436706543, "global_step": 603580, "epoch": 7272} {"train_loss": -27.463134765625, "global_step": 603581, "epoch": 7272} {"train_loss": -27.634687423706055, "global_step": 603582, "epoch": 7272} {"train_loss": -27.37733268737793, "global_step": 603583, "epoch": 7272} {"train_loss": -27.661346435546875, "global_step": 603584, "epoch": 7272} {"train_loss": -27.499088287353516, "global_step": 603585, "epoch": 7272} {"train_loss": -28.041095733642578, "global_step": 603586, "epoch": 7272} {"train_loss": -28.056684494018555, "global_step": 603587, "epoch": 7272} {"train_loss": -27.598413467407227, "global_step": 603588, "epoch": 7272} {"train_loss": -28.12750244140625, "global_step": 603589, "epoch": 7272} {"train_loss": -28.026901245117188, "global_step": 603590, "epoch": 7272} {"train_loss": -27.79524040222168, "global_step": 603591, "epoch": 7272} {"train_loss": -27.623987197875977, "global_step": 603592, "epoch": 7272} {"train_loss": -27.624744415283203, "global_step": 603593, "epoch": 7272} {"train_loss": -27.717069625854492, "global_step": 603594, "epoch": 7272} {"train_loss": -28.139652252197266, "global_step": 603595, "epoch": 7272} {"train_loss": -27.792606353759766, "global_step": 603596, "epoch": 7272} {"train_loss": -27.897741317749023, "global_step": 603597, "epoch": 7272} {"train_loss": -28.002899169921875, "global_step": 603598, "epoch": 7272} {"train_loss": -28.12000846862793, "global_step": 603599, "epoch": 7272} {"train_loss": -27.805587768554688, "global_step": 603600, "epoch": 7272} {"train_loss": -28.26445960998535, "global_step": 603601, "epoch": 7272} {"train_loss": -28.0018367767334, "global_step": 603602, "epoch": 7272} {"train_loss": -27.90744972229004, "global_step": 603603, "epoch": 7272} {"train_loss": -28.184656143188477, "global_step": 603604, "epoch": 7272} {"train_loss": -27.87019157409668, "global_step": 603605, "epoch": 7272} {"train_loss": -27.927417755126953, "global_step": 603606, "epoch": 7272} {"train_loss": -28.5228271484375, "global_step": 603607, "epoch": 7272} {"train_loss": -27.99125099182129, "global_step": 603608, "epoch": 7272} {"train_loss": -28.16835594177246, "global_step": 603609, "epoch": 7272} {"train_loss": -28.115957260131836, "global_step": 603610, "epoch": 7272} {"train_loss": -28.35517692565918, "global_step": 603611, "epoch": 7272} {"train_loss": -28.1475830078125, "global_step": 603612, "epoch": 7272} {"train_loss": -28.457319259643555, "global_step": 603613, "epoch": 7272} {"train_loss": -28.110126495361328, "global_step": 603614, "epoch": 7272} {"train_loss": -28.489465713500977, "global_step": 603615, "epoch": 7272} {"train_loss": -28.408843994140625, "global_step": 603616, "epoch": 7272} {"train_loss": -28.27617835998535, "global_step": 603617, "epoch": 7272} {"train_loss": -27.832538604736328, "global_step": 603618, "epoch": 7272} {"train_loss": -28.160263061523438, "global_step": 603619, "epoch": 7272} {"train_loss": -28.6290283203125, "global_step": 603620, "epoch": 7272} {"train_loss": -28.347808837890625, "global_step": 603621, "epoch": 7272} {"train_loss": -28.14938735961914, "global_step": 603622, "epoch": 7272} {"train_loss": -28.154224395751953, "global_step": 603623, "epoch": 7272} {"train_loss": -28.12379264831543, "global_step": 603624, "epoch": 7272} {"train_loss": -28.668912887573242, "global_step": 603625, "epoch": 7272} {"train_loss": -28.2863826751709, "global_step": 603626, "epoch": 7272} {"train_loss": -27.872766494750977, "global_step": 603627, "epoch": 7272} {"train_loss": -28.321014404296875, "global_step": 603628, "epoch": 7272} {"train_loss": -28.279150009155273, "global_step": 603629, "epoch": 7272} {"train_loss": -28.11585807800293, "global_step": 603630, "epoch": 7272} {"train_loss": -28.29033851623535, "global_step": 603631, "epoch": 7272} {"train_loss": -27.997617721557617, "global_step": 603632, "epoch": 7272} {"train_loss": -28.37274169921875, "global_step": 603633, "epoch": 7272} {"train_loss": -28.67999267578125, "global_step": 603634, "epoch": 7272} {"train_loss": -28.132604598999023, "global_step": 603635, "epoch": 7272} {"train_loss": -28.325117111206055, "global_step": 603636, "epoch": 7272} {"train_loss": -28.105823516845703, "global_step": 603637, "epoch": 7272} {"train_loss": -28.43851661682129, "global_step": 603638, "epoch": 7272} {"train_loss": -28.180011749267578, "global_step": 603639, "epoch": 7272} {"train_loss": -27.933637619018555, "global_step": 603640, "epoch": 7272} {"train_loss": -28.321958541870117, "global_step": 603641, "epoch": 7272} {"train_loss": -28.110437393188477, "global_step": 603642, "epoch": 7272} {"train_loss": -28.069089889526367, "global_step": 603643, "epoch": 7272} {"train_loss": -28.385528564453125, "global_step": 603644, "epoch": 7272} {"train_loss": -27.618927001953125, "global_step": 603645, "epoch": 7272} {"train_loss": -27.716629028320312, "global_step": 603646, "epoch": 7272} {"train_loss": -27.67170524597168, "global_step": 603647, "epoch": 7272} {"train_loss": -28.196630477905273, "global_step": 603648, "epoch": 7272} {"train_loss": -28.102069854736328, "global_step": 603649, "epoch": 7272} {"train_loss": -27.991376876831055, "global_step": 603650, "epoch": 7272} {"train_loss": -27.522506713867188, "global_step": 603651, "epoch": 7272} {"train_loss": -28.164770126342773, "global_step": 603652, "epoch": 7272} {"train_loss": -28.1015567779541, "global_step": 603653, "epoch": 7272} {"train_loss": -28.042139053344727, "global_step": 603654, "epoch": 7272} {"train_loss": -28.445032119750977, "global_step": 603655, "epoch": 7272} {"train_loss": -28.072834014892578, "global_step": 603656, "epoch": 7272} {"train_loss": -28.293684005737305, "global_step": 603657, "epoch": 7272} {"train_loss": -28.05228771071836, "global_step": 603658, "epoch": 7272, "val_loss": 6837461.0} {"train_loss": -27.534921646118164, "global_step": 603659, "epoch": 7273} {"train_loss": -27.723358154296875, "global_step": 603660, "epoch": 7273} {"train_loss": -27.810049057006836, "global_step": 603661, "epoch": 7273} {"train_loss": -27.28706169128418, "global_step": 603662, "epoch": 7273} {"train_loss": -27.798887252807617, "global_step": 603663, "epoch": 7273} {"train_loss": -27.4010066986084, "global_step": 603664, "epoch": 7273} {"train_loss": -27.743825912475586, "global_step": 603665, "epoch": 7273} {"train_loss": -27.9677677154541, "global_step": 603666, "epoch": 7273} {"train_loss": -27.722951889038086, "global_step": 603667, "epoch": 7273} {"train_loss": -27.713821411132812, "global_step": 603668, "epoch": 7273} {"train_loss": -27.53230094909668, "global_step": 603669, "epoch": 7273} {"train_loss": -27.5720272064209, "global_step": 603670, "epoch": 7273} {"train_loss": -27.865188598632812, "global_step": 603671, "epoch": 7273} {"train_loss": -27.834829330444336, "global_step": 603672, "epoch": 7273} {"train_loss": -27.945112228393555, "global_step": 603673, "epoch": 7273} {"train_loss": -27.737445831298828, "global_step": 603674, "epoch": 7273} {"train_loss": -27.897247314453125, "global_step": 603675, "epoch": 7273} {"train_loss": -27.927412033081055, "global_step": 603676, "epoch": 7273} {"train_loss": -27.782697677612305, "global_step": 603677, "epoch": 7273} {"train_loss": -28.081350326538086, "global_step": 603678, "epoch": 7273} {"train_loss": -28.154123306274414, "global_step": 603679, "epoch": 7273} {"train_loss": -28.009445190429688, "global_step": 603680, "epoch": 7273} {"train_loss": -27.832809448242188, "global_step": 603681, "epoch": 7273} {"train_loss": -28.093341827392578, "global_step": 603682, "epoch": 7273} {"train_loss": -27.988080978393555, "global_step": 603683, "epoch": 7273} {"train_loss": -28.13372230529785, "global_step": 603684, "epoch": 7273} {"train_loss": -28.300302505493164, "global_step": 603685, "epoch": 7273} {"train_loss": -28.626733779907227, "global_step": 603686, "epoch": 7273} {"train_loss": -27.72443199157715, "global_step": 603687, "epoch": 7273} {"train_loss": -28.3577880859375, "global_step": 603688, "epoch": 7273} {"train_loss": -28.29450035095215, "global_step": 603689, "epoch": 7273} {"train_loss": -27.990253448486328, "global_step": 603690, "epoch": 7273} {"train_loss": -28.050888061523438, "global_step": 603691, "epoch": 7273} {"train_loss": -28.47585105895996, "global_step": 603692, "epoch": 7273} {"train_loss": -28.218280792236328, "global_step": 603693, "epoch": 7273} {"train_loss": -28.167577743530273, "global_step": 603694, "epoch": 7273} {"train_loss": -28.43418312072754, "global_step": 603695, "epoch": 7273} {"train_loss": -28.16181755065918, "global_step": 603696, "epoch": 7273} {"train_loss": -27.997638702392578, "global_step": 603697, "epoch": 7273} {"train_loss": -28.288455963134766, "global_step": 603698, "epoch": 7273} {"train_loss": -28.076513290405273, "global_step": 603699, "epoch": 7273} {"train_loss": -27.72828483581543, "global_step": 603700, "epoch": 7273} {"train_loss": -28.123777389526367, "global_step": 603701, "epoch": 7273} {"train_loss": -27.9010066986084, "global_step": 603702, "epoch": 7273} {"train_loss": -28.189300537109375, "global_step": 603703, "epoch": 7273} {"train_loss": -27.708511352539062, "global_step": 603704, "epoch": 7273} {"train_loss": -27.79254150390625, "global_step": 603705, "epoch": 7273} {"train_loss": -28.05585289001465, "global_step": 603706, "epoch": 7273} {"train_loss": -28.382089614868164, "global_step": 603707, "epoch": 7273} {"train_loss": -27.8237247467041, "global_step": 603708, "epoch": 7273} {"train_loss": -27.707860946655273, "global_step": 603709, "epoch": 7273} {"train_loss": -28.172229766845703, "global_step": 603710, "epoch": 7273} {"train_loss": -28.351444244384766, "global_step": 603711, "epoch": 7273} {"train_loss": -28.36406898498535, "global_step": 603712, "epoch": 7273} {"train_loss": -28.129606246948242, "global_step": 603713, "epoch": 7273} {"train_loss": -28.188074111938477, "global_step": 603714, "epoch": 7273} {"train_loss": -28.53763771057129, "global_step": 603715, "epoch": 7273} {"train_loss": -27.951318740844727, "global_step": 603716, "epoch": 7273} {"train_loss": -28.13726234436035, "global_step": 603717, "epoch": 7273} {"train_loss": -28.107147216796875, "global_step": 603718, "epoch": 7273} {"train_loss": -28.134958267211914, "global_step": 603719, "epoch": 7273} {"train_loss": -28.21087646484375, "global_step": 603720, "epoch": 7273} {"train_loss": -28.111913681030273, "global_step": 603721, "epoch": 7273} {"train_loss": -28.2197208404541, "global_step": 603722, "epoch": 7273} {"train_loss": -28.063077926635742, "global_step": 603723, "epoch": 7273} {"train_loss": -27.883676528930664, "global_step": 603724, "epoch": 7273} {"train_loss": -28.156600952148438, "global_step": 603725, "epoch": 7273} {"train_loss": -28.07990837097168, "global_step": 603726, "epoch": 7273} {"train_loss": -28.347919464111328, "global_step": 603727, "epoch": 7273} {"train_loss": -28.3050479888916, "global_step": 603728, "epoch": 7273} {"train_loss": -28.605844497680664, "global_step": 603729, "epoch": 7273} {"train_loss": -28.130273818969727, "global_step": 603730, "epoch": 7273} {"train_loss": -28.386646270751953, "global_step": 603731, "epoch": 7273} {"train_loss": -28.211151123046875, "global_step": 603732, "epoch": 7273} {"train_loss": -28.16379165649414, "global_step": 603733, "epoch": 7273} {"train_loss": -28.123645782470703, "global_step": 603734, "epoch": 7273} {"train_loss": -28.34248924255371, "global_step": 603735, "epoch": 7273} {"train_loss": -28.109195709228516, "global_step": 603736, "epoch": 7273} {"train_loss": -28.285144805908203, "global_step": 603737, "epoch": 7273} {"train_loss": -27.88577651977539, "global_step": 603738, "epoch": 7273} {"train_loss": -27.920425415039062, "global_step": 603739, "epoch": 7273} {"train_loss": -27.837528228759766, "global_step": 603740, "epoch": 7273} {"train_loss": -28.050355336752283, "global_step": 603741, "epoch": 7273, "val_loss": 6863710.0} {"train_loss": -26.54620933532715, "global_step": 603742, "epoch": 7274} {"train_loss": -25.236459732055664, "global_step": 603743, "epoch": 7274} {"train_loss": -25.868560791015625, "global_step": 603744, "epoch": 7274} {"train_loss": -23.76263999938965, "global_step": 603745, "epoch": 7274} {"train_loss": -23.440793991088867, "global_step": 603746, "epoch": 7274} {"train_loss": -26.85000991821289, "global_step": 603747, "epoch": 7274} {"train_loss": -24.591970443725586, "global_step": 603748, "epoch": 7274} {"train_loss": -25.57948875427246, "global_step": 603749, "epoch": 7274} {"train_loss": -26.481618881225586, "global_step": 603750, "epoch": 7274} {"train_loss": -26.32097816467285, "global_step": 603751, "epoch": 7274} {"train_loss": -26.096017837524414, "global_step": 603752, "epoch": 7274} {"train_loss": -26.669620513916016, "global_step": 603753, "epoch": 7274} {"train_loss": -26.231586456298828, "global_step": 603754, "epoch": 7274} {"train_loss": -26.926071166992188, "global_step": 603755, "epoch": 7274} {"train_loss": -26.800521850585938, "global_step": 603756, "epoch": 7274} {"train_loss": -27.078527450561523, "global_step": 603757, "epoch": 7274} {"train_loss": -27.128814697265625, "global_step": 603758, "epoch": 7274} {"train_loss": -26.5953369140625, "global_step": 603759, "epoch": 7274} {"train_loss": -27.33355140686035, "global_step": 603760, "epoch": 7274} {"train_loss": -27.308191299438477, "global_step": 603761, "epoch": 7274} {"train_loss": -27.108945846557617, "global_step": 603762, "epoch": 7274} {"train_loss": -27.307342529296875, "global_step": 603763, "epoch": 7274} {"train_loss": -27.644739151000977, "global_step": 603764, "epoch": 7274} {"train_loss": -27.552274703979492, "global_step": 603765, "epoch": 7274} {"train_loss": -27.416522979736328, "global_step": 603766, "epoch": 7274} {"train_loss": -27.246597290039062, "global_step": 603767, "epoch": 7274} {"train_loss": -27.42854118347168, "global_step": 603768, "epoch": 7274} {"train_loss": -27.386816024780273, "global_step": 603769, "epoch": 7274} {"train_loss": -27.586530685424805, "global_step": 603770, "epoch": 7274} {"train_loss": -27.69244384765625, "global_step": 603771, "epoch": 7274} {"train_loss": -27.463232040405273, "global_step": 603772, "epoch": 7274} {"train_loss": -27.448322296142578, "global_step": 603773, "epoch": 7274} {"train_loss": -27.6463680267334, "global_step": 603774, "epoch": 7274} {"train_loss": -27.67288589477539, "global_step": 603775, "epoch": 7274} {"train_loss": -27.45249366760254, "global_step": 603776, "epoch": 7274} {"train_loss": -27.617185592651367, "global_step": 603777, "epoch": 7274} {"train_loss": -27.659955978393555, "global_step": 603778, "epoch": 7274} {"train_loss": -27.59437370300293, "global_step": 603779, "epoch": 7274} {"train_loss": -27.767499923706055, "global_step": 603780, "epoch": 7274} {"train_loss": -27.720911026000977, "global_step": 603781, "epoch": 7274} {"train_loss": -28.081314086914062, "global_step": 603782, "epoch": 7274} {"train_loss": -28.0363712310791, "global_step": 603783, "epoch": 7274} {"train_loss": -27.880111694335938, "global_step": 603784, "epoch": 7274} {"train_loss": -27.803937911987305, "global_step": 603785, "epoch": 7274} {"train_loss": -28.08635902404785, "global_step": 603786, "epoch": 7274} {"train_loss": -27.527435302734375, "global_step": 603787, "epoch": 7274} {"train_loss": -27.7174072265625, "global_step": 603788, "epoch": 7274} {"train_loss": -27.88922691345215, "global_step": 603789, "epoch": 7274} {"train_loss": -27.681640625, "global_step": 603790, "epoch": 7274} {"train_loss": -27.770856857299805, "global_step": 603791, "epoch": 7274} {"train_loss": -27.895029067993164, "global_step": 603792, "epoch": 7274} {"train_loss": -27.610565185546875, "global_step": 603793, "epoch": 7274} {"train_loss": -27.63350486755371, "global_step": 603794, "epoch": 7274} {"train_loss": -27.565763473510742, "global_step": 603795, "epoch": 7274} {"train_loss": -28.17245864868164, "global_step": 603796, "epoch": 7274} {"train_loss": -28.410140991210938, "global_step": 603797, "epoch": 7274} {"train_loss": -27.82972526550293, "global_step": 603798, "epoch": 7274} {"train_loss": -28.090290069580078, "global_step": 603799, "epoch": 7274} {"train_loss": -27.885486602783203, "global_step": 603800, "epoch": 7274} {"train_loss": -27.845102310180664, "global_step": 603801, "epoch": 7274} {"train_loss": -27.570566177368164, "global_step": 603802, "epoch": 7274} {"train_loss": -27.6863956451416, "global_step": 603803, "epoch": 7274} {"train_loss": -27.564855575561523, "global_step": 603804, "epoch": 7274} {"train_loss": -27.834299087524414, "global_step": 603805, "epoch": 7274} {"train_loss": -27.586267471313477, "global_step": 603806, "epoch": 7274} {"train_loss": -28.239843368530273, "global_step": 603807, "epoch": 7274} {"train_loss": -27.317768096923828, "global_step": 603808, "epoch": 7274} {"train_loss": -27.886402130126953, "global_step": 603809, "epoch": 7274} {"train_loss": -28.115680694580078, "global_step": 603810, "epoch": 7274} {"train_loss": -27.67645263671875, "global_step": 603811, "epoch": 7274} {"train_loss": -28.32257652282715, "global_step": 603812, "epoch": 7274} {"train_loss": -27.967147827148438, "global_step": 603813, "epoch": 7274} {"train_loss": -28.0634822845459, "global_step": 603814, "epoch": 7274} {"train_loss": -28.123706817626953, "global_step": 603815, "epoch": 7274} {"train_loss": -28.09207534790039, "global_step": 603816, "epoch": 7274} {"train_loss": -27.95496940612793, "global_step": 603817, "epoch": 7274} {"train_loss": -28.3160457611084, "global_step": 603818, "epoch": 7274} {"train_loss": -28.29754066467285, "global_step": 603819, "epoch": 7274} {"train_loss": -28.037189483642578, "global_step": 603820, "epoch": 7274} {"train_loss": -28.45844841003418, "global_step": 603821, "epoch": 7274} {"train_loss": -28.07025718688965, "global_step": 603822, "epoch": 7274} {"train_loss": -28.481481552124023, "global_step": 603823, "epoch": 7274} {"train_loss": -27.38492246420987, "global_step": 603824, "epoch": 7274, "val_loss": 6819588.5} {"train_loss": -27.52760887145996, "global_step": 603825, "epoch": 7275} {"train_loss": -27.89312171936035, "global_step": 603826, "epoch": 7275} {"train_loss": -27.73512840270996, "global_step": 603827, "epoch": 7275} {"train_loss": -28.139135360717773, "global_step": 603828, "epoch": 7275} {"train_loss": -27.92449951171875, "global_step": 603829, "epoch": 7275} {"train_loss": -27.732526779174805, "global_step": 603830, "epoch": 7275} {"train_loss": -27.91438102722168, "global_step": 603831, "epoch": 7275} {"train_loss": -28.450149536132812, "global_step": 603832, "epoch": 7275} {"train_loss": -27.816686630249023, "global_step": 603833, "epoch": 7275} {"train_loss": -27.85474967956543, "global_step": 603834, "epoch": 7275} {"train_loss": -27.756574630737305, "global_step": 603835, "epoch": 7275} {"train_loss": -27.8978214263916, "global_step": 603836, "epoch": 7275} {"train_loss": -27.744672775268555, "global_step": 603837, "epoch": 7275} {"train_loss": -28.19287109375, "global_step": 603838, "epoch": 7275} {"train_loss": -28.1337833404541, "global_step": 603839, "epoch": 7275} {"train_loss": -28.190473556518555, "global_step": 603840, "epoch": 7275} {"train_loss": -28.033252716064453, "global_step": 603841, "epoch": 7275} {"train_loss": -28.096908569335938, "global_step": 603842, "epoch": 7275} {"train_loss": -27.89301109313965, "global_step": 603843, "epoch": 7275} {"train_loss": -27.630151748657227, "global_step": 603844, "epoch": 7275} {"train_loss": -27.639413833618164, "global_step": 603845, "epoch": 7275} {"train_loss": -28.09527015686035, "global_step": 603846, "epoch": 7275} {"train_loss": -27.916461944580078, "global_step": 603847, "epoch": 7275} {"train_loss": -27.971317291259766, "global_step": 603848, "epoch": 7275} {"train_loss": -28.05030632019043, "global_step": 603849, "epoch": 7275} {"train_loss": -27.73687744140625, "global_step": 603850, "epoch": 7275} {"train_loss": -28.039960861206055, "global_step": 603851, "epoch": 7275} {"train_loss": -27.842443466186523, "global_step": 603852, "epoch": 7275} {"train_loss": -28.024396896362305, "global_step": 603853, "epoch": 7275} {"train_loss": -28.106454849243164, "global_step": 603854, "epoch": 7275} {"train_loss": -27.8731689453125, "global_step": 603855, "epoch": 7275} {"train_loss": -28.53790855407715, "global_step": 603856, "epoch": 7275} {"train_loss": -28.35479736328125, "global_step": 603857, "epoch": 7275} {"train_loss": -28.48199462890625, "global_step": 603858, "epoch": 7275} {"train_loss": -28.102527618408203, "global_step": 603859, "epoch": 7275} {"train_loss": -28.064773559570312, "global_step": 603860, "epoch": 7275} {"train_loss": -28.31366539001465, "global_step": 603861, "epoch": 7275} {"train_loss": -28.00162696838379, "global_step": 603862, "epoch": 7275} {"train_loss": -28.288198471069336, "global_step": 603863, "epoch": 7275} {"train_loss": -28.171789169311523, "global_step": 603864, "epoch": 7275} {"train_loss": -27.72455406188965, "global_step": 603865, "epoch": 7275} {"train_loss": -27.96912956237793, "global_step": 603866, "epoch": 7275} {"train_loss": -28.244680404663086, "global_step": 603867, "epoch": 7275} {"train_loss": -28.414518356323242, "global_step": 603868, "epoch": 7275} {"train_loss": -28.19384765625, "global_step": 603869, "epoch": 7275} {"train_loss": -28.238096237182617, "global_step": 603870, "epoch": 7275} {"train_loss": -28.17868423461914, "global_step": 603871, "epoch": 7275} {"train_loss": -28.2916259765625, "global_step": 603872, "epoch": 7275} {"train_loss": -27.821020126342773, "global_step": 603873, "epoch": 7275} {"train_loss": -28.412097930908203, "global_step": 603874, "epoch": 7275} {"train_loss": -28.62017250061035, "global_step": 603875, "epoch": 7275} {"train_loss": -28.311634063720703, "global_step": 603876, "epoch": 7275} {"train_loss": -28.000370025634766, "global_step": 603877, "epoch": 7275} {"train_loss": -27.927703857421875, "global_step": 603878, "epoch": 7275} {"train_loss": -28.026472091674805, "global_step": 603879, "epoch": 7275} {"train_loss": -27.779895782470703, "global_step": 603880, "epoch": 7275} {"train_loss": -28.275297164916992, "global_step": 603881, "epoch": 7275} {"train_loss": -28.176584243774414, "global_step": 603882, "epoch": 7275} {"train_loss": -27.98016357421875, "global_step": 603883, "epoch": 7275} {"train_loss": -28.212488174438477, "global_step": 603884, "epoch": 7275} {"train_loss": -27.963214874267578, "global_step": 603885, "epoch": 7275} {"train_loss": -28.05973243713379, "global_step": 603886, "epoch": 7275} {"train_loss": -28.11028480529785, "global_step": 603887, "epoch": 7275} {"train_loss": -28.270477294921875, "global_step": 603888, "epoch": 7275} {"train_loss": -27.784330368041992, "global_step": 603889, "epoch": 7275} {"train_loss": -27.595874786376953, "global_step": 603890, "epoch": 7275} {"train_loss": -27.857351303100586, "global_step": 603891, "epoch": 7275} {"train_loss": -28.33100700378418, "global_step": 603892, "epoch": 7275} {"train_loss": -27.790185928344727, "global_step": 603893, "epoch": 7275} {"train_loss": -27.72040367126465, "global_step": 603894, "epoch": 7275} {"train_loss": -28.009124755859375, "global_step": 603895, "epoch": 7275} {"train_loss": -27.768896102905273, "global_step": 603896, "epoch": 7275} {"train_loss": -28.14851951599121, "global_step": 603897, "epoch": 7275} {"train_loss": -27.518346786499023, "global_step": 603898, "epoch": 7275} {"train_loss": -28.234106063842773, "global_step": 603899, "epoch": 7275} {"train_loss": -27.593036651611328, "global_step": 603900, "epoch": 7275} {"train_loss": -27.9229793548584, "global_step": 603901, "epoch": 7275} {"train_loss": -28.133718490600586, "global_step": 603902, "epoch": 7275} {"train_loss": -28.016342163085938, "global_step": 603903, "epoch": 7275} {"train_loss": -27.79756736755371, "global_step": 603904, "epoch": 7275} {"train_loss": -27.997289657592773, "global_step": 603905, "epoch": 7275} {"train_loss": -28.215301513671875, "global_step": 603906, "epoch": 7275} {"train_loss": -28.017858872930688, "global_step": 603907, "epoch": 7275, "val_loss": 6887731.0} {"train_loss": -27.634084701538086, "global_step": 603908, "epoch": 7276} {"train_loss": -27.437124252319336, "global_step": 603909, "epoch": 7276} {"train_loss": -27.879531860351562, "global_step": 603910, "epoch": 7276} {"train_loss": -27.774646759033203, "global_step": 603911, "epoch": 7276} {"train_loss": -27.8301944732666, "global_step": 603912, "epoch": 7276} {"train_loss": -27.346500396728516, "global_step": 603913, "epoch": 7276} {"train_loss": -27.485885620117188, "global_step": 603914, "epoch": 7276} {"train_loss": -27.524694442749023, "global_step": 603915, "epoch": 7276} {"train_loss": -28.203283309936523, "global_step": 603916, "epoch": 7276} {"train_loss": -27.613178253173828, "global_step": 603917, "epoch": 7276} {"train_loss": -28.0389461517334, "global_step": 603918, "epoch": 7276} {"train_loss": -27.659650802612305, "global_step": 603919, "epoch": 7276} {"train_loss": -27.974079132080078, "global_step": 603920, "epoch": 7276} {"train_loss": -28.075927734375, "global_step": 603921, "epoch": 7276} {"train_loss": -27.828405380249023, "global_step": 603922, "epoch": 7276} {"train_loss": -27.886981964111328, "global_step": 603923, "epoch": 7276} {"train_loss": -28.044479370117188, "global_step": 603924, "epoch": 7276} {"train_loss": -28.129806518554688, "global_step": 603925, "epoch": 7276} {"train_loss": -27.949865341186523, "global_step": 603926, "epoch": 7276} {"train_loss": -27.87703514099121, "global_step": 603927, "epoch": 7276} {"train_loss": -28.01409912109375, "global_step": 603928, "epoch": 7276} {"train_loss": -28.25310707092285, "global_step": 603929, "epoch": 7276} {"train_loss": -28.42365074157715, "global_step": 603930, "epoch": 7276} {"train_loss": -27.641010284423828, "global_step": 603931, "epoch": 7276} {"train_loss": -27.74390983581543, "global_step": 603932, "epoch": 7276} {"train_loss": -27.795560836791992, "global_step": 603933, "epoch": 7276} {"train_loss": -28.0272216796875, "global_step": 603934, "epoch": 7276} {"train_loss": -28.069629669189453, "global_step": 603935, "epoch": 7276} {"train_loss": -28.04261589050293, "global_step": 603936, "epoch": 7276} {"train_loss": -27.5701847076416, "global_step": 603937, "epoch": 7276} {"train_loss": -28.054264068603516, "global_step": 603938, "epoch": 7276} {"train_loss": -27.926334381103516, "global_step": 603939, "epoch": 7276} {"train_loss": -27.834033966064453, "global_step": 603940, "epoch": 7276} {"train_loss": -28.038654327392578, "global_step": 603941, "epoch": 7276} {"train_loss": -28.23408317565918, "global_step": 603942, "epoch": 7276} {"train_loss": -28.174575805664062, "global_step": 603943, "epoch": 7276} {"train_loss": -28.1933536529541, "global_step": 603944, "epoch": 7276} {"train_loss": -28.106725692749023, "global_step": 603945, "epoch": 7276} {"train_loss": -27.7322940826416, "global_step": 603946, "epoch": 7276} {"train_loss": -27.902353286743164, "global_step": 603947, "epoch": 7276} {"train_loss": -28.256650924682617, "global_step": 603948, "epoch": 7276} {"train_loss": -28.326948165893555, "global_step": 603949, "epoch": 7276} {"train_loss": -27.945886611938477, "global_step": 603950, "epoch": 7276} {"train_loss": -28.16245460510254, "global_step": 603951, "epoch": 7276} {"train_loss": -28.05756187438965, "global_step": 603952, "epoch": 7276} {"train_loss": -28.093835830688477, "global_step": 603953, "epoch": 7276} {"train_loss": -28.21430778503418, "global_step": 603954, "epoch": 7276} {"train_loss": -28.13153076171875, "global_step": 603955, "epoch": 7276} {"train_loss": -28.087980270385742, "global_step": 603956, "epoch": 7276} {"train_loss": -28.1390380859375, "global_step": 603957, "epoch": 7276} {"train_loss": -27.95745277404785, "global_step": 603958, "epoch": 7276} {"train_loss": -27.819583892822266, "global_step": 603959, "epoch": 7276} {"train_loss": -27.906721115112305, "global_step": 603960, "epoch": 7276} {"train_loss": -28.459028244018555, "global_step": 603961, "epoch": 7276} {"train_loss": -28.368927001953125, "global_step": 603962, "epoch": 7276} {"train_loss": -28.20844078063965, "global_step": 603963, "epoch": 7276} {"train_loss": -28.26315689086914, "global_step": 603964, "epoch": 7276} {"train_loss": -28.291339874267578, "global_step": 603965, "epoch": 7276} {"train_loss": -28.049407958984375, "global_step": 603966, "epoch": 7276} {"train_loss": -28.017499923706055, "global_step": 603967, "epoch": 7276} {"train_loss": -28.128223419189453, "global_step": 603968, "epoch": 7276} {"train_loss": -27.960851669311523, "global_step": 603969, "epoch": 7276} {"train_loss": -27.84248161315918, "global_step": 603970, "epoch": 7276} {"train_loss": -28.155170440673828, "global_step": 603971, "epoch": 7276} {"train_loss": -27.7923641204834, "global_step": 603972, "epoch": 7276} {"train_loss": -27.87833595275879, "global_step": 603973, "epoch": 7276} {"train_loss": -28.042499542236328, "global_step": 603974, "epoch": 7276} {"train_loss": -28.491779327392578, "global_step": 603975, "epoch": 7276} {"train_loss": -28.05787467956543, "global_step": 603976, "epoch": 7276} {"train_loss": -28.16193199157715, "global_step": 603977, "epoch": 7276} {"train_loss": -28.010330200195312, "global_step": 603978, "epoch": 7276} {"train_loss": -28.182331085205078, "global_step": 603979, "epoch": 7276} {"train_loss": -28.451984405517578, "global_step": 603980, "epoch": 7276} {"train_loss": -28.146015167236328, "global_step": 603981, "epoch": 7276} {"train_loss": -28.598852157592773, "global_step": 603982, "epoch": 7276} {"train_loss": -28.465009689331055, "global_step": 603983, "epoch": 7276} {"train_loss": -28.461872100830078, "global_step": 603984, "epoch": 7276} {"train_loss": -28.127216339111328, "global_step": 603985, "epoch": 7276} {"train_loss": -28.239429473876953, "global_step": 603986, "epoch": 7276} {"train_loss": -28.101423263549805, "global_step": 603987, "epoch": 7276} {"train_loss": -28.556238174438477, "global_step": 603988, "epoch": 7276} {"train_loss": -28.206716537475586, "global_step": 603989, "epoch": 7276} {"train_loss": -28.059641022280037, "global_step": 603990, "epoch": 7276, "val_loss": 6826507.0} {"train_loss": -28.5772705078125, "global_step": 603991, "epoch": 7277} {"train_loss": -28.24806022644043, "global_step": 603992, "epoch": 7277} {"train_loss": -28.208398818969727, "global_step": 603993, "epoch": 7277} {"train_loss": -28.127782821655273, "global_step": 603994, "epoch": 7277} {"train_loss": -28.051523208618164, "global_step": 603995, "epoch": 7277} {"train_loss": -28.105016708374023, "global_step": 603996, "epoch": 7277} {"train_loss": -28.081043243408203, "global_step": 603997, "epoch": 7277} {"train_loss": -27.993589401245117, "global_step": 603998, "epoch": 7277} {"train_loss": -27.720752716064453, "global_step": 603999, "epoch": 7277} {"train_loss": -27.78717041015625, "global_step": 604000, "epoch": 7277} {"train_loss": -27.612869262695312, "global_step": 604001, "epoch": 7277} {"train_loss": -26.536727905273438, "global_step": 604002, "epoch": 7277} {"train_loss": -26.167150497436523, "global_step": 604003, "epoch": 7277} {"train_loss": -26.63409996032715, "global_step": 604004, "epoch": 7277} {"train_loss": -28.067188262939453, "global_step": 604005, "epoch": 7277} {"train_loss": -26.649564743041992, "global_step": 604006, "epoch": 7277} {"train_loss": -27.71534538269043, "global_step": 604007, "epoch": 7277} {"train_loss": -27.29060173034668, "global_step": 604008, "epoch": 7277} {"train_loss": -27.972314834594727, "global_step": 604009, "epoch": 7277} {"train_loss": -27.501495361328125, "global_step": 604010, "epoch": 7277} {"train_loss": -27.845355987548828, "global_step": 604011, "epoch": 7277} {"train_loss": -27.349897384643555, "global_step": 604012, "epoch": 7277} {"train_loss": -27.6004638671875, "global_step": 604013, "epoch": 7277} {"train_loss": -27.348718643188477, "global_step": 604014, "epoch": 7277} {"train_loss": -27.616287231445312, "global_step": 604015, "epoch": 7277} {"train_loss": -27.70574951171875, "global_step": 604016, "epoch": 7277} {"train_loss": -27.079965591430664, "global_step": 604017, "epoch": 7277} {"train_loss": -27.724035263061523, "global_step": 604018, "epoch": 7277} {"train_loss": -28.1900634765625, "global_step": 604019, "epoch": 7277} {"train_loss": -27.908750534057617, "global_step": 604020, "epoch": 7277} {"train_loss": -28.032012939453125, "global_step": 604021, "epoch": 7277} {"train_loss": -28.090087890625, "global_step": 604022, "epoch": 7277} {"train_loss": -27.69437599182129, "global_step": 604023, "epoch": 7277} {"train_loss": -28.02374839782715, "global_step": 604024, "epoch": 7277} {"train_loss": -27.890966415405273, "global_step": 604025, "epoch": 7277} {"train_loss": -27.721227645874023, "global_step": 604026, "epoch": 7277} {"train_loss": -28.096515655517578, "global_step": 604027, "epoch": 7277} {"train_loss": -28.097808837890625, "global_step": 604028, "epoch": 7277} {"train_loss": -27.773818969726562, "global_step": 604029, "epoch": 7277} {"train_loss": -27.885650634765625, "global_step": 604030, "epoch": 7277} {"train_loss": -28.062774658203125, "global_step": 604031, "epoch": 7277} {"train_loss": -27.858627319335938, "global_step": 604032, "epoch": 7277} {"train_loss": -28.3829345703125, "global_step": 604033, "epoch": 7277} {"train_loss": -28.203357696533203, "global_step": 604034, "epoch": 7277} {"train_loss": -28.276309967041016, "global_step": 604035, "epoch": 7277} {"train_loss": -27.936765670776367, "global_step": 604036, "epoch": 7277} {"train_loss": -28.063343048095703, "global_step": 604037, "epoch": 7277} {"train_loss": -27.9396915435791, "global_step": 604038, "epoch": 7277} {"train_loss": -27.911279678344727, "global_step": 604039, "epoch": 7277} {"train_loss": -27.993209838867188, "global_step": 604040, "epoch": 7277} {"train_loss": -27.70228385925293, "global_step": 604041, "epoch": 7277} {"train_loss": -27.990985870361328, "global_step": 604042, "epoch": 7277} {"train_loss": -28.27777099609375, "global_step": 604043, "epoch": 7277} {"train_loss": -28.082141876220703, "global_step": 604044, "epoch": 7277} {"train_loss": -28.23811149597168, "global_step": 604045, "epoch": 7277} {"train_loss": -28.282794952392578, "global_step": 604046, "epoch": 7277} {"train_loss": -28.16575050354004, "global_step": 604047, "epoch": 7277} {"train_loss": -28.111434936523438, "global_step": 604048, "epoch": 7277} {"train_loss": -28.28570556640625, "global_step": 604049, "epoch": 7277} {"train_loss": -28.091094970703125, "global_step": 604050, "epoch": 7277} {"train_loss": -28.1013240814209, "global_step": 604051, "epoch": 7277} {"train_loss": -27.966888427734375, "global_step": 604052, "epoch": 7277} {"train_loss": -28.22055435180664, "global_step": 604053, "epoch": 7277} {"train_loss": -28.20969009399414, "global_step": 604054, "epoch": 7277} {"train_loss": -28.464435577392578, "global_step": 604055, "epoch": 7277} {"train_loss": -27.99493408203125, "global_step": 604056, "epoch": 7277} {"train_loss": -28.351993560791016, "global_step": 604057, "epoch": 7277} {"train_loss": -28.198699951171875, "global_step": 604058, "epoch": 7277} {"train_loss": -28.203123092651367, "global_step": 604059, "epoch": 7277} {"train_loss": -27.9403076171875, "global_step": 604060, "epoch": 7277} {"train_loss": -28.4153995513916, "global_step": 604061, "epoch": 7277} {"train_loss": -28.289081573486328, "global_step": 604062, "epoch": 7277} {"train_loss": -28.051488876342773, "global_step": 604063, "epoch": 7277} {"train_loss": -28.4246768951416, "global_step": 604064, "epoch": 7277} {"train_loss": -28.19532585144043, "global_step": 604065, "epoch": 7277} {"train_loss": -27.91253662109375, "global_step": 604066, "epoch": 7277} {"train_loss": -27.582019805908203, "global_step": 604067, "epoch": 7277} {"train_loss": -27.704010009765625, "global_step": 604068, "epoch": 7277} {"train_loss": -28.15778160095215, "global_step": 604069, "epoch": 7277} {"train_loss": -28.046682357788086, "global_step": 604070, "epoch": 7277} {"train_loss": -27.713483810424805, "global_step": 604071, "epoch": 7277} {"train_loss": -28.104873657226562, "global_step": 604072, "epoch": 7277} {"train_loss": -27.906089920595466, "global_step": 604073, "epoch": 7277, "val_loss": 6877680.0} {"train_loss": -27.415515899658203, "global_step": 604074, "epoch": 7278} {"train_loss": -27.43548583984375, "global_step": 604075, "epoch": 7278} {"train_loss": -27.762771606445312, "global_step": 604076, "epoch": 7278} {"train_loss": -27.999486923217773, "global_step": 604077, "epoch": 7278} {"train_loss": -27.358551025390625, "global_step": 604078, "epoch": 7278} {"train_loss": -27.267383575439453, "global_step": 604079, "epoch": 7278} {"train_loss": -27.355863571166992, "global_step": 604080, "epoch": 7278} {"train_loss": -27.47357749938965, "global_step": 604081, "epoch": 7278} {"train_loss": -27.977832794189453, "global_step": 604082, "epoch": 7278} {"train_loss": -27.434900283813477, "global_step": 604083, "epoch": 7278} {"train_loss": -27.491186141967773, "global_step": 604084, "epoch": 7278} {"train_loss": -27.67111587524414, "global_step": 604085, "epoch": 7278} {"train_loss": -27.548233032226562, "global_step": 604086, "epoch": 7278} {"train_loss": -27.917566299438477, "global_step": 604087, "epoch": 7278} {"train_loss": -27.4448184967041, "global_step": 604088, "epoch": 7278} {"train_loss": -27.647785186767578, "global_step": 604089, "epoch": 7278} {"train_loss": -27.468469619750977, "global_step": 604090, "epoch": 7278} {"train_loss": -27.572660446166992, "global_step": 604091, "epoch": 7278} {"train_loss": -27.807632446289062, "global_step": 604092, "epoch": 7278} {"train_loss": -27.388513565063477, "global_step": 604093, "epoch": 7278} {"train_loss": -27.835439682006836, "global_step": 604094, "epoch": 7278} {"train_loss": -27.48797607421875, "global_step": 604095, "epoch": 7278} {"train_loss": -27.871023178100586, "global_step": 604096, "epoch": 7278} {"train_loss": -27.36178970336914, "global_step": 604097, "epoch": 7278} {"train_loss": -27.45728874206543, "global_step": 604098, "epoch": 7278} {"train_loss": -27.987390518188477, "global_step": 604099, "epoch": 7278} {"train_loss": -27.96314811706543, "global_step": 604100, "epoch": 7278} {"train_loss": -27.918542861938477, "global_step": 604101, "epoch": 7278} {"train_loss": -28.05525016784668, "global_step": 604102, "epoch": 7278} {"train_loss": -28.42095947265625, "global_step": 604103, "epoch": 7278} {"train_loss": -27.988622665405273, "global_step": 604104, "epoch": 7278} {"train_loss": -27.888565063476562, "global_step": 604105, "epoch": 7278} {"train_loss": -27.776172637939453, "global_step": 604106, "epoch": 7278} {"train_loss": -27.77931785583496, "global_step": 604107, "epoch": 7278} {"train_loss": -27.700429916381836, "global_step": 604108, "epoch": 7278} {"train_loss": -27.85141944885254, "global_step": 604109, "epoch": 7278} {"train_loss": -28.371313095092773, "global_step": 604110, "epoch": 7278} {"train_loss": -27.6547908782959, "global_step": 604111, "epoch": 7278} {"train_loss": -27.634733200073242, "global_step": 604112, "epoch": 7278} {"train_loss": -27.9432315826416, "global_step": 604113, "epoch": 7278} {"train_loss": -28.14597511291504, "global_step": 604114, "epoch": 7278} {"train_loss": -28.311246871948242, "global_step": 604115, "epoch": 7278} {"train_loss": -27.883291244506836, "global_step": 604116, "epoch": 7278} {"train_loss": -28.205289840698242, "global_step": 604117, "epoch": 7278} {"train_loss": -28.033863067626953, "global_step": 604118, "epoch": 7278} {"train_loss": -28.119421005249023, "global_step": 604119, "epoch": 7278} {"train_loss": -28.275394439697266, "global_step": 604120, "epoch": 7278} {"train_loss": -28.250324249267578, "global_step": 604121, "epoch": 7278} {"train_loss": -27.951093673706055, "global_step": 604122, "epoch": 7278} {"train_loss": -28.261438369750977, "global_step": 604123, "epoch": 7278} {"train_loss": -28.24798583984375, "global_step": 604124, "epoch": 7278} {"train_loss": -28.405517578125, "global_step": 604125, "epoch": 7278} {"train_loss": -28.407499313354492, "global_step": 604126, "epoch": 7278} {"train_loss": -28.31635856628418, "global_step": 604127, "epoch": 7278} {"train_loss": -27.89435386657715, "global_step": 604128, "epoch": 7278} {"train_loss": -28.0329647064209, "global_step": 604129, "epoch": 7278} {"train_loss": -28.498504638671875, "global_step": 604130, "epoch": 7278} {"train_loss": -27.971643447875977, "global_step": 604131, "epoch": 7278} {"train_loss": -28.020788192749023, "global_step": 604132, "epoch": 7278} {"train_loss": -28.168485641479492, "global_step": 604133, "epoch": 7278} {"train_loss": -28.053781509399414, "global_step": 604134, "epoch": 7278} {"train_loss": -28.377599716186523, "global_step": 604135, "epoch": 7278} {"train_loss": -28.120498657226562, "global_step": 604136, "epoch": 7278} {"train_loss": -28.554309844970703, "global_step": 604137, "epoch": 7278} {"train_loss": -28.18366813659668, "global_step": 604138, "epoch": 7278} {"train_loss": -27.83380126953125, "global_step": 604139, "epoch": 7278} {"train_loss": -27.7558650970459, "global_step": 604140, "epoch": 7278} {"train_loss": -28.178909301757812, "global_step": 604141, "epoch": 7278} {"train_loss": -28.105030059814453, "global_step": 604142, "epoch": 7278} {"train_loss": -27.875049591064453, "global_step": 604143, "epoch": 7278} {"train_loss": -27.947101593017578, "global_step": 604144, "epoch": 7278} {"train_loss": -28.150720596313477, "global_step": 604145, "epoch": 7278} {"train_loss": -27.909711837768555, "global_step": 604146, "epoch": 7278} {"train_loss": -28.00272560119629, "global_step": 604147, "epoch": 7278} {"train_loss": -28.27663230895996, "global_step": 604148, "epoch": 7278} {"train_loss": -28.232620239257812, "global_step": 604149, "epoch": 7278} {"train_loss": -28.046619415283203, "global_step": 604150, "epoch": 7278} {"train_loss": -28.09867286682129, "global_step": 604151, "epoch": 7278} {"train_loss": -27.952672958374023, "global_step": 604152, "epoch": 7278} {"train_loss": -27.906970977783203, "global_step": 604153, "epoch": 7278} {"train_loss": -27.973560333251953, "global_step": 604154, "epoch": 7278} {"train_loss": -27.978296279907227, "global_step": 604155, "epoch": 7278} {"train_loss": -27.912027404968995, "global_step": 604156, "epoch": 7278, "val_loss": 6847658.0} {"train_loss": -28.07208824157715, "global_step": 604157, "epoch": 7279} {"train_loss": -27.727752685546875, "global_step": 604158, "epoch": 7279} {"train_loss": -27.51175308227539, "global_step": 604159, "epoch": 7279} {"train_loss": -27.752548217773438, "global_step": 604160, "epoch": 7279} {"train_loss": -27.912076950073242, "global_step": 604161, "epoch": 7279} {"train_loss": -27.98872184753418, "global_step": 604162, "epoch": 7279} {"train_loss": -27.706714630126953, "global_step": 604163, "epoch": 7279} {"train_loss": -27.832199096679688, "global_step": 604164, "epoch": 7279} {"train_loss": -27.929901123046875, "global_step": 604165, "epoch": 7279} {"train_loss": -27.879806518554688, "global_step": 604166, "epoch": 7279} {"train_loss": -27.75994300842285, "global_step": 604167, "epoch": 7279} {"train_loss": -28.048248291015625, "global_step": 604168, "epoch": 7279} {"train_loss": -27.608692169189453, "global_step": 604169, "epoch": 7279} {"train_loss": -27.710514068603516, "global_step": 604170, "epoch": 7279} {"train_loss": -28.187088012695312, "global_step": 604171, "epoch": 7279} {"train_loss": -27.8145809173584, "global_step": 604172, "epoch": 7279} {"train_loss": -28.136579513549805, "global_step": 604173, "epoch": 7279} {"train_loss": -27.95538330078125, "global_step": 604174, "epoch": 7279} {"train_loss": -28.12057876586914, "global_step": 604175, "epoch": 7279} {"train_loss": -28.111236572265625, "global_step": 604176, "epoch": 7279} {"train_loss": -27.733734130859375, "global_step": 604177, "epoch": 7279} {"train_loss": -27.884082794189453, "global_step": 604178, "epoch": 7279} {"train_loss": -27.7426700592041, "global_step": 604179, "epoch": 7279} {"train_loss": -27.617938995361328, "global_step": 604180, "epoch": 7279} {"train_loss": -27.75770378112793, "global_step": 604181, "epoch": 7279} {"train_loss": -27.5338077545166, "global_step": 604182, "epoch": 7279} {"train_loss": -27.86649513244629, "global_step": 604183, "epoch": 7279} {"train_loss": -27.99102783203125, "global_step": 604184, "epoch": 7279} {"train_loss": -27.95947265625, "global_step": 604185, "epoch": 7279} {"train_loss": -27.650360107421875, "global_step": 604186, "epoch": 7279} {"train_loss": -27.955469131469727, "global_step": 604187, "epoch": 7279} {"train_loss": -27.914630889892578, "global_step": 604188, "epoch": 7279} {"train_loss": -27.917938232421875, "global_step": 604189, "epoch": 7279} {"train_loss": -27.632841110229492, "global_step": 604190, "epoch": 7279} {"train_loss": -27.946313858032227, "global_step": 604191, "epoch": 7279} {"train_loss": -27.6798038482666, "global_step": 604192, "epoch": 7279} {"train_loss": -28.0208740234375, "global_step": 604193, "epoch": 7279} {"train_loss": -28.01373291015625, "global_step": 604194, "epoch": 7279} {"train_loss": -28.07452392578125, "global_step": 604195, "epoch": 7279} {"train_loss": -27.91083335876465, "global_step": 604196, "epoch": 7279} {"train_loss": -28.070602416992188, "global_step": 604197, "epoch": 7279} {"train_loss": -27.917585372924805, "global_step": 604198, "epoch": 7279} {"train_loss": -27.948400497436523, "global_step": 604199, "epoch": 7279} {"train_loss": -28.293975830078125, "global_step": 604200, "epoch": 7279} {"train_loss": -28.12928581237793, "global_step": 604201, "epoch": 7279} {"train_loss": -27.967437744140625, "global_step": 604202, "epoch": 7279} {"train_loss": -28.115665435791016, "global_step": 604203, "epoch": 7279} {"train_loss": -28.21420669555664, "global_step": 604204, "epoch": 7279} {"train_loss": -28.12421226501465, "global_step": 604205, "epoch": 7279} {"train_loss": -28.40106201171875, "global_step": 604206, "epoch": 7279} {"train_loss": -28.278242111206055, "global_step": 604207, "epoch": 7279} {"train_loss": -28.08172035217285, "global_step": 604208, "epoch": 7279} {"train_loss": -28.259632110595703, "global_step": 604209, "epoch": 7279} {"train_loss": -28.395307540893555, "global_step": 604210, "epoch": 7279} {"train_loss": -28.325592041015625, "global_step": 604211, "epoch": 7279} {"train_loss": -28.26787757873535, "global_step": 604212, "epoch": 7279} {"train_loss": -28.24069595336914, "global_step": 604213, "epoch": 7279} {"train_loss": -28.123071670532227, "global_step": 604214, "epoch": 7279} {"train_loss": -28.052820205688477, "global_step": 604215, "epoch": 7279} {"train_loss": -28.183969497680664, "global_step": 604216, "epoch": 7279} {"train_loss": -27.608469009399414, "global_step": 604217, "epoch": 7279} {"train_loss": -26.740339279174805, "global_step": 604218, "epoch": 7279} {"train_loss": -25.61494255065918, "global_step": 604219, "epoch": 7279} {"train_loss": -27.055164337158203, "global_step": 604220, "epoch": 7279} {"train_loss": -27.845169067382812, "global_step": 604221, "epoch": 7279} {"train_loss": -27.44264793395996, "global_step": 604222, "epoch": 7279} {"train_loss": -27.64351463317871, "global_step": 604223, "epoch": 7279} {"train_loss": -27.630950927734375, "global_step": 604224, "epoch": 7279} {"train_loss": -27.78938102722168, "global_step": 604225, "epoch": 7279} {"train_loss": -27.7608699798584, "global_step": 604226, "epoch": 7279} {"train_loss": -27.85013771057129, "global_step": 604227, "epoch": 7279} {"train_loss": -27.673181533813477, "global_step": 604228, "epoch": 7279} {"train_loss": -28.1146240234375, "global_step": 604229, "epoch": 7279} {"train_loss": -27.988784790039062, "global_step": 604230, "epoch": 7279} {"train_loss": -27.757551193237305, "global_step": 604231, "epoch": 7279} {"train_loss": -27.779138565063477, "global_step": 604232, "epoch": 7279} {"train_loss": -27.88934898376465, "global_step": 604233, "epoch": 7279} {"train_loss": -27.998144149780273, "global_step": 604234, "epoch": 7279} {"train_loss": -28.075347900390625, "global_step": 604235, "epoch": 7279} {"train_loss": -27.523534774780273, "global_step": 604236, "epoch": 7279} {"train_loss": -28.25542640686035, "global_step": 604237, "epoch": 7279} {"train_loss": -27.681241989135742, "global_step": 604238, "epoch": 7279} {"train_loss": -27.874665271804993, "global_step": 604239, "epoch": 7279, "val_loss": 6909485.0} {"train_loss": -27.483182907104492, "global_step": 604240, "epoch": 7280} {"train_loss": -27.405807495117188, "global_step": 604241, "epoch": 7280} {"train_loss": -27.35615348815918, "global_step": 604242, "epoch": 7280} {"train_loss": -26.879535675048828, "global_step": 604243, "epoch": 7280} {"train_loss": -26.950525283813477, "global_step": 604244, "epoch": 7280} {"train_loss": -27.020654678344727, "global_step": 604245, "epoch": 7280} {"train_loss": -27.440052032470703, "global_step": 604246, "epoch": 7280} {"train_loss": -27.059961318969727, "global_step": 604247, "epoch": 7280} {"train_loss": -27.46063232421875, "global_step": 604248, "epoch": 7280} {"train_loss": -27.325611114501953, "global_step": 604249, "epoch": 7280} {"train_loss": -27.81168556213379, "global_step": 604250, "epoch": 7280} {"train_loss": -27.514862060546875, "global_step": 604251, "epoch": 7280} {"train_loss": -27.732099533081055, "global_step": 604252, "epoch": 7280} {"train_loss": -27.53140640258789, "global_step": 604253, "epoch": 7280} {"train_loss": -27.821760177612305, "global_step": 604254, "epoch": 7280} {"train_loss": -27.56361198425293, "global_step": 604255, "epoch": 7280} {"train_loss": -28.021299362182617, "global_step": 604256, "epoch": 7280} {"train_loss": -28.125904083251953, "global_step": 604257, "epoch": 7280} {"train_loss": -27.858530044555664, "global_step": 604258, "epoch": 7280} {"train_loss": -27.82648277282715, "global_step": 604259, "epoch": 7280} {"train_loss": -27.808063507080078, "global_step": 604260, "epoch": 7280} {"train_loss": -27.721328735351562, "global_step": 604261, "epoch": 7280} {"train_loss": -27.63490867614746, "global_step": 604262, "epoch": 7280} {"train_loss": -27.490530014038086, "global_step": 604263, "epoch": 7280} {"train_loss": -27.84998893737793, "global_step": 604264, "epoch": 7280} {"train_loss": -27.90730857849121, "global_step": 604265, "epoch": 7280} {"train_loss": -28.05183982849121, "global_step": 604266, "epoch": 7280} {"train_loss": -27.938146591186523, "global_step": 604267, "epoch": 7280} {"train_loss": -28.2065486907959, "global_step": 604268, "epoch": 7280} {"train_loss": -28.25433921813965, "global_step": 604269, "epoch": 7280} {"train_loss": -27.886199951171875, "global_step": 604270, "epoch": 7280} {"train_loss": -27.944202423095703, "global_step": 604271, "epoch": 7280} {"train_loss": -28.123498916625977, "global_step": 604272, "epoch": 7280} {"train_loss": -27.753284454345703, "global_step": 604273, "epoch": 7280} {"train_loss": -27.700977325439453, "global_step": 604274, "epoch": 7280} {"train_loss": -28.057920455932617, "global_step": 604275, "epoch": 7280} {"train_loss": -28.273273468017578, "global_step": 604276, "epoch": 7280} {"train_loss": -28.217870712280273, "global_step": 604277, "epoch": 7280} {"train_loss": -28.066186904907227, "global_step": 604278, "epoch": 7280} {"train_loss": -27.952585220336914, "global_step": 604279, "epoch": 7280} {"train_loss": -27.920652389526367, "global_step": 604280, "epoch": 7280} {"train_loss": -27.894201278686523, "global_step": 604281, "epoch": 7280} {"train_loss": -28.586048126220703, "global_step": 604282, "epoch": 7280} {"train_loss": -27.94980239868164, "global_step": 604283, "epoch": 7280} {"train_loss": -28.024633407592773, "global_step": 604284, "epoch": 7280} {"train_loss": -27.954431533813477, "global_step": 604285, "epoch": 7280} {"train_loss": -28.00174903869629, "global_step": 604286, "epoch": 7280} {"train_loss": -28.405963897705078, "global_step": 604287, "epoch": 7280} {"train_loss": -28.082014083862305, "global_step": 604288, "epoch": 7280} {"train_loss": -28.322492599487305, "global_step": 604289, "epoch": 7280} {"train_loss": -28.384374618530273, "global_step": 604290, "epoch": 7280} {"train_loss": -28.144948959350586, "global_step": 604291, "epoch": 7280} {"train_loss": -27.933887481689453, "global_step": 604292, "epoch": 7280} {"train_loss": -28.480243682861328, "global_step": 604293, "epoch": 7280} {"train_loss": -27.986459732055664, "global_step": 604294, "epoch": 7280} {"train_loss": -28.45224380493164, "global_step": 604295, "epoch": 7280} {"train_loss": -28.4917049407959, "global_step": 604296, "epoch": 7280} {"train_loss": -27.7360897064209, "global_step": 604297, "epoch": 7280} {"train_loss": -28.298643112182617, "global_step": 604298, "epoch": 7280} {"train_loss": -27.998828887939453, "global_step": 604299, "epoch": 7280} {"train_loss": -27.91888427734375, "global_step": 604300, "epoch": 7280} {"train_loss": -27.96644401550293, "global_step": 604301, "epoch": 7280} {"train_loss": -28.149982452392578, "global_step": 604302, "epoch": 7280} {"train_loss": -28.44696044921875, "global_step": 604303, "epoch": 7280} {"train_loss": -28.22406005859375, "global_step": 604304, "epoch": 7280} {"train_loss": -27.849451065063477, "global_step": 604305, "epoch": 7280} {"train_loss": -27.65802001953125, "global_step": 604306, "epoch": 7280} {"train_loss": -27.881799697875977, "global_step": 604307, "epoch": 7280} {"train_loss": -27.892057418823242, "global_step": 604308, "epoch": 7280} {"train_loss": -28.459070205688477, "global_step": 604309, "epoch": 7280} {"train_loss": -28.588104248046875, "global_step": 604310, "epoch": 7280} {"train_loss": -28.145893096923828, "global_step": 604311, "epoch": 7280} {"train_loss": -27.923828125, "global_step": 604312, "epoch": 7280} {"train_loss": -28.11958122253418, "global_step": 604313, "epoch": 7280} {"train_loss": -28.51152992248535, "global_step": 604314, "epoch": 7280} {"train_loss": -28.55938720703125, "global_step": 604315, "epoch": 7280} {"train_loss": -28.207727432250977, "global_step": 604316, "epoch": 7280} {"train_loss": -28.110410690307617, "global_step": 604317, "epoch": 7280} {"train_loss": -28.236173629760742, "global_step": 604318, "epoch": 7280} {"train_loss": -28.377410888671875, "global_step": 604319, "epoch": 7280} {"train_loss": -28.61871910095215, "global_step": 604320, "epoch": 7280} {"train_loss": -28.682172775268555, "global_step": 604321, "epoch": 7280} {"train_loss": -27.951938927891742, "global_step": 604322, "epoch": 7280, "val_loss": 6843716.0} {"train_loss": -27.942514419555664, "global_step": 604323, "epoch": 7281} {"train_loss": -27.507568359375, "global_step": 604324, "epoch": 7281} {"train_loss": -26.902952194213867, "global_step": 604325, "epoch": 7281} {"train_loss": -27.211658477783203, "global_step": 604326, "epoch": 7281} {"train_loss": -27.873260498046875, "global_step": 604327, "epoch": 7281} {"train_loss": -27.479633331298828, "global_step": 604328, "epoch": 7281} {"train_loss": -27.653778076171875, "global_step": 604329, "epoch": 7281} {"train_loss": -27.380435943603516, "global_step": 604330, "epoch": 7281} {"train_loss": -27.620746612548828, "global_step": 604331, "epoch": 7281} {"train_loss": -27.0022029876709, "global_step": 604332, "epoch": 7281} {"train_loss": -27.577482223510742, "global_step": 604333, "epoch": 7281} {"train_loss": -27.3470458984375, "global_step": 604334, "epoch": 7281} {"train_loss": -27.746734619140625, "global_step": 604335, "epoch": 7281} {"train_loss": -27.70938491821289, "global_step": 604336, "epoch": 7281} {"train_loss": -27.87274742126465, "global_step": 604337, "epoch": 7281} {"train_loss": -27.76917839050293, "global_step": 604338, "epoch": 7281} {"train_loss": -27.74049186706543, "global_step": 604339, "epoch": 7281} {"train_loss": -28.00030517578125, "global_step": 604340, "epoch": 7281} {"train_loss": -27.89223289489746, "global_step": 604341, "epoch": 7281} {"train_loss": -27.682950973510742, "global_step": 604342, "epoch": 7281} {"train_loss": -27.406494140625, "global_step": 604343, "epoch": 7281} {"train_loss": -27.831256866455078, "global_step": 604344, "epoch": 7281} {"train_loss": -27.95684814453125, "global_step": 604345, "epoch": 7281} {"train_loss": -27.78757095336914, "global_step": 604346, "epoch": 7281} {"train_loss": -27.657440185546875, "global_step": 604347, "epoch": 7281} {"train_loss": -27.740955352783203, "global_step": 604348, "epoch": 7281} {"train_loss": -28.0570068359375, "global_step": 604349, "epoch": 7281} {"train_loss": -27.83319091796875, "global_step": 604350, "epoch": 7281} {"train_loss": -28.174091339111328, "global_step": 604351, "epoch": 7281} {"train_loss": -27.808868408203125, "global_step": 604352, "epoch": 7281} {"train_loss": -28.330184936523438, "global_step": 604353, "epoch": 7281} {"train_loss": -27.979877471923828, "global_step": 604354, "epoch": 7281} {"train_loss": -28.05975914001465, "global_step": 604355, "epoch": 7281} {"train_loss": -27.613821029663086, "global_step": 604356, "epoch": 7281} {"train_loss": -28.182409286499023, "global_step": 604357, "epoch": 7281} {"train_loss": -28.05153465270996, "global_step": 604358, "epoch": 7281} {"train_loss": -28.325870513916016, "global_step": 604359, "epoch": 7281} {"train_loss": -28.142316818237305, "global_step": 604360, "epoch": 7281} {"train_loss": -27.620925903320312, "global_step": 604361, "epoch": 7281} {"train_loss": -27.7977294921875, "global_step": 604362, "epoch": 7281} {"train_loss": -27.64198875427246, "global_step": 604363, "epoch": 7281} {"train_loss": -28.253677368164062, "global_step": 604364, "epoch": 7281} {"train_loss": -28.15565299987793, "global_step": 604365, "epoch": 7281} {"train_loss": -27.82840347290039, "global_step": 604366, "epoch": 7281} {"train_loss": -27.622791290283203, "global_step": 604367, "epoch": 7281} {"train_loss": -27.861392974853516, "global_step": 604368, "epoch": 7281} {"train_loss": -28.26755714416504, "global_step": 604369, "epoch": 7281} {"train_loss": -27.479475021362305, "global_step": 604370, "epoch": 7281} {"train_loss": -27.744604110717773, "global_step": 604371, "epoch": 7281} {"train_loss": -28.133214950561523, "global_step": 604372, "epoch": 7281} {"train_loss": -27.995471954345703, "global_step": 604373, "epoch": 7281} {"train_loss": -28.031494140625, "global_step": 604374, "epoch": 7281} {"train_loss": -28.254419326782227, "global_step": 604375, "epoch": 7281} {"train_loss": -27.901294708251953, "global_step": 604376, "epoch": 7281} {"train_loss": -27.86063003540039, "global_step": 604377, "epoch": 7281} {"train_loss": -27.914371490478516, "global_step": 604378, "epoch": 7281} {"train_loss": -27.835500717163086, "global_step": 604379, "epoch": 7281} {"train_loss": -28.209028244018555, "global_step": 604380, "epoch": 7281} {"train_loss": -28.20289421081543, "global_step": 604381, "epoch": 7281} {"train_loss": -27.55499267578125, "global_step": 604382, "epoch": 7281} {"train_loss": -28.25482177734375, "global_step": 604383, "epoch": 7281} {"train_loss": -27.78998374938965, "global_step": 604384, "epoch": 7281} {"train_loss": -27.622961044311523, "global_step": 604385, "epoch": 7281} {"train_loss": -27.68781852722168, "global_step": 604386, "epoch": 7281} {"train_loss": -28.193517684936523, "global_step": 604387, "epoch": 7281} {"train_loss": -27.959394454956055, "global_step": 604388, "epoch": 7281} {"train_loss": -27.306964874267578, "global_step": 604389, "epoch": 7281} {"train_loss": -27.91632080078125, "global_step": 604390, "epoch": 7281} {"train_loss": -27.93365478515625, "global_step": 604391, "epoch": 7281} {"train_loss": -27.8944034576416, "global_step": 604392, "epoch": 7281} {"train_loss": -28.37571144104004, "global_step": 604393, "epoch": 7281} {"train_loss": -28.176380157470703, "global_step": 604394, "epoch": 7281} {"train_loss": -28.057703018188477, "global_step": 604395, "epoch": 7281} {"train_loss": -27.945220947265625, "global_step": 604396, "epoch": 7281} {"train_loss": -27.758771896362305, "global_step": 604397, "epoch": 7281} {"train_loss": -28.18096351623535, "global_step": 604398, "epoch": 7281} {"train_loss": -28.20118522644043, "global_step": 604399, "epoch": 7281} {"train_loss": -28.280248641967773, "global_step": 604400, "epoch": 7281} {"train_loss": -28.040454864501953, "global_step": 604401, "epoch": 7281} {"train_loss": -28.042749404907227, "global_step": 604402, "epoch": 7281} {"train_loss": -28.018310546875, "global_step": 604403, "epoch": 7281} {"train_loss": -27.958465576171875, "global_step": 604404, "epoch": 7281} {"train_loss": -27.874743220317793, "global_step": 604405, "epoch": 7281, "val_loss": 6815502.5} {"train_loss": -26.979827880859375, "global_step": 604406, "epoch": 7282} {"train_loss": -27.492385864257812, "global_step": 604407, "epoch": 7282} {"train_loss": -27.293405532836914, "global_step": 604408, "epoch": 7282} {"train_loss": -27.522663116455078, "global_step": 604409, "epoch": 7282} {"train_loss": -27.452245712280273, "global_step": 604410, "epoch": 7282} {"train_loss": -28.039899826049805, "global_step": 604411, "epoch": 7282} {"train_loss": -27.52507972717285, "global_step": 604412, "epoch": 7282} {"train_loss": -27.563440322875977, "global_step": 604413, "epoch": 7282} {"train_loss": -27.63441276550293, "global_step": 604414, "epoch": 7282} {"train_loss": -27.835372924804688, "global_step": 604415, "epoch": 7282} {"train_loss": -27.798486709594727, "global_step": 604416, "epoch": 7282} {"train_loss": -28.156660079956055, "global_step": 604417, "epoch": 7282} {"train_loss": -27.92286491394043, "global_step": 604418, "epoch": 7282} {"train_loss": -27.854406356811523, "global_step": 604419, "epoch": 7282} {"train_loss": -27.692153930664062, "global_step": 604420, "epoch": 7282} {"train_loss": -27.907180786132812, "global_step": 604421, "epoch": 7282} {"train_loss": -27.995269775390625, "global_step": 604422, "epoch": 7282} {"train_loss": -28.158740997314453, "global_step": 604423, "epoch": 7282} {"train_loss": -28.008716583251953, "global_step": 604424, "epoch": 7282} {"train_loss": -28.06406593322754, "global_step": 604425, "epoch": 7282} {"train_loss": -28.259031295776367, "global_step": 604426, "epoch": 7282} {"train_loss": -28.086994171142578, "global_step": 604427, "epoch": 7282} {"train_loss": -27.645490646362305, "global_step": 604428, "epoch": 7282} {"train_loss": -27.820688247680664, "global_step": 604429, "epoch": 7282} {"train_loss": -27.758453369140625, "global_step": 604430, "epoch": 7282} {"train_loss": -27.442678451538086, "global_step": 604431, "epoch": 7282} {"train_loss": -27.879135131835938, "global_step": 604432, "epoch": 7282} {"train_loss": -27.869245529174805, "global_step": 604433, "epoch": 7282} {"train_loss": -28.317358016967773, "global_step": 604434, "epoch": 7282} {"train_loss": -28.440433502197266, "global_step": 604435, "epoch": 7282} {"train_loss": -28.01535987854004, "global_step": 604436, "epoch": 7282} {"train_loss": -27.831268310546875, "global_step": 604437, "epoch": 7282} {"train_loss": -28.185876846313477, "global_step": 604438, "epoch": 7282} {"train_loss": -28.1112003326416, "global_step": 604439, "epoch": 7282} {"train_loss": -27.56366539001465, "global_step": 604440, "epoch": 7282} {"train_loss": -28.0573673248291, "global_step": 604441, "epoch": 7282} {"train_loss": -28.30445671081543, "global_step": 604442, "epoch": 7282} {"train_loss": -28.115198135375977, "global_step": 604443, "epoch": 7282} {"train_loss": -28.267972946166992, "global_step": 604444, "epoch": 7282} {"train_loss": -28.105199813842773, "global_step": 604445, "epoch": 7282} {"train_loss": -28.328048706054688, "global_step": 604446, "epoch": 7282} {"train_loss": -28.371381759643555, "global_step": 604447, "epoch": 7282} {"train_loss": -28.502241134643555, "global_step": 604448, "epoch": 7282} {"train_loss": -28.223114013671875, "global_step": 604449, "epoch": 7282} {"train_loss": -28.523365020751953, "global_step": 604450, "epoch": 7282} {"train_loss": -28.26649284362793, "global_step": 604451, "epoch": 7282} {"train_loss": -28.327747344970703, "global_step": 604452, "epoch": 7282} {"train_loss": -28.062849044799805, "global_step": 604453, "epoch": 7282} {"train_loss": -28.340951919555664, "global_step": 604454, "epoch": 7282} {"train_loss": -28.19110679626465, "global_step": 604455, "epoch": 7282} {"train_loss": -28.270126342773438, "global_step": 604456, "epoch": 7282} {"train_loss": -28.214990615844727, "global_step": 604457, "epoch": 7282} {"train_loss": -27.939868927001953, "global_step": 604458, "epoch": 7282} {"train_loss": -27.83206558227539, "global_step": 604459, "epoch": 7282} {"train_loss": -27.800445556640625, "global_step": 604460, "epoch": 7282} {"train_loss": -27.686660766601562, "global_step": 604461, "epoch": 7282} {"train_loss": -27.298603057861328, "global_step": 604462, "epoch": 7282} {"train_loss": -26.7983341217041, "global_step": 604463, "epoch": 7282} {"train_loss": -26.75058937072754, "global_step": 604464, "epoch": 7282} {"train_loss": -27.649450302124023, "global_step": 604465, "epoch": 7282} {"train_loss": -27.71925926208496, "global_step": 604466, "epoch": 7282} {"train_loss": -27.5579776763916, "global_step": 604467, "epoch": 7282} {"train_loss": -27.733905792236328, "global_step": 604468, "epoch": 7282} {"train_loss": -27.828861236572266, "global_step": 604469, "epoch": 7282} {"train_loss": -27.676313400268555, "global_step": 604470, "epoch": 7282} {"train_loss": -28.120229721069336, "global_step": 604471, "epoch": 7282} {"train_loss": -27.8007755279541, "global_step": 604472, "epoch": 7282} {"train_loss": -27.832202911376953, "global_step": 604473, "epoch": 7282} {"train_loss": -27.994470596313477, "global_step": 604474, "epoch": 7282} {"train_loss": -27.82687759399414, "global_step": 604475, "epoch": 7282} {"train_loss": -28.28466796875, "global_step": 604476, "epoch": 7282} {"train_loss": -27.652563095092773, "global_step": 604477, "epoch": 7282} {"train_loss": -27.819732666015625, "global_step": 604478, "epoch": 7282} {"train_loss": -27.962743759155273, "global_step": 604479, "epoch": 7282} {"train_loss": -27.729047775268555, "global_step": 604480, "epoch": 7282} {"train_loss": -28.351972579956055, "global_step": 604481, "epoch": 7282} {"train_loss": -28.044631958007812, "global_step": 604482, "epoch": 7282} {"train_loss": -28.21308708190918, "global_step": 604483, "epoch": 7282} {"train_loss": -27.961898803710938, "global_step": 604484, "epoch": 7282} {"train_loss": -27.870168685913086, "global_step": 604485, "epoch": 7282} {"train_loss": -28.288928985595703, "global_step": 604486, "epoch": 7282} {"train_loss": -28.045312881469727, "global_step": 604487, "epoch": 7282} {"train_loss": -27.91664392402373, "global_step": 604488, "epoch": 7282, "val_loss": 6807699.5} {"train_loss": -26.997739791870117, "global_step": 604489, "epoch": 7283} {"train_loss": -27.41367530822754, "global_step": 604490, "epoch": 7283} {"train_loss": -27.145919799804688, "global_step": 604491, "epoch": 7283} {"train_loss": -27.146530151367188, "global_step": 604492, "epoch": 7283} {"train_loss": -27.914403915405273, "global_step": 604493, "epoch": 7283} {"train_loss": -27.21492576599121, "global_step": 604494, "epoch": 7283} {"train_loss": -27.45693016052246, "global_step": 604495, "epoch": 7283} {"train_loss": -27.052350997924805, "global_step": 604496, "epoch": 7283} {"train_loss": -27.497638702392578, "global_step": 604497, "epoch": 7283} {"train_loss": -27.68412208557129, "global_step": 604498, "epoch": 7283} {"train_loss": -27.26543617248535, "global_step": 604499, "epoch": 7283} {"train_loss": -27.6464786529541, "global_step": 604500, "epoch": 7283} {"train_loss": -27.727304458618164, "global_step": 604501, "epoch": 7283} {"train_loss": -27.462726593017578, "global_step": 604502, "epoch": 7283} {"train_loss": -27.008459091186523, "global_step": 604503, "epoch": 7283} {"train_loss": -27.10831069946289, "global_step": 604504, "epoch": 7283} {"train_loss": -28.028533935546875, "global_step": 604505, "epoch": 7283} {"train_loss": -27.271163940429688, "global_step": 604506, "epoch": 7283} {"train_loss": -26.96148681640625, "global_step": 604507, "epoch": 7283} {"train_loss": -28.0369873046875, "global_step": 604508, "epoch": 7283} {"train_loss": -27.724573135375977, "global_step": 604509, "epoch": 7283} {"train_loss": -27.767663955688477, "global_step": 604510, "epoch": 7283} {"train_loss": -27.7058048248291, "global_step": 604511, "epoch": 7283} {"train_loss": -27.4744873046875, "global_step": 604512, "epoch": 7283} {"train_loss": -27.943918228149414, "global_step": 604513, "epoch": 7283} {"train_loss": -27.7093505859375, "global_step": 604514, "epoch": 7283} {"train_loss": -27.84710693359375, "global_step": 604515, "epoch": 7283} {"train_loss": -28.016088485717773, "global_step": 604516, "epoch": 7283} {"train_loss": -27.99911880493164, "global_step": 604517, "epoch": 7283} {"train_loss": -28.004791259765625, "global_step": 604518, "epoch": 7283} {"train_loss": -27.808151245117188, "global_step": 604519, "epoch": 7283} {"train_loss": -28.032550811767578, "global_step": 604520, "epoch": 7283} {"train_loss": -27.990381240844727, "global_step": 604521, "epoch": 7283} {"train_loss": -28.261335372924805, "global_step": 604522, "epoch": 7283} {"train_loss": -27.880773544311523, "global_step": 604523, "epoch": 7283} {"train_loss": -28.108320236206055, "global_step": 604524, "epoch": 7283} {"train_loss": -27.9641056060791, "global_step": 604525, "epoch": 7283} {"train_loss": -28.05312156677246, "global_step": 604526, "epoch": 7283} {"train_loss": -28.292226791381836, "global_step": 604527, "epoch": 7283} {"train_loss": -27.69382095336914, "global_step": 604528, "epoch": 7283} {"train_loss": -28.246007919311523, "global_step": 604529, "epoch": 7283} {"train_loss": -28.09400749206543, "global_step": 604530, "epoch": 7283} {"train_loss": -28.238174438476562, "global_step": 604531, "epoch": 7283} {"train_loss": -28.37957763671875, "global_step": 604532, "epoch": 7283} {"train_loss": -28.278522491455078, "global_step": 604533, "epoch": 7283} {"train_loss": -28.40839195251465, "global_step": 604534, "epoch": 7283} {"train_loss": -28.2985897064209, "global_step": 604535, "epoch": 7283} {"train_loss": -28.259824752807617, "global_step": 604536, "epoch": 7283} {"train_loss": -28.614276885986328, "global_step": 604537, "epoch": 7283} {"train_loss": -27.7143611907959, "global_step": 604538, "epoch": 7283} {"train_loss": -28.324710845947266, "global_step": 604539, "epoch": 7283} {"train_loss": -28.1807804107666, "global_step": 604540, "epoch": 7283} {"train_loss": -28.728662490844727, "global_step": 604541, "epoch": 7283} {"train_loss": -28.075971603393555, "global_step": 604542, "epoch": 7283} {"train_loss": -28.072235107421875, "global_step": 604543, "epoch": 7283} {"train_loss": -28.428186416625977, "global_step": 604544, "epoch": 7283} {"train_loss": -28.130435943603516, "global_step": 604545, "epoch": 7283} {"train_loss": -28.446125030517578, "global_step": 604546, "epoch": 7283} {"train_loss": -28.539051055908203, "global_step": 604547, "epoch": 7283} {"train_loss": -28.51449966430664, "global_step": 604548, "epoch": 7283} {"train_loss": -27.796903610229492, "global_step": 604549, "epoch": 7283} {"train_loss": -28.07733726501465, "global_step": 604550, "epoch": 7283} {"train_loss": -28.3215389251709, "global_step": 604551, "epoch": 7283} {"train_loss": -28.101852416992188, "global_step": 604552, "epoch": 7283} {"train_loss": -28.018606185913086, "global_step": 604553, "epoch": 7283} {"train_loss": -27.754871368408203, "global_step": 604554, "epoch": 7283} {"train_loss": -27.787220001220703, "global_step": 604555, "epoch": 7283} {"train_loss": -27.265674591064453, "global_step": 604556, "epoch": 7283} {"train_loss": -25.7286434173584, "global_step": 604557, "epoch": 7283} {"train_loss": -25.96583366394043, "global_step": 604558, "epoch": 7283} {"train_loss": -26.895187377929688, "global_step": 604559, "epoch": 7283} {"train_loss": -27.668859481811523, "global_step": 604560, "epoch": 7283} {"train_loss": -27.61725425720215, "global_step": 604561, "epoch": 7283} {"train_loss": -27.843585968017578, "global_step": 604562, "epoch": 7283} {"train_loss": -27.567167282104492, "global_step": 604563, "epoch": 7283} {"train_loss": -27.412179946899414, "global_step": 604564, "epoch": 7283} {"train_loss": -27.329696655273438, "global_step": 604565, "epoch": 7283} {"train_loss": -27.6552734375, "global_step": 604566, "epoch": 7283} {"train_loss": -27.895496368408203, "global_step": 604567, "epoch": 7283} {"train_loss": -27.741357803344727, "global_step": 604568, "epoch": 7283} {"train_loss": -27.826391220092773, "global_step": 604569, "epoch": 7283} {"train_loss": -27.689924240112305, "global_step": 604570, "epoch": 7283} {"train_loss": -27.792176832635718, "global_step": 604571, "epoch": 7283, "val_loss": 6714908.5} {"train_loss": -27.20212745666504, "global_step": 604572, "epoch": 7284} {"train_loss": -27.274335861206055, "global_step": 604573, "epoch": 7284} {"train_loss": -27.649356842041016, "global_step": 604574, "epoch": 7284} {"train_loss": -27.45720863342285, "global_step": 604575, "epoch": 7284} {"train_loss": -27.419879913330078, "global_step": 604576, "epoch": 7284} {"train_loss": -27.400848388671875, "global_step": 604577, "epoch": 7284} {"train_loss": -27.47503662109375, "global_step": 604578, "epoch": 7284} {"train_loss": -27.497119903564453, "global_step": 604579, "epoch": 7284} {"train_loss": -27.810815811157227, "global_step": 604580, "epoch": 7284} {"train_loss": -27.703367233276367, "global_step": 604581, "epoch": 7284} {"train_loss": -27.700733184814453, "global_step": 604582, "epoch": 7284} {"train_loss": -27.447046279907227, "global_step": 604583, "epoch": 7284} {"train_loss": -27.843036651611328, "global_step": 604584, "epoch": 7284} {"train_loss": -27.717151641845703, "global_step": 604585, "epoch": 7284} {"train_loss": -27.857831954956055, "global_step": 604586, "epoch": 7284} {"train_loss": -27.94684410095215, "global_step": 604587, "epoch": 7284} {"train_loss": -27.67756462097168, "global_step": 604588, "epoch": 7284} {"train_loss": -28.0288143157959, "global_step": 604589, "epoch": 7284} {"train_loss": -27.79501724243164, "global_step": 604590, "epoch": 7284} {"train_loss": -27.753803253173828, "global_step": 604591, "epoch": 7284} {"train_loss": -28.111648559570312, "global_step": 604592, "epoch": 7284} {"train_loss": -27.945791244506836, "global_step": 604593, "epoch": 7284} {"train_loss": -27.923202514648438, "global_step": 604594, "epoch": 7284} {"train_loss": -28.248632431030273, "global_step": 604595, "epoch": 7284} {"train_loss": -27.587430953979492, "global_step": 604596, "epoch": 7284} {"train_loss": -28.173755645751953, "global_step": 604597, "epoch": 7284} {"train_loss": -28.153339385986328, "global_step": 604598, "epoch": 7284} {"train_loss": -28.24418067932129, "global_step": 604599, "epoch": 7284} {"train_loss": -28.140213012695312, "global_step": 604600, "epoch": 7284} {"train_loss": -27.809110641479492, "global_step": 604601, "epoch": 7284} {"train_loss": -28.252912521362305, "global_step": 604602, "epoch": 7284} {"train_loss": -28.092187881469727, "global_step": 604603, "epoch": 7284} {"train_loss": -28.420013427734375, "global_step": 604604, "epoch": 7284} {"train_loss": -28.270605087280273, "global_step": 604605, "epoch": 7284} {"train_loss": -28.26318359375, "global_step": 604606, "epoch": 7284} {"train_loss": -28.1977481842041, "global_step": 604607, "epoch": 7284} {"train_loss": -28.390640258789062, "global_step": 604608, "epoch": 7284} {"train_loss": -28.320119857788086, "global_step": 604609, "epoch": 7284} {"train_loss": -28.33530616760254, "global_step": 604610, "epoch": 7284} {"train_loss": -28.075504302978516, "global_step": 604611, "epoch": 7284} {"train_loss": -28.238733291625977, "global_step": 604612, "epoch": 7284} {"train_loss": -28.12027931213379, "global_step": 604613, "epoch": 7284} {"train_loss": -27.873727798461914, "global_step": 604614, "epoch": 7284} {"train_loss": -28.17789649963379, "global_step": 604615, "epoch": 7284} {"train_loss": -28.147205352783203, "global_step": 604616, "epoch": 7284} {"train_loss": -28.219289779663086, "global_step": 604617, "epoch": 7284} {"train_loss": -28.395124435424805, "global_step": 604618, "epoch": 7284} {"train_loss": -27.970935821533203, "global_step": 604619, "epoch": 7284} {"train_loss": -28.1866397857666, "global_step": 604620, "epoch": 7284} {"train_loss": -28.28488540649414, "global_step": 604621, "epoch": 7284} {"train_loss": -28.22878074645996, "global_step": 604622, "epoch": 7284} {"train_loss": -28.53571128845215, "global_step": 604623, "epoch": 7284} {"train_loss": -28.00665855407715, "global_step": 604624, "epoch": 7284} {"train_loss": -27.937253952026367, "global_step": 604625, "epoch": 7284} {"train_loss": -27.94773292541504, "global_step": 604626, "epoch": 7284} {"train_loss": -28.061492919921875, "global_step": 604627, "epoch": 7284} {"train_loss": -28.317548751831055, "global_step": 604628, "epoch": 7284} {"train_loss": -27.777816772460938, "global_step": 604629, "epoch": 7284} {"train_loss": -27.674978256225586, "global_step": 604630, "epoch": 7284} {"train_loss": -27.947650909423828, "global_step": 604631, "epoch": 7284} {"train_loss": -27.92938804626465, "global_step": 604632, "epoch": 7284} {"train_loss": -28.269514083862305, "global_step": 604633, "epoch": 7284} {"train_loss": -28.196735382080078, "global_step": 604634, "epoch": 7284} {"train_loss": -28.279178619384766, "global_step": 604635, "epoch": 7284} {"train_loss": -27.97187614440918, "global_step": 604636, "epoch": 7284} {"train_loss": -27.97519874572754, "global_step": 604637, "epoch": 7284} {"train_loss": -28.321561813354492, "global_step": 604638, "epoch": 7284} {"train_loss": -28.445215225219727, "global_step": 604639, "epoch": 7284} {"train_loss": -28.322052001953125, "global_step": 604640, "epoch": 7284} {"train_loss": -28.3779239654541, "global_step": 604641, "epoch": 7284} {"train_loss": -27.8762264251709, "global_step": 604642, "epoch": 7284} {"train_loss": -27.982379913330078, "global_step": 604643, "epoch": 7284} {"train_loss": -27.815649032592773, "global_step": 604644, "epoch": 7284} {"train_loss": -28.231672286987305, "global_step": 604645, "epoch": 7284} {"train_loss": -28.1046199798584, "global_step": 604646, "epoch": 7284} {"train_loss": -27.88214111328125, "global_step": 604647, "epoch": 7284} {"train_loss": -28.16812515258789, "global_step": 604648, "epoch": 7284} {"train_loss": -27.909421920776367, "global_step": 604649, "epoch": 7284} {"train_loss": -27.90799903869629, "global_step": 604650, "epoch": 7284} {"train_loss": -27.34869384765625, "global_step": 604651, "epoch": 7284} {"train_loss": -27.505701065063477, "global_step": 604652, "epoch": 7284} {"train_loss": -28.13677406311035, "global_step": 604653, "epoch": 7284} {"train_loss": -27.994020599916755, "global_step": 604654, "epoch": 7284, "val_loss": 6783851.0} {"train_loss": -27.145862579345703, "global_step": 604655, "epoch": 7285} {"train_loss": -27.536376953125, "global_step": 604656, "epoch": 7285} {"train_loss": -26.672903060913086, "global_step": 604657, "epoch": 7285} {"train_loss": -27.30840492248535, "global_step": 604658, "epoch": 7285} {"train_loss": -27.354589462280273, "global_step": 604659, "epoch": 7285} {"train_loss": -27.474597930908203, "global_step": 604660, "epoch": 7285} {"train_loss": -27.007177352905273, "global_step": 604661, "epoch": 7285} {"train_loss": -27.25299072265625, "global_step": 604662, "epoch": 7285} {"train_loss": -27.618864059448242, "global_step": 604663, "epoch": 7285} {"train_loss": -27.347213745117188, "global_step": 604664, "epoch": 7285} {"train_loss": -27.489194869995117, "global_step": 604665, "epoch": 7285} {"train_loss": -27.209218978881836, "global_step": 604666, "epoch": 7285} {"train_loss": -27.582975387573242, "global_step": 604667, "epoch": 7285} {"train_loss": -27.620397567749023, "global_step": 604668, "epoch": 7285} {"train_loss": -27.442312240600586, "global_step": 604669, "epoch": 7285} {"train_loss": -27.133625030517578, "global_step": 604670, "epoch": 7285} {"train_loss": -27.773855209350586, "global_step": 604671, "epoch": 7285} {"train_loss": -27.6563720703125, "global_step": 604672, "epoch": 7285} {"train_loss": -27.442188262939453, "global_step": 604673, "epoch": 7285} {"train_loss": -27.79109001159668, "global_step": 604674, "epoch": 7285} {"train_loss": -27.54829216003418, "global_step": 604675, "epoch": 7285} {"train_loss": -27.364160537719727, "global_step": 604676, "epoch": 7285} {"train_loss": -27.597753524780273, "global_step": 604677, "epoch": 7285} {"train_loss": -27.704792022705078, "global_step": 604678, "epoch": 7285} {"train_loss": -27.805662155151367, "global_step": 604679, "epoch": 7285} {"train_loss": -27.448450088500977, "global_step": 604680, "epoch": 7285} {"train_loss": -27.885690689086914, "global_step": 604681, "epoch": 7285} {"train_loss": -27.56190299987793, "global_step": 604682, "epoch": 7285} {"train_loss": -27.820556640625, "global_step": 604683, "epoch": 7285} {"train_loss": -27.768726348876953, "global_step": 604684, "epoch": 7285} {"train_loss": -28.135852813720703, "global_step": 604685, "epoch": 7285} {"train_loss": -27.962804794311523, "global_step": 604686, "epoch": 7285} {"train_loss": -28.125274658203125, "global_step": 604687, "epoch": 7285} {"train_loss": -27.9916934967041, "global_step": 604688, "epoch": 7285} {"train_loss": -28.321212768554688, "global_step": 604689, "epoch": 7285} {"train_loss": -28.138946533203125, "global_step": 604690, "epoch": 7285} {"train_loss": -28.190473556518555, "global_step": 604691, "epoch": 7285} {"train_loss": -28.10639762878418, "global_step": 604692, "epoch": 7285} {"train_loss": -28.24375343322754, "global_step": 604693, "epoch": 7285} {"train_loss": -28.250213623046875, "global_step": 604694, "epoch": 7285} {"train_loss": -28.465612411499023, "global_step": 604695, "epoch": 7285} {"train_loss": -28.183414459228516, "global_step": 604696, "epoch": 7285} {"train_loss": -28.339094161987305, "global_step": 604697, "epoch": 7285} {"train_loss": -27.887985229492188, "global_step": 604698, "epoch": 7285} {"train_loss": -28.069162368774414, "global_step": 604699, "epoch": 7285} {"train_loss": -28.28668785095215, "global_step": 604700, "epoch": 7285} {"train_loss": -27.7558536529541, "global_step": 604701, "epoch": 7285} {"train_loss": -27.492216110229492, "global_step": 604702, "epoch": 7285} {"train_loss": -27.197330474853516, "global_step": 604703, "epoch": 7285} {"train_loss": -27.866718292236328, "global_step": 604704, "epoch": 7285} {"train_loss": -28.441818237304688, "global_step": 604705, "epoch": 7285} {"train_loss": -28.056528091430664, "global_step": 604706, "epoch": 7285} {"train_loss": -27.789880752563477, "global_step": 604707, "epoch": 7285} {"train_loss": -28.099050521850586, "global_step": 604708, "epoch": 7285} {"train_loss": -28.057348251342773, "global_step": 604709, "epoch": 7285} {"train_loss": -28.137042999267578, "global_step": 604710, "epoch": 7285} {"train_loss": -28.240934371948242, "global_step": 604711, "epoch": 7285} {"train_loss": -28.30364418029785, "global_step": 604712, "epoch": 7285} {"train_loss": -28.127344131469727, "global_step": 604713, "epoch": 7285} {"train_loss": -27.922271728515625, "global_step": 604714, "epoch": 7285} {"train_loss": -27.66493797302246, "global_step": 604715, "epoch": 7285} {"train_loss": -27.140960693359375, "global_step": 604716, "epoch": 7285} {"train_loss": -26.947467803955078, "global_step": 604717, "epoch": 7285} {"train_loss": -27.222518920898438, "global_step": 604718, "epoch": 7285} {"train_loss": -27.662250518798828, "global_step": 604719, "epoch": 7285} {"train_loss": -27.844404220581055, "global_step": 604720, "epoch": 7285} {"train_loss": -27.37558364868164, "global_step": 604721, "epoch": 7285} {"train_loss": -27.454137802124023, "global_step": 604722, "epoch": 7285} {"train_loss": -27.709054946899414, "global_step": 604723, "epoch": 7285} {"train_loss": -27.63555908203125, "global_step": 604724, "epoch": 7285} {"train_loss": -27.661590576171875, "global_step": 604725, "epoch": 7285} {"train_loss": -27.836145401000977, "global_step": 604726, "epoch": 7285} {"train_loss": -28.10169792175293, "global_step": 604727, "epoch": 7285} {"train_loss": -27.89276123046875, "global_step": 604728, "epoch": 7285} {"train_loss": -28.327804565429688, "global_step": 604729, "epoch": 7285} {"train_loss": -27.478235244750977, "global_step": 604730, "epoch": 7285} {"train_loss": -28.029844284057617, "global_step": 604731, "epoch": 7285} {"train_loss": -28.027271270751953, "global_step": 604732, "epoch": 7285} {"train_loss": -28.028425216674805, "global_step": 604733, "epoch": 7285} {"train_loss": -27.853240966796875, "global_step": 604734, "epoch": 7285} {"train_loss": -27.542800903320312, "global_step": 604735, "epoch": 7285} {"train_loss": -27.898590087890625, "global_step": 604736, "epoch": 7285} {"train_loss": -27.737253097166498, "global_step": 604737, "epoch": 7285, "val_loss": 6783192.0} {"train_loss": -26.317060470581055, "global_step": 604738, "epoch": 7286} {"train_loss": -25.610143661499023, "global_step": 604739, "epoch": 7286} {"train_loss": -27.37977409362793, "global_step": 604740, "epoch": 7286} {"train_loss": -25.797094345092773, "global_step": 604741, "epoch": 7286} {"train_loss": -27.007299423217773, "global_step": 604742, "epoch": 7286} {"train_loss": -26.781579971313477, "global_step": 604743, "epoch": 7286} {"train_loss": -27.36606216430664, "global_step": 604744, "epoch": 7286} {"train_loss": -26.9410457611084, "global_step": 604745, "epoch": 7286} {"train_loss": -26.601598739624023, "global_step": 604746, "epoch": 7286} {"train_loss": -27.453189849853516, "global_step": 604747, "epoch": 7286} {"train_loss": -27.497760772705078, "global_step": 604748, "epoch": 7286} {"train_loss": -27.576736450195312, "global_step": 604749, "epoch": 7286} {"train_loss": -27.498779296875, "global_step": 604750, "epoch": 7286} {"train_loss": -27.71047019958496, "global_step": 604751, "epoch": 7286} {"train_loss": -27.63447380065918, "global_step": 604752, "epoch": 7286} {"train_loss": -27.687692642211914, "global_step": 604753, "epoch": 7286} {"train_loss": -27.423513412475586, "global_step": 604754, "epoch": 7286} {"train_loss": -27.77386474609375, "global_step": 604755, "epoch": 7286} {"train_loss": -27.5827579498291, "global_step": 604756, "epoch": 7286} {"train_loss": -27.675586700439453, "global_step": 604757, "epoch": 7286} {"train_loss": -27.7418212890625, "global_step": 604758, "epoch": 7286} {"train_loss": -27.774412155151367, "global_step": 604759, "epoch": 7286} {"train_loss": -27.663818359375, "global_step": 604760, "epoch": 7286} {"train_loss": -27.999988555908203, "global_step": 604761, "epoch": 7286} {"train_loss": -27.813007354736328, "global_step": 604762, "epoch": 7286} {"train_loss": -27.897031784057617, "global_step": 604763, "epoch": 7286} {"train_loss": -27.83431053161621, "global_step": 604764, "epoch": 7286} {"train_loss": -27.89666175842285, "global_step": 604765, "epoch": 7286} {"train_loss": -28.0886173248291, "global_step": 604766, "epoch": 7286} {"train_loss": -28.10161781311035, "global_step": 604767, "epoch": 7286} {"train_loss": -27.83745765686035, "global_step": 604768, "epoch": 7286} {"train_loss": -28.188581466674805, "global_step": 604769, "epoch": 7286} {"train_loss": -27.81109619140625, "global_step": 604770, "epoch": 7286} {"train_loss": -27.753686904907227, "global_step": 604771, "epoch": 7286} {"train_loss": -28.313079833984375, "global_step": 604772, "epoch": 7286} {"train_loss": -27.72366714477539, "global_step": 604773, "epoch": 7286} {"train_loss": -27.909189224243164, "global_step": 604774, "epoch": 7286} {"train_loss": -27.73105812072754, "global_step": 604775, "epoch": 7286} {"train_loss": -28.154321670532227, "global_step": 604776, "epoch": 7286} {"train_loss": -28.319843292236328, "global_step": 604777, "epoch": 7286} {"train_loss": -28.30216407775879, "global_step": 604778, "epoch": 7286} {"train_loss": -27.6181640625, "global_step": 604779, "epoch": 7286} {"train_loss": -27.841873168945312, "global_step": 604780, "epoch": 7286} {"train_loss": -28.034992218017578, "global_step": 604781, "epoch": 7286} {"train_loss": -27.941308975219727, "global_step": 604782, "epoch": 7286} {"train_loss": -28.20939064025879, "global_step": 604783, "epoch": 7286} {"train_loss": -28.183935165405273, "global_step": 604784, "epoch": 7286} {"train_loss": -28.154462814331055, "global_step": 604785, "epoch": 7286} {"train_loss": -27.63995361328125, "global_step": 604786, "epoch": 7286} {"train_loss": -28.2656307220459, "global_step": 604787, "epoch": 7286} {"train_loss": -28.24799156188965, "global_step": 604788, "epoch": 7286} {"train_loss": -28.018085479736328, "global_step": 604789, "epoch": 7286} {"train_loss": -28.28959083557129, "global_step": 604790, "epoch": 7286} {"train_loss": -28.129987716674805, "global_step": 604791, "epoch": 7286} {"train_loss": -28.263784408569336, "global_step": 604792, "epoch": 7286} {"train_loss": -28.071308135986328, "global_step": 604793, "epoch": 7286} {"train_loss": -28.30668067932129, "global_step": 604794, "epoch": 7286} {"train_loss": -28.117572784423828, "global_step": 604795, "epoch": 7286} {"train_loss": -28.30018424987793, "global_step": 604796, "epoch": 7286} {"train_loss": -28.135839462280273, "global_step": 604797, "epoch": 7286} {"train_loss": -28.461496353149414, "global_step": 604798, "epoch": 7286} {"train_loss": -28.706274032592773, "global_step": 604799, "epoch": 7286} {"train_loss": -28.322830200195312, "global_step": 604800, "epoch": 7286} {"train_loss": -28.267227172851562, "global_step": 604801, "epoch": 7286} {"train_loss": -28.287572860717773, "global_step": 604802, "epoch": 7286} {"train_loss": -28.161895751953125, "global_step": 604803, "epoch": 7286} {"train_loss": -28.5034122467041, "global_step": 604804, "epoch": 7286} {"train_loss": -28.113489151000977, "global_step": 604805, "epoch": 7286} {"train_loss": -28.300521850585938, "global_step": 604806, "epoch": 7286} {"train_loss": -28.171524047851562, "global_step": 604807, "epoch": 7286} {"train_loss": -28.040796279907227, "global_step": 604808, "epoch": 7286} {"train_loss": -28.33485221862793, "global_step": 604809, "epoch": 7286} {"train_loss": -28.358579635620117, "global_step": 604810, "epoch": 7286} {"train_loss": -28.4562931060791, "global_step": 604811, "epoch": 7286} {"train_loss": -27.959716796875, "global_step": 604812, "epoch": 7286} {"train_loss": -28.273300170898438, "global_step": 604813, "epoch": 7286} {"train_loss": -28.404315948486328, "global_step": 604814, "epoch": 7286} {"train_loss": -28.286865234375, "global_step": 604815, "epoch": 7286} {"train_loss": -28.0146484375, "global_step": 604816, "epoch": 7286} {"train_loss": -27.675537109375, "global_step": 604817, "epoch": 7286} {"train_loss": -27.643848419189453, "global_step": 604818, "epoch": 7286} {"train_loss": -27.144550323486328, "global_step": 604819, "epoch": 7286} {"train_loss": -27.80788511253265, "global_step": 604820, "epoch": 7286, "val_loss": 6845947.0} {"train_loss": -23.684680938720703, "global_step": 604821, "epoch": 7287} {"train_loss": -25.713409423828125, "global_step": 604822, "epoch": 7287} {"train_loss": -24.25253677368164, "global_step": 604823, "epoch": 7287} {"train_loss": -24.15626335144043, "global_step": 604824, "epoch": 7287} {"train_loss": -25.40406608581543, "global_step": 604825, "epoch": 7287} {"train_loss": -25.767621994018555, "global_step": 604826, "epoch": 7287} {"train_loss": -25.8516845703125, "global_step": 604827, "epoch": 7287} {"train_loss": -25.793121337890625, "global_step": 604828, "epoch": 7287} {"train_loss": -26.40376853942871, "global_step": 604829, "epoch": 7287} {"train_loss": -26.27370262145996, "global_step": 604830, "epoch": 7287} {"train_loss": -26.416574478149414, "global_step": 604831, "epoch": 7287} {"train_loss": -26.189605712890625, "global_step": 604832, "epoch": 7287} {"train_loss": -26.406248092651367, "global_step": 604833, "epoch": 7287} {"train_loss": -26.297101974487305, "global_step": 604834, "epoch": 7287} {"train_loss": -26.89590835571289, "global_step": 604835, "epoch": 7287} {"train_loss": -26.312971115112305, "global_step": 604836, "epoch": 7287} {"train_loss": -26.82706069946289, "global_step": 604837, "epoch": 7287} {"train_loss": -26.968835830688477, "global_step": 604838, "epoch": 7287} {"train_loss": -26.586023330688477, "global_step": 604839, "epoch": 7287} {"train_loss": -26.712202072143555, "global_step": 604840, "epoch": 7287} {"train_loss": -27.07575035095215, "global_step": 604841, "epoch": 7287} {"train_loss": -26.61652183532715, "global_step": 604842, "epoch": 7287} {"train_loss": -27.22503089904785, "global_step": 604843, "epoch": 7287} {"train_loss": -27.302698135375977, "global_step": 604844, "epoch": 7287} {"train_loss": -27.10638999938965, "global_step": 604845, "epoch": 7287} {"train_loss": -26.89890480041504, "global_step": 604846, "epoch": 7287} {"train_loss": -27.254871368408203, "global_step": 604847, "epoch": 7287} {"train_loss": -27.498212814331055, "global_step": 604848, "epoch": 7287} {"train_loss": -27.147489547729492, "global_step": 604849, "epoch": 7287} {"train_loss": -27.459863662719727, "global_step": 604850, "epoch": 7287} {"train_loss": -27.366071701049805, "global_step": 604851, "epoch": 7287} {"train_loss": -27.491943359375, "global_step": 604852, "epoch": 7287} {"train_loss": -27.5075740814209, "global_step": 604853, "epoch": 7287} {"train_loss": -27.341272354125977, "global_step": 604854, "epoch": 7287} {"train_loss": -27.68988609313965, "global_step": 604855, "epoch": 7287} {"train_loss": -27.566389083862305, "global_step": 604856, "epoch": 7287} {"train_loss": -27.73368263244629, "global_step": 604857, "epoch": 7287} {"train_loss": -27.736560821533203, "global_step": 604858, "epoch": 7287} {"train_loss": -27.511188507080078, "global_step": 604859, "epoch": 7287} {"train_loss": -27.825651168823242, "global_step": 604860, "epoch": 7287} {"train_loss": -27.84531021118164, "global_step": 604861, "epoch": 7287} {"train_loss": -27.704517364501953, "global_step": 604862, "epoch": 7287} {"train_loss": -27.714126586914062, "global_step": 604863, "epoch": 7287} {"train_loss": -27.522998809814453, "global_step": 604864, "epoch": 7287} {"train_loss": -28.00677490234375, "global_step": 604865, "epoch": 7287} {"train_loss": -27.785903930664062, "global_step": 604866, "epoch": 7287} {"train_loss": -27.851856231689453, "global_step": 604867, "epoch": 7287} {"train_loss": -27.992353439331055, "global_step": 604868, "epoch": 7287} {"train_loss": -27.89679527282715, "global_step": 604869, "epoch": 7287} {"train_loss": -28.092283248901367, "global_step": 604870, "epoch": 7287} {"train_loss": -28.086851119995117, "global_step": 604871, "epoch": 7287} {"train_loss": -27.96525001525879, "global_step": 604872, "epoch": 7287} {"train_loss": -28.014429092407227, "global_step": 604873, "epoch": 7287} {"train_loss": -27.758289337158203, "global_step": 604874, "epoch": 7287} {"train_loss": -28.310651779174805, "global_step": 604875, "epoch": 7287} {"train_loss": -27.906370162963867, "global_step": 604876, "epoch": 7287} {"train_loss": -27.910627365112305, "global_step": 604877, "epoch": 7287} {"train_loss": -28.153722763061523, "global_step": 604878, "epoch": 7287} {"train_loss": -28.1029052734375, "global_step": 604879, "epoch": 7287} {"train_loss": -28.079282760620117, "global_step": 604880, "epoch": 7287} {"train_loss": -27.826147079467773, "global_step": 604881, "epoch": 7287} {"train_loss": -27.7850399017334, "global_step": 604882, "epoch": 7287} {"train_loss": -28.2210750579834, "global_step": 604883, "epoch": 7287} {"train_loss": -28.106603622436523, "global_step": 604884, "epoch": 7287} {"train_loss": -28.41206169128418, "global_step": 604885, "epoch": 7287} {"train_loss": -28.052001953125, "global_step": 604886, "epoch": 7287} {"train_loss": -28.48451042175293, "global_step": 604887, "epoch": 7287} {"train_loss": -27.95948600769043, "global_step": 604888, "epoch": 7287} {"train_loss": -28.122833251953125, "global_step": 604889, "epoch": 7287} {"train_loss": -28.05067253112793, "global_step": 604890, "epoch": 7287} {"train_loss": -28.26150894165039, "global_step": 604891, "epoch": 7287} {"train_loss": -28.12611961364746, "global_step": 604892, "epoch": 7287} {"train_loss": -27.880725860595703, "global_step": 604893, "epoch": 7287} {"train_loss": -27.780954360961914, "global_step": 604894, "epoch": 7287} {"train_loss": -27.282522201538086, "global_step": 604895, "epoch": 7287} {"train_loss": -26.986677169799805, "global_step": 604896, "epoch": 7287} {"train_loss": -26.665637969970703, "global_step": 604897, "epoch": 7287} {"train_loss": -27.38174819946289, "global_step": 604898, "epoch": 7287} {"train_loss": -27.339435577392578, "global_step": 604899, "epoch": 7287} {"train_loss": -26.81396484375, "global_step": 604900, "epoch": 7287} {"train_loss": -27.857690811157227, "global_step": 604901, "epoch": 7287} {"train_loss": -27.82718849182129, "global_step": 604902, "epoch": 7287} {"train_loss": -27.27673861492111, "global_step": 604903, "epoch": 7287, "val_loss": 6699669.0} {"train_loss": -27.051801681518555, "global_step": 604904, "epoch": 7288} {"train_loss": -27.256061553955078, "global_step": 604905, "epoch": 7288} {"train_loss": -27.00526237487793, "global_step": 604906, "epoch": 7288} {"train_loss": -27.167627334594727, "global_step": 604907, "epoch": 7288} {"train_loss": -26.86667823791504, "global_step": 604908, "epoch": 7288} {"train_loss": -27.381284713745117, "global_step": 604909, "epoch": 7288} {"train_loss": -26.927234649658203, "global_step": 604910, "epoch": 7288} {"train_loss": -27.482934951782227, "global_step": 604911, "epoch": 7288} {"train_loss": -27.433752059936523, "global_step": 604912, "epoch": 7288} {"train_loss": -27.248523712158203, "global_step": 604913, "epoch": 7288} {"train_loss": -27.359914779663086, "global_step": 604914, "epoch": 7288} {"train_loss": -27.616003036499023, "global_step": 604915, "epoch": 7288} {"train_loss": -27.558979034423828, "global_step": 604916, "epoch": 7288} {"train_loss": -27.382007598876953, "global_step": 604917, "epoch": 7288} {"train_loss": -27.349811553955078, "global_step": 604918, "epoch": 7288} {"train_loss": -27.430273056030273, "global_step": 604919, "epoch": 7288} {"train_loss": -27.62774085998535, "global_step": 604920, "epoch": 7288} {"train_loss": -27.599157333374023, "global_step": 604921, "epoch": 7288} {"train_loss": -27.817968368530273, "global_step": 604922, "epoch": 7288} {"train_loss": -27.502187728881836, "global_step": 604923, "epoch": 7288} {"train_loss": -28.06940269470215, "global_step": 604924, "epoch": 7288} {"train_loss": -27.565601348876953, "global_step": 604925, "epoch": 7288} {"train_loss": -27.652698516845703, "global_step": 604926, "epoch": 7288} {"train_loss": -27.56337547302246, "global_step": 604927, "epoch": 7288} {"train_loss": -27.80252456665039, "global_step": 604928, "epoch": 7288} {"train_loss": -27.840763092041016, "global_step": 604929, "epoch": 7288} {"train_loss": -27.608301162719727, "global_step": 604930, "epoch": 7288} {"train_loss": -27.787158966064453, "global_step": 604931, "epoch": 7288} {"train_loss": -27.737905502319336, "global_step": 604932, "epoch": 7288} {"train_loss": -27.91360855102539, "global_step": 604933, "epoch": 7288} {"train_loss": -27.9547176361084, "global_step": 604934, "epoch": 7288} {"train_loss": -27.382984161376953, "global_step": 604935, "epoch": 7288} {"train_loss": -27.987262725830078, "global_step": 604936, "epoch": 7288} {"train_loss": -28.310144424438477, "global_step": 604937, "epoch": 7288} {"train_loss": -27.92652702331543, "global_step": 604938, "epoch": 7288} {"train_loss": -27.925628662109375, "global_step": 604939, "epoch": 7288} {"train_loss": -27.825550079345703, "global_step": 604940, "epoch": 7288} {"train_loss": -28.214065551757812, "global_step": 604941, "epoch": 7288} {"train_loss": -28.230993270874023, "global_step": 604942, "epoch": 7288} {"train_loss": -27.970388412475586, "global_step": 604943, "epoch": 7288} {"train_loss": -28.29058265686035, "global_step": 604944, "epoch": 7288} {"train_loss": -27.946203231811523, "global_step": 604945, "epoch": 7288} {"train_loss": -28.470251083374023, "global_step": 604946, "epoch": 7288} {"train_loss": -28.10357093811035, "global_step": 604947, "epoch": 7288} {"train_loss": -28.604440689086914, "global_step": 604948, "epoch": 7288} {"train_loss": -28.071842193603516, "global_step": 604949, "epoch": 7288} {"train_loss": -27.933637619018555, "global_step": 604950, "epoch": 7288} {"train_loss": -27.81721305847168, "global_step": 604951, "epoch": 7288} {"train_loss": -28.161056518554688, "global_step": 604952, "epoch": 7288} {"train_loss": -28.445783615112305, "global_step": 604953, "epoch": 7288} {"train_loss": -28.082014083862305, "global_step": 604954, "epoch": 7288} {"train_loss": -28.159494400024414, "global_step": 604955, "epoch": 7288} {"train_loss": -28.2186279296875, "global_step": 604956, "epoch": 7288} {"train_loss": -27.969100952148438, "global_step": 604957, "epoch": 7288} {"train_loss": -27.84490966796875, "global_step": 604958, "epoch": 7288} {"train_loss": -28.02968406677246, "global_step": 604959, "epoch": 7288} {"train_loss": -28.5188045501709, "global_step": 604960, "epoch": 7288} {"train_loss": -27.873559951782227, "global_step": 604961, "epoch": 7288} {"train_loss": -28.17268943786621, "global_step": 604962, "epoch": 7288} {"train_loss": -28.07965660095215, "global_step": 604963, "epoch": 7288} {"train_loss": -28.340137481689453, "global_step": 604964, "epoch": 7288} {"train_loss": -28.265396118164062, "global_step": 604965, "epoch": 7288} {"train_loss": -27.593631744384766, "global_step": 604966, "epoch": 7288} {"train_loss": -28.060998916625977, "global_step": 604967, "epoch": 7288} {"train_loss": -28.0089168548584, "global_step": 604968, "epoch": 7288} {"train_loss": -28.30434226989746, "global_step": 604969, "epoch": 7288} {"train_loss": -28.242694854736328, "global_step": 604970, "epoch": 7288} {"train_loss": -27.58473014831543, "global_step": 604971, "epoch": 7288} {"train_loss": -27.71327018737793, "global_step": 604972, "epoch": 7288} {"train_loss": -28.0190486907959, "global_step": 604973, "epoch": 7288} {"train_loss": -28.086872100830078, "global_step": 604974, "epoch": 7288} {"train_loss": -28.117761611938477, "global_step": 604975, "epoch": 7288} {"train_loss": -27.955617904663086, "global_step": 604976, "epoch": 7288} {"train_loss": -27.528425216674805, "global_step": 604977, "epoch": 7288} {"train_loss": -28.377988815307617, "global_step": 604978, "epoch": 7288} {"train_loss": -28.204641342163086, "global_step": 604979, "epoch": 7288} {"train_loss": -28.275897979736328, "global_step": 604980, "epoch": 7288} {"train_loss": -28.1699275970459, "global_step": 604981, "epoch": 7288} {"train_loss": -28.35466957092285, "global_step": 604982, "epoch": 7288} {"train_loss": -28.169269561767578, "global_step": 604983, "epoch": 7288} {"train_loss": -27.871479034423828, "global_step": 604984, "epoch": 7288} {"train_loss": -27.909887313842773, "global_step": 604985, "epoch": 7288} {"train_loss": -27.85587071797934, "global_step": 604986, "epoch": 7288, "val_loss": 6818427.5} {"train_loss": -25.85066032409668, "global_step": 604987, "epoch": 7289} {"train_loss": -25.760974884033203, "global_step": 604988, "epoch": 7289} {"train_loss": -26.958709716796875, "global_step": 604989, "epoch": 7289} {"train_loss": -27.363855361938477, "global_step": 604990, "epoch": 7289} {"train_loss": -26.690673828125, "global_step": 604991, "epoch": 7289} {"train_loss": -27.554113388061523, "global_step": 604992, "epoch": 7289} {"train_loss": -27.472549438476562, "global_step": 604993, "epoch": 7289} {"train_loss": -27.45064353942871, "global_step": 604994, "epoch": 7289} {"train_loss": -27.243865966796875, "global_step": 604995, "epoch": 7289} {"train_loss": -27.60444450378418, "global_step": 604996, "epoch": 7289} {"train_loss": -27.30232810974121, "global_step": 604997, "epoch": 7289} {"train_loss": -27.017181396484375, "global_step": 604998, "epoch": 7289} {"train_loss": -27.732595443725586, "global_step": 604999, "epoch": 7289} {"train_loss": -27.50655174255371, "global_step": 605000, "epoch": 7289} {"train_loss": -27.746185302734375, "global_step": 605001, "epoch": 7289} {"train_loss": -28.153629302978516, "global_step": 605002, "epoch": 7289} {"train_loss": -27.500431060791016, "global_step": 605003, "epoch": 7289} {"train_loss": -27.517187118530273, "global_step": 605004, "epoch": 7289} {"train_loss": -27.6082706451416, "global_step": 605005, "epoch": 7289} {"train_loss": -27.53668212890625, "global_step": 605006, "epoch": 7289} {"train_loss": -27.644498825073242, "global_step": 605007, "epoch": 7289} {"train_loss": -27.3844051361084, "global_step": 605008, "epoch": 7289} {"train_loss": -27.890039443969727, "global_step": 605009, "epoch": 7289} {"train_loss": -27.4554386138916, "global_step": 605010, "epoch": 7289} {"train_loss": -27.83699607849121, "global_step": 605011, "epoch": 7289} {"train_loss": -27.480457305908203, "global_step": 605012, "epoch": 7289} {"train_loss": -28.04060173034668, "global_step": 605013, "epoch": 7289} {"train_loss": -27.609573364257812, "global_step": 605014, "epoch": 7289} {"train_loss": -28.006921768188477, "global_step": 605015, "epoch": 7289} {"train_loss": -27.798095703125, "global_step": 605016, "epoch": 7289} {"train_loss": -28.060489654541016, "global_step": 605017, "epoch": 7289} {"train_loss": -28.016742706298828, "global_step": 605018, "epoch": 7289} {"train_loss": -27.538867950439453, "global_step": 605019, "epoch": 7289} {"train_loss": -28.099050521850586, "global_step": 605020, "epoch": 7289} {"train_loss": -27.82952880859375, "global_step": 605021, "epoch": 7289} {"train_loss": -27.687658309936523, "global_step": 605022, "epoch": 7289} {"train_loss": -27.800189971923828, "global_step": 605023, "epoch": 7289} {"train_loss": -28.167261123657227, "global_step": 605024, "epoch": 7289} {"train_loss": -28.0228328704834, "global_step": 605025, "epoch": 7289} {"train_loss": -28.308462142944336, "global_step": 605026, "epoch": 7289} {"train_loss": -28.217529296875, "global_step": 605027, "epoch": 7289} {"train_loss": -27.9888916015625, "global_step": 605028, "epoch": 7289} {"train_loss": -28.29499626159668, "global_step": 605029, "epoch": 7289} {"train_loss": -28.04913330078125, "global_step": 605030, "epoch": 7289} {"train_loss": -27.571125030517578, "global_step": 605031, "epoch": 7289} {"train_loss": -28.183622360229492, "global_step": 605032, "epoch": 7289} {"train_loss": -27.882801055908203, "global_step": 605033, "epoch": 7289} {"train_loss": -28.231098175048828, "global_step": 605034, "epoch": 7289} {"train_loss": -28.168912887573242, "global_step": 605035, "epoch": 7289} {"train_loss": -27.937864303588867, "global_step": 605036, "epoch": 7289} {"train_loss": -28.006210327148438, "global_step": 605037, "epoch": 7289} {"train_loss": -28.039655685424805, "global_step": 605038, "epoch": 7289} {"train_loss": -28.043725967407227, "global_step": 605039, "epoch": 7289} {"train_loss": -28.147907257080078, "global_step": 605040, "epoch": 7289} {"train_loss": -28.340606689453125, "global_step": 605041, "epoch": 7289} {"train_loss": -28.582571029663086, "global_step": 605042, "epoch": 7289} {"train_loss": -28.09568214416504, "global_step": 605043, "epoch": 7289} {"train_loss": -28.314481735229492, "global_step": 605044, "epoch": 7289} {"train_loss": -28.127944946289062, "global_step": 605045, "epoch": 7289} {"train_loss": -28.162784576416016, "global_step": 605046, "epoch": 7289} {"train_loss": -28.241052627563477, "global_step": 605047, "epoch": 7289} {"train_loss": -28.51749610900879, "global_step": 605048, "epoch": 7289} {"train_loss": -28.37127113342285, "global_step": 605049, "epoch": 7289} {"train_loss": -28.190540313720703, "global_step": 605050, "epoch": 7289} {"train_loss": -28.43868064880371, "global_step": 605051, "epoch": 7289} {"train_loss": -28.44535255432129, "global_step": 605052, "epoch": 7289} {"train_loss": -28.50141716003418, "global_step": 605053, "epoch": 7289} {"train_loss": -28.401952743530273, "global_step": 605054, "epoch": 7289} {"train_loss": -28.033863067626953, "global_step": 605055, "epoch": 7289} {"train_loss": -27.904321670532227, "global_step": 605056, "epoch": 7289} {"train_loss": -28.217634201049805, "global_step": 605057, "epoch": 7289} {"train_loss": -28.050878524780273, "global_step": 605058, "epoch": 7289} {"train_loss": -28.1359806060791, "global_step": 605059, "epoch": 7289} {"train_loss": -27.888900756835938, "global_step": 605060, "epoch": 7289} {"train_loss": -27.927570343017578, "global_step": 605061, "epoch": 7289} {"train_loss": -28.523239135742188, "global_step": 605062, "epoch": 7289} {"train_loss": -28.055410385131836, "global_step": 605063, "epoch": 7289} {"train_loss": -28.56561851501465, "global_step": 605064, "epoch": 7289} {"train_loss": -27.786712646484375, "global_step": 605065, "epoch": 7289} {"train_loss": -27.648101806640625, "global_step": 605066, "epoch": 7289} {"train_loss": -27.98052406311035, "global_step": 605067, "epoch": 7289} {"train_loss": -28.579120635986328, "global_step": 605068, "epoch": 7289} {"train_loss": -27.878215858735235, "global_step": 605069, "epoch": 7289, "val_loss": 6858572.0} {"train_loss": -26.85357093811035, "global_step": 605070, "epoch": 7290} {"train_loss": -26.47041893005371, "global_step": 605071, "epoch": 7290} {"train_loss": -25.748600006103516, "global_step": 605072, "epoch": 7290} {"train_loss": -25.535579681396484, "global_step": 605073, "epoch": 7290} {"train_loss": -24.998788833618164, "global_step": 605074, "epoch": 7290} {"train_loss": -27.56093406677246, "global_step": 605075, "epoch": 7290} {"train_loss": -25.98653221130371, "global_step": 605076, "epoch": 7290} {"train_loss": -26.222000122070312, "global_step": 605077, "epoch": 7290} {"train_loss": -26.888532638549805, "global_step": 605078, "epoch": 7290} {"train_loss": -26.868640899658203, "global_step": 605079, "epoch": 7290} {"train_loss": -27.094945907592773, "global_step": 605080, "epoch": 7290} {"train_loss": -26.9738712310791, "global_step": 605081, "epoch": 7290} {"train_loss": -26.82508659362793, "global_step": 605082, "epoch": 7290} {"train_loss": -27.0611629486084, "global_step": 605083, "epoch": 7290} {"train_loss": -27.084552764892578, "global_step": 605084, "epoch": 7290} {"train_loss": -27.027912139892578, "global_step": 605085, "epoch": 7290} {"train_loss": -27.41322135925293, "global_step": 605086, "epoch": 7290} {"train_loss": -27.5953426361084, "global_step": 605087, "epoch": 7290} {"train_loss": -27.3995304107666, "global_step": 605088, "epoch": 7290} {"train_loss": -27.4117431640625, "global_step": 605089, "epoch": 7290} {"train_loss": -27.612567901611328, "global_step": 605090, "epoch": 7290} {"train_loss": -27.2110652923584, "global_step": 605091, "epoch": 7290} {"train_loss": -27.363000869750977, "global_step": 605092, "epoch": 7290} {"train_loss": -27.636356353759766, "global_step": 605093, "epoch": 7290} {"train_loss": -27.581008911132812, "global_step": 605094, "epoch": 7290} {"train_loss": -27.310754776000977, "global_step": 605095, "epoch": 7290} {"train_loss": -27.917743682861328, "global_step": 605096, "epoch": 7290} {"train_loss": -27.71760368347168, "global_step": 605097, "epoch": 7290} {"train_loss": -28.03846549987793, "global_step": 605098, "epoch": 7290} {"train_loss": -27.744190216064453, "global_step": 605099, "epoch": 7290} {"train_loss": -27.812482833862305, "global_step": 605100, "epoch": 7290} {"train_loss": -27.80573844909668, "global_step": 605101, "epoch": 7290} {"train_loss": -27.9340877532959, "global_step": 605102, "epoch": 7290} {"train_loss": -27.723112106323242, "global_step": 605103, "epoch": 7290} {"train_loss": -27.82233238220215, "global_step": 605104, "epoch": 7290} {"train_loss": -28.002084732055664, "global_step": 605105, "epoch": 7290} {"train_loss": -27.890119552612305, "global_step": 605106, "epoch": 7290} {"train_loss": -27.79619789123535, "global_step": 605107, "epoch": 7290} {"train_loss": -27.87226676940918, "global_step": 605108, "epoch": 7290} {"train_loss": -27.91997718811035, "global_step": 605109, "epoch": 7290} {"train_loss": -27.74759292602539, "global_step": 605110, "epoch": 7290} {"train_loss": -27.724613189697266, "global_step": 605111, "epoch": 7290} {"train_loss": -27.91228675842285, "global_step": 605112, "epoch": 7290} {"train_loss": -28.399200439453125, "global_step": 605113, "epoch": 7290} {"train_loss": -28.27823257446289, "global_step": 605114, "epoch": 7290} {"train_loss": -27.899215698242188, "global_step": 605115, "epoch": 7290} {"train_loss": -28.22137451171875, "global_step": 605116, "epoch": 7290} {"train_loss": -28.103097915649414, "global_step": 605117, "epoch": 7290} {"train_loss": -28.489370346069336, "global_step": 605118, "epoch": 7290} {"train_loss": -28.555978775024414, "global_step": 605119, "epoch": 7290} {"train_loss": -28.397825241088867, "global_step": 605120, "epoch": 7290} {"train_loss": -28.457889556884766, "global_step": 605121, "epoch": 7290} {"train_loss": -28.321142196655273, "global_step": 605122, "epoch": 7290} {"train_loss": -28.114084243774414, "global_step": 605123, "epoch": 7290} {"train_loss": -28.639026641845703, "global_step": 605124, "epoch": 7290} {"train_loss": -28.483219146728516, "global_step": 605125, "epoch": 7290} {"train_loss": -28.3624210357666, "global_step": 605126, "epoch": 7290} {"train_loss": -28.611682891845703, "global_step": 605127, "epoch": 7290} {"train_loss": -28.265317916870117, "global_step": 605128, "epoch": 7290} {"train_loss": -28.358692169189453, "global_step": 605129, "epoch": 7290} {"train_loss": -28.437854766845703, "global_step": 605130, "epoch": 7290} {"train_loss": -28.429981231689453, "global_step": 605131, "epoch": 7290} {"train_loss": -28.2053279876709, "global_step": 605132, "epoch": 7290} {"train_loss": -28.08148765563965, "global_step": 605133, "epoch": 7290} {"train_loss": -28.376758575439453, "global_step": 605134, "epoch": 7290} {"train_loss": -28.194875717163086, "global_step": 605135, "epoch": 7290} {"train_loss": -28.222803115844727, "global_step": 605136, "epoch": 7290} {"train_loss": -27.977354049682617, "global_step": 605137, "epoch": 7290} {"train_loss": -28.00090980529785, "global_step": 605138, "epoch": 7290} {"train_loss": -28.242584228515625, "global_step": 605139, "epoch": 7290} {"train_loss": -28.248342514038086, "global_step": 605140, "epoch": 7290} {"train_loss": -28.033552169799805, "global_step": 605141, "epoch": 7290} {"train_loss": -28.529220581054688, "global_step": 605142, "epoch": 7290} {"train_loss": -28.16948890686035, "global_step": 605143, "epoch": 7290} {"train_loss": -28.51492691040039, "global_step": 605144, "epoch": 7290} {"train_loss": -28.353723526000977, "global_step": 605145, "epoch": 7290} {"train_loss": -28.49564552307129, "global_step": 605146, "epoch": 7290} {"train_loss": -28.191144943237305, "global_step": 605147, "epoch": 7290} {"train_loss": -28.34588623046875, "global_step": 605148, "epoch": 7290} {"train_loss": -27.964563369750977, "global_step": 605149, "epoch": 7290} {"train_loss": -28.2869873046875, "global_step": 605150, "epoch": 7290} {"train_loss": -27.68184471130371, "global_step": 605151, "epoch": 7290} {"train_loss": -27.746222277721728, "global_step": 605152, "epoch": 7290, "val_loss": 6767391.0} {"train_loss": -27.363189697265625, "global_step": 605153, "epoch": 7291} {"train_loss": -26.889678955078125, "global_step": 605154, "epoch": 7291} {"train_loss": -27.54245376586914, "global_step": 605155, "epoch": 7291} {"train_loss": -26.26543617248535, "global_step": 605156, "epoch": 7291} {"train_loss": -26.86453628540039, "global_step": 605157, "epoch": 7291} {"train_loss": -27.602813720703125, "global_step": 605158, "epoch": 7291} {"train_loss": -26.031705856323242, "global_step": 605159, "epoch": 7291} {"train_loss": -26.51018714904785, "global_step": 605160, "epoch": 7291} {"train_loss": -26.550338745117188, "global_step": 605161, "epoch": 7291} {"train_loss": -27.141742706298828, "global_step": 605162, "epoch": 7291} {"train_loss": -26.822179794311523, "global_step": 605163, "epoch": 7291} {"train_loss": -27.110458374023438, "global_step": 605164, "epoch": 7291} {"train_loss": -27.1749210357666, "global_step": 605165, "epoch": 7291} {"train_loss": -27.533369064331055, "global_step": 605166, "epoch": 7291} {"train_loss": -27.124826431274414, "global_step": 605167, "epoch": 7291} {"train_loss": -27.43511390686035, "global_step": 605168, "epoch": 7291} {"train_loss": -27.363805770874023, "global_step": 605169, "epoch": 7291} {"train_loss": -27.591970443725586, "global_step": 605170, "epoch": 7291} {"train_loss": -27.509662628173828, "global_step": 605171, "epoch": 7291} {"train_loss": -27.486902236938477, "global_step": 605172, "epoch": 7291} {"train_loss": -27.392414093017578, "global_step": 605173, "epoch": 7291} {"train_loss": -27.48026466369629, "global_step": 605174, "epoch": 7291} {"train_loss": -27.7015323638916, "global_step": 605175, "epoch": 7291} {"train_loss": -27.883716583251953, "global_step": 605176, "epoch": 7291} {"train_loss": -27.80409812927246, "global_step": 605177, "epoch": 7291} {"train_loss": -27.60597801208496, "global_step": 605178, "epoch": 7291} {"train_loss": -27.98073387145996, "global_step": 605179, "epoch": 7291} {"train_loss": -27.83500099182129, "global_step": 605180, "epoch": 7291} {"train_loss": -27.843402862548828, "global_step": 605181, "epoch": 7291} {"train_loss": -27.562210083007812, "global_step": 605182, "epoch": 7291} {"train_loss": -27.653339385986328, "global_step": 605183, "epoch": 7291} {"train_loss": -28.060653686523438, "global_step": 605184, "epoch": 7291} {"train_loss": -28.110275268554688, "global_step": 605185, "epoch": 7291} {"train_loss": -27.9754638671875, "global_step": 605186, "epoch": 7291} {"train_loss": -27.779327392578125, "global_step": 605187, "epoch": 7291} {"train_loss": -27.969812393188477, "global_step": 605188, "epoch": 7291} {"train_loss": -27.722518920898438, "global_step": 605189, "epoch": 7291} {"train_loss": -27.889013290405273, "global_step": 605190, "epoch": 7291} {"train_loss": -27.744443893432617, "global_step": 605191, "epoch": 7291} {"train_loss": -27.796375274658203, "global_step": 605192, "epoch": 7291} {"train_loss": -28.02772331237793, "global_step": 605193, "epoch": 7291} {"train_loss": -28.11141014099121, "global_step": 605194, "epoch": 7291} {"train_loss": -28.428974151611328, "global_step": 605195, "epoch": 7291} {"train_loss": -28.009998321533203, "global_step": 605196, "epoch": 7291} {"train_loss": -28.02650260925293, "global_step": 605197, "epoch": 7291} {"train_loss": -27.841787338256836, "global_step": 605198, "epoch": 7291} {"train_loss": -28.11661720275879, "global_step": 605199, "epoch": 7291} {"train_loss": -28.308368682861328, "global_step": 605200, "epoch": 7291} {"train_loss": -28.198108673095703, "global_step": 605201, "epoch": 7291} {"train_loss": -27.883834838867188, "global_step": 605202, "epoch": 7291} {"train_loss": -28.063291549682617, "global_step": 605203, "epoch": 7291} {"train_loss": -28.083532333374023, "global_step": 605204, "epoch": 7291} {"train_loss": -28.350805282592773, "global_step": 605205, "epoch": 7291} {"train_loss": -28.27107048034668, "global_step": 605206, "epoch": 7291} {"train_loss": -27.999042510986328, "global_step": 605207, "epoch": 7291} {"train_loss": -28.001203536987305, "global_step": 605208, "epoch": 7291} {"train_loss": -28.03900718688965, "global_step": 605209, "epoch": 7291} {"train_loss": -28.28720474243164, "global_step": 605210, "epoch": 7291} {"train_loss": -28.092878341674805, "global_step": 605211, "epoch": 7291} {"train_loss": -28.183582305908203, "global_step": 605212, "epoch": 7291} {"train_loss": -28.57900047302246, "global_step": 605213, "epoch": 7291} {"train_loss": -27.813024520874023, "global_step": 605214, "epoch": 7291} {"train_loss": -27.9277286529541, "global_step": 605215, "epoch": 7291} {"train_loss": -28.379749298095703, "global_step": 605216, "epoch": 7291} {"train_loss": -28.00714683532715, "global_step": 605217, "epoch": 7291} {"train_loss": -28.676742553710938, "global_step": 605218, "epoch": 7291} {"train_loss": -28.45430564880371, "global_step": 605219, "epoch": 7291} {"train_loss": -28.12335205078125, "global_step": 605220, "epoch": 7291} {"train_loss": -28.352130889892578, "global_step": 605221, "epoch": 7291} {"train_loss": -28.461929321289062, "global_step": 605222, "epoch": 7291} {"train_loss": -28.268033981323242, "global_step": 605223, "epoch": 7291} {"train_loss": -28.163944244384766, "global_step": 605224, "epoch": 7291} {"train_loss": -28.322973251342773, "global_step": 605225, "epoch": 7291} {"train_loss": -28.016454696655273, "global_step": 605226, "epoch": 7291} {"train_loss": -28.110509872436523, "global_step": 605227, "epoch": 7291} {"train_loss": -28.315343856811523, "global_step": 605228, "epoch": 7291} {"train_loss": -28.272449493408203, "global_step": 605229, "epoch": 7291} {"train_loss": -28.03179359436035, "global_step": 605230, "epoch": 7291} {"train_loss": -28.135578155517578, "global_step": 605231, "epoch": 7291} {"train_loss": -28.09393882751465, "global_step": 605232, "epoch": 7291} {"train_loss": -28.605976104736328, "global_step": 605233, "epoch": 7291} {"train_loss": -28.50787353515625, "global_step": 605234, "epoch": 7291} {"train_loss": -27.820174113813653, "global_step": 605235, "epoch": 7291, "val_loss": 6699184.5} {"train_loss": -27.96952247619629, "global_step": 605236, "epoch": 7292} {"train_loss": -27.677404403686523, "global_step": 605237, "epoch": 7292} {"train_loss": -27.83139991760254, "global_step": 605238, "epoch": 7292} {"train_loss": -27.892719268798828, "global_step": 605239, "epoch": 7292} {"train_loss": -27.869586944580078, "global_step": 605240, "epoch": 7292} {"train_loss": -27.7992000579834, "global_step": 605241, "epoch": 7292} {"train_loss": -28.09412956237793, "global_step": 605242, "epoch": 7292} {"train_loss": -27.687286376953125, "global_step": 605243, "epoch": 7292} {"train_loss": -28.003620147705078, "global_step": 605244, "epoch": 7292} {"train_loss": -28.30645179748535, "global_step": 605245, "epoch": 7292} {"train_loss": -27.886640548706055, "global_step": 605246, "epoch": 7292} {"train_loss": -28.022510528564453, "global_step": 605247, "epoch": 7292} {"train_loss": -27.6552677154541, "global_step": 605248, "epoch": 7292} {"train_loss": -28.129663467407227, "global_step": 605249, "epoch": 7292} {"train_loss": -28.152109146118164, "global_step": 605250, "epoch": 7292} {"train_loss": -28.107025146484375, "global_step": 605251, "epoch": 7292} {"train_loss": -28.244403839111328, "global_step": 605252, "epoch": 7292} {"train_loss": -27.826892852783203, "global_step": 605253, "epoch": 7292} {"train_loss": -27.919952392578125, "global_step": 605254, "epoch": 7292} {"train_loss": -27.9715518951416, "global_step": 605255, "epoch": 7292} {"train_loss": -28.314441680908203, "global_step": 605256, "epoch": 7292} {"train_loss": -27.815658569335938, "global_step": 605257, "epoch": 7292} {"train_loss": -27.947341918945312, "global_step": 605258, "epoch": 7292} {"train_loss": -28.36855125427246, "global_step": 605259, "epoch": 7292} {"train_loss": -27.823043823242188, "global_step": 605260, "epoch": 7292} {"train_loss": -27.807214736938477, "global_step": 605261, "epoch": 7292} {"train_loss": -27.862674713134766, "global_step": 605262, "epoch": 7292} {"train_loss": -27.898710250854492, "global_step": 605263, "epoch": 7292} {"train_loss": -27.987049102783203, "global_step": 605264, "epoch": 7292} {"train_loss": -28.028467178344727, "global_step": 605265, "epoch": 7292} {"train_loss": -28.280073165893555, "global_step": 605266, "epoch": 7292} {"train_loss": -27.97516441345215, "global_step": 605267, "epoch": 7292} {"train_loss": -27.967329025268555, "global_step": 605268, "epoch": 7292} {"train_loss": -28.201862335205078, "global_step": 605269, "epoch": 7292} {"train_loss": -27.97919273376465, "global_step": 605270, "epoch": 7292} {"train_loss": -28.024038314819336, "global_step": 605271, "epoch": 7292} {"train_loss": -28.064733505249023, "global_step": 605272, "epoch": 7292} {"train_loss": -27.9249267578125, "global_step": 605273, "epoch": 7292} {"train_loss": -27.84864616394043, "global_step": 605274, "epoch": 7292} {"train_loss": -27.84539222717285, "global_step": 605275, "epoch": 7292} {"train_loss": -27.851850509643555, "global_step": 605276, "epoch": 7292} {"train_loss": -28.2374210357666, "global_step": 605277, "epoch": 7292} {"train_loss": -28.368886947631836, "global_step": 605278, "epoch": 7292} {"train_loss": -27.234222412109375, "global_step": 605279, "epoch": 7292} {"train_loss": -27.946226119995117, "global_step": 605280, "epoch": 7292} {"train_loss": -27.39606285095215, "global_step": 605281, "epoch": 7292} {"train_loss": -28.0634765625, "global_step": 605282, "epoch": 7292} {"train_loss": -27.80889892578125, "global_step": 605283, "epoch": 7292} {"train_loss": -27.33099937438965, "global_step": 605284, "epoch": 7292} {"train_loss": -28.122655868530273, "global_step": 605285, "epoch": 7292} {"train_loss": -27.492475509643555, "global_step": 605286, "epoch": 7292} {"train_loss": -27.5435791015625, "global_step": 605287, "epoch": 7292} {"train_loss": -27.795263290405273, "global_step": 605288, "epoch": 7292} {"train_loss": -27.829822540283203, "global_step": 605289, "epoch": 7292} {"train_loss": -27.71185302734375, "global_step": 605290, "epoch": 7292} {"train_loss": -27.81342887878418, "global_step": 605291, "epoch": 7292} {"train_loss": -27.693220138549805, "global_step": 605292, "epoch": 7292} {"train_loss": -28.070302963256836, "global_step": 605293, "epoch": 7292} {"train_loss": -27.886343002319336, "global_step": 605294, "epoch": 7292} {"train_loss": -27.70777702331543, "global_step": 605295, "epoch": 7292} {"train_loss": -27.812177658081055, "global_step": 605296, "epoch": 7292} {"train_loss": -28.0699462890625, "global_step": 605297, "epoch": 7292} {"train_loss": -27.890485763549805, "global_step": 605298, "epoch": 7292} {"train_loss": -28.15814781188965, "global_step": 605299, "epoch": 7292} {"train_loss": -28.2011775970459, "global_step": 605300, "epoch": 7292} {"train_loss": -28.102514266967773, "global_step": 605301, "epoch": 7292} {"train_loss": -28.1030216217041, "global_step": 605302, "epoch": 7292} {"train_loss": -28.196426391601562, "global_step": 605303, "epoch": 7292} {"train_loss": -28.178205490112305, "global_step": 605304, "epoch": 7292} {"train_loss": -28.21243667602539, "global_step": 605305, "epoch": 7292} {"train_loss": -28.34210777282715, "global_step": 605306, "epoch": 7292} {"train_loss": -27.8995361328125, "global_step": 605307, "epoch": 7292} {"train_loss": -28.1844482421875, "global_step": 605308, "epoch": 7292} {"train_loss": -28.1841983795166, "global_step": 605309, "epoch": 7292} {"train_loss": -28.213272094726562, "global_step": 605310, "epoch": 7292} {"train_loss": -28.302148818969727, "global_step": 605311, "epoch": 7292} {"train_loss": -28.37677001953125, "global_step": 605312, "epoch": 7292} {"train_loss": -28.32295036315918, "global_step": 605313, "epoch": 7292} {"train_loss": -28.257932662963867, "global_step": 605314, "epoch": 7292} {"train_loss": -28.294464111328125, "global_step": 605315, "epoch": 7292} {"train_loss": -28.3062801361084, "global_step": 605316, "epoch": 7292} {"train_loss": -28.173959732055664, "global_step": 605317, "epoch": 7292} {"train_loss": -27.98988266450813, "global_step": 605318, "epoch": 7292, "val_loss": 6727485.5} {"train_loss": -28.039213180541992, "global_step": 605319, "epoch": 7293} {"train_loss": -27.792490005493164, "global_step": 605320, "epoch": 7293} {"train_loss": -27.996597290039062, "global_step": 605321, "epoch": 7293} {"train_loss": -27.862628936767578, "global_step": 605322, "epoch": 7293} {"train_loss": -28.091318130493164, "global_step": 605323, "epoch": 7293} {"train_loss": -28.035245895385742, "global_step": 605324, "epoch": 7293} {"train_loss": -28.31585121154785, "global_step": 605325, "epoch": 7293} {"train_loss": -27.697620391845703, "global_step": 605326, "epoch": 7293} {"train_loss": -27.728729248046875, "global_step": 605327, "epoch": 7293} {"train_loss": -28.020376205444336, "global_step": 605328, "epoch": 7293} {"train_loss": -28.134122848510742, "global_step": 605329, "epoch": 7293} {"train_loss": -27.869415283203125, "global_step": 605330, "epoch": 7293} {"train_loss": -27.95965003967285, "global_step": 605331, "epoch": 7293} {"train_loss": -27.559234619140625, "global_step": 605332, "epoch": 7293} {"train_loss": -27.796955108642578, "global_step": 605333, "epoch": 7293} {"train_loss": -27.700586318969727, "global_step": 605334, "epoch": 7293} {"train_loss": -27.76966667175293, "global_step": 605335, "epoch": 7293} {"train_loss": -27.901132583618164, "global_step": 605336, "epoch": 7293} {"train_loss": -27.63275146484375, "global_step": 605337, "epoch": 7293} {"train_loss": -28.240650177001953, "global_step": 605338, "epoch": 7293} {"train_loss": -27.709104537963867, "global_step": 605339, "epoch": 7293} {"train_loss": -27.84583854675293, "global_step": 605340, "epoch": 7293} {"train_loss": -27.607208251953125, "global_step": 605341, "epoch": 7293} {"train_loss": -27.74806022644043, "global_step": 605342, "epoch": 7293} {"train_loss": -28.093875885009766, "global_step": 605343, "epoch": 7293} {"train_loss": -27.95819664001465, "global_step": 605344, "epoch": 7293} {"train_loss": -27.733688354492188, "global_step": 605345, "epoch": 7293} {"train_loss": -27.971342086791992, "global_step": 605346, "epoch": 7293} {"train_loss": -27.55398941040039, "global_step": 605347, "epoch": 7293} {"train_loss": -28.252408981323242, "global_step": 605348, "epoch": 7293} {"train_loss": -28.123388290405273, "global_step": 605349, "epoch": 7293} {"train_loss": -27.89522361755371, "global_step": 605350, "epoch": 7293} {"train_loss": -28.105344772338867, "global_step": 605351, "epoch": 7293} {"train_loss": -27.862476348876953, "global_step": 605352, "epoch": 7293} {"train_loss": -28.32349967956543, "global_step": 605353, "epoch": 7293} {"train_loss": -28.123388290405273, "global_step": 605354, "epoch": 7293} {"train_loss": -28.269968032836914, "global_step": 605355, "epoch": 7293} {"train_loss": -28.205236434936523, "global_step": 605356, "epoch": 7293} {"train_loss": -27.864063262939453, "global_step": 605357, "epoch": 7293} {"train_loss": -27.91400718688965, "global_step": 605358, "epoch": 7293} {"train_loss": -28.220233917236328, "global_step": 605359, "epoch": 7293} {"train_loss": -28.044042587280273, "global_step": 605360, "epoch": 7293} {"train_loss": -28.4044246673584, "global_step": 605361, "epoch": 7293} {"train_loss": -28.1121768951416, "global_step": 605362, "epoch": 7293} {"train_loss": -27.8726749420166, "global_step": 605363, "epoch": 7293} {"train_loss": -28.289783477783203, "global_step": 605364, "epoch": 7293} {"train_loss": -28.266864776611328, "global_step": 605365, "epoch": 7293} {"train_loss": -28.1002140045166, "global_step": 605366, "epoch": 7293} {"train_loss": -28.310510635375977, "global_step": 605367, "epoch": 7293} {"train_loss": -28.317468643188477, "global_step": 605368, "epoch": 7293} {"train_loss": -28.1158504486084, "global_step": 605369, "epoch": 7293} {"train_loss": -27.930891036987305, "global_step": 605370, "epoch": 7293} {"train_loss": -28.472564697265625, "global_step": 605371, "epoch": 7293} {"train_loss": -27.921483993530273, "global_step": 605372, "epoch": 7293} {"train_loss": -28.286258697509766, "global_step": 605373, "epoch": 7293} {"train_loss": -28.28577995300293, "global_step": 605374, "epoch": 7293} {"train_loss": -28.151264190673828, "global_step": 605375, "epoch": 7293} {"train_loss": -28.00067138671875, "global_step": 605376, "epoch": 7293} {"train_loss": -28.06317710876465, "global_step": 605377, "epoch": 7293} {"train_loss": -28.169477462768555, "global_step": 605378, "epoch": 7293} {"train_loss": -28.307764053344727, "global_step": 605379, "epoch": 7293} {"train_loss": -28.252613067626953, "global_step": 605380, "epoch": 7293} {"train_loss": -28.035785675048828, "global_step": 605381, "epoch": 7293} {"train_loss": -27.845233917236328, "global_step": 605382, "epoch": 7293} {"train_loss": -27.470556259155273, "global_step": 605383, "epoch": 7293} {"train_loss": -27.140356063842773, "global_step": 605384, "epoch": 7293} {"train_loss": -27.2658634185791, "global_step": 605385, "epoch": 7293} {"train_loss": -27.470111846923828, "global_step": 605386, "epoch": 7293} {"train_loss": -27.98089027404785, "global_step": 605387, "epoch": 7293} {"train_loss": -27.592666625976562, "global_step": 605388, "epoch": 7293} {"train_loss": -27.512548446655273, "global_step": 605389, "epoch": 7293} {"train_loss": -28.29317283630371, "global_step": 605390, "epoch": 7293} {"train_loss": -27.614593505859375, "global_step": 605391, "epoch": 7293} {"train_loss": -28.022607803344727, "global_step": 605392, "epoch": 7293} {"train_loss": -27.933629989624023, "global_step": 605393, "epoch": 7293} {"train_loss": -28.136579513549805, "global_step": 605394, "epoch": 7293} {"train_loss": -27.927017211914062, "global_step": 605395, "epoch": 7293} {"train_loss": -27.870630264282227, "global_step": 605396, "epoch": 7293} {"train_loss": -28.34626579284668, "global_step": 605397, "epoch": 7293} {"train_loss": -27.57709312438965, "global_step": 605398, "epoch": 7293} {"train_loss": -27.767608642578125, "global_step": 605399, "epoch": 7293} {"train_loss": -27.962324142456055, "global_step": 605400, "epoch": 7293} {"train_loss": -27.97108452578625, "global_step": 605401, "epoch": 7293, "val_loss": 6604892.0} {"train_loss": -27.638708114624023, "global_step": 605402, "epoch": 7294} {"train_loss": -27.206953048706055, "global_step": 605403, "epoch": 7294} {"train_loss": -27.110488891601562, "global_step": 605404, "epoch": 7294} {"train_loss": -27.2073917388916, "global_step": 605405, "epoch": 7294} {"train_loss": -27.362531661987305, "global_step": 605406, "epoch": 7294} {"train_loss": -27.639585494995117, "global_step": 605407, "epoch": 7294} {"train_loss": -27.489160537719727, "global_step": 605408, "epoch": 7294} {"train_loss": -27.317596435546875, "global_step": 605409, "epoch": 7294} {"train_loss": -27.322912216186523, "global_step": 605410, "epoch": 7294} {"train_loss": -27.5772705078125, "global_step": 605411, "epoch": 7294} {"train_loss": -27.379032135009766, "global_step": 605412, "epoch": 7294} {"train_loss": -27.26161003112793, "global_step": 605413, "epoch": 7294} {"train_loss": -27.308990478515625, "global_step": 605414, "epoch": 7294} {"train_loss": -27.40180015563965, "global_step": 605415, "epoch": 7294} {"train_loss": -27.610767364501953, "global_step": 605416, "epoch": 7294} {"train_loss": -27.73032569885254, "global_step": 605417, "epoch": 7294} {"train_loss": -27.13568687438965, "global_step": 605418, "epoch": 7294} {"train_loss": -27.034997940063477, "global_step": 605419, "epoch": 7294} {"train_loss": -27.783172607421875, "global_step": 605420, "epoch": 7294} {"train_loss": -27.472797393798828, "global_step": 605421, "epoch": 7294} {"train_loss": -27.521787643432617, "global_step": 605422, "epoch": 7294} {"train_loss": -27.75886344909668, "global_step": 605423, "epoch": 7294} {"train_loss": -27.930978775024414, "global_step": 605424, "epoch": 7294} {"train_loss": -27.764450073242188, "global_step": 605425, "epoch": 7294} {"train_loss": -27.6944580078125, "global_step": 605426, "epoch": 7294} {"train_loss": -27.81194496154785, "global_step": 605427, "epoch": 7294} {"train_loss": -27.953794479370117, "global_step": 605428, "epoch": 7294} {"train_loss": -27.788297653198242, "global_step": 605429, "epoch": 7294} {"train_loss": -27.935388565063477, "global_step": 605430, "epoch": 7294} {"train_loss": -28.0799617767334, "global_step": 605431, "epoch": 7294} {"train_loss": -27.73427391052246, "global_step": 605432, "epoch": 7294} {"train_loss": -28.06743812561035, "global_step": 605433, "epoch": 7294} {"train_loss": -28.26386833190918, "global_step": 605434, "epoch": 7294} {"train_loss": -28.317707061767578, "global_step": 605435, "epoch": 7294} {"train_loss": -27.868188858032227, "global_step": 605436, "epoch": 7294} {"train_loss": -27.959829330444336, "global_step": 605437, "epoch": 7294} {"train_loss": -27.800535202026367, "global_step": 605438, "epoch": 7294} {"train_loss": -27.892240524291992, "global_step": 605439, "epoch": 7294} {"train_loss": -28.326642990112305, "global_step": 605440, "epoch": 7294} {"train_loss": -27.951932907104492, "global_step": 605441, "epoch": 7294} {"train_loss": -28.5932559967041, "global_step": 605442, "epoch": 7294} {"train_loss": -28.3384952545166, "global_step": 605443, "epoch": 7294} {"train_loss": -27.89661979675293, "global_step": 605444, "epoch": 7294} {"train_loss": -28.2425479888916, "global_step": 605445, "epoch": 7294} {"train_loss": -28.11733055114746, "global_step": 605446, "epoch": 7294} {"train_loss": -28.241657257080078, "global_step": 605447, "epoch": 7294} {"train_loss": -28.27066421508789, "global_step": 605448, "epoch": 7294} {"train_loss": -28.438180923461914, "global_step": 605449, "epoch": 7294} {"train_loss": -27.96988868713379, "global_step": 605450, "epoch": 7294} {"train_loss": -27.978546142578125, "global_step": 605451, "epoch": 7294} {"train_loss": -27.9854736328125, "global_step": 605452, "epoch": 7294} {"train_loss": -28.220447540283203, "global_step": 605453, "epoch": 7294} {"train_loss": -28.090322494506836, "global_step": 605454, "epoch": 7294} {"train_loss": -28.666046142578125, "global_step": 605455, "epoch": 7294} {"train_loss": -28.22601890563965, "global_step": 605456, "epoch": 7294} {"train_loss": -28.25457191467285, "global_step": 605457, "epoch": 7294} {"train_loss": -28.44771385192871, "global_step": 605458, "epoch": 7294} {"train_loss": -28.07819938659668, "global_step": 605459, "epoch": 7294} {"train_loss": -28.23381996154785, "global_step": 605460, "epoch": 7294} {"train_loss": -27.966379165649414, "global_step": 605461, "epoch": 7294} {"train_loss": -28.304523468017578, "global_step": 605462, "epoch": 7294} {"train_loss": -27.43340492248535, "global_step": 605463, "epoch": 7294} {"train_loss": -27.91387367248535, "global_step": 605464, "epoch": 7294} {"train_loss": -28.356128692626953, "global_step": 605465, "epoch": 7294} {"train_loss": -28.319849014282227, "global_step": 605466, "epoch": 7294} {"train_loss": -28.11138343811035, "global_step": 605467, "epoch": 7294} {"train_loss": -28.334211349487305, "global_step": 605468, "epoch": 7294} {"train_loss": -28.260183334350586, "global_step": 605469, "epoch": 7294} {"train_loss": -28.07099723815918, "global_step": 605470, "epoch": 7294} {"train_loss": -27.681949615478516, "global_step": 605471, "epoch": 7294} {"train_loss": -27.830978393554688, "global_step": 605472, "epoch": 7294} {"train_loss": -28.3094482421875, "global_step": 605473, "epoch": 7294} {"train_loss": -28.204320907592773, "global_step": 605474, "epoch": 7294} {"train_loss": -27.727331161499023, "global_step": 605475, "epoch": 7294} {"train_loss": -28.010705947875977, "global_step": 605476, "epoch": 7294} {"train_loss": -28.243650436401367, "global_step": 605477, "epoch": 7294} {"train_loss": -27.700531005859375, "global_step": 605478, "epoch": 7294} {"train_loss": -28.337799072265625, "global_step": 605479, "epoch": 7294} {"train_loss": -28.06024169921875, "global_step": 605480, "epoch": 7294} {"train_loss": -27.512800216674805, "global_step": 605481, "epoch": 7294} {"train_loss": -27.331830978393555, "global_step": 605482, "epoch": 7294} {"train_loss": -27.834930419921875, "global_step": 605483, "epoch": 7294} {"train_loss": -27.872416140085242, "global_step": 605484, "epoch": 7294, "val_loss": 6744424.0} {"train_loss": -27.819738388061523, "global_step": 605485, "epoch": 7295} {"train_loss": -27.418664932250977, "global_step": 605486, "epoch": 7295} {"train_loss": -26.824542999267578, "global_step": 605487, "epoch": 7295} {"train_loss": -27.3113956451416, "global_step": 605488, "epoch": 7295} {"train_loss": -27.590900421142578, "global_step": 605489, "epoch": 7295} {"train_loss": -27.644855499267578, "global_step": 605490, "epoch": 7295} {"train_loss": -27.33560562133789, "global_step": 605491, "epoch": 7295} {"train_loss": -27.54816246032715, "global_step": 605492, "epoch": 7295} {"train_loss": -27.757816314697266, "global_step": 605493, "epoch": 7295} {"train_loss": -27.354745864868164, "global_step": 605494, "epoch": 7295} {"train_loss": -27.66510009765625, "global_step": 605495, "epoch": 7295} {"train_loss": -28.0765438079834, "global_step": 605496, "epoch": 7295} {"train_loss": -27.697559356689453, "global_step": 605497, "epoch": 7295} {"train_loss": -27.819080352783203, "global_step": 605498, "epoch": 7295} {"train_loss": -27.86916160583496, "global_step": 605499, "epoch": 7295} {"train_loss": -28.047998428344727, "global_step": 605500, "epoch": 7295} {"train_loss": -28.156850814819336, "global_step": 605501, "epoch": 7295} {"train_loss": -27.90887451171875, "global_step": 605502, "epoch": 7295} {"train_loss": -28.1400203704834, "global_step": 605503, "epoch": 7295} {"train_loss": -28.071491241455078, "global_step": 605504, "epoch": 7295} {"train_loss": -27.536901473999023, "global_step": 605505, "epoch": 7295} {"train_loss": -28.02973747253418, "global_step": 605506, "epoch": 7295} {"train_loss": -28.50594139099121, "global_step": 605507, "epoch": 7295} {"train_loss": -28.302167892456055, "global_step": 605508, "epoch": 7295} {"train_loss": -28.3048152923584, "global_step": 605509, "epoch": 7295} {"train_loss": -28.37957191467285, "global_step": 605510, "epoch": 7295} {"train_loss": -28.21199607849121, "global_step": 605511, "epoch": 7295} {"train_loss": -28.30109214782715, "global_step": 605512, "epoch": 7295} {"train_loss": -28.29353904724121, "global_step": 605513, "epoch": 7295} {"train_loss": -28.082334518432617, "global_step": 605514, "epoch": 7295} {"train_loss": -27.965290069580078, "global_step": 605515, "epoch": 7295} {"train_loss": -27.718122482299805, "global_step": 605516, "epoch": 7295} {"train_loss": -28.33819580078125, "global_step": 605517, "epoch": 7295} {"train_loss": -28.305784225463867, "global_step": 605518, "epoch": 7295} {"train_loss": -28.0697021484375, "global_step": 605519, "epoch": 7295} {"train_loss": -28.189069747924805, "global_step": 605520, "epoch": 7295} {"train_loss": -28.388446807861328, "global_step": 605521, "epoch": 7295} {"train_loss": -28.172321319580078, "global_step": 605522, "epoch": 7295} {"train_loss": -28.078460693359375, "global_step": 605523, "epoch": 7295} {"train_loss": -28.203216552734375, "global_step": 605524, "epoch": 7295} {"train_loss": -28.26490592956543, "global_step": 605525, "epoch": 7295} {"train_loss": -28.31727409362793, "global_step": 605526, "epoch": 7295} {"train_loss": -28.095579147338867, "global_step": 605527, "epoch": 7295} {"train_loss": -27.774877548217773, "global_step": 605528, "epoch": 7295} {"train_loss": -28.125049591064453, "global_step": 605529, "epoch": 7295} {"train_loss": -27.886972427368164, "global_step": 605530, "epoch": 7295} {"train_loss": -27.976598739624023, "global_step": 605531, "epoch": 7295} {"train_loss": -27.728803634643555, "global_step": 605532, "epoch": 7295} {"train_loss": -28.239776611328125, "global_step": 605533, "epoch": 7295} {"train_loss": -28.104339599609375, "global_step": 605534, "epoch": 7295} {"train_loss": -27.866376876831055, "global_step": 605535, "epoch": 7295} {"train_loss": -28.28724479675293, "global_step": 605536, "epoch": 7295} {"train_loss": -28.098257064819336, "global_step": 605537, "epoch": 7295} {"train_loss": -28.012983322143555, "global_step": 605538, "epoch": 7295} {"train_loss": -28.126312255859375, "global_step": 605539, "epoch": 7295} {"train_loss": -28.20745277404785, "global_step": 605540, "epoch": 7295} {"train_loss": -28.11037254333496, "global_step": 605541, "epoch": 7295} {"train_loss": -27.865869522094727, "global_step": 605542, "epoch": 7295} {"train_loss": -27.96571159362793, "global_step": 605543, "epoch": 7295} {"train_loss": -28.026769638061523, "global_step": 605544, "epoch": 7295} {"train_loss": -28.244476318359375, "global_step": 605545, "epoch": 7295} {"train_loss": -28.168970108032227, "global_step": 605546, "epoch": 7295} {"train_loss": -27.79425621032715, "global_step": 605547, "epoch": 7295} {"train_loss": -28.134963989257812, "global_step": 605548, "epoch": 7295} {"train_loss": -27.995283126831055, "global_step": 605549, "epoch": 7295} {"train_loss": -27.89063835144043, "global_step": 605550, "epoch": 7295} {"train_loss": -27.570526123046875, "global_step": 605551, "epoch": 7295} {"train_loss": -27.533206939697266, "global_step": 605552, "epoch": 7295} {"train_loss": -27.593801498413086, "global_step": 605553, "epoch": 7295} {"train_loss": -27.948896408081055, "global_step": 605554, "epoch": 7295} {"train_loss": -27.72259521484375, "global_step": 605555, "epoch": 7295} {"train_loss": -27.64289665222168, "global_step": 605556, "epoch": 7295} {"train_loss": -27.427169799804688, "global_step": 605557, "epoch": 7295} {"train_loss": -27.603153228759766, "global_step": 605558, "epoch": 7295} {"train_loss": -27.922515869140625, "global_step": 605559, "epoch": 7295} {"train_loss": -28.056900024414062, "global_step": 605560, "epoch": 7295} {"train_loss": -27.20949363708496, "global_step": 605561, "epoch": 7295} {"train_loss": -27.5965633392334, "global_step": 605562, "epoch": 7295} {"train_loss": -27.751150131225586, "global_step": 605563, "epoch": 7295} {"train_loss": -27.88416862487793, "global_step": 605564, "epoch": 7295} {"train_loss": -27.732837677001953, "global_step": 605565, "epoch": 7295} {"train_loss": -28.11567497253418, "global_step": 605566, "epoch": 7295} {"train_loss": -27.934306271104926, "global_step": 605567, "epoch": 7295, "val_loss": 6750591.0} {"train_loss": -27.525358200073242, "global_step": 605568, "epoch": 7296} {"train_loss": -27.9559326171875, "global_step": 605569, "epoch": 7296} {"train_loss": -27.524518966674805, "global_step": 605570, "epoch": 7296} {"train_loss": -27.440448760986328, "global_step": 605571, "epoch": 7296} {"train_loss": -27.5643310546875, "global_step": 605572, "epoch": 7296} {"train_loss": -27.82429313659668, "global_step": 605573, "epoch": 7296} {"train_loss": -27.885879516601562, "global_step": 605574, "epoch": 7296} {"train_loss": -27.54886245727539, "global_step": 605575, "epoch": 7296} {"train_loss": -27.459585189819336, "global_step": 605576, "epoch": 7296} {"train_loss": -27.372577667236328, "global_step": 605577, "epoch": 7296} {"train_loss": -27.68753433227539, "global_step": 605578, "epoch": 7296} {"train_loss": -27.75543785095215, "global_step": 605579, "epoch": 7296} {"train_loss": -27.700546264648438, "global_step": 605580, "epoch": 7296} {"train_loss": -27.408435821533203, "global_step": 605581, "epoch": 7296} {"train_loss": -28.133575439453125, "global_step": 605582, "epoch": 7296} {"train_loss": -27.4854736328125, "global_step": 605583, "epoch": 7296} {"train_loss": -27.904077529907227, "global_step": 605584, "epoch": 7296} {"train_loss": -27.733610153198242, "global_step": 605585, "epoch": 7296} {"train_loss": -27.75776481628418, "global_step": 605586, "epoch": 7296} {"train_loss": -27.668781280517578, "global_step": 605587, "epoch": 7296} {"train_loss": -27.844663619995117, "global_step": 605588, "epoch": 7296} {"train_loss": -28.019445419311523, "global_step": 605589, "epoch": 7296} {"train_loss": -27.96044921875, "global_step": 605590, "epoch": 7296} {"train_loss": -27.6297664642334, "global_step": 605591, "epoch": 7296} {"train_loss": -28.18463134765625, "global_step": 605592, "epoch": 7296} {"train_loss": -27.866104125976562, "global_step": 605593, "epoch": 7296} {"train_loss": -27.800939559936523, "global_step": 605594, "epoch": 7296} {"train_loss": -28.08078384399414, "global_step": 605595, "epoch": 7296} {"train_loss": -28.185077667236328, "global_step": 605596, "epoch": 7296} {"train_loss": -28.09473991394043, "global_step": 605597, "epoch": 7296} {"train_loss": -28.143753051757812, "global_step": 605598, "epoch": 7296} {"train_loss": -27.921125411987305, "global_step": 605599, "epoch": 7296} {"train_loss": -28.09504508972168, "global_step": 605600, "epoch": 7296} {"train_loss": -28.10416603088379, "global_step": 605601, "epoch": 7296} {"train_loss": -28.128238677978516, "global_step": 605602, "epoch": 7296} {"train_loss": -28.50445556640625, "global_step": 605603, "epoch": 7296} {"train_loss": -28.293821334838867, "global_step": 605604, "epoch": 7296} {"train_loss": -28.05020523071289, "global_step": 605605, "epoch": 7296} {"train_loss": -28.27338981628418, "global_step": 605606, "epoch": 7296} {"train_loss": -28.632190704345703, "global_step": 605607, "epoch": 7296} {"train_loss": -28.48345375061035, "global_step": 605608, "epoch": 7296} {"train_loss": -28.078962326049805, "global_step": 605609, "epoch": 7296} {"train_loss": -28.3287410736084, "global_step": 605610, "epoch": 7296} {"train_loss": -28.336780548095703, "global_step": 605611, "epoch": 7296} {"train_loss": -28.090734481811523, "global_step": 605612, "epoch": 7296} {"train_loss": -28.209348678588867, "global_step": 605613, "epoch": 7296} {"train_loss": -28.006689071655273, "global_step": 605614, "epoch": 7296} {"train_loss": -28.183584213256836, "global_step": 605615, "epoch": 7296} {"train_loss": -28.43220329284668, "global_step": 605616, "epoch": 7296} {"train_loss": -27.89505386352539, "global_step": 605617, "epoch": 7296} {"train_loss": -27.997278213500977, "global_step": 605618, "epoch": 7296} {"train_loss": -28.2038516998291, "global_step": 605619, "epoch": 7296} {"train_loss": -28.132715225219727, "global_step": 605620, "epoch": 7296} {"train_loss": -27.823041915893555, "global_step": 605621, "epoch": 7296} {"train_loss": -27.66156578063965, "global_step": 605622, "epoch": 7296} {"train_loss": -27.28314781188965, "global_step": 605623, "epoch": 7296} {"train_loss": -27.448110580444336, "global_step": 605624, "epoch": 7296} {"train_loss": -28.07402992248535, "global_step": 605625, "epoch": 7296} {"train_loss": -28.428503036499023, "global_step": 605626, "epoch": 7296} {"train_loss": -27.75233268737793, "global_step": 605627, "epoch": 7296} {"train_loss": -28.215879440307617, "global_step": 605628, "epoch": 7296} {"train_loss": -28.13883399963379, "global_step": 605629, "epoch": 7296} {"train_loss": -28.2233829498291, "global_step": 605630, "epoch": 7296} {"train_loss": -28.06235694885254, "global_step": 605631, "epoch": 7296} {"train_loss": -28.131519317626953, "global_step": 605632, "epoch": 7296} {"train_loss": -28.1751766204834, "global_step": 605633, "epoch": 7296} {"train_loss": -28.157739639282227, "global_step": 605634, "epoch": 7296} {"train_loss": -27.91086769104004, "global_step": 605635, "epoch": 7296} {"train_loss": -28.030349731445312, "global_step": 605636, "epoch": 7296} {"train_loss": -27.75238037109375, "global_step": 605637, "epoch": 7296} {"train_loss": -28.2783260345459, "global_step": 605638, "epoch": 7296} {"train_loss": -28.067899703979492, "global_step": 605639, "epoch": 7296} {"train_loss": -27.767465591430664, "global_step": 605640, "epoch": 7296} {"train_loss": -28.248701095581055, "global_step": 605641, "epoch": 7296} {"train_loss": -27.76704978942871, "global_step": 605642, "epoch": 7296} {"train_loss": -28.010053634643555, "global_step": 605643, "epoch": 7296} {"train_loss": -27.8756160736084, "global_step": 605644, "epoch": 7296} {"train_loss": -27.927738189697266, "global_step": 605645, "epoch": 7296} {"train_loss": -28.253965377807617, "global_step": 605646, "epoch": 7296} {"train_loss": -28.560028076171875, "global_step": 605647, "epoch": 7296} {"train_loss": -27.99723243713379, "global_step": 605648, "epoch": 7296} {"train_loss": -27.91584587097168, "global_step": 605649, "epoch": 7296} {"train_loss": -27.956170760005353, "global_step": 605650, "epoch": 7296, "val_loss": 6786984.0} {"train_loss": -26.19587516784668, "global_step": 605651, "epoch": 7297} {"train_loss": -25.945627212524414, "global_step": 605652, "epoch": 7297} {"train_loss": -26.677936553955078, "global_step": 605653, "epoch": 7297} {"train_loss": -27.2016658782959, "global_step": 605654, "epoch": 7297} {"train_loss": -27.398645401000977, "global_step": 605655, "epoch": 7297} {"train_loss": -26.98310661315918, "global_step": 605656, "epoch": 7297} {"train_loss": -27.246667861938477, "global_step": 605657, "epoch": 7297} {"train_loss": -27.621063232421875, "global_step": 605658, "epoch": 7297} {"train_loss": -27.664382934570312, "global_step": 605659, "epoch": 7297} {"train_loss": -27.329620361328125, "global_step": 605660, "epoch": 7297} {"train_loss": -27.01946449279785, "global_step": 605661, "epoch": 7297} {"train_loss": -27.676406860351562, "global_step": 605662, "epoch": 7297} {"train_loss": -26.967016220092773, "global_step": 605663, "epoch": 7297} {"train_loss": -27.445743560791016, "global_step": 605664, "epoch": 7297} {"train_loss": -27.442052841186523, "global_step": 605665, "epoch": 7297} {"train_loss": -27.3630313873291, "global_step": 605666, "epoch": 7297} {"train_loss": -27.5346736907959, "global_step": 605667, "epoch": 7297} {"train_loss": -27.660633087158203, "global_step": 605668, "epoch": 7297} {"train_loss": -27.737958908081055, "global_step": 605669, "epoch": 7297} {"train_loss": -27.8491268157959, "global_step": 605670, "epoch": 7297} {"train_loss": -27.72002601623535, "global_step": 605671, "epoch": 7297} {"train_loss": -27.934152603149414, "global_step": 605672, "epoch": 7297} {"train_loss": -27.94646644592285, "global_step": 605673, "epoch": 7297} {"train_loss": -27.882495880126953, "global_step": 605674, "epoch": 7297} {"train_loss": -27.628034591674805, "global_step": 605675, "epoch": 7297} {"train_loss": -27.932174682617188, "global_step": 605676, "epoch": 7297} {"train_loss": -28.25200843811035, "global_step": 605677, "epoch": 7297} {"train_loss": -27.732397079467773, "global_step": 605678, "epoch": 7297} {"train_loss": -28.00406265258789, "global_step": 605679, "epoch": 7297} {"train_loss": -27.925586700439453, "global_step": 605680, "epoch": 7297} {"train_loss": -27.78199577331543, "global_step": 605681, "epoch": 7297} {"train_loss": -28.058780670166016, "global_step": 605682, "epoch": 7297} {"train_loss": -27.749439239501953, "global_step": 605683, "epoch": 7297} {"train_loss": -28.19125747680664, "global_step": 605684, "epoch": 7297} {"train_loss": -28.5396785736084, "global_step": 605685, "epoch": 7297} {"train_loss": -27.9697208404541, "global_step": 605686, "epoch": 7297} {"train_loss": -27.881881713867188, "global_step": 605687, "epoch": 7297} {"train_loss": -28.159793853759766, "global_step": 605688, "epoch": 7297} {"train_loss": -28.127355575561523, "global_step": 605689, "epoch": 7297} {"train_loss": -27.969945907592773, "global_step": 605690, "epoch": 7297} {"train_loss": -27.947736740112305, "global_step": 605691, "epoch": 7297} {"train_loss": -28.45419692993164, "global_step": 605692, "epoch": 7297} {"train_loss": -27.881818771362305, "global_step": 605693, "epoch": 7297} {"train_loss": -28.082544326782227, "global_step": 605694, "epoch": 7297} {"train_loss": -28.122900009155273, "global_step": 605695, "epoch": 7297} {"train_loss": -28.273962020874023, "global_step": 605696, "epoch": 7297} {"train_loss": -28.247770309448242, "global_step": 605697, "epoch": 7297} {"train_loss": -28.474639892578125, "global_step": 605698, "epoch": 7297} {"train_loss": -28.290374755859375, "global_step": 605699, "epoch": 7297} {"train_loss": -28.297338485717773, "global_step": 605700, "epoch": 7297} {"train_loss": -28.192502975463867, "global_step": 605701, "epoch": 7297} {"train_loss": -28.373456954956055, "global_step": 605702, "epoch": 7297} {"train_loss": -27.944110870361328, "global_step": 605703, "epoch": 7297} {"train_loss": -28.006933212280273, "global_step": 605704, "epoch": 7297} {"train_loss": -28.28931999206543, "global_step": 605705, "epoch": 7297} {"train_loss": -28.305383682250977, "global_step": 605706, "epoch": 7297} {"train_loss": -28.005908966064453, "global_step": 605707, "epoch": 7297} {"train_loss": -28.128087997436523, "global_step": 605708, "epoch": 7297} {"train_loss": -27.947858810424805, "global_step": 605709, "epoch": 7297} {"train_loss": -27.762649536132812, "global_step": 605710, "epoch": 7297} {"train_loss": -28.036672592163086, "global_step": 605711, "epoch": 7297} {"train_loss": -28.372085571289062, "global_step": 605712, "epoch": 7297} {"train_loss": -28.24899673461914, "global_step": 605713, "epoch": 7297} {"train_loss": -27.969480514526367, "global_step": 605714, "epoch": 7297} {"train_loss": -28.388507843017578, "global_step": 605715, "epoch": 7297} {"train_loss": -28.37137222290039, "global_step": 605716, "epoch": 7297} {"train_loss": -28.25690269470215, "global_step": 605717, "epoch": 7297} {"train_loss": -28.123926162719727, "global_step": 605718, "epoch": 7297} {"train_loss": -28.23206901550293, "global_step": 605719, "epoch": 7297} {"train_loss": -28.014806747436523, "global_step": 605720, "epoch": 7297} {"train_loss": -28.058704376220703, "global_step": 605721, "epoch": 7297} {"train_loss": -28.091724395751953, "global_step": 605722, "epoch": 7297} {"train_loss": -28.1254825592041, "global_step": 605723, "epoch": 7297} {"train_loss": -27.991498947143555, "global_step": 605724, "epoch": 7297} {"train_loss": -28.184934616088867, "global_step": 605725, "epoch": 7297} {"train_loss": -28.265548706054688, "global_step": 605726, "epoch": 7297} {"train_loss": -28.125913619995117, "global_step": 605727, "epoch": 7297} {"train_loss": -27.90375328063965, "global_step": 605728, "epoch": 7297} {"train_loss": -27.49472999572754, "global_step": 605729, "epoch": 7297} {"train_loss": -28.039749145507812, "global_step": 605730, "epoch": 7297} {"train_loss": -27.834680557250977, "global_step": 605731, "epoch": 7297} {"train_loss": -28.389753341674805, "global_step": 605732, "epoch": 7297} {"train_loss": -27.887435200702715, "global_step": 605733, "epoch": 7297, "val_loss": 6826517.5} {"train_loss": -27.766620635986328, "global_step": 605734, "epoch": 7298} {"train_loss": -27.84724235534668, "global_step": 605735, "epoch": 7298} {"train_loss": -27.39900779724121, "global_step": 605736, "epoch": 7298} {"train_loss": -26.49246597290039, "global_step": 605737, "epoch": 7298} {"train_loss": -27.33026123046875, "global_step": 605738, "epoch": 7298} {"train_loss": -27.46736717224121, "global_step": 605739, "epoch": 7298} {"train_loss": -27.25748634338379, "global_step": 605740, "epoch": 7298} {"train_loss": -27.00323486328125, "global_step": 605741, "epoch": 7298} {"train_loss": -27.657094955444336, "global_step": 605742, "epoch": 7298} {"train_loss": -27.49116325378418, "global_step": 605743, "epoch": 7298} {"train_loss": -27.309900283813477, "global_step": 605744, "epoch": 7298} {"train_loss": -27.765949249267578, "global_step": 605745, "epoch": 7298} {"train_loss": -27.434879302978516, "global_step": 605746, "epoch": 7298} {"train_loss": -28.25959587097168, "global_step": 605747, "epoch": 7298} {"train_loss": -27.797748565673828, "global_step": 605748, "epoch": 7298} {"train_loss": -27.773523330688477, "global_step": 605749, "epoch": 7298} {"train_loss": -27.87860679626465, "global_step": 605750, "epoch": 7298} {"train_loss": -27.707029342651367, "global_step": 605751, "epoch": 7298} {"train_loss": -27.849750518798828, "global_step": 605752, "epoch": 7298} {"train_loss": -27.67535400390625, "global_step": 605753, "epoch": 7298} {"train_loss": -27.925769805908203, "global_step": 605754, "epoch": 7298} {"train_loss": -27.952112197875977, "global_step": 605755, "epoch": 7298} {"train_loss": -28.139509201049805, "global_step": 605756, "epoch": 7298} {"train_loss": -27.876373291015625, "global_step": 605757, "epoch": 7298} {"train_loss": -27.702245712280273, "global_step": 605758, "epoch": 7298} {"train_loss": -28.005762100219727, "global_step": 605759, "epoch": 7298} {"train_loss": -28.10780906677246, "global_step": 605760, "epoch": 7298} {"train_loss": -27.82758903503418, "global_step": 605761, "epoch": 7298} {"train_loss": -27.65229606628418, "global_step": 605762, "epoch": 7298} {"train_loss": -27.984405517578125, "global_step": 605763, "epoch": 7298} {"train_loss": -27.97369956970215, "global_step": 605764, "epoch": 7298} {"train_loss": -28.167388916015625, "global_step": 605765, "epoch": 7298} {"train_loss": -27.987258911132812, "global_step": 605766, "epoch": 7298} {"train_loss": -27.97527503967285, "global_step": 605767, "epoch": 7298} {"train_loss": -28.414600372314453, "global_step": 605768, "epoch": 7298} {"train_loss": -28.13254165649414, "global_step": 605769, "epoch": 7298} {"train_loss": -28.460229873657227, "global_step": 605770, "epoch": 7298} {"train_loss": -28.2695255279541, "global_step": 605771, "epoch": 7298} {"train_loss": -28.302967071533203, "global_step": 605772, "epoch": 7298} {"train_loss": -28.449674606323242, "global_step": 605773, "epoch": 7298} {"train_loss": -28.155609130859375, "global_step": 605774, "epoch": 7298} {"train_loss": -28.1796875, "global_step": 605775, "epoch": 7298} {"train_loss": -28.13150405883789, "global_step": 605776, "epoch": 7298} {"train_loss": -28.239898681640625, "global_step": 605777, "epoch": 7298} {"train_loss": -28.283981323242188, "global_step": 605778, "epoch": 7298} {"train_loss": -28.1369571685791, "global_step": 605779, "epoch": 7298} {"train_loss": -28.295515060424805, "global_step": 605780, "epoch": 7298} {"train_loss": -28.219192504882812, "global_step": 605781, "epoch": 7298} {"train_loss": -28.582868576049805, "global_step": 605782, "epoch": 7298} {"train_loss": -28.211048126220703, "global_step": 605783, "epoch": 7298} {"train_loss": -28.106000900268555, "global_step": 605784, "epoch": 7298} {"train_loss": -28.1820125579834, "global_step": 605785, "epoch": 7298} {"train_loss": -28.466562271118164, "global_step": 605786, "epoch": 7298} {"train_loss": -28.177038192749023, "global_step": 605787, "epoch": 7298} {"train_loss": -28.355085372924805, "global_step": 605788, "epoch": 7298} {"train_loss": -28.29648208618164, "global_step": 605789, "epoch": 7298} {"train_loss": -27.939075469970703, "global_step": 605790, "epoch": 7298} {"train_loss": -27.647119522094727, "global_step": 605791, "epoch": 7298} {"train_loss": -27.864730834960938, "global_step": 605792, "epoch": 7298} {"train_loss": -28.05195426940918, "global_step": 605793, "epoch": 7298} {"train_loss": -28.353418350219727, "global_step": 605794, "epoch": 7298} {"train_loss": -27.661802291870117, "global_step": 605795, "epoch": 7298} {"train_loss": -27.7119197845459, "global_step": 605796, "epoch": 7298} {"train_loss": -27.547992706298828, "global_step": 605797, "epoch": 7298} {"train_loss": -27.8373966217041, "global_step": 605798, "epoch": 7298} {"train_loss": -27.9222412109375, "global_step": 605799, "epoch": 7298} {"train_loss": -28.020282745361328, "global_step": 605800, "epoch": 7298} {"train_loss": -28.1645565032959, "global_step": 605801, "epoch": 7298} {"train_loss": -27.353742599487305, "global_step": 605802, "epoch": 7298} {"train_loss": -28.375089645385742, "global_step": 605803, "epoch": 7298} {"train_loss": -28.21442222595215, "global_step": 605804, "epoch": 7298} {"train_loss": -27.49603843688965, "global_step": 605805, "epoch": 7298} {"train_loss": -27.699237823486328, "global_step": 605806, "epoch": 7298} {"train_loss": -28.54108238220215, "global_step": 605807, "epoch": 7298} {"train_loss": -27.611480712890625, "global_step": 605808, "epoch": 7298} {"train_loss": -27.351709365844727, "global_step": 605809, "epoch": 7298} {"train_loss": -28.24359130859375, "global_step": 605810, "epoch": 7298} {"train_loss": -27.9019832611084, "global_step": 605811, "epoch": 7298} {"train_loss": -27.99808120727539, "global_step": 605812, "epoch": 7298} {"train_loss": -27.830142974853516, "global_step": 605813, "epoch": 7298} {"train_loss": -27.846708297729492, "global_step": 605814, "epoch": 7298} {"train_loss": -28.13099479675293, "global_step": 605815, "epoch": 7298} {"train_loss": -27.917158724313758, "global_step": 605816, "epoch": 7298, "val_loss": 6787462.0} {"train_loss": -26.808216094970703, "global_step": 605817, "epoch": 7299} {"train_loss": -27.167341232299805, "global_step": 605818, "epoch": 7299} {"train_loss": -27.36178970336914, "global_step": 605819, "epoch": 7299} {"train_loss": -26.72002601623535, "global_step": 605820, "epoch": 7299} {"train_loss": -27.456018447875977, "global_step": 605821, "epoch": 7299} {"train_loss": -26.917478561401367, "global_step": 605822, "epoch": 7299} {"train_loss": -27.41696548461914, "global_step": 605823, "epoch": 7299} {"train_loss": -27.312671661376953, "global_step": 605824, "epoch": 7299} {"train_loss": -27.018878936767578, "global_step": 605825, "epoch": 7299} {"train_loss": -27.694921493530273, "global_step": 605826, "epoch": 7299} {"train_loss": -27.32282066345215, "global_step": 605827, "epoch": 7299} {"train_loss": -27.6014461517334, "global_step": 605828, "epoch": 7299} {"train_loss": -27.43414878845215, "global_step": 605829, "epoch": 7299} {"train_loss": -27.58096694946289, "global_step": 605830, "epoch": 7299} {"train_loss": -27.23418617248535, "global_step": 605831, "epoch": 7299} {"train_loss": -27.318744659423828, "global_step": 605832, "epoch": 7299} {"train_loss": -27.931182861328125, "global_step": 605833, "epoch": 7299} {"train_loss": -27.509740829467773, "global_step": 605834, "epoch": 7299} {"train_loss": -27.59162712097168, "global_step": 605835, "epoch": 7299} {"train_loss": -27.4301700592041, "global_step": 605836, "epoch": 7299} {"train_loss": -27.459503173828125, "global_step": 605837, "epoch": 7299} {"train_loss": -27.36102294921875, "global_step": 605838, "epoch": 7299} {"train_loss": -27.901657104492188, "global_step": 605839, "epoch": 7299} {"train_loss": -27.747360229492188, "global_step": 605840, "epoch": 7299} {"train_loss": -27.6922550201416, "global_step": 605841, "epoch": 7299} {"train_loss": -28.282562255859375, "global_step": 605842, "epoch": 7299} {"train_loss": -27.99724769592285, "global_step": 605843, "epoch": 7299} {"train_loss": -27.747039794921875, "global_step": 605844, "epoch": 7299} {"train_loss": -27.692594528198242, "global_step": 605845, "epoch": 7299} {"train_loss": -27.587339401245117, "global_step": 605846, "epoch": 7299} {"train_loss": -28.12904930114746, "global_step": 605847, "epoch": 7299} {"train_loss": -27.892837524414062, "global_step": 605848, "epoch": 7299} {"train_loss": -28.09423828125, "global_step": 605849, "epoch": 7299} {"train_loss": -27.924823760986328, "global_step": 605850, "epoch": 7299} {"train_loss": -28.180240631103516, "global_step": 605851, "epoch": 7299} {"train_loss": -27.807300567626953, "global_step": 605852, "epoch": 7299} {"train_loss": -28.078744888305664, "global_step": 605853, "epoch": 7299} {"train_loss": -28.828168869018555, "global_step": 605854, "epoch": 7299} {"train_loss": -27.958148956298828, "global_step": 605855, "epoch": 7299} {"train_loss": -28.3317928314209, "global_step": 605856, "epoch": 7299} {"train_loss": -27.797698974609375, "global_step": 605857, "epoch": 7299} {"train_loss": -28.0756778717041, "global_step": 605858, "epoch": 7299} {"train_loss": -28.183551788330078, "global_step": 605859, "epoch": 7299} {"train_loss": -27.992008209228516, "global_step": 605860, "epoch": 7299} {"train_loss": -28.403671264648438, "global_step": 605861, "epoch": 7299} {"train_loss": -27.811649322509766, "global_step": 605862, "epoch": 7299} {"train_loss": -28.097700119018555, "global_step": 605863, "epoch": 7299} {"train_loss": -28.10576820373535, "global_step": 605864, "epoch": 7299} {"train_loss": -28.0576229095459, "global_step": 605865, "epoch": 7299} {"train_loss": -28.095834732055664, "global_step": 605866, "epoch": 7299} {"train_loss": -28.296873092651367, "global_step": 605867, "epoch": 7299} {"train_loss": -28.086835861206055, "global_step": 605868, "epoch": 7299} {"train_loss": -28.22625732421875, "global_step": 605869, "epoch": 7299} {"train_loss": -28.10926628112793, "global_step": 605870, "epoch": 7299} {"train_loss": -27.85298728942871, "global_step": 605871, "epoch": 7299} {"train_loss": -28.017230987548828, "global_step": 605872, "epoch": 7299} {"train_loss": -28.104955673217773, "global_step": 605873, "epoch": 7299} {"train_loss": -27.863754272460938, "global_step": 605874, "epoch": 7299} {"train_loss": -28.060256958007812, "global_step": 605875, "epoch": 7299} {"train_loss": -28.450414657592773, "global_step": 605876, "epoch": 7299} {"train_loss": -27.963855743408203, "global_step": 605877, "epoch": 7299} {"train_loss": -28.34807777404785, "global_step": 605878, "epoch": 7299} {"train_loss": -28.663883209228516, "global_step": 605879, "epoch": 7299} {"train_loss": -28.169055938720703, "global_step": 605880, "epoch": 7299} {"train_loss": -28.167638778686523, "global_step": 605881, "epoch": 7299} {"train_loss": -28.33469581604004, "global_step": 605882, "epoch": 7299} {"train_loss": -28.200735092163086, "global_step": 605883, "epoch": 7299} {"train_loss": -28.334142684936523, "global_step": 605884, "epoch": 7299} {"train_loss": -27.862791061401367, "global_step": 605885, "epoch": 7299} {"train_loss": -28.366809844970703, "global_step": 605886, "epoch": 7299} {"train_loss": -27.828092575073242, "global_step": 605887, "epoch": 7299} {"train_loss": -28.374250411987305, "global_step": 605888, "epoch": 7299} {"train_loss": -28.001989364624023, "global_step": 605889, "epoch": 7299} {"train_loss": -27.958036422729492, "global_step": 605890, "epoch": 7299} {"train_loss": -27.789169311523438, "global_step": 605891, "epoch": 7299} {"train_loss": -28.104597091674805, "global_step": 605892, "epoch": 7299} {"train_loss": -27.497055053710938, "global_step": 605893, "epoch": 7299} {"train_loss": -27.612878799438477, "global_step": 605894, "epoch": 7299} {"train_loss": -27.97821044921875, "global_step": 605895, "epoch": 7299} {"train_loss": -27.6481876373291, "global_step": 605896, "epoch": 7299} {"train_loss": -27.836957931518555, "global_step": 605897, "epoch": 7299} {"train_loss": -27.490753173828125, "global_step": 605898, "epoch": 7299} {"train_loss": -27.85469815817224, "global_step": 605899, "epoch": 7299, "val_loss": 6857122.0} {"train_loss": -27.49360466003418, "global_step": 605900, "epoch": 7300} {"train_loss": -27.700098037719727, "global_step": 605901, "epoch": 7300} {"train_loss": -27.48980712890625, "global_step": 605902, "epoch": 7300} {"train_loss": -27.0135555267334, "global_step": 605903, "epoch": 7300} {"train_loss": -27.064512252807617, "global_step": 605904, "epoch": 7300} {"train_loss": -27.361066818237305, "global_step": 605905, "epoch": 7300} {"train_loss": -27.179615020751953, "global_step": 605906, "epoch": 7300} {"train_loss": -27.701719284057617, "global_step": 605907, "epoch": 7300} {"train_loss": -27.545499801635742, "global_step": 605908, "epoch": 7300} {"train_loss": -27.27460289001465, "global_step": 605909, "epoch": 7300} {"train_loss": -27.0593204498291, "global_step": 605910, "epoch": 7300} {"train_loss": -27.215320587158203, "global_step": 605911, "epoch": 7300} {"train_loss": -27.254108428955078, "global_step": 605912, "epoch": 7300} {"train_loss": -27.498199462890625, "global_step": 605913, "epoch": 7300} {"train_loss": -27.66365623474121, "global_step": 605914, "epoch": 7300} {"train_loss": -27.37325096130371, "global_step": 605915, "epoch": 7300} {"train_loss": -27.202091217041016, "global_step": 605916, "epoch": 7300} {"train_loss": -27.8128719329834, "global_step": 605917, "epoch": 7300} {"train_loss": -27.688024520874023, "global_step": 605918, "epoch": 7300} {"train_loss": -27.447452545166016, "global_step": 605919, "epoch": 7300} {"train_loss": -28.03693962097168, "global_step": 605920, "epoch": 7300} {"train_loss": -27.7236328125, "global_step": 605921, "epoch": 7300} {"train_loss": -27.8604679107666, "global_step": 605922, "epoch": 7300} {"train_loss": -27.945392608642578, "global_step": 605923, "epoch": 7300} {"train_loss": -27.925390243530273, "global_step": 605924, "epoch": 7300} {"train_loss": -27.700037002563477, "global_step": 605925, "epoch": 7300} {"train_loss": -27.9371395111084, "global_step": 605926, "epoch": 7300} {"train_loss": -27.964252471923828, "global_step": 605927, "epoch": 7300} {"train_loss": -28.01197624206543, "global_step": 605928, "epoch": 7300} {"train_loss": -27.750385284423828, "global_step": 605929, "epoch": 7300} {"train_loss": -28.06743812561035, "global_step": 605930, "epoch": 7300} {"train_loss": -28.1285400390625, "global_step": 605931, "epoch": 7300} {"train_loss": -28.037256240844727, "global_step": 605932, "epoch": 7300} {"train_loss": -28.196395874023438, "global_step": 605933, "epoch": 7300} {"train_loss": -27.82108497619629, "global_step": 605934, "epoch": 7300} {"train_loss": -28.359670639038086, "global_step": 605935, "epoch": 7300} {"train_loss": -28.025466918945312, "global_step": 605936, "epoch": 7300} {"train_loss": -28.126989364624023, "global_step": 605937, "epoch": 7300} {"train_loss": -27.935592651367188, "global_step": 605938, "epoch": 7300} {"train_loss": -28.004117965698242, "global_step": 605939, "epoch": 7300} {"train_loss": -28.4505615234375, "global_step": 605940, "epoch": 7300} {"train_loss": -28.155914306640625, "global_step": 605941, "epoch": 7300} {"train_loss": -27.8284912109375, "global_step": 605942, "epoch": 7300} {"train_loss": -27.622556686401367, "global_step": 605943, "epoch": 7300} {"train_loss": -27.835285186767578, "global_step": 605944, "epoch": 7300} {"train_loss": -28.181753158569336, "global_step": 605945, "epoch": 7300} {"train_loss": -27.866052627563477, "global_step": 605946, "epoch": 7300} {"train_loss": -28.22552490234375, "global_step": 605947, "epoch": 7300} {"train_loss": -28.025604248046875, "global_step": 605948, "epoch": 7300} {"train_loss": -28.383167266845703, "global_step": 605949, "epoch": 7300} {"train_loss": -27.972448348999023, "global_step": 605950, "epoch": 7300} {"train_loss": -27.68267250061035, "global_step": 605951, "epoch": 7300} {"train_loss": -28.011388778686523, "global_step": 605952, "epoch": 7300} {"train_loss": -27.8171329498291, "global_step": 605953, "epoch": 7300} {"train_loss": -27.94923973083496, "global_step": 605954, "epoch": 7300} {"train_loss": -28.324371337890625, "global_step": 605955, "epoch": 7300} {"train_loss": -28.345483779907227, "global_step": 605956, "epoch": 7300} {"train_loss": -28.21564292907715, "global_step": 605957, "epoch": 7300} {"train_loss": -28.42181396484375, "global_step": 605958, "epoch": 7300} {"train_loss": -28.216455459594727, "global_step": 605959, "epoch": 7300} {"train_loss": -27.9746036529541, "global_step": 605960, "epoch": 7300} {"train_loss": -27.9667911529541, "global_step": 605961, "epoch": 7300} {"train_loss": -28.19837760925293, "global_step": 605962, "epoch": 7300} {"train_loss": -28.21453857421875, "global_step": 605963, "epoch": 7300} {"train_loss": -28.07586097717285, "global_step": 605964, "epoch": 7300} {"train_loss": -28.381982803344727, "global_step": 605965, "epoch": 7300} {"train_loss": -28.413379669189453, "global_step": 605966, "epoch": 7300} {"train_loss": -28.11602210998535, "global_step": 605967, "epoch": 7300} {"train_loss": -28.041278839111328, "global_step": 605968, "epoch": 7300} {"train_loss": -28.767414093017578, "global_step": 605969, "epoch": 7300} {"train_loss": -28.432477951049805, "global_step": 605970, "epoch": 7300} {"train_loss": -27.979156494140625, "global_step": 605971, "epoch": 7300} {"train_loss": -28.190139770507812, "global_step": 605972, "epoch": 7300} {"train_loss": -28.157873153686523, "global_step": 605973, "epoch": 7300} {"train_loss": -28.209104537963867, "global_step": 605974, "epoch": 7300} {"train_loss": -28.143957138061523, "global_step": 605975, "epoch": 7300} {"train_loss": -27.64667320251465, "global_step": 605976, "epoch": 7300} {"train_loss": -27.584720611572266, "global_step": 605977, "epoch": 7300} {"train_loss": -27.322235107421875, "global_step": 605978, "epoch": 7300} {"train_loss": -27.20820426940918, "global_step": 605979, "epoch": 7300} {"train_loss": -27.916784286499023, "global_step": 605980, "epoch": 7300} {"train_loss": -27.846099853515625, "global_step": 605981, "epoch": 7300} {"train_loss": -27.89023020181311, "global_step": 605982, "epoch": 7300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6769957.0} {"train_loss": -27.624618530273438, "global_step": 605983, "epoch": 7301} {"train_loss": -27.375898361206055, "global_step": 605984, "epoch": 7301} {"train_loss": -27.027990341186523, "global_step": 605985, "epoch": 7301} {"train_loss": -27.487354278564453, "global_step": 605986, "epoch": 7301} {"train_loss": -27.650836944580078, "global_step": 605987, "epoch": 7301} {"train_loss": -27.534133911132812, "global_step": 605988, "epoch": 7301} {"train_loss": -27.800174713134766, "global_step": 605989, "epoch": 7301} {"train_loss": -27.85927391052246, "global_step": 605990, "epoch": 7301} {"train_loss": -27.274511337280273, "global_step": 605991, "epoch": 7301} {"train_loss": -28.1953067779541, "global_step": 605992, "epoch": 7301} {"train_loss": -27.669086456298828, "global_step": 605993, "epoch": 7301} {"train_loss": -27.932098388671875, "global_step": 605994, "epoch": 7301} {"train_loss": -27.937463760375977, "global_step": 605995, "epoch": 7301} {"train_loss": -27.278888702392578, "global_step": 605996, "epoch": 7301} {"train_loss": -27.8794002532959, "global_step": 605997, "epoch": 7301} {"train_loss": -27.713003158569336, "global_step": 605998, "epoch": 7301} {"train_loss": -28.01165199279785, "global_step": 605999, "epoch": 7301} {"train_loss": -27.987674713134766, "global_step": 606000, "epoch": 7301} {"train_loss": -27.87275505065918, "global_step": 606001, "epoch": 7301} {"train_loss": -27.885343551635742, "global_step": 606002, "epoch": 7301} {"train_loss": -28.014638900756836, "global_step": 606003, "epoch": 7301} {"train_loss": -27.945920944213867, "global_step": 606004, "epoch": 7301} {"train_loss": -28.02239990234375, "global_step": 606005, "epoch": 7301} {"train_loss": -27.922407150268555, "global_step": 606006, "epoch": 7301} {"train_loss": -28.043750762939453, "global_step": 606007, "epoch": 7301} {"train_loss": -27.9664363861084, "global_step": 606008, "epoch": 7301} {"train_loss": -28.0526180267334, "global_step": 606009, "epoch": 7301} {"train_loss": -27.78791618347168, "global_step": 606010, "epoch": 7301} {"train_loss": -27.8172550201416, "global_step": 606011, "epoch": 7301} {"train_loss": -27.891128540039062, "global_step": 606012, "epoch": 7301} {"train_loss": -27.953662872314453, "global_step": 606013, "epoch": 7301} {"train_loss": -28.189712524414062, "global_step": 606014, "epoch": 7301} {"train_loss": -28.221540451049805, "global_step": 606015, "epoch": 7301} {"train_loss": -28.025548934936523, "global_step": 606016, "epoch": 7301} {"train_loss": -28.088354110717773, "global_step": 606017, "epoch": 7301} {"train_loss": -28.484045028686523, "global_step": 606018, "epoch": 7301} {"train_loss": -28.169464111328125, "global_step": 606019, "epoch": 7301} {"train_loss": -28.0445556640625, "global_step": 606020, "epoch": 7301} {"train_loss": -28.074203491210938, "global_step": 606021, "epoch": 7301} {"train_loss": -28.05398941040039, "global_step": 606022, "epoch": 7301} {"train_loss": -28.177875518798828, "global_step": 606023, "epoch": 7301} {"train_loss": -28.233795166015625, "global_step": 606024, "epoch": 7301} {"train_loss": -28.545019149780273, "global_step": 606025, "epoch": 7301} {"train_loss": -27.997480392456055, "global_step": 606026, "epoch": 7301} {"train_loss": -28.00819969177246, "global_step": 606027, "epoch": 7301} {"train_loss": -27.795385360717773, "global_step": 606028, "epoch": 7301} {"train_loss": -28.348407745361328, "global_step": 606029, "epoch": 7301} {"train_loss": -28.410770416259766, "global_step": 606030, "epoch": 7301} {"train_loss": -27.8215274810791, "global_step": 606031, "epoch": 7301} {"train_loss": -27.951765060424805, "global_step": 606032, "epoch": 7301} {"train_loss": -28.399351119995117, "global_step": 606033, "epoch": 7301} {"train_loss": -28.4719295501709, "global_step": 606034, "epoch": 7301} {"train_loss": -28.258344650268555, "global_step": 606035, "epoch": 7301} {"train_loss": -27.95077896118164, "global_step": 606036, "epoch": 7301} {"train_loss": -28.208423614501953, "global_step": 606037, "epoch": 7301} {"train_loss": -28.02752113342285, "global_step": 606038, "epoch": 7301} {"train_loss": -27.786975860595703, "global_step": 606039, "epoch": 7301} {"train_loss": -27.94434928894043, "global_step": 606040, "epoch": 7301} {"train_loss": -28.152240753173828, "global_step": 606041, "epoch": 7301} {"train_loss": -28.276758193969727, "global_step": 606042, "epoch": 7301} {"train_loss": -27.90175437927246, "global_step": 606043, "epoch": 7301} {"train_loss": -27.851232528686523, "global_step": 606044, "epoch": 7301} {"train_loss": -28.025333404541016, "global_step": 606045, "epoch": 7301} {"train_loss": -28.091772079467773, "global_step": 606046, "epoch": 7301} {"train_loss": -27.9375057220459, "global_step": 606047, "epoch": 7301} {"train_loss": -28.289276123046875, "global_step": 606048, "epoch": 7301} {"train_loss": -27.9521427154541, "global_step": 606049, "epoch": 7301} {"train_loss": -27.967361450195312, "global_step": 606050, "epoch": 7301} {"train_loss": -27.794235229492188, "global_step": 606051, "epoch": 7301} {"train_loss": -28.046472549438477, "global_step": 606052, "epoch": 7301} {"train_loss": -28.156442642211914, "global_step": 606053, "epoch": 7301} {"train_loss": -27.876127243041992, "global_step": 606054, "epoch": 7301} {"train_loss": -28.422338485717773, "global_step": 606055, "epoch": 7301} {"train_loss": -28.03584098815918, "global_step": 606056, "epoch": 7301} {"train_loss": -27.60797119140625, "global_step": 606057, "epoch": 7301} {"train_loss": -27.962249755859375, "global_step": 606058, "epoch": 7301} {"train_loss": -28.01763916015625, "global_step": 606059, "epoch": 7301} {"train_loss": -27.852514266967773, "global_step": 606060, "epoch": 7301} {"train_loss": -27.926233291625977, "global_step": 606061, "epoch": 7301} {"train_loss": -27.60981559753418, "global_step": 606062, "epoch": 7301} {"train_loss": -27.456838607788086, "global_step": 606063, "epoch": 7301} {"train_loss": -28.122516632080078, "global_step": 606064, "epoch": 7301} {"train_loss": -27.955845177891742, "global_step": 606065, "epoch": 7301, "val_loss": 6817356.5} {"train_loss": -26.618146896362305, "global_step": 606066, "epoch": 7302} {"train_loss": -27.29673194885254, "global_step": 606067, "epoch": 7302} {"train_loss": -26.97553825378418, "global_step": 606068, "epoch": 7302} {"train_loss": -27.14664649963379, "global_step": 606069, "epoch": 7302} {"train_loss": -26.826520919799805, "global_step": 606070, "epoch": 7302} {"train_loss": -27.2252254486084, "global_step": 606071, "epoch": 7302} {"train_loss": -26.834829330444336, "global_step": 606072, "epoch": 7302} {"train_loss": -27.16300392150879, "global_step": 606073, "epoch": 7302} {"train_loss": -27.41847038269043, "global_step": 606074, "epoch": 7302} {"train_loss": -27.425613403320312, "global_step": 606075, "epoch": 7302} {"train_loss": -27.618057250976562, "global_step": 606076, "epoch": 7302} {"train_loss": -27.198505401611328, "global_step": 606077, "epoch": 7302} {"train_loss": -27.526403427124023, "global_step": 606078, "epoch": 7302} {"train_loss": -27.494871139526367, "global_step": 606079, "epoch": 7302} {"train_loss": -27.58106803894043, "global_step": 606080, "epoch": 7302} {"train_loss": -27.383691787719727, "global_step": 606081, "epoch": 7302} {"train_loss": -27.507064819335938, "global_step": 606082, "epoch": 7302} {"train_loss": -27.791589736938477, "global_step": 606083, "epoch": 7302} {"train_loss": -27.672895431518555, "global_step": 606084, "epoch": 7302} {"train_loss": -27.479761123657227, "global_step": 606085, "epoch": 7302} {"train_loss": -27.529804229736328, "global_step": 606086, "epoch": 7302} {"train_loss": -27.739120483398438, "global_step": 606087, "epoch": 7302} {"train_loss": -27.945646286010742, "global_step": 606088, "epoch": 7302} {"train_loss": -27.859933853149414, "global_step": 606089, "epoch": 7302} {"train_loss": -27.82195472717285, "global_step": 606090, "epoch": 7302} {"train_loss": -28.150421142578125, "global_step": 606091, "epoch": 7302} {"train_loss": -27.990381240844727, "global_step": 606092, "epoch": 7302} {"train_loss": -27.473691940307617, "global_step": 606093, "epoch": 7302} {"train_loss": -28.201772689819336, "global_step": 606094, "epoch": 7302} {"train_loss": -27.915592193603516, "global_step": 606095, "epoch": 7302} {"train_loss": -27.971099853515625, "global_step": 606096, "epoch": 7302} {"train_loss": -27.937824249267578, "global_step": 606097, "epoch": 7302} {"train_loss": -28.117847442626953, "global_step": 606098, "epoch": 7302} {"train_loss": -27.83050537109375, "global_step": 606099, "epoch": 7302} {"train_loss": -28.341184616088867, "global_step": 606100, "epoch": 7302} {"train_loss": -28.05901527404785, "global_step": 606101, "epoch": 7302} {"train_loss": -28.184009552001953, "global_step": 606102, "epoch": 7302} {"train_loss": -27.98004150390625, "global_step": 606103, "epoch": 7302} {"train_loss": -28.1700439453125, "global_step": 606104, "epoch": 7302} {"train_loss": -28.312604904174805, "global_step": 606105, "epoch": 7302} {"train_loss": -28.217578887939453, "global_step": 606106, "epoch": 7302} {"train_loss": -28.488788604736328, "global_step": 606107, "epoch": 7302} {"train_loss": -28.511510848999023, "global_step": 606108, "epoch": 7302} {"train_loss": -27.937469482421875, "global_step": 606109, "epoch": 7302} {"train_loss": -28.21368408203125, "global_step": 606110, "epoch": 7302} {"train_loss": -28.266559600830078, "global_step": 606111, "epoch": 7302} {"train_loss": -28.25823402404785, "global_step": 606112, "epoch": 7302} {"train_loss": -28.69095230102539, "global_step": 606113, "epoch": 7302} {"train_loss": -28.243879318237305, "global_step": 606114, "epoch": 7302} {"train_loss": -28.529401779174805, "global_step": 606115, "epoch": 7302} {"train_loss": -28.129867553710938, "global_step": 606116, "epoch": 7302} {"train_loss": -27.9783992767334, "global_step": 606117, "epoch": 7302} {"train_loss": -28.43377113342285, "global_step": 606118, "epoch": 7302} {"train_loss": -28.274641036987305, "global_step": 606119, "epoch": 7302} {"train_loss": -28.0269718170166, "global_step": 606120, "epoch": 7302} {"train_loss": -27.7950439453125, "global_step": 606121, "epoch": 7302} {"train_loss": -28.146886825561523, "global_step": 606122, "epoch": 7302} {"train_loss": -28.24378776550293, "global_step": 606123, "epoch": 7302} {"train_loss": -27.880456924438477, "global_step": 606124, "epoch": 7302} {"train_loss": -28.021289825439453, "global_step": 606125, "epoch": 7302} {"train_loss": -27.715621948242188, "global_step": 606126, "epoch": 7302} {"train_loss": -27.847272872924805, "global_step": 606127, "epoch": 7302} {"train_loss": -27.688581466674805, "global_step": 606128, "epoch": 7302} {"train_loss": -28.12286949157715, "global_step": 606129, "epoch": 7302} {"train_loss": -28.19598960876465, "global_step": 606130, "epoch": 7302} {"train_loss": -27.497114181518555, "global_step": 606131, "epoch": 7302} {"train_loss": -28.066680908203125, "global_step": 606132, "epoch": 7302} {"train_loss": -27.79547691345215, "global_step": 606133, "epoch": 7302} {"train_loss": -27.48065185546875, "global_step": 606134, "epoch": 7302} {"train_loss": -27.475183486938477, "global_step": 606135, "epoch": 7302} {"train_loss": -27.837438583374023, "global_step": 606136, "epoch": 7302} {"train_loss": -28.0438289642334, "global_step": 606137, "epoch": 7302} {"train_loss": -28.244482040405273, "global_step": 606138, "epoch": 7302} {"train_loss": -28.11094093322754, "global_step": 606139, "epoch": 7302} {"train_loss": -28.44179344177246, "global_step": 606140, "epoch": 7302} {"train_loss": -28.01978874206543, "global_step": 606141, "epoch": 7302} {"train_loss": -28.446975708007812, "global_step": 606142, "epoch": 7302} {"train_loss": -28.288862228393555, "global_step": 606143, "epoch": 7302} {"train_loss": -28.385868072509766, "global_step": 606144, "epoch": 7302} {"train_loss": -27.995330810546875, "global_step": 606145, "epoch": 7302} {"train_loss": -28.002805709838867, "global_step": 606146, "epoch": 7302} {"train_loss": -28.122190475463867, "global_step": 606147, "epoch": 7302} {"train_loss": -27.889972962528827, "global_step": 606148, "epoch": 7302, "val_loss": 6717131.0} {"train_loss": -28.031951904296875, "global_step": 606149, "epoch": 7303} {"train_loss": -27.71270179748535, "global_step": 606150, "epoch": 7303} {"train_loss": -27.901187896728516, "global_step": 606151, "epoch": 7303} {"train_loss": -28.095067977905273, "global_step": 606152, "epoch": 7303} {"train_loss": -28.118762969970703, "global_step": 606153, "epoch": 7303} {"train_loss": -28.18310546875, "global_step": 606154, "epoch": 7303} {"train_loss": -27.920978546142578, "global_step": 606155, "epoch": 7303} {"train_loss": -27.9218807220459, "global_step": 606156, "epoch": 7303} {"train_loss": -28.415882110595703, "global_step": 606157, "epoch": 7303} {"train_loss": -28.0463924407959, "global_step": 606158, "epoch": 7303} {"train_loss": -27.950170516967773, "global_step": 606159, "epoch": 7303} {"train_loss": -27.455642700195312, "global_step": 606160, "epoch": 7303} {"train_loss": -27.141281127929688, "global_step": 606161, "epoch": 7303} {"train_loss": -27.17597007751465, "global_step": 606162, "epoch": 7303} {"train_loss": -26.987945556640625, "global_step": 606163, "epoch": 7303} {"train_loss": -27.608600616455078, "global_step": 606164, "epoch": 7303} {"train_loss": -27.812055587768555, "global_step": 606165, "epoch": 7303} {"train_loss": -28.155975341796875, "global_step": 606166, "epoch": 7303} {"train_loss": -27.976856231689453, "global_step": 606167, "epoch": 7303} {"train_loss": -28.05000877380371, "global_step": 606168, "epoch": 7303} {"train_loss": -28.224384307861328, "global_step": 606169, "epoch": 7303} {"train_loss": -27.5269775390625, "global_step": 606170, "epoch": 7303} {"train_loss": -27.558185577392578, "global_step": 606171, "epoch": 7303} {"train_loss": -27.819107055664062, "global_step": 606172, "epoch": 7303} {"train_loss": -28.2899112701416, "global_step": 606173, "epoch": 7303} {"train_loss": -27.879980087280273, "global_step": 606174, "epoch": 7303} {"train_loss": -27.982044219970703, "global_step": 606175, "epoch": 7303} {"train_loss": -27.758909225463867, "global_step": 606176, "epoch": 7303} {"train_loss": -27.855459213256836, "global_step": 606177, "epoch": 7303} {"train_loss": -28.032697677612305, "global_step": 606178, "epoch": 7303} {"train_loss": -27.688623428344727, "global_step": 606179, "epoch": 7303} {"train_loss": -27.8996639251709, "global_step": 606180, "epoch": 7303} {"train_loss": -28.02227210998535, "global_step": 606181, "epoch": 7303} {"train_loss": -27.791746139526367, "global_step": 606182, "epoch": 7303} {"train_loss": -28.40899658203125, "global_step": 606183, "epoch": 7303} {"train_loss": -27.888813018798828, "global_step": 606184, "epoch": 7303} {"train_loss": -27.79811668395996, "global_step": 606185, "epoch": 7303} {"train_loss": -27.95106315612793, "global_step": 606186, "epoch": 7303} {"train_loss": -28.339223861694336, "global_step": 606187, "epoch": 7303} {"train_loss": -28.212188720703125, "global_step": 606188, "epoch": 7303} {"train_loss": -28.104267120361328, "global_step": 606189, "epoch": 7303} {"train_loss": -28.203649520874023, "global_step": 606190, "epoch": 7303} {"train_loss": -27.98907470703125, "global_step": 606191, "epoch": 7303} {"train_loss": -28.754230499267578, "global_step": 606192, "epoch": 7303} {"train_loss": -28.146896362304688, "global_step": 606193, "epoch": 7303} {"train_loss": -28.426254272460938, "global_step": 606194, "epoch": 7303} {"train_loss": -28.252002716064453, "global_step": 606195, "epoch": 7303} {"train_loss": -28.19464683532715, "global_step": 606196, "epoch": 7303} {"train_loss": -28.21504020690918, "global_step": 606197, "epoch": 7303} {"train_loss": -28.236774444580078, "global_step": 606198, "epoch": 7303} {"train_loss": -28.326059341430664, "global_step": 606199, "epoch": 7303} {"train_loss": -27.922271728515625, "global_step": 606200, "epoch": 7303} {"train_loss": -28.1439208984375, "global_step": 606201, "epoch": 7303} {"train_loss": -28.829492568969727, "global_step": 606202, "epoch": 7303} {"train_loss": -28.031326293945312, "global_step": 606203, "epoch": 7303} {"train_loss": -28.573644638061523, "global_step": 606204, "epoch": 7303} {"train_loss": -28.086713790893555, "global_step": 606205, "epoch": 7303} {"train_loss": -27.942611694335938, "global_step": 606206, "epoch": 7303} {"train_loss": -27.85027503967285, "global_step": 606207, "epoch": 7303} {"train_loss": -27.064395904541016, "global_step": 606208, "epoch": 7303} {"train_loss": -27.44122314453125, "global_step": 606209, "epoch": 7303} {"train_loss": -28.021631240844727, "global_step": 606210, "epoch": 7303} {"train_loss": -27.7994441986084, "global_step": 606211, "epoch": 7303} {"train_loss": -27.87000846862793, "global_step": 606212, "epoch": 7303} {"train_loss": -27.555084228515625, "global_step": 606213, "epoch": 7303} {"train_loss": -27.218124389648438, "global_step": 606214, "epoch": 7303} {"train_loss": -27.513280868530273, "global_step": 606215, "epoch": 7303} {"train_loss": -28.151416778564453, "global_step": 606216, "epoch": 7303} {"train_loss": -27.564895629882812, "global_step": 606217, "epoch": 7303} {"train_loss": -27.381546020507812, "global_step": 606218, "epoch": 7303} {"train_loss": -27.8284969329834, "global_step": 606219, "epoch": 7303} {"train_loss": -27.362640380859375, "global_step": 606220, "epoch": 7303} {"train_loss": -27.85552406311035, "global_step": 606221, "epoch": 7303} {"train_loss": -27.74370765686035, "global_step": 606222, "epoch": 7303} {"train_loss": -27.49968910217285, "global_step": 606223, "epoch": 7303} {"train_loss": -27.81690788269043, "global_step": 606224, "epoch": 7303} {"train_loss": -27.96542739868164, "global_step": 606225, "epoch": 7303} {"train_loss": -27.469684600830078, "global_step": 606226, "epoch": 7303} {"train_loss": -27.9000244140625, "global_step": 606227, "epoch": 7303} {"train_loss": -27.774372100830078, "global_step": 606228, "epoch": 7303} {"train_loss": -27.869192123413086, "global_step": 606229, "epoch": 7303} {"train_loss": -28.18646240234375, "global_step": 606230, "epoch": 7303} {"train_loss": -27.91297142764172, "global_step": 606231, "epoch": 7303, "val_loss": 6815089.0} {"train_loss": -27.927087783813477, "global_step": 606232, "epoch": 7304} {"train_loss": -27.42415428161621, "global_step": 606233, "epoch": 7304} {"train_loss": -27.758834838867188, "global_step": 606234, "epoch": 7304} {"train_loss": -27.911895751953125, "global_step": 606235, "epoch": 7304} {"train_loss": -27.607816696166992, "global_step": 606236, "epoch": 7304} {"train_loss": -27.454242706298828, "global_step": 606237, "epoch": 7304} {"train_loss": -27.916269302368164, "global_step": 606238, "epoch": 7304} {"train_loss": -27.361347198486328, "global_step": 606239, "epoch": 7304} {"train_loss": -27.519128799438477, "global_step": 606240, "epoch": 7304} {"train_loss": -27.5650634765625, "global_step": 606241, "epoch": 7304} {"train_loss": -27.548492431640625, "global_step": 606242, "epoch": 7304} {"train_loss": -27.930448532104492, "global_step": 606243, "epoch": 7304} {"train_loss": -27.774688720703125, "global_step": 606244, "epoch": 7304} {"train_loss": -27.951526641845703, "global_step": 606245, "epoch": 7304} {"train_loss": -28.02862548828125, "global_step": 606246, "epoch": 7304} {"train_loss": -28.14167594909668, "global_step": 606247, "epoch": 7304} {"train_loss": -28.329069137573242, "global_step": 606248, "epoch": 7304} {"train_loss": -27.992786407470703, "global_step": 606249, "epoch": 7304} {"train_loss": -27.681488037109375, "global_step": 606250, "epoch": 7304} {"train_loss": -27.862096786499023, "global_step": 606251, "epoch": 7304} {"train_loss": -27.49126625061035, "global_step": 606252, "epoch": 7304} {"train_loss": -27.88214111328125, "global_step": 606253, "epoch": 7304} {"train_loss": -27.82049560546875, "global_step": 606254, "epoch": 7304} {"train_loss": -27.79836082458496, "global_step": 606255, "epoch": 7304} {"train_loss": -27.9067440032959, "global_step": 606256, "epoch": 7304} {"train_loss": -28.1256046295166, "global_step": 606257, "epoch": 7304} {"train_loss": -27.98164176940918, "global_step": 606258, "epoch": 7304} {"train_loss": -28.141773223876953, "global_step": 606259, "epoch": 7304} {"train_loss": -27.98724365234375, "global_step": 606260, "epoch": 7304} {"train_loss": -28.0015869140625, "global_step": 606261, "epoch": 7304} {"train_loss": -28.12774658203125, "global_step": 606262, "epoch": 7304} {"train_loss": -28.4355525970459, "global_step": 606263, "epoch": 7304} {"train_loss": -28.004236221313477, "global_step": 606264, "epoch": 7304} {"train_loss": -28.073917388916016, "global_step": 606265, "epoch": 7304} {"train_loss": -28.021814346313477, "global_step": 606266, "epoch": 7304} {"train_loss": -28.1973819732666, "global_step": 606267, "epoch": 7304} {"train_loss": -28.153913497924805, "global_step": 606268, "epoch": 7304} {"train_loss": -27.821073532104492, "global_step": 606269, "epoch": 7304} {"train_loss": -27.753828048706055, "global_step": 606270, "epoch": 7304} {"train_loss": -26.961111068725586, "global_step": 606271, "epoch": 7304} {"train_loss": -27.485437393188477, "global_step": 606272, "epoch": 7304} {"train_loss": -28.053131103515625, "global_step": 606273, "epoch": 7304} {"train_loss": -27.8458251953125, "global_step": 606274, "epoch": 7304} {"train_loss": -28.040571212768555, "global_step": 606275, "epoch": 7304} {"train_loss": -27.160816192626953, "global_step": 606276, "epoch": 7304} {"train_loss": -27.652301788330078, "global_step": 606277, "epoch": 7304} {"train_loss": -27.606220245361328, "global_step": 606278, "epoch": 7304} {"train_loss": -27.6762638092041, "global_step": 606279, "epoch": 7304} {"train_loss": -28.155364990234375, "global_step": 606280, "epoch": 7304} {"train_loss": -27.88270378112793, "global_step": 606281, "epoch": 7304} {"train_loss": -27.50286865234375, "global_step": 606282, "epoch": 7304} {"train_loss": -28.074594497680664, "global_step": 606283, "epoch": 7304} {"train_loss": -27.731042861938477, "global_step": 606284, "epoch": 7304} {"train_loss": -28.02676773071289, "global_step": 606285, "epoch": 7304} {"train_loss": -27.758283615112305, "global_step": 606286, "epoch": 7304} {"train_loss": -27.829639434814453, "global_step": 606287, "epoch": 7304} {"train_loss": -27.76896095275879, "global_step": 606288, "epoch": 7304} {"train_loss": -28.000476837158203, "global_step": 606289, "epoch": 7304} {"train_loss": -27.49260902404785, "global_step": 606290, "epoch": 7304} {"train_loss": -27.736419677734375, "global_step": 606291, "epoch": 7304} {"train_loss": -27.630102157592773, "global_step": 606292, "epoch": 7304} {"train_loss": -27.552112579345703, "global_step": 606293, "epoch": 7304} {"train_loss": -28.139184951782227, "global_step": 606294, "epoch": 7304} {"train_loss": -27.3597354888916, "global_step": 606295, "epoch": 7304} {"train_loss": -27.92572593688965, "global_step": 606296, "epoch": 7304} {"train_loss": -27.96512794494629, "global_step": 606297, "epoch": 7304} {"train_loss": -27.71091079711914, "global_step": 606298, "epoch": 7304} {"train_loss": -27.529132843017578, "global_step": 606299, "epoch": 7304} {"train_loss": -27.721099853515625, "global_step": 606300, "epoch": 7304} {"train_loss": -27.732038497924805, "global_step": 606301, "epoch": 7304} {"train_loss": -27.941564559936523, "global_step": 606302, "epoch": 7304} {"train_loss": -27.857526779174805, "global_step": 606303, "epoch": 7304} {"train_loss": -27.423187255859375, "global_step": 606304, "epoch": 7304} {"train_loss": -28.1292781829834, "global_step": 606305, "epoch": 7304} {"train_loss": -27.77555274963379, "global_step": 606306, "epoch": 7304} {"train_loss": -28.087400436401367, "global_step": 606307, "epoch": 7304} {"train_loss": -27.9252986907959, "global_step": 606308, "epoch": 7304} {"train_loss": -27.85671043395996, "global_step": 606309, "epoch": 7304} {"train_loss": -28.2529239654541, "global_step": 606310, "epoch": 7304} {"train_loss": -28.07209587097168, "global_step": 606311, "epoch": 7304} {"train_loss": -28.168378829956055, "global_step": 606312, "epoch": 7304} {"train_loss": -27.77432632446289, "global_step": 606313, "epoch": 7304} {"train_loss": -27.840228253100292, "global_step": 606314, "epoch": 7304, "val_loss": 6775949.0} {"train_loss": -27.88716697692871, "global_step": 606315, "epoch": 7305} {"train_loss": -27.776641845703125, "global_step": 606316, "epoch": 7305} {"train_loss": -27.652097702026367, "global_step": 606317, "epoch": 7305} {"train_loss": -27.62896728515625, "global_step": 606318, "epoch": 7305} {"train_loss": -27.44598960876465, "global_step": 606319, "epoch": 7305} {"train_loss": -27.54931640625, "global_step": 606320, "epoch": 7305} {"train_loss": -27.92048454284668, "global_step": 606321, "epoch": 7305} {"train_loss": -27.6632022857666, "global_step": 606322, "epoch": 7305} {"train_loss": -27.556798934936523, "global_step": 606323, "epoch": 7305} {"train_loss": -27.728790283203125, "global_step": 606324, "epoch": 7305} {"train_loss": -27.59539794921875, "global_step": 606325, "epoch": 7305} {"train_loss": -27.78529930114746, "global_step": 606326, "epoch": 7305} {"train_loss": -27.793121337890625, "global_step": 606327, "epoch": 7305} {"train_loss": -28.109830856323242, "global_step": 606328, "epoch": 7305} {"train_loss": -27.8282413482666, "global_step": 606329, "epoch": 7305} {"train_loss": -27.717615127563477, "global_step": 606330, "epoch": 7305} {"train_loss": -27.865991592407227, "global_step": 606331, "epoch": 7305} {"train_loss": -27.666574478149414, "global_step": 606332, "epoch": 7305} {"train_loss": -27.968305587768555, "global_step": 606333, "epoch": 7305} {"train_loss": -27.87836265563965, "global_step": 606334, "epoch": 7305} {"train_loss": -28.0300235748291, "global_step": 606335, "epoch": 7305} {"train_loss": -27.9904842376709, "global_step": 606336, "epoch": 7305} {"train_loss": -27.974456787109375, "global_step": 606337, "epoch": 7305} {"train_loss": -27.825376510620117, "global_step": 606338, "epoch": 7305} {"train_loss": -28.254383087158203, "global_step": 606339, "epoch": 7305} {"train_loss": -27.979232788085938, "global_step": 606340, "epoch": 7305} {"train_loss": -28.213775634765625, "global_step": 606341, "epoch": 7305} {"train_loss": -28.096078872680664, "global_step": 606342, "epoch": 7305} {"train_loss": -27.90650749206543, "global_step": 606343, "epoch": 7305} {"train_loss": -28.0709171295166, "global_step": 606344, "epoch": 7305} {"train_loss": -27.8988094329834, "global_step": 606345, "epoch": 7305} {"train_loss": -28.022907257080078, "global_step": 606346, "epoch": 7305} {"train_loss": -28.159955978393555, "global_step": 606347, "epoch": 7305} {"train_loss": -28.227420806884766, "global_step": 606348, "epoch": 7305} {"train_loss": -28.27931785583496, "global_step": 606349, "epoch": 7305} {"train_loss": -28.360248565673828, "global_step": 606350, "epoch": 7305} {"train_loss": -28.042776107788086, "global_step": 606351, "epoch": 7305} {"train_loss": -28.230924606323242, "global_step": 606352, "epoch": 7305} {"train_loss": -28.266950607299805, "global_step": 606353, "epoch": 7305} {"train_loss": -28.6724910736084, "global_step": 606354, "epoch": 7305} {"train_loss": -28.553030014038086, "global_step": 606355, "epoch": 7305} {"train_loss": -28.340280532836914, "global_step": 606356, "epoch": 7305} {"train_loss": -28.221698760986328, "global_step": 606357, "epoch": 7305} {"train_loss": -27.968891143798828, "global_step": 606358, "epoch": 7305} {"train_loss": -28.08771324157715, "global_step": 606359, "epoch": 7305} {"train_loss": -28.198583602905273, "global_step": 606360, "epoch": 7305} {"train_loss": -27.886722564697266, "global_step": 606361, "epoch": 7305} {"train_loss": -28.65469741821289, "global_step": 606362, "epoch": 7305} {"train_loss": -28.12476921081543, "global_step": 606363, "epoch": 7305} {"train_loss": -28.25809097290039, "global_step": 606364, "epoch": 7305} {"train_loss": -28.161483764648438, "global_step": 606365, "epoch": 7305} {"train_loss": -28.435041427612305, "global_step": 606366, "epoch": 7305} {"train_loss": -28.26767349243164, "global_step": 606367, "epoch": 7305} {"train_loss": -28.0212345123291, "global_step": 606368, "epoch": 7305} {"train_loss": -27.998361587524414, "global_step": 606369, "epoch": 7305} {"train_loss": -27.9202938079834, "global_step": 606370, "epoch": 7305} {"train_loss": -28.004032135009766, "global_step": 606371, "epoch": 7305} {"train_loss": -27.958728790283203, "global_step": 606372, "epoch": 7305} {"train_loss": -27.332233428955078, "global_step": 606373, "epoch": 7305} {"train_loss": -27.187829971313477, "global_step": 606374, "epoch": 7305} {"train_loss": -27.92766761779785, "global_step": 606375, "epoch": 7305} {"train_loss": -28.196964263916016, "global_step": 606376, "epoch": 7305} {"train_loss": -27.717008590698242, "global_step": 606377, "epoch": 7305} {"train_loss": -27.743295669555664, "global_step": 606378, "epoch": 7305} {"train_loss": -27.778833389282227, "global_step": 606379, "epoch": 7305} {"train_loss": -27.957361221313477, "global_step": 606380, "epoch": 7305} {"train_loss": -27.890216827392578, "global_step": 606381, "epoch": 7305} {"train_loss": -27.951536178588867, "global_step": 606382, "epoch": 7305} {"train_loss": -28.149250030517578, "global_step": 606383, "epoch": 7305} {"train_loss": -27.92072868347168, "global_step": 606384, "epoch": 7305} {"train_loss": -28.10467529296875, "global_step": 606385, "epoch": 7305} {"train_loss": -27.604639053344727, "global_step": 606386, "epoch": 7305} {"train_loss": -28.043060302734375, "global_step": 606387, "epoch": 7305} {"train_loss": -28.263946533203125, "global_step": 606388, "epoch": 7305} {"train_loss": -28.115467071533203, "global_step": 606389, "epoch": 7305} {"train_loss": -27.899093627929688, "global_step": 606390, "epoch": 7305} {"train_loss": -28.10633659362793, "global_step": 606391, "epoch": 7305} {"train_loss": -27.97144889831543, "global_step": 606392, "epoch": 7305} {"train_loss": -28.27569580078125, "global_step": 606393, "epoch": 7305} {"train_loss": -28.304731369018555, "global_step": 606394, "epoch": 7305} {"train_loss": -28.081008911132812, "global_step": 606395, "epoch": 7305} {"train_loss": -28.07439613342285, "global_step": 606396, "epoch": 7305} {"train_loss": -27.99774744424475, "global_step": 606397, "epoch": 7305, "val_loss": 6712095.0} {"train_loss": -26.30853843688965, "global_step": 606398, "epoch": 7306} {"train_loss": -26.698179244995117, "global_step": 606399, "epoch": 7306} {"train_loss": -27.23553466796875, "global_step": 606400, "epoch": 7306} {"train_loss": -27.163726806640625, "global_step": 606401, "epoch": 7306} {"train_loss": -26.765676498413086, "global_step": 606402, "epoch": 7306} {"train_loss": -26.851064682006836, "global_step": 606403, "epoch": 7306} {"train_loss": -27.51435661315918, "global_step": 606404, "epoch": 7306} {"train_loss": -27.79376220703125, "global_step": 606405, "epoch": 7306} {"train_loss": -27.53742027282715, "global_step": 606406, "epoch": 7306} {"train_loss": -27.617528915405273, "global_step": 606407, "epoch": 7306} {"train_loss": -27.8498592376709, "global_step": 606408, "epoch": 7306} {"train_loss": -27.53570556640625, "global_step": 606409, "epoch": 7306} {"train_loss": -27.43836784362793, "global_step": 606410, "epoch": 7306} {"train_loss": -27.689990997314453, "global_step": 606411, "epoch": 7306} {"train_loss": -27.481708526611328, "global_step": 606412, "epoch": 7306} {"train_loss": -27.692340850830078, "global_step": 606413, "epoch": 7306} {"train_loss": -27.84000015258789, "global_step": 606414, "epoch": 7306} {"train_loss": -27.930744171142578, "global_step": 606415, "epoch": 7306} {"train_loss": -27.7473087310791, "global_step": 606416, "epoch": 7306} {"train_loss": -28.087574005126953, "global_step": 606417, "epoch": 7306} {"train_loss": -27.7171630859375, "global_step": 606418, "epoch": 7306} {"train_loss": -27.96687126159668, "global_step": 606419, "epoch": 7306} {"train_loss": -28.150100708007812, "global_step": 606420, "epoch": 7306} {"train_loss": -28.07215690612793, "global_step": 606421, "epoch": 7306} {"train_loss": -28.016611099243164, "global_step": 606422, "epoch": 7306} {"train_loss": -27.768049240112305, "global_step": 606423, "epoch": 7306} {"train_loss": -27.547088623046875, "global_step": 606424, "epoch": 7306} {"train_loss": -28.155532836914062, "global_step": 606425, "epoch": 7306} {"train_loss": -27.801420211791992, "global_step": 606426, "epoch": 7306} {"train_loss": -27.946765899658203, "global_step": 606427, "epoch": 7306} {"train_loss": -27.8851318359375, "global_step": 606428, "epoch": 7306} {"train_loss": -28.24118995666504, "global_step": 606429, "epoch": 7306} {"train_loss": -27.8664608001709, "global_step": 606430, "epoch": 7306} {"train_loss": -28.346586227416992, "global_step": 606431, "epoch": 7306} {"train_loss": -28.389867782592773, "global_step": 606432, "epoch": 7306} {"train_loss": -28.450414657592773, "global_step": 606433, "epoch": 7306} {"train_loss": -27.943567276000977, "global_step": 606434, "epoch": 7306} {"train_loss": -28.19937515258789, "global_step": 606435, "epoch": 7306} {"train_loss": -28.072362899780273, "global_step": 606436, "epoch": 7306} {"train_loss": -28.231779098510742, "global_step": 606437, "epoch": 7306} {"train_loss": -27.87359619140625, "global_step": 606438, "epoch": 7306} {"train_loss": -28.424230575561523, "global_step": 606439, "epoch": 7306} {"train_loss": -27.90380859375, "global_step": 606440, "epoch": 7306} {"train_loss": -28.2236328125, "global_step": 606441, "epoch": 7306} {"train_loss": -28.15308952331543, "global_step": 606442, "epoch": 7306} {"train_loss": -28.207883834838867, "global_step": 606443, "epoch": 7306} {"train_loss": -28.532835006713867, "global_step": 606444, "epoch": 7306} {"train_loss": -28.520925521850586, "global_step": 606445, "epoch": 7306} {"train_loss": -28.105712890625, "global_step": 606446, "epoch": 7306} {"train_loss": -28.167531967163086, "global_step": 606447, "epoch": 7306} {"train_loss": -28.109867095947266, "global_step": 606448, "epoch": 7306} {"train_loss": -27.98099708557129, "global_step": 606449, "epoch": 7306} {"train_loss": -28.333728790283203, "global_step": 606450, "epoch": 7306} {"train_loss": -27.739185333251953, "global_step": 606451, "epoch": 7306} {"train_loss": -28.158315658569336, "global_step": 606452, "epoch": 7306} {"train_loss": -27.926727294921875, "global_step": 606453, "epoch": 7306} {"train_loss": -27.779462814331055, "global_step": 606454, "epoch": 7306} {"train_loss": -27.788190841674805, "global_step": 606455, "epoch": 7306} {"train_loss": -28.1036319732666, "global_step": 606456, "epoch": 7306} {"train_loss": -28.26517105102539, "global_step": 606457, "epoch": 7306} {"train_loss": -27.917911529541016, "global_step": 606458, "epoch": 7306} {"train_loss": -27.730634689331055, "global_step": 606459, "epoch": 7306} {"train_loss": -28.066099166870117, "global_step": 606460, "epoch": 7306} {"train_loss": -28.039358139038086, "global_step": 606461, "epoch": 7306} {"train_loss": -27.95514488220215, "global_step": 606462, "epoch": 7306} {"train_loss": -27.985910415649414, "global_step": 606463, "epoch": 7306} {"train_loss": -27.863758087158203, "global_step": 606464, "epoch": 7306} {"train_loss": -27.966827392578125, "global_step": 606465, "epoch": 7306} {"train_loss": -27.499868392944336, "global_step": 606466, "epoch": 7306} {"train_loss": -28.040210723876953, "global_step": 606467, "epoch": 7306} {"train_loss": -28.028400421142578, "global_step": 606468, "epoch": 7306} {"train_loss": -28.1084041595459, "global_step": 606469, "epoch": 7306} {"train_loss": -28.08368492126465, "global_step": 606470, "epoch": 7306} {"train_loss": -27.995542526245117, "global_step": 606471, "epoch": 7306} {"train_loss": -28.29241943359375, "global_step": 606472, "epoch": 7306} {"train_loss": -27.60500144958496, "global_step": 606473, "epoch": 7306} {"train_loss": -28.591724395751953, "global_step": 606474, "epoch": 7306} {"train_loss": -28.198545455932617, "global_step": 606475, "epoch": 7306} {"train_loss": -27.862619400024414, "global_step": 606476, "epoch": 7306} {"train_loss": -28.086780548095703, "global_step": 606477, "epoch": 7306} {"train_loss": -28.47245216369629, "global_step": 606478, "epoch": 7306} {"train_loss": -28.34921646118164, "global_step": 606479, "epoch": 7306} {"train_loss": -27.934814430144897, "global_step": 606480, "epoch": 7306, "val_loss": 6735279.0} {"train_loss": -27.371374130249023, "global_step": 606481, "epoch": 7307} {"train_loss": -28.05496597290039, "global_step": 606482, "epoch": 7307} {"train_loss": -27.633819580078125, "global_step": 606483, "epoch": 7307} {"train_loss": -28.12529945373535, "global_step": 606484, "epoch": 7307} {"train_loss": -27.991535186767578, "global_step": 606485, "epoch": 7307} {"train_loss": -27.671960830688477, "global_step": 606486, "epoch": 7307} {"train_loss": -27.7039852142334, "global_step": 606487, "epoch": 7307} {"train_loss": -27.896499633789062, "global_step": 606488, "epoch": 7307} {"train_loss": -27.67832374572754, "global_step": 606489, "epoch": 7307} {"train_loss": -27.933242797851562, "global_step": 606490, "epoch": 7307} {"train_loss": -28.103113174438477, "global_step": 606491, "epoch": 7307} {"train_loss": -28.020477294921875, "global_step": 606492, "epoch": 7307} {"train_loss": -27.972192764282227, "global_step": 606493, "epoch": 7307} {"train_loss": -28.062387466430664, "global_step": 606494, "epoch": 7307} {"train_loss": -27.958887100219727, "global_step": 606495, "epoch": 7307} {"train_loss": -27.54776382446289, "global_step": 606496, "epoch": 7307} {"train_loss": -27.855268478393555, "global_step": 606497, "epoch": 7307} {"train_loss": -27.339069366455078, "global_step": 606498, "epoch": 7307} {"train_loss": -27.567914962768555, "global_step": 606499, "epoch": 7307} {"train_loss": -28.1295223236084, "global_step": 606500, "epoch": 7307} {"train_loss": -27.9797420501709, "global_step": 606501, "epoch": 7307} {"train_loss": -28.024755477905273, "global_step": 606502, "epoch": 7307} {"train_loss": -27.946552276611328, "global_step": 606503, "epoch": 7307} {"train_loss": -27.763092041015625, "global_step": 606504, "epoch": 7307} {"train_loss": -27.1215877532959, "global_step": 606505, "epoch": 7307} {"train_loss": -27.0079402923584, "global_step": 606506, "epoch": 7307} {"train_loss": -27.94495964050293, "global_step": 606507, "epoch": 7307} {"train_loss": -27.70533561706543, "global_step": 606508, "epoch": 7307} {"train_loss": -27.83307456970215, "global_step": 606509, "epoch": 7307} {"train_loss": -28.283111572265625, "global_step": 606510, "epoch": 7307} {"train_loss": -27.33584976196289, "global_step": 606511, "epoch": 7307} {"train_loss": -27.70405387878418, "global_step": 606512, "epoch": 7307} {"train_loss": -27.891950607299805, "global_step": 606513, "epoch": 7307} {"train_loss": -28.206953048706055, "global_step": 606514, "epoch": 7307} {"train_loss": -27.884735107421875, "global_step": 606515, "epoch": 7307} {"train_loss": -27.627099990844727, "global_step": 606516, "epoch": 7307} {"train_loss": -28.152265548706055, "global_step": 606517, "epoch": 7307} {"train_loss": -27.656177520751953, "global_step": 606518, "epoch": 7307} {"train_loss": -27.86054801940918, "global_step": 606519, "epoch": 7307} {"train_loss": -27.827880859375, "global_step": 606520, "epoch": 7307} {"train_loss": -27.949121475219727, "global_step": 606521, "epoch": 7307} {"train_loss": -27.905628204345703, "global_step": 606522, "epoch": 7307} {"train_loss": -27.92832374572754, "global_step": 606523, "epoch": 7307} {"train_loss": -27.882648468017578, "global_step": 606524, "epoch": 7307} {"train_loss": -27.94535255432129, "global_step": 606525, "epoch": 7307} {"train_loss": -27.94733238220215, "global_step": 606526, "epoch": 7307} {"train_loss": -27.7789306640625, "global_step": 606527, "epoch": 7307} {"train_loss": -28.194589614868164, "global_step": 606528, "epoch": 7307} {"train_loss": -27.89068603515625, "global_step": 606529, "epoch": 7307} {"train_loss": -28.093841552734375, "global_step": 606530, "epoch": 7307} {"train_loss": -28.21087646484375, "global_step": 606531, "epoch": 7307} {"train_loss": -28.065244674682617, "global_step": 606532, "epoch": 7307} {"train_loss": -27.994123458862305, "global_step": 606533, "epoch": 7307} {"train_loss": -27.940231323242188, "global_step": 606534, "epoch": 7307} {"train_loss": -28.187381744384766, "global_step": 606535, "epoch": 7307} {"train_loss": -28.07008934020996, "global_step": 606536, "epoch": 7307} {"train_loss": -28.087080001831055, "global_step": 606537, "epoch": 7307} {"train_loss": -28.22430992126465, "global_step": 606538, "epoch": 7307} {"train_loss": -28.324905395507812, "global_step": 606539, "epoch": 7307} {"train_loss": -28.388837814331055, "global_step": 606540, "epoch": 7307} {"train_loss": -28.059377670288086, "global_step": 606541, "epoch": 7307} {"train_loss": -28.250715255737305, "global_step": 606542, "epoch": 7307} {"train_loss": -28.36603355407715, "global_step": 606543, "epoch": 7307} {"train_loss": -27.9397029876709, "global_step": 606544, "epoch": 7307} {"train_loss": -28.27699089050293, "global_step": 606545, "epoch": 7307} {"train_loss": -27.96392822265625, "global_step": 606546, "epoch": 7307} {"train_loss": -28.11518669128418, "global_step": 606547, "epoch": 7307} {"train_loss": -27.963443756103516, "global_step": 606548, "epoch": 7307} {"train_loss": -27.901830673217773, "global_step": 606549, "epoch": 7307} {"train_loss": -28.196155548095703, "global_step": 606550, "epoch": 7307} {"train_loss": -28.022363662719727, "global_step": 606551, "epoch": 7307} {"train_loss": -27.633825302124023, "global_step": 606552, "epoch": 7307} {"train_loss": -27.971303939819336, "global_step": 606553, "epoch": 7307} {"train_loss": -28.12221336364746, "global_step": 606554, "epoch": 7307} {"train_loss": -28.312076568603516, "global_step": 606555, "epoch": 7307} {"train_loss": -28.014373779296875, "global_step": 606556, "epoch": 7307} {"train_loss": -28.0654296875, "global_step": 606557, "epoch": 7307} {"train_loss": -27.975133895874023, "global_step": 606558, "epoch": 7307} {"train_loss": -27.714319229125977, "global_step": 606559, "epoch": 7307} {"train_loss": -28.04408073425293, "global_step": 606560, "epoch": 7307} {"train_loss": -27.62467384338379, "global_step": 606561, "epoch": 7307} {"train_loss": -28.208984375, "global_step": 606562, "epoch": 7307} {"train_loss": -27.9253594501909, "global_step": 606563, "epoch": 7307, "val_loss": 6735752.5} {"train_loss": -27.538043975830078, "global_step": 606564, "epoch": 7308} {"train_loss": -27.043323516845703, "global_step": 606565, "epoch": 7308} {"train_loss": -27.638341903686523, "global_step": 606566, "epoch": 7308} {"train_loss": -27.081003189086914, "global_step": 606567, "epoch": 7308} {"train_loss": -27.681854248046875, "global_step": 606568, "epoch": 7308} {"train_loss": -27.104400634765625, "global_step": 606569, "epoch": 7308} {"train_loss": -27.163793563842773, "global_step": 606570, "epoch": 7308} {"train_loss": -26.870813369750977, "global_step": 606571, "epoch": 7308} {"train_loss": -27.52768898010254, "global_step": 606572, "epoch": 7308} {"train_loss": -27.09332847595215, "global_step": 606573, "epoch": 7308} {"train_loss": -27.386396408081055, "global_step": 606574, "epoch": 7308} {"train_loss": -27.445953369140625, "global_step": 606575, "epoch": 7308} {"train_loss": -27.7775821685791, "global_step": 606576, "epoch": 7308} {"train_loss": -27.208276748657227, "global_step": 606577, "epoch": 7308} {"train_loss": -27.3985595703125, "global_step": 606578, "epoch": 7308} {"train_loss": -27.7810115814209, "global_step": 606579, "epoch": 7308} {"train_loss": -27.4638729095459, "global_step": 606580, "epoch": 7308} {"train_loss": -27.544418334960938, "global_step": 606581, "epoch": 7308} {"train_loss": -27.604938507080078, "global_step": 606582, "epoch": 7308} {"train_loss": -27.656930923461914, "global_step": 606583, "epoch": 7308} {"train_loss": -27.36056900024414, "global_step": 606584, "epoch": 7308} {"train_loss": -28.031721115112305, "global_step": 606585, "epoch": 7308} {"train_loss": -27.5808162689209, "global_step": 606586, "epoch": 7308} {"train_loss": -27.879858016967773, "global_step": 606587, "epoch": 7308} {"train_loss": -27.79325294494629, "global_step": 606588, "epoch": 7308} {"train_loss": -28.10260009765625, "global_step": 606589, "epoch": 7308} {"train_loss": -27.871875762939453, "global_step": 606590, "epoch": 7308} {"train_loss": -27.802478790283203, "global_step": 606591, "epoch": 7308} {"train_loss": -27.87811851501465, "global_step": 606592, "epoch": 7308} {"train_loss": -28.24812126159668, "global_step": 606593, "epoch": 7308} {"train_loss": -27.921875, "global_step": 606594, "epoch": 7308} {"train_loss": -28.1076717376709, "global_step": 606595, "epoch": 7308} {"train_loss": -27.802587509155273, "global_step": 606596, "epoch": 7308} {"train_loss": -28.149829864501953, "global_step": 606597, "epoch": 7308} {"train_loss": -28.216949462890625, "global_step": 606598, "epoch": 7308} {"train_loss": -28.088010787963867, "global_step": 606599, "epoch": 7308} {"train_loss": -27.88947105407715, "global_step": 606600, "epoch": 7308} {"train_loss": -28.232763290405273, "global_step": 606601, "epoch": 7308} {"train_loss": -28.188074111938477, "global_step": 606602, "epoch": 7308} {"train_loss": -28.335784912109375, "global_step": 606603, "epoch": 7308} {"train_loss": -27.953027725219727, "global_step": 606604, "epoch": 7308} {"train_loss": -28.30608558654785, "global_step": 606605, "epoch": 7308} {"train_loss": -28.34955406188965, "global_step": 606606, "epoch": 7308} {"train_loss": -27.784208297729492, "global_step": 606607, "epoch": 7308} {"train_loss": -28.223819732666016, "global_step": 606608, "epoch": 7308} {"train_loss": -27.923370361328125, "global_step": 606609, "epoch": 7308} {"train_loss": -28.477041244506836, "global_step": 606610, "epoch": 7308} {"train_loss": -28.2711124420166, "global_step": 606611, "epoch": 7308} {"train_loss": -28.41786003112793, "global_step": 606612, "epoch": 7308} {"train_loss": -28.133209228515625, "global_step": 606613, "epoch": 7308} {"train_loss": -28.0845890045166, "global_step": 606614, "epoch": 7308} {"train_loss": -27.993488311767578, "global_step": 606615, "epoch": 7308} {"train_loss": -28.309125900268555, "global_step": 606616, "epoch": 7308} {"train_loss": -27.884552001953125, "global_step": 606617, "epoch": 7308} {"train_loss": -28.35481071472168, "global_step": 606618, "epoch": 7308} {"train_loss": -28.29682731628418, "global_step": 606619, "epoch": 7308} {"train_loss": -28.101072311401367, "global_step": 606620, "epoch": 7308} {"train_loss": -28.345685958862305, "global_step": 606621, "epoch": 7308} {"train_loss": -27.902130126953125, "global_step": 606622, "epoch": 7308} {"train_loss": -28.068784713745117, "global_step": 606623, "epoch": 7308} {"train_loss": -28.238203048706055, "global_step": 606624, "epoch": 7308} {"train_loss": -28.20012855529785, "global_step": 606625, "epoch": 7308} {"train_loss": -28.185211181640625, "global_step": 606626, "epoch": 7308} {"train_loss": -28.051788330078125, "global_step": 606627, "epoch": 7308} {"train_loss": -28.098255157470703, "global_step": 606628, "epoch": 7308} {"train_loss": -28.300247192382812, "global_step": 606629, "epoch": 7308} {"train_loss": -27.851715087890625, "global_step": 606630, "epoch": 7308} {"train_loss": -27.786550521850586, "global_step": 606631, "epoch": 7308} {"train_loss": -27.583663940429688, "global_step": 606632, "epoch": 7308} {"train_loss": -27.298810958862305, "global_step": 606633, "epoch": 7308} {"train_loss": -26.62664222717285, "global_step": 606634, "epoch": 7308} {"train_loss": -26.68832778930664, "global_step": 606635, "epoch": 7308} {"train_loss": -27.341184616088867, "global_step": 606636, "epoch": 7308} {"train_loss": -28.10599136352539, "global_step": 606637, "epoch": 7308} {"train_loss": -27.852161407470703, "global_step": 606638, "epoch": 7308} {"train_loss": -28.171375274658203, "global_step": 606639, "epoch": 7308} {"train_loss": -28.121967315673828, "global_step": 606640, "epoch": 7308} {"train_loss": -27.919296264648438, "global_step": 606641, "epoch": 7308} {"train_loss": -28.235715866088867, "global_step": 606642, "epoch": 7308} {"train_loss": -27.877668380737305, "global_step": 606643, "epoch": 7308} {"train_loss": -28.373432159423828, "global_step": 606644, "epoch": 7308} {"train_loss": -28.008346557617188, "global_step": 606645, "epoch": 7308} {"train_loss": -27.864480328847126, "global_step": 606646, "epoch": 7308, "val_loss": 6730185.0} {"train_loss": -27.53375816345215, "global_step": 606647, "epoch": 7309} {"train_loss": -27.543237686157227, "global_step": 606648, "epoch": 7309} {"train_loss": -27.83681297302246, "global_step": 606649, "epoch": 7309} {"train_loss": -27.96851921081543, "global_step": 606650, "epoch": 7309} {"train_loss": -27.38336181640625, "global_step": 606651, "epoch": 7309} {"train_loss": -27.605640411376953, "global_step": 606652, "epoch": 7309} {"train_loss": -27.34830665588379, "global_step": 606653, "epoch": 7309} {"train_loss": -27.89960289001465, "global_step": 606654, "epoch": 7309} {"train_loss": -27.60487174987793, "global_step": 606655, "epoch": 7309} {"train_loss": -27.373580932617188, "global_step": 606656, "epoch": 7309} {"train_loss": -27.557819366455078, "global_step": 606657, "epoch": 7309} {"train_loss": -27.479333877563477, "global_step": 606658, "epoch": 7309} {"train_loss": -27.70294189453125, "global_step": 606659, "epoch": 7309} {"train_loss": -28.00892448425293, "global_step": 606660, "epoch": 7309} {"train_loss": -27.78938102722168, "global_step": 606661, "epoch": 7309} {"train_loss": -27.742212295532227, "global_step": 606662, "epoch": 7309} {"train_loss": -27.987506866455078, "global_step": 606663, "epoch": 7309} {"train_loss": -27.921228408813477, "global_step": 606664, "epoch": 7309} {"train_loss": -27.99354362487793, "global_step": 606665, "epoch": 7309} {"train_loss": -28.177473068237305, "global_step": 606666, "epoch": 7309} {"train_loss": -27.913864135742188, "global_step": 606667, "epoch": 7309} {"train_loss": -28.047225952148438, "global_step": 606668, "epoch": 7309} {"train_loss": -28.161733627319336, "global_step": 606669, "epoch": 7309} {"train_loss": -27.9306583404541, "global_step": 606670, "epoch": 7309} {"train_loss": -28.29801368713379, "global_step": 606671, "epoch": 7309} {"train_loss": -28.273096084594727, "global_step": 606672, "epoch": 7309} {"train_loss": -27.88446617126465, "global_step": 606673, "epoch": 7309} {"train_loss": -28.325658798217773, "global_step": 606674, "epoch": 7309} {"train_loss": -28.40455436706543, "global_step": 606675, "epoch": 7309} {"train_loss": -28.2431583404541, "global_step": 606676, "epoch": 7309} {"train_loss": -28.3100528717041, "global_step": 606677, "epoch": 7309} {"train_loss": -28.114328384399414, "global_step": 606678, "epoch": 7309} {"train_loss": -28.419965744018555, "global_step": 606679, "epoch": 7309} {"train_loss": -28.3370418548584, "global_step": 606680, "epoch": 7309} {"train_loss": -28.100767135620117, "global_step": 606681, "epoch": 7309} {"train_loss": -27.966888427734375, "global_step": 606682, "epoch": 7309} {"train_loss": -28.17632484436035, "global_step": 606683, "epoch": 7309} {"train_loss": -28.410505294799805, "global_step": 606684, "epoch": 7309} {"train_loss": -28.142688751220703, "global_step": 606685, "epoch": 7309} {"train_loss": -28.10255241394043, "global_step": 606686, "epoch": 7309} {"train_loss": -28.210403442382812, "global_step": 606687, "epoch": 7309} {"train_loss": -28.02351188659668, "global_step": 606688, "epoch": 7309} {"train_loss": -28.384729385375977, "global_step": 606689, "epoch": 7309} {"train_loss": -28.255176544189453, "global_step": 606690, "epoch": 7309} {"train_loss": -27.665958404541016, "global_step": 606691, "epoch": 7309} {"train_loss": -28.527490615844727, "global_step": 606692, "epoch": 7309} {"train_loss": -27.681371688842773, "global_step": 606693, "epoch": 7309} {"train_loss": -28.185041427612305, "global_step": 606694, "epoch": 7309} {"train_loss": -28.125186920166016, "global_step": 606695, "epoch": 7309} {"train_loss": -28.093610763549805, "global_step": 606696, "epoch": 7309} {"train_loss": -28.323318481445312, "global_step": 606697, "epoch": 7309} {"train_loss": -28.08808708190918, "global_step": 606698, "epoch": 7309} {"train_loss": -27.93037223815918, "global_step": 606699, "epoch": 7309} {"train_loss": -27.739627838134766, "global_step": 606700, "epoch": 7309} {"train_loss": -27.317138671875, "global_step": 606701, "epoch": 7309} {"train_loss": -27.029504776000977, "global_step": 606702, "epoch": 7309} {"train_loss": -27.445188522338867, "global_step": 606703, "epoch": 7309} {"train_loss": -28.106616973876953, "global_step": 606704, "epoch": 7309} {"train_loss": -28.156177520751953, "global_step": 606705, "epoch": 7309} {"train_loss": -27.757238388061523, "global_step": 606706, "epoch": 7309} {"train_loss": -28.41724967956543, "global_step": 606707, "epoch": 7309} {"train_loss": -28.187347412109375, "global_step": 606708, "epoch": 7309} {"train_loss": -28.232587814331055, "global_step": 606709, "epoch": 7309} {"train_loss": -28.276208877563477, "global_step": 606710, "epoch": 7309} {"train_loss": -28.286529541015625, "global_step": 606711, "epoch": 7309} {"train_loss": -28.317853927612305, "global_step": 606712, "epoch": 7309} {"train_loss": -28.154525756835938, "global_step": 606713, "epoch": 7309} {"train_loss": -28.57989501953125, "global_step": 606714, "epoch": 7309} {"train_loss": -28.300662994384766, "global_step": 606715, "epoch": 7309} {"train_loss": -28.439599990844727, "global_step": 606716, "epoch": 7309} {"train_loss": -28.434900283813477, "global_step": 606717, "epoch": 7309} {"train_loss": -28.434247970581055, "global_step": 606718, "epoch": 7309} {"train_loss": -28.04436683654785, "global_step": 606719, "epoch": 7309} {"train_loss": -28.203521728515625, "global_step": 606720, "epoch": 7309} {"train_loss": -28.19793701171875, "global_step": 606721, "epoch": 7309} {"train_loss": -28.029617309570312, "global_step": 606722, "epoch": 7309} {"train_loss": -28.585453033447266, "global_step": 606723, "epoch": 7309} {"train_loss": -27.85279655456543, "global_step": 606724, "epoch": 7309} {"train_loss": -27.90216064453125, "global_step": 606725, "epoch": 7309} {"train_loss": -27.518110275268555, "global_step": 606726, "epoch": 7309} {"train_loss": -27.741641998291016, "global_step": 606727, "epoch": 7309} {"train_loss": -27.734960556030273, "global_step": 606728, "epoch": 7309} {"train_loss": -28.012856609850044, "global_step": 606729, "epoch": 7309, "val_loss": 6562310.5} {"train_loss": -27.062458038330078, "global_step": 606730, "epoch": 7310} {"train_loss": -27.099533081054688, "global_step": 606731, "epoch": 7310} {"train_loss": -27.486997604370117, "global_step": 606732, "epoch": 7310} {"train_loss": -27.080341339111328, "global_step": 606733, "epoch": 7310} {"train_loss": -27.362836837768555, "global_step": 606734, "epoch": 7310} {"train_loss": -27.517684936523438, "global_step": 606735, "epoch": 7310} {"train_loss": -27.45157814025879, "global_step": 606736, "epoch": 7310} {"train_loss": -28.0091609954834, "global_step": 606737, "epoch": 7310} {"train_loss": -27.87978172302246, "global_step": 606738, "epoch": 7310} {"train_loss": -27.77685546875, "global_step": 606739, "epoch": 7310} {"train_loss": -27.4681396484375, "global_step": 606740, "epoch": 7310} {"train_loss": -27.8005313873291, "global_step": 606741, "epoch": 7310} {"train_loss": -27.434255599975586, "global_step": 606742, "epoch": 7310} {"train_loss": -27.66815185546875, "global_step": 606743, "epoch": 7310} {"train_loss": -27.171293258666992, "global_step": 606744, "epoch": 7310} {"train_loss": -28.02284049987793, "global_step": 606745, "epoch": 7310} {"train_loss": -27.4189453125, "global_step": 606746, "epoch": 7310} {"train_loss": -27.53207778930664, "global_step": 606747, "epoch": 7310} {"train_loss": -27.8515625, "global_step": 606748, "epoch": 7310} {"train_loss": -27.64963722229004, "global_step": 606749, "epoch": 7310} {"train_loss": -27.959211349487305, "global_step": 606750, "epoch": 7310} {"train_loss": -27.86333656311035, "global_step": 606751, "epoch": 7310} {"train_loss": -28.280487060546875, "global_step": 606752, "epoch": 7310} {"train_loss": -27.570758819580078, "global_step": 606753, "epoch": 7310} {"train_loss": -28.236312866210938, "global_step": 606754, "epoch": 7310} {"train_loss": -27.782251358032227, "global_step": 606755, "epoch": 7310} {"train_loss": -28.161386489868164, "global_step": 606756, "epoch": 7310} {"train_loss": -27.716739654541016, "global_step": 606757, "epoch": 7310} {"train_loss": -27.75660514831543, "global_step": 606758, "epoch": 7310} {"train_loss": -28.227924346923828, "global_step": 606759, "epoch": 7310} {"train_loss": -27.907657623291016, "global_step": 606760, "epoch": 7310} {"train_loss": -27.9872989654541, "global_step": 606761, "epoch": 7310} {"train_loss": -28.210119247436523, "global_step": 606762, "epoch": 7310} {"train_loss": -27.822797775268555, "global_step": 606763, "epoch": 7310} {"train_loss": -28.10369873046875, "global_step": 606764, "epoch": 7310} {"train_loss": -28.0765323638916, "global_step": 606765, "epoch": 7310} {"train_loss": -28.085432052612305, "global_step": 606766, "epoch": 7310} {"train_loss": -27.968725204467773, "global_step": 606767, "epoch": 7310} {"train_loss": -28.288318634033203, "global_step": 606768, "epoch": 7310} {"train_loss": -28.214496612548828, "global_step": 606769, "epoch": 7310} {"train_loss": -28.301868438720703, "global_step": 606770, "epoch": 7310} {"train_loss": -28.070180892944336, "global_step": 606771, "epoch": 7310} {"train_loss": -27.89996910095215, "global_step": 606772, "epoch": 7310} {"train_loss": -28.13848304748535, "global_step": 606773, "epoch": 7310} {"train_loss": -28.4821834564209, "global_step": 606774, "epoch": 7310} {"train_loss": -28.0567626953125, "global_step": 606775, "epoch": 7310} {"train_loss": -27.93699073791504, "global_step": 606776, "epoch": 7310} {"train_loss": -28.201948165893555, "global_step": 606777, "epoch": 7310} {"train_loss": -27.71994972229004, "global_step": 606778, "epoch": 7310} {"train_loss": -28.214929580688477, "global_step": 606779, "epoch": 7310} {"train_loss": -27.960607528686523, "global_step": 606780, "epoch": 7310} {"train_loss": -28.087921142578125, "global_step": 606781, "epoch": 7310} {"train_loss": -27.99237632751465, "global_step": 606782, "epoch": 7310} {"train_loss": -28.225194931030273, "global_step": 606783, "epoch": 7310} {"train_loss": -28.13003921508789, "global_step": 606784, "epoch": 7310} {"train_loss": -28.090490341186523, "global_step": 606785, "epoch": 7310} {"train_loss": -28.04660987854004, "global_step": 606786, "epoch": 7310} {"train_loss": -28.53387451171875, "global_step": 606787, "epoch": 7310} {"train_loss": -28.33184814453125, "global_step": 606788, "epoch": 7310} {"train_loss": -28.410078048706055, "global_step": 606789, "epoch": 7310} {"train_loss": -28.406286239624023, "global_step": 606790, "epoch": 7310} {"train_loss": -28.12837028503418, "global_step": 606791, "epoch": 7310} {"train_loss": -28.26063346862793, "global_step": 606792, "epoch": 7310} {"train_loss": -28.048490524291992, "global_step": 606793, "epoch": 7310} {"train_loss": -28.401636123657227, "global_step": 606794, "epoch": 7310} {"train_loss": -28.579599380493164, "global_step": 606795, "epoch": 7310} {"train_loss": -27.971698760986328, "global_step": 606796, "epoch": 7310} {"train_loss": -28.202672958374023, "global_step": 606797, "epoch": 7310} {"train_loss": -28.446704864501953, "global_step": 606798, "epoch": 7310} {"train_loss": -28.00355339050293, "global_step": 606799, "epoch": 7310} {"train_loss": -28.373205184936523, "global_step": 606800, "epoch": 7310} {"train_loss": -28.066757202148438, "global_step": 606801, "epoch": 7310} {"train_loss": -28.152835845947266, "global_step": 606802, "epoch": 7310} {"train_loss": -28.09028434753418, "global_step": 606803, "epoch": 7310} {"train_loss": -28.321521759033203, "global_step": 606804, "epoch": 7310} {"train_loss": -28.150598526000977, "global_step": 606805, "epoch": 7310} {"train_loss": -27.76006507873535, "global_step": 606806, "epoch": 7310} {"train_loss": -28.287128448486328, "global_step": 606807, "epoch": 7310} {"train_loss": -28.36127281188965, "global_step": 606808, "epoch": 7310} {"train_loss": -28.513843536376953, "global_step": 606809, "epoch": 7310} {"train_loss": -28.419721603393555, "global_step": 606810, "epoch": 7310} {"train_loss": -28.16200065612793, "global_step": 606811, "epoch": 7310} {"train_loss": -27.982791464012788, "global_step": 606812, "epoch": 7310, "val_loss": 6576291.0} {"train_loss": -27.40143394470215, "global_step": 606813, "epoch": 7311} {"train_loss": -27.4390811920166, "global_step": 606814, "epoch": 7311} {"train_loss": -27.507415771484375, "global_step": 606815, "epoch": 7311} {"train_loss": -27.580347061157227, "global_step": 606816, "epoch": 7311} {"train_loss": -27.562185287475586, "global_step": 606817, "epoch": 7311} {"train_loss": -27.646575927734375, "global_step": 606818, "epoch": 7311} {"train_loss": -27.93854331970215, "global_step": 606819, "epoch": 7311} {"train_loss": -27.683338165283203, "global_step": 606820, "epoch": 7311} {"train_loss": -28.04640769958496, "global_step": 606821, "epoch": 7311} {"train_loss": -27.992185592651367, "global_step": 606822, "epoch": 7311} {"train_loss": -27.769861221313477, "global_step": 606823, "epoch": 7311} {"train_loss": -27.8375244140625, "global_step": 606824, "epoch": 7311} {"train_loss": -27.795398712158203, "global_step": 606825, "epoch": 7311} {"train_loss": -27.373889923095703, "global_step": 606826, "epoch": 7311} {"train_loss": -27.025272369384766, "global_step": 606827, "epoch": 7311} {"train_loss": -27.575788497924805, "global_step": 606828, "epoch": 7311} {"train_loss": -27.5921573638916, "global_step": 606829, "epoch": 7311} {"train_loss": -28.03067398071289, "global_step": 606830, "epoch": 7311} {"train_loss": -27.672033309936523, "global_step": 606831, "epoch": 7311} {"train_loss": -27.428869247436523, "global_step": 606832, "epoch": 7311} {"train_loss": -27.9602108001709, "global_step": 606833, "epoch": 7311} {"train_loss": -27.628149032592773, "global_step": 606834, "epoch": 7311} {"train_loss": -27.98215103149414, "global_step": 606835, "epoch": 7311} {"train_loss": -27.78285026550293, "global_step": 606836, "epoch": 7311} {"train_loss": -27.986539840698242, "global_step": 606837, "epoch": 7311} {"train_loss": -28.111902236938477, "global_step": 606838, "epoch": 7311} {"train_loss": -27.900955200195312, "global_step": 606839, "epoch": 7311} {"train_loss": -28.17966651916504, "global_step": 606840, "epoch": 7311} {"train_loss": -28.16347312927246, "global_step": 606841, "epoch": 7311} {"train_loss": -27.593698501586914, "global_step": 606842, "epoch": 7311} {"train_loss": -28.19757080078125, "global_step": 606843, "epoch": 7311} {"train_loss": -27.84220314025879, "global_step": 606844, "epoch": 7311} {"train_loss": -28.233203887939453, "global_step": 606845, "epoch": 7311} {"train_loss": -28.075927734375, "global_step": 606846, "epoch": 7311} {"train_loss": -28.286941528320312, "global_step": 606847, "epoch": 7311} {"train_loss": -28.26323890686035, "global_step": 606848, "epoch": 7311} {"train_loss": -28.32679557800293, "global_step": 606849, "epoch": 7311} {"train_loss": -28.339996337890625, "global_step": 606850, "epoch": 7311} {"train_loss": -28.0649471282959, "global_step": 606851, "epoch": 7311} {"train_loss": -28.064077377319336, "global_step": 606852, "epoch": 7311} {"train_loss": -28.159259796142578, "global_step": 606853, "epoch": 7311} {"train_loss": -28.049924850463867, "global_step": 606854, "epoch": 7311} {"train_loss": -27.845605850219727, "global_step": 606855, "epoch": 7311} {"train_loss": -27.820463180541992, "global_step": 606856, "epoch": 7311} {"train_loss": -27.526647567749023, "global_step": 606857, "epoch": 7311} {"train_loss": -27.051239013671875, "global_step": 606858, "epoch": 7311} {"train_loss": -26.459318161010742, "global_step": 606859, "epoch": 7311} {"train_loss": -27.975412368774414, "global_step": 606860, "epoch": 7311} {"train_loss": -27.72956657409668, "global_step": 606861, "epoch": 7311} {"train_loss": -27.442340850830078, "global_step": 606862, "epoch": 7311} {"train_loss": -27.94465446472168, "global_step": 606863, "epoch": 7311} {"train_loss": -27.468420028686523, "global_step": 606864, "epoch": 7311} {"train_loss": -28.1245059967041, "global_step": 606865, "epoch": 7311} {"train_loss": -27.80746841430664, "global_step": 606866, "epoch": 7311} {"train_loss": -27.895925521850586, "global_step": 606867, "epoch": 7311} {"train_loss": -27.90389060974121, "global_step": 606868, "epoch": 7311} {"train_loss": -27.969470977783203, "global_step": 606869, "epoch": 7311} {"train_loss": -27.94598960876465, "global_step": 606870, "epoch": 7311} {"train_loss": -27.52701759338379, "global_step": 606871, "epoch": 7311} {"train_loss": -27.728302001953125, "global_step": 606872, "epoch": 7311} {"train_loss": -27.908628463745117, "global_step": 606873, "epoch": 7311} {"train_loss": -28.05316734313965, "global_step": 606874, "epoch": 7311} {"train_loss": -27.80517578125, "global_step": 606875, "epoch": 7311} {"train_loss": -28.030378341674805, "global_step": 606876, "epoch": 7311} {"train_loss": -28.087011337280273, "global_step": 606877, "epoch": 7311} {"train_loss": -28.142135620117188, "global_step": 606878, "epoch": 7311} {"train_loss": -27.974079132080078, "global_step": 606879, "epoch": 7311} {"train_loss": -27.916025161743164, "global_step": 606880, "epoch": 7311} {"train_loss": -27.54425621032715, "global_step": 606881, "epoch": 7311} {"train_loss": -27.84868812561035, "global_step": 606882, "epoch": 7311} {"train_loss": -27.791519165039062, "global_step": 606883, "epoch": 7311} {"train_loss": -27.534570693969727, "global_step": 606884, "epoch": 7311} {"train_loss": -27.83039665222168, "global_step": 606885, "epoch": 7311} {"train_loss": -27.886072158813477, "global_step": 606886, "epoch": 7311} {"train_loss": -28.354999542236328, "global_step": 606887, "epoch": 7311} {"train_loss": -28.219541549682617, "global_step": 606888, "epoch": 7311} {"train_loss": -27.76771354675293, "global_step": 606889, "epoch": 7311} {"train_loss": -28.160858154296875, "global_step": 606890, "epoch": 7311} {"train_loss": -28.071317672729492, "global_step": 606891, "epoch": 7311} {"train_loss": -28.62322998046875, "global_step": 606892, "epoch": 7311} {"train_loss": -27.855863571166992, "global_step": 606893, "epoch": 7311} {"train_loss": -28.029376983642578, "global_step": 606894, "epoch": 7311} {"train_loss": -27.861271479043616, "global_step": 606895, "epoch": 7311, "val_loss": 6561127.5} {"train_loss": -27.32234001159668, "global_step": 606896, "epoch": 7312} {"train_loss": -27.722110748291016, "global_step": 606897, "epoch": 7312} {"train_loss": -27.231077194213867, "global_step": 606898, "epoch": 7312} {"train_loss": -27.920984268188477, "global_step": 606899, "epoch": 7312} {"train_loss": -27.590551376342773, "global_step": 606900, "epoch": 7312} {"train_loss": -27.60538101196289, "global_step": 606901, "epoch": 7312} {"train_loss": -27.64455223083496, "global_step": 606902, "epoch": 7312} {"train_loss": -27.175947189331055, "global_step": 606903, "epoch": 7312} {"train_loss": -27.804962158203125, "global_step": 606904, "epoch": 7312} {"train_loss": -27.955371856689453, "global_step": 606905, "epoch": 7312} {"train_loss": -27.621931076049805, "global_step": 606906, "epoch": 7312} {"train_loss": -27.328266143798828, "global_step": 606907, "epoch": 7312} {"train_loss": -27.738662719726562, "global_step": 606908, "epoch": 7312} {"train_loss": -27.676544189453125, "global_step": 606909, "epoch": 7312} {"train_loss": -27.634862899780273, "global_step": 606910, "epoch": 7312} {"train_loss": -28.133544921875, "global_step": 606911, "epoch": 7312} {"train_loss": -27.923322677612305, "global_step": 606912, "epoch": 7312} {"train_loss": -27.86993980407715, "global_step": 606913, "epoch": 7312} {"train_loss": -27.691131591796875, "global_step": 606914, "epoch": 7312} {"train_loss": -27.709630966186523, "global_step": 606915, "epoch": 7312} {"train_loss": -27.976165771484375, "global_step": 606916, "epoch": 7312} {"train_loss": -27.996870040893555, "global_step": 606917, "epoch": 7312} {"train_loss": -27.88144874572754, "global_step": 606918, "epoch": 7312} {"train_loss": -28.13897705078125, "global_step": 606919, "epoch": 7312} {"train_loss": -28.111169815063477, "global_step": 606920, "epoch": 7312} {"train_loss": -28.015356063842773, "global_step": 606921, "epoch": 7312} {"train_loss": -28.016550064086914, "global_step": 606922, "epoch": 7312} {"train_loss": -28.404895782470703, "global_step": 606923, "epoch": 7312} {"train_loss": -28.194433212280273, "global_step": 606924, "epoch": 7312} {"train_loss": -28.00775718688965, "global_step": 606925, "epoch": 7312} {"train_loss": -28.32688331604004, "global_step": 606926, "epoch": 7312} {"train_loss": -28.025360107421875, "global_step": 606927, "epoch": 7312} {"train_loss": -28.251190185546875, "global_step": 606928, "epoch": 7312} {"train_loss": -27.949445724487305, "global_step": 606929, "epoch": 7312} {"train_loss": -28.081953048706055, "global_step": 606930, "epoch": 7312} {"train_loss": -28.1209716796875, "global_step": 606931, "epoch": 7312} {"train_loss": -28.46082878112793, "global_step": 606932, "epoch": 7312} {"train_loss": -28.232959747314453, "global_step": 606933, "epoch": 7312} {"train_loss": -28.171316146850586, "global_step": 606934, "epoch": 7312} {"train_loss": -28.105138778686523, "global_step": 606935, "epoch": 7312} {"train_loss": -28.400558471679688, "global_step": 606936, "epoch": 7312} {"train_loss": -28.346342086791992, "global_step": 606937, "epoch": 7312} {"train_loss": -28.41065788269043, "global_step": 606938, "epoch": 7312} {"train_loss": -28.315399169921875, "global_step": 606939, "epoch": 7312} {"train_loss": -28.301366806030273, "global_step": 606940, "epoch": 7312} {"train_loss": -28.46148109436035, "global_step": 606941, "epoch": 7312} {"train_loss": -28.08151626586914, "global_step": 606942, "epoch": 7312} {"train_loss": -28.568151473999023, "global_step": 606943, "epoch": 7312} {"train_loss": -27.9633846282959, "global_step": 606944, "epoch": 7312} {"train_loss": -28.282129287719727, "global_step": 606945, "epoch": 7312} {"train_loss": -28.283477783203125, "global_step": 606946, "epoch": 7312} {"train_loss": -28.238113403320312, "global_step": 606947, "epoch": 7312} {"train_loss": -28.591480255126953, "global_step": 606948, "epoch": 7312} {"train_loss": -28.357297897338867, "global_step": 606949, "epoch": 7312} {"train_loss": -28.486831665039062, "global_step": 606950, "epoch": 7312} {"train_loss": -28.194616317749023, "global_step": 606951, "epoch": 7312} {"train_loss": -28.502079010009766, "global_step": 606952, "epoch": 7312} {"train_loss": -27.829187393188477, "global_step": 606953, "epoch": 7312} {"train_loss": -27.69746971130371, "global_step": 606954, "epoch": 7312} {"train_loss": -26.92449951171875, "global_step": 606955, "epoch": 7312} {"train_loss": -26.136951446533203, "global_step": 606956, "epoch": 7312} {"train_loss": -25.18708610534668, "global_step": 606957, "epoch": 7312} {"train_loss": -27.93099021911621, "global_step": 606958, "epoch": 7312} {"train_loss": -27.57221794128418, "global_step": 606959, "epoch": 7312} {"train_loss": -27.43158531188965, "global_step": 606960, "epoch": 7312} {"train_loss": -27.501569747924805, "global_step": 606961, "epoch": 7312} {"train_loss": -27.2989501953125, "global_step": 606962, "epoch": 7312} {"train_loss": -28.04607582092285, "global_step": 606963, "epoch": 7312} {"train_loss": -27.253705978393555, "global_step": 606964, "epoch": 7312} {"train_loss": -27.902252197265625, "global_step": 606965, "epoch": 7312} {"train_loss": -27.913532257080078, "global_step": 606966, "epoch": 7312} {"train_loss": -27.340503692626953, "global_step": 606967, "epoch": 7312} {"train_loss": -28.021570205688477, "global_step": 606968, "epoch": 7312} {"train_loss": -27.3836612701416, "global_step": 606969, "epoch": 7312} {"train_loss": -27.805601119995117, "global_step": 606970, "epoch": 7312} {"train_loss": -27.9819393157959, "global_step": 606971, "epoch": 7312} {"train_loss": -27.75885009765625, "global_step": 606972, "epoch": 7312} {"train_loss": -27.878244400024414, "global_step": 606973, "epoch": 7312} {"train_loss": -27.95423698425293, "global_step": 606974, "epoch": 7312} {"train_loss": -27.915924072265625, "global_step": 606975, "epoch": 7312} {"train_loss": -27.97663688659668, "global_step": 606976, "epoch": 7312} {"train_loss": -27.654102325439453, "global_step": 606977, "epoch": 7312} {"train_loss": -27.88246481102633, "global_step": 606978, "epoch": 7312, "val_loss": 6651011.0} {"train_loss": -27.865234375, "global_step": 606979, "epoch": 7313} {"train_loss": -27.8287353515625, "global_step": 606980, "epoch": 7313} {"train_loss": -27.593994140625, "global_step": 606981, "epoch": 7313} {"train_loss": -27.636688232421875, "global_step": 606982, "epoch": 7313} {"train_loss": -27.579084396362305, "global_step": 606983, "epoch": 7313} {"train_loss": -27.154998779296875, "global_step": 606984, "epoch": 7313} {"train_loss": -27.368728637695312, "global_step": 606985, "epoch": 7313} {"train_loss": -27.5607967376709, "global_step": 606986, "epoch": 7313} {"train_loss": -27.249866485595703, "global_step": 606987, "epoch": 7313} {"train_loss": -27.606054306030273, "global_step": 606988, "epoch": 7313} {"train_loss": -27.5263614654541, "global_step": 606989, "epoch": 7313} {"train_loss": -27.86566734313965, "global_step": 606990, "epoch": 7313} {"train_loss": -27.690673828125, "global_step": 606991, "epoch": 7313} {"train_loss": -27.819494247436523, "global_step": 606992, "epoch": 7313} {"train_loss": -27.894453048706055, "global_step": 606993, "epoch": 7313} {"train_loss": -27.894306182861328, "global_step": 606994, "epoch": 7313} {"train_loss": -27.73470115661621, "global_step": 606995, "epoch": 7313} {"train_loss": -27.739913940429688, "global_step": 606996, "epoch": 7313} {"train_loss": -28.191755294799805, "global_step": 606997, "epoch": 7313} {"train_loss": -27.680673599243164, "global_step": 606998, "epoch": 7313} {"train_loss": -27.8622989654541, "global_step": 606999, "epoch": 7313} {"train_loss": -28.11750602722168, "global_step": 607000, "epoch": 7313} {"train_loss": -28.18939781188965, "global_step": 607001, "epoch": 7313} {"train_loss": -28.008563995361328, "global_step": 607002, "epoch": 7313} {"train_loss": -27.853296279907227, "global_step": 607003, "epoch": 7313} {"train_loss": -27.9038028717041, "global_step": 607004, "epoch": 7313} {"train_loss": -28.015625, "global_step": 607005, "epoch": 7313} {"train_loss": -28.2995662689209, "global_step": 607006, "epoch": 7313} {"train_loss": -28.173110961914062, "global_step": 607007, "epoch": 7313} {"train_loss": -27.95147132873535, "global_step": 607008, "epoch": 7313} {"train_loss": -28.130598068237305, "global_step": 607009, "epoch": 7313} {"train_loss": -28.286407470703125, "global_step": 607010, "epoch": 7313} {"train_loss": -28.148193359375, "global_step": 607011, "epoch": 7313} {"train_loss": -28.259626388549805, "global_step": 607012, "epoch": 7313} {"train_loss": -28.100584030151367, "global_step": 607013, "epoch": 7313} {"train_loss": -28.17366600036621, "global_step": 607014, "epoch": 7313} {"train_loss": -28.397144317626953, "global_step": 607015, "epoch": 7313} {"train_loss": -28.0419921875, "global_step": 607016, "epoch": 7313} {"train_loss": -27.95417594909668, "global_step": 607017, "epoch": 7313} {"train_loss": -28.092548370361328, "global_step": 607018, "epoch": 7313} {"train_loss": -28.024646759033203, "global_step": 607019, "epoch": 7313} {"train_loss": -28.036209106445312, "global_step": 607020, "epoch": 7313} {"train_loss": -28.16639518737793, "global_step": 607021, "epoch": 7313} {"train_loss": -27.895893096923828, "global_step": 607022, "epoch": 7313} {"train_loss": -27.49347496032715, "global_step": 607023, "epoch": 7313} {"train_loss": -28.131811141967773, "global_step": 607024, "epoch": 7313} {"train_loss": -28.320226669311523, "global_step": 607025, "epoch": 7313} {"train_loss": -28.033544540405273, "global_step": 607026, "epoch": 7313} {"train_loss": -27.845169067382812, "global_step": 607027, "epoch": 7313} {"train_loss": -28.118879318237305, "global_step": 607028, "epoch": 7313} {"train_loss": -27.983312606811523, "global_step": 607029, "epoch": 7313} {"train_loss": -27.557025909423828, "global_step": 607030, "epoch": 7313} {"train_loss": -27.698026657104492, "global_step": 607031, "epoch": 7313} {"train_loss": -27.683670043945312, "global_step": 607032, "epoch": 7313} {"train_loss": -28.498931884765625, "global_step": 607033, "epoch": 7313} {"train_loss": -27.914783477783203, "global_step": 607034, "epoch": 7313} {"train_loss": -27.817731857299805, "global_step": 607035, "epoch": 7313} {"train_loss": -27.9405517578125, "global_step": 607036, "epoch": 7313} {"train_loss": -28.211761474609375, "global_step": 607037, "epoch": 7313} {"train_loss": -27.8637752532959, "global_step": 607038, "epoch": 7313} {"train_loss": -27.720666885375977, "global_step": 607039, "epoch": 7313} {"train_loss": -27.802282333374023, "global_step": 607040, "epoch": 7313} {"train_loss": -27.844385147094727, "global_step": 607041, "epoch": 7313} {"train_loss": -28.108020782470703, "global_step": 607042, "epoch": 7313} {"train_loss": -27.581384658813477, "global_step": 607043, "epoch": 7313} {"train_loss": -28.290054321289062, "global_step": 607044, "epoch": 7313} {"train_loss": -28.501739501953125, "global_step": 607045, "epoch": 7313} {"train_loss": -28.312549591064453, "global_step": 607046, "epoch": 7313} {"train_loss": -27.88800621032715, "global_step": 607047, "epoch": 7313} {"train_loss": -28.731525421142578, "global_step": 607048, "epoch": 7313} {"train_loss": -28.153051376342773, "global_step": 607049, "epoch": 7313} {"train_loss": -28.253101348876953, "global_step": 607050, "epoch": 7313} {"train_loss": -28.028051376342773, "global_step": 607051, "epoch": 7313} {"train_loss": -28.381610870361328, "global_step": 607052, "epoch": 7313} {"train_loss": -28.088109970092773, "global_step": 607053, "epoch": 7313} {"train_loss": -27.834760665893555, "global_step": 607054, "epoch": 7313} {"train_loss": -27.905790328979492, "global_step": 607055, "epoch": 7313} {"train_loss": -28.2432861328125, "global_step": 607056, "epoch": 7313} {"train_loss": -28.181930541992188, "global_step": 607057, "epoch": 7313} {"train_loss": -28.506427764892578, "global_step": 607058, "epoch": 7313} {"train_loss": -28.15359878540039, "global_step": 607059, "epoch": 7313} {"train_loss": -28.183557510375977, "global_step": 607060, "epoch": 7313} {"train_loss": -27.98781521349068, "global_step": 607061, "epoch": 7313, "val_loss": 6621038.0} {"train_loss": -27.838735580444336, "global_step": 607062, "epoch": 7314} {"train_loss": -28.36931800842285, "global_step": 607063, "epoch": 7314} {"train_loss": -27.324979782104492, "global_step": 607064, "epoch": 7314} {"train_loss": -27.472509384155273, "global_step": 607065, "epoch": 7314} {"train_loss": -27.723974227905273, "global_step": 607066, "epoch": 7314} {"train_loss": -27.258167266845703, "global_step": 607067, "epoch": 7314} {"train_loss": -28.2183780670166, "global_step": 607068, "epoch": 7314} {"train_loss": -27.26123046875, "global_step": 607069, "epoch": 7314} {"train_loss": -27.516590118408203, "global_step": 607070, "epoch": 7314} {"train_loss": -27.723651885986328, "global_step": 607071, "epoch": 7314} {"train_loss": -27.861806869506836, "global_step": 607072, "epoch": 7314} {"train_loss": -27.708271026611328, "global_step": 607073, "epoch": 7314} {"train_loss": -27.97809410095215, "global_step": 607074, "epoch": 7314} {"train_loss": -28.083759307861328, "global_step": 607075, "epoch": 7314} {"train_loss": -27.852888107299805, "global_step": 607076, "epoch": 7314} {"train_loss": -27.528766632080078, "global_step": 607077, "epoch": 7314} {"train_loss": -27.5505313873291, "global_step": 607078, "epoch": 7314} {"train_loss": -28.097183227539062, "global_step": 607079, "epoch": 7314} {"train_loss": -28.12678337097168, "global_step": 607080, "epoch": 7314} {"train_loss": -27.952289581298828, "global_step": 607081, "epoch": 7314} {"train_loss": -27.379566192626953, "global_step": 607082, "epoch": 7314} {"train_loss": -27.98651123046875, "global_step": 607083, "epoch": 7314} {"train_loss": -27.55719566345215, "global_step": 607084, "epoch": 7314} {"train_loss": -27.884733200073242, "global_step": 607085, "epoch": 7314} {"train_loss": -28.180572509765625, "global_step": 607086, "epoch": 7314} {"train_loss": -28.1386661529541, "global_step": 607087, "epoch": 7314} {"train_loss": -28.018823623657227, "global_step": 607088, "epoch": 7314} {"train_loss": -28.278440475463867, "global_step": 607089, "epoch": 7314} {"train_loss": -28.297021865844727, "global_step": 607090, "epoch": 7314} {"train_loss": -28.190271377563477, "global_step": 607091, "epoch": 7314} {"train_loss": -27.6935977935791, "global_step": 607092, "epoch": 7314} {"train_loss": -27.94122886657715, "global_step": 607093, "epoch": 7314} {"train_loss": -28.1661319732666, "global_step": 607094, "epoch": 7314} {"train_loss": -28.116230010986328, "global_step": 607095, "epoch": 7314} {"train_loss": -28.251937866210938, "global_step": 607096, "epoch": 7314} {"train_loss": -28.00665855407715, "global_step": 607097, "epoch": 7314} {"train_loss": -28.08199119567871, "global_step": 607098, "epoch": 7314} {"train_loss": -27.688871383666992, "global_step": 607099, "epoch": 7314} {"train_loss": -28.460437774658203, "global_step": 607100, "epoch": 7314} {"train_loss": -28.027027130126953, "global_step": 607101, "epoch": 7314} {"train_loss": -28.4207763671875, "global_step": 607102, "epoch": 7314} {"train_loss": -28.534351348876953, "global_step": 607103, "epoch": 7314} {"train_loss": -28.119098663330078, "global_step": 607104, "epoch": 7314} {"train_loss": -28.143491744995117, "global_step": 607105, "epoch": 7314} {"train_loss": -27.939502716064453, "global_step": 607106, "epoch": 7314} {"train_loss": -28.230825424194336, "global_step": 607107, "epoch": 7314} {"train_loss": -28.064054489135742, "global_step": 607108, "epoch": 7314} {"train_loss": -28.03053092956543, "global_step": 607109, "epoch": 7314} {"train_loss": -27.906171798706055, "global_step": 607110, "epoch": 7314} {"train_loss": -27.80122947692871, "global_step": 607111, "epoch": 7314} {"train_loss": -28.076223373413086, "global_step": 607112, "epoch": 7314} {"train_loss": -28.019872665405273, "global_step": 607113, "epoch": 7314} {"train_loss": -28.288166046142578, "global_step": 607114, "epoch": 7314} {"train_loss": -28.229726791381836, "global_step": 607115, "epoch": 7314} {"train_loss": -27.92180824279785, "global_step": 607116, "epoch": 7314} {"train_loss": -28.027790069580078, "global_step": 607117, "epoch": 7314} {"train_loss": -27.804189682006836, "global_step": 607118, "epoch": 7314} {"train_loss": -27.894271850585938, "global_step": 607119, "epoch": 7314} {"train_loss": -28.406696319580078, "global_step": 607120, "epoch": 7314} {"train_loss": -28.029666900634766, "global_step": 607121, "epoch": 7314} {"train_loss": -28.40846061706543, "global_step": 607122, "epoch": 7314} {"train_loss": -28.262319564819336, "global_step": 607123, "epoch": 7314} {"train_loss": -27.79526138305664, "global_step": 607124, "epoch": 7314} {"train_loss": -27.53309440612793, "global_step": 607125, "epoch": 7314} {"train_loss": -28.225723266601562, "global_step": 607126, "epoch": 7314} {"train_loss": -27.716257095336914, "global_step": 607127, "epoch": 7314} {"train_loss": -27.46954917907715, "global_step": 607128, "epoch": 7314} {"train_loss": -28.05560302734375, "global_step": 607129, "epoch": 7314} {"train_loss": -28.00713539123535, "global_step": 607130, "epoch": 7314} {"train_loss": -28.157489776611328, "global_step": 607131, "epoch": 7314} {"train_loss": -28.496814727783203, "global_step": 607132, "epoch": 7314} {"train_loss": -28.2476806640625, "global_step": 607133, "epoch": 7314} {"train_loss": -27.77410888671875, "global_step": 607134, "epoch": 7314} {"train_loss": -27.910444259643555, "global_step": 607135, "epoch": 7314} {"train_loss": -27.978307723999023, "global_step": 607136, "epoch": 7314} {"train_loss": -27.97930335998535, "global_step": 607137, "epoch": 7314} {"train_loss": -28.029739379882812, "global_step": 607138, "epoch": 7314} {"train_loss": -28.02685546875, "global_step": 607139, "epoch": 7314} {"train_loss": -27.240646362304688, "global_step": 607140, "epoch": 7314} {"train_loss": -28.055225372314453, "global_step": 607141, "epoch": 7314} {"train_loss": -27.8184757232666, "global_step": 607142, "epoch": 7314} {"train_loss": -27.554656982421875, "global_step": 607143, "epoch": 7314} {"train_loss": -27.963393475635943, "global_step": 607144, "epoch": 7314, "val_loss": 6593584.5} {"train_loss": -27.509103775024414, "global_step": 607145, "epoch": 7315} {"train_loss": -28.218900680541992, "global_step": 607146, "epoch": 7315} {"train_loss": -27.52166748046875, "global_step": 607147, "epoch": 7315} {"train_loss": -27.458698272705078, "global_step": 607148, "epoch": 7315} {"train_loss": -27.718114852905273, "global_step": 607149, "epoch": 7315} {"train_loss": -27.23713493347168, "global_step": 607150, "epoch": 7315} {"train_loss": -27.358600616455078, "global_step": 607151, "epoch": 7315} {"train_loss": -27.556198120117188, "global_step": 607152, "epoch": 7315} {"train_loss": -27.70830726623535, "global_step": 607153, "epoch": 7315} {"train_loss": -27.559118270874023, "global_step": 607154, "epoch": 7315} {"train_loss": -27.850000381469727, "global_step": 607155, "epoch": 7315} {"train_loss": -28.011627197265625, "global_step": 607156, "epoch": 7315} {"train_loss": -27.587087631225586, "global_step": 607157, "epoch": 7315} {"train_loss": -27.288593292236328, "global_step": 607158, "epoch": 7315} {"train_loss": -27.55316734313965, "global_step": 607159, "epoch": 7315} {"train_loss": -27.540332794189453, "global_step": 607160, "epoch": 7315} {"train_loss": -27.592382431030273, "global_step": 607161, "epoch": 7315} {"train_loss": -27.045751571655273, "global_step": 607162, "epoch": 7315} {"train_loss": -27.582117080688477, "global_step": 607163, "epoch": 7315} {"train_loss": -27.723386764526367, "global_step": 607164, "epoch": 7315} {"train_loss": -27.2372989654541, "global_step": 607165, "epoch": 7315} {"train_loss": -27.275449752807617, "global_step": 607166, "epoch": 7315} {"train_loss": -26.934253692626953, "global_step": 607167, "epoch": 7315} {"train_loss": -27.734241485595703, "global_step": 607168, "epoch": 7315} {"train_loss": -27.610193252563477, "global_step": 607169, "epoch": 7315} {"train_loss": -27.6494197845459, "global_step": 607170, "epoch": 7315} {"train_loss": -27.99732780456543, "global_step": 607171, "epoch": 7315} {"train_loss": -27.2381649017334, "global_step": 607172, "epoch": 7315} {"train_loss": -27.55718421936035, "global_step": 607173, "epoch": 7315} {"train_loss": -28.14198875427246, "global_step": 607174, "epoch": 7315} {"train_loss": -27.7711181640625, "global_step": 607175, "epoch": 7315} {"train_loss": -27.46986198425293, "global_step": 607176, "epoch": 7315} {"train_loss": -27.671512603759766, "global_step": 607177, "epoch": 7315} {"train_loss": -28.047073364257812, "global_step": 607178, "epoch": 7315} {"train_loss": -27.771268844604492, "global_step": 607179, "epoch": 7315} {"train_loss": -28.061050415039062, "global_step": 607180, "epoch": 7315} {"train_loss": -28.2343692779541, "global_step": 607181, "epoch": 7315} {"train_loss": -27.708967208862305, "global_step": 607182, "epoch": 7315} {"train_loss": -27.947956085205078, "global_step": 607183, "epoch": 7315} {"train_loss": -28.172626495361328, "global_step": 607184, "epoch": 7315} {"train_loss": -27.95100212097168, "global_step": 607185, "epoch": 7315} {"train_loss": -27.821889877319336, "global_step": 607186, "epoch": 7315} {"train_loss": -28.056629180908203, "global_step": 607187, "epoch": 7315} {"train_loss": -28.35540771484375, "global_step": 607188, "epoch": 7315} {"train_loss": -28.050861358642578, "global_step": 607189, "epoch": 7315} {"train_loss": -28.260549545288086, "global_step": 607190, "epoch": 7315} {"train_loss": -28.430505752563477, "global_step": 607191, "epoch": 7315} {"train_loss": -28.275083541870117, "global_step": 607192, "epoch": 7315} {"train_loss": -28.511911392211914, "global_step": 607193, "epoch": 7315} {"train_loss": -28.135242462158203, "global_step": 607194, "epoch": 7315} {"train_loss": -28.03609275817871, "global_step": 607195, "epoch": 7315} {"train_loss": -27.987394332885742, "global_step": 607196, "epoch": 7315} {"train_loss": -28.496015548706055, "global_step": 607197, "epoch": 7315} {"train_loss": -28.344100952148438, "global_step": 607198, "epoch": 7315} {"train_loss": -28.0819091796875, "global_step": 607199, "epoch": 7315} {"train_loss": -28.546655654907227, "global_step": 607200, "epoch": 7315} {"train_loss": -28.164386749267578, "global_step": 607201, "epoch": 7315} {"train_loss": -28.10468101501465, "global_step": 607202, "epoch": 7315} {"train_loss": -28.324140548706055, "global_step": 607203, "epoch": 7315} {"train_loss": -28.645099639892578, "global_step": 607204, "epoch": 7315} {"train_loss": -28.583515167236328, "global_step": 607205, "epoch": 7315} {"train_loss": -28.334381103515625, "global_step": 607206, "epoch": 7315} {"train_loss": -28.58564567565918, "global_step": 607207, "epoch": 7315} {"train_loss": -28.153095245361328, "global_step": 607208, "epoch": 7315} {"train_loss": -28.070280075073242, "global_step": 607209, "epoch": 7315} {"train_loss": -28.08856201171875, "global_step": 607210, "epoch": 7315} {"train_loss": -28.5136661529541, "global_step": 607211, "epoch": 7315} {"train_loss": -28.444473266601562, "global_step": 607212, "epoch": 7315} {"train_loss": -28.31719398498535, "global_step": 607213, "epoch": 7315} {"train_loss": -28.424840927124023, "global_step": 607214, "epoch": 7315} {"train_loss": -27.937192916870117, "global_step": 607215, "epoch": 7315} {"train_loss": -28.220169067382812, "global_step": 607216, "epoch": 7315} {"train_loss": -28.384693145751953, "global_step": 607217, "epoch": 7315} {"train_loss": -27.9271240234375, "global_step": 607218, "epoch": 7315} {"train_loss": -28.05462646484375, "global_step": 607219, "epoch": 7315} {"train_loss": -27.85931968688965, "global_step": 607220, "epoch": 7315} {"train_loss": -27.37967872619629, "global_step": 607221, "epoch": 7315} {"train_loss": -28.21272087097168, "global_step": 607222, "epoch": 7315} {"train_loss": -28.2210750579834, "global_step": 607223, "epoch": 7315} {"train_loss": -28.089447021484375, "global_step": 607224, "epoch": 7315} {"train_loss": -27.200489044189453, "global_step": 607225, "epoch": 7315} {"train_loss": -27.08399772644043, "global_step": 607226, "epoch": 7315} {"train_loss": -27.891669583607868, "global_step": 607227, "epoch": 7315, "val_loss": 6660864.0} {"train_loss": -26.502161026000977, "global_step": 607228, "epoch": 7316} {"train_loss": -26.82538414001465, "global_step": 607229, "epoch": 7316} {"train_loss": -27.187475204467773, "global_step": 607230, "epoch": 7316} {"train_loss": -27.045700073242188, "global_step": 607231, "epoch": 7316} {"train_loss": -27.011768341064453, "global_step": 607232, "epoch": 7316} {"train_loss": -26.909774780273438, "global_step": 607233, "epoch": 7316} {"train_loss": -27.25249671936035, "global_step": 607234, "epoch": 7316} {"train_loss": -27.231779098510742, "global_step": 607235, "epoch": 7316} {"train_loss": -27.053802490234375, "global_step": 607236, "epoch": 7316} {"train_loss": -27.13483238220215, "global_step": 607237, "epoch": 7316} {"train_loss": -27.155017852783203, "global_step": 607238, "epoch": 7316} {"train_loss": -27.615726470947266, "global_step": 607239, "epoch": 7316} {"train_loss": -27.184783935546875, "global_step": 607240, "epoch": 7316} {"train_loss": -27.560964584350586, "global_step": 607241, "epoch": 7316} {"train_loss": -27.569732666015625, "global_step": 607242, "epoch": 7316} {"train_loss": -27.283666610717773, "global_step": 607243, "epoch": 7316} {"train_loss": -27.248456954956055, "global_step": 607244, "epoch": 7316} {"train_loss": -27.339157104492188, "global_step": 607245, "epoch": 7316} {"train_loss": -27.727191925048828, "global_step": 607246, "epoch": 7316} {"train_loss": -27.56733512878418, "global_step": 607247, "epoch": 7316} {"train_loss": -27.51431655883789, "global_step": 607248, "epoch": 7316} {"train_loss": -27.978321075439453, "global_step": 607249, "epoch": 7316} {"train_loss": -27.878320693969727, "global_step": 607250, "epoch": 7316} {"train_loss": -28.023656845092773, "global_step": 607251, "epoch": 7316} {"train_loss": -28.05632972717285, "global_step": 607252, "epoch": 7316} {"train_loss": -27.887216567993164, "global_step": 607253, "epoch": 7316} {"train_loss": -28.26527214050293, "global_step": 607254, "epoch": 7316} {"train_loss": -27.924055099487305, "global_step": 607255, "epoch": 7316} {"train_loss": -28.0778751373291, "global_step": 607256, "epoch": 7316} {"train_loss": -28.075225830078125, "global_step": 607257, "epoch": 7316} {"train_loss": -27.656896591186523, "global_step": 607258, "epoch": 7316} {"train_loss": -27.9822940826416, "global_step": 607259, "epoch": 7316} {"train_loss": -27.900182723999023, "global_step": 607260, "epoch": 7316} {"train_loss": -28.370832443237305, "global_step": 607261, "epoch": 7316} {"train_loss": -28.075342178344727, "global_step": 607262, "epoch": 7316} {"train_loss": -28.237150192260742, "global_step": 607263, "epoch": 7316} {"train_loss": -28.108179092407227, "global_step": 607264, "epoch": 7316} {"train_loss": -27.892520904541016, "global_step": 607265, "epoch": 7316} {"train_loss": -27.82538414001465, "global_step": 607266, "epoch": 7316} {"train_loss": -28.32464599609375, "global_step": 607267, "epoch": 7316} {"train_loss": -27.97226905822754, "global_step": 607268, "epoch": 7316} {"train_loss": -28.310672760009766, "global_step": 607269, "epoch": 7316} {"train_loss": -28.438312530517578, "global_step": 607270, "epoch": 7316} {"train_loss": -28.359256744384766, "global_step": 607271, "epoch": 7316} {"train_loss": -27.974140167236328, "global_step": 607272, "epoch": 7316} {"train_loss": -28.367328643798828, "global_step": 607273, "epoch": 7316} {"train_loss": -28.375707626342773, "global_step": 607274, "epoch": 7316} {"train_loss": -27.841964721679688, "global_step": 607275, "epoch": 7316} {"train_loss": -28.341455459594727, "global_step": 607276, "epoch": 7316} {"train_loss": -28.401641845703125, "global_step": 607277, "epoch": 7316} {"train_loss": -28.14771842956543, "global_step": 607278, "epoch": 7316} {"train_loss": -27.959732055664062, "global_step": 607279, "epoch": 7316} {"train_loss": -28.375329971313477, "global_step": 607280, "epoch": 7316} {"train_loss": -28.219106674194336, "global_step": 607281, "epoch": 7316} {"train_loss": -28.011133193969727, "global_step": 607282, "epoch": 7316} {"train_loss": -28.070215225219727, "global_step": 607283, "epoch": 7316} {"train_loss": -27.990991592407227, "global_step": 607284, "epoch": 7316} {"train_loss": -27.73944664001465, "global_step": 607285, "epoch": 7316} {"train_loss": -27.91546058654785, "global_step": 607286, "epoch": 7316} {"train_loss": -27.549585342407227, "global_step": 607287, "epoch": 7316} {"train_loss": -27.5400390625, "global_step": 607288, "epoch": 7316} {"train_loss": -27.108251571655273, "global_step": 607289, "epoch": 7316} {"train_loss": -27.51368522644043, "global_step": 607290, "epoch": 7316} {"train_loss": -28.069000244140625, "global_step": 607291, "epoch": 7316} {"train_loss": -28.215927124023438, "global_step": 607292, "epoch": 7316} {"train_loss": -28.016889572143555, "global_step": 607293, "epoch": 7316} {"train_loss": -28.352920532226562, "global_step": 607294, "epoch": 7316} {"train_loss": -27.721899032592773, "global_step": 607295, "epoch": 7316} {"train_loss": -28.302885055541992, "global_step": 607296, "epoch": 7316} {"train_loss": -28.08003807067871, "global_step": 607297, "epoch": 7316} {"train_loss": -27.882925033569336, "global_step": 607298, "epoch": 7316} {"train_loss": -28.240970611572266, "global_step": 607299, "epoch": 7316} {"train_loss": -28.04096794128418, "global_step": 607300, "epoch": 7316} {"train_loss": -28.08953285217285, "global_step": 607301, "epoch": 7316} {"train_loss": -27.588241577148438, "global_step": 607302, "epoch": 7316} {"train_loss": -28.192224502563477, "global_step": 607303, "epoch": 7316} {"train_loss": -27.926620483398438, "global_step": 607304, "epoch": 7316} {"train_loss": -27.905563354492188, "global_step": 607305, "epoch": 7316} {"train_loss": -28.16590690612793, "global_step": 607306, "epoch": 7316} {"train_loss": -28.34078025817871, "global_step": 607307, "epoch": 7316} {"train_loss": -27.934295654296875, "global_step": 607308, "epoch": 7316} {"train_loss": -28.02017593383789, "global_step": 607309, "epoch": 7316} {"train_loss": -27.827118540384685, "global_step": 607310, "epoch": 7316, "val_loss": 6610187.0} {"train_loss": -27.835615158081055, "global_step": 607311, "epoch": 7317} {"train_loss": -27.621994018554688, "global_step": 607312, "epoch": 7317} {"train_loss": -26.806659698486328, "global_step": 607313, "epoch": 7317} {"train_loss": -26.2133731842041, "global_step": 607314, "epoch": 7317} {"train_loss": -26.215503692626953, "global_step": 607315, "epoch": 7317} {"train_loss": -26.898344039916992, "global_step": 607316, "epoch": 7317} {"train_loss": -27.415613174438477, "global_step": 607317, "epoch": 7317} {"train_loss": -27.53486442565918, "global_step": 607318, "epoch": 7317} {"train_loss": -27.583112716674805, "global_step": 607319, "epoch": 7317} {"train_loss": -27.679426193237305, "global_step": 607320, "epoch": 7317} {"train_loss": -27.96571159362793, "global_step": 607321, "epoch": 7317} {"train_loss": -27.571996688842773, "global_step": 607322, "epoch": 7317} {"train_loss": -27.925939559936523, "global_step": 607323, "epoch": 7317} {"train_loss": -28.123212814331055, "global_step": 607324, "epoch": 7317} {"train_loss": -27.988391876220703, "global_step": 607325, "epoch": 7317} {"train_loss": -28.190027236938477, "global_step": 607326, "epoch": 7317} {"train_loss": -27.8428955078125, "global_step": 607327, "epoch": 7317} {"train_loss": -28.044391632080078, "global_step": 607328, "epoch": 7317} {"train_loss": -27.978872299194336, "global_step": 607329, "epoch": 7317} {"train_loss": -28.0266170501709, "global_step": 607330, "epoch": 7317} {"train_loss": -27.84589195251465, "global_step": 607331, "epoch": 7317} {"train_loss": -27.944318771362305, "global_step": 607332, "epoch": 7317} {"train_loss": -27.99983787536621, "global_step": 607333, "epoch": 7317} {"train_loss": -28.14886474609375, "global_step": 607334, "epoch": 7317} {"train_loss": -27.977685928344727, "global_step": 607335, "epoch": 7317} {"train_loss": -28.036518096923828, "global_step": 607336, "epoch": 7317} {"train_loss": -28.127099990844727, "global_step": 607337, "epoch": 7317} {"train_loss": -28.059240341186523, "global_step": 607338, "epoch": 7317} {"train_loss": -28.45468521118164, "global_step": 607339, "epoch": 7317} {"train_loss": -28.178979873657227, "global_step": 607340, "epoch": 7317} {"train_loss": -28.0195369720459, "global_step": 607341, "epoch": 7317} {"train_loss": -28.494958877563477, "global_step": 607342, "epoch": 7317} {"train_loss": -27.976591110229492, "global_step": 607343, "epoch": 7317} {"train_loss": -28.34065055847168, "global_step": 607344, "epoch": 7317} {"train_loss": -27.598485946655273, "global_step": 607345, "epoch": 7317} {"train_loss": -28.248838424682617, "global_step": 607346, "epoch": 7317} {"train_loss": -27.818973541259766, "global_step": 607347, "epoch": 7317} {"train_loss": -27.88886833190918, "global_step": 607348, "epoch": 7317} {"train_loss": -28.231916427612305, "global_step": 607349, "epoch": 7317} {"train_loss": -28.271467208862305, "global_step": 607350, "epoch": 7317} {"train_loss": -28.399158477783203, "global_step": 607351, "epoch": 7317} {"train_loss": -27.931751251220703, "global_step": 607352, "epoch": 7317} {"train_loss": -28.226362228393555, "global_step": 607353, "epoch": 7317} {"train_loss": -28.402597427368164, "global_step": 607354, "epoch": 7317} {"train_loss": -28.197803497314453, "global_step": 607355, "epoch": 7317} {"train_loss": -28.0690860748291, "global_step": 607356, "epoch": 7317} {"train_loss": -27.749927520751953, "global_step": 607357, "epoch": 7317} {"train_loss": -27.868558883666992, "global_step": 607358, "epoch": 7317} {"train_loss": -28.10957908630371, "global_step": 607359, "epoch": 7317} {"train_loss": -27.804718017578125, "global_step": 607360, "epoch": 7317} {"train_loss": -27.959217071533203, "global_step": 607361, "epoch": 7317} {"train_loss": -28.22941017150879, "global_step": 607362, "epoch": 7317} {"train_loss": -28.10736656188965, "global_step": 607363, "epoch": 7317} {"train_loss": -28.153417587280273, "global_step": 607364, "epoch": 7317} {"train_loss": -28.263580322265625, "global_step": 607365, "epoch": 7317} {"train_loss": -28.405664443969727, "global_step": 607366, "epoch": 7317} {"train_loss": -28.0882568359375, "global_step": 607367, "epoch": 7317} {"train_loss": -28.046003341674805, "global_step": 607368, "epoch": 7317} {"train_loss": -28.16766357421875, "global_step": 607369, "epoch": 7317} {"train_loss": -27.7193603515625, "global_step": 607370, "epoch": 7317} {"train_loss": -27.926671981811523, "global_step": 607371, "epoch": 7317} {"train_loss": -27.160139083862305, "global_step": 607372, "epoch": 7317} {"train_loss": -27.422657012939453, "global_step": 607373, "epoch": 7317} {"train_loss": -27.7172794342041, "global_step": 607374, "epoch": 7317} {"train_loss": -28.234846115112305, "global_step": 607375, "epoch": 7317} {"train_loss": -27.656543731689453, "global_step": 607376, "epoch": 7317} {"train_loss": -28.430654525756836, "global_step": 607377, "epoch": 7317} {"train_loss": -27.80402946472168, "global_step": 607378, "epoch": 7317} {"train_loss": -27.50589942932129, "global_step": 607379, "epoch": 7317} {"train_loss": -27.528095245361328, "global_step": 607380, "epoch": 7317} {"train_loss": -28.100622177124023, "global_step": 607381, "epoch": 7317} {"train_loss": -27.820526123046875, "global_step": 607382, "epoch": 7317} {"train_loss": -28.256383895874023, "global_step": 607383, "epoch": 7317} {"train_loss": -27.973188400268555, "global_step": 607384, "epoch": 7317} {"train_loss": -27.711782455444336, "global_step": 607385, "epoch": 7317} {"train_loss": -27.909133911132812, "global_step": 607386, "epoch": 7317} {"train_loss": -27.83037757873535, "global_step": 607387, "epoch": 7317} {"train_loss": -27.7684383392334, "global_step": 607388, "epoch": 7317} {"train_loss": -27.928665161132812, "global_step": 607389, "epoch": 7317} {"train_loss": -28.16683006286621, "global_step": 607390, "epoch": 7317} {"train_loss": -27.810611724853516, "global_step": 607391, "epoch": 7317} {"train_loss": -27.930084228515625, "global_step": 607392, "epoch": 7317} {"train_loss": -27.897217394357703, "global_step": 607393, "epoch": 7317, "val_loss": 6641412.0} {"train_loss": -27.392255783081055, "global_step": 607394, "epoch": 7318} {"train_loss": -27.301605224609375, "global_step": 607395, "epoch": 7318} {"train_loss": -27.201322555541992, "global_step": 607396, "epoch": 7318} {"train_loss": -26.992090225219727, "global_step": 607397, "epoch": 7318} {"train_loss": -27.759153366088867, "global_step": 607398, "epoch": 7318} {"train_loss": -27.1517276763916, "global_step": 607399, "epoch": 7318} {"train_loss": -27.4550724029541, "global_step": 607400, "epoch": 7318} {"train_loss": -27.479385375976562, "global_step": 607401, "epoch": 7318} {"train_loss": -27.206588745117188, "global_step": 607402, "epoch": 7318} {"train_loss": -27.533660888671875, "global_step": 607403, "epoch": 7318} {"train_loss": -27.898962020874023, "global_step": 607404, "epoch": 7318} {"train_loss": -27.88740348815918, "global_step": 607405, "epoch": 7318} {"train_loss": -27.79424476623535, "global_step": 607406, "epoch": 7318} {"train_loss": -27.228971481323242, "global_step": 607407, "epoch": 7318} {"train_loss": -27.926654815673828, "global_step": 607408, "epoch": 7318} {"train_loss": -27.983972549438477, "global_step": 607409, "epoch": 7318} {"train_loss": -27.71296501159668, "global_step": 607410, "epoch": 7318} {"train_loss": -27.6874942779541, "global_step": 607411, "epoch": 7318} {"train_loss": -28.037525177001953, "global_step": 607412, "epoch": 7318} {"train_loss": -28.25677490234375, "global_step": 607413, "epoch": 7318} {"train_loss": -28.0305118560791, "global_step": 607414, "epoch": 7318} {"train_loss": -28.061254501342773, "global_step": 607415, "epoch": 7318} {"train_loss": -27.614988327026367, "global_step": 607416, "epoch": 7318} {"train_loss": -27.933923721313477, "global_step": 607417, "epoch": 7318} {"train_loss": -28.1024112701416, "global_step": 607418, "epoch": 7318} {"train_loss": -28.315744400024414, "global_step": 607419, "epoch": 7318} {"train_loss": -28.330671310424805, "global_step": 607420, "epoch": 7318} {"train_loss": -28.257837295532227, "global_step": 607421, "epoch": 7318} {"train_loss": -27.91949462890625, "global_step": 607422, "epoch": 7318} {"train_loss": -28.125141143798828, "global_step": 607423, "epoch": 7318} {"train_loss": -28.11529541015625, "global_step": 607424, "epoch": 7318} {"train_loss": -28.2988338470459, "global_step": 607425, "epoch": 7318} {"train_loss": -28.25832176208496, "global_step": 607426, "epoch": 7318} {"train_loss": -27.878311157226562, "global_step": 607427, "epoch": 7318} {"train_loss": -28.069425582885742, "global_step": 607428, "epoch": 7318} {"train_loss": -27.754535675048828, "global_step": 607429, "epoch": 7318} {"train_loss": -28.722257614135742, "global_step": 607430, "epoch": 7318} {"train_loss": -27.92034339904785, "global_step": 607431, "epoch": 7318} {"train_loss": -28.162647247314453, "global_step": 607432, "epoch": 7318} {"train_loss": -28.056318283081055, "global_step": 607433, "epoch": 7318} {"train_loss": -28.368764877319336, "global_step": 607434, "epoch": 7318} {"train_loss": -28.485427856445312, "global_step": 607435, "epoch": 7318} {"train_loss": -28.202375411987305, "global_step": 607436, "epoch": 7318} {"train_loss": -27.931293487548828, "global_step": 607437, "epoch": 7318} {"train_loss": -28.26673698425293, "global_step": 607438, "epoch": 7318} {"train_loss": -27.773975372314453, "global_step": 607439, "epoch": 7318} {"train_loss": -28.402359008789062, "global_step": 607440, "epoch": 7318} {"train_loss": -28.22718620300293, "global_step": 607441, "epoch": 7318} {"train_loss": -28.165878295898438, "global_step": 607442, "epoch": 7318} {"train_loss": -28.466089248657227, "global_step": 607443, "epoch": 7318} {"train_loss": -28.16487693786621, "global_step": 607444, "epoch": 7318} {"train_loss": -28.284902572631836, "global_step": 607445, "epoch": 7318} {"train_loss": -28.1276798248291, "global_step": 607446, "epoch": 7318} {"train_loss": -27.709012985229492, "global_step": 607447, "epoch": 7318} {"train_loss": -27.47101402282715, "global_step": 607448, "epoch": 7318} {"train_loss": -27.31361198425293, "global_step": 607449, "epoch": 7318} {"train_loss": -27.012693405151367, "global_step": 607450, "epoch": 7318} {"train_loss": -25.990217208862305, "global_step": 607451, "epoch": 7318} {"train_loss": -25.5633544921875, "global_step": 607452, "epoch": 7318} {"train_loss": -25.98357582092285, "global_step": 607453, "epoch": 7318} {"train_loss": -27.200305938720703, "global_step": 607454, "epoch": 7318} {"train_loss": -27.308683395385742, "global_step": 607455, "epoch": 7318} {"train_loss": -26.637556076049805, "global_step": 607456, "epoch": 7318} {"train_loss": -27.560562133789062, "global_step": 607457, "epoch": 7318} {"train_loss": -27.316736221313477, "global_step": 607458, "epoch": 7318} {"train_loss": -27.023944854736328, "global_step": 607459, "epoch": 7318} {"train_loss": -27.515710830688477, "global_step": 607460, "epoch": 7318} {"train_loss": -27.117084503173828, "global_step": 607461, "epoch": 7318} {"train_loss": -27.21002197265625, "global_step": 607462, "epoch": 7318} {"train_loss": -27.503482818603516, "global_step": 607463, "epoch": 7318} {"train_loss": -27.0390625, "global_step": 607464, "epoch": 7318} {"train_loss": -27.26112174987793, "global_step": 607465, "epoch": 7318} {"train_loss": -27.653522491455078, "global_step": 607466, "epoch": 7318} {"train_loss": -27.1206111907959, "global_step": 607467, "epoch": 7318} {"train_loss": -27.971160888671875, "global_step": 607468, "epoch": 7318} {"train_loss": -27.32777976989746, "global_step": 607469, "epoch": 7318} {"train_loss": -27.761962890625, "global_step": 607470, "epoch": 7318} {"train_loss": -27.607162475585938, "global_step": 607471, "epoch": 7318} {"train_loss": -27.64161491394043, "global_step": 607472, "epoch": 7318} {"train_loss": -27.73784828186035, "global_step": 607473, "epoch": 7318} {"train_loss": -28.01936912536621, "global_step": 607474, "epoch": 7318} {"train_loss": -27.636133193969727, "global_step": 607475, "epoch": 7318} {"train_loss": -27.678184578217657, "global_step": 607476, "epoch": 7318, "val_loss": 6544073.0} {"train_loss": -27.300710678100586, "global_step": 607477, "epoch": 7319} {"train_loss": -27.360248565673828, "global_step": 607478, "epoch": 7319} {"train_loss": -27.174535751342773, "global_step": 607479, "epoch": 7319} {"train_loss": -27.302831649780273, "global_step": 607480, "epoch": 7319} {"train_loss": -27.487506866455078, "global_step": 607481, "epoch": 7319} {"train_loss": -27.29866600036621, "global_step": 607482, "epoch": 7319} {"train_loss": -27.451587677001953, "global_step": 607483, "epoch": 7319} {"train_loss": -27.5153865814209, "global_step": 607484, "epoch": 7319} {"train_loss": -27.525232315063477, "global_step": 607485, "epoch": 7319} {"train_loss": -27.89283561706543, "global_step": 607486, "epoch": 7319} {"train_loss": -27.67258644104004, "global_step": 607487, "epoch": 7319} {"train_loss": -27.77583885192871, "global_step": 607488, "epoch": 7319} {"train_loss": -27.724002838134766, "global_step": 607489, "epoch": 7319} {"train_loss": -27.628931045532227, "global_step": 607490, "epoch": 7319} {"train_loss": -27.771772384643555, "global_step": 607491, "epoch": 7319} {"train_loss": -27.929492950439453, "global_step": 607492, "epoch": 7319} {"train_loss": -27.519107818603516, "global_step": 607493, "epoch": 7319} {"train_loss": -27.87800407409668, "global_step": 607494, "epoch": 7319} {"train_loss": -27.906055450439453, "global_step": 607495, "epoch": 7319} {"train_loss": -28.074514389038086, "global_step": 607496, "epoch": 7319} {"train_loss": -27.743906021118164, "global_step": 607497, "epoch": 7319} {"train_loss": -28.0788516998291, "global_step": 607498, "epoch": 7319} {"train_loss": -28.309741973876953, "global_step": 607499, "epoch": 7319} {"train_loss": -28.03948402404785, "global_step": 607500, "epoch": 7319} {"train_loss": -28.193771362304688, "global_step": 607501, "epoch": 7319} {"train_loss": -28.007080078125, "global_step": 607502, "epoch": 7319} {"train_loss": -28.248376846313477, "global_step": 607503, "epoch": 7319} {"train_loss": -28.074462890625, "global_step": 607504, "epoch": 7319} {"train_loss": -28.225605010986328, "global_step": 607505, "epoch": 7319} {"train_loss": -27.943710327148438, "global_step": 607506, "epoch": 7319} {"train_loss": -27.86777114868164, "global_step": 607507, "epoch": 7319} {"train_loss": -28.135976791381836, "global_step": 607508, "epoch": 7319} {"train_loss": -28.323047637939453, "global_step": 607509, "epoch": 7319} {"train_loss": -28.012866973876953, "global_step": 607510, "epoch": 7319} {"train_loss": -28.192066192626953, "global_step": 607511, "epoch": 7319} {"train_loss": -28.171009063720703, "global_step": 607512, "epoch": 7319} {"train_loss": -28.46453857421875, "global_step": 607513, "epoch": 7319} {"train_loss": -28.1586856842041, "global_step": 607514, "epoch": 7319} {"train_loss": -28.215957641601562, "global_step": 607515, "epoch": 7319} {"train_loss": -27.74370765686035, "global_step": 607516, "epoch": 7319} {"train_loss": -28.044626235961914, "global_step": 607517, "epoch": 7319} {"train_loss": -27.742462158203125, "global_step": 607518, "epoch": 7319} {"train_loss": -27.785486221313477, "global_step": 607519, "epoch": 7319} {"train_loss": -28.083667755126953, "global_step": 607520, "epoch": 7319} {"train_loss": -28.036542892456055, "global_step": 607521, "epoch": 7319} {"train_loss": -27.98211669921875, "global_step": 607522, "epoch": 7319} {"train_loss": -28.35696792602539, "global_step": 607523, "epoch": 7319} {"train_loss": -28.141393661499023, "global_step": 607524, "epoch": 7319} {"train_loss": -27.880054473876953, "global_step": 607525, "epoch": 7319} {"train_loss": -28.197071075439453, "global_step": 607526, "epoch": 7319} {"train_loss": -28.35786247253418, "global_step": 607527, "epoch": 7319} {"train_loss": -28.405231475830078, "global_step": 607528, "epoch": 7319} {"train_loss": -28.277231216430664, "global_step": 607529, "epoch": 7319} {"train_loss": -28.452482223510742, "global_step": 607530, "epoch": 7319} {"train_loss": -28.340116500854492, "global_step": 607531, "epoch": 7319} {"train_loss": -28.082441329956055, "global_step": 607532, "epoch": 7319} {"train_loss": -28.348703384399414, "global_step": 607533, "epoch": 7319} {"train_loss": -28.240386962890625, "global_step": 607534, "epoch": 7319} {"train_loss": -28.572912216186523, "global_step": 607535, "epoch": 7319} {"train_loss": -28.183013916015625, "global_step": 607536, "epoch": 7319} {"train_loss": -28.3675594329834, "global_step": 607537, "epoch": 7319} {"train_loss": -28.40030860900879, "global_step": 607538, "epoch": 7319} {"train_loss": -28.508447647094727, "global_step": 607539, "epoch": 7319} {"train_loss": -28.15353775024414, "global_step": 607540, "epoch": 7319} {"train_loss": -28.635488510131836, "global_step": 607541, "epoch": 7319} {"train_loss": -28.527944564819336, "global_step": 607542, "epoch": 7319} {"train_loss": -28.2288875579834, "global_step": 607543, "epoch": 7319} {"train_loss": -27.775449752807617, "global_step": 607544, "epoch": 7319} {"train_loss": -27.88630485534668, "global_step": 607545, "epoch": 7319} {"train_loss": -28.468158721923828, "global_step": 607546, "epoch": 7319} {"train_loss": -28.030115127563477, "global_step": 607547, "epoch": 7319} {"train_loss": -27.854217529296875, "global_step": 607548, "epoch": 7319} {"train_loss": -27.979236602783203, "global_step": 607549, "epoch": 7319} {"train_loss": -28.209152221679688, "global_step": 607550, "epoch": 7319} {"train_loss": -28.227243423461914, "global_step": 607551, "epoch": 7319} {"train_loss": -27.651227951049805, "global_step": 607552, "epoch": 7319} {"train_loss": -28.149845123291016, "global_step": 607553, "epoch": 7319} {"train_loss": -28.0076847076416, "global_step": 607554, "epoch": 7319} {"train_loss": -28.10009765625, "global_step": 607555, "epoch": 7319} {"train_loss": -27.7984561920166, "global_step": 607556, "epoch": 7319} {"train_loss": -27.86443519592285, "global_step": 607557, "epoch": 7319} {"train_loss": -28.163965225219727, "global_step": 607558, "epoch": 7319} {"train_loss": -28.022061910973974, "global_step": 607559, "epoch": 7319, "val_loss": 6634427.0} {"train_loss": -27.447919845581055, "global_step": 607560, "epoch": 7320} {"train_loss": -27.183917999267578, "global_step": 607561, "epoch": 7320} {"train_loss": -27.413288116455078, "global_step": 607562, "epoch": 7320} {"train_loss": -27.458282470703125, "global_step": 607563, "epoch": 7320} {"train_loss": -26.494384765625, "global_step": 607564, "epoch": 7320} {"train_loss": -27.71563720703125, "global_step": 607565, "epoch": 7320} {"train_loss": -27.790937423706055, "global_step": 607566, "epoch": 7320} {"train_loss": -27.101972579956055, "global_step": 607567, "epoch": 7320} {"train_loss": -27.414722442626953, "global_step": 607568, "epoch": 7320} {"train_loss": -27.93952751159668, "global_step": 607569, "epoch": 7320} {"train_loss": -27.720844268798828, "global_step": 607570, "epoch": 7320} {"train_loss": -27.782957077026367, "global_step": 607571, "epoch": 7320} {"train_loss": -27.406482696533203, "global_step": 607572, "epoch": 7320} {"train_loss": -27.709985733032227, "global_step": 607573, "epoch": 7320} {"train_loss": -27.621337890625, "global_step": 607574, "epoch": 7320} {"train_loss": -27.710865020751953, "global_step": 607575, "epoch": 7320} {"train_loss": -27.5361270904541, "global_step": 607576, "epoch": 7320} {"train_loss": -28.02887535095215, "global_step": 607577, "epoch": 7320} {"train_loss": -27.960098266601562, "global_step": 607578, "epoch": 7320} {"train_loss": -27.9439697265625, "global_step": 607579, "epoch": 7320} {"train_loss": -27.75310707092285, "global_step": 607580, "epoch": 7320} {"train_loss": -27.63400650024414, "global_step": 607581, "epoch": 7320} {"train_loss": -27.874547958374023, "global_step": 607582, "epoch": 7320} {"train_loss": -28.0988712310791, "global_step": 607583, "epoch": 7320} {"train_loss": -27.873788833618164, "global_step": 607584, "epoch": 7320} {"train_loss": -27.9227294921875, "global_step": 607585, "epoch": 7320} {"train_loss": -27.980798721313477, "global_step": 607586, "epoch": 7320} {"train_loss": -27.915678024291992, "global_step": 607587, "epoch": 7320} {"train_loss": -28.132471084594727, "global_step": 607588, "epoch": 7320} {"train_loss": -27.832015991210938, "global_step": 607589, "epoch": 7320} {"train_loss": -28.147321701049805, "global_step": 607590, "epoch": 7320} {"train_loss": -27.90576171875, "global_step": 607591, "epoch": 7320} {"train_loss": -27.826337814331055, "global_step": 607592, "epoch": 7320} {"train_loss": -28.50244140625, "global_step": 607593, "epoch": 7320} {"train_loss": -28.110376358032227, "global_step": 607594, "epoch": 7320} {"train_loss": -28.479766845703125, "global_step": 607595, "epoch": 7320} {"train_loss": -28.391469955444336, "global_step": 607596, "epoch": 7320} {"train_loss": -28.160367965698242, "global_step": 607597, "epoch": 7320} {"train_loss": -27.87127113342285, "global_step": 607598, "epoch": 7320} {"train_loss": -28.024215698242188, "global_step": 607599, "epoch": 7320} {"train_loss": -28.485580444335938, "global_step": 607600, "epoch": 7320} {"train_loss": -28.134693145751953, "global_step": 607601, "epoch": 7320} {"train_loss": -28.309906005859375, "global_step": 607602, "epoch": 7320} {"train_loss": -28.173877716064453, "global_step": 607603, "epoch": 7320} {"train_loss": -28.418731689453125, "global_step": 607604, "epoch": 7320} {"train_loss": -28.52201271057129, "global_step": 607605, "epoch": 7320} {"train_loss": -28.20843505859375, "global_step": 607606, "epoch": 7320} {"train_loss": -28.31625747680664, "global_step": 607607, "epoch": 7320} {"train_loss": -28.321176528930664, "global_step": 607608, "epoch": 7320} {"train_loss": -28.313989639282227, "global_step": 607609, "epoch": 7320} {"train_loss": -28.700546264648438, "global_step": 607610, "epoch": 7320} {"train_loss": -27.701038360595703, "global_step": 607611, "epoch": 7320} {"train_loss": -28.44001579284668, "global_step": 607612, "epoch": 7320} {"train_loss": -28.331130981445312, "global_step": 607613, "epoch": 7320} {"train_loss": -27.922027587890625, "global_step": 607614, "epoch": 7320} {"train_loss": -27.593433380126953, "global_step": 607615, "epoch": 7320} {"train_loss": -27.185163497924805, "global_step": 607616, "epoch": 7320} {"train_loss": -26.730789184570312, "global_step": 607617, "epoch": 7320} {"train_loss": -27.268646240234375, "global_step": 607618, "epoch": 7320} {"train_loss": -28.347421646118164, "global_step": 607619, "epoch": 7320} {"train_loss": -27.741422653198242, "global_step": 607620, "epoch": 7320} {"train_loss": -27.762258529663086, "global_step": 607621, "epoch": 7320} {"train_loss": -28.21393394470215, "global_step": 607622, "epoch": 7320} {"train_loss": -27.99835205078125, "global_step": 607623, "epoch": 7320} {"train_loss": -27.862707138061523, "global_step": 607624, "epoch": 7320} {"train_loss": -27.702680587768555, "global_step": 607625, "epoch": 7320} {"train_loss": -28.216644287109375, "global_step": 607626, "epoch": 7320} {"train_loss": -28.1778564453125, "global_step": 607627, "epoch": 7320} {"train_loss": -28.14691734313965, "global_step": 607628, "epoch": 7320} {"train_loss": -28.349781036376953, "global_step": 607629, "epoch": 7320} {"train_loss": -28.326618194580078, "global_step": 607630, "epoch": 7320} {"train_loss": -28.33835792541504, "global_step": 607631, "epoch": 7320} {"train_loss": -27.988615036010742, "global_step": 607632, "epoch": 7320} {"train_loss": -28.166126251220703, "global_step": 607633, "epoch": 7320} {"train_loss": -28.392202377319336, "global_step": 607634, "epoch": 7320} {"train_loss": -28.26569938659668, "global_step": 607635, "epoch": 7320} {"train_loss": -28.08241844177246, "global_step": 607636, "epoch": 7320} {"train_loss": -27.692808151245117, "global_step": 607637, "epoch": 7320} {"train_loss": -28.171110153198242, "global_step": 607638, "epoch": 7320} {"train_loss": -27.463232040405273, "global_step": 607639, "epoch": 7320} {"train_loss": -28.210275650024414, "global_step": 607640, "epoch": 7320} {"train_loss": -28.328704833984375, "global_step": 607641, "epoch": 7320} {"train_loss": -27.925703163606574, "global_step": 607642, "epoch": 7320, "val_loss": 6651965.5} {"train_loss": -28.09186363220215, "global_step": 607643, "epoch": 7321} {"train_loss": -28.129926681518555, "global_step": 607644, "epoch": 7321} {"train_loss": -27.70448875427246, "global_step": 607645, "epoch": 7321} {"train_loss": -27.731412887573242, "global_step": 607646, "epoch": 7321} {"train_loss": -27.427480697631836, "global_step": 607647, "epoch": 7321} {"train_loss": -27.634119033813477, "global_step": 607648, "epoch": 7321} {"train_loss": -27.751911163330078, "global_step": 607649, "epoch": 7321} {"train_loss": -27.615707397460938, "global_step": 607650, "epoch": 7321} {"train_loss": -27.650089263916016, "global_step": 607651, "epoch": 7321} {"train_loss": -27.68276023864746, "global_step": 607652, "epoch": 7321} {"train_loss": -27.8312931060791, "global_step": 607653, "epoch": 7321} {"train_loss": -27.946157455444336, "global_step": 607654, "epoch": 7321} {"train_loss": -27.669946670532227, "global_step": 607655, "epoch": 7321} {"train_loss": -27.507368087768555, "global_step": 607656, "epoch": 7321} {"train_loss": -27.929920196533203, "global_step": 607657, "epoch": 7321} {"train_loss": -27.670013427734375, "global_step": 607658, "epoch": 7321} {"train_loss": -27.59638786315918, "global_step": 607659, "epoch": 7321} {"train_loss": -28.255966186523438, "global_step": 607660, "epoch": 7321} {"train_loss": -27.8221492767334, "global_step": 607661, "epoch": 7321} {"train_loss": -28.140356063842773, "global_step": 607662, "epoch": 7321} {"train_loss": -28.172449111938477, "global_step": 607663, "epoch": 7321} {"train_loss": -28.17023277282715, "global_step": 607664, "epoch": 7321} {"train_loss": -28.039779663085938, "global_step": 607665, "epoch": 7321} {"train_loss": -27.988134384155273, "global_step": 607666, "epoch": 7321} {"train_loss": -28.21240234375, "global_step": 607667, "epoch": 7321} {"train_loss": -28.203222274780273, "global_step": 607668, "epoch": 7321} {"train_loss": -27.939289093017578, "global_step": 607669, "epoch": 7321} {"train_loss": -28.089237213134766, "global_step": 607670, "epoch": 7321} {"train_loss": -28.351667404174805, "global_step": 607671, "epoch": 7321} {"train_loss": -28.007715225219727, "global_step": 607672, "epoch": 7321} {"train_loss": -27.855743408203125, "global_step": 607673, "epoch": 7321} {"train_loss": -28.20098876953125, "global_step": 607674, "epoch": 7321} {"train_loss": -28.0098819732666, "global_step": 607675, "epoch": 7321} {"train_loss": -27.93171501159668, "global_step": 607676, "epoch": 7321} {"train_loss": -27.9436092376709, "global_step": 607677, "epoch": 7321} {"train_loss": -28.433813095092773, "global_step": 607678, "epoch": 7321} {"train_loss": -28.2794246673584, "global_step": 607679, "epoch": 7321} {"train_loss": -28.087493896484375, "global_step": 607680, "epoch": 7321} {"train_loss": -27.92487144470215, "global_step": 607681, "epoch": 7321} {"train_loss": -28.25636100769043, "global_step": 607682, "epoch": 7321} {"train_loss": -27.581430435180664, "global_step": 607683, "epoch": 7321} {"train_loss": -28.551538467407227, "global_step": 607684, "epoch": 7321} {"train_loss": -27.981679916381836, "global_step": 607685, "epoch": 7321} {"train_loss": -27.855316162109375, "global_step": 607686, "epoch": 7321} {"train_loss": -28.243515014648438, "global_step": 607687, "epoch": 7321} {"train_loss": -28.251813888549805, "global_step": 607688, "epoch": 7321} {"train_loss": -27.84234046936035, "global_step": 607689, "epoch": 7321} {"train_loss": -28.340795516967773, "global_step": 607690, "epoch": 7321} {"train_loss": -27.9298152923584, "global_step": 607691, "epoch": 7321} {"train_loss": -28.365528106689453, "global_step": 607692, "epoch": 7321} {"train_loss": -28.199848175048828, "global_step": 607693, "epoch": 7321} {"train_loss": -28.319355010986328, "global_step": 607694, "epoch": 7321} {"train_loss": -27.786212921142578, "global_step": 607695, "epoch": 7321} {"train_loss": -28.19329833984375, "global_step": 607696, "epoch": 7321} {"train_loss": -28.311203002929688, "global_step": 607697, "epoch": 7321} {"train_loss": -28.376117706298828, "global_step": 607698, "epoch": 7321} {"train_loss": -28.10834312438965, "global_step": 607699, "epoch": 7321} {"train_loss": -28.2645206451416, "global_step": 607700, "epoch": 7321} {"train_loss": -27.841094970703125, "global_step": 607701, "epoch": 7321} {"train_loss": -28.242340087890625, "global_step": 607702, "epoch": 7321} {"train_loss": -28.51068687438965, "global_step": 607703, "epoch": 7321} {"train_loss": -27.916397094726562, "global_step": 607704, "epoch": 7321} {"train_loss": -28.534992218017578, "global_step": 607705, "epoch": 7321} {"train_loss": -28.71584129333496, "global_step": 607706, "epoch": 7321} {"train_loss": -28.129077911376953, "global_step": 607707, "epoch": 7321} {"train_loss": -28.29310417175293, "global_step": 607708, "epoch": 7321} {"train_loss": -28.452075958251953, "global_step": 607709, "epoch": 7321} {"train_loss": -27.9664306640625, "global_step": 607710, "epoch": 7321} {"train_loss": -27.996408462524414, "global_step": 607711, "epoch": 7321} {"train_loss": -28.156784057617188, "global_step": 607712, "epoch": 7321} {"train_loss": -28.058368682861328, "global_step": 607713, "epoch": 7321} {"train_loss": -27.60214614868164, "global_step": 607714, "epoch": 7321} {"train_loss": -28.1646785736084, "global_step": 607715, "epoch": 7321} {"train_loss": -27.8282470703125, "global_step": 607716, "epoch": 7321} {"train_loss": -27.688974380493164, "global_step": 607717, "epoch": 7321} {"train_loss": -27.734460830688477, "global_step": 607718, "epoch": 7321} {"train_loss": -28.069547653198242, "global_step": 607719, "epoch": 7321} {"train_loss": -28.36530876159668, "global_step": 607720, "epoch": 7321} {"train_loss": -28.040637969970703, "global_step": 607721, "epoch": 7321} {"train_loss": -28.313369750976562, "global_step": 607722, "epoch": 7321} {"train_loss": -27.7938232421875, "global_step": 607723, "epoch": 7321} {"train_loss": -27.78413200378418, "global_step": 607724, "epoch": 7321} {"train_loss": -28.033296631043214, "global_step": 607725, "epoch": 7321, "val_loss": 6644980.0} {"train_loss": -27.29157066345215, "global_step": 607726, "epoch": 7322} {"train_loss": -26.1294002532959, "global_step": 607727, "epoch": 7322} {"train_loss": -24.387311935424805, "global_step": 607728, "epoch": 7322} {"train_loss": -25.643335342407227, "global_step": 607729, "epoch": 7322} {"train_loss": -26.713397979736328, "global_step": 607730, "epoch": 7322} {"train_loss": -27.133548736572266, "global_step": 607731, "epoch": 7322} {"train_loss": -26.80914878845215, "global_step": 607732, "epoch": 7322} {"train_loss": -26.963598251342773, "global_step": 607733, "epoch": 7322} {"train_loss": -27.088897705078125, "global_step": 607734, "epoch": 7322} {"train_loss": -26.8585262298584, "global_step": 607735, "epoch": 7322} {"train_loss": -27.5246524810791, "global_step": 607736, "epoch": 7322} {"train_loss": -26.7370548248291, "global_step": 607737, "epoch": 7322} {"train_loss": -26.90143394470215, "global_step": 607738, "epoch": 7322} {"train_loss": -27.101552963256836, "global_step": 607739, "epoch": 7322} {"train_loss": -26.963123321533203, "global_step": 607740, "epoch": 7322} {"train_loss": -27.043848037719727, "global_step": 607741, "epoch": 7322} {"train_loss": -27.451757431030273, "global_step": 607742, "epoch": 7322} {"train_loss": -26.880964279174805, "global_step": 607743, "epoch": 7322} {"train_loss": -27.112289428710938, "global_step": 607744, "epoch": 7322} {"train_loss": -27.3223819732666, "global_step": 607745, "epoch": 7322} {"train_loss": -27.3393611907959, "global_step": 607746, "epoch": 7322} {"train_loss": -27.70334815979004, "global_step": 607747, "epoch": 7322} {"train_loss": -27.63169288635254, "global_step": 607748, "epoch": 7322} {"train_loss": -27.691049575805664, "global_step": 607749, "epoch": 7322} {"train_loss": -27.648700714111328, "global_step": 607750, "epoch": 7322} {"train_loss": -27.399927139282227, "global_step": 607751, "epoch": 7322} {"train_loss": -27.904434204101562, "global_step": 607752, "epoch": 7322} {"train_loss": -27.723987579345703, "global_step": 607753, "epoch": 7322} {"train_loss": -27.824020385742188, "global_step": 607754, "epoch": 7322} {"train_loss": -27.61408042907715, "global_step": 607755, "epoch": 7322} {"train_loss": -27.92258071899414, "global_step": 607756, "epoch": 7322} {"train_loss": -27.59797477722168, "global_step": 607757, "epoch": 7322} {"train_loss": -27.62449073791504, "global_step": 607758, "epoch": 7322} {"train_loss": -27.837055206298828, "global_step": 607759, "epoch": 7322} {"train_loss": -28.104345321655273, "global_step": 607760, "epoch": 7322} {"train_loss": -27.924768447875977, "global_step": 607761, "epoch": 7322} {"train_loss": -28.13837242126465, "global_step": 607762, "epoch": 7322} {"train_loss": -27.76197624206543, "global_step": 607763, "epoch": 7322} {"train_loss": -27.9520320892334, "global_step": 607764, "epoch": 7322} {"train_loss": -27.928924560546875, "global_step": 607765, "epoch": 7322} {"train_loss": -28.068090438842773, "global_step": 607766, "epoch": 7322} {"train_loss": -28.085180282592773, "global_step": 607767, "epoch": 7322} {"train_loss": -28.093265533447266, "global_step": 607768, "epoch": 7322} {"train_loss": -28.17702293395996, "global_step": 607769, "epoch": 7322} {"train_loss": -28.10272789001465, "global_step": 607770, "epoch": 7322} {"train_loss": -27.79558753967285, "global_step": 607771, "epoch": 7322} {"train_loss": -28.162939071655273, "global_step": 607772, "epoch": 7322} {"train_loss": -28.021915435791016, "global_step": 607773, "epoch": 7322} {"train_loss": -28.357440948486328, "global_step": 607774, "epoch": 7322} {"train_loss": -28.395278930664062, "global_step": 607775, "epoch": 7322} {"train_loss": -28.071949005126953, "global_step": 607776, "epoch": 7322} {"train_loss": -28.195920944213867, "global_step": 607777, "epoch": 7322} {"train_loss": -28.267969131469727, "global_step": 607778, "epoch": 7322} {"train_loss": -27.870407104492188, "global_step": 607779, "epoch": 7322} {"train_loss": -28.091156005859375, "global_step": 607780, "epoch": 7322} {"train_loss": -28.08405876159668, "global_step": 607781, "epoch": 7322} {"train_loss": -28.06183433532715, "global_step": 607782, "epoch": 7322} {"train_loss": -28.750568389892578, "global_step": 607783, "epoch": 7322} {"train_loss": -28.11211585998535, "global_step": 607784, "epoch": 7322} {"train_loss": -28.31853675842285, "global_step": 607785, "epoch": 7322} {"train_loss": -28.212493896484375, "global_step": 607786, "epoch": 7322} {"train_loss": -28.2277774810791, "global_step": 607787, "epoch": 7322} {"train_loss": -28.462509155273438, "global_step": 607788, "epoch": 7322} {"train_loss": -27.91080665588379, "global_step": 607789, "epoch": 7322} {"train_loss": -28.306737899780273, "global_step": 607790, "epoch": 7322} {"train_loss": -28.299182891845703, "global_step": 607791, "epoch": 7322} {"train_loss": -28.124317169189453, "global_step": 607792, "epoch": 7322} {"train_loss": -28.297849655151367, "global_step": 607793, "epoch": 7322} {"train_loss": -28.148487091064453, "global_step": 607794, "epoch": 7322} {"train_loss": -28.23003578186035, "global_step": 607795, "epoch": 7322} {"train_loss": -28.176801681518555, "global_step": 607796, "epoch": 7322} {"train_loss": -28.1525821685791, "global_step": 607797, "epoch": 7322} {"train_loss": -28.170663833618164, "global_step": 607798, "epoch": 7322} {"train_loss": -28.09566307067871, "global_step": 607799, "epoch": 7322} {"train_loss": -28.51999855041504, "global_step": 607800, "epoch": 7322} {"train_loss": -28.087324142456055, "global_step": 607801, "epoch": 7322} {"train_loss": -28.226287841796875, "global_step": 607802, "epoch": 7322} {"train_loss": -28.546117782592773, "global_step": 607803, "epoch": 7322} {"train_loss": -28.13163185119629, "global_step": 607804, "epoch": 7322} {"train_loss": -28.18695068359375, "global_step": 607805, "epoch": 7322} {"train_loss": -28.377517700195312, "global_step": 607806, "epoch": 7322} {"train_loss": -28.187009811401367, "global_step": 607807, "epoch": 7322} {"train_loss": -27.753819178385907, "global_step": 607808, "epoch": 7322, "val_loss": 6638165.0} {"train_loss": -27.668582916259766, "global_step": 607809, "epoch": 7323} {"train_loss": -27.696552276611328, "global_step": 607810, "epoch": 7323} {"train_loss": -27.954681396484375, "global_step": 607811, "epoch": 7323} {"train_loss": -27.659589767456055, "global_step": 607812, "epoch": 7323} {"train_loss": -27.364294052124023, "global_step": 607813, "epoch": 7323} {"train_loss": -27.387359619140625, "global_step": 607814, "epoch": 7323} {"train_loss": -26.442541122436523, "global_step": 607815, "epoch": 7323} {"train_loss": -26.017608642578125, "global_step": 607816, "epoch": 7323} {"train_loss": -26.907684326171875, "global_step": 607817, "epoch": 7323} {"train_loss": -27.768268585205078, "global_step": 607818, "epoch": 7323} {"train_loss": -27.144750595092773, "global_step": 607819, "epoch": 7323} {"train_loss": -27.581085205078125, "global_step": 607820, "epoch": 7323} {"train_loss": -27.60772132873535, "global_step": 607821, "epoch": 7323} {"train_loss": -27.030942916870117, "global_step": 607822, "epoch": 7323} {"train_loss": -27.706710815429688, "global_step": 607823, "epoch": 7323} {"train_loss": -26.973661422729492, "global_step": 607824, "epoch": 7323} {"train_loss": -27.61220359802246, "global_step": 607825, "epoch": 7323} {"train_loss": -27.640729904174805, "global_step": 607826, "epoch": 7323} {"train_loss": -27.80049705505371, "global_step": 607827, "epoch": 7323} {"train_loss": -27.220251083374023, "global_step": 607828, "epoch": 7323} {"train_loss": -27.82012939453125, "global_step": 607829, "epoch": 7323} {"train_loss": -27.250904083251953, "global_step": 607830, "epoch": 7323} {"train_loss": -27.84506607055664, "global_step": 607831, "epoch": 7323} {"train_loss": -27.571191787719727, "global_step": 607832, "epoch": 7323} {"train_loss": -27.649185180664062, "global_step": 607833, "epoch": 7323} {"train_loss": -27.808935165405273, "global_step": 607834, "epoch": 7323} {"train_loss": -27.673816680908203, "global_step": 607835, "epoch": 7323} {"train_loss": -27.8245906829834, "global_step": 607836, "epoch": 7323} {"train_loss": -27.739089965820312, "global_step": 607837, "epoch": 7323} {"train_loss": -27.84670066833496, "global_step": 607838, "epoch": 7323} {"train_loss": -27.538312911987305, "global_step": 607839, "epoch": 7323} {"train_loss": -27.9883975982666, "global_step": 607840, "epoch": 7323} {"train_loss": -28.4366512298584, "global_step": 607841, "epoch": 7323} {"train_loss": -27.717254638671875, "global_step": 607842, "epoch": 7323} {"train_loss": -27.965457916259766, "global_step": 607843, "epoch": 7323} {"train_loss": -27.8878231048584, "global_step": 607844, "epoch": 7323} {"train_loss": -28.270078659057617, "global_step": 607845, "epoch": 7323} {"train_loss": -28.051258087158203, "global_step": 607846, "epoch": 7323} {"train_loss": -28.288806915283203, "global_step": 607847, "epoch": 7323} {"train_loss": -27.99445915222168, "global_step": 607848, "epoch": 7323} {"train_loss": -28.11305046081543, "global_step": 607849, "epoch": 7323} {"train_loss": -28.197336196899414, "global_step": 607850, "epoch": 7323} {"train_loss": -28.079029083251953, "global_step": 607851, "epoch": 7323} {"train_loss": -28.19822120666504, "global_step": 607852, "epoch": 7323} {"train_loss": -28.27461051940918, "global_step": 607853, "epoch": 7323} {"train_loss": -28.071914672851562, "global_step": 607854, "epoch": 7323} {"train_loss": -28.113073348999023, "global_step": 607855, "epoch": 7323} {"train_loss": -28.321075439453125, "global_step": 607856, "epoch": 7323} {"train_loss": -28.0613956451416, "global_step": 607857, "epoch": 7323} {"train_loss": -28.43155860900879, "global_step": 607858, "epoch": 7323} {"train_loss": -28.219091415405273, "global_step": 607859, "epoch": 7323} {"train_loss": -28.17140007019043, "global_step": 607860, "epoch": 7323} {"train_loss": -28.19874382019043, "global_step": 607861, "epoch": 7323} {"train_loss": -28.369375228881836, "global_step": 607862, "epoch": 7323} {"train_loss": -28.274215698242188, "global_step": 607863, "epoch": 7323} {"train_loss": -28.31966209411621, "global_step": 607864, "epoch": 7323} {"train_loss": -28.29668617248535, "global_step": 607865, "epoch": 7323} {"train_loss": -28.623615264892578, "global_step": 607866, "epoch": 7323} {"train_loss": -28.262975692749023, "global_step": 607867, "epoch": 7323} {"train_loss": -28.215518951416016, "global_step": 607868, "epoch": 7323} {"train_loss": -28.2713680267334, "global_step": 607869, "epoch": 7323} {"train_loss": -28.20879554748535, "global_step": 607870, "epoch": 7323} {"train_loss": -28.4295711517334, "global_step": 607871, "epoch": 7323} {"train_loss": -28.402387619018555, "global_step": 607872, "epoch": 7323} {"train_loss": -28.325611114501953, "global_step": 607873, "epoch": 7323} {"train_loss": -28.480520248413086, "global_step": 607874, "epoch": 7323} {"train_loss": -28.038593292236328, "global_step": 607875, "epoch": 7323} {"train_loss": -27.987462997436523, "global_step": 607876, "epoch": 7323} {"train_loss": -28.321813583374023, "global_step": 607877, "epoch": 7323} {"train_loss": -27.776214599609375, "global_step": 607878, "epoch": 7323} {"train_loss": -27.969213485717773, "global_step": 607879, "epoch": 7323} {"train_loss": -28.2416934967041, "global_step": 607880, "epoch": 7323} {"train_loss": -28.395923614501953, "global_step": 607881, "epoch": 7323} {"train_loss": -27.81247901916504, "global_step": 607882, "epoch": 7323} {"train_loss": -28.136579513549805, "global_step": 607883, "epoch": 7323} {"train_loss": -27.88759422302246, "global_step": 607884, "epoch": 7323} {"train_loss": -28.166889190673828, "global_step": 607885, "epoch": 7323} {"train_loss": -28.37018394470215, "global_step": 607886, "epoch": 7323} {"train_loss": -27.908538818359375, "global_step": 607887, "epoch": 7323} {"train_loss": -28.216659545898438, "global_step": 607888, "epoch": 7323} {"train_loss": -27.6966609954834, "global_step": 607889, "epoch": 7323} {"train_loss": -27.801227569580078, "global_step": 607890, "epoch": 7323} {"train_loss": -27.8971440188856, "global_step": 607891, "epoch": 7323, "val_loss": 6590918.0} {"train_loss": -25.798084259033203, "global_step": 607892, "epoch": 7324} {"train_loss": -23.424776077270508, "global_step": 607893, "epoch": 7324} {"train_loss": -24.441131591796875, "global_step": 607894, "epoch": 7324} {"train_loss": -26.37762451171875, "global_step": 607895, "epoch": 7324} {"train_loss": -25.377302169799805, "global_step": 607896, "epoch": 7324} {"train_loss": -25.185810089111328, "global_step": 607897, "epoch": 7324} {"train_loss": -25.8878116607666, "global_step": 607898, "epoch": 7324} {"train_loss": -26.646982192993164, "global_step": 607899, "epoch": 7324} {"train_loss": -26.1086368560791, "global_step": 607900, "epoch": 7324} {"train_loss": -26.049463272094727, "global_step": 607901, "epoch": 7324} {"train_loss": -26.41727638244629, "global_step": 607902, "epoch": 7324} {"train_loss": -26.21925163269043, "global_step": 607903, "epoch": 7324} {"train_loss": -26.7193603515625, "global_step": 607904, "epoch": 7324} {"train_loss": -26.34282875061035, "global_step": 607905, "epoch": 7324} {"train_loss": -26.435850143432617, "global_step": 607906, "epoch": 7324} {"train_loss": -26.921255111694336, "global_step": 607907, "epoch": 7324} {"train_loss": -26.361865997314453, "global_step": 607908, "epoch": 7324} {"train_loss": -26.73969841003418, "global_step": 607909, "epoch": 7324} {"train_loss": -27.092315673828125, "global_step": 607910, "epoch": 7324} {"train_loss": -26.72769546508789, "global_step": 607911, "epoch": 7324} {"train_loss": -27.019819259643555, "global_step": 607912, "epoch": 7324} {"train_loss": -26.738616943359375, "global_step": 607913, "epoch": 7324} {"train_loss": -26.960168838500977, "global_step": 607914, "epoch": 7324} {"train_loss": -27.183746337890625, "global_step": 607915, "epoch": 7324} {"train_loss": -26.9783935546875, "global_step": 607916, "epoch": 7324} {"train_loss": -27.08308219909668, "global_step": 607917, "epoch": 7324} {"train_loss": -27.61292839050293, "global_step": 607918, "epoch": 7324} {"train_loss": -27.33363914489746, "global_step": 607919, "epoch": 7324} {"train_loss": -27.035266876220703, "global_step": 607920, "epoch": 7324} {"train_loss": -27.530500411987305, "global_step": 607921, "epoch": 7324} {"train_loss": -27.559045791625977, "global_step": 607922, "epoch": 7324} {"train_loss": -27.288129806518555, "global_step": 607923, "epoch": 7324} {"train_loss": -27.65484619140625, "global_step": 607924, "epoch": 7324} {"train_loss": -27.681745529174805, "global_step": 607925, "epoch": 7324} {"train_loss": -27.676115036010742, "global_step": 607926, "epoch": 7324} {"train_loss": -27.71491813659668, "global_step": 607927, "epoch": 7324} {"train_loss": -27.58523941040039, "global_step": 607928, "epoch": 7324} {"train_loss": -27.70953369140625, "global_step": 607929, "epoch": 7324} {"train_loss": -27.70966911315918, "global_step": 607930, "epoch": 7324} {"train_loss": -27.721893310546875, "global_step": 607931, "epoch": 7324} {"train_loss": -27.891681671142578, "global_step": 607932, "epoch": 7324} {"train_loss": -27.743154525756836, "global_step": 607933, "epoch": 7324} {"train_loss": -27.940921783447266, "global_step": 607934, "epoch": 7324} {"train_loss": -27.762174606323242, "global_step": 607935, "epoch": 7324} {"train_loss": -28.11639976501465, "global_step": 607936, "epoch": 7324} {"train_loss": -27.73792839050293, "global_step": 607937, "epoch": 7324} {"train_loss": -28.05860710144043, "global_step": 607938, "epoch": 7324} {"train_loss": -27.968103408813477, "global_step": 607939, "epoch": 7324} {"train_loss": -28.129535675048828, "global_step": 607940, "epoch": 7324} {"train_loss": -28.097137451171875, "global_step": 607941, "epoch": 7324} {"train_loss": -28.064008712768555, "global_step": 607942, "epoch": 7324} {"train_loss": -28.010473251342773, "global_step": 607943, "epoch": 7324} {"train_loss": -28.308765411376953, "global_step": 607944, "epoch": 7324} {"train_loss": -28.247913360595703, "global_step": 607945, "epoch": 7324} {"train_loss": -28.463714599609375, "global_step": 607946, "epoch": 7324} {"train_loss": -28.479902267456055, "global_step": 607947, "epoch": 7324} {"train_loss": -28.462833404541016, "global_step": 607948, "epoch": 7324} {"train_loss": -28.370187759399414, "global_step": 607949, "epoch": 7324} {"train_loss": -28.419178009033203, "global_step": 607950, "epoch": 7324} {"train_loss": -28.417510986328125, "global_step": 607951, "epoch": 7324} {"train_loss": -28.193561553955078, "global_step": 607952, "epoch": 7324} {"train_loss": -28.1103458404541, "global_step": 607953, "epoch": 7324} {"train_loss": -28.382287979125977, "global_step": 607954, "epoch": 7324} {"train_loss": -28.253437042236328, "global_step": 607955, "epoch": 7324} {"train_loss": -27.99368667602539, "global_step": 607956, "epoch": 7324} {"train_loss": -28.1337890625, "global_step": 607957, "epoch": 7324} {"train_loss": -28.218612670898438, "global_step": 607958, "epoch": 7324} {"train_loss": -28.5078067779541, "global_step": 607959, "epoch": 7324} {"train_loss": -28.093149185180664, "global_step": 607960, "epoch": 7324} {"train_loss": -27.659442901611328, "global_step": 607961, "epoch": 7324} {"train_loss": -27.800512313842773, "global_step": 607962, "epoch": 7324} {"train_loss": -27.619260787963867, "global_step": 607963, "epoch": 7324} {"train_loss": -27.994903564453125, "global_step": 607964, "epoch": 7324} {"train_loss": -28.192106246948242, "global_step": 607965, "epoch": 7324} {"train_loss": -28.048864364624023, "global_step": 607966, "epoch": 7324} {"train_loss": -28.397750854492188, "global_step": 607967, "epoch": 7324} {"train_loss": -28.23746109008789, "global_step": 607968, "epoch": 7324} {"train_loss": -28.202762603759766, "global_step": 607969, "epoch": 7324} {"train_loss": -28.127674102783203, "global_step": 607970, "epoch": 7324} {"train_loss": -28.101837158203125, "global_step": 607971, "epoch": 7324} {"train_loss": -28.30039405822754, "global_step": 607972, "epoch": 7324} {"train_loss": -28.02982521057129, "global_step": 607973, "epoch": 7324} {"train_loss": -27.43505732984428, "global_step": 607974, "epoch": 7324, "val_loss": 6738593.0} {"train_loss": -27.381637573242188, "global_step": 607975, "epoch": 7325} {"train_loss": -27.799468994140625, "global_step": 607976, "epoch": 7325} {"train_loss": -27.114770889282227, "global_step": 607977, "epoch": 7325} {"train_loss": -27.13763999938965, "global_step": 607978, "epoch": 7325} {"train_loss": -27.5327091217041, "global_step": 607979, "epoch": 7325} {"train_loss": -27.463232040405273, "global_step": 607980, "epoch": 7325} {"train_loss": -27.10548210144043, "global_step": 607981, "epoch": 7325} {"train_loss": -27.528303146362305, "global_step": 607982, "epoch": 7325} {"train_loss": -27.45330810546875, "global_step": 607983, "epoch": 7325} {"train_loss": -27.363311767578125, "global_step": 607984, "epoch": 7325} {"train_loss": -27.347320556640625, "global_step": 607985, "epoch": 7325} {"train_loss": -27.452306747436523, "global_step": 607986, "epoch": 7325} {"train_loss": -27.703786849975586, "global_step": 607987, "epoch": 7325} {"train_loss": -27.865554809570312, "global_step": 607988, "epoch": 7325} {"train_loss": -27.498891830444336, "global_step": 607989, "epoch": 7325} {"train_loss": -27.66708755493164, "global_step": 607990, "epoch": 7325} {"train_loss": -27.663604736328125, "global_step": 607991, "epoch": 7325} {"train_loss": -28.107892990112305, "global_step": 607992, "epoch": 7325} {"train_loss": -27.681798934936523, "global_step": 607993, "epoch": 7325} {"train_loss": -27.719573974609375, "global_step": 607994, "epoch": 7325} {"train_loss": -27.79498863220215, "global_step": 607995, "epoch": 7325} {"train_loss": -27.86591911315918, "global_step": 607996, "epoch": 7325} {"train_loss": -27.783262252807617, "global_step": 607997, "epoch": 7325} {"train_loss": -28.05156898498535, "global_step": 607998, "epoch": 7325} {"train_loss": -27.911108016967773, "global_step": 607999, "epoch": 7325} {"train_loss": -27.92713737487793, "global_step": 608000, "epoch": 7325} {"train_loss": -28.157001495361328, "global_step": 608001, "epoch": 7325} {"train_loss": -27.791839599609375, "global_step": 608002, "epoch": 7325} {"train_loss": -27.766271591186523, "global_step": 608003, "epoch": 7325} {"train_loss": -27.973773956298828, "global_step": 608004, "epoch": 7325} {"train_loss": -28.163238525390625, "global_step": 608005, "epoch": 7325} {"train_loss": -28.160873413085938, "global_step": 608006, "epoch": 7325} {"train_loss": -27.88667106628418, "global_step": 608007, "epoch": 7325} {"train_loss": -28.0986328125, "global_step": 608008, "epoch": 7325} {"train_loss": -28.074167251586914, "global_step": 608009, "epoch": 7325} {"train_loss": -28.061986923217773, "global_step": 608010, "epoch": 7325} {"train_loss": -27.933094024658203, "global_step": 608011, "epoch": 7325} {"train_loss": -28.236316680908203, "global_step": 608012, "epoch": 7325} {"train_loss": -28.28554344177246, "global_step": 608013, "epoch": 7325} {"train_loss": -28.398038864135742, "global_step": 608014, "epoch": 7325} {"train_loss": -28.349767684936523, "global_step": 608015, "epoch": 7325} {"train_loss": -28.42181968688965, "global_step": 608016, "epoch": 7325} {"train_loss": -28.152841567993164, "global_step": 608017, "epoch": 7325} {"train_loss": -28.32977867126465, "global_step": 608018, "epoch": 7325} {"train_loss": -28.626117706298828, "global_step": 608019, "epoch": 7325} {"train_loss": -28.255578994750977, "global_step": 608020, "epoch": 7325} {"train_loss": -28.295202255249023, "global_step": 608021, "epoch": 7325} {"train_loss": -28.33806800842285, "global_step": 608022, "epoch": 7325} {"train_loss": -28.39902114868164, "global_step": 608023, "epoch": 7325} {"train_loss": -28.34832763671875, "global_step": 608024, "epoch": 7325} {"train_loss": -27.9954833984375, "global_step": 608025, "epoch": 7325} {"train_loss": -28.17469596862793, "global_step": 608026, "epoch": 7325} {"train_loss": -28.065580368041992, "global_step": 608027, "epoch": 7325} {"train_loss": -27.808130264282227, "global_step": 608028, "epoch": 7325} {"train_loss": -28.030969619750977, "global_step": 608029, "epoch": 7325} {"train_loss": -28.299713134765625, "global_step": 608030, "epoch": 7325} {"train_loss": -28.1049747467041, "global_step": 608031, "epoch": 7325} {"train_loss": -27.945545196533203, "global_step": 608032, "epoch": 7325} {"train_loss": -27.864486694335938, "global_step": 608033, "epoch": 7325} {"train_loss": -27.881122589111328, "global_step": 608034, "epoch": 7325} {"train_loss": -28.107318878173828, "global_step": 608035, "epoch": 7325} {"train_loss": -28.287694931030273, "global_step": 608036, "epoch": 7325} {"train_loss": -28.241357803344727, "global_step": 608037, "epoch": 7325} {"train_loss": -28.15192222595215, "global_step": 608038, "epoch": 7325} {"train_loss": -27.518070220947266, "global_step": 608039, "epoch": 7325} {"train_loss": -28.0801944732666, "global_step": 608040, "epoch": 7325} {"train_loss": -27.923139572143555, "global_step": 608041, "epoch": 7325} {"train_loss": -27.97124671936035, "global_step": 608042, "epoch": 7325} {"train_loss": -28.0948543548584, "global_step": 608043, "epoch": 7325} {"train_loss": -28.170578002929688, "global_step": 608044, "epoch": 7325} {"train_loss": -28.4865665435791, "global_step": 608045, "epoch": 7325} {"train_loss": -27.8775634765625, "global_step": 608046, "epoch": 7325} {"train_loss": -28.431726455688477, "global_step": 608047, "epoch": 7325} {"train_loss": -28.451995849609375, "global_step": 608048, "epoch": 7325} {"train_loss": -28.295988082885742, "global_step": 608049, "epoch": 7325} {"train_loss": -28.202228546142578, "global_step": 608050, "epoch": 7325} {"train_loss": -28.10796546936035, "global_step": 608051, "epoch": 7325} {"train_loss": -27.911916732788086, "global_step": 608052, "epoch": 7325} {"train_loss": -28.104663848876953, "global_step": 608053, "epoch": 7325} {"train_loss": -28.191370010375977, "global_step": 608054, "epoch": 7325} {"train_loss": -28.406885147094727, "global_step": 608055, "epoch": 7325} {"train_loss": -28.714197158813477, "global_step": 608056, "epoch": 7325} {"train_loss": -27.977841158947314, "global_step": 608057, "epoch": 7325, "val_loss": 6623426.0} {"train_loss": -26.8633975982666, "global_step": 608058, "epoch": 7326} {"train_loss": -27.3853816986084, "global_step": 608059, "epoch": 7326} {"train_loss": -27.419275283813477, "global_step": 608060, "epoch": 7326} {"train_loss": -28.03370475769043, "global_step": 608061, "epoch": 7326} {"train_loss": -26.485153198242188, "global_step": 608062, "epoch": 7326} {"train_loss": -27.684301376342773, "global_step": 608063, "epoch": 7326} {"train_loss": -27.543867111206055, "global_step": 608064, "epoch": 7326} {"train_loss": -27.610946655273438, "global_step": 608065, "epoch": 7326} {"train_loss": -27.634851455688477, "global_step": 608066, "epoch": 7326} {"train_loss": -27.976245880126953, "global_step": 608067, "epoch": 7326} {"train_loss": -27.40174674987793, "global_step": 608068, "epoch": 7326} {"train_loss": -28.120086669921875, "global_step": 608069, "epoch": 7326} {"train_loss": -27.902393341064453, "global_step": 608070, "epoch": 7326} {"train_loss": -27.845626831054688, "global_step": 608071, "epoch": 7326} {"train_loss": -27.849945068359375, "global_step": 608072, "epoch": 7326} {"train_loss": -27.821706771850586, "global_step": 608073, "epoch": 7326} {"train_loss": -27.91240882873535, "global_step": 608074, "epoch": 7326} {"train_loss": -27.678064346313477, "global_step": 608075, "epoch": 7326} {"train_loss": -27.8356990814209, "global_step": 608076, "epoch": 7326} {"train_loss": -28.323089599609375, "global_step": 608077, "epoch": 7326} {"train_loss": -27.993616104125977, "global_step": 608078, "epoch": 7326} {"train_loss": -27.999805450439453, "global_step": 608079, "epoch": 7326} {"train_loss": -27.767858505249023, "global_step": 608080, "epoch": 7326} {"train_loss": -28.19919204711914, "global_step": 608081, "epoch": 7326} {"train_loss": -27.92989158630371, "global_step": 608082, "epoch": 7326} {"train_loss": -27.920324325561523, "global_step": 608083, "epoch": 7326} {"train_loss": -28.0833797454834, "global_step": 608084, "epoch": 7326} {"train_loss": -27.884130477905273, "global_step": 608085, "epoch": 7326} {"train_loss": -28.072961807250977, "global_step": 608086, "epoch": 7326} {"train_loss": -28.134077072143555, "global_step": 608087, "epoch": 7326} {"train_loss": -28.158111572265625, "global_step": 608088, "epoch": 7326} {"train_loss": -28.150836944580078, "global_step": 608089, "epoch": 7326} {"train_loss": -28.108121871948242, "global_step": 608090, "epoch": 7326} {"train_loss": -28.13864517211914, "global_step": 608091, "epoch": 7326} {"train_loss": -28.10611915588379, "global_step": 608092, "epoch": 7326} {"train_loss": -28.26991081237793, "global_step": 608093, "epoch": 7326} {"train_loss": -27.923742294311523, "global_step": 608094, "epoch": 7326} {"train_loss": -27.7039737701416, "global_step": 608095, "epoch": 7326} {"train_loss": -27.589309692382812, "global_step": 608096, "epoch": 7326} {"train_loss": -28.080413818359375, "global_step": 608097, "epoch": 7326} {"train_loss": -27.708850860595703, "global_step": 608098, "epoch": 7326} {"train_loss": -27.87776756286621, "global_step": 608099, "epoch": 7326} {"train_loss": -27.68680191040039, "global_step": 608100, "epoch": 7326} {"train_loss": -28.374059677124023, "global_step": 608101, "epoch": 7326} {"train_loss": -27.997344970703125, "global_step": 608102, "epoch": 7326} {"train_loss": -28.245849609375, "global_step": 608103, "epoch": 7326} {"train_loss": -27.476118087768555, "global_step": 608104, "epoch": 7326} {"train_loss": -27.730432510375977, "global_step": 608105, "epoch": 7326} {"train_loss": -27.974767684936523, "global_step": 608106, "epoch": 7326} {"train_loss": -28.452133178710938, "global_step": 608107, "epoch": 7326} {"train_loss": -28.116504669189453, "global_step": 608108, "epoch": 7326} {"train_loss": -27.91814613342285, "global_step": 608109, "epoch": 7326} {"train_loss": -27.888248443603516, "global_step": 608110, "epoch": 7326} {"train_loss": -28.02141761779785, "global_step": 608111, "epoch": 7326} {"train_loss": -28.087005615234375, "global_step": 608112, "epoch": 7326} {"train_loss": -28.020715713500977, "global_step": 608113, "epoch": 7326} {"train_loss": -27.997201919555664, "global_step": 608114, "epoch": 7326} {"train_loss": -28.233673095703125, "global_step": 608115, "epoch": 7326} {"train_loss": -28.146514892578125, "global_step": 608116, "epoch": 7326} {"train_loss": -28.1123104095459, "global_step": 608117, "epoch": 7326} {"train_loss": -28.11983299255371, "global_step": 608118, "epoch": 7326} {"train_loss": -28.302053451538086, "global_step": 608119, "epoch": 7326} {"train_loss": -28.24106788635254, "global_step": 608120, "epoch": 7326} {"train_loss": -28.178695678710938, "global_step": 608121, "epoch": 7326} {"train_loss": -28.17717933654785, "global_step": 608122, "epoch": 7326} {"train_loss": -28.403486251831055, "global_step": 608123, "epoch": 7326} {"train_loss": -28.29355812072754, "global_step": 608124, "epoch": 7326} {"train_loss": -28.237506866455078, "global_step": 608125, "epoch": 7326} {"train_loss": -28.342071533203125, "global_step": 608126, "epoch": 7326} {"train_loss": -28.32526969909668, "global_step": 608127, "epoch": 7326} {"train_loss": -28.0664119720459, "global_step": 608128, "epoch": 7326} {"train_loss": -28.570648193359375, "global_step": 608129, "epoch": 7326} {"train_loss": -28.05734634399414, "global_step": 608130, "epoch": 7326} {"train_loss": -28.102380752563477, "global_step": 608131, "epoch": 7326} {"train_loss": -28.361572265625, "global_step": 608132, "epoch": 7326} {"train_loss": -28.265966415405273, "global_step": 608133, "epoch": 7326} {"train_loss": -27.68597412109375, "global_step": 608134, "epoch": 7326} {"train_loss": -27.46876335144043, "global_step": 608135, "epoch": 7326} {"train_loss": -27.606420516967773, "global_step": 608136, "epoch": 7326} {"train_loss": -27.92939567565918, "global_step": 608137, "epoch": 7326} {"train_loss": -27.7960205078125, "global_step": 608138, "epoch": 7326} {"train_loss": -27.247976303100586, "global_step": 608139, "epoch": 7326} {"train_loss": -27.923500061035156, "global_step": 608140, "epoch": 7326, "val_loss": 6617968.0} {"train_loss": -26.452939987182617, "global_step": 608141, "epoch": 7327} {"train_loss": -20.49895477294922, "global_step": 608142, "epoch": 7327} {"train_loss": -23.476009368896484, "global_step": 608143, "epoch": 7327} {"train_loss": -25.83323097229004, "global_step": 608144, "epoch": 7327} {"train_loss": -24.718820571899414, "global_step": 608145, "epoch": 7327} {"train_loss": -25.667444229125977, "global_step": 608146, "epoch": 7327} {"train_loss": -26.261157989501953, "global_step": 608147, "epoch": 7327} {"train_loss": -25.50276756286621, "global_step": 608148, "epoch": 7327} {"train_loss": -26.426244735717773, "global_step": 608149, "epoch": 7327} {"train_loss": -26.091724395751953, "global_step": 608150, "epoch": 7327} {"train_loss": -26.0269775390625, "global_step": 608151, "epoch": 7327} {"train_loss": -26.482847213745117, "global_step": 608152, "epoch": 7327} {"train_loss": -26.80606460571289, "global_step": 608153, "epoch": 7327} {"train_loss": -26.16522789001465, "global_step": 608154, "epoch": 7327} {"train_loss": -26.81159782409668, "global_step": 608155, "epoch": 7327} {"train_loss": -26.661457061767578, "global_step": 608156, "epoch": 7327} {"train_loss": -26.171707153320312, "global_step": 608157, "epoch": 7327} {"train_loss": -27.079496383666992, "global_step": 608158, "epoch": 7327} {"train_loss": -26.989709854125977, "global_step": 608159, "epoch": 7327} {"train_loss": -26.754413604736328, "global_step": 608160, "epoch": 7327} {"train_loss": -27.3572998046875, "global_step": 608161, "epoch": 7327} {"train_loss": -27.01358985900879, "global_step": 608162, "epoch": 7327} {"train_loss": -27.100183486938477, "global_step": 608163, "epoch": 7327} {"train_loss": -26.961456298828125, "global_step": 608164, "epoch": 7327} {"train_loss": -26.968957901000977, "global_step": 608165, "epoch": 7327} {"train_loss": -27.0809268951416, "global_step": 608166, "epoch": 7327} {"train_loss": -26.927595138549805, "global_step": 608167, "epoch": 7327} {"train_loss": -27.478429794311523, "global_step": 608168, "epoch": 7327} {"train_loss": -27.078046798706055, "global_step": 608169, "epoch": 7327} {"train_loss": -27.32574462890625, "global_step": 608170, "epoch": 7327} {"train_loss": -27.498077392578125, "global_step": 608171, "epoch": 7327} {"train_loss": -27.596057891845703, "global_step": 608172, "epoch": 7327} {"train_loss": -27.429874420166016, "global_step": 608173, "epoch": 7327} {"train_loss": -27.755634307861328, "global_step": 608174, "epoch": 7327} {"train_loss": -27.62017822265625, "global_step": 608175, "epoch": 7327} {"train_loss": -27.0790958404541, "global_step": 608176, "epoch": 7327} {"train_loss": -27.471832275390625, "global_step": 608177, "epoch": 7327} {"train_loss": -27.31585693359375, "global_step": 608178, "epoch": 7327} {"train_loss": -27.4205379486084, "global_step": 608179, "epoch": 7327} {"train_loss": -27.40166664123535, "global_step": 608180, "epoch": 7327} {"train_loss": -27.533910751342773, "global_step": 608181, "epoch": 7327} {"train_loss": -27.55515480041504, "global_step": 608182, "epoch": 7327} {"train_loss": -27.62528419494629, "global_step": 608183, "epoch": 7327} {"train_loss": -27.612030029296875, "global_step": 608184, "epoch": 7327} {"train_loss": -27.89056968688965, "global_step": 608185, "epoch": 7327} {"train_loss": -27.902542114257812, "global_step": 608186, "epoch": 7327} {"train_loss": -27.54007339477539, "global_step": 608187, "epoch": 7327} {"train_loss": -28.047574996948242, "global_step": 608188, "epoch": 7327} {"train_loss": -27.86688232421875, "global_step": 608189, "epoch": 7327} {"train_loss": -27.92083740234375, "global_step": 608190, "epoch": 7327} {"train_loss": -27.66033935546875, "global_step": 608191, "epoch": 7327} {"train_loss": -27.939849853515625, "global_step": 608192, "epoch": 7327} {"train_loss": -27.7305908203125, "global_step": 608193, "epoch": 7327} {"train_loss": -27.31965446472168, "global_step": 608194, "epoch": 7327} {"train_loss": -27.501073837280273, "global_step": 608195, "epoch": 7327} {"train_loss": -28.12702751159668, "global_step": 608196, "epoch": 7327} {"train_loss": -27.52742576599121, "global_step": 608197, "epoch": 7327} {"train_loss": -27.593114852905273, "global_step": 608198, "epoch": 7327} {"train_loss": -28.227521896362305, "global_step": 608199, "epoch": 7327} {"train_loss": -27.69719886779785, "global_step": 608200, "epoch": 7327} {"train_loss": -27.919301986694336, "global_step": 608201, "epoch": 7327} {"train_loss": -27.789621353149414, "global_step": 608202, "epoch": 7327} {"train_loss": -27.660175323486328, "global_step": 608203, "epoch": 7327} {"train_loss": -28.0742244720459, "global_step": 608204, "epoch": 7327} {"train_loss": -28.156320571899414, "global_step": 608205, "epoch": 7327} {"train_loss": -27.848722457885742, "global_step": 608206, "epoch": 7327} {"train_loss": -28.16644287109375, "global_step": 608207, "epoch": 7327} {"train_loss": -27.72019386291504, "global_step": 608208, "epoch": 7327} {"train_loss": -27.587615966796875, "global_step": 608209, "epoch": 7327} {"train_loss": -27.990558624267578, "global_step": 608210, "epoch": 7327} {"train_loss": -28.150476455688477, "global_step": 608211, "epoch": 7327} {"train_loss": -28.20574378967285, "global_step": 608212, "epoch": 7327} {"train_loss": -27.853546142578125, "global_step": 608213, "epoch": 7327} {"train_loss": -27.725446701049805, "global_step": 608214, "epoch": 7327} {"train_loss": -28.116682052612305, "global_step": 608215, "epoch": 7327} {"train_loss": -28.064733505249023, "global_step": 608216, "epoch": 7327} {"train_loss": -27.97452735900879, "global_step": 608217, "epoch": 7327} {"train_loss": -27.970396041870117, "global_step": 608218, "epoch": 7327} {"train_loss": -28.38722038269043, "global_step": 608219, "epoch": 7327} {"train_loss": -28.4034366607666, "global_step": 608220, "epoch": 7327} {"train_loss": -28.272663116455078, "global_step": 608221, "epoch": 7327} {"train_loss": -27.89212417602539, "global_step": 608222, "epoch": 7327} {"train_loss": -27.24441330691418, "global_step": 608223, "epoch": 7327, "val_loss": 6555550.0} {"train_loss": -27.379377365112305, "global_step": 608224, "epoch": 7328} {"train_loss": -27.076679229736328, "global_step": 608225, "epoch": 7328} {"train_loss": -25.711811065673828, "global_step": 608226, "epoch": 7328} {"train_loss": -25.526723861694336, "global_step": 608227, "epoch": 7328} {"train_loss": -25.727081298828125, "global_step": 608228, "epoch": 7328} {"train_loss": -26.938016891479492, "global_step": 608229, "epoch": 7328} {"train_loss": -26.808032989501953, "global_step": 608230, "epoch": 7328} {"train_loss": -27.199560165405273, "global_step": 608231, "epoch": 7328} {"train_loss": -27.481531143188477, "global_step": 608232, "epoch": 7328} {"train_loss": -26.92626953125, "global_step": 608233, "epoch": 7328} {"train_loss": -27.311492919921875, "global_step": 608234, "epoch": 7328} {"train_loss": -27.050695419311523, "global_step": 608235, "epoch": 7328} {"train_loss": -27.49598503112793, "global_step": 608236, "epoch": 7328} {"train_loss": -27.075788497924805, "global_step": 608237, "epoch": 7328} {"train_loss": -27.4398136138916, "global_step": 608238, "epoch": 7328} {"train_loss": -27.16168785095215, "global_step": 608239, "epoch": 7328} {"train_loss": -27.516321182250977, "global_step": 608240, "epoch": 7328} {"train_loss": -27.56503677368164, "global_step": 608241, "epoch": 7328} {"train_loss": -27.378767013549805, "global_step": 608242, "epoch": 7328} {"train_loss": -27.351150512695312, "global_step": 608243, "epoch": 7328} {"train_loss": -27.3170166015625, "global_step": 608244, "epoch": 7328} {"train_loss": -27.836334228515625, "global_step": 608245, "epoch": 7328} {"train_loss": -27.639846801757812, "global_step": 608246, "epoch": 7328} {"train_loss": -27.722442626953125, "global_step": 608247, "epoch": 7328} {"train_loss": -27.323017120361328, "global_step": 608248, "epoch": 7328} {"train_loss": -28.246191024780273, "global_step": 608249, "epoch": 7328} {"train_loss": -27.506317138671875, "global_step": 608250, "epoch": 7328} {"train_loss": -27.62261962890625, "global_step": 608251, "epoch": 7328} {"train_loss": -27.523344039916992, "global_step": 608252, "epoch": 7328} {"train_loss": -27.950708389282227, "global_step": 608253, "epoch": 7328} {"train_loss": -27.68296241760254, "global_step": 608254, "epoch": 7328} {"train_loss": -27.41619300842285, "global_step": 608255, "epoch": 7328} {"train_loss": -27.81989860534668, "global_step": 608256, "epoch": 7328} {"train_loss": -27.659454345703125, "global_step": 608257, "epoch": 7328} {"train_loss": -27.65390396118164, "global_step": 608258, "epoch": 7328} {"train_loss": -28.02754020690918, "global_step": 608259, "epoch": 7328} {"train_loss": -28.197296142578125, "global_step": 608260, "epoch": 7328} {"train_loss": -28.488386154174805, "global_step": 608261, "epoch": 7328} {"train_loss": -27.969205856323242, "global_step": 608262, "epoch": 7328} {"train_loss": -28.1474666595459, "global_step": 608263, "epoch": 7328} {"train_loss": -28.025747299194336, "global_step": 608264, "epoch": 7328} {"train_loss": -28.154855728149414, "global_step": 608265, "epoch": 7328} {"train_loss": -28.0703182220459, "global_step": 608266, "epoch": 7328} {"train_loss": -27.82659339904785, "global_step": 608267, "epoch": 7328} {"train_loss": -28.150930404663086, "global_step": 608268, "epoch": 7328} {"train_loss": -28.422693252563477, "global_step": 608269, "epoch": 7328} {"train_loss": -28.29058265686035, "global_step": 608270, "epoch": 7328} {"train_loss": -28.1776065826416, "global_step": 608271, "epoch": 7328} {"train_loss": -28.37733268737793, "global_step": 608272, "epoch": 7328} {"train_loss": -27.867151260375977, "global_step": 608273, "epoch": 7328} {"train_loss": -28.412572860717773, "global_step": 608274, "epoch": 7328} {"train_loss": -28.16806411743164, "global_step": 608275, "epoch": 7328} {"train_loss": -28.215723037719727, "global_step": 608276, "epoch": 7328} {"train_loss": -28.146991729736328, "global_step": 608277, "epoch": 7328} {"train_loss": -28.05890464782715, "global_step": 608278, "epoch": 7328} {"train_loss": -28.335315704345703, "global_step": 608279, "epoch": 7328} {"train_loss": -28.05812644958496, "global_step": 608280, "epoch": 7328} {"train_loss": -28.125213623046875, "global_step": 608281, "epoch": 7328} {"train_loss": -28.2586727142334, "global_step": 608282, "epoch": 7328} {"train_loss": -28.064762115478516, "global_step": 608283, "epoch": 7328} {"train_loss": -27.81546401977539, "global_step": 608284, "epoch": 7328} {"train_loss": -28.00445556640625, "global_step": 608285, "epoch": 7328} {"train_loss": -28.437185287475586, "global_step": 608286, "epoch": 7328} {"train_loss": -27.732501983642578, "global_step": 608287, "epoch": 7328} {"train_loss": -27.566755294799805, "global_step": 608288, "epoch": 7328} {"train_loss": -27.920745849609375, "global_step": 608289, "epoch": 7328} {"train_loss": -28.064105987548828, "global_step": 608290, "epoch": 7328} {"train_loss": -28.02886962890625, "global_step": 608291, "epoch": 7328} {"train_loss": -27.869665145874023, "global_step": 608292, "epoch": 7328} {"train_loss": -28.1795654296875, "global_step": 608293, "epoch": 7328} {"train_loss": -27.99300193786621, "global_step": 608294, "epoch": 7328} {"train_loss": -28.1828556060791, "global_step": 608295, "epoch": 7328} {"train_loss": -28.299503326416016, "global_step": 608296, "epoch": 7328} {"train_loss": -28.210790634155273, "global_step": 608297, "epoch": 7328} {"train_loss": -28.073383331298828, "global_step": 608298, "epoch": 7328} {"train_loss": -28.168872833251953, "global_step": 608299, "epoch": 7328} {"train_loss": -28.142011642456055, "global_step": 608300, "epoch": 7328} {"train_loss": -28.219472885131836, "global_step": 608301, "epoch": 7328} {"train_loss": -28.054901123046875, "global_step": 608302, "epoch": 7328} {"train_loss": -28.110126495361328, "global_step": 608303, "epoch": 7328} {"train_loss": -28.067529678344727, "global_step": 608304, "epoch": 7328} {"train_loss": -28.365814208984375, "global_step": 608305, "epoch": 7328} {"train_loss": -27.77083075190165, "global_step": 608306, "epoch": 7328, "val_loss": 6565458.0} {"train_loss": -27.065942764282227, "global_step": 608307, "epoch": 7329} {"train_loss": -27.712833404541016, "global_step": 608308, "epoch": 7329} {"train_loss": -27.53940773010254, "global_step": 608309, "epoch": 7329} {"train_loss": -27.45377540588379, "global_step": 608310, "epoch": 7329} {"train_loss": -27.464792251586914, "global_step": 608311, "epoch": 7329} {"train_loss": -26.544153213500977, "global_step": 608312, "epoch": 7329} {"train_loss": -27.547576904296875, "global_step": 608313, "epoch": 7329} {"train_loss": -27.860822677612305, "global_step": 608314, "epoch": 7329} {"train_loss": -27.5910587310791, "global_step": 608315, "epoch": 7329} {"train_loss": -26.907629013061523, "global_step": 608316, "epoch": 7329} {"train_loss": -27.541166305541992, "global_step": 608317, "epoch": 7329} {"train_loss": -27.332550048828125, "global_step": 608318, "epoch": 7329} {"train_loss": -27.60479736328125, "global_step": 608319, "epoch": 7329} {"train_loss": -27.65667724609375, "global_step": 608320, "epoch": 7329} {"train_loss": -27.319799423217773, "global_step": 608321, "epoch": 7329} {"train_loss": -27.551055908203125, "global_step": 608322, "epoch": 7329} {"train_loss": -28.25323486328125, "global_step": 608323, "epoch": 7329} {"train_loss": -28.01424217224121, "global_step": 608324, "epoch": 7329} {"train_loss": -27.72541618347168, "global_step": 608325, "epoch": 7329} {"train_loss": -27.828643798828125, "global_step": 608326, "epoch": 7329} {"train_loss": -27.825485229492188, "global_step": 608327, "epoch": 7329} {"train_loss": -28.245685577392578, "global_step": 608328, "epoch": 7329} {"train_loss": -28.034399032592773, "global_step": 608329, "epoch": 7329} {"train_loss": -27.641077041625977, "global_step": 608330, "epoch": 7329} {"train_loss": -28.04115104675293, "global_step": 608331, "epoch": 7329} {"train_loss": -27.653162002563477, "global_step": 608332, "epoch": 7329} {"train_loss": -27.95452880859375, "global_step": 608333, "epoch": 7329} {"train_loss": -27.926923751831055, "global_step": 608334, "epoch": 7329} {"train_loss": -27.945993423461914, "global_step": 608335, "epoch": 7329} {"train_loss": -28.209522247314453, "global_step": 608336, "epoch": 7329} {"train_loss": -27.808019638061523, "global_step": 608337, "epoch": 7329} {"train_loss": -28.268762588500977, "global_step": 608338, "epoch": 7329} {"train_loss": -28.203420639038086, "global_step": 608339, "epoch": 7329} {"train_loss": -28.35470962524414, "global_step": 608340, "epoch": 7329} {"train_loss": -28.14462661743164, "global_step": 608341, "epoch": 7329} {"train_loss": -28.588693618774414, "global_step": 608342, "epoch": 7329} {"train_loss": -27.94928550720215, "global_step": 608343, "epoch": 7329} {"train_loss": -28.517719268798828, "global_step": 608344, "epoch": 7329} {"train_loss": -28.404632568359375, "global_step": 608345, "epoch": 7329} {"train_loss": -28.7434024810791, "global_step": 608346, "epoch": 7329} {"train_loss": -28.196165084838867, "global_step": 608347, "epoch": 7329} {"train_loss": -28.067541122436523, "global_step": 608348, "epoch": 7329} {"train_loss": -27.670989990234375, "global_step": 608349, "epoch": 7329} {"train_loss": -27.515033721923828, "global_step": 608350, "epoch": 7329} {"train_loss": -27.612226486206055, "global_step": 608351, "epoch": 7329} {"train_loss": -28.15439224243164, "global_step": 608352, "epoch": 7329} {"train_loss": -28.213260650634766, "global_step": 608353, "epoch": 7329} {"train_loss": -28.345264434814453, "global_step": 608354, "epoch": 7329} {"train_loss": -28.066238403320312, "global_step": 608355, "epoch": 7329} {"train_loss": -28.396631240844727, "global_step": 608356, "epoch": 7329} {"train_loss": -28.263477325439453, "global_step": 608357, "epoch": 7329} {"train_loss": -28.578535079956055, "global_step": 608358, "epoch": 7329} {"train_loss": -27.96143913269043, "global_step": 608359, "epoch": 7329} {"train_loss": -28.150482177734375, "global_step": 608360, "epoch": 7329} {"train_loss": -28.029754638671875, "global_step": 608361, "epoch": 7329} {"train_loss": -28.305953979492188, "global_step": 608362, "epoch": 7329} {"train_loss": -28.0189151763916, "global_step": 608363, "epoch": 7329} {"train_loss": -28.093719482421875, "global_step": 608364, "epoch": 7329} {"train_loss": -27.743921279907227, "global_step": 608365, "epoch": 7329} {"train_loss": -27.985504150390625, "global_step": 608366, "epoch": 7329} {"train_loss": -27.939420700073242, "global_step": 608367, "epoch": 7329} {"train_loss": -28.53754997253418, "global_step": 608368, "epoch": 7329} {"train_loss": -27.809534072875977, "global_step": 608369, "epoch": 7329} {"train_loss": -28.23978614807129, "global_step": 608370, "epoch": 7329} {"train_loss": -28.632923126220703, "global_step": 608371, "epoch": 7329} {"train_loss": -28.48431396484375, "global_step": 608372, "epoch": 7329} {"train_loss": -28.067068099975586, "global_step": 608373, "epoch": 7329} {"train_loss": -28.442548751831055, "global_step": 608374, "epoch": 7329} {"train_loss": -28.037372589111328, "global_step": 608375, "epoch": 7329} {"train_loss": -27.94901466369629, "global_step": 608376, "epoch": 7329} {"train_loss": -28.37550163269043, "global_step": 608377, "epoch": 7329} {"train_loss": -28.2805118560791, "global_step": 608378, "epoch": 7329} {"train_loss": -27.736921310424805, "global_step": 608379, "epoch": 7329} {"train_loss": -27.685514450073242, "global_step": 608380, "epoch": 7329} {"train_loss": -28.51881217956543, "global_step": 608381, "epoch": 7329} {"train_loss": -28.001190185546875, "global_step": 608382, "epoch": 7329} {"train_loss": -28.002843856811523, "global_step": 608383, "epoch": 7329} {"train_loss": -27.868066787719727, "global_step": 608384, "epoch": 7329} {"train_loss": -27.5164794921875, "global_step": 608385, "epoch": 7329} {"train_loss": -27.584491729736328, "global_step": 608386, "epoch": 7329} {"train_loss": -27.884729385375977, "global_step": 608387, "epoch": 7329} {"train_loss": -27.80610466003418, "global_step": 608388, "epoch": 7329} {"train_loss": -27.956603176622504, "global_step": 608389, "epoch": 7329, "val_loss": 6559672.5} {"train_loss": -27.582401275634766, "global_step": 608390, "epoch": 7330} {"train_loss": -27.56036376953125, "global_step": 608391, "epoch": 7330} {"train_loss": -27.4913272857666, "global_step": 608392, "epoch": 7330} {"train_loss": -27.435516357421875, "global_step": 608393, "epoch": 7330} {"train_loss": -26.8819580078125, "global_step": 608394, "epoch": 7330} {"train_loss": -27.0201416015625, "global_step": 608395, "epoch": 7330} {"train_loss": -27.588397979736328, "global_step": 608396, "epoch": 7330} {"train_loss": -27.338642120361328, "global_step": 608397, "epoch": 7330} {"train_loss": -26.455785751342773, "global_step": 608398, "epoch": 7330} {"train_loss": -27.494531631469727, "global_step": 608399, "epoch": 7330} {"train_loss": -26.83148193359375, "global_step": 608400, "epoch": 7330} {"train_loss": -27.29474449157715, "global_step": 608401, "epoch": 7330} {"train_loss": -27.369220733642578, "global_step": 608402, "epoch": 7330} {"train_loss": -27.521032333374023, "global_step": 608403, "epoch": 7330} {"train_loss": -27.332733154296875, "global_step": 608404, "epoch": 7330} {"train_loss": -27.915952682495117, "global_step": 608405, "epoch": 7330} {"train_loss": -27.36835289001465, "global_step": 608406, "epoch": 7330} {"train_loss": -27.950571060180664, "global_step": 608407, "epoch": 7330} {"train_loss": -27.385284423828125, "global_step": 608408, "epoch": 7330} {"train_loss": -27.330646514892578, "global_step": 608409, "epoch": 7330} {"train_loss": -27.14484214782715, "global_step": 608410, "epoch": 7330} {"train_loss": -28.16956901550293, "global_step": 608411, "epoch": 7330} {"train_loss": -27.7553653717041, "global_step": 608412, "epoch": 7330} {"train_loss": -27.30429458618164, "global_step": 608413, "epoch": 7330} {"train_loss": -27.697851181030273, "global_step": 608414, "epoch": 7330} {"train_loss": -28.171010971069336, "global_step": 608415, "epoch": 7330} {"train_loss": -27.8735294342041, "global_step": 608416, "epoch": 7330} {"train_loss": -27.88654136657715, "global_step": 608417, "epoch": 7330} {"train_loss": -28.214324951171875, "global_step": 608418, "epoch": 7330} {"train_loss": -27.855321884155273, "global_step": 608419, "epoch": 7330} {"train_loss": -28.02814292907715, "global_step": 608420, "epoch": 7330} {"train_loss": -27.935766220092773, "global_step": 608421, "epoch": 7330} {"train_loss": -27.559228897094727, "global_step": 608422, "epoch": 7330} {"train_loss": -28.018400192260742, "global_step": 608423, "epoch": 7330} {"train_loss": -28.017480850219727, "global_step": 608424, "epoch": 7330} {"train_loss": -28.025182723999023, "global_step": 608425, "epoch": 7330} {"train_loss": -27.93482780456543, "global_step": 608426, "epoch": 7330} {"train_loss": -28.023786544799805, "global_step": 608427, "epoch": 7330} {"train_loss": -28.12101173400879, "global_step": 608428, "epoch": 7330} {"train_loss": -27.691205978393555, "global_step": 608429, "epoch": 7330} {"train_loss": -27.869543075561523, "global_step": 608430, "epoch": 7330} {"train_loss": -28.26222038269043, "global_step": 608431, "epoch": 7330} {"train_loss": -28.111541748046875, "global_step": 608432, "epoch": 7330} {"train_loss": -27.878992080688477, "global_step": 608433, "epoch": 7330} {"train_loss": -28.207563400268555, "global_step": 608434, "epoch": 7330} {"train_loss": -28.048904418945312, "global_step": 608435, "epoch": 7330} {"train_loss": -27.928983688354492, "global_step": 608436, "epoch": 7330} {"train_loss": -28.397668838500977, "global_step": 608437, "epoch": 7330} {"train_loss": -28.021581649780273, "global_step": 608438, "epoch": 7330} {"train_loss": -28.033157348632812, "global_step": 608439, "epoch": 7330} {"train_loss": -28.18257713317871, "global_step": 608440, "epoch": 7330} {"train_loss": -28.19645118713379, "global_step": 608441, "epoch": 7330} {"train_loss": -28.10428237915039, "global_step": 608442, "epoch": 7330} {"train_loss": -28.029321670532227, "global_step": 608443, "epoch": 7330} {"train_loss": -28.339277267456055, "global_step": 608444, "epoch": 7330} {"train_loss": -28.163476943969727, "global_step": 608445, "epoch": 7330} {"train_loss": -28.315826416015625, "global_step": 608446, "epoch": 7330} {"train_loss": -28.284902572631836, "global_step": 608447, "epoch": 7330} {"train_loss": -28.6553955078125, "global_step": 608448, "epoch": 7330} {"train_loss": -28.479278564453125, "global_step": 608449, "epoch": 7330} {"train_loss": -28.084583282470703, "global_step": 608450, "epoch": 7330} {"train_loss": -28.107877731323242, "global_step": 608451, "epoch": 7330} {"train_loss": -28.026498794555664, "global_step": 608452, "epoch": 7330} {"train_loss": -28.24299430847168, "global_step": 608453, "epoch": 7330} {"train_loss": -28.250137329101562, "global_step": 608454, "epoch": 7330} {"train_loss": -28.528812408447266, "global_step": 608455, "epoch": 7330} {"train_loss": -28.439184188842773, "global_step": 608456, "epoch": 7330} {"train_loss": -28.565082550048828, "global_step": 608457, "epoch": 7330} {"train_loss": -28.217761993408203, "global_step": 608458, "epoch": 7330} {"train_loss": -28.250274658203125, "global_step": 608459, "epoch": 7330} {"train_loss": -28.66781997680664, "global_step": 608460, "epoch": 7330} {"train_loss": -28.253284454345703, "global_step": 608461, "epoch": 7330} {"train_loss": -28.1738224029541, "global_step": 608462, "epoch": 7330} {"train_loss": -28.43896484375, "global_step": 608463, "epoch": 7330} {"train_loss": -28.072423934936523, "global_step": 608464, "epoch": 7330} {"train_loss": -28.345468521118164, "global_step": 608465, "epoch": 7330} {"train_loss": -28.34083366394043, "global_step": 608466, "epoch": 7330} {"train_loss": -28.6176815032959, "global_step": 608467, "epoch": 7330} {"train_loss": -28.46143913269043, "global_step": 608468, "epoch": 7330} {"train_loss": -28.444177627563477, "global_step": 608469, "epoch": 7330} {"train_loss": -28.278228759765625, "global_step": 608470, "epoch": 7330} {"train_loss": -28.13797378540039, "global_step": 608471, "epoch": 7330} {"train_loss": -27.933620774602314, "global_step": 608472, "epoch": 7330, "val_loss": 6562980.0} {"train_loss": -27.367517471313477, "global_step": 608473, "epoch": 7331} {"train_loss": -27.244653701782227, "global_step": 608474, "epoch": 7331} {"train_loss": -26.87421989440918, "global_step": 608475, "epoch": 7331} {"train_loss": -26.582244873046875, "global_step": 608476, "epoch": 7331} {"train_loss": -27.611221313476562, "global_step": 608477, "epoch": 7331} {"train_loss": -27.568689346313477, "global_step": 608478, "epoch": 7331} {"train_loss": -27.31385612487793, "global_step": 608479, "epoch": 7331} {"train_loss": -27.799463272094727, "global_step": 608480, "epoch": 7331} {"train_loss": -27.610706329345703, "global_step": 608481, "epoch": 7331} {"train_loss": -27.660947799682617, "global_step": 608482, "epoch": 7331} {"train_loss": -27.530475616455078, "global_step": 608483, "epoch": 7331} {"train_loss": -27.4124698638916, "global_step": 608484, "epoch": 7331} {"train_loss": -27.60700035095215, "global_step": 608485, "epoch": 7331} {"train_loss": -27.808231353759766, "global_step": 608486, "epoch": 7331} {"train_loss": -27.420440673828125, "global_step": 608487, "epoch": 7331} {"train_loss": -27.787317276000977, "global_step": 608488, "epoch": 7331} {"train_loss": -27.84723472595215, "global_step": 608489, "epoch": 7331} {"train_loss": -27.692880630493164, "global_step": 608490, "epoch": 7331} {"train_loss": -27.958349227905273, "global_step": 608491, "epoch": 7331} {"train_loss": -27.589441299438477, "global_step": 608492, "epoch": 7331} {"train_loss": -28.265661239624023, "global_step": 608493, "epoch": 7331} {"train_loss": -27.901092529296875, "global_step": 608494, "epoch": 7331} {"train_loss": -28.087656021118164, "global_step": 608495, "epoch": 7331} {"train_loss": -27.85725212097168, "global_step": 608496, "epoch": 7331} {"train_loss": -27.58056640625, "global_step": 608497, "epoch": 7331} {"train_loss": -27.898334503173828, "global_step": 608498, "epoch": 7331} {"train_loss": -27.929670333862305, "global_step": 608499, "epoch": 7331} {"train_loss": -28.344635009765625, "global_step": 608500, "epoch": 7331} {"train_loss": -28.35520362854004, "global_step": 608501, "epoch": 7331} {"train_loss": -28.21747398376465, "global_step": 608502, "epoch": 7331} {"train_loss": -28.12530517578125, "global_step": 608503, "epoch": 7331} {"train_loss": -28.1012020111084, "global_step": 608504, "epoch": 7331} {"train_loss": -28.429182052612305, "global_step": 608505, "epoch": 7331} {"train_loss": -28.266443252563477, "global_step": 608506, "epoch": 7331} {"train_loss": -28.313617706298828, "global_step": 608507, "epoch": 7331} {"train_loss": -28.263294219970703, "global_step": 608508, "epoch": 7331} {"train_loss": -27.975683212280273, "global_step": 608509, "epoch": 7331} {"train_loss": -28.06537437438965, "global_step": 608510, "epoch": 7331} {"train_loss": -28.428876876831055, "global_step": 608511, "epoch": 7331} {"train_loss": -28.368820190429688, "global_step": 608512, "epoch": 7331} {"train_loss": -28.324268341064453, "global_step": 608513, "epoch": 7331} {"train_loss": -28.001047134399414, "global_step": 608514, "epoch": 7331} {"train_loss": -28.406009674072266, "global_step": 608515, "epoch": 7331} {"train_loss": -28.052051544189453, "global_step": 608516, "epoch": 7331} {"train_loss": -28.355188369750977, "global_step": 608517, "epoch": 7331} {"train_loss": -28.078460693359375, "global_step": 608518, "epoch": 7331} {"train_loss": -28.03126335144043, "global_step": 608519, "epoch": 7331} {"train_loss": -28.314725875854492, "global_step": 608520, "epoch": 7331} {"train_loss": -28.137256622314453, "global_step": 608521, "epoch": 7331} {"train_loss": -28.333234786987305, "global_step": 608522, "epoch": 7331} {"train_loss": -28.165319442749023, "global_step": 608523, "epoch": 7331} {"train_loss": -27.878843307495117, "global_step": 608524, "epoch": 7331} {"train_loss": -28.183042526245117, "global_step": 608525, "epoch": 7331} {"train_loss": -28.24728775024414, "global_step": 608526, "epoch": 7331} {"train_loss": -28.49654197692871, "global_step": 608527, "epoch": 7331} {"train_loss": -28.280261993408203, "global_step": 608528, "epoch": 7331} {"train_loss": -28.129018783569336, "global_step": 608529, "epoch": 7331} {"train_loss": -28.39690589904785, "global_step": 608530, "epoch": 7331} {"train_loss": -27.772357940673828, "global_step": 608531, "epoch": 7331} {"train_loss": -27.84370994567871, "global_step": 608532, "epoch": 7331} {"train_loss": -27.5087947845459, "global_step": 608533, "epoch": 7331} {"train_loss": -27.951751708984375, "global_step": 608534, "epoch": 7331} {"train_loss": -28.294300079345703, "global_step": 608535, "epoch": 7331} {"train_loss": -28.350797653198242, "global_step": 608536, "epoch": 7331} {"train_loss": -27.81990623474121, "global_step": 608537, "epoch": 7331} {"train_loss": -28.32198143005371, "global_step": 608538, "epoch": 7331} {"train_loss": -28.22589111328125, "global_step": 608539, "epoch": 7331} {"train_loss": -27.924652099609375, "global_step": 608540, "epoch": 7331} {"train_loss": -28.333646774291992, "global_step": 608541, "epoch": 7331} {"train_loss": -27.74747657775879, "global_step": 608542, "epoch": 7331} {"train_loss": -27.825641632080078, "global_step": 608543, "epoch": 7331} {"train_loss": -27.66092872619629, "global_step": 608544, "epoch": 7331} {"train_loss": -27.89763832092285, "global_step": 608545, "epoch": 7331} {"train_loss": -28.241159439086914, "global_step": 608546, "epoch": 7331} {"train_loss": -27.747114181518555, "global_step": 608547, "epoch": 7331} {"train_loss": -28.312570571899414, "global_step": 608548, "epoch": 7331} {"train_loss": -28.15899085998535, "global_step": 608549, "epoch": 7331} {"train_loss": -27.590133666992188, "global_step": 608550, "epoch": 7331} {"train_loss": -28.095319747924805, "global_step": 608551, "epoch": 7331} {"train_loss": -27.823638916015625, "global_step": 608552, "epoch": 7331} {"train_loss": -28.15537452697754, "global_step": 608553, "epoch": 7331} {"train_loss": -28.301191329956055, "global_step": 608554, "epoch": 7331} {"train_loss": -27.977379373757238, "global_step": 608555, "epoch": 7331, "val_loss": 6519304.0} {"train_loss": -26.931547164916992, "global_step": 608556, "epoch": 7332} {"train_loss": -27.72132682800293, "global_step": 608557, "epoch": 7332} {"train_loss": -27.031513214111328, "global_step": 608558, "epoch": 7332} {"train_loss": -27.403905868530273, "global_step": 608559, "epoch": 7332} {"train_loss": -27.341766357421875, "global_step": 608560, "epoch": 7332} {"train_loss": -27.067310333251953, "global_step": 608561, "epoch": 7332} {"train_loss": -27.25565528869629, "global_step": 608562, "epoch": 7332} {"train_loss": -28.048450469970703, "global_step": 608563, "epoch": 7332} {"train_loss": -27.248239517211914, "global_step": 608564, "epoch": 7332} {"train_loss": -27.607940673828125, "global_step": 608565, "epoch": 7332} {"train_loss": -27.626794815063477, "global_step": 608566, "epoch": 7332} {"train_loss": -27.684402465820312, "global_step": 608567, "epoch": 7332} {"train_loss": -27.447118759155273, "global_step": 608568, "epoch": 7332} {"train_loss": -27.940900802612305, "global_step": 608569, "epoch": 7332} {"train_loss": -27.671232223510742, "global_step": 608570, "epoch": 7332} {"train_loss": -27.3393497467041, "global_step": 608571, "epoch": 7332} {"train_loss": -27.79355812072754, "global_step": 608572, "epoch": 7332} {"train_loss": -27.70562744140625, "global_step": 608573, "epoch": 7332} {"train_loss": -28.02144432067871, "global_step": 608574, "epoch": 7332} {"train_loss": -27.82874870300293, "global_step": 608575, "epoch": 7332} {"train_loss": -27.6646671295166, "global_step": 608576, "epoch": 7332} {"train_loss": -27.633581161499023, "global_step": 608577, "epoch": 7332} {"train_loss": -27.771331787109375, "global_step": 608578, "epoch": 7332} {"train_loss": -27.990018844604492, "global_step": 608579, "epoch": 7332} {"train_loss": -27.67049217224121, "global_step": 608580, "epoch": 7332} {"train_loss": -28.070636749267578, "global_step": 608581, "epoch": 7332} {"train_loss": -28.213623046875, "global_step": 608582, "epoch": 7332} {"train_loss": -28.027740478515625, "global_step": 608583, "epoch": 7332} {"train_loss": -28.1799259185791, "global_step": 608584, "epoch": 7332} {"train_loss": -27.90045738220215, "global_step": 608585, "epoch": 7332} {"train_loss": -28.034948348999023, "global_step": 608586, "epoch": 7332} {"train_loss": -28.300006866455078, "global_step": 608587, "epoch": 7332} {"train_loss": -28.40375328063965, "global_step": 608588, "epoch": 7332} {"train_loss": -27.912626266479492, "global_step": 608589, "epoch": 7332} {"train_loss": -28.39534568786621, "global_step": 608590, "epoch": 7332} {"train_loss": -28.129779815673828, "global_step": 608591, "epoch": 7332} {"train_loss": -28.094202041625977, "global_step": 608592, "epoch": 7332} {"train_loss": -28.24188804626465, "global_step": 608593, "epoch": 7332} {"train_loss": -27.975637435913086, "global_step": 608594, "epoch": 7332} {"train_loss": -27.6602840423584, "global_step": 608595, "epoch": 7332} {"train_loss": -27.73349952697754, "global_step": 608596, "epoch": 7332} {"train_loss": -27.923206329345703, "global_step": 608597, "epoch": 7332} {"train_loss": -27.661584854125977, "global_step": 608598, "epoch": 7332} {"train_loss": -28.397851943969727, "global_step": 608599, "epoch": 7332} {"train_loss": -27.80543327331543, "global_step": 608600, "epoch": 7332} {"train_loss": -27.387344360351562, "global_step": 608601, "epoch": 7332} {"train_loss": -27.705175399780273, "global_step": 608602, "epoch": 7332} {"train_loss": -28.051742553710938, "global_step": 608603, "epoch": 7332} {"train_loss": -28.7368221282959, "global_step": 608604, "epoch": 7332} {"train_loss": -28.367767333984375, "global_step": 608605, "epoch": 7332} {"train_loss": -28.09107780456543, "global_step": 608606, "epoch": 7332} {"train_loss": -28.232446670532227, "global_step": 608607, "epoch": 7332} {"train_loss": -27.953144073486328, "global_step": 608608, "epoch": 7332} {"train_loss": -28.425220489501953, "global_step": 608609, "epoch": 7332} {"train_loss": -28.095483779907227, "global_step": 608610, "epoch": 7332} {"train_loss": -28.214231491088867, "global_step": 608611, "epoch": 7332} {"train_loss": -28.44013786315918, "global_step": 608612, "epoch": 7332} {"train_loss": -28.12200355529785, "global_step": 608613, "epoch": 7332} {"train_loss": -28.208377838134766, "global_step": 608614, "epoch": 7332} {"train_loss": -28.33544921875, "global_step": 608615, "epoch": 7332} {"train_loss": -28.554046630859375, "global_step": 608616, "epoch": 7332} {"train_loss": -28.283933639526367, "global_step": 608617, "epoch": 7332} {"train_loss": -28.148595809936523, "global_step": 608618, "epoch": 7332} {"train_loss": -28.2043514251709, "global_step": 608619, "epoch": 7332} {"train_loss": -28.29102897644043, "global_step": 608620, "epoch": 7332} {"train_loss": -28.061071395874023, "global_step": 608621, "epoch": 7332} {"train_loss": -27.929895401000977, "global_step": 608622, "epoch": 7332} {"train_loss": -28.021209716796875, "global_step": 608623, "epoch": 7332} {"train_loss": -28.312116622924805, "global_step": 608624, "epoch": 7332} {"train_loss": -28.122995376586914, "global_step": 608625, "epoch": 7332} {"train_loss": -28.04578971862793, "global_step": 608626, "epoch": 7332} {"train_loss": -28.05747413635254, "global_step": 608627, "epoch": 7332} {"train_loss": -27.86391258239746, "global_step": 608628, "epoch": 7332} {"train_loss": -27.744409561157227, "global_step": 608629, "epoch": 7332} {"train_loss": -28.072193145751953, "global_step": 608630, "epoch": 7332} {"train_loss": -27.844898223876953, "global_step": 608631, "epoch": 7332} {"train_loss": -28.260709762573242, "global_step": 608632, "epoch": 7332} {"train_loss": -28.220991134643555, "global_step": 608633, "epoch": 7332} {"train_loss": -28.240325927734375, "global_step": 608634, "epoch": 7332} {"train_loss": -27.770782470703125, "global_step": 608635, "epoch": 7332} {"train_loss": -28.090707778930664, "global_step": 608636, "epoch": 7332} {"train_loss": -27.746763229370117, "global_step": 608637, "epoch": 7332} {"train_loss": -27.93800749261695, "global_step": 608638, "epoch": 7332, "val_loss": 6563148.5} {"train_loss": -27.49482536315918, "global_step": 608639, "epoch": 7333} {"train_loss": -27.45914077758789, "global_step": 608640, "epoch": 7333} {"train_loss": -28.050128936767578, "global_step": 608641, "epoch": 7333} {"train_loss": -27.19228172302246, "global_step": 608642, "epoch": 7333} {"train_loss": -27.165618896484375, "global_step": 608643, "epoch": 7333} {"train_loss": -27.711374282836914, "global_step": 608644, "epoch": 7333} {"train_loss": -27.506147384643555, "global_step": 608645, "epoch": 7333} {"train_loss": -27.312910079956055, "global_step": 608646, "epoch": 7333} {"train_loss": -27.682296752929688, "global_step": 608647, "epoch": 7333} {"train_loss": -27.3454532623291, "global_step": 608648, "epoch": 7333} {"train_loss": -27.752683639526367, "global_step": 608649, "epoch": 7333} {"train_loss": -27.491565704345703, "global_step": 608650, "epoch": 7333} {"train_loss": -27.470300674438477, "global_step": 608651, "epoch": 7333} {"train_loss": -27.757410049438477, "global_step": 608652, "epoch": 7333} {"train_loss": -27.654190063476562, "global_step": 608653, "epoch": 7333} {"train_loss": -27.590742111206055, "global_step": 608654, "epoch": 7333} {"train_loss": -27.895938873291016, "global_step": 608655, "epoch": 7333} {"train_loss": -28.2242374420166, "global_step": 608656, "epoch": 7333} {"train_loss": -27.78657341003418, "global_step": 608657, "epoch": 7333} {"train_loss": -27.980850219726562, "global_step": 608658, "epoch": 7333} {"train_loss": -28.120208740234375, "global_step": 608659, "epoch": 7333} {"train_loss": -27.434955596923828, "global_step": 608660, "epoch": 7333} {"train_loss": -27.899993896484375, "global_step": 608661, "epoch": 7333} {"train_loss": -27.66739273071289, "global_step": 608662, "epoch": 7333} {"train_loss": -27.872053146362305, "global_step": 608663, "epoch": 7333} {"train_loss": -28.151865005493164, "global_step": 608664, "epoch": 7333} {"train_loss": -27.93695068359375, "global_step": 608665, "epoch": 7333} {"train_loss": -28.0862979888916, "global_step": 608666, "epoch": 7333} {"train_loss": -27.94233512878418, "global_step": 608667, "epoch": 7333} {"train_loss": -27.715295791625977, "global_step": 608668, "epoch": 7333} {"train_loss": -28.19083595275879, "global_step": 608669, "epoch": 7333} {"train_loss": -28.004262924194336, "global_step": 608670, "epoch": 7333} {"train_loss": -27.9289493560791, "global_step": 608671, "epoch": 7333} {"train_loss": -28.158803939819336, "global_step": 608672, "epoch": 7333} {"train_loss": -27.983572006225586, "global_step": 608673, "epoch": 7333} {"train_loss": -28.433027267456055, "global_step": 608674, "epoch": 7333} {"train_loss": -28.312307357788086, "global_step": 608675, "epoch": 7333} {"train_loss": -28.056440353393555, "global_step": 608676, "epoch": 7333} {"train_loss": -28.276901245117188, "global_step": 608677, "epoch": 7333} {"train_loss": -28.268423080444336, "global_step": 608678, "epoch": 7333} {"train_loss": -28.0771541595459, "global_step": 608679, "epoch": 7333} {"train_loss": -28.361291885375977, "global_step": 608680, "epoch": 7333} {"train_loss": -28.50618553161621, "global_step": 608681, "epoch": 7333} {"train_loss": -28.077198028564453, "global_step": 608682, "epoch": 7333} {"train_loss": -28.2817440032959, "global_step": 608683, "epoch": 7333} {"train_loss": -28.5086669921875, "global_step": 608684, "epoch": 7333} {"train_loss": -28.43692398071289, "global_step": 608685, "epoch": 7333} {"train_loss": -28.41241455078125, "global_step": 608686, "epoch": 7333} {"train_loss": -28.375471115112305, "global_step": 608687, "epoch": 7333} {"train_loss": -28.1335506439209, "global_step": 608688, "epoch": 7333} {"train_loss": -28.244449615478516, "global_step": 608689, "epoch": 7333} {"train_loss": -28.329736709594727, "global_step": 608690, "epoch": 7333} {"train_loss": -28.498258590698242, "global_step": 608691, "epoch": 7333} {"train_loss": -27.881635665893555, "global_step": 608692, "epoch": 7333} {"train_loss": -28.349634170532227, "global_step": 608693, "epoch": 7333} {"train_loss": -27.93446159362793, "global_step": 608694, "epoch": 7333} {"train_loss": -27.47535514831543, "global_step": 608695, "epoch": 7333} {"train_loss": -28.103546142578125, "global_step": 608696, "epoch": 7333} {"train_loss": -27.938495635986328, "global_step": 608697, "epoch": 7333} {"train_loss": -27.818628311157227, "global_step": 608698, "epoch": 7333} {"train_loss": -27.603412628173828, "global_step": 608699, "epoch": 7333} {"train_loss": -27.31991958618164, "global_step": 608700, "epoch": 7333} {"train_loss": -27.742979049682617, "global_step": 608701, "epoch": 7333} {"train_loss": -27.930988311767578, "global_step": 608702, "epoch": 7333} {"train_loss": -28.047760009765625, "global_step": 608703, "epoch": 7333} {"train_loss": -28.42921257019043, "global_step": 608704, "epoch": 7333} {"train_loss": -28.008987426757812, "global_step": 608705, "epoch": 7333} {"train_loss": -27.736804962158203, "global_step": 608706, "epoch": 7333} {"train_loss": -28.1234073638916, "global_step": 608707, "epoch": 7333} {"train_loss": -28.281309127807617, "global_step": 608708, "epoch": 7333} {"train_loss": -27.98578453063965, "global_step": 608709, "epoch": 7333} {"train_loss": -28.464033126831055, "global_step": 608710, "epoch": 7333} {"train_loss": -28.178180694580078, "global_step": 608711, "epoch": 7333} {"train_loss": -27.893156051635742, "global_step": 608712, "epoch": 7333} {"train_loss": -28.0341739654541, "global_step": 608713, "epoch": 7333} {"train_loss": -28.29390525817871, "global_step": 608714, "epoch": 7333} {"train_loss": -28.180723190307617, "global_step": 608715, "epoch": 7333} {"train_loss": -27.99824333190918, "global_step": 608716, "epoch": 7333} {"train_loss": -28.149381637573242, "global_step": 608717, "epoch": 7333} {"train_loss": -28.1157169342041, "global_step": 608718, "epoch": 7333} {"train_loss": -28.428930282592773, "global_step": 608719, "epoch": 7333} {"train_loss": -28.27727699279785, "global_step": 608720, "epoch": 7333} {"train_loss": -27.97950942257801, "global_step": 608721, "epoch": 7333, "val_loss": 6571360.0} {"train_loss": -27.77617835998535, "global_step": 608722, "epoch": 7334} {"train_loss": -27.811283111572266, "global_step": 608723, "epoch": 7334} {"train_loss": -27.886083602905273, "global_step": 608724, "epoch": 7334} {"train_loss": -28.10679054260254, "global_step": 608725, "epoch": 7334} {"train_loss": -28.204519271850586, "global_step": 608726, "epoch": 7334} {"train_loss": -27.973602294921875, "global_step": 608727, "epoch": 7334} {"train_loss": -27.8114070892334, "global_step": 608728, "epoch": 7334} {"train_loss": -27.6778621673584, "global_step": 608729, "epoch": 7334} {"train_loss": -27.7518310546875, "global_step": 608730, "epoch": 7334} {"train_loss": -27.776931762695312, "global_step": 608731, "epoch": 7334} {"train_loss": -27.918201446533203, "global_step": 608732, "epoch": 7334} {"train_loss": -27.206274032592773, "global_step": 608733, "epoch": 7334} {"train_loss": -27.411115646362305, "global_step": 608734, "epoch": 7334} {"train_loss": -27.66541862487793, "global_step": 608735, "epoch": 7334} {"train_loss": -28.22467041015625, "global_step": 608736, "epoch": 7334} {"train_loss": -27.699329376220703, "global_step": 608737, "epoch": 7334} {"train_loss": -27.88909339904785, "global_step": 608738, "epoch": 7334} {"train_loss": -27.45136070251465, "global_step": 608739, "epoch": 7334} {"train_loss": -27.784101486206055, "global_step": 608740, "epoch": 7334} {"train_loss": -28.180500030517578, "global_step": 608741, "epoch": 7334} {"train_loss": -27.6674747467041, "global_step": 608742, "epoch": 7334} {"train_loss": -27.873703002929688, "global_step": 608743, "epoch": 7334} {"train_loss": -27.995702743530273, "global_step": 608744, "epoch": 7334} {"train_loss": -27.60934829711914, "global_step": 608745, "epoch": 7334} {"train_loss": -27.92325782775879, "global_step": 608746, "epoch": 7334} {"train_loss": -27.9588565826416, "global_step": 608747, "epoch": 7334} {"train_loss": -28.254871368408203, "global_step": 608748, "epoch": 7334} {"train_loss": -27.880359649658203, "global_step": 608749, "epoch": 7334} {"train_loss": -28.339670181274414, "global_step": 608750, "epoch": 7334} {"train_loss": -28.402685165405273, "global_step": 608751, "epoch": 7334} {"train_loss": -27.808507919311523, "global_step": 608752, "epoch": 7334} {"train_loss": -28.0236759185791, "global_step": 608753, "epoch": 7334} {"train_loss": -27.97759437561035, "global_step": 608754, "epoch": 7334} {"train_loss": -27.879425048828125, "global_step": 608755, "epoch": 7334} {"train_loss": -28.184955596923828, "global_step": 608756, "epoch": 7334} {"train_loss": -28.158782958984375, "global_step": 608757, "epoch": 7334} {"train_loss": -27.793670654296875, "global_step": 608758, "epoch": 7334} {"train_loss": -27.928007125854492, "global_step": 608759, "epoch": 7334} {"train_loss": -27.892120361328125, "global_step": 608760, "epoch": 7334} {"train_loss": -28.302377700805664, "global_step": 608761, "epoch": 7334} {"train_loss": -28.274946212768555, "global_step": 608762, "epoch": 7334} {"train_loss": -27.609695434570312, "global_step": 608763, "epoch": 7334} {"train_loss": -27.488788604736328, "global_step": 608764, "epoch": 7334} {"train_loss": -27.095190048217773, "global_step": 608765, "epoch": 7334} {"train_loss": -27.567060470581055, "global_step": 608766, "epoch": 7334} {"train_loss": -28.14143943786621, "global_step": 608767, "epoch": 7334} {"train_loss": -28.355148315429688, "global_step": 608768, "epoch": 7334} {"train_loss": -28.525049209594727, "global_step": 608769, "epoch": 7334} {"train_loss": -28.18959617614746, "global_step": 608770, "epoch": 7334} {"train_loss": -27.929845809936523, "global_step": 608771, "epoch": 7334} {"train_loss": -28.097333908081055, "global_step": 608772, "epoch": 7334} {"train_loss": -28.308170318603516, "global_step": 608773, "epoch": 7334} {"train_loss": -28.278583526611328, "global_step": 608774, "epoch": 7334} {"train_loss": -28.221708297729492, "global_step": 608775, "epoch": 7334} {"train_loss": -28.322912216186523, "global_step": 608776, "epoch": 7334} {"train_loss": -28.18402671813965, "global_step": 608777, "epoch": 7334} {"train_loss": -28.0242919921875, "global_step": 608778, "epoch": 7334} {"train_loss": -28.27387046813965, "global_step": 608779, "epoch": 7334} {"train_loss": -27.9079647064209, "global_step": 608780, "epoch": 7334} {"train_loss": -27.938892364501953, "global_step": 608781, "epoch": 7334} {"train_loss": -28.247751235961914, "global_step": 608782, "epoch": 7334} {"train_loss": -28.52045249938965, "global_step": 608783, "epoch": 7334} {"train_loss": -28.183908462524414, "global_step": 608784, "epoch": 7334} {"train_loss": -28.4622802734375, "global_step": 608785, "epoch": 7334} {"train_loss": -28.199777603149414, "global_step": 608786, "epoch": 7334} {"train_loss": -28.228662490844727, "global_step": 608787, "epoch": 7334} {"train_loss": -28.1728572845459, "global_step": 608788, "epoch": 7334} {"train_loss": -28.271127700805664, "global_step": 608789, "epoch": 7334} {"train_loss": -28.217853546142578, "global_step": 608790, "epoch": 7334} {"train_loss": -28.100997924804688, "global_step": 608791, "epoch": 7334} {"train_loss": -28.028385162353516, "global_step": 608792, "epoch": 7334} {"train_loss": -27.897705078125, "global_step": 608793, "epoch": 7334} {"train_loss": -28.254535675048828, "global_step": 608794, "epoch": 7334} {"train_loss": -28.259784698486328, "global_step": 608795, "epoch": 7334} {"train_loss": -28.050506591796875, "global_step": 608796, "epoch": 7334} {"train_loss": -28.04262351989746, "global_step": 608797, "epoch": 7334} {"train_loss": -28.33233642578125, "global_step": 608798, "epoch": 7334} {"train_loss": -28.106225967407227, "global_step": 608799, "epoch": 7334} {"train_loss": -28.15631675720215, "global_step": 608800, "epoch": 7334} {"train_loss": -28.24724769592285, "global_step": 608801, "epoch": 7334} {"train_loss": -28.164703369140625, "global_step": 608802, "epoch": 7334} {"train_loss": -28.13252067565918, "global_step": 608803, "epoch": 7334} {"train_loss": -28.010827719447125, "global_step": 608804, "epoch": 7334, "val_loss": 6499860.0} {"train_loss": -25.969297409057617, "global_step": 608805, "epoch": 7335} {"train_loss": -25.57404136657715, "global_step": 608806, "epoch": 7335} {"train_loss": -27.3859806060791, "global_step": 608807, "epoch": 7335} {"train_loss": -25.93195152282715, "global_step": 608808, "epoch": 7335} {"train_loss": -26.606781005859375, "global_step": 608809, "epoch": 7335} {"train_loss": -27.429229736328125, "global_step": 608810, "epoch": 7335} {"train_loss": -27.127721786499023, "global_step": 608811, "epoch": 7335} {"train_loss": -27.574499130249023, "global_step": 608812, "epoch": 7335} {"train_loss": -27.777074813842773, "global_step": 608813, "epoch": 7335} {"train_loss": -27.507465362548828, "global_step": 608814, "epoch": 7335} {"train_loss": -27.61017417907715, "global_step": 608815, "epoch": 7335} {"train_loss": -27.78940200805664, "global_step": 608816, "epoch": 7335} {"train_loss": -27.721593856811523, "global_step": 608817, "epoch": 7335} {"train_loss": -27.876169204711914, "global_step": 608818, "epoch": 7335} {"train_loss": -27.197906494140625, "global_step": 608819, "epoch": 7335} {"train_loss": -27.7723445892334, "global_step": 608820, "epoch": 7335} {"train_loss": -27.756757736206055, "global_step": 608821, "epoch": 7335} {"train_loss": -27.5029239654541, "global_step": 608822, "epoch": 7335} {"train_loss": -27.904727935791016, "global_step": 608823, "epoch": 7335} {"train_loss": -27.72068214416504, "global_step": 608824, "epoch": 7335} {"train_loss": -28.072803497314453, "global_step": 608825, "epoch": 7335} {"train_loss": -28.009244918823242, "global_step": 608826, "epoch": 7335} {"train_loss": -28.02069091796875, "global_step": 608827, "epoch": 7335} {"train_loss": -27.8474178314209, "global_step": 608828, "epoch": 7335} {"train_loss": -27.899982452392578, "global_step": 608829, "epoch": 7335} {"train_loss": -27.9671573638916, "global_step": 608830, "epoch": 7335} {"train_loss": -27.636465072631836, "global_step": 608831, "epoch": 7335} {"train_loss": -27.99370765686035, "global_step": 608832, "epoch": 7335} {"train_loss": -27.997953414916992, "global_step": 608833, "epoch": 7335} {"train_loss": -28.064016342163086, "global_step": 608834, "epoch": 7335} {"train_loss": -28.154272079467773, "global_step": 608835, "epoch": 7335} {"train_loss": -28.273874282836914, "global_step": 608836, "epoch": 7335} {"train_loss": -28.01263427734375, "global_step": 608837, "epoch": 7335} {"train_loss": -27.830434799194336, "global_step": 608838, "epoch": 7335} {"train_loss": -27.974048614501953, "global_step": 608839, "epoch": 7335} {"train_loss": -28.11594581604004, "global_step": 608840, "epoch": 7335} {"train_loss": -27.94526481628418, "global_step": 608841, "epoch": 7335} {"train_loss": -27.920230865478516, "global_step": 608842, "epoch": 7335} {"train_loss": -28.392780303955078, "global_step": 608843, "epoch": 7335} {"train_loss": -28.331817626953125, "global_step": 608844, "epoch": 7335} {"train_loss": -28.143796920776367, "global_step": 608845, "epoch": 7335} {"train_loss": -28.212976455688477, "global_step": 608846, "epoch": 7335} {"train_loss": -27.8963680267334, "global_step": 608847, "epoch": 7335} {"train_loss": -28.318134307861328, "global_step": 608848, "epoch": 7335} {"train_loss": -28.172012329101562, "global_step": 608849, "epoch": 7335} {"train_loss": -28.151447296142578, "global_step": 608850, "epoch": 7335} {"train_loss": -28.092548370361328, "global_step": 608851, "epoch": 7335} {"train_loss": -27.969846725463867, "global_step": 608852, "epoch": 7335} {"train_loss": -28.230634689331055, "global_step": 608853, "epoch": 7335} {"train_loss": -28.448047637939453, "global_step": 608854, "epoch": 7335} {"train_loss": -28.23639488220215, "global_step": 608855, "epoch": 7335} {"train_loss": -28.23086929321289, "global_step": 608856, "epoch": 7335} {"train_loss": -28.238317489624023, "global_step": 608857, "epoch": 7335} {"train_loss": -28.557220458984375, "global_step": 608858, "epoch": 7335} {"train_loss": -28.542287826538086, "global_step": 608859, "epoch": 7335} {"train_loss": -28.116281509399414, "global_step": 608860, "epoch": 7335} {"train_loss": -27.980188369750977, "global_step": 608861, "epoch": 7335} {"train_loss": -28.2432861328125, "global_step": 608862, "epoch": 7335} {"train_loss": -27.909912109375, "global_step": 608863, "epoch": 7335} {"train_loss": -28.249670028686523, "global_step": 608864, "epoch": 7335} {"train_loss": -28.115880966186523, "global_step": 608865, "epoch": 7335} {"train_loss": -28.26551628112793, "global_step": 608866, "epoch": 7335} {"train_loss": -28.639760971069336, "global_step": 608867, "epoch": 7335} {"train_loss": -28.42842674255371, "global_step": 608868, "epoch": 7335} {"train_loss": -27.538959503173828, "global_step": 608869, "epoch": 7335} {"train_loss": -28.134687423706055, "global_step": 608870, "epoch": 7335} {"train_loss": -28.35645866394043, "global_step": 608871, "epoch": 7335} {"train_loss": -28.214963912963867, "global_step": 608872, "epoch": 7335} {"train_loss": -28.30282974243164, "global_step": 608873, "epoch": 7335} {"train_loss": -27.972869873046875, "global_step": 608874, "epoch": 7335} {"train_loss": -28.09002113342285, "global_step": 608875, "epoch": 7335} {"train_loss": -28.93110466003418, "global_step": 608876, "epoch": 7335} {"train_loss": -28.132617950439453, "global_step": 608877, "epoch": 7335} {"train_loss": -28.057880401611328, "global_step": 608878, "epoch": 7335} {"train_loss": -28.1823787689209, "global_step": 608879, "epoch": 7335} {"train_loss": -28.19940757751465, "global_step": 608880, "epoch": 7335} {"train_loss": -28.09392738342285, "global_step": 608881, "epoch": 7335} {"train_loss": -28.0673828125, "global_step": 608882, "epoch": 7335} {"train_loss": -28.041616439819336, "global_step": 608883, "epoch": 7335} {"train_loss": -27.288862228393555, "global_step": 608884, "epoch": 7335} {"train_loss": -26.214319229125977, "global_step": 608885, "epoch": 7335} {"train_loss": -25.6994571685791, "global_step": 608886, "epoch": 7335} {"train_loss": -27.866876211511084, "global_step": 608887, "epoch": 7335, "val_loss": 6548683.0} {"train_loss": -26.032033920288086, "global_step": 608888, "epoch": 7336} {"train_loss": -25.639310836791992, "global_step": 608889, "epoch": 7336} {"train_loss": -26.708484649658203, "global_step": 608890, "epoch": 7336} {"train_loss": -25.23667335510254, "global_step": 608891, "epoch": 7336} {"train_loss": -26.9182186126709, "global_step": 608892, "epoch": 7336} {"train_loss": -26.910999298095703, "global_step": 608893, "epoch": 7336} {"train_loss": -27.273054122924805, "global_step": 608894, "epoch": 7336} {"train_loss": -26.835607528686523, "global_step": 608895, "epoch": 7336} {"train_loss": -27.099390029907227, "global_step": 608896, "epoch": 7336} {"train_loss": -26.792224884033203, "global_step": 608897, "epoch": 7336} {"train_loss": -26.955341339111328, "global_step": 608898, "epoch": 7336} {"train_loss": -27.127721786499023, "global_step": 608899, "epoch": 7336} {"train_loss": -27.523303985595703, "global_step": 608900, "epoch": 7336} {"train_loss": -26.966962814331055, "global_step": 608901, "epoch": 7336} {"train_loss": -27.226654052734375, "global_step": 608902, "epoch": 7336} {"train_loss": -27.3751163482666, "global_step": 608903, "epoch": 7336} {"train_loss": -27.815570831298828, "global_step": 608904, "epoch": 7336} {"train_loss": -27.664648056030273, "global_step": 608905, "epoch": 7336} {"train_loss": -27.18379020690918, "global_step": 608906, "epoch": 7336} {"train_loss": -27.207290649414062, "global_step": 608907, "epoch": 7336} {"train_loss": -27.395965576171875, "global_step": 608908, "epoch": 7336} {"train_loss": -27.834203720092773, "global_step": 608909, "epoch": 7336} {"train_loss": -27.45883560180664, "global_step": 608910, "epoch": 7336} {"train_loss": -27.599767684936523, "global_step": 608911, "epoch": 7336} {"train_loss": -27.78339958190918, "global_step": 608912, "epoch": 7336} {"train_loss": -27.825607299804688, "global_step": 608913, "epoch": 7336} {"train_loss": -27.96304702758789, "global_step": 608914, "epoch": 7336} {"train_loss": -27.74420166015625, "global_step": 608915, "epoch": 7336} {"train_loss": -27.586505889892578, "global_step": 608916, "epoch": 7336} {"train_loss": -27.893341064453125, "global_step": 608917, "epoch": 7336} {"train_loss": -28.120935440063477, "global_step": 608918, "epoch": 7336} {"train_loss": -27.66745948791504, "global_step": 608919, "epoch": 7336} {"train_loss": -28.08806800842285, "global_step": 608920, "epoch": 7336} {"train_loss": -28.0517520904541, "global_step": 608921, "epoch": 7336} {"train_loss": -27.663593292236328, "global_step": 608922, "epoch": 7336} {"train_loss": -28.117969512939453, "global_step": 608923, "epoch": 7336} {"train_loss": -27.547077178955078, "global_step": 608924, "epoch": 7336} {"train_loss": -27.986326217651367, "global_step": 608925, "epoch": 7336} {"train_loss": -27.624958038330078, "global_step": 608926, "epoch": 7336} {"train_loss": -27.660329818725586, "global_step": 608927, "epoch": 7336} {"train_loss": -27.98944664001465, "global_step": 608928, "epoch": 7336} {"train_loss": -28.256189346313477, "global_step": 608929, "epoch": 7336} {"train_loss": -27.743417739868164, "global_step": 608930, "epoch": 7336} {"train_loss": -27.93585777282715, "global_step": 608931, "epoch": 7336} {"train_loss": -28.16200065612793, "global_step": 608932, "epoch": 7336} {"train_loss": -28.022336959838867, "global_step": 608933, "epoch": 7336} {"train_loss": -28.08760643005371, "global_step": 608934, "epoch": 7336} {"train_loss": -28.155866622924805, "global_step": 608935, "epoch": 7336} {"train_loss": -27.884923934936523, "global_step": 608936, "epoch": 7336} {"train_loss": -27.992944717407227, "global_step": 608937, "epoch": 7336} {"train_loss": -27.975025177001953, "global_step": 608938, "epoch": 7336} {"train_loss": -28.020904541015625, "global_step": 608939, "epoch": 7336} {"train_loss": -28.291446685791016, "global_step": 608940, "epoch": 7336} {"train_loss": -27.795928955078125, "global_step": 608941, "epoch": 7336} {"train_loss": -28.2916259765625, "global_step": 608942, "epoch": 7336} {"train_loss": -28.171804428100586, "global_step": 608943, "epoch": 7336} {"train_loss": -28.059934616088867, "global_step": 608944, "epoch": 7336} {"train_loss": -27.984418869018555, "global_step": 608945, "epoch": 7336} {"train_loss": -27.937231063842773, "global_step": 608946, "epoch": 7336} {"train_loss": -28.127567291259766, "global_step": 608947, "epoch": 7336} {"train_loss": -28.214406967163086, "global_step": 608948, "epoch": 7336} {"train_loss": -28.160669326782227, "global_step": 608949, "epoch": 7336} {"train_loss": -28.279626846313477, "global_step": 608950, "epoch": 7336} {"train_loss": -28.45014762878418, "global_step": 608951, "epoch": 7336} {"train_loss": -28.2846736907959, "global_step": 608952, "epoch": 7336} {"train_loss": -28.285572052001953, "global_step": 608953, "epoch": 7336} {"train_loss": -27.84769630432129, "global_step": 608954, "epoch": 7336} {"train_loss": -28.080419540405273, "global_step": 608955, "epoch": 7336} {"train_loss": -28.295202255249023, "global_step": 608956, "epoch": 7336} {"train_loss": -28.032550811767578, "global_step": 608957, "epoch": 7336} {"train_loss": -27.69675064086914, "global_step": 608958, "epoch": 7336} {"train_loss": -28.589111328125, "global_step": 608959, "epoch": 7336} {"train_loss": -28.213647842407227, "global_step": 608960, "epoch": 7336} {"train_loss": -28.1774959564209, "global_step": 608961, "epoch": 7336} {"train_loss": -28.08363914489746, "global_step": 608962, "epoch": 7336} {"train_loss": -28.315765380859375, "global_step": 608963, "epoch": 7336} {"train_loss": -28.279727935791016, "global_step": 608964, "epoch": 7336} {"train_loss": -28.129730224609375, "global_step": 608965, "epoch": 7336} {"train_loss": -28.414688110351562, "global_step": 608966, "epoch": 7336} {"train_loss": -28.139123916625977, "global_step": 608967, "epoch": 7336} {"train_loss": -28.085065841674805, "global_step": 608968, "epoch": 7336} {"train_loss": -28.112775802612305, "global_step": 608969, "epoch": 7336} {"train_loss": -27.752780270863727, "global_step": 608970, "epoch": 7336, "val_loss": 6596602.0} {"train_loss": -28.009103775024414, "global_step": 608971, "epoch": 7337} {"train_loss": -27.9963436126709, "global_step": 608972, "epoch": 7337} {"train_loss": -27.70118522644043, "global_step": 608973, "epoch": 7337} {"train_loss": -28.037174224853516, "global_step": 608974, "epoch": 7337} {"train_loss": -27.886754989624023, "global_step": 608975, "epoch": 7337} {"train_loss": -27.652973175048828, "global_step": 608976, "epoch": 7337} {"train_loss": -27.995325088500977, "global_step": 608977, "epoch": 7337} {"train_loss": -27.495405197143555, "global_step": 608978, "epoch": 7337} {"train_loss": -28.053714752197266, "global_step": 608979, "epoch": 7337} {"train_loss": -27.473352432250977, "global_step": 608980, "epoch": 7337} {"train_loss": -27.739948272705078, "global_step": 608981, "epoch": 7337} {"train_loss": -28.09781265258789, "global_step": 608982, "epoch": 7337} {"train_loss": -28.14400291442871, "global_step": 608983, "epoch": 7337} {"train_loss": -27.84762954711914, "global_step": 608984, "epoch": 7337} {"train_loss": -27.603729248046875, "global_step": 608985, "epoch": 7337} {"train_loss": -27.888473510742188, "global_step": 608986, "epoch": 7337} {"train_loss": -28.16765785217285, "global_step": 608987, "epoch": 7337} {"train_loss": -27.887313842773438, "global_step": 608988, "epoch": 7337} {"train_loss": -28.20038414001465, "global_step": 608989, "epoch": 7337} {"train_loss": -27.842130661010742, "global_step": 608990, "epoch": 7337} {"train_loss": -27.76011085510254, "global_step": 608991, "epoch": 7337} {"train_loss": -27.84821128845215, "global_step": 608992, "epoch": 7337} {"train_loss": -28.0831298828125, "global_step": 608993, "epoch": 7337} {"train_loss": -28.032785415649414, "global_step": 608994, "epoch": 7337} {"train_loss": -28.149988174438477, "global_step": 608995, "epoch": 7337} {"train_loss": -28.108152389526367, "global_step": 608996, "epoch": 7337} {"train_loss": -28.6190242767334, "global_step": 608997, "epoch": 7337} {"train_loss": -28.287673950195312, "global_step": 608998, "epoch": 7337} {"train_loss": -28.421630859375, "global_step": 608999, "epoch": 7337} {"train_loss": -28.17725944519043, "global_step": 609000, "epoch": 7337} {"train_loss": -28.130050659179688, "global_step": 609001, "epoch": 7337} {"train_loss": -27.738372802734375, "global_step": 609002, "epoch": 7337} {"train_loss": -28.083627700805664, "global_step": 609003, "epoch": 7337} {"train_loss": -27.755186080932617, "global_step": 609004, "epoch": 7337} {"train_loss": -27.9750919342041, "global_step": 609005, "epoch": 7337} {"train_loss": -28.29391860961914, "global_step": 609006, "epoch": 7337} {"train_loss": -28.129016876220703, "global_step": 609007, "epoch": 7337} {"train_loss": -28.171903610229492, "global_step": 609008, "epoch": 7337} {"train_loss": -28.074472427368164, "global_step": 609009, "epoch": 7337} {"train_loss": -28.122360229492188, "global_step": 609010, "epoch": 7337} {"train_loss": -28.171167373657227, "global_step": 609011, "epoch": 7337} {"train_loss": -28.109710693359375, "global_step": 609012, "epoch": 7337} {"train_loss": -28.20063591003418, "global_step": 609013, "epoch": 7337} {"train_loss": -27.85780143737793, "global_step": 609014, "epoch": 7337} {"train_loss": -28.379186630249023, "global_step": 609015, "epoch": 7337} {"train_loss": -27.93979835510254, "global_step": 609016, "epoch": 7337} {"train_loss": -28.037137985229492, "global_step": 609017, "epoch": 7337} {"train_loss": -28.092517852783203, "global_step": 609018, "epoch": 7337} {"train_loss": -27.927169799804688, "global_step": 609019, "epoch": 7337} {"train_loss": -28.019062042236328, "global_step": 609020, "epoch": 7337} {"train_loss": -27.95757484436035, "global_step": 609021, "epoch": 7337} {"train_loss": -28.142623901367188, "global_step": 609022, "epoch": 7337} {"train_loss": -28.538171768188477, "global_step": 609023, "epoch": 7337} {"train_loss": -27.786664962768555, "global_step": 609024, "epoch": 7337} {"train_loss": -28.058420181274414, "global_step": 609025, "epoch": 7337} {"train_loss": -27.714725494384766, "global_step": 609026, "epoch": 7337} {"train_loss": -28.05910301208496, "global_step": 609027, "epoch": 7337} {"train_loss": -28.221960067749023, "global_step": 609028, "epoch": 7337} {"train_loss": -28.150426864624023, "global_step": 609029, "epoch": 7337} {"train_loss": -28.29298973083496, "global_step": 609030, "epoch": 7337} {"train_loss": -28.444320678710938, "global_step": 609031, "epoch": 7337} {"train_loss": -27.913196563720703, "global_step": 609032, "epoch": 7337} {"train_loss": -28.303607940673828, "global_step": 609033, "epoch": 7337} {"train_loss": -28.20038414001465, "global_step": 609034, "epoch": 7337} {"train_loss": -28.226165771484375, "global_step": 609035, "epoch": 7337} {"train_loss": -28.338388442993164, "global_step": 609036, "epoch": 7337} {"train_loss": -28.49566650390625, "global_step": 609037, "epoch": 7337} {"train_loss": -28.45551109313965, "global_step": 609038, "epoch": 7337} {"train_loss": -28.164037704467773, "global_step": 609039, "epoch": 7337} {"train_loss": -28.200239181518555, "global_step": 609040, "epoch": 7337} {"train_loss": -27.98789405822754, "global_step": 609041, "epoch": 7337} {"train_loss": -27.66145133972168, "global_step": 609042, "epoch": 7337} {"train_loss": -28.243316650390625, "global_step": 609043, "epoch": 7337} {"train_loss": -28.236648559570312, "global_step": 609044, "epoch": 7337} {"train_loss": -28.1439151763916, "global_step": 609045, "epoch": 7337} {"train_loss": -27.94746208190918, "global_step": 609046, "epoch": 7337} {"train_loss": -28.137845993041992, "global_step": 609047, "epoch": 7337} {"train_loss": -28.25439453125, "global_step": 609048, "epoch": 7337} {"train_loss": -28.05782127380371, "global_step": 609049, "epoch": 7337} {"train_loss": -28.232162475585938, "global_step": 609050, "epoch": 7337} {"train_loss": -27.75684928894043, "global_step": 609051, "epoch": 7337} {"train_loss": -27.988080978393555, "global_step": 609052, "epoch": 7337} {"train_loss": -28.052397555615528, "global_step": 609053, "epoch": 7337, "val_loss": 6591769.5} {"train_loss": -25.737401962280273, "global_step": 609054, "epoch": 7338} {"train_loss": -23.740482330322266, "global_step": 609055, "epoch": 7338} {"train_loss": -25.98394775390625, "global_step": 609056, "epoch": 7338} {"train_loss": -26.788532257080078, "global_step": 609057, "epoch": 7338} {"train_loss": -25.325424194335938, "global_step": 609058, "epoch": 7338} {"train_loss": -26.58389663696289, "global_step": 609059, "epoch": 7338} {"train_loss": -26.664154052734375, "global_step": 609060, "epoch": 7338} {"train_loss": -25.625783920288086, "global_step": 609061, "epoch": 7338} {"train_loss": -27.066253662109375, "global_step": 609062, "epoch": 7338} {"train_loss": -26.214019775390625, "global_step": 609063, "epoch": 7338} {"train_loss": -26.966650009155273, "global_step": 609064, "epoch": 7338} {"train_loss": -26.950626373291016, "global_step": 609065, "epoch": 7338} {"train_loss": -26.800146102905273, "global_step": 609066, "epoch": 7338} {"train_loss": -27.128381729125977, "global_step": 609067, "epoch": 7338} {"train_loss": -27.23154067993164, "global_step": 609068, "epoch": 7338} {"train_loss": -27.486709594726562, "global_step": 609069, "epoch": 7338} {"train_loss": -27.0826473236084, "global_step": 609070, "epoch": 7338} {"train_loss": -27.4163761138916, "global_step": 609071, "epoch": 7338} {"train_loss": -27.233495712280273, "global_step": 609072, "epoch": 7338} {"train_loss": -27.1976261138916, "global_step": 609073, "epoch": 7338} {"train_loss": -27.459836959838867, "global_step": 609074, "epoch": 7338} {"train_loss": -26.99220848083496, "global_step": 609075, "epoch": 7338} {"train_loss": -27.67982292175293, "global_step": 609076, "epoch": 7338} {"train_loss": -27.612701416015625, "global_step": 609077, "epoch": 7338} {"train_loss": -27.3671817779541, "global_step": 609078, "epoch": 7338} {"train_loss": -27.2608699798584, "global_step": 609079, "epoch": 7338} {"train_loss": -27.68328857421875, "global_step": 609080, "epoch": 7338} {"train_loss": -27.590229034423828, "global_step": 609081, "epoch": 7338} {"train_loss": -27.66961097717285, "global_step": 609082, "epoch": 7338} {"train_loss": -27.446985244750977, "global_step": 609083, "epoch": 7338} {"train_loss": -27.520593643188477, "global_step": 609084, "epoch": 7338} {"train_loss": -27.8171443939209, "global_step": 609085, "epoch": 7338} {"train_loss": -27.858570098876953, "global_step": 609086, "epoch": 7338} {"train_loss": -27.756805419921875, "global_step": 609087, "epoch": 7338} {"train_loss": -27.893274307250977, "global_step": 609088, "epoch": 7338} {"train_loss": -27.422582626342773, "global_step": 609089, "epoch": 7338} {"train_loss": -27.732975006103516, "global_step": 609090, "epoch": 7338} {"train_loss": -27.974462509155273, "global_step": 609091, "epoch": 7338} {"train_loss": -27.650665283203125, "global_step": 609092, "epoch": 7338} {"train_loss": -27.880130767822266, "global_step": 609093, "epoch": 7338} {"train_loss": -27.86750602722168, "global_step": 609094, "epoch": 7338} {"train_loss": -27.420095443725586, "global_step": 609095, "epoch": 7338} {"train_loss": -28.173330307006836, "global_step": 609096, "epoch": 7338} {"train_loss": -27.805204391479492, "global_step": 609097, "epoch": 7338} {"train_loss": -28.26607322692871, "global_step": 609098, "epoch": 7338} {"train_loss": -27.999408721923828, "global_step": 609099, "epoch": 7338} {"train_loss": -28.02838706970215, "global_step": 609100, "epoch": 7338} {"train_loss": -27.92317008972168, "global_step": 609101, "epoch": 7338} {"train_loss": -28.204431533813477, "global_step": 609102, "epoch": 7338} {"train_loss": -28.337249755859375, "global_step": 609103, "epoch": 7338} {"train_loss": -28.274600982666016, "global_step": 609104, "epoch": 7338} {"train_loss": -28.36695671081543, "global_step": 609105, "epoch": 7338} {"train_loss": -28.150293350219727, "global_step": 609106, "epoch": 7338} {"train_loss": -27.793012619018555, "global_step": 609107, "epoch": 7338} {"train_loss": -28.120996475219727, "global_step": 609108, "epoch": 7338} {"train_loss": -28.383466720581055, "global_step": 609109, "epoch": 7338} {"train_loss": -27.871051788330078, "global_step": 609110, "epoch": 7338} {"train_loss": -28.339380264282227, "global_step": 609111, "epoch": 7338} {"train_loss": -28.390750885009766, "global_step": 609112, "epoch": 7338} {"train_loss": -28.00745964050293, "global_step": 609113, "epoch": 7338} {"train_loss": -28.34063720703125, "global_step": 609114, "epoch": 7338} {"train_loss": -28.249439239501953, "global_step": 609115, "epoch": 7338} {"train_loss": -28.35986328125, "global_step": 609116, "epoch": 7338} {"train_loss": -28.2567081451416, "global_step": 609117, "epoch": 7338} {"train_loss": -28.09671401977539, "global_step": 609118, "epoch": 7338} {"train_loss": -27.9510440826416, "global_step": 609119, "epoch": 7338} {"train_loss": -27.906570434570312, "global_step": 609120, "epoch": 7338} {"train_loss": -28.462244033813477, "global_step": 609121, "epoch": 7338} {"train_loss": -28.19921875, "global_step": 609122, "epoch": 7338} {"train_loss": -28.209735870361328, "global_step": 609123, "epoch": 7338} {"train_loss": -28.510406494140625, "global_step": 609124, "epoch": 7338} {"train_loss": -27.748336791992188, "global_step": 609125, "epoch": 7338} {"train_loss": -28.201749801635742, "global_step": 609126, "epoch": 7338} {"train_loss": -28.18698501586914, "global_step": 609127, "epoch": 7338} {"train_loss": -27.524658203125, "global_step": 609128, "epoch": 7338} {"train_loss": -26.979705810546875, "global_step": 609129, "epoch": 7338} {"train_loss": -26.387964248657227, "global_step": 609130, "epoch": 7338} {"train_loss": -25.063880920410156, "global_step": 609131, "epoch": 7338} {"train_loss": -24.90492057800293, "global_step": 609132, "epoch": 7338} {"train_loss": -25.929174423217773, "global_step": 609133, "epoch": 7338} {"train_loss": -27.168249130249023, "global_step": 609134, "epoch": 7338} {"train_loss": -27.292587280273438, "global_step": 609135, "epoch": 7338} {"train_loss": -27.44606974038733, "global_step": 609136, "epoch": 7338, "val_loss": 6661415.0} {"train_loss": -25.162029266357422, "global_step": 609137, "epoch": 7339} {"train_loss": -26.231042861938477, "global_step": 609138, "epoch": 7339} {"train_loss": -25.766788482666016, "global_step": 609139, "epoch": 7339} {"train_loss": -26.491422653198242, "global_step": 609140, "epoch": 7339} {"train_loss": -25.302927017211914, "global_step": 609141, "epoch": 7339} {"train_loss": -26.444181442260742, "global_step": 609142, "epoch": 7339} {"train_loss": -26.49210548400879, "global_step": 609143, "epoch": 7339} {"train_loss": -26.727191925048828, "global_step": 609144, "epoch": 7339} {"train_loss": -26.429340362548828, "global_step": 609145, "epoch": 7339} {"train_loss": -26.65311622619629, "global_step": 609146, "epoch": 7339} {"train_loss": -26.913110733032227, "global_step": 609147, "epoch": 7339} {"train_loss": -26.507169723510742, "global_step": 609148, "epoch": 7339} {"train_loss": -26.98101234436035, "global_step": 609149, "epoch": 7339} {"train_loss": -26.630651473999023, "global_step": 609150, "epoch": 7339} {"train_loss": -27.22443199157715, "global_step": 609151, "epoch": 7339} {"train_loss": -26.935989379882812, "global_step": 609152, "epoch": 7339} {"train_loss": -27.340646743774414, "global_step": 609153, "epoch": 7339} {"train_loss": -26.664764404296875, "global_step": 609154, "epoch": 7339} {"train_loss": -27.237445831298828, "global_step": 609155, "epoch": 7339} {"train_loss": -27.062545776367188, "global_step": 609156, "epoch": 7339} {"train_loss": -27.568723678588867, "global_step": 609157, "epoch": 7339} {"train_loss": -27.312223434448242, "global_step": 609158, "epoch": 7339} {"train_loss": -27.21913719177246, "global_step": 609159, "epoch": 7339} {"train_loss": -27.316083908081055, "global_step": 609160, "epoch": 7339} {"train_loss": -27.132160186767578, "global_step": 609161, "epoch": 7339} {"train_loss": -27.736499786376953, "global_step": 609162, "epoch": 7339} {"train_loss": -27.55854606628418, "global_step": 609163, "epoch": 7339} {"train_loss": -27.8055362701416, "global_step": 609164, "epoch": 7339} {"train_loss": -27.682653427124023, "global_step": 609165, "epoch": 7339} {"train_loss": -27.461267471313477, "global_step": 609166, "epoch": 7339} {"train_loss": -27.444265365600586, "global_step": 609167, "epoch": 7339} {"train_loss": -27.903207778930664, "global_step": 609168, "epoch": 7339} {"train_loss": -27.71184730529785, "global_step": 609169, "epoch": 7339} {"train_loss": -28.367568969726562, "global_step": 609170, "epoch": 7339} {"train_loss": -27.689374923706055, "global_step": 609171, "epoch": 7339} {"train_loss": -27.654407501220703, "global_step": 609172, "epoch": 7339} {"train_loss": -27.790985107421875, "global_step": 609173, "epoch": 7339} {"train_loss": -27.88422203063965, "global_step": 609174, "epoch": 7339} {"train_loss": -28.102527618408203, "global_step": 609175, "epoch": 7339} {"train_loss": -28.00684928894043, "global_step": 609176, "epoch": 7339} {"train_loss": -28.07612419128418, "global_step": 609177, "epoch": 7339} {"train_loss": -27.7947940826416, "global_step": 609178, "epoch": 7339} {"train_loss": -28.199848175048828, "global_step": 609179, "epoch": 7339} {"train_loss": -28.01849937438965, "global_step": 609180, "epoch": 7339} {"train_loss": -27.81544303894043, "global_step": 609181, "epoch": 7339} {"train_loss": -28.34773063659668, "global_step": 609182, "epoch": 7339} {"train_loss": -27.93494987487793, "global_step": 609183, "epoch": 7339} {"train_loss": -28.354970932006836, "global_step": 609184, "epoch": 7339} {"train_loss": -28.095731735229492, "global_step": 609185, "epoch": 7339} {"train_loss": -28.221555709838867, "global_step": 609186, "epoch": 7339} {"train_loss": -28.298938751220703, "global_step": 609187, "epoch": 7339} {"train_loss": -28.171411514282227, "global_step": 609188, "epoch": 7339} {"train_loss": -28.220319747924805, "global_step": 609189, "epoch": 7339} {"train_loss": -28.221221923828125, "global_step": 609190, "epoch": 7339} {"train_loss": -28.025543212890625, "global_step": 609191, "epoch": 7339} {"train_loss": -28.40680503845215, "global_step": 609192, "epoch": 7339} {"train_loss": -28.073266983032227, "global_step": 609193, "epoch": 7339} {"train_loss": -28.225879669189453, "global_step": 609194, "epoch": 7339} {"train_loss": -28.05393409729004, "global_step": 609195, "epoch": 7339} {"train_loss": -28.335250854492188, "global_step": 609196, "epoch": 7339} {"train_loss": -28.175113677978516, "global_step": 609197, "epoch": 7339} {"train_loss": -28.246490478515625, "global_step": 609198, "epoch": 7339} {"train_loss": -28.2065372467041, "global_step": 609199, "epoch": 7339} {"train_loss": -28.084680557250977, "global_step": 609200, "epoch": 7339} {"train_loss": -28.434064865112305, "global_step": 609201, "epoch": 7339} {"train_loss": -28.361007690429688, "global_step": 609202, "epoch": 7339} {"train_loss": -28.24945640563965, "global_step": 609203, "epoch": 7339} {"train_loss": -28.049169540405273, "global_step": 609204, "epoch": 7339} {"train_loss": -28.165359497070312, "global_step": 609205, "epoch": 7339} {"train_loss": -28.133365631103516, "global_step": 609206, "epoch": 7339} {"train_loss": -28.2688045501709, "global_step": 609207, "epoch": 7339} {"train_loss": -27.889307022094727, "global_step": 609208, "epoch": 7339} {"train_loss": -28.07375144958496, "global_step": 609209, "epoch": 7339} {"train_loss": -28.227802276611328, "global_step": 609210, "epoch": 7339} {"train_loss": -28.09588623046875, "global_step": 609211, "epoch": 7339} {"train_loss": -27.879135131835938, "global_step": 609212, "epoch": 7339} {"train_loss": -27.98687744140625, "global_step": 609213, "epoch": 7339} {"train_loss": -28.648595809936523, "global_step": 609214, "epoch": 7339} {"train_loss": -28.31288719177246, "global_step": 609215, "epoch": 7339} {"train_loss": -28.428253173828125, "global_step": 609216, "epoch": 7339} {"train_loss": -28.405866622924805, "global_step": 609217, "epoch": 7339} {"train_loss": -28.43904685974121, "global_step": 609218, "epoch": 7339} {"train_loss": -27.66425764704325, "global_step": 609219, "epoch": 7339, "val_loss": 6723769.0} {"train_loss": -25.675216674804688, "global_step": 609220, "epoch": 7340} {"train_loss": -22.77411460876465, "global_step": 609221, "epoch": 7340} {"train_loss": -22.71791648864746, "global_step": 609222, "epoch": 7340} {"train_loss": -25.659793853759766, "global_step": 609223, "epoch": 7340} {"train_loss": -26.867206573486328, "global_step": 609224, "epoch": 7340} {"train_loss": -26.1219425201416, "global_step": 609225, "epoch": 7340} {"train_loss": -26.54249382019043, "global_step": 609226, "epoch": 7340} {"train_loss": -26.390533447265625, "global_step": 609227, "epoch": 7340} {"train_loss": -26.70404052734375, "global_step": 609228, "epoch": 7340} {"train_loss": -26.750308990478516, "global_step": 609229, "epoch": 7340} {"train_loss": -26.822675704956055, "global_step": 609230, "epoch": 7340} {"train_loss": -26.969770431518555, "global_step": 609231, "epoch": 7340} {"train_loss": -27.26639747619629, "global_step": 609232, "epoch": 7340} {"train_loss": -27.0837345123291, "global_step": 609233, "epoch": 7340} {"train_loss": -27.039941787719727, "global_step": 609234, "epoch": 7340} {"train_loss": -27.442819595336914, "global_step": 609235, "epoch": 7340} {"train_loss": -27.506671905517578, "global_step": 609236, "epoch": 7340} {"train_loss": -27.52504539489746, "global_step": 609237, "epoch": 7340} {"train_loss": -27.167221069335938, "global_step": 609238, "epoch": 7340} {"train_loss": -27.598621368408203, "global_step": 609239, "epoch": 7340} {"train_loss": -27.663623809814453, "global_step": 609240, "epoch": 7340} {"train_loss": -27.36957359313965, "global_step": 609241, "epoch": 7340} {"train_loss": -27.505903244018555, "global_step": 609242, "epoch": 7340} {"train_loss": -27.184890747070312, "global_step": 609243, "epoch": 7340} {"train_loss": -27.30597496032715, "global_step": 609244, "epoch": 7340} {"train_loss": -27.46929931640625, "global_step": 609245, "epoch": 7340} {"train_loss": -27.358840942382812, "global_step": 609246, "epoch": 7340} {"train_loss": -27.494043350219727, "global_step": 609247, "epoch": 7340} {"train_loss": -27.540557861328125, "global_step": 609248, "epoch": 7340} {"train_loss": -27.674774169921875, "global_step": 609249, "epoch": 7340} {"train_loss": -27.40934181213379, "global_step": 609250, "epoch": 7340} {"train_loss": -27.81321144104004, "global_step": 609251, "epoch": 7340} {"train_loss": -27.87587547302246, "global_step": 609252, "epoch": 7340} {"train_loss": -27.824005126953125, "global_step": 609253, "epoch": 7340} {"train_loss": -27.92958641052246, "global_step": 609254, "epoch": 7340} {"train_loss": -27.853321075439453, "global_step": 609255, "epoch": 7340} {"train_loss": -27.978891372680664, "global_step": 609256, "epoch": 7340} {"train_loss": -27.934972763061523, "global_step": 609257, "epoch": 7340} {"train_loss": -27.925153732299805, "global_step": 609258, "epoch": 7340} {"train_loss": -27.6136474609375, "global_step": 609259, "epoch": 7340} {"train_loss": -27.955244064331055, "global_step": 609260, "epoch": 7340} {"train_loss": -27.894119262695312, "global_step": 609261, "epoch": 7340} {"train_loss": -27.6054630279541, "global_step": 609262, "epoch": 7340} {"train_loss": -28.036474227905273, "global_step": 609263, "epoch": 7340} {"train_loss": -28.165796279907227, "global_step": 609264, "epoch": 7340} {"train_loss": -28.3411808013916, "global_step": 609265, "epoch": 7340} {"train_loss": -27.90070152282715, "global_step": 609266, "epoch": 7340} {"train_loss": -27.643085479736328, "global_step": 609267, "epoch": 7340} {"train_loss": -28.100845336914062, "global_step": 609268, "epoch": 7340} {"train_loss": -28.339466094970703, "global_step": 609269, "epoch": 7340} {"train_loss": -28.20193862915039, "global_step": 609270, "epoch": 7340} {"train_loss": -28.172992706298828, "global_step": 609271, "epoch": 7340} {"train_loss": -27.861083984375, "global_step": 609272, "epoch": 7340} {"train_loss": -28.191736221313477, "global_step": 609273, "epoch": 7340} {"train_loss": -27.78032875061035, "global_step": 609274, "epoch": 7340} {"train_loss": -28.33295249938965, "global_step": 609275, "epoch": 7340} {"train_loss": -28.135583877563477, "global_step": 609276, "epoch": 7340} {"train_loss": -27.960275650024414, "global_step": 609277, "epoch": 7340} {"train_loss": -28.23101806640625, "global_step": 609278, "epoch": 7340} {"train_loss": -28.059162139892578, "global_step": 609279, "epoch": 7340} {"train_loss": -28.29520034790039, "global_step": 609280, "epoch": 7340} {"train_loss": -27.968555450439453, "global_step": 609281, "epoch": 7340} {"train_loss": -28.1552791595459, "global_step": 609282, "epoch": 7340} {"train_loss": -28.224048614501953, "global_step": 609283, "epoch": 7340} {"train_loss": -28.427534103393555, "global_step": 609284, "epoch": 7340} {"train_loss": -28.125843048095703, "global_step": 609285, "epoch": 7340} {"train_loss": -28.03608512878418, "global_step": 609286, "epoch": 7340} {"train_loss": -28.480390548706055, "global_step": 609287, "epoch": 7340} {"train_loss": -28.240095138549805, "global_step": 609288, "epoch": 7340} {"train_loss": -28.346593856811523, "global_step": 609289, "epoch": 7340} {"train_loss": -28.506885528564453, "global_step": 609290, "epoch": 7340} {"train_loss": -28.33837890625, "global_step": 609291, "epoch": 7340} {"train_loss": -28.1247615814209, "global_step": 609292, "epoch": 7340} {"train_loss": -28.0291805267334, "global_step": 609293, "epoch": 7340} {"train_loss": -28.131315231323242, "global_step": 609294, "epoch": 7340} {"train_loss": -27.716291427612305, "global_step": 609295, "epoch": 7340} {"train_loss": -28.22200584411621, "global_step": 609296, "epoch": 7340} {"train_loss": -27.955780029296875, "global_step": 609297, "epoch": 7340} {"train_loss": -28.023670196533203, "global_step": 609298, "epoch": 7340} {"train_loss": -28.05391502380371, "global_step": 609299, "epoch": 7340} {"train_loss": -27.6408748626709, "global_step": 609300, "epoch": 7340} {"train_loss": -27.640344619750977, "global_step": 609301, "epoch": 7340} {"train_loss": -27.584293779120387, "global_step": 609302, "epoch": 7340, "val_loss": 6722032.5} {"train_loss": -27.54108238220215, "global_step": 609303, "epoch": 7341} {"train_loss": -27.42305564880371, "global_step": 609304, "epoch": 7341} {"train_loss": -27.75729751586914, "global_step": 609305, "epoch": 7341} {"train_loss": -27.20712661743164, "global_step": 609306, "epoch": 7341} {"train_loss": -27.614093780517578, "global_step": 609307, "epoch": 7341} {"train_loss": -27.434696197509766, "global_step": 609308, "epoch": 7341} {"train_loss": -27.7008113861084, "global_step": 609309, "epoch": 7341} {"train_loss": -27.715253829956055, "global_step": 609310, "epoch": 7341} {"train_loss": -27.712818145751953, "global_step": 609311, "epoch": 7341} {"train_loss": -28.099903106689453, "global_step": 609312, "epoch": 7341} {"train_loss": -27.922433853149414, "global_step": 609313, "epoch": 7341} {"train_loss": -27.798431396484375, "global_step": 609314, "epoch": 7341} {"train_loss": -27.8209228515625, "global_step": 609315, "epoch": 7341} {"train_loss": -27.483169555664062, "global_step": 609316, "epoch": 7341} {"train_loss": -28.1511173248291, "global_step": 609317, "epoch": 7341} {"train_loss": -28.0253963470459, "global_step": 609318, "epoch": 7341} {"train_loss": -27.84938621520996, "global_step": 609319, "epoch": 7341} {"train_loss": -28.0048770904541, "global_step": 609320, "epoch": 7341} {"train_loss": -27.921878814697266, "global_step": 609321, "epoch": 7341} {"train_loss": -28.142414093017578, "global_step": 609322, "epoch": 7341} {"train_loss": -28.048389434814453, "global_step": 609323, "epoch": 7341} {"train_loss": -28.189184188842773, "global_step": 609324, "epoch": 7341} {"train_loss": -28.1806583404541, "global_step": 609325, "epoch": 7341} {"train_loss": -28.19940185546875, "global_step": 609326, "epoch": 7341} {"train_loss": -28.36323356628418, "global_step": 609327, "epoch": 7341} {"train_loss": -28.461750030517578, "global_step": 609328, "epoch": 7341} {"train_loss": -28.0598201751709, "global_step": 609329, "epoch": 7341} {"train_loss": -28.213300704956055, "global_step": 609330, "epoch": 7341} {"train_loss": -28.461200714111328, "global_step": 609331, "epoch": 7341} {"train_loss": -28.215106964111328, "global_step": 609332, "epoch": 7341} {"train_loss": -28.2650146484375, "global_step": 609333, "epoch": 7341} {"train_loss": -28.18001365661621, "global_step": 609334, "epoch": 7341} {"train_loss": -28.3823184967041, "global_step": 609335, "epoch": 7341} {"train_loss": -28.33548355102539, "global_step": 609336, "epoch": 7341} {"train_loss": -28.076093673706055, "global_step": 609337, "epoch": 7341} {"train_loss": -28.163816452026367, "global_step": 609338, "epoch": 7341} {"train_loss": -28.113224029541016, "global_step": 609339, "epoch": 7341} {"train_loss": -28.232648849487305, "global_step": 609340, "epoch": 7341} {"train_loss": -28.297971725463867, "global_step": 609341, "epoch": 7341} {"train_loss": -28.318958282470703, "global_step": 609342, "epoch": 7341} {"train_loss": -28.710525512695312, "global_step": 609343, "epoch": 7341} {"train_loss": -28.461584091186523, "global_step": 609344, "epoch": 7341} {"train_loss": -28.04254150390625, "global_step": 609345, "epoch": 7341} {"train_loss": -28.22382164001465, "global_step": 609346, "epoch": 7341} {"train_loss": -28.15752601623535, "global_step": 609347, "epoch": 7341} {"train_loss": -27.925708770751953, "global_step": 609348, "epoch": 7341} {"train_loss": -28.20184898376465, "global_step": 609349, "epoch": 7341} {"train_loss": -28.06898307800293, "global_step": 609350, "epoch": 7341} {"train_loss": -28.378101348876953, "global_step": 609351, "epoch": 7341} {"train_loss": -27.907180786132812, "global_step": 609352, "epoch": 7341} {"train_loss": -28.143247604370117, "global_step": 609353, "epoch": 7341} {"train_loss": -28.026569366455078, "global_step": 609354, "epoch": 7341} {"train_loss": -27.971525192260742, "global_step": 609355, "epoch": 7341} {"train_loss": -28.078765869140625, "global_step": 609356, "epoch": 7341} {"train_loss": -28.52039909362793, "global_step": 609357, "epoch": 7341} {"train_loss": -28.34461784362793, "global_step": 609358, "epoch": 7341} {"train_loss": -28.288236618041992, "global_step": 609359, "epoch": 7341} {"train_loss": -28.58930778503418, "global_step": 609360, "epoch": 7341} {"train_loss": -27.600936889648438, "global_step": 609361, "epoch": 7341} {"train_loss": -28.382587432861328, "global_step": 609362, "epoch": 7341} {"train_loss": -27.91036033630371, "global_step": 609363, "epoch": 7341} {"train_loss": -27.693912506103516, "global_step": 609364, "epoch": 7341} {"train_loss": -28.19721031188965, "global_step": 609365, "epoch": 7341} {"train_loss": -27.989709854125977, "global_step": 609366, "epoch": 7341} {"train_loss": -27.836530685424805, "global_step": 609367, "epoch": 7341} {"train_loss": -27.927764892578125, "global_step": 609368, "epoch": 7341} {"train_loss": -27.869022369384766, "global_step": 609369, "epoch": 7341} {"train_loss": -28.08674430847168, "global_step": 609370, "epoch": 7341} {"train_loss": -28.288320541381836, "global_step": 609371, "epoch": 7341} {"train_loss": -28.15777587890625, "global_step": 609372, "epoch": 7341} {"train_loss": -27.589719772338867, "global_step": 609373, "epoch": 7341} {"train_loss": -28.393957138061523, "global_step": 609374, "epoch": 7341} {"train_loss": -28.30091667175293, "global_step": 609375, "epoch": 7341} {"train_loss": -28.412921905517578, "global_step": 609376, "epoch": 7341} {"train_loss": -28.343175888061523, "global_step": 609377, "epoch": 7341} {"train_loss": -28.065357208251953, "global_step": 609378, "epoch": 7341} {"train_loss": -28.133228302001953, "global_step": 609379, "epoch": 7341} {"train_loss": -28.342269897460938, "global_step": 609380, "epoch": 7341} {"train_loss": -28.201446533203125, "global_step": 609381, "epoch": 7341} {"train_loss": -28.1462345123291, "global_step": 609382, "epoch": 7341} {"train_loss": -28.1285343170166, "global_step": 609383, "epoch": 7341} {"train_loss": -28.0755615234375, "global_step": 609384, "epoch": 7341} {"train_loss": -28.078832281641212, "global_step": 609385, "epoch": 7341, "val_loss": 6700210.5} {"train_loss": -28.041711807250977, "global_step": 609386, "epoch": 7342} {"train_loss": -28.408645629882812, "global_step": 609387, "epoch": 7342} {"train_loss": -27.493555068969727, "global_step": 609388, "epoch": 7342} {"train_loss": -27.751035690307617, "global_step": 609389, "epoch": 7342} {"train_loss": -27.877674102783203, "global_step": 609390, "epoch": 7342} {"train_loss": -27.9710636138916, "global_step": 609391, "epoch": 7342} {"train_loss": -27.835041046142578, "global_step": 609392, "epoch": 7342} {"train_loss": -28.11356544494629, "global_step": 609393, "epoch": 7342} {"train_loss": -27.47271728515625, "global_step": 609394, "epoch": 7342} {"train_loss": -28.135038375854492, "global_step": 609395, "epoch": 7342} {"train_loss": -28.35382652282715, "global_step": 609396, "epoch": 7342} {"train_loss": -28.090848922729492, "global_step": 609397, "epoch": 7342} {"train_loss": -28.08363151550293, "global_step": 609398, "epoch": 7342} {"train_loss": -27.824934005737305, "global_step": 609399, "epoch": 7342} {"train_loss": -28.184528350830078, "global_step": 609400, "epoch": 7342} {"train_loss": -28.245746612548828, "global_step": 609401, "epoch": 7342} {"train_loss": -28.107818603515625, "global_step": 609402, "epoch": 7342} {"train_loss": -27.702911376953125, "global_step": 609403, "epoch": 7342} {"train_loss": -27.71943473815918, "global_step": 609404, "epoch": 7342} {"train_loss": -28.065383911132812, "global_step": 609405, "epoch": 7342} {"train_loss": -28.121994018554688, "global_step": 609406, "epoch": 7342} {"train_loss": -27.97633171081543, "global_step": 609407, "epoch": 7342} {"train_loss": -28.095111846923828, "global_step": 609408, "epoch": 7342} {"train_loss": -27.647445678710938, "global_step": 609409, "epoch": 7342} {"train_loss": -27.501081466674805, "global_step": 609410, "epoch": 7342} {"train_loss": -28.175251007080078, "global_step": 609411, "epoch": 7342} {"train_loss": -28.052560806274414, "global_step": 609412, "epoch": 7342} {"train_loss": -28.075580596923828, "global_step": 609413, "epoch": 7342} {"train_loss": -27.91373062133789, "global_step": 609414, "epoch": 7342} {"train_loss": -27.773193359375, "global_step": 609415, "epoch": 7342} {"train_loss": -27.886199951171875, "global_step": 609416, "epoch": 7342} {"train_loss": -27.923099517822266, "global_step": 609417, "epoch": 7342} {"train_loss": -28.343067169189453, "global_step": 609418, "epoch": 7342} {"train_loss": -28.09112548828125, "global_step": 609419, "epoch": 7342} {"train_loss": -28.063501358032227, "global_step": 609420, "epoch": 7342} {"train_loss": -28.112594604492188, "global_step": 609421, "epoch": 7342} {"train_loss": -27.946619033813477, "global_step": 609422, "epoch": 7342} {"train_loss": -28.196767807006836, "global_step": 609423, "epoch": 7342} {"train_loss": -28.10933494567871, "global_step": 609424, "epoch": 7342} {"train_loss": -28.221792221069336, "global_step": 609425, "epoch": 7342} {"train_loss": -27.990400314331055, "global_step": 609426, "epoch": 7342} {"train_loss": -28.382596969604492, "global_step": 609427, "epoch": 7342} {"train_loss": -27.940351486206055, "global_step": 609428, "epoch": 7342} {"train_loss": -28.19288444519043, "global_step": 609429, "epoch": 7342} {"train_loss": -28.5291690826416, "global_step": 609430, "epoch": 7342} {"train_loss": -28.591400146484375, "global_step": 609431, "epoch": 7342} {"train_loss": -28.49098014831543, "global_step": 609432, "epoch": 7342} {"train_loss": -28.14564323425293, "global_step": 609433, "epoch": 7342} {"train_loss": -28.442880630493164, "global_step": 609434, "epoch": 7342} {"train_loss": -28.6533260345459, "global_step": 609435, "epoch": 7342} {"train_loss": -28.342370986938477, "global_step": 609436, "epoch": 7342} {"train_loss": -28.21601676940918, "global_step": 609437, "epoch": 7342} {"train_loss": -28.06562614440918, "global_step": 609438, "epoch": 7342} {"train_loss": -27.92694664001465, "global_step": 609439, "epoch": 7342} {"train_loss": -28.35040855407715, "global_step": 609440, "epoch": 7342} {"train_loss": -27.939258575439453, "global_step": 609441, "epoch": 7342} {"train_loss": -28.06574821472168, "global_step": 609442, "epoch": 7342} {"train_loss": -27.764694213867188, "global_step": 609443, "epoch": 7342} {"train_loss": -28.061132431030273, "global_step": 609444, "epoch": 7342} {"train_loss": -28.03504753112793, "global_step": 609445, "epoch": 7342} {"train_loss": -28.126846313476562, "global_step": 609446, "epoch": 7342} {"train_loss": -27.801076889038086, "global_step": 609447, "epoch": 7342} {"train_loss": -27.928821563720703, "global_step": 609448, "epoch": 7342} {"train_loss": -28.089954376220703, "global_step": 609449, "epoch": 7342} {"train_loss": -28.474340438842773, "global_step": 609450, "epoch": 7342} {"train_loss": -28.3729248046875, "global_step": 609451, "epoch": 7342} {"train_loss": -28.443307876586914, "global_step": 609452, "epoch": 7342} {"train_loss": -28.561298370361328, "global_step": 609453, "epoch": 7342} {"train_loss": -28.26755142211914, "global_step": 609454, "epoch": 7342} {"train_loss": -28.4774227142334, "global_step": 609455, "epoch": 7342} {"train_loss": -27.98618507385254, "global_step": 609456, "epoch": 7342} {"train_loss": -28.04166603088379, "global_step": 609457, "epoch": 7342} {"train_loss": -28.203857421875, "global_step": 609458, "epoch": 7342} {"train_loss": -27.94118309020996, "global_step": 609459, "epoch": 7342} {"train_loss": -28.025131225585938, "global_step": 609460, "epoch": 7342} {"train_loss": -28.177698135375977, "global_step": 609461, "epoch": 7342} {"train_loss": -27.978673934936523, "global_step": 609462, "epoch": 7342} {"train_loss": -28.317035675048828, "global_step": 609463, "epoch": 7342} {"train_loss": -28.109155654907227, "global_step": 609464, "epoch": 7342} {"train_loss": -28.51643180847168, "global_step": 609465, "epoch": 7342} {"train_loss": -28.152429580688477, "global_step": 609466, "epoch": 7342} {"train_loss": -27.97119140625, "global_step": 609467, "epoch": 7342} {"train_loss": -28.09198983893337, "global_step": 609468, "epoch": 7342, "val_loss": 6637179.0} {"train_loss": -25.7780818939209, "global_step": 609469, "epoch": 7343} {"train_loss": -24.824121475219727, "global_step": 609470, "epoch": 7343} {"train_loss": -27.01117515563965, "global_step": 609471, "epoch": 7343} {"train_loss": -26.777639389038086, "global_step": 609472, "epoch": 7343} {"train_loss": -26.006994247436523, "global_step": 609473, "epoch": 7343} {"train_loss": -26.415861129760742, "global_step": 609474, "epoch": 7343} {"train_loss": -27.085739135742188, "global_step": 609475, "epoch": 7343} {"train_loss": -26.780242919921875, "global_step": 609476, "epoch": 7343} {"train_loss": -26.50640296936035, "global_step": 609477, "epoch": 7343} {"train_loss": -27.174869537353516, "global_step": 609478, "epoch": 7343} {"train_loss": -26.756040573120117, "global_step": 609479, "epoch": 7343} {"train_loss": -27.77008628845215, "global_step": 609480, "epoch": 7343} {"train_loss": -27.30316734313965, "global_step": 609481, "epoch": 7343} {"train_loss": -27.433683395385742, "global_step": 609482, "epoch": 7343} {"train_loss": -27.431671142578125, "global_step": 609483, "epoch": 7343} {"train_loss": -27.572895050048828, "global_step": 609484, "epoch": 7343} {"train_loss": -27.4025936126709, "global_step": 609485, "epoch": 7343} {"train_loss": -27.451635360717773, "global_step": 609486, "epoch": 7343} {"train_loss": -27.56119728088379, "global_step": 609487, "epoch": 7343} {"train_loss": -27.4625186920166, "global_step": 609488, "epoch": 7343} {"train_loss": -27.996850967407227, "global_step": 609489, "epoch": 7343} {"train_loss": -27.219242095947266, "global_step": 609490, "epoch": 7343} {"train_loss": -28.1272029876709, "global_step": 609491, "epoch": 7343} {"train_loss": -27.7537784576416, "global_step": 609492, "epoch": 7343} {"train_loss": -27.868270874023438, "global_step": 609493, "epoch": 7343} {"train_loss": -27.897052764892578, "global_step": 609494, "epoch": 7343} {"train_loss": -28.12263298034668, "global_step": 609495, "epoch": 7343} {"train_loss": -27.867904663085938, "global_step": 609496, "epoch": 7343} {"train_loss": -27.782819747924805, "global_step": 609497, "epoch": 7343} {"train_loss": -27.82362937927246, "global_step": 609498, "epoch": 7343} {"train_loss": -27.667041778564453, "global_step": 609499, "epoch": 7343} {"train_loss": -27.786376953125, "global_step": 609500, "epoch": 7343} {"train_loss": -27.73282241821289, "global_step": 609501, "epoch": 7343} {"train_loss": -27.761417388916016, "global_step": 609502, "epoch": 7343} {"train_loss": -27.85804557800293, "global_step": 609503, "epoch": 7343} {"train_loss": -27.774747848510742, "global_step": 609504, "epoch": 7343} {"train_loss": -28.003061294555664, "global_step": 609505, "epoch": 7343} {"train_loss": -28.036767959594727, "global_step": 609506, "epoch": 7343} {"train_loss": -27.76145362854004, "global_step": 609507, "epoch": 7343} {"train_loss": -28.024402618408203, "global_step": 609508, "epoch": 7343} {"train_loss": -27.9009952545166, "global_step": 609509, "epoch": 7343} {"train_loss": -28.047657012939453, "global_step": 609510, "epoch": 7343} {"train_loss": -28.123815536499023, "global_step": 609511, "epoch": 7343} {"train_loss": -27.801807403564453, "global_step": 609512, "epoch": 7343} {"train_loss": -28.152923583984375, "global_step": 609513, "epoch": 7343} {"train_loss": -27.909765243530273, "global_step": 609514, "epoch": 7343} {"train_loss": -28.041034698486328, "global_step": 609515, "epoch": 7343} {"train_loss": -28.311330795288086, "global_step": 609516, "epoch": 7343} {"train_loss": -27.912647247314453, "global_step": 609517, "epoch": 7343} {"train_loss": -27.895849227905273, "global_step": 609518, "epoch": 7343} {"train_loss": -28.171842575073242, "global_step": 609519, "epoch": 7343} {"train_loss": -28.16518211364746, "global_step": 609520, "epoch": 7343} {"train_loss": -28.06973648071289, "global_step": 609521, "epoch": 7343} {"train_loss": -28.077680587768555, "global_step": 609522, "epoch": 7343} {"train_loss": -28.262725830078125, "global_step": 609523, "epoch": 7343} {"train_loss": -27.851613998413086, "global_step": 609524, "epoch": 7343} {"train_loss": -28.47663688659668, "global_step": 609525, "epoch": 7343} {"train_loss": -28.405065536499023, "global_step": 609526, "epoch": 7343} {"train_loss": -28.34814453125, "global_step": 609527, "epoch": 7343} {"train_loss": -27.912412643432617, "global_step": 609528, "epoch": 7343} {"train_loss": -27.963979721069336, "global_step": 609529, "epoch": 7343} {"train_loss": -28.25532341003418, "global_step": 609530, "epoch": 7343} {"train_loss": -28.170337677001953, "global_step": 609531, "epoch": 7343} {"train_loss": -28.06272315979004, "global_step": 609532, "epoch": 7343} {"train_loss": -27.884851455688477, "global_step": 609533, "epoch": 7343} {"train_loss": -27.955106735229492, "global_step": 609534, "epoch": 7343} {"train_loss": -28.25522804260254, "global_step": 609535, "epoch": 7343} {"train_loss": -28.15813636779785, "global_step": 609536, "epoch": 7343} {"train_loss": -28.205808639526367, "global_step": 609537, "epoch": 7343} {"train_loss": -28.563541412353516, "global_step": 609538, "epoch": 7343} {"train_loss": -28.323816299438477, "global_step": 609539, "epoch": 7343} {"train_loss": -28.59465980529785, "global_step": 609540, "epoch": 7343} {"train_loss": -27.92756462097168, "global_step": 609541, "epoch": 7343} {"train_loss": -28.0880069732666, "global_step": 609542, "epoch": 7343} {"train_loss": -28.29842185974121, "global_step": 609543, "epoch": 7343} {"train_loss": -27.778249740600586, "global_step": 609544, "epoch": 7343} {"train_loss": -27.87586784362793, "global_step": 609545, "epoch": 7343} {"train_loss": -28.152379989624023, "global_step": 609546, "epoch": 7343} {"train_loss": -27.9788818359375, "global_step": 609547, "epoch": 7343} {"train_loss": -28.335886001586914, "global_step": 609548, "epoch": 7343} {"train_loss": -28.234922409057617, "global_step": 609549, "epoch": 7343} {"train_loss": -28.36627197265625, "global_step": 609550, "epoch": 7343} {"train_loss": -27.76727253557688, "global_step": 609551, "epoch": 7343, "val_loss": 6657079.0} {"train_loss": -27.205678939819336, "global_step": 609552, "epoch": 7344} {"train_loss": -27.770660400390625, "global_step": 609553, "epoch": 7344} {"train_loss": -27.351057052612305, "global_step": 609554, "epoch": 7344} {"train_loss": -27.612701416015625, "global_step": 609555, "epoch": 7344} {"train_loss": -27.46076011657715, "global_step": 609556, "epoch": 7344} {"train_loss": -27.640790939331055, "global_step": 609557, "epoch": 7344} {"train_loss": -27.51495361328125, "global_step": 609558, "epoch": 7344} {"train_loss": -27.589628219604492, "global_step": 609559, "epoch": 7344} {"train_loss": -27.661466598510742, "global_step": 609560, "epoch": 7344} {"train_loss": -27.62052345275879, "global_step": 609561, "epoch": 7344} {"train_loss": -27.932220458984375, "global_step": 609562, "epoch": 7344} {"train_loss": -28.27613639831543, "global_step": 609563, "epoch": 7344} {"train_loss": -27.622222900390625, "global_step": 609564, "epoch": 7344} {"train_loss": -27.707197189331055, "global_step": 609565, "epoch": 7344} {"train_loss": -27.831552505493164, "global_step": 609566, "epoch": 7344} {"train_loss": -28.095380783081055, "global_step": 609567, "epoch": 7344} {"train_loss": -28.13226890563965, "global_step": 609568, "epoch": 7344} {"train_loss": -28.10126304626465, "global_step": 609569, "epoch": 7344} {"train_loss": -28.035892486572266, "global_step": 609570, "epoch": 7344} {"train_loss": -28.020002365112305, "global_step": 609571, "epoch": 7344} {"train_loss": -28.36690330505371, "global_step": 609572, "epoch": 7344} {"train_loss": -27.892587661743164, "global_step": 609573, "epoch": 7344} {"train_loss": -28.028722763061523, "global_step": 609574, "epoch": 7344} {"train_loss": -28.11420249938965, "global_step": 609575, "epoch": 7344} {"train_loss": -27.6334228515625, "global_step": 609576, "epoch": 7344} {"train_loss": -27.600614547729492, "global_step": 609577, "epoch": 7344} {"train_loss": -28.20831871032715, "global_step": 609578, "epoch": 7344} {"train_loss": -28.2912540435791, "global_step": 609579, "epoch": 7344} {"train_loss": -27.801450729370117, "global_step": 609580, "epoch": 7344} {"train_loss": -28.256763458251953, "global_step": 609581, "epoch": 7344} {"train_loss": -28.11260414123535, "global_step": 609582, "epoch": 7344} {"train_loss": -27.9397029876709, "global_step": 609583, "epoch": 7344} {"train_loss": -28.028076171875, "global_step": 609584, "epoch": 7344} {"train_loss": -28.048309326171875, "global_step": 609585, "epoch": 7344} {"train_loss": -27.960803985595703, "global_step": 609586, "epoch": 7344} {"train_loss": -28.104944229125977, "global_step": 609587, "epoch": 7344} {"train_loss": -28.008472442626953, "global_step": 609588, "epoch": 7344} {"train_loss": -27.947677612304688, "global_step": 609589, "epoch": 7344} {"train_loss": -28.39011573791504, "global_step": 609590, "epoch": 7344} {"train_loss": -28.26515007019043, "global_step": 609591, "epoch": 7344} {"train_loss": -27.7607479095459, "global_step": 609592, "epoch": 7344} {"train_loss": -27.7119083404541, "global_step": 609593, "epoch": 7344} {"train_loss": -28.245620727539062, "global_step": 609594, "epoch": 7344} {"train_loss": -28.140064239501953, "global_step": 609595, "epoch": 7344} {"train_loss": -27.850141525268555, "global_step": 609596, "epoch": 7344} {"train_loss": -28.14113426208496, "global_step": 609597, "epoch": 7344} {"train_loss": -28.47480583190918, "global_step": 609598, "epoch": 7344} {"train_loss": -28.34564781188965, "global_step": 609599, "epoch": 7344} {"train_loss": -28.652612686157227, "global_step": 609600, "epoch": 7344} {"train_loss": -28.189315795898438, "global_step": 609601, "epoch": 7344} {"train_loss": -28.51807975769043, "global_step": 609602, "epoch": 7344} {"train_loss": -28.481420516967773, "global_step": 609603, "epoch": 7344} {"train_loss": -28.278356552124023, "global_step": 609604, "epoch": 7344} {"train_loss": -28.156599044799805, "global_step": 609605, "epoch": 7344} {"train_loss": -28.50751304626465, "global_step": 609606, "epoch": 7344} {"train_loss": -28.17868423461914, "global_step": 609607, "epoch": 7344} {"train_loss": -28.264062881469727, "global_step": 609608, "epoch": 7344} {"train_loss": -28.036588668823242, "global_step": 609609, "epoch": 7344} {"train_loss": -28.30757713317871, "global_step": 609610, "epoch": 7344} {"train_loss": -28.180938720703125, "global_step": 609611, "epoch": 7344} {"train_loss": -27.99384117126465, "global_step": 609612, "epoch": 7344} {"train_loss": -28.091663360595703, "global_step": 609613, "epoch": 7344} {"train_loss": -28.34527587890625, "global_step": 609614, "epoch": 7344} {"train_loss": -27.76385498046875, "global_step": 609615, "epoch": 7344} {"train_loss": -27.657068252563477, "global_step": 609616, "epoch": 7344} {"train_loss": -27.49981689453125, "global_step": 609617, "epoch": 7344} {"train_loss": -28.274890899658203, "global_step": 609618, "epoch": 7344} {"train_loss": -28.08363914489746, "global_step": 609619, "epoch": 7344} {"train_loss": -27.99651527404785, "global_step": 609620, "epoch": 7344} {"train_loss": -28.13931655883789, "global_step": 609621, "epoch": 7344} {"train_loss": -28.215484619140625, "global_step": 609622, "epoch": 7344} {"train_loss": -28.18073081970215, "global_step": 609623, "epoch": 7344} {"train_loss": -27.719404220581055, "global_step": 609624, "epoch": 7344} {"train_loss": -27.702320098876953, "global_step": 609625, "epoch": 7344} {"train_loss": -27.646936416625977, "global_step": 609626, "epoch": 7344} {"train_loss": -27.909467697143555, "global_step": 609627, "epoch": 7344} {"train_loss": -27.918975830078125, "global_step": 609628, "epoch": 7344} {"train_loss": -28.332538604736328, "global_step": 609629, "epoch": 7344} {"train_loss": -28.297330856323242, "global_step": 609630, "epoch": 7344} {"train_loss": -27.85959815979004, "global_step": 609631, "epoch": 7344} {"train_loss": -28.07733726501465, "global_step": 609632, "epoch": 7344} {"train_loss": -27.976490020751953, "global_step": 609633, "epoch": 7344} {"train_loss": -28.010276518672345, "global_step": 609634, "epoch": 7344, "val_loss": 6722491.0} {"train_loss": -27.1503963470459, "global_step": 609635, "epoch": 7345} {"train_loss": -26.773223876953125, "global_step": 609636, "epoch": 7345} {"train_loss": -27.594053268432617, "global_step": 609637, "epoch": 7345} {"train_loss": -26.241165161132812, "global_step": 609638, "epoch": 7345} {"train_loss": -27.25115966796875, "global_step": 609639, "epoch": 7345} {"train_loss": -27.098682403564453, "global_step": 609640, "epoch": 7345} {"train_loss": -26.5902156829834, "global_step": 609641, "epoch": 7345} {"train_loss": -27.13555908203125, "global_step": 609642, "epoch": 7345} {"train_loss": -26.44331169128418, "global_step": 609643, "epoch": 7345} {"train_loss": -27.208295822143555, "global_step": 609644, "epoch": 7345} {"train_loss": -26.854389190673828, "global_step": 609645, "epoch": 7345} {"train_loss": -27.45536231994629, "global_step": 609646, "epoch": 7345} {"train_loss": -27.312829971313477, "global_step": 609647, "epoch": 7345} {"train_loss": -27.178558349609375, "global_step": 609648, "epoch": 7345} {"train_loss": -27.07583999633789, "global_step": 609649, "epoch": 7345} {"train_loss": -27.63743019104004, "global_step": 609650, "epoch": 7345} {"train_loss": -27.1354923248291, "global_step": 609651, "epoch": 7345} {"train_loss": -27.410003662109375, "global_step": 609652, "epoch": 7345} {"train_loss": -27.4016170501709, "global_step": 609653, "epoch": 7345} {"train_loss": -27.91261863708496, "global_step": 609654, "epoch": 7345} {"train_loss": -27.602628707885742, "global_step": 609655, "epoch": 7345} {"train_loss": -27.74130630493164, "global_step": 609656, "epoch": 7345} {"train_loss": -27.8292293548584, "global_step": 609657, "epoch": 7345} {"train_loss": -27.707807540893555, "global_step": 609658, "epoch": 7345} {"train_loss": -28.281965255737305, "global_step": 609659, "epoch": 7345} {"train_loss": -27.529224395751953, "global_step": 609660, "epoch": 7345} {"train_loss": -27.5014705657959, "global_step": 609661, "epoch": 7345} {"train_loss": -27.700281143188477, "global_step": 609662, "epoch": 7345} {"train_loss": -27.973859786987305, "global_step": 609663, "epoch": 7345} {"train_loss": -27.47965431213379, "global_step": 609664, "epoch": 7345} {"train_loss": -27.774078369140625, "global_step": 609665, "epoch": 7345} {"train_loss": -27.80560302734375, "global_step": 609666, "epoch": 7345} {"train_loss": -27.876911163330078, "global_step": 609667, "epoch": 7345} {"train_loss": -27.737812042236328, "global_step": 609668, "epoch": 7345} {"train_loss": -27.962085723876953, "global_step": 609669, "epoch": 7345} {"train_loss": -27.710779190063477, "global_step": 609670, "epoch": 7345} {"train_loss": -27.663908004760742, "global_step": 609671, "epoch": 7345} {"train_loss": -28.165546417236328, "global_step": 609672, "epoch": 7345} {"train_loss": -27.9210262298584, "global_step": 609673, "epoch": 7345} {"train_loss": -28.105566024780273, "global_step": 609674, "epoch": 7345} {"train_loss": -28.129179000854492, "global_step": 609675, "epoch": 7345} {"train_loss": -28.012161254882812, "global_step": 609676, "epoch": 7345} {"train_loss": -27.869779586791992, "global_step": 609677, "epoch": 7345} {"train_loss": -28.476438522338867, "global_step": 609678, "epoch": 7345} {"train_loss": -28.051618576049805, "global_step": 609679, "epoch": 7345} {"train_loss": -28.24161148071289, "global_step": 609680, "epoch": 7345} {"train_loss": -28.11984634399414, "global_step": 609681, "epoch": 7345} {"train_loss": -27.916717529296875, "global_step": 609682, "epoch": 7345} {"train_loss": -28.344867706298828, "global_step": 609683, "epoch": 7345} {"train_loss": -28.3458251953125, "global_step": 609684, "epoch": 7345} {"train_loss": -28.42513084411621, "global_step": 609685, "epoch": 7345} {"train_loss": -28.457128524780273, "global_step": 609686, "epoch": 7345} {"train_loss": -28.038467407226562, "global_step": 609687, "epoch": 7345} {"train_loss": -28.229385375976562, "global_step": 609688, "epoch": 7345} {"train_loss": -28.157285690307617, "global_step": 609689, "epoch": 7345} {"train_loss": -28.349822998046875, "global_step": 609690, "epoch": 7345} {"train_loss": -27.816640853881836, "global_step": 609691, "epoch": 7345} {"train_loss": -28.11048698425293, "global_step": 609692, "epoch": 7345} {"train_loss": -28.325361251831055, "global_step": 609693, "epoch": 7345} {"train_loss": -28.43372917175293, "global_step": 609694, "epoch": 7345} {"train_loss": -28.190160751342773, "global_step": 609695, "epoch": 7345} {"train_loss": -28.34552001953125, "global_step": 609696, "epoch": 7345} {"train_loss": -28.063251495361328, "global_step": 609697, "epoch": 7345} {"train_loss": -28.455183029174805, "global_step": 609698, "epoch": 7345} {"train_loss": -28.22955322265625, "global_step": 609699, "epoch": 7345} {"train_loss": -28.09088134765625, "global_step": 609700, "epoch": 7345} {"train_loss": -28.079675674438477, "global_step": 609701, "epoch": 7345} {"train_loss": -28.124313354492188, "global_step": 609702, "epoch": 7345} {"train_loss": -27.897449493408203, "global_step": 609703, "epoch": 7345} {"train_loss": -28.07301139831543, "global_step": 609704, "epoch": 7345} {"train_loss": -28.304615020751953, "global_step": 609705, "epoch": 7345} {"train_loss": -27.989547729492188, "global_step": 609706, "epoch": 7345} {"train_loss": -28.337310791015625, "global_step": 609707, "epoch": 7345} {"train_loss": -28.586231231689453, "global_step": 609708, "epoch": 7345} {"train_loss": -28.258045196533203, "global_step": 609709, "epoch": 7345} {"train_loss": -28.04560661315918, "global_step": 609710, "epoch": 7345} {"train_loss": -28.23834228515625, "global_step": 609711, "epoch": 7345} {"train_loss": -28.197912216186523, "global_step": 609712, "epoch": 7345} {"train_loss": -28.0898380279541, "global_step": 609713, "epoch": 7345} {"train_loss": -28.146442413330078, "global_step": 609714, "epoch": 7345} {"train_loss": -28.045703887939453, "global_step": 609715, "epoch": 7345} {"train_loss": -28.48237419128418, "global_step": 609716, "epoch": 7345} {"train_loss": -27.841778467936688, "global_step": 609717, "epoch": 7345, "val_loss": 6752069.0} {"train_loss": -27.769153594970703, "global_step": 609718, "epoch": 7346} {"train_loss": -26.719282150268555, "global_step": 609719, "epoch": 7346} {"train_loss": -26.82562828063965, "global_step": 609720, "epoch": 7346} {"train_loss": -26.9326229095459, "global_step": 609721, "epoch": 7346} {"train_loss": -27.819107055664062, "global_step": 609722, "epoch": 7346} {"train_loss": -27.975919723510742, "global_step": 609723, "epoch": 7346} {"train_loss": -27.648740768432617, "global_step": 609724, "epoch": 7346} {"train_loss": -28.0482177734375, "global_step": 609725, "epoch": 7346} {"train_loss": -27.55018424987793, "global_step": 609726, "epoch": 7346} {"train_loss": -27.855154037475586, "global_step": 609727, "epoch": 7346} {"train_loss": -28.02239990234375, "global_step": 609728, "epoch": 7346} {"train_loss": -27.774534225463867, "global_step": 609729, "epoch": 7346} {"train_loss": -28.174955368041992, "global_step": 609730, "epoch": 7346} {"train_loss": -28.35419273376465, "global_step": 609731, "epoch": 7346} {"train_loss": -27.89011001586914, "global_step": 609732, "epoch": 7346} {"train_loss": -27.636432647705078, "global_step": 609733, "epoch": 7346} {"train_loss": -28.191232681274414, "global_step": 609734, "epoch": 7346} {"train_loss": -27.515554428100586, "global_step": 609735, "epoch": 7346} {"train_loss": -27.50263023376465, "global_step": 609736, "epoch": 7346} {"train_loss": -27.82941246032715, "global_step": 609737, "epoch": 7346} {"train_loss": -28.324594497680664, "global_step": 609738, "epoch": 7346} {"train_loss": -27.733551025390625, "global_step": 609739, "epoch": 7346} {"train_loss": -27.931018829345703, "global_step": 609740, "epoch": 7346} {"train_loss": -28.00530433654785, "global_step": 609741, "epoch": 7346} {"train_loss": -27.78965187072754, "global_step": 609742, "epoch": 7346} {"train_loss": -28.059972763061523, "global_step": 609743, "epoch": 7346} {"train_loss": -28.12286949157715, "global_step": 609744, "epoch": 7346} {"train_loss": -28.2441463470459, "global_step": 609745, "epoch": 7346} {"train_loss": -27.849353790283203, "global_step": 609746, "epoch": 7346} {"train_loss": -28.348480224609375, "global_step": 609747, "epoch": 7346} {"train_loss": -28.094806671142578, "global_step": 609748, "epoch": 7346} {"train_loss": -28.17041015625, "global_step": 609749, "epoch": 7346} {"train_loss": -27.7239933013916, "global_step": 609750, "epoch": 7346} {"train_loss": -27.861303329467773, "global_step": 609751, "epoch": 7346} {"train_loss": -27.884979248046875, "global_step": 609752, "epoch": 7346} {"train_loss": -28.24562644958496, "global_step": 609753, "epoch": 7346} {"train_loss": -28.2270565032959, "global_step": 609754, "epoch": 7346} {"train_loss": -27.749805450439453, "global_step": 609755, "epoch": 7346} {"train_loss": -28.351999282836914, "global_step": 609756, "epoch": 7346} {"train_loss": -27.989948272705078, "global_step": 609757, "epoch": 7346} {"train_loss": -28.27068519592285, "global_step": 609758, "epoch": 7346} {"train_loss": -28.01136589050293, "global_step": 609759, "epoch": 7346} {"train_loss": -28.325363159179688, "global_step": 609760, "epoch": 7346} {"train_loss": -28.310626983642578, "global_step": 609761, "epoch": 7346} {"train_loss": -28.34280776977539, "global_step": 609762, "epoch": 7346} {"train_loss": -28.218250274658203, "global_step": 609763, "epoch": 7346} {"train_loss": -28.3425235748291, "global_step": 609764, "epoch": 7346} {"train_loss": -28.27605628967285, "global_step": 609765, "epoch": 7346} {"train_loss": -27.95223045349121, "global_step": 609766, "epoch": 7346} {"train_loss": -28.054113388061523, "global_step": 609767, "epoch": 7346} {"train_loss": -27.82891845703125, "global_step": 609768, "epoch": 7346} {"train_loss": -27.508350372314453, "global_step": 609769, "epoch": 7346} {"train_loss": -27.91535758972168, "global_step": 609770, "epoch": 7346} {"train_loss": -28.299468994140625, "global_step": 609771, "epoch": 7346} {"train_loss": -27.89100456237793, "global_step": 609772, "epoch": 7346} {"train_loss": -27.86344337463379, "global_step": 609773, "epoch": 7346} {"train_loss": -28.429487228393555, "global_step": 609774, "epoch": 7346} {"train_loss": -27.756696701049805, "global_step": 609775, "epoch": 7346} {"train_loss": -28.12582778930664, "global_step": 609776, "epoch": 7346} {"train_loss": -27.93597412109375, "global_step": 609777, "epoch": 7346} {"train_loss": -28.22844886779785, "global_step": 609778, "epoch": 7346} {"train_loss": -27.873655319213867, "global_step": 609779, "epoch": 7346} {"train_loss": -27.941083908081055, "global_step": 609780, "epoch": 7346} {"train_loss": -28.380878448486328, "global_step": 609781, "epoch": 7346} {"train_loss": -28.055601119995117, "global_step": 609782, "epoch": 7346} {"train_loss": -27.458988189697266, "global_step": 609783, "epoch": 7346} {"train_loss": -27.64179039001465, "global_step": 609784, "epoch": 7346} {"train_loss": -27.66798210144043, "global_step": 609785, "epoch": 7346} {"train_loss": -27.882177352905273, "global_step": 609786, "epoch": 7346} {"train_loss": -27.936309814453125, "global_step": 609787, "epoch": 7346} {"train_loss": -27.806751251220703, "global_step": 609788, "epoch": 7346} {"train_loss": -28.044330596923828, "global_step": 609789, "epoch": 7346} {"train_loss": -28.387922286987305, "global_step": 609790, "epoch": 7346} {"train_loss": -27.977277755737305, "global_step": 609791, "epoch": 7346} {"train_loss": -28.090612411499023, "global_step": 609792, "epoch": 7346} {"train_loss": -27.97649574279785, "global_step": 609793, "epoch": 7346} {"train_loss": -28.1871395111084, "global_step": 609794, "epoch": 7346} {"train_loss": -28.21770668029785, "global_step": 609795, "epoch": 7346} {"train_loss": -28.18320083618164, "global_step": 609796, "epoch": 7346} {"train_loss": -28.22943687438965, "global_step": 609797, "epoch": 7346} {"train_loss": -28.226730346679688, "global_step": 609798, "epoch": 7346} {"train_loss": -28.083576202392578, "global_step": 609799, "epoch": 7346} {"train_loss": -27.954820678894777, "global_step": 609800, "epoch": 7346, "val_loss": 6711272.0} {"train_loss": -28.433568954467773, "global_step": 609801, "epoch": 7347} {"train_loss": -27.806867599487305, "global_step": 609802, "epoch": 7347} {"train_loss": -27.890518188476562, "global_step": 609803, "epoch": 7347} {"train_loss": -28.173770904541016, "global_step": 609804, "epoch": 7347} {"train_loss": -28.22812843322754, "global_step": 609805, "epoch": 7347} {"train_loss": -28.199838638305664, "global_step": 609806, "epoch": 7347} {"train_loss": -27.8364200592041, "global_step": 609807, "epoch": 7347} {"train_loss": -28.058063507080078, "global_step": 609808, "epoch": 7347} {"train_loss": -28.360675811767578, "global_step": 609809, "epoch": 7347} {"train_loss": -27.975326538085938, "global_step": 609810, "epoch": 7347} {"train_loss": -28.04595375061035, "global_step": 609811, "epoch": 7347} {"train_loss": -28.28095817565918, "global_step": 609812, "epoch": 7347} {"train_loss": -28.229345321655273, "global_step": 609813, "epoch": 7347} {"train_loss": -27.810901641845703, "global_step": 609814, "epoch": 7347} {"train_loss": -27.86810874938965, "global_step": 609815, "epoch": 7347} {"train_loss": -28.004993438720703, "global_step": 609816, "epoch": 7347} {"train_loss": -28.41266441345215, "global_step": 609817, "epoch": 7347} {"train_loss": -28.135107040405273, "global_step": 609818, "epoch": 7347} {"train_loss": -27.960590362548828, "global_step": 609819, "epoch": 7347} {"train_loss": -28.367258071899414, "global_step": 609820, "epoch": 7347} {"train_loss": -28.232868194580078, "global_step": 609821, "epoch": 7347} {"train_loss": -28.353958129882812, "global_step": 609822, "epoch": 7347} {"train_loss": -28.2082576751709, "global_step": 609823, "epoch": 7347} {"train_loss": -28.353534698486328, "global_step": 609824, "epoch": 7347} {"train_loss": -27.88346290588379, "global_step": 609825, "epoch": 7347} {"train_loss": -28.1044864654541, "global_step": 609826, "epoch": 7347} {"train_loss": -28.31353759765625, "global_step": 609827, "epoch": 7347} {"train_loss": -28.189268112182617, "global_step": 609828, "epoch": 7347} {"train_loss": -27.83414077758789, "global_step": 609829, "epoch": 7347} {"train_loss": -27.87558364868164, "global_step": 609830, "epoch": 7347} {"train_loss": -27.7164306640625, "global_step": 609831, "epoch": 7347} {"train_loss": -28.358243942260742, "global_step": 609832, "epoch": 7347} {"train_loss": -28.153888702392578, "global_step": 609833, "epoch": 7347} {"train_loss": -27.57318687438965, "global_step": 609834, "epoch": 7347} {"train_loss": -27.445056915283203, "global_step": 609835, "epoch": 7347} {"train_loss": -27.860448837280273, "global_step": 609836, "epoch": 7347} {"train_loss": -28.1710262298584, "global_step": 609837, "epoch": 7347} {"train_loss": -27.337570190429688, "global_step": 609838, "epoch": 7347} {"train_loss": -27.5603084564209, "global_step": 609839, "epoch": 7347} {"train_loss": -28.273059844970703, "global_step": 609840, "epoch": 7347} {"train_loss": -28.295745849609375, "global_step": 609841, "epoch": 7347} {"train_loss": -28.440053939819336, "global_step": 609842, "epoch": 7347} {"train_loss": -28.180267333984375, "global_step": 609843, "epoch": 7347} {"train_loss": -28.021717071533203, "global_step": 609844, "epoch": 7347} {"train_loss": -28.155914306640625, "global_step": 609845, "epoch": 7347} {"train_loss": -28.343183517456055, "global_step": 609846, "epoch": 7347} {"train_loss": -28.61083984375, "global_step": 609847, "epoch": 7347} {"train_loss": -28.164342880249023, "global_step": 609848, "epoch": 7347} {"train_loss": -27.862451553344727, "global_step": 609849, "epoch": 7347} {"train_loss": -28.1069278717041, "global_step": 609850, "epoch": 7347} {"train_loss": -28.34388542175293, "global_step": 609851, "epoch": 7347} {"train_loss": -28.095916748046875, "global_step": 609852, "epoch": 7347} {"train_loss": -28.141284942626953, "global_step": 609853, "epoch": 7347} {"train_loss": -28.383153915405273, "global_step": 609854, "epoch": 7347} {"train_loss": -28.0970401763916, "global_step": 609855, "epoch": 7347} {"train_loss": -28.010791778564453, "global_step": 609856, "epoch": 7347} {"train_loss": -28.327402114868164, "global_step": 609857, "epoch": 7347} {"train_loss": -27.830280303955078, "global_step": 609858, "epoch": 7347} {"train_loss": -27.646772384643555, "global_step": 609859, "epoch": 7347} {"train_loss": -27.196805953979492, "global_step": 609860, "epoch": 7347} {"train_loss": -27.19402503967285, "global_step": 609861, "epoch": 7347} {"train_loss": -27.3730525970459, "global_step": 609862, "epoch": 7347} {"train_loss": -27.585006713867188, "global_step": 609863, "epoch": 7347} {"train_loss": -28.135114669799805, "global_step": 609864, "epoch": 7347} {"train_loss": -28.063459396362305, "global_step": 609865, "epoch": 7347} {"train_loss": -28.37558364868164, "global_step": 609866, "epoch": 7347} {"train_loss": -28.1514892578125, "global_step": 609867, "epoch": 7347} {"train_loss": -28.173919677734375, "global_step": 609868, "epoch": 7347} {"train_loss": -27.89621353149414, "global_step": 609869, "epoch": 7347} {"train_loss": -27.980817794799805, "global_step": 609870, "epoch": 7347} {"train_loss": -28.353200912475586, "global_step": 609871, "epoch": 7347} {"train_loss": -27.909408569335938, "global_step": 609872, "epoch": 7347} {"train_loss": -27.58302879333496, "global_step": 609873, "epoch": 7347} {"train_loss": -27.973285675048828, "global_step": 609874, "epoch": 7347} {"train_loss": -28.251394271850586, "global_step": 609875, "epoch": 7347} {"train_loss": -28.12750244140625, "global_step": 609876, "epoch": 7347} {"train_loss": -28.230533599853516, "global_step": 609877, "epoch": 7347} {"train_loss": -28.09796714782715, "global_step": 609878, "epoch": 7347} {"train_loss": -28.0564022064209, "global_step": 609879, "epoch": 7347} {"train_loss": -28.211353302001953, "global_step": 609880, "epoch": 7347} {"train_loss": -28.04585075378418, "global_step": 609881, "epoch": 7347} {"train_loss": -28.56768226623535, "global_step": 609882, "epoch": 7347} {"train_loss": -28.068336831517968, "global_step": 609883, "epoch": 7347, "val_loss": 6757550.0} {"train_loss": -27.496082305908203, "global_step": 609884, "epoch": 7348} {"train_loss": -27.5952205657959, "global_step": 609885, "epoch": 7348} {"train_loss": -27.803359985351562, "global_step": 609886, "epoch": 7348} {"train_loss": -27.79143714904785, "global_step": 609887, "epoch": 7348} {"train_loss": -27.737180709838867, "global_step": 609888, "epoch": 7348} {"train_loss": -27.827056884765625, "global_step": 609889, "epoch": 7348} {"train_loss": -27.678192138671875, "global_step": 609890, "epoch": 7348} {"train_loss": -27.63419532775879, "global_step": 609891, "epoch": 7348} {"train_loss": -27.975666046142578, "global_step": 609892, "epoch": 7348} {"train_loss": -27.7053279876709, "global_step": 609893, "epoch": 7348} {"train_loss": -27.19270133972168, "global_step": 609894, "epoch": 7348} {"train_loss": -27.57386589050293, "global_step": 609895, "epoch": 7348} {"train_loss": -27.980138778686523, "global_step": 609896, "epoch": 7348} {"train_loss": -27.728445053100586, "global_step": 609897, "epoch": 7348} {"train_loss": -27.677526473999023, "global_step": 609898, "epoch": 7348} {"train_loss": -27.956090927124023, "global_step": 609899, "epoch": 7348} {"train_loss": -27.7515811920166, "global_step": 609900, "epoch": 7348} {"train_loss": -27.52178955078125, "global_step": 609901, "epoch": 7348} {"train_loss": -28.334177017211914, "global_step": 609902, "epoch": 7348} {"train_loss": -28.25943946838379, "global_step": 609903, "epoch": 7348} {"train_loss": -27.500120162963867, "global_step": 609904, "epoch": 7348} {"train_loss": -28.11634635925293, "global_step": 609905, "epoch": 7348} {"train_loss": -28.052783966064453, "global_step": 609906, "epoch": 7348} {"train_loss": -27.984777450561523, "global_step": 609907, "epoch": 7348} {"train_loss": -28.160919189453125, "global_step": 609908, "epoch": 7348} {"train_loss": -28.41546058654785, "global_step": 609909, "epoch": 7348} {"train_loss": -28.094587326049805, "global_step": 609910, "epoch": 7348} {"train_loss": -28.105566024780273, "global_step": 609911, "epoch": 7348} {"train_loss": -28.492298126220703, "global_step": 609912, "epoch": 7348} {"train_loss": -28.483320236206055, "global_step": 609913, "epoch": 7348} {"train_loss": -28.29267692565918, "global_step": 609914, "epoch": 7348} {"train_loss": -28.263731002807617, "global_step": 609915, "epoch": 7348} {"train_loss": -28.36444664001465, "global_step": 609916, "epoch": 7348} {"train_loss": -28.058441162109375, "global_step": 609917, "epoch": 7348} {"train_loss": -28.57573890686035, "global_step": 609918, "epoch": 7348} {"train_loss": -28.326969146728516, "global_step": 609919, "epoch": 7348} {"train_loss": -28.442670822143555, "global_step": 609920, "epoch": 7348} {"train_loss": -28.1336669921875, "global_step": 609921, "epoch": 7348} {"train_loss": -28.453125, "global_step": 609922, "epoch": 7348} {"train_loss": -28.595916748046875, "global_step": 609923, "epoch": 7348} {"train_loss": -28.23794937133789, "global_step": 609924, "epoch": 7348} {"train_loss": -28.32219886779785, "global_step": 609925, "epoch": 7348} {"train_loss": -28.213903427124023, "global_step": 609926, "epoch": 7348} {"train_loss": -28.376371383666992, "global_step": 609927, "epoch": 7348} {"train_loss": -28.211652755737305, "global_step": 609928, "epoch": 7348} {"train_loss": -28.354923248291016, "global_step": 609929, "epoch": 7348} {"train_loss": -28.2716121673584, "global_step": 609930, "epoch": 7348} {"train_loss": -28.392810821533203, "global_step": 609931, "epoch": 7348} {"train_loss": -28.2864933013916, "global_step": 609932, "epoch": 7348} {"train_loss": -27.93963050842285, "global_step": 609933, "epoch": 7348} {"train_loss": -28.044885635375977, "global_step": 609934, "epoch": 7348} {"train_loss": -27.99336051940918, "global_step": 609935, "epoch": 7348} {"train_loss": -27.808103561401367, "global_step": 609936, "epoch": 7348} {"train_loss": -28.247146606445312, "global_step": 609937, "epoch": 7348} {"train_loss": -27.959936141967773, "global_step": 609938, "epoch": 7348} {"train_loss": -28.546722412109375, "global_step": 609939, "epoch": 7348} {"train_loss": -27.751968383789062, "global_step": 609940, "epoch": 7348} {"train_loss": -27.9897518157959, "global_step": 609941, "epoch": 7348} {"train_loss": -27.8418025970459, "global_step": 609942, "epoch": 7348} {"train_loss": -27.551197052001953, "global_step": 609943, "epoch": 7348} {"train_loss": -27.83033561706543, "global_step": 609944, "epoch": 7348} {"train_loss": -28.137195587158203, "global_step": 609945, "epoch": 7348} {"train_loss": -27.978687286376953, "global_step": 609946, "epoch": 7348} {"train_loss": -28.400609970092773, "global_step": 609947, "epoch": 7348} {"train_loss": -28.070804595947266, "global_step": 609948, "epoch": 7348} {"train_loss": -27.948841094970703, "global_step": 609949, "epoch": 7348} {"train_loss": -28.214569091796875, "global_step": 609950, "epoch": 7348} {"train_loss": -27.916614532470703, "global_step": 609951, "epoch": 7348} {"train_loss": -28.072473526000977, "global_step": 609952, "epoch": 7348} {"train_loss": -28.073993682861328, "global_step": 609953, "epoch": 7348} {"train_loss": -27.878835678100586, "global_step": 609954, "epoch": 7348} {"train_loss": -28.35731315612793, "global_step": 609955, "epoch": 7348} {"train_loss": -28.052448272705078, "global_step": 609956, "epoch": 7348} {"train_loss": -28.052738189697266, "global_step": 609957, "epoch": 7348} {"train_loss": -27.772504806518555, "global_step": 609958, "epoch": 7348} {"train_loss": -28.26081657409668, "global_step": 609959, "epoch": 7348} {"train_loss": -27.930770874023438, "global_step": 609960, "epoch": 7348} {"train_loss": -28.417072296142578, "global_step": 609961, "epoch": 7348} {"train_loss": -27.820831298828125, "global_step": 609962, "epoch": 7348} {"train_loss": -28.325225830078125, "global_step": 609963, "epoch": 7348} {"train_loss": -27.72308349609375, "global_step": 609964, "epoch": 7348} {"train_loss": -27.862436294555664, "global_step": 609965, "epoch": 7348} {"train_loss": -28.042072388062994, "global_step": 609966, "epoch": 7348, "val_loss": 6732406.0} {"train_loss": -27.3411808013916, "global_step": 609967, "epoch": 7349} {"train_loss": -27.015283584594727, "global_step": 609968, "epoch": 7349} {"train_loss": -27.70627212524414, "global_step": 609969, "epoch": 7349} {"train_loss": -27.665571212768555, "global_step": 609970, "epoch": 7349} {"train_loss": -27.460830688476562, "global_step": 609971, "epoch": 7349} {"train_loss": -27.26177406311035, "global_step": 609972, "epoch": 7349} {"train_loss": -27.128225326538086, "global_step": 609973, "epoch": 7349} {"train_loss": -26.934711456298828, "global_step": 609974, "epoch": 7349} {"train_loss": -27.942975997924805, "global_step": 609975, "epoch": 7349} {"train_loss": -27.725366592407227, "global_step": 609976, "epoch": 7349} {"train_loss": -27.8023624420166, "global_step": 609977, "epoch": 7349} {"train_loss": -27.97178077697754, "global_step": 609978, "epoch": 7349} {"train_loss": -27.765716552734375, "global_step": 609979, "epoch": 7349} {"train_loss": -27.423999786376953, "global_step": 609980, "epoch": 7349} {"train_loss": -27.455785751342773, "global_step": 609981, "epoch": 7349} {"train_loss": -28.013071060180664, "global_step": 609982, "epoch": 7349} {"train_loss": -27.568927764892578, "global_step": 609983, "epoch": 7349} {"train_loss": -28.19904136657715, "global_step": 609984, "epoch": 7349} {"train_loss": -28.071964263916016, "global_step": 609985, "epoch": 7349} {"train_loss": -27.741718292236328, "global_step": 609986, "epoch": 7349} {"train_loss": -28.044321060180664, "global_step": 609987, "epoch": 7349} {"train_loss": -27.713916778564453, "global_step": 609988, "epoch": 7349} {"train_loss": -28.018041610717773, "global_step": 609989, "epoch": 7349} {"train_loss": -27.695819854736328, "global_step": 609990, "epoch": 7349} {"train_loss": -27.656631469726562, "global_step": 609991, "epoch": 7349} {"train_loss": -27.73615074157715, "global_step": 609992, "epoch": 7349} {"train_loss": -27.45856285095215, "global_step": 609993, "epoch": 7349} {"train_loss": -28.101764678955078, "global_step": 609994, "epoch": 7349} {"train_loss": -27.759342193603516, "global_step": 609995, "epoch": 7349} {"train_loss": -27.553119659423828, "global_step": 609996, "epoch": 7349} {"train_loss": -27.825529098510742, "global_step": 609997, "epoch": 7349} {"train_loss": -27.89691162109375, "global_step": 609998, "epoch": 7349} {"train_loss": -28.062408447265625, "global_step": 609999, "epoch": 7349} {"train_loss": -27.899932861328125, "global_step": 610000, "epoch": 7349} {"train_loss": -27.9434871673584, "global_step": 610001, "epoch": 7349} {"train_loss": -28.29831314086914, "global_step": 610002, "epoch": 7349} {"train_loss": -28.0618896484375, "global_step": 610003, "epoch": 7349} {"train_loss": -27.660770416259766, "global_step": 610004, "epoch": 7349} {"train_loss": -28.155542373657227, "global_step": 610005, "epoch": 7349} {"train_loss": -27.91291618347168, "global_step": 610006, "epoch": 7349} {"train_loss": -28.343158721923828, "global_step": 610007, "epoch": 7349} {"train_loss": -28.07142448425293, "global_step": 610008, "epoch": 7349} {"train_loss": -28.034955978393555, "global_step": 610009, "epoch": 7349} {"train_loss": -28.094242095947266, "global_step": 610010, "epoch": 7349} {"train_loss": -28.181055068969727, "global_step": 610011, "epoch": 7349} {"train_loss": -28.168310165405273, "global_step": 610012, "epoch": 7349} {"train_loss": -28.21811866760254, "global_step": 610013, "epoch": 7349} {"train_loss": -28.2960262298584, "global_step": 610014, "epoch": 7349} {"train_loss": -28.186786651611328, "global_step": 610015, "epoch": 7349} {"train_loss": -28.30155372619629, "global_step": 610016, "epoch": 7349} {"train_loss": -28.217676162719727, "global_step": 610017, "epoch": 7349} {"train_loss": -27.90616798400879, "global_step": 610018, "epoch": 7349} {"train_loss": -28.354782104492188, "global_step": 610019, "epoch": 7349} {"train_loss": -28.5813045501709, "global_step": 610020, "epoch": 7349} {"train_loss": -27.96771240234375, "global_step": 610021, "epoch": 7349} {"train_loss": -28.290485382080078, "global_step": 610022, "epoch": 7349} {"train_loss": -28.2211971282959, "global_step": 610023, "epoch": 7349} {"train_loss": -28.116613388061523, "global_step": 610024, "epoch": 7349} {"train_loss": -28.089529037475586, "global_step": 610025, "epoch": 7349} {"train_loss": -28.431650161743164, "global_step": 610026, "epoch": 7349} {"train_loss": -28.01969337463379, "global_step": 610027, "epoch": 7349} {"train_loss": -28.348724365234375, "global_step": 610028, "epoch": 7349} {"train_loss": -28.0518798828125, "global_step": 610029, "epoch": 7349} {"train_loss": -28.018707275390625, "global_step": 610030, "epoch": 7349} {"train_loss": -28.171606063842773, "global_step": 610031, "epoch": 7349} {"train_loss": -28.205835342407227, "global_step": 610032, "epoch": 7349} {"train_loss": -28.160573959350586, "global_step": 610033, "epoch": 7349} {"train_loss": -27.702362060546875, "global_step": 610034, "epoch": 7349} {"train_loss": -28.3111629486084, "global_step": 610035, "epoch": 7349} {"train_loss": -27.735462188720703, "global_step": 610036, "epoch": 7349} {"train_loss": -28.575063705444336, "global_step": 610037, "epoch": 7349} {"train_loss": -28.17693519592285, "global_step": 610038, "epoch": 7349} {"train_loss": -28.488004684448242, "global_step": 610039, "epoch": 7349} {"train_loss": -27.712671279907227, "global_step": 610040, "epoch": 7349} {"train_loss": -28.462509155273438, "global_step": 610041, "epoch": 7349} {"train_loss": -27.896652221679688, "global_step": 610042, "epoch": 7349} {"train_loss": -28.3941593170166, "global_step": 610043, "epoch": 7349} {"train_loss": -28.146686553955078, "global_step": 610044, "epoch": 7349} {"train_loss": -27.977659225463867, "global_step": 610045, "epoch": 7349} {"train_loss": -27.86591148376465, "global_step": 610046, "epoch": 7349} {"train_loss": -27.916095733642578, "global_step": 610047, "epoch": 7349} {"train_loss": -27.9588565826416, "global_step": 610048, "epoch": 7349} {"train_loss": -27.94353204750153, "global_step": 610049, "epoch": 7349, "val_loss": 6718995.0} {"train_loss": -26.9671573638916, "global_step": 610050, "epoch": 7350} {"train_loss": -27.422138214111328, "global_step": 610051, "epoch": 7350} {"train_loss": -27.02827262878418, "global_step": 610052, "epoch": 7350} {"train_loss": -27.06879997253418, "global_step": 610053, "epoch": 7350} {"train_loss": -27.268310546875, "global_step": 610054, "epoch": 7350} {"train_loss": -27.39063835144043, "global_step": 610055, "epoch": 7350} {"train_loss": -27.786630630493164, "global_step": 610056, "epoch": 7350} {"train_loss": -27.515213012695312, "global_step": 610057, "epoch": 7350} {"train_loss": -28.10097312927246, "global_step": 610058, "epoch": 7350} {"train_loss": -27.63140296936035, "global_step": 610059, "epoch": 7350} {"train_loss": -27.742639541625977, "global_step": 610060, "epoch": 7350} {"train_loss": -27.466306686401367, "global_step": 610061, "epoch": 7350} {"train_loss": -27.724075317382812, "global_step": 610062, "epoch": 7350} {"train_loss": -27.534534454345703, "global_step": 610063, "epoch": 7350} {"train_loss": -27.806116104125977, "global_step": 610064, "epoch": 7350} {"train_loss": -27.57649040222168, "global_step": 610065, "epoch": 7350} {"train_loss": -27.931318283081055, "global_step": 610066, "epoch": 7350} {"train_loss": -28.017541885375977, "global_step": 610067, "epoch": 7350} {"train_loss": -27.822736740112305, "global_step": 610068, "epoch": 7350} {"train_loss": -27.711181640625, "global_step": 610069, "epoch": 7350} {"train_loss": -28.458011627197266, "global_step": 610070, "epoch": 7350} {"train_loss": -28.43366050720215, "global_step": 610071, "epoch": 7350} {"train_loss": -28.083093643188477, "global_step": 610072, "epoch": 7350} {"train_loss": -28.07674217224121, "global_step": 610073, "epoch": 7350} {"train_loss": -27.88309669494629, "global_step": 610074, "epoch": 7350} {"train_loss": -28.068073272705078, "global_step": 610075, "epoch": 7350} {"train_loss": -28.018468856811523, "global_step": 610076, "epoch": 7350} {"train_loss": -27.997289657592773, "global_step": 610077, "epoch": 7350} {"train_loss": -28.216400146484375, "global_step": 610078, "epoch": 7350} {"train_loss": -28.224470138549805, "global_step": 610079, "epoch": 7350} {"train_loss": -28.000219345092773, "global_step": 610080, "epoch": 7350} {"train_loss": -28.1590576171875, "global_step": 610081, "epoch": 7350} {"train_loss": -28.23006248474121, "global_step": 610082, "epoch": 7350} {"train_loss": -28.08723258972168, "global_step": 610083, "epoch": 7350} {"train_loss": -27.776779174804688, "global_step": 610084, "epoch": 7350} {"train_loss": -27.990575790405273, "global_step": 610085, "epoch": 7350} {"train_loss": -28.18668556213379, "global_step": 610086, "epoch": 7350} {"train_loss": -28.222570419311523, "global_step": 610087, "epoch": 7350} {"train_loss": -28.0827693939209, "global_step": 610088, "epoch": 7350} {"train_loss": -28.076078414916992, "global_step": 610089, "epoch": 7350} {"train_loss": -28.431344985961914, "global_step": 610090, "epoch": 7350} {"train_loss": -27.927265167236328, "global_step": 610091, "epoch": 7350} {"train_loss": -28.397632598876953, "global_step": 610092, "epoch": 7350} {"train_loss": -27.96993064880371, "global_step": 610093, "epoch": 7350} {"train_loss": -28.2309513092041, "global_step": 610094, "epoch": 7350} {"train_loss": -28.318151473999023, "global_step": 610095, "epoch": 7350} {"train_loss": -28.401824951171875, "global_step": 610096, "epoch": 7350} {"train_loss": -27.957839965820312, "global_step": 610097, "epoch": 7350} {"train_loss": -27.91180419921875, "global_step": 610098, "epoch": 7350} {"train_loss": -27.872760772705078, "global_step": 610099, "epoch": 7350} {"train_loss": -28.185413360595703, "global_step": 610100, "epoch": 7350} {"train_loss": -28.675146102905273, "global_step": 610101, "epoch": 7350} {"train_loss": -27.78192138671875, "global_step": 610102, "epoch": 7350} {"train_loss": -28.376861572265625, "global_step": 610103, "epoch": 7350} {"train_loss": -28.239215850830078, "global_step": 610104, "epoch": 7350} {"train_loss": -28.002622604370117, "global_step": 610105, "epoch": 7350} {"train_loss": -28.246320724487305, "global_step": 610106, "epoch": 7350} {"train_loss": -28.170942306518555, "global_step": 610107, "epoch": 7350} {"train_loss": -28.321380615234375, "global_step": 610108, "epoch": 7350} {"train_loss": -27.922687530517578, "global_step": 610109, "epoch": 7350} {"train_loss": -28.138410568237305, "global_step": 610110, "epoch": 7350} {"train_loss": -28.220691680908203, "global_step": 610111, "epoch": 7350} {"train_loss": -28.236936569213867, "global_step": 610112, "epoch": 7350} {"train_loss": -28.079557418823242, "global_step": 610113, "epoch": 7350} {"train_loss": -28.287397384643555, "global_step": 610114, "epoch": 7350} {"train_loss": -28.303253173828125, "global_step": 610115, "epoch": 7350} {"train_loss": -28.256006240844727, "global_step": 610116, "epoch": 7350} {"train_loss": -28.126874923706055, "global_step": 610117, "epoch": 7350} {"train_loss": -28.5196590423584, "global_step": 610118, "epoch": 7350} {"train_loss": -28.321807861328125, "global_step": 610119, "epoch": 7350} {"train_loss": -28.307769775390625, "global_step": 610120, "epoch": 7350} {"train_loss": -28.329273223876953, "global_step": 610121, "epoch": 7350} {"train_loss": -28.070371627807617, "global_step": 610122, "epoch": 7350} {"train_loss": -28.008529663085938, "global_step": 610123, "epoch": 7350} {"train_loss": -28.30441665649414, "global_step": 610124, "epoch": 7350} {"train_loss": -28.213659286499023, "global_step": 610125, "epoch": 7350} {"train_loss": -28.220352172851562, "global_step": 610126, "epoch": 7350} {"train_loss": -28.640501022338867, "global_step": 610127, "epoch": 7350} {"train_loss": -28.48616600036621, "global_step": 610128, "epoch": 7350} {"train_loss": -28.416107177734375, "global_step": 610129, "epoch": 7350} {"train_loss": -28.075000762939453, "global_step": 610130, "epoch": 7350} {"train_loss": -28.11044692993164, "global_step": 610131, "epoch": 7350} {"train_loss": -28.038792024175805, "global_step": 610132, "epoch": 7350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 6636459.5} {"train_loss": -27.579389572143555, "global_step": 610133, "epoch": 7351} {"train_loss": -27.25648307800293, "global_step": 610134, "epoch": 7351} {"train_loss": -27.911924362182617, "global_step": 610135, "epoch": 7351} {"train_loss": -27.9692440032959, "global_step": 610136, "epoch": 7351} {"train_loss": -27.353437423706055, "global_step": 610137, "epoch": 7351} {"train_loss": -27.344274520874023, "global_step": 610138, "epoch": 7351} {"train_loss": -27.329776763916016, "global_step": 610139, "epoch": 7351} {"train_loss": -27.78592300415039, "global_step": 610140, "epoch": 7351} {"train_loss": -27.24220085144043, "global_step": 610141, "epoch": 7351} {"train_loss": -27.748645782470703, "global_step": 610142, "epoch": 7351} {"train_loss": -27.631879806518555, "global_step": 610143, "epoch": 7351} {"train_loss": -27.515546798706055, "global_step": 610144, "epoch": 7351} {"train_loss": -27.49995231628418, "global_step": 610145, "epoch": 7351} {"train_loss": -27.53449058532715, "global_step": 610146, "epoch": 7351} {"train_loss": -27.795013427734375, "global_step": 610147, "epoch": 7351} {"train_loss": -27.757373809814453, "global_step": 610148, "epoch": 7351} {"train_loss": -28.162769317626953, "global_step": 610149, "epoch": 7351} {"train_loss": -27.51869773864746, "global_step": 610150, "epoch": 7351} {"train_loss": -27.2587947845459, "global_step": 610151, "epoch": 7351} {"train_loss": -27.5845947265625, "global_step": 610152, "epoch": 7351} {"train_loss": -27.427356719970703, "global_step": 610153, "epoch": 7351} {"train_loss": -27.909442901611328, "global_step": 610154, "epoch": 7351} {"train_loss": -27.618261337280273, "global_step": 610155, "epoch": 7351} {"train_loss": -27.748138427734375, "global_step": 610156, "epoch": 7351} {"train_loss": -27.568540573120117, "global_step": 610157, "epoch": 7351} {"train_loss": -27.77250099182129, "global_step": 610158, "epoch": 7351} {"train_loss": -27.908599853515625, "global_step": 610159, "epoch": 7351} {"train_loss": -28.038471221923828, "global_step": 610160, "epoch": 7351} {"train_loss": -27.539648056030273, "global_step": 610161, "epoch": 7351} {"train_loss": -28.219518661499023, "global_step": 610162, "epoch": 7351} {"train_loss": -27.83595085144043, "global_step": 610163, "epoch": 7351} {"train_loss": -27.99183464050293, "global_step": 610164, "epoch": 7351} {"train_loss": -28.245206832885742, "global_step": 610165, "epoch": 7351} {"train_loss": -28.38816261291504, "global_step": 610166, "epoch": 7351} {"train_loss": -27.916086196899414, "global_step": 610167, "epoch": 7351} {"train_loss": -27.933507919311523, "global_step": 610168, "epoch": 7351} {"train_loss": -28.025548934936523, "global_step": 610169, "epoch": 7351} {"train_loss": -28.0122127532959, "global_step": 610170, "epoch": 7351} {"train_loss": -27.755207061767578, "global_step": 610171, "epoch": 7351} {"train_loss": -27.824934005737305, "global_step": 610172, "epoch": 7351} {"train_loss": -28.183515548706055, "global_step": 610173, "epoch": 7351} {"train_loss": -28.12213706970215, "global_step": 610174, "epoch": 7351} {"train_loss": -27.953601837158203, "global_step": 610175, "epoch": 7351} {"train_loss": -28.13504409790039, "global_step": 610176, "epoch": 7351} {"train_loss": -28.15369987487793, "global_step": 610177, "epoch": 7351} {"train_loss": -27.97028160095215, "global_step": 610178, "epoch": 7351} {"train_loss": -28.341779708862305, "global_step": 610179, "epoch": 7351} {"train_loss": -27.994047164916992, "global_step": 610180, "epoch": 7351} {"train_loss": -28.094165802001953, "global_step": 610181, "epoch": 7351} {"train_loss": -28.35392189025879, "global_step": 610182, "epoch": 7351} {"train_loss": -28.32211685180664, "global_step": 610183, "epoch": 7351} {"train_loss": -28.290908813476562, "global_step": 610184, "epoch": 7351} {"train_loss": -28.10041618347168, "global_step": 610185, "epoch": 7351} {"train_loss": -28.14251136779785, "global_step": 610186, "epoch": 7351} {"train_loss": -28.107648849487305, "global_step": 610187, "epoch": 7351} {"train_loss": -27.98868751525879, "global_step": 610188, "epoch": 7351} {"train_loss": -28.3652400970459, "global_step": 610189, "epoch": 7351} {"train_loss": -28.171621322631836, "global_step": 610190, "epoch": 7351} {"train_loss": -28.13114356994629, "global_step": 610191, "epoch": 7351} {"train_loss": -28.288970947265625, "global_step": 610192, "epoch": 7351} {"train_loss": -28.03973960876465, "global_step": 610193, "epoch": 7351} {"train_loss": -28.42592430114746, "global_step": 610194, "epoch": 7351} {"train_loss": -28.332294464111328, "global_step": 610195, "epoch": 7351} {"train_loss": -28.078174591064453, "global_step": 610196, "epoch": 7351} {"train_loss": -28.374670028686523, "global_step": 610197, "epoch": 7351} {"train_loss": -27.817556381225586, "global_step": 610198, "epoch": 7351} {"train_loss": -28.159067153930664, "global_step": 610199, "epoch": 7351} {"train_loss": -27.988874435424805, "global_step": 610200, "epoch": 7351} {"train_loss": -28.31694984436035, "global_step": 610201, "epoch": 7351} {"train_loss": -27.818777084350586, "global_step": 610202, "epoch": 7351} {"train_loss": -27.986230850219727, "global_step": 610203, "epoch": 7351} {"train_loss": -28.311904907226562, "global_step": 610204, "epoch": 7351} {"train_loss": -27.718976974487305, "global_step": 610205, "epoch": 7351} {"train_loss": -28.2119083404541, "global_step": 610206, "epoch": 7351} {"train_loss": -28.144866943359375, "global_step": 610207, "epoch": 7351} {"train_loss": -28.49560546875, "global_step": 610208, "epoch": 7351} {"train_loss": -28.20456314086914, "global_step": 610209, "epoch": 7351} {"train_loss": -28.49883460998535, "global_step": 610210, "epoch": 7351} {"train_loss": -28.41046714782715, "global_step": 610211, "epoch": 7351} {"train_loss": -27.85283851623535, "global_step": 610212, "epoch": 7351} {"train_loss": -27.807708740234375, "global_step": 610213, "epoch": 7351} {"train_loss": -28.07343864440918, "global_step": 610214, "epoch": 7351} {"train_loss": -27.951113436595502, "global_step": 610215, "epoch": 7351, "val_loss": 6603539.0} {"train_loss": -28.049793243408203, "global_step": 610216, "epoch": 7352} {"train_loss": -27.093994140625, "global_step": 610217, "epoch": 7352} {"train_loss": -26.7388916015625, "global_step": 610218, "epoch": 7352} {"train_loss": -26.724599838256836, "global_step": 610219, "epoch": 7352} {"train_loss": -27.743438720703125, "global_step": 610220, "epoch": 7352} {"train_loss": -27.949819564819336, "global_step": 610221, "epoch": 7352} {"train_loss": -27.878711700439453, "global_step": 610222, "epoch": 7352} {"train_loss": -27.023834228515625, "global_step": 610223, "epoch": 7352} {"train_loss": -27.52516746520996, "global_step": 610224, "epoch": 7352} {"train_loss": -27.705808639526367, "global_step": 610225, "epoch": 7352} {"train_loss": -27.50189208984375, "global_step": 610226, "epoch": 7352} {"train_loss": -27.87556266784668, "global_step": 610227, "epoch": 7352} {"train_loss": -27.436933517456055, "global_step": 610228, "epoch": 7352} {"train_loss": -27.75689125061035, "global_step": 610229, "epoch": 7352} {"train_loss": -27.74627685546875, "global_step": 610230, "epoch": 7352} {"train_loss": -27.89004898071289, "global_step": 610231, "epoch": 7352} {"train_loss": -27.99945640563965, "global_step": 610232, "epoch": 7352} {"train_loss": -27.562002182006836, "global_step": 610233, "epoch": 7352} {"train_loss": -28.004154205322266, "global_step": 610234, "epoch": 7352} {"train_loss": -28.083478927612305, "global_step": 610235, "epoch": 7352} {"train_loss": -27.535404205322266, "global_step": 610236, "epoch": 7352} {"train_loss": -27.801843643188477, "global_step": 610237, "epoch": 7352} {"train_loss": -27.921857833862305, "global_step": 610238, "epoch": 7352} {"train_loss": -27.97688102722168, "global_step": 610239, "epoch": 7352} {"train_loss": -28.182071685791016, "global_step": 610240, "epoch": 7352} {"train_loss": -27.988706588745117, "global_step": 610241, "epoch": 7352} {"train_loss": -27.8596248626709, "global_step": 610242, "epoch": 7352} {"train_loss": -27.891326904296875, "global_step": 610243, "epoch": 7352} {"train_loss": -27.888996124267578, "global_step": 610244, "epoch": 7352} {"train_loss": -27.932050704956055, "global_step": 610245, "epoch": 7352} {"train_loss": -27.88264274597168, "global_step": 610246, "epoch": 7352} {"train_loss": -27.981433868408203, "global_step": 610247, "epoch": 7352} {"train_loss": -27.946348190307617, "global_step": 610248, "epoch": 7352} {"train_loss": -28.033178329467773, "global_step": 610249, "epoch": 7352} {"train_loss": -28.312335968017578, "global_step": 610250, "epoch": 7352} {"train_loss": -28.3255558013916, "global_step": 610251, "epoch": 7352} {"train_loss": -27.87534523010254, "global_step": 610252, "epoch": 7352} {"train_loss": -28.0267391204834, "global_step": 610253, "epoch": 7352} {"train_loss": -28.13934898376465, "global_step": 610254, "epoch": 7352} {"train_loss": -28.14503288269043, "global_step": 610255, "epoch": 7352} {"train_loss": -28.43787956237793, "global_step": 610256, "epoch": 7352} {"train_loss": -28.218616485595703, "global_step": 610257, "epoch": 7352} {"train_loss": -27.829809188842773, "global_step": 610258, "epoch": 7352} {"train_loss": -27.79205322265625, "global_step": 610259, "epoch": 7352} {"train_loss": -27.842498779296875, "global_step": 610260, "epoch": 7352} {"train_loss": -27.77777099609375, "global_step": 610261, "epoch": 7352} {"train_loss": -27.163604736328125, "global_step": 610262, "epoch": 7352} {"train_loss": -27.846960067749023, "global_step": 610263, "epoch": 7352} {"train_loss": -28.061208724975586, "global_step": 610264, "epoch": 7352} {"train_loss": -27.916187286376953, "global_step": 610265, "epoch": 7352} {"train_loss": -27.965909957885742, "global_step": 610266, "epoch": 7352} {"train_loss": -28.2543888092041, "global_step": 610267, "epoch": 7352} {"train_loss": -27.82502555847168, "global_step": 610268, "epoch": 7352} {"train_loss": -28.134546279907227, "global_step": 610269, "epoch": 7352} {"train_loss": -27.863901138305664, "global_step": 610270, "epoch": 7352} {"train_loss": -28.381437301635742, "global_step": 610271, "epoch": 7352} {"train_loss": -27.628894805908203, "global_step": 610272, "epoch": 7352} {"train_loss": -27.66269302368164, "global_step": 610273, "epoch": 7352} {"train_loss": -28.249114990234375, "global_step": 610274, "epoch": 7352} {"train_loss": -28.051740646362305, "global_step": 610275, "epoch": 7352} {"train_loss": -27.893421173095703, "global_step": 610276, "epoch": 7352} {"train_loss": -27.837329864501953, "global_step": 610277, "epoch": 7352} {"train_loss": -27.952924728393555, "global_step": 610278, "epoch": 7352} {"train_loss": -27.892507553100586, "global_step": 610279, "epoch": 7352} {"train_loss": -28.108469009399414, "global_step": 610280, "epoch": 7352} {"train_loss": -28.7113037109375, "global_step": 610281, "epoch": 7352} {"train_loss": -27.8253231048584, "global_step": 610282, "epoch": 7352} {"train_loss": -28.110004425048828, "global_step": 610283, "epoch": 7352} {"train_loss": -27.803913116455078, "global_step": 610284, "epoch": 7352} {"train_loss": -27.54277992248535, "global_step": 610285, "epoch": 7352} {"train_loss": -28.275466918945312, "global_step": 610286, "epoch": 7352} {"train_loss": -27.89143180847168, "global_step": 610287, "epoch": 7352} {"train_loss": -28.195653915405273, "global_step": 610288, "epoch": 7352} {"train_loss": -28.274389266967773, "global_step": 610289, "epoch": 7352} {"train_loss": -28.2205753326416, "global_step": 610290, "epoch": 7352} {"train_loss": -28.043298721313477, "global_step": 610291, "epoch": 7352} {"train_loss": -28.119394302368164, "global_step": 610292, "epoch": 7352} {"train_loss": -27.689550399780273, "global_step": 610293, "epoch": 7352} {"train_loss": -27.87562370300293, "global_step": 610294, "epoch": 7352} {"train_loss": -28.341720581054688, "global_step": 610295, "epoch": 7352} {"train_loss": -27.941059112548828, "global_step": 610296, "epoch": 7352} {"train_loss": -28.411544799804688, "global_step": 610297, "epoch": 7352} {"train_loss": -27.899561663708056, "global_step": 610298, "epoch": 7352, "val_loss": 6708133.0} {"train_loss": -27.455915451049805, "global_step": 610299, "epoch": 7353} {"train_loss": -27.13727378845215, "global_step": 610300, "epoch": 7353} {"train_loss": -27.040525436401367, "global_step": 610301, "epoch": 7353} {"train_loss": -27.179601669311523, "global_step": 610302, "epoch": 7353} {"train_loss": -26.95399284362793, "global_step": 610303, "epoch": 7353} {"train_loss": -27.492919921875, "global_step": 610304, "epoch": 7353} {"train_loss": -27.62957191467285, "global_step": 610305, "epoch": 7353} {"train_loss": -27.564252853393555, "global_step": 610306, "epoch": 7353} {"train_loss": -27.571044921875, "global_step": 610307, "epoch": 7353} {"train_loss": -27.27454948425293, "global_step": 610308, "epoch": 7353} {"train_loss": -27.47696304321289, "global_step": 610309, "epoch": 7353} {"train_loss": -27.64948844909668, "global_step": 610310, "epoch": 7353} {"train_loss": -27.432220458984375, "global_step": 610311, "epoch": 7353} {"train_loss": -27.311323165893555, "global_step": 610312, "epoch": 7353} {"train_loss": -27.745452880859375, "global_step": 610313, "epoch": 7353} {"train_loss": -27.911767959594727, "global_step": 610314, "epoch": 7353} {"train_loss": -27.26423454284668, "global_step": 610315, "epoch": 7353} {"train_loss": -27.30451011657715, "global_step": 610316, "epoch": 7353} {"train_loss": -27.585973739624023, "global_step": 610317, "epoch": 7353} {"train_loss": -27.63936424255371, "global_step": 610318, "epoch": 7353} {"train_loss": -27.4654483795166, "global_step": 610319, "epoch": 7353} {"train_loss": -27.24676513671875, "global_step": 610320, "epoch": 7353} {"train_loss": -28.078092575073242, "global_step": 610321, "epoch": 7353} {"train_loss": -27.45147705078125, "global_step": 610322, "epoch": 7353} {"train_loss": -27.597305297851562, "global_step": 610323, "epoch": 7353} {"train_loss": -27.49899673461914, "global_step": 610324, "epoch": 7353} {"train_loss": -27.636816024780273, "global_step": 610325, "epoch": 7353} {"train_loss": -27.98264503479004, "global_step": 610326, "epoch": 7353} {"train_loss": -27.837976455688477, "global_step": 610327, "epoch": 7353} {"train_loss": -28.12912940979004, "global_step": 610328, "epoch": 7353} {"train_loss": -27.974578857421875, "global_step": 610329, "epoch": 7353} {"train_loss": -27.960546493530273, "global_step": 610330, "epoch": 7353} {"train_loss": -28.504928588867188, "global_step": 610331, "epoch": 7353} {"train_loss": -28.24139404296875, "global_step": 610332, "epoch": 7353} {"train_loss": -27.63678550720215, "global_step": 610333, "epoch": 7353} {"train_loss": -27.731586456298828, "global_step": 610334, "epoch": 7353} {"train_loss": -28.1027889251709, "global_step": 610335, "epoch": 7353} {"train_loss": -28.041593551635742, "global_step": 610336, "epoch": 7353} {"train_loss": -28.082422256469727, "global_step": 610337, "epoch": 7353} {"train_loss": -27.966888427734375, "global_step": 610338, "epoch": 7353} {"train_loss": -28.192941665649414, "global_step": 610339, "epoch": 7353} {"train_loss": -28.3743953704834, "global_step": 610340, "epoch": 7353} {"train_loss": -28.0963191986084, "global_step": 610341, "epoch": 7353} {"train_loss": -28.248565673828125, "global_step": 610342, "epoch": 7353} {"train_loss": -27.951642990112305, "global_step": 610343, "epoch": 7353} {"train_loss": -28.06368064880371, "global_step": 610344, "epoch": 7353} {"train_loss": -28.148916244506836, "global_step": 610345, "epoch": 7353} {"train_loss": -28.15644645690918, "global_step": 610346, "epoch": 7353} {"train_loss": -28.5820369720459, "global_step": 610347, "epoch": 7353} {"train_loss": -28.12034034729004, "global_step": 610348, "epoch": 7353} {"train_loss": -28.376142501831055, "global_step": 610349, "epoch": 7353} {"train_loss": -27.99169921875, "global_step": 610350, "epoch": 7353} {"train_loss": -28.64261245727539, "global_step": 610351, "epoch": 7353} {"train_loss": -28.193740844726562, "global_step": 610352, "epoch": 7353} {"train_loss": -28.389448165893555, "global_step": 610353, "epoch": 7353} {"train_loss": -28.201034545898438, "global_step": 610354, "epoch": 7353} {"train_loss": -28.21466064453125, "global_step": 610355, "epoch": 7353} {"train_loss": -28.580921173095703, "global_step": 610356, "epoch": 7353} {"train_loss": -28.346420288085938, "global_step": 610357, "epoch": 7353} {"train_loss": -28.1376895904541, "global_step": 610358, "epoch": 7353} {"train_loss": -28.517072677612305, "global_step": 610359, "epoch": 7353} {"train_loss": -28.19891929626465, "global_step": 610360, "epoch": 7353} {"train_loss": -28.135425567626953, "global_step": 610361, "epoch": 7353} {"train_loss": -27.791431427001953, "global_step": 610362, "epoch": 7353} {"train_loss": -28.17331886291504, "global_step": 610363, "epoch": 7353} {"train_loss": -28.226354598999023, "global_step": 610364, "epoch": 7353} {"train_loss": -28.2974796295166, "global_step": 610365, "epoch": 7353} {"train_loss": -28.142318725585938, "global_step": 610366, "epoch": 7353} {"train_loss": -28.14520835876465, "global_step": 610367, "epoch": 7353} {"train_loss": -28.3293399810791, "global_step": 610368, "epoch": 7353} {"train_loss": -28.352649688720703, "global_step": 610369, "epoch": 7353} {"train_loss": -28.193866729736328, "global_step": 610370, "epoch": 7353} {"train_loss": -27.689924240112305, "global_step": 610371, "epoch": 7353} {"train_loss": -27.601972579956055, "global_step": 610372, "epoch": 7353} {"train_loss": -27.283689498901367, "global_step": 610373, "epoch": 7353} {"train_loss": -26.625219345092773, "global_step": 610374, "epoch": 7353} {"train_loss": -26.413318634033203, "global_step": 610375, "epoch": 7353} {"train_loss": -27.646453857421875, "global_step": 610376, "epoch": 7353} {"train_loss": -27.7652645111084, "global_step": 610377, "epoch": 7353} {"train_loss": -27.613357543945312, "global_step": 610378, "epoch": 7353} {"train_loss": -27.852874755859375, "global_step": 610379, "epoch": 7353} {"train_loss": -27.509662628173828, "global_step": 610380, "epoch": 7353} {"train_loss": -27.831413498844007, "global_step": 610381, "epoch": 7353, "val_loss": 6605671.0} {"train_loss": -27.26410484313965, "global_step": 610382, "epoch": 7354} {"train_loss": -27.555200576782227, "global_step": 610383, "epoch": 7354} {"train_loss": -27.411991119384766, "global_step": 610384, "epoch": 7354} {"train_loss": -26.95997428894043, "global_step": 610385, "epoch": 7354} {"train_loss": -26.648813247680664, "global_step": 610386, "epoch": 7354} {"train_loss": -26.838773727416992, "global_step": 610387, "epoch": 7354} {"train_loss": -27.65789222717285, "global_step": 610388, "epoch": 7354} {"train_loss": -27.4237117767334, "global_step": 610389, "epoch": 7354} {"train_loss": -27.894458770751953, "global_step": 610390, "epoch": 7354} {"train_loss": -27.566608428955078, "global_step": 610391, "epoch": 7354} {"train_loss": -27.2012939453125, "global_step": 610392, "epoch": 7354} {"train_loss": -27.109975814819336, "global_step": 610393, "epoch": 7354} {"train_loss": -27.90431022644043, "global_step": 610394, "epoch": 7354} {"train_loss": -27.290014266967773, "global_step": 610395, "epoch": 7354} {"train_loss": -28.176794052124023, "global_step": 610396, "epoch": 7354} {"train_loss": -27.525054931640625, "global_step": 610397, "epoch": 7354} {"train_loss": -27.683258056640625, "global_step": 610398, "epoch": 7354} {"train_loss": -27.92877769470215, "global_step": 610399, "epoch": 7354} {"train_loss": -27.753503799438477, "global_step": 610400, "epoch": 7354} {"train_loss": -27.578516006469727, "global_step": 610401, "epoch": 7354} {"train_loss": -28.3559627532959, "global_step": 610402, "epoch": 7354} {"train_loss": -27.641775131225586, "global_step": 610403, "epoch": 7354} {"train_loss": -28.06146240234375, "global_step": 610404, "epoch": 7354} {"train_loss": -27.98663330078125, "global_step": 610405, "epoch": 7354} {"train_loss": -27.738813400268555, "global_step": 610406, "epoch": 7354} {"train_loss": -28.184919357299805, "global_step": 610407, "epoch": 7354} {"train_loss": -28.112951278686523, "global_step": 610408, "epoch": 7354} {"train_loss": -28.191268920898438, "global_step": 610409, "epoch": 7354} {"train_loss": -27.79172134399414, "global_step": 610410, "epoch": 7354} {"train_loss": -28.0479736328125, "global_step": 610411, "epoch": 7354} {"train_loss": -28.04103660583496, "global_step": 610412, "epoch": 7354} {"train_loss": -27.936208724975586, "global_step": 610413, "epoch": 7354} {"train_loss": -28.23646354675293, "global_step": 610414, "epoch": 7354} {"train_loss": -28.1502742767334, "global_step": 610415, "epoch": 7354} {"train_loss": -28.510473251342773, "global_step": 610416, "epoch": 7354} {"train_loss": -28.234216690063477, "global_step": 610417, "epoch": 7354} {"train_loss": -28.321996688842773, "global_step": 610418, "epoch": 7354} {"train_loss": -27.98638343811035, "global_step": 610419, "epoch": 7354} {"train_loss": -28.33088493347168, "global_step": 610420, "epoch": 7354} {"train_loss": -28.153934478759766, "global_step": 610421, "epoch": 7354} {"train_loss": -28.437381744384766, "global_step": 610422, "epoch": 7354} {"train_loss": -28.15064811706543, "global_step": 610423, "epoch": 7354} {"train_loss": -28.28181266784668, "global_step": 610424, "epoch": 7354} {"train_loss": -28.10646629333496, "global_step": 610425, "epoch": 7354} {"train_loss": -27.892377853393555, "global_step": 610426, "epoch": 7354} {"train_loss": -28.307531356811523, "global_step": 610427, "epoch": 7354} {"train_loss": -27.8861141204834, "global_step": 610428, "epoch": 7354} {"train_loss": -28.0953426361084, "global_step": 610429, "epoch": 7354} {"train_loss": -28.06447410583496, "global_step": 610430, "epoch": 7354} {"train_loss": -28.239797592163086, "global_step": 610431, "epoch": 7354} {"train_loss": -27.76717185974121, "global_step": 610432, "epoch": 7354} {"train_loss": -28.44683265686035, "global_step": 610433, "epoch": 7354} {"train_loss": -28.013547897338867, "global_step": 610434, "epoch": 7354} {"train_loss": -28.206058502197266, "global_step": 610435, "epoch": 7354} {"train_loss": -28.03957176208496, "global_step": 610436, "epoch": 7354} {"train_loss": -28.171722412109375, "global_step": 610437, "epoch": 7354} {"train_loss": -28.239795684814453, "global_step": 610438, "epoch": 7354} {"train_loss": -27.660160064697266, "global_step": 610439, "epoch": 7354} {"train_loss": -27.933475494384766, "global_step": 610440, "epoch": 7354} {"train_loss": -27.80097770690918, "global_step": 610441, "epoch": 7354} {"train_loss": -28.0535945892334, "global_step": 610442, "epoch": 7354} {"train_loss": -28.272480010986328, "global_step": 610443, "epoch": 7354} {"train_loss": -27.982513427734375, "global_step": 610444, "epoch": 7354} {"train_loss": -28.084442138671875, "global_step": 610445, "epoch": 7354} {"train_loss": -28.412561416625977, "global_step": 610446, "epoch": 7354} {"train_loss": -28.0830020904541, "global_step": 610447, "epoch": 7354} {"train_loss": -27.881153106689453, "global_step": 610448, "epoch": 7354} {"train_loss": -28.262516021728516, "global_step": 610449, "epoch": 7354} {"train_loss": -28.059650421142578, "global_step": 610450, "epoch": 7354} {"train_loss": -28.233488082885742, "global_step": 610451, "epoch": 7354} {"train_loss": -28.13181495666504, "global_step": 610452, "epoch": 7354} {"train_loss": -28.359121322631836, "global_step": 610453, "epoch": 7354} {"train_loss": -28.27973747253418, "global_step": 610454, "epoch": 7354} {"train_loss": -28.398523330688477, "global_step": 610455, "epoch": 7354} {"train_loss": -28.424314498901367, "global_step": 610456, "epoch": 7354} {"train_loss": -27.939285278320312, "global_step": 610457, "epoch": 7354} {"train_loss": -28.11569595336914, "global_step": 610458, "epoch": 7354} {"train_loss": -28.428302764892578, "global_step": 610459, "epoch": 7354} {"train_loss": -27.937824249267578, "global_step": 610460, "epoch": 7354} {"train_loss": -28.032800674438477, "global_step": 610461, "epoch": 7354} {"train_loss": -27.830657958984375, "global_step": 610462, "epoch": 7354} {"train_loss": -28.057952880859375, "global_step": 610463, "epoch": 7354} {"train_loss": -27.947076291923064, "global_step": 610464, "epoch": 7354, "val_loss": 6673362.0} {"train_loss": -27.745075225830078, "global_step": 610465, "epoch": 7355} {"train_loss": -27.2210636138916, "global_step": 610466, "epoch": 7355} {"train_loss": -26.6270809173584, "global_step": 610467, "epoch": 7355} {"train_loss": -26.93474769592285, "global_step": 610468, "epoch": 7355} {"train_loss": -27.285192489624023, "global_step": 610469, "epoch": 7355} {"train_loss": -27.2710018157959, "global_step": 610470, "epoch": 7355} {"train_loss": -27.44721031188965, "global_step": 610471, "epoch": 7355} {"train_loss": -27.752197265625, "global_step": 610472, "epoch": 7355} {"train_loss": -27.412860870361328, "global_step": 610473, "epoch": 7355} {"train_loss": -27.4255428314209, "global_step": 610474, "epoch": 7355} {"train_loss": -27.7600040435791, "global_step": 610475, "epoch": 7355} {"train_loss": -28.043161392211914, "global_step": 610476, "epoch": 7355} {"train_loss": -27.811634063720703, "global_step": 610477, "epoch": 7355} {"train_loss": -27.80170249938965, "global_step": 610478, "epoch": 7355} {"train_loss": -27.92457389831543, "global_step": 610479, "epoch": 7355} {"train_loss": -27.830551147460938, "global_step": 610480, "epoch": 7355} {"train_loss": -27.661056518554688, "global_step": 610481, "epoch": 7355} {"train_loss": -27.997480392456055, "global_step": 610482, "epoch": 7355} {"train_loss": -27.88641357421875, "global_step": 610483, "epoch": 7355} {"train_loss": -28.117095947265625, "global_step": 610484, "epoch": 7355} {"train_loss": -27.966938018798828, "global_step": 610485, "epoch": 7355} {"train_loss": -28.027679443359375, "global_step": 610486, "epoch": 7355} {"train_loss": -27.729429244995117, "global_step": 610487, "epoch": 7355} {"train_loss": -27.659345626831055, "global_step": 610488, "epoch": 7355} {"train_loss": -27.849645614624023, "global_step": 610489, "epoch": 7355} {"train_loss": -28.202192306518555, "global_step": 610490, "epoch": 7355} {"train_loss": -27.79741859436035, "global_step": 610491, "epoch": 7355} {"train_loss": -28.238550186157227, "global_step": 610492, "epoch": 7355} {"train_loss": -28.05609130859375, "global_step": 610493, "epoch": 7355} {"train_loss": -27.961130142211914, "global_step": 610494, "epoch": 7355} {"train_loss": -28.089019775390625, "global_step": 610495, "epoch": 7355} {"train_loss": -27.831247329711914, "global_step": 610496, "epoch": 7355} {"train_loss": -28.196264266967773, "global_step": 610497, "epoch": 7355} {"train_loss": -27.85146141052246, "global_step": 610498, "epoch": 7355} {"train_loss": -28.096906661987305, "global_step": 610499, "epoch": 7355} {"train_loss": -27.958332061767578, "global_step": 610500, "epoch": 7355} {"train_loss": -28.271869659423828, "global_step": 610501, "epoch": 7355} {"train_loss": -27.98111915588379, "global_step": 610502, "epoch": 7355} {"train_loss": -27.926916122436523, "global_step": 610503, "epoch": 7355} {"train_loss": -27.660907745361328, "global_step": 610504, "epoch": 7355} {"train_loss": -28.091333389282227, "global_step": 610505, "epoch": 7355} {"train_loss": -27.99591636657715, "global_step": 610506, "epoch": 7355} {"train_loss": -28.336078643798828, "global_step": 610507, "epoch": 7355} {"train_loss": -27.81500244140625, "global_step": 610508, "epoch": 7355} {"train_loss": -27.983564376831055, "global_step": 610509, "epoch": 7355} {"train_loss": -28.417951583862305, "global_step": 610510, "epoch": 7355} {"train_loss": -27.939105987548828, "global_step": 610511, "epoch": 7355} {"train_loss": -27.862634658813477, "global_step": 610512, "epoch": 7355} {"train_loss": -28.059955596923828, "global_step": 610513, "epoch": 7355} {"train_loss": -27.425817489624023, "global_step": 610514, "epoch": 7355} {"train_loss": -27.74505615234375, "global_step": 610515, "epoch": 7355} {"train_loss": -27.78272819519043, "global_step": 610516, "epoch": 7355} {"train_loss": -27.895750045776367, "global_step": 610517, "epoch": 7355} {"train_loss": -28.208209991455078, "global_step": 610518, "epoch": 7355} {"train_loss": -27.9166202545166, "global_step": 610519, "epoch": 7355} {"train_loss": -28.14569091796875, "global_step": 610520, "epoch": 7355} {"train_loss": -28.104089736938477, "global_step": 610521, "epoch": 7355} {"train_loss": -28.0606746673584, "global_step": 610522, "epoch": 7355} {"train_loss": -28.254058837890625, "global_step": 610523, "epoch": 7355} {"train_loss": -28.10639762878418, "global_step": 610524, "epoch": 7355} {"train_loss": -27.9873104095459, "global_step": 610525, "epoch": 7355} {"train_loss": -28.8670654296875, "global_step": 610526, "epoch": 7355} {"train_loss": -28.340906143188477, "global_step": 610527, "epoch": 7355} {"train_loss": -28.27329444885254, "global_step": 610528, "epoch": 7355} {"train_loss": -28.37904167175293, "global_step": 610529, "epoch": 7355} {"train_loss": -28.09183120727539, "global_step": 610530, "epoch": 7355} {"train_loss": -27.933795928955078, "global_step": 610531, "epoch": 7355} {"train_loss": -28.30445671081543, "global_step": 610532, "epoch": 7355} {"train_loss": -28.22635841369629, "global_step": 610533, "epoch": 7355} {"train_loss": -27.930973052978516, "global_step": 610534, "epoch": 7355} {"train_loss": -28.16798210144043, "global_step": 610535, "epoch": 7355} {"train_loss": -27.83515739440918, "global_step": 610536, "epoch": 7355} {"train_loss": -27.86532974243164, "global_step": 610537, "epoch": 7355} {"train_loss": -28.35944175720215, "global_step": 610538, "epoch": 7355} {"train_loss": -28.2882080078125, "global_step": 610539, "epoch": 7355} {"train_loss": -28.346471786499023, "global_step": 610540, "epoch": 7355} {"train_loss": -28.134489059448242, "global_step": 610541, "epoch": 7355} {"train_loss": -28.220458984375, "global_step": 610542, "epoch": 7355} {"train_loss": -28.258045196533203, "global_step": 610543, "epoch": 7355} {"train_loss": -28.2801513671875, "global_step": 610544, "epoch": 7355} {"train_loss": -27.8380184173584, "global_step": 610545, "epoch": 7355} {"train_loss": -28.464523315429688, "global_step": 610546, "epoch": 7355} {"train_loss": -27.943726872823323, "global_step": 610547, "epoch": 7355, "val_loss": 6612171.0} {"train_loss": -27.13163185119629, "global_step": 610548, "epoch": 7356} {"train_loss": -24.959535598754883, "global_step": 610549, "epoch": 7356} {"train_loss": -23.650814056396484, "global_step": 610550, "epoch": 7356} {"train_loss": -25.127777099609375, "global_step": 610551, "epoch": 7356} {"train_loss": -25.99945640563965, "global_step": 610552, "epoch": 7356} {"train_loss": -24.864850997924805, "global_step": 610553, "epoch": 7356} {"train_loss": -26.403430938720703, "global_step": 610554, "epoch": 7356} {"train_loss": -26.055831909179688, "global_step": 610555, "epoch": 7356} {"train_loss": -27.116605758666992, "global_step": 610556, "epoch": 7356} {"train_loss": -26.53751564025879, "global_step": 610557, "epoch": 7356} {"train_loss": -27.294219970703125, "global_step": 610558, "epoch": 7356} {"train_loss": -26.709705352783203, "global_step": 610559, "epoch": 7356} {"train_loss": -26.951171875, "global_step": 610560, "epoch": 7356} {"train_loss": -27.365121841430664, "global_step": 610561, "epoch": 7356} {"train_loss": -26.9766902923584, "global_step": 610562, "epoch": 7356} {"train_loss": -26.887847900390625, "global_step": 610563, "epoch": 7356} {"train_loss": -27.068634033203125, "global_step": 610564, "epoch": 7356} {"train_loss": -27.015119552612305, "global_step": 610565, "epoch": 7356} {"train_loss": -27.018522262573242, "global_step": 610566, "epoch": 7356} {"train_loss": -27.1756534576416, "global_step": 610567, "epoch": 7356} {"train_loss": -27.19691276550293, "global_step": 610568, "epoch": 7356} {"train_loss": -27.801313400268555, "global_step": 610569, "epoch": 7356} {"train_loss": -27.25959587097168, "global_step": 610570, "epoch": 7356} {"train_loss": -27.21943473815918, "global_step": 610571, "epoch": 7356} {"train_loss": -27.482284545898438, "global_step": 610572, "epoch": 7356} {"train_loss": -27.54578971862793, "global_step": 610573, "epoch": 7356} {"train_loss": -27.446081161499023, "global_step": 610574, "epoch": 7356} {"train_loss": -27.471921920776367, "global_step": 610575, "epoch": 7356} {"train_loss": -27.524433135986328, "global_step": 610576, "epoch": 7356} {"train_loss": -27.770238876342773, "global_step": 610577, "epoch": 7356} {"train_loss": -27.40478515625, "global_step": 610578, "epoch": 7356} {"train_loss": -27.875930786132812, "global_step": 610579, "epoch": 7356} {"train_loss": -27.552122116088867, "global_step": 610580, "epoch": 7356} {"train_loss": -28.2353515625, "global_step": 610581, "epoch": 7356} {"train_loss": -27.59950065612793, "global_step": 610582, "epoch": 7356} {"train_loss": -27.551593780517578, "global_step": 610583, "epoch": 7356} {"train_loss": -27.58314323425293, "global_step": 610584, "epoch": 7356} {"train_loss": -27.9469051361084, "global_step": 610585, "epoch": 7356} {"train_loss": -27.737747192382812, "global_step": 610586, "epoch": 7356} {"train_loss": -27.96686363220215, "global_step": 610587, "epoch": 7356} {"train_loss": -27.9843807220459, "global_step": 610588, "epoch": 7356} {"train_loss": -27.905439376831055, "global_step": 610589, "epoch": 7356} {"train_loss": -27.608057022094727, "global_step": 610590, "epoch": 7356} {"train_loss": -28.312408447265625, "global_step": 610591, "epoch": 7356} {"train_loss": -27.774259567260742, "global_step": 610592, "epoch": 7356} {"train_loss": -27.995203018188477, "global_step": 610593, "epoch": 7356} {"train_loss": -27.967731475830078, "global_step": 610594, "epoch": 7356} {"train_loss": -27.662857055664062, "global_step": 610595, "epoch": 7356} {"train_loss": -27.699859619140625, "global_step": 610596, "epoch": 7356} {"train_loss": -27.602521896362305, "global_step": 610597, "epoch": 7356} {"train_loss": -26.482873916625977, "global_step": 610598, "epoch": 7356} {"train_loss": -25.892166137695312, "global_step": 610599, "epoch": 7356} {"train_loss": -27.482303619384766, "global_step": 610600, "epoch": 7356} {"train_loss": -27.970779418945312, "global_step": 610601, "epoch": 7356} {"train_loss": -26.93055534362793, "global_step": 610602, "epoch": 7356} {"train_loss": -28.26363182067871, "global_step": 610603, "epoch": 7356} {"train_loss": -27.44403076171875, "global_step": 610604, "epoch": 7356} {"train_loss": -27.855337142944336, "global_step": 610605, "epoch": 7356} {"train_loss": -27.493061065673828, "global_step": 610606, "epoch": 7356} {"train_loss": -27.826581954956055, "global_step": 610607, "epoch": 7356} {"train_loss": -27.281442642211914, "global_step": 610608, "epoch": 7356} {"train_loss": -27.88882827758789, "global_step": 610609, "epoch": 7356} {"train_loss": -28.07218360900879, "global_step": 610610, "epoch": 7356} {"train_loss": -28.03643226623535, "global_step": 610611, "epoch": 7356} {"train_loss": -27.35194206237793, "global_step": 610612, "epoch": 7356} {"train_loss": -27.704864501953125, "global_step": 610613, "epoch": 7356} {"train_loss": -28.00263023376465, "global_step": 610614, "epoch": 7356} {"train_loss": -27.705825805664062, "global_step": 610615, "epoch": 7356} {"train_loss": -27.971052169799805, "global_step": 610616, "epoch": 7356} {"train_loss": -27.843847274780273, "global_step": 610617, "epoch": 7356} {"train_loss": -28.012954711914062, "global_step": 610618, "epoch": 7356} {"train_loss": -28.16827964782715, "global_step": 610619, "epoch": 7356} {"train_loss": -27.886587142944336, "global_step": 610620, "epoch": 7356} {"train_loss": -28.114063262939453, "global_step": 610621, "epoch": 7356} {"train_loss": -28.148380279541016, "global_step": 610622, "epoch": 7356} {"train_loss": -28.0932559967041, "global_step": 610623, "epoch": 7356} {"train_loss": -28.001935958862305, "global_step": 610624, "epoch": 7356} {"train_loss": -27.97891616821289, "global_step": 610625, "epoch": 7356} {"train_loss": -28.375659942626953, "global_step": 610626, "epoch": 7356} {"train_loss": -27.87102699279785, "global_step": 610627, "epoch": 7356} {"train_loss": -28.026691436767578, "global_step": 610628, "epoch": 7356} {"train_loss": -28.005781173706055, "global_step": 610629, "epoch": 7356} {"train_loss": -27.404274653239423, "global_step": 610630, "epoch": 7356, "val_loss": 6531247.0} {"train_loss": -27.93638038635254, "global_step": 610631, "epoch": 7357} {"train_loss": -27.751127243041992, "global_step": 610632, "epoch": 7357} {"train_loss": -27.55915641784668, "global_step": 610633, "epoch": 7357} {"train_loss": -28.077728271484375, "global_step": 610634, "epoch": 7357} {"train_loss": -28.0164852142334, "global_step": 610635, "epoch": 7357} {"train_loss": -28.03409194946289, "global_step": 610636, "epoch": 7357} {"train_loss": -28.129047393798828, "global_step": 610637, "epoch": 7357} {"train_loss": -28.0988712310791, "global_step": 610638, "epoch": 7357} {"train_loss": -28.120838165283203, "global_step": 610639, "epoch": 7357} {"train_loss": -27.808019638061523, "global_step": 610640, "epoch": 7357} {"train_loss": -27.98377799987793, "global_step": 610641, "epoch": 7357} {"train_loss": -28.331857681274414, "global_step": 610642, "epoch": 7357} {"train_loss": -27.79640769958496, "global_step": 610643, "epoch": 7357} {"train_loss": -27.707279205322266, "global_step": 610644, "epoch": 7357} {"train_loss": -27.413562774658203, "global_step": 610645, "epoch": 7357} {"train_loss": -27.911962509155273, "global_step": 610646, "epoch": 7357} {"train_loss": -27.80929946899414, "global_step": 610647, "epoch": 7357} {"train_loss": -26.9708251953125, "global_step": 610648, "epoch": 7357} {"train_loss": -27.941497802734375, "global_step": 610649, "epoch": 7357} {"train_loss": -27.844263076782227, "global_step": 610650, "epoch": 7357} {"train_loss": -27.51338005065918, "global_step": 610651, "epoch": 7357} {"train_loss": -27.810510635375977, "global_step": 610652, "epoch": 7357} {"train_loss": -27.931884765625, "global_step": 610653, "epoch": 7357} {"train_loss": -28.03851890563965, "global_step": 610654, "epoch": 7357} {"train_loss": -27.728437423706055, "global_step": 610655, "epoch": 7357} {"train_loss": -28.12234878540039, "global_step": 610656, "epoch": 7357} {"train_loss": -28.378103256225586, "global_step": 610657, "epoch": 7357} {"train_loss": -27.92557144165039, "global_step": 610658, "epoch": 7357} {"train_loss": -27.752384185791016, "global_step": 610659, "epoch": 7357} {"train_loss": -28.243518829345703, "global_step": 610660, "epoch": 7357} {"train_loss": -27.699560165405273, "global_step": 610661, "epoch": 7357} {"train_loss": -28.239667892456055, "global_step": 610662, "epoch": 7357} {"train_loss": -28.298009872436523, "global_step": 610663, "epoch": 7357} {"train_loss": -27.964155197143555, "global_step": 610664, "epoch": 7357} {"train_loss": -28.180234909057617, "global_step": 610665, "epoch": 7357} {"train_loss": -27.760229110717773, "global_step": 610666, "epoch": 7357} {"train_loss": -28.163543701171875, "global_step": 610667, "epoch": 7357} {"train_loss": -28.073530197143555, "global_step": 610668, "epoch": 7357} {"train_loss": -28.275043487548828, "global_step": 610669, "epoch": 7357} {"train_loss": -28.101730346679688, "global_step": 610670, "epoch": 7357} {"train_loss": -28.294294357299805, "global_step": 610671, "epoch": 7357} {"train_loss": -28.195709228515625, "global_step": 610672, "epoch": 7357} {"train_loss": -28.132848739624023, "global_step": 610673, "epoch": 7357} {"train_loss": -28.397541046142578, "global_step": 610674, "epoch": 7357} {"train_loss": -28.257068634033203, "global_step": 610675, "epoch": 7357} {"train_loss": -28.43147087097168, "global_step": 610676, "epoch": 7357} {"train_loss": -28.538915634155273, "global_step": 610677, "epoch": 7357} {"train_loss": -28.18033218383789, "global_step": 610678, "epoch": 7357} {"train_loss": -28.21714210510254, "global_step": 610679, "epoch": 7357} {"train_loss": -28.060413360595703, "global_step": 610680, "epoch": 7357} {"train_loss": -28.489959716796875, "global_step": 610681, "epoch": 7357} {"train_loss": -28.604785919189453, "global_step": 610682, "epoch": 7357} {"train_loss": -28.20338249206543, "global_step": 610683, "epoch": 7357} {"train_loss": -28.175342559814453, "global_step": 610684, "epoch": 7357} {"train_loss": -28.230926513671875, "global_step": 610685, "epoch": 7357} {"train_loss": -28.143293380737305, "global_step": 610686, "epoch": 7357} {"train_loss": -28.344762802124023, "global_step": 610687, "epoch": 7357} {"train_loss": -28.104938507080078, "global_step": 610688, "epoch": 7357} {"train_loss": -28.201318740844727, "global_step": 610689, "epoch": 7357} {"train_loss": -28.557144165039062, "global_step": 610690, "epoch": 7357} {"train_loss": -28.289844512939453, "global_step": 610691, "epoch": 7357} {"train_loss": -28.371992111206055, "global_step": 610692, "epoch": 7357} {"train_loss": -28.02912712097168, "global_step": 610693, "epoch": 7357} {"train_loss": -27.752511978149414, "global_step": 610694, "epoch": 7357} {"train_loss": -27.572492599487305, "global_step": 610695, "epoch": 7357} {"train_loss": -28.096637725830078, "global_step": 610696, "epoch": 7357} {"train_loss": -28.110244750976562, "global_step": 610697, "epoch": 7357} {"train_loss": -27.849740982055664, "global_step": 610698, "epoch": 7357} {"train_loss": -28.13458251953125, "global_step": 610699, "epoch": 7357} {"train_loss": -28.214231491088867, "global_step": 610700, "epoch": 7357} {"train_loss": -27.770856857299805, "global_step": 610701, "epoch": 7357} {"train_loss": -27.91583251953125, "global_step": 610702, "epoch": 7357} {"train_loss": -27.924219131469727, "global_step": 610703, "epoch": 7357} {"train_loss": -28.12725830078125, "global_step": 610704, "epoch": 7357} {"train_loss": -28.404937744140625, "global_step": 610705, "epoch": 7357} {"train_loss": -28.19390869140625, "global_step": 610706, "epoch": 7357} {"train_loss": -28.28993034362793, "global_step": 610707, "epoch": 7357} {"train_loss": -27.972370147705078, "global_step": 610708, "epoch": 7357} {"train_loss": -27.817646026611328, "global_step": 610709, "epoch": 7357} {"train_loss": -28.205387115478516, "global_step": 610710, "epoch": 7357} {"train_loss": -28.424793243408203, "global_step": 610711, "epoch": 7357} {"train_loss": -28.197168350219727, "global_step": 610712, "epoch": 7357} {"train_loss": -28.047864155596997, "global_step": 610713, "epoch": 7357, "val_loss": 6514596.0} {"train_loss": -27.719696044921875, "global_step": 610714, "epoch": 7358} {"train_loss": -27.775766372680664, "global_step": 610715, "epoch": 7358} {"train_loss": -27.735021591186523, "global_step": 610716, "epoch": 7358} {"train_loss": -27.60929298400879, "global_step": 610717, "epoch": 7358} {"train_loss": -27.646564483642578, "global_step": 610718, "epoch": 7358} {"train_loss": -28.046865463256836, "global_step": 610719, "epoch": 7358} {"train_loss": -27.87286949157715, "global_step": 610720, "epoch": 7358} {"train_loss": -27.922836303710938, "global_step": 610721, "epoch": 7358} {"train_loss": -27.522907257080078, "global_step": 610722, "epoch": 7358} {"train_loss": -27.840375900268555, "global_step": 610723, "epoch": 7358} {"train_loss": -27.672582626342773, "global_step": 610724, "epoch": 7358} {"train_loss": -27.582563400268555, "global_step": 610725, "epoch": 7358} {"train_loss": -27.721881866455078, "global_step": 610726, "epoch": 7358} {"train_loss": -27.837003707885742, "global_step": 610727, "epoch": 7358} {"train_loss": -27.873214721679688, "global_step": 610728, "epoch": 7358} {"train_loss": -28.218088150024414, "global_step": 610729, "epoch": 7358} {"train_loss": -27.6380558013916, "global_step": 610730, "epoch": 7358} {"train_loss": -27.737796783447266, "global_step": 610731, "epoch": 7358} {"train_loss": -27.744123458862305, "global_step": 610732, "epoch": 7358} {"train_loss": -28.109149932861328, "global_step": 610733, "epoch": 7358} {"train_loss": -27.89522361755371, "global_step": 610734, "epoch": 7358} {"train_loss": -28.122709274291992, "global_step": 610735, "epoch": 7358} {"train_loss": -27.764150619506836, "global_step": 610736, "epoch": 7358} {"train_loss": -27.8735294342041, "global_step": 610737, "epoch": 7358} {"train_loss": -27.794788360595703, "global_step": 610738, "epoch": 7358} {"train_loss": -28.263080596923828, "global_step": 610739, "epoch": 7358} {"train_loss": -27.691471099853516, "global_step": 610740, "epoch": 7358} {"train_loss": -27.935922622680664, "global_step": 610741, "epoch": 7358} {"train_loss": -28.110889434814453, "global_step": 610742, "epoch": 7358} {"train_loss": -28.052221298217773, "global_step": 610743, "epoch": 7358} {"train_loss": -27.94911003112793, "global_step": 610744, "epoch": 7358} {"train_loss": -27.926511764526367, "global_step": 610745, "epoch": 7358} {"train_loss": -28.1790828704834, "global_step": 610746, "epoch": 7358} {"train_loss": -27.87957763671875, "global_step": 610747, "epoch": 7358} {"train_loss": -28.026763916015625, "global_step": 610748, "epoch": 7358} {"train_loss": -28.108020782470703, "global_step": 610749, "epoch": 7358} {"train_loss": -28.287240982055664, "global_step": 610750, "epoch": 7358} {"train_loss": -28.477710723876953, "global_step": 610751, "epoch": 7358} {"train_loss": -28.2357177734375, "global_step": 610752, "epoch": 7358} {"train_loss": -28.48392677307129, "global_step": 610753, "epoch": 7358} {"train_loss": -28.056217193603516, "global_step": 610754, "epoch": 7358} {"train_loss": -28.092849731445312, "global_step": 610755, "epoch": 7358} {"train_loss": -28.62354850769043, "global_step": 610756, "epoch": 7358} {"train_loss": -28.385848999023438, "global_step": 610757, "epoch": 7358} {"train_loss": -27.933996200561523, "global_step": 610758, "epoch": 7358} {"train_loss": -28.071557998657227, "global_step": 610759, "epoch": 7358} {"train_loss": -28.610076904296875, "global_step": 610760, "epoch": 7358} {"train_loss": -28.1260929107666, "global_step": 610761, "epoch": 7358} {"train_loss": -28.52792739868164, "global_step": 610762, "epoch": 7358} {"train_loss": -28.352005004882812, "global_step": 610763, "epoch": 7358} {"train_loss": -28.25839614868164, "global_step": 610764, "epoch": 7358} {"train_loss": -28.144866943359375, "global_step": 610765, "epoch": 7358} {"train_loss": -27.68829345703125, "global_step": 610766, "epoch": 7358} {"train_loss": -28.2193603515625, "global_step": 610767, "epoch": 7358} {"train_loss": -27.999425888061523, "global_step": 610768, "epoch": 7358} {"train_loss": -28.089862823486328, "global_step": 610769, "epoch": 7358} {"train_loss": -28.398040771484375, "global_step": 610770, "epoch": 7358} {"train_loss": -27.815366744995117, "global_step": 610771, "epoch": 7358} {"train_loss": -28.010141372680664, "global_step": 610772, "epoch": 7358} {"train_loss": -28.112714767456055, "global_step": 610773, "epoch": 7358} {"train_loss": -28.067853927612305, "global_step": 610774, "epoch": 7358} {"train_loss": -28.171783447265625, "global_step": 610775, "epoch": 7358} {"train_loss": -27.987329483032227, "global_step": 610776, "epoch": 7358} {"train_loss": -28.104846954345703, "global_step": 610777, "epoch": 7358} {"train_loss": -28.447118759155273, "global_step": 610778, "epoch": 7358} {"train_loss": -28.127700805664062, "global_step": 610779, "epoch": 7358} {"train_loss": -28.196735382080078, "global_step": 610780, "epoch": 7358} {"train_loss": -28.450592041015625, "global_step": 610781, "epoch": 7358} {"train_loss": -28.0046443939209, "global_step": 610782, "epoch": 7358} {"train_loss": -28.047672271728516, "global_step": 610783, "epoch": 7358} {"train_loss": -28.404882431030273, "global_step": 610784, "epoch": 7358} {"train_loss": -28.152708053588867, "global_step": 610785, "epoch": 7358} {"train_loss": -28.448057174682617, "global_step": 610786, "epoch": 7358} {"train_loss": -28.230335235595703, "global_step": 610787, "epoch": 7358} {"train_loss": -27.766809463500977, "global_step": 610788, "epoch": 7358} {"train_loss": -28.014801025390625, "global_step": 610789, "epoch": 7358} {"train_loss": -27.52545166015625, "global_step": 610790, "epoch": 7358} {"train_loss": -27.462377548217773, "global_step": 610791, "epoch": 7358} {"train_loss": -27.928985595703125, "global_step": 610792, "epoch": 7358} {"train_loss": -27.8994140625, "global_step": 610793, "epoch": 7358} {"train_loss": -28.045225143432617, "global_step": 610794, "epoch": 7358} {"train_loss": -28.220346450805664, "global_step": 610795, "epoch": 7358} {"train_loss": -28.025532550122364, "global_step": 610796, "epoch": 7358, "val_loss": 6632560.0} {"train_loss": -27.697769165039062, "global_step": 610797, "epoch": 7359} {"train_loss": -25.93939781188965, "global_step": 610798, "epoch": 7359} {"train_loss": -26.531110763549805, "global_step": 610799, "epoch": 7359} {"train_loss": -26.99774742126465, "global_step": 610800, "epoch": 7359} {"train_loss": -26.310089111328125, "global_step": 610801, "epoch": 7359} {"train_loss": -27.446420669555664, "global_step": 610802, "epoch": 7359} {"train_loss": -26.68036460876465, "global_step": 610803, "epoch": 7359} {"train_loss": -27.3027286529541, "global_step": 610804, "epoch": 7359} {"train_loss": -27.613494873046875, "global_step": 610805, "epoch": 7359} {"train_loss": -27.31159782409668, "global_step": 610806, "epoch": 7359} {"train_loss": -27.641998291015625, "global_step": 610807, "epoch": 7359} {"train_loss": -27.923669815063477, "global_step": 610808, "epoch": 7359} {"train_loss": -27.499624252319336, "global_step": 610809, "epoch": 7359} {"train_loss": -27.55792808532715, "global_step": 610810, "epoch": 7359} {"train_loss": -27.58576011657715, "global_step": 610811, "epoch": 7359} {"train_loss": -27.546478271484375, "global_step": 610812, "epoch": 7359} {"train_loss": -27.696760177612305, "global_step": 610813, "epoch": 7359} {"train_loss": -27.760761260986328, "global_step": 610814, "epoch": 7359} {"train_loss": -27.67738151550293, "global_step": 610815, "epoch": 7359} {"train_loss": -27.92096519470215, "global_step": 610816, "epoch": 7359} {"train_loss": -27.505680084228516, "global_step": 610817, "epoch": 7359} {"train_loss": -27.542133331298828, "global_step": 610818, "epoch": 7359} {"train_loss": -27.68951988220215, "global_step": 610819, "epoch": 7359} {"train_loss": -27.46941566467285, "global_step": 610820, "epoch": 7359} {"train_loss": -28.078948974609375, "global_step": 610821, "epoch": 7359} {"train_loss": -27.915912628173828, "global_step": 610822, "epoch": 7359} {"train_loss": -27.696868896484375, "global_step": 610823, "epoch": 7359} {"train_loss": -27.927478790283203, "global_step": 610824, "epoch": 7359} {"train_loss": -27.8819637298584, "global_step": 610825, "epoch": 7359} {"train_loss": -27.904203414916992, "global_step": 610826, "epoch": 7359} {"train_loss": -27.8862247467041, "global_step": 610827, "epoch": 7359} {"train_loss": -28.14324378967285, "global_step": 610828, "epoch": 7359} {"train_loss": -28.152280807495117, "global_step": 610829, "epoch": 7359} {"train_loss": -27.988988876342773, "global_step": 610830, "epoch": 7359} {"train_loss": -27.908300399780273, "global_step": 610831, "epoch": 7359} {"train_loss": -28.082029342651367, "global_step": 610832, "epoch": 7359} {"train_loss": -27.77764892578125, "global_step": 610833, "epoch": 7359} {"train_loss": -28.191818237304688, "global_step": 610834, "epoch": 7359} {"train_loss": -28.261463165283203, "global_step": 610835, "epoch": 7359} {"train_loss": -28.00738525390625, "global_step": 610836, "epoch": 7359} {"train_loss": -28.269086837768555, "global_step": 610837, "epoch": 7359} {"train_loss": -28.41461181640625, "global_step": 610838, "epoch": 7359} {"train_loss": -28.349796295166016, "global_step": 610839, "epoch": 7359} {"train_loss": -27.712182998657227, "global_step": 610840, "epoch": 7359} {"train_loss": -27.87800407409668, "global_step": 610841, "epoch": 7359} {"train_loss": -28.589929580688477, "global_step": 610842, "epoch": 7359} {"train_loss": -28.29249382019043, "global_step": 610843, "epoch": 7359} {"train_loss": -28.05472183227539, "global_step": 610844, "epoch": 7359} {"train_loss": -28.49005126953125, "global_step": 610845, "epoch": 7359} {"train_loss": -28.17041015625, "global_step": 610846, "epoch": 7359} {"train_loss": -27.95108413696289, "global_step": 610847, "epoch": 7359} {"train_loss": -28.576257705688477, "global_step": 610848, "epoch": 7359} {"train_loss": -28.484472274780273, "global_step": 610849, "epoch": 7359} {"train_loss": -28.364898681640625, "global_step": 610850, "epoch": 7359} {"train_loss": -28.1355037689209, "global_step": 610851, "epoch": 7359} {"train_loss": -28.551340103149414, "global_step": 610852, "epoch": 7359} {"train_loss": -28.587385177612305, "global_step": 610853, "epoch": 7359} {"train_loss": -27.96906089782715, "global_step": 610854, "epoch": 7359} {"train_loss": -28.45106315612793, "global_step": 610855, "epoch": 7359} {"train_loss": -27.8099308013916, "global_step": 610856, "epoch": 7359} {"train_loss": -27.866186141967773, "global_step": 610857, "epoch": 7359} {"train_loss": -28.166723251342773, "global_step": 610858, "epoch": 7359} {"train_loss": -28.054895401000977, "global_step": 610859, "epoch": 7359} {"train_loss": -27.185155868530273, "global_step": 610860, "epoch": 7359} {"train_loss": -27.560148239135742, "global_step": 610861, "epoch": 7359} {"train_loss": -26.582178115844727, "global_step": 610862, "epoch": 7359} {"train_loss": -26.897119522094727, "global_step": 610863, "epoch": 7359} {"train_loss": -28.070707321166992, "global_step": 610864, "epoch": 7359} {"train_loss": -27.351276397705078, "global_step": 610865, "epoch": 7359} {"train_loss": -27.359756469726562, "global_step": 610866, "epoch": 7359} {"train_loss": -27.32991600036621, "global_step": 610867, "epoch": 7359} {"train_loss": -27.76861572265625, "global_step": 610868, "epoch": 7359} {"train_loss": -27.838611602783203, "global_step": 610869, "epoch": 7359} {"train_loss": -27.749296188354492, "global_step": 610870, "epoch": 7359} {"train_loss": -27.291894912719727, "global_step": 610871, "epoch": 7359} {"train_loss": -27.97366714477539, "global_step": 610872, "epoch": 7359} {"train_loss": -27.878021240234375, "global_step": 610873, "epoch": 7359} {"train_loss": -27.519378662109375, "global_step": 610874, "epoch": 7359} {"train_loss": -28.008731842041016, "global_step": 610875, "epoch": 7359} {"train_loss": -27.899829864501953, "global_step": 610876, "epoch": 7359} {"train_loss": -28.091882705688477, "global_step": 610877, "epoch": 7359} {"train_loss": -27.833911895751953, "global_step": 610878, "epoch": 7359} {"train_loss": -27.786788526787817, "global_step": 610879, "epoch": 7359, "val_loss": 6576051.0} {"train_loss": -27.33710289001465, "global_step": 610880, "epoch": 7360} {"train_loss": -27.378087997436523, "global_step": 610881, "epoch": 7360} {"train_loss": -27.691205978393555, "global_step": 610882, "epoch": 7360} {"train_loss": -27.549436569213867, "global_step": 610883, "epoch": 7360} {"train_loss": -27.0922908782959, "global_step": 610884, "epoch": 7360} {"train_loss": -27.434345245361328, "global_step": 610885, "epoch": 7360} {"train_loss": -27.31537437438965, "global_step": 610886, "epoch": 7360} {"train_loss": -27.33213233947754, "global_step": 610887, "epoch": 7360} {"train_loss": -27.845294952392578, "global_step": 610888, "epoch": 7360} {"train_loss": -27.649280548095703, "global_step": 610889, "epoch": 7360} {"train_loss": -27.831735610961914, "global_step": 610890, "epoch": 7360} {"train_loss": -28.150659561157227, "global_step": 610891, "epoch": 7360} {"train_loss": -27.77850341796875, "global_step": 610892, "epoch": 7360} {"train_loss": -27.68031120300293, "global_step": 610893, "epoch": 7360} {"train_loss": -27.8313045501709, "global_step": 610894, "epoch": 7360} {"train_loss": -28.34356117248535, "global_step": 610895, "epoch": 7360} {"train_loss": -28.034442901611328, "global_step": 610896, "epoch": 7360} {"train_loss": -27.719196319580078, "global_step": 610897, "epoch": 7360} {"train_loss": -27.851804733276367, "global_step": 610898, "epoch": 7360} {"train_loss": -27.98368263244629, "global_step": 610899, "epoch": 7360} {"train_loss": -28.2872257232666, "global_step": 610900, "epoch": 7360} {"train_loss": -28.130298614501953, "global_step": 610901, "epoch": 7360} {"train_loss": -28.050891876220703, "global_step": 610902, "epoch": 7360} {"train_loss": -28.121747970581055, "global_step": 610903, "epoch": 7360} {"train_loss": -27.862472534179688, "global_step": 610904, "epoch": 7360} {"train_loss": -28.280792236328125, "global_step": 610905, "epoch": 7360} {"train_loss": -28.17880630493164, "global_step": 610906, "epoch": 7360} {"train_loss": -28.093168258666992, "global_step": 610907, "epoch": 7360} {"train_loss": -27.99928092956543, "global_step": 610908, "epoch": 7360} {"train_loss": -28.199766159057617, "global_step": 610909, "epoch": 7360} {"train_loss": -28.17374038696289, "global_step": 610910, "epoch": 7360} {"train_loss": -27.99843406677246, "global_step": 610911, "epoch": 7360} {"train_loss": -28.295209884643555, "global_step": 610912, "epoch": 7360} {"train_loss": -28.50251579284668, "global_step": 610913, "epoch": 7360} {"train_loss": -27.960988998413086, "global_step": 610914, "epoch": 7360} {"train_loss": -28.13844108581543, "global_step": 610915, "epoch": 7360} {"train_loss": -28.03131103515625, "global_step": 610916, "epoch": 7360} {"train_loss": -27.790348052978516, "global_step": 610917, "epoch": 7360} {"train_loss": -28.032270431518555, "global_step": 610918, "epoch": 7360} {"train_loss": -28.192157745361328, "global_step": 610919, "epoch": 7360} {"train_loss": -28.033788681030273, "global_step": 610920, "epoch": 7360} {"train_loss": -28.131900787353516, "global_step": 610921, "epoch": 7360} {"train_loss": -28.25789451599121, "global_step": 610922, "epoch": 7360} {"train_loss": -27.908594131469727, "global_step": 610923, "epoch": 7360} {"train_loss": -28.17426109313965, "global_step": 610924, "epoch": 7360} {"train_loss": -28.494461059570312, "global_step": 610925, "epoch": 7360} {"train_loss": -28.5021915435791, "global_step": 610926, "epoch": 7360} {"train_loss": -28.1840763092041, "global_step": 610927, "epoch": 7360} {"train_loss": -28.173368453979492, "global_step": 610928, "epoch": 7360} {"train_loss": -28.452957153320312, "global_step": 610929, "epoch": 7360} {"train_loss": -28.316137313842773, "global_step": 610930, "epoch": 7360} {"train_loss": -28.28659439086914, "global_step": 610931, "epoch": 7360} {"train_loss": -28.347412109375, "global_step": 610932, "epoch": 7360} {"train_loss": -28.248138427734375, "global_step": 610933, "epoch": 7360} {"train_loss": -28.344079971313477, "global_step": 610934, "epoch": 7360} {"train_loss": -28.558435440063477, "global_step": 610935, "epoch": 7360} {"train_loss": -28.261554718017578, "global_step": 610936, "epoch": 7360} {"train_loss": -27.917043685913086, "global_step": 610937, "epoch": 7360} {"train_loss": -28.25018310546875, "global_step": 610938, "epoch": 7360} {"train_loss": -28.373046875, "global_step": 610939, "epoch": 7360} {"train_loss": -28.3686466217041, "global_step": 610940, "epoch": 7360} {"train_loss": -28.25153923034668, "global_step": 610941, "epoch": 7360} {"train_loss": -27.827680587768555, "global_step": 610942, "epoch": 7360} {"train_loss": -28.240819931030273, "global_step": 610943, "epoch": 7360} {"train_loss": -28.116132736206055, "global_step": 610944, "epoch": 7360} {"train_loss": -27.977005004882812, "global_step": 610945, "epoch": 7360} {"train_loss": -28.085235595703125, "global_step": 610946, "epoch": 7360} {"train_loss": -28.023914337158203, "global_step": 610947, "epoch": 7360} {"train_loss": -28.148054122924805, "global_step": 610948, "epoch": 7360} {"train_loss": -28.42009925842285, "global_step": 610949, "epoch": 7360} {"train_loss": -28.2385311126709, "global_step": 610950, "epoch": 7360} {"train_loss": -28.082263946533203, "global_step": 610951, "epoch": 7360} {"train_loss": -28.087270736694336, "global_step": 610952, "epoch": 7360} {"train_loss": -27.997140884399414, "global_step": 610953, "epoch": 7360} {"train_loss": -27.743927001953125, "global_step": 610954, "epoch": 7360} {"train_loss": -27.942276000976562, "global_step": 610955, "epoch": 7360} {"train_loss": -28.289703369140625, "global_step": 610956, "epoch": 7360} {"train_loss": -28.17938804626465, "global_step": 610957, "epoch": 7360} {"train_loss": -27.774951934814453, "global_step": 610958, "epoch": 7360} {"train_loss": -28.010705947875977, "global_step": 610959, "epoch": 7360} {"train_loss": -28.4440860748291, "global_step": 610960, "epoch": 7360} {"train_loss": -27.752368927001953, "global_step": 610961, "epoch": 7360} {"train_loss": -28.0385810898011, "global_step": 610962, "epoch": 7360, "val_loss": 6663036.0} {"train_loss": -28.1208438873291, "global_step": 610963, "epoch": 7361} {"train_loss": -27.96430778503418, "global_step": 610964, "epoch": 7361} {"train_loss": -27.779516220092773, "global_step": 610965, "epoch": 7361} {"train_loss": -28.288955688476562, "global_step": 610966, "epoch": 7361} {"train_loss": -27.872821807861328, "global_step": 610967, "epoch": 7361} {"train_loss": -27.737462997436523, "global_step": 610968, "epoch": 7361} {"train_loss": -28.142383575439453, "global_step": 610969, "epoch": 7361} {"train_loss": -27.724267959594727, "global_step": 610970, "epoch": 7361} {"train_loss": -28.261810302734375, "global_step": 610971, "epoch": 7361} {"train_loss": -28.02119255065918, "global_step": 610972, "epoch": 7361} {"train_loss": -27.95050048828125, "global_step": 610973, "epoch": 7361} {"train_loss": -28.005949020385742, "global_step": 610974, "epoch": 7361} {"train_loss": -27.96662712097168, "global_step": 610975, "epoch": 7361} {"train_loss": -27.678274154663086, "global_step": 610976, "epoch": 7361} {"train_loss": -27.72182273864746, "global_step": 610977, "epoch": 7361} {"train_loss": -28.23016357421875, "global_step": 610978, "epoch": 7361} {"train_loss": -27.694293975830078, "global_step": 610979, "epoch": 7361} {"train_loss": -27.75349235534668, "global_step": 610980, "epoch": 7361} {"train_loss": -28.131946563720703, "global_step": 610981, "epoch": 7361} {"train_loss": -27.418813705444336, "global_step": 610982, "epoch": 7361} {"train_loss": -27.58450698852539, "global_step": 610983, "epoch": 7361} {"train_loss": -27.570892333984375, "global_step": 610984, "epoch": 7361} {"train_loss": -28.000883102416992, "global_step": 610985, "epoch": 7361} {"train_loss": -27.744159698486328, "global_step": 610986, "epoch": 7361} {"train_loss": -27.788625717163086, "global_step": 610987, "epoch": 7361} {"train_loss": -27.42815589904785, "global_step": 610988, "epoch": 7361} {"train_loss": -27.772329330444336, "global_step": 610989, "epoch": 7361} {"train_loss": -27.869054794311523, "global_step": 610990, "epoch": 7361} {"train_loss": -27.87367057800293, "global_step": 610991, "epoch": 7361} {"train_loss": -27.717145919799805, "global_step": 610992, "epoch": 7361} {"train_loss": -27.9992733001709, "global_step": 610993, "epoch": 7361} {"train_loss": -28.030933380126953, "global_step": 610994, "epoch": 7361} {"train_loss": -28.050962448120117, "global_step": 610995, "epoch": 7361} {"train_loss": -27.988407135009766, "global_step": 610996, "epoch": 7361} {"train_loss": -28.0819149017334, "global_step": 610997, "epoch": 7361} {"train_loss": -27.985563278198242, "global_step": 610998, "epoch": 7361} {"train_loss": -27.974201202392578, "global_step": 610999, "epoch": 7361} {"train_loss": -27.76557731628418, "global_step": 611000, "epoch": 7361} {"train_loss": -28.278064727783203, "global_step": 611001, "epoch": 7361} {"train_loss": -27.784164428710938, "global_step": 611002, "epoch": 7361} {"train_loss": -28.01340675354004, "global_step": 611003, "epoch": 7361} {"train_loss": -28.23333168029785, "global_step": 611004, "epoch": 7361} {"train_loss": -28.28660011291504, "global_step": 611005, "epoch": 7361} {"train_loss": -28.143850326538086, "global_step": 611006, "epoch": 7361} {"train_loss": -28.161487579345703, "global_step": 611007, "epoch": 7361} {"train_loss": -28.281116485595703, "global_step": 611008, "epoch": 7361} {"train_loss": -27.52668571472168, "global_step": 611009, "epoch": 7361} {"train_loss": -28.171594619750977, "global_step": 611010, "epoch": 7361} {"train_loss": -28.35049819946289, "global_step": 611011, "epoch": 7361} {"train_loss": -28.644922256469727, "global_step": 611012, "epoch": 7361} {"train_loss": -27.982620239257812, "global_step": 611013, "epoch": 7361} {"train_loss": -28.345321655273438, "global_step": 611014, "epoch": 7361} {"train_loss": -28.471181869506836, "global_step": 611015, "epoch": 7361} {"train_loss": -28.0747127532959, "global_step": 611016, "epoch": 7361} {"train_loss": -27.712934494018555, "global_step": 611017, "epoch": 7361} {"train_loss": -27.693933486938477, "global_step": 611018, "epoch": 7361} {"train_loss": -28.409387588500977, "global_step": 611019, "epoch": 7361} {"train_loss": -28.1887149810791, "global_step": 611020, "epoch": 7361} {"train_loss": -28.25421142578125, "global_step": 611021, "epoch": 7361} {"train_loss": -27.933074951171875, "global_step": 611022, "epoch": 7361} {"train_loss": -28.05940055847168, "global_step": 611023, "epoch": 7361} {"train_loss": -28.248233795166016, "global_step": 611024, "epoch": 7361} {"train_loss": -28.131240844726562, "global_step": 611025, "epoch": 7361} {"train_loss": -28.075305938720703, "global_step": 611026, "epoch": 7361} {"train_loss": -28.388198852539062, "global_step": 611027, "epoch": 7361} {"train_loss": -27.62763786315918, "global_step": 611028, "epoch": 7361} {"train_loss": -28.2575740814209, "global_step": 611029, "epoch": 7361} {"train_loss": -27.839984893798828, "global_step": 611030, "epoch": 7361} {"train_loss": -28.290912628173828, "global_step": 611031, "epoch": 7361} {"train_loss": -28.227497100830078, "global_step": 611032, "epoch": 7361} {"train_loss": -28.02058219909668, "global_step": 611033, "epoch": 7361} {"train_loss": -28.219892501831055, "global_step": 611034, "epoch": 7361} {"train_loss": -28.03510856628418, "global_step": 611035, "epoch": 7361} {"train_loss": -28.0972843170166, "global_step": 611036, "epoch": 7361} {"train_loss": -28.24635124206543, "global_step": 611037, "epoch": 7361} {"train_loss": -27.984975814819336, "global_step": 611038, "epoch": 7361} {"train_loss": -27.581317901611328, "global_step": 611039, "epoch": 7361} {"train_loss": -27.978336334228516, "global_step": 611040, "epoch": 7361} {"train_loss": -27.962844848632812, "global_step": 611041, "epoch": 7361} {"train_loss": -28.24112892150879, "global_step": 611042, "epoch": 7361} {"train_loss": -27.96815299987793, "global_step": 611043, "epoch": 7361} {"train_loss": -28.35249137878418, "global_step": 611044, "epoch": 7361} {"train_loss": -28.00797131549881, "global_step": 611045, "epoch": 7361, "val_loss": 6647778.0} {"train_loss": -27.465551376342773, "global_step": 611046, "epoch": 7362} {"train_loss": -27.34345054626465, "global_step": 611047, "epoch": 7362} {"train_loss": -27.64998435974121, "global_step": 611048, "epoch": 7362} {"train_loss": -27.38539695739746, "global_step": 611049, "epoch": 7362} {"train_loss": -27.06953239440918, "global_step": 611050, "epoch": 7362} {"train_loss": -27.10408592224121, "global_step": 611051, "epoch": 7362} {"train_loss": -27.733083724975586, "global_step": 611052, "epoch": 7362} {"train_loss": -27.135534286499023, "global_step": 611053, "epoch": 7362} {"train_loss": -27.29664421081543, "global_step": 611054, "epoch": 7362} {"train_loss": -27.70026969909668, "global_step": 611055, "epoch": 7362} {"train_loss": -27.707494735717773, "global_step": 611056, "epoch": 7362} {"train_loss": -27.329303741455078, "global_step": 611057, "epoch": 7362} {"train_loss": -27.957067489624023, "global_step": 611058, "epoch": 7362} {"train_loss": -27.6082763671875, "global_step": 611059, "epoch": 7362} {"train_loss": -27.92374038696289, "global_step": 611060, "epoch": 7362} {"train_loss": -27.461639404296875, "global_step": 611061, "epoch": 7362} {"train_loss": -27.44373893737793, "global_step": 611062, "epoch": 7362} {"train_loss": -27.918964385986328, "global_step": 611063, "epoch": 7362} {"train_loss": -28.024646759033203, "global_step": 611064, "epoch": 7362} {"train_loss": -28.273651123046875, "global_step": 611065, "epoch": 7362} {"train_loss": -27.643695831298828, "global_step": 611066, "epoch": 7362} {"train_loss": -28.10871696472168, "global_step": 611067, "epoch": 7362} {"train_loss": -27.491806030273438, "global_step": 611068, "epoch": 7362} {"train_loss": -27.480960845947266, "global_step": 611069, "epoch": 7362} {"train_loss": -27.88346290588379, "global_step": 611070, "epoch": 7362} {"train_loss": -28.091794967651367, "global_step": 611071, "epoch": 7362} {"train_loss": -28.19268798828125, "global_step": 611072, "epoch": 7362} {"train_loss": -27.870080947875977, "global_step": 611073, "epoch": 7362} {"train_loss": -27.945947647094727, "global_step": 611074, "epoch": 7362} {"train_loss": -27.807214736938477, "global_step": 611075, "epoch": 7362} {"train_loss": -28.33917236328125, "global_step": 611076, "epoch": 7362} {"train_loss": -27.767566680908203, "global_step": 611077, "epoch": 7362} {"train_loss": -28.21796226501465, "global_step": 611078, "epoch": 7362} {"train_loss": -27.980539321899414, "global_step": 611079, "epoch": 7362} {"train_loss": -27.975635528564453, "global_step": 611080, "epoch": 7362} {"train_loss": -28.228519439697266, "global_step": 611081, "epoch": 7362} {"train_loss": -28.024805068969727, "global_step": 611082, "epoch": 7362} {"train_loss": -28.3637752532959, "global_step": 611083, "epoch": 7362} {"train_loss": -27.837182998657227, "global_step": 611084, "epoch": 7362} {"train_loss": -28.196455001831055, "global_step": 611085, "epoch": 7362} {"train_loss": -28.265899658203125, "global_step": 611086, "epoch": 7362} {"train_loss": -28.072248458862305, "global_step": 611087, "epoch": 7362} {"train_loss": -27.957366943359375, "global_step": 611088, "epoch": 7362} {"train_loss": -28.366043090820312, "global_step": 611089, "epoch": 7362} {"train_loss": -27.945343017578125, "global_step": 611090, "epoch": 7362} {"train_loss": -28.048147201538086, "global_step": 611091, "epoch": 7362} {"train_loss": -28.24979019165039, "global_step": 611092, "epoch": 7362} {"train_loss": -28.057632446289062, "global_step": 611093, "epoch": 7362} {"train_loss": -28.373624801635742, "global_step": 611094, "epoch": 7362} {"train_loss": -28.164459228515625, "global_step": 611095, "epoch": 7362} {"train_loss": -28.19256591796875, "global_step": 611096, "epoch": 7362} {"train_loss": -28.26954460144043, "global_step": 611097, "epoch": 7362} {"train_loss": -28.005783081054688, "global_step": 611098, "epoch": 7362} {"train_loss": -28.263818740844727, "global_step": 611099, "epoch": 7362} {"train_loss": -27.79275894165039, "global_step": 611100, "epoch": 7362} {"train_loss": -28.332700729370117, "global_step": 611101, "epoch": 7362} {"train_loss": -27.741119384765625, "global_step": 611102, "epoch": 7362} {"train_loss": -28.197498321533203, "global_step": 611103, "epoch": 7362} {"train_loss": -28.25514030456543, "global_step": 611104, "epoch": 7362} {"train_loss": -28.23516845703125, "global_step": 611105, "epoch": 7362} {"train_loss": -28.080575942993164, "global_step": 611106, "epoch": 7362} {"train_loss": -27.953388214111328, "global_step": 611107, "epoch": 7362} {"train_loss": -27.866260528564453, "global_step": 611108, "epoch": 7362} {"train_loss": -28.780303955078125, "global_step": 611109, "epoch": 7362} {"train_loss": -28.550464630126953, "global_step": 611110, "epoch": 7362} {"train_loss": -28.22401237487793, "global_step": 611111, "epoch": 7362} {"train_loss": -28.186176300048828, "global_step": 611112, "epoch": 7362} {"train_loss": -28.017242431640625, "global_step": 611113, "epoch": 7362} {"train_loss": -28.573545455932617, "global_step": 611114, "epoch": 7362} {"train_loss": -28.06707763671875, "global_step": 611115, "epoch": 7362} {"train_loss": -28.329010009765625, "global_step": 611116, "epoch": 7362} {"train_loss": -27.953479766845703, "global_step": 611117, "epoch": 7362} {"train_loss": -27.839344024658203, "global_step": 611118, "epoch": 7362} {"train_loss": -27.905582427978516, "global_step": 611119, "epoch": 7362} {"train_loss": -28.545995712280273, "global_step": 611120, "epoch": 7362} {"train_loss": -27.639814376831055, "global_step": 611121, "epoch": 7362} {"train_loss": -28.20587158203125, "global_step": 611122, "epoch": 7362} {"train_loss": -28.196317672729492, "global_step": 611123, "epoch": 7362} {"train_loss": -28.206811904907227, "global_step": 611124, "epoch": 7362} {"train_loss": -28.481815338134766, "global_step": 611125, "epoch": 7362} {"train_loss": -28.076364517211914, "global_step": 611126, "epoch": 7362} {"train_loss": -28.341550827026367, "global_step": 611127, "epoch": 7362} {"train_loss": -27.964346598429852, "global_step": 611128, "epoch": 7362, "val_loss": 6639698.0} {"train_loss": -27.7053279876709, "global_step": 611129, "epoch": 7363} {"train_loss": -27.20220375061035, "global_step": 611130, "epoch": 7363} {"train_loss": -26.602218627929688, "global_step": 611131, "epoch": 7363} {"train_loss": -26.664060592651367, "global_step": 611132, "epoch": 7363} {"train_loss": -27.49663734436035, "global_step": 611133, "epoch": 7363} {"train_loss": -26.950763702392578, "global_step": 611134, "epoch": 7363} {"train_loss": -27.22745704650879, "global_step": 611135, "epoch": 7363} {"train_loss": -27.567218780517578, "global_step": 611136, "epoch": 7363} {"train_loss": -27.54572105407715, "global_step": 611137, "epoch": 7363} {"train_loss": -27.935617446899414, "global_step": 611138, "epoch": 7363} {"train_loss": -27.400251388549805, "global_step": 611139, "epoch": 7363} {"train_loss": -27.403858184814453, "global_step": 611140, "epoch": 7363} {"train_loss": -27.9315242767334, "global_step": 611141, "epoch": 7363} {"train_loss": -27.387907028198242, "global_step": 611142, "epoch": 7363} {"train_loss": -27.604185104370117, "global_step": 611143, "epoch": 7363} {"train_loss": -27.6911678314209, "global_step": 611144, "epoch": 7363} {"train_loss": -27.90582275390625, "global_step": 611145, "epoch": 7363} {"train_loss": -27.892255783081055, "global_step": 611146, "epoch": 7363} {"train_loss": -27.758285522460938, "global_step": 611147, "epoch": 7363} {"train_loss": -28.184362411499023, "global_step": 611148, "epoch": 7363} {"train_loss": -27.77362060546875, "global_step": 611149, "epoch": 7363} {"train_loss": -28.005666732788086, "global_step": 611150, "epoch": 7363} {"train_loss": -27.72210121154785, "global_step": 611151, "epoch": 7363} {"train_loss": -28.007299423217773, "global_step": 611152, "epoch": 7363} {"train_loss": -27.881977081298828, "global_step": 611153, "epoch": 7363} {"train_loss": -28.107152938842773, "global_step": 611154, "epoch": 7363} {"train_loss": -28.087507247924805, "global_step": 611155, "epoch": 7363} {"train_loss": -28.1090030670166, "global_step": 611156, "epoch": 7363} {"train_loss": -28.152524948120117, "global_step": 611157, "epoch": 7363} {"train_loss": -27.67158317565918, "global_step": 611158, "epoch": 7363} {"train_loss": -27.949392318725586, "global_step": 611159, "epoch": 7363} {"train_loss": -27.857776641845703, "global_step": 611160, "epoch": 7363} {"train_loss": -28.40976905822754, "global_step": 611161, "epoch": 7363} {"train_loss": -27.8781795501709, "global_step": 611162, "epoch": 7363} {"train_loss": -28.01738929748535, "global_step": 611163, "epoch": 7363} {"train_loss": -28.24177360534668, "global_step": 611164, "epoch": 7363} {"train_loss": -27.960912704467773, "global_step": 611165, "epoch": 7363} {"train_loss": -27.963764190673828, "global_step": 611166, "epoch": 7363} {"train_loss": -28.362350463867188, "global_step": 611167, "epoch": 7363} {"train_loss": -28.29599380493164, "global_step": 611168, "epoch": 7363} {"train_loss": -28.202716827392578, "global_step": 611169, "epoch": 7363} {"train_loss": -28.24469566345215, "global_step": 611170, "epoch": 7363} {"train_loss": -28.51846694946289, "global_step": 611171, "epoch": 7363} {"train_loss": -28.323963165283203, "global_step": 611172, "epoch": 7363} {"train_loss": -28.033517837524414, "global_step": 611173, "epoch": 7363} {"train_loss": -27.8961124420166, "global_step": 611174, "epoch": 7363} {"train_loss": -28.294336318969727, "global_step": 611175, "epoch": 7363} {"train_loss": -28.05889320373535, "global_step": 611176, "epoch": 7363} {"train_loss": -28.308425903320312, "global_step": 611177, "epoch": 7363} {"train_loss": -28.000629425048828, "global_step": 611178, "epoch": 7363} {"train_loss": -28.378082275390625, "global_step": 611179, "epoch": 7363} {"train_loss": -28.11838722229004, "global_step": 611180, "epoch": 7363} {"train_loss": -27.97153663635254, "global_step": 611181, "epoch": 7363} {"train_loss": -27.974760055541992, "global_step": 611182, "epoch": 7363} {"train_loss": -28.7401180267334, "global_step": 611183, "epoch": 7363} {"train_loss": -28.331104278564453, "global_step": 611184, "epoch": 7363} {"train_loss": -28.002288818359375, "global_step": 611185, "epoch": 7363} {"train_loss": -28.26558494567871, "global_step": 611186, "epoch": 7363} {"train_loss": -28.33306884765625, "global_step": 611187, "epoch": 7363} {"train_loss": -28.226215362548828, "global_step": 611188, "epoch": 7363} {"train_loss": -27.85504150390625, "global_step": 611189, "epoch": 7363} {"train_loss": -27.789167404174805, "global_step": 611190, "epoch": 7363} {"train_loss": -28.218053817749023, "global_step": 611191, "epoch": 7363} {"train_loss": -28.39908218383789, "global_step": 611192, "epoch": 7363} {"train_loss": -28.024511337280273, "global_step": 611193, "epoch": 7363} {"train_loss": -28.155826568603516, "global_step": 611194, "epoch": 7363} {"train_loss": -28.08637809753418, "global_step": 611195, "epoch": 7363} {"train_loss": -28.0218505859375, "global_step": 611196, "epoch": 7363} {"train_loss": -28.318313598632812, "global_step": 611197, "epoch": 7363} {"train_loss": -28.075414657592773, "global_step": 611198, "epoch": 7363} {"train_loss": -28.094284057617188, "global_step": 611199, "epoch": 7363} {"train_loss": -28.24012565612793, "global_step": 611200, "epoch": 7363} {"train_loss": -28.6309757232666, "global_step": 611201, "epoch": 7363} {"train_loss": -27.9089412689209, "global_step": 611202, "epoch": 7363} {"train_loss": -28.531457901000977, "global_step": 611203, "epoch": 7363} {"train_loss": -28.064970016479492, "global_step": 611204, "epoch": 7363} {"train_loss": -27.85127067565918, "global_step": 611205, "epoch": 7363} {"train_loss": -27.958240509033203, "global_step": 611206, "epoch": 7363} {"train_loss": -27.893707275390625, "global_step": 611207, "epoch": 7363} {"train_loss": -28.246572494506836, "global_step": 611208, "epoch": 7363} {"train_loss": -27.896291732788086, "global_step": 611209, "epoch": 7363} {"train_loss": -28.246740341186523, "global_step": 611210, "epoch": 7363} {"train_loss": -27.949523029557195, "global_step": 611211, "epoch": 7363, "val_loss": 6603608.0} {"train_loss": -27.99713706970215, "global_step": 611212, "epoch": 7364} {"train_loss": -27.995771408081055, "global_step": 611213, "epoch": 7364} {"train_loss": -27.831876754760742, "global_step": 611214, "epoch": 7364} {"train_loss": -28.1118106842041, "global_step": 611215, "epoch": 7364} {"train_loss": -28.1132869720459, "global_step": 611216, "epoch": 7364} {"train_loss": -28.2104549407959, "global_step": 611217, "epoch": 7364} {"train_loss": -27.651996612548828, "global_step": 611218, "epoch": 7364} {"train_loss": -27.95574378967285, "global_step": 611219, "epoch": 7364} {"train_loss": -28.033777236938477, "global_step": 611220, "epoch": 7364} {"train_loss": -27.45941162109375, "global_step": 611221, "epoch": 7364} {"train_loss": -28.131322860717773, "global_step": 611222, "epoch": 7364} {"train_loss": -27.758209228515625, "global_step": 611223, "epoch": 7364} {"train_loss": -27.74765968322754, "global_step": 611224, "epoch": 7364} {"train_loss": -28.111066818237305, "global_step": 611225, "epoch": 7364} {"train_loss": -27.880529403686523, "global_step": 611226, "epoch": 7364} {"train_loss": -28.1477108001709, "global_step": 611227, "epoch": 7364} {"train_loss": -27.955442428588867, "global_step": 611228, "epoch": 7364} {"train_loss": -28.20868492126465, "global_step": 611229, "epoch": 7364} {"train_loss": -28.075143814086914, "global_step": 611230, "epoch": 7364} {"train_loss": -28.43275260925293, "global_step": 611231, "epoch": 7364} {"train_loss": -27.9741153717041, "global_step": 611232, "epoch": 7364} {"train_loss": -28.060964584350586, "global_step": 611233, "epoch": 7364} {"train_loss": -27.92201042175293, "global_step": 611234, "epoch": 7364} {"train_loss": -28.2040958404541, "global_step": 611235, "epoch": 7364} {"train_loss": -27.9716796875, "global_step": 611236, "epoch": 7364} {"train_loss": -27.64558219909668, "global_step": 611237, "epoch": 7364} {"train_loss": -28.22479248046875, "global_step": 611238, "epoch": 7364} {"train_loss": -27.959014892578125, "global_step": 611239, "epoch": 7364} {"train_loss": -28.592588424682617, "global_step": 611240, "epoch": 7364} {"train_loss": -28.037158966064453, "global_step": 611241, "epoch": 7364} {"train_loss": -28.04132652282715, "global_step": 611242, "epoch": 7364} {"train_loss": -28.131505966186523, "global_step": 611243, "epoch": 7364} {"train_loss": -28.28411865234375, "global_step": 611244, "epoch": 7364} {"train_loss": -28.407196044921875, "global_step": 611245, "epoch": 7364} {"train_loss": -28.214086532592773, "global_step": 611246, "epoch": 7364} {"train_loss": -28.249658584594727, "global_step": 611247, "epoch": 7364} {"train_loss": -28.134531021118164, "global_step": 611248, "epoch": 7364} {"train_loss": -28.29296875, "global_step": 611249, "epoch": 7364} {"train_loss": -28.050128936767578, "global_step": 611250, "epoch": 7364} {"train_loss": -28.187274932861328, "global_step": 611251, "epoch": 7364} {"train_loss": -28.118438720703125, "global_step": 611252, "epoch": 7364} {"train_loss": -27.71186637878418, "global_step": 611253, "epoch": 7364} {"train_loss": -28.565296173095703, "global_step": 611254, "epoch": 7364} {"train_loss": -27.890396118164062, "global_step": 611255, "epoch": 7364} {"train_loss": -28.390554428100586, "global_step": 611256, "epoch": 7364} {"train_loss": -28.021991729736328, "global_step": 611257, "epoch": 7364} {"train_loss": -28.031818389892578, "global_step": 611258, "epoch": 7364} {"train_loss": -28.375097274780273, "global_step": 611259, "epoch": 7364} {"train_loss": -28.465789794921875, "global_step": 611260, "epoch": 7364} {"train_loss": -28.152877807617188, "global_step": 611261, "epoch": 7364} {"train_loss": -28.2506103515625, "global_step": 611262, "epoch": 7364} {"train_loss": -27.722980499267578, "global_step": 611263, "epoch": 7364} {"train_loss": -27.8743896484375, "global_step": 611264, "epoch": 7364} {"train_loss": -28.1687068939209, "global_step": 611265, "epoch": 7364} {"train_loss": -28.320703506469727, "global_step": 611266, "epoch": 7364} {"train_loss": -28.147485733032227, "global_step": 611267, "epoch": 7364} {"train_loss": -27.668415069580078, "global_step": 611268, "epoch": 7364} {"train_loss": -28.124120712280273, "global_step": 611269, "epoch": 7364} {"train_loss": -28.138687133789062, "global_step": 611270, "epoch": 7364} {"train_loss": -27.90083885192871, "global_step": 611271, "epoch": 7364} {"train_loss": -28.450647354125977, "global_step": 611272, "epoch": 7364} {"train_loss": -28.154315948486328, "global_step": 611273, "epoch": 7364} {"train_loss": -27.8948974609375, "global_step": 611274, "epoch": 7364} {"train_loss": -27.453479766845703, "global_step": 611275, "epoch": 7364} {"train_loss": -27.97352409362793, "global_step": 611276, "epoch": 7364} {"train_loss": -28.37109375, "global_step": 611277, "epoch": 7364} {"train_loss": -28.133481979370117, "global_step": 611278, "epoch": 7364} {"train_loss": -28.258182525634766, "global_step": 611279, "epoch": 7364} {"train_loss": -27.888837814331055, "global_step": 611280, "epoch": 7364} {"train_loss": -28.315534591674805, "global_step": 611281, "epoch": 7364} {"train_loss": -28.43121910095215, "global_step": 611282, "epoch": 7364} {"train_loss": -28.09589958190918, "global_step": 611283, "epoch": 7364} {"train_loss": -28.352142333984375, "global_step": 611284, "epoch": 7364} {"train_loss": -28.28120231628418, "global_step": 611285, "epoch": 7364} {"train_loss": -28.063745498657227, "global_step": 611286, "epoch": 7364} {"train_loss": -28.56673240661621, "global_step": 611287, "epoch": 7364} {"train_loss": -28.3643741607666, "global_step": 611288, "epoch": 7364} {"train_loss": -28.534894943237305, "global_step": 611289, "epoch": 7364} {"train_loss": -28.113866806030273, "global_step": 611290, "epoch": 7364} {"train_loss": -28.324371337890625, "global_step": 611291, "epoch": 7364} {"train_loss": -27.648273468017578, "global_step": 611292, "epoch": 7364} {"train_loss": -27.724781036376953, "global_step": 611293, "epoch": 7364} {"train_loss": -28.062083026012743, "global_step": 611294, "epoch": 7364, "val_loss": 6602031.0} {"train_loss": -26.623266220092773, "global_step": 611295, "epoch": 7365} {"train_loss": -27.70937156677246, "global_step": 611296, "epoch": 7365} {"train_loss": -28.113622665405273, "global_step": 611297, "epoch": 7365} {"train_loss": -26.994245529174805, "global_step": 611298, "epoch": 7365} {"train_loss": -27.092138290405273, "global_step": 611299, "epoch": 7365} {"train_loss": -27.508344650268555, "global_step": 611300, "epoch": 7365} {"train_loss": -27.252660751342773, "global_step": 611301, "epoch": 7365} {"train_loss": -27.285451889038086, "global_step": 611302, "epoch": 7365} {"train_loss": -27.81694984436035, "global_step": 611303, "epoch": 7365} {"train_loss": -27.2780704498291, "global_step": 611304, "epoch": 7365} {"train_loss": -27.199201583862305, "global_step": 611305, "epoch": 7365} {"train_loss": -27.694448471069336, "global_step": 611306, "epoch": 7365} {"train_loss": -27.40423583984375, "global_step": 611307, "epoch": 7365} {"train_loss": -27.608373641967773, "global_step": 611308, "epoch": 7365} {"train_loss": -27.76692008972168, "global_step": 611309, "epoch": 7365} {"train_loss": -27.74281120300293, "global_step": 611310, "epoch": 7365} {"train_loss": -28.02972412109375, "global_step": 611311, "epoch": 7365} {"train_loss": -27.677677154541016, "global_step": 611312, "epoch": 7365} {"train_loss": -27.447729110717773, "global_step": 611313, "epoch": 7365} {"train_loss": -27.790098190307617, "global_step": 611314, "epoch": 7365} {"train_loss": -27.828704833984375, "global_step": 611315, "epoch": 7365} {"train_loss": -27.72051429748535, "global_step": 611316, "epoch": 7365} {"train_loss": -28.092077255249023, "global_step": 611317, "epoch": 7365} {"train_loss": -27.82228660583496, "global_step": 611318, "epoch": 7365} {"train_loss": -28.237079620361328, "global_step": 611319, "epoch": 7365} {"train_loss": -27.861478805541992, "global_step": 611320, "epoch": 7365} {"train_loss": -27.958845138549805, "global_step": 611321, "epoch": 7365} {"train_loss": -27.7871036529541, "global_step": 611322, "epoch": 7365} {"train_loss": -27.68597984313965, "global_step": 611323, "epoch": 7365} {"train_loss": -27.885761260986328, "global_step": 611324, "epoch": 7365} {"train_loss": -27.690418243408203, "global_step": 611325, "epoch": 7365} {"train_loss": -27.92646598815918, "global_step": 611326, "epoch": 7365} {"train_loss": -27.78571891784668, "global_step": 611327, "epoch": 7365} {"train_loss": -27.74652671813965, "global_step": 611328, "epoch": 7365} {"train_loss": -28.244016647338867, "global_step": 611329, "epoch": 7365} {"train_loss": -28.14161491394043, "global_step": 611330, "epoch": 7365} {"train_loss": -28.036273956298828, "global_step": 611331, "epoch": 7365} {"train_loss": -27.985626220703125, "global_step": 611332, "epoch": 7365} {"train_loss": -28.307275772094727, "global_step": 611333, "epoch": 7365} {"train_loss": -27.93610954284668, "global_step": 611334, "epoch": 7365} {"train_loss": -28.222028732299805, "global_step": 611335, "epoch": 7365} {"train_loss": -27.824359893798828, "global_step": 611336, "epoch": 7365} {"train_loss": -28.25545310974121, "global_step": 611337, "epoch": 7365} {"train_loss": -28.1068172454834, "global_step": 611338, "epoch": 7365} {"train_loss": -27.930212020874023, "global_step": 611339, "epoch": 7365} {"train_loss": -28.0491886138916, "global_step": 611340, "epoch": 7365} {"train_loss": -28.2960205078125, "global_step": 611341, "epoch": 7365} {"train_loss": -28.316131591796875, "global_step": 611342, "epoch": 7365} {"train_loss": -27.891408920288086, "global_step": 611343, "epoch": 7365} {"train_loss": -27.99265480041504, "global_step": 611344, "epoch": 7365} {"train_loss": -28.173568725585938, "global_step": 611345, "epoch": 7365} {"train_loss": -27.970779418945312, "global_step": 611346, "epoch": 7365} {"train_loss": -27.96299171447754, "global_step": 611347, "epoch": 7365} {"train_loss": -28.323495864868164, "global_step": 611348, "epoch": 7365} {"train_loss": -28.276037216186523, "global_step": 611349, "epoch": 7365} {"train_loss": -27.95661735534668, "global_step": 611350, "epoch": 7365} {"train_loss": -28.157882690429688, "global_step": 611351, "epoch": 7365} {"train_loss": -28.36728858947754, "global_step": 611352, "epoch": 7365} {"train_loss": -27.9235782623291, "global_step": 611353, "epoch": 7365} {"train_loss": -27.789587020874023, "global_step": 611354, "epoch": 7365} {"train_loss": -28.295703887939453, "global_step": 611355, "epoch": 7365} {"train_loss": -28.460906982421875, "global_step": 611356, "epoch": 7365} {"train_loss": -28.072187423706055, "global_step": 611357, "epoch": 7365} {"train_loss": -28.560373306274414, "global_step": 611358, "epoch": 7365} {"train_loss": -28.250593185424805, "global_step": 611359, "epoch": 7365} {"train_loss": -28.152307510375977, "global_step": 611360, "epoch": 7365} {"train_loss": -28.326200485229492, "global_step": 611361, "epoch": 7365} {"train_loss": -28.26197624206543, "global_step": 611362, "epoch": 7365} {"train_loss": -28.09512710571289, "global_step": 611363, "epoch": 7365} {"train_loss": -28.444671630859375, "global_step": 611364, "epoch": 7365} {"train_loss": -28.208261489868164, "global_step": 611365, "epoch": 7365} {"train_loss": -27.876672744750977, "global_step": 611366, "epoch": 7365} {"train_loss": -27.85725212097168, "global_step": 611367, "epoch": 7365} {"train_loss": -28.41213035583496, "global_step": 611368, "epoch": 7365} {"train_loss": -27.972122192382812, "global_step": 611369, "epoch": 7365} {"train_loss": -27.736328125, "global_step": 611370, "epoch": 7365} {"train_loss": -27.57354164123535, "global_step": 611371, "epoch": 7365} {"train_loss": -27.525226593017578, "global_step": 611372, "epoch": 7365} {"train_loss": -27.91788101196289, "global_step": 611373, "epoch": 7365} {"train_loss": -28.260046005249023, "global_step": 611374, "epoch": 7365} {"train_loss": -26.836042404174805, "global_step": 611375, "epoch": 7365} {"train_loss": -26.989011764526367, "global_step": 611376, "epoch": 7365} {"train_loss": -27.894503995596644, "global_step": 611377, "epoch": 7365, "val_loss": 6565700.0} {"train_loss": -27.081069946289062, "global_step": 611378, "epoch": 7366} {"train_loss": -26.09266471862793, "global_step": 611379, "epoch": 7366} {"train_loss": -26.376752853393555, "global_step": 611380, "epoch": 7366} {"train_loss": -27.098318099975586, "global_step": 611381, "epoch": 7366} {"train_loss": -27.494619369506836, "global_step": 611382, "epoch": 7366} {"train_loss": -26.765024185180664, "global_step": 611383, "epoch": 7366} {"train_loss": -26.994403839111328, "global_step": 611384, "epoch": 7366} {"train_loss": -27.232526779174805, "global_step": 611385, "epoch": 7366} {"train_loss": -27.27857780456543, "global_step": 611386, "epoch": 7366} {"train_loss": -27.5899600982666, "global_step": 611387, "epoch": 7366} {"train_loss": -27.094501495361328, "global_step": 611388, "epoch": 7366} {"train_loss": -27.620229721069336, "global_step": 611389, "epoch": 7366} {"train_loss": -27.6684627532959, "global_step": 611390, "epoch": 7366} {"train_loss": -27.709949493408203, "global_step": 611391, "epoch": 7366} {"train_loss": -27.497655868530273, "global_step": 611392, "epoch": 7366} {"train_loss": -27.834264755249023, "global_step": 611393, "epoch": 7366} {"train_loss": -27.9268798828125, "global_step": 611394, "epoch": 7366} {"train_loss": -27.637195587158203, "global_step": 611395, "epoch": 7366} {"train_loss": -27.556781768798828, "global_step": 611396, "epoch": 7366} {"train_loss": -28.083515167236328, "global_step": 611397, "epoch": 7366} {"train_loss": -27.845829010009766, "global_step": 611398, "epoch": 7366} {"train_loss": -27.786142349243164, "global_step": 611399, "epoch": 7366} {"train_loss": -27.876440048217773, "global_step": 611400, "epoch": 7366} {"train_loss": -27.69533348083496, "global_step": 611401, "epoch": 7366} {"train_loss": -28.197660446166992, "global_step": 611402, "epoch": 7366} {"train_loss": -27.93267250061035, "global_step": 611403, "epoch": 7366} {"train_loss": -27.86942481994629, "global_step": 611404, "epoch": 7366} {"train_loss": -28.246448516845703, "global_step": 611405, "epoch": 7366} {"train_loss": -28.062274932861328, "global_step": 611406, "epoch": 7366} {"train_loss": -27.961978912353516, "global_step": 611407, "epoch": 7366} {"train_loss": -27.937408447265625, "global_step": 611408, "epoch": 7366} {"train_loss": -28.111291885375977, "global_step": 611409, "epoch": 7366} {"train_loss": -27.952350616455078, "global_step": 611410, "epoch": 7366} {"train_loss": -28.401731491088867, "global_step": 611411, "epoch": 7366} {"train_loss": -28.019392013549805, "global_step": 611412, "epoch": 7366} {"train_loss": -28.134084701538086, "global_step": 611413, "epoch": 7366} {"train_loss": -28.083703994750977, "global_step": 611414, "epoch": 7366} {"train_loss": -28.168798446655273, "global_step": 611415, "epoch": 7366} {"train_loss": -28.04091453552246, "global_step": 611416, "epoch": 7366} {"train_loss": -28.536008834838867, "global_step": 611417, "epoch": 7366} {"train_loss": -28.103683471679688, "global_step": 611418, "epoch": 7366} {"train_loss": -28.15667724609375, "global_step": 611419, "epoch": 7366} {"train_loss": -28.257080078125, "global_step": 611420, "epoch": 7366} {"train_loss": -27.866703033447266, "global_step": 611421, "epoch": 7366} {"train_loss": -27.98773193359375, "global_step": 611422, "epoch": 7366} {"train_loss": -27.81622314453125, "global_step": 611423, "epoch": 7366} {"train_loss": -27.987308502197266, "global_step": 611424, "epoch": 7366} {"train_loss": -28.13201332092285, "global_step": 611425, "epoch": 7366} {"train_loss": -27.840839385986328, "global_step": 611426, "epoch": 7366} {"train_loss": -27.869632720947266, "global_step": 611427, "epoch": 7366} {"train_loss": -28.6365909576416, "global_step": 611428, "epoch": 7366} {"train_loss": -28.013565063476562, "global_step": 611429, "epoch": 7366} {"train_loss": -27.902450561523438, "global_step": 611430, "epoch": 7366} {"train_loss": -28.148300170898438, "global_step": 611431, "epoch": 7366} {"train_loss": -28.200702667236328, "global_step": 611432, "epoch": 7366} {"train_loss": -28.09160804748535, "global_step": 611433, "epoch": 7366} {"train_loss": -28.16462516784668, "global_step": 611434, "epoch": 7366} {"train_loss": -28.506610870361328, "global_step": 611435, "epoch": 7366} {"train_loss": -28.05143165588379, "global_step": 611436, "epoch": 7366} {"train_loss": -28.483612060546875, "global_step": 611437, "epoch": 7366} {"train_loss": -28.35365867614746, "global_step": 611438, "epoch": 7366} {"train_loss": -28.392797470092773, "global_step": 611439, "epoch": 7366} {"train_loss": -28.583667755126953, "global_step": 611440, "epoch": 7366} {"train_loss": -28.11530113220215, "global_step": 611441, "epoch": 7366} {"train_loss": -28.425521850585938, "global_step": 611442, "epoch": 7366} {"train_loss": -28.141706466674805, "global_step": 611443, "epoch": 7366} {"train_loss": -27.76947021484375, "global_step": 611444, "epoch": 7366} {"train_loss": -28.428640365600586, "global_step": 611445, "epoch": 7366} {"train_loss": -28.038074493408203, "global_step": 611446, "epoch": 7366} {"train_loss": -28.22719383239746, "global_step": 611447, "epoch": 7366} {"train_loss": -28.127561569213867, "global_step": 611448, "epoch": 7366} {"train_loss": -27.901403427124023, "global_step": 611449, "epoch": 7366} {"train_loss": -27.856250762939453, "global_step": 611450, "epoch": 7366} {"train_loss": -28.34852409362793, "global_step": 611451, "epoch": 7366} {"train_loss": -27.824392318725586, "global_step": 611452, "epoch": 7366} {"train_loss": -28.087305068969727, "global_step": 611453, "epoch": 7366} {"train_loss": -27.847537994384766, "global_step": 611454, "epoch": 7366} {"train_loss": -28.227008819580078, "global_step": 611455, "epoch": 7366} {"train_loss": -27.635313034057617, "global_step": 611456, "epoch": 7366} {"train_loss": -27.925373077392578, "global_step": 611457, "epoch": 7366} {"train_loss": -28.039716720581055, "global_step": 611458, "epoch": 7366} {"train_loss": -27.591779708862305, "global_step": 611459, "epoch": 7366} {"train_loss": -27.88216885026679, "global_step": 611460, "epoch": 7366, "val_loss": 6621606.0} {"train_loss": -27.021528244018555, "global_step": 611461, "epoch": 7367} {"train_loss": -25.812942504882812, "global_step": 611462, "epoch": 7367} {"train_loss": -25.88763999938965, "global_step": 611463, "epoch": 7367} {"train_loss": -27.647754669189453, "global_step": 611464, "epoch": 7367} {"train_loss": -26.07404899597168, "global_step": 611465, "epoch": 7367} {"train_loss": -27.036157608032227, "global_step": 611466, "epoch": 7367} {"train_loss": -27.31696128845215, "global_step": 611467, "epoch": 7367} {"train_loss": -27.07423210144043, "global_step": 611468, "epoch": 7367} {"train_loss": -27.08479118347168, "global_step": 611469, "epoch": 7367} {"train_loss": -27.2183895111084, "global_step": 611470, "epoch": 7367} {"train_loss": -27.0734920501709, "global_step": 611471, "epoch": 7367} {"train_loss": -27.699506759643555, "global_step": 611472, "epoch": 7367} {"train_loss": -27.4674072265625, "global_step": 611473, "epoch": 7367} {"train_loss": -27.475788116455078, "global_step": 611474, "epoch": 7367} {"train_loss": -27.623998641967773, "global_step": 611475, "epoch": 7367} {"train_loss": -27.65177345275879, "global_step": 611476, "epoch": 7367} {"train_loss": -27.524871826171875, "global_step": 611477, "epoch": 7367} {"train_loss": -27.470062255859375, "global_step": 611478, "epoch": 7367} {"train_loss": -27.13848304748535, "global_step": 611479, "epoch": 7367} {"train_loss": -27.66815185546875, "global_step": 611480, "epoch": 7367} {"train_loss": -27.196918487548828, "global_step": 611481, "epoch": 7367} {"train_loss": -27.76963233947754, "global_step": 611482, "epoch": 7367} {"train_loss": -27.629987716674805, "global_step": 611483, "epoch": 7367} {"train_loss": -27.76588249206543, "global_step": 611484, "epoch": 7367} {"train_loss": -27.810583114624023, "global_step": 611485, "epoch": 7367} {"train_loss": -28.033151626586914, "global_step": 611486, "epoch": 7367} {"train_loss": -27.794172286987305, "global_step": 611487, "epoch": 7367} {"train_loss": -28.023000717163086, "global_step": 611488, "epoch": 7367} {"train_loss": -27.885086059570312, "global_step": 611489, "epoch": 7367} {"train_loss": -27.83662223815918, "global_step": 611490, "epoch": 7367} {"train_loss": -27.95088768005371, "global_step": 611491, "epoch": 7367} {"train_loss": -28.048904418945312, "global_step": 611492, "epoch": 7367} {"train_loss": -27.70989990234375, "global_step": 611493, "epoch": 7367} {"train_loss": -27.770130157470703, "global_step": 611494, "epoch": 7367} {"train_loss": -28.360610961914062, "global_step": 611495, "epoch": 7367} {"train_loss": -27.99859619140625, "global_step": 611496, "epoch": 7367} {"train_loss": -28.345661163330078, "global_step": 611497, "epoch": 7367} {"train_loss": -27.70318603515625, "global_step": 611498, "epoch": 7367} {"train_loss": -28.101245880126953, "global_step": 611499, "epoch": 7367} {"train_loss": -28.086669921875, "global_step": 611500, "epoch": 7367} {"train_loss": -27.947141647338867, "global_step": 611501, "epoch": 7367} {"train_loss": -28.178924560546875, "global_step": 611502, "epoch": 7367} {"train_loss": -28.073720932006836, "global_step": 611503, "epoch": 7367} {"train_loss": -28.156967163085938, "global_step": 611504, "epoch": 7367} {"train_loss": -28.203393936157227, "global_step": 611505, "epoch": 7367} {"train_loss": -28.021472930908203, "global_step": 611506, "epoch": 7367} {"train_loss": -28.284900665283203, "global_step": 611507, "epoch": 7367} {"train_loss": -28.498746871948242, "global_step": 611508, "epoch": 7367} {"train_loss": -27.987768173217773, "global_step": 611509, "epoch": 7367} {"train_loss": -28.106525421142578, "global_step": 611510, "epoch": 7367} {"train_loss": -28.07966423034668, "global_step": 611511, "epoch": 7367} {"train_loss": -27.6883487701416, "global_step": 611512, "epoch": 7367} {"train_loss": -27.510726928710938, "global_step": 611513, "epoch": 7367} {"train_loss": -27.500513076782227, "global_step": 611514, "epoch": 7367} {"train_loss": -27.791296005249023, "global_step": 611515, "epoch": 7367} {"train_loss": -27.827756881713867, "global_step": 611516, "epoch": 7367} {"train_loss": -27.684890747070312, "global_step": 611517, "epoch": 7367} {"train_loss": -28.32329750061035, "global_step": 611518, "epoch": 7367} {"train_loss": -27.965147018432617, "global_step": 611519, "epoch": 7367} {"train_loss": -27.751867294311523, "global_step": 611520, "epoch": 7367} {"train_loss": -27.9627742767334, "global_step": 611521, "epoch": 7367} {"train_loss": -27.72039794921875, "global_step": 611522, "epoch": 7367} {"train_loss": -27.750701904296875, "global_step": 611523, "epoch": 7367} {"train_loss": -27.0483341217041, "global_step": 611524, "epoch": 7367} {"train_loss": -28.214879989624023, "global_step": 611525, "epoch": 7367} {"train_loss": -27.798694610595703, "global_step": 611526, "epoch": 7367} {"train_loss": -27.77017593383789, "global_step": 611527, "epoch": 7367} {"train_loss": -27.9279842376709, "global_step": 611528, "epoch": 7367} {"train_loss": -27.55950927734375, "global_step": 611529, "epoch": 7367} {"train_loss": -27.80548095703125, "global_step": 611530, "epoch": 7367} {"train_loss": -27.509241104125977, "global_step": 611531, "epoch": 7367} {"train_loss": -28.145771026611328, "global_step": 611532, "epoch": 7367} {"train_loss": -28.271055221557617, "global_step": 611533, "epoch": 7367} {"train_loss": -27.92475700378418, "global_step": 611534, "epoch": 7367} {"train_loss": -27.870574951171875, "global_step": 611535, "epoch": 7367} {"train_loss": -28.19781494140625, "global_step": 611536, "epoch": 7367} {"train_loss": -28.22149085998535, "global_step": 611537, "epoch": 7367} {"train_loss": -27.829681396484375, "global_step": 611538, "epoch": 7367} {"train_loss": -28.231597900390625, "global_step": 611539, "epoch": 7367} {"train_loss": -27.997116088867188, "global_step": 611540, "epoch": 7367} {"train_loss": -28.2962703704834, "global_step": 611541, "epoch": 7367} {"train_loss": -28.1466064453125, "global_step": 611542, "epoch": 7367} {"train_loss": -27.75144845893584, "global_step": 611543, "epoch": 7367, "val_loss": 6616650.5} {"train_loss": -27.301010131835938, "global_step": 611544, "epoch": 7368} {"train_loss": -27.796655654907227, "global_step": 611545, "epoch": 7368} {"train_loss": -27.663705825805664, "global_step": 611546, "epoch": 7368} {"train_loss": -27.544580459594727, "global_step": 611547, "epoch": 7368} {"train_loss": -28.0819091796875, "global_step": 611548, "epoch": 7368} {"train_loss": -27.951663970947266, "global_step": 611549, "epoch": 7368} {"train_loss": -27.793371200561523, "global_step": 611550, "epoch": 7368} {"train_loss": -27.936416625976562, "global_step": 611551, "epoch": 7368} {"train_loss": -27.71992301940918, "global_step": 611552, "epoch": 7368} {"train_loss": -27.73805046081543, "global_step": 611553, "epoch": 7368} {"train_loss": -27.705890655517578, "global_step": 611554, "epoch": 7368} {"train_loss": -27.995834350585938, "global_step": 611555, "epoch": 7368} {"train_loss": -27.730886459350586, "global_step": 611556, "epoch": 7368} {"train_loss": -27.93853759765625, "global_step": 611557, "epoch": 7368} {"train_loss": -28.18597984313965, "global_step": 611558, "epoch": 7368} {"train_loss": -28.036401748657227, "global_step": 611559, "epoch": 7368} {"train_loss": -28.2713565826416, "global_step": 611560, "epoch": 7368} {"train_loss": -27.873640060424805, "global_step": 611561, "epoch": 7368} {"train_loss": -28.055816650390625, "global_step": 611562, "epoch": 7368} {"train_loss": -28.1330623626709, "global_step": 611563, "epoch": 7368} {"train_loss": -28.386640548706055, "global_step": 611564, "epoch": 7368} {"train_loss": -28.099292755126953, "global_step": 611565, "epoch": 7368} {"train_loss": -28.278833389282227, "global_step": 611566, "epoch": 7368} {"train_loss": -27.850482940673828, "global_step": 611567, "epoch": 7368} {"train_loss": -28.12839698791504, "global_step": 611568, "epoch": 7368} {"train_loss": -28.158985137939453, "global_step": 611569, "epoch": 7368} {"train_loss": -28.019582748413086, "global_step": 611570, "epoch": 7368} {"train_loss": -28.300277709960938, "global_step": 611571, "epoch": 7368} {"train_loss": -28.0640926361084, "global_step": 611572, "epoch": 7368} {"train_loss": -27.78618812561035, "global_step": 611573, "epoch": 7368} {"train_loss": -28.318998336791992, "global_step": 611574, "epoch": 7368} {"train_loss": -28.00886344909668, "global_step": 611575, "epoch": 7368} {"train_loss": -28.521345138549805, "global_step": 611576, "epoch": 7368} {"train_loss": -28.02021598815918, "global_step": 611577, "epoch": 7368} {"train_loss": -27.941781997680664, "global_step": 611578, "epoch": 7368} {"train_loss": -28.071060180664062, "global_step": 611579, "epoch": 7368} {"train_loss": -27.8980770111084, "global_step": 611580, "epoch": 7368} {"train_loss": -28.558734893798828, "global_step": 611581, "epoch": 7368} {"train_loss": -28.23419189453125, "global_step": 611582, "epoch": 7368} {"train_loss": -28.373706817626953, "global_step": 611583, "epoch": 7368} {"train_loss": -28.212940216064453, "global_step": 611584, "epoch": 7368} {"train_loss": -28.20490074157715, "global_step": 611585, "epoch": 7368} {"train_loss": -27.9703426361084, "global_step": 611586, "epoch": 7368} {"train_loss": -28.632450103759766, "global_step": 611587, "epoch": 7368} {"train_loss": -28.4129581451416, "global_step": 611588, "epoch": 7368} {"train_loss": -28.369165420532227, "global_step": 611589, "epoch": 7368} {"train_loss": -28.499847412109375, "global_step": 611590, "epoch": 7368} {"train_loss": -28.173694610595703, "global_step": 611591, "epoch": 7368} {"train_loss": -28.262012481689453, "global_step": 611592, "epoch": 7368} {"train_loss": -28.313337326049805, "global_step": 611593, "epoch": 7368} {"train_loss": -28.087905883789062, "global_step": 611594, "epoch": 7368} {"train_loss": -28.43000602722168, "global_step": 611595, "epoch": 7368} {"train_loss": -27.863019943237305, "global_step": 611596, "epoch": 7368} {"train_loss": -28.358381271362305, "global_step": 611597, "epoch": 7368} {"train_loss": -28.276092529296875, "global_step": 611598, "epoch": 7368} {"train_loss": -28.392105102539062, "global_step": 611599, "epoch": 7368} {"train_loss": -28.224451065063477, "global_step": 611600, "epoch": 7368} {"train_loss": -27.751331329345703, "global_step": 611601, "epoch": 7368} {"train_loss": -27.823755264282227, "global_step": 611602, "epoch": 7368} {"train_loss": -27.64804458618164, "global_step": 611603, "epoch": 7368} {"train_loss": -27.672046661376953, "global_step": 611604, "epoch": 7368} {"train_loss": -27.807973861694336, "global_step": 611605, "epoch": 7368} {"train_loss": -27.97083854675293, "global_step": 611606, "epoch": 7368} {"train_loss": -28.127399444580078, "global_step": 611607, "epoch": 7368} {"train_loss": -28.027759552001953, "global_step": 611608, "epoch": 7368} {"train_loss": -27.887073516845703, "global_step": 611609, "epoch": 7368} {"train_loss": -28.038114547729492, "global_step": 611610, "epoch": 7368} {"train_loss": -27.533203125, "global_step": 611611, "epoch": 7368} {"train_loss": -27.471832275390625, "global_step": 611612, "epoch": 7368} {"train_loss": -27.229328155517578, "global_step": 611613, "epoch": 7368} {"train_loss": -27.681943893432617, "global_step": 611614, "epoch": 7368} {"train_loss": -27.83255958557129, "global_step": 611615, "epoch": 7368} {"train_loss": -27.842117309570312, "global_step": 611616, "epoch": 7368} {"train_loss": -28.018497467041016, "global_step": 611617, "epoch": 7368} {"train_loss": -27.743152618408203, "global_step": 611618, "epoch": 7368} {"train_loss": -27.993677139282227, "global_step": 611619, "epoch": 7368} {"train_loss": -28.18427848815918, "global_step": 611620, "epoch": 7368} {"train_loss": -27.888992309570312, "global_step": 611621, "epoch": 7368} {"train_loss": -28.159948348999023, "global_step": 611622, "epoch": 7368} {"train_loss": -27.830602645874023, "global_step": 611623, "epoch": 7368} {"train_loss": -27.96339225769043, "global_step": 611624, "epoch": 7368} {"train_loss": -28.242252349853516, "global_step": 611625, "epoch": 7368} {"train_loss": -28.022759586931713, "global_step": 611626, "epoch": 7368, "val_loss": 6675585.0} {"train_loss": -27.505786895751953, "global_step": 611627, "epoch": 7369} {"train_loss": -27.890640258789062, "global_step": 611628, "epoch": 7369} {"train_loss": -27.75025749206543, "global_step": 611629, "epoch": 7369} {"train_loss": -27.699254989624023, "global_step": 611630, "epoch": 7369} {"train_loss": -27.7286376953125, "global_step": 611631, "epoch": 7369} {"train_loss": -27.77166748046875, "global_step": 611632, "epoch": 7369} {"train_loss": -27.818777084350586, "global_step": 611633, "epoch": 7369} {"train_loss": -27.871662139892578, "global_step": 611634, "epoch": 7369} {"train_loss": -27.53951072692871, "global_step": 611635, "epoch": 7369} {"train_loss": -27.886493682861328, "global_step": 611636, "epoch": 7369} {"train_loss": -27.600107192993164, "global_step": 611637, "epoch": 7369} {"train_loss": -28.063098907470703, "global_step": 611638, "epoch": 7369} {"train_loss": -28.366992950439453, "global_step": 611639, "epoch": 7369} {"train_loss": -27.967376708984375, "global_step": 611640, "epoch": 7369} {"train_loss": -27.8007869720459, "global_step": 611641, "epoch": 7369} {"train_loss": -28.277997970581055, "global_step": 611642, "epoch": 7369} {"train_loss": -27.120817184448242, "global_step": 611643, "epoch": 7369} {"train_loss": -28.318313598632812, "global_step": 611644, "epoch": 7369} {"train_loss": -28.116918563842773, "global_step": 611645, "epoch": 7369} {"train_loss": -27.77625846862793, "global_step": 611646, "epoch": 7369} {"train_loss": -28.078277587890625, "global_step": 611647, "epoch": 7369} {"train_loss": -28.070068359375, "global_step": 611648, "epoch": 7369} {"train_loss": -28.308155059814453, "global_step": 611649, "epoch": 7369} {"train_loss": -27.989973068237305, "global_step": 611650, "epoch": 7369} {"train_loss": -28.151172637939453, "global_step": 611651, "epoch": 7369} {"train_loss": -27.675907135009766, "global_step": 611652, "epoch": 7369} {"train_loss": -28.15189552307129, "global_step": 611653, "epoch": 7369} {"train_loss": -28.088790893554688, "global_step": 611654, "epoch": 7369} {"train_loss": -28.25798988342285, "global_step": 611655, "epoch": 7369} {"train_loss": -27.661054611206055, "global_step": 611656, "epoch": 7369} {"train_loss": -28.220367431640625, "global_step": 611657, "epoch": 7369} {"train_loss": -28.08536148071289, "global_step": 611658, "epoch": 7369} {"train_loss": -27.884674072265625, "global_step": 611659, "epoch": 7369} {"train_loss": -28.058547973632812, "global_step": 611660, "epoch": 7369} {"train_loss": -28.531248092651367, "global_step": 611661, "epoch": 7369} {"train_loss": -28.076400756835938, "global_step": 611662, "epoch": 7369} {"train_loss": -28.121124267578125, "global_step": 611663, "epoch": 7369} {"train_loss": -28.07620620727539, "global_step": 611664, "epoch": 7369} {"train_loss": -28.25629997253418, "global_step": 611665, "epoch": 7369} {"train_loss": -28.125202178955078, "global_step": 611666, "epoch": 7369} {"train_loss": -27.71235466003418, "global_step": 611667, "epoch": 7369} {"train_loss": -28.18524169921875, "global_step": 611668, "epoch": 7369} {"train_loss": -28.2504940032959, "global_step": 611669, "epoch": 7369} {"train_loss": -27.980398178100586, "global_step": 611670, "epoch": 7369} {"train_loss": -27.447431564331055, "global_step": 611671, "epoch": 7369} {"train_loss": -27.513635635375977, "global_step": 611672, "epoch": 7369} {"train_loss": -27.67411231994629, "global_step": 611673, "epoch": 7369} {"train_loss": -27.863727569580078, "global_step": 611674, "epoch": 7369} {"train_loss": -27.190954208374023, "global_step": 611675, "epoch": 7369} {"train_loss": -27.991992950439453, "global_step": 611676, "epoch": 7369} {"train_loss": -27.907957077026367, "global_step": 611677, "epoch": 7369} {"train_loss": -27.41657829284668, "global_step": 611678, "epoch": 7369} {"train_loss": -28.566125869750977, "global_step": 611679, "epoch": 7369} {"train_loss": -27.2941837310791, "global_step": 611680, "epoch": 7369} {"train_loss": -28.003934860229492, "global_step": 611681, "epoch": 7369} {"train_loss": -28.0250301361084, "global_step": 611682, "epoch": 7369} {"train_loss": -28.133214950561523, "global_step": 611683, "epoch": 7369} {"train_loss": -28.1272029876709, "global_step": 611684, "epoch": 7369} {"train_loss": -27.812335968017578, "global_step": 611685, "epoch": 7369} {"train_loss": -27.948440551757812, "global_step": 611686, "epoch": 7369} {"train_loss": -27.755584716796875, "global_step": 611687, "epoch": 7369} {"train_loss": -28.140857696533203, "global_step": 611688, "epoch": 7369} {"train_loss": -28.15264892578125, "global_step": 611689, "epoch": 7369} {"train_loss": -28.18329429626465, "global_step": 611690, "epoch": 7369} {"train_loss": -28.49875259399414, "global_step": 611691, "epoch": 7369} {"train_loss": -28.251977920532227, "global_step": 611692, "epoch": 7369} {"train_loss": -28.28913688659668, "global_step": 611693, "epoch": 7369} {"train_loss": -27.894134521484375, "global_step": 611694, "epoch": 7369} {"train_loss": -28.16643714904785, "global_step": 611695, "epoch": 7369} {"train_loss": -28.041223526000977, "global_step": 611696, "epoch": 7369} {"train_loss": -28.1850528717041, "global_step": 611697, "epoch": 7369} {"train_loss": -28.312856674194336, "global_step": 611698, "epoch": 7369} {"train_loss": -28.236358642578125, "global_step": 611699, "epoch": 7369} {"train_loss": -28.132104873657227, "global_step": 611700, "epoch": 7369} {"train_loss": -28.012861251831055, "global_step": 611701, "epoch": 7369} {"train_loss": -28.062116622924805, "global_step": 611702, "epoch": 7369} {"train_loss": -28.117919921875, "global_step": 611703, "epoch": 7369} {"train_loss": -28.157018661499023, "global_step": 611704, "epoch": 7369} {"train_loss": -28.311426162719727, "global_step": 611705, "epoch": 7369} {"train_loss": -28.4235897064209, "global_step": 611706, "epoch": 7369} {"train_loss": -28.298673629760742, "global_step": 611707, "epoch": 7369} {"train_loss": -28.33868980407715, "global_step": 611708, "epoch": 7369} {"train_loss": -28.009902908141356, "global_step": 611709, "epoch": 7369, "val_loss": 6655713.0} {"train_loss": -27.25152587890625, "global_step": 611710, "epoch": 7370} {"train_loss": -26.57325553894043, "global_step": 611711, "epoch": 7370} {"train_loss": -27.22364616394043, "global_step": 611712, "epoch": 7370} {"train_loss": -27.348285675048828, "global_step": 611713, "epoch": 7370} {"train_loss": -26.583133697509766, "global_step": 611714, "epoch": 7370} {"train_loss": -27.02117347717285, "global_step": 611715, "epoch": 7370} {"train_loss": -26.945043563842773, "global_step": 611716, "epoch": 7370} {"train_loss": -27.322290420532227, "global_step": 611717, "epoch": 7370} {"train_loss": -27.552900314331055, "global_step": 611718, "epoch": 7370} {"train_loss": -27.365087509155273, "global_step": 611719, "epoch": 7370} {"train_loss": -27.862781524658203, "global_step": 611720, "epoch": 7370} {"train_loss": -27.617517471313477, "global_step": 611721, "epoch": 7370} {"train_loss": -27.26099967956543, "global_step": 611722, "epoch": 7370} {"train_loss": -27.636999130249023, "global_step": 611723, "epoch": 7370} {"train_loss": -27.646459579467773, "global_step": 611724, "epoch": 7370} {"train_loss": -27.830698013305664, "global_step": 611725, "epoch": 7370} {"train_loss": -27.710309982299805, "global_step": 611726, "epoch": 7370} {"train_loss": -27.84610939025879, "global_step": 611727, "epoch": 7370} {"train_loss": -27.585485458374023, "global_step": 611728, "epoch": 7370} {"train_loss": -27.544910430908203, "global_step": 611729, "epoch": 7370} {"train_loss": -27.861652374267578, "global_step": 611730, "epoch": 7370} {"train_loss": -27.9058895111084, "global_step": 611731, "epoch": 7370} {"train_loss": -27.737018585205078, "global_step": 611732, "epoch": 7370} {"train_loss": -28.081134796142578, "global_step": 611733, "epoch": 7370} {"train_loss": -28.186899185180664, "global_step": 611734, "epoch": 7370} {"train_loss": -27.969797134399414, "global_step": 611735, "epoch": 7370} {"train_loss": -27.71229362487793, "global_step": 611736, "epoch": 7370} {"train_loss": -27.98672866821289, "global_step": 611737, "epoch": 7370} {"train_loss": -28.0582275390625, "global_step": 611738, "epoch": 7370} {"train_loss": -27.90106201171875, "global_step": 611739, "epoch": 7370} {"train_loss": -27.747745513916016, "global_step": 611740, "epoch": 7370} {"train_loss": -27.989103317260742, "global_step": 611741, "epoch": 7370} {"train_loss": -27.82484245300293, "global_step": 611742, "epoch": 7370} {"train_loss": -27.992063522338867, "global_step": 611743, "epoch": 7370} {"train_loss": -28.27948570251465, "global_step": 611744, "epoch": 7370} {"train_loss": -27.864093780517578, "global_step": 611745, "epoch": 7370} {"train_loss": -27.639379501342773, "global_step": 611746, "epoch": 7370} {"train_loss": -28.115497589111328, "global_step": 611747, "epoch": 7370} {"train_loss": -28.298791885375977, "global_step": 611748, "epoch": 7370} {"train_loss": -28.220504760742188, "global_step": 611749, "epoch": 7370} {"train_loss": -28.00153160095215, "global_step": 611750, "epoch": 7370} {"train_loss": -28.40860366821289, "global_step": 611751, "epoch": 7370} {"train_loss": -28.202184677124023, "global_step": 611752, "epoch": 7370} {"train_loss": -28.282012939453125, "global_step": 611753, "epoch": 7370} {"train_loss": -28.18583106994629, "global_step": 611754, "epoch": 7370} {"train_loss": -28.116113662719727, "global_step": 611755, "epoch": 7370} {"train_loss": -27.859792709350586, "global_step": 611756, "epoch": 7370} {"train_loss": -28.09308433532715, "global_step": 611757, "epoch": 7370} {"train_loss": -28.41582679748535, "global_step": 611758, "epoch": 7370} {"train_loss": -28.477710723876953, "global_step": 611759, "epoch": 7370} {"train_loss": -28.648588180541992, "global_step": 611760, "epoch": 7370} {"train_loss": -28.43621253967285, "global_step": 611761, "epoch": 7370} {"train_loss": -28.40302848815918, "global_step": 611762, "epoch": 7370} {"train_loss": -28.687183380126953, "global_step": 611763, "epoch": 7370} {"train_loss": -28.454370498657227, "global_step": 611764, "epoch": 7370} {"train_loss": -28.160924911499023, "global_step": 611765, "epoch": 7370} {"train_loss": -28.37652015686035, "global_step": 611766, "epoch": 7370} {"train_loss": -28.33927345275879, "global_step": 611767, "epoch": 7370} {"train_loss": -28.433080673217773, "global_step": 611768, "epoch": 7370} {"train_loss": -28.155298233032227, "global_step": 611769, "epoch": 7370} {"train_loss": -28.430648803710938, "global_step": 611770, "epoch": 7370} {"train_loss": -28.328840255737305, "global_step": 611771, "epoch": 7370} {"train_loss": -28.316268920898438, "global_step": 611772, "epoch": 7370} {"train_loss": -28.399229049682617, "global_step": 611773, "epoch": 7370} {"train_loss": -28.542638778686523, "global_step": 611774, "epoch": 7370} {"train_loss": -28.062665939331055, "global_step": 611775, "epoch": 7370} {"train_loss": -28.439105987548828, "global_step": 611776, "epoch": 7370} {"train_loss": -27.917463302612305, "global_step": 611777, "epoch": 7370} {"train_loss": -27.47462272644043, "global_step": 611778, "epoch": 7370} {"train_loss": -26.9744873046875, "global_step": 611779, "epoch": 7370} {"train_loss": -27.685352325439453, "global_step": 611780, "epoch": 7370} {"train_loss": -27.761625289916992, "global_step": 611781, "epoch": 7370} {"train_loss": -28.0504093170166, "global_step": 611782, "epoch": 7370} {"train_loss": -28.068836212158203, "global_step": 611783, "epoch": 7370} {"train_loss": -27.52490234375, "global_step": 611784, "epoch": 7370} {"train_loss": -27.666051864624023, "global_step": 611785, "epoch": 7370} {"train_loss": -28.124853134155273, "global_step": 611786, "epoch": 7370} {"train_loss": -27.90122413635254, "global_step": 611787, "epoch": 7370} {"train_loss": -27.950559616088867, "global_step": 611788, "epoch": 7370} {"train_loss": -27.84674644470215, "global_step": 611789, "epoch": 7370} {"train_loss": -27.534515380859375, "global_step": 611790, "epoch": 7370} {"train_loss": -27.847497940063477, "global_step": 611791, "epoch": 7370} {"train_loss": -27.900559367903742, "global_step": 611792, "epoch": 7370, "val_loss": 6592063.5} {"train_loss": -27.616077423095703, "global_step": 611793, "epoch": 7371} {"train_loss": -27.256702423095703, "global_step": 611794, "epoch": 7371} {"train_loss": -27.325048446655273, "global_step": 611795, "epoch": 7371} {"train_loss": -27.64788818359375, "global_step": 611796, "epoch": 7371} {"train_loss": -27.153650283813477, "global_step": 611797, "epoch": 7371} {"train_loss": -26.6997013092041, "global_step": 611798, "epoch": 7371} {"train_loss": -28.079498291015625, "global_step": 611799, "epoch": 7371} {"train_loss": -27.068639755249023, "global_step": 611800, "epoch": 7371} {"train_loss": -26.656057357788086, "global_step": 611801, "epoch": 7371} {"train_loss": -27.3708438873291, "global_step": 611802, "epoch": 7371} {"train_loss": -26.961902618408203, "global_step": 611803, "epoch": 7371} {"train_loss": -27.085790634155273, "global_step": 611804, "epoch": 7371} {"train_loss": -27.574182510375977, "global_step": 611805, "epoch": 7371} {"train_loss": -27.53895378112793, "global_step": 611806, "epoch": 7371} {"train_loss": -27.296741485595703, "global_step": 611807, "epoch": 7371} {"train_loss": -27.545368194580078, "global_step": 611808, "epoch": 7371} {"train_loss": -27.26319694519043, "global_step": 611809, "epoch": 7371} {"train_loss": -27.732019424438477, "global_step": 611810, "epoch": 7371} {"train_loss": -27.746322631835938, "global_step": 611811, "epoch": 7371} {"train_loss": -27.84308433532715, "global_step": 611812, "epoch": 7371} {"train_loss": -27.591650009155273, "global_step": 611813, "epoch": 7371} {"train_loss": -27.68851661682129, "global_step": 611814, "epoch": 7371} {"train_loss": -27.540380477905273, "global_step": 611815, "epoch": 7371} {"train_loss": -27.61029624938965, "global_step": 611816, "epoch": 7371} {"train_loss": -27.648361206054688, "global_step": 611817, "epoch": 7371} {"train_loss": -27.741016387939453, "global_step": 611818, "epoch": 7371} {"train_loss": -27.94242286682129, "global_step": 611819, "epoch": 7371} {"train_loss": -27.743066787719727, "global_step": 611820, "epoch": 7371} {"train_loss": -28.180517196655273, "global_step": 611821, "epoch": 7371} {"train_loss": -27.874189376831055, "global_step": 611822, "epoch": 7371} {"train_loss": -27.74942398071289, "global_step": 611823, "epoch": 7371} {"train_loss": -28.07671546936035, "global_step": 611824, "epoch": 7371} {"train_loss": -27.732925415039062, "global_step": 611825, "epoch": 7371} {"train_loss": -27.7667179107666, "global_step": 611826, "epoch": 7371} {"train_loss": -28.307941436767578, "global_step": 611827, "epoch": 7371} {"train_loss": -28.006103515625, "global_step": 611828, "epoch": 7371} {"train_loss": -28.119901657104492, "global_step": 611829, "epoch": 7371} {"train_loss": -28.006103515625, "global_step": 611830, "epoch": 7371} {"train_loss": -28.182723999023438, "global_step": 611831, "epoch": 7371} {"train_loss": -28.258127212524414, "global_step": 611832, "epoch": 7371} {"train_loss": -28.306049346923828, "global_step": 611833, "epoch": 7371} {"train_loss": -28.1058349609375, "global_step": 611834, "epoch": 7371} {"train_loss": -28.2347412109375, "global_step": 611835, "epoch": 7371} {"train_loss": -27.877573013305664, "global_step": 611836, "epoch": 7371} {"train_loss": -28.1365909576416, "global_step": 611837, "epoch": 7371} {"train_loss": -28.116247177124023, "global_step": 611838, "epoch": 7371} {"train_loss": -28.312711715698242, "global_step": 611839, "epoch": 7371} {"train_loss": -28.172815322875977, "global_step": 611840, "epoch": 7371} {"train_loss": -28.814599990844727, "global_step": 611841, "epoch": 7371} {"train_loss": -28.49541664123535, "global_step": 611842, "epoch": 7371} {"train_loss": -27.958240509033203, "global_step": 611843, "epoch": 7371} {"train_loss": -28.252521514892578, "global_step": 611844, "epoch": 7371} {"train_loss": -28.208948135375977, "global_step": 611845, "epoch": 7371} {"train_loss": -28.547582626342773, "global_step": 611846, "epoch": 7371} {"train_loss": -28.222883224487305, "global_step": 611847, "epoch": 7371} {"train_loss": -27.953733444213867, "global_step": 611848, "epoch": 7371} {"train_loss": -28.25420570373535, "global_step": 611849, "epoch": 7371} {"train_loss": -28.461950302124023, "global_step": 611850, "epoch": 7371} {"train_loss": -28.368017196655273, "global_step": 611851, "epoch": 7371} {"train_loss": -27.817138671875, "global_step": 611852, "epoch": 7371} {"train_loss": -28.149641036987305, "global_step": 611853, "epoch": 7371} {"train_loss": -28.351057052612305, "global_step": 611854, "epoch": 7371} {"train_loss": -28.33713150024414, "global_step": 611855, "epoch": 7371} {"train_loss": -28.077157974243164, "global_step": 611856, "epoch": 7371} {"train_loss": -28.21603775024414, "global_step": 611857, "epoch": 7371} {"train_loss": -28.41829490661621, "global_step": 611858, "epoch": 7371} {"train_loss": -28.083087921142578, "global_step": 611859, "epoch": 7371} {"train_loss": -28.225757598876953, "global_step": 611860, "epoch": 7371} {"train_loss": -28.479150772094727, "global_step": 611861, "epoch": 7371} {"train_loss": -28.155399322509766, "global_step": 611862, "epoch": 7371} {"train_loss": -28.429824829101562, "global_step": 611863, "epoch": 7371} {"train_loss": -28.528583526611328, "global_step": 611864, "epoch": 7371} {"train_loss": -28.348896026611328, "global_step": 611865, "epoch": 7371} {"train_loss": -28.255374908447266, "global_step": 611866, "epoch": 7371} {"train_loss": -28.397974014282227, "global_step": 611867, "epoch": 7371} {"train_loss": -28.40386962890625, "global_step": 611868, "epoch": 7371} {"train_loss": -28.59341812133789, "global_step": 611869, "epoch": 7371} {"train_loss": -28.247888565063477, "global_step": 611870, "epoch": 7371} {"train_loss": -28.333887100219727, "global_step": 611871, "epoch": 7371} {"train_loss": -28.314258575439453, "global_step": 611872, "epoch": 7371} {"train_loss": -28.550369262695312, "global_step": 611873, "epoch": 7371} {"train_loss": -28.32155418395996, "global_step": 611874, "epoch": 7371} {"train_loss": -27.96010552831443, "global_step": 611875, "epoch": 7371, "val_loss": 6645315.0} {"train_loss": -27.235563278198242, "global_step": 611876, "epoch": 7372} {"train_loss": -26.342334747314453, "global_step": 611877, "epoch": 7372} {"train_loss": -26.08970069885254, "global_step": 611878, "epoch": 7372} {"train_loss": -26.818374633789062, "global_step": 611879, "epoch": 7372} {"train_loss": -27.237445831298828, "global_step": 611880, "epoch": 7372} {"train_loss": -27.197275161743164, "global_step": 611881, "epoch": 7372} {"train_loss": -27.491968154907227, "global_step": 611882, "epoch": 7372} {"train_loss": -27.599231719970703, "global_step": 611883, "epoch": 7372} {"train_loss": -27.3437442779541, "global_step": 611884, "epoch": 7372} {"train_loss": -28.04889488220215, "global_step": 611885, "epoch": 7372} {"train_loss": -27.01917839050293, "global_step": 611886, "epoch": 7372} {"train_loss": -27.461633682250977, "global_step": 611887, "epoch": 7372} {"train_loss": -27.065359115600586, "global_step": 611888, "epoch": 7372} {"train_loss": -27.606433868408203, "global_step": 611889, "epoch": 7372} {"train_loss": -27.613733291625977, "global_step": 611890, "epoch": 7372} {"train_loss": -27.702655792236328, "global_step": 611891, "epoch": 7372} {"train_loss": -27.564807891845703, "global_step": 611892, "epoch": 7372} {"train_loss": -27.511016845703125, "global_step": 611893, "epoch": 7372} {"train_loss": -27.73407554626465, "global_step": 611894, "epoch": 7372} {"train_loss": -27.543476104736328, "global_step": 611895, "epoch": 7372} {"train_loss": -27.8705997467041, "global_step": 611896, "epoch": 7372} {"train_loss": -27.393896102905273, "global_step": 611897, "epoch": 7372} {"train_loss": -27.72989845275879, "global_step": 611898, "epoch": 7372} {"train_loss": -27.81781578063965, "global_step": 611899, "epoch": 7372} {"train_loss": -27.562335968017578, "global_step": 611900, "epoch": 7372} {"train_loss": -27.93488121032715, "global_step": 611901, "epoch": 7372} {"train_loss": -28.203397750854492, "global_step": 611902, "epoch": 7372} {"train_loss": -27.767004013061523, "global_step": 611903, "epoch": 7372} {"train_loss": -27.884191513061523, "global_step": 611904, "epoch": 7372} {"train_loss": -27.68057632446289, "global_step": 611905, "epoch": 7372} {"train_loss": -28.0697078704834, "global_step": 611906, "epoch": 7372} {"train_loss": -28.011199951171875, "global_step": 611907, "epoch": 7372} {"train_loss": -28.114429473876953, "global_step": 611908, "epoch": 7372} {"train_loss": -28.11176872253418, "global_step": 611909, "epoch": 7372} {"train_loss": -28.085529327392578, "global_step": 611910, "epoch": 7372} {"train_loss": -28.108083724975586, "global_step": 611911, "epoch": 7372} {"train_loss": -28.309295654296875, "global_step": 611912, "epoch": 7372} {"train_loss": -28.395431518554688, "global_step": 611913, "epoch": 7372} {"train_loss": -27.94989585876465, "global_step": 611914, "epoch": 7372} {"train_loss": -28.42998695373535, "global_step": 611915, "epoch": 7372} {"train_loss": -28.115070343017578, "global_step": 611916, "epoch": 7372} {"train_loss": -28.106903076171875, "global_step": 611917, "epoch": 7372} {"train_loss": -27.981842041015625, "global_step": 611918, "epoch": 7372} {"train_loss": -27.941211700439453, "global_step": 611919, "epoch": 7372} {"train_loss": -28.0250301361084, "global_step": 611920, "epoch": 7372} {"train_loss": -27.556615829467773, "global_step": 611921, "epoch": 7372} {"train_loss": -27.745691299438477, "global_step": 611922, "epoch": 7372} {"train_loss": -28.09229850769043, "global_step": 611923, "epoch": 7372} {"train_loss": -28.344654083251953, "global_step": 611924, "epoch": 7372} {"train_loss": -28.27364158630371, "global_step": 611925, "epoch": 7372} {"train_loss": -28.222333908081055, "global_step": 611926, "epoch": 7372} {"train_loss": -28.036087036132812, "global_step": 611927, "epoch": 7372} {"train_loss": -27.925195693969727, "global_step": 611928, "epoch": 7372} {"train_loss": -28.186370849609375, "global_step": 611929, "epoch": 7372} {"train_loss": -27.994382858276367, "global_step": 611930, "epoch": 7372} {"train_loss": -28.024961471557617, "global_step": 611931, "epoch": 7372} {"train_loss": -27.828115463256836, "global_step": 611932, "epoch": 7372} {"train_loss": -28.028167724609375, "global_step": 611933, "epoch": 7372} {"train_loss": -27.536579132080078, "global_step": 611934, "epoch": 7372} {"train_loss": -28.33991050720215, "global_step": 611935, "epoch": 7372} {"train_loss": -27.636022567749023, "global_step": 611936, "epoch": 7372} {"train_loss": -27.945972442626953, "global_step": 611937, "epoch": 7372} {"train_loss": -28.155853271484375, "global_step": 611938, "epoch": 7372} {"train_loss": -27.57818603515625, "global_step": 611939, "epoch": 7372} {"train_loss": -28.2636775970459, "global_step": 611940, "epoch": 7372} {"train_loss": -27.50286865234375, "global_step": 611941, "epoch": 7372} {"train_loss": -27.59998893737793, "global_step": 611942, "epoch": 7372} {"train_loss": -28.15217399597168, "global_step": 611943, "epoch": 7372} {"train_loss": -28.068206787109375, "global_step": 611944, "epoch": 7372} {"train_loss": -28.2431697845459, "global_step": 611945, "epoch": 7372} {"train_loss": -28.168609619140625, "global_step": 611946, "epoch": 7372} {"train_loss": -28.12714958190918, "global_step": 611947, "epoch": 7372} {"train_loss": -28.140094757080078, "global_step": 611948, "epoch": 7372} {"train_loss": -28.183256149291992, "global_step": 611949, "epoch": 7372} {"train_loss": -28.24201011657715, "global_step": 611950, "epoch": 7372} {"train_loss": -28.183874130249023, "global_step": 611951, "epoch": 7372} {"train_loss": -27.95380210876465, "global_step": 611952, "epoch": 7372} {"train_loss": -28.273157119750977, "global_step": 611953, "epoch": 7372} {"train_loss": -27.749210357666016, "global_step": 611954, "epoch": 7372} {"train_loss": -27.847366333007812, "global_step": 611955, "epoch": 7372} {"train_loss": -28.1785831451416, "global_step": 611956, "epoch": 7372} {"train_loss": -28.331403732299805, "global_step": 611957, "epoch": 7372} {"train_loss": -27.824936418648225, "global_step": 611958, "epoch": 7372, "val_loss": 6656230.5} {"train_loss": -27.585859298706055, "global_step": 611959, "epoch": 7373} {"train_loss": -27.24273109436035, "global_step": 611960, "epoch": 7373} {"train_loss": -27.584482192993164, "global_step": 611961, "epoch": 7373} {"train_loss": -27.04731559753418, "global_step": 611962, "epoch": 7373} {"train_loss": -27.1739444732666, "global_step": 611963, "epoch": 7373} {"train_loss": -27.794116973876953, "global_step": 611964, "epoch": 7373} {"train_loss": -27.27528953552246, "global_step": 611965, "epoch": 7373} {"train_loss": -27.658777236938477, "global_step": 611966, "epoch": 7373} {"train_loss": -27.71933937072754, "global_step": 611967, "epoch": 7373} {"train_loss": -27.740528106689453, "global_step": 611968, "epoch": 7373} {"train_loss": -27.869596481323242, "global_step": 611969, "epoch": 7373} {"train_loss": -27.635976791381836, "global_step": 611970, "epoch": 7373} {"train_loss": -27.785364151000977, "global_step": 611971, "epoch": 7373} {"train_loss": -28.080411911010742, "global_step": 611972, "epoch": 7373} {"train_loss": -27.73345375061035, "global_step": 611973, "epoch": 7373} {"train_loss": -27.732269287109375, "global_step": 611974, "epoch": 7373} {"train_loss": -27.7409610748291, "global_step": 611975, "epoch": 7373} {"train_loss": -27.829975128173828, "global_step": 611976, "epoch": 7373} {"train_loss": -27.892866134643555, "global_step": 611977, "epoch": 7373} {"train_loss": -27.781156539916992, "global_step": 611978, "epoch": 7373} {"train_loss": -28.326847076416016, "global_step": 611979, "epoch": 7373} {"train_loss": -27.955617904663086, "global_step": 611980, "epoch": 7373} {"train_loss": -28.009000778198242, "global_step": 611981, "epoch": 7373} {"train_loss": -28.149160385131836, "global_step": 611982, "epoch": 7373} {"train_loss": -27.99152183532715, "global_step": 611983, "epoch": 7373} {"train_loss": -28.0880126953125, "global_step": 611984, "epoch": 7373} {"train_loss": -28.0472412109375, "global_step": 611985, "epoch": 7373} {"train_loss": -27.86944007873535, "global_step": 611986, "epoch": 7373} {"train_loss": -27.712940216064453, "global_step": 611987, "epoch": 7373} {"train_loss": -28.368864059448242, "global_step": 611988, "epoch": 7373} {"train_loss": -28.03670310974121, "global_step": 611989, "epoch": 7373} {"train_loss": -28.130552291870117, "global_step": 611990, "epoch": 7373} {"train_loss": -28.46315574645996, "global_step": 611991, "epoch": 7373} {"train_loss": -28.224639892578125, "global_step": 611992, "epoch": 7373} {"train_loss": -27.89007568359375, "global_step": 611993, "epoch": 7373} {"train_loss": -28.285709381103516, "global_step": 611994, "epoch": 7373} {"train_loss": -27.7553653717041, "global_step": 611995, "epoch": 7373} {"train_loss": -28.419971466064453, "global_step": 611996, "epoch": 7373} {"train_loss": -28.245649337768555, "global_step": 611997, "epoch": 7373} {"train_loss": -28.402973175048828, "global_step": 611998, "epoch": 7373} {"train_loss": -28.47063636779785, "global_step": 611999, "epoch": 7373} {"train_loss": -28.578754425048828, "global_step": 612000, "epoch": 7373} {"train_loss": -27.92176628112793, "global_step": 612001, "epoch": 7373} {"train_loss": -28.15126609802246, "global_step": 612002, "epoch": 7373} {"train_loss": -28.330907821655273, "global_step": 612003, "epoch": 7373} {"train_loss": -28.503650665283203, "global_step": 612004, "epoch": 7373} {"train_loss": -28.265933990478516, "global_step": 612005, "epoch": 7373} {"train_loss": -28.4908504486084, "global_step": 612006, "epoch": 7373} {"train_loss": -28.261234283447266, "global_step": 612007, "epoch": 7373} {"train_loss": -28.03252601623535, "global_step": 612008, "epoch": 7373} {"train_loss": -28.31298828125, "global_step": 612009, "epoch": 7373} {"train_loss": -28.00881004333496, "global_step": 612010, "epoch": 7373} {"train_loss": -27.868635177612305, "global_step": 612011, "epoch": 7373} {"train_loss": -27.590805053710938, "global_step": 612012, "epoch": 7373} {"train_loss": -27.640079498291016, "global_step": 612013, "epoch": 7373} {"train_loss": -28.347761154174805, "global_step": 612014, "epoch": 7373} {"train_loss": -27.828445434570312, "global_step": 612015, "epoch": 7373} {"train_loss": -27.849401473999023, "global_step": 612016, "epoch": 7373} {"train_loss": -27.71010398864746, "global_step": 612017, "epoch": 7373} {"train_loss": -28.041950225830078, "global_step": 612018, "epoch": 7373} {"train_loss": -28.12293815612793, "global_step": 612019, "epoch": 7373} {"train_loss": -27.870635986328125, "global_step": 612020, "epoch": 7373} {"train_loss": -28.08424186706543, "global_step": 612021, "epoch": 7373} {"train_loss": -28.242923736572266, "global_step": 612022, "epoch": 7373} {"train_loss": -28.046594619750977, "global_step": 612023, "epoch": 7373} {"train_loss": -28.292306900024414, "global_step": 612024, "epoch": 7373} {"train_loss": -28.248748779296875, "global_step": 612025, "epoch": 7373} {"train_loss": -27.764606475830078, "global_step": 612026, "epoch": 7373} {"train_loss": -27.976667404174805, "global_step": 612027, "epoch": 7373} {"train_loss": -28.11374855041504, "global_step": 612028, "epoch": 7373} {"train_loss": -27.86307716369629, "global_step": 612029, "epoch": 7373} {"train_loss": -28.374414443969727, "global_step": 612030, "epoch": 7373} {"train_loss": -28.146154403686523, "global_step": 612031, "epoch": 7373} {"train_loss": -28.215301513671875, "global_step": 612032, "epoch": 7373} {"train_loss": -28.134109497070312, "global_step": 612033, "epoch": 7373} {"train_loss": -27.82025718688965, "global_step": 612034, "epoch": 7373} {"train_loss": -28.15302085876465, "global_step": 612035, "epoch": 7373} {"train_loss": -28.22629165649414, "global_step": 612036, "epoch": 7373} {"train_loss": -27.94597816467285, "global_step": 612037, "epoch": 7373} {"train_loss": -28.197702407836914, "global_step": 612038, "epoch": 7373} {"train_loss": -28.3189754486084, "global_step": 612039, "epoch": 7373} {"train_loss": -28.265356063842773, "global_step": 612040, "epoch": 7373} {"train_loss": -27.983582668993847, "global_step": 612041, "epoch": 7373, "val_loss": 6705569.0} {"train_loss": -27.482309341430664, "global_step": 612042, "epoch": 7374} {"train_loss": -27.0980281829834, "global_step": 612043, "epoch": 7374} {"train_loss": -27.608152389526367, "global_step": 612044, "epoch": 7374} {"train_loss": -27.793472290039062, "global_step": 612045, "epoch": 7374} {"train_loss": -27.431955337524414, "global_step": 612046, "epoch": 7374} {"train_loss": -27.541913986206055, "global_step": 612047, "epoch": 7374} {"train_loss": -27.830102920532227, "global_step": 612048, "epoch": 7374} {"train_loss": -27.418012619018555, "global_step": 612049, "epoch": 7374} {"train_loss": -27.926376342773438, "global_step": 612050, "epoch": 7374} {"train_loss": -27.541229248046875, "global_step": 612051, "epoch": 7374} {"train_loss": -27.760297775268555, "global_step": 612052, "epoch": 7374} {"train_loss": -27.8704833984375, "global_step": 612053, "epoch": 7374} {"train_loss": -27.391504287719727, "global_step": 612054, "epoch": 7374} {"train_loss": -27.714147567749023, "global_step": 612055, "epoch": 7374} {"train_loss": -27.982995986938477, "global_step": 612056, "epoch": 7374} {"train_loss": -27.766321182250977, "global_step": 612057, "epoch": 7374} {"train_loss": -27.682615280151367, "global_step": 612058, "epoch": 7374} {"train_loss": -27.851224899291992, "global_step": 612059, "epoch": 7374} {"train_loss": -28.10210609436035, "global_step": 612060, "epoch": 7374} {"train_loss": -27.685495376586914, "global_step": 612061, "epoch": 7374} {"train_loss": -28.06890869140625, "global_step": 612062, "epoch": 7374} {"train_loss": -27.878631591796875, "global_step": 612063, "epoch": 7374} {"train_loss": -27.956134796142578, "global_step": 612064, "epoch": 7374} {"train_loss": -28.22476577758789, "global_step": 612065, "epoch": 7374} {"train_loss": -27.568647384643555, "global_step": 612066, "epoch": 7374} {"train_loss": -27.801862716674805, "global_step": 612067, "epoch": 7374} {"train_loss": -28.160816192626953, "global_step": 612068, "epoch": 7374} {"train_loss": -27.70465660095215, "global_step": 612069, "epoch": 7374} {"train_loss": -27.826541900634766, "global_step": 612070, "epoch": 7374} {"train_loss": -27.832427978515625, "global_step": 612071, "epoch": 7374} {"train_loss": -28.04056167602539, "global_step": 612072, "epoch": 7374} {"train_loss": -28.645233154296875, "global_step": 612073, "epoch": 7374} {"train_loss": -28.084049224853516, "global_step": 612074, "epoch": 7374} {"train_loss": -28.00058364868164, "global_step": 612075, "epoch": 7374} {"train_loss": -27.614398956298828, "global_step": 612076, "epoch": 7374} {"train_loss": -28.540985107421875, "global_step": 612077, "epoch": 7374} {"train_loss": -28.216144561767578, "global_step": 612078, "epoch": 7374} {"train_loss": -27.9531192779541, "global_step": 612079, "epoch": 7374} {"train_loss": -28.512100219726562, "global_step": 612080, "epoch": 7374} {"train_loss": -27.324430465698242, "global_step": 612081, "epoch": 7374} {"train_loss": -28.27048110961914, "global_step": 612082, "epoch": 7374} {"train_loss": -28.183263778686523, "global_step": 612083, "epoch": 7374} {"train_loss": -28.109460830688477, "global_step": 612084, "epoch": 7374} {"train_loss": -27.840585708618164, "global_step": 612085, "epoch": 7374} {"train_loss": -28.182910919189453, "global_step": 612086, "epoch": 7374} {"train_loss": -28.236419677734375, "global_step": 612087, "epoch": 7374} {"train_loss": -27.845325469970703, "global_step": 612088, "epoch": 7374} {"train_loss": -28.103546142578125, "global_step": 612089, "epoch": 7374} {"train_loss": -27.855945587158203, "global_step": 612090, "epoch": 7374} {"train_loss": -27.971607208251953, "global_step": 612091, "epoch": 7374} {"train_loss": -27.571760177612305, "global_step": 612092, "epoch": 7374} {"train_loss": -28.449478149414062, "global_step": 612093, "epoch": 7374} {"train_loss": -28.120899200439453, "global_step": 612094, "epoch": 7374} {"train_loss": -28.120351791381836, "global_step": 612095, "epoch": 7374} {"train_loss": -28.09397315979004, "global_step": 612096, "epoch": 7374} {"train_loss": -28.187829971313477, "global_step": 612097, "epoch": 7374} {"train_loss": -28.034570693969727, "global_step": 612098, "epoch": 7374} {"train_loss": -28.039703369140625, "global_step": 612099, "epoch": 7374} {"train_loss": -28.01369285583496, "global_step": 612100, "epoch": 7374} {"train_loss": -28.443618774414062, "global_step": 612101, "epoch": 7374} {"train_loss": -28.149856567382812, "global_step": 612102, "epoch": 7374} {"train_loss": -28.069061279296875, "global_step": 612103, "epoch": 7374} {"train_loss": -28.042617797851562, "global_step": 612104, "epoch": 7374} {"train_loss": -28.475698471069336, "global_step": 612105, "epoch": 7374} {"train_loss": -27.9632511138916, "global_step": 612106, "epoch": 7374} {"train_loss": -27.558151245117188, "global_step": 612107, "epoch": 7374} {"train_loss": -28.03974723815918, "global_step": 612108, "epoch": 7374} {"train_loss": -28.052387237548828, "global_step": 612109, "epoch": 7374} {"train_loss": -28.0137882232666, "global_step": 612110, "epoch": 7374} {"train_loss": -28.262603759765625, "global_step": 612111, "epoch": 7374} {"train_loss": -28.263025283813477, "global_step": 612112, "epoch": 7374} {"train_loss": -28.066314697265625, "global_step": 612113, "epoch": 7374} {"train_loss": -27.721012115478516, "global_step": 612114, "epoch": 7374} {"train_loss": -28.223495483398438, "global_step": 612115, "epoch": 7374} {"train_loss": -28.010908126831055, "global_step": 612116, "epoch": 7374} {"train_loss": -27.63330078125, "global_step": 612117, "epoch": 7374} {"train_loss": -27.995975494384766, "global_step": 612118, "epoch": 7374} {"train_loss": -27.648529052734375, "global_step": 612119, "epoch": 7374} {"train_loss": -28.06145668029785, "global_step": 612120, "epoch": 7374} {"train_loss": -27.867523193359375, "global_step": 612121, "epoch": 7374} {"train_loss": -28.08636474609375, "global_step": 612122, "epoch": 7374} {"train_loss": -28.368024826049805, "global_step": 612123, "epoch": 7374} {"train_loss": -27.928398660866613, "global_step": 612124, "epoch": 7374, "val_loss": 6602579.0} {"train_loss": -27.680816650390625, "global_step": 612125, "epoch": 7375} {"train_loss": -27.881879806518555, "global_step": 612126, "epoch": 7375} {"train_loss": -27.6555118560791, "global_step": 612127, "epoch": 7375} {"train_loss": -28.121612548828125, "global_step": 612128, "epoch": 7375} {"train_loss": -27.652103424072266, "global_step": 612129, "epoch": 7375} {"train_loss": -27.674009323120117, "global_step": 612130, "epoch": 7375} {"train_loss": -28.101058959960938, "global_step": 612131, "epoch": 7375} {"train_loss": -27.90234375, "global_step": 612132, "epoch": 7375} {"train_loss": -27.68526268005371, "global_step": 612133, "epoch": 7375} {"train_loss": -27.60114860534668, "global_step": 612134, "epoch": 7375} {"train_loss": -27.738422393798828, "global_step": 612135, "epoch": 7375} {"train_loss": -27.853260040283203, "global_step": 612136, "epoch": 7375} {"train_loss": -27.672958374023438, "global_step": 612137, "epoch": 7375} {"train_loss": -28.04340934753418, "global_step": 612138, "epoch": 7375} {"train_loss": -27.92494010925293, "global_step": 612139, "epoch": 7375} {"train_loss": -27.993179321289062, "global_step": 612140, "epoch": 7375} {"train_loss": -28.208993911743164, "global_step": 612141, "epoch": 7375} {"train_loss": -27.915369033813477, "global_step": 612142, "epoch": 7375} {"train_loss": -28.043655395507812, "global_step": 612143, "epoch": 7375} {"train_loss": -28.21546745300293, "global_step": 612144, "epoch": 7375} {"train_loss": -28.425403594970703, "global_step": 612145, "epoch": 7375} {"train_loss": -28.406797409057617, "global_step": 612146, "epoch": 7375} {"train_loss": -27.90433120727539, "global_step": 612147, "epoch": 7375} {"train_loss": -28.38831901550293, "global_step": 612148, "epoch": 7375} {"train_loss": -28.35685157775879, "global_step": 612149, "epoch": 7375} {"train_loss": -28.38508415222168, "global_step": 612150, "epoch": 7375} {"train_loss": -28.376983642578125, "global_step": 612151, "epoch": 7375} {"train_loss": -28.07236671447754, "global_step": 612152, "epoch": 7375} {"train_loss": -28.550811767578125, "global_step": 612153, "epoch": 7375} {"train_loss": -28.769025802612305, "global_step": 612154, "epoch": 7375} {"train_loss": -28.26869010925293, "global_step": 612155, "epoch": 7375} {"train_loss": -28.475116729736328, "global_step": 612156, "epoch": 7375} {"train_loss": -27.9729061126709, "global_step": 612157, "epoch": 7375} {"train_loss": -28.09868812561035, "global_step": 612158, "epoch": 7375} {"train_loss": -28.35817527770996, "global_step": 612159, "epoch": 7375} {"train_loss": -28.101806640625, "global_step": 612160, "epoch": 7375} {"train_loss": -28.442184448242188, "global_step": 612161, "epoch": 7375} {"train_loss": -27.88667106628418, "global_step": 612162, "epoch": 7375} {"train_loss": -28.052648544311523, "global_step": 612163, "epoch": 7375} {"train_loss": -28.139759063720703, "global_step": 612164, "epoch": 7375} {"train_loss": -28.43623924255371, "global_step": 612165, "epoch": 7375} {"train_loss": -28.060338973999023, "global_step": 612166, "epoch": 7375} {"train_loss": -28.232379913330078, "global_step": 612167, "epoch": 7375} {"train_loss": -28.6669979095459, "global_step": 612168, "epoch": 7375} {"train_loss": -28.157712936401367, "global_step": 612169, "epoch": 7375} {"train_loss": -28.052560806274414, "global_step": 612170, "epoch": 7375} {"train_loss": -27.744237899780273, "global_step": 612171, "epoch": 7375} {"train_loss": -27.894271850585938, "global_step": 612172, "epoch": 7375} {"train_loss": -27.959869384765625, "global_step": 612173, "epoch": 7375} {"train_loss": -27.98347282409668, "global_step": 612174, "epoch": 7375} {"train_loss": -28.289535522460938, "global_step": 612175, "epoch": 7375} {"train_loss": -27.98193359375, "global_step": 612176, "epoch": 7375} {"train_loss": -27.912221908569336, "global_step": 612177, "epoch": 7375} {"train_loss": -28.018798828125, "global_step": 612178, "epoch": 7375} {"train_loss": -28.355701446533203, "global_step": 612179, "epoch": 7375} {"train_loss": -27.986480712890625, "global_step": 612180, "epoch": 7375} {"train_loss": -27.728971481323242, "global_step": 612181, "epoch": 7375} {"train_loss": -27.50494384765625, "global_step": 612182, "epoch": 7375} {"train_loss": -27.878686904907227, "global_step": 612183, "epoch": 7375} {"train_loss": -28.402820587158203, "global_step": 612184, "epoch": 7375} {"train_loss": -27.55103874206543, "global_step": 612185, "epoch": 7375} {"train_loss": -27.410186767578125, "global_step": 612186, "epoch": 7375} {"train_loss": -28.031774520874023, "global_step": 612187, "epoch": 7375} {"train_loss": -27.493350982666016, "global_step": 612188, "epoch": 7375} {"train_loss": -27.91473960876465, "global_step": 612189, "epoch": 7375} {"train_loss": -27.284372329711914, "global_step": 612190, "epoch": 7375} {"train_loss": -27.892608642578125, "global_step": 612191, "epoch": 7375} {"train_loss": -27.584014892578125, "global_step": 612192, "epoch": 7375} {"train_loss": -28.11328125, "global_step": 612193, "epoch": 7375} {"train_loss": -28.181806564331055, "global_step": 612194, "epoch": 7375} {"train_loss": -27.810958862304688, "global_step": 612195, "epoch": 7375} {"train_loss": -27.98504066467285, "global_step": 612196, "epoch": 7375} {"train_loss": -27.96856689453125, "global_step": 612197, "epoch": 7375} {"train_loss": -28.13703727722168, "global_step": 612198, "epoch": 7375} {"train_loss": -27.887571334838867, "global_step": 612199, "epoch": 7375} {"train_loss": -27.943811416625977, "global_step": 612200, "epoch": 7375} {"train_loss": -27.917041778564453, "global_step": 612201, "epoch": 7375} {"train_loss": -28.021093368530273, "global_step": 612202, "epoch": 7375} {"train_loss": -27.8031063079834, "global_step": 612203, "epoch": 7375} {"train_loss": -28.3597354888916, "global_step": 612204, "epoch": 7375} {"train_loss": -28.16721534729004, "global_step": 612205, "epoch": 7375} {"train_loss": -27.88726234436035, "global_step": 612206, "epoch": 7375} {"train_loss": -27.997179536934357, "global_step": 612207, "epoch": 7375, "val_loss": 6541495.5} {"train_loss": -27.4860897064209, "global_step": 612208, "epoch": 7376} {"train_loss": -27.193017959594727, "global_step": 612209, "epoch": 7376} {"train_loss": -27.443115234375, "global_step": 612210, "epoch": 7376} {"train_loss": -27.894392013549805, "global_step": 612211, "epoch": 7376} {"train_loss": -27.285476684570312, "global_step": 612212, "epoch": 7376} {"train_loss": -27.557077407836914, "global_step": 612213, "epoch": 7376} {"train_loss": -27.688257217407227, "global_step": 612214, "epoch": 7376} {"train_loss": -27.424030303955078, "global_step": 612215, "epoch": 7376} {"train_loss": -28.301523208618164, "global_step": 612216, "epoch": 7376} {"train_loss": -27.741657257080078, "global_step": 612217, "epoch": 7376} {"train_loss": -27.9976806640625, "global_step": 612218, "epoch": 7376} {"train_loss": -27.623376846313477, "global_step": 612219, "epoch": 7376} {"train_loss": -27.820972442626953, "global_step": 612220, "epoch": 7376} {"train_loss": -28.105085372924805, "global_step": 612221, "epoch": 7376} {"train_loss": -27.850616455078125, "global_step": 612222, "epoch": 7376} {"train_loss": -27.874256134033203, "global_step": 612223, "epoch": 7376} {"train_loss": -28.084564208984375, "global_step": 612224, "epoch": 7376} {"train_loss": -27.820348739624023, "global_step": 612225, "epoch": 7376} {"train_loss": -28.024938583374023, "global_step": 612226, "epoch": 7376} {"train_loss": -27.959598541259766, "global_step": 612227, "epoch": 7376} {"train_loss": -27.973737716674805, "global_step": 612228, "epoch": 7376} {"train_loss": -27.652921676635742, "global_step": 612229, "epoch": 7376} {"train_loss": -28.024084091186523, "global_step": 612230, "epoch": 7376} {"train_loss": -27.811477661132812, "global_step": 612231, "epoch": 7376} {"train_loss": -28.30914306640625, "global_step": 612232, "epoch": 7376} {"train_loss": -28.08399772644043, "global_step": 612233, "epoch": 7376} {"train_loss": -28.32972526550293, "global_step": 612234, "epoch": 7376} {"train_loss": -28.182147979736328, "global_step": 612235, "epoch": 7376} {"train_loss": -28.138219833374023, "global_step": 612236, "epoch": 7376} {"train_loss": -28.01087760925293, "global_step": 612237, "epoch": 7376} {"train_loss": -28.126264572143555, "global_step": 612238, "epoch": 7376} {"train_loss": -28.224445343017578, "global_step": 612239, "epoch": 7376} {"train_loss": -28.533843994140625, "global_step": 612240, "epoch": 7376} {"train_loss": -28.185455322265625, "global_step": 612241, "epoch": 7376} {"train_loss": -28.451278686523438, "global_step": 612242, "epoch": 7376} {"train_loss": -28.280471801757812, "global_step": 612243, "epoch": 7376} {"train_loss": -28.194738388061523, "global_step": 612244, "epoch": 7376} {"train_loss": -28.240957260131836, "global_step": 612245, "epoch": 7376} {"train_loss": -28.07301139831543, "global_step": 612246, "epoch": 7376} {"train_loss": -28.272031784057617, "global_step": 612247, "epoch": 7376} {"train_loss": -27.960691452026367, "global_step": 612248, "epoch": 7376} {"train_loss": -28.424762725830078, "global_step": 612249, "epoch": 7376} {"train_loss": -28.279279708862305, "global_step": 612250, "epoch": 7376} {"train_loss": -28.230737686157227, "global_step": 612251, "epoch": 7376} {"train_loss": -28.211261749267578, "global_step": 612252, "epoch": 7376} {"train_loss": -28.427154541015625, "global_step": 612253, "epoch": 7376} {"train_loss": -28.106306076049805, "global_step": 612254, "epoch": 7376} {"train_loss": -28.438318252563477, "global_step": 612255, "epoch": 7376} {"train_loss": -28.20466423034668, "global_step": 612256, "epoch": 7376} {"train_loss": -27.549535751342773, "global_step": 612257, "epoch": 7376} {"train_loss": -27.054096221923828, "global_step": 612258, "epoch": 7376} {"train_loss": -26.88923454284668, "global_step": 612259, "epoch": 7376} {"train_loss": -26.47495460510254, "global_step": 612260, "epoch": 7376} {"train_loss": -27.373748779296875, "global_step": 612261, "epoch": 7376} {"train_loss": -27.84100914001465, "global_step": 612262, "epoch": 7376} {"train_loss": -27.50306510925293, "global_step": 612263, "epoch": 7376} {"train_loss": -27.810718536376953, "global_step": 612264, "epoch": 7376} {"train_loss": -27.548847198486328, "global_step": 612265, "epoch": 7376} {"train_loss": -27.279144287109375, "global_step": 612266, "epoch": 7376} {"train_loss": -28.15988540649414, "global_step": 612267, "epoch": 7376} {"train_loss": -27.770309448242188, "global_step": 612268, "epoch": 7376} {"train_loss": -27.97572135925293, "global_step": 612269, "epoch": 7376} {"train_loss": -28.071338653564453, "global_step": 612270, "epoch": 7376} {"train_loss": -28.079151153564453, "global_step": 612271, "epoch": 7376} {"train_loss": -27.9521541595459, "global_step": 612272, "epoch": 7376} {"train_loss": -28.152679443359375, "global_step": 612273, "epoch": 7376} {"train_loss": -28.077564239501953, "global_step": 612274, "epoch": 7376} {"train_loss": -27.988630294799805, "global_step": 612275, "epoch": 7376} {"train_loss": -27.950021743774414, "global_step": 612276, "epoch": 7376} {"train_loss": -27.610702514648438, "global_step": 612277, "epoch": 7376} {"train_loss": -27.571752548217773, "global_step": 612278, "epoch": 7376} {"train_loss": -27.985706329345703, "global_step": 612279, "epoch": 7376} {"train_loss": -28.21584129333496, "global_step": 612280, "epoch": 7376} {"train_loss": -27.89410400390625, "global_step": 612281, "epoch": 7376} {"train_loss": -28.005041122436523, "global_step": 612282, "epoch": 7376} {"train_loss": -27.89271354675293, "global_step": 612283, "epoch": 7376} {"train_loss": -28.14832878112793, "global_step": 612284, "epoch": 7376} {"train_loss": -28.141651153564453, "global_step": 612285, "epoch": 7376} {"train_loss": -28.077993392944336, "global_step": 612286, "epoch": 7376} {"train_loss": -28.246984481811523, "global_step": 612287, "epoch": 7376} {"train_loss": -28.11832046508789, "global_step": 612288, "epoch": 7376} {"train_loss": -28.01447105407715, "global_step": 612289, "epoch": 7376} {"train_loss": -27.92598591080631, "global_step": 612290, "epoch": 7376, "val_loss": 6478433.5} {"train_loss": -27.36774253845215, "global_step": 612291, "epoch": 7377} {"train_loss": -27.969852447509766, "global_step": 612292, "epoch": 7377} {"train_loss": -27.844024658203125, "global_step": 612293, "epoch": 7377} {"train_loss": -27.60013198852539, "global_step": 612294, "epoch": 7377} {"train_loss": -28.032957077026367, "global_step": 612295, "epoch": 7377} {"train_loss": -27.70749282836914, "global_step": 612296, "epoch": 7377} {"train_loss": -27.831037521362305, "global_step": 612297, "epoch": 7377} {"train_loss": -28.321537017822266, "global_step": 612298, "epoch": 7377} {"train_loss": -27.842344284057617, "global_step": 612299, "epoch": 7377} {"train_loss": -27.922428131103516, "global_step": 612300, "epoch": 7377} {"train_loss": -28.13278579711914, "global_step": 612301, "epoch": 7377} {"train_loss": -27.9903621673584, "global_step": 612302, "epoch": 7377} {"train_loss": -27.99942970275879, "global_step": 612303, "epoch": 7377} {"train_loss": -28.3132266998291, "global_step": 612304, "epoch": 7377} {"train_loss": -28.12603759765625, "global_step": 612305, "epoch": 7377} {"train_loss": -28.223066329956055, "global_step": 612306, "epoch": 7377} {"train_loss": -28.179523468017578, "global_step": 612307, "epoch": 7377} {"train_loss": -28.35870933532715, "global_step": 612308, "epoch": 7377} {"train_loss": -28.14983558654785, "global_step": 612309, "epoch": 7377} {"train_loss": -28.192792892456055, "global_step": 612310, "epoch": 7377} {"train_loss": -28.14788246154785, "global_step": 612311, "epoch": 7377} {"train_loss": -28.077245712280273, "global_step": 612312, "epoch": 7377} {"train_loss": -28.291479110717773, "global_step": 612313, "epoch": 7377} {"train_loss": -28.466089248657227, "global_step": 612314, "epoch": 7377} {"train_loss": -27.8690185546875, "global_step": 612315, "epoch": 7377} {"train_loss": -27.838430404663086, "global_step": 612316, "epoch": 7377} {"train_loss": -27.81199073791504, "global_step": 612317, "epoch": 7377} {"train_loss": -28.17835807800293, "global_step": 612318, "epoch": 7377} {"train_loss": -27.706008911132812, "global_step": 612319, "epoch": 7377} {"train_loss": -27.909000396728516, "global_step": 612320, "epoch": 7377} {"train_loss": -27.844085693359375, "global_step": 612321, "epoch": 7377} {"train_loss": -28.250280380249023, "global_step": 612322, "epoch": 7377} {"train_loss": -28.41988182067871, "global_step": 612323, "epoch": 7377} {"train_loss": -28.23604393005371, "global_step": 612324, "epoch": 7377} {"train_loss": -28.09209632873535, "global_step": 612325, "epoch": 7377} {"train_loss": -28.157596588134766, "global_step": 612326, "epoch": 7377} {"train_loss": -28.181074142456055, "global_step": 612327, "epoch": 7377} {"train_loss": -28.539575576782227, "global_step": 612328, "epoch": 7377} {"train_loss": -27.698719024658203, "global_step": 612329, "epoch": 7377} {"train_loss": -27.92024040222168, "global_step": 612330, "epoch": 7377} {"train_loss": -28.273717880249023, "global_step": 612331, "epoch": 7377} {"train_loss": -28.493438720703125, "global_step": 612332, "epoch": 7377} {"train_loss": -28.195911407470703, "global_step": 612333, "epoch": 7377} {"train_loss": -28.306564331054688, "global_step": 612334, "epoch": 7377} {"train_loss": -28.025724411010742, "global_step": 612335, "epoch": 7377} {"train_loss": -27.719648361206055, "global_step": 612336, "epoch": 7377} {"train_loss": -27.48883056640625, "global_step": 612337, "epoch": 7377} {"train_loss": -27.926183700561523, "global_step": 612338, "epoch": 7377} {"train_loss": -27.97926139831543, "global_step": 612339, "epoch": 7377} {"train_loss": -28.198047637939453, "global_step": 612340, "epoch": 7377} {"train_loss": -27.850921630859375, "global_step": 612341, "epoch": 7377} {"train_loss": -27.3579044342041, "global_step": 612342, "epoch": 7377} {"train_loss": -27.41314697265625, "global_step": 612343, "epoch": 7377} {"train_loss": -27.667194366455078, "global_step": 612344, "epoch": 7377} {"train_loss": -28.256879806518555, "global_step": 612345, "epoch": 7377} {"train_loss": -27.591833114624023, "global_step": 612346, "epoch": 7377} {"train_loss": -27.7344970703125, "global_step": 612347, "epoch": 7377} {"train_loss": -28.0137939453125, "global_step": 612348, "epoch": 7377} {"train_loss": -28.03798484802246, "global_step": 612349, "epoch": 7377} {"train_loss": -27.644622802734375, "global_step": 612350, "epoch": 7377} {"train_loss": -27.907392501831055, "global_step": 612351, "epoch": 7377} {"train_loss": -27.767499923706055, "global_step": 612352, "epoch": 7377} {"train_loss": -28.031164169311523, "global_step": 612353, "epoch": 7377} {"train_loss": -27.990985870361328, "global_step": 612354, "epoch": 7377} {"train_loss": -27.878732681274414, "global_step": 612355, "epoch": 7377} {"train_loss": -28.139989852905273, "global_step": 612356, "epoch": 7377} {"train_loss": -27.861921310424805, "global_step": 612357, "epoch": 7377} {"train_loss": -28.088382720947266, "global_step": 612358, "epoch": 7377} {"train_loss": -27.605133056640625, "global_step": 612359, "epoch": 7377} {"train_loss": -28.155231475830078, "global_step": 612360, "epoch": 7377} {"train_loss": -27.848480224609375, "global_step": 612361, "epoch": 7377} {"train_loss": -28.254474639892578, "global_step": 612362, "epoch": 7377} {"train_loss": -28.172138214111328, "global_step": 612363, "epoch": 7377} {"train_loss": -28.0419864654541, "global_step": 612364, "epoch": 7377} {"train_loss": -28.054431915283203, "global_step": 612365, "epoch": 7377} {"train_loss": -27.998701095581055, "global_step": 612366, "epoch": 7377} {"train_loss": -27.95479393005371, "global_step": 612367, "epoch": 7377} {"train_loss": -28.083398818969727, "global_step": 612368, "epoch": 7377} {"train_loss": -27.918420791625977, "global_step": 612369, "epoch": 7377} {"train_loss": -28.2515869140625, "global_step": 612370, "epoch": 7377} {"train_loss": -28.10394859313965, "global_step": 612371, "epoch": 7377} {"train_loss": -28.075275421142578, "global_step": 612372, "epoch": 7377} {"train_loss": -28.01402599840279, "global_step": 612373, "epoch": 7377, "val_loss": 6562144.0} {"train_loss": -27.594446182250977, "global_step": 612374, "epoch": 7378} {"train_loss": -28.172941207885742, "global_step": 612375, "epoch": 7378} {"train_loss": -26.644880294799805, "global_step": 612376, "epoch": 7378} {"train_loss": -25.70501708984375, "global_step": 612377, "epoch": 7378} {"train_loss": -25.683801651000977, "global_step": 612378, "epoch": 7378} {"train_loss": -27.500324249267578, "global_step": 612379, "epoch": 7378} {"train_loss": -26.3176326751709, "global_step": 612380, "epoch": 7378} {"train_loss": -26.881927490234375, "global_step": 612381, "epoch": 7378} {"train_loss": -27.479480743408203, "global_step": 612382, "epoch": 7378} {"train_loss": -26.49506187438965, "global_step": 612383, "epoch": 7378} {"train_loss": -27.670673370361328, "global_step": 612384, "epoch": 7378} {"train_loss": -27.246641159057617, "global_step": 612385, "epoch": 7378} {"train_loss": -26.921682357788086, "global_step": 612386, "epoch": 7378} {"train_loss": -27.4867000579834, "global_step": 612387, "epoch": 7378} {"train_loss": -27.14008140563965, "global_step": 612388, "epoch": 7378} {"train_loss": -27.127033233642578, "global_step": 612389, "epoch": 7378} {"train_loss": -27.549823760986328, "global_step": 612390, "epoch": 7378} {"train_loss": -27.382505416870117, "global_step": 612391, "epoch": 7378} {"train_loss": -27.498315811157227, "global_step": 612392, "epoch": 7378} {"train_loss": -27.52292823791504, "global_step": 612393, "epoch": 7378} {"train_loss": -27.593549728393555, "global_step": 612394, "epoch": 7378} {"train_loss": -27.457508087158203, "global_step": 612395, "epoch": 7378} {"train_loss": -27.531665802001953, "global_step": 612396, "epoch": 7378} {"train_loss": -27.907217025756836, "global_step": 612397, "epoch": 7378} {"train_loss": -27.397165298461914, "global_step": 612398, "epoch": 7378} {"train_loss": -27.63128089904785, "global_step": 612399, "epoch": 7378} {"train_loss": -28.031936645507812, "global_step": 612400, "epoch": 7378} {"train_loss": -27.410181045532227, "global_step": 612401, "epoch": 7378} {"train_loss": -27.850004196166992, "global_step": 612402, "epoch": 7378} {"train_loss": -27.808385848999023, "global_step": 612403, "epoch": 7378} {"train_loss": -27.738794326782227, "global_step": 612404, "epoch": 7378} {"train_loss": -28.000638961791992, "global_step": 612405, "epoch": 7378} {"train_loss": -28.199268341064453, "global_step": 612406, "epoch": 7378} {"train_loss": -27.774505615234375, "global_step": 612407, "epoch": 7378} {"train_loss": -27.915258407592773, "global_step": 612408, "epoch": 7378} {"train_loss": -28.05194664001465, "global_step": 612409, "epoch": 7378} {"train_loss": -27.978803634643555, "global_step": 612410, "epoch": 7378} {"train_loss": -28.274250030517578, "global_step": 612411, "epoch": 7378} {"train_loss": -27.621244430541992, "global_step": 612412, "epoch": 7378} {"train_loss": -27.806421279907227, "global_step": 612413, "epoch": 7378} {"train_loss": -27.96589469909668, "global_step": 612414, "epoch": 7378} {"train_loss": -27.98500633239746, "global_step": 612415, "epoch": 7378} {"train_loss": -27.951496124267578, "global_step": 612416, "epoch": 7378} {"train_loss": -28.165685653686523, "global_step": 612417, "epoch": 7378} {"train_loss": -27.848508834838867, "global_step": 612418, "epoch": 7378} {"train_loss": -27.926904678344727, "global_step": 612419, "epoch": 7378} {"train_loss": -27.84107780456543, "global_step": 612420, "epoch": 7378} {"train_loss": -28.130537033081055, "global_step": 612421, "epoch": 7378} {"train_loss": -28.032333374023438, "global_step": 612422, "epoch": 7378} {"train_loss": -28.2174072265625, "global_step": 612423, "epoch": 7378} {"train_loss": -28.09865379333496, "global_step": 612424, "epoch": 7378} {"train_loss": -28.37123680114746, "global_step": 612425, "epoch": 7378} {"train_loss": -28.411396026611328, "global_step": 612426, "epoch": 7378} {"train_loss": -28.057249069213867, "global_step": 612427, "epoch": 7378} {"train_loss": -28.11688804626465, "global_step": 612428, "epoch": 7378} {"train_loss": -28.176965713500977, "global_step": 612429, "epoch": 7378} {"train_loss": -28.14288902282715, "global_step": 612430, "epoch": 7378} {"train_loss": -27.982593536376953, "global_step": 612431, "epoch": 7378} {"train_loss": -28.530059814453125, "global_step": 612432, "epoch": 7378} {"train_loss": -28.240446090698242, "global_step": 612433, "epoch": 7378} {"train_loss": -28.062179565429688, "global_step": 612434, "epoch": 7378} {"train_loss": -28.0313777923584, "global_step": 612435, "epoch": 7378} {"train_loss": -28.32038688659668, "global_step": 612436, "epoch": 7378} {"train_loss": -28.666580200195312, "global_step": 612437, "epoch": 7378} {"train_loss": -28.036123275756836, "global_step": 612438, "epoch": 7378} {"train_loss": -28.263412475585938, "global_step": 612439, "epoch": 7378} {"train_loss": -28.200109481811523, "global_step": 612440, "epoch": 7378} {"train_loss": -28.083484649658203, "global_step": 612441, "epoch": 7378} {"train_loss": -27.972578048706055, "global_step": 612442, "epoch": 7378} {"train_loss": -28.02251625061035, "global_step": 612443, "epoch": 7378} {"train_loss": -27.799657821655273, "global_step": 612444, "epoch": 7378} {"train_loss": -26.811994552612305, "global_step": 612445, "epoch": 7378} {"train_loss": -27.31061363220215, "global_step": 612446, "epoch": 7378} {"train_loss": -27.671064376831055, "global_step": 612447, "epoch": 7378} {"train_loss": -27.606351852416992, "global_step": 612448, "epoch": 7378} {"train_loss": -28.137205123901367, "global_step": 612449, "epoch": 7378} {"train_loss": -27.10694694519043, "global_step": 612450, "epoch": 7378} {"train_loss": -27.142480850219727, "global_step": 612451, "epoch": 7378} {"train_loss": -27.780118942260742, "global_step": 612452, "epoch": 7378} {"train_loss": -27.687971115112305, "global_step": 612453, "epoch": 7378} {"train_loss": -27.193592071533203, "global_step": 612454, "epoch": 7378} {"train_loss": -27.2739315032959, "global_step": 612455, "epoch": 7378} {"train_loss": -27.703926109405884, "global_step": 612456, "epoch": 7378, "val_loss": 6639488.0} {"train_loss": -26.651525497436523, "global_step": 612457, "epoch": 7379} {"train_loss": -27.000534057617188, "global_step": 612458, "epoch": 7379} {"train_loss": -27.0274600982666, "global_step": 612459, "epoch": 7379} {"train_loss": -27.322452545166016, "global_step": 612460, "epoch": 7379} {"train_loss": -26.797927856445312, "global_step": 612461, "epoch": 7379} {"train_loss": -27.08259391784668, "global_step": 612462, "epoch": 7379} {"train_loss": -27.84943199157715, "global_step": 612463, "epoch": 7379} {"train_loss": -27.150522232055664, "global_step": 612464, "epoch": 7379} {"train_loss": -27.007715225219727, "global_step": 612465, "epoch": 7379} {"train_loss": -27.312814712524414, "global_step": 612466, "epoch": 7379} {"train_loss": -27.362333297729492, "global_step": 612467, "epoch": 7379} {"train_loss": -27.256591796875, "global_step": 612468, "epoch": 7379} {"train_loss": -27.50665283203125, "global_step": 612469, "epoch": 7379} {"train_loss": -27.745990753173828, "global_step": 612470, "epoch": 7379} {"train_loss": -27.946447372436523, "global_step": 612471, "epoch": 7379} {"train_loss": -28.007648468017578, "global_step": 612472, "epoch": 7379} {"train_loss": -27.645795822143555, "global_step": 612473, "epoch": 7379} {"train_loss": -27.628019332885742, "global_step": 612474, "epoch": 7379} {"train_loss": -27.953428268432617, "global_step": 612475, "epoch": 7379} {"train_loss": -27.957609176635742, "global_step": 612476, "epoch": 7379} {"train_loss": -28.1364803314209, "global_step": 612477, "epoch": 7379} {"train_loss": -27.954614639282227, "global_step": 612478, "epoch": 7379} {"train_loss": -27.868122100830078, "global_step": 612479, "epoch": 7379} {"train_loss": -28.01171875, "global_step": 612480, "epoch": 7379} {"train_loss": -27.76413345336914, "global_step": 612481, "epoch": 7379} {"train_loss": -28.128271102905273, "global_step": 612482, "epoch": 7379} {"train_loss": -27.9285831451416, "global_step": 612483, "epoch": 7379} {"train_loss": -28.00843620300293, "global_step": 612484, "epoch": 7379} {"train_loss": -27.869068145751953, "global_step": 612485, "epoch": 7379} {"train_loss": -27.624149322509766, "global_step": 612486, "epoch": 7379} {"train_loss": -27.899097442626953, "global_step": 612487, "epoch": 7379} {"train_loss": -28.244632720947266, "global_step": 612488, "epoch": 7379} {"train_loss": -28.315603256225586, "global_step": 612489, "epoch": 7379} {"train_loss": -27.9859676361084, "global_step": 612490, "epoch": 7379} {"train_loss": -27.990131378173828, "global_step": 612491, "epoch": 7379} {"train_loss": -28.116804122924805, "global_step": 612492, "epoch": 7379} {"train_loss": -28.139041900634766, "global_step": 612493, "epoch": 7379} {"train_loss": -28.133655548095703, "global_step": 612494, "epoch": 7379} {"train_loss": -28.24481201171875, "global_step": 612495, "epoch": 7379} {"train_loss": -28.396759033203125, "global_step": 612496, "epoch": 7379} {"train_loss": -28.199970245361328, "global_step": 612497, "epoch": 7379} {"train_loss": -28.29660415649414, "global_step": 612498, "epoch": 7379} {"train_loss": -28.229516983032227, "global_step": 612499, "epoch": 7379} {"train_loss": -28.225698471069336, "global_step": 612500, "epoch": 7379} {"train_loss": -27.85357093811035, "global_step": 612501, "epoch": 7379} {"train_loss": -27.92620849609375, "global_step": 612502, "epoch": 7379} {"train_loss": -27.833209991455078, "global_step": 612503, "epoch": 7379} {"train_loss": -28.104598999023438, "global_step": 612504, "epoch": 7379} {"train_loss": -27.905216217041016, "global_step": 612505, "epoch": 7379} {"train_loss": -28.263996124267578, "global_step": 612506, "epoch": 7379} {"train_loss": -28.063108444213867, "global_step": 612507, "epoch": 7379} {"train_loss": -27.88519287109375, "global_step": 612508, "epoch": 7379} {"train_loss": -27.90723991394043, "global_step": 612509, "epoch": 7379} {"train_loss": -27.927549362182617, "global_step": 612510, "epoch": 7379} {"train_loss": -27.798816680908203, "global_step": 612511, "epoch": 7379} {"train_loss": -27.981281280517578, "global_step": 612512, "epoch": 7379} {"train_loss": -28.3525447845459, "global_step": 612513, "epoch": 7379} {"train_loss": -27.625707626342773, "global_step": 612514, "epoch": 7379} {"train_loss": -28.003183364868164, "global_step": 612515, "epoch": 7379} {"train_loss": -28.6564884185791, "global_step": 612516, "epoch": 7379} {"train_loss": -27.548139572143555, "global_step": 612517, "epoch": 7379} {"train_loss": -27.62751579284668, "global_step": 612518, "epoch": 7379} {"train_loss": -27.238309860229492, "global_step": 612519, "epoch": 7379} {"train_loss": -27.901037216186523, "global_step": 612520, "epoch": 7379} {"train_loss": -27.537137985229492, "global_step": 612521, "epoch": 7379} {"train_loss": -27.369369506835938, "global_step": 612522, "epoch": 7379} {"train_loss": -27.670963287353516, "global_step": 612523, "epoch": 7379} {"train_loss": -27.39984130859375, "global_step": 612524, "epoch": 7379} {"train_loss": -27.64670181274414, "global_step": 612525, "epoch": 7379} {"train_loss": -27.604156494140625, "global_step": 612526, "epoch": 7379} {"train_loss": -28.098173141479492, "global_step": 612527, "epoch": 7379} {"train_loss": -27.698486328125, "global_step": 612528, "epoch": 7379} {"train_loss": -28.264387130737305, "global_step": 612529, "epoch": 7379} {"train_loss": -27.602420806884766, "global_step": 612530, "epoch": 7379} {"train_loss": -27.92573356628418, "global_step": 612531, "epoch": 7379} {"train_loss": -28.03311538696289, "global_step": 612532, "epoch": 7379} {"train_loss": -28.02495765686035, "global_step": 612533, "epoch": 7379} {"train_loss": -28.041624069213867, "global_step": 612534, "epoch": 7379} {"train_loss": -28.173053741455078, "global_step": 612535, "epoch": 7379} {"train_loss": -28.02094078063965, "global_step": 612536, "epoch": 7379} {"train_loss": -27.913049697875977, "global_step": 612537, "epoch": 7379} {"train_loss": -28.1735897064209, "global_step": 612538, "epoch": 7379} {"train_loss": -27.839221954345703, "global_step": 612539, "epoch": 7379, "val_loss": 6672452.0} {"train_loss": -27.577524185180664, "global_step": 612540, "epoch": 7380} {"train_loss": -27.463043212890625, "global_step": 612541, "epoch": 7380} {"train_loss": -26.885650634765625, "global_step": 612542, "epoch": 7380} {"train_loss": -27.872577667236328, "global_step": 612543, "epoch": 7380} {"train_loss": -27.3637638092041, "global_step": 612544, "epoch": 7380} {"train_loss": -27.341999053955078, "global_step": 612545, "epoch": 7380} {"train_loss": -27.965015411376953, "global_step": 612546, "epoch": 7380} {"train_loss": -27.4477596282959, "global_step": 612547, "epoch": 7380} {"train_loss": -27.450464248657227, "global_step": 612548, "epoch": 7380} {"train_loss": -27.436664581298828, "global_step": 612549, "epoch": 7380} {"train_loss": -28.04856300354004, "global_step": 612550, "epoch": 7380} {"train_loss": -28.03508949279785, "global_step": 612551, "epoch": 7380} {"train_loss": -28.097936630249023, "global_step": 612552, "epoch": 7380} {"train_loss": -27.73980712890625, "global_step": 612553, "epoch": 7380} {"train_loss": -27.769994735717773, "global_step": 612554, "epoch": 7380} {"train_loss": -28.035078048706055, "global_step": 612555, "epoch": 7380} {"train_loss": -27.730209350585938, "global_step": 612556, "epoch": 7380} {"train_loss": -27.680877685546875, "global_step": 612557, "epoch": 7380} {"train_loss": -27.860355377197266, "global_step": 612558, "epoch": 7380} {"train_loss": -27.846282958984375, "global_step": 612559, "epoch": 7380} {"train_loss": -28.08405876159668, "global_step": 612560, "epoch": 7380} {"train_loss": -28.32343864440918, "global_step": 612561, "epoch": 7380} {"train_loss": -28.061681747436523, "global_step": 612562, "epoch": 7380} {"train_loss": -28.137866973876953, "global_step": 612563, "epoch": 7380} {"train_loss": -28.1363582611084, "global_step": 612564, "epoch": 7380} {"train_loss": -28.34528160095215, "global_step": 612565, "epoch": 7380} {"train_loss": -27.951435089111328, "global_step": 612566, "epoch": 7380} {"train_loss": -28.358179092407227, "global_step": 612567, "epoch": 7380} {"train_loss": -28.098241806030273, "global_step": 612568, "epoch": 7380} {"train_loss": -28.222578048706055, "global_step": 612569, "epoch": 7380} {"train_loss": -28.1167049407959, "global_step": 612570, "epoch": 7380} {"train_loss": -28.234695434570312, "global_step": 612571, "epoch": 7380} {"train_loss": -28.322509765625, "global_step": 612572, "epoch": 7380} {"train_loss": -27.856124877929688, "global_step": 612573, "epoch": 7380} {"train_loss": -28.1715030670166, "global_step": 612574, "epoch": 7380} {"train_loss": -28.300642013549805, "global_step": 612575, "epoch": 7380} {"train_loss": -28.125564575195312, "global_step": 612576, "epoch": 7380} {"train_loss": -28.262802124023438, "global_step": 612577, "epoch": 7380} {"train_loss": -28.239730834960938, "global_step": 612578, "epoch": 7380} {"train_loss": -28.037216186523438, "global_step": 612579, "epoch": 7380} {"train_loss": -28.097579956054688, "global_step": 612580, "epoch": 7380} {"train_loss": -27.55885124206543, "global_step": 612581, "epoch": 7380} {"train_loss": -27.96027183532715, "global_step": 612582, "epoch": 7380} {"train_loss": -27.988239288330078, "global_step": 612583, "epoch": 7380} {"train_loss": -28.139801025390625, "global_step": 612584, "epoch": 7380} {"train_loss": -28.332172393798828, "global_step": 612585, "epoch": 7380} {"train_loss": -28.076963424682617, "global_step": 612586, "epoch": 7380} {"train_loss": -27.79640007019043, "global_step": 612587, "epoch": 7380} {"train_loss": -27.45979118347168, "global_step": 612588, "epoch": 7380} {"train_loss": -28.382205963134766, "global_step": 612589, "epoch": 7380} {"train_loss": -28.283008575439453, "global_step": 612590, "epoch": 7380} {"train_loss": -27.83391761779785, "global_step": 612591, "epoch": 7380} {"train_loss": -28.2315616607666, "global_step": 612592, "epoch": 7380} {"train_loss": -28.008535385131836, "global_step": 612593, "epoch": 7380} {"train_loss": -28.11060905456543, "global_step": 612594, "epoch": 7380} {"train_loss": -28.241657257080078, "global_step": 612595, "epoch": 7380} {"train_loss": -28.492902755737305, "global_step": 612596, "epoch": 7380} {"train_loss": -28.218862533569336, "global_step": 612597, "epoch": 7380} {"train_loss": -28.2468204498291, "global_step": 612598, "epoch": 7380} {"train_loss": -28.095640182495117, "global_step": 612599, "epoch": 7380} {"train_loss": -28.061309814453125, "global_step": 612600, "epoch": 7380} {"train_loss": -28.11285400390625, "global_step": 612601, "epoch": 7380} {"train_loss": -28.149961471557617, "global_step": 612602, "epoch": 7380} {"train_loss": -28.003149032592773, "global_step": 612603, "epoch": 7380} {"train_loss": -28.438230514526367, "global_step": 612604, "epoch": 7380} {"train_loss": -28.052997589111328, "global_step": 612605, "epoch": 7380} {"train_loss": -28.184961318969727, "global_step": 612606, "epoch": 7380} {"train_loss": -28.185956954956055, "global_step": 612607, "epoch": 7380} {"train_loss": -27.697473526000977, "global_step": 612608, "epoch": 7380} {"train_loss": -27.95415687561035, "global_step": 612609, "epoch": 7380} {"train_loss": -27.970142364501953, "global_step": 612610, "epoch": 7380} {"train_loss": -28.012775421142578, "global_step": 612611, "epoch": 7380} {"train_loss": -28.2801513671875, "global_step": 612612, "epoch": 7380} {"train_loss": -27.88473892211914, "global_step": 612613, "epoch": 7380} {"train_loss": -27.854944229125977, "global_step": 612614, "epoch": 7380} {"train_loss": -27.944211959838867, "global_step": 612615, "epoch": 7380} {"train_loss": -27.903242111206055, "global_step": 612616, "epoch": 7380} {"train_loss": -28.119897842407227, "global_step": 612617, "epoch": 7380} {"train_loss": -28.32257080078125, "global_step": 612618, "epoch": 7380} {"train_loss": -28.371435165405273, "global_step": 612619, "epoch": 7380} {"train_loss": -27.942304611206055, "global_step": 612620, "epoch": 7380} {"train_loss": -28.06103515625, "global_step": 612621, "epoch": 7380} {"train_loss": -28.01213338001665, "global_step": 612622, "epoch": 7380, "val_loss": 6612546.0} {"train_loss": -27.80034828186035, "global_step": 612623, "epoch": 7381} {"train_loss": -27.55141258239746, "global_step": 612624, "epoch": 7381} {"train_loss": -27.441558837890625, "global_step": 612625, "epoch": 7381} {"train_loss": -27.638900756835938, "global_step": 612626, "epoch": 7381} {"train_loss": -27.60703468322754, "global_step": 612627, "epoch": 7381} {"train_loss": -27.686365127563477, "global_step": 612628, "epoch": 7381} {"train_loss": -27.860937118530273, "global_step": 612629, "epoch": 7381} {"train_loss": -27.62494468688965, "global_step": 612630, "epoch": 7381} {"train_loss": -27.55933952331543, "global_step": 612631, "epoch": 7381} {"train_loss": -27.822513580322266, "global_step": 612632, "epoch": 7381} {"train_loss": -27.94526481628418, "global_step": 612633, "epoch": 7381} {"train_loss": -27.890684127807617, "global_step": 612634, "epoch": 7381} {"train_loss": -28.199567794799805, "global_step": 612635, "epoch": 7381} {"train_loss": -27.807758331298828, "global_step": 612636, "epoch": 7381} {"train_loss": -27.777326583862305, "global_step": 612637, "epoch": 7381} {"train_loss": -27.95623207092285, "global_step": 612638, "epoch": 7381} {"train_loss": -27.77849769592285, "global_step": 612639, "epoch": 7381} {"train_loss": -27.89918327331543, "global_step": 612640, "epoch": 7381} {"train_loss": -28.123458862304688, "global_step": 612641, "epoch": 7381} {"train_loss": -27.8629150390625, "global_step": 612642, "epoch": 7381} {"train_loss": -28.09132194519043, "global_step": 612643, "epoch": 7381} {"train_loss": -28.3621883392334, "global_step": 612644, "epoch": 7381} {"train_loss": -27.99525260925293, "global_step": 612645, "epoch": 7381} {"train_loss": -28.038501739501953, "global_step": 612646, "epoch": 7381} {"train_loss": -28.132659912109375, "global_step": 612647, "epoch": 7381} {"train_loss": -28.03496742248535, "global_step": 612648, "epoch": 7381} {"train_loss": -28.199934005737305, "global_step": 612649, "epoch": 7381} {"train_loss": -27.914081573486328, "global_step": 612650, "epoch": 7381} {"train_loss": -28.317874908447266, "global_step": 612651, "epoch": 7381} {"train_loss": -28.416101455688477, "global_step": 612652, "epoch": 7381} {"train_loss": -28.00154685974121, "global_step": 612653, "epoch": 7381} {"train_loss": -28.211273193359375, "global_step": 612654, "epoch": 7381} {"train_loss": -27.976181030273438, "global_step": 612655, "epoch": 7381} {"train_loss": -28.123010635375977, "global_step": 612656, "epoch": 7381} {"train_loss": -28.2587947845459, "global_step": 612657, "epoch": 7381} {"train_loss": -27.922475814819336, "global_step": 612658, "epoch": 7381} {"train_loss": -28.261917114257812, "global_step": 612659, "epoch": 7381} {"train_loss": -28.478097915649414, "global_step": 612660, "epoch": 7381} {"train_loss": -27.75806999206543, "global_step": 612661, "epoch": 7381} {"train_loss": -28.42469596862793, "global_step": 612662, "epoch": 7381} {"train_loss": -28.096426010131836, "global_step": 612663, "epoch": 7381} {"train_loss": -28.24933433532715, "global_step": 612664, "epoch": 7381} {"train_loss": -28.26434898376465, "global_step": 612665, "epoch": 7381} {"train_loss": -28.47505760192871, "global_step": 612666, "epoch": 7381} {"train_loss": -28.1942195892334, "global_step": 612667, "epoch": 7381} {"train_loss": -27.61643409729004, "global_step": 612668, "epoch": 7381} {"train_loss": -27.53535270690918, "global_step": 612669, "epoch": 7381} {"train_loss": -26.694995880126953, "global_step": 612670, "epoch": 7381} {"train_loss": -25.8195858001709, "global_step": 612671, "epoch": 7381} {"train_loss": -26.75214958190918, "global_step": 612672, "epoch": 7381} {"train_loss": -27.907739639282227, "global_step": 612673, "epoch": 7381} {"train_loss": -27.512531280517578, "global_step": 612674, "epoch": 7381} {"train_loss": -27.803985595703125, "global_step": 612675, "epoch": 7381} {"train_loss": -27.501447677612305, "global_step": 612676, "epoch": 7381} {"train_loss": -28.020612716674805, "global_step": 612677, "epoch": 7381} {"train_loss": -27.307336807250977, "global_step": 612678, "epoch": 7381} {"train_loss": -27.901447296142578, "global_step": 612679, "epoch": 7381} {"train_loss": -27.289304733276367, "global_step": 612680, "epoch": 7381} {"train_loss": -27.963048934936523, "global_step": 612681, "epoch": 7381} {"train_loss": -27.845884323120117, "global_step": 612682, "epoch": 7381} {"train_loss": -27.81768798828125, "global_step": 612683, "epoch": 7381} {"train_loss": -28.12271499633789, "global_step": 612684, "epoch": 7381} {"train_loss": -27.4154109954834, "global_step": 612685, "epoch": 7381} {"train_loss": -28.162887573242188, "global_step": 612686, "epoch": 7381} {"train_loss": -27.590147018432617, "global_step": 612687, "epoch": 7381} {"train_loss": -27.81965446472168, "global_step": 612688, "epoch": 7381} {"train_loss": -27.971403121948242, "global_step": 612689, "epoch": 7381} {"train_loss": -27.8007755279541, "global_step": 612690, "epoch": 7381} {"train_loss": -28.257160186767578, "global_step": 612691, "epoch": 7381} {"train_loss": -27.93771743774414, "global_step": 612692, "epoch": 7381} {"train_loss": -27.877843856811523, "global_step": 612693, "epoch": 7381} {"train_loss": -27.90130043029785, "global_step": 612694, "epoch": 7381} {"train_loss": -27.988508224487305, "global_step": 612695, "epoch": 7381} {"train_loss": -27.79524040222168, "global_step": 612696, "epoch": 7381} {"train_loss": -28.166677474975586, "global_step": 612697, "epoch": 7381} {"train_loss": -27.946014404296875, "global_step": 612698, "epoch": 7381} {"train_loss": -27.885608673095703, "global_step": 612699, "epoch": 7381} {"train_loss": -27.89288902282715, "global_step": 612700, "epoch": 7381} {"train_loss": -28.080305099487305, "global_step": 612701, "epoch": 7381} {"train_loss": -28.201711654663086, "global_step": 612702, "epoch": 7381} {"train_loss": -28.137622833251953, "global_step": 612703, "epoch": 7381} {"train_loss": -27.95956802368164, "global_step": 612704, "epoch": 7381} {"train_loss": -27.882650145565172, "global_step": 612705, "epoch": 7381, "val_loss": 6635324.5} {"train_loss": -28.21588706970215, "global_step": 612706, "epoch": 7382} {"train_loss": -27.837438583374023, "global_step": 612707, "epoch": 7382} {"train_loss": -27.6270751953125, "global_step": 612708, "epoch": 7382} {"train_loss": -27.958250045776367, "global_step": 612709, "epoch": 7382} {"train_loss": -27.59185791015625, "global_step": 612710, "epoch": 7382} {"train_loss": -27.76348304748535, "global_step": 612711, "epoch": 7382} {"train_loss": -28.13150978088379, "global_step": 612712, "epoch": 7382} {"train_loss": -28.428415298461914, "global_step": 612713, "epoch": 7382} {"train_loss": -28.323209762573242, "global_step": 612714, "epoch": 7382} {"train_loss": -28.289945602416992, "global_step": 612715, "epoch": 7382} {"train_loss": -27.921112060546875, "global_step": 612716, "epoch": 7382} {"train_loss": -27.855321884155273, "global_step": 612717, "epoch": 7382} {"train_loss": -28.238004684448242, "global_step": 612718, "epoch": 7382} {"train_loss": -28.201391220092773, "global_step": 612719, "epoch": 7382} {"train_loss": -28.207828521728516, "global_step": 612720, "epoch": 7382} {"train_loss": -27.86768913269043, "global_step": 612721, "epoch": 7382} {"train_loss": -28.025739669799805, "global_step": 612722, "epoch": 7382} {"train_loss": -28.23317527770996, "global_step": 612723, "epoch": 7382} {"train_loss": -28.13075065612793, "global_step": 612724, "epoch": 7382} {"train_loss": -28.08576774597168, "global_step": 612725, "epoch": 7382} {"train_loss": -28.282257080078125, "global_step": 612726, "epoch": 7382} {"train_loss": -28.407514572143555, "global_step": 612727, "epoch": 7382} {"train_loss": -28.293066024780273, "global_step": 612728, "epoch": 7382} {"train_loss": -28.39290428161621, "global_step": 612729, "epoch": 7382} {"train_loss": -28.30503273010254, "global_step": 612730, "epoch": 7382} {"train_loss": -28.057336807250977, "global_step": 612731, "epoch": 7382} {"train_loss": -28.37346839904785, "global_step": 612732, "epoch": 7382} {"train_loss": -28.0043888092041, "global_step": 612733, "epoch": 7382} {"train_loss": -28.24232292175293, "global_step": 612734, "epoch": 7382} {"train_loss": -28.213775634765625, "global_step": 612735, "epoch": 7382} {"train_loss": -28.4102840423584, "global_step": 612736, "epoch": 7382} {"train_loss": -28.655364990234375, "global_step": 612737, "epoch": 7382} {"train_loss": -28.461042404174805, "global_step": 612738, "epoch": 7382} {"train_loss": -28.472888946533203, "global_step": 612739, "epoch": 7382} {"train_loss": -28.190160751342773, "global_step": 612740, "epoch": 7382} {"train_loss": -28.286218643188477, "global_step": 612741, "epoch": 7382} {"train_loss": -28.2364501953125, "global_step": 612742, "epoch": 7382} {"train_loss": -28.330875396728516, "global_step": 612743, "epoch": 7382} {"train_loss": -28.530914306640625, "global_step": 612744, "epoch": 7382} {"train_loss": -28.244970321655273, "global_step": 612745, "epoch": 7382} {"train_loss": -28.175806045532227, "global_step": 612746, "epoch": 7382} {"train_loss": -28.533384323120117, "global_step": 612747, "epoch": 7382} {"train_loss": -28.02046775817871, "global_step": 612748, "epoch": 7382} {"train_loss": -28.07440185546875, "global_step": 612749, "epoch": 7382} {"train_loss": -27.9196720123291, "global_step": 612750, "epoch": 7382} {"train_loss": -28.140247344970703, "global_step": 612751, "epoch": 7382} {"train_loss": -28.277130126953125, "global_step": 612752, "epoch": 7382} {"train_loss": -27.56217384338379, "global_step": 612753, "epoch": 7382} {"train_loss": -26.519397735595703, "global_step": 612754, "epoch": 7382} {"train_loss": -26.8950252532959, "global_step": 612755, "epoch": 7382} {"train_loss": -27.54810905456543, "global_step": 612756, "epoch": 7382} {"train_loss": -27.91749382019043, "global_step": 612757, "epoch": 7382} {"train_loss": -27.478992462158203, "global_step": 612758, "epoch": 7382} {"train_loss": -27.57610511779785, "global_step": 612759, "epoch": 7382} {"train_loss": -27.820737838745117, "global_step": 612760, "epoch": 7382} {"train_loss": -27.973892211914062, "global_step": 612761, "epoch": 7382} {"train_loss": -27.85462760925293, "global_step": 612762, "epoch": 7382} {"train_loss": -27.779666900634766, "global_step": 612763, "epoch": 7382} {"train_loss": -27.791290283203125, "global_step": 612764, "epoch": 7382} {"train_loss": -28.20880126953125, "global_step": 612765, "epoch": 7382} {"train_loss": -27.62470054626465, "global_step": 612766, "epoch": 7382} {"train_loss": -27.806161880493164, "global_step": 612767, "epoch": 7382} {"train_loss": -27.54152488708496, "global_step": 612768, "epoch": 7382} {"train_loss": -28.14320945739746, "global_step": 612769, "epoch": 7382} {"train_loss": -28.002111434936523, "global_step": 612770, "epoch": 7382} {"train_loss": -27.956695556640625, "global_step": 612771, "epoch": 7382} {"train_loss": -27.852813720703125, "global_step": 612772, "epoch": 7382} {"train_loss": -28.303869247436523, "global_step": 612773, "epoch": 7382} {"train_loss": -27.92231559753418, "global_step": 612774, "epoch": 7382} {"train_loss": -27.994827270507812, "global_step": 612775, "epoch": 7382} {"train_loss": -27.936553955078125, "global_step": 612776, "epoch": 7382} {"train_loss": -28.35591697692871, "global_step": 612777, "epoch": 7382} {"train_loss": -28.390583038330078, "global_step": 612778, "epoch": 7382} {"train_loss": -27.926483154296875, "global_step": 612779, "epoch": 7382} {"train_loss": -28.078754425048828, "global_step": 612780, "epoch": 7382} {"train_loss": -28.690153121948242, "global_step": 612781, "epoch": 7382} {"train_loss": -27.913436889648438, "global_step": 612782, "epoch": 7382} {"train_loss": -28.074298858642578, "global_step": 612783, "epoch": 7382} {"train_loss": -28.18726921081543, "global_step": 612784, "epoch": 7382} {"train_loss": -27.770856857299805, "global_step": 612785, "epoch": 7382} {"train_loss": -28.18707847595215, "global_step": 612786, "epoch": 7382} {"train_loss": -28.367502212524414, "global_step": 612787, "epoch": 7382} {"train_loss": -28.05070571439812, "global_step": 612788, "epoch": 7382, "val_loss": 6645572.5} {"train_loss": -27.540353775024414, "global_step": 612789, "epoch": 7383} {"train_loss": -27.207563400268555, "global_step": 612790, "epoch": 7383} {"train_loss": -28.188251495361328, "global_step": 612791, "epoch": 7383} {"train_loss": -27.124897003173828, "global_step": 612792, "epoch": 7383} {"train_loss": -27.307586669921875, "global_step": 612793, "epoch": 7383} {"train_loss": -27.67828941345215, "global_step": 612794, "epoch": 7383} {"train_loss": -27.976770401000977, "global_step": 612795, "epoch": 7383} {"train_loss": -27.696699142456055, "global_step": 612796, "epoch": 7383} {"train_loss": -27.361907958984375, "global_step": 612797, "epoch": 7383} {"train_loss": -27.874908447265625, "global_step": 612798, "epoch": 7383} {"train_loss": -27.702905654907227, "global_step": 612799, "epoch": 7383} {"train_loss": -27.86970329284668, "global_step": 612800, "epoch": 7383} {"train_loss": -27.577743530273438, "global_step": 612801, "epoch": 7383} {"train_loss": -27.58851432800293, "global_step": 612802, "epoch": 7383} {"train_loss": -28.262012481689453, "global_step": 612803, "epoch": 7383} {"train_loss": -28.029296875, "global_step": 612804, "epoch": 7383} {"train_loss": -27.897104263305664, "global_step": 612805, "epoch": 7383} {"train_loss": -28.08411979675293, "global_step": 612806, "epoch": 7383} {"train_loss": -27.77589988708496, "global_step": 612807, "epoch": 7383} {"train_loss": -28.439184188842773, "global_step": 612808, "epoch": 7383} {"train_loss": -28.44512367248535, "global_step": 612809, "epoch": 7383} {"train_loss": -28.31941032409668, "global_step": 612810, "epoch": 7383} {"train_loss": -28.422199249267578, "global_step": 612811, "epoch": 7383} {"train_loss": -28.119543075561523, "global_step": 612812, "epoch": 7383} {"train_loss": -27.843585968017578, "global_step": 612813, "epoch": 7383} {"train_loss": -28.201208114624023, "global_step": 612814, "epoch": 7383} {"train_loss": -28.1699275970459, "global_step": 612815, "epoch": 7383} {"train_loss": -28.291107177734375, "global_step": 612816, "epoch": 7383} {"train_loss": -27.85991859436035, "global_step": 612817, "epoch": 7383} {"train_loss": -28.02703285217285, "global_step": 612818, "epoch": 7383} {"train_loss": -28.113977432250977, "global_step": 612819, "epoch": 7383} {"train_loss": -28.09765625, "global_step": 612820, "epoch": 7383} {"train_loss": -28.467527389526367, "global_step": 612821, "epoch": 7383} {"train_loss": -28.1259765625, "global_step": 612822, "epoch": 7383} {"train_loss": -27.916584014892578, "global_step": 612823, "epoch": 7383} {"train_loss": -27.86774253845215, "global_step": 612824, "epoch": 7383} {"train_loss": -27.529272079467773, "global_step": 612825, "epoch": 7383} {"train_loss": -28.0752010345459, "global_step": 612826, "epoch": 7383} {"train_loss": -27.95524024963379, "global_step": 612827, "epoch": 7383} {"train_loss": -28.264514923095703, "global_step": 612828, "epoch": 7383} {"train_loss": -28.38410758972168, "global_step": 612829, "epoch": 7383} {"train_loss": -28.010007858276367, "global_step": 612830, "epoch": 7383} {"train_loss": -28.299652099609375, "global_step": 612831, "epoch": 7383} {"train_loss": -28.1489315032959, "global_step": 612832, "epoch": 7383} {"train_loss": -27.751880645751953, "global_step": 612833, "epoch": 7383} {"train_loss": -28.070545196533203, "global_step": 612834, "epoch": 7383} {"train_loss": -28.018091201782227, "global_step": 612835, "epoch": 7383} {"train_loss": -28.10503578186035, "global_step": 612836, "epoch": 7383} {"train_loss": -28.123640060424805, "global_step": 612837, "epoch": 7383} {"train_loss": -28.118650436401367, "global_step": 612838, "epoch": 7383} {"train_loss": -28.22956657409668, "global_step": 612839, "epoch": 7383} {"train_loss": -28.662450790405273, "global_step": 612840, "epoch": 7383} {"train_loss": -28.46392822265625, "global_step": 612841, "epoch": 7383} {"train_loss": -28.167814254760742, "global_step": 612842, "epoch": 7383} {"train_loss": -28.658533096313477, "global_step": 612843, "epoch": 7383} {"train_loss": -28.21567153930664, "global_step": 612844, "epoch": 7383} {"train_loss": -28.205358505249023, "global_step": 612845, "epoch": 7383} {"train_loss": -27.99104118347168, "global_step": 612846, "epoch": 7383} {"train_loss": -27.9456844329834, "global_step": 612847, "epoch": 7383} {"train_loss": -28.357288360595703, "global_step": 612848, "epoch": 7383} {"train_loss": -28.33540153503418, "global_step": 612849, "epoch": 7383} {"train_loss": -28.446805953979492, "global_step": 612850, "epoch": 7383} {"train_loss": -28.1351318359375, "global_step": 612851, "epoch": 7383} {"train_loss": -27.58356285095215, "global_step": 612852, "epoch": 7383} {"train_loss": -28.0640926361084, "global_step": 612853, "epoch": 7383} {"train_loss": -28.015899658203125, "global_step": 612854, "epoch": 7383} {"train_loss": -27.599273681640625, "global_step": 612855, "epoch": 7383} {"train_loss": -28.27326774597168, "global_step": 612856, "epoch": 7383} {"train_loss": -28.013965606689453, "global_step": 612857, "epoch": 7383} {"train_loss": -27.916540145874023, "global_step": 612858, "epoch": 7383} {"train_loss": -27.87980079650879, "global_step": 612859, "epoch": 7383} {"train_loss": -28.091028213500977, "global_step": 612860, "epoch": 7383} {"train_loss": -27.878509521484375, "global_step": 612861, "epoch": 7383} {"train_loss": -28.1230525970459, "global_step": 612862, "epoch": 7383} {"train_loss": -27.994043350219727, "global_step": 612863, "epoch": 7383} {"train_loss": -28.261560440063477, "global_step": 612864, "epoch": 7383} {"train_loss": -28.225650787353516, "global_step": 612865, "epoch": 7383} {"train_loss": -28.11236000061035, "global_step": 612866, "epoch": 7383} {"train_loss": -28.049640655517578, "global_step": 612867, "epoch": 7383} {"train_loss": -27.892822265625, "global_step": 612868, "epoch": 7383} {"train_loss": -28.300262451171875, "global_step": 612869, "epoch": 7383} {"train_loss": -27.81247329711914, "global_step": 612870, "epoch": 7383} {"train_loss": -28.022164884820043, "global_step": 612871, "epoch": 7383, "val_loss": 6553819.0} {"train_loss": -27.974332809448242, "global_step": 612872, "epoch": 7384} {"train_loss": -27.30914878845215, "global_step": 612873, "epoch": 7384} {"train_loss": -27.37542724609375, "global_step": 612874, "epoch": 7384} {"train_loss": -27.13820457458496, "global_step": 612875, "epoch": 7384} {"train_loss": -27.74427604675293, "global_step": 612876, "epoch": 7384} {"train_loss": -28.065826416015625, "global_step": 612877, "epoch": 7384} {"train_loss": -27.831235885620117, "global_step": 612878, "epoch": 7384} {"train_loss": -28.13232421875, "global_step": 612879, "epoch": 7384} {"train_loss": -27.548084259033203, "global_step": 612880, "epoch": 7384} {"train_loss": -27.837234497070312, "global_step": 612881, "epoch": 7384} {"train_loss": -27.58086585998535, "global_step": 612882, "epoch": 7384} {"train_loss": -27.98627281188965, "global_step": 612883, "epoch": 7384} {"train_loss": -27.783491134643555, "global_step": 612884, "epoch": 7384} {"train_loss": -27.91764259338379, "global_step": 612885, "epoch": 7384} {"train_loss": -28.023645401000977, "global_step": 612886, "epoch": 7384} {"train_loss": -27.764652252197266, "global_step": 612887, "epoch": 7384} {"train_loss": -28.009241104125977, "global_step": 612888, "epoch": 7384} {"train_loss": -27.832788467407227, "global_step": 612889, "epoch": 7384} {"train_loss": -28.02875328063965, "global_step": 612890, "epoch": 7384} {"train_loss": -28.370824813842773, "global_step": 612891, "epoch": 7384} {"train_loss": -27.946374893188477, "global_step": 612892, "epoch": 7384} {"train_loss": -28.167551040649414, "global_step": 612893, "epoch": 7384} {"train_loss": -28.17547035217285, "global_step": 612894, "epoch": 7384} {"train_loss": -28.027318954467773, "global_step": 612895, "epoch": 7384} {"train_loss": -27.909997940063477, "global_step": 612896, "epoch": 7384} {"train_loss": -28.285755157470703, "global_step": 612897, "epoch": 7384} {"train_loss": -28.13826560974121, "global_step": 612898, "epoch": 7384} {"train_loss": -28.156238555908203, "global_step": 612899, "epoch": 7384} {"train_loss": -27.96796226501465, "global_step": 612900, "epoch": 7384} {"train_loss": -28.15531349182129, "global_step": 612901, "epoch": 7384} {"train_loss": -28.339954376220703, "global_step": 612902, "epoch": 7384} {"train_loss": -28.008941650390625, "global_step": 612903, "epoch": 7384} {"train_loss": -28.12090492248535, "global_step": 612904, "epoch": 7384} {"train_loss": -27.982269287109375, "global_step": 612905, "epoch": 7384} {"train_loss": -27.947540283203125, "global_step": 612906, "epoch": 7384} {"train_loss": -28.208723068237305, "global_step": 612907, "epoch": 7384} {"train_loss": -28.051727294921875, "global_step": 612908, "epoch": 7384} {"train_loss": -28.069623947143555, "global_step": 612909, "epoch": 7384} {"train_loss": -28.136396408081055, "global_step": 612910, "epoch": 7384} {"train_loss": -28.072956085205078, "global_step": 612911, "epoch": 7384} {"train_loss": -28.05385398864746, "global_step": 612912, "epoch": 7384} {"train_loss": -28.072845458984375, "global_step": 612913, "epoch": 7384} {"train_loss": -28.09842872619629, "global_step": 612914, "epoch": 7384} {"train_loss": -28.0577335357666, "global_step": 612915, "epoch": 7384} {"train_loss": -28.302831649780273, "global_step": 612916, "epoch": 7384} {"train_loss": -27.99738883972168, "global_step": 612917, "epoch": 7384} {"train_loss": -28.318490982055664, "global_step": 612918, "epoch": 7384} {"train_loss": -28.520593643188477, "global_step": 612919, "epoch": 7384} {"train_loss": -28.24027442932129, "global_step": 612920, "epoch": 7384} {"train_loss": -28.30426597595215, "global_step": 612921, "epoch": 7384} {"train_loss": -28.275711059570312, "global_step": 612922, "epoch": 7384} {"train_loss": -28.045927047729492, "global_step": 612923, "epoch": 7384} {"train_loss": -28.145862579345703, "global_step": 612924, "epoch": 7384} {"train_loss": -28.340551376342773, "global_step": 612925, "epoch": 7384} {"train_loss": -28.150836944580078, "global_step": 612926, "epoch": 7384} {"train_loss": -28.364715576171875, "global_step": 612927, "epoch": 7384} {"train_loss": -27.882841110229492, "global_step": 612928, "epoch": 7384} {"train_loss": -27.931119918823242, "global_step": 612929, "epoch": 7384} {"train_loss": -26.971288681030273, "global_step": 612930, "epoch": 7384} {"train_loss": -25.668415069580078, "global_step": 612931, "epoch": 7384} {"train_loss": -26.002029418945312, "global_step": 612932, "epoch": 7384} {"train_loss": -26.919891357421875, "global_step": 612933, "epoch": 7384} {"train_loss": -27.735769271850586, "global_step": 612934, "epoch": 7384} {"train_loss": -26.83881950378418, "global_step": 612935, "epoch": 7384} {"train_loss": -27.512271881103516, "global_step": 612936, "epoch": 7384} {"train_loss": -27.491601943969727, "global_step": 612937, "epoch": 7384} {"train_loss": -27.750141143798828, "global_step": 612938, "epoch": 7384} {"train_loss": -26.969152450561523, "global_step": 612939, "epoch": 7384} {"train_loss": -27.771625518798828, "global_step": 612940, "epoch": 7384} {"train_loss": -27.540502548217773, "global_step": 612941, "epoch": 7384} {"train_loss": -27.324472427368164, "global_step": 612942, "epoch": 7384} {"train_loss": -27.820356369018555, "global_step": 612943, "epoch": 7384} {"train_loss": -27.887542724609375, "global_step": 612944, "epoch": 7384} {"train_loss": -27.260404586791992, "global_step": 612945, "epoch": 7384} {"train_loss": -27.264135360717773, "global_step": 612946, "epoch": 7384} {"train_loss": -27.818286895751953, "global_step": 612947, "epoch": 7384} {"train_loss": -27.6903018951416, "global_step": 612948, "epoch": 7384} {"train_loss": -27.60318946838379, "global_step": 612949, "epoch": 7384} {"train_loss": -27.560632705688477, "global_step": 612950, "epoch": 7384} {"train_loss": -27.58637809753418, "global_step": 612951, "epoch": 7384} {"train_loss": -27.735122680664062, "global_step": 612952, "epoch": 7384} {"train_loss": -27.835962295532227, "global_step": 612953, "epoch": 7384} {"train_loss": -27.832469250782427, "global_step": 612954, "epoch": 7384, "val_loss": 6646072.5} {"train_loss": -27.1422119140625, "global_step": 612955, "epoch": 7385} {"train_loss": -27.466337203979492, "global_step": 612956, "epoch": 7385} {"train_loss": -27.20319938659668, "global_step": 612957, "epoch": 7385} {"train_loss": -28.09589195251465, "global_step": 612958, "epoch": 7385} {"train_loss": -27.695600509643555, "global_step": 612959, "epoch": 7385} {"train_loss": -28.093952178955078, "global_step": 612960, "epoch": 7385} {"train_loss": -27.855817794799805, "global_step": 612961, "epoch": 7385} {"train_loss": -28.073902130126953, "global_step": 612962, "epoch": 7385} {"train_loss": -28.077402114868164, "global_step": 612963, "epoch": 7385} {"train_loss": -27.713058471679688, "global_step": 612964, "epoch": 7385} {"train_loss": -28.005481719970703, "global_step": 612965, "epoch": 7385} {"train_loss": -27.9306640625, "global_step": 612966, "epoch": 7385} {"train_loss": -28.076221466064453, "global_step": 612967, "epoch": 7385} {"train_loss": -27.634302139282227, "global_step": 612968, "epoch": 7385} {"train_loss": -27.962390899658203, "global_step": 612969, "epoch": 7385} {"train_loss": -27.984100341796875, "global_step": 612970, "epoch": 7385} {"train_loss": -28.2133846282959, "global_step": 612971, "epoch": 7385} {"train_loss": -27.635242462158203, "global_step": 612972, "epoch": 7385} {"train_loss": -27.712360382080078, "global_step": 612973, "epoch": 7385} {"train_loss": -28.6113224029541, "global_step": 612974, "epoch": 7385} {"train_loss": -28.175344467163086, "global_step": 612975, "epoch": 7385} {"train_loss": -28.237979888916016, "global_step": 612976, "epoch": 7385} {"train_loss": -28.037572860717773, "global_step": 612977, "epoch": 7385} {"train_loss": -27.999114990234375, "global_step": 612978, "epoch": 7385} {"train_loss": -28.121381759643555, "global_step": 612979, "epoch": 7385} {"train_loss": -28.191740036010742, "global_step": 612980, "epoch": 7385} {"train_loss": -28.45068359375, "global_step": 612981, "epoch": 7385} {"train_loss": -27.798627853393555, "global_step": 612982, "epoch": 7385} {"train_loss": -28.209211349487305, "global_step": 612983, "epoch": 7385} {"train_loss": -28.30068016052246, "global_step": 612984, "epoch": 7385} {"train_loss": -28.3958740234375, "global_step": 612985, "epoch": 7385} {"train_loss": -28.313074111938477, "global_step": 612986, "epoch": 7385} {"train_loss": -28.248722076416016, "global_step": 612987, "epoch": 7385} {"train_loss": -28.488683700561523, "global_step": 612988, "epoch": 7385} {"train_loss": -28.05322265625, "global_step": 612989, "epoch": 7385} {"train_loss": -28.248580932617188, "global_step": 612990, "epoch": 7385} {"train_loss": -28.020231246948242, "global_step": 612991, "epoch": 7385} {"train_loss": -28.269262313842773, "global_step": 612992, "epoch": 7385} {"train_loss": -28.750492095947266, "global_step": 612993, "epoch": 7385} {"train_loss": -27.844043731689453, "global_step": 612994, "epoch": 7385} {"train_loss": -28.177759170532227, "global_step": 612995, "epoch": 7385} {"train_loss": -28.316497802734375, "global_step": 612996, "epoch": 7385} {"train_loss": -28.62078285217285, "global_step": 612997, "epoch": 7385} {"train_loss": -28.297651290893555, "global_step": 612998, "epoch": 7385} {"train_loss": -28.716352462768555, "global_step": 612999, "epoch": 7385} {"train_loss": -28.59848403930664, "global_step": 613000, "epoch": 7385} {"train_loss": -28.608835220336914, "global_step": 613001, "epoch": 7385} {"train_loss": -28.234277725219727, "global_step": 613002, "epoch": 7385} {"train_loss": -28.152118682861328, "global_step": 613003, "epoch": 7385} {"train_loss": -28.495590209960938, "global_step": 613004, "epoch": 7385} {"train_loss": -28.4277286529541, "global_step": 613005, "epoch": 7385} {"train_loss": -28.38443374633789, "global_step": 613006, "epoch": 7385} {"train_loss": -28.400659561157227, "global_step": 613007, "epoch": 7385} {"train_loss": -27.7856388092041, "global_step": 613008, "epoch": 7385} {"train_loss": -28.389795303344727, "global_step": 613009, "epoch": 7385} {"train_loss": -28.38325309753418, "global_step": 613010, "epoch": 7385} {"train_loss": -28.088973999023438, "global_step": 613011, "epoch": 7385} {"train_loss": -27.95118522644043, "global_step": 613012, "epoch": 7385} {"train_loss": -27.6416072845459, "global_step": 613013, "epoch": 7385} {"train_loss": -26.791156768798828, "global_step": 613014, "epoch": 7385} {"train_loss": -26.72931480407715, "global_step": 613015, "epoch": 7385} {"train_loss": -26.719755172729492, "global_step": 613016, "epoch": 7385} {"train_loss": -25.448505401611328, "global_step": 613017, "epoch": 7385} {"train_loss": -24.94057273864746, "global_step": 613018, "epoch": 7385} {"train_loss": -27.586023330688477, "global_step": 613019, "epoch": 7385} {"train_loss": -26.311767578125, "global_step": 613020, "epoch": 7385} {"train_loss": -27.260541915893555, "global_step": 613021, "epoch": 7385} {"train_loss": -27.01246452331543, "global_step": 613022, "epoch": 7385} {"train_loss": -26.974323272705078, "global_step": 613023, "epoch": 7385} {"train_loss": -27.021575927734375, "global_step": 613024, "epoch": 7385} {"train_loss": -27.129093170166016, "global_step": 613025, "epoch": 7385} {"train_loss": -27.0284366607666, "global_step": 613026, "epoch": 7385} {"train_loss": -27.3625431060791, "global_step": 613027, "epoch": 7385} {"train_loss": -27.33601951599121, "global_step": 613028, "epoch": 7385} {"train_loss": -26.985248565673828, "global_step": 613029, "epoch": 7385} {"train_loss": -27.56855583190918, "global_step": 613030, "epoch": 7385} {"train_loss": -27.2718505859375, "global_step": 613031, "epoch": 7385} {"train_loss": -27.109960556030273, "global_step": 613032, "epoch": 7385} {"train_loss": -27.44622802734375, "global_step": 613033, "epoch": 7385} {"train_loss": -26.9979248046875, "global_step": 613034, "epoch": 7385} {"train_loss": -27.39715576171875, "global_step": 613035, "epoch": 7385} {"train_loss": -27.581884384155273, "global_step": 613036, "epoch": 7385} {"train_loss": -27.79497815327472, "global_step": 613037, "epoch": 7385, "val_loss": 6557902.0} {"train_loss": -26.896015167236328, "global_step": 613038, "epoch": 7386} {"train_loss": -27.70172119140625, "global_step": 613039, "epoch": 7386} {"train_loss": -26.85276222229004, "global_step": 613040, "epoch": 7386} {"train_loss": -27.4658260345459, "global_step": 613041, "epoch": 7386} {"train_loss": -27.209360122680664, "global_step": 613042, "epoch": 7386} {"train_loss": -27.5725154876709, "global_step": 613043, "epoch": 7386} {"train_loss": -27.0543270111084, "global_step": 613044, "epoch": 7386} {"train_loss": -27.25200843811035, "global_step": 613045, "epoch": 7386} {"train_loss": -26.783935546875, "global_step": 613046, "epoch": 7386} {"train_loss": -27.686071395874023, "global_step": 613047, "epoch": 7386} {"train_loss": -27.327716827392578, "global_step": 613048, "epoch": 7386} {"train_loss": -27.65704917907715, "global_step": 613049, "epoch": 7386} {"train_loss": -27.17127799987793, "global_step": 613050, "epoch": 7386} {"train_loss": -27.62677574157715, "global_step": 613051, "epoch": 7386} {"train_loss": -27.4158878326416, "global_step": 613052, "epoch": 7386} {"train_loss": -27.716297149658203, "global_step": 613053, "epoch": 7386} {"train_loss": -27.513111114501953, "global_step": 613054, "epoch": 7386} {"train_loss": -27.77268409729004, "global_step": 613055, "epoch": 7386} {"train_loss": -27.866193771362305, "global_step": 613056, "epoch": 7386} {"train_loss": -27.3476505279541, "global_step": 613057, "epoch": 7386} {"train_loss": -27.7426815032959, "global_step": 613058, "epoch": 7386} {"train_loss": -27.93744468688965, "global_step": 613059, "epoch": 7386} {"train_loss": -27.866003036499023, "global_step": 613060, "epoch": 7386} {"train_loss": -28.037649154663086, "global_step": 613061, "epoch": 7386} {"train_loss": -28.209009170532227, "global_step": 613062, "epoch": 7386} {"train_loss": -27.553760528564453, "global_step": 613063, "epoch": 7386} {"train_loss": -27.895307540893555, "global_step": 613064, "epoch": 7386} {"train_loss": -27.776594161987305, "global_step": 613065, "epoch": 7386} {"train_loss": -28.046751022338867, "global_step": 613066, "epoch": 7386} {"train_loss": -27.504291534423828, "global_step": 613067, "epoch": 7386} {"train_loss": -27.86927604675293, "global_step": 613068, "epoch": 7386} {"train_loss": -27.973031997680664, "global_step": 613069, "epoch": 7386} {"train_loss": -28.4617977142334, "global_step": 613070, "epoch": 7386} {"train_loss": -28.043264389038086, "global_step": 613071, "epoch": 7386} {"train_loss": -27.84392738342285, "global_step": 613072, "epoch": 7386} {"train_loss": -28.10560417175293, "global_step": 613073, "epoch": 7386} {"train_loss": -28.105960845947266, "global_step": 613074, "epoch": 7386} {"train_loss": -28.102436065673828, "global_step": 613075, "epoch": 7386} {"train_loss": -27.724258422851562, "global_step": 613076, "epoch": 7386} {"train_loss": -27.8384952545166, "global_step": 613077, "epoch": 7386} {"train_loss": -28.42024040222168, "global_step": 613078, "epoch": 7386} {"train_loss": -28.353351593017578, "global_step": 613079, "epoch": 7386} {"train_loss": -28.203857421875, "global_step": 613080, "epoch": 7386} {"train_loss": -28.36431312561035, "global_step": 613081, "epoch": 7386} {"train_loss": -28.330978393554688, "global_step": 613082, "epoch": 7386} {"train_loss": -28.118982315063477, "global_step": 613083, "epoch": 7386} {"train_loss": -28.62055015563965, "global_step": 613084, "epoch": 7386} {"train_loss": -28.43705177307129, "global_step": 613085, "epoch": 7386} {"train_loss": -28.169591903686523, "global_step": 613086, "epoch": 7386} {"train_loss": -28.187021255493164, "global_step": 613087, "epoch": 7386} {"train_loss": -28.130109786987305, "global_step": 613088, "epoch": 7386} {"train_loss": -28.241865158081055, "global_step": 613089, "epoch": 7386} {"train_loss": -28.278364181518555, "global_step": 613090, "epoch": 7386} {"train_loss": -28.20830726623535, "global_step": 613091, "epoch": 7386} {"train_loss": -28.268081665039062, "global_step": 613092, "epoch": 7386} {"train_loss": -28.42156982421875, "global_step": 613093, "epoch": 7386} {"train_loss": -28.050622940063477, "global_step": 613094, "epoch": 7386} {"train_loss": -28.27069091796875, "global_step": 613095, "epoch": 7386} {"train_loss": -28.415449142456055, "global_step": 613096, "epoch": 7386} {"train_loss": -28.046171188354492, "global_step": 613097, "epoch": 7386} {"train_loss": -28.033267974853516, "global_step": 613098, "epoch": 7386} {"train_loss": -27.476776123046875, "global_step": 613099, "epoch": 7386} {"train_loss": -26.674924850463867, "global_step": 613100, "epoch": 7386} {"train_loss": -26.469411849975586, "global_step": 613101, "epoch": 7386} {"train_loss": -26.6109676361084, "global_step": 613102, "epoch": 7386} {"train_loss": -28.007909774780273, "global_step": 613103, "epoch": 7386} {"train_loss": -28.290390014648438, "global_step": 613104, "epoch": 7386} {"train_loss": -27.670881271362305, "global_step": 613105, "epoch": 7386} {"train_loss": -28.241378784179688, "global_step": 613106, "epoch": 7386} {"train_loss": -27.916086196899414, "global_step": 613107, "epoch": 7386} {"train_loss": -28.314899444580078, "global_step": 613108, "epoch": 7386} {"train_loss": -28.37653160095215, "global_step": 613109, "epoch": 7386} {"train_loss": -27.785369873046875, "global_step": 613110, "epoch": 7386} {"train_loss": -28.04852867126465, "global_step": 613111, "epoch": 7386} {"train_loss": -28.004480361938477, "global_step": 613112, "epoch": 7386} {"train_loss": -27.990493774414062, "global_step": 613113, "epoch": 7386} {"train_loss": -28.150043487548828, "global_step": 613114, "epoch": 7386} {"train_loss": -27.781005859375, "global_step": 613115, "epoch": 7386} {"train_loss": -27.924640655517578, "global_step": 613116, "epoch": 7386} {"train_loss": -28.340391159057617, "global_step": 613117, "epoch": 7386} {"train_loss": -28.046234130859375, "global_step": 613118, "epoch": 7386} {"train_loss": -27.990036010742188, "global_step": 613119, "epoch": 7386} {"train_loss": -27.859337542430463, "global_step": 613120, "epoch": 7386, "val_loss": 6652010.0} {"train_loss": -26.61060905456543, "global_step": 613121, "epoch": 7387} {"train_loss": -27.042287826538086, "global_step": 613122, "epoch": 7387} {"train_loss": -26.080341339111328, "global_step": 613123, "epoch": 7387} {"train_loss": -27.63752555847168, "global_step": 613124, "epoch": 7387} {"train_loss": -26.62482261657715, "global_step": 613125, "epoch": 7387} {"train_loss": -26.95305824279785, "global_step": 613126, "epoch": 7387} {"train_loss": -26.73036003112793, "global_step": 613127, "epoch": 7387} {"train_loss": -27.355432510375977, "global_step": 613128, "epoch": 7387} {"train_loss": -26.64678955078125, "global_step": 613129, "epoch": 7387} {"train_loss": -27.639575958251953, "global_step": 613130, "epoch": 7387} {"train_loss": -27.714197158813477, "global_step": 613131, "epoch": 7387} {"train_loss": -27.650272369384766, "global_step": 613132, "epoch": 7387} {"train_loss": -28.011962890625, "global_step": 613133, "epoch": 7387} {"train_loss": -27.345190048217773, "global_step": 613134, "epoch": 7387} {"train_loss": -28.06744384765625, "global_step": 613135, "epoch": 7387} {"train_loss": -27.546430587768555, "global_step": 613136, "epoch": 7387} {"train_loss": -28.14414405822754, "global_step": 613137, "epoch": 7387} {"train_loss": -27.583349227905273, "global_step": 613138, "epoch": 7387} {"train_loss": -27.9515438079834, "global_step": 613139, "epoch": 7387} {"train_loss": -27.78218650817871, "global_step": 613140, "epoch": 7387} {"train_loss": -27.76250648498535, "global_step": 613141, "epoch": 7387} {"train_loss": -27.8349552154541, "global_step": 613142, "epoch": 7387} {"train_loss": -27.964269638061523, "global_step": 613143, "epoch": 7387} {"train_loss": -27.721261978149414, "global_step": 613144, "epoch": 7387} {"train_loss": -27.870346069335938, "global_step": 613145, "epoch": 7387} {"train_loss": -28.01730728149414, "global_step": 613146, "epoch": 7387} {"train_loss": -28.211782455444336, "global_step": 613147, "epoch": 7387} {"train_loss": -27.820953369140625, "global_step": 613148, "epoch": 7387} {"train_loss": -27.847257614135742, "global_step": 613149, "epoch": 7387} {"train_loss": -27.817916870117188, "global_step": 613150, "epoch": 7387} {"train_loss": -28.326223373413086, "global_step": 613151, "epoch": 7387} {"train_loss": -27.87200927734375, "global_step": 613152, "epoch": 7387} {"train_loss": -28.265827178955078, "global_step": 613153, "epoch": 7387} {"train_loss": -28.472806930541992, "global_step": 613154, "epoch": 7387} {"train_loss": -28.046218872070312, "global_step": 613155, "epoch": 7387} {"train_loss": -28.224775314331055, "global_step": 613156, "epoch": 7387} {"train_loss": -28.26368522644043, "global_step": 613157, "epoch": 7387} {"train_loss": -28.296539306640625, "global_step": 613158, "epoch": 7387} {"train_loss": -28.459125518798828, "global_step": 613159, "epoch": 7387} {"train_loss": -28.368717193603516, "global_step": 613160, "epoch": 7387} {"train_loss": -28.636005401611328, "global_step": 613161, "epoch": 7387} {"train_loss": -28.2849178314209, "global_step": 613162, "epoch": 7387} {"train_loss": -28.297607421875, "global_step": 613163, "epoch": 7387} {"train_loss": -28.158782958984375, "global_step": 613164, "epoch": 7387} {"train_loss": -28.46466064453125, "global_step": 613165, "epoch": 7387} {"train_loss": -28.33042335510254, "global_step": 613166, "epoch": 7387} {"train_loss": -28.23494529724121, "global_step": 613167, "epoch": 7387} {"train_loss": -28.25396156311035, "global_step": 613168, "epoch": 7387} {"train_loss": -28.46539306640625, "global_step": 613169, "epoch": 7387} {"train_loss": -28.206403732299805, "global_step": 613170, "epoch": 7387} {"train_loss": -28.514118194580078, "global_step": 613171, "epoch": 7387} {"train_loss": -28.21173667907715, "global_step": 613172, "epoch": 7387} {"train_loss": -27.967517852783203, "global_step": 613173, "epoch": 7387} {"train_loss": -28.32169532775879, "global_step": 613174, "epoch": 7387} {"train_loss": -28.6376953125, "global_step": 613175, "epoch": 7387} {"train_loss": -28.2586727142334, "global_step": 613176, "epoch": 7387} {"train_loss": -28.515018463134766, "global_step": 613177, "epoch": 7387} {"train_loss": -28.043167114257812, "global_step": 613178, "epoch": 7387} {"train_loss": -28.25721549987793, "global_step": 613179, "epoch": 7387} {"train_loss": -28.02302360534668, "global_step": 613180, "epoch": 7387} {"train_loss": -27.628814697265625, "global_step": 613181, "epoch": 7387} {"train_loss": -27.216039657592773, "global_step": 613182, "epoch": 7387} {"train_loss": -26.784086227416992, "global_step": 613183, "epoch": 7387} {"train_loss": -27.160852432250977, "global_step": 613184, "epoch": 7387} {"train_loss": -27.700448989868164, "global_step": 613185, "epoch": 7387} {"train_loss": -27.692890167236328, "global_step": 613186, "epoch": 7387} {"train_loss": -27.92698097229004, "global_step": 613187, "epoch": 7387} {"train_loss": -27.9938907623291, "global_step": 613188, "epoch": 7387} {"train_loss": -27.72086524963379, "global_step": 613189, "epoch": 7387} {"train_loss": -28.277658462524414, "global_step": 613190, "epoch": 7387} {"train_loss": -28.267988204956055, "global_step": 613191, "epoch": 7387} {"train_loss": -27.660032272338867, "global_step": 613192, "epoch": 7387} {"train_loss": -27.901599884033203, "global_step": 613193, "epoch": 7387} {"train_loss": -28.002338409423828, "global_step": 613194, "epoch": 7387} {"train_loss": -27.742666244506836, "global_step": 613195, "epoch": 7387} {"train_loss": -28.269094467163086, "global_step": 613196, "epoch": 7387} {"train_loss": -27.7291259765625, "global_step": 613197, "epoch": 7387} {"train_loss": -27.7008056640625, "global_step": 613198, "epoch": 7387} {"train_loss": -27.739599227905273, "global_step": 613199, "epoch": 7387} {"train_loss": -27.58424949645996, "global_step": 613200, "epoch": 7387} {"train_loss": -28.194477081298828, "global_step": 613201, "epoch": 7387} {"train_loss": -27.838489532470703, "global_step": 613202, "epoch": 7387} {"train_loss": -27.875832730029003, "global_step": 613203, "epoch": 7387, "val_loss": 6569469.0} {"train_loss": -26.962390899658203, "global_step": 613204, "epoch": 7388} {"train_loss": -27.114643096923828, "global_step": 613205, "epoch": 7388} {"train_loss": -27.548810958862305, "global_step": 613206, "epoch": 7388} {"train_loss": -27.330671310424805, "global_step": 613207, "epoch": 7388} {"train_loss": -27.042591094970703, "global_step": 613208, "epoch": 7388} {"train_loss": -27.438888549804688, "global_step": 613209, "epoch": 7388} {"train_loss": -27.303466796875, "global_step": 613210, "epoch": 7388} {"train_loss": -27.063751220703125, "global_step": 613211, "epoch": 7388} {"train_loss": -27.46295166015625, "global_step": 613212, "epoch": 7388} {"train_loss": -27.209115982055664, "global_step": 613213, "epoch": 7388} {"train_loss": -27.55071449279785, "global_step": 613214, "epoch": 7388} {"train_loss": -27.455724716186523, "global_step": 613215, "epoch": 7388} {"train_loss": -27.845914840698242, "global_step": 613216, "epoch": 7388} {"train_loss": -27.7805118560791, "global_step": 613217, "epoch": 7388} {"train_loss": -27.840829849243164, "global_step": 613218, "epoch": 7388} {"train_loss": -27.95895767211914, "global_step": 613219, "epoch": 7388} {"train_loss": -27.552051544189453, "global_step": 613220, "epoch": 7388} {"train_loss": -27.7323055267334, "global_step": 613221, "epoch": 7388} {"train_loss": -28.1611270904541, "global_step": 613222, "epoch": 7388} {"train_loss": -27.74005126953125, "global_step": 613223, "epoch": 7388} {"train_loss": -27.923948287963867, "global_step": 613224, "epoch": 7388} {"train_loss": -28.04296875, "global_step": 613225, "epoch": 7388} {"train_loss": -28.188037872314453, "global_step": 613226, "epoch": 7388} {"train_loss": -27.941864013671875, "global_step": 613227, "epoch": 7388} {"train_loss": -27.813669204711914, "global_step": 613228, "epoch": 7388} {"train_loss": -27.8666934967041, "global_step": 613229, "epoch": 7388} {"train_loss": -28.267059326171875, "global_step": 613230, "epoch": 7388} {"train_loss": -28.006881713867188, "global_step": 613231, "epoch": 7388} {"train_loss": -28.04790687561035, "global_step": 613232, "epoch": 7388} {"train_loss": -27.91131019592285, "global_step": 613233, "epoch": 7388} {"train_loss": -28.04453468322754, "global_step": 613234, "epoch": 7388} {"train_loss": -28.30380630493164, "global_step": 613235, "epoch": 7388} {"train_loss": -28.289112091064453, "global_step": 613236, "epoch": 7388} {"train_loss": -27.822473526000977, "global_step": 613237, "epoch": 7388} {"train_loss": -28.6348819732666, "global_step": 613238, "epoch": 7388} {"train_loss": -28.170251846313477, "global_step": 613239, "epoch": 7388} {"train_loss": -28.459943771362305, "global_step": 613240, "epoch": 7388} {"train_loss": -28.163650512695312, "global_step": 613241, "epoch": 7388} {"train_loss": -28.234643936157227, "global_step": 613242, "epoch": 7388} {"train_loss": -28.163740158081055, "global_step": 613243, "epoch": 7388} {"train_loss": -28.343082427978516, "global_step": 613244, "epoch": 7388} {"train_loss": -28.133310317993164, "global_step": 613245, "epoch": 7388} {"train_loss": -28.14996910095215, "global_step": 613246, "epoch": 7388} {"train_loss": -27.851266860961914, "global_step": 613247, "epoch": 7388} {"train_loss": -28.28018569946289, "global_step": 613248, "epoch": 7388} {"train_loss": -28.12265396118164, "global_step": 613249, "epoch": 7388} {"train_loss": -27.871246337890625, "global_step": 613250, "epoch": 7388} {"train_loss": -28.1976318359375, "global_step": 613251, "epoch": 7388} {"train_loss": -27.964365005493164, "global_step": 613252, "epoch": 7388} {"train_loss": -28.41827964782715, "global_step": 613253, "epoch": 7388} {"train_loss": -28.1717529296875, "global_step": 613254, "epoch": 7388} {"train_loss": -28.131988525390625, "global_step": 613255, "epoch": 7388} {"train_loss": -28.239404678344727, "global_step": 613256, "epoch": 7388} {"train_loss": -28.518970489501953, "global_step": 613257, "epoch": 7388} {"train_loss": -28.680633544921875, "global_step": 613258, "epoch": 7388} {"train_loss": -28.343067169189453, "global_step": 613259, "epoch": 7388} {"train_loss": -28.445486068725586, "global_step": 613260, "epoch": 7388} {"train_loss": -28.46613883972168, "global_step": 613261, "epoch": 7388} {"train_loss": -28.597949981689453, "global_step": 613262, "epoch": 7388} {"train_loss": -28.100330352783203, "global_step": 613263, "epoch": 7388} {"train_loss": -28.683929443359375, "global_step": 613264, "epoch": 7388} {"train_loss": -28.095190048217773, "global_step": 613265, "epoch": 7388} {"train_loss": -28.343753814697266, "global_step": 613266, "epoch": 7388} {"train_loss": -28.31142234802246, "global_step": 613267, "epoch": 7388} {"train_loss": -27.783063888549805, "global_step": 613268, "epoch": 7388} {"train_loss": -28.50042152404785, "global_step": 613269, "epoch": 7388} {"train_loss": -27.861967086791992, "global_step": 613270, "epoch": 7388} {"train_loss": -28.08680534362793, "global_step": 613271, "epoch": 7388} {"train_loss": -28.322961807250977, "global_step": 613272, "epoch": 7388} {"train_loss": -28.097671508789062, "global_step": 613273, "epoch": 7388} {"train_loss": -27.896459579467773, "global_step": 613274, "epoch": 7388} {"train_loss": -27.99505615234375, "global_step": 613275, "epoch": 7388} {"train_loss": -27.81907081604004, "global_step": 613276, "epoch": 7388} {"train_loss": -27.676427841186523, "global_step": 613277, "epoch": 7388} {"train_loss": -27.99822425842285, "global_step": 613278, "epoch": 7388} {"train_loss": -28.09819984436035, "global_step": 613279, "epoch": 7388} {"train_loss": -27.559106826782227, "global_step": 613280, "epoch": 7388} {"train_loss": -27.906518936157227, "global_step": 613281, "epoch": 7388} {"train_loss": -28.32256507873535, "global_step": 613282, "epoch": 7388} {"train_loss": -27.808948516845703, "global_step": 613283, "epoch": 7388} {"train_loss": -28.216827392578125, "global_step": 613284, "epoch": 7388} {"train_loss": -27.735279083251953, "global_step": 613285, "epoch": 7388} {"train_loss": -27.986925653664464, "global_step": 613286, "epoch": 7388, "val_loss": 6688853.5} {"train_loss": -23.62312126159668, "global_step": 613287, "epoch": 7389} {"train_loss": -20.84461784362793, "global_step": 613288, "epoch": 7389} {"train_loss": -26.193897247314453, "global_step": 613289, "epoch": 7389} {"train_loss": -24.88163185119629, "global_step": 613290, "epoch": 7389} {"train_loss": -26.21906089782715, "global_step": 613291, "epoch": 7389} {"train_loss": -25.776611328125, "global_step": 613292, "epoch": 7389} {"train_loss": -26.42854881286621, "global_step": 613293, "epoch": 7389} {"train_loss": -26.4348087310791, "global_step": 613294, "epoch": 7389} {"train_loss": -26.982303619384766, "global_step": 613295, "epoch": 7389} {"train_loss": -26.9658203125, "global_step": 613296, "epoch": 7389} {"train_loss": -26.75404167175293, "global_step": 613297, "epoch": 7389} {"train_loss": -27.05828857421875, "global_step": 613298, "epoch": 7389} {"train_loss": -27.046247482299805, "global_step": 613299, "epoch": 7389} {"train_loss": -26.581867218017578, "global_step": 613300, "epoch": 7389} {"train_loss": -27.28607177734375, "global_step": 613301, "epoch": 7389} {"train_loss": -27.2458553314209, "global_step": 613302, "epoch": 7389} {"train_loss": -27.431421279907227, "global_step": 613303, "epoch": 7389} {"train_loss": -27.096433639526367, "global_step": 613304, "epoch": 7389} {"train_loss": -27.456830978393555, "global_step": 613305, "epoch": 7389} {"train_loss": -27.611249923706055, "global_step": 613306, "epoch": 7389} {"train_loss": -27.4180850982666, "global_step": 613307, "epoch": 7389} {"train_loss": -27.349002838134766, "global_step": 613308, "epoch": 7389} {"train_loss": -27.723220825195312, "global_step": 613309, "epoch": 7389} {"train_loss": -27.343246459960938, "global_step": 613310, "epoch": 7389} {"train_loss": -27.54718017578125, "global_step": 613311, "epoch": 7389} {"train_loss": -27.48967933654785, "global_step": 613312, "epoch": 7389} {"train_loss": -27.63741111755371, "global_step": 613313, "epoch": 7389} {"train_loss": -27.625446319580078, "global_step": 613314, "epoch": 7389} {"train_loss": -27.37830924987793, "global_step": 613315, "epoch": 7389} {"train_loss": -27.61768913269043, "global_step": 613316, "epoch": 7389} {"train_loss": -27.487598419189453, "global_step": 613317, "epoch": 7389} {"train_loss": -27.957183837890625, "global_step": 613318, "epoch": 7389} {"train_loss": -27.645401000976562, "global_step": 613319, "epoch": 7389} {"train_loss": -27.449644088745117, "global_step": 613320, "epoch": 7389} {"train_loss": -27.89765739440918, "global_step": 613321, "epoch": 7389} {"train_loss": -27.4503231048584, "global_step": 613322, "epoch": 7389} {"train_loss": -27.667327880859375, "global_step": 613323, "epoch": 7389} {"train_loss": -27.236896514892578, "global_step": 613324, "epoch": 7389} {"train_loss": -27.7759952545166, "global_step": 613325, "epoch": 7389} {"train_loss": -27.79933738708496, "global_step": 613326, "epoch": 7389} {"train_loss": -27.639362335205078, "global_step": 613327, "epoch": 7389} {"train_loss": -28.085275650024414, "global_step": 613328, "epoch": 7389} {"train_loss": -28.04974937438965, "global_step": 613329, "epoch": 7389} {"train_loss": -27.92030143737793, "global_step": 613330, "epoch": 7389} {"train_loss": -27.728134155273438, "global_step": 613331, "epoch": 7389} {"train_loss": -27.844449996948242, "global_step": 613332, "epoch": 7389} {"train_loss": -28.029428482055664, "global_step": 613333, "epoch": 7389} {"train_loss": -27.878366470336914, "global_step": 613334, "epoch": 7389} {"train_loss": -28.091352462768555, "global_step": 613335, "epoch": 7389} {"train_loss": -28.1611328125, "global_step": 613336, "epoch": 7389} {"train_loss": -27.815582275390625, "global_step": 613337, "epoch": 7389} {"train_loss": -27.94952392578125, "global_step": 613338, "epoch": 7389} {"train_loss": -27.966291427612305, "global_step": 613339, "epoch": 7389} {"train_loss": -28.123218536376953, "global_step": 613340, "epoch": 7389} {"train_loss": -28.5351619720459, "global_step": 613341, "epoch": 7389} {"train_loss": -28.082672119140625, "global_step": 613342, "epoch": 7389} {"train_loss": -28.143518447875977, "global_step": 613343, "epoch": 7389} {"train_loss": -28.606689453125, "global_step": 613344, "epoch": 7389} {"train_loss": -28.35688591003418, "global_step": 613345, "epoch": 7389} {"train_loss": -27.62080192565918, "global_step": 613346, "epoch": 7389} {"train_loss": -28.308856964111328, "global_step": 613347, "epoch": 7389} {"train_loss": -27.9475154876709, "global_step": 613348, "epoch": 7389} {"train_loss": -28.43125343322754, "global_step": 613349, "epoch": 7389} {"train_loss": -28.09406852722168, "global_step": 613350, "epoch": 7389} {"train_loss": -28.49041748046875, "global_step": 613351, "epoch": 7389} {"train_loss": -28.392078399658203, "global_step": 613352, "epoch": 7389} {"train_loss": -28.57904052734375, "global_step": 613353, "epoch": 7389} {"train_loss": -28.142871856689453, "global_step": 613354, "epoch": 7389} {"train_loss": -28.282087326049805, "global_step": 613355, "epoch": 7389} {"train_loss": -28.479719161987305, "global_step": 613356, "epoch": 7389} {"train_loss": -28.035327911376953, "global_step": 613357, "epoch": 7389} {"train_loss": -27.854969024658203, "global_step": 613358, "epoch": 7389} {"train_loss": -27.84320068359375, "global_step": 613359, "epoch": 7389} {"train_loss": -27.779006958007812, "global_step": 613360, "epoch": 7389} {"train_loss": -27.94757652282715, "global_step": 613361, "epoch": 7389} {"train_loss": -27.902395248413086, "global_step": 613362, "epoch": 7389} {"train_loss": -27.772296905517578, "global_step": 613363, "epoch": 7389} {"train_loss": -27.98931312561035, "global_step": 613364, "epoch": 7389} {"train_loss": -27.924680709838867, "global_step": 613365, "epoch": 7389} {"train_loss": -27.718088150024414, "global_step": 613366, "epoch": 7389} {"train_loss": -27.88978385925293, "global_step": 613367, "epoch": 7389} {"train_loss": -27.844202041625977, "global_step": 613368, "epoch": 7389} {"train_loss": -27.495672892375165, "global_step": 613369, "epoch": 7389, "val_loss": 6771132.0} {"train_loss": -27.23090171813965, "global_step": 613370, "epoch": 7390} {"train_loss": -26.725229263305664, "global_step": 613371, "epoch": 7390} {"train_loss": -26.770910263061523, "global_step": 613372, "epoch": 7390} {"train_loss": -26.930959701538086, "global_step": 613373, "epoch": 7390} {"train_loss": -26.364124298095703, "global_step": 613374, "epoch": 7390} {"train_loss": -27.487680435180664, "global_step": 613375, "epoch": 7390} {"train_loss": -27.02998924255371, "global_step": 613376, "epoch": 7390} {"train_loss": -27.2362003326416, "global_step": 613377, "epoch": 7390} {"train_loss": -26.958242416381836, "global_step": 613378, "epoch": 7390} {"train_loss": -27.140247344970703, "global_step": 613379, "epoch": 7390} {"train_loss": -27.280017852783203, "global_step": 613380, "epoch": 7390} {"train_loss": -27.219776153564453, "global_step": 613381, "epoch": 7390} {"train_loss": -27.52789306640625, "global_step": 613382, "epoch": 7390} {"train_loss": -27.160400390625, "global_step": 613383, "epoch": 7390} {"train_loss": -27.320188522338867, "global_step": 613384, "epoch": 7390} {"train_loss": -27.233951568603516, "global_step": 613385, "epoch": 7390} {"train_loss": -27.612340927124023, "global_step": 613386, "epoch": 7390} {"train_loss": -27.760650634765625, "global_step": 613387, "epoch": 7390} {"train_loss": -27.561786651611328, "global_step": 613388, "epoch": 7390} {"train_loss": -27.29609489440918, "global_step": 613389, "epoch": 7390} {"train_loss": -27.541385650634766, "global_step": 613390, "epoch": 7390} {"train_loss": -27.628934860229492, "global_step": 613391, "epoch": 7390} {"train_loss": -27.5985107421875, "global_step": 613392, "epoch": 7390} {"train_loss": -27.551050186157227, "global_step": 613393, "epoch": 7390} {"train_loss": -27.86331558227539, "global_step": 613394, "epoch": 7390} {"train_loss": -28.005741119384766, "global_step": 613395, "epoch": 7390} {"train_loss": -28.136335372924805, "global_step": 613396, "epoch": 7390} {"train_loss": -27.97052574157715, "global_step": 613397, "epoch": 7390} {"train_loss": -28.09832191467285, "global_step": 613398, "epoch": 7390} {"train_loss": -28.14069175720215, "global_step": 613399, "epoch": 7390} {"train_loss": -27.691991806030273, "global_step": 613400, "epoch": 7390} {"train_loss": -27.883649826049805, "global_step": 613401, "epoch": 7390} {"train_loss": -27.966739654541016, "global_step": 613402, "epoch": 7390} {"train_loss": -28.51685905456543, "global_step": 613403, "epoch": 7390} {"train_loss": -28.03156089782715, "global_step": 613404, "epoch": 7390} {"train_loss": -27.987497329711914, "global_step": 613405, "epoch": 7390} {"train_loss": -28.026081085205078, "global_step": 613406, "epoch": 7390} {"train_loss": -28.06504249572754, "global_step": 613407, "epoch": 7390} {"train_loss": -27.783130645751953, "global_step": 613408, "epoch": 7390} {"train_loss": -28.196836471557617, "global_step": 613409, "epoch": 7390} {"train_loss": -28.44886589050293, "global_step": 613410, "epoch": 7390} {"train_loss": -28.30828285217285, "global_step": 613411, "epoch": 7390} {"train_loss": -28.107757568359375, "global_step": 613412, "epoch": 7390} {"train_loss": -28.39705467224121, "global_step": 613413, "epoch": 7390} {"train_loss": -28.064483642578125, "global_step": 613414, "epoch": 7390} {"train_loss": -28.19965934753418, "global_step": 613415, "epoch": 7390} {"train_loss": -28.38347816467285, "global_step": 613416, "epoch": 7390} {"train_loss": -28.181396484375, "global_step": 613417, "epoch": 7390} {"train_loss": -28.14398765563965, "global_step": 613418, "epoch": 7390} {"train_loss": -28.103940963745117, "global_step": 613419, "epoch": 7390} {"train_loss": -28.59515380859375, "global_step": 613420, "epoch": 7390} {"train_loss": -28.348957061767578, "global_step": 613421, "epoch": 7390} {"train_loss": -28.238636016845703, "global_step": 613422, "epoch": 7390} {"train_loss": -28.365583419799805, "global_step": 613423, "epoch": 7390} {"train_loss": -28.462331771850586, "global_step": 613424, "epoch": 7390} {"train_loss": -28.346088409423828, "global_step": 613425, "epoch": 7390} {"train_loss": -28.576642990112305, "global_step": 613426, "epoch": 7390} {"train_loss": -28.692047119140625, "global_step": 613427, "epoch": 7390} {"train_loss": -28.610666275024414, "global_step": 613428, "epoch": 7390} {"train_loss": -28.094823837280273, "global_step": 613429, "epoch": 7390} {"train_loss": -28.176651000976562, "global_step": 613430, "epoch": 7390} {"train_loss": -28.110437393188477, "global_step": 613431, "epoch": 7390} {"train_loss": -28.641687393188477, "global_step": 613432, "epoch": 7390} {"train_loss": -28.3169002532959, "global_step": 613433, "epoch": 7390} {"train_loss": -28.375288009643555, "global_step": 613434, "epoch": 7390} {"train_loss": -28.897705078125, "global_step": 613435, "epoch": 7390} {"train_loss": -28.394079208374023, "global_step": 613436, "epoch": 7390} {"train_loss": -27.912153244018555, "global_step": 613437, "epoch": 7390} {"train_loss": -27.855426788330078, "global_step": 613438, "epoch": 7390} {"train_loss": -28.19733238220215, "global_step": 613439, "epoch": 7390} {"train_loss": -28.282001495361328, "global_step": 613440, "epoch": 7390} {"train_loss": -28.217992782592773, "global_step": 613441, "epoch": 7390} {"train_loss": -28.035409927368164, "global_step": 613442, "epoch": 7390} {"train_loss": -28.0579833984375, "global_step": 613443, "epoch": 7390} {"train_loss": -28.339874267578125, "global_step": 613444, "epoch": 7390} {"train_loss": -28.201251983642578, "global_step": 613445, "epoch": 7390} {"train_loss": -28.273950576782227, "global_step": 613446, "epoch": 7390} {"train_loss": -28.119775772094727, "global_step": 613447, "epoch": 7390} {"train_loss": -28.256887435913086, "global_step": 613448, "epoch": 7390} {"train_loss": -28.17964744567871, "global_step": 613449, "epoch": 7390} {"train_loss": -27.96759033203125, "global_step": 613450, "epoch": 7390} {"train_loss": -28.62397575378418, "global_step": 613451, "epoch": 7390} {"train_loss": -27.940376925181194, "global_step": 613452, "epoch": 7390, "val_loss": 6597896.0} {"train_loss": -28.031818389892578, "global_step": 613453, "epoch": 7391} {"train_loss": -27.745941162109375, "global_step": 613454, "epoch": 7391} {"train_loss": -27.799283981323242, "global_step": 613455, "epoch": 7391} {"train_loss": -28.008169174194336, "global_step": 613456, "epoch": 7391} {"train_loss": -27.93665885925293, "global_step": 613457, "epoch": 7391} {"train_loss": -27.506122589111328, "global_step": 613458, "epoch": 7391} {"train_loss": -27.924213409423828, "global_step": 613459, "epoch": 7391} {"train_loss": -28.145416259765625, "global_step": 613460, "epoch": 7391} {"train_loss": -27.898035049438477, "global_step": 613461, "epoch": 7391} {"train_loss": -27.98333168029785, "global_step": 613462, "epoch": 7391} {"train_loss": -27.9130802154541, "global_step": 613463, "epoch": 7391} {"train_loss": -27.813949584960938, "global_step": 613464, "epoch": 7391} {"train_loss": -27.837451934814453, "global_step": 613465, "epoch": 7391} {"train_loss": -27.930028915405273, "global_step": 613466, "epoch": 7391} {"train_loss": -27.89894676208496, "global_step": 613467, "epoch": 7391} {"train_loss": -27.7557373046875, "global_step": 613468, "epoch": 7391} {"train_loss": -27.881610870361328, "global_step": 613469, "epoch": 7391} {"train_loss": -27.832380294799805, "global_step": 613470, "epoch": 7391} {"train_loss": -28.103124618530273, "global_step": 613471, "epoch": 7391} {"train_loss": -27.758914947509766, "global_step": 613472, "epoch": 7391} {"train_loss": -28.153966903686523, "global_step": 613473, "epoch": 7391} {"train_loss": -27.74224281311035, "global_step": 613474, "epoch": 7391} {"train_loss": -28.009389877319336, "global_step": 613475, "epoch": 7391} {"train_loss": -27.943012237548828, "global_step": 613476, "epoch": 7391} {"train_loss": -28.071847915649414, "global_step": 613477, "epoch": 7391} {"train_loss": -28.032867431640625, "global_step": 613478, "epoch": 7391} {"train_loss": -27.93562126159668, "global_step": 613479, "epoch": 7391} {"train_loss": -28.2864933013916, "global_step": 613480, "epoch": 7391} {"train_loss": -28.422842025756836, "global_step": 613481, "epoch": 7391} {"train_loss": -28.021198272705078, "global_step": 613482, "epoch": 7391} {"train_loss": -28.120737075805664, "global_step": 613483, "epoch": 7391} {"train_loss": -27.541608810424805, "global_step": 613484, "epoch": 7391} {"train_loss": -28.535547256469727, "global_step": 613485, "epoch": 7391} {"train_loss": -27.70338249206543, "global_step": 613486, "epoch": 7391} {"train_loss": -28.14618492126465, "global_step": 613487, "epoch": 7391} {"train_loss": -27.925596237182617, "global_step": 613488, "epoch": 7391} {"train_loss": -28.334152221679688, "global_step": 613489, "epoch": 7391} {"train_loss": -28.11415672302246, "global_step": 613490, "epoch": 7391} {"train_loss": -27.82517433166504, "global_step": 613491, "epoch": 7391} {"train_loss": -28.50613784790039, "global_step": 613492, "epoch": 7391} {"train_loss": -28.474761962890625, "global_step": 613493, "epoch": 7391} {"train_loss": -28.036563873291016, "global_step": 613494, "epoch": 7391} {"train_loss": -28.438703536987305, "global_step": 613495, "epoch": 7391} {"train_loss": -27.895721435546875, "global_step": 613496, "epoch": 7391} {"train_loss": -27.9635009765625, "global_step": 613497, "epoch": 7391} {"train_loss": -28.007909774780273, "global_step": 613498, "epoch": 7391} {"train_loss": -27.65875816345215, "global_step": 613499, "epoch": 7391} {"train_loss": -28.32742691040039, "global_step": 613500, "epoch": 7391} {"train_loss": -27.866647720336914, "global_step": 613501, "epoch": 7391} {"train_loss": -27.669187545776367, "global_step": 613502, "epoch": 7391} {"train_loss": -27.859960556030273, "global_step": 613503, "epoch": 7391} {"train_loss": -28.329273223876953, "global_step": 613504, "epoch": 7391} {"train_loss": -28.0106143951416, "global_step": 613505, "epoch": 7391} {"train_loss": -28.0671329498291, "global_step": 613506, "epoch": 7391} {"train_loss": -28.343664169311523, "global_step": 613507, "epoch": 7391} {"train_loss": -28.19879150390625, "global_step": 613508, "epoch": 7391} {"train_loss": -28.243579864501953, "global_step": 613509, "epoch": 7391} {"train_loss": -28.06110954284668, "global_step": 613510, "epoch": 7391} {"train_loss": -28.23431968688965, "global_step": 613511, "epoch": 7391} {"train_loss": -28.357379913330078, "global_step": 613512, "epoch": 7391} {"train_loss": -28.161176681518555, "global_step": 613513, "epoch": 7391} {"train_loss": -28.275461196899414, "global_step": 613514, "epoch": 7391} {"train_loss": -28.134855270385742, "global_step": 613515, "epoch": 7391} {"train_loss": -28.17998695373535, "global_step": 613516, "epoch": 7391} {"train_loss": -27.939239501953125, "global_step": 613517, "epoch": 7391} {"train_loss": -28.440153121948242, "global_step": 613518, "epoch": 7391} {"train_loss": -28.086095809936523, "global_step": 613519, "epoch": 7391} {"train_loss": -28.279067993164062, "global_step": 613520, "epoch": 7391} {"train_loss": -28.463470458984375, "global_step": 613521, "epoch": 7391} {"train_loss": -28.31903076171875, "global_step": 613522, "epoch": 7391} {"train_loss": -28.262929916381836, "global_step": 613523, "epoch": 7391} {"train_loss": -28.07966423034668, "global_step": 613524, "epoch": 7391} {"train_loss": -28.092147827148438, "global_step": 613525, "epoch": 7391} {"train_loss": -27.880905151367188, "global_step": 613526, "epoch": 7391} {"train_loss": -28.362945556640625, "global_step": 613527, "epoch": 7391} {"train_loss": -28.377140045166016, "global_step": 613528, "epoch": 7391} {"train_loss": -28.34722328186035, "global_step": 613529, "epoch": 7391} {"train_loss": -28.38225746154785, "global_step": 613530, "epoch": 7391} {"train_loss": -28.162824630737305, "global_step": 613531, "epoch": 7391} {"train_loss": -28.321210861206055, "global_step": 613532, "epoch": 7391} {"train_loss": -28.552881240844727, "global_step": 613533, "epoch": 7391} {"train_loss": -28.247711181640625, "global_step": 613534, "epoch": 7391} {"train_loss": -28.09331645735775, "global_step": 613535, "epoch": 7391, "val_loss": 6676196.0} {"train_loss": -27.794727325439453, "global_step": 613536, "epoch": 7392} {"train_loss": -27.786441802978516, "global_step": 613537, "epoch": 7392} {"train_loss": -27.754785537719727, "global_step": 613538, "epoch": 7392} {"train_loss": -27.59018325805664, "global_step": 613539, "epoch": 7392} {"train_loss": -28.206531524658203, "global_step": 613540, "epoch": 7392} {"train_loss": -27.8057804107666, "global_step": 613541, "epoch": 7392} {"train_loss": -27.5613956451416, "global_step": 613542, "epoch": 7392} {"train_loss": -27.4953670501709, "global_step": 613543, "epoch": 7392} {"train_loss": -27.60869789123535, "global_step": 613544, "epoch": 7392} {"train_loss": -27.721811294555664, "global_step": 613545, "epoch": 7392} {"train_loss": -28.0150089263916, "global_step": 613546, "epoch": 7392} {"train_loss": -27.618444442749023, "global_step": 613547, "epoch": 7392} {"train_loss": -28.181135177612305, "global_step": 613548, "epoch": 7392} {"train_loss": -27.887311935424805, "global_step": 613549, "epoch": 7392} {"train_loss": -27.893686294555664, "global_step": 613550, "epoch": 7392} {"train_loss": -27.765775680541992, "global_step": 613551, "epoch": 7392} {"train_loss": -27.689748764038086, "global_step": 613552, "epoch": 7392} {"train_loss": -28.065732955932617, "global_step": 613553, "epoch": 7392} {"train_loss": -27.44158935546875, "global_step": 613554, "epoch": 7392} {"train_loss": -27.74041175842285, "global_step": 613555, "epoch": 7392} {"train_loss": -27.817279815673828, "global_step": 613556, "epoch": 7392} {"train_loss": -28.034326553344727, "global_step": 613557, "epoch": 7392} {"train_loss": -27.871646881103516, "global_step": 613558, "epoch": 7392} {"train_loss": -28.033008575439453, "global_step": 613559, "epoch": 7392} {"train_loss": -28.24110221862793, "global_step": 613560, "epoch": 7392} {"train_loss": -27.594369888305664, "global_step": 613561, "epoch": 7392} {"train_loss": -27.617795944213867, "global_step": 613562, "epoch": 7392} {"train_loss": -27.939664840698242, "global_step": 613563, "epoch": 7392} {"train_loss": -28.019006729125977, "global_step": 613564, "epoch": 7392} {"train_loss": -27.94111442565918, "global_step": 613565, "epoch": 7392} {"train_loss": -28.242237091064453, "global_step": 613566, "epoch": 7392} {"train_loss": -27.99393081665039, "global_step": 613567, "epoch": 7392} {"train_loss": -28.521982192993164, "global_step": 613568, "epoch": 7392} {"train_loss": -28.316650390625, "global_step": 613569, "epoch": 7392} {"train_loss": -28.20269203186035, "global_step": 613570, "epoch": 7392} {"train_loss": -28.32720947265625, "global_step": 613571, "epoch": 7392} {"train_loss": -28.189178466796875, "global_step": 613572, "epoch": 7392} {"train_loss": -28.233722686767578, "global_step": 613573, "epoch": 7392} {"train_loss": -28.10809326171875, "global_step": 613574, "epoch": 7392} {"train_loss": -28.47013282775879, "global_step": 613575, "epoch": 7392} {"train_loss": -28.034793853759766, "global_step": 613576, "epoch": 7392} {"train_loss": -27.987462997436523, "global_step": 613577, "epoch": 7392} {"train_loss": -28.05621910095215, "global_step": 613578, "epoch": 7392} {"train_loss": -28.552173614501953, "global_step": 613579, "epoch": 7392} {"train_loss": -28.5226993560791, "global_step": 613580, "epoch": 7392} {"train_loss": -28.518293380737305, "global_step": 613581, "epoch": 7392} {"train_loss": -28.32513427734375, "global_step": 613582, "epoch": 7392} {"train_loss": -28.056447982788086, "global_step": 613583, "epoch": 7392} {"train_loss": -28.438873291015625, "global_step": 613584, "epoch": 7392} {"train_loss": -28.138025283813477, "global_step": 613585, "epoch": 7392} {"train_loss": -28.5365047454834, "global_step": 613586, "epoch": 7392} {"train_loss": -27.9885196685791, "global_step": 613587, "epoch": 7392} {"train_loss": -28.322839736938477, "global_step": 613588, "epoch": 7392} {"train_loss": -28.2420654296875, "global_step": 613589, "epoch": 7392} {"train_loss": -28.019092559814453, "global_step": 613590, "epoch": 7392} {"train_loss": -28.042509078979492, "global_step": 613591, "epoch": 7392} {"train_loss": -28.510452270507812, "global_step": 613592, "epoch": 7392} {"train_loss": -28.458194732666016, "global_step": 613593, "epoch": 7392} {"train_loss": -28.489187240600586, "global_step": 613594, "epoch": 7392} {"train_loss": -27.944629669189453, "global_step": 613595, "epoch": 7392} {"train_loss": -28.331998825073242, "global_step": 613596, "epoch": 7392} {"train_loss": -28.17537498474121, "global_step": 613597, "epoch": 7392} {"train_loss": -28.496191024780273, "global_step": 613598, "epoch": 7392} {"train_loss": -27.580078125, "global_step": 613599, "epoch": 7392} {"train_loss": -27.945531845092773, "global_step": 613600, "epoch": 7392} {"train_loss": -27.916257858276367, "global_step": 613601, "epoch": 7392} {"train_loss": -27.592248916625977, "global_step": 613602, "epoch": 7392} {"train_loss": -27.75211524963379, "global_step": 613603, "epoch": 7392} {"train_loss": -27.595556259155273, "global_step": 613604, "epoch": 7392} {"train_loss": -27.473392486572266, "global_step": 613605, "epoch": 7392} {"train_loss": -27.63385009765625, "global_step": 613606, "epoch": 7392} {"train_loss": -28.01966667175293, "global_step": 613607, "epoch": 7392} {"train_loss": -27.2705020904541, "global_step": 613608, "epoch": 7392} {"train_loss": -27.686918258666992, "global_step": 613609, "epoch": 7392} {"train_loss": -28.247922897338867, "global_step": 613610, "epoch": 7392} {"train_loss": -27.376081466674805, "global_step": 613611, "epoch": 7392} {"train_loss": -28.21601676940918, "global_step": 613612, "epoch": 7392} {"train_loss": -27.77910804748535, "global_step": 613613, "epoch": 7392} {"train_loss": -28.1767520904541, "global_step": 613614, "epoch": 7392} {"train_loss": -27.92276382446289, "global_step": 613615, "epoch": 7392} {"train_loss": -27.7383975982666, "global_step": 613616, "epoch": 7392} {"train_loss": -27.623498916625977, "global_step": 613617, "epoch": 7392} {"train_loss": -27.996591292231916, "global_step": 613618, "epoch": 7392, "val_loss": 6698679.0} {"train_loss": -26.56719398498535, "global_step": 613619, "epoch": 7393} {"train_loss": -25.855924606323242, "global_step": 613620, "epoch": 7393} {"train_loss": -26.934247970581055, "global_step": 613621, "epoch": 7393} {"train_loss": -26.536619186401367, "global_step": 613622, "epoch": 7393} {"train_loss": -26.847232818603516, "global_step": 613623, "epoch": 7393} {"train_loss": -27.259775161743164, "global_step": 613624, "epoch": 7393} {"train_loss": -26.898462295532227, "global_step": 613625, "epoch": 7393} {"train_loss": -27.238983154296875, "global_step": 613626, "epoch": 7393} {"train_loss": -27.221038818359375, "global_step": 613627, "epoch": 7393} {"train_loss": -27.316375732421875, "global_step": 613628, "epoch": 7393} {"train_loss": -26.967313766479492, "global_step": 613629, "epoch": 7393} {"train_loss": -27.424640655517578, "global_step": 613630, "epoch": 7393} {"train_loss": -27.05329704284668, "global_step": 613631, "epoch": 7393} {"train_loss": -27.010589599609375, "global_step": 613632, "epoch": 7393} {"train_loss": -27.453413009643555, "global_step": 613633, "epoch": 7393} {"train_loss": -27.541584014892578, "global_step": 613634, "epoch": 7393} {"train_loss": -27.368009567260742, "global_step": 613635, "epoch": 7393} {"train_loss": -27.52447509765625, "global_step": 613636, "epoch": 7393} {"train_loss": -27.257659912109375, "global_step": 613637, "epoch": 7393} {"train_loss": -27.503416061401367, "global_step": 613638, "epoch": 7393} {"train_loss": -27.25843620300293, "global_step": 613639, "epoch": 7393} {"train_loss": -27.859149932861328, "global_step": 613640, "epoch": 7393} {"train_loss": -27.80029296875, "global_step": 613641, "epoch": 7393} {"train_loss": -27.835920333862305, "global_step": 613642, "epoch": 7393} {"train_loss": -27.423114776611328, "global_step": 613643, "epoch": 7393} {"train_loss": -27.59718894958496, "global_step": 613644, "epoch": 7393} {"train_loss": -27.742563247680664, "global_step": 613645, "epoch": 7393} {"train_loss": -27.795703887939453, "global_step": 613646, "epoch": 7393} {"train_loss": -27.801776885986328, "global_step": 613647, "epoch": 7393} {"train_loss": -27.795719146728516, "global_step": 613648, "epoch": 7393} {"train_loss": -27.54534339904785, "global_step": 613649, "epoch": 7393} {"train_loss": -27.796920776367188, "global_step": 613650, "epoch": 7393} {"train_loss": -28.098541259765625, "global_step": 613651, "epoch": 7393} {"train_loss": -28.09869384765625, "global_step": 613652, "epoch": 7393} {"train_loss": -27.7586669921875, "global_step": 613653, "epoch": 7393} {"train_loss": -28.10096549987793, "global_step": 613654, "epoch": 7393} {"train_loss": -27.991437911987305, "global_step": 613655, "epoch": 7393} {"train_loss": -27.646137237548828, "global_step": 613656, "epoch": 7393} {"train_loss": -27.842382431030273, "global_step": 613657, "epoch": 7393} {"train_loss": -28.024038314819336, "global_step": 613658, "epoch": 7393} {"train_loss": -28.18816566467285, "global_step": 613659, "epoch": 7393} {"train_loss": -28.007553100585938, "global_step": 613660, "epoch": 7393} {"train_loss": -28.29392433166504, "global_step": 613661, "epoch": 7393} {"train_loss": -28.146955490112305, "global_step": 613662, "epoch": 7393} {"train_loss": -28.261367797851562, "global_step": 613663, "epoch": 7393} {"train_loss": -27.679656982421875, "global_step": 613664, "epoch": 7393} {"train_loss": -27.99115562438965, "global_step": 613665, "epoch": 7393} {"train_loss": -28.024311065673828, "global_step": 613666, "epoch": 7393} {"train_loss": -27.928775787353516, "global_step": 613667, "epoch": 7393} {"train_loss": -28.3084774017334, "global_step": 613668, "epoch": 7393} {"train_loss": -28.07649040222168, "global_step": 613669, "epoch": 7393} {"train_loss": -27.817249298095703, "global_step": 613670, "epoch": 7393} {"train_loss": -28.404266357421875, "global_step": 613671, "epoch": 7393} {"train_loss": -28.271615982055664, "global_step": 613672, "epoch": 7393} {"train_loss": -28.141504287719727, "global_step": 613673, "epoch": 7393} {"train_loss": -28.361928939819336, "global_step": 613674, "epoch": 7393} {"train_loss": -28.07613182067871, "global_step": 613675, "epoch": 7393} {"train_loss": -28.058202743530273, "global_step": 613676, "epoch": 7393} {"train_loss": -28.296005249023438, "global_step": 613677, "epoch": 7393} {"train_loss": -28.00958251953125, "global_step": 613678, "epoch": 7393} {"train_loss": -27.941442489624023, "global_step": 613679, "epoch": 7393} {"train_loss": -28.00861930847168, "global_step": 613680, "epoch": 7393} {"train_loss": -28.400121688842773, "global_step": 613681, "epoch": 7393} {"train_loss": -28.297332763671875, "global_step": 613682, "epoch": 7393} {"train_loss": -28.207258224487305, "global_step": 613683, "epoch": 7393} {"train_loss": -27.9810791015625, "global_step": 613684, "epoch": 7393} {"train_loss": -28.54359245300293, "global_step": 613685, "epoch": 7393} {"train_loss": -27.7565975189209, "global_step": 613686, "epoch": 7393} {"train_loss": -28.044729232788086, "global_step": 613687, "epoch": 7393} {"train_loss": -28.68033218383789, "global_step": 613688, "epoch": 7393} {"train_loss": -28.325244903564453, "global_step": 613689, "epoch": 7393} {"train_loss": -28.60308837890625, "global_step": 613690, "epoch": 7393} {"train_loss": -27.94964027404785, "global_step": 613691, "epoch": 7393} {"train_loss": -28.13959312438965, "global_step": 613692, "epoch": 7393} {"train_loss": -28.41845703125, "global_step": 613693, "epoch": 7393} {"train_loss": -28.254873275756836, "global_step": 613694, "epoch": 7393} {"train_loss": -28.17264175415039, "global_step": 613695, "epoch": 7393} {"train_loss": -28.059616088867188, "global_step": 613696, "epoch": 7393} {"train_loss": -28.3992862701416, "global_step": 613697, "epoch": 7393} {"train_loss": -28.615116119384766, "global_step": 613698, "epoch": 7393} {"train_loss": -28.44388198852539, "global_step": 613699, "epoch": 7393} {"train_loss": -28.378820419311523, "global_step": 613700, "epoch": 7393} {"train_loss": -27.85555977419198, "global_step": 613701, "epoch": 7393, "val_loss": 6663813.0} {"train_loss": -27.223041534423828, "global_step": 613702, "epoch": 7394} {"train_loss": -27.13431739807129, "global_step": 613703, "epoch": 7394} {"train_loss": -26.9041690826416, "global_step": 613704, "epoch": 7394} {"train_loss": -26.73798942565918, "global_step": 613705, "epoch": 7394} {"train_loss": -27.535322189331055, "global_step": 613706, "epoch": 7394} {"train_loss": -27.512006759643555, "global_step": 613707, "epoch": 7394} {"train_loss": -27.930744171142578, "global_step": 613708, "epoch": 7394} {"train_loss": -27.3648738861084, "global_step": 613709, "epoch": 7394} {"train_loss": -28.117456436157227, "global_step": 613710, "epoch": 7394} {"train_loss": -27.230487823486328, "global_step": 613711, "epoch": 7394} {"train_loss": -27.891239166259766, "global_step": 613712, "epoch": 7394} {"train_loss": -27.353443145751953, "global_step": 613713, "epoch": 7394} {"train_loss": -27.706653594970703, "global_step": 613714, "epoch": 7394} {"train_loss": -27.521833419799805, "global_step": 613715, "epoch": 7394} {"train_loss": -27.557235717773438, "global_step": 613716, "epoch": 7394} {"train_loss": -27.67691421508789, "global_step": 613717, "epoch": 7394} {"train_loss": -27.789417266845703, "global_step": 613718, "epoch": 7394} {"train_loss": -27.521337509155273, "global_step": 613719, "epoch": 7394} {"train_loss": -27.71600341796875, "global_step": 613720, "epoch": 7394} {"train_loss": -27.708276748657227, "global_step": 613721, "epoch": 7394} {"train_loss": -27.701902389526367, "global_step": 613722, "epoch": 7394} {"train_loss": -28.091161727905273, "global_step": 613723, "epoch": 7394} {"train_loss": -27.801471710205078, "global_step": 613724, "epoch": 7394} {"train_loss": -27.7161808013916, "global_step": 613725, "epoch": 7394} {"train_loss": -28.081228256225586, "global_step": 613726, "epoch": 7394} {"train_loss": -27.618627548217773, "global_step": 613727, "epoch": 7394} {"train_loss": -27.868762969970703, "global_step": 613728, "epoch": 7394} {"train_loss": -28.07185935974121, "global_step": 613729, "epoch": 7394} {"train_loss": -27.963544845581055, "global_step": 613730, "epoch": 7394} {"train_loss": -28.338443756103516, "global_step": 613731, "epoch": 7394} {"train_loss": -28.092288970947266, "global_step": 613732, "epoch": 7394} {"train_loss": -27.79804039001465, "global_step": 613733, "epoch": 7394} {"train_loss": -27.75074577331543, "global_step": 613734, "epoch": 7394} {"train_loss": -28.27992057800293, "global_step": 613735, "epoch": 7394} {"train_loss": -27.66739845275879, "global_step": 613736, "epoch": 7394} {"train_loss": -28.140079498291016, "global_step": 613737, "epoch": 7394} {"train_loss": -28.148895263671875, "global_step": 613738, "epoch": 7394} {"train_loss": -28.076343536376953, "global_step": 613739, "epoch": 7394} {"train_loss": -27.8338565826416, "global_step": 613740, "epoch": 7394} {"train_loss": -28.521642684936523, "global_step": 613741, "epoch": 7394} {"train_loss": -28.000524520874023, "global_step": 613742, "epoch": 7394} {"train_loss": -28.3767147064209, "global_step": 613743, "epoch": 7394} {"train_loss": -28.4390926361084, "global_step": 613744, "epoch": 7394} {"train_loss": -28.03460121154785, "global_step": 613745, "epoch": 7394} {"train_loss": -28.440641403198242, "global_step": 613746, "epoch": 7394} {"train_loss": -28.495101928710938, "global_step": 613747, "epoch": 7394} {"train_loss": -28.17838478088379, "global_step": 613748, "epoch": 7394} {"train_loss": -28.212661743164062, "global_step": 613749, "epoch": 7394} {"train_loss": -28.52436637878418, "global_step": 613750, "epoch": 7394} {"train_loss": -28.276493072509766, "global_step": 613751, "epoch": 7394} {"train_loss": -28.462265014648438, "global_step": 613752, "epoch": 7394} {"train_loss": -28.065454483032227, "global_step": 613753, "epoch": 7394} {"train_loss": -28.028675079345703, "global_step": 613754, "epoch": 7394} {"train_loss": -28.445463180541992, "global_step": 613755, "epoch": 7394} {"train_loss": -28.549707412719727, "global_step": 613756, "epoch": 7394} {"train_loss": -28.590497970581055, "global_step": 613757, "epoch": 7394} {"train_loss": -28.349884033203125, "global_step": 613758, "epoch": 7394} {"train_loss": -28.35053825378418, "global_step": 613759, "epoch": 7394} {"train_loss": -28.36030387878418, "global_step": 613760, "epoch": 7394} {"train_loss": -28.397260665893555, "global_step": 613761, "epoch": 7394} {"train_loss": -28.467254638671875, "global_step": 613762, "epoch": 7394} {"train_loss": -28.398874282836914, "global_step": 613763, "epoch": 7394} {"train_loss": -28.18976402282715, "global_step": 613764, "epoch": 7394} {"train_loss": -27.50568962097168, "global_step": 613765, "epoch": 7394} {"train_loss": -27.71821403503418, "global_step": 613766, "epoch": 7394} {"train_loss": -27.583703994750977, "global_step": 613767, "epoch": 7394} {"train_loss": -27.343311309814453, "global_step": 613768, "epoch": 7394} {"train_loss": -27.906721115112305, "global_step": 613769, "epoch": 7394} {"train_loss": -27.868244171142578, "global_step": 613770, "epoch": 7394} {"train_loss": -27.938323974609375, "global_step": 613771, "epoch": 7394} {"train_loss": -27.866186141967773, "global_step": 613772, "epoch": 7394} {"train_loss": -27.640518188476562, "global_step": 613773, "epoch": 7394} {"train_loss": -27.789810180664062, "global_step": 613774, "epoch": 7394} {"train_loss": -27.35881996154785, "global_step": 613775, "epoch": 7394} {"train_loss": -26.84962272644043, "global_step": 613776, "epoch": 7394} {"train_loss": -27.865598678588867, "global_step": 613777, "epoch": 7394} {"train_loss": -27.870807647705078, "global_step": 613778, "epoch": 7394} {"train_loss": -27.728946685791016, "global_step": 613779, "epoch": 7394} {"train_loss": -27.620832443237305, "global_step": 613780, "epoch": 7394} {"train_loss": -28.053730010986328, "global_step": 613781, "epoch": 7394} {"train_loss": -27.794189453125, "global_step": 613782, "epoch": 7394} {"train_loss": -27.989126205444336, "global_step": 613783, "epoch": 7394} {"train_loss": -27.905775828533862, "global_step": 613784, "epoch": 7394, "val_loss": 6658628.0} {"train_loss": -27.803647994995117, "global_step": 613785, "epoch": 7395} {"train_loss": -27.640668869018555, "global_step": 613786, "epoch": 7395} {"train_loss": -27.844268798828125, "global_step": 613787, "epoch": 7395} {"train_loss": -28.075733184814453, "global_step": 613788, "epoch": 7395} {"train_loss": -27.807172775268555, "global_step": 613789, "epoch": 7395} {"train_loss": -27.94925308227539, "global_step": 613790, "epoch": 7395} {"train_loss": -27.79544448852539, "global_step": 613791, "epoch": 7395} {"train_loss": -27.429723739624023, "global_step": 613792, "epoch": 7395} {"train_loss": -27.725025177001953, "global_step": 613793, "epoch": 7395} {"train_loss": -27.4683895111084, "global_step": 613794, "epoch": 7395} {"train_loss": -27.729095458984375, "global_step": 613795, "epoch": 7395} {"train_loss": -28.142393112182617, "global_step": 613796, "epoch": 7395} {"train_loss": -27.849720001220703, "global_step": 613797, "epoch": 7395} {"train_loss": -28.192052841186523, "global_step": 613798, "epoch": 7395} {"train_loss": -27.830373764038086, "global_step": 613799, "epoch": 7395} {"train_loss": -27.828372955322266, "global_step": 613800, "epoch": 7395} {"train_loss": -27.865278244018555, "global_step": 613801, "epoch": 7395} {"train_loss": -28.016733169555664, "global_step": 613802, "epoch": 7395} {"train_loss": -28.247663497924805, "global_step": 613803, "epoch": 7395} {"train_loss": -27.950000762939453, "global_step": 613804, "epoch": 7395} {"train_loss": -28.126998901367188, "global_step": 613805, "epoch": 7395} {"train_loss": -28.083755493164062, "global_step": 613806, "epoch": 7395} {"train_loss": -27.905029296875, "global_step": 613807, "epoch": 7395} {"train_loss": -28.287372589111328, "global_step": 613808, "epoch": 7395} {"train_loss": -28.2205867767334, "global_step": 613809, "epoch": 7395} {"train_loss": -27.89751625061035, "global_step": 613810, "epoch": 7395} {"train_loss": -28.463525772094727, "global_step": 613811, "epoch": 7395} {"train_loss": -28.39641761779785, "global_step": 613812, "epoch": 7395} {"train_loss": -28.068754196166992, "global_step": 613813, "epoch": 7395} {"train_loss": -28.1481990814209, "global_step": 613814, "epoch": 7395} {"train_loss": -28.211206436157227, "global_step": 613815, "epoch": 7395} {"train_loss": -27.868749618530273, "global_step": 613816, "epoch": 7395} {"train_loss": -27.983367919921875, "global_step": 613817, "epoch": 7395} {"train_loss": -28.316259384155273, "global_step": 613818, "epoch": 7395} {"train_loss": -28.21735191345215, "global_step": 613819, "epoch": 7395} {"train_loss": -28.40276527404785, "global_step": 613820, "epoch": 7395} {"train_loss": -28.213287353515625, "global_step": 613821, "epoch": 7395} {"train_loss": -28.03900146484375, "global_step": 613822, "epoch": 7395} {"train_loss": -28.084491729736328, "global_step": 613823, "epoch": 7395} {"train_loss": -28.354923248291016, "global_step": 613824, "epoch": 7395} {"train_loss": -28.051877975463867, "global_step": 613825, "epoch": 7395} {"train_loss": -28.155292510986328, "global_step": 613826, "epoch": 7395} {"train_loss": -28.388263702392578, "global_step": 613827, "epoch": 7395} {"train_loss": -28.530048370361328, "global_step": 613828, "epoch": 7395} {"train_loss": -28.230331420898438, "global_step": 613829, "epoch": 7395} {"train_loss": -27.93043327331543, "global_step": 613830, "epoch": 7395} {"train_loss": -28.081430435180664, "global_step": 613831, "epoch": 7395} {"train_loss": -28.217687606811523, "global_step": 613832, "epoch": 7395} {"train_loss": -27.94091796875, "global_step": 613833, "epoch": 7395} {"train_loss": -28.3596134185791, "global_step": 613834, "epoch": 7395} {"train_loss": -28.333993911743164, "global_step": 613835, "epoch": 7395} {"train_loss": -28.003061294555664, "global_step": 613836, "epoch": 7395} {"train_loss": -28.584936141967773, "global_step": 613837, "epoch": 7395} {"train_loss": -27.795124053955078, "global_step": 613838, "epoch": 7395} {"train_loss": -28.392072677612305, "global_step": 613839, "epoch": 7395} {"train_loss": -28.39628028869629, "global_step": 613840, "epoch": 7395} {"train_loss": -28.8448486328125, "global_step": 613841, "epoch": 7395} {"train_loss": -28.378698348999023, "global_step": 613842, "epoch": 7395} {"train_loss": -28.28163719177246, "global_step": 613843, "epoch": 7395} {"train_loss": -28.349822998046875, "global_step": 613844, "epoch": 7395} {"train_loss": -28.2735538482666, "global_step": 613845, "epoch": 7395} {"train_loss": -28.30767822265625, "global_step": 613846, "epoch": 7395} {"train_loss": -28.2082462310791, "global_step": 613847, "epoch": 7395} {"train_loss": -28.369434356689453, "global_step": 613848, "epoch": 7395} {"train_loss": -28.18130874633789, "global_step": 613849, "epoch": 7395} {"train_loss": -28.43012809753418, "global_step": 613850, "epoch": 7395} {"train_loss": -28.074996948242188, "global_step": 613851, "epoch": 7395} {"train_loss": -28.35041618347168, "global_step": 613852, "epoch": 7395} {"train_loss": -28.397369384765625, "global_step": 613853, "epoch": 7395} {"train_loss": -28.22150230407715, "global_step": 613854, "epoch": 7395} {"train_loss": -28.202367782592773, "global_step": 613855, "epoch": 7395} {"train_loss": -28.231611251831055, "global_step": 613856, "epoch": 7395} {"train_loss": -28.1998233795166, "global_step": 613857, "epoch": 7395} {"train_loss": -28.136011123657227, "global_step": 613858, "epoch": 7395} {"train_loss": -28.67145347595215, "global_step": 613859, "epoch": 7395} {"train_loss": -28.44561195373535, "global_step": 613860, "epoch": 7395} {"train_loss": -27.98685646057129, "global_step": 613861, "epoch": 7395} {"train_loss": -27.628625869750977, "global_step": 613862, "epoch": 7395} {"train_loss": -27.19233512878418, "global_step": 613863, "epoch": 7395} {"train_loss": -26.309972763061523, "global_step": 613864, "epoch": 7395} {"train_loss": -27.639118194580078, "global_step": 613865, "epoch": 7395} {"train_loss": -27.722463607788086, "global_step": 613866, "epoch": 7395} {"train_loss": -28.085983896829998, "global_step": 613867, "epoch": 7395, "val_loss": 6659626.0} {"train_loss": -25.963281631469727, "global_step": 613868, "epoch": 7396} {"train_loss": -26.328596115112305, "global_step": 613869, "epoch": 7396} {"train_loss": -26.83319664001465, "global_step": 613870, "epoch": 7396} {"train_loss": -26.826810836791992, "global_step": 613871, "epoch": 7396} {"train_loss": -26.52292251586914, "global_step": 613872, "epoch": 7396} {"train_loss": -27.0212345123291, "global_step": 613873, "epoch": 7396} {"train_loss": -26.944599151611328, "global_step": 613874, "epoch": 7396} {"train_loss": -26.775104522705078, "global_step": 613875, "epoch": 7396} {"train_loss": -27.063901901245117, "global_step": 613876, "epoch": 7396} {"train_loss": -27.076263427734375, "global_step": 613877, "epoch": 7396} {"train_loss": -27.153310775756836, "global_step": 613878, "epoch": 7396} {"train_loss": -27.47718620300293, "global_step": 613879, "epoch": 7396} {"train_loss": -27.53252601623535, "global_step": 613880, "epoch": 7396} {"train_loss": -27.40950584411621, "global_step": 613881, "epoch": 7396} {"train_loss": -27.36704444885254, "global_step": 613882, "epoch": 7396} {"train_loss": -27.574743270874023, "global_step": 613883, "epoch": 7396} {"train_loss": -27.443328857421875, "global_step": 613884, "epoch": 7396} {"train_loss": -27.46687126159668, "global_step": 613885, "epoch": 7396} {"train_loss": -28.01275634765625, "global_step": 613886, "epoch": 7396} {"train_loss": -27.290014266967773, "global_step": 613887, "epoch": 7396} {"train_loss": -27.601333618164062, "global_step": 613888, "epoch": 7396} {"train_loss": -27.54349708557129, "global_step": 613889, "epoch": 7396} {"train_loss": -27.860082626342773, "global_step": 613890, "epoch": 7396} {"train_loss": -27.711181640625, "global_step": 613891, "epoch": 7396} {"train_loss": -27.3939151763916, "global_step": 613892, "epoch": 7396} {"train_loss": -27.691831588745117, "global_step": 613893, "epoch": 7396} {"train_loss": -27.5395565032959, "global_step": 613894, "epoch": 7396} {"train_loss": -28.01312255859375, "global_step": 613895, "epoch": 7396} {"train_loss": -27.885984420776367, "global_step": 613896, "epoch": 7396} {"train_loss": -28.14151382446289, "global_step": 613897, "epoch": 7396} {"train_loss": -28.09125328063965, "global_step": 613898, "epoch": 7396} {"train_loss": -28.104461669921875, "global_step": 613899, "epoch": 7396} {"train_loss": -27.894758224487305, "global_step": 613900, "epoch": 7396} {"train_loss": -27.695127487182617, "global_step": 613901, "epoch": 7396} {"train_loss": -27.999805450439453, "global_step": 613902, "epoch": 7396} {"train_loss": -28.13779067993164, "global_step": 613903, "epoch": 7396} {"train_loss": -28.09601402282715, "global_step": 613904, "epoch": 7396} {"train_loss": -28.65887451171875, "global_step": 613905, "epoch": 7396} {"train_loss": -27.959619522094727, "global_step": 613906, "epoch": 7396} {"train_loss": -27.9573917388916, "global_step": 613907, "epoch": 7396} {"train_loss": -28.2791748046875, "global_step": 613908, "epoch": 7396} {"train_loss": -28.151844024658203, "global_step": 613909, "epoch": 7396} {"train_loss": -28.030790328979492, "global_step": 613910, "epoch": 7396} {"train_loss": -27.771209716796875, "global_step": 613911, "epoch": 7396} {"train_loss": -28.34681510925293, "global_step": 613912, "epoch": 7396} {"train_loss": -27.941232681274414, "global_step": 613913, "epoch": 7396} {"train_loss": -28.40717887878418, "global_step": 613914, "epoch": 7396} {"train_loss": -28.269454956054688, "global_step": 613915, "epoch": 7396} {"train_loss": -28.10914421081543, "global_step": 613916, "epoch": 7396} {"train_loss": -28.148767471313477, "global_step": 613917, "epoch": 7396} {"train_loss": -27.918298721313477, "global_step": 613918, "epoch": 7396} {"train_loss": -28.035314559936523, "global_step": 613919, "epoch": 7396} {"train_loss": -27.79021644592285, "global_step": 613920, "epoch": 7396} {"train_loss": -27.650007247924805, "global_step": 613921, "epoch": 7396} {"train_loss": -28.094892501831055, "global_step": 613922, "epoch": 7396} {"train_loss": -28.276697158813477, "global_step": 613923, "epoch": 7396} {"train_loss": -28.066556930541992, "global_step": 613924, "epoch": 7396} {"train_loss": -27.90510368347168, "global_step": 613925, "epoch": 7396} {"train_loss": -28.0451717376709, "global_step": 613926, "epoch": 7396} {"train_loss": -28.396509170532227, "global_step": 613927, "epoch": 7396} {"train_loss": -27.71173667907715, "global_step": 613928, "epoch": 7396} {"train_loss": -27.899038314819336, "global_step": 613929, "epoch": 7396} {"train_loss": -27.41094970703125, "global_step": 613930, "epoch": 7396} {"train_loss": -27.532745361328125, "global_step": 613931, "epoch": 7396} {"train_loss": -27.283588409423828, "global_step": 613932, "epoch": 7396} {"train_loss": -27.379796981811523, "global_step": 613933, "epoch": 7396} {"train_loss": -27.559263229370117, "global_step": 613934, "epoch": 7396} {"train_loss": -28.360910415649414, "global_step": 613935, "epoch": 7396} {"train_loss": -27.6019344329834, "global_step": 613936, "epoch": 7396} {"train_loss": -28.260141372680664, "global_step": 613937, "epoch": 7396} {"train_loss": -28.1251163482666, "global_step": 613938, "epoch": 7396} {"train_loss": -28.2762508392334, "global_step": 613939, "epoch": 7396} {"train_loss": -28.51006507873535, "global_step": 613940, "epoch": 7396} {"train_loss": -28.264631271362305, "global_step": 613941, "epoch": 7396} {"train_loss": -28.03769302368164, "global_step": 613942, "epoch": 7396} {"train_loss": -27.76942253112793, "global_step": 613943, "epoch": 7396} {"train_loss": -28.282306671142578, "global_step": 613944, "epoch": 7396} {"train_loss": -27.97173500061035, "global_step": 613945, "epoch": 7396} {"train_loss": -28.199798583984375, "global_step": 613946, "epoch": 7396} {"train_loss": -28.161230087280273, "global_step": 613947, "epoch": 7396} {"train_loss": -28.16230583190918, "global_step": 613948, "epoch": 7396} {"train_loss": -28.246957778930664, "global_step": 613949, "epoch": 7396} {"train_loss": -27.762185912534417, "global_step": 613950, "epoch": 7396, "val_loss": 6690034.0} {"train_loss": -27.61761474609375, "global_step": 613951, "epoch": 7397} {"train_loss": -27.801023483276367, "global_step": 613952, "epoch": 7397} {"train_loss": -27.411401748657227, "global_step": 613953, "epoch": 7397} {"train_loss": -27.9553165435791, "global_step": 613954, "epoch": 7397} {"train_loss": -28.081640243530273, "global_step": 613955, "epoch": 7397} {"train_loss": -28.025482177734375, "global_step": 613956, "epoch": 7397} {"train_loss": -27.89533805847168, "global_step": 613957, "epoch": 7397} {"train_loss": -27.970556259155273, "global_step": 613958, "epoch": 7397} {"train_loss": -28.080732345581055, "global_step": 613959, "epoch": 7397} {"train_loss": -27.54522705078125, "global_step": 613960, "epoch": 7397} {"train_loss": -28.261062622070312, "global_step": 613961, "epoch": 7397} {"train_loss": -27.856985092163086, "global_step": 613962, "epoch": 7397} {"train_loss": -28.131214141845703, "global_step": 613963, "epoch": 7397} {"train_loss": -27.670698165893555, "global_step": 613964, "epoch": 7397} {"train_loss": -28.266265869140625, "global_step": 613965, "epoch": 7397} {"train_loss": -28.063709259033203, "global_step": 613966, "epoch": 7397} {"train_loss": -28.065542221069336, "global_step": 613967, "epoch": 7397} {"train_loss": -28.286218643188477, "global_step": 613968, "epoch": 7397} {"train_loss": -28.573139190673828, "global_step": 613969, "epoch": 7397} {"train_loss": -28.256147384643555, "global_step": 613970, "epoch": 7397} {"train_loss": -28.469343185424805, "global_step": 613971, "epoch": 7397} {"train_loss": -28.4773006439209, "global_step": 613972, "epoch": 7397} {"train_loss": -28.431385040283203, "global_step": 613973, "epoch": 7397} {"train_loss": -28.662378311157227, "global_step": 613974, "epoch": 7397} {"train_loss": -28.604419708251953, "global_step": 613975, "epoch": 7397} {"train_loss": -28.283222198486328, "global_step": 613976, "epoch": 7397} {"train_loss": -28.158771514892578, "global_step": 613977, "epoch": 7397} {"train_loss": -28.30181312561035, "global_step": 613978, "epoch": 7397} {"train_loss": -28.279821395874023, "global_step": 613979, "epoch": 7397} {"train_loss": -28.3583927154541, "global_step": 613980, "epoch": 7397} {"train_loss": -28.126768112182617, "global_step": 613981, "epoch": 7397} {"train_loss": -28.1122989654541, "global_step": 613982, "epoch": 7397} {"train_loss": -28.62799072265625, "global_step": 613983, "epoch": 7397} {"train_loss": -28.2885684967041, "global_step": 613984, "epoch": 7397} {"train_loss": -28.081531524658203, "global_step": 613985, "epoch": 7397} {"train_loss": -27.902257919311523, "global_step": 613986, "epoch": 7397} {"train_loss": -27.999181747436523, "global_step": 613987, "epoch": 7397} {"train_loss": -28.36319351196289, "global_step": 613988, "epoch": 7397} {"train_loss": -28.292102813720703, "global_step": 613989, "epoch": 7397} {"train_loss": -27.66921043395996, "global_step": 613990, "epoch": 7397} {"train_loss": -27.300674438476562, "global_step": 613991, "epoch": 7397} {"train_loss": -26.416852951049805, "global_step": 613992, "epoch": 7397} {"train_loss": -26.192489624023438, "global_step": 613993, "epoch": 7397} {"train_loss": -27.764545440673828, "global_step": 613994, "epoch": 7397} {"train_loss": -27.615293502807617, "global_step": 613995, "epoch": 7397} {"train_loss": -26.972492218017578, "global_step": 613996, "epoch": 7397} {"train_loss": -27.699853897094727, "global_step": 613997, "epoch": 7397} {"train_loss": -27.524633407592773, "global_step": 613998, "epoch": 7397} {"train_loss": -27.959577560424805, "global_step": 613999, "epoch": 7397} {"train_loss": -27.64484977722168, "global_step": 614000, "epoch": 7397} {"train_loss": -28.0998477935791, "global_step": 614001, "epoch": 7397} {"train_loss": -27.793832778930664, "global_step": 614002, "epoch": 7397} {"train_loss": -27.557348251342773, "global_step": 614003, "epoch": 7397} {"train_loss": -27.964405059814453, "global_step": 614004, "epoch": 7397} {"train_loss": -28.06789207458496, "global_step": 614005, "epoch": 7397} {"train_loss": -27.991209030151367, "global_step": 614006, "epoch": 7397} {"train_loss": -27.726470947265625, "global_step": 614007, "epoch": 7397} {"train_loss": -28.204132080078125, "global_step": 614008, "epoch": 7397} {"train_loss": -27.759424209594727, "global_step": 614009, "epoch": 7397} {"train_loss": -27.91254234313965, "global_step": 614010, "epoch": 7397} {"train_loss": -27.809850692749023, "global_step": 614011, "epoch": 7397} {"train_loss": -27.9558048248291, "global_step": 614012, "epoch": 7397} {"train_loss": -28.0148983001709, "global_step": 614013, "epoch": 7397} {"train_loss": -27.962942123413086, "global_step": 614014, "epoch": 7397} {"train_loss": -27.9498291015625, "global_step": 614015, "epoch": 7397} {"train_loss": -27.949039459228516, "global_step": 614016, "epoch": 7397} {"train_loss": -27.8424072265625, "global_step": 614017, "epoch": 7397} {"train_loss": -28.108808517456055, "global_step": 614018, "epoch": 7397} {"train_loss": -27.49847412109375, "global_step": 614019, "epoch": 7397} {"train_loss": -28.026233673095703, "global_step": 614020, "epoch": 7397} {"train_loss": -28.159772872924805, "global_step": 614021, "epoch": 7397} {"train_loss": -27.53753089904785, "global_step": 614022, "epoch": 7397} {"train_loss": -27.900909423828125, "global_step": 614023, "epoch": 7397} {"train_loss": -27.807525634765625, "global_step": 614024, "epoch": 7397} {"train_loss": -27.732358932495117, "global_step": 614025, "epoch": 7397} {"train_loss": -27.326757431030273, "global_step": 614026, "epoch": 7397} {"train_loss": -27.748586654663086, "global_step": 614027, "epoch": 7397} {"train_loss": -27.119796752929688, "global_step": 614028, "epoch": 7397} {"train_loss": -27.661691665649414, "global_step": 614029, "epoch": 7397} {"train_loss": -28.037860870361328, "global_step": 614030, "epoch": 7397} {"train_loss": -27.607074737548828, "global_step": 614031, "epoch": 7397} {"train_loss": -28.135650634765625, "global_step": 614032, "epoch": 7397} {"train_loss": -27.912907726793403, "global_step": 614033, "epoch": 7397, "val_loss": 6705275.0} {"train_loss": -27.26747703552246, "global_step": 614034, "epoch": 7398} {"train_loss": -27.05506706237793, "global_step": 614035, "epoch": 7398} {"train_loss": -27.538232803344727, "global_step": 614036, "epoch": 7398} {"train_loss": -27.241979598999023, "global_step": 614037, "epoch": 7398} {"train_loss": -27.2703800201416, "global_step": 614038, "epoch": 7398} {"train_loss": -27.4620304107666, "global_step": 614039, "epoch": 7398} {"train_loss": -27.521387100219727, "global_step": 614040, "epoch": 7398} {"train_loss": -27.650434494018555, "global_step": 614041, "epoch": 7398} {"train_loss": -27.553266525268555, "global_step": 614042, "epoch": 7398} {"train_loss": -27.324804306030273, "global_step": 614043, "epoch": 7398} {"train_loss": -27.8226261138916, "global_step": 614044, "epoch": 7398} {"train_loss": -27.8323974609375, "global_step": 614045, "epoch": 7398} {"train_loss": -27.766759872436523, "global_step": 614046, "epoch": 7398} {"train_loss": -27.941425323486328, "global_step": 614047, "epoch": 7398} {"train_loss": -27.676984786987305, "global_step": 614048, "epoch": 7398} {"train_loss": -27.750823974609375, "global_step": 614049, "epoch": 7398} {"train_loss": -27.826770782470703, "global_step": 614050, "epoch": 7398} {"train_loss": -27.7382755279541, "global_step": 614051, "epoch": 7398} {"train_loss": -27.736469268798828, "global_step": 614052, "epoch": 7398} {"train_loss": -27.75217056274414, "global_step": 614053, "epoch": 7398} {"train_loss": -27.7055721282959, "global_step": 614054, "epoch": 7398} {"train_loss": -27.623205184936523, "global_step": 614055, "epoch": 7398} {"train_loss": -28.274621963500977, "global_step": 614056, "epoch": 7398} {"train_loss": -28.18896484375, "global_step": 614057, "epoch": 7398} {"train_loss": -28.246320724487305, "global_step": 614058, "epoch": 7398} {"train_loss": -27.901208877563477, "global_step": 614059, "epoch": 7398} {"train_loss": -27.923664093017578, "global_step": 614060, "epoch": 7398} {"train_loss": -28.017093658447266, "global_step": 614061, "epoch": 7398} {"train_loss": -27.989591598510742, "global_step": 614062, "epoch": 7398} {"train_loss": -28.024932861328125, "global_step": 614063, "epoch": 7398} {"train_loss": -28.238861083984375, "global_step": 614064, "epoch": 7398} {"train_loss": -28.337812423706055, "global_step": 614065, "epoch": 7398} {"train_loss": -28.423969268798828, "global_step": 614066, "epoch": 7398} {"train_loss": -28.102203369140625, "global_step": 614067, "epoch": 7398} {"train_loss": -27.942035675048828, "global_step": 614068, "epoch": 7398} {"train_loss": -28.661779403686523, "global_step": 614069, "epoch": 7398} {"train_loss": -28.2167911529541, "global_step": 614070, "epoch": 7398} {"train_loss": -27.62529945373535, "global_step": 614071, "epoch": 7398} {"train_loss": -27.832014083862305, "global_step": 614072, "epoch": 7398} {"train_loss": -28.40638542175293, "global_step": 614073, "epoch": 7398} {"train_loss": -28.63116455078125, "global_step": 614074, "epoch": 7398} {"train_loss": -27.782215118408203, "global_step": 614075, "epoch": 7398} {"train_loss": -28.43826675415039, "global_step": 614076, "epoch": 7398} {"train_loss": -27.9888916015625, "global_step": 614077, "epoch": 7398} {"train_loss": -28.650182723999023, "global_step": 614078, "epoch": 7398} {"train_loss": -28.148107528686523, "global_step": 614079, "epoch": 7398} {"train_loss": -28.633691787719727, "global_step": 614080, "epoch": 7398} {"train_loss": -28.400190353393555, "global_step": 614081, "epoch": 7398} {"train_loss": -27.77790641784668, "global_step": 614082, "epoch": 7398} {"train_loss": -28.093420028686523, "global_step": 614083, "epoch": 7398} {"train_loss": -28.497777938842773, "global_step": 614084, "epoch": 7398} {"train_loss": -28.269983291625977, "global_step": 614085, "epoch": 7398} {"train_loss": -28.3240909576416, "global_step": 614086, "epoch": 7398} {"train_loss": -28.27717399597168, "global_step": 614087, "epoch": 7398} {"train_loss": -28.07110023498535, "global_step": 614088, "epoch": 7398} {"train_loss": -27.982946395874023, "global_step": 614089, "epoch": 7398} {"train_loss": -28.35056495666504, "global_step": 614090, "epoch": 7398} {"train_loss": -28.527753829956055, "global_step": 614091, "epoch": 7398} {"train_loss": -28.4550724029541, "global_step": 614092, "epoch": 7398} {"train_loss": -28.257307052612305, "global_step": 614093, "epoch": 7398} {"train_loss": -28.187824249267578, "global_step": 614094, "epoch": 7398} {"train_loss": -28.295623779296875, "global_step": 614095, "epoch": 7398} {"train_loss": -28.334964752197266, "global_step": 614096, "epoch": 7398} {"train_loss": -28.117136001586914, "global_step": 614097, "epoch": 7398} {"train_loss": -28.5843448638916, "global_step": 614098, "epoch": 7398} {"train_loss": -28.209217071533203, "global_step": 614099, "epoch": 7398} {"train_loss": -28.53167152404785, "global_step": 614100, "epoch": 7398} {"train_loss": -28.40736961364746, "global_step": 614101, "epoch": 7398} {"train_loss": -28.319101333618164, "global_step": 614102, "epoch": 7398} {"train_loss": -28.191089630126953, "global_step": 614103, "epoch": 7398} {"train_loss": -28.597461700439453, "global_step": 614104, "epoch": 7398} {"train_loss": -28.819290161132812, "global_step": 614105, "epoch": 7398} {"train_loss": -28.231067657470703, "global_step": 614106, "epoch": 7398} {"train_loss": -28.28643226623535, "global_step": 614107, "epoch": 7398} {"train_loss": -28.166091918945312, "global_step": 614108, "epoch": 7398} {"train_loss": -28.40985679626465, "global_step": 614109, "epoch": 7398} {"train_loss": -27.8803653717041, "global_step": 614110, "epoch": 7398} {"train_loss": -28.3653564453125, "global_step": 614111, "epoch": 7398} {"train_loss": -28.2616024017334, "global_step": 614112, "epoch": 7398} {"train_loss": -28.244098663330078, "global_step": 614113, "epoch": 7398} {"train_loss": -28.372879028320312, "global_step": 614114, "epoch": 7398} {"train_loss": -28.006513595581055, "global_step": 614115, "epoch": 7398} {"train_loss": -28.068126793367316, "global_step": 614116, "epoch": 7398, "val_loss": 6686685.0} {"train_loss": -27.806278228759766, "global_step": 614117, "epoch": 7399} {"train_loss": -27.95411491394043, "global_step": 614118, "epoch": 7399} {"train_loss": -27.85145378112793, "global_step": 614119, "epoch": 7399} {"train_loss": -27.4097843170166, "global_step": 614120, "epoch": 7399} {"train_loss": -27.27801513671875, "global_step": 614121, "epoch": 7399} {"train_loss": -27.91388511657715, "global_step": 614122, "epoch": 7399} {"train_loss": -27.424345016479492, "global_step": 614123, "epoch": 7399} {"train_loss": -27.477529525756836, "global_step": 614124, "epoch": 7399} {"train_loss": -27.360443115234375, "global_step": 614125, "epoch": 7399} {"train_loss": -27.644392013549805, "global_step": 614126, "epoch": 7399} {"train_loss": -27.470617294311523, "global_step": 614127, "epoch": 7399} {"train_loss": -28.39495849609375, "global_step": 614128, "epoch": 7399} {"train_loss": -27.427289962768555, "global_step": 614129, "epoch": 7399} {"train_loss": -28.013614654541016, "global_step": 614130, "epoch": 7399} {"train_loss": -27.4428653717041, "global_step": 614131, "epoch": 7399} {"train_loss": -27.6466121673584, "global_step": 614132, "epoch": 7399} {"train_loss": -27.54119300842285, "global_step": 614133, "epoch": 7399} {"train_loss": -27.831756591796875, "global_step": 614134, "epoch": 7399} {"train_loss": -27.732177734375, "global_step": 614135, "epoch": 7399} {"train_loss": -28.00592041015625, "global_step": 614136, "epoch": 7399} {"train_loss": -27.964435577392578, "global_step": 614137, "epoch": 7399} {"train_loss": -27.453994750976562, "global_step": 614138, "epoch": 7399} {"train_loss": -27.49641227722168, "global_step": 614139, "epoch": 7399} {"train_loss": -27.862512588500977, "global_step": 614140, "epoch": 7399} {"train_loss": -27.710081100463867, "global_step": 614141, "epoch": 7399} {"train_loss": -28.260038375854492, "global_step": 614142, "epoch": 7399} {"train_loss": -27.90935707092285, "global_step": 614143, "epoch": 7399} {"train_loss": -28.1593074798584, "global_step": 614144, "epoch": 7399} {"train_loss": -27.7657413482666, "global_step": 614145, "epoch": 7399} {"train_loss": -28.101978302001953, "global_step": 614146, "epoch": 7399} {"train_loss": -28.09393310546875, "global_step": 614147, "epoch": 7399} {"train_loss": -27.378931045532227, "global_step": 614148, "epoch": 7399} {"train_loss": -27.801069259643555, "global_step": 614149, "epoch": 7399} {"train_loss": -27.773107528686523, "global_step": 614150, "epoch": 7399} {"train_loss": -28.158599853515625, "global_step": 614151, "epoch": 7399} {"train_loss": -27.672748565673828, "global_step": 614152, "epoch": 7399} {"train_loss": -28.089567184448242, "global_step": 614153, "epoch": 7399} {"train_loss": -27.857074737548828, "global_step": 614154, "epoch": 7399} {"train_loss": -28.366500854492188, "global_step": 614155, "epoch": 7399} {"train_loss": -28.00953483581543, "global_step": 614156, "epoch": 7399} {"train_loss": -27.834630966186523, "global_step": 614157, "epoch": 7399} {"train_loss": -27.761672973632812, "global_step": 614158, "epoch": 7399} {"train_loss": -27.971149444580078, "global_step": 614159, "epoch": 7399} {"train_loss": -28.223718643188477, "global_step": 614160, "epoch": 7399} {"train_loss": -27.873437881469727, "global_step": 614161, "epoch": 7399} {"train_loss": -28.294836044311523, "global_step": 614162, "epoch": 7399} {"train_loss": -28.18343162536621, "global_step": 614163, "epoch": 7399} {"train_loss": -27.933561325073242, "global_step": 614164, "epoch": 7399} {"train_loss": -28.419769287109375, "global_step": 614165, "epoch": 7399} {"train_loss": -27.983905792236328, "global_step": 614166, "epoch": 7399} {"train_loss": -28.332111358642578, "global_step": 614167, "epoch": 7399} {"train_loss": -28.116352081298828, "global_step": 614168, "epoch": 7399} {"train_loss": -28.344419479370117, "global_step": 614169, "epoch": 7399} {"train_loss": -28.070276260375977, "global_step": 614170, "epoch": 7399} {"train_loss": -28.573001861572266, "global_step": 614171, "epoch": 7399} {"train_loss": -28.27901268005371, "global_step": 614172, "epoch": 7399} {"train_loss": -28.7510929107666, "global_step": 614173, "epoch": 7399} {"train_loss": -28.424957275390625, "global_step": 614174, "epoch": 7399} {"train_loss": -28.150253295898438, "global_step": 614175, "epoch": 7399} {"train_loss": -28.19659423828125, "global_step": 614176, "epoch": 7399} {"train_loss": -28.218107223510742, "global_step": 614177, "epoch": 7399} {"train_loss": -28.39522361755371, "global_step": 614178, "epoch": 7399} {"train_loss": -28.40744972229004, "global_step": 614179, "epoch": 7399} {"train_loss": -28.85028648376465, "global_step": 614180, "epoch": 7399} {"train_loss": -28.385025024414062, "global_step": 614181, "epoch": 7399} {"train_loss": -28.440353393554688, "global_step": 614182, "epoch": 7399} {"train_loss": -28.178760528564453, "global_step": 614183, "epoch": 7399} {"train_loss": -28.369709014892578, "global_step": 614184, "epoch": 7399} {"train_loss": -28.555967330932617, "global_step": 614185, "epoch": 7399} {"train_loss": -28.321624755859375, "global_step": 614186, "epoch": 7399} {"train_loss": -28.34535026550293, "global_step": 614187, "epoch": 7399} {"train_loss": -28.487781524658203, "global_step": 614188, "epoch": 7399} {"train_loss": -28.54229736328125, "global_step": 614189, "epoch": 7399} {"train_loss": -28.331823348999023, "global_step": 614190, "epoch": 7399} {"train_loss": -28.139001846313477, "global_step": 614191, "epoch": 7399} {"train_loss": -28.542219161987305, "global_step": 614192, "epoch": 7399} {"train_loss": -28.450607299804688, "global_step": 614193, "epoch": 7399} {"train_loss": -28.21774673461914, "global_step": 614194, "epoch": 7399} {"train_loss": -28.225061416625977, "global_step": 614195, "epoch": 7399} {"train_loss": -27.98847007751465, "global_step": 614196, "epoch": 7399} {"train_loss": -28.254526138305664, "global_step": 614197, "epoch": 7399} {"train_loss": -27.89595603942871, "global_step": 614198, "epoch": 7399} {"train_loss": -28.03128617068371, "global_step": 614199, "epoch": 7399, "val_loss": 6664337.5} {"train_loss": -25.693262100219727, "global_step": 614200, "epoch": 7400} {"train_loss": -24.903676986694336, "global_step": 614201, "epoch": 7400} {"train_loss": -26.22150230407715, "global_step": 614202, "epoch": 7400} {"train_loss": -26.201831817626953, "global_step": 614203, "epoch": 7400} {"train_loss": -26.186933517456055, "global_step": 614204, "epoch": 7400} {"train_loss": -25.059823989868164, "global_step": 614205, "epoch": 7400} {"train_loss": -25.75812339782715, "global_step": 614206, "epoch": 7400} {"train_loss": -25.890777587890625, "global_step": 614207, "epoch": 7400} {"train_loss": -26.582351684570312, "global_step": 614208, "epoch": 7400} {"train_loss": -26.36649513244629, "global_step": 614209, "epoch": 7400} {"train_loss": -26.674072265625, "global_step": 614210, "epoch": 7400} {"train_loss": -26.401105880737305, "global_step": 614211, "epoch": 7400} {"train_loss": -27.13605308532715, "global_step": 614212, "epoch": 7400} {"train_loss": -26.283859252929688, "global_step": 614213, "epoch": 7400} {"train_loss": -27.242963790893555, "global_step": 614214, "epoch": 7400} {"train_loss": -26.953250885009766, "global_step": 614215, "epoch": 7400} {"train_loss": -26.164127349853516, "global_step": 614216, "epoch": 7400} {"train_loss": -27.247949600219727, "global_step": 614217, "epoch": 7400} {"train_loss": -26.79627799987793, "global_step": 614218, "epoch": 7400} {"train_loss": -27.025714874267578, "global_step": 614219, "epoch": 7400} {"train_loss": -27.534870147705078, "global_step": 614220, "epoch": 7400} {"train_loss": -27.154693603515625, "global_step": 614221, "epoch": 7400} {"train_loss": -27.13543128967285, "global_step": 614222, "epoch": 7400} {"train_loss": -27.414356231689453, "global_step": 614223, "epoch": 7400} {"train_loss": -27.31402587890625, "global_step": 614224, "epoch": 7400} {"train_loss": -27.1634521484375, "global_step": 614225, "epoch": 7400} {"train_loss": -27.398191452026367, "global_step": 614226, "epoch": 7400} {"train_loss": -27.59990882873535, "global_step": 614227, "epoch": 7400} {"train_loss": -27.16071128845215, "global_step": 614228, "epoch": 7400} {"train_loss": -27.62361717224121, "global_step": 614229, "epoch": 7400} {"train_loss": -27.5086612701416, "global_step": 614230, "epoch": 7400} {"train_loss": -27.5020751953125, "global_step": 614231, "epoch": 7400} {"train_loss": -28.09134292602539, "global_step": 614232, "epoch": 7400} {"train_loss": -27.95196533203125, "global_step": 614233, "epoch": 7400} {"train_loss": -27.538318634033203, "global_step": 614234, "epoch": 7400} {"train_loss": -27.989212036132812, "global_step": 614235, "epoch": 7400} {"train_loss": -27.719457626342773, "global_step": 614236, "epoch": 7400} {"train_loss": -27.622589111328125, "global_step": 614237, "epoch": 7400} {"train_loss": -27.792083740234375, "global_step": 614238, "epoch": 7400} {"train_loss": -27.72124671936035, "global_step": 614239, "epoch": 7400} {"train_loss": -27.82802391052246, "global_step": 614240, "epoch": 7400} {"train_loss": -27.560230255126953, "global_step": 614241, "epoch": 7400} {"train_loss": -27.733428955078125, "global_step": 614242, "epoch": 7400} {"train_loss": -27.820417404174805, "global_step": 614243, "epoch": 7400} {"train_loss": -27.881439208984375, "global_step": 614244, "epoch": 7400} {"train_loss": -27.8945255279541, "global_step": 614245, "epoch": 7400} {"train_loss": -27.67645263671875, "global_step": 614246, "epoch": 7400} {"train_loss": -27.838455200195312, "global_step": 614247, "epoch": 7400} {"train_loss": -27.77521324157715, "global_step": 614248, "epoch": 7400} {"train_loss": -28.164154052734375, "global_step": 614249, "epoch": 7400} {"train_loss": -28.101755142211914, "global_step": 614250, "epoch": 7400} {"train_loss": -27.83514976501465, "global_step": 614251, "epoch": 7400} {"train_loss": -27.9843807220459, "global_step": 614252, "epoch": 7400} {"train_loss": -27.907079696655273, "global_step": 614253, "epoch": 7400} {"train_loss": -27.648666381835938, "global_step": 614254, "epoch": 7400} {"train_loss": -28.121963500976562, "global_step": 614255, "epoch": 7400} {"train_loss": -27.73186683654785, "global_step": 614256, "epoch": 7400} {"train_loss": -27.742517471313477, "global_step": 614257, "epoch": 7400} {"train_loss": -28.2534236907959, "global_step": 614258, "epoch": 7400} {"train_loss": -28.093366622924805, "global_step": 614259, "epoch": 7400} {"train_loss": -27.887420654296875, "global_step": 614260, "epoch": 7400} {"train_loss": -27.839750289916992, "global_step": 614261, "epoch": 7400} {"train_loss": -28.110584259033203, "global_step": 614262, "epoch": 7400} {"train_loss": -28.2240047454834, "global_step": 614263, "epoch": 7400} {"train_loss": -28.402551651000977, "global_step": 614264, "epoch": 7400} {"train_loss": -28.240446090698242, "global_step": 614265, "epoch": 7400} {"train_loss": -28.019445419311523, "global_step": 614266, "epoch": 7400} {"train_loss": -28.16859245300293, "global_step": 614267, "epoch": 7400} {"train_loss": -27.988037109375, "global_step": 614268, "epoch": 7400} {"train_loss": -27.891626358032227, "global_step": 614269, "epoch": 7400} {"train_loss": -28.00028419494629, "global_step": 614270, "epoch": 7400} {"train_loss": -27.885971069335938, "global_step": 614271, "epoch": 7400} {"train_loss": -27.664352416992188, "global_step": 614272, "epoch": 7400} {"train_loss": -28.135461807250977, "global_step": 614273, "epoch": 7400} {"train_loss": -28.161060333251953, "global_step": 614274, "epoch": 7400} {"train_loss": -28.1478271484375, "global_step": 614275, "epoch": 7400} {"train_loss": -28.179548263549805, "global_step": 614276, "epoch": 7400} {"train_loss": -28.104267120361328, "global_step": 614277, "epoch": 7400} {"train_loss": -28.059240341186523, "global_step": 614278, "epoch": 7400} {"train_loss": -28.18654441833496, "global_step": 614279, "epoch": 7400} {"train_loss": -28.47332763671875, "global_step": 614280, "epoch": 7400} {"train_loss": -28.25738525390625, "global_step": 614281, "epoch": 7400} {"train_loss": -27.494081451232177, "global_step": 614282, "epoch": 7400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6667390.0} {"train_loss": -28.02717399597168, "global_step": 614283, "epoch": 7401} {"train_loss": -27.675073623657227, "global_step": 614284, "epoch": 7401} {"train_loss": -27.633771896362305, "global_step": 614285, "epoch": 7401} {"train_loss": -27.923791885375977, "global_step": 614286, "epoch": 7401} {"train_loss": -26.814062118530273, "global_step": 614287, "epoch": 7401} {"train_loss": -27.669696807861328, "global_step": 614288, "epoch": 7401} {"train_loss": -27.498685836791992, "global_step": 614289, "epoch": 7401} {"train_loss": -27.15341567993164, "global_step": 614290, "epoch": 7401} {"train_loss": -27.30708885192871, "global_step": 614291, "epoch": 7401} {"train_loss": -27.168798446655273, "global_step": 614292, "epoch": 7401} {"train_loss": -27.503910064697266, "global_step": 614293, "epoch": 7401} {"train_loss": -27.794055938720703, "global_step": 614294, "epoch": 7401} {"train_loss": -27.710407257080078, "global_step": 614295, "epoch": 7401} {"train_loss": -28.032148361206055, "global_step": 614296, "epoch": 7401} {"train_loss": -27.5346736907959, "global_step": 614297, "epoch": 7401} {"train_loss": -27.735015869140625, "global_step": 614298, "epoch": 7401} {"train_loss": -27.89499282836914, "global_step": 614299, "epoch": 7401} {"train_loss": -27.76175308227539, "global_step": 614300, "epoch": 7401} {"train_loss": -27.842761993408203, "global_step": 614301, "epoch": 7401} {"train_loss": -27.72724723815918, "global_step": 614302, "epoch": 7401} {"train_loss": -27.826955795288086, "global_step": 614303, "epoch": 7401} {"train_loss": -28.05914306640625, "global_step": 614304, "epoch": 7401} {"train_loss": -27.433307647705078, "global_step": 614305, "epoch": 7401} {"train_loss": -28.050573348999023, "global_step": 614306, "epoch": 7401} {"train_loss": -28.04738426208496, "global_step": 614307, "epoch": 7401} {"train_loss": -28.170923233032227, "global_step": 614308, "epoch": 7401} {"train_loss": -27.823333740234375, "global_step": 614309, "epoch": 7401} {"train_loss": -28.030858993530273, "global_step": 614310, "epoch": 7401} {"train_loss": -28.30977439880371, "global_step": 614311, "epoch": 7401} {"train_loss": -28.15325927734375, "global_step": 614312, "epoch": 7401} {"train_loss": -27.81342887878418, "global_step": 614313, "epoch": 7401} {"train_loss": -28.304174423217773, "global_step": 614314, "epoch": 7401} {"train_loss": -28.139890670776367, "global_step": 614315, "epoch": 7401} {"train_loss": -27.810348510742188, "global_step": 614316, "epoch": 7401} {"train_loss": -27.837594985961914, "global_step": 614317, "epoch": 7401} {"train_loss": -27.842315673828125, "global_step": 614318, "epoch": 7401} {"train_loss": -28.218542098999023, "global_step": 614319, "epoch": 7401} {"train_loss": -28.10459327697754, "global_step": 614320, "epoch": 7401} {"train_loss": -28.563764572143555, "global_step": 614321, "epoch": 7401} {"train_loss": -27.8106632232666, "global_step": 614322, "epoch": 7401} {"train_loss": -28.420801162719727, "global_step": 614323, "epoch": 7401} {"train_loss": -27.773330688476562, "global_step": 614324, "epoch": 7401} {"train_loss": -28.144208908081055, "global_step": 614325, "epoch": 7401} {"train_loss": -28.268558502197266, "global_step": 614326, "epoch": 7401} {"train_loss": -28.23647117614746, "global_step": 614327, "epoch": 7401} {"train_loss": -28.037382125854492, "global_step": 614328, "epoch": 7401} {"train_loss": -28.252994537353516, "global_step": 614329, "epoch": 7401} {"train_loss": -28.12444496154785, "global_step": 614330, "epoch": 7401} {"train_loss": -27.724538803100586, "global_step": 614331, "epoch": 7401} {"train_loss": -28.316150665283203, "global_step": 614332, "epoch": 7401} {"train_loss": -27.919830322265625, "global_step": 614333, "epoch": 7401} {"train_loss": -28.4585018157959, "global_step": 614334, "epoch": 7401} {"train_loss": -28.286474227905273, "global_step": 614335, "epoch": 7401} {"train_loss": -28.656391143798828, "global_step": 614336, "epoch": 7401} {"train_loss": -28.015783309936523, "global_step": 614337, "epoch": 7401} {"train_loss": -28.02296257019043, "global_step": 614338, "epoch": 7401} {"train_loss": -28.295034408569336, "global_step": 614339, "epoch": 7401} {"train_loss": -28.2614688873291, "global_step": 614340, "epoch": 7401} {"train_loss": -28.291996002197266, "global_step": 614341, "epoch": 7401} {"train_loss": -27.796894073486328, "global_step": 614342, "epoch": 7401} {"train_loss": -28.44959831237793, "global_step": 614343, "epoch": 7401} {"train_loss": -28.333606719970703, "global_step": 614344, "epoch": 7401} {"train_loss": -27.989282608032227, "global_step": 614345, "epoch": 7401} {"train_loss": -28.35518455505371, "global_step": 614346, "epoch": 7401} {"train_loss": -28.149738311767578, "global_step": 614347, "epoch": 7401} {"train_loss": -28.244888305664062, "global_step": 614348, "epoch": 7401} {"train_loss": -28.0869083404541, "global_step": 614349, "epoch": 7401} {"train_loss": -28.301111221313477, "global_step": 614350, "epoch": 7401} {"train_loss": -28.124866485595703, "global_step": 614351, "epoch": 7401} {"train_loss": -27.924192428588867, "global_step": 614352, "epoch": 7401} {"train_loss": -28.108911514282227, "global_step": 614353, "epoch": 7401} {"train_loss": -27.97808265686035, "global_step": 614354, "epoch": 7401} {"train_loss": -28.07691764831543, "global_step": 614355, "epoch": 7401} {"train_loss": -28.344091415405273, "global_step": 614356, "epoch": 7401} {"train_loss": -28.374731063842773, "global_step": 614357, "epoch": 7401} {"train_loss": -28.12811279296875, "global_step": 614358, "epoch": 7401} {"train_loss": -28.368986129760742, "global_step": 614359, "epoch": 7401} {"train_loss": -28.372411727905273, "global_step": 614360, "epoch": 7401} {"train_loss": -28.494415283203125, "global_step": 614361, "epoch": 7401} {"train_loss": -27.74017906188965, "global_step": 614362, "epoch": 7401} {"train_loss": -28.0191707611084, "global_step": 614363, "epoch": 7401} {"train_loss": -28.1876277923584, "global_step": 614364, "epoch": 7401} {"train_loss": -27.999993841332124, "global_step": 614365, "epoch": 7401, "val_loss": 6748006.5} {"train_loss": -26.5484676361084, "global_step": 614366, "epoch": 7402} {"train_loss": -26.225446701049805, "global_step": 614367, "epoch": 7402} {"train_loss": -26.563373565673828, "global_step": 614368, "epoch": 7402} {"train_loss": -27.595279693603516, "global_step": 614369, "epoch": 7402} {"train_loss": -26.6309871673584, "global_step": 614370, "epoch": 7402} {"train_loss": -27.185638427734375, "global_step": 614371, "epoch": 7402} {"train_loss": -27.262653350830078, "global_step": 614372, "epoch": 7402} {"train_loss": -26.817859649658203, "global_step": 614373, "epoch": 7402} {"train_loss": -27.196760177612305, "global_step": 614374, "epoch": 7402} {"train_loss": -27.832509994506836, "global_step": 614375, "epoch": 7402} {"train_loss": -27.099273681640625, "global_step": 614376, "epoch": 7402} {"train_loss": -27.6353816986084, "global_step": 614377, "epoch": 7402} {"train_loss": -27.719314575195312, "global_step": 614378, "epoch": 7402} {"train_loss": -27.666051864624023, "global_step": 614379, "epoch": 7402} {"train_loss": -27.389448165893555, "global_step": 614380, "epoch": 7402} {"train_loss": -27.7099609375, "global_step": 614381, "epoch": 7402} {"train_loss": -27.87822914123535, "global_step": 614382, "epoch": 7402} {"train_loss": -27.784912109375, "global_step": 614383, "epoch": 7402} {"train_loss": -27.741403579711914, "global_step": 614384, "epoch": 7402} {"train_loss": -28.07065773010254, "global_step": 614385, "epoch": 7402} {"train_loss": -27.763158798217773, "global_step": 614386, "epoch": 7402} {"train_loss": -27.73097038269043, "global_step": 614387, "epoch": 7402} {"train_loss": -27.86991310119629, "global_step": 614388, "epoch": 7402} {"train_loss": -27.847497940063477, "global_step": 614389, "epoch": 7402} {"train_loss": -27.716501235961914, "global_step": 614390, "epoch": 7402} {"train_loss": -28.158660888671875, "global_step": 614391, "epoch": 7402} {"train_loss": -27.83367919921875, "global_step": 614392, "epoch": 7402} {"train_loss": -27.7403507232666, "global_step": 614393, "epoch": 7402} {"train_loss": -27.959674835205078, "global_step": 614394, "epoch": 7402} {"train_loss": -28.18377685546875, "global_step": 614395, "epoch": 7402} {"train_loss": -28.056629180908203, "global_step": 614396, "epoch": 7402} {"train_loss": -28.12249183654785, "global_step": 614397, "epoch": 7402} {"train_loss": -28.19317054748535, "global_step": 614398, "epoch": 7402} {"train_loss": -28.191858291625977, "global_step": 614399, "epoch": 7402} {"train_loss": -28.128814697265625, "global_step": 614400, "epoch": 7402} {"train_loss": -27.8580265045166, "global_step": 614401, "epoch": 7402} {"train_loss": -28.149267196655273, "global_step": 614402, "epoch": 7402} {"train_loss": -28.182693481445312, "global_step": 614403, "epoch": 7402} {"train_loss": -28.47869300842285, "global_step": 614404, "epoch": 7402} {"train_loss": -28.420852661132812, "global_step": 614405, "epoch": 7402} {"train_loss": -28.295286178588867, "global_step": 614406, "epoch": 7402} {"train_loss": -28.33917236328125, "global_step": 614407, "epoch": 7402} {"train_loss": -28.318099975585938, "global_step": 614408, "epoch": 7402} {"train_loss": -28.56659507751465, "global_step": 614409, "epoch": 7402} {"train_loss": -28.327295303344727, "global_step": 614410, "epoch": 7402} {"train_loss": -28.329761505126953, "global_step": 614411, "epoch": 7402} {"train_loss": -28.088123321533203, "global_step": 614412, "epoch": 7402} {"train_loss": -27.96335792541504, "global_step": 614413, "epoch": 7402} {"train_loss": -28.08159828186035, "global_step": 614414, "epoch": 7402} {"train_loss": -28.20098876953125, "global_step": 614415, "epoch": 7402} {"train_loss": -28.048913955688477, "global_step": 614416, "epoch": 7402} {"train_loss": -28.34051513671875, "global_step": 614417, "epoch": 7402} {"train_loss": -28.04974365234375, "global_step": 614418, "epoch": 7402} {"train_loss": -28.188190460205078, "global_step": 614419, "epoch": 7402} {"train_loss": -28.474918365478516, "global_step": 614420, "epoch": 7402} {"train_loss": -28.355329513549805, "global_step": 614421, "epoch": 7402} {"train_loss": -28.230194091796875, "global_step": 614422, "epoch": 7402} {"train_loss": -28.373279571533203, "global_step": 614423, "epoch": 7402} {"train_loss": -28.62178611755371, "global_step": 614424, "epoch": 7402} {"train_loss": -28.249120712280273, "global_step": 614425, "epoch": 7402} {"train_loss": -28.224863052368164, "global_step": 614426, "epoch": 7402} {"train_loss": -27.544347763061523, "global_step": 614427, "epoch": 7402} {"train_loss": -27.864221572875977, "global_step": 614428, "epoch": 7402} {"train_loss": -27.461429595947266, "global_step": 614429, "epoch": 7402} {"train_loss": -27.647918701171875, "global_step": 614430, "epoch": 7402} {"train_loss": -28.113569259643555, "global_step": 614431, "epoch": 7402} {"train_loss": -28.106603622436523, "global_step": 614432, "epoch": 7402} {"train_loss": -27.854907989501953, "global_step": 614433, "epoch": 7402} {"train_loss": -28.201644897460938, "global_step": 614434, "epoch": 7402} {"train_loss": -28.255573272705078, "global_step": 614435, "epoch": 7402} {"train_loss": -28.092329025268555, "global_step": 614436, "epoch": 7402} {"train_loss": -27.737722396850586, "global_step": 614437, "epoch": 7402} {"train_loss": -27.670801162719727, "global_step": 614438, "epoch": 7402} {"train_loss": -28.18128776550293, "global_step": 614439, "epoch": 7402} {"train_loss": -28.29925537109375, "global_step": 614440, "epoch": 7402} {"train_loss": -28.041662216186523, "global_step": 614441, "epoch": 7402} {"train_loss": -27.927759170532227, "global_step": 614442, "epoch": 7402} {"train_loss": -27.9952392578125, "global_step": 614443, "epoch": 7402} {"train_loss": -27.91993522644043, "global_step": 614444, "epoch": 7402} {"train_loss": -28.268604278564453, "global_step": 614445, "epoch": 7402} {"train_loss": -28.235809326171875, "global_step": 614446, "epoch": 7402} {"train_loss": -27.78670310974121, "global_step": 614447, "epoch": 7402} {"train_loss": -27.91637243707496, "global_step": 614448, "epoch": 7402, "val_loss": 6685962.5} {"train_loss": -27.763885498046875, "global_step": 614449, "epoch": 7403} {"train_loss": -27.785531997680664, "global_step": 614450, "epoch": 7403} {"train_loss": -28.225061416625977, "global_step": 614451, "epoch": 7403} {"train_loss": -28.041040420532227, "global_step": 614452, "epoch": 7403} {"train_loss": -28.08672523498535, "global_step": 614453, "epoch": 7403} {"train_loss": -27.55784034729004, "global_step": 614454, "epoch": 7403} {"train_loss": -28.160131454467773, "global_step": 614455, "epoch": 7403} {"train_loss": -28.160511016845703, "global_step": 614456, "epoch": 7403} {"train_loss": -27.713958740234375, "global_step": 614457, "epoch": 7403} {"train_loss": -27.498804092407227, "global_step": 614458, "epoch": 7403} {"train_loss": -27.883777618408203, "global_step": 614459, "epoch": 7403} {"train_loss": -28.033090591430664, "global_step": 614460, "epoch": 7403} {"train_loss": -27.678503036499023, "global_step": 614461, "epoch": 7403} {"train_loss": -27.881193161010742, "global_step": 614462, "epoch": 7403} {"train_loss": -27.931995391845703, "global_step": 614463, "epoch": 7403} {"train_loss": -27.77467155456543, "global_step": 614464, "epoch": 7403} {"train_loss": -27.796972274780273, "global_step": 614465, "epoch": 7403} {"train_loss": -28.13553237915039, "global_step": 614466, "epoch": 7403} {"train_loss": -27.863422393798828, "global_step": 614467, "epoch": 7403} {"train_loss": -27.890146255493164, "global_step": 614468, "epoch": 7403} {"train_loss": -28.006946563720703, "global_step": 614469, "epoch": 7403} {"train_loss": -27.452238082885742, "global_step": 614470, "epoch": 7403} {"train_loss": -27.55076026916504, "global_step": 614471, "epoch": 7403} {"train_loss": -27.971973419189453, "global_step": 614472, "epoch": 7403} {"train_loss": -27.840925216674805, "global_step": 614473, "epoch": 7403} {"train_loss": -27.80902099609375, "global_step": 614474, "epoch": 7403} {"train_loss": -28.0705509185791, "global_step": 614475, "epoch": 7403} {"train_loss": -28.151411056518555, "global_step": 614476, "epoch": 7403} {"train_loss": -28.177398681640625, "global_step": 614477, "epoch": 7403} {"train_loss": -28.05487632751465, "global_step": 614478, "epoch": 7403} {"train_loss": -28.034347534179688, "global_step": 614479, "epoch": 7403} {"train_loss": -28.292465209960938, "global_step": 614480, "epoch": 7403} {"train_loss": -27.9227294921875, "global_step": 614481, "epoch": 7403} {"train_loss": -28.281042098999023, "global_step": 614482, "epoch": 7403} {"train_loss": -28.18143653869629, "global_step": 614483, "epoch": 7403} {"train_loss": -28.193525314331055, "global_step": 614484, "epoch": 7403} {"train_loss": -28.227039337158203, "global_step": 614485, "epoch": 7403} {"train_loss": -28.171436309814453, "global_step": 614486, "epoch": 7403} {"train_loss": -28.08096694946289, "global_step": 614487, "epoch": 7403} {"train_loss": -28.099164962768555, "global_step": 614488, "epoch": 7403} {"train_loss": -28.270360946655273, "global_step": 614489, "epoch": 7403} {"train_loss": -28.28154945373535, "global_step": 614490, "epoch": 7403} {"train_loss": -28.005273818969727, "global_step": 614491, "epoch": 7403} {"train_loss": -28.192434310913086, "global_step": 614492, "epoch": 7403} {"train_loss": -28.398832321166992, "global_step": 614493, "epoch": 7403} {"train_loss": -28.041980743408203, "global_step": 614494, "epoch": 7403} {"train_loss": -28.19913673400879, "global_step": 614495, "epoch": 7403} {"train_loss": -28.159347534179688, "global_step": 614496, "epoch": 7403} {"train_loss": -28.049753189086914, "global_step": 614497, "epoch": 7403} {"train_loss": -28.320409774780273, "global_step": 614498, "epoch": 7403} {"train_loss": -28.14756202697754, "global_step": 614499, "epoch": 7403} {"train_loss": -28.423608779907227, "global_step": 614500, "epoch": 7403} {"train_loss": -28.150278091430664, "global_step": 614501, "epoch": 7403} {"train_loss": -28.314407348632812, "global_step": 614502, "epoch": 7403} {"train_loss": -28.120925903320312, "global_step": 614503, "epoch": 7403} {"train_loss": -28.006057739257812, "global_step": 614504, "epoch": 7403} {"train_loss": -28.297224044799805, "global_step": 614505, "epoch": 7403} {"train_loss": -27.849720001220703, "global_step": 614506, "epoch": 7403} {"train_loss": -28.175519943237305, "global_step": 614507, "epoch": 7403} {"train_loss": -28.048786163330078, "global_step": 614508, "epoch": 7403} {"train_loss": -28.354360580444336, "global_step": 614509, "epoch": 7403} {"train_loss": -28.34736442565918, "global_step": 614510, "epoch": 7403} {"train_loss": -28.4293270111084, "global_step": 614511, "epoch": 7403} {"train_loss": -28.18829917907715, "global_step": 614512, "epoch": 7403} {"train_loss": -28.3550968170166, "global_step": 614513, "epoch": 7403} {"train_loss": -28.051715850830078, "global_step": 614514, "epoch": 7403} {"train_loss": -28.03913688659668, "global_step": 614515, "epoch": 7403} {"train_loss": -27.808332443237305, "global_step": 614516, "epoch": 7403} {"train_loss": -28.062170028686523, "global_step": 614517, "epoch": 7403} {"train_loss": -28.000234603881836, "global_step": 614518, "epoch": 7403} {"train_loss": -28.35000991821289, "global_step": 614519, "epoch": 7403} {"train_loss": -27.928098678588867, "global_step": 614520, "epoch": 7403} {"train_loss": -27.72371482849121, "global_step": 614521, "epoch": 7403} {"train_loss": -27.870361328125, "global_step": 614522, "epoch": 7403} {"train_loss": -27.916522979736328, "global_step": 614523, "epoch": 7403} {"train_loss": -27.984582901000977, "global_step": 614524, "epoch": 7403} {"train_loss": -28.0126895904541, "global_step": 614525, "epoch": 7403} {"train_loss": -27.391559600830078, "global_step": 614526, "epoch": 7403} {"train_loss": -27.738494873046875, "global_step": 614527, "epoch": 7403} {"train_loss": -27.562530517578125, "global_step": 614528, "epoch": 7403} {"train_loss": -27.845123291015625, "global_step": 614529, "epoch": 7403} {"train_loss": -27.7919921875, "global_step": 614530, "epoch": 7403} {"train_loss": -28.036864912653545, "global_step": 614531, "epoch": 7403, "val_loss": 6688942.0} {"train_loss": -27.036090850830078, "global_step": 614532, "epoch": 7404} {"train_loss": -26.77546501159668, "global_step": 614533, "epoch": 7404} {"train_loss": -26.802209854125977, "global_step": 614534, "epoch": 7404} {"train_loss": -26.935199737548828, "global_step": 614535, "epoch": 7404} {"train_loss": -26.691770553588867, "global_step": 614536, "epoch": 7404} {"train_loss": -26.975116729736328, "global_step": 614537, "epoch": 7404} {"train_loss": -27.02899742126465, "global_step": 614538, "epoch": 7404} {"train_loss": -26.420856475830078, "global_step": 614539, "epoch": 7404} {"train_loss": -27.574132919311523, "global_step": 614540, "epoch": 7404} {"train_loss": -26.463117599487305, "global_step": 614541, "epoch": 7404} {"train_loss": -27.14143943786621, "global_step": 614542, "epoch": 7404} {"train_loss": -27.301252365112305, "global_step": 614543, "epoch": 7404} {"train_loss": -26.93033790588379, "global_step": 614544, "epoch": 7404} {"train_loss": -27.644989013671875, "global_step": 614545, "epoch": 7404} {"train_loss": -27.003767013549805, "global_step": 614546, "epoch": 7404} {"train_loss": -27.50969886779785, "global_step": 614547, "epoch": 7404} {"train_loss": -27.01936149597168, "global_step": 614548, "epoch": 7404} {"train_loss": -27.733808517456055, "global_step": 614549, "epoch": 7404} {"train_loss": -27.791608810424805, "global_step": 614550, "epoch": 7404} {"train_loss": -27.739627838134766, "global_step": 614551, "epoch": 7404} {"train_loss": -27.466848373413086, "global_step": 614552, "epoch": 7404} {"train_loss": -27.42070960998535, "global_step": 614553, "epoch": 7404} {"train_loss": -27.684558868408203, "global_step": 614554, "epoch": 7404} {"train_loss": -27.7831974029541, "global_step": 614555, "epoch": 7404} {"train_loss": -28.021198272705078, "global_step": 614556, "epoch": 7404} {"train_loss": -27.568008422851562, "global_step": 614557, "epoch": 7404} {"train_loss": -28.166654586791992, "global_step": 614558, "epoch": 7404} {"train_loss": -28.01787757873535, "global_step": 614559, "epoch": 7404} {"train_loss": -28.097970962524414, "global_step": 614560, "epoch": 7404} {"train_loss": -28.162572860717773, "global_step": 614561, "epoch": 7404} {"train_loss": -27.91697120666504, "global_step": 614562, "epoch": 7404} {"train_loss": -27.8239688873291, "global_step": 614563, "epoch": 7404} {"train_loss": -27.945632934570312, "global_step": 614564, "epoch": 7404} {"train_loss": -28.067895889282227, "global_step": 614565, "epoch": 7404} {"train_loss": -27.92254638671875, "global_step": 614566, "epoch": 7404} {"train_loss": -27.992156982421875, "global_step": 614567, "epoch": 7404} {"train_loss": -28.384506225585938, "global_step": 614568, "epoch": 7404} {"train_loss": -27.699975967407227, "global_step": 614569, "epoch": 7404} {"train_loss": -28.271997451782227, "global_step": 614570, "epoch": 7404} {"train_loss": -27.941726684570312, "global_step": 614571, "epoch": 7404} {"train_loss": -28.479248046875, "global_step": 614572, "epoch": 7404} {"train_loss": -28.690088272094727, "global_step": 614573, "epoch": 7404} {"train_loss": -27.902801513671875, "global_step": 614574, "epoch": 7404} {"train_loss": -28.400854110717773, "global_step": 614575, "epoch": 7404} {"train_loss": -28.01028823852539, "global_step": 614576, "epoch": 7404} {"train_loss": -27.991912841796875, "global_step": 614577, "epoch": 7404} {"train_loss": -28.121606826782227, "global_step": 614578, "epoch": 7404} {"train_loss": -28.25674819946289, "global_step": 614579, "epoch": 7404} {"train_loss": -28.305694580078125, "global_step": 614580, "epoch": 7404} {"train_loss": -28.404590606689453, "global_step": 614581, "epoch": 7404} {"train_loss": -28.43085289001465, "global_step": 614582, "epoch": 7404} {"train_loss": -28.225988388061523, "global_step": 614583, "epoch": 7404} {"train_loss": -28.417234420776367, "global_step": 614584, "epoch": 7404} {"train_loss": -28.19873046875, "global_step": 614585, "epoch": 7404} {"train_loss": -28.571533203125, "global_step": 614586, "epoch": 7404} {"train_loss": -28.260068893432617, "global_step": 614587, "epoch": 7404} {"train_loss": -28.314041137695312, "global_step": 614588, "epoch": 7404} {"train_loss": -28.283599853515625, "global_step": 614589, "epoch": 7404} {"train_loss": -28.423078536987305, "global_step": 614590, "epoch": 7404} {"train_loss": -28.28525161743164, "global_step": 614591, "epoch": 7404} {"train_loss": -28.1740665435791, "global_step": 614592, "epoch": 7404} {"train_loss": -28.343048095703125, "global_step": 614593, "epoch": 7404} {"train_loss": -28.066253662109375, "global_step": 614594, "epoch": 7404} {"train_loss": -28.103891372680664, "global_step": 614595, "epoch": 7404} {"train_loss": -27.704181671142578, "global_step": 614596, "epoch": 7404} {"train_loss": -27.90083122253418, "global_step": 614597, "epoch": 7404} {"train_loss": -27.972543716430664, "global_step": 614598, "epoch": 7404} {"train_loss": -27.636962890625, "global_step": 614599, "epoch": 7404} {"train_loss": -27.98456382751465, "global_step": 614600, "epoch": 7404} {"train_loss": -28.045124053955078, "global_step": 614601, "epoch": 7404} {"train_loss": -28.32085609436035, "global_step": 614602, "epoch": 7404} {"train_loss": -28.100996017456055, "global_step": 614603, "epoch": 7404} {"train_loss": -28.354284286499023, "global_step": 614604, "epoch": 7404} {"train_loss": -27.999509811401367, "global_step": 614605, "epoch": 7404} {"train_loss": -28.11262321472168, "global_step": 614606, "epoch": 7404} {"train_loss": -28.112964630126953, "global_step": 614607, "epoch": 7404} {"train_loss": -28.37338638305664, "global_step": 614608, "epoch": 7404} {"train_loss": -27.921125411987305, "global_step": 614609, "epoch": 7404} {"train_loss": -28.304031372070312, "global_step": 614610, "epoch": 7404} {"train_loss": -27.7851505279541, "global_step": 614611, "epoch": 7404} {"train_loss": -28.454395294189453, "global_step": 614612, "epoch": 7404} {"train_loss": -28.002735137939453, "global_step": 614613, "epoch": 7404} {"train_loss": -27.8635975941118, "global_step": 614614, "epoch": 7404, "val_loss": 6707144.5} {"train_loss": -27.919525146484375, "global_step": 614615, "epoch": 7405} {"train_loss": -27.96817970275879, "global_step": 614616, "epoch": 7405} {"train_loss": -28.283161163330078, "global_step": 614617, "epoch": 7405} {"train_loss": -27.54884147644043, "global_step": 614618, "epoch": 7405} {"train_loss": -27.918996810913086, "global_step": 614619, "epoch": 7405} {"train_loss": -27.77837562561035, "global_step": 614620, "epoch": 7405} {"train_loss": -28.366453170776367, "global_step": 614621, "epoch": 7405} {"train_loss": -28.026031494140625, "global_step": 614622, "epoch": 7405} {"train_loss": -28.226125717163086, "global_step": 614623, "epoch": 7405} {"train_loss": -27.79218864440918, "global_step": 614624, "epoch": 7405} {"train_loss": -27.993030548095703, "global_step": 614625, "epoch": 7405} {"train_loss": -28.281787872314453, "global_step": 614626, "epoch": 7405} {"train_loss": -27.881717681884766, "global_step": 614627, "epoch": 7405} {"train_loss": -28.447479248046875, "global_step": 614628, "epoch": 7405} {"train_loss": -28.012516021728516, "global_step": 614629, "epoch": 7405} {"train_loss": -28.131940841674805, "global_step": 614630, "epoch": 7405} {"train_loss": -27.967626571655273, "global_step": 614631, "epoch": 7405} {"train_loss": -28.137357711791992, "global_step": 614632, "epoch": 7405} {"train_loss": -28.107526779174805, "global_step": 614633, "epoch": 7405} {"train_loss": -28.12249183654785, "global_step": 614634, "epoch": 7405} {"train_loss": -27.90630531311035, "global_step": 614635, "epoch": 7405} {"train_loss": -28.022567749023438, "global_step": 614636, "epoch": 7405} {"train_loss": -27.967954635620117, "global_step": 614637, "epoch": 7405} {"train_loss": -28.080907821655273, "global_step": 614638, "epoch": 7405} {"train_loss": -28.454328536987305, "global_step": 614639, "epoch": 7405} {"train_loss": -28.47065544128418, "global_step": 614640, "epoch": 7405} {"train_loss": -28.08722496032715, "global_step": 614641, "epoch": 7405} {"train_loss": -28.395343780517578, "global_step": 614642, "epoch": 7405} {"train_loss": -27.656538009643555, "global_step": 614643, "epoch": 7405} {"train_loss": -27.91316032409668, "global_step": 614644, "epoch": 7405} {"train_loss": -28.37635612487793, "global_step": 614645, "epoch": 7405} {"train_loss": -27.869232177734375, "global_step": 614646, "epoch": 7405} {"train_loss": -27.571943283081055, "global_step": 614647, "epoch": 7405} {"train_loss": -27.8268985748291, "global_step": 614648, "epoch": 7405} {"train_loss": -27.990036010742188, "global_step": 614649, "epoch": 7405} {"train_loss": -28.1800479888916, "global_step": 614650, "epoch": 7405} {"train_loss": -28.203466415405273, "global_step": 614651, "epoch": 7405} {"train_loss": -28.153318405151367, "global_step": 614652, "epoch": 7405} {"train_loss": -28.048322677612305, "global_step": 614653, "epoch": 7405} {"train_loss": -28.096099853515625, "global_step": 614654, "epoch": 7405} {"train_loss": -28.214818954467773, "global_step": 614655, "epoch": 7405} {"train_loss": -28.131250381469727, "global_step": 614656, "epoch": 7405} {"train_loss": -27.864484786987305, "global_step": 614657, "epoch": 7405} {"train_loss": -28.123111724853516, "global_step": 614658, "epoch": 7405} {"train_loss": -28.368122100830078, "global_step": 614659, "epoch": 7405} {"train_loss": -28.287952423095703, "global_step": 614660, "epoch": 7405} {"train_loss": -28.2059326171875, "global_step": 614661, "epoch": 7405} {"train_loss": -28.223608016967773, "global_step": 614662, "epoch": 7405} {"train_loss": -28.258188247680664, "global_step": 614663, "epoch": 7405} {"train_loss": -27.877994537353516, "global_step": 614664, "epoch": 7405} {"train_loss": -28.2828369140625, "global_step": 614665, "epoch": 7405} {"train_loss": -28.07838249206543, "global_step": 614666, "epoch": 7405} {"train_loss": -28.34737205505371, "global_step": 614667, "epoch": 7405} {"train_loss": -27.91756248474121, "global_step": 614668, "epoch": 7405} {"train_loss": -28.09408950805664, "global_step": 614669, "epoch": 7405} {"train_loss": -27.998437881469727, "global_step": 614670, "epoch": 7405} {"train_loss": -27.670461654663086, "global_step": 614671, "epoch": 7405} {"train_loss": -27.973615646362305, "global_step": 614672, "epoch": 7405} {"train_loss": -28.086627960205078, "global_step": 614673, "epoch": 7405} {"train_loss": -27.950881958007812, "global_step": 614674, "epoch": 7405} {"train_loss": -27.95502281188965, "global_step": 614675, "epoch": 7405} {"train_loss": -27.677326202392578, "global_step": 614676, "epoch": 7405} {"train_loss": -27.860559463500977, "global_step": 614677, "epoch": 7405} {"train_loss": -28.304845809936523, "global_step": 614678, "epoch": 7405} {"train_loss": -27.9443359375, "global_step": 614679, "epoch": 7405} {"train_loss": -27.934967041015625, "global_step": 614680, "epoch": 7405} {"train_loss": -28.01047706604004, "global_step": 614681, "epoch": 7405} {"train_loss": -27.951690673828125, "global_step": 614682, "epoch": 7405} {"train_loss": -27.949893951416016, "global_step": 614683, "epoch": 7405} {"train_loss": -28.08733558654785, "global_step": 614684, "epoch": 7405} {"train_loss": -28.027240753173828, "global_step": 614685, "epoch": 7405} {"train_loss": -28.47932243347168, "global_step": 614686, "epoch": 7405} {"train_loss": -28.311872482299805, "global_step": 614687, "epoch": 7405} {"train_loss": -27.973358154296875, "global_step": 614688, "epoch": 7405} {"train_loss": -27.934118270874023, "global_step": 614689, "epoch": 7405} {"train_loss": -28.3150634765625, "global_step": 614690, "epoch": 7405} {"train_loss": -28.358295440673828, "global_step": 614691, "epoch": 7405} {"train_loss": -28.353464126586914, "global_step": 614692, "epoch": 7405} {"train_loss": -28.39108657836914, "global_step": 614693, "epoch": 7405} {"train_loss": -27.987939834594727, "global_step": 614694, "epoch": 7405} {"train_loss": -27.930768966674805, "global_step": 614695, "epoch": 7405} {"train_loss": -28.392547607421875, "global_step": 614696, "epoch": 7405} {"train_loss": -28.094102353934783, "global_step": 614697, "epoch": 7405, "val_loss": 6735767.0} {"train_loss": -28.229307174682617, "global_step": 614698, "epoch": 7406} {"train_loss": -27.9423885345459, "global_step": 614699, "epoch": 7406} {"train_loss": -27.98797607421875, "global_step": 614700, "epoch": 7406} {"train_loss": -27.483078002929688, "global_step": 614701, "epoch": 7406} {"train_loss": -27.508817672729492, "global_step": 614702, "epoch": 7406} {"train_loss": -28.110937118530273, "global_step": 614703, "epoch": 7406} {"train_loss": -27.390356063842773, "global_step": 614704, "epoch": 7406} {"train_loss": -27.638586044311523, "global_step": 614705, "epoch": 7406} {"train_loss": -27.907888412475586, "global_step": 614706, "epoch": 7406} {"train_loss": -27.90778923034668, "global_step": 614707, "epoch": 7406} {"train_loss": -27.834095001220703, "global_step": 614708, "epoch": 7406} {"train_loss": -28.15473747253418, "global_step": 614709, "epoch": 7406} {"train_loss": -27.555011749267578, "global_step": 614710, "epoch": 7406} {"train_loss": -27.982145309448242, "global_step": 614711, "epoch": 7406} {"train_loss": -27.883031845092773, "global_step": 614712, "epoch": 7406} {"train_loss": -27.600341796875, "global_step": 614713, "epoch": 7406} {"train_loss": -28.18121910095215, "global_step": 614714, "epoch": 7406} {"train_loss": -27.87251091003418, "global_step": 614715, "epoch": 7406} {"train_loss": -27.5708065032959, "global_step": 614716, "epoch": 7406} {"train_loss": -27.545913696289062, "global_step": 614717, "epoch": 7406} {"train_loss": -28.329862594604492, "global_step": 614718, "epoch": 7406} {"train_loss": -27.817968368530273, "global_step": 614719, "epoch": 7406} {"train_loss": -28.05438232421875, "global_step": 614720, "epoch": 7406} {"train_loss": -27.911359786987305, "global_step": 614721, "epoch": 7406} {"train_loss": -27.936613082885742, "global_step": 614722, "epoch": 7406} {"train_loss": -28.009885787963867, "global_step": 614723, "epoch": 7406} {"train_loss": -28.129003524780273, "global_step": 614724, "epoch": 7406} {"train_loss": -27.731779098510742, "global_step": 614725, "epoch": 7406} {"train_loss": -28.27149772644043, "global_step": 614726, "epoch": 7406} {"train_loss": -27.66318130493164, "global_step": 614727, "epoch": 7406} {"train_loss": -28.199615478515625, "global_step": 614728, "epoch": 7406} {"train_loss": -28.287214279174805, "global_step": 614729, "epoch": 7406} {"train_loss": -28.20488929748535, "global_step": 614730, "epoch": 7406} {"train_loss": -28.078693389892578, "global_step": 614731, "epoch": 7406} {"train_loss": -27.847700119018555, "global_step": 614732, "epoch": 7406} {"train_loss": -28.216894149780273, "global_step": 614733, "epoch": 7406} {"train_loss": -27.890064239501953, "global_step": 614734, "epoch": 7406} {"train_loss": -28.442670822143555, "global_step": 614735, "epoch": 7406} {"train_loss": -28.26171875, "global_step": 614736, "epoch": 7406} {"train_loss": -28.4570369720459, "global_step": 614737, "epoch": 7406} {"train_loss": -28.619403839111328, "global_step": 614738, "epoch": 7406} {"train_loss": -28.35780143737793, "global_step": 614739, "epoch": 7406} {"train_loss": -27.979663848876953, "global_step": 614740, "epoch": 7406} {"train_loss": -27.8640079498291, "global_step": 614741, "epoch": 7406} {"train_loss": -28.16517448425293, "global_step": 614742, "epoch": 7406} {"train_loss": -28.114551544189453, "global_step": 614743, "epoch": 7406} {"train_loss": -28.574277877807617, "global_step": 614744, "epoch": 7406} {"train_loss": -28.2440185546875, "global_step": 614745, "epoch": 7406} {"train_loss": -28.416086196899414, "global_step": 614746, "epoch": 7406} {"train_loss": -28.5454044342041, "global_step": 614747, "epoch": 7406} {"train_loss": -27.916706085205078, "global_step": 614748, "epoch": 7406} {"train_loss": -28.13627052307129, "global_step": 614749, "epoch": 7406} {"train_loss": -28.2487735748291, "global_step": 614750, "epoch": 7406} {"train_loss": -28.1879825592041, "global_step": 614751, "epoch": 7406} {"train_loss": -28.035877227783203, "global_step": 614752, "epoch": 7406} {"train_loss": -28.29170799255371, "global_step": 614753, "epoch": 7406} {"train_loss": -28.576013565063477, "global_step": 614754, "epoch": 7406} {"train_loss": -28.58893394470215, "global_step": 614755, "epoch": 7406} {"train_loss": -28.127246856689453, "global_step": 614756, "epoch": 7406} {"train_loss": -28.3543643951416, "global_step": 614757, "epoch": 7406} {"train_loss": -28.37721061706543, "global_step": 614758, "epoch": 7406} {"train_loss": -28.202381134033203, "global_step": 614759, "epoch": 7406} {"train_loss": -28.350568771362305, "global_step": 614760, "epoch": 7406} {"train_loss": -28.454858779907227, "global_step": 614761, "epoch": 7406} {"train_loss": -28.242767333984375, "global_step": 614762, "epoch": 7406} {"train_loss": -28.027856826782227, "global_step": 614763, "epoch": 7406} {"train_loss": -28.46854591369629, "global_step": 614764, "epoch": 7406} {"train_loss": -28.07527732849121, "global_step": 614765, "epoch": 7406} {"train_loss": -28.23674964904785, "global_step": 614766, "epoch": 7406} {"train_loss": -28.12497329711914, "global_step": 614767, "epoch": 7406} {"train_loss": -27.977508544921875, "global_step": 614768, "epoch": 7406} {"train_loss": -27.991641998291016, "global_step": 614769, "epoch": 7406} {"train_loss": -27.714208602905273, "global_step": 614770, "epoch": 7406} {"train_loss": -28.098987579345703, "global_step": 614771, "epoch": 7406} {"train_loss": -27.876602172851562, "global_step": 614772, "epoch": 7406} {"train_loss": -27.703388214111328, "global_step": 614773, "epoch": 7406} {"train_loss": -27.778833389282227, "global_step": 614774, "epoch": 7406} {"train_loss": -28.117420196533203, "global_step": 614775, "epoch": 7406} {"train_loss": -27.940277099609375, "global_step": 614776, "epoch": 7406} {"train_loss": -27.305404663085938, "global_step": 614777, "epoch": 7406} {"train_loss": -27.697296142578125, "global_step": 614778, "epoch": 7406} {"train_loss": -28.378793716430664, "global_step": 614779, "epoch": 7406} {"train_loss": -28.043083834360882, "global_step": 614780, "epoch": 7406, "val_loss": 6646740.0} {"train_loss": -27.468475341796875, "global_step": 614781, "epoch": 7407} {"train_loss": -26.14176368713379, "global_step": 614782, "epoch": 7407} {"train_loss": -25.806781768798828, "global_step": 614783, "epoch": 7407} {"train_loss": -26.577970504760742, "global_step": 614784, "epoch": 7407} {"train_loss": -26.51190185546875, "global_step": 614785, "epoch": 7407} {"train_loss": -26.679828643798828, "global_step": 614786, "epoch": 7407} {"train_loss": -26.973447799682617, "global_step": 614787, "epoch": 7407} {"train_loss": -27.026824951171875, "global_step": 614788, "epoch": 7407} {"train_loss": -27.3812313079834, "global_step": 614789, "epoch": 7407} {"train_loss": -27.086877822875977, "global_step": 614790, "epoch": 7407} {"train_loss": -27.34688377380371, "global_step": 614791, "epoch": 7407} {"train_loss": -27.373205184936523, "global_step": 614792, "epoch": 7407} {"train_loss": -27.453857421875, "global_step": 614793, "epoch": 7407} {"train_loss": -27.310546875, "global_step": 614794, "epoch": 7407} {"train_loss": -27.342376708984375, "global_step": 614795, "epoch": 7407} {"train_loss": -27.444931030273438, "global_step": 614796, "epoch": 7407} {"train_loss": -27.48369789123535, "global_step": 614797, "epoch": 7407} {"train_loss": -27.7733211517334, "global_step": 614798, "epoch": 7407} {"train_loss": -27.597753524780273, "global_step": 614799, "epoch": 7407} {"train_loss": -27.563318252563477, "global_step": 614800, "epoch": 7407} {"train_loss": -27.688581466674805, "global_step": 614801, "epoch": 7407} {"train_loss": -27.540929794311523, "global_step": 614802, "epoch": 7407} {"train_loss": -27.666522979736328, "global_step": 614803, "epoch": 7407} {"train_loss": -27.927356719970703, "global_step": 614804, "epoch": 7407} {"train_loss": -28.088275909423828, "global_step": 614805, "epoch": 7407} {"train_loss": -28.158559799194336, "global_step": 614806, "epoch": 7407} {"train_loss": -27.999704360961914, "global_step": 614807, "epoch": 7407} {"train_loss": -27.936094284057617, "global_step": 614808, "epoch": 7407} {"train_loss": -27.687671661376953, "global_step": 614809, "epoch": 7407} {"train_loss": -27.880407333374023, "global_step": 614810, "epoch": 7407} {"train_loss": -27.718311309814453, "global_step": 614811, "epoch": 7407} {"train_loss": -27.744653701782227, "global_step": 614812, "epoch": 7407} {"train_loss": -27.63868522644043, "global_step": 614813, "epoch": 7407} {"train_loss": -28.021066665649414, "global_step": 614814, "epoch": 7407} {"train_loss": -27.922407150268555, "global_step": 614815, "epoch": 7407} {"train_loss": -27.808252334594727, "global_step": 614816, "epoch": 7407} {"train_loss": -27.99798583984375, "global_step": 614817, "epoch": 7407} {"train_loss": -28.027023315429688, "global_step": 614818, "epoch": 7407} {"train_loss": -28.063825607299805, "global_step": 614819, "epoch": 7407} {"train_loss": -28.31134033203125, "global_step": 614820, "epoch": 7407} {"train_loss": -28.02054786682129, "global_step": 614821, "epoch": 7407} {"train_loss": -28.012537002563477, "global_step": 614822, "epoch": 7407} {"train_loss": -28.29243278503418, "global_step": 614823, "epoch": 7407} {"train_loss": -28.331750869750977, "global_step": 614824, "epoch": 7407} {"train_loss": -28.41403579711914, "global_step": 614825, "epoch": 7407} {"train_loss": -28.14404296875, "global_step": 614826, "epoch": 7407} {"train_loss": -28.122970581054688, "global_step": 614827, "epoch": 7407} {"train_loss": -28.328332901000977, "global_step": 614828, "epoch": 7407} {"train_loss": -28.230350494384766, "global_step": 614829, "epoch": 7407} {"train_loss": -28.12831687927246, "global_step": 614830, "epoch": 7407} {"train_loss": -28.1942081451416, "global_step": 614831, "epoch": 7407} {"train_loss": -28.3516845703125, "global_step": 614832, "epoch": 7407} {"train_loss": -28.293212890625, "global_step": 614833, "epoch": 7407} {"train_loss": -28.504179000854492, "global_step": 614834, "epoch": 7407} {"train_loss": -28.48004150390625, "global_step": 614835, "epoch": 7407} {"train_loss": -28.052112579345703, "global_step": 614836, "epoch": 7407} {"train_loss": -28.286392211914062, "global_step": 614837, "epoch": 7407} {"train_loss": -28.280353546142578, "global_step": 614838, "epoch": 7407} {"train_loss": -28.3527774810791, "global_step": 614839, "epoch": 7407} {"train_loss": -28.424264907836914, "global_step": 614840, "epoch": 7407} {"train_loss": -28.386030197143555, "global_step": 614841, "epoch": 7407} {"train_loss": -28.151647567749023, "global_step": 614842, "epoch": 7407} {"train_loss": -28.030027389526367, "global_step": 614843, "epoch": 7407} {"train_loss": -28.350976943969727, "global_step": 614844, "epoch": 7407} {"train_loss": -28.287281036376953, "global_step": 614845, "epoch": 7407} {"train_loss": -27.94476318359375, "global_step": 614846, "epoch": 7407} {"train_loss": -28.0977783203125, "global_step": 614847, "epoch": 7407} {"train_loss": -27.996356964111328, "global_step": 614848, "epoch": 7407} {"train_loss": -27.8006591796875, "global_step": 614849, "epoch": 7407} {"train_loss": -28.278766632080078, "global_step": 614850, "epoch": 7407} {"train_loss": -28.480234146118164, "global_step": 614851, "epoch": 7407} {"train_loss": -28.437597274780273, "global_step": 614852, "epoch": 7407} {"train_loss": -27.753650665283203, "global_step": 614853, "epoch": 7407} {"train_loss": -28.48309326171875, "global_step": 614854, "epoch": 7407} {"train_loss": -28.33807945251465, "global_step": 614855, "epoch": 7407} {"train_loss": -28.201452255249023, "global_step": 614856, "epoch": 7407} {"train_loss": -28.23953628540039, "global_step": 614857, "epoch": 7407} {"train_loss": -28.411123275756836, "global_step": 614858, "epoch": 7407} {"train_loss": -28.521982192993164, "global_step": 614859, "epoch": 7407} {"train_loss": -28.00136375427246, "global_step": 614860, "epoch": 7407} {"train_loss": -28.380691528320312, "global_step": 614861, "epoch": 7407} {"train_loss": -28.716455459594727, "global_step": 614862, "epoch": 7407} {"train_loss": -27.90656393120088, "global_step": 614863, "epoch": 7407, "val_loss": 6673592.5} {"train_loss": -25.625349044799805, "global_step": 614864, "epoch": 7408} {"train_loss": -25.877843856811523, "global_step": 614865, "epoch": 7408} {"train_loss": -25.88568115234375, "global_step": 614866, "epoch": 7408} {"train_loss": -25.6293888092041, "global_step": 614867, "epoch": 7408} {"train_loss": -26.187488555908203, "global_step": 614868, "epoch": 7408} {"train_loss": -27.03781509399414, "global_step": 614869, "epoch": 7408} {"train_loss": -27.120655059814453, "global_step": 614870, "epoch": 7408} {"train_loss": -26.79523277282715, "global_step": 614871, "epoch": 7408} {"train_loss": -27.400238037109375, "global_step": 614872, "epoch": 7408} {"train_loss": -27.31922721862793, "global_step": 614873, "epoch": 7408} {"train_loss": -27.438337326049805, "global_step": 614874, "epoch": 7408} {"train_loss": -27.191503524780273, "global_step": 614875, "epoch": 7408} {"train_loss": -27.310632705688477, "global_step": 614876, "epoch": 7408} {"train_loss": -27.750614166259766, "global_step": 614877, "epoch": 7408} {"train_loss": -27.555957794189453, "global_step": 614878, "epoch": 7408} {"train_loss": -27.536848068237305, "global_step": 614879, "epoch": 7408} {"train_loss": -27.46720314025879, "global_step": 614880, "epoch": 7408} {"train_loss": -27.672840118408203, "global_step": 614881, "epoch": 7408} {"train_loss": -27.424591064453125, "global_step": 614882, "epoch": 7408} {"train_loss": -27.920978546142578, "global_step": 614883, "epoch": 7408} {"train_loss": -27.6207332611084, "global_step": 614884, "epoch": 7408} {"train_loss": -27.560047149658203, "global_step": 614885, "epoch": 7408} {"train_loss": -27.68159294128418, "global_step": 614886, "epoch": 7408} {"train_loss": -27.725940704345703, "global_step": 614887, "epoch": 7408} {"train_loss": -27.909927368164062, "global_step": 614888, "epoch": 7408} {"train_loss": -27.722126007080078, "global_step": 614889, "epoch": 7408} {"train_loss": -28.048583984375, "global_step": 614890, "epoch": 7408} {"train_loss": -27.769147872924805, "global_step": 614891, "epoch": 7408} {"train_loss": -28.021224975585938, "global_step": 614892, "epoch": 7408} {"train_loss": -27.99895668029785, "global_step": 614893, "epoch": 7408} {"train_loss": -27.992019653320312, "global_step": 614894, "epoch": 7408} {"train_loss": -28.158422470092773, "global_step": 614895, "epoch": 7408} {"train_loss": -27.616378784179688, "global_step": 614896, "epoch": 7408} {"train_loss": -28.292688369750977, "global_step": 614897, "epoch": 7408} {"train_loss": -28.054121017456055, "global_step": 614898, "epoch": 7408} {"train_loss": -28.026098251342773, "global_step": 614899, "epoch": 7408} {"train_loss": -27.82741355895996, "global_step": 614900, "epoch": 7408} {"train_loss": -28.17110252380371, "global_step": 614901, "epoch": 7408} {"train_loss": -28.03369140625, "global_step": 614902, "epoch": 7408} {"train_loss": -28.2917537689209, "global_step": 614903, "epoch": 7408} {"train_loss": -27.893115997314453, "global_step": 614904, "epoch": 7408} {"train_loss": -28.221410751342773, "global_step": 614905, "epoch": 7408} {"train_loss": -28.419050216674805, "global_step": 614906, "epoch": 7408} {"train_loss": -28.275541305541992, "global_step": 614907, "epoch": 7408} {"train_loss": -28.129901885986328, "global_step": 614908, "epoch": 7408} {"train_loss": -27.986499786376953, "global_step": 614909, "epoch": 7408} {"train_loss": -28.1252384185791, "global_step": 614910, "epoch": 7408} {"train_loss": -28.050199508666992, "global_step": 614911, "epoch": 7408} {"train_loss": -28.468603134155273, "global_step": 614912, "epoch": 7408} {"train_loss": -28.1644344329834, "global_step": 614913, "epoch": 7408} {"train_loss": -28.258838653564453, "global_step": 614914, "epoch": 7408} {"train_loss": -28.46604347229004, "global_step": 614915, "epoch": 7408} {"train_loss": -28.57232666015625, "global_step": 614916, "epoch": 7408} {"train_loss": -28.2545166015625, "global_step": 614917, "epoch": 7408} {"train_loss": -28.145130157470703, "global_step": 614918, "epoch": 7408} {"train_loss": -28.329626083374023, "global_step": 614919, "epoch": 7408} {"train_loss": -28.256256103515625, "global_step": 614920, "epoch": 7408} {"train_loss": -28.285083770751953, "global_step": 614921, "epoch": 7408} {"train_loss": -28.480945587158203, "global_step": 614922, "epoch": 7408} {"train_loss": -28.460376739501953, "global_step": 614923, "epoch": 7408} {"train_loss": -28.188629150390625, "global_step": 614924, "epoch": 7408} {"train_loss": -28.287900924682617, "global_step": 614925, "epoch": 7408} {"train_loss": -28.251291275024414, "global_step": 614926, "epoch": 7408} {"train_loss": -28.34499168395996, "global_step": 614927, "epoch": 7408} {"train_loss": -28.287134170532227, "global_step": 614928, "epoch": 7408} {"train_loss": -28.222497940063477, "global_step": 614929, "epoch": 7408} {"train_loss": -28.25514793395996, "global_step": 614930, "epoch": 7408} {"train_loss": -27.533212661743164, "global_step": 614931, "epoch": 7408} {"train_loss": -26.993268966674805, "global_step": 614932, "epoch": 7408} {"train_loss": -27.367849349975586, "global_step": 614933, "epoch": 7408} {"train_loss": -28.12892723083496, "global_step": 614934, "epoch": 7408} {"train_loss": -27.94868278503418, "global_step": 614935, "epoch": 7408} {"train_loss": -27.851545333862305, "global_step": 614936, "epoch": 7408} {"train_loss": -28.17835807800293, "global_step": 614937, "epoch": 7408} {"train_loss": -28.02837562561035, "global_step": 614938, "epoch": 7408} {"train_loss": -28.245161056518555, "global_step": 614939, "epoch": 7408} {"train_loss": -27.756406784057617, "global_step": 614940, "epoch": 7408} {"train_loss": -28.064367294311523, "global_step": 614941, "epoch": 7408} {"train_loss": -27.878204345703125, "global_step": 614942, "epoch": 7408} {"train_loss": -27.947935104370117, "global_step": 614943, "epoch": 7408} {"train_loss": -28.0661678314209, "global_step": 614944, "epoch": 7408} {"train_loss": -27.982995986938477, "global_step": 614945, "epoch": 7408} {"train_loss": -27.80841620571642, "global_step": 614946, "epoch": 7408, "val_loss": 6633691.0} {"train_loss": -27.379993438720703, "global_step": 614947, "epoch": 7409} {"train_loss": -27.716140747070312, "global_step": 614948, "epoch": 7409} {"train_loss": -27.518783569335938, "global_step": 614949, "epoch": 7409} {"train_loss": -27.435556411743164, "global_step": 614950, "epoch": 7409} {"train_loss": -28.137067794799805, "global_step": 614951, "epoch": 7409} {"train_loss": -27.147428512573242, "global_step": 614952, "epoch": 7409} {"train_loss": -27.335651397705078, "global_step": 614953, "epoch": 7409} {"train_loss": -26.221729278564453, "global_step": 614954, "epoch": 7409} {"train_loss": -27.226409912109375, "global_step": 614955, "epoch": 7409} {"train_loss": -27.7045841217041, "global_step": 614956, "epoch": 7409} {"train_loss": -27.539533615112305, "global_step": 614957, "epoch": 7409} {"train_loss": -27.45526695251465, "global_step": 614958, "epoch": 7409} {"train_loss": -27.64496421813965, "global_step": 614959, "epoch": 7409} {"train_loss": -27.61948585510254, "global_step": 614960, "epoch": 7409} {"train_loss": -27.90764808654785, "global_step": 614961, "epoch": 7409} {"train_loss": -27.726730346679688, "global_step": 614962, "epoch": 7409} {"train_loss": -27.56903648376465, "global_step": 614963, "epoch": 7409} {"train_loss": -27.776220321655273, "global_step": 614964, "epoch": 7409} {"train_loss": -28.290796279907227, "global_step": 614965, "epoch": 7409} {"train_loss": -27.880491256713867, "global_step": 614966, "epoch": 7409} {"train_loss": -28.290647506713867, "global_step": 614967, "epoch": 7409} {"train_loss": -27.869638442993164, "global_step": 614968, "epoch": 7409} {"train_loss": -28.231964111328125, "global_step": 614969, "epoch": 7409} {"train_loss": -27.858173370361328, "global_step": 614970, "epoch": 7409} {"train_loss": -27.910810470581055, "global_step": 614971, "epoch": 7409} {"train_loss": -28.176767349243164, "global_step": 614972, "epoch": 7409} {"train_loss": -27.8413028717041, "global_step": 614973, "epoch": 7409} {"train_loss": -28.374393463134766, "global_step": 614974, "epoch": 7409} {"train_loss": -28.0833683013916, "global_step": 614975, "epoch": 7409} {"train_loss": -28.178701400756836, "global_step": 614976, "epoch": 7409} {"train_loss": -28.254343032836914, "global_step": 614977, "epoch": 7409} {"train_loss": -28.13018798828125, "global_step": 614978, "epoch": 7409} {"train_loss": -27.9985294342041, "global_step": 614979, "epoch": 7409} {"train_loss": -28.270917892456055, "global_step": 614980, "epoch": 7409} {"train_loss": -28.442108154296875, "global_step": 614981, "epoch": 7409} {"train_loss": -27.812061309814453, "global_step": 614982, "epoch": 7409} {"train_loss": -28.42661476135254, "global_step": 614983, "epoch": 7409} {"train_loss": -28.270191192626953, "global_step": 614984, "epoch": 7409} {"train_loss": -28.502721786499023, "global_step": 614985, "epoch": 7409} {"train_loss": -28.69548988342285, "global_step": 614986, "epoch": 7409} {"train_loss": -28.39790153503418, "global_step": 614987, "epoch": 7409} {"train_loss": -28.329710006713867, "global_step": 614988, "epoch": 7409} {"train_loss": -28.428192138671875, "global_step": 614989, "epoch": 7409} {"train_loss": -28.28580665588379, "global_step": 614990, "epoch": 7409} {"train_loss": -28.564878463745117, "global_step": 614991, "epoch": 7409} {"train_loss": -28.14594841003418, "global_step": 614992, "epoch": 7409} {"train_loss": -28.374664306640625, "global_step": 614993, "epoch": 7409} {"train_loss": -28.44952964782715, "global_step": 614994, "epoch": 7409} {"train_loss": -28.02130699157715, "global_step": 614995, "epoch": 7409} {"train_loss": -28.1809024810791, "global_step": 614996, "epoch": 7409} {"train_loss": -28.16090202331543, "global_step": 614997, "epoch": 7409} {"train_loss": -28.33432960510254, "global_step": 614998, "epoch": 7409} {"train_loss": -28.16216468811035, "global_step": 614999, "epoch": 7409} {"train_loss": -28.030988693237305, "global_step": 615000, "epoch": 7409} {"train_loss": -28.12904167175293, "global_step": 615001, "epoch": 7409} {"train_loss": -28.187271118164062, "global_step": 615002, "epoch": 7409} {"train_loss": -28.526031494140625, "global_step": 615003, "epoch": 7409} {"train_loss": -28.47791862487793, "global_step": 615004, "epoch": 7409} {"train_loss": -28.17953872680664, "global_step": 615005, "epoch": 7409} {"train_loss": -28.306079864501953, "global_step": 615006, "epoch": 7409} {"train_loss": -28.504444122314453, "global_step": 615007, "epoch": 7409} {"train_loss": -28.516843795776367, "global_step": 615008, "epoch": 7409} {"train_loss": -28.25642204284668, "global_step": 615009, "epoch": 7409} {"train_loss": -28.3371524810791, "global_step": 615010, "epoch": 7409} {"train_loss": -28.40606117248535, "global_step": 615011, "epoch": 7409} {"train_loss": -28.1584415435791, "global_step": 615012, "epoch": 7409} {"train_loss": -28.04792594909668, "global_step": 615013, "epoch": 7409} {"train_loss": -27.6314640045166, "global_step": 615014, "epoch": 7409} {"train_loss": -26.73430824279785, "global_step": 615015, "epoch": 7409} {"train_loss": -26.789297103881836, "global_step": 615016, "epoch": 7409} {"train_loss": -27.751867294311523, "global_step": 615017, "epoch": 7409} {"train_loss": -28.02667236328125, "global_step": 615018, "epoch": 7409} {"train_loss": -28.147541046142578, "global_step": 615019, "epoch": 7409} {"train_loss": -27.416955947875977, "global_step": 615020, "epoch": 7409} {"train_loss": -27.983657836914062, "global_step": 615021, "epoch": 7409} {"train_loss": -27.9384822845459, "global_step": 615022, "epoch": 7409} {"train_loss": -28.197900772094727, "global_step": 615023, "epoch": 7409} {"train_loss": -28.049102783203125, "global_step": 615024, "epoch": 7409} {"train_loss": -28.23841667175293, "global_step": 615025, "epoch": 7409} {"train_loss": -28.181554794311523, "global_step": 615026, "epoch": 7409} {"train_loss": -27.937973022460938, "global_step": 615027, "epoch": 7409} {"train_loss": -28.216068267822266, "global_step": 615028, "epoch": 7409} {"train_loss": -28.011863317834326, "global_step": 615029, "epoch": 7409, "val_loss": 6605488.0} {"train_loss": -27.957489013671875, "global_step": 615030, "epoch": 7410} {"train_loss": -28.08572769165039, "global_step": 615031, "epoch": 7410} {"train_loss": -28.093015670776367, "global_step": 615032, "epoch": 7410} {"train_loss": -27.556934356689453, "global_step": 615033, "epoch": 7410} {"train_loss": -27.899641036987305, "global_step": 615034, "epoch": 7410} {"train_loss": -27.795923233032227, "global_step": 615035, "epoch": 7410} {"train_loss": -28.0660343170166, "global_step": 615036, "epoch": 7410} {"train_loss": -27.882953643798828, "global_step": 615037, "epoch": 7410} {"train_loss": -28.32338523864746, "global_step": 615038, "epoch": 7410} {"train_loss": -28.23097801208496, "global_step": 615039, "epoch": 7410} {"train_loss": -27.815656661987305, "global_step": 615040, "epoch": 7410} {"train_loss": -27.75798988342285, "global_step": 615041, "epoch": 7410} {"train_loss": -27.90620231628418, "global_step": 615042, "epoch": 7410} {"train_loss": -28.103652954101562, "global_step": 615043, "epoch": 7410} {"train_loss": -28.28500747680664, "global_step": 615044, "epoch": 7410} {"train_loss": -28.320478439331055, "global_step": 615045, "epoch": 7410} {"train_loss": -27.643741607666016, "global_step": 615046, "epoch": 7410} {"train_loss": -28.003767013549805, "global_step": 615047, "epoch": 7410} {"train_loss": -27.895666122436523, "global_step": 615048, "epoch": 7410} {"train_loss": -28.15851402282715, "global_step": 615049, "epoch": 7410} {"train_loss": -28.579694747924805, "global_step": 615050, "epoch": 7410} {"train_loss": -27.84271812438965, "global_step": 615051, "epoch": 7410} {"train_loss": -28.046899795532227, "global_step": 615052, "epoch": 7410} {"train_loss": -28.116138458251953, "global_step": 615053, "epoch": 7410} {"train_loss": -28.11115074157715, "global_step": 615054, "epoch": 7410} {"train_loss": -28.562164306640625, "global_step": 615055, "epoch": 7410} {"train_loss": -28.416120529174805, "global_step": 615056, "epoch": 7410} {"train_loss": -27.8195858001709, "global_step": 615057, "epoch": 7410} {"train_loss": -27.77730369567871, "global_step": 615058, "epoch": 7410} {"train_loss": -27.498132705688477, "global_step": 615059, "epoch": 7410} {"train_loss": -27.104928970336914, "global_step": 615060, "epoch": 7410} {"train_loss": -27.293973922729492, "global_step": 615061, "epoch": 7410} {"train_loss": -27.957433700561523, "global_step": 615062, "epoch": 7410} {"train_loss": -28.177570343017578, "global_step": 615063, "epoch": 7410} {"train_loss": -27.558942794799805, "global_step": 615064, "epoch": 7410} {"train_loss": -27.458911895751953, "global_step": 615065, "epoch": 7410} {"train_loss": -28.024717330932617, "global_step": 615066, "epoch": 7410} {"train_loss": -27.970478057861328, "global_step": 615067, "epoch": 7410} {"train_loss": -28.12237548828125, "global_step": 615068, "epoch": 7410} {"train_loss": -27.88580894470215, "global_step": 615069, "epoch": 7410} {"train_loss": -28.18878173828125, "global_step": 615070, "epoch": 7410} {"train_loss": -27.890405654907227, "global_step": 615071, "epoch": 7410} {"train_loss": -28.152753829956055, "global_step": 615072, "epoch": 7410} {"train_loss": -27.85285758972168, "global_step": 615073, "epoch": 7410} {"train_loss": -28.336801528930664, "global_step": 615074, "epoch": 7410} {"train_loss": -28.19818115234375, "global_step": 615075, "epoch": 7410} {"train_loss": -27.899702072143555, "global_step": 615076, "epoch": 7410} {"train_loss": -28.2442684173584, "global_step": 615077, "epoch": 7410} {"train_loss": -28.211383819580078, "global_step": 615078, "epoch": 7410} {"train_loss": -28.0440731048584, "global_step": 615079, "epoch": 7410} {"train_loss": -28.246078491210938, "global_step": 615080, "epoch": 7410} {"train_loss": -28.05657386779785, "global_step": 615081, "epoch": 7410} {"train_loss": -28.735702514648438, "global_step": 615082, "epoch": 7410} {"train_loss": -28.055952072143555, "global_step": 615083, "epoch": 7410} {"train_loss": -28.2320499420166, "global_step": 615084, "epoch": 7410} {"train_loss": -28.085966110229492, "global_step": 615085, "epoch": 7410} {"train_loss": -28.462156295776367, "global_step": 615086, "epoch": 7410} {"train_loss": -28.40033531188965, "global_step": 615087, "epoch": 7410} {"train_loss": -27.752241134643555, "global_step": 615088, "epoch": 7410} {"train_loss": -27.9609432220459, "global_step": 615089, "epoch": 7410} {"train_loss": -28.351394653320312, "global_step": 615090, "epoch": 7410} {"train_loss": -28.38869285583496, "global_step": 615091, "epoch": 7410} {"train_loss": -27.90447425842285, "global_step": 615092, "epoch": 7410} {"train_loss": -28.073333740234375, "global_step": 615093, "epoch": 7410} {"train_loss": -28.459339141845703, "global_step": 615094, "epoch": 7410} {"train_loss": -28.209516525268555, "global_step": 615095, "epoch": 7410} {"train_loss": -27.93977165222168, "global_step": 615096, "epoch": 7410} {"train_loss": -28.070409774780273, "global_step": 615097, "epoch": 7410} {"train_loss": -27.772785186767578, "global_step": 615098, "epoch": 7410} {"train_loss": -28.209095001220703, "global_step": 615099, "epoch": 7410} {"train_loss": -28.405181884765625, "global_step": 615100, "epoch": 7410} {"train_loss": -28.287580490112305, "global_step": 615101, "epoch": 7410} {"train_loss": -28.325414657592773, "global_step": 615102, "epoch": 7410} {"train_loss": -27.945941925048828, "global_step": 615103, "epoch": 7410} {"train_loss": -28.334247589111328, "global_step": 615104, "epoch": 7410} {"train_loss": -28.320287704467773, "global_step": 615105, "epoch": 7410} {"train_loss": -28.13984489440918, "global_step": 615106, "epoch": 7410} {"train_loss": -27.875762939453125, "global_step": 615107, "epoch": 7410} {"train_loss": -28.302221298217773, "global_step": 615108, "epoch": 7410} {"train_loss": -28.18231773376465, "global_step": 615109, "epoch": 7410} {"train_loss": -28.033349990844727, "global_step": 615110, "epoch": 7410} {"train_loss": -28.26582908630371, "global_step": 615111, "epoch": 7410} {"train_loss": -28.054108952901448, "global_step": 615112, "epoch": 7410, "val_loss": 6636027.0} {"train_loss": -27.952444076538086, "global_step": 615113, "epoch": 7411} {"train_loss": -27.90669059753418, "global_step": 615114, "epoch": 7411} {"train_loss": -27.76520347595215, "global_step": 615115, "epoch": 7411} {"train_loss": -27.535110473632812, "global_step": 615116, "epoch": 7411} {"train_loss": -27.855527877807617, "global_step": 615117, "epoch": 7411} {"train_loss": -27.827056884765625, "global_step": 615118, "epoch": 7411} {"train_loss": -27.788660049438477, "global_step": 615119, "epoch": 7411} {"train_loss": -28.006500244140625, "global_step": 615120, "epoch": 7411} {"train_loss": -27.7533016204834, "global_step": 615121, "epoch": 7411} {"train_loss": -27.806570053100586, "global_step": 615122, "epoch": 7411} {"train_loss": -27.749542236328125, "global_step": 615123, "epoch": 7411} {"train_loss": -27.933191299438477, "global_step": 615124, "epoch": 7411} {"train_loss": -28.321475982666016, "global_step": 615125, "epoch": 7411} {"train_loss": -27.623859405517578, "global_step": 615126, "epoch": 7411} {"train_loss": -28.326120376586914, "global_step": 615127, "epoch": 7411} {"train_loss": -27.74896812438965, "global_step": 615128, "epoch": 7411} {"train_loss": -27.939191818237305, "global_step": 615129, "epoch": 7411} {"train_loss": -27.828632354736328, "global_step": 615130, "epoch": 7411} {"train_loss": -27.879404067993164, "global_step": 615131, "epoch": 7411} {"train_loss": -28.389760971069336, "global_step": 615132, "epoch": 7411} {"train_loss": -27.919904708862305, "global_step": 615133, "epoch": 7411} {"train_loss": -27.897857666015625, "global_step": 615134, "epoch": 7411} {"train_loss": -27.503173828125, "global_step": 615135, "epoch": 7411} {"train_loss": -28.500030517578125, "global_step": 615136, "epoch": 7411} {"train_loss": -27.77950096130371, "global_step": 615137, "epoch": 7411} {"train_loss": -27.69207191467285, "global_step": 615138, "epoch": 7411} {"train_loss": -28.054128646850586, "global_step": 615139, "epoch": 7411} {"train_loss": -28.1214542388916, "global_step": 615140, "epoch": 7411} {"train_loss": -28.136098861694336, "global_step": 615141, "epoch": 7411} {"train_loss": -28.165271759033203, "global_step": 615142, "epoch": 7411} {"train_loss": -27.809906005859375, "global_step": 615143, "epoch": 7411} {"train_loss": -27.888147354125977, "global_step": 615144, "epoch": 7411} {"train_loss": -27.924421310424805, "global_step": 615145, "epoch": 7411} {"train_loss": -27.921247482299805, "global_step": 615146, "epoch": 7411} {"train_loss": -28.017841339111328, "global_step": 615147, "epoch": 7411} {"train_loss": -27.656030654907227, "global_step": 615148, "epoch": 7411} {"train_loss": -28.077505111694336, "global_step": 615149, "epoch": 7411} {"train_loss": -27.948394775390625, "global_step": 615150, "epoch": 7411} {"train_loss": -27.883459091186523, "global_step": 615151, "epoch": 7411} {"train_loss": -27.640899658203125, "global_step": 615152, "epoch": 7411} {"train_loss": -27.6787052154541, "global_step": 615153, "epoch": 7411} {"train_loss": -27.93292808532715, "global_step": 615154, "epoch": 7411} {"train_loss": -28.1671142578125, "global_step": 615155, "epoch": 7411} {"train_loss": -28.1221981048584, "global_step": 615156, "epoch": 7411} {"train_loss": -28.017004013061523, "global_step": 615157, "epoch": 7411} {"train_loss": -27.993545532226562, "global_step": 615158, "epoch": 7411} {"train_loss": -27.856433868408203, "global_step": 615159, "epoch": 7411} {"train_loss": -27.951276779174805, "global_step": 615160, "epoch": 7411} {"train_loss": -28.270959854125977, "global_step": 615161, "epoch": 7411} {"train_loss": -27.93902587890625, "global_step": 615162, "epoch": 7411} {"train_loss": -27.953643798828125, "global_step": 615163, "epoch": 7411} {"train_loss": -28.585065841674805, "global_step": 615164, "epoch": 7411} {"train_loss": -28.23697280883789, "global_step": 615165, "epoch": 7411} {"train_loss": -28.325366973876953, "global_step": 615166, "epoch": 7411} {"train_loss": -28.023828506469727, "global_step": 615167, "epoch": 7411} {"train_loss": -27.921361923217773, "global_step": 615168, "epoch": 7411} {"train_loss": -28.1709041595459, "global_step": 615169, "epoch": 7411} {"train_loss": -28.262073516845703, "global_step": 615170, "epoch": 7411} {"train_loss": -28.128644943237305, "global_step": 615171, "epoch": 7411} {"train_loss": -28.239917755126953, "global_step": 615172, "epoch": 7411} {"train_loss": -28.195592880249023, "global_step": 615173, "epoch": 7411} {"train_loss": -28.222736358642578, "global_step": 615174, "epoch": 7411} {"train_loss": -28.3369140625, "global_step": 615175, "epoch": 7411} {"train_loss": -28.07196617126465, "global_step": 615176, "epoch": 7411} {"train_loss": -28.06459617614746, "global_step": 615177, "epoch": 7411} {"train_loss": -28.088043212890625, "global_step": 615178, "epoch": 7411} {"train_loss": -28.061487197875977, "global_step": 615179, "epoch": 7411} {"train_loss": -28.002243041992188, "global_step": 615180, "epoch": 7411} {"train_loss": -28.31353759765625, "global_step": 615181, "epoch": 7411} {"train_loss": -27.94449806213379, "global_step": 615182, "epoch": 7411} {"train_loss": -28.20718765258789, "global_step": 615183, "epoch": 7411} {"train_loss": -28.23007583618164, "global_step": 615184, "epoch": 7411} {"train_loss": -27.96729850769043, "global_step": 615185, "epoch": 7411} {"train_loss": -28.14426612854004, "global_step": 615186, "epoch": 7411} {"train_loss": -27.758255004882812, "global_step": 615187, "epoch": 7411} {"train_loss": -27.441457748413086, "global_step": 615188, "epoch": 7411} {"train_loss": -26.971466064453125, "global_step": 615189, "epoch": 7411} {"train_loss": -27.590036392211914, "global_step": 615190, "epoch": 7411} {"train_loss": -28.124744415283203, "global_step": 615191, "epoch": 7411} {"train_loss": -27.8013858795166, "global_step": 615192, "epoch": 7411} {"train_loss": -27.7497615814209, "global_step": 615193, "epoch": 7411} {"train_loss": -28.01458168029785, "global_step": 615194, "epoch": 7411} {"train_loss": -27.978026217724903, "global_step": 615195, "epoch": 7411, "val_loss": 6608058.0} {"train_loss": -27.82761573791504, "global_step": 615196, "epoch": 7412} {"train_loss": -27.450544357299805, "global_step": 615197, "epoch": 7412} {"train_loss": -27.116565704345703, "global_step": 615198, "epoch": 7412} {"train_loss": -27.410104751586914, "global_step": 615199, "epoch": 7412} {"train_loss": -27.496337890625, "global_step": 615200, "epoch": 7412} {"train_loss": -27.339391708374023, "global_step": 615201, "epoch": 7412} {"train_loss": -27.269607543945312, "global_step": 615202, "epoch": 7412} {"train_loss": -27.79290771484375, "global_step": 615203, "epoch": 7412} {"train_loss": -27.801916122436523, "global_step": 615204, "epoch": 7412} {"train_loss": -27.98990249633789, "global_step": 615205, "epoch": 7412} {"train_loss": -27.688024520874023, "global_step": 615206, "epoch": 7412} {"train_loss": -27.494619369506836, "global_step": 615207, "epoch": 7412} {"train_loss": -27.49965476989746, "global_step": 615208, "epoch": 7412} {"train_loss": -27.668212890625, "global_step": 615209, "epoch": 7412} {"train_loss": -27.762380599975586, "global_step": 615210, "epoch": 7412} {"train_loss": -27.37241554260254, "global_step": 615211, "epoch": 7412} {"train_loss": -27.8150691986084, "global_step": 615212, "epoch": 7412} {"train_loss": -28.189838409423828, "global_step": 615213, "epoch": 7412} {"train_loss": -28.068689346313477, "global_step": 615214, "epoch": 7412} {"train_loss": -27.68717384338379, "global_step": 615215, "epoch": 7412} {"train_loss": -28.147607803344727, "global_step": 615216, "epoch": 7412} {"train_loss": -28.02007484436035, "global_step": 615217, "epoch": 7412} {"train_loss": -27.893707275390625, "global_step": 615218, "epoch": 7412} {"train_loss": -28.008411407470703, "global_step": 615219, "epoch": 7412} {"train_loss": -27.880573272705078, "global_step": 615220, "epoch": 7412} {"train_loss": -28.16950798034668, "global_step": 615221, "epoch": 7412} {"train_loss": -27.758941650390625, "global_step": 615222, "epoch": 7412} {"train_loss": -28.083555221557617, "global_step": 615223, "epoch": 7412} {"train_loss": -28.536603927612305, "global_step": 615224, "epoch": 7412} {"train_loss": -27.729618072509766, "global_step": 615225, "epoch": 7412} {"train_loss": -27.958023071289062, "global_step": 615226, "epoch": 7412} {"train_loss": -28.13722038269043, "global_step": 615227, "epoch": 7412} {"train_loss": -28.336999893188477, "global_step": 615228, "epoch": 7412} {"train_loss": -27.974140167236328, "global_step": 615229, "epoch": 7412} {"train_loss": -28.340482711791992, "global_step": 615230, "epoch": 7412} {"train_loss": -28.426727294921875, "global_step": 615231, "epoch": 7412} {"train_loss": -28.136859893798828, "global_step": 615232, "epoch": 7412} {"train_loss": -27.784042358398438, "global_step": 615233, "epoch": 7412} {"train_loss": -28.115766525268555, "global_step": 615234, "epoch": 7412} {"train_loss": -28.241077423095703, "global_step": 615235, "epoch": 7412} {"train_loss": -27.755401611328125, "global_step": 615236, "epoch": 7412} {"train_loss": -28.36652183532715, "global_step": 615237, "epoch": 7412} {"train_loss": -28.2116641998291, "global_step": 615238, "epoch": 7412} {"train_loss": -28.505857467651367, "global_step": 615239, "epoch": 7412} {"train_loss": -28.299726486206055, "global_step": 615240, "epoch": 7412} {"train_loss": -28.144346237182617, "global_step": 615241, "epoch": 7412} {"train_loss": -28.38034439086914, "global_step": 615242, "epoch": 7412} {"train_loss": -28.127948760986328, "global_step": 615243, "epoch": 7412} {"train_loss": -28.394973754882812, "global_step": 615244, "epoch": 7412} {"train_loss": -28.15284538269043, "global_step": 615245, "epoch": 7412} {"train_loss": -28.424930572509766, "global_step": 615246, "epoch": 7412} {"train_loss": -28.372175216674805, "global_step": 615247, "epoch": 7412} {"train_loss": -28.255502700805664, "global_step": 615248, "epoch": 7412} {"train_loss": -28.117719650268555, "global_step": 615249, "epoch": 7412} {"train_loss": -28.174942016601562, "global_step": 615250, "epoch": 7412} {"train_loss": -27.940710067749023, "global_step": 615251, "epoch": 7412} {"train_loss": -28.356536865234375, "global_step": 615252, "epoch": 7412} {"train_loss": -27.933597564697266, "global_step": 615253, "epoch": 7412} {"train_loss": -27.93153190612793, "global_step": 615254, "epoch": 7412} {"train_loss": -28.098413467407227, "global_step": 615255, "epoch": 7412} {"train_loss": -28.09324073791504, "global_step": 615256, "epoch": 7412} {"train_loss": -28.271265029907227, "global_step": 615257, "epoch": 7412} {"train_loss": -28.056201934814453, "global_step": 615258, "epoch": 7412} {"train_loss": -28.3109188079834, "global_step": 615259, "epoch": 7412} {"train_loss": -28.27699089050293, "global_step": 615260, "epoch": 7412} {"train_loss": -28.02880859375, "global_step": 615261, "epoch": 7412} {"train_loss": -28.095468521118164, "global_step": 615262, "epoch": 7412} {"train_loss": -27.94953727722168, "global_step": 615263, "epoch": 7412} {"train_loss": -27.788007736206055, "global_step": 615264, "epoch": 7412} {"train_loss": -28.757904052734375, "global_step": 615265, "epoch": 7412} {"train_loss": -28.461576461791992, "global_step": 615266, "epoch": 7412} {"train_loss": -27.95985221862793, "global_step": 615267, "epoch": 7412} {"train_loss": -28.084386825561523, "global_step": 615268, "epoch": 7412} {"train_loss": -27.606958389282227, "global_step": 615269, "epoch": 7412} {"train_loss": -28.2728214263916, "global_step": 615270, "epoch": 7412} {"train_loss": -27.766332626342773, "global_step": 615271, "epoch": 7412} {"train_loss": -28.001373291015625, "global_step": 615272, "epoch": 7412} {"train_loss": -27.858081817626953, "global_step": 615273, "epoch": 7412} {"train_loss": -28.123443603515625, "global_step": 615274, "epoch": 7412} {"train_loss": -27.845417022705078, "global_step": 615275, "epoch": 7412} {"train_loss": -27.6336612701416, "global_step": 615276, "epoch": 7412} {"train_loss": -27.810623168945312, "global_step": 615277, "epoch": 7412} {"train_loss": -27.98255833085761, "global_step": 615278, "epoch": 7412, "val_loss": 6667010.0} {"train_loss": -26.636754989624023, "global_step": 615279, "epoch": 7413} {"train_loss": -26.9100341796875, "global_step": 615280, "epoch": 7413} {"train_loss": -26.83131217956543, "global_step": 615281, "epoch": 7413} {"train_loss": -27.10015869140625, "global_step": 615282, "epoch": 7413} {"train_loss": -27.13490867614746, "global_step": 615283, "epoch": 7413} {"train_loss": -26.310379028320312, "global_step": 615284, "epoch": 7413} {"train_loss": -27.59255027770996, "global_step": 615285, "epoch": 7413} {"train_loss": -27.024072647094727, "global_step": 615286, "epoch": 7413} {"train_loss": -27.417078018188477, "global_step": 615287, "epoch": 7413} {"train_loss": -27.48296546936035, "global_step": 615288, "epoch": 7413} {"train_loss": -27.336200714111328, "global_step": 615289, "epoch": 7413} {"train_loss": -27.0267391204834, "global_step": 615290, "epoch": 7413} {"train_loss": -27.273941040039062, "global_step": 615291, "epoch": 7413} {"train_loss": -27.532384872436523, "global_step": 615292, "epoch": 7413} {"train_loss": -27.386661529541016, "global_step": 615293, "epoch": 7413} {"train_loss": -27.35284996032715, "global_step": 615294, "epoch": 7413} {"train_loss": -28.056909561157227, "global_step": 615295, "epoch": 7413} {"train_loss": -27.6881160736084, "global_step": 615296, "epoch": 7413} {"train_loss": -27.85685157775879, "global_step": 615297, "epoch": 7413} {"train_loss": -27.851171493530273, "global_step": 615298, "epoch": 7413} {"train_loss": -27.880773544311523, "global_step": 615299, "epoch": 7413} {"train_loss": -27.569684982299805, "global_step": 615300, "epoch": 7413} {"train_loss": -27.770654678344727, "global_step": 615301, "epoch": 7413} {"train_loss": -27.747699737548828, "global_step": 615302, "epoch": 7413} {"train_loss": -28.201416015625, "global_step": 615303, "epoch": 7413} {"train_loss": -27.88962173461914, "global_step": 615304, "epoch": 7413} {"train_loss": -27.687000274658203, "global_step": 615305, "epoch": 7413} {"train_loss": -27.832061767578125, "global_step": 615306, "epoch": 7413} {"train_loss": -27.930572509765625, "global_step": 615307, "epoch": 7413} {"train_loss": -28.051733016967773, "global_step": 615308, "epoch": 7413} {"train_loss": -27.801334381103516, "global_step": 615309, "epoch": 7413} {"train_loss": -28.04115867614746, "global_step": 615310, "epoch": 7413} {"train_loss": -28.247419357299805, "global_step": 615311, "epoch": 7413} {"train_loss": -28.035491943359375, "global_step": 615312, "epoch": 7413} {"train_loss": -28.293411254882812, "global_step": 615313, "epoch": 7413} {"train_loss": -27.806249618530273, "global_step": 615314, "epoch": 7413} {"train_loss": -28.563861846923828, "global_step": 615315, "epoch": 7413} {"train_loss": -28.340045928955078, "global_step": 615316, "epoch": 7413} {"train_loss": -27.89682960510254, "global_step": 615317, "epoch": 7413} {"train_loss": -28.118595123291016, "global_step": 615318, "epoch": 7413} {"train_loss": -28.033294677734375, "global_step": 615319, "epoch": 7413} {"train_loss": -28.347412109375, "global_step": 615320, "epoch": 7413} {"train_loss": -28.0301456451416, "global_step": 615321, "epoch": 7413} {"train_loss": -28.35748291015625, "global_step": 615322, "epoch": 7413} {"train_loss": -28.10169792175293, "global_step": 615323, "epoch": 7413} {"train_loss": -28.54720115661621, "global_step": 615324, "epoch": 7413} {"train_loss": -28.14771842956543, "global_step": 615325, "epoch": 7413} {"train_loss": -28.2042179107666, "global_step": 615326, "epoch": 7413} {"train_loss": -28.002111434936523, "global_step": 615327, "epoch": 7413} {"train_loss": -27.929981231689453, "global_step": 615328, "epoch": 7413} {"train_loss": -27.99354362487793, "global_step": 615329, "epoch": 7413} {"train_loss": -28.316686630249023, "global_step": 615330, "epoch": 7413} {"train_loss": -28.53828239440918, "global_step": 615331, "epoch": 7413} {"train_loss": -28.210163116455078, "global_step": 615332, "epoch": 7413} {"train_loss": -28.328842163085938, "global_step": 615333, "epoch": 7413} {"train_loss": -28.13728141784668, "global_step": 615334, "epoch": 7413} {"train_loss": -28.15888786315918, "global_step": 615335, "epoch": 7413} {"train_loss": -28.81830406188965, "global_step": 615336, "epoch": 7413} {"train_loss": -28.372222900390625, "global_step": 615337, "epoch": 7413} {"train_loss": -28.4765625, "global_step": 615338, "epoch": 7413} {"train_loss": -28.367475509643555, "global_step": 615339, "epoch": 7413} {"train_loss": -28.2940673828125, "global_step": 615340, "epoch": 7413} {"train_loss": -28.22907066345215, "global_step": 615341, "epoch": 7413} {"train_loss": -28.487768173217773, "global_step": 615342, "epoch": 7413} {"train_loss": -27.7733211517334, "global_step": 615343, "epoch": 7413} {"train_loss": -28.185916900634766, "global_step": 615344, "epoch": 7413} {"train_loss": -27.410064697265625, "global_step": 615345, "epoch": 7413} {"train_loss": -28.106603622436523, "global_step": 615346, "epoch": 7413} {"train_loss": -27.88361930847168, "global_step": 615347, "epoch": 7413} {"train_loss": -27.748920440673828, "global_step": 615348, "epoch": 7413} {"train_loss": -28.031415939331055, "global_step": 615349, "epoch": 7413} {"train_loss": -28.271198272705078, "global_step": 615350, "epoch": 7413} {"train_loss": -28.118854522705078, "global_step": 615351, "epoch": 7413} {"train_loss": -28.160980224609375, "global_step": 615352, "epoch": 7413} {"train_loss": -28.09027671813965, "global_step": 615353, "epoch": 7413} {"train_loss": -28.078094482421875, "global_step": 615354, "epoch": 7413} {"train_loss": -28.568037033081055, "global_step": 615355, "epoch": 7413} {"train_loss": -27.929508209228516, "global_step": 615356, "epoch": 7413} {"train_loss": -28.385395050048828, "global_step": 615357, "epoch": 7413} {"train_loss": -28.03533363342285, "global_step": 615358, "epoch": 7413} {"train_loss": -28.546707153320312, "global_step": 615359, "epoch": 7413} {"train_loss": -28.041370391845703, "global_step": 615360, "epoch": 7413} {"train_loss": -27.922102939651673, "global_step": 615361, "epoch": 7413, "val_loss": 6720041.0} {"train_loss": -28.063379287719727, "global_step": 615362, "epoch": 7414} {"train_loss": -27.7240047454834, "global_step": 615363, "epoch": 7414} {"train_loss": -28.07118034362793, "global_step": 615364, "epoch": 7414} {"train_loss": -28.10491943359375, "global_step": 615365, "epoch": 7414} {"train_loss": -27.557973861694336, "global_step": 615366, "epoch": 7414} {"train_loss": -27.531991958618164, "global_step": 615367, "epoch": 7414} {"train_loss": -27.842737197875977, "global_step": 615368, "epoch": 7414} {"train_loss": -27.934064865112305, "global_step": 615369, "epoch": 7414} {"train_loss": -28.285633087158203, "global_step": 615370, "epoch": 7414} {"train_loss": -28.162317276000977, "global_step": 615371, "epoch": 7414} {"train_loss": -27.95502281188965, "global_step": 615372, "epoch": 7414} {"train_loss": -28.10748863220215, "global_step": 615373, "epoch": 7414} {"train_loss": -28.100675582885742, "global_step": 615374, "epoch": 7414} {"train_loss": -28.1677188873291, "global_step": 615375, "epoch": 7414} {"train_loss": -27.991003036499023, "global_step": 615376, "epoch": 7414} {"train_loss": -28.200132369995117, "global_step": 615377, "epoch": 7414} {"train_loss": -28.01966667175293, "global_step": 615378, "epoch": 7414} {"train_loss": -28.072528839111328, "global_step": 615379, "epoch": 7414} {"train_loss": -27.955982208251953, "global_step": 615380, "epoch": 7414} {"train_loss": -27.89899253845215, "global_step": 615381, "epoch": 7414} {"train_loss": -27.950382232666016, "global_step": 615382, "epoch": 7414} {"train_loss": -27.99567985534668, "global_step": 615383, "epoch": 7414} {"train_loss": -28.1440372467041, "global_step": 615384, "epoch": 7414} {"train_loss": -28.36458396911621, "global_step": 615385, "epoch": 7414} {"train_loss": -28.169544219970703, "global_step": 615386, "epoch": 7414} {"train_loss": -28.269763946533203, "global_step": 615387, "epoch": 7414} {"train_loss": -28.15997886657715, "global_step": 615388, "epoch": 7414} {"train_loss": -28.525196075439453, "global_step": 615389, "epoch": 7414} {"train_loss": -28.319067001342773, "global_step": 615390, "epoch": 7414} {"train_loss": -28.4029541015625, "global_step": 615391, "epoch": 7414} {"train_loss": -28.400915145874023, "global_step": 615392, "epoch": 7414} {"train_loss": -28.244855880737305, "global_step": 615393, "epoch": 7414} {"train_loss": -28.425642013549805, "global_step": 615394, "epoch": 7414} {"train_loss": -28.3707332611084, "global_step": 615395, "epoch": 7414} {"train_loss": -28.489877700805664, "global_step": 615396, "epoch": 7414} {"train_loss": -28.23236656188965, "global_step": 615397, "epoch": 7414} {"train_loss": -28.478429794311523, "global_step": 615398, "epoch": 7414} {"train_loss": -28.292200088500977, "global_step": 615399, "epoch": 7414} {"train_loss": -28.402074813842773, "global_step": 615400, "epoch": 7414} {"train_loss": -28.364347457885742, "global_step": 615401, "epoch": 7414} {"train_loss": -28.47271728515625, "global_step": 615402, "epoch": 7414} {"train_loss": -27.98969841003418, "global_step": 615403, "epoch": 7414} {"train_loss": -28.021818161010742, "global_step": 615404, "epoch": 7414} {"train_loss": -28.183094024658203, "global_step": 615405, "epoch": 7414} {"train_loss": -27.579425811767578, "global_step": 615406, "epoch": 7414} {"train_loss": -27.058109283447266, "global_step": 615407, "epoch": 7414} {"train_loss": -27.047712326049805, "global_step": 615408, "epoch": 7414} {"train_loss": -27.284643173217773, "global_step": 615409, "epoch": 7414} {"train_loss": -27.960693359375, "global_step": 615410, "epoch": 7414} {"train_loss": -27.58817481994629, "global_step": 615411, "epoch": 7414} {"train_loss": -27.856176376342773, "global_step": 615412, "epoch": 7414} {"train_loss": -28.33490562438965, "global_step": 615413, "epoch": 7414} {"train_loss": -27.998029708862305, "global_step": 615414, "epoch": 7414} {"train_loss": -28.0711727142334, "global_step": 615415, "epoch": 7414} {"train_loss": -28.02912712097168, "global_step": 615416, "epoch": 7414} {"train_loss": -28.044208526611328, "global_step": 615417, "epoch": 7414} {"train_loss": -27.647119522094727, "global_step": 615418, "epoch": 7414} {"train_loss": -27.863107681274414, "global_step": 615419, "epoch": 7414} {"train_loss": -28.149219512939453, "global_step": 615420, "epoch": 7414} {"train_loss": -28.229278564453125, "global_step": 615421, "epoch": 7414} {"train_loss": -27.887571334838867, "global_step": 615422, "epoch": 7414} {"train_loss": -28.072174072265625, "global_step": 615423, "epoch": 7414} {"train_loss": -27.93650245666504, "global_step": 615424, "epoch": 7414} {"train_loss": -28.327823638916016, "global_step": 615425, "epoch": 7414} {"train_loss": -27.898792266845703, "global_step": 615426, "epoch": 7414} {"train_loss": -27.945974349975586, "global_step": 615427, "epoch": 7414} {"train_loss": -27.892419815063477, "global_step": 615428, "epoch": 7414} {"train_loss": -28.166913986206055, "global_step": 615429, "epoch": 7414} {"train_loss": -28.220478057861328, "global_step": 615430, "epoch": 7414} {"train_loss": -28.279600143432617, "global_step": 615431, "epoch": 7414} {"train_loss": -27.712207794189453, "global_step": 615432, "epoch": 7414} {"train_loss": -28.401813507080078, "global_step": 615433, "epoch": 7414} {"train_loss": -27.845197677612305, "global_step": 615434, "epoch": 7414} {"train_loss": -28.05207633972168, "global_step": 615435, "epoch": 7414} {"train_loss": -28.003942489624023, "global_step": 615436, "epoch": 7414} {"train_loss": -27.852264404296875, "global_step": 615437, "epoch": 7414} {"train_loss": -28.383264541625977, "global_step": 615438, "epoch": 7414} {"train_loss": -28.16924476623535, "global_step": 615439, "epoch": 7414} {"train_loss": -28.525348663330078, "global_step": 615440, "epoch": 7414} {"train_loss": -27.931806564331055, "global_step": 615441, "epoch": 7414} {"train_loss": -28.510595321655273, "global_step": 615442, "epoch": 7414} {"train_loss": -27.899658203125, "global_step": 615443, "epoch": 7414} {"train_loss": -28.060940914843457, "global_step": 615444, "epoch": 7414, "val_loss": 6729352.5} {"train_loss": -27.50702476501465, "global_step": 615445, "epoch": 7415} {"train_loss": -27.68121910095215, "global_step": 615446, "epoch": 7415} {"train_loss": -28.000141143798828, "global_step": 615447, "epoch": 7415} {"train_loss": -27.33026695251465, "global_step": 615448, "epoch": 7415} {"train_loss": -27.4733943939209, "global_step": 615449, "epoch": 7415} {"train_loss": -27.609933853149414, "global_step": 615450, "epoch": 7415} {"train_loss": -27.858123779296875, "global_step": 615451, "epoch": 7415} {"train_loss": -27.39356803894043, "global_step": 615452, "epoch": 7415} {"train_loss": -27.659894943237305, "global_step": 615453, "epoch": 7415} {"train_loss": -27.978424072265625, "global_step": 615454, "epoch": 7415} {"train_loss": -27.605743408203125, "global_step": 615455, "epoch": 7415} {"train_loss": -27.540790557861328, "global_step": 615456, "epoch": 7415} {"train_loss": -27.723712921142578, "global_step": 615457, "epoch": 7415} {"train_loss": -28.098957061767578, "global_step": 615458, "epoch": 7415} {"train_loss": -28.1946964263916, "global_step": 615459, "epoch": 7415} {"train_loss": -28.1466007232666, "global_step": 615460, "epoch": 7415} {"train_loss": -28.110525131225586, "global_step": 615461, "epoch": 7415} {"train_loss": -28.19771385192871, "global_step": 615462, "epoch": 7415} {"train_loss": -27.6577205657959, "global_step": 615463, "epoch": 7415} {"train_loss": -28.137847900390625, "global_step": 615464, "epoch": 7415} {"train_loss": -28.106185913085938, "global_step": 615465, "epoch": 7415} {"train_loss": -28.0750675201416, "global_step": 615466, "epoch": 7415} {"train_loss": -28.4011287689209, "global_step": 615467, "epoch": 7415} {"train_loss": -27.950056076049805, "global_step": 615468, "epoch": 7415} {"train_loss": -27.9443302154541, "global_step": 615469, "epoch": 7415} {"train_loss": -28.0374813079834, "global_step": 615470, "epoch": 7415} {"train_loss": -27.70171546936035, "global_step": 615471, "epoch": 7415} {"train_loss": -27.36948585510254, "global_step": 615472, "epoch": 7415} {"train_loss": -27.156600952148438, "global_step": 615473, "epoch": 7415} {"train_loss": -28.034198760986328, "global_step": 615474, "epoch": 7415} {"train_loss": -28.31890296936035, "global_step": 615475, "epoch": 7415} {"train_loss": -27.923267364501953, "global_step": 615476, "epoch": 7415} {"train_loss": -27.761066436767578, "global_step": 615477, "epoch": 7415} {"train_loss": -28.1740779876709, "global_step": 615478, "epoch": 7415} {"train_loss": -27.6712703704834, "global_step": 615479, "epoch": 7415} {"train_loss": -28.19544792175293, "global_step": 615480, "epoch": 7415} {"train_loss": -27.873044967651367, "global_step": 615481, "epoch": 7415} {"train_loss": -27.971094131469727, "global_step": 615482, "epoch": 7415} {"train_loss": -28.11859703063965, "global_step": 615483, "epoch": 7415} {"train_loss": -28.27337074279785, "global_step": 615484, "epoch": 7415} {"train_loss": -28.207990646362305, "global_step": 615485, "epoch": 7415} {"train_loss": -28.259740829467773, "global_step": 615486, "epoch": 7415} {"train_loss": -28.397613525390625, "global_step": 615487, "epoch": 7415} {"train_loss": -28.02469825744629, "global_step": 615488, "epoch": 7415} {"train_loss": -28.11383056640625, "global_step": 615489, "epoch": 7415} {"train_loss": -28.367145538330078, "global_step": 615490, "epoch": 7415} {"train_loss": -27.822492599487305, "global_step": 615491, "epoch": 7415} {"train_loss": -28.222610473632812, "global_step": 615492, "epoch": 7415} {"train_loss": -28.140485763549805, "global_step": 615493, "epoch": 7415} {"train_loss": -28.09480857849121, "global_step": 615494, "epoch": 7415} {"train_loss": -28.235031127929688, "global_step": 615495, "epoch": 7415} {"train_loss": -28.052692413330078, "global_step": 615496, "epoch": 7415} {"train_loss": -27.981719970703125, "global_step": 615497, "epoch": 7415} {"train_loss": -28.119129180908203, "global_step": 615498, "epoch": 7415} {"train_loss": -28.16036033630371, "global_step": 615499, "epoch": 7415} {"train_loss": -27.74994468688965, "global_step": 615500, "epoch": 7415} {"train_loss": -27.069467544555664, "global_step": 615501, "epoch": 7415} {"train_loss": -26.0421199798584, "global_step": 615502, "epoch": 7415} {"train_loss": -26.3325138092041, "global_step": 615503, "epoch": 7415} {"train_loss": -26.016082763671875, "global_step": 615504, "epoch": 7415} {"train_loss": -26.991147994995117, "global_step": 615505, "epoch": 7415} {"train_loss": -28.06988525390625, "global_step": 615506, "epoch": 7415} {"train_loss": -27.330961227416992, "global_step": 615507, "epoch": 7415} {"train_loss": -27.804895401000977, "global_step": 615508, "epoch": 7415} {"train_loss": -27.581512451171875, "global_step": 615509, "epoch": 7415} {"train_loss": -27.856552124023438, "global_step": 615510, "epoch": 7415} {"train_loss": -27.825885772705078, "global_step": 615511, "epoch": 7415} {"train_loss": -27.87190818786621, "global_step": 615512, "epoch": 7415} {"train_loss": -27.837970733642578, "global_step": 615513, "epoch": 7415} {"train_loss": -27.937528610229492, "global_step": 615514, "epoch": 7415} {"train_loss": -27.8006649017334, "global_step": 615515, "epoch": 7415} {"train_loss": -27.835235595703125, "global_step": 615516, "epoch": 7415} {"train_loss": -27.765172958374023, "global_step": 615517, "epoch": 7415} {"train_loss": -28.097900390625, "global_step": 615518, "epoch": 7415} {"train_loss": -27.678091049194336, "global_step": 615519, "epoch": 7415} {"train_loss": -28.332183837890625, "global_step": 615520, "epoch": 7415} {"train_loss": -27.946985244750977, "global_step": 615521, "epoch": 7415} {"train_loss": -28.527257919311523, "global_step": 615522, "epoch": 7415} {"train_loss": -27.957427978515625, "global_step": 615523, "epoch": 7415} {"train_loss": -28.047651290893555, "global_step": 615524, "epoch": 7415} {"train_loss": -27.842517852783203, "global_step": 615525, "epoch": 7415} {"train_loss": -28.100549697875977, "global_step": 615526, "epoch": 7415} {"train_loss": -27.838509525161193, "global_step": 615527, "epoch": 7415, "val_loss": 6666274.5} {"train_loss": -27.770599365234375, "global_step": 615528, "epoch": 7416} {"train_loss": -27.745990753173828, "global_step": 615529, "epoch": 7416} {"train_loss": -27.303449630737305, "global_step": 615530, "epoch": 7416} {"train_loss": -27.39934730529785, "global_step": 615531, "epoch": 7416} {"train_loss": -27.6004638671875, "global_step": 615532, "epoch": 7416} {"train_loss": -27.28571128845215, "global_step": 615533, "epoch": 7416} {"train_loss": -27.16182518005371, "global_step": 615534, "epoch": 7416} {"train_loss": -27.722970962524414, "global_step": 615535, "epoch": 7416} {"train_loss": -27.385894775390625, "global_step": 615536, "epoch": 7416} {"train_loss": -27.748172760009766, "global_step": 615537, "epoch": 7416} {"train_loss": -27.735132217407227, "global_step": 615538, "epoch": 7416} {"train_loss": -27.623083114624023, "global_step": 615539, "epoch": 7416} {"train_loss": -27.401779174804688, "global_step": 615540, "epoch": 7416} {"train_loss": -27.766326904296875, "global_step": 615541, "epoch": 7416} {"train_loss": -27.79767417907715, "global_step": 615542, "epoch": 7416} {"train_loss": -27.85725975036621, "global_step": 615543, "epoch": 7416} {"train_loss": -28.06662940979004, "global_step": 615544, "epoch": 7416} {"train_loss": -27.974462509155273, "global_step": 615545, "epoch": 7416} {"train_loss": -27.890165328979492, "global_step": 615546, "epoch": 7416} {"train_loss": -27.927106857299805, "global_step": 615547, "epoch": 7416} {"train_loss": -28.284719467163086, "global_step": 615548, "epoch": 7416} {"train_loss": -27.993818283081055, "global_step": 615549, "epoch": 7416} {"train_loss": -27.92909812927246, "global_step": 615550, "epoch": 7416} {"train_loss": -28.062198638916016, "global_step": 615551, "epoch": 7416} {"train_loss": -28.201313018798828, "global_step": 615552, "epoch": 7416} {"train_loss": -27.700180053710938, "global_step": 615553, "epoch": 7416} {"train_loss": -27.855749130249023, "global_step": 615554, "epoch": 7416} {"train_loss": -28.202136993408203, "global_step": 615555, "epoch": 7416} {"train_loss": -28.16779136657715, "global_step": 615556, "epoch": 7416} {"train_loss": -28.323514938354492, "global_step": 615557, "epoch": 7416} {"train_loss": -28.240583419799805, "global_step": 615558, "epoch": 7416} {"train_loss": -28.12476921081543, "global_step": 615559, "epoch": 7416} {"train_loss": -28.3613224029541, "global_step": 615560, "epoch": 7416} {"train_loss": -28.298511505126953, "global_step": 615561, "epoch": 7416} {"train_loss": -27.998096466064453, "global_step": 615562, "epoch": 7416} {"train_loss": -28.336414337158203, "global_step": 615563, "epoch": 7416} {"train_loss": -28.244281768798828, "global_step": 615564, "epoch": 7416} {"train_loss": -28.72098731994629, "global_step": 615565, "epoch": 7416} {"train_loss": -28.0481014251709, "global_step": 615566, "epoch": 7416} {"train_loss": -28.239398956298828, "global_step": 615567, "epoch": 7416} {"train_loss": -28.2502384185791, "global_step": 615568, "epoch": 7416} {"train_loss": -28.339019775390625, "global_step": 615569, "epoch": 7416} {"train_loss": -28.144575119018555, "global_step": 615570, "epoch": 7416} {"train_loss": -28.61639976501465, "global_step": 615571, "epoch": 7416} {"train_loss": -27.907562255859375, "global_step": 615572, "epoch": 7416} {"train_loss": -28.227161407470703, "global_step": 615573, "epoch": 7416} {"train_loss": -27.996124267578125, "global_step": 615574, "epoch": 7416} {"train_loss": -27.81669044494629, "global_step": 615575, "epoch": 7416} {"train_loss": -27.918609619140625, "global_step": 615576, "epoch": 7416} {"train_loss": -28.168249130249023, "global_step": 615577, "epoch": 7416} {"train_loss": -28.190338134765625, "global_step": 615578, "epoch": 7416} {"train_loss": -28.054044723510742, "global_step": 615579, "epoch": 7416} {"train_loss": -28.18207359313965, "global_step": 615580, "epoch": 7416} {"train_loss": -27.998910903930664, "global_step": 615581, "epoch": 7416} {"train_loss": -28.105682373046875, "global_step": 615582, "epoch": 7416} {"train_loss": -28.06545066833496, "global_step": 615583, "epoch": 7416} {"train_loss": -27.905725479125977, "global_step": 615584, "epoch": 7416} {"train_loss": -28.017074584960938, "global_step": 615585, "epoch": 7416} {"train_loss": -27.88431167602539, "global_step": 615586, "epoch": 7416} {"train_loss": -28.337051391601562, "global_step": 615587, "epoch": 7416} {"train_loss": -28.035552978515625, "global_step": 615588, "epoch": 7416} {"train_loss": -28.32505226135254, "global_step": 615589, "epoch": 7416} {"train_loss": -28.204381942749023, "global_step": 615590, "epoch": 7416} {"train_loss": -28.102243423461914, "global_step": 615591, "epoch": 7416} {"train_loss": -27.973752975463867, "global_step": 615592, "epoch": 7416} {"train_loss": -28.097265243530273, "global_step": 615593, "epoch": 7416} {"train_loss": -28.17146110534668, "global_step": 615594, "epoch": 7416} {"train_loss": -28.3079833984375, "global_step": 615595, "epoch": 7416} {"train_loss": -28.46846580505371, "global_step": 615596, "epoch": 7416} {"train_loss": -28.19696044921875, "global_step": 615597, "epoch": 7416} {"train_loss": -27.604455947875977, "global_step": 615598, "epoch": 7416} {"train_loss": -28.191884994506836, "global_step": 615599, "epoch": 7416} {"train_loss": -27.826841354370117, "global_step": 615600, "epoch": 7416} {"train_loss": -28.65533447265625, "global_step": 615601, "epoch": 7416} {"train_loss": -28.102750778198242, "global_step": 615602, "epoch": 7416} {"train_loss": -28.218297958374023, "global_step": 615603, "epoch": 7416} {"train_loss": -28.43050193786621, "global_step": 615604, "epoch": 7416} {"train_loss": -28.401220321655273, "global_step": 615605, "epoch": 7416} {"train_loss": -27.941465377807617, "global_step": 615606, "epoch": 7416} {"train_loss": -28.312467575073242, "global_step": 615607, "epoch": 7416} {"train_loss": -28.268695831298828, "global_step": 615608, "epoch": 7416} {"train_loss": -28.21295738220215, "global_step": 615609, "epoch": 7416} {"train_loss": -28.038951138415968, "global_step": 615610, "epoch": 7416, "val_loss": 6668549.0} {"train_loss": -27.61429786682129, "global_step": 615611, "epoch": 7417} {"train_loss": -26.2772274017334, "global_step": 615612, "epoch": 7417} {"train_loss": -26.332763671875, "global_step": 615613, "epoch": 7417} {"train_loss": -26.842527389526367, "global_step": 615614, "epoch": 7417} {"train_loss": -27.21881103515625, "global_step": 615615, "epoch": 7417} {"train_loss": -25.76690673828125, "global_step": 615616, "epoch": 7417} {"train_loss": -27.35003089904785, "global_step": 615617, "epoch": 7417} {"train_loss": -27.084537506103516, "global_step": 615618, "epoch": 7417} {"train_loss": -26.38747215270996, "global_step": 615619, "epoch": 7417} {"train_loss": -26.842254638671875, "global_step": 615620, "epoch": 7417} {"train_loss": -27.939117431640625, "global_step": 615621, "epoch": 7417} {"train_loss": -26.95279884338379, "global_step": 615622, "epoch": 7417} {"train_loss": -27.609556198120117, "global_step": 615623, "epoch": 7417} {"train_loss": -27.58741569519043, "global_step": 615624, "epoch": 7417} {"train_loss": -27.676767349243164, "global_step": 615625, "epoch": 7417} {"train_loss": -27.408863067626953, "global_step": 615626, "epoch": 7417} {"train_loss": -27.634733200073242, "global_step": 615627, "epoch": 7417} {"train_loss": -27.52029800415039, "global_step": 615628, "epoch": 7417} {"train_loss": -27.84232521057129, "global_step": 615629, "epoch": 7417} {"train_loss": -27.5548038482666, "global_step": 615630, "epoch": 7417} {"train_loss": -27.696277618408203, "global_step": 615631, "epoch": 7417} {"train_loss": -27.509687423706055, "global_step": 615632, "epoch": 7417} {"train_loss": -28.102497100830078, "global_step": 615633, "epoch": 7417} {"train_loss": -27.64594078063965, "global_step": 615634, "epoch": 7417} {"train_loss": -27.910446166992188, "global_step": 615635, "epoch": 7417} {"train_loss": -27.751453399658203, "global_step": 615636, "epoch": 7417} {"train_loss": -27.49500846862793, "global_step": 615637, "epoch": 7417} {"train_loss": -27.894397735595703, "global_step": 615638, "epoch": 7417} {"train_loss": -27.67311668395996, "global_step": 615639, "epoch": 7417} {"train_loss": -27.959339141845703, "global_step": 615640, "epoch": 7417} {"train_loss": -28.011127471923828, "global_step": 615641, "epoch": 7417} {"train_loss": -28.241382598876953, "global_step": 615642, "epoch": 7417} {"train_loss": -27.99680519104004, "global_step": 615643, "epoch": 7417} {"train_loss": -28.221954345703125, "global_step": 615644, "epoch": 7417} {"train_loss": -28.04669761657715, "global_step": 615645, "epoch": 7417} {"train_loss": -27.944772720336914, "global_step": 615646, "epoch": 7417} {"train_loss": -27.9846248626709, "global_step": 615647, "epoch": 7417} {"train_loss": -28.39303970336914, "global_step": 615648, "epoch": 7417} {"train_loss": -28.03076171875, "global_step": 615649, "epoch": 7417} {"train_loss": -28.10931396484375, "global_step": 615650, "epoch": 7417} {"train_loss": -28.15985107421875, "global_step": 615651, "epoch": 7417} {"train_loss": -28.232501983642578, "global_step": 615652, "epoch": 7417} {"train_loss": -28.165512084960938, "global_step": 615653, "epoch": 7417} {"train_loss": -28.143692016601562, "global_step": 615654, "epoch": 7417} {"train_loss": -28.221893310546875, "global_step": 615655, "epoch": 7417} {"train_loss": -28.524221420288086, "global_step": 615656, "epoch": 7417} {"train_loss": -27.993284225463867, "global_step": 615657, "epoch": 7417} {"train_loss": -28.371000289916992, "global_step": 615658, "epoch": 7417} {"train_loss": -28.214523315429688, "global_step": 615659, "epoch": 7417} {"train_loss": -28.33564567565918, "global_step": 615660, "epoch": 7417} {"train_loss": -28.327301025390625, "global_step": 615661, "epoch": 7417} {"train_loss": -28.67365837097168, "global_step": 615662, "epoch": 7417} {"train_loss": -28.28302001953125, "global_step": 615663, "epoch": 7417} {"train_loss": -28.336999893188477, "global_step": 615664, "epoch": 7417} {"train_loss": -28.60787010192871, "global_step": 615665, "epoch": 7417} {"train_loss": -28.441425323486328, "global_step": 615666, "epoch": 7417} {"train_loss": -28.5814208984375, "global_step": 615667, "epoch": 7417} {"train_loss": -28.21827507019043, "global_step": 615668, "epoch": 7417} {"train_loss": -28.537290573120117, "global_step": 615669, "epoch": 7417} {"train_loss": -28.277379989624023, "global_step": 615670, "epoch": 7417} {"train_loss": -28.239673614501953, "global_step": 615671, "epoch": 7417} {"train_loss": -28.209272384643555, "global_step": 615672, "epoch": 7417} {"train_loss": -28.093591690063477, "global_step": 615673, "epoch": 7417} {"train_loss": -28.614145278930664, "global_step": 615674, "epoch": 7417} {"train_loss": -28.4130916595459, "global_step": 615675, "epoch": 7417} {"train_loss": -28.265531539916992, "global_step": 615676, "epoch": 7417} {"train_loss": -27.772924423217773, "global_step": 615677, "epoch": 7417} {"train_loss": -27.88496971130371, "global_step": 615678, "epoch": 7417} {"train_loss": -27.61048698425293, "global_step": 615679, "epoch": 7417} {"train_loss": -26.387720108032227, "global_step": 615680, "epoch": 7417} {"train_loss": -26.71405029296875, "global_step": 615681, "epoch": 7417} {"train_loss": -27.985265731811523, "global_step": 615682, "epoch": 7417} {"train_loss": -27.59442138671875, "global_step": 615683, "epoch": 7417} {"train_loss": -27.6833553314209, "global_step": 615684, "epoch": 7417} {"train_loss": -27.89752769470215, "global_step": 615685, "epoch": 7417} {"train_loss": -28.127185821533203, "global_step": 615686, "epoch": 7417} {"train_loss": -27.59518814086914, "global_step": 615687, "epoch": 7417} {"train_loss": -27.646320343017578, "global_step": 615688, "epoch": 7417} {"train_loss": -27.615325927734375, "global_step": 615689, "epoch": 7417} {"train_loss": -27.997425079345703, "global_step": 615690, "epoch": 7417} {"train_loss": -27.8270263671875, "global_step": 615691, "epoch": 7417} {"train_loss": -27.752050399780273, "global_step": 615692, "epoch": 7417} {"train_loss": -27.803967717182207, "global_step": 615693, "epoch": 7417, "val_loss": 6623452.5} {"train_loss": -27.434850692749023, "global_step": 615694, "epoch": 7418} {"train_loss": -28.01909828186035, "global_step": 615695, "epoch": 7418} {"train_loss": -26.769556045532227, "global_step": 615696, "epoch": 7418} {"train_loss": -27.15802001953125, "global_step": 615697, "epoch": 7418} {"train_loss": -26.71945571899414, "global_step": 615698, "epoch": 7418} {"train_loss": -26.653045654296875, "global_step": 615699, "epoch": 7418} {"train_loss": -27.030139923095703, "global_step": 615700, "epoch": 7418} {"train_loss": -27.279855728149414, "global_step": 615701, "epoch": 7418} {"train_loss": -27.03023338317871, "global_step": 615702, "epoch": 7418} {"train_loss": -26.992069244384766, "global_step": 615703, "epoch": 7418} {"train_loss": -27.26056480407715, "global_step": 615704, "epoch": 7418} {"train_loss": -27.481657028198242, "global_step": 615705, "epoch": 7418} {"train_loss": -27.43484878540039, "global_step": 615706, "epoch": 7418} {"train_loss": -27.50042152404785, "global_step": 615707, "epoch": 7418} {"train_loss": -27.384429931640625, "global_step": 615708, "epoch": 7418} {"train_loss": -27.830469131469727, "global_step": 615709, "epoch": 7418} {"train_loss": -27.257211685180664, "global_step": 615710, "epoch": 7418} {"train_loss": -27.373178482055664, "global_step": 615711, "epoch": 7418} {"train_loss": -27.612960815429688, "global_step": 615712, "epoch": 7418} {"train_loss": -27.715484619140625, "global_step": 615713, "epoch": 7418} {"train_loss": -27.924924850463867, "global_step": 615714, "epoch": 7418} {"train_loss": -27.7109317779541, "global_step": 615715, "epoch": 7418} {"train_loss": -27.43487548828125, "global_step": 615716, "epoch": 7418} {"train_loss": -27.83051109313965, "global_step": 615717, "epoch": 7418} {"train_loss": -27.826913833618164, "global_step": 615718, "epoch": 7418} {"train_loss": -27.69989013671875, "global_step": 615719, "epoch": 7418} {"train_loss": -28.050582885742188, "global_step": 615720, "epoch": 7418} {"train_loss": -28.002256393432617, "global_step": 615721, "epoch": 7418} {"train_loss": -27.954498291015625, "global_step": 615722, "epoch": 7418} {"train_loss": -28.067123413085938, "global_step": 615723, "epoch": 7418} {"train_loss": -27.480451583862305, "global_step": 615724, "epoch": 7418} {"train_loss": -28.169757843017578, "global_step": 615725, "epoch": 7418} {"train_loss": -28.101444244384766, "global_step": 615726, "epoch": 7418} {"train_loss": -28.014408111572266, "global_step": 615727, "epoch": 7418} {"train_loss": -28.058944702148438, "global_step": 615728, "epoch": 7418} {"train_loss": -27.871124267578125, "global_step": 615729, "epoch": 7418} {"train_loss": -27.827529907226562, "global_step": 615730, "epoch": 7418} {"train_loss": -28.47871208190918, "global_step": 615731, "epoch": 7418} {"train_loss": -28.100448608398438, "global_step": 615732, "epoch": 7418} {"train_loss": -28.264501571655273, "global_step": 615733, "epoch": 7418} {"train_loss": -28.45838737487793, "global_step": 615734, "epoch": 7418} {"train_loss": -28.0499324798584, "global_step": 615735, "epoch": 7418} {"train_loss": -28.36292839050293, "global_step": 615736, "epoch": 7418} {"train_loss": -28.28157615661621, "global_step": 615737, "epoch": 7418} {"train_loss": -28.30048179626465, "global_step": 615738, "epoch": 7418} {"train_loss": -28.09897232055664, "global_step": 615739, "epoch": 7418} {"train_loss": -28.209402084350586, "global_step": 615740, "epoch": 7418} {"train_loss": -28.26173210144043, "global_step": 615741, "epoch": 7418} {"train_loss": -28.14420509338379, "global_step": 615742, "epoch": 7418} {"train_loss": -28.526609420776367, "global_step": 615743, "epoch": 7418} {"train_loss": -28.267364501953125, "global_step": 615744, "epoch": 7418} {"train_loss": -28.318647384643555, "global_step": 615745, "epoch": 7418} {"train_loss": -28.6083927154541, "global_step": 615746, "epoch": 7418} {"train_loss": -28.562686920166016, "global_step": 615747, "epoch": 7418} {"train_loss": -28.0041561126709, "global_step": 615748, "epoch": 7418} {"train_loss": -28.487659454345703, "global_step": 615749, "epoch": 7418} {"train_loss": -28.19125747680664, "global_step": 615750, "epoch": 7418} {"train_loss": -27.888553619384766, "global_step": 615751, "epoch": 7418} {"train_loss": -28.4091796875, "global_step": 615752, "epoch": 7418} {"train_loss": -27.785083770751953, "global_step": 615753, "epoch": 7418} {"train_loss": -28.47223472595215, "global_step": 615754, "epoch": 7418} {"train_loss": -27.855127334594727, "global_step": 615755, "epoch": 7418} {"train_loss": -28.642383575439453, "global_step": 615756, "epoch": 7418} {"train_loss": -28.509201049804688, "global_step": 615757, "epoch": 7418} {"train_loss": -28.337167739868164, "global_step": 615758, "epoch": 7418} {"train_loss": -28.402936935424805, "global_step": 615759, "epoch": 7418} {"train_loss": -28.3054256439209, "global_step": 615760, "epoch": 7418} {"train_loss": -28.185760498046875, "global_step": 615761, "epoch": 7418} {"train_loss": -27.71392250061035, "global_step": 615762, "epoch": 7418} {"train_loss": -27.556259155273438, "global_step": 615763, "epoch": 7418} {"train_loss": -28.079923629760742, "global_step": 615764, "epoch": 7418} {"train_loss": -28.226099014282227, "global_step": 615765, "epoch": 7418} {"train_loss": -28.015384674072266, "global_step": 615766, "epoch": 7418} {"train_loss": -28.048385620117188, "global_step": 615767, "epoch": 7418} {"train_loss": -28.293750762939453, "global_step": 615768, "epoch": 7418} {"train_loss": -28.318450927734375, "global_step": 615769, "epoch": 7418} {"train_loss": -27.809289932250977, "global_step": 615770, "epoch": 7418} {"train_loss": -28.0234432220459, "global_step": 615771, "epoch": 7418} {"train_loss": -28.36103630065918, "global_step": 615772, "epoch": 7418} {"train_loss": -28.424976348876953, "global_step": 615773, "epoch": 7418} {"train_loss": -28.576120376586914, "global_step": 615774, "epoch": 7418} {"train_loss": -28.119775772094727, "global_step": 615775, "epoch": 7418} {"train_loss": -27.92551504847515, "global_step": 615776, "epoch": 7418, "val_loss": 6687188.0} {"train_loss": -26.840167999267578, "global_step": 615777, "epoch": 7419} {"train_loss": -27.05303955078125, "global_step": 615778, "epoch": 7419} {"train_loss": -26.84456443786621, "global_step": 615779, "epoch": 7419} {"train_loss": -26.2434024810791, "global_step": 615780, "epoch": 7419} {"train_loss": -26.859375, "global_step": 615781, "epoch": 7419} {"train_loss": -27.3465633392334, "global_step": 615782, "epoch": 7419} {"train_loss": -27.839141845703125, "global_step": 615783, "epoch": 7419} {"train_loss": -26.683135986328125, "global_step": 615784, "epoch": 7419} {"train_loss": -27.40675926208496, "global_step": 615785, "epoch": 7419} {"train_loss": -27.49151611328125, "global_step": 615786, "epoch": 7419} {"train_loss": -27.51295280456543, "global_step": 615787, "epoch": 7419} {"train_loss": -27.247278213500977, "global_step": 615788, "epoch": 7419} {"train_loss": -27.9150333404541, "global_step": 615789, "epoch": 7419} {"train_loss": -26.87727928161621, "global_step": 615790, "epoch": 7419} {"train_loss": -27.60931968688965, "global_step": 615791, "epoch": 7419} {"train_loss": -27.953704833984375, "global_step": 615792, "epoch": 7419} {"train_loss": -27.544702529907227, "global_step": 615793, "epoch": 7419} {"train_loss": -27.66361427307129, "global_step": 615794, "epoch": 7419} {"train_loss": -27.6085205078125, "global_step": 615795, "epoch": 7419} {"train_loss": -27.94772720336914, "global_step": 615796, "epoch": 7419} {"train_loss": -27.95086097717285, "global_step": 615797, "epoch": 7419} {"train_loss": -28.207569122314453, "global_step": 615798, "epoch": 7419} {"train_loss": -27.518625259399414, "global_step": 615799, "epoch": 7419} {"train_loss": -28.246320724487305, "global_step": 615800, "epoch": 7419} {"train_loss": -28.084482192993164, "global_step": 615801, "epoch": 7419} {"train_loss": -27.66849708557129, "global_step": 615802, "epoch": 7419} {"train_loss": -28.053327560424805, "global_step": 615803, "epoch": 7419} {"train_loss": -28.062829971313477, "global_step": 615804, "epoch": 7419} {"train_loss": -27.837305068969727, "global_step": 615805, "epoch": 7419} {"train_loss": -27.56488037109375, "global_step": 615806, "epoch": 7419} {"train_loss": -27.9875431060791, "global_step": 615807, "epoch": 7419} {"train_loss": -28.136518478393555, "global_step": 615808, "epoch": 7419} {"train_loss": -28.026611328125, "global_step": 615809, "epoch": 7419} {"train_loss": -28.2658748626709, "global_step": 615810, "epoch": 7419} {"train_loss": -27.8876953125, "global_step": 615811, "epoch": 7419} {"train_loss": -28.0026798248291, "global_step": 615812, "epoch": 7419} {"train_loss": -28.318876266479492, "global_step": 615813, "epoch": 7419} {"train_loss": -28.131311416625977, "global_step": 615814, "epoch": 7419} {"train_loss": -28.2567195892334, "global_step": 615815, "epoch": 7419} {"train_loss": -28.24688148498535, "global_step": 615816, "epoch": 7419} {"train_loss": -27.784107208251953, "global_step": 615817, "epoch": 7419} {"train_loss": -28.38071632385254, "global_step": 615818, "epoch": 7419} {"train_loss": -28.100265502929688, "global_step": 615819, "epoch": 7419} {"train_loss": -28.585432052612305, "global_step": 615820, "epoch": 7419} {"train_loss": -27.69584083557129, "global_step": 615821, "epoch": 7419} {"train_loss": -28.15589714050293, "global_step": 615822, "epoch": 7419} {"train_loss": -28.73247718811035, "global_step": 615823, "epoch": 7419} {"train_loss": -28.255395889282227, "global_step": 615824, "epoch": 7419} {"train_loss": -28.37806510925293, "global_step": 615825, "epoch": 7419} {"train_loss": -28.433095932006836, "global_step": 615826, "epoch": 7419} {"train_loss": -27.9453125, "global_step": 615827, "epoch": 7419} {"train_loss": -28.349084854125977, "global_step": 615828, "epoch": 7419} {"train_loss": -28.44451904296875, "global_step": 615829, "epoch": 7419} {"train_loss": -28.200016021728516, "global_step": 615830, "epoch": 7419} {"train_loss": -28.204029083251953, "global_step": 615831, "epoch": 7419} {"train_loss": -28.399778366088867, "global_step": 615832, "epoch": 7419} {"train_loss": -27.947113037109375, "global_step": 615833, "epoch": 7419} {"train_loss": -28.288496017456055, "global_step": 615834, "epoch": 7419} {"train_loss": -28.45586585998535, "global_step": 615835, "epoch": 7419} {"train_loss": -27.707218170166016, "global_step": 615836, "epoch": 7419} {"train_loss": -27.924972534179688, "global_step": 615837, "epoch": 7419} {"train_loss": -28.014392852783203, "global_step": 615838, "epoch": 7419} {"train_loss": -28.21257972717285, "global_step": 615839, "epoch": 7419} {"train_loss": -28.136083602905273, "global_step": 615840, "epoch": 7419} {"train_loss": -28.031641006469727, "global_step": 615841, "epoch": 7419} {"train_loss": -28.058212280273438, "global_step": 615842, "epoch": 7419} {"train_loss": -28.31318473815918, "global_step": 615843, "epoch": 7419} {"train_loss": -27.803823471069336, "global_step": 615844, "epoch": 7419} {"train_loss": -28.165271759033203, "global_step": 615845, "epoch": 7419} {"train_loss": -27.734472274780273, "global_step": 615846, "epoch": 7419} {"train_loss": -28.522796630859375, "global_step": 615847, "epoch": 7419} {"train_loss": -27.761423110961914, "global_step": 615848, "epoch": 7419} {"train_loss": -27.366077423095703, "global_step": 615849, "epoch": 7419} {"train_loss": -26.369375228881836, "global_step": 615850, "epoch": 7419} {"train_loss": -27.176950454711914, "global_step": 615851, "epoch": 7419} {"train_loss": -28.075998306274414, "global_step": 615852, "epoch": 7419} {"train_loss": -27.38633155822754, "global_step": 615853, "epoch": 7419} {"train_loss": -27.399646759033203, "global_step": 615854, "epoch": 7419} {"train_loss": -27.480539321899414, "global_step": 615855, "epoch": 7419} {"train_loss": -27.51165199279785, "global_step": 615856, "epoch": 7419} {"train_loss": -27.681015014648438, "global_step": 615857, "epoch": 7419} {"train_loss": -27.363880157470703, "global_step": 615858, "epoch": 7419} {"train_loss": -27.817958647946277, "global_step": 615859, "epoch": 7419, "val_loss": 6735800.0} {"train_loss": -26.823715209960938, "global_step": 615860, "epoch": 7420} {"train_loss": -26.0721492767334, "global_step": 615861, "epoch": 7420} {"train_loss": -26.496747970581055, "global_step": 615862, "epoch": 7420} {"train_loss": -26.5198917388916, "global_step": 615863, "epoch": 7420} {"train_loss": -27.214689254760742, "global_step": 615864, "epoch": 7420} {"train_loss": -26.92010498046875, "global_step": 615865, "epoch": 7420} {"train_loss": -27.43804931640625, "global_step": 615866, "epoch": 7420} {"train_loss": -27.095783233642578, "global_step": 615867, "epoch": 7420} {"train_loss": -27.415796279907227, "global_step": 615868, "epoch": 7420} {"train_loss": -27.387136459350586, "global_step": 615869, "epoch": 7420} {"train_loss": -27.438220977783203, "global_step": 615870, "epoch": 7420} {"train_loss": -27.2363224029541, "global_step": 615871, "epoch": 7420} {"train_loss": -27.74403190612793, "global_step": 615872, "epoch": 7420} {"train_loss": -27.315475463867188, "global_step": 615873, "epoch": 7420} {"train_loss": -27.77530288696289, "global_step": 615874, "epoch": 7420} {"train_loss": -27.2523193359375, "global_step": 615875, "epoch": 7420} {"train_loss": -27.562347412109375, "global_step": 615876, "epoch": 7420} {"train_loss": -27.774978637695312, "global_step": 615877, "epoch": 7420} {"train_loss": -27.65055274963379, "global_step": 615878, "epoch": 7420} {"train_loss": -27.237512588500977, "global_step": 615879, "epoch": 7420} {"train_loss": -27.67887306213379, "global_step": 615880, "epoch": 7420} {"train_loss": -27.796674728393555, "global_step": 615881, "epoch": 7420} {"train_loss": -27.540700912475586, "global_step": 615882, "epoch": 7420} {"train_loss": -27.765417098999023, "global_step": 615883, "epoch": 7420} {"train_loss": -27.95696449279785, "global_step": 615884, "epoch": 7420} {"train_loss": -28.098535537719727, "global_step": 615885, "epoch": 7420} {"train_loss": -27.73414421081543, "global_step": 615886, "epoch": 7420} {"train_loss": -27.78668785095215, "global_step": 615887, "epoch": 7420} {"train_loss": -28.012332916259766, "global_step": 615888, "epoch": 7420} {"train_loss": -27.981433868408203, "global_step": 615889, "epoch": 7420} {"train_loss": -28.070707321166992, "global_step": 615890, "epoch": 7420} {"train_loss": -28.130390167236328, "global_step": 615891, "epoch": 7420} {"train_loss": -28.012121200561523, "global_step": 615892, "epoch": 7420} {"train_loss": -28.20685386657715, "global_step": 615893, "epoch": 7420} {"train_loss": -27.8682804107666, "global_step": 615894, "epoch": 7420} {"train_loss": -28.208707809448242, "global_step": 615895, "epoch": 7420} {"train_loss": -28.254159927368164, "global_step": 615896, "epoch": 7420} {"train_loss": -28.627334594726562, "global_step": 615897, "epoch": 7420} {"train_loss": -27.975921630859375, "global_step": 615898, "epoch": 7420} {"train_loss": -27.83349609375, "global_step": 615899, "epoch": 7420} {"train_loss": -28.124113082885742, "global_step": 615900, "epoch": 7420} {"train_loss": -28.04306983947754, "global_step": 615901, "epoch": 7420} {"train_loss": -28.134723663330078, "global_step": 615902, "epoch": 7420} {"train_loss": -28.326171875, "global_step": 615903, "epoch": 7420} {"train_loss": -28.1215877532959, "global_step": 615904, "epoch": 7420} {"train_loss": -28.069059371948242, "global_step": 615905, "epoch": 7420} {"train_loss": -28.165327072143555, "global_step": 615906, "epoch": 7420} {"train_loss": -28.327436447143555, "global_step": 615907, "epoch": 7420} {"train_loss": -28.242246627807617, "global_step": 615908, "epoch": 7420} {"train_loss": -28.200210571289062, "global_step": 615909, "epoch": 7420} {"train_loss": -28.257917404174805, "global_step": 615910, "epoch": 7420} {"train_loss": -28.435163497924805, "global_step": 615911, "epoch": 7420} {"train_loss": -28.22254753112793, "global_step": 615912, "epoch": 7420} {"train_loss": -28.403533935546875, "global_step": 615913, "epoch": 7420} {"train_loss": -28.522558212280273, "global_step": 615914, "epoch": 7420} {"train_loss": -28.0885009765625, "global_step": 615915, "epoch": 7420} {"train_loss": -28.239139556884766, "global_step": 615916, "epoch": 7420} {"train_loss": -28.218236923217773, "global_step": 615917, "epoch": 7420} {"train_loss": -28.247934341430664, "global_step": 615918, "epoch": 7420} {"train_loss": -28.23291015625, "global_step": 615919, "epoch": 7420} {"train_loss": -28.108983993530273, "global_step": 615920, "epoch": 7420} {"train_loss": -27.907154083251953, "global_step": 615921, "epoch": 7420} {"train_loss": -28.095006942749023, "global_step": 615922, "epoch": 7420} {"train_loss": -28.1480655670166, "global_step": 615923, "epoch": 7420} {"train_loss": -28.091840744018555, "global_step": 615924, "epoch": 7420} {"train_loss": -28.045713424682617, "global_step": 615925, "epoch": 7420} {"train_loss": -27.7708740234375, "global_step": 615926, "epoch": 7420} {"train_loss": -28.466089248657227, "global_step": 615927, "epoch": 7420} {"train_loss": -28.39093017578125, "global_step": 615928, "epoch": 7420} {"train_loss": -27.906482696533203, "global_step": 615929, "epoch": 7420} {"train_loss": -28.1353759765625, "global_step": 615930, "epoch": 7420} {"train_loss": -27.404266357421875, "global_step": 615931, "epoch": 7420} {"train_loss": -27.455677032470703, "global_step": 615932, "epoch": 7420} {"train_loss": -28.07301902770996, "global_step": 615933, "epoch": 7420} {"train_loss": -28.11393165588379, "global_step": 615934, "epoch": 7420} {"train_loss": -28.154401779174805, "global_step": 615935, "epoch": 7420} {"train_loss": -27.911352157592773, "global_step": 615936, "epoch": 7420} {"train_loss": -27.6716251373291, "global_step": 615937, "epoch": 7420} {"train_loss": -27.813074111938477, "global_step": 615938, "epoch": 7420} {"train_loss": -27.74481773376465, "global_step": 615939, "epoch": 7420} {"train_loss": -28.046777725219727, "global_step": 615940, "epoch": 7420} {"train_loss": -28.02369499206543, "global_step": 615941, "epoch": 7420} {"train_loss": -27.862489608396967, "global_step": 615942, "epoch": 7420, "val_loss": 6636904.5} {"train_loss": -26.318897247314453, "global_step": 615943, "epoch": 7421} {"train_loss": -26.769773483276367, "global_step": 615944, "epoch": 7421} {"train_loss": -25.60821533203125, "global_step": 615945, "epoch": 7421} {"train_loss": -27.1112003326416, "global_step": 615946, "epoch": 7421} {"train_loss": -26.124576568603516, "global_step": 615947, "epoch": 7421} {"train_loss": -26.63299560546875, "global_step": 615948, "epoch": 7421} {"train_loss": -26.38992691040039, "global_step": 615949, "epoch": 7421} {"train_loss": -27.20318031311035, "global_step": 615950, "epoch": 7421} {"train_loss": -26.653100967407227, "global_step": 615951, "epoch": 7421} {"train_loss": -26.693359375, "global_step": 615952, "epoch": 7421} {"train_loss": -27.098108291625977, "global_step": 615953, "epoch": 7421} {"train_loss": -26.876667022705078, "global_step": 615954, "epoch": 7421} {"train_loss": -26.733295440673828, "global_step": 615955, "epoch": 7421} {"train_loss": -27.092437744140625, "global_step": 615956, "epoch": 7421} {"train_loss": -27.213071823120117, "global_step": 615957, "epoch": 7421} {"train_loss": -26.9981746673584, "global_step": 615958, "epoch": 7421} {"train_loss": -27.10271644592285, "global_step": 615959, "epoch": 7421} {"train_loss": -27.150115966796875, "global_step": 615960, "epoch": 7421} {"train_loss": -27.20069694519043, "global_step": 615961, "epoch": 7421} {"train_loss": -27.165603637695312, "global_step": 615962, "epoch": 7421} {"train_loss": -27.092395782470703, "global_step": 615963, "epoch": 7421} {"train_loss": -27.560094833374023, "global_step": 615964, "epoch": 7421} {"train_loss": -27.338180541992188, "global_step": 615965, "epoch": 7421} {"train_loss": -27.48870849609375, "global_step": 615966, "epoch": 7421} {"train_loss": -27.508697509765625, "global_step": 615967, "epoch": 7421} {"train_loss": -27.4595890045166, "global_step": 615968, "epoch": 7421} {"train_loss": -27.616392135620117, "global_step": 615969, "epoch": 7421} {"train_loss": -27.373998641967773, "global_step": 615970, "epoch": 7421} {"train_loss": -27.78577995300293, "global_step": 615971, "epoch": 7421} {"train_loss": -27.753610610961914, "global_step": 615972, "epoch": 7421} {"train_loss": -27.747318267822266, "global_step": 615973, "epoch": 7421} {"train_loss": -27.869916915893555, "global_step": 615974, "epoch": 7421} {"train_loss": -27.76296043395996, "global_step": 615975, "epoch": 7421} {"train_loss": -28.18812370300293, "global_step": 615976, "epoch": 7421} {"train_loss": -27.904218673706055, "global_step": 615977, "epoch": 7421} {"train_loss": -27.750425338745117, "global_step": 615978, "epoch": 7421} {"train_loss": -27.761096954345703, "global_step": 615979, "epoch": 7421} {"train_loss": -27.7844181060791, "global_step": 615980, "epoch": 7421} {"train_loss": -27.92389488220215, "global_step": 615981, "epoch": 7421} {"train_loss": -28.302810668945312, "global_step": 615982, "epoch": 7421} {"train_loss": -28.297895431518555, "global_step": 615983, "epoch": 7421} {"train_loss": -28.205982208251953, "global_step": 615984, "epoch": 7421} {"train_loss": -28.280759811401367, "global_step": 615985, "epoch": 7421} {"train_loss": -27.77630615234375, "global_step": 615986, "epoch": 7421} {"train_loss": -28.037311553955078, "global_step": 615987, "epoch": 7421} {"train_loss": -28.269742965698242, "global_step": 615988, "epoch": 7421} {"train_loss": -28.16117286682129, "global_step": 615989, "epoch": 7421} {"train_loss": -28.367773056030273, "global_step": 615990, "epoch": 7421} {"train_loss": -28.28204345703125, "global_step": 615991, "epoch": 7421} {"train_loss": -28.583337783813477, "global_step": 615992, "epoch": 7421} {"train_loss": -28.797122955322266, "global_step": 615993, "epoch": 7421} {"train_loss": -27.751615524291992, "global_step": 615994, "epoch": 7421} {"train_loss": -28.302682876586914, "global_step": 615995, "epoch": 7421} {"train_loss": -28.0247802734375, "global_step": 615996, "epoch": 7421} {"train_loss": -28.285741806030273, "global_step": 615997, "epoch": 7421} {"train_loss": -28.470205307006836, "global_step": 615998, "epoch": 7421} {"train_loss": -28.39666175842285, "global_step": 615999, "epoch": 7421} {"train_loss": -28.432926177978516, "global_step": 616000, "epoch": 7421} {"train_loss": -28.02446937561035, "global_step": 616001, "epoch": 7421} {"train_loss": -28.197919845581055, "global_step": 616002, "epoch": 7421} {"train_loss": -28.229345321655273, "global_step": 616003, "epoch": 7421} {"train_loss": -28.384262084960938, "global_step": 616004, "epoch": 7421} {"train_loss": -28.449506759643555, "global_step": 616005, "epoch": 7421} {"train_loss": -28.32439613342285, "global_step": 616006, "epoch": 7421} {"train_loss": -28.453351974487305, "global_step": 616007, "epoch": 7421} {"train_loss": -28.0570125579834, "global_step": 616008, "epoch": 7421} {"train_loss": -28.304126739501953, "global_step": 616009, "epoch": 7421} {"train_loss": -28.085355758666992, "global_step": 616010, "epoch": 7421} {"train_loss": -28.27747917175293, "global_step": 616011, "epoch": 7421} {"train_loss": -28.18267250061035, "global_step": 616012, "epoch": 7421} {"train_loss": -28.05496597290039, "global_step": 616013, "epoch": 7421} {"train_loss": -27.866769790649414, "global_step": 616014, "epoch": 7421} {"train_loss": -26.703800201416016, "global_step": 616015, "epoch": 7421} {"train_loss": -25.81035804748535, "global_step": 616016, "epoch": 7421} {"train_loss": -26.188322067260742, "global_step": 616017, "epoch": 7421} {"train_loss": -27.903640747070312, "global_step": 616018, "epoch": 7421} {"train_loss": -27.7053279876709, "global_step": 616019, "epoch": 7421} {"train_loss": -27.6374454498291, "global_step": 616020, "epoch": 7421} {"train_loss": -27.977954864501953, "global_step": 616021, "epoch": 7421} {"train_loss": -27.26593017578125, "global_step": 616022, "epoch": 7421} {"train_loss": -27.866918563842773, "global_step": 616023, "epoch": 7421} {"train_loss": -27.552988052368164, "global_step": 616024, "epoch": 7421} {"train_loss": -27.649201289716974, "global_step": 616025, "epoch": 7421, "val_loss": 6629866.0} {"train_loss": -26.741750717163086, "global_step": 616026, "epoch": 7422} {"train_loss": -27.022403717041016, "global_step": 616027, "epoch": 7422} {"train_loss": -27.17341423034668, "global_step": 616028, "epoch": 7422} {"train_loss": -27.198230743408203, "global_step": 616029, "epoch": 7422} {"train_loss": -27.807397842407227, "global_step": 616030, "epoch": 7422} {"train_loss": -27.318866729736328, "global_step": 616031, "epoch": 7422} {"train_loss": -27.62314224243164, "global_step": 616032, "epoch": 7422} {"train_loss": -27.383838653564453, "global_step": 616033, "epoch": 7422} {"train_loss": -27.43116569519043, "global_step": 616034, "epoch": 7422} {"train_loss": -27.429086685180664, "global_step": 616035, "epoch": 7422} {"train_loss": -27.60231590270996, "global_step": 616036, "epoch": 7422} {"train_loss": -27.186147689819336, "global_step": 616037, "epoch": 7422} {"train_loss": -27.60664176940918, "global_step": 616038, "epoch": 7422} {"train_loss": -28.111623764038086, "global_step": 616039, "epoch": 7422} {"train_loss": -27.6148624420166, "global_step": 616040, "epoch": 7422} {"train_loss": -27.916980743408203, "global_step": 616041, "epoch": 7422} {"train_loss": -27.433673858642578, "global_step": 616042, "epoch": 7422} {"train_loss": -27.473058700561523, "global_step": 616043, "epoch": 7422} {"train_loss": -27.585693359375, "global_step": 616044, "epoch": 7422} {"train_loss": -27.666854858398438, "global_step": 616045, "epoch": 7422} {"train_loss": -27.431716918945312, "global_step": 616046, "epoch": 7422} {"train_loss": -27.839365005493164, "global_step": 616047, "epoch": 7422} {"train_loss": -27.93878746032715, "global_step": 616048, "epoch": 7422} {"train_loss": -28.172842025756836, "global_step": 616049, "epoch": 7422} {"train_loss": -27.615514755249023, "global_step": 616050, "epoch": 7422} {"train_loss": -27.88519859313965, "global_step": 616051, "epoch": 7422} {"train_loss": -27.906112670898438, "global_step": 616052, "epoch": 7422} {"train_loss": -27.75689697265625, "global_step": 616053, "epoch": 7422} {"train_loss": -28.03238296508789, "global_step": 616054, "epoch": 7422} {"train_loss": -28.03702163696289, "global_step": 616055, "epoch": 7422} {"train_loss": -27.75726890563965, "global_step": 616056, "epoch": 7422} {"train_loss": -27.92557716369629, "global_step": 616057, "epoch": 7422} {"train_loss": -27.765607833862305, "global_step": 616058, "epoch": 7422} {"train_loss": -28.150922775268555, "global_step": 616059, "epoch": 7422} {"train_loss": -28.155698776245117, "global_step": 616060, "epoch": 7422} {"train_loss": -28.21746253967285, "global_step": 616061, "epoch": 7422} {"train_loss": -27.795642852783203, "global_step": 616062, "epoch": 7422} {"train_loss": -28.18202018737793, "global_step": 616063, "epoch": 7422} {"train_loss": -28.253082275390625, "global_step": 616064, "epoch": 7422} {"train_loss": -27.88966178894043, "global_step": 616065, "epoch": 7422} {"train_loss": -27.885141372680664, "global_step": 616066, "epoch": 7422} {"train_loss": -28.579198837280273, "global_step": 616067, "epoch": 7422} {"train_loss": -28.27121353149414, "global_step": 616068, "epoch": 7422} {"train_loss": -28.615880966186523, "global_step": 616069, "epoch": 7422} {"train_loss": -28.071218490600586, "global_step": 616070, "epoch": 7422} {"train_loss": -28.22736167907715, "global_step": 616071, "epoch": 7422} {"train_loss": -28.232187271118164, "global_step": 616072, "epoch": 7422} {"train_loss": -28.187015533447266, "global_step": 616073, "epoch": 7422} {"train_loss": -28.279699325561523, "global_step": 616074, "epoch": 7422} {"train_loss": -28.42396354675293, "global_step": 616075, "epoch": 7422} {"train_loss": -28.144800186157227, "global_step": 616076, "epoch": 7422} {"train_loss": -28.525806427001953, "global_step": 616077, "epoch": 7422} {"train_loss": -28.399877548217773, "global_step": 616078, "epoch": 7422} {"train_loss": -28.193700790405273, "global_step": 616079, "epoch": 7422} {"train_loss": -28.4408016204834, "global_step": 616080, "epoch": 7422} {"train_loss": -28.211423873901367, "global_step": 616081, "epoch": 7422} {"train_loss": -28.138687133789062, "global_step": 616082, "epoch": 7422} {"train_loss": -27.69063377380371, "global_step": 616083, "epoch": 7422} {"train_loss": -27.95111083984375, "global_step": 616084, "epoch": 7422} {"train_loss": -28.220773696899414, "global_step": 616085, "epoch": 7422} {"train_loss": -28.233854293823242, "global_step": 616086, "epoch": 7422} {"train_loss": -28.157419204711914, "global_step": 616087, "epoch": 7422} {"train_loss": -28.194812774658203, "global_step": 616088, "epoch": 7422} {"train_loss": -27.945337295532227, "global_step": 616089, "epoch": 7422} {"train_loss": -28.311426162719727, "global_step": 616090, "epoch": 7422} {"train_loss": -27.942123413085938, "global_step": 616091, "epoch": 7422} {"train_loss": -28.041980743408203, "global_step": 616092, "epoch": 7422} {"train_loss": -28.17738914489746, "global_step": 616093, "epoch": 7422} {"train_loss": -28.187353134155273, "global_step": 616094, "epoch": 7422} {"train_loss": -28.02345848083496, "global_step": 616095, "epoch": 7422} {"train_loss": -27.992773056030273, "global_step": 616096, "epoch": 7422} {"train_loss": -28.0839900970459, "global_step": 616097, "epoch": 7422} {"train_loss": -28.221820831298828, "global_step": 616098, "epoch": 7422} {"train_loss": -28.347803115844727, "global_step": 616099, "epoch": 7422} {"train_loss": -28.505538940429688, "global_step": 616100, "epoch": 7422} {"train_loss": -28.141027450561523, "global_step": 616101, "epoch": 7422} {"train_loss": -28.064550399780273, "global_step": 616102, "epoch": 7422} {"train_loss": -27.903913497924805, "global_step": 616103, "epoch": 7422} {"train_loss": -28.103439331054688, "global_step": 616104, "epoch": 7422} {"train_loss": -27.64151382446289, "global_step": 616105, "epoch": 7422} {"train_loss": -27.79559326171875, "global_step": 616106, "epoch": 7422} {"train_loss": -28.18391227722168, "global_step": 616107, "epoch": 7422} {"train_loss": -27.950280844447125, "global_step": 616108, "epoch": 7422, "val_loss": 6592166.5} {"train_loss": -26.637365341186523, "global_step": 616109, "epoch": 7423} {"train_loss": -26.960424423217773, "global_step": 616110, "epoch": 7423} {"train_loss": -26.66766929626465, "global_step": 616111, "epoch": 7423} {"train_loss": -27.056690216064453, "global_step": 616112, "epoch": 7423} {"train_loss": -27.3909912109375, "global_step": 616113, "epoch": 7423} {"train_loss": -26.912799835205078, "global_step": 616114, "epoch": 7423} {"train_loss": -27.557886123657227, "global_step": 616115, "epoch": 7423} {"train_loss": -27.262800216674805, "global_step": 616116, "epoch": 7423} {"train_loss": -27.327728271484375, "global_step": 616117, "epoch": 7423} {"train_loss": -27.293415069580078, "global_step": 616118, "epoch": 7423} {"train_loss": -27.24203872680664, "global_step": 616119, "epoch": 7423} {"train_loss": -27.341909408569336, "global_step": 616120, "epoch": 7423} {"train_loss": -27.268415451049805, "global_step": 616121, "epoch": 7423} {"train_loss": -27.574756622314453, "global_step": 616122, "epoch": 7423} {"train_loss": -27.596817016601562, "global_step": 616123, "epoch": 7423} {"train_loss": -27.328460693359375, "global_step": 616124, "epoch": 7423} {"train_loss": -27.88237953186035, "global_step": 616125, "epoch": 7423} {"train_loss": -27.403600692749023, "global_step": 616126, "epoch": 7423} {"train_loss": -27.105321884155273, "global_step": 616127, "epoch": 7423} {"train_loss": -27.763141632080078, "global_step": 616128, "epoch": 7423} {"train_loss": -27.700376510620117, "global_step": 616129, "epoch": 7423} {"train_loss": -27.586252212524414, "global_step": 616130, "epoch": 7423} {"train_loss": -28.243616104125977, "global_step": 616131, "epoch": 7423} {"train_loss": -27.776874542236328, "global_step": 616132, "epoch": 7423} {"train_loss": -27.89679527282715, "global_step": 616133, "epoch": 7423} {"train_loss": -27.827478408813477, "global_step": 616134, "epoch": 7423} {"train_loss": -27.852685928344727, "global_step": 616135, "epoch": 7423} {"train_loss": -27.891162872314453, "global_step": 616136, "epoch": 7423} {"train_loss": -28.121015548706055, "global_step": 616137, "epoch": 7423} {"train_loss": -28.39520263671875, "global_step": 616138, "epoch": 7423} {"train_loss": -27.876874923706055, "global_step": 616139, "epoch": 7423} {"train_loss": -28.276517868041992, "global_step": 616140, "epoch": 7423} {"train_loss": -28.041784286499023, "global_step": 616141, "epoch": 7423} {"train_loss": -28.227893829345703, "global_step": 616142, "epoch": 7423} {"train_loss": -28.241926193237305, "global_step": 616143, "epoch": 7423} {"train_loss": -27.975751876831055, "global_step": 616144, "epoch": 7423} {"train_loss": -28.382495880126953, "global_step": 616145, "epoch": 7423} {"train_loss": -28.379114151000977, "global_step": 616146, "epoch": 7423} {"train_loss": -28.2750186920166, "global_step": 616147, "epoch": 7423} {"train_loss": -28.008182525634766, "global_step": 616148, "epoch": 7423} {"train_loss": -28.114667892456055, "global_step": 616149, "epoch": 7423} {"train_loss": -28.781217575073242, "global_step": 616150, "epoch": 7423} {"train_loss": -28.21064567565918, "global_step": 616151, "epoch": 7423} {"train_loss": -28.62409019470215, "global_step": 616152, "epoch": 7423} {"train_loss": -28.3646297454834, "global_step": 616153, "epoch": 7423} {"train_loss": -28.2604923248291, "global_step": 616154, "epoch": 7423} {"train_loss": -28.200794219970703, "global_step": 616155, "epoch": 7423} {"train_loss": -28.559309005737305, "global_step": 616156, "epoch": 7423} {"train_loss": -28.19508171081543, "global_step": 616157, "epoch": 7423} {"train_loss": -28.4533634185791, "global_step": 616158, "epoch": 7423} {"train_loss": -28.291296005249023, "global_step": 616159, "epoch": 7423} {"train_loss": -28.31146240234375, "global_step": 616160, "epoch": 7423} {"train_loss": -28.3487606048584, "global_step": 616161, "epoch": 7423} {"train_loss": -28.169681549072266, "global_step": 616162, "epoch": 7423} {"train_loss": -28.16552734375, "global_step": 616163, "epoch": 7423} {"train_loss": -28.091175079345703, "global_step": 616164, "epoch": 7423} {"train_loss": -28.317707061767578, "global_step": 616165, "epoch": 7423} {"train_loss": -28.057783126831055, "global_step": 616166, "epoch": 7423} {"train_loss": -28.0584716796875, "global_step": 616167, "epoch": 7423} {"train_loss": -27.797687530517578, "global_step": 616168, "epoch": 7423} {"train_loss": -27.84218406677246, "global_step": 616169, "epoch": 7423} {"train_loss": -27.962432861328125, "global_step": 616170, "epoch": 7423} {"train_loss": -28.1320743560791, "global_step": 616171, "epoch": 7423} {"train_loss": -27.981271743774414, "global_step": 616172, "epoch": 7423} {"train_loss": -27.676584243774414, "global_step": 616173, "epoch": 7423} {"train_loss": -27.6845760345459, "global_step": 616174, "epoch": 7423} {"train_loss": -26.715295791625977, "global_step": 616175, "epoch": 7423} {"train_loss": -26.035968780517578, "global_step": 616176, "epoch": 7423} {"train_loss": -26.264875411987305, "global_step": 616177, "epoch": 7423} {"train_loss": -27.868452072143555, "global_step": 616178, "epoch": 7423} {"train_loss": -26.9686222076416, "global_step": 616179, "epoch": 7423} {"train_loss": -27.9986572265625, "global_step": 616180, "epoch": 7423} {"train_loss": -27.621505737304688, "global_step": 616181, "epoch": 7423} {"train_loss": -27.506458282470703, "global_step": 616182, "epoch": 7423} {"train_loss": -27.740198135375977, "global_step": 616183, "epoch": 7423} {"train_loss": -27.90070915222168, "global_step": 616184, "epoch": 7423} {"train_loss": -27.736371994018555, "global_step": 616185, "epoch": 7423} {"train_loss": -27.991437911987305, "global_step": 616186, "epoch": 7423} {"train_loss": -27.6451473236084, "global_step": 616187, "epoch": 7423} {"train_loss": -27.896203994750977, "global_step": 616188, "epoch": 7423} {"train_loss": -27.96869468688965, "global_step": 616189, "epoch": 7423} {"train_loss": -28.0869083404541, "global_step": 616190, "epoch": 7423} {"train_loss": -27.81203223998288, "global_step": 616191, "epoch": 7423, "val_loss": 6612339.0} {"train_loss": -27.194501876831055, "global_step": 616192, "epoch": 7424} {"train_loss": -27.5699520111084, "global_step": 616193, "epoch": 7424} {"train_loss": -27.121740341186523, "global_step": 616194, "epoch": 7424} {"train_loss": -27.60601234436035, "global_step": 616195, "epoch": 7424} {"train_loss": -27.40555191040039, "global_step": 616196, "epoch": 7424} {"train_loss": -27.518115997314453, "global_step": 616197, "epoch": 7424} {"train_loss": -27.539264678955078, "global_step": 616198, "epoch": 7424} {"train_loss": -27.047351837158203, "global_step": 616199, "epoch": 7424} {"train_loss": -27.447824478149414, "global_step": 616200, "epoch": 7424} {"train_loss": -27.429828643798828, "global_step": 616201, "epoch": 7424} {"train_loss": -27.534711837768555, "global_step": 616202, "epoch": 7424} {"train_loss": -27.028553009033203, "global_step": 616203, "epoch": 7424} {"train_loss": -27.28619956970215, "global_step": 616204, "epoch": 7424} {"train_loss": -27.54876708984375, "global_step": 616205, "epoch": 7424} {"train_loss": -27.35809898376465, "global_step": 616206, "epoch": 7424} {"train_loss": -27.204771041870117, "global_step": 616207, "epoch": 7424} {"train_loss": -27.60321617126465, "global_step": 616208, "epoch": 7424} {"train_loss": -27.25518226623535, "global_step": 616209, "epoch": 7424} {"train_loss": -27.784711837768555, "global_step": 616210, "epoch": 7424} {"train_loss": -27.49419593811035, "global_step": 616211, "epoch": 7424} {"train_loss": -27.737125396728516, "global_step": 616212, "epoch": 7424} {"train_loss": -27.94760513305664, "global_step": 616213, "epoch": 7424} {"train_loss": -27.942686080932617, "global_step": 616214, "epoch": 7424} {"train_loss": -27.970861434936523, "global_step": 616215, "epoch": 7424} {"train_loss": -27.58411979675293, "global_step": 616216, "epoch": 7424} {"train_loss": -27.456212997436523, "global_step": 616217, "epoch": 7424} {"train_loss": -28.023075103759766, "global_step": 616218, "epoch": 7424} {"train_loss": -27.93556022644043, "global_step": 616219, "epoch": 7424} {"train_loss": -27.952423095703125, "global_step": 616220, "epoch": 7424} {"train_loss": -28.1392822265625, "global_step": 616221, "epoch": 7424} {"train_loss": -28.093082427978516, "global_step": 616222, "epoch": 7424} {"train_loss": -28.333118438720703, "global_step": 616223, "epoch": 7424} {"train_loss": -28.31064796447754, "global_step": 616224, "epoch": 7424} {"train_loss": -28.060470581054688, "global_step": 616225, "epoch": 7424} {"train_loss": -28.11488914489746, "global_step": 616226, "epoch": 7424} {"train_loss": -28.06544303894043, "global_step": 616227, "epoch": 7424} {"train_loss": -28.1721248626709, "global_step": 616228, "epoch": 7424} {"train_loss": -28.20537757873535, "global_step": 616229, "epoch": 7424} {"train_loss": -28.0126895904541, "global_step": 616230, "epoch": 7424} {"train_loss": -28.18220329284668, "global_step": 616231, "epoch": 7424} {"train_loss": -28.139663696289062, "global_step": 616232, "epoch": 7424} {"train_loss": -28.22308349609375, "global_step": 616233, "epoch": 7424} {"train_loss": -28.364887237548828, "global_step": 616234, "epoch": 7424} {"train_loss": -27.999195098876953, "global_step": 616235, "epoch": 7424} {"train_loss": -28.387479782104492, "global_step": 616236, "epoch": 7424} {"train_loss": -27.906278610229492, "global_step": 616237, "epoch": 7424} {"train_loss": -28.119556427001953, "global_step": 616238, "epoch": 7424} {"train_loss": -28.572980880737305, "global_step": 616239, "epoch": 7424} {"train_loss": -28.224042892456055, "global_step": 616240, "epoch": 7424} {"train_loss": -28.122699737548828, "global_step": 616241, "epoch": 7424} {"train_loss": -28.274511337280273, "global_step": 616242, "epoch": 7424} {"train_loss": -28.086048126220703, "global_step": 616243, "epoch": 7424} {"train_loss": -28.15704917907715, "global_step": 616244, "epoch": 7424} {"train_loss": -28.372766494750977, "global_step": 616245, "epoch": 7424} {"train_loss": -28.186283111572266, "global_step": 616246, "epoch": 7424} {"train_loss": -27.75811195373535, "global_step": 616247, "epoch": 7424} {"train_loss": -27.842803955078125, "global_step": 616248, "epoch": 7424} {"train_loss": -28.070737838745117, "global_step": 616249, "epoch": 7424} {"train_loss": -28.058813095092773, "global_step": 616250, "epoch": 7424} {"train_loss": -28.53020668029785, "global_step": 616251, "epoch": 7424} {"train_loss": -27.924314498901367, "global_step": 616252, "epoch": 7424} {"train_loss": -28.15827751159668, "global_step": 616253, "epoch": 7424} {"train_loss": -28.39735221862793, "global_step": 616254, "epoch": 7424} {"train_loss": -28.333908081054688, "global_step": 616255, "epoch": 7424} {"train_loss": -28.318471908569336, "global_step": 616256, "epoch": 7424} {"train_loss": -28.2393856048584, "global_step": 616257, "epoch": 7424} {"train_loss": -28.082727432250977, "global_step": 616258, "epoch": 7424} {"train_loss": -28.345178604125977, "global_step": 616259, "epoch": 7424} {"train_loss": -28.43342399597168, "global_step": 616260, "epoch": 7424} {"train_loss": -28.107746124267578, "global_step": 616261, "epoch": 7424} {"train_loss": -28.008874893188477, "global_step": 616262, "epoch": 7424} {"train_loss": -28.3587703704834, "global_step": 616263, "epoch": 7424} {"train_loss": -28.452930450439453, "global_step": 616264, "epoch": 7424} {"train_loss": -28.42120361328125, "global_step": 616265, "epoch": 7424} {"train_loss": -28.66636085510254, "global_step": 616266, "epoch": 7424} {"train_loss": -28.663253784179688, "global_step": 616267, "epoch": 7424} {"train_loss": -27.96819496154785, "global_step": 616268, "epoch": 7424} {"train_loss": -28.526708602905273, "global_step": 616269, "epoch": 7424} {"train_loss": -28.377395629882812, "global_step": 616270, "epoch": 7424} {"train_loss": -28.130569458007812, "global_step": 616271, "epoch": 7424} {"train_loss": -27.947614669799805, "global_step": 616272, "epoch": 7424} {"train_loss": -27.1376895904541, "global_step": 616273, "epoch": 7424} {"train_loss": -27.92545601258795, "global_step": 616274, "epoch": 7424, "val_loss": 6655418.5} {"train_loss": -20.646177291870117, "global_step": 616275, "epoch": 7425} {"train_loss": -23.73078155517578, "global_step": 616276, "epoch": 7425} {"train_loss": -26.12933921813965, "global_step": 616277, "epoch": 7425} {"train_loss": -24.232297897338867, "global_step": 616278, "epoch": 7425} {"train_loss": -25.33412742614746, "global_step": 616279, "epoch": 7425} {"train_loss": -25.9359130859375, "global_step": 616280, "epoch": 7425} {"train_loss": -25.178197860717773, "global_step": 616281, "epoch": 7425} {"train_loss": -26.593671798706055, "global_step": 616282, "epoch": 7425} {"train_loss": -25.35628318786621, "global_step": 616283, "epoch": 7425} {"train_loss": -26.302831649780273, "global_step": 616284, "epoch": 7425} {"train_loss": -26.154661178588867, "global_step": 616285, "epoch": 7425} {"train_loss": -26.684249877929688, "global_step": 616286, "epoch": 7425} {"train_loss": -25.9460506439209, "global_step": 616287, "epoch": 7425} {"train_loss": -26.442596435546875, "global_step": 616288, "epoch": 7425} {"train_loss": -26.548017501831055, "global_step": 616289, "epoch": 7425} {"train_loss": -26.680648803710938, "global_step": 616290, "epoch": 7425} {"train_loss": -26.223169326782227, "global_step": 616291, "epoch": 7425} {"train_loss": -26.34527587890625, "global_step": 616292, "epoch": 7425} {"train_loss": -26.73676872253418, "global_step": 616293, "epoch": 7425} {"train_loss": -27.160282135009766, "global_step": 616294, "epoch": 7425} {"train_loss": -26.85330581665039, "global_step": 616295, "epoch": 7425} {"train_loss": -26.981504440307617, "global_step": 616296, "epoch": 7425} {"train_loss": -26.484968185424805, "global_step": 616297, "epoch": 7425} {"train_loss": -27.52045249938965, "global_step": 616298, "epoch": 7425} {"train_loss": -27.074478149414062, "global_step": 616299, "epoch": 7425} {"train_loss": -27.212921142578125, "global_step": 616300, "epoch": 7425} {"train_loss": -27.201704025268555, "global_step": 616301, "epoch": 7425} {"train_loss": -26.59132194519043, "global_step": 616302, "epoch": 7425} {"train_loss": -26.730844497680664, "global_step": 616303, "epoch": 7425} {"train_loss": -26.693470001220703, "global_step": 616304, "epoch": 7425} {"train_loss": -27.249195098876953, "global_step": 616305, "epoch": 7425} {"train_loss": -27.26746940612793, "global_step": 616306, "epoch": 7425} {"train_loss": -27.225112915039062, "global_step": 616307, "epoch": 7425} {"train_loss": -27.844266891479492, "global_step": 616308, "epoch": 7425} {"train_loss": -27.030675888061523, "global_step": 616309, "epoch": 7425} {"train_loss": -27.238433837890625, "global_step": 616310, "epoch": 7425} {"train_loss": -27.820953369140625, "global_step": 616311, "epoch": 7425} {"train_loss": -27.3546199798584, "global_step": 616312, "epoch": 7425} {"train_loss": -27.3516788482666, "global_step": 616313, "epoch": 7425} {"train_loss": -27.776752471923828, "global_step": 616314, "epoch": 7425} {"train_loss": -27.518888473510742, "global_step": 616315, "epoch": 7425} {"train_loss": -27.61260986328125, "global_step": 616316, "epoch": 7425} {"train_loss": -27.498220443725586, "global_step": 616317, "epoch": 7425} {"train_loss": -27.521747589111328, "global_step": 616318, "epoch": 7425} {"train_loss": -27.8070068359375, "global_step": 616319, "epoch": 7425} {"train_loss": -27.608356475830078, "global_step": 616320, "epoch": 7425} {"train_loss": -27.846954345703125, "global_step": 616321, "epoch": 7425} {"train_loss": -27.9720458984375, "global_step": 616322, "epoch": 7425} {"train_loss": -27.76807975769043, "global_step": 616323, "epoch": 7425} {"train_loss": -27.446863174438477, "global_step": 616324, "epoch": 7425} {"train_loss": -27.770843505859375, "global_step": 616325, "epoch": 7425} {"train_loss": -27.855539321899414, "global_step": 616326, "epoch": 7425} {"train_loss": -27.957311630249023, "global_step": 616327, "epoch": 7425} {"train_loss": -27.594018936157227, "global_step": 616328, "epoch": 7425} {"train_loss": -28.136457443237305, "global_step": 616329, "epoch": 7425} {"train_loss": -28.07441520690918, "global_step": 616330, "epoch": 7425} {"train_loss": -28.351667404174805, "global_step": 616331, "epoch": 7425} {"train_loss": -28.0556697845459, "global_step": 616332, "epoch": 7425} {"train_loss": -27.81675148010254, "global_step": 616333, "epoch": 7425} {"train_loss": -27.929075241088867, "global_step": 616334, "epoch": 7425} {"train_loss": -27.899566650390625, "global_step": 616335, "epoch": 7425} {"train_loss": -27.96308708190918, "global_step": 616336, "epoch": 7425} {"train_loss": -28.03438377380371, "global_step": 616337, "epoch": 7425} {"train_loss": -28.441980361938477, "global_step": 616338, "epoch": 7425} {"train_loss": -28.0372371673584, "global_step": 616339, "epoch": 7425} {"train_loss": -28.227746963500977, "global_step": 616340, "epoch": 7425} {"train_loss": -27.6684513092041, "global_step": 616341, "epoch": 7425} {"train_loss": -27.854047775268555, "global_step": 616342, "epoch": 7425} {"train_loss": -27.43756675720215, "global_step": 616343, "epoch": 7425} {"train_loss": -27.482309341430664, "global_step": 616344, "epoch": 7425} {"train_loss": -27.805479049682617, "global_step": 616345, "epoch": 7425} {"train_loss": -28.500823974609375, "global_step": 616346, "epoch": 7425} {"train_loss": -27.876874923706055, "global_step": 616347, "epoch": 7425} {"train_loss": -27.98359489440918, "global_step": 616348, "epoch": 7425} {"train_loss": -28.355859756469727, "global_step": 616349, "epoch": 7425} {"train_loss": -28.37566566467285, "global_step": 616350, "epoch": 7425} {"train_loss": -28.06549072265625, "global_step": 616351, "epoch": 7425} {"train_loss": -28.228742599487305, "global_step": 616352, "epoch": 7425} {"train_loss": -28.05035400390625, "global_step": 616353, "epoch": 7425} {"train_loss": -27.884048461914062, "global_step": 616354, "epoch": 7425} {"train_loss": -27.78386878967285, "global_step": 616355, "epoch": 7425} {"train_loss": -28.2535343170166, "global_step": 616356, "epoch": 7425} {"train_loss": -27.219550810664533, "global_step": 616357, "epoch": 7425, "val_loss": 6603969.0} {"train_loss": -27.574737548828125, "global_step": 616358, "epoch": 7426} {"train_loss": -27.424365997314453, "global_step": 616359, "epoch": 7426} {"train_loss": -27.875568389892578, "global_step": 616360, "epoch": 7426} {"train_loss": -27.943750381469727, "global_step": 616361, "epoch": 7426} {"train_loss": -27.39532470703125, "global_step": 616362, "epoch": 7426} {"train_loss": -27.9437255859375, "global_step": 616363, "epoch": 7426} {"train_loss": -27.5349178314209, "global_step": 616364, "epoch": 7426} {"train_loss": -28.1807918548584, "global_step": 616365, "epoch": 7426} {"train_loss": -27.482458114624023, "global_step": 616366, "epoch": 7426} {"train_loss": -27.85370445251465, "global_step": 616367, "epoch": 7426} {"train_loss": -27.894983291625977, "global_step": 616368, "epoch": 7426} {"train_loss": -27.66400146484375, "global_step": 616369, "epoch": 7426} {"train_loss": -27.902807235717773, "global_step": 616370, "epoch": 7426} {"train_loss": -28.0981388092041, "global_step": 616371, "epoch": 7426} {"train_loss": -27.857954025268555, "global_step": 616372, "epoch": 7426} {"train_loss": -27.813261032104492, "global_step": 616373, "epoch": 7426} {"train_loss": -27.898578643798828, "global_step": 616374, "epoch": 7426} {"train_loss": -28.122058868408203, "global_step": 616375, "epoch": 7426} {"train_loss": -27.963830947875977, "global_step": 616376, "epoch": 7426} {"train_loss": -28.24936294555664, "global_step": 616377, "epoch": 7426} {"train_loss": -27.64276123046875, "global_step": 616378, "epoch": 7426} {"train_loss": -28.18475341796875, "global_step": 616379, "epoch": 7426} {"train_loss": -28.321151733398438, "global_step": 616380, "epoch": 7426} {"train_loss": -27.95304298400879, "global_step": 616381, "epoch": 7426} {"train_loss": -27.77899169921875, "global_step": 616382, "epoch": 7426} {"train_loss": -27.93548583984375, "global_step": 616383, "epoch": 7426} {"train_loss": -27.904632568359375, "global_step": 616384, "epoch": 7426} {"train_loss": -27.94427490234375, "global_step": 616385, "epoch": 7426} {"train_loss": -28.221649169921875, "global_step": 616386, "epoch": 7426} {"train_loss": -28.101842880249023, "global_step": 616387, "epoch": 7426} {"train_loss": -28.040393829345703, "global_step": 616388, "epoch": 7426} {"train_loss": -28.323415756225586, "global_step": 616389, "epoch": 7426} {"train_loss": -28.092390060424805, "global_step": 616390, "epoch": 7426} {"train_loss": -28.320331573486328, "global_step": 616391, "epoch": 7426} {"train_loss": -27.780515670776367, "global_step": 616392, "epoch": 7426} {"train_loss": -27.997838973999023, "global_step": 616393, "epoch": 7426} {"train_loss": -28.159870147705078, "global_step": 616394, "epoch": 7426} {"train_loss": -28.122791290283203, "global_step": 616395, "epoch": 7426} {"train_loss": -27.972013473510742, "global_step": 616396, "epoch": 7426} {"train_loss": -28.353376388549805, "global_step": 616397, "epoch": 7426} {"train_loss": -27.890439987182617, "global_step": 616398, "epoch": 7426} {"train_loss": -28.294784545898438, "global_step": 616399, "epoch": 7426} {"train_loss": -27.8807373046875, "global_step": 616400, "epoch": 7426} {"train_loss": -28.116962432861328, "global_step": 616401, "epoch": 7426} {"train_loss": -28.33438491821289, "global_step": 616402, "epoch": 7426} {"train_loss": -28.326374053955078, "global_step": 616403, "epoch": 7426} {"train_loss": -28.07305335998535, "global_step": 616404, "epoch": 7426} {"train_loss": -28.487646102905273, "global_step": 616405, "epoch": 7426} {"train_loss": -28.08941650390625, "global_step": 616406, "epoch": 7426} {"train_loss": -28.486392974853516, "global_step": 616407, "epoch": 7426} {"train_loss": -28.23421287536621, "global_step": 616408, "epoch": 7426} {"train_loss": -28.23175621032715, "global_step": 616409, "epoch": 7426} {"train_loss": -28.218164443969727, "global_step": 616410, "epoch": 7426} {"train_loss": -28.493362426757812, "global_step": 616411, "epoch": 7426} {"train_loss": -28.297815322875977, "global_step": 616412, "epoch": 7426} {"train_loss": -28.274890899658203, "global_step": 616413, "epoch": 7426} {"train_loss": -28.497472763061523, "global_step": 616414, "epoch": 7426} {"train_loss": -28.551727294921875, "global_step": 616415, "epoch": 7426} {"train_loss": -28.2745418548584, "global_step": 616416, "epoch": 7426} {"train_loss": -28.472137451171875, "global_step": 616417, "epoch": 7426} {"train_loss": -28.495590209960938, "global_step": 616418, "epoch": 7426} {"train_loss": -28.328781127929688, "global_step": 616419, "epoch": 7426} {"train_loss": -28.411880493164062, "global_step": 616420, "epoch": 7426} {"train_loss": -28.43086051940918, "global_step": 616421, "epoch": 7426} {"train_loss": -28.168684005737305, "global_step": 616422, "epoch": 7426} {"train_loss": -27.579023361206055, "global_step": 616423, "epoch": 7426} {"train_loss": -28.460973739624023, "global_step": 616424, "epoch": 7426} {"train_loss": -27.990406036376953, "global_step": 616425, "epoch": 7426} {"train_loss": -28.395307540893555, "global_step": 616426, "epoch": 7426} {"train_loss": -28.244504928588867, "global_step": 616427, "epoch": 7426} {"train_loss": -28.42486572265625, "global_step": 616428, "epoch": 7426} {"train_loss": -28.264556884765625, "global_step": 616429, "epoch": 7426} {"train_loss": -28.399127960205078, "global_step": 616430, "epoch": 7426} {"train_loss": -28.498855590820312, "global_step": 616431, "epoch": 7426} {"train_loss": -28.51362419128418, "global_step": 616432, "epoch": 7426} {"train_loss": -28.180639266967773, "global_step": 616433, "epoch": 7426} {"train_loss": -28.316282272338867, "global_step": 616434, "epoch": 7426} {"train_loss": -28.170438766479492, "global_step": 616435, "epoch": 7426} {"train_loss": -28.406402587890625, "global_step": 616436, "epoch": 7426} {"train_loss": -28.67762565612793, "global_step": 616437, "epoch": 7426} {"train_loss": -28.267898559570312, "global_step": 616438, "epoch": 7426} {"train_loss": -28.53981590270996, "global_step": 616439, "epoch": 7426} {"train_loss": -28.140028275639178, "global_step": 616440, "epoch": 7426, "val_loss": 6574326.0} {"train_loss": -27.107709884643555, "global_step": 616441, "epoch": 7427} {"train_loss": -27.28230094909668, "global_step": 616442, "epoch": 7427} {"train_loss": -28.0064697265625, "global_step": 616443, "epoch": 7427} {"train_loss": -27.422454833984375, "global_step": 616444, "epoch": 7427} {"train_loss": -27.924121856689453, "global_step": 616445, "epoch": 7427} {"train_loss": -27.428693771362305, "global_step": 616446, "epoch": 7427} {"train_loss": -27.23878288269043, "global_step": 616447, "epoch": 7427} {"train_loss": -26.879016876220703, "global_step": 616448, "epoch": 7427} {"train_loss": -26.910192489624023, "global_step": 616449, "epoch": 7427} {"train_loss": -26.636127471923828, "global_step": 616450, "epoch": 7427} {"train_loss": -26.277647018432617, "global_step": 616451, "epoch": 7427} {"train_loss": -26.4261474609375, "global_step": 616452, "epoch": 7427} {"train_loss": -27.285511016845703, "global_step": 616453, "epoch": 7427} {"train_loss": -27.6954345703125, "global_step": 616454, "epoch": 7427} {"train_loss": -27.5017147064209, "global_step": 616455, "epoch": 7427} {"train_loss": -27.39339256286621, "global_step": 616456, "epoch": 7427} {"train_loss": -27.311542510986328, "global_step": 616457, "epoch": 7427} {"train_loss": -27.862817764282227, "global_step": 616458, "epoch": 7427} {"train_loss": -27.796598434448242, "global_step": 616459, "epoch": 7427} {"train_loss": -27.469282150268555, "global_step": 616460, "epoch": 7427} {"train_loss": -27.942182540893555, "global_step": 616461, "epoch": 7427} {"train_loss": -27.508161544799805, "global_step": 616462, "epoch": 7427} {"train_loss": -27.98250389099121, "global_step": 616463, "epoch": 7427} {"train_loss": -27.79449462890625, "global_step": 616464, "epoch": 7427} {"train_loss": -27.89072036743164, "global_step": 616465, "epoch": 7427} {"train_loss": -27.574695587158203, "global_step": 616466, "epoch": 7427} {"train_loss": -28.15178871154785, "global_step": 616467, "epoch": 7427} {"train_loss": -27.8707275390625, "global_step": 616468, "epoch": 7427} {"train_loss": -27.8356876373291, "global_step": 616469, "epoch": 7427} {"train_loss": -28.002471923828125, "global_step": 616470, "epoch": 7427} {"train_loss": -27.826251983642578, "global_step": 616471, "epoch": 7427} {"train_loss": -28.173065185546875, "global_step": 616472, "epoch": 7427} {"train_loss": -28.034088134765625, "global_step": 616473, "epoch": 7427} {"train_loss": -28.10395622253418, "global_step": 616474, "epoch": 7427} {"train_loss": -28.3984317779541, "global_step": 616475, "epoch": 7427} {"train_loss": -27.84449577331543, "global_step": 616476, "epoch": 7427} {"train_loss": -27.96620750427246, "global_step": 616477, "epoch": 7427} {"train_loss": -28.380823135375977, "global_step": 616478, "epoch": 7427} {"train_loss": -27.991331100463867, "global_step": 616479, "epoch": 7427} {"train_loss": -28.218994140625, "global_step": 616480, "epoch": 7427} {"train_loss": -28.4035587310791, "global_step": 616481, "epoch": 7427} {"train_loss": -28.205596923828125, "global_step": 616482, "epoch": 7427} {"train_loss": -28.4382381439209, "global_step": 616483, "epoch": 7427} {"train_loss": -28.19034194946289, "global_step": 616484, "epoch": 7427} {"train_loss": -28.516626358032227, "global_step": 616485, "epoch": 7427} {"train_loss": -27.88628578186035, "global_step": 616486, "epoch": 7427} {"train_loss": -28.198501586914062, "global_step": 616487, "epoch": 7427} {"train_loss": -28.0603084564209, "global_step": 616488, "epoch": 7427} {"train_loss": -28.152738571166992, "global_step": 616489, "epoch": 7427} {"train_loss": -28.064077377319336, "global_step": 616490, "epoch": 7427} {"train_loss": -28.589223861694336, "global_step": 616491, "epoch": 7427} {"train_loss": -28.257694244384766, "global_step": 616492, "epoch": 7427} {"train_loss": -28.337060928344727, "global_step": 616493, "epoch": 7427} {"train_loss": -28.36305046081543, "global_step": 616494, "epoch": 7427} {"train_loss": -28.204092025756836, "global_step": 616495, "epoch": 7427} {"train_loss": -28.211816787719727, "global_step": 616496, "epoch": 7427} {"train_loss": -28.609949111938477, "global_step": 616497, "epoch": 7427} {"train_loss": -28.27272605895996, "global_step": 616498, "epoch": 7427} {"train_loss": -28.197484970092773, "global_step": 616499, "epoch": 7427} {"train_loss": -28.413949966430664, "global_step": 616500, "epoch": 7427} {"train_loss": -28.170516967773438, "global_step": 616501, "epoch": 7427} {"train_loss": -28.31284523010254, "global_step": 616502, "epoch": 7427} {"train_loss": -28.39937400817871, "global_step": 616503, "epoch": 7427} {"train_loss": -28.286191940307617, "global_step": 616504, "epoch": 7427} {"train_loss": -28.087299346923828, "global_step": 616505, "epoch": 7427} {"train_loss": -28.40726661682129, "global_step": 616506, "epoch": 7427} {"train_loss": -28.47918128967285, "global_step": 616507, "epoch": 7427} {"train_loss": -28.37415885925293, "global_step": 616508, "epoch": 7427} {"train_loss": -28.359760284423828, "global_step": 616509, "epoch": 7427} {"train_loss": -28.448877334594727, "global_step": 616510, "epoch": 7427} {"train_loss": -28.0042781829834, "global_step": 616511, "epoch": 7427} {"train_loss": -28.25433349609375, "global_step": 616512, "epoch": 7427} {"train_loss": -28.325016021728516, "global_step": 616513, "epoch": 7427} {"train_loss": -28.413610458374023, "global_step": 616514, "epoch": 7427} {"train_loss": -28.05216407775879, "global_step": 616515, "epoch": 7427} {"train_loss": -28.2634334564209, "global_step": 616516, "epoch": 7427} {"train_loss": -28.4466552734375, "global_step": 616517, "epoch": 7427} {"train_loss": -28.53333854675293, "global_step": 616518, "epoch": 7427} {"train_loss": -28.71535301208496, "global_step": 616519, "epoch": 7427} {"train_loss": -28.18497657775879, "global_step": 616520, "epoch": 7427} {"train_loss": -28.222143173217773, "global_step": 616521, "epoch": 7427} {"train_loss": -28.305017471313477, "global_step": 616522, "epoch": 7427} {"train_loss": -27.975452423095703, "global_step": 616523, "epoch": 7427, "val_loss": 6601699.5} {"train_loss": -27.334796905517578, "global_step": 616524, "epoch": 7428} {"train_loss": -27.382654190063477, "global_step": 616525, "epoch": 7428} {"train_loss": -27.70900535583496, "global_step": 616526, "epoch": 7428} {"train_loss": -27.507144927978516, "global_step": 616527, "epoch": 7428} {"train_loss": -27.184925079345703, "global_step": 616528, "epoch": 7428} {"train_loss": -28.12628173828125, "global_step": 616529, "epoch": 7428} {"train_loss": -27.53700065612793, "global_step": 616530, "epoch": 7428} {"train_loss": -27.49899673461914, "global_step": 616531, "epoch": 7428} {"train_loss": -27.832794189453125, "global_step": 616532, "epoch": 7428} {"train_loss": -27.573993682861328, "global_step": 616533, "epoch": 7428} {"train_loss": -27.452966690063477, "global_step": 616534, "epoch": 7428} {"train_loss": -27.363388061523438, "global_step": 616535, "epoch": 7428} {"train_loss": -27.683813095092773, "global_step": 616536, "epoch": 7428} {"train_loss": -27.712549209594727, "global_step": 616537, "epoch": 7428} {"train_loss": -27.590774536132812, "global_step": 616538, "epoch": 7428} {"train_loss": -27.534067153930664, "global_step": 616539, "epoch": 7428} {"train_loss": -27.75544548034668, "global_step": 616540, "epoch": 7428} {"train_loss": -27.827457427978516, "global_step": 616541, "epoch": 7428} {"train_loss": -27.77162742614746, "global_step": 616542, "epoch": 7428} {"train_loss": -27.481124877929688, "global_step": 616543, "epoch": 7428} {"train_loss": -27.682220458984375, "global_step": 616544, "epoch": 7428} {"train_loss": -27.734479904174805, "global_step": 616545, "epoch": 7428} {"train_loss": -27.608795166015625, "global_step": 616546, "epoch": 7428} {"train_loss": -27.55169677734375, "global_step": 616547, "epoch": 7428} {"train_loss": -27.918548583984375, "global_step": 616548, "epoch": 7428} {"train_loss": -27.897140502929688, "global_step": 616549, "epoch": 7428} {"train_loss": -28.337797164916992, "global_step": 616550, "epoch": 7428} {"train_loss": -28.217554092407227, "global_step": 616551, "epoch": 7428} {"train_loss": -28.05989646911621, "global_step": 616552, "epoch": 7428} {"train_loss": -27.982181549072266, "global_step": 616553, "epoch": 7428} {"train_loss": -28.43827247619629, "global_step": 616554, "epoch": 7428} {"train_loss": -28.252416610717773, "global_step": 616555, "epoch": 7428} {"train_loss": -28.174585342407227, "global_step": 616556, "epoch": 7428} {"train_loss": -28.51631736755371, "global_step": 616557, "epoch": 7428} {"train_loss": -28.208511352539062, "global_step": 616558, "epoch": 7428} {"train_loss": -28.25958251953125, "global_step": 616559, "epoch": 7428} {"train_loss": -28.25019645690918, "global_step": 616560, "epoch": 7428} {"train_loss": -28.69449234008789, "global_step": 616561, "epoch": 7428} {"train_loss": -28.073104858398438, "global_step": 616562, "epoch": 7428} {"train_loss": -27.850086212158203, "global_step": 616563, "epoch": 7428} {"train_loss": -28.22858238220215, "global_step": 616564, "epoch": 7428} {"train_loss": -28.178466796875, "global_step": 616565, "epoch": 7428} {"train_loss": -28.348663330078125, "global_step": 616566, "epoch": 7428} {"train_loss": -28.296066284179688, "global_step": 616567, "epoch": 7428} {"train_loss": -28.062047958374023, "global_step": 616568, "epoch": 7428} {"train_loss": -27.802936553955078, "global_step": 616569, "epoch": 7428} {"train_loss": -27.515424728393555, "global_step": 616570, "epoch": 7428} {"train_loss": -27.516382217407227, "global_step": 616571, "epoch": 7428} {"train_loss": -27.961179733276367, "global_step": 616572, "epoch": 7428} {"train_loss": -28.105863571166992, "global_step": 616573, "epoch": 7428} {"train_loss": -27.856525421142578, "global_step": 616574, "epoch": 7428} {"train_loss": -27.88557243347168, "global_step": 616575, "epoch": 7428} {"train_loss": -28.265470504760742, "global_step": 616576, "epoch": 7428} {"train_loss": -27.8298282623291, "global_step": 616577, "epoch": 7428} {"train_loss": -28.3465518951416, "global_step": 616578, "epoch": 7428} {"train_loss": -28.431482315063477, "global_step": 616579, "epoch": 7428} {"train_loss": -27.907546997070312, "global_step": 616580, "epoch": 7428} {"train_loss": -28.092426300048828, "global_step": 616581, "epoch": 7428} {"train_loss": -28.071247100830078, "global_step": 616582, "epoch": 7428} {"train_loss": -28.04328727722168, "global_step": 616583, "epoch": 7428} {"train_loss": -27.887134552001953, "global_step": 616584, "epoch": 7428} {"train_loss": -28.307714462280273, "global_step": 616585, "epoch": 7428} {"train_loss": -28.287067413330078, "global_step": 616586, "epoch": 7428} {"train_loss": -28.372343063354492, "global_step": 616587, "epoch": 7428} {"train_loss": -27.93646240234375, "global_step": 616588, "epoch": 7428} {"train_loss": -27.640094757080078, "global_step": 616589, "epoch": 7428} {"train_loss": -28.0042781829834, "global_step": 616590, "epoch": 7428} {"train_loss": -27.964981079101562, "global_step": 616591, "epoch": 7428} {"train_loss": -28.031478881835938, "global_step": 616592, "epoch": 7428} {"train_loss": -28.248779296875, "global_step": 616593, "epoch": 7428} {"train_loss": -27.975683212280273, "global_step": 616594, "epoch": 7428} {"train_loss": -27.968881607055664, "global_step": 616595, "epoch": 7428} {"train_loss": -27.85926628112793, "global_step": 616596, "epoch": 7428} {"train_loss": -27.781784057617188, "global_step": 616597, "epoch": 7428} {"train_loss": -27.580175399780273, "global_step": 616598, "epoch": 7428} {"train_loss": -27.925878524780273, "global_step": 616599, "epoch": 7428} {"train_loss": -28.219085693359375, "global_step": 616600, "epoch": 7428} {"train_loss": -28.148202896118164, "global_step": 616601, "epoch": 7428} {"train_loss": -28.35780143737793, "global_step": 616602, "epoch": 7428} {"train_loss": -28.245328903198242, "global_step": 616603, "epoch": 7428} {"train_loss": -28.2676944732666, "global_step": 616604, "epoch": 7428} {"train_loss": -28.25766944885254, "global_step": 616605, "epoch": 7428} {"train_loss": -27.955890908298723, "global_step": 616606, "epoch": 7428, "val_loss": 6607620.0} {"train_loss": -27.54157829284668, "global_step": 616607, "epoch": 7429} {"train_loss": -27.34366226196289, "global_step": 616608, "epoch": 7429} {"train_loss": -27.9855899810791, "global_step": 616609, "epoch": 7429} {"train_loss": -27.90059471130371, "global_step": 616610, "epoch": 7429} {"train_loss": -27.683216094970703, "global_step": 616611, "epoch": 7429} {"train_loss": -27.565265655517578, "global_step": 616612, "epoch": 7429} {"train_loss": -27.597742080688477, "global_step": 616613, "epoch": 7429} {"train_loss": -27.779541015625, "global_step": 616614, "epoch": 7429} {"train_loss": -27.669652938842773, "global_step": 616615, "epoch": 7429} {"train_loss": -27.60809898376465, "global_step": 616616, "epoch": 7429} {"train_loss": -27.559925079345703, "global_step": 616617, "epoch": 7429} {"train_loss": -27.726343154907227, "global_step": 616618, "epoch": 7429} {"train_loss": -27.760801315307617, "global_step": 616619, "epoch": 7429} {"train_loss": -27.821592330932617, "global_step": 616620, "epoch": 7429} {"train_loss": -28.112918853759766, "global_step": 616621, "epoch": 7429} {"train_loss": -27.860443115234375, "global_step": 616622, "epoch": 7429} {"train_loss": -27.659912109375, "global_step": 616623, "epoch": 7429} {"train_loss": -26.99993324279785, "global_step": 616624, "epoch": 7429} {"train_loss": -27.8289737701416, "global_step": 616625, "epoch": 7429} {"train_loss": -27.555652618408203, "global_step": 616626, "epoch": 7429} {"train_loss": -27.62060546875, "global_step": 616627, "epoch": 7429} {"train_loss": -27.798099517822266, "global_step": 616628, "epoch": 7429} {"train_loss": -27.65057373046875, "global_step": 616629, "epoch": 7429} {"train_loss": -28.37217140197754, "global_step": 616630, "epoch": 7429} {"train_loss": -28.261444091796875, "global_step": 616631, "epoch": 7429} {"train_loss": -28.038101196289062, "global_step": 616632, "epoch": 7429} {"train_loss": -28.046890258789062, "global_step": 616633, "epoch": 7429} {"train_loss": -28.3592586517334, "global_step": 616634, "epoch": 7429} {"train_loss": -28.191547393798828, "global_step": 616635, "epoch": 7429} {"train_loss": -27.979413986206055, "global_step": 616636, "epoch": 7429} {"train_loss": -28.063989639282227, "global_step": 616637, "epoch": 7429} {"train_loss": -28.221052169799805, "global_step": 616638, "epoch": 7429} {"train_loss": -28.10120964050293, "global_step": 616639, "epoch": 7429} {"train_loss": -27.80478858947754, "global_step": 616640, "epoch": 7429} {"train_loss": -27.951618194580078, "global_step": 616641, "epoch": 7429} {"train_loss": -28.164459228515625, "global_step": 616642, "epoch": 7429} {"train_loss": -28.450841903686523, "global_step": 616643, "epoch": 7429} {"train_loss": -28.30855369567871, "global_step": 616644, "epoch": 7429} {"train_loss": -28.187973022460938, "global_step": 616645, "epoch": 7429} {"train_loss": -28.17255210876465, "global_step": 616646, "epoch": 7429} {"train_loss": -28.61405372619629, "global_step": 616647, "epoch": 7429} {"train_loss": -27.935331344604492, "global_step": 616648, "epoch": 7429} {"train_loss": -28.50673484802246, "global_step": 616649, "epoch": 7429} {"train_loss": -28.438337326049805, "global_step": 616650, "epoch": 7429} {"train_loss": -28.584796905517578, "global_step": 616651, "epoch": 7429} {"train_loss": -28.45099449157715, "global_step": 616652, "epoch": 7429} {"train_loss": -28.22216796875, "global_step": 616653, "epoch": 7429} {"train_loss": -28.413650512695312, "global_step": 616654, "epoch": 7429} {"train_loss": -28.180206298828125, "global_step": 616655, "epoch": 7429} {"train_loss": -27.88929557800293, "global_step": 616656, "epoch": 7429} {"train_loss": -28.566699981689453, "global_step": 616657, "epoch": 7429} {"train_loss": -28.50809097290039, "global_step": 616658, "epoch": 7429} {"train_loss": -27.8723201751709, "global_step": 616659, "epoch": 7429} {"train_loss": -28.07021141052246, "global_step": 616660, "epoch": 7429} {"train_loss": -27.931140899658203, "global_step": 616661, "epoch": 7429} {"train_loss": -28.130788803100586, "global_step": 616662, "epoch": 7429} {"train_loss": -27.647445678710938, "global_step": 616663, "epoch": 7429} {"train_loss": -28.040307998657227, "global_step": 616664, "epoch": 7429} {"train_loss": -28.386438369750977, "global_step": 616665, "epoch": 7429} {"train_loss": -28.15720558166504, "global_step": 616666, "epoch": 7429} {"train_loss": -28.470569610595703, "global_step": 616667, "epoch": 7429} {"train_loss": -28.075544357299805, "global_step": 616668, "epoch": 7429} {"train_loss": -28.34333610534668, "global_step": 616669, "epoch": 7429} {"train_loss": -28.33111000061035, "global_step": 616670, "epoch": 7429} {"train_loss": -28.16175651550293, "global_step": 616671, "epoch": 7429} {"train_loss": -28.312368392944336, "global_step": 616672, "epoch": 7429} {"train_loss": -28.40981101989746, "global_step": 616673, "epoch": 7429} {"train_loss": -27.968542098999023, "global_step": 616674, "epoch": 7429} {"train_loss": -27.964801788330078, "global_step": 616675, "epoch": 7429} {"train_loss": -27.40962791442871, "global_step": 616676, "epoch": 7429} {"train_loss": -27.743881225585938, "global_step": 616677, "epoch": 7429} {"train_loss": -27.61572265625, "global_step": 616678, "epoch": 7429} {"train_loss": -27.735761642456055, "global_step": 616679, "epoch": 7429} {"train_loss": -26.986663818359375, "global_step": 616680, "epoch": 7429} {"train_loss": -27.090055465698242, "global_step": 616681, "epoch": 7429} {"train_loss": -27.808429718017578, "global_step": 616682, "epoch": 7429} {"train_loss": -28.13373374938965, "global_step": 616683, "epoch": 7429} {"train_loss": -27.518829345703125, "global_step": 616684, "epoch": 7429} {"train_loss": -27.630325317382812, "global_step": 616685, "epoch": 7429} {"train_loss": -28.130834579467773, "global_step": 616686, "epoch": 7429} {"train_loss": -27.399444580078125, "global_step": 616687, "epoch": 7429} {"train_loss": -27.995105743408203, "global_step": 616688, "epoch": 7429} {"train_loss": -27.955721958574042, "global_step": 616689, "epoch": 7429, "val_loss": 6631594.0} {"train_loss": -26.211231231689453, "global_step": 616690, "epoch": 7430} {"train_loss": -26.876495361328125, "global_step": 616691, "epoch": 7430} {"train_loss": -26.515378952026367, "global_step": 616692, "epoch": 7430} {"train_loss": -26.959503173828125, "global_step": 616693, "epoch": 7430} {"train_loss": -26.408649444580078, "global_step": 616694, "epoch": 7430} {"train_loss": -26.85218620300293, "global_step": 616695, "epoch": 7430} {"train_loss": -26.976551055908203, "global_step": 616696, "epoch": 7430} {"train_loss": -27.050434112548828, "global_step": 616697, "epoch": 7430} {"train_loss": -27.2871036529541, "global_step": 616698, "epoch": 7430} {"train_loss": -27.61646842956543, "global_step": 616699, "epoch": 7430} {"train_loss": -27.740121841430664, "global_step": 616700, "epoch": 7430} {"train_loss": -27.196874618530273, "global_step": 616701, "epoch": 7430} {"train_loss": -27.56244468688965, "global_step": 616702, "epoch": 7430} {"train_loss": -27.498998641967773, "global_step": 616703, "epoch": 7430} {"train_loss": -27.472936630249023, "global_step": 616704, "epoch": 7430} {"train_loss": -27.977136611938477, "global_step": 616705, "epoch": 7430} {"train_loss": -28.0967960357666, "global_step": 616706, "epoch": 7430} {"train_loss": -27.740436553955078, "global_step": 616707, "epoch": 7430} {"train_loss": -27.825780868530273, "global_step": 616708, "epoch": 7430} {"train_loss": -27.92009925842285, "global_step": 616709, "epoch": 7430} {"train_loss": -27.780134201049805, "global_step": 616710, "epoch": 7430} {"train_loss": -27.859708786010742, "global_step": 616711, "epoch": 7430} {"train_loss": -27.753265380859375, "global_step": 616712, "epoch": 7430} {"train_loss": -28.300933837890625, "global_step": 616713, "epoch": 7430} {"train_loss": -27.956506729125977, "global_step": 616714, "epoch": 7430} {"train_loss": -27.698211669921875, "global_step": 616715, "epoch": 7430} {"train_loss": -27.907148361206055, "global_step": 616716, "epoch": 7430} {"train_loss": -27.9202938079834, "global_step": 616717, "epoch": 7430} {"train_loss": -28.179248809814453, "global_step": 616718, "epoch": 7430} {"train_loss": -28.188602447509766, "global_step": 616719, "epoch": 7430} {"train_loss": -28.09600830078125, "global_step": 616720, "epoch": 7430} {"train_loss": -28.008481979370117, "global_step": 616721, "epoch": 7430} {"train_loss": -28.209949493408203, "global_step": 616722, "epoch": 7430} {"train_loss": -28.165607452392578, "global_step": 616723, "epoch": 7430} {"train_loss": -28.231542587280273, "global_step": 616724, "epoch": 7430} {"train_loss": -27.955236434936523, "global_step": 616725, "epoch": 7430} {"train_loss": -28.201452255249023, "global_step": 616726, "epoch": 7430} {"train_loss": -28.16535758972168, "global_step": 616727, "epoch": 7430} {"train_loss": -28.4395694732666, "global_step": 616728, "epoch": 7430} {"train_loss": -28.167524337768555, "global_step": 616729, "epoch": 7430} {"train_loss": -28.640058517456055, "global_step": 616730, "epoch": 7430} {"train_loss": -28.548446655273438, "global_step": 616731, "epoch": 7430} {"train_loss": -28.38785171508789, "global_step": 616732, "epoch": 7430} {"train_loss": -28.269323348999023, "global_step": 616733, "epoch": 7430} {"train_loss": -28.395313262939453, "global_step": 616734, "epoch": 7430} {"train_loss": -28.414060592651367, "global_step": 616735, "epoch": 7430} {"train_loss": -28.36334800720215, "global_step": 616736, "epoch": 7430} {"train_loss": -28.236886978149414, "global_step": 616737, "epoch": 7430} {"train_loss": -28.127044677734375, "global_step": 616738, "epoch": 7430} {"train_loss": -28.251789093017578, "global_step": 616739, "epoch": 7430} {"train_loss": -28.346654891967773, "global_step": 616740, "epoch": 7430} {"train_loss": -28.600439071655273, "global_step": 616741, "epoch": 7430} {"train_loss": -28.154464721679688, "global_step": 616742, "epoch": 7430} {"train_loss": -27.934772491455078, "global_step": 616743, "epoch": 7430} {"train_loss": -28.479894638061523, "global_step": 616744, "epoch": 7430} {"train_loss": -28.256458282470703, "global_step": 616745, "epoch": 7430} {"train_loss": -28.227203369140625, "global_step": 616746, "epoch": 7430} {"train_loss": -28.31886863708496, "global_step": 616747, "epoch": 7430} {"train_loss": -28.12868309020996, "global_step": 616748, "epoch": 7430} {"train_loss": -28.11631202697754, "global_step": 616749, "epoch": 7430} {"train_loss": -28.279224395751953, "global_step": 616750, "epoch": 7430} {"train_loss": -27.956594467163086, "global_step": 616751, "epoch": 7430} {"train_loss": -27.84524917602539, "global_step": 616752, "epoch": 7430} {"train_loss": -27.6411190032959, "global_step": 616753, "epoch": 7430} {"train_loss": -27.397693634033203, "global_step": 616754, "epoch": 7430} {"train_loss": -27.194339752197266, "global_step": 616755, "epoch": 7430} {"train_loss": -27.59711265563965, "global_step": 616756, "epoch": 7430} {"train_loss": -28.086563110351562, "global_step": 616757, "epoch": 7430} {"train_loss": -28.024158477783203, "global_step": 616758, "epoch": 7430} {"train_loss": -27.768360137939453, "global_step": 616759, "epoch": 7430} {"train_loss": -27.824512481689453, "global_step": 616760, "epoch": 7430} {"train_loss": -27.818708419799805, "global_step": 616761, "epoch": 7430} {"train_loss": -28.000873565673828, "global_step": 616762, "epoch": 7430} {"train_loss": -27.559484481811523, "global_step": 616763, "epoch": 7430} {"train_loss": -28.12684440612793, "global_step": 616764, "epoch": 7430} {"train_loss": -27.776288986206055, "global_step": 616765, "epoch": 7430} {"train_loss": -27.905675888061523, "global_step": 616766, "epoch": 7430} {"train_loss": -28.032424926757812, "global_step": 616767, "epoch": 7430} {"train_loss": -28.19654655456543, "global_step": 616768, "epoch": 7430} {"train_loss": -27.99408531188965, "global_step": 616769, "epoch": 7430} {"train_loss": -28.018299102783203, "global_step": 616770, "epoch": 7430} {"train_loss": -28.167510986328125, "global_step": 616771, "epoch": 7430} {"train_loss": -27.905986510127423, "global_step": 616772, "epoch": 7430, "val_loss": 6594625.0} {"train_loss": -27.914005279541016, "global_step": 616773, "epoch": 7431} {"train_loss": -28.334095001220703, "global_step": 616774, "epoch": 7431} {"train_loss": -27.81559181213379, "global_step": 616775, "epoch": 7431} {"train_loss": -28.38722038269043, "global_step": 616776, "epoch": 7431} {"train_loss": -27.55120849609375, "global_step": 616777, "epoch": 7431} {"train_loss": -27.94648551940918, "global_step": 616778, "epoch": 7431} {"train_loss": -27.926549911499023, "global_step": 616779, "epoch": 7431} {"train_loss": -27.6827449798584, "global_step": 616780, "epoch": 7431} {"train_loss": -27.798940658569336, "global_step": 616781, "epoch": 7431} {"train_loss": -27.58016014099121, "global_step": 616782, "epoch": 7431} {"train_loss": -28.148956298828125, "global_step": 616783, "epoch": 7431} {"train_loss": -28.080102920532227, "global_step": 616784, "epoch": 7431} {"train_loss": -27.76188087463379, "global_step": 616785, "epoch": 7431} {"train_loss": -28.06043815612793, "global_step": 616786, "epoch": 7431} {"train_loss": -27.96656608581543, "global_step": 616787, "epoch": 7431} {"train_loss": -28.224964141845703, "global_step": 616788, "epoch": 7431} {"train_loss": -28.173023223876953, "global_step": 616789, "epoch": 7431} {"train_loss": -28.215835571289062, "global_step": 616790, "epoch": 7431} {"train_loss": -27.957508087158203, "global_step": 616791, "epoch": 7431} {"train_loss": -28.050540924072266, "global_step": 616792, "epoch": 7431} {"train_loss": -28.201017379760742, "global_step": 616793, "epoch": 7431} {"train_loss": -27.86159324645996, "global_step": 616794, "epoch": 7431} {"train_loss": -27.956348419189453, "global_step": 616795, "epoch": 7431} {"train_loss": -28.060171127319336, "global_step": 616796, "epoch": 7431} {"train_loss": -27.82716941833496, "global_step": 616797, "epoch": 7431} {"train_loss": -28.540430068969727, "global_step": 616798, "epoch": 7431} {"train_loss": -28.25092887878418, "global_step": 616799, "epoch": 7431} {"train_loss": -28.621015548706055, "global_step": 616800, "epoch": 7431} {"train_loss": -28.41329002380371, "global_step": 616801, "epoch": 7431} {"train_loss": -28.08063316345215, "global_step": 616802, "epoch": 7431} {"train_loss": -28.3786563873291, "global_step": 616803, "epoch": 7431} {"train_loss": -27.9935302734375, "global_step": 616804, "epoch": 7431} {"train_loss": -28.06837272644043, "global_step": 616805, "epoch": 7431} {"train_loss": -28.2823486328125, "global_step": 616806, "epoch": 7431} {"train_loss": -28.30507469177246, "global_step": 616807, "epoch": 7431} {"train_loss": -28.409753799438477, "global_step": 616808, "epoch": 7431} {"train_loss": -28.670026779174805, "global_step": 616809, "epoch": 7431} {"train_loss": -28.44547462463379, "global_step": 616810, "epoch": 7431} {"train_loss": -28.363428115844727, "global_step": 616811, "epoch": 7431} {"train_loss": -28.072919845581055, "global_step": 616812, "epoch": 7431} {"train_loss": -28.01580238342285, "global_step": 616813, "epoch": 7431} {"train_loss": -27.974782943725586, "global_step": 616814, "epoch": 7431} {"train_loss": -27.84877586364746, "global_step": 616815, "epoch": 7431} {"train_loss": -28.0803279876709, "global_step": 616816, "epoch": 7431} {"train_loss": -28.166004180908203, "global_step": 616817, "epoch": 7431} {"train_loss": -28.43879508972168, "global_step": 616818, "epoch": 7431} {"train_loss": -28.26068115234375, "global_step": 616819, "epoch": 7431} {"train_loss": -27.75587272644043, "global_step": 616820, "epoch": 7431} {"train_loss": -28.147424697875977, "global_step": 616821, "epoch": 7431} {"train_loss": -27.84235191345215, "global_step": 616822, "epoch": 7431} {"train_loss": -27.351537704467773, "global_step": 616823, "epoch": 7431} {"train_loss": -27.7966365814209, "global_step": 616824, "epoch": 7431} {"train_loss": -28.221715927124023, "global_step": 616825, "epoch": 7431} {"train_loss": -27.918811798095703, "global_step": 616826, "epoch": 7431} {"train_loss": -28.147342681884766, "global_step": 616827, "epoch": 7431} {"train_loss": -27.919240951538086, "global_step": 616828, "epoch": 7431} {"train_loss": -28.0035457611084, "global_step": 616829, "epoch": 7431} {"train_loss": -28.295654296875, "global_step": 616830, "epoch": 7431} {"train_loss": -28.041269302368164, "global_step": 616831, "epoch": 7431} {"train_loss": -28.309619903564453, "global_step": 616832, "epoch": 7431} {"train_loss": -27.959033966064453, "global_step": 616833, "epoch": 7431} {"train_loss": -28.042926788330078, "global_step": 616834, "epoch": 7431} {"train_loss": -28.53162956237793, "global_step": 616835, "epoch": 7431} {"train_loss": -28.109312057495117, "global_step": 616836, "epoch": 7431} {"train_loss": -27.96990966796875, "global_step": 616837, "epoch": 7431} {"train_loss": -28.12822914123535, "global_step": 616838, "epoch": 7431} {"train_loss": -27.956851959228516, "global_step": 616839, "epoch": 7431} {"train_loss": -27.649066925048828, "global_step": 616840, "epoch": 7431} {"train_loss": -27.90569496154785, "global_step": 616841, "epoch": 7431} {"train_loss": -28.2091064453125, "global_step": 616842, "epoch": 7431} {"train_loss": -28.16179847717285, "global_step": 616843, "epoch": 7431} {"train_loss": -28.178070068359375, "global_step": 616844, "epoch": 7431} {"train_loss": -28.17530632019043, "global_step": 616845, "epoch": 7431} {"train_loss": -28.228418350219727, "global_step": 616846, "epoch": 7431} {"train_loss": -28.099380493164062, "global_step": 616847, "epoch": 7431} {"train_loss": -28.059085845947266, "global_step": 616848, "epoch": 7431} {"train_loss": -28.148237228393555, "global_step": 616849, "epoch": 7431} {"train_loss": -28.14353370666504, "global_step": 616850, "epoch": 7431} {"train_loss": -28.377857208251953, "global_step": 616851, "epoch": 7431} {"train_loss": -28.30231285095215, "global_step": 616852, "epoch": 7431} {"train_loss": -28.400808334350586, "global_step": 616853, "epoch": 7431} {"train_loss": -28.261157989501953, "global_step": 616854, "epoch": 7431} {"train_loss": -28.105198848678405, "global_step": 616855, "epoch": 7431, "val_loss": 6587112.5} {"train_loss": -27.57196617126465, "global_step": 616856, "epoch": 7432} {"train_loss": -27.91861915588379, "global_step": 616857, "epoch": 7432} {"train_loss": -27.794889450073242, "global_step": 616858, "epoch": 7432} {"train_loss": -27.9848575592041, "global_step": 616859, "epoch": 7432} {"train_loss": -27.74207878112793, "global_step": 616860, "epoch": 7432} {"train_loss": -27.95110511779785, "global_step": 616861, "epoch": 7432} {"train_loss": -28.161731719970703, "global_step": 616862, "epoch": 7432} {"train_loss": -28.19318962097168, "global_step": 616863, "epoch": 7432} {"train_loss": -28.08595085144043, "global_step": 616864, "epoch": 7432} {"train_loss": -28.27680778503418, "global_step": 616865, "epoch": 7432} {"train_loss": -27.928144454956055, "global_step": 616866, "epoch": 7432} {"train_loss": -28.489294052124023, "global_step": 616867, "epoch": 7432} {"train_loss": -27.29233169555664, "global_step": 616868, "epoch": 7432} {"train_loss": -27.959918975830078, "global_step": 616869, "epoch": 7432} {"train_loss": -27.081613540649414, "global_step": 616870, "epoch": 7432} {"train_loss": -27.572662353515625, "global_step": 616871, "epoch": 7432} {"train_loss": -28.0653018951416, "global_step": 616872, "epoch": 7432} {"train_loss": -28.27535057067871, "global_step": 616873, "epoch": 7432} {"train_loss": -28.115949630737305, "global_step": 616874, "epoch": 7432} {"train_loss": -27.982894897460938, "global_step": 616875, "epoch": 7432} {"train_loss": -27.8015079498291, "global_step": 616876, "epoch": 7432} {"train_loss": -28.025583267211914, "global_step": 616877, "epoch": 7432} {"train_loss": -28.08392906188965, "global_step": 616878, "epoch": 7432} {"train_loss": -28.139028549194336, "global_step": 616879, "epoch": 7432} {"train_loss": -28.338537216186523, "global_step": 616880, "epoch": 7432} {"train_loss": -28.04486656188965, "global_step": 616881, "epoch": 7432} {"train_loss": -28.064611434936523, "global_step": 616882, "epoch": 7432} {"train_loss": -27.96332359313965, "global_step": 616883, "epoch": 7432} {"train_loss": -28.00567054748535, "global_step": 616884, "epoch": 7432} {"train_loss": -28.080982208251953, "global_step": 616885, "epoch": 7432} {"train_loss": -27.8248348236084, "global_step": 616886, "epoch": 7432} {"train_loss": -27.793872833251953, "global_step": 616887, "epoch": 7432} {"train_loss": -28.66715431213379, "global_step": 616888, "epoch": 7432} {"train_loss": -28.07866859436035, "global_step": 616889, "epoch": 7432} {"train_loss": -28.352930068969727, "global_step": 616890, "epoch": 7432} {"train_loss": -28.006994247436523, "global_step": 616891, "epoch": 7432} {"train_loss": -28.059843063354492, "global_step": 616892, "epoch": 7432} {"train_loss": -28.06180763244629, "global_step": 616893, "epoch": 7432} {"train_loss": -27.911304473876953, "global_step": 616894, "epoch": 7432} {"train_loss": -27.79345703125, "global_step": 616895, "epoch": 7432} {"train_loss": -28.331390380859375, "global_step": 616896, "epoch": 7432} {"train_loss": -28.201440811157227, "global_step": 616897, "epoch": 7432} {"train_loss": -28.296680450439453, "global_step": 616898, "epoch": 7432} {"train_loss": -28.01468849182129, "global_step": 616899, "epoch": 7432} {"train_loss": -28.239038467407227, "global_step": 616900, "epoch": 7432} {"train_loss": -27.8173885345459, "global_step": 616901, "epoch": 7432} {"train_loss": -28.3242130279541, "global_step": 616902, "epoch": 7432} {"train_loss": -28.096012115478516, "global_step": 616903, "epoch": 7432} {"train_loss": -28.302093505859375, "global_step": 616904, "epoch": 7432} {"train_loss": -27.69816017150879, "global_step": 616905, "epoch": 7432} {"train_loss": -28.342823028564453, "global_step": 616906, "epoch": 7432} {"train_loss": -28.426008224487305, "global_step": 616907, "epoch": 7432} {"train_loss": -28.221479415893555, "global_step": 616908, "epoch": 7432} {"train_loss": -28.376300811767578, "global_step": 616909, "epoch": 7432} {"train_loss": -28.297163009643555, "global_step": 616910, "epoch": 7432} {"train_loss": -28.313772201538086, "global_step": 616911, "epoch": 7432} {"train_loss": -28.230987548828125, "global_step": 616912, "epoch": 7432} {"train_loss": -28.575735092163086, "global_step": 616913, "epoch": 7432} {"train_loss": -28.21172523498535, "global_step": 616914, "epoch": 7432} {"train_loss": -27.939380645751953, "global_step": 616915, "epoch": 7432} {"train_loss": -27.95993995666504, "global_step": 616916, "epoch": 7432} {"train_loss": -27.840137481689453, "global_step": 616917, "epoch": 7432} {"train_loss": -27.965728759765625, "global_step": 616918, "epoch": 7432} {"train_loss": -27.950796127319336, "global_step": 616919, "epoch": 7432} {"train_loss": -27.981931686401367, "global_step": 616920, "epoch": 7432} {"train_loss": -28.35304069519043, "global_step": 616921, "epoch": 7432} {"train_loss": -28.07744789123535, "global_step": 616922, "epoch": 7432} {"train_loss": -28.3824520111084, "global_step": 616923, "epoch": 7432} {"train_loss": -27.800861358642578, "global_step": 616924, "epoch": 7432} {"train_loss": -28.277179718017578, "global_step": 616925, "epoch": 7432} {"train_loss": -27.920469284057617, "global_step": 616926, "epoch": 7432} {"train_loss": -27.941797256469727, "global_step": 616927, "epoch": 7432} {"train_loss": -27.70767593383789, "global_step": 616928, "epoch": 7432} {"train_loss": -28.2796573638916, "global_step": 616929, "epoch": 7432} {"train_loss": -28.0477294921875, "global_step": 616930, "epoch": 7432} {"train_loss": -28.224462509155273, "global_step": 616931, "epoch": 7432} {"train_loss": -27.82413673400879, "global_step": 616932, "epoch": 7432} {"train_loss": -28.327106475830078, "global_step": 616933, "epoch": 7432} {"train_loss": -28.04444694519043, "global_step": 616934, "epoch": 7432} {"train_loss": -28.089679718017578, "global_step": 616935, "epoch": 7432} {"train_loss": -28.115222930908203, "global_step": 616936, "epoch": 7432} {"train_loss": -27.818206787109375, "global_step": 616937, "epoch": 7432} {"train_loss": -28.05807830626706, "global_step": 616938, "epoch": 7432, "val_loss": 6553765.0} {"train_loss": -27.7476749420166, "global_step": 616939, "epoch": 7433} {"train_loss": -27.313634872436523, "global_step": 616940, "epoch": 7433} {"train_loss": -27.114913940429688, "global_step": 616941, "epoch": 7433} {"train_loss": -26.912145614624023, "global_step": 616942, "epoch": 7433} {"train_loss": -26.900348663330078, "global_step": 616943, "epoch": 7433} {"train_loss": -27.431005477905273, "global_step": 616944, "epoch": 7433} {"train_loss": -27.694690704345703, "global_step": 616945, "epoch": 7433} {"train_loss": -27.32172203063965, "global_step": 616946, "epoch": 7433} {"train_loss": -27.946063995361328, "global_step": 616947, "epoch": 7433} {"train_loss": -27.697412490844727, "global_step": 616948, "epoch": 7433} {"train_loss": -28.009021759033203, "global_step": 616949, "epoch": 7433} {"train_loss": -27.548233032226562, "global_step": 616950, "epoch": 7433} {"train_loss": -27.95572853088379, "global_step": 616951, "epoch": 7433} {"train_loss": -27.89383888244629, "global_step": 616952, "epoch": 7433} {"train_loss": -28.018579483032227, "global_step": 616953, "epoch": 7433} {"train_loss": -27.5594482421875, "global_step": 616954, "epoch": 7433} {"train_loss": -28.062240600585938, "global_step": 616955, "epoch": 7433} {"train_loss": -27.7410888671875, "global_step": 616956, "epoch": 7433} {"train_loss": -28.025222778320312, "global_step": 616957, "epoch": 7433} {"train_loss": -28.023284912109375, "global_step": 616958, "epoch": 7433} {"train_loss": -27.88193702697754, "global_step": 616959, "epoch": 7433} {"train_loss": -27.98575210571289, "global_step": 616960, "epoch": 7433} {"train_loss": -27.862546920776367, "global_step": 616961, "epoch": 7433} {"train_loss": -27.986194610595703, "global_step": 616962, "epoch": 7433} {"train_loss": -28.192346572875977, "global_step": 616963, "epoch": 7433} {"train_loss": -28.23282241821289, "global_step": 616964, "epoch": 7433} {"train_loss": -28.3681583404541, "global_step": 616965, "epoch": 7433} {"train_loss": -28.18389320373535, "global_step": 616966, "epoch": 7433} {"train_loss": -28.042221069335938, "global_step": 616967, "epoch": 7433} {"train_loss": -28.27666664123535, "global_step": 616968, "epoch": 7433} {"train_loss": -28.259479522705078, "global_step": 616969, "epoch": 7433} {"train_loss": -28.632238388061523, "global_step": 616970, "epoch": 7433} {"train_loss": -28.26759910583496, "global_step": 616971, "epoch": 7433} {"train_loss": -28.320661544799805, "global_step": 616972, "epoch": 7433} {"train_loss": -28.163557052612305, "global_step": 616973, "epoch": 7433} {"train_loss": -28.221923828125, "global_step": 616974, "epoch": 7433} {"train_loss": -28.344715118408203, "global_step": 616975, "epoch": 7433} {"train_loss": -28.4055118560791, "global_step": 616976, "epoch": 7433} {"train_loss": -28.378768920898438, "global_step": 616977, "epoch": 7433} {"train_loss": -28.430267333984375, "global_step": 616978, "epoch": 7433} {"train_loss": -28.30132484436035, "global_step": 616979, "epoch": 7433} {"train_loss": -28.503671646118164, "global_step": 616980, "epoch": 7433} {"train_loss": -27.973712921142578, "global_step": 616981, "epoch": 7433} {"train_loss": -28.089466094970703, "global_step": 616982, "epoch": 7433} {"train_loss": -28.389432907104492, "global_step": 616983, "epoch": 7433} {"train_loss": -27.796344757080078, "global_step": 616984, "epoch": 7433} {"train_loss": -28.20985221862793, "global_step": 616985, "epoch": 7433} {"train_loss": -28.174951553344727, "global_step": 616986, "epoch": 7433} {"train_loss": -28.422388076782227, "global_step": 616987, "epoch": 7433} {"train_loss": -28.343738555908203, "global_step": 616988, "epoch": 7433} {"train_loss": -28.43302345275879, "global_step": 616989, "epoch": 7433} {"train_loss": -28.37928581237793, "global_step": 616990, "epoch": 7433} {"train_loss": -28.27435302734375, "global_step": 616991, "epoch": 7433} {"train_loss": -28.33967399597168, "global_step": 616992, "epoch": 7433} {"train_loss": -28.39373207092285, "global_step": 616993, "epoch": 7433} {"train_loss": -27.92842674255371, "global_step": 616994, "epoch": 7433} {"train_loss": -27.782743453979492, "global_step": 616995, "epoch": 7433} {"train_loss": -27.977375030517578, "global_step": 616996, "epoch": 7433} {"train_loss": -28.17950439453125, "global_step": 616997, "epoch": 7433} {"train_loss": -27.686033248901367, "global_step": 616998, "epoch": 7433} {"train_loss": -27.476850509643555, "global_step": 616999, "epoch": 7433} {"train_loss": -26.588464736938477, "global_step": 617000, "epoch": 7433} {"train_loss": -27.42011070251465, "global_step": 617001, "epoch": 7433} {"train_loss": -27.70912742614746, "global_step": 617002, "epoch": 7433} {"train_loss": -27.393911361694336, "global_step": 617003, "epoch": 7433} {"train_loss": -27.31951332092285, "global_step": 617004, "epoch": 7433} {"train_loss": -27.811676025390625, "global_step": 617005, "epoch": 7433} {"train_loss": -27.682422637939453, "global_step": 617006, "epoch": 7433} {"train_loss": -28.1441707611084, "global_step": 617007, "epoch": 7433} {"train_loss": -28.064319610595703, "global_step": 617008, "epoch": 7433} {"train_loss": -27.866907119750977, "global_step": 617009, "epoch": 7433} {"train_loss": -28.067590713500977, "global_step": 617010, "epoch": 7433} {"train_loss": -28.38681983947754, "global_step": 617011, "epoch": 7433} {"train_loss": -27.842565536499023, "global_step": 617012, "epoch": 7433} {"train_loss": -27.752904891967773, "global_step": 617013, "epoch": 7433} {"train_loss": -27.622732162475586, "global_step": 617014, "epoch": 7433} {"train_loss": -28.515064239501953, "global_step": 617015, "epoch": 7433} {"train_loss": -28.152929306030273, "global_step": 617016, "epoch": 7433} {"train_loss": -27.985748291015625, "global_step": 617017, "epoch": 7433} {"train_loss": -27.930435180664062, "global_step": 617018, "epoch": 7433} {"train_loss": -27.77558708190918, "global_step": 617019, "epoch": 7433} {"train_loss": -28.209156036376953, "global_step": 617020, "epoch": 7433} {"train_loss": -27.979302004159216, "global_step": 617021, "epoch": 7433, "val_loss": 6563471.0} {"train_loss": -27.759668350219727, "global_step": 617022, "epoch": 7434} {"train_loss": -27.19955825805664, "global_step": 617023, "epoch": 7434} {"train_loss": -27.41213035583496, "global_step": 617024, "epoch": 7434} {"train_loss": -27.0566349029541, "global_step": 617025, "epoch": 7434} {"train_loss": -27.09469985961914, "global_step": 617026, "epoch": 7434} {"train_loss": -27.489582061767578, "global_step": 617027, "epoch": 7434} {"train_loss": -27.372833251953125, "global_step": 617028, "epoch": 7434} {"train_loss": -26.97953224182129, "global_step": 617029, "epoch": 7434} {"train_loss": -27.19121742248535, "global_step": 617030, "epoch": 7434} {"train_loss": -27.48261070251465, "global_step": 617031, "epoch": 7434} {"train_loss": -27.325641632080078, "global_step": 617032, "epoch": 7434} {"train_loss": -27.362024307250977, "global_step": 617033, "epoch": 7434} {"train_loss": -27.863370895385742, "global_step": 617034, "epoch": 7434} {"train_loss": -27.65668296813965, "global_step": 617035, "epoch": 7434} {"train_loss": -27.569318771362305, "global_step": 617036, "epoch": 7434} {"train_loss": -27.949264526367188, "global_step": 617037, "epoch": 7434} {"train_loss": -27.90865135192871, "global_step": 617038, "epoch": 7434} {"train_loss": -28.2033748626709, "global_step": 617039, "epoch": 7434} {"train_loss": -28.018543243408203, "global_step": 617040, "epoch": 7434} {"train_loss": -27.72723960876465, "global_step": 617041, "epoch": 7434} {"train_loss": -27.73577308654785, "global_step": 617042, "epoch": 7434} {"train_loss": -28.233673095703125, "global_step": 617043, "epoch": 7434} {"train_loss": -27.92935562133789, "global_step": 617044, "epoch": 7434} {"train_loss": -27.96345329284668, "global_step": 617045, "epoch": 7434} {"train_loss": -28.14914894104004, "global_step": 617046, "epoch": 7434} {"train_loss": -27.659032821655273, "global_step": 617047, "epoch": 7434} {"train_loss": -28.270578384399414, "global_step": 617048, "epoch": 7434} {"train_loss": -28.001678466796875, "global_step": 617049, "epoch": 7434} {"train_loss": -28.307830810546875, "global_step": 617050, "epoch": 7434} {"train_loss": -28.12347412109375, "global_step": 617051, "epoch": 7434} {"train_loss": -27.936609268188477, "global_step": 617052, "epoch": 7434} {"train_loss": -28.18697166442871, "global_step": 617053, "epoch": 7434} {"train_loss": -28.258716583251953, "global_step": 617054, "epoch": 7434} {"train_loss": -28.2099666595459, "global_step": 617055, "epoch": 7434} {"train_loss": -27.963668823242188, "global_step": 617056, "epoch": 7434} {"train_loss": -28.48227882385254, "global_step": 617057, "epoch": 7434} {"train_loss": -28.184173583984375, "global_step": 617058, "epoch": 7434} {"train_loss": -28.202543258666992, "global_step": 617059, "epoch": 7434} {"train_loss": -27.896081924438477, "global_step": 617060, "epoch": 7434} {"train_loss": -28.020965576171875, "global_step": 617061, "epoch": 7434} {"train_loss": -28.124547958374023, "global_step": 617062, "epoch": 7434} {"train_loss": -28.260272979736328, "global_step": 617063, "epoch": 7434} {"train_loss": -28.235754013061523, "global_step": 617064, "epoch": 7434} {"train_loss": -28.39166259765625, "global_step": 617065, "epoch": 7434} {"train_loss": -27.90297508239746, "global_step": 617066, "epoch": 7434} {"train_loss": -28.014007568359375, "global_step": 617067, "epoch": 7434} {"train_loss": -27.70880699157715, "global_step": 617068, "epoch": 7434} {"train_loss": -27.947818756103516, "global_step": 617069, "epoch": 7434} {"train_loss": -27.7318115234375, "global_step": 617070, "epoch": 7434} {"train_loss": -27.53595542907715, "global_step": 617071, "epoch": 7434} {"train_loss": -27.714139938354492, "global_step": 617072, "epoch": 7434} {"train_loss": -27.855976104736328, "global_step": 617073, "epoch": 7434} {"train_loss": -27.806493759155273, "global_step": 617074, "epoch": 7434} {"train_loss": -28.477392196655273, "global_step": 617075, "epoch": 7434} {"train_loss": -27.97505760192871, "global_step": 617076, "epoch": 7434} {"train_loss": -27.4268856048584, "global_step": 617077, "epoch": 7434} {"train_loss": -27.883426666259766, "global_step": 617078, "epoch": 7434} {"train_loss": -28.0336971282959, "global_step": 617079, "epoch": 7434} {"train_loss": -27.688405990600586, "global_step": 617080, "epoch": 7434} {"train_loss": -27.560949325561523, "global_step": 617081, "epoch": 7434} {"train_loss": -28.280237197875977, "global_step": 617082, "epoch": 7434} {"train_loss": -28.0648250579834, "global_step": 617083, "epoch": 7434} {"train_loss": -28.170166015625, "global_step": 617084, "epoch": 7434} {"train_loss": -27.85066032409668, "global_step": 617085, "epoch": 7434} {"train_loss": -28.20206642150879, "global_step": 617086, "epoch": 7434} {"train_loss": -28.288787841796875, "global_step": 617087, "epoch": 7434} {"train_loss": -27.995574951171875, "global_step": 617088, "epoch": 7434} {"train_loss": -28.170379638671875, "global_step": 617089, "epoch": 7434} {"train_loss": -28.128494262695312, "global_step": 617090, "epoch": 7434} {"train_loss": -28.53643226623535, "global_step": 617091, "epoch": 7434} {"train_loss": -28.335790634155273, "global_step": 617092, "epoch": 7434} {"train_loss": -28.327869415283203, "global_step": 617093, "epoch": 7434} {"train_loss": -27.685998916625977, "global_step": 617094, "epoch": 7434} {"train_loss": -28.105091094970703, "global_step": 617095, "epoch": 7434} {"train_loss": -27.717931747436523, "global_step": 617096, "epoch": 7434} {"train_loss": -28.29387855529785, "global_step": 617097, "epoch": 7434} {"train_loss": -27.890777587890625, "global_step": 617098, "epoch": 7434} {"train_loss": -28.325712203979492, "global_step": 617099, "epoch": 7434} {"train_loss": -28.260467529296875, "global_step": 617100, "epoch": 7434} {"train_loss": -27.748029708862305, "global_step": 617101, "epoch": 7434} {"train_loss": -27.778217315673828, "global_step": 617102, "epoch": 7434} {"train_loss": -27.65192985534668, "global_step": 617103, "epoch": 7434} {"train_loss": -27.899235644972467, "global_step": 617104, "epoch": 7434, "val_loss": 6636672.5} {"train_loss": -27.411218643188477, "global_step": 617105, "epoch": 7435} {"train_loss": -27.185224533081055, "global_step": 617106, "epoch": 7435} {"train_loss": -27.335620880126953, "global_step": 617107, "epoch": 7435} {"train_loss": -27.1762752532959, "global_step": 617108, "epoch": 7435} {"train_loss": -27.39163589477539, "global_step": 617109, "epoch": 7435} {"train_loss": -27.138967514038086, "global_step": 617110, "epoch": 7435} {"train_loss": -27.160547256469727, "global_step": 617111, "epoch": 7435} {"train_loss": -26.79501724243164, "global_step": 617112, "epoch": 7435} {"train_loss": -27.793100357055664, "global_step": 617113, "epoch": 7435} {"train_loss": -27.291126251220703, "global_step": 617114, "epoch": 7435} {"train_loss": -27.709857940673828, "global_step": 617115, "epoch": 7435} {"train_loss": -27.670499801635742, "global_step": 617116, "epoch": 7435} {"train_loss": -27.704092025756836, "global_step": 617117, "epoch": 7435} {"train_loss": -27.572433471679688, "global_step": 617118, "epoch": 7435} {"train_loss": -27.679086685180664, "global_step": 617119, "epoch": 7435} {"train_loss": -27.67732810974121, "global_step": 617120, "epoch": 7435} {"train_loss": -27.858585357666016, "global_step": 617121, "epoch": 7435} {"train_loss": -27.856603622436523, "global_step": 617122, "epoch": 7435} {"train_loss": -27.659772872924805, "global_step": 617123, "epoch": 7435} {"train_loss": -27.7448787689209, "global_step": 617124, "epoch": 7435} {"train_loss": -27.93169593811035, "global_step": 617125, "epoch": 7435} {"train_loss": -27.496801376342773, "global_step": 617126, "epoch": 7435} {"train_loss": -27.789587020874023, "global_step": 617127, "epoch": 7435} {"train_loss": -27.965551376342773, "global_step": 617128, "epoch": 7435} {"train_loss": -27.738065719604492, "global_step": 617129, "epoch": 7435} {"train_loss": -27.78964614868164, "global_step": 617130, "epoch": 7435} {"train_loss": -27.9639835357666, "global_step": 617131, "epoch": 7435} {"train_loss": -27.6375789642334, "global_step": 617132, "epoch": 7435} {"train_loss": -28.160205841064453, "global_step": 617133, "epoch": 7435} {"train_loss": -27.550199508666992, "global_step": 617134, "epoch": 7435} {"train_loss": -27.990182876586914, "global_step": 617135, "epoch": 7435} {"train_loss": -27.853071212768555, "global_step": 617136, "epoch": 7435} {"train_loss": -28.224950790405273, "global_step": 617137, "epoch": 7435} {"train_loss": -28.453027725219727, "global_step": 617138, "epoch": 7435} {"train_loss": -27.92002296447754, "global_step": 617139, "epoch": 7435} {"train_loss": -28.312820434570312, "global_step": 617140, "epoch": 7435} {"train_loss": -27.935728073120117, "global_step": 617141, "epoch": 7435} {"train_loss": -27.921918869018555, "global_step": 617142, "epoch": 7435} {"train_loss": -27.640310287475586, "global_step": 617143, "epoch": 7435} {"train_loss": -28.349323272705078, "global_step": 617144, "epoch": 7435} {"train_loss": -28.201452255249023, "global_step": 617145, "epoch": 7435} {"train_loss": -27.97393798828125, "global_step": 617146, "epoch": 7435} {"train_loss": -28.471725463867188, "global_step": 617147, "epoch": 7435} {"train_loss": -28.537200927734375, "global_step": 617148, "epoch": 7435} {"train_loss": -28.229461669921875, "global_step": 617149, "epoch": 7435} {"train_loss": -28.472143173217773, "global_step": 617150, "epoch": 7435} {"train_loss": -28.273517608642578, "global_step": 617151, "epoch": 7435} {"train_loss": -28.1715087890625, "global_step": 617152, "epoch": 7435} {"train_loss": -28.21488380432129, "global_step": 617153, "epoch": 7435} {"train_loss": -27.958770751953125, "global_step": 617154, "epoch": 7435} {"train_loss": -28.414148330688477, "global_step": 617155, "epoch": 7435} {"train_loss": -28.322681427001953, "global_step": 617156, "epoch": 7435} {"train_loss": -28.7308292388916, "global_step": 617157, "epoch": 7435} {"train_loss": -28.06267738342285, "global_step": 617158, "epoch": 7435} {"train_loss": -28.33868408203125, "global_step": 617159, "epoch": 7435} {"train_loss": -28.615528106689453, "global_step": 617160, "epoch": 7435} {"train_loss": -27.88232421875, "global_step": 617161, "epoch": 7435} {"train_loss": -28.0446720123291, "global_step": 617162, "epoch": 7435} {"train_loss": -27.775049209594727, "global_step": 617163, "epoch": 7435} {"train_loss": -27.793424606323242, "global_step": 617164, "epoch": 7435} {"train_loss": -28.27142333984375, "global_step": 617165, "epoch": 7435} {"train_loss": -28.121973037719727, "global_step": 617166, "epoch": 7435} {"train_loss": -28.074377059936523, "global_step": 617167, "epoch": 7435} {"train_loss": -27.565555572509766, "global_step": 617168, "epoch": 7435} {"train_loss": -28.17249870300293, "global_step": 617169, "epoch": 7435} {"train_loss": -28.285879135131836, "global_step": 617170, "epoch": 7435} {"train_loss": -27.87935447692871, "global_step": 617171, "epoch": 7435} {"train_loss": -28.064802169799805, "global_step": 617172, "epoch": 7435} {"train_loss": -28.128488540649414, "global_step": 617173, "epoch": 7435} {"train_loss": -28.75762939453125, "global_step": 617174, "epoch": 7435} {"train_loss": -27.93572998046875, "global_step": 617175, "epoch": 7435} {"train_loss": -28.15576171875, "global_step": 617176, "epoch": 7435} {"train_loss": -28.199878692626953, "global_step": 617177, "epoch": 7435} {"train_loss": -28.366779327392578, "global_step": 617178, "epoch": 7435} {"train_loss": -28.23981285095215, "global_step": 617179, "epoch": 7435} {"train_loss": -28.262842178344727, "global_step": 617180, "epoch": 7435} {"train_loss": -28.487478256225586, "global_step": 617181, "epoch": 7435} {"train_loss": -28.53857421875, "global_step": 617182, "epoch": 7435} {"train_loss": -28.190046310424805, "global_step": 617183, "epoch": 7435} {"train_loss": -28.323949813842773, "global_step": 617184, "epoch": 7435} {"train_loss": -28.3074893951416, "global_step": 617185, "epoch": 7435} {"train_loss": -28.247800827026367, "global_step": 617186, "epoch": 7435} {"train_loss": -27.980423548135413, "global_step": 617187, "epoch": 7435, "val_loss": 6560421.0} {"train_loss": -27.182926177978516, "global_step": 617188, "epoch": 7436} {"train_loss": -27.76511001586914, "global_step": 617189, "epoch": 7436} {"train_loss": -28.15555763244629, "global_step": 617190, "epoch": 7436} {"train_loss": -27.730209350585938, "global_step": 617191, "epoch": 7436} {"train_loss": -27.91578483581543, "global_step": 617192, "epoch": 7436} {"train_loss": -27.72127342224121, "global_step": 617193, "epoch": 7436} {"train_loss": -27.266157150268555, "global_step": 617194, "epoch": 7436} {"train_loss": -27.0147762298584, "global_step": 617195, "epoch": 7436} {"train_loss": -26.412139892578125, "global_step": 617196, "epoch": 7436} {"train_loss": -27.574750900268555, "global_step": 617197, "epoch": 7436} {"train_loss": -27.1358642578125, "global_step": 617198, "epoch": 7436} {"train_loss": -27.37833023071289, "global_step": 617199, "epoch": 7436} {"train_loss": -27.673542022705078, "global_step": 617200, "epoch": 7436} {"train_loss": -27.477069854736328, "global_step": 617201, "epoch": 7436} {"train_loss": -27.622812271118164, "global_step": 617202, "epoch": 7436} {"train_loss": -27.995990753173828, "global_step": 617203, "epoch": 7436} {"train_loss": -28.0401554107666, "global_step": 617204, "epoch": 7436} {"train_loss": -27.6009521484375, "global_step": 617205, "epoch": 7436} {"train_loss": -27.682294845581055, "global_step": 617206, "epoch": 7436} {"train_loss": -27.81573486328125, "global_step": 617207, "epoch": 7436} {"train_loss": -27.540510177612305, "global_step": 617208, "epoch": 7436} {"train_loss": -27.653711318969727, "global_step": 617209, "epoch": 7436} {"train_loss": -27.659687042236328, "global_step": 617210, "epoch": 7436} {"train_loss": -27.69484519958496, "global_step": 617211, "epoch": 7436} {"train_loss": -27.690185546875, "global_step": 617212, "epoch": 7436} {"train_loss": -28.004867553710938, "global_step": 617213, "epoch": 7436} {"train_loss": -27.925378799438477, "global_step": 617214, "epoch": 7436} {"train_loss": -27.81074333190918, "global_step": 617215, "epoch": 7436} {"train_loss": -28.34221839904785, "global_step": 617216, "epoch": 7436} {"train_loss": -27.678064346313477, "global_step": 617217, "epoch": 7436} {"train_loss": -28.45224952697754, "global_step": 617218, "epoch": 7436} {"train_loss": -27.785444259643555, "global_step": 617219, "epoch": 7436} {"train_loss": -27.420948028564453, "global_step": 617220, "epoch": 7436} {"train_loss": -28.222198486328125, "global_step": 617221, "epoch": 7436} {"train_loss": -28.042144775390625, "global_step": 617222, "epoch": 7436} {"train_loss": -28.013275146484375, "global_step": 617223, "epoch": 7436} {"train_loss": -27.929595947265625, "global_step": 617224, "epoch": 7436} {"train_loss": -28.182859420776367, "global_step": 617225, "epoch": 7436} {"train_loss": -28.137113571166992, "global_step": 617226, "epoch": 7436} {"train_loss": -28.18497657775879, "global_step": 617227, "epoch": 7436} {"train_loss": -27.994922637939453, "global_step": 617228, "epoch": 7436} {"train_loss": -28.522659301757812, "global_step": 617229, "epoch": 7436} {"train_loss": -27.819101333618164, "global_step": 617230, "epoch": 7436} {"train_loss": -28.22879409790039, "global_step": 617231, "epoch": 7436} {"train_loss": -27.824298858642578, "global_step": 617232, "epoch": 7436} {"train_loss": -28.4598445892334, "global_step": 617233, "epoch": 7436} {"train_loss": -28.438199996948242, "global_step": 617234, "epoch": 7436} {"train_loss": -28.577606201171875, "global_step": 617235, "epoch": 7436} {"train_loss": -28.384912490844727, "global_step": 617236, "epoch": 7436} {"train_loss": -28.21969985961914, "global_step": 617237, "epoch": 7436} {"train_loss": -28.28688621520996, "global_step": 617238, "epoch": 7436} {"train_loss": -28.51836585998535, "global_step": 617239, "epoch": 7436} {"train_loss": -28.2584228515625, "global_step": 617240, "epoch": 7436} {"train_loss": -28.273212432861328, "global_step": 617241, "epoch": 7436} {"train_loss": -28.387983322143555, "global_step": 617242, "epoch": 7436} {"train_loss": -28.235326766967773, "global_step": 617243, "epoch": 7436} {"train_loss": -28.57221031188965, "global_step": 617244, "epoch": 7436} {"train_loss": -28.175525665283203, "global_step": 617245, "epoch": 7436} {"train_loss": -28.12973976135254, "global_step": 617246, "epoch": 7436} {"train_loss": -28.623279571533203, "global_step": 617247, "epoch": 7436} {"train_loss": -28.17854881286621, "global_step": 617248, "epoch": 7436} {"train_loss": -27.8509521484375, "global_step": 617249, "epoch": 7436} {"train_loss": -27.85711097717285, "global_step": 617250, "epoch": 7436} {"train_loss": -27.571277618408203, "global_step": 617251, "epoch": 7436} {"train_loss": -28.05478858947754, "global_step": 617252, "epoch": 7436} {"train_loss": -28.116125106811523, "global_step": 617253, "epoch": 7436} {"train_loss": -28.19378089904785, "global_step": 617254, "epoch": 7436} {"train_loss": -27.649311065673828, "global_step": 617255, "epoch": 7436} {"train_loss": -28.296344757080078, "global_step": 617256, "epoch": 7436} {"train_loss": -27.798688888549805, "global_step": 617257, "epoch": 7436} {"train_loss": -27.63230323791504, "global_step": 617258, "epoch": 7436} {"train_loss": -27.9173641204834, "global_step": 617259, "epoch": 7436} {"train_loss": -27.67083740234375, "global_step": 617260, "epoch": 7436} {"train_loss": -28.432493209838867, "global_step": 617261, "epoch": 7436} {"train_loss": -28.10687255859375, "global_step": 617262, "epoch": 7436} {"train_loss": -27.9702091217041, "global_step": 617263, "epoch": 7436} {"train_loss": -28.0604305267334, "global_step": 617264, "epoch": 7436} {"train_loss": -28.0008544921875, "global_step": 617265, "epoch": 7436} {"train_loss": -28.13103675842285, "global_step": 617266, "epoch": 7436} {"train_loss": -28.006025314331055, "global_step": 617267, "epoch": 7436} {"train_loss": -28.081924438476562, "global_step": 617268, "epoch": 7436} {"train_loss": -27.74220085144043, "global_step": 617269, "epoch": 7436} {"train_loss": -27.94433072101639, "global_step": 617270, "epoch": 7436, "val_loss": 6598550.0} {"train_loss": -28.040130615234375, "global_step": 617271, "epoch": 7437} {"train_loss": -27.600122451782227, "global_step": 617272, "epoch": 7437} {"train_loss": -28.133636474609375, "global_step": 617273, "epoch": 7437} {"train_loss": -27.958301544189453, "global_step": 617274, "epoch": 7437} {"train_loss": -27.838468551635742, "global_step": 617275, "epoch": 7437} {"train_loss": -27.925092697143555, "global_step": 617276, "epoch": 7437} {"train_loss": -28.19373893737793, "global_step": 617277, "epoch": 7437} {"train_loss": -27.769886016845703, "global_step": 617278, "epoch": 7437} {"train_loss": -28.061105728149414, "global_step": 617279, "epoch": 7437} {"train_loss": -28.014307022094727, "global_step": 617280, "epoch": 7437} {"train_loss": -27.991636276245117, "global_step": 617281, "epoch": 7437} {"train_loss": -28.163837432861328, "global_step": 617282, "epoch": 7437} {"train_loss": -28.478168487548828, "global_step": 617283, "epoch": 7437} {"train_loss": -28.29400634765625, "global_step": 617284, "epoch": 7437} {"train_loss": -28.279754638671875, "global_step": 617285, "epoch": 7437} {"train_loss": -28.314727783203125, "global_step": 617286, "epoch": 7437} {"train_loss": -28.342697143554688, "global_step": 617287, "epoch": 7437} {"train_loss": -27.905622482299805, "global_step": 617288, "epoch": 7437} {"train_loss": -28.0533504486084, "global_step": 617289, "epoch": 7437} {"train_loss": -28.11567497253418, "global_step": 617290, "epoch": 7437} {"train_loss": -27.937469482421875, "global_step": 617291, "epoch": 7437} {"train_loss": -28.108814239501953, "global_step": 617292, "epoch": 7437} {"train_loss": -28.3497314453125, "global_step": 617293, "epoch": 7437} {"train_loss": -28.21044921875, "global_step": 617294, "epoch": 7437} {"train_loss": -28.211145401000977, "global_step": 617295, "epoch": 7437} {"train_loss": -28.09712791442871, "global_step": 617296, "epoch": 7437} {"train_loss": -28.5574951171875, "global_step": 617297, "epoch": 7437} {"train_loss": -28.355688095092773, "global_step": 617298, "epoch": 7437} {"train_loss": -28.458423614501953, "global_step": 617299, "epoch": 7437} {"train_loss": -28.177209854125977, "global_step": 617300, "epoch": 7437} {"train_loss": -28.2570743560791, "global_step": 617301, "epoch": 7437} {"train_loss": -28.309606552124023, "global_step": 617302, "epoch": 7437} {"train_loss": -28.166746139526367, "global_step": 617303, "epoch": 7437} {"train_loss": -28.489261627197266, "global_step": 617304, "epoch": 7437} {"train_loss": -28.231107711791992, "global_step": 617305, "epoch": 7437} {"train_loss": -28.349523544311523, "global_step": 617306, "epoch": 7437} {"train_loss": -28.389944076538086, "global_step": 617307, "epoch": 7437} {"train_loss": -28.449872970581055, "global_step": 617308, "epoch": 7437} {"train_loss": -28.289840698242188, "global_step": 617309, "epoch": 7437} {"train_loss": -28.074146270751953, "global_step": 617310, "epoch": 7437} {"train_loss": -28.417036056518555, "global_step": 617311, "epoch": 7437} {"train_loss": -28.400482177734375, "global_step": 617312, "epoch": 7437} {"train_loss": -28.291980743408203, "global_step": 617313, "epoch": 7437} {"train_loss": -28.486572265625, "global_step": 617314, "epoch": 7437} {"train_loss": -28.078031539916992, "global_step": 617315, "epoch": 7437} {"train_loss": -27.993610382080078, "global_step": 617316, "epoch": 7437} {"train_loss": -28.214054107666016, "global_step": 617317, "epoch": 7437} {"train_loss": -27.90802001953125, "global_step": 617318, "epoch": 7437} {"train_loss": -28.192121505737305, "global_step": 617319, "epoch": 7437} {"train_loss": -27.931135177612305, "global_step": 617320, "epoch": 7437} {"train_loss": -28.44141960144043, "global_step": 617321, "epoch": 7437} {"train_loss": -28.844274520874023, "global_step": 617322, "epoch": 7437} {"train_loss": -28.13522720336914, "global_step": 617323, "epoch": 7437} {"train_loss": -28.432336807250977, "global_step": 617324, "epoch": 7437} {"train_loss": -28.16623878479004, "global_step": 617325, "epoch": 7437} {"train_loss": -28.066598892211914, "global_step": 617326, "epoch": 7437} {"train_loss": -27.660480499267578, "global_step": 617327, "epoch": 7437} {"train_loss": -28.091999053955078, "global_step": 617328, "epoch": 7437} {"train_loss": -27.431791305541992, "global_step": 617329, "epoch": 7437} {"train_loss": -27.51629066467285, "global_step": 617330, "epoch": 7437} {"train_loss": -27.998056411743164, "global_step": 617331, "epoch": 7437} {"train_loss": -28.104421615600586, "global_step": 617332, "epoch": 7437} {"train_loss": -28.091068267822266, "global_step": 617333, "epoch": 7437} {"train_loss": -27.61575698852539, "global_step": 617334, "epoch": 7437} {"train_loss": -27.9561710357666, "global_step": 617335, "epoch": 7437} {"train_loss": -27.9742488861084, "global_step": 617336, "epoch": 7437} {"train_loss": -27.79108238220215, "global_step": 617337, "epoch": 7437} {"train_loss": -27.959461212158203, "global_step": 617338, "epoch": 7437} {"train_loss": -27.914230346679688, "global_step": 617339, "epoch": 7437} {"train_loss": -28.062641143798828, "global_step": 617340, "epoch": 7437} {"train_loss": -28.066574096679688, "global_step": 617341, "epoch": 7437} {"train_loss": -28.012256622314453, "global_step": 617342, "epoch": 7437} {"train_loss": -28.3546142578125, "global_step": 617343, "epoch": 7437} {"train_loss": -28.173933029174805, "global_step": 617344, "epoch": 7437} {"train_loss": -28.426115036010742, "global_step": 617345, "epoch": 7437} {"train_loss": -28.043701171875, "global_step": 617346, "epoch": 7437} {"train_loss": -28.12360191345215, "global_step": 617347, "epoch": 7437} {"train_loss": -27.97531509399414, "global_step": 617348, "epoch": 7437} {"train_loss": -28.20850944519043, "global_step": 617349, "epoch": 7437} {"train_loss": -28.264463424682617, "global_step": 617350, "epoch": 7437} {"train_loss": -28.199201583862305, "global_step": 617351, "epoch": 7437} {"train_loss": -28.1368408203125, "global_step": 617352, "epoch": 7437} {"train_loss": -28.12448885354651, "global_step": 617353, "epoch": 7437, "val_loss": 6570472.0} {"train_loss": -27.925989151000977, "global_step": 617354, "epoch": 7438} {"train_loss": -27.891143798828125, "global_step": 617355, "epoch": 7438} {"train_loss": -27.4824275970459, "global_step": 617356, "epoch": 7438} {"train_loss": -28.193359375, "global_step": 617357, "epoch": 7438} {"train_loss": -27.81879997253418, "global_step": 617358, "epoch": 7438} {"train_loss": -28.36224365234375, "global_step": 617359, "epoch": 7438} {"train_loss": -27.909021377563477, "global_step": 617360, "epoch": 7438} {"train_loss": -27.857587814331055, "global_step": 617361, "epoch": 7438} {"train_loss": -28.34457778930664, "global_step": 617362, "epoch": 7438} {"train_loss": -28.22015953063965, "global_step": 617363, "epoch": 7438} {"train_loss": -28.049901962280273, "global_step": 617364, "epoch": 7438} {"train_loss": -28.36712646484375, "global_step": 617365, "epoch": 7438} {"train_loss": -28.232147216796875, "global_step": 617366, "epoch": 7438} {"train_loss": -27.957544326782227, "global_step": 617367, "epoch": 7438} {"train_loss": -27.861103057861328, "global_step": 617368, "epoch": 7438} {"train_loss": -28.167795181274414, "global_step": 617369, "epoch": 7438} {"train_loss": -28.361753463745117, "global_step": 617370, "epoch": 7438} {"train_loss": -28.224628448486328, "global_step": 617371, "epoch": 7438} {"train_loss": -28.265024185180664, "global_step": 617372, "epoch": 7438} {"train_loss": -28.688034057617188, "global_step": 617373, "epoch": 7438} {"train_loss": -28.061986923217773, "global_step": 617374, "epoch": 7438} {"train_loss": -28.324970245361328, "global_step": 617375, "epoch": 7438} {"train_loss": -28.397720336914062, "global_step": 617376, "epoch": 7438} {"train_loss": -28.282617568969727, "global_step": 617377, "epoch": 7438} {"train_loss": -27.99798011779785, "global_step": 617378, "epoch": 7438} {"train_loss": -28.559179306030273, "global_step": 617379, "epoch": 7438} {"train_loss": -28.238866806030273, "global_step": 617380, "epoch": 7438} {"train_loss": -28.381750106811523, "global_step": 617381, "epoch": 7438} {"train_loss": -28.505247116088867, "global_step": 617382, "epoch": 7438} {"train_loss": -28.172250747680664, "global_step": 617383, "epoch": 7438} {"train_loss": -28.441192626953125, "global_step": 617384, "epoch": 7438} {"train_loss": -28.479856491088867, "global_step": 617385, "epoch": 7438} {"train_loss": -28.11866569519043, "global_step": 617386, "epoch": 7438} {"train_loss": -27.89285659790039, "global_step": 617387, "epoch": 7438} {"train_loss": -27.703237533569336, "global_step": 617388, "epoch": 7438} {"train_loss": -27.416223526000977, "global_step": 617389, "epoch": 7438} {"train_loss": -27.434680938720703, "global_step": 617390, "epoch": 7438} {"train_loss": -28.112030029296875, "global_step": 617391, "epoch": 7438} {"train_loss": -28.31928825378418, "global_step": 617392, "epoch": 7438} {"train_loss": -27.064252853393555, "global_step": 617393, "epoch": 7438} {"train_loss": -27.221948623657227, "global_step": 617394, "epoch": 7438} {"train_loss": -27.849334716796875, "global_step": 617395, "epoch": 7438} {"train_loss": -27.267724990844727, "global_step": 617396, "epoch": 7438} {"train_loss": -28.1458740234375, "global_step": 617397, "epoch": 7438} {"train_loss": -27.871631622314453, "global_step": 617398, "epoch": 7438} {"train_loss": -27.865827560424805, "global_step": 617399, "epoch": 7438} {"train_loss": -28.406103134155273, "global_step": 617400, "epoch": 7438} {"train_loss": -27.7918643951416, "global_step": 617401, "epoch": 7438} {"train_loss": -27.555707931518555, "global_step": 617402, "epoch": 7438} {"train_loss": -28.038694381713867, "global_step": 617403, "epoch": 7438} {"train_loss": -27.772979736328125, "global_step": 617404, "epoch": 7438} {"train_loss": -27.951953887939453, "global_step": 617405, "epoch": 7438} {"train_loss": -27.846302032470703, "global_step": 617406, "epoch": 7438} {"train_loss": -28.180438995361328, "global_step": 617407, "epoch": 7438} {"train_loss": -28.040746688842773, "global_step": 617408, "epoch": 7438} {"train_loss": -27.869958877563477, "global_step": 617409, "epoch": 7438} {"train_loss": -27.982458114624023, "global_step": 617410, "epoch": 7438} {"train_loss": -28.022729873657227, "global_step": 617411, "epoch": 7438} {"train_loss": -28.122608184814453, "global_step": 617412, "epoch": 7438} {"train_loss": -27.898229598999023, "global_step": 617413, "epoch": 7438} {"train_loss": -27.86701011657715, "global_step": 617414, "epoch": 7438} {"train_loss": -27.653196334838867, "global_step": 617415, "epoch": 7438} {"train_loss": -27.2938289642334, "global_step": 617416, "epoch": 7438} {"train_loss": -27.77046012878418, "global_step": 617417, "epoch": 7438} {"train_loss": -27.9428653717041, "global_step": 617418, "epoch": 7438} {"train_loss": -27.383840560913086, "global_step": 617419, "epoch": 7438} {"train_loss": -27.62409782409668, "global_step": 617420, "epoch": 7438} {"train_loss": -28.495269775390625, "global_step": 617421, "epoch": 7438} {"train_loss": -27.917465209960938, "global_step": 617422, "epoch": 7438} {"train_loss": -28.0405216217041, "global_step": 617423, "epoch": 7438} {"train_loss": -27.924097061157227, "global_step": 617424, "epoch": 7438} {"train_loss": -28.021869659423828, "global_step": 617425, "epoch": 7438} {"train_loss": -28.2139949798584, "global_step": 617426, "epoch": 7438} {"train_loss": -27.7746639251709, "global_step": 617427, "epoch": 7438} {"train_loss": -27.9451847076416, "global_step": 617428, "epoch": 7438} {"train_loss": -28.403512954711914, "global_step": 617429, "epoch": 7438} {"train_loss": -27.834522247314453, "global_step": 617430, "epoch": 7438} {"train_loss": -28.28415298461914, "global_step": 617431, "epoch": 7438} {"train_loss": -27.944616317749023, "global_step": 617432, "epoch": 7438} {"train_loss": -27.82892417907715, "global_step": 617433, "epoch": 7438} {"train_loss": -28.140050888061523, "global_step": 617434, "epoch": 7438} {"train_loss": -27.738849639892578, "global_step": 617435, "epoch": 7438} {"train_loss": -27.99487681561206, "global_step": 617436, "epoch": 7438, "val_loss": 6610864.0} {"train_loss": -27.189664840698242, "global_step": 617437, "epoch": 7439} {"train_loss": -25.026042938232422, "global_step": 617438, "epoch": 7439} {"train_loss": -23.35822296142578, "global_step": 617439, "epoch": 7439} {"train_loss": -24.39174461364746, "global_step": 617440, "epoch": 7439} {"train_loss": -26.450916290283203, "global_step": 617441, "epoch": 7439} {"train_loss": -26.180448532104492, "global_step": 617442, "epoch": 7439} {"train_loss": -25.842191696166992, "global_step": 617443, "epoch": 7439} {"train_loss": -26.331777572631836, "global_step": 617444, "epoch": 7439} {"train_loss": -26.771121978759766, "global_step": 617445, "epoch": 7439} {"train_loss": -26.321063995361328, "global_step": 617446, "epoch": 7439} {"train_loss": -27.38237953186035, "global_step": 617447, "epoch": 7439} {"train_loss": -27.04237174987793, "global_step": 617448, "epoch": 7439} {"train_loss": -27.03243064880371, "global_step": 617449, "epoch": 7439} {"train_loss": -27.534423828125, "global_step": 617450, "epoch": 7439} {"train_loss": -27.206085205078125, "global_step": 617451, "epoch": 7439} {"train_loss": -26.70851707458496, "global_step": 617452, "epoch": 7439} {"train_loss": -27.615137100219727, "global_step": 617453, "epoch": 7439} {"train_loss": -27.3991641998291, "global_step": 617454, "epoch": 7439} {"train_loss": -27.151418685913086, "global_step": 617455, "epoch": 7439} {"train_loss": -27.08729362487793, "global_step": 617456, "epoch": 7439} {"train_loss": -27.470264434814453, "global_step": 617457, "epoch": 7439} {"train_loss": -27.565153121948242, "global_step": 617458, "epoch": 7439} {"train_loss": -27.392621994018555, "global_step": 617459, "epoch": 7439} {"train_loss": -27.470945358276367, "global_step": 617460, "epoch": 7439} {"train_loss": -27.641382217407227, "global_step": 617461, "epoch": 7439} {"train_loss": -27.51999855041504, "global_step": 617462, "epoch": 7439} {"train_loss": -27.495710372924805, "global_step": 617463, "epoch": 7439} {"train_loss": -27.451663970947266, "global_step": 617464, "epoch": 7439} {"train_loss": -27.29803466796875, "global_step": 617465, "epoch": 7439} {"train_loss": -27.917638778686523, "global_step": 617466, "epoch": 7439} {"train_loss": -27.72212028503418, "global_step": 617467, "epoch": 7439} {"train_loss": -27.733503341674805, "global_step": 617468, "epoch": 7439} {"train_loss": -28.06331443786621, "global_step": 617469, "epoch": 7439} {"train_loss": -27.716083526611328, "global_step": 617470, "epoch": 7439} {"train_loss": -27.894006729125977, "global_step": 617471, "epoch": 7439} {"train_loss": -27.777515411376953, "global_step": 617472, "epoch": 7439} {"train_loss": -28.186277389526367, "global_step": 617473, "epoch": 7439} {"train_loss": -27.95631217956543, "global_step": 617474, "epoch": 7439} {"train_loss": -27.609649658203125, "global_step": 617475, "epoch": 7439} {"train_loss": -28.50789451599121, "global_step": 617476, "epoch": 7439} {"train_loss": -27.764453887939453, "global_step": 617477, "epoch": 7439} {"train_loss": -27.4979248046875, "global_step": 617478, "epoch": 7439} {"train_loss": -27.91107749938965, "global_step": 617479, "epoch": 7439} {"train_loss": -27.901212692260742, "global_step": 617480, "epoch": 7439} {"train_loss": -27.825336456298828, "global_step": 617481, "epoch": 7439} {"train_loss": -28.001951217651367, "global_step": 617482, "epoch": 7439} {"train_loss": -27.95475196838379, "global_step": 617483, "epoch": 7439} {"train_loss": -28.318532943725586, "global_step": 617484, "epoch": 7439} {"train_loss": -28.383209228515625, "global_step": 617485, "epoch": 7439} {"train_loss": -28.12019157409668, "global_step": 617486, "epoch": 7439} {"train_loss": -27.50750732421875, "global_step": 617487, "epoch": 7439} {"train_loss": -27.507226943969727, "global_step": 617488, "epoch": 7439} {"train_loss": -27.56296157836914, "global_step": 617489, "epoch": 7439} {"train_loss": -27.258161544799805, "global_step": 617490, "epoch": 7439} {"train_loss": -27.66643714904785, "global_step": 617491, "epoch": 7439} {"train_loss": -27.73982048034668, "global_step": 617492, "epoch": 7439} {"train_loss": -27.9137020111084, "global_step": 617493, "epoch": 7439} {"train_loss": -27.711780548095703, "global_step": 617494, "epoch": 7439} {"train_loss": -27.72568130493164, "global_step": 617495, "epoch": 7439} {"train_loss": -28.18561363220215, "global_step": 617496, "epoch": 7439} {"train_loss": -28.425735473632812, "global_step": 617497, "epoch": 7439} {"train_loss": -27.889562606811523, "global_step": 617498, "epoch": 7439} {"train_loss": -27.811506271362305, "global_step": 617499, "epoch": 7439} {"train_loss": -27.959888458251953, "global_step": 617500, "epoch": 7439} {"train_loss": -28.208515167236328, "global_step": 617501, "epoch": 7439} {"train_loss": -28.001081466674805, "global_step": 617502, "epoch": 7439} {"train_loss": -28.198720932006836, "global_step": 617503, "epoch": 7439} {"train_loss": -28.1866455078125, "global_step": 617504, "epoch": 7439} {"train_loss": -27.995702743530273, "global_step": 617505, "epoch": 7439} {"train_loss": -28.196439743041992, "global_step": 617506, "epoch": 7439} {"train_loss": -28.0869083404541, "global_step": 617507, "epoch": 7439} {"train_loss": -27.784290313720703, "global_step": 617508, "epoch": 7439} {"train_loss": -28.260229110717773, "global_step": 617509, "epoch": 7439} {"train_loss": -27.955480575561523, "global_step": 617510, "epoch": 7439} {"train_loss": -27.812360763549805, "global_step": 617511, "epoch": 7439} {"train_loss": -27.95509910583496, "global_step": 617512, "epoch": 7439} {"train_loss": -28.443838119506836, "global_step": 617513, "epoch": 7439} {"train_loss": -27.78070640563965, "global_step": 617514, "epoch": 7439} {"train_loss": -27.971176147460938, "global_step": 617515, "epoch": 7439} {"train_loss": -28.69345474243164, "global_step": 617516, "epoch": 7439} {"train_loss": -27.81162452697754, "global_step": 617517, "epoch": 7439} {"train_loss": -27.924612045288086, "global_step": 617518, "epoch": 7439} {"train_loss": -27.538857908134002, "global_step": 617519, "epoch": 7439, "val_loss": 6553031.0} {"train_loss": -26.251684188842773, "global_step": 617520, "epoch": 7440} {"train_loss": -25.2730712890625, "global_step": 617521, "epoch": 7440} {"train_loss": -26.874225616455078, "global_step": 617522, "epoch": 7440} {"train_loss": -27.11211585998535, "global_step": 617523, "epoch": 7440} {"train_loss": -27.434064865112305, "global_step": 617524, "epoch": 7440} {"train_loss": -27.126943588256836, "global_step": 617525, "epoch": 7440} {"train_loss": -27.371007919311523, "global_step": 617526, "epoch": 7440} {"train_loss": -27.44777488708496, "global_step": 617527, "epoch": 7440} {"train_loss": -27.51045036315918, "global_step": 617528, "epoch": 7440} {"train_loss": -27.145299911499023, "global_step": 617529, "epoch": 7440} {"train_loss": -27.4530029296875, "global_step": 617530, "epoch": 7440} {"train_loss": -27.3931827545166, "global_step": 617531, "epoch": 7440} {"train_loss": -27.64816665649414, "global_step": 617532, "epoch": 7440} {"train_loss": -27.657806396484375, "global_step": 617533, "epoch": 7440} {"train_loss": -27.376317977905273, "global_step": 617534, "epoch": 7440} {"train_loss": -27.853124618530273, "global_step": 617535, "epoch": 7440} {"train_loss": -27.787891387939453, "global_step": 617536, "epoch": 7440} {"train_loss": -27.555038452148438, "global_step": 617537, "epoch": 7440} {"train_loss": -27.63124656677246, "global_step": 617538, "epoch": 7440} {"train_loss": -27.935842514038086, "global_step": 617539, "epoch": 7440} {"train_loss": -28.06536865234375, "global_step": 617540, "epoch": 7440} {"train_loss": -27.6734619140625, "global_step": 617541, "epoch": 7440} {"train_loss": -27.996610641479492, "global_step": 617542, "epoch": 7440} {"train_loss": -27.7834415435791, "global_step": 617543, "epoch": 7440} {"train_loss": -28.080961227416992, "global_step": 617544, "epoch": 7440} {"train_loss": -28.15595817565918, "global_step": 617545, "epoch": 7440} {"train_loss": -27.78500747680664, "global_step": 617546, "epoch": 7440} {"train_loss": -27.969928741455078, "global_step": 617547, "epoch": 7440} {"train_loss": -27.7264404296875, "global_step": 617548, "epoch": 7440} {"train_loss": -28.185861587524414, "global_step": 617549, "epoch": 7440} {"train_loss": -27.715015411376953, "global_step": 617550, "epoch": 7440} {"train_loss": -27.523412704467773, "global_step": 617551, "epoch": 7440} {"train_loss": -28.121992111206055, "global_step": 617552, "epoch": 7440} {"train_loss": -28.010656356811523, "global_step": 617553, "epoch": 7440} {"train_loss": -28.0101375579834, "global_step": 617554, "epoch": 7440} {"train_loss": -28.207563400268555, "global_step": 617555, "epoch": 7440} {"train_loss": -27.884952545166016, "global_step": 617556, "epoch": 7440} {"train_loss": -28.18634033203125, "global_step": 617557, "epoch": 7440} {"train_loss": -28.224414825439453, "global_step": 617558, "epoch": 7440} {"train_loss": -28.112478256225586, "global_step": 617559, "epoch": 7440} {"train_loss": -28.375946044921875, "global_step": 617560, "epoch": 7440} {"train_loss": -28.48480796813965, "global_step": 617561, "epoch": 7440} {"train_loss": -28.16236686706543, "global_step": 617562, "epoch": 7440} {"train_loss": -27.578399658203125, "global_step": 617563, "epoch": 7440} {"train_loss": -28.198251724243164, "global_step": 617564, "epoch": 7440} {"train_loss": -28.195409774780273, "global_step": 617565, "epoch": 7440} {"train_loss": -28.08979606628418, "global_step": 617566, "epoch": 7440} {"train_loss": -28.146381378173828, "global_step": 617567, "epoch": 7440} {"train_loss": -27.96046257019043, "global_step": 617568, "epoch": 7440} {"train_loss": -27.977216720581055, "global_step": 617569, "epoch": 7440} {"train_loss": -28.119049072265625, "global_step": 617570, "epoch": 7440} {"train_loss": -28.104909896850586, "global_step": 617571, "epoch": 7440} {"train_loss": -28.20088005065918, "global_step": 617572, "epoch": 7440} {"train_loss": -28.1110782623291, "global_step": 617573, "epoch": 7440} {"train_loss": -28.0924129486084, "global_step": 617574, "epoch": 7440} {"train_loss": -28.02493667602539, "global_step": 617575, "epoch": 7440} {"train_loss": -27.57904052734375, "global_step": 617576, "epoch": 7440} {"train_loss": -27.97871208190918, "global_step": 617577, "epoch": 7440} {"train_loss": -27.72051429748535, "global_step": 617578, "epoch": 7440} {"train_loss": -27.794692993164062, "global_step": 617579, "epoch": 7440} {"train_loss": -27.857343673706055, "global_step": 617580, "epoch": 7440} {"train_loss": -28.146459579467773, "global_step": 617581, "epoch": 7440} {"train_loss": -28.490070343017578, "global_step": 617582, "epoch": 7440} {"train_loss": -28.420135498046875, "global_step": 617583, "epoch": 7440} {"train_loss": -28.0245418548584, "global_step": 617584, "epoch": 7440} {"train_loss": -28.28655433654785, "global_step": 617585, "epoch": 7440} {"train_loss": -27.966663360595703, "global_step": 617586, "epoch": 7440} {"train_loss": -28.298131942749023, "global_step": 617587, "epoch": 7440} {"train_loss": -28.214365005493164, "global_step": 617588, "epoch": 7440} {"train_loss": -28.298675537109375, "global_step": 617589, "epoch": 7440} {"train_loss": -28.171979904174805, "global_step": 617590, "epoch": 7440} {"train_loss": -28.68280601501465, "global_step": 617591, "epoch": 7440} {"train_loss": -27.965576171875, "global_step": 617592, "epoch": 7440} {"train_loss": -27.90582275390625, "global_step": 617593, "epoch": 7440} {"train_loss": -27.924108505249023, "global_step": 617594, "epoch": 7440} {"train_loss": -27.6761531829834, "global_step": 617595, "epoch": 7440} {"train_loss": -28.420669555664062, "global_step": 617596, "epoch": 7440} {"train_loss": -28.429691314697266, "global_step": 617597, "epoch": 7440} {"train_loss": -28.195898056030273, "global_step": 617598, "epoch": 7440} {"train_loss": -27.99268913269043, "global_step": 617599, "epoch": 7440} {"train_loss": -28.011091232299805, "global_step": 617600, "epoch": 7440} {"train_loss": -27.858722686767578, "global_step": 617601, "epoch": 7440} {"train_loss": -27.8887927963073, "global_step": 617602, "epoch": 7440, "val_loss": 6578186.0} {"train_loss": -28.158536911010742, "global_step": 617603, "epoch": 7441} {"train_loss": -27.655292510986328, "global_step": 617604, "epoch": 7441} {"train_loss": -27.86188316345215, "global_step": 617605, "epoch": 7441} {"train_loss": -27.8090877532959, "global_step": 617606, "epoch": 7441} {"train_loss": -28.504907608032227, "global_step": 617607, "epoch": 7441} {"train_loss": -28.01785659790039, "global_step": 617608, "epoch": 7441} {"train_loss": -27.82954978942871, "global_step": 617609, "epoch": 7441} {"train_loss": -27.99061393737793, "global_step": 617610, "epoch": 7441} {"train_loss": -27.736841201782227, "global_step": 617611, "epoch": 7441} {"train_loss": -28.101221084594727, "global_step": 617612, "epoch": 7441} {"train_loss": -27.88357925415039, "global_step": 617613, "epoch": 7441} {"train_loss": -28.50337028503418, "global_step": 617614, "epoch": 7441} {"train_loss": -27.731719970703125, "global_step": 617615, "epoch": 7441} {"train_loss": -27.678735733032227, "global_step": 617616, "epoch": 7441} {"train_loss": -28.048490524291992, "global_step": 617617, "epoch": 7441} {"train_loss": -28.11087417602539, "global_step": 617618, "epoch": 7441} {"train_loss": -28.506275177001953, "global_step": 617619, "epoch": 7441} {"train_loss": -28.14691162109375, "global_step": 617620, "epoch": 7441} {"train_loss": -28.135812759399414, "global_step": 617621, "epoch": 7441} {"train_loss": -27.9827880859375, "global_step": 617622, "epoch": 7441} {"train_loss": -27.697660446166992, "global_step": 617623, "epoch": 7441} {"train_loss": -28.0617733001709, "global_step": 617624, "epoch": 7441} {"train_loss": -27.635129928588867, "global_step": 617625, "epoch": 7441} {"train_loss": -28.301366806030273, "global_step": 617626, "epoch": 7441} {"train_loss": -27.685827255249023, "global_step": 617627, "epoch": 7441} {"train_loss": -27.99640464782715, "global_step": 617628, "epoch": 7441} {"train_loss": -28.031787872314453, "global_step": 617629, "epoch": 7441} {"train_loss": -28.113819122314453, "global_step": 617630, "epoch": 7441} {"train_loss": -28.17576026916504, "global_step": 617631, "epoch": 7441} {"train_loss": -27.987462997436523, "global_step": 617632, "epoch": 7441} {"train_loss": -27.749164581298828, "global_step": 617633, "epoch": 7441} {"train_loss": -27.78468894958496, "global_step": 617634, "epoch": 7441} {"train_loss": -27.948633193969727, "global_step": 617635, "epoch": 7441} {"train_loss": -27.681903839111328, "global_step": 617636, "epoch": 7441} {"train_loss": -28.20826530456543, "global_step": 617637, "epoch": 7441} {"train_loss": -27.90988540649414, "global_step": 617638, "epoch": 7441} {"train_loss": -27.98823356628418, "global_step": 617639, "epoch": 7441} {"train_loss": -28.170988082885742, "global_step": 617640, "epoch": 7441} {"train_loss": -28.072641372680664, "global_step": 617641, "epoch": 7441} {"train_loss": -28.4180850982666, "global_step": 617642, "epoch": 7441} {"train_loss": -27.74431800842285, "global_step": 617643, "epoch": 7441} {"train_loss": -28.187061309814453, "global_step": 617644, "epoch": 7441} {"train_loss": -27.99650001525879, "global_step": 617645, "epoch": 7441} {"train_loss": -28.134952545166016, "global_step": 617646, "epoch": 7441} {"train_loss": -27.959924697875977, "global_step": 617647, "epoch": 7441} {"train_loss": -28.281696319580078, "global_step": 617648, "epoch": 7441} {"train_loss": -28.200071334838867, "global_step": 617649, "epoch": 7441} {"train_loss": -28.31109046936035, "global_step": 617650, "epoch": 7441} {"train_loss": -28.16828727722168, "global_step": 617651, "epoch": 7441} {"train_loss": -28.099536895751953, "global_step": 617652, "epoch": 7441} {"train_loss": -28.292394638061523, "global_step": 617653, "epoch": 7441} {"train_loss": -28.14508628845215, "global_step": 617654, "epoch": 7441} {"train_loss": -28.409229278564453, "global_step": 617655, "epoch": 7441} {"train_loss": -28.242279052734375, "global_step": 617656, "epoch": 7441} {"train_loss": -28.420124053955078, "global_step": 617657, "epoch": 7441} {"train_loss": -28.26655387878418, "global_step": 617658, "epoch": 7441} {"train_loss": -27.938501358032227, "global_step": 617659, "epoch": 7441} {"train_loss": -28.764245986938477, "global_step": 617660, "epoch": 7441} {"train_loss": -28.14886474609375, "global_step": 617661, "epoch": 7441} {"train_loss": -28.62128257751465, "global_step": 617662, "epoch": 7441} {"train_loss": -28.361053466796875, "global_step": 617663, "epoch": 7441} {"train_loss": -28.18027114868164, "global_step": 617664, "epoch": 7441} {"train_loss": -28.429792404174805, "global_step": 617665, "epoch": 7441} {"train_loss": -28.559534072875977, "global_step": 617666, "epoch": 7441} {"train_loss": -28.0736083984375, "global_step": 617667, "epoch": 7441} {"train_loss": -28.0953369140625, "global_step": 617668, "epoch": 7441} {"train_loss": -27.797748565673828, "global_step": 617669, "epoch": 7441} {"train_loss": -27.80820083618164, "global_step": 617670, "epoch": 7441} {"train_loss": -27.922454833984375, "global_step": 617671, "epoch": 7441} {"train_loss": -28.322057723999023, "global_step": 617672, "epoch": 7441} {"train_loss": -28.36414909362793, "global_step": 617673, "epoch": 7441} {"train_loss": -27.908674240112305, "global_step": 617674, "epoch": 7441} {"train_loss": -28.430789947509766, "global_step": 617675, "epoch": 7441} {"train_loss": -28.089462280273438, "global_step": 617676, "epoch": 7441} {"train_loss": -28.32792091369629, "global_step": 617677, "epoch": 7441} {"train_loss": -27.992841720581055, "global_step": 617678, "epoch": 7441} {"train_loss": -28.38772964477539, "global_step": 617679, "epoch": 7441} {"train_loss": -28.700366973876953, "global_step": 617680, "epoch": 7441} {"train_loss": -28.205890655517578, "global_step": 617681, "epoch": 7441} {"train_loss": -27.914779663085938, "global_step": 617682, "epoch": 7441} {"train_loss": -28.2850284576416, "global_step": 617683, "epoch": 7441} {"train_loss": -27.944089889526367, "global_step": 617684, "epoch": 7441} {"train_loss": -28.10925957093756, "global_step": 617685, "epoch": 7441, "val_loss": 6616994.0} {"train_loss": -27.639007568359375, "global_step": 617686, "epoch": 7442} {"train_loss": -27.542280197143555, "global_step": 617687, "epoch": 7442} {"train_loss": -27.502721786499023, "global_step": 617688, "epoch": 7442} {"train_loss": -27.40378189086914, "global_step": 617689, "epoch": 7442} {"train_loss": -27.3732852935791, "global_step": 617690, "epoch": 7442} {"train_loss": -27.050933837890625, "global_step": 617691, "epoch": 7442} {"train_loss": -27.551374435424805, "global_step": 617692, "epoch": 7442} {"train_loss": -27.758691787719727, "global_step": 617693, "epoch": 7442} {"train_loss": -27.750354766845703, "global_step": 617694, "epoch": 7442} {"train_loss": -27.437397003173828, "global_step": 617695, "epoch": 7442} {"train_loss": -27.8332462310791, "global_step": 617696, "epoch": 7442} {"train_loss": -27.170530319213867, "global_step": 617697, "epoch": 7442} {"train_loss": -27.76242446899414, "global_step": 617698, "epoch": 7442} {"train_loss": -27.990015029907227, "global_step": 617699, "epoch": 7442} {"train_loss": -27.9162540435791, "global_step": 617700, "epoch": 7442} {"train_loss": -27.94742202758789, "global_step": 617701, "epoch": 7442} {"train_loss": -28.036725997924805, "global_step": 617702, "epoch": 7442} {"train_loss": -27.84913444519043, "global_step": 617703, "epoch": 7442} {"train_loss": -27.51629638671875, "global_step": 617704, "epoch": 7442} {"train_loss": -27.60016441345215, "global_step": 617705, "epoch": 7442} {"train_loss": -28.442829132080078, "global_step": 617706, "epoch": 7442} {"train_loss": -28.22096061706543, "global_step": 617707, "epoch": 7442} {"train_loss": -27.997486114501953, "global_step": 617708, "epoch": 7442} {"train_loss": -28.33163833618164, "global_step": 617709, "epoch": 7442} {"train_loss": -28.11138343811035, "global_step": 617710, "epoch": 7442} {"train_loss": -28.29082679748535, "global_step": 617711, "epoch": 7442} {"train_loss": -28.29182243347168, "global_step": 617712, "epoch": 7442} {"train_loss": -27.899084091186523, "global_step": 617713, "epoch": 7442} {"train_loss": -28.01816749572754, "global_step": 617714, "epoch": 7442} {"train_loss": -28.276763916015625, "global_step": 617715, "epoch": 7442} {"train_loss": -28.131696701049805, "global_step": 617716, "epoch": 7442} {"train_loss": -28.117450714111328, "global_step": 617717, "epoch": 7442} {"train_loss": -28.10089111328125, "global_step": 617718, "epoch": 7442} {"train_loss": -27.984577178955078, "global_step": 617719, "epoch": 7442} {"train_loss": -27.986536026000977, "global_step": 617720, "epoch": 7442} {"train_loss": -28.212186813354492, "global_step": 617721, "epoch": 7442} {"train_loss": -28.205053329467773, "global_step": 617722, "epoch": 7442} {"train_loss": -28.106616973876953, "global_step": 617723, "epoch": 7442} {"train_loss": -28.319839477539062, "global_step": 617724, "epoch": 7442} {"train_loss": -28.117095947265625, "global_step": 617725, "epoch": 7442} {"train_loss": -28.37470054626465, "global_step": 617726, "epoch": 7442} {"train_loss": -28.11102867126465, "global_step": 617727, "epoch": 7442} {"train_loss": -28.2752628326416, "global_step": 617728, "epoch": 7442} {"train_loss": -28.13018226623535, "global_step": 617729, "epoch": 7442} {"train_loss": -28.473651885986328, "global_step": 617730, "epoch": 7442} {"train_loss": -28.368671417236328, "global_step": 617731, "epoch": 7442} {"train_loss": -28.483016967773438, "global_step": 617732, "epoch": 7442} {"train_loss": -28.213144302368164, "global_step": 617733, "epoch": 7442} {"train_loss": -28.24469566345215, "global_step": 617734, "epoch": 7442} {"train_loss": -27.935354232788086, "global_step": 617735, "epoch": 7442} {"train_loss": -28.031509399414062, "global_step": 617736, "epoch": 7442} {"train_loss": -28.213092803955078, "global_step": 617737, "epoch": 7442} {"train_loss": -27.753293991088867, "global_step": 617738, "epoch": 7442} {"train_loss": -28.35782241821289, "global_step": 617739, "epoch": 7442} {"train_loss": -27.836200714111328, "global_step": 617740, "epoch": 7442} {"train_loss": -28.314905166625977, "global_step": 617741, "epoch": 7442} {"train_loss": -28.088027954101562, "global_step": 617742, "epoch": 7442} {"train_loss": -28.021198272705078, "global_step": 617743, "epoch": 7442} {"train_loss": -27.931488037109375, "global_step": 617744, "epoch": 7442} {"train_loss": -27.571109771728516, "global_step": 617745, "epoch": 7442} {"train_loss": -27.916311264038086, "global_step": 617746, "epoch": 7442} {"train_loss": -28.216482162475586, "global_step": 617747, "epoch": 7442} {"train_loss": -28.080347061157227, "global_step": 617748, "epoch": 7442} {"train_loss": -27.980182647705078, "global_step": 617749, "epoch": 7442} {"train_loss": -27.898258209228516, "global_step": 617750, "epoch": 7442} {"train_loss": -28.034332275390625, "global_step": 617751, "epoch": 7442} {"train_loss": -28.328231811523438, "global_step": 617752, "epoch": 7442} {"train_loss": -28.214282989501953, "global_step": 617753, "epoch": 7442} {"train_loss": -28.529272079467773, "global_step": 617754, "epoch": 7442} {"train_loss": -28.392316818237305, "global_step": 617755, "epoch": 7442} {"train_loss": -27.920827865600586, "global_step": 617756, "epoch": 7442} {"train_loss": -28.216327667236328, "global_step": 617757, "epoch": 7442} {"train_loss": -28.47272300720215, "global_step": 617758, "epoch": 7442} {"train_loss": -28.027097702026367, "global_step": 617759, "epoch": 7442} {"train_loss": -28.262908935546875, "global_step": 617760, "epoch": 7442} {"train_loss": -27.90205192565918, "global_step": 617761, "epoch": 7442} {"train_loss": -28.0625057220459, "global_step": 617762, "epoch": 7442} {"train_loss": -28.064115524291992, "global_step": 617763, "epoch": 7442} {"train_loss": -27.803983688354492, "global_step": 617764, "epoch": 7442} {"train_loss": -28.139240264892578, "global_step": 617765, "epoch": 7442} {"train_loss": -28.1965389251709, "global_step": 617766, "epoch": 7442} {"train_loss": -28.344892501831055, "global_step": 617767, "epoch": 7442} {"train_loss": -28.024242561983776, "global_step": 617768, "epoch": 7442, "val_loss": 6599080.0} {"train_loss": -28.1547794342041, "global_step": 617769, "epoch": 7443} {"train_loss": -27.80877113342285, "global_step": 617770, "epoch": 7443} {"train_loss": -27.543869018554688, "global_step": 617771, "epoch": 7443} {"train_loss": -27.681509017944336, "global_step": 617772, "epoch": 7443} {"train_loss": -27.8990421295166, "global_step": 617773, "epoch": 7443} {"train_loss": -27.732614517211914, "global_step": 617774, "epoch": 7443} {"train_loss": -27.755935668945312, "global_step": 617775, "epoch": 7443} {"train_loss": -28.19746208190918, "global_step": 617776, "epoch": 7443} {"train_loss": -28.146642684936523, "global_step": 617777, "epoch": 7443} {"train_loss": -27.72646141052246, "global_step": 617778, "epoch": 7443} {"train_loss": -28.19048500061035, "global_step": 617779, "epoch": 7443} {"train_loss": -28.06396484375, "global_step": 617780, "epoch": 7443} {"train_loss": -28.016849517822266, "global_step": 617781, "epoch": 7443} {"train_loss": -27.97354507446289, "global_step": 617782, "epoch": 7443} {"train_loss": -27.82039451599121, "global_step": 617783, "epoch": 7443} {"train_loss": -27.81595230102539, "global_step": 617784, "epoch": 7443} {"train_loss": -28.0410213470459, "global_step": 617785, "epoch": 7443} {"train_loss": -28.09556007385254, "global_step": 617786, "epoch": 7443} {"train_loss": -27.97743034362793, "global_step": 617787, "epoch": 7443} {"train_loss": -27.9892520904541, "global_step": 617788, "epoch": 7443} {"train_loss": -27.873565673828125, "global_step": 617789, "epoch": 7443} {"train_loss": -28.237945556640625, "global_step": 617790, "epoch": 7443} {"train_loss": -27.882062911987305, "global_step": 617791, "epoch": 7443} {"train_loss": -28.194421768188477, "global_step": 617792, "epoch": 7443} {"train_loss": -28.321857452392578, "global_step": 617793, "epoch": 7443} {"train_loss": -28.1497745513916, "global_step": 617794, "epoch": 7443} {"train_loss": -28.317890167236328, "global_step": 617795, "epoch": 7443} {"train_loss": -27.891223907470703, "global_step": 617796, "epoch": 7443} {"train_loss": -28.05219841003418, "global_step": 617797, "epoch": 7443} {"train_loss": -28.076587677001953, "global_step": 617798, "epoch": 7443} {"train_loss": -27.849843978881836, "global_step": 617799, "epoch": 7443} {"train_loss": -28.275440216064453, "global_step": 617800, "epoch": 7443} {"train_loss": -28.217487335205078, "global_step": 617801, "epoch": 7443} {"train_loss": -27.7905216217041, "global_step": 617802, "epoch": 7443} {"train_loss": -28.4509220123291, "global_step": 617803, "epoch": 7443} {"train_loss": -28.234464645385742, "global_step": 617804, "epoch": 7443} {"train_loss": -28.072223663330078, "global_step": 617805, "epoch": 7443} {"train_loss": -28.537084579467773, "global_step": 617806, "epoch": 7443} {"train_loss": -28.072423934936523, "global_step": 617807, "epoch": 7443} {"train_loss": -28.402692794799805, "global_step": 617808, "epoch": 7443} {"train_loss": -28.0760440826416, "global_step": 617809, "epoch": 7443} {"train_loss": -27.82024574279785, "global_step": 617810, "epoch": 7443} {"train_loss": -28.247074127197266, "global_step": 617811, "epoch": 7443} {"train_loss": -27.99081802368164, "global_step": 617812, "epoch": 7443} {"train_loss": -28.154987335205078, "global_step": 617813, "epoch": 7443} {"train_loss": -28.331464767456055, "global_step": 617814, "epoch": 7443} {"train_loss": -27.84787368774414, "global_step": 617815, "epoch": 7443} {"train_loss": -28.266584396362305, "global_step": 617816, "epoch": 7443} {"train_loss": -28.10515785217285, "global_step": 617817, "epoch": 7443} {"train_loss": -28.36014175415039, "global_step": 617818, "epoch": 7443} {"train_loss": -28.205402374267578, "global_step": 617819, "epoch": 7443} {"train_loss": -27.850818634033203, "global_step": 617820, "epoch": 7443} {"train_loss": -27.85114860534668, "global_step": 617821, "epoch": 7443} {"train_loss": -28.260351181030273, "global_step": 617822, "epoch": 7443} {"train_loss": -27.98394775390625, "global_step": 617823, "epoch": 7443} {"train_loss": -28.109952926635742, "global_step": 617824, "epoch": 7443} {"train_loss": -28.625812530517578, "global_step": 617825, "epoch": 7443} {"train_loss": -27.993513107299805, "global_step": 617826, "epoch": 7443} {"train_loss": -28.077722549438477, "global_step": 617827, "epoch": 7443} {"train_loss": -28.723285675048828, "global_step": 617828, "epoch": 7443} {"train_loss": -28.35163688659668, "global_step": 617829, "epoch": 7443} {"train_loss": -28.382871627807617, "global_step": 617830, "epoch": 7443} {"train_loss": -28.54994010925293, "global_step": 617831, "epoch": 7443} {"train_loss": -28.128026962280273, "global_step": 617832, "epoch": 7443} {"train_loss": -27.956838607788086, "global_step": 617833, "epoch": 7443} {"train_loss": -28.479846954345703, "global_step": 617834, "epoch": 7443} {"train_loss": -28.318313598632812, "global_step": 617835, "epoch": 7443} {"train_loss": -28.03677749633789, "global_step": 617836, "epoch": 7443} {"train_loss": -28.521533966064453, "global_step": 617837, "epoch": 7443} {"train_loss": -28.329008102416992, "global_step": 617838, "epoch": 7443} {"train_loss": -28.285593032836914, "global_step": 617839, "epoch": 7443} {"train_loss": -28.25592041015625, "global_step": 617840, "epoch": 7443} {"train_loss": -28.2613582611084, "global_step": 617841, "epoch": 7443} {"train_loss": -28.27789878845215, "global_step": 617842, "epoch": 7443} {"train_loss": -28.29230308532715, "global_step": 617843, "epoch": 7443} {"train_loss": -28.649343490600586, "global_step": 617844, "epoch": 7443} {"train_loss": -28.012210845947266, "global_step": 617845, "epoch": 7443} {"train_loss": -28.2246150970459, "global_step": 617846, "epoch": 7443} {"train_loss": -28.27522087097168, "global_step": 617847, "epoch": 7443} {"train_loss": -28.20789909362793, "global_step": 617848, "epoch": 7443} {"train_loss": -28.236474990844727, "global_step": 617849, "epoch": 7443} {"train_loss": -27.997793197631836, "global_step": 617850, "epoch": 7443} {"train_loss": -28.1319064404591, "global_step": 617851, "epoch": 7443, "val_loss": 6664325.0} {"train_loss": -27.231143951416016, "global_step": 617852, "epoch": 7444} {"train_loss": -26.666467666625977, "global_step": 617853, "epoch": 7444} {"train_loss": -27.761478424072266, "global_step": 617854, "epoch": 7444} {"train_loss": -27.287500381469727, "global_step": 617855, "epoch": 7444} {"train_loss": -26.85498046875, "global_step": 617856, "epoch": 7444} {"train_loss": -27.170154571533203, "global_step": 617857, "epoch": 7444} {"train_loss": -24.787662506103516, "global_step": 617858, "epoch": 7444} {"train_loss": -26.701431274414062, "global_step": 617859, "epoch": 7444} {"train_loss": -26.323156356811523, "global_step": 617860, "epoch": 7444} {"train_loss": -25.923120498657227, "global_step": 617861, "epoch": 7444} {"train_loss": -27.28558921813965, "global_step": 617862, "epoch": 7444} {"train_loss": -26.811269760131836, "global_step": 617863, "epoch": 7444} {"train_loss": -26.798009872436523, "global_step": 617864, "epoch": 7444} {"train_loss": -26.509143829345703, "global_step": 617865, "epoch": 7444} {"train_loss": -27.36663818359375, "global_step": 617866, "epoch": 7444} {"train_loss": -26.1784725189209, "global_step": 617867, "epoch": 7444} {"train_loss": -27.229703903198242, "global_step": 617868, "epoch": 7444} {"train_loss": -27.25394058227539, "global_step": 617869, "epoch": 7444} {"train_loss": -27.52032470703125, "global_step": 617870, "epoch": 7444} {"train_loss": -27.441604614257812, "global_step": 617871, "epoch": 7444} {"train_loss": -27.684728622436523, "global_step": 617872, "epoch": 7444} {"train_loss": -27.430316925048828, "global_step": 617873, "epoch": 7444} {"train_loss": -26.97149085998535, "global_step": 617874, "epoch": 7444} {"train_loss": -27.421875, "global_step": 617875, "epoch": 7444} {"train_loss": -27.248157501220703, "global_step": 617876, "epoch": 7444} {"train_loss": -27.40203857421875, "global_step": 617877, "epoch": 7444} {"train_loss": -27.30380630493164, "global_step": 617878, "epoch": 7444} {"train_loss": -27.545515060424805, "global_step": 617879, "epoch": 7444} {"train_loss": -27.426069259643555, "global_step": 617880, "epoch": 7444} {"train_loss": -27.550262451171875, "global_step": 617881, "epoch": 7444} {"train_loss": -27.91376304626465, "global_step": 617882, "epoch": 7444} {"train_loss": -27.70075035095215, "global_step": 617883, "epoch": 7444} {"train_loss": -28.05841064453125, "global_step": 617884, "epoch": 7444} {"train_loss": -27.605127334594727, "global_step": 617885, "epoch": 7444} {"train_loss": -27.753360748291016, "global_step": 617886, "epoch": 7444} {"train_loss": -27.942197799682617, "global_step": 617887, "epoch": 7444} {"train_loss": -28.0189266204834, "global_step": 617888, "epoch": 7444} {"train_loss": -28.016637802124023, "global_step": 617889, "epoch": 7444} {"train_loss": -27.94610023498535, "global_step": 617890, "epoch": 7444} {"train_loss": -27.774518966674805, "global_step": 617891, "epoch": 7444} {"train_loss": -27.94490623474121, "global_step": 617892, "epoch": 7444} {"train_loss": -27.809707641601562, "global_step": 617893, "epoch": 7444} {"train_loss": -27.861841201782227, "global_step": 617894, "epoch": 7444} {"train_loss": -27.85676383972168, "global_step": 617895, "epoch": 7444} {"train_loss": -28.12969398498535, "global_step": 617896, "epoch": 7444} {"train_loss": -28.387908935546875, "global_step": 617897, "epoch": 7444} {"train_loss": -28.03704261779785, "global_step": 617898, "epoch": 7444} {"train_loss": -28.283557891845703, "global_step": 617899, "epoch": 7444} {"train_loss": -28.123870849609375, "global_step": 617900, "epoch": 7444} {"train_loss": -28.025564193725586, "global_step": 617901, "epoch": 7444} {"train_loss": -28.09738540649414, "global_step": 617902, "epoch": 7444} {"train_loss": -28.228357315063477, "global_step": 617903, "epoch": 7444} {"train_loss": -28.255598068237305, "global_step": 617904, "epoch": 7444} {"train_loss": -28.653776168823242, "global_step": 617905, "epoch": 7444} {"train_loss": -28.285276412963867, "global_step": 617906, "epoch": 7444} {"train_loss": -28.32915687561035, "global_step": 617907, "epoch": 7444} {"train_loss": -28.357086181640625, "global_step": 617908, "epoch": 7444} {"train_loss": -28.381229400634766, "global_step": 617909, "epoch": 7444} {"train_loss": -28.049962997436523, "global_step": 617910, "epoch": 7444} {"train_loss": -28.72210693359375, "global_step": 617911, "epoch": 7444} {"train_loss": -28.2906551361084, "global_step": 617912, "epoch": 7444} {"train_loss": -28.403976440429688, "global_step": 617913, "epoch": 7444} {"train_loss": -28.3364315032959, "global_step": 617914, "epoch": 7444} {"train_loss": -28.09845542907715, "global_step": 617915, "epoch": 7444} {"train_loss": -28.231658935546875, "global_step": 617916, "epoch": 7444} {"train_loss": -28.27146339416504, "global_step": 617917, "epoch": 7444} {"train_loss": -28.132505416870117, "global_step": 617918, "epoch": 7444} {"train_loss": -28.030853271484375, "global_step": 617919, "epoch": 7444} {"train_loss": -27.923398971557617, "global_step": 617920, "epoch": 7444} {"train_loss": -28.223363876342773, "global_step": 617921, "epoch": 7444} {"train_loss": -27.615636825561523, "global_step": 617922, "epoch": 7444} {"train_loss": -27.683813095092773, "global_step": 617923, "epoch": 7444} {"train_loss": -27.991830825805664, "global_step": 617924, "epoch": 7444} {"train_loss": -27.80659294128418, "global_step": 617925, "epoch": 7444} {"train_loss": -27.555866241455078, "global_step": 617926, "epoch": 7444} {"train_loss": -28.179157257080078, "global_step": 617927, "epoch": 7444} {"train_loss": -27.584707260131836, "global_step": 617928, "epoch": 7444} {"train_loss": -28.21243667602539, "global_step": 617929, "epoch": 7444} {"train_loss": -27.99185562133789, "global_step": 617930, "epoch": 7444} {"train_loss": -27.716764450073242, "global_step": 617931, "epoch": 7444} {"train_loss": -27.8680362701416, "global_step": 617932, "epoch": 7444} {"train_loss": -28.009662628173828, "global_step": 617933, "epoch": 7444} {"train_loss": -27.681323913206537, "global_step": 617934, "epoch": 7444, "val_loss": 6613361.5} {"train_loss": -26.715002059936523, "global_step": 617935, "epoch": 7445} {"train_loss": -25.383508682250977, "global_step": 617936, "epoch": 7445} {"train_loss": -26.489465713500977, "global_step": 617937, "epoch": 7445} {"train_loss": -27.553552627563477, "global_step": 617938, "epoch": 7445} {"train_loss": -26.3783016204834, "global_step": 617939, "epoch": 7445} {"train_loss": -27.631433486938477, "global_step": 617940, "epoch": 7445} {"train_loss": -27.1939697265625, "global_step": 617941, "epoch": 7445} {"train_loss": -27.596426010131836, "global_step": 617942, "epoch": 7445} {"train_loss": -26.945783615112305, "global_step": 617943, "epoch": 7445} {"train_loss": -28.163373947143555, "global_step": 617944, "epoch": 7445} {"train_loss": -27.195341110229492, "global_step": 617945, "epoch": 7445} {"train_loss": -28.002246856689453, "global_step": 617946, "epoch": 7445} {"train_loss": -27.50445556640625, "global_step": 617947, "epoch": 7445} {"train_loss": -27.770944595336914, "global_step": 617948, "epoch": 7445} {"train_loss": -27.548749923706055, "global_step": 617949, "epoch": 7445} {"train_loss": -27.32618522644043, "global_step": 617950, "epoch": 7445} {"train_loss": -28.02473258972168, "global_step": 617951, "epoch": 7445} {"train_loss": -27.850147247314453, "global_step": 617952, "epoch": 7445} {"train_loss": -27.86724281311035, "global_step": 617953, "epoch": 7445} {"train_loss": -27.607648849487305, "global_step": 617954, "epoch": 7445} {"train_loss": -27.805435180664062, "global_step": 617955, "epoch": 7445} {"train_loss": -27.666736602783203, "global_step": 617956, "epoch": 7445} {"train_loss": -27.914709091186523, "global_step": 617957, "epoch": 7445} {"train_loss": -27.8734073638916, "global_step": 617958, "epoch": 7445} {"train_loss": -27.495542526245117, "global_step": 617959, "epoch": 7445} {"train_loss": -27.76702308654785, "global_step": 617960, "epoch": 7445} {"train_loss": -27.81744956970215, "global_step": 617961, "epoch": 7445} {"train_loss": -27.857309341430664, "global_step": 617962, "epoch": 7445} {"train_loss": -28.005414962768555, "global_step": 617963, "epoch": 7445} {"train_loss": -27.458057403564453, "global_step": 617964, "epoch": 7445} {"train_loss": -27.872283935546875, "global_step": 617965, "epoch": 7445} {"train_loss": -28.056232452392578, "global_step": 617966, "epoch": 7445} {"train_loss": -28.08330726623535, "global_step": 617967, "epoch": 7445} {"train_loss": -28.02410316467285, "global_step": 617968, "epoch": 7445} {"train_loss": -28.047470092773438, "global_step": 617969, "epoch": 7445} {"train_loss": -28.60028076171875, "global_step": 617970, "epoch": 7445} {"train_loss": -28.100971221923828, "global_step": 617971, "epoch": 7445} {"train_loss": -28.208459854125977, "global_step": 617972, "epoch": 7445} {"train_loss": -28.196563720703125, "global_step": 617973, "epoch": 7445} {"train_loss": -27.976276397705078, "global_step": 617974, "epoch": 7445} {"train_loss": -28.272451400756836, "global_step": 617975, "epoch": 7445} {"train_loss": -28.4294490814209, "global_step": 617976, "epoch": 7445} {"train_loss": -27.981794357299805, "global_step": 617977, "epoch": 7445} {"train_loss": -27.848493576049805, "global_step": 617978, "epoch": 7445} {"train_loss": -28.3088321685791, "global_step": 617979, "epoch": 7445} {"train_loss": -28.33949089050293, "global_step": 617980, "epoch": 7445} {"train_loss": -28.004718780517578, "global_step": 617981, "epoch": 7445} {"train_loss": -28.359968185424805, "global_step": 617982, "epoch": 7445} {"train_loss": -28.309696197509766, "global_step": 617983, "epoch": 7445} {"train_loss": -28.397199630737305, "global_step": 617984, "epoch": 7445} {"train_loss": -28.49811363220215, "global_step": 617985, "epoch": 7445} {"train_loss": -27.934356689453125, "global_step": 617986, "epoch": 7445} {"train_loss": -28.211029052734375, "global_step": 617987, "epoch": 7445} {"train_loss": -28.361295700073242, "global_step": 617988, "epoch": 7445} {"train_loss": -27.69232749938965, "global_step": 617989, "epoch": 7445} {"train_loss": -27.99611473083496, "global_step": 617990, "epoch": 7445} {"train_loss": -28.236114501953125, "global_step": 617991, "epoch": 7445} {"train_loss": -28.046035766601562, "global_step": 617992, "epoch": 7445} {"train_loss": -28.489538192749023, "global_step": 617993, "epoch": 7445} {"train_loss": -28.21457290649414, "global_step": 617994, "epoch": 7445} {"train_loss": -28.33478355407715, "global_step": 617995, "epoch": 7445} {"train_loss": -28.053577423095703, "global_step": 617996, "epoch": 7445} {"train_loss": -28.021997451782227, "global_step": 617997, "epoch": 7445} {"train_loss": -28.522876739501953, "global_step": 617998, "epoch": 7445} {"train_loss": -28.32984733581543, "global_step": 617999, "epoch": 7445} {"train_loss": -28.195898056030273, "global_step": 618000, "epoch": 7445} {"train_loss": -27.726255416870117, "global_step": 618001, "epoch": 7445} {"train_loss": -28.646310806274414, "global_step": 618002, "epoch": 7445} {"train_loss": -27.863147735595703, "global_step": 618003, "epoch": 7445} {"train_loss": -28.153125762939453, "global_step": 618004, "epoch": 7445} {"train_loss": -28.134122848510742, "global_step": 618005, "epoch": 7445} {"train_loss": -28.013830184936523, "global_step": 618006, "epoch": 7445} {"train_loss": -27.888586044311523, "global_step": 618007, "epoch": 7445} {"train_loss": -27.730188369750977, "global_step": 618008, "epoch": 7445} {"train_loss": -27.704055786132812, "global_step": 618009, "epoch": 7445} {"train_loss": -27.662445068359375, "global_step": 618010, "epoch": 7445} {"train_loss": -28.091053009033203, "global_step": 618011, "epoch": 7445} {"train_loss": -27.989782333374023, "global_step": 618012, "epoch": 7445} {"train_loss": -28.33979606628418, "global_step": 618013, "epoch": 7445} {"train_loss": -28.091705322265625, "global_step": 618014, "epoch": 7445} {"train_loss": -27.6843318939209, "global_step": 618015, "epoch": 7445} {"train_loss": -28.31595230102539, "global_step": 618016, "epoch": 7445} {"train_loss": -27.901322698018635, "global_step": 618017, "epoch": 7445, "val_loss": 6715193.0} {"train_loss": -26.834674835205078, "global_step": 618018, "epoch": 7446} {"train_loss": -27.244516372680664, "global_step": 618019, "epoch": 7446} {"train_loss": -27.373693466186523, "global_step": 618020, "epoch": 7446} {"train_loss": -27.217267990112305, "global_step": 618021, "epoch": 7446} {"train_loss": -27.356536865234375, "global_step": 618022, "epoch": 7446} {"train_loss": -27.483118057250977, "global_step": 618023, "epoch": 7446} {"train_loss": -27.763906478881836, "global_step": 618024, "epoch": 7446} {"train_loss": -27.708526611328125, "global_step": 618025, "epoch": 7446} {"train_loss": -27.530059814453125, "global_step": 618026, "epoch": 7446} {"train_loss": -27.9041690826416, "global_step": 618027, "epoch": 7446} {"train_loss": -27.79890251159668, "global_step": 618028, "epoch": 7446} {"train_loss": -27.583402633666992, "global_step": 618029, "epoch": 7446} {"train_loss": -27.556915283203125, "global_step": 618030, "epoch": 7446} {"train_loss": -27.687469482421875, "global_step": 618031, "epoch": 7446} {"train_loss": -27.845930099487305, "global_step": 618032, "epoch": 7446} {"train_loss": -27.6993350982666, "global_step": 618033, "epoch": 7446} {"train_loss": -27.70180320739746, "global_step": 618034, "epoch": 7446} {"train_loss": -27.81092643737793, "global_step": 618035, "epoch": 7446} {"train_loss": -28.164941787719727, "global_step": 618036, "epoch": 7446} {"train_loss": -27.91098976135254, "global_step": 618037, "epoch": 7446} {"train_loss": -28.205474853515625, "global_step": 618038, "epoch": 7446} {"train_loss": -28.057708740234375, "global_step": 618039, "epoch": 7446} {"train_loss": -28.113346099853516, "global_step": 618040, "epoch": 7446} {"train_loss": -27.838916778564453, "global_step": 618041, "epoch": 7446} {"train_loss": -28.02667808532715, "global_step": 618042, "epoch": 7446} {"train_loss": -28.119287490844727, "global_step": 618043, "epoch": 7446} {"train_loss": -27.984893798828125, "global_step": 618044, "epoch": 7446} {"train_loss": -28.351184844970703, "global_step": 618045, "epoch": 7446} {"train_loss": -28.50886344909668, "global_step": 618046, "epoch": 7446} {"train_loss": -28.17193603515625, "global_step": 618047, "epoch": 7446} {"train_loss": -28.225830078125, "global_step": 618048, "epoch": 7446} {"train_loss": -28.3160400390625, "global_step": 618049, "epoch": 7446} {"train_loss": -28.161834716796875, "global_step": 618050, "epoch": 7446} {"train_loss": -28.37778091430664, "global_step": 618051, "epoch": 7446} {"train_loss": -28.3166561126709, "global_step": 618052, "epoch": 7446} {"train_loss": -28.12519645690918, "global_step": 618053, "epoch": 7446} {"train_loss": -28.183124542236328, "global_step": 618054, "epoch": 7446} {"train_loss": -27.91328239440918, "global_step": 618055, "epoch": 7446} {"train_loss": -28.117292404174805, "global_step": 618056, "epoch": 7446} {"train_loss": -28.359298706054688, "global_step": 618057, "epoch": 7446} {"train_loss": -28.160009384155273, "global_step": 618058, "epoch": 7446} {"train_loss": -28.40447998046875, "global_step": 618059, "epoch": 7446} {"train_loss": -28.35733985900879, "global_step": 618060, "epoch": 7446} {"train_loss": -28.505340576171875, "global_step": 618061, "epoch": 7446} {"train_loss": -28.393308639526367, "global_step": 618062, "epoch": 7446} {"train_loss": -28.054920196533203, "global_step": 618063, "epoch": 7446} {"train_loss": -28.347736358642578, "global_step": 618064, "epoch": 7446} {"train_loss": -28.021347045898438, "global_step": 618065, "epoch": 7446} {"train_loss": -28.388248443603516, "global_step": 618066, "epoch": 7446} {"train_loss": -28.3280029296875, "global_step": 618067, "epoch": 7446} {"train_loss": -27.926801681518555, "global_step": 618068, "epoch": 7446} {"train_loss": -28.20257568359375, "global_step": 618069, "epoch": 7446} {"train_loss": -28.168415069580078, "global_step": 618070, "epoch": 7446} {"train_loss": -27.922216415405273, "global_step": 618071, "epoch": 7446} {"train_loss": -28.46262550354004, "global_step": 618072, "epoch": 7446} {"train_loss": -28.27703285217285, "global_step": 618073, "epoch": 7446} {"train_loss": -28.506689071655273, "global_step": 618074, "epoch": 7446} {"train_loss": -28.218952178955078, "global_step": 618075, "epoch": 7446} {"train_loss": -27.631677627563477, "global_step": 618076, "epoch": 7446} {"train_loss": -27.91901206970215, "global_step": 618077, "epoch": 7446} {"train_loss": -28.262744903564453, "global_step": 618078, "epoch": 7446} {"train_loss": -28.009449005126953, "global_step": 618079, "epoch": 7446} {"train_loss": -27.774824142456055, "global_step": 618080, "epoch": 7446} {"train_loss": -27.407312393188477, "global_step": 618081, "epoch": 7446} {"train_loss": -27.315048217773438, "global_step": 618082, "epoch": 7446} {"train_loss": -27.023731231689453, "global_step": 618083, "epoch": 7446} {"train_loss": -26.87421989440918, "global_step": 618084, "epoch": 7446} {"train_loss": -27.85957145690918, "global_step": 618085, "epoch": 7446} {"train_loss": -27.7258243560791, "global_step": 618086, "epoch": 7446} {"train_loss": -27.262434005737305, "global_step": 618087, "epoch": 7446} {"train_loss": -26.528888702392578, "global_step": 618088, "epoch": 7446} {"train_loss": -27.436735153198242, "global_step": 618089, "epoch": 7446} {"train_loss": -27.520994186401367, "global_step": 618090, "epoch": 7446} {"train_loss": -27.194005966186523, "global_step": 618091, "epoch": 7446} {"train_loss": -27.56926918029785, "global_step": 618092, "epoch": 7446} {"train_loss": -28.1448917388916, "global_step": 618093, "epoch": 7446} {"train_loss": -27.52655029296875, "global_step": 618094, "epoch": 7446} {"train_loss": -27.65057945251465, "global_step": 618095, "epoch": 7446} {"train_loss": -27.5662899017334, "global_step": 618096, "epoch": 7446} {"train_loss": -27.70192527770996, "global_step": 618097, "epoch": 7446} {"train_loss": -27.766401290893555, "global_step": 618098, "epoch": 7446} {"train_loss": -27.481470108032227, "global_step": 618099, "epoch": 7446} {"train_loss": -27.85304007472762, "global_step": 618100, "epoch": 7446, "val_loss": 6834435.0} {"train_loss": -27.36573600769043, "global_step": 618101, "epoch": 7447} {"train_loss": -27.817407608032227, "global_step": 618102, "epoch": 7447} {"train_loss": -27.549070358276367, "global_step": 618103, "epoch": 7447} {"train_loss": -28.004430770874023, "global_step": 618104, "epoch": 7447} {"train_loss": -27.316068649291992, "global_step": 618105, "epoch": 7447} {"train_loss": -27.818500518798828, "global_step": 618106, "epoch": 7447} {"train_loss": -27.72015953063965, "global_step": 618107, "epoch": 7447} {"train_loss": -27.656055450439453, "global_step": 618108, "epoch": 7447} {"train_loss": -27.85316276550293, "global_step": 618109, "epoch": 7447} {"train_loss": -28.15457534790039, "global_step": 618110, "epoch": 7447} {"train_loss": -27.9283390045166, "global_step": 618111, "epoch": 7447} {"train_loss": -27.835180282592773, "global_step": 618112, "epoch": 7447} {"train_loss": -28.413358688354492, "global_step": 618113, "epoch": 7447} {"train_loss": -28.07515525817871, "global_step": 618114, "epoch": 7447} {"train_loss": -27.771326065063477, "global_step": 618115, "epoch": 7447} {"train_loss": -28.073333740234375, "global_step": 618116, "epoch": 7447} {"train_loss": -28.52350425720215, "global_step": 618117, "epoch": 7447} {"train_loss": -28.39655113220215, "global_step": 618118, "epoch": 7447} {"train_loss": -28.14585304260254, "global_step": 618119, "epoch": 7447} {"train_loss": -27.936628341674805, "global_step": 618120, "epoch": 7447} {"train_loss": -28.337255477905273, "global_step": 618121, "epoch": 7447} {"train_loss": -28.472171783447266, "global_step": 618122, "epoch": 7447} {"train_loss": -28.429950714111328, "global_step": 618123, "epoch": 7447} {"train_loss": -28.17769432067871, "global_step": 618124, "epoch": 7447} {"train_loss": -28.296518325805664, "global_step": 618125, "epoch": 7447} {"train_loss": -28.206384658813477, "global_step": 618126, "epoch": 7447} {"train_loss": -28.397613525390625, "global_step": 618127, "epoch": 7447} {"train_loss": -28.167444229125977, "global_step": 618128, "epoch": 7447} {"train_loss": -28.209136962890625, "global_step": 618129, "epoch": 7447} {"train_loss": -28.2552547454834, "global_step": 618130, "epoch": 7447} {"train_loss": -28.09198570251465, "global_step": 618131, "epoch": 7447} {"train_loss": -28.105213165283203, "global_step": 618132, "epoch": 7447} {"train_loss": -28.141677856445312, "global_step": 618133, "epoch": 7447} {"train_loss": -28.51031494140625, "global_step": 618134, "epoch": 7447} {"train_loss": -28.96698570251465, "global_step": 618135, "epoch": 7447} {"train_loss": -27.9833927154541, "global_step": 618136, "epoch": 7447} {"train_loss": -28.399145126342773, "global_step": 618137, "epoch": 7447} {"train_loss": -28.100732803344727, "global_step": 618138, "epoch": 7447} {"train_loss": -28.598587036132812, "global_step": 618139, "epoch": 7447} {"train_loss": -28.089191436767578, "global_step": 618140, "epoch": 7447} {"train_loss": -27.990142822265625, "global_step": 618141, "epoch": 7447} {"train_loss": -28.043622970581055, "global_step": 618142, "epoch": 7447} {"train_loss": -27.986495971679688, "global_step": 618143, "epoch": 7447} {"train_loss": -28.25385856628418, "global_step": 618144, "epoch": 7447} {"train_loss": -28.12247085571289, "global_step": 618145, "epoch": 7447} {"train_loss": -28.465015411376953, "global_step": 618146, "epoch": 7447} {"train_loss": -28.1907958984375, "global_step": 618147, "epoch": 7447} {"train_loss": -28.547382354736328, "global_step": 618148, "epoch": 7447} {"train_loss": -28.112186431884766, "global_step": 618149, "epoch": 7447} {"train_loss": -28.57122802734375, "global_step": 618150, "epoch": 7447} {"train_loss": -28.13490104675293, "global_step": 618151, "epoch": 7447} {"train_loss": -28.549575805664062, "global_step": 618152, "epoch": 7447} {"train_loss": -28.522857666015625, "global_step": 618153, "epoch": 7447} {"train_loss": -28.273468017578125, "global_step": 618154, "epoch": 7447} {"train_loss": -28.464649200439453, "global_step": 618155, "epoch": 7447} {"train_loss": -28.221637725830078, "global_step": 618156, "epoch": 7447} {"train_loss": -27.83369255065918, "global_step": 618157, "epoch": 7447} {"train_loss": -27.880834579467773, "global_step": 618158, "epoch": 7447} {"train_loss": -27.76616859436035, "global_step": 618159, "epoch": 7447} {"train_loss": -27.47315788269043, "global_step": 618160, "epoch": 7447} {"train_loss": -27.119916915893555, "global_step": 618161, "epoch": 7447} {"train_loss": -27.910968780517578, "global_step": 618162, "epoch": 7447} {"train_loss": -27.715717315673828, "global_step": 618163, "epoch": 7447} {"train_loss": -27.836027145385742, "global_step": 618164, "epoch": 7447} {"train_loss": -27.87678337097168, "global_step": 618165, "epoch": 7447} {"train_loss": -28.196125030517578, "global_step": 618166, "epoch": 7447} {"train_loss": -27.991718292236328, "global_step": 618167, "epoch": 7447} {"train_loss": -28.006702423095703, "global_step": 618168, "epoch": 7447} {"train_loss": -28.081470489501953, "global_step": 618169, "epoch": 7447} {"train_loss": -28.369054794311523, "global_step": 618170, "epoch": 7447} {"train_loss": -28.290124893188477, "global_step": 618171, "epoch": 7447} {"train_loss": -27.64594841003418, "global_step": 618172, "epoch": 7447} {"train_loss": -28.2670841217041, "global_step": 618173, "epoch": 7447} {"train_loss": -28.115991592407227, "global_step": 618174, "epoch": 7447} {"train_loss": -28.11982536315918, "global_step": 618175, "epoch": 7447} {"train_loss": -27.976072311401367, "global_step": 618176, "epoch": 7447} {"train_loss": -27.978673934936523, "global_step": 618177, "epoch": 7447} {"train_loss": -28.19512367248535, "global_step": 618178, "epoch": 7447} {"train_loss": -28.65082359313965, "global_step": 618179, "epoch": 7447} {"train_loss": -28.243101119995117, "global_step": 618180, "epoch": 7447} {"train_loss": -27.8829402923584, "global_step": 618181, "epoch": 7447} {"train_loss": -28.185749053955078, "global_step": 618182, "epoch": 7447} {"train_loss": -28.116189657923687, "global_step": 618183, "epoch": 7447, "val_loss": 6772921.5} {"train_loss": -27.509933471679688, "global_step": 618184, "epoch": 7448} {"train_loss": -27.477832794189453, "global_step": 618185, "epoch": 7448} {"train_loss": -27.8714599609375, "global_step": 618186, "epoch": 7448} {"train_loss": -27.53887367248535, "global_step": 618187, "epoch": 7448} {"train_loss": -27.941741943359375, "global_step": 618188, "epoch": 7448} {"train_loss": -27.930648803710938, "global_step": 618189, "epoch": 7448} {"train_loss": -27.52730369567871, "global_step": 618190, "epoch": 7448} {"train_loss": -27.419189453125, "global_step": 618191, "epoch": 7448} {"train_loss": -27.9014835357666, "global_step": 618192, "epoch": 7448} {"train_loss": -27.969099044799805, "global_step": 618193, "epoch": 7448} {"train_loss": -28.057531356811523, "global_step": 618194, "epoch": 7448} {"train_loss": -27.89862060546875, "global_step": 618195, "epoch": 7448} {"train_loss": -28.012693405151367, "global_step": 618196, "epoch": 7448} {"train_loss": -27.900754928588867, "global_step": 618197, "epoch": 7448} {"train_loss": -28.001367568969727, "global_step": 618198, "epoch": 7448} {"train_loss": -28.0518856048584, "global_step": 618199, "epoch": 7448} {"train_loss": -28.156171798706055, "global_step": 618200, "epoch": 7448} {"train_loss": -28.263059616088867, "global_step": 618201, "epoch": 7448} {"train_loss": -27.963422775268555, "global_step": 618202, "epoch": 7448} {"train_loss": -27.9447078704834, "global_step": 618203, "epoch": 7448} {"train_loss": -27.795562744140625, "global_step": 618204, "epoch": 7448} {"train_loss": -27.96455192565918, "global_step": 618205, "epoch": 7448} {"train_loss": -28.182147979736328, "global_step": 618206, "epoch": 7448} {"train_loss": -28.42620849609375, "global_step": 618207, "epoch": 7448} {"train_loss": -28.13734245300293, "global_step": 618208, "epoch": 7448} {"train_loss": -28.136926651000977, "global_step": 618209, "epoch": 7448} {"train_loss": -28.11163330078125, "global_step": 618210, "epoch": 7448} {"train_loss": -28.09955406188965, "global_step": 618211, "epoch": 7448} {"train_loss": -28.34559440612793, "global_step": 618212, "epoch": 7448} {"train_loss": -28.204925537109375, "global_step": 618213, "epoch": 7448} {"train_loss": -28.480865478515625, "global_step": 618214, "epoch": 7448} {"train_loss": -28.263513565063477, "global_step": 618215, "epoch": 7448} {"train_loss": -27.954914093017578, "global_step": 618216, "epoch": 7448} {"train_loss": -28.031553268432617, "global_step": 618217, "epoch": 7448} {"train_loss": -28.01796531677246, "global_step": 618218, "epoch": 7448} {"train_loss": -28.2221622467041, "global_step": 618219, "epoch": 7448} {"train_loss": -28.0364933013916, "global_step": 618220, "epoch": 7448} {"train_loss": -27.9270076751709, "global_step": 618221, "epoch": 7448} {"train_loss": -28.080732345581055, "global_step": 618222, "epoch": 7448} {"train_loss": -28.152240753173828, "global_step": 618223, "epoch": 7448} {"train_loss": -28.046789169311523, "global_step": 618224, "epoch": 7448} {"train_loss": -28.300806045532227, "global_step": 618225, "epoch": 7448} {"train_loss": -28.22902488708496, "global_step": 618226, "epoch": 7448} {"train_loss": -27.7642822265625, "global_step": 618227, "epoch": 7448} {"train_loss": -28.108373641967773, "global_step": 618228, "epoch": 7448} {"train_loss": -27.981367111206055, "global_step": 618229, "epoch": 7448} {"train_loss": -28.102514266967773, "global_step": 618230, "epoch": 7448} {"train_loss": -28.015432357788086, "global_step": 618231, "epoch": 7448} {"train_loss": -28.476093292236328, "global_step": 618232, "epoch": 7448} {"train_loss": -27.961322784423828, "global_step": 618233, "epoch": 7448} {"train_loss": -27.93995475769043, "global_step": 618234, "epoch": 7448} {"train_loss": -28.27217674255371, "global_step": 618235, "epoch": 7448} {"train_loss": -28.210317611694336, "global_step": 618236, "epoch": 7448} {"train_loss": -28.09402847290039, "global_step": 618237, "epoch": 7448} {"train_loss": -28.320722579956055, "global_step": 618238, "epoch": 7448} {"train_loss": -27.929920196533203, "global_step": 618239, "epoch": 7448} {"train_loss": -28.26922607421875, "global_step": 618240, "epoch": 7448} {"train_loss": -27.92279624938965, "global_step": 618241, "epoch": 7448} {"train_loss": -28.008163452148438, "global_step": 618242, "epoch": 7448} {"train_loss": -28.203296661376953, "global_step": 618243, "epoch": 7448} {"train_loss": -28.412290573120117, "global_step": 618244, "epoch": 7448} {"train_loss": -28.02471923828125, "global_step": 618245, "epoch": 7448} {"train_loss": -27.978363037109375, "global_step": 618246, "epoch": 7448} {"train_loss": -28.241811752319336, "global_step": 618247, "epoch": 7448} {"train_loss": -28.01129150390625, "global_step": 618248, "epoch": 7448} {"train_loss": -28.632490158081055, "global_step": 618249, "epoch": 7448} {"train_loss": -28.27888298034668, "global_step": 618250, "epoch": 7448} {"train_loss": -28.197174072265625, "global_step": 618251, "epoch": 7448} {"train_loss": -28.27973747253418, "global_step": 618252, "epoch": 7448} {"train_loss": -27.88898277282715, "global_step": 618253, "epoch": 7448} {"train_loss": -27.960580825805664, "global_step": 618254, "epoch": 7448} {"train_loss": -28.56113624572754, "global_step": 618255, "epoch": 7448} {"train_loss": -28.294031143188477, "global_step": 618256, "epoch": 7448} {"train_loss": -28.011423110961914, "global_step": 618257, "epoch": 7448} {"train_loss": -28.383529663085938, "global_step": 618258, "epoch": 7448} {"train_loss": -28.13300895690918, "global_step": 618259, "epoch": 7448} {"train_loss": -27.89751625061035, "global_step": 618260, "epoch": 7448} {"train_loss": -28.030994415283203, "global_step": 618261, "epoch": 7448} {"train_loss": -28.312824249267578, "global_step": 618262, "epoch": 7448} {"train_loss": -28.117101669311523, "global_step": 618263, "epoch": 7448} {"train_loss": -28.0760498046875, "global_step": 618264, "epoch": 7448} {"train_loss": -28.25249671936035, "global_step": 618265, "epoch": 7448} {"train_loss": -28.08192839105445, "global_step": 618266, "epoch": 7448, "val_loss": 6831897.0} {"train_loss": -28.08420753479004, "global_step": 618267, "epoch": 7449} {"train_loss": -27.955602645874023, "global_step": 618268, "epoch": 7449} {"train_loss": -28.182804107666016, "global_step": 618269, "epoch": 7449} {"train_loss": -27.737030029296875, "global_step": 618270, "epoch": 7449} {"train_loss": -28.4912166595459, "global_step": 618271, "epoch": 7449} {"train_loss": -27.65419578552246, "global_step": 618272, "epoch": 7449} {"train_loss": -27.97120475769043, "global_step": 618273, "epoch": 7449} {"train_loss": -28.13602066040039, "global_step": 618274, "epoch": 7449} {"train_loss": -28.079755783081055, "global_step": 618275, "epoch": 7449} {"train_loss": -27.86164665222168, "global_step": 618276, "epoch": 7449} {"train_loss": -28.043989181518555, "global_step": 618277, "epoch": 7449} {"train_loss": -28.49201774597168, "global_step": 618278, "epoch": 7449} {"train_loss": -28.07671546936035, "global_step": 618279, "epoch": 7449} {"train_loss": -28.148168563842773, "global_step": 618280, "epoch": 7449} {"train_loss": -27.950849533081055, "global_step": 618281, "epoch": 7449} {"train_loss": -27.960784912109375, "global_step": 618282, "epoch": 7449} {"train_loss": -27.733966827392578, "global_step": 618283, "epoch": 7449} {"train_loss": -27.52445411682129, "global_step": 618284, "epoch": 7449} {"train_loss": -28.08099937438965, "global_step": 618285, "epoch": 7449} {"train_loss": -28.138086318969727, "global_step": 618286, "epoch": 7449} {"train_loss": -28.392597198486328, "global_step": 618287, "epoch": 7449} {"train_loss": -27.897476196289062, "global_step": 618288, "epoch": 7449} {"train_loss": -27.9744930267334, "global_step": 618289, "epoch": 7449} {"train_loss": -28.468652725219727, "global_step": 618290, "epoch": 7449} {"train_loss": -28.100919723510742, "global_step": 618291, "epoch": 7449} {"train_loss": -28.047107696533203, "global_step": 618292, "epoch": 7449} {"train_loss": -27.855030059814453, "global_step": 618293, "epoch": 7449} {"train_loss": -28.220544815063477, "global_step": 618294, "epoch": 7449} {"train_loss": -28.442432403564453, "global_step": 618295, "epoch": 7449} {"train_loss": -28.393661499023438, "global_step": 618296, "epoch": 7449} {"train_loss": -28.010501861572266, "global_step": 618297, "epoch": 7449} {"train_loss": -28.28700065612793, "global_step": 618298, "epoch": 7449} {"train_loss": -28.29656982421875, "global_step": 618299, "epoch": 7449} {"train_loss": -28.52913475036621, "global_step": 618300, "epoch": 7449} {"train_loss": -28.438398361206055, "global_step": 618301, "epoch": 7449} {"train_loss": -28.236459732055664, "global_step": 618302, "epoch": 7449} {"train_loss": -28.15457534790039, "global_step": 618303, "epoch": 7449} {"train_loss": -28.348377227783203, "global_step": 618304, "epoch": 7449} {"train_loss": -27.835546493530273, "global_step": 618305, "epoch": 7449} {"train_loss": -28.017484664916992, "global_step": 618306, "epoch": 7449} {"train_loss": -27.3288516998291, "global_step": 618307, "epoch": 7449} {"train_loss": -28.254301071166992, "global_step": 618308, "epoch": 7449} {"train_loss": -28.359832763671875, "global_step": 618309, "epoch": 7449} {"train_loss": -28.278690338134766, "global_step": 618310, "epoch": 7449} {"train_loss": -27.92227554321289, "global_step": 618311, "epoch": 7449} {"train_loss": -28.108524322509766, "global_step": 618312, "epoch": 7449} {"train_loss": -28.429670333862305, "global_step": 618313, "epoch": 7449} {"train_loss": -27.918991088867188, "global_step": 618314, "epoch": 7449} {"train_loss": -28.16033935546875, "global_step": 618315, "epoch": 7449} {"train_loss": -28.077777862548828, "global_step": 618316, "epoch": 7449} {"train_loss": -28.343420028686523, "global_step": 618317, "epoch": 7449} {"train_loss": -27.95887565612793, "global_step": 618318, "epoch": 7449} {"train_loss": -28.252197265625, "global_step": 618319, "epoch": 7449} {"train_loss": -28.2302188873291, "global_step": 618320, "epoch": 7449} {"train_loss": -28.094482421875, "global_step": 618321, "epoch": 7449} {"train_loss": -28.21169090270996, "global_step": 618322, "epoch": 7449} {"train_loss": -28.154010772705078, "global_step": 618323, "epoch": 7449} {"train_loss": -27.8732967376709, "global_step": 618324, "epoch": 7449} {"train_loss": -28.279531478881836, "global_step": 618325, "epoch": 7449} {"train_loss": -28.303159713745117, "global_step": 618326, "epoch": 7449} {"train_loss": -28.258718490600586, "global_step": 618327, "epoch": 7449} {"train_loss": -28.105863571166992, "global_step": 618328, "epoch": 7449} {"train_loss": -28.157794952392578, "global_step": 618329, "epoch": 7449} {"train_loss": -28.54133415222168, "global_step": 618330, "epoch": 7449} {"train_loss": -28.43646240234375, "global_step": 618331, "epoch": 7449} {"train_loss": -27.99732780456543, "global_step": 618332, "epoch": 7449} {"train_loss": -27.840482711791992, "global_step": 618333, "epoch": 7449} {"train_loss": -28.405261993408203, "global_step": 618334, "epoch": 7449} {"train_loss": -28.355558395385742, "global_step": 618335, "epoch": 7449} {"train_loss": -28.212244033813477, "global_step": 618336, "epoch": 7449} {"train_loss": -28.39143943786621, "global_step": 618337, "epoch": 7449} {"train_loss": -28.3845272064209, "global_step": 618338, "epoch": 7449} {"train_loss": -28.202667236328125, "global_step": 618339, "epoch": 7449} {"train_loss": -28.086816787719727, "global_step": 618340, "epoch": 7449} {"train_loss": -27.713470458984375, "global_step": 618341, "epoch": 7449} {"train_loss": -27.799802780151367, "global_step": 618342, "epoch": 7449} {"train_loss": -28.156057357788086, "global_step": 618343, "epoch": 7449} {"train_loss": -28.10096549987793, "global_step": 618344, "epoch": 7449} {"train_loss": -28.05576515197754, "global_step": 618345, "epoch": 7449} {"train_loss": -27.8770694732666, "global_step": 618346, "epoch": 7449} {"train_loss": -28.2587947845459, "global_step": 618347, "epoch": 7449} {"train_loss": -27.92054557800293, "global_step": 618348, "epoch": 7449} {"train_loss": -28.11955102667751, "global_step": 618349, "epoch": 7449, "val_loss": 6779521.0} {"train_loss": -25.62735939025879, "global_step": 618350, "epoch": 7450} {"train_loss": -25.09342384338379, "global_step": 618351, "epoch": 7450} {"train_loss": -27.38776206970215, "global_step": 618352, "epoch": 7450} {"train_loss": -26.562116622924805, "global_step": 618353, "epoch": 7450} {"train_loss": -25.754348754882812, "global_step": 618354, "epoch": 7450} {"train_loss": -27.41697120666504, "global_step": 618355, "epoch": 7450} {"train_loss": -26.464630126953125, "global_step": 618356, "epoch": 7450} {"train_loss": -26.62312889099121, "global_step": 618357, "epoch": 7450} {"train_loss": -26.705163955688477, "global_step": 618358, "epoch": 7450} {"train_loss": -26.97759437561035, "global_step": 618359, "epoch": 7450} {"train_loss": -27.029666900634766, "global_step": 618360, "epoch": 7450} {"train_loss": -27.191028594970703, "global_step": 618361, "epoch": 7450} {"train_loss": -27.203521728515625, "global_step": 618362, "epoch": 7450} {"train_loss": -27.28510093688965, "global_step": 618363, "epoch": 7450} {"train_loss": -27.253034591674805, "global_step": 618364, "epoch": 7450} {"train_loss": -27.584028244018555, "global_step": 618365, "epoch": 7450} {"train_loss": -27.489267349243164, "global_step": 618366, "epoch": 7450} {"train_loss": -27.050745010375977, "global_step": 618367, "epoch": 7450} {"train_loss": -27.608945846557617, "global_step": 618368, "epoch": 7450} {"train_loss": -27.263141632080078, "global_step": 618369, "epoch": 7450} {"train_loss": -27.657196044921875, "global_step": 618370, "epoch": 7450} {"train_loss": -27.63514518737793, "global_step": 618371, "epoch": 7450} {"train_loss": -27.471715927124023, "global_step": 618372, "epoch": 7450} {"train_loss": -27.638341903686523, "global_step": 618373, "epoch": 7450} {"train_loss": -27.90272331237793, "global_step": 618374, "epoch": 7450} {"train_loss": -27.89451026916504, "global_step": 618375, "epoch": 7450} {"train_loss": -28.253393173217773, "global_step": 618376, "epoch": 7450} {"train_loss": -27.533227920532227, "global_step": 618377, "epoch": 7450} {"train_loss": -27.763879776000977, "global_step": 618378, "epoch": 7450} {"train_loss": -27.948347091674805, "global_step": 618379, "epoch": 7450} {"train_loss": -27.975271224975586, "global_step": 618380, "epoch": 7450} {"train_loss": -27.740888595581055, "global_step": 618381, "epoch": 7450} {"train_loss": -27.72829246520996, "global_step": 618382, "epoch": 7450} {"train_loss": -27.905914306640625, "global_step": 618383, "epoch": 7450} {"train_loss": -28.270435333251953, "global_step": 618384, "epoch": 7450} {"train_loss": -28.177383422851562, "global_step": 618385, "epoch": 7450} {"train_loss": -27.99128532409668, "global_step": 618386, "epoch": 7450} {"train_loss": -28.006689071655273, "global_step": 618387, "epoch": 7450} {"train_loss": -28.184051513671875, "global_step": 618388, "epoch": 7450} {"train_loss": -28.224567413330078, "global_step": 618389, "epoch": 7450} {"train_loss": -28.02996253967285, "global_step": 618390, "epoch": 7450} {"train_loss": -28.343154907226562, "global_step": 618391, "epoch": 7450} {"train_loss": -28.22322654724121, "global_step": 618392, "epoch": 7450} {"train_loss": -28.458627700805664, "global_step": 618393, "epoch": 7450} {"train_loss": -28.1943302154541, "global_step": 618394, "epoch": 7450} {"train_loss": -28.636682510375977, "global_step": 618395, "epoch": 7450} {"train_loss": -28.355825424194336, "global_step": 618396, "epoch": 7450} {"train_loss": -28.485050201416016, "global_step": 618397, "epoch": 7450} {"train_loss": -28.327106475830078, "global_step": 618398, "epoch": 7450} {"train_loss": -28.101606369018555, "global_step": 618399, "epoch": 7450} {"train_loss": -28.402027130126953, "global_step": 618400, "epoch": 7450} {"train_loss": -27.984130859375, "global_step": 618401, "epoch": 7450} {"train_loss": -28.144535064697266, "global_step": 618402, "epoch": 7450} {"train_loss": -28.242202758789062, "global_step": 618403, "epoch": 7450} {"train_loss": -28.35978126525879, "global_step": 618404, "epoch": 7450} {"train_loss": -27.980131149291992, "global_step": 618405, "epoch": 7450} {"train_loss": -28.255945205688477, "global_step": 618406, "epoch": 7450} {"train_loss": -28.1821346282959, "global_step": 618407, "epoch": 7450} {"train_loss": -28.362211227416992, "global_step": 618408, "epoch": 7450} {"train_loss": -27.8389892578125, "global_step": 618409, "epoch": 7450} {"train_loss": -28.232406616210938, "global_step": 618410, "epoch": 7450} {"train_loss": -27.71949577331543, "global_step": 618411, "epoch": 7450} {"train_loss": -28.007648468017578, "global_step": 618412, "epoch": 7450} {"train_loss": -27.993350982666016, "global_step": 618413, "epoch": 7450} {"train_loss": -28.362268447875977, "global_step": 618414, "epoch": 7450} {"train_loss": -28.514440536499023, "global_step": 618415, "epoch": 7450} {"train_loss": -27.887048721313477, "global_step": 618416, "epoch": 7450} {"train_loss": -28.411178588867188, "global_step": 618417, "epoch": 7450} {"train_loss": -28.09395408630371, "global_step": 618418, "epoch": 7450} {"train_loss": -28.284637451171875, "global_step": 618419, "epoch": 7450} {"train_loss": -28.394018173217773, "global_step": 618420, "epoch": 7450} {"train_loss": -28.11993980407715, "global_step": 618421, "epoch": 7450} {"train_loss": -28.258710861206055, "global_step": 618422, "epoch": 7450} {"train_loss": -28.058685302734375, "global_step": 618423, "epoch": 7450} {"train_loss": -27.91777992248535, "global_step": 618424, "epoch": 7450} {"train_loss": -28.051427841186523, "global_step": 618425, "epoch": 7450} {"train_loss": -28.082504272460938, "global_step": 618426, "epoch": 7450} {"train_loss": -28.151208877563477, "global_step": 618427, "epoch": 7450} {"train_loss": -28.309839248657227, "global_step": 618428, "epoch": 7450} {"train_loss": -28.5882625579834, "global_step": 618429, "epoch": 7450} {"train_loss": -28.24348258972168, "global_step": 618430, "epoch": 7450} {"train_loss": -27.978397369384766, "global_step": 618431, "epoch": 7450} {"train_loss": -27.829513549804688, "global_step": 618432, "epoch": 7450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 6808167.0} {"train_loss": -27.549428939819336, "global_step": 618433, "epoch": 7451} {"train_loss": -27.15888786315918, "global_step": 618434, "epoch": 7451} {"train_loss": -26.9493350982666, "global_step": 618435, "epoch": 7451} {"train_loss": -26.933948516845703, "global_step": 618436, "epoch": 7451} {"train_loss": -26.204145431518555, "global_step": 618437, "epoch": 7451} {"train_loss": -27.539291381835938, "global_step": 618438, "epoch": 7451} {"train_loss": -27.22028160095215, "global_step": 618439, "epoch": 7451} {"train_loss": -27.604711532592773, "global_step": 618440, "epoch": 7451} {"train_loss": -27.55215835571289, "global_step": 618441, "epoch": 7451} {"train_loss": -27.51848793029785, "global_step": 618442, "epoch": 7451} {"train_loss": -27.781213760375977, "global_step": 618443, "epoch": 7451} {"train_loss": -27.899404525756836, "global_step": 618444, "epoch": 7451} {"train_loss": -27.631153106689453, "global_step": 618445, "epoch": 7451} {"train_loss": -28.003326416015625, "global_step": 618446, "epoch": 7451} {"train_loss": -27.59527587890625, "global_step": 618447, "epoch": 7451} {"train_loss": -27.660009384155273, "global_step": 618448, "epoch": 7451} {"train_loss": -27.781452178955078, "global_step": 618449, "epoch": 7451} {"train_loss": -27.678686141967773, "global_step": 618450, "epoch": 7451} {"train_loss": -27.68212890625, "global_step": 618451, "epoch": 7451} {"train_loss": -27.653898239135742, "global_step": 618452, "epoch": 7451} {"train_loss": -27.99371337890625, "global_step": 618453, "epoch": 7451} {"train_loss": -27.9661808013916, "global_step": 618454, "epoch": 7451} {"train_loss": -28.003448486328125, "global_step": 618455, "epoch": 7451} {"train_loss": -27.69426918029785, "global_step": 618456, "epoch": 7451} {"train_loss": -27.714801788330078, "global_step": 618457, "epoch": 7451} {"train_loss": -28.234302520751953, "global_step": 618458, "epoch": 7451} {"train_loss": -28.095203399658203, "global_step": 618459, "epoch": 7451} {"train_loss": -28.114715576171875, "global_step": 618460, "epoch": 7451} {"train_loss": -28.0794734954834, "global_step": 618461, "epoch": 7451} {"train_loss": -28.32288932800293, "global_step": 618462, "epoch": 7451} {"train_loss": -27.98748207092285, "global_step": 618463, "epoch": 7451} {"train_loss": -28.271757125854492, "global_step": 618464, "epoch": 7451} {"train_loss": -28.103788375854492, "global_step": 618465, "epoch": 7451} {"train_loss": -28.420690536499023, "global_step": 618466, "epoch": 7451} {"train_loss": -28.1318359375, "global_step": 618467, "epoch": 7451} {"train_loss": -28.44300651550293, "global_step": 618468, "epoch": 7451} {"train_loss": -28.376590728759766, "global_step": 618469, "epoch": 7451} {"train_loss": -28.30242919921875, "global_step": 618470, "epoch": 7451} {"train_loss": -28.34185218811035, "global_step": 618471, "epoch": 7451} {"train_loss": -28.446035385131836, "global_step": 618472, "epoch": 7451} {"train_loss": -28.47201919555664, "global_step": 618473, "epoch": 7451} {"train_loss": -28.42957878112793, "global_step": 618474, "epoch": 7451} {"train_loss": -28.126184463500977, "global_step": 618475, "epoch": 7451} {"train_loss": -28.11224365234375, "global_step": 618476, "epoch": 7451} {"train_loss": -28.3912410736084, "global_step": 618477, "epoch": 7451} {"train_loss": -28.175994873046875, "global_step": 618478, "epoch": 7451} {"train_loss": -28.057870864868164, "global_step": 618479, "epoch": 7451} {"train_loss": -27.92371940612793, "global_step": 618480, "epoch": 7451} {"train_loss": -28.194442749023438, "global_step": 618481, "epoch": 7451} {"train_loss": -28.33636474609375, "global_step": 618482, "epoch": 7451} {"train_loss": -28.071786880493164, "global_step": 618483, "epoch": 7451} {"train_loss": -27.938323974609375, "global_step": 618484, "epoch": 7451} {"train_loss": -28.340452194213867, "global_step": 618485, "epoch": 7451} {"train_loss": -28.06298828125, "global_step": 618486, "epoch": 7451} {"train_loss": -28.406965255737305, "global_step": 618487, "epoch": 7451} {"train_loss": -28.0565242767334, "global_step": 618488, "epoch": 7451} {"train_loss": -27.834829330444336, "global_step": 618489, "epoch": 7451} {"train_loss": -27.81376075744629, "global_step": 618490, "epoch": 7451} {"train_loss": -28.334640502929688, "global_step": 618491, "epoch": 7451} {"train_loss": -28.140283584594727, "global_step": 618492, "epoch": 7451} {"train_loss": -28.238515853881836, "global_step": 618493, "epoch": 7451} {"train_loss": -28.070556640625, "global_step": 618494, "epoch": 7451} {"train_loss": -28.281707763671875, "global_step": 618495, "epoch": 7451} {"train_loss": -27.806798934936523, "global_step": 618496, "epoch": 7451} {"train_loss": -27.93459129333496, "global_step": 618497, "epoch": 7451} {"train_loss": -28.476972579956055, "global_step": 618498, "epoch": 7451} {"train_loss": -28.13645362854004, "global_step": 618499, "epoch": 7451} {"train_loss": -28.103912353515625, "global_step": 618500, "epoch": 7451} {"train_loss": -28.14404296875, "global_step": 618501, "epoch": 7451} {"train_loss": -28.071271896362305, "global_step": 618502, "epoch": 7451} {"train_loss": -28.07293701171875, "global_step": 618503, "epoch": 7451} {"train_loss": -28.110204696655273, "global_step": 618504, "epoch": 7451} {"train_loss": -28.323352813720703, "global_step": 618505, "epoch": 7451} {"train_loss": -27.767919540405273, "global_step": 618506, "epoch": 7451} {"train_loss": -27.699893951416016, "global_step": 618507, "epoch": 7451} {"train_loss": -28.149816513061523, "global_step": 618508, "epoch": 7451} {"train_loss": -28.401214599609375, "global_step": 618509, "epoch": 7451} {"train_loss": -28.362934112548828, "global_step": 618510, "epoch": 7451} {"train_loss": -27.883838653564453, "global_step": 618511, "epoch": 7451} {"train_loss": -28.12178611755371, "global_step": 618512, "epoch": 7451} {"train_loss": -28.156757354736328, "global_step": 618513, "epoch": 7451} {"train_loss": -28.14703369140625, "global_step": 618514, "epoch": 7451} {"train_loss": -27.983896416353893, "global_step": 618515, "epoch": 7451, "val_loss": 6742836.0} {"train_loss": -27.590368270874023, "global_step": 618516, "epoch": 7452} {"train_loss": -27.173147201538086, "global_step": 618517, "epoch": 7452} {"train_loss": -27.552337646484375, "global_step": 618518, "epoch": 7452} {"train_loss": -27.94318199157715, "global_step": 618519, "epoch": 7452} {"train_loss": -27.73792839050293, "global_step": 618520, "epoch": 7452} {"train_loss": -27.43727684020996, "global_step": 618521, "epoch": 7452} {"train_loss": -27.593027114868164, "global_step": 618522, "epoch": 7452} {"train_loss": -27.487241744995117, "global_step": 618523, "epoch": 7452} {"train_loss": -27.959482192993164, "global_step": 618524, "epoch": 7452} {"train_loss": -27.8105411529541, "global_step": 618525, "epoch": 7452} {"train_loss": -28.014814376831055, "global_step": 618526, "epoch": 7452} {"train_loss": -27.73978042602539, "global_step": 618527, "epoch": 7452} {"train_loss": -27.878904342651367, "global_step": 618528, "epoch": 7452} {"train_loss": -27.94306755065918, "global_step": 618529, "epoch": 7452} {"train_loss": -27.608341217041016, "global_step": 618530, "epoch": 7452} {"train_loss": -27.461111068725586, "global_step": 618531, "epoch": 7452} {"train_loss": -27.91120719909668, "global_step": 618532, "epoch": 7452} {"train_loss": -27.97686767578125, "global_step": 618533, "epoch": 7452} {"train_loss": -27.385068893432617, "global_step": 618534, "epoch": 7452} {"train_loss": -27.83331298828125, "global_step": 618535, "epoch": 7452} {"train_loss": -27.675907135009766, "global_step": 618536, "epoch": 7452} {"train_loss": -27.9653377532959, "global_step": 618537, "epoch": 7452} {"train_loss": -27.69318199157715, "global_step": 618538, "epoch": 7452} {"train_loss": -28.19972801208496, "global_step": 618539, "epoch": 7452} {"train_loss": -27.95011329650879, "global_step": 618540, "epoch": 7452} {"train_loss": -27.846393585205078, "global_step": 618541, "epoch": 7452} {"train_loss": -28.101369857788086, "global_step": 618542, "epoch": 7452} {"train_loss": -28.185256958007812, "global_step": 618543, "epoch": 7452} {"train_loss": -27.85109519958496, "global_step": 618544, "epoch": 7452} {"train_loss": -28.374921798706055, "global_step": 618545, "epoch": 7452} {"train_loss": -28.42494010925293, "global_step": 618546, "epoch": 7452} {"train_loss": -28.342350006103516, "global_step": 618547, "epoch": 7452} {"train_loss": -28.200687408447266, "global_step": 618548, "epoch": 7452} {"train_loss": -27.911935806274414, "global_step": 618549, "epoch": 7452} {"train_loss": -28.25270652770996, "global_step": 618550, "epoch": 7452} {"train_loss": -27.961618423461914, "global_step": 618551, "epoch": 7452} {"train_loss": -28.033782958984375, "global_step": 618552, "epoch": 7452} {"train_loss": -28.128402709960938, "global_step": 618553, "epoch": 7452} {"train_loss": -28.214696884155273, "global_step": 618554, "epoch": 7452} {"train_loss": -28.143285751342773, "global_step": 618555, "epoch": 7452} {"train_loss": -28.192371368408203, "global_step": 618556, "epoch": 7452} {"train_loss": -28.44146156311035, "global_step": 618557, "epoch": 7452} {"train_loss": -28.34852409362793, "global_step": 618558, "epoch": 7452} {"train_loss": -28.37847328186035, "global_step": 618559, "epoch": 7452} {"train_loss": -28.115488052368164, "global_step": 618560, "epoch": 7452} {"train_loss": -28.098316192626953, "global_step": 618561, "epoch": 7452} {"train_loss": -28.416675567626953, "global_step": 618562, "epoch": 7452} {"train_loss": -28.26016616821289, "global_step": 618563, "epoch": 7452} {"train_loss": -28.211811065673828, "global_step": 618564, "epoch": 7452} {"train_loss": -28.00691795349121, "global_step": 618565, "epoch": 7452} {"train_loss": -28.485992431640625, "global_step": 618566, "epoch": 7452} {"train_loss": -27.939619064331055, "global_step": 618567, "epoch": 7452} {"train_loss": -28.18658447265625, "global_step": 618568, "epoch": 7452} {"train_loss": -28.062986373901367, "global_step": 618569, "epoch": 7452} {"train_loss": -27.966394424438477, "global_step": 618570, "epoch": 7452} {"train_loss": -28.237701416015625, "global_step": 618571, "epoch": 7452} {"train_loss": -28.107465744018555, "global_step": 618572, "epoch": 7452} {"train_loss": -28.337438583374023, "global_step": 618573, "epoch": 7452} {"train_loss": -28.134445190429688, "global_step": 618574, "epoch": 7452} {"train_loss": -28.242822647094727, "global_step": 618575, "epoch": 7452} {"train_loss": -27.63046646118164, "global_step": 618576, "epoch": 7452} {"train_loss": -28.214710235595703, "global_step": 618577, "epoch": 7452} {"train_loss": -28.097272872924805, "global_step": 618578, "epoch": 7452} {"train_loss": -27.975645065307617, "global_step": 618579, "epoch": 7452} {"train_loss": -28.4537410736084, "global_step": 618580, "epoch": 7452} {"train_loss": -27.8468074798584, "global_step": 618581, "epoch": 7452} {"train_loss": -28.27484130859375, "global_step": 618582, "epoch": 7452} {"train_loss": -28.239728927612305, "global_step": 618583, "epoch": 7452} {"train_loss": -28.371000289916992, "global_step": 618584, "epoch": 7452} {"train_loss": -28.29536247253418, "global_step": 618585, "epoch": 7452} {"train_loss": -28.465625762939453, "global_step": 618586, "epoch": 7452} {"train_loss": -28.103992462158203, "global_step": 618587, "epoch": 7452} {"train_loss": -27.90156364440918, "global_step": 618588, "epoch": 7452} {"train_loss": -28.142486572265625, "global_step": 618589, "epoch": 7452} {"train_loss": -28.15748405456543, "global_step": 618590, "epoch": 7452} {"train_loss": -28.430845260620117, "global_step": 618591, "epoch": 7452} {"train_loss": -28.517980575561523, "global_step": 618592, "epoch": 7452} {"train_loss": -28.18348503112793, "global_step": 618593, "epoch": 7452} {"train_loss": -28.366113662719727, "global_step": 618594, "epoch": 7452} {"train_loss": -28.153827667236328, "global_step": 618595, "epoch": 7452} {"train_loss": -28.1765079498291, "global_step": 618596, "epoch": 7452} {"train_loss": -28.165409088134766, "global_step": 618597, "epoch": 7452} {"train_loss": -28.064511609364704, "global_step": 618598, "epoch": 7452, "val_loss": 6653581.0} {"train_loss": -27.973876953125, "global_step": 618599, "epoch": 7453} {"train_loss": -27.28678321838379, "global_step": 618600, "epoch": 7453} {"train_loss": -28.05986976623535, "global_step": 618601, "epoch": 7453} {"train_loss": -27.716480255126953, "global_step": 618602, "epoch": 7453} {"train_loss": -27.694272994995117, "global_step": 618603, "epoch": 7453} {"train_loss": -27.79022216796875, "global_step": 618604, "epoch": 7453} {"train_loss": -27.591358184814453, "global_step": 618605, "epoch": 7453} {"train_loss": -28.027387619018555, "global_step": 618606, "epoch": 7453} {"train_loss": -27.952972412109375, "global_step": 618607, "epoch": 7453} {"train_loss": -27.79123306274414, "global_step": 618608, "epoch": 7453} {"train_loss": -27.84600257873535, "global_step": 618609, "epoch": 7453} {"train_loss": -27.92475700378418, "global_step": 618610, "epoch": 7453} {"train_loss": -28.200021743774414, "global_step": 618611, "epoch": 7453} {"train_loss": -28.108108520507812, "global_step": 618612, "epoch": 7453} {"train_loss": -28.168060302734375, "global_step": 618613, "epoch": 7453} {"train_loss": -27.906591415405273, "global_step": 618614, "epoch": 7453} {"train_loss": -27.817646026611328, "global_step": 618615, "epoch": 7453} {"train_loss": -27.942655563354492, "global_step": 618616, "epoch": 7453} {"train_loss": -27.82923698425293, "global_step": 618617, "epoch": 7453} {"train_loss": -27.681640625, "global_step": 618618, "epoch": 7453} {"train_loss": -27.940723419189453, "global_step": 618619, "epoch": 7453} {"train_loss": -28.47121238708496, "global_step": 618620, "epoch": 7453} {"train_loss": -28.316303253173828, "global_step": 618621, "epoch": 7453} {"train_loss": -28.02790641784668, "global_step": 618622, "epoch": 7453} {"train_loss": -28.07990837097168, "global_step": 618623, "epoch": 7453} {"train_loss": -28.341724395751953, "global_step": 618624, "epoch": 7453} {"train_loss": -28.151752471923828, "global_step": 618625, "epoch": 7453} {"train_loss": -28.176855087280273, "global_step": 618626, "epoch": 7453} {"train_loss": -27.819345474243164, "global_step": 618627, "epoch": 7453} {"train_loss": -27.958179473876953, "global_step": 618628, "epoch": 7453} {"train_loss": -28.281457901000977, "global_step": 618629, "epoch": 7453} {"train_loss": -27.866546630859375, "global_step": 618630, "epoch": 7453} {"train_loss": -28.01503562927246, "global_step": 618631, "epoch": 7453} {"train_loss": -28.191680908203125, "global_step": 618632, "epoch": 7453} {"train_loss": -28.177413940429688, "global_step": 618633, "epoch": 7453} {"train_loss": -28.2069091796875, "global_step": 618634, "epoch": 7453} {"train_loss": -28.063690185546875, "global_step": 618635, "epoch": 7453} {"train_loss": -28.133304595947266, "global_step": 618636, "epoch": 7453} {"train_loss": -28.201154708862305, "global_step": 618637, "epoch": 7453} {"train_loss": -28.143218994140625, "global_step": 618638, "epoch": 7453} {"train_loss": -28.049610137939453, "global_step": 618639, "epoch": 7453} {"train_loss": -28.197412490844727, "global_step": 618640, "epoch": 7453} {"train_loss": -28.21327018737793, "global_step": 618641, "epoch": 7453} {"train_loss": -27.983556747436523, "global_step": 618642, "epoch": 7453} {"train_loss": -28.508695602416992, "global_step": 618643, "epoch": 7453} {"train_loss": -28.06511878967285, "global_step": 618644, "epoch": 7453} {"train_loss": -28.468433380126953, "global_step": 618645, "epoch": 7453} {"train_loss": -28.013717651367188, "global_step": 618646, "epoch": 7453} {"train_loss": -28.38641929626465, "global_step": 618647, "epoch": 7453} {"train_loss": -28.559452056884766, "global_step": 618648, "epoch": 7453} {"train_loss": -28.56805419921875, "global_step": 618649, "epoch": 7453} {"train_loss": -28.1768798828125, "global_step": 618650, "epoch": 7453} {"train_loss": -28.18548583984375, "global_step": 618651, "epoch": 7453} {"train_loss": -28.329345703125, "global_step": 618652, "epoch": 7453} {"train_loss": -28.380878448486328, "global_step": 618653, "epoch": 7453} {"train_loss": -28.561817169189453, "global_step": 618654, "epoch": 7453} {"train_loss": -28.18464469909668, "global_step": 618655, "epoch": 7453} {"train_loss": -28.2264461517334, "global_step": 618656, "epoch": 7453} {"train_loss": -28.53558921813965, "global_step": 618657, "epoch": 7453} {"train_loss": -28.469207763671875, "global_step": 618658, "epoch": 7453} {"train_loss": -28.482080459594727, "global_step": 618659, "epoch": 7453} {"train_loss": -28.1933536529541, "global_step": 618660, "epoch": 7453} {"train_loss": -28.178796768188477, "global_step": 618661, "epoch": 7453} {"train_loss": -28.1616268157959, "global_step": 618662, "epoch": 7453} {"train_loss": -27.694372177124023, "global_step": 618663, "epoch": 7453} {"train_loss": -27.836368560791016, "global_step": 618664, "epoch": 7453} {"train_loss": -27.78761100769043, "global_step": 618665, "epoch": 7453} {"train_loss": -27.049768447875977, "global_step": 618666, "epoch": 7453} {"train_loss": -27.140594482421875, "global_step": 618667, "epoch": 7453} {"train_loss": -26.937047958374023, "global_step": 618668, "epoch": 7453} {"train_loss": -27.964136123657227, "global_step": 618669, "epoch": 7453} {"train_loss": -27.780431747436523, "global_step": 618670, "epoch": 7453} {"train_loss": -27.616668701171875, "global_step": 618671, "epoch": 7453} {"train_loss": -27.5169734954834, "global_step": 618672, "epoch": 7453} {"train_loss": -27.9877872467041, "global_step": 618673, "epoch": 7453} {"train_loss": -27.8411922454834, "global_step": 618674, "epoch": 7453} {"train_loss": -27.71576499938965, "global_step": 618675, "epoch": 7453} {"train_loss": -28.143035888671875, "global_step": 618676, "epoch": 7453} {"train_loss": -27.91584587097168, "global_step": 618677, "epoch": 7453} {"train_loss": -28.321928024291992, "global_step": 618678, "epoch": 7453} {"train_loss": -28.426267623901367, "global_step": 618679, "epoch": 7453} {"train_loss": -28.02296257019043, "global_step": 618680, "epoch": 7453} {"train_loss": -28.01802812139672, "global_step": 618681, "epoch": 7453, "val_loss": 6741539.0} {"train_loss": -27.662673950195312, "global_step": 618682, "epoch": 7454} {"train_loss": -27.73968505859375, "global_step": 618683, "epoch": 7454} {"train_loss": -27.603504180908203, "global_step": 618684, "epoch": 7454} {"train_loss": -27.683141708374023, "global_step": 618685, "epoch": 7454} {"train_loss": -27.306074142456055, "global_step": 618686, "epoch": 7454} {"train_loss": -27.779102325439453, "global_step": 618687, "epoch": 7454} {"train_loss": -28.0272216796875, "global_step": 618688, "epoch": 7454} {"train_loss": -27.473379135131836, "global_step": 618689, "epoch": 7454} {"train_loss": -28.14300537109375, "global_step": 618690, "epoch": 7454} {"train_loss": -28.07065773010254, "global_step": 618691, "epoch": 7454} {"train_loss": -28.079776763916016, "global_step": 618692, "epoch": 7454} {"train_loss": -28.097360610961914, "global_step": 618693, "epoch": 7454} {"train_loss": -27.842679977416992, "global_step": 618694, "epoch": 7454} {"train_loss": -28.184900283813477, "global_step": 618695, "epoch": 7454} {"train_loss": -28.188379287719727, "global_step": 618696, "epoch": 7454} {"train_loss": -28.391355514526367, "global_step": 618697, "epoch": 7454} {"train_loss": -28.019561767578125, "global_step": 618698, "epoch": 7454} {"train_loss": -28.161956787109375, "global_step": 618699, "epoch": 7454} {"train_loss": -28.139041900634766, "global_step": 618700, "epoch": 7454} {"train_loss": -27.9140625, "global_step": 618701, "epoch": 7454} {"train_loss": -28.391525268554688, "global_step": 618702, "epoch": 7454} {"train_loss": -28.147022247314453, "global_step": 618703, "epoch": 7454} {"train_loss": -28.183807373046875, "global_step": 618704, "epoch": 7454} {"train_loss": -27.790369033813477, "global_step": 618705, "epoch": 7454} {"train_loss": -28.210840225219727, "global_step": 618706, "epoch": 7454} {"train_loss": -28.07929801940918, "global_step": 618707, "epoch": 7454} {"train_loss": -28.54860496520996, "global_step": 618708, "epoch": 7454} {"train_loss": -28.239913940429688, "global_step": 618709, "epoch": 7454} {"train_loss": -28.323984146118164, "global_step": 618710, "epoch": 7454} {"train_loss": -28.222936630249023, "global_step": 618711, "epoch": 7454} {"train_loss": -28.25577735900879, "global_step": 618712, "epoch": 7454} {"train_loss": -28.244739532470703, "global_step": 618713, "epoch": 7454} {"train_loss": -28.069507598876953, "global_step": 618714, "epoch": 7454} {"train_loss": -27.957448959350586, "global_step": 618715, "epoch": 7454} {"train_loss": -28.43732261657715, "global_step": 618716, "epoch": 7454} {"train_loss": -28.09929847717285, "global_step": 618717, "epoch": 7454} {"train_loss": -28.009601593017578, "global_step": 618718, "epoch": 7454} {"train_loss": -28.57911491394043, "global_step": 618719, "epoch": 7454} {"train_loss": -28.0875301361084, "global_step": 618720, "epoch": 7454} {"train_loss": -27.867385864257812, "global_step": 618721, "epoch": 7454} {"train_loss": -28.29776954650879, "global_step": 618722, "epoch": 7454} {"train_loss": -28.2971248626709, "global_step": 618723, "epoch": 7454} {"train_loss": -27.95600700378418, "global_step": 618724, "epoch": 7454} {"train_loss": -28.27528953552246, "global_step": 618725, "epoch": 7454} {"train_loss": -28.222803115844727, "global_step": 618726, "epoch": 7454} {"train_loss": -28.050567626953125, "global_step": 618727, "epoch": 7454} {"train_loss": -28.30316162109375, "global_step": 618728, "epoch": 7454} {"train_loss": -27.897781372070312, "global_step": 618729, "epoch": 7454} {"train_loss": -27.920263290405273, "global_step": 618730, "epoch": 7454} {"train_loss": -27.829578399658203, "global_step": 618731, "epoch": 7454} {"train_loss": -27.966064453125, "global_step": 618732, "epoch": 7454} {"train_loss": -28.221654891967773, "global_step": 618733, "epoch": 7454} {"train_loss": -28.125839233398438, "global_step": 618734, "epoch": 7454} {"train_loss": -28.408985137939453, "global_step": 618735, "epoch": 7454} {"train_loss": -28.356809616088867, "global_step": 618736, "epoch": 7454} {"train_loss": -27.445459365844727, "global_step": 618737, "epoch": 7454} {"train_loss": -28.082468032836914, "global_step": 618738, "epoch": 7454} {"train_loss": -27.854812622070312, "global_step": 618739, "epoch": 7454} {"train_loss": -27.868579864501953, "global_step": 618740, "epoch": 7454} {"train_loss": -28.169727325439453, "global_step": 618741, "epoch": 7454} {"train_loss": -28.087554931640625, "global_step": 618742, "epoch": 7454} {"train_loss": -27.75147819519043, "global_step": 618743, "epoch": 7454} {"train_loss": -27.824365615844727, "global_step": 618744, "epoch": 7454} {"train_loss": -27.92384147644043, "global_step": 618745, "epoch": 7454} {"train_loss": -27.906660079956055, "global_step": 618746, "epoch": 7454} {"train_loss": -27.334936141967773, "global_step": 618747, "epoch": 7454} {"train_loss": -28.0721435546875, "global_step": 618748, "epoch": 7454} {"train_loss": -27.868072509765625, "global_step": 618749, "epoch": 7454} {"train_loss": -28.100067138671875, "global_step": 618750, "epoch": 7454} {"train_loss": -27.48408317565918, "global_step": 618751, "epoch": 7454} {"train_loss": -27.9901180267334, "global_step": 618752, "epoch": 7454} {"train_loss": -28.099231719970703, "global_step": 618753, "epoch": 7454} {"train_loss": -28.264982223510742, "global_step": 618754, "epoch": 7454} {"train_loss": -28.07477378845215, "global_step": 618755, "epoch": 7454} {"train_loss": -28.40693473815918, "global_step": 618756, "epoch": 7454} {"train_loss": -28.309101104736328, "global_step": 618757, "epoch": 7454} {"train_loss": -28.187891006469727, "global_step": 618758, "epoch": 7454} {"train_loss": -28.48260498046875, "global_step": 618759, "epoch": 7454} {"train_loss": -28.275068283081055, "global_step": 618760, "epoch": 7454} {"train_loss": -28.3134708404541, "global_step": 618761, "epoch": 7454} {"train_loss": -28.634571075439453, "global_step": 618762, "epoch": 7454} {"train_loss": -28.249475479125977, "global_step": 618763, "epoch": 7454} {"train_loss": -28.05827848595309, "global_step": 618764, "epoch": 7454, "val_loss": 6814061.0} {"train_loss": -27.537839889526367, "global_step": 618765, "epoch": 7455} {"train_loss": -27.626150131225586, "global_step": 618766, "epoch": 7455} {"train_loss": -27.58674430847168, "global_step": 618767, "epoch": 7455} {"train_loss": -27.414331436157227, "global_step": 618768, "epoch": 7455} {"train_loss": -27.693883895874023, "global_step": 618769, "epoch": 7455} {"train_loss": -28.2200927734375, "global_step": 618770, "epoch": 7455} {"train_loss": -27.248905181884766, "global_step": 618771, "epoch": 7455} {"train_loss": -27.0245304107666, "global_step": 618772, "epoch": 7455} {"train_loss": -27.67913818359375, "global_step": 618773, "epoch": 7455} {"train_loss": -27.59431266784668, "global_step": 618774, "epoch": 7455} {"train_loss": -27.700977325439453, "global_step": 618775, "epoch": 7455} {"train_loss": -27.385364532470703, "global_step": 618776, "epoch": 7455} {"train_loss": -27.684309005737305, "global_step": 618777, "epoch": 7455} {"train_loss": -28.103351593017578, "global_step": 618778, "epoch": 7455} {"train_loss": -27.708288192749023, "global_step": 618779, "epoch": 7455} {"train_loss": -27.631805419921875, "global_step": 618780, "epoch": 7455} {"train_loss": -27.658252716064453, "global_step": 618781, "epoch": 7455} {"train_loss": -27.584989547729492, "global_step": 618782, "epoch": 7455} {"train_loss": -28.052978515625, "global_step": 618783, "epoch": 7455} {"train_loss": -27.930810928344727, "global_step": 618784, "epoch": 7455} {"train_loss": -27.86358070373535, "global_step": 618785, "epoch": 7455} {"train_loss": -28.006921768188477, "global_step": 618786, "epoch": 7455} {"train_loss": -27.949630737304688, "global_step": 618787, "epoch": 7455} {"train_loss": -27.98432731628418, "global_step": 618788, "epoch": 7455} {"train_loss": -27.986114501953125, "global_step": 618789, "epoch": 7455} {"train_loss": -27.718870162963867, "global_step": 618790, "epoch": 7455} {"train_loss": -28.00739860534668, "global_step": 618791, "epoch": 7455} {"train_loss": -28.205978393554688, "global_step": 618792, "epoch": 7455} {"train_loss": -27.982501983642578, "global_step": 618793, "epoch": 7455} {"train_loss": -28.123010635375977, "global_step": 618794, "epoch": 7455} {"train_loss": -28.28669548034668, "global_step": 618795, "epoch": 7455} {"train_loss": -28.124134063720703, "global_step": 618796, "epoch": 7455} {"train_loss": -28.39918327331543, "global_step": 618797, "epoch": 7455} {"train_loss": -28.258987426757812, "global_step": 618798, "epoch": 7455} {"train_loss": -28.22342300415039, "global_step": 618799, "epoch": 7455} {"train_loss": -27.9967098236084, "global_step": 618800, "epoch": 7455} {"train_loss": -28.25298500061035, "global_step": 618801, "epoch": 7455} {"train_loss": -28.448583602905273, "global_step": 618802, "epoch": 7455} {"train_loss": -28.224212646484375, "global_step": 618803, "epoch": 7455} {"train_loss": -27.983572006225586, "global_step": 618804, "epoch": 7455} {"train_loss": -28.348230361938477, "global_step": 618805, "epoch": 7455} {"train_loss": -28.413061141967773, "global_step": 618806, "epoch": 7455} {"train_loss": -27.998523712158203, "global_step": 618807, "epoch": 7455} {"train_loss": -28.163833618164062, "global_step": 618808, "epoch": 7455} {"train_loss": -28.086593627929688, "global_step": 618809, "epoch": 7455} {"train_loss": -28.615888595581055, "global_step": 618810, "epoch": 7455} {"train_loss": -28.176382064819336, "global_step": 618811, "epoch": 7455} {"train_loss": -27.740148544311523, "global_step": 618812, "epoch": 7455} {"train_loss": -28.184680938720703, "global_step": 618813, "epoch": 7455} {"train_loss": -27.837045669555664, "global_step": 618814, "epoch": 7455} {"train_loss": -27.870691299438477, "global_step": 618815, "epoch": 7455} {"train_loss": -28.198410034179688, "global_step": 618816, "epoch": 7455} {"train_loss": -27.58786392211914, "global_step": 618817, "epoch": 7455} {"train_loss": -28.239850997924805, "global_step": 618818, "epoch": 7455} {"train_loss": -27.7044677734375, "global_step": 618819, "epoch": 7455} {"train_loss": -28.222753524780273, "global_step": 618820, "epoch": 7455} {"train_loss": -28.16082763671875, "global_step": 618821, "epoch": 7455} {"train_loss": -28.330341339111328, "global_step": 618822, "epoch": 7455} {"train_loss": -28.14755630493164, "global_step": 618823, "epoch": 7455} {"train_loss": -28.534469604492188, "global_step": 618824, "epoch": 7455} {"train_loss": -28.189807891845703, "global_step": 618825, "epoch": 7455} {"train_loss": -28.07731056213379, "global_step": 618826, "epoch": 7455} {"train_loss": -28.023441314697266, "global_step": 618827, "epoch": 7455} {"train_loss": -28.07474136352539, "global_step": 618828, "epoch": 7455} {"train_loss": -28.287841796875, "global_step": 618829, "epoch": 7455} {"train_loss": -28.246545791625977, "global_step": 618830, "epoch": 7455} {"train_loss": -28.170166015625, "global_step": 618831, "epoch": 7455} {"train_loss": -28.108062744140625, "global_step": 618832, "epoch": 7455} {"train_loss": -27.8040714263916, "global_step": 618833, "epoch": 7455} {"train_loss": -27.930374145507812, "global_step": 618834, "epoch": 7455} {"train_loss": -28.168241500854492, "global_step": 618835, "epoch": 7455} {"train_loss": -28.1501522064209, "global_step": 618836, "epoch": 7455} {"train_loss": -27.61467933654785, "global_step": 618837, "epoch": 7455} {"train_loss": -28.046628952026367, "global_step": 618838, "epoch": 7455} {"train_loss": -28.06304359436035, "global_step": 618839, "epoch": 7455} {"train_loss": -27.811750411987305, "global_step": 618840, "epoch": 7455} {"train_loss": -27.72556495666504, "global_step": 618841, "epoch": 7455} {"train_loss": -27.8684139251709, "global_step": 618842, "epoch": 7455} {"train_loss": -27.823583602905273, "global_step": 618843, "epoch": 7455} {"train_loss": -27.798419952392578, "global_step": 618844, "epoch": 7455} {"train_loss": -28.185461044311523, "global_step": 618845, "epoch": 7455} {"train_loss": -28.420568466186523, "global_step": 618846, "epoch": 7455} {"train_loss": -27.966985633574335, "global_step": 618847, "epoch": 7455, "val_loss": 6846102.0} {"train_loss": -26.899057388305664, "global_step": 618848, "epoch": 7456} {"train_loss": -26.535932540893555, "global_step": 618849, "epoch": 7456} {"train_loss": -27.509963989257812, "global_step": 618850, "epoch": 7456} {"train_loss": -26.84683609008789, "global_step": 618851, "epoch": 7456} {"train_loss": -26.764982223510742, "global_step": 618852, "epoch": 7456} {"train_loss": -27.40756607055664, "global_step": 618853, "epoch": 7456} {"train_loss": -27.302433013916016, "global_step": 618854, "epoch": 7456} {"train_loss": -27.257360458374023, "global_step": 618855, "epoch": 7456} {"train_loss": -26.78536033630371, "global_step": 618856, "epoch": 7456} {"train_loss": -27.67641258239746, "global_step": 618857, "epoch": 7456} {"train_loss": -27.025135040283203, "global_step": 618858, "epoch": 7456} {"train_loss": -27.808008193969727, "global_step": 618859, "epoch": 7456} {"train_loss": -26.8455810546875, "global_step": 618860, "epoch": 7456} {"train_loss": -27.843551635742188, "global_step": 618861, "epoch": 7456} {"train_loss": -27.246923446655273, "global_step": 618862, "epoch": 7456} {"train_loss": -28.032419204711914, "global_step": 618863, "epoch": 7456} {"train_loss": -27.49323081970215, "global_step": 618864, "epoch": 7456} {"train_loss": -27.551237106323242, "global_step": 618865, "epoch": 7456} {"train_loss": -27.373517990112305, "global_step": 618866, "epoch": 7456} {"train_loss": -27.71673011779785, "global_step": 618867, "epoch": 7456} {"train_loss": -28.181486129760742, "global_step": 618868, "epoch": 7456} {"train_loss": -27.68206214904785, "global_step": 618869, "epoch": 7456} {"train_loss": -27.802677154541016, "global_step": 618870, "epoch": 7456} {"train_loss": -27.740781784057617, "global_step": 618871, "epoch": 7456} {"train_loss": -28.101322174072266, "global_step": 618872, "epoch": 7456} {"train_loss": -27.82496452331543, "global_step": 618873, "epoch": 7456} {"train_loss": -27.942142486572266, "global_step": 618874, "epoch": 7456} {"train_loss": -28.402740478515625, "global_step": 618875, "epoch": 7456} {"train_loss": -27.866016387939453, "global_step": 618876, "epoch": 7456} {"train_loss": -28.11578369140625, "global_step": 618877, "epoch": 7456} {"train_loss": -27.80743408203125, "global_step": 618878, "epoch": 7456} {"train_loss": -28.4847469329834, "global_step": 618879, "epoch": 7456} {"train_loss": -28.20220947265625, "global_step": 618880, "epoch": 7456} {"train_loss": -28.271570205688477, "global_step": 618881, "epoch": 7456} {"train_loss": -28.00091552734375, "global_step": 618882, "epoch": 7456} {"train_loss": -28.31007194519043, "global_step": 618883, "epoch": 7456} {"train_loss": -28.12458610534668, "global_step": 618884, "epoch": 7456} {"train_loss": -28.23578453063965, "global_step": 618885, "epoch": 7456} {"train_loss": -28.038009643554688, "global_step": 618886, "epoch": 7456} {"train_loss": -28.359350204467773, "global_step": 618887, "epoch": 7456} {"train_loss": -28.30755043029785, "global_step": 618888, "epoch": 7456} {"train_loss": -28.340045928955078, "global_step": 618889, "epoch": 7456} {"train_loss": -28.442047119140625, "global_step": 618890, "epoch": 7456} {"train_loss": -28.141983032226562, "global_step": 618891, "epoch": 7456} {"train_loss": -28.268783569335938, "global_step": 618892, "epoch": 7456} {"train_loss": -28.3388729095459, "global_step": 618893, "epoch": 7456} {"train_loss": -28.1050968170166, "global_step": 618894, "epoch": 7456} {"train_loss": -28.53571891784668, "global_step": 618895, "epoch": 7456} {"train_loss": -28.36664390563965, "global_step": 618896, "epoch": 7456} {"train_loss": -28.181440353393555, "global_step": 618897, "epoch": 7456} {"train_loss": -28.368906021118164, "global_step": 618898, "epoch": 7456} {"train_loss": -28.409643173217773, "global_step": 618899, "epoch": 7456} {"train_loss": -28.27195167541504, "global_step": 618900, "epoch": 7456} {"train_loss": -28.013751983642578, "global_step": 618901, "epoch": 7456} {"train_loss": -28.092920303344727, "global_step": 618902, "epoch": 7456} {"train_loss": -28.02515983581543, "global_step": 618903, "epoch": 7456} {"train_loss": -28.248157501220703, "global_step": 618904, "epoch": 7456} {"train_loss": -28.40901756286621, "global_step": 618905, "epoch": 7456} {"train_loss": -28.423553466796875, "global_step": 618906, "epoch": 7456} {"train_loss": -28.262298583984375, "global_step": 618907, "epoch": 7456} {"train_loss": -28.49014663696289, "global_step": 618908, "epoch": 7456} {"train_loss": -28.363250732421875, "global_step": 618909, "epoch": 7456} {"train_loss": -28.445913314819336, "global_step": 618910, "epoch": 7456} {"train_loss": -28.24457359313965, "global_step": 618911, "epoch": 7456} {"train_loss": -28.5985050201416, "global_step": 618912, "epoch": 7456} {"train_loss": -28.4526424407959, "global_step": 618913, "epoch": 7456} {"train_loss": -28.2265682220459, "global_step": 618914, "epoch": 7456} {"train_loss": -28.179309844970703, "global_step": 618915, "epoch": 7456} {"train_loss": -28.211706161499023, "global_step": 618916, "epoch": 7456} {"train_loss": -27.592687606811523, "global_step": 618917, "epoch": 7456} {"train_loss": -27.763507843017578, "global_step": 618918, "epoch": 7456} {"train_loss": -27.47235107421875, "global_step": 618919, "epoch": 7456} {"train_loss": -27.18453025817871, "global_step": 618920, "epoch": 7456} {"train_loss": -27.332021713256836, "global_step": 618921, "epoch": 7456} {"train_loss": -27.627887725830078, "global_step": 618922, "epoch": 7456} {"train_loss": -26.71701431274414, "global_step": 618923, "epoch": 7456} {"train_loss": -27.2583065032959, "global_step": 618924, "epoch": 7456} {"train_loss": -27.954303741455078, "global_step": 618925, "epoch": 7456} {"train_loss": -27.29420280456543, "global_step": 618926, "epoch": 7456} {"train_loss": -27.262922286987305, "global_step": 618927, "epoch": 7456} {"train_loss": -27.391141891479492, "global_step": 618928, "epoch": 7456} {"train_loss": -27.82166862487793, "global_step": 618929, "epoch": 7456} {"train_loss": -27.864123172070606, "global_step": 618930, "epoch": 7456, "val_loss": 6778796.5} {"train_loss": -27.09209632873535, "global_step": 618931, "epoch": 7457} {"train_loss": -27.045923233032227, "global_step": 618932, "epoch": 7457} {"train_loss": -26.699981689453125, "global_step": 618933, "epoch": 7457} {"train_loss": -26.80085563659668, "global_step": 618934, "epoch": 7457} {"train_loss": -26.696094512939453, "global_step": 618935, "epoch": 7457} {"train_loss": -27.28573989868164, "global_step": 618936, "epoch": 7457} {"train_loss": -27.1025447845459, "global_step": 618937, "epoch": 7457} {"train_loss": -26.6498966217041, "global_step": 618938, "epoch": 7457} {"train_loss": -26.968311309814453, "global_step": 618939, "epoch": 7457} {"train_loss": -27.120458602905273, "global_step": 618940, "epoch": 7457} {"train_loss": -27.2238712310791, "global_step": 618941, "epoch": 7457} {"train_loss": -27.13636589050293, "global_step": 618942, "epoch": 7457} {"train_loss": -27.423755645751953, "global_step": 618943, "epoch": 7457} {"train_loss": -27.368473052978516, "global_step": 618944, "epoch": 7457} {"train_loss": -27.17571449279785, "global_step": 618945, "epoch": 7457} {"train_loss": -27.61004066467285, "global_step": 618946, "epoch": 7457} {"train_loss": -27.243000030517578, "global_step": 618947, "epoch": 7457} {"train_loss": -27.215112686157227, "global_step": 618948, "epoch": 7457} {"train_loss": -27.258163452148438, "global_step": 618949, "epoch": 7457} {"train_loss": -27.593847274780273, "global_step": 618950, "epoch": 7457} {"train_loss": -27.50374412536621, "global_step": 618951, "epoch": 7457} {"train_loss": -27.512235641479492, "global_step": 618952, "epoch": 7457} {"train_loss": -27.75211524963379, "global_step": 618953, "epoch": 7457} {"train_loss": -27.63618278503418, "global_step": 618954, "epoch": 7457} {"train_loss": -27.6267147064209, "global_step": 618955, "epoch": 7457} {"train_loss": -27.505126953125, "global_step": 618956, "epoch": 7457} {"train_loss": -27.614669799804688, "global_step": 618957, "epoch": 7457} {"train_loss": -27.798444747924805, "global_step": 618958, "epoch": 7457} {"train_loss": -27.849714279174805, "global_step": 618959, "epoch": 7457} {"train_loss": -27.827733993530273, "global_step": 618960, "epoch": 7457} {"train_loss": -28.011627197265625, "global_step": 618961, "epoch": 7457} {"train_loss": -27.92059326171875, "global_step": 618962, "epoch": 7457} {"train_loss": -28.14167594909668, "global_step": 618963, "epoch": 7457} {"train_loss": -27.976886749267578, "global_step": 618964, "epoch": 7457} {"train_loss": -28.010746002197266, "global_step": 618965, "epoch": 7457} {"train_loss": -27.828781127929688, "global_step": 618966, "epoch": 7457} {"train_loss": -27.939783096313477, "global_step": 618967, "epoch": 7457} {"train_loss": -27.798994064331055, "global_step": 618968, "epoch": 7457} {"train_loss": -27.846221923828125, "global_step": 618969, "epoch": 7457} {"train_loss": -27.63739585876465, "global_step": 618970, "epoch": 7457} {"train_loss": -27.939477920532227, "global_step": 618971, "epoch": 7457} {"train_loss": -28.060592651367188, "global_step": 618972, "epoch": 7457} {"train_loss": -28.446393966674805, "global_step": 618973, "epoch": 7457} {"train_loss": -27.867971420288086, "global_step": 618974, "epoch": 7457} {"train_loss": -28.2087345123291, "global_step": 618975, "epoch": 7457} {"train_loss": -28.60447120666504, "global_step": 618976, "epoch": 7457} {"train_loss": -28.4001407623291, "global_step": 618977, "epoch": 7457} {"train_loss": -28.0051326751709, "global_step": 618978, "epoch": 7457} {"train_loss": -28.38477897644043, "global_step": 618979, "epoch": 7457} {"train_loss": -28.14222526550293, "global_step": 618980, "epoch": 7457} {"train_loss": -28.095245361328125, "global_step": 618981, "epoch": 7457} {"train_loss": -28.2414608001709, "global_step": 618982, "epoch": 7457} {"train_loss": -28.26496696472168, "global_step": 618983, "epoch": 7457} {"train_loss": -28.26291847229004, "global_step": 618984, "epoch": 7457} {"train_loss": -28.229394912719727, "global_step": 618985, "epoch": 7457} {"train_loss": -28.356475830078125, "global_step": 618986, "epoch": 7457} {"train_loss": -28.155561447143555, "global_step": 618987, "epoch": 7457} {"train_loss": -28.24761962890625, "global_step": 618988, "epoch": 7457} {"train_loss": -28.2640380859375, "global_step": 618989, "epoch": 7457} {"train_loss": -28.541492462158203, "global_step": 618990, "epoch": 7457} {"train_loss": -28.100351333618164, "global_step": 618991, "epoch": 7457} {"train_loss": -27.87166404724121, "global_step": 618992, "epoch": 7457} {"train_loss": -28.033422470092773, "global_step": 618993, "epoch": 7457} {"train_loss": -28.173368453979492, "global_step": 618994, "epoch": 7457} {"train_loss": -28.34156608581543, "global_step": 618995, "epoch": 7457} {"train_loss": -27.866186141967773, "global_step": 618996, "epoch": 7457} {"train_loss": -28.256704330444336, "global_step": 618997, "epoch": 7457} {"train_loss": -28.38925552368164, "global_step": 618998, "epoch": 7457} {"train_loss": -27.76373291015625, "global_step": 618999, "epoch": 7457} {"train_loss": -27.922590255737305, "global_step": 619000, "epoch": 7457} {"train_loss": -27.160430908203125, "global_step": 619001, "epoch": 7457} {"train_loss": -27.726715087890625, "global_step": 619002, "epoch": 7457} {"train_loss": -27.898778915405273, "global_step": 619003, "epoch": 7457} {"train_loss": -27.91547203063965, "global_step": 619004, "epoch": 7457} {"train_loss": -28.476621627807617, "global_step": 619005, "epoch": 7457} {"train_loss": -28.231342315673828, "global_step": 619006, "epoch": 7457} {"train_loss": -28.029035568237305, "global_step": 619007, "epoch": 7457} {"train_loss": -28.178119659423828, "global_step": 619008, "epoch": 7457} {"train_loss": -27.92696189880371, "global_step": 619009, "epoch": 7457} {"train_loss": -27.87771987915039, "global_step": 619010, "epoch": 7457} {"train_loss": -27.6734561920166, "global_step": 619011, "epoch": 7457} {"train_loss": -28.45534324645996, "global_step": 619012, "epoch": 7457} {"train_loss": -27.81131160690124, "global_step": 619013, "epoch": 7457, "val_loss": 6708276.0} {"train_loss": -27.5981388092041, "global_step": 619014, "epoch": 7458} {"train_loss": -27.837018966674805, "global_step": 619015, "epoch": 7458} {"train_loss": -27.85943031311035, "global_step": 619016, "epoch": 7458} {"train_loss": -27.955341339111328, "global_step": 619017, "epoch": 7458} {"train_loss": -27.773263931274414, "global_step": 619018, "epoch": 7458} {"train_loss": -27.852951049804688, "global_step": 619019, "epoch": 7458} {"train_loss": -28.163114547729492, "global_step": 619020, "epoch": 7458} {"train_loss": -28.0904598236084, "global_step": 619021, "epoch": 7458} {"train_loss": -27.810455322265625, "global_step": 619022, "epoch": 7458} {"train_loss": -27.777908325195312, "global_step": 619023, "epoch": 7458} {"train_loss": -27.911279678344727, "global_step": 619024, "epoch": 7458} {"train_loss": -27.547164916992188, "global_step": 619025, "epoch": 7458} {"train_loss": -28.06178092956543, "global_step": 619026, "epoch": 7458} {"train_loss": -28.043731689453125, "global_step": 619027, "epoch": 7458} {"train_loss": -27.87477684020996, "global_step": 619028, "epoch": 7458} {"train_loss": -28.074209213256836, "global_step": 619029, "epoch": 7458} {"train_loss": -28.003707885742188, "global_step": 619030, "epoch": 7458} {"train_loss": -28.098163604736328, "global_step": 619031, "epoch": 7458} {"train_loss": -28.423681259155273, "global_step": 619032, "epoch": 7458} {"train_loss": -27.75409507751465, "global_step": 619033, "epoch": 7458} {"train_loss": -28.14912223815918, "global_step": 619034, "epoch": 7458} {"train_loss": -28.125646591186523, "global_step": 619035, "epoch": 7458} {"train_loss": -27.923938751220703, "global_step": 619036, "epoch": 7458} {"train_loss": -27.677499771118164, "global_step": 619037, "epoch": 7458} {"train_loss": -27.759042739868164, "global_step": 619038, "epoch": 7458} {"train_loss": -28.22759437561035, "global_step": 619039, "epoch": 7458} {"train_loss": -28.05621910095215, "global_step": 619040, "epoch": 7458} {"train_loss": -27.632343292236328, "global_step": 619041, "epoch": 7458} {"train_loss": -28.33289909362793, "global_step": 619042, "epoch": 7458} {"train_loss": -28.067920684814453, "global_step": 619043, "epoch": 7458} {"train_loss": -28.30988883972168, "global_step": 619044, "epoch": 7458} {"train_loss": -28.03511619567871, "global_step": 619045, "epoch": 7458} {"train_loss": -28.087583541870117, "global_step": 619046, "epoch": 7458} {"train_loss": -28.02213478088379, "global_step": 619047, "epoch": 7458} {"train_loss": -27.9739933013916, "global_step": 619048, "epoch": 7458} {"train_loss": -27.730215072631836, "global_step": 619049, "epoch": 7458} {"train_loss": -27.9932861328125, "global_step": 619050, "epoch": 7458} {"train_loss": -27.89898109436035, "global_step": 619051, "epoch": 7458} {"train_loss": -27.8833065032959, "global_step": 619052, "epoch": 7458} {"train_loss": -28.09857749938965, "global_step": 619053, "epoch": 7458} {"train_loss": -28.593252182006836, "global_step": 619054, "epoch": 7458} {"train_loss": -27.932132720947266, "global_step": 619055, "epoch": 7458} {"train_loss": -28.148969650268555, "global_step": 619056, "epoch": 7458} {"train_loss": -28.25467300415039, "global_step": 619057, "epoch": 7458} {"train_loss": -28.457563400268555, "global_step": 619058, "epoch": 7458} {"train_loss": -28.001386642456055, "global_step": 619059, "epoch": 7458} {"train_loss": -28.142332077026367, "global_step": 619060, "epoch": 7458} {"train_loss": -27.957117080688477, "global_step": 619061, "epoch": 7458} {"train_loss": -27.702463150024414, "global_step": 619062, "epoch": 7458} {"train_loss": -28.2554988861084, "global_step": 619063, "epoch": 7458} {"train_loss": -27.986555099487305, "global_step": 619064, "epoch": 7458} {"train_loss": -28.6203556060791, "global_step": 619065, "epoch": 7458} {"train_loss": -28.0045108795166, "global_step": 619066, "epoch": 7458} {"train_loss": -27.954248428344727, "global_step": 619067, "epoch": 7458} {"train_loss": -28.102079391479492, "global_step": 619068, "epoch": 7458} {"train_loss": -28.240615844726562, "global_step": 619069, "epoch": 7458} {"train_loss": -27.9522762298584, "global_step": 619070, "epoch": 7458} {"train_loss": -28.167591094970703, "global_step": 619071, "epoch": 7458} {"train_loss": -28.178266525268555, "global_step": 619072, "epoch": 7458} {"train_loss": -27.939605712890625, "global_step": 619073, "epoch": 7458} {"train_loss": -28.2360782623291, "global_step": 619074, "epoch": 7458} {"train_loss": -28.19317626953125, "global_step": 619075, "epoch": 7458} {"train_loss": -28.325998306274414, "global_step": 619076, "epoch": 7458} {"train_loss": -28.114660263061523, "global_step": 619077, "epoch": 7458} {"train_loss": -28.27206802368164, "global_step": 619078, "epoch": 7458} {"train_loss": -28.31692886352539, "global_step": 619079, "epoch": 7458} {"train_loss": -28.438995361328125, "global_step": 619080, "epoch": 7458} {"train_loss": -27.937238693237305, "global_step": 619081, "epoch": 7458} {"train_loss": -28.294042587280273, "global_step": 619082, "epoch": 7458} {"train_loss": -28.130712509155273, "global_step": 619083, "epoch": 7458} {"train_loss": -28.272022247314453, "global_step": 619084, "epoch": 7458} {"train_loss": -28.221601486206055, "global_step": 619085, "epoch": 7458} {"train_loss": -27.884546279907227, "global_step": 619086, "epoch": 7458} {"train_loss": -28.4102725982666, "global_step": 619087, "epoch": 7458} {"train_loss": -28.088850021362305, "global_step": 619088, "epoch": 7458} {"train_loss": -28.207965850830078, "global_step": 619089, "epoch": 7458} {"train_loss": -28.409162521362305, "global_step": 619090, "epoch": 7458} {"train_loss": -28.267990112304688, "global_step": 619091, "epoch": 7458} {"train_loss": -28.1216983795166, "global_step": 619092, "epoch": 7458} {"train_loss": -28.03829002380371, "global_step": 619093, "epoch": 7458} {"train_loss": -28.319595336914062, "global_step": 619094, "epoch": 7458} {"train_loss": -28.280302047729492, "global_step": 619095, "epoch": 7458} {"train_loss": -28.06667923065553, "global_step": 619096, "epoch": 7458, "val_loss": 6713247.0} {"train_loss": -27.342487335205078, "global_step": 619097, "epoch": 7459} {"train_loss": -27.886316299438477, "global_step": 619098, "epoch": 7459} {"train_loss": -27.455322265625, "global_step": 619099, "epoch": 7459} {"train_loss": -27.574838638305664, "global_step": 619100, "epoch": 7459} {"train_loss": -27.2127685546875, "global_step": 619101, "epoch": 7459} {"train_loss": -27.271215438842773, "global_step": 619102, "epoch": 7459} {"train_loss": -27.9378662109375, "global_step": 619103, "epoch": 7459} {"train_loss": -27.855260848999023, "global_step": 619104, "epoch": 7459} {"train_loss": -27.335500717163086, "global_step": 619105, "epoch": 7459} {"train_loss": -27.931509017944336, "global_step": 619106, "epoch": 7459} {"train_loss": -27.575414657592773, "global_step": 619107, "epoch": 7459} {"train_loss": -27.58571434020996, "global_step": 619108, "epoch": 7459} {"train_loss": -27.500869750976562, "global_step": 619109, "epoch": 7459} {"train_loss": -27.796213150024414, "global_step": 619110, "epoch": 7459} {"train_loss": -27.827747344970703, "global_step": 619111, "epoch": 7459} {"train_loss": -27.439258575439453, "global_step": 619112, "epoch": 7459} {"train_loss": -27.565149307250977, "global_step": 619113, "epoch": 7459} {"train_loss": -28.082324981689453, "global_step": 619114, "epoch": 7459} {"train_loss": -28.010486602783203, "global_step": 619115, "epoch": 7459} {"train_loss": -27.804452896118164, "global_step": 619116, "epoch": 7459} {"train_loss": -27.463275909423828, "global_step": 619117, "epoch": 7459} {"train_loss": -27.696462631225586, "global_step": 619118, "epoch": 7459} {"train_loss": -28.405263900756836, "global_step": 619119, "epoch": 7459} {"train_loss": -27.957061767578125, "global_step": 619120, "epoch": 7459} {"train_loss": -28.01185417175293, "global_step": 619121, "epoch": 7459} {"train_loss": -28.38484001159668, "global_step": 619122, "epoch": 7459} {"train_loss": -28.2416934967041, "global_step": 619123, "epoch": 7459} {"train_loss": -28.08161735534668, "global_step": 619124, "epoch": 7459} {"train_loss": -28.18540382385254, "global_step": 619125, "epoch": 7459} {"train_loss": -27.94370460510254, "global_step": 619126, "epoch": 7459} {"train_loss": -28.072376251220703, "global_step": 619127, "epoch": 7459} {"train_loss": -28.071826934814453, "global_step": 619128, "epoch": 7459} {"train_loss": -28.19925308227539, "global_step": 619129, "epoch": 7459} {"train_loss": -28.053466796875, "global_step": 619130, "epoch": 7459} {"train_loss": -28.154870986938477, "global_step": 619131, "epoch": 7459} {"train_loss": -28.57329750061035, "global_step": 619132, "epoch": 7459} {"train_loss": -28.716794967651367, "global_step": 619133, "epoch": 7459} {"train_loss": -28.2247257232666, "global_step": 619134, "epoch": 7459} {"train_loss": -27.97955894470215, "global_step": 619135, "epoch": 7459} {"train_loss": -28.419397354125977, "global_step": 619136, "epoch": 7459} {"train_loss": -28.18355369567871, "global_step": 619137, "epoch": 7459} {"train_loss": -28.26991844177246, "global_step": 619138, "epoch": 7459} {"train_loss": -28.6151065826416, "global_step": 619139, "epoch": 7459} {"train_loss": -28.29526138305664, "global_step": 619140, "epoch": 7459} {"train_loss": -28.518640518188477, "global_step": 619141, "epoch": 7459} {"train_loss": -28.16792869567871, "global_step": 619142, "epoch": 7459} {"train_loss": -27.331769943237305, "global_step": 619143, "epoch": 7459} {"train_loss": -27.312347412109375, "global_step": 619144, "epoch": 7459} {"train_loss": -27.681995391845703, "global_step": 619145, "epoch": 7459} {"train_loss": -27.646650314331055, "global_step": 619146, "epoch": 7459} {"train_loss": -27.876447677612305, "global_step": 619147, "epoch": 7459} {"train_loss": -27.946765899658203, "global_step": 619148, "epoch": 7459} {"train_loss": -27.882795333862305, "global_step": 619149, "epoch": 7459} {"train_loss": -27.808349609375, "global_step": 619150, "epoch": 7459} {"train_loss": -27.804712295532227, "global_step": 619151, "epoch": 7459} {"train_loss": -27.645639419555664, "global_step": 619152, "epoch": 7459} {"train_loss": -27.79562759399414, "global_step": 619153, "epoch": 7459} {"train_loss": -27.432373046875, "global_step": 619154, "epoch": 7459} {"train_loss": -28.081634521484375, "global_step": 619155, "epoch": 7459} {"train_loss": -27.598825454711914, "global_step": 619156, "epoch": 7459} {"train_loss": -27.5391845703125, "global_step": 619157, "epoch": 7459} {"train_loss": -28.030349731445312, "global_step": 619158, "epoch": 7459} {"train_loss": -27.576047897338867, "global_step": 619159, "epoch": 7459} {"train_loss": -27.99177360534668, "global_step": 619160, "epoch": 7459} {"train_loss": -27.899677276611328, "global_step": 619161, "epoch": 7459} {"train_loss": -27.75050926208496, "global_step": 619162, "epoch": 7459} {"train_loss": -27.80866050720215, "global_step": 619163, "epoch": 7459} {"train_loss": -28.217004776000977, "global_step": 619164, "epoch": 7459} {"train_loss": -28.058378219604492, "global_step": 619165, "epoch": 7459} {"train_loss": -28.3710880279541, "global_step": 619166, "epoch": 7459} {"train_loss": -27.9793701171875, "global_step": 619167, "epoch": 7459} {"train_loss": -27.6809024810791, "global_step": 619168, "epoch": 7459} {"train_loss": -28.329626083374023, "global_step": 619169, "epoch": 7459} {"train_loss": -27.835702896118164, "global_step": 619170, "epoch": 7459} {"train_loss": -27.731555938720703, "global_step": 619171, "epoch": 7459} {"train_loss": -27.938770294189453, "global_step": 619172, "epoch": 7459} {"train_loss": -28.236398696899414, "global_step": 619173, "epoch": 7459} {"train_loss": -28.255834579467773, "global_step": 619174, "epoch": 7459} {"train_loss": -27.986846923828125, "global_step": 619175, "epoch": 7459} {"train_loss": -28.303726196289062, "global_step": 619176, "epoch": 7459} {"train_loss": -28.09943962097168, "global_step": 619177, "epoch": 7459} {"train_loss": -28.117156982421875, "global_step": 619178, "epoch": 7459} {"train_loss": -27.9188622164439, "global_step": 619179, "epoch": 7459, "val_loss": 6766407.0} {"train_loss": -27.17170524597168, "global_step": 619180, "epoch": 7460} {"train_loss": -26.71052360534668, "global_step": 619181, "epoch": 7460} {"train_loss": -27.621679306030273, "global_step": 619182, "epoch": 7460} {"train_loss": -27.55368995666504, "global_step": 619183, "epoch": 7460} {"train_loss": -27.23097801208496, "global_step": 619184, "epoch": 7460} {"train_loss": -27.679189682006836, "global_step": 619185, "epoch": 7460} {"train_loss": -27.499265670776367, "global_step": 619186, "epoch": 7460} {"train_loss": -27.44765281677246, "global_step": 619187, "epoch": 7460} {"train_loss": -27.0297908782959, "global_step": 619188, "epoch": 7460} {"train_loss": -27.668292999267578, "global_step": 619189, "epoch": 7460} {"train_loss": -27.58112144470215, "global_step": 619190, "epoch": 7460} {"train_loss": -27.69636344909668, "global_step": 619191, "epoch": 7460} {"train_loss": -28.03399085998535, "global_step": 619192, "epoch": 7460} {"train_loss": -27.639184951782227, "global_step": 619193, "epoch": 7460} {"train_loss": -27.274938583374023, "global_step": 619194, "epoch": 7460} {"train_loss": -28.11111831665039, "global_step": 619195, "epoch": 7460} {"train_loss": -28.108320236206055, "global_step": 619196, "epoch": 7460} {"train_loss": -27.854028701782227, "global_step": 619197, "epoch": 7460} {"train_loss": -28.09442138671875, "global_step": 619198, "epoch": 7460} {"train_loss": -27.184354782104492, "global_step": 619199, "epoch": 7460} {"train_loss": -27.636075973510742, "global_step": 619200, "epoch": 7460} {"train_loss": -27.5994815826416, "global_step": 619201, "epoch": 7460} {"train_loss": -28.157758712768555, "global_step": 619202, "epoch": 7460} {"train_loss": -28.088354110717773, "global_step": 619203, "epoch": 7460} {"train_loss": -28.055994033813477, "global_step": 619204, "epoch": 7460} {"train_loss": -27.77031898498535, "global_step": 619205, "epoch": 7460} {"train_loss": -27.56959342956543, "global_step": 619206, "epoch": 7460} {"train_loss": -28.11246681213379, "global_step": 619207, "epoch": 7460} {"train_loss": -27.92351722717285, "global_step": 619208, "epoch": 7460} {"train_loss": -28.062652587890625, "global_step": 619209, "epoch": 7460} {"train_loss": -27.819732666015625, "global_step": 619210, "epoch": 7460} {"train_loss": -27.71258544921875, "global_step": 619211, "epoch": 7460} {"train_loss": -27.779239654541016, "global_step": 619212, "epoch": 7460} {"train_loss": -27.66594886779785, "global_step": 619213, "epoch": 7460} {"train_loss": -27.930816650390625, "global_step": 619214, "epoch": 7460} {"train_loss": -27.866613388061523, "global_step": 619215, "epoch": 7460} {"train_loss": -28.041738510131836, "global_step": 619216, "epoch": 7460} {"train_loss": -28.6875, "global_step": 619217, "epoch": 7460} {"train_loss": -28.091978073120117, "global_step": 619218, "epoch": 7460} {"train_loss": -28.210620880126953, "global_step": 619219, "epoch": 7460} {"train_loss": -28.152677536010742, "global_step": 619220, "epoch": 7460} {"train_loss": -28.157339096069336, "global_step": 619221, "epoch": 7460} {"train_loss": -28.14816665649414, "global_step": 619222, "epoch": 7460} {"train_loss": -28.231164932250977, "global_step": 619223, "epoch": 7460} {"train_loss": -27.64847183227539, "global_step": 619224, "epoch": 7460} {"train_loss": -28.066503524780273, "global_step": 619225, "epoch": 7460} {"train_loss": -28.384784698486328, "global_step": 619226, "epoch": 7460} {"train_loss": -28.071685791015625, "global_step": 619227, "epoch": 7460} {"train_loss": -28.210102081298828, "global_step": 619228, "epoch": 7460} {"train_loss": -28.138837814331055, "global_step": 619229, "epoch": 7460} {"train_loss": -28.155927658081055, "global_step": 619230, "epoch": 7460} {"train_loss": -28.023900985717773, "global_step": 619231, "epoch": 7460} {"train_loss": -28.034168243408203, "global_step": 619232, "epoch": 7460} {"train_loss": -28.451990127563477, "global_step": 619233, "epoch": 7460} {"train_loss": -27.853057861328125, "global_step": 619234, "epoch": 7460} {"train_loss": -28.502273559570312, "global_step": 619235, "epoch": 7460} {"train_loss": -28.1817626953125, "global_step": 619236, "epoch": 7460} {"train_loss": -28.598224639892578, "global_step": 619237, "epoch": 7460} {"train_loss": -28.030048370361328, "global_step": 619238, "epoch": 7460} {"train_loss": -28.114850997924805, "global_step": 619239, "epoch": 7460} {"train_loss": -28.203210830688477, "global_step": 619240, "epoch": 7460} {"train_loss": -28.362873077392578, "global_step": 619241, "epoch": 7460} {"train_loss": -28.118671417236328, "global_step": 619242, "epoch": 7460} {"train_loss": -28.06165885925293, "global_step": 619243, "epoch": 7460} {"train_loss": -28.398340225219727, "global_step": 619244, "epoch": 7460} {"train_loss": -28.2977352142334, "global_step": 619245, "epoch": 7460} {"train_loss": -28.227249145507812, "global_step": 619246, "epoch": 7460} {"train_loss": -28.593542098999023, "global_step": 619247, "epoch": 7460} {"train_loss": -28.2858943939209, "global_step": 619248, "epoch": 7460} {"train_loss": -28.122406005859375, "global_step": 619249, "epoch": 7460} {"train_loss": -28.12794303894043, "global_step": 619250, "epoch": 7460} {"train_loss": -28.172292709350586, "global_step": 619251, "epoch": 7460} {"train_loss": -28.344945907592773, "global_step": 619252, "epoch": 7460} {"train_loss": -28.559675216674805, "global_step": 619253, "epoch": 7460} {"train_loss": -28.370702743530273, "global_step": 619254, "epoch": 7460} {"train_loss": -28.478734970092773, "global_step": 619255, "epoch": 7460} {"train_loss": -28.402301788330078, "global_step": 619256, "epoch": 7460} {"train_loss": -28.25117301940918, "global_step": 619257, "epoch": 7460} {"train_loss": -28.250783920288086, "global_step": 619258, "epoch": 7460} {"train_loss": -28.217016220092773, "global_step": 619259, "epoch": 7460} {"train_loss": -28.48919677734375, "global_step": 619260, "epoch": 7460} {"train_loss": -28.235681533813477, "global_step": 619261, "epoch": 7460} {"train_loss": -28.004501227872918, "global_step": 619262, "epoch": 7460, "val_loss": 6728325.0} {"train_loss": -26.735092163085938, "global_step": 619263, "epoch": 7461} {"train_loss": -26.04787254333496, "global_step": 619264, "epoch": 7461} {"train_loss": -26.835739135742188, "global_step": 619265, "epoch": 7461} {"train_loss": -26.721805572509766, "global_step": 619266, "epoch": 7461} {"train_loss": -26.325544357299805, "global_step": 619267, "epoch": 7461} {"train_loss": -25.914899826049805, "global_step": 619268, "epoch": 7461} {"train_loss": -27.432636260986328, "global_step": 619269, "epoch": 7461} {"train_loss": -27.526660919189453, "global_step": 619270, "epoch": 7461} {"train_loss": -27.261676788330078, "global_step": 619271, "epoch": 7461} {"train_loss": -27.530353546142578, "global_step": 619272, "epoch": 7461} {"train_loss": -27.32208824157715, "global_step": 619273, "epoch": 7461} {"train_loss": -27.445158004760742, "global_step": 619274, "epoch": 7461} {"train_loss": -27.256704330444336, "global_step": 619275, "epoch": 7461} {"train_loss": -27.489118576049805, "global_step": 619276, "epoch": 7461} {"train_loss": -27.81183433532715, "global_step": 619277, "epoch": 7461} {"train_loss": -27.773468017578125, "global_step": 619278, "epoch": 7461} {"train_loss": -27.709552764892578, "global_step": 619279, "epoch": 7461} {"train_loss": -27.587146759033203, "global_step": 619280, "epoch": 7461} {"train_loss": -27.806381225585938, "global_step": 619281, "epoch": 7461} {"train_loss": -27.911481857299805, "global_step": 619282, "epoch": 7461} {"train_loss": -27.643476486206055, "global_step": 619283, "epoch": 7461} {"train_loss": -28.1055965423584, "global_step": 619284, "epoch": 7461} {"train_loss": -27.79266929626465, "global_step": 619285, "epoch": 7461} {"train_loss": -27.37099266052246, "global_step": 619286, "epoch": 7461} {"train_loss": -28.08338737487793, "global_step": 619287, "epoch": 7461} {"train_loss": -27.739032745361328, "global_step": 619288, "epoch": 7461} {"train_loss": -27.689727783203125, "global_step": 619289, "epoch": 7461} {"train_loss": -28.34079360961914, "global_step": 619290, "epoch": 7461} {"train_loss": -27.6875, "global_step": 619291, "epoch": 7461} {"train_loss": -28.053607940673828, "global_step": 619292, "epoch": 7461} {"train_loss": -27.681396484375, "global_step": 619293, "epoch": 7461} {"train_loss": -27.98726463317871, "global_step": 619294, "epoch": 7461} {"train_loss": -27.9050350189209, "global_step": 619295, "epoch": 7461} {"train_loss": -27.82431411743164, "global_step": 619296, "epoch": 7461} {"train_loss": -28.042789459228516, "global_step": 619297, "epoch": 7461} {"train_loss": -27.66208839416504, "global_step": 619298, "epoch": 7461} {"train_loss": -27.934240341186523, "global_step": 619299, "epoch": 7461} {"train_loss": -27.9325008392334, "global_step": 619300, "epoch": 7461} {"train_loss": -28.088953018188477, "global_step": 619301, "epoch": 7461} {"train_loss": -28.009613037109375, "global_step": 619302, "epoch": 7461} {"train_loss": -28.21565818786621, "global_step": 619303, "epoch": 7461} {"train_loss": -27.786087036132812, "global_step": 619304, "epoch": 7461} {"train_loss": -27.996091842651367, "global_step": 619305, "epoch": 7461} {"train_loss": -28.3015079498291, "global_step": 619306, "epoch": 7461} {"train_loss": -28.05120849609375, "global_step": 619307, "epoch": 7461} {"train_loss": -28.1259822845459, "global_step": 619308, "epoch": 7461} {"train_loss": -28.448705673217773, "global_step": 619309, "epoch": 7461} {"train_loss": -28.026336669921875, "global_step": 619310, "epoch": 7461} {"train_loss": -27.955814361572266, "global_step": 619311, "epoch": 7461} {"train_loss": -28.3056640625, "global_step": 619312, "epoch": 7461} {"train_loss": -28.000751495361328, "global_step": 619313, "epoch": 7461} {"train_loss": -27.922574996948242, "global_step": 619314, "epoch": 7461} {"train_loss": -28.092166900634766, "global_step": 619315, "epoch": 7461} {"train_loss": -28.272504806518555, "global_step": 619316, "epoch": 7461} {"train_loss": -28.168188095092773, "global_step": 619317, "epoch": 7461} {"train_loss": -28.22376823425293, "global_step": 619318, "epoch": 7461} {"train_loss": -27.954450607299805, "global_step": 619319, "epoch": 7461} {"train_loss": -28.174829483032227, "global_step": 619320, "epoch": 7461} {"train_loss": -28.515583038330078, "global_step": 619321, "epoch": 7461} {"train_loss": -28.086698532104492, "global_step": 619322, "epoch": 7461} {"train_loss": -28.349889755249023, "global_step": 619323, "epoch": 7461} {"train_loss": -27.662511825561523, "global_step": 619324, "epoch": 7461} {"train_loss": -27.932682037353516, "global_step": 619325, "epoch": 7461} {"train_loss": -28.084518432617188, "global_step": 619326, "epoch": 7461} {"train_loss": -27.887191772460938, "global_step": 619327, "epoch": 7461} {"train_loss": -28.004474639892578, "global_step": 619328, "epoch": 7461} {"train_loss": -27.810302734375, "global_step": 619329, "epoch": 7461} {"train_loss": -27.992542266845703, "global_step": 619330, "epoch": 7461} {"train_loss": -28.1939697265625, "global_step": 619331, "epoch": 7461} {"train_loss": -28.310941696166992, "global_step": 619332, "epoch": 7461} {"train_loss": -28.43585205078125, "global_step": 619333, "epoch": 7461} {"train_loss": -27.936737060546875, "global_step": 619334, "epoch": 7461} {"train_loss": -28.149572372436523, "global_step": 619335, "epoch": 7461} {"train_loss": -28.191181182861328, "global_step": 619336, "epoch": 7461} {"train_loss": -28.114887237548828, "global_step": 619337, "epoch": 7461} {"train_loss": -28.327123641967773, "global_step": 619338, "epoch": 7461} {"train_loss": -28.16423988342285, "global_step": 619339, "epoch": 7461} {"train_loss": -28.47100257873535, "global_step": 619340, "epoch": 7461} {"train_loss": -28.46626091003418, "global_step": 619341, "epoch": 7461} {"train_loss": -28.297210693359375, "global_step": 619342, "epoch": 7461} {"train_loss": -28.1396541595459, "global_step": 619343, "epoch": 7461} {"train_loss": -27.9494686126709, "global_step": 619344, "epoch": 7461} {"train_loss": -27.84604532172881, "global_step": 619345, "epoch": 7461, "val_loss": 6705927.0} {"train_loss": -28.476964950561523, "global_step": 619346, "epoch": 7462} {"train_loss": -27.79737663269043, "global_step": 619347, "epoch": 7462} {"train_loss": -27.971418380737305, "global_step": 619348, "epoch": 7462} {"train_loss": -28.233808517456055, "global_step": 619349, "epoch": 7462} {"train_loss": -28.100799560546875, "global_step": 619350, "epoch": 7462} {"train_loss": -27.576019287109375, "global_step": 619351, "epoch": 7462} {"train_loss": -27.868976593017578, "global_step": 619352, "epoch": 7462} {"train_loss": -28.126150131225586, "global_step": 619353, "epoch": 7462} {"train_loss": -27.9619140625, "global_step": 619354, "epoch": 7462} {"train_loss": -28.161413192749023, "global_step": 619355, "epoch": 7462} {"train_loss": -28.02326011657715, "global_step": 619356, "epoch": 7462} {"train_loss": -27.634389877319336, "global_step": 619357, "epoch": 7462} {"train_loss": -27.982507705688477, "global_step": 619358, "epoch": 7462} {"train_loss": -28.07826042175293, "global_step": 619359, "epoch": 7462} {"train_loss": -27.886022567749023, "global_step": 619360, "epoch": 7462} {"train_loss": -27.6612548828125, "global_step": 619361, "epoch": 7462} {"train_loss": -27.9987850189209, "global_step": 619362, "epoch": 7462} {"train_loss": -27.724445343017578, "global_step": 619363, "epoch": 7462} {"train_loss": -28.116239547729492, "global_step": 619364, "epoch": 7462} {"train_loss": -28.030393600463867, "global_step": 619365, "epoch": 7462} {"train_loss": -28.051244735717773, "global_step": 619366, "epoch": 7462} {"train_loss": -27.931976318359375, "global_step": 619367, "epoch": 7462} {"train_loss": -28.338581085205078, "global_step": 619368, "epoch": 7462} {"train_loss": -27.714221954345703, "global_step": 619369, "epoch": 7462} {"train_loss": -27.89105796813965, "global_step": 619370, "epoch": 7462} {"train_loss": -27.85013771057129, "global_step": 619371, "epoch": 7462} {"train_loss": -27.997455596923828, "global_step": 619372, "epoch": 7462} {"train_loss": -27.960973739624023, "global_step": 619373, "epoch": 7462} {"train_loss": -28.235132217407227, "global_step": 619374, "epoch": 7462} {"train_loss": -28.108823776245117, "global_step": 619375, "epoch": 7462} {"train_loss": -28.264129638671875, "global_step": 619376, "epoch": 7462} {"train_loss": -28.256046295166016, "global_step": 619377, "epoch": 7462} {"train_loss": -28.154932022094727, "global_step": 619378, "epoch": 7462} {"train_loss": -28.195493698120117, "global_step": 619379, "epoch": 7462} {"train_loss": -28.04987144470215, "global_step": 619380, "epoch": 7462} {"train_loss": -28.265180587768555, "global_step": 619381, "epoch": 7462} {"train_loss": -28.311796188354492, "global_step": 619382, "epoch": 7462} {"train_loss": -28.311176300048828, "global_step": 619383, "epoch": 7462} {"train_loss": -28.285297393798828, "global_step": 619384, "epoch": 7462} {"train_loss": -28.005666732788086, "global_step": 619385, "epoch": 7462} {"train_loss": -28.388092041015625, "global_step": 619386, "epoch": 7462} {"train_loss": -28.122827529907227, "global_step": 619387, "epoch": 7462} {"train_loss": -28.178556442260742, "global_step": 619388, "epoch": 7462} {"train_loss": -27.89103126525879, "global_step": 619389, "epoch": 7462} {"train_loss": -28.363483428955078, "global_step": 619390, "epoch": 7462} {"train_loss": -28.029727935791016, "global_step": 619391, "epoch": 7462} {"train_loss": -27.985754013061523, "global_step": 619392, "epoch": 7462} {"train_loss": -27.986316680908203, "global_step": 619393, "epoch": 7462} {"train_loss": -28.419958114624023, "global_step": 619394, "epoch": 7462} {"train_loss": -28.116315841674805, "global_step": 619395, "epoch": 7462} {"train_loss": -28.466562271118164, "global_step": 619396, "epoch": 7462} {"train_loss": -28.282236099243164, "global_step": 619397, "epoch": 7462} {"train_loss": -27.936237335205078, "global_step": 619398, "epoch": 7462} {"train_loss": -28.46466064453125, "global_step": 619399, "epoch": 7462} {"train_loss": -28.279560089111328, "global_step": 619400, "epoch": 7462} {"train_loss": -28.2484073638916, "global_step": 619401, "epoch": 7462} {"train_loss": -28.706884384155273, "global_step": 619402, "epoch": 7462} {"train_loss": -28.243000030517578, "global_step": 619403, "epoch": 7462} {"train_loss": -28.423969268798828, "global_step": 619404, "epoch": 7462} {"train_loss": -28.268909454345703, "global_step": 619405, "epoch": 7462} {"train_loss": -28.558277130126953, "global_step": 619406, "epoch": 7462} {"train_loss": -28.118122100830078, "global_step": 619407, "epoch": 7462} {"train_loss": -27.7192325592041, "global_step": 619408, "epoch": 7462} {"train_loss": -28.009775161743164, "global_step": 619409, "epoch": 7462} {"train_loss": -28.10629653930664, "global_step": 619410, "epoch": 7462} {"train_loss": -28.424396514892578, "global_step": 619411, "epoch": 7462} {"train_loss": -28.55439567565918, "global_step": 619412, "epoch": 7462} {"train_loss": -27.96144676208496, "global_step": 619413, "epoch": 7462} {"train_loss": -28.197376251220703, "global_step": 619414, "epoch": 7462} {"train_loss": -28.451223373413086, "global_step": 619415, "epoch": 7462} {"train_loss": -27.92336082458496, "global_step": 619416, "epoch": 7462} {"train_loss": -28.00994300842285, "global_step": 619417, "epoch": 7462} {"train_loss": -28.220956802368164, "global_step": 619418, "epoch": 7462} {"train_loss": -28.58516502380371, "global_step": 619419, "epoch": 7462} {"train_loss": -27.711156845092773, "global_step": 619420, "epoch": 7462} {"train_loss": -28.2305965423584, "global_step": 619421, "epoch": 7462} {"train_loss": -27.8980655670166, "global_step": 619422, "epoch": 7462} {"train_loss": -28.250314712524414, "global_step": 619423, "epoch": 7462} {"train_loss": -28.229963302612305, "global_step": 619424, "epoch": 7462} {"train_loss": -28.195419311523438, "global_step": 619425, "epoch": 7462} {"train_loss": -28.182342529296875, "global_step": 619426, "epoch": 7462} {"train_loss": -28.003747940063477, "global_step": 619427, "epoch": 7462} {"train_loss": -28.116931478661225, "global_step": 619428, "epoch": 7462, "val_loss": 6684162.0} {"train_loss": -28.242826461791992, "global_step": 619429, "epoch": 7463} {"train_loss": -27.512069702148438, "global_step": 619430, "epoch": 7463} {"train_loss": -26.722858428955078, "global_step": 619431, "epoch": 7463} {"train_loss": -26.951934814453125, "global_step": 619432, "epoch": 7463} {"train_loss": -27.884510040283203, "global_step": 619433, "epoch": 7463} {"train_loss": -27.524738311767578, "global_step": 619434, "epoch": 7463} {"train_loss": -27.400421142578125, "global_step": 619435, "epoch": 7463} {"train_loss": -28.0365047454834, "global_step": 619436, "epoch": 7463} {"train_loss": -27.808454513549805, "global_step": 619437, "epoch": 7463} {"train_loss": -27.934309005737305, "global_step": 619438, "epoch": 7463} {"train_loss": -27.735563278198242, "global_step": 619439, "epoch": 7463} {"train_loss": -27.891021728515625, "global_step": 619440, "epoch": 7463} {"train_loss": -27.94915771484375, "global_step": 619441, "epoch": 7463} {"train_loss": -28.0538330078125, "global_step": 619442, "epoch": 7463} {"train_loss": -28.0843505859375, "global_step": 619443, "epoch": 7463} {"train_loss": -28.081281661987305, "global_step": 619444, "epoch": 7463} {"train_loss": -28.03521728515625, "global_step": 619445, "epoch": 7463} {"train_loss": -28.049991607666016, "global_step": 619446, "epoch": 7463} {"train_loss": -28.2908992767334, "global_step": 619447, "epoch": 7463} {"train_loss": -27.7347412109375, "global_step": 619448, "epoch": 7463} {"train_loss": -28.047704696655273, "global_step": 619449, "epoch": 7463} {"train_loss": -28.11358642578125, "global_step": 619450, "epoch": 7463} {"train_loss": -28.068815231323242, "global_step": 619451, "epoch": 7463} {"train_loss": -27.990209579467773, "global_step": 619452, "epoch": 7463} {"train_loss": -28.113988876342773, "global_step": 619453, "epoch": 7463} {"train_loss": -28.42119789123535, "global_step": 619454, "epoch": 7463} {"train_loss": -28.29621696472168, "global_step": 619455, "epoch": 7463} {"train_loss": -27.677536010742188, "global_step": 619456, "epoch": 7463} {"train_loss": -28.15927505493164, "global_step": 619457, "epoch": 7463} {"train_loss": -28.395999908447266, "global_step": 619458, "epoch": 7463} {"train_loss": -28.126264572143555, "global_step": 619459, "epoch": 7463} {"train_loss": -28.002546310424805, "global_step": 619460, "epoch": 7463} {"train_loss": -28.34499168395996, "global_step": 619461, "epoch": 7463} {"train_loss": -27.94696044921875, "global_step": 619462, "epoch": 7463} {"train_loss": -28.359329223632812, "global_step": 619463, "epoch": 7463} {"train_loss": -27.988157272338867, "global_step": 619464, "epoch": 7463} {"train_loss": -28.798452377319336, "global_step": 619465, "epoch": 7463} {"train_loss": -28.537433624267578, "global_step": 619466, "epoch": 7463} {"train_loss": -28.107290267944336, "global_step": 619467, "epoch": 7463} {"train_loss": -28.288721084594727, "global_step": 619468, "epoch": 7463} {"train_loss": -28.470319747924805, "global_step": 619469, "epoch": 7463} {"train_loss": -28.05219078063965, "global_step": 619470, "epoch": 7463} {"train_loss": -28.21882438659668, "global_step": 619471, "epoch": 7463} {"train_loss": -27.76967430114746, "global_step": 619472, "epoch": 7463} {"train_loss": -28.029876708984375, "global_step": 619473, "epoch": 7463} {"train_loss": -28.05739402770996, "global_step": 619474, "epoch": 7463} {"train_loss": -27.83649253845215, "global_step": 619475, "epoch": 7463} {"train_loss": -28.24500846862793, "global_step": 619476, "epoch": 7463} {"train_loss": -28.309179306030273, "global_step": 619477, "epoch": 7463} {"train_loss": -28.51839256286621, "global_step": 619478, "epoch": 7463} {"train_loss": -27.777267456054688, "global_step": 619479, "epoch": 7463} {"train_loss": -28.02674674987793, "global_step": 619480, "epoch": 7463} {"train_loss": -28.173871994018555, "global_step": 619481, "epoch": 7463} {"train_loss": -28.3641300201416, "global_step": 619482, "epoch": 7463} {"train_loss": -28.208017349243164, "global_step": 619483, "epoch": 7463} {"train_loss": -28.237211227416992, "global_step": 619484, "epoch": 7463} {"train_loss": -28.15082359313965, "global_step": 619485, "epoch": 7463} {"train_loss": -28.24024772644043, "global_step": 619486, "epoch": 7463} {"train_loss": -27.815576553344727, "global_step": 619487, "epoch": 7463} {"train_loss": -28.258071899414062, "global_step": 619488, "epoch": 7463} {"train_loss": -28.293500900268555, "global_step": 619489, "epoch": 7463} {"train_loss": -27.977354049682617, "global_step": 619490, "epoch": 7463} {"train_loss": -28.3399715423584, "global_step": 619491, "epoch": 7463} {"train_loss": -27.985925674438477, "global_step": 619492, "epoch": 7463} {"train_loss": -28.0761775970459, "global_step": 619493, "epoch": 7463} {"train_loss": -28.2852840423584, "global_step": 619494, "epoch": 7463} {"train_loss": -28.361434936523438, "global_step": 619495, "epoch": 7463} {"train_loss": -27.8781795501709, "global_step": 619496, "epoch": 7463} {"train_loss": -28.13516616821289, "global_step": 619497, "epoch": 7463} {"train_loss": -28.41001319885254, "global_step": 619498, "epoch": 7463} {"train_loss": -27.880895614624023, "global_step": 619499, "epoch": 7463} {"train_loss": -27.580291748046875, "global_step": 619500, "epoch": 7463} {"train_loss": -27.724939346313477, "global_step": 619501, "epoch": 7463} {"train_loss": -27.33750343322754, "global_step": 619502, "epoch": 7463} {"train_loss": -27.758819580078125, "global_step": 619503, "epoch": 7463} {"train_loss": -28.06264305114746, "global_step": 619504, "epoch": 7463} {"train_loss": -28.017377853393555, "global_step": 619505, "epoch": 7463} {"train_loss": -28.24793815612793, "global_step": 619506, "epoch": 7463} {"train_loss": -28.332061767578125, "global_step": 619507, "epoch": 7463} {"train_loss": -27.972726821899414, "global_step": 619508, "epoch": 7463} {"train_loss": -27.761856079101562, "global_step": 619509, "epoch": 7463} {"train_loss": -28.267805099487305, "global_step": 619510, "epoch": 7463} {"train_loss": -28.028503211147815, "global_step": 619511, "epoch": 7463, "val_loss": 6725548.5} {"train_loss": -27.224225997924805, "global_step": 619512, "epoch": 7464} {"train_loss": -27.14466667175293, "global_step": 619513, "epoch": 7464} {"train_loss": -27.5748348236084, "global_step": 619514, "epoch": 7464} {"train_loss": -27.112640380859375, "global_step": 619515, "epoch": 7464} {"train_loss": -27.51299476623535, "global_step": 619516, "epoch": 7464} {"train_loss": -27.260473251342773, "global_step": 619517, "epoch": 7464} {"train_loss": -26.946975708007812, "global_step": 619518, "epoch": 7464} {"train_loss": -26.9853515625, "global_step": 619519, "epoch": 7464} {"train_loss": -26.859594345092773, "global_step": 619520, "epoch": 7464} {"train_loss": -27.42146110534668, "global_step": 619521, "epoch": 7464} {"train_loss": -27.455759048461914, "global_step": 619522, "epoch": 7464} {"train_loss": -27.516712188720703, "global_step": 619523, "epoch": 7464} {"train_loss": -27.62775993347168, "global_step": 619524, "epoch": 7464} {"train_loss": -27.48040199279785, "global_step": 619525, "epoch": 7464} {"train_loss": -27.71039390563965, "global_step": 619526, "epoch": 7464} {"train_loss": -27.945556640625, "global_step": 619527, "epoch": 7464} {"train_loss": -27.748579025268555, "global_step": 619528, "epoch": 7464} {"train_loss": -27.41083335876465, "global_step": 619529, "epoch": 7464} {"train_loss": -27.88250160217285, "global_step": 619530, "epoch": 7464} {"train_loss": -27.756683349609375, "global_step": 619531, "epoch": 7464} {"train_loss": -27.70465660095215, "global_step": 619532, "epoch": 7464} {"train_loss": -27.95330810546875, "global_step": 619533, "epoch": 7464} {"train_loss": -27.729734420776367, "global_step": 619534, "epoch": 7464} {"train_loss": -28.015735626220703, "global_step": 619535, "epoch": 7464} {"train_loss": -28.063879013061523, "global_step": 619536, "epoch": 7464} {"train_loss": -28.237751007080078, "global_step": 619537, "epoch": 7464} {"train_loss": -28.045705795288086, "global_step": 619538, "epoch": 7464} {"train_loss": -28.131824493408203, "global_step": 619539, "epoch": 7464} {"train_loss": -28.102502822875977, "global_step": 619540, "epoch": 7464} {"train_loss": -28.547977447509766, "global_step": 619541, "epoch": 7464} {"train_loss": -28.012592315673828, "global_step": 619542, "epoch": 7464} {"train_loss": -27.889392852783203, "global_step": 619543, "epoch": 7464} {"train_loss": -28.210845947265625, "global_step": 619544, "epoch": 7464} {"train_loss": -28.160696029663086, "global_step": 619545, "epoch": 7464} {"train_loss": -28.244510650634766, "global_step": 619546, "epoch": 7464} {"train_loss": -28.1716365814209, "global_step": 619547, "epoch": 7464} {"train_loss": -28.05810546875, "global_step": 619548, "epoch": 7464} {"train_loss": -28.281843185424805, "global_step": 619549, "epoch": 7464} {"train_loss": -28.271163940429688, "global_step": 619550, "epoch": 7464} {"train_loss": -28.270572662353516, "global_step": 619551, "epoch": 7464} {"train_loss": -28.350509643554688, "global_step": 619552, "epoch": 7464} {"train_loss": -28.29046630859375, "global_step": 619553, "epoch": 7464} {"train_loss": -28.117074966430664, "global_step": 619554, "epoch": 7464} {"train_loss": -28.12420654296875, "global_step": 619555, "epoch": 7464} {"train_loss": -28.408849716186523, "global_step": 619556, "epoch": 7464} {"train_loss": -28.512496948242188, "global_step": 619557, "epoch": 7464} {"train_loss": -27.81403923034668, "global_step": 619558, "epoch": 7464} {"train_loss": -28.276166915893555, "global_step": 619559, "epoch": 7464} {"train_loss": -28.318470001220703, "global_step": 619560, "epoch": 7464} {"train_loss": -28.32375144958496, "global_step": 619561, "epoch": 7464} {"train_loss": -28.239355087280273, "global_step": 619562, "epoch": 7464} {"train_loss": -27.770437240600586, "global_step": 619563, "epoch": 7464} {"train_loss": -28.420318603515625, "global_step": 619564, "epoch": 7464} {"train_loss": -28.245758056640625, "global_step": 619565, "epoch": 7464} {"train_loss": -27.807891845703125, "global_step": 619566, "epoch": 7464} {"train_loss": -28.254886627197266, "global_step": 619567, "epoch": 7464} {"train_loss": -28.18190574645996, "global_step": 619568, "epoch": 7464} {"train_loss": -28.37932777404785, "global_step": 619569, "epoch": 7464} {"train_loss": -28.446197509765625, "global_step": 619570, "epoch": 7464} {"train_loss": -28.41900634765625, "global_step": 619571, "epoch": 7464} {"train_loss": -27.9348201751709, "global_step": 619572, "epoch": 7464} {"train_loss": -27.98126792907715, "global_step": 619573, "epoch": 7464} {"train_loss": -28.10541343688965, "global_step": 619574, "epoch": 7464} {"train_loss": -28.256006240844727, "global_step": 619575, "epoch": 7464} {"train_loss": -28.524280548095703, "global_step": 619576, "epoch": 7464} {"train_loss": -28.286230087280273, "global_step": 619577, "epoch": 7464} {"train_loss": -27.944046020507812, "global_step": 619578, "epoch": 7464} {"train_loss": -27.770963668823242, "global_step": 619579, "epoch": 7464} {"train_loss": -28.52886962890625, "global_step": 619580, "epoch": 7464} {"train_loss": -28.11972427368164, "global_step": 619581, "epoch": 7464} {"train_loss": -27.812274932861328, "global_step": 619582, "epoch": 7464} {"train_loss": -27.99677848815918, "global_step": 619583, "epoch": 7464} {"train_loss": -28.017444610595703, "global_step": 619584, "epoch": 7464} {"train_loss": -27.669940948486328, "global_step": 619585, "epoch": 7464} {"train_loss": -27.698841094970703, "global_step": 619586, "epoch": 7464} {"train_loss": -27.991682052612305, "global_step": 619587, "epoch": 7464} {"train_loss": -28.20306396484375, "global_step": 619588, "epoch": 7464} {"train_loss": -27.801496505737305, "global_step": 619589, "epoch": 7464} {"train_loss": -27.88446617126465, "global_step": 619590, "epoch": 7464} {"train_loss": -27.95901870727539, "global_step": 619591, "epoch": 7464} {"train_loss": -27.743284225463867, "global_step": 619592, "epoch": 7464} {"train_loss": -27.922555923461914, "global_step": 619593, "epoch": 7464} {"train_loss": -27.968737981405603, "global_step": 619594, "epoch": 7464, "val_loss": 6680143.5} {"train_loss": -26.496902465820312, "global_step": 619595, "epoch": 7465} {"train_loss": -27.219104766845703, "global_step": 619596, "epoch": 7465} {"train_loss": -27.796539306640625, "global_step": 619597, "epoch": 7465} {"train_loss": -26.970951080322266, "global_step": 619598, "epoch": 7465} {"train_loss": -27.787311553955078, "global_step": 619599, "epoch": 7465} {"train_loss": -27.787200927734375, "global_step": 619600, "epoch": 7465} {"train_loss": -27.73335838317871, "global_step": 619601, "epoch": 7465} {"train_loss": -27.641342163085938, "global_step": 619602, "epoch": 7465} {"train_loss": -27.56727409362793, "global_step": 619603, "epoch": 7465} {"train_loss": -27.858123779296875, "global_step": 619604, "epoch": 7465} {"train_loss": -27.604177474975586, "global_step": 619605, "epoch": 7465} {"train_loss": -27.631696701049805, "global_step": 619606, "epoch": 7465} {"train_loss": -27.70448112487793, "global_step": 619607, "epoch": 7465} {"train_loss": -27.821796417236328, "global_step": 619608, "epoch": 7465} {"train_loss": -27.831945419311523, "global_step": 619609, "epoch": 7465} {"train_loss": -27.556659698486328, "global_step": 619610, "epoch": 7465} {"train_loss": -27.722564697265625, "global_step": 619611, "epoch": 7465} {"train_loss": -27.63671875, "global_step": 619612, "epoch": 7465} {"train_loss": -27.890125274658203, "global_step": 619613, "epoch": 7465} {"train_loss": -27.792591094970703, "global_step": 619614, "epoch": 7465} {"train_loss": -27.691761016845703, "global_step": 619615, "epoch": 7465} {"train_loss": -28.0341796875, "global_step": 619616, "epoch": 7465} {"train_loss": -28.0650634765625, "global_step": 619617, "epoch": 7465} {"train_loss": -28.025739669799805, "global_step": 619618, "epoch": 7465} {"train_loss": -27.897735595703125, "global_step": 619619, "epoch": 7465} {"train_loss": -27.799299240112305, "global_step": 619620, "epoch": 7465} {"train_loss": -27.8055477142334, "global_step": 619621, "epoch": 7465} {"train_loss": -28.025897979736328, "global_step": 619622, "epoch": 7465} {"train_loss": -28.081327438354492, "global_step": 619623, "epoch": 7465} {"train_loss": -27.935028076171875, "global_step": 619624, "epoch": 7465} {"train_loss": -28.023853302001953, "global_step": 619625, "epoch": 7465} {"train_loss": -27.994897842407227, "global_step": 619626, "epoch": 7465} {"train_loss": -28.204761505126953, "global_step": 619627, "epoch": 7465} {"train_loss": -28.17461585998535, "global_step": 619628, "epoch": 7465} {"train_loss": -28.193012237548828, "global_step": 619629, "epoch": 7465} {"train_loss": -27.847305297851562, "global_step": 619630, "epoch": 7465} {"train_loss": -28.064178466796875, "global_step": 619631, "epoch": 7465} {"train_loss": -28.44704246520996, "global_step": 619632, "epoch": 7465} {"train_loss": -28.174610137939453, "global_step": 619633, "epoch": 7465} {"train_loss": -27.953357696533203, "global_step": 619634, "epoch": 7465} {"train_loss": -28.291458129882812, "global_step": 619635, "epoch": 7465} {"train_loss": -27.965362548828125, "global_step": 619636, "epoch": 7465} {"train_loss": -28.602558135986328, "global_step": 619637, "epoch": 7465} {"train_loss": -27.921472549438477, "global_step": 619638, "epoch": 7465} {"train_loss": -28.389572143554688, "global_step": 619639, "epoch": 7465} {"train_loss": -27.94610595703125, "global_step": 619640, "epoch": 7465} {"train_loss": -28.383031845092773, "global_step": 619641, "epoch": 7465} {"train_loss": -27.939783096313477, "global_step": 619642, "epoch": 7465} {"train_loss": -28.175405502319336, "global_step": 619643, "epoch": 7465} {"train_loss": -27.936325073242188, "global_step": 619644, "epoch": 7465} {"train_loss": -27.536605834960938, "global_step": 619645, "epoch": 7465} {"train_loss": -27.915067672729492, "global_step": 619646, "epoch": 7465} {"train_loss": -27.591360092163086, "global_step": 619647, "epoch": 7465} {"train_loss": -27.872053146362305, "global_step": 619648, "epoch": 7465} {"train_loss": -28.206892013549805, "global_step": 619649, "epoch": 7465} {"train_loss": -27.654804229736328, "global_step": 619650, "epoch": 7465} {"train_loss": -28.118371963500977, "global_step": 619651, "epoch": 7465} {"train_loss": -28.23103904724121, "global_step": 619652, "epoch": 7465} {"train_loss": -27.445114135742188, "global_step": 619653, "epoch": 7465} {"train_loss": -27.981494903564453, "global_step": 619654, "epoch": 7465} {"train_loss": -28.208051681518555, "global_step": 619655, "epoch": 7465} {"train_loss": -28.04041862487793, "global_step": 619656, "epoch": 7465} {"train_loss": -28.09327507019043, "global_step": 619657, "epoch": 7465} {"train_loss": -28.126544952392578, "global_step": 619658, "epoch": 7465} {"train_loss": -28.127248764038086, "global_step": 619659, "epoch": 7465} {"train_loss": -27.64179801940918, "global_step": 619660, "epoch": 7465} {"train_loss": -28.079425811767578, "global_step": 619661, "epoch": 7465} {"train_loss": -28.08929443359375, "global_step": 619662, "epoch": 7465} {"train_loss": -28.157901763916016, "global_step": 619663, "epoch": 7465} {"train_loss": -27.679967880249023, "global_step": 619664, "epoch": 7465} {"train_loss": -28.431320190429688, "global_step": 619665, "epoch": 7465} {"train_loss": -27.900320053100586, "global_step": 619666, "epoch": 7465} {"train_loss": -27.710437774658203, "global_step": 619667, "epoch": 7465} {"train_loss": -27.483509063720703, "global_step": 619668, "epoch": 7465} {"train_loss": -27.771991729736328, "global_step": 619669, "epoch": 7465} {"train_loss": -28.218219757080078, "global_step": 619670, "epoch": 7465} {"train_loss": -27.772275924682617, "global_step": 619671, "epoch": 7465} {"train_loss": -27.983936309814453, "global_step": 619672, "epoch": 7465} {"train_loss": -28.2065486907959, "global_step": 619673, "epoch": 7465} {"train_loss": -28.090961456298828, "global_step": 619674, "epoch": 7465} {"train_loss": -28.09638023376465, "global_step": 619675, "epoch": 7465} {"train_loss": -28.310638427734375, "global_step": 619676, "epoch": 7465} {"train_loss": -27.90038129507777, "global_step": 619677, "epoch": 7465, "val_loss": 6653637.0} {"train_loss": -27.68973159790039, "global_step": 619678, "epoch": 7466} {"train_loss": -28.02604103088379, "global_step": 619679, "epoch": 7466} {"train_loss": -28.000965118408203, "global_step": 619680, "epoch": 7466} {"train_loss": -27.58430290222168, "global_step": 619681, "epoch": 7466} {"train_loss": -27.44793128967285, "global_step": 619682, "epoch": 7466} {"train_loss": -27.7825870513916, "global_step": 619683, "epoch": 7466} {"train_loss": -27.677642822265625, "global_step": 619684, "epoch": 7466} {"train_loss": -28.19524574279785, "global_step": 619685, "epoch": 7466} {"train_loss": -27.919757843017578, "global_step": 619686, "epoch": 7466} {"train_loss": -27.942167282104492, "global_step": 619687, "epoch": 7466} {"train_loss": -27.635650634765625, "global_step": 619688, "epoch": 7466} {"train_loss": -27.656890869140625, "global_step": 619689, "epoch": 7466} {"train_loss": -27.77182960510254, "global_step": 619690, "epoch": 7466} {"train_loss": -27.927595138549805, "global_step": 619691, "epoch": 7466} {"train_loss": -27.655527114868164, "global_step": 619692, "epoch": 7466} {"train_loss": -27.932952880859375, "global_step": 619693, "epoch": 7466} {"train_loss": -27.610198974609375, "global_step": 619694, "epoch": 7466} {"train_loss": -28.153532028198242, "global_step": 619695, "epoch": 7466} {"train_loss": -27.92866325378418, "global_step": 619696, "epoch": 7466} {"train_loss": -27.88837242126465, "global_step": 619697, "epoch": 7466} {"train_loss": -27.95415687561035, "global_step": 619698, "epoch": 7466} {"train_loss": -27.784635543823242, "global_step": 619699, "epoch": 7466} {"train_loss": -28.310667037963867, "global_step": 619700, "epoch": 7466} {"train_loss": -27.85972023010254, "global_step": 619701, "epoch": 7466} {"train_loss": -27.4423885345459, "global_step": 619702, "epoch": 7466} {"train_loss": -27.97379493713379, "global_step": 619703, "epoch": 7466} {"train_loss": -27.76788902282715, "global_step": 619704, "epoch": 7466} {"train_loss": -27.773725509643555, "global_step": 619705, "epoch": 7466} {"train_loss": -28.05704116821289, "global_step": 619706, "epoch": 7466} {"train_loss": -27.7536678314209, "global_step": 619707, "epoch": 7466} {"train_loss": -28.104354858398438, "global_step": 619708, "epoch": 7466} {"train_loss": -28.052555084228516, "global_step": 619709, "epoch": 7466} {"train_loss": -27.865234375, "global_step": 619710, "epoch": 7466} {"train_loss": -27.578277587890625, "global_step": 619711, "epoch": 7466} {"train_loss": -27.423120498657227, "global_step": 619712, "epoch": 7466} {"train_loss": -27.765182495117188, "global_step": 619713, "epoch": 7466} {"train_loss": -28.502634048461914, "global_step": 619714, "epoch": 7466} {"train_loss": -28.143878936767578, "global_step": 619715, "epoch": 7466} {"train_loss": -28.057966232299805, "global_step": 619716, "epoch": 7466} {"train_loss": -27.898130416870117, "global_step": 619717, "epoch": 7466} {"train_loss": -27.868621826171875, "global_step": 619718, "epoch": 7466} {"train_loss": -28.12860679626465, "global_step": 619719, "epoch": 7466} {"train_loss": -28.038818359375, "global_step": 619720, "epoch": 7466} {"train_loss": -28.19775390625, "global_step": 619721, "epoch": 7466} {"train_loss": -27.697162628173828, "global_step": 619722, "epoch": 7466} {"train_loss": -28.26254653930664, "global_step": 619723, "epoch": 7466} {"train_loss": -28.1726016998291, "global_step": 619724, "epoch": 7466} {"train_loss": -27.97481346130371, "global_step": 619725, "epoch": 7466} {"train_loss": -27.898944854736328, "global_step": 619726, "epoch": 7466} {"train_loss": -28.047483444213867, "global_step": 619727, "epoch": 7466} {"train_loss": -28.323368072509766, "global_step": 619728, "epoch": 7466} {"train_loss": -28.40827751159668, "global_step": 619729, "epoch": 7466} {"train_loss": -28.161840438842773, "global_step": 619730, "epoch": 7466} {"train_loss": -28.21821403503418, "global_step": 619731, "epoch": 7466} {"train_loss": -28.550628662109375, "global_step": 619732, "epoch": 7466} {"train_loss": -28.114166259765625, "global_step": 619733, "epoch": 7466} {"train_loss": -28.267578125, "global_step": 619734, "epoch": 7466} {"train_loss": -27.400711059570312, "global_step": 619735, "epoch": 7466} {"train_loss": -28.241683959960938, "global_step": 619736, "epoch": 7466} {"train_loss": -28.11463737487793, "global_step": 619737, "epoch": 7466} {"train_loss": -27.949188232421875, "global_step": 619738, "epoch": 7466} {"train_loss": -27.999103546142578, "global_step": 619739, "epoch": 7466} {"train_loss": -27.87444496154785, "global_step": 619740, "epoch": 7466} {"train_loss": -28.377456665039062, "global_step": 619741, "epoch": 7466} {"train_loss": -28.126178741455078, "global_step": 619742, "epoch": 7466} {"train_loss": -27.905914306640625, "global_step": 619743, "epoch": 7466} {"train_loss": -27.961563110351562, "global_step": 619744, "epoch": 7466} {"train_loss": -27.755361557006836, "global_step": 619745, "epoch": 7466} {"train_loss": -27.931127548217773, "global_step": 619746, "epoch": 7466} {"train_loss": -28.0822811126709, "global_step": 619747, "epoch": 7466} {"train_loss": -28.124698638916016, "global_step": 619748, "epoch": 7466} {"train_loss": -28.257307052612305, "global_step": 619749, "epoch": 7466} {"train_loss": -28.369470596313477, "global_step": 619750, "epoch": 7466} {"train_loss": -28.156747817993164, "global_step": 619751, "epoch": 7466} {"train_loss": -28.501245498657227, "global_step": 619752, "epoch": 7466} {"train_loss": -28.162240982055664, "global_step": 619753, "epoch": 7466} {"train_loss": -28.302143096923828, "global_step": 619754, "epoch": 7466} {"train_loss": -27.837793350219727, "global_step": 619755, "epoch": 7466} {"train_loss": -28.46111488342285, "global_step": 619756, "epoch": 7466} {"train_loss": -28.427778244018555, "global_step": 619757, "epoch": 7466} {"train_loss": -27.99896812438965, "global_step": 619758, "epoch": 7466} {"train_loss": -28.337839126586914, "global_step": 619759, "epoch": 7466} {"train_loss": -28.00466813236834, "global_step": 619760, "epoch": 7466, "val_loss": 6622563.5} {"train_loss": -27.584674835205078, "global_step": 619761, "epoch": 7467} {"train_loss": -27.11407470703125, "global_step": 619762, "epoch": 7467} {"train_loss": -27.611530303955078, "global_step": 619763, "epoch": 7467} {"train_loss": -27.390005111694336, "global_step": 619764, "epoch": 7467} {"train_loss": -27.9010009765625, "global_step": 619765, "epoch": 7467} {"train_loss": -27.91525650024414, "global_step": 619766, "epoch": 7467} {"train_loss": -27.509912490844727, "global_step": 619767, "epoch": 7467} {"train_loss": -27.409650802612305, "global_step": 619768, "epoch": 7467} {"train_loss": -27.440717697143555, "global_step": 619769, "epoch": 7467} {"train_loss": -27.9788761138916, "global_step": 619770, "epoch": 7467} {"train_loss": -28.144489288330078, "global_step": 619771, "epoch": 7467} {"train_loss": -27.660375595092773, "global_step": 619772, "epoch": 7467} {"train_loss": -27.717924118041992, "global_step": 619773, "epoch": 7467} {"train_loss": -27.386632919311523, "global_step": 619774, "epoch": 7467} {"train_loss": -28.149921417236328, "global_step": 619775, "epoch": 7467} {"train_loss": -28.186201095581055, "global_step": 619776, "epoch": 7467} {"train_loss": -28.132251739501953, "global_step": 619777, "epoch": 7467} {"train_loss": -27.91437339782715, "global_step": 619778, "epoch": 7467} {"train_loss": -27.946847915649414, "global_step": 619779, "epoch": 7467} {"train_loss": -28.270172119140625, "global_step": 619780, "epoch": 7467} {"train_loss": -28.22279930114746, "global_step": 619781, "epoch": 7467} {"train_loss": -28.299823760986328, "global_step": 619782, "epoch": 7467} {"train_loss": -27.976699829101562, "global_step": 619783, "epoch": 7467} {"train_loss": -28.146154403686523, "global_step": 619784, "epoch": 7467} {"train_loss": -28.265613555908203, "global_step": 619785, "epoch": 7467} {"train_loss": -28.347064971923828, "global_step": 619786, "epoch": 7467} {"train_loss": -28.210859298706055, "global_step": 619787, "epoch": 7467} {"train_loss": -28.7594051361084, "global_step": 619788, "epoch": 7467} {"train_loss": -28.006900787353516, "global_step": 619789, "epoch": 7467} {"train_loss": -28.27237892150879, "global_step": 619790, "epoch": 7467} {"train_loss": -28.144262313842773, "global_step": 619791, "epoch": 7467} {"train_loss": -28.564416885375977, "global_step": 619792, "epoch": 7467} {"train_loss": -28.373260498046875, "global_step": 619793, "epoch": 7467} {"train_loss": -28.42034912109375, "global_step": 619794, "epoch": 7467} {"train_loss": -28.174896240234375, "global_step": 619795, "epoch": 7467} {"train_loss": -28.78339195251465, "global_step": 619796, "epoch": 7467} {"train_loss": -28.2746639251709, "global_step": 619797, "epoch": 7467} {"train_loss": -28.330432891845703, "global_step": 619798, "epoch": 7467} {"train_loss": -28.172657012939453, "global_step": 619799, "epoch": 7467} {"train_loss": -28.26675796508789, "global_step": 619800, "epoch": 7467} {"train_loss": -28.71234703063965, "global_step": 619801, "epoch": 7467} {"train_loss": -28.330291748046875, "global_step": 619802, "epoch": 7467} {"train_loss": -27.990558624267578, "global_step": 619803, "epoch": 7467} {"train_loss": -28.103565216064453, "global_step": 619804, "epoch": 7467} {"train_loss": -28.359607696533203, "global_step": 619805, "epoch": 7467} {"train_loss": -28.4177303314209, "global_step": 619806, "epoch": 7467} {"train_loss": -28.15537452697754, "global_step": 619807, "epoch": 7467} {"train_loss": -28.073026657104492, "global_step": 619808, "epoch": 7467} {"train_loss": -28.093427658081055, "global_step": 619809, "epoch": 7467} {"train_loss": -28.09671401977539, "global_step": 619810, "epoch": 7467} {"train_loss": -28.27117919921875, "global_step": 619811, "epoch": 7467} {"train_loss": -28.341962814331055, "global_step": 619812, "epoch": 7467} {"train_loss": -28.39692497253418, "global_step": 619813, "epoch": 7467} {"train_loss": -28.42841148376465, "global_step": 619814, "epoch": 7467} {"train_loss": -28.016864776611328, "global_step": 619815, "epoch": 7467} {"train_loss": -28.016468048095703, "global_step": 619816, "epoch": 7467} {"train_loss": -28.095199584960938, "global_step": 619817, "epoch": 7467} {"train_loss": -27.847742080688477, "global_step": 619818, "epoch": 7467} {"train_loss": -27.510395050048828, "global_step": 619819, "epoch": 7467} {"train_loss": -27.838977813720703, "global_step": 619820, "epoch": 7467} {"train_loss": -28.0601863861084, "global_step": 619821, "epoch": 7467} {"train_loss": -28.04365348815918, "global_step": 619822, "epoch": 7467} {"train_loss": -28.072111129760742, "global_step": 619823, "epoch": 7467} {"train_loss": -27.69257164001465, "global_step": 619824, "epoch": 7467} {"train_loss": -27.650226593017578, "global_step": 619825, "epoch": 7467} {"train_loss": -27.783533096313477, "global_step": 619826, "epoch": 7467} {"train_loss": -27.783246994018555, "global_step": 619827, "epoch": 7467} {"train_loss": -27.93891716003418, "global_step": 619828, "epoch": 7467} {"train_loss": -27.751174926757812, "global_step": 619829, "epoch": 7467} {"train_loss": -28.105146408081055, "global_step": 619830, "epoch": 7467} {"train_loss": -28.0203914642334, "global_step": 619831, "epoch": 7467} {"train_loss": -27.693408966064453, "global_step": 619832, "epoch": 7467} {"train_loss": -28.224716186523438, "global_step": 619833, "epoch": 7467} {"train_loss": -27.627832412719727, "global_step": 619834, "epoch": 7467} {"train_loss": -27.9082088470459, "global_step": 619835, "epoch": 7467} {"train_loss": -27.801055908203125, "global_step": 619836, "epoch": 7467} {"train_loss": -27.704984664916992, "global_step": 619837, "epoch": 7467} {"train_loss": -28.129453659057617, "global_step": 619838, "epoch": 7467} {"train_loss": -27.975513458251953, "global_step": 619839, "epoch": 7467} {"train_loss": -27.821136474609375, "global_step": 619840, "epoch": 7467} {"train_loss": -27.593643188476562, "global_step": 619841, "epoch": 7467} {"train_loss": -27.69778823852539, "global_step": 619842, "epoch": 7467} {"train_loss": -28.017995236867883, "global_step": 619843, "epoch": 7467, "val_loss": 6586026.5} {"train_loss": -27.33283805847168, "global_step": 619844, "epoch": 7468} {"train_loss": -27.77010154724121, "global_step": 619845, "epoch": 7468} {"train_loss": -27.583017349243164, "global_step": 619846, "epoch": 7468} {"train_loss": -27.72525978088379, "global_step": 619847, "epoch": 7468} {"train_loss": -27.136051177978516, "global_step": 619848, "epoch": 7468} {"train_loss": -27.61115837097168, "global_step": 619849, "epoch": 7468} {"train_loss": -28.039350509643555, "global_step": 619850, "epoch": 7468} {"train_loss": -27.793310165405273, "global_step": 619851, "epoch": 7468} {"train_loss": -27.789947509765625, "global_step": 619852, "epoch": 7468} {"train_loss": -27.91242790222168, "global_step": 619853, "epoch": 7468} {"train_loss": -27.518712997436523, "global_step": 619854, "epoch": 7468} {"train_loss": -27.393890380859375, "global_step": 619855, "epoch": 7468} {"train_loss": -28.02493667602539, "global_step": 619856, "epoch": 7468} {"train_loss": -27.544570922851562, "global_step": 619857, "epoch": 7468} {"train_loss": -28.09406089782715, "global_step": 619858, "epoch": 7468} {"train_loss": -27.8184757232666, "global_step": 619859, "epoch": 7468} {"train_loss": -27.82254981994629, "global_step": 619860, "epoch": 7468} {"train_loss": -28.126184463500977, "global_step": 619861, "epoch": 7468} {"train_loss": -27.761402130126953, "global_step": 619862, "epoch": 7468} {"train_loss": -28.08050537109375, "global_step": 619863, "epoch": 7468} {"train_loss": -27.717166900634766, "global_step": 619864, "epoch": 7468} {"train_loss": -27.71476173400879, "global_step": 619865, "epoch": 7468} {"train_loss": -27.966018676757812, "global_step": 619866, "epoch": 7468} {"train_loss": -27.86639404296875, "global_step": 619867, "epoch": 7468} {"train_loss": -27.711835861206055, "global_step": 619868, "epoch": 7468} {"train_loss": -28.037317276000977, "global_step": 619869, "epoch": 7468} {"train_loss": -27.988378524780273, "global_step": 619870, "epoch": 7468} {"train_loss": -28.154035568237305, "global_step": 619871, "epoch": 7468} {"train_loss": -28.13392448425293, "global_step": 619872, "epoch": 7468} {"train_loss": -27.90673828125, "global_step": 619873, "epoch": 7468} {"train_loss": -27.91572380065918, "global_step": 619874, "epoch": 7468} {"train_loss": -28.317712783813477, "global_step": 619875, "epoch": 7468} {"train_loss": -27.86739158630371, "global_step": 619876, "epoch": 7468} {"train_loss": -27.71468162536621, "global_step": 619877, "epoch": 7468} {"train_loss": -28.100549697875977, "global_step": 619878, "epoch": 7468} {"train_loss": -28.246784210205078, "global_step": 619879, "epoch": 7468} {"train_loss": -28.075403213500977, "global_step": 619880, "epoch": 7468} {"train_loss": -28.413236618041992, "global_step": 619881, "epoch": 7468} {"train_loss": -28.237812042236328, "global_step": 619882, "epoch": 7468} {"train_loss": -28.16204261779785, "global_step": 619883, "epoch": 7468} {"train_loss": -28.298734664916992, "global_step": 619884, "epoch": 7468} {"train_loss": -28.131433486938477, "global_step": 619885, "epoch": 7468} {"train_loss": -27.965845108032227, "global_step": 619886, "epoch": 7468} {"train_loss": -27.833740234375, "global_step": 619887, "epoch": 7468} {"train_loss": -28.13970375061035, "global_step": 619888, "epoch": 7468} {"train_loss": -28.178449630737305, "global_step": 619889, "epoch": 7468} {"train_loss": -28.293903350830078, "global_step": 619890, "epoch": 7468} {"train_loss": -28.29224967956543, "global_step": 619891, "epoch": 7468} {"train_loss": -28.32013511657715, "global_step": 619892, "epoch": 7468} {"train_loss": -28.16213035583496, "global_step": 619893, "epoch": 7468} {"train_loss": -28.64121437072754, "global_step": 619894, "epoch": 7468} {"train_loss": -28.57470703125, "global_step": 619895, "epoch": 7468} {"train_loss": -28.389877319335938, "global_step": 619896, "epoch": 7468} {"train_loss": -28.270681381225586, "global_step": 619897, "epoch": 7468} {"train_loss": -28.2830810546875, "global_step": 619898, "epoch": 7468} {"train_loss": -28.47414207458496, "global_step": 619899, "epoch": 7468} {"train_loss": -28.2233943939209, "global_step": 619900, "epoch": 7468} {"train_loss": -28.327865600585938, "global_step": 619901, "epoch": 7468} {"train_loss": -28.58588981628418, "global_step": 619902, "epoch": 7468} {"train_loss": -27.843902587890625, "global_step": 619903, "epoch": 7468} {"train_loss": -27.385900497436523, "global_step": 619904, "epoch": 7468} {"train_loss": -26.245203018188477, "global_step": 619905, "epoch": 7468} {"train_loss": -24.953628540039062, "global_step": 619906, "epoch": 7468} {"train_loss": -25.906484603881836, "global_step": 619907, "epoch": 7468} {"train_loss": -27.816486358642578, "global_step": 619908, "epoch": 7468} {"train_loss": -27.5880184173584, "global_step": 619909, "epoch": 7468} {"train_loss": -27.550195693969727, "global_step": 619910, "epoch": 7468} {"train_loss": -27.83157730102539, "global_step": 619911, "epoch": 7468} {"train_loss": -27.747766494750977, "global_step": 619912, "epoch": 7468} {"train_loss": -27.805566787719727, "global_step": 619913, "epoch": 7468} {"train_loss": -27.841989517211914, "global_step": 619914, "epoch": 7468} {"train_loss": -27.775470733642578, "global_step": 619915, "epoch": 7468} {"train_loss": -27.81207275390625, "global_step": 619916, "epoch": 7468} {"train_loss": -27.968982696533203, "global_step": 619917, "epoch": 7468} {"train_loss": -27.83941078186035, "global_step": 619918, "epoch": 7468} {"train_loss": -28.359237670898438, "global_step": 619919, "epoch": 7468} {"train_loss": -27.95216941833496, "global_step": 619920, "epoch": 7468} {"train_loss": -27.822778701782227, "global_step": 619921, "epoch": 7468} {"train_loss": -28.189172744750977, "global_step": 619922, "epoch": 7468} {"train_loss": -27.498926162719727, "global_step": 619923, "epoch": 7468} {"train_loss": -27.60125732421875, "global_step": 619924, "epoch": 7468} {"train_loss": -28.073841094970703, "global_step": 619925, "epoch": 7468} {"train_loss": -27.865090450608587, "global_step": 619926, "epoch": 7468, "val_loss": 6660780.0} {"train_loss": -27.222375869750977, "global_step": 619927, "epoch": 7469} {"train_loss": -27.169830322265625, "global_step": 619928, "epoch": 7469} {"train_loss": -27.780609130859375, "global_step": 619929, "epoch": 7469} {"train_loss": -27.444080352783203, "global_step": 619930, "epoch": 7469} {"train_loss": -27.909643173217773, "global_step": 619931, "epoch": 7469} {"train_loss": -27.486425399780273, "global_step": 619932, "epoch": 7469} {"train_loss": -27.9758358001709, "global_step": 619933, "epoch": 7469} {"train_loss": -27.703882217407227, "global_step": 619934, "epoch": 7469} {"train_loss": -27.40633201599121, "global_step": 619935, "epoch": 7469} {"train_loss": -27.5535831451416, "global_step": 619936, "epoch": 7469} {"train_loss": -27.820783615112305, "global_step": 619937, "epoch": 7469} {"train_loss": -27.859521865844727, "global_step": 619938, "epoch": 7469} {"train_loss": -28.029417037963867, "global_step": 619939, "epoch": 7469} {"train_loss": -28.159399032592773, "global_step": 619940, "epoch": 7469} {"train_loss": -28.118637084960938, "global_step": 619941, "epoch": 7469} {"train_loss": -28.109495162963867, "global_step": 619942, "epoch": 7469} {"train_loss": -28.072357177734375, "global_step": 619943, "epoch": 7469} {"train_loss": -27.98566246032715, "global_step": 619944, "epoch": 7469} {"train_loss": -28.255298614501953, "global_step": 619945, "epoch": 7469} {"train_loss": -27.979419708251953, "global_step": 619946, "epoch": 7469} {"train_loss": -28.04054069519043, "global_step": 619947, "epoch": 7469} {"train_loss": -27.765213012695312, "global_step": 619948, "epoch": 7469} {"train_loss": -28.098281860351562, "global_step": 619949, "epoch": 7469} {"train_loss": -28.122364044189453, "global_step": 619950, "epoch": 7469} {"train_loss": -28.544214248657227, "global_step": 619951, "epoch": 7469} {"train_loss": -28.277210235595703, "global_step": 619952, "epoch": 7469} {"train_loss": -28.44046401977539, "global_step": 619953, "epoch": 7469} {"train_loss": -28.220855712890625, "global_step": 619954, "epoch": 7469} {"train_loss": -28.64771842956543, "global_step": 619955, "epoch": 7469} {"train_loss": -28.321670532226562, "global_step": 619956, "epoch": 7469} {"train_loss": -28.507369995117188, "global_step": 619957, "epoch": 7469} {"train_loss": -28.070941925048828, "global_step": 619958, "epoch": 7469} {"train_loss": -28.08489990234375, "global_step": 619959, "epoch": 7469} {"train_loss": -28.42146110534668, "global_step": 619960, "epoch": 7469} {"train_loss": -28.18463134765625, "global_step": 619961, "epoch": 7469} {"train_loss": -28.185958862304688, "global_step": 619962, "epoch": 7469} {"train_loss": -28.120716094970703, "global_step": 619963, "epoch": 7469} {"train_loss": -28.376239776611328, "global_step": 619964, "epoch": 7469} {"train_loss": -28.25819969177246, "global_step": 619965, "epoch": 7469} {"train_loss": -27.92762565612793, "global_step": 619966, "epoch": 7469} {"train_loss": -28.084325790405273, "global_step": 619967, "epoch": 7469} {"train_loss": -28.29388999938965, "global_step": 619968, "epoch": 7469} {"train_loss": -28.497602462768555, "global_step": 619969, "epoch": 7469} {"train_loss": -28.203275680541992, "global_step": 619970, "epoch": 7469} {"train_loss": -28.49977684020996, "global_step": 619971, "epoch": 7469} {"train_loss": -28.517831802368164, "global_step": 619972, "epoch": 7469} {"train_loss": -28.389041900634766, "global_step": 619973, "epoch": 7469} {"train_loss": -28.418970108032227, "global_step": 619974, "epoch": 7469} {"train_loss": -28.070158004760742, "global_step": 619975, "epoch": 7469} {"train_loss": -28.2050838470459, "global_step": 619976, "epoch": 7469} {"train_loss": -28.022964477539062, "global_step": 619977, "epoch": 7469} {"train_loss": -28.041336059570312, "global_step": 619978, "epoch": 7469} {"train_loss": -28.1641845703125, "global_step": 619979, "epoch": 7469} {"train_loss": -28.23048210144043, "global_step": 619980, "epoch": 7469} {"train_loss": -28.214496612548828, "global_step": 619981, "epoch": 7469} {"train_loss": -28.141159057617188, "global_step": 619982, "epoch": 7469} {"train_loss": -28.178964614868164, "global_step": 619983, "epoch": 7469} {"train_loss": -28.2386417388916, "global_step": 619984, "epoch": 7469} {"train_loss": -28.2194881439209, "global_step": 619985, "epoch": 7469} {"train_loss": -28.42592430114746, "global_step": 619986, "epoch": 7469} {"train_loss": -27.791311264038086, "global_step": 619987, "epoch": 7469} {"train_loss": -28.120132446289062, "global_step": 619988, "epoch": 7469} {"train_loss": -28.308286666870117, "global_step": 619989, "epoch": 7469} {"train_loss": -28.249902725219727, "global_step": 619990, "epoch": 7469} {"train_loss": -28.153045654296875, "global_step": 619991, "epoch": 7469} {"train_loss": -27.984027862548828, "global_step": 619992, "epoch": 7469} {"train_loss": -28.075788497924805, "global_step": 619993, "epoch": 7469} {"train_loss": -28.167327880859375, "global_step": 619994, "epoch": 7469} {"train_loss": -28.316162109375, "global_step": 619995, "epoch": 7469} {"train_loss": -28.517358779907227, "global_step": 619996, "epoch": 7469} {"train_loss": -28.3493709564209, "global_step": 619997, "epoch": 7469} {"train_loss": -28.309213638305664, "global_step": 619998, "epoch": 7469} {"train_loss": -28.152692794799805, "global_step": 619999, "epoch": 7469} {"train_loss": -28.219289779663086, "global_step": 620000, "epoch": 7469} {"train_loss": -28.445837020874023, "global_step": 620001, "epoch": 7469} {"train_loss": -28.525653839111328, "global_step": 620002, "epoch": 7469} {"train_loss": -28.05137062072754, "global_step": 620003, "epoch": 7469} {"train_loss": -28.228870391845703, "global_step": 620004, "epoch": 7469} {"train_loss": -28.35172462463379, "global_step": 620005, "epoch": 7469} {"train_loss": -28.464319229125977, "global_step": 620006, "epoch": 7469} {"train_loss": -28.482330322265625, "global_step": 620007, "epoch": 7469} {"train_loss": -28.4597225189209, "global_step": 620008, "epoch": 7469} {"train_loss": -28.130219516983953, "global_step": 620009, "epoch": 7469, "val_loss": 6623516.0} {"train_loss": -28.20551872253418, "global_step": 620010, "epoch": 7470} {"train_loss": -27.541961669921875, "global_step": 620011, "epoch": 7470} {"train_loss": -26.220041275024414, "global_step": 620012, "epoch": 7470} {"train_loss": -26.572309494018555, "global_step": 620013, "epoch": 7470} {"train_loss": -27.415891647338867, "global_step": 620014, "epoch": 7470} {"train_loss": -27.285221099853516, "global_step": 620015, "epoch": 7470} {"train_loss": -27.551578521728516, "global_step": 620016, "epoch": 7470} {"train_loss": -27.429197311401367, "global_step": 620017, "epoch": 7470} {"train_loss": -27.486499786376953, "global_step": 620018, "epoch": 7470} {"train_loss": -27.352506637573242, "global_step": 620019, "epoch": 7470} {"train_loss": -27.8602237701416, "global_step": 620020, "epoch": 7470} {"train_loss": -27.347265243530273, "global_step": 620021, "epoch": 7470} {"train_loss": -27.976415634155273, "global_step": 620022, "epoch": 7470} {"train_loss": -27.499454498291016, "global_step": 620023, "epoch": 7470} {"train_loss": -27.790679931640625, "global_step": 620024, "epoch": 7470} {"train_loss": -27.910663604736328, "global_step": 620025, "epoch": 7470} {"train_loss": -27.742170333862305, "global_step": 620026, "epoch": 7470} {"train_loss": -27.703088760375977, "global_step": 620027, "epoch": 7470} {"train_loss": -27.993885040283203, "global_step": 620028, "epoch": 7470} {"train_loss": -27.765918731689453, "global_step": 620029, "epoch": 7470} {"train_loss": -28.0229434967041, "global_step": 620030, "epoch": 7470} {"train_loss": -28.085412979125977, "global_step": 620031, "epoch": 7470} {"train_loss": -27.75592041015625, "global_step": 620032, "epoch": 7470} {"train_loss": -27.972318649291992, "global_step": 620033, "epoch": 7470} {"train_loss": -27.709096908569336, "global_step": 620034, "epoch": 7470} {"train_loss": -27.867084503173828, "global_step": 620035, "epoch": 7470} {"train_loss": -28.090280532836914, "global_step": 620036, "epoch": 7470} {"train_loss": -27.759817123413086, "global_step": 620037, "epoch": 7470} {"train_loss": -27.98750877380371, "global_step": 620038, "epoch": 7470} {"train_loss": -28.266443252563477, "global_step": 620039, "epoch": 7470} {"train_loss": -28.246021270751953, "global_step": 620040, "epoch": 7470} {"train_loss": -28.25840187072754, "global_step": 620041, "epoch": 7470} {"train_loss": -28.223791122436523, "global_step": 620042, "epoch": 7470} {"train_loss": -28.044952392578125, "global_step": 620043, "epoch": 7470} {"train_loss": -28.12548828125, "global_step": 620044, "epoch": 7470} {"train_loss": -28.399555206298828, "global_step": 620045, "epoch": 7470} {"train_loss": -28.00624656677246, "global_step": 620046, "epoch": 7470} {"train_loss": -28.0411376953125, "global_step": 620047, "epoch": 7470} {"train_loss": -28.351959228515625, "global_step": 620048, "epoch": 7470} {"train_loss": -28.39820671081543, "global_step": 620049, "epoch": 7470} {"train_loss": -28.226306915283203, "global_step": 620050, "epoch": 7470} {"train_loss": -28.0203857421875, "global_step": 620051, "epoch": 7470} {"train_loss": -28.16823387145996, "global_step": 620052, "epoch": 7470} {"train_loss": -28.494775772094727, "global_step": 620053, "epoch": 7470} {"train_loss": -28.302661895751953, "global_step": 620054, "epoch": 7470} {"train_loss": -27.882038116455078, "global_step": 620055, "epoch": 7470} {"train_loss": -28.228809356689453, "global_step": 620056, "epoch": 7470} {"train_loss": -28.13067626953125, "global_step": 620057, "epoch": 7470} {"train_loss": -28.386404037475586, "global_step": 620058, "epoch": 7470} {"train_loss": -28.242292404174805, "global_step": 620059, "epoch": 7470} {"train_loss": -28.634876251220703, "global_step": 620060, "epoch": 7470} {"train_loss": -28.243024826049805, "global_step": 620061, "epoch": 7470} {"train_loss": -28.03059959411621, "global_step": 620062, "epoch": 7470} {"train_loss": -28.2721004486084, "global_step": 620063, "epoch": 7470} {"train_loss": -28.1541748046875, "global_step": 620064, "epoch": 7470} {"train_loss": -27.928964614868164, "global_step": 620065, "epoch": 7470} {"train_loss": -27.68826675415039, "global_step": 620066, "epoch": 7470} {"train_loss": -28.23890495300293, "global_step": 620067, "epoch": 7470} {"train_loss": -28.433996200561523, "global_step": 620068, "epoch": 7470} {"train_loss": -27.95834732055664, "global_step": 620069, "epoch": 7470} {"train_loss": -28.11275291442871, "global_step": 620070, "epoch": 7470} {"train_loss": -28.181671142578125, "global_step": 620071, "epoch": 7470} {"train_loss": -28.136831283569336, "global_step": 620072, "epoch": 7470} {"train_loss": -28.420103073120117, "global_step": 620073, "epoch": 7470} {"train_loss": -28.126455307006836, "global_step": 620074, "epoch": 7470} {"train_loss": -28.250288009643555, "global_step": 620075, "epoch": 7470} {"train_loss": -28.210697174072266, "global_step": 620076, "epoch": 7470} {"train_loss": -28.161041259765625, "global_step": 620077, "epoch": 7470} {"train_loss": -28.25266456604004, "global_step": 620078, "epoch": 7470} {"train_loss": -27.9447078704834, "global_step": 620079, "epoch": 7470} {"train_loss": -28.329803466796875, "global_step": 620080, "epoch": 7470} {"train_loss": -28.017419815063477, "global_step": 620081, "epoch": 7470} {"train_loss": -28.351648330688477, "global_step": 620082, "epoch": 7470} {"train_loss": -28.3262939453125, "global_step": 620083, "epoch": 7470} {"train_loss": -28.07503318786621, "global_step": 620084, "epoch": 7470} {"train_loss": -27.705841064453125, "global_step": 620085, "epoch": 7470} {"train_loss": -28.06343650817871, "global_step": 620086, "epoch": 7470} {"train_loss": -28.300405502319336, "global_step": 620087, "epoch": 7470} {"train_loss": -28.0009822845459, "global_step": 620088, "epoch": 7470} {"train_loss": -28.28143310546875, "global_step": 620089, "epoch": 7470} {"train_loss": -28.225860595703125, "global_step": 620090, "epoch": 7470} {"train_loss": -27.563196182250977, "global_step": 620091, "epoch": 7470} {"train_loss": -28.01353399437594, "global_step": 620092, "epoch": 7470, "val_loss": 6590373.0} {"train_loss": -27.532073974609375, "global_step": 620093, "epoch": 7471} {"train_loss": -27.632598876953125, "global_step": 620094, "epoch": 7471} {"train_loss": -26.79571533203125, "global_step": 620095, "epoch": 7471} {"train_loss": -27.700788497924805, "global_step": 620096, "epoch": 7471} {"train_loss": -26.881330490112305, "global_step": 620097, "epoch": 7471} {"train_loss": -27.581085205078125, "global_step": 620098, "epoch": 7471} {"train_loss": -27.53293800354004, "global_step": 620099, "epoch": 7471} {"train_loss": -27.874210357666016, "global_step": 620100, "epoch": 7471} {"train_loss": -27.687713623046875, "global_step": 620101, "epoch": 7471} {"train_loss": -27.45650291442871, "global_step": 620102, "epoch": 7471} {"train_loss": -28.21320152282715, "global_step": 620103, "epoch": 7471} {"train_loss": -27.6916446685791, "global_step": 620104, "epoch": 7471} {"train_loss": -27.84260368347168, "global_step": 620105, "epoch": 7471} {"train_loss": -27.20701026916504, "global_step": 620106, "epoch": 7471} {"train_loss": -27.948495864868164, "global_step": 620107, "epoch": 7471} {"train_loss": -27.939178466796875, "global_step": 620108, "epoch": 7471} {"train_loss": -28.0395450592041, "global_step": 620109, "epoch": 7471} {"train_loss": -27.975753784179688, "global_step": 620110, "epoch": 7471} {"train_loss": -27.990915298461914, "global_step": 620111, "epoch": 7471} {"train_loss": -28.109100341796875, "global_step": 620112, "epoch": 7471} {"train_loss": -27.5483455657959, "global_step": 620113, "epoch": 7471} {"train_loss": -28.05470085144043, "global_step": 620114, "epoch": 7471} {"train_loss": -27.450815200805664, "global_step": 620115, "epoch": 7471} {"train_loss": -28.463232040405273, "global_step": 620116, "epoch": 7471} {"train_loss": -27.862689971923828, "global_step": 620117, "epoch": 7471} {"train_loss": -28.25813102722168, "global_step": 620118, "epoch": 7471} {"train_loss": -28.157541275024414, "global_step": 620119, "epoch": 7471} {"train_loss": -27.794981002807617, "global_step": 620120, "epoch": 7471} {"train_loss": -28.365863800048828, "global_step": 620121, "epoch": 7471} {"train_loss": -27.813962936401367, "global_step": 620122, "epoch": 7471} {"train_loss": -28.28143882751465, "global_step": 620123, "epoch": 7471} {"train_loss": -27.999927520751953, "global_step": 620124, "epoch": 7471} {"train_loss": -28.10662269592285, "global_step": 620125, "epoch": 7471} {"train_loss": -28.230117797851562, "global_step": 620126, "epoch": 7471} {"train_loss": -27.939193725585938, "global_step": 620127, "epoch": 7471} {"train_loss": -28.097705841064453, "global_step": 620128, "epoch": 7471} {"train_loss": -28.256711959838867, "global_step": 620129, "epoch": 7471} {"train_loss": -27.88832664489746, "global_step": 620130, "epoch": 7471} {"train_loss": -28.349279403686523, "global_step": 620131, "epoch": 7471} {"train_loss": -28.508289337158203, "global_step": 620132, "epoch": 7471} {"train_loss": -28.49871826171875, "global_step": 620133, "epoch": 7471} {"train_loss": -28.080078125, "global_step": 620134, "epoch": 7471} {"train_loss": -27.9998836517334, "global_step": 620135, "epoch": 7471} {"train_loss": -28.25826072692871, "global_step": 620136, "epoch": 7471} {"train_loss": -28.35818862915039, "global_step": 620137, "epoch": 7471} {"train_loss": -28.002765655517578, "global_step": 620138, "epoch": 7471} {"train_loss": -27.96919822692871, "global_step": 620139, "epoch": 7471} {"train_loss": -28.166706085205078, "global_step": 620140, "epoch": 7471} {"train_loss": -28.266454696655273, "global_step": 620141, "epoch": 7471} {"train_loss": -28.339832305908203, "global_step": 620142, "epoch": 7471} {"train_loss": -27.92597007751465, "global_step": 620143, "epoch": 7471} {"train_loss": -28.510889053344727, "global_step": 620144, "epoch": 7471} {"train_loss": -28.5318546295166, "global_step": 620145, "epoch": 7471} {"train_loss": -28.35746192932129, "global_step": 620146, "epoch": 7471} {"train_loss": -28.776351928710938, "global_step": 620147, "epoch": 7471} {"train_loss": -28.282611846923828, "global_step": 620148, "epoch": 7471} {"train_loss": -28.529834747314453, "global_step": 620149, "epoch": 7471} {"train_loss": -28.63273048400879, "global_step": 620150, "epoch": 7471} {"train_loss": -28.31795310974121, "global_step": 620151, "epoch": 7471} {"train_loss": -28.545059204101562, "global_step": 620152, "epoch": 7471} {"train_loss": -28.300800323486328, "global_step": 620153, "epoch": 7471} {"train_loss": -28.1392879486084, "global_step": 620154, "epoch": 7471} {"train_loss": -27.689685821533203, "global_step": 620155, "epoch": 7471} {"train_loss": -28.060108184814453, "global_step": 620156, "epoch": 7471} {"train_loss": -28.939361572265625, "global_step": 620157, "epoch": 7471} {"train_loss": -28.03277587890625, "global_step": 620158, "epoch": 7471} {"train_loss": -27.58452796936035, "global_step": 620159, "epoch": 7471} {"train_loss": -27.329004287719727, "global_step": 620160, "epoch": 7471} {"train_loss": -27.249929428100586, "global_step": 620161, "epoch": 7471} {"train_loss": -26.949670791625977, "global_step": 620162, "epoch": 7471} {"train_loss": -27.251615524291992, "global_step": 620163, "epoch": 7471} {"train_loss": -27.449689865112305, "global_step": 620164, "epoch": 7471} {"train_loss": -27.97702407836914, "global_step": 620165, "epoch": 7471} {"train_loss": -27.640216827392578, "global_step": 620166, "epoch": 7471} {"train_loss": -27.462385177612305, "global_step": 620167, "epoch": 7471} {"train_loss": -27.548831939697266, "global_step": 620168, "epoch": 7471} {"train_loss": -27.564218521118164, "global_step": 620169, "epoch": 7471} {"train_loss": -27.67927360534668, "global_step": 620170, "epoch": 7471} {"train_loss": -27.927719116210938, "global_step": 620171, "epoch": 7471} {"train_loss": -27.87129020690918, "global_step": 620172, "epoch": 7471} {"train_loss": -27.755420684814453, "global_step": 620173, "epoch": 7471} {"train_loss": -27.503040313720703, "global_step": 620174, "epoch": 7471} {"train_loss": -27.939331813030932, "global_step": 620175, "epoch": 7471, "val_loss": 6628739.0} {"train_loss": -27.861860275268555, "global_step": 620176, "epoch": 7472} {"train_loss": -27.270553588867188, "global_step": 620177, "epoch": 7472} {"train_loss": -27.060745239257812, "global_step": 620178, "epoch": 7472} {"train_loss": -27.2984619140625, "global_step": 620179, "epoch": 7472} {"train_loss": -27.41461753845215, "global_step": 620180, "epoch": 7472} {"train_loss": -27.26410484313965, "global_step": 620181, "epoch": 7472} {"train_loss": -27.483951568603516, "global_step": 620182, "epoch": 7472} {"train_loss": -27.5590763092041, "global_step": 620183, "epoch": 7472} {"train_loss": -27.5950984954834, "global_step": 620184, "epoch": 7472} {"train_loss": -27.9016170501709, "global_step": 620185, "epoch": 7472} {"train_loss": -27.69775390625, "global_step": 620186, "epoch": 7472} {"train_loss": -27.7092342376709, "global_step": 620187, "epoch": 7472} {"train_loss": -27.466535568237305, "global_step": 620188, "epoch": 7472} {"train_loss": -27.302881240844727, "global_step": 620189, "epoch": 7472} {"train_loss": -27.74781608581543, "global_step": 620190, "epoch": 7472} {"train_loss": -27.702972412109375, "global_step": 620191, "epoch": 7472} {"train_loss": -27.962142944335938, "global_step": 620192, "epoch": 7472} {"train_loss": -28.136676788330078, "global_step": 620193, "epoch": 7472} {"train_loss": -27.702957153320312, "global_step": 620194, "epoch": 7472} {"train_loss": -27.939041137695312, "global_step": 620195, "epoch": 7472} {"train_loss": -27.703550338745117, "global_step": 620196, "epoch": 7472} {"train_loss": -28.19622802734375, "global_step": 620197, "epoch": 7472} {"train_loss": -27.743371963500977, "global_step": 620198, "epoch": 7472} {"train_loss": -27.915882110595703, "global_step": 620199, "epoch": 7472} {"train_loss": -28.259504318237305, "global_step": 620200, "epoch": 7472} {"train_loss": -28.160186767578125, "global_step": 620201, "epoch": 7472} {"train_loss": -27.889638900756836, "global_step": 620202, "epoch": 7472} {"train_loss": -28.069473266601562, "global_step": 620203, "epoch": 7472} {"train_loss": -28.339033126831055, "global_step": 620204, "epoch": 7472} {"train_loss": -28.63164710998535, "global_step": 620205, "epoch": 7472} {"train_loss": -28.198928833007812, "global_step": 620206, "epoch": 7472} {"train_loss": -28.458471298217773, "global_step": 620207, "epoch": 7472} {"train_loss": -28.280292510986328, "global_step": 620208, "epoch": 7472} {"train_loss": -28.550168991088867, "global_step": 620209, "epoch": 7472} {"train_loss": -28.533384323120117, "global_step": 620210, "epoch": 7472} {"train_loss": -28.637006759643555, "global_step": 620211, "epoch": 7472} {"train_loss": -28.429462432861328, "global_step": 620212, "epoch": 7472} {"train_loss": -28.281354904174805, "global_step": 620213, "epoch": 7472} {"train_loss": -28.01291847229004, "global_step": 620214, "epoch": 7472} {"train_loss": -28.214481353759766, "global_step": 620215, "epoch": 7472} {"train_loss": -28.476327896118164, "global_step": 620216, "epoch": 7472} {"train_loss": -28.092422485351562, "global_step": 620217, "epoch": 7472} {"train_loss": -28.181264877319336, "global_step": 620218, "epoch": 7472} {"train_loss": -28.402816772460938, "global_step": 620219, "epoch": 7472} {"train_loss": -28.1694278717041, "global_step": 620220, "epoch": 7472} {"train_loss": -28.030231475830078, "global_step": 620221, "epoch": 7472} {"train_loss": -27.589719772338867, "global_step": 620222, "epoch": 7472} {"train_loss": -28.34242057800293, "global_step": 620223, "epoch": 7472} {"train_loss": -28.1946964263916, "global_step": 620224, "epoch": 7472} {"train_loss": -28.358917236328125, "global_step": 620225, "epoch": 7472} {"train_loss": -28.460180282592773, "global_step": 620226, "epoch": 7472} {"train_loss": -28.575733184814453, "global_step": 620227, "epoch": 7472} {"train_loss": -28.3044490814209, "global_step": 620228, "epoch": 7472} {"train_loss": -27.910083770751953, "global_step": 620229, "epoch": 7472} {"train_loss": -28.016529083251953, "global_step": 620230, "epoch": 7472} {"train_loss": -28.3084659576416, "global_step": 620231, "epoch": 7472} {"train_loss": -28.025806427001953, "global_step": 620232, "epoch": 7472} {"train_loss": -28.345285415649414, "global_step": 620233, "epoch": 7472} {"train_loss": -28.247034072875977, "global_step": 620234, "epoch": 7472} {"train_loss": -27.61444091796875, "global_step": 620235, "epoch": 7472} {"train_loss": -27.33426856994629, "global_step": 620236, "epoch": 7472} {"train_loss": -25.8241024017334, "global_step": 620237, "epoch": 7472} {"train_loss": -25.422510147094727, "global_step": 620238, "epoch": 7472} {"train_loss": -26.176227569580078, "global_step": 620239, "epoch": 7472} {"train_loss": -27.005292892456055, "global_step": 620240, "epoch": 7472} {"train_loss": -26.81336784362793, "global_step": 620241, "epoch": 7472} {"train_loss": -27.487293243408203, "global_step": 620242, "epoch": 7472} {"train_loss": -27.774250030517578, "global_step": 620243, "epoch": 7472} {"train_loss": -27.66912269592285, "global_step": 620244, "epoch": 7472} {"train_loss": -27.963668823242188, "global_step": 620245, "epoch": 7472} {"train_loss": -27.456979751586914, "global_step": 620246, "epoch": 7472} {"train_loss": -27.74942398071289, "global_step": 620247, "epoch": 7472} {"train_loss": -27.688623428344727, "global_step": 620248, "epoch": 7472} {"train_loss": -27.426010131835938, "global_step": 620249, "epoch": 7472} {"train_loss": -28.041889190673828, "global_step": 620250, "epoch": 7472} {"train_loss": -28.167667388916016, "global_step": 620251, "epoch": 7472} {"train_loss": -27.417593002319336, "global_step": 620252, "epoch": 7472} {"train_loss": -27.492145538330078, "global_step": 620253, "epoch": 7472} {"train_loss": -27.73247718811035, "global_step": 620254, "epoch": 7472} {"train_loss": -27.65567398071289, "global_step": 620255, "epoch": 7472} {"train_loss": -27.6086368560791, "global_step": 620256, "epoch": 7472} {"train_loss": -27.48048210144043, "global_step": 620257, "epoch": 7472} {"train_loss": -27.820580516953065, "global_step": 620258, "epoch": 7472, "val_loss": 6654473.0} {"train_loss": -27.49601173400879, "global_step": 620259, "epoch": 7473} {"train_loss": -27.170154571533203, "global_step": 620260, "epoch": 7473} {"train_loss": -27.736831665039062, "global_step": 620261, "epoch": 7473} {"train_loss": -26.98188591003418, "global_step": 620262, "epoch": 7473} {"train_loss": -27.211029052734375, "global_step": 620263, "epoch": 7473} {"train_loss": -26.903491973876953, "global_step": 620264, "epoch": 7473} {"train_loss": -27.148202896118164, "global_step": 620265, "epoch": 7473} {"train_loss": -27.34681510925293, "global_step": 620266, "epoch": 7473} {"train_loss": -27.231237411499023, "global_step": 620267, "epoch": 7473} {"train_loss": -27.49433708190918, "global_step": 620268, "epoch": 7473} {"train_loss": -27.21828269958496, "global_step": 620269, "epoch": 7473} {"train_loss": -27.556028366088867, "global_step": 620270, "epoch": 7473} {"train_loss": -27.567075729370117, "global_step": 620271, "epoch": 7473} {"train_loss": -27.580780029296875, "global_step": 620272, "epoch": 7473} {"train_loss": -27.4184513092041, "global_step": 620273, "epoch": 7473} {"train_loss": -27.314239501953125, "global_step": 620274, "epoch": 7473} {"train_loss": -27.39388084411621, "global_step": 620275, "epoch": 7473} {"train_loss": -27.41583824157715, "global_step": 620276, "epoch": 7473} {"train_loss": -27.7652587890625, "global_step": 620277, "epoch": 7473} {"train_loss": -27.832477569580078, "global_step": 620278, "epoch": 7473} {"train_loss": -27.703083038330078, "global_step": 620279, "epoch": 7473} {"train_loss": -27.960845947265625, "global_step": 620280, "epoch": 7473} {"train_loss": -27.493824005126953, "global_step": 620281, "epoch": 7473} {"train_loss": -27.939115524291992, "global_step": 620282, "epoch": 7473} {"train_loss": -27.94650650024414, "global_step": 620283, "epoch": 7473} {"train_loss": -28.012365341186523, "global_step": 620284, "epoch": 7473} {"train_loss": -28.020437240600586, "global_step": 620285, "epoch": 7473} {"train_loss": -28.045454025268555, "global_step": 620286, "epoch": 7473} {"train_loss": -28.11799430847168, "global_step": 620287, "epoch": 7473} {"train_loss": -28.30726432800293, "global_step": 620288, "epoch": 7473} {"train_loss": -28.326948165893555, "global_step": 620289, "epoch": 7473} {"train_loss": -27.990991592407227, "global_step": 620290, "epoch": 7473} {"train_loss": -28.248254776000977, "global_step": 620291, "epoch": 7473} {"train_loss": -27.904138565063477, "global_step": 620292, "epoch": 7473} {"train_loss": -28.02853775024414, "global_step": 620293, "epoch": 7473} {"train_loss": -28.116491317749023, "global_step": 620294, "epoch": 7473} {"train_loss": -28.2338809967041, "global_step": 620295, "epoch": 7473} {"train_loss": -28.358373641967773, "global_step": 620296, "epoch": 7473} {"train_loss": -28.36008644104004, "global_step": 620297, "epoch": 7473} {"train_loss": -27.896793365478516, "global_step": 620298, "epoch": 7473} {"train_loss": -28.470443725585938, "global_step": 620299, "epoch": 7473} {"train_loss": -28.212182998657227, "global_step": 620300, "epoch": 7473} {"train_loss": -28.29510498046875, "global_step": 620301, "epoch": 7473} {"train_loss": -28.46282958984375, "global_step": 620302, "epoch": 7473} {"train_loss": -28.364505767822266, "global_step": 620303, "epoch": 7473} {"train_loss": -27.921911239624023, "global_step": 620304, "epoch": 7473} {"train_loss": -28.26972770690918, "global_step": 620305, "epoch": 7473} {"train_loss": -28.583267211914062, "global_step": 620306, "epoch": 7473} {"train_loss": -28.27106285095215, "global_step": 620307, "epoch": 7473} {"train_loss": -28.355443954467773, "global_step": 620308, "epoch": 7473} {"train_loss": -28.028095245361328, "global_step": 620309, "epoch": 7473} {"train_loss": -28.476072311401367, "global_step": 620310, "epoch": 7473} {"train_loss": -28.059057235717773, "global_step": 620311, "epoch": 7473} {"train_loss": -28.081125259399414, "global_step": 620312, "epoch": 7473} {"train_loss": -28.45833396911621, "global_step": 620313, "epoch": 7473} {"train_loss": -28.3148193359375, "global_step": 620314, "epoch": 7473} {"train_loss": -28.505756378173828, "global_step": 620315, "epoch": 7473} {"train_loss": -28.447412490844727, "global_step": 620316, "epoch": 7473} {"train_loss": -28.3171443939209, "global_step": 620317, "epoch": 7473} {"train_loss": -28.026660919189453, "global_step": 620318, "epoch": 7473} {"train_loss": -27.87387466430664, "global_step": 620319, "epoch": 7473} {"train_loss": -28.272146224975586, "global_step": 620320, "epoch": 7473} {"train_loss": -28.44110107421875, "global_step": 620321, "epoch": 7473} {"train_loss": -28.191625595092773, "global_step": 620322, "epoch": 7473} {"train_loss": -28.13605308532715, "global_step": 620323, "epoch": 7473} {"train_loss": -28.263044357299805, "global_step": 620324, "epoch": 7473} {"train_loss": -28.211774826049805, "global_step": 620325, "epoch": 7473} {"train_loss": -28.511716842651367, "global_step": 620326, "epoch": 7473} {"train_loss": -28.54288673400879, "global_step": 620327, "epoch": 7473} {"train_loss": -28.2116641998291, "global_step": 620328, "epoch": 7473} {"train_loss": -27.983963012695312, "global_step": 620329, "epoch": 7473} {"train_loss": -28.212018966674805, "global_step": 620330, "epoch": 7473} {"train_loss": -27.852935791015625, "global_step": 620331, "epoch": 7473} {"train_loss": -28.247541427612305, "global_step": 620332, "epoch": 7473} {"train_loss": -27.925800323486328, "global_step": 620333, "epoch": 7473} {"train_loss": -27.65203857421875, "global_step": 620334, "epoch": 7473} {"train_loss": -27.88820457458496, "global_step": 620335, "epoch": 7473} {"train_loss": -28.154617309570312, "global_step": 620336, "epoch": 7473} {"train_loss": -28.00086784362793, "global_step": 620337, "epoch": 7473} {"train_loss": -27.346887588500977, "global_step": 620338, "epoch": 7473} {"train_loss": -27.866601943969727, "global_step": 620339, "epoch": 7473} {"train_loss": -27.905344009399414, "global_step": 620340, "epoch": 7473} {"train_loss": -27.95640090574701, "global_step": 620341, "epoch": 7473, "val_loss": 6613422.0} {"train_loss": -26.779911041259766, "global_step": 620342, "epoch": 7474} {"train_loss": -26.173603057861328, "global_step": 620343, "epoch": 7474} {"train_loss": -27.33469581604004, "global_step": 620344, "epoch": 7474} {"train_loss": -27.13459587097168, "global_step": 620345, "epoch": 7474} {"train_loss": -27.0156307220459, "global_step": 620346, "epoch": 7474} {"train_loss": -27.31532096862793, "global_step": 620347, "epoch": 7474} {"train_loss": -26.936420440673828, "global_step": 620348, "epoch": 7474} {"train_loss": -26.0750675201416, "global_step": 620349, "epoch": 7474} {"train_loss": -26.77473258972168, "global_step": 620350, "epoch": 7474} {"train_loss": -27.352893829345703, "global_step": 620351, "epoch": 7474} {"train_loss": -27.419309616088867, "global_step": 620352, "epoch": 7474} {"train_loss": -27.0428524017334, "global_step": 620353, "epoch": 7474} {"train_loss": -27.619043350219727, "global_step": 620354, "epoch": 7474} {"train_loss": -26.936233520507812, "global_step": 620355, "epoch": 7474} {"train_loss": -27.37116813659668, "global_step": 620356, "epoch": 7474} {"train_loss": -27.17167091369629, "global_step": 620357, "epoch": 7474} {"train_loss": -27.06494140625, "global_step": 620358, "epoch": 7474} {"train_loss": -27.251270294189453, "global_step": 620359, "epoch": 7474} {"train_loss": -27.299915313720703, "global_step": 620360, "epoch": 7474} {"train_loss": -27.593252182006836, "global_step": 620361, "epoch": 7474} {"train_loss": -27.33945655822754, "global_step": 620362, "epoch": 7474} {"train_loss": -27.53631019592285, "global_step": 620363, "epoch": 7474} {"train_loss": -27.23699951171875, "global_step": 620364, "epoch": 7474} {"train_loss": -27.690814971923828, "global_step": 620365, "epoch": 7474} {"train_loss": -27.493438720703125, "global_step": 620366, "epoch": 7474} {"train_loss": -27.756372451782227, "global_step": 620367, "epoch": 7474} {"train_loss": -27.728931427001953, "global_step": 620368, "epoch": 7474} {"train_loss": -27.8282413482666, "global_step": 620369, "epoch": 7474} {"train_loss": -28.107778549194336, "global_step": 620370, "epoch": 7474} {"train_loss": -28.067157745361328, "global_step": 620371, "epoch": 7474} {"train_loss": -27.716699600219727, "global_step": 620372, "epoch": 7474} {"train_loss": -28.04128074645996, "global_step": 620373, "epoch": 7474} {"train_loss": -27.947036743164062, "global_step": 620374, "epoch": 7474} {"train_loss": -28.071609497070312, "global_step": 620375, "epoch": 7474} {"train_loss": -27.72041130065918, "global_step": 620376, "epoch": 7474} {"train_loss": -27.545730590820312, "global_step": 620377, "epoch": 7474} {"train_loss": -28.322477340698242, "global_step": 620378, "epoch": 7474} {"train_loss": -28.0048885345459, "global_step": 620379, "epoch": 7474} {"train_loss": -28.13142204284668, "global_step": 620380, "epoch": 7474} {"train_loss": -28.301223754882812, "global_step": 620381, "epoch": 7474} {"train_loss": -28.19412612915039, "global_step": 620382, "epoch": 7474} {"train_loss": -27.965864181518555, "global_step": 620383, "epoch": 7474} {"train_loss": -28.41584587097168, "global_step": 620384, "epoch": 7474} {"train_loss": -28.241018295288086, "global_step": 620385, "epoch": 7474} {"train_loss": -28.090927124023438, "global_step": 620386, "epoch": 7474} {"train_loss": -28.147729873657227, "global_step": 620387, "epoch": 7474} {"train_loss": -28.24995231628418, "global_step": 620388, "epoch": 7474} {"train_loss": -28.5306339263916, "global_step": 620389, "epoch": 7474} {"train_loss": -28.285017013549805, "global_step": 620390, "epoch": 7474} {"train_loss": -28.292795181274414, "global_step": 620391, "epoch": 7474} {"train_loss": -28.4002685546875, "global_step": 620392, "epoch": 7474} {"train_loss": -28.29498863220215, "global_step": 620393, "epoch": 7474} {"train_loss": -28.49094581604004, "global_step": 620394, "epoch": 7474} {"train_loss": -28.57073402404785, "global_step": 620395, "epoch": 7474} {"train_loss": -28.40389060974121, "global_step": 620396, "epoch": 7474} {"train_loss": -28.461597442626953, "global_step": 620397, "epoch": 7474} {"train_loss": -28.447406768798828, "global_step": 620398, "epoch": 7474} {"train_loss": -28.520254135131836, "global_step": 620399, "epoch": 7474} {"train_loss": -28.09040641784668, "global_step": 620400, "epoch": 7474} {"train_loss": -28.322961807250977, "global_step": 620401, "epoch": 7474} {"train_loss": -28.070234298706055, "global_step": 620402, "epoch": 7474} {"train_loss": -28.645544052124023, "global_step": 620403, "epoch": 7474} {"train_loss": -28.01865005493164, "global_step": 620404, "epoch": 7474} {"train_loss": -28.34918785095215, "global_step": 620405, "epoch": 7474} {"train_loss": -28.032804489135742, "global_step": 620406, "epoch": 7474} {"train_loss": -28.24555778503418, "global_step": 620407, "epoch": 7474} {"train_loss": -28.540771484375, "global_step": 620408, "epoch": 7474} {"train_loss": -27.944746017456055, "global_step": 620409, "epoch": 7474} {"train_loss": -27.9149112701416, "global_step": 620410, "epoch": 7474} {"train_loss": -28.515249252319336, "global_step": 620411, "epoch": 7474} {"train_loss": -28.66094970703125, "global_step": 620412, "epoch": 7474} {"train_loss": -28.1525936126709, "global_step": 620413, "epoch": 7474} {"train_loss": -28.23748779296875, "global_step": 620414, "epoch": 7474} {"train_loss": -28.74806022644043, "global_step": 620415, "epoch": 7474} {"train_loss": -28.12375831604004, "global_step": 620416, "epoch": 7474} {"train_loss": -27.816486358642578, "global_step": 620417, "epoch": 7474} {"train_loss": -27.771026611328125, "global_step": 620418, "epoch": 7474} {"train_loss": -27.277280807495117, "global_step": 620419, "epoch": 7474} {"train_loss": -27.20841407775879, "global_step": 620420, "epoch": 7474} {"train_loss": -27.43228530883789, "global_step": 620421, "epoch": 7474} {"train_loss": -27.669513702392578, "global_step": 620422, "epoch": 7474} {"train_loss": -27.859643936157227, "global_step": 620423, "epoch": 7474} {"train_loss": -27.815896781094104, "global_step": 620424, "epoch": 7474, "val_loss": 6679821.5} {"train_loss": -27.504547119140625, "global_step": 620425, "epoch": 7475} {"train_loss": -26.167835235595703, "global_step": 620426, "epoch": 7475} {"train_loss": -27.0201473236084, "global_step": 620427, "epoch": 7475} {"train_loss": -27.1588134765625, "global_step": 620428, "epoch": 7475} {"train_loss": -27.166723251342773, "global_step": 620429, "epoch": 7475} {"train_loss": -27.228174209594727, "global_step": 620430, "epoch": 7475} {"train_loss": -26.883411407470703, "global_step": 620431, "epoch": 7475} {"train_loss": -27.643198013305664, "global_step": 620432, "epoch": 7475} {"train_loss": -27.2661075592041, "global_step": 620433, "epoch": 7475} {"train_loss": -27.117008209228516, "global_step": 620434, "epoch": 7475} {"train_loss": -27.74066734313965, "global_step": 620435, "epoch": 7475} {"train_loss": -27.60150146484375, "global_step": 620436, "epoch": 7475} {"train_loss": -27.436532974243164, "global_step": 620437, "epoch": 7475} {"train_loss": -27.37192153930664, "global_step": 620438, "epoch": 7475} {"train_loss": -27.490819931030273, "global_step": 620439, "epoch": 7475} {"train_loss": -27.7197265625, "global_step": 620440, "epoch": 7475} {"train_loss": -27.887765884399414, "global_step": 620441, "epoch": 7475} {"train_loss": -27.794782638549805, "global_step": 620442, "epoch": 7475} {"train_loss": -27.362686157226562, "global_step": 620443, "epoch": 7475} {"train_loss": -27.95387077331543, "global_step": 620444, "epoch": 7475} {"train_loss": -27.666412353515625, "global_step": 620445, "epoch": 7475} {"train_loss": -27.685256958007812, "global_step": 620446, "epoch": 7475} {"train_loss": -27.7224178314209, "global_step": 620447, "epoch": 7475} {"train_loss": -27.797061920166016, "global_step": 620448, "epoch": 7475} {"train_loss": -27.635730743408203, "global_step": 620449, "epoch": 7475} {"train_loss": -28.176843643188477, "global_step": 620450, "epoch": 7475} {"train_loss": -27.63899040222168, "global_step": 620451, "epoch": 7475} {"train_loss": -27.99993896484375, "global_step": 620452, "epoch": 7475} {"train_loss": -28.298358917236328, "global_step": 620453, "epoch": 7475} {"train_loss": -28.143829345703125, "global_step": 620454, "epoch": 7475} {"train_loss": -28.149824142456055, "global_step": 620455, "epoch": 7475} {"train_loss": -28.008142471313477, "global_step": 620456, "epoch": 7475} {"train_loss": -27.7148494720459, "global_step": 620457, "epoch": 7475} {"train_loss": -28.096282958984375, "global_step": 620458, "epoch": 7475} {"train_loss": -28.34563636779785, "global_step": 620459, "epoch": 7475} {"train_loss": -28.58735466003418, "global_step": 620460, "epoch": 7475} {"train_loss": -28.246063232421875, "global_step": 620461, "epoch": 7475} {"train_loss": -28.12841796875, "global_step": 620462, "epoch": 7475} {"train_loss": -28.353391647338867, "global_step": 620463, "epoch": 7475} {"train_loss": -28.300525665283203, "global_step": 620464, "epoch": 7475} {"train_loss": -28.139570236206055, "global_step": 620465, "epoch": 7475} {"train_loss": -28.341449737548828, "global_step": 620466, "epoch": 7475} {"train_loss": -28.582477569580078, "global_step": 620467, "epoch": 7475} {"train_loss": -27.899824142456055, "global_step": 620468, "epoch": 7475} {"train_loss": -28.243743896484375, "global_step": 620469, "epoch": 7475} {"train_loss": -28.266101837158203, "global_step": 620470, "epoch": 7475} {"train_loss": -28.436370849609375, "global_step": 620471, "epoch": 7475} {"train_loss": -27.87677001953125, "global_step": 620472, "epoch": 7475} {"train_loss": -28.25663185119629, "global_step": 620473, "epoch": 7475} {"train_loss": -28.5701904296875, "global_step": 620474, "epoch": 7475} {"train_loss": -28.2464656829834, "global_step": 620475, "epoch": 7475} {"train_loss": -28.228271484375, "global_step": 620476, "epoch": 7475} {"train_loss": -28.230731964111328, "global_step": 620477, "epoch": 7475} {"train_loss": -28.524871826171875, "global_step": 620478, "epoch": 7475} {"train_loss": -28.419281005859375, "global_step": 620479, "epoch": 7475} {"train_loss": -27.820043563842773, "global_step": 620480, "epoch": 7475} {"train_loss": -27.973724365234375, "global_step": 620481, "epoch": 7475} {"train_loss": -28.420129776000977, "global_step": 620482, "epoch": 7475} {"train_loss": -28.0851993560791, "global_step": 620483, "epoch": 7475} {"train_loss": -27.96481704711914, "global_step": 620484, "epoch": 7475} {"train_loss": -28.397476196289062, "global_step": 620485, "epoch": 7475} {"train_loss": -28.49567985534668, "global_step": 620486, "epoch": 7475} {"train_loss": -27.914413452148438, "global_step": 620487, "epoch": 7475} {"train_loss": -28.07428550720215, "global_step": 620488, "epoch": 7475} {"train_loss": -28.33562660217285, "global_step": 620489, "epoch": 7475} {"train_loss": -28.416141510009766, "global_step": 620490, "epoch": 7475} {"train_loss": -28.4724178314209, "global_step": 620491, "epoch": 7475} {"train_loss": -28.298139572143555, "global_step": 620492, "epoch": 7475} {"train_loss": -28.537357330322266, "global_step": 620493, "epoch": 7475} {"train_loss": -28.5141658782959, "global_step": 620494, "epoch": 7475} {"train_loss": -28.215600967407227, "global_step": 620495, "epoch": 7475} {"train_loss": -28.103734970092773, "global_step": 620496, "epoch": 7475} {"train_loss": -28.23345375061035, "global_step": 620497, "epoch": 7475} {"train_loss": -27.972705841064453, "global_step": 620498, "epoch": 7475} {"train_loss": -27.381362915039062, "global_step": 620499, "epoch": 7475} {"train_loss": -27.806486129760742, "global_step": 620500, "epoch": 7475} {"train_loss": -28.221954345703125, "global_step": 620501, "epoch": 7475} {"train_loss": -28.277027130126953, "global_step": 620502, "epoch": 7475} {"train_loss": -28.1972713470459, "global_step": 620503, "epoch": 7475} {"train_loss": -28.156543731689453, "global_step": 620504, "epoch": 7475} {"train_loss": -28.21827507019043, "global_step": 620505, "epoch": 7475} {"train_loss": -28.615310668945312, "global_step": 620506, "epoch": 7475} {"train_loss": -27.955033911279884, "global_step": 620507, "epoch": 7475, "val_loss": 6700095.0} {"train_loss": -25.902877807617188, "global_step": 620508, "epoch": 7476} {"train_loss": -22.792057037353516, "global_step": 620509, "epoch": 7476} {"train_loss": -24.914600372314453, "global_step": 620510, "epoch": 7476} {"train_loss": -25.222043991088867, "global_step": 620511, "epoch": 7476} {"train_loss": -25.152135848999023, "global_step": 620512, "epoch": 7476} {"train_loss": -26.492572784423828, "global_step": 620513, "epoch": 7476} {"train_loss": -26.766279220581055, "global_step": 620514, "epoch": 7476} {"train_loss": -25.787683486938477, "global_step": 620515, "epoch": 7476} {"train_loss": -26.770376205444336, "global_step": 620516, "epoch": 7476} {"train_loss": -26.774259567260742, "global_step": 620517, "epoch": 7476} {"train_loss": -26.969223022460938, "global_step": 620518, "epoch": 7476} {"train_loss": -26.56439781188965, "global_step": 620519, "epoch": 7476} {"train_loss": -26.9649658203125, "global_step": 620520, "epoch": 7476} {"train_loss": -27.099267959594727, "global_step": 620521, "epoch": 7476} {"train_loss": -26.794025421142578, "global_step": 620522, "epoch": 7476} {"train_loss": -27.37249183654785, "global_step": 620523, "epoch": 7476} {"train_loss": -27.2967586517334, "global_step": 620524, "epoch": 7476} {"train_loss": -27.19626808166504, "global_step": 620525, "epoch": 7476} {"train_loss": -27.16095542907715, "global_step": 620526, "epoch": 7476} {"train_loss": -27.500873565673828, "global_step": 620527, "epoch": 7476} {"train_loss": -26.839452743530273, "global_step": 620528, "epoch": 7476} {"train_loss": -27.281936645507812, "global_step": 620529, "epoch": 7476} {"train_loss": -27.545324325561523, "global_step": 620530, "epoch": 7476} {"train_loss": -27.662220001220703, "global_step": 620531, "epoch": 7476} {"train_loss": -27.737140655517578, "global_step": 620532, "epoch": 7476} {"train_loss": -27.871170043945312, "global_step": 620533, "epoch": 7476} {"train_loss": -27.49737548828125, "global_step": 620534, "epoch": 7476} {"train_loss": -28.108606338500977, "global_step": 620535, "epoch": 7476} {"train_loss": -27.463727951049805, "global_step": 620536, "epoch": 7476} {"train_loss": -27.82927894592285, "global_step": 620537, "epoch": 7476} {"train_loss": -27.725833892822266, "global_step": 620538, "epoch": 7476} {"train_loss": -27.54526710510254, "global_step": 620539, "epoch": 7476} {"train_loss": -27.83740234375, "global_step": 620540, "epoch": 7476} {"train_loss": -27.82057762145996, "global_step": 620541, "epoch": 7476} {"train_loss": -27.933252334594727, "global_step": 620542, "epoch": 7476} {"train_loss": -28.010639190673828, "global_step": 620543, "epoch": 7476} {"train_loss": -28.08041763305664, "global_step": 620544, "epoch": 7476} {"train_loss": -27.72515869140625, "global_step": 620545, "epoch": 7476} {"train_loss": -27.9620361328125, "global_step": 620546, "epoch": 7476} {"train_loss": -27.72755241394043, "global_step": 620547, "epoch": 7476} {"train_loss": -28.392309188842773, "global_step": 620548, "epoch": 7476} {"train_loss": -28.06512451171875, "global_step": 620549, "epoch": 7476} {"train_loss": -27.978958129882812, "global_step": 620550, "epoch": 7476} {"train_loss": -28.296630859375, "global_step": 620551, "epoch": 7476} {"train_loss": -28.276702880859375, "global_step": 620552, "epoch": 7476} {"train_loss": -28.164655685424805, "global_step": 620553, "epoch": 7476} {"train_loss": -28.046615600585938, "global_step": 620554, "epoch": 7476} {"train_loss": -28.04242515563965, "global_step": 620555, "epoch": 7476} {"train_loss": -28.459171295166016, "global_step": 620556, "epoch": 7476} {"train_loss": -28.121551513671875, "global_step": 620557, "epoch": 7476} {"train_loss": -28.01777458190918, "global_step": 620558, "epoch": 7476} {"train_loss": -28.39047622680664, "global_step": 620559, "epoch": 7476} {"train_loss": -28.219898223876953, "global_step": 620560, "epoch": 7476} {"train_loss": -28.59440040588379, "global_step": 620561, "epoch": 7476} {"train_loss": -28.381925582885742, "global_step": 620562, "epoch": 7476} {"train_loss": -28.539966583251953, "global_step": 620563, "epoch": 7476} {"train_loss": -28.109603881835938, "global_step": 620564, "epoch": 7476} {"train_loss": -28.288909912109375, "global_step": 620565, "epoch": 7476} {"train_loss": -28.26186180114746, "global_step": 620566, "epoch": 7476} {"train_loss": -28.223188400268555, "global_step": 620567, "epoch": 7476} {"train_loss": -28.281116485595703, "global_step": 620568, "epoch": 7476} {"train_loss": -28.26456069946289, "global_step": 620569, "epoch": 7476} {"train_loss": -28.10201072692871, "global_step": 620570, "epoch": 7476} {"train_loss": -28.609655380249023, "global_step": 620571, "epoch": 7476} {"train_loss": -28.359359741210938, "global_step": 620572, "epoch": 7476} {"train_loss": -28.265974044799805, "global_step": 620573, "epoch": 7476} {"train_loss": -28.637048721313477, "global_step": 620574, "epoch": 7476} {"train_loss": -28.18549919128418, "global_step": 620575, "epoch": 7476} {"train_loss": -28.59107780456543, "global_step": 620576, "epoch": 7476} {"train_loss": -28.276044845581055, "global_step": 620577, "epoch": 7476} {"train_loss": -28.196949005126953, "global_step": 620578, "epoch": 7476} {"train_loss": -28.596704483032227, "global_step": 620579, "epoch": 7476} {"train_loss": -28.406301498413086, "global_step": 620580, "epoch": 7476} {"train_loss": -28.667144775390625, "global_step": 620581, "epoch": 7476} {"train_loss": -28.342309951782227, "global_step": 620582, "epoch": 7476} {"train_loss": -28.088520050048828, "global_step": 620583, "epoch": 7476} {"train_loss": -27.658432006835938, "global_step": 620584, "epoch": 7476} {"train_loss": -27.75162124633789, "global_step": 620585, "epoch": 7476} {"train_loss": -27.928476333618164, "global_step": 620586, "epoch": 7476} {"train_loss": -28.013538360595703, "global_step": 620587, "epoch": 7476} {"train_loss": -28.116453170776367, "global_step": 620588, "epoch": 7476} {"train_loss": -28.058273315429688, "global_step": 620589, "epoch": 7476} {"train_loss": -27.67065252740699, "global_step": 620590, "epoch": 7476, "val_loss": 6674836.0} {"train_loss": -27.001235961914062, "global_step": 620591, "epoch": 7477} {"train_loss": -25.876134872436523, "global_step": 620592, "epoch": 7477} {"train_loss": -23.990217208862305, "global_step": 620593, "epoch": 7477} {"train_loss": -24.52536964416504, "global_step": 620594, "epoch": 7477} {"train_loss": -26.616931915283203, "global_step": 620595, "epoch": 7477} {"train_loss": -24.570831298828125, "global_step": 620596, "epoch": 7477} {"train_loss": -27.687973022460938, "global_step": 620597, "epoch": 7477} {"train_loss": -25.3742618560791, "global_step": 620598, "epoch": 7477} {"train_loss": -26.868030548095703, "global_step": 620599, "epoch": 7477} {"train_loss": -26.43354606628418, "global_step": 620600, "epoch": 7477} {"train_loss": -26.217605590820312, "global_step": 620601, "epoch": 7477} {"train_loss": -27.1043758392334, "global_step": 620602, "epoch": 7477} {"train_loss": -26.932092666625977, "global_step": 620603, "epoch": 7477} {"train_loss": -27.49609375, "global_step": 620604, "epoch": 7477} {"train_loss": -26.63779640197754, "global_step": 620605, "epoch": 7477} {"train_loss": -26.619993209838867, "global_step": 620606, "epoch": 7477} {"train_loss": -27.326526641845703, "global_step": 620607, "epoch": 7477} {"train_loss": -27.1287841796875, "global_step": 620608, "epoch": 7477} {"train_loss": -27.313308715820312, "global_step": 620609, "epoch": 7477} {"train_loss": -27.198532104492188, "global_step": 620610, "epoch": 7477} {"train_loss": -27.404361724853516, "global_step": 620611, "epoch": 7477} {"train_loss": -27.495880126953125, "global_step": 620612, "epoch": 7477} {"train_loss": -27.015485763549805, "global_step": 620613, "epoch": 7477} {"train_loss": -27.65089225769043, "global_step": 620614, "epoch": 7477} {"train_loss": -26.965259552001953, "global_step": 620615, "epoch": 7477} {"train_loss": -27.39637565612793, "global_step": 620616, "epoch": 7477} {"train_loss": -27.274829864501953, "global_step": 620617, "epoch": 7477} {"train_loss": -27.40679931640625, "global_step": 620618, "epoch": 7477} {"train_loss": -27.629779815673828, "global_step": 620619, "epoch": 7477} {"train_loss": -27.733112335205078, "global_step": 620620, "epoch": 7477} {"train_loss": -27.562789916992188, "global_step": 620621, "epoch": 7477} {"train_loss": -27.511550903320312, "global_step": 620622, "epoch": 7477} {"train_loss": -27.465063095092773, "global_step": 620623, "epoch": 7477} {"train_loss": -27.44745445251465, "global_step": 620624, "epoch": 7477} {"train_loss": -27.495254516601562, "global_step": 620625, "epoch": 7477} {"train_loss": -27.7484188079834, "global_step": 620626, "epoch": 7477} {"train_loss": -27.675113677978516, "global_step": 620627, "epoch": 7477} {"train_loss": -27.5233211517334, "global_step": 620628, "epoch": 7477} {"train_loss": -27.82406997680664, "global_step": 620629, "epoch": 7477} {"train_loss": -27.80560874938965, "global_step": 620630, "epoch": 7477} {"train_loss": -27.7901611328125, "global_step": 620631, "epoch": 7477} {"train_loss": -27.969945907592773, "global_step": 620632, "epoch": 7477} {"train_loss": -27.794946670532227, "global_step": 620633, "epoch": 7477} {"train_loss": -27.7082462310791, "global_step": 620634, "epoch": 7477} {"train_loss": -27.91773796081543, "global_step": 620635, "epoch": 7477} {"train_loss": -27.672433853149414, "global_step": 620636, "epoch": 7477} {"train_loss": -27.62647819519043, "global_step": 620637, "epoch": 7477} {"train_loss": -28.234573364257812, "global_step": 620638, "epoch": 7477} {"train_loss": -27.649036407470703, "global_step": 620639, "epoch": 7477} {"train_loss": -28.078876495361328, "global_step": 620640, "epoch": 7477} {"train_loss": -28.29962730407715, "global_step": 620641, "epoch": 7477} {"train_loss": -28.1295108795166, "global_step": 620642, "epoch": 7477} {"train_loss": -28.12764549255371, "global_step": 620643, "epoch": 7477} {"train_loss": -27.917346954345703, "global_step": 620644, "epoch": 7477} {"train_loss": -28.307336807250977, "global_step": 620645, "epoch": 7477} {"train_loss": -28.401966094970703, "global_step": 620646, "epoch": 7477} {"train_loss": -28.053287506103516, "global_step": 620647, "epoch": 7477} {"train_loss": -28.0402889251709, "global_step": 620648, "epoch": 7477} {"train_loss": -27.834577560424805, "global_step": 620649, "epoch": 7477} {"train_loss": -28.49885368347168, "global_step": 620650, "epoch": 7477} {"train_loss": -28.453943252563477, "global_step": 620651, "epoch": 7477} {"train_loss": -28.347471237182617, "global_step": 620652, "epoch": 7477} {"train_loss": -28.021331787109375, "global_step": 620653, "epoch": 7477} {"train_loss": -27.918127059936523, "global_step": 620654, "epoch": 7477} {"train_loss": -28.608352661132812, "global_step": 620655, "epoch": 7477} {"train_loss": -28.344669342041016, "global_step": 620656, "epoch": 7477} {"train_loss": -28.44135093688965, "global_step": 620657, "epoch": 7477} {"train_loss": -28.45863914489746, "global_step": 620658, "epoch": 7477} {"train_loss": -28.12055778503418, "global_step": 620659, "epoch": 7477} {"train_loss": -28.2402400970459, "global_step": 620660, "epoch": 7477} {"train_loss": -28.5416259765625, "global_step": 620661, "epoch": 7477} {"train_loss": -27.909154891967773, "global_step": 620662, "epoch": 7477} {"train_loss": -28.49470329284668, "global_step": 620663, "epoch": 7477} {"train_loss": -27.942768096923828, "global_step": 620664, "epoch": 7477} {"train_loss": -27.806400299072266, "global_step": 620665, "epoch": 7477} {"train_loss": -28.253149032592773, "global_step": 620666, "epoch": 7477} {"train_loss": -27.84992790222168, "global_step": 620667, "epoch": 7477} {"train_loss": -28.428369522094727, "global_step": 620668, "epoch": 7477} {"train_loss": -28.1239013671875, "global_step": 620669, "epoch": 7477} {"train_loss": -28.138294219970703, "global_step": 620670, "epoch": 7477} {"train_loss": -28.327035903930664, "global_step": 620671, "epoch": 7477} {"train_loss": -28.69842529296875, "global_step": 620672, "epoch": 7477} {"train_loss": -27.585054144801862, "global_step": 620673, "epoch": 7477, "val_loss": 6611997.0} {"train_loss": -26.5712890625, "global_step": 620674, "epoch": 7478} {"train_loss": -24.97287940979004, "global_step": 620675, "epoch": 7478} {"train_loss": -26.306615829467773, "global_step": 620676, "epoch": 7478} {"train_loss": -28.124242782592773, "global_step": 620677, "epoch": 7478} {"train_loss": -26.853912353515625, "global_step": 620678, "epoch": 7478} {"train_loss": -26.851959228515625, "global_step": 620679, "epoch": 7478} {"train_loss": -27.7763671875, "global_step": 620680, "epoch": 7478} {"train_loss": -27.416290283203125, "global_step": 620681, "epoch": 7478} {"train_loss": -27.569122314453125, "global_step": 620682, "epoch": 7478} {"train_loss": -27.56626319885254, "global_step": 620683, "epoch": 7478} {"train_loss": -27.13677406311035, "global_step": 620684, "epoch": 7478} {"train_loss": -27.563852310180664, "global_step": 620685, "epoch": 7478} {"train_loss": -27.822534561157227, "global_step": 620686, "epoch": 7478} {"train_loss": -27.96442222595215, "global_step": 620687, "epoch": 7478} {"train_loss": -28.00253677368164, "global_step": 620688, "epoch": 7478} {"train_loss": -27.813283920288086, "global_step": 620689, "epoch": 7478} {"train_loss": -27.53961181640625, "global_step": 620690, "epoch": 7478} {"train_loss": -27.5891170501709, "global_step": 620691, "epoch": 7478} {"train_loss": -27.952899932861328, "global_step": 620692, "epoch": 7478} {"train_loss": -28.051761627197266, "global_step": 620693, "epoch": 7478} {"train_loss": -27.932209014892578, "global_step": 620694, "epoch": 7478} {"train_loss": -27.975255966186523, "global_step": 620695, "epoch": 7478} {"train_loss": -28.094268798828125, "global_step": 620696, "epoch": 7478} {"train_loss": -28.1810359954834, "global_step": 620697, "epoch": 7478} {"train_loss": -27.8629207611084, "global_step": 620698, "epoch": 7478} {"train_loss": -28.486068725585938, "global_step": 620699, "epoch": 7478} {"train_loss": -27.940078735351562, "global_step": 620700, "epoch": 7478} {"train_loss": -28.24698829650879, "global_step": 620701, "epoch": 7478} {"train_loss": -28.045352935791016, "global_step": 620702, "epoch": 7478} {"train_loss": -28.193466186523438, "global_step": 620703, "epoch": 7478} {"train_loss": -28.803068161010742, "global_step": 620704, "epoch": 7478} {"train_loss": -28.086633682250977, "global_step": 620705, "epoch": 7478} {"train_loss": -28.2783145904541, "global_step": 620706, "epoch": 7478} {"train_loss": -28.02558708190918, "global_step": 620707, "epoch": 7478} {"train_loss": -28.116165161132812, "global_step": 620708, "epoch": 7478} {"train_loss": -28.296667098999023, "global_step": 620709, "epoch": 7478} {"train_loss": -28.429086685180664, "global_step": 620710, "epoch": 7478} {"train_loss": -28.413543701171875, "global_step": 620711, "epoch": 7478} {"train_loss": -28.57732582092285, "global_step": 620712, "epoch": 7478} {"train_loss": -28.7076358795166, "global_step": 620713, "epoch": 7478} {"train_loss": -28.635650634765625, "global_step": 620714, "epoch": 7478} {"train_loss": -28.568368911743164, "global_step": 620715, "epoch": 7478} {"train_loss": -28.263608932495117, "global_step": 620716, "epoch": 7478} {"train_loss": -28.26944351196289, "global_step": 620717, "epoch": 7478} {"train_loss": -28.22554588317871, "global_step": 620718, "epoch": 7478} {"train_loss": -28.340543746948242, "global_step": 620719, "epoch": 7478} {"train_loss": -28.48489761352539, "global_step": 620720, "epoch": 7478} {"train_loss": -28.458362579345703, "global_step": 620721, "epoch": 7478} {"train_loss": -28.66000747680664, "global_step": 620722, "epoch": 7478} {"train_loss": -28.273834228515625, "global_step": 620723, "epoch": 7478} {"train_loss": -28.50457191467285, "global_step": 620724, "epoch": 7478} {"train_loss": -28.374530792236328, "global_step": 620725, "epoch": 7478} {"train_loss": -28.38449478149414, "global_step": 620726, "epoch": 7478} {"train_loss": -27.983007431030273, "global_step": 620727, "epoch": 7478} {"train_loss": -28.47273063659668, "global_step": 620728, "epoch": 7478} {"train_loss": -28.286407470703125, "global_step": 620729, "epoch": 7478} {"train_loss": -28.848180770874023, "global_step": 620730, "epoch": 7478} {"train_loss": -28.273664474487305, "global_step": 620731, "epoch": 7478} {"train_loss": -28.440628051757812, "global_step": 620732, "epoch": 7478} {"train_loss": -28.71466636657715, "global_step": 620733, "epoch": 7478} {"train_loss": -28.125186920166016, "global_step": 620734, "epoch": 7478} {"train_loss": -28.753950119018555, "global_step": 620735, "epoch": 7478} {"train_loss": -28.3832950592041, "global_step": 620736, "epoch": 7478} {"train_loss": -28.012418746948242, "global_step": 620737, "epoch": 7478} {"train_loss": -27.902002334594727, "global_step": 620738, "epoch": 7478} {"train_loss": -28.06081199645996, "global_step": 620739, "epoch": 7478} {"train_loss": -28.181781768798828, "global_step": 620740, "epoch": 7478} {"train_loss": -27.663558959960938, "global_step": 620741, "epoch": 7478} {"train_loss": -27.70045280456543, "global_step": 620742, "epoch": 7478} {"train_loss": -28.051441192626953, "global_step": 620743, "epoch": 7478} {"train_loss": -28.04648780822754, "global_step": 620744, "epoch": 7478} {"train_loss": -28.069177627563477, "global_step": 620745, "epoch": 7478} {"train_loss": -27.716968536376953, "global_step": 620746, "epoch": 7478} {"train_loss": -27.634571075439453, "global_step": 620747, "epoch": 7478} {"train_loss": -28.2955265045166, "global_step": 620748, "epoch": 7478} {"train_loss": -28.081012725830078, "global_step": 620749, "epoch": 7478} {"train_loss": -28.243621826171875, "global_step": 620750, "epoch": 7478} {"train_loss": -27.93378257751465, "global_step": 620751, "epoch": 7478} {"train_loss": -28.073266983032227, "global_step": 620752, "epoch": 7478} {"train_loss": -28.08619499206543, "global_step": 620753, "epoch": 7478} {"train_loss": -27.902515411376953, "global_step": 620754, "epoch": 7478} {"train_loss": -28.31873893737793, "global_step": 620755, "epoch": 7478} {"train_loss": -28.025546430105187, "global_step": 620756, "epoch": 7478, "val_loss": 6683294.0} {"train_loss": -27.349369049072266, "global_step": 620757, "epoch": 7479} {"train_loss": -27.361316680908203, "global_step": 620758, "epoch": 7479} {"train_loss": -27.00031089782715, "global_step": 620759, "epoch": 7479} {"train_loss": -27.641223907470703, "global_step": 620760, "epoch": 7479} {"train_loss": -27.68486976623535, "global_step": 620761, "epoch": 7479} {"train_loss": -26.99755859375, "global_step": 620762, "epoch": 7479} {"train_loss": -27.695404052734375, "global_step": 620763, "epoch": 7479} {"train_loss": -27.47334098815918, "global_step": 620764, "epoch": 7479} {"train_loss": -27.614459991455078, "global_step": 620765, "epoch": 7479} {"train_loss": -27.52168083190918, "global_step": 620766, "epoch": 7479} {"train_loss": -27.24928855895996, "global_step": 620767, "epoch": 7479} {"train_loss": -27.945343017578125, "global_step": 620768, "epoch": 7479} {"train_loss": -27.526227951049805, "global_step": 620769, "epoch": 7479} {"train_loss": -27.957538604736328, "global_step": 620770, "epoch": 7479} {"train_loss": -27.914804458618164, "global_step": 620771, "epoch": 7479} {"train_loss": -28.001434326171875, "global_step": 620772, "epoch": 7479} {"train_loss": -27.770761489868164, "global_step": 620773, "epoch": 7479} {"train_loss": -28.086353302001953, "global_step": 620774, "epoch": 7479} {"train_loss": -27.819366455078125, "global_step": 620775, "epoch": 7479} {"train_loss": -27.84783935546875, "global_step": 620776, "epoch": 7479} {"train_loss": -28.055419921875, "global_step": 620777, "epoch": 7479} {"train_loss": -27.8830509185791, "global_step": 620778, "epoch": 7479} {"train_loss": -27.911819458007812, "global_step": 620779, "epoch": 7479} {"train_loss": -28.274473190307617, "global_step": 620780, "epoch": 7479} {"train_loss": -28.099109649658203, "global_step": 620781, "epoch": 7479} {"train_loss": -27.92778968811035, "global_step": 620782, "epoch": 7479} {"train_loss": -27.764881134033203, "global_step": 620783, "epoch": 7479} {"train_loss": -27.58623695373535, "global_step": 620784, "epoch": 7479} {"train_loss": -28.162261962890625, "global_step": 620785, "epoch": 7479} {"train_loss": -27.839771270751953, "global_step": 620786, "epoch": 7479} {"train_loss": -28.011768341064453, "global_step": 620787, "epoch": 7479} {"train_loss": -27.9553165435791, "global_step": 620788, "epoch": 7479} {"train_loss": -28.059980392456055, "global_step": 620789, "epoch": 7479} {"train_loss": -28.050491333007812, "global_step": 620790, "epoch": 7479} {"train_loss": -27.960376739501953, "global_step": 620791, "epoch": 7479} {"train_loss": -28.00068473815918, "global_step": 620792, "epoch": 7479} {"train_loss": -28.221481323242188, "global_step": 620793, "epoch": 7479} {"train_loss": -28.18112564086914, "global_step": 620794, "epoch": 7479} {"train_loss": -28.139942169189453, "global_step": 620795, "epoch": 7479} {"train_loss": -28.247604370117188, "global_step": 620796, "epoch": 7479} {"train_loss": -27.8824462890625, "global_step": 620797, "epoch": 7479} {"train_loss": -28.140478134155273, "global_step": 620798, "epoch": 7479} {"train_loss": -28.410924911499023, "global_step": 620799, "epoch": 7479} {"train_loss": -28.38153648376465, "global_step": 620800, "epoch": 7479} {"train_loss": -28.055805206298828, "global_step": 620801, "epoch": 7479} {"train_loss": -28.275684356689453, "global_step": 620802, "epoch": 7479} {"train_loss": -28.37440299987793, "global_step": 620803, "epoch": 7479} {"train_loss": -28.181415557861328, "global_step": 620804, "epoch": 7479} {"train_loss": -28.511493682861328, "global_step": 620805, "epoch": 7479} {"train_loss": -28.3295841217041, "global_step": 620806, "epoch": 7479} {"train_loss": -28.264423370361328, "global_step": 620807, "epoch": 7479} {"train_loss": -28.45197105407715, "global_step": 620808, "epoch": 7479} {"train_loss": -28.526281356811523, "global_step": 620809, "epoch": 7479} {"train_loss": -28.47187614440918, "global_step": 620810, "epoch": 7479} {"train_loss": -28.399616241455078, "global_step": 620811, "epoch": 7479} {"train_loss": -28.4668025970459, "global_step": 620812, "epoch": 7479} {"train_loss": -28.13582420349121, "global_step": 620813, "epoch": 7479} {"train_loss": -28.641265869140625, "global_step": 620814, "epoch": 7479} {"train_loss": -28.38161277770996, "global_step": 620815, "epoch": 7479} {"train_loss": -28.199451446533203, "global_step": 620816, "epoch": 7479} {"train_loss": -28.059741973876953, "global_step": 620817, "epoch": 7479} {"train_loss": -28.04387855529785, "global_step": 620818, "epoch": 7479} {"train_loss": -28.195850372314453, "global_step": 620819, "epoch": 7479} {"train_loss": -27.6118106842041, "global_step": 620820, "epoch": 7479} {"train_loss": -28.218585968017578, "global_step": 620821, "epoch": 7479} {"train_loss": -27.892240524291992, "global_step": 620822, "epoch": 7479} {"train_loss": -28.02192497253418, "global_step": 620823, "epoch": 7479} {"train_loss": -28.342626571655273, "global_step": 620824, "epoch": 7479} {"train_loss": -28.067251205444336, "global_step": 620825, "epoch": 7479} {"train_loss": -28.014379501342773, "global_step": 620826, "epoch": 7479} {"train_loss": -28.196075439453125, "global_step": 620827, "epoch": 7479} {"train_loss": -28.1617374420166, "global_step": 620828, "epoch": 7479} {"train_loss": -27.953824996948242, "global_step": 620829, "epoch": 7479} {"train_loss": -28.591222763061523, "global_step": 620830, "epoch": 7479} {"train_loss": -27.825429916381836, "global_step": 620831, "epoch": 7479} {"train_loss": -28.345102310180664, "global_step": 620832, "epoch": 7479} {"train_loss": -27.990066528320312, "global_step": 620833, "epoch": 7479} {"train_loss": -27.93060302734375, "global_step": 620834, "epoch": 7479} {"train_loss": -28.31307029724121, "global_step": 620835, "epoch": 7479} {"train_loss": -28.121068954467773, "global_step": 620836, "epoch": 7479} {"train_loss": -28.05869483947754, "global_step": 620837, "epoch": 7479} {"train_loss": -27.703428268432617, "global_step": 620838, "epoch": 7479} {"train_loss": -28.01234233810241, "global_step": 620839, "epoch": 7479, "val_loss": 6717148.0} {"train_loss": -27.446569442749023, "global_step": 620840, "epoch": 7480} {"train_loss": -26.129779815673828, "global_step": 620841, "epoch": 7480} {"train_loss": -26.06342124938965, "global_step": 620842, "epoch": 7480} {"train_loss": -27.610794067382812, "global_step": 620843, "epoch": 7480} {"train_loss": -27.294031143188477, "global_step": 620844, "epoch": 7480} {"train_loss": -27.7685604095459, "global_step": 620845, "epoch": 7480} {"train_loss": -27.6398868560791, "global_step": 620846, "epoch": 7480} {"train_loss": -27.775012969970703, "global_step": 620847, "epoch": 7480} {"train_loss": -27.165729522705078, "global_step": 620848, "epoch": 7480} {"train_loss": -27.69099235534668, "global_step": 620849, "epoch": 7480} {"train_loss": -27.2215576171875, "global_step": 620850, "epoch": 7480} {"train_loss": -28.031789779663086, "global_step": 620851, "epoch": 7480} {"train_loss": -27.3845157623291, "global_step": 620852, "epoch": 7480} {"train_loss": -27.910978317260742, "global_step": 620853, "epoch": 7480} {"train_loss": -27.687896728515625, "global_step": 620854, "epoch": 7480} {"train_loss": -27.322477340698242, "global_step": 620855, "epoch": 7480} {"train_loss": -27.86175537109375, "global_step": 620856, "epoch": 7480} {"train_loss": -27.878021240234375, "global_step": 620857, "epoch": 7480} {"train_loss": -27.796850204467773, "global_step": 620858, "epoch": 7480} {"train_loss": -27.95220947265625, "global_step": 620859, "epoch": 7480} {"train_loss": -27.843488693237305, "global_step": 620860, "epoch": 7480} {"train_loss": -27.691791534423828, "global_step": 620861, "epoch": 7480} {"train_loss": -28.03031349182129, "global_step": 620862, "epoch": 7480} {"train_loss": -28.025671005249023, "global_step": 620863, "epoch": 7480} {"train_loss": -27.942371368408203, "global_step": 620864, "epoch": 7480} {"train_loss": -27.749561309814453, "global_step": 620865, "epoch": 7480} {"train_loss": -27.73026466369629, "global_step": 620866, "epoch": 7480} {"train_loss": -27.664030075073242, "global_step": 620867, "epoch": 7480} {"train_loss": -27.750085830688477, "global_step": 620868, "epoch": 7480} {"train_loss": -28.114973068237305, "global_step": 620869, "epoch": 7480} {"train_loss": -28.22933006286621, "global_step": 620870, "epoch": 7480} {"train_loss": -27.9392147064209, "global_step": 620871, "epoch": 7480} {"train_loss": -27.99100112915039, "global_step": 620872, "epoch": 7480} {"train_loss": -27.801252365112305, "global_step": 620873, "epoch": 7480} {"train_loss": -27.925048828125, "global_step": 620874, "epoch": 7480} {"train_loss": -27.99184226989746, "global_step": 620875, "epoch": 7480} {"train_loss": -27.42229652404785, "global_step": 620876, "epoch": 7480} {"train_loss": -27.84906578063965, "global_step": 620877, "epoch": 7480} {"train_loss": -28.255523681640625, "global_step": 620878, "epoch": 7480} {"train_loss": -28.399646759033203, "global_step": 620879, "epoch": 7480} {"train_loss": -28.043027877807617, "global_step": 620880, "epoch": 7480} {"train_loss": -28.523508071899414, "global_step": 620881, "epoch": 7480} {"train_loss": -28.217260360717773, "global_step": 620882, "epoch": 7480} {"train_loss": -28.113162994384766, "global_step": 620883, "epoch": 7480} {"train_loss": -28.381744384765625, "global_step": 620884, "epoch": 7480} {"train_loss": -28.113147735595703, "global_step": 620885, "epoch": 7480} {"train_loss": -28.301054000854492, "global_step": 620886, "epoch": 7480} {"train_loss": -28.49090576171875, "global_step": 620887, "epoch": 7480} {"train_loss": -28.05360221862793, "global_step": 620888, "epoch": 7480} {"train_loss": -28.130359649658203, "global_step": 620889, "epoch": 7480} {"train_loss": -28.153284072875977, "global_step": 620890, "epoch": 7480} {"train_loss": -28.148862838745117, "global_step": 620891, "epoch": 7480} {"train_loss": -28.25274658203125, "global_step": 620892, "epoch": 7480} {"train_loss": -28.148862838745117, "global_step": 620893, "epoch": 7480} {"train_loss": -28.43638038635254, "global_step": 620894, "epoch": 7480} {"train_loss": -27.729846954345703, "global_step": 620895, "epoch": 7480} {"train_loss": -27.576154708862305, "global_step": 620896, "epoch": 7480} {"train_loss": -27.788715362548828, "global_step": 620897, "epoch": 7480} {"train_loss": -27.705774307250977, "global_step": 620898, "epoch": 7480} {"train_loss": -28.02168083190918, "global_step": 620899, "epoch": 7480} {"train_loss": -28.008039474487305, "global_step": 620900, "epoch": 7480} {"train_loss": -28.227476119995117, "global_step": 620901, "epoch": 7480} {"train_loss": -27.741607666015625, "global_step": 620902, "epoch": 7480} {"train_loss": -28.111408233642578, "global_step": 620903, "epoch": 7480} {"train_loss": -28.148040771484375, "global_step": 620904, "epoch": 7480} {"train_loss": -28.208982467651367, "global_step": 620905, "epoch": 7480} {"train_loss": -28.107030868530273, "global_step": 620906, "epoch": 7480} {"train_loss": -28.137903213500977, "global_step": 620907, "epoch": 7480} {"train_loss": -28.10601234436035, "global_step": 620908, "epoch": 7480} {"train_loss": -28.148099899291992, "global_step": 620909, "epoch": 7480} {"train_loss": -27.940298080444336, "global_step": 620910, "epoch": 7480} {"train_loss": -28.069684982299805, "global_step": 620911, "epoch": 7480} {"train_loss": -28.112539291381836, "global_step": 620912, "epoch": 7480} {"train_loss": -28.2051944732666, "global_step": 620913, "epoch": 7480} {"train_loss": -28.537708282470703, "global_step": 620914, "epoch": 7480} {"train_loss": -28.274892807006836, "global_step": 620915, "epoch": 7480} {"train_loss": -28.255020141601562, "global_step": 620916, "epoch": 7480} {"train_loss": -28.33697509765625, "global_step": 620917, "epoch": 7480} {"train_loss": -28.47236442565918, "global_step": 620918, "epoch": 7480} {"train_loss": -28.44219398498535, "global_step": 620919, "epoch": 7480} {"train_loss": -28.590173721313477, "global_step": 620920, "epoch": 7480} {"train_loss": -28.348386764526367, "global_step": 620921, "epoch": 7480} {"train_loss": -27.94940514162362, "global_step": 620922, "epoch": 7480, "val_loss": 6654355.5} {"train_loss": -27.95151710510254, "global_step": 620923, "epoch": 7481} {"train_loss": -28.134580612182617, "global_step": 620924, "epoch": 7481} {"train_loss": -28.047452926635742, "global_step": 620925, "epoch": 7481} {"train_loss": -28.043594360351562, "global_step": 620926, "epoch": 7481} {"train_loss": -28.362836837768555, "global_step": 620927, "epoch": 7481} {"train_loss": -27.709394454956055, "global_step": 620928, "epoch": 7481} {"train_loss": -28.08005714416504, "global_step": 620929, "epoch": 7481} {"train_loss": -27.664737701416016, "global_step": 620930, "epoch": 7481} {"train_loss": -28.091093063354492, "global_step": 620931, "epoch": 7481} {"train_loss": -27.828205108642578, "global_step": 620932, "epoch": 7481} {"train_loss": -27.78278923034668, "global_step": 620933, "epoch": 7481} {"train_loss": -28.46956443786621, "global_step": 620934, "epoch": 7481} {"train_loss": -27.88116455078125, "global_step": 620935, "epoch": 7481} {"train_loss": -28.107467651367188, "global_step": 620936, "epoch": 7481} {"train_loss": -28.029062271118164, "global_step": 620937, "epoch": 7481} {"train_loss": -28.275888442993164, "global_step": 620938, "epoch": 7481} {"train_loss": -28.16206169128418, "global_step": 620939, "epoch": 7481} {"train_loss": -28.221546173095703, "global_step": 620940, "epoch": 7481} {"train_loss": -28.261859893798828, "global_step": 620941, "epoch": 7481} {"train_loss": -28.216028213500977, "global_step": 620942, "epoch": 7481} {"train_loss": -28.000354766845703, "global_step": 620943, "epoch": 7481} {"train_loss": -28.33380699157715, "global_step": 620944, "epoch": 7481} {"train_loss": -28.29949951171875, "global_step": 620945, "epoch": 7481} {"train_loss": -28.394529342651367, "global_step": 620946, "epoch": 7481} {"train_loss": -28.200586318969727, "global_step": 620947, "epoch": 7481} {"train_loss": -27.9664306640625, "global_step": 620948, "epoch": 7481} {"train_loss": -28.36077880859375, "global_step": 620949, "epoch": 7481} {"train_loss": -28.019506454467773, "global_step": 620950, "epoch": 7481} {"train_loss": -28.234594345092773, "global_step": 620951, "epoch": 7481} {"train_loss": -28.310544967651367, "global_step": 620952, "epoch": 7481} {"train_loss": -28.0677433013916, "global_step": 620953, "epoch": 7481} {"train_loss": -28.108701705932617, "global_step": 620954, "epoch": 7481} {"train_loss": -28.18649673461914, "global_step": 620955, "epoch": 7481} {"train_loss": -28.63701820373535, "global_step": 620956, "epoch": 7481} {"train_loss": -28.31427001953125, "global_step": 620957, "epoch": 7481} {"train_loss": -28.2133846282959, "global_step": 620958, "epoch": 7481} {"train_loss": -28.380735397338867, "global_step": 620959, "epoch": 7481} {"train_loss": -28.506528854370117, "global_step": 620960, "epoch": 7481} {"train_loss": -28.43369483947754, "global_step": 620961, "epoch": 7481} {"train_loss": -28.52601432800293, "global_step": 620962, "epoch": 7481} {"train_loss": -28.345006942749023, "global_step": 620963, "epoch": 7481} {"train_loss": -28.75850486755371, "global_step": 620964, "epoch": 7481} {"train_loss": -28.335386276245117, "global_step": 620965, "epoch": 7481} {"train_loss": -27.916004180908203, "global_step": 620966, "epoch": 7481} {"train_loss": -28.452896118164062, "global_step": 620967, "epoch": 7481} {"train_loss": -28.15497398376465, "global_step": 620968, "epoch": 7481} {"train_loss": -28.308019638061523, "global_step": 620969, "epoch": 7481} {"train_loss": -28.5762939453125, "global_step": 620970, "epoch": 7481} {"train_loss": -28.5460147857666, "global_step": 620971, "epoch": 7481} {"train_loss": -28.290159225463867, "global_step": 620972, "epoch": 7481} {"train_loss": -28.416784286499023, "global_step": 620973, "epoch": 7481} {"train_loss": -28.560901641845703, "global_step": 620974, "epoch": 7481} {"train_loss": -28.3430233001709, "global_step": 620975, "epoch": 7481} {"train_loss": -28.383026123046875, "global_step": 620976, "epoch": 7481} {"train_loss": -28.3375244140625, "global_step": 620977, "epoch": 7481} {"train_loss": -28.10390281677246, "global_step": 620978, "epoch": 7481} {"train_loss": -28.127466201782227, "global_step": 620979, "epoch": 7481} {"train_loss": -28.2578125, "global_step": 620980, "epoch": 7481} {"train_loss": -27.94632911682129, "global_step": 620981, "epoch": 7481} {"train_loss": -28.053754806518555, "global_step": 620982, "epoch": 7481} {"train_loss": -27.596166610717773, "global_step": 620983, "epoch": 7481} {"train_loss": -28.238821029663086, "global_step": 620984, "epoch": 7481} {"train_loss": -27.96416664123535, "global_step": 620985, "epoch": 7481} {"train_loss": -28.176910400390625, "global_step": 620986, "epoch": 7481} {"train_loss": -28.328882217407227, "global_step": 620987, "epoch": 7481} {"train_loss": -27.937397003173828, "global_step": 620988, "epoch": 7481} {"train_loss": -27.731281280517578, "global_step": 620989, "epoch": 7481} {"train_loss": -28.056943893432617, "global_step": 620990, "epoch": 7481} {"train_loss": -27.644323348999023, "global_step": 620991, "epoch": 7481} {"train_loss": -28.132709503173828, "global_step": 620992, "epoch": 7481} {"train_loss": -28.188465118408203, "global_step": 620993, "epoch": 7481} {"train_loss": -27.992420196533203, "global_step": 620994, "epoch": 7481} {"train_loss": -27.684982299804688, "global_step": 620995, "epoch": 7481} {"train_loss": -28.204931259155273, "global_step": 620996, "epoch": 7481} {"train_loss": -28.00372886657715, "global_step": 620997, "epoch": 7481} {"train_loss": -28.050779342651367, "global_step": 620998, "epoch": 7481} {"train_loss": -28.623254776000977, "global_step": 620999, "epoch": 7481} {"train_loss": -27.85693359375, "global_step": 621000, "epoch": 7481} {"train_loss": -28.315643310546875, "global_step": 621001, "epoch": 7481} {"train_loss": -27.810382843017578, "global_step": 621002, "epoch": 7481} {"train_loss": -28.299856185913086, "global_step": 621003, "epoch": 7481} {"train_loss": -27.956119537353516, "global_step": 621004, "epoch": 7481} {"train_loss": -28.164120685623352, "global_step": 621005, "epoch": 7481, "val_loss": 6673681.0} {"train_loss": -27.428943634033203, "global_step": 621006, "epoch": 7482} {"train_loss": -28.191843032836914, "global_step": 621007, "epoch": 7482} {"train_loss": -27.626562118530273, "global_step": 621008, "epoch": 7482} {"train_loss": -27.112268447875977, "global_step": 621009, "epoch": 7482} {"train_loss": -27.821439743041992, "global_step": 621010, "epoch": 7482} {"train_loss": -27.647336959838867, "global_step": 621011, "epoch": 7482} {"train_loss": -27.890411376953125, "global_step": 621012, "epoch": 7482} {"train_loss": -27.970922470092773, "global_step": 621013, "epoch": 7482} {"train_loss": -27.79068946838379, "global_step": 621014, "epoch": 7482} {"train_loss": -26.997365951538086, "global_step": 621015, "epoch": 7482} {"train_loss": -27.88570213317871, "global_step": 621016, "epoch": 7482} {"train_loss": -27.726835250854492, "global_step": 621017, "epoch": 7482} {"train_loss": -27.983936309814453, "global_step": 621018, "epoch": 7482} {"train_loss": -27.517133712768555, "global_step": 621019, "epoch": 7482} {"train_loss": -27.5098819732666, "global_step": 621020, "epoch": 7482} {"train_loss": -27.18088722229004, "global_step": 621021, "epoch": 7482} {"train_loss": -27.77127456665039, "global_step": 621022, "epoch": 7482} {"train_loss": -27.9669132232666, "global_step": 621023, "epoch": 7482} {"train_loss": -27.70106315612793, "global_step": 621024, "epoch": 7482} {"train_loss": -28.087982177734375, "global_step": 621025, "epoch": 7482} {"train_loss": -27.591394424438477, "global_step": 621026, "epoch": 7482} {"train_loss": -28.086801528930664, "global_step": 621027, "epoch": 7482} {"train_loss": -27.936391830444336, "global_step": 621028, "epoch": 7482} {"train_loss": -27.89435386657715, "global_step": 621029, "epoch": 7482} {"train_loss": -28.441455841064453, "global_step": 621030, "epoch": 7482} {"train_loss": -27.95501136779785, "global_step": 621031, "epoch": 7482} {"train_loss": -28.026464462280273, "global_step": 621032, "epoch": 7482} {"train_loss": -27.90668296813965, "global_step": 621033, "epoch": 7482} {"train_loss": -28.116479873657227, "global_step": 621034, "epoch": 7482} {"train_loss": -28.1510009765625, "global_step": 621035, "epoch": 7482} {"train_loss": -28.139699935913086, "global_step": 621036, "epoch": 7482} {"train_loss": -28.174362182617188, "global_step": 621037, "epoch": 7482} {"train_loss": -27.946247100830078, "global_step": 621038, "epoch": 7482} {"train_loss": -28.152456283569336, "global_step": 621039, "epoch": 7482} {"train_loss": -28.37520408630371, "global_step": 621040, "epoch": 7482} {"train_loss": -28.574222564697266, "global_step": 621041, "epoch": 7482} {"train_loss": -28.186176300048828, "global_step": 621042, "epoch": 7482} {"train_loss": -28.116064071655273, "global_step": 621043, "epoch": 7482} {"train_loss": -28.01987648010254, "global_step": 621044, "epoch": 7482} {"train_loss": -28.470935821533203, "global_step": 621045, "epoch": 7482} {"train_loss": -28.3682918548584, "global_step": 621046, "epoch": 7482} {"train_loss": -28.20882225036621, "global_step": 621047, "epoch": 7482} {"train_loss": -28.150190353393555, "global_step": 621048, "epoch": 7482} {"train_loss": -28.264108657836914, "global_step": 621049, "epoch": 7482} {"train_loss": -28.30048942565918, "global_step": 621050, "epoch": 7482} {"train_loss": -28.350629806518555, "global_step": 621051, "epoch": 7482} {"train_loss": -28.152652740478516, "global_step": 621052, "epoch": 7482} {"train_loss": -28.33477783203125, "global_step": 621053, "epoch": 7482} {"train_loss": -28.282058715820312, "global_step": 621054, "epoch": 7482} {"train_loss": -28.310720443725586, "global_step": 621055, "epoch": 7482} {"train_loss": -28.47250747680664, "global_step": 621056, "epoch": 7482} {"train_loss": -28.15096092224121, "global_step": 621057, "epoch": 7482} {"train_loss": -28.64686393737793, "global_step": 621058, "epoch": 7482} {"train_loss": -28.536718368530273, "global_step": 621059, "epoch": 7482} {"train_loss": -28.2360897064209, "global_step": 621060, "epoch": 7482} {"train_loss": -28.184019088745117, "global_step": 621061, "epoch": 7482} {"train_loss": -28.38850975036621, "global_step": 621062, "epoch": 7482} {"train_loss": -28.46500587463379, "global_step": 621063, "epoch": 7482} {"train_loss": -28.46453285217285, "global_step": 621064, "epoch": 7482} {"train_loss": -28.48601722717285, "global_step": 621065, "epoch": 7482} {"train_loss": -28.447717666625977, "global_step": 621066, "epoch": 7482} {"train_loss": -28.23358154296875, "global_step": 621067, "epoch": 7482} {"train_loss": -28.473148345947266, "global_step": 621068, "epoch": 7482} {"train_loss": -27.969648361206055, "global_step": 621069, "epoch": 7482} {"train_loss": -27.92416763305664, "global_step": 621070, "epoch": 7482} {"train_loss": -27.480615615844727, "global_step": 621071, "epoch": 7482} {"train_loss": -27.000192642211914, "global_step": 621072, "epoch": 7482} {"train_loss": -26.82476234436035, "global_step": 621073, "epoch": 7482} {"train_loss": -27.158130645751953, "global_step": 621074, "epoch": 7482} {"train_loss": -27.7580509185791, "global_step": 621075, "epoch": 7482} {"train_loss": -27.969247817993164, "global_step": 621076, "epoch": 7482} {"train_loss": -27.70355796813965, "global_step": 621077, "epoch": 7482} {"train_loss": -27.686132431030273, "global_step": 621078, "epoch": 7482} {"train_loss": -28.63087272644043, "global_step": 621079, "epoch": 7482} {"train_loss": -28.082242965698242, "global_step": 621080, "epoch": 7482} {"train_loss": -28.415542602539062, "global_step": 621081, "epoch": 7482} {"train_loss": -28.022260665893555, "global_step": 621082, "epoch": 7482} {"train_loss": -28.093427658081055, "global_step": 621083, "epoch": 7482} {"train_loss": -27.95930290222168, "global_step": 621084, "epoch": 7482} {"train_loss": -28.260578155517578, "global_step": 621085, "epoch": 7482} {"train_loss": -28.009180068969727, "global_step": 621086, "epoch": 7482} {"train_loss": -28.115076065063477, "global_step": 621087, "epoch": 7482} {"train_loss": -28.013837377709077, "global_step": 621088, "epoch": 7482, "val_loss": 6634980.0} {"train_loss": -26.584869384765625, "global_step": 621089, "epoch": 7483} {"train_loss": -26.87858009338379, "global_step": 621090, "epoch": 7483} {"train_loss": -27.811986923217773, "global_step": 621091, "epoch": 7483} {"train_loss": -27.1072940826416, "global_step": 621092, "epoch": 7483} {"train_loss": -27.6135311126709, "global_step": 621093, "epoch": 7483} {"train_loss": -27.072052001953125, "global_step": 621094, "epoch": 7483} {"train_loss": -26.89458656311035, "global_step": 621095, "epoch": 7483} {"train_loss": -27.739160537719727, "global_step": 621096, "epoch": 7483} {"train_loss": -27.150476455688477, "global_step": 621097, "epoch": 7483} {"train_loss": -27.399072647094727, "global_step": 621098, "epoch": 7483} {"train_loss": -27.428375244140625, "global_step": 621099, "epoch": 7483} {"train_loss": -27.607040405273438, "global_step": 621100, "epoch": 7483} {"train_loss": -27.56591796875, "global_step": 621101, "epoch": 7483} {"train_loss": -27.503442764282227, "global_step": 621102, "epoch": 7483} {"train_loss": -28.047229766845703, "global_step": 621103, "epoch": 7483} {"train_loss": -27.773157119750977, "global_step": 621104, "epoch": 7483} {"train_loss": -27.8065242767334, "global_step": 621105, "epoch": 7483} {"train_loss": -27.576501846313477, "global_step": 621106, "epoch": 7483} {"train_loss": -27.92730712890625, "global_step": 621107, "epoch": 7483} {"train_loss": -28.273038864135742, "global_step": 621108, "epoch": 7483} {"train_loss": -28.1517333984375, "global_step": 621109, "epoch": 7483} {"train_loss": -27.720495223999023, "global_step": 621110, "epoch": 7483} {"train_loss": -28.059049606323242, "global_step": 621111, "epoch": 7483} {"train_loss": -28.169879913330078, "global_step": 621112, "epoch": 7483} {"train_loss": -28.084989547729492, "global_step": 621113, "epoch": 7483} {"train_loss": -27.842145919799805, "global_step": 621114, "epoch": 7483} {"train_loss": -28.324106216430664, "global_step": 621115, "epoch": 7483} {"train_loss": -27.720441818237305, "global_step": 621116, "epoch": 7483} {"train_loss": -27.925765991210938, "global_step": 621117, "epoch": 7483} {"train_loss": -27.933385848999023, "global_step": 621118, "epoch": 7483} {"train_loss": -28.43757438659668, "global_step": 621119, "epoch": 7483} {"train_loss": -28.280853271484375, "global_step": 621120, "epoch": 7483} {"train_loss": -27.920621871948242, "global_step": 621121, "epoch": 7483} {"train_loss": -27.96124839782715, "global_step": 621122, "epoch": 7483} {"train_loss": -28.13374137878418, "global_step": 621123, "epoch": 7483} {"train_loss": -28.2075138092041, "global_step": 621124, "epoch": 7483} {"train_loss": -28.071218490600586, "global_step": 621125, "epoch": 7483} {"train_loss": -28.00042724609375, "global_step": 621126, "epoch": 7483} {"train_loss": -28.1407413482666, "global_step": 621127, "epoch": 7483} {"train_loss": -28.44510269165039, "global_step": 621128, "epoch": 7483} {"train_loss": -28.319355010986328, "global_step": 621129, "epoch": 7483} {"train_loss": -28.503149032592773, "global_step": 621130, "epoch": 7483} {"train_loss": -28.461271286010742, "global_step": 621131, "epoch": 7483} {"train_loss": -28.627195358276367, "global_step": 621132, "epoch": 7483} {"train_loss": -28.517736434936523, "global_step": 621133, "epoch": 7483} {"train_loss": -28.049585342407227, "global_step": 621134, "epoch": 7483} {"train_loss": -27.999616622924805, "global_step": 621135, "epoch": 7483} {"train_loss": -28.079059600830078, "global_step": 621136, "epoch": 7483} {"train_loss": -28.485742568969727, "global_step": 621137, "epoch": 7483} {"train_loss": -28.118030548095703, "global_step": 621138, "epoch": 7483} {"train_loss": -28.382062911987305, "global_step": 621139, "epoch": 7483} {"train_loss": -28.46420669555664, "global_step": 621140, "epoch": 7483} {"train_loss": -27.997533798217773, "global_step": 621141, "epoch": 7483} {"train_loss": -28.423810958862305, "global_step": 621142, "epoch": 7483} {"train_loss": -28.39002799987793, "global_step": 621143, "epoch": 7483} {"train_loss": -28.388635635375977, "global_step": 621144, "epoch": 7483} {"train_loss": -28.37934684753418, "global_step": 621145, "epoch": 7483} {"train_loss": -28.44525146484375, "global_step": 621146, "epoch": 7483} {"train_loss": -27.5767765045166, "global_step": 621147, "epoch": 7483} {"train_loss": -28.114110946655273, "global_step": 621148, "epoch": 7483} {"train_loss": -28.107690811157227, "global_step": 621149, "epoch": 7483} {"train_loss": -28.3668155670166, "global_step": 621150, "epoch": 7483} {"train_loss": -28.51974868774414, "global_step": 621151, "epoch": 7483} {"train_loss": -28.273839950561523, "global_step": 621152, "epoch": 7483} {"train_loss": -28.48953628540039, "global_step": 621153, "epoch": 7483} {"train_loss": -28.106842041015625, "global_step": 621154, "epoch": 7483} {"train_loss": -28.13050651550293, "global_step": 621155, "epoch": 7483} {"train_loss": -27.8299503326416, "global_step": 621156, "epoch": 7483} {"train_loss": -27.38838005065918, "global_step": 621157, "epoch": 7483} {"train_loss": -26.552692413330078, "global_step": 621158, "epoch": 7483} {"train_loss": -27.06854820251465, "global_step": 621159, "epoch": 7483} {"train_loss": -28.16278648376465, "global_step": 621160, "epoch": 7483} {"train_loss": -27.9520206451416, "global_step": 621161, "epoch": 7483} {"train_loss": -27.759906768798828, "global_step": 621162, "epoch": 7483} {"train_loss": -27.30316734313965, "global_step": 621163, "epoch": 7483} {"train_loss": -28.173324584960938, "global_step": 621164, "epoch": 7483} {"train_loss": -27.950857162475586, "global_step": 621165, "epoch": 7483} {"train_loss": -27.63680076599121, "global_step": 621166, "epoch": 7483} {"train_loss": -27.7474308013916, "global_step": 621167, "epoch": 7483} {"train_loss": -27.847888946533203, "global_step": 621168, "epoch": 7483} {"train_loss": -27.968854904174805, "global_step": 621169, "epoch": 7483} {"train_loss": -27.755084991455078, "global_step": 621170, "epoch": 7483} {"train_loss": -27.926571650677417, "global_step": 621171, "epoch": 7483, "val_loss": 6615311.0} {"train_loss": -28.134326934814453, "global_step": 621172, "epoch": 7484} {"train_loss": -27.444995880126953, "global_step": 621173, "epoch": 7484} {"train_loss": -27.77362060546875, "global_step": 621174, "epoch": 7484} {"train_loss": -27.777372360229492, "global_step": 621175, "epoch": 7484} {"train_loss": -27.897113800048828, "global_step": 621176, "epoch": 7484} {"train_loss": -27.77869987487793, "global_step": 621177, "epoch": 7484} {"train_loss": -28.066116333007812, "global_step": 621178, "epoch": 7484} {"train_loss": -27.959638595581055, "global_step": 621179, "epoch": 7484} {"train_loss": -27.680295944213867, "global_step": 621180, "epoch": 7484} {"train_loss": -27.763687133789062, "global_step": 621181, "epoch": 7484} {"train_loss": -27.40460777282715, "global_step": 621182, "epoch": 7484} {"train_loss": -27.605871200561523, "global_step": 621183, "epoch": 7484} {"train_loss": -27.793664932250977, "global_step": 621184, "epoch": 7484} {"train_loss": -27.641651153564453, "global_step": 621185, "epoch": 7484} {"train_loss": -27.94110107421875, "global_step": 621186, "epoch": 7484} {"train_loss": -27.903461456298828, "global_step": 621187, "epoch": 7484} {"train_loss": -28.11079216003418, "global_step": 621188, "epoch": 7484} {"train_loss": -28.109846115112305, "global_step": 621189, "epoch": 7484} {"train_loss": -28.087940216064453, "global_step": 621190, "epoch": 7484} {"train_loss": -27.686487197875977, "global_step": 621191, "epoch": 7484} {"train_loss": -28.1976261138916, "global_step": 621192, "epoch": 7484} {"train_loss": -28.050262451171875, "global_step": 621193, "epoch": 7484} {"train_loss": -28.182580947875977, "global_step": 621194, "epoch": 7484} {"train_loss": -28.115222930908203, "global_step": 621195, "epoch": 7484} {"train_loss": -28.34433937072754, "global_step": 621196, "epoch": 7484} {"train_loss": -28.34808921813965, "global_step": 621197, "epoch": 7484} {"train_loss": -28.240243911743164, "global_step": 621198, "epoch": 7484} {"train_loss": -28.311498641967773, "global_step": 621199, "epoch": 7484} {"train_loss": -28.003082275390625, "global_step": 621200, "epoch": 7484} {"train_loss": -28.535419464111328, "global_step": 621201, "epoch": 7484} {"train_loss": -28.352680206298828, "global_step": 621202, "epoch": 7484} {"train_loss": -27.99859619140625, "global_step": 621203, "epoch": 7484} {"train_loss": -28.079553604125977, "global_step": 621204, "epoch": 7484} {"train_loss": -28.781463623046875, "global_step": 621205, "epoch": 7484} {"train_loss": -28.446441650390625, "global_step": 621206, "epoch": 7484} {"train_loss": -28.49330711364746, "global_step": 621207, "epoch": 7484} {"train_loss": -28.02143669128418, "global_step": 621208, "epoch": 7484} {"train_loss": -28.191455841064453, "global_step": 621209, "epoch": 7484} {"train_loss": -28.486494064331055, "global_step": 621210, "epoch": 7484} {"train_loss": -28.498838424682617, "global_step": 621211, "epoch": 7484} {"train_loss": -28.267578125, "global_step": 621212, "epoch": 7484} {"train_loss": -28.419092178344727, "global_step": 621213, "epoch": 7484} {"train_loss": -28.311664581298828, "global_step": 621214, "epoch": 7484} {"train_loss": -28.6054630279541, "global_step": 621215, "epoch": 7484} {"train_loss": -28.428625106811523, "global_step": 621216, "epoch": 7484} {"train_loss": -28.574615478515625, "global_step": 621217, "epoch": 7484} {"train_loss": -28.411365509033203, "global_step": 621218, "epoch": 7484} {"train_loss": -28.464929580688477, "global_step": 621219, "epoch": 7484} {"train_loss": -28.890674591064453, "global_step": 621220, "epoch": 7484} {"train_loss": -28.694738388061523, "global_step": 621221, "epoch": 7484} {"train_loss": -28.270727157592773, "global_step": 621222, "epoch": 7484} {"train_loss": -28.35666847229004, "global_step": 621223, "epoch": 7484} {"train_loss": -27.915769577026367, "global_step": 621224, "epoch": 7484} {"train_loss": -28.559537887573242, "global_step": 621225, "epoch": 7484} {"train_loss": -28.1715145111084, "global_step": 621226, "epoch": 7484} {"train_loss": -28.36517333984375, "global_step": 621227, "epoch": 7484} {"train_loss": -28.318647384643555, "global_step": 621228, "epoch": 7484} {"train_loss": -28.254779815673828, "global_step": 621229, "epoch": 7484} {"train_loss": -28.2388916015625, "global_step": 621230, "epoch": 7484} {"train_loss": -28.3455867767334, "global_step": 621231, "epoch": 7484} {"train_loss": -27.90150260925293, "global_step": 621232, "epoch": 7484} {"train_loss": -27.73053550720215, "global_step": 621233, "epoch": 7484} {"train_loss": -27.628360748291016, "global_step": 621234, "epoch": 7484} {"train_loss": -27.86536979675293, "global_step": 621235, "epoch": 7484} {"train_loss": -28.08111572265625, "global_step": 621236, "epoch": 7484} {"train_loss": -28.038440704345703, "global_step": 621237, "epoch": 7484} {"train_loss": -27.85992431640625, "global_step": 621238, "epoch": 7484} {"train_loss": -27.939611434936523, "global_step": 621239, "epoch": 7484} {"train_loss": -27.767993927001953, "global_step": 621240, "epoch": 7484} {"train_loss": -28.219640731811523, "global_step": 621241, "epoch": 7484} {"train_loss": -27.957874298095703, "global_step": 621242, "epoch": 7484} {"train_loss": -28.34174156188965, "global_step": 621243, "epoch": 7484} {"train_loss": -27.885889053344727, "global_step": 621244, "epoch": 7484} {"train_loss": -28.34357261657715, "global_step": 621245, "epoch": 7484} {"train_loss": -27.96577262878418, "global_step": 621246, "epoch": 7484} {"train_loss": -28.087360382080078, "global_step": 621247, "epoch": 7484} {"train_loss": -28.559370040893555, "global_step": 621248, "epoch": 7484} {"train_loss": -28.1767578125, "global_step": 621249, "epoch": 7484} {"train_loss": -28.336917877197266, "global_step": 621250, "epoch": 7484} {"train_loss": -28.174375534057617, "global_step": 621251, "epoch": 7484} {"train_loss": -28.456512451171875, "global_step": 621252, "epoch": 7484} {"train_loss": -28.31110191345215, "global_step": 621253, "epoch": 7484} {"train_loss": -28.146937037088787, "global_step": 621254, "epoch": 7484, "val_loss": 6604779.0} {"train_loss": -26.157352447509766, "global_step": 621255, "epoch": 7485} {"train_loss": -26.7415714263916, "global_step": 621256, "epoch": 7485} {"train_loss": -27.763113021850586, "global_step": 621257, "epoch": 7485} {"train_loss": -26.267780303955078, "global_step": 621258, "epoch": 7485} {"train_loss": -27.420135498046875, "global_step": 621259, "epoch": 7485} {"train_loss": -27.231428146362305, "global_step": 621260, "epoch": 7485} {"train_loss": -27.20292091369629, "global_step": 621261, "epoch": 7485} {"train_loss": -27.319875717163086, "global_step": 621262, "epoch": 7485} {"train_loss": -27.30622673034668, "global_step": 621263, "epoch": 7485} {"train_loss": -27.3692626953125, "global_step": 621264, "epoch": 7485} {"train_loss": -27.648944854736328, "global_step": 621265, "epoch": 7485} {"train_loss": -27.488142013549805, "global_step": 621266, "epoch": 7485} {"train_loss": -27.37473487854004, "global_step": 621267, "epoch": 7485} {"train_loss": -27.276580810546875, "global_step": 621268, "epoch": 7485} {"train_loss": -27.63665199279785, "global_step": 621269, "epoch": 7485} {"train_loss": -27.855609893798828, "global_step": 621270, "epoch": 7485} {"train_loss": -26.89154052734375, "global_step": 621271, "epoch": 7485} {"train_loss": -27.94268226623535, "global_step": 621272, "epoch": 7485} {"train_loss": -27.7165584564209, "global_step": 621273, "epoch": 7485} {"train_loss": -27.39423942565918, "global_step": 621274, "epoch": 7485} {"train_loss": -28.005859375, "global_step": 621275, "epoch": 7485} {"train_loss": -27.93317985534668, "global_step": 621276, "epoch": 7485} {"train_loss": -27.6739559173584, "global_step": 621277, "epoch": 7485} {"train_loss": -27.864856719970703, "global_step": 621278, "epoch": 7485} {"train_loss": -27.88895606994629, "global_step": 621279, "epoch": 7485} {"train_loss": -27.726301193237305, "global_step": 621280, "epoch": 7485} {"train_loss": -27.886335372924805, "global_step": 621281, "epoch": 7485} {"train_loss": -27.55103874206543, "global_step": 621282, "epoch": 7485} {"train_loss": -27.885297775268555, "global_step": 621283, "epoch": 7485} {"train_loss": -27.777851104736328, "global_step": 621284, "epoch": 7485} {"train_loss": -27.891891479492188, "global_step": 621285, "epoch": 7485} {"train_loss": -28.121234893798828, "global_step": 621286, "epoch": 7485} {"train_loss": -27.998693466186523, "global_step": 621287, "epoch": 7485} {"train_loss": -27.900060653686523, "global_step": 621288, "epoch": 7485} {"train_loss": -28.3980655670166, "global_step": 621289, "epoch": 7485} {"train_loss": -27.903650283813477, "global_step": 621290, "epoch": 7485} {"train_loss": -28.159961700439453, "global_step": 621291, "epoch": 7485} {"train_loss": -27.849685668945312, "global_step": 621292, "epoch": 7485} {"train_loss": -28.017744064331055, "global_step": 621293, "epoch": 7485} {"train_loss": -28.17083740234375, "global_step": 621294, "epoch": 7485} {"train_loss": -28.31088638305664, "global_step": 621295, "epoch": 7485} {"train_loss": -28.1651611328125, "global_step": 621296, "epoch": 7485} {"train_loss": -28.347864151000977, "global_step": 621297, "epoch": 7485} {"train_loss": -28.1074161529541, "global_step": 621298, "epoch": 7485} {"train_loss": -28.176061630249023, "global_step": 621299, "epoch": 7485} {"train_loss": -28.289880752563477, "global_step": 621300, "epoch": 7485} {"train_loss": -28.334081649780273, "global_step": 621301, "epoch": 7485} {"train_loss": -28.311140060424805, "global_step": 621302, "epoch": 7485} {"train_loss": -27.812963485717773, "global_step": 621303, "epoch": 7485} {"train_loss": -27.292530059814453, "global_step": 621304, "epoch": 7485} {"train_loss": -27.7519474029541, "global_step": 621305, "epoch": 7485} {"train_loss": -28.49848747253418, "global_step": 621306, "epoch": 7485} {"train_loss": -27.927734375, "global_step": 621307, "epoch": 7485} {"train_loss": -27.60525894165039, "global_step": 621308, "epoch": 7485} {"train_loss": -28.195560455322266, "global_step": 621309, "epoch": 7485} {"train_loss": -27.783300399780273, "global_step": 621310, "epoch": 7485} {"train_loss": -28.008258819580078, "global_step": 621311, "epoch": 7485} {"train_loss": -27.98727798461914, "global_step": 621312, "epoch": 7485} {"train_loss": -28.308826446533203, "global_step": 621313, "epoch": 7485} {"train_loss": -28.13824462890625, "global_step": 621314, "epoch": 7485} {"train_loss": -28.136646270751953, "global_step": 621315, "epoch": 7485} {"train_loss": -28.310962677001953, "global_step": 621316, "epoch": 7485} {"train_loss": -27.75860023498535, "global_step": 621317, "epoch": 7485} {"train_loss": -28.312915802001953, "global_step": 621318, "epoch": 7485} {"train_loss": -28.0904541015625, "global_step": 621319, "epoch": 7485} {"train_loss": -28.501737594604492, "global_step": 621320, "epoch": 7485} {"train_loss": -28.1901798248291, "global_step": 621321, "epoch": 7485} {"train_loss": -28.2988224029541, "global_step": 621322, "epoch": 7485} {"train_loss": -28.490253448486328, "global_step": 621323, "epoch": 7485} {"train_loss": -27.948606491088867, "global_step": 621324, "epoch": 7485} {"train_loss": -28.083179473876953, "global_step": 621325, "epoch": 7485} {"train_loss": -28.5571231842041, "global_step": 621326, "epoch": 7485} {"train_loss": -28.231725692749023, "global_step": 621327, "epoch": 7485} {"train_loss": -28.454336166381836, "global_step": 621328, "epoch": 7485} {"train_loss": -28.484731674194336, "global_step": 621329, "epoch": 7485} {"train_loss": -27.878982543945312, "global_step": 621330, "epoch": 7485} {"train_loss": -28.569122314453125, "global_step": 621331, "epoch": 7485} {"train_loss": -28.311330795288086, "global_step": 621332, "epoch": 7485} {"train_loss": -27.752363204956055, "global_step": 621333, "epoch": 7485} {"train_loss": -28.184125900268555, "global_step": 621334, "epoch": 7485} {"train_loss": -27.964014053344727, "global_step": 621335, "epoch": 7485} {"train_loss": -28.353479385375977, "global_step": 621336, "epoch": 7485} {"train_loss": -27.9097688284265, "global_step": 621337, "epoch": 7485, "val_loss": 6589657.0} {"train_loss": -25.865446090698242, "global_step": 621338, "epoch": 7486} {"train_loss": -26.302595138549805, "global_step": 621339, "epoch": 7486} {"train_loss": -26.977025985717773, "global_step": 621340, "epoch": 7486} {"train_loss": -26.882871627807617, "global_step": 621341, "epoch": 7486} {"train_loss": -26.881805419921875, "global_step": 621342, "epoch": 7486} {"train_loss": -27.16839027404785, "global_step": 621343, "epoch": 7486} {"train_loss": -26.944929122924805, "global_step": 621344, "epoch": 7486} {"train_loss": -27.117782592773438, "global_step": 621345, "epoch": 7486} {"train_loss": -26.605504989624023, "global_step": 621346, "epoch": 7486} {"train_loss": -27.372638702392578, "global_step": 621347, "epoch": 7486} {"train_loss": -27.41926383972168, "global_step": 621348, "epoch": 7486} {"train_loss": -27.7587947845459, "global_step": 621349, "epoch": 7486} {"train_loss": -27.05203628540039, "global_step": 621350, "epoch": 7486} {"train_loss": -27.56305503845215, "global_step": 621351, "epoch": 7486} {"train_loss": -27.208698272705078, "global_step": 621352, "epoch": 7486} {"train_loss": -27.345617294311523, "global_step": 621353, "epoch": 7486} {"train_loss": -27.629064559936523, "global_step": 621354, "epoch": 7486} {"train_loss": -27.391061782836914, "global_step": 621355, "epoch": 7486} {"train_loss": -27.449310302734375, "global_step": 621356, "epoch": 7486} {"train_loss": -27.751867294311523, "global_step": 621357, "epoch": 7486} {"train_loss": -27.5842342376709, "global_step": 621358, "epoch": 7486} {"train_loss": -27.617923736572266, "global_step": 621359, "epoch": 7486} {"train_loss": -27.797719955444336, "global_step": 621360, "epoch": 7486} {"train_loss": -27.445234298706055, "global_step": 621361, "epoch": 7486} {"train_loss": -27.674413681030273, "global_step": 621362, "epoch": 7486} {"train_loss": -27.926626205444336, "global_step": 621363, "epoch": 7486} {"train_loss": -27.5247859954834, "global_step": 621364, "epoch": 7486} {"train_loss": -27.90516471862793, "global_step": 621365, "epoch": 7486} {"train_loss": -27.64558219909668, "global_step": 621366, "epoch": 7486} {"train_loss": -28.140827178955078, "global_step": 621367, "epoch": 7486} {"train_loss": -27.91914939880371, "global_step": 621368, "epoch": 7486} {"train_loss": -28.04621696472168, "global_step": 621369, "epoch": 7486} {"train_loss": -27.763906478881836, "global_step": 621370, "epoch": 7486} {"train_loss": -28.01519775390625, "global_step": 621371, "epoch": 7486} {"train_loss": -28.023832321166992, "global_step": 621372, "epoch": 7486} {"train_loss": -28.049850463867188, "global_step": 621373, "epoch": 7486} {"train_loss": -28.117650985717773, "global_step": 621374, "epoch": 7486} {"train_loss": -27.74898338317871, "global_step": 621375, "epoch": 7486} {"train_loss": -27.970666885375977, "global_step": 621376, "epoch": 7486} {"train_loss": -28.27569007873535, "global_step": 621377, "epoch": 7486} {"train_loss": -28.092761993408203, "global_step": 621378, "epoch": 7486} {"train_loss": -27.817346572875977, "global_step": 621379, "epoch": 7486} {"train_loss": -28.085845947265625, "global_step": 621380, "epoch": 7486} {"train_loss": -28.23554801940918, "global_step": 621381, "epoch": 7486} {"train_loss": -28.233301162719727, "global_step": 621382, "epoch": 7486} {"train_loss": -27.931976318359375, "global_step": 621383, "epoch": 7486} {"train_loss": -28.185016632080078, "global_step": 621384, "epoch": 7486} {"train_loss": -28.1160831451416, "global_step": 621385, "epoch": 7486} {"train_loss": -28.29921531677246, "global_step": 621386, "epoch": 7486} {"train_loss": -28.329015731811523, "global_step": 621387, "epoch": 7486} {"train_loss": -28.429443359375, "global_step": 621388, "epoch": 7486} {"train_loss": -28.257078170776367, "global_step": 621389, "epoch": 7486} {"train_loss": -28.37310218811035, "global_step": 621390, "epoch": 7486} {"train_loss": -28.16741371154785, "global_step": 621391, "epoch": 7486} {"train_loss": -28.349836349487305, "global_step": 621392, "epoch": 7486} {"train_loss": -28.23915672302246, "global_step": 621393, "epoch": 7486} {"train_loss": -28.378528594970703, "global_step": 621394, "epoch": 7486} {"train_loss": -28.430709838867188, "global_step": 621395, "epoch": 7486} {"train_loss": -28.368988037109375, "global_step": 621396, "epoch": 7486} {"train_loss": -28.11152458190918, "global_step": 621397, "epoch": 7486} {"train_loss": -28.270978927612305, "global_step": 621398, "epoch": 7486} {"train_loss": -28.410388946533203, "global_step": 621399, "epoch": 7486} {"train_loss": -28.452375411987305, "global_step": 621400, "epoch": 7486} {"train_loss": -28.595077514648438, "global_step": 621401, "epoch": 7486} {"train_loss": -28.23142433166504, "global_step": 621402, "epoch": 7486} {"train_loss": -28.224445343017578, "global_step": 621403, "epoch": 7486} {"train_loss": -27.883337020874023, "global_step": 621404, "epoch": 7486} {"train_loss": -28.070295333862305, "global_step": 621405, "epoch": 7486} {"train_loss": -27.921390533447266, "global_step": 621406, "epoch": 7486} {"train_loss": -27.74930191040039, "global_step": 621407, "epoch": 7486} {"train_loss": -28.365942001342773, "global_step": 621408, "epoch": 7486} {"train_loss": -28.405582427978516, "global_step": 621409, "epoch": 7486} {"train_loss": -28.543323516845703, "global_step": 621410, "epoch": 7486} {"train_loss": -28.339086532592773, "global_step": 621411, "epoch": 7486} {"train_loss": -28.412982940673828, "global_step": 621412, "epoch": 7486} {"train_loss": -28.26783561706543, "global_step": 621413, "epoch": 7486} {"train_loss": -28.290084838867188, "global_step": 621414, "epoch": 7486} {"train_loss": -27.99722671508789, "global_step": 621415, "epoch": 7486} {"train_loss": -27.84869384765625, "global_step": 621416, "epoch": 7486} {"train_loss": -28.611846923828125, "global_step": 621417, "epoch": 7486} {"train_loss": -28.240283966064453, "global_step": 621418, "epoch": 7486} {"train_loss": -28.11395835876465, "global_step": 621419, "epoch": 7486} {"train_loss": -27.859314677226973, "global_step": 621420, "epoch": 7486, "val_loss": 6639169.5} {"train_loss": -27.76740837097168, "global_step": 621421, "epoch": 7487} {"train_loss": -27.477888107299805, "global_step": 621422, "epoch": 7487} {"train_loss": -27.534732818603516, "global_step": 621423, "epoch": 7487} {"train_loss": -27.58991813659668, "global_step": 621424, "epoch": 7487} {"train_loss": -26.486242294311523, "global_step": 621425, "epoch": 7487} {"train_loss": -27.22711181640625, "global_step": 621426, "epoch": 7487} {"train_loss": -27.096960067749023, "global_step": 621427, "epoch": 7487} {"train_loss": -26.040491104125977, "global_step": 621428, "epoch": 7487} {"train_loss": -27.32172203063965, "global_step": 621429, "epoch": 7487} {"train_loss": -26.58319091796875, "global_step": 621430, "epoch": 7487} {"train_loss": -27.45648193359375, "global_step": 621431, "epoch": 7487} {"train_loss": -26.361547470092773, "global_step": 621432, "epoch": 7487} {"train_loss": -27.368228912353516, "global_step": 621433, "epoch": 7487} {"train_loss": -26.946985244750977, "global_step": 621434, "epoch": 7487} {"train_loss": -27.739826202392578, "global_step": 621435, "epoch": 7487} {"train_loss": -27.3355770111084, "global_step": 621436, "epoch": 7487} {"train_loss": -27.48407554626465, "global_step": 621437, "epoch": 7487} {"train_loss": -27.81707191467285, "global_step": 621438, "epoch": 7487} {"train_loss": -27.358007431030273, "global_step": 621439, "epoch": 7487} {"train_loss": -27.58046531677246, "global_step": 621440, "epoch": 7487} {"train_loss": -27.88751220703125, "global_step": 621441, "epoch": 7487} {"train_loss": -27.21233558654785, "global_step": 621442, "epoch": 7487} {"train_loss": -27.976282119750977, "global_step": 621443, "epoch": 7487} {"train_loss": -27.49439811706543, "global_step": 621444, "epoch": 7487} {"train_loss": -27.746835708618164, "global_step": 621445, "epoch": 7487} {"train_loss": -27.333097457885742, "global_step": 621446, "epoch": 7487} {"train_loss": -27.9010066986084, "global_step": 621447, "epoch": 7487} {"train_loss": -28.20185661315918, "global_step": 621448, "epoch": 7487} {"train_loss": -28.142553329467773, "global_step": 621449, "epoch": 7487} {"train_loss": -27.78571891784668, "global_step": 621450, "epoch": 7487} {"train_loss": -27.854541778564453, "global_step": 621451, "epoch": 7487} {"train_loss": -28.023645401000977, "global_step": 621452, "epoch": 7487} {"train_loss": -27.566808700561523, "global_step": 621453, "epoch": 7487} {"train_loss": -28.2399845123291, "global_step": 621454, "epoch": 7487} {"train_loss": -27.815561294555664, "global_step": 621455, "epoch": 7487} {"train_loss": -28.0028076171875, "global_step": 621456, "epoch": 7487} {"train_loss": -27.8200740814209, "global_step": 621457, "epoch": 7487} {"train_loss": -27.9011173248291, "global_step": 621458, "epoch": 7487} {"train_loss": -27.82783317565918, "global_step": 621459, "epoch": 7487} {"train_loss": -28.081892013549805, "global_step": 621460, "epoch": 7487} {"train_loss": -28.882360458374023, "global_step": 621461, "epoch": 7487} {"train_loss": -28.29547691345215, "global_step": 621462, "epoch": 7487} {"train_loss": -28.189594268798828, "global_step": 621463, "epoch": 7487} {"train_loss": -28.435468673706055, "global_step": 621464, "epoch": 7487} {"train_loss": -27.999252319335938, "global_step": 621465, "epoch": 7487} {"train_loss": -28.347436904907227, "global_step": 621466, "epoch": 7487} {"train_loss": -28.385730743408203, "global_step": 621467, "epoch": 7487} {"train_loss": -28.48953628540039, "global_step": 621468, "epoch": 7487} {"train_loss": -28.185815811157227, "global_step": 621469, "epoch": 7487} {"train_loss": -28.325855255126953, "global_step": 621470, "epoch": 7487} {"train_loss": -28.313907623291016, "global_step": 621471, "epoch": 7487} {"train_loss": -27.99445915222168, "global_step": 621472, "epoch": 7487} {"train_loss": -28.336877822875977, "global_step": 621473, "epoch": 7487} {"train_loss": -28.500165939331055, "global_step": 621474, "epoch": 7487} {"train_loss": -28.437885284423828, "global_step": 621475, "epoch": 7487} {"train_loss": -28.573453903198242, "global_step": 621476, "epoch": 7487} {"train_loss": -28.738605499267578, "global_step": 621477, "epoch": 7487} {"train_loss": -28.688770294189453, "global_step": 621478, "epoch": 7487} {"train_loss": -28.343481063842773, "global_step": 621479, "epoch": 7487} {"train_loss": -28.35922622680664, "global_step": 621480, "epoch": 7487} {"train_loss": -28.40909194946289, "global_step": 621481, "epoch": 7487} {"train_loss": -28.26980972290039, "global_step": 621482, "epoch": 7487} {"train_loss": -28.440393447875977, "global_step": 621483, "epoch": 7487} {"train_loss": -27.934595108032227, "global_step": 621484, "epoch": 7487} {"train_loss": -28.261428833007812, "global_step": 621485, "epoch": 7487} {"train_loss": -27.999231338500977, "global_step": 621486, "epoch": 7487} {"train_loss": -28.4069766998291, "global_step": 621487, "epoch": 7487} {"train_loss": -28.3345947265625, "global_step": 621488, "epoch": 7487} {"train_loss": -28.11524772644043, "global_step": 621489, "epoch": 7487} {"train_loss": -27.696149826049805, "global_step": 621490, "epoch": 7487} {"train_loss": -28.195348739624023, "global_step": 621491, "epoch": 7487} {"train_loss": -28.257810592651367, "global_step": 621492, "epoch": 7487} {"train_loss": -28.12772560119629, "global_step": 621493, "epoch": 7487} {"train_loss": -28.235742568969727, "global_step": 621494, "epoch": 7487} {"train_loss": -28.128467559814453, "global_step": 621495, "epoch": 7487} {"train_loss": -27.775421142578125, "global_step": 621496, "epoch": 7487} {"train_loss": -27.87296485900879, "global_step": 621497, "epoch": 7487} {"train_loss": -28.334802627563477, "global_step": 621498, "epoch": 7487} {"train_loss": -28.065099716186523, "global_step": 621499, "epoch": 7487} {"train_loss": -27.958219528198242, "global_step": 621500, "epoch": 7487} {"train_loss": -28.232397079467773, "global_step": 621501, "epoch": 7487} {"train_loss": -28.272729873657227, "global_step": 621502, "epoch": 7487} {"train_loss": -27.913499510431866, "global_step": 621503, "epoch": 7487, "val_loss": 6569885.0} {"train_loss": -27.917499542236328, "global_step": 621504, "epoch": 7488} {"train_loss": -27.821863174438477, "global_step": 621505, "epoch": 7488} {"train_loss": -27.87409019470215, "global_step": 621506, "epoch": 7488} {"train_loss": -28.16900634765625, "global_step": 621507, "epoch": 7488} {"train_loss": -27.801193237304688, "global_step": 621508, "epoch": 7488} {"train_loss": -27.933752059936523, "global_step": 621509, "epoch": 7488} {"train_loss": -27.5960636138916, "global_step": 621510, "epoch": 7488} {"train_loss": -27.62299156188965, "global_step": 621511, "epoch": 7488} {"train_loss": -27.980329513549805, "global_step": 621512, "epoch": 7488} {"train_loss": -28.171207427978516, "global_step": 621513, "epoch": 7488} {"train_loss": -27.980466842651367, "global_step": 621514, "epoch": 7488} {"train_loss": -28.091968536376953, "global_step": 621515, "epoch": 7488} {"train_loss": -27.769102096557617, "global_step": 621516, "epoch": 7488} {"train_loss": -28.020416259765625, "global_step": 621517, "epoch": 7488} {"train_loss": -28.14851188659668, "global_step": 621518, "epoch": 7488} {"train_loss": -28.183698654174805, "global_step": 621519, "epoch": 7488} {"train_loss": -28.236377716064453, "global_step": 621520, "epoch": 7488} {"train_loss": -27.912078857421875, "global_step": 621521, "epoch": 7488} {"train_loss": -27.980138778686523, "global_step": 621522, "epoch": 7488} {"train_loss": -28.079736709594727, "global_step": 621523, "epoch": 7488} {"train_loss": -28.08583641052246, "global_step": 621524, "epoch": 7488} {"train_loss": -28.074689865112305, "global_step": 621525, "epoch": 7488} {"train_loss": -28.2952938079834, "global_step": 621526, "epoch": 7488} {"train_loss": -28.2050724029541, "global_step": 621527, "epoch": 7488} {"train_loss": -28.636886596679688, "global_step": 621528, "epoch": 7488} {"train_loss": -27.99637794494629, "global_step": 621529, "epoch": 7488} {"train_loss": -28.384796142578125, "global_step": 621530, "epoch": 7488} {"train_loss": -27.860870361328125, "global_step": 621531, "epoch": 7488} {"train_loss": -28.33963394165039, "global_step": 621532, "epoch": 7488} {"train_loss": -28.103139877319336, "global_step": 621533, "epoch": 7488} {"train_loss": -28.13525390625, "global_step": 621534, "epoch": 7488} {"train_loss": -28.252851486206055, "global_step": 621535, "epoch": 7488} {"train_loss": -27.63279151916504, "global_step": 621536, "epoch": 7488} {"train_loss": -28.186628341674805, "global_step": 621537, "epoch": 7488} {"train_loss": -28.187015533447266, "global_step": 621538, "epoch": 7488} {"train_loss": -28.18654441833496, "global_step": 621539, "epoch": 7488} {"train_loss": -28.19515037536621, "global_step": 621540, "epoch": 7488} {"train_loss": -28.118810653686523, "global_step": 621541, "epoch": 7488} {"train_loss": -28.331811904907227, "global_step": 621542, "epoch": 7488} {"train_loss": -28.02909278869629, "global_step": 621543, "epoch": 7488} {"train_loss": -28.266550064086914, "global_step": 621544, "epoch": 7488} {"train_loss": -27.9708309173584, "global_step": 621545, "epoch": 7488} {"train_loss": -28.15549659729004, "global_step": 621546, "epoch": 7488} {"train_loss": -27.980350494384766, "global_step": 621547, "epoch": 7488} {"train_loss": -28.402332305908203, "global_step": 621548, "epoch": 7488} {"train_loss": -27.907135009765625, "global_step": 621549, "epoch": 7488} {"train_loss": -28.057249069213867, "global_step": 621550, "epoch": 7488} {"train_loss": -28.36464500427246, "global_step": 621551, "epoch": 7488} {"train_loss": -28.548004150390625, "global_step": 621552, "epoch": 7488} {"train_loss": -28.447528839111328, "global_step": 621553, "epoch": 7488} {"train_loss": -28.253747940063477, "global_step": 621554, "epoch": 7488} {"train_loss": -28.2596378326416, "global_step": 621555, "epoch": 7488} {"train_loss": -27.783920288085938, "global_step": 621556, "epoch": 7488} {"train_loss": -28.12940788269043, "global_step": 621557, "epoch": 7488} {"train_loss": -27.976598739624023, "global_step": 621558, "epoch": 7488} {"train_loss": -28.209386825561523, "global_step": 621559, "epoch": 7488} {"train_loss": -28.375593185424805, "global_step": 621560, "epoch": 7488} {"train_loss": -27.944257736206055, "global_step": 621561, "epoch": 7488} {"train_loss": -28.40253257751465, "global_step": 621562, "epoch": 7488} {"train_loss": -28.3931941986084, "global_step": 621563, "epoch": 7488} {"train_loss": -28.4826602935791, "global_step": 621564, "epoch": 7488} {"train_loss": -28.177762985229492, "global_step": 621565, "epoch": 7488} {"train_loss": -28.449254989624023, "global_step": 621566, "epoch": 7488} {"train_loss": -28.24136734008789, "global_step": 621567, "epoch": 7488} {"train_loss": -28.437549591064453, "global_step": 621568, "epoch": 7488} {"train_loss": -28.010604858398438, "global_step": 621569, "epoch": 7488} {"train_loss": -28.60236167907715, "global_step": 621570, "epoch": 7488} {"train_loss": -28.23828125, "global_step": 621571, "epoch": 7488} {"train_loss": -27.91599464416504, "global_step": 621572, "epoch": 7488} {"train_loss": -28.37892723083496, "global_step": 621573, "epoch": 7488} {"train_loss": -28.31094741821289, "global_step": 621574, "epoch": 7488} {"train_loss": -28.094715118408203, "global_step": 621575, "epoch": 7488} {"train_loss": -28.51275634765625, "global_step": 621576, "epoch": 7488} {"train_loss": -28.347150802612305, "global_step": 621577, "epoch": 7488} {"train_loss": -27.98138999938965, "global_step": 621578, "epoch": 7488} {"train_loss": -28.58829689025879, "global_step": 621579, "epoch": 7488} {"train_loss": -28.6720027923584, "global_step": 621580, "epoch": 7488} {"train_loss": -28.16064453125, "global_step": 621581, "epoch": 7488} {"train_loss": -28.1318359375, "global_step": 621582, "epoch": 7488} {"train_loss": -28.23211669921875, "global_step": 621583, "epoch": 7488} {"train_loss": -28.625097274780273, "global_step": 621584, "epoch": 7488} {"train_loss": -28.176197052001953, "global_step": 621585, "epoch": 7488} {"train_loss": -28.160440651767225, "global_step": 621586, "epoch": 7488, "val_loss": 6682261.5} {"train_loss": -27.147018432617188, "global_step": 621587, "epoch": 7489} {"train_loss": -26.230438232421875, "global_step": 621588, "epoch": 7489} {"train_loss": -26.91645622253418, "global_step": 621589, "epoch": 7489} {"train_loss": -27.127002716064453, "global_step": 621590, "epoch": 7489} {"train_loss": -26.71039390563965, "global_step": 621591, "epoch": 7489} {"train_loss": -26.739227294921875, "global_step": 621592, "epoch": 7489} {"train_loss": -27.57736587524414, "global_step": 621593, "epoch": 7489} {"train_loss": -26.527252197265625, "global_step": 621594, "epoch": 7489} {"train_loss": -27.9622802734375, "global_step": 621595, "epoch": 7489} {"train_loss": -26.896728515625, "global_step": 621596, "epoch": 7489} {"train_loss": -27.898788452148438, "global_step": 621597, "epoch": 7489} {"train_loss": -26.617712020874023, "global_step": 621598, "epoch": 7489} {"train_loss": -27.951459884643555, "global_step": 621599, "epoch": 7489} {"train_loss": -27.12818717956543, "global_step": 621600, "epoch": 7489} {"train_loss": -27.651914596557617, "global_step": 621601, "epoch": 7489} {"train_loss": -27.63920021057129, "global_step": 621602, "epoch": 7489} {"train_loss": -27.798267364501953, "global_step": 621603, "epoch": 7489} {"train_loss": -27.816431045532227, "global_step": 621604, "epoch": 7489} {"train_loss": -27.36297035217285, "global_step": 621605, "epoch": 7489} {"train_loss": -27.427627563476562, "global_step": 621606, "epoch": 7489} {"train_loss": -27.9625186920166, "global_step": 621607, "epoch": 7489} {"train_loss": -27.529224395751953, "global_step": 621608, "epoch": 7489} {"train_loss": -28.013132095336914, "global_step": 621609, "epoch": 7489} {"train_loss": -27.521595001220703, "global_step": 621610, "epoch": 7489} {"train_loss": -27.3328857421875, "global_step": 621611, "epoch": 7489} {"train_loss": -27.58180809020996, "global_step": 621612, "epoch": 7489} {"train_loss": -28.021163940429688, "global_step": 621613, "epoch": 7489} {"train_loss": -27.653928756713867, "global_step": 621614, "epoch": 7489} {"train_loss": -27.253355026245117, "global_step": 621615, "epoch": 7489} {"train_loss": -27.12192726135254, "global_step": 621616, "epoch": 7489} {"train_loss": -27.612478256225586, "global_step": 621617, "epoch": 7489} {"train_loss": -27.79627799987793, "global_step": 621618, "epoch": 7489} {"train_loss": -27.459747314453125, "global_step": 621619, "epoch": 7489} {"train_loss": -27.586984634399414, "global_step": 621620, "epoch": 7489} {"train_loss": -27.8532657623291, "global_step": 621621, "epoch": 7489} {"train_loss": -27.704877853393555, "global_step": 621622, "epoch": 7489} {"train_loss": -27.8441162109375, "global_step": 621623, "epoch": 7489} {"train_loss": -27.428211212158203, "global_step": 621624, "epoch": 7489} {"train_loss": -27.90150260925293, "global_step": 621625, "epoch": 7489} {"train_loss": -28.020355224609375, "global_step": 621626, "epoch": 7489} {"train_loss": -28.113052368164062, "global_step": 621627, "epoch": 7489} {"train_loss": -28.13030433654785, "global_step": 621628, "epoch": 7489} {"train_loss": -28.22439956665039, "global_step": 621629, "epoch": 7489} {"train_loss": -28.237375259399414, "global_step": 621630, "epoch": 7489} {"train_loss": -27.808582305908203, "global_step": 621631, "epoch": 7489} {"train_loss": -27.8978328704834, "global_step": 621632, "epoch": 7489} {"train_loss": -28.12897300720215, "global_step": 621633, "epoch": 7489} {"train_loss": -28.159223556518555, "global_step": 621634, "epoch": 7489} {"train_loss": -28.117721557617188, "global_step": 621635, "epoch": 7489} {"train_loss": -28.106664657592773, "global_step": 621636, "epoch": 7489} {"train_loss": -28.2167911529541, "global_step": 621637, "epoch": 7489} {"train_loss": -27.89874839782715, "global_step": 621638, "epoch": 7489} {"train_loss": -28.3001651763916, "global_step": 621639, "epoch": 7489} {"train_loss": -28.174747467041016, "global_step": 621640, "epoch": 7489} {"train_loss": -28.15229606628418, "global_step": 621641, "epoch": 7489} {"train_loss": -28.205774307250977, "global_step": 621642, "epoch": 7489} {"train_loss": -27.398029327392578, "global_step": 621643, "epoch": 7489} {"train_loss": -26.95747184753418, "global_step": 621644, "epoch": 7489} {"train_loss": -26.52363395690918, "global_step": 621645, "epoch": 7489} {"train_loss": -28.195898056030273, "global_step": 621646, "epoch": 7489} {"train_loss": -27.326587677001953, "global_step": 621647, "epoch": 7489} {"train_loss": -27.311487197875977, "global_step": 621648, "epoch": 7489} {"train_loss": -28.266357421875, "global_step": 621649, "epoch": 7489} {"train_loss": -27.995990753173828, "global_step": 621650, "epoch": 7489} {"train_loss": -28.29366111755371, "global_step": 621651, "epoch": 7489} {"train_loss": -27.708463668823242, "global_step": 621652, "epoch": 7489} {"train_loss": -28.226886749267578, "global_step": 621653, "epoch": 7489} {"train_loss": -27.813684463500977, "global_step": 621654, "epoch": 7489} {"train_loss": -28.242624282836914, "global_step": 621655, "epoch": 7489} {"train_loss": -28.336801528930664, "global_step": 621656, "epoch": 7489} {"train_loss": -28.030447006225586, "global_step": 621657, "epoch": 7489} {"train_loss": -28.305419921875, "global_step": 621658, "epoch": 7489} {"train_loss": -28.19935417175293, "global_step": 621659, "epoch": 7489} {"train_loss": -28.2679443359375, "global_step": 621660, "epoch": 7489} {"train_loss": -28.066137313842773, "global_step": 621661, "epoch": 7489} {"train_loss": -28.481983184814453, "global_step": 621662, "epoch": 7489} {"train_loss": -28.26616859436035, "global_step": 621663, "epoch": 7489} {"train_loss": -28.020734786987305, "global_step": 621664, "epoch": 7489} {"train_loss": -27.988733291625977, "global_step": 621665, "epoch": 7489} {"train_loss": -28.183364868164062, "global_step": 621666, "epoch": 7489} {"train_loss": -27.961929321289062, "global_step": 621667, "epoch": 7489} {"train_loss": -28.16534423828125, "global_step": 621668, "epoch": 7489} {"train_loss": -27.773279925426806, "global_step": 621669, "epoch": 7489, "val_loss": 6599561.0} {"train_loss": -26.642602920532227, "global_step": 621670, "epoch": 7490} {"train_loss": -26.3099308013916, "global_step": 621671, "epoch": 7490} {"train_loss": -27.139577865600586, "global_step": 621672, "epoch": 7490} {"train_loss": -27.147144317626953, "global_step": 621673, "epoch": 7490} {"train_loss": -27.640094757080078, "global_step": 621674, "epoch": 7490} {"train_loss": -27.035627365112305, "global_step": 621675, "epoch": 7490} {"train_loss": -26.38533592224121, "global_step": 621676, "epoch": 7490} {"train_loss": -26.667200088500977, "global_step": 621677, "epoch": 7490} {"train_loss": -26.802785873413086, "global_step": 621678, "epoch": 7490} {"train_loss": -27.12908363342285, "global_step": 621679, "epoch": 7490} {"train_loss": -27.2464542388916, "global_step": 621680, "epoch": 7490} {"train_loss": -27.508270263671875, "global_step": 621681, "epoch": 7490} {"train_loss": -27.414106369018555, "global_step": 621682, "epoch": 7490} {"train_loss": -26.915607452392578, "global_step": 621683, "epoch": 7490} {"train_loss": -27.295001983642578, "global_step": 621684, "epoch": 7490} {"train_loss": -27.657928466796875, "global_step": 621685, "epoch": 7490} {"train_loss": -27.64251708984375, "global_step": 621686, "epoch": 7490} {"train_loss": -27.535633087158203, "global_step": 621687, "epoch": 7490} {"train_loss": -27.183563232421875, "global_step": 621688, "epoch": 7490} {"train_loss": -27.765661239624023, "global_step": 621689, "epoch": 7490} {"train_loss": -27.671422958374023, "global_step": 621690, "epoch": 7490} {"train_loss": -27.8798770904541, "global_step": 621691, "epoch": 7490} {"train_loss": -27.697866439819336, "global_step": 621692, "epoch": 7490} {"train_loss": -27.697528839111328, "global_step": 621693, "epoch": 7490} {"train_loss": -28.08741569519043, "global_step": 621694, "epoch": 7490} {"train_loss": -27.603952407836914, "global_step": 621695, "epoch": 7490} {"train_loss": -27.78919792175293, "global_step": 621696, "epoch": 7490} {"train_loss": -27.79095458984375, "global_step": 621697, "epoch": 7490} {"train_loss": -28.10556983947754, "global_step": 621698, "epoch": 7490} {"train_loss": -27.96253776550293, "global_step": 621699, "epoch": 7490} {"train_loss": -27.860300064086914, "global_step": 621700, "epoch": 7490} {"train_loss": -28.0365047454834, "global_step": 621701, "epoch": 7490} {"train_loss": -28.22297477722168, "global_step": 621702, "epoch": 7490} {"train_loss": -28.142475128173828, "global_step": 621703, "epoch": 7490} {"train_loss": -28.0738582611084, "global_step": 621704, "epoch": 7490} {"train_loss": -28.17439079284668, "global_step": 621705, "epoch": 7490} {"train_loss": -28.36713218688965, "global_step": 621706, "epoch": 7490} {"train_loss": -28.01387596130371, "global_step": 621707, "epoch": 7490} {"train_loss": -28.099945068359375, "global_step": 621708, "epoch": 7490} {"train_loss": -28.114328384399414, "global_step": 621709, "epoch": 7490} {"train_loss": -28.19923210144043, "global_step": 621710, "epoch": 7490} {"train_loss": -28.336322784423828, "global_step": 621711, "epoch": 7490} {"train_loss": -28.340087890625, "global_step": 621712, "epoch": 7490} {"train_loss": -28.318618774414062, "global_step": 621713, "epoch": 7490} {"train_loss": -28.547733306884766, "global_step": 621714, "epoch": 7490} {"train_loss": -28.30219078063965, "global_step": 621715, "epoch": 7490} {"train_loss": -28.52545166015625, "global_step": 621716, "epoch": 7490} {"train_loss": -28.265487670898438, "global_step": 621717, "epoch": 7490} {"train_loss": -28.14093017578125, "global_step": 621718, "epoch": 7490} {"train_loss": -28.3538818359375, "global_step": 621719, "epoch": 7490} {"train_loss": -28.509265899658203, "global_step": 621720, "epoch": 7490} {"train_loss": -28.006927490234375, "global_step": 621721, "epoch": 7490} {"train_loss": -28.18866539001465, "global_step": 621722, "epoch": 7490} {"train_loss": -28.321325302124023, "global_step": 621723, "epoch": 7490} {"train_loss": -28.320240020751953, "global_step": 621724, "epoch": 7490} {"train_loss": -28.786741256713867, "global_step": 621725, "epoch": 7490} {"train_loss": -28.05490493774414, "global_step": 621726, "epoch": 7490} {"train_loss": -27.83331298828125, "global_step": 621727, "epoch": 7490} {"train_loss": -28.23041343688965, "global_step": 621728, "epoch": 7490} {"train_loss": -28.542694091796875, "global_step": 621729, "epoch": 7490} {"train_loss": -27.866674423217773, "global_step": 621730, "epoch": 7490} {"train_loss": -28.410551071166992, "global_step": 621731, "epoch": 7490} {"train_loss": -27.7620849609375, "global_step": 621732, "epoch": 7490} {"train_loss": -28.075510025024414, "global_step": 621733, "epoch": 7490} {"train_loss": -27.925992965698242, "global_step": 621734, "epoch": 7490} {"train_loss": -27.866779327392578, "global_step": 621735, "epoch": 7490} {"train_loss": -28.15862464904785, "global_step": 621736, "epoch": 7490} {"train_loss": -27.900287628173828, "global_step": 621737, "epoch": 7490} {"train_loss": -28.005598068237305, "global_step": 621738, "epoch": 7490} {"train_loss": -28.22564697265625, "global_step": 621739, "epoch": 7490} {"train_loss": -28.1019229888916, "global_step": 621740, "epoch": 7490} {"train_loss": -28.351736068725586, "global_step": 621741, "epoch": 7490} {"train_loss": -28.28834342956543, "global_step": 621742, "epoch": 7490} {"train_loss": -28.167072296142578, "global_step": 621743, "epoch": 7490} {"train_loss": -28.2750301361084, "global_step": 621744, "epoch": 7490} {"train_loss": -28.31036949157715, "global_step": 621745, "epoch": 7490} {"train_loss": -28.1853084564209, "global_step": 621746, "epoch": 7490} {"train_loss": -28.571805953979492, "global_step": 621747, "epoch": 7490} {"train_loss": -28.461959838867188, "global_step": 621748, "epoch": 7490} {"train_loss": -28.156980514526367, "global_step": 621749, "epoch": 7490} {"train_loss": -28.433521270751953, "global_step": 621750, "epoch": 7490} {"train_loss": -28.2083740234375, "global_step": 621751, "epoch": 7490} {"train_loss": -27.92554416426693, "global_step": 621752, "epoch": 7490, "val_loss": 6654136.0} {"train_loss": -28.1600399017334, "global_step": 621753, "epoch": 7491} {"train_loss": -28.220029830932617, "global_step": 621754, "epoch": 7491} {"train_loss": -28.077417373657227, "global_step": 621755, "epoch": 7491} {"train_loss": -27.55780601501465, "global_step": 621756, "epoch": 7491} {"train_loss": -27.60576820373535, "global_step": 621757, "epoch": 7491} {"train_loss": -27.660932540893555, "global_step": 621758, "epoch": 7491} {"train_loss": -27.80707359313965, "global_step": 621759, "epoch": 7491} {"train_loss": -27.88941764831543, "global_step": 621760, "epoch": 7491} {"train_loss": -27.49690818786621, "global_step": 621761, "epoch": 7491} {"train_loss": -27.806854248046875, "global_step": 621762, "epoch": 7491} {"train_loss": -28.036212921142578, "global_step": 621763, "epoch": 7491} {"train_loss": -28.1416072845459, "global_step": 621764, "epoch": 7491} {"train_loss": -27.662851333618164, "global_step": 621765, "epoch": 7491} {"train_loss": -27.912405014038086, "global_step": 621766, "epoch": 7491} {"train_loss": -27.636280059814453, "global_step": 621767, "epoch": 7491} {"train_loss": -27.965988159179688, "global_step": 621768, "epoch": 7491} {"train_loss": -28.193918228149414, "global_step": 621769, "epoch": 7491} {"train_loss": -27.94598960876465, "global_step": 621770, "epoch": 7491} {"train_loss": -27.969953536987305, "global_step": 621771, "epoch": 7491} {"train_loss": -28.171527862548828, "global_step": 621772, "epoch": 7491} {"train_loss": -28.367752075195312, "global_step": 621773, "epoch": 7491} {"train_loss": -27.78922462463379, "global_step": 621774, "epoch": 7491} {"train_loss": -27.879852294921875, "global_step": 621775, "epoch": 7491} {"train_loss": -27.95914077758789, "global_step": 621776, "epoch": 7491} {"train_loss": -27.974411010742188, "global_step": 621777, "epoch": 7491} {"train_loss": -28.057592391967773, "global_step": 621778, "epoch": 7491} {"train_loss": -27.827829360961914, "global_step": 621779, "epoch": 7491} {"train_loss": -27.993871688842773, "global_step": 621780, "epoch": 7491} {"train_loss": -28.26600456237793, "global_step": 621781, "epoch": 7491} {"train_loss": -28.448699951171875, "global_step": 621782, "epoch": 7491} {"train_loss": -28.05999755859375, "global_step": 621783, "epoch": 7491} {"train_loss": -28.654321670532227, "global_step": 621784, "epoch": 7491} {"train_loss": -28.14497184753418, "global_step": 621785, "epoch": 7491} {"train_loss": -28.084280014038086, "global_step": 621786, "epoch": 7491} {"train_loss": -28.337976455688477, "global_step": 621787, "epoch": 7491} {"train_loss": -28.0372257232666, "global_step": 621788, "epoch": 7491} {"train_loss": -28.203603744506836, "global_step": 621789, "epoch": 7491} {"train_loss": -28.13799476623535, "global_step": 621790, "epoch": 7491} {"train_loss": -28.1528377532959, "global_step": 621791, "epoch": 7491} {"train_loss": -28.453699111938477, "global_step": 621792, "epoch": 7491} {"train_loss": -27.969379425048828, "global_step": 621793, "epoch": 7491} {"train_loss": -27.784894943237305, "global_step": 621794, "epoch": 7491} {"train_loss": -28.18755531311035, "global_step": 621795, "epoch": 7491} {"train_loss": -28.119043350219727, "global_step": 621796, "epoch": 7491} {"train_loss": -27.88641929626465, "global_step": 621797, "epoch": 7491} {"train_loss": -28.036710739135742, "global_step": 621798, "epoch": 7491} {"train_loss": -27.88982582092285, "global_step": 621799, "epoch": 7491} {"train_loss": -27.907621383666992, "global_step": 621800, "epoch": 7491} {"train_loss": -27.831823348999023, "global_step": 621801, "epoch": 7491} {"train_loss": -28.193342208862305, "global_step": 621802, "epoch": 7491} {"train_loss": -28.206815719604492, "global_step": 621803, "epoch": 7491} {"train_loss": -27.880725860595703, "global_step": 621804, "epoch": 7491} {"train_loss": -28.242658615112305, "global_step": 621805, "epoch": 7491} {"train_loss": -27.9744873046875, "global_step": 621806, "epoch": 7491} {"train_loss": -28.030237197875977, "global_step": 621807, "epoch": 7491} {"train_loss": -28.355497360229492, "global_step": 621808, "epoch": 7491} {"train_loss": -28.466922760009766, "global_step": 621809, "epoch": 7491} {"train_loss": -28.124128341674805, "global_step": 621810, "epoch": 7491} {"train_loss": -28.125219345092773, "global_step": 621811, "epoch": 7491} {"train_loss": -28.043170928955078, "global_step": 621812, "epoch": 7491} {"train_loss": -28.077594757080078, "global_step": 621813, "epoch": 7491} {"train_loss": -28.092777252197266, "global_step": 621814, "epoch": 7491} {"train_loss": -27.541410446166992, "global_step": 621815, "epoch": 7491} {"train_loss": -28.101795196533203, "global_step": 621816, "epoch": 7491} {"train_loss": -28.2568302154541, "global_step": 621817, "epoch": 7491} {"train_loss": -28.305280685424805, "global_step": 621818, "epoch": 7491} {"train_loss": -28.286630630493164, "global_step": 621819, "epoch": 7491} {"train_loss": -28.014911651611328, "global_step": 621820, "epoch": 7491} {"train_loss": -27.978317260742188, "global_step": 621821, "epoch": 7491} {"train_loss": -27.862512588500977, "global_step": 621822, "epoch": 7491} {"train_loss": -28.294538497924805, "global_step": 621823, "epoch": 7491} {"train_loss": -28.033788681030273, "global_step": 621824, "epoch": 7491} {"train_loss": -28.230621337890625, "global_step": 621825, "epoch": 7491} {"train_loss": -28.06512451171875, "global_step": 621826, "epoch": 7491} {"train_loss": -28.099273681640625, "global_step": 621827, "epoch": 7491} {"train_loss": -28.45416831970215, "global_step": 621828, "epoch": 7491} {"train_loss": -27.900068283081055, "global_step": 621829, "epoch": 7491} {"train_loss": -28.381601333618164, "global_step": 621830, "epoch": 7491} {"train_loss": -28.328088760375977, "global_step": 621831, "epoch": 7491} {"train_loss": -28.4388484954834, "global_step": 621832, "epoch": 7491} {"train_loss": -27.870868682861328, "global_step": 621833, "epoch": 7491} {"train_loss": -28.276691436767578, "global_step": 621834, "epoch": 7491} {"train_loss": -28.04845228539892, "global_step": 621835, "epoch": 7491, "val_loss": 6610191.0} {"train_loss": -27.356847763061523, "global_step": 621836, "epoch": 7492} {"train_loss": -27.239423751831055, "global_step": 621837, "epoch": 7492} {"train_loss": -27.985944747924805, "global_step": 621838, "epoch": 7492} {"train_loss": -27.360187530517578, "global_step": 621839, "epoch": 7492} {"train_loss": -27.58281898498535, "global_step": 621840, "epoch": 7492} {"train_loss": -27.97391128540039, "global_step": 621841, "epoch": 7492} {"train_loss": -27.57557487487793, "global_step": 621842, "epoch": 7492} {"train_loss": -28.15757179260254, "global_step": 621843, "epoch": 7492} {"train_loss": -28.0010986328125, "global_step": 621844, "epoch": 7492} {"train_loss": -27.95751953125, "global_step": 621845, "epoch": 7492} {"train_loss": -28.06735610961914, "global_step": 621846, "epoch": 7492} {"train_loss": -28.06702995300293, "global_step": 621847, "epoch": 7492} {"train_loss": -28.038410186767578, "global_step": 621848, "epoch": 7492} {"train_loss": -28.111408233642578, "global_step": 621849, "epoch": 7492} {"train_loss": -28.428436279296875, "global_step": 621850, "epoch": 7492} {"train_loss": -28.13520622253418, "global_step": 621851, "epoch": 7492} {"train_loss": -27.94711685180664, "global_step": 621852, "epoch": 7492} {"train_loss": -27.793188095092773, "global_step": 621853, "epoch": 7492} {"train_loss": -28.231189727783203, "global_step": 621854, "epoch": 7492} {"train_loss": -28.011255264282227, "global_step": 621855, "epoch": 7492} {"train_loss": -28.606290817260742, "global_step": 621856, "epoch": 7492} {"train_loss": -28.317785263061523, "global_step": 621857, "epoch": 7492} {"train_loss": -28.000761032104492, "global_step": 621858, "epoch": 7492} {"train_loss": -27.94487953186035, "global_step": 621859, "epoch": 7492} {"train_loss": -27.90952491760254, "global_step": 621860, "epoch": 7492} {"train_loss": -28.287519454956055, "global_step": 621861, "epoch": 7492} {"train_loss": -28.085187911987305, "global_step": 621862, "epoch": 7492} {"train_loss": -28.228870391845703, "global_step": 621863, "epoch": 7492} {"train_loss": -27.860509872436523, "global_step": 621864, "epoch": 7492} {"train_loss": -28.52948570251465, "global_step": 621865, "epoch": 7492} {"train_loss": -27.983057022094727, "global_step": 621866, "epoch": 7492} {"train_loss": -28.295557022094727, "global_step": 621867, "epoch": 7492} {"train_loss": -28.339502334594727, "global_step": 621868, "epoch": 7492} {"train_loss": -28.28387451171875, "global_step": 621869, "epoch": 7492} {"train_loss": -27.90024757385254, "global_step": 621870, "epoch": 7492} {"train_loss": -28.124454498291016, "global_step": 621871, "epoch": 7492} {"train_loss": -27.992109298706055, "global_step": 621872, "epoch": 7492} {"train_loss": -27.908918380737305, "global_step": 621873, "epoch": 7492} {"train_loss": -28.294330596923828, "global_step": 621874, "epoch": 7492} {"train_loss": -28.07958984375, "global_step": 621875, "epoch": 7492} {"train_loss": -27.76020622253418, "global_step": 621876, "epoch": 7492} {"train_loss": -28.4212646484375, "global_step": 621877, "epoch": 7492} {"train_loss": -27.971338272094727, "global_step": 621878, "epoch": 7492} {"train_loss": -27.444751739501953, "global_step": 621879, "epoch": 7492} {"train_loss": -28.347742080688477, "global_step": 621880, "epoch": 7492} {"train_loss": -27.99299430847168, "global_step": 621881, "epoch": 7492} {"train_loss": -28.192712783813477, "global_step": 621882, "epoch": 7492} {"train_loss": -28.23402214050293, "global_step": 621883, "epoch": 7492} {"train_loss": -28.371458053588867, "global_step": 621884, "epoch": 7492} {"train_loss": -28.33928871154785, "global_step": 621885, "epoch": 7492} {"train_loss": -28.075159072875977, "global_step": 621886, "epoch": 7492} {"train_loss": -28.545469284057617, "global_step": 621887, "epoch": 7492} {"train_loss": -28.3927059173584, "global_step": 621888, "epoch": 7492} {"train_loss": -28.1654052734375, "global_step": 621889, "epoch": 7492} {"train_loss": -28.248388290405273, "global_step": 621890, "epoch": 7492} {"train_loss": -28.480743408203125, "global_step": 621891, "epoch": 7492} {"train_loss": -28.46966552734375, "global_step": 621892, "epoch": 7492} {"train_loss": -28.393980026245117, "global_step": 621893, "epoch": 7492} {"train_loss": -28.41895866394043, "global_step": 621894, "epoch": 7492} {"train_loss": -27.87055015563965, "global_step": 621895, "epoch": 7492} {"train_loss": -26.298908233642578, "global_step": 621896, "epoch": 7492} {"train_loss": -23.995935440063477, "global_step": 621897, "epoch": 7492} {"train_loss": -23.2553653717041, "global_step": 621898, "epoch": 7492} {"train_loss": -26.026077270507812, "global_step": 621899, "epoch": 7492} {"train_loss": -27.60566520690918, "global_step": 621900, "epoch": 7492} {"train_loss": -26.943557739257812, "global_step": 621901, "epoch": 7492} {"train_loss": -26.77815055847168, "global_step": 621902, "epoch": 7492} {"train_loss": -27.66253662109375, "global_step": 621903, "epoch": 7492} {"train_loss": -26.630834579467773, "global_step": 621904, "epoch": 7492} {"train_loss": -27.677221298217773, "global_step": 621905, "epoch": 7492} {"train_loss": -27.556909561157227, "global_step": 621906, "epoch": 7492} {"train_loss": -27.061063766479492, "global_step": 621907, "epoch": 7492} {"train_loss": -27.478540420532227, "global_step": 621908, "epoch": 7492} {"train_loss": -27.55719566345215, "global_step": 621909, "epoch": 7492} {"train_loss": -27.3604679107666, "global_step": 621910, "epoch": 7492} {"train_loss": -27.98935890197754, "global_step": 621911, "epoch": 7492} {"train_loss": -27.817724227905273, "global_step": 621912, "epoch": 7492} {"train_loss": -28.12407875061035, "global_step": 621913, "epoch": 7492} {"train_loss": -27.49319839477539, "global_step": 621914, "epoch": 7492} {"train_loss": -27.640722274780273, "global_step": 621915, "epoch": 7492} {"train_loss": -27.883264541625977, "global_step": 621916, "epoch": 7492} {"train_loss": -27.419525146484375, "global_step": 621917, "epoch": 7492} {"train_loss": -27.819219060691005, "global_step": 621918, "epoch": 7492, "val_loss": 6542475.0} {"train_loss": -27.39524269104004, "global_step": 621919, "epoch": 7493} {"train_loss": -27.774694442749023, "global_step": 621920, "epoch": 7493} {"train_loss": -27.475046157836914, "global_step": 621921, "epoch": 7493} {"train_loss": -27.73211669921875, "global_step": 621922, "epoch": 7493} {"train_loss": -27.703344345092773, "global_step": 621923, "epoch": 7493} {"train_loss": -27.44427490234375, "global_step": 621924, "epoch": 7493} {"train_loss": -27.542097091674805, "global_step": 621925, "epoch": 7493} {"train_loss": -27.362293243408203, "global_step": 621926, "epoch": 7493} {"train_loss": -27.58335304260254, "global_step": 621927, "epoch": 7493} {"train_loss": -27.683759689331055, "global_step": 621928, "epoch": 7493} {"train_loss": -27.677026748657227, "global_step": 621929, "epoch": 7493} {"train_loss": -27.404529571533203, "global_step": 621930, "epoch": 7493} {"train_loss": -27.677326202392578, "global_step": 621931, "epoch": 7493} {"train_loss": -27.68644142150879, "global_step": 621932, "epoch": 7493} {"train_loss": -27.780542373657227, "global_step": 621933, "epoch": 7493} {"train_loss": -27.717334747314453, "global_step": 621934, "epoch": 7493} {"train_loss": -27.930225372314453, "global_step": 621935, "epoch": 7493} {"train_loss": -27.848005294799805, "global_step": 621936, "epoch": 7493} {"train_loss": -27.749242782592773, "global_step": 621937, "epoch": 7493} {"train_loss": -27.935190200805664, "global_step": 621938, "epoch": 7493} {"train_loss": -27.822118759155273, "global_step": 621939, "epoch": 7493} {"train_loss": -28.142602920532227, "global_step": 621940, "epoch": 7493} {"train_loss": -27.96260643005371, "global_step": 621941, "epoch": 7493} {"train_loss": -27.887195587158203, "global_step": 621942, "epoch": 7493} {"train_loss": -27.999099731445312, "global_step": 621943, "epoch": 7493} {"train_loss": -27.724695205688477, "global_step": 621944, "epoch": 7493} {"train_loss": -28.131200790405273, "global_step": 621945, "epoch": 7493} {"train_loss": -27.9320068359375, "global_step": 621946, "epoch": 7493} {"train_loss": -28.187768936157227, "global_step": 621947, "epoch": 7493} {"train_loss": -27.793176651000977, "global_step": 621948, "epoch": 7493} {"train_loss": -28.079803466796875, "global_step": 621949, "epoch": 7493} {"train_loss": -28.2176570892334, "global_step": 621950, "epoch": 7493} {"train_loss": -27.82855796813965, "global_step": 621951, "epoch": 7493} {"train_loss": -27.8115177154541, "global_step": 621952, "epoch": 7493} {"train_loss": -28.39851188659668, "global_step": 621953, "epoch": 7493} {"train_loss": -28.2900447845459, "global_step": 621954, "epoch": 7493} {"train_loss": -28.42926025390625, "global_step": 621955, "epoch": 7493} {"train_loss": -28.256933212280273, "global_step": 621956, "epoch": 7493} {"train_loss": -28.44667625427246, "global_step": 621957, "epoch": 7493} {"train_loss": -28.39259147644043, "global_step": 621958, "epoch": 7493} {"train_loss": -28.13690757751465, "global_step": 621959, "epoch": 7493} {"train_loss": -28.31666374206543, "global_step": 621960, "epoch": 7493} {"train_loss": -28.330175399780273, "global_step": 621961, "epoch": 7493} {"train_loss": -28.2244815826416, "global_step": 621962, "epoch": 7493} {"train_loss": -28.420862197875977, "global_step": 621963, "epoch": 7493} {"train_loss": -27.903369903564453, "global_step": 621964, "epoch": 7493} {"train_loss": -28.160123825073242, "global_step": 621965, "epoch": 7493} {"train_loss": -28.5665283203125, "global_step": 621966, "epoch": 7493} {"train_loss": -28.533056259155273, "global_step": 621967, "epoch": 7493} {"train_loss": -27.926610946655273, "global_step": 621968, "epoch": 7493} {"train_loss": -28.00830078125, "global_step": 621969, "epoch": 7493} {"train_loss": -28.105920791625977, "global_step": 621970, "epoch": 7493} {"train_loss": -27.579343795776367, "global_step": 621971, "epoch": 7493} {"train_loss": -27.76167869567871, "global_step": 621972, "epoch": 7493} {"train_loss": -28.23176383972168, "global_step": 621973, "epoch": 7493} {"train_loss": -28.43848991394043, "global_step": 621974, "epoch": 7493} {"train_loss": -27.79212760925293, "global_step": 621975, "epoch": 7493} {"train_loss": -28.236433029174805, "global_step": 621976, "epoch": 7493} {"train_loss": -28.417724609375, "global_step": 621977, "epoch": 7493} {"train_loss": -28.0365047454834, "global_step": 621978, "epoch": 7493} {"train_loss": -27.793842315673828, "global_step": 621979, "epoch": 7493} {"train_loss": -27.612228393554688, "global_step": 621980, "epoch": 7493} {"train_loss": -28.4518985748291, "global_step": 621981, "epoch": 7493} {"train_loss": -27.945905685424805, "global_step": 621982, "epoch": 7493} {"train_loss": -28.075368881225586, "global_step": 621983, "epoch": 7493} {"train_loss": -28.100400924682617, "global_step": 621984, "epoch": 7493} {"train_loss": -28.025907516479492, "global_step": 621985, "epoch": 7493} {"train_loss": -28.057861328125, "global_step": 621986, "epoch": 7493} {"train_loss": -27.89812660217285, "global_step": 621987, "epoch": 7493} {"train_loss": -28.30939292907715, "global_step": 621988, "epoch": 7493} {"train_loss": -28.116247177124023, "global_step": 621989, "epoch": 7493} {"train_loss": -28.02593994140625, "global_step": 621990, "epoch": 7493} {"train_loss": -28.039066314697266, "global_step": 621991, "epoch": 7493} {"train_loss": -28.29958152770996, "global_step": 621992, "epoch": 7493} {"train_loss": -28.31254005432129, "global_step": 621993, "epoch": 7493} {"train_loss": -28.423038482666016, "global_step": 621994, "epoch": 7493} {"train_loss": -28.026838302612305, "global_step": 621995, "epoch": 7493} {"train_loss": -27.866336822509766, "global_step": 621996, "epoch": 7493} {"train_loss": -27.974639892578125, "global_step": 621997, "epoch": 7493} {"train_loss": -28.313077926635742, "global_step": 621998, "epoch": 7493} {"train_loss": -28.463315963745117, "global_step": 621999, "epoch": 7493} {"train_loss": -28.164228439331055, "global_step": 622000, "epoch": 7493} {"train_loss": -28.002451678356493, "global_step": 622001, "epoch": 7493, "val_loss": 6638111.0} {"train_loss": -28.0350341796875, "global_step": 622002, "epoch": 7494} {"train_loss": -27.787626266479492, "global_step": 622003, "epoch": 7494} {"train_loss": -27.693012237548828, "global_step": 622004, "epoch": 7494} {"train_loss": -27.404193878173828, "global_step": 622005, "epoch": 7494} {"train_loss": -28.02532386779785, "global_step": 622006, "epoch": 7494} {"train_loss": -27.820032119750977, "global_step": 622007, "epoch": 7494} {"train_loss": -27.893518447875977, "global_step": 622008, "epoch": 7494} {"train_loss": -27.870803833007812, "global_step": 622009, "epoch": 7494} {"train_loss": -27.77536392211914, "global_step": 622010, "epoch": 7494} {"train_loss": -27.89691162109375, "global_step": 622011, "epoch": 7494} {"train_loss": -28.131977081298828, "global_step": 622012, "epoch": 7494} {"train_loss": -27.526121139526367, "global_step": 622013, "epoch": 7494} {"train_loss": -28.2885799407959, "global_step": 622014, "epoch": 7494} {"train_loss": -27.21729850769043, "global_step": 622015, "epoch": 7494} {"train_loss": -28.26015281677246, "global_step": 622016, "epoch": 7494} {"train_loss": -28.1592960357666, "global_step": 622017, "epoch": 7494} {"train_loss": -28.207626342773438, "global_step": 622018, "epoch": 7494} {"train_loss": -28.15774917602539, "global_step": 622019, "epoch": 7494} {"train_loss": -28.029569625854492, "global_step": 622020, "epoch": 7494} {"train_loss": -27.943052291870117, "global_step": 622021, "epoch": 7494} {"train_loss": -28.416967391967773, "global_step": 622022, "epoch": 7494} {"train_loss": -28.37925148010254, "global_step": 622023, "epoch": 7494} {"train_loss": -27.995153427124023, "global_step": 622024, "epoch": 7494} {"train_loss": -28.45182228088379, "global_step": 622025, "epoch": 7494} {"train_loss": -28.3170166015625, "global_step": 622026, "epoch": 7494} {"train_loss": -28.550262451171875, "global_step": 622027, "epoch": 7494} {"train_loss": -28.47393798828125, "global_step": 622028, "epoch": 7494} {"train_loss": -28.347097396850586, "global_step": 622029, "epoch": 7494} {"train_loss": -28.23093032836914, "global_step": 622030, "epoch": 7494} {"train_loss": -28.178308486938477, "global_step": 622031, "epoch": 7494} {"train_loss": -28.202550888061523, "global_step": 622032, "epoch": 7494} {"train_loss": -28.119916915893555, "global_step": 622033, "epoch": 7494} {"train_loss": -28.107009887695312, "global_step": 622034, "epoch": 7494} {"train_loss": -27.9951114654541, "global_step": 622035, "epoch": 7494} {"train_loss": -28.429508209228516, "global_step": 622036, "epoch": 7494} {"train_loss": -28.190784454345703, "global_step": 622037, "epoch": 7494} {"train_loss": -28.2744140625, "global_step": 622038, "epoch": 7494} {"train_loss": -28.284164428710938, "global_step": 622039, "epoch": 7494} {"train_loss": -27.989206314086914, "global_step": 622040, "epoch": 7494} {"train_loss": -27.841934204101562, "global_step": 622041, "epoch": 7494} {"train_loss": -28.197378158569336, "global_step": 622042, "epoch": 7494} {"train_loss": -28.4300594329834, "global_step": 622043, "epoch": 7494} {"train_loss": -28.715436935424805, "global_step": 622044, "epoch": 7494} {"train_loss": -28.06427574157715, "global_step": 622045, "epoch": 7494} {"train_loss": -28.12062644958496, "global_step": 622046, "epoch": 7494} {"train_loss": -28.278074264526367, "global_step": 622047, "epoch": 7494} {"train_loss": -28.266813278198242, "global_step": 622048, "epoch": 7494} {"train_loss": -28.1528263092041, "global_step": 622049, "epoch": 7494} {"train_loss": -28.18634605407715, "global_step": 622050, "epoch": 7494} {"train_loss": -27.816064834594727, "global_step": 622051, "epoch": 7494} {"train_loss": -28.467199325561523, "global_step": 622052, "epoch": 7494} {"train_loss": -28.138553619384766, "global_step": 622053, "epoch": 7494} {"train_loss": -28.3515625, "global_step": 622054, "epoch": 7494} {"train_loss": -28.290273666381836, "global_step": 622055, "epoch": 7494} {"train_loss": -28.179357528686523, "global_step": 622056, "epoch": 7494} {"train_loss": -28.85456657409668, "global_step": 622057, "epoch": 7494} {"train_loss": -28.403844833374023, "global_step": 622058, "epoch": 7494} {"train_loss": -28.291858673095703, "global_step": 622059, "epoch": 7494} {"train_loss": -28.70046043395996, "global_step": 622060, "epoch": 7494} {"train_loss": -28.072927474975586, "global_step": 622061, "epoch": 7494} {"train_loss": -27.928817749023438, "global_step": 622062, "epoch": 7494} {"train_loss": -27.8705997467041, "global_step": 622063, "epoch": 7494} {"train_loss": -28.009429931640625, "global_step": 622064, "epoch": 7494} {"train_loss": -27.915393829345703, "global_step": 622065, "epoch": 7494} {"train_loss": -28.324783325195312, "global_step": 622066, "epoch": 7494} {"train_loss": -28.26604652404785, "global_step": 622067, "epoch": 7494} {"train_loss": -28.62965202331543, "global_step": 622068, "epoch": 7494} {"train_loss": -28.319995880126953, "global_step": 622069, "epoch": 7494} {"train_loss": -28.582792282104492, "global_step": 622070, "epoch": 7494} {"train_loss": -28.24566078186035, "global_step": 622071, "epoch": 7494} {"train_loss": -28.33985710144043, "global_step": 622072, "epoch": 7494} {"train_loss": -28.3909854888916, "global_step": 622073, "epoch": 7494} {"train_loss": -28.226226806640625, "global_step": 622074, "epoch": 7494} {"train_loss": -28.5732479095459, "global_step": 622075, "epoch": 7494} {"train_loss": -28.196935653686523, "global_step": 622076, "epoch": 7494} {"train_loss": -28.27643394470215, "global_step": 622077, "epoch": 7494} {"train_loss": -28.18874168395996, "global_step": 622078, "epoch": 7494} {"train_loss": -27.987842559814453, "global_step": 622079, "epoch": 7494} {"train_loss": -28.001800537109375, "global_step": 622080, "epoch": 7494} {"train_loss": -28.100940704345703, "global_step": 622081, "epoch": 7494} {"train_loss": -28.2839298248291, "global_step": 622082, "epoch": 7494} {"train_loss": -28.7370662689209, "global_step": 622083, "epoch": 7494} {"train_loss": -28.181890694491834, "global_step": 622084, "epoch": 7494, "val_loss": 6720769.0} {"train_loss": -27.44378662109375, "global_step": 622085, "epoch": 7495} {"train_loss": -27.5438175201416, "global_step": 622086, "epoch": 7495} {"train_loss": -27.540796279907227, "global_step": 622087, "epoch": 7495} {"train_loss": -27.017963409423828, "global_step": 622088, "epoch": 7495} {"train_loss": -27.1893253326416, "global_step": 622089, "epoch": 7495} {"train_loss": -27.373641967773438, "global_step": 622090, "epoch": 7495} {"train_loss": -27.60394287109375, "global_step": 622091, "epoch": 7495} {"train_loss": -27.343524932861328, "global_step": 622092, "epoch": 7495} {"train_loss": -27.540058135986328, "global_step": 622093, "epoch": 7495} {"train_loss": -27.073938369750977, "global_step": 622094, "epoch": 7495} {"train_loss": -26.85593605041504, "global_step": 622095, "epoch": 7495} {"train_loss": -27.53095054626465, "global_step": 622096, "epoch": 7495} {"train_loss": -27.634180068969727, "global_step": 622097, "epoch": 7495} {"train_loss": -27.42537498474121, "global_step": 622098, "epoch": 7495} {"train_loss": -27.603803634643555, "global_step": 622099, "epoch": 7495} {"train_loss": -27.664602279663086, "global_step": 622100, "epoch": 7495} {"train_loss": -27.619726181030273, "global_step": 622101, "epoch": 7495} {"train_loss": -27.89131736755371, "global_step": 622102, "epoch": 7495} {"train_loss": -27.921545028686523, "global_step": 622103, "epoch": 7495} {"train_loss": -27.691720962524414, "global_step": 622104, "epoch": 7495} {"train_loss": -27.567646026611328, "global_step": 622105, "epoch": 7495} {"train_loss": -27.92420768737793, "global_step": 622106, "epoch": 7495} {"train_loss": -28.252349853515625, "global_step": 622107, "epoch": 7495} {"train_loss": -27.810684204101562, "global_step": 622108, "epoch": 7495} {"train_loss": -27.968896865844727, "global_step": 622109, "epoch": 7495} {"train_loss": -28.138315200805664, "global_step": 622110, "epoch": 7495} {"train_loss": -27.933212280273438, "global_step": 622111, "epoch": 7495} {"train_loss": -28.239124298095703, "global_step": 622112, "epoch": 7495} {"train_loss": -28.030384063720703, "global_step": 622113, "epoch": 7495} {"train_loss": -28.27353858947754, "global_step": 622114, "epoch": 7495} {"train_loss": -28.286130905151367, "global_step": 622115, "epoch": 7495} {"train_loss": -28.060592651367188, "global_step": 622116, "epoch": 7495} {"train_loss": -27.708789825439453, "global_step": 622117, "epoch": 7495} {"train_loss": -28.1452579498291, "global_step": 622118, "epoch": 7495} {"train_loss": -28.38458824157715, "global_step": 622119, "epoch": 7495} {"train_loss": -27.98577880859375, "global_step": 622120, "epoch": 7495} {"train_loss": -28.023344039916992, "global_step": 622121, "epoch": 7495} {"train_loss": -28.166156768798828, "global_step": 622122, "epoch": 7495} {"train_loss": -27.823928833007812, "global_step": 622123, "epoch": 7495} {"train_loss": -28.4554443359375, "global_step": 622124, "epoch": 7495} {"train_loss": -28.304471969604492, "global_step": 622125, "epoch": 7495} {"train_loss": -27.959623336791992, "global_step": 622126, "epoch": 7495} {"train_loss": -28.100910186767578, "global_step": 622127, "epoch": 7495} {"train_loss": -28.094430923461914, "global_step": 622128, "epoch": 7495} {"train_loss": -28.164228439331055, "global_step": 622129, "epoch": 7495} {"train_loss": -27.973352432250977, "global_step": 622130, "epoch": 7495} {"train_loss": -28.177417755126953, "global_step": 622131, "epoch": 7495} {"train_loss": -28.781896591186523, "global_step": 622132, "epoch": 7495} {"train_loss": -28.25665283203125, "global_step": 622133, "epoch": 7495} {"train_loss": -28.3675479888916, "global_step": 622134, "epoch": 7495} {"train_loss": -28.516468048095703, "global_step": 622135, "epoch": 7495} {"train_loss": -28.07230567932129, "global_step": 622136, "epoch": 7495} {"train_loss": -28.797346115112305, "global_step": 622137, "epoch": 7495} {"train_loss": -28.12917137145996, "global_step": 622138, "epoch": 7495} {"train_loss": -28.594806671142578, "global_step": 622139, "epoch": 7495} {"train_loss": -28.185413360595703, "global_step": 622140, "epoch": 7495} {"train_loss": -28.03665542602539, "global_step": 622141, "epoch": 7495} {"train_loss": -28.21919059753418, "global_step": 622142, "epoch": 7495} {"train_loss": -28.21026039123535, "global_step": 622143, "epoch": 7495} {"train_loss": -28.288476943969727, "global_step": 622144, "epoch": 7495} {"train_loss": -28.060800552368164, "global_step": 622145, "epoch": 7495} {"train_loss": -28.5416259765625, "global_step": 622146, "epoch": 7495} {"train_loss": -28.036975860595703, "global_step": 622147, "epoch": 7495} {"train_loss": -28.20842933654785, "global_step": 622148, "epoch": 7495} {"train_loss": -28.144330978393555, "global_step": 622149, "epoch": 7495} {"train_loss": -28.226728439331055, "global_step": 622150, "epoch": 7495} {"train_loss": -28.104368209838867, "global_step": 622151, "epoch": 7495} {"train_loss": -28.074445724487305, "global_step": 622152, "epoch": 7495} {"train_loss": -27.93364906311035, "global_step": 622153, "epoch": 7495} {"train_loss": -28.272321701049805, "global_step": 622154, "epoch": 7495} {"train_loss": -28.117902755737305, "global_step": 622155, "epoch": 7495} {"train_loss": -28.08811378479004, "global_step": 622156, "epoch": 7495} {"train_loss": -28.1953125, "global_step": 622157, "epoch": 7495} {"train_loss": -28.150821685791016, "global_step": 622158, "epoch": 7495} {"train_loss": -27.946762084960938, "global_step": 622159, "epoch": 7495} {"train_loss": -27.8828125, "global_step": 622160, "epoch": 7495} {"train_loss": -27.98456382751465, "global_step": 622161, "epoch": 7495} {"train_loss": -28.072336196899414, "global_step": 622162, "epoch": 7495} {"train_loss": -28.163129806518555, "global_step": 622163, "epoch": 7495} {"train_loss": -28.0819091796875, "global_step": 622164, "epoch": 7495} {"train_loss": -28.025781631469727, "global_step": 622165, "epoch": 7495} {"train_loss": -27.587095260620117, "global_step": 622166, "epoch": 7495} {"train_loss": -27.970277786254883, "global_step": 622167, "epoch": 7495, "val_loss": 6670114.0} {"train_loss": -27.22553062438965, "global_step": 622168, "epoch": 7496} {"train_loss": -27.409351348876953, "global_step": 622169, "epoch": 7496} {"train_loss": -26.526397705078125, "global_step": 622170, "epoch": 7496} {"train_loss": -26.336660385131836, "global_step": 622171, "epoch": 7496} {"train_loss": -26.71441078186035, "global_step": 622172, "epoch": 7496} {"train_loss": -27.285938262939453, "global_step": 622173, "epoch": 7496} {"train_loss": -26.640167236328125, "global_step": 622174, "epoch": 7496} {"train_loss": -27.007980346679688, "global_step": 622175, "epoch": 7496} {"train_loss": -26.955236434936523, "global_step": 622176, "epoch": 7496} {"train_loss": -27.375547409057617, "global_step": 622177, "epoch": 7496} {"train_loss": -27.064624786376953, "global_step": 622178, "epoch": 7496} {"train_loss": -27.175525665283203, "global_step": 622179, "epoch": 7496} {"train_loss": -27.656049728393555, "global_step": 622180, "epoch": 7496} {"train_loss": -27.164411544799805, "global_step": 622181, "epoch": 7496} {"train_loss": -27.140329360961914, "global_step": 622182, "epoch": 7496} {"train_loss": -27.79433250427246, "global_step": 622183, "epoch": 7496} {"train_loss": -27.589609146118164, "global_step": 622184, "epoch": 7496} {"train_loss": -27.528348922729492, "global_step": 622185, "epoch": 7496} {"train_loss": -27.648944854736328, "global_step": 622186, "epoch": 7496} {"train_loss": -27.747543334960938, "global_step": 622187, "epoch": 7496} {"train_loss": -27.372711181640625, "global_step": 622188, "epoch": 7496} {"train_loss": -27.811349868774414, "global_step": 622189, "epoch": 7496} {"train_loss": -27.46610450744629, "global_step": 622190, "epoch": 7496} {"train_loss": -27.433847427368164, "global_step": 622191, "epoch": 7496} {"train_loss": -27.652006149291992, "global_step": 622192, "epoch": 7496} {"train_loss": -27.664106369018555, "global_step": 622193, "epoch": 7496} {"train_loss": -27.598188400268555, "global_step": 622194, "epoch": 7496} {"train_loss": -27.968908309936523, "global_step": 622195, "epoch": 7496} {"train_loss": -27.9501895904541, "global_step": 622196, "epoch": 7496} {"train_loss": -27.668445587158203, "global_step": 622197, "epoch": 7496} {"train_loss": -27.51435661315918, "global_step": 622198, "epoch": 7496} {"train_loss": -28.185016632080078, "global_step": 622199, "epoch": 7496} {"train_loss": -27.887060165405273, "global_step": 622200, "epoch": 7496} {"train_loss": -28.080236434936523, "global_step": 622201, "epoch": 7496} {"train_loss": -28.251501083374023, "global_step": 622202, "epoch": 7496} {"train_loss": -27.403900146484375, "global_step": 622203, "epoch": 7496} {"train_loss": -27.966318130493164, "global_step": 622204, "epoch": 7496} {"train_loss": -28.08173179626465, "global_step": 622205, "epoch": 7496} {"train_loss": -28.3862361907959, "global_step": 622206, "epoch": 7496} {"train_loss": -28.1050968170166, "global_step": 622207, "epoch": 7496} {"train_loss": -28.022607803344727, "global_step": 622208, "epoch": 7496} {"train_loss": -28.311649322509766, "global_step": 622209, "epoch": 7496} {"train_loss": -28.164966583251953, "global_step": 622210, "epoch": 7496} {"train_loss": -28.01718521118164, "global_step": 622211, "epoch": 7496} {"train_loss": -28.16046142578125, "global_step": 622212, "epoch": 7496} {"train_loss": -28.36669921875, "global_step": 622213, "epoch": 7496} {"train_loss": -28.45049476623535, "global_step": 622214, "epoch": 7496} {"train_loss": -28.3138484954834, "global_step": 622215, "epoch": 7496} {"train_loss": -28.387592315673828, "global_step": 622216, "epoch": 7496} {"train_loss": -28.130496978759766, "global_step": 622217, "epoch": 7496} {"train_loss": -28.094039916992188, "global_step": 622218, "epoch": 7496} {"train_loss": -28.211938858032227, "global_step": 622219, "epoch": 7496} {"train_loss": -28.475549697875977, "global_step": 622220, "epoch": 7496} {"train_loss": -28.40668296813965, "global_step": 622221, "epoch": 7496} {"train_loss": -28.1611385345459, "global_step": 622222, "epoch": 7496} {"train_loss": -28.40398597717285, "global_step": 622223, "epoch": 7496} {"train_loss": -28.425159454345703, "global_step": 622224, "epoch": 7496} {"train_loss": -28.503528594970703, "global_step": 622225, "epoch": 7496} {"train_loss": -27.669309616088867, "global_step": 622226, "epoch": 7496} {"train_loss": -28.185688018798828, "global_step": 622227, "epoch": 7496} {"train_loss": -28.605321884155273, "global_step": 622228, "epoch": 7496} {"train_loss": -28.136627197265625, "global_step": 622229, "epoch": 7496} {"train_loss": -28.40809440612793, "global_step": 622230, "epoch": 7496} {"train_loss": -28.394987106323242, "global_step": 622231, "epoch": 7496} {"train_loss": -28.117050170898438, "global_step": 622232, "epoch": 7496} {"train_loss": -28.468612670898438, "global_step": 622233, "epoch": 7496} {"train_loss": -28.086286544799805, "global_step": 622234, "epoch": 7496} {"train_loss": -28.116790771484375, "global_step": 622235, "epoch": 7496} {"train_loss": -28.211088180541992, "global_step": 622236, "epoch": 7496} {"train_loss": -28.054162979125977, "global_step": 622237, "epoch": 7496} {"train_loss": -28.282958984375, "global_step": 622238, "epoch": 7496} {"train_loss": -28.092737197875977, "global_step": 622239, "epoch": 7496} {"train_loss": -28.0800724029541, "global_step": 622240, "epoch": 7496} {"train_loss": -28.147199630737305, "global_step": 622241, "epoch": 7496} {"train_loss": -28.134382247924805, "global_step": 622242, "epoch": 7496} {"train_loss": -28.43988037109375, "global_step": 622243, "epoch": 7496} {"train_loss": -27.89369010925293, "global_step": 622244, "epoch": 7496} {"train_loss": -28.710575103759766, "global_step": 622245, "epoch": 7496} {"train_loss": -28.026464462280273, "global_step": 622246, "epoch": 7496} {"train_loss": -28.201711654663086, "global_step": 622247, "epoch": 7496} {"train_loss": -28.528488159179688, "global_step": 622248, "epoch": 7496} {"train_loss": -28.367528915405273, "global_step": 622249, "epoch": 7496} {"train_loss": -27.885601618203772, "global_step": 622250, "epoch": 7496, "val_loss": 6842519.0} {"train_loss": -27.76803970336914, "global_step": 622251, "epoch": 7497} {"train_loss": -27.654775619506836, "global_step": 622252, "epoch": 7497} {"train_loss": -27.91322898864746, "global_step": 622253, "epoch": 7497} {"train_loss": -27.373260498046875, "global_step": 622254, "epoch": 7497} {"train_loss": -26.339651107788086, "global_step": 622255, "epoch": 7497} {"train_loss": -27.079151153564453, "global_step": 622256, "epoch": 7497} {"train_loss": -27.48833656311035, "global_step": 622257, "epoch": 7497} {"train_loss": -27.562301635742188, "global_step": 622258, "epoch": 7497} {"train_loss": -26.9763126373291, "global_step": 622259, "epoch": 7497} {"train_loss": -27.47271728515625, "global_step": 622260, "epoch": 7497} {"train_loss": -27.97612953186035, "global_step": 622261, "epoch": 7497} {"train_loss": -27.660755157470703, "global_step": 622262, "epoch": 7497} {"train_loss": -27.775861740112305, "global_step": 622263, "epoch": 7497} {"train_loss": -27.26901626586914, "global_step": 622264, "epoch": 7497} {"train_loss": -27.333072662353516, "global_step": 622265, "epoch": 7497} {"train_loss": -27.574609756469727, "global_step": 622266, "epoch": 7497} {"train_loss": -27.416608810424805, "global_step": 622267, "epoch": 7497} {"train_loss": -27.66547203063965, "global_step": 622268, "epoch": 7497} {"train_loss": -27.457172393798828, "global_step": 622269, "epoch": 7497} {"train_loss": -28.118741989135742, "global_step": 622270, "epoch": 7497} {"train_loss": -27.740514755249023, "global_step": 622271, "epoch": 7497} {"train_loss": -27.863739013671875, "global_step": 622272, "epoch": 7497} {"train_loss": -28.17555809020996, "global_step": 622273, "epoch": 7497} {"train_loss": -27.98409080505371, "global_step": 622274, "epoch": 7497} {"train_loss": -28.115619659423828, "global_step": 622275, "epoch": 7497} {"train_loss": -27.988080978393555, "global_step": 622276, "epoch": 7497} {"train_loss": -27.785810470581055, "global_step": 622277, "epoch": 7497} {"train_loss": -27.927671432495117, "global_step": 622278, "epoch": 7497} {"train_loss": -28.37237548828125, "global_step": 622279, "epoch": 7497} {"train_loss": -27.615665435791016, "global_step": 622280, "epoch": 7497} {"train_loss": -28.18927001953125, "global_step": 622281, "epoch": 7497} {"train_loss": -27.909940719604492, "global_step": 622282, "epoch": 7497} {"train_loss": -27.908063888549805, "global_step": 622283, "epoch": 7497} {"train_loss": -28.066986083984375, "global_step": 622284, "epoch": 7497} {"train_loss": -27.975751876831055, "global_step": 622285, "epoch": 7497} {"train_loss": -27.79072380065918, "global_step": 622286, "epoch": 7497} {"train_loss": -28.098424911499023, "global_step": 622287, "epoch": 7497} {"train_loss": -27.857391357421875, "global_step": 622288, "epoch": 7497} {"train_loss": -27.96759033203125, "global_step": 622289, "epoch": 7497} {"train_loss": -28.266443252563477, "global_step": 622290, "epoch": 7497} {"train_loss": -28.36383056640625, "global_step": 622291, "epoch": 7497} {"train_loss": -28.06635093688965, "global_step": 622292, "epoch": 7497} {"train_loss": -28.562427520751953, "global_step": 622293, "epoch": 7497} {"train_loss": -27.996084213256836, "global_step": 622294, "epoch": 7497} {"train_loss": -28.65007972717285, "global_step": 622295, "epoch": 7497} {"train_loss": -28.144601821899414, "global_step": 622296, "epoch": 7497} {"train_loss": -28.328693389892578, "global_step": 622297, "epoch": 7497} {"train_loss": -28.166778564453125, "global_step": 622298, "epoch": 7497} {"train_loss": -28.28128433227539, "global_step": 622299, "epoch": 7497} {"train_loss": -28.373865127563477, "global_step": 622300, "epoch": 7497} {"train_loss": -28.28399658203125, "global_step": 622301, "epoch": 7497} {"train_loss": -28.121091842651367, "global_step": 622302, "epoch": 7497} {"train_loss": -28.450531005859375, "global_step": 622303, "epoch": 7497} {"train_loss": -28.08619499206543, "global_step": 622304, "epoch": 7497} {"train_loss": -28.228595733642578, "global_step": 622305, "epoch": 7497} {"train_loss": -28.557113647460938, "global_step": 622306, "epoch": 7497} {"train_loss": -28.0915584564209, "global_step": 622307, "epoch": 7497} {"train_loss": -28.06642723083496, "global_step": 622308, "epoch": 7497} {"train_loss": -28.363683700561523, "global_step": 622309, "epoch": 7497} {"train_loss": -28.2163143157959, "global_step": 622310, "epoch": 7497} {"train_loss": -27.648868560791016, "global_step": 622311, "epoch": 7497} {"train_loss": -27.972126007080078, "global_step": 622312, "epoch": 7497} {"train_loss": -28.433094024658203, "global_step": 622313, "epoch": 7497} {"train_loss": -28.01796531677246, "global_step": 622314, "epoch": 7497} {"train_loss": -28.058868408203125, "global_step": 622315, "epoch": 7497} {"train_loss": -28.25126075744629, "global_step": 622316, "epoch": 7497} {"train_loss": -28.2061824798584, "global_step": 622317, "epoch": 7497} {"train_loss": -28.08222770690918, "global_step": 622318, "epoch": 7497} {"train_loss": -27.79865837097168, "global_step": 622319, "epoch": 7497} {"train_loss": -28.45350456237793, "global_step": 622320, "epoch": 7497} {"train_loss": -28.438684463500977, "global_step": 622321, "epoch": 7497} {"train_loss": -28.54701042175293, "global_step": 622322, "epoch": 7497} {"train_loss": -28.395538330078125, "global_step": 622323, "epoch": 7497} {"train_loss": -28.160663604736328, "global_step": 622324, "epoch": 7497} {"train_loss": -27.9704532623291, "global_step": 622325, "epoch": 7497} {"train_loss": -28.394338607788086, "global_step": 622326, "epoch": 7497} {"train_loss": -28.419647216796875, "global_step": 622327, "epoch": 7497} {"train_loss": -28.317052841186523, "global_step": 622328, "epoch": 7497} {"train_loss": -28.245466232299805, "global_step": 622329, "epoch": 7497} {"train_loss": -28.138858795166016, "global_step": 622330, "epoch": 7497} {"train_loss": -28.289569854736328, "global_step": 622331, "epoch": 7497} {"train_loss": -28.226886749267578, "global_step": 622332, "epoch": 7497} {"train_loss": -27.996462741530085, "global_step": 622333, "epoch": 7497, "val_loss": 6596467.0} {"train_loss": -27.580854415893555, "global_step": 622334, "epoch": 7498} {"train_loss": -26.65533447265625, "global_step": 622335, "epoch": 7498} {"train_loss": -27.583728790283203, "global_step": 622336, "epoch": 7498} {"train_loss": -27.580631256103516, "global_step": 622337, "epoch": 7498} {"train_loss": -27.893924713134766, "global_step": 622338, "epoch": 7498} {"train_loss": -27.503620147705078, "global_step": 622339, "epoch": 7498} {"train_loss": -26.598814010620117, "global_step": 622340, "epoch": 7498} {"train_loss": -27.005964279174805, "global_step": 622341, "epoch": 7498} {"train_loss": -26.746793746948242, "global_step": 622342, "epoch": 7498} {"train_loss": -27.624164581298828, "global_step": 622343, "epoch": 7498} {"train_loss": -27.290292739868164, "global_step": 622344, "epoch": 7498} {"train_loss": -27.347721099853516, "global_step": 622345, "epoch": 7498} {"train_loss": -27.741003036499023, "global_step": 622346, "epoch": 7498} {"train_loss": -27.78497886657715, "global_step": 622347, "epoch": 7498} {"train_loss": -27.171430587768555, "global_step": 622348, "epoch": 7498} {"train_loss": -27.15488052368164, "global_step": 622349, "epoch": 7498} {"train_loss": -27.255346298217773, "global_step": 622350, "epoch": 7498} {"train_loss": -27.42978286743164, "global_step": 622351, "epoch": 7498} {"train_loss": -27.914636611938477, "global_step": 622352, "epoch": 7498} {"train_loss": -27.7366886138916, "global_step": 622353, "epoch": 7498} {"train_loss": -27.685209274291992, "global_step": 622354, "epoch": 7498} {"train_loss": -27.936853408813477, "global_step": 622355, "epoch": 7498} {"train_loss": -27.744552612304688, "global_step": 622356, "epoch": 7498} {"train_loss": -27.757680892944336, "global_step": 622357, "epoch": 7498} {"train_loss": -27.843175888061523, "global_step": 622358, "epoch": 7498} {"train_loss": -28.254114151000977, "global_step": 622359, "epoch": 7498} {"train_loss": -27.967864990234375, "global_step": 622360, "epoch": 7498} {"train_loss": -28.12652015686035, "global_step": 622361, "epoch": 7498} {"train_loss": -27.689828872680664, "global_step": 622362, "epoch": 7498} {"train_loss": -27.767038345336914, "global_step": 622363, "epoch": 7498} {"train_loss": -28.371259689331055, "global_step": 622364, "epoch": 7498} {"train_loss": -27.890918731689453, "global_step": 622365, "epoch": 7498} {"train_loss": -27.73707389831543, "global_step": 622366, "epoch": 7498} {"train_loss": -28.10283851623535, "global_step": 622367, "epoch": 7498} {"train_loss": -27.965442657470703, "global_step": 622368, "epoch": 7498} {"train_loss": -28.71930503845215, "global_step": 622369, "epoch": 7498} {"train_loss": -28.06891441345215, "global_step": 622370, "epoch": 7498} {"train_loss": -28.1785831451416, "global_step": 622371, "epoch": 7498} {"train_loss": -28.088674545288086, "global_step": 622372, "epoch": 7498} {"train_loss": -28.341949462890625, "global_step": 622373, "epoch": 7498} {"train_loss": -28.300073623657227, "global_step": 622374, "epoch": 7498} {"train_loss": -28.079395294189453, "global_step": 622375, "epoch": 7498} {"train_loss": -28.113813400268555, "global_step": 622376, "epoch": 7498} {"train_loss": -28.045515060424805, "global_step": 622377, "epoch": 7498} {"train_loss": -28.78680992126465, "global_step": 622378, "epoch": 7498} {"train_loss": -28.282596588134766, "global_step": 622379, "epoch": 7498} {"train_loss": -28.30177879333496, "global_step": 622380, "epoch": 7498} {"train_loss": -28.162580490112305, "global_step": 622381, "epoch": 7498} {"train_loss": -28.243616104125977, "global_step": 622382, "epoch": 7498} {"train_loss": -28.307538986206055, "global_step": 622383, "epoch": 7498} {"train_loss": -28.182987213134766, "global_step": 622384, "epoch": 7498} {"train_loss": -28.507028579711914, "global_step": 622385, "epoch": 7498} {"train_loss": -28.3749942779541, "global_step": 622386, "epoch": 7498} {"train_loss": -28.276769638061523, "global_step": 622387, "epoch": 7498} {"train_loss": -28.121137619018555, "global_step": 622388, "epoch": 7498} {"train_loss": -28.435972213745117, "global_step": 622389, "epoch": 7498} {"train_loss": -28.606897354125977, "global_step": 622390, "epoch": 7498} {"train_loss": -28.196203231811523, "global_step": 622391, "epoch": 7498} {"train_loss": -28.431562423706055, "global_step": 622392, "epoch": 7498} {"train_loss": -28.30097770690918, "global_step": 622393, "epoch": 7498} {"train_loss": -28.067859649658203, "global_step": 622394, "epoch": 7498} {"train_loss": -28.194196701049805, "global_step": 622395, "epoch": 7498} {"train_loss": -28.338031768798828, "global_step": 622396, "epoch": 7498} {"train_loss": -28.125568389892578, "global_step": 622397, "epoch": 7498} {"train_loss": -28.558713912963867, "global_step": 622398, "epoch": 7498} {"train_loss": -28.592914581298828, "global_step": 622399, "epoch": 7498} {"train_loss": -28.191434860229492, "global_step": 622400, "epoch": 7498} {"train_loss": -28.37354850769043, "global_step": 622401, "epoch": 7498} {"train_loss": -28.397558212280273, "global_step": 622402, "epoch": 7498} {"train_loss": -28.444580078125, "global_step": 622403, "epoch": 7498} {"train_loss": -28.499074935913086, "global_step": 622404, "epoch": 7498} {"train_loss": -27.94012451171875, "global_step": 622405, "epoch": 7498} {"train_loss": -27.56214714050293, "global_step": 622406, "epoch": 7498} {"train_loss": -26.94904899597168, "global_step": 622407, "epoch": 7498} {"train_loss": -25.457550048828125, "global_step": 622408, "epoch": 7498} {"train_loss": -26.4676456451416, "global_step": 622409, "epoch": 7498} {"train_loss": -28.070449829101562, "global_step": 622410, "epoch": 7498} {"train_loss": -27.520421981811523, "global_step": 622411, "epoch": 7498} {"train_loss": -27.789987564086914, "global_step": 622412, "epoch": 7498} {"train_loss": -27.360563278198242, "global_step": 622413, "epoch": 7498} {"train_loss": -28.007543563842773, "global_step": 622414, "epoch": 7498} {"train_loss": -27.44268226623535, "global_step": 622415, "epoch": 7498} {"train_loss": -27.88053850380771, "global_step": 622416, "epoch": 7498, "val_loss": 6584142.0} {"train_loss": -27.521326065063477, "global_step": 622417, "epoch": 7499} {"train_loss": -27.154706954956055, "global_step": 622418, "epoch": 7499} {"train_loss": -27.415552139282227, "global_step": 622419, "epoch": 7499} {"train_loss": -27.28952407836914, "global_step": 622420, "epoch": 7499} {"train_loss": -27.163715362548828, "global_step": 622421, "epoch": 7499} {"train_loss": -27.448806762695312, "global_step": 622422, "epoch": 7499} {"train_loss": -27.24909782409668, "global_step": 622423, "epoch": 7499} {"train_loss": -27.847864151000977, "global_step": 622424, "epoch": 7499} {"train_loss": -27.4766788482666, "global_step": 622425, "epoch": 7499} {"train_loss": -27.964359283447266, "global_step": 622426, "epoch": 7499} {"train_loss": -27.620803833007812, "global_step": 622427, "epoch": 7499} {"train_loss": -27.76568031311035, "global_step": 622428, "epoch": 7499} {"train_loss": -27.814538955688477, "global_step": 622429, "epoch": 7499} {"train_loss": -27.323217391967773, "global_step": 622430, "epoch": 7499} {"train_loss": -28.154312133789062, "global_step": 622431, "epoch": 7499} {"train_loss": -27.51605796813965, "global_step": 622432, "epoch": 7499} {"train_loss": -28.04513931274414, "global_step": 622433, "epoch": 7499} {"train_loss": -27.77227783203125, "global_step": 622434, "epoch": 7499} {"train_loss": -27.596832275390625, "global_step": 622435, "epoch": 7499} {"train_loss": -27.74860191345215, "global_step": 622436, "epoch": 7499} {"train_loss": -28.069990158081055, "global_step": 622437, "epoch": 7499} {"train_loss": -27.74420166015625, "global_step": 622438, "epoch": 7499} {"train_loss": -27.47100257873535, "global_step": 622439, "epoch": 7499} {"train_loss": -27.958654403686523, "global_step": 622440, "epoch": 7499} {"train_loss": -28.1484375, "global_step": 622441, "epoch": 7499} {"train_loss": -28.096521377563477, "global_step": 622442, "epoch": 7499} {"train_loss": -28.199512481689453, "global_step": 622443, "epoch": 7499} {"train_loss": -28.42499351501465, "global_step": 622444, "epoch": 7499} {"train_loss": -28.26584243774414, "global_step": 622445, "epoch": 7499} {"train_loss": -28.16217613220215, "global_step": 622446, "epoch": 7499} {"train_loss": -27.984479904174805, "global_step": 622447, "epoch": 7499} {"train_loss": -28.036884307861328, "global_step": 622448, "epoch": 7499} {"train_loss": -28.2351131439209, "global_step": 622449, "epoch": 7499} {"train_loss": -28.16376304626465, "global_step": 622450, "epoch": 7499} {"train_loss": -28.112829208374023, "global_step": 622451, "epoch": 7499} {"train_loss": -27.908233642578125, "global_step": 622452, "epoch": 7499} {"train_loss": -28.268537521362305, "global_step": 622453, "epoch": 7499} {"train_loss": -28.48349952697754, "global_step": 622454, "epoch": 7499} {"train_loss": -28.209808349609375, "global_step": 622455, "epoch": 7499} {"train_loss": -28.15850257873535, "global_step": 622456, "epoch": 7499} {"train_loss": -28.516469955444336, "global_step": 622457, "epoch": 7499} {"train_loss": -28.115015029907227, "global_step": 622458, "epoch": 7499} {"train_loss": -28.42823600769043, "global_step": 622459, "epoch": 7499} {"train_loss": -28.327863693237305, "global_step": 622460, "epoch": 7499} {"train_loss": -28.469755172729492, "global_step": 622461, "epoch": 7499} {"train_loss": -28.47566032409668, "global_step": 622462, "epoch": 7499} {"train_loss": -28.232919692993164, "global_step": 622463, "epoch": 7499} {"train_loss": -28.411365509033203, "global_step": 622464, "epoch": 7499} {"train_loss": -27.97901725769043, "global_step": 622465, "epoch": 7499} {"train_loss": -28.300003051757812, "global_step": 622466, "epoch": 7499} {"train_loss": -28.536222457885742, "global_step": 622467, "epoch": 7499} {"train_loss": -28.165912628173828, "global_step": 622468, "epoch": 7499} {"train_loss": -28.059635162353516, "global_step": 622469, "epoch": 7499} {"train_loss": -28.144689559936523, "global_step": 622470, "epoch": 7499} {"train_loss": -28.280242919921875, "global_step": 622471, "epoch": 7499} {"train_loss": -28.356748580932617, "global_step": 622472, "epoch": 7499} {"train_loss": -28.26694679260254, "global_step": 622473, "epoch": 7499} {"train_loss": -28.11480140686035, "global_step": 622474, "epoch": 7499} {"train_loss": -27.999271392822266, "global_step": 622475, "epoch": 7499} {"train_loss": -27.8912353515625, "global_step": 622476, "epoch": 7499} {"train_loss": -27.955472946166992, "global_step": 622477, "epoch": 7499} {"train_loss": -28.0666561126709, "global_step": 622478, "epoch": 7499} {"train_loss": -28.26974868774414, "global_step": 622479, "epoch": 7499} {"train_loss": -28.014163970947266, "global_step": 622480, "epoch": 7499} {"train_loss": -28.24762535095215, "global_step": 622481, "epoch": 7499} {"train_loss": -28.203229904174805, "global_step": 622482, "epoch": 7499} {"train_loss": -27.795276641845703, "global_step": 622483, "epoch": 7499} {"train_loss": -28.113895416259766, "global_step": 622484, "epoch": 7499} {"train_loss": -27.667627334594727, "global_step": 622485, "epoch": 7499} {"train_loss": -28.271289825439453, "global_step": 622486, "epoch": 7499} {"train_loss": -27.627500534057617, "global_step": 622487, "epoch": 7499} {"train_loss": -27.735427856445312, "global_step": 622488, "epoch": 7499} {"train_loss": -27.643972396850586, "global_step": 622489, "epoch": 7499} {"train_loss": -27.64753532409668, "global_step": 622490, "epoch": 7499} {"train_loss": -28.235107421875, "global_step": 622491, "epoch": 7499} {"train_loss": -28.15203857421875, "global_step": 622492, "epoch": 7499} {"train_loss": -28.314701080322266, "global_step": 622493, "epoch": 7499} {"train_loss": -27.855560302734375, "global_step": 622494, "epoch": 7499} {"train_loss": -28.218679428100586, "global_step": 622495, "epoch": 7499} {"train_loss": -28.53998374938965, "global_step": 622496, "epoch": 7499} {"train_loss": -27.9318904876709, "global_step": 622497, "epoch": 7499} {"train_loss": -27.987783432006836, "global_step": 622498, "epoch": 7499} {"train_loss": -27.994175026215704, "global_step": 622499, "epoch": 7499, "val_loss": 6611791.5} {"train_loss": -28.414121627807617, "global_step": 622500, "epoch": 7500} {"train_loss": -27.275421142578125, "global_step": 622501, "epoch": 7500} {"train_loss": -27.581146240234375, "global_step": 622502, "epoch": 7500} {"train_loss": -28.00685691833496, "global_step": 622503, "epoch": 7500} {"train_loss": -27.938169479370117, "global_step": 622504, "epoch": 7500} {"train_loss": -27.5716609954834, "global_step": 622505, "epoch": 7500} {"train_loss": -27.501693725585938, "global_step": 622506, "epoch": 7500} {"train_loss": -28.170501708984375, "global_step": 622507, "epoch": 7500} {"train_loss": -27.520526885986328, "global_step": 622508, "epoch": 7500} {"train_loss": -27.81328773498535, "global_step": 622509, "epoch": 7500} {"train_loss": -28.36060905456543, "global_step": 622510, "epoch": 7500} {"train_loss": -28.14174461364746, "global_step": 622511, "epoch": 7500} {"train_loss": -28.44875144958496, "global_step": 622512, "epoch": 7500} {"train_loss": -27.962472915649414, "global_step": 622513, "epoch": 7500} {"train_loss": -27.73207664489746, "global_step": 622514, "epoch": 7500} {"train_loss": -28.04225730895996, "global_step": 622515, "epoch": 7500} {"train_loss": -28.064167022705078, "global_step": 622516, "epoch": 7500} {"train_loss": -28.337554931640625, "global_step": 622517, "epoch": 7500} {"train_loss": -28.0709171295166, "global_step": 622518, "epoch": 7500} {"train_loss": -28.227075576782227, "global_step": 622519, "epoch": 7500} {"train_loss": -28.058313369750977, "global_step": 622520, "epoch": 7500} {"train_loss": -28.15895652770996, "global_step": 622521, "epoch": 7500} {"train_loss": -28.106021881103516, "global_step": 622522, "epoch": 7500} {"train_loss": -28.460424423217773, "global_step": 622523, "epoch": 7500} {"train_loss": -28.285938262939453, "global_step": 622524, "epoch": 7500} {"train_loss": -28.061857223510742, "global_step": 622525, "epoch": 7500} {"train_loss": -27.92323112487793, "global_step": 622526, "epoch": 7500} {"train_loss": -28.064157485961914, "global_step": 622527, "epoch": 7500} {"train_loss": -28.208749771118164, "global_step": 622528, "epoch": 7500} {"train_loss": -28.250192642211914, "global_step": 622529, "epoch": 7500} {"train_loss": -28.00235939025879, "global_step": 622530, "epoch": 7500} {"train_loss": -27.887983322143555, "global_step": 622531, "epoch": 7500} {"train_loss": -28.223785400390625, "global_step": 622532, "epoch": 7500} {"train_loss": -28.087604522705078, "global_step": 622533, "epoch": 7500} {"train_loss": -27.96530532836914, "global_step": 622534, "epoch": 7500} {"train_loss": -28.287702560424805, "global_step": 622535, "epoch": 7500} {"train_loss": -28.069059371948242, "global_step": 622536, "epoch": 7500} {"train_loss": -27.864582061767578, "global_step": 622537, "epoch": 7500} {"train_loss": -28.246240615844727, "global_step": 622538, "epoch": 7500} {"train_loss": -28.160192489624023, "global_step": 622539, "epoch": 7500} {"train_loss": -28.50922966003418, "global_step": 622540, "epoch": 7500} {"train_loss": -28.52349853515625, "global_step": 622541, "epoch": 7500} {"train_loss": -28.273279190063477, "global_step": 622542, "epoch": 7500} {"train_loss": -28.664499282836914, "global_step": 622543, "epoch": 7500} {"train_loss": -28.091114044189453, "global_step": 622544, "epoch": 7500} {"train_loss": -28.213037490844727, "global_step": 622545, "epoch": 7500} {"train_loss": -28.27101707458496, "global_step": 622546, "epoch": 7500} {"train_loss": -28.371952056884766, "global_step": 622547, "epoch": 7500} {"train_loss": -28.3626766204834, "global_step": 622548, "epoch": 7500} {"train_loss": -28.12735939025879, "global_step": 622549, "epoch": 7500} {"train_loss": -28.058380126953125, "global_step": 622550, "epoch": 7500} {"train_loss": -28.6954345703125, "global_step": 622551, "epoch": 7500} {"train_loss": -28.245847702026367, "global_step": 622552, "epoch": 7500} {"train_loss": -28.611047744750977, "global_step": 622553, "epoch": 7500} {"train_loss": -28.42048454284668, "global_step": 622554, "epoch": 7500} {"train_loss": -27.986364364624023, "global_step": 622555, "epoch": 7500} {"train_loss": -28.11677360534668, "global_step": 622556, "epoch": 7500} {"train_loss": -28.185754776000977, "global_step": 622557, "epoch": 7500} {"train_loss": -27.93535804748535, "global_step": 622558, "epoch": 7500} {"train_loss": -28.2025146484375, "global_step": 622559, "epoch": 7500} {"train_loss": -27.706451416015625, "global_step": 622560, "epoch": 7500} {"train_loss": -27.56537437438965, "global_step": 622561, "epoch": 7500} {"train_loss": -27.762603759765625, "global_step": 622562, "epoch": 7500} {"train_loss": -27.692855834960938, "global_step": 622563, "epoch": 7500} {"train_loss": -27.76251220703125, "global_step": 622564, "epoch": 7500} {"train_loss": -28.073627471923828, "global_step": 622565, "epoch": 7500} {"train_loss": -28.25483512878418, "global_step": 622566, "epoch": 7500} {"train_loss": -27.757343292236328, "global_step": 622567, "epoch": 7500} {"train_loss": -28.09223747253418, "global_step": 622568, "epoch": 7500} {"train_loss": -27.881622314453125, "global_step": 622569, "epoch": 7500} {"train_loss": -28.296377182006836, "global_step": 622570, "epoch": 7500} {"train_loss": -28.318445205688477, "global_step": 622571, "epoch": 7500} {"train_loss": -27.715864181518555, "global_step": 622572, "epoch": 7500} {"train_loss": -28.163877487182617, "global_step": 622573, "epoch": 7500} {"train_loss": -28.347227096557617, "global_step": 622574, "epoch": 7500} {"train_loss": -28.071569442749023, "global_step": 622575, "epoch": 7500} {"train_loss": -27.7301025390625, "global_step": 622576, "epoch": 7500} {"train_loss": -28.01226234436035, "global_step": 622577, "epoch": 7500} {"train_loss": -28.308027267456055, "global_step": 622578, "epoch": 7500} {"train_loss": -27.982526779174805, "global_step": 622579, "epoch": 7500} {"train_loss": -28.1875, "global_step": 622580, "epoch": 7500} {"train_loss": -27.936819076538086, "global_step": 622581, "epoch": 7500} {"train_loss": -28.089178292148084, "global_step": 622582, "epoch": 7500, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6789139.5} {"train_loss": -27.63628578186035, "global_step": 622583, "epoch": 7501} {"train_loss": -26.762914657592773, "global_step": 622584, "epoch": 7501} {"train_loss": -27.5429744720459, "global_step": 622585, "epoch": 7501} {"train_loss": -27.80258560180664, "global_step": 622586, "epoch": 7501} {"train_loss": -27.373029708862305, "global_step": 622587, "epoch": 7501} {"train_loss": -27.952905654907227, "global_step": 622588, "epoch": 7501} {"train_loss": -27.314477920532227, "global_step": 622589, "epoch": 7501} {"train_loss": -27.80194091796875, "global_step": 622590, "epoch": 7501} {"train_loss": -27.619873046875, "global_step": 622591, "epoch": 7501} {"train_loss": -26.909154891967773, "global_step": 622592, "epoch": 7501} {"train_loss": -27.71205711364746, "global_step": 622593, "epoch": 7501} {"train_loss": -27.528472900390625, "global_step": 622594, "epoch": 7501} {"train_loss": -27.71078872680664, "global_step": 622595, "epoch": 7501} {"train_loss": -27.8980712890625, "global_step": 622596, "epoch": 7501} {"train_loss": -27.541000366210938, "global_step": 622597, "epoch": 7501} {"train_loss": -27.940570831298828, "global_step": 622598, "epoch": 7501} {"train_loss": -28.104785919189453, "global_step": 622599, "epoch": 7501} {"train_loss": -27.620878219604492, "global_step": 622600, "epoch": 7501} {"train_loss": -27.6584529876709, "global_step": 622601, "epoch": 7501} {"train_loss": -27.718505859375, "global_step": 622602, "epoch": 7501} {"train_loss": -28.235736846923828, "global_step": 622603, "epoch": 7501} {"train_loss": -27.648696899414062, "global_step": 622604, "epoch": 7501} {"train_loss": -27.783111572265625, "global_step": 622605, "epoch": 7501} {"train_loss": -28.18259048461914, "global_step": 622606, "epoch": 7501} {"train_loss": -28.10157585144043, "global_step": 622607, "epoch": 7501} {"train_loss": -28.06512451171875, "global_step": 622608, "epoch": 7501} {"train_loss": -28.120777130126953, "global_step": 622609, "epoch": 7501} {"train_loss": -28.08794593811035, "global_step": 622610, "epoch": 7501} {"train_loss": -28.158899307250977, "global_step": 622611, "epoch": 7501} {"train_loss": -28.251081466674805, "global_step": 622612, "epoch": 7501} {"train_loss": -28.233423233032227, "global_step": 622613, "epoch": 7501} {"train_loss": -28.027759552001953, "global_step": 622614, "epoch": 7501} {"train_loss": -28.233753204345703, "global_step": 622615, "epoch": 7501} {"train_loss": -28.158262252807617, "global_step": 622616, "epoch": 7501} {"train_loss": -27.973770141601562, "global_step": 622617, "epoch": 7501} {"train_loss": -28.362380981445312, "global_step": 622618, "epoch": 7501} {"train_loss": -28.31598472595215, "global_step": 622619, "epoch": 7501} {"train_loss": -27.929529190063477, "global_step": 622620, "epoch": 7501} {"train_loss": -28.02786636352539, "global_step": 622621, "epoch": 7501} {"train_loss": -28.078369140625, "global_step": 622622, "epoch": 7501} {"train_loss": -28.244861602783203, "global_step": 622623, "epoch": 7501} {"train_loss": -28.422353744506836, "global_step": 622624, "epoch": 7501} {"train_loss": -28.410430908203125, "global_step": 622625, "epoch": 7501} {"train_loss": -27.99941062927246, "global_step": 622626, "epoch": 7501} {"train_loss": -28.543787002563477, "global_step": 622627, "epoch": 7501} {"train_loss": -28.321624755859375, "global_step": 622628, "epoch": 7501} {"train_loss": -28.309980392456055, "global_step": 622629, "epoch": 7501} {"train_loss": -28.34809684753418, "global_step": 622630, "epoch": 7501} {"train_loss": -28.421619415283203, "global_step": 622631, "epoch": 7501} {"train_loss": -28.240222930908203, "global_step": 622632, "epoch": 7501} {"train_loss": -27.915307998657227, "global_step": 622633, "epoch": 7501} {"train_loss": -28.21844482421875, "global_step": 622634, "epoch": 7501} {"train_loss": -28.521286010742188, "global_step": 622635, "epoch": 7501} {"train_loss": -28.07279396057129, "global_step": 622636, "epoch": 7501} {"train_loss": -27.83503532409668, "global_step": 622637, "epoch": 7501} {"train_loss": -27.841510772705078, "global_step": 622638, "epoch": 7501} {"train_loss": -28.507532119750977, "global_step": 622639, "epoch": 7501} {"train_loss": -28.35346031188965, "global_step": 622640, "epoch": 7501} {"train_loss": -27.89130210876465, "global_step": 622641, "epoch": 7501} {"train_loss": -28.1844482421875, "global_step": 622642, "epoch": 7501} {"train_loss": -27.75472068786621, "global_step": 622643, "epoch": 7501} {"train_loss": -28.01068687438965, "global_step": 622644, "epoch": 7501} {"train_loss": -28.058456420898438, "global_step": 622645, "epoch": 7501} {"train_loss": -27.845266342163086, "global_step": 622646, "epoch": 7501} {"train_loss": -28.461957931518555, "global_step": 622647, "epoch": 7501} {"train_loss": -27.897165298461914, "global_step": 622648, "epoch": 7501} {"train_loss": -28.33222007751465, "global_step": 622649, "epoch": 7501} {"train_loss": -28.19716453552246, "global_step": 622650, "epoch": 7501} {"train_loss": -27.7873592376709, "global_step": 622651, "epoch": 7501} {"train_loss": -28.037734985351562, "global_step": 622652, "epoch": 7501} {"train_loss": -27.794214248657227, "global_step": 622653, "epoch": 7501} {"train_loss": -28.16963005065918, "global_step": 622654, "epoch": 7501} {"train_loss": -27.99774742126465, "global_step": 622655, "epoch": 7501} {"train_loss": -28.714136123657227, "global_step": 622656, "epoch": 7501} {"train_loss": -27.91579246520996, "global_step": 622657, "epoch": 7501} {"train_loss": -27.597278594970703, "global_step": 622658, "epoch": 7501} {"train_loss": -27.85085105895996, "global_step": 622659, "epoch": 7501} {"train_loss": -27.86297035217285, "global_step": 622660, "epoch": 7501} {"train_loss": -28.02654457092285, "global_step": 622661, "epoch": 7501} {"train_loss": -27.979816436767578, "global_step": 622662, "epoch": 7501} {"train_loss": -27.365896224975586, "global_step": 622663, "epoch": 7501} {"train_loss": -27.9971866607666, "global_step": 622664, "epoch": 7501} {"train_loss": -27.975473312010248, "global_step": 622665, "epoch": 7501, "val_loss": 6796277.0} {"train_loss": -25.5238094329834, "global_step": 622666, "epoch": 7502} {"train_loss": -26.47389793395996, "global_step": 622667, "epoch": 7502} {"train_loss": -27.393707275390625, "global_step": 622668, "epoch": 7502} {"train_loss": -25.972537994384766, "global_step": 622669, "epoch": 7502} {"train_loss": -27.674253463745117, "global_step": 622670, "epoch": 7502} {"train_loss": -26.814014434814453, "global_step": 622671, "epoch": 7502} {"train_loss": -27.74505043029785, "global_step": 622672, "epoch": 7502} {"train_loss": -27.444171905517578, "global_step": 622673, "epoch": 7502} {"train_loss": -27.398847579956055, "global_step": 622674, "epoch": 7502} {"train_loss": -27.705244064331055, "global_step": 622675, "epoch": 7502} {"train_loss": -27.690465927124023, "global_step": 622676, "epoch": 7502} {"train_loss": -27.40572166442871, "global_step": 622677, "epoch": 7502} {"train_loss": -28.118579864501953, "global_step": 622678, "epoch": 7502} {"train_loss": -27.6448917388916, "global_step": 622679, "epoch": 7502} {"train_loss": -27.807523727416992, "global_step": 622680, "epoch": 7502} {"train_loss": -27.8105411529541, "global_step": 622681, "epoch": 7502} {"train_loss": -27.958438873291016, "global_step": 622682, "epoch": 7502} {"train_loss": -27.574071884155273, "global_step": 622683, "epoch": 7502} {"train_loss": -27.768468856811523, "global_step": 622684, "epoch": 7502} {"train_loss": -27.37640380859375, "global_step": 622685, "epoch": 7502} {"train_loss": -27.741796493530273, "global_step": 622686, "epoch": 7502} {"train_loss": -27.9145565032959, "global_step": 622687, "epoch": 7502} {"train_loss": -27.6210880279541, "global_step": 622688, "epoch": 7502} {"train_loss": -27.96473503112793, "global_step": 622689, "epoch": 7502} {"train_loss": -27.774023056030273, "global_step": 622690, "epoch": 7502} {"train_loss": -28.033796310424805, "global_step": 622691, "epoch": 7502} {"train_loss": -27.771759033203125, "global_step": 622692, "epoch": 7502} {"train_loss": -28.138595581054688, "global_step": 622693, "epoch": 7502} {"train_loss": -27.781082153320312, "global_step": 622694, "epoch": 7502} {"train_loss": -28.241077423095703, "global_step": 622695, "epoch": 7502} {"train_loss": -28.08918571472168, "global_step": 622696, "epoch": 7502} {"train_loss": -27.93354606628418, "global_step": 622697, "epoch": 7502} {"train_loss": -28.114858627319336, "global_step": 622698, "epoch": 7502} {"train_loss": -28.085468292236328, "global_step": 622699, "epoch": 7502} {"train_loss": -27.847095489501953, "global_step": 622700, "epoch": 7502} {"train_loss": -28.20945167541504, "global_step": 622701, "epoch": 7502} {"train_loss": -28.128162384033203, "global_step": 622702, "epoch": 7502} {"train_loss": -27.76987648010254, "global_step": 622703, "epoch": 7502} {"train_loss": -27.6509952545166, "global_step": 622704, "epoch": 7502} {"train_loss": -28.35639762878418, "global_step": 622705, "epoch": 7502} {"train_loss": -28.4141902923584, "global_step": 622706, "epoch": 7502} {"train_loss": -27.91822624206543, "global_step": 622707, "epoch": 7502} {"train_loss": -27.969629287719727, "global_step": 622708, "epoch": 7502} {"train_loss": -28.189619064331055, "global_step": 622709, "epoch": 7502} {"train_loss": -28.274646759033203, "global_step": 622710, "epoch": 7502} {"train_loss": -28.155536651611328, "global_step": 622711, "epoch": 7502} {"train_loss": -28.232202529907227, "global_step": 622712, "epoch": 7502} {"train_loss": -28.337377548217773, "global_step": 622713, "epoch": 7502} {"train_loss": -28.55604362487793, "global_step": 622714, "epoch": 7502} {"train_loss": -28.4754581451416, "global_step": 622715, "epoch": 7502} {"train_loss": -28.011133193969727, "global_step": 622716, "epoch": 7502} {"train_loss": -28.67827796936035, "global_step": 622717, "epoch": 7502} {"train_loss": -28.277517318725586, "global_step": 622718, "epoch": 7502} {"train_loss": -28.137435913085938, "global_step": 622719, "epoch": 7502} {"train_loss": -27.977453231811523, "global_step": 622720, "epoch": 7502} {"train_loss": -28.173078536987305, "global_step": 622721, "epoch": 7502} {"train_loss": -28.339818954467773, "global_step": 622722, "epoch": 7502} {"train_loss": -28.119924545288086, "global_step": 622723, "epoch": 7502} {"train_loss": -28.11533546447754, "global_step": 622724, "epoch": 7502} {"train_loss": -28.13396644592285, "global_step": 622725, "epoch": 7502} {"train_loss": -27.754343032836914, "global_step": 622726, "epoch": 7502} {"train_loss": -28.245731353759766, "global_step": 622727, "epoch": 7502} {"train_loss": -28.15740966796875, "global_step": 622728, "epoch": 7502} {"train_loss": -28.133773803710938, "global_step": 622729, "epoch": 7502} {"train_loss": -28.190032958984375, "global_step": 622730, "epoch": 7502} {"train_loss": -28.171600341796875, "global_step": 622731, "epoch": 7502} {"train_loss": -28.229129791259766, "global_step": 622732, "epoch": 7502} {"train_loss": -28.454614639282227, "global_step": 622733, "epoch": 7502} {"train_loss": -28.231372833251953, "global_step": 622734, "epoch": 7502} {"train_loss": -27.755903244018555, "global_step": 622735, "epoch": 7502} {"train_loss": -28.391523361206055, "global_step": 622736, "epoch": 7502} {"train_loss": -28.23309898376465, "global_step": 622737, "epoch": 7502} {"train_loss": -28.012235641479492, "global_step": 622738, "epoch": 7502} {"train_loss": -28.515186309814453, "global_step": 622739, "epoch": 7502} {"train_loss": -27.98792839050293, "global_step": 622740, "epoch": 7502} {"train_loss": -28.10625648498535, "global_step": 622741, "epoch": 7502} {"train_loss": -28.61789894104004, "global_step": 622742, "epoch": 7502} {"train_loss": -28.0400333404541, "global_step": 622743, "epoch": 7502} {"train_loss": -28.312747955322266, "global_step": 622744, "epoch": 7502} {"train_loss": -28.110309600830078, "global_step": 622745, "epoch": 7502} {"train_loss": -28.2674617767334, "global_step": 622746, "epoch": 7502} {"train_loss": -27.770116806030273, "global_step": 622747, "epoch": 7502} {"train_loss": -27.93440726866205, "global_step": 622748, "epoch": 7502, "val_loss": 6810664.5} {"train_loss": -27.68255043029785, "global_step": 622749, "epoch": 7503} {"train_loss": -27.1639461517334, "global_step": 622750, "epoch": 7503} {"train_loss": -26.51824951171875, "global_step": 622751, "epoch": 7503} {"train_loss": -26.640796661376953, "global_step": 622752, "epoch": 7503} {"train_loss": -27.078805923461914, "global_step": 622753, "epoch": 7503} {"train_loss": -26.887739181518555, "global_step": 622754, "epoch": 7503} {"train_loss": -26.277286529541016, "global_step": 622755, "epoch": 7503} {"train_loss": -26.7791748046875, "global_step": 622756, "epoch": 7503} {"train_loss": -26.96341323852539, "global_step": 622757, "epoch": 7503} {"train_loss": -27.2525634765625, "global_step": 622758, "epoch": 7503} {"train_loss": -27.498815536499023, "global_step": 622759, "epoch": 7503} {"train_loss": -27.837543487548828, "global_step": 622760, "epoch": 7503} {"train_loss": -27.251968383789062, "global_step": 622761, "epoch": 7503} {"train_loss": -27.703832626342773, "global_step": 622762, "epoch": 7503} {"train_loss": -27.67254638671875, "global_step": 622763, "epoch": 7503} {"train_loss": -27.411884307861328, "global_step": 622764, "epoch": 7503} {"train_loss": -27.80560302734375, "global_step": 622765, "epoch": 7503} {"train_loss": -27.55096435546875, "global_step": 622766, "epoch": 7503} {"train_loss": -27.696863174438477, "global_step": 622767, "epoch": 7503} {"train_loss": -27.7755126953125, "global_step": 622768, "epoch": 7503} {"train_loss": -27.651123046875, "global_step": 622769, "epoch": 7503} {"train_loss": -27.828821182250977, "global_step": 622770, "epoch": 7503} {"train_loss": -28.410598754882812, "global_step": 622771, "epoch": 7503} {"train_loss": -27.24427604675293, "global_step": 622772, "epoch": 7503} {"train_loss": -27.898035049438477, "global_step": 622773, "epoch": 7503} {"train_loss": -27.817977905273438, "global_step": 622774, "epoch": 7503} {"train_loss": -28.083454132080078, "global_step": 622775, "epoch": 7503} {"train_loss": -27.8072509765625, "global_step": 622776, "epoch": 7503} {"train_loss": -27.996374130249023, "global_step": 622777, "epoch": 7503} {"train_loss": -27.876789093017578, "global_step": 622778, "epoch": 7503} {"train_loss": -27.65650749206543, "global_step": 622779, "epoch": 7503} {"train_loss": -27.881912231445312, "global_step": 622780, "epoch": 7503} {"train_loss": -27.92866325378418, "global_step": 622781, "epoch": 7503} {"train_loss": -28.081512451171875, "global_step": 622782, "epoch": 7503} {"train_loss": -28.024322509765625, "global_step": 622783, "epoch": 7503} {"train_loss": -28.084394454956055, "global_step": 622784, "epoch": 7503} {"train_loss": -28.278736114501953, "global_step": 622785, "epoch": 7503} {"train_loss": -27.9396915435791, "global_step": 622786, "epoch": 7503} {"train_loss": -28.050317764282227, "global_step": 622787, "epoch": 7503} {"train_loss": -28.22804832458496, "global_step": 622788, "epoch": 7503} {"train_loss": -28.232940673828125, "global_step": 622789, "epoch": 7503} {"train_loss": -27.920028686523438, "global_step": 622790, "epoch": 7503} {"train_loss": -28.03125, "global_step": 622791, "epoch": 7503} {"train_loss": -28.3324031829834, "global_step": 622792, "epoch": 7503} {"train_loss": -28.266870498657227, "global_step": 622793, "epoch": 7503} {"train_loss": -28.16936683654785, "global_step": 622794, "epoch": 7503} {"train_loss": -28.149641036987305, "global_step": 622795, "epoch": 7503} {"train_loss": -28.45246696472168, "global_step": 622796, "epoch": 7503} {"train_loss": -28.0111026763916, "global_step": 622797, "epoch": 7503} {"train_loss": -28.240232467651367, "global_step": 622798, "epoch": 7503} {"train_loss": -28.052051544189453, "global_step": 622799, "epoch": 7503} {"train_loss": -28.534259796142578, "global_step": 622800, "epoch": 7503} {"train_loss": -28.179828643798828, "global_step": 622801, "epoch": 7503} {"train_loss": -28.864755630493164, "global_step": 622802, "epoch": 7503} {"train_loss": -28.478437423706055, "global_step": 622803, "epoch": 7503} {"train_loss": -28.576950073242188, "global_step": 622804, "epoch": 7503} {"train_loss": -28.1991024017334, "global_step": 622805, "epoch": 7503} {"train_loss": -28.42142105102539, "global_step": 622806, "epoch": 7503} {"train_loss": -28.063440322875977, "global_step": 622807, "epoch": 7503} {"train_loss": -27.774389266967773, "global_step": 622808, "epoch": 7503} {"train_loss": -28.2742919921875, "global_step": 622809, "epoch": 7503} {"train_loss": -28.252445220947266, "global_step": 622810, "epoch": 7503} {"train_loss": -28.29182243347168, "global_step": 622811, "epoch": 7503} {"train_loss": -28.459335327148438, "global_step": 622812, "epoch": 7503} {"train_loss": -27.78732681274414, "global_step": 622813, "epoch": 7503} {"train_loss": -28.331298828125, "global_step": 622814, "epoch": 7503} {"train_loss": -28.015710830688477, "global_step": 622815, "epoch": 7503} {"train_loss": -28.75898551940918, "global_step": 622816, "epoch": 7503} {"train_loss": -28.500890731811523, "global_step": 622817, "epoch": 7503} {"train_loss": -28.036426544189453, "global_step": 622818, "epoch": 7503} {"train_loss": -28.2326602935791, "global_step": 622819, "epoch": 7503} {"train_loss": -27.873144149780273, "global_step": 622820, "epoch": 7503} {"train_loss": -28.181793212890625, "global_step": 622821, "epoch": 7503} {"train_loss": -28.42805290222168, "global_step": 622822, "epoch": 7503} {"train_loss": -28.113203048706055, "global_step": 622823, "epoch": 7503} {"train_loss": -28.038318634033203, "global_step": 622824, "epoch": 7503} {"train_loss": -28.39259147644043, "global_step": 622825, "epoch": 7503} {"train_loss": -28.326868057250977, "global_step": 622826, "epoch": 7503} {"train_loss": -28.46137809753418, "global_step": 622827, "epoch": 7503} {"train_loss": -28.543384552001953, "global_step": 622828, "epoch": 7503} {"train_loss": -28.68340492248535, "global_step": 622829, "epoch": 7503} {"train_loss": -28.546411514282227, "global_step": 622830, "epoch": 7503} {"train_loss": -27.957544579563372, "global_step": 622831, "epoch": 7503, "val_loss": 6781102.0} {"train_loss": -27.877038955688477, "global_step": 622832, "epoch": 7504} {"train_loss": -27.256311416625977, "global_step": 622833, "epoch": 7504} {"train_loss": -27.99859046936035, "global_step": 622834, "epoch": 7504} {"train_loss": -27.17230224609375, "global_step": 622835, "epoch": 7504} {"train_loss": -27.679492950439453, "global_step": 622836, "epoch": 7504} {"train_loss": -27.6044864654541, "global_step": 622837, "epoch": 7504} {"train_loss": -28.258085250854492, "global_step": 622838, "epoch": 7504} {"train_loss": -28.13953971862793, "global_step": 622839, "epoch": 7504} {"train_loss": -27.94467544555664, "global_step": 622840, "epoch": 7504} {"train_loss": -27.63750648498535, "global_step": 622841, "epoch": 7504} {"train_loss": -27.713642120361328, "global_step": 622842, "epoch": 7504} {"train_loss": -28.208454132080078, "global_step": 622843, "epoch": 7504} {"train_loss": -28.11366081237793, "global_step": 622844, "epoch": 7504} {"train_loss": -28.002832412719727, "global_step": 622845, "epoch": 7504} {"train_loss": -28.089279174804688, "global_step": 622846, "epoch": 7504} {"train_loss": -27.980121612548828, "global_step": 622847, "epoch": 7504} {"train_loss": -28.209930419921875, "global_step": 622848, "epoch": 7504} {"train_loss": -28.043432235717773, "global_step": 622849, "epoch": 7504} {"train_loss": -27.948522567749023, "global_step": 622850, "epoch": 7504} {"train_loss": -27.8687744140625, "global_step": 622851, "epoch": 7504} {"train_loss": -27.9404239654541, "global_step": 622852, "epoch": 7504} {"train_loss": -27.822315216064453, "global_step": 622853, "epoch": 7504} {"train_loss": -27.983551025390625, "global_step": 622854, "epoch": 7504} {"train_loss": -28.017822265625, "global_step": 622855, "epoch": 7504} {"train_loss": -28.46034049987793, "global_step": 622856, "epoch": 7504} {"train_loss": -28.397314071655273, "global_step": 622857, "epoch": 7504} {"train_loss": -27.915311813354492, "global_step": 622858, "epoch": 7504} {"train_loss": -28.20771598815918, "global_step": 622859, "epoch": 7504} {"train_loss": -28.129499435424805, "global_step": 622860, "epoch": 7504} {"train_loss": -28.095996856689453, "global_step": 622861, "epoch": 7504} {"train_loss": -27.861005783081055, "global_step": 622862, "epoch": 7504} {"train_loss": -28.11903953552246, "global_step": 622863, "epoch": 7504} {"train_loss": -27.860727310180664, "global_step": 622864, "epoch": 7504} {"train_loss": -27.852798461914062, "global_step": 622865, "epoch": 7504} {"train_loss": -28.123579025268555, "global_step": 622866, "epoch": 7504} {"train_loss": -28.421466827392578, "global_step": 622867, "epoch": 7504} {"train_loss": -28.20123291015625, "global_step": 622868, "epoch": 7504} {"train_loss": -28.25335121154785, "global_step": 622869, "epoch": 7504} {"train_loss": -28.600732803344727, "global_step": 622870, "epoch": 7504} {"train_loss": -28.167984008789062, "global_step": 622871, "epoch": 7504} {"train_loss": -28.126998901367188, "global_step": 622872, "epoch": 7504} {"train_loss": -28.299726486206055, "global_step": 622873, "epoch": 7504} {"train_loss": -28.174427032470703, "global_step": 622874, "epoch": 7504} {"train_loss": -28.43963623046875, "global_step": 622875, "epoch": 7504} {"train_loss": -28.27500343322754, "global_step": 622876, "epoch": 7504} {"train_loss": -28.453344345092773, "global_step": 622877, "epoch": 7504} {"train_loss": -28.187307357788086, "global_step": 622878, "epoch": 7504} {"train_loss": -28.352521896362305, "global_step": 622879, "epoch": 7504} {"train_loss": -28.264114379882812, "global_step": 622880, "epoch": 7504} {"train_loss": -28.08819007873535, "global_step": 622881, "epoch": 7504} {"train_loss": -28.097854614257812, "global_step": 622882, "epoch": 7504} {"train_loss": -28.398406982421875, "global_step": 622883, "epoch": 7504} {"train_loss": -28.060882568359375, "global_step": 622884, "epoch": 7504} {"train_loss": -28.52821159362793, "global_step": 622885, "epoch": 7504} {"train_loss": -28.5225772857666, "global_step": 622886, "epoch": 7504} {"train_loss": -28.386337280273438, "global_step": 622887, "epoch": 7504} {"train_loss": -28.263076782226562, "global_step": 622888, "epoch": 7504} {"train_loss": -28.084869384765625, "global_step": 622889, "epoch": 7504} {"train_loss": -28.25782585144043, "global_step": 622890, "epoch": 7504} {"train_loss": -28.51576805114746, "global_step": 622891, "epoch": 7504} {"train_loss": -28.066736221313477, "global_step": 622892, "epoch": 7504} {"train_loss": -28.272979736328125, "global_step": 622893, "epoch": 7504} {"train_loss": -28.075071334838867, "global_step": 622894, "epoch": 7504} {"train_loss": -28.100982666015625, "global_step": 622895, "epoch": 7504} {"train_loss": -28.656641006469727, "global_step": 622896, "epoch": 7504} {"train_loss": -27.916452407836914, "global_step": 622897, "epoch": 7504} {"train_loss": -28.146398544311523, "global_step": 622898, "epoch": 7504} {"train_loss": -27.822280883789062, "global_step": 622899, "epoch": 7504} {"train_loss": -28.03041648864746, "global_step": 622900, "epoch": 7504} {"train_loss": -28.22027587890625, "global_step": 622901, "epoch": 7504} {"train_loss": -28.44211769104004, "global_step": 622902, "epoch": 7504} {"train_loss": -28.240629196166992, "global_step": 622903, "epoch": 7504} {"train_loss": -28.32356071472168, "global_step": 622904, "epoch": 7504} {"train_loss": -28.265798568725586, "global_step": 622905, "epoch": 7504} {"train_loss": -28.290754318237305, "global_step": 622906, "epoch": 7504} {"train_loss": -27.989301681518555, "global_step": 622907, "epoch": 7504} {"train_loss": -28.10626220703125, "global_step": 622908, "epoch": 7504} {"train_loss": -28.008682250976562, "global_step": 622909, "epoch": 7504} {"train_loss": -28.039453506469727, "global_step": 622910, "epoch": 7504} {"train_loss": -27.684173583984375, "global_step": 622911, "epoch": 7504} {"train_loss": -27.924482345581055, "global_step": 622912, "epoch": 7504} {"train_loss": -26.94411277770996, "global_step": 622913, "epoch": 7504} {"train_loss": -28.090100805443452, "global_step": 622914, "epoch": 7504, "val_loss": 6878657.5} {"train_loss": -27.691373825073242, "global_step": 622915, "epoch": 7505} {"train_loss": -26.18259048461914, "global_step": 622916, "epoch": 7505} {"train_loss": -26.839929580688477, "global_step": 622917, "epoch": 7505} {"train_loss": -27.192138671875, "global_step": 622918, "epoch": 7505} {"train_loss": -26.884510040283203, "global_step": 622919, "epoch": 7505} {"train_loss": -27.114465713500977, "global_step": 622920, "epoch": 7505} {"train_loss": -26.5085506439209, "global_step": 622921, "epoch": 7505} {"train_loss": -27.083715438842773, "global_step": 622922, "epoch": 7505} {"train_loss": -27.063764572143555, "global_step": 622923, "epoch": 7505} {"train_loss": -27.281408309936523, "global_step": 622924, "epoch": 7505} {"train_loss": -27.35516929626465, "global_step": 622925, "epoch": 7505} {"train_loss": -27.3823299407959, "global_step": 622926, "epoch": 7505} {"train_loss": -27.365966796875, "global_step": 622927, "epoch": 7505} {"train_loss": -27.26344108581543, "global_step": 622928, "epoch": 7505} {"train_loss": -27.833560943603516, "global_step": 622929, "epoch": 7505} {"train_loss": -27.532194137573242, "global_step": 622930, "epoch": 7505} {"train_loss": -27.634220123291016, "global_step": 622931, "epoch": 7505} {"train_loss": -27.76019287109375, "global_step": 622932, "epoch": 7505} {"train_loss": -27.354385375976562, "global_step": 622933, "epoch": 7505} {"train_loss": -27.49222755432129, "global_step": 622934, "epoch": 7505} {"train_loss": -27.8160457611084, "global_step": 622935, "epoch": 7505} {"train_loss": -28.003164291381836, "global_step": 622936, "epoch": 7505} {"train_loss": -28.08937644958496, "global_step": 622937, "epoch": 7505} {"train_loss": -27.95611572265625, "global_step": 622938, "epoch": 7505} {"train_loss": -27.749597549438477, "global_step": 622939, "epoch": 7505} {"train_loss": -27.696292877197266, "global_step": 622940, "epoch": 7505} {"train_loss": -27.717849731445312, "global_step": 622941, "epoch": 7505} {"train_loss": -27.90496826171875, "global_step": 622942, "epoch": 7505} {"train_loss": -27.71034812927246, "global_step": 622943, "epoch": 7505} {"train_loss": -27.891036987304688, "global_step": 622944, "epoch": 7505} {"train_loss": -27.730920791625977, "global_step": 622945, "epoch": 7505} {"train_loss": -27.969635009765625, "global_step": 622946, "epoch": 7505} {"train_loss": -27.843076705932617, "global_step": 622947, "epoch": 7505} {"train_loss": -28.019306182861328, "global_step": 622948, "epoch": 7505} {"train_loss": -28.37129020690918, "global_step": 622949, "epoch": 7505} {"train_loss": -28.132394790649414, "global_step": 622950, "epoch": 7505} {"train_loss": -28.220487594604492, "global_step": 622951, "epoch": 7505} {"train_loss": -28.073530197143555, "global_step": 622952, "epoch": 7505} {"train_loss": -28.044055938720703, "global_step": 622953, "epoch": 7505} {"train_loss": -28.409887313842773, "global_step": 622954, "epoch": 7505} {"train_loss": -28.376707077026367, "global_step": 622955, "epoch": 7505} {"train_loss": -28.189620971679688, "global_step": 622956, "epoch": 7505} {"train_loss": -28.182392120361328, "global_step": 622957, "epoch": 7505} {"train_loss": -28.075653076171875, "global_step": 622958, "epoch": 7505} {"train_loss": -28.395465850830078, "global_step": 622959, "epoch": 7505} {"train_loss": -28.13368797302246, "global_step": 622960, "epoch": 7505} {"train_loss": -28.387903213500977, "global_step": 622961, "epoch": 7505} {"train_loss": -28.18377113342285, "global_step": 622962, "epoch": 7505} {"train_loss": -28.018835067749023, "global_step": 622963, "epoch": 7505} {"train_loss": -28.495954513549805, "global_step": 622964, "epoch": 7505} {"train_loss": -28.055572509765625, "global_step": 622965, "epoch": 7505} {"train_loss": -28.377731323242188, "global_step": 622966, "epoch": 7505} {"train_loss": -28.065658569335938, "global_step": 622967, "epoch": 7505} {"train_loss": -28.562829971313477, "global_step": 622968, "epoch": 7505} {"train_loss": -28.321399688720703, "global_step": 622969, "epoch": 7505} {"train_loss": -28.421939849853516, "global_step": 622970, "epoch": 7505} {"train_loss": -28.055265426635742, "global_step": 622971, "epoch": 7505} {"train_loss": -27.861465454101562, "global_step": 622972, "epoch": 7505} {"train_loss": -27.82831382751465, "global_step": 622973, "epoch": 7505} {"train_loss": -28.303455352783203, "global_step": 622974, "epoch": 7505} {"train_loss": -28.431293487548828, "global_step": 622975, "epoch": 7505} {"train_loss": -28.319244384765625, "global_step": 622976, "epoch": 7505} {"train_loss": -27.767805099487305, "global_step": 622977, "epoch": 7505} {"train_loss": -28.245466232299805, "global_step": 622978, "epoch": 7505} {"train_loss": -27.953474044799805, "global_step": 622979, "epoch": 7505} {"train_loss": -27.989013671875, "global_step": 622980, "epoch": 7505} {"train_loss": -28.155197143554688, "global_step": 622981, "epoch": 7505} {"train_loss": -28.50006103515625, "global_step": 622982, "epoch": 7505} {"train_loss": -28.503564834594727, "global_step": 622983, "epoch": 7505} {"train_loss": -28.28876304626465, "global_step": 622984, "epoch": 7505} {"train_loss": -27.994009017944336, "global_step": 622985, "epoch": 7505} {"train_loss": -28.491079330444336, "global_step": 622986, "epoch": 7505} {"train_loss": -28.38687515258789, "global_step": 622987, "epoch": 7505} {"train_loss": -27.95252799987793, "global_step": 622988, "epoch": 7505} {"train_loss": -28.33896827697754, "global_step": 622989, "epoch": 7505} {"train_loss": -27.947574615478516, "global_step": 622990, "epoch": 7505} {"train_loss": -28.019550323486328, "global_step": 622991, "epoch": 7505} {"train_loss": -28.116743087768555, "global_step": 622992, "epoch": 7505} {"train_loss": -27.634252548217773, "global_step": 622993, "epoch": 7505} {"train_loss": -28.09397315979004, "global_step": 622994, "epoch": 7505} {"train_loss": -28.030364990234375, "global_step": 622995, "epoch": 7505} {"train_loss": -28.4930419921875, "global_step": 622996, "epoch": 7505} {"train_loss": -27.920969491981598, "global_step": 622997, "epoch": 7505, "val_loss": 6813275.0} {"train_loss": -26.23891258239746, "global_step": 622998, "epoch": 7506} {"train_loss": -25.99881935119629, "global_step": 622999, "epoch": 7506} {"train_loss": -26.02546501159668, "global_step": 623000, "epoch": 7506} {"train_loss": -26.7911376953125, "global_step": 623001, "epoch": 7506} {"train_loss": -26.23982810974121, "global_step": 623002, "epoch": 7506} {"train_loss": -26.62617301940918, "global_step": 623003, "epoch": 7506} {"train_loss": -26.932514190673828, "global_step": 623004, "epoch": 7506} {"train_loss": -26.602588653564453, "global_step": 623005, "epoch": 7506} {"train_loss": -26.961658477783203, "global_step": 623006, "epoch": 7506} {"train_loss": -26.874847412109375, "global_step": 623007, "epoch": 7506} {"train_loss": -27.4469051361084, "global_step": 623008, "epoch": 7506} {"train_loss": -27.33251953125, "global_step": 623009, "epoch": 7506} {"train_loss": -27.031824111938477, "global_step": 623010, "epoch": 7506} {"train_loss": -27.19550895690918, "global_step": 623011, "epoch": 7506} {"train_loss": -27.557043075561523, "global_step": 623012, "epoch": 7506} {"train_loss": -27.242080688476562, "global_step": 623013, "epoch": 7506} {"train_loss": -27.519855499267578, "global_step": 623014, "epoch": 7506} {"train_loss": -27.396726608276367, "global_step": 623015, "epoch": 7506} {"train_loss": -27.034589767456055, "global_step": 623016, "epoch": 7506} {"train_loss": -27.613229751586914, "global_step": 623017, "epoch": 7506} {"train_loss": -27.60334587097168, "global_step": 623018, "epoch": 7506} {"train_loss": -27.21156120300293, "global_step": 623019, "epoch": 7506} {"train_loss": -27.47529411315918, "global_step": 623020, "epoch": 7506} {"train_loss": -27.748193740844727, "global_step": 623021, "epoch": 7506} {"train_loss": -27.404956817626953, "global_step": 623022, "epoch": 7506} {"train_loss": -27.695531845092773, "global_step": 623023, "epoch": 7506} {"train_loss": -28.017608642578125, "global_step": 623024, "epoch": 7506} {"train_loss": -27.9016056060791, "global_step": 623025, "epoch": 7506} {"train_loss": -27.873987197875977, "global_step": 623026, "epoch": 7506} {"train_loss": -27.949146270751953, "global_step": 623027, "epoch": 7506} {"train_loss": -27.750452041625977, "global_step": 623028, "epoch": 7506} {"train_loss": -27.727619171142578, "global_step": 623029, "epoch": 7506} {"train_loss": -27.331939697265625, "global_step": 623030, "epoch": 7506} {"train_loss": -27.825565338134766, "global_step": 623031, "epoch": 7506} {"train_loss": -27.970966339111328, "global_step": 623032, "epoch": 7506} {"train_loss": -28.072614669799805, "global_step": 623033, "epoch": 7506} {"train_loss": -28.13226318359375, "global_step": 623034, "epoch": 7506} {"train_loss": -27.8900089263916, "global_step": 623035, "epoch": 7506} {"train_loss": -28.14920997619629, "global_step": 623036, "epoch": 7506} {"train_loss": -28.0615291595459, "global_step": 623037, "epoch": 7506} {"train_loss": -27.823287963867188, "global_step": 623038, "epoch": 7506} {"train_loss": -28.0739803314209, "global_step": 623039, "epoch": 7506} {"train_loss": -28.31989860534668, "global_step": 623040, "epoch": 7506} {"train_loss": -27.981281280517578, "global_step": 623041, "epoch": 7506} {"train_loss": -28.46114158630371, "global_step": 623042, "epoch": 7506} {"train_loss": -28.08475112915039, "global_step": 623043, "epoch": 7506} {"train_loss": -28.0958251953125, "global_step": 623044, "epoch": 7506} {"train_loss": -28.0451717376709, "global_step": 623045, "epoch": 7506} {"train_loss": -28.555200576782227, "global_step": 623046, "epoch": 7506} {"train_loss": -28.11793327331543, "global_step": 623047, "epoch": 7506} {"train_loss": -28.456409454345703, "global_step": 623048, "epoch": 7506} {"train_loss": -28.244665145874023, "global_step": 623049, "epoch": 7506} {"train_loss": -28.583410263061523, "global_step": 623050, "epoch": 7506} {"train_loss": -27.9280948638916, "global_step": 623051, "epoch": 7506} {"train_loss": -28.478687286376953, "global_step": 623052, "epoch": 7506} {"train_loss": -28.29303550720215, "global_step": 623053, "epoch": 7506} {"train_loss": -28.55278968811035, "global_step": 623054, "epoch": 7506} {"train_loss": -28.321805953979492, "global_step": 623055, "epoch": 7506} {"train_loss": -28.354450225830078, "global_step": 623056, "epoch": 7506} {"train_loss": -28.186481475830078, "global_step": 623057, "epoch": 7506} {"train_loss": -28.410476684570312, "global_step": 623058, "epoch": 7506} {"train_loss": -28.126516342163086, "global_step": 623059, "epoch": 7506} {"train_loss": -28.43118667602539, "global_step": 623060, "epoch": 7506} {"train_loss": -28.119049072265625, "global_step": 623061, "epoch": 7506} {"train_loss": -28.11809730529785, "global_step": 623062, "epoch": 7506} {"train_loss": -27.74519920349121, "global_step": 623063, "epoch": 7506} {"train_loss": -27.94122886657715, "global_step": 623064, "epoch": 7506} {"train_loss": -27.80158042907715, "global_step": 623065, "epoch": 7506} {"train_loss": -27.1563777923584, "global_step": 623066, "epoch": 7506} {"train_loss": -26.278350830078125, "global_step": 623067, "epoch": 7506} {"train_loss": -25.413022994995117, "global_step": 623068, "epoch": 7506} {"train_loss": -26.187732696533203, "global_step": 623069, "epoch": 7506} {"train_loss": -27.6820068359375, "global_step": 623070, "epoch": 7506} {"train_loss": -27.72027587890625, "global_step": 623071, "epoch": 7506} {"train_loss": -28.27703285217285, "global_step": 623072, "epoch": 7506} {"train_loss": -27.795368194580078, "global_step": 623073, "epoch": 7506} {"train_loss": -28.129581451416016, "global_step": 623074, "epoch": 7506} {"train_loss": -28.134302139282227, "global_step": 623075, "epoch": 7506} {"train_loss": -28.148029327392578, "global_step": 623076, "epoch": 7506} {"train_loss": -28.11484146118164, "global_step": 623077, "epoch": 7506} {"train_loss": -27.624425888061523, "global_step": 623078, "epoch": 7506} {"train_loss": -28.252283096313477, "global_step": 623079, "epoch": 7506} {"train_loss": -27.6722606980657, "global_step": 623080, "epoch": 7506, "val_loss": 6797108.5} {"train_loss": -26.955154418945312, "global_step": 623081, "epoch": 7507} {"train_loss": -27.052921295166016, "global_step": 623082, "epoch": 7507} {"train_loss": -27.035175323486328, "global_step": 623083, "epoch": 7507} {"train_loss": -26.100061416625977, "global_step": 623084, "epoch": 7507} {"train_loss": -27.34769630432129, "global_step": 623085, "epoch": 7507} {"train_loss": -27.110565185546875, "global_step": 623086, "epoch": 7507} {"train_loss": -27.47833824157715, "global_step": 623087, "epoch": 7507} {"train_loss": -26.684778213500977, "global_step": 623088, "epoch": 7507} {"train_loss": -27.466108322143555, "global_step": 623089, "epoch": 7507} {"train_loss": -27.225727081298828, "global_step": 623090, "epoch": 7507} {"train_loss": -27.3786563873291, "global_step": 623091, "epoch": 7507} {"train_loss": -27.374597549438477, "global_step": 623092, "epoch": 7507} {"train_loss": -27.107913970947266, "global_step": 623093, "epoch": 7507} {"train_loss": -27.43360710144043, "global_step": 623094, "epoch": 7507} {"train_loss": -27.40643310546875, "global_step": 623095, "epoch": 7507} {"train_loss": -27.66739845275879, "global_step": 623096, "epoch": 7507} {"train_loss": -27.572101593017578, "global_step": 623097, "epoch": 7507} {"train_loss": -27.30291748046875, "global_step": 623098, "epoch": 7507} {"train_loss": -27.644119262695312, "global_step": 623099, "epoch": 7507} {"train_loss": -27.272851943969727, "global_step": 623100, "epoch": 7507} {"train_loss": -26.575857162475586, "global_step": 623101, "epoch": 7507} {"train_loss": -27.744220733642578, "global_step": 623102, "epoch": 7507} {"train_loss": -27.862524032592773, "global_step": 623103, "epoch": 7507} {"train_loss": -27.816370010375977, "global_step": 623104, "epoch": 7507} {"train_loss": -27.937381744384766, "global_step": 623105, "epoch": 7507} {"train_loss": -27.877119064331055, "global_step": 623106, "epoch": 7507} {"train_loss": -27.740880966186523, "global_step": 623107, "epoch": 7507} {"train_loss": -27.94552993774414, "global_step": 623108, "epoch": 7507} {"train_loss": -27.827783584594727, "global_step": 623109, "epoch": 7507} {"train_loss": -28.000415802001953, "global_step": 623110, "epoch": 7507} {"train_loss": -27.63014030456543, "global_step": 623111, "epoch": 7507} {"train_loss": -28.013818740844727, "global_step": 623112, "epoch": 7507} {"train_loss": -28.402494430541992, "global_step": 623113, "epoch": 7507} {"train_loss": -27.897262573242188, "global_step": 623114, "epoch": 7507} {"train_loss": -28.1016902923584, "global_step": 623115, "epoch": 7507} {"train_loss": -28.685575485229492, "global_step": 623116, "epoch": 7507} {"train_loss": -28.06492042541504, "global_step": 623117, "epoch": 7507} {"train_loss": -28.47686195373535, "global_step": 623118, "epoch": 7507} {"train_loss": -27.996129989624023, "global_step": 623119, "epoch": 7507} {"train_loss": -27.824462890625, "global_step": 623120, "epoch": 7507} {"train_loss": -28.18830680847168, "global_step": 623121, "epoch": 7507} {"train_loss": -28.293914794921875, "global_step": 623122, "epoch": 7507} {"train_loss": -28.180700302124023, "global_step": 623123, "epoch": 7507} {"train_loss": -28.263334274291992, "global_step": 623124, "epoch": 7507} {"train_loss": -28.155786514282227, "global_step": 623125, "epoch": 7507} {"train_loss": -28.476404190063477, "global_step": 623126, "epoch": 7507} {"train_loss": -28.43433952331543, "global_step": 623127, "epoch": 7507} {"train_loss": -28.097671508789062, "global_step": 623128, "epoch": 7507} {"train_loss": -28.367401123046875, "global_step": 623129, "epoch": 7507} {"train_loss": -28.2337646484375, "global_step": 623130, "epoch": 7507} {"train_loss": -28.18290138244629, "global_step": 623131, "epoch": 7507} {"train_loss": -28.261831283569336, "global_step": 623132, "epoch": 7507} {"train_loss": -28.317398071289062, "global_step": 623133, "epoch": 7507} {"train_loss": -28.450183868408203, "global_step": 623134, "epoch": 7507} {"train_loss": -28.625171661376953, "global_step": 623135, "epoch": 7507} {"train_loss": -28.00202751159668, "global_step": 623136, "epoch": 7507} {"train_loss": -28.203893661499023, "global_step": 623137, "epoch": 7507} {"train_loss": -27.98183250427246, "global_step": 623138, "epoch": 7507} {"train_loss": -28.38758659362793, "global_step": 623139, "epoch": 7507} {"train_loss": -28.281957626342773, "global_step": 623140, "epoch": 7507} {"train_loss": -27.877716064453125, "global_step": 623141, "epoch": 7507} {"train_loss": -27.95624351501465, "global_step": 623142, "epoch": 7507} {"train_loss": -28.708906173706055, "global_step": 623143, "epoch": 7507} {"train_loss": -27.86111831665039, "global_step": 623144, "epoch": 7507} {"train_loss": -27.766666412353516, "global_step": 623145, "epoch": 7507} {"train_loss": -27.86760902404785, "global_step": 623146, "epoch": 7507} {"train_loss": -27.857709884643555, "global_step": 623147, "epoch": 7507} {"train_loss": -28.200830459594727, "global_step": 623148, "epoch": 7507} {"train_loss": -27.457395553588867, "global_step": 623149, "epoch": 7507} {"train_loss": -28.412073135375977, "global_step": 623150, "epoch": 7507} {"train_loss": -27.510696411132812, "global_step": 623151, "epoch": 7507} {"train_loss": -27.525226593017578, "global_step": 623152, "epoch": 7507} {"train_loss": -27.672210693359375, "global_step": 623153, "epoch": 7507} {"train_loss": -27.5819149017334, "global_step": 623154, "epoch": 7507} {"train_loss": -28.216100692749023, "global_step": 623155, "epoch": 7507} {"train_loss": -27.886188507080078, "global_step": 623156, "epoch": 7507} {"train_loss": -27.906667709350586, "global_step": 623157, "epoch": 7507} {"train_loss": -27.661243438720703, "global_step": 623158, "epoch": 7507} {"train_loss": -27.845417022705078, "global_step": 623159, "epoch": 7507} {"train_loss": -27.986425399780273, "global_step": 623160, "epoch": 7507} {"train_loss": -27.660144805908203, "global_step": 623161, "epoch": 7507} {"train_loss": -28.334857940673828, "global_step": 623162, "epoch": 7507} {"train_loss": -27.828223125044122, "global_step": 623163, "epoch": 7507, "val_loss": 6844155.0} {"train_loss": -27.568145751953125, "global_step": 623164, "epoch": 7508} {"train_loss": -27.946151733398438, "global_step": 623165, "epoch": 7508} {"train_loss": -27.80967140197754, "global_step": 623166, "epoch": 7508} {"train_loss": -27.794071197509766, "global_step": 623167, "epoch": 7508} {"train_loss": -27.57404899597168, "global_step": 623168, "epoch": 7508} {"train_loss": -27.947010040283203, "global_step": 623169, "epoch": 7508} {"train_loss": -27.58504295349121, "global_step": 623170, "epoch": 7508} {"train_loss": -27.554107666015625, "global_step": 623171, "epoch": 7508} {"train_loss": -27.557703018188477, "global_step": 623172, "epoch": 7508} {"train_loss": -27.779996871948242, "global_step": 623173, "epoch": 7508} {"train_loss": -27.955636978149414, "global_step": 623174, "epoch": 7508} {"train_loss": -27.83916664123535, "global_step": 623175, "epoch": 7508} {"train_loss": -27.736297607421875, "global_step": 623176, "epoch": 7508} {"train_loss": -27.98981285095215, "global_step": 623177, "epoch": 7508} {"train_loss": -27.6109676361084, "global_step": 623178, "epoch": 7508} {"train_loss": -27.76612663269043, "global_step": 623179, "epoch": 7508} {"train_loss": -27.799346923828125, "global_step": 623180, "epoch": 7508} {"train_loss": -27.858381271362305, "global_step": 623181, "epoch": 7508} {"train_loss": -28.17441177368164, "global_step": 623182, "epoch": 7508} {"train_loss": -28.28718376159668, "global_step": 623183, "epoch": 7508} {"train_loss": -28.03959083557129, "global_step": 623184, "epoch": 7508} {"train_loss": -27.90744400024414, "global_step": 623185, "epoch": 7508} {"train_loss": -28.458038330078125, "global_step": 623186, "epoch": 7508} {"train_loss": -28.203739166259766, "global_step": 623187, "epoch": 7508} {"train_loss": -28.20774269104004, "global_step": 623188, "epoch": 7508} {"train_loss": -28.1584415435791, "global_step": 623189, "epoch": 7508} {"train_loss": -28.194665908813477, "global_step": 623190, "epoch": 7508} {"train_loss": -27.965795516967773, "global_step": 623191, "epoch": 7508} {"train_loss": -27.6962833404541, "global_step": 623192, "epoch": 7508} {"train_loss": -28.13433265686035, "global_step": 623193, "epoch": 7508} {"train_loss": -28.22254753112793, "global_step": 623194, "epoch": 7508} {"train_loss": -27.881357192993164, "global_step": 623195, "epoch": 7508} {"train_loss": -28.09760093688965, "global_step": 623196, "epoch": 7508} {"train_loss": -28.189865112304688, "global_step": 623197, "epoch": 7508} {"train_loss": -27.862762451171875, "global_step": 623198, "epoch": 7508} {"train_loss": -28.217493057250977, "global_step": 623199, "epoch": 7508} {"train_loss": -28.373449325561523, "global_step": 623200, "epoch": 7508} {"train_loss": -28.13677406311035, "global_step": 623201, "epoch": 7508} {"train_loss": -28.154767990112305, "global_step": 623202, "epoch": 7508} {"train_loss": -27.99883460998535, "global_step": 623203, "epoch": 7508} {"train_loss": -28.44580078125, "global_step": 623204, "epoch": 7508} {"train_loss": -28.118305206298828, "global_step": 623205, "epoch": 7508} {"train_loss": -28.048070907592773, "global_step": 623206, "epoch": 7508} {"train_loss": -28.2037296295166, "global_step": 623207, "epoch": 7508} {"train_loss": -28.423995971679688, "global_step": 623208, "epoch": 7508} {"train_loss": -28.41301918029785, "global_step": 623209, "epoch": 7508} {"train_loss": -28.177764892578125, "global_step": 623210, "epoch": 7508} {"train_loss": -28.317890167236328, "global_step": 623211, "epoch": 7508} {"train_loss": -28.357410430908203, "global_step": 623212, "epoch": 7508} {"train_loss": -28.345874786376953, "global_step": 623213, "epoch": 7508} {"train_loss": -28.190587997436523, "global_step": 623214, "epoch": 7508} {"train_loss": -28.287708282470703, "global_step": 623215, "epoch": 7508} {"train_loss": -27.919782638549805, "global_step": 623216, "epoch": 7508} {"train_loss": -27.991003036499023, "global_step": 623217, "epoch": 7508} {"train_loss": -28.62952995300293, "global_step": 623218, "epoch": 7508} {"train_loss": -28.197193145751953, "global_step": 623219, "epoch": 7508} {"train_loss": -28.127531051635742, "global_step": 623220, "epoch": 7508} {"train_loss": -28.628286361694336, "global_step": 623221, "epoch": 7508} {"train_loss": -28.04999351501465, "global_step": 623222, "epoch": 7508} {"train_loss": -27.97515296936035, "global_step": 623223, "epoch": 7508} {"train_loss": -28.342334747314453, "global_step": 623224, "epoch": 7508} {"train_loss": -27.906341552734375, "global_step": 623225, "epoch": 7508} {"train_loss": -28.097305297851562, "global_step": 623226, "epoch": 7508} {"train_loss": -28.212482452392578, "global_step": 623227, "epoch": 7508} {"train_loss": -28.315921783447266, "global_step": 623228, "epoch": 7508} {"train_loss": -28.02479362487793, "global_step": 623229, "epoch": 7508} {"train_loss": -28.445362091064453, "global_step": 623230, "epoch": 7508} {"train_loss": -28.045774459838867, "global_step": 623231, "epoch": 7508} {"train_loss": -28.297590255737305, "global_step": 623232, "epoch": 7508} {"train_loss": -28.17706298828125, "global_step": 623233, "epoch": 7508} {"train_loss": -27.902307510375977, "global_step": 623234, "epoch": 7508} {"train_loss": -28.163339614868164, "global_step": 623235, "epoch": 7508} {"train_loss": -28.262054443359375, "global_step": 623236, "epoch": 7508} {"train_loss": -27.966083526611328, "global_step": 623237, "epoch": 7508} {"train_loss": -28.080907821655273, "global_step": 623238, "epoch": 7508} {"train_loss": -28.07204246520996, "global_step": 623239, "epoch": 7508} {"train_loss": -28.312824249267578, "global_step": 623240, "epoch": 7508} {"train_loss": -28.251211166381836, "global_step": 623241, "epoch": 7508} {"train_loss": -28.294763565063477, "global_step": 623242, "epoch": 7508} {"train_loss": -27.774572372436523, "global_step": 623243, "epoch": 7508} {"train_loss": -27.99311637878418, "global_step": 623244, "epoch": 7508} {"train_loss": -27.977203369140625, "global_step": 623245, "epoch": 7508} {"train_loss": -28.071062777415815, "global_step": 623246, "epoch": 7508, "val_loss": 6800318.0} {"train_loss": -27.572418212890625, "global_step": 623247, "epoch": 7509} {"train_loss": -27.644611358642578, "global_step": 623248, "epoch": 7509} {"train_loss": -27.753101348876953, "global_step": 623249, "epoch": 7509} {"train_loss": -27.435321807861328, "global_step": 623250, "epoch": 7509} {"train_loss": -27.5770263671875, "global_step": 623251, "epoch": 7509} {"train_loss": -27.5006160736084, "global_step": 623252, "epoch": 7509} {"train_loss": -27.121809005737305, "global_step": 623253, "epoch": 7509} {"train_loss": -27.599882125854492, "global_step": 623254, "epoch": 7509} {"train_loss": -27.411962509155273, "global_step": 623255, "epoch": 7509} {"train_loss": -27.358579635620117, "global_step": 623256, "epoch": 7509} {"train_loss": -26.95654296875, "global_step": 623257, "epoch": 7509} {"train_loss": -27.369831085205078, "global_step": 623258, "epoch": 7509} {"train_loss": -27.780187606811523, "global_step": 623259, "epoch": 7509} {"train_loss": -27.496694564819336, "global_step": 623260, "epoch": 7509} {"train_loss": -27.64910316467285, "global_step": 623261, "epoch": 7509} {"train_loss": -28.056976318359375, "global_step": 623262, "epoch": 7509} {"train_loss": -27.643192291259766, "global_step": 623263, "epoch": 7509} {"train_loss": -27.897571563720703, "global_step": 623264, "epoch": 7509} {"train_loss": -27.9442081451416, "global_step": 623265, "epoch": 7509} {"train_loss": -28.17889404296875, "global_step": 623266, "epoch": 7509} {"train_loss": -27.765161514282227, "global_step": 623267, "epoch": 7509} {"train_loss": -28.07549476623535, "global_step": 623268, "epoch": 7509} {"train_loss": -28.141244888305664, "global_step": 623269, "epoch": 7509} {"train_loss": -28.21603775024414, "global_step": 623270, "epoch": 7509} {"train_loss": -27.429059982299805, "global_step": 623271, "epoch": 7509} {"train_loss": -28.2531681060791, "global_step": 623272, "epoch": 7509} {"train_loss": -27.838977813720703, "global_step": 623273, "epoch": 7509} {"train_loss": -28.140899658203125, "global_step": 623274, "epoch": 7509} {"train_loss": -27.986724853515625, "global_step": 623275, "epoch": 7509} {"train_loss": -27.983243942260742, "global_step": 623276, "epoch": 7509} {"train_loss": -27.942350387573242, "global_step": 623277, "epoch": 7509} {"train_loss": -28.099782943725586, "global_step": 623278, "epoch": 7509} {"train_loss": -27.80499839782715, "global_step": 623279, "epoch": 7509} {"train_loss": -28.047637939453125, "global_step": 623280, "epoch": 7509} {"train_loss": -27.94169044494629, "global_step": 623281, "epoch": 7509} {"train_loss": -27.94379234313965, "global_step": 623282, "epoch": 7509} {"train_loss": -28.425260543823242, "global_step": 623283, "epoch": 7509} {"train_loss": -28.160125732421875, "global_step": 623284, "epoch": 7509} {"train_loss": -28.27627944946289, "global_step": 623285, "epoch": 7509} {"train_loss": -28.04999351501465, "global_step": 623286, "epoch": 7509} {"train_loss": -28.4390926361084, "global_step": 623287, "epoch": 7509} {"train_loss": -28.1737060546875, "global_step": 623288, "epoch": 7509} {"train_loss": -28.03822135925293, "global_step": 623289, "epoch": 7509} {"train_loss": -28.17534828186035, "global_step": 623290, "epoch": 7509} {"train_loss": -28.653945922851562, "global_step": 623291, "epoch": 7509} {"train_loss": -28.405445098876953, "global_step": 623292, "epoch": 7509} {"train_loss": -28.610559463500977, "global_step": 623293, "epoch": 7509} {"train_loss": -28.235326766967773, "global_step": 623294, "epoch": 7509} {"train_loss": -28.63675880432129, "global_step": 623295, "epoch": 7509} {"train_loss": -28.34464454650879, "global_step": 623296, "epoch": 7509} {"train_loss": -28.356155395507812, "global_step": 623297, "epoch": 7509} {"train_loss": -28.626928329467773, "global_step": 623298, "epoch": 7509} {"train_loss": -28.458410263061523, "global_step": 623299, "epoch": 7509} {"train_loss": -28.422815322875977, "global_step": 623300, "epoch": 7509} {"train_loss": -28.217193603515625, "global_step": 623301, "epoch": 7509} {"train_loss": -28.50909996032715, "global_step": 623302, "epoch": 7509} {"train_loss": -28.515119552612305, "global_step": 623303, "epoch": 7509} {"train_loss": -28.288434982299805, "global_step": 623304, "epoch": 7509} {"train_loss": -28.5614070892334, "global_step": 623305, "epoch": 7509} {"train_loss": -28.143095016479492, "global_step": 623306, "epoch": 7509} {"train_loss": -28.17401695251465, "global_step": 623307, "epoch": 7509} {"train_loss": -28.21909523010254, "global_step": 623308, "epoch": 7509} {"train_loss": -28.480093002319336, "global_step": 623309, "epoch": 7509} {"train_loss": -28.51148796081543, "global_step": 623310, "epoch": 7509} {"train_loss": -28.162336349487305, "global_step": 623311, "epoch": 7509} {"train_loss": -28.04488182067871, "global_step": 623312, "epoch": 7509} {"train_loss": -28.07978630065918, "global_step": 623313, "epoch": 7509} {"train_loss": -27.904932022094727, "global_step": 623314, "epoch": 7509} {"train_loss": -27.68829345703125, "global_step": 623315, "epoch": 7509} {"train_loss": -27.293371200561523, "global_step": 623316, "epoch": 7509} {"train_loss": -26.809125900268555, "global_step": 623317, "epoch": 7509} {"train_loss": -27.34734535217285, "global_step": 623318, "epoch": 7509} {"train_loss": -27.892852783203125, "global_step": 623319, "epoch": 7509} {"train_loss": -27.837636947631836, "global_step": 623320, "epoch": 7509} {"train_loss": -27.7022647857666, "global_step": 623321, "epoch": 7509} {"train_loss": -28.028234481811523, "global_step": 623322, "epoch": 7509} {"train_loss": -27.632261276245117, "global_step": 623323, "epoch": 7509} {"train_loss": -28.150348663330078, "global_step": 623324, "epoch": 7509} {"train_loss": -27.427915573120117, "global_step": 623325, "epoch": 7509} {"train_loss": -28.055622100830078, "global_step": 623326, "epoch": 7509} {"train_loss": -27.598602294921875, "global_step": 623327, "epoch": 7509} {"train_loss": -27.788000106811523, "global_step": 623328, "epoch": 7509} {"train_loss": -27.95771088657609, "global_step": 623329, "epoch": 7509, "val_loss": 6772959.5} {"train_loss": -27.123733520507812, "global_step": 623330, "epoch": 7510} {"train_loss": -26.871307373046875, "global_step": 623331, "epoch": 7510} {"train_loss": -27.176610946655273, "global_step": 623332, "epoch": 7510} {"train_loss": -27.29474449157715, "global_step": 623333, "epoch": 7510} {"train_loss": -26.77313232421875, "global_step": 623334, "epoch": 7510} {"train_loss": -26.8216609954834, "global_step": 623335, "epoch": 7510} {"train_loss": -27.46491050720215, "global_step": 623336, "epoch": 7510} {"train_loss": -27.07402992248535, "global_step": 623337, "epoch": 7510} {"train_loss": -27.494131088256836, "global_step": 623338, "epoch": 7510} {"train_loss": -27.65528678894043, "global_step": 623339, "epoch": 7510} {"train_loss": -27.495285034179688, "global_step": 623340, "epoch": 7510} {"train_loss": -27.239953994750977, "global_step": 623341, "epoch": 7510} {"train_loss": -27.658056259155273, "global_step": 623342, "epoch": 7510} {"train_loss": -27.399555206298828, "global_step": 623343, "epoch": 7510} {"train_loss": -27.298831939697266, "global_step": 623344, "epoch": 7510} {"train_loss": -27.524890899658203, "global_step": 623345, "epoch": 7510} {"train_loss": -27.385303497314453, "global_step": 623346, "epoch": 7510} {"train_loss": -27.257482528686523, "global_step": 623347, "epoch": 7510} {"train_loss": -27.494186401367188, "global_step": 623348, "epoch": 7510} {"train_loss": -27.537887573242188, "global_step": 623349, "epoch": 7510} {"train_loss": -27.678619384765625, "global_step": 623350, "epoch": 7510} {"train_loss": -27.038908004760742, "global_step": 623351, "epoch": 7510} {"train_loss": -27.49212074279785, "global_step": 623352, "epoch": 7510} {"train_loss": -27.811630249023438, "global_step": 623353, "epoch": 7510} {"train_loss": -27.784719467163086, "global_step": 623354, "epoch": 7510} {"train_loss": -28.00457763671875, "global_step": 623355, "epoch": 7510} {"train_loss": -27.7372989654541, "global_step": 623356, "epoch": 7510} {"train_loss": -27.799463272094727, "global_step": 623357, "epoch": 7510} {"train_loss": -28.083316802978516, "global_step": 623358, "epoch": 7510} {"train_loss": -27.727197647094727, "global_step": 623359, "epoch": 7510} {"train_loss": -28.05707359313965, "global_step": 623360, "epoch": 7510} {"train_loss": -27.800329208374023, "global_step": 623361, "epoch": 7510} {"train_loss": -27.93878173828125, "global_step": 623362, "epoch": 7510} {"train_loss": -28.170881271362305, "global_step": 623363, "epoch": 7510} {"train_loss": -27.826770782470703, "global_step": 623364, "epoch": 7510} {"train_loss": -27.845056533813477, "global_step": 623365, "epoch": 7510} {"train_loss": -28.22357177734375, "global_step": 623366, "epoch": 7510} {"train_loss": -27.85957145690918, "global_step": 623367, "epoch": 7510} {"train_loss": -28.09954833984375, "global_step": 623368, "epoch": 7510} {"train_loss": -28.1822509765625, "global_step": 623369, "epoch": 7510} {"train_loss": -28.098026275634766, "global_step": 623370, "epoch": 7510} {"train_loss": -27.956684112548828, "global_step": 623371, "epoch": 7510} {"train_loss": -28.053491592407227, "global_step": 623372, "epoch": 7510} {"train_loss": -28.356786727905273, "global_step": 623373, "epoch": 7510} {"train_loss": -28.509998321533203, "global_step": 623374, "epoch": 7510} {"train_loss": -27.90064811706543, "global_step": 623375, "epoch": 7510} {"train_loss": -28.425872802734375, "global_step": 623376, "epoch": 7510} {"train_loss": -28.2784366607666, "global_step": 623377, "epoch": 7510} {"train_loss": -28.413787841796875, "global_step": 623378, "epoch": 7510} {"train_loss": -28.2872257232666, "global_step": 623379, "epoch": 7510} {"train_loss": -28.064062118530273, "global_step": 623380, "epoch": 7510} {"train_loss": -28.289966583251953, "global_step": 623381, "epoch": 7510} {"train_loss": -28.40277099609375, "global_step": 623382, "epoch": 7510} {"train_loss": -28.484649658203125, "global_step": 623383, "epoch": 7510} {"train_loss": -28.155517578125, "global_step": 623384, "epoch": 7510} {"train_loss": -28.330322265625, "global_step": 623385, "epoch": 7510} {"train_loss": -28.491958618164062, "global_step": 623386, "epoch": 7510} {"train_loss": -28.551624298095703, "global_step": 623387, "epoch": 7510} {"train_loss": -27.95050048828125, "global_step": 623388, "epoch": 7510} {"train_loss": -28.565570831298828, "global_step": 623389, "epoch": 7510} {"train_loss": -28.299341201782227, "global_step": 623390, "epoch": 7510} {"train_loss": -28.593585968017578, "global_step": 623391, "epoch": 7510} {"train_loss": -28.414752960205078, "global_step": 623392, "epoch": 7510} {"train_loss": -28.710073471069336, "global_step": 623393, "epoch": 7510} {"train_loss": -28.45306396484375, "global_step": 623394, "epoch": 7510} {"train_loss": -28.09669303894043, "global_step": 623395, "epoch": 7510} {"train_loss": -28.232837677001953, "global_step": 623396, "epoch": 7510} {"train_loss": -28.56119155883789, "global_step": 623397, "epoch": 7510} {"train_loss": -28.369718551635742, "global_step": 623398, "epoch": 7510} {"train_loss": -28.229705810546875, "global_step": 623399, "epoch": 7510} {"train_loss": -28.507001876831055, "global_step": 623400, "epoch": 7510} {"train_loss": -28.62216567993164, "global_step": 623401, "epoch": 7510} {"train_loss": -28.483190536499023, "global_step": 623402, "epoch": 7510} {"train_loss": -28.423511505126953, "global_step": 623403, "epoch": 7510} {"train_loss": -27.9164981842041, "global_step": 623404, "epoch": 7510} {"train_loss": -25.93121337890625, "global_step": 623405, "epoch": 7510} {"train_loss": -21.47995376586914, "global_step": 623406, "epoch": 7510} {"train_loss": -18.750518798828125, "global_step": 623407, "epoch": 7510} {"train_loss": -24.909286499023438, "global_step": 623408, "epoch": 7510} {"train_loss": -25.805683135986328, "global_step": 623409, "epoch": 7510} {"train_loss": -26.75003433227539, "global_step": 623410, "epoch": 7510} {"train_loss": -25.69563865661621, "global_step": 623411, "epoch": 7510} {"train_loss": -27.607750122805676, "global_step": 623412, "epoch": 7510, "val_loss": 6828129.0} {"train_loss": -26.63214111328125, "global_step": 623413, "epoch": 7511} {"train_loss": -25.726720809936523, "global_step": 623414, "epoch": 7511} {"train_loss": -26.5881404876709, "global_step": 623415, "epoch": 7511} {"train_loss": -26.523160934448242, "global_step": 623416, "epoch": 7511} {"train_loss": -25.8399715423584, "global_step": 623417, "epoch": 7511} {"train_loss": -26.427356719970703, "global_step": 623418, "epoch": 7511} {"train_loss": -26.534942626953125, "global_step": 623419, "epoch": 7511} {"train_loss": -26.31519889831543, "global_step": 623420, "epoch": 7511} {"train_loss": -26.891809463500977, "global_step": 623421, "epoch": 7511} {"train_loss": -26.8559513092041, "global_step": 623422, "epoch": 7511} {"train_loss": -26.977218627929688, "global_step": 623423, "epoch": 7511} {"train_loss": -26.907941818237305, "global_step": 623424, "epoch": 7511} {"train_loss": -26.991275787353516, "global_step": 623425, "epoch": 7511} {"train_loss": -27.023157119750977, "global_step": 623426, "epoch": 7511} {"train_loss": -26.7246150970459, "global_step": 623427, "epoch": 7511} {"train_loss": -27.169042587280273, "global_step": 623428, "epoch": 7511} {"train_loss": -26.596206665039062, "global_step": 623429, "epoch": 7511} {"train_loss": -26.965158462524414, "global_step": 623430, "epoch": 7511} {"train_loss": -27.093488693237305, "global_step": 623431, "epoch": 7511} {"train_loss": -27.090097427368164, "global_step": 623432, "epoch": 7511} {"train_loss": -27.53130531311035, "global_step": 623433, "epoch": 7511} {"train_loss": -27.014301300048828, "global_step": 623434, "epoch": 7511} {"train_loss": -27.055408477783203, "global_step": 623435, "epoch": 7511} {"train_loss": -27.32240104675293, "global_step": 623436, "epoch": 7511} {"train_loss": -27.08599853515625, "global_step": 623437, "epoch": 7511} {"train_loss": -27.3128719329834, "global_step": 623438, "epoch": 7511} {"train_loss": -27.50575065612793, "global_step": 623439, "epoch": 7511} {"train_loss": -27.432432174682617, "global_step": 623440, "epoch": 7511} {"train_loss": -27.554080963134766, "global_step": 623441, "epoch": 7511} {"train_loss": -27.405567169189453, "global_step": 623442, "epoch": 7511} {"train_loss": -27.720327377319336, "global_step": 623443, "epoch": 7511} {"train_loss": -27.676069259643555, "global_step": 623444, "epoch": 7511} {"train_loss": -27.566564559936523, "global_step": 623445, "epoch": 7511} {"train_loss": -27.910070419311523, "global_step": 623446, "epoch": 7511} {"train_loss": -27.2895565032959, "global_step": 623447, "epoch": 7511} {"train_loss": -27.803693771362305, "global_step": 623448, "epoch": 7511} {"train_loss": -27.815753936767578, "global_step": 623449, "epoch": 7511} {"train_loss": -27.969945907592773, "global_step": 623450, "epoch": 7511} {"train_loss": -27.8655948638916, "global_step": 623451, "epoch": 7511} {"train_loss": -27.57325553894043, "global_step": 623452, "epoch": 7511} {"train_loss": -27.86759376525879, "global_step": 623453, "epoch": 7511} {"train_loss": -27.646848678588867, "global_step": 623454, "epoch": 7511} {"train_loss": -27.83344841003418, "global_step": 623455, "epoch": 7511} {"train_loss": -27.843769073486328, "global_step": 623456, "epoch": 7511} {"train_loss": -27.767560958862305, "global_step": 623457, "epoch": 7511} {"train_loss": -27.937681198120117, "global_step": 623458, "epoch": 7511} {"train_loss": -28.104711532592773, "global_step": 623459, "epoch": 7511} {"train_loss": -27.973388671875, "global_step": 623460, "epoch": 7511} {"train_loss": -27.827402114868164, "global_step": 623461, "epoch": 7511} {"train_loss": -28.09113883972168, "global_step": 623462, "epoch": 7511} {"train_loss": -27.951190948486328, "global_step": 623463, "epoch": 7511} {"train_loss": -28.267606735229492, "global_step": 623464, "epoch": 7511} {"train_loss": -28.0460262298584, "global_step": 623465, "epoch": 7511} {"train_loss": -28.1856632232666, "global_step": 623466, "epoch": 7511} {"train_loss": -28.3233642578125, "global_step": 623467, "epoch": 7511} {"train_loss": -28.05653190612793, "global_step": 623468, "epoch": 7511} {"train_loss": -27.937976837158203, "global_step": 623469, "epoch": 7511} {"train_loss": -28.197162628173828, "global_step": 623470, "epoch": 7511} {"train_loss": -28.01025390625, "global_step": 623471, "epoch": 7511} {"train_loss": -28.15203857421875, "global_step": 623472, "epoch": 7511} {"train_loss": -27.970102310180664, "global_step": 623473, "epoch": 7511} {"train_loss": -27.8966007232666, "global_step": 623474, "epoch": 7511} {"train_loss": -27.7726993560791, "global_step": 623475, "epoch": 7511} {"train_loss": -28.15736198425293, "global_step": 623476, "epoch": 7511} {"train_loss": -28.39151954650879, "global_step": 623477, "epoch": 7511} {"train_loss": -28.07076072692871, "global_step": 623478, "epoch": 7511} {"train_loss": -28.194263458251953, "global_step": 623479, "epoch": 7511} {"train_loss": -28.35986328125, "global_step": 623480, "epoch": 7511} {"train_loss": -28.160511016845703, "global_step": 623481, "epoch": 7511} {"train_loss": -28.313156127929688, "global_step": 623482, "epoch": 7511} {"train_loss": -27.901472091674805, "global_step": 623483, "epoch": 7511} {"train_loss": -28.47733497619629, "global_step": 623484, "epoch": 7511} {"train_loss": -28.20534324645996, "global_step": 623485, "epoch": 7511} {"train_loss": -27.7772216796875, "global_step": 623486, "epoch": 7511} {"train_loss": -28.27715492248535, "global_step": 623487, "epoch": 7511} {"train_loss": -28.260303497314453, "global_step": 623488, "epoch": 7511} {"train_loss": -28.062780380249023, "global_step": 623489, "epoch": 7511} {"train_loss": -28.245813369750977, "global_step": 623490, "epoch": 7511} {"train_loss": -28.371891021728516, "global_step": 623491, "epoch": 7511} {"train_loss": -28.42108154296875, "global_step": 623492, "epoch": 7511} {"train_loss": -28.036169052124023, "global_step": 623493, "epoch": 7511} {"train_loss": -28.265125274658203, "global_step": 623494, "epoch": 7511} {"train_loss": -27.597836138254188, "global_step": 623495, "epoch": 7511, "val_loss": 6783725.0} {"train_loss": -28.351062774658203, "global_step": 623496, "epoch": 7512} {"train_loss": -27.811450958251953, "global_step": 623497, "epoch": 7512} {"train_loss": -27.61231803894043, "global_step": 623498, "epoch": 7512} {"train_loss": -28.056432723999023, "global_step": 623499, "epoch": 7512} {"train_loss": -27.671361923217773, "global_step": 623500, "epoch": 7512} {"train_loss": -28.087875366210938, "global_step": 623501, "epoch": 7512} {"train_loss": -27.84039306640625, "global_step": 623502, "epoch": 7512} {"train_loss": -27.03128433227539, "global_step": 623503, "epoch": 7512} {"train_loss": -27.990201950073242, "global_step": 623504, "epoch": 7512} {"train_loss": -27.88934898376465, "global_step": 623505, "epoch": 7512} {"train_loss": -27.50473403930664, "global_step": 623506, "epoch": 7512} {"train_loss": -27.790273666381836, "global_step": 623507, "epoch": 7512} {"train_loss": -27.716215133666992, "global_step": 623508, "epoch": 7512} {"train_loss": -27.6724910736084, "global_step": 623509, "epoch": 7512} {"train_loss": -27.809528350830078, "global_step": 623510, "epoch": 7512} {"train_loss": -27.300739288330078, "global_step": 623511, "epoch": 7512} {"train_loss": -27.958515167236328, "global_step": 623512, "epoch": 7512} {"train_loss": -27.796377182006836, "global_step": 623513, "epoch": 7512} {"train_loss": -27.949420928955078, "global_step": 623514, "epoch": 7512} {"train_loss": -27.8843936920166, "global_step": 623515, "epoch": 7512} {"train_loss": -27.968168258666992, "global_step": 623516, "epoch": 7512} {"train_loss": -27.799169540405273, "global_step": 623517, "epoch": 7512} {"train_loss": -28.19728660583496, "global_step": 623518, "epoch": 7512} {"train_loss": -27.182483673095703, "global_step": 623519, "epoch": 7512} {"train_loss": -27.965972900390625, "global_step": 623520, "epoch": 7512} {"train_loss": -28.085195541381836, "global_step": 623521, "epoch": 7512} {"train_loss": -28.323486328125, "global_step": 623522, "epoch": 7512} {"train_loss": -28.147119522094727, "global_step": 623523, "epoch": 7512} {"train_loss": -28.02676773071289, "global_step": 623524, "epoch": 7512} {"train_loss": -27.88811683654785, "global_step": 623525, "epoch": 7512} {"train_loss": -28.417272567749023, "global_step": 623526, "epoch": 7512} {"train_loss": -28.300949096679688, "global_step": 623527, "epoch": 7512} {"train_loss": -28.219192504882812, "global_step": 623528, "epoch": 7512} {"train_loss": -28.681079864501953, "global_step": 623529, "epoch": 7512} {"train_loss": -28.306787490844727, "global_step": 623530, "epoch": 7512} {"train_loss": -28.252643585205078, "global_step": 623531, "epoch": 7512} {"train_loss": -28.27735710144043, "global_step": 623532, "epoch": 7512} {"train_loss": -28.299102783203125, "global_step": 623533, "epoch": 7512} {"train_loss": -28.163909912109375, "global_step": 623534, "epoch": 7512} {"train_loss": -28.246267318725586, "global_step": 623535, "epoch": 7512} {"train_loss": -28.661264419555664, "global_step": 623536, "epoch": 7512} {"train_loss": -28.501394271850586, "global_step": 623537, "epoch": 7512} {"train_loss": -28.421375274658203, "global_step": 623538, "epoch": 7512} {"train_loss": -28.23587417602539, "global_step": 623539, "epoch": 7512} {"train_loss": -28.523176193237305, "global_step": 623540, "epoch": 7512} {"train_loss": -28.173261642456055, "global_step": 623541, "epoch": 7512} {"train_loss": -28.39577293395996, "global_step": 623542, "epoch": 7512} {"train_loss": -28.332672119140625, "global_step": 623543, "epoch": 7512} {"train_loss": -28.10190200805664, "global_step": 623544, "epoch": 7512} {"train_loss": -28.33597755432129, "global_step": 623545, "epoch": 7512} {"train_loss": -28.467697143554688, "global_step": 623546, "epoch": 7512} {"train_loss": -28.43726921081543, "global_step": 623547, "epoch": 7512} {"train_loss": -28.140838623046875, "global_step": 623548, "epoch": 7512} {"train_loss": -28.587127685546875, "global_step": 623549, "epoch": 7512} {"train_loss": -28.4419002532959, "global_step": 623550, "epoch": 7512} {"train_loss": -28.38081169128418, "global_step": 623551, "epoch": 7512} {"train_loss": -28.456754684448242, "global_step": 623552, "epoch": 7512} {"train_loss": -28.51239013671875, "global_step": 623553, "epoch": 7512} {"train_loss": -28.179737091064453, "global_step": 623554, "epoch": 7512} {"train_loss": -28.564090728759766, "global_step": 623555, "epoch": 7512} {"train_loss": -28.360910415649414, "global_step": 623556, "epoch": 7512} {"train_loss": -28.42340087890625, "global_step": 623557, "epoch": 7512} {"train_loss": -28.604169845581055, "global_step": 623558, "epoch": 7512} {"train_loss": -28.536474227905273, "global_step": 623559, "epoch": 7512} {"train_loss": -28.226362228393555, "global_step": 623560, "epoch": 7512} {"train_loss": -27.986892700195312, "global_step": 623561, "epoch": 7512} {"train_loss": -27.746627807617188, "global_step": 623562, "epoch": 7512} {"train_loss": -28.105377197265625, "global_step": 623563, "epoch": 7512} {"train_loss": -28.432025909423828, "global_step": 623564, "epoch": 7512} {"train_loss": -27.86104393005371, "global_step": 623565, "epoch": 7512} {"train_loss": -28.242034912109375, "global_step": 623566, "epoch": 7512} {"train_loss": -27.931304931640625, "global_step": 623567, "epoch": 7512} {"train_loss": -28.007129669189453, "global_step": 623568, "epoch": 7512} {"train_loss": -27.979459762573242, "global_step": 623569, "epoch": 7512} {"train_loss": -28.168720245361328, "global_step": 623570, "epoch": 7512} {"train_loss": -27.59295654296875, "global_step": 623571, "epoch": 7512} {"train_loss": -27.89448356628418, "global_step": 623572, "epoch": 7512} {"train_loss": -27.21309471130371, "global_step": 623573, "epoch": 7512} {"train_loss": -27.21174430847168, "global_step": 623574, "epoch": 7512} {"train_loss": -27.175094604492188, "global_step": 623575, "epoch": 7512} {"train_loss": -27.745838165283203, "global_step": 623576, "epoch": 7512} {"train_loss": -28.214221954345703, "global_step": 623577, "epoch": 7512} {"train_loss": -28.063031851527203, "global_step": 623578, "epoch": 7512, "val_loss": 6738722.0} {"train_loss": -28.08279800415039, "global_step": 623579, "epoch": 7513} {"train_loss": -27.540302276611328, "global_step": 623580, "epoch": 7513} {"train_loss": -28.193403244018555, "global_step": 623581, "epoch": 7513} {"train_loss": -27.51276969909668, "global_step": 623582, "epoch": 7513} {"train_loss": -27.598615646362305, "global_step": 623583, "epoch": 7513} {"train_loss": -27.40895652770996, "global_step": 623584, "epoch": 7513} {"train_loss": -27.9085750579834, "global_step": 623585, "epoch": 7513} {"train_loss": -27.779020309448242, "global_step": 623586, "epoch": 7513} {"train_loss": -27.920154571533203, "global_step": 623587, "epoch": 7513} {"train_loss": -27.77015495300293, "global_step": 623588, "epoch": 7513} {"train_loss": -27.756336212158203, "global_step": 623589, "epoch": 7513} {"train_loss": -27.911035537719727, "global_step": 623590, "epoch": 7513} {"train_loss": -27.800439834594727, "global_step": 623591, "epoch": 7513} {"train_loss": -28.01515769958496, "global_step": 623592, "epoch": 7513} {"train_loss": -27.572126388549805, "global_step": 623593, "epoch": 7513} {"train_loss": -27.94288444519043, "global_step": 623594, "epoch": 7513} {"train_loss": -27.84242057800293, "global_step": 623595, "epoch": 7513} {"train_loss": -27.84540367126465, "global_step": 623596, "epoch": 7513} {"train_loss": -27.872333526611328, "global_step": 623597, "epoch": 7513} {"train_loss": -28.205615997314453, "global_step": 623598, "epoch": 7513} {"train_loss": -27.874460220336914, "global_step": 623599, "epoch": 7513} {"train_loss": -27.7491455078125, "global_step": 623600, "epoch": 7513} {"train_loss": -28.037519454956055, "global_step": 623601, "epoch": 7513} {"train_loss": -27.833948135375977, "global_step": 623602, "epoch": 7513} {"train_loss": -27.98402214050293, "global_step": 623603, "epoch": 7513} {"train_loss": -28.103300094604492, "global_step": 623604, "epoch": 7513} {"train_loss": -28.18413734436035, "global_step": 623605, "epoch": 7513} {"train_loss": -28.330198287963867, "global_step": 623606, "epoch": 7513} {"train_loss": -28.139997482299805, "global_step": 623607, "epoch": 7513} {"train_loss": -28.315153121948242, "global_step": 623608, "epoch": 7513} {"train_loss": -28.21693229675293, "global_step": 623609, "epoch": 7513} {"train_loss": -28.630680084228516, "global_step": 623610, "epoch": 7513} {"train_loss": -28.29115104675293, "global_step": 623611, "epoch": 7513} {"train_loss": -28.140573501586914, "global_step": 623612, "epoch": 7513} {"train_loss": -28.187213897705078, "global_step": 623613, "epoch": 7513} {"train_loss": -28.40824317932129, "global_step": 623614, "epoch": 7513} {"train_loss": -27.96038246154785, "global_step": 623615, "epoch": 7513} {"train_loss": -28.555952072143555, "global_step": 623616, "epoch": 7513} {"train_loss": -28.40571403503418, "global_step": 623617, "epoch": 7513} {"train_loss": -28.189878463745117, "global_step": 623618, "epoch": 7513} {"train_loss": -28.38970947265625, "global_step": 623619, "epoch": 7513} {"train_loss": -28.126169204711914, "global_step": 623620, "epoch": 7513} {"train_loss": -28.196552276611328, "global_step": 623621, "epoch": 7513} {"train_loss": -28.114974975585938, "global_step": 623622, "epoch": 7513} {"train_loss": -28.203418731689453, "global_step": 623623, "epoch": 7513} {"train_loss": -28.128814697265625, "global_step": 623624, "epoch": 7513} {"train_loss": -28.425800323486328, "global_step": 623625, "epoch": 7513} {"train_loss": -28.22263526916504, "global_step": 623626, "epoch": 7513} {"train_loss": -28.183866500854492, "global_step": 623627, "epoch": 7513} {"train_loss": -27.965621948242188, "global_step": 623628, "epoch": 7513} {"train_loss": -28.03632926940918, "global_step": 623629, "epoch": 7513} {"train_loss": -27.837268829345703, "global_step": 623630, "epoch": 7513} {"train_loss": -27.41749382019043, "global_step": 623631, "epoch": 7513} {"train_loss": -28.241077423095703, "global_step": 623632, "epoch": 7513} {"train_loss": -28.199254989624023, "global_step": 623633, "epoch": 7513} {"train_loss": -28.220691680908203, "global_step": 623634, "epoch": 7513} {"train_loss": -27.84224510192871, "global_step": 623635, "epoch": 7513} {"train_loss": -28.352563858032227, "global_step": 623636, "epoch": 7513} {"train_loss": -28.2255859375, "global_step": 623637, "epoch": 7513} {"train_loss": -28.281330108642578, "global_step": 623638, "epoch": 7513} {"train_loss": -28.14371109008789, "global_step": 623639, "epoch": 7513} {"train_loss": -28.441436767578125, "global_step": 623640, "epoch": 7513} {"train_loss": -28.241498947143555, "global_step": 623641, "epoch": 7513} {"train_loss": -28.437971115112305, "global_step": 623642, "epoch": 7513} {"train_loss": -28.242055892944336, "global_step": 623643, "epoch": 7513} {"train_loss": -28.34087562561035, "global_step": 623644, "epoch": 7513} {"train_loss": -28.225961685180664, "global_step": 623645, "epoch": 7513} {"train_loss": -28.061054229736328, "global_step": 623646, "epoch": 7513} {"train_loss": -28.27657127380371, "global_step": 623647, "epoch": 7513} {"train_loss": -28.22637367248535, "global_step": 623648, "epoch": 7513} {"train_loss": -27.7509822845459, "global_step": 623649, "epoch": 7513} {"train_loss": -27.699010848999023, "global_step": 623650, "epoch": 7513} {"train_loss": -27.519575119018555, "global_step": 623651, "epoch": 7513} {"train_loss": -27.806472778320312, "global_step": 623652, "epoch": 7513} {"train_loss": -27.93409538269043, "global_step": 623653, "epoch": 7513} {"train_loss": -28.217575073242188, "global_step": 623654, "epoch": 7513} {"train_loss": -27.636219024658203, "global_step": 623655, "epoch": 7513} {"train_loss": -27.8259334564209, "global_step": 623656, "epoch": 7513} {"train_loss": -27.6507625579834, "global_step": 623657, "epoch": 7513} {"train_loss": -27.979995727539062, "global_step": 623658, "epoch": 7513} {"train_loss": -27.925800323486328, "global_step": 623659, "epoch": 7513} {"train_loss": -28.43867301940918, "global_step": 623660, "epoch": 7513} {"train_loss": -28.05444434751947, "global_step": 623661, "epoch": 7513, "val_loss": 6782543.0} {"train_loss": -26.29371452331543, "global_step": 623662, "epoch": 7514} {"train_loss": -26.360004425048828, "global_step": 623663, "epoch": 7514} {"train_loss": -27.059112548828125, "global_step": 623664, "epoch": 7514} {"train_loss": -26.52350425720215, "global_step": 623665, "epoch": 7514} {"train_loss": -25.64369773864746, "global_step": 623666, "epoch": 7514} {"train_loss": -27.18821144104004, "global_step": 623667, "epoch": 7514} {"train_loss": -26.653356552124023, "global_step": 623668, "epoch": 7514} {"train_loss": -27.127771377563477, "global_step": 623669, "epoch": 7514} {"train_loss": -26.952112197875977, "global_step": 623670, "epoch": 7514} {"train_loss": -26.1877498626709, "global_step": 623671, "epoch": 7514} {"train_loss": -27.06794548034668, "global_step": 623672, "epoch": 7514} {"train_loss": -26.506025314331055, "global_step": 623673, "epoch": 7514} {"train_loss": -27.183536529541016, "global_step": 623674, "epoch": 7514} {"train_loss": -27.235980987548828, "global_step": 623675, "epoch": 7514} {"train_loss": -27.304502487182617, "global_step": 623676, "epoch": 7514} {"train_loss": -27.36284828186035, "global_step": 623677, "epoch": 7514} {"train_loss": -27.362768173217773, "global_step": 623678, "epoch": 7514} {"train_loss": -27.267871856689453, "global_step": 623679, "epoch": 7514} {"train_loss": -27.43177604675293, "global_step": 623680, "epoch": 7514} {"train_loss": -27.543798446655273, "global_step": 623681, "epoch": 7514} {"train_loss": -27.425678253173828, "global_step": 623682, "epoch": 7514} {"train_loss": -27.62944984436035, "global_step": 623683, "epoch": 7514} {"train_loss": -27.341083526611328, "global_step": 623684, "epoch": 7514} {"train_loss": -27.469709396362305, "global_step": 623685, "epoch": 7514} {"train_loss": -27.680328369140625, "global_step": 623686, "epoch": 7514} {"train_loss": -27.84030532836914, "global_step": 623687, "epoch": 7514} {"train_loss": -27.901716232299805, "global_step": 623688, "epoch": 7514} {"train_loss": -28.177968978881836, "global_step": 623689, "epoch": 7514} {"train_loss": -27.576553344726562, "global_step": 623690, "epoch": 7514} {"train_loss": -27.41607666015625, "global_step": 623691, "epoch": 7514} {"train_loss": -27.736133575439453, "global_step": 623692, "epoch": 7514} {"train_loss": -27.844013214111328, "global_step": 623693, "epoch": 7514} {"train_loss": -28.034759521484375, "global_step": 623694, "epoch": 7514} {"train_loss": -27.688678741455078, "global_step": 623695, "epoch": 7514} {"train_loss": -27.995649337768555, "global_step": 623696, "epoch": 7514} {"train_loss": -28.227148056030273, "global_step": 623697, "epoch": 7514} {"train_loss": -28.1337947845459, "global_step": 623698, "epoch": 7514} {"train_loss": -28.06001091003418, "global_step": 623699, "epoch": 7514} {"train_loss": -28.025243759155273, "global_step": 623700, "epoch": 7514} {"train_loss": -28.371475219726562, "global_step": 623701, "epoch": 7514} {"train_loss": -28.05910301208496, "global_step": 623702, "epoch": 7514} {"train_loss": -27.9691162109375, "global_step": 623703, "epoch": 7514} {"train_loss": -27.80433464050293, "global_step": 623704, "epoch": 7514} {"train_loss": -27.94478416442871, "global_step": 623705, "epoch": 7514} {"train_loss": -28.10331153869629, "global_step": 623706, "epoch": 7514} {"train_loss": -28.120996475219727, "global_step": 623707, "epoch": 7514} {"train_loss": -27.953046798706055, "global_step": 623708, "epoch": 7514} {"train_loss": -27.928125381469727, "global_step": 623709, "epoch": 7514} {"train_loss": -27.867725372314453, "global_step": 623710, "epoch": 7514} {"train_loss": -28.16444206237793, "global_step": 623711, "epoch": 7514} {"train_loss": -28.5399112701416, "global_step": 623712, "epoch": 7514} {"train_loss": -28.065601348876953, "global_step": 623713, "epoch": 7514} {"train_loss": -28.046890258789062, "global_step": 623714, "epoch": 7514} {"train_loss": -28.71095085144043, "global_step": 623715, "epoch": 7514} {"train_loss": -28.336957931518555, "global_step": 623716, "epoch": 7514} {"train_loss": -28.197324752807617, "global_step": 623717, "epoch": 7514} {"train_loss": -28.473501205444336, "global_step": 623718, "epoch": 7514} {"train_loss": -27.97651481628418, "global_step": 623719, "epoch": 7514} {"train_loss": -28.08723258972168, "global_step": 623720, "epoch": 7514} {"train_loss": -28.106475830078125, "global_step": 623721, "epoch": 7514} {"train_loss": -28.5529842376709, "global_step": 623722, "epoch": 7514} {"train_loss": -27.79103660583496, "global_step": 623723, "epoch": 7514} {"train_loss": -28.129962921142578, "global_step": 623724, "epoch": 7514} {"train_loss": -28.428003311157227, "global_step": 623725, "epoch": 7514} {"train_loss": -28.238813400268555, "global_step": 623726, "epoch": 7514} {"train_loss": -28.357730865478516, "global_step": 623727, "epoch": 7514} {"train_loss": -28.335058212280273, "global_step": 623728, "epoch": 7514} {"train_loss": -28.118749618530273, "global_step": 623729, "epoch": 7514} {"train_loss": -27.837814331054688, "global_step": 623730, "epoch": 7514} {"train_loss": -28.107934951782227, "global_step": 623731, "epoch": 7514} {"train_loss": -28.236053466796875, "global_step": 623732, "epoch": 7514} {"train_loss": -28.13482093811035, "global_step": 623733, "epoch": 7514} {"train_loss": -28.128314971923828, "global_step": 623734, "epoch": 7514} {"train_loss": -28.54111671447754, "global_step": 623735, "epoch": 7514} {"train_loss": -27.7268009185791, "global_step": 623736, "epoch": 7514} {"train_loss": -28.250268936157227, "global_step": 623737, "epoch": 7514} {"train_loss": -28.232345581054688, "global_step": 623738, "epoch": 7514} {"train_loss": -28.40009880065918, "global_step": 623739, "epoch": 7514} {"train_loss": -28.24810791015625, "global_step": 623740, "epoch": 7514} {"train_loss": -28.228351593017578, "global_step": 623741, "epoch": 7514} {"train_loss": -28.077985763549805, "global_step": 623742, "epoch": 7514} {"train_loss": -28.48386001586914, "global_step": 623743, "epoch": 7514} {"train_loss": -27.791017670229255, "global_step": 623744, "epoch": 7514, "val_loss": 6793779.5} {"train_loss": -27.99016761779785, "global_step": 623745, "epoch": 7515} {"train_loss": -27.94117546081543, "global_step": 623746, "epoch": 7515} {"train_loss": -27.924116134643555, "global_step": 623747, "epoch": 7515} {"train_loss": -28.17264175415039, "global_step": 623748, "epoch": 7515} {"train_loss": -28.0631046295166, "global_step": 623749, "epoch": 7515} {"train_loss": -28.040136337280273, "global_step": 623750, "epoch": 7515} {"train_loss": -27.82100486755371, "global_step": 623751, "epoch": 7515} {"train_loss": -27.916357040405273, "global_step": 623752, "epoch": 7515} {"train_loss": -27.907373428344727, "global_step": 623753, "epoch": 7515} {"train_loss": -28.2336368560791, "global_step": 623754, "epoch": 7515} {"train_loss": -27.994632720947266, "global_step": 623755, "epoch": 7515} {"train_loss": -27.586822509765625, "global_step": 623756, "epoch": 7515} {"train_loss": -27.736968994140625, "global_step": 623757, "epoch": 7515} {"train_loss": -28.566877365112305, "global_step": 623758, "epoch": 7515} {"train_loss": -28.453845977783203, "global_step": 623759, "epoch": 7515} {"train_loss": -28.175397872924805, "global_step": 623760, "epoch": 7515} {"train_loss": -28.120868682861328, "global_step": 623761, "epoch": 7515} {"train_loss": -28.084869384765625, "global_step": 623762, "epoch": 7515} {"train_loss": -28.38079833984375, "global_step": 623763, "epoch": 7515} {"train_loss": -28.337265014648438, "global_step": 623764, "epoch": 7515} {"train_loss": -28.227924346923828, "global_step": 623765, "epoch": 7515} {"train_loss": -28.502384185791016, "global_step": 623766, "epoch": 7515} {"train_loss": -28.093915939331055, "global_step": 623767, "epoch": 7515} {"train_loss": -28.45391845703125, "global_step": 623768, "epoch": 7515} {"train_loss": -28.16595458984375, "global_step": 623769, "epoch": 7515} {"train_loss": -28.386829376220703, "global_step": 623770, "epoch": 7515} {"train_loss": -28.210325241088867, "global_step": 623771, "epoch": 7515} {"train_loss": -28.403121948242188, "global_step": 623772, "epoch": 7515} {"train_loss": -28.436511993408203, "global_step": 623773, "epoch": 7515} {"train_loss": -27.932880401611328, "global_step": 623774, "epoch": 7515} {"train_loss": -27.954065322875977, "global_step": 623775, "epoch": 7515} {"train_loss": -28.2978515625, "global_step": 623776, "epoch": 7515} {"train_loss": -28.1218318939209, "global_step": 623777, "epoch": 7515} {"train_loss": -28.42402458190918, "global_step": 623778, "epoch": 7515} {"train_loss": -28.09614372253418, "global_step": 623779, "epoch": 7515} {"train_loss": -28.134695053100586, "global_step": 623780, "epoch": 7515} {"train_loss": -28.249561309814453, "global_step": 623781, "epoch": 7515} {"train_loss": -28.006546020507812, "global_step": 623782, "epoch": 7515} {"train_loss": -28.358118057250977, "global_step": 623783, "epoch": 7515} {"train_loss": -28.23707389831543, "global_step": 623784, "epoch": 7515} {"train_loss": -28.156147003173828, "global_step": 623785, "epoch": 7515} {"train_loss": -28.1247501373291, "global_step": 623786, "epoch": 7515} {"train_loss": -27.878971099853516, "global_step": 623787, "epoch": 7515} {"train_loss": -28.31795310974121, "global_step": 623788, "epoch": 7515} {"train_loss": -28.0481014251709, "global_step": 623789, "epoch": 7515} {"train_loss": -28.172483444213867, "global_step": 623790, "epoch": 7515} {"train_loss": -28.02936363220215, "global_step": 623791, "epoch": 7515} {"train_loss": -28.206939697265625, "global_step": 623792, "epoch": 7515} {"train_loss": -28.500890731811523, "global_step": 623793, "epoch": 7515} {"train_loss": -28.05767250061035, "global_step": 623794, "epoch": 7515} {"train_loss": -28.238874435424805, "global_step": 623795, "epoch": 7515} {"train_loss": -27.768173217773438, "global_step": 623796, "epoch": 7515} {"train_loss": -28.232269287109375, "global_step": 623797, "epoch": 7515} {"train_loss": -28.068222045898438, "global_step": 623798, "epoch": 7515} {"train_loss": -28.062768936157227, "global_step": 623799, "epoch": 7515} {"train_loss": -28.12103271484375, "global_step": 623800, "epoch": 7515} {"train_loss": -28.2307071685791, "global_step": 623801, "epoch": 7515} {"train_loss": -28.29315185546875, "global_step": 623802, "epoch": 7515} {"train_loss": -28.634855270385742, "global_step": 623803, "epoch": 7515} {"train_loss": -28.332809448242188, "global_step": 623804, "epoch": 7515} {"train_loss": -28.11588478088379, "global_step": 623805, "epoch": 7515} {"train_loss": -28.189865112304688, "global_step": 623806, "epoch": 7515} {"train_loss": -27.9656925201416, "global_step": 623807, "epoch": 7515} {"train_loss": -28.12330436706543, "global_step": 623808, "epoch": 7515} {"train_loss": -28.14200210571289, "global_step": 623809, "epoch": 7515} {"train_loss": -28.004215240478516, "global_step": 623810, "epoch": 7515} {"train_loss": -27.847082138061523, "global_step": 623811, "epoch": 7515} {"train_loss": -28.357324600219727, "global_step": 623812, "epoch": 7515} {"train_loss": -28.258771896362305, "global_step": 623813, "epoch": 7515} {"train_loss": -28.247629165649414, "global_step": 623814, "epoch": 7515} {"train_loss": -28.049489974975586, "global_step": 623815, "epoch": 7515} {"train_loss": -27.864459991455078, "global_step": 623816, "epoch": 7515} {"train_loss": -28.446470260620117, "global_step": 623817, "epoch": 7515} {"train_loss": -28.213397979736328, "global_step": 623818, "epoch": 7515} {"train_loss": -28.032917022705078, "global_step": 623819, "epoch": 7515} {"train_loss": -28.174331665039062, "global_step": 623820, "epoch": 7515} {"train_loss": -28.246801376342773, "global_step": 623821, "epoch": 7515} {"train_loss": -28.465055465698242, "global_step": 623822, "epoch": 7515} {"train_loss": -28.441614151000977, "global_step": 623823, "epoch": 7515} {"train_loss": -28.639286041259766, "global_step": 623824, "epoch": 7515} {"train_loss": -28.0242977142334, "global_step": 623825, "epoch": 7515} {"train_loss": -28.4951114654541, "global_step": 623826, "epoch": 7515} {"train_loss": -28.15798610089773, "global_step": 623827, "epoch": 7515, "val_loss": 6657077.5} {"train_loss": -27.59214210510254, "global_step": 623828, "epoch": 7516} {"train_loss": -28.04665184020996, "global_step": 623829, "epoch": 7516} {"train_loss": -27.8560791015625, "global_step": 623830, "epoch": 7516} {"train_loss": -27.658689498901367, "global_step": 623831, "epoch": 7516} {"train_loss": -27.811880111694336, "global_step": 623832, "epoch": 7516} {"train_loss": -27.73762321472168, "global_step": 623833, "epoch": 7516} {"train_loss": -27.986703872680664, "global_step": 623834, "epoch": 7516} {"train_loss": -27.422016143798828, "global_step": 623835, "epoch": 7516} {"train_loss": -27.98528480529785, "global_step": 623836, "epoch": 7516} {"train_loss": -27.648168563842773, "global_step": 623837, "epoch": 7516} {"train_loss": -28.087570190429688, "global_step": 623838, "epoch": 7516} {"train_loss": -27.625152587890625, "global_step": 623839, "epoch": 7516} {"train_loss": -28.405475616455078, "global_step": 623840, "epoch": 7516} {"train_loss": -27.984329223632812, "global_step": 623841, "epoch": 7516} {"train_loss": -28.06661033630371, "global_step": 623842, "epoch": 7516} {"train_loss": -28.123464584350586, "global_step": 623843, "epoch": 7516} {"train_loss": -27.988861083984375, "global_step": 623844, "epoch": 7516} {"train_loss": -28.232202529907227, "global_step": 623845, "epoch": 7516} {"train_loss": -28.036001205444336, "global_step": 623846, "epoch": 7516} {"train_loss": -28.03127098083496, "global_step": 623847, "epoch": 7516} {"train_loss": -28.009763717651367, "global_step": 623848, "epoch": 7516} {"train_loss": -28.04949951171875, "global_step": 623849, "epoch": 7516} {"train_loss": -27.973642349243164, "global_step": 623850, "epoch": 7516} {"train_loss": -28.1772518157959, "global_step": 623851, "epoch": 7516} {"train_loss": -28.15117835998535, "global_step": 623852, "epoch": 7516} {"train_loss": -27.698389053344727, "global_step": 623853, "epoch": 7516} {"train_loss": -28.07451820373535, "global_step": 623854, "epoch": 7516} {"train_loss": -28.10205078125, "global_step": 623855, "epoch": 7516} {"train_loss": -28.353351593017578, "global_step": 623856, "epoch": 7516} {"train_loss": -28.018402099609375, "global_step": 623857, "epoch": 7516} {"train_loss": -27.74933433532715, "global_step": 623858, "epoch": 7516} {"train_loss": -27.85792350769043, "global_step": 623859, "epoch": 7516} {"train_loss": -28.465320587158203, "global_step": 623860, "epoch": 7516} {"train_loss": -28.20107078552246, "global_step": 623861, "epoch": 7516} {"train_loss": -28.377851486206055, "global_step": 623862, "epoch": 7516} {"train_loss": -28.664541244506836, "global_step": 623863, "epoch": 7516} {"train_loss": -28.1072998046875, "global_step": 623864, "epoch": 7516} {"train_loss": -27.725378036499023, "global_step": 623865, "epoch": 7516} {"train_loss": -28.08660316467285, "global_step": 623866, "epoch": 7516} {"train_loss": -28.417057037353516, "global_step": 623867, "epoch": 7516} {"train_loss": -28.06300163269043, "global_step": 623868, "epoch": 7516} {"train_loss": -28.236326217651367, "global_step": 623869, "epoch": 7516} {"train_loss": -28.188474655151367, "global_step": 623870, "epoch": 7516} {"train_loss": -28.432376861572266, "global_step": 623871, "epoch": 7516} {"train_loss": -28.23563003540039, "global_step": 623872, "epoch": 7516} {"train_loss": -28.3181095123291, "global_step": 623873, "epoch": 7516} {"train_loss": -28.119537353515625, "global_step": 623874, "epoch": 7516} {"train_loss": -28.223081588745117, "global_step": 623875, "epoch": 7516} {"train_loss": -28.37957763671875, "global_step": 623876, "epoch": 7516} {"train_loss": -28.013916015625, "global_step": 623877, "epoch": 7516} {"train_loss": -28.15081787109375, "global_step": 623878, "epoch": 7516} {"train_loss": -28.214319229125977, "global_step": 623879, "epoch": 7516} {"train_loss": -28.2623348236084, "global_step": 623880, "epoch": 7516} {"train_loss": -28.29510498046875, "global_step": 623881, "epoch": 7516} {"train_loss": -28.218225479125977, "global_step": 623882, "epoch": 7516} {"train_loss": -28.133411407470703, "global_step": 623883, "epoch": 7516} {"train_loss": -27.584802627563477, "global_step": 623884, "epoch": 7516} {"train_loss": -27.24770164489746, "global_step": 623885, "epoch": 7516} {"train_loss": -27.56056022644043, "global_step": 623886, "epoch": 7516} {"train_loss": -27.889036178588867, "global_step": 623887, "epoch": 7516} {"train_loss": -28.195287704467773, "global_step": 623888, "epoch": 7516} {"train_loss": -28.11332130432129, "global_step": 623889, "epoch": 7516} {"train_loss": -28.660959243774414, "global_step": 623890, "epoch": 7516} {"train_loss": -28.24175453186035, "global_step": 623891, "epoch": 7516} {"train_loss": -27.5019588470459, "global_step": 623892, "epoch": 7516} {"train_loss": -28.38496208190918, "global_step": 623893, "epoch": 7516} {"train_loss": -27.7932071685791, "global_step": 623894, "epoch": 7516} {"train_loss": -27.87236976623535, "global_step": 623895, "epoch": 7516} {"train_loss": -27.973730087280273, "global_step": 623896, "epoch": 7516} {"train_loss": -27.896228790283203, "global_step": 623897, "epoch": 7516} {"train_loss": -27.829761505126953, "global_step": 623898, "epoch": 7516} {"train_loss": -27.383106231689453, "global_step": 623899, "epoch": 7516} {"train_loss": -28.298969268798828, "global_step": 623900, "epoch": 7516} {"train_loss": -27.453231811523438, "global_step": 623901, "epoch": 7516} {"train_loss": -27.600698471069336, "global_step": 623902, "epoch": 7516} {"train_loss": -28.30598258972168, "global_step": 623903, "epoch": 7516} {"train_loss": -28.19830322265625, "global_step": 623904, "epoch": 7516} {"train_loss": -27.95223045349121, "global_step": 623905, "epoch": 7516} {"train_loss": -28.66169548034668, "global_step": 623906, "epoch": 7516} {"train_loss": -27.900726318359375, "global_step": 623907, "epoch": 7516} {"train_loss": -28.578638076782227, "global_step": 623908, "epoch": 7516} {"train_loss": -28.133146286010742, "global_step": 623909, "epoch": 7516} {"train_loss": -28.048762654683674, "global_step": 623910, "epoch": 7516, "val_loss": 6673017.0} {"train_loss": -27.952911376953125, "global_step": 623911, "epoch": 7517} {"train_loss": -27.20501136779785, "global_step": 623912, "epoch": 7517} {"train_loss": -26.961355209350586, "global_step": 623913, "epoch": 7517} {"train_loss": -27.06342124938965, "global_step": 623914, "epoch": 7517} {"train_loss": -27.836933135986328, "global_step": 623915, "epoch": 7517} {"train_loss": -27.898038864135742, "global_step": 623916, "epoch": 7517} {"train_loss": -27.42266845703125, "global_step": 623917, "epoch": 7517} {"train_loss": -27.754898071289062, "global_step": 623918, "epoch": 7517} {"train_loss": -27.922468185424805, "global_step": 623919, "epoch": 7517} {"train_loss": -27.23248863220215, "global_step": 623920, "epoch": 7517} {"train_loss": -27.785486221313477, "global_step": 623921, "epoch": 7517} {"train_loss": -27.649717330932617, "global_step": 623922, "epoch": 7517} {"train_loss": -27.62188148498535, "global_step": 623923, "epoch": 7517} {"train_loss": -28.323444366455078, "global_step": 623924, "epoch": 7517} {"train_loss": -28.02117347717285, "global_step": 623925, "epoch": 7517} {"train_loss": -27.799768447875977, "global_step": 623926, "epoch": 7517} {"train_loss": -27.66182518005371, "global_step": 623927, "epoch": 7517} {"train_loss": -27.750370025634766, "global_step": 623928, "epoch": 7517} {"train_loss": -28.30637550354004, "global_step": 623929, "epoch": 7517} {"train_loss": -27.781909942626953, "global_step": 623930, "epoch": 7517} {"train_loss": -28.091039657592773, "global_step": 623931, "epoch": 7517} {"train_loss": -28.22319984436035, "global_step": 623932, "epoch": 7517} {"train_loss": -28.591861724853516, "global_step": 623933, "epoch": 7517} {"train_loss": -27.98919105529785, "global_step": 623934, "epoch": 7517} {"train_loss": -28.482227325439453, "global_step": 623935, "epoch": 7517} {"train_loss": -28.253875732421875, "global_step": 623936, "epoch": 7517} {"train_loss": -28.131000518798828, "global_step": 623937, "epoch": 7517} {"train_loss": -28.520309448242188, "global_step": 623938, "epoch": 7517} {"train_loss": -28.196035385131836, "global_step": 623939, "epoch": 7517} {"train_loss": -27.866714477539062, "global_step": 623940, "epoch": 7517} {"train_loss": -28.527509689331055, "global_step": 623941, "epoch": 7517} {"train_loss": -28.339399337768555, "global_step": 623942, "epoch": 7517} {"train_loss": -28.080060958862305, "global_step": 623943, "epoch": 7517} {"train_loss": -27.82501792907715, "global_step": 623944, "epoch": 7517} {"train_loss": -28.339111328125, "global_step": 623945, "epoch": 7517} {"train_loss": -28.544300079345703, "global_step": 623946, "epoch": 7517} {"train_loss": -27.81806755065918, "global_step": 623947, "epoch": 7517} {"train_loss": -28.18804931640625, "global_step": 623948, "epoch": 7517} {"train_loss": -28.04017448425293, "global_step": 623949, "epoch": 7517} {"train_loss": -28.440845489501953, "global_step": 623950, "epoch": 7517} {"train_loss": -28.257150650024414, "global_step": 623951, "epoch": 7517} {"train_loss": -28.040693283081055, "global_step": 623952, "epoch": 7517} {"train_loss": -28.16983413696289, "global_step": 623953, "epoch": 7517} {"train_loss": -28.593952178955078, "global_step": 623954, "epoch": 7517} {"train_loss": -28.439716339111328, "global_step": 623955, "epoch": 7517} {"train_loss": -28.1806697845459, "global_step": 623956, "epoch": 7517} {"train_loss": -28.227920532226562, "global_step": 623957, "epoch": 7517} {"train_loss": -27.783679962158203, "global_step": 623958, "epoch": 7517} {"train_loss": -27.915592193603516, "global_step": 623959, "epoch": 7517} {"train_loss": -28.5314998626709, "global_step": 623960, "epoch": 7517} {"train_loss": -28.184412002563477, "global_step": 623961, "epoch": 7517} {"train_loss": -27.5079288482666, "global_step": 623962, "epoch": 7517} {"train_loss": -28.28482437133789, "global_step": 623963, "epoch": 7517} {"train_loss": -27.933746337890625, "global_step": 623964, "epoch": 7517} {"train_loss": -28.02947425842285, "global_step": 623965, "epoch": 7517} {"train_loss": -28.242542266845703, "global_step": 623966, "epoch": 7517} {"train_loss": -27.770910263061523, "global_step": 623967, "epoch": 7517} {"train_loss": -27.858983993530273, "global_step": 623968, "epoch": 7517} {"train_loss": -28.037973403930664, "global_step": 623969, "epoch": 7517} {"train_loss": -27.507482528686523, "global_step": 623970, "epoch": 7517} {"train_loss": -28.031070709228516, "global_step": 623971, "epoch": 7517} {"train_loss": -27.862585067749023, "global_step": 623972, "epoch": 7517} {"train_loss": -28.07818603515625, "global_step": 623973, "epoch": 7517} {"train_loss": -28.05234146118164, "global_step": 623974, "epoch": 7517} {"train_loss": -28.319814682006836, "global_step": 623975, "epoch": 7517} {"train_loss": -28.33326530456543, "global_step": 623976, "epoch": 7517} {"train_loss": -28.30377769470215, "global_step": 623977, "epoch": 7517} {"train_loss": -27.97930335998535, "global_step": 623978, "epoch": 7517} {"train_loss": -28.276660919189453, "global_step": 623979, "epoch": 7517} {"train_loss": -28.25286293029785, "global_step": 623980, "epoch": 7517} {"train_loss": -28.1176815032959, "global_step": 623981, "epoch": 7517} {"train_loss": -28.127866744995117, "global_step": 623982, "epoch": 7517} {"train_loss": -27.58747673034668, "global_step": 623983, "epoch": 7517} {"train_loss": -28.24027442932129, "global_step": 623984, "epoch": 7517} {"train_loss": -28.191059112548828, "global_step": 623985, "epoch": 7517} {"train_loss": -28.428083419799805, "global_step": 623986, "epoch": 7517} {"train_loss": -28.0168399810791, "global_step": 623987, "epoch": 7517} {"train_loss": -28.050405502319336, "global_step": 623988, "epoch": 7517} {"train_loss": -28.133203506469727, "global_step": 623989, "epoch": 7517} {"train_loss": -28.129159927368164, "global_step": 623990, "epoch": 7517} {"train_loss": -27.977081298828125, "global_step": 623991, "epoch": 7517} {"train_loss": -27.98208999633789, "global_step": 623992, "epoch": 7517} {"train_loss": -28.022116304880164, "global_step": 623993, "epoch": 7517, "val_loss": 6745502.5} {"train_loss": -27.263263702392578, "global_step": 623994, "epoch": 7518} {"train_loss": -27.62762451171875, "global_step": 623995, "epoch": 7518} {"train_loss": -26.662521362304688, "global_step": 623996, "epoch": 7518} {"train_loss": -27.035354614257812, "global_step": 623997, "epoch": 7518} {"train_loss": -27.2216796875, "global_step": 623998, "epoch": 7518} {"train_loss": -26.949752807617188, "global_step": 623999, "epoch": 7518} {"train_loss": -26.566434860229492, "global_step": 624000, "epoch": 7518} {"train_loss": -27.39105796813965, "global_step": 624001, "epoch": 7518} {"train_loss": -27.109119415283203, "global_step": 624002, "epoch": 7518} {"train_loss": -26.727880477905273, "global_step": 624003, "epoch": 7518} {"train_loss": -26.951339721679688, "global_step": 624004, "epoch": 7518} {"train_loss": -27.562170028686523, "global_step": 624005, "epoch": 7518} {"train_loss": -27.468246459960938, "global_step": 624006, "epoch": 7518} {"train_loss": -27.18084716796875, "global_step": 624007, "epoch": 7518} {"train_loss": -27.40488624572754, "global_step": 624008, "epoch": 7518} {"train_loss": -27.514373779296875, "global_step": 624009, "epoch": 7518} {"train_loss": -27.556961059570312, "global_step": 624010, "epoch": 7518} {"train_loss": -27.34678077697754, "global_step": 624011, "epoch": 7518} {"train_loss": -27.94843101501465, "global_step": 624012, "epoch": 7518} {"train_loss": -27.91977310180664, "global_step": 624013, "epoch": 7518} {"train_loss": -28.079389572143555, "global_step": 624014, "epoch": 7518} {"train_loss": -28.083181381225586, "global_step": 624015, "epoch": 7518} {"train_loss": -27.470840454101562, "global_step": 624016, "epoch": 7518} {"train_loss": -27.990232467651367, "global_step": 624017, "epoch": 7518} {"train_loss": -27.843658447265625, "global_step": 624018, "epoch": 7518} {"train_loss": -27.87018394470215, "global_step": 624019, "epoch": 7518} {"train_loss": -28.31315040588379, "global_step": 624020, "epoch": 7518} {"train_loss": -28.007587432861328, "global_step": 624021, "epoch": 7518} {"train_loss": -28.115087509155273, "global_step": 624022, "epoch": 7518} {"train_loss": -27.89375877380371, "global_step": 624023, "epoch": 7518} {"train_loss": -27.84521484375, "global_step": 624024, "epoch": 7518} {"train_loss": -28.165924072265625, "global_step": 624025, "epoch": 7518} {"train_loss": -28.071836471557617, "global_step": 624026, "epoch": 7518} {"train_loss": -28.011077880859375, "global_step": 624027, "epoch": 7518} {"train_loss": -28.03058433532715, "global_step": 624028, "epoch": 7518} {"train_loss": -28.2167911529541, "global_step": 624029, "epoch": 7518} {"train_loss": -28.188695907592773, "global_step": 624030, "epoch": 7518} {"train_loss": -27.958044052124023, "global_step": 624031, "epoch": 7518} {"train_loss": -28.229475021362305, "global_step": 624032, "epoch": 7518} {"train_loss": -28.2630558013916, "global_step": 624033, "epoch": 7518} {"train_loss": -28.237524032592773, "global_step": 624034, "epoch": 7518} {"train_loss": -28.179285049438477, "global_step": 624035, "epoch": 7518} {"train_loss": -28.024662017822266, "global_step": 624036, "epoch": 7518} {"train_loss": -28.253889083862305, "global_step": 624037, "epoch": 7518} {"train_loss": -27.927631378173828, "global_step": 624038, "epoch": 7518} {"train_loss": -27.992523193359375, "global_step": 624039, "epoch": 7518} {"train_loss": -28.352197647094727, "global_step": 624040, "epoch": 7518} {"train_loss": -28.01215171813965, "global_step": 624041, "epoch": 7518} {"train_loss": -28.125411987304688, "global_step": 624042, "epoch": 7518} {"train_loss": -28.2656307220459, "global_step": 624043, "epoch": 7518} {"train_loss": -28.57291603088379, "global_step": 624044, "epoch": 7518} {"train_loss": -28.288440704345703, "global_step": 624045, "epoch": 7518} {"train_loss": -28.249380111694336, "global_step": 624046, "epoch": 7518} {"train_loss": -28.196624755859375, "global_step": 624047, "epoch": 7518} {"train_loss": -28.438940048217773, "global_step": 624048, "epoch": 7518} {"train_loss": -28.490070343017578, "global_step": 624049, "epoch": 7518} {"train_loss": -28.47487449645996, "global_step": 624050, "epoch": 7518} {"train_loss": -28.276962280273438, "global_step": 624051, "epoch": 7518} {"train_loss": -28.5357723236084, "global_step": 624052, "epoch": 7518} {"train_loss": -28.538299560546875, "global_step": 624053, "epoch": 7518} {"train_loss": -28.043554306030273, "global_step": 624054, "epoch": 7518} {"train_loss": -28.046537399291992, "global_step": 624055, "epoch": 7518} {"train_loss": -28.059080123901367, "global_step": 624056, "epoch": 7518} {"train_loss": -28.033447265625, "global_step": 624057, "epoch": 7518} {"train_loss": -27.949085235595703, "global_step": 624058, "epoch": 7518} {"train_loss": -28.29416847229004, "global_step": 624059, "epoch": 7518} {"train_loss": -28.071638107299805, "global_step": 624060, "epoch": 7518} {"train_loss": -28.02326011657715, "global_step": 624061, "epoch": 7518} {"train_loss": -28.003559112548828, "global_step": 624062, "epoch": 7518} {"train_loss": -28.106006622314453, "global_step": 624063, "epoch": 7518} {"train_loss": -27.880346298217773, "global_step": 624064, "epoch": 7518} {"train_loss": -28.039960861206055, "global_step": 624065, "epoch": 7518} {"train_loss": -27.795520782470703, "global_step": 624066, "epoch": 7518} {"train_loss": -28.152271270751953, "global_step": 624067, "epoch": 7518} {"train_loss": -28.1995849609375, "global_step": 624068, "epoch": 7518} {"train_loss": -27.970441818237305, "global_step": 624069, "epoch": 7518} {"train_loss": -28.228015899658203, "global_step": 624070, "epoch": 7518} {"train_loss": -28.713308334350586, "global_step": 624071, "epoch": 7518} {"train_loss": -28.420866012573242, "global_step": 624072, "epoch": 7518} {"train_loss": -28.131591796875, "global_step": 624073, "epoch": 7518} {"train_loss": -28.142059326171875, "global_step": 624074, "epoch": 7518} {"train_loss": -27.86469078063965, "global_step": 624075, "epoch": 7518} {"train_loss": -27.946059790002295, "global_step": 624076, "epoch": 7518, "val_loss": 6703406.0} {"train_loss": -27.1660213470459, "global_step": 624077, "epoch": 7519} {"train_loss": -27.67400550842285, "global_step": 624078, "epoch": 7519} {"train_loss": -27.195114135742188, "global_step": 624079, "epoch": 7519} {"train_loss": -27.65606117248535, "global_step": 624080, "epoch": 7519} {"train_loss": -27.738067626953125, "global_step": 624081, "epoch": 7519} {"train_loss": -27.296682357788086, "global_step": 624082, "epoch": 7519} {"train_loss": -27.257953643798828, "global_step": 624083, "epoch": 7519} {"train_loss": -27.67997169494629, "global_step": 624084, "epoch": 7519} {"train_loss": -27.659467697143555, "global_step": 624085, "epoch": 7519} {"train_loss": -27.27777671813965, "global_step": 624086, "epoch": 7519} {"train_loss": -27.819427490234375, "global_step": 624087, "epoch": 7519} {"train_loss": -27.753995895385742, "global_step": 624088, "epoch": 7519} {"train_loss": -27.64697265625, "global_step": 624089, "epoch": 7519} {"train_loss": -27.609119415283203, "global_step": 624090, "epoch": 7519} {"train_loss": -27.360692977905273, "global_step": 624091, "epoch": 7519} {"train_loss": -27.879682540893555, "global_step": 624092, "epoch": 7519} {"train_loss": -27.780960083007812, "global_step": 624093, "epoch": 7519} {"train_loss": -27.395654678344727, "global_step": 624094, "epoch": 7519} {"train_loss": -27.599979400634766, "global_step": 624095, "epoch": 7519} {"train_loss": -27.807525634765625, "global_step": 624096, "epoch": 7519} {"train_loss": -28.031757354736328, "global_step": 624097, "epoch": 7519} {"train_loss": -27.708288192749023, "global_step": 624098, "epoch": 7519} {"train_loss": -27.56207847595215, "global_step": 624099, "epoch": 7519} {"train_loss": -27.705707550048828, "global_step": 624100, "epoch": 7519} {"train_loss": -28.054752349853516, "global_step": 624101, "epoch": 7519} {"train_loss": -27.868499755859375, "global_step": 624102, "epoch": 7519} {"train_loss": -27.864286422729492, "global_step": 624103, "epoch": 7519} {"train_loss": -28.2994384765625, "global_step": 624104, "epoch": 7519} {"train_loss": -28.2139949798584, "global_step": 624105, "epoch": 7519} {"train_loss": -28.278757095336914, "global_step": 624106, "epoch": 7519} {"train_loss": -27.996795654296875, "global_step": 624107, "epoch": 7519} {"train_loss": -28.0870418548584, "global_step": 624108, "epoch": 7519} {"train_loss": -27.9000244140625, "global_step": 624109, "epoch": 7519} {"train_loss": -28.249847412109375, "global_step": 624110, "epoch": 7519} {"train_loss": -27.92057228088379, "global_step": 624111, "epoch": 7519} {"train_loss": -28.487730026245117, "global_step": 624112, "epoch": 7519} {"train_loss": -27.990009307861328, "global_step": 624113, "epoch": 7519} {"train_loss": -28.518634796142578, "global_step": 624114, "epoch": 7519} {"train_loss": -28.049091339111328, "global_step": 624115, "epoch": 7519} {"train_loss": -28.245458602905273, "global_step": 624116, "epoch": 7519} {"train_loss": -28.48728370666504, "global_step": 624117, "epoch": 7519} {"train_loss": -27.972782135009766, "global_step": 624118, "epoch": 7519} {"train_loss": -28.005844116210938, "global_step": 624119, "epoch": 7519} {"train_loss": -28.097198486328125, "global_step": 624120, "epoch": 7519} {"train_loss": -28.5435848236084, "global_step": 624121, "epoch": 7519} {"train_loss": -28.124277114868164, "global_step": 624122, "epoch": 7519} {"train_loss": -28.432392120361328, "global_step": 624123, "epoch": 7519} {"train_loss": -28.44390869140625, "global_step": 624124, "epoch": 7519} {"train_loss": -28.518930435180664, "global_step": 624125, "epoch": 7519} {"train_loss": -28.5517635345459, "global_step": 624126, "epoch": 7519} {"train_loss": -28.37405776977539, "global_step": 624127, "epoch": 7519} {"train_loss": -28.002553939819336, "global_step": 624128, "epoch": 7519} {"train_loss": -28.3403377532959, "global_step": 624129, "epoch": 7519} {"train_loss": -28.2804012298584, "global_step": 624130, "epoch": 7519} {"train_loss": -28.2979736328125, "global_step": 624131, "epoch": 7519} {"train_loss": -28.144134521484375, "global_step": 624132, "epoch": 7519} {"train_loss": -27.642333984375, "global_step": 624133, "epoch": 7519} {"train_loss": -27.43159294128418, "global_step": 624134, "epoch": 7519} {"train_loss": -27.03334617614746, "global_step": 624135, "epoch": 7519} {"train_loss": -27.3659610748291, "global_step": 624136, "epoch": 7519} {"train_loss": -27.880325317382812, "global_step": 624137, "epoch": 7519} {"train_loss": -27.344900131225586, "global_step": 624138, "epoch": 7519} {"train_loss": -27.236072540283203, "global_step": 624139, "epoch": 7519} {"train_loss": -27.6180419921875, "global_step": 624140, "epoch": 7519} {"train_loss": -27.34921646118164, "global_step": 624141, "epoch": 7519} {"train_loss": -27.728723526000977, "global_step": 624142, "epoch": 7519} {"train_loss": -27.739892959594727, "global_step": 624143, "epoch": 7519} {"train_loss": -27.335407257080078, "global_step": 624144, "epoch": 7519} {"train_loss": -27.998056411743164, "global_step": 624145, "epoch": 7519} {"train_loss": -27.649169921875, "global_step": 624146, "epoch": 7519} {"train_loss": -27.231525421142578, "global_step": 624147, "epoch": 7519} {"train_loss": -27.48262596130371, "global_step": 624148, "epoch": 7519} {"train_loss": -27.832794189453125, "global_step": 624149, "epoch": 7519} {"train_loss": -28.126117706298828, "global_step": 624150, "epoch": 7519} {"train_loss": -27.320947647094727, "global_step": 624151, "epoch": 7519} {"train_loss": -27.771142959594727, "global_step": 624152, "epoch": 7519} {"train_loss": -27.89008903503418, "global_step": 624153, "epoch": 7519} {"train_loss": -28.067707061767578, "global_step": 624154, "epoch": 7519} {"train_loss": -27.99727439880371, "global_step": 624155, "epoch": 7519} {"train_loss": -27.56879997253418, "global_step": 624156, "epoch": 7519} {"train_loss": -28.393524169921875, "global_step": 624157, "epoch": 7519} {"train_loss": -27.995594024658203, "global_step": 624158, "epoch": 7519} {"train_loss": -27.857261496854115, "global_step": 624159, "epoch": 7519, "val_loss": 6717390.5} {"train_loss": -26.864227294921875, "global_step": 624160, "epoch": 7520} {"train_loss": -26.129932403564453, "global_step": 624161, "epoch": 7520} {"train_loss": -27.541067123413086, "global_step": 624162, "epoch": 7520} {"train_loss": -27.232004165649414, "global_step": 624163, "epoch": 7520} {"train_loss": -27.353559494018555, "global_step": 624164, "epoch": 7520} {"train_loss": -27.045560836791992, "global_step": 624165, "epoch": 7520} {"train_loss": -27.12505531311035, "global_step": 624166, "epoch": 7520} {"train_loss": -27.719953536987305, "global_step": 624167, "epoch": 7520} {"train_loss": -27.6989803314209, "global_step": 624168, "epoch": 7520} {"train_loss": -27.498620986938477, "global_step": 624169, "epoch": 7520} {"train_loss": -27.295743942260742, "global_step": 624170, "epoch": 7520} {"train_loss": -27.598852157592773, "global_step": 624171, "epoch": 7520} {"train_loss": -27.768329620361328, "global_step": 624172, "epoch": 7520} {"train_loss": -27.9193115234375, "global_step": 624173, "epoch": 7520} {"train_loss": -27.627676010131836, "global_step": 624174, "epoch": 7520} {"train_loss": -27.54471206665039, "global_step": 624175, "epoch": 7520} {"train_loss": -27.80292320251465, "global_step": 624176, "epoch": 7520} {"train_loss": -27.943944931030273, "global_step": 624177, "epoch": 7520} {"train_loss": -27.895788192749023, "global_step": 624178, "epoch": 7520} {"train_loss": -27.986539840698242, "global_step": 624179, "epoch": 7520} {"train_loss": -27.901098251342773, "global_step": 624180, "epoch": 7520} {"train_loss": -27.98859977722168, "global_step": 624181, "epoch": 7520} {"train_loss": -28.032821655273438, "global_step": 624182, "epoch": 7520} {"train_loss": -28.036218643188477, "global_step": 624183, "epoch": 7520} {"train_loss": -27.931049346923828, "global_step": 624184, "epoch": 7520} {"train_loss": -27.953628540039062, "global_step": 624185, "epoch": 7520} {"train_loss": -28.188138961791992, "global_step": 624186, "epoch": 7520} {"train_loss": -27.92458152770996, "global_step": 624187, "epoch": 7520} {"train_loss": -28.22066307067871, "global_step": 624188, "epoch": 7520} {"train_loss": -28.378955841064453, "global_step": 624189, "epoch": 7520} {"train_loss": -28.131732940673828, "global_step": 624190, "epoch": 7520} {"train_loss": -28.3471736907959, "global_step": 624191, "epoch": 7520} {"train_loss": -28.1527156829834, "global_step": 624192, "epoch": 7520} {"train_loss": -28.634016036987305, "global_step": 624193, "epoch": 7520} {"train_loss": -27.88294792175293, "global_step": 624194, "epoch": 7520} {"train_loss": -28.36280632019043, "global_step": 624195, "epoch": 7520} {"train_loss": -27.77273941040039, "global_step": 624196, "epoch": 7520} {"train_loss": -28.276472091674805, "global_step": 624197, "epoch": 7520} {"train_loss": -28.207427978515625, "global_step": 624198, "epoch": 7520} {"train_loss": -28.359830856323242, "global_step": 624199, "epoch": 7520} {"train_loss": -28.665395736694336, "global_step": 624200, "epoch": 7520} {"train_loss": -28.09578514099121, "global_step": 624201, "epoch": 7520} {"train_loss": -27.7489013671875, "global_step": 624202, "epoch": 7520} {"train_loss": -28.331684112548828, "global_step": 624203, "epoch": 7520} {"train_loss": -28.100040435791016, "global_step": 624204, "epoch": 7520} {"train_loss": -28.2252140045166, "global_step": 624205, "epoch": 7520} {"train_loss": -28.469928741455078, "global_step": 624206, "epoch": 7520} {"train_loss": -28.203603744506836, "global_step": 624207, "epoch": 7520} {"train_loss": -28.108068466186523, "global_step": 624208, "epoch": 7520} {"train_loss": -28.476001739501953, "global_step": 624209, "epoch": 7520} {"train_loss": -28.629318237304688, "global_step": 624210, "epoch": 7520} {"train_loss": -28.65254020690918, "global_step": 624211, "epoch": 7520} {"train_loss": -28.520751953125, "global_step": 624212, "epoch": 7520} {"train_loss": -28.321033477783203, "global_step": 624213, "epoch": 7520} {"train_loss": -27.639083862304688, "global_step": 624214, "epoch": 7520} {"train_loss": -28.182392120361328, "global_step": 624215, "epoch": 7520} {"train_loss": -28.2586612701416, "global_step": 624216, "epoch": 7520} {"train_loss": -28.35343360900879, "global_step": 624217, "epoch": 7520} {"train_loss": -28.15435791015625, "global_step": 624218, "epoch": 7520} {"train_loss": -28.35027503967285, "global_step": 624219, "epoch": 7520} {"train_loss": -28.163349151611328, "global_step": 624220, "epoch": 7520} {"train_loss": -28.546279907226562, "global_step": 624221, "epoch": 7520} {"train_loss": -28.25360107421875, "global_step": 624222, "epoch": 7520} {"train_loss": -28.362024307250977, "global_step": 624223, "epoch": 7520} {"train_loss": -28.420644760131836, "global_step": 624224, "epoch": 7520} {"train_loss": -28.43776512145996, "global_step": 624225, "epoch": 7520} {"train_loss": -28.217945098876953, "global_step": 624226, "epoch": 7520} {"train_loss": -28.471593856811523, "global_step": 624227, "epoch": 7520} {"train_loss": -28.63618278503418, "global_step": 624228, "epoch": 7520} {"train_loss": -28.14410972595215, "global_step": 624229, "epoch": 7520} {"train_loss": -27.776647567749023, "global_step": 624230, "epoch": 7520} {"train_loss": -27.586639404296875, "global_step": 624231, "epoch": 7520} {"train_loss": -27.92999267578125, "global_step": 624232, "epoch": 7520} {"train_loss": -28.007953643798828, "global_step": 624233, "epoch": 7520} {"train_loss": -27.405725479125977, "global_step": 624234, "epoch": 7520} {"train_loss": -27.561452865600586, "global_step": 624235, "epoch": 7520} {"train_loss": -28.154010772705078, "global_step": 624236, "epoch": 7520} {"train_loss": -28.134296417236328, "global_step": 624237, "epoch": 7520} {"train_loss": -28.1086368560791, "global_step": 624238, "epoch": 7520} {"train_loss": -27.957508087158203, "global_step": 624239, "epoch": 7520} {"train_loss": -28.429443359375, "global_step": 624240, "epoch": 7520} {"train_loss": -28.325769424438477, "global_step": 624241, "epoch": 7520} {"train_loss": -28.01817151724574, "global_step": 624242, "epoch": 7520, "val_loss": 6722158.0} {"train_loss": -24.45875358581543, "global_step": 624243, "epoch": 7521} {"train_loss": -26.711170196533203, "global_step": 624244, "epoch": 7521} {"train_loss": -25.157495498657227, "global_step": 624245, "epoch": 7521} {"train_loss": -27.222150802612305, "global_step": 624246, "epoch": 7521} {"train_loss": -26.4477481842041, "global_step": 624247, "epoch": 7521} {"train_loss": -26.169219970703125, "global_step": 624248, "epoch": 7521} {"train_loss": -26.682483673095703, "global_step": 624249, "epoch": 7521} {"train_loss": -26.906782150268555, "global_step": 624250, "epoch": 7521} {"train_loss": -26.83145523071289, "global_step": 624251, "epoch": 7521} {"train_loss": -27.144561767578125, "global_step": 624252, "epoch": 7521} {"train_loss": -27.71719741821289, "global_step": 624253, "epoch": 7521} {"train_loss": -26.942432403564453, "global_step": 624254, "epoch": 7521} {"train_loss": -27.262388229370117, "global_step": 624255, "epoch": 7521} {"train_loss": -27.063861846923828, "global_step": 624256, "epoch": 7521} {"train_loss": -27.943754196166992, "global_step": 624257, "epoch": 7521} {"train_loss": -27.28505516052246, "global_step": 624258, "epoch": 7521} {"train_loss": -27.08013343811035, "global_step": 624259, "epoch": 7521} {"train_loss": -27.588354110717773, "global_step": 624260, "epoch": 7521} {"train_loss": -27.433258056640625, "global_step": 624261, "epoch": 7521} {"train_loss": -27.773818969726562, "global_step": 624262, "epoch": 7521} {"train_loss": -27.203052520751953, "global_step": 624263, "epoch": 7521} {"train_loss": -27.322141647338867, "global_step": 624264, "epoch": 7521} {"train_loss": -27.592090606689453, "global_step": 624265, "epoch": 7521} {"train_loss": -27.845722198486328, "global_step": 624266, "epoch": 7521} {"train_loss": -27.49136734008789, "global_step": 624267, "epoch": 7521} {"train_loss": -27.62989616394043, "global_step": 624268, "epoch": 7521} {"train_loss": -27.811044692993164, "global_step": 624269, "epoch": 7521} {"train_loss": -27.76226806640625, "global_step": 624270, "epoch": 7521} {"train_loss": -27.878149032592773, "global_step": 624271, "epoch": 7521} {"train_loss": -27.83928871154785, "global_step": 624272, "epoch": 7521} {"train_loss": -27.893421173095703, "global_step": 624273, "epoch": 7521} {"train_loss": -27.417144775390625, "global_step": 624274, "epoch": 7521} {"train_loss": -28.24362564086914, "global_step": 624275, "epoch": 7521} {"train_loss": -27.99690055847168, "global_step": 624276, "epoch": 7521} {"train_loss": -27.8692626953125, "global_step": 624277, "epoch": 7521} {"train_loss": -28.324462890625, "global_step": 624278, "epoch": 7521} {"train_loss": -28.390380859375, "global_step": 624279, "epoch": 7521} {"train_loss": -27.915069580078125, "global_step": 624280, "epoch": 7521} {"train_loss": -28.32197380065918, "global_step": 624281, "epoch": 7521} {"train_loss": -28.04058837890625, "global_step": 624282, "epoch": 7521} {"train_loss": -28.1928768157959, "global_step": 624283, "epoch": 7521} {"train_loss": -28.07551383972168, "global_step": 624284, "epoch": 7521} {"train_loss": -28.078088760375977, "global_step": 624285, "epoch": 7521} {"train_loss": -28.25422477722168, "global_step": 624286, "epoch": 7521} {"train_loss": -28.229841232299805, "global_step": 624287, "epoch": 7521} {"train_loss": -28.27906608581543, "global_step": 624288, "epoch": 7521} {"train_loss": -28.283954620361328, "global_step": 624289, "epoch": 7521} {"train_loss": -28.181543350219727, "global_step": 624290, "epoch": 7521} {"train_loss": -28.374475479125977, "global_step": 624291, "epoch": 7521} {"train_loss": -28.24481773376465, "global_step": 624292, "epoch": 7521} {"train_loss": -28.202035903930664, "global_step": 624293, "epoch": 7521} {"train_loss": -28.260883331298828, "global_step": 624294, "epoch": 7521} {"train_loss": -27.8584041595459, "global_step": 624295, "epoch": 7521} {"train_loss": -28.5670223236084, "global_step": 624296, "epoch": 7521} {"train_loss": -28.201757431030273, "global_step": 624297, "epoch": 7521} {"train_loss": -28.246337890625, "global_step": 624298, "epoch": 7521} {"train_loss": -28.55889320373535, "global_step": 624299, "epoch": 7521} {"train_loss": -28.400754928588867, "global_step": 624300, "epoch": 7521} {"train_loss": -28.264150619506836, "global_step": 624301, "epoch": 7521} {"train_loss": -28.690235137939453, "global_step": 624302, "epoch": 7521} {"train_loss": -28.285429000854492, "global_step": 624303, "epoch": 7521} {"train_loss": -28.07568359375, "global_step": 624304, "epoch": 7521} {"train_loss": -28.121641159057617, "global_step": 624305, "epoch": 7521} {"train_loss": -28.03309440612793, "global_step": 624306, "epoch": 7521} {"train_loss": -28.305923461914062, "global_step": 624307, "epoch": 7521} {"train_loss": -28.380292892456055, "global_step": 624308, "epoch": 7521} {"train_loss": -28.476856231689453, "global_step": 624309, "epoch": 7521} {"train_loss": -28.207685470581055, "global_step": 624310, "epoch": 7521} {"train_loss": -27.987024307250977, "global_step": 624311, "epoch": 7521} {"train_loss": -28.112476348876953, "global_step": 624312, "epoch": 7521} {"train_loss": -27.965696334838867, "global_step": 624313, "epoch": 7521} {"train_loss": -28.05042839050293, "global_step": 624314, "epoch": 7521} {"train_loss": -27.83074951171875, "global_step": 624315, "epoch": 7521} {"train_loss": -27.43283462524414, "global_step": 624316, "epoch": 7521} {"train_loss": -27.1887264251709, "global_step": 624317, "epoch": 7521} {"train_loss": -27.737518310546875, "global_step": 624318, "epoch": 7521} {"train_loss": -28.106733322143555, "global_step": 624319, "epoch": 7521} {"train_loss": -27.93463706970215, "global_step": 624320, "epoch": 7521} {"train_loss": -28.016265869140625, "global_step": 624321, "epoch": 7521} {"train_loss": -27.93291664123535, "global_step": 624322, "epoch": 7521} {"train_loss": -28.0457820892334, "global_step": 624323, "epoch": 7521} {"train_loss": -28.15717124938965, "global_step": 624324, "epoch": 7521} {"train_loss": -27.75891949757036, "global_step": 624325, "epoch": 7521, "val_loss": 6709492.0} {"train_loss": -27.928327560424805, "global_step": 624326, "epoch": 7522} {"train_loss": -27.340444564819336, "global_step": 624327, "epoch": 7522} {"train_loss": -27.98089599609375, "global_step": 624328, "epoch": 7522} {"train_loss": -27.841827392578125, "global_step": 624329, "epoch": 7522} {"train_loss": -27.954458236694336, "global_step": 624330, "epoch": 7522} {"train_loss": -28.010150909423828, "global_step": 624331, "epoch": 7522} {"train_loss": -27.67315673828125, "global_step": 624332, "epoch": 7522} {"train_loss": -27.819660186767578, "global_step": 624333, "epoch": 7522} {"train_loss": -28.068220138549805, "global_step": 624334, "epoch": 7522} {"train_loss": -27.882726669311523, "global_step": 624335, "epoch": 7522} {"train_loss": -28.2872314453125, "global_step": 624336, "epoch": 7522} {"train_loss": -28.0662784576416, "global_step": 624337, "epoch": 7522} {"train_loss": -27.843399047851562, "global_step": 624338, "epoch": 7522} {"train_loss": -27.93277359008789, "global_step": 624339, "epoch": 7522} {"train_loss": -28.022165298461914, "global_step": 624340, "epoch": 7522} {"train_loss": -28.249893188476562, "global_step": 624341, "epoch": 7522} {"train_loss": -28.438522338867188, "global_step": 624342, "epoch": 7522} {"train_loss": -28.178180694580078, "global_step": 624343, "epoch": 7522} {"train_loss": -28.209203720092773, "global_step": 624344, "epoch": 7522} {"train_loss": -27.971603393554688, "global_step": 624345, "epoch": 7522} {"train_loss": -28.19514274597168, "global_step": 624346, "epoch": 7522} {"train_loss": -28.02741050720215, "global_step": 624347, "epoch": 7522} {"train_loss": -28.453107833862305, "global_step": 624348, "epoch": 7522} {"train_loss": -28.172840118408203, "global_step": 624349, "epoch": 7522} {"train_loss": -28.156787872314453, "global_step": 624350, "epoch": 7522} {"train_loss": -28.42351722717285, "global_step": 624351, "epoch": 7522} {"train_loss": -28.0924072265625, "global_step": 624352, "epoch": 7522} {"train_loss": -28.66290283203125, "global_step": 624353, "epoch": 7522} {"train_loss": -28.541278839111328, "global_step": 624354, "epoch": 7522} {"train_loss": -28.452545166015625, "global_step": 624355, "epoch": 7522} {"train_loss": -28.095108032226562, "global_step": 624356, "epoch": 7522} {"train_loss": -27.910947799682617, "global_step": 624357, "epoch": 7522} {"train_loss": -27.900100708007812, "global_step": 624358, "epoch": 7522} {"train_loss": -28.29669189453125, "global_step": 624359, "epoch": 7522} {"train_loss": -28.117542266845703, "global_step": 624360, "epoch": 7522} {"train_loss": -28.180286407470703, "global_step": 624361, "epoch": 7522} {"train_loss": -28.058752059936523, "global_step": 624362, "epoch": 7522} {"train_loss": -28.33550453186035, "global_step": 624363, "epoch": 7522} {"train_loss": -27.6624813079834, "global_step": 624364, "epoch": 7522} {"train_loss": -28.522201538085938, "global_step": 624365, "epoch": 7522} {"train_loss": -27.930646896362305, "global_step": 624366, "epoch": 7522} {"train_loss": -28.1065616607666, "global_step": 624367, "epoch": 7522} {"train_loss": -28.305999755859375, "global_step": 624368, "epoch": 7522} {"train_loss": -27.79373550415039, "global_step": 624369, "epoch": 7522} {"train_loss": -27.97153663635254, "global_step": 624370, "epoch": 7522} {"train_loss": -28.255964279174805, "global_step": 624371, "epoch": 7522} {"train_loss": -27.959598541259766, "global_step": 624372, "epoch": 7522} {"train_loss": -28.213062286376953, "global_step": 624373, "epoch": 7522} {"train_loss": -28.131311416625977, "global_step": 624374, "epoch": 7522} {"train_loss": -27.865819931030273, "global_step": 624375, "epoch": 7522} {"train_loss": -27.401655197143555, "global_step": 624376, "epoch": 7522} {"train_loss": -26.38693618774414, "global_step": 624377, "epoch": 7522} {"train_loss": -24.443557739257812, "global_step": 624378, "epoch": 7522} {"train_loss": -24.45928192138672, "global_step": 624379, "epoch": 7522} {"train_loss": -27.496185302734375, "global_step": 624380, "epoch": 7522} {"train_loss": -26.54729652404785, "global_step": 624381, "epoch": 7522} {"train_loss": -25.909772872924805, "global_step": 624382, "epoch": 7522} {"train_loss": -27.344640731811523, "global_step": 624383, "epoch": 7522} {"train_loss": -27.15966796875, "global_step": 624384, "epoch": 7522} {"train_loss": -27.400365829467773, "global_step": 624385, "epoch": 7522} {"train_loss": -27.066314697265625, "global_step": 624386, "epoch": 7522} {"train_loss": -27.751901626586914, "global_step": 624387, "epoch": 7522} {"train_loss": -27.1689453125, "global_step": 624388, "epoch": 7522} {"train_loss": -27.659076690673828, "global_step": 624389, "epoch": 7522} {"train_loss": -27.20277214050293, "global_step": 624390, "epoch": 7522} {"train_loss": -27.84552574157715, "global_step": 624391, "epoch": 7522} {"train_loss": -27.441024780273438, "global_step": 624392, "epoch": 7522} {"train_loss": -27.807310104370117, "global_step": 624393, "epoch": 7522} {"train_loss": -27.823287963867188, "global_step": 624394, "epoch": 7522} {"train_loss": -27.501312255859375, "global_step": 624395, "epoch": 7522} {"train_loss": -27.933414459228516, "global_step": 624396, "epoch": 7522} {"train_loss": -27.78079605102539, "global_step": 624397, "epoch": 7522} {"train_loss": -27.912708282470703, "global_step": 624398, "epoch": 7522} {"train_loss": -27.712757110595703, "global_step": 624399, "epoch": 7522} {"train_loss": -27.279760360717773, "global_step": 624400, "epoch": 7522} {"train_loss": -27.840368270874023, "global_step": 624401, "epoch": 7522} {"train_loss": -28.038251876831055, "global_step": 624402, "epoch": 7522} {"train_loss": -27.687225341796875, "global_step": 624403, "epoch": 7522} {"train_loss": -27.9348087310791, "global_step": 624404, "epoch": 7522} {"train_loss": -28.079456329345703, "global_step": 624405, "epoch": 7522} {"train_loss": -28.068256378173828, "global_step": 624406, "epoch": 7522} {"train_loss": -28.160200119018555, "global_step": 624407, "epoch": 7522} {"train_loss": -27.788415885833373, "global_step": 624408, "epoch": 7522, "val_loss": 6708938.0} {"train_loss": -27.735097885131836, "global_step": 624409, "epoch": 7523} {"train_loss": -27.415332794189453, "global_step": 624410, "epoch": 7523} {"train_loss": -27.86260986328125, "global_step": 624411, "epoch": 7523} {"train_loss": -27.849905014038086, "global_step": 624412, "epoch": 7523} {"train_loss": -27.8994197845459, "global_step": 624413, "epoch": 7523} {"train_loss": -27.939289093017578, "global_step": 624414, "epoch": 7523} {"train_loss": -27.64333152770996, "global_step": 624415, "epoch": 7523} {"train_loss": -27.465911865234375, "global_step": 624416, "epoch": 7523} {"train_loss": -28.006376266479492, "global_step": 624417, "epoch": 7523} {"train_loss": -27.974966049194336, "global_step": 624418, "epoch": 7523} {"train_loss": -28.059370040893555, "global_step": 624419, "epoch": 7523} {"train_loss": -27.97572135925293, "global_step": 624420, "epoch": 7523} {"train_loss": -27.864093780517578, "global_step": 624421, "epoch": 7523} {"train_loss": -28.452789306640625, "global_step": 624422, "epoch": 7523} {"train_loss": -28.225683212280273, "global_step": 624423, "epoch": 7523} {"train_loss": -28.112279891967773, "global_step": 624424, "epoch": 7523} {"train_loss": -28.029653549194336, "global_step": 624425, "epoch": 7523} {"train_loss": -28.1707763671875, "global_step": 624426, "epoch": 7523} {"train_loss": -28.505084991455078, "global_step": 624427, "epoch": 7523} {"train_loss": -27.87589454650879, "global_step": 624428, "epoch": 7523} {"train_loss": -28.17536735534668, "global_step": 624429, "epoch": 7523} {"train_loss": -28.21229362487793, "global_step": 624430, "epoch": 7523} {"train_loss": -28.480207443237305, "global_step": 624431, "epoch": 7523} {"train_loss": -28.19338035583496, "global_step": 624432, "epoch": 7523} {"train_loss": -28.295080184936523, "global_step": 624433, "epoch": 7523} {"train_loss": -28.301761627197266, "global_step": 624434, "epoch": 7523} {"train_loss": -28.33155632019043, "global_step": 624435, "epoch": 7523} {"train_loss": -28.248926162719727, "global_step": 624436, "epoch": 7523} {"train_loss": -28.288049697875977, "global_step": 624437, "epoch": 7523} {"train_loss": -28.3336181640625, "global_step": 624438, "epoch": 7523} {"train_loss": -28.343297958374023, "global_step": 624439, "epoch": 7523} {"train_loss": -28.02375602722168, "global_step": 624440, "epoch": 7523} {"train_loss": -28.489246368408203, "global_step": 624441, "epoch": 7523} {"train_loss": -28.410337448120117, "global_step": 624442, "epoch": 7523} {"train_loss": -28.2836971282959, "global_step": 624443, "epoch": 7523} {"train_loss": -28.893802642822266, "global_step": 624444, "epoch": 7523} {"train_loss": -28.234222412109375, "global_step": 624445, "epoch": 7523} {"train_loss": -28.382593154907227, "global_step": 624446, "epoch": 7523} {"train_loss": -28.279077529907227, "global_step": 624447, "epoch": 7523} {"train_loss": -28.5551700592041, "global_step": 624448, "epoch": 7523} {"train_loss": -28.30950927734375, "global_step": 624449, "epoch": 7523} {"train_loss": -28.25957679748535, "global_step": 624450, "epoch": 7523} {"train_loss": -28.49848747253418, "global_step": 624451, "epoch": 7523} {"train_loss": -28.564401626586914, "global_step": 624452, "epoch": 7523} {"train_loss": -28.321821212768555, "global_step": 624453, "epoch": 7523} {"train_loss": -28.259424209594727, "global_step": 624454, "epoch": 7523} {"train_loss": -28.62806510925293, "global_step": 624455, "epoch": 7523} {"train_loss": -28.6196346282959, "global_step": 624456, "epoch": 7523} {"train_loss": -28.16868019104004, "global_step": 624457, "epoch": 7523} {"train_loss": -28.169178009033203, "global_step": 624458, "epoch": 7523} {"train_loss": -28.56003189086914, "global_step": 624459, "epoch": 7523} {"train_loss": -28.734846115112305, "global_step": 624460, "epoch": 7523} {"train_loss": -28.440000534057617, "global_step": 624461, "epoch": 7523} {"train_loss": -27.994115829467773, "global_step": 624462, "epoch": 7523} {"train_loss": -28.327077865600586, "global_step": 624463, "epoch": 7523} {"train_loss": -27.80164909362793, "global_step": 624464, "epoch": 7523} {"train_loss": -27.183547973632812, "global_step": 624465, "epoch": 7523} {"train_loss": -27.351362228393555, "global_step": 624466, "epoch": 7523} {"train_loss": -28.016218185424805, "global_step": 624467, "epoch": 7523} {"train_loss": -27.96221351623535, "global_step": 624468, "epoch": 7523} {"train_loss": -27.924108505249023, "global_step": 624469, "epoch": 7523} {"train_loss": -28.044025421142578, "global_step": 624470, "epoch": 7523} {"train_loss": -28.358545303344727, "global_step": 624471, "epoch": 7523} {"train_loss": -28.403661727905273, "global_step": 624472, "epoch": 7523} {"train_loss": -28.308195114135742, "global_step": 624473, "epoch": 7523} {"train_loss": -28.000904083251953, "global_step": 624474, "epoch": 7523} {"train_loss": -28.35689353942871, "global_step": 624475, "epoch": 7523} {"train_loss": -28.284109115600586, "global_step": 624476, "epoch": 7523} {"train_loss": -28.432880401611328, "global_step": 624477, "epoch": 7523} {"train_loss": -28.26435661315918, "global_step": 624478, "epoch": 7523} {"train_loss": -28.461252212524414, "global_step": 624479, "epoch": 7523} {"train_loss": -28.16303825378418, "global_step": 624480, "epoch": 7523} {"train_loss": -28.488662719726562, "global_step": 624481, "epoch": 7523} {"train_loss": -28.48358154296875, "global_step": 624482, "epoch": 7523} {"train_loss": -28.36945915222168, "global_step": 624483, "epoch": 7523} {"train_loss": -28.30792236328125, "global_step": 624484, "epoch": 7523} {"train_loss": -28.53850746154785, "global_step": 624485, "epoch": 7523} {"train_loss": -28.436986923217773, "global_step": 624486, "epoch": 7523} {"train_loss": -28.109643936157227, "global_step": 624487, "epoch": 7523} {"train_loss": -28.406843185424805, "global_step": 624488, "epoch": 7523} {"train_loss": -28.332508087158203, "global_step": 624489, "epoch": 7523} {"train_loss": -28.392858505249023, "global_step": 624490, "epoch": 7523} {"train_loss": -28.211145263120354, "global_step": 624491, "epoch": 7523, "val_loss": 6722094.5} {"train_loss": -27.846845626831055, "global_step": 624492, "epoch": 7524} {"train_loss": -27.837949752807617, "global_step": 624493, "epoch": 7524} {"train_loss": -27.43585777282715, "global_step": 624494, "epoch": 7524} {"train_loss": -27.647993087768555, "global_step": 624495, "epoch": 7524} {"train_loss": -27.079364776611328, "global_step": 624496, "epoch": 7524} {"train_loss": -27.2011661529541, "global_step": 624497, "epoch": 7524} {"train_loss": -27.54035758972168, "global_step": 624498, "epoch": 7524} {"train_loss": -26.7027530670166, "global_step": 624499, "epoch": 7524} {"train_loss": -26.71088218688965, "global_step": 624500, "epoch": 7524} {"train_loss": -27.115713119506836, "global_step": 624501, "epoch": 7524} {"train_loss": -27.086944580078125, "global_step": 624502, "epoch": 7524} {"train_loss": -27.03740882873535, "global_step": 624503, "epoch": 7524} {"train_loss": -26.63599967956543, "global_step": 624504, "epoch": 7524} {"train_loss": -27.138498306274414, "global_step": 624505, "epoch": 7524} {"train_loss": -27.5349178314209, "global_step": 624506, "epoch": 7524} {"train_loss": -27.46441650390625, "global_step": 624507, "epoch": 7524} {"train_loss": -27.24365234375, "global_step": 624508, "epoch": 7524} {"train_loss": -27.405973434448242, "global_step": 624509, "epoch": 7524} {"train_loss": -27.490793228149414, "global_step": 624510, "epoch": 7524} {"train_loss": -27.35528564453125, "global_step": 624511, "epoch": 7524} {"train_loss": -27.726911544799805, "global_step": 624512, "epoch": 7524} {"train_loss": -27.671741485595703, "global_step": 624513, "epoch": 7524} {"train_loss": -27.859222412109375, "global_step": 624514, "epoch": 7524} {"train_loss": -27.93430519104004, "global_step": 624515, "epoch": 7524} {"train_loss": -27.720144271850586, "global_step": 624516, "epoch": 7524} {"train_loss": -27.74822425842285, "global_step": 624517, "epoch": 7524} {"train_loss": -27.766202926635742, "global_step": 624518, "epoch": 7524} {"train_loss": -28.248706817626953, "global_step": 624519, "epoch": 7524} {"train_loss": -27.718225479125977, "global_step": 624520, "epoch": 7524} {"train_loss": -27.888381958007812, "global_step": 624521, "epoch": 7524} {"train_loss": -27.72486686706543, "global_step": 624522, "epoch": 7524} {"train_loss": -28.026691436767578, "global_step": 624523, "epoch": 7524} {"train_loss": -28.162200927734375, "global_step": 624524, "epoch": 7524} {"train_loss": -28.00092887878418, "global_step": 624525, "epoch": 7524} {"train_loss": -27.89969253540039, "global_step": 624526, "epoch": 7524} {"train_loss": -28.054885864257812, "global_step": 624527, "epoch": 7524} {"train_loss": -28.12491226196289, "global_step": 624528, "epoch": 7524} {"train_loss": -28.31817054748535, "global_step": 624529, "epoch": 7524} {"train_loss": -28.244089126586914, "global_step": 624530, "epoch": 7524} {"train_loss": -28.178909301757812, "global_step": 624531, "epoch": 7524} {"train_loss": -28.40471839904785, "global_step": 624532, "epoch": 7524} {"train_loss": -28.183088302612305, "global_step": 624533, "epoch": 7524} {"train_loss": -28.536468505859375, "global_step": 624534, "epoch": 7524} {"train_loss": -28.209890365600586, "global_step": 624535, "epoch": 7524} {"train_loss": -28.197492599487305, "global_step": 624536, "epoch": 7524} {"train_loss": -27.985681533813477, "global_step": 624537, "epoch": 7524} {"train_loss": -28.222070693969727, "global_step": 624538, "epoch": 7524} {"train_loss": -28.0714054107666, "global_step": 624539, "epoch": 7524} {"train_loss": -28.353622436523438, "global_step": 624540, "epoch": 7524} {"train_loss": -28.337308883666992, "global_step": 624541, "epoch": 7524} {"train_loss": -28.593597412109375, "global_step": 624542, "epoch": 7524} {"train_loss": -28.24407958984375, "global_step": 624543, "epoch": 7524} {"train_loss": -28.158933639526367, "global_step": 624544, "epoch": 7524} {"train_loss": -28.3294677734375, "global_step": 624545, "epoch": 7524} {"train_loss": -28.069128036499023, "global_step": 624546, "epoch": 7524} {"train_loss": -28.428726196289062, "global_step": 624547, "epoch": 7524} {"train_loss": -28.228681564331055, "global_step": 624548, "epoch": 7524} {"train_loss": -28.43560791015625, "global_step": 624549, "epoch": 7524} {"train_loss": -28.3443546295166, "global_step": 624550, "epoch": 7524} {"train_loss": -28.39227867126465, "global_step": 624551, "epoch": 7524} {"train_loss": -28.5639591217041, "global_step": 624552, "epoch": 7524} {"train_loss": -28.20509147644043, "global_step": 624553, "epoch": 7524} {"train_loss": -28.133996963500977, "global_step": 624554, "epoch": 7524} {"train_loss": -27.913888931274414, "global_step": 624555, "epoch": 7524} {"train_loss": -28.35990333557129, "global_step": 624556, "epoch": 7524} {"train_loss": -28.388751983642578, "global_step": 624557, "epoch": 7524} {"train_loss": -28.437408447265625, "global_step": 624558, "epoch": 7524} {"train_loss": -28.44113540649414, "global_step": 624559, "epoch": 7524} {"train_loss": -28.004194259643555, "global_step": 624560, "epoch": 7524} {"train_loss": -27.77503776550293, "global_step": 624561, "epoch": 7524} {"train_loss": -28.373584747314453, "global_step": 624562, "epoch": 7524} {"train_loss": -28.1146183013916, "global_step": 624563, "epoch": 7524} {"train_loss": -27.950210571289062, "global_step": 624564, "epoch": 7524} {"train_loss": -28.149444580078125, "global_step": 624565, "epoch": 7524} {"train_loss": -28.26495361328125, "global_step": 624566, "epoch": 7524} {"train_loss": -27.887311935424805, "global_step": 624567, "epoch": 7524} {"train_loss": -28.293603897094727, "global_step": 624568, "epoch": 7524} {"train_loss": -28.247594833374023, "global_step": 624569, "epoch": 7524} {"train_loss": -28.624622344970703, "global_step": 624570, "epoch": 7524} {"train_loss": -28.002710342407227, "global_step": 624571, "epoch": 7524} {"train_loss": -27.8179931640625, "global_step": 624572, "epoch": 7524} {"train_loss": -28.347000122070312, "global_step": 624573, "epoch": 7524} {"train_loss": -27.916452982339514, "global_step": 624574, "epoch": 7524, "val_loss": 6794497.0} {"train_loss": -27.649606704711914, "global_step": 624575, "epoch": 7525} {"train_loss": -27.911691665649414, "global_step": 624576, "epoch": 7525} {"train_loss": -27.6632080078125, "global_step": 624577, "epoch": 7525} {"train_loss": -27.93964958190918, "global_step": 624578, "epoch": 7525} {"train_loss": -27.65191078186035, "global_step": 624579, "epoch": 7525} {"train_loss": -27.806100845336914, "global_step": 624580, "epoch": 7525} {"train_loss": -27.835590362548828, "global_step": 624581, "epoch": 7525} {"train_loss": -27.6601505279541, "global_step": 624582, "epoch": 7525} {"train_loss": -27.782672882080078, "global_step": 624583, "epoch": 7525} {"train_loss": -27.53553581237793, "global_step": 624584, "epoch": 7525} {"train_loss": -27.6674747467041, "global_step": 624585, "epoch": 7525} {"train_loss": -27.6458797454834, "global_step": 624586, "epoch": 7525} {"train_loss": -27.836523056030273, "global_step": 624587, "epoch": 7525} {"train_loss": -28.061676025390625, "global_step": 624588, "epoch": 7525} {"train_loss": -28.09303092956543, "global_step": 624589, "epoch": 7525} {"train_loss": -27.545804977416992, "global_step": 624590, "epoch": 7525} {"train_loss": -27.878890991210938, "global_step": 624591, "epoch": 7525} {"train_loss": -27.678945541381836, "global_step": 624592, "epoch": 7525} {"train_loss": -27.760929107666016, "global_step": 624593, "epoch": 7525} {"train_loss": -27.626708984375, "global_step": 624594, "epoch": 7525} {"train_loss": -27.846744537353516, "global_step": 624595, "epoch": 7525} {"train_loss": -28.152124404907227, "global_step": 624596, "epoch": 7525} {"train_loss": -27.645132064819336, "global_step": 624597, "epoch": 7525} {"train_loss": -28.33039665222168, "global_step": 624598, "epoch": 7525} {"train_loss": -27.82649803161621, "global_step": 624599, "epoch": 7525} {"train_loss": -28.056554794311523, "global_step": 624600, "epoch": 7525} {"train_loss": -27.966718673706055, "global_step": 624601, "epoch": 7525} {"train_loss": -27.821308135986328, "global_step": 624602, "epoch": 7525} {"train_loss": -28.010461807250977, "global_step": 624603, "epoch": 7525} {"train_loss": -27.782697677612305, "global_step": 624604, "epoch": 7525} {"train_loss": -28.11948013305664, "global_step": 624605, "epoch": 7525} {"train_loss": -28.299213409423828, "global_step": 624606, "epoch": 7525} {"train_loss": -27.935108184814453, "global_step": 624607, "epoch": 7525} {"train_loss": -27.814550399780273, "global_step": 624608, "epoch": 7525} {"train_loss": -28.1726131439209, "global_step": 624609, "epoch": 7525} {"train_loss": -28.26133155822754, "global_step": 624610, "epoch": 7525} {"train_loss": -27.942249298095703, "global_step": 624611, "epoch": 7525} {"train_loss": -28.315488815307617, "global_step": 624612, "epoch": 7525} {"train_loss": -28.038877487182617, "global_step": 624613, "epoch": 7525} {"train_loss": -28.146438598632812, "global_step": 624614, "epoch": 7525} {"train_loss": -28.30179786682129, "global_step": 624615, "epoch": 7525} {"train_loss": -28.424697875976562, "global_step": 624616, "epoch": 7525} {"train_loss": -28.290191650390625, "global_step": 624617, "epoch": 7525} {"train_loss": -28.349451065063477, "global_step": 624618, "epoch": 7525} {"train_loss": -28.2943172454834, "global_step": 624619, "epoch": 7525} {"train_loss": -28.43610191345215, "global_step": 624620, "epoch": 7525} {"train_loss": -28.389514923095703, "global_step": 624621, "epoch": 7525} {"train_loss": -28.455102920532227, "global_step": 624622, "epoch": 7525} {"train_loss": -28.129987716674805, "global_step": 624623, "epoch": 7525} {"train_loss": -28.27392578125, "global_step": 624624, "epoch": 7525} {"train_loss": -28.026260375976562, "global_step": 624625, "epoch": 7525} {"train_loss": -28.0405330657959, "global_step": 624626, "epoch": 7525} {"train_loss": -28.03887939453125, "global_step": 624627, "epoch": 7525} {"train_loss": -27.500232696533203, "global_step": 624628, "epoch": 7525} {"train_loss": -27.090673446655273, "global_step": 624629, "epoch": 7525} {"train_loss": -27.70456314086914, "global_step": 624630, "epoch": 7525} {"train_loss": -28.089038848876953, "global_step": 624631, "epoch": 7525} {"train_loss": -27.980640411376953, "global_step": 624632, "epoch": 7525} {"train_loss": -27.96441650390625, "global_step": 624633, "epoch": 7525} {"train_loss": -28.228118896484375, "global_step": 624634, "epoch": 7525} {"train_loss": -27.84571647644043, "global_step": 624635, "epoch": 7525} {"train_loss": -28.24201011657715, "global_step": 624636, "epoch": 7525} {"train_loss": -28.03192138671875, "global_step": 624637, "epoch": 7525} {"train_loss": -28.597259521484375, "global_step": 624638, "epoch": 7525} {"train_loss": -27.790449142456055, "global_step": 624639, "epoch": 7525} {"train_loss": -28.130151748657227, "global_step": 624640, "epoch": 7525} {"train_loss": -28.360687255859375, "global_step": 624641, "epoch": 7525} {"train_loss": -28.17724609375, "global_step": 624642, "epoch": 7525} {"train_loss": -28.3006591796875, "global_step": 624643, "epoch": 7525} {"train_loss": -28.571836471557617, "global_step": 624644, "epoch": 7525} {"train_loss": -27.832706451416016, "global_step": 624645, "epoch": 7525} {"train_loss": -27.81561851501465, "global_step": 624646, "epoch": 7525} {"train_loss": -28.001127243041992, "global_step": 624647, "epoch": 7525} {"train_loss": -28.063013076782227, "global_step": 624648, "epoch": 7525} {"train_loss": -28.222248077392578, "global_step": 624649, "epoch": 7525} {"train_loss": -28.217426300048828, "global_step": 624650, "epoch": 7525} {"train_loss": -28.062597274780273, "global_step": 624651, "epoch": 7525} {"train_loss": -28.353168487548828, "global_step": 624652, "epoch": 7525} {"train_loss": -28.20148277282715, "global_step": 624653, "epoch": 7525} {"train_loss": -28.26444435119629, "global_step": 624654, "epoch": 7525} {"train_loss": -28.24957275390625, "global_step": 624655, "epoch": 7525} {"train_loss": -28.0666561126709, "global_step": 624656, "epoch": 7525} {"train_loss": -28.022171135408332, "global_step": 624657, "epoch": 7525, "val_loss": 6678893.0} {"train_loss": -27.964130401611328, "global_step": 624658, "epoch": 7526} {"train_loss": -27.684844970703125, "global_step": 624659, "epoch": 7526} {"train_loss": -27.781442642211914, "global_step": 624660, "epoch": 7526} {"train_loss": -27.49580955505371, "global_step": 624661, "epoch": 7526} {"train_loss": -28.176355361938477, "global_step": 624662, "epoch": 7526} {"train_loss": -28.026447296142578, "global_step": 624663, "epoch": 7526} {"train_loss": -27.907806396484375, "global_step": 624664, "epoch": 7526} {"train_loss": -27.690717697143555, "global_step": 624665, "epoch": 7526} {"train_loss": -27.93769645690918, "global_step": 624666, "epoch": 7526} {"train_loss": -27.808151245117188, "global_step": 624667, "epoch": 7526} {"train_loss": -28.181928634643555, "global_step": 624668, "epoch": 7526} {"train_loss": -28.114337921142578, "global_step": 624669, "epoch": 7526} {"train_loss": -27.889938354492188, "global_step": 624670, "epoch": 7526} {"train_loss": -27.880537033081055, "global_step": 624671, "epoch": 7526} {"train_loss": -28.0963077545166, "global_step": 624672, "epoch": 7526} {"train_loss": -27.637990951538086, "global_step": 624673, "epoch": 7526} {"train_loss": -28.273406982421875, "global_step": 624674, "epoch": 7526} {"train_loss": -27.93877601623535, "global_step": 624675, "epoch": 7526} {"train_loss": -27.9572696685791, "global_step": 624676, "epoch": 7526} {"train_loss": -27.9947509765625, "global_step": 624677, "epoch": 7526} {"train_loss": -27.885679244995117, "global_step": 624678, "epoch": 7526} {"train_loss": -27.974868774414062, "global_step": 624679, "epoch": 7526} {"train_loss": -28.269428253173828, "global_step": 624680, "epoch": 7526} {"train_loss": -28.304285049438477, "global_step": 624681, "epoch": 7526} {"train_loss": -28.061975479125977, "global_step": 624682, "epoch": 7526} {"train_loss": -28.34876823425293, "global_step": 624683, "epoch": 7526} {"train_loss": -28.283355712890625, "global_step": 624684, "epoch": 7526} {"train_loss": -28.117053985595703, "global_step": 624685, "epoch": 7526} {"train_loss": -28.153417587280273, "global_step": 624686, "epoch": 7526} {"train_loss": -28.344446182250977, "global_step": 624687, "epoch": 7526} {"train_loss": -28.527179718017578, "global_step": 624688, "epoch": 7526} {"train_loss": -28.17453384399414, "global_step": 624689, "epoch": 7526} {"train_loss": -28.14448356628418, "global_step": 624690, "epoch": 7526} {"train_loss": -28.364953994750977, "global_step": 624691, "epoch": 7526} {"train_loss": -28.539602279663086, "global_step": 624692, "epoch": 7526} {"train_loss": -28.27850341796875, "global_step": 624693, "epoch": 7526} {"train_loss": -28.325342178344727, "global_step": 624694, "epoch": 7526} {"train_loss": -28.36262321472168, "global_step": 624695, "epoch": 7526} {"train_loss": -28.384674072265625, "global_step": 624696, "epoch": 7526} {"train_loss": -28.162351608276367, "global_step": 624697, "epoch": 7526} {"train_loss": -28.294050216674805, "global_step": 624698, "epoch": 7526} {"train_loss": -28.175886154174805, "global_step": 624699, "epoch": 7526} {"train_loss": -28.362157821655273, "global_step": 624700, "epoch": 7526} {"train_loss": -28.14434814453125, "global_step": 624701, "epoch": 7526} {"train_loss": -28.537342071533203, "global_step": 624702, "epoch": 7526} {"train_loss": -28.473342895507812, "global_step": 624703, "epoch": 7526} {"train_loss": -27.9566593170166, "global_step": 624704, "epoch": 7526} {"train_loss": -27.987823486328125, "global_step": 624705, "epoch": 7526} {"train_loss": -28.054931640625, "global_step": 624706, "epoch": 7526} {"train_loss": -28.17222023010254, "global_step": 624707, "epoch": 7526} {"train_loss": -28.29461097717285, "global_step": 624708, "epoch": 7526} {"train_loss": -28.012592315673828, "global_step": 624709, "epoch": 7526} {"train_loss": -28.036767959594727, "global_step": 624710, "epoch": 7526} {"train_loss": -27.80550193786621, "global_step": 624711, "epoch": 7526} {"train_loss": -28.07245445251465, "global_step": 624712, "epoch": 7526} {"train_loss": -27.738330841064453, "global_step": 624713, "epoch": 7526} {"train_loss": -28.483264923095703, "global_step": 624714, "epoch": 7526} {"train_loss": -27.94742774963379, "global_step": 624715, "epoch": 7526} {"train_loss": -27.99554443359375, "global_step": 624716, "epoch": 7526} {"train_loss": -28.027524948120117, "global_step": 624717, "epoch": 7526} {"train_loss": -27.660364151000977, "global_step": 624718, "epoch": 7526} {"train_loss": -27.810964584350586, "global_step": 624719, "epoch": 7526} {"train_loss": -28.4190673828125, "global_step": 624720, "epoch": 7526} {"train_loss": -28.29448890686035, "global_step": 624721, "epoch": 7526} {"train_loss": -28.431156158447266, "global_step": 624722, "epoch": 7526} {"train_loss": -28.117969512939453, "global_step": 624723, "epoch": 7526} {"train_loss": -28.987751007080078, "global_step": 624724, "epoch": 7526} {"train_loss": -28.336029052734375, "global_step": 624725, "epoch": 7526} {"train_loss": -28.07065200805664, "global_step": 624726, "epoch": 7526} {"train_loss": -28.487089157104492, "global_step": 624727, "epoch": 7526} {"train_loss": -28.5747127532959, "global_step": 624728, "epoch": 7526} {"train_loss": -28.23008155822754, "global_step": 624729, "epoch": 7526} {"train_loss": -28.213525772094727, "global_step": 624730, "epoch": 7526} {"train_loss": -28.348554611206055, "global_step": 624731, "epoch": 7526} {"train_loss": -28.380346298217773, "global_step": 624732, "epoch": 7526} {"train_loss": -28.374662399291992, "global_step": 624733, "epoch": 7526} {"train_loss": -28.62750816345215, "global_step": 624734, "epoch": 7526} {"train_loss": -28.319196701049805, "global_step": 624735, "epoch": 7526} {"train_loss": -28.230329513549805, "global_step": 624736, "epoch": 7526} {"train_loss": -28.56522560119629, "global_step": 624737, "epoch": 7526} {"train_loss": -28.325597763061523, "global_step": 624738, "epoch": 7526} {"train_loss": -28.203643798828125, "global_step": 624739, "epoch": 7526} {"train_loss": -28.16731266803052, "global_step": 624740, "epoch": 7526, "val_loss": 6709253.0} {"train_loss": -28.069181442260742, "global_step": 624741, "epoch": 7527} {"train_loss": -27.264368057250977, "global_step": 624742, "epoch": 7527} {"train_loss": -26.75299072265625, "global_step": 624743, "epoch": 7527} {"train_loss": -26.935171127319336, "global_step": 624744, "epoch": 7527} {"train_loss": -27.195255279541016, "global_step": 624745, "epoch": 7527} {"train_loss": -27.255111694335938, "global_step": 624746, "epoch": 7527} {"train_loss": -27.710529327392578, "global_step": 624747, "epoch": 7527} {"train_loss": -27.602819442749023, "global_step": 624748, "epoch": 7527} {"train_loss": -27.1673526763916, "global_step": 624749, "epoch": 7527} {"train_loss": -27.774887084960938, "global_step": 624750, "epoch": 7527} {"train_loss": -27.888046264648438, "global_step": 624751, "epoch": 7527} {"train_loss": -27.314069747924805, "global_step": 624752, "epoch": 7527} {"train_loss": -27.282079696655273, "global_step": 624753, "epoch": 7527} {"train_loss": -26.9888916015625, "global_step": 624754, "epoch": 7527} {"train_loss": -28.051380157470703, "global_step": 624755, "epoch": 7527} {"train_loss": -27.78836441040039, "global_step": 624756, "epoch": 7527} {"train_loss": -27.782434463500977, "global_step": 624757, "epoch": 7527} {"train_loss": -27.7380313873291, "global_step": 624758, "epoch": 7527} {"train_loss": -27.844358444213867, "global_step": 624759, "epoch": 7527} {"train_loss": -28.12628173828125, "global_step": 624760, "epoch": 7527} {"train_loss": -27.75482749938965, "global_step": 624761, "epoch": 7527} {"train_loss": -27.913496017456055, "global_step": 624762, "epoch": 7527} {"train_loss": -28.093463897705078, "global_step": 624763, "epoch": 7527} {"train_loss": -27.715362548828125, "global_step": 624764, "epoch": 7527} {"train_loss": -27.94327163696289, "global_step": 624765, "epoch": 7527} {"train_loss": -28.037961959838867, "global_step": 624766, "epoch": 7527} {"train_loss": -28.459741592407227, "global_step": 624767, "epoch": 7527} {"train_loss": -27.840314865112305, "global_step": 624768, "epoch": 7527} {"train_loss": -28.176191329956055, "global_step": 624769, "epoch": 7527} {"train_loss": -27.496198654174805, "global_step": 624770, "epoch": 7527} {"train_loss": -27.99783706665039, "global_step": 624771, "epoch": 7527} {"train_loss": -28.069244384765625, "global_step": 624772, "epoch": 7527} {"train_loss": -28.28265380859375, "global_step": 624773, "epoch": 7527} {"train_loss": -28.104833602905273, "global_step": 624774, "epoch": 7527} {"train_loss": -28.122007369995117, "global_step": 624775, "epoch": 7527} {"train_loss": -27.93292808532715, "global_step": 624776, "epoch": 7527} {"train_loss": -28.080677032470703, "global_step": 624777, "epoch": 7527} {"train_loss": -28.343708038330078, "global_step": 624778, "epoch": 7527} {"train_loss": -27.926244735717773, "global_step": 624779, "epoch": 7527} {"train_loss": -28.045080184936523, "global_step": 624780, "epoch": 7527} {"train_loss": -28.213972091674805, "global_step": 624781, "epoch": 7527} {"train_loss": -28.414865493774414, "global_step": 624782, "epoch": 7527} {"train_loss": -28.107574462890625, "global_step": 624783, "epoch": 7527} {"train_loss": -28.43900489807129, "global_step": 624784, "epoch": 7527} {"train_loss": -28.318784713745117, "global_step": 624785, "epoch": 7527} {"train_loss": -28.072484970092773, "global_step": 624786, "epoch": 7527} {"train_loss": -28.295820236206055, "global_step": 624787, "epoch": 7527} {"train_loss": -28.509214401245117, "global_step": 624788, "epoch": 7527} {"train_loss": -28.159814834594727, "global_step": 624789, "epoch": 7527} {"train_loss": -28.264102935791016, "global_step": 624790, "epoch": 7527} {"train_loss": -28.645248413085938, "global_step": 624791, "epoch": 7527} {"train_loss": -28.18546485900879, "global_step": 624792, "epoch": 7527} {"train_loss": -28.283796310424805, "global_step": 624793, "epoch": 7527} {"train_loss": -28.11370849609375, "global_step": 624794, "epoch": 7527} {"train_loss": -28.217819213867188, "global_step": 624795, "epoch": 7527} {"train_loss": -28.35127067565918, "global_step": 624796, "epoch": 7527} {"train_loss": -28.138580322265625, "global_step": 624797, "epoch": 7527} {"train_loss": -28.368314743041992, "global_step": 624798, "epoch": 7527} {"train_loss": -28.313556671142578, "global_step": 624799, "epoch": 7527} {"train_loss": -28.429431915283203, "global_step": 624800, "epoch": 7527} {"train_loss": -28.0709285736084, "global_step": 624801, "epoch": 7527} {"train_loss": -28.291629791259766, "global_step": 624802, "epoch": 7527} {"train_loss": -28.284610748291016, "global_step": 624803, "epoch": 7527} {"train_loss": -28.10833168029785, "global_step": 624804, "epoch": 7527} {"train_loss": -27.905841827392578, "global_step": 624805, "epoch": 7527} {"train_loss": -27.59281349182129, "global_step": 624806, "epoch": 7527} {"train_loss": -27.715625762939453, "global_step": 624807, "epoch": 7527} {"train_loss": -27.860029220581055, "global_step": 624808, "epoch": 7527} {"train_loss": -28.09986686706543, "global_step": 624809, "epoch": 7527} {"train_loss": -28.34537696838379, "global_step": 624810, "epoch": 7527} {"train_loss": -28.167163848876953, "global_step": 624811, "epoch": 7527} {"train_loss": -28.088376998901367, "global_step": 624812, "epoch": 7527} {"train_loss": -28.21198081970215, "global_step": 624813, "epoch": 7527} {"train_loss": -28.26167869567871, "global_step": 624814, "epoch": 7527} {"train_loss": -28.649677276611328, "global_step": 624815, "epoch": 7527} {"train_loss": -28.375598907470703, "global_step": 624816, "epoch": 7527} {"train_loss": -28.646194458007812, "global_step": 624817, "epoch": 7527} {"train_loss": -27.921545028686523, "global_step": 624818, "epoch": 7527} {"train_loss": -28.448755264282227, "global_step": 624819, "epoch": 7527} {"train_loss": -28.58759117126465, "global_step": 624820, "epoch": 7527} {"train_loss": -28.419544219970703, "global_step": 624821, "epoch": 7527} {"train_loss": -28.700651168823242, "global_step": 624822, "epoch": 7527} {"train_loss": -28.030684942222504, "global_step": 624823, "epoch": 7527, "val_loss": 6619425.0} {"train_loss": -26.707672119140625, "global_step": 624824, "epoch": 7528} {"train_loss": -25.878583908081055, "global_step": 624825, "epoch": 7528} {"train_loss": -26.41265296936035, "global_step": 624826, "epoch": 7528} {"train_loss": -25.92758560180664, "global_step": 624827, "epoch": 7528} {"train_loss": -26.570709228515625, "global_step": 624828, "epoch": 7528} {"train_loss": -26.110382080078125, "global_step": 624829, "epoch": 7528} {"train_loss": -25.281539916992188, "global_step": 624830, "epoch": 7528} {"train_loss": -27.33193016052246, "global_step": 624831, "epoch": 7528} {"train_loss": -26.278844833374023, "global_step": 624832, "epoch": 7528} {"train_loss": -25.63224220275879, "global_step": 624833, "epoch": 7528} {"train_loss": -26.871585845947266, "global_step": 624834, "epoch": 7528} {"train_loss": -26.3137264251709, "global_step": 624835, "epoch": 7528} {"train_loss": -26.804731369018555, "global_step": 624836, "epoch": 7528} {"train_loss": -26.785022735595703, "global_step": 624837, "epoch": 7528} {"train_loss": -27.160358428955078, "global_step": 624838, "epoch": 7528} {"train_loss": -26.711841583251953, "global_step": 624839, "epoch": 7528} {"train_loss": -27.568655014038086, "global_step": 624840, "epoch": 7528} {"train_loss": -27.09834098815918, "global_step": 624841, "epoch": 7528} {"train_loss": -26.92984390258789, "global_step": 624842, "epoch": 7528} {"train_loss": -27.149585723876953, "global_step": 624843, "epoch": 7528} {"train_loss": -27.03131675720215, "global_step": 624844, "epoch": 7528} {"train_loss": -27.40781593322754, "global_step": 624845, "epoch": 7528} {"train_loss": -27.336530685424805, "global_step": 624846, "epoch": 7528} {"train_loss": -27.347442626953125, "global_step": 624847, "epoch": 7528} {"train_loss": -27.318750381469727, "global_step": 624848, "epoch": 7528} {"train_loss": -27.57685661315918, "global_step": 624849, "epoch": 7528} {"train_loss": -27.517675399780273, "global_step": 624850, "epoch": 7528} {"train_loss": -27.1876220703125, "global_step": 624851, "epoch": 7528} {"train_loss": -27.67725944519043, "global_step": 624852, "epoch": 7528} {"train_loss": -27.616891860961914, "global_step": 624853, "epoch": 7528} {"train_loss": -27.781492233276367, "global_step": 624854, "epoch": 7528} {"train_loss": -27.82490348815918, "global_step": 624855, "epoch": 7528} {"train_loss": -27.07332420349121, "global_step": 624856, "epoch": 7528} {"train_loss": -27.811315536499023, "global_step": 624857, "epoch": 7528} {"train_loss": -27.5618896484375, "global_step": 624858, "epoch": 7528} {"train_loss": -27.74489402770996, "global_step": 624859, "epoch": 7528} {"train_loss": -27.618757247924805, "global_step": 624860, "epoch": 7528} {"train_loss": -27.96858024597168, "global_step": 624861, "epoch": 7528} {"train_loss": -27.16859245300293, "global_step": 624862, "epoch": 7528} {"train_loss": -27.97663688659668, "global_step": 624863, "epoch": 7528} {"train_loss": -28.3655948638916, "global_step": 624864, "epoch": 7528} {"train_loss": -27.838764190673828, "global_step": 624865, "epoch": 7528} {"train_loss": -27.929895401000977, "global_step": 624866, "epoch": 7528} {"train_loss": -28.040159225463867, "global_step": 624867, "epoch": 7528} {"train_loss": -28.042566299438477, "global_step": 624868, "epoch": 7528} {"train_loss": -28.110599517822266, "global_step": 624869, "epoch": 7528} {"train_loss": -27.666532516479492, "global_step": 624870, "epoch": 7528} {"train_loss": -28.3747615814209, "global_step": 624871, "epoch": 7528} {"train_loss": -27.93747901916504, "global_step": 624872, "epoch": 7528} {"train_loss": -28.04267692565918, "global_step": 624873, "epoch": 7528} {"train_loss": -28.183698654174805, "global_step": 624874, "epoch": 7528} {"train_loss": -27.771636962890625, "global_step": 624875, "epoch": 7528} {"train_loss": -28.50715446472168, "global_step": 624876, "epoch": 7528} {"train_loss": -27.79638671875, "global_step": 624877, "epoch": 7528} {"train_loss": -28.461517333984375, "global_step": 624878, "epoch": 7528} {"train_loss": -27.674301147460938, "global_step": 624879, "epoch": 7528} {"train_loss": -28.256689071655273, "global_step": 624880, "epoch": 7528} {"train_loss": -28.11590576171875, "global_step": 624881, "epoch": 7528} {"train_loss": -27.91823387145996, "global_step": 624882, "epoch": 7528} {"train_loss": -27.683286666870117, "global_step": 624883, "epoch": 7528} {"train_loss": -27.85798454284668, "global_step": 624884, "epoch": 7528} {"train_loss": -28.054046630859375, "global_step": 624885, "epoch": 7528} {"train_loss": -28.2600154876709, "global_step": 624886, "epoch": 7528} {"train_loss": -28.07964515686035, "global_step": 624887, "epoch": 7528} {"train_loss": -27.814844131469727, "global_step": 624888, "epoch": 7528} {"train_loss": -28.265012741088867, "global_step": 624889, "epoch": 7528} {"train_loss": -27.975116729736328, "global_step": 624890, "epoch": 7528} {"train_loss": -28.134443283081055, "global_step": 624891, "epoch": 7528} {"train_loss": -28.12335777282715, "global_step": 624892, "epoch": 7528} {"train_loss": -28.32962989807129, "global_step": 624893, "epoch": 7528} {"train_loss": -28.527597427368164, "global_step": 624894, "epoch": 7528} {"train_loss": -28.277063369750977, "global_step": 624895, "epoch": 7528} {"train_loss": -27.76716423034668, "global_step": 624896, "epoch": 7528} {"train_loss": -28.311548233032227, "global_step": 624897, "epoch": 7528} {"train_loss": -28.10349464416504, "global_step": 624898, "epoch": 7528} {"train_loss": -28.332157135009766, "global_step": 624899, "epoch": 7528} {"train_loss": -28.287321090698242, "global_step": 624900, "epoch": 7528} {"train_loss": -28.21786880493164, "global_step": 624901, "epoch": 7528} {"train_loss": -28.325170516967773, "global_step": 624902, "epoch": 7528} {"train_loss": -28.296689987182617, "global_step": 624903, "epoch": 7528} {"train_loss": -28.368879318237305, "global_step": 624904, "epoch": 7528} {"train_loss": -27.95296287536621, "global_step": 624905, "epoch": 7528} {"train_loss": -27.584479803062347, "global_step": 624906, "epoch": 7528, "val_loss": 6842076.0} {"train_loss": -27.058502197265625, "global_step": 624907, "epoch": 7529} {"train_loss": -27.685474395751953, "global_step": 624908, "epoch": 7529} {"train_loss": -27.722198486328125, "global_step": 624909, "epoch": 7529} {"train_loss": -27.521947860717773, "global_step": 624910, "epoch": 7529} {"train_loss": -27.045740127563477, "global_step": 624911, "epoch": 7529} {"train_loss": -27.676502227783203, "global_step": 624912, "epoch": 7529} {"train_loss": -27.470184326171875, "global_step": 624913, "epoch": 7529} {"train_loss": -28.038671493530273, "global_step": 624914, "epoch": 7529} {"train_loss": -27.638525009155273, "global_step": 624915, "epoch": 7529} {"train_loss": -27.318017959594727, "global_step": 624916, "epoch": 7529} {"train_loss": -27.128461837768555, "global_step": 624917, "epoch": 7529} {"train_loss": -27.143939971923828, "global_step": 624918, "epoch": 7529} {"train_loss": -27.180255889892578, "global_step": 624919, "epoch": 7529} {"train_loss": -27.314294815063477, "global_step": 624920, "epoch": 7529} {"train_loss": -27.758466720581055, "global_step": 624921, "epoch": 7529} {"train_loss": -27.53602409362793, "global_step": 624922, "epoch": 7529} {"train_loss": -27.539920806884766, "global_step": 624923, "epoch": 7529} {"train_loss": -28.05146598815918, "global_step": 624924, "epoch": 7529} {"train_loss": -28.04066276550293, "global_step": 624925, "epoch": 7529} {"train_loss": -27.984365463256836, "global_step": 624926, "epoch": 7529} {"train_loss": -27.895648956298828, "global_step": 624927, "epoch": 7529} {"train_loss": -27.6304988861084, "global_step": 624928, "epoch": 7529} {"train_loss": -27.828733444213867, "global_step": 624929, "epoch": 7529} {"train_loss": -27.9869327545166, "global_step": 624930, "epoch": 7529} {"train_loss": -28.166852951049805, "global_step": 624931, "epoch": 7529} {"train_loss": -28.009313583374023, "global_step": 624932, "epoch": 7529} {"train_loss": -28.27667236328125, "global_step": 624933, "epoch": 7529} {"train_loss": -28.2099666595459, "global_step": 624934, "epoch": 7529} {"train_loss": -28.223249435424805, "global_step": 624935, "epoch": 7529} {"train_loss": -28.08700942993164, "global_step": 624936, "epoch": 7529} {"train_loss": -28.048328399658203, "global_step": 624937, "epoch": 7529} {"train_loss": -28.104446411132812, "global_step": 624938, "epoch": 7529} {"train_loss": -28.576696395874023, "global_step": 624939, "epoch": 7529} {"train_loss": -28.283161163330078, "global_step": 624940, "epoch": 7529} {"train_loss": -28.230085372924805, "global_step": 624941, "epoch": 7529} {"train_loss": -28.052865982055664, "global_step": 624942, "epoch": 7529} {"train_loss": -28.11445426940918, "global_step": 624943, "epoch": 7529} {"train_loss": -27.944351196289062, "global_step": 624944, "epoch": 7529} {"train_loss": -28.576581954956055, "global_step": 624945, "epoch": 7529} {"train_loss": -28.52972412109375, "global_step": 624946, "epoch": 7529} {"train_loss": -28.141571044921875, "global_step": 624947, "epoch": 7529} {"train_loss": -28.3195858001709, "global_step": 624948, "epoch": 7529} {"train_loss": -28.24383544921875, "global_step": 624949, "epoch": 7529} {"train_loss": -28.355621337890625, "global_step": 624950, "epoch": 7529} {"train_loss": -28.39898681640625, "global_step": 624951, "epoch": 7529} {"train_loss": -28.496280670166016, "global_step": 624952, "epoch": 7529} {"train_loss": -28.3680477142334, "global_step": 624953, "epoch": 7529} {"train_loss": -28.24220848083496, "global_step": 624954, "epoch": 7529} {"train_loss": -28.584897994995117, "global_step": 624955, "epoch": 7529} {"train_loss": -28.570892333984375, "global_step": 624956, "epoch": 7529} {"train_loss": -28.3597469329834, "global_step": 624957, "epoch": 7529} {"train_loss": -28.5511531829834, "global_step": 624958, "epoch": 7529} {"train_loss": -28.671695709228516, "global_step": 624959, "epoch": 7529} {"train_loss": -28.57655143737793, "global_step": 624960, "epoch": 7529} {"train_loss": -28.645465850830078, "global_step": 624961, "epoch": 7529} {"train_loss": -28.401350021362305, "global_step": 624962, "epoch": 7529} {"train_loss": -28.271451950073242, "global_step": 624963, "epoch": 7529} {"train_loss": -28.58332633972168, "global_step": 624964, "epoch": 7529} {"train_loss": -28.343122482299805, "global_step": 624965, "epoch": 7529} {"train_loss": -28.264448165893555, "global_step": 624966, "epoch": 7529} {"train_loss": -28.43549156188965, "global_step": 624967, "epoch": 7529} {"train_loss": -28.55741310119629, "global_step": 624968, "epoch": 7529} {"train_loss": -28.573698043823242, "global_step": 624969, "epoch": 7529} {"train_loss": -28.0513916015625, "global_step": 624970, "epoch": 7529} {"train_loss": -28.420623779296875, "global_step": 624971, "epoch": 7529} {"train_loss": -28.034177780151367, "global_step": 624972, "epoch": 7529} {"train_loss": -28.461139678955078, "global_step": 624973, "epoch": 7529} {"train_loss": -28.22943115234375, "global_step": 624974, "epoch": 7529} {"train_loss": -27.78615379333496, "global_step": 624975, "epoch": 7529} {"train_loss": -27.550745010375977, "global_step": 624976, "epoch": 7529} {"train_loss": -27.765241622924805, "global_step": 624977, "epoch": 7529} {"train_loss": -27.932769775390625, "global_step": 624978, "epoch": 7529} {"train_loss": -28.11005973815918, "global_step": 624979, "epoch": 7529} {"train_loss": -27.91232681274414, "global_step": 624980, "epoch": 7529} {"train_loss": -27.719345092773438, "global_step": 624981, "epoch": 7529} {"train_loss": -28.35393714904785, "global_step": 624982, "epoch": 7529} {"train_loss": -27.954137802124023, "global_step": 624983, "epoch": 7529} {"train_loss": -27.990766525268555, "global_step": 624984, "epoch": 7529} {"train_loss": -28.159921646118164, "global_step": 624985, "epoch": 7529} {"train_loss": -28.142419815063477, "global_step": 624986, "epoch": 7529} {"train_loss": -28.138166427612305, "global_step": 624987, "epoch": 7529} {"train_loss": -28.528919219970703, "global_step": 624988, "epoch": 7529} {"train_loss": -28.077468067766674, "global_step": 624989, "epoch": 7529, "val_loss": 6794268.0} {"train_loss": -27.27326774597168, "global_step": 624990, "epoch": 7530} {"train_loss": -27.21457290649414, "global_step": 624991, "epoch": 7530} {"train_loss": -27.171422958374023, "global_step": 624992, "epoch": 7530} {"train_loss": -27.464313507080078, "global_step": 624993, "epoch": 7530} {"train_loss": -27.40338134765625, "global_step": 624994, "epoch": 7530} {"train_loss": -27.525562286376953, "global_step": 624995, "epoch": 7530} {"train_loss": -27.33136558532715, "global_step": 624996, "epoch": 7530} {"train_loss": -27.453170776367188, "global_step": 624997, "epoch": 7530} {"train_loss": -27.107959747314453, "global_step": 624998, "epoch": 7530} {"train_loss": -27.36821937561035, "global_step": 624999, "epoch": 7530} {"train_loss": -27.7873477935791, "global_step": 625000, "epoch": 7530} {"train_loss": -27.063861846923828, "global_step": 625001, "epoch": 7530} {"train_loss": -28.136865615844727, "global_step": 625002, "epoch": 7530} {"train_loss": -27.65254020690918, "global_step": 625003, "epoch": 7530} {"train_loss": -27.620746612548828, "global_step": 625004, "epoch": 7530} {"train_loss": -27.429107666015625, "global_step": 625005, "epoch": 7530} {"train_loss": -27.434101104736328, "global_step": 625006, "epoch": 7530} {"train_loss": -27.92537498474121, "global_step": 625007, "epoch": 7530} {"train_loss": -27.711746215820312, "global_step": 625008, "epoch": 7530} {"train_loss": -27.8736515045166, "global_step": 625009, "epoch": 7530} {"train_loss": -27.778369903564453, "global_step": 625010, "epoch": 7530} {"train_loss": -27.7846622467041, "global_step": 625011, "epoch": 7530} {"train_loss": -27.73011589050293, "global_step": 625012, "epoch": 7530} {"train_loss": -28.217111587524414, "global_step": 625013, "epoch": 7530} {"train_loss": -27.832178115844727, "global_step": 625014, "epoch": 7530} {"train_loss": -27.52788734436035, "global_step": 625015, "epoch": 7530} {"train_loss": -27.741870880126953, "global_step": 625016, "epoch": 7530} {"train_loss": -27.81304931640625, "global_step": 625017, "epoch": 7530} {"train_loss": -27.931812286376953, "global_step": 625018, "epoch": 7530} {"train_loss": -28.173505783081055, "global_step": 625019, "epoch": 7530} {"train_loss": -27.649063110351562, "global_step": 625020, "epoch": 7530} {"train_loss": -27.947599411010742, "global_step": 625021, "epoch": 7530} {"train_loss": -28.18787956237793, "global_step": 625022, "epoch": 7530} {"train_loss": -27.928953170776367, "global_step": 625023, "epoch": 7530} {"train_loss": -27.727405548095703, "global_step": 625024, "epoch": 7530} {"train_loss": -28.010955810546875, "global_step": 625025, "epoch": 7530} {"train_loss": -28.221759796142578, "global_step": 625026, "epoch": 7530} {"train_loss": -28.19927406311035, "global_step": 625027, "epoch": 7530} {"train_loss": -27.83608055114746, "global_step": 625028, "epoch": 7530} {"train_loss": -27.998218536376953, "global_step": 625029, "epoch": 7530} {"train_loss": -28.174413681030273, "global_step": 625030, "epoch": 7530} {"train_loss": -28.304731369018555, "global_step": 625031, "epoch": 7530} {"train_loss": -28.1743221282959, "global_step": 625032, "epoch": 7530} {"train_loss": -28.38677406311035, "global_step": 625033, "epoch": 7530} {"train_loss": -28.27070426940918, "global_step": 625034, "epoch": 7530} {"train_loss": -28.44947624206543, "global_step": 625035, "epoch": 7530} {"train_loss": -28.40485191345215, "global_step": 625036, "epoch": 7530} {"train_loss": -28.430561065673828, "global_step": 625037, "epoch": 7530} {"train_loss": -28.283985137939453, "global_step": 625038, "epoch": 7530} {"train_loss": -28.47041130065918, "global_step": 625039, "epoch": 7530} {"train_loss": -28.334760665893555, "global_step": 625040, "epoch": 7530} {"train_loss": -28.460432052612305, "global_step": 625041, "epoch": 7530} {"train_loss": -28.560901641845703, "global_step": 625042, "epoch": 7530} {"train_loss": -28.359663009643555, "global_step": 625043, "epoch": 7530} {"train_loss": -28.220972061157227, "global_step": 625044, "epoch": 7530} {"train_loss": -27.935321807861328, "global_step": 625045, "epoch": 7530} {"train_loss": -28.219501495361328, "global_step": 625046, "epoch": 7530} {"train_loss": -28.225147247314453, "global_step": 625047, "epoch": 7530} {"train_loss": -28.44866371154785, "global_step": 625048, "epoch": 7530} {"train_loss": -28.537145614624023, "global_step": 625049, "epoch": 7530} {"train_loss": -28.227563858032227, "global_step": 625050, "epoch": 7530} {"train_loss": -28.69232177734375, "global_step": 625051, "epoch": 7530} {"train_loss": -28.21830177307129, "global_step": 625052, "epoch": 7530} {"train_loss": -28.142820358276367, "global_step": 625053, "epoch": 7530} {"train_loss": -28.034467697143555, "global_step": 625054, "epoch": 7530} {"train_loss": -28.46515464782715, "global_step": 625055, "epoch": 7530} {"train_loss": -28.156408309936523, "global_step": 625056, "epoch": 7530} {"train_loss": -28.40241050720215, "global_step": 625057, "epoch": 7530} {"train_loss": -28.828353881835938, "global_step": 625058, "epoch": 7530} {"train_loss": -28.63575553894043, "global_step": 625059, "epoch": 7530} {"train_loss": -28.319812774658203, "global_step": 625060, "epoch": 7530} {"train_loss": -28.363208770751953, "global_step": 625061, "epoch": 7530} {"train_loss": -28.152090072631836, "global_step": 625062, "epoch": 7530} {"train_loss": -28.48432731628418, "global_step": 625063, "epoch": 7530} {"train_loss": -28.545949935913086, "global_step": 625064, "epoch": 7530} {"train_loss": -28.435155868530273, "global_step": 625065, "epoch": 7530} {"train_loss": -28.316650390625, "global_step": 625066, "epoch": 7530} {"train_loss": -28.49488639831543, "global_step": 625067, "epoch": 7530} {"train_loss": -28.62982749938965, "global_step": 625068, "epoch": 7530} {"train_loss": -28.459228515625, "global_step": 625069, "epoch": 7530} {"train_loss": -28.130645751953125, "global_step": 625070, "epoch": 7530} {"train_loss": -28.142414093017578, "global_step": 625071, "epoch": 7530} {"train_loss": -28.030144335275672, "global_step": 625072, "epoch": 7530, "val_loss": 6924864.0} {"train_loss": -26.968427658081055, "global_step": 625073, "epoch": 7531} {"train_loss": -24.850547790527344, "global_step": 625074, "epoch": 7531} {"train_loss": -24.37556266784668, "global_step": 625075, "epoch": 7531} {"train_loss": -25.72686195373535, "global_step": 625076, "epoch": 7531} {"train_loss": -26.422794342041016, "global_step": 625077, "epoch": 7531} {"train_loss": -26.782367706298828, "global_step": 625078, "epoch": 7531} {"train_loss": -26.84320068359375, "global_step": 625079, "epoch": 7531} {"train_loss": -26.002288818359375, "global_step": 625080, "epoch": 7531} {"train_loss": -27.162687301635742, "global_step": 625081, "epoch": 7531} {"train_loss": -26.697839736938477, "global_step": 625082, "epoch": 7531} {"train_loss": -26.826807022094727, "global_step": 625083, "epoch": 7531} {"train_loss": -27.38897132873535, "global_step": 625084, "epoch": 7531} {"train_loss": -26.882322311401367, "global_step": 625085, "epoch": 7531} {"train_loss": -26.85869789123535, "global_step": 625086, "epoch": 7531} {"train_loss": -27.560049057006836, "global_step": 625087, "epoch": 7531} {"train_loss": -26.402942657470703, "global_step": 625088, "epoch": 7531} {"train_loss": -27.098596572875977, "global_step": 625089, "epoch": 7531} {"train_loss": -27.433568954467773, "global_step": 625090, "epoch": 7531} {"train_loss": -27.221914291381836, "global_step": 625091, "epoch": 7531} {"train_loss": -27.668485641479492, "global_step": 625092, "epoch": 7531} {"train_loss": -27.2059268951416, "global_step": 625093, "epoch": 7531} {"train_loss": -27.23371696472168, "global_step": 625094, "epoch": 7531} {"train_loss": -27.213354110717773, "global_step": 625095, "epoch": 7531} {"train_loss": -27.39007568359375, "global_step": 625096, "epoch": 7531} {"train_loss": -27.374134063720703, "global_step": 625097, "epoch": 7531} {"train_loss": -27.506759643554688, "global_step": 625098, "epoch": 7531} {"train_loss": -27.83289909362793, "global_step": 625099, "epoch": 7531} {"train_loss": -27.742816925048828, "global_step": 625100, "epoch": 7531} {"train_loss": -27.621047973632812, "global_step": 625101, "epoch": 7531} {"train_loss": -27.137983322143555, "global_step": 625102, "epoch": 7531} {"train_loss": -27.24448585510254, "global_step": 625103, "epoch": 7531} {"train_loss": -27.78443717956543, "global_step": 625104, "epoch": 7531} {"train_loss": -27.529382705688477, "global_step": 625105, "epoch": 7531} {"train_loss": -27.432605743408203, "global_step": 625106, "epoch": 7531} {"train_loss": -27.880163192749023, "global_step": 625107, "epoch": 7531} {"train_loss": -27.713958740234375, "global_step": 625108, "epoch": 7531} {"train_loss": -27.42864418029785, "global_step": 625109, "epoch": 7531} {"train_loss": -28.045766830444336, "global_step": 625110, "epoch": 7531} {"train_loss": -27.41705894470215, "global_step": 625111, "epoch": 7531} {"train_loss": -27.930692672729492, "global_step": 625112, "epoch": 7531} {"train_loss": -28.33643913269043, "global_step": 625113, "epoch": 7531} {"train_loss": -27.645605087280273, "global_step": 625114, "epoch": 7531} {"train_loss": -27.929706573486328, "global_step": 625115, "epoch": 7531} {"train_loss": -27.53192710876465, "global_step": 625116, "epoch": 7531} {"train_loss": -27.810001373291016, "global_step": 625117, "epoch": 7531} {"train_loss": -27.78045654296875, "global_step": 625118, "epoch": 7531} {"train_loss": -27.951507568359375, "global_step": 625119, "epoch": 7531} {"train_loss": -28.152158737182617, "global_step": 625120, "epoch": 7531} {"train_loss": -28.042211532592773, "global_step": 625121, "epoch": 7531} {"train_loss": -28.499576568603516, "global_step": 625122, "epoch": 7531} {"train_loss": -27.946807861328125, "global_step": 625123, "epoch": 7531} {"train_loss": -28.3177433013916, "global_step": 625124, "epoch": 7531} {"train_loss": -28.082372665405273, "global_step": 625125, "epoch": 7531} {"train_loss": -28.129108428955078, "global_step": 625126, "epoch": 7531} {"train_loss": -28.425281524658203, "global_step": 625127, "epoch": 7531} {"train_loss": -28.275039672851562, "global_step": 625128, "epoch": 7531} {"train_loss": -28.53496742248535, "global_step": 625129, "epoch": 7531} {"train_loss": -28.448322296142578, "global_step": 625130, "epoch": 7531} {"train_loss": -28.36872673034668, "global_step": 625131, "epoch": 7531} {"train_loss": -28.3714599609375, "global_step": 625132, "epoch": 7531} {"train_loss": -28.049346923828125, "global_step": 625133, "epoch": 7531} {"train_loss": -28.560108184814453, "global_step": 625134, "epoch": 7531} {"train_loss": -28.503931045532227, "global_step": 625135, "epoch": 7531} {"train_loss": -28.00739860534668, "global_step": 625136, "epoch": 7531} {"train_loss": -28.78803825378418, "global_step": 625137, "epoch": 7531} {"train_loss": -28.306507110595703, "global_step": 625138, "epoch": 7531} {"train_loss": -28.676549911499023, "global_step": 625139, "epoch": 7531} {"train_loss": -28.29230308532715, "global_step": 625140, "epoch": 7531} {"train_loss": -28.576745986938477, "global_step": 625141, "epoch": 7531} {"train_loss": -28.23310661315918, "global_step": 625142, "epoch": 7531} {"train_loss": -28.297948837280273, "global_step": 625143, "epoch": 7531} {"train_loss": -28.63335609436035, "global_step": 625144, "epoch": 7531} {"train_loss": -28.584716796875, "global_step": 625145, "epoch": 7531} {"train_loss": -28.602264404296875, "global_step": 625146, "epoch": 7531} {"train_loss": -28.418867111206055, "global_step": 625147, "epoch": 7531} {"train_loss": -28.106647491455078, "global_step": 625148, "epoch": 7531} {"train_loss": -28.395334243774414, "global_step": 625149, "epoch": 7531} {"train_loss": -28.539642333984375, "global_step": 625150, "epoch": 7531} {"train_loss": -28.466821670532227, "global_step": 625151, "epoch": 7531} {"train_loss": -28.525970458984375, "global_step": 625152, "epoch": 7531} {"train_loss": -28.898611068725586, "global_step": 625153, "epoch": 7531} {"train_loss": -28.520288467407227, "global_step": 625154, "epoch": 7531} {"train_loss": -27.71332320247788, "global_step": 625155, "epoch": 7531, "val_loss": 6849972.0} {"train_loss": -27.646024703979492, "global_step": 625156, "epoch": 7532} {"train_loss": -26.948251724243164, "global_step": 625157, "epoch": 7532} {"train_loss": -27.238983154296875, "global_step": 625158, "epoch": 7532} {"train_loss": -28.227941513061523, "global_step": 625159, "epoch": 7532} {"train_loss": -27.17215347290039, "global_step": 625160, "epoch": 7532} {"train_loss": -26.97145652770996, "global_step": 625161, "epoch": 7532} {"train_loss": -26.687952041625977, "global_step": 625162, "epoch": 7532} {"train_loss": -26.902496337890625, "global_step": 625163, "epoch": 7532} {"train_loss": -27.515506744384766, "global_step": 625164, "epoch": 7532} {"train_loss": -27.579669952392578, "global_step": 625165, "epoch": 7532} {"train_loss": -27.609704971313477, "global_step": 625166, "epoch": 7532} {"train_loss": -27.048303604125977, "global_step": 625167, "epoch": 7532} {"train_loss": -27.87253189086914, "global_step": 625168, "epoch": 7532} {"train_loss": -27.640472412109375, "global_step": 625169, "epoch": 7532} {"train_loss": -27.552661895751953, "global_step": 625170, "epoch": 7532} {"train_loss": -27.746850967407227, "global_step": 625171, "epoch": 7532} {"train_loss": -27.318668365478516, "global_step": 625172, "epoch": 7532} {"train_loss": -27.96407127380371, "global_step": 625173, "epoch": 7532} {"train_loss": -27.601627349853516, "global_step": 625174, "epoch": 7532} {"train_loss": -27.908491134643555, "global_step": 625175, "epoch": 7532} {"train_loss": -27.612390518188477, "global_step": 625176, "epoch": 7532} {"train_loss": -27.75980567932129, "global_step": 625177, "epoch": 7532} {"train_loss": -27.705703735351562, "global_step": 625178, "epoch": 7532} {"train_loss": -28.120777130126953, "global_step": 625179, "epoch": 7532} {"train_loss": -27.844757080078125, "global_step": 625180, "epoch": 7532} {"train_loss": -28.068506240844727, "global_step": 625181, "epoch": 7532} {"train_loss": -27.57319450378418, "global_step": 625182, "epoch": 7532} {"train_loss": -27.886754989624023, "global_step": 625183, "epoch": 7532} {"train_loss": -27.84396743774414, "global_step": 625184, "epoch": 7532} {"train_loss": -28.063268661499023, "global_step": 625185, "epoch": 7532} {"train_loss": -27.747547149658203, "global_step": 625186, "epoch": 7532} {"train_loss": -28.15260887145996, "global_step": 625187, "epoch": 7532} {"train_loss": -27.75092124938965, "global_step": 625188, "epoch": 7532} {"train_loss": -28.029693603515625, "global_step": 625189, "epoch": 7532} {"train_loss": -27.88374137878418, "global_step": 625190, "epoch": 7532} {"train_loss": -28.25028419494629, "global_step": 625191, "epoch": 7532} {"train_loss": -28.302738189697266, "global_step": 625192, "epoch": 7532} {"train_loss": -27.973302841186523, "global_step": 625193, "epoch": 7532} {"train_loss": -28.079938888549805, "global_step": 625194, "epoch": 7532} {"train_loss": -27.888565063476562, "global_step": 625195, "epoch": 7532} {"train_loss": -28.48943519592285, "global_step": 625196, "epoch": 7532} {"train_loss": -27.89625358581543, "global_step": 625197, "epoch": 7532} {"train_loss": -28.021703720092773, "global_step": 625198, "epoch": 7532} {"train_loss": -28.310510635375977, "global_step": 625199, "epoch": 7532} {"train_loss": -28.1760311126709, "global_step": 625200, "epoch": 7532} {"train_loss": -27.68166160583496, "global_step": 625201, "epoch": 7532} {"train_loss": -28.130462646484375, "global_step": 625202, "epoch": 7532} {"train_loss": -28.16596794128418, "global_step": 625203, "epoch": 7532} {"train_loss": -28.233591079711914, "global_step": 625204, "epoch": 7532} {"train_loss": -28.221967697143555, "global_step": 625205, "epoch": 7532} {"train_loss": -28.110876083374023, "global_step": 625206, "epoch": 7532} {"train_loss": -28.49981117248535, "global_step": 625207, "epoch": 7532} {"train_loss": -27.993850708007812, "global_step": 625208, "epoch": 7532} {"train_loss": -28.301923751831055, "global_step": 625209, "epoch": 7532} {"train_loss": -28.4515323638916, "global_step": 625210, "epoch": 7532} {"train_loss": -28.137104034423828, "global_step": 625211, "epoch": 7532} {"train_loss": -28.31013298034668, "global_step": 625212, "epoch": 7532} {"train_loss": -27.8794002532959, "global_step": 625213, "epoch": 7532} {"train_loss": -28.620031356811523, "global_step": 625214, "epoch": 7532} {"train_loss": -28.311603546142578, "global_step": 625215, "epoch": 7532} {"train_loss": -28.039648056030273, "global_step": 625216, "epoch": 7532} {"train_loss": -28.349658966064453, "global_step": 625217, "epoch": 7532} {"train_loss": -28.35516929626465, "global_step": 625218, "epoch": 7532} {"train_loss": -28.19195556640625, "global_step": 625219, "epoch": 7532} {"train_loss": -28.286819458007812, "global_step": 625220, "epoch": 7532} {"train_loss": -27.800430297851562, "global_step": 625221, "epoch": 7532} {"train_loss": -28.31399917602539, "global_step": 625222, "epoch": 7532} {"train_loss": -28.515527725219727, "global_step": 625223, "epoch": 7532} {"train_loss": -28.435022354125977, "global_step": 625224, "epoch": 7532} {"train_loss": -28.248661041259766, "global_step": 625225, "epoch": 7532} {"train_loss": -28.266189575195312, "global_step": 625226, "epoch": 7532} {"train_loss": -28.082763671875, "global_step": 625227, "epoch": 7532} {"train_loss": -28.627429962158203, "global_step": 625228, "epoch": 7532} {"train_loss": -27.946823120117188, "global_step": 625229, "epoch": 7532} {"train_loss": -28.049238204956055, "global_step": 625230, "epoch": 7532} {"train_loss": -28.2520694732666, "global_step": 625231, "epoch": 7532} {"train_loss": -28.364171981811523, "global_step": 625232, "epoch": 7532} {"train_loss": -28.04560661315918, "global_step": 625233, "epoch": 7532} {"train_loss": -28.121671676635742, "global_step": 625234, "epoch": 7532} {"train_loss": -28.08829689025879, "global_step": 625235, "epoch": 7532} {"train_loss": -28.32996940612793, "global_step": 625236, "epoch": 7532} {"train_loss": -28.186513900756836, "global_step": 625237, "epoch": 7532} {"train_loss": -27.947525713817182, "global_step": 625238, "epoch": 7532, "val_loss": 6830365.0} {"train_loss": -27.703022003173828, "global_step": 625239, "epoch": 7533} {"train_loss": -27.623090744018555, "global_step": 625240, "epoch": 7533} {"train_loss": -27.603286743164062, "global_step": 625241, "epoch": 7533} {"train_loss": -27.600229263305664, "global_step": 625242, "epoch": 7533} {"train_loss": -27.309833526611328, "global_step": 625243, "epoch": 7533} {"train_loss": -27.604578018188477, "global_step": 625244, "epoch": 7533} {"train_loss": -27.726388931274414, "global_step": 625245, "epoch": 7533} {"train_loss": -27.066669464111328, "global_step": 625246, "epoch": 7533} {"train_loss": -27.097944259643555, "global_step": 625247, "epoch": 7533} {"train_loss": -27.457443237304688, "global_step": 625248, "epoch": 7533} {"train_loss": -28.010395050048828, "global_step": 625249, "epoch": 7533} {"train_loss": -27.420639038085938, "global_step": 625250, "epoch": 7533} {"train_loss": -27.834463119506836, "global_step": 625251, "epoch": 7533} {"train_loss": -27.653562545776367, "global_step": 625252, "epoch": 7533} {"train_loss": -27.825183868408203, "global_step": 625253, "epoch": 7533} {"train_loss": -28.0123233795166, "global_step": 625254, "epoch": 7533} {"train_loss": -27.95427894592285, "global_step": 625255, "epoch": 7533} {"train_loss": -27.99335289001465, "global_step": 625256, "epoch": 7533} {"train_loss": -28.166791915893555, "global_step": 625257, "epoch": 7533} {"train_loss": -27.820484161376953, "global_step": 625258, "epoch": 7533} {"train_loss": -27.667434692382812, "global_step": 625259, "epoch": 7533} {"train_loss": -28.25758934020996, "global_step": 625260, "epoch": 7533} {"train_loss": -27.613996505737305, "global_step": 625261, "epoch": 7533} {"train_loss": -28.13654136657715, "global_step": 625262, "epoch": 7533} {"train_loss": -27.734695434570312, "global_step": 625263, "epoch": 7533} {"train_loss": -28.140731811523438, "global_step": 625264, "epoch": 7533} {"train_loss": -28.269397735595703, "global_step": 625265, "epoch": 7533} {"train_loss": -27.9023380279541, "global_step": 625266, "epoch": 7533} {"train_loss": -28.173913955688477, "global_step": 625267, "epoch": 7533} {"train_loss": -27.626789093017578, "global_step": 625268, "epoch": 7533} {"train_loss": -27.571683883666992, "global_step": 625269, "epoch": 7533} {"train_loss": -27.8288516998291, "global_step": 625270, "epoch": 7533} {"train_loss": -27.881591796875, "global_step": 625271, "epoch": 7533} {"train_loss": -28.133642196655273, "global_step": 625272, "epoch": 7533} {"train_loss": -28.242284774780273, "global_step": 625273, "epoch": 7533} {"train_loss": -27.966108322143555, "global_step": 625274, "epoch": 7533} {"train_loss": -28.04975700378418, "global_step": 625275, "epoch": 7533} {"train_loss": -28.516733169555664, "global_step": 625276, "epoch": 7533} {"train_loss": -28.045215606689453, "global_step": 625277, "epoch": 7533} {"train_loss": -28.4171085357666, "global_step": 625278, "epoch": 7533} {"train_loss": -28.31949234008789, "global_step": 625279, "epoch": 7533} {"train_loss": -28.405548095703125, "global_step": 625280, "epoch": 7533} {"train_loss": -28.050817489624023, "global_step": 625281, "epoch": 7533} {"train_loss": -28.282733917236328, "global_step": 625282, "epoch": 7533} {"train_loss": -27.9445858001709, "global_step": 625283, "epoch": 7533} {"train_loss": -28.278629302978516, "global_step": 625284, "epoch": 7533} {"train_loss": -28.338794708251953, "global_step": 625285, "epoch": 7533} {"train_loss": -28.4843807220459, "global_step": 625286, "epoch": 7533} {"train_loss": -28.250211715698242, "global_step": 625287, "epoch": 7533} {"train_loss": -28.165517807006836, "global_step": 625288, "epoch": 7533} {"train_loss": -28.145360946655273, "global_step": 625289, "epoch": 7533} {"train_loss": -28.464588165283203, "global_step": 625290, "epoch": 7533} {"train_loss": -28.700489044189453, "global_step": 625291, "epoch": 7533} {"train_loss": -28.012659072875977, "global_step": 625292, "epoch": 7533} {"train_loss": -28.268787384033203, "global_step": 625293, "epoch": 7533} {"train_loss": -28.132612228393555, "global_step": 625294, "epoch": 7533} {"train_loss": -28.34272575378418, "global_step": 625295, "epoch": 7533} {"train_loss": -28.003677368164062, "global_step": 625296, "epoch": 7533} {"train_loss": -27.851423263549805, "global_step": 625297, "epoch": 7533} {"train_loss": -27.9196834564209, "global_step": 625298, "epoch": 7533} {"train_loss": -28.114953994750977, "global_step": 625299, "epoch": 7533} {"train_loss": -28.109418869018555, "global_step": 625300, "epoch": 7533} {"train_loss": -27.690155029296875, "global_step": 625301, "epoch": 7533} {"train_loss": -27.894805908203125, "global_step": 625302, "epoch": 7533} {"train_loss": -28.249441146850586, "global_step": 625303, "epoch": 7533} {"train_loss": -27.559507369995117, "global_step": 625304, "epoch": 7533} {"train_loss": -27.731931686401367, "global_step": 625305, "epoch": 7533} {"train_loss": -27.596899032592773, "global_step": 625306, "epoch": 7533} {"train_loss": -27.668598175048828, "global_step": 625307, "epoch": 7533} {"train_loss": -27.98175621032715, "global_step": 625308, "epoch": 7533} {"train_loss": -27.719633102416992, "global_step": 625309, "epoch": 7533} {"train_loss": -27.773141860961914, "global_step": 625310, "epoch": 7533} {"train_loss": -28.232666015625, "global_step": 625311, "epoch": 7533} {"train_loss": -28.535547256469727, "global_step": 625312, "epoch": 7533} {"train_loss": -27.8612060546875, "global_step": 625313, "epoch": 7533} {"train_loss": -28.0212459564209, "global_step": 625314, "epoch": 7533} {"train_loss": -28.191125869750977, "global_step": 625315, "epoch": 7533} {"train_loss": -28.19422721862793, "global_step": 625316, "epoch": 7533} {"train_loss": -27.943265914916992, "global_step": 625317, "epoch": 7533} {"train_loss": -28.273212432861328, "global_step": 625318, "epoch": 7533} {"train_loss": -28.096094131469727, "global_step": 625319, "epoch": 7533} {"train_loss": -28.430456161499023, "global_step": 625320, "epoch": 7533} {"train_loss": -27.984208945768426, "global_step": 625321, "epoch": 7533, "val_loss": 6831564.0} {"train_loss": -27.52579116821289, "global_step": 625322, "epoch": 7534} {"train_loss": -27.923816680908203, "global_step": 625323, "epoch": 7534} {"train_loss": -27.56402015686035, "global_step": 625324, "epoch": 7534} {"train_loss": -27.86578941345215, "global_step": 625325, "epoch": 7534} {"train_loss": -27.2894229888916, "global_step": 625326, "epoch": 7534} {"train_loss": -27.749588012695312, "global_step": 625327, "epoch": 7534} {"train_loss": -27.481536865234375, "global_step": 625328, "epoch": 7534} {"train_loss": -27.246118545532227, "global_step": 625329, "epoch": 7534} {"train_loss": -27.544443130493164, "global_step": 625330, "epoch": 7534} {"train_loss": -27.940465927124023, "global_step": 625331, "epoch": 7534} {"train_loss": -27.49835777282715, "global_step": 625332, "epoch": 7534} {"train_loss": -28.033369064331055, "global_step": 625333, "epoch": 7534} {"train_loss": -27.987884521484375, "global_step": 625334, "epoch": 7534} {"train_loss": -27.7529296875, "global_step": 625335, "epoch": 7534} {"train_loss": -27.3492488861084, "global_step": 625336, "epoch": 7534} {"train_loss": -28.018253326416016, "global_step": 625337, "epoch": 7534} {"train_loss": -27.82625389099121, "global_step": 625338, "epoch": 7534} {"train_loss": -28.19473648071289, "global_step": 625339, "epoch": 7534} {"train_loss": -27.90120506286621, "global_step": 625340, "epoch": 7534} {"train_loss": -28.0135440826416, "global_step": 625341, "epoch": 7534} {"train_loss": -28.345645904541016, "global_step": 625342, "epoch": 7534} {"train_loss": -28.210988998413086, "global_step": 625343, "epoch": 7534} {"train_loss": -27.881336212158203, "global_step": 625344, "epoch": 7534} {"train_loss": -28.255502700805664, "global_step": 625345, "epoch": 7534} {"train_loss": -28.13312339782715, "global_step": 625346, "epoch": 7534} {"train_loss": -28.440753936767578, "global_step": 625347, "epoch": 7534} {"train_loss": -28.14813232421875, "global_step": 625348, "epoch": 7534} {"train_loss": -27.971099853515625, "global_step": 625349, "epoch": 7534} {"train_loss": -27.874805450439453, "global_step": 625350, "epoch": 7534} {"train_loss": -28.12363624572754, "global_step": 625351, "epoch": 7534} {"train_loss": -28.47005271911621, "global_step": 625352, "epoch": 7534} {"train_loss": -28.206506729125977, "global_step": 625353, "epoch": 7534} {"train_loss": -28.09739112854004, "global_step": 625354, "epoch": 7534} {"train_loss": -28.45145606994629, "global_step": 625355, "epoch": 7534} {"train_loss": -28.582538604736328, "global_step": 625356, "epoch": 7534} {"train_loss": -28.083786010742188, "global_step": 625357, "epoch": 7534} {"train_loss": -28.20416831970215, "global_step": 625358, "epoch": 7534} {"train_loss": -28.284412384033203, "global_step": 625359, "epoch": 7534} {"train_loss": -28.091909408569336, "global_step": 625360, "epoch": 7534} {"train_loss": -28.082815170288086, "global_step": 625361, "epoch": 7534} {"train_loss": -28.418121337890625, "global_step": 625362, "epoch": 7534} {"train_loss": -28.13614273071289, "global_step": 625363, "epoch": 7534} {"train_loss": -28.582046508789062, "global_step": 625364, "epoch": 7534} {"train_loss": -28.006681442260742, "global_step": 625365, "epoch": 7534} {"train_loss": -28.529340744018555, "global_step": 625366, "epoch": 7534} {"train_loss": -28.643957138061523, "global_step": 625367, "epoch": 7534} {"train_loss": -28.6252498626709, "global_step": 625368, "epoch": 7534} {"train_loss": -28.229894638061523, "global_step": 625369, "epoch": 7534} {"train_loss": -28.50721549987793, "global_step": 625370, "epoch": 7534} {"train_loss": -28.25238037109375, "global_step": 625371, "epoch": 7534} {"train_loss": -27.87664222717285, "global_step": 625372, "epoch": 7534} {"train_loss": -28.114118576049805, "global_step": 625373, "epoch": 7534} {"train_loss": -28.430526733398438, "global_step": 625374, "epoch": 7534} {"train_loss": -28.475141525268555, "global_step": 625375, "epoch": 7534} {"train_loss": -27.742938995361328, "global_step": 625376, "epoch": 7534} {"train_loss": -27.87935447692871, "global_step": 625377, "epoch": 7534} {"train_loss": -27.9700927734375, "global_step": 625378, "epoch": 7534} {"train_loss": -28.2839412689209, "global_step": 625379, "epoch": 7534} {"train_loss": -28.24262046813965, "global_step": 625380, "epoch": 7534} {"train_loss": -28.0926513671875, "global_step": 625381, "epoch": 7534} {"train_loss": -28.075063705444336, "global_step": 625382, "epoch": 7534} {"train_loss": -27.9130802154541, "global_step": 625383, "epoch": 7534} {"train_loss": -27.916715621948242, "global_step": 625384, "epoch": 7534} {"train_loss": -28.038959503173828, "global_step": 625385, "epoch": 7534} {"train_loss": -28.147674560546875, "global_step": 625386, "epoch": 7534} {"train_loss": -28.29219627380371, "global_step": 625387, "epoch": 7534} {"train_loss": -27.8237361907959, "global_step": 625388, "epoch": 7534} {"train_loss": -27.838760375976562, "global_step": 625389, "epoch": 7534} {"train_loss": -27.888708114624023, "global_step": 625390, "epoch": 7534} {"train_loss": -27.9227237701416, "global_step": 625391, "epoch": 7534} {"train_loss": -28.263174057006836, "global_step": 625392, "epoch": 7534} {"train_loss": -28.023889541625977, "global_step": 625393, "epoch": 7534} {"train_loss": -27.954809188842773, "global_step": 625394, "epoch": 7534} {"train_loss": -28.2591609954834, "global_step": 625395, "epoch": 7534} {"train_loss": -28.652875900268555, "global_step": 625396, "epoch": 7534} {"train_loss": -28.348093032836914, "global_step": 625397, "epoch": 7534} {"train_loss": -28.109817504882812, "global_step": 625398, "epoch": 7534} {"train_loss": -28.086008071899414, "global_step": 625399, "epoch": 7534} {"train_loss": -28.007156372070312, "global_step": 625400, "epoch": 7534} {"train_loss": -28.09523582458496, "global_step": 625401, "epoch": 7534} {"train_loss": -27.94545555114746, "global_step": 625402, "epoch": 7534} {"train_loss": -27.950773239135742, "global_step": 625403, "epoch": 7534} {"train_loss": -28.063099022371222, "global_step": 625404, "epoch": 7534, "val_loss": 6889417.0} {"train_loss": -27.096670150756836, "global_step": 625405, "epoch": 7535} {"train_loss": -27.349287033081055, "global_step": 625406, "epoch": 7535} {"train_loss": -26.85938835144043, "global_step": 625407, "epoch": 7535} {"train_loss": -27.758176803588867, "global_step": 625408, "epoch": 7535} {"train_loss": -26.899206161499023, "global_step": 625409, "epoch": 7535} {"train_loss": -26.63221549987793, "global_step": 625410, "epoch": 7535} {"train_loss": -27.5604305267334, "global_step": 625411, "epoch": 7535} {"train_loss": -27.552270889282227, "global_step": 625412, "epoch": 7535} {"train_loss": -27.35938835144043, "global_step": 625413, "epoch": 7535} {"train_loss": -27.064502716064453, "global_step": 625414, "epoch": 7535} {"train_loss": -27.23931312561035, "global_step": 625415, "epoch": 7535} {"train_loss": -26.744836807250977, "global_step": 625416, "epoch": 7535} {"train_loss": -27.48736572265625, "global_step": 625417, "epoch": 7535} {"train_loss": -26.904951095581055, "global_step": 625418, "epoch": 7535} {"train_loss": -27.40102195739746, "global_step": 625419, "epoch": 7535} {"train_loss": -27.247406005859375, "global_step": 625420, "epoch": 7535} {"train_loss": -27.561925888061523, "global_step": 625421, "epoch": 7535} {"train_loss": -27.24335289001465, "global_step": 625422, "epoch": 7535} {"train_loss": -27.41533851623535, "global_step": 625423, "epoch": 7535} {"train_loss": -27.559667587280273, "global_step": 625424, "epoch": 7535} {"train_loss": -28.039587020874023, "global_step": 625425, "epoch": 7535} {"train_loss": -27.699920654296875, "global_step": 625426, "epoch": 7535} {"train_loss": -27.2265682220459, "global_step": 625427, "epoch": 7535} {"train_loss": -27.7023868560791, "global_step": 625428, "epoch": 7535} {"train_loss": -27.97458267211914, "global_step": 625429, "epoch": 7535} {"train_loss": -27.248449325561523, "global_step": 625430, "epoch": 7535} {"train_loss": -27.825342178344727, "global_step": 625431, "epoch": 7535} {"train_loss": -27.846515655517578, "global_step": 625432, "epoch": 7535} {"train_loss": -27.806989669799805, "global_step": 625433, "epoch": 7535} {"train_loss": -27.94309425354004, "global_step": 625434, "epoch": 7535} {"train_loss": -28.208194732666016, "global_step": 625435, "epoch": 7535} {"train_loss": -27.980756759643555, "global_step": 625436, "epoch": 7535} {"train_loss": -27.828901290893555, "global_step": 625437, "epoch": 7535} {"train_loss": -27.8391056060791, "global_step": 625438, "epoch": 7535} {"train_loss": -28.0148868560791, "global_step": 625439, "epoch": 7535} {"train_loss": -28.000751495361328, "global_step": 625440, "epoch": 7535} {"train_loss": -27.6743221282959, "global_step": 625441, "epoch": 7535} {"train_loss": -27.862613677978516, "global_step": 625442, "epoch": 7535} {"train_loss": -28.3189640045166, "global_step": 625443, "epoch": 7535} {"train_loss": -28.000690460205078, "global_step": 625444, "epoch": 7535} {"train_loss": -28.045743942260742, "global_step": 625445, "epoch": 7535} {"train_loss": -28.1597843170166, "global_step": 625446, "epoch": 7535} {"train_loss": -28.132383346557617, "global_step": 625447, "epoch": 7535} {"train_loss": -28.480060577392578, "global_step": 625448, "epoch": 7535} {"train_loss": -28.20453453063965, "global_step": 625449, "epoch": 7535} {"train_loss": -28.283960342407227, "global_step": 625450, "epoch": 7535} {"train_loss": -28.263050079345703, "global_step": 625451, "epoch": 7535} {"train_loss": -28.62983512878418, "global_step": 625452, "epoch": 7535} {"train_loss": -28.53608512878418, "global_step": 625453, "epoch": 7535} {"train_loss": -27.9890193939209, "global_step": 625454, "epoch": 7535} {"train_loss": -28.243249893188477, "global_step": 625455, "epoch": 7535} {"train_loss": -28.409244537353516, "global_step": 625456, "epoch": 7535} {"train_loss": -28.282419204711914, "global_step": 625457, "epoch": 7535} {"train_loss": -27.8588809967041, "global_step": 625458, "epoch": 7535} {"train_loss": -28.249731063842773, "global_step": 625459, "epoch": 7535} {"train_loss": -28.150028228759766, "global_step": 625460, "epoch": 7535} {"train_loss": -28.307641983032227, "global_step": 625461, "epoch": 7535} {"train_loss": -28.023544311523438, "global_step": 625462, "epoch": 7535} {"train_loss": -28.25240135192871, "global_step": 625463, "epoch": 7535} {"train_loss": -28.44659423828125, "global_step": 625464, "epoch": 7535} {"train_loss": -28.602869033813477, "global_step": 625465, "epoch": 7535} {"train_loss": -28.184167861938477, "global_step": 625466, "epoch": 7535} {"train_loss": -28.496475219726562, "global_step": 625467, "epoch": 7535} {"train_loss": -28.33686637878418, "global_step": 625468, "epoch": 7535} {"train_loss": -28.438037872314453, "global_step": 625469, "epoch": 7535} {"train_loss": -28.219730377197266, "global_step": 625470, "epoch": 7535} {"train_loss": -28.55904197692871, "global_step": 625471, "epoch": 7535} {"train_loss": -28.626317977905273, "global_step": 625472, "epoch": 7535} {"train_loss": -28.2871150970459, "global_step": 625473, "epoch": 7535} {"train_loss": -28.49112892150879, "global_step": 625474, "epoch": 7535} {"train_loss": -28.400903701782227, "global_step": 625475, "epoch": 7535} {"train_loss": -28.378345489501953, "global_step": 625476, "epoch": 7535} {"train_loss": -28.08502769470215, "global_step": 625477, "epoch": 7535} {"train_loss": -28.308368682861328, "global_step": 625478, "epoch": 7535} {"train_loss": -28.640796661376953, "global_step": 625479, "epoch": 7535} {"train_loss": -27.94959831237793, "global_step": 625480, "epoch": 7535} {"train_loss": -28.2780818939209, "global_step": 625481, "epoch": 7535} {"train_loss": -28.711523056030273, "global_step": 625482, "epoch": 7535} {"train_loss": -28.382543563842773, "global_step": 625483, "epoch": 7535} {"train_loss": -28.133670806884766, "global_step": 625484, "epoch": 7535} {"train_loss": -28.237157821655273, "global_step": 625485, "epoch": 7535} {"train_loss": -28.359970092773438, "global_step": 625486, "epoch": 7535} {"train_loss": -27.932130606777697, "global_step": 625487, "epoch": 7535, "val_loss": 6815100.0} {"train_loss": -27.830896377563477, "global_step": 625488, "epoch": 7536} {"train_loss": -27.176319122314453, "global_step": 625489, "epoch": 7536} {"train_loss": -27.4979190826416, "global_step": 625490, "epoch": 7536} {"train_loss": -27.024066925048828, "global_step": 625491, "epoch": 7536} {"train_loss": -27.28785514831543, "global_step": 625492, "epoch": 7536} {"train_loss": -26.0551815032959, "global_step": 625493, "epoch": 7536} {"train_loss": -27.172225952148438, "global_step": 625494, "epoch": 7536} {"train_loss": -25.976011276245117, "global_step": 625495, "epoch": 7536} {"train_loss": -27.514083862304688, "global_step": 625496, "epoch": 7536} {"train_loss": -27.27410316467285, "global_step": 625497, "epoch": 7536} {"train_loss": -27.30030632019043, "global_step": 625498, "epoch": 7536} {"train_loss": -27.275257110595703, "global_step": 625499, "epoch": 7536} {"train_loss": -27.499597549438477, "global_step": 625500, "epoch": 7536} {"train_loss": -27.17731285095215, "global_step": 625501, "epoch": 7536} {"train_loss": -27.961658477783203, "global_step": 625502, "epoch": 7536} {"train_loss": -27.47382164001465, "global_step": 625503, "epoch": 7536} {"train_loss": -27.111257553100586, "global_step": 625504, "epoch": 7536} {"train_loss": -27.583267211914062, "global_step": 625505, "epoch": 7536} {"train_loss": -27.14584732055664, "global_step": 625506, "epoch": 7536} {"train_loss": -27.671743392944336, "global_step": 625507, "epoch": 7536} {"train_loss": -27.661746978759766, "global_step": 625508, "epoch": 7536} {"train_loss": -27.67597007751465, "global_step": 625509, "epoch": 7536} {"train_loss": -27.743764877319336, "global_step": 625510, "epoch": 7536} {"train_loss": -27.8469181060791, "global_step": 625511, "epoch": 7536} {"train_loss": -27.8232479095459, "global_step": 625512, "epoch": 7536} {"train_loss": -27.758115768432617, "global_step": 625513, "epoch": 7536} {"train_loss": -27.756793975830078, "global_step": 625514, "epoch": 7536} {"train_loss": -27.82333755493164, "global_step": 625515, "epoch": 7536} {"train_loss": -27.833471298217773, "global_step": 625516, "epoch": 7536} {"train_loss": -28.200849533081055, "global_step": 625517, "epoch": 7536} {"train_loss": -27.9573917388916, "global_step": 625518, "epoch": 7536} {"train_loss": -27.58905029296875, "global_step": 625519, "epoch": 7536} {"train_loss": -28.013479232788086, "global_step": 625520, "epoch": 7536} {"train_loss": -27.907087326049805, "global_step": 625521, "epoch": 7536} {"train_loss": -28.236902236938477, "global_step": 625522, "epoch": 7536} {"train_loss": -28.327260971069336, "global_step": 625523, "epoch": 7536} {"train_loss": -27.961938858032227, "global_step": 625524, "epoch": 7536} {"train_loss": -27.972991943359375, "global_step": 625525, "epoch": 7536} {"train_loss": -28.11494255065918, "global_step": 625526, "epoch": 7536} {"train_loss": -27.973922729492188, "global_step": 625527, "epoch": 7536} {"train_loss": -27.9847469329834, "global_step": 625528, "epoch": 7536} {"train_loss": -27.967639923095703, "global_step": 625529, "epoch": 7536} {"train_loss": -28.17926597595215, "global_step": 625530, "epoch": 7536} {"train_loss": -28.4234561920166, "global_step": 625531, "epoch": 7536} {"train_loss": -28.13569450378418, "global_step": 625532, "epoch": 7536} {"train_loss": -28.350915908813477, "global_step": 625533, "epoch": 7536} {"train_loss": -28.1372127532959, "global_step": 625534, "epoch": 7536} {"train_loss": -28.134119033813477, "global_step": 625535, "epoch": 7536} {"train_loss": -28.196613311767578, "global_step": 625536, "epoch": 7536} {"train_loss": -28.494394302368164, "global_step": 625537, "epoch": 7536} {"train_loss": -28.013385772705078, "global_step": 625538, "epoch": 7536} {"train_loss": -28.25387954711914, "global_step": 625539, "epoch": 7536} {"train_loss": -28.48890495300293, "global_step": 625540, "epoch": 7536} {"train_loss": -28.348541259765625, "global_step": 625541, "epoch": 7536} {"train_loss": -28.311243057250977, "global_step": 625542, "epoch": 7536} {"train_loss": -28.534231185913086, "global_step": 625543, "epoch": 7536} {"train_loss": -28.087427139282227, "global_step": 625544, "epoch": 7536} {"train_loss": -27.78583335876465, "global_step": 625545, "epoch": 7536} {"train_loss": -27.373077392578125, "global_step": 625546, "epoch": 7536} {"train_loss": -27.21462059020996, "global_step": 625547, "epoch": 7536} {"train_loss": -27.425968170166016, "global_step": 625548, "epoch": 7536} {"train_loss": -28.24961280822754, "global_step": 625549, "epoch": 7536} {"train_loss": -28.167959213256836, "global_step": 625550, "epoch": 7536} {"train_loss": -27.886627197265625, "global_step": 625551, "epoch": 7536} {"train_loss": -28.655866622924805, "global_step": 625552, "epoch": 7536} {"train_loss": -28.2056884765625, "global_step": 625553, "epoch": 7536} {"train_loss": -27.970367431640625, "global_step": 625554, "epoch": 7536} {"train_loss": -28.31599235534668, "global_step": 625555, "epoch": 7536} {"train_loss": -27.995935440063477, "global_step": 625556, "epoch": 7536} {"train_loss": -28.144214630126953, "global_step": 625557, "epoch": 7536} {"train_loss": -27.877429962158203, "global_step": 625558, "epoch": 7536} {"train_loss": -27.843347549438477, "global_step": 625559, "epoch": 7536} {"train_loss": -28.05902671813965, "global_step": 625560, "epoch": 7536} {"train_loss": -28.177234649658203, "global_step": 625561, "epoch": 7536} {"train_loss": -28.264108657836914, "global_step": 625562, "epoch": 7536} {"train_loss": -28.554590225219727, "global_step": 625563, "epoch": 7536} {"train_loss": -28.06487464904785, "global_step": 625564, "epoch": 7536} {"train_loss": -28.637313842773438, "global_step": 625565, "epoch": 7536} {"train_loss": -28.324787139892578, "global_step": 625566, "epoch": 7536} {"train_loss": -28.175771713256836, "global_step": 625567, "epoch": 7536} {"train_loss": -27.849573135375977, "global_step": 625568, "epoch": 7536} {"train_loss": -28.01881217956543, "global_step": 625569, "epoch": 7536} {"train_loss": -27.8672511089279, "global_step": 625570, "epoch": 7536, "val_loss": 6858763.0} {"train_loss": -27.348608016967773, "global_step": 625571, "epoch": 7537} {"train_loss": -27.620868682861328, "global_step": 625572, "epoch": 7537} {"train_loss": -27.413623809814453, "global_step": 625573, "epoch": 7537} {"train_loss": -27.73227310180664, "global_step": 625574, "epoch": 7537} {"train_loss": -27.449209213256836, "global_step": 625575, "epoch": 7537} {"train_loss": -27.77073097229004, "global_step": 625576, "epoch": 7537} {"train_loss": -27.598798751831055, "global_step": 625577, "epoch": 7537} {"train_loss": -27.80933952331543, "global_step": 625578, "epoch": 7537} {"train_loss": -27.664859771728516, "global_step": 625579, "epoch": 7537} {"train_loss": -27.65643310546875, "global_step": 625580, "epoch": 7537} {"train_loss": -27.74542808532715, "global_step": 625581, "epoch": 7537} {"train_loss": -27.541690826416016, "global_step": 625582, "epoch": 7537} {"train_loss": -27.92921257019043, "global_step": 625583, "epoch": 7537} {"train_loss": -27.90848159790039, "global_step": 625584, "epoch": 7537} {"train_loss": -27.843114852905273, "global_step": 625585, "epoch": 7537} {"train_loss": -28.013349533081055, "global_step": 625586, "epoch": 7537} {"train_loss": -27.929800033569336, "global_step": 625587, "epoch": 7537} {"train_loss": -27.999740600585938, "global_step": 625588, "epoch": 7537} {"train_loss": -28.177579879760742, "global_step": 625589, "epoch": 7537} {"train_loss": -28.26226234436035, "global_step": 625590, "epoch": 7537} {"train_loss": -28.39056396484375, "global_step": 625591, "epoch": 7537} {"train_loss": -27.812971115112305, "global_step": 625592, "epoch": 7537} {"train_loss": -28.12236976623535, "global_step": 625593, "epoch": 7537} {"train_loss": -28.252887725830078, "global_step": 625594, "epoch": 7537} {"train_loss": -28.14971351623535, "global_step": 625595, "epoch": 7537} {"train_loss": -28.2464542388916, "global_step": 625596, "epoch": 7537} {"train_loss": -28.310352325439453, "global_step": 625597, "epoch": 7537} {"train_loss": -28.357975006103516, "global_step": 625598, "epoch": 7537} {"train_loss": -28.22393798828125, "global_step": 625599, "epoch": 7537} {"train_loss": -27.783863067626953, "global_step": 625600, "epoch": 7537} {"train_loss": -28.15716552734375, "global_step": 625601, "epoch": 7537} {"train_loss": -27.885263442993164, "global_step": 625602, "epoch": 7537} {"train_loss": -28.373157501220703, "global_step": 625603, "epoch": 7537} {"train_loss": -28.43585205078125, "global_step": 625604, "epoch": 7537} {"train_loss": -27.80122184753418, "global_step": 625605, "epoch": 7537} {"train_loss": -28.29631996154785, "global_step": 625606, "epoch": 7537} {"train_loss": -28.09490966796875, "global_step": 625607, "epoch": 7537} {"train_loss": -27.96903419494629, "global_step": 625608, "epoch": 7537} {"train_loss": -28.182912826538086, "global_step": 625609, "epoch": 7537} {"train_loss": -28.292646408081055, "global_step": 625610, "epoch": 7537} {"train_loss": -28.132160186767578, "global_step": 625611, "epoch": 7537} {"train_loss": -28.161340713500977, "global_step": 625612, "epoch": 7537} {"train_loss": -28.113636016845703, "global_step": 625613, "epoch": 7537} {"train_loss": -27.998004913330078, "global_step": 625614, "epoch": 7537} {"train_loss": -28.075225830078125, "global_step": 625615, "epoch": 7537} {"train_loss": -27.9223690032959, "global_step": 625616, "epoch": 7537} {"train_loss": -28.466089248657227, "global_step": 625617, "epoch": 7537} {"train_loss": -28.58249282836914, "global_step": 625618, "epoch": 7537} {"train_loss": -28.24871253967285, "global_step": 625619, "epoch": 7537} {"train_loss": -28.016340255737305, "global_step": 625620, "epoch": 7537} {"train_loss": -28.314828872680664, "global_step": 625621, "epoch": 7537} {"train_loss": -28.393163681030273, "global_step": 625622, "epoch": 7537} {"train_loss": -28.357959747314453, "global_step": 625623, "epoch": 7537} {"train_loss": -28.310474395751953, "global_step": 625624, "epoch": 7537} {"train_loss": -28.2120304107666, "global_step": 625625, "epoch": 7537} {"train_loss": -28.139917373657227, "global_step": 625626, "epoch": 7537} {"train_loss": -27.76218605041504, "global_step": 625627, "epoch": 7537} {"train_loss": -27.36109733581543, "global_step": 625628, "epoch": 7537} {"train_loss": -28.08571434020996, "global_step": 625629, "epoch": 7537} {"train_loss": -27.88649559020996, "global_step": 625630, "epoch": 7537} {"train_loss": -28.154529571533203, "global_step": 625631, "epoch": 7537} {"train_loss": -27.886945724487305, "global_step": 625632, "epoch": 7537} {"train_loss": -28.285175323486328, "global_step": 625633, "epoch": 7537} {"train_loss": -28.236597061157227, "global_step": 625634, "epoch": 7537} {"train_loss": -28.307958602905273, "global_step": 625635, "epoch": 7537} {"train_loss": -28.485326766967773, "global_step": 625636, "epoch": 7537} {"train_loss": -28.4404239654541, "global_step": 625637, "epoch": 7537} {"train_loss": -28.314245223999023, "global_step": 625638, "epoch": 7537} {"train_loss": -28.4057559967041, "global_step": 625639, "epoch": 7537} {"train_loss": -28.23213768005371, "global_step": 625640, "epoch": 7537} {"train_loss": -28.227588653564453, "global_step": 625641, "epoch": 7537} {"train_loss": -28.156110763549805, "global_step": 625642, "epoch": 7537} {"train_loss": -28.475360870361328, "global_step": 625643, "epoch": 7537} {"train_loss": -28.03066062927246, "global_step": 625644, "epoch": 7537} {"train_loss": -28.1141300201416, "global_step": 625645, "epoch": 7537} {"train_loss": -28.28956413269043, "global_step": 625646, "epoch": 7537} {"train_loss": -28.147918701171875, "global_step": 625647, "epoch": 7537} {"train_loss": -28.415103912353516, "global_step": 625648, "epoch": 7537} {"train_loss": -28.5607852935791, "global_step": 625649, "epoch": 7537} {"train_loss": -28.39631462097168, "global_step": 625650, "epoch": 7537} {"train_loss": -27.8203067779541, "global_step": 625651, "epoch": 7537} {"train_loss": -28.195419311523438, "global_step": 625652, "epoch": 7537} {"train_loss": -28.07918741616858, "global_step": 625653, "epoch": 7537, "val_loss": 6827239.0} {"train_loss": -26.342565536499023, "global_step": 625654, "epoch": 7538} {"train_loss": -25.796255111694336, "global_step": 625655, "epoch": 7538} {"train_loss": -26.524850845336914, "global_step": 625656, "epoch": 7538} {"train_loss": -27.888629913330078, "global_step": 625657, "epoch": 7538} {"train_loss": -27.356855392456055, "global_step": 625658, "epoch": 7538} {"train_loss": -27.484113693237305, "global_step": 625659, "epoch": 7538} {"train_loss": -27.899438858032227, "global_step": 625660, "epoch": 7538} {"train_loss": -27.989709854125977, "global_step": 625661, "epoch": 7538} {"train_loss": -27.70149803161621, "global_step": 625662, "epoch": 7538} {"train_loss": -27.959035873413086, "global_step": 625663, "epoch": 7538} {"train_loss": -27.907373428344727, "global_step": 625664, "epoch": 7538} {"train_loss": -27.9244441986084, "global_step": 625665, "epoch": 7538} {"train_loss": -28.159494400024414, "global_step": 625666, "epoch": 7538} {"train_loss": -28.145843505859375, "global_step": 625667, "epoch": 7538} {"train_loss": -28.136343002319336, "global_step": 625668, "epoch": 7538} {"train_loss": -28.1878662109375, "global_step": 625669, "epoch": 7538} {"train_loss": -27.90109634399414, "global_step": 625670, "epoch": 7538} {"train_loss": -27.974836349487305, "global_step": 625671, "epoch": 7538} {"train_loss": -27.84125328063965, "global_step": 625672, "epoch": 7538} {"train_loss": -28.311384201049805, "global_step": 625673, "epoch": 7538} {"train_loss": -28.081323623657227, "global_step": 625674, "epoch": 7538} {"train_loss": -27.832792282104492, "global_step": 625675, "epoch": 7538} {"train_loss": -27.877344131469727, "global_step": 625676, "epoch": 7538} {"train_loss": -27.88933753967285, "global_step": 625677, "epoch": 7538} {"train_loss": -28.146087646484375, "global_step": 625678, "epoch": 7538} {"train_loss": -28.232358932495117, "global_step": 625679, "epoch": 7538} {"train_loss": -27.912946701049805, "global_step": 625680, "epoch": 7538} {"train_loss": -28.22004508972168, "global_step": 625681, "epoch": 7538} {"train_loss": -28.1837158203125, "global_step": 625682, "epoch": 7538} {"train_loss": -28.157184600830078, "global_step": 625683, "epoch": 7538} {"train_loss": -28.36966323852539, "global_step": 625684, "epoch": 7538} {"train_loss": -28.56355094909668, "global_step": 625685, "epoch": 7538} {"train_loss": -28.2360782623291, "global_step": 625686, "epoch": 7538} {"train_loss": -28.219823837280273, "global_step": 625687, "epoch": 7538} {"train_loss": -28.59492301940918, "global_step": 625688, "epoch": 7538} {"train_loss": -28.261005401611328, "global_step": 625689, "epoch": 7538} {"train_loss": -27.94696044921875, "global_step": 625690, "epoch": 7538} {"train_loss": -28.480871200561523, "global_step": 625691, "epoch": 7538} {"train_loss": -28.40118980407715, "global_step": 625692, "epoch": 7538} {"train_loss": -28.212751388549805, "global_step": 625693, "epoch": 7538} {"train_loss": -28.440916061401367, "global_step": 625694, "epoch": 7538} {"train_loss": -28.261045455932617, "global_step": 625695, "epoch": 7538} {"train_loss": -27.94315528869629, "global_step": 625696, "epoch": 7538} {"train_loss": -28.141544342041016, "global_step": 625697, "epoch": 7538} {"train_loss": -28.514490127563477, "global_step": 625698, "epoch": 7538} {"train_loss": -28.35955810546875, "global_step": 625699, "epoch": 7538} {"train_loss": -28.393747329711914, "global_step": 625700, "epoch": 7538} {"train_loss": -28.146203994750977, "global_step": 625701, "epoch": 7538} {"train_loss": -27.981815338134766, "global_step": 625702, "epoch": 7538} {"train_loss": -28.44843864440918, "global_step": 625703, "epoch": 7538} {"train_loss": -28.6096134185791, "global_step": 625704, "epoch": 7538} {"train_loss": -28.133325576782227, "global_step": 625705, "epoch": 7538} {"train_loss": -28.039581298828125, "global_step": 625706, "epoch": 7538} {"train_loss": -28.652372360229492, "global_step": 625707, "epoch": 7538} {"train_loss": -28.482648849487305, "global_step": 625708, "epoch": 7538} {"train_loss": -27.82014274597168, "global_step": 625709, "epoch": 7538} {"train_loss": -28.15376853942871, "global_step": 625710, "epoch": 7538} {"train_loss": -28.0938777923584, "global_step": 625711, "epoch": 7538} {"train_loss": -28.669301986694336, "global_step": 625712, "epoch": 7538} {"train_loss": -28.38226318359375, "global_step": 625713, "epoch": 7538} {"train_loss": -27.565649032592773, "global_step": 625714, "epoch": 7538} {"train_loss": -27.994674682617188, "global_step": 625715, "epoch": 7538} {"train_loss": -27.034320831298828, "global_step": 625716, "epoch": 7538} {"train_loss": -26.516935348510742, "global_step": 625717, "epoch": 7538} {"train_loss": -25.619665145874023, "global_step": 625718, "epoch": 7538} {"train_loss": -27.358854293823242, "global_step": 625719, "epoch": 7538} {"train_loss": -27.8403377532959, "global_step": 625720, "epoch": 7538} {"train_loss": -26.744598388671875, "global_step": 625721, "epoch": 7538} {"train_loss": -27.971017837524414, "global_step": 625722, "epoch": 7538} {"train_loss": -27.2459659576416, "global_step": 625723, "epoch": 7538} {"train_loss": -27.6490535736084, "global_step": 625724, "epoch": 7538} {"train_loss": -27.02888298034668, "global_step": 625725, "epoch": 7538} {"train_loss": -27.967016220092773, "global_step": 625726, "epoch": 7538} {"train_loss": -27.539661407470703, "global_step": 625727, "epoch": 7538} {"train_loss": -27.645627975463867, "global_step": 625728, "epoch": 7538} {"train_loss": -28.220916748046875, "global_step": 625729, "epoch": 7538} {"train_loss": -27.6545352935791, "global_step": 625730, "epoch": 7538} {"train_loss": -27.666961669921875, "global_step": 625731, "epoch": 7538} {"train_loss": -27.60930824279785, "global_step": 625732, "epoch": 7538} {"train_loss": -27.58404541015625, "global_step": 625733, "epoch": 7538} {"train_loss": -27.743383407592773, "global_step": 625734, "epoch": 7538} {"train_loss": -27.914289474487305, "global_step": 625735, "epoch": 7538} {"train_loss": -27.877696117722845, "global_step": 625736, "epoch": 7538, "val_loss": 6961031.5} {"train_loss": -26.868885040283203, "global_step": 625737, "epoch": 7539} {"train_loss": -26.731042861938477, "global_step": 625738, "epoch": 7539} {"train_loss": -27.643613815307617, "global_step": 625739, "epoch": 7539} {"train_loss": -26.1737060546875, "global_step": 625740, "epoch": 7539} {"train_loss": -26.279773712158203, "global_step": 625741, "epoch": 7539} {"train_loss": -27.194782257080078, "global_step": 625742, "epoch": 7539} {"train_loss": -26.058032989501953, "global_step": 625743, "epoch": 7539} {"train_loss": -27.177515029907227, "global_step": 625744, "epoch": 7539} {"train_loss": -26.56226921081543, "global_step": 625745, "epoch": 7539} {"train_loss": -26.57883071899414, "global_step": 625746, "epoch": 7539} {"train_loss": -27.17927360534668, "global_step": 625747, "epoch": 7539} {"train_loss": -27.118274688720703, "global_step": 625748, "epoch": 7539} {"train_loss": -27.553503036499023, "global_step": 625749, "epoch": 7539} {"train_loss": -27.409765243530273, "global_step": 625750, "epoch": 7539} {"train_loss": -27.550601959228516, "global_step": 625751, "epoch": 7539} {"train_loss": -27.34270668029785, "global_step": 625752, "epoch": 7539} {"train_loss": -26.750635147094727, "global_step": 625753, "epoch": 7539} {"train_loss": -27.78571128845215, "global_step": 625754, "epoch": 7539} {"train_loss": -27.619482040405273, "global_step": 625755, "epoch": 7539} {"train_loss": -27.280975341796875, "global_step": 625756, "epoch": 7539} {"train_loss": -27.507471084594727, "global_step": 625757, "epoch": 7539} {"train_loss": -27.49479103088379, "global_step": 625758, "epoch": 7539} {"train_loss": -27.64938735961914, "global_step": 625759, "epoch": 7539} {"train_loss": -27.9235782623291, "global_step": 625760, "epoch": 7539} {"train_loss": -27.714365005493164, "global_step": 625761, "epoch": 7539} {"train_loss": -27.903717041015625, "global_step": 625762, "epoch": 7539} {"train_loss": -27.713825225830078, "global_step": 625763, "epoch": 7539} {"train_loss": -27.59100914001465, "global_step": 625764, "epoch": 7539} {"train_loss": -27.765050888061523, "global_step": 625765, "epoch": 7539} {"train_loss": -28.200891494750977, "global_step": 625766, "epoch": 7539} {"train_loss": -28.14051628112793, "global_step": 625767, "epoch": 7539} {"train_loss": -27.994495391845703, "global_step": 625768, "epoch": 7539} {"train_loss": -28.212270736694336, "global_step": 625769, "epoch": 7539} {"train_loss": -28.06686782836914, "global_step": 625770, "epoch": 7539} {"train_loss": -28.065893173217773, "global_step": 625771, "epoch": 7539} {"train_loss": -27.929737091064453, "global_step": 625772, "epoch": 7539} {"train_loss": -28.22296142578125, "global_step": 625773, "epoch": 7539} {"train_loss": -28.038177490234375, "global_step": 625774, "epoch": 7539} {"train_loss": -27.923725128173828, "global_step": 625775, "epoch": 7539} {"train_loss": -28.077375411987305, "global_step": 625776, "epoch": 7539} {"train_loss": -28.146570205688477, "global_step": 625777, "epoch": 7539} {"train_loss": -28.1267032623291, "global_step": 625778, "epoch": 7539} {"train_loss": -28.001815795898438, "global_step": 625779, "epoch": 7539} {"train_loss": -28.018329620361328, "global_step": 625780, "epoch": 7539} {"train_loss": -28.458261489868164, "global_step": 625781, "epoch": 7539} {"train_loss": -28.286914825439453, "global_step": 625782, "epoch": 7539} {"train_loss": -28.696409225463867, "global_step": 625783, "epoch": 7539} {"train_loss": -28.228506088256836, "global_step": 625784, "epoch": 7539} {"train_loss": -28.013214111328125, "global_step": 625785, "epoch": 7539} {"train_loss": -28.586103439331055, "global_step": 625786, "epoch": 7539} {"train_loss": -28.00819969177246, "global_step": 625787, "epoch": 7539} {"train_loss": -28.49264907836914, "global_step": 625788, "epoch": 7539} {"train_loss": -28.332433700561523, "global_step": 625789, "epoch": 7539} {"train_loss": -27.873300552368164, "global_step": 625790, "epoch": 7539} {"train_loss": -27.94930076599121, "global_step": 625791, "epoch": 7539} {"train_loss": -28.338376998901367, "global_step": 625792, "epoch": 7539} {"train_loss": -28.328094482421875, "global_step": 625793, "epoch": 7539} {"train_loss": -28.389204025268555, "global_step": 625794, "epoch": 7539} {"train_loss": -28.390966415405273, "global_step": 625795, "epoch": 7539} {"train_loss": -28.388885498046875, "global_step": 625796, "epoch": 7539} {"train_loss": -28.304182052612305, "global_step": 625797, "epoch": 7539} {"train_loss": -28.240325927734375, "global_step": 625798, "epoch": 7539} {"train_loss": -27.986419677734375, "global_step": 625799, "epoch": 7539} {"train_loss": -28.36201286315918, "global_step": 625800, "epoch": 7539} {"train_loss": -28.27435874938965, "global_step": 625801, "epoch": 7539} {"train_loss": -28.172033309936523, "global_step": 625802, "epoch": 7539} {"train_loss": -28.03858757019043, "global_step": 625803, "epoch": 7539} {"train_loss": -28.739770889282227, "global_step": 625804, "epoch": 7539} {"train_loss": -28.33515739440918, "global_step": 625805, "epoch": 7539} {"train_loss": -28.443761825561523, "global_step": 625806, "epoch": 7539} {"train_loss": -28.36578369140625, "global_step": 625807, "epoch": 7539} {"train_loss": -28.04927635192871, "global_step": 625808, "epoch": 7539} {"train_loss": -28.37251091003418, "global_step": 625809, "epoch": 7539} {"train_loss": -28.280441284179688, "global_step": 625810, "epoch": 7539} {"train_loss": -28.565719604492188, "global_step": 625811, "epoch": 7539} {"train_loss": -28.337926864624023, "global_step": 625812, "epoch": 7539} {"train_loss": -28.649158477783203, "global_step": 625813, "epoch": 7539} {"train_loss": -28.4020938873291, "global_step": 625814, "epoch": 7539} {"train_loss": -28.213048934936523, "global_step": 625815, "epoch": 7539} {"train_loss": -28.247913360595703, "global_step": 625816, "epoch": 7539} {"train_loss": -28.140283584594727, "global_step": 625817, "epoch": 7539} {"train_loss": -28.691120147705078, "global_step": 625818, "epoch": 7539} {"train_loss": -27.89993511337832, "global_step": 625819, "epoch": 7539, "val_loss": 6716557.0} {"train_loss": -27.6231746673584, "global_step": 625820, "epoch": 7540} {"train_loss": -27.35009765625, "global_step": 625821, "epoch": 7540} {"train_loss": -27.081281661987305, "global_step": 625822, "epoch": 7540} {"train_loss": -27.201507568359375, "global_step": 625823, "epoch": 7540} {"train_loss": -27.053983688354492, "global_step": 625824, "epoch": 7540} {"train_loss": -27.9207706451416, "global_step": 625825, "epoch": 7540} {"train_loss": -27.5924129486084, "global_step": 625826, "epoch": 7540} {"train_loss": -27.976348876953125, "global_step": 625827, "epoch": 7540} {"train_loss": -27.732336044311523, "global_step": 625828, "epoch": 7540} {"train_loss": -27.910852432250977, "global_step": 625829, "epoch": 7540} {"train_loss": -27.127552032470703, "global_step": 625830, "epoch": 7540} {"train_loss": -27.239913940429688, "global_step": 625831, "epoch": 7540} {"train_loss": -27.879987716674805, "global_step": 625832, "epoch": 7540} {"train_loss": -27.389453887939453, "global_step": 625833, "epoch": 7540} {"train_loss": -27.62030601501465, "global_step": 625834, "epoch": 7540} {"train_loss": -27.76350975036621, "global_step": 625835, "epoch": 7540} {"train_loss": -26.921009063720703, "global_step": 625836, "epoch": 7540} {"train_loss": -27.5401554107666, "global_step": 625837, "epoch": 7540} {"train_loss": -27.639501571655273, "global_step": 625838, "epoch": 7540} {"train_loss": -27.679162979125977, "global_step": 625839, "epoch": 7540} {"train_loss": -27.8427734375, "global_step": 625840, "epoch": 7540} {"train_loss": -27.956893920898438, "global_step": 625841, "epoch": 7540} {"train_loss": -27.85967445373535, "global_step": 625842, "epoch": 7540} {"train_loss": -27.276498794555664, "global_step": 625843, "epoch": 7540} {"train_loss": -27.580066680908203, "global_step": 625844, "epoch": 7540} {"train_loss": -27.790082931518555, "global_step": 625845, "epoch": 7540} {"train_loss": -27.4473934173584, "global_step": 625846, "epoch": 7540} {"train_loss": -27.857938766479492, "global_step": 625847, "epoch": 7540} {"train_loss": -27.867883682250977, "global_step": 625848, "epoch": 7540} {"train_loss": -27.959918975830078, "global_step": 625849, "epoch": 7540} {"train_loss": -27.657470703125, "global_step": 625850, "epoch": 7540} {"train_loss": -27.8870849609375, "global_step": 625851, "epoch": 7540} {"train_loss": -28.01149559020996, "global_step": 625852, "epoch": 7540} {"train_loss": -27.86002540588379, "global_step": 625853, "epoch": 7540} {"train_loss": -28.0734806060791, "global_step": 625854, "epoch": 7540} {"train_loss": -27.91947364807129, "global_step": 625855, "epoch": 7540} {"train_loss": -28.114667892456055, "global_step": 625856, "epoch": 7540} {"train_loss": -28.326696395874023, "global_step": 625857, "epoch": 7540} {"train_loss": -28.33489418029785, "global_step": 625858, "epoch": 7540} {"train_loss": -28.749866485595703, "global_step": 625859, "epoch": 7540} {"train_loss": -28.270477294921875, "global_step": 625860, "epoch": 7540} {"train_loss": -28.140792846679688, "global_step": 625861, "epoch": 7540} {"train_loss": -28.091562271118164, "global_step": 625862, "epoch": 7540} {"train_loss": -28.23628044128418, "global_step": 625863, "epoch": 7540} {"train_loss": -28.256549835205078, "global_step": 625864, "epoch": 7540} {"train_loss": -28.641422271728516, "global_step": 625865, "epoch": 7540} {"train_loss": -28.39678955078125, "global_step": 625866, "epoch": 7540} {"train_loss": -28.1976375579834, "global_step": 625867, "epoch": 7540} {"train_loss": -28.317462921142578, "global_step": 625868, "epoch": 7540} {"train_loss": -28.121936798095703, "global_step": 625869, "epoch": 7540} {"train_loss": -28.35755729675293, "global_step": 625870, "epoch": 7540} {"train_loss": -28.1987247467041, "global_step": 625871, "epoch": 7540} {"train_loss": -28.270185470581055, "global_step": 625872, "epoch": 7540} {"train_loss": -28.500131607055664, "global_step": 625873, "epoch": 7540} {"train_loss": -28.406375885009766, "global_step": 625874, "epoch": 7540} {"train_loss": -27.935440063476562, "global_step": 625875, "epoch": 7540} {"train_loss": -28.1589412689209, "global_step": 625876, "epoch": 7540} {"train_loss": -28.328357696533203, "global_step": 625877, "epoch": 7540} {"train_loss": -28.035297393798828, "global_step": 625878, "epoch": 7540} {"train_loss": -28.037139892578125, "global_step": 625879, "epoch": 7540} {"train_loss": -28.237878799438477, "global_step": 625880, "epoch": 7540} {"train_loss": -28.148706436157227, "global_step": 625881, "epoch": 7540} {"train_loss": -28.362873077392578, "global_step": 625882, "epoch": 7540} {"train_loss": -28.41444206237793, "global_step": 625883, "epoch": 7540} {"train_loss": -28.12300682067871, "global_step": 625884, "epoch": 7540} {"train_loss": -28.06511878967285, "global_step": 625885, "epoch": 7540} {"train_loss": -28.12217140197754, "global_step": 625886, "epoch": 7540} {"train_loss": -28.02808952331543, "global_step": 625887, "epoch": 7540} {"train_loss": -28.06487464904785, "global_step": 625888, "epoch": 7540} {"train_loss": -27.8344783782959, "global_step": 625889, "epoch": 7540} {"train_loss": -28.492528915405273, "global_step": 625890, "epoch": 7540} {"train_loss": -28.015274047851562, "global_step": 625891, "epoch": 7540} {"train_loss": -27.568212509155273, "global_step": 625892, "epoch": 7540} {"train_loss": -28.141498565673828, "global_step": 625893, "epoch": 7540} {"train_loss": -28.10615348815918, "global_step": 625894, "epoch": 7540} {"train_loss": -27.66596031188965, "global_step": 625895, "epoch": 7540} {"train_loss": -28.392805099487305, "global_step": 625896, "epoch": 7540} {"train_loss": -27.924560546875, "global_step": 625897, "epoch": 7540} {"train_loss": -27.891998291015625, "global_step": 625898, "epoch": 7540} {"train_loss": -28.201208114624023, "global_step": 625899, "epoch": 7540} {"train_loss": -28.06536865234375, "global_step": 625900, "epoch": 7540} {"train_loss": -28.268402099609375, "global_step": 625901, "epoch": 7540} {"train_loss": -27.938920285328326, "global_step": 625902, "epoch": 7540, "val_loss": 6670003.0} {"train_loss": -25.955602645874023, "global_step": 625903, "epoch": 7541} {"train_loss": -25.37334632873535, "global_step": 625904, "epoch": 7541} {"train_loss": -24.963844299316406, "global_step": 625905, "epoch": 7541} {"train_loss": -25.299837112426758, "global_step": 625906, "epoch": 7541} {"train_loss": -25.775659561157227, "global_step": 625907, "epoch": 7541} {"train_loss": -25.7523136138916, "global_step": 625908, "epoch": 7541} {"train_loss": -26.32275390625, "global_step": 625909, "epoch": 7541} {"train_loss": -26.476505279541016, "global_step": 625910, "epoch": 7541} {"train_loss": -26.576635360717773, "global_step": 625911, "epoch": 7541} {"train_loss": -26.514347076416016, "global_step": 625912, "epoch": 7541} {"train_loss": -26.936182022094727, "global_step": 625913, "epoch": 7541} {"train_loss": -26.786991119384766, "global_step": 625914, "epoch": 7541} {"train_loss": -26.61750602722168, "global_step": 625915, "epoch": 7541} {"train_loss": -27.07709312438965, "global_step": 625916, "epoch": 7541} {"train_loss": -27.0697078704834, "global_step": 625917, "epoch": 7541} {"train_loss": -27.022506713867188, "global_step": 625918, "epoch": 7541} {"train_loss": -26.991605758666992, "global_step": 625919, "epoch": 7541} {"train_loss": -27.320911407470703, "global_step": 625920, "epoch": 7541} {"train_loss": -27.066883087158203, "global_step": 625921, "epoch": 7541} {"train_loss": -27.194482803344727, "global_step": 625922, "epoch": 7541} {"train_loss": -27.19880485534668, "global_step": 625923, "epoch": 7541} {"train_loss": -26.902936935424805, "global_step": 625924, "epoch": 7541} {"train_loss": -27.378137588500977, "global_step": 625925, "epoch": 7541} {"train_loss": -27.525617599487305, "global_step": 625926, "epoch": 7541} {"train_loss": -27.35220718383789, "global_step": 625927, "epoch": 7541} {"train_loss": -27.7680721282959, "global_step": 625928, "epoch": 7541} {"train_loss": -27.871021270751953, "global_step": 625929, "epoch": 7541} {"train_loss": -27.453046798706055, "global_step": 625930, "epoch": 7541} {"train_loss": -27.829694747924805, "global_step": 625931, "epoch": 7541} {"train_loss": -27.5779972076416, "global_step": 625932, "epoch": 7541} {"train_loss": -27.517541885375977, "global_step": 625933, "epoch": 7541} {"train_loss": -27.30510902404785, "global_step": 625934, "epoch": 7541} {"train_loss": -27.63205909729004, "global_step": 625935, "epoch": 7541} {"train_loss": -28.076679229736328, "global_step": 625936, "epoch": 7541} {"train_loss": -27.424055099487305, "global_step": 625937, "epoch": 7541} {"train_loss": -27.623605728149414, "global_step": 625938, "epoch": 7541} {"train_loss": -28.0920467376709, "global_step": 625939, "epoch": 7541} {"train_loss": -27.861194610595703, "global_step": 625940, "epoch": 7541} {"train_loss": -28.05133056640625, "global_step": 625941, "epoch": 7541} {"train_loss": -27.967761993408203, "global_step": 625942, "epoch": 7541} {"train_loss": -27.7268009185791, "global_step": 625943, "epoch": 7541} {"train_loss": -28.170530319213867, "global_step": 625944, "epoch": 7541} {"train_loss": -27.971471786499023, "global_step": 625945, "epoch": 7541} {"train_loss": -28.176528930664062, "global_step": 625946, "epoch": 7541} {"train_loss": -27.695798873901367, "global_step": 625947, "epoch": 7541} {"train_loss": -28.361547470092773, "global_step": 625948, "epoch": 7541} {"train_loss": -27.842939376831055, "global_step": 625949, "epoch": 7541} {"train_loss": -28.308984756469727, "global_step": 625950, "epoch": 7541} {"train_loss": -27.86150550842285, "global_step": 625951, "epoch": 7541} {"train_loss": -27.791738510131836, "global_step": 625952, "epoch": 7541} {"train_loss": -28.09113883972168, "global_step": 625953, "epoch": 7541} {"train_loss": -27.834585189819336, "global_step": 625954, "epoch": 7541} {"train_loss": -28.249860763549805, "global_step": 625955, "epoch": 7541} {"train_loss": -28.04608154296875, "global_step": 625956, "epoch": 7541} {"train_loss": -28.247915267944336, "global_step": 625957, "epoch": 7541} {"train_loss": -28.149911880493164, "global_step": 625958, "epoch": 7541} {"train_loss": -27.956384658813477, "global_step": 625959, "epoch": 7541} {"train_loss": -28.502038955688477, "global_step": 625960, "epoch": 7541} {"train_loss": -27.976709365844727, "global_step": 625961, "epoch": 7541} {"train_loss": -28.391992568969727, "global_step": 625962, "epoch": 7541} {"train_loss": -28.05287742614746, "global_step": 625963, "epoch": 7541} {"train_loss": -28.465381622314453, "global_step": 625964, "epoch": 7541} {"train_loss": -28.320730209350586, "global_step": 625965, "epoch": 7541} {"train_loss": -27.8245792388916, "global_step": 625966, "epoch": 7541} {"train_loss": -28.17897605895996, "global_step": 625967, "epoch": 7541} {"train_loss": -28.2779598236084, "global_step": 625968, "epoch": 7541} {"train_loss": -28.16718101501465, "global_step": 625969, "epoch": 7541} {"train_loss": -28.171512603759766, "global_step": 625970, "epoch": 7541} {"train_loss": -28.201635360717773, "global_step": 625971, "epoch": 7541} {"train_loss": -28.19341468811035, "global_step": 625972, "epoch": 7541} {"train_loss": -28.41509437561035, "global_step": 625973, "epoch": 7541} {"train_loss": -28.5031795501709, "global_step": 625974, "epoch": 7541} {"train_loss": -28.23556900024414, "global_step": 625975, "epoch": 7541} {"train_loss": -28.395584106445312, "global_step": 625976, "epoch": 7541} {"train_loss": -28.297616958618164, "global_step": 625977, "epoch": 7541} {"train_loss": -28.134021759033203, "global_step": 625978, "epoch": 7541} {"train_loss": -28.107349395751953, "global_step": 625979, "epoch": 7541} {"train_loss": -28.248865127563477, "global_step": 625980, "epoch": 7541} {"train_loss": -28.319135665893555, "global_step": 625981, "epoch": 7541} {"train_loss": -28.353702545166016, "global_step": 625982, "epoch": 7541} {"train_loss": -28.615575790405273, "global_step": 625983, "epoch": 7541} {"train_loss": -28.315185546875, "global_step": 625984, "epoch": 7541} {"train_loss": -27.627503613391553, "global_step": 625985, "epoch": 7541, "val_loss": 6817129.0} {"train_loss": -27.691558837890625, "global_step": 625986, "epoch": 7542} {"train_loss": -27.030805587768555, "global_step": 625987, "epoch": 7542} {"train_loss": -25.35645866394043, "global_step": 625988, "epoch": 7542} {"train_loss": -23.707977294921875, "global_step": 625989, "epoch": 7542} {"train_loss": -24.29681396484375, "global_step": 625990, "epoch": 7542} {"train_loss": -25.149187088012695, "global_step": 625991, "epoch": 7542} {"train_loss": -25.242807388305664, "global_step": 625992, "epoch": 7542} {"train_loss": -26.159894943237305, "global_step": 625993, "epoch": 7542} {"train_loss": -23.80640983581543, "global_step": 625994, "epoch": 7542} {"train_loss": -27.134979248046875, "global_step": 625995, "epoch": 7542} {"train_loss": -25.235387802124023, "global_step": 625996, "epoch": 7542} {"train_loss": -26.425262451171875, "global_step": 625997, "epoch": 7542} {"train_loss": -26.2144718170166, "global_step": 625998, "epoch": 7542} {"train_loss": -26.7884521484375, "global_step": 625999, "epoch": 7542} {"train_loss": -26.761585235595703, "global_step": 626000, "epoch": 7542} {"train_loss": -26.519989013671875, "global_step": 626001, "epoch": 7542} {"train_loss": -27.05500602722168, "global_step": 626002, "epoch": 7542} {"train_loss": -26.744428634643555, "global_step": 626003, "epoch": 7542} {"train_loss": -27.3199462890625, "global_step": 626004, "epoch": 7542} {"train_loss": -27.34792137145996, "global_step": 626005, "epoch": 7542} {"train_loss": -27.144330978393555, "global_step": 626006, "epoch": 7542} {"train_loss": -27.38197898864746, "global_step": 626007, "epoch": 7542} {"train_loss": -27.206628799438477, "global_step": 626008, "epoch": 7542} {"train_loss": -27.533737182617188, "global_step": 626009, "epoch": 7542} {"train_loss": -27.307769775390625, "global_step": 626010, "epoch": 7542} {"train_loss": -27.036331176757812, "global_step": 626011, "epoch": 7542} {"train_loss": -27.499048233032227, "global_step": 626012, "epoch": 7542} {"train_loss": -27.36158561706543, "global_step": 626013, "epoch": 7542} {"train_loss": -27.526235580444336, "global_step": 626014, "epoch": 7542} {"train_loss": -27.792142868041992, "global_step": 626015, "epoch": 7542} {"train_loss": -27.83534049987793, "global_step": 626016, "epoch": 7542} {"train_loss": -27.64740562438965, "global_step": 626017, "epoch": 7542} {"train_loss": -27.55158042907715, "global_step": 626018, "epoch": 7542} {"train_loss": -27.3392391204834, "global_step": 626019, "epoch": 7542} {"train_loss": -27.468704223632812, "global_step": 626020, "epoch": 7542} {"train_loss": -27.369001388549805, "global_step": 626021, "epoch": 7542} {"train_loss": -27.78525161743164, "global_step": 626022, "epoch": 7542} {"train_loss": -27.57337760925293, "global_step": 626023, "epoch": 7542} {"train_loss": -28.075475692749023, "global_step": 626024, "epoch": 7542} {"train_loss": -28.01154899597168, "global_step": 626025, "epoch": 7542} {"train_loss": -27.3282470703125, "global_step": 626026, "epoch": 7542} {"train_loss": -27.942426681518555, "global_step": 626027, "epoch": 7542} {"train_loss": -27.583852767944336, "global_step": 626028, "epoch": 7542} {"train_loss": -27.913965225219727, "global_step": 626029, "epoch": 7542} {"train_loss": -27.622129440307617, "global_step": 626030, "epoch": 7542} {"train_loss": -27.903812408447266, "global_step": 626031, "epoch": 7542} {"train_loss": -27.85658073425293, "global_step": 626032, "epoch": 7542} {"train_loss": -28.168012619018555, "global_step": 626033, "epoch": 7542} {"train_loss": -28.12432861328125, "global_step": 626034, "epoch": 7542} {"train_loss": -27.697711944580078, "global_step": 626035, "epoch": 7542} {"train_loss": -28.462268829345703, "global_step": 626036, "epoch": 7542} {"train_loss": -28.028573989868164, "global_step": 626037, "epoch": 7542} {"train_loss": -27.930219650268555, "global_step": 626038, "epoch": 7542} {"train_loss": -27.982030868530273, "global_step": 626039, "epoch": 7542} {"train_loss": -27.73891258239746, "global_step": 626040, "epoch": 7542} {"train_loss": -28.318700790405273, "global_step": 626041, "epoch": 7542} {"train_loss": -27.839582443237305, "global_step": 626042, "epoch": 7542} {"train_loss": -28.108747482299805, "global_step": 626043, "epoch": 7542} {"train_loss": -28.087574005126953, "global_step": 626044, "epoch": 7542} {"train_loss": -28.037952423095703, "global_step": 626045, "epoch": 7542} {"train_loss": -28.069433212280273, "global_step": 626046, "epoch": 7542} {"train_loss": -28.19953727722168, "global_step": 626047, "epoch": 7542} {"train_loss": -27.830175399780273, "global_step": 626048, "epoch": 7542} {"train_loss": -28.467824935913086, "global_step": 626049, "epoch": 7542} {"train_loss": -28.038129806518555, "global_step": 626050, "epoch": 7542} {"train_loss": -28.392181396484375, "global_step": 626051, "epoch": 7542} {"train_loss": -27.92681884765625, "global_step": 626052, "epoch": 7542} {"train_loss": -27.986042022705078, "global_step": 626053, "epoch": 7542} {"train_loss": -28.456619262695312, "global_step": 626054, "epoch": 7542} {"train_loss": -28.34417724609375, "global_step": 626055, "epoch": 7542} {"train_loss": -28.38380241394043, "global_step": 626056, "epoch": 7542} {"train_loss": -28.35292625427246, "global_step": 626057, "epoch": 7542} {"train_loss": -28.58182144165039, "global_step": 626058, "epoch": 7542} {"train_loss": -28.108774185180664, "global_step": 626059, "epoch": 7542} {"train_loss": -28.225605010986328, "global_step": 626060, "epoch": 7542} {"train_loss": -28.23282241821289, "global_step": 626061, "epoch": 7542} {"train_loss": -28.155603408813477, "global_step": 626062, "epoch": 7542} {"train_loss": -28.392459869384766, "global_step": 626063, "epoch": 7542} {"train_loss": -28.195865631103516, "global_step": 626064, "epoch": 7542} {"train_loss": -28.55134391784668, "global_step": 626065, "epoch": 7542} {"train_loss": -28.311376571655273, "global_step": 626066, "epoch": 7542} {"train_loss": -28.452686309814453, "global_step": 626067, "epoch": 7542} {"train_loss": -27.47568256883736, "global_step": 626068, "epoch": 7542, "val_loss": 6714981.0} {"train_loss": -27.13457679748535, "global_step": 626069, "epoch": 7543} {"train_loss": -27.465219497680664, "global_step": 626070, "epoch": 7543} {"train_loss": -27.7130184173584, "global_step": 626071, "epoch": 7543} {"train_loss": -27.383214950561523, "global_step": 626072, "epoch": 7543} {"train_loss": -27.610498428344727, "global_step": 626073, "epoch": 7543} {"train_loss": -27.628849029541016, "global_step": 626074, "epoch": 7543} {"train_loss": -27.566511154174805, "global_step": 626075, "epoch": 7543} {"train_loss": -27.56520652770996, "global_step": 626076, "epoch": 7543} {"train_loss": -26.999311447143555, "global_step": 626077, "epoch": 7543} {"train_loss": -27.69894790649414, "global_step": 626078, "epoch": 7543} {"train_loss": -27.71013832092285, "global_step": 626079, "epoch": 7543} {"train_loss": -27.377866744995117, "global_step": 626080, "epoch": 7543} {"train_loss": -27.881208419799805, "global_step": 626081, "epoch": 7543} {"train_loss": -27.332792282104492, "global_step": 626082, "epoch": 7543} {"train_loss": -27.953475952148438, "global_step": 626083, "epoch": 7543} {"train_loss": -27.61737060546875, "global_step": 626084, "epoch": 7543} {"train_loss": -27.751935958862305, "global_step": 626085, "epoch": 7543} {"train_loss": -27.69691276550293, "global_step": 626086, "epoch": 7543} {"train_loss": -27.994110107421875, "global_step": 626087, "epoch": 7543} {"train_loss": -28.196914672851562, "global_step": 626088, "epoch": 7543} {"train_loss": -27.992725372314453, "global_step": 626089, "epoch": 7543} {"train_loss": -27.82600212097168, "global_step": 626090, "epoch": 7543} {"train_loss": -27.868505477905273, "global_step": 626091, "epoch": 7543} {"train_loss": -28.240936279296875, "global_step": 626092, "epoch": 7543} {"train_loss": -28.0910587310791, "global_step": 626093, "epoch": 7543} {"train_loss": -27.854833602905273, "global_step": 626094, "epoch": 7543} {"train_loss": -28.089187622070312, "global_step": 626095, "epoch": 7543} {"train_loss": -28.260889053344727, "global_step": 626096, "epoch": 7543} {"train_loss": -28.443716049194336, "global_step": 626097, "epoch": 7543} {"train_loss": -28.2254638671875, "global_step": 626098, "epoch": 7543} {"train_loss": -27.661975860595703, "global_step": 626099, "epoch": 7543} {"train_loss": -27.992040634155273, "global_step": 626100, "epoch": 7543} {"train_loss": -28.180646896362305, "global_step": 626101, "epoch": 7543} {"train_loss": -28.36325454711914, "global_step": 626102, "epoch": 7543} {"train_loss": -27.881519317626953, "global_step": 626103, "epoch": 7543} {"train_loss": -28.014068603515625, "global_step": 626104, "epoch": 7543} {"train_loss": -28.0566463470459, "global_step": 626105, "epoch": 7543} {"train_loss": -28.08206558227539, "global_step": 626106, "epoch": 7543} {"train_loss": -28.199560165405273, "global_step": 626107, "epoch": 7543} {"train_loss": -28.081518173217773, "global_step": 626108, "epoch": 7543} {"train_loss": -28.21870231628418, "global_step": 626109, "epoch": 7543} {"train_loss": -28.278961181640625, "global_step": 626110, "epoch": 7543} {"train_loss": -28.594486236572266, "global_step": 626111, "epoch": 7543} {"train_loss": -27.781869888305664, "global_step": 626112, "epoch": 7543} {"train_loss": -28.267425537109375, "global_step": 626113, "epoch": 7543} {"train_loss": -28.68023681640625, "global_step": 626114, "epoch": 7543} {"train_loss": -28.34201431274414, "global_step": 626115, "epoch": 7543} {"train_loss": -28.36256217956543, "global_step": 626116, "epoch": 7543} {"train_loss": -28.039472579956055, "global_step": 626117, "epoch": 7543} {"train_loss": -28.610626220703125, "global_step": 626118, "epoch": 7543} {"train_loss": -28.32659339904785, "global_step": 626119, "epoch": 7543} {"train_loss": -28.256855010986328, "global_step": 626120, "epoch": 7543} {"train_loss": -28.344038009643555, "global_step": 626121, "epoch": 7543} {"train_loss": -28.56007957458496, "global_step": 626122, "epoch": 7543} {"train_loss": -28.548614501953125, "global_step": 626123, "epoch": 7543} {"train_loss": -28.616052627563477, "global_step": 626124, "epoch": 7543} {"train_loss": -28.106054306030273, "global_step": 626125, "epoch": 7543} {"train_loss": -28.340896606445312, "global_step": 626126, "epoch": 7543} {"train_loss": -28.756269454956055, "global_step": 626127, "epoch": 7543} {"train_loss": -28.339994430541992, "global_step": 626128, "epoch": 7543} {"train_loss": -28.34206199645996, "global_step": 626129, "epoch": 7543} {"train_loss": -28.230249404907227, "global_step": 626130, "epoch": 7543} {"train_loss": -28.244455337524414, "global_step": 626131, "epoch": 7543} {"train_loss": -27.88992691040039, "global_step": 626132, "epoch": 7543} {"train_loss": -28.381134033203125, "global_step": 626133, "epoch": 7543} {"train_loss": -28.235448837280273, "global_step": 626134, "epoch": 7543} {"train_loss": -28.314905166625977, "global_step": 626135, "epoch": 7543} {"train_loss": -28.22711181640625, "global_step": 626136, "epoch": 7543} {"train_loss": -28.63541603088379, "global_step": 626137, "epoch": 7543} {"train_loss": -28.43514060974121, "global_step": 626138, "epoch": 7543} {"train_loss": -28.531049728393555, "global_step": 626139, "epoch": 7543} {"train_loss": -28.636402130126953, "global_step": 626140, "epoch": 7543} {"train_loss": -28.487430572509766, "global_step": 626141, "epoch": 7543} {"train_loss": -28.77788734436035, "global_step": 626142, "epoch": 7543} {"train_loss": -28.472076416015625, "global_step": 626143, "epoch": 7543} {"train_loss": -28.16935157775879, "global_step": 626144, "epoch": 7543} {"train_loss": -28.415815353393555, "global_step": 626145, "epoch": 7543} {"train_loss": -28.504175186157227, "global_step": 626146, "epoch": 7543} {"train_loss": -28.357421875, "global_step": 626147, "epoch": 7543} {"train_loss": -28.086963653564453, "global_step": 626148, "epoch": 7543} {"train_loss": -28.239782333374023, "global_step": 626149, "epoch": 7543} {"train_loss": -28.003271102905273, "global_step": 626150, "epoch": 7543} {"train_loss": -28.09551652655544, "global_step": 626151, "epoch": 7543, "val_loss": 6762016.0} {"train_loss": -27.868824005126953, "global_step": 626152, "epoch": 7544} {"train_loss": -27.54730224609375, "global_step": 626153, "epoch": 7544} {"train_loss": -27.525487899780273, "global_step": 626154, "epoch": 7544} {"train_loss": -26.833694458007812, "global_step": 626155, "epoch": 7544} {"train_loss": -26.809728622436523, "global_step": 626156, "epoch": 7544} {"train_loss": -27.564489364624023, "global_step": 626157, "epoch": 7544} {"train_loss": -26.695575714111328, "global_step": 626158, "epoch": 7544} {"train_loss": -26.979557037353516, "global_step": 626159, "epoch": 7544} {"train_loss": -26.627166748046875, "global_step": 626160, "epoch": 7544} {"train_loss": -27.5297908782959, "global_step": 626161, "epoch": 7544} {"train_loss": -27.676809310913086, "global_step": 626162, "epoch": 7544} {"train_loss": -27.523462295532227, "global_step": 626163, "epoch": 7544} {"train_loss": -27.666555404663086, "global_step": 626164, "epoch": 7544} {"train_loss": -27.57221031188965, "global_step": 626165, "epoch": 7544} {"train_loss": -27.28277015686035, "global_step": 626166, "epoch": 7544} {"train_loss": -27.627262115478516, "global_step": 626167, "epoch": 7544} {"train_loss": -27.279394149780273, "global_step": 626168, "epoch": 7544} {"train_loss": -27.43674087524414, "global_step": 626169, "epoch": 7544} {"train_loss": -28.031208038330078, "global_step": 626170, "epoch": 7544} {"train_loss": -27.611780166625977, "global_step": 626171, "epoch": 7544} {"train_loss": -27.80269432067871, "global_step": 626172, "epoch": 7544} {"train_loss": -27.372100830078125, "global_step": 626173, "epoch": 7544} {"train_loss": -27.8966007232666, "global_step": 626174, "epoch": 7544} {"train_loss": -27.901824951171875, "global_step": 626175, "epoch": 7544} {"train_loss": -27.87452507019043, "global_step": 626176, "epoch": 7544} {"train_loss": -28.089385986328125, "global_step": 626177, "epoch": 7544} {"train_loss": -28.01959800720215, "global_step": 626178, "epoch": 7544} {"train_loss": -28.362817764282227, "global_step": 626179, "epoch": 7544} {"train_loss": -27.67508888244629, "global_step": 626180, "epoch": 7544} {"train_loss": -28.15669822692871, "global_step": 626181, "epoch": 7544} {"train_loss": -28.062946319580078, "global_step": 626182, "epoch": 7544} {"train_loss": -28.031280517578125, "global_step": 626183, "epoch": 7544} {"train_loss": -28.42685890197754, "global_step": 626184, "epoch": 7544} {"train_loss": -28.11835289001465, "global_step": 626185, "epoch": 7544} {"train_loss": -28.249114990234375, "global_step": 626186, "epoch": 7544} {"train_loss": -28.181232452392578, "global_step": 626187, "epoch": 7544} {"train_loss": -28.010517120361328, "global_step": 626188, "epoch": 7544} {"train_loss": -28.21144676208496, "global_step": 626189, "epoch": 7544} {"train_loss": -28.384143829345703, "global_step": 626190, "epoch": 7544} {"train_loss": -27.99896812438965, "global_step": 626191, "epoch": 7544} {"train_loss": -28.428430557250977, "global_step": 626192, "epoch": 7544} {"train_loss": -28.20513343811035, "global_step": 626193, "epoch": 7544} {"train_loss": -28.01741600036621, "global_step": 626194, "epoch": 7544} {"train_loss": -28.050107955932617, "global_step": 626195, "epoch": 7544} {"train_loss": -27.926420211791992, "global_step": 626196, "epoch": 7544} {"train_loss": -28.152225494384766, "global_step": 626197, "epoch": 7544} {"train_loss": -28.043272018432617, "global_step": 626198, "epoch": 7544} {"train_loss": -28.121429443359375, "global_step": 626199, "epoch": 7544} {"train_loss": -27.924909591674805, "global_step": 626200, "epoch": 7544} {"train_loss": -28.244688034057617, "global_step": 626201, "epoch": 7544} {"train_loss": -28.048852920532227, "global_step": 626202, "epoch": 7544} {"train_loss": -28.19637107849121, "global_step": 626203, "epoch": 7544} {"train_loss": -28.090967178344727, "global_step": 626204, "epoch": 7544} {"train_loss": -28.642505645751953, "global_step": 626205, "epoch": 7544} {"train_loss": -27.909021377563477, "global_step": 626206, "epoch": 7544} {"train_loss": -27.890527725219727, "global_step": 626207, "epoch": 7544} {"train_loss": -28.358732223510742, "global_step": 626208, "epoch": 7544} {"train_loss": -27.97175407409668, "global_step": 626209, "epoch": 7544} {"train_loss": -27.972925186157227, "global_step": 626210, "epoch": 7544} {"train_loss": -28.28952980041504, "global_step": 626211, "epoch": 7544} {"train_loss": -27.842260360717773, "global_step": 626212, "epoch": 7544} {"train_loss": -28.27803611755371, "global_step": 626213, "epoch": 7544} {"train_loss": -28.066150665283203, "global_step": 626214, "epoch": 7544} {"train_loss": -28.278162002563477, "global_step": 626215, "epoch": 7544} {"train_loss": -27.883808135986328, "global_step": 626216, "epoch": 7544} {"train_loss": -28.143705368041992, "global_step": 626217, "epoch": 7544} {"train_loss": -28.174829483032227, "global_step": 626218, "epoch": 7544} {"train_loss": -28.042057037353516, "global_step": 626219, "epoch": 7544} {"train_loss": -28.612842559814453, "global_step": 626220, "epoch": 7544} {"train_loss": -28.203283309936523, "global_step": 626221, "epoch": 7544} {"train_loss": -28.4160099029541, "global_step": 626222, "epoch": 7544} {"train_loss": -28.106760025024414, "global_step": 626223, "epoch": 7544} {"train_loss": -28.4536075592041, "global_step": 626224, "epoch": 7544} {"train_loss": -28.473331451416016, "global_step": 626225, "epoch": 7544} {"train_loss": -28.21759605407715, "global_step": 626226, "epoch": 7544} {"train_loss": -28.233036041259766, "global_step": 626227, "epoch": 7544} {"train_loss": -28.342792510986328, "global_step": 626228, "epoch": 7544} {"train_loss": -28.3407039642334, "global_step": 626229, "epoch": 7544} {"train_loss": -28.659107208251953, "global_step": 626230, "epoch": 7544} {"train_loss": -28.06585693359375, "global_step": 626231, "epoch": 7544} {"train_loss": -27.9915771484375, "global_step": 626232, "epoch": 7544} {"train_loss": -27.74152183532715, "global_step": 626233, "epoch": 7544} {"train_loss": -27.94515839542251, "global_step": 626234, "epoch": 7544, "val_loss": 6701773.5} {"train_loss": -27.54764747619629, "global_step": 626235, "epoch": 7545} {"train_loss": -27.405353546142578, "global_step": 626236, "epoch": 7545} {"train_loss": -26.822946548461914, "global_step": 626237, "epoch": 7545} {"train_loss": -27.228668212890625, "global_step": 626238, "epoch": 7545} {"train_loss": -27.6181583404541, "global_step": 626239, "epoch": 7545} {"train_loss": -27.107685089111328, "global_step": 626240, "epoch": 7545} {"train_loss": -27.484973907470703, "global_step": 626241, "epoch": 7545} {"train_loss": -28.00909996032715, "global_step": 626242, "epoch": 7545} {"train_loss": -27.430089950561523, "global_step": 626243, "epoch": 7545} {"train_loss": -27.263092041015625, "global_step": 626244, "epoch": 7545} {"train_loss": -28.409589767456055, "global_step": 626245, "epoch": 7545} {"train_loss": -27.981353759765625, "global_step": 626246, "epoch": 7545} {"train_loss": -27.725812911987305, "global_step": 626247, "epoch": 7545} {"train_loss": -27.98079490661621, "global_step": 626248, "epoch": 7545} {"train_loss": -27.988330841064453, "global_step": 626249, "epoch": 7545} {"train_loss": -27.753808975219727, "global_step": 626250, "epoch": 7545} {"train_loss": -28.017724990844727, "global_step": 626251, "epoch": 7545} {"train_loss": -27.43781089782715, "global_step": 626252, "epoch": 7545} {"train_loss": -28.034555435180664, "global_step": 626253, "epoch": 7545} {"train_loss": -27.81012535095215, "global_step": 626254, "epoch": 7545} {"train_loss": -27.918298721313477, "global_step": 626255, "epoch": 7545} {"train_loss": -27.850067138671875, "global_step": 626256, "epoch": 7545} {"train_loss": -27.7523136138916, "global_step": 626257, "epoch": 7545} {"train_loss": -28.00968360900879, "global_step": 626258, "epoch": 7545} {"train_loss": -27.580469131469727, "global_step": 626259, "epoch": 7545} {"train_loss": -28.02764892578125, "global_step": 626260, "epoch": 7545} {"train_loss": -27.824674606323242, "global_step": 626261, "epoch": 7545} {"train_loss": -28.116125106811523, "global_step": 626262, "epoch": 7545} {"train_loss": -27.675642013549805, "global_step": 626263, "epoch": 7545} {"train_loss": -27.7891788482666, "global_step": 626264, "epoch": 7545} {"train_loss": -28.045639038085938, "global_step": 626265, "epoch": 7545} {"train_loss": -27.7148494720459, "global_step": 626266, "epoch": 7545} {"train_loss": -28.062437057495117, "global_step": 626267, "epoch": 7545} {"train_loss": -28.0828800201416, "global_step": 626268, "epoch": 7545} {"train_loss": -28.091123580932617, "global_step": 626269, "epoch": 7545} {"train_loss": -27.931716918945312, "global_step": 626270, "epoch": 7545} {"train_loss": -28.264432907104492, "global_step": 626271, "epoch": 7545} {"train_loss": -27.682682037353516, "global_step": 626272, "epoch": 7545} {"train_loss": -28.445159912109375, "global_step": 626273, "epoch": 7545} {"train_loss": -28.11182975769043, "global_step": 626274, "epoch": 7545} {"train_loss": -28.269763946533203, "global_step": 626275, "epoch": 7545} {"train_loss": -28.287511825561523, "global_step": 626276, "epoch": 7545} {"train_loss": -28.164365768432617, "global_step": 626277, "epoch": 7545} {"train_loss": -28.468053817749023, "global_step": 626278, "epoch": 7545} {"train_loss": -28.36471939086914, "global_step": 626279, "epoch": 7545} {"train_loss": -28.43244743347168, "global_step": 626280, "epoch": 7545} {"train_loss": -28.262094497680664, "global_step": 626281, "epoch": 7545} {"train_loss": -28.00664710998535, "global_step": 626282, "epoch": 7545} {"train_loss": -28.44818115234375, "global_step": 626283, "epoch": 7545} {"train_loss": -28.097639083862305, "global_step": 626284, "epoch": 7545} {"train_loss": -28.107162475585938, "global_step": 626285, "epoch": 7545} {"train_loss": -28.519399642944336, "global_step": 626286, "epoch": 7545} {"train_loss": -28.369924545288086, "global_step": 626287, "epoch": 7545} {"train_loss": -27.98036003112793, "global_step": 626288, "epoch": 7545} {"train_loss": -28.5118465423584, "global_step": 626289, "epoch": 7545} {"train_loss": -27.962121963500977, "global_step": 626290, "epoch": 7545} {"train_loss": -28.209142684936523, "global_step": 626291, "epoch": 7545} {"train_loss": -28.188648223876953, "global_step": 626292, "epoch": 7545} {"train_loss": -28.4049129486084, "global_step": 626293, "epoch": 7545} {"train_loss": -28.20851707458496, "global_step": 626294, "epoch": 7545} {"train_loss": -27.576101303100586, "global_step": 626295, "epoch": 7545} {"train_loss": -28.532928466796875, "global_step": 626296, "epoch": 7545} {"train_loss": -27.91741371154785, "global_step": 626297, "epoch": 7545} {"train_loss": -28.21563720703125, "global_step": 626298, "epoch": 7545} {"train_loss": -28.03095054626465, "global_step": 626299, "epoch": 7545} {"train_loss": -28.295734405517578, "global_step": 626300, "epoch": 7545} {"train_loss": -27.838672637939453, "global_step": 626301, "epoch": 7545} {"train_loss": -28.5471248626709, "global_step": 626302, "epoch": 7545} {"train_loss": -28.014556884765625, "global_step": 626303, "epoch": 7545} {"train_loss": -28.18879508972168, "global_step": 626304, "epoch": 7545} {"train_loss": -27.894201278686523, "global_step": 626305, "epoch": 7545} {"train_loss": -27.571155548095703, "global_step": 626306, "epoch": 7545} {"train_loss": -27.943464279174805, "global_step": 626307, "epoch": 7545} {"train_loss": -27.932708740234375, "global_step": 626308, "epoch": 7545} {"train_loss": -28.463306427001953, "global_step": 626309, "epoch": 7545} {"train_loss": -27.989328384399414, "global_step": 626310, "epoch": 7545} {"train_loss": -28.3265380859375, "global_step": 626311, "epoch": 7545} {"train_loss": -28.649539947509766, "global_step": 626312, "epoch": 7545} {"train_loss": -28.09515953063965, "global_step": 626313, "epoch": 7545} {"train_loss": -27.96990394592285, "global_step": 626314, "epoch": 7545} {"train_loss": -28.14739990234375, "global_step": 626315, "epoch": 7545} {"train_loss": -28.6343936920166, "global_step": 626316, "epoch": 7545} {"train_loss": -28.013095373130707, "global_step": 626317, "epoch": 7545, "val_loss": 6728269.0} {"train_loss": -27.681243896484375, "global_step": 626318, "epoch": 7546} {"train_loss": -27.315143585205078, "global_step": 626319, "epoch": 7546} {"train_loss": -28.03584098815918, "global_step": 626320, "epoch": 7546} {"train_loss": -27.44510841369629, "global_step": 626321, "epoch": 7546} {"train_loss": -27.910888671875, "global_step": 626322, "epoch": 7546} {"train_loss": -27.05946159362793, "global_step": 626323, "epoch": 7546} {"train_loss": -27.31375503540039, "global_step": 626324, "epoch": 7546} {"train_loss": -28.17563247680664, "global_step": 626325, "epoch": 7546} {"train_loss": -27.34873390197754, "global_step": 626326, "epoch": 7546} {"train_loss": -28.21864128112793, "global_step": 626327, "epoch": 7546} {"train_loss": -27.821151733398438, "global_step": 626328, "epoch": 7546} {"train_loss": -27.570556640625, "global_step": 626329, "epoch": 7546} {"train_loss": -28.02900505065918, "global_step": 626330, "epoch": 7546} {"train_loss": -27.732507705688477, "global_step": 626331, "epoch": 7546} {"train_loss": -27.6049747467041, "global_step": 626332, "epoch": 7546} {"train_loss": -28.094640731811523, "global_step": 626333, "epoch": 7546} {"train_loss": -27.870193481445312, "global_step": 626334, "epoch": 7546} {"train_loss": -28.040937423706055, "global_step": 626335, "epoch": 7546} {"train_loss": -27.848730087280273, "global_step": 626336, "epoch": 7546} {"train_loss": -28.29722023010254, "global_step": 626337, "epoch": 7546} {"train_loss": -27.859790802001953, "global_step": 626338, "epoch": 7546} {"train_loss": -27.9217586517334, "global_step": 626339, "epoch": 7546} {"train_loss": -28.1827392578125, "global_step": 626340, "epoch": 7546} {"train_loss": -28.094701766967773, "global_step": 626341, "epoch": 7546} {"train_loss": -27.7773380279541, "global_step": 626342, "epoch": 7546} {"train_loss": -28.0639591217041, "global_step": 626343, "epoch": 7546} {"train_loss": -28.25227165222168, "global_step": 626344, "epoch": 7546} {"train_loss": -28.324331283569336, "global_step": 626345, "epoch": 7546} {"train_loss": -28.20647621154785, "global_step": 626346, "epoch": 7546} {"train_loss": -28.08831787109375, "global_step": 626347, "epoch": 7546} {"train_loss": -28.135339736938477, "global_step": 626348, "epoch": 7546} {"train_loss": -28.03611183166504, "global_step": 626349, "epoch": 7546} {"train_loss": -28.174055099487305, "global_step": 626350, "epoch": 7546} {"train_loss": -28.186904907226562, "global_step": 626351, "epoch": 7546} {"train_loss": -28.082395553588867, "global_step": 626352, "epoch": 7546} {"train_loss": -28.32789421081543, "global_step": 626353, "epoch": 7546} {"train_loss": -28.145282745361328, "global_step": 626354, "epoch": 7546} {"train_loss": -28.120410919189453, "global_step": 626355, "epoch": 7546} {"train_loss": -28.363859176635742, "global_step": 626356, "epoch": 7546} {"train_loss": -28.35293960571289, "global_step": 626357, "epoch": 7546} {"train_loss": -28.263015747070312, "global_step": 626358, "epoch": 7546} {"train_loss": -27.908803939819336, "global_step": 626359, "epoch": 7546} {"train_loss": -28.278425216674805, "global_step": 626360, "epoch": 7546} {"train_loss": -28.005294799804688, "global_step": 626361, "epoch": 7546} {"train_loss": -27.84138298034668, "global_step": 626362, "epoch": 7546} {"train_loss": -27.78927993774414, "global_step": 626363, "epoch": 7546} {"train_loss": -28.163732528686523, "global_step": 626364, "epoch": 7546} {"train_loss": -28.411001205444336, "global_step": 626365, "epoch": 7546} {"train_loss": -28.510705947875977, "global_step": 626366, "epoch": 7546} {"train_loss": -28.31695556640625, "global_step": 626367, "epoch": 7546} {"train_loss": -28.802717208862305, "global_step": 626368, "epoch": 7546} {"train_loss": -28.465986251831055, "global_step": 626369, "epoch": 7546} {"train_loss": -28.05817985534668, "global_step": 626370, "epoch": 7546} {"train_loss": -28.2353572845459, "global_step": 626371, "epoch": 7546} {"train_loss": -28.226947784423828, "global_step": 626372, "epoch": 7546} {"train_loss": -28.303781509399414, "global_step": 626373, "epoch": 7546} {"train_loss": -28.60511589050293, "global_step": 626374, "epoch": 7546} {"train_loss": -28.390827178955078, "global_step": 626375, "epoch": 7546} {"train_loss": -28.3399658203125, "global_step": 626376, "epoch": 7546} {"train_loss": -28.33582878112793, "global_step": 626377, "epoch": 7546} {"train_loss": -28.102521896362305, "global_step": 626378, "epoch": 7546} {"train_loss": -27.87091636657715, "global_step": 626379, "epoch": 7546} {"train_loss": -27.562850952148438, "global_step": 626380, "epoch": 7546} {"train_loss": -27.965253829956055, "global_step": 626381, "epoch": 7546} {"train_loss": -28.307031631469727, "global_step": 626382, "epoch": 7546} {"train_loss": -28.208356857299805, "global_step": 626383, "epoch": 7546} {"train_loss": -27.92301368713379, "global_step": 626384, "epoch": 7546} {"train_loss": -28.436620712280273, "global_step": 626385, "epoch": 7546} {"train_loss": -28.09003257751465, "global_step": 626386, "epoch": 7546} {"train_loss": -27.992414474487305, "global_step": 626387, "epoch": 7546} {"train_loss": -28.124738693237305, "global_step": 626388, "epoch": 7546} {"train_loss": -28.199071884155273, "global_step": 626389, "epoch": 7546} {"train_loss": -27.834857940673828, "global_step": 626390, "epoch": 7546} {"train_loss": -28.379627227783203, "global_step": 626391, "epoch": 7546} {"train_loss": -28.214664459228516, "global_step": 626392, "epoch": 7546} {"train_loss": -28.06671142578125, "global_step": 626393, "epoch": 7546} {"train_loss": -27.942243576049805, "global_step": 626394, "epoch": 7546} {"train_loss": -28.052932739257812, "global_step": 626395, "epoch": 7546} {"train_loss": -28.030378341674805, "global_step": 626396, "epoch": 7546} {"train_loss": -28.136016845703125, "global_step": 626397, "epoch": 7546} {"train_loss": -28.320545196533203, "global_step": 626398, "epoch": 7546} {"train_loss": -28.031723022460938, "global_step": 626399, "epoch": 7546} {"train_loss": -28.060956771115222, "global_step": 626400, "epoch": 7546, "val_loss": 6702854.0} {"train_loss": -27.462757110595703, "global_step": 626401, "epoch": 7547} {"train_loss": -27.225255966186523, "global_step": 626402, "epoch": 7547} {"train_loss": -27.168567657470703, "global_step": 626403, "epoch": 7547} {"train_loss": -27.54215431213379, "global_step": 626404, "epoch": 7547} {"train_loss": -27.913137435913086, "global_step": 626405, "epoch": 7547} {"train_loss": -27.369922637939453, "global_step": 626406, "epoch": 7547} {"train_loss": -27.787948608398438, "global_step": 626407, "epoch": 7547} {"train_loss": -27.969451904296875, "global_step": 626408, "epoch": 7547} {"train_loss": -27.17047119140625, "global_step": 626409, "epoch": 7547} {"train_loss": -27.820755004882812, "global_step": 626410, "epoch": 7547} {"train_loss": -27.823583602905273, "global_step": 626411, "epoch": 7547} {"train_loss": -28.2923641204834, "global_step": 626412, "epoch": 7547} {"train_loss": -28.05665397644043, "global_step": 626413, "epoch": 7547} {"train_loss": -28.038480758666992, "global_step": 626414, "epoch": 7547} {"train_loss": -28.14449119567871, "global_step": 626415, "epoch": 7547} {"train_loss": -27.94757652282715, "global_step": 626416, "epoch": 7547} {"train_loss": -27.872167587280273, "global_step": 626417, "epoch": 7547} {"train_loss": -28.258895874023438, "global_step": 626418, "epoch": 7547} {"train_loss": -27.971235275268555, "global_step": 626419, "epoch": 7547} {"train_loss": -27.844501495361328, "global_step": 626420, "epoch": 7547} {"train_loss": -28.038818359375, "global_step": 626421, "epoch": 7547} {"train_loss": -27.905288696289062, "global_step": 626422, "epoch": 7547} {"train_loss": -28.10188865661621, "global_step": 626423, "epoch": 7547} {"train_loss": -28.121896743774414, "global_step": 626424, "epoch": 7547} {"train_loss": -28.449735641479492, "global_step": 626425, "epoch": 7547} {"train_loss": -28.595947265625, "global_step": 626426, "epoch": 7547} {"train_loss": -27.891305923461914, "global_step": 626427, "epoch": 7547} {"train_loss": -28.128686904907227, "global_step": 626428, "epoch": 7547} {"train_loss": -28.326904296875, "global_step": 626429, "epoch": 7547} {"train_loss": -28.248327255249023, "global_step": 626430, "epoch": 7547} {"train_loss": -28.1103458404541, "global_step": 626431, "epoch": 7547} {"train_loss": -28.230213165283203, "global_step": 626432, "epoch": 7547} {"train_loss": -28.047760009765625, "global_step": 626433, "epoch": 7547} {"train_loss": -28.332326889038086, "global_step": 626434, "epoch": 7547} {"train_loss": -28.304189682006836, "global_step": 626435, "epoch": 7547} {"train_loss": -28.354389190673828, "global_step": 626436, "epoch": 7547} {"train_loss": -27.884946823120117, "global_step": 626437, "epoch": 7547} {"train_loss": -28.029062271118164, "global_step": 626438, "epoch": 7547} {"train_loss": -27.62184715270996, "global_step": 626439, "epoch": 7547} {"train_loss": -28.06430435180664, "global_step": 626440, "epoch": 7547} {"train_loss": -28.336145401000977, "global_step": 626441, "epoch": 7547} {"train_loss": -27.8387451171875, "global_step": 626442, "epoch": 7547} {"train_loss": -28.378265380859375, "global_step": 626443, "epoch": 7547} {"train_loss": -28.43585205078125, "global_step": 626444, "epoch": 7547} {"train_loss": -28.531042098999023, "global_step": 626445, "epoch": 7547} {"train_loss": -28.210113525390625, "global_step": 626446, "epoch": 7547} {"train_loss": -28.29050064086914, "global_step": 626447, "epoch": 7547} {"train_loss": -28.41647720336914, "global_step": 626448, "epoch": 7547} {"train_loss": -28.00812339782715, "global_step": 626449, "epoch": 7547} {"train_loss": -28.242694854736328, "global_step": 626450, "epoch": 7547} {"train_loss": -28.2747859954834, "global_step": 626451, "epoch": 7547} {"train_loss": -28.311344146728516, "global_step": 626452, "epoch": 7547} {"train_loss": -28.20515251159668, "global_step": 626453, "epoch": 7547} {"train_loss": -28.420886993408203, "global_step": 626454, "epoch": 7547} {"train_loss": -28.4044246673584, "global_step": 626455, "epoch": 7547} {"train_loss": -28.474029541015625, "global_step": 626456, "epoch": 7547} {"train_loss": -28.315881729125977, "global_step": 626457, "epoch": 7547} {"train_loss": -28.351181030273438, "global_step": 626458, "epoch": 7547} {"train_loss": -28.60096549987793, "global_step": 626459, "epoch": 7547} {"train_loss": -28.956069946289062, "global_step": 626460, "epoch": 7547} {"train_loss": -28.217920303344727, "global_step": 626461, "epoch": 7547} {"train_loss": -28.60053062438965, "global_step": 626462, "epoch": 7547} {"train_loss": -28.037607192993164, "global_step": 626463, "epoch": 7547} {"train_loss": -28.43690299987793, "global_step": 626464, "epoch": 7547} {"train_loss": -28.372222900390625, "global_step": 626465, "epoch": 7547} {"train_loss": -28.533079147338867, "global_step": 626466, "epoch": 7547} {"train_loss": -28.295841217041016, "global_step": 626467, "epoch": 7547} {"train_loss": -28.49029541015625, "global_step": 626468, "epoch": 7547} {"train_loss": -28.2336368560791, "global_step": 626469, "epoch": 7547} {"train_loss": -28.251306533813477, "global_step": 626470, "epoch": 7547} {"train_loss": -28.29005241394043, "global_step": 626471, "epoch": 7547} {"train_loss": -28.341272354125977, "global_step": 626472, "epoch": 7547} {"train_loss": -28.21722984313965, "global_step": 626473, "epoch": 7547} {"train_loss": -28.24273109436035, "global_step": 626474, "epoch": 7547} {"train_loss": -28.127105712890625, "global_step": 626475, "epoch": 7547} {"train_loss": -28.192340850830078, "global_step": 626476, "epoch": 7547} {"train_loss": -28.44781494140625, "global_step": 626477, "epoch": 7547} {"train_loss": -27.9135684967041, "global_step": 626478, "epoch": 7547} {"train_loss": -28.055978775024414, "global_step": 626479, "epoch": 7547} {"train_loss": -28.30415153503418, "global_step": 626480, "epoch": 7547} {"train_loss": -28.1008243560791, "global_step": 626481, "epoch": 7547} {"train_loss": -27.89912986755371, "global_step": 626482, "epoch": 7547} {"train_loss": -28.11888072002365, "global_step": 626483, "epoch": 7547, "val_loss": 6689288.0} {"train_loss": -27.542118072509766, "global_step": 626484, "epoch": 7548} {"train_loss": -26.970401763916016, "global_step": 626485, "epoch": 7548} {"train_loss": -27.474063873291016, "global_step": 626486, "epoch": 7548} {"train_loss": -27.448959350585938, "global_step": 626487, "epoch": 7548} {"train_loss": -27.371261596679688, "global_step": 626488, "epoch": 7548} {"train_loss": -27.323169708251953, "global_step": 626489, "epoch": 7548} {"train_loss": -27.658491134643555, "global_step": 626490, "epoch": 7548} {"train_loss": -27.373035430908203, "global_step": 626491, "epoch": 7548} {"train_loss": -27.97067642211914, "global_step": 626492, "epoch": 7548} {"train_loss": -27.418928146362305, "global_step": 626493, "epoch": 7548} {"train_loss": -27.528396606445312, "global_step": 626494, "epoch": 7548} {"train_loss": -27.891843795776367, "global_step": 626495, "epoch": 7548} {"train_loss": -27.700647354125977, "global_step": 626496, "epoch": 7548} {"train_loss": -28.0161075592041, "global_step": 626497, "epoch": 7548} {"train_loss": -27.767288208007812, "global_step": 626498, "epoch": 7548} {"train_loss": -28.122644424438477, "global_step": 626499, "epoch": 7548} {"train_loss": -27.571369171142578, "global_step": 626500, "epoch": 7548} {"train_loss": -28.057836532592773, "global_step": 626501, "epoch": 7548} {"train_loss": -27.98752212524414, "global_step": 626502, "epoch": 7548} {"train_loss": -27.887409210205078, "global_step": 626503, "epoch": 7548} {"train_loss": -27.969938278198242, "global_step": 626504, "epoch": 7548} {"train_loss": -28.280914306640625, "global_step": 626505, "epoch": 7548} {"train_loss": -27.908071517944336, "global_step": 626506, "epoch": 7548} {"train_loss": -27.877227783203125, "global_step": 626507, "epoch": 7548} {"train_loss": -27.933435440063477, "global_step": 626508, "epoch": 7548} {"train_loss": -28.10943031311035, "global_step": 626509, "epoch": 7548} {"train_loss": -28.187524795532227, "global_step": 626510, "epoch": 7548} {"train_loss": -28.35758399963379, "global_step": 626511, "epoch": 7548} {"train_loss": -28.07526969909668, "global_step": 626512, "epoch": 7548} {"train_loss": -28.11649513244629, "global_step": 626513, "epoch": 7548} {"train_loss": -28.349328994750977, "global_step": 626514, "epoch": 7548} {"train_loss": -28.369171142578125, "global_step": 626515, "epoch": 7548} {"train_loss": -28.13763999938965, "global_step": 626516, "epoch": 7548} {"train_loss": -28.005292892456055, "global_step": 626517, "epoch": 7548} {"train_loss": -28.091821670532227, "global_step": 626518, "epoch": 7548} {"train_loss": -28.48711585998535, "global_step": 626519, "epoch": 7548} {"train_loss": -28.178333282470703, "global_step": 626520, "epoch": 7548} {"train_loss": -27.870731353759766, "global_step": 626521, "epoch": 7548} {"train_loss": -28.269750595092773, "global_step": 626522, "epoch": 7548} {"train_loss": -27.99539566040039, "global_step": 626523, "epoch": 7548} {"train_loss": -28.30086326599121, "global_step": 626524, "epoch": 7548} {"train_loss": -28.45509147644043, "global_step": 626525, "epoch": 7548} {"train_loss": -28.298736572265625, "global_step": 626526, "epoch": 7548} {"train_loss": -28.26112174987793, "global_step": 626527, "epoch": 7548} {"train_loss": -28.292821884155273, "global_step": 626528, "epoch": 7548} {"train_loss": -27.918445587158203, "global_step": 626529, "epoch": 7548} {"train_loss": -28.180622100830078, "global_step": 626530, "epoch": 7548} {"train_loss": -28.385034561157227, "global_step": 626531, "epoch": 7548} {"train_loss": -28.353357315063477, "global_step": 626532, "epoch": 7548} {"train_loss": -28.638036727905273, "global_step": 626533, "epoch": 7548} {"train_loss": -28.51776695251465, "global_step": 626534, "epoch": 7548} {"train_loss": -28.495481491088867, "global_step": 626535, "epoch": 7548} {"train_loss": -28.207616806030273, "global_step": 626536, "epoch": 7548} {"train_loss": -28.294260025024414, "global_step": 626537, "epoch": 7548} {"train_loss": -28.26431655883789, "global_step": 626538, "epoch": 7548} {"train_loss": -28.272308349609375, "global_step": 626539, "epoch": 7548} {"train_loss": -27.942480087280273, "global_step": 626540, "epoch": 7548} {"train_loss": -28.28704261779785, "global_step": 626541, "epoch": 7548} {"train_loss": -28.104700088500977, "global_step": 626542, "epoch": 7548} {"train_loss": -28.463916778564453, "global_step": 626543, "epoch": 7548} {"train_loss": -28.238067626953125, "global_step": 626544, "epoch": 7548} {"train_loss": -28.420166015625, "global_step": 626545, "epoch": 7548} {"train_loss": -28.359546661376953, "global_step": 626546, "epoch": 7548} {"train_loss": -28.560245513916016, "global_step": 626547, "epoch": 7548} {"train_loss": -28.2723331451416, "global_step": 626548, "epoch": 7548} {"train_loss": -28.637094497680664, "global_step": 626549, "epoch": 7548} {"train_loss": -28.5040283203125, "global_step": 626550, "epoch": 7548} {"train_loss": -28.547216415405273, "global_step": 626551, "epoch": 7548} {"train_loss": -28.409101486206055, "global_step": 626552, "epoch": 7548} {"train_loss": -28.49489402770996, "global_step": 626553, "epoch": 7548} {"train_loss": -28.12483024597168, "global_step": 626554, "epoch": 7548} {"train_loss": -28.406965255737305, "global_step": 626555, "epoch": 7548} {"train_loss": -28.00507926940918, "global_step": 626556, "epoch": 7548} {"train_loss": -27.950101852416992, "global_step": 626557, "epoch": 7548} {"train_loss": -28.12556266784668, "global_step": 626558, "epoch": 7548} {"train_loss": -28.01739501953125, "global_step": 626559, "epoch": 7548} {"train_loss": -28.357614517211914, "global_step": 626560, "epoch": 7548} {"train_loss": -28.042896270751953, "global_step": 626561, "epoch": 7548} {"train_loss": -27.8068790435791, "global_step": 626562, "epoch": 7548} {"train_loss": -27.491296768188477, "global_step": 626563, "epoch": 7548} {"train_loss": -27.917129516601562, "global_step": 626564, "epoch": 7548} {"train_loss": -27.59503746032715, "global_step": 626565, "epoch": 7548} {"train_loss": -28.078304015010236, "global_step": 626566, "epoch": 7548, "val_loss": 6748875.0} {"train_loss": -27.546951293945312, "global_step": 626567, "epoch": 7549} {"train_loss": -26.928131103515625, "global_step": 626568, "epoch": 7549} {"train_loss": -26.001264572143555, "global_step": 626569, "epoch": 7549} {"train_loss": -27.2800235748291, "global_step": 626570, "epoch": 7549} {"train_loss": -27.691699981689453, "global_step": 626571, "epoch": 7549} {"train_loss": -27.547103881835938, "global_step": 626572, "epoch": 7549} {"train_loss": -27.345691680908203, "global_step": 626573, "epoch": 7549} {"train_loss": -27.640539169311523, "global_step": 626574, "epoch": 7549} {"train_loss": -27.882633209228516, "global_step": 626575, "epoch": 7549} {"train_loss": -27.937454223632812, "global_step": 626576, "epoch": 7549} {"train_loss": -27.862085342407227, "global_step": 626577, "epoch": 7549} {"train_loss": -27.733551025390625, "global_step": 626578, "epoch": 7549} {"train_loss": -27.657094955444336, "global_step": 626579, "epoch": 7549} {"train_loss": -28.20673179626465, "global_step": 626580, "epoch": 7549} {"train_loss": -27.667211532592773, "global_step": 626581, "epoch": 7549} {"train_loss": -27.933990478515625, "global_step": 626582, "epoch": 7549} {"train_loss": -27.85450553894043, "global_step": 626583, "epoch": 7549} {"train_loss": -27.802392959594727, "global_step": 626584, "epoch": 7549} {"train_loss": -27.887069702148438, "global_step": 626585, "epoch": 7549} {"train_loss": -27.8759708404541, "global_step": 626586, "epoch": 7549} {"train_loss": -28.19135093688965, "global_step": 626587, "epoch": 7549} {"train_loss": -27.7600154876709, "global_step": 626588, "epoch": 7549} {"train_loss": -28.198577880859375, "global_step": 626589, "epoch": 7549} {"train_loss": -28.06134033203125, "global_step": 626590, "epoch": 7549} {"train_loss": -27.285486221313477, "global_step": 626591, "epoch": 7549} {"train_loss": -27.43756675720215, "global_step": 626592, "epoch": 7549} {"train_loss": -28.195514678955078, "global_step": 626593, "epoch": 7549} {"train_loss": -27.495763778686523, "global_step": 626594, "epoch": 7549} {"train_loss": -27.935766220092773, "global_step": 626595, "epoch": 7549} {"train_loss": -27.833189010620117, "global_step": 626596, "epoch": 7549} {"train_loss": -27.885101318359375, "global_step": 626597, "epoch": 7549} {"train_loss": -27.896574020385742, "global_step": 626598, "epoch": 7549} {"train_loss": -27.754812240600586, "global_step": 626599, "epoch": 7549} {"train_loss": -27.787128448486328, "global_step": 626600, "epoch": 7549} {"train_loss": -28.03909683227539, "global_step": 626601, "epoch": 7549} {"train_loss": -28.15057373046875, "global_step": 626602, "epoch": 7549} {"train_loss": -28.289936065673828, "global_step": 626603, "epoch": 7549} {"train_loss": -28.496667861938477, "global_step": 626604, "epoch": 7549} {"train_loss": -27.64545249938965, "global_step": 626605, "epoch": 7549} {"train_loss": -28.347578048706055, "global_step": 626606, "epoch": 7549} {"train_loss": -27.966108322143555, "global_step": 626607, "epoch": 7549} {"train_loss": -27.858856201171875, "global_step": 626608, "epoch": 7549} {"train_loss": -28.154356002807617, "global_step": 626609, "epoch": 7549} {"train_loss": -28.643543243408203, "global_step": 626610, "epoch": 7549} {"train_loss": -28.17511558532715, "global_step": 626611, "epoch": 7549} {"train_loss": -28.44721794128418, "global_step": 626612, "epoch": 7549} {"train_loss": -28.347227096557617, "global_step": 626613, "epoch": 7549} {"train_loss": -28.414459228515625, "global_step": 626614, "epoch": 7549} {"train_loss": -28.176654815673828, "global_step": 626615, "epoch": 7549} {"train_loss": -28.484167098999023, "global_step": 626616, "epoch": 7549} {"train_loss": -28.617706298828125, "global_step": 626617, "epoch": 7549} {"train_loss": -28.393909454345703, "global_step": 626618, "epoch": 7549} {"train_loss": -28.468347549438477, "global_step": 626619, "epoch": 7549} {"train_loss": -28.143980026245117, "global_step": 626620, "epoch": 7549} {"train_loss": -28.1011905670166, "global_step": 626621, "epoch": 7549} {"train_loss": -28.3753604888916, "global_step": 626622, "epoch": 7549} {"train_loss": -28.436126708984375, "global_step": 626623, "epoch": 7549} {"train_loss": -28.33440589904785, "global_step": 626624, "epoch": 7549} {"train_loss": -28.468276977539062, "global_step": 626625, "epoch": 7549} {"train_loss": -28.075220108032227, "global_step": 626626, "epoch": 7549} {"train_loss": -28.241043090820312, "global_step": 626627, "epoch": 7549} {"train_loss": -28.084705352783203, "global_step": 626628, "epoch": 7549} {"train_loss": -27.68231201171875, "global_step": 626629, "epoch": 7549} {"train_loss": -27.462316513061523, "global_step": 626630, "epoch": 7549} {"train_loss": -27.401880264282227, "global_step": 626631, "epoch": 7549} {"train_loss": -28.0284366607666, "global_step": 626632, "epoch": 7549} {"train_loss": -27.960845947265625, "global_step": 626633, "epoch": 7549} {"train_loss": -28.02066421508789, "global_step": 626634, "epoch": 7549} {"train_loss": -28.188337326049805, "global_step": 626635, "epoch": 7549} {"train_loss": -28.027774810791016, "global_step": 626636, "epoch": 7549} {"train_loss": -28.606708526611328, "global_step": 626637, "epoch": 7549} {"train_loss": -28.538532257080078, "global_step": 626638, "epoch": 7549} {"train_loss": -28.313037872314453, "global_step": 626639, "epoch": 7549} {"train_loss": -28.476648330688477, "global_step": 626640, "epoch": 7549} {"train_loss": -28.222440719604492, "global_step": 626641, "epoch": 7549} {"train_loss": -28.4623966217041, "global_step": 626642, "epoch": 7549} {"train_loss": -28.11139488220215, "global_step": 626643, "epoch": 7549} {"train_loss": -28.44036865234375, "global_step": 626644, "epoch": 7549} {"train_loss": -27.888294219970703, "global_step": 626645, "epoch": 7549} {"train_loss": -27.94491958618164, "global_step": 626646, "epoch": 7549} {"train_loss": -27.9293155670166, "global_step": 626647, "epoch": 7549} {"train_loss": -28.013540267944336, "global_step": 626648, "epoch": 7549} {"train_loss": -27.97289117560329, "global_step": 626649, "epoch": 7549, "val_loss": 6731869.0} {"train_loss": -27.040555953979492, "global_step": 626650, "epoch": 7550} {"train_loss": -25.92145347595215, "global_step": 626651, "epoch": 7550} {"train_loss": -26.65862464904785, "global_step": 626652, "epoch": 7550} {"train_loss": -27.93165397644043, "global_step": 626653, "epoch": 7550} {"train_loss": -27.4881534576416, "global_step": 626654, "epoch": 7550} {"train_loss": -27.3391056060791, "global_step": 626655, "epoch": 7550} {"train_loss": -27.640573501586914, "global_step": 626656, "epoch": 7550} {"train_loss": -27.347705841064453, "global_step": 626657, "epoch": 7550} {"train_loss": -27.514699935913086, "global_step": 626658, "epoch": 7550} {"train_loss": -27.450544357299805, "global_step": 626659, "epoch": 7550} {"train_loss": -28.03678321838379, "global_step": 626660, "epoch": 7550} {"train_loss": -27.4833927154541, "global_step": 626661, "epoch": 7550} {"train_loss": -27.804275512695312, "global_step": 626662, "epoch": 7550} {"train_loss": -27.39947509765625, "global_step": 626663, "epoch": 7550} {"train_loss": -27.831045150756836, "global_step": 626664, "epoch": 7550} {"train_loss": -27.999664306640625, "global_step": 626665, "epoch": 7550} {"train_loss": -27.7092227935791, "global_step": 626666, "epoch": 7550} {"train_loss": -27.789844512939453, "global_step": 626667, "epoch": 7550} {"train_loss": -27.65645408630371, "global_step": 626668, "epoch": 7550} {"train_loss": -27.75872230529785, "global_step": 626669, "epoch": 7550} {"train_loss": -27.90632438659668, "global_step": 626670, "epoch": 7550} {"train_loss": -27.658447265625, "global_step": 626671, "epoch": 7550} {"train_loss": -28.073755264282227, "global_step": 626672, "epoch": 7550} {"train_loss": -28.1434268951416, "global_step": 626673, "epoch": 7550} {"train_loss": -28.10859489440918, "global_step": 626674, "epoch": 7550} {"train_loss": -28.135480880737305, "global_step": 626675, "epoch": 7550} {"train_loss": -27.864294052124023, "global_step": 626676, "epoch": 7550} {"train_loss": -28.1041259765625, "global_step": 626677, "epoch": 7550} {"train_loss": -28.308629989624023, "global_step": 626678, "epoch": 7550} {"train_loss": -27.94209861755371, "global_step": 626679, "epoch": 7550} {"train_loss": -28.03681755065918, "global_step": 626680, "epoch": 7550} {"train_loss": -28.263208389282227, "global_step": 626681, "epoch": 7550} {"train_loss": -28.070083618164062, "global_step": 626682, "epoch": 7550} {"train_loss": -28.18556785583496, "global_step": 626683, "epoch": 7550} {"train_loss": -28.162261962890625, "global_step": 626684, "epoch": 7550} {"train_loss": -28.1906681060791, "global_step": 626685, "epoch": 7550} {"train_loss": -28.132099151611328, "global_step": 626686, "epoch": 7550} {"train_loss": -27.943689346313477, "global_step": 626687, "epoch": 7550} {"train_loss": -28.106689453125, "global_step": 626688, "epoch": 7550} {"train_loss": -27.3504695892334, "global_step": 626689, "epoch": 7550} {"train_loss": -27.80817985534668, "global_step": 626690, "epoch": 7550} {"train_loss": -28.19209098815918, "global_step": 626691, "epoch": 7550} {"train_loss": -28.30731201171875, "global_step": 626692, "epoch": 7550} {"train_loss": -28.256067276000977, "global_step": 626693, "epoch": 7550} {"train_loss": -28.31155776977539, "global_step": 626694, "epoch": 7550} {"train_loss": -28.19318199157715, "global_step": 626695, "epoch": 7550} {"train_loss": -28.343387603759766, "global_step": 626696, "epoch": 7550} {"train_loss": -28.234729766845703, "global_step": 626697, "epoch": 7550} {"train_loss": -28.345373153686523, "global_step": 626698, "epoch": 7550} {"train_loss": -28.3265323638916, "global_step": 626699, "epoch": 7550} {"train_loss": -28.487165451049805, "global_step": 626700, "epoch": 7550} {"train_loss": -28.454086303710938, "global_step": 626701, "epoch": 7550} {"train_loss": -28.517431259155273, "global_step": 626702, "epoch": 7550} {"train_loss": -28.52252197265625, "global_step": 626703, "epoch": 7550} {"train_loss": -28.53922462463379, "global_step": 626704, "epoch": 7550} {"train_loss": -28.5743408203125, "global_step": 626705, "epoch": 7550} {"train_loss": -28.697290420532227, "global_step": 626706, "epoch": 7550} {"train_loss": -28.46880531311035, "global_step": 626707, "epoch": 7550} {"train_loss": -28.2957763671875, "global_step": 626708, "epoch": 7550} {"train_loss": -28.468994140625, "global_step": 626709, "epoch": 7550} {"train_loss": -28.464984893798828, "global_step": 626710, "epoch": 7550} {"train_loss": -28.341333389282227, "global_step": 626711, "epoch": 7550} {"train_loss": -28.377674102783203, "global_step": 626712, "epoch": 7550} {"train_loss": -28.51409912109375, "global_step": 626713, "epoch": 7550} {"train_loss": -28.02497673034668, "global_step": 626714, "epoch": 7550} {"train_loss": -27.8870906829834, "global_step": 626715, "epoch": 7550} {"train_loss": -28.29668617248535, "global_step": 626716, "epoch": 7550} {"train_loss": -28.360126495361328, "global_step": 626717, "epoch": 7550} {"train_loss": -28.120779037475586, "global_step": 626718, "epoch": 7550} {"train_loss": -28.5367374420166, "global_step": 626719, "epoch": 7550} {"train_loss": -28.245092391967773, "global_step": 626720, "epoch": 7550} {"train_loss": -27.936330795288086, "global_step": 626721, "epoch": 7550} {"train_loss": -27.379480361938477, "global_step": 626722, "epoch": 7550} {"train_loss": -27.727930068969727, "global_step": 626723, "epoch": 7550} {"train_loss": -28.456207275390625, "global_step": 626724, "epoch": 7550} {"train_loss": -28.10163688659668, "global_step": 626725, "epoch": 7550} {"train_loss": -27.65644645690918, "global_step": 626726, "epoch": 7550} {"train_loss": -27.35504150390625, "global_step": 626727, "epoch": 7550} {"train_loss": -27.817386627197266, "global_step": 626728, "epoch": 7550} {"train_loss": -28.284168243408203, "global_step": 626729, "epoch": 7550} {"train_loss": -27.667688369750977, "global_step": 626730, "epoch": 7550} {"train_loss": -27.958295822143555, "global_step": 626731, "epoch": 7550} {"train_loss": -27.997718006731517, "global_step": 626732, "epoch": 7550, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 0.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.7727272727272727, "val_loss": 6747783.0} {"train_loss": -27.713293075561523, "global_step": 626733, "epoch": 7551} {"train_loss": -27.15871238708496, "global_step": 626734, "epoch": 7551} {"train_loss": -27.39451026916504, "global_step": 626735, "epoch": 7551} {"train_loss": -27.31863784790039, "global_step": 626736, "epoch": 7551} {"train_loss": -27.45499038696289, "global_step": 626737, "epoch": 7551} {"train_loss": -27.71022605895996, "global_step": 626738, "epoch": 7551} {"train_loss": -27.514957427978516, "global_step": 626739, "epoch": 7551} {"train_loss": -27.709335327148438, "global_step": 626740, "epoch": 7551} {"train_loss": -27.302967071533203, "global_step": 626741, "epoch": 7551} {"train_loss": -27.80405044555664, "global_step": 626742, "epoch": 7551} {"train_loss": -27.55524253845215, "global_step": 626743, "epoch": 7551} {"train_loss": -27.487829208374023, "global_step": 626744, "epoch": 7551} {"train_loss": -27.268909454345703, "global_step": 626745, "epoch": 7551} {"train_loss": -27.925048828125, "global_step": 626746, "epoch": 7551} {"train_loss": -27.77520751953125, "global_step": 626747, "epoch": 7551} {"train_loss": -28.044336318969727, "global_step": 626748, "epoch": 7551} {"train_loss": -28.090330123901367, "global_step": 626749, "epoch": 7551} {"train_loss": -27.686676025390625, "global_step": 626750, "epoch": 7551} {"train_loss": -27.827688217163086, "global_step": 626751, "epoch": 7551} {"train_loss": -27.668867111206055, "global_step": 626752, "epoch": 7551} {"train_loss": -27.57208251953125, "global_step": 626753, "epoch": 7551} {"train_loss": -27.798282623291016, "global_step": 626754, "epoch": 7551} {"train_loss": -27.560888290405273, "global_step": 626755, "epoch": 7551} {"train_loss": -27.347742080688477, "global_step": 626756, "epoch": 7551} {"train_loss": -27.709012985229492, "global_step": 626757, "epoch": 7551} {"train_loss": -28.220508575439453, "global_step": 626758, "epoch": 7551} {"train_loss": -27.961679458618164, "global_step": 626759, "epoch": 7551} {"train_loss": -27.885751724243164, "global_step": 626760, "epoch": 7551} {"train_loss": -28.144224166870117, "global_step": 626761, "epoch": 7551} {"train_loss": -28.04900550842285, "global_step": 626762, "epoch": 7551} {"train_loss": -27.7130069732666, "global_step": 626763, "epoch": 7551} {"train_loss": -28.0878849029541, "global_step": 626764, "epoch": 7551} {"train_loss": -27.71697425842285, "global_step": 626765, "epoch": 7551} {"train_loss": -28.02608299255371, "global_step": 626766, "epoch": 7551} {"train_loss": -28.108179092407227, "global_step": 626767, "epoch": 7551} {"train_loss": -28.098215103149414, "global_step": 626768, "epoch": 7551} {"train_loss": -28.100324630737305, "global_step": 626769, "epoch": 7551} {"train_loss": -28.33770751953125, "global_step": 626770, "epoch": 7551} {"train_loss": -28.366504669189453, "global_step": 626771, "epoch": 7551} {"train_loss": -28.2701416015625, "global_step": 626772, "epoch": 7551} {"train_loss": -28.231393814086914, "global_step": 626773, "epoch": 7551} {"train_loss": -28.413578033447266, "global_step": 626774, "epoch": 7551} {"train_loss": -28.055601119995117, "global_step": 626775, "epoch": 7551} {"train_loss": -28.15509605407715, "global_step": 626776, "epoch": 7551} {"train_loss": -27.9781494140625, "global_step": 626777, "epoch": 7551} {"train_loss": -28.11994743347168, "global_step": 626778, "epoch": 7551} {"train_loss": -28.08997917175293, "global_step": 626779, "epoch": 7551} {"train_loss": -28.11604118347168, "global_step": 626780, "epoch": 7551} {"train_loss": -27.943777084350586, "global_step": 626781, "epoch": 7551} {"train_loss": -28.247167587280273, "global_step": 626782, "epoch": 7551} {"train_loss": -28.01810646057129, "global_step": 626783, "epoch": 7551} {"train_loss": -27.829620361328125, "global_step": 626784, "epoch": 7551} {"train_loss": -28.007688522338867, "global_step": 626785, "epoch": 7551} {"train_loss": -28.1689453125, "global_step": 626786, "epoch": 7551} {"train_loss": -28.219039916992188, "global_step": 626787, "epoch": 7551} {"train_loss": -28.614843368530273, "global_step": 626788, "epoch": 7551} {"train_loss": -28.564849853515625, "global_step": 626789, "epoch": 7551} {"train_loss": -28.255674362182617, "global_step": 626790, "epoch": 7551} {"train_loss": -28.006927490234375, "global_step": 626791, "epoch": 7551} {"train_loss": -28.56217384338379, "global_step": 626792, "epoch": 7551} {"train_loss": -28.31571388244629, "global_step": 626793, "epoch": 7551} {"train_loss": -28.447824478149414, "global_step": 626794, "epoch": 7551} {"train_loss": -28.413909912109375, "global_step": 626795, "epoch": 7551} {"train_loss": -28.342029571533203, "global_step": 626796, "epoch": 7551} {"train_loss": -28.497257232666016, "global_step": 626797, "epoch": 7551} {"train_loss": -28.204694747924805, "global_step": 626798, "epoch": 7551} {"train_loss": -28.341123580932617, "global_step": 626799, "epoch": 7551} {"train_loss": -28.266845703125, "global_step": 626800, "epoch": 7551} {"train_loss": -28.21343421936035, "global_step": 626801, "epoch": 7551} {"train_loss": -28.544981002807617, "global_step": 626802, "epoch": 7551} {"train_loss": -28.06329345703125, "global_step": 626803, "epoch": 7551} {"train_loss": -28.407703399658203, "global_step": 626804, "epoch": 7551} {"train_loss": -28.253143310546875, "global_step": 626805, "epoch": 7551} {"train_loss": -28.253271102905273, "global_step": 626806, "epoch": 7551} {"train_loss": -28.059646606445312, "global_step": 626807, "epoch": 7551} {"train_loss": -28.250492095947266, "global_step": 626808, "epoch": 7551} {"train_loss": -27.864582061767578, "global_step": 626809, "epoch": 7551} {"train_loss": -27.038028717041016, "global_step": 626810, "epoch": 7551} {"train_loss": -26.951231002807617, "global_step": 626811, "epoch": 7551} {"train_loss": -26.975019454956055, "global_step": 626812, "epoch": 7551} {"train_loss": -27.562585830688477, "global_step": 626813, "epoch": 7551} {"train_loss": -28.266651153564453, "global_step": 626814, "epoch": 7551} {"train_loss": -27.938774200807135, "global_step": 626815, "epoch": 7551, "val_loss": 6771928.0} {"train_loss": -26.74207878112793, "global_step": 626816, "epoch": 7552} {"train_loss": -25.126087188720703, "global_step": 626817, "epoch": 7552} {"train_loss": -27.183679580688477, "global_step": 626818, "epoch": 7552} {"train_loss": -27.050617218017578, "global_step": 626819, "epoch": 7552} {"train_loss": -27.133316040039062, "global_step": 626820, "epoch": 7552} {"train_loss": -27.0090274810791, "global_step": 626821, "epoch": 7552} {"train_loss": -27.543354034423828, "global_step": 626822, "epoch": 7552} {"train_loss": -27.4089412689209, "global_step": 626823, "epoch": 7552} {"train_loss": -27.18720054626465, "global_step": 626824, "epoch": 7552} {"train_loss": -27.66574478149414, "global_step": 626825, "epoch": 7552} {"train_loss": -27.51690101623535, "global_step": 626826, "epoch": 7552} {"train_loss": -27.563495635986328, "global_step": 626827, "epoch": 7552} {"train_loss": -27.552204132080078, "global_step": 626828, "epoch": 7552} {"train_loss": -27.472578048706055, "global_step": 626829, "epoch": 7552} {"train_loss": -27.549854278564453, "global_step": 626830, "epoch": 7552} {"train_loss": -27.500812530517578, "global_step": 626831, "epoch": 7552} {"train_loss": -27.656896591186523, "global_step": 626832, "epoch": 7552} {"train_loss": -27.6656436920166, "global_step": 626833, "epoch": 7552} {"train_loss": -27.449514389038086, "global_step": 626834, "epoch": 7552} {"train_loss": -28.115478515625, "global_step": 626835, "epoch": 7552} {"train_loss": -27.564685821533203, "global_step": 626836, "epoch": 7552} {"train_loss": -27.791122436523438, "global_step": 626837, "epoch": 7552} {"train_loss": -27.613916397094727, "global_step": 626838, "epoch": 7552} {"train_loss": -27.728988647460938, "global_step": 626839, "epoch": 7552} {"train_loss": -27.794952392578125, "global_step": 626840, "epoch": 7552} {"train_loss": -28.218250274658203, "global_step": 626841, "epoch": 7552} {"train_loss": -27.2652587890625, "global_step": 626842, "epoch": 7552} {"train_loss": -27.82313346862793, "global_step": 626843, "epoch": 7552} {"train_loss": -27.374921798706055, "global_step": 626844, "epoch": 7552} {"train_loss": -27.71844482421875, "global_step": 626845, "epoch": 7552} {"train_loss": -28.114660263061523, "global_step": 626846, "epoch": 7552} {"train_loss": -28.157201766967773, "global_step": 626847, "epoch": 7552} {"train_loss": -28.187536239624023, "global_step": 626848, "epoch": 7552} {"train_loss": -27.917404174804688, "global_step": 626849, "epoch": 7552} {"train_loss": -28.28464698791504, "global_step": 626850, "epoch": 7552} {"train_loss": -28.262958526611328, "global_step": 626851, "epoch": 7552} {"train_loss": -28.133228302001953, "global_step": 626852, "epoch": 7552} {"train_loss": -27.969511032104492, "global_step": 626853, "epoch": 7552} {"train_loss": -28.3610782623291, "global_step": 626854, "epoch": 7552} {"train_loss": -27.960580825805664, "global_step": 626855, "epoch": 7552} {"train_loss": -28.19846534729004, "global_step": 626856, "epoch": 7552} {"train_loss": -28.244726181030273, "global_step": 626857, "epoch": 7552} {"train_loss": -28.060455322265625, "global_step": 626858, "epoch": 7552} {"train_loss": -28.03506851196289, "global_step": 626859, "epoch": 7552} {"train_loss": -28.269733428955078, "global_step": 626860, "epoch": 7552} {"train_loss": -28.366846084594727, "global_step": 626861, "epoch": 7552} {"train_loss": -28.310474395751953, "global_step": 626862, "epoch": 7552} {"train_loss": -28.398670196533203, "global_step": 626863, "epoch": 7552} {"train_loss": -28.206567764282227, "global_step": 626864, "epoch": 7552} {"train_loss": -28.44607925415039, "global_step": 626865, "epoch": 7552} {"train_loss": -28.179798126220703, "global_step": 626866, "epoch": 7552} {"train_loss": -27.9587459564209, "global_step": 626867, "epoch": 7552} {"train_loss": -28.36728858947754, "global_step": 626868, "epoch": 7552} {"train_loss": -28.352872848510742, "global_step": 626869, "epoch": 7552} {"train_loss": -28.52194595336914, "global_step": 626870, "epoch": 7552} {"train_loss": -28.533096313476562, "global_step": 626871, "epoch": 7552} {"train_loss": -28.61386489868164, "global_step": 626872, "epoch": 7552} {"train_loss": -28.27557373046875, "global_step": 626873, "epoch": 7552} {"train_loss": -28.527008056640625, "global_step": 626874, "epoch": 7552} {"train_loss": -28.532087326049805, "global_step": 626875, "epoch": 7552} {"train_loss": -28.3912410736084, "global_step": 626876, "epoch": 7552} {"train_loss": -28.278247833251953, "global_step": 626877, "epoch": 7552} {"train_loss": -28.17718505859375, "global_step": 626878, "epoch": 7552} {"train_loss": -28.103540420532227, "global_step": 626879, "epoch": 7552} {"train_loss": -28.157623291015625, "global_step": 626880, "epoch": 7552} {"train_loss": -27.984710693359375, "global_step": 626881, "epoch": 7552} {"train_loss": -28.289587020874023, "global_step": 626882, "epoch": 7552} {"train_loss": -28.347204208374023, "global_step": 626883, "epoch": 7552} {"train_loss": -28.294641494750977, "global_step": 626884, "epoch": 7552} {"train_loss": -28.168439865112305, "global_step": 626885, "epoch": 7552} {"train_loss": -28.5316104888916, "global_step": 626886, "epoch": 7552} {"train_loss": -28.591781616210938, "global_step": 626887, "epoch": 7552} {"train_loss": -28.42865562438965, "global_step": 626888, "epoch": 7552} {"train_loss": -28.214691162109375, "global_step": 626889, "epoch": 7552} {"train_loss": -28.536212921142578, "global_step": 626890, "epoch": 7552} {"train_loss": -28.019306182861328, "global_step": 626891, "epoch": 7552} {"train_loss": -28.563520431518555, "global_step": 626892, "epoch": 7552} {"train_loss": -28.47771644592285, "global_step": 626893, "epoch": 7552} {"train_loss": -28.0251522064209, "global_step": 626894, "epoch": 7552} {"train_loss": -27.947086334228516, "global_step": 626895, "epoch": 7552} {"train_loss": -27.572317123413086, "global_step": 626896, "epoch": 7552} {"train_loss": -27.885971069335938, "global_step": 626897, "epoch": 7552} {"train_loss": -27.94508348028344, "global_step": 626898, "epoch": 7552, "val_loss": 6756278.0} {"train_loss": -26.952802658081055, "global_step": 626899, "epoch": 7553} {"train_loss": -27.15240478515625, "global_step": 626900, "epoch": 7553} {"train_loss": -27.02535057067871, "global_step": 626901, "epoch": 7553} {"train_loss": -27.566823959350586, "global_step": 626902, "epoch": 7553} {"train_loss": -27.991918563842773, "global_step": 626903, "epoch": 7553} {"train_loss": -27.172882080078125, "global_step": 626904, "epoch": 7553} {"train_loss": -27.7772159576416, "global_step": 626905, "epoch": 7553} {"train_loss": -27.476572036743164, "global_step": 626906, "epoch": 7553} {"train_loss": -27.491230010986328, "global_step": 626907, "epoch": 7553} {"train_loss": -27.573850631713867, "global_step": 626908, "epoch": 7553} {"train_loss": -27.8764591217041, "global_step": 626909, "epoch": 7553} {"train_loss": -28.190780639648438, "global_step": 626910, "epoch": 7553} {"train_loss": -27.687122344970703, "global_step": 626911, "epoch": 7553} {"train_loss": -27.772205352783203, "global_step": 626912, "epoch": 7553} {"train_loss": -27.863088607788086, "global_step": 626913, "epoch": 7553} {"train_loss": -27.724445343017578, "global_step": 626914, "epoch": 7553} {"train_loss": -27.935895919799805, "global_step": 626915, "epoch": 7553} {"train_loss": -27.949193954467773, "global_step": 626916, "epoch": 7553} {"train_loss": -27.795917510986328, "global_step": 626917, "epoch": 7553} {"train_loss": -27.992938995361328, "global_step": 626918, "epoch": 7553} {"train_loss": -28.07099723815918, "global_step": 626919, "epoch": 7553} {"train_loss": -27.857192993164062, "global_step": 626920, "epoch": 7553} {"train_loss": -28.055042266845703, "global_step": 626921, "epoch": 7553} {"train_loss": -28.41792106628418, "global_step": 626922, "epoch": 7553} {"train_loss": -28.194059371948242, "global_step": 626923, "epoch": 7553} {"train_loss": -28.016077041625977, "global_step": 626924, "epoch": 7553} {"train_loss": -27.953399658203125, "global_step": 626925, "epoch": 7553} {"train_loss": -28.153196334838867, "global_step": 626926, "epoch": 7553} {"train_loss": -27.991718292236328, "global_step": 626927, "epoch": 7553} {"train_loss": -28.43206787109375, "global_step": 626928, "epoch": 7553} {"train_loss": -28.03632164001465, "global_step": 626929, "epoch": 7553} {"train_loss": -28.377460479736328, "global_step": 626930, "epoch": 7553} {"train_loss": -27.840967178344727, "global_step": 626931, "epoch": 7553} {"train_loss": -28.06791114807129, "global_step": 626932, "epoch": 7553} {"train_loss": -28.536102294921875, "global_step": 626933, "epoch": 7553} {"train_loss": -27.78553581237793, "global_step": 626934, "epoch": 7553} {"train_loss": -28.472400665283203, "global_step": 626935, "epoch": 7553} {"train_loss": -28.09516716003418, "global_step": 626936, "epoch": 7553} {"train_loss": -28.20920753479004, "global_step": 626937, "epoch": 7553} {"train_loss": -28.618518829345703, "global_step": 626938, "epoch": 7553} {"train_loss": -28.220458984375, "global_step": 626939, "epoch": 7553} {"train_loss": -28.527631759643555, "global_step": 626940, "epoch": 7553} {"train_loss": -28.222761154174805, "global_step": 626941, "epoch": 7553} {"train_loss": -28.189847946166992, "global_step": 626942, "epoch": 7553} {"train_loss": -28.31266212463379, "global_step": 626943, "epoch": 7553} {"train_loss": -28.081024169921875, "global_step": 626944, "epoch": 7553} {"train_loss": -28.505889892578125, "global_step": 626945, "epoch": 7553} {"train_loss": -28.175018310546875, "global_step": 626946, "epoch": 7553} {"train_loss": -28.5466365814209, "global_step": 626947, "epoch": 7553} {"train_loss": -28.7292537689209, "global_step": 626948, "epoch": 7553} {"train_loss": -28.378774642944336, "global_step": 626949, "epoch": 7553} {"train_loss": -28.500837326049805, "global_step": 626950, "epoch": 7553} {"train_loss": -28.312137603759766, "global_step": 626951, "epoch": 7553} {"train_loss": -28.71710205078125, "global_step": 626952, "epoch": 7553} {"train_loss": -28.485376358032227, "global_step": 626953, "epoch": 7553} {"train_loss": -28.110754013061523, "global_step": 626954, "epoch": 7553} {"train_loss": -28.677717208862305, "global_step": 626955, "epoch": 7553} {"train_loss": -28.530431747436523, "global_step": 626956, "epoch": 7553} {"train_loss": -28.314212799072266, "global_step": 626957, "epoch": 7553} {"train_loss": -28.268171310424805, "global_step": 626958, "epoch": 7553} {"train_loss": -28.345685958862305, "global_step": 626959, "epoch": 7553} {"train_loss": -28.10097312927246, "global_step": 626960, "epoch": 7553} {"train_loss": -28.610706329345703, "global_step": 626961, "epoch": 7553} {"train_loss": -28.307050704956055, "global_step": 626962, "epoch": 7553} {"train_loss": -27.932865142822266, "global_step": 626963, "epoch": 7553} {"train_loss": -27.771589279174805, "global_step": 626964, "epoch": 7553} {"train_loss": -27.089176177978516, "global_step": 626965, "epoch": 7553} {"train_loss": -25.606298446655273, "global_step": 626966, "epoch": 7553} {"train_loss": -27.15386390686035, "global_step": 626967, "epoch": 7553} {"train_loss": -27.206806182861328, "global_step": 626968, "epoch": 7553} {"train_loss": -26.646677017211914, "global_step": 626969, "epoch": 7553} {"train_loss": -27.220905303955078, "global_step": 626970, "epoch": 7553} {"train_loss": -26.852689743041992, "global_step": 626971, "epoch": 7553} {"train_loss": -27.72418785095215, "global_step": 626972, "epoch": 7553} {"train_loss": -26.846729278564453, "global_step": 626973, "epoch": 7553} {"train_loss": -27.757287979125977, "global_step": 626974, "epoch": 7553} {"train_loss": -27.602706909179688, "global_step": 626975, "epoch": 7553} {"train_loss": -27.581588745117188, "global_step": 626976, "epoch": 7553} {"train_loss": -27.99759292602539, "global_step": 626977, "epoch": 7553} {"train_loss": -27.378629684448242, "global_step": 626978, "epoch": 7553} {"train_loss": -27.308813095092773, "global_step": 626979, "epoch": 7553} {"train_loss": -28.070592880249023, "global_step": 626980, "epoch": 7553} {"train_loss": -27.927354031298535, "global_step": 626981, "epoch": 7553, "val_loss": 6735970.0} {"train_loss": -26.446645736694336, "global_step": 626982, "epoch": 7554} {"train_loss": -27.285566329956055, "global_step": 626983, "epoch": 7554} {"train_loss": -26.993322372436523, "global_step": 626984, "epoch": 7554} {"train_loss": -27.005613327026367, "global_step": 626985, "epoch": 7554} {"train_loss": -26.766311645507812, "global_step": 626986, "epoch": 7554} {"train_loss": -27.29779624938965, "global_step": 626987, "epoch": 7554} {"train_loss": -27.171701431274414, "global_step": 626988, "epoch": 7554} {"train_loss": -27.175779342651367, "global_step": 626989, "epoch": 7554} {"train_loss": -27.501220703125, "global_step": 626990, "epoch": 7554} {"train_loss": -27.333404541015625, "global_step": 626991, "epoch": 7554} {"train_loss": -27.37626075744629, "global_step": 626992, "epoch": 7554} {"train_loss": -27.341543197631836, "global_step": 626993, "epoch": 7554} {"train_loss": -27.71229362487793, "global_step": 626994, "epoch": 7554} {"train_loss": -27.610889434814453, "global_step": 626995, "epoch": 7554} {"train_loss": -27.27243995666504, "global_step": 626996, "epoch": 7554} {"train_loss": -27.59956169128418, "global_step": 626997, "epoch": 7554} {"train_loss": -27.61882972717285, "global_step": 626998, "epoch": 7554} {"train_loss": -27.44178581237793, "global_step": 626999, "epoch": 7554} {"train_loss": -27.77142333984375, "global_step": 627000, "epoch": 7554} {"train_loss": -27.854578018188477, "global_step": 627001, "epoch": 7554} {"train_loss": -27.93116569519043, "global_step": 627002, "epoch": 7554} {"train_loss": -28.133991241455078, "global_step": 627003, "epoch": 7554} {"train_loss": -27.931427001953125, "global_step": 627004, "epoch": 7554} {"train_loss": -27.998579025268555, "global_step": 627005, "epoch": 7554} {"train_loss": -27.821456909179688, "global_step": 627006, "epoch": 7554} {"train_loss": -27.8361873626709, "global_step": 627007, "epoch": 7554} {"train_loss": -27.833118438720703, "global_step": 627008, "epoch": 7554} {"train_loss": -28.085302352905273, "global_step": 627009, "epoch": 7554} {"train_loss": -27.956777572631836, "global_step": 627010, "epoch": 7554} {"train_loss": -27.962646484375, "global_step": 627011, "epoch": 7554} {"train_loss": -27.868671417236328, "global_step": 627012, "epoch": 7554} {"train_loss": -28.082828521728516, "global_step": 627013, "epoch": 7554} {"train_loss": -28.230573654174805, "global_step": 627014, "epoch": 7554} {"train_loss": -28.01362419128418, "global_step": 627015, "epoch": 7554} {"train_loss": -28.02719497680664, "global_step": 627016, "epoch": 7554} {"train_loss": -28.182077407836914, "global_step": 627017, "epoch": 7554} {"train_loss": -28.4689884185791, "global_step": 627018, "epoch": 7554} {"train_loss": -28.36455726623535, "global_step": 627019, "epoch": 7554} {"train_loss": -27.869352340698242, "global_step": 627020, "epoch": 7554} {"train_loss": -28.2235107421875, "global_step": 627021, "epoch": 7554} {"train_loss": -28.352033615112305, "global_step": 627022, "epoch": 7554} {"train_loss": -27.960973739624023, "global_step": 627023, "epoch": 7554} {"train_loss": -28.003320693969727, "global_step": 627024, "epoch": 7554} {"train_loss": -28.1516170501709, "global_step": 627025, "epoch": 7554} {"train_loss": -28.175983428955078, "global_step": 627026, "epoch": 7554} {"train_loss": -28.25144386291504, "global_step": 627027, "epoch": 7554} {"train_loss": -28.45142936706543, "global_step": 627028, "epoch": 7554} {"train_loss": -28.083927154541016, "global_step": 627029, "epoch": 7554} {"train_loss": -28.53765296936035, "global_step": 627030, "epoch": 7554} {"train_loss": -28.411794662475586, "global_step": 627031, "epoch": 7554} {"train_loss": -28.472192764282227, "global_step": 627032, "epoch": 7554} {"train_loss": -28.241668701171875, "global_step": 627033, "epoch": 7554} {"train_loss": -27.943708419799805, "global_step": 627034, "epoch": 7554} {"train_loss": -27.84451675415039, "global_step": 627035, "epoch": 7554} {"train_loss": -28.216552734375, "global_step": 627036, "epoch": 7554} {"train_loss": -28.52589225769043, "global_step": 627037, "epoch": 7554} {"train_loss": -28.163034439086914, "global_step": 627038, "epoch": 7554} {"train_loss": -28.31507682800293, "global_step": 627039, "epoch": 7554} {"train_loss": -28.429523468017578, "global_step": 627040, "epoch": 7554} {"train_loss": -28.214319229125977, "global_step": 627041, "epoch": 7554} {"train_loss": -28.190414428710938, "global_step": 627042, "epoch": 7554} {"train_loss": -28.029829025268555, "global_step": 627043, "epoch": 7554} {"train_loss": -28.2786922454834, "global_step": 627044, "epoch": 7554} {"train_loss": -28.135950088500977, "global_step": 627045, "epoch": 7554} {"train_loss": -28.624622344970703, "global_step": 627046, "epoch": 7554} {"train_loss": -28.029775619506836, "global_step": 627047, "epoch": 7554} {"train_loss": -27.927814483642578, "global_step": 627048, "epoch": 7554} {"train_loss": -27.453887939453125, "global_step": 627049, "epoch": 7554} {"train_loss": -28.138818740844727, "global_step": 627050, "epoch": 7554} {"train_loss": -28.15480613708496, "global_step": 627051, "epoch": 7554} {"train_loss": -28.00966453552246, "global_step": 627052, "epoch": 7554} {"train_loss": -28.185224533081055, "global_step": 627053, "epoch": 7554} {"train_loss": -27.605579376220703, "global_step": 627054, "epoch": 7554} {"train_loss": -28.19556999206543, "global_step": 627055, "epoch": 7554} {"train_loss": -28.110595703125, "global_step": 627056, "epoch": 7554} {"train_loss": -28.488698959350586, "global_step": 627057, "epoch": 7554} {"train_loss": -27.98866081237793, "global_step": 627058, "epoch": 7554} {"train_loss": -28.544815063476562, "global_step": 627059, "epoch": 7554} {"train_loss": -28.284788131713867, "global_step": 627060, "epoch": 7554} {"train_loss": -28.169469833374023, "global_step": 627061, "epoch": 7554} {"train_loss": -28.075490951538086, "global_step": 627062, "epoch": 7554} {"train_loss": -28.111236572265625, "global_step": 627063, "epoch": 7554} {"train_loss": -27.964407702526415, "global_step": 627064, "epoch": 7554, "val_loss": 6666581.0} {"train_loss": -26.731653213500977, "global_step": 627065, "epoch": 7555} {"train_loss": -26.157012939453125, "global_step": 627066, "epoch": 7555} {"train_loss": -27.379491806030273, "global_step": 627067, "epoch": 7555} {"train_loss": -27.89290428161621, "global_step": 627068, "epoch": 7555} {"train_loss": -27.416290283203125, "global_step": 627069, "epoch": 7555} {"train_loss": -27.557836532592773, "global_step": 627070, "epoch": 7555} {"train_loss": -27.805805206298828, "global_step": 627071, "epoch": 7555} {"train_loss": -28.09705924987793, "global_step": 627072, "epoch": 7555} {"train_loss": -27.74940299987793, "global_step": 627073, "epoch": 7555} {"train_loss": -27.987354278564453, "global_step": 627074, "epoch": 7555} {"train_loss": -27.669828414916992, "global_step": 627075, "epoch": 7555} {"train_loss": -28.096731185913086, "global_step": 627076, "epoch": 7555} {"train_loss": -27.726490020751953, "global_step": 627077, "epoch": 7555} {"train_loss": -27.786117553710938, "global_step": 627078, "epoch": 7555} {"train_loss": -27.980260848999023, "global_step": 627079, "epoch": 7555} {"train_loss": -28.03302574157715, "global_step": 627080, "epoch": 7555} {"train_loss": -27.85921287536621, "global_step": 627081, "epoch": 7555} {"train_loss": -27.9150390625, "global_step": 627082, "epoch": 7555} {"train_loss": -28.0939884185791, "global_step": 627083, "epoch": 7555} {"train_loss": -28.21522331237793, "global_step": 627084, "epoch": 7555} {"train_loss": -28.132665634155273, "global_step": 627085, "epoch": 7555} {"train_loss": -28.186359405517578, "global_step": 627086, "epoch": 7555} {"train_loss": -27.54436683654785, "global_step": 627087, "epoch": 7555} {"train_loss": -27.686798095703125, "global_step": 627088, "epoch": 7555} {"train_loss": -27.809133529663086, "global_step": 627089, "epoch": 7555} {"train_loss": -27.83856773376465, "global_step": 627090, "epoch": 7555} {"train_loss": -27.963510513305664, "global_step": 627091, "epoch": 7555} {"train_loss": -28.371557235717773, "global_step": 627092, "epoch": 7555} {"train_loss": -28.67612648010254, "global_step": 627093, "epoch": 7555} {"train_loss": -28.316335678100586, "global_step": 627094, "epoch": 7555} {"train_loss": -28.5040225982666, "global_step": 627095, "epoch": 7555} {"train_loss": -28.133459091186523, "global_step": 627096, "epoch": 7555} {"train_loss": -28.08662986755371, "global_step": 627097, "epoch": 7555} {"train_loss": -28.168725967407227, "global_step": 627098, "epoch": 7555} {"train_loss": -28.07118034362793, "global_step": 627099, "epoch": 7555} {"train_loss": -27.8948974609375, "global_step": 627100, "epoch": 7555} {"train_loss": -28.3096923828125, "global_step": 627101, "epoch": 7555} {"train_loss": -28.51997947692871, "global_step": 627102, "epoch": 7555} {"train_loss": -28.33965492248535, "global_step": 627103, "epoch": 7555} {"train_loss": -28.10267448425293, "global_step": 627104, "epoch": 7555} {"train_loss": -27.960859298706055, "global_step": 627105, "epoch": 7555} {"train_loss": -28.4012508392334, "global_step": 627106, "epoch": 7555} {"train_loss": -28.080799102783203, "global_step": 627107, "epoch": 7555} {"train_loss": -28.315786361694336, "global_step": 627108, "epoch": 7555} {"train_loss": -28.122495651245117, "global_step": 627109, "epoch": 7555} {"train_loss": -28.404138565063477, "global_step": 627110, "epoch": 7555} {"train_loss": -28.149688720703125, "global_step": 627111, "epoch": 7555} {"train_loss": -28.309589385986328, "global_step": 627112, "epoch": 7555} {"train_loss": -28.3112735748291, "global_step": 627113, "epoch": 7555} {"train_loss": -28.7026424407959, "global_step": 627114, "epoch": 7555} {"train_loss": -28.638208389282227, "global_step": 627115, "epoch": 7555} {"train_loss": -28.162405014038086, "global_step": 627116, "epoch": 7555} {"train_loss": -28.473703384399414, "global_step": 627117, "epoch": 7555} {"train_loss": -28.41902732849121, "global_step": 627118, "epoch": 7555} {"train_loss": -28.38409423828125, "global_step": 627119, "epoch": 7555} {"train_loss": -28.597211837768555, "global_step": 627120, "epoch": 7555} {"train_loss": -28.3920955657959, "global_step": 627121, "epoch": 7555} {"train_loss": -28.554174423217773, "global_step": 627122, "epoch": 7555} {"train_loss": -28.616104125976562, "global_step": 627123, "epoch": 7555} {"train_loss": -28.223529815673828, "global_step": 627124, "epoch": 7555} {"train_loss": -28.5404052734375, "global_step": 627125, "epoch": 7555} {"train_loss": -28.290027618408203, "global_step": 627126, "epoch": 7555} {"train_loss": -28.377145767211914, "global_step": 627127, "epoch": 7555} {"train_loss": -28.247007369995117, "global_step": 627128, "epoch": 7555} {"train_loss": -28.2098331451416, "global_step": 627129, "epoch": 7555} {"train_loss": -28.58795738220215, "global_step": 627130, "epoch": 7555} {"train_loss": -28.13922691345215, "global_step": 627131, "epoch": 7555} {"train_loss": -28.9458065032959, "global_step": 627132, "epoch": 7555} {"train_loss": -28.016998291015625, "global_step": 627133, "epoch": 7555} {"train_loss": -28.351205825805664, "global_step": 627134, "epoch": 7555} {"train_loss": -28.189783096313477, "global_step": 627135, "epoch": 7555} {"train_loss": -28.46912956237793, "global_step": 627136, "epoch": 7555} {"train_loss": -27.84541130065918, "global_step": 627137, "epoch": 7555} {"train_loss": -28.326757431030273, "global_step": 627138, "epoch": 7555} {"train_loss": -27.913726806640625, "global_step": 627139, "epoch": 7555} {"train_loss": -28.175662994384766, "global_step": 627140, "epoch": 7555} {"train_loss": -27.243518829345703, "global_step": 627141, "epoch": 7555} {"train_loss": -25.322391510009766, "global_step": 627142, "epoch": 7555} {"train_loss": -19.418893814086914, "global_step": 627143, "epoch": 7555} {"train_loss": -23.266672134399414, "global_step": 627144, "epoch": 7555} {"train_loss": -25.619787216186523, "global_step": 627145, "epoch": 7555} {"train_loss": -25.248382568359375, "global_step": 627146, "epoch": 7555} {"train_loss": -27.807904002178145, "global_step": 627147, "epoch": 7555, "val_loss": 6802351.0} {"train_loss": -24.497251510620117, "global_step": 627148, "epoch": 7556} {"train_loss": -22.665353775024414, "global_step": 627149, "epoch": 7556} {"train_loss": -25.410871505737305, "global_step": 627150, "epoch": 7556} {"train_loss": -23.339303970336914, "global_step": 627151, "epoch": 7556} {"train_loss": -24.556257247924805, "global_step": 627152, "epoch": 7556} {"train_loss": -25.212329864501953, "global_step": 627153, "epoch": 7556} {"train_loss": -25.4649715423584, "global_step": 627154, "epoch": 7556} {"train_loss": -24.44815444946289, "global_step": 627155, "epoch": 7556} {"train_loss": -24.81564712524414, "global_step": 627156, "epoch": 7556} {"train_loss": -25.129369735717773, "global_step": 627157, "epoch": 7556} {"train_loss": -25.2946720123291, "global_step": 627158, "epoch": 7556} {"train_loss": -26.05829429626465, "global_step": 627159, "epoch": 7556} {"train_loss": -25.505359649658203, "global_step": 627160, "epoch": 7556} {"train_loss": -25.094511032104492, "global_step": 627161, "epoch": 7556} {"train_loss": -25.45793342590332, "global_step": 627162, "epoch": 7556} {"train_loss": -26.02005386352539, "global_step": 627163, "epoch": 7556} {"train_loss": -26.228017807006836, "global_step": 627164, "epoch": 7556} {"train_loss": -26.062063217163086, "global_step": 627165, "epoch": 7556} {"train_loss": -25.750898361206055, "global_step": 627166, "epoch": 7556} {"train_loss": -25.855518341064453, "global_step": 627167, "epoch": 7556} {"train_loss": -26.15805435180664, "global_step": 627168, "epoch": 7556} {"train_loss": -26.149337768554688, "global_step": 627169, "epoch": 7556} {"train_loss": -26.02204704284668, "global_step": 627170, "epoch": 7556} {"train_loss": -26.179624557495117, "global_step": 627171, "epoch": 7556} {"train_loss": -26.163171768188477, "global_step": 627172, "epoch": 7556} {"train_loss": -26.290063858032227, "global_step": 627173, "epoch": 7556} {"train_loss": -26.58344078063965, "global_step": 627174, "epoch": 7556} {"train_loss": -26.821949005126953, "global_step": 627175, "epoch": 7556} {"train_loss": -26.79022789001465, "global_step": 627176, "epoch": 7556} {"train_loss": -27.164596557617188, "global_step": 627177, "epoch": 7556} {"train_loss": -26.714258193969727, "global_step": 627178, "epoch": 7556} {"train_loss": -26.815250396728516, "global_step": 627179, "epoch": 7556} {"train_loss": -27.10347557067871, "global_step": 627180, "epoch": 7556} {"train_loss": -26.929126739501953, "global_step": 627181, "epoch": 7556} {"train_loss": -27.187667846679688, "global_step": 627182, "epoch": 7556} {"train_loss": -26.867746353149414, "global_step": 627183, "epoch": 7556} {"train_loss": -27.214887619018555, "global_step": 627184, "epoch": 7556} {"train_loss": -26.730924606323242, "global_step": 627185, "epoch": 7556} {"train_loss": -27.05267906188965, "global_step": 627186, "epoch": 7556} {"train_loss": -27.267908096313477, "global_step": 627187, "epoch": 7556} {"train_loss": -27.291479110717773, "global_step": 627188, "epoch": 7556} {"train_loss": -26.88983726501465, "global_step": 627189, "epoch": 7556} {"train_loss": -27.11732292175293, "global_step": 627190, "epoch": 7556} {"train_loss": -27.273406982421875, "global_step": 627191, "epoch": 7556} {"train_loss": -27.474655151367188, "global_step": 627192, "epoch": 7556} {"train_loss": -27.380090713500977, "global_step": 627193, "epoch": 7556} {"train_loss": -27.517175674438477, "global_step": 627194, "epoch": 7556} {"train_loss": -27.373931884765625, "global_step": 627195, "epoch": 7556} {"train_loss": -27.4888973236084, "global_step": 627196, "epoch": 7556} {"train_loss": -27.53114128112793, "global_step": 627197, "epoch": 7556} {"train_loss": -27.647153854370117, "global_step": 627198, "epoch": 7556} {"train_loss": -27.426898956298828, "global_step": 627199, "epoch": 7556} {"train_loss": -27.302366256713867, "global_step": 627200, "epoch": 7556} {"train_loss": -27.50873374938965, "global_step": 627201, "epoch": 7556} {"train_loss": -27.625553131103516, "global_step": 627202, "epoch": 7556} {"train_loss": -27.868148803710938, "global_step": 627203, "epoch": 7556} {"train_loss": -27.61648941040039, "global_step": 627204, "epoch": 7556} {"train_loss": -27.863245010375977, "global_step": 627205, "epoch": 7556} {"train_loss": -27.43812370300293, "global_step": 627206, "epoch": 7556} {"train_loss": -27.983875274658203, "global_step": 627207, "epoch": 7556} {"train_loss": -27.9146671295166, "global_step": 627208, "epoch": 7556} {"train_loss": -27.512603759765625, "global_step": 627209, "epoch": 7556} {"train_loss": -28.093128204345703, "global_step": 627210, "epoch": 7556} {"train_loss": -27.566679000854492, "global_step": 627211, "epoch": 7556} {"train_loss": -27.860288619995117, "global_step": 627212, "epoch": 7556} {"train_loss": -28.10475730895996, "global_step": 627213, "epoch": 7556} {"train_loss": -27.829145431518555, "global_step": 627214, "epoch": 7556} {"train_loss": -27.851659774780273, "global_step": 627215, "epoch": 7556} {"train_loss": -27.780187606811523, "global_step": 627216, "epoch": 7556} {"train_loss": -28.196430206298828, "global_step": 627217, "epoch": 7556} {"train_loss": -28.145917892456055, "global_step": 627218, "epoch": 7556} {"train_loss": -28.06686782836914, "global_step": 627219, "epoch": 7556} {"train_loss": -28.05689811706543, "global_step": 627220, "epoch": 7556} {"train_loss": -27.985309600830078, "global_step": 627221, "epoch": 7556} {"train_loss": -28.0101261138916, "global_step": 627222, "epoch": 7556} {"train_loss": -28.04693603515625, "global_step": 627223, "epoch": 7556} {"train_loss": -28.518484115600586, "global_step": 627224, "epoch": 7556} {"train_loss": -28.53420066833496, "global_step": 627225, "epoch": 7556} {"train_loss": -27.997669219970703, "global_step": 627226, "epoch": 7556} {"train_loss": -28.240924835205078, "global_step": 627227, "epoch": 7556} {"train_loss": -28.22611427307129, "global_step": 627228, "epoch": 7556} {"train_loss": -28.13014793395996, "global_step": 627229, "epoch": 7556} {"train_loss": -26.905262567910803, "global_step": 627230, "epoch": 7556, "val_loss": 6726829.0} {"train_loss": -27.894556045532227, "global_step": 627231, "epoch": 7557} {"train_loss": -27.15498161315918, "global_step": 627232, "epoch": 7557} {"train_loss": -26.822235107421875, "global_step": 627233, "epoch": 7557} {"train_loss": -27.367355346679688, "global_step": 627234, "epoch": 7557} {"train_loss": -27.773303985595703, "global_step": 627235, "epoch": 7557} {"train_loss": -26.883909225463867, "global_step": 627236, "epoch": 7557} {"train_loss": -26.201557159423828, "global_step": 627237, "epoch": 7557} {"train_loss": -27.322301864624023, "global_step": 627238, "epoch": 7557} {"train_loss": -27.86859130859375, "global_step": 627239, "epoch": 7557} {"train_loss": -27.49239158630371, "global_step": 627240, "epoch": 7557} {"train_loss": -27.841144561767578, "global_step": 627241, "epoch": 7557} {"train_loss": -27.587182998657227, "global_step": 627242, "epoch": 7557} {"train_loss": -27.352985382080078, "global_step": 627243, "epoch": 7557} {"train_loss": -27.69565200805664, "global_step": 627244, "epoch": 7557} {"train_loss": -27.946491241455078, "global_step": 627245, "epoch": 7557} {"train_loss": -27.979816436767578, "global_step": 627246, "epoch": 7557} {"train_loss": -27.85519790649414, "global_step": 627247, "epoch": 7557} {"train_loss": -27.9229736328125, "global_step": 627248, "epoch": 7557} {"train_loss": -28.127756118774414, "global_step": 627249, "epoch": 7557} {"train_loss": -27.95590591430664, "global_step": 627250, "epoch": 7557} {"train_loss": -28.178319931030273, "global_step": 627251, "epoch": 7557} {"train_loss": -27.889135360717773, "global_step": 627252, "epoch": 7557} {"train_loss": -28.15140724182129, "global_step": 627253, "epoch": 7557} {"train_loss": -27.849960327148438, "global_step": 627254, "epoch": 7557} {"train_loss": -28.12981605529785, "global_step": 627255, "epoch": 7557} {"train_loss": -27.766708374023438, "global_step": 627256, "epoch": 7557} {"train_loss": -28.329980850219727, "global_step": 627257, "epoch": 7557} {"train_loss": -27.975473403930664, "global_step": 627258, "epoch": 7557} {"train_loss": -28.20654296875, "global_step": 627259, "epoch": 7557} {"train_loss": -28.203466415405273, "global_step": 627260, "epoch": 7557} {"train_loss": -27.953510284423828, "global_step": 627261, "epoch": 7557} {"train_loss": -28.271642684936523, "global_step": 627262, "epoch": 7557} {"train_loss": -28.1841983795166, "global_step": 627263, "epoch": 7557} {"train_loss": -27.92475700378418, "global_step": 627264, "epoch": 7557} {"train_loss": -27.9561710357666, "global_step": 627265, "epoch": 7557} {"train_loss": -28.464344024658203, "global_step": 627266, "epoch": 7557} {"train_loss": -28.074872970581055, "global_step": 627267, "epoch": 7557} {"train_loss": -28.533832550048828, "global_step": 627268, "epoch": 7557} {"train_loss": -28.31312370300293, "global_step": 627269, "epoch": 7557} {"train_loss": -28.0539608001709, "global_step": 627270, "epoch": 7557} {"train_loss": -28.233556747436523, "global_step": 627271, "epoch": 7557} {"train_loss": -28.151330947875977, "global_step": 627272, "epoch": 7557} {"train_loss": -28.859912872314453, "global_step": 627273, "epoch": 7557} {"train_loss": -28.20627784729004, "global_step": 627274, "epoch": 7557} {"train_loss": -27.748458862304688, "global_step": 627275, "epoch": 7557} {"train_loss": -28.11481285095215, "global_step": 627276, "epoch": 7557} {"train_loss": -28.33668327331543, "global_step": 627277, "epoch": 7557} {"train_loss": -28.071292877197266, "global_step": 627278, "epoch": 7557} {"train_loss": -28.50556755065918, "global_step": 627279, "epoch": 7557} {"train_loss": -28.21896743774414, "global_step": 627280, "epoch": 7557} {"train_loss": -28.62757682800293, "global_step": 627281, "epoch": 7557} {"train_loss": -28.473073959350586, "global_step": 627282, "epoch": 7557} {"train_loss": -28.4206600189209, "global_step": 627283, "epoch": 7557} {"train_loss": -28.539520263671875, "global_step": 627284, "epoch": 7557} {"train_loss": -28.32491111755371, "global_step": 627285, "epoch": 7557} {"train_loss": -28.678476333618164, "global_step": 627286, "epoch": 7557} {"train_loss": -28.26973533630371, "global_step": 627287, "epoch": 7557} {"train_loss": -28.30779457092285, "global_step": 627288, "epoch": 7557} {"train_loss": -28.45720863342285, "global_step": 627289, "epoch": 7557} {"train_loss": -28.592288970947266, "global_step": 627290, "epoch": 7557} {"train_loss": -28.509321212768555, "global_step": 627291, "epoch": 7557} {"train_loss": -28.62396240234375, "global_step": 627292, "epoch": 7557} {"train_loss": -28.63873291015625, "global_step": 627293, "epoch": 7557} {"train_loss": -28.544071197509766, "global_step": 627294, "epoch": 7557} {"train_loss": -28.1925048828125, "global_step": 627295, "epoch": 7557} {"train_loss": -28.732282638549805, "global_step": 627296, "epoch": 7557} {"train_loss": -28.191312789916992, "global_step": 627297, "epoch": 7557} {"train_loss": -28.336130142211914, "global_step": 627298, "epoch": 7557} {"train_loss": -28.4514102935791, "global_step": 627299, "epoch": 7557} {"train_loss": -28.332412719726562, "global_step": 627300, "epoch": 7557} {"train_loss": -28.5841064453125, "global_step": 627301, "epoch": 7557} {"train_loss": -28.063215255737305, "global_step": 627302, "epoch": 7557} {"train_loss": -28.48740577697754, "global_step": 627303, "epoch": 7557} {"train_loss": -28.117033004760742, "global_step": 627304, "epoch": 7557} {"train_loss": -28.194995880126953, "global_step": 627305, "epoch": 7557} {"train_loss": -28.43727684020996, "global_step": 627306, "epoch": 7557} {"train_loss": -28.356210708618164, "global_step": 627307, "epoch": 7557} {"train_loss": -28.26995277404785, "global_step": 627308, "epoch": 7557} {"train_loss": -28.590051651000977, "global_step": 627309, "epoch": 7557} {"train_loss": -27.965869903564453, "global_step": 627310, "epoch": 7557} {"train_loss": -28.058347702026367, "global_step": 627311, "epoch": 7557} {"train_loss": -28.139379501342773, "global_step": 627312, "epoch": 7557} {"train_loss": -28.094803683729058, "global_step": 627313, "epoch": 7557, "val_loss": 6697385.5} {"train_loss": -27.302709579467773, "global_step": 627314, "epoch": 7558} {"train_loss": -27.4055233001709, "global_step": 627315, "epoch": 7558} {"train_loss": -27.808359146118164, "global_step": 627316, "epoch": 7558} {"train_loss": -27.8324031829834, "global_step": 627317, "epoch": 7558} {"train_loss": -27.590499877929688, "global_step": 627318, "epoch": 7558} {"train_loss": -27.50593376159668, "global_step": 627319, "epoch": 7558} {"train_loss": -27.628747940063477, "global_step": 627320, "epoch": 7558} {"train_loss": -27.7839298248291, "global_step": 627321, "epoch": 7558} {"train_loss": -27.794286727905273, "global_step": 627322, "epoch": 7558} {"train_loss": -27.568374633789062, "global_step": 627323, "epoch": 7558} {"train_loss": -28.06705093383789, "global_step": 627324, "epoch": 7558} {"train_loss": -27.7778377532959, "global_step": 627325, "epoch": 7558} {"train_loss": -27.99152946472168, "global_step": 627326, "epoch": 7558} {"train_loss": -28.150043487548828, "global_step": 627327, "epoch": 7558} {"train_loss": -27.90570640563965, "global_step": 627328, "epoch": 7558} {"train_loss": -27.993398666381836, "global_step": 627329, "epoch": 7558} {"train_loss": -27.7291202545166, "global_step": 627330, "epoch": 7558} {"train_loss": -28.205503463745117, "global_step": 627331, "epoch": 7558} {"train_loss": -27.75176429748535, "global_step": 627332, "epoch": 7558} {"train_loss": -28.207305908203125, "global_step": 627333, "epoch": 7558} {"train_loss": -28.130578994750977, "global_step": 627334, "epoch": 7558} {"train_loss": -28.13553810119629, "global_step": 627335, "epoch": 7558} {"train_loss": -27.964807510375977, "global_step": 627336, "epoch": 7558} {"train_loss": -28.277856826782227, "global_step": 627337, "epoch": 7558} {"train_loss": -28.1904239654541, "global_step": 627338, "epoch": 7558} {"train_loss": -28.21272087097168, "global_step": 627339, "epoch": 7558} {"train_loss": -28.23587417602539, "global_step": 627340, "epoch": 7558} {"train_loss": -28.132221221923828, "global_step": 627341, "epoch": 7558} {"train_loss": -28.246967315673828, "global_step": 627342, "epoch": 7558} {"train_loss": -28.68538475036621, "global_step": 627343, "epoch": 7558} {"train_loss": -28.478443145751953, "global_step": 627344, "epoch": 7558} {"train_loss": -28.482624053955078, "global_step": 627345, "epoch": 7558} {"train_loss": -27.741147994995117, "global_step": 627346, "epoch": 7558} {"train_loss": -28.0604248046875, "global_step": 627347, "epoch": 7558} {"train_loss": -27.819318771362305, "global_step": 627348, "epoch": 7558} {"train_loss": -28.458850860595703, "global_step": 627349, "epoch": 7558} {"train_loss": -28.080915451049805, "global_step": 627350, "epoch": 7558} {"train_loss": -27.96900749206543, "global_step": 627351, "epoch": 7558} {"train_loss": -28.423145294189453, "global_step": 627352, "epoch": 7558} {"train_loss": -28.338993072509766, "global_step": 627353, "epoch": 7558} {"train_loss": -28.29610252380371, "global_step": 627354, "epoch": 7558} {"train_loss": -28.18865966796875, "global_step": 627355, "epoch": 7558} {"train_loss": -28.24298667907715, "global_step": 627356, "epoch": 7558} {"train_loss": -27.930408477783203, "global_step": 627357, "epoch": 7558} {"train_loss": -27.82179069519043, "global_step": 627358, "epoch": 7558} {"train_loss": -28.38620376586914, "global_step": 627359, "epoch": 7558} {"train_loss": -28.26344108581543, "global_step": 627360, "epoch": 7558} {"train_loss": -28.021127700805664, "global_step": 627361, "epoch": 7558} {"train_loss": -28.47096824645996, "global_step": 627362, "epoch": 7558} {"train_loss": -28.327014923095703, "global_step": 627363, "epoch": 7558} {"train_loss": -28.1378116607666, "global_step": 627364, "epoch": 7558} {"train_loss": -27.6916446685791, "global_step": 627365, "epoch": 7558} {"train_loss": -27.758779525756836, "global_step": 627366, "epoch": 7558} {"train_loss": -28.576231002807617, "global_step": 627367, "epoch": 7558} {"train_loss": -28.63142204284668, "global_step": 627368, "epoch": 7558} {"train_loss": -28.201547622680664, "global_step": 627369, "epoch": 7558} {"train_loss": -28.330341339111328, "global_step": 627370, "epoch": 7558} {"train_loss": -28.30411148071289, "global_step": 627371, "epoch": 7558} {"train_loss": -28.50372314453125, "global_step": 627372, "epoch": 7558} {"train_loss": -28.5185489654541, "global_step": 627373, "epoch": 7558} {"train_loss": -28.225128173828125, "global_step": 627374, "epoch": 7558} {"train_loss": -28.16983985900879, "global_step": 627375, "epoch": 7558} {"train_loss": -28.358457565307617, "global_step": 627376, "epoch": 7558} {"train_loss": -28.55301856994629, "global_step": 627377, "epoch": 7558} {"train_loss": -28.438169479370117, "global_step": 627378, "epoch": 7558} {"train_loss": -28.21084976196289, "global_step": 627379, "epoch": 7558} {"train_loss": -28.375885009765625, "global_step": 627380, "epoch": 7558} {"train_loss": -28.56568717956543, "global_step": 627381, "epoch": 7558} {"train_loss": -28.2918701171875, "global_step": 627382, "epoch": 7558} {"train_loss": -28.129425048828125, "global_step": 627383, "epoch": 7558} {"train_loss": -28.292469024658203, "global_step": 627384, "epoch": 7558} {"train_loss": -28.33399772644043, "global_step": 627385, "epoch": 7558} {"train_loss": -28.143329620361328, "global_step": 627386, "epoch": 7558} {"train_loss": -28.392194747924805, "global_step": 627387, "epoch": 7558} {"train_loss": -28.182397842407227, "global_step": 627388, "epoch": 7558} {"train_loss": -28.412866592407227, "global_step": 627389, "epoch": 7558} {"train_loss": -28.285858154296875, "global_step": 627390, "epoch": 7558} {"train_loss": -28.062408447265625, "global_step": 627391, "epoch": 7558} {"train_loss": -28.16827392578125, "global_step": 627392, "epoch": 7558} {"train_loss": -28.45392417907715, "global_step": 627393, "epoch": 7558} {"train_loss": -28.133214950561523, "global_step": 627394, "epoch": 7558} {"train_loss": -28.786252975463867, "global_step": 627395, "epoch": 7558} {"train_loss": -28.153756291033275, "global_step": 627396, "epoch": 7558, "val_loss": 6679555.0} {"train_loss": -27.9603214263916, "global_step": 627397, "epoch": 7559} {"train_loss": -26.87933921813965, "global_step": 627398, "epoch": 7559} {"train_loss": -26.637344360351562, "global_step": 627399, "epoch": 7559} {"train_loss": -26.58316421508789, "global_step": 627400, "epoch": 7559} {"train_loss": -27.579303741455078, "global_step": 627401, "epoch": 7559} {"train_loss": -27.513769149780273, "global_step": 627402, "epoch": 7559} {"train_loss": -27.741718292236328, "global_step": 627403, "epoch": 7559} {"train_loss": -27.927732467651367, "global_step": 627404, "epoch": 7559} {"train_loss": -27.014850616455078, "global_step": 627405, "epoch": 7559} {"train_loss": -27.64188003540039, "global_step": 627406, "epoch": 7559} {"train_loss": -28.003198623657227, "global_step": 627407, "epoch": 7559} {"train_loss": -27.869583129882812, "global_step": 627408, "epoch": 7559} {"train_loss": -27.7933406829834, "global_step": 627409, "epoch": 7559} {"train_loss": -27.700672149658203, "global_step": 627410, "epoch": 7559} {"train_loss": -28.2286319732666, "global_step": 627411, "epoch": 7559} {"train_loss": -27.812122344970703, "global_step": 627412, "epoch": 7559} {"train_loss": -28.409534454345703, "global_step": 627413, "epoch": 7559} {"train_loss": -27.76397132873535, "global_step": 627414, "epoch": 7559} {"train_loss": -27.72918128967285, "global_step": 627415, "epoch": 7559} {"train_loss": -27.750873565673828, "global_step": 627416, "epoch": 7559} {"train_loss": -28.1696834564209, "global_step": 627417, "epoch": 7559} {"train_loss": -27.70609474182129, "global_step": 627418, "epoch": 7559} {"train_loss": -28.07167625427246, "global_step": 627419, "epoch": 7559} {"train_loss": -28.140039443969727, "global_step": 627420, "epoch": 7559} {"train_loss": -27.859357833862305, "global_step": 627421, "epoch": 7559} {"train_loss": -28.349720001220703, "global_step": 627422, "epoch": 7559} {"train_loss": -28.302082061767578, "global_step": 627423, "epoch": 7559} {"train_loss": -28.134204864501953, "global_step": 627424, "epoch": 7559} {"train_loss": -28.260412216186523, "global_step": 627425, "epoch": 7559} {"train_loss": -28.01600456237793, "global_step": 627426, "epoch": 7559} {"train_loss": -27.98752784729004, "global_step": 627427, "epoch": 7559} {"train_loss": -28.37556266784668, "global_step": 627428, "epoch": 7559} {"train_loss": -28.205045700073242, "global_step": 627429, "epoch": 7559} {"train_loss": -28.44140625, "global_step": 627430, "epoch": 7559} {"train_loss": -28.0697021484375, "global_step": 627431, "epoch": 7559} {"train_loss": -28.008045196533203, "global_step": 627432, "epoch": 7559} {"train_loss": -28.21900749206543, "global_step": 627433, "epoch": 7559} {"train_loss": -28.469038009643555, "global_step": 627434, "epoch": 7559} {"train_loss": -28.139667510986328, "global_step": 627435, "epoch": 7559} {"train_loss": -28.40097427368164, "global_step": 627436, "epoch": 7559} {"train_loss": -28.5614070892334, "global_step": 627437, "epoch": 7559} {"train_loss": -28.217609405517578, "global_step": 627438, "epoch": 7559} {"train_loss": -27.9529972076416, "global_step": 627439, "epoch": 7559} {"train_loss": -28.2613582611084, "global_step": 627440, "epoch": 7559} {"train_loss": -28.248273849487305, "global_step": 627441, "epoch": 7559} {"train_loss": -28.307783126831055, "global_step": 627442, "epoch": 7559} {"train_loss": -28.265344619750977, "global_step": 627443, "epoch": 7559} {"train_loss": -28.27595329284668, "global_step": 627444, "epoch": 7559} {"train_loss": -28.439245223999023, "global_step": 627445, "epoch": 7559} {"train_loss": -28.616308212280273, "global_step": 627446, "epoch": 7559} {"train_loss": -28.4819393157959, "global_step": 627447, "epoch": 7559} {"train_loss": -28.572362899780273, "global_step": 627448, "epoch": 7559} {"train_loss": -28.337188720703125, "global_step": 627449, "epoch": 7559} {"train_loss": -28.278165817260742, "global_step": 627450, "epoch": 7559} {"train_loss": -28.508188247680664, "global_step": 627451, "epoch": 7559} {"train_loss": -28.508337020874023, "global_step": 627452, "epoch": 7559} {"train_loss": -28.325632095336914, "global_step": 627453, "epoch": 7559} {"train_loss": -28.55994987487793, "global_step": 627454, "epoch": 7559} {"train_loss": -28.266340255737305, "global_step": 627455, "epoch": 7559} {"train_loss": -28.580896377563477, "global_step": 627456, "epoch": 7559} {"train_loss": -28.338348388671875, "global_step": 627457, "epoch": 7559} {"train_loss": -28.31007957458496, "global_step": 627458, "epoch": 7559} {"train_loss": -28.32025146484375, "global_step": 627459, "epoch": 7559} {"train_loss": -27.805591583251953, "global_step": 627460, "epoch": 7559} {"train_loss": -28.577619552612305, "global_step": 627461, "epoch": 7559} {"train_loss": -28.36911392211914, "global_step": 627462, "epoch": 7559} {"train_loss": -28.27168083190918, "global_step": 627463, "epoch": 7559} {"train_loss": -28.2386417388916, "global_step": 627464, "epoch": 7559} {"train_loss": -27.998641967773438, "global_step": 627465, "epoch": 7559} {"train_loss": -28.064809799194336, "global_step": 627466, "epoch": 7559} {"train_loss": -28.317102432250977, "global_step": 627467, "epoch": 7559} {"train_loss": -28.53009605407715, "global_step": 627468, "epoch": 7559} {"train_loss": -27.92130470275879, "global_step": 627469, "epoch": 7559} {"train_loss": -28.123620986938477, "global_step": 627470, "epoch": 7559} {"train_loss": -28.173376083374023, "global_step": 627471, "epoch": 7559} {"train_loss": -28.076459884643555, "global_step": 627472, "epoch": 7559} {"train_loss": -28.281503677368164, "global_step": 627473, "epoch": 7559} {"train_loss": -27.610097885131836, "global_step": 627474, "epoch": 7559} {"train_loss": -28.11285400390625, "global_step": 627475, "epoch": 7559} {"train_loss": -27.943403244018555, "global_step": 627476, "epoch": 7559} {"train_loss": -28.02338218688965, "global_step": 627477, "epoch": 7559} {"train_loss": -28.55706787109375, "global_step": 627478, "epoch": 7559} {"train_loss": -28.07333452155791, "global_step": 627479, "epoch": 7559, "val_loss": 6783641.0} {"train_loss": -25.849796295166016, "global_step": 627480, "epoch": 7560} {"train_loss": -25.18088150024414, "global_step": 627481, "epoch": 7560} {"train_loss": -25.77530288696289, "global_step": 627482, "epoch": 7560} {"train_loss": -26.448816299438477, "global_step": 627483, "epoch": 7560} {"train_loss": -25.87830924987793, "global_step": 627484, "epoch": 7560} {"train_loss": -25.68979835510254, "global_step": 627485, "epoch": 7560} {"train_loss": -26.7520809173584, "global_step": 627486, "epoch": 7560} {"train_loss": -26.56760597229004, "global_step": 627487, "epoch": 7560} {"train_loss": -26.752710342407227, "global_step": 627488, "epoch": 7560} {"train_loss": -27.004880905151367, "global_step": 627489, "epoch": 7560} {"train_loss": -27.464496612548828, "global_step": 627490, "epoch": 7560} {"train_loss": -27.002994537353516, "global_step": 627491, "epoch": 7560} {"train_loss": -27.10126304626465, "global_step": 627492, "epoch": 7560} {"train_loss": -26.969043731689453, "global_step": 627493, "epoch": 7560} {"train_loss": -26.693838119506836, "global_step": 627494, "epoch": 7560} {"train_loss": -27.599889755249023, "global_step": 627495, "epoch": 7560} {"train_loss": -27.52034568786621, "global_step": 627496, "epoch": 7560} {"train_loss": -27.369596481323242, "global_step": 627497, "epoch": 7560} {"train_loss": -27.341785430908203, "global_step": 627498, "epoch": 7560} {"train_loss": -27.643274307250977, "global_step": 627499, "epoch": 7560} {"train_loss": -27.813373565673828, "global_step": 627500, "epoch": 7560} {"train_loss": -27.70354652404785, "global_step": 627501, "epoch": 7560} {"train_loss": -27.67521095275879, "global_step": 627502, "epoch": 7560} {"train_loss": -27.78968620300293, "global_step": 627503, "epoch": 7560} {"train_loss": -27.62485694885254, "global_step": 627504, "epoch": 7560} {"train_loss": -27.62118911743164, "global_step": 627505, "epoch": 7560} {"train_loss": -27.797595977783203, "global_step": 627506, "epoch": 7560} {"train_loss": -27.811185836791992, "global_step": 627507, "epoch": 7560} {"train_loss": -27.871484756469727, "global_step": 627508, "epoch": 7560} {"train_loss": -28.20587730407715, "global_step": 627509, "epoch": 7560} {"train_loss": -28.110761642456055, "global_step": 627510, "epoch": 7560} {"train_loss": -27.934158325195312, "global_step": 627511, "epoch": 7560} {"train_loss": -27.70233726501465, "global_step": 627512, "epoch": 7560} {"train_loss": -28.312274932861328, "global_step": 627513, "epoch": 7560} {"train_loss": -28.260839462280273, "global_step": 627514, "epoch": 7560} {"train_loss": -27.9345703125, "global_step": 627515, "epoch": 7560} {"train_loss": -28.424707412719727, "global_step": 627516, "epoch": 7560} {"train_loss": -27.76755714416504, "global_step": 627517, "epoch": 7560} {"train_loss": -27.953155517578125, "global_step": 627518, "epoch": 7560} {"train_loss": -27.972455978393555, "global_step": 627519, "epoch": 7560} {"train_loss": -28.458581924438477, "global_step": 627520, "epoch": 7560} {"train_loss": -27.972585678100586, "global_step": 627521, "epoch": 7560} {"train_loss": -28.029138565063477, "global_step": 627522, "epoch": 7560} {"train_loss": -28.45100212097168, "global_step": 627523, "epoch": 7560} {"train_loss": -27.9560489654541, "global_step": 627524, "epoch": 7560} {"train_loss": -28.087690353393555, "global_step": 627525, "epoch": 7560} {"train_loss": -28.36769676208496, "global_step": 627526, "epoch": 7560} {"train_loss": -28.331335067749023, "global_step": 627527, "epoch": 7560} {"train_loss": -27.9261474609375, "global_step": 627528, "epoch": 7560} {"train_loss": -28.391427993774414, "global_step": 627529, "epoch": 7560} {"train_loss": -28.485727310180664, "global_step": 627530, "epoch": 7560} {"train_loss": -28.193206787109375, "global_step": 627531, "epoch": 7560} {"train_loss": -28.23638343811035, "global_step": 627532, "epoch": 7560} {"train_loss": -28.28049659729004, "global_step": 627533, "epoch": 7560} {"train_loss": -28.616168975830078, "global_step": 627534, "epoch": 7560} {"train_loss": -28.6405029296875, "global_step": 627535, "epoch": 7560} {"train_loss": -28.7110595703125, "global_step": 627536, "epoch": 7560} {"train_loss": -28.688940048217773, "global_step": 627537, "epoch": 7560} {"train_loss": -28.36604118347168, "global_step": 627538, "epoch": 7560} {"train_loss": -28.595346450805664, "global_step": 627539, "epoch": 7560} {"train_loss": -28.51778221130371, "global_step": 627540, "epoch": 7560} {"train_loss": -28.26405906677246, "global_step": 627541, "epoch": 7560} {"train_loss": -28.443159103393555, "global_step": 627542, "epoch": 7560} {"train_loss": -28.55124855041504, "global_step": 627543, "epoch": 7560} {"train_loss": -28.370044708251953, "global_step": 627544, "epoch": 7560} {"train_loss": -28.257389068603516, "global_step": 627545, "epoch": 7560} {"train_loss": -28.224584579467773, "global_step": 627546, "epoch": 7560} {"train_loss": -28.27436637878418, "global_step": 627547, "epoch": 7560} {"train_loss": -28.626361846923828, "global_step": 627548, "epoch": 7560} {"train_loss": -28.370737075805664, "global_step": 627549, "epoch": 7560} {"train_loss": -28.537073135375977, "global_step": 627550, "epoch": 7560} {"train_loss": -28.226058959960938, "global_step": 627551, "epoch": 7560} {"train_loss": -28.048505783081055, "global_step": 627552, "epoch": 7560} {"train_loss": -28.13591957092285, "global_step": 627553, "epoch": 7560} {"train_loss": -28.29829216003418, "global_step": 627554, "epoch": 7560} {"train_loss": -28.09392738342285, "global_step": 627555, "epoch": 7560} {"train_loss": -28.541336059570312, "global_step": 627556, "epoch": 7560} {"train_loss": -28.525320053100586, "global_step": 627557, "epoch": 7560} {"train_loss": -28.373321533203125, "global_step": 627558, "epoch": 7560} {"train_loss": -28.294660568237305, "global_step": 627559, "epoch": 7560} {"train_loss": -28.153966903686523, "global_step": 627560, "epoch": 7560} {"train_loss": -28.159534454345703, "global_step": 627561, "epoch": 7560} {"train_loss": -27.8498128408409, "global_step": 627562, "epoch": 7560, "val_loss": 6661548.0} {"train_loss": -27.468006134033203, "global_step": 627563, "epoch": 7561} {"train_loss": -27.394750595092773, "global_step": 627564, "epoch": 7561} {"train_loss": -27.36907386779785, "global_step": 627565, "epoch": 7561} {"train_loss": -28.088449478149414, "global_step": 627566, "epoch": 7561} {"train_loss": -27.73781394958496, "global_step": 627567, "epoch": 7561} {"train_loss": -27.624242782592773, "global_step": 627568, "epoch": 7561} {"train_loss": -27.420495986938477, "global_step": 627569, "epoch": 7561} {"train_loss": -27.785846710205078, "global_step": 627570, "epoch": 7561} {"train_loss": -27.608905792236328, "global_step": 627571, "epoch": 7561} {"train_loss": -28.132123947143555, "global_step": 627572, "epoch": 7561} {"train_loss": -28.042160034179688, "global_step": 627573, "epoch": 7561} {"train_loss": -27.933883666992188, "global_step": 627574, "epoch": 7561} {"train_loss": -27.953710556030273, "global_step": 627575, "epoch": 7561} {"train_loss": -27.68817710876465, "global_step": 627576, "epoch": 7561} {"train_loss": -27.84467124938965, "global_step": 627577, "epoch": 7561} {"train_loss": -28.178003311157227, "global_step": 627578, "epoch": 7561} {"train_loss": -27.65183448791504, "global_step": 627579, "epoch": 7561} {"train_loss": -28.061695098876953, "global_step": 627580, "epoch": 7561} {"train_loss": -28.343957901000977, "global_step": 627581, "epoch": 7561} {"train_loss": -27.921478271484375, "global_step": 627582, "epoch": 7561} {"train_loss": -28.50333023071289, "global_step": 627583, "epoch": 7561} {"train_loss": -27.984472274780273, "global_step": 627584, "epoch": 7561} {"train_loss": -28.112003326416016, "global_step": 627585, "epoch": 7561} {"train_loss": -28.06268310546875, "global_step": 627586, "epoch": 7561} {"train_loss": -27.711292266845703, "global_step": 627587, "epoch": 7561} {"train_loss": -28.252613067626953, "global_step": 627588, "epoch": 7561} {"train_loss": -27.749313354492188, "global_step": 627589, "epoch": 7561} {"train_loss": -28.185989379882812, "global_step": 627590, "epoch": 7561} {"train_loss": -28.274545669555664, "global_step": 627591, "epoch": 7561} {"train_loss": -28.362274169921875, "global_step": 627592, "epoch": 7561} {"train_loss": -28.266544342041016, "global_step": 627593, "epoch": 7561} {"train_loss": -28.190290451049805, "global_step": 627594, "epoch": 7561} {"train_loss": -27.94501304626465, "global_step": 627595, "epoch": 7561} {"train_loss": -28.28230094909668, "global_step": 627596, "epoch": 7561} {"train_loss": -28.019546508789062, "global_step": 627597, "epoch": 7561} {"train_loss": -27.99763298034668, "global_step": 627598, "epoch": 7561} {"train_loss": -28.069665908813477, "global_step": 627599, "epoch": 7561} {"train_loss": -28.494287490844727, "global_step": 627600, "epoch": 7561} {"train_loss": -28.28509521484375, "global_step": 627601, "epoch": 7561} {"train_loss": -28.25078773498535, "global_step": 627602, "epoch": 7561} {"train_loss": -27.9752197265625, "global_step": 627603, "epoch": 7561} {"train_loss": -28.371789932250977, "global_step": 627604, "epoch": 7561} {"train_loss": -28.63681411743164, "global_step": 627605, "epoch": 7561} {"train_loss": -28.31587028503418, "global_step": 627606, "epoch": 7561} {"train_loss": -28.121780395507812, "global_step": 627607, "epoch": 7561} {"train_loss": -28.229084014892578, "global_step": 627608, "epoch": 7561} {"train_loss": -28.140783309936523, "global_step": 627609, "epoch": 7561} {"train_loss": -27.67595863342285, "global_step": 627610, "epoch": 7561} {"train_loss": -27.984760284423828, "global_step": 627611, "epoch": 7561} {"train_loss": -28.166425704956055, "global_step": 627612, "epoch": 7561} {"train_loss": -28.298669815063477, "global_step": 627613, "epoch": 7561} {"train_loss": -27.580671310424805, "global_step": 627614, "epoch": 7561} {"train_loss": -27.0364933013916, "global_step": 627615, "epoch": 7561} {"train_loss": -27.259618759155273, "global_step": 627616, "epoch": 7561} {"train_loss": -27.90716552734375, "global_step": 627617, "epoch": 7561} {"train_loss": -27.46930503845215, "global_step": 627618, "epoch": 7561} {"train_loss": -26.69467544555664, "global_step": 627619, "epoch": 7561} {"train_loss": -27.328433990478516, "global_step": 627620, "epoch": 7561} {"train_loss": -27.6878662109375, "global_step": 627621, "epoch": 7561} {"train_loss": -27.468103408813477, "global_step": 627622, "epoch": 7561} {"train_loss": -27.22607421875, "global_step": 627623, "epoch": 7561} {"train_loss": -27.710947036743164, "global_step": 627624, "epoch": 7561} {"train_loss": -27.459089279174805, "global_step": 627625, "epoch": 7561} {"train_loss": -27.929895401000977, "global_step": 627626, "epoch": 7561} {"train_loss": -27.639728546142578, "global_step": 627627, "epoch": 7561} {"train_loss": -27.819726943969727, "global_step": 627628, "epoch": 7561} {"train_loss": -27.70460319519043, "global_step": 627629, "epoch": 7561} {"train_loss": -27.7965087890625, "global_step": 627630, "epoch": 7561} {"train_loss": -27.940839767456055, "global_step": 627631, "epoch": 7561} {"train_loss": -27.86020851135254, "global_step": 627632, "epoch": 7561} {"train_loss": -27.954023361206055, "global_step": 627633, "epoch": 7561} {"train_loss": -27.581390380859375, "global_step": 627634, "epoch": 7561} {"train_loss": -28.302875518798828, "global_step": 627635, "epoch": 7561} {"train_loss": -27.6967830657959, "global_step": 627636, "epoch": 7561} {"train_loss": -27.89275550842285, "global_step": 627637, "epoch": 7561} {"train_loss": -27.787221908569336, "global_step": 627638, "epoch": 7561} {"train_loss": -27.633560180664062, "global_step": 627639, "epoch": 7561} {"train_loss": -28.27349853515625, "global_step": 627640, "epoch": 7561} {"train_loss": -27.9954891204834, "global_step": 627641, "epoch": 7561} {"train_loss": -28.075658798217773, "global_step": 627642, "epoch": 7561} {"train_loss": -28.2590274810791, "global_step": 627643, "epoch": 7561} {"train_loss": -27.6243953704834, "global_step": 627644, "epoch": 7561} {"train_loss": -27.90285650506077, "global_step": 627645, "epoch": 7561, "val_loss": 6662856.0} {"train_loss": -27.148351669311523, "global_step": 627646, "epoch": 7562} {"train_loss": -28.26445960998535, "global_step": 627647, "epoch": 7562} {"train_loss": -27.727354049682617, "global_step": 627648, "epoch": 7562} {"train_loss": -27.623737335205078, "global_step": 627649, "epoch": 7562} {"train_loss": -27.84992790222168, "global_step": 627650, "epoch": 7562} {"train_loss": -27.79681396484375, "global_step": 627651, "epoch": 7562} {"train_loss": -28.00214195251465, "global_step": 627652, "epoch": 7562} {"train_loss": -27.567407608032227, "global_step": 627653, "epoch": 7562} {"train_loss": -27.928699493408203, "global_step": 627654, "epoch": 7562} {"train_loss": -27.899396896362305, "global_step": 627655, "epoch": 7562} {"train_loss": -27.819135665893555, "global_step": 627656, "epoch": 7562} {"train_loss": -28.19927406311035, "global_step": 627657, "epoch": 7562} {"train_loss": -27.74492835998535, "global_step": 627658, "epoch": 7562} {"train_loss": -28.147363662719727, "global_step": 627659, "epoch": 7562} {"train_loss": -28.023273468017578, "global_step": 627660, "epoch": 7562} {"train_loss": -27.871753692626953, "global_step": 627661, "epoch": 7562} {"train_loss": -28.077056884765625, "global_step": 627662, "epoch": 7562} {"train_loss": -27.959747314453125, "global_step": 627663, "epoch": 7562} {"train_loss": -28.12298583984375, "global_step": 627664, "epoch": 7562} {"train_loss": -28.100751876831055, "global_step": 627665, "epoch": 7562} {"train_loss": -28.26826286315918, "global_step": 627666, "epoch": 7562} {"train_loss": -28.0256290435791, "global_step": 627667, "epoch": 7562} {"train_loss": -28.48969078063965, "global_step": 627668, "epoch": 7562} {"train_loss": -28.03330421447754, "global_step": 627669, "epoch": 7562} {"train_loss": -28.26753044128418, "global_step": 627670, "epoch": 7562} {"train_loss": -28.416772842407227, "global_step": 627671, "epoch": 7562} {"train_loss": -28.407087326049805, "global_step": 627672, "epoch": 7562} {"train_loss": -28.497894287109375, "global_step": 627673, "epoch": 7562} {"train_loss": -27.892011642456055, "global_step": 627674, "epoch": 7562} {"train_loss": -28.52430534362793, "global_step": 627675, "epoch": 7562} {"train_loss": -27.99680519104004, "global_step": 627676, "epoch": 7562} {"train_loss": -28.34321403503418, "global_step": 627677, "epoch": 7562} {"train_loss": -28.54082679748535, "global_step": 627678, "epoch": 7562} {"train_loss": -28.040372848510742, "global_step": 627679, "epoch": 7562} {"train_loss": -28.466262817382812, "global_step": 627680, "epoch": 7562} {"train_loss": -28.073596954345703, "global_step": 627681, "epoch": 7562} {"train_loss": -28.869932174682617, "global_step": 627682, "epoch": 7562} {"train_loss": -28.241840362548828, "global_step": 627683, "epoch": 7562} {"train_loss": -28.186899185180664, "global_step": 627684, "epoch": 7562} {"train_loss": -28.442615509033203, "global_step": 627685, "epoch": 7562} {"train_loss": -28.32219886779785, "global_step": 627686, "epoch": 7562} {"train_loss": -28.222904205322266, "global_step": 627687, "epoch": 7562} {"train_loss": -28.457014083862305, "global_step": 627688, "epoch": 7562} {"train_loss": -28.474933624267578, "global_step": 627689, "epoch": 7562} {"train_loss": -28.661657333374023, "global_step": 627690, "epoch": 7562} {"train_loss": -28.48890495300293, "global_step": 627691, "epoch": 7562} {"train_loss": -28.498884201049805, "global_step": 627692, "epoch": 7562} {"train_loss": -28.350732803344727, "global_step": 627693, "epoch": 7562} {"train_loss": -28.26923179626465, "global_step": 627694, "epoch": 7562} {"train_loss": -28.23233413696289, "global_step": 627695, "epoch": 7562} {"train_loss": -28.11673355102539, "global_step": 627696, "epoch": 7562} {"train_loss": -27.764570236206055, "global_step": 627697, "epoch": 7562} {"train_loss": -27.4542236328125, "global_step": 627698, "epoch": 7562} {"train_loss": -27.89642333984375, "global_step": 627699, "epoch": 7562} {"train_loss": -28.088903427124023, "global_step": 627700, "epoch": 7562} {"train_loss": -28.14332389831543, "global_step": 627701, "epoch": 7562} {"train_loss": -28.585371017456055, "global_step": 627702, "epoch": 7562} {"train_loss": -28.27349853515625, "global_step": 627703, "epoch": 7562} {"train_loss": -28.42816734313965, "global_step": 627704, "epoch": 7562} {"train_loss": -28.01252555847168, "global_step": 627705, "epoch": 7562} {"train_loss": -28.37428092956543, "global_step": 627706, "epoch": 7562} {"train_loss": -27.721471786499023, "global_step": 627707, "epoch": 7562} {"train_loss": -28.220966339111328, "global_step": 627708, "epoch": 7562} {"train_loss": -27.927820205688477, "global_step": 627709, "epoch": 7562} {"train_loss": -27.676374435424805, "global_step": 627710, "epoch": 7562} {"train_loss": -28.179840087890625, "global_step": 627711, "epoch": 7562} {"train_loss": -27.980127334594727, "global_step": 627712, "epoch": 7562} {"train_loss": -27.840805053710938, "global_step": 627713, "epoch": 7562} {"train_loss": -28.003253936767578, "global_step": 627714, "epoch": 7562} {"train_loss": -28.1087646484375, "global_step": 627715, "epoch": 7562} {"train_loss": -27.596548080444336, "global_step": 627716, "epoch": 7562} {"train_loss": -27.87738609313965, "global_step": 627717, "epoch": 7562} {"train_loss": -27.60964012145996, "global_step": 627718, "epoch": 7562} {"train_loss": -27.95814323425293, "global_step": 627719, "epoch": 7562} {"train_loss": -28.02180290222168, "global_step": 627720, "epoch": 7562} {"train_loss": -28.151935577392578, "global_step": 627721, "epoch": 7562} {"train_loss": -28.0567626953125, "global_step": 627722, "epoch": 7562} {"train_loss": -27.860273361206055, "global_step": 627723, "epoch": 7562} {"train_loss": -27.903522491455078, "global_step": 627724, "epoch": 7562} {"train_loss": -27.879322052001953, "global_step": 627725, "epoch": 7562} {"train_loss": -28.240564346313477, "global_step": 627726, "epoch": 7562} {"train_loss": -28.305694580078125, "global_step": 627727, "epoch": 7562} {"train_loss": -28.102337412087316, "global_step": 627728, "epoch": 7562, "val_loss": 6676506.0} {"train_loss": -27.549163818359375, "global_step": 627729, "epoch": 7563} {"train_loss": -27.63153648376465, "global_step": 627730, "epoch": 7563} {"train_loss": -27.55183219909668, "global_step": 627731, "epoch": 7563} {"train_loss": -27.616092681884766, "global_step": 627732, "epoch": 7563} {"train_loss": -27.64312171936035, "global_step": 627733, "epoch": 7563} {"train_loss": -27.418807983398438, "global_step": 627734, "epoch": 7563} {"train_loss": -27.459814071655273, "global_step": 627735, "epoch": 7563} {"train_loss": -28.009109497070312, "global_step": 627736, "epoch": 7563} {"train_loss": -27.467395782470703, "global_step": 627737, "epoch": 7563} {"train_loss": -27.084735870361328, "global_step": 627738, "epoch": 7563} {"train_loss": -27.55881690979004, "global_step": 627739, "epoch": 7563} {"train_loss": -27.191986083984375, "global_step": 627740, "epoch": 7563} {"train_loss": -27.351776123046875, "global_step": 627741, "epoch": 7563} {"train_loss": -27.594385147094727, "global_step": 627742, "epoch": 7563} {"train_loss": -27.860065460205078, "global_step": 627743, "epoch": 7563} {"train_loss": -27.699893951416016, "global_step": 627744, "epoch": 7563} {"train_loss": -27.759183883666992, "global_step": 627745, "epoch": 7563} {"train_loss": -27.604572296142578, "global_step": 627746, "epoch": 7563} {"train_loss": -27.762670516967773, "global_step": 627747, "epoch": 7563} {"train_loss": -28.015705108642578, "global_step": 627748, "epoch": 7563} {"train_loss": -28.258981704711914, "global_step": 627749, "epoch": 7563} {"train_loss": -27.9462890625, "global_step": 627750, "epoch": 7563} {"train_loss": -28.140838623046875, "global_step": 627751, "epoch": 7563} {"train_loss": -27.605304718017578, "global_step": 627752, "epoch": 7563} {"train_loss": -28.235620498657227, "global_step": 627753, "epoch": 7563} {"train_loss": -28.141748428344727, "global_step": 627754, "epoch": 7563} {"train_loss": -27.976425170898438, "global_step": 627755, "epoch": 7563} {"train_loss": -27.92313575744629, "global_step": 627756, "epoch": 7563} {"train_loss": -28.330984115600586, "global_step": 627757, "epoch": 7563} {"train_loss": -27.741458892822266, "global_step": 627758, "epoch": 7563} {"train_loss": -28.596586227416992, "global_step": 627759, "epoch": 7563} {"train_loss": -27.98138427734375, "global_step": 627760, "epoch": 7563} {"train_loss": -27.930200576782227, "global_step": 627761, "epoch": 7563} {"train_loss": -28.448139190673828, "global_step": 627762, "epoch": 7563} {"train_loss": -28.395553588867188, "global_step": 627763, "epoch": 7563} {"train_loss": -28.43613052368164, "global_step": 627764, "epoch": 7563} {"train_loss": -28.09441566467285, "global_step": 627765, "epoch": 7563} {"train_loss": -28.40549659729004, "global_step": 627766, "epoch": 7563} {"train_loss": -28.352447509765625, "global_step": 627767, "epoch": 7563} {"train_loss": -28.433149337768555, "global_step": 627768, "epoch": 7563} {"train_loss": -27.783740997314453, "global_step": 627769, "epoch": 7563} {"train_loss": -27.983871459960938, "global_step": 627770, "epoch": 7563} {"train_loss": -28.2747802734375, "global_step": 627771, "epoch": 7563} {"train_loss": -28.081928253173828, "global_step": 627772, "epoch": 7563} {"train_loss": -28.003854751586914, "global_step": 627773, "epoch": 7563} {"train_loss": -27.93328857421875, "global_step": 627774, "epoch": 7563} {"train_loss": -28.030078887939453, "global_step": 627775, "epoch": 7563} {"train_loss": -27.724700927734375, "global_step": 627776, "epoch": 7563} {"train_loss": -27.930908203125, "global_step": 627777, "epoch": 7563} {"train_loss": -28.470563888549805, "global_step": 627778, "epoch": 7563} {"train_loss": -28.502195358276367, "global_step": 627779, "epoch": 7563} {"train_loss": -27.89923667907715, "global_step": 627780, "epoch": 7563} {"train_loss": -28.30354881286621, "global_step": 627781, "epoch": 7563} {"train_loss": -28.06178092956543, "global_step": 627782, "epoch": 7563} {"train_loss": -28.24799156188965, "global_step": 627783, "epoch": 7563} {"train_loss": -28.149927139282227, "global_step": 627784, "epoch": 7563} {"train_loss": -27.934926986694336, "global_step": 627785, "epoch": 7563} {"train_loss": -28.137847900390625, "global_step": 627786, "epoch": 7563} {"train_loss": -28.0891170501709, "global_step": 627787, "epoch": 7563} {"train_loss": -28.08270835876465, "global_step": 627788, "epoch": 7563} {"train_loss": -28.191381454467773, "global_step": 627789, "epoch": 7563} {"train_loss": -28.364490509033203, "global_step": 627790, "epoch": 7563} {"train_loss": -28.607410430908203, "global_step": 627791, "epoch": 7563} {"train_loss": -28.438053131103516, "global_step": 627792, "epoch": 7563} {"train_loss": -28.50446891784668, "global_step": 627793, "epoch": 7563} {"train_loss": -28.354400634765625, "global_step": 627794, "epoch": 7563} {"train_loss": -28.3986759185791, "global_step": 627795, "epoch": 7563} {"train_loss": -28.258045196533203, "global_step": 627796, "epoch": 7563} {"train_loss": -28.801166534423828, "global_step": 627797, "epoch": 7563} {"train_loss": -28.48884391784668, "global_step": 627798, "epoch": 7563} {"train_loss": -28.3328857421875, "global_step": 627799, "epoch": 7563} {"train_loss": -28.532602310180664, "global_step": 627800, "epoch": 7563} {"train_loss": -28.506567001342773, "global_step": 627801, "epoch": 7563} {"train_loss": -28.709918975830078, "global_step": 627802, "epoch": 7563} {"train_loss": -28.37782096862793, "global_step": 627803, "epoch": 7563} {"train_loss": -28.58955192565918, "global_step": 627804, "epoch": 7563} {"train_loss": -28.199975967407227, "global_step": 627805, "epoch": 7563} {"train_loss": -28.64387321472168, "global_step": 627806, "epoch": 7563} {"train_loss": -28.401029586791992, "global_step": 627807, "epoch": 7563} {"train_loss": -28.535308837890625, "global_step": 627808, "epoch": 7563} {"train_loss": -28.37078285217285, "global_step": 627809, "epoch": 7563} {"train_loss": -28.544055938720703, "global_step": 627810, "epoch": 7563} {"train_loss": -28.077460024730268, "global_step": 627811, "epoch": 7563, "val_loss": 6955685.0} {"train_loss": -26.80552101135254, "global_step": 627812, "epoch": 7564} {"train_loss": -26.87995719909668, "global_step": 627813, "epoch": 7564} {"train_loss": -26.601423263549805, "global_step": 627814, "epoch": 7564} {"train_loss": -27.198444366455078, "global_step": 627815, "epoch": 7564} {"train_loss": -27.699405670166016, "global_step": 627816, "epoch": 7564} {"train_loss": -27.482812881469727, "global_step": 627817, "epoch": 7564} {"train_loss": -27.838483810424805, "global_step": 627818, "epoch": 7564} {"train_loss": -27.75275230407715, "global_step": 627819, "epoch": 7564} {"train_loss": -27.257171630859375, "global_step": 627820, "epoch": 7564} {"train_loss": -27.445844650268555, "global_step": 627821, "epoch": 7564} {"train_loss": -27.79964256286621, "global_step": 627822, "epoch": 7564} {"train_loss": -27.16969108581543, "global_step": 627823, "epoch": 7564} {"train_loss": -27.905881881713867, "global_step": 627824, "epoch": 7564} {"train_loss": -27.611011505126953, "global_step": 627825, "epoch": 7564} {"train_loss": -27.578388214111328, "global_step": 627826, "epoch": 7564} {"train_loss": -27.556842803955078, "global_step": 627827, "epoch": 7564} {"train_loss": -28.027179718017578, "global_step": 627828, "epoch": 7564} {"train_loss": -28.140979766845703, "global_step": 627829, "epoch": 7564} {"train_loss": -27.931787490844727, "global_step": 627830, "epoch": 7564} {"train_loss": -28.19036293029785, "global_step": 627831, "epoch": 7564} {"train_loss": -27.95159912109375, "global_step": 627832, "epoch": 7564} {"train_loss": -27.84769630432129, "global_step": 627833, "epoch": 7564} {"train_loss": -28.124364852905273, "global_step": 627834, "epoch": 7564} {"train_loss": -27.975324630737305, "global_step": 627835, "epoch": 7564} {"train_loss": -28.286298751831055, "global_step": 627836, "epoch": 7564} {"train_loss": -27.8068904876709, "global_step": 627837, "epoch": 7564} {"train_loss": -27.90113639831543, "global_step": 627838, "epoch": 7564} {"train_loss": -28.0978946685791, "global_step": 627839, "epoch": 7564} {"train_loss": -27.719135284423828, "global_step": 627840, "epoch": 7564} {"train_loss": -27.868824005126953, "global_step": 627841, "epoch": 7564} {"train_loss": -27.89423179626465, "global_step": 627842, "epoch": 7564} {"train_loss": -27.921411514282227, "global_step": 627843, "epoch": 7564} {"train_loss": -27.7966365814209, "global_step": 627844, "epoch": 7564} {"train_loss": -28.31548500061035, "global_step": 627845, "epoch": 7564} {"train_loss": -28.03207778930664, "global_step": 627846, "epoch": 7564} {"train_loss": -27.858701705932617, "global_step": 627847, "epoch": 7564} {"train_loss": -28.027990341186523, "global_step": 627848, "epoch": 7564} {"train_loss": -28.17270278930664, "global_step": 627849, "epoch": 7564} {"train_loss": -28.264514923095703, "global_step": 627850, "epoch": 7564} {"train_loss": -28.0649356842041, "global_step": 627851, "epoch": 7564} {"train_loss": -28.333484649658203, "global_step": 627852, "epoch": 7564} {"train_loss": -28.2828311920166, "global_step": 627853, "epoch": 7564} {"train_loss": -28.010297775268555, "global_step": 627854, "epoch": 7564} {"train_loss": -27.951696395874023, "global_step": 627855, "epoch": 7564} {"train_loss": -28.18452262878418, "global_step": 627856, "epoch": 7564} {"train_loss": -28.038000106811523, "global_step": 627857, "epoch": 7564} {"train_loss": -28.4320011138916, "global_step": 627858, "epoch": 7564} {"train_loss": -28.08770179748535, "global_step": 627859, "epoch": 7564} {"train_loss": -27.848798751831055, "global_step": 627860, "epoch": 7564} {"train_loss": -28.094547271728516, "global_step": 627861, "epoch": 7564} {"train_loss": -28.03179931640625, "global_step": 627862, "epoch": 7564} {"train_loss": -28.339155197143555, "global_step": 627863, "epoch": 7564} {"train_loss": -28.001951217651367, "global_step": 627864, "epoch": 7564} {"train_loss": -28.00196647644043, "global_step": 627865, "epoch": 7564} {"train_loss": -28.058969497680664, "global_step": 627866, "epoch": 7564} {"train_loss": -28.170896530151367, "global_step": 627867, "epoch": 7564} {"train_loss": -28.59601402282715, "global_step": 627868, "epoch": 7564} {"train_loss": -28.164936065673828, "global_step": 627869, "epoch": 7564} {"train_loss": -28.036518096923828, "global_step": 627870, "epoch": 7564} {"train_loss": -28.219406127929688, "global_step": 627871, "epoch": 7564} {"train_loss": -27.93643569946289, "global_step": 627872, "epoch": 7564} {"train_loss": -28.14127540588379, "global_step": 627873, "epoch": 7564} {"train_loss": -28.455053329467773, "global_step": 627874, "epoch": 7564} {"train_loss": -27.97635841369629, "global_step": 627875, "epoch": 7564} {"train_loss": -28.07450294494629, "global_step": 627876, "epoch": 7564} {"train_loss": -28.09644889831543, "global_step": 627877, "epoch": 7564} {"train_loss": -28.146240234375, "global_step": 627878, "epoch": 7564} {"train_loss": -28.090402603149414, "global_step": 627879, "epoch": 7564} {"train_loss": -28.15247917175293, "global_step": 627880, "epoch": 7564} {"train_loss": -27.901294708251953, "global_step": 627881, "epoch": 7564} {"train_loss": -28.175867080688477, "global_step": 627882, "epoch": 7564} {"train_loss": -28.282743453979492, "global_step": 627883, "epoch": 7564} {"train_loss": -28.16657829284668, "global_step": 627884, "epoch": 7564} {"train_loss": -28.287094116210938, "global_step": 627885, "epoch": 7564} {"train_loss": -28.538633346557617, "global_step": 627886, "epoch": 7564} {"train_loss": -28.328290939331055, "global_step": 627887, "epoch": 7564} {"train_loss": -28.090530395507812, "global_step": 627888, "epoch": 7564} {"train_loss": -27.963895797729492, "global_step": 627889, "epoch": 7564} {"train_loss": -28.29195213317871, "global_step": 627890, "epoch": 7564} {"train_loss": -28.1020565032959, "global_step": 627891, "epoch": 7564} {"train_loss": -28.3908748626709, "global_step": 627892, "epoch": 7564} {"train_loss": -28.40852928161621, "global_step": 627893, "epoch": 7564} {"train_loss": -27.961809503026757, "global_step": 627894, "epoch": 7564, "val_loss": 6821489.0} {"train_loss": -27.554548263549805, "global_step": 627895, "epoch": 7565} {"train_loss": -26.807462692260742, "global_step": 627896, "epoch": 7565} {"train_loss": -27.392852783203125, "global_step": 627897, "epoch": 7565} {"train_loss": -27.7869815826416, "global_step": 627898, "epoch": 7565} {"train_loss": -27.40903663635254, "global_step": 627899, "epoch": 7565} {"train_loss": -27.245304107666016, "global_step": 627900, "epoch": 7565} {"train_loss": -27.298704147338867, "global_step": 627901, "epoch": 7565} {"train_loss": -27.79987907409668, "global_step": 627902, "epoch": 7565} {"train_loss": -27.30145835876465, "global_step": 627903, "epoch": 7565} {"train_loss": -27.482666015625, "global_step": 627904, "epoch": 7565} {"train_loss": -27.52461051940918, "global_step": 627905, "epoch": 7565} {"train_loss": -27.6416015625, "global_step": 627906, "epoch": 7565} {"train_loss": -27.397550582885742, "global_step": 627907, "epoch": 7565} {"train_loss": -27.72248649597168, "global_step": 627908, "epoch": 7565} {"train_loss": -27.850311279296875, "global_step": 627909, "epoch": 7565} {"train_loss": -28.05982780456543, "global_step": 627910, "epoch": 7565} {"train_loss": -27.779340744018555, "global_step": 627911, "epoch": 7565} {"train_loss": -27.83881950378418, "global_step": 627912, "epoch": 7565} {"train_loss": -28.0626277923584, "global_step": 627913, "epoch": 7565} {"train_loss": -27.887792587280273, "global_step": 627914, "epoch": 7565} {"train_loss": -27.780704498291016, "global_step": 627915, "epoch": 7565} {"train_loss": -27.85991859436035, "global_step": 627916, "epoch": 7565} {"train_loss": -27.230411529541016, "global_step": 627917, "epoch": 7565} {"train_loss": -27.941028594970703, "global_step": 627918, "epoch": 7565} {"train_loss": -27.94645118713379, "global_step": 627919, "epoch": 7565} {"train_loss": -27.85822105407715, "global_step": 627920, "epoch": 7565} {"train_loss": -27.802021026611328, "global_step": 627921, "epoch": 7565} {"train_loss": -27.7692813873291, "global_step": 627922, "epoch": 7565} {"train_loss": -27.749338150024414, "global_step": 627923, "epoch": 7565} {"train_loss": -27.6680908203125, "global_step": 627924, "epoch": 7565} {"train_loss": -28.138111114501953, "global_step": 627925, "epoch": 7565} {"train_loss": -28.151098251342773, "global_step": 627926, "epoch": 7565} {"train_loss": -27.628189086914062, "global_step": 627927, "epoch": 7565} {"train_loss": -28.287906646728516, "global_step": 627928, "epoch": 7565} {"train_loss": -28.439260482788086, "global_step": 627929, "epoch": 7565} {"train_loss": -28.11128807067871, "global_step": 627930, "epoch": 7565} {"train_loss": -28.325910568237305, "global_step": 627931, "epoch": 7565} {"train_loss": -27.6947078704834, "global_step": 627932, "epoch": 7565} {"train_loss": -28.389007568359375, "global_step": 627933, "epoch": 7565} {"train_loss": -27.995092391967773, "global_step": 627934, "epoch": 7565} {"train_loss": -27.98882484436035, "global_step": 627935, "epoch": 7565} {"train_loss": -28.48259925842285, "global_step": 627936, "epoch": 7565} {"train_loss": -28.65301513671875, "global_step": 627937, "epoch": 7565} {"train_loss": -28.368310928344727, "global_step": 627938, "epoch": 7565} {"train_loss": -28.347766876220703, "global_step": 627939, "epoch": 7565} {"train_loss": -28.602127075195312, "global_step": 627940, "epoch": 7565} {"train_loss": -28.479406356811523, "global_step": 627941, "epoch": 7565} {"train_loss": -28.300222396850586, "global_step": 627942, "epoch": 7565} {"train_loss": -28.174591064453125, "global_step": 627943, "epoch": 7565} {"train_loss": -28.35658073425293, "global_step": 627944, "epoch": 7565} {"train_loss": -28.249252319335938, "global_step": 627945, "epoch": 7565} {"train_loss": -28.3491268157959, "global_step": 627946, "epoch": 7565} {"train_loss": -28.450977325439453, "global_step": 627947, "epoch": 7565} {"train_loss": -28.756275177001953, "global_step": 627948, "epoch": 7565} {"train_loss": -28.104955673217773, "global_step": 627949, "epoch": 7565} {"train_loss": -28.5340518951416, "global_step": 627950, "epoch": 7565} {"train_loss": -28.56833267211914, "global_step": 627951, "epoch": 7565} {"train_loss": -28.67885398864746, "global_step": 627952, "epoch": 7565} {"train_loss": -28.3944149017334, "global_step": 627953, "epoch": 7565} {"train_loss": -28.909692764282227, "global_step": 627954, "epoch": 7565} {"train_loss": -28.33241081237793, "global_step": 627955, "epoch": 7565} {"train_loss": -28.22931480407715, "global_step": 627956, "epoch": 7565} {"train_loss": -27.96725845336914, "global_step": 627957, "epoch": 7565} {"train_loss": -27.829181671142578, "global_step": 627958, "epoch": 7565} {"train_loss": -27.97100257873535, "global_step": 627959, "epoch": 7565} {"train_loss": -27.925146102905273, "global_step": 627960, "epoch": 7565} {"train_loss": -27.99298095703125, "global_step": 627961, "epoch": 7565} {"train_loss": -27.863189697265625, "global_step": 627962, "epoch": 7565} {"train_loss": -27.714313507080078, "global_step": 627963, "epoch": 7565} {"train_loss": -27.704755783081055, "global_step": 627964, "epoch": 7565} {"train_loss": -28.421167373657227, "global_step": 627965, "epoch": 7565} {"train_loss": -27.8902645111084, "global_step": 627966, "epoch": 7565} {"train_loss": -27.815231323242188, "global_step": 627967, "epoch": 7565} {"train_loss": -28.181482315063477, "global_step": 627968, "epoch": 7565} {"train_loss": -28.10959243774414, "global_step": 627969, "epoch": 7565} {"train_loss": -28.08432388305664, "global_step": 627970, "epoch": 7565} {"train_loss": -28.13469886779785, "global_step": 627971, "epoch": 7565} {"train_loss": -28.053146362304688, "global_step": 627972, "epoch": 7565} {"train_loss": -28.1581974029541, "global_step": 627973, "epoch": 7565} {"train_loss": -27.888294219970703, "global_step": 627974, "epoch": 7565} {"train_loss": -28.346418380737305, "global_step": 627975, "epoch": 7565} {"train_loss": -28.194229125976562, "global_step": 627976, "epoch": 7565} {"train_loss": -28.00965851473521, "global_step": 627977, "epoch": 7565, "val_loss": 6799001.0} {"train_loss": -26.223546981811523, "global_step": 627978, "epoch": 7566} {"train_loss": -26.589950561523438, "global_step": 627979, "epoch": 7566} {"train_loss": -26.04827308654785, "global_step": 627980, "epoch": 7566} {"train_loss": -27.716882705688477, "global_step": 627981, "epoch": 7566} {"train_loss": -27.049915313720703, "global_step": 627982, "epoch": 7566} {"train_loss": -26.676538467407227, "global_step": 627983, "epoch": 7566} {"train_loss": -27.08086585998535, "global_step": 627984, "epoch": 7566} {"train_loss": -27.622573852539062, "global_step": 627985, "epoch": 7566} {"train_loss": -27.30940055847168, "global_step": 627986, "epoch": 7566} {"train_loss": -27.759145736694336, "global_step": 627987, "epoch": 7566} {"train_loss": -27.331085205078125, "global_step": 627988, "epoch": 7566} {"train_loss": -27.65754508972168, "global_step": 627989, "epoch": 7566} {"train_loss": -27.524250030517578, "global_step": 627990, "epoch": 7566} {"train_loss": -27.384429931640625, "global_step": 627991, "epoch": 7566} {"train_loss": -27.485977172851562, "global_step": 627992, "epoch": 7566} {"train_loss": -27.630990982055664, "global_step": 627993, "epoch": 7566} {"train_loss": -27.82069206237793, "global_step": 627994, "epoch": 7566} {"train_loss": -27.920520782470703, "global_step": 627995, "epoch": 7566} {"train_loss": -27.500574111938477, "global_step": 627996, "epoch": 7566} {"train_loss": -27.601947784423828, "global_step": 627997, "epoch": 7566} {"train_loss": -27.65475845336914, "global_step": 627998, "epoch": 7566} {"train_loss": -28.057132720947266, "global_step": 627999, "epoch": 7566} {"train_loss": -27.817169189453125, "global_step": 628000, "epoch": 7566} {"train_loss": -27.847211837768555, "global_step": 628001, "epoch": 7566} {"train_loss": -28.159927368164062, "global_step": 628002, "epoch": 7566} {"train_loss": -27.8725643157959, "global_step": 628003, "epoch": 7566} {"train_loss": -28.037860870361328, "global_step": 628004, "epoch": 7566} {"train_loss": -28.193872451782227, "global_step": 628005, "epoch": 7566} {"train_loss": -27.877227783203125, "global_step": 628006, "epoch": 7566} {"train_loss": -28.161712646484375, "global_step": 628007, "epoch": 7566} {"train_loss": -28.147729873657227, "global_step": 628008, "epoch": 7566} {"train_loss": -27.979461669921875, "global_step": 628009, "epoch": 7566} {"train_loss": -28.14449119567871, "global_step": 628010, "epoch": 7566} {"train_loss": -28.271621704101562, "global_step": 628011, "epoch": 7566} {"train_loss": -28.445051193237305, "global_step": 628012, "epoch": 7566} {"train_loss": -28.19427490234375, "global_step": 628013, "epoch": 7566} {"train_loss": -27.973560333251953, "global_step": 628014, "epoch": 7566} {"train_loss": -27.912078857421875, "global_step": 628015, "epoch": 7566} {"train_loss": -28.467676162719727, "global_step": 628016, "epoch": 7566} {"train_loss": -28.248868942260742, "global_step": 628017, "epoch": 7566} {"train_loss": -28.153350830078125, "global_step": 628018, "epoch": 7566} {"train_loss": -28.420734405517578, "global_step": 628019, "epoch": 7566} {"train_loss": -28.663366317749023, "global_step": 628020, "epoch": 7566} {"train_loss": -28.142745971679688, "global_step": 628021, "epoch": 7566} {"train_loss": -28.1683406829834, "global_step": 628022, "epoch": 7566} {"train_loss": -28.30230140686035, "global_step": 628023, "epoch": 7566} {"train_loss": -27.902862548828125, "global_step": 628024, "epoch": 7566} {"train_loss": -28.46845054626465, "global_step": 628025, "epoch": 7566} {"train_loss": -28.245389938354492, "global_step": 628026, "epoch": 7566} {"train_loss": -28.492334365844727, "global_step": 628027, "epoch": 7566} {"train_loss": -28.282535552978516, "global_step": 628028, "epoch": 7566} {"train_loss": -28.6104793548584, "global_step": 628029, "epoch": 7566} {"train_loss": -28.295373916625977, "global_step": 628030, "epoch": 7566} {"train_loss": -28.12076187133789, "global_step": 628031, "epoch": 7566} {"train_loss": -28.35117530822754, "global_step": 628032, "epoch": 7566} {"train_loss": -28.356657028198242, "global_step": 628033, "epoch": 7566} {"train_loss": -28.343597412109375, "global_step": 628034, "epoch": 7566} {"train_loss": -28.634952545166016, "global_step": 628035, "epoch": 7566} {"train_loss": -28.200897216796875, "global_step": 628036, "epoch": 7566} {"train_loss": -28.10017204284668, "global_step": 628037, "epoch": 7566} {"train_loss": -28.55425453186035, "global_step": 628038, "epoch": 7566} {"train_loss": -28.402265548706055, "global_step": 628039, "epoch": 7566} {"train_loss": -28.273609161376953, "global_step": 628040, "epoch": 7566} {"train_loss": -28.316373825073242, "global_step": 628041, "epoch": 7566} {"train_loss": -28.325841903686523, "global_step": 628042, "epoch": 7566} {"train_loss": -28.464468002319336, "global_step": 628043, "epoch": 7566} {"train_loss": -28.1054630279541, "global_step": 628044, "epoch": 7566} {"train_loss": -28.221338272094727, "global_step": 628045, "epoch": 7566} {"train_loss": -28.623294830322266, "global_step": 628046, "epoch": 7566} {"train_loss": -28.123910903930664, "global_step": 628047, "epoch": 7566} {"train_loss": -28.109655380249023, "global_step": 628048, "epoch": 7566} {"train_loss": -28.4416561126709, "global_step": 628049, "epoch": 7566} {"train_loss": -28.07806968688965, "global_step": 628050, "epoch": 7566} {"train_loss": -28.229358673095703, "global_step": 628051, "epoch": 7566} {"train_loss": -28.22055435180664, "global_step": 628052, "epoch": 7566} {"train_loss": -28.235889434814453, "global_step": 628053, "epoch": 7566} {"train_loss": -28.068836212158203, "global_step": 628054, "epoch": 7566} {"train_loss": -28.290420532226562, "global_step": 628055, "epoch": 7566} {"train_loss": -28.319263458251953, "global_step": 628056, "epoch": 7566} {"train_loss": -28.087890625, "global_step": 628057, "epoch": 7566} {"train_loss": -28.446735382080078, "global_step": 628058, "epoch": 7566} {"train_loss": -28.528390884399414, "global_step": 628059, "epoch": 7566} {"train_loss": -27.997497949255518, "global_step": 628060, "epoch": 7566, "val_loss": 6751473.0} {"train_loss": -28.190338134765625, "global_step": 628061, "epoch": 7567} {"train_loss": -27.963918685913086, "global_step": 628062, "epoch": 7567} {"train_loss": -27.743213653564453, "global_step": 628063, "epoch": 7567} {"train_loss": -27.818700790405273, "global_step": 628064, "epoch": 7567} {"train_loss": -27.96038818359375, "global_step": 628065, "epoch": 7567} {"train_loss": -27.831689834594727, "global_step": 628066, "epoch": 7567} {"train_loss": -28.323078155517578, "global_step": 628067, "epoch": 7567} {"train_loss": -27.90546989440918, "global_step": 628068, "epoch": 7567} {"train_loss": -27.580474853515625, "global_step": 628069, "epoch": 7567} {"train_loss": -28.25980567932129, "global_step": 628070, "epoch": 7567} {"train_loss": -27.620519638061523, "global_step": 628071, "epoch": 7567} {"train_loss": -27.962560653686523, "global_step": 628072, "epoch": 7567} {"train_loss": -28.0709285736084, "global_step": 628073, "epoch": 7567} {"train_loss": -28.216394424438477, "global_step": 628074, "epoch": 7567} {"train_loss": -28.310760498046875, "global_step": 628075, "epoch": 7567} {"train_loss": -27.956256866455078, "global_step": 628076, "epoch": 7567} {"train_loss": -28.140796661376953, "global_step": 628077, "epoch": 7567} {"train_loss": -28.009765625, "global_step": 628078, "epoch": 7567} {"train_loss": -28.344974517822266, "global_step": 628079, "epoch": 7567} {"train_loss": -28.277297973632812, "global_step": 628080, "epoch": 7567} {"train_loss": -28.252206802368164, "global_step": 628081, "epoch": 7567} {"train_loss": -28.38690185546875, "global_step": 628082, "epoch": 7567} {"train_loss": -27.93720054626465, "global_step": 628083, "epoch": 7567} {"train_loss": -28.361270904541016, "global_step": 628084, "epoch": 7567} {"train_loss": -28.1781005859375, "global_step": 628085, "epoch": 7567} {"train_loss": -28.215152740478516, "global_step": 628086, "epoch": 7567} {"train_loss": -28.26850700378418, "global_step": 628087, "epoch": 7567} {"train_loss": -28.44679069519043, "global_step": 628088, "epoch": 7567} {"train_loss": -27.97190284729004, "global_step": 628089, "epoch": 7567} {"train_loss": -28.556304931640625, "global_step": 628090, "epoch": 7567} {"train_loss": -28.370512008666992, "global_step": 628091, "epoch": 7567} {"train_loss": -27.753726959228516, "global_step": 628092, "epoch": 7567} {"train_loss": -28.248889923095703, "global_step": 628093, "epoch": 7567} {"train_loss": -28.063583374023438, "global_step": 628094, "epoch": 7567} {"train_loss": -28.622007369995117, "global_step": 628095, "epoch": 7567} {"train_loss": -28.492355346679688, "global_step": 628096, "epoch": 7567} {"train_loss": -28.360076904296875, "global_step": 628097, "epoch": 7567} {"train_loss": -28.289228439331055, "global_step": 628098, "epoch": 7567} {"train_loss": -27.914840698242188, "global_step": 628099, "epoch": 7567} {"train_loss": -28.117340087890625, "global_step": 628100, "epoch": 7567} {"train_loss": -28.211776733398438, "global_step": 628101, "epoch": 7567} {"train_loss": -28.28614616394043, "global_step": 628102, "epoch": 7567} {"train_loss": -27.755483627319336, "global_step": 628103, "epoch": 7567} {"train_loss": -28.19062614440918, "global_step": 628104, "epoch": 7567} {"train_loss": -28.381473541259766, "global_step": 628105, "epoch": 7567} {"train_loss": -28.239215850830078, "global_step": 628106, "epoch": 7567} {"train_loss": -28.401397705078125, "global_step": 628107, "epoch": 7567} {"train_loss": -28.206403732299805, "global_step": 628108, "epoch": 7567} {"train_loss": -28.15862464904785, "global_step": 628109, "epoch": 7567} {"train_loss": -28.63221549987793, "global_step": 628110, "epoch": 7567} {"train_loss": -28.10621452331543, "global_step": 628111, "epoch": 7567} {"train_loss": -28.445554733276367, "global_step": 628112, "epoch": 7567} {"train_loss": -28.68965721130371, "global_step": 628113, "epoch": 7567} {"train_loss": -28.164941787719727, "global_step": 628114, "epoch": 7567} {"train_loss": -28.03944206237793, "global_step": 628115, "epoch": 7567} {"train_loss": -28.040664672851562, "global_step": 628116, "epoch": 7567} {"train_loss": -28.35251235961914, "global_step": 628117, "epoch": 7567} {"train_loss": -27.8361873626709, "global_step": 628118, "epoch": 7567} {"train_loss": -27.9231014251709, "global_step": 628119, "epoch": 7567} {"train_loss": -27.619251251220703, "global_step": 628120, "epoch": 7567} {"train_loss": -28.44828224182129, "global_step": 628121, "epoch": 7567} {"train_loss": -28.279327392578125, "global_step": 628122, "epoch": 7567} {"train_loss": -28.18796157836914, "global_step": 628123, "epoch": 7567} {"train_loss": -28.237213134765625, "global_step": 628124, "epoch": 7567} {"train_loss": -28.08399772644043, "global_step": 628125, "epoch": 7567} {"train_loss": -28.309125900268555, "global_step": 628126, "epoch": 7567} {"train_loss": -28.001699447631836, "global_step": 628127, "epoch": 7567} {"train_loss": -28.149616241455078, "global_step": 628128, "epoch": 7567} {"train_loss": -28.1964054107666, "global_step": 628129, "epoch": 7567} {"train_loss": -27.883285522460938, "global_step": 628130, "epoch": 7567} {"train_loss": -28.340787887573242, "global_step": 628131, "epoch": 7567} {"train_loss": -28.323688507080078, "global_step": 628132, "epoch": 7567} {"train_loss": -28.020994186401367, "global_step": 628133, "epoch": 7567} {"train_loss": -28.255096435546875, "global_step": 628134, "epoch": 7567} {"train_loss": -28.05771255493164, "global_step": 628135, "epoch": 7567} {"train_loss": -28.271116256713867, "global_step": 628136, "epoch": 7567} {"train_loss": -28.525653839111328, "global_step": 628137, "epoch": 7567} {"train_loss": -28.479196548461914, "global_step": 628138, "epoch": 7567} {"train_loss": -28.137531280517578, "global_step": 628139, "epoch": 7567} {"train_loss": -28.173725128173828, "global_step": 628140, "epoch": 7567} {"train_loss": -28.69196891784668, "global_step": 628141, "epoch": 7567} {"train_loss": -28.129169464111328, "global_step": 628142, "epoch": 7567} {"train_loss": -28.159583470907556, "global_step": 628143, "epoch": 7567, "val_loss": 6778905.0} {"train_loss": -27.52150535583496, "global_step": 628144, "epoch": 7568} {"train_loss": -27.486047744750977, "global_step": 628145, "epoch": 7568} {"train_loss": -27.095163345336914, "global_step": 628146, "epoch": 7568} {"train_loss": -26.712238311767578, "global_step": 628147, "epoch": 7568} {"train_loss": -26.796051025390625, "global_step": 628148, "epoch": 7568} {"train_loss": -26.690683364868164, "global_step": 628149, "epoch": 7568} {"train_loss": -26.891876220703125, "global_step": 628150, "epoch": 7568} {"train_loss": -27.804752349853516, "global_step": 628151, "epoch": 7568} {"train_loss": -27.659276962280273, "global_step": 628152, "epoch": 7568} {"train_loss": -27.1444149017334, "global_step": 628153, "epoch": 7568} {"train_loss": -27.07535743713379, "global_step": 628154, "epoch": 7568} {"train_loss": -28.214874267578125, "global_step": 628155, "epoch": 7568} {"train_loss": -27.378570556640625, "global_step": 628156, "epoch": 7568} {"train_loss": -27.414331436157227, "global_step": 628157, "epoch": 7568} {"train_loss": -27.438642501831055, "global_step": 628158, "epoch": 7568} {"train_loss": -27.49873161315918, "global_step": 628159, "epoch": 7568} {"train_loss": -27.526260375976562, "global_step": 628160, "epoch": 7568} {"train_loss": -27.967329025268555, "global_step": 628161, "epoch": 7568} {"train_loss": -27.694293975830078, "global_step": 628162, "epoch": 7568} {"train_loss": -27.95334243774414, "global_step": 628163, "epoch": 7568} {"train_loss": -27.665130615234375, "global_step": 628164, "epoch": 7568} {"train_loss": -27.701231002807617, "global_step": 628165, "epoch": 7568} {"train_loss": -27.428680419921875, "global_step": 628166, "epoch": 7568} {"train_loss": -27.74250602722168, "global_step": 628167, "epoch": 7568} {"train_loss": -27.99982261657715, "global_step": 628168, "epoch": 7568} {"train_loss": -27.389057159423828, "global_step": 628169, "epoch": 7568} {"train_loss": -27.87210464477539, "global_step": 628170, "epoch": 7568} {"train_loss": -28.01094627380371, "global_step": 628171, "epoch": 7568} {"train_loss": -27.92188835144043, "global_step": 628172, "epoch": 7568} {"train_loss": -27.999408721923828, "global_step": 628173, "epoch": 7568} {"train_loss": -28.119861602783203, "global_step": 628174, "epoch": 7568} {"train_loss": -27.919660568237305, "global_step": 628175, "epoch": 7568} {"train_loss": -27.955270767211914, "global_step": 628176, "epoch": 7568} {"train_loss": -27.933149337768555, "global_step": 628177, "epoch": 7568} {"train_loss": -28.263769149780273, "global_step": 628178, "epoch": 7568} {"train_loss": -27.853839874267578, "global_step": 628179, "epoch": 7568} {"train_loss": -27.944318771362305, "global_step": 628180, "epoch": 7568} {"train_loss": -28.1229248046875, "global_step": 628181, "epoch": 7568} {"train_loss": -27.94587516784668, "global_step": 628182, "epoch": 7568} {"train_loss": -27.783605575561523, "global_step": 628183, "epoch": 7568} {"train_loss": -27.986419677734375, "global_step": 628184, "epoch": 7568} {"train_loss": -27.869287490844727, "global_step": 628185, "epoch": 7568} {"train_loss": -28.0639705657959, "global_step": 628186, "epoch": 7568} {"train_loss": -28.04619789123535, "global_step": 628187, "epoch": 7568} {"train_loss": -28.495025634765625, "global_step": 628188, "epoch": 7568} {"train_loss": -28.09588050842285, "global_step": 628189, "epoch": 7568} {"train_loss": -28.377676010131836, "global_step": 628190, "epoch": 7568} {"train_loss": -28.116418838500977, "global_step": 628191, "epoch": 7568} {"train_loss": -28.4283390045166, "global_step": 628192, "epoch": 7568} {"train_loss": -28.35438346862793, "global_step": 628193, "epoch": 7568} {"train_loss": -28.173871994018555, "global_step": 628194, "epoch": 7568} {"train_loss": -28.218900680541992, "global_step": 628195, "epoch": 7568} {"train_loss": -28.203466415405273, "global_step": 628196, "epoch": 7568} {"train_loss": -28.159378051757812, "global_step": 628197, "epoch": 7568} {"train_loss": -28.51934814453125, "global_step": 628198, "epoch": 7568} {"train_loss": -28.261524200439453, "global_step": 628199, "epoch": 7568} {"train_loss": -28.204071044921875, "global_step": 628200, "epoch": 7568} {"train_loss": -27.923795700073242, "global_step": 628201, "epoch": 7568} {"train_loss": -27.807336807250977, "global_step": 628202, "epoch": 7568} {"train_loss": -27.773639678955078, "global_step": 628203, "epoch": 7568} {"train_loss": -28.286762237548828, "global_step": 628204, "epoch": 7568} {"train_loss": -28.288015365600586, "global_step": 628205, "epoch": 7568} {"train_loss": -28.246627807617188, "global_step": 628206, "epoch": 7568} {"train_loss": -28.541330337524414, "global_step": 628207, "epoch": 7568} {"train_loss": -28.313562393188477, "global_step": 628208, "epoch": 7568} {"train_loss": -27.962005615234375, "global_step": 628209, "epoch": 7568} {"train_loss": -28.2711238861084, "global_step": 628210, "epoch": 7568} {"train_loss": -28.236297607421875, "global_step": 628211, "epoch": 7568} {"train_loss": -28.617816925048828, "global_step": 628212, "epoch": 7568} {"train_loss": -28.379974365234375, "global_step": 628213, "epoch": 7568} {"train_loss": -27.91669273376465, "global_step": 628214, "epoch": 7568} {"train_loss": -28.068017959594727, "global_step": 628215, "epoch": 7568} {"train_loss": -27.91607666015625, "global_step": 628216, "epoch": 7568} {"train_loss": -27.85914421081543, "global_step": 628217, "epoch": 7568} {"train_loss": -28.072534561157227, "global_step": 628218, "epoch": 7568} {"train_loss": -28.060943603515625, "global_step": 628219, "epoch": 7568} {"train_loss": -28.33367347717285, "global_step": 628220, "epoch": 7568} {"train_loss": -27.812997817993164, "global_step": 628221, "epoch": 7568} {"train_loss": -28.275531768798828, "global_step": 628222, "epoch": 7568} {"train_loss": -27.962717056274414, "global_step": 628223, "epoch": 7568} {"train_loss": -28.276697158813477, "global_step": 628224, "epoch": 7568} {"train_loss": -28.32663917541504, "global_step": 628225, "epoch": 7568} {"train_loss": -27.9132005622588, "global_step": 628226, "epoch": 7568, "val_loss": 6819155.5} {"train_loss": -27.62886619567871, "global_step": 628227, "epoch": 7569} {"train_loss": -27.407087326049805, "global_step": 628228, "epoch": 7569} {"train_loss": -27.817611694335938, "global_step": 628229, "epoch": 7569} {"train_loss": -27.2147274017334, "global_step": 628230, "epoch": 7569} {"train_loss": -27.63496208190918, "global_step": 628231, "epoch": 7569} {"train_loss": -27.919147491455078, "global_step": 628232, "epoch": 7569} {"train_loss": -27.422199249267578, "global_step": 628233, "epoch": 7569} {"train_loss": -27.528915405273438, "global_step": 628234, "epoch": 7569} {"train_loss": -27.57195472717285, "global_step": 628235, "epoch": 7569} {"train_loss": -27.563922882080078, "global_step": 628236, "epoch": 7569} {"train_loss": -27.171804428100586, "global_step": 628237, "epoch": 7569} {"train_loss": -27.303857803344727, "global_step": 628238, "epoch": 7569} {"train_loss": -27.933612823486328, "global_step": 628239, "epoch": 7569} {"train_loss": -27.510934829711914, "global_step": 628240, "epoch": 7569} {"train_loss": -27.783254623413086, "global_step": 628241, "epoch": 7569} {"train_loss": -27.600812911987305, "global_step": 628242, "epoch": 7569} {"train_loss": -27.612823486328125, "global_step": 628243, "epoch": 7569} {"train_loss": -27.581085205078125, "global_step": 628244, "epoch": 7569} {"train_loss": -27.514698028564453, "global_step": 628245, "epoch": 7569} {"train_loss": -28.140623092651367, "global_step": 628246, "epoch": 7569} {"train_loss": -27.29534912109375, "global_step": 628247, "epoch": 7569} {"train_loss": -27.419708251953125, "global_step": 628248, "epoch": 7569} {"train_loss": -27.74051856994629, "global_step": 628249, "epoch": 7569} {"train_loss": -27.890045166015625, "global_step": 628250, "epoch": 7569} {"train_loss": -27.52045249938965, "global_step": 628251, "epoch": 7569} {"train_loss": -27.938434600830078, "global_step": 628252, "epoch": 7569} {"train_loss": -28.035863876342773, "global_step": 628253, "epoch": 7569} {"train_loss": -27.841848373413086, "global_step": 628254, "epoch": 7569} {"train_loss": -27.8443603515625, "global_step": 628255, "epoch": 7569} {"train_loss": -27.72830581665039, "global_step": 628256, "epoch": 7569} {"train_loss": -27.837635040283203, "global_step": 628257, "epoch": 7569} {"train_loss": -27.80643653869629, "global_step": 628258, "epoch": 7569} {"train_loss": -28.1954288482666, "global_step": 628259, "epoch": 7569} {"train_loss": -28.052892684936523, "global_step": 628260, "epoch": 7569} {"train_loss": -28.038244247436523, "global_step": 628261, "epoch": 7569} {"train_loss": -27.846546173095703, "global_step": 628262, "epoch": 7569} {"train_loss": -28.172964096069336, "global_step": 628263, "epoch": 7569} {"train_loss": -27.621606826782227, "global_step": 628264, "epoch": 7569} {"train_loss": -28.494476318359375, "global_step": 628265, "epoch": 7569} {"train_loss": -28.407079696655273, "global_step": 628266, "epoch": 7569} {"train_loss": -28.11899185180664, "global_step": 628267, "epoch": 7569} {"train_loss": -28.28570556640625, "global_step": 628268, "epoch": 7569} {"train_loss": -28.212894439697266, "global_step": 628269, "epoch": 7569} {"train_loss": -28.353473663330078, "global_step": 628270, "epoch": 7569} {"train_loss": -28.158044815063477, "global_step": 628271, "epoch": 7569} {"train_loss": -28.219898223876953, "global_step": 628272, "epoch": 7569} {"train_loss": -28.410388946533203, "global_step": 628273, "epoch": 7569} {"train_loss": -28.73529052734375, "global_step": 628274, "epoch": 7569} {"train_loss": -27.994522094726562, "global_step": 628275, "epoch": 7569} {"train_loss": -28.6036376953125, "global_step": 628276, "epoch": 7569} {"train_loss": -28.604333877563477, "global_step": 628277, "epoch": 7569} {"train_loss": -28.52662467956543, "global_step": 628278, "epoch": 7569} {"train_loss": -28.2816104888916, "global_step": 628279, "epoch": 7569} {"train_loss": -28.672941207885742, "global_step": 628280, "epoch": 7569} {"train_loss": -28.278722763061523, "global_step": 628281, "epoch": 7569} {"train_loss": -28.4467830657959, "global_step": 628282, "epoch": 7569} {"train_loss": -28.29127311706543, "global_step": 628283, "epoch": 7569} {"train_loss": -28.515588760375977, "global_step": 628284, "epoch": 7569} {"train_loss": -28.768997192382812, "global_step": 628285, "epoch": 7569} {"train_loss": -28.758228302001953, "global_step": 628286, "epoch": 7569} {"train_loss": -28.555692672729492, "global_step": 628287, "epoch": 7569} {"train_loss": -28.766132354736328, "global_step": 628288, "epoch": 7569} {"train_loss": -28.384519577026367, "global_step": 628289, "epoch": 7569} {"train_loss": -28.30055809020996, "global_step": 628290, "epoch": 7569} {"train_loss": -28.65144157409668, "global_step": 628291, "epoch": 7569} {"train_loss": -27.924087524414062, "global_step": 628292, "epoch": 7569} {"train_loss": -27.809350967407227, "global_step": 628293, "epoch": 7569} {"train_loss": -27.042499542236328, "global_step": 628294, "epoch": 7569} {"train_loss": -26.454660415649414, "global_step": 628295, "epoch": 7569} {"train_loss": -26.59518814086914, "global_step": 628296, "epoch": 7569} {"train_loss": -27.0504093170166, "global_step": 628297, "epoch": 7569} {"train_loss": -27.640146255493164, "global_step": 628298, "epoch": 7569} {"train_loss": -28.132537841796875, "global_step": 628299, "epoch": 7569} {"train_loss": -28.201757431030273, "global_step": 628300, "epoch": 7569} {"train_loss": -28.1590633392334, "global_step": 628301, "epoch": 7569} {"train_loss": -28.068323135375977, "global_step": 628302, "epoch": 7569} {"train_loss": -28.256803512573242, "global_step": 628303, "epoch": 7569} {"train_loss": -28.197622299194336, "global_step": 628304, "epoch": 7569} {"train_loss": -28.142953872680664, "global_step": 628305, "epoch": 7569} {"train_loss": -27.899219512939453, "global_step": 628306, "epoch": 7569} {"train_loss": -28.37650489807129, "global_step": 628307, "epoch": 7569} {"train_loss": -27.855087280273438, "global_step": 628308, "epoch": 7569} {"train_loss": -27.938230054924286, "global_step": 628309, "epoch": 7569, "val_loss": 6768667.0} {"train_loss": -27.939176559448242, "global_step": 628310, "epoch": 7570} {"train_loss": -27.987104415893555, "global_step": 628311, "epoch": 7570} {"train_loss": -27.57242202758789, "global_step": 628312, "epoch": 7570} {"train_loss": -28.077192306518555, "global_step": 628313, "epoch": 7570} {"train_loss": -27.897775650024414, "global_step": 628314, "epoch": 7570} {"train_loss": -27.58890724182129, "global_step": 628315, "epoch": 7570} {"train_loss": -27.99332046508789, "global_step": 628316, "epoch": 7570} {"train_loss": -27.75640296936035, "global_step": 628317, "epoch": 7570} {"train_loss": -28.024450302124023, "global_step": 628318, "epoch": 7570} {"train_loss": -28.176244735717773, "global_step": 628319, "epoch": 7570} {"train_loss": -27.735198974609375, "global_step": 628320, "epoch": 7570} {"train_loss": -28.123279571533203, "global_step": 628321, "epoch": 7570} {"train_loss": -27.764801025390625, "global_step": 628322, "epoch": 7570} {"train_loss": -27.8775691986084, "global_step": 628323, "epoch": 7570} {"train_loss": -27.933332443237305, "global_step": 628324, "epoch": 7570} {"train_loss": -27.705835342407227, "global_step": 628325, "epoch": 7570} {"train_loss": -27.697540283203125, "global_step": 628326, "epoch": 7570} {"train_loss": -28.143604278564453, "global_step": 628327, "epoch": 7570} {"train_loss": -28.110122680664062, "global_step": 628328, "epoch": 7570} {"train_loss": -28.22391700744629, "global_step": 628329, "epoch": 7570} {"train_loss": -27.680627822875977, "global_step": 628330, "epoch": 7570} {"train_loss": -28.063648223876953, "global_step": 628331, "epoch": 7570} {"train_loss": -28.189258575439453, "global_step": 628332, "epoch": 7570} {"train_loss": -28.527185440063477, "global_step": 628333, "epoch": 7570} {"train_loss": -28.12809181213379, "global_step": 628334, "epoch": 7570} {"train_loss": -28.11726188659668, "global_step": 628335, "epoch": 7570} {"train_loss": -28.060632705688477, "global_step": 628336, "epoch": 7570} {"train_loss": -28.175113677978516, "global_step": 628337, "epoch": 7570} {"train_loss": -28.233673095703125, "global_step": 628338, "epoch": 7570} {"train_loss": -27.829797744750977, "global_step": 628339, "epoch": 7570} {"train_loss": -28.094253540039062, "global_step": 628340, "epoch": 7570} {"train_loss": -28.0725040435791, "global_step": 628341, "epoch": 7570} {"train_loss": -28.1883487701416, "global_step": 628342, "epoch": 7570} {"train_loss": -28.294591903686523, "global_step": 628343, "epoch": 7570} {"train_loss": -28.294225692749023, "global_step": 628344, "epoch": 7570} {"train_loss": -28.062246322631836, "global_step": 628345, "epoch": 7570} {"train_loss": -28.179126739501953, "global_step": 628346, "epoch": 7570} {"train_loss": -28.099079132080078, "global_step": 628347, "epoch": 7570} {"train_loss": -28.552555084228516, "global_step": 628348, "epoch": 7570} {"train_loss": -28.432199478149414, "global_step": 628349, "epoch": 7570} {"train_loss": -28.36649513244629, "global_step": 628350, "epoch": 7570} {"train_loss": -28.02219581604004, "global_step": 628351, "epoch": 7570} {"train_loss": -28.234745025634766, "global_step": 628352, "epoch": 7570} {"train_loss": -28.2791690826416, "global_step": 628353, "epoch": 7570} {"train_loss": -28.26555824279785, "global_step": 628354, "epoch": 7570} {"train_loss": -28.207258224487305, "global_step": 628355, "epoch": 7570} {"train_loss": -28.4663028717041, "global_step": 628356, "epoch": 7570} {"train_loss": -28.45682144165039, "global_step": 628357, "epoch": 7570} {"train_loss": -28.58782958984375, "global_step": 628358, "epoch": 7570} {"train_loss": -28.425785064697266, "global_step": 628359, "epoch": 7570} {"train_loss": -28.046300888061523, "global_step": 628360, "epoch": 7570} {"train_loss": -28.379379272460938, "global_step": 628361, "epoch": 7570} {"train_loss": -28.135894775390625, "global_step": 628362, "epoch": 7570} {"train_loss": -27.455352783203125, "global_step": 628363, "epoch": 7570} {"train_loss": -27.566797256469727, "global_step": 628364, "epoch": 7570} {"train_loss": -27.69866943359375, "global_step": 628365, "epoch": 7570} {"train_loss": -27.7111873626709, "global_step": 628366, "epoch": 7570} {"train_loss": -27.44672203063965, "global_step": 628367, "epoch": 7570} {"train_loss": -27.732501983642578, "global_step": 628368, "epoch": 7570} {"train_loss": -28.346643447875977, "global_step": 628369, "epoch": 7570} {"train_loss": -27.48072624206543, "global_step": 628370, "epoch": 7570} {"train_loss": -28.079349517822266, "global_step": 628371, "epoch": 7570} {"train_loss": -27.990238189697266, "global_step": 628372, "epoch": 7570} {"train_loss": -27.97052001953125, "global_step": 628373, "epoch": 7570} {"train_loss": -27.84563636779785, "global_step": 628374, "epoch": 7570} {"train_loss": -28.2255916595459, "global_step": 628375, "epoch": 7570} {"train_loss": -28.33314323425293, "global_step": 628376, "epoch": 7570} {"train_loss": -28.05747413635254, "global_step": 628377, "epoch": 7570} {"train_loss": -28.026762008666992, "global_step": 628378, "epoch": 7570} {"train_loss": -28.58673095703125, "global_step": 628379, "epoch": 7570} {"train_loss": -27.827665328979492, "global_step": 628380, "epoch": 7570} {"train_loss": -27.935606002807617, "global_step": 628381, "epoch": 7570} {"train_loss": -27.93756103515625, "global_step": 628382, "epoch": 7570} {"train_loss": -28.2027530670166, "global_step": 628383, "epoch": 7570} {"train_loss": -28.119491577148438, "global_step": 628384, "epoch": 7570} {"train_loss": -28.328433990478516, "global_step": 628385, "epoch": 7570} {"train_loss": -27.871551513671875, "global_step": 628386, "epoch": 7570} {"train_loss": -28.194189071655273, "global_step": 628387, "epoch": 7570} {"train_loss": -28.112319946289062, "global_step": 628388, "epoch": 7570} {"train_loss": -28.2510929107666, "global_step": 628389, "epoch": 7570} {"train_loss": -28.022809982299805, "global_step": 628390, "epoch": 7570} {"train_loss": -28.361328125, "global_step": 628391, "epoch": 7570} {"train_loss": -28.058200606380602, "global_step": 628392, "epoch": 7570, "val_loss": 6772918.0} {"train_loss": -27.26202964782715, "global_step": 628393, "epoch": 7571} {"train_loss": -27.115020751953125, "global_step": 628394, "epoch": 7571} {"train_loss": -27.029556274414062, "global_step": 628395, "epoch": 7571} {"train_loss": -27.336023330688477, "global_step": 628396, "epoch": 7571} {"train_loss": -27.34381103515625, "global_step": 628397, "epoch": 7571} {"train_loss": -26.62710952758789, "global_step": 628398, "epoch": 7571} {"train_loss": -27.81804847717285, "global_step": 628399, "epoch": 7571} {"train_loss": -27.0582332611084, "global_step": 628400, "epoch": 7571} {"train_loss": -27.202991485595703, "global_step": 628401, "epoch": 7571} {"train_loss": -27.236663818359375, "global_step": 628402, "epoch": 7571} {"train_loss": -27.454675674438477, "global_step": 628403, "epoch": 7571} {"train_loss": -27.60066795349121, "global_step": 628404, "epoch": 7571} {"train_loss": -27.42311668395996, "global_step": 628405, "epoch": 7571} {"train_loss": -27.655231475830078, "global_step": 628406, "epoch": 7571} {"train_loss": -27.626920700073242, "global_step": 628407, "epoch": 7571} {"train_loss": -27.61439323425293, "global_step": 628408, "epoch": 7571} {"train_loss": -27.367919921875, "global_step": 628409, "epoch": 7571} {"train_loss": -27.322330474853516, "global_step": 628410, "epoch": 7571} {"train_loss": -27.79315185546875, "global_step": 628411, "epoch": 7571} {"train_loss": -27.741796493530273, "global_step": 628412, "epoch": 7571} {"train_loss": -27.28399085998535, "global_step": 628413, "epoch": 7571} {"train_loss": -27.61090087890625, "global_step": 628414, "epoch": 7571} {"train_loss": -27.83837890625, "global_step": 628415, "epoch": 7571} {"train_loss": -27.813949584960938, "global_step": 628416, "epoch": 7571} {"train_loss": -27.737882614135742, "global_step": 628417, "epoch": 7571} {"train_loss": -28.088428497314453, "global_step": 628418, "epoch": 7571} {"train_loss": -27.585529327392578, "global_step": 628419, "epoch": 7571} {"train_loss": -28.060083389282227, "global_step": 628420, "epoch": 7571} {"train_loss": -27.66427993774414, "global_step": 628421, "epoch": 7571} {"train_loss": -27.963788986206055, "global_step": 628422, "epoch": 7571} {"train_loss": -28.064741134643555, "global_step": 628423, "epoch": 7571} {"train_loss": -27.94622802734375, "global_step": 628424, "epoch": 7571} {"train_loss": -28.145185470581055, "global_step": 628425, "epoch": 7571} {"train_loss": -28.186767578125, "global_step": 628426, "epoch": 7571} {"train_loss": -27.6518611907959, "global_step": 628427, "epoch": 7571} {"train_loss": -28.33902359008789, "global_step": 628428, "epoch": 7571} {"train_loss": -27.987695693969727, "global_step": 628429, "epoch": 7571} {"train_loss": -28.183019638061523, "global_step": 628430, "epoch": 7571} {"train_loss": -28.078205108642578, "global_step": 628431, "epoch": 7571} {"train_loss": -28.28021240234375, "global_step": 628432, "epoch": 7571} {"train_loss": -28.311172485351562, "global_step": 628433, "epoch": 7571} {"train_loss": -27.83465003967285, "global_step": 628434, "epoch": 7571} {"train_loss": -28.417499542236328, "global_step": 628435, "epoch": 7571} {"train_loss": -28.32793617248535, "global_step": 628436, "epoch": 7571} {"train_loss": -28.265491485595703, "global_step": 628437, "epoch": 7571} {"train_loss": -28.284948348999023, "global_step": 628438, "epoch": 7571} {"train_loss": -28.032272338867188, "global_step": 628439, "epoch": 7571} {"train_loss": -28.00029945373535, "global_step": 628440, "epoch": 7571} {"train_loss": -27.826435089111328, "global_step": 628441, "epoch": 7571} {"train_loss": -28.0229549407959, "global_step": 628442, "epoch": 7571} {"train_loss": -28.419864654541016, "global_step": 628443, "epoch": 7571} {"train_loss": -28.30402946472168, "global_step": 628444, "epoch": 7571} {"train_loss": -28.153547286987305, "global_step": 628445, "epoch": 7571} {"train_loss": -27.800098419189453, "global_step": 628446, "epoch": 7571} {"train_loss": -27.935937881469727, "global_step": 628447, "epoch": 7571} {"train_loss": -28.459503173828125, "global_step": 628448, "epoch": 7571} {"train_loss": -28.458585739135742, "global_step": 628449, "epoch": 7571} {"train_loss": -28.11533546447754, "global_step": 628450, "epoch": 7571} {"train_loss": -28.232351303100586, "global_step": 628451, "epoch": 7571} {"train_loss": -28.39509391784668, "global_step": 628452, "epoch": 7571} {"train_loss": -28.581480026245117, "global_step": 628453, "epoch": 7571} {"train_loss": -28.100055694580078, "global_step": 628454, "epoch": 7571} {"train_loss": -27.991363525390625, "global_step": 628455, "epoch": 7571} {"train_loss": -28.174732208251953, "global_step": 628456, "epoch": 7571} {"train_loss": -28.179595947265625, "global_step": 628457, "epoch": 7571} {"train_loss": -28.375625610351562, "global_step": 628458, "epoch": 7571} {"train_loss": -28.085712432861328, "global_step": 628459, "epoch": 7571} {"train_loss": -28.196460723876953, "global_step": 628460, "epoch": 7571} {"train_loss": -28.153167724609375, "global_step": 628461, "epoch": 7571} {"train_loss": -28.24212074279785, "global_step": 628462, "epoch": 7571} {"train_loss": -28.05561637878418, "global_step": 628463, "epoch": 7571} {"train_loss": -27.875131607055664, "global_step": 628464, "epoch": 7571} {"train_loss": -28.46964454650879, "global_step": 628465, "epoch": 7571} {"train_loss": -28.290979385375977, "global_step": 628466, "epoch": 7571} {"train_loss": -28.1751766204834, "global_step": 628467, "epoch": 7571} {"train_loss": -28.47747230529785, "global_step": 628468, "epoch": 7571} {"train_loss": -28.115217208862305, "global_step": 628469, "epoch": 7571} {"train_loss": -28.112701416015625, "global_step": 628470, "epoch": 7571} {"train_loss": -27.66983413696289, "global_step": 628471, "epoch": 7571} {"train_loss": -28.320615768432617, "global_step": 628472, "epoch": 7571} {"train_loss": -28.30966567993164, "global_step": 628473, "epoch": 7571} {"train_loss": -28.429662704467773, "global_step": 628474, "epoch": 7571} {"train_loss": -27.94113409662821, "global_step": 628475, "epoch": 7571, "val_loss": 6715683.0} {"train_loss": -27.59846305847168, "global_step": 628476, "epoch": 7572} {"train_loss": -27.155609130859375, "global_step": 628477, "epoch": 7572} {"train_loss": -27.524091720581055, "global_step": 628478, "epoch": 7572} {"train_loss": -27.87029457092285, "global_step": 628479, "epoch": 7572} {"train_loss": -27.70741081237793, "global_step": 628480, "epoch": 7572} {"train_loss": -27.496450424194336, "global_step": 628481, "epoch": 7572} {"train_loss": -27.738739013671875, "global_step": 628482, "epoch": 7572} {"train_loss": -27.929182052612305, "global_step": 628483, "epoch": 7572} {"train_loss": -28.02414321899414, "global_step": 628484, "epoch": 7572} {"train_loss": -27.75868034362793, "global_step": 628485, "epoch": 7572} {"train_loss": -28.02191734313965, "global_step": 628486, "epoch": 7572} {"train_loss": -27.8695068359375, "global_step": 628487, "epoch": 7572} {"train_loss": -28.074264526367188, "global_step": 628488, "epoch": 7572} {"train_loss": -27.79022216796875, "global_step": 628489, "epoch": 7572} {"train_loss": -28.228424072265625, "global_step": 628490, "epoch": 7572} {"train_loss": -28.166400909423828, "global_step": 628491, "epoch": 7572} {"train_loss": -28.070905685424805, "global_step": 628492, "epoch": 7572} {"train_loss": -28.325225830078125, "global_step": 628493, "epoch": 7572} {"train_loss": -28.36834144592285, "global_step": 628494, "epoch": 7572} {"train_loss": -28.159448623657227, "global_step": 628495, "epoch": 7572} {"train_loss": -27.987024307250977, "global_step": 628496, "epoch": 7572} {"train_loss": -28.207422256469727, "global_step": 628497, "epoch": 7572} {"train_loss": -28.336374282836914, "global_step": 628498, "epoch": 7572} {"train_loss": -28.29121971130371, "global_step": 628499, "epoch": 7572} {"train_loss": -28.284936904907227, "global_step": 628500, "epoch": 7572} {"train_loss": -28.20515251159668, "global_step": 628501, "epoch": 7572} {"train_loss": -28.26031494140625, "global_step": 628502, "epoch": 7572} {"train_loss": -28.37982749938965, "global_step": 628503, "epoch": 7572} {"train_loss": -28.404470443725586, "global_step": 628504, "epoch": 7572} {"train_loss": -28.068206787109375, "global_step": 628505, "epoch": 7572} {"train_loss": -28.250925064086914, "global_step": 628506, "epoch": 7572} {"train_loss": -28.40546989440918, "global_step": 628507, "epoch": 7572} {"train_loss": -28.35651969909668, "global_step": 628508, "epoch": 7572} {"train_loss": -28.155288696289062, "global_step": 628509, "epoch": 7572} {"train_loss": -28.30769920349121, "global_step": 628510, "epoch": 7572} {"train_loss": -28.293333053588867, "global_step": 628511, "epoch": 7572} {"train_loss": -28.62711524963379, "global_step": 628512, "epoch": 7572} {"train_loss": -28.10120964050293, "global_step": 628513, "epoch": 7572} {"train_loss": -28.32562828063965, "global_step": 628514, "epoch": 7572} {"train_loss": -28.027536392211914, "global_step": 628515, "epoch": 7572} {"train_loss": -28.037841796875, "global_step": 628516, "epoch": 7572} {"train_loss": -28.388391494750977, "global_step": 628517, "epoch": 7572} {"train_loss": -28.299108505249023, "global_step": 628518, "epoch": 7572} {"train_loss": -27.84779167175293, "global_step": 628519, "epoch": 7572} {"train_loss": -28.317224502563477, "global_step": 628520, "epoch": 7572} {"train_loss": -27.908843994140625, "global_step": 628521, "epoch": 7572} {"train_loss": -28.338134765625, "global_step": 628522, "epoch": 7572} {"train_loss": -28.335845947265625, "global_step": 628523, "epoch": 7572} {"train_loss": -28.099578857421875, "global_step": 628524, "epoch": 7572} {"train_loss": -28.055389404296875, "global_step": 628525, "epoch": 7572} {"train_loss": -28.243051528930664, "global_step": 628526, "epoch": 7572} {"train_loss": -28.29172134399414, "global_step": 628527, "epoch": 7572} {"train_loss": -28.3691349029541, "global_step": 628528, "epoch": 7572} {"train_loss": -28.117895126342773, "global_step": 628529, "epoch": 7572} {"train_loss": -28.636701583862305, "global_step": 628530, "epoch": 7572} {"train_loss": -27.50251579284668, "global_step": 628531, "epoch": 7572} {"train_loss": -27.744836807250977, "global_step": 628532, "epoch": 7572} {"train_loss": -27.737930297851562, "global_step": 628533, "epoch": 7572} {"train_loss": -27.829147338867188, "global_step": 628534, "epoch": 7572} {"train_loss": -28.344104766845703, "global_step": 628535, "epoch": 7572} {"train_loss": -28.046384811401367, "global_step": 628536, "epoch": 7572} {"train_loss": -27.9337158203125, "global_step": 628537, "epoch": 7572} {"train_loss": -27.915273666381836, "global_step": 628538, "epoch": 7572} {"train_loss": -28.339330673217773, "global_step": 628539, "epoch": 7572} {"train_loss": -28.23833656311035, "global_step": 628540, "epoch": 7572} {"train_loss": -27.9000244140625, "global_step": 628541, "epoch": 7572} {"train_loss": -27.71368980407715, "global_step": 628542, "epoch": 7572} {"train_loss": -28.084339141845703, "global_step": 628543, "epoch": 7572} {"train_loss": -28.118188858032227, "global_step": 628544, "epoch": 7572} {"train_loss": -28.163366317749023, "global_step": 628545, "epoch": 7572} {"train_loss": -28.197717666625977, "global_step": 628546, "epoch": 7572} {"train_loss": -28.15533447265625, "global_step": 628547, "epoch": 7572} {"train_loss": -28.166828155517578, "global_step": 628548, "epoch": 7572} {"train_loss": -28.230976104736328, "global_step": 628549, "epoch": 7572} {"train_loss": -27.826093673706055, "global_step": 628550, "epoch": 7572} {"train_loss": -27.8446044921875, "global_step": 628551, "epoch": 7572} {"train_loss": -28.322845458984375, "global_step": 628552, "epoch": 7572} {"train_loss": -28.436246871948242, "global_step": 628553, "epoch": 7572} {"train_loss": -27.934972763061523, "global_step": 628554, "epoch": 7572} {"train_loss": -28.162540435791016, "global_step": 628555, "epoch": 7572} {"train_loss": -28.515018463134766, "global_step": 628556, "epoch": 7572} {"train_loss": -27.933935165405273, "global_step": 628557, "epoch": 7572} {"train_loss": -28.101400053644756, "global_step": 628558, "epoch": 7572, "val_loss": 6762103.0} {"train_loss": -28.103397369384766, "global_step": 628559, "epoch": 7573} {"train_loss": -27.61969566345215, "global_step": 628560, "epoch": 7573} {"train_loss": -27.77656364440918, "global_step": 628561, "epoch": 7573} {"train_loss": -27.559141159057617, "global_step": 628562, "epoch": 7573} {"train_loss": -28.0399112701416, "global_step": 628563, "epoch": 7573} {"train_loss": -27.6453914642334, "global_step": 628564, "epoch": 7573} {"train_loss": -27.066253662109375, "global_step": 628565, "epoch": 7573} {"train_loss": -27.998748779296875, "global_step": 628566, "epoch": 7573} {"train_loss": -27.7037410736084, "global_step": 628567, "epoch": 7573} {"train_loss": -27.937829971313477, "global_step": 628568, "epoch": 7573} {"train_loss": -27.595300674438477, "global_step": 628569, "epoch": 7573} {"train_loss": -27.76226806640625, "global_step": 628570, "epoch": 7573} {"train_loss": -27.78010368347168, "global_step": 628571, "epoch": 7573} {"train_loss": -27.72027015686035, "global_step": 628572, "epoch": 7573} {"train_loss": -27.73821449279785, "global_step": 628573, "epoch": 7573} {"train_loss": -28.16122817993164, "global_step": 628574, "epoch": 7573} {"train_loss": -27.60062599182129, "global_step": 628575, "epoch": 7573} {"train_loss": -27.854705810546875, "global_step": 628576, "epoch": 7573} {"train_loss": -27.789047241210938, "global_step": 628577, "epoch": 7573} {"train_loss": -28.088876724243164, "global_step": 628578, "epoch": 7573} {"train_loss": -28.06914710998535, "global_step": 628579, "epoch": 7573} {"train_loss": -27.28803825378418, "global_step": 628580, "epoch": 7573} {"train_loss": -27.199995040893555, "global_step": 628581, "epoch": 7573} {"train_loss": -27.88490104675293, "global_step": 628582, "epoch": 7573} {"train_loss": -28.119070053100586, "global_step": 628583, "epoch": 7573} {"train_loss": -27.530790328979492, "global_step": 628584, "epoch": 7573} {"train_loss": -27.485275268554688, "global_step": 628585, "epoch": 7573} {"train_loss": -28.14005470275879, "global_step": 628586, "epoch": 7573} {"train_loss": -27.881505966186523, "global_step": 628587, "epoch": 7573} {"train_loss": -28.178817749023438, "global_step": 628588, "epoch": 7573} {"train_loss": -28.259641647338867, "global_step": 628589, "epoch": 7573} {"train_loss": -27.48476219177246, "global_step": 628590, "epoch": 7573} {"train_loss": -28.071887969970703, "global_step": 628591, "epoch": 7573} {"train_loss": -27.420324325561523, "global_step": 628592, "epoch": 7573} {"train_loss": -28.057621002197266, "global_step": 628593, "epoch": 7573} {"train_loss": -28.10938835144043, "global_step": 628594, "epoch": 7573} {"train_loss": -28.006500244140625, "global_step": 628595, "epoch": 7573} {"train_loss": -27.858509063720703, "global_step": 628596, "epoch": 7573} {"train_loss": -28.1263370513916, "global_step": 628597, "epoch": 7573} {"train_loss": -27.766035079956055, "global_step": 628598, "epoch": 7573} {"train_loss": -27.793170928955078, "global_step": 628599, "epoch": 7573} {"train_loss": -28.224756240844727, "global_step": 628600, "epoch": 7573} {"train_loss": -28.21710777282715, "global_step": 628601, "epoch": 7573} {"train_loss": -28.21845054626465, "global_step": 628602, "epoch": 7573} {"train_loss": -27.943952560424805, "global_step": 628603, "epoch": 7573} {"train_loss": -27.738723754882812, "global_step": 628604, "epoch": 7573} {"train_loss": -27.713117599487305, "global_step": 628605, "epoch": 7573} {"train_loss": -28.021625518798828, "global_step": 628606, "epoch": 7573} {"train_loss": -28.166715621948242, "global_step": 628607, "epoch": 7573} {"train_loss": -28.098133087158203, "global_step": 628608, "epoch": 7573} {"train_loss": -28.314111709594727, "global_step": 628609, "epoch": 7573} {"train_loss": -28.066808700561523, "global_step": 628610, "epoch": 7573} {"train_loss": -28.017148971557617, "global_step": 628611, "epoch": 7573} {"train_loss": -28.176298141479492, "global_step": 628612, "epoch": 7573} {"train_loss": -28.17365074157715, "global_step": 628613, "epoch": 7573} {"train_loss": -28.05341148376465, "global_step": 628614, "epoch": 7573} {"train_loss": -27.7309627532959, "global_step": 628615, "epoch": 7573} {"train_loss": -27.903064727783203, "global_step": 628616, "epoch": 7573} {"train_loss": -28.024372100830078, "global_step": 628617, "epoch": 7573} {"train_loss": -28.016555786132812, "global_step": 628618, "epoch": 7573} {"train_loss": -27.648176193237305, "global_step": 628619, "epoch": 7573} {"train_loss": -28.403690338134766, "global_step": 628620, "epoch": 7573} {"train_loss": -28.253782272338867, "global_step": 628621, "epoch": 7573} {"train_loss": -27.706008911132812, "global_step": 628622, "epoch": 7573} {"train_loss": -27.9830322265625, "global_step": 628623, "epoch": 7573} {"train_loss": -28.0371150970459, "global_step": 628624, "epoch": 7573} {"train_loss": -28.213315963745117, "global_step": 628625, "epoch": 7573} {"train_loss": -27.913923263549805, "global_step": 628626, "epoch": 7573} {"train_loss": -28.366500854492188, "global_step": 628627, "epoch": 7573} {"train_loss": -27.901342391967773, "global_step": 628628, "epoch": 7573} {"train_loss": -27.942218780517578, "global_step": 628629, "epoch": 7573} {"train_loss": -28.342077255249023, "global_step": 628630, "epoch": 7573} {"train_loss": -28.499618530273438, "global_step": 628631, "epoch": 7573} {"train_loss": -28.39642906188965, "global_step": 628632, "epoch": 7573} {"train_loss": -28.381567001342773, "global_step": 628633, "epoch": 7573} {"train_loss": -28.1278076171875, "global_step": 628634, "epoch": 7573} {"train_loss": -28.43634033203125, "global_step": 628635, "epoch": 7573} {"train_loss": -28.443639755249023, "global_step": 628636, "epoch": 7573} {"train_loss": -28.392688751220703, "global_step": 628637, "epoch": 7573} {"train_loss": -28.2905216217041, "global_step": 628638, "epoch": 7573} {"train_loss": -28.2006893157959, "global_step": 628639, "epoch": 7573} {"train_loss": -28.16217041015625, "global_step": 628640, "epoch": 7573} {"train_loss": -27.970449723393084, "global_step": 628641, "epoch": 7573, "val_loss": 6738696.0} {"train_loss": -28.268146514892578, "global_step": 628642, "epoch": 7574} {"train_loss": -27.798429489135742, "global_step": 628643, "epoch": 7574} {"train_loss": -28.07892417907715, "global_step": 628644, "epoch": 7574} {"train_loss": -27.6865234375, "global_step": 628645, "epoch": 7574} {"train_loss": -27.48475456237793, "global_step": 628646, "epoch": 7574} {"train_loss": -27.91998291015625, "global_step": 628647, "epoch": 7574} {"train_loss": -27.805295944213867, "global_step": 628648, "epoch": 7574} {"train_loss": -26.4931640625, "global_step": 628649, "epoch": 7574} {"train_loss": -26.055709838867188, "global_step": 628650, "epoch": 7574} {"train_loss": -25.990942001342773, "global_step": 628651, "epoch": 7574} {"train_loss": -27.187713623046875, "global_step": 628652, "epoch": 7574} {"train_loss": -27.472793579101562, "global_step": 628653, "epoch": 7574} {"train_loss": -26.9138126373291, "global_step": 628654, "epoch": 7574} {"train_loss": -27.2476749420166, "global_step": 628655, "epoch": 7574} {"train_loss": -27.405914306640625, "global_step": 628656, "epoch": 7574} {"train_loss": -27.92291831970215, "global_step": 628657, "epoch": 7574} {"train_loss": -27.540319442749023, "global_step": 628658, "epoch": 7574} {"train_loss": -27.777618408203125, "global_step": 628659, "epoch": 7574} {"train_loss": -27.562652587890625, "global_step": 628660, "epoch": 7574} {"train_loss": -28.3460693359375, "global_step": 628661, "epoch": 7574} {"train_loss": -27.89617347717285, "global_step": 628662, "epoch": 7574} {"train_loss": -27.780853271484375, "global_step": 628663, "epoch": 7574} {"train_loss": -27.658666610717773, "global_step": 628664, "epoch": 7574} {"train_loss": -27.693445205688477, "global_step": 628665, "epoch": 7574} {"train_loss": -27.678556442260742, "global_step": 628666, "epoch": 7574} {"train_loss": -28.039587020874023, "global_step": 628667, "epoch": 7574} {"train_loss": -27.739282608032227, "global_step": 628668, "epoch": 7574} {"train_loss": -27.879785537719727, "global_step": 628669, "epoch": 7574} {"train_loss": -27.85404396057129, "global_step": 628670, "epoch": 7574} {"train_loss": -28.203413009643555, "global_step": 628671, "epoch": 7574} {"train_loss": -27.641965866088867, "global_step": 628672, "epoch": 7574} {"train_loss": -27.92608642578125, "global_step": 628673, "epoch": 7574} {"train_loss": -27.767786026000977, "global_step": 628674, "epoch": 7574} {"train_loss": -27.98296546936035, "global_step": 628675, "epoch": 7574} {"train_loss": -28.075891494750977, "global_step": 628676, "epoch": 7574} {"train_loss": -28.28510856628418, "global_step": 628677, "epoch": 7574} {"train_loss": -28.077503204345703, "global_step": 628678, "epoch": 7574} {"train_loss": -28.048725128173828, "global_step": 628679, "epoch": 7574} {"train_loss": -28.1402587890625, "global_step": 628680, "epoch": 7574} {"train_loss": -28.178632736206055, "global_step": 628681, "epoch": 7574} {"train_loss": -28.398481369018555, "global_step": 628682, "epoch": 7574} {"train_loss": -28.11199378967285, "global_step": 628683, "epoch": 7574} {"train_loss": -28.19379997253418, "global_step": 628684, "epoch": 7574} {"train_loss": -28.332300186157227, "global_step": 628685, "epoch": 7574} {"train_loss": -28.423847198486328, "global_step": 628686, "epoch": 7574} {"train_loss": -28.295862197875977, "global_step": 628687, "epoch": 7574} {"train_loss": -28.24336051940918, "global_step": 628688, "epoch": 7574} {"train_loss": -28.614242553710938, "global_step": 628689, "epoch": 7574} {"train_loss": -28.298755645751953, "global_step": 628690, "epoch": 7574} {"train_loss": -28.402170181274414, "global_step": 628691, "epoch": 7574} {"train_loss": -28.285795211791992, "global_step": 628692, "epoch": 7574} {"train_loss": -28.4359130859375, "global_step": 628693, "epoch": 7574} {"train_loss": -28.038137435913086, "global_step": 628694, "epoch": 7574} {"train_loss": -28.394956588745117, "global_step": 628695, "epoch": 7574} {"train_loss": -28.235076904296875, "global_step": 628696, "epoch": 7574} {"train_loss": -28.57276725769043, "global_step": 628697, "epoch": 7574} {"train_loss": -28.5197811126709, "global_step": 628698, "epoch": 7574} {"train_loss": -28.388492584228516, "global_step": 628699, "epoch": 7574} {"train_loss": -28.391813278198242, "global_step": 628700, "epoch": 7574} {"train_loss": -28.673404693603516, "global_step": 628701, "epoch": 7574} {"train_loss": -28.008819580078125, "global_step": 628702, "epoch": 7574} {"train_loss": -28.292011260986328, "global_step": 628703, "epoch": 7574} {"train_loss": -27.992666244506836, "global_step": 628704, "epoch": 7574} {"train_loss": -28.17333984375, "global_step": 628705, "epoch": 7574} {"train_loss": -28.295333862304688, "global_step": 628706, "epoch": 7574} {"train_loss": -28.50855827331543, "global_step": 628707, "epoch": 7574} {"train_loss": -27.9759578704834, "global_step": 628708, "epoch": 7574} {"train_loss": -27.99393081665039, "global_step": 628709, "epoch": 7574} {"train_loss": -28.146921157836914, "global_step": 628710, "epoch": 7574} {"train_loss": -28.19580078125, "global_step": 628711, "epoch": 7574} {"train_loss": -28.44775390625, "global_step": 628712, "epoch": 7574} {"train_loss": -28.42145347595215, "global_step": 628713, "epoch": 7574} {"train_loss": -28.1329402923584, "global_step": 628714, "epoch": 7574} {"train_loss": -28.42951011657715, "global_step": 628715, "epoch": 7574} {"train_loss": -28.095876693725586, "global_step": 628716, "epoch": 7574} {"train_loss": -28.33977699279785, "global_step": 628717, "epoch": 7574} {"train_loss": -28.080097198486328, "global_step": 628718, "epoch": 7574} {"train_loss": -28.167484283447266, "global_step": 628719, "epoch": 7574} {"train_loss": -28.177011489868164, "global_step": 628720, "epoch": 7574} {"train_loss": -28.334930419921875, "global_step": 628721, "epoch": 7574} {"train_loss": -28.132654190063477, "global_step": 628722, "epoch": 7574} {"train_loss": -27.91151237487793, "global_step": 628723, "epoch": 7574} {"train_loss": -27.984650393566454, "global_step": 628724, "epoch": 7574, "val_loss": 6805170.0} {"train_loss": -27.86579704284668, "global_step": 628725, "epoch": 7575} {"train_loss": -27.702184677124023, "global_step": 628726, "epoch": 7575} {"train_loss": -28.275714874267578, "global_step": 628727, "epoch": 7575} {"train_loss": -28.049108505249023, "global_step": 628728, "epoch": 7575} {"train_loss": -27.73797035217285, "global_step": 628729, "epoch": 7575} {"train_loss": -27.892820358276367, "global_step": 628730, "epoch": 7575} {"train_loss": -27.703857421875, "global_step": 628731, "epoch": 7575} {"train_loss": -27.7008113861084, "global_step": 628732, "epoch": 7575} {"train_loss": -27.55866050720215, "global_step": 628733, "epoch": 7575} {"train_loss": -27.90887451171875, "global_step": 628734, "epoch": 7575} {"train_loss": -27.701862335205078, "global_step": 628735, "epoch": 7575} {"train_loss": -28.073780059814453, "global_step": 628736, "epoch": 7575} {"train_loss": -28.011962890625, "global_step": 628737, "epoch": 7575} {"train_loss": -27.974653244018555, "global_step": 628738, "epoch": 7575} {"train_loss": -27.47626304626465, "global_step": 628739, "epoch": 7575} {"train_loss": -28.11113929748535, "global_step": 628740, "epoch": 7575} {"train_loss": -28.01407814025879, "global_step": 628741, "epoch": 7575} {"train_loss": -27.860397338867188, "global_step": 628742, "epoch": 7575} {"train_loss": -28.164371490478516, "global_step": 628743, "epoch": 7575} {"train_loss": -27.797718048095703, "global_step": 628744, "epoch": 7575} {"train_loss": -28.232519149780273, "global_step": 628745, "epoch": 7575} {"train_loss": -27.970746994018555, "global_step": 628746, "epoch": 7575} {"train_loss": -28.307371139526367, "global_step": 628747, "epoch": 7575} {"train_loss": -28.269290924072266, "global_step": 628748, "epoch": 7575} {"train_loss": -28.24698829650879, "global_step": 628749, "epoch": 7575} {"train_loss": -28.413501739501953, "global_step": 628750, "epoch": 7575} {"train_loss": -28.053253173828125, "global_step": 628751, "epoch": 7575} {"train_loss": -28.63657569885254, "global_step": 628752, "epoch": 7575} {"train_loss": -28.29071044921875, "global_step": 628753, "epoch": 7575} {"train_loss": -28.166135787963867, "global_step": 628754, "epoch": 7575} {"train_loss": -28.39344596862793, "global_step": 628755, "epoch": 7575} {"train_loss": -28.6004581451416, "global_step": 628756, "epoch": 7575} {"train_loss": -28.570423126220703, "global_step": 628757, "epoch": 7575} {"train_loss": -28.56829261779785, "global_step": 628758, "epoch": 7575} {"train_loss": -28.19502067565918, "global_step": 628759, "epoch": 7575} {"train_loss": -28.402524948120117, "global_step": 628760, "epoch": 7575} {"train_loss": -28.141958236694336, "global_step": 628761, "epoch": 7575} {"train_loss": -28.416229248046875, "global_step": 628762, "epoch": 7575} {"train_loss": -28.109052658081055, "global_step": 628763, "epoch": 7575} {"train_loss": -28.175806045532227, "global_step": 628764, "epoch": 7575} {"train_loss": -28.76775550842285, "global_step": 628765, "epoch": 7575} {"train_loss": -28.084949493408203, "global_step": 628766, "epoch": 7575} {"train_loss": -28.575979232788086, "global_step": 628767, "epoch": 7575} {"train_loss": -28.01679801940918, "global_step": 628768, "epoch": 7575} {"train_loss": -28.04501724243164, "global_step": 628769, "epoch": 7575} {"train_loss": -27.99207878112793, "global_step": 628770, "epoch": 7575} {"train_loss": -28.167621612548828, "global_step": 628771, "epoch": 7575} {"train_loss": -28.41282081604004, "global_step": 628772, "epoch": 7575} {"train_loss": -28.53596305847168, "global_step": 628773, "epoch": 7575} {"train_loss": -27.9692325592041, "global_step": 628774, "epoch": 7575} {"train_loss": -28.5474910736084, "global_step": 628775, "epoch": 7575} {"train_loss": -28.16520118713379, "global_step": 628776, "epoch": 7575} {"train_loss": -28.198505401611328, "global_step": 628777, "epoch": 7575} {"train_loss": -28.284595489501953, "global_step": 628778, "epoch": 7575} {"train_loss": -28.1953125, "global_step": 628779, "epoch": 7575} {"train_loss": -28.102020263671875, "global_step": 628780, "epoch": 7575} {"train_loss": -28.272659301757812, "global_step": 628781, "epoch": 7575} {"train_loss": -28.334217071533203, "global_step": 628782, "epoch": 7575} {"train_loss": -28.4560604095459, "global_step": 628783, "epoch": 7575} {"train_loss": -28.449798583984375, "global_step": 628784, "epoch": 7575} {"train_loss": -28.233657836914062, "global_step": 628785, "epoch": 7575} {"train_loss": -28.324634552001953, "global_step": 628786, "epoch": 7575} {"train_loss": -28.042470932006836, "global_step": 628787, "epoch": 7575} {"train_loss": -27.861454010009766, "global_step": 628788, "epoch": 7575} {"train_loss": -28.053308486938477, "global_step": 628789, "epoch": 7575} {"train_loss": -27.553735733032227, "global_step": 628790, "epoch": 7575} {"train_loss": -26.72035026550293, "global_step": 628791, "epoch": 7575} {"train_loss": -26.579345703125, "global_step": 628792, "epoch": 7575} {"train_loss": -27.393335342407227, "global_step": 628793, "epoch": 7575} {"train_loss": -28.367511749267578, "global_step": 628794, "epoch": 7575} {"train_loss": -26.70419692993164, "global_step": 628795, "epoch": 7575} {"train_loss": -27.799057006835938, "global_step": 628796, "epoch": 7575} {"train_loss": -27.607624053955078, "global_step": 628797, "epoch": 7575} {"train_loss": -27.63119888305664, "global_step": 628798, "epoch": 7575} {"train_loss": -27.724822998046875, "global_step": 628799, "epoch": 7575} {"train_loss": -27.62158203125, "global_step": 628800, "epoch": 7575} {"train_loss": -27.479145050048828, "global_step": 628801, "epoch": 7575} {"train_loss": -27.6944522857666, "global_step": 628802, "epoch": 7575} {"train_loss": -28.228910446166992, "global_step": 628803, "epoch": 7575} {"train_loss": -28.05085563659668, "global_step": 628804, "epoch": 7575} {"train_loss": -27.878559112548828, "global_step": 628805, "epoch": 7575} {"train_loss": -28.050312042236328, "global_step": 628806, "epoch": 7575} {"train_loss": -28.028709365660887, "global_step": 628807, "epoch": 7575, "val_loss": 6697024.5} {"train_loss": -27.540908813476562, "global_step": 628808, "epoch": 7576} {"train_loss": -27.518482208251953, "global_step": 628809, "epoch": 7576} {"train_loss": -27.520355224609375, "global_step": 628810, "epoch": 7576} {"train_loss": -27.85736656188965, "global_step": 628811, "epoch": 7576} {"train_loss": -27.431671142578125, "global_step": 628812, "epoch": 7576} {"train_loss": -27.920745849609375, "global_step": 628813, "epoch": 7576} {"train_loss": -27.405521392822266, "global_step": 628814, "epoch": 7576} {"train_loss": -27.72336769104004, "global_step": 628815, "epoch": 7576} {"train_loss": -27.529067993164062, "global_step": 628816, "epoch": 7576} {"train_loss": -27.54669761657715, "global_step": 628817, "epoch": 7576} {"train_loss": -28.078754425048828, "global_step": 628818, "epoch": 7576} {"train_loss": -27.680908203125, "global_step": 628819, "epoch": 7576} {"train_loss": -27.693700790405273, "global_step": 628820, "epoch": 7576} {"train_loss": -27.80780601501465, "global_step": 628821, "epoch": 7576} {"train_loss": -28.080596923828125, "global_step": 628822, "epoch": 7576} {"train_loss": -28.0087833404541, "global_step": 628823, "epoch": 7576} {"train_loss": -28.241302490234375, "global_step": 628824, "epoch": 7576} {"train_loss": -28.19425392150879, "global_step": 628825, "epoch": 7576} {"train_loss": -27.60951042175293, "global_step": 628826, "epoch": 7576} {"train_loss": -28.11432456970215, "global_step": 628827, "epoch": 7576} {"train_loss": -27.714527130126953, "global_step": 628828, "epoch": 7576} {"train_loss": -28.153715133666992, "global_step": 628829, "epoch": 7576} {"train_loss": -28.102277755737305, "global_step": 628830, "epoch": 7576} {"train_loss": -28.25494956970215, "global_step": 628831, "epoch": 7576} {"train_loss": -28.48859214782715, "global_step": 628832, "epoch": 7576} {"train_loss": -28.249860763549805, "global_step": 628833, "epoch": 7576} {"train_loss": -28.30478286743164, "global_step": 628834, "epoch": 7576} {"train_loss": -28.25180435180664, "global_step": 628835, "epoch": 7576} {"train_loss": -28.161035537719727, "global_step": 628836, "epoch": 7576} {"train_loss": -28.22974967956543, "global_step": 628837, "epoch": 7576} {"train_loss": -28.205163955688477, "global_step": 628838, "epoch": 7576} {"train_loss": -28.034772872924805, "global_step": 628839, "epoch": 7576} {"train_loss": -28.39350700378418, "global_step": 628840, "epoch": 7576} {"train_loss": -28.315738677978516, "global_step": 628841, "epoch": 7576} {"train_loss": -28.191211700439453, "global_step": 628842, "epoch": 7576} {"train_loss": -28.3695011138916, "global_step": 628843, "epoch": 7576} {"train_loss": -28.397369384765625, "global_step": 628844, "epoch": 7576} {"train_loss": -28.398696899414062, "global_step": 628845, "epoch": 7576} {"train_loss": -28.50250816345215, "global_step": 628846, "epoch": 7576} {"train_loss": -28.239736557006836, "global_step": 628847, "epoch": 7576} {"train_loss": -28.396381378173828, "global_step": 628848, "epoch": 7576} {"train_loss": -27.918447494506836, "global_step": 628849, "epoch": 7576} {"train_loss": -28.1318359375, "global_step": 628850, "epoch": 7576} {"train_loss": -28.004358291625977, "global_step": 628851, "epoch": 7576} {"train_loss": -27.888593673706055, "global_step": 628852, "epoch": 7576} {"train_loss": -28.095539093017578, "global_step": 628853, "epoch": 7576} {"train_loss": -28.206588745117188, "global_step": 628854, "epoch": 7576} {"train_loss": -28.314233779907227, "global_step": 628855, "epoch": 7576} {"train_loss": -28.619434356689453, "global_step": 628856, "epoch": 7576} {"train_loss": -28.779443740844727, "global_step": 628857, "epoch": 7576} {"train_loss": -28.042774200439453, "global_step": 628858, "epoch": 7576} {"train_loss": -28.210132598876953, "global_step": 628859, "epoch": 7576} {"train_loss": -28.416156768798828, "global_step": 628860, "epoch": 7576} {"train_loss": -28.146902084350586, "global_step": 628861, "epoch": 7576} {"train_loss": -28.194955825805664, "global_step": 628862, "epoch": 7576} {"train_loss": -28.2910213470459, "global_step": 628863, "epoch": 7576} {"train_loss": -28.110647201538086, "global_step": 628864, "epoch": 7576} {"train_loss": -27.761133193969727, "global_step": 628865, "epoch": 7576} {"train_loss": -28.276708602905273, "global_step": 628866, "epoch": 7576} {"train_loss": -28.031347274780273, "global_step": 628867, "epoch": 7576} {"train_loss": -28.206811904907227, "global_step": 628868, "epoch": 7576} {"train_loss": -27.987455368041992, "global_step": 628869, "epoch": 7576} {"train_loss": -27.912979125976562, "global_step": 628870, "epoch": 7576} {"train_loss": -28.328479766845703, "global_step": 628871, "epoch": 7576} {"train_loss": -27.796552658081055, "global_step": 628872, "epoch": 7576} {"train_loss": -28.475738525390625, "global_step": 628873, "epoch": 7576} {"train_loss": -28.231796264648438, "global_step": 628874, "epoch": 7576} {"train_loss": -28.2023868560791, "global_step": 628875, "epoch": 7576} {"train_loss": -28.293649673461914, "global_step": 628876, "epoch": 7576} {"train_loss": -28.193784713745117, "global_step": 628877, "epoch": 7576} {"train_loss": -28.038076400756836, "global_step": 628878, "epoch": 7576} {"train_loss": -28.11176109313965, "global_step": 628879, "epoch": 7576} {"train_loss": -28.242145538330078, "global_step": 628880, "epoch": 7576} {"train_loss": -28.63319206237793, "global_step": 628881, "epoch": 7576} {"train_loss": -28.360763549804688, "global_step": 628882, "epoch": 7576} {"train_loss": -28.133594512939453, "global_step": 628883, "epoch": 7576} {"train_loss": -28.44595718383789, "global_step": 628884, "epoch": 7576} {"train_loss": -27.92718505859375, "global_step": 628885, "epoch": 7576} {"train_loss": -28.209156036376953, "global_step": 628886, "epoch": 7576} {"train_loss": -28.131277084350586, "global_step": 628887, "epoch": 7576} {"train_loss": -28.337646484375, "global_step": 628888, "epoch": 7576} {"train_loss": -28.44281005859375, "global_step": 628889, "epoch": 7576} {"train_loss": -28.12125341576266, "global_step": 628890, "epoch": 7576, "val_loss": 6701673.0} {"train_loss": -27.806482315063477, "global_step": 628891, "epoch": 7577} {"train_loss": -27.552595138549805, "global_step": 628892, "epoch": 7577} {"train_loss": -27.842575073242188, "global_step": 628893, "epoch": 7577} {"train_loss": -27.330480575561523, "global_step": 628894, "epoch": 7577} {"train_loss": -27.561634063720703, "global_step": 628895, "epoch": 7577} {"train_loss": -27.571863174438477, "global_step": 628896, "epoch": 7577} {"train_loss": -27.398086547851562, "global_step": 628897, "epoch": 7577} {"train_loss": -27.99260902404785, "global_step": 628898, "epoch": 7577} {"train_loss": -27.6685791015625, "global_step": 628899, "epoch": 7577} {"train_loss": -27.395811080932617, "global_step": 628900, "epoch": 7577} {"train_loss": -28.007383346557617, "global_step": 628901, "epoch": 7577} {"train_loss": -28.185260772705078, "global_step": 628902, "epoch": 7577} {"train_loss": -27.444074630737305, "global_step": 628903, "epoch": 7577} {"train_loss": -27.975326538085938, "global_step": 628904, "epoch": 7577} {"train_loss": -28.233795166015625, "global_step": 628905, "epoch": 7577} {"train_loss": -28.358381271362305, "global_step": 628906, "epoch": 7577} {"train_loss": -28.366926193237305, "global_step": 628907, "epoch": 7577} {"train_loss": -27.9403133392334, "global_step": 628908, "epoch": 7577} {"train_loss": -28.101211547851562, "global_step": 628909, "epoch": 7577} {"train_loss": -28.26588249206543, "global_step": 628910, "epoch": 7577} {"train_loss": -28.236907958984375, "global_step": 628911, "epoch": 7577} {"train_loss": -28.503339767456055, "global_step": 628912, "epoch": 7577} {"train_loss": -28.032480239868164, "global_step": 628913, "epoch": 7577} {"train_loss": -27.97098159790039, "global_step": 628914, "epoch": 7577} {"train_loss": -27.652881622314453, "global_step": 628915, "epoch": 7577} {"train_loss": -27.760498046875, "global_step": 628916, "epoch": 7577} {"train_loss": -27.616607666015625, "global_step": 628917, "epoch": 7577} {"train_loss": -28.4425048828125, "global_step": 628918, "epoch": 7577} {"train_loss": -28.042724609375, "global_step": 628919, "epoch": 7577} {"train_loss": -28.230010986328125, "global_step": 628920, "epoch": 7577} {"train_loss": -28.603015899658203, "global_step": 628921, "epoch": 7577} {"train_loss": -28.00516128540039, "global_step": 628922, "epoch": 7577} {"train_loss": -28.353525161743164, "global_step": 628923, "epoch": 7577} {"train_loss": -28.5079345703125, "global_step": 628924, "epoch": 7577} {"train_loss": -28.346723556518555, "global_step": 628925, "epoch": 7577} {"train_loss": -28.55950927734375, "global_step": 628926, "epoch": 7577} {"train_loss": -28.384418487548828, "global_step": 628927, "epoch": 7577} {"train_loss": -28.59221839904785, "global_step": 628928, "epoch": 7577} {"train_loss": -28.500402450561523, "global_step": 628929, "epoch": 7577} {"train_loss": -28.310199737548828, "global_step": 628930, "epoch": 7577} {"train_loss": -28.451099395751953, "global_step": 628931, "epoch": 7577} {"train_loss": -28.932653427124023, "global_step": 628932, "epoch": 7577} {"train_loss": -27.949918746948242, "global_step": 628933, "epoch": 7577} {"train_loss": -28.463104248046875, "global_step": 628934, "epoch": 7577} {"train_loss": -28.154062271118164, "global_step": 628935, "epoch": 7577} {"train_loss": -28.340925216674805, "global_step": 628936, "epoch": 7577} {"train_loss": -28.209640502929688, "global_step": 628937, "epoch": 7577} {"train_loss": -28.44428062438965, "global_step": 628938, "epoch": 7577} {"train_loss": -28.195789337158203, "global_step": 628939, "epoch": 7577} {"train_loss": -28.0745906829834, "global_step": 628940, "epoch": 7577} {"train_loss": -28.26325035095215, "global_step": 628941, "epoch": 7577} {"train_loss": -28.179655075073242, "global_step": 628942, "epoch": 7577} {"train_loss": -27.93243408203125, "global_step": 628943, "epoch": 7577} {"train_loss": -27.874094009399414, "global_step": 628944, "epoch": 7577} {"train_loss": -27.759668350219727, "global_step": 628945, "epoch": 7577} {"train_loss": -28.060434341430664, "global_step": 628946, "epoch": 7577} {"train_loss": -27.85188102722168, "global_step": 628947, "epoch": 7577} {"train_loss": -27.94087791442871, "global_step": 628948, "epoch": 7577} {"train_loss": -27.839685440063477, "global_step": 628949, "epoch": 7577} {"train_loss": -28.2586669921875, "global_step": 628950, "epoch": 7577} {"train_loss": -28.1861629486084, "global_step": 628951, "epoch": 7577} {"train_loss": -28.070554733276367, "global_step": 628952, "epoch": 7577} {"train_loss": -28.436237335205078, "global_step": 628953, "epoch": 7577} {"train_loss": -28.253305435180664, "global_step": 628954, "epoch": 7577} {"train_loss": -28.21879005432129, "global_step": 628955, "epoch": 7577} {"train_loss": -27.649999618530273, "global_step": 628956, "epoch": 7577} {"train_loss": -28.08914566040039, "global_step": 628957, "epoch": 7577} {"train_loss": -28.008466720581055, "global_step": 628958, "epoch": 7577} {"train_loss": -27.88861656188965, "global_step": 628959, "epoch": 7577} {"train_loss": -27.923593521118164, "global_step": 628960, "epoch": 7577} {"train_loss": -27.86313819885254, "global_step": 628961, "epoch": 7577} {"train_loss": -28.364179611206055, "global_step": 628962, "epoch": 7577} {"train_loss": -28.1688232421875, "global_step": 628963, "epoch": 7577} {"train_loss": -28.020587921142578, "global_step": 628964, "epoch": 7577} {"train_loss": -28.182153701782227, "global_step": 628965, "epoch": 7577} {"train_loss": -27.677515029907227, "global_step": 628966, "epoch": 7577} {"train_loss": -27.84779930114746, "global_step": 628967, "epoch": 7577} {"train_loss": -28.2264461517334, "global_step": 628968, "epoch": 7577} {"train_loss": -27.949695587158203, "global_step": 628969, "epoch": 7577} {"train_loss": -28.254413604736328, "global_step": 628970, "epoch": 7577} {"train_loss": -28.25457763671875, "global_step": 628971, "epoch": 7577} {"train_loss": -28.556705474853516, "global_step": 628972, "epoch": 7577} {"train_loss": -28.088362774216986, "global_step": 628973, "epoch": 7577, "val_loss": 6694401.0} {"train_loss": -27.913846969604492, "global_step": 628974, "epoch": 7578} {"train_loss": -27.703405380249023, "global_step": 628975, "epoch": 7578} {"train_loss": -27.891393661499023, "global_step": 628976, "epoch": 7578} {"train_loss": -27.773517608642578, "global_step": 628977, "epoch": 7578} {"train_loss": -27.798437118530273, "global_step": 628978, "epoch": 7578} {"train_loss": -27.617969512939453, "global_step": 628979, "epoch": 7578} {"train_loss": -28.41461753845215, "global_step": 628980, "epoch": 7578} {"train_loss": -27.741708755493164, "global_step": 628981, "epoch": 7578} {"train_loss": -27.935565948486328, "global_step": 628982, "epoch": 7578} {"train_loss": -27.775970458984375, "global_step": 628983, "epoch": 7578} {"train_loss": -27.7587947845459, "global_step": 628984, "epoch": 7578} {"train_loss": -27.892547607421875, "global_step": 628985, "epoch": 7578} {"train_loss": -27.644189834594727, "global_step": 628986, "epoch": 7578} {"train_loss": -27.79298973083496, "global_step": 628987, "epoch": 7578} {"train_loss": -27.8253173828125, "global_step": 628988, "epoch": 7578} {"train_loss": -27.97205924987793, "global_step": 628989, "epoch": 7578} {"train_loss": -27.95404624938965, "global_step": 628990, "epoch": 7578} {"train_loss": -28.01384925842285, "global_step": 628991, "epoch": 7578} {"train_loss": -27.73237419128418, "global_step": 628992, "epoch": 7578} {"train_loss": -28.383005142211914, "global_step": 628993, "epoch": 7578} {"train_loss": -27.81727409362793, "global_step": 628994, "epoch": 7578} {"train_loss": -28.130903244018555, "global_step": 628995, "epoch": 7578} {"train_loss": -28.17424964904785, "global_step": 628996, "epoch": 7578} {"train_loss": -28.1934871673584, "global_step": 628997, "epoch": 7578} {"train_loss": -28.1131649017334, "global_step": 628998, "epoch": 7578} {"train_loss": -27.993314743041992, "global_step": 628999, "epoch": 7578} {"train_loss": -28.062061309814453, "global_step": 629000, "epoch": 7578} {"train_loss": -28.346939086914062, "global_step": 629001, "epoch": 7578} {"train_loss": -28.505277633666992, "global_step": 629002, "epoch": 7578} {"train_loss": -28.290058135986328, "global_step": 629003, "epoch": 7578} {"train_loss": -28.108701705932617, "global_step": 629004, "epoch": 7578} {"train_loss": -28.023584365844727, "global_step": 629005, "epoch": 7578} {"train_loss": -28.277143478393555, "global_step": 629006, "epoch": 7578} {"train_loss": -28.186487197875977, "global_step": 629007, "epoch": 7578} {"train_loss": -27.969079971313477, "global_step": 629008, "epoch": 7578} {"train_loss": -28.51905632019043, "global_step": 629009, "epoch": 7578} {"train_loss": -28.399709701538086, "global_step": 629010, "epoch": 7578} {"train_loss": -28.049718856811523, "global_step": 629011, "epoch": 7578} {"train_loss": -28.2908992767334, "global_step": 629012, "epoch": 7578} {"train_loss": -28.422500610351562, "global_step": 629013, "epoch": 7578} {"train_loss": -28.43267822265625, "global_step": 629014, "epoch": 7578} {"train_loss": -28.172409057617188, "global_step": 629015, "epoch": 7578} {"train_loss": -28.274856567382812, "global_step": 629016, "epoch": 7578} {"train_loss": -28.197595596313477, "global_step": 629017, "epoch": 7578} {"train_loss": -28.279254913330078, "global_step": 629018, "epoch": 7578} {"train_loss": -28.19943618774414, "global_step": 629019, "epoch": 7578} {"train_loss": -28.008779525756836, "global_step": 629020, "epoch": 7578} {"train_loss": -28.31324577331543, "global_step": 629021, "epoch": 7578} {"train_loss": -28.45894432067871, "global_step": 629022, "epoch": 7578} {"train_loss": -28.73902702331543, "global_step": 629023, "epoch": 7578} {"train_loss": -28.7345027923584, "global_step": 629024, "epoch": 7578} {"train_loss": -28.287046432495117, "global_step": 629025, "epoch": 7578} {"train_loss": -28.583280563354492, "global_step": 629026, "epoch": 7578} {"train_loss": -28.206161499023438, "global_step": 629027, "epoch": 7578} {"train_loss": -28.45680046081543, "global_step": 629028, "epoch": 7578} {"train_loss": -28.6804141998291, "global_step": 629029, "epoch": 7578} {"train_loss": -28.06269645690918, "global_step": 629030, "epoch": 7578} {"train_loss": -28.500471115112305, "global_step": 629031, "epoch": 7578} {"train_loss": -28.172565460205078, "global_step": 629032, "epoch": 7578} {"train_loss": -27.906381607055664, "global_step": 629033, "epoch": 7578} {"train_loss": -27.190109252929688, "global_step": 629034, "epoch": 7578} {"train_loss": -27.47760581970215, "global_step": 629035, "epoch": 7578} {"train_loss": -27.711942672729492, "global_step": 629036, "epoch": 7578} {"train_loss": -27.790298461914062, "global_step": 629037, "epoch": 7578} {"train_loss": -28.2261905670166, "global_step": 629038, "epoch": 7578} {"train_loss": -28.066837310791016, "global_step": 629039, "epoch": 7578} {"train_loss": -27.579397201538086, "global_step": 629040, "epoch": 7578} {"train_loss": -28.219532012939453, "global_step": 629041, "epoch": 7578} {"train_loss": -27.97551918029785, "global_step": 629042, "epoch": 7578} {"train_loss": -27.789936065673828, "global_step": 629043, "epoch": 7578} {"train_loss": -27.683378219604492, "global_step": 629044, "epoch": 7578} {"train_loss": -28.011356353759766, "global_step": 629045, "epoch": 7578} {"train_loss": -28.09669303894043, "global_step": 629046, "epoch": 7578} {"train_loss": -27.868549346923828, "global_step": 629047, "epoch": 7578} {"train_loss": -28.334980010986328, "global_step": 629048, "epoch": 7578} {"train_loss": -27.89273452758789, "global_step": 629049, "epoch": 7578} {"train_loss": -28.191762924194336, "global_step": 629050, "epoch": 7578} {"train_loss": -27.93525505065918, "global_step": 629051, "epoch": 7578} {"train_loss": -28.338428497314453, "global_step": 629052, "epoch": 7578} {"train_loss": -27.454626083374023, "global_step": 629053, "epoch": 7578} {"train_loss": -28.125446319580078, "global_step": 629054, "epoch": 7578} {"train_loss": -27.73581886291504, "global_step": 629055, "epoch": 7578} {"train_loss": -28.07102513600545, "global_step": 629056, "epoch": 7578, "val_loss": 6716765.0} {"train_loss": -27.62668228149414, "global_step": 629057, "epoch": 7579} {"train_loss": -27.039295196533203, "global_step": 629058, "epoch": 7579} {"train_loss": -27.879959106445312, "global_step": 629059, "epoch": 7579} {"train_loss": -27.443933486938477, "global_step": 629060, "epoch": 7579} {"train_loss": -27.351842880249023, "global_step": 629061, "epoch": 7579} {"train_loss": -27.348386764526367, "global_step": 629062, "epoch": 7579} {"train_loss": -27.57041358947754, "global_step": 629063, "epoch": 7579} {"train_loss": -27.765531539916992, "global_step": 629064, "epoch": 7579} {"train_loss": -27.249547958374023, "global_step": 629065, "epoch": 7579} {"train_loss": -27.4436092376709, "global_step": 629066, "epoch": 7579} {"train_loss": -27.70916175842285, "global_step": 629067, "epoch": 7579} {"train_loss": -27.531436920166016, "global_step": 629068, "epoch": 7579} {"train_loss": -27.658557891845703, "global_step": 629069, "epoch": 7579} {"train_loss": -27.744775772094727, "global_step": 629070, "epoch": 7579} {"train_loss": -27.932392120361328, "global_step": 629071, "epoch": 7579} {"train_loss": -27.7059268951416, "global_step": 629072, "epoch": 7579} {"train_loss": -27.8885555267334, "global_step": 629073, "epoch": 7579} {"train_loss": -27.777856826782227, "global_step": 629074, "epoch": 7579} {"train_loss": -28.069671630859375, "global_step": 629075, "epoch": 7579} {"train_loss": -28.037405014038086, "global_step": 629076, "epoch": 7579} {"train_loss": -28.03726577758789, "global_step": 629077, "epoch": 7579} {"train_loss": -27.631860733032227, "global_step": 629078, "epoch": 7579} {"train_loss": -27.920934677124023, "global_step": 629079, "epoch": 7579} {"train_loss": -27.86537742614746, "global_step": 629080, "epoch": 7579} {"train_loss": -28.01991081237793, "global_step": 629081, "epoch": 7579} {"train_loss": -28.0897274017334, "global_step": 629082, "epoch": 7579} {"train_loss": -27.688251495361328, "global_step": 629083, "epoch": 7579} {"train_loss": -28.09063148498535, "global_step": 629084, "epoch": 7579} {"train_loss": -28.203428268432617, "global_step": 629085, "epoch": 7579} {"train_loss": -28.2388858795166, "global_step": 629086, "epoch": 7579} {"train_loss": -28.189138412475586, "global_step": 629087, "epoch": 7579} {"train_loss": -27.954389572143555, "global_step": 629088, "epoch": 7579} {"train_loss": -28.105194091796875, "global_step": 629089, "epoch": 7579} {"train_loss": -28.2940616607666, "global_step": 629090, "epoch": 7579} {"train_loss": -28.270126342773438, "global_step": 629091, "epoch": 7579} {"train_loss": -28.00404167175293, "global_step": 629092, "epoch": 7579} {"train_loss": -28.00129508972168, "global_step": 629093, "epoch": 7579} {"train_loss": -28.069974899291992, "global_step": 629094, "epoch": 7579} {"train_loss": -28.417932510375977, "global_step": 629095, "epoch": 7579} {"train_loss": -28.45118522644043, "global_step": 629096, "epoch": 7579} {"train_loss": -28.15711784362793, "global_step": 629097, "epoch": 7579} {"train_loss": -28.075698852539062, "global_step": 629098, "epoch": 7579} {"train_loss": -28.019800186157227, "global_step": 629099, "epoch": 7579} {"train_loss": -27.807458877563477, "global_step": 629100, "epoch": 7579} {"train_loss": -27.84760093688965, "global_step": 629101, "epoch": 7579} {"train_loss": -28.14430809020996, "global_step": 629102, "epoch": 7579} {"train_loss": -28.102529525756836, "global_step": 629103, "epoch": 7579} {"train_loss": -28.143598556518555, "global_step": 629104, "epoch": 7579} {"train_loss": -28.417661666870117, "global_step": 629105, "epoch": 7579} {"train_loss": -28.208251953125, "global_step": 629106, "epoch": 7579} {"train_loss": -28.330921173095703, "global_step": 629107, "epoch": 7579} {"train_loss": -28.22499656677246, "global_step": 629108, "epoch": 7579} {"train_loss": -28.527435302734375, "global_step": 629109, "epoch": 7579} {"train_loss": -28.356536865234375, "global_step": 629110, "epoch": 7579} {"train_loss": -28.37981605529785, "global_step": 629111, "epoch": 7579} {"train_loss": -28.2736759185791, "global_step": 629112, "epoch": 7579} {"train_loss": -28.281143188476562, "global_step": 629113, "epoch": 7579} {"train_loss": -27.9906005859375, "global_step": 629114, "epoch": 7579} {"train_loss": -28.10123062133789, "global_step": 629115, "epoch": 7579} {"train_loss": -28.310834884643555, "global_step": 629116, "epoch": 7579} {"train_loss": -28.2354736328125, "global_step": 629117, "epoch": 7579} {"train_loss": -28.456424713134766, "global_step": 629118, "epoch": 7579} {"train_loss": -28.412811279296875, "global_step": 629119, "epoch": 7579} {"train_loss": -28.12212562561035, "global_step": 629120, "epoch": 7579} {"train_loss": -28.32468032836914, "global_step": 629121, "epoch": 7579} {"train_loss": -28.48530387878418, "global_step": 629122, "epoch": 7579} {"train_loss": -28.077844619750977, "global_step": 629123, "epoch": 7579} {"train_loss": -28.673023223876953, "global_step": 629124, "epoch": 7579} {"train_loss": -28.255517959594727, "global_step": 629125, "epoch": 7579} {"train_loss": -28.602148056030273, "global_step": 629126, "epoch": 7579} {"train_loss": -28.365238189697266, "global_step": 629127, "epoch": 7579} {"train_loss": -28.729318618774414, "global_step": 629128, "epoch": 7579} {"train_loss": -28.164148330688477, "global_step": 629129, "epoch": 7579} {"train_loss": -28.421964645385742, "global_step": 629130, "epoch": 7579} {"train_loss": -28.77349853515625, "global_step": 629131, "epoch": 7579} {"train_loss": -28.10898780822754, "global_step": 629132, "epoch": 7579} {"train_loss": -28.291522979736328, "global_step": 629133, "epoch": 7579} {"train_loss": -28.2330265045166, "global_step": 629134, "epoch": 7579} {"train_loss": -28.470245361328125, "global_step": 629135, "epoch": 7579} {"train_loss": -28.155704498291016, "global_step": 629136, "epoch": 7579} {"train_loss": -28.06104850769043, "global_step": 629137, "epoch": 7579} {"train_loss": -28.16872215270996, "global_step": 629138, "epoch": 7579} {"train_loss": -28.058944380426983, "global_step": 629139, "epoch": 7579, "val_loss": 6815069.0} {"train_loss": -28.101049423217773, "global_step": 629140, "epoch": 7580} {"train_loss": -27.64942741394043, "global_step": 629141, "epoch": 7580} {"train_loss": -27.888296127319336, "global_step": 629142, "epoch": 7580} {"train_loss": -28.319929122924805, "global_step": 629143, "epoch": 7580} {"train_loss": -27.760541915893555, "global_step": 629144, "epoch": 7580} {"train_loss": -27.542028427124023, "global_step": 629145, "epoch": 7580} {"train_loss": -28.25543212890625, "global_step": 629146, "epoch": 7580} {"train_loss": -27.74114990234375, "global_step": 629147, "epoch": 7580} {"train_loss": -27.696897506713867, "global_step": 629148, "epoch": 7580} {"train_loss": -27.810815811157227, "global_step": 629149, "epoch": 7580} {"train_loss": -26.951644897460938, "global_step": 629150, "epoch": 7580} {"train_loss": -26.311399459838867, "global_step": 629151, "epoch": 7580} {"train_loss": -25.216785430908203, "global_step": 629152, "epoch": 7580} {"train_loss": -25.216251373291016, "global_step": 629153, "epoch": 7580} {"train_loss": -27.997283935546875, "global_step": 629154, "epoch": 7580} {"train_loss": -26.288665771484375, "global_step": 629155, "epoch": 7580} {"train_loss": -27.6541690826416, "global_step": 629156, "epoch": 7580} {"train_loss": -26.83167839050293, "global_step": 629157, "epoch": 7580} {"train_loss": -28.117279052734375, "global_step": 629158, "epoch": 7580} {"train_loss": -27.181440353393555, "global_step": 629159, "epoch": 7580} {"train_loss": -27.207233428955078, "global_step": 629160, "epoch": 7580} {"train_loss": -27.890396118164062, "global_step": 629161, "epoch": 7580} {"train_loss": -27.516998291015625, "global_step": 629162, "epoch": 7580} {"train_loss": -27.587438583374023, "global_step": 629163, "epoch": 7580} {"train_loss": -27.8332462310791, "global_step": 629164, "epoch": 7580} {"train_loss": -27.697113037109375, "global_step": 629165, "epoch": 7580} {"train_loss": -27.40370750427246, "global_step": 629166, "epoch": 7580} {"train_loss": -27.76953125, "global_step": 629167, "epoch": 7580} {"train_loss": -28.1348819732666, "global_step": 629168, "epoch": 7580} {"train_loss": -27.475080490112305, "global_step": 629169, "epoch": 7580} {"train_loss": -27.52872657775879, "global_step": 629170, "epoch": 7580} {"train_loss": -27.956174850463867, "global_step": 629171, "epoch": 7580} {"train_loss": -27.739124298095703, "global_step": 629172, "epoch": 7580} {"train_loss": -27.915414810180664, "global_step": 629173, "epoch": 7580} {"train_loss": -27.75190544128418, "global_step": 629174, "epoch": 7580} {"train_loss": -27.993885040283203, "global_step": 629175, "epoch": 7580} {"train_loss": -27.461624145507812, "global_step": 629176, "epoch": 7580} {"train_loss": -27.75827980041504, "global_step": 629177, "epoch": 7580} {"train_loss": -27.77239990234375, "global_step": 629178, "epoch": 7580} {"train_loss": -27.666751861572266, "global_step": 629179, "epoch": 7580} {"train_loss": -27.864492416381836, "global_step": 629180, "epoch": 7580} {"train_loss": -27.727542877197266, "global_step": 629181, "epoch": 7580} {"train_loss": -27.98163414001465, "global_step": 629182, "epoch": 7580} {"train_loss": -28.08062744140625, "global_step": 629183, "epoch": 7580} {"train_loss": -28.29751968383789, "global_step": 629184, "epoch": 7580} {"train_loss": -27.724164962768555, "global_step": 629185, "epoch": 7580} {"train_loss": -28.235639572143555, "global_step": 629186, "epoch": 7580} {"train_loss": -28.25754737854004, "global_step": 629187, "epoch": 7580} {"train_loss": -28.174407958984375, "global_step": 629188, "epoch": 7580} {"train_loss": -27.966846466064453, "global_step": 629189, "epoch": 7580} {"train_loss": -28.107297897338867, "global_step": 629190, "epoch": 7580} {"train_loss": -28.132665634155273, "global_step": 629191, "epoch": 7580} {"train_loss": -28.042163848876953, "global_step": 629192, "epoch": 7580} {"train_loss": -27.8533992767334, "global_step": 629193, "epoch": 7580} {"train_loss": -28.377450942993164, "global_step": 629194, "epoch": 7580} {"train_loss": -28.24249267578125, "global_step": 629195, "epoch": 7580} {"train_loss": -28.42367935180664, "global_step": 629196, "epoch": 7580} {"train_loss": -28.543292999267578, "global_step": 629197, "epoch": 7580} {"train_loss": -27.8071231842041, "global_step": 629198, "epoch": 7580} {"train_loss": -28.326526641845703, "global_step": 629199, "epoch": 7580} {"train_loss": -28.358158111572266, "global_step": 629200, "epoch": 7580} {"train_loss": -28.32291030883789, "global_step": 629201, "epoch": 7580} {"train_loss": -28.472043991088867, "global_step": 629202, "epoch": 7580} {"train_loss": -28.1900577545166, "global_step": 629203, "epoch": 7580} {"train_loss": -28.39984130859375, "global_step": 629204, "epoch": 7580} {"train_loss": -28.405231475830078, "global_step": 629205, "epoch": 7580} {"train_loss": -27.96371841430664, "global_step": 629206, "epoch": 7580} {"train_loss": -27.93253517150879, "global_step": 629207, "epoch": 7580} {"train_loss": -27.575443267822266, "global_step": 629208, "epoch": 7580} {"train_loss": -27.2415714263916, "global_step": 629209, "epoch": 7580} {"train_loss": -26.362873077392578, "global_step": 629210, "epoch": 7580} {"train_loss": -25.273820877075195, "global_step": 629211, "epoch": 7580} {"train_loss": -26.038694381713867, "global_step": 629212, "epoch": 7580} {"train_loss": -27.719989776611328, "global_step": 629213, "epoch": 7580} {"train_loss": -27.495681762695312, "global_step": 629214, "epoch": 7580} {"train_loss": -27.873245239257812, "global_step": 629215, "epoch": 7580} {"train_loss": -27.462392807006836, "global_step": 629216, "epoch": 7580} {"train_loss": -27.472089767456055, "global_step": 629217, "epoch": 7580} {"train_loss": -27.336774826049805, "global_step": 629218, "epoch": 7580} {"train_loss": -27.686994552612305, "global_step": 629219, "epoch": 7580} {"train_loss": -27.588232040405273, "global_step": 629220, "epoch": 7580} {"train_loss": -27.615930557250977, "global_step": 629221, "epoch": 7580} {"train_loss": -27.68704531566206, "global_step": 629222, "epoch": 7580, "val_loss": 6723590.5} {"train_loss": -27.607086181640625, "global_step": 629223, "epoch": 7581} {"train_loss": -26.89729118347168, "global_step": 629224, "epoch": 7581} {"train_loss": -26.7258243560791, "global_step": 629225, "epoch": 7581} {"train_loss": -26.905744552612305, "global_step": 629226, "epoch": 7581} {"train_loss": -27.31694984436035, "global_step": 629227, "epoch": 7581} {"train_loss": -27.71027183532715, "global_step": 629228, "epoch": 7581} {"train_loss": -27.641870498657227, "global_step": 629229, "epoch": 7581} {"train_loss": -27.3885498046875, "global_step": 629230, "epoch": 7581} {"train_loss": -27.513696670532227, "global_step": 629231, "epoch": 7581} {"train_loss": -27.599567413330078, "global_step": 629232, "epoch": 7581} {"train_loss": -27.737781524658203, "global_step": 629233, "epoch": 7581} {"train_loss": -27.596891403198242, "global_step": 629234, "epoch": 7581} {"train_loss": -27.598590850830078, "global_step": 629235, "epoch": 7581} {"train_loss": -27.8793888092041, "global_step": 629236, "epoch": 7581} {"train_loss": -27.77106285095215, "global_step": 629237, "epoch": 7581} {"train_loss": -27.679285049438477, "global_step": 629238, "epoch": 7581} {"train_loss": -27.929401397705078, "global_step": 629239, "epoch": 7581} {"train_loss": -27.78474235534668, "global_step": 629240, "epoch": 7581} {"train_loss": -27.80653953552246, "global_step": 629241, "epoch": 7581} {"train_loss": -27.987796783447266, "global_step": 629242, "epoch": 7581} {"train_loss": -27.750341415405273, "global_step": 629243, "epoch": 7581} {"train_loss": -27.930814743041992, "global_step": 629244, "epoch": 7581} {"train_loss": -27.90240478515625, "global_step": 629245, "epoch": 7581} {"train_loss": -27.917560577392578, "global_step": 629246, "epoch": 7581} {"train_loss": -28.15022087097168, "global_step": 629247, "epoch": 7581} {"train_loss": -28.303739547729492, "global_step": 629248, "epoch": 7581} {"train_loss": -28.146509170532227, "global_step": 629249, "epoch": 7581} {"train_loss": -27.928674697875977, "global_step": 629250, "epoch": 7581} {"train_loss": -28.198596954345703, "global_step": 629251, "epoch": 7581} {"train_loss": -28.3497371673584, "global_step": 629252, "epoch": 7581} {"train_loss": -28.33440589904785, "global_step": 629253, "epoch": 7581} {"train_loss": -28.069110870361328, "global_step": 629254, "epoch": 7581} {"train_loss": -28.303760528564453, "global_step": 629255, "epoch": 7581} {"train_loss": -28.164798736572266, "global_step": 629256, "epoch": 7581} {"train_loss": -28.149036407470703, "global_step": 629257, "epoch": 7581} {"train_loss": -28.351186752319336, "global_step": 629258, "epoch": 7581} {"train_loss": -28.135421752929688, "global_step": 629259, "epoch": 7581} {"train_loss": -28.370161056518555, "global_step": 629260, "epoch": 7581} {"train_loss": -27.991418838500977, "global_step": 629261, "epoch": 7581} {"train_loss": -28.142990112304688, "global_step": 629262, "epoch": 7581} {"train_loss": -28.086471557617188, "global_step": 629263, "epoch": 7581} {"train_loss": -28.115453720092773, "global_step": 629264, "epoch": 7581} {"train_loss": -28.202756881713867, "global_step": 629265, "epoch": 7581} {"train_loss": -28.168920516967773, "global_step": 629266, "epoch": 7581} {"train_loss": -28.0732421875, "global_step": 629267, "epoch": 7581} {"train_loss": -28.19744300842285, "global_step": 629268, "epoch": 7581} {"train_loss": -28.358917236328125, "global_step": 629269, "epoch": 7581} {"train_loss": -28.400739669799805, "global_step": 629270, "epoch": 7581} {"train_loss": -28.660003662109375, "global_step": 629271, "epoch": 7581} {"train_loss": -28.417898178100586, "global_step": 629272, "epoch": 7581} {"train_loss": -28.239765167236328, "global_step": 629273, "epoch": 7581} {"train_loss": -28.267541885375977, "global_step": 629274, "epoch": 7581} {"train_loss": -28.2196102142334, "global_step": 629275, "epoch": 7581} {"train_loss": -28.301633834838867, "global_step": 629276, "epoch": 7581} {"train_loss": -28.17307472229004, "global_step": 629277, "epoch": 7581} {"train_loss": -28.1860408782959, "global_step": 629278, "epoch": 7581} {"train_loss": -28.512975692749023, "global_step": 629279, "epoch": 7581} {"train_loss": -28.154638290405273, "global_step": 629280, "epoch": 7581} {"train_loss": -28.053699493408203, "global_step": 629281, "epoch": 7581} {"train_loss": -27.51904296875, "global_step": 629282, "epoch": 7581} {"train_loss": -27.907440185546875, "global_step": 629283, "epoch": 7581} {"train_loss": -28.015634536743164, "global_step": 629284, "epoch": 7581} {"train_loss": -28.18598747253418, "global_step": 629285, "epoch": 7581} {"train_loss": -28.0015926361084, "global_step": 629286, "epoch": 7581} {"train_loss": -28.529041290283203, "global_step": 629287, "epoch": 7581} {"train_loss": -28.511877059936523, "global_step": 629288, "epoch": 7581} {"train_loss": -28.465490341186523, "global_step": 629289, "epoch": 7581} {"train_loss": -28.324176788330078, "global_step": 629290, "epoch": 7581} {"train_loss": -28.423315048217773, "global_step": 629291, "epoch": 7581} {"train_loss": -28.63788414001465, "global_step": 629292, "epoch": 7581} {"train_loss": -28.18243408203125, "global_step": 629293, "epoch": 7581} {"train_loss": -28.406843185424805, "global_step": 629294, "epoch": 7581} {"train_loss": -28.600812911987305, "global_step": 629295, "epoch": 7581} {"train_loss": -28.247297286987305, "global_step": 629296, "epoch": 7581} {"train_loss": -28.389423370361328, "global_step": 629297, "epoch": 7581} {"train_loss": -28.265668869018555, "global_step": 629298, "epoch": 7581} {"train_loss": -28.3664608001709, "global_step": 629299, "epoch": 7581} {"train_loss": -28.717554092407227, "global_step": 629300, "epoch": 7581} {"train_loss": -28.1569766998291, "global_step": 629301, "epoch": 7581} {"train_loss": -28.6712589263916, "global_step": 629302, "epoch": 7581} {"train_loss": -28.600711822509766, "global_step": 629303, "epoch": 7581} {"train_loss": -28.733612060546875, "global_step": 629304, "epoch": 7581} {"train_loss": -28.086678424513483, "global_step": 629305, "epoch": 7581, "val_loss": 6762174.0} {"train_loss": -27.5695743560791, "global_step": 629306, "epoch": 7582} {"train_loss": -27.98201560974121, "global_step": 629307, "epoch": 7582} {"train_loss": -27.978158950805664, "global_step": 629308, "epoch": 7582} {"train_loss": -27.809356689453125, "global_step": 629309, "epoch": 7582} {"train_loss": -27.704816818237305, "global_step": 629310, "epoch": 7582} {"train_loss": -27.864429473876953, "global_step": 629311, "epoch": 7582} {"train_loss": -27.86154556274414, "global_step": 629312, "epoch": 7582} {"train_loss": -27.89625358581543, "global_step": 629313, "epoch": 7582} {"train_loss": -28.019088745117188, "global_step": 629314, "epoch": 7582} {"train_loss": -27.963476181030273, "global_step": 629315, "epoch": 7582} {"train_loss": -27.97247886657715, "global_step": 629316, "epoch": 7582} {"train_loss": -28.192779541015625, "global_step": 629317, "epoch": 7582} {"train_loss": -28.09930992126465, "global_step": 629318, "epoch": 7582} {"train_loss": -27.970251083374023, "global_step": 629319, "epoch": 7582} {"train_loss": -28.10182762145996, "global_step": 629320, "epoch": 7582} {"train_loss": -28.028295516967773, "global_step": 629321, "epoch": 7582} {"train_loss": -27.996870040893555, "global_step": 629322, "epoch": 7582} {"train_loss": -28.0787410736084, "global_step": 629323, "epoch": 7582} {"train_loss": -28.361326217651367, "global_step": 629324, "epoch": 7582} {"train_loss": -28.52225685119629, "global_step": 629325, "epoch": 7582} {"train_loss": -27.74139404296875, "global_step": 629326, "epoch": 7582} {"train_loss": -28.199756622314453, "global_step": 629327, "epoch": 7582} {"train_loss": -28.292068481445312, "global_step": 629328, "epoch": 7582} {"train_loss": -27.998510360717773, "global_step": 629329, "epoch": 7582} {"train_loss": -28.079092025756836, "global_step": 629330, "epoch": 7582} {"train_loss": -28.34417724609375, "global_step": 629331, "epoch": 7582} {"train_loss": -28.203489303588867, "global_step": 629332, "epoch": 7582} {"train_loss": -27.480802536010742, "global_step": 629333, "epoch": 7582} {"train_loss": -27.45672607421875, "global_step": 629334, "epoch": 7582} {"train_loss": -27.922992706298828, "global_step": 629335, "epoch": 7582} {"train_loss": -27.920703887939453, "global_step": 629336, "epoch": 7582} {"train_loss": -28.01203727722168, "global_step": 629337, "epoch": 7582} {"train_loss": -28.127721786499023, "global_step": 629338, "epoch": 7582} {"train_loss": -27.802886962890625, "global_step": 629339, "epoch": 7582} {"train_loss": -28.0251407623291, "global_step": 629340, "epoch": 7582} {"train_loss": -27.607336044311523, "global_step": 629341, "epoch": 7582} {"train_loss": -27.736230850219727, "global_step": 629342, "epoch": 7582} {"train_loss": -28.359363555908203, "global_step": 629343, "epoch": 7582} {"train_loss": -27.901315689086914, "global_step": 629344, "epoch": 7582} {"train_loss": -28.189285278320312, "global_step": 629345, "epoch": 7582} {"train_loss": -27.87847900390625, "global_step": 629346, "epoch": 7582} {"train_loss": -28.162769317626953, "global_step": 629347, "epoch": 7582} {"train_loss": -28.241230010986328, "global_step": 629348, "epoch": 7582} {"train_loss": -27.918760299682617, "global_step": 629349, "epoch": 7582} {"train_loss": -28.025897979736328, "global_step": 629350, "epoch": 7582} {"train_loss": -28.475000381469727, "global_step": 629351, "epoch": 7582} {"train_loss": -28.330612182617188, "global_step": 629352, "epoch": 7582} {"train_loss": -28.37835121154785, "global_step": 629353, "epoch": 7582} {"train_loss": -28.657140731811523, "global_step": 629354, "epoch": 7582} {"train_loss": -28.13612174987793, "global_step": 629355, "epoch": 7582} {"train_loss": -27.958826065063477, "global_step": 629356, "epoch": 7582} {"train_loss": -28.250234603881836, "global_step": 629357, "epoch": 7582} {"train_loss": -28.476667404174805, "global_step": 629358, "epoch": 7582} {"train_loss": -28.142744064331055, "global_step": 629359, "epoch": 7582} {"train_loss": -28.263349533081055, "global_step": 629360, "epoch": 7582} {"train_loss": -28.291723251342773, "global_step": 629361, "epoch": 7582} {"train_loss": -28.421436309814453, "global_step": 629362, "epoch": 7582} {"train_loss": -28.379735946655273, "global_step": 629363, "epoch": 7582} {"train_loss": -28.753387451171875, "global_step": 629364, "epoch": 7582} {"train_loss": -28.465728759765625, "global_step": 629365, "epoch": 7582} {"train_loss": -28.781936645507812, "global_step": 629366, "epoch": 7582} {"train_loss": -28.602872848510742, "global_step": 629367, "epoch": 7582} {"train_loss": -28.582284927368164, "global_step": 629368, "epoch": 7582} {"train_loss": -28.28090476989746, "global_step": 629369, "epoch": 7582} {"train_loss": -28.485898971557617, "global_step": 629370, "epoch": 7582} {"train_loss": -28.136926651000977, "global_step": 629371, "epoch": 7582} {"train_loss": -28.313100814819336, "global_step": 629372, "epoch": 7582} {"train_loss": -28.326536178588867, "global_step": 629373, "epoch": 7582} {"train_loss": -28.43701171875, "global_step": 629374, "epoch": 7582} {"train_loss": -28.165266036987305, "global_step": 629375, "epoch": 7582} {"train_loss": -28.383377075195312, "global_step": 629376, "epoch": 7582} {"train_loss": -28.28309440612793, "global_step": 629377, "epoch": 7582} {"train_loss": -28.358182907104492, "global_step": 629378, "epoch": 7582} {"train_loss": -28.23117446899414, "global_step": 629379, "epoch": 7582} {"train_loss": -28.3942813873291, "global_step": 629380, "epoch": 7582} {"train_loss": -28.23664665222168, "global_step": 629381, "epoch": 7582} {"train_loss": -28.386831283569336, "global_step": 629382, "epoch": 7582} {"train_loss": -28.540130615234375, "global_step": 629383, "epoch": 7582} {"train_loss": -28.30975914001465, "global_step": 629384, "epoch": 7582} {"train_loss": -28.358591079711914, "global_step": 629385, "epoch": 7582} {"train_loss": -28.542139053344727, "global_step": 629386, "epoch": 7582} {"train_loss": -28.250940322875977, "global_step": 629387, "epoch": 7582} {"train_loss": -28.174969018223774, "global_step": 629388, "epoch": 7582, "val_loss": 6794068.0} {"train_loss": -27.868127822875977, "global_step": 629389, "epoch": 7583} {"train_loss": -27.821271896362305, "global_step": 629390, "epoch": 7583} {"train_loss": -27.99118995666504, "global_step": 629391, "epoch": 7583} {"train_loss": -27.85755729675293, "global_step": 629392, "epoch": 7583} {"train_loss": -28.0518856048584, "global_step": 629393, "epoch": 7583} {"train_loss": -28.082504272460938, "global_step": 629394, "epoch": 7583} {"train_loss": -28.417713165283203, "global_step": 629395, "epoch": 7583} {"train_loss": -28.073383331298828, "global_step": 629396, "epoch": 7583} {"train_loss": -27.918731689453125, "global_step": 629397, "epoch": 7583} {"train_loss": -27.53314208984375, "global_step": 629398, "epoch": 7583} {"train_loss": -27.71392250061035, "global_step": 629399, "epoch": 7583} {"train_loss": -27.780048370361328, "global_step": 629400, "epoch": 7583} {"train_loss": -27.967533111572266, "global_step": 629401, "epoch": 7583} {"train_loss": -28.16208267211914, "global_step": 629402, "epoch": 7583} {"train_loss": -28.237857818603516, "global_step": 629403, "epoch": 7583} {"train_loss": -28.2750244140625, "global_step": 629404, "epoch": 7583} {"train_loss": -28.3587589263916, "global_step": 629405, "epoch": 7583} {"train_loss": -27.748762130737305, "global_step": 629406, "epoch": 7583} {"train_loss": -28.314407348632812, "global_step": 629407, "epoch": 7583} {"train_loss": -28.181501388549805, "global_step": 629408, "epoch": 7583} {"train_loss": -28.210926055908203, "global_step": 629409, "epoch": 7583} {"train_loss": -28.094572067260742, "global_step": 629410, "epoch": 7583} {"train_loss": -28.4033260345459, "global_step": 629411, "epoch": 7583} {"train_loss": -28.4079532623291, "global_step": 629412, "epoch": 7583} {"train_loss": -28.25141716003418, "global_step": 629413, "epoch": 7583} {"train_loss": -28.240819931030273, "global_step": 629414, "epoch": 7583} {"train_loss": -28.206424713134766, "global_step": 629415, "epoch": 7583} {"train_loss": -28.657470703125, "global_step": 629416, "epoch": 7583} {"train_loss": -28.103870391845703, "global_step": 629417, "epoch": 7583} {"train_loss": -28.380722045898438, "global_step": 629418, "epoch": 7583} {"train_loss": -28.48749351501465, "global_step": 629419, "epoch": 7583} {"train_loss": -28.41937828063965, "global_step": 629420, "epoch": 7583} {"train_loss": -28.2896728515625, "global_step": 629421, "epoch": 7583} {"train_loss": -28.146459579467773, "global_step": 629422, "epoch": 7583} {"train_loss": -28.6079158782959, "global_step": 629423, "epoch": 7583} {"train_loss": -28.24390983581543, "global_step": 629424, "epoch": 7583} {"train_loss": -28.5494441986084, "global_step": 629425, "epoch": 7583} {"train_loss": -28.47509765625, "global_step": 629426, "epoch": 7583} {"train_loss": -28.328067779541016, "global_step": 629427, "epoch": 7583} {"train_loss": -28.4437313079834, "global_step": 629428, "epoch": 7583} {"train_loss": -27.993566513061523, "global_step": 629429, "epoch": 7583} {"train_loss": -28.234943389892578, "global_step": 629430, "epoch": 7583} {"train_loss": -28.275100708007812, "global_step": 629431, "epoch": 7583} {"train_loss": -28.109548568725586, "global_step": 629432, "epoch": 7583} {"train_loss": -28.69723892211914, "global_step": 629433, "epoch": 7583} {"train_loss": -28.385766983032227, "global_step": 629434, "epoch": 7583} {"train_loss": -28.219587326049805, "global_step": 629435, "epoch": 7583} {"train_loss": -27.54327964782715, "global_step": 629436, "epoch": 7583} {"train_loss": -27.629438400268555, "global_step": 629437, "epoch": 7583} {"train_loss": -27.413480758666992, "global_step": 629438, "epoch": 7583} {"train_loss": -27.506208419799805, "global_step": 629439, "epoch": 7583} {"train_loss": -28.039920806884766, "global_step": 629440, "epoch": 7583} {"train_loss": -28.039587020874023, "global_step": 629441, "epoch": 7583} {"train_loss": -28.252704620361328, "global_step": 629442, "epoch": 7583} {"train_loss": -28.312543869018555, "global_step": 629443, "epoch": 7583} {"train_loss": -28.096044540405273, "global_step": 629444, "epoch": 7583} {"train_loss": -28.10257339477539, "global_step": 629445, "epoch": 7583} {"train_loss": -27.9781551361084, "global_step": 629446, "epoch": 7583} {"train_loss": -28.4864444732666, "global_step": 629447, "epoch": 7583} {"train_loss": -28.374231338500977, "global_step": 629448, "epoch": 7583} {"train_loss": -28.239307403564453, "global_step": 629449, "epoch": 7583} {"train_loss": -28.189706802368164, "global_step": 629450, "epoch": 7583} {"train_loss": -27.985776901245117, "global_step": 629451, "epoch": 7583} {"train_loss": -28.054367065429688, "global_step": 629452, "epoch": 7583} {"train_loss": -28.327306747436523, "global_step": 629453, "epoch": 7583} {"train_loss": -28.120283126831055, "global_step": 629454, "epoch": 7583} {"train_loss": -28.5169677734375, "global_step": 629455, "epoch": 7583} {"train_loss": -28.546222686767578, "global_step": 629456, "epoch": 7583} {"train_loss": -28.188312530517578, "global_step": 629457, "epoch": 7583} {"train_loss": -28.259037017822266, "global_step": 629458, "epoch": 7583} {"train_loss": -28.19642448425293, "global_step": 629459, "epoch": 7583} {"train_loss": -28.350744247436523, "global_step": 629460, "epoch": 7583} {"train_loss": -27.666181564331055, "global_step": 629461, "epoch": 7583} {"train_loss": -28.2125244140625, "global_step": 629462, "epoch": 7583} {"train_loss": -28.348968505859375, "global_step": 629463, "epoch": 7583} {"train_loss": -27.859333038330078, "global_step": 629464, "epoch": 7583} {"train_loss": -27.989273071289062, "global_step": 629465, "epoch": 7583} {"train_loss": -27.91458511352539, "global_step": 629466, "epoch": 7583} {"train_loss": -27.897863388061523, "global_step": 629467, "epoch": 7583} {"train_loss": -28.185516357421875, "global_step": 629468, "epoch": 7583} {"train_loss": -27.99546241760254, "global_step": 629469, "epoch": 7583} {"train_loss": -28.371923446655273, "global_step": 629470, "epoch": 7583} {"train_loss": -28.146863592676368, "global_step": 629471, "epoch": 7583, "val_loss": 6770097.0} {"train_loss": -26.94232177734375, "global_step": 629472, "epoch": 7584} {"train_loss": -26.49220848083496, "global_step": 629473, "epoch": 7584} {"train_loss": -27.01960563659668, "global_step": 629474, "epoch": 7584} {"train_loss": -27.341278076171875, "global_step": 629475, "epoch": 7584} {"train_loss": -27.053394317626953, "global_step": 629476, "epoch": 7584} {"train_loss": -26.910675048828125, "global_step": 629477, "epoch": 7584} {"train_loss": -26.957117080688477, "global_step": 629478, "epoch": 7584} {"train_loss": -27.397602081298828, "global_step": 629479, "epoch": 7584} {"train_loss": -27.265241622924805, "global_step": 629480, "epoch": 7584} {"train_loss": -27.24787712097168, "global_step": 629481, "epoch": 7584} {"train_loss": -27.718496322631836, "global_step": 629482, "epoch": 7584} {"train_loss": -27.476627349853516, "global_step": 629483, "epoch": 7584} {"train_loss": -27.72889518737793, "global_step": 629484, "epoch": 7584} {"train_loss": -28.096471786499023, "global_step": 629485, "epoch": 7584} {"train_loss": -27.819610595703125, "global_step": 629486, "epoch": 7584} {"train_loss": -27.559595108032227, "global_step": 629487, "epoch": 7584} {"train_loss": -27.726415634155273, "global_step": 629488, "epoch": 7584} {"train_loss": -27.84437370300293, "global_step": 629489, "epoch": 7584} {"train_loss": -27.88471794128418, "global_step": 629490, "epoch": 7584} {"train_loss": -27.78911781311035, "global_step": 629491, "epoch": 7584} {"train_loss": -28.216657638549805, "global_step": 629492, "epoch": 7584} {"train_loss": -27.957006454467773, "global_step": 629493, "epoch": 7584} {"train_loss": -28.195295333862305, "global_step": 629494, "epoch": 7584} {"train_loss": -27.71351432800293, "global_step": 629495, "epoch": 7584} {"train_loss": -27.869293212890625, "global_step": 629496, "epoch": 7584} {"train_loss": -28.090835571289062, "global_step": 629497, "epoch": 7584} {"train_loss": -27.968189239501953, "global_step": 629498, "epoch": 7584} {"train_loss": -27.95806312561035, "global_step": 629499, "epoch": 7584} {"train_loss": -28.225576400756836, "global_step": 629500, "epoch": 7584} {"train_loss": -28.068145751953125, "global_step": 629501, "epoch": 7584} {"train_loss": -28.016403198242188, "global_step": 629502, "epoch": 7584} {"train_loss": -28.083173751831055, "global_step": 629503, "epoch": 7584} {"train_loss": -28.51080894470215, "global_step": 629504, "epoch": 7584} {"train_loss": -27.926727294921875, "global_step": 629505, "epoch": 7584} {"train_loss": -28.390735626220703, "global_step": 629506, "epoch": 7584} {"train_loss": -27.964078903198242, "global_step": 629507, "epoch": 7584} {"train_loss": -28.41021728515625, "global_step": 629508, "epoch": 7584} {"train_loss": -28.556716918945312, "global_step": 629509, "epoch": 7584} {"train_loss": -28.290342330932617, "global_step": 629510, "epoch": 7584} {"train_loss": -28.303308486938477, "global_step": 629511, "epoch": 7584} {"train_loss": -28.362812042236328, "global_step": 629512, "epoch": 7584} {"train_loss": -28.592008590698242, "global_step": 629513, "epoch": 7584} {"train_loss": -28.45258140563965, "global_step": 629514, "epoch": 7584} {"train_loss": -28.44362449645996, "global_step": 629515, "epoch": 7584} {"train_loss": -28.445432662963867, "global_step": 629516, "epoch": 7584} {"train_loss": -28.227197647094727, "global_step": 629517, "epoch": 7584} {"train_loss": -28.457868576049805, "global_step": 629518, "epoch": 7584} {"train_loss": -28.386844635009766, "global_step": 629519, "epoch": 7584} {"train_loss": -28.49786949157715, "global_step": 629520, "epoch": 7584} {"train_loss": -28.098560333251953, "global_step": 629521, "epoch": 7584} {"train_loss": -28.10101318359375, "global_step": 629522, "epoch": 7584} {"train_loss": -28.213178634643555, "global_step": 629523, "epoch": 7584} {"train_loss": -28.52975845336914, "global_step": 629524, "epoch": 7584} {"train_loss": -28.439599990844727, "global_step": 629525, "epoch": 7584} {"train_loss": -28.451459884643555, "global_step": 629526, "epoch": 7584} {"train_loss": -27.918689727783203, "global_step": 629527, "epoch": 7584} {"train_loss": -27.39449119567871, "global_step": 629528, "epoch": 7584} {"train_loss": -27.439029693603516, "global_step": 629529, "epoch": 7584} {"train_loss": -27.630722045898438, "global_step": 629530, "epoch": 7584} {"train_loss": -27.761411666870117, "global_step": 629531, "epoch": 7584} {"train_loss": -28.121387481689453, "global_step": 629532, "epoch": 7584} {"train_loss": -28.341678619384766, "global_step": 629533, "epoch": 7584} {"train_loss": -27.978952407836914, "global_step": 629534, "epoch": 7584} {"train_loss": -27.64801025390625, "global_step": 629535, "epoch": 7584} {"train_loss": -27.849145889282227, "global_step": 629536, "epoch": 7584} {"train_loss": -27.92941665649414, "global_step": 629537, "epoch": 7584} {"train_loss": -27.974781036376953, "global_step": 629538, "epoch": 7584} {"train_loss": -27.657958984375, "global_step": 629539, "epoch": 7584} {"train_loss": -28.107574462890625, "global_step": 629540, "epoch": 7584} {"train_loss": -27.898624420166016, "global_step": 629541, "epoch": 7584} {"train_loss": -27.736310958862305, "global_step": 629542, "epoch": 7584} {"train_loss": -27.88775634765625, "global_step": 629543, "epoch": 7584} {"train_loss": -28.129011154174805, "global_step": 629544, "epoch": 7584} {"train_loss": -28.040067672729492, "global_step": 629545, "epoch": 7584} {"train_loss": -28.13643455505371, "global_step": 629546, "epoch": 7584} {"train_loss": -27.99628257751465, "global_step": 629547, "epoch": 7584} {"train_loss": -27.493350982666016, "global_step": 629548, "epoch": 7584} {"train_loss": -27.442581176757812, "global_step": 629549, "epoch": 7584} {"train_loss": -26.83985710144043, "global_step": 629550, "epoch": 7584} {"train_loss": -28.0406436920166, "global_step": 629551, "epoch": 7584} {"train_loss": -28.0169677734375, "global_step": 629552, "epoch": 7584} {"train_loss": -28.039722442626953, "global_step": 629553, "epoch": 7584} {"train_loss": -27.902356021375542, "global_step": 629554, "epoch": 7584, "val_loss": 6792930.0} {"train_loss": -27.018110275268555, "global_step": 629555, "epoch": 7585} {"train_loss": -26.91926383972168, "global_step": 629556, "epoch": 7585} {"train_loss": -27.480756759643555, "global_step": 629557, "epoch": 7585} {"train_loss": -26.951078414916992, "global_step": 629558, "epoch": 7585} {"train_loss": -27.227630615234375, "global_step": 629559, "epoch": 7585} {"train_loss": -27.104467391967773, "global_step": 629560, "epoch": 7585} {"train_loss": -27.589895248413086, "global_step": 629561, "epoch": 7585} {"train_loss": -27.33465576171875, "global_step": 629562, "epoch": 7585} {"train_loss": -27.47509765625, "global_step": 629563, "epoch": 7585} {"train_loss": -27.601720809936523, "global_step": 629564, "epoch": 7585} {"train_loss": -27.39822769165039, "global_step": 629565, "epoch": 7585} {"train_loss": -27.41636085510254, "global_step": 629566, "epoch": 7585} {"train_loss": -28.022016525268555, "global_step": 629567, "epoch": 7585} {"train_loss": -27.9746036529541, "global_step": 629568, "epoch": 7585} {"train_loss": -27.707365036010742, "global_step": 629569, "epoch": 7585} {"train_loss": -28.065780639648438, "global_step": 629570, "epoch": 7585} {"train_loss": -27.730316162109375, "global_step": 629571, "epoch": 7585} {"train_loss": -28.114398956298828, "global_step": 629572, "epoch": 7585} {"train_loss": -28.185546875, "global_step": 629573, "epoch": 7585} {"train_loss": -27.729888916015625, "global_step": 629574, "epoch": 7585} {"train_loss": -28.199127197265625, "global_step": 629575, "epoch": 7585} {"train_loss": -27.693634033203125, "global_step": 629576, "epoch": 7585} {"train_loss": -28.2218074798584, "global_step": 629577, "epoch": 7585} {"train_loss": -28.033954620361328, "global_step": 629578, "epoch": 7585} {"train_loss": -28.053781509399414, "global_step": 629579, "epoch": 7585} {"train_loss": -27.73463249206543, "global_step": 629580, "epoch": 7585} {"train_loss": -28.09323501586914, "global_step": 629581, "epoch": 7585} {"train_loss": -28.147008895874023, "global_step": 629582, "epoch": 7585} {"train_loss": -28.29691505432129, "global_step": 629583, "epoch": 7585} {"train_loss": -28.297513961791992, "global_step": 629584, "epoch": 7585} {"train_loss": -28.360212326049805, "global_step": 629585, "epoch": 7585} {"train_loss": -28.288196563720703, "global_step": 629586, "epoch": 7585} {"train_loss": -28.210468292236328, "global_step": 629587, "epoch": 7585} {"train_loss": -28.4746150970459, "global_step": 629588, "epoch": 7585} {"train_loss": -28.253189086914062, "global_step": 629589, "epoch": 7585} {"train_loss": -28.447696685791016, "global_step": 629590, "epoch": 7585} {"train_loss": -28.444244384765625, "global_step": 629591, "epoch": 7585} {"train_loss": -28.50986671447754, "global_step": 629592, "epoch": 7585} {"train_loss": -28.43121337890625, "global_step": 629593, "epoch": 7585} {"train_loss": -28.05889320373535, "global_step": 629594, "epoch": 7585} {"train_loss": -28.384937286376953, "global_step": 629595, "epoch": 7585} {"train_loss": -28.25568962097168, "global_step": 629596, "epoch": 7585} {"train_loss": -28.517704010009766, "global_step": 629597, "epoch": 7585} {"train_loss": -28.579137802124023, "global_step": 629598, "epoch": 7585} {"train_loss": -27.97916030883789, "global_step": 629599, "epoch": 7585} {"train_loss": -28.458349227905273, "global_step": 629600, "epoch": 7585} {"train_loss": -28.282855987548828, "global_step": 629601, "epoch": 7585} {"train_loss": -27.99847984313965, "global_step": 629602, "epoch": 7585} {"train_loss": -27.881315231323242, "global_step": 629603, "epoch": 7585} {"train_loss": -28.389623641967773, "global_step": 629604, "epoch": 7585} {"train_loss": -28.1361141204834, "global_step": 629605, "epoch": 7585} {"train_loss": -28.043598175048828, "global_step": 629606, "epoch": 7585} {"train_loss": -28.100534439086914, "global_step": 629607, "epoch": 7585} {"train_loss": -28.120773315429688, "global_step": 629608, "epoch": 7585} {"train_loss": -28.142826080322266, "global_step": 629609, "epoch": 7585} {"train_loss": -28.566495895385742, "global_step": 629610, "epoch": 7585} {"train_loss": -28.27668571472168, "global_step": 629611, "epoch": 7585} {"train_loss": -28.220264434814453, "global_step": 629612, "epoch": 7585} {"train_loss": -28.23504066467285, "global_step": 629613, "epoch": 7585} {"train_loss": -28.209264755249023, "global_step": 629614, "epoch": 7585} {"train_loss": -28.3591251373291, "global_step": 629615, "epoch": 7585} {"train_loss": -28.522781372070312, "global_step": 629616, "epoch": 7585} {"train_loss": -28.401594161987305, "global_step": 629617, "epoch": 7585} {"train_loss": -28.364408493041992, "global_step": 629618, "epoch": 7585} {"train_loss": -28.644397735595703, "global_step": 629619, "epoch": 7585} {"train_loss": -27.957504272460938, "global_step": 629620, "epoch": 7585} {"train_loss": -28.532093048095703, "global_step": 629621, "epoch": 7585} {"train_loss": -28.382963180541992, "global_step": 629622, "epoch": 7585} {"train_loss": -28.641992568969727, "global_step": 629623, "epoch": 7585} {"train_loss": -27.99688148498535, "global_step": 629624, "epoch": 7585} {"train_loss": -28.116769790649414, "global_step": 629625, "epoch": 7585} {"train_loss": -28.679914474487305, "global_step": 629626, "epoch": 7585} {"train_loss": -28.277606964111328, "global_step": 629627, "epoch": 7585} {"train_loss": -28.44654655456543, "global_step": 629628, "epoch": 7585} {"train_loss": -28.538236618041992, "global_step": 629629, "epoch": 7585} {"train_loss": -28.038898468017578, "global_step": 629630, "epoch": 7585} {"train_loss": -28.08200454711914, "global_step": 629631, "epoch": 7585} {"train_loss": -28.491849899291992, "global_step": 629632, "epoch": 7585} {"train_loss": -28.319555282592773, "global_step": 629633, "epoch": 7585} {"train_loss": -28.150650024414062, "global_step": 629634, "epoch": 7585} {"train_loss": -28.270782470703125, "global_step": 629635, "epoch": 7585} {"train_loss": -28.03687858581543, "global_step": 629636, "epoch": 7585} {"train_loss": -28.086859048131, "global_step": 629637, "epoch": 7585, "val_loss": 6768437.0} {"train_loss": -26.39442253112793, "global_step": 629638, "epoch": 7586} {"train_loss": -26.784650802612305, "global_step": 629639, "epoch": 7586} {"train_loss": -27.4426326751709, "global_step": 629640, "epoch": 7586} {"train_loss": -27.18328857421875, "global_step": 629641, "epoch": 7586} {"train_loss": -26.781274795532227, "global_step": 629642, "epoch": 7586} {"train_loss": -27.160907745361328, "global_step": 629643, "epoch": 7586} {"train_loss": -27.15119743347168, "global_step": 629644, "epoch": 7586} {"train_loss": -27.25394630432129, "global_step": 629645, "epoch": 7586} {"train_loss": -27.36249351501465, "global_step": 629646, "epoch": 7586} {"train_loss": -27.514530181884766, "global_step": 629647, "epoch": 7586} {"train_loss": -27.8530216217041, "global_step": 629648, "epoch": 7586} {"train_loss": -27.585742950439453, "global_step": 629649, "epoch": 7586} {"train_loss": -27.769338607788086, "global_step": 629650, "epoch": 7586} {"train_loss": -27.630895614624023, "global_step": 629651, "epoch": 7586} {"train_loss": -28.072528839111328, "global_step": 629652, "epoch": 7586} {"train_loss": -27.4920711517334, "global_step": 629653, "epoch": 7586} {"train_loss": -27.58319664001465, "global_step": 629654, "epoch": 7586} {"train_loss": -27.553503036499023, "global_step": 629655, "epoch": 7586} {"train_loss": -27.549875259399414, "global_step": 629656, "epoch": 7586} {"train_loss": -27.87701988220215, "global_step": 629657, "epoch": 7586} {"train_loss": -27.837888717651367, "global_step": 629658, "epoch": 7586} {"train_loss": -27.904882431030273, "global_step": 629659, "epoch": 7586} {"train_loss": -27.853483200073242, "global_step": 629660, "epoch": 7586} {"train_loss": -27.4822940826416, "global_step": 629661, "epoch": 7586} {"train_loss": -27.90726089477539, "global_step": 629662, "epoch": 7586} {"train_loss": -27.8531436920166, "global_step": 629663, "epoch": 7586} {"train_loss": -27.735370635986328, "global_step": 629664, "epoch": 7586} {"train_loss": -28.049463272094727, "global_step": 629665, "epoch": 7586} {"train_loss": -28.146875381469727, "global_step": 629666, "epoch": 7586} {"train_loss": -28.17829704284668, "global_step": 629667, "epoch": 7586} {"train_loss": -28.215917587280273, "global_step": 629668, "epoch": 7586} {"train_loss": -28.193912506103516, "global_step": 629669, "epoch": 7586} {"train_loss": -28.1783504486084, "global_step": 629670, "epoch": 7586} {"train_loss": -28.307266235351562, "global_step": 629671, "epoch": 7586} {"train_loss": -28.0888729095459, "global_step": 629672, "epoch": 7586} {"train_loss": -28.512317657470703, "global_step": 629673, "epoch": 7586} {"train_loss": -28.07503318786621, "global_step": 629674, "epoch": 7586} {"train_loss": -28.041242599487305, "global_step": 629675, "epoch": 7586} {"train_loss": -28.38361930847168, "global_step": 629676, "epoch": 7586} {"train_loss": -28.290647506713867, "global_step": 629677, "epoch": 7586} {"train_loss": -28.570775985717773, "global_step": 629678, "epoch": 7586} {"train_loss": -28.16107177734375, "global_step": 629679, "epoch": 7586} {"train_loss": -27.90012550354004, "global_step": 629680, "epoch": 7586} {"train_loss": -28.149932861328125, "global_step": 629681, "epoch": 7586} {"train_loss": -28.390338897705078, "global_step": 629682, "epoch": 7586} {"train_loss": -28.751218795776367, "global_step": 629683, "epoch": 7586} {"train_loss": -28.166717529296875, "global_step": 629684, "epoch": 7586} {"train_loss": -28.3182430267334, "global_step": 629685, "epoch": 7586} {"train_loss": -28.101526260375977, "global_step": 629686, "epoch": 7586} {"train_loss": -28.581832885742188, "global_step": 629687, "epoch": 7586} {"train_loss": -28.48280906677246, "global_step": 629688, "epoch": 7586} {"train_loss": -28.76079750061035, "global_step": 629689, "epoch": 7586} {"train_loss": -28.4580020904541, "global_step": 629690, "epoch": 7586} {"train_loss": -28.445592880249023, "global_step": 629691, "epoch": 7586} {"train_loss": -28.303003311157227, "global_step": 629692, "epoch": 7586} {"train_loss": -28.759353637695312, "global_step": 629693, "epoch": 7586} {"train_loss": -28.156635284423828, "global_step": 629694, "epoch": 7586} {"train_loss": -28.237812042236328, "global_step": 629695, "epoch": 7586} {"train_loss": -28.663639068603516, "global_step": 629696, "epoch": 7586} {"train_loss": -28.403778076171875, "global_step": 629697, "epoch": 7586} {"train_loss": -28.617511749267578, "global_step": 629698, "epoch": 7586} {"train_loss": -28.0862979888916, "global_step": 629699, "epoch": 7586} {"train_loss": -28.302831649780273, "global_step": 629700, "epoch": 7586} {"train_loss": -28.472278594970703, "global_step": 629701, "epoch": 7586} {"train_loss": -28.444665908813477, "global_step": 629702, "epoch": 7586} {"train_loss": -28.682886123657227, "global_step": 629703, "epoch": 7586} {"train_loss": -28.344663619995117, "global_step": 629704, "epoch": 7586} {"train_loss": -28.29329490661621, "global_step": 629705, "epoch": 7586} {"train_loss": -28.58294105529785, "global_step": 629706, "epoch": 7586} {"train_loss": -27.871917724609375, "global_step": 629707, "epoch": 7586} {"train_loss": -28.55035972595215, "global_step": 629708, "epoch": 7586} {"train_loss": -28.069538116455078, "global_step": 629709, "epoch": 7586} {"train_loss": -27.834196090698242, "global_step": 629710, "epoch": 7586} {"train_loss": -26.857526779174805, "global_step": 629711, "epoch": 7586} {"train_loss": -26.346820831298828, "global_step": 629712, "epoch": 7586} {"train_loss": -27.67498779296875, "global_step": 629713, "epoch": 7586} {"train_loss": -27.311872482299805, "global_step": 629714, "epoch": 7586} {"train_loss": -27.03773307800293, "global_step": 629715, "epoch": 7586} {"train_loss": -27.90448570251465, "global_step": 629716, "epoch": 7586} {"train_loss": -27.6522159576416, "global_step": 629717, "epoch": 7586} {"train_loss": -27.38633155822754, "global_step": 629718, "epoch": 7586} {"train_loss": -27.73703956604004, "global_step": 629719, "epoch": 7586} {"train_loss": -27.933944633208124, "global_step": 629720, "epoch": 7586, "val_loss": 6694308.0} {"train_loss": -25.813831329345703, "global_step": 629721, "epoch": 7587} {"train_loss": -26.02443504333496, "global_step": 629722, "epoch": 7587} {"train_loss": -26.53244400024414, "global_step": 629723, "epoch": 7587} {"train_loss": -27.8106632232666, "global_step": 629724, "epoch": 7587} {"train_loss": -26.36602210998535, "global_step": 629725, "epoch": 7587} {"train_loss": -27.12965965270996, "global_step": 629726, "epoch": 7587} {"train_loss": -26.500625610351562, "global_step": 629727, "epoch": 7587} {"train_loss": -27.034631729125977, "global_step": 629728, "epoch": 7587} {"train_loss": -26.7850284576416, "global_step": 629729, "epoch": 7587} {"train_loss": -27.605749130249023, "global_step": 629730, "epoch": 7587} {"train_loss": -27.45281410217285, "global_step": 629731, "epoch": 7587} {"train_loss": -27.46522331237793, "global_step": 629732, "epoch": 7587} {"train_loss": -27.262622833251953, "global_step": 629733, "epoch": 7587} {"train_loss": -27.774709701538086, "global_step": 629734, "epoch": 7587} {"train_loss": -27.449542999267578, "global_step": 629735, "epoch": 7587} {"train_loss": -27.122344970703125, "global_step": 629736, "epoch": 7587} {"train_loss": -27.533374786376953, "global_step": 629737, "epoch": 7587} {"train_loss": -27.8914852142334, "global_step": 629738, "epoch": 7587} {"train_loss": -27.714475631713867, "global_step": 629739, "epoch": 7587} {"train_loss": -27.631322860717773, "global_step": 629740, "epoch": 7587} {"train_loss": -27.68448257446289, "global_step": 629741, "epoch": 7587} {"train_loss": -27.983524322509766, "global_step": 629742, "epoch": 7587} {"train_loss": -27.74491310119629, "global_step": 629743, "epoch": 7587} {"train_loss": -27.780187606811523, "global_step": 629744, "epoch": 7587} {"train_loss": -27.72137451171875, "global_step": 629745, "epoch": 7587} {"train_loss": -27.66534423828125, "global_step": 629746, "epoch": 7587} {"train_loss": -28.10927391052246, "global_step": 629747, "epoch": 7587} {"train_loss": -27.724349975585938, "global_step": 629748, "epoch": 7587} {"train_loss": -28.17597007751465, "global_step": 629749, "epoch": 7587} {"train_loss": -28.191740036010742, "global_step": 629750, "epoch": 7587} {"train_loss": -28.294769287109375, "global_step": 629751, "epoch": 7587} {"train_loss": -28.119714736938477, "global_step": 629752, "epoch": 7587} {"train_loss": -27.830556869506836, "global_step": 629753, "epoch": 7587} {"train_loss": -28.43796157836914, "global_step": 629754, "epoch": 7587} {"train_loss": -28.234060287475586, "global_step": 629755, "epoch": 7587} {"train_loss": -28.11163330078125, "global_step": 629756, "epoch": 7587} {"train_loss": -28.321683883666992, "global_step": 629757, "epoch": 7587} {"train_loss": -28.201826095581055, "global_step": 629758, "epoch": 7587} {"train_loss": -28.34624671936035, "global_step": 629759, "epoch": 7587} {"train_loss": -28.463842391967773, "global_step": 629760, "epoch": 7587} {"train_loss": -28.221637725830078, "global_step": 629761, "epoch": 7587} {"train_loss": -28.51641845703125, "global_step": 629762, "epoch": 7587} {"train_loss": -28.387115478515625, "global_step": 629763, "epoch": 7587} {"train_loss": -28.473358154296875, "global_step": 629764, "epoch": 7587} {"train_loss": -28.1566104888916, "global_step": 629765, "epoch": 7587} {"train_loss": -28.301746368408203, "global_step": 629766, "epoch": 7587} {"train_loss": -28.0499210357666, "global_step": 629767, "epoch": 7587} {"train_loss": -28.298492431640625, "global_step": 629768, "epoch": 7587} {"train_loss": -28.363311767578125, "global_step": 629769, "epoch": 7587} {"train_loss": -28.269535064697266, "global_step": 629770, "epoch": 7587} {"train_loss": -28.322057723999023, "global_step": 629771, "epoch": 7587} {"train_loss": -28.766281127929688, "global_step": 629772, "epoch": 7587} {"train_loss": -28.834775924682617, "global_step": 629773, "epoch": 7587} {"train_loss": -28.18489646911621, "global_step": 629774, "epoch": 7587} {"train_loss": -28.39664649963379, "global_step": 629775, "epoch": 7587} {"train_loss": -28.270553588867188, "global_step": 629776, "epoch": 7587} {"train_loss": -28.134174346923828, "global_step": 629777, "epoch": 7587} {"train_loss": -28.514245986938477, "global_step": 629778, "epoch": 7587} {"train_loss": -28.231414794921875, "global_step": 629779, "epoch": 7587} {"train_loss": -28.394378662109375, "global_step": 629780, "epoch": 7587} {"train_loss": -28.0338077545166, "global_step": 629781, "epoch": 7587} {"train_loss": -28.246423721313477, "global_step": 629782, "epoch": 7587} {"train_loss": -28.434207916259766, "global_step": 629783, "epoch": 7587} {"train_loss": -28.450002670288086, "global_step": 629784, "epoch": 7587} {"train_loss": -28.69813346862793, "global_step": 629785, "epoch": 7587} {"train_loss": -28.203842163085938, "global_step": 629786, "epoch": 7587} {"train_loss": -28.347448348999023, "global_step": 629787, "epoch": 7587} {"train_loss": -28.430694580078125, "global_step": 629788, "epoch": 7587} {"train_loss": -28.1156005859375, "global_step": 629789, "epoch": 7587} {"train_loss": -27.98834800720215, "global_step": 629790, "epoch": 7587} {"train_loss": -27.85292625427246, "global_step": 629791, "epoch": 7587} {"train_loss": -28.03008460998535, "global_step": 629792, "epoch": 7587} {"train_loss": -27.974313735961914, "global_step": 629793, "epoch": 7587} {"train_loss": -28.497161865234375, "global_step": 629794, "epoch": 7587} {"train_loss": -28.424213409423828, "global_step": 629795, "epoch": 7587} {"train_loss": -28.1641902923584, "global_step": 629796, "epoch": 7587} {"train_loss": -28.2268123626709, "global_step": 629797, "epoch": 7587} {"train_loss": -28.200952529907227, "global_step": 629798, "epoch": 7587} {"train_loss": -28.21542739868164, "global_step": 629799, "epoch": 7587} {"train_loss": -28.285837173461914, "global_step": 629800, "epoch": 7587} {"train_loss": -28.46539306640625, "global_step": 629801, "epoch": 7587} {"train_loss": -28.50836753845215, "global_step": 629802, "epoch": 7587} {"train_loss": -27.97045778940959, "global_step": 629803, "epoch": 7587, "val_loss": 6863598.0} {"train_loss": -27.845977783203125, "global_step": 629804, "epoch": 7588} {"train_loss": -27.721662521362305, "global_step": 629805, "epoch": 7588} {"train_loss": -27.66499900817871, "global_step": 629806, "epoch": 7588} {"train_loss": -27.730316162109375, "global_step": 629807, "epoch": 7588} {"train_loss": -27.62078285217285, "global_step": 629808, "epoch": 7588} {"train_loss": -27.899511337280273, "global_step": 629809, "epoch": 7588} {"train_loss": -27.523284912109375, "global_step": 629810, "epoch": 7588} {"train_loss": -27.86187744140625, "global_step": 629811, "epoch": 7588} {"train_loss": -27.448755264282227, "global_step": 629812, "epoch": 7588} {"train_loss": -27.860870361328125, "global_step": 629813, "epoch": 7588} {"train_loss": -27.693740844726562, "global_step": 629814, "epoch": 7588} {"train_loss": -27.920400619506836, "global_step": 629815, "epoch": 7588} {"train_loss": -27.77247428894043, "global_step": 629816, "epoch": 7588} {"train_loss": -27.864301681518555, "global_step": 629817, "epoch": 7588} {"train_loss": -28.12421989440918, "global_step": 629818, "epoch": 7588} {"train_loss": -27.848388671875, "global_step": 629819, "epoch": 7588} {"train_loss": -27.929813385009766, "global_step": 629820, "epoch": 7588} {"train_loss": -27.782434463500977, "global_step": 629821, "epoch": 7588} {"train_loss": -27.92146873474121, "global_step": 629822, "epoch": 7588} {"train_loss": -28.2733154296875, "global_step": 629823, "epoch": 7588} {"train_loss": -28.37592124938965, "global_step": 629824, "epoch": 7588} {"train_loss": -27.95819664001465, "global_step": 629825, "epoch": 7588} {"train_loss": -28.2340030670166, "global_step": 629826, "epoch": 7588} {"train_loss": -28.175756454467773, "global_step": 629827, "epoch": 7588} {"train_loss": -28.27508544921875, "global_step": 629828, "epoch": 7588} {"train_loss": -28.190393447875977, "global_step": 629829, "epoch": 7588} {"train_loss": -28.454248428344727, "global_step": 629830, "epoch": 7588} {"train_loss": -28.23236656188965, "global_step": 629831, "epoch": 7588} {"train_loss": -28.01607322692871, "global_step": 629832, "epoch": 7588} {"train_loss": -28.07724952697754, "global_step": 629833, "epoch": 7588} {"train_loss": -28.322839736938477, "global_step": 629834, "epoch": 7588} {"train_loss": -28.081640243530273, "global_step": 629835, "epoch": 7588} {"train_loss": -28.234907150268555, "global_step": 629836, "epoch": 7588} {"train_loss": -28.066797256469727, "global_step": 629837, "epoch": 7588} {"train_loss": -28.335254669189453, "global_step": 629838, "epoch": 7588} {"train_loss": -28.513952255249023, "global_step": 629839, "epoch": 7588} {"train_loss": -28.34505271911621, "global_step": 629840, "epoch": 7588} {"train_loss": -28.157474517822266, "global_step": 629841, "epoch": 7588} {"train_loss": -27.97979164123535, "global_step": 629842, "epoch": 7588} {"train_loss": -28.2742919921875, "global_step": 629843, "epoch": 7588} {"train_loss": -28.512540817260742, "global_step": 629844, "epoch": 7588} {"train_loss": -27.99139404296875, "global_step": 629845, "epoch": 7588} {"train_loss": -28.21051025390625, "global_step": 629846, "epoch": 7588} {"train_loss": -28.462080001831055, "global_step": 629847, "epoch": 7588} {"train_loss": -28.263654708862305, "global_step": 629848, "epoch": 7588} {"train_loss": -28.09014892578125, "global_step": 629849, "epoch": 7588} {"train_loss": -28.609540939331055, "global_step": 629850, "epoch": 7588} {"train_loss": -27.96982192993164, "global_step": 629851, "epoch": 7588} {"train_loss": -28.385913848876953, "global_step": 629852, "epoch": 7588} {"train_loss": -28.39789390563965, "global_step": 629853, "epoch": 7588} {"train_loss": -28.065214157104492, "global_step": 629854, "epoch": 7588} {"train_loss": -28.867252349853516, "global_step": 629855, "epoch": 7588} {"train_loss": -28.578521728515625, "global_step": 629856, "epoch": 7588} {"train_loss": -28.371368408203125, "global_step": 629857, "epoch": 7588} {"train_loss": -28.469532012939453, "global_step": 629858, "epoch": 7588} {"train_loss": -28.32867431640625, "global_step": 629859, "epoch": 7588} {"train_loss": -28.47113037109375, "global_step": 629860, "epoch": 7588} {"train_loss": -28.43295669555664, "global_step": 629861, "epoch": 7588} {"train_loss": -28.275373458862305, "global_step": 629862, "epoch": 7588} {"train_loss": -28.093158721923828, "global_step": 629863, "epoch": 7588} {"train_loss": -28.190393447875977, "global_step": 629864, "epoch": 7588} {"train_loss": -28.405359268188477, "global_step": 629865, "epoch": 7588} {"train_loss": -28.716297149658203, "global_step": 629866, "epoch": 7588} {"train_loss": -28.292280197143555, "global_step": 629867, "epoch": 7588} {"train_loss": -28.37091064453125, "global_step": 629868, "epoch": 7588} {"train_loss": -28.421432495117188, "global_step": 629869, "epoch": 7588} {"train_loss": -27.884626388549805, "global_step": 629870, "epoch": 7588} {"train_loss": -27.285974502563477, "global_step": 629871, "epoch": 7588} {"train_loss": -26.665576934814453, "global_step": 629872, "epoch": 7588} {"train_loss": -26.633337020874023, "global_step": 629873, "epoch": 7588} {"train_loss": -28.12009620666504, "global_step": 629874, "epoch": 7588} {"train_loss": -28.096586227416992, "global_step": 629875, "epoch": 7588} {"train_loss": -27.153091430664062, "global_step": 629876, "epoch": 7588} {"train_loss": -27.707029342651367, "global_step": 629877, "epoch": 7588} {"train_loss": -27.968503952026367, "global_step": 629878, "epoch": 7588} {"train_loss": -27.09272575378418, "global_step": 629879, "epoch": 7588} {"train_loss": -27.8945255279541, "global_step": 629880, "epoch": 7588} {"train_loss": -27.89363670349121, "global_step": 629881, "epoch": 7588} {"train_loss": -28.152917861938477, "global_step": 629882, "epoch": 7588} {"train_loss": -27.88701820373535, "global_step": 629883, "epoch": 7588} {"train_loss": -27.912702560424805, "global_step": 629884, "epoch": 7588} {"train_loss": -28.095474243164062, "global_step": 629885, "epoch": 7588} {"train_loss": -28.040427472217974, "global_step": 629886, "epoch": 7588, "val_loss": 6831066.0} {"train_loss": -27.057270050048828, "global_step": 629887, "epoch": 7589} {"train_loss": -26.782968521118164, "global_step": 629888, "epoch": 7589} {"train_loss": -27.330890655517578, "global_step": 629889, "epoch": 7589} {"train_loss": -27.12944984436035, "global_step": 629890, "epoch": 7589} {"train_loss": -27.217926025390625, "global_step": 629891, "epoch": 7589} {"train_loss": -27.235671997070312, "global_step": 629892, "epoch": 7589} {"train_loss": -27.423009872436523, "global_step": 629893, "epoch": 7589} {"train_loss": -27.9755916595459, "global_step": 629894, "epoch": 7589} {"train_loss": -27.451507568359375, "global_step": 629895, "epoch": 7589} {"train_loss": -27.639245986938477, "global_step": 629896, "epoch": 7589} {"train_loss": -27.7912540435791, "global_step": 629897, "epoch": 7589} {"train_loss": -27.538928985595703, "global_step": 629898, "epoch": 7589} {"train_loss": -28.024824142456055, "global_step": 629899, "epoch": 7589} {"train_loss": -27.462961196899414, "global_step": 629900, "epoch": 7589} {"train_loss": -27.98862648010254, "global_step": 629901, "epoch": 7589} {"train_loss": -27.764814376831055, "global_step": 629902, "epoch": 7589} {"train_loss": -27.565704345703125, "global_step": 629903, "epoch": 7589} {"train_loss": -27.997425079345703, "global_step": 629904, "epoch": 7589} {"train_loss": -27.8880672454834, "global_step": 629905, "epoch": 7589} {"train_loss": -27.8138484954834, "global_step": 629906, "epoch": 7589} {"train_loss": -27.887847900390625, "global_step": 629907, "epoch": 7589} {"train_loss": -27.75425148010254, "global_step": 629908, "epoch": 7589} {"train_loss": -28.134326934814453, "global_step": 629909, "epoch": 7589} {"train_loss": -28.31003761291504, "global_step": 629910, "epoch": 7589} {"train_loss": -27.801862716674805, "global_step": 629911, "epoch": 7589} {"train_loss": -28.223745346069336, "global_step": 629912, "epoch": 7589} {"train_loss": -28.105966567993164, "global_step": 629913, "epoch": 7589} {"train_loss": -28.500120162963867, "global_step": 629914, "epoch": 7589} {"train_loss": -28.113525390625, "global_step": 629915, "epoch": 7589} {"train_loss": -28.280149459838867, "global_step": 629916, "epoch": 7589} {"train_loss": -28.4328670501709, "global_step": 629917, "epoch": 7589} {"train_loss": -28.358850479125977, "global_step": 629918, "epoch": 7589} {"train_loss": -28.37921142578125, "global_step": 629919, "epoch": 7589} {"train_loss": -28.26177406311035, "global_step": 629920, "epoch": 7589} {"train_loss": -28.277685165405273, "global_step": 629921, "epoch": 7589} {"train_loss": -28.765493392944336, "global_step": 629922, "epoch": 7589} {"train_loss": -28.095441818237305, "global_step": 629923, "epoch": 7589} {"train_loss": -28.407379150390625, "global_step": 629924, "epoch": 7589} {"train_loss": -28.48689079284668, "global_step": 629925, "epoch": 7589} {"train_loss": -28.434545516967773, "global_step": 629926, "epoch": 7589} {"train_loss": -28.177413940429688, "global_step": 629927, "epoch": 7589} {"train_loss": -28.734146118164062, "global_step": 629928, "epoch": 7589} {"train_loss": -28.219568252563477, "global_step": 629929, "epoch": 7589} {"train_loss": -28.48213005065918, "global_step": 629930, "epoch": 7589} {"train_loss": -28.555023193359375, "global_step": 629931, "epoch": 7589} {"train_loss": -27.92462158203125, "global_step": 629932, "epoch": 7589} {"train_loss": -28.819721221923828, "global_step": 629933, "epoch": 7589} {"train_loss": -28.63760757446289, "global_step": 629934, "epoch": 7589} {"train_loss": -28.383808135986328, "global_step": 629935, "epoch": 7589} {"train_loss": -28.500396728515625, "global_step": 629936, "epoch": 7589} {"train_loss": -28.333770751953125, "global_step": 629937, "epoch": 7589} {"train_loss": -28.184728622436523, "global_step": 629938, "epoch": 7589} {"train_loss": -28.646728515625, "global_step": 629939, "epoch": 7589} {"train_loss": -28.45069694519043, "global_step": 629940, "epoch": 7589} {"train_loss": -27.95448112487793, "global_step": 629941, "epoch": 7589} {"train_loss": -27.6743106842041, "global_step": 629942, "epoch": 7589} {"train_loss": -27.337682723999023, "global_step": 629943, "epoch": 7589} {"train_loss": -27.568408966064453, "global_step": 629944, "epoch": 7589} {"train_loss": -28.2242431640625, "global_step": 629945, "epoch": 7589} {"train_loss": -27.84193229675293, "global_step": 629946, "epoch": 7589} {"train_loss": -27.111501693725586, "global_step": 629947, "epoch": 7589} {"train_loss": -27.351964950561523, "global_step": 629948, "epoch": 7589} {"train_loss": -28.008899688720703, "global_step": 629949, "epoch": 7589} {"train_loss": -27.958215713500977, "global_step": 629950, "epoch": 7589} {"train_loss": -27.635700225830078, "global_step": 629951, "epoch": 7589} {"train_loss": -26.463592529296875, "global_step": 629952, "epoch": 7589} {"train_loss": -27.6967830657959, "global_step": 629953, "epoch": 7589} {"train_loss": -27.464481353759766, "global_step": 629954, "epoch": 7589} {"train_loss": -27.12442398071289, "global_step": 629955, "epoch": 7589} {"train_loss": -27.949289321899414, "global_step": 629956, "epoch": 7589} {"train_loss": -27.477834701538086, "global_step": 629957, "epoch": 7589} {"train_loss": -28.00141716003418, "global_step": 629958, "epoch": 7589} {"train_loss": -28.043210983276367, "global_step": 629959, "epoch": 7589} {"train_loss": -28.245885848999023, "global_step": 629960, "epoch": 7589} {"train_loss": -27.9238224029541, "global_step": 629961, "epoch": 7589} {"train_loss": -27.863378524780273, "global_step": 629962, "epoch": 7589} {"train_loss": -28.0272216796875, "global_step": 629963, "epoch": 7589} {"train_loss": -28.0579891204834, "global_step": 629964, "epoch": 7589} {"train_loss": -27.888410568237305, "global_step": 629965, "epoch": 7589} {"train_loss": -28.058761596679688, "global_step": 629966, "epoch": 7589} {"train_loss": -28.28034782409668, "global_step": 629967, "epoch": 7589} {"train_loss": -28.11869239807129, "global_step": 629968, "epoch": 7589} {"train_loss": -27.941975260355388, "global_step": 629969, "epoch": 7589, "val_loss": 6731055.0} {"train_loss": -27.60504722595215, "global_step": 629970, "epoch": 7590} {"train_loss": -27.296701431274414, "global_step": 629971, "epoch": 7590} {"train_loss": -27.156869888305664, "global_step": 629972, "epoch": 7590} {"train_loss": -27.2048397064209, "global_step": 629973, "epoch": 7590} {"train_loss": -27.58635902404785, "global_step": 629974, "epoch": 7590} {"train_loss": -27.47450828552246, "global_step": 629975, "epoch": 7590} {"train_loss": -28.001733779907227, "global_step": 629976, "epoch": 7590} {"train_loss": -27.8607177734375, "global_step": 629977, "epoch": 7590} {"train_loss": -27.678747177124023, "global_step": 629978, "epoch": 7590} {"train_loss": -27.87615966796875, "global_step": 629979, "epoch": 7590} {"train_loss": -27.889801025390625, "global_step": 629980, "epoch": 7590} {"train_loss": -28.088285446166992, "global_step": 629981, "epoch": 7590} {"train_loss": -28.032880783081055, "global_step": 629982, "epoch": 7590} {"train_loss": -27.750274658203125, "global_step": 629983, "epoch": 7590} {"train_loss": -27.785587310791016, "global_step": 629984, "epoch": 7590} {"train_loss": -28.007226943969727, "global_step": 629985, "epoch": 7590} {"train_loss": -27.910236358642578, "global_step": 629986, "epoch": 7590} {"train_loss": -28.252838134765625, "global_step": 629987, "epoch": 7590} {"train_loss": -27.95281410217285, "global_step": 629988, "epoch": 7590} {"train_loss": -28.074420928955078, "global_step": 629989, "epoch": 7590} {"train_loss": -27.597517013549805, "global_step": 629990, "epoch": 7590} {"train_loss": -27.937931060791016, "global_step": 629991, "epoch": 7590} {"train_loss": -27.832792282104492, "global_step": 629992, "epoch": 7590} {"train_loss": -28.232715606689453, "global_step": 629993, "epoch": 7590} {"train_loss": -27.9683780670166, "global_step": 629994, "epoch": 7590} {"train_loss": -27.8427677154541, "global_step": 629995, "epoch": 7590} {"train_loss": -27.801746368408203, "global_step": 629996, "epoch": 7590} {"train_loss": -28.2465763092041, "global_step": 629997, "epoch": 7590} {"train_loss": -28.023855209350586, "global_step": 629998, "epoch": 7590} {"train_loss": -28.301366806030273, "global_step": 629999, "epoch": 7590} {"train_loss": -28.167524337768555, "global_step": 630000, "epoch": 7590} {"train_loss": -28.455434799194336, "global_step": 630001, "epoch": 7590} {"train_loss": -28.054967880249023, "global_step": 630002, "epoch": 7590} {"train_loss": -27.841297149658203, "global_step": 630003, "epoch": 7590} {"train_loss": -28.345321655273438, "global_step": 630004, "epoch": 7590} {"train_loss": -28.0140438079834, "global_step": 630005, "epoch": 7590} {"train_loss": -28.2185115814209, "global_step": 630006, "epoch": 7590} {"train_loss": -28.26594352722168, "global_step": 630007, "epoch": 7590} {"train_loss": -27.994007110595703, "global_step": 630008, "epoch": 7590} {"train_loss": -28.348983764648438, "global_step": 630009, "epoch": 7590} {"train_loss": -28.230939865112305, "global_step": 630010, "epoch": 7590} {"train_loss": -27.71306800842285, "global_step": 630011, "epoch": 7590} {"train_loss": -27.60992431640625, "global_step": 630012, "epoch": 7590} {"train_loss": -28.248071670532227, "global_step": 630013, "epoch": 7590} {"train_loss": -28.4942684173584, "global_step": 630014, "epoch": 7590} {"train_loss": -27.961179733276367, "global_step": 630015, "epoch": 7590} {"train_loss": -28.08784294128418, "global_step": 630016, "epoch": 7590} {"train_loss": -28.35047721862793, "global_step": 630017, "epoch": 7590} {"train_loss": -28.242267608642578, "global_step": 630018, "epoch": 7590} {"train_loss": -28.187536239624023, "global_step": 630019, "epoch": 7590} {"train_loss": -28.73370933532715, "global_step": 630020, "epoch": 7590} {"train_loss": -27.955093383789062, "global_step": 630021, "epoch": 7590} {"train_loss": -28.281925201416016, "global_step": 630022, "epoch": 7590} {"train_loss": -28.401248931884766, "global_step": 630023, "epoch": 7590} {"train_loss": -28.201068878173828, "global_step": 630024, "epoch": 7590} {"train_loss": -28.59505271911621, "global_step": 630025, "epoch": 7590} {"train_loss": -28.184850692749023, "global_step": 630026, "epoch": 7590} {"train_loss": -28.0908260345459, "global_step": 630027, "epoch": 7590} {"train_loss": -28.31471061706543, "global_step": 630028, "epoch": 7590} {"train_loss": -28.547534942626953, "global_step": 630029, "epoch": 7590} {"train_loss": -28.3446102142334, "global_step": 630030, "epoch": 7590} {"train_loss": -27.788427352905273, "global_step": 630031, "epoch": 7590} {"train_loss": -28.117023468017578, "global_step": 630032, "epoch": 7590} {"train_loss": -28.032794952392578, "global_step": 630033, "epoch": 7590} {"train_loss": -28.4860782623291, "global_step": 630034, "epoch": 7590} {"train_loss": -28.277990341186523, "global_step": 630035, "epoch": 7590} {"train_loss": -28.158300399780273, "global_step": 630036, "epoch": 7590} {"train_loss": -27.9252986907959, "global_step": 630037, "epoch": 7590} {"train_loss": -27.93572425842285, "global_step": 630038, "epoch": 7590} {"train_loss": -28.126911163330078, "global_step": 630039, "epoch": 7590} {"train_loss": -28.159460067749023, "global_step": 630040, "epoch": 7590} {"train_loss": -28.287158966064453, "global_step": 630041, "epoch": 7590} {"train_loss": -28.189977645874023, "global_step": 630042, "epoch": 7590} {"train_loss": -28.345203399658203, "global_step": 630043, "epoch": 7590} {"train_loss": -28.05511474609375, "global_step": 630044, "epoch": 7590} {"train_loss": -27.82511329650879, "global_step": 630045, "epoch": 7590} {"train_loss": -27.667133331298828, "global_step": 630046, "epoch": 7590} {"train_loss": -27.40382194519043, "global_step": 630047, "epoch": 7590} {"train_loss": -28.26664161682129, "global_step": 630048, "epoch": 7590} {"train_loss": -28.5400333404541, "global_step": 630049, "epoch": 7590} {"train_loss": -28.51898193359375, "global_step": 630050, "epoch": 7590} {"train_loss": -27.914981842041016, "global_step": 630051, "epoch": 7590} {"train_loss": -28.055013334894756, "global_step": 630052, "epoch": 7590, "val_loss": 6783031.0} {"train_loss": -27.513626098632812, "global_step": 630053, "epoch": 7591} {"train_loss": -28.107349395751953, "global_step": 630054, "epoch": 7591} {"train_loss": -27.69687843322754, "global_step": 630055, "epoch": 7591} {"train_loss": -27.2891902923584, "global_step": 630056, "epoch": 7591} {"train_loss": -27.248920440673828, "global_step": 630057, "epoch": 7591} {"train_loss": -27.66204833984375, "global_step": 630058, "epoch": 7591} {"train_loss": -27.621198654174805, "global_step": 630059, "epoch": 7591} {"train_loss": -27.430402755737305, "global_step": 630060, "epoch": 7591} {"train_loss": -27.855640411376953, "global_step": 630061, "epoch": 7591} {"train_loss": -27.464954376220703, "global_step": 630062, "epoch": 7591} {"train_loss": -27.833608627319336, "global_step": 630063, "epoch": 7591} {"train_loss": -27.50974464416504, "global_step": 630064, "epoch": 7591} {"train_loss": -27.862323760986328, "global_step": 630065, "epoch": 7591} {"train_loss": -28.025766372680664, "global_step": 630066, "epoch": 7591} {"train_loss": -27.7868709564209, "global_step": 630067, "epoch": 7591} {"train_loss": -28.321002960205078, "global_step": 630068, "epoch": 7591} {"train_loss": -28.196186065673828, "global_step": 630069, "epoch": 7591} {"train_loss": -27.970273971557617, "global_step": 630070, "epoch": 7591} {"train_loss": -27.658716201782227, "global_step": 630071, "epoch": 7591} {"train_loss": -28.263446807861328, "global_step": 630072, "epoch": 7591} {"train_loss": -27.958206176757812, "global_step": 630073, "epoch": 7591} {"train_loss": -27.87827491760254, "global_step": 630074, "epoch": 7591} {"train_loss": -28.04861831665039, "global_step": 630075, "epoch": 7591} {"train_loss": -28.26472282409668, "global_step": 630076, "epoch": 7591} {"train_loss": -27.87758445739746, "global_step": 630077, "epoch": 7591} {"train_loss": -28.487884521484375, "global_step": 630078, "epoch": 7591} {"train_loss": -28.37147331237793, "global_step": 630079, "epoch": 7591} {"train_loss": -27.797149658203125, "global_step": 630080, "epoch": 7591} {"train_loss": -27.95135498046875, "global_step": 630081, "epoch": 7591} {"train_loss": -28.01154899597168, "global_step": 630082, "epoch": 7591} {"train_loss": -28.05989646911621, "global_step": 630083, "epoch": 7591} {"train_loss": -28.460554122924805, "global_step": 630084, "epoch": 7591} {"train_loss": -28.608570098876953, "global_step": 630085, "epoch": 7591} {"train_loss": -28.12885856628418, "global_step": 630086, "epoch": 7591} {"train_loss": -28.290393829345703, "global_step": 630087, "epoch": 7591} {"train_loss": -28.1046085357666, "global_step": 630088, "epoch": 7591} {"train_loss": -28.181873321533203, "global_step": 630089, "epoch": 7591} {"train_loss": -28.323471069335938, "global_step": 630090, "epoch": 7591} {"train_loss": -28.26020622253418, "global_step": 630091, "epoch": 7591} {"train_loss": -28.890583038330078, "global_step": 630092, "epoch": 7591} {"train_loss": -28.026504516601562, "global_step": 630093, "epoch": 7591} {"train_loss": -28.578195571899414, "global_step": 630094, "epoch": 7591} {"train_loss": -28.49073600769043, "global_step": 630095, "epoch": 7591} {"train_loss": -28.3613338470459, "global_step": 630096, "epoch": 7591} {"train_loss": -28.246755599975586, "global_step": 630097, "epoch": 7591} {"train_loss": -28.175495147705078, "global_step": 630098, "epoch": 7591} {"train_loss": -27.907068252563477, "global_step": 630099, "epoch": 7591} {"train_loss": -28.613330841064453, "global_step": 630100, "epoch": 7591} {"train_loss": -28.306127548217773, "global_step": 630101, "epoch": 7591} {"train_loss": -28.489526748657227, "global_step": 630102, "epoch": 7591} {"train_loss": -28.910663604736328, "global_step": 630103, "epoch": 7591} {"train_loss": -28.382705688476562, "global_step": 630104, "epoch": 7591} {"train_loss": -28.047407150268555, "global_step": 630105, "epoch": 7591} {"train_loss": -27.858190536499023, "global_step": 630106, "epoch": 7591} {"train_loss": -27.994626998901367, "global_step": 630107, "epoch": 7591} {"train_loss": -28.040136337280273, "global_step": 630108, "epoch": 7591} {"train_loss": -28.065216064453125, "global_step": 630109, "epoch": 7591} {"train_loss": -28.444717407226562, "global_step": 630110, "epoch": 7591} {"train_loss": -28.437421798706055, "global_step": 630111, "epoch": 7591} {"train_loss": -28.620031356811523, "global_step": 630112, "epoch": 7591} {"train_loss": -27.849225997924805, "global_step": 630113, "epoch": 7591} {"train_loss": -27.839391708374023, "global_step": 630114, "epoch": 7591} {"train_loss": -28.318273544311523, "global_step": 630115, "epoch": 7591} {"train_loss": -27.452905654907227, "global_step": 630116, "epoch": 7591} {"train_loss": -27.744873046875, "global_step": 630117, "epoch": 7591} {"train_loss": -27.338415145874023, "global_step": 630118, "epoch": 7591} {"train_loss": -27.790760040283203, "global_step": 630119, "epoch": 7591} {"train_loss": -27.39729118347168, "global_step": 630120, "epoch": 7591} {"train_loss": -26.971067428588867, "global_step": 630121, "epoch": 7591} {"train_loss": -28.2253360748291, "global_step": 630122, "epoch": 7591} {"train_loss": -27.397815704345703, "global_step": 630123, "epoch": 7591} {"train_loss": -26.858816146850586, "global_step": 630124, "epoch": 7591} {"train_loss": -28.051931381225586, "global_step": 630125, "epoch": 7591} {"train_loss": -27.313995361328125, "global_step": 630126, "epoch": 7591} {"train_loss": -27.892520904541016, "global_step": 630127, "epoch": 7591} {"train_loss": -27.614551544189453, "global_step": 630128, "epoch": 7591} {"train_loss": -27.636037826538086, "global_step": 630129, "epoch": 7591} {"train_loss": -28.0780086517334, "global_step": 630130, "epoch": 7591} {"train_loss": -27.865421295166016, "global_step": 630131, "epoch": 7591} {"train_loss": -27.970794677734375, "global_step": 630132, "epoch": 7591} {"train_loss": -28.182178497314453, "global_step": 630133, "epoch": 7591} {"train_loss": -28.34406852722168, "global_step": 630134, "epoch": 7591} {"train_loss": -27.978465091751282, "global_step": 630135, "epoch": 7591, "val_loss": 6711431.0} {"train_loss": -27.72955894470215, "global_step": 630136, "epoch": 7592} {"train_loss": -27.3813419342041, "global_step": 630137, "epoch": 7592} {"train_loss": -27.922391891479492, "global_step": 630138, "epoch": 7592} {"train_loss": -27.7639217376709, "global_step": 630139, "epoch": 7592} {"train_loss": -27.401235580444336, "global_step": 630140, "epoch": 7592} {"train_loss": -26.899015426635742, "global_step": 630141, "epoch": 7592} {"train_loss": -27.583600997924805, "global_step": 630142, "epoch": 7592} {"train_loss": -27.43641471862793, "global_step": 630143, "epoch": 7592} {"train_loss": -27.66714859008789, "global_step": 630144, "epoch": 7592} {"train_loss": -27.487548828125, "global_step": 630145, "epoch": 7592} {"train_loss": -27.752450942993164, "global_step": 630146, "epoch": 7592} {"train_loss": -27.71402931213379, "global_step": 630147, "epoch": 7592} {"train_loss": -27.720090866088867, "global_step": 630148, "epoch": 7592} {"train_loss": -27.344024658203125, "global_step": 630149, "epoch": 7592} {"train_loss": -28.343658447265625, "global_step": 630150, "epoch": 7592} {"train_loss": -27.699289321899414, "global_step": 630151, "epoch": 7592} {"train_loss": -28.112628936767578, "global_step": 630152, "epoch": 7592} {"train_loss": -27.62941551208496, "global_step": 630153, "epoch": 7592} {"train_loss": -28.097553253173828, "global_step": 630154, "epoch": 7592} {"train_loss": -27.63917350769043, "global_step": 630155, "epoch": 7592} {"train_loss": -28.589435577392578, "global_step": 630156, "epoch": 7592} {"train_loss": -28.010873794555664, "global_step": 630157, "epoch": 7592} {"train_loss": -28.119359970092773, "global_step": 630158, "epoch": 7592} {"train_loss": -27.59937858581543, "global_step": 630159, "epoch": 7592} {"train_loss": -28.121328353881836, "global_step": 630160, "epoch": 7592} {"train_loss": -28.0416202545166, "global_step": 630161, "epoch": 7592} {"train_loss": -28.20916748046875, "global_step": 630162, "epoch": 7592} {"train_loss": -27.943029403686523, "global_step": 630163, "epoch": 7592} {"train_loss": -28.1298828125, "global_step": 630164, "epoch": 7592} {"train_loss": -28.02581787109375, "global_step": 630165, "epoch": 7592} {"train_loss": -28.291858673095703, "global_step": 630166, "epoch": 7592} {"train_loss": -28.07798194885254, "global_step": 630167, "epoch": 7592} {"train_loss": -28.19727897644043, "global_step": 630168, "epoch": 7592} {"train_loss": -28.324548721313477, "global_step": 630169, "epoch": 7592} {"train_loss": -28.152990341186523, "global_step": 630170, "epoch": 7592} {"train_loss": -28.068517684936523, "global_step": 630171, "epoch": 7592} {"train_loss": -28.015378952026367, "global_step": 630172, "epoch": 7592} {"train_loss": -28.05341911315918, "global_step": 630173, "epoch": 7592} {"train_loss": -28.229246139526367, "global_step": 630174, "epoch": 7592} {"train_loss": -28.029312133789062, "global_step": 630175, "epoch": 7592} {"train_loss": -28.0950927734375, "global_step": 630176, "epoch": 7592} {"train_loss": -27.807889938354492, "global_step": 630177, "epoch": 7592} {"train_loss": -28.107528686523438, "global_step": 630178, "epoch": 7592} {"train_loss": -28.03700065612793, "global_step": 630179, "epoch": 7592} {"train_loss": -28.066425323486328, "global_step": 630180, "epoch": 7592} {"train_loss": -27.762012481689453, "global_step": 630181, "epoch": 7592} {"train_loss": -27.966461181640625, "global_step": 630182, "epoch": 7592} {"train_loss": -28.257253646850586, "global_step": 630183, "epoch": 7592} {"train_loss": -28.321989059448242, "global_step": 630184, "epoch": 7592} {"train_loss": -27.95891761779785, "global_step": 630185, "epoch": 7592} {"train_loss": -28.226266860961914, "global_step": 630186, "epoch": 7592} {"train_loss": -28.12054443359375, "global_step": 630187, "epoch": 7592} {"train_loss": -28.215229034423828, "global_step": 630188, "epoch": 7592} {"train_loss": -28.016172409057617, "global_step": 630189, "epoch": 7592} {"train_loss": -28.10628318786621, "global_step": 630190, "epoch": 7592} {"train_loss": -28.371295928955078, "global_step": 630191, "epoch": 7592} {"train_loss": -28.26007652282715, "global_step": 630192, "epoch": 7592} {"train_loss": -28.335721969604492, "global_step": 630193, "epoch": 7592} {"train_loss": -28.50345230102539, "global_step": 630194, "epoch": 7592} {"train_loss": -28.29193687438965, "global_step": 630195, "epoch": 7592} {"train_loss": -28.395374298095703, "global_step": 630196, "epoch": 7592} {"train_loss": -27.914722442626953, "global_step": 630197, "epoch": 7592} {"train_loss": -27.98312759399414, "global_step": 630198, "epoch": 7592} {"train_loss": -28.268884658813477, "global_step": 630199, "epoch": 7592} {"train_loss": -28.326629638671875, "global_step": 630200, "epoch": 7592} {"train_loss": -28.217084884643555, "global_step": 630201, "epoch": 7592} {"train_loss": -28.211156845092773, "global_step": 630202, "epoch": 7592} {"train_loss": -27.982831954956055, "global_step": 630203, "epoch": 7592} {"train_loss": -28.1093807220459, "global_step": 630204, "epoch": 7592} {"train_loss": -28.046157836914062, "global_step": 630205, "epoch": 7592} {"train_loss": -28.37227439880371, "global_step": 630206, "epoch": 7592} {"train_loss": -28.296247482299805, "global_step": 630207, "epoch": 7592} {"train_loss": -28.77638816833496, "global_step": 630208, "epoch": 7592} {"train_loss": -28.376813888549805, "global_step": 630209, "epoch": 7592} {"train_loss": -28.38286781311035, "global_step": 630210, "epoch": 7592} {"train_loss": -28.218854904174805, "global_step": 630211, "epoch": 7592} {"train_loss": -28.07620620727539, "global_step": 630212, "epoch": 7592} {"train_loss": -27.810693740844727, "global_step": 630213, "epoch": 7592} {"train_loss": -28.058319091796875, "global_step": 630214, "epoch": 7592} {"train_loss": -28.56598472595215, "global_step": 630215, "epoch": 7592} {"train_loss": -28.318384170532227, "global_step": 630216, "epoch": 7592} {"train_loss": -28.566925048828125, "global_step": 630217, "epoch": 7592} {"train_loss": -28.048696380063713, "global_step": 630218, "epoch": 7592, "val_loss": 6846092.0} {"train_loss": -26.754013061523438, "global_step": 630219, "epoch": 7593} {"train_loss": -26.883747100830078, "global_step": 630220, "epoch": 7593} {"train_loss": -27.3209285736084, "global_step": 630221, "epoch": 7593} {"train_loss": -26.539081573486328, "global_step": 630222, "epoch": 7593} {"train_loss": -27.5015811920166, "global_step": 630223, "epoch": 7593} {"train_loss": -27.445453643798828, "global_step": 630224, "epoch": 7593} {"train_loss": -27.527807235717773, "global_step": 630225, "epoch": 7593} {"train_loss": -27.24552345275879, "global_step": 630226, "epoch": 7593} {"train_loss": -27.92547607421875, "global_step": 630227, "epoch": 7593} {"train_loss": -27.48615837097168, "global_step": 630228, "epoch": 7593} {"train_loss": -27.5981388092041, "global_step": 630229, "epoch": 7593} {"train_loss": -27.587848663330078, "global_step": 630230, "epoch": 7593} {"train_loss": -27.8258113861084, "global_step": 630231, "epoch": 7593} {"train_loss": -27.2690486907959, "global_step": 630232, "epoch": 7593} {"train_loss": -27.630329132080078, "global_step": 630233, "epoch": 7593} {"train_loss": -27.572784423828125, "global_step": 630234, "epoch": 7593} {"train_loss": -27.742237091064453, "global_step": 630235, "epoch": 7593} {"train_loss": -27.394922256469727, "global_step": 630236, "epoch": 7593} {"train_loss": -28.070632934570312, "global_step": 630237, "epoch": 7593} {"train_loss": -27.766382217407227, "global_step": 630238, "epoch": 7593} {"train_loss": -27.92164421081543, "global_step": 630239, "epoch": 7593} {"train_loss": -27.66657066345215, "global_step": 630240, "epoch": 7593} {"train_loss": -27.782245635986328, "global_step": 630241, "epoch": 7593} {"train_loss": -27.808887481689453, "global_step": 630242, "epoch": 7593} {"train_loss": -27.78744888305664, "global_step": 630243, "epoch": 7593} {"train_loss": -27.62787437438965, "global_step": 630244, "epoch": 7593} {"train_loss": -28.2797908782959, "global_step": 630245, "epoch": 7593} {"train_loss": -27.892892837524414, "global_step": 630246, "epoch": 7593} {"train_loss": -27.856689453125, "global_step": 630247, "epoch": 7593} {"train_loss": -28.542255401611328, "global_step": 630248, "epoch": 7593} {"train_loss": -27.976850509643555, "global_step": 630249, "epoch": 7593} {"train_loss": -27.900964736938477, "global_step": 630250, "epoch": 7593} {"train_loss": -28.043609619140625, "global_step": 630251, "epoch": 7593} {"train_loss": -28.238367080688477, "global_step": 630252, "epoch": 7593} {"train_loss": -28.579648971557617, "global_step": 630253, "epoch": 7593} {"train_loss": -28.068099975585938, "global_step": 630254, "epoch": 7593} {"train_loss": -28.429346084594727, "global_step": 630255, "epoch": 7593} {"train_loss": -28.395612716674805, "global_step": 630256, "epoch": 7593} {"train_loss": -27.912322998046875, "global_step": 630257, "epoch": 7593} {"train_loss": -28.18231201171875, "global_step": 630258, "epoch": 7593} {"train_loss": -28.133466720581055, "global_step": 630259, "epoch": 7593} {"train_loss": -28.271240234375, "global_step": 630260, "epoch": 7593} {"train_loss": -28.479700088500977, "global_step": 630261, "epoch": 7593} {"train_loss": -28.379907608032227, "global_step": 630262, "epoch": 7593} {"train_loss": -28.45835304260254, "global_step": 630263, "epoch": 7593} {"train_loss": -28.495023727416992, "global_step": 630264, "epoch": 7593} {"train_loss": -28.168996810913086, "global_step": 630265, "epoch": 7593} {"train_loss": -28.602436065673828, "global_step": 630266, "epoch": 7593} {"train_loss": -28.379690170288086, "global_step": 630267, "epoch": 7593} {"train_loss": -28.234716415405273, "global_step": 630268, "epoch": 7593} {"train_loss": -28.401599884033203, "global_step": 630269, "epoch": 7593} {"train_loss": -28.128299713134766, "global_step": 630270, "epoch": 7593} {"train_loss": -28.493488311767578, "global_step": 630271, "epoch": 7593} {"train_loss": -28.544696807861328, "global_step": 630272, "epoch": 7593} {"train_loss": -27.7696533203125, "global_step": 630273, "epoch": 7593} {"train_loss": -28.351694107055664, "global_step": 630274, "epoch": 7593} {"train_loss": -28.14569091796875, "global_step": 630275, "epoch": 7593} {"train_loss": -28.36456298828125, "global_step": 630276, "epoch": 7593} {"train_loss": -28.477924346923828, "global_step": 630277, "epoch": 7593} {"train_loss": -28.554960250854492, "global_step": 630278, "epoch": 7593} {"train_loss": -28.435943603515625, "global_step": 630279, "epoch": 7593} {"train_loss": -28.39560317993164, "global_step": 630280, "epoch": 7593} {"train_loss": -28.342487335205078, "global_step": 630281, "epoch": 7593} {"train_loss": -28.553363800048828, "global_step": 630282, "epoch": 7593} {"train_loss": -28.390798568725586, "global_step": 630283, "epoch": 7593} {"train_loss": -28.51177406311035, "global_step": 630284, "epoch": 7593} {"train_loss": -28.372446060180664, "global_step": 630285, "epoch": 7593} {"train_loss": -28.437719345092773, "global_step": 630286, "epoch": 7593} {"train_loss": -28.08351707458496, "global_step": 630287, "epoch": 7593} {"train_loss": -28.218311309814453, "global_step": 630288, "epoch": 7593} {"train_loss": -28.034582138061523, "global_step": 630289, "epoch": 7593} {"train_loss": -28.090402603149414, "global_step": 630290, "epoch": 7593} {"train_loss": -27.807220458984375, "global_step": 630291, "epoch": 7593} {"train_loss": -27.937231063842773, "global_step": 630292, "epoch": 7593} {"train_loss": -28.345327377319336, "global_step": 630293, "epoch": 7593} {"train_loss": -28.2630558013916, "global_step": 630294, "epoch": 7593} {"train_loss": -28.421539306640625, "global_step": 630295, "epoch": 7593} {"train_loss": -28.191303253173828, "global_step": 630296, "epoch": 7593} {"train_loss": -28.394256591796875, "global_step": 630297, "epoch": 7593} {"train_loss": -27.88152503967285, "global_step": 630298, "epoch": 7593} {"train_loss": -28.017648696899414, "global_step": 630299, "epoch": 7593} {"train_loss": -27.58473014831543, "global_step": 630300, "epoch": 7593} {"train_loss": -28.02652657750141, "global_step": 630301, "epoch": 7593, "val_loss": 6736814.0} {"train_loss": -27.39922523498535, "global_step": 630302, "epoch": 7594} {"train_loss": -27.007770538330078, "global_step": 630303, "epoch": 7594} {"train_loss": -26.46884536743164, "global_step": 630304, "epoch": 7594} {"train_loss": -27.363828659057617, "global_step": 630305, "epoch": 7594} {"train_loss": -27.334747314453125, "global_step": 630306, "epoch": 7594} {"train_loss": -27.589263916015625, "global_step": 630307, "epoch": 7594} {"train_loss": -27.71270751953125, "global_step": 630308, "epoch": 7594} {"train_loss": -27.446630477905273, "global_step": 630309, "epoch": 7594} {"train_loss": -27.48810386657715, "global_step": 630310, "epoch": 7594} {"train_loss": -27.4686279296875, "global_step": 630311, "epoch": 7594} {"train_loss": -27.90468406677246, "global_step": 630312, "epoch": 7594} {"train_loss": -27.4792423248291, "global_step": 630313, "epoch": 7594} {"train_loss": -27.763458251953125, "global_step": 630314, "epoch": 7594} {"train_loss": -27.4487361907959, "global_step": 630315, "epoch": 7594} {"train_loss": -27.49759864807129, "global_step": 630316, "epoch": 7594} {"train_loss": -27.93235206604004, "global_step": 630317, "epoch": 7594} {"train_loss": -27.824872970581055, "global_step": 630318, "epoch": 7594} {"train_loss": -27.94624137878418, "global_step": 630319, "epoch": 7594} {"train_loss": -28.007104873657227, "global_step": 630320, "epoch": 7594} {"train_loss": -28.34437370300293, "global_step": 630321, "epoch": 7594} {"train_loss": -27.989500045776367, "global_step": 630322, "epoch": 7594} {"train_loss": -27.94844627380371, "global_step": 630323, "epoch": 7594} {"train_loss": -28.169269561767578, "global_step": 630324, "epoch": 7594} {"train_loss": -28.072484970092773, "global_step": 630325, "epoch": 7594} {"train_loss": -27.900434494018555, "global_step": 630326, "epoch": 7594} {"train_loss": -27.74701499938965, "global_step": 630327, "epoch": 7594} {"train_loss": -27.91986083984375, "global_step": 630328, "epoch": 7594} {"train_loss": -27.443933486938477, "global_step": 630329, "epoch": 7594} {"train_loss": -27.936185836791992, "global_step": 630330, "epoch": 7594} {"train_loss": -28.128931045532227, "global_step": 630331, "epoch": 7594} {"train_loss": -28.22968101501465, "global_step": 630332, "epoch": 7594} {"train_loss": -28.159521102905273, "global_step": 630333, "epoch": 7594} {"train_loss": -28.220212936401367, "global_step": 630334, "epoch": 7594} {"train_loss": -28.109174728393555, "global_step": 630335, "epoch": 7594} {"train_loss": -27.880468368530273, "global_step": 630336, "epoch": 7594} {"train_loss": -27.956892013549805, "global_step": 630337, "epoch": 7594} {"train_loss": -28.004484176635742, "global_step": 630338, "epoch": 7594} {"train_loss": -28.154401779174805, "global_step": 630339, "epoch": 7594} {"train_loss": -28.029977798461914, "global_step": 630340, "epoch": 7594} {"train_loss": -28.14939308166504, "global_step": 630341, "epoch": 7594} {"train_loss": -27.893646240234375, "global_step": 630342, "epoch": 7594} {"train_loss": -27.959842681884766, "global_step": 630343, "epoch": 7594} {"train_loss": -28.50697135925293, "global_step": 630344, "epoch": 7594} {"train_loss": -28.230453491210938, "global_step": 630345, "epoch": 7594} {"train_loss": -28.016775131225586, "global_step": 630346, "epoch": 7594} {"train_loss": -27.953577041625977, "global_step": 630347, "epoch": 7594} {"train_loss": -28.360660552978516, "global_step": 630348, "epoch": 7594} {"train_loss": -28.00933837890625, "global_step": 630349, "epoch": 7594} {"train_loss": -27.850202560424805, "global_step": 630350, "epoch": 7594} {"train_loss": -28.33219337463379, "global_step": 630351, "epoch": 7594} {"train_loss": -28.09075927734375, "global_step": 630352, "epoch": 7594} {"train_loss": -27.549596786499023, "global_step": 630353, "epoch": 7594} {"train_loss": -28.28631019592285, "global_step": 630354, "epoch": 7594} {"train_loss": -28.062360763549805, "global_step": 630355, "epoch": 7594} {"train_loss": -28.39120864868164, "global_step": 630356, "epoch": 7594} {"train_loss": -27.9310302734375, "global_step": 630357, "epoch": 7594} {"train_loss": -27.682880401611328, "global_step": 630358, "epoch": 7594} {"train_loss": -28.01556968688965, "global_step": 630359, "epoch": 7594} {"train_loss": -28.291921615600586, "global_step": 630360, "epoch": 7594} {"train_loss": -28.619298934936523, "global_step": 630361, "epoch": 7594} {"train_loss": -28.48951530456543, "global_step": 630362, "epoch": 7594} {"train_loss": -28.55950927734375, "global_step": 630363, "epoch": 7594} {"train_loss": -27.89875602722168, "global_step": 630364, "epoch": 7594} {"train_loss": -28.367984771728516, "global_step": 630365, "epoch": 7594} {"train_loss": -28.46979331970215, "global_step": 630366, "epoch": 7594} {"train_loss": -28.160131454467773, "global_step": 630367, "epoch": 7594} {"train_loss": -28.311874389648438, "global_step": 630368, "epoch": 7594} {"train_loss": -28.443317413330078, "global_step": 630369, "epoch": 7594} {"train_loss": -28.40543556213379, "global_step": 630370, "epoch": 7594} {"train_loss": -28.603967666625977, "global_step": 630371, "epoch": 7594} {"train_loss": -28.55596923828125, "global_step": 630372, "epoch": 7594} {"train_loss": -28.227643966674805, "global_step": 630373, "epoch": 7594} {"train_loss": -28.378997802734375, "global_step": 630374, "epoch": 7594} {"train_loss": -28.382232666015625, "global_step": 630375, "epoch": 7594} {"train_loss": -28.534042358398438, "global_step": 630376, "epoch": 7594} {"train_loss": -28.46347427368164, "global_step": 630377, "epoch": 7594} {"train_loss": -28.13331413269043, "global_step": 630378, "epoch": 7594} {"train_loss": -28.070755004882812, "global_step": 630379, "epoch": 7594} {"train_loss": -28.358993530273438, "global_step": 630380, "epoch": 7594} {"train_loss": -28.229827880859375, "global_step": 630381, "epoch": 7594} {"train_loss": -28.407791137695312, "global_step": 630382, "epoch": 7594} {"train_loss": -27.6831111907959, "global_step": 630383, "epoch": 7594} {"train_loss": -28.016524900873023, "global_step": 630384, "epoch": 7594, "val_loss": 6796410.0} {"train_loss": -27.209009170532227, "global_step": 630385, "epoch": 7595} {"train_loss": -27.455408096313477, "global_step": 630386, "epoch": 7595} {"train_loss": -27.455230712890625, "global_step": 630387, "epoch": 7595} {"train_loss": -27.126440048217773, "global_step": 630388, "epoch": 7595} {"train_loss": -27.890588760375977, "global_step": 630389, "epoch": 7595} {"train_loss": -27.924610137939453, "global_step": 630390, "epoch": 7595} {"train_loss": -27.366235733032227, "global_step": 630391, "epoch": 7595} {"train_loss": -27.773956298828125, "global_step": 630392, "epoch": 7595} {"train_loss": -27.6674747467041, "global_step": 630393, "epoch": 7595} {"train_loss": -28.015033721923828, "global_step": 630394, "epoch": 7595} {"train_loss": -27.30304527282715, "global_step": 630395, "epoch": 7595} {"train_loss": -28.139623641967773, "global_step": 630396, "epoch": 7595} {"train_loss": -27.852066040039062, "global_step": 630397, "epoch": 7595} {"train_loss": -28.032196044921875, "global_step": 630398, "epoch": 7595} {"train_loss": -28.397186279296875, "global_step": 630399, "epoch": 7595} {"train_loss": -27.773975372314453, "global_step": 630400, "epoch": 7595} {"train_loss": -27.80891990661621, "global_step": 630401, "epoch": 7595} {"train_loss": -27.51312828063965, "global_step": 630402, "epoch": 7595} {"train_loss": -27.837804794311523, "global_step": 630403, "epoch": 7595} {"train_loss": -28.094396591186523, "global_step": 630404, "epoch": 7595} {"train_loss": -27.624608993530273, "global_step": 630405, "epoch": 7595} {"train_loss": -28.03081703186035, "global_step": 630406, "epoch": 7595} {"train_loss": -27.987424850463867, "global_step": 630407, "epoch": 7595} {"train_loss": -28.20318603515625, "global_step": 630408, "epoch": 7595} {"train_loss": -28.4545841217041, "global_step": 630409, "epoch": 7595} {"train_loss": -27.943511962890625, "global_step": 630410, "epoch": 7595} {"train_loss": -27.813379287719727, "global_step": 630411, "epoch": 7595} {"train_loss": -28.062097549438477, "global_step": 630412, "epoch": 7595} {"train_loss": -28.300247192382812, "global_step": 630413, "epoch": 7595} {"train_loss": -28.252965927124023, "global_step": 630414, "epoch": 7595} {"train_loss": -28.24397087097168, "global_step": 630415, "epoch": 7595} {"train_loss": -28.35712242126465, "global_step": 630416, "epoch": 7595} {"train_loss": -28.249109268188477, "global_step": 630417, "epoch": 7595} {"train_loss": -28.28919792175293, "global_step": 630418, "epoch": 7595} {"train_loss": -27.962533950805664, "global_step": 630419, "epoch": 7595} {"train_loss": -28.256000518798828, "global_step": 630420, "epoch": 7595} {"train_loss": -28.3349552154541, "global_step": 630421, "epoch": 7595} {"train_loss": -28.115528106689453, "global_step": 630422, "epoch": 7595} {"train_loss": -28.3587703704834, "global_step": 630423, "epoch": 7595} {"train_loss": -28.273191452026367, "global_step": 630424, "epoch": 7595} {"train_loss": -28.49285316467285, "global_step": 630425, "epoch": 7595} {"train_loss": -28.472742080688477, "global_step": 630426, "epoch": 7595} {"train_loss": -28.79755973815918, "global_step": 630427, "epoch": 7595} {"train_loss": -28.824951171875, "global_step": 630428, "epoch": 7595} {"train_loss": -28.120264053344727, "global_step": 630429, "epoch": 7595} {"train_loss": -28.768238067626953, "global_step": 630430, "epoch": 7595} {"train_loss": -28.471515655517578, "global_step": 630431, "epoch": 7595} {"train_loss": -28.553327560424805, "global_step": 630432, "epoch": 7595} {"train_loss": -28.0698299407959, "global_step": 630433, "epoch": 7595} {"train_loss": -28.363971710205078, "global_step": 630434, "epoch": 7595} {"train_loss": -28.212263107299805, "global_step": 630435, "epoch": 7595} {"train_loss": -28.506591796875, "global_step": 630436, "epoch": 7595} {"train_loss": -28.6810245513916, "global_step": 630437, "epoch": 7595} {"train_loss": -28.5312557220459, "global_step": 630438, "epoch": 7595} {"train_loss": -28.28643798828125, "global_step": 630439, "epoch": 7595} {"train_loss": -28.175195693969727, "global_step": 630440, "epoch": 7595} {"train_loss": -28.26331901550293, "global_step": 630441, "epoch": 7595} {"train_loss": -28.017072677612305, "global_step": 630442, "epoch": 7595} {"train_loss": -28.3270263671875, "global_step": 630443, "epoch": 7595} {"train_loss": -28.645633697509766, "global_step": 630444, "epoch": 7595} {"train_loss": -28.132192611694336, "global_step": 630445, "epoch": 7595} {"train_loss": -28.110692977905273, "global_step": 630446, "epoch": 7595} {"train_loss": -28.36141014099121, "global_step": 630447, "epoch": 7595} {"train_loss": -28.089216232299805, "global_step": 630448, "epoch": 7595} {"train_loss": -28.543622970581055, "global_step": 630449, "epoch": 7595} {"train_loss": -28.013721466064453, "global_step": 630450, "epoch": 7595} {"train_loss": -27.714508056640625, "global_step": 630451, "epoch": 7595} {"train_loss": -28.39341163635254, "global_step": 630452, "epoch": 7595} {"train_loss": -28.03889274597168, "global_step": 630453, "epoch": 7595} {"train_loss": -27.923852920532227, "global_step": 630454, "epoch": 7595} {"train_loss": -28.136274337768555, "global_step": 630455, "epoch": 7595} {"train_loss": -27.911413192749023, "global_step": 630456, "epoch": 7595} {"train_loss": -27.793487548828125, "global_step": 630457, "epoch": 7595} {"train_loss": -28.031940460205078, "global_step": 630458, "epoch": 7595} {"train_loss": -28.01685905456543, "global_step": 630459, "epoch": 7595} {"train_loss": -28.07108497619629, "global_step": 630460, "epoch": 7595} {"train_loss": -27.96685791015625, "global_step": 630461, "epoch": 7595} {"train_loss": -27.531906127929688, "global_step": 630462, "epoch": 7595} {"train_loss": -27.728845596313477, "global_step": 630463, "epoch": 7595} {"train_loss": -27.82097816467285, "global_step": 630464, "epoch": 7595} {"train_loss": -28.23590087890625, "global_step": 630465, "epoch": 7595} {"train_loss": -28.074249267578125, "global_step": 630466, "epoch": 7595} {"train_loss": -28.080987103014106, "global_step": 630467, "epoch": 7595, "val_loss": 6747126.0} {"train_loss": -27.66962242126465, "global_step": 630468, "epoch": 7596} {"train_loss": -27.542072296142578, "global_step": 630469, "epoch": 7596} {"train_loss": -27.99472427368164, "global_step": 630470, "epoch": 7596} {"train_loss": -27.115182876586914, "global_step": 630471, "epoch": 7596} {"train_loss": -27.240142822265625, "global_step": 630472, "epoch": 7596} {"train_loss": -27.71380043029785, "global_step": 630473, "epoch": 7596} {"train_loss": -27.39158058166504, "global_step": 630474, "epoch": 7596} {"train_loss": -27.41944694519043, "global_step": 630475, "epoch": 7596} {"train_loss": -27.184762954711914, "global_step": 630476, "epoch": 7596} {"train_loss": -27.560260772705078, "global_step": 630477, "epoch": 7596} {"train_loss": -27.747547149658203, "global_step": 630478, "epoch": 7596} {"train_loss": -27.98634910583496, "global_step": 630479, "epoch": 7596} {"train_loss": -27.778676986694336, "global_step": 630480, "epoch": 7596} {"train_loss": -27.929285049438477, "global_step": 630481, "epoch": 7596} {"train_loss": -27.844892501831055, "global_step": 630482, "epoch": 7596} {"train_loss": -27.7244930267334, "global_step": 630483, "epoch": 7596} {"train_loss": -27.417739868164062, "global_step": 630484, "epoch": 7596} {"train_loss": -27.7021427154541, "global_step": 630485, "epoch": 7596} {"train_loss": -28.242292404174805, "global_step": 630486, "epoch": 7596} {"train_loss": -27.851987838745117, "global_step": 630487, "epoch": 7596} {"train_loss": -27.968109130859375, "global_step": 630488, "epoch": 7596} {"train_loss": -27.549392700195312, "global_step": 630489, "epoch": 7596} {"train_loss": -27.944366455078125, "global_step": 630490, "epoch": 7596} {"train_loss": -28.044591903686523, "global_step": 630491, "epoch": 7596} {"train_loss": -27.793100357055664, "global_step": 630492, "epoch": 7596} {"train_loss": -28.005329132080078, "global_step": 630493, "epoch": 7596} {"train_loss": -27.87677001953125, "global_step": 630494, "epoch": 7596} {"train_loss": -27.99539566040039, "global_step": 630495, "epoch": 7596} {"train_loss": -27.95623779296875, "global_step": 630496, "epoch": 7596} {"train_loss": -28.09246826171875, "global_step": 630497, "epoch": 7596} {"train_loss": -28.068256378173828, "global_step": 630498, "epoch": 7596} {"train_loss": -27.9957332611084, "global_step": 630499, "epoch": 7596} {"train_loss": -28.023813247680664, "global_step": 630500, "epoch": 7596} {"train_loss": -28.182165145874023, "global_step": 630501, "epoch": 7596} {"train_loss": -28.094655990600586, "global_step": 630502, "epoch": 7596} {"train_loss": -28.5930233001709, "global_step": 630503, "epoch": 7596} {"train_loss": -28.0167236328125, "global_step": 630504, "epoch": 7596} {"train_loss": -28.200714111328125, "global_step": 630505, "epoch": 7596} {"train_loss": -28.594192504882812, "global_step": 630506, "epoch": 7596} {"train_loss": -28.220596313476562, "global_step": 630507, "epoch": 7596} {"train_loss": -28.28871726989746, "global_step": 630508, "epoch": 7596} {"train_loss": -28.6191463470459, "global_step": 630509, "epoch": 7596} {"train_loss": -28.550827026367188, "global_step": 630510, "epoch": 7596} {"train_loss": -28.59270668029785, "global_step": 630511, "epoch": 7596} {"train_loss": -28.57252311706543, "global_step": 630512, "epoch": 7596} {"train_loss": -28.34332847595215, "global_step": 630513, "epoch": 7596} {"train_loss": -28.359241485595703, "global_step": 630514, "epoch": 7596} {"train_loss": -28.677148818969727, "global_step": 630515, "epoch": 7596} {"train_loss": -28.579696655273438, "global_step": 630516, "epoch": 7596} {"train_loss": -28.129751205444336, "global_step": 630517, "epoch": 7596} {"train_loss": -27.917388916015625, "global_step": 630518, "epoch": 7596} {"train_loss": -28.651025772094727, "global_step": 630519, "epoch": 7596} {"train_loss": -28.691242218017578, "global_step": 630520, "epoch": 7596} {"train_loss": -28.784826278686523, "global_step": 630521, "epoch": 7596} {"train_loss": -28.40912437438965, "global_step": 630522, "epoch": 7596} {"train_loss": -28.72670555114746, "global_step": 630523, "epoch": 7596} {"train_loss": -28.49860954284668, "global_step": 630524, "epoch": 7596} {"train_loss": -28.430418014526367, "global_step": 630525, "epoch": 7596} {"train_loss": -28.364431381225586, "global_step": 630526, "epoch": 7596} {"train_loss": -28.040863037109375, "global_step": 630527, "epoch": 7596} {"train_loss": -28.37981605529785, "global_step": 630528, "epoch": 7596} {"train_loss": -28.0904483795166, "global_step": 630529, "epoch": 7596} {"train_loss": -27.82034683227539, "global_step": 630530, "epoch": 7596} {"train_loss": -27.937368392944336, "global_step": 630531, "epoch": 7596} {"train_loss": -27.809858322143555, "global_step": 630532, "epoch": 7596} {"train_loss": -27.771759033203125, "global_step": 630533, "epoch": 7596} {"train_loss": -27.80213737487793, "global_step": 630534, "epoch": 7596} {"train_loss": -27.95655632019043, "global_step": 630535, "epoch": 7596} {"train_loss": -28.027326583862305, "global_step": 630536, "epoch": 7596} {"train_loss": -28.04718017578125, "global_step": 630537, "epoch": 7596} {"train_loss": -28.232580184936523, "global_step": 630538, "epoch": 7596} {"train_loss": -28.07057762145996, "global_step": 630539, "epoch": 7596} {"train_loss": -28.144262313842773, "global_step": 630540, "epoch": 7596} {"train_loss": -28.3647518157959, "global_step": 630541, "epoch": 7596} {"train_loss": -28.42103385925293, "global_step": 630542, "epoch": 7596} {"train_loss": -28.249780654907227, "global_step": 630543, "epoch": 7596} {"train_loss": -28.274341583251953, "global_step": 630544, "epoch": 7596} {"train_loss": -28.337614059448242, "global_step": 630545, "epoch": 7596} {"train_loss": -28.061742782592773, "global_step": 630546, "epoch": 7596} {"train_loss": -28.196924209594727, "global_step": 630547, "epoch": 7596} {"train_loss": -28.198293685913086, "global_step": 630548, "epoch": 7596} {"train_loss": -27.78315544128418, "global_step": 630549, "epoch": 7596} {"train_loss": -28.04962427070342, "global_step": 630550, "epoch": 7596, "val_loss": 6678293.0} {"train_loss": -27.256977081298828, "global_step": 630551, "epoch": 7597} {"train_loss": -26.809377670288086, "global_step": 630552, "epoch": 7597} {"train_loss": -27.825275421142578, "global_step": 630553, "epoch": 7597} {"train_loss": -27.28384780883789, "global_step": 630554, "epoch": 7597} {"train_loss": -27.648513793945312, "global_step": 630555, "epoch": 7597} {"train_loss": -27.249792098999023, "global_step": 630556, "epoch": 7597} {"train_loss": -27.61567497253418, "global_step": 630557, "epoch": 7597} {"train_loss": -27.280187606811523, "global_step": 630558, "epoch": 7597} {"train_loss": -27.854955673217773, "global_step": 630559, "epoch": 7597} {"train_loss": -27.501636505126953, "global_step": 630560, "epoch": 7597} {"train_loss": -27.5762996673584, "global_step": 630561, "epoch": 7597} {"train_loss": -27.822235107421875, "global_step": 630562, "epoch": 7597} {"train_loss": -28.17725944519043, "global_step": 630563, "epoch": 7597} {"train_loss": -28.0792236328125, "global_step": 630564, "epoch": 7597} {"train_loss": -27.59891700744629, "global_step": 630565, "epoch": 7597} {"train_loss": -27.906545639038086, "global_step": 630566, "epoch": 7597} {"train_loss": -27.900781631469727, "global_step": 630567, "epoch": 7597} {"train_loss": -28.4722957611084, "global_step": 630568, "epoch": 7597} {"train_loss": -27.947101593017578, "global_step": 630569, "epoch": 7597} {"train_loss": -27.908945083618164, "global_step": 630570, "epoch": 7597} {"train_loss": -28.151498794555664, "global_step": 630571, "epoch": 7597} {"train_loss": -28.36493492126465, "global_step": 630572, "epoch": 7597} {"train_loss": -28.311498641967773, "global_step": 630573, "epoch": 7597} {"train_loss": -27.503833770751953, "global_step": 630574, "epoch": 7597} {"train_loss": -28.001026153564453, "global_step": 630575, "epoch": 7597} {"train_loss": -28.412084579467773, "global_step": 630576, "epoch": 7597} {"train_loss": -28.07221031188965, "global_step": 630577, "epoch": 7597} {"train_loss": -27.893604278564453, "global_step": 630578, "epoch": 7597} {"train_loss": -28.15174674987793, "global_step": 630579, "epoch": 7597} {"train_loss": -28.1848201751709, "global_step": 630580, "epoch": 7597} {"train_loss": -28.053115844726562, "global_step": 630581, "epoch": 7597} {"train_loss": -27.653074264526367, "global_step": 630582, "epoch": 7597} {"train_loss": -28.25070571899414, "global_step": 630583, "epoch": 7597} {"train_loss": -28.152753829956055, "global_step": 630584, "epoch": 7597} {"train_loss": -28.6213321685791, "global_step": 630585, "epoch": 7597} {"train_loss": -27.85212516784668, "global_step": 630586, "epoch": 7597} {"train_loss": -27.417572021484375, "global_step": 630587, "epoch": 7597} {"train_loss": -28.05100440979004, "global_step": 630588, "epoch": 7597} {"train_loss": -27.908002853393555, "global_step": 630589, "epoch": 7597} {"train_loss": -27.958669662475586, "global_step": 630590, "epoch": 7597} {"train_loss": -27.98457908630371, "global_step": 630591, "epoch": 7597} {"train_loss": -28.164220809936523, "global_step": 630592, "epoch": 7597} {"train_loss": -28.42304801940918, "global_step": 630593, "epoch": 7597} {"train_loss": -28.378437042236328, "global_step": 630594, "epoch": 7597} {"train_loss": -28.289182662963867, "global_step": 630595, "epoch": 7597} {"train_loss": -28.647214889526367, "global_step": 630596, "epoch": 7597} {"train_loss": -28.369794845581055, "global_step": 630597, "epoch": 7597} {"train_loss": -28.27484130859375, "global_step": 630598, "epoch": 7597} {"train_loss": -28.2158203125, "global_step": 630599, "epoch": 7597} {"train_loss": -28.172571182250977, "global_step": 630600, "epoch": 7597} {"train_loss": -28.215900421142578, "global_step": 630601, "epoch": 7597} {"train_loss": -28.047595977783203, "global_step": 630602, "epoch": 7597} {"train_loss": -28.383447647094727, "global_step": 630603, "epoch": 7597} {"train_loss": -28.27947998046875, "global_step": 630604, "epoch": 7597} {"train_loss": -28.564895629882812, "global_step": 630605, "epoch": 7597} {"train_loss": -28.269067764282227, "global_step": 630606, "epoch": 7597} {"train_loss": -28.003259658813477, "global_step": 630607, "epoch": 7597} {"train_loss": -28.193029403686523, "global_step": 630608, "epoch": 7597} {"train_loss": -28.4613094329834, "global_step": 630609, "epoch": 7597} {"train_loss": -28.575977325439453, "global_step": 630610, "epoch": 7597} {"train_loss": -28.192657470703125, "global_step": 630611, "epoch": 7597} {"train_loss": -28.120946884155273, "global_step": 630612, "epoch": 7597} {"train_loss": -28.375335693359375, "global_step": 630613, "epoch": 7597} {"train_loss": -28.25927734375, "global_step": 630614, "epoch": 7597} {"train_loss": -28.245758056640625, "global_step": 630615, "epoch": 7597} {"train_loss": -28.1087703704834, "global_step": 630616, "epoch": 7597} {"train_loss": -28.42473793029785, "global_step": 630617, "epoch": 7597} {"train_loss": -28.2391357421875, "global_step": 630618, "epoch": 7597} {"train_loss": -28.052234649658203, "global_step": 630619, "epoch": 7597} {"train_loss": -28.058263778686523, "global_step": 630620, "epoch": 7597} {"train_loss": -28.302183151245117, "global_step": 630621, "epoch": 7597} {"train_loss": -27.804224014282227, "global_step": 630622, "epoch": 7597} {"train_loss": -28.072952270507812, "global_step": 630623, "epoch": 7597} {"train_loss": -27.933258056640625, "global_step": 630624, "epoch": 7597} {"train_loss": -28.13212013244629, "global_step": 630625, "epoch": 7597} {"train_loss": -28.39006996154785, "global_step": 630626, "epoch": 7597} {"train_loss": -28.0830078125, "global_step": 630627, "epoch": 7597} {"train_loss": -27.818347930908203, "global_step": 630628, "epoch": 7597} {"train_loss": -28.379613876342773, "global_step": 630629, "epoch": 7597} {"train_loss": -28.052692413330078, "global_step": 630630, "epoch": 7597} {"train_loss": -28.1212100982666, "global_step": 630631, "epoch": 7597} {"train_loss": -28.106592178344727, "global_step": 630632, "epoch": 7597} {"train_loss": -28.039164186960242, "global_step": 630633, "epoch": 7597, "val_loss": 6755469.5} {"train_loss": -28.080106735229492, "global_step": 630634, "epoch": 7598} {"train_loss": -28.0179386138916, "global_step": 630635, "epoch": 7598} {"train_loss": -27.360666275024414, "global_step": 630636, "epoch": 7598} {"train_loss": -27.340036392211914, "global_step": 630637, "epoch": 7598} {"train_loss": -27.624298095703125, "global_step": 630638, "epoch": 7598} {"train_loss": -27.633893966674805, "global_step": 630639, "epoch": 7598} {"train_loss": -27.45415687561035, "global_step": 630640, "epoch": 7598} {"train_loss": -27.5682430267334, "global_step": 630641, "epoch": 7598} {"train_loss": -27.289167404174805, "global_step": 630642, "epoch": 7598} {"train_loss": -27.722333908081055, "global_step": 630643, "epoch": 7598} {"train_loss": -27.80441665649414, "global_step": 630644, "epoch": 7598} {"train_loss": -27.8641300201416, "global_step": 630645, "epoch": 7598} {"train_loss": -27.895832061767578, "global_step": 630646, "epoch": 7598} {"train_loss": -27.4525146484375, "global_step": 630647, "epoch": 7598} {"train_loss": -27.886789321899414, "global_step": 630648, "epoch": 7598} {"train_loss": -27.891828536987305, "global_step": 630649, "epoch": 7598} {"train_loss": -27.975671768188477, "global_step": 630650, "epoch": 7598} {"train_loss": -28.1028995513916, "global_step": 630651, "epoch": 7598} {"train_loss": -27.649572372436523, "global_step": 630652, "epoch": 7598} {"train_loss": -27.698766708374023, "global_step": 630653, "epoch": 7598} {"train_loss": -27.929397583007812, "global_step": 630654, "epoch": 7598} {"train_loss": -27.88380241394043, "global_step": 630655, "epoch": 7598} {"train_loss": -27.608739852905273, "global_step": 630656, "epoch": 7598} {"train_loss": -27.8309268951416, "global_step": 630657, "epoch": 7598} {"train_loss": -27.949438095092773, "global_step": 630658, "epoch": 7598} {"train_loss": -27.689359664916992, "global_step": 630659, "epoch": 7598} {"train_loss": -28.012313842773438, "global_step": 630660, "epoch": 7598} {"train_loss": -28.227136611938477, "global_step": 630661, "epoch": 7598} {"train_loss": -27.948352813720703, "global_step": 630662, "epoch": 7598} {"train_loss": -28.38865089416504, "global_step": 630663, "epoch": 7598} {"train_loss": -28.056873321533203, "global_step": 630664, "epoch": 7598} {"train_loss": -28.02617835998535, "global_step": 630665, "epoch": 7598} {"train_loss": -28.117544174194336, "global_step": 630666, "epoch": 7598} {"train_loss": -28.36407470703125, "global_step": 630667, "epoch": 7598} {"train_loss": -28.246763229370117, "global_step": 630668, "epoch": 7598} {"train_loss": -28.233169555664062, "global_step": 630669, "epoch": 7598} {"train_loss": -28.114953994750977, "global_step": 630670, "epoch": 7598} {"train_loss": -28.35262107849121, "global_step": 630671, "epoch": 7598} {"train_loss": -27.788305282592773, "global_step": 630672, "epoch": 7598} {"train_loss": -27.90781593322754, "global_step": 630673, "epoch": 7598} {"train_loss": -28.205001831054688, "global_step": 630674, "epoch": 7598} {"train_loss": -27.874622344970703, "global_step": 630675, "epoch": 7598} {"train_loss": -28.321069717407227, "global_step": 630676, "epoch": 7598} {"train_loss": -28.17901039123535, "global_step": 630677, "epoch": 7598} {"train_loss": -28.3489990234375, "global_step": 630678, "epoch": 7598} {"train_loss": -28.01295280456543, "global_step": 630679, "epoch": 7598} {"train_loss": -28.529020309448242, "global_step": 630680, "epoch": 7598} {"train_loss": -28.28492546081543, "global_step": 630681, "epoch": 7598} {"train_loss": -28.097293853759766, "global_step": 630682, "epoch": 7598} {"train_loss": -28.277545928955078, "global_step": 630683, "epoch": 7598} {"train_loss": -28.19032096862793, "global_step": 630684, "epoch": 7598} {"train_loss": -28.394515991210938, "global_step": 630685, "epoch": 7598} {"train_loss": -28.386856079101562, "global_step": 630686, "epoch": 7598} {"train_loss": -28.35145378112793, "global_step": 630687, "epoch": 7598} {"train_loss": -28.9532470703125, "global_step": 630688, "epoch": 7598} {"train_loss": -28.24837303161621, "global_step": 630689, "epoch": 7598} {"train_loss": -27.98968505859375, "global_step": 630690, "epoch": 7598} {"train_loss": -28.243131637573242, "global_step": 630691, "epoch": 7598} {"train_loss": -28.50138282775879, "global_step": 630692, "epoch": 7598} {"train_loss": -28.55531120300293, "global_step": 630693, "epoch": 7598} {"train_loss": -28.192737579345703, "global_step": 630694, "epoch": 7598} {"train_loss": -28.730987548828125, "global_step": 630695, "epoch": 7598} {"train_loss": -28.895727157592773, "global_step": 630696, "epoch": 7598} {"train_loss": -28.37299919128418, "global_step": 630697, "epoch": 7598} {"train_loss": -28.43507194519043, "global_step": 630698, "epoch": 7598} {"train_loss": -28.434438705444336, "global_step": 630699, "epoch": 7598} {"train_loss": -28.268360137939453, "global_step": 630700, "epoch": 7598} {"train_loss": -28.5087833404541, "global_step": 630701, "epoch": 7598} {"train_loss": -28.041339874267578, "global_step": 630702, "epoch": 7598} {"train_loss": -27.537067413330078, "global_step": 630703, "epoch": 7598} {"train_loss": -26.669065475463867, "global_step": 630704, "epoch": 7598} {"train_loss": -24.645780563354492, "global_step": 630705, "epoch": 7598} {"train_loss": -24.157312393188477, "global_step": 630706, "epoch": 7598} {"train_loss": -24.423856735229492, "global_step": 630707, "epoch": 7598} {"train_loss": -24.585302352905273, "global_step": 630708, "epoch": 7598} {"train_loss": -27.2940673828125, "global_step": 630709, "epoch": 7598} {"train_loss": -26.22051429748535, "global_step": 630710, "epoch": 7598} {"train_loss": -27.2172908782959, "global_step": 630711, "epoch": 7598} {"train_loss": -26.779821395874023, "global_step": 630712, "epoch": 7598} {"train_loss": -27.0546875, "global_step": 630713, "epoch": 7598} {"train_loss": -27.13189125061035, "global_step": 630714, "epoch": 7598} {"train_loss": -27.19586181640625, "global_step": 630715, "epoch": 7598} {"train_loss": -27.75436490989593, "global_step": 630716, "epoch": 7598, "val_loss": 6715740.0} {"train_loss": -26.752899169921875, "global_step": 630717, "epoch": 7599} {"train_loss": -26.2917423248291, "global_step": 630718, "epoch": 7599} {"train_loss": -26.805419921875, "global_step": 630719, "epoch": 7599} {"train_loss": -26.467084884643555, "global_step": 630720, "epoch": 7599} {"train_loss": -26.655176162719727, "global_step": 630721, "epoch": 7599} {"train_loss": -26.963577270507812, "global_step": 630722, "epoch": 7599} {"train_loss": -27.057422637939453, "global_step": 630723, "epoch": 7599} {"train_loss": -26.46607780456543, "global_step": 630724, "epoch": 7599} {"train_loss": -27.050352096557617, "global_step": 630725, "epoch": 7599} {"train_loss": -27.148584365844727, "global_step": 630726, "epoch": 7599} {"train_loss": -26.97208595275879, "global_step": 630727, "epoch": 7599} {"train_loss": -26.813398361206055, "global_step": 630728, "epoch": 7599} {"train_loss": -27.18726921081543, "global_step": 630729, "epoch": 7599} {"train_loss": -27.324283599853516, "global_step": 630730, "epoch": 7599} {"train_loss": -27.201623916625977, "global_step": 630731, "epoch": 7599} {"train_loss": -27.3847599029541, "global_step": 630732, "epoch": 7599} {"train_loss": -27.658203125, "global_step": 630733, "epoch": 7599} {"train_loss": -27.52484130859375, "global_step": 630734, "epoch": 7599} {"train_loss": -27.45155143737793, "global_step": 630735, "epoch": 7599} {"train_loss": -27.659168243408203, "global_step": 630736, "epoch": 7599} {"train_loss": -27.78663444519043, "global_step": 630737, "epoch": 7599} {"train_loss": -27.71579360961914, "global_step": 630738, "epoch": 7599} {"train_loss": -27.680517196655273, "global_step": 630739, "epoch": 7599} {"train_loss": -27.69431495666504, "global_step": 630740, "epoch": 7599} {"train_loss": -27.976898193359375, "global_step": 630741, "epoch": 7599} {"train_loss": -27.538721084594727, "global_step": 630742, "epoch": 7599} {"train_loss": -27.624738693237305, "global_step": 630743, "epoch": 7599} {"train_loss": -27.8644962310791, "global_step": 630744, "epoch": 7599} {"train_loss": -27.69964027404785, "global_step": 630745, "epoch": 7599} {"train_loss": -28.018299102783203, "global_step": 630746, "epoch": 7599} {"train_loss": -27.931121826171875, "global_step": 630747, "epoch": 7599} {"train_loss": -28.042465209960938, "global_step": 630748, "epoch": 7599} {"train_loss": -27.581024169921875, "global_step": 630749, "epoch": 7599} {"train_loss": -27.817520141601562, "global_step": 630750, "epoch": 7599} {"train_loss": -27.7967529296875, "global_step": 630751, "epoch": 7599} {"train_loss": -27.84417152404785, "global_step": 630752, "epoch": 7599} {"train_loss": -27.993066787719727, "global_step": 630753, "epoch": 7599} {"train_loss": -28.048507690429688, "global_step": 630754, "epoch": 7599} {"train_loss": -28.38406753540039, "global_step": 630755, "epoch": 7599} {"train_loss": -28.28546714782715, "global_step": 630756, "epoch": 7599} {"train_loss": -28.3226375579834, "global_step": 630757, "epoch": 7599} {"train_loss": -28.123132705688477, "global_step": 630758, "epoch": 7599} {"train_loss": -28.836729049682617, "global_step": 630759, "epoch": 7599} {"train_loss": -28.614160537719727, "global_step": 630760, "epoch": 7599} {"train_loss": -28.254201889038086, "global_step": 630761, "epoch": 7599} {"train_loss": -28.304716110229492, "global_step": 630762, "epoch": 7599} {"train_loss": -28.119125366210938, "global_step": 630763, "epoch": 7599} {"train_loss": -28.575475692749023, "global_step": 630764, "epoch": 7599} {"train_loss": -28.241729736328125, "global_step": 630765, "epoch": 7599} {"train_loss": -28.329456329345703, "global_step": 630766, "epoch": 7599} {"train_loss": -28.193689346313477, "global_step": 630767, "epoch": 7599} {"train_loss": -28.62818717956543, "global_step": 630768, "epoch": 7599} {"train_loss": -28.203277587890625, "global_step": 630769, "epoch": 7599} {"train_loss": -27.93079948425293, "global_step": 630770, "epoch": 7599} {"train_loss": -28.4610595703125, "global_step": 630771, "epoch": 7599} {"train_loss": -28.110239028930664, "global_step": 630772, "epoch": 7599} {"train_loss": -27.666004180908203, "global_step": 630773, "epoch": 7599} {"train_loss": -28.093976974487305, "global_step": 630774, "epoch": 7599} {"train_loss": -28.348791122436523, "global_step": 630775, "epoch": 7599} {"train_loss": -28.016754150390625, "global_step": 630776, "epoch": 7599} {"train_loss": -28.0692081451416, "global_step": 630777, "epoch": 7599} {"train_loss": -28.39029884338379, "global_step": 630778, "epoch": 7599} {"train_loss": -28.260208129882812, "global_step": 630779, "epoch": 7599} {"train_loss": -27.86114501953125, "global_step": 630780, "epoch": 7599} {"train_loss": -28.05989646911621, "global_step": 630781, "epoch": 7599} {"train_loss": -28.124841690063477, "global_step": 630782, "epoch": 7599} {"train_loss": -28.095212936401367, "global_step": 630783, "epoch": 7599} {"train_loss": -28.476184844970703, "global_step": 630784, "epoch": 7599} {"train_loss": -28.322193145751953, "global_step": 630785, "epoch": 7599} {"train_loss": -28.376789093017578, "global_step": 630786, "epoch": 7599} {"train_loss": -28.409637451171875, "global_step": 630787, "epoch": 7599} {"train_loss": -27.830121994018555, "global_step": 630788, "epoch": 7599} {"train_loss": -28.13534927368164, "global_step": 630789, "epoch": 7599} {"train_loss": -28.15610122680664, "global_step": 630790, "epoch": 7599} {"train_loss": -28.619237899780273, "global_step": 630791, "epoch": 7599} {"train_loss": -28.208478927612305, "global_step": 630792, "epoch": 7599} {"train_loss": -28.54825782775879, "global_step": 630793, "epoch": 7599} {"train_loss": -28.473865509033203, "global_step": 630794, "epoch": 7599} {"train_loss": -28.454206466674805, "global_step": 630795, "epoch": 7599} {"train_loss": -28.409896850585938, "global_step": 630796, "epoch": 7599} {"train_loss": -28.076276779174805, "global_step": 630797, "epoch": 7599} {"train_loss": -28.200185775756836, "global_step": 630798, "epoch": 7599} {"train_loss": -27.883092305746423, "global_step": 630799, "epoch": 7599, "val_loss": 6776823.5} {"train_loss": -27.886510848999023, "global_step": 630800, "epoch": 7600} {"train_loss": -27.943029403686523, "global_step": 630801, "epoch": 7600} {"train_loss": -28.09974479675293, "global_step": 630802, "epoch": 7600} {"train_loss": -28.302587509155273, "global_step": 630803, "epoch": 7600} {"train_loss": -27.531686782836914, "global_step": 630804, "epoch": 7600} {"train_loss": -27.465314865112305, "global_step": 630805, "epoch": 7600} {"train_loss": -27.312280654907227, "global_step": 630806, "epoch": 7600} {"train_loss": -28.4617919921875, "global_step": 630807, "epoch": 7600} {"train_loss": -27.77113914489746, "global_step": 630808, "epoch": 7600} {"train_loss": -27.859098434448242, "global_step": 630809, "epoch": 7600} {"train_loss": -28.215316772460938, "global_step": 630810, "epoch": 7600} {"train_loss": -28.144317626953125, "global_step": 630811, "epoch": 7600} {"train_loss": -27.930877685546875, "global_step": 630812, "epoch": 7600} {"train_loss": -28.37306785583496, "global_step": 630813, "epoch": 7600} {"train_loss": -28.107568740844727, "global_step": 630814, "epoch": 7600} {"train_loss": -28.256711959838867, "global_step": 630815, "epoch": 7600} {"train_loss": -28.07341957092285, "global_step": 630816, "epoch": 7600} {"train_loss": -27.703704833984375, "global_step": 630817, "epoch": 7600} {"train_loss": -27.61326026916504, "global_step": 630818, "epoch": 7600} {"train_loss": -28.717681884765625, "global_step": 630819, "epoch": 7600} {"train_loss": -27.79376792907715, "global_step": 630820, "epoch": 7600} {"train_loss": -28.097211837768555, "global_step": 630821, "epoch": 7600} {"train_loss": -28.40651512145996, "global_step": 630822, "epoch": 7600} {"train_loss": -28.14185905456543, "global_step": 630823, "epoch": 7600} {"train_loss": -28.402759552001953, "global_step": 630824, "epoch": 7600} {"train_loss": -28.398651123046875, "global_step": 630825, "epoch": 7600} {"train_loss": -28.030065536499023, "global_step": 630826, "epoch": 7600} {"train_loss": -28.362293243408203, "global_step": 630827, "epoch": 7600} {"train_loss": -28.032825469970703, "global_step": 630828, "epoch": 7600} {"train_loss": -28.497949600219727, "global_step": 630829, "epoch": 7600} {"train_loss": -28.113317489624023, "global_step": 630830, "epoch": 7600} {"train_loss": -28.482568740844727, "global_step": 630831, "epoch": 7600} {"train_loss": -28.307546615600586, "global_step": 630832, "epoch": 7600} {"train_loss": -28.078933715820312, "global_step": 630833, "epoch": 7600} {"train_loss": -28.52442741394043, "global_step": 630834, "epoch": 7600} {"train_loss": -28.14496421813965, "global_step": 630835, "epoch": 7600} {"train_loss": -28.283315658569336, "global_step": 630836, "epoch": 7600} {"train_loss": -28.3713321685791, "global_step": 630837, "epoch": 7600} {"train_loss": -28.673248291015625, "global_step": 630838, "epoch": 7600} {"train_loss": -28.387115478515625, "global_step": 630839, "epoch": 7600} {"train_loss": -28.43556022644043, "global_step": 630840, "epoch": 7600} {"train_loss": -28.75146484375, "global_step": 630841, "epoch": 7600} {"train_loss": -28.2546329498291, "global_step": 630842, "epoch": 7600} {"train_loss": -28.2239990234375, "global_step": 630843, "epoch": 7600} {"train_loss": -28.306232452392578, "global_step": 630844, "epoch": 7600} {"train_loss": -28.442367553710938, "global_step": 630845, "epoch": 7600} {"train_loss": -27.981739044189453, "global_step": 630846, "epoch": 7600} {"train_loss": -28.23640251159668, "global_step": 630847, "epoch": 7600} {"train_loss": -28.30030632019043, "global_step": 630848, "epoch": 7600} {"train_loss": -28.20794677734375, "global_step": 630849, "epoch": 7600} {"train_loss": -28.44294548034668, "global_step": 630850, "epoch": 7600} {"train_loss": -28.142847061157227, "global_step": 630851, "epoch": 7600} {"train_loss": -28.483356475830078, "global_step": 630852, "epoch": 7600} {"train_loss": -28.281436920166016, "global_step": 630853, "epoch": 7600} {"train_loss": -28.283618927001953, "global_step": 630854, "epoch": 7600} {"train_loss": -28.169218063354492, "global_step": 630855, "epoch": 7600} {"train_loss": -28.034040451049805, "global_step": 630856, "epoch": 7600} {"train_loss": -27.7216854095459, "global_step": 630857, "epoch": 7600} {"train_loss": -27.42193603515625, "global_step": 630858, "epoch": 7600} {"train_loss": -27.633901596069336, "global_step": 630859, "epoch": 7600} {"train_loss": -28.05267333984375, "global_step": 630860, "epoch": 7600} {"train_loss": -28.231412887573242, "global_step": 630861, "epoch": 7600} {"train_loss": -28.355239868164062, "global_step": 630862, "epoch": 7600} {"train_loss": -28.13471794128418, "global_step": 630863, "epoch": 7600} {"train_loss": -28.12542724609375, "global_step": 630864, "epoch": 7600} {"train_loss": -28.214704513549805, "global_step": 630865, "epoch": 7600} {"train_loss": -28.8490047454834, "global_step": 630866, "epoch": 7600} {"train_loss": -28.01445960998535, "global_step": 630867, "epoch": 7600} {"train_loss": -28.295080184936523, "global_step": 630868, "epoch": 7600} {"train_loss": -27.95038414001465, "global_step": 630869, "epoch": 7600} {"train_loss": -28.016178131103516, "global_step": 630870, "epoch": 7600} {"train_loss": -27.767362594604492, "global_step": 630871, "epoch": 7600} {"train_loss": -28.405675888061523, "global_step": 630872, "epoch": 7600} {"train_loss": -27.803043365478516, "global_step": 630873, "epoch": 7600} {"train_loss": -28.227323532104492, "global_step": 630874, "epoch": 7600} {"train_loss": -28.10678482055664, "global_step": 630875, "epoch": 7600} {"train_loss": -28.29066276550293, "global_step": 630876, "epoch": 7600} {"train_loss": -28.36244010925293, "global_step": 630877, "epoch": 7600} {"train_loss": -28.18023109436035, "global_step": 630878, "epoch": 7600} {"train_loss": -28.09419822692871, "global_step": 630879, "epoch": 7600} {"train_loss": -27.864002227783203, "global_step": 630880, "epoch": 7600} {"train_loss": -28.045133590698242, "global_step": 630881, "epoch": 7600} {"train_loss": -28.166554646319653, "global_step": 630882, "epoch": 7600, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6639065.0} {"train_loss": -27.781097412109375, "global_step": 630883, "epoch": 7601} {"train_loss": -27.486026763916016, "global_step": 630884, "epoch": 7601} {"train_loss": -27.782886505126953, "global_step": 630885, "epoch": 7601} {"train_loss": -27.946563720703125, "global_step": 630886, "epoch": 7601} {"train_loss": -27.62723159790039, "global_step": 630887, "epoch": 7601} {"train_loss": -28.030187606811523, "global_step": 630888, "epoch": 7601} {"train_loss": -27.73345947265625, "global_step": 630889, "epoch": 7601} {"train_loss": -28.303686141967773, "global_step": 630890, "epoch": 7601} {"train_loss": -27.863727569580078, "global_step": 630891, "epoch": 7601} {"train_loss": -27.513580322265625, "global_step": 630892, "epoch": 7601} {"train_loss": -27.637048721313477, "global_step": 630893, "epoch": 7601} {"train_loss": -27.524036407470703, "global_step": 630894, "epoch": 7601} {"train_loss": -27.647979736328125, "global_step": 630895, "epoch": 7601} {"train_loss": -27.998632431030273, "global_step": 630896, "epoch": 7601} {"train_loss": -27.64578628540039, "global_step": 630897, "epoch": 7601} {"train_loss": -28.02606201171875, "global_step": 630898, "epoch": 7601} {"train_loss": -28.101974487304688, "global_step": 630899, "epoch": 7601} {"train_loss": -27.83003807067871, "global_step": 630900, "epoch": 7601} {"train_loss": -27.789325714111328, "global_step": 630901, "epoch": 7601} {"train_loss": -28.15618324279785, "global_step": 630902, "epoch": 7601} {"train_loss": -27.95514488220215, "global_step": 630903, "epoch": 7601} {"train_loss": -27.980920791625977, "global_step": 630904, "epoch": 7601} {"train_loss": -28.058170318603516, "global_step": 630905, "epoch": 7601} {"train_loss": -27.914854049682617, "global_step": 630906, "epoch": 7601} {"train_loss": -28.00674819946289, "global_step": 630907, "epoch": 7601} {"train_loss": -28.246891021728516, "global_step": 630908, "epoch": 7601} {"train_loss": -28.464874267578125, "global_step": 630909, "epoch": 7601} {"train_loss": -28.07464599609375, "global_step": 630910, "epoch": 7601} {"train_loss": -28.30122184753418, "global_step": 630911, "epoch": 7601} {"train_loss": -28.13054847717285, "global_step": 630912, "epoch": 7601} {"train_loss": -28.108747482299805, "global_step": 630913, "epoch": 7601} {"train_loss": -28.321287155151367, "global_step": 630914, "epoch": 7601} {"train_loss": -28.084918975830078, "global_step": 630915, "epoch": 7601} {"train_loss": -28.45556640625, "global_step": 630916, "epoch": 7601} {"train_loss": -28.28154945373535, "global_step": 630917, "epoch": 7601} {"train_loss": -28.1767578125, "global_step": 630918, "epoch": 7601} {"train_loss": -28.2977352142334, "global_step": 630919, "epoch": 7601} {"train_loss": -28.200653076171875, "global_step": 630920, "epoch": 7601} {"train_loss": -27.991193771362305, "global_step": 630921, "epoch": 7601} {"train_loss": -28.65677261352539, "global_step": 630922, "epoch": 7601} {"train_loss": -28.01611328125, "global_step": 630923, "epoch": 7601} {"train_loss": -28.35439109802246, "global_step": 630924, "epoch": 7601} {"train_loss": -27.936019897460938, "global_step": 630925, "epoch": 7601} {"train_loss": -28.240808486938477, "global_step": 630926, "epoch": 7601} {"train_loss": -28.21854019165039, "global_step": 630927, "epoch": 7601} {"train_loss": -28.28139305114746, "global_step": 630928, "epoch": 7601} {"train_loss": -28.328882217407227, "global_step": 630929, "epoch": 7601} {"train_loss": -28.2930850982666, "global_step": 630930, "epoch": 7601} {"train_loss": -27.783218383789062, "global_step": 630931, "epoch": 7601} {"train_loss": -28.00278091430664, "global_step": 630932, "epoch": 7601} {"train_loss": -28.251989364624023, "global_step": 630933, "epoch": 7601} {"train_loss": -28.014795303344727, "global_step": 630934, "epoch": 7601} {"train_loss": -28.168628692626953, "global_step": 630935, "epoch": 7601} {"train_loss": -28.1689453125, "global_step": 630936, "epoch": 7601} {"train_loss": -28.14667320251465, "global_step": 630937, "epoch": 7601} {"train_loss": -28.134906768798828, "global_step": 630938, "epoch": 7601} {"train_loss": -28.332197189331055, "global_step": 630939, "epoch": 7601} {"train_loss": -28.439992904663086, "global_step": 630940, "epoch": 7601} {"train_loss": -28.2036190032959, "global_step": 630941, "epoch": 7601} {"train_loss": -28.04282569885254, "global_step": 630942, "epoch": 7601} {"train_loss": -28.55879020690918, "global_step": 630943, "epoch": 7601} {"train_loss": -28.182403564453125, "global_step": 630944, "epoch": 7601} {"train_loss": -28.377613067626953, "global_step": 630945, "epoch": 7601} {"train_loss": -28.08966064453125, "global_step": 630946, "epoch": 7601} {"train_loss": -28.164697647094727, "global_step": 630947, "epoch": 7601} {"train_loss": -28.31672477722168, "global_step": 630948, "epoch": 7601} {"train_loss": -28.471221923828125, "global_step": 630949, "epoch": 7601} {"train_loss": -28.52191162109375, "global_step": 630950, "epoch": 7601} {"train_loss": -28.5976619720459, "global_step": 630951, "epoch": 7601} {"train_loss": -28.350555419921875, "global_step": 630952, "epoch": 7601} {"train_loss": -28.1774959564209, "global_step": 630953, "epoch": 7601} {"train_loss": -28.60157585144043, "global_step": 630954, "epoch": 7601} {"train_loss": -28.121320724487305, "global_step": 630955, "epoch": 7601} {"train_loss": -27.964202880859375, "global_step": 630956, "epoch": 7601} {"train_loss": -28.091949462890625, "global_step": 630957, "epoch": 7601} {"train_loss": -28.170034408569336, "global_step": 630958, "epoch": 7601} {"train_loss": -28.59514808654785, "global_step": 630959, "epoch": 7601} {"train_loss": -27.970539093017578, "global_step": 630960, "epoch": 7601} {"train_loss": -28.374195098876953, "global_step": 630961, "epoch": 7601} {"train_loss": -28.19668960571289, "global_step": 630962, "epoch": 7601} {"train_loss": -28.29835319519043, "global_step": 630963, "epoch": 7601} {"train_loss": -28.639326095581055, "global_step": 630964, "epoch": 7601} {"train_loss": -28.13202752262713, "global_step": 630965, "epoch": 7601, "val_loss": 6657879.5} {"train_loss": -27.12428092956543, "global_step": 630966, "epoch": 7602} {"train_loss": -26.446374893188477, "global_step": 630967, "epoch": 7602} {"train_loss": -26.622228622436523, "global_step": 630968, "epoch": 7602} {"train_loss": -27.48505973815918, "global_step": 630969, "epoch": 7602} {"train_loss": -27.67506217956543, "global_step": 630970, "epoch": 7602} {"train_loss": -27.1253662109375, "global_step": 630971, "epoch": 7602} {"train_loss": -28.087194442749023, "global_step": 630972, "epoch": 7602} {"train_loss": -27.711505889892578, "global_step": 630973, "epoch": 7602} {"train_loss": -28.25789451599121, "global_step": 630974, "epoch": 7602} {"train_loss": -27.96882438659668, "global_step": 630975, "epoch": 7602} {"train_loss": -28.100784301757812, "global_step": 630976, "epoch": 7602} {"train_loss": -27.7163143157959, "global_step": 630977, "epoch": 7602} {"train_loss": -27.826025009155273, "global_step": 630978, "epoch": 7602} {"train_loss": -28.003339767456055, "global_step": 630979, "epoch": 7602} {"train_loss": -27.694028854370117, "global_step": 630980, "epoch": 7602} {"train_loss": -28.016260147094727, "global_step": 630981, "epoch": 7602} {"train_loss": -28.15406608581543, "global_step": 630982, "epoch": 7602} {"train_loss": -28.054468154907227, "global_step": 630983, "epoch": 7602} {"train_loss": -28.251379013061523, "global_step": 630984, "epoch": 7602} {"train_loss": -27.938634872436523, "global_step": 630985, "epoch": 7602} {"train_loss": -27.877294540405273, "global_step": 630986, "epoch": 7602} {"train_loss": -28.170751571655273, "global_step": 630987, "epoch": 7602} {"train_loss": -28.159164428710938, "global_step": 630988, "epoch": 7602} {"train_loss": -27.978357315063477, "global_step": 630989, "epoch": 7602} {"train_loss": -28.177490234375, "global_step": 630990, "epoch": 7602} {"train_loss": -28.21648597717285, "global_step": 630991, "epoch": 7602} {"train_loss": -28.5226993560791, "global_step": 630992, "epoch": 7602} {"train_loss": -28.321765899658203, "global_step": 630993, "epoch": 7602} {"train_loss": -27.9822998046875, "global_step": 630994, "epoch": 7602} {"train_loss": -28.5491943359375, "global_step": 630995, "epoch": 7602} {"train_loss": -27.881717681884766, "global_step": 630996, "epoch": 7602} {"train_loss": -27.993616104125977, "global_step": 630997, "epoch": 7602} {"train_loss": -28.420495986938477, "global_step": 630998, "epoch": 7602} {"train_loss": -27.718219757080078, "global_step": 630999, "epoch": 7602} {"train_loss": -28.254682540893555, "global_step": 631000, "epoch": 7602} {"train_loss": -28.265823364257812, "global_step": 631001, "epoch": 7602} {"train_loss": -28.14299964904785, "global_step": 631002, "epoch": 7602} {"train_loss": -28.13214683532715, "global_step": 631003, "epoch": 7602} {"train_loss": -28.486494064331055, "global_step": 631004, "epoch": 7602} {"train_loss": -28.392227172851562, "global_step": 631005, "epoch": 7602} {"train_loss": -28.618940353393555, "global_step": 631006, "epoch": 7602} {"train_loss": -28.247663497924805, "global_step": 631007, "epoch": 7602} {"train_loss": -28.2572021484375, "global_step": 631008, "epoch": 7602} {"train_loss": -28.031728744506836, "global_step": 631009, "epoch": 7602} {"train_loss": -28.34368324279785, "global_step": 631010, "epoch": 7602} {"train_loss": -28.2153263092041, "global_step": 631011, "epoch": 7602} {"train_loss": -27.9199275970459, "global_step": 631012, "epoch": 7602} {"train_loss": -28.3832950592041, "global_step": 631013, "epoch": 7602} {"train_loss": -28.069828033447266, "global_step": 631014, "epoch": 7602} {"train_loss": -28.163299560546875, "global_step": 631015, "epoch": 7602} {"train_loss": -28.24982261657715, "global_step": 631016, "epoch": 7602} {"train_loss": -28.770055770874023, "global_step": 631017, "epoch": 7602} {"train_loss": -28.33758544921875, "global_step": 631018, "epoch": 7602} {"train_loss": -28.302722930908203, "global_step": 631019, "epoch": 7602} {"train_loss": -28.711395263671875, "global_step": 631020, "epoch": 7602} {"train_loss": -28.13825798034668, "global_step": 631021, "epoch": 7602} {"train_loss": -28.190473556518555, "global_step": 631022, "epoch": 7602} {"train_loss": -28.167749404907227, "global_step": 631023, "epoch": 7602} {"train_loss": -28.255117416381836, "global_step": 631024, "epoch": 7602} {"train_loss": -28.392242431640625, "global_step": 631025, "epoch": 7602} {"train_loss": -28.245847702026367, "global_step": 631026, "epoch": 7602} {"train_loss": -28.228515625, "global_step": 631027, "epoch": 7602} {"train_loss": -28.160795211791992, "global_step": 631028, "epoch": 7602} {"train_loss": -27.752552032470703, "global_step": 631029, "epoch": 7602} {"train_loss": -27.910276412963867, "global_step": 631030, "epoch": 7602} {"train_loss": -28.031946182250977, "global_step": 631031, "epoch": 7602} {"train_loss": -28.22303581237793, "global_step": 631032, "epoch": 7602} {"train_loss": -28.067834854125977, "global_step": 631033, "epoch": 7602} {"train_loss": -28.14735221862793, "global_step": 631034, "epoch": 7602} {"train_loss": -28.178009033203125, "global_step": 631035, "epoch": 7602} {"train_loss": -28.228979110717773, "global_step": 631036, "epoch": 7602} {"train_loss": -27.873737335205078, "global_step": 631037, "epoch": 7602} {"train_loss": -28.601720809936523, "global_step": 631038, "epoch": 7602} {"train_loss": -28.23406982421875, "global_step": 631039, "epoch": 7602} {"train_loss": -27.874433517456055, "global_step": 631040, "epoch": 7602} {"train_loss": -28.195959091186523, "global_step": 631041, "epoch": 7602} {"train_loss": -27.687286376953125, "global_step": 631042, "epoch": 7602} {"train_loss": -27.339630126953125, "global_step": 631043, "epoch": 7602} {"train_loss": -26.957937240600586, "global_step": 631044, "epoch": 7602} {"train_loss": -25.421829223632812, "global_step": 631045, "epoch": 7602} {"train_loss": -26.504718780517578, "global_step": 631046, "epoch": 7602} {"train_loss": -27.932392120361328, "global_step": 631047, "epoch": 7602} {"train_loss": -27.98574385585555, "global_step": 631048, "epoch": 7602, "val_loss": 6669385.0} {"train_loss": -22.64092445373535, "global_step": 631049, "epoch": 7603} {"train_loss": -26.202539443969727, "global_step": 631050, "epoch": 7603} {"train_loss": -25.244720458984375, "global_step": 631051, "epoch": 7603} {"train_loss": -25.42926597595215, "global_step": 631052, "epoch": 7603} {"train_loss": -26.828994750976562, "global_step": 631053, "epoch": 7603} {"train_loss": -25.9155216217041, "global_step": 631054, "epoch": 7603} {"train_loss": -25.821060180664062, "global_step": 631055, "epoch": 7603} {"train_loss": -26.1026554107666, "global_step": 631056, "epoch": 7603} {"train_loss": -26.611433029174805, "global_step": 631057, "epoch": 7603} {"train_loss": -26.515527725219727, "global_step": 631058, "epoch": 7603} {"train_loss": -26.28321647644043, "global_step": 631059, "epoch": 7603} {"train_loss": -26.683210372924805, "global_step": 631060, "epoch": 7603} {"train_loss": -27.18928337097168, "global_step": 631061, "epoch": 7603} {"train_loss": -26.93429946899414, "global_step": 631062, "epoch": 7603} {"train_loss": -26.716039657592773, "global_step": 631063, "epoch": 7603} {"train_loss": -27.0174617767334, "global_step": 631064, "epoch": 7603} {"train_loss": -26.945764541625977, "global_step": 631065, "epoch": 7603} {"train_loss": -27.48211669921875, "global_step": 631066, "epoch": 7603} {"train_loss": -27.137439727783203, "global_step": 631067, "epoch": 7603} {"train_loss": -27.145923614501953, "global_step": 631068, "epoch": 7603} {"train_loss": -27.215473175048828, "global_step": 631069, "epoch": 7603} {"train_loss": -27.03843116760254, "global_step": 631070, "epoch": 7603} {"train_loss": -27.160907745361328, "global_step": 631071, "epoch": 7603} {"train_loss": -26.712797164916992, "global_step": 631072, "epoch": 7603} {"train_loss": -27.203277587890625, "global_step": 631073, "epoch": 7603} {"train_loss": -27.704803466796875, "global_step": 631074, "epoch": 7603} {"train_loss": -27.686811447143555, "global_step": 631075, "epoch": 7603} {"train_loss": -27.590784072875977, "global_step": 631076, "epoch": 7603} {"train_loss": -27.22663688659668, "global_step": 631077, "epoch": 7603} {"train_loss": -27.970733642578125, "global_step": 631078, "epoch": 7603} {"train_loss": -27.48076820373535, "global_step": 631079, "epoch": 7603} {"train_loss": -27.374160766601562, "global_step": 631080, "epoch": 7603} {"train_loss": -27.566389083862305, "global_step": 631081, "epoch": 7603} {"train_loss": -27.2908935546875, "global_step": 631082, "epoch": 7603} {"train_loss": -27.883075714111328, "global_step": 631083, "epoch": 7603} {"train_loss": -27.413105010986328, "global_step": 631084, "epoch": 7603} {"train_loss": -27.91812515258789, "global_step": 631085, "epoch": 7603} {"train_loss": -27.771947860717773, "global_step": 631086, "epoch": 7603} {"train_loss": -27.858932495117188, "global_step": 631087, "epoch": 7603} {"train_loss": -27.7556209564209, "global_step": 631088, "epoch": 7603} {"train_loss": -27.818811416625977, "global_step": 631089, "epoch": 7603} {"train_loss": -27.986469268798828, "global_step": 631090, "epoch": 7603} {"train_loss": -27.818134307861328, "global_step": 631091, "epoch": 7603} {"train_loss": -28.174230575561523, "global_step": 631092, "epoch": 7603} {"train_loss": -27.986936569213867, "global_step": 631093, "epoch": 7603} {"train_loss": -28.086196899414062, "global_step": 631094, "epoch": 7603} {"train_loss": -27.723297119140625, "global_step": 631095, "epoch": 7603} {"train_loss": -27.813989639282227, "global_step": 631096, "epoch": 7603} {"train_loss": -28.357528686523438, "global_step": 631097, "epoch": 7603} {"train_loss": -27.574575424194336, "global_step": 631098, "epoch": 7603} {"train_loss": -27.805688858032227, "global_step": 631099, "epoch": 7603} {"train_loss": -27.64691162109375, "global_step": 631100, "epoch": 7603} {"train_loss": -27.925037384033203, "global_step": 631101, "epoch": 7603} {"train_loss": -27.915266036987305, "global_step": 631102, "epoch": 7603} {"train_loss": -28.246702194213867, "global_step": 631103, "epoch": 7603} {"train_loss": -28.145160675048828, "global_step": 631104, "epoch": 7603} {"train_loss": -27.575439453125, "global_step": 631105, "epoch": 7603} {"train_loss": -28.21881103515625, "global_step": 631106, "epoch": 7603} {"train_loss": -27.921483993530273, "global_step": 631107, "epoch": 7603} {"train_loss": -27.868330001831055, "global_step": 631108, "epoch": 7603} {"train_loss": -28.0456485748291, "global_step": 631109, "epoch": 7603} {"train_loss": -27.745092391967773, "global_step": 631110, "epoch": 7603} {"train_loss": -28.157764434814453, "global_step": 631111, "epoch": 7603} {"train_loss": -27.816314697265625, "global_step": 631112, "epoch": 7603} {"train_loss": -27.6107177734375, "global_step": 631113, "epoch": 7603} {"train_loss": -28.017881393432617, "global_step": 631114, "epoch": 7603} {"train_loss": -27.72149085998535, "global_step": 631115, "epoch": 7603} {"train_loss": -27.84556007385254, "global_step": 631116, "epoch": 7603} {"train_loss": -27.891172409057617, "global_step": 631117, "epoch": 7603} {"train_loss": -28.14142417907715, "global_step": 631118, "epoch": 7603} {"train_loss": -28.14177894592285, "global_step": 631119, "epoch": 7603} {"train_loss": -28.03901481628418, "global_step": 631120, "epoch": 7603} {"train_loss": -28.016504287719727, "global_step": 631121, "epoch": 7603} {"train_loss": -28.129770278930664, "global_step": 631122, "epoch": 7603} {"train_loss": -28.056379318237305, "global_step": 631123, "epoch": 7603} {"train_loss": -28.141782760620117, "global_step": 631124, "epoch": 7603} {"train_loss": -27.968082427978516, "global_step": 631125, "epoch": 7603} {"train_loss": -27.632080078125, "global_step": 631126, "epoch": 7603} {"train_loss": -28.18568992614746, "global_step": 631127, "epoch": 7603} {"train_loss": -28.09161949157715, "global_step": 631128, "epoch": 7603} {"train_loss": -28.32578468322754, "global_step": 631129, "epoch": 7603} {"train_loss": -28.15437126159668, "global_step": 631130, "epoch": 7603} {"train_loss": -27.45271613798946, "global_step": 631131, "epoch": 7603, "val_loss": 6727969.5} {"train_loss": -28.059894561767578, "global_step": 631132, "epoch": 7604} {"train_loss": -27.4091796875, "global_step": 631133, "epoch": 7604} {"train_loss": -26.226383209228516, "global_step": 631134, "epoch": 7604} {"train_loss": -25.213640213012695, "global_step": 631135, "epoch": 7604} {"train_loss": -25.538862228393555, "global_step": 631136, "epoch": 7604} {"train_loss": -27.03411293029785, "global_step": 631137, "epoch": 7604} {"train_loss": -27.089879989624023, "global_step": 631138, "epoch": 7604} {"train_loss": -27.61512565612793, "global_step": 631139, "epoch": 7604} {"train_loss": -27.489124298095703, "global_step": 631140, "epoch": 7604} {"train_loss": -26.843774795532227, "global_step": 631141, "epoch": 7604} {"train_loss": -27.640289306640625, "global_step": 631142, "epoch": 7604} {"train_loss": -27.480566024780273, "global_step": 631143, "epoch": 7604} {"train_loss": -27.92270278930664, "global_step": 631144, "epoch": 7604} {"train_loss": -27.798791885375977, "global_step": 631145, "epoch": 7604} {"train_loss": -27.760156631469727, "global_step": 631146, "epoch": 7604} {"train_loss": -27.616470336914062, "global_step": 631147, "epoch": 7604} {"train_loss": -27.55414390563965, "global_step": 631148, "epoch": 7604} {"train_loss": -27.904905319213867, "global_step": 631149, "epoch": 7604} {"train_loss": -27.307348251342773, "global_step": 631150, "epoch": 7604} {"train_loss": -28.201074600219727, "global_step": 631151, "epoch": 7604} {"train_loss": -28.012191772460938, "global_step": 631152, "epoch": 7604} {"train_loss": -28.341766357421875, "global_step": 631153, "epoch": 7604} {"train_loss": -27.666126251220703, "global_step": 631154, "epoch": 7604} {"train_loss": -27.841083526611328, "global_step": 631155, "epoch": 7604} {"train_loss": -28.185651779174805, "global_step": 631156, "epoch": 7604} {"train_loss": -27.832874298095703, "global_step": 631157, "epoch": 7604} {"train_loss": -28.120880126953125, "global_step": 631158, "epoch": 7604} {"train_loss": -28.392377853393555, "global_step": 631159, "epoch": 7604} {"train_loss": -27.837249755859375, "global_step": 631160, "epoch": 7604} {"train_loss": -27.951303482055664, "global_step": 631161, "epoch": 7604} {"train_loss": -27.805334091186523, "global_step": 631162, "epoch": 7604} {"train_loss": -28.187047958374023, "global_step": 631163, "epoch": 7604} {"train_loss": -27.866668701171875, "global_step": 631164, "epoch": 7604} {"train_loss": -28.237546920776367, "global_step": 631165, "epoch": 7604} {"train_loss": -27.828128814697266, "global_step": 631166, "epoch": 7604} {"train_loss": -27.567846298217773, "global_step": 631167, "epoch": 7604} {"train_loss": -27.612104415893555, "global_step": 631168, "epoch": 7604} {"train_loss": -27.881031036376953, "global_step": 631169, "epoch": 7604} {"train_loss": -27.3206844329834, "global_step": 631170, "epoch": 7604} {"train_loss": -28.47712516784668, "global_step": 631171, "epoch": 7604} {"train_loss": -27.61279296875, "global_step": 631172, "epoch": 7604} {"train_loss": -27.771528244018555, "global_step": 631173, "epoch": 7604} {"train_loss": -27.651763916015625, "global_step": 631174, "epoch": 7604} {"train_loss": -28.079389572143555, "global_step": 631175, "epoch": 7604} {"train_loss": -28.178930282592773, "global_step": 631176, "epoch": 7604} {"train_loss": -28.183673858642578, "global_step": 631177, "epoch": 7604} {"train_loss": -27.913434982299805, "global_step": 631178, "epoch": 7604} {"train_loss": -27.832645416259766, "global_step": 631179, "epoch": 7604} {"train_loss": -28.510923385620117, "global_step": 631180, "epoch": 7604} {"train_loss": -28.052778244018555, "global_step": 631181, "epoch": 7604} {"train_loss": -28.39072608947754, "global_step": 631182, "epoch": 7604} {"train_loss": -28.135473251342773, "global_step": 631183, "epoch": 7604} {"train_loss": -28.02603530883789, "global_step": 631184, "epoch": 7604} {"train_loss": -28.358274459838867, "global_step": 631185, "epoch": 7604} {"train_loss": -28.226221084594727, "global_step": 631186, "epoch": 7604} {"train_loss": -28.164289474487305, "global_step": 631187, "epoch": 7604} {"train_loss": -28.314722061157227, "global_step": 631188, "epoch": 7604} {"train_loss": -28.277368545532227, "global_step": 631189, "epoch": 7604} {"train_loss": -28.306324005126953, "global_step": 631190, "epoch": 7604} {"train_loss": -28.2450008392334, "global_step": 631191, "epoch": 7604} {"train_loss": -28.260894775390625, "global_step": 631192, "epoch": 7604} {"train_loss": -28.329242706298828, "global_step": 631193, "epoch": 7604} {"train_loss": -28.679718017578125, "global_step": 631194, "epoch": 7604} {"train_loss": -28.574140548706055, "global_step": 631195, "epoch": 7604} {"train_loss": -28.352741241455078, "global_step": 631196, "epoch": 7604} {"train_loss": -28.217344284057617, "global_step": 631197, "epoch": 7604} {"train_loss": -28.27119255065918, "global_step": 631198, "epoch": 7604} {"train_loss": -28.262556076049805, "global_step": 631199, "epoch": 7604} {"train_loss": -28.6485652923584, "global_step": 631200, "epoch": 7604} {"train_loss": -28.217782974243164, "global_step": 631201, "epoch": 7604} {"train_loss": -28.341699600219727, "global_step": 631202, "epoch": 7604} {"train_loss": -28.14289665222168, "global_step": 631203, "epoch": 7604} {"train_loss": -28.42205810546875, "global_step": 631204, "epoch": 7604} {"train_loss": -28.226125717163086, "global_step": 631205, "epoch": 7604} {"train_loss": -28.340591430664062, "global_step": 631206, "epoch": 7604} {"train_loss": -27.914722442626953, "global_step": 631207, "epoch": 7604} {"train_loss": -28.628585815429688, "global_step": 631208, "epoch": 7604} {"train_loss": -28.269296646118164, "global_step": 631209, "epoch": 7604} {"train_loss": -28.039447784423828, "global_step": 631210, "epoch": 7604} {"train_loss": -27.98554801940918, "global_step": 631211, "epoch": 7604} {"train_loss": -28.35499382019043, "global_step": 631212, "epoch": 7604} {"train_loss": -28.430883407592773, "global_step": 631213, "epoch": 7604} {"train_loss": -27.932906575949794, "global_step": 631214, "epoch": 7604, "val_loss": 6703314.0} {"train_loss": -27.639450073242188, "global_step": 631215, "epoch": 7605} {"train_loss": -27.856725692749023, "global_step": 631216, "epoch": 7605} {"train_loss": -28.00166130065918, "global_step": 631217, "epoch": 7605} {"train_loss": -27.49676513671875, "global_step": 631218, "epoch": 7605} {"train_loss": -27.63291358947754, "global_step": 631219, "epoch": 7605} {"train_loss": -27.681537628173828, "global_step": 631220, "epoch": 7605} {"train_loss": -27.45355224609375, "global_step": 631221, "epoch": 7605} {"train_loss": -27.369897842407227, "global_step": 631222, "epoch": 7605} {"train_loss": -27.7088680267334, "global_step": 631223, "epoch": 7605} {"train_loss": -27.64832878112793, "global_step": 631224, "epoch": 7605} {"train_loss": -27.742040634155273, "global_step": 631225, "epoch": 7605} {"train_loss": -27.633087158203125, "global_step": 631226, "epoch": 7605} {"train_loss": -27.6522274017334, "global_step": 631227, "epoch": 7605} {"train_loss": -27.857824325561523, "global_step": 631228, "epoch": 7605} {"train_loss": -27.929899215698242, "global_step": 631229, "epoch": 7605} {"train_loss": -28.11469841003418, "global_step": 631230, "epoch": 7605} {"train_loss": -28.135761260986328, "global_step": 631231, "epoch": 7605} {"train_loss": -28.161767959594727, "global_step": 631232, "epoch": 7605} {"train_loss": -28.116113662719727, "global_step": 631233, "epoch": 7605} {"train_loss": -28.014129638671875, "global_step": 631234, "epoch": 7605} {"train_loss": -27.393585205078125, "global_step": 631235, "epoch": 7605} {"train_loss": -27.7565975189209, "global_step": 631236, "epoch": 7605} {"train_loss": -28.091089248657227, "global_step": 631237, "epoch": 7605} {"train_loss": -28.186176300048828, "global_step": 631238, "epoch": 7605} {"train_loss": -28.06422996520996, "global_step": 631239, "epoch": 7605} {"train_loss": -28.172382354736328, "global_step": 631240, "epoch": 7605} {"train_loss": -27.969511032104492, "global_step": 631241, "epoch": 7605} {"train_loss": -28.1717586517334, "global_step": 631242, "epoch": 7605} {"train_loss": -28.210968017578125, "global_step": 631243, "epoch": 7605} {"train_loss": -28.313552856445312, "global_step": 631244, "epoch": 7605} {"train_loss": -28.306730270385742, "global_step": 631245, "epoch": 7605} {"train_loss": -28.1043643951416, "global_step": 631246, "epoch": 7605} {"train_loss": -28.477155685424805, "global_step": 631247, "epoch": 7605} {"train_loss": -27.92426109313965, "global_step": 631248, "epoch": 7605} {"train_loss": -28.305633544921875, "global_step": 631249, "epoch": 7605} {"train_loss": -28.171863555908203, "global_step": 631250, "epoch": 7605} {"train_loss": -28.293676376342773, "global_step": 631251, "epoch": 7605} {"train_loss": -28.076730728149414, "global_step": 631252, "epoch": 7605} {"train_loss": -28.26807975769043, "global_step": 631253, "epoch": 7605} {"train_loss": -28.0422420501709, "global_step": 631254, "epoch": 7605} {"train_loss": -27.991697311401367, "global_step": 631255, "epoch": 7605} {"train_loss": -28.184982299804688, "global_step": 631256, "epoch": 7605} {"train_loss": -28.307432174682617, "global_step": 631257, "epoch": 7605} {"train_loss": -28.511228561401367, "global_step": 631258, "epoch": 7605} {"train_loss": -28.177526473999023, "global_step": 631259, "epoch": 7605} {"train_loss": -28.505939483642578, "global_step": 631260, "epoch": 7605} {"train_loss": -28.299549102783203, "global_step": 631261, "epoch": 7605} {"train_loss": -28.59095573425293, "global_step": 631262, "epoch": 7605} {"train_loss": -28.169015884399414, "global_step": 631263, "epoch": 7605} {"train_loss": -28.27521324157715, "global_step": 631264, "epoch": 7605} {"train_loss": -28.383859634399414, "global_step": 631265, "epoch": 7605} {"train_loss": -28.69892692565918, "global_step": 631266, "epoch": 7605} {"train_loss": -28.047163009643555, "global_step": 631267, "epoch": 7605} {"train_loss": -28.326574325561523, "global_step": 631268, "epoch": 7605} {"train_loss": -28.850671768188477, "global_step": 631269, "epoch": 7605} {"train_loss": -28.167139053344727, "global_step": 631270, "epoch": 7605} {"train_loss": -28.2749080657959, "global_step": 631271, "epoch": 7605} {"train_loss": -27.939985275268555, "global_step": 631272, "epoch": 7605} {"train_loss": -28.069721221923828, "global_step": 631273, "epoch": 7605} {"train_loss": -28.377973556518555, "global_step": 631274, "epoch": 7605} {"train_loss": -28.139022827148438, "global_step": 631275, "epoch": 7605} {"train_loss": -27.8591251373291, "global_step": 631276, "epoch": 7605} {"train_loss": -27.877405166625977, "global_step": 631277, "epoch": 7605} {"train_loss": -28.017303466796875, "global_step": 631278, "epoch": 7605} {"train_loss": -27.7769832611084, "global_step": 631279, "epoch": 7605} {"train_loss": -28.119678497314453, "global_step": 631280, "epoch": 7605} {"train_loss": -28.07805824279785, "global_step": 631281, "epoch": 7605} {"train_loss": -28.32171058654785, "global_step": 631282, "epoch": 7605} {"train_loss": -27.663177490234375, "global_step": 631283, "epoch": 7605} {"train_loss": -28.121713638305664, "global_step": 631284, "epoch": 7605} {"train_loss": -27.670276641845703, "global_step": 631285, "epoch": 7605} {"train_loss": -26.995197296142578, "global_step": 631286, "epoch": 7605} {"train_loss": -26.1041259765625, "global_step": 631287, "epoch": 7605} {"train_loss": -28.063125610351562, "global_step": 631288, "epoch": 7605} {"train_loss": -27.40177345275879, "global_step": 631289, "epoch": 7605} {"train_loss": -24.836078643798828, "global_step": 631290, "epoch": 7605} {"train_loss": -27.169769287109375, "global_step": 631291, "epoch": 7605} {"train_loss": -26.298969268798828, "global_step": 631292, "epoch": 7605} {"train_loss": -27.872547149658203, "global_step": 631293, "epoch": 7605} {"train_loss": -25.86053466796875, "global_step": 631294, "epoch": 7605} {"train_loss": -27.351057052612305, "global_step": 631295, "epoch": 7605} {"train_loss": -27.229053497314453, "global_step": 631296, "epoch": 7605} {"train_loss": -27.850841935858668, "global_step": 631297, "epoch": 7605, "val_loss": 6799881.5} {"train_loss": -26.331222534179688, "global_step": 631298, "epoch": 7606} {"train_loss": -27.16666603088379, "global_step": 631299, "epoch": 7606} {"train_loss": -26.015155792236328, "global_step": 631300, "epoch": 7606} {"train_loss": -26.79214859008789, "global_step": 631301, "epoch": 7606} {"train_loss": -27.0812931060791, "global_step": 631302, "epoch": 7606} {"train_loss": -26.915143966674805, "global_step": 631303, "epoch": 7606} {"train_loss": -26.681018829345703, "global_step": 631304, "epoch": 7606} {"train_loss": -26.785001754760742, "global_step": 631305, "epoch": 7606} {"train_loss": -26.551374435424805, "global_step": 631306, "epoch": 7606} {"train_loss": -27.192052841186523, "global_step": 631307, "epoch": 7606} {"train_loss": -27.1795597076416, "global_step": 631308, "epoch": 7606} {"train_loss": -26.821842193603516, "global_step": 631309, "epoch": 7606} {"train_loss": -26.981855392456055, "global_step": 631310, "epoch": 7606} {"train_loss": -27.34657096862793, "global_step": 631311, "epoch": 7606} {"train_loss": -27.208906173706055, "global_step": 631312, "epoch": 7606} {"train_loss": -27.382965087890625, "global_step": 631313, "epoch": 7606} {"train_loss": -27.16192054748535, "global_step": 631314, "epoch": 7606} {"train_loss": -26.9549560546875, "global_step": 631315, "epoch": 7606} {"train_loss": -27.344099044799805, "global_step": 631316, "epoch": 7606} {"train_loss": -27.689252853393555, "global_step": 631317, "epoch": 7606} {"train_loss": -27.34820556640625, "global_step": 631318, "epoch": 7606} {"train_loss": -27.64422035217285, "global_step": 631319, "epoch": 7606} {"train_loss": -27.165815353393555, "global_step": 631320, "epoch": 7606} {"train_loss": -28.102258682250977, "global_step": 631321, "epoch": 7606} {"train_loss": -27.16096305847168, "global_step": 631322, "epoch": 7606} {"train_loss": -27.76629066467285, "global_step": 631323, "epoch": 7606} {"train_loss": -28.001632690429688, "global_step": 631324, "epoch": 7606} {"train_loss": -27.62799644470215, "global_step": 631325, "epoch": 7606} {"train_loss": -28.135639190673828, "global_step": 631326, "epoch": 7606} {"train_loss": -27.7344913482666, "global_step": 631327, "epoch": 7606} {"train_loss": -28.1290283203125, "global_step": 631328, "epoch": 7606} {"train_loss": -27.560443878173828, "global_step": 631329, "epoch": 7606} {"train_loss": -28.067825317382812, "global_step": 631330, "epoch": 7606} {"train_loss": -28.055652618408203, "global_step": 631331, "epoch": 7606} {"train_loss": -28.072174072265625, "global_step": 631332, "epoch": 7606} {"train_loss": -27.687335968017578, "global_step": 631333, "epoch": 7606} {"train_loss": -28.01422119140625, "global_step": 631334, "epoch": 7606} {"train_loss": -28.519805908203125, "global_step": 631335, "epoch": 7606} {"train_loss": -27.779977798461914, "global_step": 631336, "epoch": 7606} {"train_loss": -28.048566818237305, "global_step": 631337, "epoch": 7606} {"train_loss": -28.184036254882812, "global_step": 631338, "epoch": 7606} {"train_loss": -27.821807861328125, "global_step": 631339, "epoch": 7606} {"train_loss": -28.40119743347168, "global_step": 631340, "epoch": 7606} {"train_loss": -28.06792640686035, "global_step": 631341, "epoch": 7606} {"train_loss": -28.37653160095215, "global_step": 631342, "epoch": 7606} {"train_loss": -28.127180099487305, "global_step": 631343, "epoch": 7606} {"train_loss": -28.0601749420166, "global_step": 631344, "epoch": 7606} {"train_loss": -28.083127975463867, "global_step": 631345, "epoch": 7606} {"train_loss": -27.9029541015625, "global_step": 631346, "epoch": 7606} {"train_loss": -28.058149337768555, "global_step": 631347, "epoch": 7606} {"train_loss": -28.29048728942871, "global_step": 631348, "epoch": 7606} {"train_loss": -28.297245025634766, "global_step": 631349, "epoch": 7606} {"train_loss": -27.777847290039062, "global_step": 631350, "epoch": 7606} {"train_loss": -28.33989906311035, "global_step": 631351, "epoch": 7606} {"train_loss": -28.3364315032959, "global_step": 631352, "epoch": 7606} {"train_loss": -28.264001846313477, "global_step": 631353, "epoch": 7606} {"train_loss": -28.086332321166992, "global_step": 631354, "epoch": 7606} {"train_loss": -28.425046920776367, "global_step": 631355, "epoch": 7606} {"train_loss": -28.098825454711914, "global_step": 631356, "epoch": 7606} {"train_loss": -28.373929977416992, "global_step": 631357, "epoch": 7606} {"train_loss": -28.204137802124023, "global_step": 631358, "epoch": 7606} {"train_loss": -27.952192306518555, "global_step": 631359, "epoch": 7606} {"train_loss": -28.649616241455078, "global_step": 631360, "epoch": 7606} {"train_loss": -28.191974639892578, "global_step": 631361, "epoch": 7606} {"train_loss": -28.5037899017334, "global_step": 631362, "epoch": 7606} {"train_loss": -28.111108779907227, "global_step": 631363, "epoch": 7606} {"train_loss": -27.757909774780273, "global_step": 631364, "epoch": 7606} {"train_loss": -26.18505859375, "global_step": 631365, "epoch": 7606} {"train_loss": -26.050479888916016, "global_step": 631366, "epoch": 7606} {"train_loss": -26.403928756713867, "global_step": 631367, "epoch": 7606} {"train_loss": -25.575937271118164, "global_step": 631368, "epoch": 7606} {"train_loss": -27.332075119018555, "global_step": 631369, "epoch": 7606} {"train_loss": -27.604679107666016, "global_step": 631370, "epoch": 7606} {"train_loss": -27.0721435546875, "global_step": 631371, "epoch": 7606} {"train_loss": -27.653833389282227, "global_step": 631372, "epoch": 7606} {"train_loss": -27.671667098999023, "global_step": 631373, "epoch": 7606} {"train_loss": -28.0004825592041, "global_step": 631374, "epoch": 7606} {"train_loss": -27.216928482055664, "global_step": 631375, "epoch": 7606} {"train_loss": -27.67340087890625, "global_step": 631376, "epoch": 7606} {"train_loss": -27.455610275268555, "global_step": 631377, "epoch": 7606} {"train_loss": -27.758224487304688, "global_step": 631378, "epoch": 7606} {"train_loss": -27.679346084594727, "global_step": 631379, "epoch": 7606} {"train_loss": -27.611370086669922, "global_step": 631380, "epoch": 7606, "val_loss": 6627157.0} {"train_loss": -27.48388671875, "global_step": 631381, "epoch": 7607} {"train_loss": -27.85715103149414, "global_step": 631382, "epoch": 7607} {"train_loss": -27.43672752380371, "global_step": 631383, "epoch": 7607} {"train_loss": -28.056859970092773, "global_step": 631384, "epoch": 7607} {"train_loss": -27.433027267456055, "global_step": 631385, "epoch": 7607} {"train_loss": -27.467029571533203, "global_step": 631386, "epoch": 7607} {"train_loss": -27.651952743530273, "global_step": 631387, "epoch": 7607} {"train_loss": -27.718496322631836, "global_step": 631388, "epoch": 7607} {"train_loss": -27.853769302368164, "global_step": 631389, "epoch": 7607} {"train_loss": -28.14117431640625, "global_step": 631390, "epoch": 7607} {"train_loss": -28.01350212097168, "global_step": 631391, "epoch": 7607} {"train_loss": -27.89076042175293, "global_step": 631392, "epoch": 7607} {"train_loss": -27.44362449645996, "global_step": 631393, "epoch": 7607} {"train_loss": -27.79279899597168, "global_step": 631394, "epoch": 7607} {"train_loss": -27.99148941040039, "global_step": 631395, "epoch": 7607} {"train_loss": -28.2605037689209, "global_step": 631396, "epoch": 7607} {"train_loss": -28.22690773010254, "global_step": 631397, "epoch": 7607} {"train_loss": -27.926044464111328, "global_step": 631398, "epoch": 7607} {"train_loss": -27.904855728149414, "global_step": 631399, "epoch": 7607} {"train_loss": -28.06292724609375, "global_step": 631400, "epoch": 7607} {"train_loss": -28.076032638549805, "global_step": 631401, "epoch": 7607} {"train_loss": -27.93470573425293, "global_step": 631402, "epoch": 7607} {"train_loss": -28.56884765625, "global_step": 631403, "epoch": 7607} {"train_loss": -27.88150978088379, "global_step": 631404, "epoch": 7607} {"train_loss": -27.961591720581055, "global_step": 631405, "epoch": 7607} {"train_loss": -28.635772705078125, "global_step": 631406, "epoch": 7607} {"train_loss": -28.39059829711914, "global_step": 631407, "epoch": 7607} {"train_loss": -28.26483726501465, "global_step": 631408, "epoch": 7607} {"train_loss": -27.9558048248291, "global_step": 631409, "epoch": 7607} {"train_loss": -28.02164649963379, "global_step": 631410, "epoch": 7607} {"train_loss": -28.263168334960938, "global_step": 631411, "epoch": 7607} {"train_loss": -28.22926902770996, "global_step": 631412, "epoch": 7607} {"train_loss": -28.26433753967285, "global_step": 631413, "epoch": 7607} {"train_loss": -28.473886489868164, "global_step": 631414, "epoch": 7607} {"train_loss": -28.10995864868164, "global_step": 631415, "epoch": 7607} {"train_loss": -28.07257652282715, "global_step": 631416, "epoch": 7607} {"train_loss": -28.267169952392578, "global_step": 631417, "epoch": 7607} {"train_loss": -28.542341232299805, "global_step": 631418, "epoch": 7607} {"train_loss": -27.959604263305664, "global_step": 631419, "epoch": 7607} {"train_loss": -28.459508895874023, "global_step": 631420, "epoch": 7607} {"train_loss": -28.366979598999023, "global_step": 631421, "epoch": 7607} {"train_loss": -28.490509033203125, "global_step": 631422, "epoch": 7607} {"train_loss": -28.655399322509766, "global_step": 631423, "epoch": 7607} {"train_loss": -28.230207443237305, "global_step": 631424, "epoch": 7607} {"train_loss": -28.242095947265625, "global_step": 631425, "epoch": 7607} {"train_loss": -28.28537940979004, "global_step": 631426, "epoch": 7607} {"train_loss": -28.664264678955078, "global_step": 631427, "epoch": 7607} {"train_loss": -28.389789581298828, "global_step": 631428, "epoch": 7607} {"train_loss": -28.447677612304688, "global_step": 631429, "epoch": 7607} {"train_loss": -28.236541748046875, "global_step": 631430, "epoch": 7607} {"train_loss": -28.35552406311035, "global_step": 631431, "epoch": 7607} {"train_loss": -28.364978790283203, "global_step": 631432, "epoch": 7607} {"train_loss": -28.41070556640625, "global_step": 631433, "epoch": 7607} {"train_loss": -28.424713134765625, "global_step": 631434, "epoch": 7607} {"train_loss": -28.67264175415039, "global_step": 631435, "epoch": 7607} {"train_loss": -28.49448585510254, "global_step": 631436, "epoch": 7607} {"train_loss": -28.326826095581055, "global_step": 631437, "epoch": 7607} {"train_loss": -28.435834884643555, "global_step": 631438, "epoch": 7607} {"train_loss": -28.373727798461914, "global_step": 631439, "epoch": 7607} {"train_loss": -28.76555824279785, "global_step": 631440, "epoch": 7607} {"train_loss": -28.286096572875977, "global_step": 631441, "epoch": 7607} {"train_loss": -28.466175079345703, "global_step": 631442, "epoch": 7607} {"train_loss": -28.610595703125, "global_step": 631443, "epoch": 7607} {"train_loss": -28.7159366607666, "global_step": 631444, "epoch": 7607} {"train_loss": -28.77202796936035, "global_step": 631445, "epoch": 7607} {"train_loss": -28.852888107299805, "global_step": 631446, "epoch": 7607} {"train_loss": -28.933658599853516, "global_step": 631447, "epoch": 7607} {"train_loss": -28.28464126586914, "global_step": 631448, "epoch": 7607} {"train_loss": -28.34657096862793, "global_step": 631449, "epoch": 7607} {"train_loss": -28.15984535217285, "global_step": 631450, "epoch": 7607} {"train_loss": -28.373825073242188, "global_step": 631451, "epoch": 7607} {"train_loss": -28.042898178100586, "global_step": 631452, "epoch": 7607} {"train_loss": -28.07960319519043, "global_step": 631453, "epoch": 7607} {"train_loss": -27.47419548034668, "global_step": 631454, "epoch": 7607} {"train_loss": -28.456247329711914, "global_step": 631455, "epoch": 7607} {"train_loss": -27.989151000976562, "global_step": 631456, "epoch": 7607} {"train_loss": -27.818744659423828, "global_step": 631457, "epoch": 7607} {"train_loss": -28.14771842956543, "global_step": 631458, "epoch": 7607} {"train_loss": -28.223058700561523, "global_step": 631459, "epoch": 7607} {"train_loss": -27.97129249572754, "global_step": 631460, "epoch": 7607} {"train_loss": -28.1982479095459, "global_step": 631461, "epoch": 7607} {"train_loss": -27.997943878173828, "global_step": 631462, "epoch": 7607} {"train_loss": -28.20096401995923, "global_step": 631463, "epoch": 7607, "val_loss": 6719968.0} {"train_loss": -27.03937339782715, "global_step": 631464, "epoch": 7608} {"train_loss": -26.625638961791992, "global_step": 631465, "epoch": 7608} {"train_loss": -27.938720703125, "global_step": 631466, "epoch": 7608} {"train_loss": -26.822885513305664, "global_step": 631467, "epoch": 7608} {"train_loss": -27.120874404907227, "global_step": 631468, "epoch": 7608} {"train_loss": -27.608129501342773, "global_step": 631469, "epoch": 7608} {"train_loss": -28.040098190307617, "global_step": 631470, "epoch": 7608} {"train_loss": -27.60637855529785, "global_step": 631471, "epoch": 7608} {"train_loss": -28.091537475585938, "global_step": 631472, "epoch": 7608} {"train_loss": -27.81694984436035, "global_step": 631473, "epoch": 7608} {"train_loss": -27.707128524780273, "global_step": 631474, "epoch": 7608} {"train_loss": -28.150146484375, "global_step": 631475, "epoch": 7608} {"train_loss": -27.557538986206055, "global_step": 631476, "epoch": 7608} {"train_loss": -27.869897842407227, "global_step": 631477, "epoch": 7608} {"train_loss": -28.06125259399414, "global_step": 631478, "epoch": 7608} {"train_loss": -28.028223037719727, "global_step": 631479, "epoch": 7608} {"train_loss": -28.05214500427246, "global_step": 631480, "epoch": 7608} {"train_loss": -28.048139572143555, "global_step": 631481, "epoch": 7608} {"train_loss": -27.732257843017578, "global_step": 631482, "epoch": 7608} {"train_loss": -27.876026153564453, "global_step": 631483, "epoch": 7608} {"train_loss": -28.3046817779541, "global_step": 631484, "epoch": 7608} {"train_loss": -28.09524917602539, "global_step": 631485, "epoch": 7608} {"train_loss": -28.2442626953125, "global_step": 631486, "epoch": 7608} {"train_loss": -28.12213706970215, "global_step": 631487, "epoch": 7608} {"train_loss": -28.107410430908203, "global_step": 631488, "epoch": 7608} {"train_loss": -28.25545310974121, "global_step": 631489, "epoch": 7608} {"train_loss": -28.38941764831543, "global_step": 631490, "epoch": 7608} {"train_loss": -28.358657836914062, "global_step": 631491, "epoch": 7608} {"train_loss": -28.091699600219727, "global_step": 631492, "epoch": 7608} {"train_loss": -28.376413345336914, "global_step": 631493, "epoch": 7608} {"train_loss": -28.139068603515625, "global_step": 631494, "epoch": 7608} {"train_loss": -28.2933349609375, "global_step": 631495, "epoch": 7608} {"train_loss": -28.444412231445312, "global_step": 631496, "epoch": 7608} {"train_loss": -28.3182373046875, "global_step": 631497, "epoch": 7608} {"train_loss": -28.17575454711914, "global_step": 631498, "epoch": 7608} {"train_loss": -28.06206703186035, "global_step": 631499, "epoch": 7608} {"train_loss": -28.423282623291016, "global_step": 631500, "epoch": 7608} {"train_loss": -28.297576904296875, "global_step": 631501, "epoch": 7608} {"train_loss": -28.543569564819336, "global_step": 631502, "epoch": 7608} {"train_loss": -28.407974243164062, "global_step": 631503, "epoch": 7608} {"train_loss": -28.29298210144043, "global_step": 631504, "epoch": 7608} {"train_loss": -28.114572525024414, "global_step": 631505, "epoch": 7608} {"train_loss": -28.783893585205078, "global_step": 631506, "epoch": 7608} {"train_loss": -28.308149337768555, "global_step": 631507, "epoch": 7608} {"train_loss": -28.255903244018555, "global_step": 631508, "epoch": 7608} {"train_loss": -28.325986862182617, "global_step": 631509, "epoch": 7608} {"train_loss": -28.190872192382812, "global_step": 631510, "epoch": 7608} {"train_loss": -28.279401779174805, "global_step": 631511, "epoch": 7608} {"train_loss": -28.426843643188477, "global_step": 631512, "epoch": 7608} {"train_loss": -28.306432723999023, "global_step": 631513, "epoch": 7608} {"train_loss": -28.254358291625977, "global_step": 631514, "epoch": 7608} {"train_loss": -28.253662109375, "global_step": 631515, "epoch": 7608} {"train_loss": -27.999927520751953, "global_step": 631516, "epoch": 7608} {"train_loss": -28.818775177001953, "global_step": 631517, "epoch": 7608} {"train_loss": -28.421051025390625, "global_step": 631518, "epoch": 7608} {"train_loss": -28.48707389831543, "global_step": 631519, "epoch": 7608} {"train_loss": -28.20503807067871, "global_step": 631520, "epoch": 7608} {"train_loss": -28.33935546875, "global_step": 631521, "epoch": 7608} {"train_loss": -28.3327693939209, "global_step": 631522, "epoch": 7608} {"train_loss": -28.450925827026367, "global_step": 631523, "epoch": 7608} {"train_loss": -28.486392974853516, "global_step": 631524, "epoch": 7608} {"train_loss": -28.594043731689453, "global_step": 631525, "epoch": 7608} {"train_loss": -28.433624267578125, "global_step": 631526, "epoch": 7608} {"train_loss": -28.418109893798828, "global_step": 631527, "epoch": 7608} {"train_loss": -28.20013427734375, "global_step": 631528, "epoch": 7608} {"train_loss": -28.234085083007812, "global_step": 631529, "epoch": 7608} {"train_loss": -27.906356811523438, "global_step": 631530, "epoch": 7608} {"train_loss": -28.139068603515625, "global_step": 631531, "epoch": 7608} {"train_loss": -28.291913986206055, "global_step": 631532, "epoch": 7608} {"train_loss": -28.390411376953125, "global_step": 631533, "epoch": 7608} {"train_loss": -28.393293380737305, "global_step": 631534, "epoch": 7608} {"train_loss": -28.179615020751953, "global_step": 631535, "epoch": 7608} {"train_loss": -27.84881591796875, "global_step": 631536, "epoch": 7608} {"train_loss": -28.285400390625, "global_step": 631537, "epoch": 7608} {"train_loss": -28.33579444885254, "global_step": 631538, "epoch": 7608} {"train_loss": -28.10589027404785, "global_step": 631539, "epoch": 7608} {"train_loss": -27.9462947845459, "global_step": 631540, "epoch": 7608} {"train_loss": -28.16815757751465, "global_step": 631541, "epoch": 7608} {"train_loss": -27.932479858398438, "global_step": 631542, "epoch": 7608} {"train_loss": -28.06354331970215, "global_step": 631543, "epoch": 7608} {"train_loss": -28.415546417236328, "global_step": 631544, "epoch": 7608} {"train_loss": -28.390533447265625, "global_step": 631545, "epoch": 7608} {"train_loss": -28.13797681877412, "global_step": 631546, "epoch": 7608, "val_loss": 6662547.0} {"train_loss": -28.17819595336914, "global_step": 631547, "epoch": 7609} {"train_loss": -27.920501708984375, "global_step": 631548, "epoch": 7609} {"train_loss": -27.693090438842773, "global_step": 631549, "epoch": 7609} {"train_loss": -27.927494049072266, "global_step": 631550, "epoch": 7609} {"train_loss": -28.122241973876953, "global_step": 631551, "epoch": 7609} {"train_loss": -28.027536392211914, "global_step": 631552, "epoch": 7609} {"train_loss": -28.112436294555664, "global_step": 631553, "epoch": 7609} {"train_loss": -28.54402732849121, "global_step": 631554, "epoch": 7609} {"train_loss": -27.9216251373291, "global_step": 631555, "epoch": 7609} {"train_loss": -27.96255874633789, "global_step": 631556, "epoch": 7609} {"train_loss": -28.023080825805664, "global_step": 631557, "epoch": 7609} {"train_loss": -27.876708984375, "global_step": 631558, "epoch": 7609} {"train_loss": -28.162860870361328, "global_step": 631559, "epoch": 7609} {"train_loss": -28.00739860534668, "global_step": 631560, "epoch": 7609} {"train_loss": -27.52863883972168, "global_step": 631561, "epoch": 7609} {"train_loss": -27.974365234375, "global_step": 631562, "epoch": 7609} {"train_loss": -27.774755477905273, "global_step": 631563, "epoch": 7609} {"train_loss": -27.829557418823242, "global_step": 631564, "epoch": 7609} {"train_loss": -28.16778564453125, "global_step": 631565, "epoch": 7609} {"train_loss": -28.24822998046875, "global_step": 631566, "epoch": 7609} {"train_loss": -28.066287994384766, "global_step": 631567, "epoch": 7609} {"train_loss": -28.058195114135742, "global_step": 631568, "epoch": 7609} {"train_loss": -28.18817138671875, "global_step": 631569, "epoch": 7609} {"train_loss": -28.324106216430664, "global_step": 631570, "epoch": 7609} {"train_loss": -28.197431564331055, "global_step": 631571, "epoch": 7609} {"train_loss": -28.317285537719727, "global_step": 631572, "epoch": 7609} {"train_loss": -28.424457550048828, "global_step": 631573, "epoch": 7609} {"train_loss": -28.0175724029541, "global_step": 631574, "epoch": 7609} {"train_loss": -28.470579147338867, "global_step": 631575, "epoch": 7609} {"train_loss": -28.439783096313477, "global_step": 631576, "epoch": 7609} {"train_loss": -28.43755531311035, "global_step": 631577, "epoch": 7609} {"train_loss": -28.483747482299805, "global_step": 631578, "epoch": 7609} {"train_loss": -28.332672119140625, "global_step": 631579, "epoch": 7609} {"train_loss": -28.716367721557617, "global_step": 631580, "epoch": 7609} {"train_loss": -28.15931510925293, "global_step": 631581, "epoch": 7609} {"train_loss": -28.128406524658203, "global_step": 631582, "epoch": 7609} {"train_loss": -28.382413864135742, "global_step": 631583, "epoch": 7609} {"train_loss": -28.299121856689453, "global_step": 631584, "epoch": 7609} {"train_loss": -28.42413330078125, "global_step": 631585, "epoch": 7609} {"train_loss": -28.055484771728516, "global_step": 631586, "epoch": 7609} {"train_loss": -28.298450469970703, "global_step": 631587, "epoch": 7609} {"train_loss": -28.242929458618164, "global_step": 631588, "epoch": 7609} {"train_loss": -28.20124626159668, "global_step": 631589, "epoch": 7609} {"train_loss": -28.175851821899414, "global_step": 631590, "epoch": 7609} {"train_loss": -28.394643783569336, "global_step": 631591, "epoch": 7609} {"train_loss": -28.26688003540039, "global_step": 631592, "epoch": 7609} {"train_loss": -28.509077072143555, "global_step": 631593, "epoch": 7609} {"train_loss": -28.501279830932617, "global_step": 631594, "epoch": 7609} {"train_loss": -28.456884384155273, "global_step": 631595, "epoch": 7609} {"train_loss": -28.217893600463867, "global_step": 631596, "epoch": 7609} {"train_loss": -28.00298500061035, "global_step": 631597, "epoch": 7609} {"train_loss": -27.898366928100586, "global_step": 631598, "epoch": 7609} {"train_loss": -27.9510498046875, "global_step": 631599, "epoch": 7609} {"train_loss": -28.30136489868164, "global_step": 631600, "epoch": 7609} {"train_loss": -27.85586929321289, "global_step": 631601, "epoch": 7609} {"train_loss": -27.859567642211914, "global_step": 631602, "epoch": 7609} {"train_loss": -28.214324951171875, "global_step": 631603, "epoch": 7609} {"train_loss": -28.225326538085938, "global_step": 631604, "epoch": 7609} {"train_loss": -27.938440322875977, "global_step": 631605, "epoch": 7609} {"train_loss": -28.5697021484375, "global_step": 631606, "epoch": 7609} {"train_loss": -28.213525772094727, "global_step": 631607, "epoch": 7609} {"train_loss": -27.9696044921875, "global_step": 631608, "epoch": 7609} {"train_loss": -28.3536376953125, "global_step": 631609, "epoch": 7609} {"train_loss": -27.92569923400879, "global_step": 631610, "epoch": 7609} {"train_loss": -27.150074005126953, "global_step": 631611, "epoch": 7609} {"train_loss": -27.87605857849121, "global_step": 631612, "epoch": 7609} {"train_loss": -27.371795654296875, "global_step": 631613, "epoch": 7609} {"train_loss": -27.133148193359375, "global_step": 631614, "epoch": 7609} {"train_loss": -28.075483322143555, "global_step": 631615, "epoch": 7609} {"train_loss": -28.106653213500977, "global_step": 631616, "epoch": 7609} {"train_loss": -27.802398681640625, "global_step": 631617, "epoch": 7609} {"train_loss": -27.774030685424805, "global_step": 631618, "epoch": 7609} {"train_loss": -27.88406753540039, "global_step": 631619, "epoch": 7609} {"train_loss": -28.119359970092773, "global_step": 631620, "epoch": 7609} {"train_loss": -28.1707820892334, "global_step": 631621, "epoch": 7609} {"train_loss": -27.960952758789062, "global_step": 631622, "epoch": 7609} {"train_loss": -27.702306747436523, "global_step": 631623, "epoch": 7609} {"train_loss": -28.170454025268555, "global_step": 631624, "epoch": 7609} {"train_loss": -28.140851974487305, "global_step": 631625, "epoch": 7609} {"train_loss": -27.696149826049805, "global_step": 631626, "epoch": 7609} {"train_loss": -28.3371639251709, "global_step": 631627, "epoch": 7609} {"train_loss": -28.313556671142578, "global_step": 631628, "epoch": 7609} {"train_loss": -28.093331854027436, "global_step": 631629, "epoch": 7609, "val_loss": 6744662.0} {"train_loss": -27.525283813476562, "global_step": 631630, "epoch": 7610} {"train_loss": -27.66182518005371, "global_step": 631631, "epoch": 7610} {"train_loss": -28.00638771057129, "global_step": 631632, "epoch": 7610} {"train_loss": -27.56056785583496, "global_step": 631633, "epoch": 7610} {"train_loss": -27.5581111907959, "global_step": 631634, "epoch": 7610} {"train_loss": -27.76863670349121, "global_step": 631635, "epoch": 7610} {"train_loss": -27.677820205688477, "global_step": 631636, "epoch": 7610} {"train_loss": -27.708417892456055, "global_step": 631637, "epoch": 7610} {"train_loss": -27.884510040283203, "global_step": 631638, "epoch": 7610} {"train_loss": -28.09576988220215, "global_step": 631639, "epoch": 7610} {"train_loss": -27.953372955322266, "global_step": 631640, "epoch": 7610} {"train_loss": -28.041717529296875, "global_step": 631641, "epoch": 7610} {"train_loss": -28.164106369018555, "global_step": 631642, "epoch": 7610} {"train_loss": -28.29817008972168, "global_step": 631643, "epoch": 7610} {"train_loss": -28.43085289001465, "global_step": 631644, "epoch": 7610} {"train_loss": -28.018085479736328, "global_step": 631645, "epoch": 7610} {"train_loss": -28.266427993774414, "global_step": 631646, "epoch": 7610} {"train_loss": -28.04561424255371, "global_step": 631647, "epoch": 7610} {"train_loss": -28.076644897460938, "global_step": 631648, "epoch": 7610} {"train_loss": -28.3040714263916, "global_step": 631649, "epoch": 7610} {"train_loss": -28.477981567382812, "global_step": 631650, "epoch": 7610} {"train_loss": -28.001218795776367, "global_step": 631651, "epoch": 7610} {"train_loss": -28.266483306884766, "global_step": 631652, "epoch": 7610} {"train_loss": -27.8706111907959, "global_step": 631653, "epoch": 7610} {"train_loss": -28.106252670288086, "global_step": 631654, "epoch": 7610} {"train_loss": -28.406213760375977, "global_step": 631655, "epoch": 7610} {"train_loss": -28.300647735595703, "global_step": 631656, "epoch": 7610} {"train_loss": -28.298566818237305, "global_step": 631657, "epoch": 7610} {"train_loss": -28.070648193359375, "global_step": 631658, "epoch": 7610} {"train_loss": -27.897571563720703, "global_step": 631659, "epoch": 7610} {"train_loss": -28.07258415222168, "global_step": 631660, "epoch": 7610} {"train_loss": -28.410871505737305, "global_step": 631661, "epoch": 7610} {"train_loss": -28.13331413269043, "global_step": 631662, "epoch": 7610} {"train_loss": -28.55018424987793, "global_step": 631663, "epoch": 7610} {"train_loss": -28.357629776000977, "global_step": 631664, "epoch": 7610} {"train_loss": -27.816162109375, "global_step": 631665, "epoch": 7610} {"train_loss": -28.533645629882812, "global_step": 631666, "epoch": 7610} {"train_loss": -28.14967155456543, "global_step": 631667, "epoch": 7610} {"train_loss": -28.410614013671875, "global_step": 631668, "epoch": 7610} {"train_loss": -28.334341049194336, "global_step": 631669, "epoch": 7610} {"train_loss": -28.361642837524414, "global_step": 631670, "epoch": 7610} {"train_loss": -28.5015811920166, "global_step": 631671, "epoch": 7610} {"train_loss": -28.17765235900879, "global_step": 631672, "epoch": 7610} {"train_loss": -28.319665908813477, "global_step": 631673, "epoch": 7610} {"train_loss": -28.558698654174805, "global_step": 631674, "epoch": 7610} {"train_loss": -28.17791748046875, "global_step": 631675, "epoch": 7610} {"train_loss": -28.277027130126953, "global_step": 631676, "epoch": 7610} {"train_loss": -27.637182235717773, "global_step": 631677, "epoch": 7610} {"train_loss": -27.62232780456543, "global_step": 631678, "epoch": 7610} {"train_loss": -28.2667293548584, "global_step": 631679, "epoch": 7610} {"train_loss": -28.518524169921875, "global_step": 631680, "epoch": 7610} {"train_loss": -27.90679359436035, "global_step": 631681, "epoch": 7610} {"train_loss": -27.8001708984375, "global_step": 631682, "epoch": 7610} {"train_loss": -28.107559204101562, "global_step": 631683, "epoch": 7610} {"train_loss": -28.29013442993164, "global_step": 631684, "epoch": 7610} {"train_loss": -28.220767974853516, "global_step": 631685, "epoch": 7610} {"train_loss": -28.0357723236084, "global_step": 631686, "epoch": 7610} {"train_loss": -27.87238121032715, "global_step": 631687, "epoch": 7610} {"train_loss": -27.722797393798828, "global_step": 631688, "epoch": 7610} {"train_loss": -28.228506088256836, "global_step": 631689, "epoch": 7610} {"train_loss": -28.047910690307617, "global_step": 631690, "epoch": 7610} {"train_loss": -28.39359474182129, "global_step": 631691, "epoch": 7610} {"train_loss": -28.08099365234375, "global_step": 631692, "epoch": 7610} {"train_loss": -28.182361602783203, "global_step": 631693, "epoch": 7610} {"train_loss": -28.39699363708496, "global_step": 631694, "epoch": 7610} {"train_loss": -27.788101196289062, "global_step": 631695, "epoch": 7610} {"train_loss": -28.27555274963379, "global_step": 631696, "epoch": 7610} {"train_loss": -28.121826171875, "global_step": 631697, "epoch": 7610} {"train_loss": -28.44269371032715, "global_step": 631698, "epoch": 7610} {"train_loss": -27.930994033813477, "global_step": 631699, "epoch": 7610} {"train_loss": -28.076038360595703, "global_step": 631700, "epoch": 7610} {"train_loss": -28.032485961914062, "global_step": 631701, "epoch": 7610} {"train_loss": -28.41196632385254, "global_step": 631702, "epoch": 7610} {"train_loss": -28.109039306640625, "global_step": 631703, "epoch": 7610} {"train_loss": -28.524005889892578, "global_step": 631704, "epoch": 7610} {"train_loss": -28.12151527404785, "global_step": 631705, "epoch": 7610} {"train_loss": -28.396543502807617, "global_step": 631706, "epoch": 7610} {"train_loss": -28.664813995361328, "global_step": 631707, "epoch": 7610} {"train_loss": -28.022916793823242, "global_step": 631708, "epoch": 7610} {"train_loss": -28.167495727539062, "global_step": 631709, "epoch": 7610} {"train_loss": -28.040998458862305, "global_step": 631710, "epoch": 7610} {"train_loss": -27.978254318237305, "global_step": 631711, "epoch": 7610} {"train_loss": -28.126946897391814, "global_step": 631712, "epoch": 7610, "val_loss": 6668263.0} {"train_loss": -28.203832626342773, "global_step": 631713, "epoch": 7611} {"train_loss": -28.02595329284668, "global_step": 631714, "epoch": 7611} {"train_loss": -28.407556533813477, "global_step": 631715, "epoch": 7611} {"train_loss": -28.229400634765625, "global_step": 631716, "epoch": 7611} {"train_loss": -28.083051681518555, "global_step": 631717, "epoch": 7611} {"train_loss": -28.526147842407227, "global_step": 631718, "epoch": 7611} {"train_loss": -28.035802841186523, "global_step": 631719, "epoch": 7611} {"train_loss": -28.46347427368164, "global_step": 631720, "epoch": 7611} {"train_loss": -28.405292510986328, "global_step": 631721, "epoch": 7611} {"train_loss": -28.220457077026367, "global_step": 631722, "epoch": 7611} {"train_loss": -27.828954696655273, "global_step": 631723, "epoch": 7611} {"train_loss": -27.97621726989746, "global_step": 631724, "epoch": 7611} {"train_loss": -28.093280792236328, "global_step": 631725, "epoch": 7611} {"train_loss": -28.4337215423584, "global_step": 631726, "epoch": 7611} {"train_loss": -28.406469345092773, "global_step": 631727, "epoch": 7611} {"train_loss": -28.25567626953125, "global_step": 631728, "epoch": 7611} {"train_loss": -27.825239181518555, "global_step": 631729, "epoch": 7611} {"train_loss": -27.99334716796875, "global_step": 631730, "epoch": 7611} {"train_loss": -27.244369506835938, "global_step": 631731, "epoch": 7611} {"train_loss": -27.824249267578125, "global_step": 631732, "epoch": 7611} {"train_loss": -27.89935874938965, "global_step": 631733, "epoch": 7611} {"train_loss": -28.009506225585938, "global_step": 631734, "epoch": 7611} {"train_loss": -28.271825790405273, "global_step": 631735, "epoch": 7611} {"train_loss": -28.210859298706055, "global_step": 631736, "epoch": 7611} {"train_loss": -28.183578491210938, "global_step": 631737, "epoch": 7611} {"train_loss": -28.171035766601562, "global_step": 631738, "epoch": 7611} {"train_loss": -27.97433853149414, "global_step": 631739, "epoch": 7611} {"train_loss": -28.112945556640625, "global_step": 631740, "epoch": 7611} {"train_loss": -28.09400749206543, "global_step": 631741, "epoch": 7611} {"train_loss": -28.41120719909668, "global_step": 631742, "epoch": 7611} {"train_loss": -28.093427658081055, "global_step": 631743, "epoch": 7611} {"train_loss": -28.66633415222168, "global_step": 631744, "epoch": 7611} {"train_loss": -28.592941284179688, "global_step": 631745, "epoch": 7611} {"train_loss": -28.158483505249023, "global_step": 631746, "epoch": 7611} {"train_loss": -28.49151039123535, "global_step": 631747, "epoch": 7611} {"train_loss": -28.3826847076416, "global_step": 631748, "epoch": 7611} {"train_loss": -28.53949546813965, "global_step": 631749, "epoch": 7611} {"train_loss": -28.145063400268555, "global_step": 631750, "epoch": 7611} {"train_loss": -28.249744415283203, "global_step": 631751, "epoch": 7611} {"train_loss": -28.2012882232666, "global_step": 631752, "epoch": 7611} {"train_loss": -28.26839256286621, "global_step": 631753, "epoch": 7611} {"train_loss": -28.413984298706055, "global_step": 631754, "epoch": 7611} {"train_loss": -28.318479537963867, "global_step": 631755, "epoch": 7611} {"train_loss": -28.491230010986328, "global_step": 631756, "epoch": 7611} {"train_loss": -28.344999313354492, "global_step": 631757, "epoch": 7611} {"train_loss": -28.227691650390625, "global_step": 631758, "epoch": 7611} {"train_loss": -28.226593017578125, "global_step": 631759, "epoch": 7611} {"train_loss": -28.043554306030273, "global_step": 631760, "epoch": 7611} {"train_loss": -28.487060546875, "global_step": 631761, "epoch": 7611} {"train_loss": -28.390106201171875, "global_step": 631762, "epoch": 7611} {"train_loss": -28.244400024414062, "global_step": 631763, "epoch": 7611} {"train_loss": -28.356857299804688, "global_step": 631764, "epoch": 7611} {"train_loss": -28.271961212158203, "global_step": 631765, "epoch": 7611} {"train_loss": -28.0465145111084, "global_step": 631766, "epoch": 7611} {"train_loss": -28.04896354675293, "global_step": 631767, "epoch": 7611} {"train_loss": -28.35100746154785, "global_step": 631768, "epoch": 7611} {"train_loss": -28.448719024658203, "global_step": 631769, "epoch": 7611} {"train_loss": -28.2496337890625, "global_step": 631770, "epoch": 7611} {"train_loss": -28.000354766845703, "global_step": 631771, "epoch": 7611} {"train_loss": -27.824743270874023, "global_step": 631772, "epoch": 7611} {"train_loss": -28.20606803894043, "global_step": 631773, "epoch": 7611} {"train_loss": -28.70074462890625, "global_step": 631774, "epoch": 7611} {"train_loss": -28.02094078063965, "global_step": 631775, "epoch": 7611} {"train_loss": -27.888126373291016, "global_step": 631776, "epoch": 7611} {"train_loss": -27.886890411376953, "global_step": 631777, "epoch": 7611} {"train_loss": -28.131855010986328, "global_step": 631778, "epoch": 7611} {"train_loss": -27.94285011291504, "global_step": 631779, "epoch": 7611} {"train_loss": -27.864364624023438, "global_step": 631780, "epoch": 7611} {"train_loss": -28.106342315673828, "global_step": 631781, "epoch": 7611} {"train_loss": -28.189498901367188, "global_step": 631782, "epoch": 7611} {"train_loss": -28.16632080078125, "global_step": 631783, "epoch": 7611} {"train_loss": -27.58584976196289, "global_step": 631784, "epoch": 7611} {"train_loss": -28.21290397644043, "global_step": 631785, "epoch": 7611} {"train_loss": -28.36519432067871, "global_step": 631786, "epoch": 7611} {"train_loss": -28.025699615478516, "global_step": 631787, "epoch": 7611} {"train_loss": -27.936086654663086, "global_step": 631788, "epoch": 7611} {"train_loss": -28.24065589904785, "global_step": 631789, "epoch": 7611} {"train_loss": -28.13564109802246, "global_step": 631790, "epoch": 7611} {"train_loss": -28.15625, "global_step": 631791, "epoch": 7611} {"train_loss": -28.3972225189209, "global_step": 631792, "epoch": 7611} {"train_loss": -27.910085678100586, "global_step": 631793, "epoch": 7611} {"train_loss": -27.7955322265625, "global_step": 631794, "epoch": 7611} {"train_loss": -28.17286955592144, "global_step": 631795, "epoch": 7611, "val_loss": 6761403.5} {"train_loss": -27.2452392578125, "global_step": 631796, "epoch": 7612} {"train_loss": -27.45481300354004, "global_step": 631797, "epoch": 7612} {"train_loss": -28.014307022094727, "global_step": 631798, "epoch": 7612} {"train_loss": -27.502960205078125, "global_step": 631799, "epoch": 7612} {"train_loss": -27.663211822509766, "global_step": 631800, "epoch": 7612} {"train_loss": -27.156137466430664, "global_step": 631801, "epoch": 7612} {"train_loss": -28.017364501953125, "global_step": 631802, "epoch": 7612} {"train_loss": -27.985279083251953, "global_step": 631803, "epoch": 7612} {"train_loss": -27.23370361328125, "global_step": 631804, "epoch": 7612} {"train_loss": -27.606958389282227, "global_step": 631805, "epoch": 7612} {"train_loss": -27.548208236694336, "global_step": 631806, "epoch": 7612} {"train_loss": -27.658567428588867, "global_step": 631807, "epoch": 7612} {"train_loss": -27.916461944580078, "global_step": 631808, "epoch": 7612} {"train_loss": -27.6109619140625, "global_step": 631809, "epoch": 7612} {"train_loss": -27.71754264831543, "global_step": 631810, "epoch": 7612} {"train_loss": -27.92608070373535, "global_step": 631811, "epoch": 7612} {"train_loss": -27.90485191345215, "global_step": 631812, "epoch": 7612} {"train_loss": -28.05946159362793, "global_step": 631813, "epoch": 7612} {"train_loss": -27.583398818969727, "global_step": 631814, "epoch": 7612} {"train_loss": -27.96619987487793, "global_step": 631815, "epoch": 7612} {"train_loss": -27.9417724609375, "global_step": 631816, "epoch": 7612} {"train_loss": -28.00908851623535, "global_step": 631817, "epoch": 7612} {"train_loss": -27.9869384765625, "global_step": 631818, "epoch": 7612} {"train_loss": -27.865304946899414, "global_step": 631819, "epoch": 7612} {"train_loss": -27.8918399810791, "global_step": 631820, "epoch": 7612} {"train_loss": -27.787534713745117, "global_step": 631821, "epoch": 7612} {"train_loss": -28.286359786987305, "global_step": 631822, "epoch": 7612} {"train_loss": -27.7542724609375, "global_step": 631823, "epoch": 7612} {"train_loss": -28.055837631225586, "global_step": 631824, "epoch": 7612} {"train_loss": -28.076791763305664, "global_step": 631825, "epoch": 7612} {"train_loss": -28.060577392578125, "global_step": 631826, "epoch": 7612} {"train_loss": -27.891809463500977, "global_step": 631827, "epoch": 7612} {"train_loss": -28.078855514526367, "global_step": 631828, "epoch": 7612} {"train_loss": -28.045068740844727, "global_step": 631829, "epoch": 7612} {"train_loss": -28.568134307861328, "global_step": 631830, "epoch": 7612} {"train_loss": -27.888212203979492, "global_step": 631831, "epoch": 7612} {"train_loss": -28.233144760131836, "global_step": 631832, "epoch": 7612} {"train_loss": -28.100543975830078, "global_step": 631833, "epoch": 7612} {"train_loss": -28.046695709228516, "global_step": 631834, "epoch": 7612} {"train_loss": -28.4112548828125, "global_step": 631835, "epoch": 7612} {"train_loss": -28.1176700592041, "global_step": 631836, "epoch": 7612} {"train_loss": -28.433380126953125, "global_step": 631837, "epoch": 7612} {"train_loss": -28.111591339111328, "global_step": 631838, "epoch": 7612} {"train_loss": -27.92437744140625, "global_step": 631839, "epoch": 7612} {"train_loss": -28.45954704284668, "global_step": 631840, "epoch": 7612} {"train_loss": -28.371780395507812, "global_step": 631841, "epoch": 7612} {"train_loss": -28.02887535095215, "global_step": 631842, "epoch": 7612} {"train_loss": -28.532867431640625, "global_step": 631843, "epoch": 7612} {"train_loss": -28.184452056884766, "global_step": 631844, "epoch": 7612} {"train_loss": -28.04874610900879, "global_step": 631845, "epoch": 7612} {"train_loss": -28.45197105407715, "global_step": 631846, "epoch": 7612} {"train_loss": -28.31195068359375, "global_step": 631847, "epoch": 7612} {"train_loss": -28.054922103881836, "global_step": 631848, "epoch": 7612} {"train_loss": -28.1323299407959, "global_step": 631849, "epoch": 7612} {"train_loss": -28.152027130126953, "global_step": 631850, "epoch": 7612} {"train_loss": -28.802534103393555, "global_step": 631851, "epoch": 7612} {"train_loss": -28.736835479736328, "global_step": 631852, "epoch": 7612} {"train_loss": -28.185317993164062, "global_step": 631853, "epoch": 7612} {"train_loss": -28.168094635009766, "global_step": 631854, "epoch": 7612} {"train_loss": -27.792367935180664, "global_step": 631855, "epoch": 7612} {"train_loss": -27.293928146362305, "global_step": 631856, "epoch": 7612} {"train_loss": -27.610631942749023, "global_step": 631857, "epoch": 7612} {"train_loss": -27.828454971313477, "global_step": 631858, "epoch": 7612} {"train_loss": -28.610950469970703, "global_step": 631859, "epoch": 7612} {"train_loss": -28.577136993408203, "global_step": 631860, "epoch": 7612} {"train_loss": -28.350299835205078, "global_step": 631861, "epoch": 7612} {"train_loss": -28.118274688720703, "global_step": 631862, "epoch": 7612} {"train_loss": -28.11402702331543, "global_step": 631863, "epoch": 7612} {"train_loss": -27.635725021362305, "global_step": 631864, "epoch": 7612} {"train_loss": -28.451154708862305, "global_step": 631865, "epoch": 7612} {"train_loss": -28.082412719726562, "global_step": 631866, "epoch": 7612} {"train_loss": -28.5816650390625, "global_step": 631867, "epoch": 7612} {"train_loss": -27.987512588500977, "global_step": 631868, "epoch": 7612} {"train_loss": -28.342029571533203, "global_step": 631869, "epoch": 7612} {"train_loss": -28.188434600830078, "global_step": 631870, "epoch": 7612} {"train_loss": -28.79328727722168, "global_step": 631871, "epoch": 7612} {"train_loss": -28.461048126220703, "global_step": 631872, "epoch": 7612} {"train_loss": -28.322132110595703, "global_step": 631873, "epoch": 7612} {"train_loss": -28.527448654174805, "global_step": 631874, "epoch": 7612} {"train_loss": -28.477386474609375, "global_step": 631875, "epoch": 7612} {"train_loss": -28.384246826171875, "global_step": 631876, "epoch": 7612} {"train_loss": -28.038299560546875, "global_step": 631877, "epoch": 7612} {"train_loss": -28.05346445290439, "global_step": 631878, "epoch": 7612, "val_loss": 6697325.0} {"train_loss": -27.751266479492188, "global_step": 631879, "epoch": 7613} {"train_loss": -28.06525230407715, "global_step": 631880, "epoch": 7613} {"train_loss": -27.700536727905273, "global_step": 631881, "epoch": 7613} {"train_loss": -27.611860275268555, "global_step": 631882, "epoch": 7613} {"train_loss": -27.74200439453125, "global_step": 631883, "epoch": 7613} {"train_loss": -28.12409019470215, "global_step": 631884, "epoch": 7613} {"train_loss": -28.229318618774414, "global_step": 631885, "epoch": 7613} {"train_loss": -27.550506591796875, "global_step": 631886, "epoch": 7613} {"train_loss": -27.849279403686523, "global_step": 631887, "epoch": 7613} {"train_loss": -28.104999542236328, "global_step": 631888, "epoch": 7613} {"train_loss": -27.815048217773438, "global_step": 631889, "epoch": 7613} {"train_loss": -27.260879516601562, "global_step": 631890, "epoch": 7613} {"train_loss": -27.67283058166504, "global_step": 631891, "epoch": 7613} {"train_loss": -27.93049430847168, "global_step": 631892, "epoch": 7613} {"train_loss": -27.599872589111328, "global_step": 631893, "epoch": 7613} {"train_loss": -27.702138900756836, "global_step": 631894, "epoch": 7613} {"train_loss": -28.139617919921875, "global_step": 631895, "epoch": 7613} {"train_loss": -28.0169677734375, "global_step": 631896, "epoch": 7613} {"train_loss": -27.645597457885742, "global_step": 631897, "epoch": 7613} {"train_loss": -27.449604034423828, "global_step": 631898, "epoch": 7613} {"train_loss": -28.060260772705078, "global_step": 631899, "epoch": 7613} {"train_loss": -27.89200782775879, "global_step": 631900, "epoch": 7613} {"train_loss": -27.8116455078125, "global_step": 631901, "epoch": 7613} {"train_loss": -27.39472007751465, "global_step": 631902, "epoch": 7613} {"train_loss": -28.0953311920166, "global_step": 631903, "epoch": 7613} {"train_loss": -27.433435440063477, "global_step": 631904, "epoch": 7613} {"train_loss": -28.41552734375, "global_step": 631905, "epoch": 7613} {"train_loss": -27.758773803710938, "global_step": 631906, "epoch": 7613} {"train_loss": -27.762527465820312, "global_step": 631907, "epoch": 7613} {"train_loss": -27.824432373046875, "global_step": 631908, "epoch": 7613} {"train_loss": -27.73093605041504, "global_step": 631909, "epoch": 7613} {"train_loss": -28.546863555908203, "global_step": 631910, "epoch": 7613} {"train_loss": -27.66749382019043, "global_step": 631911, "epoch": 7613} {"train_loss": -27.754993438720703, "global_step": 631912, "epoch": 7613} {"train_loss": -27.926605224609375, "global_step": 631913, "epoch": 7613} {"train_loss": -27.98467445373535, "global_step": 631914, "epoch": 7613} {"train_loss": -28.3606014251709, "global_step": 631915, "epoch": 7613} {"train_loss": -28.1920108795166, "global_step": 631916, "epoch": 7613} {"train_loss": -27.95844841003418, "global_step": 631917, "epoch": 7613} {"train_loss": -28.084806442260742, "global_step": 631918, "epoch": 7613} {"train_loss": -28.603073120117188, "global_step": 631919, "epoch": 7613} {"train_loss": -28.168643951416016, "global_step": 631920, "epoch": 7613} {"train_loss": -28.3527774810791, "global_step": 631921, "epoch": 7613} {"train_loss": -28.436466217041016, "global_step": 631922, "epoch": 7613} {"train_loss": -28.468168258666992, "global_step": 631923, "epoch": 7613} {"train_loss": -28.353687286376953, "global_step": 631924, "epoch": 7613} {"train_loss": -28.26252555847168, "global_step": 631925, "epoch": 7613} {"train_loss": -28.212553024291992, "global_step": 631926, "epoch": 7613} {"train_loss": -28.466083526611328, "global_step": 631927, "epoch": 7613} {"train_loss": -28.48872184753418, "global_step": 631928, "epoch": 7613} {"train_loss": -28.509552001953125, "global_step": 631929, "epoch": 7613} {"train_loss": -28.386432647705078, "global_step": 631930, "epoch": 7613} {"train_loss": -28.54107093811035, "global_step": 631931, "epoch": 7613} {"train_loss": -28.491260528564453, "global_step": 631932, "epoch": 7613} {"train_loss": -28.396759033203125, "global_step": 631933, "epoch": 7613} {"train_loss": -28.442617416381836, "global_step": 631934, "epoch": 7613} {"train_loss": -28.600452423095703, "global_step": 631935, "epoch": 7613} {"train_loss": -28.528898239135742, "global_step": 631936, "epoch": 7613} {"train_loss": -28.692096710205078, "global_step": 631937, "epoch": 7613} {"train_loss": -28.464441299438477, "global_step": 631938, "epoch": 7613} {"train_loss": -28.485803604125977, "global_step": 631939, "epoch": 7613} {"train_loss": -28.349294662475586, "global_step": 631940, "epoch": 7613} {"train_loss": -28.152612686157227, "global_step": 631941, "epoch": 7613} {"train_loss": -28.51923942565918, "global_step": 631942, "epoch": 7613} {"train_loss": -28.61545181274414, "global_step": 631943, "epoch": 7613} {"train_loss": -28.37306785583496, "global_step": 631944, "epoch": 7613} {"train_loss": -28.376270294189453, "global_step": 631945, "epoch": 7613} {"train_loss": -28.62605857849121, "global_step": 631946, "epoch": 7613} {"train_loss": -28.53717041015625, "global_step": 631947, "epoch": 7613} {"train_loss": -28.076181411743164, "global_step": 631948, "epoch": 7613} {"train_loss": -28.577604293823242, "global_step": 631949, "epoch": 7613} {"train_loss": -28.12957763671875, "global_step": 631950, "epoch": 7613} {"train_loss": -27.653284072875977, "global_step": 631951, "epoch": 7613} {"train_loss": -28.021177291870117, "global_step": 631952, "epoch": 7613} {"train_loss": -28.347135543823242, "global_step": 631953, "epoch": 7613} {"train_loss": -28.056676864624023, "global_step": 631954, "epoch": 7613} {"train_loss": -27.87091064453125, "global_step": 631955, "epoch": 7613} {"train_loss": -27.857370376586914, "global_step": 631956, "epoch": 7613} {"train_loss": -27.91776466369629, "global_step": 631957, "epoch": 7613} {"train_loss": -28.121707916259766, "global_step": 631958, "epoch": 7613} {"train_loss": -28.17306900024414, "global_step": 631959, "epoch": 7613} {"train_loss": -28.309682846069336, "global_step": 631960, "epoch": 7613} {"train_loss": -28.114597228636224, "global_step": 631961, "epoch": 7613, "val_loss": 6593842.0} {"train_loss": -27.044958114624023, "global_step": 631962, "epoch": 7614} {"train_loss": -27.123441696166992, "global_step": 631963, "epoch": 7614} {"train_loss": -26.6507568359375, "global_step": 631964, "epoch": 7614} {"train_loss": -26.802953720092773, "global_step": 631965, "epoch": 7614} {"train_loss": -26.849706649780273, "global_step": 631966, "epoch": 7614} {"train_loss": -27.11494255065918, "global_step": 631967, "epoch": 7614} {"train_loss": -27.165739059448242, "global_step": 631968, "epoch": 7614} {"train_loss": -26.950956344604492, "global_step": 631969, "epoch": 7614} {"train_loss": -27.11982536315918, "global_step": 631970, "epoch": 7614} {"train_loss": -27.907541275024414, "global_step": 631971, "epoch": 7614} {"train_loss": -27.225479125976562, "global_step": 631972, "epoch": 7614} {"train_loss": -27.357763290405273, "global_step": 631973, "epoch": 7614} {"train_loss": -27.53036880493164, "global_step": 631974, "epoch": 7614} {"train_loss": -27.64286231994629, "global_step": 631975, "epoch": 7614} {"train_loss": -27.554458618164062, "global_step": 631976, "epoch": 7614} {"train_loss": -27.947223663330078, "global_step": 631977, "epoch": 7614} {"train_loss": -27.808746337890625, "global_step": 631978, "epoch": 7614} {"train_loss": -27.544591903686523, "global_step": 631979, "epoch": 7614} {"train_loss": -28.060749053955078, "global_step": 631980, "epoch": 7614} {"train_loss": -27.89813232421875, "global_step": 631981, "epoch": 7614} {"train_loss": -28.115121841430664, "global_step": 631982, "epoch": 7614} {"train_loss": -27.996545791625977, "global_step": 631983, "epoch": 7614} {"train_loss": -27.633716583251953, "global_step": 631984, "epoch": 7614} {"train_loss": -27.9762020111084, "global_step": 631985, "epoch": 7614} {"train_loss": -28.020544052124023, "global_step": 631986, "epoch": 7614} {"train_loss": -28.194921493530273, "global_step": 631987, "epoch": 7614} {"train_loss": -28.207014083862305, "global_step": 631988, "epoch": 7614} {"train_loss": -27.98775291442871, "global_step": 631989, "epoch": 7614} {"train_loss": -28.10318946838379, "global_step": 631990, "epoch": 7614} {"train_loss": -28.28407096862793, "global_step": 631991, "epoch": 7614} {"train_loss": -28.01484489440918, "global_step": 631992, "epoch": 7614} {"train_loss": -28.272607803344727, "global_step": 631993, "epoch": 7614} {"train_loss": -28.108816146850586, "global_step": 631994, "epoch": 7614} {"train_loss": -28.266101837158203, "global_step": 631995, "epoch": 7614} {"train_loss": -27.944807052612305, "global_step": 631996, "epoch": 7614} {"train_loss": -28.230939865112305, "global_step": 631997, "epoch": 7614} {"train_loss": -27.925323486328125, "global_step": 631998, "epoch": 7614} {"train_loss": -27.8839111328125, "global_step": 631999, "epoch": 7614} {"train_loss": -27.42853355407715, "global_step": 632000, "epoch": 7614} {"train_loss": -27.84673500061035, "global_step": 632001, "epoch": 7614} {"train_loss": -27.93751335144043, "global_step": 632002, "epoch": 7614} {"train_loss": -28.184783935546875, "global_step": 632003, "epoch": 7614} {"train_loss": -27.575180053710938, "global_step": 632004, "epoch": 7614} {"train_loss": -28.101093292236328, "global_step": 632005, "epoch": 7614} {"train_loss": -28.176223754882812, "global_step": 632006, "epoch": 7614} {"train_loss": -28.246301651000977, "global_step": 632007, "epoch": 7614} {"train_loss": -27.78602409362793, "global_step": 632008, "epoch": 7614} {"train_loss": -28.361047744750977, "global_step": 632009, "epoch": 7614} {"train_loss": -27.751672744750977, "global_step": 632010, "epoch": 7614} {"train_loss": -28.128767013549805, "global_step": 632011, "epoch": 7614} {"train_loss": -28.498920440673828, "global_step": 632012, "epoch": 7614} {"train_loss": -27.960538864135742, "global_step": 632013, "epoch": 7614} {"train_loss": -28.408935546875, "global_step": 632014, "epoch": 7614} {"train_loss": -28.622037887573242, "global_step": 632015, "epoch": 7614} {"train_loss": -28.2564697265625, "global_step": 632016, "epoch": 7614} {"train_loss": -28.610647201538086, "global_step": 632017, "epoch": 7614} {"train_loss": -28.475393295288086, "global_step": 632018, "epoch": 7614} {"train_loss": -28.1512451171875, "global_step": 632019, "epoch": 7614} {"train_loss": -28.245960235595703, "global_step": 632020, "epoch": 7614} {"train_loss": -28.23908805847168, "global_step": 632021, "epoch": 7614} {"train_loss": -28.04741859436035, "global_step": 632022, "epoch": 7614} {"train_loss": -28.34604835510254, "global_step": 632023, "epoch": 7614} {"train_loss": -28.010223388671875, "global_step": 632024, "epoch": 7614} {"train_loss": -28.253149032592773, "global_step": 632025, "epoch": 7614} {"train_loss": -28.37225914001465, "global_step": 632026, "epoch": 7614} {"train_loss": -27.8143310546875, "global_step": 632027, "epoch": 7614} {"train_loss": -27.876922607421875, "global_step": 632028, "epoch": 7614} {"train_loss": -28.02753257751465, "global_step": 632029, "epoch": 7614} {"train_loss": -28.356693267822266, "global_step": 632030, "epoch": 7614} {"train_loss": -28.244770050048828, "global_step": 632031, "epoch": 7614} {"train_loss": -27.9635066986084, "global_step": 632032, "epoch": 7614} {"train_loss": -27.87434196472168, "global_step": 632033, "epoch": 7614} {"train_loss": -28.191635131835938, "global_step": 632034, "epoch": 7614} {"train_loss": -28.408552169799805, "global_step": 632035, "epoch": 7614} {"train_loss": -28.1025447845459, "global_step": 632036, "epoch": 7614} {"train_loss": -28.530078887939453, "global_step": 632037, "epoch": 7614} {"train_loss": -28.570714950561523, "global_step": 632038, "epoch": 7614} {"train_loss": -27.72798728942871, "global_step": 632039, "epoch": 7614} {"train_loss": -28.048810958862305, "global_step": 632040, "epoch": 7614} {"train_loss": -28.255029678344727, "global_step": 632041, "epoch": 7614} {"train_loss": -28.23443603515625, "global_step": 632042, "epoch": 7614} {"train_loss": -28.498218536376953, "global_step": 632043, "epoch": 7614} {"train_loss": -27.946831530835254, "global_step": 632044, "epoch": 7614, "val_loss": 7011432.0} {"train_loss": -27.85031509399414, "global_step": 632045, "epoch": 7615} {"train_loss": -27.802997589111328, "global_step": 632046, "epoch": 7615} {"train_loss": -27.6404972076416, "global_step": 632047, "epoch": 7615} {"train_loss": -27.97186279296875, "global_step": 632048, "epoch": 7615} {"train_loss": -28.316333770751953, "global_step": 632049, "epoch": 7615} {"train_loss": -27.705707550048828, "global_step": 632050, "epoch": 7615} {"train_loss": -27.4787540435791, "global_step": 632051, "epoch": 7615} {"train_loss": -28.399457931518555, "global_step": 632052, "epoch": 7615} {"train_loss": -28.28253173828125, "global_step": 632053, "epoch": 7615} {"train_loss": -27.7777156829834, "global_step": 632054, "epoch": 7615} {"train_loss": -27.4213809967041, "global_step": 632055, "epoch": 7615} {"train_loss": -28.356475830078125, "global_step": 632056, "epoch": 7615} {"train_loss": -27.9305362701416, "global_step": 632057, "epoch": 7615} {"train_loss": -27.8725643157959, "global_step": 632058, "epoch": 7615} {"train_loss": -27.807722091674805, "global_step": 632059, "epoch": 7615} {"train_loss": -28.251489639282227, "global_step": 632060, "epoch": 7615} {"train_loss": -28.063404083251953, "global_step": 632061, "epoch": 7615} {"train_loss": -27.996280670166016, "global_step": 632062, "epoch": 7615} {"train_loss": -27.6439151763916, "global_step": 632063, "epoch": 7615} {"train_loss": -27.98233413696289, "global_step": 632064, "epoch": 7615} {"train_loss": -28.009246826171875, "global_step": 632065, "epoch": 7615} {"train_loss": -27.67774772644043, "global_step": 632066, "epoch": 7615} {"train_loss": -28.241559982299805, "global_step": 632067, "epoch": 7615} {"train_loss": -28.084192276000977, "global_step": 632068, "epoch": 7615} {"train_loss": -28.390310287475586, "global_step": 632069, "epoch": 7615} {"train_loss": -28.121179580688477, "global_step": 632070, "epoch": 7615} {"train_loss": -27.706632614135742, "global_step": 632071, "epoch": 7615} {"train_loss": -28.357757568359375, "global_step": 632072, "epoch": 7615} {"train_loss": -28.055761337280273, "global_step": 632073, "epoch": 7615} {"train_loss": -28.174081802368164, "global_step": 632074, "epoch": 7615} {"train_loss": -27.73017692565918, "global_step": 632075, "epoch": 7615} {"train_loss": -28.277196884155273, "global_step": 632076, "epoch": 7615} {"train_loss": -28.44803237915039, "global_step": 632077, "epoch": 7615} {"train_loss": -28.23325538635254, "global_step": 632078, "epoch": 7615} {"train_loss": -28.23273277282715, "global_step": 632079, "epoch": 7615} {"train_loss": -28.0936336517334, "global_step": 632080, "epoch": 7615} {"train_loss": -28.27703285217285, "global_step": 632081, "epoch": 7615} {"train_loss": -28.306049346923828, "global_step": 632082, "epoch": 7615} {"train_loss": -28.416685104370117, "global_step": 632083, "epoch": 7615} {"train_loss": -28.01779556274414, "global_step": 632084, "epoch": 7615} {"train_loss": -28.44712257385254, "global_step": 632085, "epoch": 7615} {"train_loss": -28.05972671508789, "global_step": 632086, "epoch": 7615} {"train_loss": -28.32390785217285, "global_step": 632087, "epoch": 7615} {"train_loss": -28.61762809753418, "global_step": 632088, "epoch": 7615} {"train_loss": -28.528066635131836, "global_step": 632089, "epoch": 7615} {"train_loss": -28.160816192626953, "global_step": 632090, "epoch": 7615} {"train_loss": -28.12909507751465, "global_step": 632091, "epoch": 7615} {"train_loss": -28.727783203125, "global_step": 632092, "epoch": 7615} {"train_loss": -28.335391998291016, "global_step": 632093, "epoch": 7615} {"train_loss": -28.260822296142578, "global_step": 632094, "epoch": 7615} {"train_loss": -28.128591537475586, "global_step": 632095, "epoch": 7615} {"train_loss": -28.317005157470703, "global_step": 632096, "epoch": 7615} {"train_loss": -28.75910758972168, "global_step": 632097, "epoch": 7615} {"train_loss": -28.597143173217773, "global_step": 632098, "epoch": 7615} {"train_loss": -28.131383895874023, "global_step": 632099, "epoch": 7615} {"train_loss": -28.141523361206055, "global_step": 632100, "epoch": 7615} {"train_loss": -28.451923370361328, "global_step": 632101, "epoch": 7615} {"train_loss": -28.4801025390625, "global_step": 632102, "epoch": 7615} {"train_loss": -28.091344833374023, "global_step": 632103, "epoch": 7615} {"train_loss": -28.31781005859375, "global_step": 632104, "epoch": 7615} {"train_loss": -28.293548583984375, "global_step": 632105, "epoch": 7615} {"train_loss": -27.765588760375977, "global_step": 632106, "epoch": 7615} {"train_loss": -26.829675674438477, "global_step": 632107, "epoch": 7615} {"train_loss": -27.7685546875, "global_step": 632108, "epoch": 7615} {"train_loss": -28.213842391967773, "global_step": 632109, "epoch": 7615} {"train_loss": -27.543237686157227, "global_step": 632110, "epoch": 7615} {"train_loss": -27.985132217407227, "global_step": 632111, "epoch": 7615} {"train_loss": -28.16057777404785, "global_step": 632112, "epoch": 7615} {"train_loss": -28.333087921142578, "global_step": 632113, "epoch": 7615} {"train_loss": -28.393665313720703, "global_step": 632114, "epoch": 7615} {"train_loss": -28.13678550720215, "global_step": 632115, "epoch": 7615} {"train_loss": -27.3636474609375, "global_step": 632116, "epoch": 7615} {"train_loss": -26.227807998657227, "global_step": 632117, "epoch": 7615} {"train_loss": -23.90419578552246, "global_step": 632118, "epoch": 7615} {"train_loss": -25.0313663482666, "global_step": 632119, "epoch": 7615} {"train_loss": -28.07535743713379, "global_step": 632120, "epoch": 7615} {"train_loss": -26.57547950744629, "global_step": 632121, "epoch": 7615} {"train_loss": -27.42732810974121, "global_step": 632122, "epoch": 7615} {"train_loss": -26.992645263671875, "global_step": 632123, "epoch": 7615} {"train_loss": -27.956573486328125, "global_step": 632124, "epoch": 7615} {"train_loss": -26.980253219604492, "global_step": 632125, "epoch": 7615} {"train_loss": -27.85956382751465, "global_step": 632126, "epoch": 7615} {"train_loss": -27.927448778267365, "global_step": 632127, "epoch": 7615, "val_loss": 6989483.0} {"train_loss": -27.215747833251953, "global_step": 632128, "epoch": 7616} {"train_loss": -27.624731063842773, "global_step": 632129, "epoch": 7616} {"train_loss": -27.0194034576416, "global_step": 632130, "epoch": 7616} {"train_loss": -26.92976951599121, "global_step": 632131, "epoch": 7616} {"train_loss": -27.411636352539062, "global_step": 632132, "epoch": 7616} {"train_loss": -27.065771102905273, "global_step": 632133, "epoch": 7616} {"train_loss": -27.3149356842041, "global_step": 632134, "epoch": 7616} {"train_loss": -27.457258224487305, "global_step": 632135, "epoch": 7616} {"train_loss": -27.409778594970703, "global_step": 632136, "epoch": 7616} {"train_loss": -26.443281173706055, "global_step": 632137, "epoch": 7616} {"train_loss": -27.686670303344727, "global_step": 632138, "epoch": 7616} {"train_loss": -27.2197265625, "global_step": 632139, "epoch": 7616} {"train_loss": -27.292755126953125, "global_step": 632140, "epoch": 7616} {"train_loss": -27.587278366088867, "global_step": 632141, "epoch": 7616} {"train_loss": -27.71347427368164, "global_step": 632142, "epoch": 7616} {"train_loss": -27.784574508666992, "global_step": 632143, "epoch": 7616} {"train_loss": -27.744190216064453, "global_step": 632144, "epoch": 7616} {"train_loss": -27.947437286376953, "global_step": 632145, "epoch": 7616} {"train_loss": -27.842456817626953, "global_step": 632146, "epoch": 7616} {"train_loss": -27.740875244140625, "global_step": 632147, "epoch": 7616} {"train_loss": -28.009565353393555, "global_step": 632148, "epoch": 7616} {"train_loss": -27.966291427612305, "global_step": 632149, "epoch": 7616} {"train_loss": -27.8971004486084, "global_step": 632150, "epoch": 7616} {"train_loss": -28.113859176635742, "global_step": 632151, "epoch": 7616} {"train_loss": -27.961240768432617, "global_step": 632152, "epoch": 7616} {"train_loss": -27.960412979125977, "global_step": 632153, "epoch": 7616} {"train_loss": -27.801828384399414, "global_step": 632154, "epoch": 7616} {"train_loss": -28.037214279174805, "global_step": 632155, "epoch": 7616} {"train_loss": -27.91322135925293, "global_step": 632156, "epoch": 7616} {"train_loss": -28.059955596923828, "global_step": 632157, "epoch": 7616} {"train_loss": -27.8837890625, "global_step": 632158, "epoch": 7616} {"train_loss": -28.322614669799805, "global_step": 632159, "epoch": 7616} {"train_loss": -27.762372970581055, "global_step": 632160, "epoch": 7616} {"train_loss": -28.306669235229492, "global_step": 632161, "epoch": 7616} {"train_loss": -28.0550537109375, "global_step": 632162, "epoch": 7616} {"train_loss": -27.938562393188477, "global_step": 632163, "epoch": 7616} {"train_loss": -28.477645874023438, "global_step": 632164, "epoch": 7616} {"train_loss": -28.0546932220459, "global_step": 632165, "epoch": 7616} {"train_loss": -28.42142677307129, "global_step": 632166, "epoch": 7616} {"train_loss": -28.157514572143555, "global_step": 632167, "epoch": 7616} {"train_loss": -28.020950317382812, "global_step": 632168, "epoch": 7616} {"train_loss": -28.23426628112793, "global_step": 632169, "epoch": 7616} {"train_loss": -27.91993522644043, "global_step": 632170, "epoch": 7616} {"train_loss": -28.4908447265625, "global_step": 632171, "epoch": 7616} {"train_loss": -28.325061798095703, "global_step": 632172, "epoch": 7616} {"train_loss": -28.122303009033203, "global_step": 632173, "epoch": 7616} {"train_loss": -28.57916259765625, "global_step": 632174, "epoch": 7616} {"train_loss": -28.103363037109375, "global_step": 632175, "epoch": 7616} {"train_loss": -28.243513107299805, "global_step": 632176, "epoch": 7616} {"train_loss": -28.087299346923828, "global_step": 632177, "epoch": 7616} {"train_loss": -28.116275787353516, "global_step": 632178, "epoch": 7616} {"train_loss": -27.235631942749023, "global_step": 632179, "epoch": 7616} {"train_loss": -26.79559898376465, "global_step": 632180, "epoch": 7616} {"train_loss": -26.78704261779785, "global_step": 632181, "epoch": 7616} {"train_loss": -27.34316062927246, "global_step": 632182, "epoch": 7616} {"train_loss": -27.885568618774414, "global_step": 632183, "epoch": 7616} {"train_loss": -27.6961612701416, "global_step": 632184, "epoch": 7616} {"train_loss": -27.845712661743164, "global_step": 632185, "epoch": 7616} {"train_loss": -28.067581176757812, "global_step": 632186, "epoch": 7616} {"train_loss": -27.66194725036621, "global_step": 632187, "epoch": 7616} {"train_loss": -28.240406036376953, "global_step": 632188, "epoch": 7616} {"train_loss": -27.865020751953125, "global_step": 632189, "epoch": 7616} {"train_loss": -27.206491470336914, "global_step": 632190, "epoch": 7616} {"train_loss": -27.726537704467773, "global_step": 632191, "epoch": 7616} {"train_loss": -27.621206283569336, "global_step": 632192, "epoch": 7616} {"train_loss": -27.705419540405273, "global_step": 632193, "epoch": 7616} {"train_loss": -27.847126007080078, "global_step": 632194, "epoch": 7616} {"train_loss": -27.791601181030273, "global_step": 632195, "epoch": 7616} {"train_loss": -27.902069091796875, "global_step": 632196, "epoch": 7616} {"train_loss": -27.98761558532715, "global_step": 632197, "epoch": 7616} {"train_loss": -27.820104598999023, "global_step": 632198, "epoch": 7616} {"train_loss": -28.223495483398438, "global_step": 632199, "epoch": 7616} {"train_loss": -28.038272857666016, "global_step": 632200, "epoch": 7616} {"train_loss": -28.206268310546875, "global_step": 632201, "epoch": 7616} {"train_loss": -27.971969604492188, "global_step": 632202, "epoch": 7616} {"train_loss": -28.035619735717773, "global_step": 632203, "epoch": 7616} {"train_loss": -28.006650924682617, "global_step": 632204, "epoch": 7616} {"train_loss": -27.796483993530273, "global_step": 632205, "epoch": 7616} {"train_loss": -28.004419326782227, "global_step": 632206, "epoch": 7616} {"train_loss": -28.12531852722168, "global_step": 632207, "epoch": 7616} {"train_loss": -28.407012939453125, "global_step": 632208, "epoch": 7616} {"train_loss": -28.071577072143555, "global_step": 632209, "epoch": 7616} {"train_loss": -27.819206513554217, "global_step": 632210, "epoch": 7616, "val_loss": 6944620.0} {"train_loss": -27.765024185180664, "global_step": 632211, "epoch": 7617} {"train_loss": -28.02210807800293, "global_step": 632212, "epoch": 7617} {"train_loss": -27.887042999267578, "global_step": 632213, "epoch": 7617} {"train_loss": -27.901092529296875, "global_step": 632214, "epoch": 7617} {"train_loss": -27.936389923095703, "global_step": 632215, "epoch": 7617} {"train_loss": -28.080875396728516, "global_step": 632216, "epoch": 7617} {"train_loss": -28.305387496948242, "global_step": 632217, "epoch": 7617} {"train_loss": -28.1998233795166, "global_step": 632218, "epoch": 7617} {"train_loss": -28.28515625, "global_step": 632219, "epoch": 7617} {"train_loss": -28.300207138061523, "global_step": 632220, "epoch": 7617} {"train_loss": -28.4865665435791, "global_step": 632221, "epoch": 7617} {"train_loss": -28.346643447875977, "global_step": 632222, "epoch": 7617} {"train_loss": -27.803394317626953, "global_step": 632223, "epoch": 7617} {"train_loss": -28.587392807006836, "global_step": 632224, "epoch": 7617} {"train_loss": -28.001367568969727, "global_step": 632225, "epoch": 7617} {"train_loss": -28.20849609375, "global_step": 632226, "epoch": 7617} {"train_loss": -28.0755615234375, "global_step": 632227, "epoch": 7617} {"train_loss": -28.3100528717041, "global_step": 632228, "epoch": 7617} {"train_loss": -27.92061424255371, "global_step": 632229, "epoch": 7617} {"train_loss": -28.547565460205078, "global_step": 632230, "epoch": 7617} {"train_loss": -28.38471031188965, "global_step": 632231, "epoch": 7617} {"train_loss": -28.2338809967041, "global_step": 632232, "epoch": 7617} {"train_loss": -28.15130043029785, "global_step": 632233, "epoch": 7617} {"train_loss": -28.0611629486084, "global_step": 632234, "epoch": 7617} {"train_loss": -28.090789794921875, "global_step": 632235, "epoch": 7617} {"train_loss": -28.22113037109375, "global_step": 632236, "epoch": 7617} {"train_loss": -28.249374389648438, "global_step": 632237, "epoch": 7617} {"train_loss": -28.071081161499023, "global_step": 632238, "epoch": 7617} {"train_loss": -28.436670303344727, "global_step": 632239, "epoch": 7617} {"train_loss": -28.047698974609375, "global_step": 632240, "epoch": 7617} {"train_loss": -28.35464859008789, "global_step": 632241, "epoch": 7617} {"train_loss": -28.725461959838867, "global_step": 632242, "epoch": 7617} {"train_loss": -28.129560470581055, "global_step": 632243, "epoch": 7617} {"train_loss": -28.642236709594727, "global_step": 632244, "epoch": 7617} {"train_loss": -28.40912437438965, "global_step": 632245, "epoch": 7617} {"train_loss": -28.3992919921875, "global_step": 632246, "epoch": 7617} {"train_loss": -28.642337799072266, "global_step": 632247, "epoch": 7617} {"train_loss": -28.123144149780273, "global_step": 632248, "epoch": 7617} {"train_loss": -28.4339542388916, "global_step": 632249, "epoch": 7617} {"train_loss": -28.4638729095459, "global_step": 632250, "epoch": 7617} {"train_loss": -28.693897247314453, "global_step": 632251, "epoch": 7617} {"train_loss": -28.5349178314209, "global_step": 632252, "epoch": 7617} {"train_loss": -28.463117599487305, "global_step": 632253, "epoch": 7617} {"train_loss": -28.0927677154541, "global_step": 632254, "epoch": 7617} {"train_loss": -28.12639808654785, "global_step": 632255, "epoch": 7617} {"train_loss": -28.4356632232666, "global_step": 632256, "epoch": 7617} {"train_loss": -28.330854415893555, "global_step": 632257, "epoch": 7617} {"train_loss": -28.287139892578125, "global_step": 632258, "epoch": 7617} {"train_loss": -27.72211265563965, "global_step": 632259, "epoch": 7617} {"train_loss": -27.131336212158203, "global_step": 632260, "epoch": 7617} {"train_loss": -26.168460845947266, "global_step": 632261, "epoch": 7617} {"train_loss": -26.6909122467041, "global_step": 632262, "epoch": 7617} {"train_loss": -27.9202823638916, "global_step": 632263, "epoch": 7617} {"train_loss": -27.012134552001953, "global_step": 632264, "epoch": 7617} {"train_loss": -28.510522842407227, "global_step": 632265, "epoch": 7617} {"train_loss": -27.763004302978516, "global_step": 632266, "epoch": 7617} {"train_loss": -27.7420711517334, "global_step": 632267, "epoch": 7617} {"train_loss": -27.157489776611328, "global_step": 632268, "epoch": 7617} {"train_loss": -27.96009635925293, "global_step": 632269, "epoch": 7617} {"train_loss": -27.899137496948242, "global_step": 632270, "epoch": 7617} {"train_loss": -27.849409103393555, "global_step": 632271, "epoch": 7617} {"train_loss": -27.985517501831055, "global_step": 632272, "epoch": 7617} {"train_loss": -27.932373046875, "global_step": 632273, "epoch": 7617} {"train_loss": -28.05901527404785, "global_step": 632274, "epoch": 7617} {"train_loss": -28.35617446899414, "global_step": 632275, "epoch": 7617} {"train_loss": -27.974853515625, "global_step": 632276, "epoch": 7617} {"train_loss": -28.150165557861328, "global_step": 632277, "epoch": 7617} {"train_loss": -28.26802635192871, "global_step": 632278, "epoch": 7617} {"train_loss": -27.9492130279541, "global_step": 632279, "epoch": 7617} {"train_loss": -28.117786407470703, "global_step": 632280, "epoch": 7617} {"train_loss": -28.049224853515625, "global_step": 632281, "epoch": 7617} {"train_loss": -27.54646873474121, "global_step": 632282, "epoch": 7617} {"train_loss": -28.083478927612305, "global_step": 632283, "epoch": 7617} {"train_loss": -27.880172729492188, "global_step": 632284, "epoch": 7617} {"train_loss": -28.01661491394043, "global_step": 632285, "epoch": 7617} {"train_loss": -27.59820556640625, "global_step": 632286, "epoch": 7617} {"train_loss": -28.12017250061035, "global_step": 632287, "epoch": 7617} {"train_loss": -28.337499618530273, "global_step": 632288, "epoch": 7617} {"train_loss": -28.492151260375977, "global_step": 632289, "epoch": 7617} {"train_loss": -28.550336837768555, "global_step": 632290, "epoch": 7617} {"train_loss": -28.165241241455078, "global_step": 632291, "epoch": 7617} {"train_loss": -28.093982696533203, "global_step": 632292, "epoch": 7617} {"train_loss": -28.088169051940184, "global_step": 632293, "epoch": 7617, "val_loss": 7006816.0} {"train_loss": -28.06403160095215, "global_step": 632294, "epoch": 7618} {"train_loss": -27.554859161376953, "global_step": 632295, "epoch": 7618} {"train_loss": -27.25013542175293, "global_step": 632296, "epoch": 7618} {"train_loss": -27.095788955688477, "global_step": 632297, "epoch": 7618} {"train_loss": -27.086267471313477, "global_step": 632298, "epoch": 7618} {"train_loss": -27.57337760925293, "global_step": 632299, "epoch": 7618} {"train_loss": -27.08429527282715, "global_step": 632300, "epoch": 7618} {"train_loss": -27.917158126831055, "global_step": 632301, "epoch": 7618} {"train_loss": -27.430234909057617, "global_step": 632302, "epoch": 7618} {"train_loss": -27.787311553955078, "global_step": 632303, "epoch": 7618} {"train_loss": -27.592060089111328, "global_step": 632304, "epoch": 7618} {"train_loss": -27.890140533447266, "global_step": 632305, "epoch": 7618} {"train_loss": -27.277301788330078, "global_step": 632306, "epoch": 7618} {"train_loss": -27.698638916015625, "global_step": 632307, "epoch": 7618} {"train_loss": -27.777387619018555, "global_step": 632308, "epoch": 7618} {"train_loss": -27.757333755493164, "global_step": 632309, "epoch": 7618} {"train_loss": -27.936323165893555, "global_step": 632310, "epoch": 7618} {"train_loss": -27.645954132080078, "global_step": 632311, "epoch": 7618} {"train_loss": -27.845468521118164, "global_step": 632312, "epoch": 7618} {"train_loss": -27.846588134765625, "global_step": 632313, "epoch": 7618} {"train_loss": -28.0602970123291, "global_step": 632314, "epoch": 7618} {"train_loss": -28.286413192749023, "global_step": 632315, "epoch": 7618} {"train_loss": -27.657119750976562, "global_step": 632316, "epoch": 7618} {"train_loss": -28.049509048461914, "global_step": 632317, "epoch": 7618} {"train_loss": -28.255767822265625, "global_step": 632318, "epoch": 7618} {"train_loss": -28.26582145690918, "global_step": 632319, "epoch": 7618} {"train_loss": -28.241596221923828, "global_step": 632320, "epoch": 7618} {"train_loss": -28.05474281311035, "global_step": 632321, "epoch": 7618} {"train_loss": -28.434772491455078, "global_step": 632322, "epoch": 7618} {"train_loss": -27.873279571533203, "global_step": 632323, "epoch": 7618} {"train_loss": -28.230072021484375, "global_step": 632324, "epoch": 7618} {"train_loss": -28.21955680847168, "global_step": 632325, "epoch": 7618} {"train_loss": -27.934680938720703, "global_step": 632326, "epoch": 7618} {"train_loss": -27.962818145751953, "global_step": 632327, "epoch": 7618} {"train_loss": -28.426542282104492, "global_step": 632328, "epoch": 7618} {"train_loss": -27.916778564453125, "global_step": 632329, "epoch": 7618} {"train_loss": -28.261560440063477, "global_step": 632330, "epoch": 7618} {"train_loss": -28.486356735229492, "global_step": 632331, "epoch": 7618} {"train_loss": -28.148361206054688, "global_step": 632332, "epoch": 7618} {"train_loss": -28.379796981811523, "global_step": 632333, "epoch": 7618} {"train_loss": -28.299259185791016, "global_step": 632334, "epoch": 7618} {"train_loss": -28.144128799438477, "global_step": 632335, "epoch": 7618} {"train_loss": -28.63901710510254, "global_step": 632336, "epoch": 7618} {"train_loss": -28.2624454498291, "global_step": 632337, "epoch": 7618} {"train_loss": -28.363494873046875, "global_step": 632338, "epoch": 7618} {"train_loss": -28.4945011138916, "global_step": 632339, "epoch": 7618} {"train_loss": -28.358800888061523, "global_step": 632340, "epoch": 7618} {"train_loss": -28.545835494995117, "global_step": 632341, "epoch": 7618} {"train_loss": -28.384443283081055, "global_step": 632342, "epoch": 7618} {"train_loss": -28.359411239624023, "global_step": 632343, "epoch": 7618} {"train_loss": -27.98850440979004, "global_step": 632344, "epoch": 7618} {"train_loss": -28.410125732421875, "global_step": 632345, "epoch": 7618} {"train_loss": -27.643827438354492, "global_step": 632346, "epoch": 7618} {"train_loss": -27.503253936767578, "global_step": 632347, "epoch": 7618} {"train_loss": -27.426807403564453, "global_step": 632348, "epoch": 7618} {"train_loss": -27.712360382080078, "global_step": 632349, "epoch": 7618} {"train_loss": -28.290674209594727, "global_step": 632350, "epoch": 7618} {"train_loss": -27.581045150756836, "global_step": 632351, "epoch": 7618} {"train_loss": -27.70697021484375, "global_step": 632352, "epoch": 7618} {"train_loss": -27.864465713500977, "global_step": 632353, "epoch": 7618} {"train_loss": -28.613855361938477, "global_step": 632354, "epoch": 7618} {"train_loss": -28.389982223510742, "global_step": 632355, "epoch": 7618} {"train_loss": -27.971418380737305, "global_step": 632356, "epoch": 7618} {"train_loss": -28.07341957092285, "global_step": 632357, "epoch": 7618} {"train_loss": -28.440866470336914, "global_step": 632358, "epoch": 7618} {"train_loss": -28.276233673095703, "global_step": 632359, "epoch": 7618} {"train_loss": -28.34503746032715, "global_step": 632360, "epoch": 7618} {"train_loss": -28.10943603515625, "global_step": 632361, "epoch": 7618} {"train_loss": -28.2305908203125, "global_step": 632362, "epoch": 7618} {"train_loss": -28.284448623657227, "global_step": 632363, "epoch": 7618} {"train_loss": -28.352834701538086, "global_step": 632364, "epoch": 7618} {"train_loss": -28.113998413085938, "global_step": 632365, "epoch": 7618} {"train_loss": -28.234338760375977, "global_step": 632366, "epoch": 7618} {"train_loss": -27.947057723999023, "global_step": 632367, "epoch": 7618} {"train_loss": -28.264596939086914, "global_step": 632368, "epoch": 7618} {"train_loss": -28.312896728515625, "global_step": 632369, "epoch": 7618} {"train_loss": -28.219486236572266, "global_step": 632370, "epoch": 7618} {"train_loss": -28.83283042907715, "global_step": 632371, "epoch": 7618} {"train_loss": -28.410688400268555, "global_step": 632372, "epoch": 7618} {"train_loss": -28.517078399658203, "global_step": 632373, "epoch": 7618} {"train_loss": -28.139368057250977, "global_step": 632374, "epoch": 7618} {"train_loss": -28.450550079345703, "global_step": 632375, "epoch": 7618} {"train_loss": -28.043091463755413, "global_step": 632376, "epoch": 7618, "val_loss": 6977529.5} {"train_loss": -27.758466720581055, "global_step": 632377, "epoch": 7619} {"train_loss": -26.5557861328125, "global_step": 632378, "epoch": 7619} {"train_loss": -27.789630889892578, "global_step": 632379, "epoch": 7619} {"train_loss": -27.34120750427246, "global_step": 632380, "epoch": 7619} {"train_loss": -26.8370304107666, "global_step": 632381, "epoch": 7619} {"train_loss": -27.41468620300293, "global_step": 632382, "epoch": 7619} {"train_loss": -27.730335235595703, "global_step": 632383, "epoch": 7619} {"train_loss": -27.418598175048828, "global_step": 632384, "epoch": 7619} {"train_loss": -27.36055564880371, "global_step": 632385, "epoch": 7619} {"train_loss": -27.255691528320312, "global_step": 632386, "epoch": 7619} {"train_loss": -27.240997314453125, "global_step": 632387, "epoch": 7619} {"train_loss": -27.81878662109375, "global_step": 632388, "epoch": 7619} {"train_loss": -27.286001205444336, "global_step": 632389, "epoch": 7619} {"train_loss": -27.362905502319336, "global_step": 632390, "epoch": 7619} {"train_loss": -27.83930015563965, "global_step": 632391, "epoch": 7619} {"train_loss": -27.504819869995117, "global_step": 632392, "epoch": 7619} {"train_loss": -27.89328384399414, "global_step": 632393, "epoch": 7619} {"train_loss": -27.762577056884766, "global_step": 632394, "epoch": 7619} {"train_loss": -27.634811401367188, "global_step": 632395, "epoch": 7619} {"train_loss": -27.84885597229004, "global_step": 632396, "epoch": 7619} {"train_loss": -27.843341827392578, "global_step": 632397, "epoch": 7619} {"train_loss": -27.92447280883789, "global_step": 632398, "epoch": 7619} {"train_loss": -27.839645385742188, "global_step": 632399, "epoch": 7619} {"train_loss": -27.73409080505371, "global_step": 632400, "epoch": 7619} {"train_loss": -27.894153594970703, "global_step": 632401, "epoch": 7619} {"train_loss": -27.77202796936035, "global_step": 632402, "epoch": 7619} {"train_loss": -27.624448776245117, "global_step": 632403, "epoch": 7619} {"train_loss": -27.98468017578125, "global_step": 632404, "epoch": 7619} {"train_loss": -28.096389770507812, "global_step": 632405, "epoch": 7619} {"train_loss": -28.099130630493164, "global_step": 632406, "epoch": 7619} {"train_loss": -28.233081817626953, "global_step": 632407, "epoch": 7619} {"train_loss": -27.802234649658203, "global_step": 632408, "epoch": 7619} {"train_loss": -28.202848434448242, "global_step": 632409, "epoch": 7619} {"train_loss": -27.85072135925293, "global_step": 632410, "epoch": 7619} {"train_loss": -28.198514938354492, "global_step": 632411, "epoch": 7619} {"train_loss": -28.01704216003418, "global_step": 632412, "epoch": 7619} {"train_loss": -28.45575523376465, "global_step": 632413, "epoch": 7619} {"train_loss": -28.304899215698242, "global_step": 632414, "epoch": 7619} {"train_loss": -27.96183204650879, "global_step": 632415, "epoch": 7619} {"train_loss": -28.277708053588867, "global_step": 632416, "epoch": 7619} {"train_loss": -28.232282638549805, "global_step": 632417, "epoch": 7619} {"train_loss": -28.65168571472168, "global_step": 632418, "epoch": 7619} {"train_loss": -28.279157638549805, "global_step": 632419, "epoch": 7619} {"train_loss": -27.924779891967773, "global_step": 632420, "epoch": 7619} {"train_loss": -28.113800048828125, "global_step": 632421, "epoch": 7619} {"train_loss": -27.88825035095215, "global_step": 632422, "epoch": 7619} {"train_loss": -28.19769859313965, "global_step": 632423, "epoch": 7619} {"train_loss": -28.069807052612305, "global_step": 632424, "epoch": 7619} {"train_loss": -28.23505210876465, "global_step": 632425, "epoch": 7619} {"train_loss": -28.077865600585938, "global_step": 632426, "epoch": 7619} {"train_loss": -27.86885643005371, "global_step": 632427, "epoch": 7619} {"train_loss": -28.163679122924805, "global_step": 632428, "epoch": 7619} {"train_loss": -28.236188888549805, "global_step": 632429, "epoch": 7619} {"train_loss": -27.931379318237305, "global_step": 632430, "epoch": 7619} {"train_loss": -27.89246940612793, "global_step": 632431, "epoch": 7619} {"train_loss": -28.273406982421875, "global_step": 632432, "epoch": 7619} {"train_loss": -28.03696632385254, "global_step": 632433, "epoch": 7619} {"train_loss": -27.592578887939453, "global_step": 632434, "epoch": 7619} {"train_loss": -27.323883056640625, "global_step": 632435, "epoch": 7619} {"train_loss": -27.057025909423828, "global_step": 632436, "epoch": 7619} {"train_loss": -26.820348739624023, "global_step": 632437, "epoch": 7619} {"train_loss": -28.142719268798828, "global_step": 632438, "epoch": 7619} {"train_loss": -27.3651065826416, "global_step": 632439, "epoch": 7619} {"train_loss": -27.71253776550293, "global_step": 632440, "epoch": 7619} {"train_loss": -27.957441329956055, "global_step": 632441, "epoch": 7619} {"train_loss": -27.967710494995117, "global_step": 632442, "epoch": 7619} {"train_loss": -28.074493408203125, "global_step": 632443, "epoch": 7619} {"train_loss": -28.01490592956543, "global_step": 632444, "epoch": 7619} {"train_loss": -27.847259521484375, "global_step": 632445, "epoch": 7619} {"train_loss": -27.97021484375, "global_step": 632446, "epoch": 7619} {"train_loss": -27.633642196655273, "global_step": 632447, "epoch": 7619} {"train_loss": -28.046314239501953, "global_step": 632448, "epoch": 7619} {"train_loss": -28.03950309753418, "global_step": 632449, "epoch": 7619} {"train_loss": -27.876203536987305, "global_step": 632450, "epoch": 7619} {"train_loss": -27.586584091186523, "global_step": 632451, "epoch": 7619} {"train_loss": -27.785669326782227, "global_step": 632452, "epoch": 7619} {"train_loss": -28.09453773498535, "global_step": 632453, "epoch": 7619} {"train_loss": -28.0167293548584, "global_step": 632454, "epoch": 7619} {"train_loss": -27.942625045776367, "global_step": 632455, "epoch": 7619} {"train_loss": -27.978918075561523, "global_step": 632456, "epoch": 7619} {"train_loss": -28.071874618530273, "global_step": 632457, "epoch": 7619} {"train_loss": -27.75530433654785, "global_step": 632458, "epoch": 7619} {"train_loss": -27.85947995013501, "global_step": 632459, "epoch": 7619, "val_loss": 7010231.5} {"train_loss": -26.433908462524414, "global_step": 632460, "epoch": 7620} {"train_loss": -26.959218978881836, "global_step": 632461, "epoch": 7620} {"train_loss": -27.56110954284668, "global_step": 632462, "epoch": 7620} {"train_loss": -26.871301651000977, "global_step": 632463, "epoch": 7620} {"train_loss": -27.3634090423584, "global_step": 632464, "epoch": 7620} {"train_loss": -27.24212646484375, "global_step": 632465, "epoch": 7620} {"train_loss": -27.06342887878418, "global_step": 632466, "epoch": 7620} {"train_loss": -27.668607711791992, "global_step": 632467, "epoch": 7620} {"train_loss": -27.466474533081055, "global_step": 632468, "epoch": 7620} {"train_loss": -27.613861083984375, "global_step": 632469, "epoch": 7620} {"train_loss": -27.2285213470459, "global_step": 632470, "epoch": 7620} {"train_loss": -27.855865478515625, "global_step": 632471, "epoch": 7620} {"train_loss": -27.303298950195312, "global_step": 632472, "epoch": 7620} {"train_loss": -27.963825225830078, "global_step": 632473, "epoch": 7620} {"train_loss": -27.747419357299805, "global_step": 632474, "epoch": 7620} {"train_loss": -27.31910514831543, "global_step": 632475, "epoch": 7620} {"train_loss": -27.484201431274414, "global_step": 632476, "epoch": 7620} {"train_loss": -27.83570671081543, "global_step": 632477, "epoch": 7620} {"train_loss": -27.96762466430664, "global_step": 632478, "epoch": 7620} {"train_loss": -27.96721839904785, "global_step": 632479, "epoch": 7620} {"train_loss": -27.966272354125977, "global_step": 632480, "epoch": 7620} {"train_loss": -27.609298706054688, "global_step": 632481, "epoch": 7620} {"train_loss": -28.141590118408203, "global_step": 632482, "epoch": 7620} {"train_loss": -27.884977340698242, "global_step": 632483, "epoch": 7620} {"train_loss": -27.924823760986328, "global_step": 632484, "epoch": 7620} {"train_loss": -28.091510772705078, "global_step": 632485, "epoch": 7620} {"train_loss": -27.931598663330078, "global_step": 632486, "epoch": 7620} {"train_loss": -28.108585357666016, "global_step": 632487, "epoch": 7620} {"train_loss": -28.04571533203125, "global_step": 632488, "epoch": 7620} {"train_loss": -27.919021606445312, "global_step": 632489, "epoch": 7620} {"train_loss": -27.931806564331055, "global_step": 632490, "epoch": 7620} {"train_loss": -28.37506675720215, "global_step": 632491, "epoch": 7620} {"train_loss": -28.372974395751953, "global_step": 632492, "epoch": 7620} {"train_loss": -28.11753273010254, "global_step": 632493, "epoch": 7620} {"train_loss": -28.421497344970703, "global_step": 632494, "epoch": 7620} {"train_loss": -28.0842227935791, "global_step": 632495, "epoch": 7620} {"train_loss": -28.45355224609375, "global_step": 632496, "epoch": 7620} {"train_loss": -28.611764907836914, "global_step": 632497, "epoch": 7620} {"train_loss": -28.659637451171875, "global_step": 632498, "epoch": 7620} {"train_loss": -28.13007926940918, "global_step": 632499, "epoch": 7620} {"train_loss": -28.282306671142578, "global_step": 632500, "epoch": 7620} {"train_loss": -28.200830459594727, "global_step": 632501, "epoch": 7620} {"train_loss": -28.34524917602539, "global_step": 632502, "epoch": 7620} {"train_loss": -28.606159210205078, "global_step": 632503, "epoch": 7620} {"train_loss": -28.2740421295166, "global_step": 632504, "epoch": 7620} {"train_loss": -28.45990562438965, "global_step": 632505, "epoch": 7620} {"train_loss": -28.389633178710938, "global_step": 632506, "epoch": 7620} {"train_loss": -28.56927490234375, "global_step": 632507, "epoch": 7620} {"train_loss": -28.498218536376953, "global_step": 632508, "epoch": 7620} {"train_loss": -28.810827255249023, "global_step": 632509, "epoch": 7620} {"train_loss": -28.447595596313477, "global_step": 632510, "epoch": 7620} {"train_loss": -28.593488693237305, "global_step": 632511, "epoch": 7620} {"train_loss": -28.571945190429688, "global_step": 632512, "epoch": 7620} {"train_loss": -28.55010414123535, "global_step": 632513, "epoch": 7620} {"train_loss": -28.359149932861328, "global_step": 632514, "epoch": 7620} {"train_loss": -28.6485538482666, "global_step": 632515, "epoch": 7620} {"train_loss": -28.336400985717773, "global_step": 632516, "epoch": 7620} {"train_loss": -28.127334594726562, "global_step": 632517, "epoch": 7620} {"train_loss": -28.4480037689209, "global_step": 632518, "epoch": 7620} {"train_loss": -28.627283096313477, "global_step": 632519, "epoch": 7620} {"train_loss": -28.58599853515625, "global_step": 632520, "epoch": 7620} {"train_loss": -28.611286163330078, "global_step": 632521, "epoch": 7620} {"train_loss": -28.264495849609375, "global_step": 632522, "epoch": 7620} {"train_loss": -28.229480743408203, "global_step": 632523, "epoch": 7620} {"train_loss": -28.188444137573242, "global_step": 632524, "epoch": 7620} {"train_loss": -28.05048179626465, "global_step": 632525, "epoch": 7620} {"train_loss": -27.689645767211914, "global_step": 632526, "epoch": 7620} {"train_loss": -27.461095809936523, "global_step": 632527, "epoch": 7620} {"train_loss": -27.244140625, "global_step": 632528, "epoch": 7620} {"train_loss": -27.2198429107666, "global_step": 632529, "epoch": 7620} {"train_loss": -26.45025634765625, "global_step": 632530, "epoch": 7620} {"train_loss": -27.24224281311035, "global_step": 632531, "epoch": 7620} {"train_loss": -27.835294723510742, "global_step": 632532, "epoch": 7620} {"train_loss": -27.216352462768555, "global_step": 632533, "epoch": 7620} {"train_loss": -27.638586044311523, "global_step": 632534, "epoch": 7620} {"train_loss": -27.644947052001953, "global_step": 632535, "epoch": 7620} {"train_loss": -27.817035675048828, "global_step": 632536, "epoch": 7620} {"train_loss": -27.453113555908203, "global_step": 632537, "epoch": 7620} {"train_loss": -27.96687126159668, "global_step": 632538, "epoch": 7620} {"train_loss": -27.90654945373535, "global_step": 632539, "epoch": 7620} {"train_loss": -27.853046417236328, "global_step": 632540, "epoch": 7620} {"train_loss": -27.94807243347168, "global_step": 632541, "epoch": 7620} {"train_loss": -27.95601651754724, "global_step": 632542, "epoch": 7620, "val_loss": 6951577.0} {"train_loss": -26.951465606689453, "global_step": 632543, "epoch": 7621} {"train_loss": -27.13067054748535, "global_step": 632544, "epoch": 7621} {"train_loss": -27.077695846557617, "global_step": 632545, "epoch": 7621} {"train_loss": -27.146963119506836, "global_step": 632546, "epoch": 7621} {"train_loss": -26.95051383972168, "global_step": 632547, "epoch": 7621} {"train_loss": -26.83794593811035, "global_step": 632548, "epoch": 7621} {"train_loss": -27.070627212524414, "global_step": 632549, "epoch": 7621} {"train_loss": -26.999832153320312, "global_step": 632550, "epoch": 7621} {"train_loss": -27.596527099609375, "global_step": 632551, "epoch": 7621} {"train_loss": -27.004117965698242, "global_step": 632552, "epoch": 7621} {"train_loss": -27.397064208984375, "global_step": 632553, "epoch": 7621} {"train_loss": -27.419523239135742, "global_step": 632554, "epoch": 7621} {"train_loss": -27.370731353759766, "global_step": 632555, "epoch": 7621} {"train_loss": -27.271549224853516, "global_step": 632556, "epoch": 7621} {"train_loss": -27.684179306030273, "global_step": 632557, "epoch": 7621} {"train_loss": -27.49936866760254, "global_step": 632558, "epoch": 7621} {"train_loss": -27.178022384643555, "global_step": 632559, "epoch": 7621} {"train_loss": -27.907514572143555, "global_step": 632560, "epoch": 7621} {"train_loss": -27.50079345703125, "global_step": 632561, "epoch": 7621} {"train_loss": -27.465423583984375, "global_step": 632562, "epoch": 7621} {"train_loss": -27.34122085571289, "global_step": 632563, "epoch": 7621} {"train_loss": -27.20684814453125, "global_step": 632564, "epoch": 7621} {"train_loss": -27.632654190063477, "global_step": 632565, "epoch": 7621} {"train_loss": -27.595144271850586, "global_step": 632566, "epoch": 7621} {"train_loss": -28.072233200073242, "global_step": 632567, "epoch": 7621} {"train_loss": -27.775110244750977, "global_step": 632568, "epoch": 7621} {"train_loss": -27.962656021118164, "global_step": 632569, "epoch": 7621} {"train_loss": -28.003076553344727, "global_step": 632570, "epoch": 7621} {"train_loss": -27.365341186523438, "global_step": 632571, "epoch": 7621} {"train_loss": -28.114459991455078, "global_step": 632572, "epoch": 7621} {"train_loss": -27.929458618164062, "global_step": 632573, "epoch": 7621} {"train_loss": -27.810102462768555, "global_step": 632574, "epoch": 7621} {"train_loss": -27.935333251953125, "global_step": 632575, "epoch": 7621} {"train_loss": -28.1740665435791, "global_step": 632576, "epoch": 7621} {"train_loss": -28.090641021728516, "global_step": 632577, "epoch": 7621} {"train_loss": -28.20245933532715, "global_step": 632578, "epoch": 7621} {"train_loss": -28.0733642578125, "global_step": 632579, "epoch": 7621} {"train_loss": -28.232084274291992, "global_step": 632580, "epoch": 7621} {"train_loss": -27.732919692993164, "global_step": 632581, "epoch": 7621} {"train_loss": -28.128448486328125, "global_step": 632582, "epoch": 7621} {"train_loss": -28.122699737548828, "global_step": 632583, "epoch": 7621} {"train_loss": -28.51108741760254, "global_step": 632584, "epoch": 7621} {"train_loss": -27.644744873046875, "global_step": 632585, "epoch": 7621} {"train_loss": -28.189971923828125, "global_step": 632586, "epoch": 7621} {"train_loss": -28.159778594970703, "global_step": 632587, "epoch": 7621} {"train_loss": -28.170318603515625, "global_step": 632588, "epoch": 7621} {"train_loss": -28.332544326782227, "global_step": 632589, "epoch": 7621} {"train_loss": -28.406240463256836, "global_step": 632590, "epoch": 7621} {"train_loss": -28.327655792236328, "global_step": 632591, "epoch": 7621} {"train_loss": -28.415563583374023, "global_step": 632592, "epoch": 7621} {"train_loss": -28.307310104370117, "global_step": 632593, "epoch": 7621} {"train_loss": -28.23951530456543, "global_step": 632594, "epoch": 7621} {"train_loss": -28.778608322143555, "global_step": 632595, "epoch": 7621} {"train_loss": -28.217456817626953, "global_step": 632596, "epoch": 7621} {"train_loss": -28.394073486328125, "global_step": 632597, "epoch": 7621} {"train_loss": -28.153690338134766, "global_step": 632598, "epoch": 7621} {"train_loss": -28.485422134399414, "global_step": 632599, "epoch": 7621} {"train_loss": -28.11456298828125, "global_step": 632600, "epoch": 7621} {"train_loss": -28.774255752563477, "global_step": 632601, "epoch": 7621} {"train_loss": -27.9350643157959, "global_step": 632602, "epoch": 7621} {"train_loss": -27.87506675720215, "global_step": 632603, "epoch": 7621} {"train_loss": -28.126266479492188, "global_step": 632604, "epoch": 7621} {"train_loss": -28.081512451171875, "global_step": 632605, "epoch": 7621} {"train_loss": -28.261632919311523, "global_step": 632606, "epoch": 7621} {"train_loss": -28.222814559936523, "global_step": 632607, "epoch": 7621} {"train_loss": -28.04292106628418, "global_step": 632608, "epoch": 7621} {"train_loss": -27.938196182250977, "global_step": 632609, "epoch": 7621} {"train_loss": -28.224729537963867, "global_step": 632610, "epoch": 7621} {"train_loss": -28.3870849609375, "global_step": 632611, "epoch": 7621} {"train_loss": -27.366424560546875, "global_step": 632612, "epoch": 7621} {"train_loss": -27.131118774414062, "global_step": 632613, "epoch": 7621} {"train_loss": -28.43023681640625, "global_step": 632614, "epoch": 7621} {"train_loss": -27.967248916625977, "global_step": 632615, "epoch": 7621} {"train_loss": -27.52191162109375, "global_step": 632616, "epoch": 7621} {"train_loss": -28.09647560119629, "global_step": 632617, "epoch": 7621} {"train_loss": -27.531423568725586, "global_step": 632618, "epoch": 7621} {"train_loss": -28.341642379760742, "global_step": 632619, "epoch": 7621} {"train_loss": -27.70533561706543, "global_step": 632620, "epoch": 7621} {"train_loss": -28.4119815826416, "global_step": 632621, "epoch": 7621} {"train_loss": -28.30155372619629, "global_step": 632622, "epoch": 7621} {"train_loss": -28.403722763061523, "global_step": 632623, "epoch": 7621} {"train_loss": -28.123769760131836, "global_step": 632624, "epoch": 7621} {"train_loss": -27.85626609066883, "global_step": 632625, "epoch": 7621, "val_loss": 7002984.0} {"train_loss": -27.945327758789062, "global_step": 632626, "epoch": 7622} {"train_loss": -27.739171981811523, "global_step": 632627, "epoch": 7622} {"train_loss": -28.11041831970215, "global_step": 632628, "epoch": 7622} {"train_loss": -27.756671905517578, "global_step": 632629, "epoch": 7622} {"train_loss": -27.8901309967041, "global_step": 632630, "epoch": 7622} {"train_loss": -27.546979904174805, "global_step": 632631, "epoch": 7622} {"train_loss": -28.026960372924805, "global_step": 632632, "epoch": 7622} {"train_loss": -28.188291549682617, "global_step": 632633, "epoch": 7622} {"train_loss": -27.778425216674805, "global_step": 632634, "epoch": 7622} {"train_loss": -27.759313583374023, "global_step": 632635, "epoch": 7622} {"train_loss": -28.091083526611328, "global_step": 632636, "epoch": 7622} {"train_loss": -28.133392333984375, "global_step": 632637, "epoch": 7622} {"train_loss": -27.886926651000977, "global_step": 632638, "epoch": 7622} {"train_loss": -27.541900634765625, "global_step": 632639, "epoch": 7622} {"train_loss": -27.57557487487793, "global_step": 632640, "epoch": 7622} {"train_loss": -27.930028915405273, "global_step": 632641, "epoch": 7622} {"train_loss": -28.081451416015625, "global_step": 632642, "epoch": 7622} {"train_loss": -28.008935928344727, "global_step": 632643, "epoch": 7622} {"train_loss": -28.131732940673828, "global_step": 632644, "epoch": 7622} {"train_loss": -27.950519561767578, "global_step": 632645, "epoch": 7622} {"train_loss": -28.265766143798828, "global_step": 632646, "epoch": 7622} {"train_loss": -28.02652359008789, "global_step": 632647, "epoch": 7622} {"train_loss": -28.361865997314453, "global_step": 632648, "epoch": 7622} {"train_loss": -28.28476905822754, "global_step": 632649, "epoch": 7622} {"train_loss": -28.14691162109375, "global_step": 632650, "epoch": 7622} {"train_loss": -28.100299835205078, "global_step": 632651, "epoch": 7622} {"train_loss": -28.3132266998291, "global_step": 632652, "epoch": 7622} {"train_loss": -28.498626708984375, "global_step": 632653, "epoch": 7622} {"train_loss": -28.15337562561035, "global_step": 632654, "epoch": 7622} {"train_loss": -28.292510986328125, "global_step": 632655, "epoch": 7622} {"train_loss": -28.814924240112305, "global_step": 632656, "epoch": 7622} {"train_loss": -28.37025260925293, "global_step": 632657, "epoch": 7622} {"train_loss": -28.408727645874023, "global_step": 632658, "epoch": 7622} {"train_loss": -28.205102920532227, "global_step": 632659, "epoch": 7622} {"train_loss": -28.223413467407227, "global_step": 632660, "epoch": 7622} {"train_loss": -28.4276123046875, "global_step": 632661, "epoch": 7622} {"train_loss": -28.232330322265625, "global_step": 632662, "epoch": 7622} {"train_loss": -28.566974639892578, "global_step": 632663, "epoch": 7622} {"train_loss": -28.3786563873291, "global_step": 632664, "epoch": 7622} {"train_loss": -28.460575103759766, "global_step": 632665, "epoch": 7622} {"train_loss": -28.387903213500977, "global_step": 632666, "epoch": 7622} {"train_loss": -28.422061920166016, "global_step": 632667, "epoch": 7622} {"train_loss": -28.310575485229492, "global_step": 632668, "epoch": 7622} {"train_loss": -28.12481117248535, "global_step": 632669, "epoch": 7622} {"train_loss": -28.07736587524414, "global_step": 632670, "epoch": 7622} {"train_loss": -27.682470321655273, "global_step": 632671, "epoch": 7622} {"train_loss": -27.616443634033203, "global_step": 632672, "epoch": 7622} {"train_loss": -28.2127628326416, "global_step": 632673, "epoch": 7622} {"train_loss": -28.053852081298828, "global_step": 632674, "epoch": 7622} {"train_loss": -27.88142204284668, "global_step": 632675, "epoch": 7622} {"train_loss": -28.44733238220215, "global_step": 632676, "epoch": 7622} {"train_loss": -28.23813819885254, "global_step": 632677, "epoch": 7622} {"train_loss": -27.748456954956055, "global_step": 632678, "epoch": 7622} {"train_loss": -28.19795036315918, "global_step": 632679, "epoch": 7622} {"train_loss": -28.016998291015625, "global_step": 632680, "epoch": 7622} {"train_loss": -28.40899658203125, "global_step": 632681, "epoch": 7622} {"train_loss": -28.167449951171875, "global_step": 632682, "epoch": 7622} {"train_loss": -28.200559616088867, "global_step": 632683, "epoch": 7622} {"train_loss": -28.50229835510254, "global_step": 632684, "epoch": 7622} {"train_loss": -27.99237060546875, "global_step": 632685, "epoch": 7622} {"train_loss": -28.190555572509766, "global_step": 632686, "epoch": 7622} {"train_loss": -28.315399169921875, "global_step": 632687, "epoch": 7622} {"train_loss": -28.11427879333496, "global_step": 632688, "epoch": 7622} {"train_loss": -28.28739356994629, "global_step": 632689, "epoch": 7622} {"train_loss": -28.3370304107666, "global_step": 632690, "epoch": 7622} {"train_loss": -27.89471435546875, "global_step": 632691, "epoch": 7622} {"train_loss": -28.57842445373535, "global_step": 632692, "epoch": 7622} {"train_loss": -28.0701904296875, "global_step": 632693, "epoch": 7622} {"train_loss": -28.620502471923828, "global_step": 632694, "epoch": 7622} {"train_loss": -28.248804092407227, "global_step": 632695, "epoch": 7622} {"train_loss": -28.360815048217773, "global_step": 632696, "epoch": 7622} {"train_loss": -28.310754776000977, "global_step": 632697, "epoch": 7622} {"train_loss": -28.046979904174805, "global_step": 632698, "epoch": 7622} {"train_loss": -28.395355224609375, "global_step": 632699, "epoch": 7622} {"train_loss": -28.471038818359375, "global_step": 632700, "epoch": 7622} {"train_loss": -28.533090591430664, "global_step": 632701, "epoch": 7622} {"train_loss": -28.01337242126465, "global_step": 632702, "epoch": 7622} {"train_loss": -28.09531593322754, "global_step": 632703, "epoch": 7622} {"train_loss": -28.06064796447754, "global_step": 632704, "epoch": 7622} {"train_loss": -28.00656509399414, "global_step": 632705, "epoch": 7622} {"train_loss": -27.985580444335938, "global_step": 632706, "epoch": 7622} {"train_loss": -28.369688034057617, "global_step": 632707, "epoch": 7622} {"train_loss": -28.17174095705331, "global_step": 632708, "epoch": 7622, "val_loss": 6912784.0} {"train_loss": -27.63968849182129, "global_step": 632709, "epoch": 7623} {"train_loss": -27.152936935424805, "global_step": 632710, "epoch": 7623} {"train_loss": -27.796894073486328, "global_step": 632711, "epoch": 7623} {"train_loss": -27.89729118347168, "global_step": 632712, "epoch": 7623} {"train_loss": -27.31190299987793, "global_step": 632713, "epoch": 7623} {"train_loss": -27.733259201049805, "global_step": 632714, "epoch": 7623} {"train_loss": -28.258596420288086, "global_step": 632715, "epoch": 7623} {"train_loss": -27.80645751953125, "global_step": 632716, "epoch": 7623} {"train_loss": -28.026559829711914, "global_step": 632717, "epoch": 7623} {"train_loss": -28.212018966674805, "global_step": 632718, "epoch": 7623} {"train_loss": -28.347400665283203, "global_step": 632719, "epoch": 7623} {"train_loss": -28.29047203063965, "global_step": 632720, "epoch": 7623} {"train_loss": -28.516925811767578, "global_step": 632721, "epoch": 7623} {"train_loss": -27.738210678100586, "global_step": 632722, "epoch": 7623} {"train_loss": -27.981287002563477, "global_step": 632723, "epoch": 7623} {"train_loss": -28.316434860229492, "global_step": 632724, "epoch": 7623} {"train_loss": -28.341394424438477, "global_step": 632725, "epoch": 7623} {"train_loss": -28.357030868530273, "global_step": 632726, "epoch": 7623} {"train_loss": -28.282474517822266, "global_step": 632727, "epoch": 7623} {"train_loss": -28.21525001525879, "global_step": 632728, "epoch": 7623} {"train_loss": -28.6950740814209, "global_step": 632729, "epoch": 7623} {"train_loss": -28.200546264648438, "global_step": 632730, "epoch": 7623} {"train_loss": -28.129535675048828, "global_step": 632731, "epoch": 7623} {"train_loss": -28.14606285095215, "global_step": 632732, "epoch": 7623} {"train_loss": -28.3520450592041, "global_step": 632733, "epoch": 7623} {"train_loss": -28.58479881286621, "global_step": 632734, "epoch": 7623} {"train_loss": -28.21933364868164, "global_step": 632735, "epoch": 7623} {"train_loss": -28.516748428344727, "global_step": 632736, "epoch": 7623} {"train_loss": -28.258024215698242, "global_step": 632737, "epoch": 7623} {"train_loss": -28.509113311767578, "global_step": 632738, "epoch": 7623} {"train_loss": -28.568464279174805, "global_step": 632739, "epoch": 7623} {"train_loss": -28.322195053100586, "global_step": 632740, "epoch": 7623} {"train_loss": -28.382604598999023, "global_step": 632741, "epoch": 7623} {"train_loss": -28.249359130859375, "global_step": 632742, "epoch": 7623} {"train_loss": -28.285003662109375, "global_step": 632743, "epoch": 7623} {"train_loss": -28.23244285583496, "global_step": 632744, "epoch": 7623} {"train_loss": -28.37445068359375, "global_step": 632745, "epoch": 7623} {"train_loss": -28.62282371520996, "global_step": 632746, "epoch": 7623} {"train_loss": -28.273237228393555, "global_step": 632747, "epoch": 7623} {"train_loss": -28.29682731628418, "global_step": 632748, "epoch": 7623} {"train_loss": -28.579761505126953, "global_step": 632749, "epoch": 7623} {"train_loss": -28.34026527404785, "global_step": 632750, "epoch": 7623} {"train_loss": -28.6239070892334, "global_step": 632751, "epoch": 7623} {"train_loss": -28.406661987304688, "global_step": 632752, "epoch": 7623} {"train_loss": -28.406875610351562, "global_step": 632753, "epoch": 7623} {"train_loss": -27.96170425415039, "global_step": 632754, "epoch": 7623} {"train_loss": -27.594823837280273, "global_step": 632755, "epoch": 7623} {"train_loss": -27.148874282836914, "global_step": 632756, "epoch": 7623} {"train_loss": -27.105438232421875, "global_step": 632757, "epoch": 7623} {"train_loss": -27.403661727905273, "global_step": 632758, "epoch": 7623} {"train_loss": -27.587783813476562, "global_step": 632759, "epoch": 7623} {"train_loss": -27.440576553344727, "global_step": 632760, "epoch": 7623} {"train_loss": -27.157236099243164, "global_step": 632761, "epoch": 7623} {"train_loss": -28.097143173217773, "global_step": 632762, "epoch": 7623} {"train_loss": -27.819660186767578, "global_step": 632763, "epoch": 7623} {"train_loss": -27.796524047851562, "global_step": 632764, "epoch": 7623} {"train_loss": -28.21697998046875, "global_step": 632765, "epoch": 7623} {"train_loss": -27.694305419921875, "global_step": 632766, "epoch": 7623} {"train_loss": -28.142248153686523, "global_step": 632767, "epoch": 7623} {"train_loss": -27.654022216796875, "global_step": 632768, "epoch": 7623} {"train_loss": -27.9555606842041, "global_step": 632769, "epoch": 7623} {"train_loss": -27.845687866210938, "global_step": 632770, "epoch": 7623} {"train_loss": -28.030384063720703, "global_step": 632771, "epoch": 7623} {"train_loss": -28.243467330932617, "global_step": 632772, "epoch": 7623} {"train_loss": -28.052175521850586, "global_step": 632773, "epoch": 7623} {"train_loss": -27.820632934570312, "global_step": 632774, "epoch": 7623} {"train_loss": -28.19099235534668, "global_step": 632775, "epoch": 7623} {"train_loss": -27.97625732421875, "global_step": 632776, "epoch": 7623} {"train_loss": -27.5554256439209, "global_step": 632777, "epoch": 7623} {"train_loss": -27.754419326782227, "global_step": 632778, "epoch": 7623} {"train_loss": -28.18556022644043, "global_step": 632779, "epoch": 7623} {"train_loss": -27.718351364135742, "global_step": 632780, "epoch": 7623} {"train_loss": -28.220687866210938, "global_step": 632781, "epoch": 7623} {"train_loss": -27.99544334411621, "global_step": 632782, "epoch": 7623} {"train_loss": -28.271881103515625, "global_step": 632783, "epoch": 7623} {"train_loss": -27.930347442626953, "global_step": 632784, "epoch": 7623} {"train_loss": -28.224945068359375, "global_step": 632785, "epoch": 7623} {"train_loss": -28.66449546813965, "global_step": 632786, "epoch": 7623} {"train_loss": -28.34541893005371, "global_step": 632787, "epoch": 7623} {"train_loss": -28.197345733642578, "global_step": 632788, "epoch": 7623} {"train_loss": -28.191619873046875, "global_step": 632789, "epoch": 7623} {"train_loss": -28.476953506469727, "global_step": 632790, "epoch": 7623} {"train_loss": -28.0753156593047, "global_step": 632791, "epoch": 7623, "val_loss": 6922760.0} {"train_loss": -27.99469566345215, "global_step": 632792, "epoch": 7624} {"train_loss": -27.909276962280273, "global_step": 632793, "epoch": 7624} {"train_loss": -27.60345458984375, "global_step": 632794, "epoch": 7624} {"train_loss": -27.52188491821289, "global_step": 632795, "epoch": 7624} {"train_loss": -27.92535400390625, "global_step": 632796, "epoch": 7624} {"train_loss": -27.68037223815918, "global_step": 632797, "epoch": 7624} {"train_loss": -28.160343170166016, "global_step": 632798, "epoch": 7624} {"train_loss": -27.87542724609375, "global_step": 632799, "epoch": 7624} {"train_loss": -28.2142391204834, "global_step": 632800, "epoch": 7624} {"train_loss": -28.199249267578125, "global_step": 632801, "epoch": 7624} {"train_loss": -28.05974769592285, "global_step": 632802, "epoch": 7624} {"train_loss": -28.31952476501465, "global_step": 632803, "epoch": 7624} {"train_loss": -28.261096954345703, "global_step": 632804, "epoch": 7624} {"train_loss": -28.135528564453125, "global_step": 632805, "epoch": 7624} {"train_loss": -28.430845260620117, "global_step": 632806, "epoch": 7624} {"train_loss": -27.715045928955078, "global_step": 632807, "epoch": 7624} {"train_loss": -28.073806762695312, "global_step": 632808, "epoch": 7624} {"train_loss": -28.08197593688965, "global_step": 632809, "epoch": 7624} {"train_loss": -27.917022705078125, "global_step": 632810, "epoch": 7624} {"train_loss": -28.406204223632812, "global_step": 632811, "epoch": 7624} {"train_loss": -27.639554977416992, "global_step": 632812, "epoch": 7624} {"train_loss": -28.37643814086914, "global_step": 632813, "epoch": 7624} {"train_loss": -27.823638916015625, "global_step": 632814, "epoch": 7624} {"train_loss": -28.316974639892578, "global_step": 632815, "epoch": 7624} {"train_loss": -28.08233070373535, "global_step": 632816, "epoch": 7624} {"train_loss": -28.0476131439209, "global_step": 632817, "epoch": 7624} {"train_loss": -28.340213775634766, "global_step": 632818, "epoch": 7624} {"train_loss": -27.982168197631836, "global_step": 632819, "epoch": 7624} {"train_loss": -28.15066909790039, "global_step": 632820, "epoch": 7624} {"train_loss": -28.12265968322754, "global_step": 632821, "epoch": 7624} {"train_loss": -28.187122344970703, "global_step": 632822, "epoch": 7624} {"train_loss": -28.14801597595215, "global_step": 632823, "epoch": 7624} {"train_loss": -28.162036895751953, "global_step": 632824, "epoch": 7624} {"train_loss": -28.51914405822754, "global_step": 632825, "epoch": 7624} {"train_loss": -28.09466552734375, "global_step": 632826, "epoch": 7624} {"train_loss": -28.380216598510742, "global_step": 632827, "epoch": 7624} {"train_loss": -28.29547119140625, "global_step": 632828, "epoch": 7624} {"train_loss": -27.935352325439453, "global_step": 632829, "epoch": 7624} {"train_loss": -28.449438095092773, "global_step": 632830, "epoch": 7624} {"train_loss": -28.319278717041016, "global_step": 632831, "epoch": 7624} {"train_loss": -28.511518478393555, "global_step": 632832, "epoch": 7624} {"train_loss": -28.20102882385254, "global_step": 632833, "epoch": 7624} {"train_loss": -28.161855697631836, "global_step": 632834, "epoch": 7624} {"train_loss": -28.125751495361328, "global_step": 632835, "epoch": 7624} {"train_loss": -28.32948112487793, "global_step": 632836, "epoch": 7624} {"train_loss": -28.525558471679688, "global_step": 632837, "epoch": 7624} {"train_loss": -28.360586166381836, "global_step": 632838, "epoch": 7624} {"train_loss": -28.543598175048828, "global_step": 632839, "epoch": 7624} {"train_loss": -27.992477416992188, "global_step": 632840, "epoch": 7624} {"train_loss": -28.071430206298828, "global_step": 632841, "epoch": 7624} {"train_loss": -28.35980224609375, "global_step": 632842, "epoch": 7624} {"train_loss": -28.11554527282715, "global_step": 632843, "epoch": 7624} {"train_loss": -28.126855850219727, "global_step": 632844, "epoch": 7624} {"train_loss": -28.006772994995117, "global_step": 632845, "epoch": 7624} {"train_loss": -27.70847511291504, "global_step": 632846, "epoch": 7624} {"train_loss": -28.415695190429688, "global_step": 632847, "epoch": 7624} {"train_loss": -28.43400001525879, "global_step": 632848, "epoch": 7624} {"train_loss": -28.629291534423828, "global_step": 632849, "epoch": 7624} {"train_loss": -28.148727416992188, "global_step": 632850, "epoch": 7624} {"train_loss": -28.009403228759766, "global_step": 632851, "epoch": 7624} {"train_loss": -28.194610595703125, "global_step": 632852, "epoch": 7624} {"train_loss": -27.992034912109375, "global_step": 632853, "epoch": 7624} {"train_loss": -28.44021987915039, "global_step": 632854, "epoch": 7624} {"train_loss": -28.350711822509766, "global_step": 632855, "epoch": 7624} {"train_loss": -28.27552604675293, "global_step": 632856, "epoch": 7624} {"train_loss": -27.936437606811523, "global_step": 632857, "epoch": 7624} {"train_loss": -27.840246200561523, "global_step": 632858, "epoch": 7624} {"train_loss": -28.271728515625, "global_step": 632859, "epoch": 7624} {"train_loss": -28.144092559814453, "global_step": 632860, "epoch": 7624} {"train_loss": -27.641799926757812, "global_step": 632861, "epoch": 7624} {"train_loss": -27.73224449157715, "global_step": 632862, "epoch": 7624} {"train_loss": -27.929397583007812, "global_step": 632863, "epoch": 7624} {"train_loss": -28.211414337158203, "global_step": 632864, "epoch": 7624} {"train_loss": -28.1458683013916, "global_step": 632865, "epoch": 7624} {"train_loss": -28.1394100189209, "global_step": 632866, "epoch": 7624} {"train_loss": -27.979215621948242, "global_step": 632867, "epoch": 7624} {"train_loss": -28.09747314453125, "global_step": 632868, "epoch": 7624} {"train_loss": -28.219989776611328, "global_step": 632869, "epoch": 7624} {"train_loss": -28.453012466430664, "global_step": 632870, "epoch": 7624} {"train_loss": -28.131244659423828, "global_step": 632871, "epoch": 7624} {"train_loss": -28.320758819580078, "global_step": 632872, "epoch": 7624} {"train_loss": -28.297712326049805, "global_step": 632873, "epoch": 7624} {"train_loss": -28.1564889930817, "global_step": 632874, "epoch": 7624, "val_loss": 6958536.5} {"train_loss": -27.912551879882812, "global_step": 632875, "epoch": 7625} {"train_loss": -28.121347427368164, "global_step": 632876, "epoch": 7625} {"train_loss": -28.060821533203125, "global_step": 632877, "epoch": 7625} {"train_loss": -28.08732032775879, "global_step": 632878, "epoch": 7625} {"train_loss": -28.028818130493164, "global_step": 632879, "epoch": 7625} {"train_loss": -27.8387508392334, "global_step": 632880, "epoch": 7625} {"train_loss": -27.90520668029785, "global_step": 632881, "epoch": 7625} {"train_loss": -27.723493576049805, "global_step": 632882, "epoch": 7625} {"train_loss": -28.147415161132812, "global_step": 632883, "epoch": 7625} {"train_loss": -27.91004753112793, "global_step": 632884, "epoch": 7625} {"train_loss": -28.31915855407715, "global_step": 632885, "epoch": 7625} {"train_loss": -28.439666748046875, "global_step": 632886, "epoch": 7625} {"train_loss": -28.147123336791992, "global_step": 632887, "epoch": 7625} {"train_loss": -27.915485382080078, "global_step": 632888, "epoch": 7625} {"train_loss": -28.095258712768555, "global_step": 632889, "epoch": 7625} {"train_loss": -27.65504264831543, "global_step": 632890, "epoch": 7625} {"train_loss": -28.164539337158203, "global_step": 632891, "epoch": 7625} {"train_loss": -28.282255172729492, "global_step": 632892, "epoch": 7625} {"train_loss": -27.91383171081543, "global_step": 632893, "epoch": 7625} {"train_loss": -28.35774803161621, "global_step": 632894, "epoch": 7625} {"train_loss": -28.124359130859375, "global_step": 632895, "epoch": 7625} {"train_loss": -28.545902252197266, "global_step": 632896, "epoch": 7625} {"train_loss": -28.24407958984375, "global_step": 632897, "epoch": 7625} {"train_loss": -28.484094619750977, "global_step": 632898, "epoch": 7625} {"train_loss": -28.140655517578125, "global_step": 632899, "epoch": 7625} {"train_loss": -28.376575469970703, "global_step": 632900, "epoch": 7625} {"train_loss": -28.484228134155273, "global_step": 632901, "epoch": 7625} {"train_loss": -28.189716339111328, "global_step": 632902, "epoch": 7625} {"train_loss": -28.129560470581055, "global_step": 632903, "epoch": 7625} {"train_loss": -28.615737915039062, "global_step": 632904, "epoch": 7625} {"train_loss": -28.406538009643555, "global_step": 632905, "epoch": 7625} {"train_loss": -27.977807998657227, "global_step": 632906, "epoch": 7625} {"train_loss": -27.977344512939453, "global_step": 632907, "epoch": 7625} {"train_loss": -28.187875747680664, "global_step": 632908, "epoch": 7625} {"train_loss": -28.0537166595459, "global_step": 632909, "epoch": 7625} {"train_loss": -28.024738311767578, "global_step": 632910, "epoch": 7625} {"train_loss": -27.823505401611328, "global_step": 632911, "epoch": 7625} {"train_loss": -27.648969650268555, "global_step": 632912, "epoch": 7625} {"train_loss": -27.3363094329834, "global_step": 632913, "epoch": 7625} {"train_loss": -28.05641746520996, "global_step": 632914, "epoch": 7625} {"train_loss": -28.522363662719727, "global_step": 632915, "epoch": 7625} {"train_loss": -27.70950698852539, "global_step": 632916, "epoch": 7625} {"train_loss": -28.183942794799805, "global_step": 632917, "epoch": 7625} {"train_loss": -27.9544620513916, "global_step": 632918, "epoch": 7625} {"train_loss": -27.293731689453125, "global_step": 632919, "epoch": 7625} {"train_loss": -28.236133575439453, "global_step": 632920, "epoch": 7625} {"train_loss": -27.07390785217285, "global_step": 632921, "epoch": 7625} {"train_loss": -27.40821647644043, "global_step": 632922, "epoch": 7625} {"train_loss": -27.424884796142578, "global_step": 632923, "epoch": 7625} {"train_loss": -28.50031089782715, "global_step": 632924, "epoch": 7625} {"train_loss": -27.621185302734375, "global_step": 632925, "epoch": 7625} {"train_loss": -28.1228084564209, "global_step": 632926, "epoch": 7625} {"train_loss": -28.1746883392334, "global_step": 632927, "epoch": 7625} {"train_loss": -27.899810791015625, "global_step": 632928, "epoch": 7625} {"train_loss": -28.067655563354492, "global_step": 632929, "epoch": 7625} {"train_loss": -28.323108673095703, "global_step": 632930, "epoch": 7625} {"train_loss": -28.34608268737793, "global_step": 632931, "epoch": 7625} {"train_loss": -28.182437896728516, "global_step": 632932, "epoch": 7625} {"train_loss": -27.706571578979492, "global_step": 632933, "epoch": 7625} {"train_loss": -27.951868057250977, "global_step": 632934, "epoch": 7625} {"train_loss": -28.074127197265625, "global_step": 632935, "epoch": 7625} {"train_loss": -28.286428451538086, "global_step": 632936, "epoch": 7625} {"train_loss": -27.832548141479492, "global_step": 632937, "epoch": 7625} {"train_loss": -28.022876739501953, "global_step": 632938, "epoch": 7625} {"train_loss": -27.939008712768555, "global_step": 632939, "epoch": 7625} {"train_loss": -28.2794189453125, "global_step": 632940, "epoch": 7625} {"train_loss": -28.082366943359375, "global_step": 632941, "epoch": 7625} {"train_loss": -28.242401123046875, "global_step": 632942, "epoch": 7625} {"train_loss": -28.3587703704834, "global_step": 632943, "epoch": 7625} {"train_loss": -28.12686538696289, "global_step": 632944, "epoch": 7625} {"train_loss": -28.234262466430664, "global_step": 632945, "epoch": 7625} {"train_loss": -28.04450798034668, "global_step": 632946, "epoch": 7625} {"train_loss": -28.45547866821289, "global_step": 632947, "epoch": 7625} {"train_loss": -28.455846786499023, "global_step": 632948, "epoch": 7625} {"train_loss": -28.1379337310791, "global_step": 632949, "epoch": 7625} {"train_loss": -28.520483016967773, "global_step": 632950, "epoch": 7625} {"train_loss": -28.643173217773438, "global_step": 632951, "epoch": 7625} {"train_loss": -28.284021377563477, "global_step": 632952, "epoch": 7625} {"train_loss": -28.418073654174805, "global_step": 632953, "epoch": 7625} {"train_loss": -28.429529190063477, "global_step": 632954, "epoch": 7625} {"train_loss": -28.19681167602539, "global_step": 632955, "epoch": 7625} {"train_loss": -28.51422119140625, "global_step": 632956, "epoch": 7625} {"train_loss": -28.12030316548175, "global_step": 632957, "epoch": 7625, "val_loss": 6893579.0} {"train_loss": -27.679956436157227, "global_step": 632958, "epoch": 7626} {"train_loss": -27.742156982421875, "global_step": 632959, "epoch": 7626} {"train_loss": -27.93402099609375, "global_step": 632960, "epoch": 7626} {"train_loss": -28.41611671447754, "global_step": 632961, "epoch": 7626} {"train_loss": -28.361845016479492, "global_step": 632962, "epoch": 7626} {"train_loss": -27.935407638549805, "global_step": 632963, "epoch": 7626} {"train_loss": -28.331195831298828, "global_step": 632964, "epoch": 7626} {"train_loss": -28.2935848236084, "global_step": 632965, "epoch": 7626} {"train_loss": -28.093046188354492, "global_step": 632966, "epoch": 7626} {"train_loss": -28.29036521911621, "global_step": 632967, "epoch": 7626} {"train_loss": -28.08759880065918, "global_step": 632968, "epoch": 7626} {"train_loss": -28.243040084838867, "global_step": 632969, "epoch": 7626} {"train_loss": -28.07989501953125, "global_step": 632970, "epoch": 7626} {"train_loss": -28.129011154174805, "global_step": 632971, "epoch": 7626} {"train_loss": -28.357696533203125, "global_step": 632972, "epoch": 7626} {"train_loss": -28.124601364135742, "global_step": 632973, "epoch": 7626} {"train_loss": -27.626312255859375, "global_step": 632974, "epoch": 7626} {"train_loss": -28.081815719604492, "global_step": 632975, "epoch": 7626} {"train_loss": -28.733739852905273, "global_step": 632976, "epoch": 7626} {"train_loss": -27.949533462524414, "global_step": 632977, "epoch": 7626} {"train_loss": -28.099756240844727, "global_step": 632978, "epoch": 7626} {"train_loss": -28.922901153564453, "global_step": 632979, "epoch": 7626} {"train_loss": -28.184814453125, "global_step": 632980, "epoch": 7626} {"train_loss": -27.99305534362793, "global_step": 632981, "epoch": 7626} {"train_loss": -28.23441505432129, "global_step": 632982, "epoch": 7626} {"train_loss": -28.403757095336914, "global_step": 632983, "epoch": 7626} {"train_loss": -28.138269424438477, "global_step": 632984, "epoch": 7626} {"train_loss": -28.404834747314453, "global_step": 632985, "epoch": 7626} {"train_loss": -28.333463668823242, "global_step": 632986, "epoch": 7626} {"train_loss": -27.823957443237305, "global_step": 632987, "epoch": 7626} {"train_loss": -27.902868270874023, "global_step": 632988, "epoch": 7626} {"train_loss": -28.170026779174805, "global_step": 632989, "epoch": 7626} {"train_loss": -28.1010799407959, "global_step": 632990, "epoch": 7626} {"train_loss": -28.164453506469727, "global_step": 632991, "epoch": 7626} {"train_loss": -27.569379806518555, "global_step": 632992, "epoch": 7626} {"train_loss": -28.362350463867188, "global_step": 632993, "epoch": 7626} {"train_loss": -27.658658981323242, "global_step": 632994, "epoch": 7626} {"train_loss": -27.998701095581055, "global_step": 632995, "epoch": 7626} {"train_loss": -27.95556640625, "global_step": 632996, "epoch": 7626} {"train_loss": -28.120319366455078, "global_step": 632997, "epoch": 7626} {"train_loss": -27.893964767456055, "global_step": 632998, "epoch": 7626} {"train_loss": -28.41786003112793, "global_step": 632999, "epoch": 7626} {"train_loss": -28.444910049438477, "global_step": 633000, "epoch": 7626} {"train_loss": -27.88886070251465, "global_step": 633001, "epoch": 7626} {"train_loss": -28.065906524658203, "global_step": 633002, "epoch": 7626} {"train_loss": -28.2669734954834, "global_step": 633003, "epoch": 7626} {"train_loss": -28.07546043395996, "global_step": 633004, "epoch": 7626} {"train_loss": -28.31354331970215, "global_step": 633005, "epoch": 7626} {"train_loss": -28.66552734375, "global_step": 633006, "epoch": 7626} {"train_loss": -28.564971923828125, "global_step": 633007, "epoch": 7626} {"train_loss": -28.16986083984375, "global_step": 633008, "epoch": 7626} {"train_loss": -28.280597686767578, "global_step": 633009, "epoch": 7626} {"train_loss": -28.76055908203125, "global_step": 633010, "epoch": 7626} {"train_loss": -28.356449127197266, "global_step": 633011, "epoch": 7626} {"train_loss": -28.243722915649414, "global_step": 633012, "epoch": 7626} {"train_loss": -28.327198028564453, "global_step": 633013, "epoch": 7626} {"train_loss": -28.315073013305664, "global_step": 633014, "epoch": 7626} {"train_loss": -28.329160690307617, "global_step": 633015, "epoch": 7626} {"train_loss": -28.19683265686035, "global_step": 633016, "epoch": 7626} {"train_loss": -28.175048828125, "global_step": 633017, "epoch": 7626} {"train_loss": -28.32553482055664, "global_step": 633018, "epoch": 7626} {"train_loss": -28.183408737182617, "global_step": 633019, "epoch": 7626} {"train_loss": -28.438465118408203, "global_step": 633020, "epoch": 7626} {"train_loss": -28.05816078186035, "global_step": 633021, "epoch": 7626} {"train_loss": -28.0955753326416, "global_step": 633022, "epoch": 7626} {"train_loss": -28.187341690063477, "global_step": 633023, "epoch": 7626} {"train_loss": -27.90887451171875, "global_step": 633024, "epoch": 7626} {"train_loss": -28.42339515686035, "global_step": 633025, "epoch": 7626} {"train_loss": -28.758142471313477, "global_step": 633026, "epoch": 7626} {"train_loss": -28.647815704345703, "global_step": 633027, "epoch": 7626} {"train_loss": -28.262287139892578, "global_step": 633028, "epoch": 7626} {"train_loss": -28.35108757019043, "global_step": 633029, "epoch": 7626} {"train_loss": -28.324682235717773, "global_step": 633030, "epoch": 7626} {"train_loss": -28.3743839263916, "global_step": 633031, "epoch": 7626} {"train_loss": -28.508869171142578, "global_step": 633032, "epoch": 7626} {"train_loss": -28.25471305847168, "global_step": 633033, "epoch": 7626} {"train_loss": -28.508398056030273, "global_step": 633034, "epoch": 7626} {"train_loss": -28.089923858642578, "global_step": 633035, "epoch": 7626} {"train_loss": -28.688562393188477, "global_step": 633036, "epoch": 7626} {"train_loss": -28.38832664489746, "global_step": 633037, "epoch": 7626} {"train_loss": -28.030099868774414, "global_step": 633038, "epoch": 7626} {"train_loss": -28.537372589111328, "global_step": 633039, "epoch": 7626} {"train_loss": -28.217214745211315, "global_step": 633040, "epoch": 7626, "val_loss": 6876136.0} {"train_loss": -27.41813087463379, "global_step": 633041, "epoch": 7627} {"train_loss": -26.94586181640625, "global_step": 633042, "epoch": 7627} {"train_loss": -26.525609970092773, "global_step": 633043, "epoch": 7627} {"train_loss": -26.6165828704834, "global_step": 633044, "epoch": 7627} {"train_loss": -27.68328857421875, "global_step": 633045, "epoch": 7627} {"train_loss": -26.993122100830078, "global_step": 633046, "epoch": 7627} {"train_loss": -27.30868911743164, "global_step": 633047, "epoch": 7627} {"train_loss": -27.307382583618164, "global_step": 633048, "epoch": 7627} {"train_loss": -26.966617584228516, "global_step": 633049, "epoch": 7627} {"train_loss": -27.43985366821289, "global_step": 633050, "epoch": 7627} {"train_loss": -27.886554718017578, "global_step": 633051, "epoch": 7627} {"train_loss": -27.517608642578125, "global_step": 633052, "epoch": 7627} {"train_loss": -27.961166381835938, "global_step": 633053, "epoch": 7627} {"train_loss": -27.046003341674805, "global_step": 633054, "epoch": 7627} {"train_loss": -27.715871810913086, "global_step": 633055, "epoch": 7627} {"train_loss": -27.634443283081055, "global_step": 633056, "epoch": 7627} {"train_loss": -27.68790054321289, "global_step": 633057, "epoch": 7627} {"train_loss": -27.555313110351562, "global_step": 633058, "epoch": 7627} {"train_loss": -27.75225830078125, "global_step": 633059, "epoch": 7627} {"train_loss": -27.579456329345703, "global_step": 633060, "epoch": 7627} {"train_loss": -27.96461296081543, "global_step": 633061, "epoch": 7627} {"train_loss": -27.492033004760742, "global_step": 633062, "epoch": 7627} {"train_loss": -27.830846786499023, "global_step": 633063, "epoch": 7627} {"train_loss": -28.308069229125977, "global_step": 633064, "epoch": 7627} {"train_loss": -28.162023544311523, "global_step": 633065, "epoch": 7627} {"train_loss": -28.333271026611328, "global_step": 633066, "epoch": 7627} {"train_loss": -27.58270263671875, "global_step": 633067, "epoch": 7627} {"train_loss": -28.135955810546875, "global_step": 633068, "epoch": 7627} {"train_loss": -27.69156265258789, "global_step": 633069, "epoch": 7627} {"train_loss": -28.07868766784668, "global_step": 633070, "epoch": 7627} {"train_loss": -27.95692253112793, "global_step": 633071, "epoch": 7627} {"train_loss": -28.261035919189453, "global_step": 633072, "epoch": 7627} {"train_loss": -28.154027938842773, "global_step": 633073, "epoch": 7627} {"train_loss": -27.90238380432129, "global_step": 633074, "epoch": 7627} {"train_loss": -27.86683464050293, "global_step": 633075, "epoch": 7627} {"train_loss": -27.69516944885254, "global_step": 633076, "epoch": 7627} {"train_loss": -28.0218448638916, "global_step": 633077, "epoch": 7627} {"train_loss": -27.634735107421875, "global_step": 633078, "epoch": 7627} {"train_loss": -28.043792724609375, "global_step": 633079, "epoch": 7627} {"train_loss": -28.217084884643555, "global_step": 633080, "epoch": 7627} {"train_loss": -27.785398483276367, "global_step": 633081, "epoch": 7627} {"train_loss": -28.188425064086914, "global_step": 633082, "epoch": 7627} {"train_loss": -27.974119186401367, "global_step": 633083, "epoch": 7627} {"train_loss": -27.944547653198242, "global_step": 633084, "epoch": 7627} {"train_loss": -28.169574737548828, "global_step": 633085, "epoch": 7627} {"train_loss": -28.227563858032227, "global_step": 633086, "epoch": 7627} {"train_loss": -28.71451759338379, "global_step": 633087, "epoch": 7627} {"train_loss": -28.320398330688477, "global_step": 633088, "epoch": 7627} {"train_loss": -28.29376220703125, "global_step": 633089, "epoch": 7627} {"train_loss": -28.35699462890625, "global_step": 633090, "epoch": 7627} {"train_loss": -28.12161636352539, "global_step": 633091, "epoch": 7627} {"train_loss": -28.445581436157227, "global_step": 633092, "epoch": 7627} {"train_loss": -28.506872177124023, "global_step": 633093, "epoch": 7627} {"train_loss": -28.275644302368164, "global_step": 633094, "epoch": 7627} {"train_loss": -28.345243453979492, "global_step": 633095, "epoch": 7627} {"train_loss": -28.28081703186035, "global_step": 633096, "epoch": 7627} {"train_loss": -28.27715492248535, "global_step": 633097, "epoch": 7627} {"train_loss": -28.583084106445312, "global_step": 633098, "epoch": 7627} {"train_loss": -28.254337310791016, "global_step": 633099, "epoch": 7627} {"train_loss": -28.266977310180664, "global_step": 633100, "epoch": 7627} {"train_loss": -28.280567169189453, "global_step": 633101, "epoch": 7627} {"train_loss": -28.329822540283203, "global_step": 633102, "epoch": 7627} {"train_loss": -28.095050811767578, "global_step": 633103, "epoch": 7627} {"train_loss": -28.373315811157227, "global_step": 633104, "epoch": 7627} {"train_loss": -28.34894371032715, "global_step": 633105, "epoch": 7627} {"train_loss": -28.432098388671875, "global_step": 633106, "epoch": 7627} {"train_loss": -28.6361026763916, "global_step": 633107, "epoch": 7627} {"train_loss": -27.988248825073242, "global_step": 633108, "epoch": 7627} {"train_loss": -28.36606788635254, "global_step": 633109, "epoch": 7627} {"train_loss": -28.516895294189453, "global_step": 633110, "epoch": 7627} {"train_loss": -28.53793716430664, "global_step": 633111, "epoch": 7627} {"train_loss": -28.44317054748535, "global_step": 633112, "epoch": 7627} {"train_loss": -28.5390682220459, "global_step": 633113, "epoch": 7627} {"train_loss": -28.83279800415039, "global_step": 633114, "epoch": 7627} {"train_loss": -28.27976417541504, "global_step": 633115, "epoch": 7627} {"train_loss": -28.30348777770996, "global_step": 633116, "epoch": 7627} {"train_loss": -28.462848663330078, "global_step": 633117, "epoch": 7627} {"train_loss": -28.31464958190918, "global_step": 633118, "epoch": 7627} {"train_loss": -28.591949462890625, "global_step": 633119, "epoch": 7627} {"train_loss": -28.225088119506836, "global_step": 633120, "epoch": 7627} {"train_loss": -28.1414794921875, "global_step": 633121, "epoch": 7627} {"train_loss": -28.555438995361328, "global_step": 633122, "epoch": 7627} {"train_loss": -28.005894603499446, "global_step": 633123, "epoch": 7627, "val_loss": 6887760.0} {"train_loss": -28.36087417602539, "global_step": 633124, "epoch": 7628} {"train_loss": -27.49348258972168, "global_step": 633125, "epoch": 7628} {"train_loss": -27.5987606048584, "global_step": 633126, "epoch": 7628} {"train_loss": -27.94864273071289, "global_step": 633127, "epoch": 7628} {"train_loss": -27.954975128173828, "global_step": 633128, "epoch": 7628} {"train_loss": -27.2247257232666, "global_step": 633129, "epoch": 7628} {"train_loss": -27.630115509033203, "global_step": 633130, "epoch": 7628} {"train_loss": -27.416706085205078, "global_step": 633131, "epoch": 7628} {"train_loss": -27.96750259399414, "global_step": 633132, "epoch": 7628} {"train_loss": -27.969329833984375, "global_step": 633133, "epoch": 7628} {"train_loss": -27.855920791625977, "global_step": 633134, "epoch": 7628} {"train_loss": -27.68507194519043, "global_step": 633135, "epoch": 7628} {"train_loss": -27.49652099609375, "global_step": 633136, "epoch": 7628} {"train_loss": -27.880273818969727, "global_step": 633137, "epoch": 7628} {"train_loss": -27.56794548034668, "global_step": 633138, "epoch": 7628} {"train_loss": -28.378767013549805, "global_step": 633139, "epoch": 7628} {"train_loss": -27.80079460144043, "global_step": 633140, "epoch": 7628} {"train_loss": -28.02542495727539, "global_step": 633141, "epoch": 7628} {"train_loss": -27.775299072265625, "global_step": 633142, "epoch": 7628} {"train_loss": -27.90675163269043, "global_step": 633143, "epoch": 7628} {"train_loss": -27.651992797851562, "global_step": 633144, "epoch": 7628} {"train_loss": -27.930505752563477, "global_step": 633145, "epoch": 7628} {"train_loss": -27.986896514892578, "global_step": 633146, "epoch": 7628} {"train_loss": -27.963586807250977, "global_step": 633147, "epoch": 7628} {"train_loss": -28.049909591674805, "global_step": 633148, "epoch": 7628} {"train_loss": -28.11984634399414, "global_step": 633149, "epoch": 7628} {"train_loss": -28.38319206237793, "global_step": 633150, "epoch": 7628} {"train_loss": -27.632110595703125, "global_step": 633151, "epoch": 7628} {"train_loss": -28.083723068237305, "global_step": 633152, "epoch": 7628} {"train_loss": -28.05925941467285, "global_step": 633153, "epoch": 7628} {"train_loss": -28.152179718017578, "global_step": 633154, "epoch": 7628} {"train_loss": -28.28972816467285, "global_step": 633155, "epoch": 7628} {"train_loss": -28.013736724853516, "global_step": 633156, "epoch": 7628} {"train_loss": -28.031919479370117, "global_step": 633157, "epoch": 7628} {"train_loss": -28.119115829467773, "global_step": 633158, "epoch": 7628} {"train_loss": -28.157812118530273, "global_step": 633159, "epoch": 7628} {"train_loss": -28.362646102905273, "global_step": 633160, "epoch": 7628} {"train_loss": -27.915699005126953, "global_step": 633161, "epoch": 7628} {"train_loss": -28.248056411743164, "global_step": 633162, "epoch": 7628} {"train_loss": -28.362777709960938, "global_step": 633163, "epoch": 7628} {"train_loss": -28.136228561401367, "global_step": 633164, "epoch": 7628} {"train_loss": -28.10468101501465, "global_step": 633165, "epoch": 7628} {"train_loss": -28.0150203704834, "global_step": 633166, "epoch": 7628} {"train_loss": -28.294036865234375, "global_step": 633167, "epoch": 7628} {"train_loss": -27.88437271118164, "global_step": 633168, "epoch": 7628} {"train_loss": -28.458654403686523, "global_step": 633169, "epoch": 7628} {"train_loss": -28.191436767578125, "global_step": 633170, "epoch": 7628} {"train_loss": -28.39072608947754, "global_step": 633171, "epoch": 7628} {"train_loss": -28.10664176940918, "global_step": 633172, "epoch": 7628} {"train_loss": -28.341400146484375, "global_step": 633173, "epoch": 7628} {"train_loss": -28.092084884643555, "global_step": 633174, "epoch": 7628} {"train_loss": -28.271804809570312, "global_step": 633175, "epoch": 7628} {"train_loss": -28.442951202392578, "global_step": 633176, "epoch": 7628} {"train_loss": -28.53826332092285, "global_step": 633177, "epoch": 7628} {"train_loss": -28.28175163269043, "global_step": 633178, "epoch": 7628} {"train_loss": -28.142547607421875, "global_step": 633179, "epoch": 7628} {"train_loss": -28.4376163482666, "global_step": 633180, "epoch": 7628} {"train_loss": -28.352502822875977, "global_step": 633181, "epoch": 7628} {"train_loss": -28.650083541870117, "global_step": 633182, "epoch": 7628} {"train_loss": -28.4160213470459, "global_step": 633183, "epoch": 7628} {"train_loss": -28.564884185791016, "global_step": 633184, "epoch": 7628} {"train_loss": -28.593839645385742, "global_step": 633185, "epoch": 7628} {"train_loss": -28.565210342407227, "global_step": 633186, "epoch": 7628} {"train_loss": -28.416584014892578, "global_step": 633187, "epoch": 7628} {"train_loss": -28.72190284729004, "global_step": 633188, "epoch": 7628} {"train_loss": -28.4768009185791, "global_step": 633189, "epoch": 7628} {"train_loss": -28.588825225830078, "global_step": 633190, "epoch": 7628} {"train_loss": -28.264652252197266, "global_step": 633191, "epoch": 7628} {"train_loss": -28.80903434753418, "global_step": 633192, "epoch": 7628} {"train_loss": -28.43060874938965, "global_step": 633193, "epoch": 7628} {"train_loss": -28.16605567932129, "global_step": 633194, "epoch": 7628} {"train_loss": -28.22983169555664, "global_step": 633195, "epoch": 7628} {"train_loss": -28.543060302734375, "global_step": 633196, "epoch": 7628} {"train_loss": -28.363866806030273, "global_step": 633197, "epoch": 7628} {"train_loss": -28.32196617126465, "global_step": 633198, "epoch": 7628} {"train_loss": -28.14899253845215, "global_step": 633199, "epoch": 7628} {"train_loss": -28.48011589050293, "global_step": 633200, "epoch": 7628} {"train_loss": -28.581098556518555, "global_step": 633201, "epoch": 7628} {"train_loss": -28.193159103393555, "global_step": 633202, "epoch": 7628} {"train_loss": -27.7410831451416, "global_step": 633203, "epoch": 7628} {"train_loss": -28.241079330444336, "global_step": 633204, "epoch": 7628} {"train_loss": -27.831161499023438, "global_step": 633205, "epoch": 7628} {"train_loss": -28.13618204967085, "global_step": 633206, "epoch": 7628, "val_loss": 6902224.0} {"train_loss": -26.549163818359375, "global_step": 633207, "epoch": 7629} {"train_loss": -26.71297264099121, "global_step": 633208, "epoch": 7629} {"train_loss": -24.83807945251465, "global_step": 633209, "epoch": 7629} {"train_loss": -25.381315231323242, "global_step": 633210, "epoch": 7629} {"train_loss": -25.859872817993164, "global_step": 633211, "epoch": 7629} {"train_loss": -26.530237197875977, "global_step": 633212, "epoch": 7629} {"train_loss": -26.77808952331543, "global_step": 633213, "epoch": 7629} {"train_loss": -27.234363555908203, "global_step": 633214, "epoch": 7629} {"train_loss": -26.912954330444336, "global_step": 633215, "epoch": 7629} {"train_loss": -27.202123641967773, "global_step": 633216, "epoch": 7629} {"train_loss": -27.547651290893555, "global_step": 633217, "epoch": 7629} {"train_loss": -27.040613174438477, "global_step": 633218, "epoch": 7629} {"train_loss": -27.31007957458496, "global_step": 633219, "epoch": 7629} {"train_loss": -27.254730224609375, "global_step": 633220, "epoch": 7629} {"train_loss": -27.59100914001465, "global_step": 633221, "epoch": 7629} {"train_loss": -26.83942985534668, "global_step": 633222, "epoch": 7629} {"train_loss": -27.009967803955078, "global_step": 633223, "epoch": 7629} {"train_loss": -27.59208106994629, "global_step": 633224, "epoch": 7629} {"train_loss": -27.362775802612305, "global_step": 633225, "epoch": 7629} {"train_loss": -27.211698532104492, "global_step": 633226, "epoch": 7629} {"train_loss": -27.571552276611328, "global_step": 633227, "epoch": 7629} {"train_loss": -27.9727725982666, "global_step": 633228, "epoch": 7629} {"train_loss": -27.726404190063477, "global_step": 633229, "epoch": 7629} {"train_loss": -27.600805282592773, "global_step": 633230, "epoch": 7629} {"train_loss": -27.664621353149414, "global_step": 633231, "epoch": 7629} {"train_loss": -27.550214767456055, "global_step": 633232, "epoch": 7629} {"train_loss": -27.86713981628418, "global_step": 633233, "epoch": 7629} {"train_loss": -28.03101921081543, "global_step": 633234, "epoch": 7629} {"train_loss": -27.602285385131836, "global_step": 633235, "epoch": 7629} {"train_loss": -28.287214279174805, "global_step": 633236, "epoch": 7629} {"train_loss": -27.750396728515625, "global_step": 633237, "epoch": 7629} {"train_loss": -28.01641845703125, "global_step": 633238, "epoch": 7629} {"train_loss": -28.11704444885254, "global_step": 633239, "epoch": 7629} {"train_loss": -28.106958389282227, "global_step": 633240, "epoch": 7629} {"train_loss": -27.995532989501953, "global_step": 633241, "epoch": 7629} {"train_loss": -28.00897216796875, "global_step": 633242, "epoch": 7629} {"train_loss": -27.521453857421875, "global_step": 633243, "epoch": 7629} {"train_loss": -28.384241104125977, "global_step": 633244, "epoch": 7629} {"train_loss": -27.928375244140625, "global_step": 633245, "epoch": 7629} {"train_loss": -27.981903076171875, "global_step": 633246, "epoch": 7629} {"train_loss": -28.085494995117188, "global_step": 633247, "epoch": 7629} {"train_loss": -28.071760177612305, "global_step": 633248, "epoch": 7629} {"train_loss": -28.447998046875, "global_step": 633249, "epoch": 7629} {"train_loss": -28.252429962158203, "global_step": 633250, "epoch": 7629} {"train_loss": -27.893783569335938, "global_step": 633251, "epoch": 7629} {"train_loss": -28.31672477722168, "global_step": 633252, "epoch": 7629} {"train_loss": -28.499542236328125, "global_step": 633253, "epoch": 7629} {"train_loss": -28.32415771484375, "global_step": 633254, "epoch": 7629} {"train_loss": -28.50714111328125, "global_step": 633255, "epoch": 7629} {"train_loss": -28.11832618713379, "global_step": 633256, "epoch": 7629} {"train_loss": -28.247655868530273, "global_step": 633257, "epoch": 7629} {"train_loss": -28.21974754333496, "global_step": 633258, "epoch": 7629} {"train_loss": -28.0850772857666, "global_step": 633259, "epoch": 7629} {"train_loss": -28.050235748291016, "global_step": 633260, "epoch": 7629} {"train_loss": -28.077306747436523, "global_step": 633261, "epoch": 7629} {"train_loss": -28.236968994140625, "global_step": 633262, "epoch": 7629} {"train_loss": -28.46897315979004, "global_step": 633263, "epoch": 7629} {"train_loss": -28.115819931030273, "global_step": 633264, "epoch": 7629} {"train_loss": -28.38709831237793, "global_step": 633265, "epoch": 7629} {"train_loss": -28.10805320739746, "global_step": 633266, "epoch": 7629} {"train_loss": -28.5616397857666, "global_step": 633267, "epoch": 7629} {"train_loss": -28.48390007019043, "global_step": 633268, "epoch": 7629} {"train_loss": -28.26337242126465, "global_step": 633269, "epoch": 7629} {"train_loss": -28.255773544311523, "global_step": 633270, "epoch": 7629} {"train_loss": -28.171833038330078, "global_step": 633271, "epoch": 7629} {"train_loss": -28.59804344177246, "global_step": 633272, "epoch": 7629} {"train_loss": -28.210004806518555, "global_step": 633273, "epoch": 7629} {"train_loss": -28.136600494384766, "global_step": 633274, "epoch": 7629} {"train_loss": -28.34452247619629, "global_step": 633275, "epoch": 7629} {"train_loss": -28.247364044189453, "global_step": 633276, "epoch": 7629} {"train_loss": -28.414310455322266, "global_step": 633277, "epoch": 7629} {"train_loss": -28.437198638916016, "global_step": 633278, "epoch": 7629} {"train_loss": -28.695621490478516, "global_step": 633279, "epoch": 7629} {"train_loss": -28.275970458984375, "global_step": 633280, "epoch": 7629} {"train_loss": -28.31975746154785, "global_step": 633281, "epoch": 7629} {"train_loss": -28.614093780517578, "global_step": 633282, "epoch": 7629} {"train_loss": -28.32191276550293, "global_step": 633283, "epoch": 7629} {"train_loss": -28.618722915649414, "global_step": 633284, "epoch": 7629} {"train_loss": -28.200769424438477, "global_step": 633285, "epoch": 7629} {"train_loss": -28.78605079650879, "global_step": 633286, "epoch": 7629} {"train_loss": -28.27947998046875, "global_step": 633287, "epoch": 7629} {"train_loss": -28.178007125854492, "global_step": 633288, "epoch": 7629} {"train_loss": -27.844188322503882, "global_step": 633289, "epoch": 7629, "val_loss": 6891629.0} {"train_loss": -26.985382080078125, "global_step": 633290, "epoch": 7630} {"train_loss": -27.403528213500977, "global_step": 633291, "epoch": 7630} {"train_loss": -28.056137084960938, "global_step": 633292, "epoch": 7630} {"train_loss": -27.164539337158203, "global_step": 633293, "epoch": 7630} {"train_loss": -27.46880531311035, "global_step": 633294, "epoch": 7630} {"train_loss": -27.4749813079834, "global_step": 633295, "epoch": 7630} {"train_loss": -27.089664459228516, "global_step": 633296, "epoch": 7630} {"train_loss": -27.56109619140625, "global_step": 633297, "epoch": 7630} {"train_loss": -26.917129516601562, "global_step": 633298, "epoch": 7630} {"train_loss": -26.802976608276367, "global_step": 633299, "epoch": 7630} {"train_loss": -27.698196411132812, "global_step": 633300, "epoch": 7630} {"train_loss": -27.529632568359375, "global_step": 633301, "epoch": 7630} {"train_loss": -27.7242431640625, "global_step": 633302, "epoch": 7630} {"train_loss": -27.8209228515625, "global_step": 633303, "epoch": 7630} {"train_loss": -27.3831729888916, "global_step": 633304, "epoch": 7630} {"train_loss": -27.791162490844727, "global_step": 633305, "epoch": 7630} {"train_loss": -27.702896118164062, "global_step": 633306, "epoch": 7630} {"train_loss": -27.9779109954834, "global_step": 633307, "epoch": 7630} {"train_loss": -28.112363815307617, "global_step": 633308, "epoch": 7630} {"train_loss": -28.1518611907959, "global_step": 633309, "epoch": 7630} {"train_loss": -28.063465118408203, "global_step": 633310, "epoch": 7630} {"train_loss": -28.2565860748291, "global_step": 633311, "epoch": 7630} {"train_loss": -28.012073516845703, "global_step": 633312, "epoch": 7630} {"train_loss": -28.518075942993164, "global_step": 633313, "epoch": 7630} {"train_loss": -27.819799423217773, "global_step": 633314, "epoch": 7630} {"train_loss": -28.108722686767578, "global_step": 633315, "epoch": 7630} {"train_loss": -28.12067985534668, "global_step": 633316, "epoch": 7630} {"train_loss": -28.144540786743164, "global_step": 633317, "epoch": 7630} {"train_loss": -27.953659057617188, "global_step": 633318, "epoch": 7630} {"train_loss": -28.285017013549805, "global_step": 633319, "epoch": 7630} {"train_loss": -28.0838623046875, "global_step": 633320, "epoch": 7630} {"train_loss": -28.512271881103516, "global_step": 633321, "epoch": 7630} {"train_loss": -27.848480224609375, "global_step": 633322, "epoch": 7630} {"train_loss": -28.50153160095215, "global_step": 633323, "epoch": 7630} {"train_loss": -28.103708267211914, "global_step": 633324, "epoch": 7630} {"train_loss": -28.04566764831543, "global_step": 633325, "epoch": 7630} {"train_loss": -28.263166427612305, "global_step": 633326, "epoch": 7630} {"train_loss": -28.484561920166016, "global_step": 633327, "epoch": 7630} {"train_loss": -28.22515869140625, "global_step": 633328, "epoch": 7630} {"train_loss": -28.275482177734375, "global_step": 633329, "epoch": 7630} {"train_loss": -28.359394073486328, "global_step": 633330, "epoch": 7630} {"train_loss": -28.3613338470459, "global_step": 633331, "epoch": 7630} {"train_loss": -28.465673446655273, "global_step": 633332, "epoch": 7630} {"train_loss": -28.331104278564453, "global_step": 633333, "epoch": 7630} {"train_loss": -27.82783317565918, "global_step": 633334, "epoch": 7630} {"train_loss": -28.301624298095703, "global_step": 633335, "epoch": 7630} {"train_loss": -28.485458374023438, "global_step": 633336, "epoch": 7630} {"train_loss": -28.438650131225586, "global_step": 633337, "epoch": 7630} {"train_loss": -28.1795597076416, "global_step": 633338, "epoch": 7630} {"train_loss": -27.852783203125, "global_step": 633339, "epoch": 7630} {"train_loss": -27.95539665222168, "global_step": 633340, "epoch": 7630} {"train_loss": -28.421674728393555, "global_step": 633341, "epoch": 7630} {"train_loss": -28.282323837280273, "global_step": 633342, "epoch": 7630} {"train_loss": -28.05230712890625, "global_step": 633343, "epoch": 7630} {"train_loss": -28.35394287109375, "global_step": 633344, "epoch": 7630} {"train_loss": -28.270795822143555, "global_step": 633345, "epoch": 7630} {"train_loss": -28.05170249938965, "global_step": 633346, "epoch": 7630} {"train_loss": -28.30159568786621, "global_step": 633347, "epoch": 7630} {"train_loss": -28.2099666595459, "global_step": 633348, "epoch": 7630} {"train_loss": -28.484546661376953, "global_step": 633349, "epoch": 7630} {"train_loss": -28.165618896484375, "global_step": 633350, "epoch": 7630} {"train_loss": -28.158716201782227, "global_step": 633351, "epoch": 7630} {"train_loss": -28.276098251342773, "global_step": 633352, "epoch": 7630} {"train_loss": -28.197891235351562, "global_step": 633353, "epoch": 7630} {"train_loss": -28.256362915039062, "global_step": 633354, "epoch": 7630} {"train_loss": -28.219079971313477, "global_step": 633355, "epoch": 7630} {"train_loss": -28.21497917175293, "global_step": 633356, "epoch": 7630} {"train_loss": -28.44984245300293, "global_step": 633357, "epoch": 7630} {"train_loss": -28.161890029907227, "global_step": 633358, "epoch": 7630} {"train_loss": -27.646991729736328, "global_step": 633359, "epoch": 7630} {"train_loss": -28.153217315673828, "global_step": 633360, "epoch": 7630} {"train_loss": -27.789947509765625, "global_step": 633361, "epoch": 7630} {"train_loss": -27.656036376953125, "global_step": 633362, "epoch": 7630} {"train_loss": -27.66779136657715, "global_step": 633363, "epoch": 7630} {"train_loss": -28.130170822143555, "global_step": 633364, "epoch": 7630} {"train_loss": -28.215295791625977, "global_step": 633365, "epoch": 7630} {"train_loss": -28.0302791595459, "global_step": 633366, "epoch": 7630} {"train_loss": -28.528736114501953, "global_step": 633367, "epoch": 7630} {"train_loss": -28.40034294128418, "global_step": 633368, "epoch": 7630} {"train_loss": -28.1082763671875, "global_step": 633369, "epoch": 7630} {"train_loss": -28.25275993347168, "global_step": 633370, "epoch": 7630} {"train_loss": -27.923797607421875, "global_step": 633371, "epoch": 7630} {"train_loss": -28.02015203452972, "global_step": 633372, "epoch": 7630, "val_loss": 6938463.0} {"train_loss": -28.018665313720703, "global_step": 633373, "epoch": 7631} {"train_loss": -27.78046226501465, "global_step": 633374, "epoch": 7631} {"train_loss": -27.737518310546875, "global_step": 633375, "epoch": 7631} {"train_loss": -27.3914852142334, "global_step": 633376, "epoch": 7631} {"train_loss": -27.90277099609375, "global_step": 633377, "epoch": 7631} {"train_loss": -27.5821590423584, "global_step": 633378, "epoch": 7631} {"train_loss": -27.6189022064209, "global_step": 633379, "epoch": 7631} {"train_loss": -28.25128746032715, "global_step": 633380, "epoch": 7631} {"train_loss": -28.146015167236328, "global_step": 633381, "epoch": 7631} {"train_loss": -27.662384033203125, "global_step": 633382, "epoch": 7631} {"train_loss": -28.123022079467773, "global_step": 633383, "epoch": 7631} {"train_loss": -28.12346839904785, "global_step": 633384, "epoch": 7631} {"train_loss": -28.097137451171875, "global_step": 633385, "epoch": 7631} {"train_loss": -28.037023544311523, "global_step": 633386, "epoch": 7631} {"train_loss": -27.872711181640625, "global_step": 633387, "epoch": 7631} {"train_loss": -27.941089630126953, "global_step": 633388, "epoch": 7631} {"train_loss": -28.024694442749023, "global_step": 633389, "epoch": 7631} {"train_loss": -28.03009033203125, "global_step": 633390, "epoch": 7631} {"train_loss": -28.314319610595703, "global_step": 633391, "epoch": 7631} {"train_loss": -28.413915634155273, "global_step": 633392, "epoch": 7631} {"train_loss": -28.18185806274414, "global_step": 633393, "epoch": 7631} {"train_loss": -27.91568374633789, "global_step": 633394, "epoch": 7631} {"train_loss": -28.316864013671875, "global_step": 633395, "epoch": 7631} {"train_loss": -28.454212188720703, "global_step": 633396, "epoch": 7631} {"train_loss": -28.339975357055664, "global_step": 633397, "epoch": 7631} {"train_loss": -27.8262939453125, "global_step": 633398, "epoch": 7631} {"train_loss": -27.920185089111328, "global_step": 633399, "epoch": 7631} {"train_loss": -28.22110366821289, "global_step": 633400, "epoch": 7631} {"train_loss": -28.520278930664062, "global_step": 633401, "epoch": 7631} {"train_loss": -28.21131706237793, "global_step": 633402, "epoch": 7631} {"train_loss": -28.199951171875, "global_step": 633403, "epoch": 7631} {"train_loss": -28.311975479125977, "global_step": 633404, "epoch": 7631} {"train_loss": -28.8505859375, "global_step": 633405, "epoch": 7631} {"train_loss": -28.616592407226562, "global_step": 633406, "epoch": 7631} {"train_loss": -28.454397201538086, "global_step": 633407, "epoch": 7631} {"train_loss": -28.19832420349121, "global_step": 633408, "epoch": 7631} {"train_loss": -28.2404727935791, "global_step": 633409, "epoch": 7631} {"train_loss": -28.51055908203125, "global_step": 633410, "epoch": 7631} {"train_loss": -28.11370849609375, "global_step": 633411, "epoch": 7631} {"train_loss": -28.185026168823242, "global_step": 633412, "epoch": 7631} {"train_loss": -27.929845809936523, "global_step": 633413, "epoch": 7631} {"train_loss": -27.873371124267578, "global_step": 633414, "epoch": 7631} {"train_loss": -28.2365665435791, "global_step": 633415, "epoch": 7631} {"train_loss": -27.705713272094727, "global_step": 633416, "epoch": 7631} {"train_loss": -28.258045196533203, "global_step": 633417, "epoch": 7631} {"train_loss": -28.3155517578125, "global_step": 633418, "epoch": 7631} {"train_loss": -28.358129501342773, "global_step": 633419, "epoch": 7631} {"train_loss": -28.140625, "global_step": 633420, "epoch": 7631} {"train_loss": -28.2863826751709, "global_step": 633421, "epoch": 7631} {"train_loss": -28.373071670532227, "global_step": 633422, "epoch": 7631} {"train_loss": -28.190113067626953, "global_step": 633423, "epoch": 7631} {"train_loss": -28.108997344970703, "global_step": 633424, "epoch": 7631} {"train_loss": -28.325124740600586, "global_step": 633425, "epoch": 7631} {"train_loss": -28.42194175720215, "global_step": 633426, "epoch": 7631} {"train_loss": -27.93161392211914, "global_step": 633427, "epoch": 7631} {"train_loss": -28.09954261779785, "global_step": 633428, "epoch": 7631} {"train_loss": -28.204309463500977, "global_step": 633429, "epoch": 7631} {"train_loss": -28.6788272857666, "global_step": 633430, "epoch": 7631} {"train_loss": -28.249372482299805, "global_step": 633431, "epoch": 7631} {"train_loss": -28.070037841796875, "global_step": 633432, "epoch": 7631} {"train_loss": -28.357101440429688, "global_step": 633433, "epoch": 7631} {"train_loss": -28.492919921875, "global_step": 633434, "epoch": 7631} {"train_loss": -28.35959815979004, "global_step": 633435, "epoch": 7631} {"train_loss": -28.30859375, "global_step": 633436, "epoch": 7631} {"train_loss": -28.656274795532227, "global_step": 633437, "epoch": 7631} {"train_loss": -28.360626220703125, "global_step": 633438, "epoch": 7631} {"train_loss": -28.280202865600586, "global_step": 633439, "epoch": 7631} {"train_loss": -28.47114372253418, "global_step": 633440, "epoch": 7631} {"train_loss": -28.422895431518555, "global_step": 633441, "epoch": 7631} {"train_loss": -28.262699127197266, "global_step": 633442, "epoch": 7631} {"train_loss": -28.361682891845703, "global_step": 633443, "epoch": 7631} {"train_loss": -27.667898178100586, "global_step": 633444, "epoch": 7631} {"train_loss": -28.069351196289062, "global_step": 633445, "epoch": 7631} {"train_loss": -28.362491607666016, "global_step": 633446, "epoch": 7631} {"train_loss": -28.53313636779785, "global_step": 633447, "epoch": 7631} {"train_loss": -28.191619873046875, "global_step": 633448, "epoch": 7631} {"train_loss": -27.68341064453125, "global_step": 633449, "epoch": 7631} {"train_loss": -28.1024112701416, "global_step": 633450, "epoch": 7631} {"train_loss": -28.24293327331543, "global_step": 633451, "epoch": 7631} {"train_loss": -27.751867294311523, "global_step": 633452, "epoch": 7631} {"train_loss": -28.03986167907715, "global_step": 633453, "epoch": 7631} {"train_loss": -28.156721115112305, "global_step": 633454, "epoch": 7631} {"train_loss": -28.17628088342138, "global_step": 633455, "epoch": 7631, "val_loss": 6832066.5} {"train_loss": -27.036813735961914, "global_step": 633456, "epoch": 7632} {"train_loss": -26.539260864257812, "global_step": 633457, "epoch": 7632} {"train_loss": -26.74574089050293, "global_step": 633458, "epoch": 7632} {"train_loss": -26.92255210876465, "global_step": 633459, "epoch": 7632} {"train_loss": -27.601346969604492, "global_step": 633460, "epoch": 7632} {"train_loss": -27.05783462524414, "global_step": 633461, "epoch": 7632} {"train_loss": -27.4876651763916, "global_step": 633462, "epoch": 7632} {"train_loss": -27.1571044921875, "global_step": 633463, "epoch": 7632} {"train_loss": -27.44061851501465, "global_step": 633464, "epoch": 7632} {"train_loss": -27.701501846313477, "global_step": 633465, "epoch": 7632} {"train_loss": -27.875654220581055, "global_step": 633466, "epoch": 7632} {"train_loss": -27.545629501342773, "global_step": 633467, "epoch": 7632} {"train_loss": -27.201696395874023, "global_step": 633468, "epoch": 7632} {"train_loss": -27.961109161376953, "global_step": 633469, "epoch": 7632} {"train_loss": -27.86396598815918, "global_step": 633470, "epoch": 7632} {"train_loss": -27.594282150268555, "global_step": 633471, "epoch": 7632} {"train_loss": -27.803546905517578, "global_step": 633472, "epoch": 7632} {"train_loss": -28.00514793395996, "global_step": 633473, "epoch": 7632} {"train_loss": -27.89739418029785, "global_step": 633474, "epoch": 7632} {"train_loss": -27.704076766967773, "global_step": 633475, "epoch": 7632} {"train_loss": -28.16580581665039, "global_step": 633476, "epoch": 7632} {"train_loss": -27.8215389251709, "global_step": 633477, "epoch": 7632} {"train_loss": -28.152118682861328, "global_step": 633478, "epoch": 7632} {"train_loss": -27.87009620666504, "global_step": 633479, "epoch": 7632} {"train_loss": -28.418989181518555, "global_step": 633480, "epoch": 7632} {"train_loss": -28.244836807250977, "global_step": 633481, "epoch": 7632} {"train_loss": -27.910993576049805, "global_step": 633482, "epoch": 7632} {"train_loss": -28.086334228515625, "global_step": 633483, "epoch": 7632} {"train_loss": -28.183746337890625, "global_step": 633484, "epoch": 7632} {"train_loss": -27.710285186767578, "global_step": 633485, "epoch": 7632} {"train_loss": -28.175901412963867, "global_step": 633486, "epoch": 7632} {"train_loss": -28.600189208984375, "global_step": 633487, "epoch": 7632} {"train_loss": -28.09583854675293, "global_step": 633488, "epoch": 7632} {"train_loss": -28.081724166870117, "global_step": 633489, "epoch": 7632} {"train_loss": -28.009973526000977, "global_step": 633490, "epoch": 7632} {"train_loss": -28.219589233398438, "global_step": 633491, "epoch": 7632} {"train_loss": -28.21246337890625, "global_step": 633492, "epoch": 7632} {"train_loss": -28.157413482666016, "global_step": 633493, "epoch": 7632} {"train_loss": -28.209341049194336, "global_step": 633494, "epoch": 7632} {"train_loss": -28.44996452331543, "global_step": 633495, "epoch": 7632} {"train_loss": -28.21784019470215, "global_step": 633496, "epoch": 7632} {"train_loss": -28.266279220581055, "global_step": 633497, "epoch": 7632} {"train_loss": -28.3647518157959, "global_step": 633498, "epoch": 7632} {"train_loss": -28.090087890625, "global_step": 633499, "epoch": 7632} {"train_loss": -28.391775131225586, "global_step": 633500, "epoch": 7632} {"train_loss": -28.57596206665039, "global_step": 633501, "epoch": 7632} {"train_loss": -27.969308853149414, "global_step": 633502, "epoch": 7632} {"train_loss": -28.26658058166504, "global_step": 633503, "epoch": 7632} {"train_loss": -28.79096794128418, "global_step": 633504, "epoch": 7632} {"train_loss": -28.486841201782227, "global_step": 633505, "epoch": 7632} {"train_loss": -28.6058292388916, "global_step": 633506, "epoch": 7632} {"train_loss": -28.592100143432617, "global_step": 633507, "epoch": 7632} {"train_loss": -28.40478515625, "global_step": 633508, "epoch": 7632} {"train_loss": -28.349363327026367, "global_step": 633509, "epoch": 7632} {"train_loss": -28.4293270111084, "global_step": 633510, "epoch": 7632} {"train_loss": -28.235614776611328, "global_step": 633511, "epoch": 7632} {"train_loss": -28.042865753173828, "global_step": 633512, "epoch": 7632} {"train_loss": -28.101516723632812, "global_step": 633513, "epoch": 7632} {"train_loss": -28.285337448120117, "global_step": 633514, "epoch": 7632} {"train_loss": -28.196699142456055, "global_step": 633515, "epoch": 7632} {"train_loss": -28.50638771057129, "global_step": 633516, "epoch": 7632} {"train_loss": -28.12692642211914, "global_step": 633517, "epoch": 7632} {"train_loss": -28.465314865112305, "global_step": 633518, "epoch": 7632} {"train_loss": -27.880651473999023, "global_step": 633519, "epoch": 7632} {"train_loss": -27.771575927734375, "global_step": 633520, "epoch": 7632} {"train_loss": -28.043195724487305, "global_step": 633521, "epoch": 7632} {"train_loss": -28.210229873657227, "global_step": 633522, "epoch": 7632} {"train_loss": -28.074914932250977, "global_step": 633523, "epoch": 7632} {"train_loss": -28.043249130249023, "global_step": 633524, "epoch": 7632} {"train_loss": -28.384586334228516, "global_step": 633525, "epoch": 7632} {"train_loss": -28.544830322265625, "global_step": 633526, "epoch": 7632} {"train_loss": -28.444843292236328, "global_step": 633527, "epoch": 7632} {"train_loss": -28.03827476501465, "global_step": 633528, "epoch": 7632} {"train_loss": -27.979223251342773, "global_step": 633529, "epoch": 7632} {"train_loss": -28.240509033203125, "global_step": 633530, "epoch": 7632} {"train_loss": -27.890533447265625, "global_step": 633531, "epoch": 7632} {"train_loss": -28.418760299682617, "global_step": 633532, "epoch": 7632} {"train_loss": -28.522842407226562, "global_step": 633533, "epoch": 7632} {"train_loss": -28.167861938476562, "global_step": 633534, "epoch": 7632} {"train_loss": -28.254974365234375, "global_step": 633535, "epoch": 7632} {"train_loss": -28.40961265563965, "global_step": 633536, "epoch": 7632} {"train_loss": -28.000818252563477, "global_step": 633537, "epoch": 7632} {"train_loss": -28.044242330344325, "global_step": 633538, "epoch": 7632, "val_loss": 6827348.5} {"train_loss": -27.404571533203125, "global_step": 633539, "epoch": 7633} {"train_loss": -27.073307037353516, "global_step": 633540, "epoch": 7633} {"train_loss": -27.165945053100586, "global_step": 633541, "epoch": 7633} {"train_loss": -27.082117080688477, "global_step": 633542, "epoch": 7633} {"train_loss": -27.27362060546875, "global_step": 633543, "epoch": 7633} {"train_loss": -27.082141876220703, "global_step": 633544, "epoch": 7633} {"train_loss": -26.7805233001709, "global_step": 633545, "epoch": 7633} {"train_loss": -27.173398971557617, "global_step": 633546, "epoch": 7633} {"train_loss": -27.97527503967285, "global_step": 633547, "epoch": 7633} {"train_loss": -27.36863136291504, "global_step": 633548, "epoch": 7633} {"train_loss": -28.005817413330078, "global_step": 633549, "epoch": 7633} {"train_loss": -27.71295166015625, "global_step": 633550, "epoch": 7633} {"train_loss": -28.06927490234375, "global_step": 633551, "epoch": 7633} {"train_loss": -27.849103927612305, "global_step": 633552, "epoch": 7633} {"train_loss": -27.676528930664062, "global_step": 633553, "epoch": 7633} {"train_loss": -27.986555099487305, "global_step": 633554, "epoch": 7633} {"train_loss": -27.591501235961914, "global_step": 633555, "epoch": 7633} {"train_loss": -27.686269760131836, "global_step": 633556, "epoch": 7633} {"train_loss": -28.3073673248291, "global_step": 633557, "epoch": 7633} {"train_loss": -28.13764762878418, "global_step": 633558, "epoch": 7633} {"train_loss": -28.013641357421875, "global_step": 633559, "epoch": 7633} {"train_loss": -27.92926025390625, "global_step": 633560, "epoch": 7633} {"train_loss": -28.19544792175293, "global_step": 633561, "epoch": 7633} {"train_loss": -28.092416763305664, "global_step": 633562, "epoch": 7633} {"train_loss": -27.850223541259766, "global_step": 633563, "epoch": 7633} {"train_loss": -28.245223999023438, "global_step": 633564, "epoch": 7633} {"train_loss": -28.29253578186035, "global_step": 633565, "epoch": 7633} {"train_loss": -27.884435653686523, "global_step": 633566, "epoch": 7633} {"train_loss": -28.04595375061035, "global_step": 633567, "epoch": 7633} {"train_loss": -28.09040641784668, "global_step": 633568, "epoch": 7633} {"train_loss": -28.328277587890625, "global_step": 633569, "epoch": 7633} {"train_loss": -28.341796875, "global_step": 633570, "epoch": 7633} {"train_loss": -28.313480377197266, "global_step": 633571, "epoch": 7633} {"train_loss": -27.953601837158203, "global_step": 633572, "epoch": 7633} {"train_loss": -28.450824737548828, "global_step": 633573, "epoch": 7633} {"train_loss": -27.985692977905273, "global_step": 633574, "epoch": 7633} {"train_loss": -28.12867546081543, "global_step": 633575, "epoch": 7633} {"train_loss": -28.04132080078125, "global_step": 633576, "epoch": 7633} {"train_loss": -28.43107032775879, "global_step": 633577, "epoch": 7633} {"train_loss": -28.305139541625977, "global_step": 633578, "epoch": 7633} {"train_loss": -28.149972915649414, "global_step": 633579, "epoch": 7633} {"train_loss": -28.23443031311035, "global_step": 633580, "epoch": 7633} {"train_loss": -28.344449996948242, "global_step": 633581, "epoch": 7633} {"train_loss": -28.295989990234375, "global_step": 633582, "epoch": 7633} {"train_loss": -28.77058219909668, "global_step": 633583, "epoch": 7633} {"train_loss": -28.168792724609375, "global_step": 633584, "epoch": 7633} {"train_loss": -28.24452018737793, "global_step": 633585, "epoch": 7633} {"train_loss": -28.150558471679688, "global_step": 633586, "epoch": 7633} {"train_loss": -28.358901977539062, "global_step": 633587, "epoch": 7633} {"train_loss": -28.139989852905273, "global_step": 633588, "epoch": 7633} {"train_loss": -28.503244400024414, "global_step": 633589, "epoch": 7633} {"train_loss": -27.997175216674805, "global_step": 633590, "epoch": 7633} {"train_loss": -28.577972412109375, "global_step": 633591, "epoch": 7633} {"train_loss": -28.078908920288086, "global_step": 633592, "epoch": 7633} {"train_loss": -28.336624145507812, "global_step": 633593, "epoch": 7633} {"train_loss": -28.762205123901367, "global_step": 633594, "epoch": 7633} {"train_loss": -28.48284339904785, "global_step": 633595, "epoch": 7633} {"train_loss": -28.347768783569336, "global_step": 633596, "epoch": 7633} {"train_loss": -27.8070068359375, "global_step": 633597, "epoch": 7633} {"train_loss": -27.958740234375, "global_step": 633598, "epoch": 7633} {"train_loss": -28.256061553955078, "global_step": 633599, "epoch": 7633} {"train_loss": -28.38528823852539, "global_step": 633600, "epoch": 7633} {"train_loss": -28.15248680114746, "global_step": 633601, "epoch": 7633} {"train_loss": -28.226118087768555, "global_step": 633602, "epoch": 7633} {"train_loss": -28.415912628173828, "global_step": 633603, "epoch": 7633} {"train_loss": -28.181446075439453, "global_step": 633604, "epoch": 7633} {"train_loss": -28.134811401367188, "global_step": 633605, "epoch": 7633} {"train_loss": -28.488187789916992, "global_step": 633606, "epoch": 7633} {"train_loss": -28.508283615112305, "global_step": 633607, "epoch": 7633} {"train_loss": -28.432422637939453, "global_step": 633608, "epoch": 7633} {"train_loss": -28.715925216674805, "global_step": 633609, "epoch": 7633} {"train_loss": -28.526941299438477, "global_step": 633610, "epoch": 7633} {"train_loss": -28.522069931030273, "global_step": 633611, "epoch": 7633} {"train_loss": -28.5270938873291, "global_step": 633612, "epoch": 7633} {"train_loss": -28.067956924438477, "global_step": 633613, "epoch": 7633} {"train_loss": -28.324359893798828, "global_step": 633614, "epoch": 7633} {"train_loss": -27.7023868560791, "global_step": 633615, "epoch": 7633} {"train_loss": -26.971967697143555, "global_step": 633616, "epoch": 7633} {"train_loss": -27.0179443359375, "global_step": 633617, "epoch": 7633} {"train_loss": -27.119291305541992, "global_step": 633618, "epoch": 7633} {"train_loss": -27.639698028564453, "global_step": 633619, "epoch": 7633} {"train_loss": -27.951263427734375, "global_step": 633620, "epoch": 7633} {"train_loss": -28.019542096609094, "global_step": 633621, "epoch": 7633, "val_loss": 6871068.0} {"train_loss": -26.786579132080078, "global_step": 633622, "epoch": 7634} {"train_loss": -24.912124633789062, "global_step": 633623, "epoch": 7634} {"train_loss": -23.986648559570312, "global_step": 633624, "epoch": 7634} {"train_loss": -25.283124923706055, "global_step": 633625, "epoch": 7634} {"train_loss": -26.648054122924805, "global_step": 633626, "epoch": 7634} {"train_loss": -26.077219009399414, "global_step": 633627, "epoch": 7634} {"train_loss": -26.8045654296875, "global_step": 633628, "epoch": 7634} {"train_loss": -26.524221420288086, "global_step": 633629, "epoch": 7634} {"train_loss": -27.06241798400879, "global_step": 633630, "epoch": 7634} {"train_loss": -26.50799560546875, "global_step": 633631, "epoch": 7634} {"train_loss": -27.228857040405273, "global_step": 633632, "epoch": 7634} {"train_loss": -26.842273712158203, "global_step": 633633, "epoch": 7634} {"train_loss": -26.7506103515625, "global_step": 633634, "epoch": 7634} {"train_loss": -27.00311279296875, "global_step": 633635, "epoch": 7634} {"train_loss": -27.444000244140625, "global_step": 633636, "epoch": 7634} {"train_loss": -27.2069091796875, "global_step": 633637, "epoch": 7634} {"train_loss": -27.32134437561035, "global_step": 633638, "epoch": 7634} {"train_loss": -27.382389068603516, "global_step": 633639, "epoch": 7634} {"train_loss": -27.36102294921875, "global_step": 633640, "epoch": 7634} {"train_loss": -27.903207778930664, "global_step": 633641, "epoch": 7634} {"train_loss": -27.58915138244629, "global_step": 633642, "epoch": 7634} {"train_loss": -27.896482467651367, "global_step": 633643, "epoch": 7634} {"train_loss": -27.726806640625, "global_step": 633644, "epoch": 7634} {"train_loss": -27.60719108581543, "global_step": 633645, "epoch": 7634} {"train_loss": -27.362262725830078, "global_step": 633646, "epoch": 7634} {"train_loss": -27.75974464416504, "global_step": 633647, "epoch": 7634} {"train_loss": -27.86542320251465, "global_step": 633648, "epoch": 7634} {"train_loss": -27.794570922851562, "global_step": 633649, "epoch": 7634} {"train_loss": -27.773056030273438, "global_step": 633650, "epoch": 7634} {"train_loss": -27.72747230529785, "global_step": 633651, "epoch": 7634} {"train_loss": -28.19685173034668, "global_step": 633652, "epoch": 7634} {"train_loss": -27.693124771118164, "global_step": 633653, "epoch": 7634} {"train_loss": -27.90696144104004, "global_step": 633654, "epoch": 7634} {"train_loss": -27.879850387573242, "global_step": 633655, "epoch": 7634} {"train_loss": -27.80205726623535, "global_step": 633656, "epoch": 7634} {"train_loss": -27.77406120300293, "global_step": 633657, "epoch": 7634} {"train_loss": -27.89386558532715, "global_step": 633658, "epoch": 7634} {"train_loss": -27.98898696899414, "global_step": 633659, "epoch": 7634} {"train_loss": -27.875091552734375, "global_step": 633660, "epoch": 7634} {"train_loss": -28.131433486938477, "global_step": 633661, "epoch": 7634} {"train_loss": -27.95841407775879, "global_step": 633662, "epoch": 7634} {"train_loss": -28.169031143188477, "global_step": 633663, "epoch": 7634} {"train_loss": -28.02203941345215, "global_step": 633664, "epoch": 7634} {"train_loss": -27.947370529174805, "global_step": 633665, "epoch": 7634} {"train_loss": -28.119434356689453, "global_step": 633666, "epoch": 7634} {"train_loss": -28.119873046875, "global_step": 633667, "epoch": 7634} {"train_loss": -28.326282501220703, "global_step": 633668, "epoch": 7634} {"train_loss": -28.30517578125, "global_step": 633669, "epoch": 7634} {"train_loss": -27.929365158081055, "global_step": 633670, "epoch": 7634} {"train_loss": -28.134618759155273, "global_step": 633671, "epoch": 7634} {"train_loss": -28.283620834350586, "global_step": 633672, "epoch": 7634} {"train_loss": -28.183759689331055, "global_step": 633673, "epoch": 7634} {"train_loss": -28.360565185546875, "global_step": 633674, "epoch": 7634} {"train_loss": -28.311065673828125, "global_step": 633675, "epoch": 7634} {"train_loss": -28.470905303955078, "global_step": 633676, "epoch": 7634} {"train_loss": -28.15268325805664, "global_step": 633677, "epoch": 7634} {"train_loss": -28.127975463867188, "global_step": 633678, "epoch": 7634} {"train_loss": -28.75713539123535, "global_step": 633679, "epoch": 7634} {"train_loss": -28.80231285095215, "global_step": 633680, "epoch": 7634} {"train_loss": -28.223493576049805, "global_step": 633681, "epoch": 7634} {"train_loss": -28.397985458374023, "global_step": 633682, "epoch": 7634} {"train_loss": -28.463430404663086, "global_step": 633683, "epoch": 7634} {"train_loss": -28.55708122253418, "global_step": 633684, "epoch": 7634} {"train_loss": -28.60846519470215, "global_step": 633685, "epoch": 7634} {"train_loss": -28.309894561767578, "global_step": 633686, "epoch": 7634} {"train_loss": -28.457000732421875, "global_step": 633687, "epoch": 7634} {"train_loss": -28.928802490234375, "global_step": 633688, "epoch": 7634} {"train_loss": -28.37738609313965, "global_step": 633689, "epoch": 7634} {"train_loss": -28.6986083984375, "global_step": 633690, "epoch": 7634} {"train_loss": -28.59278678894043, "global_step": 633691, "epoch": 7634} {"train_loss": -28.708454132080078, "global_step": 633692, "epoch": 7634} {"train_loss": -28.125471115112305, "global_step": 633693, "epoch": 7634} {"train_loss": -28.117328643798828, "global_step": 633694, "epoch": 7634} {"train_loss": -27.92112159729004, "global_step": 633695, "epoch": 7634} {"train_loss": -27.249448776245117, "global_step": 633696, "epoch": 7634} {"train_loss": -27.149641036987305, "global_step": 633697, "epoch": 7634} {"train_loss": -28.00888442993164, "global_step": 633698, "epoch": 7634} {"train_loss": -28.1346492767334, "global_step": 633699, "epoch": 7634} {"train_loss": -28.02493667602539, "global_step": 633700, "epoch": 7634} {"train_loss": -28.017621994018555, "global_step": 633701, "epoch": 7634} {"train_loss": -27.838550567626953, "global_step": 633702, "epoch": 7634} {"train_loss": -27.871435165405273, "global_step": 633703, "epoch": 7634} {"train_loss": -27.72676743656756, "global_step": 633704, "epoch": 7634, "val_loss": 6875637.5} {"train_loss": -27.823637008666992, "global_step": 633705, "epoch": 7635} {"train_loss": -26.467710494995117, "global_step": 633706, "epoch": 7635} {"train_loss": -25.930877685546875, "global_step": 633707, "epoch": 7635} {"train_loss": -25.46510887145996, "global_step": 633708, "epoch": 7635} {"train_loss": -27.053815841674805, "global_step": 633709, "epoch": 7635} {"train_loss": -27.1878719329834, "global_step": 633710, "epoch": 7635} {"train_loss": -26.816373825073242, "global_step": 633711, "epoch": 7635} {"train_loss": -27.140716552734375, "global_step": 633712, "epoch": 7635} {"train_loss": -27.49600601196289, "global_step": 633713, "epoch": 7635} {"train_loss": -26.9586124420166, "global_step": 633714, "epoch": 7635} {"train_loss": -27.240680694580078, "global_step": 633715, "epoch": 7635} {"train_loss": -27.393808364868164, "global_step": 633716, "epoch": 7635} {"train_loss": -27.297571182250977, "global_step": 633717, "epoch": 7635} {"train_loss": -27.698108673095703, "global_step": 633718, "epoch": 7635} {"train_loss": -27.395828247070312, "global_step": 633719, "epoch": 7635} {"train_loss": -27.716236114501953, "global_step": 633720, "epoch": 7635} {"train_loss": -27.741918563842773, "global_step": 633721, "epoch": 7635} {"train_loss": -27.64847183227539, "global_step": 633722, "epoch": 7635} {"train_loss": -27.973600387573242, "global_step": 633723, "epoch": 7635} {"train_loss": -27.43055534362793, "global_step": 633724, "epoch": 7635} {"train_loss": -27.77638053894043, "global_step": 633725, "epoch": 7635} {"train_loss": -27.923480987548828, "global_step": 633726, "epoch": 7635} {"train_loss": -27.636945724487305, "global_step": 633727, "epoch": 7635} {"train_loss": -27.816162109375, "global_step": 633728, "epoch": 7635} {"train_loss": -27.986059188842773, "global_step": 633729, "epoch": 7635} {"train_loss": -28.194116592407227, "global_step": 633730, "epoch": 7635} {"train_loss": -28.214200973510742, "global_step": 633731, "epoch": 7635} {"train_loss": -28.0480899810791, "global_step": 633732, "epoch": 7635} {"train_loss": -28.09746742248535, "global_step": 633733, "epoch": 7635} {"train_loss": -27.474246978759766, "global_step": 633734, "epoch": 7635} {"train_loss": -28.0600643157959, "global_step": 633735, "epoch": 7635} {"train_loss": -28.070117950439453, "global_step": 633736, "epoch": 7635} {"train_loss": -28.327747344970703, "global_step": 633737, "epoch": 7635} {"train_loss": -28.181976318359375, "global_step": 633738, "epoch": 7635} {"train_loss": -27.86808204650879, "global_step": 633739, "epoch": 7635} {"train_loss": -27.922210693359375, "global_step": 633740, "epoch": 7635} {"train_loss": -28.3150634765625, "global_step": 633741, "epoch": 7635} {"train_loss": -28.001718521118164, "global_step": 633742, "epoch": 7635} {"train_loss": -28.685474395751953, "global_step": 633743, "epoch": 7635} {"train_loss": -27.934833526611328, "global_step": 633744, "epoch": 7635} {"train_loss": -28.165668487548828, "global_step": 633745, "epoch": 7635} {"train_loss": -27.96866798400879, "global_step": 633746, "epoch": 7635} {"train_loss": -27.989612579345703, "global_step": 633747, "epoch": 7635} {"train_loss": -27.9826717376709, "global_step": 633748, "epoch": 7635} {"train_loss": -28.321613311767578, "global_step": 633749, "epoch": 7635} {"train_loss": -28.36810874938965, "global_step": 633750, "epoch": 7635} {"train_loss": -28.708393096923828, "global_step": 633751, "epoch": 7635} {"train_loss": -28.48099136352539, "global_step": 633752, "epoch": 7635} {"train_loss": -28.3724422454834, "global_step": 633753, "epoch": 7635} {"train_loss": -28.02577018737793, "global_step": 633754, "epoch": 7635} {"train_loss": -28.02958106994629, "global_step": 633755, "epoch": 7635} {"train_loss": -28.406225204467773, "global_step": 633756, "epoch": 7635} {"train_loss": -28.436506271362305, "global_step": 633757, "epoch": 7635} {"train_loss": -28.540124893188477, "global_step": 633758, "epoch": 7635} {"train_loss": -28.40531349182129, "global_step": 633759, "epoch": 7635} {"train_loss": -28.22015380859375, "global_step": 633760, "epoch": 7635} {"train_loss": -28.4847469329834, "global_step": 633761, "epoch": 7635} {"train_loss": -28.561420440673828, "global_step": 633762, "epoch": 7635} {"train_loss": -28.320926666259766, "global_step": 633763, "epoch": 7635} {"train_loss": -28.288074493408203, "global_step": 633764, "epoch": 7635} {"train_loss": -28.4921817779541, "global_step": 633765, "epoch": 7635} {"train_loss": -28.695728302001953, "global_step": 633766, "epoch": 7635} {"train_loss": -28.596759796142578, "global_step": 633767, "epoch": 7635} {"train_loss": -28.584699630737305, "global_step": 633768, "epoch": 7635} {"train_loss": -28.14703941345215, "global_step": 633769, "epoch": 7635} {"train_loss": -28.171499252319336, "global_step": 633770, "epoch": 7635} {"train_loss": -28.61237144470215, "global_step": 633771, "epoch": 7635} {"train_loss": -28.685468673706055, "global_step": 633772, "epoch": 7635} {"train_loss": -28.398181915283203, "global_step": 633773, "epoch": 7635} {"train_loss": -28.657989501953125, "global_step": 633774, "epoch": 7635} {"train_loss": -29.04596519470215, "global_step": 633775, "epoch": 7635} {"train_loss": -28.703107833862305, "global_step": 633776, "epoch": 7635} {"train_loss": -28.51276206970215, "global_step": 633777, "epoch": 7635} {"train_loss": -28.551923751831055, "global_step": 633778, "epoch": 7635} {"train_loss": -28.46048355102539, "global_step": 633779, "epoch": 7635} {"train_loss": -28.69500732421875, "global_step": 633780, "epoch": 7635} {"train_loss": -27.92481803894043, "global_step": 633781, "epoch": 7635} {"train_loss": -28.128442764282227, "global_step": 633782, "epoch": 7635} {"train_loss": -27.428558349609375, "global_step": 633783, "epoch": 7635} {"train_loss": -28.023147583007812, "global_step": 633784, "epoch": 7635} {"train_loss": -27.853565216064453, "global_step": 633785, "epoch": 7635} {"train_loss": -27.835723876953125, "global_step": 633786, "epoch": 7635} {"train_loss": -27.984927556600915, "global_step": 633787, "epoch": 7635, "val_loss": 6841944.5} {"train_loss": -25.5147705078125, "global_step": 633788, "epoch": 7636} {"train_loss": -23.54645347595215, "global_step": 633789, "epoch": 7636} {"train_loss": -24.569761276245117, "global_step": 633790, "epoch": 7636} {"train_loss": -26.061986923217773, "global_step": 633791, "epoch": 7636} {"train_loss": -26.646692276000977, "global_step": 633792, "epoch": 7636} {"train_loss": -26.235721588134766, "global_step": 633793, "epoch": 7636} {"train_loss": -26.36104393005371, "global_step": 633794, "epoch": 7636} {"train_loss": -26.772144317626953, "global_step": 633795, "epoch": 7636} {"train_loss": -27.163339614868164, "global_step": 633796, "epoch": 7636} {"train_loss": -26.707447052001953, "global_step": 633797, "epoch": 7636} {"train_loss": -26.954381942749023, "global_step": 633798, "epoch": 7636} {"train_loss": -26.901508331298828, "global_step": 633799, "epoch": 7636} {"train_loss": -26.952070236206055, "global_step": 633800, "epoch": 7636} {"train_loss": -27.55722427368164, "global_step": 633801, "epoch": 7636} {"train_loss": -27.46912956237793, "global_step": 633802, "epoch": 7636} {"train_loss": -27.3530330657959, "global_step": 633803, "epoch": 7636} {"train_loss": -28.022357940673828, "global_step": 633804, "epoch": 7636} {"train_loss": -27.291141510009766, "global_step": 633805, "epoch": 7636} {"train_loss": -27.637231826782227, "global_step": 633806, "epoch": 7636} {"train_loss": -27.779693603515625, "global_step": 633807, "epoch": 7636} {"train_loss": -27.861358642578125, "global_step": 633808, "epoch": 7636} {"train_loss": -27.376073837280273, "global_step": 633809, "epoch": 7636} {"train_loss": -27.717519760131836, "global_step": 633810, "epoch": 7636} {"train_loss": -27.82095718383789, "global_step": 633811, "epoch": 7636} {"train_loss": -27.596445083618164, "global_step": 633812, "epoch": 7636} {"train_loss": -27.8680477142334, "global_step": 633813, "epoch": 7636} {"train_loss": -27.736753463745117, "global_step": 633814, "epoch": 7636} {"train_loss": -27.67145347595215, "global_step": 633815, "epoch": 7636} {"train_loss": -27.929479598999023, "global_step": 633816, "epoch": 7636} {"train_loss": -27.754308700561523, "global_step": 633817, "epoch": 7636} {"train_loss": -28.05551528930664, "global_step": 633818, "epoch": 7636} {"train_loss": -27.819538116455078, "global_step": 633819, "epoch": 7636} {"train_loss": -27.925962448120117, "global_step": 633820, "epoch": 7636} {"train_loss": -27.9338321685791, "global_step": 633821, "epoch": 7636} {"train_loss": -28.28724479675293, "global_step": 633822, "epoch": 7636} {"train_loss": -28.105209350585938, "global_step": 633823, "epoch": 7636} {"train_loss": -28.364797592163086, "global_step": 633824, "epoch": 7636} {"train_loss": -28.1167049407959, "global_step": 633825, "epoch": 7636} {"train_loss": -28.121755599975586, "global_step": 633826, "epoch": 7636} {"train_loss": -28.376392364501953, "global_step": 633827, "epoch": 7636} {"train_loss": -28.234039306640625, "global_step": 633828, "epoch": 7636} {"train_loss": -28.430042266845703, "global_step": 633829, "epoch": 7636} {"train_loss": -27.948728561401367, "global_step": 633830, "epoch": 7636} {"train_loss": -28.368310928344727, "global_step": 633831, "epoch": 7636} {"train_loss": -28.387094497680664, "global_step": 633832, "epoch": 7636} {"train_loss": -28.663593292236328, "global_step": 633833, "epoch": 7636} {"train_loss": -28.347244262695312, "global_step": 633834, "epoch": 7636} {"train_loss": -28.3042049407959, "global_step": 633835, "epoch": 7636} {"train_loss": -28.582212448120117, "global_step": 633836, "epoch": 7636} {"train_loss": -28.464344024658203, "global_step": 633837, "epoch": 7636} {"train_loss": -28.239545822143555, "global_step": 633838, "epoch": 7636} {"train_loss": -28.364776611328125, "global_step": 633839, "epoch": 7636} {"train_loss": -28.064563751220703, "global_step": 633840, "epoch": 7636} {"train_loss": -28.453857421875, "global_step": 633841, "epoch": 7636} {"train_loss": -28.657398223876953, "global_step": 633842, "epoch": 7636} {"train_loss": -28.376745223999023, "global_step": 633843, "epoch": 7636} {"train_loss": -28.02662467956543, "global_step": 633844, "epoch": 7636} {"train_loss": -28.159215927124023, "global_step": 633845, "epoch": 7636} {"train_loss": -28.210926055908203, "global_step": 633846, "epoch": 7636} {"train_loss": -28.490909576416016, "global_step": 633847, "epoch": 7636} {"train_loss": -28.69402503967285, "global_step": 633848, "epoch": 7636} {"train_loss": -28.252405166625977, "global_step": 633849, "epoch": 7636} {"train_loss": -28.601287841796875, "global_step": 633850, "epoch": 7636} {"train_loss": -28.62616539001465, "global_step": 633851, "epoch": 7636} {"train_loss": -28.338794708251953, "global_step": 633852, "epoch": 7636} {"train_loss": -28.4512996673584, "global_step": 633853, "epoch": 7636} {"train_loss": -28.357318878173828, "global_step": 633854, "epoch": 7636} {"train_loss": -28.564390182495117, "global_step": 633855, "epoch": 7636} {"train_loss": -28.462316513061523, "global_step": 633856, "epoch": 7636} {"train_loss": -28.635009765625, "global_step": 633857, "epoch": 7636} {"train_loss": -28.504474639892578, "global_step": 633858, "epoch": 7636} {"train_loss": -28.347898483276367, "global_step": 633859, "epoch": 7636} {"train_loss": -28.267959594726562, "global_step": 633860, "epoch": 7636} {"train_loss": -28.494760513305664, "global_step": 633861, "epoch": 7636} {"train_loss": -28.4229793548584, "global_step": 633862, "epoch": 7636} {"train_loss": -28.4829044342041, "global_step": 633863, "epoch": 7636} {"train_loss": -27.891569137573242, "global_step": 633864, "epoch": 7636} {"train_loss": -28.409698486328125, "global_step": 633865, "epoch": 7636} {"train_loss": -28.41351890563965, "global_step": 633866, "epoch": 7636} {"train_loss": -27.772802352905273, "global_step": 633867, "epoch": 7636} {"train_loss": -28.30474281311035, "global_step": 633868, "epoch": 7636} {"train_loss": -28.107349395751953, "global_step": 633869, "epoch": 7636} {"train_loss": -27.83476866296975, "global_step": 633870, "epoch": 7636, "val_loss": 6908960.0} {"train_loss": -27.46942710876465, "global_step": 633871, "epoch": 7637} {"train_loss": -26.80872917175293, "global_step": 633872, "epoch": 7637} {"train_loss": -27.702381134033203, "global_step": 633873, "epoch": 7637} {"train_loss": -27.42120933532715, "global_step": 633874, "epoch": 7637} {"train_loss": -27.87468910217285, "global_step": 633875, "epoch": 7637} {"train_loss": -27.699254989624023, "global_step": 633876, "epoch": 7637} {"train_loss": -27.898313522338867, "global_step": 633877, "epoch": 7637} {"train_loss": -27.450124740600586, "global_step": 633878, "epoch": 7637} {"train_loss": -28.112939834594727, "global_step": 633879, "epoch": 7637} {"train_loss": -27.865488052368164, "global_step": 633880, "epoch": 7637} {"train_loss": -27.8824520111084, "global_step": 633881, "epoch": 7637} {"train_loss": -28.06157875061035, "global_step": 633882, "epoch": 7637} {"train_loss": -28.429443359375, "global_step": 633883, "epoch": 7637} {"train_loss": -28.122100830078125, "global_step": 633884, "epoch": 7637} {"train_loss": -28.206037521362305, "global_step": 633885, "epoch": 7637} {"train_loss": -28.188796997070312, "global_step": 633886, "epoch": 7637} {"train_loss": -28.456893920898438, "global_step": 633887, "epoch": 7637} {"train_loss": -28.2116756439209, "global_step": 633888, "epoch": 7637} {"train_loss": -28.082014083862305, "global_step": 633889, "epoch": 7637} {"train_loss": -28.141357421875, "global_step": 633890, "epoch": 7637} {"train_loss": -28.02129554748535, "global_step": 633891, "epoch": 7637} {"train_loss": -28.21649742126465, "global_step": 633892, "epoch": 7637} {"train_loss": -28.537128448486328, "global_step": 633893, "epoch": 7637} {"train_loss": -28.16412925720215, "global_step": 633894, "epoch": 7637} {"train_loss": -28.209171295166016, "global_step": 633895, "epoch": 7637} {"train_loss": -28.384122848510742, "global_step": 633896, "epoch": 7637} {"train_loss": -28.179580688476562, "global_step": 633897, "epoch": 7637} {"train_loss": -28.57282066345215, "global_step": 633898, "epoch": 7637} {"train_loss": -27.96713638305664, "global_step": 633899, "epoch": 7637} {"train_loss": -27.792814254760742, "global_step": 633900, "epoch": 7637} {"train_loss": -28.400604248046875, "global_step": 633901, "epoch": 7637} {"train_loss": -28.334659576416016, "global_step": 633902, "epoch": 7637} {"train_loss": -28.522693634033203, "global_step": 633903, "epoch": 7637} {"train_loss": -28.305341720581055, "global_step": 633904, "epoch": 7637} {"train_loss": -28.28645133972168, "global_step": 633905, "epoch": 7637} {"train_loss": -28.5403995513916, "global_step": 633906, "epoch": 7637} {"train_loss": -28.0200138092041, "global_step": 633907, "epoch": 7637} {"train_loss": -27.812042236328125, "global_step": 633908, "epoch": 7637} {"train_loss": -28.426340103149414, "global_step": 633909, "epoch": 7637} {"train_loss": -28.47723960876465, "global_step": 633910, "epoch": 7637} {"train_loss": -28.331836700439453, "global_step": 633911, "epoch": 7637} {"train_loss": -28.394582748413086, "global_step": 633912, "epoch": 7637} {"train_loss": -28.260679244995117, "global_step": 633913, "epoch": 7637} {"train_loss": -28.24051856994629, "global_step": 633914, "epoch": 7637} {"train_loss": -28.337194442749023, "global_step": 633915, "epoch": 7637} {"train_loss": -28.24592399597168, "global_step": 633916, "epoch": 7637} {"train_loss": -28.359607696533203, "global_step": 633917, "epoch": 7637} {"train_loss": -27.966690063476562, "global_step": 633918, "epoch": 7637} {"train_loss": -28.4847354888916, "global_step": 633919, "epoch": 7637} {"train_loss": -27.880680084228516, "global_step": 633920, "epoch": 7637} {"train_loss": -28.408422470092773, "global_step": 633921, "epoch": 7637} {"train_loss": -28.31593894958496, "global_step": 633922, "epoch": 7637} {"train_loss": -28.221200942993164, "global_step": 633923, "epoch": 7637} {"train_loss": -28.261640548706055, "global_step": 633924, "epoch": 7637} {"train_loss": -27.783157348632812, "global_step": 633925, "epoch": 7637} {"train_loss": -28.536579132080078, "global_step": 633926, "epoch": 7637} {"train_loss": -27.944406509399414, "global_step": 633927, "epoch": 7637} {"train_loss": -28.484846115112305, "global_step": 633928, "epoch": 7637} {"train_loss": -27.72846031188965, "global_step": 633929, "epoch": 7637} {"train_loss": -27.806686401367188, "global_step": 633930, "epoch": 7637} {"train_loss": -28.46099853515625, "global_step": 633931, "epoch": 7637} {"train_loss": -28.1353759765625, "global_step": 633932, "epoch": 7637} {"train_loss": -28.34273338317871, "global_step": 633933, "epoch": 7637} {"train_loss": -28.022933959960938, "global_step": 633934, "epoch": 7637} {"train_loss": -28.19137954711914, "global_step": 633935, "epoch": 7637} {"train_loss": -28.085681915283203, "global_step": 633936, "epoch": 7637} {"train_loss": -28.027755737304688, "global_step": 633937, "epoch": 7637} {"train_loss": -28.2646484375, "global_step": 633938, "epoch": 7637} {"train_loss": -27.630483627319336, "global_step": 633939, "epoch": 7637} {"train_loss": -28.35992431640625, "global_step": 633940, "epoch": 7637} {"train_loss": -27.877796173095703, "global_step": 633941, "epoch": 7637} {"train_loss": -27.981351852416992, "global_step": 633942, "epoch": 7637} {"train_loss": -27.9929141998291, "global_step": 633943, "epoch": 7637} {"train_loss": -28.454126358032227, "global_step": 633944, "epoch": 7637} {"train_loss": -27.93597412109375, "global_step": 633945, "epoch": 7637} {"train_loss": -28.317472457885742, "global_step": 633946, "epoch": 7637} {"train_loss": -28.5290470123291, "global_step": 633947, "epoch": 7637} {"train_loss": -28.00702476501465, "global_step": 633948, "epoch": 7637} {"train_loss": -28.3035888671875, "global_step": 633949, "epoch": 7637} {"train_loss": -28.34792137145996, "global_step": 633950, "epoch": 7637} {"train_loss": -28.076406478881836, "global_step": 633951, "epoch": 7637} {"train_loss": -28.48296546936035, "global_step": 633952, "epoch": 7637} {"train_loss": -28.123244963496564, "global_step": 633953, "epoch": 7637, "val_loss": 6828916.0} {"train_loss": -27.462270736694336, "global_step": 633954, "epoch": 7638} {"train_loss": -26.916593551635742, "global_step": 633955, "epoch": 7638} {"train_loss": -27.53000831604004, "global_step": 633956, "epoch": 7638} {"train_loss": -27.45826530456543, "global_step": 633957, "epoch": 7638} {"train_loss": -27.644079208374023, "global_step": 633958, "epoch": 7638} {"train_loss": -27.429244995117188, "global_step": 633959, "epoch": 7638} {"train_loss": -27.152729034423828, "global_step": 633960, "epoch": 7638} {"train_loss": -26.900970458984375, "global_step": 633961, "epoch": 7638} {"train_loss": -28.081491470336914, "global_step": 633962, "epoch": 7638} {"train_loss": -27.952774047851562, "global_step": 633963, "epoch": 7638} {"train_loss": -27.69366455078125, "global_step": 633964, "epoch": 7638} {"train_loss": -27.711780548095703, "global_step": 633965, "epoch": 7638} {"train_loss": -27.86628532409668, "global_step": 633966, "epoch": 7638} {"train_loss": -27.420331954956055, "global_step": 633967, "epoch": 7638} {"train_loss": -27.616540908813477, "global_step": 633968, "epoch": 7638} {"train_loss": -28.107746124267578, "global_step": 633969, "epoch": 7638} {"train_loss": -28.031417846679688, "global_step": 633970, "epoch": 7638} {"train_loss": -28.11870765686035, "global_step": 633971, "epoch": 7638} {"train_loss": -27.75095558166504, "global_step": 633972, "epoch": 7638} {"train_loss": -27.69344139099121, "global_step": 633973, "epoch": 7638} {"train_loss": -27.658349990844727, "global_step": 633974, "epoch": 7638} {"train_loss": -27.988794326782227, "global_step": 633975, "epoch": 7638} {"train_loss": -28.111164093017578, "global_step": 633976, "epoch": 7638} {"train_loss": -27.819181442260742, "global_step": 633977, "epoch": 7638} {"train_loss": -28.09014320373535, "global_step": 633978, "epoch": 7638} {"train_loss": -28.38260841369629, "global_step": 633979, "epoch": 7638} {"train_loss": -28.369306564331055, "global_step": 633980, "epoch": 7638} {"train_loss": -28.503705978393555, "global_step": 633981, "epoch": 7638} {"train_loss": -28.046567916870117, "global_step": 633982, "epoch": 7638} {"train_loss": -28.219482421875, "global_step": 633983, "epoch": 7638} {"train_loss": -28.073328018188477, "global_step": 633984, "epoch": 7638} {"train_loss": -28.43116569519043, "global_step": 633985, "epoch": 7638} {"train_loss": -28.4461669921875, "global_step": 633986, "epoch": 7638} {"train_loss": -28.337202072143555, "global_step": 633987, "epoch": 7638} {"train_loss": -28.62281608581543, "global_step": 633988, "epoch": 7638} {"train_loss": -28.52197265625, "global_step": 633989, "epoch": 7638} {"train_loss": -28.297693252563477, "global_step": 633990, "epoch": 7638} {"train_loss": -28.26035499572754, "global_step": 633991, "epoch": 7638} {"train_loss": -28.380146026611328, "global_step": 633992, "epoch": 7638} {"train_loss": -28.545103073120117, "global_step": 633993, "epoch": 7638} {"train_loss": -28.70326042175293, "global_step": 633994, "epoch": 7638} {"train_loss": -28.414518356323242, "global_step": 633995, "epoch": 7638} {"train_loss": -28.4156551361084, "global_step": 633996, "epoch": 7638} {"train_loss": -28.6570987701416, "global_step": 633997, "epoch": 7638} {"train_loss": -28.44341468811035, "global_step": 633998, "epoch": 7638} {"train_loss": -27.951887130737305, "global_step": 633999, "epoch": 7638} {"train_loss": -28.548725128173828, "global_step": 634000, "epoch": 7638} {"train_loss": -28.295215606689453, "global_step": 634001, "epoch": 7638} {"train_loss": -29.03702735900879, "global_step": 634002, "epoch": 7638} {"train_loss": -27.950366973876953, "global_step": 634003, "epoch": 7638} {"train_loss": -28.679828643798828, "global_step": 634004, "epoch": 7638} {"train_loss": -28.716413497924805, "global_step": 634005, "epoch": 7638} {"train_loss": -28.916122436523438, "global_step": 634006, "epoch": 7638} {"train_loss": -28.338354110717773, "global_step": 634007, "epoch": 7638} {"train_loss": -28.239999771118164, "global_step": 634008, "epoch": 7638} {"train_loss": -28.186975479125977, "global_step": 634009, "epoch": 7638} {"train_loss": -28.362564086914062, "global_step": 634010, "epoch": 7638} {"train_loss": -28.233448028564453, "global_step": 634011, "epoch": 7638} {"train_loss": -28.112207412719727, "global_step": 634012, "epoch": 7638} {"train_loss": -27.439023971557617, "global_step": 634013, "epoch": 7638} {"train_loss": -27.019088745117188, "global_step": 634014, "epoch": 7638} {"train_loss": -27.728540420532227, "global_step": 634015, "epoch": 7638} {"train_loss": -28.078332901000977, "global_step": 634016, "epoch": 7638} {"train_loss": -27.464664459228516, "global_step": 634017, "epoch": 7638} {"train_loss": -27.71051597595215, "global_step": 634018, "epoch": 7638} {"train_loss": -27.92902946472168, "global_step": 634019, "epoch": 7638} {"train_loss": -27.54538345336914, "global_step": 634020, "epoch": 7638} {"train_loss": -28.482227325439453, "global_step": 634021, "epoch": 7638} {"train_loss": -27.5009765625, "global_step": 634022, "epoch": 7638} {"train_loss": -28.15288734436035, "global_step": 634023, "epoch": 7638} {"train_loss": -27.857641220092773, "global_step": 634024, "epoch": 7638} {"train_loss": -27.632856369018555, "global_step": 634025, "epoch": 7638} {"train_loss": -28.274633407592773, "global_step": 634026, "epoch": 7638} {"train_loss": -28.053686141967773, "global_step": 634027, "epoch": 7638} {"train_loss": -27.7830867767334, "global_step": 634028, "epoch": 7638} {"train_loss": -27.875959396362305, "global_step": 634029, "epoch": 7638} {"train_loss": -28.388158798217773, "global_step": 634030, "epoch": 7638} {"train_loss": -27.745203018188477, "global_step": 634031, "epoch": 7638} {"train_loss": -28.067907333374023, "global_step": 634032, "epoch": 7638} {"train_loss": -28.0325984954834, "global_step": 634033, "epoch": 7638} {"train_loss": -28.437530517578125, "global_step": 634034, "epoch": 7638} {"train_loss": -27.925445556640625, "global_step": 634035, "epoch": 7638} {"train_loss": -28.04388639151332, "global_step": 634036, "epoch": 7638, "val_loss": 6867962.0} {"train_loss": -27.456384658813477, "global_step": 634037, "epoch": 7639} {"train_loss": -28.13892936706543, "global_step": 634038, "epoch": 7639} {"train_loss": -27.4271183013916, "global_step": 634039, "epoch": 7639} {"train_loss": -27.61346435546875, "global_step": 634040, "epoch": 7639} {"train_loss": -27.105762481689453, "global_step": 634041, "epoch": 7639} {"train_loss": -26.917760848999023, "global_step": 634042, "epoch": 7639} {"train_loss": -26.80433464050293, "global_step": 634043, "epoch": 7639} {"train_loss": -27.335819244384766, "global_step": 634044, "epoch": 7639} {"train_loss": -27.6878604888916, "global_step": 634045, "epoch": 7639} {"train_loss": -27.134809494018555, "global_step": 634046, "epoch": 7639} {"train_loss": -27.645978927612305, "global_step": 634047, "epoch": 7639} {"train_loss": -27.634693145751953, "global_step": 634048, "epoch": 7639} {"train_loss": -26.891382217407227, "global_step": 634049, "epoch": 7639} {"train_loss": -27.380130767822266, "global_step": 634050, "epoch": 7639} {"train_loss": -27.46894645690918, "global_step": 634051, "epoch": 7639} {"train_loss": -27.384607315063477, "global_step": 634052, "epoch": 7639} {"train_loss": -27.291534423828125, "global_step": 634053, "epoch": 7639} {"train_loss": -27.732803344726562, "global_step": 634054, "epoch": 7639} {"train_loss": -27.814437866210938, "global_step": 634055, "epoch": 7639} {"train_loss": -27.68305778503418, "global_step": 634056, "epoch": 7639} {"train_loss": -27.662458419799805, "global_step": 634057, "epoch": 7639} {"train_loss": -27.77827262878418, "global_step": 634058, "epoch": 7639} {"train_loss": -28.285520553588867, "global_step": 634059, "epoch": 7639} {"train_loss": -28.095849990844727, "global_step": 634060, "epoch": 7639} {"train_loss": -28.2847957611084, "global_step": 634061, "epoch": 7639} {"train_loss": -27.701587677001953, "global_step": 634062, "epoch": 7639} {"train_loss": -27.76019859313965, "global_step": 634063, "epoch": 7639} {"train_loss": -27.722705841064453, "global_step": 634064, "epoch": 7639} {"train_loss": -27.94927406311035, "global_step": 634065, "epoch": 7639} {"train_loss": -27.71754264831543, "global_step": 634066, "epoch": 7639} {"train_loss": -27.825292587280273, "global_step": 634067, "epoch": 7639} {"train_loss": -27.88944435119629, "global_step": 634068, "epoch": 7639} {"train_loss": -27.845046997070312, "global_step": 634069, "epoch": 7639} {"train_loss": -28.545654296875, "global_step": 634070, "epoch": 7639} {"train_loss": -28.204090118408203, "global_step": 634071, "epoch": 7639} {"train_loss": -28.05323600769043, "global_step": 634072, "epoch": 7639} {"train_loss": -28.24371337890625, "global_step": 634073, "epoch": 7639} {"train_loss": -28.261011123657227, "global_step": 634074, "epoch": 7639} {"train_loss": -28.118518829345703, "global_step": 634075, "epoch": 7639} {"train_loss": -28.137659072875977, "global_step": 634076, "epoch": 7639} {"train_loss": -28.018896102905273, "global_step": 634077, "epoch": 7639} {"train_loss": -28.321569442749023, "global_step": 634078, "epoch": 7639} {"train_loss": -28.262434005737305, "global_step": 634079, "epoch": 7639} {"train_loss": -28.269901275634766, "global_step": 634080, "epoch": 7639} {"train_loss": -28.285400390625, "global_step": 634081, "epoch": 7639} {"train_loss": -28.3065242767334, "global_step": 634082, "epoch": 7639} {"train_loss": -28.272226333618164, "global_step": 634083, "epoch": 7639} {"train_loss": -28.428516387939453, "global_step": 634084, "epoch": 7639} {"train_loss": -28.571441650390625, "global_step": 634085, "epoch": 7639} {"train_loss": -28.33048439025879, "global_step": 634086, "epoch": 7639} {"train_loss": -27.8879337310791, "global_step": 634087, "epoch": 7639} {"train_loss": -28.129364013671875, "global_step": 634088, "epoch": 7639} {"train_loss": -28.691415786743164, "global_step": 634089, "epoch": 7639} {"train_loss": -28.40885353088379, "global_step": 634090, "epoch": 7639} {"train_loss": -28.34382438659668, "global_step": 634091, "epoch": 7639} {"train_loss": -28.56731605529785, "global_step": 634092, "epoch": 7639} {"train_loss": -28.36372184753418, "global_step": 634093, "epoch": 7639} {"train_loss": -28.43768310546875, "global_step": 634094, "epoch": 7639} {"train_loss": -28.513294219970703, "global_step": 634095, "epoch": 7639} {"train_loss": -28.080957412719727, "global_step": 634096, "epoch": 7639} {"train_loss": -28.691436767578125, "global_step": 634097, "epoch": 7639} {"train_loss": -28.06305503845215, "global_step": 634098, "epoch": 7639} {"train_loss": -28.250823974609375, "global_step": 634099, "epoch": 7639} {"train_loss": -28.35629653930664, "global_step": 634100, "epoch": 7639} {"train_loss": -28.568389892578125, "global_step": 634101, "epoch": 7639} {"train_loss": -28.210346221923828, "global_step": 634102, "epoch": 7639} {"train_loss": -28.644500732421875, "global_step": 634103, "epoch": 7639} {"train_loss": -28.275903701782227, "global_step": 634104, "epoch": 7639} {"train_loss": -28.689863204956055, "global_step": 634105, "epoch": 7639} {"train_loss": -28.297128677368164, "global_step": 634106, "epoch": 7639} {"train_loss": -27.902021408081055, "global_step": 634107, "epoch": 7639} {"train_loss": -28.4744815826416, "global_step": 634108, "epoch": 7639} {"train_loss": -28.061676025390625, "global_step": 634109, "epoch": 7639} {"train_loss": -28.39533042907715, "global_step": 634110, "epoch": 7639} {"train_loss": -28.33771324157715, "global_step": 634111, "epoch": 7639} {"train_loss": -28.235595703125, "global_step": 634112, "epoch": 7639} {"train_loss": -28.081348419189453, "global_step": 634113, "epoch": 7639} {"train_loss": -28.44658851623535, "global_step": 634114, "epoch": 7639} {"train_loss": -28.209705352783203, "global_step": 634115, "epoch": 7639} {"train_loss": -28.39752197265625, "global_step": 634116, "epoch": 7639} {"train_loss": -28.14336585998535, "global_step": 634117, "epoch": 7639} {"train_loss": -28.365070343017578, "global_step": 634118, "epoch": 7639} {"train_loss": -28.02726127440671, "global_step": 634119, "epoch": 7639, "val_loss": 6786409.0} {"train_loss": -27.902475357055664, "global_step": 634120, "epoch": 7640} {"train_loss": -27.34855079650879, "global_step": 634121, "epoch": 7640} {"train_loss": -27.389331817626953, "global_step": 634122, "epoch": 7640} {"train_loss": -27.017358779907227, "global_step": 634123, "epoch": 7640} {"train_loss": -27.20088005065918, "global_step": 634124, "epoch": 7640} {"train_loss": -27.49452781677246, "global_step": 634125, "epoch": 7640} {"train_loss": -27.660306930541992, "global_step": 634126, "epoch": 7640} {"train_loss": -27.948911666870117, "global_step": 634127, "epoch": 7640} {"train_loss": -27.26865577697754, "global_step": 634128, "epoch": 7640} {"train_loss": -27.182348251342773, "global_step": 634129, "epoch": 7640} {"train_loss": -27.703479766845703, "global_step": 634130, "epoch": 7640} {"train_loss": -27.85312271118164, "global_step": 634131, "epoch": 7640} {"train_loss": -27.825754165649414, "global_step": 634132, "epoch": 7640} {"train_loss": -28.051122665405273, "global_step": 634133, "epoch": 7640} {"train_loss": -27.7366886138916, "global_step": 634134, "epoch": 7640} {"train_loss": -28.44988441467285, "global_step": 634135, "epoch": 7640} {"train_loss": -27.92976188659668, "global_step": 634136, "epoch": 7640} {"train_loss": -28.210235595703125, "global_step": 634137, "epoch": 7640} {"train_loss": -27.84067726135254, "global_step": 634138, "epoch": 7640} {"train_loss": -28.43124771118164, "global_step": 634139, "epoch": 7640} {"train_loss": -28.235260009765625, "global_step": 634140, "epoch": 7640} {"train_loss": -28.164020538330078, "global_step": 634141, "epoch": 7640} {"train_loss": -28.386682510375977, "global_step": 634142, "epoch": 7640} {"train_loss": -28.214746475219727, "global_step": 634143, "epoch": 7640} {"train_loss": -28.139501571655273, "global_step": 634144, "epoch": 7640} {"train_loss": -28.052734375, "global_step": 634145, "epoch": 7640} {"train_loss": -28.190195083618164, "global_step": 634146, "epoch": 7640} {"train_loss": -28.29387855529785, "global_step": 634147, "epoch": 7640} {"train_loss": -28.159833908081055, "global_step": 634148, "epoch": 7640} {"train_loss": -28.29599380493164, "global_step": 634149, "epoch": 7640} {"train_loss": -28.360010147094727, "global_step": 634150, "epoch": 7640} {"train_loss": -28.08355712890625, "global_step": 634151, "epoch": 7640} {"train_loss": -28.407575607299805, "global_step": 634152, "epoch": 7640} {"train_loss": -28.475866317749023, "global_step": 634153, "epoch": 7640} {"train_loss": -28.582141876220703, "global_step": 634154, "epoch": 7640} {"train_loss": -28.07765769958496, "global_step": 634155, "epoch": 7640} {"train_loss": -27.947805404663086, "global_step": 634156, "epoch": 7640} {"train_loss": -28.65846061706543, "global_step": 634157, "epoch": 7640} {"train_loss": -28.2855281829834, "global_step": 634158, "epoch": 7640} {"train_loss": -28.2272891998291, "global_step": 634159, "epoch": 7640} {"train_loss": -28.313373565673828, "global_step": 634160, "epoch": 7640} {"train_loss": -28.11091423034668, "global_step": 634161, "epoch": 7640} {"train_loss": -28.4208927154541, "global_step": 634162, "epoch": 7640} {"train_loss": -28.399524688720703, "global_step": 634163, "epoch": 7640} {"train_loss": -28.228046417236328, "global_step": 634164, "epoch": 7640} {"train_loss": -28.31819725036621, "global_step": 634165, "epoch": 7640} {"train_loss": -28.381494522094727, "global_step": 634166, "epoch": 7640} {"train_loss": -27.971349716186523, "global_step": 634167, "epoch": 7640} {"train_loss": -28.248132705688477, "global_step": 634168, "epoch": 7640} {"train_loss": -27.97781753540039, "global_step": 634169, "epoch": 7640} {"train_loss": -28.31593132019043, "global_step": 634170, "epoch": 7640} {"train_loss": -28.15771484375, "global_step": 634171, "epoch": 7640} {"train_loss": -27.64409828186035, "global_step": 634172, "epoch": 7640} {"train_loss": -28.08326530456543, "global_step": 634173, "epoch": 7640} {"train_loss": -28.077375411987305, "global_step": 634174, "epoch": 7640} {"train_loss": -28.091110229492188, "global_step": 634175, "epoch": 7640} {"train_loss": -28.177541732788086, "global_step": 634176, "epoch": 7640} {"train_loss": -27.989770889282227, "global_step": 634177, "epoch": 7640} {"train_loss": -28.09882926940918, "global_step": 634178, "epoch": 7640} {"train_loss": -27.95014762878418, "global_step": 634179, "epoch": 7640} {"train_loss": -28.115924835205078, "global_step": 634180, "epoch": 7640} {"train_loss": -28.271459579467773, "global_step": 634181, "epoch": 7640} {"train_loss": -28.194000244140625, "global_step": 634182, "epoch": 7640} {"train_loss": -28.19342041015625, "global_step": 634183, "epoch": 7640} {"train_loss": -28.38241958618164, "global_step": 634184, "epoch": 7640} {"train_loss": -28.26142692565918, "global_step": 634185, "epoch": 7640} {"train_loss": -28.426013946533203, "global_step": 634186, "epoch": 7640} {"train_loss": -28.220733642578125, "global_step": 634187, "epoch": 7640} {"train_loss": -28.260175704956055, "global_step": 634188, "epoch": 7640} {"train_loss": -28.602874755859375, "global_step": 634189, "epoch": 7640} {"train_loss": -28.81658935546875, "global_step": 634190, "epoch": 7640} {"train_loss": -28.275304794311523, "global_step": 634191, "epoch": 7640} {"train_loss": -28.15433120727539, "global_step": 634192, "epoch": 7640} {"train_loss": -28.14227867126465, "global_step": 634193, "epoch": 7640} {"train_loss": -28.220182418823242, "global_step": 634194, "epoch": 7640} {"train_loss": -27.872900009155273, "global_step": 634195, "epoch": 7640} {"train_loss": -28.133283615112305, "global_step": 634196, "epoch": 7640} {"train_loss": -28.718183517456055, "global_step": 634197, "epoch": 7640} {"train_loss": -28.065261840820312, "global_step": 634198, "epoch": 7640} {"train_loss": -27.814895629882812, "global_step": 634199, "epoch": 7640} {"train_loss": -28.337427139282227, "global_step": 634200, "epoch": 7640} {"train_loss": -28.500940322875977, "global_step": 634201, "epoch": 7640} {"train_loss": -28.09161330992917, "global_step": 634202, "epoch": 7640, "val_loss": 6905390.0} {"train_loss": -26.653913497924805, "global_step": 634203, "epoch": 7641} {"train_loss": -25.430034637451172, "global_step": 634204, "epoch": 7641} {"train_loss": -25.65793800354004, "global_step": 634205, "epoch": 7641} {"train_loss": -27.25349235534668, "global_step": 634206, "epoch": 7641} {"train_loss": -26.761505126953125, "global_step": 634207, "epoch": 7641} {"train_loss": -26.895536422729492, "global_step": 634208, "epoch": 7641} {"train_loss": -26.529861450195312, "global_step": 634209, "epoch": 7641} {"train_loss": -27.03614616394043, "global_step": 634210, "epoch": 7641} {"train_loss": -26.41364097595215, "global_step": 634211, "epoch": 7641} {"train_loss": -27.409900665283203, "global_step": 634212, "epoch": 7641} {"train_loss": -27.44684410095215, "global_step": 634213, "epoch": 7641} {"train_loss": -27.39432716369629, "global_step": 634214, "epoch": 7641} {"train_loss": -27.3471736907959, "global_step": 634215, "epoch": 7641} {"train_loss": -27.480545043945312, "global_step": 634216, "epoch": 7641} {"train_loss": -27.127389907836914, "global_step": 634217, "epoch": 7641} {"train_loss": -27.332143783569336, "global_step": 634218, "epoch": 7641} {"train_loss": -27.302473068237305, "global_step": 634219, "epoch": 7641} {"train_loss": -27.215330123901367, "global_step": 634220, "epoch": 7641} {"train_loss": -27.795007705688477, "global_step": 634221, "epoch": 7641} {"train_loss": -27.5330753326416, "global_step": 634222, "epoch": 7641} {"train_loss": -27.712446212768555, "global_step": 634223, "epoch": 7641} {"train_loss": -27.501951217651367, "global_step": 634224, "epoch": 7641} {"train_loss": -27.8519229888916, "global_step": 634225, "epoch": 7641} {"train_loss": -28.13919448852539, "global_step": 634226, "epoch": 7641} {"train_loss": -27.932764053344727, "global_step": 634227, "epoch": 7641} {"train_loss": -28.016326904296875, "global_step": 634228, "epoch": 7641} {"train_loss": -27.861236572265625, "global_step": 634229, "epoch": 7641} {"train_loss": -27.82294273376465, "global_step": 634230, "epoch": 7641} {"train_loss": -28.2906436920166, "global_step": 634231, "epoch": 7641} {"train_loss": -27.856952667236328, "global_step": 634232, "epoch": 7641} {"train_loss": -27.59449577331543, "global_step": 634233, "epoch": 7641} {"train_loss": -28.11976432800293, "global_step": 634234, "epoch": 7641} {"train_loss": -27.956689834594727, "global_step": 634235, "epoch": 7641} {"train_loss": -27.827468872070312, "global_step": 634236, "epoch": 7641} {"train_loss": -28.158735275268555, "global_step": 634237, "epoch": 7641} {"train_loss": -28.49591636657715, "global_step": 634238, "epoch": 7641} {"train_loss": -28.080774307250977, "global_step": 634239, "epoch": 7641} {"train_loss": -27.999454498291016, "global_step": 634240, "epoch": 7641} {"train_loss": -28.05878257751465, "global_step": 634241, "epoch": 7641} {"train_loss": -28.126785278320312, "global_step": 634242, "epoch": 7641} {"train_loss": -28.26775550842285, "global_step": 634243, "epoch": 7641} {"train_loss": -28.022485733032227, "global_step": 634244, "epoch": 7641} {"train_loss": -28.5961856842041, "global_step": 634245, "epoch": 7641} {"train_loss": -28.253040313720703, "global_step": 634246, "epoch": 7641} {"train_loss": -28.36188316345215, "global_step": 634247, "epoch": 7641} {"train_loss": -28.1956844329834, "global_step": 634248, "epoch": 7641} {"train_loss": -28.298065185546875, "global_step": 634249, "epoch": 7641} {"train_loss": -28.418699264526367, "global_step": 634250, "epoch": 7641} {"train_loss": -27.837427139282227, "global_step": 634251, "epoch": 7641} {"train_loss": -28.710174560546875, "global_step": 634252, "epoch": 7641} {"train_loss": -28.262598037719727, "global_step": 634253, "epoch": 7641} {"train_loss": -28.235925674438477, "global_step": 634254, "epoch": 7641} {"train_loss": -28.461538314819336, "global_step": 634255, "epoch": 7641} {"train_loss": -28.187366485595703, "global_step": 634256, "epoch": 7641} {"train_loss": -28.146066665649414, "global_step": 634257, "epoch": 7641} {"train_loss": -28.5248966217041, "global_step": 634258, "epoch": 7641} {"train_loss": -28.43191909790039, "global_step": 634259, "epoch": 7641} {"train_loss": -28.429590225219727, "global_step": 634260, "epoch": 7641} {"train_loss": -28.3542423248291, "global_step": 634261, "epoch": 7641} {"train_loss": -28.182016372680664, "global_step": 634262, "epoch": 7641} {"train_loss": -28.649648666381836, "global_step": 634263, "epoch": 7641} {"train_loss": -28.28192138671875, "global_step": 634264, "epoch": 7641} {"train_loss": -28.29884910583496, "global_step": 634265, "epoch": 7641} {"train_loss": -28.677648544311523, "global_step": 634266, "epoch": 7641} {"train_loss": -28.652206420898438, "global_step": 634267, "epoch": 7641} {"train_loss": -28.275476455688477, "global_step": 634268, "epoch": 7641} {"train_loss": -28.063695907592773, "global_step": 634269, "epoch": 7641} {"train_loss": -28.208179473876953, "global_step": 634270, "epoch": 7641} {"train_loss": -28.65931510925293, "global_step": 634271, "epoch": 7641} {"train_loss": -28.711084365844727, "global_step": 634272, "epoch": 7641} {"train_loss": -28.209869384765625, "global_step": 634273, "epoch": 7641} {"train_loss": -28.6177978515625, "global_step": 634274, "epoch": 7641} {"train_loss": -28.518905639648438, "global_step": 634275, "epoch": 7641} {"train_loss": -28.078596115112305, "global_step": 634276, "epoch": 7641} {"train_loss": -28.075531005859375, "global_step": 634277, "epoch": 7641} {"train_loss": -27.991865158081055, "global_step": 634278, "epoch": 7641} {"train_loss": -27.8339786529541, "global_step": 634279, "epoch": 7641} {"train_loss": -28.22454261779785, "global_step": 634280, "epoch": 7641} {"train_loss": -27.99383544921875, "global_step": 634281, "epoch": 7641} {"train_loss": -28.277301788330078, "global_step": 634282, "epoch": 7641} {"train_loss": -28.3990535736084, "global_step": 634283, "epoch": 7641} {"train_loss": -28.67084312438965, "global_step": 634284, "epoch": 7641} {"train_loss": -27.934279843985315, "global_step": 634285, "epoch": 7641, "val_loss": 6900412.0} {"train_loss": -24.820810317993164, "global_step": 634286, "epoch": 7642} {"train_loss": -25.439544677734375, "global_step": 634287, "epoch": 7642} {"train_loss": -27.418659210205078, "global_step": 634288, "epoch": 7642} {"train_loss": -26.8928165435791, "global_step": 634289, "epoch": 7642} {"train_loss": -26.943777084350586, "global_step": 634290, "epoch": 7642} {"train_loss": -26.3165283203125, "global_step": 634291, "epoch": 7642} {"train_loss": -27.074682235717773, "global_step": 634292, "epoch": 7642} {"train_loss": -27.077238082885742, "global_step": 634293, "epoch": 7642} {"train_loss": -27.077091217041016, "global_step": 634294, "epoch": 7642} {"train_loss": -27.51185417175293, "global_step": 634295, "epoch": 7642} {"train_loss": -27.22382164001465, "global_step": 634296, "epoch": 7642} {"train_loss": -27.226943969726562, "global_step": 634297, "epoch": 7642} {"train_loss": -27.141372680664062, "global_step": 634298, "epoch": 7642} {"train_loss": -27.273029327392578, "global_step": 634299, "epoch": 7642} {"train_loss": -27.687280654907227, "global_step": 634300, "epoch": 7642} {"train_loss": -27.367584228515625, "global_step": 634301, "epoch": 7642} {"train_loss": -27.010854721069336, "global_step": 634302, "epoch": 7642} {"train_loss": -27.480844497680664, "global_step": 634303, "epoch": 7642} {"train_loss": -27.50299644470215, "global_step": 634304, "epoch": 7642} {"train_loss": -27.47385025024414, "global_step": 634305, "epoch": 7642} {"train_loss": -27.627979278564453, "global_step": 634306, "epoch": 7642} {"train_loss": -27.510435104370117, "global_step": 634307, "epoch": 7642} {"train_loss": -27.795202255249023, "global_step": 634308, "epoch": 7642} {"train_loss": -27.421728134155273, "global_step": 634309, "epoch": 7642} {"train_loss": -28.045764923095703, "global_step": 634310, "epoch": 7642} {"train_loss": -28.21906089782715, "global_step": 634311, "epoch": 7642} {"train_loss": -27.867109298706055, "global_step": 634312, "epoch": 7642} {"train_loss": -27.846176147460938, "global_step": 634313, "epoch": 7642} {"train_loss": -28.1452693939209, "global_step": 634314, "epoch": 7642} {"train_loss": -28.221036911010742, "global_step": 634315, "epoch": 7642} {"train_loss": -28.02699089050293, "global_step": 634316, "epoch": 7642} {"train_loss": -27.66847038269043, "global_step": 634317, "epoch": 7642} {"train_loss": -28.112873077392578, "global_step": 634318, "epoch": 7642} {"train_loss": -28.143096923828125, "global_step": 634319, "epoch": 7642} {"train_loss": -28.551855087280273, "global_step": 634320, "epoch": 7642} {"train_loss": -28.440948486328125, "global_step": 634321, "epoch": 7642} {"train_loss": -27.941883087158203, "global_step": 634322, "epoch": 7642} {"train_loss": -28.159912109375, "global_step": 634323, "epoch": 7642} {"train_loss": -28.0258731842041, "global_step": 634324, "epoch": 7642} {"train_loss": -28.284576416015625, "global_step": 634325, "epoch": 7642} {"train_loss": -28.055784225463867, "global_step": 634326, "epoch": 7642} {"train_loss": -28.35529899597168, "global_step": 634327, "epoch": 7642} {"train_loss": -28.241117477416992, "global_step": 634328, "epoch": 7642} {"train_loss": -28.444421768188477, "global_step": 634329, "epoch": 7642} {"train_loss": -28.49616050720215, "global_step": 634330, "epoch": 7642} {"train_loss": -28.349634170532227, "global_step": 634331, "epoch": 7642} {"train_loss": -28.40632438659668, "global_step": 634332, "epoch": 7642} {"train_loss": -28.486637115478516, "global_step": 634333, "epoch": 7642} {"train_loss": -28.41200065612793, "global_step": 634334, "epoch": 7642} {"train_loss": -28.076868057250977, "global_step": 634335, "epoch": 7642} {"train_loss": -28.6445369720459, "global_step": 634336, "epoch": 7642} {"train_loss": -28.170001983642578, "global_step": 634337, "epoch": 7642} {"train_loss": -28.486103057861328, "global_step": 634338, "epoch": 7642} {"train_loss": -28.628433227539062, "global_step": 634339, "epoch": 7642} {"train_loss": -28.445737838745117, "global_step": 634340, "epoch": 7642} {"train_loss": -28.058704376220703, "global_step": 634341, "epoch": 7642} {"train_loss": -28.16657829284668, "global_step": 634342, "epoch": 7642} {"train_loss": -28.226947784423828, "global_step": 634343, "epoch": 7642} {"train_loss": -28.632232666015625, "global_step": 634344, "epoch": 7642} {"train_loss": -28.308441162109375, "global_step": 634345, "epoch": 7642} {"train_loss": -28.030841827392578, "global_step": 634346, "epoch": 7642} {"train_loss": -28.14576530456543, "global_step": 634347, "epoch": 7642} {"train_loss": -28.077972412109375, "global_step": 634348, "epoch": 7642} {"train_loss": -28.24098014831543, "global_step": 634349, "epoch": 7642} {"train_loss": -28.20758628845215, "global_step": 634350, "epoch": 7642} {"train_loss": -28.013874053955078, "global_step": 634351, "epoch": 7642} {"train_loss": -28.307214736938477, "global_step": 634352, "epoch": 7642} {"train_loss": -28.27863883972168, "global_step": 634353, "epoch": 7642} {"train_loss": -28.05167579650879, "global_step": 634354, "epoch": 7642} {"train_loss": -27.917709350585938, "global_step": 634355, "epoch": 7642} {"train_loss": -27.703832626342773, "global_step": 634356, "epoch": 7642} {"train_loss": -27.583118438720703, "global_step": 634357, "epoch": 7642} {"train_loss": -28.2673282623291, "global_step": 634358, "epoch": 7642} {"train_loss": -28.324445724487305, "global_step": 634359, "epoch": 7642} {"train_loss": -28.142730712890625, "global_step": 634360, "epoch": 7642} {"train_loss": -28.076587677001953, "global_step": 634361, "epoch": 7642} {"train_loss": -28.464197158813477, "global_step": 634362, "epoch": 7642} {"train_loss": -28.360082626342773, "global_step": 634363, "epoch": 7642} {"train_loss": -28.197362899780273, "global_step": 634364, "epoch": 7642} {"train_loss": -28.299352645874023, "global_step": 634365, "epoch": 7642} {"train_loss": -28.48358154296875, "global_step": 634366, "epoch": 7642} {"train_loss": -28.475128173828125, "global_step": 634367, "epoch": 7642} {"train_loss": -27.87376245245876, "global_step": 634368, "epoch": 7642, "val_loss": 6845992.5} {"train_loss": -27.904470443725586, "global_step": 634369, "epoch": 7643} {"train_loss": -26.959003448486328, "global_step": 634370, "epoch": 7643} {"train_loss": -27.433032989501953, "global_step": 634371, "epoch": 7643} {"train_loss": -27.324560165405273, "global_step": 634372, "epoch": 7643} {"train_loss": -27.283308029174805, "global_step": 634373, "epoch": 7643} {"train_loss": -27.097875595092773, "global_step": 634374, "epoch": 7643} {"train_loss": -27.815832138061523, "global_step": 634375, "epoch": 7643} {"train_loss": -27.581674575805664, "global_step": 634376, "epoch": 7643} {"train_loss": -28.08550453186035, "global_step": 634377, "epoch": 7643} {"train_loss": -27.5372371673584, "global_step": 634378, "epoch": 7643} {"train_loss": -27.865619659423828, "global_step": 634379, "epoch": 7643} {"train_loss": -27.962888717651367, "global_step": 634380, "epoch": 7643} {"train_loss": -27.90602684020996, "global_step": 634381, "epoch": 7643} {"train_loss": -27.51419448852539, "global_step": 634382, "epoch": 7643} {"train_loss": -27.94318962097168, "global_step": 634383, "epoch": 7643} {"train_loss": -27.81190299987793, "global_step": 634384, "epoch": 7643} {"train_loss": -27.567956924438477, "global_step": 634385, "epoch": 7643} {"train_loss": -27.73821449279785, "global_step": 634386, "epoch": 7643} {"train_loss": -27.90677833557129, "global_step": 634387, "epoch": 7643} {"train_loss": -27.903257369995117, "global_step": 634388, "epoch": 7643} {"train_loss": -28.011173248291016, "global_step": 634389, "epoch": 7643} {"train_loss": -27.97600746154785, "global_step": 634390, "epoch": 7643} {"train_loss": -27.9726505279541, "global_step": 634391, "epoch": 7643} {"train_loss": -28.19189453125, "global_step": 634392, "epoch": 7643} {"train_loss": -27.848840713500977, "global_step": 634393, "epoch": 7643} {"train_loss": -28.248762130737305, "global_step": 634394, "epoch": 7643} {"train_loss": -28.14402198791504, "global_step": 634395, "epoch": 7643} {"train_loss": -27.900693893432617, "global_step": 634396, "epoch": 7643} {"train_loss": -28.348331451416016, "global_step": 634397, "epoch": 7643} {"train_loss": -28.046377182006836, "global_step": 634398, "epoch": 7643} {"train_loss": -28.712554931640625, "global_step": 634399, "epoch": 7643} {"train_loss": -28.335386276245117, "global_step": 634400, "epoch": 7643} {"train_loss": -28.52532386779785, "global_step": 634401, "epoch": 7643} {"train_loss": -28.363733291625977, "global_step": 634402, "epoch": 7643} {"train_loss": -28.358627319335938, "global_step": 634403, "epoch": 7643} {"train_loss": -28.550159454345703, "global_step": 634404, "epoch": 7643} {"train_loss": -28.3154296875, "global_step": 634405, "epoch": 7643} {"train_loss": -28.350067138671875, "global_step": 634406, "epoch": 7643} {"train_loss": -28.161035537719727, "global_step": 634407, "epoch": 7643} {"train_loss": -28.451940536499023, "global_step": 634408, "epoch": 7643} {"train_loss": -28.604944229125977, "global_step": 634409, "epoch": 7643} {"train_loss": -28.655868530273438, "global_step": 634410, "epoch": 7643} {"train_loss": -28.675479888916016, "global_step": 634411, "epoch": 7643} {"train_loss": -28.30498695373535, "global_step": 634412, "epoch": 7643} {"train_loss": -28.509632110595703, "global_step": 634413, "epoch": 7643} {"train_loss": -28.552576065063477, "global_step": 634414, "epoch": 7643} {"train_loss": -28.43453025817871, "global_step": 634415, "epoch": 7643} {"train_loss": -28.395654678344727, "global_step": 634416, "epoch": 7643} {"train_loss": -28.399145126342773, "global_step": 634417, "epoch": 7643} {"train_loss": -28.44618034362793, "global_step": 634418, "epoch": 7643} {"train_loss": -28.61225700378418, "global_step": 634419, "epoch": 7643} {"train_loss": -28.36237907409668, "global_step": 634420, "epoch": 7643} {"train_loss": -28.45588493347168, "global_step": 634421, "epoch": 7643} {"train_loss": -28.453840255737305, "global_step": 634422, "epoch": 7643} {"train_loss": -28.30634880065918, "global_step": 634423, "epoch": 7643} {"train_loss": -28.4726505279541, "global_step": 634424, "epoch": 7643} {"train_loss": -28.5913028717041, "global_step": 634425, "epoch": 7643} {"train_loss": -28.666425704956055, "global_step": 634426, "epoch": 7643} {"train_loss": -28.504220962524414, "global_step": 634427, "epoch": 7643} {"train_loss": -28.431203842163086, "global_step": 634428, "epoch": 7643} {"train_loss": -28.55506706237793, "global_step": 634429, "epoch": 7643} {"train_loss": -28.69742202758789, "global_step": 634430, "epoch": 7643} {"train_loss": -28.437665939331055, "global_step": 634431, "epoch": 7643} {"train_loss": -28.165088653564453, "global_step": 634432, "epoch": 7643} {"train_loss": -28.617584228515625, "global_step": 634433, "epoch": 7643} {"train_loss": -27.7652587890625, "global_step": 634434, "epoch": 7643} {"train_loss": -27.879241943359375, "global_step": 634435, "epoch": 7643} {"train_loss": -28.037839889526367, "global_step": 634436, "epoch": 7643} {"train_loss": -28.09015464782715, "global_step": 634437, "epoch": 7643} {"train_loss": -28.33906364440918, "global_step": 634438, "epoch": 7643} {"train_loss": -28.387680053710938, "global_step": 634439, "epoch": 7643} {"train_loss": -28.756261825561523, "global_step": 634440, "epoch": 7643} {"train_loss": -28.325605392456055, "global_step": 634441, "epoch": 7643} {"train_loss": -28.21845817565918, "global_step": 634442, "epoch": 7643} {"train_loss": -28.19898796081543, "global_step": 634443, "epoch": 7643} {"train_loss": -28.12786293029785, "global_step": 634444, "epoch": 7643} {"train_loss": -28.388044357299805, "global_step": 634445, "epoch": 7643} {"train_loss": -28.24175453186035, "global_step": 634446, "epoch": 7643} {"train_loss": -28.710485458374023, "global_step": 634447, "epoch": 7643} {"train_loss": -28.13632583618164, "global_step": 634448, "epoch": 7643} {"train_loss": -28.33510398864746, "global_step": 634449, "epoch": 7643} {"train_loss": -28.396711349487305, "global_step": 634450, "epoch": 7643} {"train_loss": -28.17599666549499, "global_step": 634451, "epoch": 7643, "val_loss": 6826807.5} {"train_loss": -25.602447509765625, "global_step": 634452, "epoch": 7644} {"train_loss": -23.360811233520508, "global_step": 634453, "epoch": 7644} {"train_loss": -25.029178619384766, "global_step": 634454, "epoch": 7644} {"train_loss": -26.820547103881836, "global_step": 634455, "epoch": 7644} {"train_loss": -27.168292999267578, "global_step": 634456, "epoch": 7644} {"train_loss": -26.9856014251709, "global_step": 634457, "epoch": 7644} {"train_loss": -26.82538414001465, "global_step": 634458, "epoch": 7644} {"train_loss": -26.771265029907227, "global_step": 634459, "epoch": 7644} {"train_loss": -26.597543716430664, "global_step": 634460, "epoch": 7644} {"train_loss": -27.714609146118164, "global_step": 634461, "epoch": 7644} {"train_loss": -26.93617820739746, "global_step": 634462, "epoch": 7644} {"train_loss": -27.15592384338379, "global_step": 634463, "epoch": 7644} {"train_loss": -27.272933959960938, "global_step": 634464, "epoch": 7644} {"train_loss": -27.104902267456055, "global_step": 634465, "epoch": 7644} {"train_loss": -27.202863693237305, "global_step": 634466, "epoch": 7644} {"train_loss": -27.407724380493164, "global_step": 634467, "epoch": 7644} {"train_loss": -27.3828182220459, "global_step": 634468, "epoch": 7644} {"train_loss": -27.244115829467773, "global_step": 634469, "epoch": 7644} {"train_loss": -27.6680850982666, "global_step": 634470, "epoch": 7644} {"train_loss": -27.337621688842773, "global_step": 634471, "epoch": 7644} {"train_loss": -27.5305233001709, "global_step": 634472, "epoch": 7644} {"train_loss": -27.60407066345215, "global_step": 634473, "epoch": 7644} {"train_loss": -27.59902000427246, "global_step": 634474, "epoch": 7644} {"train_loss": -27.704206466674805, "global_step": 634475, "epoch": 7644} {"train_loss": -27.91285514831543, "global_step": 634476, "epoch": 7644} {"train_loss": -27.670578002929688, "global_step": 634477, "epoch": 7644} {"train_loss": -27.79781150817871, "global_step": 634478, "epoch": 7644} {"train_loss": -27.489898681640625, "global_step": 634479, "epoch": 7644} {"train_loss": -28.226001739501953, "global_step": 634480, "epoch": 7644} {"train_loss": -27.836029052734375, "global_step": 634481, "epoch": 7644} {"train_loss": -27.726795196533203, "global_step": 634482, "epoch": 7644} {"train_loss": -28.161996841430664, "global_step": 634483, "epoch": 7644} {"train_loss": -27.87166404724121, "global_step": 634484, "epoch": 7644} {"train_loss": -27.701780319213867, "global_step": 634485, "epoch": 7644} {"train_loss": -27.867053985595703, "global_step": 634486, "epoch": 7644} {"train_loss": -27.99224281311035, "global_step": 634487, "epoch": 7644} {"train_loss": -27.868131637573242, "global_step": 634488, "epoch": 7644} {"train_loss": -27.776105880737305, "global_step": 634489, "epoch": 7644} {"train_loss": -27.90120506286621, "global_step": 634490, "epoch": 7644} {"train_loss": -28.174346923828125, "global_step": 634491, "epoch": 7644} {"train_loss": -28.27174186706543, "global_step": 634492, "epoch": 7644} {"train_loss": -28.108795166015625, "global_step": 634493, "epoch": 7644} {"train_loss": -27.98444175720215, "global_step": 634494, "epoch": 7644} {"train_loss": -28.310285568237305, "global_step": 634495, "epoch": 7644} {"train_loss": -28.411853790283203, "global_step": 634496, "epoch": 7644} {"train_loss": -28.316608428955078, "global_step": 634497, "epoch": 7644} {"train_loss": -28.441747665405273, "global_step": 634498, "epoch": 7644} {"train_loss": -28.217742919921875, "global_step": 634499, "epoch": 7644} {"train_loss": -28.739501953125, "global_step": 634500, "epoch": 7644} {"train_loss": -28.28193473815918, "global_step": 634501, "epoch": 7644} {"train_loss": -28.53818702697754, "global_step": 634502, "epoch": 7644} {"train_loss": -27.80495262145996, "global_step": 634503, "epoch": 7644} {"train_loss": -28.317035675048828, "global_step": 634504, "epoch": 7644} {"train_loss": -28.37005615234375, "global_step": 634505, "epoch": 7644} {"train_loss": -28.205312728881836, "global_step": 634506, "epoch": 7644} {"train_loss": -28.365774154663086, "global_step": 634507, "epoch": 7644} {"train_loss": -28.317224502563477, "global_step": 634508, "epoch": 7644} {"train_loss": -28.34673500061035, "global_step": 634509, "epoch": 7644} {"train_loss": -28.353519439697266, "global_step": 634510, "epoch": 7644} {"train_loss": -27.959293365478516, "global_step": 634511, "epoch": 7644} {"train_loss": -28.459253311157227, "global_step": 634512, "epoch": 7644} {"train_loss": -28.340152740478516, "global_step": 634513, "epoch": 7644} {"train_loss": -28.129850387573242, "global_step": 634514, "epoch": 7644} {"train_loss": -28.3846435546875, "global_step": 634515, "epoch": 7644} {"train_loss": -28.312896728515625, "global_step": 634516, "epoch": 7644} {"train_loss": -28.418689727783203, "global_step": 634517, "epoch": 7644} {"train_loss": -28.173181533813477, "global_step": 634518, "epoch": 7644} {"train_loss": -28.598026275634766, "global_step": 634519, "epoch": 7644} {"train_loss": -28.234811782836914, "global_step": 634520, "epoch": 7644} {"train_loss": -27.967432022094727, "global_step": 634521, "epoch": 7644} {"train_loss": -28.41023826599121, "global_step": 634522, "epoch": 7644} {"train_loss": -28.954700469970703, "global_step": 634523, "epoch": 7644} {"train_loss": -28.29501724243164, "global_step": 634524, "epoch": 7644} {"train_loss": -28.06357765197754, "global_step": 634525, "epoch": 7644} {"train_loss": -28.228445053100586, "global_step": 634526, "epoch": 7644} {"train_loss": -28.152246475219727, "global_step": 634527, "epoch": 7644} {"train_loss": -28.444137573242188, "global_step": 634528, "epoch": 7644} {"train_loss": -28.42913818359375, "global_step": 634529, "epoch": 7644} {"train_loss": -28.251163482666016, "global_step": 634530, "epoch": 7644} {"train_loss": -27.882003784179688, "global_step": 634531, "epoch": 7644} {"train_loss": -28.44538688659668, "global_step": 634532, "epoch": 7644} {"train_loss": -28.714115142822266, "global_step": 634533, "epoch": 7644} {"train_loss": -27.822828476687512, "global_step": 634534, "epoch": 7644, "val_loss": 6774291.0} {"train_loss": -26.720067977905273, "global_step": 634535, "epoch": 7645} {"train_loss": -26.73276710510254, "global_step": 634536, "epoch": 7645} {"train_loss": -26.717573165893555, "global_step": 634537, "epoch": 7645} {"train_loss": -25.91330909729004, "global_step": 634538, "epoch": 7645} {"train_loss": -26.229394912719727, "global_step": 634539, "epoch": 7645} {"train_loss": -27.51716423034668, "global_step": 634540, "epoch": 7645} {"train_loss": -26.782678604125977, "global_step": 634541, "epoch": 7645} {"train_loss": -27.77960205078125, "global_step": 634542, "epoch": 7645} {"train_loss": -27.194833755493164, "global_step": 634543, "epoch": 7645} {"train_loss": -27.50431251525879, "global_step": 634544, "epoch": 7645} {"train_loss": -27.60569190979004, "global_step": 634545, "epoch": 7645} {"train_loss": -27.266571044921875, "global_step": 634546, "epoch": 7645} {"train_loss": -27.970600128173828, "global_step": 634547, "epoch": 7645} {"train_loss": -27.26618003845215, "global_step": 634548, "epoch": 7645} {"train_loss": -27.501678466796875, "global_step": 634549, "epoch": 7645} {"train_loss": -27.61545753479004, "global_step": 634550, "epoch": 7645} {"train_loss": -27.6971378326416, "global_step": 634551, "epoch": 7645} {"train_loss": -27.85162353515625, "global_step": 634552, "epoch": 7645} {"train_loss": -27.862619400024414, "global_step": 634553, "epoch": 7645} {"train_loss": -27.616657257080078, "global_step": 634554, "epoch": 7645} {"train_loss": -27.992130279541016, "global_step": 634555, "epoch": 7645} {"train_loss": -27.489322662353516, "global_step": 634556, "epoch": 7645} {"train_loss": -27.806543350219727, "global_step": 634557, "epoch": 7645} {"train_loss": -27.81818199157715, "global_step": 634558, "epoch": 7645} {"train_loss": -27.886220932006836, "global_step": 634559, "epoch": 7645} {"train_loss": -27.76312255859375, "global_step": 634560, "epoch": 7645} {"train_loss": -28.078754425048828, "global_step": 634561, "epoch": 7645} {"train_loss": -27.87223243713379, "global_step": 634562, "epoch": 7645} {"train_loss": -28.282251358032227, "global_step": 634563, "epoch": 7645} {"train_loss": -27.994709014892578, "global_step": 634564, "epoch": 7645} {"train_loss": -28.004547119140625, "global_step": 634565, "epoch": 7645} {"train_loss": -28.00056266784668, "global_step": 634566, "epoch": 7645} {"train_loss": -27.981647491455078, "global_step": 634567, "epoch": 7645} {"train_loss": -28.045368194580078, "global_step": 634568, "epoch": 7645} {"train_loss": -27.967227935791016, "global_step": 634569, "epoch": 7645} {"train_loss": -28.512014389038086, "global_step": 634570, "epoch": 7645} {"train_loss": -28.160852432250977, "global_step": 634571, "epoch": 7645} {"train_loss": -28.388843536376953, "global_step": 634572, "epoch": 7645} {"train_loss": -28.017017364501953, "global_step": 634573, "epoch": 7645} {"train_loss": -28.068078994750977, "global_step": 634574, "epoch": 7645} {"train_loss": -28.515974044799805, "global_step": 634575, "epoch": 7645} {"train_loss": -28.21231460571289, "global_step": 634576, "epoch": 7645} {"train_loss": -28.30386734008789, "global_step": 634577, "epoch": 7645} {"train_loss": -28.236663818359375, "global_step": 634578, "epoch": 7645} {"train_loss": -28.178312301635742, "global_step": 634579, "epoch": 7645} {"train_loss": -28.219274520874023, "global_step": 634580, "epoch": 7645} {"train_loss": -28.40778160095215, "global_step": 634581, "epoch": 7645} {"train_loss": -28.320636749267578, "global_step": 634582, "epoch": 7645} {"train_loss": -28.434295654296875, "global_step": 634583, "epoch": 7645} {"train_loss": -28.45115089416504, "global_step": 634584, "epoch": 7645} {"train_loss": -28.554691314697266, "global_step": 634585, "epoch": 7645} {"train_loss": -28.40894889831543, "global_step": 634586, "epoch": 7645} {"train_loss": -28.2519474029541, "global_step": 634587, "epoch": 7645} {"train_loss": -28.386932373046875, "global_step": 634588, "epoch": 7645} {"train_loss": -28.48981285095215, "global_step": 634589, "epoch": 7645} {"train_loss": -28.12680435180664, "global_step": 634590, "epoch": 7645} {"train_loss": -28.65565299987793, "global_step": 634591, "epoch": 7645} {"train_loss": -28.527212142944336, "global_step": 634592, "epoch": 7645} {"train_loss": -28.58233642578125, "global_step": 634593, "epoch": 7645} {"train_loss": -28.604772567749023, "global_step": 634594, "epoch": 7645} {"train_loss": -28.96882438659668, "global_step": 634595, "epoch": 7645} {"train_loss": -28.45338249206543, "global_step": 634596, "epoch": 7645} {"train_loss": -28.58088493347168, "global_step": 634597, "epoch": 7645} {"train_loss": -28.535924911499023, "global_step": 634598, "epoch": 7645} {"train_loss": -28.4881649017334, "global_step": 634599, "epoch": 7645} {"train_loss": -28.202625274658203, "global_step": 634600, "epoch": 7645} {"train_loss": -28.304065704345703, "global_step": 634601, "epoch": 7645} {"train_loss": -28.04762077331543, "global_step": 634602, "epoch": 7645} {"train_loss": -27.960947036743164, "global_step": 634603, "epoch": 7645} {"train_loss": -27.679962158203125, "global_step": 634604, "epoch": 7645} {"train_loss": -27.9022216796875, "global_step": 634605, "epoch": 7645} {"train_loss": -28.299530029296875, "global_step": 634606, "epoch": 7645} {"train_loss": -27.702823638916016, "global_step": 634607, "epoch": 7645} {"train_loss": -27.6031494140625, "global_step": 634608, "epoch": 7645} {"train_loss": -27.883203506469727, "global_step": 634609, "epoch": 7645} {"train_loss": -27.876972198486328, "global_step": 634610, "epoch": 7645} {"train_loss": -27.86945152282715, "global_step": 634611, "epoch": 7645} {"train_loss": -28.242948532104492, "global_step": 634612, "epoch": 7645} {"train_loss": -27.982114791870117, "global_step": 634613, "epoch": 7645} {"train_loss": -28.2526912689209, "global_step": 634614, "epoch": 7645} {"train_loss": -28.23566246032715, "global_step": 634615, "epoch": 7645} {"train_loss": -27.7790584564209, "global_step": 634616, "epoch": 7645} {"train_loss": -27.95999584427799, "global_step": 634617, "epoch": 7645, "val_loss": 6843357.0} {"train_loss": -27.424118041992188, "global_step": 634618, "epoch": 7646} {"train_loss": -27.148223876953125, "global_step": 634619, "epoch": 7646} {"train_loss": -27.66947364807129, "global_step": 634620, "epoch": 7646} {"train_loss": -27.596765518188477, "global_step": 634621, "epoch": 7646} {"train_loss": -27.1120548248291, "global_step": 634622, "epoch": 7646} {"train_loss": -26.83942985534668, "global_step": 634623, "epoch": 7646} {"train_loss": -27.109045028686523, "global_step": 634624, "epoch": 7646} {"train_loss": -27.532562255859375, "global_step": 634625, "epoch": 7646} {"train_loss": -27.06583023071289, "global_step": 634626, "epoch": 7646} {"train_loss": -27.406818389892578, "global_step": 634627, "epoch": 7646} {"train_loss": -27.73589515686035, "global_step": 634628, "epoch": 7646} {"train_loss": -27.761829376220703, "global_step": 634629, "epoch": 7646} {"train_loss": -27.677350997924805, "global_step": 634630, "epoch": 7646} {"train_loss": -27.97200584411621, "global_step": 634631, "epoch": 7646} {"train_loss": -27.5922908782959, "global_step": 634632, "epoch": 7646} {"train_loss": -28.056608200073242, "global_step": 634633, "epoch": 7646} {"train_loss": -27.823657989501953, "global_step": 634634, "epoch": 7646} {"train_loss": -28.092809677124023, "global_step": 634635, "epoch": 7646} {"train_loss": -27.888288497924805, "global_step": 634636, "epoch": 7646} {"train_loss": -27.9462947845459, "global_step": 634637, "epoch": 7646} {"train_loss": -27.888410568237305, "global_step": 634638, "epoch": 7646} {"train_loss": -28.117385864257812, "global_step": 634639, "epoch": 7646} {"train_loss": -28.32642936706543, "global_step": 634640, "epoch": 7646} {"train_loss": -28.182281494140625, "global_step": 634641, "epoch": 7646} {"train_loss": -28.130590438842773, "global_step": 634642, "epoch": 7646} {"train_loss": -27.958337783813477, "global_step": 634643, "epoch": 7646} {"train_loss": -27.895288467407227, "global_step": 634644, "epoch": 7646} {"train_loss": -28.19684410095215, "global_step": 634645, "epoch": 7646} {"train_loss": -28.299890518188477, "global_step": 634646, "epoch": 7646} {"train_loss": -27.93117332458496, "global_step": 634647, "epoch": 7646} {"train_loss": -28.2303524017334, "global_step": 634648, "epoch": 7646} {"train_loss": -28.429126739501953, "global_step": 634649, "epoch": 7646} {"train_loss": -28.37529945373535, "global_step": 634650, "epoch": 7646} {"train_loss": -27.82600975036621, "global_step": 634651, "epoch": 7646} {"train_loss": -28.31464195251465, "global_step": 634652, "epoch": 7646} {"train_loss": -28.472492218017578, "global_step": 634653, "epoch": 7646} {"train_loss": -28.239826202392578, "global_step": 634654, "epoch": 7646} {"train_loss": -28.564809799194336, "global_step": 634655, "epoch": 7646} {"train_loss": -28.62741470336914, "global_step": 634656, "epoch": 7646} {"train_loss": -28.248706817626953, "global_step": 634657, "epoch": 7646} {"train_loss": -28.356786727905273, "global_step": 634658, "epoch": 7646} {"train_loss": -28.626789093017578, "global_step": 634659, "epoch": 7646} {"train_loss": -28.128217697143555, "global_step": 634660, "epoch": 7646} {"train_loss": -28.40386962890625, "global_step": 634661, "epoch": 7646} {"train_loss": -28.012287139892578, "global_step": 634662, "epoch": 7646} {"train_loss": -28.428375244140625, "global_step": 634663, "epoch": 7646} {"train_loss": -28.50019645690918, "global_step": 634664, "epoch": 7646} {"train_loss": -28.27559471130371, "global_step": 634665, "epoch": 7646} {"train_loss": -28.090850830078125, "global_step": 634666, "epoch": 7646} {"train_loss": -27.853076934814453, "global_step": 634667, "epoch": 7646} {"train_loss": -27.845172882080078, "global_step": 634668, "epoch": 7646} {"train_loss": -28.350271224975586, "global_step": 634669, "epoch": 7646} {"train_loss": -28.27019691467285, "global_step": 634670, "epoch": 7646} {"train_loss": -27.392337799072266, "global_step": 634671, "epoch": 7646} {"train_loss": -28.416797637939453, "global_step": 634672, "epoch": 7646} {"train_loss": -28.772119522094727, "global_step": 634673, "epoch": 7646} {"train_loss": -28.19410514831543, "global_step": 634674, "epoch": 7646} {"train_loss": -28.483325958251953, "global_step": 634675, "epoch": 7646} {"train_loss": -28.239337921142578, "global_step": 634676, "epoch": 7646} {"train_loss": -28.34417724609375, "global_step": 634677, "epoch": 7646} {"train_loss": -28.41804313659668, "global_step": 634678, "epoch": 7646} {"train_loss": -28.406702041625977, "global_step": 634679, "epoch": 7646} {"train_loss": -28.10493278503418, "global_step": 634680, "epoch": 7646} {"train_loss": -28.279829025268555, "global_step": 634681, "epoch": 7646} {"train_loss": -28.31867790222168, "global_step": 634682, "epoch": 7646} {"train_loss": -28.531951904296875, "global_step": 634683, "epoch": 7646} {"train_loss": -28.227136611938477, "global_step": 634684, "epoch": 7646} {"train_loss": -28.552814483642578, "global_step": 634685, "epoch": 7646} {"train_loss": -28.172529220581055, "global_step": 634686, "epoch": 7646} {"train_loss": -28.09954261779785, "global_step": 634687, "epoch": 7646} {"train_loss": -28.215368270874023, "global_step": 634688, "epoch": 7646} {"train_loss": -27.992521286010742, "global_step": 634689, "epoch": 7646} {"train_loss": -27.829273223876953, "global_step": 634690, "epoch": 7646} {"train_loss": -28.58517837524414, "global_step": 634691, "epoch": 7646} {"train_loss": -28.481740951538086, "global_step": 634692, "epoch": 7646} {"train_loss": -28.520883560180664, "global_step": 634693, "epoch": 7646} {"train_loss": -28.24091148376465, "global_step": 634694, "epoch": 7646} {"train_loss": -28.517248153686523, "global_step": 634695, "epoch": 7646} {"train_loss": -27.821674346923828, "global_step": 634696, "epoch": 7646} {"train_loss": -28.446035385131836, "global_step": 634697, "epoch": 7646} {"train_loss": -27.923254013061523, "global_step": 634698, "epoch": 7646} {"train_loss": -28.23182487487793, "global_step": 634699, "epoch": 7646} {"train_loss": -28.08275089493717, "global_step": 634700, "epoch": 7646, "val_loss": 6831223.0} {"train_loss": -27.48357582092285, "global_step": 634701, "epoch": 7647} {"train_loss": -26.927597045898438, "global_step": 634702, "epoch": 7647} {"train_loss": -27.43170738220215, "global_step": 634703, "epoch": 7647} {"train_loss": -26.76923179626465, "global_step": 634704, "epoch": 7647} {"train_loss": -27.4642333984375, "global_step": 634705, "epoch": 7647} {"train_loss": -27.23001480102539, "global_step": 634706, "epoch": 7647} {"train_loss": -27.5428524017334, "global_step": 634707, "epoch": 7647} {"train_loss": -27.523590087890625, "global_step": 634708, "epoch": 7647} {"train_loss": -26.945514678955078, "global_step": 634709, "epoch": 7647} {"train_loss": -27.709436416625977, "global_step": 634710, "epoch": 7647} {"train_loss": -27.260889053344727, "global_step": 634711, "epoch": 7647} {"train_loss": -27.8830509185791, "global_step": 634712, "epoch": 7647} {"train_loss": -27.40679931640625, "global_step": 634713, "epoch": 7647} {"train_loss": -27.6066951751709, "global_step": 634714, "epoch": 7647} {"train_loss": -27.874738693237305, "global_step": 634715, "epoch": 7647} {"train_loss": -27.516874313354492, "global_step": 634716, "epoch": 7647} {"train_loss": -27.575727462768555, "global_step": 634717, "epoch": 7647} {"train_loss": -28.031524658203125, "global_step": 634718, "epoch": 7647} {"train_loss": -27.34515953063965, "global_step": 634719, "epoch": 7647} {"train_loss": -27.76041603088379, "global_step": 634720, "epoch": 7647} {"train_loss": -27.868860244750977, "global_step": 634721, "epoch": 7647} {"train_loss": -27.614622116088867, "global_step": 634722, "epoch": 7647} {"train_loss": -27.784381866455078, "global_step": 634723, "epoch": 7647} {"train_loss": -27.80836296081543, "global_step": 634724, "epoch": 7647} {"train_loss": -28.1296329498291, "global_step": 634725, "epoch": 7647} {"train_loss": -27.67158317565918, "global_step": 634726, "epoch": 7647} {"train_loss": -28.154691696166992, "global_step": 634727, "epoch": 7647} {"train_loss": -28.075841903686523, "global_step": 634728, "epoch": 7647} {"train_loss": -28.176074981689453, "global_step": 634729, "epoch": 7647} {"train_loss": -28.1387882232666, "global_step": 634730, "epoch": 7647} {"train_loss": -27.973852157592773, "global_step": 634731, "epoch": 7647} {"train_loss": -28.37027359008789, "global_step": 634732, "epoch": 7647} {"train_loss": -28.097015380859375, "global_step": 634733, "epoch": 7647} {"train_loss": -28.197895050048828, "global_step": 634734, "epoch": 7647} {"train_loss": -28.16455078125, "global_step": 634735, "epoch": 7647} {"train_loss": -28.55537223815918, "global_step": 634736, "epoch": 7647} {"train_loss": -28.157835006713867, "global_step": 634737, "epoch": 7647} {"train_loss": -28.181900024414062, "global_step": 634738, "epoch": 7647} {"train_loss": -27.933029174804688, "global_step": 634739, "epoch": 7647} {"train_loss": -28.520193099975586, "global_step": 634740, "epoch": 7647} {"train_loss": -28.035757064819336, "global_step": 634741, "epoch": 7647} {"train_loss": -28.841955184936523, "global_step": 634742, "epoch": 7647} {"train_loss": -28.176633834838867, "global_step": 634743, "epoch": 7647} {"train_loss": -28.11530113220215, "global_step": 634744, "epoch": 7647} {"train_loss": -28.565534591674805, "global_step": 634745, "epoch": 7647} {"train_loss": -28.336994171142578, "global_step": 634746, "epoch": 7647} {"train_loss": -28.141263961791992, "global_step": 634747, "epoch": 7647} {"train_loss": -28.33359146118164, "global_step": 634748, "epoch": 7647} {"train_loss": -28.755029678344727, "global_step": 634749, "epoch": 7647} {"train_loss": -28.697370529174805, "global_step": 634750, "epoch": 7647} {"train_loss": -28.283212661743164, "global_step": 634751, "epoch": 7647} {"train_loss": -28.421865463256836, "global_step": 634752, "epoch": 7647} {"train_loss": -28.369709014892578, "global_step": 634753, "epoch": 7647} {"train_loss": -28.2995662689209, "global_step": 634754, "epoch": 7647} {"train_loss": -28.422677993774414, "global_step": 634755, "epoch": 7647} {"train_loss": -28.793338775634766, "global_step": 634756, "epoch": 7647} {"train_loss": -28.466527938842773, "global_step": 634757, "epoch": 7647} {"train_loss": -28.62409019470215, "global_step": 634758, "epoch": 7647} {"train_loss": -28.857685089111328, "global_step": 634759, "epoch": 7647} {"train_loss": -28.385883331298828, "global_step": 634760, "epoch": 7647} {"train_loss": -28.463342666625977, "global_step": 634761, "epoch": 7647} {"train_loss": -28.326154708862305, "global_step": 634762, "epoch": 7647} {"train_loss": -28.300464630126953, "global_step": 634763, "epoch": 7647} {"train_loss": -27.717214584350586, "global_step": 634764, "epoch": 7647} {"train_loss": -27.4822998046875, "global_step": 634765, "epoch": 7647} {"train_loss": -28.08376121520996, "global_step": 634766, "epoch": 7647} {"train_loss": -28.408857345581055, "global_step": 634767, "epoch": 7647} {"train_loss": -28.21295738220215, "global_step": 634768, "epoch": 7647} {"train_loss": -28.346277236938477, "global_step": 634769, "epoch": 7647} {"train_loss": -28.571613311767578, "global_step": 634770, "epoch": 7647} {"train_loss": -28.23948097229004, "global_step": 634771, "epoch": 7647} {"train_loss": -28.098779678344727, "global_step": 634772, "epoch": 7647} {"train_loss": -27.56839942932129, "global_step": 634773, "epoch": 7647} {"train_loss": -27.596166610717773, "global_step": 634774, "epoch": 7647} {"train_loss": -26.90472412109375, "global_step": 634775, "epoch": 7647} {"train_loss": -27.6867733001709, "global_step": 634776, "epoch": 7647} {"train_loss": -28.074262619018555, "global_step": 634777, "epoch": 7647} {"train_loss": -27.727222442626953, "global_step": 634778, "epoch": 7647} {"train_loss": -27.790258407592773, "global_step": 634779, "epoch": 7647} {"train_loss": -27.8398494720459, "global_step": 634780, "epoch": 7647} {"train_loss": -27.73652458190918, "global_step": 634781, "epoch": 7647} {"train_loss": -27.86197853088379, "global_step": 634782, "epoch": 7647} {"train_loss": -27.967926025390625, "global_step": 634783, "epoch": 7647, "val_loss": 6820903.5} {"train_loss": -27.115509033203125, "global_step": 634784, "epoch": 7648} {"train_loss": -25.664682388305664, "global_step": 634785, "epoch": 7648} {"train_loss": -25.410797119140625, "global_step": 634786, "epoch": 7648} {"train_loss": -26.67194175720215, "global_step": 634787, "epoch": 7648} {"train_loss": -26.583425521850586, "global_step": 634788, "epoch": 7648} {"train_loss": -26.442712783813477, "global_step": 634789, "epoch": 7648} {"train_loss": -27.21632194519043, "global_step": 634790, "epoch": 7648} {"train_loss": -27.264307022094727, "global_step": 634791, "epoch": 7648} {"train_loss": -27.094364166259766, "global_step": 634792, "epoch": 7648} {"train_loss": -26.972089767456055, "global_step": 634793, "epoch": 7648} {"train_loss": -27.21146583557129, "global_step": 634794, "epoch": 7648} {"train_loss": -26.853357315063477, "global_step": 634795, "epoch": 7648} {"train_loss": -27.277423858642578, "global_step": 634796, "epoch": 7648} {"train_loss": -27.14349937438965, "global_step": 634797, "epoch": 7648} {"train_loss": -25.93283462524414, "global_step": 634798, "epoch": 7648} {"train_loss": -27.693653106689453, "global_step": 634799, "epoch": 7648} {"train_loss": -27.397375106811523, "global_step": 634800, "epoch": 7648} {"train_loss": -27.563871383666992, "global_step": 634801, "epoch": 7648} {"train_loss": -27.59177589416504, "global_step": 634802, "epoch": 7648} {"train_loss": -27.574697494506836, "global_step": 634803, "epoch": 7648} {"train_loss": -27.506391525268555, "global_step": 634804, "epoch": 7648} {"train_loss": -27.332456588745117, "global_step": 634805, "epoch": 7648} {"train_loss": -27.37835693359375, "global_step": 634806, "epoch": 7648} {"train_loss": -27.67877769470215, "global_step": 634807, "epoch": 7648} {"train_loss": -27.6007137298584, "global_step": 634808, "epoch": 7648} {"train_loss": -27.79241371154785, "global_step": 634809, "epoch": 7648} {"train_loss": -27.3402156829834, "global_step": 634810, "epoch": 7648} {"train_loss": -27.52131462097168, "global_step": 634811, "epoch": 7648} {"train_loss": -27.755237579345703, "global_step": 634812, "epoch": 7648} {"train_loss": -27.75459098815918, "global_step": 634813, "epoch": 7648} {"train_loss": -27.9754581451416, "global_step": 634814, "epoch": 7648} {"train_loss": -27.6661434173584, "global_step": 634815, "epoch": 7648} {"train_loss": -28.206043243408203, "global_step": 634816, "epoch": 7648} {"train_loss": -27.669574737548828, "global_step": 634817, "epoch": 7648} {"train_loss": -28.006982803344727, "global_step": 634818, "epoch": 7648} {"train_loss": -28.117919921875, "global_step": 634819, "epoch": 7648} {"train_loss": -28.272306442260742, "global_step": 634820, "epoch": 7648} {"train_loss": -28.13836097717285, "global_step": 634821, "epoch": 7648} {"train_loss": -27.853544235229492, "global_step": 634822, "epoch": 7648} {"train_loss": -28.241159439086914, "global_step": 634823, "epoch": 7648} {"train_loss": -28.02033042907715, "global_step": 634824, "epoch": 7648} {"train_loss": -28.065134048461914, "global_step": 634825, "epoch": 7648} {"train_loss": -28.112207412719727, "global_step": 634826, "epoch": 7648} {"train_loss": -28.056140899658203, "global_step": 634827, "epoch": 7648} {"train_loss": -28.000864028930664, "global_step": 634828, "epoch": 7648} {"train_loss": -28.623779296875, "global_step": 634829, "epoch": 7648} {"train_loss": -28.398059844970703, "global_step": 634830, "epoch": 7648} {"train_loss": -28.537973403930664, "global_step": 634831, "epoch": 7648} {"train_loss": -28.385541915893555, "global_step": 634832, "epoch": 7648} {"train_loss": -28.089563369750977, "global_step": 634833, "epoch": 7648} {"train_loss": -28.350732803344727, "global_step": 634834, "epoch": 7648} {"train_loss": -28.2238712310791, "global_step": 634835, "epoch": 7648} {"train_loss": -28.268329620361328, "global_step": 634836, "epoch": 7648} {"train_loss": -28.540197372436523, "global_step": 634837, "epoch": 7648} {"train_loss": -28.199005126953125, "global_step": 634838, "epoch": 7648} {"train_loss": -28.223230361938477, "global_step": 634839, "epoch": 7648} {"train_loss": -28.278827667236328, "global_step": 634840, "epoch": 7648} {"train_loss": -27.92933464050293, "global_step": 634841, "epoch": 7648} {"train_loss": -28.301025390625, "global_step": 634842, "epoch": 7648} {"train_loss": -28.064971923828125, "global_step": 634843, "epoch": 7648} {"train_loss": -28.43851661682129, "global_step": 634844, "epoch": 7648} {"train_loss": -28.344131469726562, "global_step": 634845, "epoch": 7648} {"train_loss": -28.1890926361084, "global_step": 634846, "epoch": 7648} {"train_loss": -28.300764083862305, "global_step": 634847, "epoch": 7648} {"train_loss": -28.313241958618164, "global_step": 634848, "epoch": 7648} {"train_loss": -28.42237663269043, "global_step": 634849, "epoch": 7648} {"train_loss": -28.281085968017578, "global_step": 634850, "epoch": 7648} {"train_loss": -28.032245635986328, "global_step": 634851, "epoch": 7648} {"train_loss": -28.23197364807129, "global_step": 634852, "epoch": 7648} {"train_loss": -27.888662338256836, "global_step": 634853, "epoch": 7648} {"train_loss": -28.001087188720703, "global_step": 634854, "epoch": 7648} {"train_loss": -27.993982315063477, "global_step": 634855, "epoch": 7648} {"train_loss": -28.43121910095215, "global_step": 634856, "epoch": 7648} {"train_loss": -28.109100341796875, "global_step": 634857, "epoch": 7648} {"train_loss": -28.144153594970703, "global_step": 634858, "epoch": 7648} {"train_loss": -28.443191528320312, "global_step": 634859, "epoch": 7648} {"train_loss": -28.297956466674805, "global_step": 634860, "epoch": 7648} {"train_loss": -27.895709991455078, "global_step": 634861, "epoch": 7648} {"train_loss": -27.9840145111084, "global_step": 634862, "epoch": 7648} {"train_loss": -28.28681755065918, "global_step": 634863, "epoch": 7648} {"train_loss": -28.27765464782715, "global_step": 634864, "epoch": 7648} {"train_loss": -28.587860107421875, "global_step": 634865, "epoch": 7648} {"train_loss": -27.795583816896002, "global_step": 634866, "epoch": 7648, "val_loss": 6830359.0} {"train_loss": -27.660400390625, "global_step": 634867, "epoch": 7649} {"train_loss": -27.71040153503418, "global_step": 634868, "epoch": 7649} {"train_loss": -28.008686065673828, "global_step": 634869, "epoch": 7649} {"train_loss": -28.027435302734375, "global_step": 634870, "epoch": 7649} {"train_loss": -27.660810470581055, "global_step": 634871, "epoch": 7649} {"train_loss": -27.380416870117188, "global_step": 634872, "epoch": 7649} {"train_loss": -28.10625648498535, "global_step": 634873, "epoch": 7649} {"train_loss": -27.694961547851562, "global_step": 634874, "epoch": 7649} {"train_loss": -27.957386016845703, "global_step": 634875, "epoch": 7649} {"train_loss": -28.248456954956055, "global_step": 634876, "epoch": 7649} {"train_loss": -28.202392578125, "global_step": 634877, "epoch": 7649} {"train_loss": -27.935028076171875, "global_step": 634878, "epoch": 7649} {"train_loss": -28.27308464050293, "global_step": 634879, "epoch": 7649} {"train_loss": -27.852514266967773, "global_step": 634880, "epoch": 7649} {"train_loss": -28.317487716674805, "global_step": 634881, "epoch": 7649} {"train_loss": -28.149524688720703, "global_step": 634882, "epoch": 7649} {"train_loss": -27.82366371154785, "global_step": 634883, "epoch": 7649} {"train_loss": -28.135740280151367, "global_step": 634884, "epoch": 7649} {"train_loss": -28.502546310424805, "global_step": 634885, "epoch": 7649} {"train_loss": -28.3654727935791, "global_step": 634886, "epoch": 7649} {"train_loss": -28.205596923828125, "global_step": 634887, "epoch": 7649} {"train_loss": -28.064130783081055, "global_step": 634888, "epoch": 7649} {"train_loss": -28.280683517456055, "global_step": 634889, "epoch": 7649} {"train_loss": -28.558591842651367, "global_step": 634890, "epoch": 7649} {"train_loss": -27.953947067260742, "global_step": 634891, "epoch": 7649} {"train_loss": -28.5220947265625, "global_step": 634892, "epoch": 7649} {"train_loss": -28.36836051940918, "global_step": 634893, "epoch": 7649} {"train_loss": -28.027332305908203, "global_step": 634894, "epoch": 7649} {"train_loss": -28.19748878479004, "global_step": 634895, "epoch": 7649} {"train_loss": -28.625198364257812, "global_step": 634896, "epoch": 7649} {"train_loss": -28.0804386138916, "global_step": 634897, "epoch": 7649} {"train_loss": -28.28435707092285, "global_step": 634898, "epoch": 7649} {"train_loss": -28.435266494750977, "global_step": 634899, "epoch": 7649} {"train_loss": -28.21550941467285, "global_step": 634900, "epoch": 7649} {"train_loss": -27.850006103515625, "global_step": 634901, "epoch": 7649} {"train_loss": -28.38701820373535, "global_step": 634902, "epoch": 7649} {"train_loss": -28.359848022460938, "global_step": 634903, "epoch": 7649} {"train_loss": -27.993576049804688, "global_step": 634904, "epoch": 7649} {"train_loss": -28.186676025390625, "global_step": 634905, "epoch": 7649} {"train_loss": -28.053485870361328, "global_step": 634906, "epoch": 7649} {"train_loss": -27.932031631469727, "global_step": 634907, "epoch": 7649} {"train_loss": -27.725982666015625, "global_step": 634908, "epoch": 7649} {"train_loss": -27.706571578979492, "global_step": 634909, "epoch": 7649} {"train_loss": -27.48648452758789, "global_step": 634910, "epoch": 7649} {"train_loss": -28.351301193237305, "global_step": 634911, "epoch": 7649} {"train_loss": -27.700952529907227, "global_step": 634912, "epoch": 7649} {"train_loss": -27.537097930908203, "global_step": 634913, "epoch": 7649} {"train_loss": -28.21503257751465, "global_step": 634914, "epoch": 7649} {"train_loss": -27.228723526000977, "global_step": 634915, "epoch": 7649} {"train_loss": -27.70094871520996, "global_step": 634916, "epoch": 7649} {"train_loss": -27.798734664916992, "global_step": 634917, "epoch": 7649} {"train_loss": -27.557483673095703, "global_step": 634918, "epoch": 7649} {"train_loss": -28.045703887939453, "global_step": 634919, "epoch": 7649} {"train_loss": -27.669416427612305, "global_step": 634920, "epoch": 7649} {"train_loss": -28.121906280517578, "global_step": 634921, "epoch": 7649} {"train_loss": -27.957935333251953, "global_step": 634922, "epoch": 7649} {"train_loss": -27.957494735717773, "global_step": 634923, "epoch": 7649} {"train_loss": -28.04047966003418, "global_step": 634924, "epoch": 7649} {"train_loss": -28.104825973510742, "global_step": 634925, "epoch": 7649} {"train_loss": -28.052637100219727, "global_step": 634926, "epoch": 7649} {"train_loss": -27.967529296875, "global_step": 634927, "epoch": 7649} {"train_loss": -28.23627281188965, "global_step": 634928, "epoch": 7649} {"train_loss": -28.291166305541992, "global_step": 634929, "epoch": 7649} {"train_loss": -28.319761276245117, "global_step": 634930, "epoch": 7649} {"train_loss": -28.15771484375, "global_step": 634931, "epoch": 7649} {"train_loss": -27.8657169342041, "global_step": 634932, "epoch": 7649} {"train_loss": -28.268728256225586, "global_step": 634933, "epoch": 7649} {"train_loss": -28.296152114868164, "global_step": 634934, "epoch": 7649} {"train_loss": -28.472614288330078, "global_step": 634935, "epoch": 7649} {"train_loss": -28.295108795166016, "global_step": 634936, "epoch": 7649} {"train_loss": -28.80838394165039, "global_step": 634937, "epoch": 7649} {"train_loss": -28.19403076171875, "global_step": 634938, "epoch": 7649} {"train_loss": -27.825613021850586, "global_step": 634939, "epoch": 7649} {"train_loss": -28.420679092407227, "global_step": 634940, "epoch": 7649} {"train_loss": -27.9554386138916, "global_step": 634941, "epoch": 7649} {"train_loss": -28.4462833404541, "global_step": 634942, "epoch": 7649} {"train_loss": -28.119836807250977, "global_step": 634943, "epoch": 7649} {"train_loss": -28.26189613342285, "global_step": 634944, "epoch": 7649} {"train_loss": -28.436237335205078, "global_step": 634945, "epoch": 7649} {"train_loss": -28.202716827392578, "global_step": 634946, "epoch": 7649} {"train_loss": -27.878402709960938, "global_step": 634947, "epoch": 7649} {"train_loss": -28.226730346679688, "global_step": 634948, "epoch": 7649} {"train_loss": -28.074723507984576, "global_step": 634949, "epoch": 7649, "val_loss": 6743543.0} {"train_loss": -27.417301177978516, "global_step": 634950, "epoch": 7650} {"train_loss": -26.6358699798584, "global_step": 634951, "epoch": 7650} {"train_loss": -23.549468994140625, "global_step": 634952, "epoch": 7650} {"train_loss": -20.1250057220459, "global_step": 634953, "epoch": 7650} {"train_loss": -25.738672256469727, "global_step": 634954, "epoch": 7650} {"train_loss": -25.6517333984375, "global_step": 634955, "epoch": 7650} {"train_loss": -26.702606201171875, "global_step": 634956, "epoch": 7650} {"train_loss": -26.352441787719727, "global_step": 634957, "epoch": 7650} {"train_loss": -26.82185173034668, "global_step": 634958, "epoch": 7650} {"train_loss": -26.853612899780273, "global_step": 634959, "epoch": 7650} {"train_loss": -26.446508407592773, "global_step": 634960, "epoch": 7650} {"train_loss": -27.174009323120117, "global_step": 634961, "epoch": 7650} {"train_loss": -27.15653419494629, "global_step": 634962, "epoch": 7650} {"train_loss": -27.176803588867188, "global_step": 634963, "epoch": 7650} {"train_loss": -26.91938591003418, "global_step": 634964, "epoch": 7650} {"train_loss": -27.675031661987305, "global_step": 634965, "epoch": 7650} {"train_loss": -27.62095069885254, "global_step": 634966, "epoch": 7650} {"train_loss": -27.428028106689453, "global_step": 634967, "epoch": 7650} {"train_loss": -27.325977325439453, "global_step": 634968, "epoch": 7650} {"train_loss": -27.473661422729492, "global_step": 634969, "epoch": 7650} {"train_loss": -26.952075958251953, "global_step": 634970, "epoch": 7650} {"train_loss": -27.276824951171875, "global_step": 634971, "epoch": 7650} {"train_loss": -27.451080322265625, "global_step": 634972, "epoch": 7650} {"train_loss": -27.2670955657959, "global_step": 634973, "epoch": 7650} {"train_loss": -27.6854190826416, "global_step": 634974, "epoch": 7650} {"train_loss": -27.457117080688477, "global_step": 634975, "epoch": 7650} {"train_loss": -27.74128532409668, "global_step": 634976, "epoch": 7650} {"train_loss": -27.61517906188965, "global_step": 634977, "epoch": 7650} {"train_loss": -27.56671714782715, "global_step": 634978, "epoch": 7650} {"train_loss": -27.572473526000977, "global_step": 634979, "epoch": 7650} {"train_loss": -27.811384201049805, "global_step": 634980, "epoch": 7650} {"train_loss": -27.834264755249023, "global_step": 634981, "epoch": 7650} {"train_loss": -28.003110885620117, "global_step": 634982, "epoch": 7650} {"train_loss": -27.783842086791992, "global_step": 634983, "epoch": 7650} {"train_loss": -27.794397354125977, "global_step": 634984, "epoch": 7650} {"train_loss": -27.686445236206055, "global_step": 634985, "epoch": 7650} {"train_loss": -27.714221954345703, "global_step": 634986, "epoch": 7650} {"train_loss": -27.977392196655273, "global_step": 634987, "epoch": 7650} {"train_loss": -27.715351104736328, "global_step": 634988, "epoch": 7650} {"train_loss": -27.7961483001709, "global_step": 634989, "epoch": 7650} {"train_loss": -27.70954704284668, "global_step": 634990, "epoch": 7650} {"train_loss": -27.677976608276367, "global_step": 634991, "epoch": 7650} {"train_loss": -27.773706436157227, "global_step": 634992, "epoch": 7650} {"train_loss": -27.63385009765625, "global_step": 634993, "epoch": 7650} {"train_loss": -27.9180850982666, "global_step": 634994, "epoch": 7650} {"train_loss": -27.648656845092773, "global_step": 634995, "epoch": 7650} {"train_loss": -28.092763900756836, "global_step": 634996, "epoch": 7650} {"train_loss": -28.40406608581543, "global_step": 634997, "epoch": 7650} {"train_loss": -27.8973445892334, "global_step": 634998, "epoch": 7650} {"train_loss": -28.162015914916992, "global_step": 634999, "epoch": 7650} {"train_loss": -27.99651527404785, "global_step": 635000, "epoch": 7650} {"train_loss": -28.08108901977539, "global_step": 635001, "epoch": 7650} {"train_loss": -27.929412841796875, "global_step": 635002, "epoch": 7650} {"train_loss": -27.962955474853516, "global_step": 635003, "epoch": 7650} {"train_loss": -28.26099967956543, "global_step": 635004, "epoch": 7650} {"train_loss": -28.174213409423828, "global_step": 635005, "epoch": 7650} {"train_loss": -28.243078231811523, "global_step": 635006, "epoch": 7650} {"train_loss": -28.068403244018555, "global_step": 635007, "epoch": 7650} {"train_loss": -27.946805953979492, "global_step": 635008, "epoch": 7650} {"train_loss": -28.142675399780273, "global_step": 635009, "epoch": 7650} {"train_loss": -28.008283615112305, "global_step": 635010, "epoch": 7650} {"train_loss": -28.3527889251709, "global_step": 635011, "epoch": 7650} {"train_loss": -28.127395629882812, "global_step": 635012, "epoch": 7650} {"train_loss": -28.218252182006836, "global_step": 635013, "epoch": 7650} {"train_loss": -28.29059410095215, "global_step": 635014, "epoch": 7650} {"train_loss": -28.372589111328125, "global_step": 635015, "epoch": 7650} {"train_loss": -28.299560546875, "global_step": 635016, "epoch": 7650} {"train_loss": -27.972640991210938, "global_step": 635017, "epoch": 7650} {"train_loss": -28.417362213134766, "global_step": 635018, "epoch": 7650} {"train_loss": -28.528799057006836, "global_step": 635019, "epoch": 7650} {"train_loss": -28.302234649658203, "global_step": 635020, "epoch": 7650} {"train_loss": -28.12717056274414, "global_step": 635021, "epoch": 7650} {"train_loss": -28.0717830657959, "global_step": 635022, "epoch": 7650} {"train_loss": -28.15822410583496, "global_step": 635023, "epoch": 7650} {"train_loss": -27.752241134643555, "global_step": 635024, "epoch": 7650} {"train_loss": -28.346271514892578, "global_step": 635025, "epoch": 7650} {"train_loss": -28.075057983398438, "global_step": 635026, "epoch": 7650} {"train_loss": -28.123090744018555, "global_step": 635027, "epoch": 7650} {"train_loss": -28.283063888549805, "global_step": 635028, "epoch": 7650} {"train_loss": -28.162900924682617, "global_step": 635029, "epoch": 7650} {"train_loss": -28.041290283203125, "global_step": 635030, "epoch": 7650} {"train_loss": -27.967823028564453, "global_step": 635031, "epoch": 7650} {"train_loss": -27.58272979920169, "global_step": 635032, "epoch": 7650, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6663558.5} {"train_loss": -27.30499267578125, "global_step": 635033, "epoch": 7651} {"train_loss": -26.135473251342773, "global_step": 635034, "epoch": 7651} {"train_loss": -26.726465225219727, "global_step": 635035, "epoch": 7651} {"train_loss": -27.119226455688477, "global_step": 635036, "epoch": 7651} {"train_loss": -26.323837280273438, "global_step": 635037, "epoch": 7651} {"train_loss": -27.380033493041992, "global_step": 635038, "epoch": 7651} {"train_loss": -26.925024032592773, "global_step": 635039, "epoch": 7651} {"train_loss": -27.601703643798828, "global_step": 635040, "epoch": 7651} {"train_loss": -27.339111328125, "global_step": 635041, "epoch": 7651} {"train_loss": -27.46613883972168, "global_step": 635042, "epoch": 7651} {"train_loss": -27.637800216674805, "global_step": 635043, "epoch": 7651} {"train_loss": -27.338483810424805, "global_step": 635044, "epoch": 7651} {"train_loss": -27.53205680847168, "global_step": 635045, "epoch": 7651} {"train_loss": -27.594894409179688, "global_step": 635046, "epoch": 7651} {"train_loss": -27.75294303894043, "global_step": 635047, "epoch": 7651} {"train_loss": -27.777761459350586, "global_step": 635048, "epoch": 7651} {"train_loss": -27.804895401000977, "global_step": 635049, "epoch": 7651} {"train_loss": -27.378793716430664, "global_step": 635050, "epoch": 7651} {"train_loss": -27.928741455078125, "global_step": 635051, "epoch": 7651} {"train_loss": -27.968088150024414, "global_step": 635052, "epoch": 7651} {"train_loss": -27.832117080688477, "global_step": 635053, "epoch": 7651} {"train_loss": -27.933835983276367, "global_step": 635054, "epoch": 7651} {"train_loss": -27.9509334564209, "global_step": 635055, "epoch": 7651} {"train_loss": -27.779773712158203, "global_step": 635056, "epoch": 7651} {"train_loss": -28.207300186157227, "global_step": 635057, "epoch": 7651} {"train_loss": -27.998571395874023, "global_step": 635058, "epoch": 7651} {"train_loss": -27.859607696533203, "global_step": 635059, "epoch": 7651} {"train_loss": -28.193273544311523, "global_step": 635060, "epoch": 7651} {"train_loss": -28.015233993530273, "global_step": 635061, "epoch": 7651} {"train_loss": -28.416519165039062, "global_step": 635062, "epoch": 7651} {"train_loss": -27.977445602416992, "global_step": 635063, "epoch": 7651} {"train_loss": -27.834890365600586, "global_step": 635064, "epoch": 7651} {"train_loss": -27.933673858642578, "global_step": 635065, "epoch": 7651} {"train_loss": -28.16951560974121, "global_step": 635066, "epoch": 7651} {"train_loss": -28.48561668395996, "global_step": 635067, "epoch": 7651} {"train_loss": -28.40984535217285, "global_step": 635068, "epoch": 7651} {"train_loss": -28.076841354370117, "global_step": 635069, "epoch": 7651} {"train_loss": -28.04920768737793, "global_step": 635070, "epoch": 7651} {"train_loss": -28.57767105102539, "global_step": 635071, "epoch": 7651} {"train_loss": -28.13922119140625, "global_step": 635072, "epoch": 7651} {"train_loss": -28.17523765563965, "global_step": 635073, "epoch": 7651} {"train_loss": -28.301223754882812, "global_step": 635074, "epoch": 7651} {"train_loss": -28.369428634643555, "global_step": 635075, "epoch": 7651} {"train_loss": -27.852453231811523, "global_step": 635076, "epoch": 7651} {"train_loss": -28.392736434936523, "global_step": 635077, "epoch": 7651} {"train_loss": -28.577539443969727, "global_step": 635078, "epoch": 7651} {"train_loss": -28.062402725219727, "global_step": 635079, "epoch": 7651} {"train_loss": -28.699493408203125, "global_step": 635080, "epoch": 7651} {"train_loss": -28.16512107849121, "global_step": 635081, "epoch": 7651} {"train_loss": -27.769134521484375, "global_step": 635082, "epoch": 7651} {"train_loss": -28.395856857299805, "global_step": 635083, "epoch": 7651} {"train_loss": -28.516843795776367, "global_step": 635084, "epoch": 7651} {"train_loss": -28.26253318786621, "global_step": 635085, "epoch": 7651} {"train_loss": -28.660688400268555, "global_step": 635086, "epoch": 7651} {"train_loss": -28.510055541992188, "global_step": 635087, "epoch": 7651} {"train_loss": -28.302526473999023, "global_step": 635088, "epoch": 7651} {"train_loss": -28.22389793395996, "global_step": 635089, "epoch": 7651} {"train_loss": -28.505475997924805, "global_step": 635090, "epoch": 7651} {"train_loss": -28.43525505065918, "global_step": 635091, "epoch": 7651} {"train_loss": -28.686994552612305, "global_step": 635092, "epoch": 7651} {"train_loss": -28.3135986328125, "global_step": 635093, "epoch": 7651} {"train_loss": -28.54583168029785, "global_step": 635094, "epoch": 7651} {"train_loss": -28.556659698486328, "global_step": 635095, "epoch": 7651} {"train_loss": -28.620100021362305, "global_step": 635096, "epoch": 7651} {"train_loss": -28.55722999572754, "global_step": 635097, "epoch": 7651} {"train_loss": -28.025360107421875, "global_step": 635098, "epoch": 7651} {"train_loss": -28.103422164916992, "global_step": 635099, "epoch": 7651} {"train_loss": -27.385324478149414, "global_step": 635100, "epoch": 7651} {"train_loss": -28.33173179626465, "global_step": 635101, "epoch": 7651} {"train_loss": -27.900959014892578, "global_step": 635102, "epoch": 7651} {"train_loss": -28.19817543029785, "global_step": 635103, "epoch": 7651} {"train_loss": -28.260272979736328, "global_step": 635104, "epoch": 7651} {"train_loss": -28.099597930908203, "global_step": 635105, "epoch": 7651} {"train_loss": -28.160924911499023, "global_step": 635106, "epoch": 7651} {"train_loss": -28.192764282226562, "global_step": 635107, "epoch": 7651} {"train_loss": -28.16135597229004, "global_step": 635108, "epoch": 7651} {"train_loss": -28.545331954956055, "global_step": 635109, "epoch": 7651} {"train_loss": -28.257471084594727, "global_step": 635110, "epoch": 7651} {"train_loss": -28.296051025390625, "global_step": 635111, "epoch": 7651} {"train_loss": -28.107019424438477, "global_step": 635112, "epoch": 7651} {"train_loss": -28.60468864440918, "global_step": 635113, "epoch": 7651} {"train_loss": -27.870162963867188, "global_step": 635114, "epoch": 7651} {"train_loss": -28.004216826105694, "global_step": 635115, "epoch": 7651, "val_loss": 6734493.0} {"train_loss": -27.86714744567871, "global_step": 635116, "epoch": 7652} {"train_loss": -27.593891143798828, "global_step": 635117, "epoch": 7652} {"train_loss": -27.450607299804688, "global_step": 635118, "epoch": 7652} {"train_loss": -27.327146530151367, "global_step": 635119, "epoch": 7652} {"train_loss": -27.648330688476562, "global_step": 635120, "epoch": 7652} {"train_loss": -27.415578842163086, "global_step": 635121, "epoch": 7652} {"train_loss": -27.11820411682129, "global_step": 635122, "epoch": 7652} {"train_loss": -27.312902450561523, "global_step": 635123, "epoch": 7652} {"train_loss": -27.820816040039062, "global_step": 635124, "epoch": 7652} {"train_loss": -27.426822662353516, "global_step": 635125, "epoch": 7652} {"train_loss": -27.302234649658203, "global_step": 635126, "epoch": 7652} {"train_loss": -27.672046661376953, "global_step": 635127, "epoch": 7652} {"train_loss": -27.629505157470703, "global_step": 635128, "epoch": 7652} {"train_loss": -28.14760398864746, "global_step": 635129, "epoch": 7652} {"train_loss": -28.034101486206055, "global_step": 635130, "epoch": 7652} {"train_loss": -28.067218780517578, "global_step": 635131, "epoch": 7652} {"train_loss": -28.085477828979492, "global_step": 635132, "epoch": 7652} {"train_loss": -27.728025436401367, "global_step": 635133, "epoch": 7652} {"train_loss": -27.866918563842773, "global_step": 635134, "epoch": 7652} {"train_loss": -27.974817276000977, "global_step": 635135, "epoch": 7652} {"train_loss": -27.71626091003418, "global_step": 635136, "epoch": 7652} {"train_loss": -27.753253936767578, "global_step": 635137, "epoch": 7652} {"train_loss": -27.872928619384766, "global_step": 635138, "epoch": 7652} {"train_loss": -28.065988540649414, "global_step": 635139, "epoch": 7652} {"train_loss": -28.122400283813477, "global_step": 635140, "epoch": 7652} {"train_loss": -27.823230743408203, "global_step": 635141, "epoch": 7652} {"train_loss": -28.277570724487305, "global_step": 635142, "epoch": 7652} {"train_loss": -28.456226348876953, "global_step": 635143, "epoch": 7652} {"train_loss": -28.397720336914062, "global_step": 635144, "epoch": 7652} {"train_loss": -27.886960983276367, "global_step": 635145, "epoch": 7652} {"train_loss": -28.43599510192871, "global_step": 635146, "epoch": 7652} {"train_loss": -28.119123458862305, "global_step": 635147, "epoch": 7652} {"train_loss": -28.314624786376953, "global_step": 635148, "epoch": 7652} {"train_loss": -28.55535888671875, "global_step": 635149, "epoch": 7652} {"train_loss": -27.972808837890625, "global_step": 635150, "epoch": 7652} {"train_loss": -28.151519775390625, "global_step": 635151, "epoch": 7652} {"train_loss": -28.19211196899414, "global_step": 635152, "epoch": 7652} {"train_loss": -28.26812744140625, "global_step": 635153, "epoch": 7652} {"train_loss": -28.73516273498535, "global_step": 635154, "epoch": 7652} {"train_loss": -28.2031307220459, "global_step": 635155, "epoch": 7652} {"train_loss": -28.299880981445312, "global_step": 635156, "epoch": 7652} {"train_loss": -28.4256591796875, "global_step": 635157, "epoch": 7652} {"train_loss": -28.187576293945312, "global_step": 635158, "epoch": 7652} {"train_loss": -28.648035049438477, "global_step": 635159, "epoch": 7652} {"train_loss": -28.562124252319336, "global_step": 635160, "epoch": 7652} {"train_loss": -27.8659610748291, "global_step": 635161, "epoch": 7652} {"train_loss": -28.18295669555664, "global_step": 635162, "epoch": 7652} {"train_loss": -27.996389389038086, "global_step": 635163, "epoch": 7652} {"train_loss": -28.37086296081543, "global_step": 635164, "epoch": 7652} {"train_loss": -28.465057373046875, "global_step": 635165, "epoch": 7652} {"train_loss": -28.48702049255371, "global_step": 635166, "epoch": 7652} {"train_loss": -28.312570571899414, "global_step": 635167, "epoch": 7652} {"train_loss": -28.21337890625, "global_step": 635168, "epoch": 7652} {"train_loss": -27.9660587310791, "global_step": 635169, "epoch": 7652} {"train_loss": -28.403905868530273, "global_step": 635170, "epoch": 7652} {"train_loss": -28.311918258666992, "global_step": 635171, "epoch": 7652} {"train_loss": -28.356159210205078, "global_step": 635172, "epoch": 7652} {"train_loss": -28.639936447143555, "global_step": 635173, "epoch": 7652} {"train_loss": -28.710607528686523, "global_step": 635174, "epoch": 7652} {"train_loss": -28.58793067932129, "global_step": 635175, "epoch": 7652} {"train_loss": -28.49332046508789, "global_step": 635176, "epoch": 7652} {"train_loss": -28.719274520874023, "global_step": 635177, "epoch": 7652} {"train_loss": -28.609174728393555, "global_step": 635178, "epoch": 7652} {"train_loss": -28.545530319213867, "global_step": 635179, "epoch": 7652} {"train_loss": -28.559534072875977, "global_step": 635180, "epoch": 7652} {"train_loss": -28.524810791015625, "global_step": 635181, "epoch": 7652} {"train_loss": -28.66303825378418, "global_step": 635182, "epoch": 7652} {"train_loss": -28.43939208984375, "global_step": 635183, "epoch": 7652} {"train_loss": -28.56182289123535, "global_step": 635184, "epoch": 7652} {"train_loss": -28.327444076538086, "global_step": 635185, "epoch": 7652} {"train_loss": -27.992706298828125, "global_step": 635186, "epoch": 7652} {"train_loss": -27.997516632080078, "global_step": 635187, "epoch": 7652} {"train_loss": -28.067853927612305, "global_step": 635188, "epoch": 7652} {"train_loss": -28.3256778717041, "global_step": 635189, "epoch": 7652} {"train_loss": -27.997604370117188, "global_step": 635190, "epoch": 7652} {"train_loss": -27.140729904174805, "global_step": 635191, "epoch": 7652} {"train_loss": -26.835798263549805, "global_step": 635192, "epoch": 7652} {"train_loss": -27.715513229370117, "global_step": 635193, "epoch": 7652} {"train_loss": -28.308786392211914, "global_step": 635194, "epoch": 7652} {"train_loss": -27.43910026550293, "global_step": 635195, "epoch": 7652} {"train_loss": -27.947168350219727, "global_step": 635196, "epoch": 7652} {"train_loss": -27.92877769470215, "global_step": 635197, "epoch": 7652} {"train_loss": -28.063876577170497, "global_step": 635198, "epoch": 7652, "val_loss": 6684938.0} {"train_loss": -25.202251434326172, "global_step": 635199, "epoch": 7653} {"train_loss": -23.577390670776367, "global_step": 635200, "epoch": 7653} {"train_loss": -26.678543090820312, "global_step": 635201, "epoch": 7653} {"train_loss": -24.5374698638916, "global_step": 635202, "epoch": 7653} {"train_loss": -25.99765968322754, "global_step": 635203, "epoch": 7653} {"train_loss": -25.683948516845703, "global_step": 635204, "epoch": 7653} {"train_loss": -26.254791259765625, "global_step": 635205, "epoch": 7653} {"train_loss": -25.951175689697266, "global_step": 635206, "epoch": 7653} {"train_loss": -26.05842399597168, "global_step": 635207, "epoch": 7653} {"train_loss": -27.182477951049805, "global_step": 635208, "epoch": 7653} {"train_loss": -27.133869171142578, "global_step": 635209, "epoch": 7653} {"train_loss": -26.8515625, "global_step": 635210, "epoch": 7653} {"train_loss": -26.647912979125977, "global_step": 635211, "epoch": 7653} {"train_loss": -27.248891830444336, "global_step": 635212, "epoch": 7653} {"train_loss": -26.66403579711914, "global_step": 635213, "epoch": 7653} {"train_loss": -27.217864990234375, "global_step": 635214, "epoch": 7653} {"train_loss": -26.854766845703125, "global_step": 635215, "epoch": 7653} {"train_loss": -26.839502334594727, "global_step": 635216, "epoch": 7653} {"train_loss": -27.05963134765625, "global_step": 635217, "epoch": 7653} {"train_loss": -27.113012313842773, "global_step": 635218, "epoch": 7653} {"train_loss": -27.440277099609375, "global_step": 635219, "epoch": 7653} {"train_loss": -27.76604652404785, "global_step": 635220, "epoch": 7653} {"train_loss": -27.33237648010254, "global_step": 635221, "epoch": 7653} {"train_loss": -27.060043334960938, "global_step": 635222, "epoch": 7653} {"train_loss": -27.34518814086914, "global_step": 635223, "epoch": 7653} {"train_loss": -27.396198272705078, "global_step": 635224, "epoch": 7653} {"train_loss": -27.605154037475586, "global_step": 635225, "epoch": 7653} {"train_loss": -27.55435562133789, "global_step": 635226, "epoch": 7653} {"train_loss": -27.72402000427246, "global_step": 635227, "epoch": 7653} {"train_loss": -27.71601676940918, "global_step": 635228, "epoch": 7653} {"train_loss": -27.661102294921875, "global_step": 635229, "epoch": 7653} {"train_loss": -27.827545166015625, "global_step": 635230, "epoch": 7653} {"train_loss": -27.605926513671875, "global_step": 635231, "epoch": 7653} {"train_loss": -27.86509132385254, "global_step": 635232, "epoch": 7653} {"train_loss": -27.969369888305664, "global_step": 635233, "epoch": 7653} {"train_loss": -27.788806915283203, "global_step": 635234, "epoch": 7653} {"train_loss": -28.09982681274414, "global_step": 635235, "epoch": 7653} {"train_loss": -27.932849884033203, "global_step": 635236, "epoch": 7653} {"train_loss": -27.94708824157715, "global_step": 635237, "epoch": 7653} {"train_loss": -28.431156158447266, "global_step": 635238, "epoch": 7653} {"train_loss": -28.109100341796875, "global_step": 635239, "epoch": 7653} {"train_loss": -28.129077911376953, "global_step": 635240, "epoch": 7653} {"train_loss": -28.321680068969727, "global_step": 635241, "epoch": 7653} {"train_loss": -28.24517250061035, "global_step": 635242, "epoch": 7653} {"train_loss": -28.059309005737305, "global_step": 635243, "epoch": 7653} {"train_loss": -28.02345085144043, "global_step": 635244, "epoch": 7653} {"train_loss": -28.18412208557129, "global_step": 635245, "epoch": 7653} {"train_loss": -28.045654296875, "global_step": 635246, "epoch": 7653} {"train_loss": -28.05963134765625, "global_step": 635247, "epoch": 7653} {"train_loss": -27.832502365112305, "global_step": 635248, "epoch": 7653} {"train_loss": -28.172422409057617, "global_step": 635249, "epoch": 7653} {"train_loss": -28.2386474609375, "global_step": 635250, "epoch": 7653} {"train_loss": -28.354278564453125, "global_step": 635251, "epoch": 7653} {"train_loss": -28.214529037475586, "global_step": 635252, "epoch": 7653} {"train_loss": -28.39771842956543, "global_step": 635253, "epoch": 7653} {"train_loss": -28.292266845703125, "global_step": 635254, "epoch": 7653} {"train_loss": -28.331174850463867, "global_step": 635255, "epoch": 7653} {"train_loss": -28.037927627563477, "global_step": 635256, "epoch": 7653} {"train_loss": -28.121450424194336, "global_step": 635257, "epoch": 7653} {"train_loss": -28.242603302001953, "global_step": 635258, "epoch": 7653} {"train_loss": -28.014862060546875, "global_step": 635259, "epoch": 7653} {"train_loss": -28.273950576782227, "global_step": 635260, "epoch": 7653} {"train_loss": -28.550710678100586, "global_step": 635261, "epoch": 7653} {"train_loss": -28.481985092163086, "global_step": 635262, "epoch": 7653} {"train_loss": -28.48109245300293, "global_step": 635263, "epoch": 7653} {"train_loss": -28.458633422851562, "global_step": 635264, "epoch": 7653} {"train_loss": -28.715688705444336, "global_step": 635265, "epoch": 7653} {"train_loss": -28.5101375579834, "global_step": 635266, "epoch": 7653} {"train_loss": -28.705875396728516, "global_step": 635267, "epoch": 7653} {"train_loss": -28.969501495361328, "global_step": 635268, "epoch": 7653} {"train_loss": -28.30380630493164, "global_step": 635269, "epoch": 7653} {"train_loss": -28.57647705078125, "global_step": 635270, "epoch": 7653} {"train_loss": -28.743839263916016, "global_step": 635271, "epoch": 7653} {"train_loss": -28.52471351623535, "global_step": 635272, "epoch": 7653} {"train_loss": -28.28639030456543, "global_step": 635273, "epoch": 7653} {"train_loss": -28.828231811523438, "global_step": 635274, "epoch": 7653} {"train_loss": -28.7537841796875, "global_step": 635275, "epoch": 7653} {"train_loss": -28.661664962768555, "global_step": 635276, "epoch": 7653} {"train_loss": -28.816259384155273, "global_step": 635277, "epoch": 7653} {"train_loss": -28.62537956237793, "global_step": 635278, "epoch": 7653} {"train_loss": -28.18328857421875, "global_step": 635279, "epoch": 7653} {"train_loss": -27.8962459564209, "global_step": 635280, "epoch": 7653} {"train_loss": -27.70732721075954, "global_step": 635281, "epoch": 7653, "val_loss": 6686887.0} {"train_loss": -25.8126163482666, "global_step": 635282, "epoch": 7654} {"train_loss": -24.966205596923828, "global_step": 635283, "epoch": 7654} {"train_loss": -26.332014083862305, "global_step": 635284, "epoch": 7654} {"train_loss": -26.824420928955078, "global_step": 635285, "epoch": 7654} {"train_loss": -25.522329330444336, "global_step": 635286, "epoch": 7654} {"train_loss": -26.361154556274414, "global_step": 635287, "epoch": 7654} {"train_loss": -27.499502182006836, "global_step": 635288, "epoch": 7654} {"train_loss": -26.850128173828125, "global_step": 635289, "epoch": 7654} {"train_loss": -27.518835067749023, "global_step": 635290, "epoch": 7654} {"train_loss": -27.174182891845703, "global_step": 635291, "epoch": 7654} {"train_loss": -27.7716007232666, "global_step": 635292, "epoch": 7654} {"train_loss": -27.071348190307617, "global_step": 635293, "epoch": 7654} {"train_loss": -27.149383544921875, "global_step": 635294, "epoch": 7654} {"train_loss": -27.56831169128418, "global_step": 635295, "epoch": 7654} {"train_loss": -27.453161239624023, "global_step": 635296, "epoch": 7654} {"train_loss": -27.616491317749023, "global_step": 635297, "epoch": 7654} {"train_loss": -27.6767520904541, "global_step": 635298, "epoch": 7654} {"train_loss": -28.0035400390625, "global_step": 635299, "epoch": 7654} {"train_loss": -27.73871421813965, "global_step": 635300, "epoch": 7654} {"train_loss": -27.520832061767578, "global_step": 635301, "epoch": 7654} {"train_loss": -27.7488956451416, "global_step": 635302, "epoch": 7654} {"train_loss": -27.97650146484375, "global_step": 635303, "epoch": 7654} {"train_loss": -27.711654663085938, "global_step": 635304, "epoch": 7654} {"train_loss": -28.042810440063477, "global_step": 635305, "epoch": 7654} {"train_loss": -27.8187198638916, "global_step": 635306, "epoch": 7654} {"train_loss": -28.1308536529541, "global_step": 635307, "epoch": 7654} {"train_loss": -27.863174438476562, "global_step": 635308, "epoch": 7654} {"train_loss": -27.988037109375, "global_step": 635309, "epoch": 7654} {"train_loss": -28.187671661376953, "global_step": 635310, "epoch": 7654} {"train_loss": -28.143091201782227, "global_step": 635311, "epoch": 7654} {"train_loss": -28.010456085205078, "global_step": 635312, "epoch": 7654} {"train_loss": -28.075180053710938, "global_step": 635313, "epoch": 7654} {"train_loss": -28.483930587768555, "global_step": 635314, "epoch": 7654} {"train_loss": -27.868026733398438, "global_step": 635315, "epoch": 7654} {"train_loss": -28.291061401367188, "global_step": 635316, "epoch": 7654} {"train_loss": -28.169479370117188, "global_step": 635317, "epoch": 7654} {"train_loss": -28.264413833618164, "global_step": 635318, "epoch": 7654} {"train_loss": -28.177228927612305, "global_step": 635319, "epoch": 7654} {"train_loss": -28.199390411376953, "global_step": 635320, "epoch": 7654} {"train_loss": -28.536609649658203, "global_step": 635321, "epoch": 7654} {"train_loss": -28.214859008789062, "global_step": 635322, "epoch": 7654} {"train_loss": -28.281530380249023, "global_step": 635323, "epoch": 7654} {"train_loss": -28.287220001220703, "global_step": 635324, "epoch": 7654} {"train_loss": -28.448444366455078, "global_step": 635325, "epoch": 7654} {"train_loss": -28.339252471923828, "global_step": 635326, "epoch": 7654} {"train_loss": -28.312625885009766, "global_step": 635327, "epoch": 7654} {"train_loss": -28.26666259765625, "global_step": 635328, "epoch": 7654} {"train_loss": -28.450714111328125, "global_step": 635329, "epoch": 7654} {"train_loss": -28.75390625, "global_step": 635330, "epoch": 7654} {"train_loss": -28.13101577758789, "global_step": 635331, "epoch": 7654} {"train_loss": -28.48267936706543, "global_step": 635332, "epoch": 7654} {"train_loss": -28.14430046081543, "global_step": 635333, "epoch": 7654} {"train_loss": -28.763086318969727, "global_step": 635334, "epoch": 7654} {"train_loss": -28.533918380737305, "global_step": 635335, "epoch": 7654} {"train_loss": -28.15240478515625, "global_step": 635336, "epoch": 7654} {"train_loss": -28.251440048217773, "global_step": 635337, "epoch": 7654} {"train_loss": -28.18145179748535, "global_step": 635338, "epoch": 7654} {"train_loss": -28.02791404724121, "global_step": 635339, "epoch": 7654} {"train_loss": -28.17754554748535, "global_step": 635340, "epoch": 7654} {"train_loss": -28.571924209594727, "global_step": 635341, "epoch": 7654} {"train_loss": -27.980871200561523, "global_step": 635342, "epoch": 7654} {"train_loss": -28.189905166625977, "global_step": 635343, "epoch": 7654} {"train_loss": -28.681671142578125, "global_step": 635344, "epoch": 7654} {"train_loss": -28.554880142211914, "global_step": 635345, "epoch": 7654} {"train_loss": -28.441198348999023, "global_step": 635346, "epoch": 7654} {"train_loss": -27.838953018188477, "global_step": 635347, "epoch": 7654} {"train_loss": -28.4809627532959, "global_step": 635348, "epoch": 7654} {"train_loss": -28.419946670532227, "global_step": 635349, "epoch": 7654} {"train_loss": -28.030126571655273, "global_step": 635350, "epoch": 7654} {"train_loss": -28.006677627563477, "global_step": 635351, "epoch": 7654} {"train_loss": -28.85025405883789, "global_step": 635352, "epoch": 7654} {"train_loss": -28.33135414123535, "global_step": 635353, "epoch": 7654} {"train_loss": -28.152420043945312, "global_step": 635354, "epoch": 7654} {"train_loss": -28.578107833862305, "global_step": 635355, "epoch": 7654} {"train_loss": -28.1729793548584, "global_step": 635356, "epoch": 7654} {"train_loss": -28.010290145874023, "global_step": 635357, "epoch": 7654} {"train_loss": -28.671300888061523, "global_step": 635358, "epoch": 7654} {"train_loss": -28.31806755065918, "global_step": 635359, "epoch": 7654} {"train_loss": -28.431798934936523, "global_step": 635360, "epoch": 7654} {"train_loss": -28.6044864654541, "global_step": 635361, "epoch": 7654} {"train_loss": -28.60443687438965, "global_step": 635362, "epoch": 7654} {"train_loss": -28.127460479736328, "global_step": 635363, "epoch": 7654} {"train_loss": -27.973445019090033, "global_step": 635364, "epoch": 7654, "val_loss": 6680711.0} {"train_loss": -27.964807510375977, "global_step": 635365, "epoch": 7655} {"train_loss": -27.221588134765625, "global_step": 635366, "epoch": 7655} {"train_loss": -26.921878814697266, "global_step": 635367, "epoch": 7655} {"train_loss": -25.99798583984375, "global_step": 635368, "epoch": 7655} {"train_loss": -25.917531967163086, "global_step": 635369, "epoch": 7655} {"train_loss": -27.418018341064453, "global_step": 635370, "epoch": 7655} {"train_loss": -27.318023681640625, "global_step": 635371, "epoch": 7655} {"train_loss": -27.541690826416016, "global_step": 635372, "epoch": 7655} {"train_loss": -27.383136749267578, "global_step": 635373, "epoch": 7655} {"train_loss": -26.8398494720459, "global_step": 635374, "epoch": 7655} {"train_loss": -27.779443740844727, "global_step": 635375, "epoch": 7655} {"train_loss": -27.8210391998291, "global_step": 635376, "epoch": 7655} {"train_loss": -27.667083740234375, "global_step": 635377, "epoch": 7655} {"train_loss": -27.79766273498535, "global_step": 635378, "epoch": 7655} {"train_loss": -27.593420028686523, "global_step": 635379, "epoch": 7655} {"train_loss": -27.7841796875, "global_step": 635380, "epoch": 7655} {"train_loss": -27.696008682250977, "global_step": 635381, "epoch": 7655} {"train_loss": -28.17059898376465, "global_step": 635382, "epoch": 7655} {"train_loss": -27.764968872070312, "global_step": 635383, "epoch": 7655} {"train_loss": -28.24349021911621, "global_step": 635384, "epoch": 7655} {"train_loss": -28.118764877319336, "global_step": 635385, "epoch": 7655} {"train_loss": -28.313495635986328, "global_step": 635386, "epoch": 7655} {"train_loss": -28.213159561157227, "global_step": 635387, "epoch": 7655} {"train_loss": -27.876623153686523, "global_step": 635388, "epoch": 7655} {"train_loss": -27.958311080932617, "global_step": 635389, "epoch": 7655} {"train_loss": -28.6528263092041, "global_step": 635390, "epoch": 7655} {"train_loss": -27.875980377197266, "global_step": 635391, "epoch": 7655} {"train_loss": -28.186447143554688, "global_step": 635392, "epoch": 7655} {"train_loss": -28.0991153717041, "global_step": 635393, "epoch": 7655} {"train_loss": -28.3989200592041, "global_step": 635394, "epoch": 7655} {"train_loss": -28.6949520111084, "global_step": 635395, "epoch": 7655} {"train_loss": -28.419971466064453, "global_step": 635396, "epoch": 7655} {"train_loss": -28.186420440673828, "global_step": 635397, "epoch": 7655} {"train_loss": -27.946826934814453, "global_step": 635398, "epoch": 7655} {"train_loss": -28.205724716186523, "global_step": 635399, "epoch": 7655} {"train_loss": -28.3948917388916, "global_step": 635400, "epoch": 7655} {"train_loss": -28.37664222717285, "global_step": 635401, "epoch": 7655} {"train_loss": -28.453969955444336, "global_step": 635402, "epoch": 7655} {"train_loss": -28.470325469970703, "global_step": 635403, "epoch": 7655} {"train_loss": -28.367639541625977, "global_step": 635404, "epoch": 7655} {"train_loss": -28.542877197265625, "global_step": 635405, "epoch": 7655} {"train_loss": -28.731826782226562, "global_step": 635406, "epoch": 7655} {"train_loss": -28.006078720092773, "global_step": 635407, "epoch": 7655} {"train_loss": -28.7364444732666, "global_step": 635408, "epoch": 7655} {"train_loss": -28.66334342956543, "global_step": 635409, "epoch": 7655} {"train_loss": -28.825559616088867, "global_step": 635410, "epoch": 7655} {"train_loss": -28.282270431518555, "global_step": 635411, "epoch": 7655} {"train_loss": -28.505218505859375, "global_step": 635412, "epoch": 7655} {"train_loss": -28.303171157836914, "global_step": 635413, "epoch": 7655} {"train_loss": -28.138580322265625, "global_step": 635414, "epoch": 7655} {"train_loss": -28.484357833862305, "global_step": 635415, "epoch": 7655} {"train_loss": -27.93603515625, "global_step": 635416, "epoch": 7655} {"train_loss": -28.386768341064453, "global_step": 635417, "epoch": 7655} {"train_loss": -27.805988311767578, "global_step": 635418, "epoch": 7655} {"train_loss": -27.544729232788086, "global_step": 635419, "epoch": 7655} {"train_loss": -26.6794376373291, "global_step": 635420, "epoch": 7655} {"train_loss": -27.96435546875, "global_step": 635421, "epoch": 7655} {"train_loss": -27.954221725463867, "global_step": 635422, "epoch": 7655} {"train_loss": -27.610107421875, "global_step": 635423, "epoch": 7655} {"train_loss": -28.26454734802246, "global_step": 635424, "epoch": 7655} {"train_loss": -27.83009910583496, "global_step": 635425, "epoch": 7655} {"train_loss": -28.05014419555664, "global_step": 635426, "epoch": 7655} {"train_loss": -27.739774703979492, "global_step": 635427, "epoch": 7655} {"train_loss": -28.303089141845703, "global_step": 635428, "epoch": 7655} {"train_loss": -28.1412353515625, "global_step": 635429, "epoch": 7655} {"train_loss": -28.32343864440918, "global_step": 635430, "epoch": 7655} {"train_loss": -27.95448875427246, "global_step": 635431, "epoch": 7655} {"train_loss": -28.294340133666992, "global_step": 635432, "epoch": 7655} {"train_loss": -28.20362663269043, "global_step": 635433, "epoch": 7655} {"train_loss": -27.784143447875977, "global_step": 635434, "epoch": 7655} {"train_loss": -28.349334716796875, "global_step": 635435, "epoch": 7655} {"train_loss": -27.936819076538086, "global_step": 635436, "epoch": 7655} {"train_loss": -28.153608322143555, "global_step": 635437, "epoch": 7655} {"train_loss": -28.220251083374023, "global_step": 635438, "epoch": 7655} {"train_loss": -28.538793563842773, "global_step": 635439, "epoch": 7655} {"train_loss": -28.14813804626465, "global_step": 635440, "epoch": 7655} {"train_loss": -27.95501136779785, "global_step": 635441, "epoch": 7655} {"train_loss": -28.63665771484375, "global_step": 635442, "epoch": 7655} {"train_loss": -28.50855827331543, "global_step": 635443, "epoch": 7655} {"train_loss": -28.367536544799805, "global_step": 635444, "epoch": 7655} {"train_loss": -28.30559730529785, "global_step": 635445, "epoch": 7655} {"train_loss": -28.332733154296875, "global_step": 635446, "epoch": 7655} {"train_loss": -28.035264922911864, "global_step": 635447, "epoch": 7655, "val_loss": 6697857.0} {"train_loss": -27.94052505493164, "global_step": 635448, "epoch": 7656} {"train_loss": -27.860288619995117, "global_step": 635449, "epoch": 7656} {"train_loss": -28.07525634765625, "global_step": 635450, "epoch": 7656} {"train_loss": -28.0078182220459, "global_step": 635451, "epoch": 7656} {"train_loss": -28.122228622436523, "global_step": 635452, "epoch": 7656} {"train_loss": -28.07134437561035, "global_step": 635453, "epoch": 7656} {"train_loss": -28.045984268188477, "global_step": 635454, "epoch": 7656} {"train_loss": -27.94891929626465, "global_step": 635455, "epoch": 7656} {"train_loss": -27.4985294342041, "global_step": 635456, "epoch": 7656} {"train_loss": -27.092884063720703, "global_step": 635457, "epoch": 7656} {"train_loss": -27.7885684967041, "global_step": 635458, "epoch": 7656} {"train_loss": -27.777673721313477, "global_step": 635459, "epoch": 7656} {"train_loss": -27.588048934936523, "global_step": 635460, "epoch": 7656} {"train_loss": -27.7099666595459, "global_step": 635461, "epoch": 7656} {"train_loss": -27.884387969970703, "global_step": 635462, "epoch": 7656} {"train_loss": -27.368555068969727, "global_step": 635463, "epoch": 7656} {"train_loss": -27.570331573486328, "global_step": 635464, "epoch": 7656} {"train_loss": -27.89337158203125, "global_step": 635465, "epoch": 7656} {"train_loss": -28.107879638671875, "global_step": 635466, "epoch": 7656} {"train_loss": -28.014928817749023, "global_step": 635467, "epoch": 7656} {"train_loss": -27.958786010742188, "global_step": 635468, "epoch": 7656} {"train_loss": -27.913366317749023, "global_step": 635469, "epoch": 7656} {"train_loss": -28.07765007019043, "global_step": 635470, "epoch": 7656} {"train_loss": -28.50092887878418, "global_step": 635471, "epoch": 7656} {"train_loss": -27.5454158782959, "global_step": 635472, "epoch": 7656} {"train_loss": -28.30816650390625, "global_step": 635473, "epoch": 7656} {"train_loss": -27.81769371032715, "global_step": 635474, "epoch": 7656} {"train_loss": -28.21881675720215, "global_step": 635475, "epoch": 7656} {"train_loss": -28.3714656829834, "global_step": 635476, "epoch": 7656} {"train_loss": -28.183637619018555, "global_step": 635477, "epoch": 7656} {"train_loss": -27.974903106689453, "global_step": 635478, "epoch": 7656} {"train_loss": -28.29306411743164, "global_step": 635479, "epoch": 7656} {"train_loss": -28.188703536987305, "global_step": 635480, "epoch": 7656} {"train_loss": -28.233129501342773, "global_step": 635481, "epoch": 7656} {"train_loss": -27.945423126220703, "global_step": 635482, "epoch": 7656} {"train_loss": -28.130634307861328, "global_step": 635483, "epoch": 7656} {"train_loss": -28.02045249938965, "global_step": 635484, "epoch": 7656} {"train_loss": -28.42384147644043, "global_step": 635485, "epoch": 7656} {"train_loss": -28.370691299438477, "global_step": 635486, "epoch": 7656} {"train_loss": -28.373594284057617, "global_step": 635487, "epoch": 7656} {"train_loss": -28.131040573120117, "global_step": 635488, "epoch": 7656} {"train_loss": -28.2568416595459, "global_step": 635489, "epoch": 7656} {"train_loss": -28.40934181213379, "global_step": 635490, "epoch": 7656} {"train_loss": -28.642675399780273, "global_step": 635491, "epoch": 7656} {"train_loss": -28.509870529174805, "global_step": 635492, "epoch": 7656} {"train_loss": -28.620840072631836, "global_step": 635493, "epoch": 7656} {"train_loss": -28.258459091186523, "global_step": 635494, "epoch": 7656} {"train_loss": -28.438512802124023, "global_step": 635495, "epoch": 7656} {"train_loss": -28.419540405273438, "global_step": 635496, "epoch": 7656} {"train_loss": -28.725011825561523, "global_step": 635497, "epoch": 7656} {"train_loss": -28.194425582885742, "global_step": 635498, "epoch": 7656} {"train_loss": -28.604528427124023, "global_step": 635499, "epoch": 7656} {"train_loss": -28.497716903686523, "global_step": 635500, "epoch": 7656} {"train_loss": -28.053068161010742, "global_step": 635501, "epoch": 7656} {"train_loss": -28.45090675354004, "global_step": 635502, "epoch": 7656} {"train_loss": -28.217329025268555, "global_step": 635503, "epoch": 7656} {"train_loss": -28.30938720703125, "global_step": 635504, "epoch": 7656} {"train_loss": -28.492834091186523, "global_step": 635505, "epoch": 7656} {"train_loss": -28.43806266784668, "global_step": 635506, "epoch": 7656} {"train_loss": -28.58648681640625, "global_step": 635507, "epoch": 7656} {"train_loss": -28.390823364257812, "global_step": 635508, "epoch": 7656} {"train_loss": -28.445646286010742, "global_step": 635509, "epoch": 7656} {"train_loss": -28.301319122314453, "global_step": 635510, "epoch": 7656} {"train_loss": -28.371057510375977, "global_step": 635511, "epoch": 7656} {"train_loss": -28.088064193725586, "global_step": 635512, "epoch": 7656} {"train_loss": -28.062047958374023, "global_step": 635513, "epoch": 7656} {"train_loss": -28.394033432006836, "global_step": 635514, "epoch": 7656} {"train_loss": -28.427759170532227, "global_step": 635515, "epoch": 7656} {"train_loss": -28.12334632873535, "global_step": 635516, "epoch": 7656} {"train_loss": -28.136884689331055, "global_step": 635517, "epoch": 7656} {"train_loss": -28.32843589782715, "global_step": 635518, "epoch": 7656} {"train_loss": -28.514841079711914, "global_step": 635519, "epoch": 7656} {"train_loss": -27.95330810546875, "global_step": 635520, "epoch": 7656} {"train_loss": -28.280689239501953, "global_step": 635521, "epoch": 7656} {"train_loss": -28.287939071655273, "global_step": 635522, "epoch": 7656} {"train_loss": -28.0020694732666, "global_step": 635523, "epoch": 7656} {"train_loss": -28.47299575805664, "global_step": 635524, "epoch": 7656} {"train_loss": -27.825891494750977, "global_step": 635525, "epoch": 7656} {"train_loss": -28.334531784057617, "global_step": 635526, "epoch": 7656} {"train_loss": -27.946277618408203, "global_step": 635527, "epoch": 7656} {"train_loss": -28.172637939453125, "global_step": 635528, "epoch": 7656} {"train_loss": -28.344995498657227, "global_step": 635529, "epoch": 7656} {"train_loss": -28.14189550101039, "global_step": 635530, "epoch": 7656, "val_loss": 6585762.5} {"train_loss": -27.922088623046875, "global_step": 635531, "epoch": 7657} {"train_loss": -27.8543643951416, "global_step": 635532, "epoch": 7657} {"train_loss": -28.127521514892578, "global_step": 635533, "epoch": 7657} {"train_loss": -28.347681045532227, "global_step": 635534, "epoch": 7657} {"train_loss": -27.821598052978516, "global_step": 635535, "epoch": 7657} {"train_loss": -28.25790786743164, "global_step": 635536, "epoch": 7657} {"train_loss": -28.060840606689453, "global_step": 635537, "epoch": 7657} {"train_loss": -27.931921005249023, "global_step": 635538, "epoch": 7657} {"train_loss": -27.76106071472168, "global_step": 635539, "epoch": 7657} {"train_loss": -28.401945114135742, "global_step": 635540, "epoch": 7657} {"train_loss": -28.243494033813477, "global_step": 635541, "epoch": 7657} {"train_loss": -28.113067626953125, "global_step": 635542, "epoch": 7657} {"train_loss": -28.38368034362793, "global_step": 635543, "epoch": 7657} {"train_loss": -28.35614013671875, "global_step": 635544, "epoch": 7657} {"train_loss": -27.921396255493164, "global_step": 635545, "epoch": 7657} {"train_loss": -27.90106773376465, "global_step": 635546, "epoch": 7657} {"train_loss": -28.330093383789062, "global_step": 635547, "epoch": 7657} {"train_loss": -28.526275634765625, "global_step": 635548, "epoch": 7657} {"train_loss": -28.185476303100586, "global_step": 635549, "epoch": 7657} {"train_loss": -28.29534912109375, "global_step": 635550, "epoch": 7657} {"train_loss": -27.971118927001953, "global_step": 635551, "epoch": 7657} {"train_loss": -27.93775749206543, "global_step": 635552, "epoch": 7657} {"train_loss": -27.7266902923584, "global_step": 635553, "epoch": 7657} {"train_loss": -28.107852935791016, "global_step": 635554, "epoch": 7657} {"train_loss": -28.152545928955078, "global_step": 635555, "epoch": 7657} {"train_loss": -28.2273006439209, "global_step": 635556, "epoch": 7657} {"train_loss": -28.022573471069336, "global_step": 635557, "epoch": 7657} {"train_loss": -28.66160011291504, "global_step": 635558, "epoch": 7657} {"train_loss": -28.16204261779785, "global_step": 635559, "epoch": 7657} {"train_loss": -28.242874145507812, "global_step": 635560, "epoch": 7657} {"train_loss": -28.588367462158203, "global_step": 635561, "epoch": 7657} {"train_loss": -28.484760284423828, "global_step": 635562, "epoch": 7657} {"train_loss": -27.736251831054688, "global_step": 635563, "epoch": 7657} {"train_loss": -28.4138240814209, "global_step": 635564, "epoch": 7657} {"train_loss": -28.777179718017578, "global_step": 635565, "epoch": 7657} {"train_loss": -28.21192741394043, "global_step": 635566, "epoch": 7657} {"train_loss": -28.23341178894043, "global_step": 635567, "epoch": 7657} {"train_loss": -28.212554931640625, "global_step": 635568, "epoch": 7657} {"train_loss": -28.13577651977539, "global_step": 635569, "epoch": 7657} {"train_loss": -28.211694717407227, "global_step": 635570, "epoch": 7657} {"train_loss": -28.59217643737793, "global_step": 635571, "epoch": 7657} {"train_loss": -28.3563232421875, "global_step": 635572, "epoch": 7657} {"train_loss": -28.109909057617188, "global_step": 635573, "epoch": 7657} {"train_loss": -28.18798828125, "global_step": 635574, "epoch": 7657} {"train_loss": -27.71564292907715, "global_step": 635575, "epoch": 7657} {"train_loss": -27.695383071899414, "global_step": 635576, "epoch": 7657} {"train_loss": -28.09088134765625, "global_step": 635577, "epoch": 7657} {"train_loss": -28.376134872436523, "global_step": 635578, "epoch": 7657} {"train_loss": -28.26386070251465, "global_step": 635579, "epoch": 7657} {"train_loss": -28.31157875061035, "global_step": 635580, "epoch": 7657} {"train_loss": -28.258676528930664, "global_step": 635581, "epoch": 7657} {"train_loss": -28.508642196655273, "global_step": 635582, "epoch": 7657} {"train_loss": -28.06123161315918, "global_step": 635583, "epoch": 7657} {"train_loss": -28.623138427734375, "global_step": 635584, "epoch": 7657} {"train_loss": -28.44089126586914, "global_step": 635585, "epoch": 7657} {"train_loss": -27.842548370361328, "global_step": 635586, "epoch": 7657} {"train_loss": -28.301898956298828, "global_step": 635587, "epoch": 7657} {"train_loss": -28.497644424438477, "global_step": 635588, "epoch": 7657} {"train_loss": -28.571298599243164, "global_step": 635589, "epoch": 7657} {"train_loss": -28.47672462463379, "global_step": 635590, "epoch": 7657} {"train_loss": -28.319822311401367, "global_step": 635591, "epoch": 7657} {"train_loss": -28.008258819580078, "global_step": 635592, "epoch": 7657} {"train_loss": -28.36467933654785, "global_step": 635593, "epoch": 7657} {"train_loss": -28.305023193359375, "global_step": 635594, "epoch": 7657} {"train_loss": -28.32013511657715, "global_step": 635595, "epoch": 7657} {"train_loss": -28.01715087890625, "global_step": 635596, "epoch": 7657} {"train_loss": -28.068740844726562, "global_step": 635597, "epoch": 7657} {"train_loss": -28.36209487915039, "global_step": 635598, "epoch": 7657} {"train_loss": -28.675329208374023, "global_step": 635599, "epoch": 7657} {"train_loss": -28.538833618164062, "global_step": 635600, "epoch": 7657} {"train_loss": -28.293731689453125, "global_step": 635601, "epoch": 7657} {"train_loss": -28.35184097290039, "global_step": 635602, "epoch": 7657} {"train_loss": -28.54569435119629, "global_step": 635603, "epoch": 7657} {"train_loss": -28.342924118041992, "global_step": 635604, "epoch": 7657} {"train_loss": -28.213186264038086, "global_step": 635605, "epoch": 7657} {"train_loss": -27.99944496154785, "global_step": 635606, "epoch": 7657} {"train_loss": -28.59407615661621, "global_step": 635607, "epoch": 7657} {"train_loss": -28.04298210144043, "global_step": 635608, "epoch": 7657} {"train_loss": -28.382648468017578, "global_step": 635609, "epoch": 7657} {"train_loss": -28.588180541992188, "global_step": 635610, "epoch": 7657} {"train_loss": -28.200048446655273, "global_step": 635611, "epoch": 7657} {"train_loss": -28.3111629486084, "global_step": 635612, "epoch": 7657} {"train_loss": -28.230247106896826, "global_step": 635613, "epoch": 7657, "val_loss": 6709848.5} {"train_loss": -28.3897647857666, "global_step": 635614, "epoch": 7658} {"train_loss": -27.00477409362793, "global_step": 635615, "epoch": 7658} {"train_loss": -27.179141998291016, "global_step": 635616, "epoch": 7658} {"train_loss": -27.47479820251465, "global_step": 635617, "epoch": 7658} {"train_loss": -27.27605628967285, "global_step": 635618, "epoch": 7658} {"train_loss": -27.45110511779785, "global_step": 635619, "epoch": 7658} {"train_loss": -27.557031631469727, "global_step": 635620, "epoch": 7658} {"train_loss": -27.335901260375977, "global_step": 635621, "epoch": 7658} {"train_loss": -27.913068771362305, "global_step": 635622, "epoch": 7658} {"train_loss": -27.934162139892578, "global_step": 635623, "epoch": 7658} {"train_loss": -28.015827178955078, "global_step": 635624, "epoch": 7658} {"train_loss": -27.906763076782227, "global_step": 635625, "epoch": 7658} {"train_loss": -27.916095733642578, "global_step": 635626, "epoch": 7658} {"train_loss": -28.351978302001953, "global_step": 635627, "epoch": 7658} {"train_loss": -27.998397827148438, "global_step": 635628, "epoch": 7658} {"train_loss": -27.890607833862305, "global_step": 635629, "epoch": 7658} {"train_loss": -27.93766212463379, "global_step": 635630, "epoch": 7658} {"train_loss": -28.004261016845703, "global_step": 635631, "epoch": 7658} {"train_loss": -27.959211349487305, "global_step": 635632, "epoch": 7658} {"train_loss": -27.38093376159668, "global_step": 635633, "epoch": 7658} {"train_loss": -28.073972702026367, "global_step": 635634, "epoch": 7658} {"train_loss": -28.576990127563477, "global_step": 635635, "epoch": 7658} {"train_loss": -28.190855026245117, "global_step": 635636, "epoch": 7658} {"train_loss": -28.038572311401367, "global_step": 635637, "epoch": 7658} {"train_loss": -28.26271629333496, "global_step": 635638, "epoch": 7658} {"train_loss": -28.31353187561035, "global_step": 635639, "epoch": 7658} {"train_loss": -27.8927001953125, "global_step": 635640, "epoch": 7658} {"train_loss": -28.183332443237305, "global_step": 635641, "epoch": 7658} {"train_loss": -27.97220230102539, "global_step": 635642, "epoch": 7658} {"train_loss": -28.114643096923828, "global_step": 635643, "epoch": 7658} {"train_loss": -27.8060302734375, "global_step": 635644, "epoch": 7658} {"train_loss": -28.365203857421875, "global_step": 635645, "epoch": 7658} {"train_loss": -27.995023727416992, "global_step": 635646, "epoch": 7658} {"train_loss": -28.298080444335938, "global_step": 635647, "epoch": 7658} {"train_loss": -28.035266876220703, "global_step": 635648, "epoch": 7658} {"train_loss": -28.2083683013916, "global_step": 635649, "epoch": 7658} {"train_loss": -28.358800888061523, "global_step": 635650, "epoch": 7658} {"train_loss": -28.286359786987305, "global_step": 635651, "epoch": 7658} {"train_loss": -28.361480712890625, "global_step": 635652, "epoch": 7658} {"train_loss": -28.651288986206055, "global_step": 635653, "epoch": 7658} {"train_loss": -28.196460723876953, "global_step": 635654, "epoch": 7658} {"train_loss": -28.214609146118164, "global_step": 635655, "epoch": 7658} {"train_loss": -28.440185546875, "global_step": 635656, "epoch": 7658} {"train_loss": -28.3785343170166, "global_step": 635657, "epoch": 7658} {"train_loss": -28.277603149414062, "global_step": 635658, "epoch": 7658} {"train_loss": -28.550888061523438, "global_step": 635659, "epoch": 7658} {"train_loss": -28.377628326416016, "global_step": 635660, "epoch": 7658} {"train_loss": -28.714757919311523, "global_step": 635661, "epoch": 7658} {"train_loss": -28.417585372924805, "global_step": 635662, "epoch": 7658} {"train_loss": -28.350671768188477, "global_step": 635663, "epoch": 7658} {"train_loss": -28.337656021118164, "global_step": 635664, "epoch": 7658} {"train_loss": -27.963159561157227, "global_step": 635665, "epoch": 7658} {"train_loss": -28.47663688659668, "global_step": 635666, "epoch": 7658} {"train_loss": -28.275257110595703, "global_step": 635667, "epoch": 7658} {"train_loss": -28.3427677154541, "global_step": 635668, "epoch": 7658} {"train_loss": -28.489004135131836, "global_step": 635669, "epoch": 7658} {"train_loss": -28.42423439025879, "global_step": 635670, "epoch": 7658} {"train_loss": -28.686050415039062, "global_step": 635671, "epoch": 7658} {"train_loss": -28.510541915893555, "global_step": 635672, "epoch": 7658} {"train_loss": -28.113525390625, "global_step": 635673, "epoch": 7658} {"train_loss": -28.128772735595703, "global_step": 635674, "epoch": 7658} {"train_loss": -27.871566772460938, "global_step": 635675, "epoch": 7658} {"train_loss": -27.474653244018555, "global_step": 635676, "epoch": 7658} {"train_loss": -28.14960289001465, "global_step": 635677, "epoch": 7658} {"train_loss": -28.338769912719727, "global_step": 635678, "epoch": 7658} {"train_loss": -28.369770050048828, "global_step": 635679, "epoch": 7658} {"train_loss": -28.3946533203125, "global_step": 635680, "epoch": 7658} {"train_loss": -28.229089736938477, "global_step": 635681, "epoch": 7658} {"train_loss": -28.060470581054688, "global_step": 635682, "epoch": 7658} {"train_loss": -28.293039321899414, "global_step": 635683, "epoch": 7658} {"train_loss": -28.256284713745117, "global_step": 635684, "epoch": 7658} {"train_loss": -28.3320255279541, "global_step": 635685, "epoch": 7658} {"train_loss": -27.65105628967285, "global_step": 635686, "epoch": 7658} {"train_loss": -28.14764404296875, "global_step": 635687, "epoch": 7658} {"train_loss": -28.063379287719727, "global_step": 635688, "epoch": 7658} {"train_loss": -28.16196060180664, "global_step": 635689, "epoch": 7658} {"train_loss": -28.245391845703125, "global_step": 635690, "epoch": 7658} {"train_loss": -28.19692039489746, "global_step": 635691, "epoch": 7658} {"train_loss": -28.492206573486328, "global_step": 635692, "epoch": 7658} {"train_loss": -28.12342643737793, "global_step": 635693, "epoch": 7658} {"train_loss": -28.264694213867188, "global_step": 635694, "epoch": 7658} {"train_loss": -28.167505264282227, "global_step": 635695, "epoch": 7658} {"train_loss": -28.131328582763672, "global_step": 635696, "epoch": 7658, "val_loss": 6729777.0} {"train_loss": -26.976490020751953, "global_step": 635697, "epoch": 7659} {"train_loss": -26.912015914916992, "global_step": 635698, "epoch": 7659} {"train_loss": -27.437747955322266, "global_step": 635699, "epoch": 7659} {"train_loss": -27.8985652923584, "global_step": 635700, "epoch": 7659} {"train_loss": -27.4947566986084, "global_step": 635701, "epoch": 7659} {"train_loss": -27.371612548828125, "global_step": 635702, "epoch": 7659} {"train_loss": -27.771438598632812, "global_step": 635703, "epoch": 7659} {"train_loss": -27.871612548828125, "global_step": 635704, "epoch": 7659} {"train_loss": -27.64063835144043, "global_step": 635705, "epoch": 7659} {"train_loss": -27.712045669555664, "global_step": 635706, "epoch": 7659} {"train_loss": -27.563812255859375, "global_step": 635707, "epoch": 7659} {"train_loss": -27.898061752319336, "global_step": 635708, "epoch": 7659} {"train_loss": -28.27435874938965, "global_step": 635709, "epoch": 7659} {"train_loss": -27.542593002319336, "global_step": 635710, "epoch": 7659} {"train_loss": -28.360137939453125, "global_step": 635711, "epoch": 7659} {"train_loss": -28.1312198638916, "global_step": 635712, "epoch": 7659} {"train_loss": -28.04986572265625, "global_step": 635713, "epoch": 7659} {"train_loss": -28.01368522644043, "global_step": 635714, "epoch": 7659} {"train_loss": -28.138757705688477, "global_step": 635715, "epoch": 7659} {"train_loss": -28.39484977722168, "global_step": 635716, "epoch": 7659} {"train_loss": -28.051101684570312, "global_step": 635717, "epoch": 7659} {"train_loss": -28.004444122314453, "global_step": 635718, "epoch": 7659} {"train_loss": -27.615232467651367, "global_step": 635719, "epoch": 7659} {"train_loss": -28.037290573120117, "global_step": 635720, "epoch": 7659} {"train_loss": -28.151105880737305, "global_step": 635721, "epoch": 7659} {"train_loss": -27.60888671875, "global_step": 635722, "epoch": 7659} {"train_loss": -28.289453506469727, "global_step": 635723, "epoch": 7659} {"train_loss": -28.179723739624023, "global_step": 635724, "epoch": 7659} {"train_loss": -28.151769638061523, "global_step": 635725, "epoch": 7659} {"train_loss": -28.172231674194336, "global_step": 635726, "epoch": 7659} {"train_loss": -27.97724723815918, "global_step": 635727, "epoch": 7659} {"train_loss": -28.32293701171875, "global_step": 635728, "epoch": 7659} {"train_loss": -28.039026260375977, "global_step": 635729, "epoch": 7659} {"train_loss": -28.202472686767578, "global_step": 635730, "epoch": 7659} {"train_loss": -27.669193267822266, "global_step": 635731, "epoch": 7659} {"train_loss": -28.18781089782715, "global_step": 635732, "epoch": 7659} {"train_loss": -27.870258331298828, "global_step": 635733, "epoch": 7659} {"train_loss": -28.63081932067871, "global_step": 635734, "epoch": 7659} {"train_loss": -27.990386962890625, "global_step": 635735, "epoch": 7659} {"train_loss": -28.063873291015625, "global_step": 635736, "epoch": 7659} {"train_loss": -27.89607048034668, "global_step": 635737, "epoch": 7659} {"train_loss": -28.58063316345215, "global_step": 635738, "epoch": 7659} {"train_loss": -27.89436912536621, "global_step": 635739, "epoch": 7659} {"train_loss": -28.5233154296875, "global_step": 635740, "epoch": 7659} {"train_loss": -28.309589385986328, "global_step": 635741, "epoch": 7659} {"train_loss": -28.032535552978516, "global_step": 635742, "epoch": 7659} {"train_loss": -28.487943649291992, "global_step": 635743, "epoch": 7659} {"train_loss": -28.28885269165039, "global_step": 635744, "epoch": 7659} {"train_loss": -28.53754234313965, "global_step": 635745, "epoch": 7659} {"train_loss": -28.435754776000977, "global_step": 635746, "epoch": 7659} {"train_loss": -28.515119552612305, "global_step": 635747, "epoch": 7659} {"train_loss": -28.26593589782715, "global_step": 635748, "epoch": 7659} {"train_loss": -28.267724990844727, "global_step": 635749, "epoch": 7659} {"train_loss": -28.39307975769043, "global_step": 635750, "epoch": 7659} {"train_loss": -28.52031898498535, "global_step": 635751, "epoch": 7659} {"train_loss": -27.995450973510742, "global_step": 635752, "epoch": 7659} {"train_loss": -28.230010986328125, "global_step": 635753, "epoch": 7659} {"train_loss": -28.1712646484375, "global_step": 635754, "epoch": 7659} {"train_loss": -28.529951095581055, "global_step": 635755, "epoch": 7659} {"train_loss": -28.3383731842041, "global_step": 635756, "epoch": 7659} {"train_loss": -28.185272216796875, "global_step": 635757, "epoch": 7659} {"train_loss": -28.44141960144043, "global_step": 635758, "epoch": 7659} {"train_loss": -28.62836265563965, "global_step": 635759, "epoch": 7659} {"train_loss": -28.430509567260742, "global_step": 635760, "epoch": 7659} {"train_loss": -28.3242130279541, "global_step": 635761, "epoch": 7659} {"train_loss": -27.9338321685791, "global_step": 635762, "epoch": 7659} {"train_loss": -28.240188598632812, "global_step": 635763, "epoch": 7659} {"train_loss": -28.156198501586914, "global_step": 635764, "epoch": 7659} {"train_loss": -27.870534896850586, "global_step": 635765, "epoch": 7659} {"train_loss": -27.18568992614746, "global_step": 635766, "epoch": 7659} {"train_loss": -27.233057022094727, "global_step": 635767, "epoch": 7659} {"train_loss": -27.788549423217773, "global_step": 635768, "epoch": 7659} {"train_loss": -27.922216415405273, "global_step": 635769, "epoch": 7659} {"train_loss": -27.91602897644043, "global_step": 635770, "epoch": 7659} {"train_loss": -27.912641525268555, "global_step": 635771, "epoch": 7659} {"train_loss": -27.875593185424805, "global_step": 635772, "epoch": 7659} {"train_loss": -28.331562042236328, "global_step": 635773, "epoch": 7659} {"train_loss": -27.957258224487305, "global_step": 635774, "epoch": 7659} {"train_loss": -28.235916137695312, "global_step": 635775, "epoch": 7659} {"train_loss": -28.2188663482666, "global_step": 635776, "epoch": 7659} {"train_loss": -27.869367599487305, "global_step": 635777, "epoch": 7659} {"train_loss": -27.744827270507812, "global_step": 635778, "epoch": 7659} {"train_loss": -28.034195865493224, "global_step": 635779, "epoch": 7659, "val_loss": 6686534.0} {"train_loss": -27.87067985534668, "global_step": 635780, "epoch": 7660} {"train_loss": -27.536365509033203, "global_step": 635781, "epoch": 7660} {"train_loss": -27.55609130859375, "global_step": 635782, "epoch": 7660} {"train_loss": -27.753921508789062, "global_step": 635783, "epoch": 7660} {"train_loss": -27.6101131439209, "global_step": 635784, "epoch": 7660} {"train_loss": -27.03223991394043, "global_step": 635785, "epoch": 7660} {"train_loss": -27.731103897094727, "global_step": 635786, "epoch": 7660} {"train_loss": -28.00261878967285, "global_step": 635787, "epoch": 7660} {"train_loss": -27.489765167236328, "global_step": 635788, "epoch": 7660} {"train_loss": -27.51824951171875, "global_step": 635789, "epoch": 7660} {"train_loss": -27.304529190063477, "global_step": 635790, "epoch": 7660} {"train_loss": -27.394866943359375, "global_step": 635791, "epoch": 7660} {"train_loss": -27.999618530273438, "global_step": 635792, "epoch": 7660} {"train_loss": -27.418048858642578, "global_step": 635793, "epoch": 7660} {"train_loss": -27.737112045288086, "global_step": 635794, "epoch": 7660} {"train_loss": -27.79133415222168, "global_step": 635795, "epoch": 7660} {"train_loss": -28.131216049194336, "global_step": 635796, "epoch": 7660} {"train_loss": -27.84346580505371, "global_step": 635797, "epoch": 7660} {"train_loss": -28.181446075439453, "global_step": 635798, "epoch": 7660} {"train_loss": -27.71661376953125, "global_step": 635799, "epoch": 7660} {"train_loss": -27.851856231689453, "global_step": 635800, "epoch": 7660} {"train_loss": -27.965808868408203, "global_step": 635801, "epoch": 7660} {"train_loss": -27.95844078063965, "global_step": 635802, "epoch": 7660} {"train_loss": -28.2731876373291, "global_step": 635803, "epoch": 7660} {"train_loss": -28.155872344970703, "global_step": 635804, "epoch": 7660} {"train_loss": -28.46375846862793, "global_step": 635805, "epoch": 7660} {"train_loss": -27.94700050354004, "global_step": 635806, "epoch": 7660} {"train_loss": -28.436086654663086, "global_step": 635807, "epoch": 7660} {"train_loss": -28.256681442260742, "global_step": 635808, "epoch": 7660} {"train_loss": -28.412817001342773, "global_step": 635809, "epoch": 7660} {"train_loss": -28.125417709350586, "global_step": 635810, "epoch": 7660} {"train_loss": -28.30926513671875, "global_step": 635811, "epoch": 7660} {"train_loss": -28.627695083618164, "global_step": 635812, "epoch": 7660} {"train_loss": -28.324445724487305, "global_step": 635813, "epoch": 7660} {"train_loss": -28.182889938354492, "global_step": 635814, "epoch": 7660} {"train_loss": -28.117828369140625, "global_step": 635815, "epoch": 7660} {"train_loss": -28.271757125854492, "global_step": 635816, "epoch": 7660} {"train_loss": -28.439321517944336, "global_step": 635817, "epoch": 7660} {"train_loss": -28.50960350036621, "global_step": 635818, "epoch": 7660} {"train_loss": -28.636749267578125, "global_step": 635819, "epoch": 7660} {"train_loss": -28.285348892211914, "global_step": 635820, "epoch": 7660} {"train_loss": -28.426868438720703, "global_step": 635821, "epoch": 7660} {"train_loss": -28.29999351501465, "global_step": 635822, "epoch": 7660} {"train_loss": -28.12601661682129, "global_step": 635823, "epoch": 7660} {"train_loss": -28.391149520874023, "global_step": 635824, "epoch": 7660} {"train_loss": -28.27631950378418, "global_step": 635825, "epoch": 7660} {"train_loss": -28.24555015563965, "global_step": 635826, "epoch": 7660} {"train_loss": -28.075876235961914, "global_step": 635827, "epoch": 7660} {"train_loss": -28.34685707092285, "global_step": 635828, "epoch": 7660} {"train_loss": -28.413440704345703, "global_step": 635829, "epoch": 7660} {"train_loss": -28.532642364501953, "global_step": 635830, "epoch": 7660} {"train_loss": -28.238428115844727, "global_step": 635831, "epoch": 7660} {"train_loss": -28.4846134185791, "global_step": 635832, "epoch": 7660} {"train_loss": -28.34912109375, "global_step": 635833, "epoch": 7660} {"train_loss": -28.79242515563965, "global_step": 635834, "epoch": 7660} {"train_loss": -28.30132484436035, "global_step": 635835, "epoch": 7660} {"train_loss": -28.067785263061523, "global_step": 635836, "epoch": 7660} {"train_loss": -28.392047882080078, "global_step": 635837, "epoch": 7660} {"train_loss": -28.351215362548828, "global_step": 635838, "epoch": 7660} {"train_loss": -28.339954376220703, "global_step": 635839, "epoch": 7660} {"train_loss": -28.40692710876465, "global_step": 635840, "epoch": 7660} {"train_loss": -27.95953941345215, "global_step": 635841, "epoch": 7660} {"train_loss": -28.459997177124023, "global_step": 635842, "epoch": 7660} {"train_loss": -27.888690948486328, "global_step": 635843, "epoch": 7660} {"train_loss": -28.027246475219727, "global_step": 635844, "epoch": 7660} {"train_loss": -28.559690475463867, "global_step": 635845, "epoch": 7660} {"train_loss": -28.0699405670166, "global_step": 635846, "epoch": 7660} {"train_loss": -28.275022506713867, "global_step": 635847, "epoch": 7660} {"train_loss": -28.237207412719727, "global_step": 635848, "epoch": 7660} {"train_loss": -28.179182052612305, "global_step": 635849, "epoch": 7660} {"train_loss": -28.580442428588867, "global_step": 635850, "epoch": 7660} {"train_loss": -28.074848175048828, "global_step": 635851, "epoch": 7660} {"train_loss": -28.177106857299805, "global_step": 635852, "epoch": 7660} {"train_loss": -28.21034049987793, "global_step": 635853, "epoch": 7660} {"train_loss": -28.131011962890625, "global_step": 635854, "epoch": 7660} {"train_loss": -28.334325790405273, "global_step": 635855, "epoch": 7660} {"train_loss": -28.34823989868164, "global_step": 635856, "epoch": 7660} {"train_loss": -28.30730628967285, "global_step": 635857, "epoch": 7660} {"train_loss": -27.988239288330078, "global_step": 635858, "epoch": 7660} {"train_loss": -28.23335075378418, "global_step": 635859, "epoch": 7660} {"train_loss": -28.270980834960938, "global_step": 635860, "epoch": 7660} {"train_loss": -28.2401123046875, "global_step": 635861, "epoch": 7660} {"train_loss": -28.135258180549346, "global_step": 635862, "epoch": 7660, "val_loss": 6627551.0} {"train_loss": -28.19636344909668, "global_step": 635863, "epoch": 7661} {"train_loss": -27.41806411743164, "global_step": 635864, "epoch": 7661} {"train_loss": -27.999258041381836, "global_step": 635865, "epoch": 7661} {"train_loss": -28.153594970703125, "global_step": 635866, "epoch": 7661} {"train_loss": -28.13570213317871, "global_step": 635867, "epoch": 7661} {"train_loss": -27.396997451782227, "global_step": 635868, "epoch": 7661} {"train_loss": -28.1696720123291, "global_step": 635869, "epoch": 7661} {"train_loss": -27.91908073425293, "global_step": 635870, "epoch": 7661} {"train_loss": -28.414514541625977, "global_step": 635871, "epoch": 7661} {"train_loss": -28.249662399291992, "global_step": 635872, "epoch": 7661} {"train_loss": -27.715856552124023, "global_step": 635873, "epoch": 7661} {"train_loss": -28.073230743408203, "global_step": 635874, "epoch": 7661} {"train_loss": -27.756772994995117, "global_step": 635875, "epoch": 7661} {"train_loss": -28.202808380126953, "global_step": 635876, "epoch": 7661} {"train_loss": -28.075531005859375, "global_step": 635877, "epoch": 7661} {"train_loss": -28.26584243774414, "global_step": 635878, "epoch": 7661} {"train_loss": -28.036386489868164, "global_step": 635879, "epoch": 7661} {"train_loss": -27.9002742767334, "global_step": 635880, "epoch": 7661} {"train_loss": -28.253021240234375, "global_step": 635881, "epoch": 7661} {"train_loss": -28.068023681640625, "global_step": 635882, "epoch": 7661} {"train_loss": -27.767536163330078, "global_step": 635883, "epoch": 7661} {"train_loss": -28.298505783081055, "global_step": 635884, "epoch": 7661} {"train_loss": -27.88533592224121, "global_step": 635885, "epoch": 7661} {"train_loss": -28.394306182861328, "global_step": 635886, "epoch": 7661} {"train_loss": -28.24529457092285, "global_step": 635887, "epoch": 7661} {"train_loss": -28.25935935974121, "global_step": 635888, "epoch": 7661} {"train_loss": -27.966028213500977, "global_step": 635889, "epoch": 7661} {"train_loss": -28.055814743041992, "global_step": 635890, "epoch": 7661} {"train_loss": -28.062015533447266, "global_step": 635891, "epoch": 7661} {"train_loss": -28.134784698486328, "global_step": 635892, "epoch": 7661} {"train_loss": -28.27544593811035, "global_step": 635893, "epoch": 7661} {"train_loss": -28.558191299438477, "global_step": 635894, "epoch": 7661} {"train_loss": -28.343175888061523, "global_step": 635895, "epoch": 7661} {"train_loss": -28.229948043823242, "global_step": 635896, "epoch": 7661} {"train_loss": -28.292423248291016, "global_step": 635897, "epoch": 7661} {"train_loss": -28.185453414916992, "global_step": 635898, "epoch": 7661} {"train_loss": -28.251590728759766, "global_step": 635899, "epoch": 7661} {"train_loss": -28.347768783569336, "global_step": 635900, "epoch": 7661} {"train_loss": -27.9539852142334, "global_step": 635901, "epoch": 7661} {"train_loss": -28.020429611206055, "global_step": 635902, "epoch": 7661} {"train_loss": -27.9965763092041, "global_step": 635903, "epoch": 7661} {"train_loss": -28.1689453125, "global_step": 635904, "epoch": 7661} {"train_loss": -28.567174911499023, "global_step": 635905, "epoch": 7661} {"train_loss": -28.255094528198242, "global_step": 635906, "epoch": 7661} {"train_loss": -28.121967315673828, "global_step": 635907, "epoch": 7661} {"train_loss": -27.735015869140625, "global_step": 635908, "epoch": 7661} {"train_loss": -28.24647331237793, "global_step": 635909, "epoch": 7661} {"train_loss": -28.56284523010254, "global_step": 635910, "epoch": 7661} {"train_loss": -28.5457820892334, "global_step": 635911, "epoch": 7661} {"train_loss": -28.532155990600586, "global_step": 635912, "epoch": 7661} {"train_loss": -28.564620971679688, "global_step": 635913, "epoch": 7661} {"train_loss": -28.535749435424805, "global_step": 635914, "epoch": 7661} {"train_loss": -28.541065216064453, "global_step": 635915, "epoch": 7661} {"train_loss": -28.274423599243164, "global_step": 635916, "epoch": 7661} {"train_loss": -28.53461265563965, "global_step": 635917, "epoch": 7661} {"train_loss": -28.271291732788086, "global_step": 635918, "epoch": 7661} {"train_loss": -28.419408798217773, "global_step": 635919, "epoch": 7661} {"train_loss": -28.279998779296875, "global_step": 635920, "epoch": 7661} {"train_loss": -28.270544052124023, "global_step": 635921, "epoch": 7661} {"train_loss": -28.27010154724121, "global_step": 635922, "epoch": 7661} {"train_loss": -28.348852157592773, "global_step": 635923, "epoch": 7661} {"train_loss": -28.19630241394043, "global_step": 635924, "epoch": 7661} {"train_loss": -28.696624755859375, "global_step": 635925, "epoch": 7661} {"train_loss": -28.46100425720215, "global_step": 635926, "epoch": 7661} {"train_loss": -28.075178146362305, "global_step": 635927, "epoch": 7661} {"train_loss": -29.0379581451416, "global_step": 635928, "epoch": 7661} {"train_loss": -28.1695613861084, "global_step": 635929, "epoch": 7661} {"train_loss": -28.25248146057129, "global_step": 635930, "epoch": 7661} {"train_loss": -28.3992919921875, "global_step": 635931, "epoch": 7661} {"train_loss": -28.575183868408203, "global_step": 635932, "epoch": 7661} {"train_loss": -27.843366622924805, "global_step": 635933, "epoch": 7661} {"train_loss": -28.094257354736328, "global_step": 635934, "epoch": 7661} {"train_loss": -27.828046798706055, "global_step": 635935, "epoch": 7661} {"train_loss": -27.883228302001953, "global_step": 635936, "epoch": 7661} {"train_loss": -28.155820846557617, "global_step": 635937, "epoch": 7661} {"train_loss": -28.021265029907227, "global_step": 635938, "epoch": 7661} {"train_loss": -28.23779296875, "global_step": 635939, "epoch": 7661} {"train_loss": -28.28830337524414, "global_step": 635940, "epoch": 7661} {"train_loss": -28.134403228759766, "global_step": 635941, "epoch": 7661} {"train_loss": -28.147287368774414, "global_step": 635942, "epoch": 7661} {"train_loss": -28.118488311767578, "global_step": 635943, "epoch": 7661} {"train_loss": -27.890460968017578, "global_step": 635944, "epoch": 7661} {"train_loss": -28.201062650565643, "global_step": 635945, "epoch": 7661, "val_loss": 6647088.5} {"train_loss": -27.944711685180664, "global_step": 635946, "epoch": 7662} {"train_loss": -27.992197036743164, "global_step": 635947, "epoch": 7662} {"train_loss": -27.83786964416504, "global_step": 635948, "epoch": 7662} {"train_loss": -27.773115158081055, "global_step": 635949, "epoch": 7662} {"train_loss": -27.966995239257812, "global_step": 635950, "epoch": 7662} {"train_loss": -27.887792587280273, "global_step": 635951, "epoch": 7662} {"train_loss": -28.01533317565918, "global_step": 635952, "epoch": 7662} {"train_loss": -28.074756622314453, "global_step": 635953, "epoch": 7662} {"train_loss": -28.284650802612305, "global_step": 635954, "epoch": 7662} {"train_loss": -27.672306060791016, "global_step": 635955, "epoch": 7662} {"train_loss": -27.85991859436035, "global_step": 635956, "epoch": 7662} {"train_loss": -27.79266929626465, "global_step": 635957, "epoch": 7662} {"train_loss": -27.898359298706055, "global_step": 635958, "epoch": 7662} {"train_loss": -27.71158790588379, "global_step": 635959, "epoch": 7662} {"train_loss": -28.04396629333496, "global_step": 635960, "epoch": 7662} {"train_loss": -28.060266494750977, "global_step": 635961, "epoch": 7662} {"train_loss": -27.97212028503418, "global_step": 635962, "epoch": 7662} {"train_loss": -27.947126388549805, "global_step": 635963, "epoch": 7662} {"train_loss": -27.822967529296875, "global_step": 635964, "epoch": 7662} {"train_loss": -28.138105392456055, "global_step": 635965, "epoch": 7662} {"train_loss": -27.92889404296875, "global_step": 635966, "epoch": 7662} {"train_loss": -28.17632484436035, "global_step": 635967, "epoch": 7662} {"train_loss": -28.00262451171875, "global_step": 635968, "epoch": 7662} {"train_loss": -28.544509887695312, "global_step": 635969, "epoch": 7662} {"train_loss": -28.147958755493164, "global_step": 635970, "epoch": 7662} {"train_loss": -28.045272827148438, "global_step": 635971, "epoch": 7662} {"train_loss": -28.161788940429688, "global_step": 635972, "epoch": 7662} {"train_loss": -28.474090576171875, "global_step": 635973, "epoch": 7662} {"train_loss": -28.203418731689453, "global_step": 635974, "epoch": 7662} {"train_loss": -28.011911392211914, "global_step": 635975, "epoch": 7662} {"train_loss": -27.96099853515625, "global_step": 635976, "epoch": 7662} {"train_loss": -28.056976318359375, "global_step": 635977, "epoch": 7662} {"train_loss": -28.22027587890625, "global_step": 635978, "epoch": 7662} {"train_loss": -28.385053634643555, "global_step": 635979, "epoch": 7662} {"train_loss": -28.1653995513916, "global_step": 635980, "epoch": 7662} {"train_loss": -28.294193267822266, "global_step": 635981, "epoch": 7662} {"train_loss": -28.632587432861328, "global_step": 635982, "epoch": 7662} {"train_loss": -28.208444595336914, "global_step": 635983, "epoch": 7662} {"train_loss": -28.148303985595703, "global_step": 635984, "epoch": 7662} {"train_loss": -28.18263816833496, "global_step": 635985, "epoch": 7662} {"train_loss": -28.531408309936523, "global_step": 635986, "epoch": 7662} {"train_loss": -28.21917724609375, "global_step": 635987, "epoch": 7662} {"train_loss": -28.4481258392334, "global_step": 635988, "epoch": 7662} {"train_loss": -28.393686294555664, "global_step": 635989, "epoch": 7662} {"train_loss": -28.882715225219727, "global_step": 635990, "epoch": 7662} {"train_loss": -28.491235733032227, "global_step": 635991, "epoch": 7662} {"train_loss": -28.633289337158203, "global_step": 635992, "epoch": 7662} {"train_loss": -28.402515411376953, "global_step": 635993, "epoch": 7662} {"train_loss": -28.546796798706055, "global_step": 635994, "epoch": 7662} {"train_loss": -27.630767822265625, "global_step": 635995, "epoch": 7662} {"train_loss": -27.989194869995117, "global_step": 635996, "epoch": 7662} {"train_loss": -27.339670181274414, "global_step": 635997, "epoch": 7662} {"train_loss": -27.44351577758789, "global_step": 635998, "epoch": 7662} {"train_loss": -27.8302001953125, "global_step": 635999, "epoch": 7662} {"train_loss": -28.6063232421875, "global_step": 636000, "epoch": 7662} {"train_loss": -28.2034854888916, "global_step": 636001, "epoch": 7662} {"train_loss": -27.745725631713867, "global_step": 636002, "epoch": 7662} {"train_loss": -28.185522079467773, "global_step": 636003, "epoch": 7662} {"train_loss": -27.99234390258789, "global_step": 636004, "epoch": 7662} {"train_loss": -28.082345962524414, "global_step": 636005, "epoch": 7662} {"train_loss": -28.16973304748535, "global_step": 636006, "epoch": 7662} {"train_loss": -28.18731689453125, "global_step": 636007, "epoch": 7662} {"train_loss": -28.04801368713379, "global_step": 636008, "epoch": 7662} {"train_loss": -28.145938873291016, "global_step": 636009, "epoch": 7662} {"train_loss": -28.493947982788086, "global_step": 636010, "epoch": 7662} {"train_loss": -27.902637481689453, "global_step": 636011, "epoch": 7662} {"train_loss": -28.232370376586914, "global_step": 636012, "epoch": 7662} {"train_loss": -28.498273849487305, "global_step": 636013, "epoch": 7662} {"train_loss": -28.38484764099121, "global_step": 636014, "epoch": 7662} {"train_loss": -28.031904220581055, "global_step": 636015, "epoch": 7662} {"train_loss": -28.08001708984375, "global_step": 636016, "epoch": 7662} {"train_loss": -28.274335861206055, "global_step": 636017, "epoch": 7662} {"train_loss": -27.866491317749023, "global_step": 636018, "epoch": 7662} {"train_loss": -28.088459014892578, "global_step": 636019, "epoch": 7662} {"train_loss": -28.168264389038086, "global_step": 636020, "epoch": 7662} {"train_loss": -28.1829833984375, "global_step": 636021, "epoch": 7662} {"train_loss": -28.324914932250977, "global_step": 636022, "epoch": 7662} {"train_loss": -27.677091598510742, "global_step": 636023, "epoch": 7662} {"train_loss": -27.600116729736328, "global_step": 636024, "epoch": 7662} {"train_loss": -28.106281280517578, "global_step": 636025, "epoch": 7662} {"train_loss": -28.254989624023438, "global_step": 636026, "epoch": 7662} {"train_loss": -28.216400146484375, "global_step": 636027, "epoch": 7662} {"train_loss": -28.10088435713067, "global_step": 636028, "epoch": 7662, "val_loss": 6556637.0} {"train_loss": -26.126312255859375, "global_step": 636029, "epoch": 7663} {"train_loss": -26.30571937561035, "global_step": 636030, "epoch": 7663} {"train_loss": -26.94837760925293, "global_step": 636031, "epoch": 7663} {"train_loss": -27.413724899291992, "global_step": 636032, "epoch": 7663} {"train_loss": -26.400175094604492, "global_step": 636033, "epoch": 7663} {"train_loss": -27.75031089782715, "global_step": 636034, "epoch": 7663} {"train_loss": -27.734771728515625, "global_step": 636035, "epoch": 7663} {"train_loss": -26.968488693237305, "global_step": 636036, "epoch": 7663} {"train_loss": -27.950483322143555, "global_step": 636037, "epoch": 7663} {"train_loss": -27.14984703063965, "global_step": 636038, "epoch": 7663} {"train_loss": -27.19463539123535, "global_step": 636039, "epoch": 7663} {"train_loss": -26.643903732299805, "global_step": 636040, "epoch": 7663} {"train_loss": -27.2813777923584, "global_step": 636041, "epoch": 7663} {"train_loss": -27.456998825073242, "global_step": 636042, "epoch": 7663} {"train_loss": -27.47356605529785, "global_step": 636043, "epoch": 7663} {"train_loss": -27.897109985351562, "global_step": 636044, "epoch": 7663} {"train_loss": -27.425939559936523, "global_step": 636045, "epoch": 7663} {"train_loss": -27.67276954650879, "global_step": 636046, "epoch": 7663} {"train_loss": -27.285764694213867, "global_step": 636047, "epoch": 7663} {"train_loss": -27.976383209228516, "global_step": 636048, "epoch": 7663} {"train_loss": -27.82794761657715, "global_step": 636049, "epoch": 7663} {"train_loss": -27.77579689025879, "global_step": 636050, "epoch": 7663} {"train_loss": -27.914581298828125, "global_step": 636051, "epoch": 7663} {"train_loss": -27.531848907470703, "global_step": 636052, "epoch": 7663} {"train_loss": -27.852155685424805, "global_step": 636053, "epoch": 7663} {"train_loss": -27.98508644104004, "global_step": 636054, "epoch": 7663} {"train_loss": -27.99879264831543, "global_step": 636055, "epoch": 7663} {"train_loss": -28.032169342041016, "global_step": 636056, "epoch": 7663} {"train_loss": -27.960927963256836, "global_step": 636057, "epoch": 7663} {"train_loss": -28.291101455688477, "global_step": 636058, "epoch": 7663} {"train_loss": -27.76618766784668, "global_step": 636059, "epoch": 7663} {"train_loss": -28.1920223236084, "global_step": 636060, "epoch": 7663} {"train_loss": -28.300268173217773, "global_step": 636061, "epoch": 7663} {"train_loss": -28.212060928344727, "global_step": 636062, "epoch": 7663} {"train_loss": -28.495920181274414, "global_step": 636063, "epoch": 7663} {"train_loss": -28.1121826171875, "global_step": 636064, "epoch": 7663} {"train_loss": -28.489343643188477, "global_step": 636065, "epoch": 7663} {"train_loss": -28.66535758972168, "global_step": 636066, "epoch": 7663} {"train_loss": -28.361692428588867, "global_step": 636067, "epoch": 7663} {"train_loss": -27.746118545532227, "global_step": 636068, "epoch": 7663} {"train_loss": -28.338031768798828, "global_step": 636069, "epoch": 7663} {"train_loss": -28.144636154174805, "global_step": 636070, "epoch": 7663} {"train_loss": -27.978668212890625, "global_step": 636071, "epoch": 7663} {"train_loss": -28.25065040588379, "global_step": 636072, "epoch": 7663} {"train_loss": -28.67365074157715, "global_step": 636073, "epoch": 7663} {"train_loss": -28.259063720703125, "global_step": 636074, "epoch": 7663} {"train_loss": -28.144315719604492, "global_step": 636075, "epoch": 7663} {"train_loss": -28.03658103942871, "global_step": 636076, "epoch": 7663} {"train_loss": -27.7528018951416, "global_step": 636077, "epoch": 7663} {"train_loss": -27.895532608032227, "global_step": 636078, "epoch": 7663} {"train_loss": -27.93755531311035, "global_step": 636079, "epoch": 7663} {"train_loss": -27.925033569335938, "global_step": 636080, "epoch": 7663} {"train_loss": -28.20366859436035, "global_step": 636081, "epoch": 7663} {"train_loss": -28.096012115478516, "global_step": 636082, "epoch": 7663} {"train_loss": -28.46002769470215, "global_step": 636083, "epoch": 7663} {"train_loss": -28.140295028686523, "global_step": 636084, "epoch": 7663} {"train_loss": -27.894861221313477, "global_step": 636085, "epoch": 7663} {"train_loss": -27.870193481445312, "global_step": 636086, "epoch": 7663} {"train_loss": -28.22747230529785, "global_step": 636087, "epoch": 7663} {"train_loss": -28.27691650390625, "global_step": 636088, "epoch": 7663} {"train_loss": -28.525089263916016, "global_step": 636089, "epoch": 7663} {"train_loss": -28.226993560791016, "global_step": 636090, "epoch": 7663} {"train_loss": -28.65595817565918, "global_step": 636091, "epoch": 7663} {"train_loss": -28.231306076049805, "global_step": 636092, "epoch": 7663} {"train_loss": -28.283300399780273, "global_step": 636093, "epoch": 7663} {"train_loss": -28.53632164001465, "global_step": 636094, "epoch": 7663} {"train_loss": -28.686859130859375, "global_step": 636095, "epoch": 7663} {"train_loss": -28.1627197265625, "global_step": 636096, "epoch": 7663} {"train_loss": -28.230487823486328, "global_step": 636097, "epoch": 7663} {"train_loss": -28.632123947143555, "global_step": 636098, "epoch": 7663} {"train_loss": -28.434789657592773, "global_step": 636099, "epoch": 7663} {"train_loss": -29.05402946472168, "global_step": 636100, "epoch": 7663} {"train_loss": -28.6103515625, "global_step": 636101, "epoch": 7663} {"train_loss": -28.84317398071289, "global_step": 636102, "epoch": 7663} {"train_loss": -28.429304122924805, "global_step": 636103, "epoch": 7663} {"train_loss": -28.419158935546875, "global_step": 636104, "epoch": 7663} {"train_loss": -28.15240478515625, "global_step": 636105, "epoch": 7663} {"train_loss": -28.326358795166016, "global_step": 636106, "epoch": 7663} {"train_loss": -28.53219985961914, "global_step": 636107, "epoch": 7663} {"train_loss": -28.37078285217285, "global_step": 636108, "epoch": 7663} {"train_loss": -28.39697265625, "global_step": 636109, "epoch": 7663} {"train_loss": -28.48308753967285, "global_step": 636110, "epoch": 7663} {"train_loss": -27.99469979987087, "global_step": 636111, "epoch": 7663, "val_loss": 6585557.0} {"train_loss": -27.86960792541504, "global_step": 636112, "epoch": 7664} {"train_loss": -26.913129806518555, "global_step": 636113, "epoch": 7664} {"train_loss": -27.44167137145996, "global_step": 636114, "epoch": 7664} {"train_loss": -26.776330947875977, "global_step": 636115, "epoch": 7664} {"train_loss": -27.147998809814453, "global_step": 636116, "epoch": 7664} {"train_loss": -28.02585220336914, "global_step": 636117, "epoch": 7664} {"train_loss": -27.05588722229004, "global_step": 636118, "epoch": 7664} {"train_loss": -28.070209503173828, "global_step": 636119, "epoch": 7664} {"train_loss": -28.259967803955078, "global_step": 636120, "epoch": 7664} {"train_loss": -27.48700523376465, "global_step": 636121, "epoch": 7664} {"train_loss": -27.986230850219727, "global_step": 636122, "epoch": 7664} {"train_loss": -27.785985946655273, "global_step": 636123, "epoch": 7664} {"train_loss": -27.763751983642578, "global_step": 636124, "epoch": 7664} {"train_loss": -27.834257125854492, "global_step": 636125, "epoch": 7664} {"train_loss": -28.140716552734375, "global_step": 636126, "epoch": 7664} {"train_loss": -27.646711349487305, "global_step": 636127, "epoch": 7664} {"train_loss": -28.008716583251953, "global_step": 636128, "epoch": 7664} {"train_loss": -27.52080726623535, "global_step": 636129, "epoch": 7664} {"train_loss": -27.571456909179688, "global_step": 636130, "epoch": 7664} {"train_loss": -27.72212028503418, "global_step": 636131, "epoch": 7664} {"train_loss": -27.83452796936035, "global_step": 636132, "epoch": 7664} {"train_loss": -28.245513916015625, "global_step": 636133, "epoch": 7664} {"train_loss": -27.832473754882812, "global_step": 636134, "epoch": 7664} {"train_loss": -28.114240646362305, "global_step": 636135, "epoch": 7664} {"train_loss": -27.98142433166504, "global_step": 636136, "epoch": 7664} {"train_loss": -28.557172775268555, "global_step": 636137, "epoch": 7664} {"train_loss": -27.914865493774414, "global_step": 636138, "epoch": 7664} {"train_loss": -28.272567749023438, "global_step": 636139, "epoch": 7664} {"train_loss": -28.40717124938965, "global_step": 636140, "epoch": 7664} {"train_loss": -27.91109275817871, "global_step": 636141, "epoch": 7664} {"train_loss": -28.307950973510742, "global_step": 636142, "epoch": 7664} {"train_loss": -28.031057357788086, "global_step": 636143, "epoch": 7664} {"train_loss": -28.272443771362305, "global_step": 636144, "epoch": 7664} {"train_loss": -28.060638427734375, "global_step": 636145, "epoch": 7664} {"train_loss": -28.158597946166992, "global_step": 636146, "epoch": 7664} {"train_loss": -28.10898208618164, "global_step": 636147, "epoch": 7664} {"train_loss": -28.2440242767334, "global_step": 636148, "epoch": 7664} {"train_loss": -28.088058471679688, "global_step": 636149, "epoch": 7664} {"train_loss": -28.387897491455078, "global_step": 636150, "epoch": 7664} {"train_loss": -28.28193473815918, "global_step": 636151, "epoch": 7664} {"train_loss": -28.048919677734375, "global_step": 636152, "epoch": 7664} {"train_loss": -28.004810333251953, "global_step": 636153, "epoch": 7664} {"train_loss": -28.4287052154541, "global_step": 636154, "epoch": 7664} {"train_loss": -28.1728572845459, "global_step": 636155, "epoch": 7664} {"train_loss": -28.391632080078125, "global_step": 636156, "epoch": 7664} {"train_loss": -28.834217071533203, "global_step": 636157, "epoch": 7664} {"train_loss": -28.346359252929688, "global_step": 636158, "epoch": 7664} {"train_loss": -28.47720718383789, "global_step": 636159, "epoch": 7664} {"train_loss": -28.428787231445312, "global_step": 636160, "epoch": 7664} {"train_loss": -28.437055587768555, "global_step": 636161, "epoch": 7664} {"train_loss": -28.304580688476562, "global_step": 636162, "epoch": 7664} {"train_loss": -28.467504501342773, "global_step": 636163, "epoch": 7664} {"train_loss": -28.547332763671875, "global_step": 636164, "epoch": 7664} {"train_loss": -28.256134033203125, "global_step": 636165, "epoch": 7664} {"train_loss": -28.188852310180664, "global_step": 636166, "epoch": 7664} {"train_loss": -28.263996124267578, "global_step": 636167, "epoch": 7664} {"train_loss": -28.219369888305664, "global_step": 636168, "epoch": 7664} {"train_loss": -28.273645401000977, "global_step": 636169, "epoch": 7664} {"train_loss": -28.421003341674805, "global_step": 636170, "epoch": 7664} {"train_loss": -28.495214462280273, "global_step": 636171, "epoch": 7664} {"train_loss": -28.500782012939453, "global_step": 636172, "epoch": 7664} {"train_loss": -28.681928634643555, "global_step": 636173, "epoch": 7664} {"train_loss": -28.29248046875, "global_step": 636174, "epoch": 7664} {"train_loss": -28.3555908203125, "global_step": 636175, "epoch": 7664} {"train_loss": -28.339740753173828, "global_step": 636176, "epoch": 7664} {"train_loss": -28.404333114624023, "global_step": 636177, "epoch": 7664} {"train_loss": -27.884851455688477, "global_step": 636178, "epoch": 7664} {"train_loss": -27.934207916259766, "global_step": 636179, "epoch": 7664} {"train_loss": -27.981937408447266, "global_step": 636180, "epoch": 7664} {"train_loss": -28.253881454467773, "global_step": 636181, "epoch": 7664} {"train_loss": -28.283361434936523, "global_step": 636182, "epoch": 7664} {"train_loss": -28.446979522705078, "global_step": 636183, "epoch": 7664} {"train_loss": -28.490461349487305, "global_step": 636184, "epoch": 7664} {"train_loss": -28.343475341796875, "global_step": 636185, "epoch": 7664} {"train_loss": -27.9949951171875, "global_step": 636186, "epoch": 7664} {"train_loss": -27.91839599609375, "global_step": 636187, "epoch": 7664} {"train_loss": -28.26360511779785, "global_step": 636188, "epoch": 7664} {"train_loss": -28.4473934173584, "global_step": 636189, "epoch": 7664} {"train_loss": -28.697431564331055, "global_step": 636190, "epoch": 7664} {"train_loss": -27.8682861328125, "global_step": 636191, "epoch": 7664} {"train_loss": -27.990341186523438, "global_step": 636192, "epoch": 7664} {"train_loss": -28.138254165649414, "global_step": 636193, "epoch": 7664} {"train_loss": -28.10502888782915, "global_step": 636194, "epoch": 7664, "val_loss": 6646341.5} {"train_loss": -26.787633895874023, "global_step": 636195, "epoch": 7665} {"train_loss": -25.30928611755371, "global_step": 636196, "epoch": 7665} {"train_loss": -25.94234275817871, "global_step": 636197, "epoch": 7665} {"train_loss": -27.6320858001709, "global_step": 636198, "epoch": 7665} {"train_loss": -27.046878814697266, "global_step": 636199, "epoch": 7665} {"train_loss": -27.21406364440918, "global_step": 636200, "epoch": 7665} {"train_loss": -27.4634952545166, "global_step": 636201, "epoch": 7665} {"train_loss": -26.876007080078125, "global_step": 636202, "epoch": 7665} {"train_loss": -27.551898956298828, "global_step": 636203, "epoch": 7665} {"train_loss": -27.351215362548828, "global_step": 636204, "epoch": 7665} {"train_loss": -26.829679489135742, "global_step": 636205, "epoch": 7665} {"train_loss": -27.829992294311523, "global_step": 636206, "epoch": 7665} {"train_loss": -27.82834815979004, "global_step": 636207, "epoch": 7665} {"train_loss": -27.211660385131836, "global_step": 636208, "epoch": 7665} {"train_loss": -27.367584228515625, "global_step": 636209, "epoch": 7665} {"train_loss": -27.557355880737305, "global_step": 636210, "epoch": 7665} {"train_loss": -27.793012619018555, "global_step": 636211, "epoch": 7665} {"train_loss": -27.713830947875977, "global_step": 636212, "epoch": 7665} {"train_loss": -27.357940673828125, "global_step": 636213, "epoch": 7665} {"train_loss": -27.630603790283203, "global_step": 636214, "epoch": 7665} {"train_loss": -28.105615615844727, "global_step": 636215, "epoch": 7665} {"train_loss": -28.060205459594727, "global_step": 636216, "epoch": 7665} {"train_loss": -27.841033935546875, "global_step": 636217, "epoch": 7665} {"train_loss": -28.03822135925293, "global_step": 636218, "epoch": 7665} {"train_loss": -27.878976821899414, "global_step": 636219, "epoch": 7665} {"train_loss": -27.927854537963867, "global_step": 636220, "epoch": 7665} {"train_loss": -27.9052734375, "global_step": 636221, "epoch": 7665} {"train_loss": -28.149450302124023, "global_step": 636222, "epoch": 7665} {"train_loss": -28.047555923461914, "global_step": 636223, "epoch": 7665} {"train_loss": -27.87449073791504, "global_step": 636224, "epoch": 7665} {"train_loss": -28.01493263244629, "global_step": 636225, "epoch": 7665} {"train_loss": -27.903905868530273, "global_step": 636226, "epoch": 7665} {"train_loss": -28.14179801940918, "global_step": 636227, "epoch": 7665} {"train_loss": -27.918792724609375, "global_step": 636228, "epoch": 7665} {"train_loss": -27.966543197631836, "global_step": 636229, "epoch": 7665} {"train_loss": -28.037755966186523, "global_step": 636230, "epoch": 7665} {"train_loss": -28.301666259765625, "global_step": 636231, "epoch": 7665} {"train_loss": -28.38828468322754, "global_step": 636232, "epoch": 7665} {"train_loss": -28.429523468017578, "global_step": 636233, "epoch": 7665} {"train_loss": -28.340009689331055, "global_step": 636234, "epoch": 7665} {"train_loss": -28.001800537109375, "global_step": 636235, "epoch": 7665} {"train_loss": -28.322294235229492, "global_step": 636236, "epoch": 7665} {"train_loss": -28.138166427612305, "global_step": 636237, "epoch": 7665} {"train_loss": -28.10693359375, "global_step": 636238, "epoch": 7665} {"train_loss": -28.6007137298584, "global_step": 636239, "epoch": 7665} {"train_loss": -28.373777389526367, "global_step": 636240, "epoch": 7665} {"train_loss": -27.98431396484375, "global_step": 636241, "epoch": 7665} {"train_loss": -28.333234786987305, "global_step": 636242, "epoch": 7665} {"train_loss": -28.0467472076416, "global_step": 636243, "epoch": 7665} {"train_loss": -28.254199981689453, "global_step": 636244, "epoch": 7665} {"train_loss": -27.862340927124023, "global_step": 636245, "epoch": 7665} {"train_loss": -28.248666763305664, "global_step": 636246, "epoch": 7665} {"train_loss": -28.149612426757812, "global_step": 636247, "epoch": 7665} {"train_loss": -28.43189811706543, "global_step": 636248, "epoch": 7665} {"train_loss": -28.380517959594727, "global_step": 636249, "epoch": 7665} {"train_loss": -28.115686416625977, "global_step": 636250, "epoch": 7665} {"train_loss": -28.350940704345703, "global_step": 636251, "epoch": 7665} {"train_loss": -28.544391632080078, "global_step": 636252, "epoch": 7665} {"train_loss": -28.342458724975586, "global_step": 636253, "epoch": 7665} {"train_loss": -28.50070571899414, "global_step": 636254, "epoch": 7665} {"train_loss": -28.37507438659668, "global_step": 636255, "epoch": 7665} {"train_loss": -28.37726402282715, "global_step": 636256, "epoch": 7665} {"train_loss": -28.70218849182129, "global_step": 636257, "epoch": 7665} {"train_loss": -28.40789222717285, "global_step": 636258, "epoch": 7665} {"train_loss": -28.0954647064209, "global_step": 636259, "epoch": 7665} {"train_loss": -28.42963218688965, "global_step": 636260, "epoch": 7665} {"train_loss": -28.2994441986084, "global_step": 636261, "epoch": 7665} {"train_loss": -28.12227439880371, "global_step": 636262, "epoch": 7665} {"train_loss": -28.0998477935791, "global_step": 636263, "epoch": 7665} {"train_loss": -28.258874893188477, "global_step": 636264, "epoch": 7665} {"train_loss": -28.420740127563477, "global_step": 636265, "epoch": 7665} {"train_loss": -28.411588668823242, "global_step": 636266, "epoch": 7665} {"train_loss": -28.236042022705078, "global_step": 636267, "epoch": 7665} {"train_loss": -28.474069595336914, "global_step": 636268, "epoch": 7665} {"train_loss": -28.194387435913086, "global_step": 636269, "epoch": 7665} {"train_loss": -28.485082626342773, "global_step": 636270, "epoch": 7665} {"train_loss": -28.0660457611084, "global_step": 636271, "epoch": 7665} {"train_loss": -28.6957950592041, "global_step": 636272, "epoch": 7665} {"train_loss": -28.579986572265625, "global_step": 636273, "epoch": 7665} {"train_loss": -27.921579360961914, "global_step": 636274, "epoch": 7665} {"train_loss": -28.667200088500977, "global_step": 636275, "epoch": 7665} {"train_loss": -28.114587783813477, "global_step": 636276, "epoch": 7665} {"train_loss": -27.98057160894555, "global_step": 636277, "epoch": 7665, "val_loss": 6644949.0} {"train_loss": -27.12006950378418, "global_step": 636278, "epoch": 7666} {"train_loss": -27.102880477905273, "global_step": 636279, "epoch": 7666} {"train_loss": -27.409637451171875, "global_step": 636280, "epoch": 7666} {"train_loss": -27.282773971557617, "global_step": 636281, "epoch": 7666} {"train_loss": -27.016382217407227, "global_step": 636282, "epoch": 7666} {"train_loss": -27.154266357421875, "global_step": 636283, "epoch": 7666} {"train_loss": -27.160541534423828, "global_step": 636284, "epoch": 7666} {"train_loss": -27.367605209350586, "global_step": 636285, "epoch": 7666} {"train_loss": -27.327285766601562, "global_step": 636286, "epoch": 7666} {"train_loss": -27.505115509033203, "global_step": 636287, "epoch": 7666} {"train_loss": -27.60525894165039, "global_step": 636288, "epoch": 7666} {"train_loss": -27.47549819946289, "global_step": 636289, "epoch": 7666} {"train_loss": -27.700565338134766, "global_step": 636290, "epoch": 7666} {"train_loss": -27.031469345092773, "global_step": 636291, "epoch": 7666} {"train_loss": -27.58558464050293, "global_step": 636292, "epoch": 7666} {"train_loss": -27.72464942932129, "global_step": 636293, "epoch": 7666} {"train_loss": -27.474964141845703, "global_step": 636294, "epoch": 7666} {"train_loss": -27.712085723876953, "global_step": 636295, "epoch": 7666} {"train_loss": -27.713247299194336, "global_step": 636296, "epoch": 7666} {"train_loss": -27.900379180908203, "global_step": 636297, "epoch": 7666} {"train_loss": -27.761098861694336, "global_step": 636298, "epoch": 7666} {"train_loss": -27.341230392456055, "global_step": 636299, "epoch": 7666} {"train_loss": -27.57196044921875, "global_step": 636300, "epoch": 7666} {"train_loss": -28.0515193939209, "global_step": 636301, "epoch": 7666} {"train_loss": -27.944427490234375, "global_step": 636302, "epoch": 7666} {"train_loss": -28.12384605407715, "global_step": 636303, "epoch": 7666} {"train_loss": -27.593109130859375, "global_step": 636304, "epoch": 7666} {"train_loss": -27.8187313079834, "global_step": 636305, "epoch": 7666} {"train_loss": -27.622812271118164, "global_step": 636306, "epoch": 7666} {"train_loss": -27.649946212768555, "global_step": 636307, "epoch": 7666} {"train_loss": -28.44692039489746, "global_step": 636308, "epoch": 7666} {"train_loss": -27.648839950561523, "global_step": 636309, "epoch": 7666} {"train_loss": -28.13189697265625, "global_step": 636310, "epoch": 7666} {"train_loss": -28.082738876342773, "global_step": 636311, "epoch": 7666} {"train_loss": -28.35089683532715, "global_step": 636312, "epoch": 7666} {"train_loss": -28.057758331298828, "global_step": 636313, "epoch": 7666} {"train_loss": -28.29644775390625, "global_step": 636314, "epoch": 7666} {"train_loss": -27.93706703186035, "global_step": 636315, "epoch": 7666} {"train_loss": -28.106613159179688, "global_step": 636316, "epoch": 7666} {"train_loss": -28.281421661376953, "global_step": 636317, "epoch": 7666} {"train_loss": -28.330108642578125, "global_step": 636318, "epoch": 7666} {"train_loss": -28.50665855407715, "global_step": 636319, "epoch": 7666} {"train_loss": -28.444019317626953, "global_step": 636320, "epoch": 7666} {"train_loss": -28.509540557861328, "global_step": 636321, "epoch": 7666} {"train_loss": -28.06818962097168, "global_step": 636322, "epoch": 7666} {"train_loss": -28.585134506225586, "global_step": 636323, "epoch": 7666} {"train_loss": -28.27312660217285, "global_step": 636324, "epoch": 7666} {"train_loss": -28.042150497436523, "global_step": 636325, "epoch": 7666} {"train_loss": -28.222375869750977, "global_step": 636326, "epoch": 7666} {"train_loss": -28.444623947143555, "global_step": 636327, "epoch": 7666} {"train_loss": -28.065460205078125, "global_step": 636328, "epoch": 7666} {"train_loss": -28.367456436157227, "global_step": 636329, "epoch": 7666} {"train_loss": -28.357406616210938, "global_step": 636330, "epoch": 7666} {"train_loss": -28.655517578125, "global_step": 636331, "epoch": 7666} {"train_loss": -28.787128448486328, "global_step": 636332, "epoch": 7666} {"train_loss": -28.46597671508789, "global_step": 636333, "epoch": 7666} {"train_loss": -28.307199478149414, "global_step": 636334, "epoch": 7666} {"train_loss": -28.340436935424805, "global_step": 636335, "epoch": 7666} {"train_loss": -28.562519073486328, "global_step": 636336, "epoch": 7666} {"train_loss": -28.35150146484375, "global_step": 636337, "epoch": 7666} {"train_loss": -28.596067428588867, "global_step": 636338, "epoch": 7666} {"train_loss": -27.996448516845703, "global_step": 636339, "epoch": 7666} {"train_loss": -28.111188888549805, "global_step": 636340, "epoch": 7666} {"train_loss": -27.617055892944336, "global_step": 636341, "epoch": 7666} {"train_loss": -26.521764755249023, "global_step": 636342, "epoch": 7666} {"train_loss": -26.926223754882812, "global_step": 636343, "epoch": 7666} {"train_loss": -28.220617294311523, "global_step": 636344, "epoch": 7666} {"train_loss": -27.229450225830078, "global_step": 636345, "epoch": 7666} {"train_loss": -27.522329330444336, "global_step": 636346, "epoch": 7666} {"train_loss": -27.99338150024414, "global_step": 636347, "epoch": 7666} {"train_loss": -27.874608993530273, "global_step": 636348, "epoch": 7666} {"train_loss": -27.8143367767334, "global_step": 636349, "epoch": 7666} {"train_loss": -28.272642135620117, "global_step": 636350, "epoch": 7666} {"train_loss": -28.010427474975586, "global_step": 636351, "epoch": 7666} {"train_loss": -28.604328155517578, "global_step": 636352, "epoch": 7666} {"train_loss": -28.065521240234375, "global_step": 636353, "epoch": 7666} {"train_loss": -28.14912223815918, "global_step": 636354, "epoch": 7666} {"train_loss": -28.17012596130371, "global_step": 636355, "epoch": 7666} {"train_loss": -28.421066284179688, "global_step": 636356, "epoch": 7666} {"train_loss": -27.766529083251953, "global_step": 636357, "epoch": 7666} {"train_loss": -28.37833023071289, "global_step": 636358, "epoch": 7666} {"train_loss": -28.533588409423828, "global_step": 636359, "epoch": 7666} {"train_loss": -27.923797768282604, "global_step": 636360, "epoch": 7666, "val_loss": 6705345.5} {"train_loss": -27.106952667236328, "global_step": 636361, "epoch": 7667} {"train_loss": -26.797971725463867, "global_step": 636362, "epoch": 7667} {"train_loss": -27.483434677124023, "global_step": 636363, "epoch": 7667} {"train_loss": -27.589380264282227, "global_step": 636364, "epoch": 7667} {"train_loss": -27.302045822143555, "global_step": 636365, "epoch": 7667} {"train_loss": -27.3962345123291, "global_step": 636366, "epoch": 7667} {"train_loss": -27.4052734375, "global_step": 636367, "epoch": 7667} {"train_loss": -27.363927841186523, "global_step": 636368, "epoch": 7667} {"train_loss": -27.012100219726562, "global_step": 636369, "epoch": 7667} {"train_loss": -27.556684494018555, "global_step": 636370, "epoch": 7667} {"train_loss": -27.369470596313477, "global_step": 636371, "epoch": 7667} {"train_loss": -27.99784278869629, "global_step": 636372, "epoch": 7667} {"train_loss": -27.884296417236328, "global_step": 636373, "epoch": 7667} {"train_loss": -27.558332443237305, "global_step": 636374, "epoch": 7667} {"train_loss": -27.36577796936035, "global_step": 636375, "epoch": 7667} {"train_loss": -27.92365837097168, "global_step": 636376, "epoch": 7667} {"train_loss": -27.83953285217285, "global_step": 636377, "epoch": 7667} {"train_loss": -27.698144912719727, "global_step": 636378, "epoch": 7667} {"train_loss": -27.653522491455078, "global_step": 636379, "epoch": 7667} {"train_loss": -27.883380889892578, "global_step": 636380, "epoch": 7667} {"train_loss": -27.690160751342773, "global_step": 636381, "epoch": 7667} {"train_loss": -28.466537475585938, "global_step": 636382, "epoch": 7667} {"train_loss": -28.039947509765625, "global_step": 636383, "epoch": 7667} {"train_loss": -28.010700225830078, "global_step": 636384, "epoch": 7667} {"train_loss": -27.8834285736084, "global_step": 636385, "epoch": 7667} {"train_loss": -27.72877311706543, "global_step": 636386, "epoch": 7667} {"train_loss": -28.067602157592773, "global_step": 636387, "epoch": 7667} {"train_loss": -27.972824096679688, "global_step": 636388, "epoch": 7667} {"train_loss": -28.0208740234375, "global_step": 636389, "epoch": 7667} {"train_loss": -28.170185089111328, "global_step": 636390, "epoch": 7667} {"train_loss": -28.166845321655273, "global_step": 636391, "epoch": 7667} {"train_loss": -27.775531768798828, "global_step": 636392, "epoch": 7667} {"train_loss": -28.112268447875977, "global_step": 636393, "epoch": 7667} {"train_loss": -28.008337020874023, "global_step": 636394, "epoch": 7667} {"train_loss": -28.51045036315918, "global_step": 636395, "epoch": 7667} {"train_loss": -28.250085830688477, "global_step": 636396, "epoch": 7667} {"train_loss": -28.414169311523438, "global_step": 636397, "epoch": 7667} {"train_loss": -28.256391525268555, "global_step": 636398, "epoch": 7667} {"train_loss": -28.042755126953125, "global_step": 636399, "epoch": 7667} {"train_loss": -28.082578659057617, "global_step": 636400, "epoch": 7667} {"train_loss": -28.13205337524414, "global_step": 636401, "epoch": 7667} {"train_loss": -28.259557723999023, "global_step": 636402, "epoch": 7667} {"train_loss": -28.176767349243164, "global_step": 636403, "epoch": 7667} {"train_loss": -28.2213191986084, "global_step": 636404, "epoch": 7667} {"train_loss": -27.697751998901367, "global_step": 636405, "epoch": 7667} {"train_loss": -28.238473892211914, "global_step": 636406, "epoch": 7667} {"train_loss": -28.548828125, "global_step": 636407, "epoch": 7667} {"train_loss": -28.339481353759766, "global_step": 636408, "epoch": 7667} {"train_loss": -28.71282958984375, "global_step": 636409, "epoch": 7667} {"train_loss": -28.47564697265625, "global_step": 636410, "epoch": 7667} {"train_loss": -28.240217208862305, "global_step": 636411, "epoch": 7667} {"train_loss": -28.13618278503418, "global_step": 636412, "epoch": 7667} {"train_loss": -28.472089767456055, "global_step": 636413, "epoch": 7667} {"train_loss": -28.477340698242188, "global_step": 636414, "epoch": 7667} {"train_loss": -28.617902755737305, "global_step": 636415, "epoch": 7667} {"train_loss": -28.5875186920166, "global_step": 636416, "epoch": 7667} {"train_loss": -28.34451675415039, "global_step": 636417, "epoch": 7667} {"train_loss": -28.901220321655273, "global_step": 636418, "epoch": 7667} {"train_loss": -28.774450302124023, "global_step": 636419, "epoch": 7667} {"train_loss": -27.993860244750977, "global_step": 636420, "epoch": 7667} {"train_loss": -28.08856773376465, "global_step": 636421, "epoch": 7667} {"train_loss": -28.645292282104492, "global_step": 636422, "epoch": 7667} {"train_loss": -28.267892837524414, "global_step": 636423, "epoch": 7667} {"train_loss": -28.690948486328125, "global_step": 636424, "epoch": 7667} {"train_loss": -28.58302879333496, "global_step": 636425, "epoch": 7667} {"train_loss": -28.681777954101562, "global_step": 636426, "epoch": 7667} {"train_loss": -28.736133575439453, "global_step": 636427, "epoch": 7667} {"train_loss": -28.57502555847168, "global_step": 636428, "epoch": 7667} {"train_loss": -28.310626983642578, "global_step": 636429, "epoch": 7667} {"train_loss": -28.102094650268555, "global_step": 636430, "epoch": 7667} {"train_loss": -28.111774444580078, "global_step": 636431, "epoch": 7667} {"train_loss": -28.535490036010742, "global_step": 636432, "epoch": 7667} {"train_loss": -28.962356567382812, "global_step": 636433, "epoch": 7667} {"train_loss": -28.07270622253418, "global_step": 636434, "epoch": 7667} {"train_loss": -28.38410758972168, "global_step": 636435, "epoch": 7667} {"train_loss": -28.29657554626465, "global_step": 636436, "epoch": 7667} {"train_loss": -27.64338493347168, "global_step": 636437, "epoch": 7667} {"train_loss": -26.569107055664062, "global_step": 636438, "epoch": 7667} {"train_loss": -24.429794311523438, "global_step": 636439, "epoch": 7667} {"train_loss": -25.619474411010742, "global_step": 636440, "epoch": 7667} {"train_loss": -27.731781005859375, "global_step": 636441, "epoch": 7667} {"train_loss": -27.15044593811035, "global_step": 636442, "epoch": 7667} {"train_loss": -27.964207476880176, "global_step": 636443, "epoch": 7667, "val_loss": 6711543.0} {"train_loss": -25.885482788085938, "global_step": 636444, "epoch": 7668} {"train_loss": -27.435739517211914, "global_step": 636445, "epoch": 7668} {"train_loss": -26.003034591674805, "global_step": 636446, "epoch": 7668} {"train_loss": -26.818326950073242, "global_step": 636447, "epoch": 7668} {"train_loss": -26.541797637939453, "global_step": 636448, "epoch": 7668} {"train_loss": -26.4575138092041, "global_step": 636449, "epoch": 7668} {"train_loss": -27.27266502380371, "global_step": 636450, "epoch": 7668} {"train_loss": -26.39627456665039, "global_step": 636451, "epoch": 7668} {"train_loss": -26.618833541870117, "global_step": 636452, "epoch": 7668} {"train_loss": -27.103357315063477, "global_step": 636453, "epoch": 7668} {"train_loss": -26.77176856994629, "global_step": 636454, "epoch": 7668} {"train_loss": -26.7076416015625, "global_step": 636455, "epoch": 7668} {"train_loss": -27.000349044799805, "global_step": 636456, "epoch": 7668} {"train_loss": -27.01318359375, "global_step": 636457, "epoch": 7668} {"train_loss": -26.934467315673828, "global_step": 636458, "epoch": 7668} {"train_loss": -27.232770919799805, "global_step": 636459, "epoch": 7668} {"train_loss": -27.174793243408203, "global_step": 636460, "epoch": 7668} {"train_loss": -26.98345375061035, "global_step": 636461, "epoch": 7668} {"train_loss": -27.550800323486328, "global_step": 636462, "epoch": 7668} {"train_loss": -27.27479362487793, "global_step": 636463, "epoch": 7668} {"train_loss": -27.60414695739746, "global_step": 636464, "epoch": 7668} {"train_loss": -27.564661026000977, "global_step": 636465, "epoch": 7668} {"train_loss": -27.67559242248535, "global_step": 636466, "epoch": 7668} {"train_loss": -27.7581729888916, "global_step": 636467, "epoch": 7668} {"train_loss": -27.735944747924805, "global_step": 636468, "epoch": 7668} {"train_loss": -27.555255889892578, "global_step": 636469, "epoch": 7668} {"train_loss": -27.600357055664062, "global_step": 636470, "epoch": 7668} {"train_loss": -28.0319766998291, "global_step": 636471, "epoch": 7668} {"train_loss": -27.5921573638916, "global_step": 636472, "epoch": 7668} {"train_loss": -27.75180435180664, "global_step": 636473, "epoch": 7668} {"train_loss": -27.760971069335938, "global_step": 636474, "epoch": 7668} {"train_loss": -27.7662410736084, "global_step": 636475, "epoch": 7668} {"train_loss": -27.918598175048828, "global_step": 636476, "epoch": 7668} {"train_loss": -27.9210205078125, "global_step": 636477, "epoch": 7668} {"train_loss": -27.90052604675293, "global_step": 636478, "epoch": 7668} {"train_loss": -27.76079750061035, "global_step": 636479, "epoch": 7668} {"train_loss": -27.958927154541016, "global_step": 636480, "epoch": 7668} {"train_loss": -27.878406524658203, "global_step": 636481, "epoch": 7668} {"train_loss": -28.302915573120117, "global_step": 636482, "epoch": 7668} {"train_loss": -28.14935302734375, "global_step": 636483, "epoch": 7668} {"train_loss": -28.139755249023438, "global_step": 636484, "epoch": 7668} {"train_loss": -28.37872886657715, "global_step": 636485, "epoch": 7668} {"train_loss": -28.292804718017578, "global_step": 636486, "epoch": 7668} {"train_loss": -28.3544864654541, "global_step": 636487, "epoch": 7668} {"train_loss": -28.350610733032227, "global_step": 636488, "epoch": 7668} {"train_loss": -28.17035484313965, "global_step": 636489, "epoch": 7668} {"train_loss": -28.21018409729004, "global_step": 636490, "epoch": 7668} {"train_loss": -28.383874893188477, "global_step": 636491, "epoch": 7668} {"train_loss": -28.48578453063965, "global_step": 636492, "epoch": 7668} {"train_loss": -28.05035972595215, "global_step": 636493, "epoch": 7668} {"train_loss": -28.28590202331543, "global_step": 636494, "epoch": 7668} {"train_loss": -28.135894775390625, "global_step": 636495, "epoch": 7668} {"train_loss": -28.357837677001953, "global_step": 636496, "epoch": 7668} {"train_loss": -28.358306884765625, "global_step": 636497, "epoch": 7668} {"train_loss": -28.397043228149414, "global_step": 636498, "epoch": 7668} {"train_loss": -28.12912368774414, "global_step": 636499, "epoch": 7668} {"train_loss": -28.425458908081055, "global_step": 636500, "epoch": 7668} {"train_loss": -28.512815475463867, "global_step": 636501, "epoch": 7668} {"train_loss": -28.01655387878418, "global_step": 636502, "epoch": 7668} {"train_loss": -28.593067169189453, "global_step": 636503, "epoch": 7668} {"train_loss": -28.138671875, "global_step": 636504, "epoch": 7668} {"train_loss": -28.434524536132812, "global_step": 636505, "epoch": 7668} {"train_loss": -28.366575241088867, "global_step": 636506, "epoch": 7668} {"train_loss": -28.400592803955078, "global_step": 636507, "epoch": 7668} {"train_loss": -28.21540641784668, "global_step": 636508, "epoch": 7668} {"train_loss": -28.4656982421875, "global_step": 636509, "epoch": 7668} {"train_loss": -28.55891990661621, "global_step": 636510, "epoch": 7668} {"train_loss": -29.01007080078125, "global_step": 636511, "epoch": 7668} {"train_loss": -28.3391056060791, "global_step": 636512, "epoch": 7668} {"train_loss": -28.548294067382812, "global_step": 636513, "epoch": 7668} {"train_loss": -28.10979652404785, "global_step": 636514, "epoch": 7668} {"train_loss": -28.78095054626465, "global_step": 636515, "epoch": 7668} {"train_loss": -28.622268676757812, "global_step": 636516, "epoch": 7668} {"train_loss": -28.300806045532227, "global_step": 636517, "epoch": 7668} {"train_loss": -28.42592430114746, "global_step": 636518, "epoch": 7668} {"train_loss": -27.939102172851562, "global_step": 636519, "epoch": 7668} {"train_loss": -27.7287654876709, "global_step": 636520, "epoch": 7668} {"train_loss": -28.1037540435791, "global_step": 636521, "epoch": 7668} {"train_loss": -28.272796630859375, "global_step": 636522, "epoch": 7668} {"train_loss": -28.04389762878418, "global_step": 636523, "epoch": 7668} {"train_loss": -28.366514205932617, "global_step": 636524, "epoch": 7668} {"train_loss": -28.221149444580078, "global_step": 636525, "epoch": 7668} {"train_loss": -27.842161546270532, "global_step": 636526, "epoch": 7668, "val_loss": 6743148.0} {"train_loss": -27.676788330078125, "global_step": 636527, "epoch": 7669} {"train_loss": -27.663938522338867, "global_step": 636528, "epoch": 7669} {"train_loss": -27.91364097595215, "global_step": 636529, "epoch": 7669} {"train_loss": -27.98490333557129, "global_step": 636530, "epoch": 7669} {"train_loss": -27.75751304626465, "global_step": 636531, "epoch": 7669} {"train_loss": -27.8111629486084, "global_step": 636532, "epoch": 7669} {"train_loss": -28.218048095703125, "global_step": 636533, "epoch": 7669} {"train_loss": -27.840106964111328, "global_step": 636534, "epoch": 7669} {"train_loss": -27.619449615478516, "global_step": 636535, "epoch": 7669} {"train_loss": -27.884180068969727, "global_step": 636536, "epoch": 7669} {"train_loss": -27.23457145690918, "global_step": 636537, "epoch": 7669} {"train_loss": -27.71255874633789, "global_step": 636538, "epoch": 7669} {"train_loss": -28.09665298461914, "global_step": 636539, "epoch": 7669} {"train_loss": -27.916738510131836, "global_step": 636540, "epoch": 7669} {"train_loss": -27.719806671142578, "global_step": 636541, "epoch": 7669} {"train_loss": -27.9741268157959, "global_step": 636542, "epoch": 7669} {"train_loss": -28.120330810546875, "global_step": 636543, "epoch": 7669} {"train_loss": -28.08831214904785, "global_step": 636544, "epoch": 7669} {"train_loss": -28.117345809936523, "global_step": 636545, "epoch": 7669} {"train_loss": -28.02643394470215, "global_step": 636546, "epoch": 7669} {"train_loss": -28.08699607849121, "global_step": 636547, "epoch": 7669} {"train_loss": -27.96925163269043, "global_step": 636548, "epoch": 7669} {"train_loss": -27.963239669799805, "global_step": 636549, "epoch": 7669} {"train_loss": -27.852930068969727, "global_step": 636550, "epoch": 7669} {"train_loss": -28.250782012939453, "global_step": 636551, "epoch": 7669} {"train_loss": -28.17823600769043, "global_step": 636552, "epoch": 7669} {"train_loss": -28.37552833557129, "global_step": 636553, "epoch": 7669} {"train_loss": -28.143634796142578, "global_step": 636554, "epoch": 7669} {"train_loss": -28.100299835205078, "global_step": 636555, "epoch": 7669} {"train_loss": -28.080078125, "global_step": 636556, "epoch": 7669} {"train_loss": -28.484954833984375, "global_step": 636557, "epoch": 7669} {"train_loss": -28.393035888671875, "global_step": 636558, "epoch": 7669} {"train_loss": -28.5021915435791, "global_step": 636559, "epoch": 7669} {"train_loss": -28.354278564453125, "global_step": 636560, "epoch": 7669} {"train_loss": -28.688461303710938, "global_step": 636561, "epoch": 7669} {"train_loss": -28.494739532470703, "global_step": 636562, "epoch": 7669} {"train_loss": -28.3724308013916, "global_step": 636563, "epoch": 7669} {"train_loss": -28.35610008239746, "global_step": 636564, "epoch": 7669} {"train_loss": -28.010101318359375, "global_step": 636565, "epoch": 7669} {"train_loss": -28.53046989440918, "global_step": 636566, "epoch": 7669} {"train_loss": -28.42409324645996, "global_step": 636567, "epoch": 7669} {"train_loss": -27.819623947143555, "global_step": 636568, "epoch": 7669} {"train_loss": -28.593769073486328, "global_step": 636569, "epoch": 7669} {"train_loss": -28.33045768737793, "global_step": 636570, "epoch": 7669} {"train_loss": -28.643646240234375, "global_step": 636571, "epoch": 7669} {"train_loss": -28.750818252563477, "global_step": 636572, "epoch": 7669} {"train_loss": -28.381977081298828, "global_step": 636573, "epoch": 7669} {"train_loss": -28.4034423828125, "global_step": 636574, "epoch": 7669} {"train_loss": -28.29144287109375, "global_step": 636575, "epoch": 7669} {"train_loss": -28.602521896362305, "global_step": 636576, "epoch": 7669} {"train_loss": -28.529584884643555, "global_step": 636577, "epoch": 7669} {"train_loss": -28.365026473999023, "global_step": 636578, "epoch": 7669} {"train_loss": -27.900434494018555, "global_step": 636579, "epoch": 7669} {"train_loss": -27.784940719604492, "global_step": 636580, "epoch": 7669} {"train_loss": -27.749792098999023, "global_step": 636581, "epoch": 7669} {"train_loss": -28.74012565612793, "global_step": 636582, "epoch": 7669} {"train_loss": -27.958581924438477, "global_step": 636583, "epoch": 7669} {"train_loss": -27.839466094970703, "global_step": 636584, "epoch": 7669} {"train_loss": -27.657703399658203, "global_step": 636585, "epoch": 7669} {"train_loss": -28.477766036987305, "global_step": 636586, "epoch": 7669} {"train_loss": -28.222488403320312, "global_step": 636587, "epoch": 7669} {"train_loss": -28.397581100463867, "global_step": 636588, "epoch": 7669} {"train_loss": -28.554025650024414, "global_step": 636589, "epoch": 7669} {"train_loss": -27.98709487915039, "global_step": 636590, "epoch": 7669} {"train_loss": -28.35626792907715, "global_step": 636591, "epoch": 7669} {"train_loss": -28.077472686767578, "global_step": 636592, "epoch": 7669} {"train_loss": -28.170942306518555, "global_step": 636593, "epoch": 7669} {"train_loss": -28.421405792236328, "global_step": 636594, "epoch": 7669} {"train_loss": -28.1187686920166, "global_step": 636595, "epoch": 7669} {"train_loss": -28.16168212890625, "global_step": 636596, "epoch": 7669} {"train_loss": -28.160409927368164, "global_step": 636597, "epoch": 7669} {"train_loss": -28.410070419311523, "global_step": 636598, "epoch": 7669} {"train_loss": -28.300336837768555, "global_step": 636599, "epoch": 7669} {"train_loss": -28.354944229125977, "global_step": 636600, "epoch": 7669} {"train_loss": -28.1378173828125, "global_step": 636601, "epoch": 7669} {"train_loss": -28.496540069580078, "global_step": 636602, "epoch": 7669} {"train_loss": -28.468402862548828, "global_step": 636603, "epoch": 7669} {"train_loss": -27.780048370361328, "global_step": 636604, "epoch": 7669} {"train_loss": -28.360137939453125, "global_step": 636605, "epoch": 7669} {"train_loss": -28.222822189331055, "global_step": 636606, "epoch": 7669} {"train_loss": -27.69635009765625, "global_step": 636607, "epoch": 7669} {"train_loss": -28.267200469970703, "global_step": 636608, "epoch": 7669} {"train_loss": -28.147120533219304, "global_step": 636609, "epoch": 7669, "val_loss": 6580718.0} {"train_loss": -26.18694496154785, "global_step": 636610, "epoch": 7670} {"train_loss": -26.33540153503418, "global_step": 636611, "epoch": 7670} {"train_loss": -26.625425338745117, "global_step": 636612, "epoch": 7670} {"train_loss": -26.986169815063477, "global_step": 636613, "epoch": 7670} {"train_loss": -26.82126235961914, "global_step": 636614, "epoch": 7670} {"train_loss": -26.133056640625, "global_step": 636615, "epoch": 7670} {"train_loss": -27.03179931640625, "global_step": 636616, "epoch": 7670} {"train_loss": -27.5625, "global_step": 636617, "epoch": 7670} {"train_loss": -26.585012435913086, "global_step": 636618, "epoch": 7670} {"train_loss": -27.384923934936523, "global_step": 636619, "epoch": 7670} {"train_loss": -27.28350830078125, "global_step": 636620, "epoch": 7670} {"train_loss": -27.204364776611328, "global_step": 636621, "epoch": 7670} {"train_loss": -27.43124771118164, "global_step": 636622, "epoch": 7670} {"train_loss": -27.112934112548828, "global_step": 636623, "epoch": 7670} {"train_loss": -27.684417724609375, "global_step": 636624, "epoch": 7670} {"train_loss": -27.148670196533203, "global_step": 636625, "epoch": 7670} {"train_loss": -27.7075252532959, "global_step": 636626, "epoch": 7670} {"train_loss": -27.5172176361084, "global_step": 636627, "epoch": 7670} {"train_loss": -27.63539695739746, "global_step": 636628, "epoch": 7670} {"train_loss": -27.53118324279785, "global_step": 636629, "epoch": 7670} {"train_loss": -27.3867130279541, "global_step": 636630, "epoch": 7670} {"train_loss": -27.54336929321289, "global_step": 636631, "epoch": 7670} {"train_loss": -27.677692413330078, "global_step": 636632, "epoch": 7670} {"train_loss": -27.50838279724121, "global_step": 636633, "epoch": 7670} {"train_loss": -27.497323989868164, "global_step": 636634, "epoch": 7670} {"train_loss": -27.8875732421875, "global_step": 636635, "epoch": 7670} {"train_loss": -27.711380004882812, "global_step": 636636, "epoch": 7670} {"train_loss": -28.134851455688477, "global_step": 636637, "epoch": 7670} {"train_loss": -27.934803009033203, "global_step": 636638, "epoch": 7670} {"train_loss": -28.111169815063477, "global_step": 636639, "epoch": 7670} {"train_loss": -27.795379638671875, "global_step": 636640, "epoch": 7670} {"train_loss": -27.90338134765625, "global_step": 636641, "epoch": 7670} {"train_loss": -28.13250732421875, "global_step": 636642, "epoch": 7670} {"train_loss": -27.84766960144043, "global_step": 636643, "epoch": 7670} {"train_loss": -28.454687118530273, "global_step": 636644, "epoch": 7670} {"train_loss": -27.813587188720703, "global_step": 636645, "epoch": 7670} {"train_loss": -27.828107833862305, "global_step": 636646, "epoch": 7670} {"train_loss": -28.27507972717285, "global_step": 636647, "epoch": 7670} {"train_loss": -28.264501571655273, "global_step": 636648, "epoch": 7670} {"train_loss": -28.47364616394043, "global_step": 636649, "epoch": 7670} {"train_loss": -28.283716201782227, "global_step": 636650, "epoch": 7670} {"train_loss": -28.31902503967285, "global_step": 636651, "epoch": 7670} {"train_loss": -27.62458610534668, "global_step": 636652, "epoch": 7670} {"train_loss": -28.051624298095703, "global_step": 636653, "epoch": 7670} {"train_loss": -28.328643798828125, "global_step": 636654, "epoch": 7670} {"train_loss": -27.900083541870117, "global_step": 636655, "epoch": 7670} {"train_loss": -28.0296688079834, "global_step": 636656, "epoch": 7670} {"train_loss": -28.01295280456543, "global_step": 636657, "epoch": 7670} {"train_loss": -28.100736618041992, "global_step": 636658, "epoch": 7670} {"train_loss": -28.38093376159668, "global_step": 636659, "epoch": 7670} {"train_loss": -28.15631675720215, "global_step": 636660, "epoch": 7670} {"train_loss": -27.89930534362793, "global_step": 636661, "epoch": 7670} {"train_loss": -28.3029727935791, "global_step": 636662, "epoch": 7670} {"train_loss": -28.24403190612793, "global_step": 636663, "epoch": 7670} {"train_loss": -28.5766544342041, "global_step": 636664, "epoch": 7670} {"train_loss": -28.342575073242188, "global_step": 636665, "epoch": 7670} {"train_loss": -28.128705978393555, "global_step": 636666, "epoch": 7670} {"train_loss": -28.60589027404785, "global_step": 636667, "epoch": 7670} {"train_loss": -28.211170196533203, "global_step": 636668, "epoch": 7670} {"train_loss": -28.64979362487793, "global_step": 636669, "epoch": 7670} {"train_loss": -28.258703231811523, "global_step": 636670, "epoch": 7670} {"train_loss": -28.4815616607666, "global_step": 636671, "epoch": 7670} {"train_loss": -28.6063232421875, "global_step": 636672, "epoch": 7670} {"train_loss": -28.271543502807617, "global_step": 636673, "epoch": 7670} {"train_loss": -28.3194522857666, "global_step": 636674, "epoch": 7670} {"train_loss": -28.595624923706055, "global_step": 636675, "epoch": 7670} {"train_loss": -28.23372459411621, "global_step": 636676, "epoch": 7670} {"train_loss": -28.81711196899414, "global_step": 636677, "epoch": 7670} {"train_loss": -28.1107120513916, "global_step": 636678, "epoch": 7670} {"train_loss": -28.595783233642578, "global_step": 636679, "epoch": 7670} {"train_loss": -28.0839900970459, "global_step": 636680, "epoch": 7670} {"train_loss": -28.198352813720703, "global_step": 636681, "epoch": 7670} {"train_loss": -28.40253257751465, "global_step": 636682, "epoch": 7670} {"train_loss": -28.069379806518555, "global_step": 636683, "epoch": 7670} {"train_loss": -28.08063316345215, "global_step": 636684, "epoch": 7670} {"train_loss": -28.353025436401367, "global_step": 636685, "epoch": 7670} {"train_loss": -27.81355857849121, "global_step": 636686, "epoch": 7670} {"train_loss": -28.424036026000977, "global_step": 636687, "epoch": 7670} {"train_loss": -28.381757736206055, "global_step": 636688, "epoch": 7670} {"train_loss": -27.666488647460938, "global_step": 636689, "epoch": 7670} {"train_loss": -27.758041381835938, "global_step": 636690, "epoch": 7670} {"train_loss": -27.86374855041504, "global_step": 636691, "epoch": 7670} {"train_loss": -27.871482987001716, "global_step": 636692, "epoch": 7670, "val_loss": 6746430.0} {"train_loss": -27.97930908203125, "global_step": 636693, "epoch": 7671} {"train_loss": -27.241180419921875, "global_step": 636694, "epoch": 7671} {"train_loss": -26.977676391601562, "global_step": 636695, "epoch": 7671} {"train_loss": -27.150903701782227, "global_step": 636696, "epoch": 7671} {"train_loss": -27.61746597290039, "global_step": 636697, "epoch": 7671} {"train_loss": -28.137617111206055, "global_step": 636698, "epoch": 7671} {"train_loss": -27.778104782104492, "global_step": 636699, "epoch": 7671} {"train_loss": -27.643957138061523, "global_step": 636700, "epoch": 7671} {"train_loss": -27.938138961791992, "global_step": 636701, "epoch": 7671} {"train_loss": -28.026458740234375, "global_step": 636702, "epoch": 7671} {"train_loss": -27.875288009643555, "global_step": 636703, "epoch": 7671} {"train_loss": -28.276142120361328, "global_step": 636704, "epoch": 7671} {"train_loss": -27.97456169128418, "global_step": 636705, "epoch": 7671} {"train_loss": -28.019250869750977, "global_step": 636706, "epoch": 7671} {"train_loss": -27.961578369140625, "global_step": 636707, "epoch": 7671} {"train_loss": -28.139806747436523, "global_step": 636708, "epoch": 7671} {"train_loss": -27.953664779663086, "global_step": 636709, "epoch": 7671} {"train_loss": -27.968387603759766, "global_step": 636710, "epoch": 7671} {"train_loss": -27.834333419799805, "global_step": 636711, "epoch": 7671} {"train_loss": -27.9451904296875, "global_step": 636712, "epoch": 7671} {"train_loss": -28.2645206451416, "global_step": 636713, "epoch": 7671} {"train_loss": -28.264623641967773, "global_step": 636714, "epoch": 7671} {"train_loss": -28.268869400024414, "global_step": 636715, "epoch": 7671} {"train_loss": -27.9404239654541, "global_step": 636716, "epoch": 7671} {"train_loss": -28.230499267578125, "global_step": 636717, "epoch": 7671} {"train_loss": -28.24560546875, "global_step": 636718, "epoch": 7671} {"train_loss": -28.41357421875, "global_step": 636719, "epoch": 7671} {"train_loss": -28.110233306884766, "global_step": 636720, "epoch": 7671} {"train_loss": -28.586933135986328, "global_step": 636721, "epoch": 7671} {"train_loss": -28.400556564331055, "global_step": 636722, "epoch": 7671} {"train_loss": -28.111469268798828, "global_step": 636723, "epoch": 7671} {"train_loss": -28.135730743408203, "global_step": 636724, "epoch": 7671} {"train_loss": -28.46366310119629, "global_step": 636725, "epoch": 7671} {"train_loss": -28.18645668029785, "global_step": 636726, "epoch": 7671} {"train_loss": -27.991605758666992, "global_step": 636727, "epoch": 7671} {"train_loss": -28.202472686767578, "global_step": 636728, "epoch": 7671} {"train_loss": -28.267704010009766, "global_step": 636729, "epoch": 7671} {"train_loss": -28.08380699157715, "global_step": 636730, "epoch": 7671} {"train_loss": -28.46005630493164, "global_step": 636731, "epoch": 7671} {"train_loss": -28.00864601135254, "global_step": 636732, "epoch": 7671} {"train_loss": -28.245702743530273, "global_step": 636733, "epoch": 7671} {"train_loss": -28.312397003173828, "global_step": 636734, "epoch": 7671} {"train_loss": -28.223846435546875, "global_step": 636735, "epoch": 7671} {"train_loss": -27.83017921447754, "global_step": 636736, "epoch": 7671} {"train_loss": -27.74462890625, "global_step": 636737, "epoch": 7671} {"train_loss": -28.30010414123535, "global_step": 636738, "epoch": 7671} {"train_loss": -28.1145076751709, "global_step": 636739, "epoch": 7671} {"train_loss": -27.64448356628418, "global_step": 636740, "epoch": 7671} {"train_loss": -28.433364868164062, "global_step": 636741, "epoch": 7671} {"train_loss": -27.976133346557617, "global_step": 636742, "epoch": 7671} {"train_loss": -27.693256378173828, "global_step": 636743, "epoch": 7671} {"train_loss": -27.918701171875, "global_step": 636744, "epoch": 7671} {"train_loss": -27.881183624267578, "global_step": 636745, "epoch": 7671} {"train_loss": -27.703601837158203, "global_step": 636746, "epoch": 7671} {"train_loss": -27.868249893188477, "global_step": 636747, "epoch": 7671} {"train_loss": -28.271224975585938, "global_step": 636748, "epoch": 7671} {"train_loss": -27.835861206054688, "global_step": 636749, "epoch": 7671} {"train_loss": -27.72287940979004, "global_step": 636750, "epoch": 7671} {"train_loss": -28.00581169128418, "global_step": 636751, "epoch": 7671} {"train_loss": -28.64599609375, "global_step": 636752, "epoch": 7671} {"train_loss": -27.784835815429688, "global_step": 636753, "epoch": 7671} {"train_loss": -28.27186393737793, "global_step": 636754, "epoch": 7671} {"train_loss": -28.132740020751953, "global_step": 636755, "epoch": 7671} {"train_loss": -28.24860954284668, "global_step": 636756, "epoch": 7671} {"train_loss": -27.71014404296875, "global_step": 636757, "epoch": 7671} {"train_loss": -28.286428451538086, "global_step": 636758, "epoch": 7671} {"train_loss": -28.211654663085938, "global_step": 636759, "epoch": 7671} {"train_loss": -28.429895401000977, "global_step": 636760, "epoch": 7671} {"train_loss": -28.04300880432129, "global_step": 636761, "epoch": 7671} {"train_loss": -28.143939971923828, "global_step": 636762, "epoch": 7671} {"train_loss": -28.39501953125, "global_step": 636763, "epoch": 7671} {"train_loss": -27.971357345581055, "global_step": 636764, "epoch": 7671} {"train_loss": -28.153125762939453, "global_step": 636765, "epoch": 7671} {"train_loss": -27.834020614624023, "global_step": 636766, "epoch": 7671} {"train_loss": -27.532550811767578, "global_step": 636767, "epoch": 7671} {"train_loss": -27.625110626220703, "global_step": 636768, "epoch": 7671} {"train_loss": -28.486541748046875, "global_step": 636769, "epoch": 7671} {"train_loss": -27.923437118530273, "global_step": 636770, "epoch": 7671} {"train_loss": -28.199426651000977, "global_step": 636771, "epoch": 7671} {"train_loss": -27.84183692932129, "global_step": 636772, "epoch": 7671} {"train_loss": -28.146039962768555, "global_step": 636773, "epoch": 7671} {"train_loss": -28.229196548461914, "global_step": 636774, "epoch": 7671} {"train_loss": -28.03904554068324, "global_step": 636775, "epoch": 7671, "val_loss": 6651907.0} {"train_loss": -26.781599044799805, "global_step": 636776, "epoch": 7672} {"train_loss": -27.532804489135742, "global_step": 636777, "epoch": 7672} {"train_loss": -26.703659057617188, "global_step": 636778, "epoch": 7672} {"train_loss": -27.707294464111328, "global_step": 636779, "epoch": 7672} {"train_loss": -26.741973876953125, "global_step": 636780, "epoch": 7672} {"train_loss": -27.203561782836914, "global_step": 636781, "epoch": 7672} {"train_loss": -26.907855987548828, "global_step": 636782, "epoch": 7672} {"train_loss": -28.14255142211914, "global_step": 636783, "epoch": 7672} {"train_loss": -27.22477149963379, "global_step": 636784, "epoch": 7672} {"train_loss": -27.679595947265625, "global_step": 636785, "epoch": 7672} {"train_loss": -27.553104400634766, "global_step": 636786, "epoch": 7672} {"train_loss": -27.688337326049805, "global_step": 636787, "epoch": 7672} {"train_loss": -28.32771110534668, "global_step": 636788, "epoch": 7672} {"train_loss": -27.628326416015625, "global_step": 636789, "epoch": 7672} {"train_loss": -27.389745712280273, "global_step": 636790, "epoch": 7672} {"train_loss": -27.94484519958496, "global_step": 636791, "epoch": 7672} {"train_loss": -27.822980880737305, "global_step": 636792, "epoch": 7672} {"train_loss": -27.993057250976562, "global_step": 636793, "epoch": 7672} {"train_loss": -27.704666137695312, "global_step": 636794, "epoch": 7672} {"train_loss": -28.1367130279541, "global_step": 636795, "epoch": 7672} {"train_loss": -27.60628318786621, "global_step": 636796, "epoch": 7672} {"train_loss": -27.6278076171875, "global_step": 636797, "epoch": 7672} {"train_loss": -27.965301513671875, "global_step": 636798, "epoch": 7672} {"train_loss": -27.724609375, "global_step": 636799, "epoch": 7672} {"train_loss": -28.071319580078125, "global_step": 636800, "epoch": 7672} {"train_loss": -28.389225006103516, "global_step": 636801, "epoch": 7672} {"train_loss": -27.999563217163086, "global_step": 636802, "epoch": 7672} {"train_loss": -27.88970947265625, "global_step": 636803, "epoch": 7672} {"train_loss": -28.176633834838867, "global_step": 636804, "epoch": 7672} {"train_loss": -27.916677474975586, "global_step": 636805, "epoch": 7672} {"train_loss": -27.9824275970459, "global_step": 636806, "epoch": 7672} {"train_loss": -28.070953369140625, "global_step": 636807, "epoch": 7672} {"train_loss": -28.141693115234375, "global_step": 636808, "epoch": 7672} {"train_loss": -28.041580200195312, "global_step": 636809, "epoch": 7672} {"train_loss": -28.2756290435791, "global_step": 636810, "epoch": 7672} {"train_loss": -28.28256607055664, "global_step": 636811, "epoch": 7672} {"train_loss": -28.166229248046875, "global_step": 636812, "epoch": 7672} {"train_loss": -28.093713760375977, "global_step": 636813, "epoch": 7672} {"train_loss": -28.438135147094727, "global_step": 636814, "epoch": 7672} {"train_loss": -27.978132247924805, "global_step": 636815, "epoch": 7672} {"train_loss": -28.329992294311523, "global_step": 636816, "epoch": 7672} {"train_loss": -28.49976921081543, "global_step": 636817, "epoch": 7672} {"train_loss": -28.25709342956543, "global_step": 636818, "epoch": 7672} {"train_loss": -28.091602325439453, "global_step": 636819, "epoch": 7672} {"train_loss": -28.112171173095703, "global_step": 636820, "epoch": 7672} {"train_loss": -28.355560302734375, "global_step": 636821, "epoch": 7672} {"train_loss": -28.56184196472168, "global_step": 636822, "epoch": 7672} {"train_loss": -28.539525985717773, "global_step": 636823, "epoch": 7672} {"train_loss": -28.481969833374023, "global_step": 636824, "epoch": 7672} {"train_loss": -28.42230224609375, "global_step": 636825, "epoch": 7672} {"train_loss": -28.141571044921875, "global_step": 636826, "epoch": 7672} {"train_loss": -28.60359764099121, "global_step": 636827, "epoch": 7672} {"train_loss": -28.526350021362305, "global_step": 636828, "epoch": 7672} {"train_loss": -28.004623413085938, "global_step": 636829, "epoch": 7672} {"train_loss": -28.282562255859375, "global_step": 636830, "epoch": 7672} {"train_loss": -28.518003463745117, "global_step": 636831, "epoch": 7672} {"train_loss": -28.39301872253418, "global_step": 636832, "epoch": 7672} {"train_loss": -28.385244369506836, "global_step": 636833, "epoch": 7672} {"train_loss": -27.957300186157227, "global_step": 636834, "epoch": 7672} {"train_loss": -27.74190330505371, "global_step": 636835, "epoch": 7672} {"train_loss": -28.062280654907227, "global_step": 636836, "epoch": 7672} {"train_loss": -28.21051597595215, "global_step": 636837, "epoch": 7672} {"train_loss": -28.084964752197266, "global_step": 636838, "epoch": 7672} {"train_loss": -28.431562423706055, "global_step": 636839, "epoch": 7672} {"train_loss": -28.374792098999023, "global_step": 636840, "epoch": 7672} {"train_loss": -28.354944229125977, "global_step": 636841, "epoch": 7672} {"train_loss": -28.620798110961914, "global_step": 636842, "epoch": 7672} {"train_loss": -27.73343849182129, "global_step": 636843, "epoch": 7672} {"train_loss": -28.172306060791016, "global_step": 636844, "epoch": 7672} {"train_loss": -28.27042579650879, "global_step": 636845, "epoch": 7672} {"train_loss": -28.07437515258789, "global_step": 636846, "epoch": 7672} {"train_loss": -27.9533748626709, "global_step": 636847, "epoch": 7672} {"train_loss": -28.381977081298828, "global_step": 636848, "epoch": 7672} {"train_loss": -28.29558753967285, "global_step": 636849, "epoch": 7672} {"train_loss": -28.41847038269043, "global_step": 636850, "epoch": 7672} {"train_loss": -28.316925048828125, "global_step": 636851, "epoch": 7672} {"train_loss": -28.740238189697266, "global_step": 636852, "epoch": 7672} {"train_loss": -28.17098045349121, "global_step": 636853, "epoch": 7672} {"train_loss": -28.602249145507812, "global_step": 636854, "epoch": 7672} {"train_loss": -28.14179039001465, "global_step": 636855, "epoch": 7672} {"train_loss": -28.44721031188965, "global_step": 636856, "epoch": 7672} {"train_loss": -28.520849227905273, "global_step": 636857, "epoch": 7672} {"train_loss": -28.044195267091315, "global_step": 636858, "epoch": 7672, "val_loss": 6637093.0} {"train_loss": -27.800424575805664, "global_step": 636859, "epoch": 7673} {"train_loss": -26.512699127197266, "global_step": 636860, "epoch": 7673} {"train_loss": -26.287841796875, "global_step": 636861, "epoch": 7673} {"train_loss": -27.578815460205078, "global_step": 636862, "epoch": 7673} {"train_loss": -26.577634811401367, "global_step": 636863, "epoch": 7673} {"train_loss": -27.281286239624023, "global_step": 636864, "epoch": 7673} {"train_loss": -26.881994247436523, "global_step": 636865, "epoch": 7673} {"train_loss": -27.2012939453125, "global_step": 636866, "epoch": 7673} {"train_loss": -27.6488094329834, "global_step": 636867, "epoch": 7673} {"train_loss": -26.955732345581055, "global_step": 636868, "epoch": 7673} {"train_loss": -27.290637969970703, "global_step": 636869, "epoch": 7673} {"train_loss": -27.54938316345215, "global_step": 636870, "epoch": 7673} {"train_loss": -27.618017196655273, "global_step": 636871, "epoch": 7673} {"train_loss": -27.56717872619629, "global_step": 636872, "epoch": 7673} {"train_loss": -28.120574951171875, "global_step": 636873, "epoch": 7673} {"train_loss": -27.44256591796875, "global_step": 636874, "epoch": 7673} {"train_loss": -27.589521408081055, "global_step": 636875, "epoch": 7673} {"train_loss": -27.568395614624023, "global_step": 636876, "epoch": 7673} {"train_loss": -27.65933609008789, "global_step": 636877, "epoch": 7673} {"train_loss": -27.7985782623291, "global_step": 636878, "epoch": 7673} {"train_loss": -27.689712524414062, "global_step": 636879, "epoch": 7673} {"train_loss": -28.222623825073242, "global_step": 636880, "epoch": 7673} {"train_loss": -27.987096786499023, "global_step": 636881, "epoch": 7673} {"train_loss": -27.927335739135742, "global_step": 636882, "epoch": 7673} {"train_loss": -27.88789176940918, "global_step": 636883, "epoch": 7673} {"train_loss": -27.9029483795166, "global_step": 636884, "epoch": 7673} {"train_loss": -27.85550308227539, "global_step": 636885, "epoch": 7673} {"train_loss": -28.019794464111328, "global_step": 636886, "epoch": 7673} {"train_loss": -28.07887840270996, "global_step": 636887, "epoch": 7673} {"train_loss": -28.160694122314453, "global_step": 636888, "epoch": 7673} {"train_loss": -28.27752113342285, "global_step": 636889, "epoch": 7673} {"train_loss": -27.91377830505371, "global_step": 636890, "epoch": 7673} {"train_loss": -28.326406478881836, "global_step": 636891, "epoch": 7673} {"train_loss": -28.17511558532715, "global_step": 636892, "epoch": 7673} {"train_loss": -28.397571563720703, "global_step": 636893, "epoch": 7673} {"train_loss": -28.13895034790039, "global_step": 636894, "epoch": 7673} {"train_loss": -28.101978302001953, "global_step": 636895, "epoch": 7673} {"train_loss": -28.322662353515625, "global_step": 636896, "epoch": 7673} {"train_loss": -28.292953491210938, "global_step": 636897, "epoch": 7673} {"train_loss": -28.299795150756836, "global_step": 636898, "epoch": 7673} {"train_loss": -28.608877182006836, "global_step": 636899, "epoch": 7673} {"train_loss": -28.453699111938477, "global_step": 636900, "epoch": 7673} {"train_loss": -28.079389572143555, "global_step": 636901, "epoch": 7673} {"train_loss": -27.8778076171875, "global_step": 636902, "epoch": 7673} {"train_loss": -28.150659561157227, "global_step": 636903, "epoch": 7673} {"train_loss": -27.783838272094727, "global_step": 636904, "epoch": 7673} {"train_loss": -27.952356338500977, "global_step": 636905, "epoch": 7673} {"train_loss": -28.24521255493164, "global_step": 636906, "epoch": 7673} {"train_loss": -28.64606285095215, "global_step": 636907, "epoch": 7673} {"train_loss": -28.660337448120117, "global_step": 636908, "epoch": 7673} {"train_loss": -28.49380874633789, "global_step": 636909, "epoch": 7673} {"train_loss": -28.338546752929688, "global_step": 636910, "epoch": 7673} {"train_loss": -27.9862060546875, "global_step": 636911, "epoch": 7673} {"train_loss": -28.463134765625, "global_step": 636912, "epoch": 7673} {"train_loss": -28.1119384765625, "global_step": 636913, "epoch": 7673} {"train_loss": -28.5174560546875, "global_step": 636914, "epoch": 7673} {"train_loss": -28.567468643188477, "global_step": 636915, "epoch": 7673} {"train_loss": -28.04829216003418, "global_step": 636916, "epoch": 7673} {"train_loss": -28.168731689453125, "global_step": 636917, "epoch": 7673} {"train_loss": -28.23700523376465, "global_step": 636918, "epoch": 7673} {"train_loss": -28.161550521850586, "global_step": 636919, "epoch": 7673} {"train_loss": -27.906774520874023, "global_step": 636920, "epoch": 7673} {"train_loss": -28.381513595581055, "global_step": 636921, "epoch": 7673} {"train_loss": -28.535688400268555, "global_step": 636922, "epoch": 7673} {"train_loss": -27.930744171142578, "global_step": 636923, "epoch": 7673} {"train_loss": -28.41183853149414, "global_step": 636924, "epoch": 7673} {"train_loss": -28.666065216064453, "global_step": 636925, "epoch": 7673} {"train_loss": -27.925079345703125, "global_step": 636926, "epoch": 7673} {"train_loss": -28.012439727783203, "global_step": 636927, "epoch": 7673} {"train_loss": -28.117130279541016, "global_step": 636928, "epoch": 7673} {"train_loss": -27.73225975036621, "global_step": 636929, "epoch": 7673} {"train_loss": -27.7856388092041, "global_step": 636930, "epoch": 7673} {"train_loss": -27.9008846282959, "global_step": 636931, "epoch": 7673} {"train_loss": -28.134342193603516, "global_step": 636932, "epoch": 7673} {"train_loss": -28.5643253326416, "global_step": 636933, "epoch": 7673} {"train_loss": -28.43706703186035, "global_step": 636934, "epoch": 7673} {"train_loss": -28.06717872619629, "global_step": 636935, "epoch": 7673} {"train_loss": -28.339826583862305, "global_step": 636936, "epoch": 7673} {"train_loss": -28.099964141845703, "global_step": 636937, "epoch": 7673} {"train_loss": -28.232446670532227, "global_step": 636938, "epoch": 7673} {"train_loss": -28.15268898010254, "global_step": 636939, "epoch": 7673} {"train_loss": -28.1126766204834, "global_step": 636940, "epoch": 7673} {"train_loss": -27.967469962246447, "global_step": 636941, "epoch": 7673, "val_loss": 6668722.5} {"train_loss": -27.923742294311523, "global_step": 636942, "epoch": 7674} {"train_loss": -27.55169677734375, "global_step": 636943, "epoch": 7674} {"train_loss": -28.16684341430664, "global_step": 636944, "epoch": 7674} {"train_loss": -27.268478393554688, "global_step": 636945, "epoch": 7674} {"train_loss": -27.49483299255371, "global_step": 636946, "epoch": 7674} {"train_loss": -27.5959529876709, "global_step": 636947, "epoch": 7674} {"train_loss": -27.512067794799805, "global_step": 636948, "epoch": 7674} {"train_loss": -27.819162368774414, "global_step": 636949, "epoch": 7674} {"train_loss": -27.975576400756836, "global_step": 636950, "epoch": 7674} {"train_loss": -27.780704498291016, "global_step": 636951, "epoch": 7674} {"train_loss": -27.625329971313477, "global_step": 636952, "epoch": 7674} {"train_loss": -27.87493896484375, "global_step": 636953, "epoch": 7674} {"train_loss": -27.680036544799805, "global_step": 636954, "epoch": 7674} {"train_loss": -27.88495445251465, "global_step": 636955, "epoch": 7674} {"train_loss": -28.19610595703125, "global_step": 636956, "epoch": 7674} {"train_loss": -27.877466201782227, "global_step": 636957, "epoch": 7674} {"train_loss": -27.726947784423828, "global_step": 636958, "epoch": 7674} {"train_loss": -28.225696563720703, "global_step": 636959, "epoch": 7674} {"train_loss": -28.0332088470459, "global_step": 636960, "epoch": 7674} {"train_loss": -28.21660804748535, "global_step": 636961, "epoch": 7674} {"train_loss": -27.995609283447266, "global_step": 636962, "epoch": 7674} {"train_loss": -28.364892959594727, "global_step": 636963, "epoch": 7674} {"train_loss": -28.188262939453125, "global_step": 636964, "epoch": 7674} {"train_loss": -28.137189865112305, "global_step": 636965, "epoch": 7674} {"train_loss": -28.051549911499023, "global_step": 636966, "epoch": 7674} {"train_loss": -28.326135635375977, "global_step": 636967, "epoch": 7674} {"train_loss": -28.018695831298828, "global_step": 636968, "epoch": 7674} {"train_loss": -28.072668075561523, "global_step": 636969, "epoch": 7674} {"train_loss": -28.095783233642578, "global_step": 636970, "epoch": 7674} {"train_loss": -28.2194881439209, "global_step": 636971, "epoch": 7674} {"train_loss": -28.2737979888916, "global_step": 636972, "epoch": 7674} {"train_loss": -28.18328285217285, "global_step": 636973, "epoch": 7674} {"train_loss": -28.4312801361084, "global_step": 636974, "epoch": 7674} {"train_loss": -27.90293312072754, "global_step": 636975, "epoch": 7674} {"train_loss": -28.186843872070312, "global_step": 636976, "epoch": 7674} {"train_loss": -28.179248809814453, "global_step": 636977, "epoch": 7674} {"train_loss": -27.956884384155273, "global_step": 636978, "epoch": 7674} {"train_loss": -28.15620231628418, "global_step": 636979, "epoch": 7674} {"train_loss": -28.144556045532227, "global_step": 636980, "epoch": 7674} {"train_loss": -28.11579704284668, "global_step": 636981, "epoch": 7674} {"train_loss": -28.05988883972168, "global_step": 636982, "epoch": 7674} {"train_loss": -28.404748916625977, "global_step": 636983, "epoch": 7674} {"train_loss": -28.53901481628418, "global_step": 636984, "epoch": 7674} {"train_loss": -28.11223793029785, "global_step": 636985, "epoch": 7674} {"train_loss": -28.62957763671875, "global_step": 636986, "epoch": 7674} {"train_loss": -28.390302658081055, "global_step": 636987, "epoch": 7674} {"train_loss": -28.117673873901367, "global_step": 636988, "epoch": 7674} {"train_loss": -28.01894187927246, "global_step": 636989, "epoch": 7674} {"train_loss": -28.454309463500977, "global_step": 636990, "epoch": 7674} {"train_loss": -28.594409942626953, "global_step": 636991, "epoch": 7674} {"train_loss": -28.14530372619629, "global_step": 636992, "epoch": 7674} {"train_loss": -28.473846435546875, "global_step": 636993, "epoch": 7674} {"train_loss": -28.00882911682129, "global_step": 636994, "epoch": 7674} {"train_loss": -28.4586181640625, "global_step": 636995, "epoch": 7674} {"train_loss": -28.421926498413086, "global_step": 636996, "epoch": 7674} {"train_loss": -28.4089412689209, "global_step": 636997, "epoch": 7674} {"train_loss": -28.334644317626953, "global_step": 636998, "epoch": 7674} {"train_loss": -27.978612899780273, "global_step": 636999, "epoch": 7674} {"train_loss": -28.29011344909668, "global_step": 637000, "epoch": 7674} {"train_loss": -28.514616012573242, "global_step": 637001, "epoch": 7674} {"train_loss": -28.43998146057129, "global_step": 637002, "epoch": 7674} {"train_loss": -28.212207794189453, "global_step": 637003, "epoch": 7674} {"train_loss": -28.181354522705078, "global_step": 637004, "epoch": 7674} {"train_loss": -28.256101608276367, "global_step": 637005, "epoch": 7674} {"train_loss": -28.363372802734375, "global_step": 637006, "epoch": 7674} {"train_loss": -28.383880615234375, "global_step": 637007, "epoch": 7674} {"train_loss": -28.35184669494629, "global_step": 637008, "epoch": 7674} {"train_loss": -28.538471221923828, "global_step": 637009, "epoch": 7674} {"train_loss": -28.049890518188477, "global_step": 637010, "epoch": 7674} {"train_loss": -28.19598960876465, "global_step": 637011, "epoch": 7674} {"train_loss": -28.21211814880371, "global_step": 637012, "epoch": 7674} {"train_loss": -28.404932022094727, "global_step": 637013, "epoch": 7674} {"train_loss": -28.09132194519043, "global_step": 637014, "epoch": 7674} {"train_loss": -28.36638832092285, "global_step": 637015, "epoch": 7674} {"train_loss": -28.34827995300293, "global_step": 637016, "epoch": 7674} {"train_loss": -28.225372314453125, "global_step": 637017, "epoch": 7674} {"train_loss": -28.305490493774414, "global_step": 637018, "epoch": 7674} {"train_loss": -28.00831413269043, "global_step": 637019, "epoch": 7674} {"train_loss": -28.03914451599121, "global_step": 637020, "epoch": 7674} {"train_loss": -28.07575035095215, "global_step": 637021, "epoch": 7674} {"train_loss": -28.290271759033203, "global_step": 637022, "epoch": 7674} {"train_loss": -28.33387565612793, "global_step": 637023, "epoch": 7674} {"train_loss": -28.139716780329326, "global_step": 637024, "epoch": 7674, "val_loss": 6602623.0} {"train_loss": -27.2341251373291, "global_step": 637025, "epoch": 7675} {"train_loss": -25.815595626831055, "global_step": 637026, "epoch": 7675} {"train_loss": -25.218765258789062, "global_step": 637027, "epoch": 7675} {"train_loss": -27.21579360961914, "global_step": 637028, "epoch": 7675} {"train_loss": -27.490991592407227, "global_step": 637029, "epoch": 7675} {"train_loss": -26.39276695251465, "global_step": 637030, "epoch": 7675} {"train_loss": -27.254901885986328, "global_step": 637031, "epoch": 7675} {"train_loss": -27.845306396484375, "global_step": 637032, "epoch": 7675} {"train_loss": -27.1915283203125, "global_step": 637033, "epoch": 7675} {"train_loss": -27.704038619995117, "global_step": 637034, "epoch": 7675} {"train_loss": -27.600555419921875, "global_step": 637035, "epoch": 7675} {"train_loss": -27.253332138061523, "global_step": 637036, "epoch": 7675} {"train_loss": -27.667621612548828, "global_step": 637037, "epoch": 7675} {"train_loss": -27.650970458984375, "global_step": 637038, "epoch": 7675} {"train_loss": -27.95313835144043, "global_step": 637039, "epoch": 7675} {"train_loss": -27.938587188720703, "global_step": 637040, "epoch": 7675} {"train_loss": -27.641143798828125, "global_step": 637041, "epoch": 7675} {"train_loss": -27.738327026367188, "global_step": 637042, "epoch": 7675} {"train_loss": -28.245223999023438, "global_step": 637043, "epoch": 7675} {"train_loss": -28.030378341674805, "global_step": 637044, "epoch": 7675} {"train_loss": -27.91945457458496, "global_step": 637045, "epoch": 7675} {"train_loss": -28.0048828125, "global_step": 637046, "epoch": 7675} {"train_loss": -28.10865592956543, "global_step": 637047, "epoch": 7675} {"train_loss": -27.97199821472168, "global_step": 637048, "epoch": 7675} {"train_loss": -27.550155639648438, "global_step": 637049, "epoch": 7675} {"train_loss": -27.6369571685791, "global_step": 637050, "epoch": 7675} {"train_loss": -28.289569854736328, "global_step": 637051, "epoch": 7675} {"train_loss": -27.8027286529541, "global_step": 637052, "epoch": 7675} {"train_loss": -28.104597091674805, "global_step": 637053, "epoch": 7675} {"train_loss": -28.15595054626465, "global_step": 637054, "epoch": 7675} {"train_loss": -28.103824615478516, "global_step": 637055, "epoch": 7675} {"train_loss": -28.246850967407227, "global_step": 637056, "epoch": 7675} {"train_loss": -28.21034812927246, "global_step": 637057, "epoch": 7675} {"train_loss": -27.79542350769043, "global_step": 637058, "epoch": 7675} {"train_loss": -28.25457191467285, "global_step": 637059, "epoch": 7675} {"train_loss": -28.375593185424805, "global_step": 637060, "epoch": 7675} {"train_loss": -27.932025909423828, "global_step": 637061, "epoch": 7675} {"train_loss": -28.35231590270996, "global_step": 637062, "epoch": 7675} {"train_loss": -28.256479263305664, "global_step": 637063, "epoch": 7675} {"train_loss": -28.065509796142578, "global_step": 637064, "epoch": 7675} {"train_loss": -28.156909942626953, "global_step": 637065, "epoch": 7675} {"train_loss": -28.2117919921875, "global_step": 637066, "epoch": 7675} {"train_loss": -28.100000381469727, "global_step": 637067, "epoch": 7675} {"train_loss": -27.9891414642334, "global_step": 637068, "epoch": 7675} {"train_loss": -28.56591796875, "global_step": 637069, "epoch": 7675} {"train_loss": -28.476362228393555, "global_step": 637070, "epoch": 7675} {"train_loss": -28.534351348876953, "global_step": 637071, "epoch": 7675} {"train_loss": -28.5877685546875, "global_step": 637072, "epoch": 7675} {"train_loss": -28.334028244018555, "global_step": 637073, "epoch": 7675} {"train_loss": -28.107980728149414, "global_step": 637074, "epoch": 7675} {"train_loss": -28.542997360229492, "global_step": 637075, "epoch": 7675} {"train_loss": -28.619140625, "global_step": 637076, "epoch": 7675} {"train_loss": -28.56427001953125, "global_step": 637077, "epoch": 7675} {"train_loss": -28.548185348510742, "global_step": 637078, "epoch": 7675} {"train_loss": -28.2165584564209, "global_step": 637079, "epoch": 7675} {"train_loss": -28.458072662353516, "global_step": 637080, "epoch": 7675} {"train_loss": -28.391828536987305, "global_step": 637081, "epoch": 7675} {"train_loss": -28.29656982421875, "global_step": 637082, "epoch": 7675} {"train_loss": -27.993255615234375, "global_step": 637083, "epoch": 7675} {"train_loss": -28.195775985717773, "global_step": 637084, "epoch": 7675} {"train_loss": -28.473495483398438, "global_step": 637085, "epoch": 7675} {"train_loss": -28.34552001953125, "global_step": 637086, "epoch": 7675} {"train_loss": -28.106672286987305, "global_step": 637087, "epoch": 7675} {"train_loss": -28.22003746032715, "global_step": 637088, "epoch": 7675} {"train_loss": -28.186567306518555, "global_step": 637089, "epoch": 7675} {"train_loss": -28.316564559936523, "global_step": 637090, "epoch": 7675} {"train_loss": -28.239334106445312, "global_step": 637091, "epoch": 7675} {"train_loss": -28.204059600830078, "global_step": 637092, "epoch": 7675} {"train_loss": -28.225147247314453, "global_step": 637093, "epoch": 7675} {"train_loss": -28.26385498046875, "global_step": 637094, "epoch": 7675} {"train_loss": -28.757720947265625, "global_step": 637095, "epoch": 7675} {"train_loss": -28.394311904907227, "global_step": 637096, "epoch": 7675} {"train_loss": -28.603269577026367, "global_step": 637097, "epoch": 7675} {"train_loss": -28.479928970336914, "global_step": 637098, "epoch": 7675} {"train_loss": -28.586395263671875, "global_step": 637099, "epoch": 7675} {"train_loss": -28.3903865814209, "global_step": 637100, "epoch": 7675} {"train_loss": -28.401844024658203, "global_step": 637101, "epoch": 7675} {"train_loss": -28.311063766479492, "global_step": 637102, "epoch": 7675} {"train_loss": -28.567657470703125, "global_step": 637103, "epoch": 7675} {"train_loss": -28.309072494506836, "global_step": 637104, "epoch": 7675} {"train_loss": -28.311384201049805, "global_step": 637105, "epoch": 7675} {"train_loss": -28.488269805908203, "global_step": 637106, "epoch": 7675} {"train_loss": -28.035633087158203, "global_step": 637107, "epoch": 7675, "val_loss": 6602851.0} {"train_loss": -27.34592628479004, "global_step": 637108, "epoch": 7676} {"train_loss": -27.548315048217773, "global_step": 637109, "epoch": 7676} {"train_loss": -27.537656784057617, "global_step": 637110, "epoch": 7676} {"train_loss": -27.478620529174805, "global_step": 637111, "epoch": 7676} {"train_loss": -27.109296798706055, "global_step": 637112, "epoch": 7676} {"train_loss": -27.940210342407227, "global_step": 637113, "epoch": 7676} {"train_loss": -27.078245162963867, "global_step": 637114, "epoch": 7676} {"train_loss": -27.321792602539062, "global_step": 637115, "epoch": 7676} {"train_loss": -28.082843780517578, "global_step": 637116, "epoch": 7676} {"train_loss": -27.706151962280273, "global_step": 637117, "epoch": 7676} {"train_loss": -27.166425704956055, "global_step": 637118, "epoch": 7676} {"train_loss": -27.627017974853516, "global_step": 637119, "epoch": 7676} {"train_loss": -27.525915145874023, "global_step": 637120, "epoch": 7676} {"train_loss": -27.645771026611328, "global_step": 637121, "epoch": 7676} {"train_loss": -27.656843185424805, "global_step": 637122, "epoch": 7676} {"train_loss": -27.876440048217773, "global_step": 637123, "epoch": 7676} {"train_loss": -27.980487823486328, "global_step": 637124, "epoch": 7676} {"train_loss": -27.6351318359375, "global_step": 637125, "epoch": 7676} {"train_loss": -28.153284072875977, "global_step": 637126, "epoch": 7676} {"train_loss": -28.034378051757812, "global_step": 637127, "epoch": 7676} {"train_loss": -27.80975341796875, "global_step": 637128, "epoch": 7676} {"train_loss": -27.94158935546875, "global_step": 637129, "epoch": 7676} {"train_loss": -27.975177764892578, "global_step": 637130, "epoch": 7676} {"train_loss": -28.024839401245117, "global_step": 637131, "epoch": 7676} {"train_loss": -28.048208236694336, "global_step": 637132, "epoch": 7676} {"train_loss": -28.369049072265625, "global_step": 637133, "epoch": 7676} {"train_loss": -28.034500122070312, "global_step": 637134, "epoch": 7676} {"train_loss": -28.209699630737305, "global_step": 637135, "epoch": 7676} {"train_loss": -28.25225830078125, "global_step": 637136, "epoch": 7676} {"train_loss": -27.92534828186035, "global_step": 637137, "epoch": 7676} {"train_loss": -28.62917137145996, "global_step": 637138, "epoch": 7676} {"train_loss": -28.0792179107666, "global_step": 637139, "epoch": 7676} {"train_loss": -28.16897964477539, "global_step": 637140, "epoch": 7676} {"train_loss": -28.087385177612305, "global_step": 637141, "epoch": 7676} {"train_loss": -28.168806076049805, "global_step": 637142, "epoch": 7676} {"train_loss": -28.424970626831055, "global_step": 637143, "epoch": 7676} {"train_loss": -27.90638542175293, "global_step": 637144, "epoch": 7676} {"train_loss": -28.2337589263916, "global_step": 637145, "epoch": 7676} {"train_loss": -28.11932945251465, "global_step": 637146, "epoch": 7676} {"train_loss": -28.03187370300293, "global_step": 637147, "epoch": 7676} {"train_loss": -28.089746475219727, "global_step": 637148, "epoch": 7676} {"train_loss": -28.1214599609375, "global_step": 637149, "epoch": 7676} {"train_loss": -28.4329776763916, "global_step": 637150, "epoch": 7676} {"train_loss": -28.404254913330078, "global_step": 637151, "epoch": 7676} {"train_loss": -28.4931697845459, "global_step": 637152, "epoch": 7676} {"train_loss": -28.237268447875977, "global_step": 637153, "epoch": 7676} {"train_loss": -28.325910568237305, "global_step": 637154, "epoch": 7676} {"train_loss": -28.682409286499023, "global_step": 637155, "epoch": 7676} {"train_loss": -27.928037643432617, "global_step": 637156, "epoch": 7676} {"train_loss": -28.201852798461914, "global_step": 637157, "epoch": 7676} {"train_loss": -28.803247451782227, "global_step": 637158, "epoch": 7676} {"train_loss": -28.209857940673828, "global_step": 637159, "epoch": 7676} {"train_loss": -28.396162033081055, "global_step": 637160, "epoch": 7676} {"train_loss": -28.22525978088379, "global_step": 637161, "epoch": 7676} {"train_loss": -28.67243766784668, "global_step": 637162, "epoch": 7676} {"train_loss": -28.26422691345215, "global_step": 637163, "epoch": 7676} {"train_loss": -28.309778213500977, "global_step": 637164, "epoch": 7676} {"train_loss": -28.523681640625, "global_step": 637165, "epoch": 7676} {"train_loss": -28.34400749206543, "global_step": 637166, "epoch": 7676} {"train_loss": -28.22273826599121, "global_step": 637167, "epoch": 7676} {"train_loss": -28.53059196472168, "global_step": 637168, "epoch": 7676} {"train_loss": -28.62810707092285, "global_step": 637169, "epoch": 7676} {"train_loss": -28.55301284790039, "global_step": 637170, "epoch": 7676} {"train_loss": -28.54518699645996, "global_step": 637171, "epoch": 7676} {"train_loss": -28.8874568939209, "global_step": 637172, "epoch": 7676} {"train_loss": -28.513275146484375, "global_step": 637173, "epoch": 7676} {"train_loss": -28.525659561157227, "global_step": 637174, "epoch": 7676} {"train_loss": -28.556842803955078, "global_step": 637175, "epoch": 7676} {"train_loss": -28.706995010375977, "global_step": 637176, "epoch": 7676} {"train_loss": -28.563642501831055, "global_step": 637177, "epoch": 7676} {"train_loss": -28.329822540283203, "global_step": 637178, "epoch": 7676} {"train_loss": -27.97393226623535, "global_step": 637179, "epoch": 7676} {"train_loss": -27.61932373046875, "global_step": 637180, "epoch": 7676} {"train_loss": -27.642480850219727, "global_step": 637181, "epoch": 7676} {"train_loss": -27.708200454711914, "global_step": 637182, "epoch": 7676} {"train_loss": -28.400129318237305, "global_step": 637183, "epoch": 7676} {"train_loss": -28.19756507873535, "global_step": 637184, "epoch": 7676} {"train_loss": -28.247314453125, "global_step": 637185, "epoch": 7676} {"train_loss": -27.818195343017578, "global_step": 637186, "epoch": 7676} {"train_loss": -27.871423721313477, "global_step": 637187, "epoch": 7676} {"train_loss": -28.16568946838379, "global_step": 637188, "epoch": 7676} {"train_loss": -28.601978302001953, "global_step": 637189, "epoch": 7676} {"train_loss": -28.09622013138001, "global_step": 637190, "epoch": 7676, "val_loss": 6615683.0} {"train_loss": -26.15390396118164, "global_step": 637191, "epoch": 7677} {"train_loss": -27.694839477539062, "global_step": 637192, "epoch": 7677} {"train_loss": -26.542978286743164, "global_step": 637193, "epoch": 7677} {"train_loss": -26.217151641845703, "global_step": 637194, "epoch": 7677} {"train_loss": -27.57147216796875, "global_step": 637195, "epoch": 7677} {"train_loss": -27.217609405517578, "global_step": 637196, "epoch": 7677} {"train_loss": -27.009296417236328, "global_step": 637197, "epoch": 7677} {"train_loss": -27.164777755737305, "global_step": 637198, "epoch": 7677} {"train_loss": -26.77705192565918, "global_step": 637199, "epoch": 7677} {"train_loss": -27.271467208862305, "global_step": 637200, "epoch": 7677} {"train_loss": -27.31707191467285, "global_step": 637201, "epoch": 7677} {"train_loss": -27.103307723999023, "global_step": 637202, "epoch": 7677} {"train_loss": -27.283185958862305, "global_step": 637203, "epoch": 7677} {"train_loss": -27.04850196838379, "global_step": 637204, "epoch": 7677} {"train_loss": -27.86799430847168, "global_step": 637205, "epoch": 7677} {"train_loss": -27.160572052001953, "global_step": 637206, "epoch": 7677} {"train_loss": -27.43342399597168, "global_step": 637207, "epoch": 7677} {"train_loss": -27.433074951171875, "global_step": 637208, "epoch": 7677} {"train_loss": -27.838003158569336, "global_step": 637209, "epoch": 7677} {"train_loss": -27.497617721557617, "global_step": 637210, "epoch": 7677} {"train_loss": -27.796249389648438, "global_step": 637211, "epoch": 7677} {"train_loss": -27.614599227905273, "global_step": 637212, "epoch": 7677} {"train_loss": -27.74885368347168, "global_step": 637213, "epoch": 7677} {"train_loss": -27.507587432861328, "global_step": 637214, "epoch": 7677} {"train_loss": -27.9759578704834, "global_step": 637215, "epoch": 7677} {"train_loss": -28.0015811920166, "global_step": 637216, "epoch": 7677} {"train_loss": -28.014020919799805, "global_step": 637217, "epoch": 7677} {"train_loss": -27.989484786987305, "global_step": 637218, "epoch": 7677} {"train_loss": -27.8419246673584, "global_step": 637219, "epoch": 7677} {"train_loss": -27.997116088867188, "global_step": 637220, "epoch": 7677} {"train_loss": -28.044519424438477, "global_step": 637221, "epoch": 7677} {"train_loss": -27.72491455078125, "global_step": 637222, "epoch": 7677} {"train_loss": -27.5397891998291, "global_step": 637223, "epoch": 7677} {"train_loss": -27.86834716796875, "global_step": 637224, "epoch": 7677} {"train_loss": -28.09705924987793, "global_step": 637225, "epoch": 7677} {"train_loss": -28.296283721923828, "global_step": 637226, "epoch": 7677} {"train_loss": -28.2545223236084, "global_step": 637227, "epoch": 7677} {"train_loss": -27.91596031188965, "global_step": 637228, "epoch": 7677} {"train_loss": -28.06989860534668, "global_step": 637229, "epoch": 7677} {"train_loss": -27.947208404541016, "global_step": 637230, "epoch": 7677} {"train_loss": -28.102441787719727, "global_step": 637231, "epoch": 7677} {"train_loss": -28.067047119140625, "global_step": 637232, "epoch": 7677} {"train_loss": -28.122589111328125, "global_step": 637233, "epoch": 7677} {"train_loss": -28.33036231994629, "global_step": 637234, "epoch": 7677} {"train_loss": -28.090612411499023, "global_step": 637235, "epoch": 7677} {"train_loss": -27.77618980407715, "global_step": 637236, "epoch": 7677} {"train_loss": -27.9158992767334, "global_step": 637237, "epoch": 7677} {"train_loss": -28.091833114624023, "global_step": 637238, "epoch": 7677} {"train_loss": -27.925113677978516, "global_step": 637239, "epoch": 7677} {"train_loss": -28.1887264251709, "global_step": 637240, "epoch": 7677} {"train_loss": -28.201740264892578, "global_step": 637241, "epoch": 7677} {"train_loss": -28.33329200744629, "global_step": 637242, "epoch": 7677} {"train_loss": -27.835012435913086, "global_step": 637243, "epoch": 7677} {"train_loss": -28.46052360534668, "global_step": 637244, "epoch": 7677} {"train_loss": -28.253284454345703, "global_step": 637245, "epoch": 7677} {"train_loss": -28.295209884643555, "global_step": 637246, "epoch": 7677} {"train_loss": -28.29831314086914, "global_step": 637247, "epoch": 7677} {"train_loss": -28.741729736328125, "global_step": 637248, "epoch": 7677} {"train_loss": -28.472681045532227, "global_step": 637249, "epoch": 7677} {"train_loss": -28.254846572875977, "global_step": 637250, "epoch": 7677} {"train_loss": -28.288267135620117, "global_step": 637251, "epoch": 7677} {"train_loss": -28.38201332092285, "global_step": 637252, "epoch": 7677} {"train_loss": -28.21697425842285, "global_step": 637253, "epoch": 7677} {"train_loss": -28.22370719909668, "global_step": 637254, "epoch": 7677} {"train_loss": -28.47653579711914, "global_step": 637255, "epoch": 7677} {"train_loss": -28.375202178955078, "global_step": 637256, "epoch": 7677} {"train_loss": -28.342914581298828, "global_step": 637257, "epoch": 7677} {"train_loss": -28.282611846923828, "global_step": 637258, "epoch": 7677} {"train_loss": -28.58748435974121, "global_step": 637259, "epoch": 7677} {"train_loss": -28.68855094909668, "global_step": 637260, "epoch": 7677} {"train_loss": -28.486602783203125, "global_step": 637261, "epoch": 7677} {"train_loss": -28.25984764099121, "global_step": 637262, "epoch": 7677} {"train_loss": -28.253284454345703, "global_step": 637263, "epoch": 7677} {"train_loss": -27.975418090820312, "global_step": 637264, "epoch": 7677} {"train_loss": -28.672269821166992, "global_step": 637265, "epoch": 7677} {"train_loss": -28.05938148498535, "global_step": 637266, "epoch": 7677} {"train_loss": -28.263263702392578, "global_step": 637267, "epoch": 7677} {"train_loss": -28.227954864501953, "global_step": 637268, "epoch": 7677} {"train_loss": -28.190826416015625, "global_step": 637269, "epoch": 7677} {"train_loss": -28.112445831298828, "global_step": 637270, "epoch": 7677} {"train_loss": -28.090396881103516, "global_step": 637271, "epoch": 7677} {"train_loss": -28.0830078125, "global_step": 637272, "epoch": 7677} {"train_loss": -27.909703541951007, "global_step": 637273, "epoch": 7677, "val_loss": 6613523.0} {"train_loss": -27.694128036499023, "global_step": 637274, "epoch": 7678} {"train_loss": -27.751117706298828, "global_step": 637275, "epoch": 7678} {"train_loss": -27.34696388244629, "global_step": 637276, "epoch": 7678} {"train_loss": -27.49824333190918, "global_step": 637277, "epoch": 7678} {"train_loss": -27.76337242126465, "global_step": 637278, "epoch": 7678} {"train_loss": -27.686681747436523, "global_step": 637279, "epoch": 7678} {"train_loss": -27.38572120666504, "global_step": 637280, "epoch": 7678} {"train_loss": -27.680984497070312, "global_step": 637281, "epoch": 7678} {"train_loss": -27.925201416015625, "global_step": 637282, "epoch": 7678} {"train_loss": -27.7196102142334, "global_step": 637283, "epoch": 7678} {"train_loss": -28.145984649658203, "global_step": 637284, "epoch": 7678} {"train_loss": -27.93329429626465, "global_step": 637285, "epoch": 7678} {"train_loss": -28.063276290893555, "global_step": 637286, "epoch": 7678} {"train_loss": -28.27035903930664, "global_step": 637287, "epoch": 7678} {"train_loss": -28.05360221862793, "global_step": 637288, "epoch": 7678} {"train_loss": -28.398550033569336, "global_step": 637289, "epoch": 7678} {"train_loss": -28.240697860717773, "global_step": 637290, "epoch": 7678} {"train_loss": -28.233945846557617, "global_step": 637291, "epoch": 7678} {"train_loss": -28.059946060180664, "global_step": 637292, "epoch": 7678} {"train_loss": -28.209226608276367, "global_step": 637293, "epoch": 7678} {"train_loss": -27.96940040588379, "global_step": 637294, "epoch": 7678} {"train_loss": -28.1658878326416, "global_step": 637295, "epoch": 7678} {"train_loss": -28.142349243164062, "global_step": 637296, "epoch": 7678} {"train_loss": -28.055057525634766, "global_step": 637297, "epoch": 7678} {"train_loss": -28.410974502563477, "global_step": 637298, "epoch": 7678} {"train_loss": -28.32419776916504, "global_step": 637299, "epoch": 7678} {"train_loss": -28.02927017211914, "global_step": 637300, "epoch": 7678} {"train_loss": -28.373886108398438, "global_step": 637301, "epoch": 7678} {"train_loss": -28.1005802154541, "global_step": 637302, "epoch": 7678} {"train_loss": -28.131275177001953, "global_step": 637303, "epoch": 7678} {"train_loss": -28.03809928894043, "global_step": 637304, "epoch": 7678} {"train_loss": -28.506988525390625, "global_step": 637305, "epoch": 7678} {"train_loss": -27.817602157592773, "global_step": 637306, "epoch": 7678} {"train_loss": -28.102298736572266, "global_step": 637307, "epoch": 7678} {"train_loss": -28.009862899780273, "global_step": 637308, "epoch": 7678} {"train_loss": -28.3859920501709, "global_step": 637309, "epoch": 7678} {"train_loss": -27.972675323486328, "global_step": 637310, "epoch": 7678} {"train_loss": -28.151294708251953, "global_step": 637311, "epoch": 7678} {"train_loss": -28.404132843017578, "global_step": 637312, "epoch": 7678} {"train_loss": -28.642221450805664, "global_step": 637313, "epoch": 7678} {"train_loss": -28.41663932800293, "global_step": 637314, "epoch": 7678} {"train_loss": -28.413681030273438, "global_step": 637315, "epoch": 7678} {"train_loss": -28.09697914123535, "global_step": 637316, "epoch": 7678} {"train_loss": -28.43622398376465, "global_step": 637317, "epoch": 7678} {"train_loss": -28.550098419189453, "global_step": 637318, "epoch": 7678} {"train_loss": -28.388975143432617, "global_step": 637319, "epoch": 7678} {"train_loss": -28.527423858642578, "global_step": 637320, "epoch": 7678} {"train_loss": -28.391300201416016, "global_step": 637321, "epoch": 7678} {"train_loss": -28.4209041595459, "global_step": 637322, "epoch": 7678} {"train_loss": -28.083044052124023, "global_step": 637323, "epoch": 7678} {"train_loss": -28.756921768188477, "global_step": 637324, "epoch": 7678} {"train_loss": -28.21719741821289, "global_step": 637325, "epoch": 7678} {"train_loss": -28.563199996948242, "global_step": 637326, "epoch": 7678} {"train_loss": -28.473413467407227, "global_step": 637327, "epoch": 7678} {"train_loss": -27.910785675048828, "global_step": 637328, "epoch": 7678} {"train_loss": -27.823999404907227, "global_step": 637329, "epoch": 7678} {"train_loss": -27.680883407592773, "global_step": 637330, "epoch": 7678} {"train_loss": -25.914655685424805, "global_step": 637331, "epoch": 7678} {"train_loss": -24.597814559936523, "global_step": 637332, "epoch": 7678} {"train_loss": -26.57285499572754, "global_step": 637333, "epoch": 7678} {"train_loss": -28.127613067626953, "global_step": 637334, "epoch": 7678} {"train_loss": -27.56892204284668, "global_step": 637335, "epoch": 7678} {"train_loss": -28.04917335510254, "global_step": 637336, "epoch": 7678} {"train_loss": -27.97382164001465, "global_step": 637337, "epoch": 7678} {"train_loss": -27.74118995666504, "global_step": 637338, "epoch": 7678} {"train_loss": -28.26319694519043, "global_step": 637339, "epoch": 7678} {"train_loss": -27.659530639648438, "global_step": 637340, "epoch": 7678} {"train_loss": -27.97995948791504, "global_step": 637341, "epoch": 7678} {"train_loss": -28.388010025024414, "global_step": 637342, "epoch": 7678} {"train_loss": -27.6723690032959, "global_step": 637343, "epoch": 7678} {"train_loss": -28.180328369140625, "global_step": 637344, "epoch": 7678} {"train_loss": -27.7794246673584, "global_step": 637345, "epoch": 7678} {"train_loss": -27.942859649658203, "global_step": 637346, "epoch": 7678} {"train_loss": -28.101367950439453, "global_step": 637347, "epoch": 7678} {"train_loss": -27.915088653564453, "global_step": 637348, "epoch": 7678} {"train_loss": -28.0589656829834, "global_step": 637349, "epoch": 7678} {"train_loss": -27.55012321472168, "global_step": 637350, "epoch": 7678} {"train_loss": -27.961627960205078, "global_step": 637351, "epoch": 7678} {"train_loss": -28.295856475830078, "global_step": 637352, "epoch": 7678} {"train_loss": -28.015222549438477, "global_step": 637353, "epoch": 7678} {"train_loss": -28.335086822509766, "global_step": 637354, "epoch": 7678} {"train_loss": -28.0396785736084, "global_step": 637355, "epoch": 7678} {"train_loss": -27.98891138743205, "global_step": 637356, "epoch": 7678, "val_loss": 6659153.5} {"train_loss": -27.18031120300293, "global_step": 637357, "epoch": 7679} {"train_loss": -25.97549819946289, "global_step": 637358, "epoch": 7679} {"train_loss": -26.18965721130371, "global_step": 637359, "epoch": 7679} {"train_loss": -25.65590476989746, "global_step": 637360, "epoch": 7679} {"train_loss": -27.154010772705078, "global_step": 637361, "epoch": 7679} {"train_loss": -27.015289306640625, "global_step": 637362, "epoch": 7679} {"train_loss": -27.519229888916016, "global_step": 637363, "epoch": 7679} {"train_loss": -26.828611373901367, "global_step": 637364, "epoch": 7679} {"train_loss": -27.22047233581543, "global_step": 637365, "epoch": 7679} {"train_loss": -27.17982292175293, "global_step": 637366, "epoch": 7679} {"train_loss": -27.427703857421875, "global_step": 637367, "epoch": 7679} {"train_loss": -27.802398681640625, "global_step": 637368, "epoch": 7679} {"train_loss": -27.46748161315918, "global_step": 637369, "epoch": 7679} {"train_loss": -27.663366317749023, "global_step": 637370, "epoch": 7679} {"train_loss": -27.58798599243164, "global_step": 637371, "epoch": 7679} {"train_loss": -27.7391300201416, "global_step": 637372, "epoch": 7679} {"train_loss": -27.64764976501465, "global_step": 637373, "epoch": 7679} {"train_loss": -27.71895408630371, "global_step": 637374, "epoch": 7679} {"train_loss": -27.735626220703125, "global_step": 637375, "epoch": 7679} {"train_loss": -27.712390899658203, "global_step": 637376, "epoch": 7679} {"train_loss": -28.060749053955078, "global_step": 637377, "epoch": 7679} {"train_loss": -27.549163818359375, "global_step": 637378, "epoch": 7679} {"train_loss": -28.038599014282227, "global_step": 637379, "epoch": 7679} {"train_loss": -28.087482452392578, "global_step": 637380, "epoch": 7679} {"train_loss": -27.942731857299805, "global_step": 637381, "epoch": 7679} {"train_loss": -28.237396240234375, "global_step": 637382, "epoch": 7679} {"train_loss": -27.800800323486328, "global_step": 637383, "epoch": 7679} {"train_loss": -28.05859375, "global_step": 637384, "epoch": 7679} {"train_loss": -28.094690322875977, "global_step": 637385, "epoch": 7679} {"train_loss": -28.15766716003418, "global_step": 637386, "epoch": 7679} {"train_loss": -28.329925537109375, "global_step": 637387, "epoch": 7679} {"train_loss": -28.2946720123291, "global_step": 637388, "epoch": 7679} {"train_loss": -28.709003448486328, "global_step": 637389, "epoch": 7679} {"train_loss": -28.261381149291992, "global_step": 637390, "epoch": 7679} {"train_loss": -28.01506996154785, "global_step": 637391, "epoch": 7679} {"train_loss": -28.42352867126465, "global_step": 637392, "epoch": 7679} {"train_loss": -28.112157821655273, "global_step": 637393, "epoch": 7679} {"train_loss": -27.99371910095215, "global_step": 637394, "epoch": 7679} {"train_loss": -28.36016273498535, "global_step": 637395, "epoch": 7679} {"train_loss": -28.096210479736328, "global_step": 637396, "epoch": 7679} {"train_loss": -28.749176025390625, "global_step": 637397, "epoch": 7679} {"train_loss": -28.169082641601562, "global_step": 637398, "epoch": 7679} {"train_loss": -28.508527755737305, "global_step": 637399, "epoch": 7679} {"train_loss": -28.2410831451416, "global_step": 637400, "epoch": 7679} {"train_loss": -28.286457061767578, "global_step": 637401, "epoch": 7679} {"train_loss": -28.5391788482666, "global_step": 637402, "epoch": 7679} {"train_loss": -28.419403076171875, "global_step": 637403, "epoch": 7679} {"train_loss": -28.335691452026367, "global_step": 637404, "epoch": 7679} {"train_loss": -28.43842124938965, "global_step": 637405, "epoch": 7679} {"train_loss": -28.470693588256836, "global_step": 637406, "epoch": 7679} {"train_loss": -28.42629051208496, "global_step": 637407, "epoch": 7679} {"train_loss": -28.232656478881836, "global_step": 637408, "epoch": 7679} {"train_loss": -28.3289852142334, "global_step": 637409, "epoch": 7679} {"train_loss": -28.45999526977539, "global_step": 637410, "epoch": 7679} {"train_loss": -28.43743324279785, "global_step": 637411, "epoch": 7679} {"train_loss": -28.305700302124023, "global_step": 637412, "epoch": 7679} {"train_loss": -28.742847442626953, "global_step": 637413, "epoch": 7679} {"train_loss": -28.332656860351562, "global_step": 637414, "epoch": 7679} {"train_loss": -28.378759384155273, "global_step": 637415, "epoch": 7679} {"train_loss": -28.291828155517578, "global_step": 637416, "epoch": 7679} {"train_loss": -28.48984718322754, "global_step": 637417, "epoch": 7679} {"train_loss": -28.50819206237793, "global_step": 637418, "epoch": 7679} {"train_loss": -28.356647491455078, "global_step": 637419, "epoch": 7679} {"train_loss": -28.747817993164062, "global_step": 637420, "epoch": 7679} {"train_loss": -28.700153350830078, "global_step": 637421, "epoch": 7679} {"train_loss": -28.634449005126953, "global_step": 637422, "epoch": 7679} {"train_loss": -28.23270034790039, "global_step": 637423, "epoch": 7679} {"train_loss": -28.548084259033203, "global_step": 637424, "epoch": 7679} {"train_loss": -28.85544776916504, "global_step": 637425, "epoch": 7679} {"train_loss": -28.600095748901367, "global_step": 637426, "epoch": 7679} {"train_loss": -28.239572525024414, "global_step": 637427, "epoch": 7679} {"train_loss": -28.581701278686523, "global_step": 637428, "epoch": 7679} {"train_loss": -28.173864364624023, "global_step": 637429, "epoch": 7679} {"train_loss": -27.994245529174805, "global_step": 637430, "epoch": 7679} {"train_loss": -28.083959579467773, "global_step": 637431, "epoch": 7679} {"train_loss": -27.363941192626953, "global_step": 637432, "epoch": 7679} {"train_loss": -27.782438278198242, "global_step": 637433, "epoch": 7679} {"train_loss": -27.65150260925293, "global_step": 637434, "epoch": 7679} {"train_loss": -28.537189483642578, "global_step": 637435, "epoch": 7679} {"train_loss": -27.961225509643555, "global_step": 637436, "epoch": 7679} {"train_loss": -28.369531631469727, "global_step": 637437, "epoch": 7679} {"train_loss": -28.35382080078125, "global_step": 637438, "epoch": 7679} {"train_loss": -28.02634105912174, "global_step": 637439, "epoch": 7679, "val_loss": 6645511.5} {"train_loss": -27.29817008972168, "global_step": 637440, "epoch": 7680} {"train_loss": -27.971378326416016, "global_step": 637441, "epoch": 7680} {"train_loss": -27.67340087890625, "global_step": 637442, "epoch": 7680} {"train_loss": -27.7293701171875, "global_step": 637443, "epoch": 7680} {"train_loss": -27.517963409423828, "global_step": 637444, "epoch": 7680} {"train_loss": -27.51761817932129, "global_step": 637445, "epoch": 7680} {"train_loss": -27.59225845336914, "global_step": 637446, "epoch": 7680} {"train_loss": -27.943212509155273, "global_step": 637447, "epoch": 7680} {"train_loss": -27.56825065612793, "global_step": 637448, "epoch": 7680} {"train_loss": -27.510730743408203, "global_step": 637449, "epoch": 7680} {"train_loss": -27.667072296142578, "global_step": 637450, "epoch": 7680} {"train_loss": -28.053205490112305, "global_step": 637451, "epoch": 7680} {"train_loss": -27.6468563079834, "global_step": 637452, "epoch": 7680} {"train_loss": -27.865461349487305, "global_step": 637453, "epoch": 7680} {"train_loss": -28.00221061706543, "global_step": 637454, "epoch": 7680} {"train_loss": -28.043737411499023, "global_step": 637455, "epoch": 7680} {"train_loss": -28.02998161315918, "global_step": 637456, "epoch": 7680} {"train_loss": -28.0255126953125, "global_step": 637457, "epoch": 7680} {"train_loss": -27.83668327331543, "global_step": 637458, "epoch": 7680} {"train_loss": -27.9641170501709, "global_step": 637459, "epoch": 7680} {"train_loss": -27.944555282592773, "global_step": 637460, "epoch": 7680} {"train_loss": -28.14820671081543, "global_step": 637461, "epoch": 7680} {"train_loss": -27.383930206298828, "global_step": 637462, "epoch": 7680} {"train_loss": -27.961612701416016, "global_step": 637463, "epoch": 7680} {"train_loss": -27.74007225036621, "global_step": 637464, "epoch": 7680} {"train_loss": -28.325796127319336, "global_step": 637465, "epoch": 7680} {"train_loss": -28.164657592773438, "global_step": 637466, "epoch": 7680} {"train_loss": -28.309967041015625, "global_step": 637467, "epoch": 7680} {"train_loss": -28.608142852783203, "global_step": 637468, "epoch": 7680} {"train_loss": -28.27180290222168, "global_step": 637469, "epoch": 7680} {"train_loss": -27.982467651367188, "global_step": 637470, "epoch": 7680} {"train_loss": -27.974700927734375, "global_step": 637471, "epoch": 7680} {"train_loss": -28.214553833007812, "global_step": 637472, "epoch": 7680} {"train_loss": -28.014860153198242, "global_step": 637473, "epoch": 7680} {"train_loss": -28.512033462524414, "global_step": 637474, "epoch": 7680} {"train_loss": -28.575164794921875, "global_step": 637475, "epoch": 7680} {"train_loss": -28.340559005737305, "global_step": 637476, "epoch": 7680} {"train_loss": -28.046894073486328, "global_step": 637477, "epoch": 7680} {"train_loss": -28.1646671295166, "global_step": 637478, "epoch": 7680} {"train_loss": -28.424036026000977, "global_step": 637479, "epoch": 7680} {"train_loss": -28.20942497253418, "global_step": 637480, "epoch": 7680} {"train_loss": -28.49641227722168, "global_step": 637481, "epoch": 7680} {"train_loss": -28.36529541015625, "global_step": 637482, "epoch": 7680} {"train_loss": -28.104736328125, "global_step": 637483, "epoch": 7680} {"train_loss": -28.45649528503418, "global_step": 637484, "epoch": 7680} {"train_loss": -28.562707901000977, "global_step": 637485, "epoch": 7680} {"train_loss": -28.61333656311035, "global_step": 637486, "epoch": 7680} {"train_loss": -28.360828399658203, "global_step": 637487, "epoch": 7680} {"train_loss": -28.406736373901367, "global_step": 637488, "epoch": 7680} {"train_loss": -28.173358917236328, "global_step": 637489, "epoch": 7680} {"train_loss": -28.219663619995117, "global_step": 637490, "epoch": 7680} {"train_loss": -28.4261474609375, "global_step": 637491, "epoch": 7680} {"train_loss": -28.59650230407715, "global_step": 637492, "epoch": 7680} {"train_loss": -28.5637149810791, "global_step": 637493, "epoch": 7680} {"train_loss": -28.493133544921875, "global_step": 637494, "epoch": 7680} {"train_loss": -28.37812614440918, "global_step": 637495, "epoch": 7680} {"train_loss": -28.33685874938965, "global_step": 637496, "epoch": 7680} {"train_loss": -28.287939071655273, "global_step": 637497, "epoch": 7680} {"train_loss": -28.419677734375, "global_step": 637498, "epoch": 7680} {"train_loss": -28.54554557800293, "global_step": 637499, "epoch": 7680} {"train_loss": -28.295820236206055, "global_step": 637500, "epoch": 7680} {"train_loss": -28.709897994995117, "global_step": 637501, "epoch": 7680} {"train_loss": -28.180160522460938, "global_step": 637502, "epoch": 7680} {"train_loss": -28.053024291992188, "global_step": 637503, "epoch": 7680} {"train_loss": -28.774011611938477, "global_step": 637504, "epoch": 7680} {"train_loss": -28.145261764526367, "global_step": 637505, "epoch": 7680} {"train_loss": -28.173898696899414, "global_step": 637506, "epoch": 7680} {"train_loss": -28.338348388671875, "global_step": 637507, "epoch": 7680} {"train_loss": -28.07537841796875, "global_step": 637508, "epoch": 7680} {"train_loss": -28.087926864624023, "global_step": 637509, "epoch": 7680} {"train_loss": -28.401905059814453, "global_step": 637510, "epoch": 7680} {"train_loss": -27.93075942993164, "global_step": 637511, "epoch": 7680} {"train_loss": -28.1184024810791, "global_step": 637512, "epoch": 7680} {"train_loss": -27.84086036682129, "global_step": 637513, "epoch": 7680} {"train_loss": -27.988311767578125, "global_step": 637514, "epoch": 7680} {"train_loss": -27.921051025390625, "global_step": 637515, "epoch": 7680} {"train_loss": -28.237689971923828, "global_step": 637516, "epoch": 7680} {"train_loss": -28.239532470703125, "global_step": 637517, "epoch": 7680} {"train_loss": -28.15150260925293, "global_step": 637518, "epoch": 7680} {"train_loss": -28.14540672302246, "global_step": 637519, "epoch": 7680} {"train_loss": -27.965482711791992, "global_step": 637520, "epoch": 7680} {"train_loss": -28.34345054626465, "global_step": 637521, "epoch": 7680} {"train_loss": -28.132081479911346, "global_step": 637522, "epoch": 7680, "val_loss": 6608902.5} {"train_loss": -27.101301193237305, "global_step": 637523, "epoch": 7681} {"train_loss": -27.262170791625977, "global_step": 637524, "epoch": 7681} {"train_loss": -27.37275505065918, "global_step": 637525, "epoch": 7681} {"train_loss": -27.18362808227539, "global_step": 637526, "epoch": 7681} {"train_loss": -27.049869537353516, "global_step": 637527, "epoch": 7681} {"train_loss": -27.61760902404785, "global_step": 637528, "epoch": 7681} {"train_loss": -27.194055557250977, "global_step": 637529, "epoch": 7681} {"train_loss": -26.962690353393555, "global_step": 637530, "epoch": 7681} {"train_loss": -27.0476131439209, "global_step": 637531, "epoch": 7681} {"train_loss": -26.989526748657227, "global_step": 637532, "epoch": 7681} {"train_loss": -27.364816665649414, "global_step": 637533, "epoch": 7681} {"train_loss": -27.594650268554688, "global_step": 637534, "epoch": 7681} {"train_loss": -27.668249130249023, "global_step": 637535, "epoch": 7681} {"train_loss": -26.92421531677246, "global_step": 637536, "epoch": 7681} {"train_loss": -27.294300079345703, "global_step": 637537, "epoch": 7681} {"train_loss": -27.742755889892578, "global_step": 637538, "epoch": 7681} {"train_loss": -27.71063804626465, "global_step": 637539, "epoch": 7681} {"train_loss": -27.7542667388916, "global_step": 637540, "epoch": 7681} {"train_loss": -27.438831329345703, "global_step": 637541, "epoch": 7681} {"train_loss": -27.85540199279785, "global_step": 637542, "epoch": 7681} {"train_loss": -27.545276641845703, "global_step": 637543, "epoch": 7681} {"train_loss": -27.597448348999023, "global_step": 637544, "epoch": 7681} {"train_loss": -27.891122817993164, "global_step": 637545, "epoch": 7681} {"train_loss": -27.750402450561523, "global_step": 637546, "epoch": 7681} {"train_loss": -27.9163761138916, "global_step": 637547, "epoch": 7681} {"train_loss": -28.093053817749023, "global_step": 637548, "epoch": 7681} {"train_loss": -28.334125518798828, "global_step": 637549, "epoch": 7681} {"train_loss": -27.999103546142578, "global_step": 637550, "epoch": 7681} {"train_loss": -27.950428009033203, "global_step": 637551, "epoch": 7681} {"train_loss": -28.22344970703125, "global_step": 637552, "epoch": 7681} {"train_loss": -27.825292587280273, "global_step": 637553, "epoch": 7681} {"train_loss": -28.4384708404541, "global_step": 637554, "epoch": 7681} {"train_loss": -28.377286911010742, "global_step": 637555, "epoch": 7681} {"train_loss": -27.65229606628418, "global_step": 637556, "epoch": 7681} {"train_loss": -28.09705924987793, "global_step": 637557, "epoch": 7681} {"train_loss": -28.21718406677246, "global_step": 637558, "epoch": 7681} {"train_loss": -28.13545799255371, "global_step": 637559, "epoch": 7681} {"train_loss": -28.153095245361328, "global_step": 637560, "epoch": 7681} {"train_loss": -28.39716911315918, "global_step": 637561, "epoch": 7681} {"train_loss": -28.16005516052246, "global_step": 637562, "epoch": 7681} {"train_loss": -28.432119369506836, "global_step": 637563, "epoch": 7681} {"train_loss": -28.487171173095703, "global_step": 637564, "epoch": 7681} {"train_loss": -28.1063289642334, "global_step": 637565, "epoch": 7681} {"train_loss": -28.508996963500977, "global_step": 637566, "epoch": 7681} {"train_loss": -28.300708770751953, "global_step": 637567, "epoch": 7681} {"train_loss": -28.07657814025879, "global_step": 637568, "epoch": 7681} {"train_loss": -28.36602210998535, "global_step": 637569, "epoch": 7681} {"train_loss": -28.553058624267578, "global_step": 637570, "epoch": 7681} {"train_loss": -28.092575073242188, "global_step": 637571, "epoch": 7681} {"train_loss": -28.619342803955078, "global_step": 637572, "epoch": 7681} {"train_loss": -28.2598934173584, "global_step": 637573, "epoch": 7681} {"train_loss": -28.293180465698242, "global_step": 637574, "epoch": 7681} {"train_loss": -28.391767501831055, "global_step": 637575, "epoch": 7681} {"train_loss": -28.031085968017578, "global_step": 637576, "epoch": 7681} {"train_loss": -28.35479164123535, "global_step": 637577, "epoch": 7681} {"train_loss": -28.66753578186035, "global_step": 637578, "epoch": 7681} {"train_loss": -28.432668685913086, "global_step": 637579, "epoch": 7681} {"train_loss": -28.46103286743164, "global_step": 637580, "epoch": 7681} {"train_loss": -28.502836227416992, "global_step": 637581, "epoch": 7681} {"train_loss": -28.45151710510254, "global_step": 637582, "epoch": 7681} {"train_loss": -28.241037368774414, "global_step": 637583, "epoch": 7681} {"train_loss": -28.51618003845215, "global_step": 637584, "epoch": 7681} {"train_loss": -28.32527732849121, "global_step": 637585, "epoch": 7681} {"train_loss": -28.6165828704834, "global_step": 637586, "epoch": 7681} {"train_loss": -28.591053009033203, "global_step": 637587, "epoch": 7681} {"train_loss": -28.416284561157227, "global_step": 637588, "epoch": 7681} {"train_loss": -28.54969596862793, "global_step": 637589, "epoch": 7681} {"train_loss": -28.37006187438965, "global_step": 637590, "epoch": 7681} {"train_loss": -28.37110710144043, "global_step": 637591, "epoch": 7681} {"train_loss": -28.646747589111328, "global_step": 637592, "epoch": 7681} {"train_loss": -28.160633087158203, "global_step": 637593, "epoch": 7681} {"train_loss": -28.023584365844727, "global_step": 637594, "epoch": 7681} {"train_loss": -27.040332794189453, "global_step": 637595, "epoch": 7681} {"train_loss": -26.08621597290039, "global_step": 637596, "epoch": 7681} {"train_loss": -26.044538497924805, "global_step": 637597, "epoch": 7681} {"train_loss": -27.598316192626953, "global_step": 637598, "epoch": 7681} {"train_loss": -27.639251708984375, "global_step": 637599, "epoch": 7681} {"train_loss": -27.08026695251465, "global_step": 637600, "epoch": 7681} {"train_loss": -27.789997100830078, "global_step": 637601, "epoch": 7681} {"train_loss": -27.670074462890625, "global_step": 637602, "epoch": 7681} {"train_loss": -28.167224884033203, "global_step": 637603, "epoch": 7681} {"train_loss": -27.75848960876465, "global_step": 637604, "epoch": 7681} {"train_loss": -27.91013269539339, "global_step": 637605, "epoch": 7681, "val_loss": 6586469.0} {"train_loss": -27.126569747924805, "global_step": 637606, "epoch": 7682} {"train_loss": -26.26023292541504, "global_step": 637607, "epoch": 7682} {"train_loss": -27.103290557861328, "global_step": 637608, "epoch": 7682} {"train_loss": -26.8724365234375, "global_step": 637609, "epoch": 7682} {"train_loss": -26.72553825378418, "global_step": 637610, "epoch": 7682} {"train_loss": -27.11138343811035, "global_step": 637611, "epoch": 7682} {"train_loss": -27.234912872314453, "global_step": 637612, "epoch": 7682} {"train_loss": -27.234668731689453, "global_step": 637613, "epoch": 7682} {"train_loss": -27.4674015045166, "global_step": 637614, "epoch": 7682} {"train_loss": -27.377445220947266, "global_step": 637615, "epoch": 7682} {"train_loss": -27.23935317993164, "global_step": 637616, "epoch": 7682} {"train_loss": -27.147932052612305, "global_step": 637617, "epoch": 7682} {"train_loss": -27.48188591003418, "global_step": 637618, "epoch": 7682} {"train_loss": -27.507369995117188, "global_step": 637619, "epoch": 7682} {"train_loss": -27.578168869018555, "global_step": 637620, "epoch": 7682} {"train_loss": -27.6232967376709, "global_step": 637621, "epoch": 7682} {"train_loss": -28.1121768951416, "global_step": 637622, "epoch": 7682} {"train_loss": -27.562963485717773, "global_step": 637623, "epoch": 7682} {"train_loss": -27.51495361328125, "global_step": 637624, "epoch": 7682} {"train_loss": -27.913726806640625, "global_step": 637625, "epoch": 7682} {"train_loss": -28.122528076171875, "global_step": 637626, "epoch": 7682} {"train_loss": -27.775293350219727, "global_step": 637627, "epoch": 7682} {"train_loss": -27.677305221557617, "global_step": 637628, "epoch": 7682} {"train_loss": -28.146215438842773, "global_step": 637629, "epoch": 7682} {"train_loss": -27.841894149780273, "global_step": 637630, "epoch": 7682} {"train_loss": -27.804967880249023, "global_step": 637631, "epoch": 7682} {"train_loss": -28.059232711791992, "global_step": 637632, "epoch": 7682} {"train_loss": -27.66062355041504, "global_step": 637633, "epoch": 7682} {"train_loss": -27.723249435424805, "global_step": 637634, "epoch": 7682} {"train_loss": -28.338171005249023, "global_step": 637635, "epoch": 7682} {"train_loss": -28.194101333618164, "global_step": 637636, "epoch": 7682} {"train_loss": -27.975452423095703, "global_step": 637637, "epoch": 7682} {"train_loss": -28.2529239654541, "global_step": 637638, "epoch": 7682} {"train_loss": -28.19879722595215, "global_step": 637639, "epoch": 7682} {"train_loss": -27.978662490844727, "global_step": 637640, "epoch": 7682} {"train_loss": -27.94611167907715, "global_step": 637641, "epoch": 7682} {"train_loss": -28.2503719329834, "global_step": 637642, "epoch": 7682} {"train_loss": -28.473834991455078, "global_step": 637643, "epoch": 7682} {"train_loss": -28.39499855041504, "global_step": 637644, "epoch": 7682} {"train_loss": -28.25530433654785, "global_step": 637645, "epoch": 7682} {"train_loss": -28.063922882080078, "global_step": 637646, "epoch": 7682} {"train_loss": -28.117115020751953, "global_step": 637647, "epoch": 7682} {"train_loss": -27.8551025390625, "global_step": 637648, "epoch": 7682} {"train_loss": -28.64451026916504, "global_step": 637649, "epoch": 7682} {"train_loss": -28.59771156311035, "global_step": 637650, "epoch": 7682} {"train_loss": -28.525482177734375, "global_step": 637651, "epoch": 7682} {"train_loss": -28.384204864501953, "global_step": 637652, "epoch": 7682} {"train_loss": -28.491514205932617, "global_step": 637653, "epoch": 7682} {"train_loss": -28.290912628173828, "global_step": 637654, "epoch": 7682} {"train_loss": -28.655963897705078, "global_step": 637655, "epoch": 7682} {"train_loss": -28.461938858032227, "global_step": 637656, "epoch": 7682} {"train_loss": -28.498682022094727, "global_step": 637657, "epoch": 7682} {"train_loss": -28.190317153930664, "global_step": 637658, "epoch": 7682} {"train_loss": -28.415380477905273, "global_step": 637659, "epoch": 7682} {"train_loss": -28.763818740844727, "global_step": 637660, "epoch": 7682} {"train_loss": -28.375812530517578, "global_step": 637661, "epoch": 7682} {"train_loss": -28.74845314025879, "global_step": 637662, "epoch": 7682} {"train_loss": -28.583362579345703, "global_step": 637663, "epoch": 7682} {"train_loss": -28.622217178344727, "global_step": 637664, "epoch": 7682} {"train_loss": -28.43231201171875, "global_step": 637665, "epoch": 7682} {"train_loss": -28.491607666015625, "global_step": 637666, "epoch": 7682} {"train_loss": -28.640888214111328, "global_step": 637667, "epoch": 7682} {"train_loss": -28.469995498657227, "global_step": 637668, "epoch": 7682} {"train_loss": -28.19074058532715, "global_step": 637669, "epoch": 7682} {"train_loss": -27.9501953125, "global_step": 637670, "epoch": 7682} {"train_loss": -27.76137351989746, "global_step": 637671, "epoch": 7682} {"train_loss": -27.738168716430664, "global_step": 637672, "epoch": 7682} {"train_loss": -28.27359962463379, "global_step": 637673, "epoch": 7682} {"train_loss": -28.337873458862305, "global_step": 637674, "epoch": 7682} {"train_loss": -28.15960121154785, "global_step": 637675, "epoch": 7682} {"train_loss": -27.97255516052246, "global_step": 637676, "epoch": 7682} {"train_loss": -28.27888298034668, "global_step": 637677, "epoch": 7682} {"train_loss": -28.320728302001953, "global_step": 637678, "epoch": 7682} {"train_loss": -27.949893951416016, "global_step": 637679, "epoch": 7682} {"train_loss": -28.672088623046875, "global_step": 637680, "epoch": 7682} {"train_loss": -28.52996826171875, "global_step": 637681, "epoch": 7682} {"train_loss": -28.176624298095703, "global_step": 637682, "epoch": 7682} {"train_loss": -28.09473991394043, "global_step": 637683, "epoch": 7682} {"train_loss": -28.189239501953125, "global_step": 637684, "epoch": 7682} {"train_loss": -28.639921188354492, "global_step": 637685, "epoch": 7682} {"train_loss": -28.809675216674805, "global_step": 637686, "epoch": 7682} {"train_loss": -28.29060173034668, "global_step": 637687, "epoch": 7682} {"train_loss": -28.024665303977137, "global_step": 637688, "epoch": 7682, "val_loss": 6650289.0} {"train_loss": -27.77339744567871, "global_step": 637689, "epoch": 7683} {"train_loss": -27.389429092407227, "global_step": 637690, "epoch": 7683} {"train_loss": -27.842529296875, "global_step": 637691, "epoch": 7683} {"train_loss": -27.499658584594727, "global_step": 637692, "epoch": 7683} {"train_loss": -27.833993911743164, "global_step": 637693, "epoch": 7683} {"train_loss": -27.577381134033203, "global_step": 637694, "epoch": 7683} {"train_loss": -27.513214111328125, "global_step": 637695, "epoch": 7683} {"train_loss": -27.20136833190918, "global_step": 637696, "epoch": 7683} {"train_loss": -27.91794204711914, "global_step": 637697, "epoch": 7683} {"train_loss": -27.676666259765625, "global_step": 637698, "epoch": 7683} {"train_loss": -27.6738224029541, "global_step": 637699, "epoch": 7683} {"train_loss": -27.824954986572266, "global_step": 637700, "epoch": 7683} {"train_loss": -27.682565689086914, "global_step": 637701, "epoch": 7683} {"train_loss": -27.808807373046875, "global_step": 637702, "epoch": 7683} {"train_loss": -27.457178115844727, "global_step": 637703, "epoch": 7683} {"train_loss": -27.87320327758789, "global_step": 637704, "epoch": 7683} {"train_loss": -27.713226318359375, "global_step": 637705, "epoch": 7683} {"train_loss": -28.090225219726562, "global_step": 637706, "epoch": 7683} {"train_loss": -28.199941635131836, "global_step": 637707, "epoch": 7683} {"train_loss": -27.592254638671875, "global_step": 637708, "epoch": 7683} {"train_loss": -27.668018341064453, "global_step": 637709, "epoch": 7683} {"train_loss": -28.063434600830078, "global_step": 637710, "epoch": 7683} {"train_loss": -27.64046287536621, "global_step": 637711, "epoch": 7683} {"train_loss": -28.063180923461914, "global_step": 637712, "epoch": 7683} {"train_loss": -27.87240982055664, "global_step": 637713, "epoch": 7683} {"train_loss": -28.098190307617188, "global_step": 637714, "epoch": 7683} {"train_loss": -27.89082145690918, "global_step": 637715, "epoch": 7683} {"train_loss": -28.075393676757812, "global_step": 637716, "epoch": 7683} {"train_loss": -28.21901512145996, "global_step": 637717, "epoch": 7683} {"train_loss": -27.7767391204834, "global_step": 637718, "epoch": 7683} {"train_loss": -28.09429359436035, "global_step": 637719, "epoch": 7683} {"train_loss": -28.2322998046875, "global_step": 637720, "epoch": 7683} {"train_loss": -28.069955825805664, "global_step": 637721, "epoch": 7683} {"train_loss": -28.245254516601562, "global_step": 637722, "epoch": 7683} {"train_loss": -27.954254150390625, "global_step": 637723, "epoch": 7683} {"train_loss": -28.160968780517578, "global_step": 637724, "epoch": 7683} {"train_loss": -28.1645565032959, "global_step": 637725, "epoch": 7683} {"train_loss": -28.227216720581055, "global_step": 637726, "epoch": 7683} {"train_loss": -28.078540802001953, "global_step": 637727, "epoch": 7683} {"train_loss": -27.903234481811523, "global_step": 637728, "epoch": 7683} {"train_loss": -27.961069107055664, "global_step": 637729, "epoch": 7683} {"train_loss": -28.122833251953125, "global_step": 637730, "epoch": 7683} {"train_loss": -27.938032150268555, "global_step": 637731, "epoch": 7683} {"train_loss": -28.224018096923828, "global_step": 637732, "epoch": 7683} {"train_loss": -28.38833999633789, "global_step": 637733, "epoch": 7683} {"train_loss": -28.345478057861328, "global_step": 637734, "epoch": 7683} {"train_loss": -28.240583419799805, "global_step": 637735, "epoch": 7683} {"train_loss": -28.2452449798584, "global_step": 637736, "epoch": 7683} {"train_loss": -28.29678726196289, "global_step": 637737, "epoch": 7683} {"train_loss": -28.489526748657227, "global_step": 637738, "epoch": 7683} {"train_loss": -28.065021514892578, "global_step": 637739, "epoch": 7683} {"train_loss": -28.555471420288086, "global_step": 637740, "epoch": 7683} {"train_loss": -28.629745483398438, "global_step": 637741, "epoch": 7683} {"train_loss": -28.706546783447266, "global_step": 637742, "epoch": 7683} {"train_loss": -28.531726837158203, "global_step": 637743, "epoch": 7683} {"train_loss": -28.476858139038086, "global_step": 637744, "epoch": 7683} {"train_loss": -28.417402267456055, "global_step": 637745, "epoch": 7683} {"train_loss": -28.609893798828125, "global_step": 637746, "epoch": 7683} {"train_loss": -28.546833038330078, "global_step": 637747, "epoch": 7683} {"train_loss": -28.462970733642578, "global_step": 637748, "epoch": 7683} {"train_loss": -28.671300888061523, "global_step": 637749, "epoch": 7683} {"train_loss": -28.655033111572266, "global_step": 637750, "epoch": 7683} {"train_loss": -28.019025802612305, "global_step": 637751, "epoch": 7683} {"train_loss": -27.61501121520996, "global_step": 637752, "epoch": 7683} {"train_loss": -27.641056060791016, "global_step": 637753, "epoch": 7683} {"train_loss": -27.794103622436523, "global_step": 637754, "epoch": 7683} {"train_loss": -27.856435775756836, "global_step": 637755, "epoch": 7683} {"train_loss": -27.854949951171875, "global_step": 637756, "epoch": 7683} {"train_loss": -27.914560317993164, "global_step": 637757, "epoch": 7683} {"train_loss": -27.726037979125977, "global_step": 637758, "epoch": 7683} {"train_loss": -27.41299819946289, "global_step": 637759, "epoch": 7683} {"train_loss": -27.560779571533203, "global_step": 637760, "epoch": 7683} {"train_loss": -27.63495445251465, "global_step": 637761, "epoch": 7683} {"train_loss": -26.806995391845703, "global_step": 637762, "epoch": 7683} {"train_loss": -27.172107696533203, "global_step": 637763, "epoch": 7683} {"train_loss": -27.36333656311035, "global_step": 637764, "epoch": 7683} {"train_loss": -27.524213790893555, "global_step": 637765, "epoch": 7683} {"train_loss": -27.620838165283203, "global_step": 637766, "epoch": 7683} {"train_loss": -27.47572898864746, "global_step": 637767, "epoch": 7683} {"train_loss": -27.37554931640625, "global_step": 637768, "epoch": 7683} {"train_loss": -27.97367286682129, "global_step": 637769, "epoch": 7683} {"train_loss": -27.536436080932617, "global_step": 637770, "epoch": 7683} {"train_loss": -27.94736425560641, "global_step": 637771, "epoch": 7683, "val_loss": 6649244.0} {"train_loss": -26.501855850219727, "global_step": 637772, "epoch": 7684} {"train_loss": -26.68010902404785, "global_step": 637773, "epoch": 7684} {"train_loss": -27.370996475219727, "global_step": 637774, "epoch": 7684} {"train_loss": -26.518707275390625, "global_step": 637775, "epoch": 7684} {"train_loss": -27.652679443359375, "global_step": 637776, "epoch": 7684} {"train_loss": -26.719593048095703, "global_step": 637777, "epoch": 7684} {"train_loss": -27.59673500061035, "global_step": 637778, "epoch": 7684} {"train_loss": -27.313095092773438, "global_step": 637779, "epoch": 7684} {"train_loss": -27.84400749206543, "global_step": 637780, "epoch": 7684} {"train_loss": -27.496286392211914, "global_step": 637781, "epoch": 7684} {"train_loss": -27.881317138671875, "global_step": 637782, "epoch": 7684} {"train_loss": -27.651138305664062, "global_step": 637783, "epoch": 7684} {"train_loss": -27.378437042236328, "global_step": 637784, "epoch": 7684} {"train_loss": -27.96229362487793, "global_step": 637785, "epoch": 7684} {"train_loss": -27.480499267578125, "global_step": 637786, "epoch": 7684} {"train_loss": -27.647790908813477, "global_step": 637787, "epoch": 7684} {"train_loss": -27.778608322143555, "global_step": 637788, "epoch": 7684} {"train_loss": -27.843982696533203, "global_step": 637789, "epoch": 7684} {"train_loss": -27.994495391845703, "global_step": 637790, "epoch": 7684} {"train_loss": -27.400238037109375, "global_step": 637791, "epoch": 7684} {"train_loss": -28.12396812438965, "global_step": 637792, "epoch": 7684} {"train_loss": -27.729278564453125, "global_step": 637793, "epoch": 7684} {"train_loss": -28.040725708007812, "global_step": 637794, "epoch": 7684} {"train_loss": -28.084802627563477, "global_step": 637795, "epoch": 7684} {"train_loss": -28.070764541625977, "global_step": 637796, "epoch": 7684} {"train_loss": -28.190954208374023, "global_step": 637797, "epoch": 7684} {"train_loss": -27.958524703979492, "global_step": 637798, "epoch": 7684} {"train_loss": -27.988046646118164, "global_step": 637799, "epoch": 7684} {"train_loss": -28.055927276611328, "global_step": 637800, "epoch": 7684} {"train_loss": -28.254316329956055, "global_step": 637801, "epoch": 7684} {"train_loss": -28.2785701751709, "global_step": 637802, "epoch": 7684} {"train_loss": -27.870935440063477, "global_step": 637803, "epoch": 7684} {"train_loss": -27.9935245513916, "global_step": 637804, "epoch": 7684} {"train_loss": -28.224206924438477, "global_step": 637805, "epoch": 7684} {"train_loss": -27.97047233581543, "global_step": 637806, "epoch": 7684} {"train_loss": -28.057098388671875, "global_step": 637807, "epoch": 7684} {"train_loss": -28.313764572143555, "global_step": 637808, "epoch": 7684} {"train_loss": -28.180557250976562, "global_step": 637809, "epoch": 7684} {"train_loss": -28.565372467041016, "global_step": 637810, "epoch": 7684} {"train_loss": -28.38490867614746, "global_step": 637811, "epoch": 7684} {"train_loss": -28.507099151611328, "global_step": 637812, "epoch": 7684} {"train_loss": -28.255802154541016, "global_step": 637813, "epoch": 7684} {"train_loss": -28.128137588500977, "global_step": 637814, "epoch": 7684} {"train_loss": -28.588565826416016, "global_step": 637815, "epoch": 7684} {"train_loss": -28.153583526611328, "global_step": 637816, "epoch": 7684} {"train_loss": -28.52430534362793, "global_step": 637817, "epoch": 7684} {"train_loss": -28.13916015625, "global_step": 637818, "epoch": 7684} {"train_loss": -28.4490909576416, "global_step": 637819, "epoch": 7684} {"train_loss": -28.20806884765625, "global_step": 637820, "epoch": 7684} {"train_loss": -28.38178062438965, "global_step": 637821, "epoch": 7684} {"train_loss": -28.477975845336914, "global_step": 637822, "epoch": 7684} {"train_loss": -28.1683406829834, "global_step": 637823, "epoch": 7684} {"train_loss": -28.186176300048828, "global_step": 637824, "epoch": 7684} {"train_loss": -28.257715225219727, "global_step": 637825, "epoch": 7684} {"train_loss": -28.121496200561523, "global_step": 637826, "epoch": 7684} {"train_loss": -28.48822593688965, "global_step": 637827, "epoch": 7684} {"train_loss": -28.451391220092773, "global_step": 637828, "epoch": 7684} {"train_loss": -28.5477237701416, "global_step": 637829, "epoch": 7684} {"train_loss": -28.238569259643555, "global_step": 637830, "epoch": 7684} {"train_loss": -28.113264083862305, "global_step": 637831, "epoch": 7684} {"train_loss": -28.1247501373291, "global_step": 637832, "epoch": 7684} {"train_loss": -28.000417709350586, "global_step": 637833, "epoch": 7684} {"train_loss": -28.279630661010742, "global_step": 637834, "epoch": 7684} {"train_loss": -28.59913444519043, "global_step": 637835, "epoch": 7684} {"train_loss": -28.7831974029541, "global_step": 637836, "epoch": 7684} {"train_loss": -28.1234188079834, "global_step": 637837, "epoch": 7684} {"train_loss": -28.367115020751953, "global_step": 637838, "epoch": 7684} {"train_loss": -28.366540908813477, "global_step": 637839, "epoch": 7684} {"train_loss": -28.193592071533203, "global_step": 637840, "epoch": 7684} {"train_loss": -27.885639190673828, "global_step": 637841, "epoch": 7684} {"train_loss": -28.25847816467285, "global_step": 637842, "epoch": 7684} {"train_loss": -28.562719345092773, "global_step": 637843, "epoch": 7684} {"train_loss": -28.465972900390625, "global_step": 637844, "epoch": 7684} {"train_loss": -28.3599796295166, "global_step": 637845, "epoch": 7684} {"train_loss": -28.05018424987793, "global_step": 637846, "epoch": 7684} {"train_loss": -28.116281509399414, "global_step": 637847, "epoch": 7684} {"train_loss": -28.5970401763916, "global_step": 637848, "epoch": 7684} {"train_loss": -27.80097770690918, "global_step": 637849, "epoch": 7684} {"train_loss": -27.9296875, "global_step": 637850, "epoch": 7684} {"train_loss": -28.33148765563965, "global_step": 637851, "epoch": 7684} {"train_loss": -27.756494522094727, "global_step": 637852, "epoch": 7684} {"train_loss": -28.005218505859375, "global_step": 637853, "epoch": 7684} {"train_loss": -28.033568738454797, "global_step": 637854, "epoch": 7684, "val_loss": 6601112.5} {"train_loss": -25.064395904541016, "global_step": 637855, "epoch": 7685} {"train_loss": -24.090965270996094, "global_step": 637856, "epoch": 7685} {"train_loss": -26.319128036499023, "global_step": 637857, "epoch": 7685} {"train_loss": -26.65311622619629, "global_step": 637858, "epoch": 7685} {"train_loss": -25.853818893432617, "global_step": 637859, "epoch": 7685} {"train_loss": -26.44524574279785, "global_step": 637860, "epoch": 7685} {"train_loss": -27.038776397705078, "global_step": 637861, "epoch": 7685} {"train_loss": -26.30433464050293, "global_step": 637862, "epoch": 7685} {"train_loss": -26.694990158081055, "global_step": 637863, "epoch": 7685} {"train_loss": -27.046796798706055, "global_step": 637864, "epoch": 7685} {"train_loss": -27.04340934753418, "global_step": 637865, "epoch": 7685} {"train_loss": -27.20685386657715, "global_step": 637866, "epoch": 7685} {"train_loss": -26.948902130126953, "global_step": 637867, "epoch": 7685} {"train_loss": -26.553802490234375, "global_step": 637868, "epoch": 7685} {"train_loss": -27.02481460571289, "global_step": 637869, "epoch": 7685} {"train_loss": -26.585372924804688, "global_step": 637870, "epoch": 7685} {"train_loss": -27.155237197875977, "global_step": 637871, "epoch": 7685} {"train_loss": -27.013269424438477, "global_step": 637872, "epoch": 7685} {"train_loss": -27.520776748657227, "global_step": 637873, "epoch": 7685} {"train_loss": -27.326828002929688, "global_step": 637874, "epoch": 7685} {"train_loss": -27.45231056213379, "global_step": 637875, "epoch": 7685} {"train_loss": -27.4189510345459, "global_step": 637876, "epoch": 7685} {"train_loss": -27.45270347595215, "global_step": 637877, "epoch": 7685} {"train_loss": -27.441085815429688, "global_step": 637878, "epoch": 7685} {"train_loss": -27.78794288635254, "global_step": 637879, "epoch": 7685} {"train_loss": -27.693387985229492, "global_step": 637880, "epoch": 7685} {"train_loss": -27.713415145874023, "global_step": 637881, "epoch": 7685} {"train_loss": -27.503629684448242, "global_step": 637882, "epoch": 7685} {"train_loss": -27.65189552307129, "global_step": 637883, "epoch": 7685} {"train_loss": -28.20832633972168, "global_step": 637884, "epoch": 7685} {"train_loss": -27.625341415405273, "global_step": 637885, "epoch": 7685} {"train_loss": -27.51337242126465, "global_step": 637886, "epoch": 7685} {"train_loss": -28.047576904296875, "global_step": 637887, "epoch": 7685} {"train_loss": -27.743032455444336, "global_step": 637888, "epoch": 7685} {"train_loss": -27.96307945251465, "global_step": 637889, "epoch": 7685} {"train_loss": -28.09087562561035, "global_step": 637890, "epoch": 7685} {"train_loss": -27.842199325561523, "global_step": 637891, "epoch": 7685} {"train_loss": -28.039508819580078, "global_step": 637892, "epoch": 7685} {"train_loss": -27.955224990844727, "global_step": 637893, "epoch": 7685} {"train_loss": -28.218551635742188, "global_step": 637894, "epoch": 7685} {"train_loss": -27.86528968811035, "global_step": 637895, "epoch": 7685} {"train_loss": -28.00263023376465, "global_step": 637896, "epoch": 7685} {"train_loss": -27.921356201171875, "global_step": 637897, "epoch": 7685} {"train_loss": -28.33024024963379, "global_step": 637898, "epoch": 7685} {"train_loss": -28.305639266967773, "global_step": 637899, "epoch": 7685} {"train_loss": -27.894397735595703, "global_step": 637900, "epoch": 7685} {"train_loss": -27.936716079711914, "global_step": 637901, "epoch": 7685} {"train_loss": -27.9818115234375, "global_step": 637902, "epoch": 7685} {"train_loss": -28.0155029296875, "global_step": 637903, "epoch": 7685} {"train_loss": -28.126129150390625, "global_step": 637904, "epoch": 7685} {"train_loss": -28.263355255126953, "global_step": 637905, "epoch": 7685} {"train_loss": -28.335330963134766, "global_step": 637906, "epoch": 7685} {"train_loss": -27.830829620361328, "global_step": 637907, "epoch": 7685} {"train_loss": -28.262174606323242, "global_step": 637908, "epoch": 7685} {"train_loss": -28.504535675048828, "global_step": 637909, "epoch": 7685} {"train_loss": -28.064685821533203, "global_step": 637910, "epoch": 7685} {"train_loss": -28.787343978881836, "global_step": 637911, "epoch": 7685} {"train_loss": -28.424238204956055, "global_step": 637912, "epoch": 7685} {"train_loss": -28.41719627380371, "global_step": 637913, "epoch": 7685} {"train_loss": -28.59364128112793, "global_step": 637914, "epoch": 7685} {"train_loss": -28.604080200195312, "global_step": 637915, "epoch": 7685} {"train_loss": -28.432310104370117, "global_step": 637916, "epoch": 7685} {"train_loss": -28.29535484313965, "global_step": 637917, "epoch": 7685} {"train_loss": -28.42818260192871, "global_step": 637918, "epoch": 7685} {"train_loss": -28.461593627929688, "global_step": 637919, "epoch": 7685} {"train_loss": -28.114667892456055, "global_step": 637920, "epoch": 7685} {"train_loss": -28.680572509765625, "global_step": 637921, "epoch": 7685} {"train_loss": -28.290424346923828, "global_step": 637922, "epoch": 7685} {"train_loss": -28.83807373046875, "global_step": 637923, "epoch": 7685} {"train_loss": -28.248706817626953, "global_step": 637924, "epoch": 7685} {"train_loss": -27.94386100769043, "global_step": 637925, "epoch": 7685} {"train_loss": -28.45670509338379, "global_step": 637926, "epoch": 7685} {"train_loss": -28.560089111328125, "global_step": 637927, "epoch": 7685} {"train_loss": -28.21088981628418, "global_step": 637928, "epoch": 7685} {"train_loss": -28.430795669555664, "global_step": 637929, "epoch": 7685} {"train_loss": -28.444883346557617, "global_step": 637930, "epoch": 7685} {"train_loss": -28.14764404296875, "global_step": 637931, "epoch": 7685} {"train_loss": -28.678674697875977, "global_step": 637932, "epoch": 7685} {"train_loss": -28.520910263061523, "global_step": 637933, "epoch": 7685} {"train_loss": -28.637426376342773, "global_step": 637934, "epoch": 7685} {"train_loss": -28.331958770751953, "global_step": 637935, "epoch": 7685} {"train_loss": -28.46150779724121, "global_step": 637936, "epoch": 7685} {"train_loss": -27.751750624323467, "global_step": 637937, "epoch": 7685, "val_loss": 6649561.0} {"train_loss": -28.190622329711914, "global_step": 637938, "epoch": 7686} {"train_loss": -28.057315826416016, "global_step": 637939, "epoch": 7686} {"train_loss": -28.078821182250977, "global_step": 637940, "epoch": 7686} {"train_loss": -27.123340606689453, "global_step": 637941, "epoch": 7686} {"train_loss": -27.748334884643555, "global_step": 637942, "epoch": 7686} {"train_loss": -27.3356876373291, "global_step": 637943, "epoch": 7686} {"train_loss": -27.473861694335938, "global_step": 637944, "epoch": 7686} {"train_loss": -26.7582950592041, "global_step": 637945, "epoch": 7686} {"train_loss": -27.1018123626709, "global_step": 637946, "epoch": 7686} {"train_loss": -27.767105102539062, "global_step": 637947, "epoch": 7686} {"train_loss": -26.953847885131836, "global_step": 637948, "epoch": 7686} {"train_loss": -27.46564292907715, "global_step": 637949, "epoch": 7686} {"train_loss": -28.1970157623291, "global_step": 637950, "epoch": 7686} {"train_loss": -27.065465927124023, "global_step": 637951, "epoch": 7686} {"train_loss": -27.786304473876953, "global_step": 637952, "epoch": 7686} {"train_loss": -27.5084228515625, "global_step": 637953, "epoch": 7686} {"train_loss": -27.913671493530273, "global_step": 637954, "epoch": 7686} {"train_loss": -27.781402587890625, "global_step": 637955, "epoch": 7686} {"train_loss": -28.289838790893555, "global_step": 637956, "epoch": 7686} {"train_loss": -27.68130874633789, "global_step": 637957, "epoch": 7686} {"train_loss": -27.963184356689453, "global_step": 637958, "epoch": 7686} {"train_loss": -28.115604400634766, "global_step": 637959, "epoch": 7686} {"train_loss": -28.281782150268555, "global_step": 637960, "epoch": 7686} {"train_loss": -28.310749053955078, "global_step": 637961, "epoch": 7686} {"train_loss": -27.926733016967773, "global_step": 637962, "epoch": 7686} {"train_loss": -28.063751220703125, "global_step": 637963, "epoch": 7686} {"train_loss": -27.826831817626953, "global_step": 637964, "epoch": 7686} {"train_loss": -28.11378288269043, "global_step": 637965, "epoch": 7686} {"train_loss": -28.04279899597168, "global_step": 637966, "epoch": 7686} {"train_loss": -28.16047477722168, "global_step": 637967, "epoch": 7686} {"train_loss": -28.400089263916016, "global_step": 637968, "epoch": 7686} {"train_loss": -28.065113067626953, "global_step": 637969, "epoch": 7686} {"train_loss": -28.061803817749023, "global_step": 637970, "epoch": 7686} {"train_loss": -27.845144271850586, "global_step": 637971, "epoch": 7686} {"train_loss": -28.476049423217773, "global_step": 637972, "epoch": 7686} {"train_loss": -27.879901885986328, "global_step": 637973, "epoch": 7686} {"train_loss": -28.13372230529785, "global_step": 637974, "epoch": 7686} {"train_loss": -28.029977798461914, "global_step": 637975, "epoch": 7686} {"train_loss": -28.352514266967773, "global_step": 637976, "epoch": 7686} {"train_loss": -28.185667037963867, "global_step": 637977, "epoch": 7686} {"train_loss": -28.586206436157227, "global_step": 637978, "epoch": 7686} {"train_loss": -28.29945182800293, "global_step": 637979, "epoch": 7686} {"train_loss": -28.2304630279541, "global_step": 637980, "epoch": 7686} {"train_loss": -28.174997329711914, "global_step": 637981, "epoch": 7686} {"train_loss": -28.309356689453125, "global_step": 637982, "epoch": 7686} {"train_loss": -28.27179527282715, "global_step": 637983, "epoch": 7686} {"train_loss": -27.93714714050293, "global_step": 637984, "epoch": 7686} {"train_loss": -28.461278915405273, "global_step": 637985, "epoch": 7686} {"train_loss": -28.174131393432617, "global_step": 637986, "epoch": 7686} {"train_loss": -28.37530517578125, "global_step": 637987, "epoch": 7686} {"train_loss": -28.56971549987793, "global_step": 637988, "epoch": 7686} {"train_loss": -28.207181930541992, "global_step": 637989, "epoch": 7686} {"train_loss": -28.661584854125977, "global_step": 637990, "epoch": 7686} {"train_loss": -28.3891544342041, "global_step": 637991, "epoch": 7686} {"train_loss": -28.224884033203125, "global_step": 637992, "epoch": 7686} {"train_loss": -28.461111068725586, "global_step": 637993, "epoch": 7686} {"train_loss": -28.53268814086914, "global_step": 637994, "epoch": 7686} {"train_loss": -28.405485153198242, "global_step": 637995, "epoch": 7686} {"train_loss": -28.629276275634766, "global_step": 637996, "epoch": 7686} {"train_loss": -28.59766960144043, "global_step": 637997, "epoch": 7686} {"train_loss": -28.303607940673828, "global_step": 637998, "epoch": 7686} {"train_loss": -28.632726669311523, "global_step": 637999, "epoch": 7686} {"train_loss": -28.239622116088867, "global_step": 638000, "epoch": 7686} {"train_loss": -28.571802139282227, "global_step": 638001, "epoch": 7686} {"train_loss": -28.211950302124023, "global_step": 638002, "epoch": 7686} {"train_loss": -28.530017852783203, "global_step": 638003, "epoch": 7686} {"train_loss": -28.652820587158203, "global_step": 638004, "epoch": 7686} {"train_loss": -28.272083282470703, "global_step": 638005, "epoch": 7686} {"train_loss": -28.56306266784668, "global_step": 638006, "epoch": 7686} {"train_loss": -28.60869789123535, "global_step": 638007, "epoch": 7686} {"train_loss": -28.3563232421875, "global_step": 638008, "epoch": 7686} {"train_loss": -28.884780883789062, "global_step": 638009, "epoch": 7686} {"train_loss": -28.219022750854492, "global_step": 638010, "epoch": 7686} {"train_loss": -27.893081665039062, "global_step": 638011, "epoch": 7686} {"train_loss": -27.961374282836914, "global_step": 638012, "epoch": 7686} {"train_loss": -28.177764892578125, "global_step": 638013, "epoch": 7686} {"train_loss": -28.359115600585938, "global_step": 638014, "epoch": 7686} {"train_loss": -28.60939598083496, "global_step": 638015, "epoch": 7686} {"train_loss": -28.617650985717773, "global_step": 638016, "epoch": 7686} {"train_loss": -28.01138687133789, "global_step": 638017, "epoch": 7686} {"train_loss": -28.602340698242188, "global_step": 638018, "epoch": 7686} {"train_loss": -28.55047607421875, "global_step": 638019, "epoch": 7686} {"train_loss": -28.127954781773578, "global_step": 638020, "epoch": 7686, "val_loss": 6728218.0} {"train_loss": -26.357145309448242, "global_step": 638021, "epoch": 7687} {"train_loss": -24.691314697265625, "global_step": 638022, "epoch": 7687} {"train_loss": -26.8797607421875, "global_step": 638023, "epoch": 7687} {"train_loss": -26.314071655273438, "global_step": 638024, "epoch": 7687} {"train_loss": -26.109329223632812, "global_step": 638025, "epoch": 7687} {"train_loss": -27.155231475830078, "global_step": 638026, "epoch": 7687} {"train_loss": -26.308319091796875, "global_step": 638027, "epoch": 7687} {"train_loss": -27.129459381103516, "global_step": 638028, "epoch": 7687} {"train_loss": -26.9689884185791, "global_step": 638029, "epoch": 7687} {"train_loss": -27.069787979125977, "global_step": 638030, "epoch": 7687} {"train_loss": -27.24488639831543, "global_step": 638031, "epoch": 7687} {"train_loss": -27.053129196166992, "global_step": 638032, "epoch": 7687} {"train_loss": -27.5461483001709, "global_step": 638033, "epoch": 7687} {"train_loss": -27.41715431213379, "global_step": 638034, "epoch": 7687} {"train_loss": -27.02302360534668, "global_step": 638035, "epoch": 7687} {"train_loss": -27.763870239257812, "global_step": 638036, "epoch": 7687} {"train_loss": -27.360742568969727, "global_step": 638037, "epoch": 7687} {"train_loss": -27.92356300354004, "global_step": 638038, "epoch": 7687} {"train_loss": -27.547399520874023, "global_step": 638039, "epoch": 7687} {"train_loss": -27.90497398376465, "global_step": 638040, "epoch": 7687} {"train_loss": -28.343420028686523, "global_step": 638041, "epoch": 7687} {"train_loss": -27.693113327026367, "global_step": 638042, "epoch": 7687} {"train_loss": -27.645715713500977, "global_step": 638043, "epoch": 7687} {"train_loss": -27.667011260986328, "global_step": 638044, "epoch": 7687} {"train_loss": -27.565595626831055, "global_step": 638045, "epoch": 7687} {"train_loss": -28.06671714782715, "global_step": 638046, "epoch": 7687} {"train_loss": -28.03632164001465, "global_step": 638047, "epoch": 7687} {"train_loss": -28.229324340820312, "global_step": 638048, "epoch": 7687} {"train_loss": -28.095266342163086, "global_step": 638049, "epoch": 7687} {"train_loss": -27.848011016845703, "global_step": 638050, "epoch": 7687} {"train_loss": -27.85658073425293, "global_step": 638051, "epoch": 7687} {"train_loss": -28.03792381286621, "global_step": 638052, "epoch": 7687} {"train_loss": -28.183923721313477, "global_step": 638053, "epoch": 7687} {"train_loss": -28.183216094970703, "global_step": 638054, "epoch": 7687} {"train_loss": -27.904443740844727, "global_step": 638055, "epoch": 7687} {"train_loss": -28.1424617767334, "global_step": 638056, "epoch": 7687} {"train_loss": -28.1894474029541, "global_step": 638057, "epoch": 7687} {"train_loss": -28.075946807861328, "global_step": 638058, "epoch": 7687} {"train_loss": -27.9171199798584, "global_step": 638059, "epoch": 7687} {"train_loss": -28.129322052001953, "global_step": 638060, "epoch": 7687} {"train_loss": -28.214025497436523, "global_step": 638061, "epoch": 7687} {"train_loss": -28.22248649597168, "global_step": 638062, "epoch": 7687} {"train_loss": -28.322092056274414, "global_step": 638063, "epoch": 7687} {"train_loss": -28.62737464904785, "global_step": 638064, "epoch": 7687} {"train_loss": -28.271163940429688, "global_step": 638065, "epoch": 7687} {"train_loss": -28.542938232421875, "global_step": 638066, "epoch": 7687} {"train_loss": -28.23127555847168, "global_step": 638067, "epoch": 7687} {"train_loss": -28.012189865112305, "global_step": 638068, "epoch": 7687} {"train_loss": -27.87407875061035, "global_step": 638069, "epoch": 7687} {"train_loss": -28.674274444580078, "global_step": 638070, "epoch": 7687} {"train_loss": -28.673538208007812, "global_step": 638071, "epoch": 7687} {"train_loss": -28.397293090820312, "global_step": 638072, "epoch": 7687} {"train_loss": -28.71808433532715, "global_step": 638073, "epoch": 7687} {"train_loss": -28.204776763916016, "global_step": 638074, "epoch": 7687} {"train_loss": -28.507246017456055, "global_step": 638075, "epoch": 7687} {"train_loss": -28.547815322875977, "global_step": 638076, "epoch": 7687} {"train_loss": -28.6762638092041, "global_step": 638077, "epoch": 7687} {"train_loss": -28.272491455078125, "global_step": 638078, "epoch": 7687} {"train_loss": -28.37456703186035, "global_step": 638079, "epoch": 7687} {"train_loss": -28.75330924987793, "global_step": 638080, "epoch": 7687} {"train_loss": -28.814672470092773, "global_step": 638081, "epoch": 7687} {"train_loss": -28.438709259033203, "global_step": 638082, "epoch": 7687} {"train_loss": -28.105539321899414, "global_step": 638083, "epoch": 7687} {"train_loss": -28.268463134765625, "global_step": 638084, "epoch": 7687} {"train_loss": -28.638952255249023, "global_step": 638085, "epoch": 7687} {"train_loss": -28.871366500854492, "global_step": 638086, "epoch": 7687} {"train_loss": -28.480365753173828, "global_step": 638087, "epoch": 7687} {"train_loss": -28.5069522857666, "global_step": 638088, "epoch": 7687} {"train_loss": -28.647113800048828, "global_step": 638089, "epoch": 7687} {"train_loss": -28.37859535217285, "global_step": 638090, "epoch": 7687} {"train_loss": -28.514453887939453, "global_step": 638091, "epoch": 7687} {"train_loss": -28.9327392578125, "global_step": 638092, "epoch": 7687} {"train_loss": -28.366750717163086, "global_step": 638093, "epoch": 7687} {"train_loss": -28.560382843017578, "global_step": 638094, "epoch": 7687} {"train_loss": -28.706592559814453, "global_step": 638095, "epoch": 7687} {"train_loss": -28.705596923828125, "global_step": 638096, "epoch": 7687} {"train_loss": -28.178983688354492, "global_step": 638097, "epoch": 7687} {"train_loss": -28.324893951416016, "global_step": 638098, "epoch": 7687} {"train_loss": -28.009592056274414, "global_step": 638099, "epoch": 7687} {"train_loss": -28.270328521728516, "global_step": 638100, "epoch": 7687} {"train_loss": -28.005970001220703, "global_step": 638101, "epoch": 7687} {"train_loss": -27.598220825195312, "global_step": 638102, "epoch": 7687} {"train_loss": -27.960681179919874, "global_step": 638103, "epoch": 7687, "val_loss": 6615360.0} {"train_loss": -27.301626205444336, "global_step": 638104, "epoch": 7688} {"train_loss": -27.558490753173828, "global_step": 638105, "epoch": 7688} {"train_loss": -27.618444442749023, "global_step": 638106, "epoch": 7688} {"train_loss": -26.777942657470703, "global_step": 638107, "epoch": 7688} {"train_loss": -26.86495018005371, "global_step": 638108, "epoch": 7688} {"train_loss": -27.843189239501953, "global_step": 638109, "epoch": 7688} {"train_loss": -27.15656852722168, "global_step": 638110, "epoch": 7688} {"train_loss": -27.48187255859375, "global_step": 638111, "epoch": 7688} {"train_loss": -27.561237335205078, "global_step": 638112, "epoch": 7688} {"train_loss": -27.457319259643555, "global_step": 638113, "epoch": 7688} {"train_loss": -27.399307250976562, "global_step": 638114, "epoch": 7688} {"train_loss": -27.066558837890625, "global_step": 638115, "epoch": 7688} {"train_loss": -27.730762481689453, "global_step": 638116, "epoch": 7688} {"train_loss": -27.810461044311523, "global_step": 638117, "epoch": 7688} {"train_loss": -27.599477767944336, "global_step": 638118, "epoch": 7688} {"train_loss": -27.276762008666992, "global_step": 638119, "epoch": 7688} {"train_loss": -27.911657333374023, "global_step": 638120, "epoch": 7688} {"train_loss": -28.3535099029541, "global_step": 638121, "epoch": 7688} {"train_loss": -27.863378524780273, "global_step": 638122, "epoch": 7688} {"train_loss": -28.050336837768555, "global_step": 638123, "epoch": 7688} {"train_loss": -27.578033447265625, "global_step": 638124, "epoch": 7688} {"train_loss": -27.974058151245117, "global_step": 638125, "epoch": 7688} {"train_loss": -28.02277183532715, "global_step": 638126, "epoch": 7688} {"train_loss": -28.15276527404785, "global_step": 638127, "epoch": 7688} {"train_loss": -27.86087989807129, "global_step": 638128, "epoch": 7688} {"train_loss": -28.13605308532715, "global_step": 638129, "epoch": 7688} {"train_loss": -28.256513595581055, "global_step": 638130, "epoch": 7688} {"train_loss": -28.071643829345703, "global_step": 638131, "epoch": 7688} {"train_loss": -28.126876831054688, "global_step": 638132, "epoch": 7688} {"train_loss": -28.0452823638916, "global_step": 638133, "epoch": 7688} {"train_loss": -28.12043571472168, "global_step": 638134, "epoch": 7688} {"train_loss": -27.94970703125, "global_step": 638135, "epoch": 7688} {"train_loss": -27.818252563476562, "global_step": 638136, "epoch": 7688} {"train_loss": -28.146793365478516, "global_step": 638137, "epoch": 7688} {"train_loss": -28.084177017211914, "global_step": 638138, "epoch": 7688} {"train_loss": -27.842344284057617, "global_step": 638139, "epoch": 7688} {"train_loss": -28.347702026367188, "global_step": 638140, "epoch": 7688} {"train_loss": -28.032636642456055, "global_step": 638141, "epoch": 7688} {"train_loss": -28.034931182861328, "global_step": 638142, "epoch": 7688} {"train_loss": -28.315673828125, "global_step": 638143, "epoch": 7688} {"train_loss": -28.273183822631836, "global_step": 638144, "epoch": 7688} {"train_loss": -28.343149185180664, "global_step": 638145, "epoch": 7688} {"train_loss": -28.300647735595703, "global_step": 638146, "epoch": 7688} {"train_loss": -28.327314376831055, "global_step": 638147, "epoch": 7688} {"train_loss": -28.406774520874023, "global_step": 638148, "epoch": 7688} {"train_loss": -28.260541915893555, "global_step": 638149, "epoch": 7688} {"train_loss": -28.04538345336914, "global_step": 638150, "epoch": 7688} {"train_loss": -28.320526123046875, "global_step": 638151, "epoch": 7688} {"train_loss": -28.3532772064209, "global_step": 638152, "epoch": 7688} {"train_loss": -28.16355323791504, "global_step": 638153, "epoch": 7688} {"train_loss": -28.35468101501465, "global_step": 638154, "epoch": 7688} {"train_loss": -28.584003448486328, "global_step": 638155, "epoch": 7688} {"train_loss": -28.129348754882812, "global_step": 638156, "epoch": 7688} {"train_loss": -28.440160751342773, "global_step": 638157, "epoch": 7688} {"train_loss": -28.532470703125, "global_step": 638158, "epoch": 7688} {"train_loss": -28.261991500854492, "global_step": 638159, "epoch": 7688} {"train_loss": -28.303342819213867, "global_step": 638160, "epoch": 7688} {"train_loss": -28.162220001220703, "global_step": 638161, "epoch": 7688} {"train_loss": -28.300342559814453, "global_step": 638162, "epoch": 7688} {"train_loss": -28.499805450439453, "global_step": 638163, "epoch": 7688} {"train_loss": -28.745319366455078, "global_step": 638164, "epoch": 7688} {"train_loss": -28.40618896484375, "global_step": 638165, "epoch": 7688} {"train_loss": -28.299793243408203, "global_step": 638166, "epoch": 7688} {"train_loss": -28.44522476196289, "global_step": 638167, "epoch": 7688} {"train_loss": -28.243406295776367, "global_step": 638168, "epoch": 7688} {"train_loss": -28.604700088500977, "global_step": 638169, "epoch": 7688} {"train_loss": -28.3952693939209, "global_step": 638170, "epoch": 7688} {"train_loss": -28.668628692626953, "global_step": 638171, "epoch": 7688} {"train_loss": -28.1871395111084, "global_step": 638172, "epoch": 7688} {"train_loss": -28.146652221679688, "global_step": 638173, "epoch": 7688} {"train_loss": -28.39877700805664, "global_step": 638174, "epoch": 7688} {"train_loss": -28.570261001586914, "global_step": 638175, "epoch": 7688} {"train_loss": -28.40630531311035, "global_step": 638176, "epoch": 7688} {"train_loss": -28.298221588134766, "global_step": 638177, "epoch": 7688} {"train_loss": -27.96539878845215, "global_step": 638178, "epoch": 7688} {"train_loss": -27.973974227905273, "global_step": 638179, "epoch": 7688} {"train_loss": -28.496417999267578, "global_step": 638180, "epoch": 7688} {"train_loss": -27.92474365234375, "global_step": 638181, "epoch": 7688} {"train_loss": -27.587371826171875, "global_step": 638182, "epoch": 7688} {"train_loss": -27.295703887939453, "global_step": 638183, "epoch": 7688} {"train_loss": -27.386199951171875, "global_step": 638184, "epoch": 7688} {"train_loss": -27.604934692382812, "global_step": 638185, "epoch": 7688} {"train_loss": -28.0490229733019, "global_step": 638186, "epoch": 7688, "val_loss": 6668249.0} {"train_loss": -26.144561767578125, "global_step": 638187, "epoch": 7689} {"train_loss": -25.554372787475586, "global_step": 638188, "epoch": 7689} {"train_loss": -25.025476455688477, "global_step": 638189, "epoch": 7689} {"train_loss": -26.880041122436523, "global_step": 638190, "epoch": 7689} {"train_loss": -25.040313720703125, "global_step": 638191, "epoch": 7689} {"train_loss": -27.051172256469727, "global_step": 638192, "epoch": 7689} {"train_loss": -25.0154972076416, "global_step": 638193, "epoch": 7689} {"train_loss": -27.054004669189453, "global_step": 638194, "epoch": 7689} {"train_loss": -26.741031646728516, "global_step": 638195, "epoch": 7689} {"train_loss": -26.737060546875, "global_step": 638196, "epoch": 7689} {"train_loss": -26.7579288482666, "global_step": 638197, "epoch": 7689} {"train_loss": -27.23480796813965, "global_step": 638198, "epoch": 7689} {"train_loss": -26.476224899291992, "global_step": 638199, "epoch": 7689} {"train_loss": -27.067419052124023, "global_step": 638200, "epoch": 7689} {"train_loss": -26.98491859436035, "global_step": 638201, "epoch": 7689} {"train_loss": -26.762496948242188, "global_step": 638202, "epoch": 7689} {"train_loss": -27.31772232055664, "global_step": 638203, "epoch": 7689} {"train_loss": -26.918716430664062, "global_step": 638204, "epoch": 7689} {"train_loss": -27.72848892211914, "global_step": 638205, "epoch": 7689} {"train_loss": -27.602874755859375, "global_step": 638206, "epoch": 7689} {"train_loss": -27.413110733032227, "global_step": 638207, "epoch": 7689} {"train_loss": -27.57050132751465, "global_step": 638208, "epoch": 7689} {"train_loss": -27.44000816345215, "global_step": 638209, "epoch": 7689} {"train_loss": -27.396947860717773, "global_step": 638210, "epoch": 7689} {"train_loss": -27.61362075805664, "global_step": 638211, "epoch": 7689} {"train_loss": -27.44622802734375, "global_step": 638212, "epoch": 7689} {"train_loss": -27.8883113861084, "global_step": 638213, "epoch": 7689} {"train_loss": -27.46023941040039, "global_step": 638214, "epoch": 7689} {"train_loss": -27.570240020751953, "global_step": 638215, "epoch": 7689} {"train_loss": -27.479841232299805, "global_step": 638216, "epoch": 7689} {"train_loss": -27.788028717041016, "global_step": 638217, "epoch": 7689} {"train_loss": -27.759906768798828, "global_step": 638218, "epoch": 7689} {"train_loss": -27.92929458618164, "global_step": 638219, "epoch": 7689} {"train_loss": -27.679641723632812, "global_step": 638220, "epoch": 7689} {"train_loss": -27.87916374206543, "global_step": 638221, "epoch": 7689} {"train_loss": -27.98331069946289, "global_step": 638222, "epoch": 7689} {"train_loss": -27.96686363220215, "global_step": 638223, "epoch": 7689} {"train_loss": -28.225385665893555, "global_step": 638224, "epoch": 7689} {"train_loss": -28.389514923095703, "global_step": 638225, "epoch": 7689} {"train_loss": -28.038330078125, "global_step": 638226, "epoch": 7689} {"train_loss": -27.961933135986328, "global_step": 638227, "epoch": 7689} {"train_loss": -27.972110748291016, "global_step": 638228, "epoch": 7689} {"train_loss": -28.019983291625977, "global_step": 638229, "epoch": 7689} {"train_loss": -28.3575382232666, "global_step": 638230, "epoch": 7689} {"train_loss": -28.033788681030273, "global_step": 638231, "epoch": 7689} {"train_loss": -28.295246124267578, "global_step": 638232, "epoch": 7689} {"train_loss": -28.541296005249023, "global_step": 638233, "epoch": 7689} {"train_loss": -28.367340087890625, "global_step": 638234, "epoch": 7689} {"train_loss": -28.14759635925293, "global_step": 638235, "epoch": 7689} {"train_loss": -28.421955108642578, "global_step": 638236, "epoch": 7689} {"train_loss": -28.923664093017578, "global_step": 638237, "epoch": 7689} {"train_loss": -28.5787353515625, "global_step": 638238, "epoch": 7689} {"train_loss": -28.1223087310791, "global_step": 638239, "epoch": 7689} {"train_loss": -28.542327880859375, "global_step": 638240, "epoch": 7689} {"train_loss": -28.395978927612305, "global_step": 638241, "epoch": 7689} {"train_loss": -28.531888961791992, "global_step": 638242, "epoch": 7689} {"train_loss": -28.107666015625, "global_step": 638243, "epoch": 7689} {"train_loss": -28.459508895874023, "global_step": 638244, "epoch": 7689} {"train_loss": -27.96394920349121, "global_step": 638245, "epoch": 7689} {"train_loss": -28.64564323425293, "global_step": 638246, "epoch": 7689} {"train_loss": -28.637805938720703, "global_step": 638247, "epoch": 7689} {"train_loss": -28.13893699645996, "global_step": 638248, "epoch": 7689} {"train_loss": -28.650033950805664, "global_step": 638249, "epoch": 7689} {"train_loss": -28.29974937438965, "global_step": 638250, "epoch": 7689} {"train_loss": -28.525068283081055, "global_step": 638251, "epoch": 7689} {"train_loss": -28.38165283203125, "global_step": 638252, "epoch": 7689} {"train_loss": -28.427722930908203, "global_step": 638253, "epoch": 7689} {"train_loss": -28.38812255859375, "global_step": 638254, "epoch": 7689} {"train_loss": -28.048505783081055, "global_step": 638255, "epoch": 7689} {"train_loss": -28.307600021362305, "global_step": 638256, "epoch": 7689} {"train_loss": -28.25079345703125, "global_step": 638257, "epoch": 7689} {"train_loss": -28.307165145874023, "global_step": 638258, "epoch": 7689} {"train_loss": -28.1639461517334, "global_step": 638259, "epoch": 7689} {"train_loss": -28.037555694580078, "global_step": 638260, "epoch": 7689} {"train_loss": -28.2971134185791, "global_step": 638261, "epoch": 7689} {"train_loss": -28.24531364440918, "global_step": 638262, "epoch": 7689} {"train_loss": -28.328168869018555, "global_step": 638263, "epoch": 7689} {"train_loss": -27.886945724487305, "global_step": 638264, "epoch": 7689} {"train_loss": -28.468488693237305, "global_step": 638265, "epoch": 7689} {"train_loss": -28.35025405883789, "global_step": 638266, "epoch": 7689} {"train_loss": -28.415008544921875, "global_step": 638267, "epoch": 7689} {"train_loss": -28.12367057800293, "global_step": 638268, "epoch": 7689} {"train_loss": -27.759262590523225, "global_step": 638269, "epoch": 7689, "val_loss": 6695180.0} {"train_loss": -27.68173599243164, "global_step": 638270, "epoch": 7690} {"train_loss": -27.613264083862305, "global_step": 638271, "epoch": 7690} {"train_loss": -27.82865333557129, "global_step": 638272, "epoch": 7690} {"train_loss": -27.775482177734375, "global_step": 638273, "epoch": 7690} {"train_loss": -27.707197189331055, "global_step": 638274, "epoch": 7690} {"train_loss": -28.05802345275879, "global_step": 638275, "epoch": 7690} {"train_loss": -27.638891220092773, "global_step": 638276, "epoch": 7690} {"train_loss": -27.909528732299805, "global_step": 638277, "epoch": 7690} {"train_loss": -27.727188110351562, "global_step": 638278, "epoch": 7690} {"train_loss": -27.828535079956055, "global_step": 638279, "epoch": 7690} {"train_loss": -27.995960235595703, "global_step": 638280, "epoch": 7690} {"train_loss": -28.0584774017334, "global_step": 638281, "epoch": 7690} {"train_loss": -28.04628562927246, "global_step": 638282, "epoch": 7690} {"train_loss": -27.834369659423828, "global_step": 638283, "epoch": 7690} {"train_loss": -27.817214965820312, "global_step": 638284, "epoch": 7690} {"train_loss": -28.427515029907227, "global_step": 638285, "epoch": 7690} {"train_loss": -28.01692008972168, "global_step": 638286, "epoch": 7690} {"train_loss": -28.3215389251709, "global_step": 638287, "epoch": 7690} {"train_loss": -27.50485610961914, "global_step": 638288, "epoch": 7690} {"train_loss": -28.06671714782715, "global_step": 638289, "epoch": 7690} {"train_loss": -27.901721954345703, "global_step": 638290, "epoch": 7690} {"train_loss": -27.698949813842773, "global_step": 638291, "epoch": 7690} {"train_loss": -27.947315216064453, "global_step": 638292, "epoch": 7690} {"train_loss": -27.904760360717773, "global_step": 638293, "epoch": 7690} {"train_loss": -28.224119186401367, "global_step": 638294, "epoch": 7690} {"train_loss": -27.82150650024414, "global_step": 638295, "epoch": 7690} {"train_loss": -28.11101722717285, "global_step": 638296, "epoch": 7690} {"train_loss": -28.363025665283203, "global_step": 638297, "epoch": 7690} {"train_loss": -28.106979370117188, "global_step": 638298, "epoch": 7690} {"train_loss": -28.271564483642578, "global_step": 638299, "epoch": 7690} {"train_loss": -27.830387115478516, "global_step": 638300, "epoch": 7690} {"train_loss": -27.914386749267578, "global_step": 638301, "epoch": 7690} {"train_loss": -27.955768585205078, "global_step": 638302, "epoch": 7690} {"train_loss": -28.526777267456055, "global_step": 638303, "epoch": 7690} {"train_loss": -28.375152587890625, "global_step": 638304, "epoch": 7690} {"train_loss": -28.206207275390625, "global_step": 638305, "epoch": 7690} {"train_loss": -28.6385555267334, "global_step": 638306, "epoch": 7690} {"train_loss": -28.202579498291016, "global_step": 638307, "epoch": 7690} {"train_loss": -28.458911895751953, "global_step": 638308, "epoch": 7690} {"train_loss": -28.516651153564453, "global_step": 638309, "epoch": 7690} {"train_loss": -28.414203643798828, "global_step": 638310, "epoch": 7690} {"train_loss": -28.015430450439453, "global_step": 638311, "epoch": 7690} {"train_loss": -28.461780548095703, "global_step": 638312, "epoch": 7690} {"train_loss": -28.342666625976562, "global_step": 638313, "epoch": 7690} {"train_loss": -28.513315200805664, "global_step": 638314, "epoch": 7690} {"train_loss": -28.311569213867188, "global_step": 638315, "epoch": 7690} {"train_loss": -28.578571319580078, "global_step": 638316, "epoch": 7690} {"train_loss": -28.271284103393555, "global_step": 638317, "epoch": 7690} {"train_loss": -28.31985855102539, "global_step": 638318, "epoch": 7690} {"train_loss": -28.3301944732666, "global_step": 638319, "epoch": 7690} {"train_loss": -28.53242301940918, "global_step": 638320, "epoch": 7690} {"train_loss": -28.576696395874023, "global_step": 638321, "epoch": 7690} {"train_loss": -28.452178955078125, "global_step": 638322, "epoch": 7690} {"train_loss": -28.129613876342773, "global_step": 638323, "epoch": 7690} {"train_loss": -27.945056915283203, "global_step": 638324, "epoch": 7690} {"train_loss": -27.884069442749023, "global_step": 638325, "epoch": 7690} {"train_loss": -28.645841598510742, "global_step": 638326, "epoch": 7690} {"train_loss": -28.770191192626953, "global_step": 638327, "epoch": 7690} {"train_loss": -28.428421020507812, "global_step": 638328, "epoch": 7690} {"train_loss": -28.35738182067871, "global_step": 638329, "epoch": 7690} {"train_loss": -28.07012367248535, "global_step": 638330, "epoch": 7690} {"train_loss": -28.311254501342773, "global_step": 638331, "epoch": 7690} {"train_loss": -28.313724517822266, "global_step": 638332, "epoch": 7690} {"train_loss": -28.37167739868164, "global_step": 638333, "epoch": 7690} {"train_loss": -28.468204498291016, "global_step": 638334, "epoch": 7690} {"train_loss": -28.719837188720703, "global_step": 638335, "epoch": 7690} {"train_loss": -28.145221710205078, "global_step": 638336, "epoch": 7690} {"train_loss": -28.242353439331055, "global_step": 638337, "epoch": 7690} {"train_loss": -28.248865127563477, "global_step": 638338, "epoch": 7690} {"train_loss": -28.121051788330078, "global_step": 638339, "epoch": 7690} {"train_loss": -28.4564151763916, "global_step": 638340, "epoch": 7690} {"train_loss": -28.426122665405273, "global_step": 638341, "epoch": 7690} {"train_loss": -28.536853790283203, "global_step": 638342, "epoch": 7690} {"train_loss": -28.4337215423584, "global_step": 638343, "epoch": 7690} {"train_loss": -28.447086334228516, "global_step": 638344, "epoch": 7690} {"train_loss": -28.458127975463867, "global_step": 638345, "epoch": 7690} {"train_loss": -28.213804244995117, "global_step": 638346, "epoch": 7690} {"train_loss": -28.155736923217773, "global_step": 638347, "epoch": 7690} {"train_loss": -28.633380889892578, "global_step": 638348, "epoch": 7690} {"train_loss": -28.478199005126953, "global_step": 638349, "epoch": 7690} {"train_loss": -28.281021118164062, "global_step": 638350, "epoch": 7690} {"train_loss": -28.13258934020996, "global_step": 638351, "epoch": 7690} {"train_loss": -28.193747095314855, "global_step": 638352, "epoch": 7690, "val_loss": 6650790.0} {"train_loss": -28.193872451782227, "global_step": 638353, "epoch": 7691} {"train_loss": -27.250202178955078, "global_step": 638354, "epoch": 7691} {"train_loss": -27.740100860595703, "global_step": 638355, "epoch": 7691} {"train_loss": -27.949716567993164, "global_step": 638356, "epoch": 7691} {"train_loss": -27.804798126220703, "global_step": 638357, "epoch": 7691} {"train_loss": -27.748876571655273, "global_step": 638358, "epoch": 7691} {"train_loss": -27.8581600189209, "global_step": 638359, "epoch": 7691} {"train_loss": -28.099536895751953, "global_step": 638360, "epoch": 7691} {"train_loss": -28.222929000854492, "global_step": 638361, "epoch": 7691} {"train_loss": -27.69635009765625, "global_step": 638362, "epoch": 7691} {"train_loss": -28.051313400268555, "global_step": 638363, "epoch": 7691} {"train_loss": -27.65036392211914, "global_step": 638364, "epoch": 7691} {"train_loss": -28.106063842773438, "global_step": 638365, "epoch": 7691} {"train_loss": -27.63840103149414, "global_step": 638366, "epoch": 7691} {"train_loss": -28.08658790588379, "global_step": 638367, "epoch": 7691} {"train_loss": -28.27657127380371, "global_step": 638368, "epoch": 7691} {"train_loss": -27.96780776977539, "global_step": 638369, "epoch": 7691} {"train_loss": -28.342880249023438, "global_step": 638370, "epoch": 7691} {"train_loss": -27.90158462524414, "global_step": 638371, "epoch": 7691} {"train_loss": -28.149152755737305, "global_step": 638372, "epoch": 7691} {"train_loss": -28.214996337890625, "global_step": 638373, "epoch": 7691} {"train_loss": -28.4766845703125, "global_step": 638374, "epoch": 7691} {"train_loss": -27.830549240112305, "global_step": 638375, "epoch": 7691} {"train_loss": -27.94414710998535, "global_step": 638376, "epoch": 7691} {"train_loss": -28.216527938842773, "global_step": 638377, "epoch": 7691} {"train_loss": -28.27547264099121, "global_step": 638378, "epoch": 7691} {"train_loss": -28.135879516601562, "global_step": 638379, "epoch": 7691} {"train_loss": -28.04453468322754, "global_step": 638380, "epoch": 7691} {"train_loss": -28.08125114440918, "global_step": 638381, "epoch": 7691} {"train_loss": -28.23459815979004, "global_step": 638382, "epoch": 7691} {"train_loss": -28.426252365112305, "global_step": 638383, "epoch": 7691} {"train_loss": -28.322620391845703, "global_step": 638384, "epoch": 7691} {"train_loss": -28.08125114440918, "global_step": 638385, "epoch": 7691} {"train_loss": -28.029767990112305, "global_step": 638386, "epoch": 7691} {"train_loss": -28.360919952392578, "global_step": 638387, "epoch": 7691} {"train_loss": -28.005008697509766, "global_step": 638388, "epoch": 7691} {"train_loss": -27.979230880737305, "global_step": 638389, "epoch": 7691} {"train_loss": -28.3762264251709, "global_step": 638390, "epoch": 7691} {"train_loss": -28.35137939453125, "global_step": 638391, "epoch": 7691} {"train_loss": -28.404132843017578, "global_step": 638392, "epoch": 7691} {"train_loss": -28.302188873291016, "global_step": 638393, "epoch": 7691} {"train_loss": -28.010162353515625, "global_step": 638394, "epoch": 7691} {"train_loss": -28.457691192626953, "global_step": 638395, "epoch": 7691} {"train_loss": -28.4692440032959, "global_step": 638396, "epoch": 7691} {"train_loss": -28.257476806640625, "global_step": 638397, "epoch": 7691} {"train_loss": -28.391647338867188, "global_step": 638398, "epoch": 7691} {"train_loss": -28.280847549438477, "global_step": 638399, "epoch": 7691} {"train_loss": -28.32088279724121, "global_step": 638400, "epoch": 7691} {"train_loss": -28.49403953552246, "global_step": 638401, "epoch": 7691} {"train_loss": -28.680612564086914, "global_step": 638402, "epoch": 7691} {"train_loss": -28.412397384643555, "global_step": 638403, "epoch": 7691} {"train_loss": -28.27828025817871, "global_step": 638404, "epoch": 7691} {"train_loss": -28.331892013549805, "global_step": 638405, "epoch": 7691} {"train_loss": -28.52155876159668, "global_step": 638406, "epoch": 7691} {"train_loss": -28.15667724609375, "global_step": 638407, "epoch": 7691} {"train_loss": -28.457117080688477, "global_step": 638408, "epoch": 7691} {"train_loss": -28.646100997924805, "global_step": 638409, "epoch": 7691} {"train_loss": -28.31886100769043, "global_step": 638410, "epoch": 7691} {"train_loss": -28.595596313476562, "global_step": 638411, "epoch": 7691} {"train_loss": -28.11248779296875, "global_step": 638412, "epoch": 7691} {"train_loss": -27.59954833984375, "global_step": 638413, "epoch": 7691} {"train_loss": -27.535993576049805, "global_step": 638414, "epoch": 7691} {"train_loss": -26.975961685180664, "global_step": 638415, "epoch": 7691} {"train_loss": -25.455472946166992, "global_step": 638416, "epoch": 7691} {"train_loss": -26.17917251586914, "global_step": 638417, "epoch": 7691} {"train_loss": -28.41643714904785, "global_step": 638418, "epoch": 7691} {"train_loss": -26.494354248046875, "global_step": 638419, "epoch": 7691} {"train_loss": -27.099653244018555, "global_step": 638420, "epoch": 7691} {"train_loss": -27.810455322265625, "global_step": 638421, "epoch": 7691} {"train_loss": -27.890411376953125, "global_step": 638422, "epoch": 7691} {"train_loss": -27.720075607299805, "global_step": 638423, "epoch": 7691} {"train_loss": -27.891382217407227, "global_step": 638424, "epoch": 7691} {"train_loss": -27.373376846313477, "global_step": 638425, "epoch": 7691} {"train_loss": -27.772674560546875, "global_step": 638426, "epoch": 7691} {"train_loss": -27.77848243713379, "global_step": 638427, "epoch": 7691} {"train_loss": -28.206771850585938, "global_step": 638428, "epoch": 7691} {"train_loss": -27.394689559936523, "global_step": 638429, "epoch": 7691} {"train_loss": -28.145584106445312, "global_step": 638430, "epoch": 7691} {"train_loss": -27.77638053894043, "global_step": 638431, "epoch": 7691} {"train_loss": -28.40728759765625, "global_step": 638432, "epoch": 7691} {"train_loss": -28.10321044921875, "global_step": 638433, "epoch": 7691} {"train_loss": -28.457778930664062, "global_step": 638434, "epoch": 7691} {"train_loss": -28.020516728780354, "global_step": 638435, "epoch": 7691, "val_loss": 6681299.5} {"train_loss": -27.67376708984375, "global_step": 638436, "epoch": 7692} {"train_loss": -27.455713272094727, "global_step": 638437, "epoch": 7692} {"train_loss": -27.520904541015625, "global_step": 638438, "epoch": 7692} {"train_loss": -27.79994773864746, "global_step": 638439, "epoch": 7692} {"train_loss": -27.482553482055664, "global_step": 638440, "epoch": 7692} {"train_loss": -27.88416862487793, "global_step": 638441, "epoch": 7692} {"train_loss": -27.677648544311523, "global_step": 638442, "epoch": 7692} {"train_loss": -27.50286293029785, "global_step": 638443, "epoch": 7692} {"train_loss": -27.79277992248535, "global_step": 638444, "epoch": 7692} {"train_loss": -28.109012603759766, "global_step": 638445, "epoch": 7692} {"train_loss": -27.391687393188477, "global_step": 638446, "epoch": 7692} {"train_loss": -28.116971969604492, "global_step": 638447, "epoch": 7692} {"train_loss": -27.981201171875, "global_step": 638448, "epoch": 7692} {"train_loss": -27.873746871948242, "global_step": 638449, "epoch": 7692} {"train_loss": -27.850574493408203, "global_step": 638450, "epoch": 7692} {"train_loss": -27.91888999938965, "global_step": 638451, "epoch": 7692} {"train_loss": -27.618268966674805, "global_step": 638452, "epoch": 7692} {"train_loss": -28.03192710876465, "global_step": 638453, "epoch": 7692} {"train_loss": -27.96506690979004, "global_step": 638454, "epoch": 7692} {"train_loss": -27.752756118774414, "global_step": 638455, "epoch": 7692} {"train_loss": -28.011920928955078, "global_step": 638456, "epoch": 7692} {"train_loss": -28.21127700805664, "global_step": 638457, "epoch": 7692} {"train_loss": -28.322559356689453, "global_step": 638458, "epoch": 7692} {"train_loss": -28.05388832092285, "global_step": 638459, "epoch": 7692} {"train_loss": -28.10528564453125, "global_step": 638460, "epoch": 7692} {"train_loss": -28.484180450439453, "global_step": 638461, "epoch": 7692} {"train_loss": -28.155532836914062, "global_step": 638462, "epoch": 7692} {"train_loss": -28.477924346923828, "global_step": 638463, "epoch": 7692} {"train_loss": -28.445037841796875, "global_step": 638464, "epoch": 7692} {"train_loss": -28.060407638549805, "global_step": 638465, "epoch": 7692} {"train_loss": -28.59455680847168, "global_step": 638466, "epoch": 7692} {"train_loss": -28.203155517578125, "global_step": 638467, "epoch": 7692} {"train_loss": -28.536376953125, "global_step": 638468, "epoch": 7692} {"train_loss": -28.5614013671875, "global_step": 638469, "epoch": 7692} {"train_loss": -28.514257431030273, "global_step": 638470, "epoch": 7692} {"train_loss": -28.38583755493164, "global_step": 638471, "epoch": 7692} {"train_loss": -28.286651611328125, "global_step": 638472, "epoch": 7692} {"train_loss": -28.18375587463379, "global_step": 638473, "epoch": 7692} {"train_loss": -28.204736709594727, "global_step": 638474, "epoch": 7692} {"train_loss": -28.101154327392578, "global_step": 638475, "epoch": 7692} {"train_loss": -28.602375030517578, "global_step": 638476, "epoch": 7692} {"train_loss": -28.51651382446289, "global_step": 638477, "epoch": 7692} {"train_loss": -28.445178985595703, "global_step": 638478, "epoch": 7692} {"train_loss": -28.486896514892578, "global_step": 638479, "epoch": 7692} {"train_loss": -28.2941837310791, "global_step": 638480, "epoch": 7692} {"train_loss": -28.3299560546875, "global_step": 638481, "epoch": 7692} {"train_loss": -28.315006256103516, "global_step": 638482, "epoch": 7692} {"train_loss": -28.1498966217041, "global_step": 638483, "epoch": 7692} {"train_loss": -28.32525062561035, "global_step": 638484, "epoch": 7692} {"train_loss": -27.766401290893555, "global_step": 638485, "epoch": 7692} {"train_loss": -28.781827926635742, "global_step": 638486, "epoch": 7692} {"train_loss": -28.612506866455078, "global_step": 638487, "epoch": 7692} {"train_loss": -28.613025665283203, "global_step": 638488, "epoch": 7692} {"train_loss": -28.013029098510742, "global_step": 638489, "epoch": 7692} {"train_loss": -28.329620361328125, "global_step": 638490, "epoch": 7692} {"train_loss": -28.64759635925293, "global_step": 638491, "epoch": 7692} {"train_loss": -28.38587760925293, "global_step": 638492, "epoch": 7692} {"train_loss": -28.526660919189453, "global_step": 638493, "epoch": 7692} {"train_loss": -27.787137985229492, "global_step": 638494, "epoch": 7692} {"train_loss": -27.5048770904541, "global_step": 638495, "epoch": 7692} {"train_loss": -27.634687423706055, "global_step": 638496, "epoch": 7692} {"train_loss": -27.33966636657715, "global_step": 638497, "epoch": 7692} {"train_loss": -27.614492416381836, "global_step": 638498, "epoch": 7692} {"train_loss": -27.97584342956543, "global_step": 638499, "epoch": 7692} {"train_loss": -27.918668746948242, "global_step": 638500, "epoch": 7692} {"train_loss": -27.731369018554688, "global_step": 638501, "epoch": 7692} {"train_loss": -28.2280216217041, "global_step": 638502, "epoch": 7692} {"train_loss": -28.01869010925293, "global_step": 638503, "epoch": 7692} {"train_loss": -28.230091094970703, "global_step": 638504, "epoch": 7692} {"train_loss": -28.26043128967285, "global_step": 638505, "epoch": 7692} {"train_loss": -28.146329879760742, "global_step": 638506, "epoch": 7692} {"train_loss": -28.208454132080078, "global_step": 638507, "epoch": 7692} {"train_loss": -28.557022094726562, "global_step": 638508, "epoch": 7692} {"train_loss": -28.05071449279785, "global_step": 638509, "epoch": 7692} {"train_loss": -27.767133712768555, "global_step": 638510, "epoch": 7692} {"train_loss": -28.338647842407227, "global_step": 638511, "epoch": 7692} {"train_loss": -28.033432006835938, "global_step": 638512, "epoch": 7692} {"train_loss": -28.485132217407227, "global_step": 638513, "epoch": 7692} {"train_loss": -28.201190948486328, "global_step": 638514, "epoch": 7692} {"train_loss": -28.381183624267578, "global_step": 638515, "epoch": 7692} {"train_loss": -28.482105255126953, "global_step": 638516, "epoch": 7692} {"train_loss": -28.066991806030273, "global_step": 638517, "epoch": 7692} {"train_loss": -28.1207888729601, "global_step": 638518, "epoch": 7692, "val_loss": 6719580.5} {"train_loss": -27.541730880737305, "global_step": 638519, "epoch": 7693} {"train_loss": -28.07387351989746, "global_step": 638520, "epoch": 7693} {"train_loss": -27.46455192565918, "global_step": 638521, "epoch": 7693} {"train_loss": -27.586746215820312, "global_step": 638522, "epoch": 7693} {"train_loss": -27.55250358581543, "global_step": 638523, "epoch": 7693} {"train_loss": -27.50006103515625, "global_step": 638524, "epoch": 7693} {"train_loss": -28.003238677978516, "global_step": 638525, "epoch": 7693} {"train_loss": -27.925058364868164, "global_step": 638526, "epoch": 7693} {"train_loss": -27.912580490112305, "global_step": 638527, "epoch": 7693} {"train_loss": -27.917346954345703, "global_step": 638528, "epoch": 7693} {"train_loss": -28.140750885009766, "global_step": 638529, "epoch": 7693} {"train_loss": -28.29778480529785, "global_step": 638530, "epoch": 7693} {"train_loss": -28.187021255493164, "global_step": 638531, "epoch": 7693} {"train_loss": -28.238880157470703, "global_step": 638532, "epoch": 7693} {"train_loss": -28.351377487182617, "global_step": 638533, "epoch": 7693} {"train_loss": -28.160181045532227, "global_step": 638534, "epoch": 7693} {"train_loss": -28.601764678955078, "global_step": 638535, "epoch": 7693} {"train_loss": -28.007299423217773, "global_step": 638536, "epoch": 7693} {"train_loss": -28.379846572875977, "global_step": 638537, "epoch": 7693} {"train_loss": -28.022506713867188, "global_step": 638538, "epoch": 7693} {"train_loss": -28.032995223999023, "global_step": 638539, "epoch": 7693} {"train_loss": -28.178476333618164, "global_step": 638540, "epoch": 7693} {"train_loss": -28.108274459838867, "global_step": 638541, "epoch": 7693} {"train_loss": -28.51357078552246, "global_step": 638542, "epoch": 7693} {"train_loss": -28.025287628173828, "global_step": 638543, "epoch": 7693} {"train_loss": -28.452167510986328, "global_step": 638544, "epoch": 7693} {"train_loss": -28.066070556640625, "global_step": 638545, "epoch": 7693} {"train_loss": -28.203535079956055, "global_step": 638546, "epoch": 7693} {"train_loss": -28.501972198486328, "global_step": 638547, "epoch": 7693} {"train_loss": -28.23257827758789, "global_step": 638548, "epoch": 7693} {"train_loss": -28.598194122314453, "global_step": 638549, "epoch": 7693} {"train_loss": -28.0362491607666, "global_step": 638550, "epoch": 7693} {"train_loss": -28.38006019592285, "global_step": 638551, "epoch": 7693} {"train_loss": -28.125608444213867, "global_step": 638552, "epoch": 7693} {"train_loss": -28.392297744750977, "global_step": 638553, "epoch": 7693} {"train_loss": -28.233783721923828, "global_step": 638554, "epoch": 7693} {"train_loss": -28.614736557006836, "global_step": 638555, "epoch": 7693} {"train_loss": -28.34494972229004, "global_step": 638556, "epoch": 7693} {"train_loss": -28.50764274597168, "global_step": 638557, "epoch": 7693} {"train_loss": -28.20416831970215, "global_step": 638558, "epoch": 7693} {"train_loss": -28.05865478515625, "global_step": 638559, "epoch": 7693} {"train_loss": -28.294076919555664, "global_step": 638560, "epoch": 7693} {"train_loss": -28.015655517578125, "global_step": 638561, "epoch": 7693} {"train_loss": -28.182703018188477, "global_step": 638562, "epoch": 7693} {"train_loss": -28.170063018798828, "global_step": 638563, "epoch": 7693} {"train_loss": -28.177459716796875, "global_step": 638564, "epoch": 7693} {"train_loss": -28.248071670532227, "global_step": 638565, "epoch": 7693} {"train_loss": -28.5734806060791, "global_step": 638566, "epoch": 7693} {"train_loss": -28.27960777282715, "global_step": 638567, "epoch": 7693} {"train_loss": -28.335758209228516, "global_step": 638568, "epoch": 7693} {"train_loss": -28.405166625976562, "global_step": 638569, "epoch": 7693} {"train_loss": -28.457977294921875, "global_step": 638570, "epoch": 7693} {"train_loss": -28.509613037109375, "global_step": 638571, "epoch": 7693} {"train_loss": -28.4300594329834, "global_step": 638572, "epoch": 7693} {"train_loss": -28.237939834594727, "global_step": 638573, "epoch": 7693} {"train_loss": -28.718631744384766, "global_step": 638574, "epoch": 7693} {"train_loss": -28.420019149780273, "global_step": 638575, "epoch": 7693} {"train_loss": -28.12164878845215, "global_step": 638576, "epoch": 7693} {"train_loss": -28.0707950592041, "global_step": 638577, "epoch": 7693} {"train_loss": -28.06975746154785, "global_step": 638578, "epoch": 7693} {"train_loss": -28.445703506469727, "global_step": 638579, "epoch": 7693} {"train_loss": -28.14912986755371, "global_step": 638580, "epoch": 7693} {"train_loss": -28.625564575195312, "global_step": 638581, "epoch": 7693} {"train_loss": -28.052967071533203, "global_step": 638582, "epoch": 7693} {"train_loss": -28.219358444213867, "global_step": 638583, "epoch": 7693} {"train_loss": -28.45779800415039, "global_step": 638584, "epoch": 7693} {"train_loss": -28.2471923828125, "global_step": 638585, "epoch": 7693} {"train_loss": -28.394941329956055, "global_step": 638586, "epoch": 7693} {"train_loss": -28.244403839111328, "global_step": 638587, "epoch": 7693} {"train_loss": -28.603652954101562, "global_step": 638588, "epoch": 7693} {"train_loss": -28.09284019470215, "global_step": 638589, "epoch": 7693} {"train_loss": -28.769758224487305, "global_step": 638590, "epoch": 7693} {"train_loss": -28.09693717956543, "global_step": 638591, "epoch": 7693} {"train_loss": -28.258161544799805, "global_step": 638592, "epoch": 7693} {"train_loss": -27.73027992248535, "global_step": 638593, "epoch": 7693} {"train_loss": -27.787506103515625, "global_step": 638594, "epoch": 7693} {"train_loss": -27.0693302154541, "global_step": 638595, "epoch": 7693} {"train_loss": -27.272016525268555, "global_step": 638596, "epoch": 7693} {"train_loss": -27.729352951049805, "global_step": 638597, "epoch": 7693} {"train_loss": -27.891376495361328, "global_step": 638598, "epoch": 7693} {"train_loss": -28.260663986206055, "global_step": 638599, "epoch": 7693} {"train_loss": -28.156476974487305, "global_step": 638600, "epoch": 7693} {"train_loss": -28.16783996949713, "global_step": 638601, "epoch": 7693, "val_loss": 6732499.0} {"train_loss": -28.140445709228516, "global_step": 638602, "epoch": 7694} {"train_loss": -27.056894302368164, "global_step": 638603, "epoch": 7694} {"train_loss": -27.5601806640625, "global_step": 638604, "epoch": 7694} {"train_loss": -27.07552146911621, "global_step": 638605, "epoch": 7694} {"train_loss": -27.399890899658203, "global_step": 638606, "epoch": 7694} {"train_loss": -27.57436180114746, "global_step": 638607, "epoch": 7694} {"train_loss": -27.664199829101562, "global_step": 638608, "epoch": 7694} {"train_loss": -27.604963302612305, "global_step": 638609, "epoch": 7694} {"train_loss": -27.944189071655273, "global_step": 638610, "epoch": 7694} {"train_loss": -27.6984806060791, "global_step": 638611, "epoch": 7694} {"train_loss": -27.75895118713379, "global_step": 638612, "epoch": 7694} {"train_loss": -28.279438018798828, "global_step": 638613, "epoch": 7694} {"train_loss": -27.830102920532227, "global_step": 638614, "epoch": 7694} {"train_loss": -27.88104820251465, "global_step": 638615, "epoch": 7694} {"train_loss": -27.807722091674805, "global_step": 638616, "epoch": 7694} {"train_loss": -27.799543380737305, "global_step": 638617, "epoch": 7694} {"train_loss": -27.82002830505371, "global_step": 638618, "epoch": 7694} {"train_loss": -27.764554977416992, "global_step": 638619, "epoch": 7694} {"train_loss": -27.54257583618164, "global_step": 638620, "epoch": 7694} {"train_loss": -27.980783462524414, "global_step": 638621, "epoch": 7694} {"train_loss": -27.5660400390625, "global_step": 638622, "epoch": 7694} {"train_loss": -27.68561363220215, "global_step": 638623, "epoch": 7694} {"train_loss": -27.893644332885742, "global_step": 638624, "epoch": 7694} {"train_loss": -27.892364501953125, "global_step": 638625, "epoch": 7694} {"train_loss": -27.614896774291992, "global_step": 638626, "epoch": 7694} {"train_loss": -27.821359634399414, "global_step": 638627, "epoch": 7694} {"train_loss": -27.988574981689453, "global_step": 638628, "epoch": 7694} {"train_loss": -27.60700035095215, "global_step": 638629, "epoch": 7694} {"train_loss": -27.568206787109375, "global_step": 638630, "epoch": 7694} {"train_loss": -27.624608993530273, "global_step": 638631, "epoch": 7694} {"train_loss": -27.952253341674805, "global_step": 638632, "epoch": 7694} {"train_loss": -28.139530181884766, "global_step": 638633, "epoch": 7694} {"train_loss": -28.162809371948242, "global_step": 638634, "epoch": 7694} {"train_loss": -28.6103572845459, "global_step": 638635, "epoch": 7694} {"train_loss": -28.243566513061523, "global_step": 638636, "epoch": 7694} {"train_loss": -28.35636329650879, "global_step": 638637, "epoch": 7694} {"train_loss": -28.391742706298828, "global_step": 638638, "epoch": 7694} {"train_loss": -28.76080894470215, "global_step": 638639, "epoch": 7694} {"train_loss": -28.374862670898438, "global_step": 638640, "epoch": 7694} {"train_loss": -28.44923210144043, "global_step": 638641, "epoch": 7694} {"train_loss": -28.3869571685791, "global_step": 638642, "epoch": 7694} {"train_loss": -28.553918838500977, "global_step": 638643, "epoch": 7694} {"train_loss": -28.147357940673828, "global_step": 638644, "epoch": 7694} {"train_loss": -28.395023345947266, "global_step": 638645, "epoch": 7694} {"train_loss": -28.356443405151367, "global_step": 638646, "epoch": 7694} {"train_loss": -28.499990463256836, "global_step": 638647, "epoch": 7694} {"train_loss": -28.151477813720703, "global_step": 638648, "epoch": 7694} {"train_loss": -28.14716911315918, "global_step": 638649, "epoch": 7694} {"train_loss": -28.414392471313477, "global_step": 638650, "epoch": 7694} {"train_loss": -28.419347763061523, "global_step": 638651, "epoch": 7694} {"train_loss": -28.003934860229492, "global_step": 638652, "epoch": 7694} {"train_loss": -28.23356056213379, "global_step": 638653, "epoch": 7694} {"train_loss": -28.521533966064453, "global_step": 638654, "epoch": 7694} {"train_loss": -28.1212158203125, "global_step": 638655, "epoch": 7694} {"train_loss": -28.405349731445312, "global_step": 638656, "epoch": 7694} {"train_loss": -28.366790771484375, "global_step": 638657, "epoch": 7694} {"train_loss": -28.113630294799805, "global_step": 638658, "epoch": 7694} {"train_loss": -28.26582145690918, "global_step": 638659, "epoch": 7694} {"train_loss": -28.36419105529785, "global_step": 638660, "epoch": 7694} {"train_loss": -28.389272689819336, "global_step": 638661, "epoch": 7694} {"train_loss": -28.425928115844727, "global_step": 638662, "epoch": 7694} {"train_loss": -28.342620849609375, "global_step": 638663, "epoch": 7694} {"train_loss": -28.442401885986328, "global_step": 638664, "epoch": 7694} {"train_loss": -28.61871910095215, "global_step": 638665, "epoch": 7694} {"train_loss": -28.4049129486084, "global_step": 638666, "epoch": 7694} {"train_loss": -28.440338134765625, "global_step": 638667, "epoch": 7694} {"train_loss": -28.130508422851562, "global_step": 638668, "epoch": 7694} {"train_loss": -28.330602645874023, "global_step": 638669, "epoch": 7694} {"train_loss": -28.639646530151367, "global_step": 638670, "epoch": 7694} {"train_loss": -28.173328399658203, "global_step": 638671, "epoch": 7694} {"train_loss": -27.755762100219727, "global_step": 638672, "epoch": 7694} {"train_loss": -28.105030059814453, "global_step": 638673, "epoch": 7694} {"train_loss": -28.106611251831055, "global_step": 638674, "epoch": 7694} {"train_loss": -28.61918067932129, "global_step": 638675, "epoch": 7694} {"train_loss": -28.353591918945312, "global_step": 638676, "epoch": 7694} {"train_loss": -27.967004776000977, "global_step": 638677, "epoch": 7694} {"train_loss": -27.923200607299805, "global_step": 638678, "epoch": 7694} {"train_loss": -28.147003173828125, "global_step": 638679, "epoch": 7694} {"train_loss": -28.483312606811523, "global_step": 638680, "epoch": 7694} {"train_loss": -28.247404098510742, "global_step": 638681, "epoch": 7694} {"train_loss": -28.036230087280273, "global_step": 638682, "epoch": 7694} {"train_loss": -28.388166427612305, "global_step": 638683, "epoch": 7694} {"train_loss": -28.073985731745342, "global_step": 638684, "epoch": 7694, "val_loss": 6698299.0} {"train_loss": -28.137744903564453, "global_step": 638685, "epoch": 7695} {"train_loss": -27.581012725830078, "global_step": 638686, "epoch": 7695} {"train_loss": -27.529123306274414, "global_step": 638687, "epoch": 7695} {"train_loss": -27.299306869506836, "global_step": 638688, "epoch": 7695} {"train_loss": -27.651153564453125, "global_step": 638689, "epoch": 7695} {"train_loss": -27.542922973632812, "global_step": 638690, "epoch": 7695} {"train_loss": -27.391347885131836, "global_step": 638691, "epoch": 7695} {"train_loss": -27.475360870361328, "global_step": 638692, "epoch": 7695} {"train_loss": -27.36041831970215, "global_step": 638693, "epoch": 7695} {"train_loss": -27.519987106323242, "global_step": 638694, "epoch": 7695} {"train_loss": -27.661701202392578, "global_step": 638695, "epoch": 7695} {"train_loss": -28.020557403564453, "global_step": 638696, "epoch": 7695} {"train_loss": -27.502796173095703, "global_step": 638697, "epoch": 7695} {"train_loss": -27.19903564453125, "global_step": 638698, "epoch": 7695} {"train_loss": -27.471343994140625, "global_step": 638699, "epoch": 7695} {"train_loss": -27.600757598876953, "global_step": 638700, "epoch": 7695} {"train_loss": -27.811359405517578, "global_step": 638701, "epoch": 7695} {"train_loss": -27.648609161376953, "global_step": 638702, "epoch": 7695} {"train_loss": -27.85896110534668, "global_step": 638703, "epoch": 7695} {"train_loss": -27.9322566986084, "global_step": 638704, "epoch": 7695} {"train_loss": -27.73663902282715, "global_step": 638705, "epoch": 7695} {"train_loss": -28.121204376220703, "global_step": 638706, "epoch": 7695} {"train_loss": -27.723419189453125, "global_step": 638707, "epoch": 7695} {"train_loss": -28.4196720123291, "global_step": 638708, "epoch": 7695} {"train_loss": -27.910058975219727, "global_step": 638709, "epoch": 7695} {"train_loss": -28.34893226623535, "global_step": 638710, "epoch": 7695} {"train_loss": -28.1554012298584, "global_step": 638711, "epoch": 7695} {"train_loss": -28.367700576782227, "global_step": 638712, "epoch": 7695} {"train_loss": -28.301483154296875, "global_step": 638713, "epoch": 7695} {"train_loss": -28.09002113342285, "global_step": 638714, "epoch": 7695} {"train_loss": -28.39507484436035, "global_step": 638715, "epoch": 7695} {"train_loss": -28.55499839782715, "global_step": 638716, "epoch": 7695} {"train_loss": -28.287633895874023, "global_step": 638717, "epoch": 7695} {"train_loss": -28.4627628326416, "global_step": 638718, "epoch": 7695} {"train_loss": -28.033842086791992, "global_step": 638719, "epoch": 7695} {"train_loss": -28.5184383392334, "global_step": 638720, "epoch": 7695} {"train_loss": -28.3697566986084, "global_step": 638721, "epoch": 7695} {"train_loss": -28.333322525024414, "global_step": 638722, "epoch": 7695} {"train_loss": -28.1646671295166, "global_step": 638723, "epoch": 7695} {"train_loss": -28.61153221130371, "global_step": 638724, "epoch": 7695} {"train_loss": -28.092243194580078, "global_step": 638725, "epoch": 7695} {"train_loss": -28.469900131225586, "global_step": 638726, "epoch": 7695} {"train_loss": -28.352331161499023, "global_step": 638727, "epoch": 7695} {"train_loss": -28.185781478881836, "global_step": 638728, "epoch": 7695} {"train_loss": -28.61492347717285, "global_step": 638729, "epoch": 7695} {"train_loss": -28.2948055267334, "global_step": 638730, "epoch": 7695} {"train_loss": -28.65327262878418, "global_step": 638731, "epoch": 7695} {"train_loss": -28.453033447265625, "global_step": 638732, "epoch": 7695} {"train_loss": -28.331756591796875, "global_step": 638733, "epoch": 7695} {"train_loss": -28.321386337280273, "global_step": 638734, "epoch": 7695} {"train_loss": -28.606306076049805, "global_step": 638735, "epoch": 7695} {"train_loss": -28.250635147094727, "global_step": 638736, "epoch": 7695} {"train_loss": -28.42767333984375, "global_step": 638737, "epoch": 7695} {"train_loss": -28.397918701171875, "global_step": 638738, "epoch": 7695} {"train_loss": -28.416461944580078, "global_step": 638739, "epoch": 7695} {"train_loss": -28.264657974243164, "global_step": 638740, "epoch": 7695} {"train_loss": -28.54562759399414, "global_step": 638741, "epoch": 7695} {"train_loss": -28.594079971313477, "global_step": 638742, "epoch": 7695} {"train_loss": -28.696786880493164, "global_step": 638743, "epoch": 7695} {"train_loss": -28.17386817932129, "global_step": 638744, "epoch": 7695} {"train_loss": -28.46875, "global_step": 638745, "epoch": 7695} {"train_loss": -28.020421981811523, "global_step": 638746, "epoch": 7695} {"train_loss": -28.73333168029785, "global_step": 638747, "epoch": 7695} {"train_loss": -28.434438705444336, "global_step": 638748, "epoch": 7695} {"train_loss": -28.405841827392578, "global_step": 638749, "epoch": 7695} {"train_loss": -28.19475746154785, "global_step": 638750, "epoch": 7695} {"train_loss": -28.291223526000977, "global_step": 638751, "epoch": 7695} {"train_loss": -28.33731460571289, "global_step": 638752, "epoch": 7695} {"train_loss": -28.37965965270996, "global_step": 638753, "epoch": 7695} {"train_loss": -28.306562423706055, "global_step": 638754, "epoch": 7695} {"train_loss": -28.836698532104492, "global_step": 638755, "epoch": 7695} {"train_loss": -28.577884674072266, "global_step": 638756, "epoch": 7695} {"train_loss": -28.48836326599121, "global_step": 638757, "epoch": 7695} {"train_loss": -28.266986846923828, "global_step": 638758, "epoch": 7695} {"train_loss": -27.825119018554688, "global_step": 638759, "epoch": 7695} {"train_loss": -28.122451782226562, "global_step": 638760, "epoch": 7695} {"train_loss": -28.1497802734375, "global_step": 638761, "epoch": 7695} {"train_loss": -27.730609893798828, "global_step": 638762, "epoch": 7695} {"train_loss": -26.671606063842773, "global_step": 638763, "epoch": 7695} {"train_loss": -26.397357940673828, "global_step": 638764, "epoch": 7695} {"train_loss": -27.36579704284668, "global_step": 638765, "epoch": 7695} {"train_loss": -27.84901237487793, "global_step": 638766, "epoch": 7695} {"train_loss": -28.08625873887395, "global_step": 638767, "epoch": 7695, "val_loss": 6694630.0} {"train_loss": -27.320119857788086, "global_step": 638768, "epoch": 7696} {"train_loss": -26.050596237182617, "global_step": 638769, "epoch": 7696} {"train_loss": -27.316553115844727, "global_step": 638770, "epoch": 7696} {"train_loss": -26.874387741088867, "global_step": 638771, "epoch": 7696} {"train_loss": -26.573522567749023, "global_step": 638772, "epoch": 7696} {"train_loss": -27.848190307617188, "global_step": 638773, "epoch": 7696} {"train_loss": -26.7078800201416, "global_step": 638774, "epoch": 7696} {"train_loss": -27.563373565673828, "global_step": 638775, "epoch": 7696} {"train_loss": -27.099653244018555, "global_step": 638776, "epoch": 7696} {"train_loss": -28.076385498046875, "global_step": 638777, "epoch": 7696} {"train_loss": -27.660999298095703, "global_step": 638778, "epoch": 7696} {"train_loss": -27.791685104370117, "global_step": 638779, "epoch": 7696} {"train_loss": -27.595422744750977, "global_step": 638780, "epoch": 7696} {"train_loss": -27.508947372436523, "global_step": 638781, "epoch": 7696} {"train_loss": -27.587787628173828, "global_step": 638782, "epoch": 7696} {"train_loss": -27.720977783203125, "global_step": 638783, "epoch": 7696} {"train_loss": -27.606369018554688, "global_step": 638784, "epoch": 7696} {"train_loss": -27.9365177154541, "global_step": 638785, "epoch": 7696} {"train_loss": -28.04231071472168, "global_step": 638786, "epoch": 7696} {"train_loss": -28.29347801208496, "global_step": 638787, "epoch": 7696} {"train_loss": -27.84132957458496, "global_step": 638788, "epoch": 7696} {"train_loss": -27.78523063659668, "global_step": 638789, "epoch": 7696} {"train_loss": -27.98858070373535, "global_step": 638790, "epoch": 7696} {"train_loss": -27.644128799438477, "global_step": 638791, "epoch": 7696} {"train_loss": -28.157550811767578, "global_step": 638792, "epoch": 7696} {"train_loss": -27.985523223876953, "global_step": 638793, "epoch": 7696} {"train_loss": -27.923505783081055, "global_step": 638794, "epoch": 7696} {"train_loss": -28.131322860717773, "global_step": 638795, "epoch": 7696} {"train_loss": -27.88962173461914, "global_step": 638796, "epoch": 7696} {"train_loss": -28.148542404174805, "global_step": 638797, "epoch": 7696} {"train_loss": -27.6306209564209, "global_step": 638798, "epoch": 7696} {"train_loss": -28.2332706451416, "global_step": 638799, "epoch": 7696} {"train_loss": -28.468372344970703, "global_step": 638800, "epoch": 7696} {"train_loss": -28.14554786682129, "global_step": 638801, "epoch": 7696} {"train_loss": -28.000747680664062, "global_step": 638802, "epoch": 7696} {"train_loss": -28.202411651611328, "global_step": 638803, "epoch": 7696} {"train_loss": -28.3189754486084, "global_step": 638804, "epoch": 7696} {"train_loss": -28.614221572875977, "global_step": 638805, "epoch": 7696} {"train_loss": -28.093738555908203, "global_step": 638806, "epoch": 7696} {"train_loss": -28.43764305114746, "global_step": 638807, "epoch": 7696} {"train_loss": -28.376867294311523, "global_step": 638808, "epoch": 7696} {"train_loss": -28.218286514282227, "global_step": 638809, "epoch": 7696} {"train_loss": -28.6080379486084, "global_step": 638810, "epoch": 7696} {"train_loss": -28.05459976196289, "global_step": 638811, "epoch": 7696} {"train_loss": -28.206653594970703, "global_step": 638812, "epoch": 7696} {"train_loss": -28.092870712280273, "global_step": 638813, "epoch": 7696} {"train_loss": -28.327930450439453, "global_step": 638814, "epoch": 7696} {"train_loss": -28.1905460357666, "global_step": 638815, "epoch": 7696} {"train_loss": -27.89059829711914, "global_step": 638816, "epoch": 7696} {"train_loss": -28.468128204345703, "global_step": 638817, "epoch": 7696} {"train_loss": -28.30130386352539, "global_step": 638818, "epoch": 7696} {"train_loss": -28.283050537109375, "global_step": 638819, "epoch": 7696} {"train_loss": -28.3084659576416, "global_step": 638820, "epoch": 7696} {"train_loss": -28.19538688659668, "global_step": 638821, "epoch": 7696} {"train_loss": -28.153640747070312, "global_step": 638822, "epoch": 7696} {"train_loss": -28.209951400756836, "global_step": 638823, "epoch": 7696} {"train_loss": -28.13469886779785, "global_step": 638824, "epoch": 7696} {"train_loss": -28.09761619567871, "global_step": 638825, "epoch": 7696} {"train_loss": -28.110498428344727, "global_step": 638826, "epoch": 7696} {"train_loss": -28.602466583251953, "global_step": 638827, "epoch": 7696} {"train_loss": -27.4217472076416, "global_step": 638828, "epoch": 7696} {"train_loss": -28.386579513549805, "global_step": 638829, "epoch": 7696} {"train_loss": -27.42461585998535, "global_step": 638830, "epoch": 7696} {"train_loss": -27.715930938720703, "global_step": 638831, "epoch": 7696} {"train_loss": -28.177310943603516, "global_step": 638832, "epoch": 7696} {"train_loss": -27.789901733398438, "global_step": 638833, "epoch": 7696} {"train_loss": -27.978805541992188, "global_step": 638834, "epoch": 7696} {"train_loss": -28.08054542541504, "global_step": 638835, "epoch": 7696} {"train_loss": -28.082294464111328, "global_step": 638836, "epoch": 7696} {"train_loss": -28.39676856994629, "global_step": 638837, "epoch": 7696} {"train_loss": -28.085519790649414, "global_step": 638838, "epoch": 7696} {"train_loss": -28.19070816040039, "global_step": 638839, "epoch": 7696} {"train_loss": -28.219348907470703, "global_step": 638840, "epoch": 7696} {"train_loss": -28.326826095581055, "global_step": 638841, "epoch": 7696} {"train_loss": -27.938465118408203, "global_step": 638842, "epoch": 7696} {"train_loss": -28.483905792236328, "global_step": 638843, "epoch": 7696} {"train_loss": -27.98514175415039, "global_step": 638844, "epoch": 7696} {"train_loss": -27.738006591796875, "global_step": 638845, "epoch": 7696} {"train_loss": -27.723438262939453, "global_step": 638846, "epoch": 7696} {"train_loss": -27.645370483398438, "global_step": 638847, "epoch": 7696} {"train_loss": -27.745447158813477, "global_step": 638848, "epoch": 7696} {"train_loss": -28.056821823120117, "global_step": 638849, "epoch": 7696} {"train_loss": -27.949544952576417, "global_step": 638850, "epoch": 7696, "val_loss": 6653562.0} {"train_loss": -28.24114418029785, "global_step": 638851, "epoch": 7697} {"train_loss": -27.61740493774414, "global_step": 638852, "epoch": 7697} {"train_loss": -27.815937042236328, "global_step": 638853, "epoch": 7697} {"train_loss": -28.2618408203125, "global_step": 638854, "epoch": 7697} {"train_loss": -27.871641159057617, "global_step": 638855, "epoch": 7697} {"train_loss": -27.90302085876465, "global_step": 638856, "epoch": 7697} {"train_loss": -27.855417251586914, "global_step": 638857, "epoch": 7697} {"train_loss": -27.950519561767578, "global_step": 638858, "epoch": 7697} {"train_loss": -28.03315544128418, "global_step": 638859, "epoch": 7697} {"train_loss": -28.054214477539062, "global_step": 638860, "epoch": 7697} {"train_loss": -28.253101348876953, "global_step": 638861, "epoch": 7697} {"train_loss": -28.093137741088867, "global_step": 638862, "epoch": 7697} {"train_loss": -27.89166259765625, "global_step": 638863, "epoch": 7697} {"train_loss": -27.883941650390625, "global_step": 638864, "epoch": 7697} {"train_loss": -28.464502334594727, "global_step": 638865, "epoch": 7697} {"train_loss": -28.110090255737305, "global_step": 638866, "epoch": 7697} {"train_loss": -28.126676559448242, "global_step": 638867, "epoch": 7697} {"train_loss": -28.011194229125977, "global_step": 638868, "epoch": 7697} {"train_loss": -28.321828842163086, "global_step": 638869, "epoch": 7697} {"train_loss": -28.426599502563477, "global_step": 638870, "epoch": 7697} {"train_loss": -28.3536319732666, "global_step": 638871, "epoch": 7697} {"train_loss": -27.868621826171875, "global_step": 638872, "epoch": 7697} {"train_loss": -27.653852462768555, "global_step": 638873, "epoch": 7697} {"train_loss": -28.521442413330078, "global_step": 638874, "epoch": 7697} {"train_loss": -28.156137466430664, "global_step": 638875, "epoch": 7697} {"train_loss": -28.244516372680664, "global_step": 638876, "epoch": 7697} {"train_loss": -27.880416870117188, "global_step": 638877, "epoch": 7697} {"train_loss": -28.023605346679688, "global_step": 638878, "epoch": 7697} {"train_loss": -28.134723663330078, "global_step": 638879, "epoch": 7697} {"train_loss": -28.080114364624023, "global_step": 638880, "epoch": 7697} {"train_loss": -28.29912757873535, "global_step": 638881, "epoch": 7697} {"train_loss": -28.44168472290039, "global_step": 638882, "epoch": 7697} {"train_loss": -28.168066024780273, "global_step": 638883, "epoch": 7697} {"train_loss": -28.221189498901367, "global_step": 638884, "epoch": 7697} {"train_loss": -28.181659698486328, "global_step": 638885, "epoch": 7697} {"train_loss": -28.08253288269043, "global_step": 638886, "epoch": 7697} {"train_loss": -27.87957763671875, "global_step": 638887, "epoch": 7697} {"train_loss": -28.269941329956055, "global_step": 638888, "epoch": 7697} {"train_loss": -28.624237060546875, "global_step": 638889, "epoch": 7697} {"train_loss": -28.30076026916504, "global_step": 638890, "epoch": 7697} {"train_loss": -28.356464385986328, "global_step": 638891, "epoch": 7697} {"train_loss": -28.010482788085938, "global_step": 638892, "epoch": 7697} {"train_loss": -28.485273361206055, "global_step": 638893, "epoch": 7697} {"train_loss": -28.290307998657227, "global_step": 638894, "epoch": 7697} {"train_loss": -28.125410079956055, "global_step": 638895, "epoch": 7697} {"train_loss": -28.4345703125, "global_step": 638896, "epoch": 7697} {"train_loss": -28.293943405151367, "global_step": 638897, "epoch": 7697} {"train_loss": -28.544843673706055, "global_step": 638898, "epoch": 7697} {"train_loss": -28.549367904663086, "global_step": 638899, "epoch": 7697} {"train_loss": -28.472320556640625, "global_step": 638900, "epoch": 7697} {"train_loss": -28.50789451599121, "global_step": 638901, "epoch": 7697} {"train_loss": -28.248117446899414, "global_step": 638902, "epoch": 7697} {"train_loss": -28.61587905883789, "global_step": 638903, "epoch": 7697} {"train_loss": -28.338842391967773, "global_step": 638904, "epoch": 7697} {"train_loss": -28.689350128173828, "global_step": 638905, "epoch": 7697} {"train_loss": -28.638320922851562, "global_step": 638906, "epoch": 7697} {"train_loss": -28.74994468688965, "global_step": 638907, "epoch": 7697} {"train_loss": -28.30985450744629, "global_step": 638908, "epoch": 7697} {"train_loss": -28.642044067382812, "global_step": 638909, "epoch": 7697} {"train_loss": -28.53203773498535, "global_step": 638910, "epoch": 7697} {"train_loss": -28.634220123291016, "global_step": 638911, "epoch": 7697} {"train_loss": -28.36566734313965, "global_step": 638912, "epoch": 7697} {"train_loss": -28.17755699157715, "global_step": 638913, "epoch": 7697} {"train_loss": -27.97608757019043, "global_step": 638914, "epoch": 7697} {"train_loss": -27.96339225769043, "global_step": 638915, "epoch": 7697} {"train_loss": -28.5496883392334, "global_step": 638916, "epoch": 7697} {"train_loss": -27.7913761138916, "global_step": 638917, "epoch": 7697} {"train_loss": -28.162973403930664, "global_step": 638918, "epoch": 7697} {"train_loss": -28.5146427154541, "global_step": 638919, "epoch": 7697} {"train_loss": -28.214902877807617, "global_step": 638920, "epoch": 7697} {"train_loss": -28.477197647094727, "global_step": 638921, "epoch": 7697} {"train_loss": -28.75396728515625, "global_step": 638922, "epoch": 7697} {"train_loss": -28.4235897064209, "global_step": 638923, "epoch": 7697} {"train_loss": -28.303119659423828, "global_step": 638924, "epoch": 7697} {"train_loss": -28.3557071685791, "global_step": 638925, "epoch": 7697} {"train_loss": -28.491891860961914, "global_step": 638926, "epoch": 7697} {"train_loss": -28.291889190673828, "global_step": 638927, "epoch": 7697} {"train_loss": -27.8969669342041, "global_step": 638928, "epoch": 7697} {"train_loss": -27.9714298248291, "global_step": 638929, "epoch": 7697} {"train_loss": -27.513751983642578, "global_step": 638930, "epoch": 7697} {"train_loss": -27.091833114624023, "global_step": 638931, "epoch": 7697} {"train_loss": -26.235427856445312, "global_step": 638932, "epoch": 7697} {"train_loss": -28.183432843311724, "global_step": 638933, "epoch": 7697, "val_loss": 6658082.5} {"train_loss": -24.445392608642578, "global_step": 638934, "epoch": 7698} {"train_loss": -21.535449981689453, "global_step": 638935, "epoch": 7698} {"train_loss": -25.32835578918457, "global_step": 638936, "epoch": 7698} {"train_loss": -24.903377532958984, "global_step": 638937, "epoch": 7698} {"train_loss": -25.170883178710938, "global_step": 638938, "epoch": 7698} {"train_loss": -25.59809684753418, "global_step": 638939, "epoch": 7698} {"train_loss": -25.33173942565918, "global_step": 638940, "epoch": 7698} {"train_loss": -26.444171905517578, "global_step": 638941, "epoch": 7698} {"train_loss": -25.957895278930664, "global_step": 638942, "epoch": 7698} {"train_loss": -27.047290802001953, "global_step": 638943, "epoch": 7698} {"train_loss": -25.922901153564453, "global_step": 638944, "epoch": 7698} {"train_loss": -26.3723087310791, "global_step": 638945, "epoch": 7698} {"train_loss": -26.69166374206543, "global_step": 638946, "epoch": 7698} {"train_loss": -26.707523345947266, "global_step": 638947, "epoch": 7698} {"train_loss": -26.784818649291992, "global_step": 638948, "epoch": 7698} {"train_loss": -26.530065536499023, "global_step": 638949, "epoch": 7698} {"train_loss": -26.44161033630371, "global_step": 638950, "epoch": 7698} {"train_loss": -27.083791732788086, "global_step": 638951, "epoch": 7698} {"train_loss": -26.864521026611328, "global_step": 638952, "epoch": 7698} {"train_loss": -27.057138442993164, "global_step": 638953, "epoch": 7698} {"train_loss": -26.614383697509766, "global_step": 638954, "epoch": 7698} {"train_loss": -26.950952529907227, "global_step": 638955, "epoch": 7698} {"train_loss": -27.573688507080078, "global_step": 638956, "epoch": 7698} {"train_loss": -27.100025177001953, "global_step": 638957, "epoch": 7698} {"train_loss": -27.202077865600586, "global_step": 638958, "epoch": 7698} {"train_loss": -27.248029708862305, "global_step": 638959, "epoch": 7698} {"train_loss": -27.140533447265625, "global_step": 638960, "epoch": 7698} {"train_loss": -27.25489616394043, "global_step": 638961, "epoch": 7698} {"train_loss": -27.10357666015625, "global_step": 638962, "epoch": 7698} {"train_loss": -27.378814697265625, "global_step": 638963, "epoch": 7698} {"train_loss": -27.337112426757812, "global_step": 638964, "epoch": 7698} {"train_loss": -27.167804718017578, "global_step": 638965, "epoch": 7698} {"train_loss": -27.728559494018555, "global_step": 638966, "epoch": 7698} {"train_loss": -27.518310546875, "global_step": 638967, "epoch": 7698} {"train_loss": -27.2421932220459, "global_step": 638968, "epoch": 7698} {"train_loss": -27.664295196533203, "global_step": 638969, "epoch": 7698} {"train_loss": -27.60059928894043, "global_step": 638970, "epoch": 7698} {"train_loss": -27.682653427124023, "global_step": 638971, "epoch": 7698} {"train_loss": -27.573415756225586, "global_step": 638972, "epoch": 7698} {"train_loss": -27.762989044189453, "global_step": 638973, "epoch": 7698} {"train_loss": -27.814496994018555, "global_step": 638974, "epoch": 7698} {"train_loss": -27.91621971130371, "global_step": 638975, "epoch": 7698} {"train_loss": -28.13071060180664, "global_step": 638976, "epoch": 7698} {"train_loss": -27.660688400268555, "global_step": 638977, "epoch": 7698} {"train_loss": -28.022634506225586, "global_step": 638978, "epoch": 7698} {"train_loss": -27.934680938720703, "global_step": 638979, "epoch": 7698} {"train_loss": -28.467161178588867, "global_step": 638980, "epoch": 7698} {"train_loss": -28.016132354736328, "global_step": 638981, "epoch": 7698} {"train_loss": -27.776840209960938, "global_step": 638982, "epoch": 7698} {"train_loss": -28.213184356689453, "global_step": 638983, "epoch": 7698} {"train_loss": -28.24720573425293, "global_step": 638984, "epoch": 7698} {"train_loss": -28.223480224609375, "global_step": 638985, "epoch": 7698} {"train_loss": -28.534626007080078, "global_step": 638986, "epoch": 7698} {"train_loss": -28.045862197875977, "global_step": 638987, "epoch": 7698} {"train_loss": -27.936553955078125, "global_step": 638988, "epoch": 7698} {"train_loss": -28.207386016845703, "global_step": 638989, "epoch": 7698} {"train_loss": -28.093124389648438, "global_step": 638990, "epoch": 7698} {"train_loss": -27.971399307250977, "global_step": 638991, "epoch": 7698} {"train_loss": -28.546796798706055, "global_step": 638992, "epoch": 7698} {"train_loss": -28.1578311920166, "global_step": 638993, "epoch": 7698} {"train_loss": -28.0209903717041, "global_step": 638994, "epoch": 7698} {"train_loss": -27.840829849243164, "global_step": 638995, "epoch": 7698} {"train_loss": -27.681350708007812, "global_step": 638996, "epoch": 7698} {"train_loss": -27.969022750854492, "global_step": 638997, "epoch": 7698} {"train_loss": -28.488998413085938, "global_step": 638998, "epoch": 7698} {"train_loss": -27.8719425201416, "global_step": 638999, "epoch": 7698} {"train_loss": -28.417404174804688, "global_step": 639000, "epoch": 7698} {"train_loss": -27.963226318359375, "global_step": 639001, "epoch": 7698} {"train_loss": -27.644834518432617, "global_step": 639002, "epoch": 7698} {"train_loss": -28.156299591064453, "global_step": 639003, "epoch": 7698} {"train_loss": -27.917938232421875, "global_step": 639004, "epoch": 7698} {"train_loss": -28.169294357299805, "global_step": 639005, "epoch": 7698} {"train_loss": -28.24796485900879, "global_step": 639006, "epoch": 7698} {"train_loss": -28.119054794311523, "global_step": 639007, "epoch": 7698} {"train_loss": -27.898168563842773, "global_step": 639008, "epoch": 7698} {"train_loss": -27.859060287475586, "global_step": 639009, "epoch": 7698} {"train_loss": -28.150190353393555, "global_step": 639010, "epoch": 7698} {"train_loss": -28.167444229125977, "global_step": 639011, "epoch": 7698} {"train_loss": -28.2456111907959, "global_step": 639012, "epoch": 7698} {"train_loss": -28.16596031188965, "global_step": 639013, "epoch": 7698} {"train_loss": -27.982126235961914, "global_step": 639014, "epoch": 7698} {"train_loss": -28.284149169921875, "global_step": 639015, "epoch": 7698} {"train_loss": -27.387851278465913, "global_step": 639016, "epoch": 7698, "val_loss": 6710668.5} {"train_loss": -26.636804580688477, "global_step": 639017, "epoch": 7699} {"train_loss": -27.018268585205078, "global_step": 639018, "epoch": 7699} {"train_loss": -27.542245864868164, "global_step": 639019, "epoch": 7699} {"train_loss": -27.761371612548828, "global_step": 639020, "epoch": 7699} {"train_loss": -27.485382080078125, "global_step": 639021, "epoch": 7699} {"train_loss": -27.658355712890625, "global_step": 639022, "epoch": 7699} {"train_loss": -27.502424240112305, "global_step": 639023, "epoch": 7699} {"train_loss": -27.6915225982666, "global_step": 639024, "epoch": 7699} {"train_loss": -27.72760009765625, "global_step": 639025, "epoch": 7699} {"train_loss": -27.90509033203125, "global_step": 639026, "epoch": 7699} {"train_loss": -27.535253524780273, "global_step": 639027, "epoch": 7699} {"train_loss": -28.14352798461914, "global_step": 639028, "epoch": 7699} {"train_loss": -27.776357650756836, "global_step": 639029, "epoch": 7699} {"train_loss": -27.8167781829834, "global_step": 639030, "epoch": 7699} {"train_loss": -28.21082878112793, "global_step": 639031, "epoch": 7699} {"train_loss": -28.174936294555664, "global_step": 639032, "epoch": 7699} {"train_loss": -28.058673858642578, "global_step": 639033, "epoch": 7699} {"train_loss": -28.03334617614746, "global_step": 639034, "epoch": 7699} {"train_loss": -28.094541549682617, "global_step": 639035, "epoch": 7699} {"train_loss": -28.135517120361328, "global_step": 639036, "epoch": 7699} {"train_loss": -28.204206466674805, "global_step": 639037, "epoch": 7699} {"train_loss": -28.023244857788086, "global_step": 639038, "epoch": 7699} {"train_loss": -28.47010612487793, "global_step": 639039, "epoch": 7699} {"train_loss": -28.688751220703125, "global_step": 639040, "epoch": 7699} {"train_loss": -27.821340560913086, "global_step": 639041, "epoch": 7699} {"train_loss": -27.953235626220703, "global_step": 639042, "epoch": 7699} {"train_loss": -28.08867835998535, "global_step": 639043, "epoch": 7699} {"train_loss": -28.229110717773438, "global_step": 639044, "epoch": 7699} {"train_loss": -28.2380428314209, "global_step": 639045, "epoch": 7699} {"train_loss": -28.287561416625977, "global_step": 639046, "epoch": 7699} {"train_loss": -28.21552848815918, "global_step": 639047, "epoch": 7699} {"train_loss": -28.25184440612793, "global_step": 639048, "epoch": 7699} {"train_loss": -28.15646743774414, "global_step": 639049, "epoch": 7699} {"train_loss": -28.443777084350586, "global_step": 639050, "epoch": 7699} {"train_loss": -28.1923770904541, "global_step": 639051, "epoch": 7699} {"train_loss": -28.184812545776367, "global_step": 639052, "epoch": 7699} {"train_loss": -28.227008819580078, "global_step": 639053, "epoch": 7699} {"train_loss": -28.446292877197266, "global_step": 639054, "epoch": 7699} {"train_loss": -28.211227416992188, "global_step": 639055, "epoch": 7699} {"train_loss": -28.4891357421875, "global_step": 639056, "epoch": 7699} {"train_loss": -28.17548179626465, "global_step": 639057, "epoch": 7699} {"train_loss": -28.18873405456543, "global_step": 639058, "epoch": 7699} {"train_loss": -28.450647354125977, "global_step": 639059, "epoch": 7699} {"train_loss": -28.351415634155273, "global_step": 639060, "epoch": 7699} {"train_loss": -28.22507667541504, "global_step": 639061, "epoch": 7699} {"train_loss": -28.200902938842773, "global_step": 639062, "epoch": 7699} {"train_loss": -28.220651626586914, "global_step": 639063, "epoch": 7699} {"train_loss": -28.365243911743164, "global_step": 639064, "epoch": 7699} {"train_loss": -28.32636833190918, "global_step": 639065, "epoch": 7699} {"train_loss": -28.385263442993164, "global_step": 639066, "epoch": 7699} {"train_loss": -28.290088653564453, "global_step": 639067, "epoch": 7699} {"train_loss": -28.554763793945312, "global_step": 639068, "epoch": 7699} {"train_loss": -28.408329010009766, "global_step": 639069, "epoch": 7699} {"train_loss": -27.86492919921875, "global_step": 639070, "epoch": 7699} {"train_loss": -28.432785034179688, "global_step": 639071, "epoch": 7699} {"train_loss": -28.386520385742188, "global_step": 639072, "epoch": 7699} {"train_loss": -28.552892684936523, "global_step": 639073, "epoch": 7699} {"train_loss": -28.474201202392578, "global_step": 639074, "epoch": 7699} {"train_loss": -28.553281784057617, "global_step": 639075, "epoch": 7699} {"train_loss": -28.343311309814453, "global_step": 639076, "epoch": 7699} {"train_loss": -28.1430721282959, "global_step": 639077, "epoch": 7699} {"train_loss": -28.43086814880371, "global_step": 639078, "epoch": 7699} {"train_loss": -28.191665649414062, "global_step": 639079, "epoch": 7699} {"train_loss": -27.825531005859375, "global_step": 639080, "epoch": 7699} {"train_loss": -25.87070655822754, "global_step": 639081, "epoch": 7699} {"train_loss": -21.788772583007812, "global_step": 639082, "epoch": 7699} {"train_loss": -24.0828800201416, "global_step": 639083, "epoch": 7699} {"train_loss": -27.825769424438477, "global_step": 639084, "epoch": 7699} {"train_loss": -25.16731071472168, "global_step": 639085, "epoch": 7699} {"train_loss": -27.158964157104492, "global_step": 639086, "epoch": 7699} {"train_loss": -27.057729721069336, "global_step": 639087, "epoch": 7699} {"train_loss": -26.755420684814453, "global_step": 639088, "epoch": 7699} {"train_loss": -27.750186920166016, "global_step": 639089, "epoch": 7699} {"train_loss": -27.491296768188477, "global_step": 639090, "epoch": 7699} {"train_loss": -27.503131866455078, "global_step": 639091, "epoch": 7699} {"train_loss": -27.804187774658203, "global_step": 639092, "epoch": 7699} {"train_loss": -27.77847671508789, "global_step": 639093, "epoch": 7699} {"train_loss": -27.64313316345215, "global_step": 639094, "epoch": 7699} {"train_loss": -27.646459579467773, "global_step": 639095, "epoch": 7699} {"train_loss": -28.017850875854492, "global_step": 639096, "epoch": 7699} {"train_loss": -28.279027938842773, "global_step": 639097, "epoch": 7699} {"train_loss": -28.0611515045166, "global_step": 639098, "epoch": 7699} {"train_loss": -27.848208232098315, "global_step": 639099, "epoch": 7699, "val_loss": 6619401.5} {"train_loss": -27.0710391998291, "global_step": 639100, "epoch": 7700} {"train_loss": -26.945234298706055, "global_step": 639101, "epoch": 7700} {"train_loss": -27.151660919189453, "global_step": 639102, "epoch": 7700} {"train_loss": -27.3048095703125, "global_step": 639103, "epoch": 7700} {"train_loss": -27.072479248046875, "global_step": 639104, "epoch": 7700} {"train_loss": -27.43140983581543, "global_step": 639105, "epoch": 7700} {"train_loss": -26.92388916015625, "global_step": 639106, "epoch": 7700} {"train_loss": -27.31418800354004, "global_step": 639107, "epoch": 7700} {"train_loss": -27.2488956451416, "global_step": 639108, "epoch": 7700} {"train_loss": -27.692285537719727, "global_step": 639109, "epoch": 7700} {"train_loss": -27.1264591217041, "global_step": 639110, "epoch": 7700} {"train_loss": -27.599634170532227, "global_step": 639111, "epoch": 7700} {"train_loss": -27.936237335205078, "global_step": 639112, "epoch": 7700} {"train_loss": -27.89519691467285, "global_step": 639113, "epoch": 7700} {"train_loss": -27.739486694335938, "global_step": 639114, "epoch": 7700} {"train_loss": -27.81537437438965, "global_step": 639115, "epoch": 7700} {"train_loss": -27.956695556640625, "global_step": 639116, "epoch": 7700} {"train_loss": -27.923171997070312, "global_step": 639117, "epoch": 7700} {"train_loss": -27.5734806060791, "global_step": 639118, "epoch": 7700} {"train_loss": -27.42333984375, "global_step": 639119, "epoch": 7700} {"train_loss": -27.68059730529785, "global_step": 639120, "epoch": 7700} {"train_loss": -27.865575790405273, "global_step": 639121, "epoch": 7700} {"train_loss": -27.882139205932617, "global_step": 639122, "epoch": 7700} {"train_loss": -27.827869415283203, "global_step": 639123, "epoch": 7700} {"train_loss": -28.322162628173828, "global_step": 639124, "epoch": 7700} {"train_loss": -28.018341064453125, "global_step": 639125, "epoch": 7700} {"train_loss": -27.464340209960938, "global_step": 639126, "epoch": 7700} {"train_loss": -27.978607177734375, "global_step": 639127, "epoch": 7700} {"train_loss": -27.626331329345703, "global_step": 639128, "epoch": 7700} {"train_loss": -27.72926902770996, "global_step": 639129, "epoch": 7700} {"train_loss": -28.141782760620117, "global_step": 639130, "epoch": 7700} {"train_loss": -28.135168075561523, "global_step": 639131, "epoch": 7700} {"train_loss": -28.51630973815918, "global_step": 639132, "epoch": 7700} {"train_loss": -28.330015182495117, "global_step": 639133, "epoch": 7700} {"train_loss": -27.9074764251709, "global_step": 639134, "epoch": 7700} {"train_loss": -28.226865768432617, "global_step": 639135, "epoch": 7700} {"train_loss": -28.026859283447266, "global_step": 639136, "epoch": 7700} {"train_loss": -28.126327514648438, "global_step": 639137, "epoch": 7700} {"train_loss": -28.117374420166016, "global_step": 639138, "epoch": 7700} {"train_loss": -27.996479034423828, "global_step": 639139, "epoch": 7700} {"train_loss": -28.123523712158203, "global_step": 639140, "epoch": 7700} {"train_loss": -28.16650390625, "global_step": 639141, "epoch": 7700} {"train_loss": -28.386804580688477, "global_step": 639142, "epoch": 7700} {"train_loss": -28.41282081604004, "global_step": 639143, "epoch": 7700} {"train_loss": -28.263696670532227, "global_step": 639144, "epoch": 7700} {"train_loss": -28.133056640625, "global_step": 639145, "epoch": 7700} {"train_loss": -28.339859008789062, "global_step": 639146, "epoch": 7700} {"train_loss": -27.870954513549805, "global_step": 639147, "epoch": 7700} {"train_loss": -28.13556480407715, "global_step": 639148, "epoch": 7700} {"train_loss": -27.98141860961914, "global_step": 639149, "epoch": 7700} {"train_loss": -27.78263282775879, "global_step": 639150, "epoch": 7700} {"train_loss": -27.7489070892334, "global_step": 639151, "epoch": 7700} {"train_loss": -28.112478256225586, "global_step": 639152, "epoch": 7700} {"train_loss": -27.88580894470215, "global_step": 639153, "epoch": 7700} {"train_loss": -28.163610458374023, "global_step": 639154, "epoch": 7700} {"train_loss": -27.461734771728516, "global_step": 639155, "epoch": 7700} {"train_loss": -28.356678009033203, "global_step": 639156, "epoch": 7700} {"train_loss": -28.2159481048584, "global_step": 639157, "epoch": 7700} {"train_loss": -27.711328506469727, "global_step": 639158, "epoch": 7700} {"train_loss": -28.314258575439453, "global_step": 639159, "epoch": 7700} {"train_loss": -28.021991729736328, "global_step": 639160, "epoch": 7700} {"train_loss": -27.954519271850586, "global_step": 639161, "epoch": 7700} {"train_loss": -28.094533920288086, "global_step": 639162, "epoch": 7700} {"train_loss": -28.00214958190918, "global_step": 639163, "epoch": 7700} {"train_loss": -28.228235244750977, "global_step": 639164, "epoch": 7700} {"train_loss": -27.915332794189453, "global_step": 639165, "epoch": 7700} {"train_loss": -28.21189308166504, "global_step": 639166, "epoch": 7700} {"train_loss": -27.866565704345703, "global_step": 639167, "epoch": 7700} {"train_loss": -28.040616989135742, "global_step": 639168, "epoch": 7700} {"train_loss": -28.266035079956055, "global_step": 639169, "epoch": 7700} {"train_loss": -28.1267147064209, "global_step": 639170, "epoch": 7700} {"train_loss": -28.175668716430664, "global_step": 639171, "epoch": 7700} {"train_loss": -27.585485458374023, "global_step": 639172, "epoch": 7700} {"train_loss": -28.008167266845703, "global_step": 639173, "epoch": 7700} {"train_loss": -28.319961547851562, "global_step": 639174, "epoch": 7700} {"train_loss": -28.134048461914062, "global_step": 639175, "epoch": 7700} {"train_loss": -27.94806480407715, "global_step": 639176, "epoch": 7700} {"train_loss": -27.705602645874023, "global_step": 639177, "epoch": 7700} {"train_loss": -28.025171279907227, "global_step": 639178, "epoch": 7700} {"train_loss": -28.315235137939453, "global_step": 639179, "epoch": 7700} {"train_loss": -27.799880981445312, "global_step": 639180, "epoch": 7700} {"train_loss": -28.156702041625977, "global_step": 639181, "epoch": 7700} {"train_loss": -27.900214551443078, "global_step": 639182, "epoch": 7700, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.7727272727272727, "val_loss": 6613586.0} {"train_loss": -27.133405685424805, "global_step": 639183, "epoch": 7701} {"train_loss": -27.48347282409668, "global_step": 639184, "epoch": 7701} {"train_loss": -27.675445556640625, "global_step": 639185, "epoch": 7701} {"train_loss": -27.565845489501953, "global_step": 639186, "epoch": 7701} {"train_loss": -27.426721572875977, "global_step": 639187, "epoch": 7701} {"train_loss": -27.863508224487305, "global_step": 639188, "epoch": 7701} {"train_loss": -27.035547256469727, "global_step": 639189, "epoch": 7701} {"train_loss": -27.43067741394043, "global_step": 639190, "epoch": 7701} {"train_loss": -27.965652465820312, "global_step": 639191, "epoch": 7701} {"train_loss": -27.47015380859375, "global_step": 639192, "epoch": 7701} {"train_loss": -27.7305850982666, "global_step": 639193, "epoch": 7701} {"train_loss": -27.5163516998291, "global_step": 639194, "epoch": 7701} {"train_loss": -28.044158935546875, "global_step": 639195, "epoch": 7701} {"train_loss": -27.442535400390625, "global_step": 639196, "epoch": 7701} {"train_loss": -28.375045776367188, "global_step": 639197, "epoch": 7701} {"train_loss": -27.909809112548828, "global_step": 639198, "epoch": 7701} {"train_loss": -27.93739891052246, "global_step": 639199, "epoch": 7701} {"train_loss": -27.61793327331543, "global_step": 639200, "epoch": 7701} {"train_loss": -27.758594512939453, "global_step": 639201, "epoch": 7701} {"train_loss": -27.699207305908203, "global_step": 639202, "epoch": 7701} {"train_loss": -27.82046890258789, "global_step": 639203, "epoch": 7701} {"train_loss": -27.74030113220215, "global_step": 639204, "epoch": 7701} {"train_loss": -28.11065673828125, "global_step": 639205, "epoch": 7701} {"train_loss": -28.004316329956055, "global_step": 639206, "epoch": 7701} {"train_loss": -28.38298988342285, "global_step": 639207, "epoch": 7701} {"train_loss": -28.303586959838867, "global_step": 639208, "epoch": 7701} {"train_loss": -28.267179489135742, "global_step": 639209, "epoch": 7701} {"train_loss": -28.091360092163086, "global_step": 639210, "epoch": 7701} {"train_loss": -28.347686767578125, "global_step": 639211, "epoch": 7701} {"train_loss": -28.21009635925293, "global_step": 639212, "epoch": 7701} {"train_loss": -28.3916015625, "global_step": 639213, "epoch": 7701} {"train_loss": -28.329504013061523, "global_step": 639214, "epoch": 7701} {"train_loss": -28.17166519165039, "global_step": 639215, "epoch": 7701} {"train_loss": -28.516653060913086, "global_step": 639216, "epoch": 7701} {"train_loss": -28.226530075073242, "global_step": 639217, "epoch": 7701} {"train_loss": -28.4300479888916, "global_step": 639218, "epoch": 7701} {"train_loss": -28.42608642578125, "global_step": 639219, "epoch": 7701} {"train_loss": -28.228851318359375, "global_step": 639220, "epoch": 7701} {"train_loss": -28.591552734375, "global_step": 639221, "epoch": 7701} {"train_loss": -28.517810821533203, "global_step": 639222, "epoch": 7701} {"train_loss": -28.64686393737793, "global_step": 639223, "epoch": 7701} {"train_loss": -28.382612228393555, "global_step": 639224, "epoch": 7701} {"train_loss": -28.174041748046875, "global_step": 639225, "epoch": 7701} {"train_loss": -28.242544174194336, "global_step": 639226, "epoch": 7701} {"train_loss": -28.601306915283203, "global_step": 639227, "epoch": 7701} {"train_loss": -28.716644287109375, "global_step": 639228, "epoch": 7701} {"train_loss": -28.58062171936035, "global_step": 639229, "epoch": 7701} {"train_loss": -28.405853271484375, "global_step": 639230, "epoch": 7701} {"train_loss": -28.58831787109375, "global_step": 639231, "epoch": 7701} {"train_loss": -28.2946720123291, "global_step": 639232, "epoch": 7701} {"train_loss": -28.444610595703125, "global_step": 639233, "epoch": 7701} {"train_loss": -28.264514923095703, "global_step": 639234, "epoch": 7701} {"train_loss": -28.6282958984375, "global_step": 639235, "epoch": 7701} {"train_loss": -28.91489601135254, "global_step": 639236, "epoch": 7701} {"train_loss": -28.2709903717041, "global_step": 639237, "epoch": 7701} {"train_loss": -28.33209228515625, "global_step": 639238, "epoch": 7701} {"train_loss": -28.198043823242188, "global_step": 639239, "epoch": 7701} {"train_loss": -28.60394859313965, "global_step": 639240, "epoch": 7701} {"train_loss": -28.375186920166016, "global_step": 639241, "epoch": 7701} {"train_loss": -28.7779483795166, "global_step": 639242, "epoch": 7701} {"train_loss": -28.408802032470703, "global_step": 639243, "epoch": 7701} {"train_loss": -28.846525192260742, "global_step": 639244, "epoch": 7701} {"train_loss": -28.925739288330078, "global_step": 639245, "epoch": 7701} {"train_loss": -28.548690795898438, "global_step": 639246, "epoch": 7701} {"train_loss": -28.2044734954834, "global_step": 639247, "epoch": 7701} {"train_loss": -28.410968780517578, "global_step": 639248, "epoch": 7701} {"train_loss": -28.2873592376709, "global_step": 639249, "epoch": 7701} {"train_loss": -27.557783126831055, "global_step": 639250, "epoch": 7701} {"train_loss": -27.2816219329834, "global_step": 639251, "epoch": 7701} {"train_loss": -26.370553970336914, "global_step": 639252, "epoch": 7701} {"train_loss": -26.030776977539062, "global_step": 639253, "epoch": 7701} {"train_loss": -27.062870025634766, "global_step": 639254, "epoch": 7701} {"train_loss": -28.07415771484375, "global_step": 639255, "epoch": 7701} {"train_loss": -27.125654220581055, "global_step": 639256, "epoch": 7701} {"train_loss": -27.710296630859375, "global_step": 639257, "epoch": 7701} {"train_loss": -27.672109603881836, "global_step": 639258, "epoch": 7701} {"train_loss": -27.92303466796875, "global_step": 639259, "epoch": 7701} {"train_loss": -28.088550567626953, "global_step": 639260, "epoch": 7701} {"train_loss": -28.24749183654785, "global_step": 639261, "epoch": 7701} {"train_loss": -27.74114990234375, "global_step": 639262, "epoch": 7701} {"train_loss": -28.016895294189453, "global_step": 639263, "epoch": 7701} {"train_loss": -27.928709030151367, "global_step": 639264, "epoch": 7701} {"train_loss": -28.02645338587014, "global_step": 639265, "epoch": 7701, "val_loss": 6685092.0} {"train_loss": -27.609912872314453, "global_step": 639266, "epoch": 7702} {"train_loss": -27.655027389526367, "global_step": 639267, "epoch": 7702} {"train_loss": -27.854928970336914, "global_step": 639268, "epoch": 7702} {"train_loss": -27.40850830078125, "global_step": 639269, "epoch": 7702} {"train_loss": -27.628772735595703, "global_step": 639270, "epoch": 7702} {"train_loss": -27.58441734313965, "global_step": 639271, "epoch": 7702} {"train_loss": -27.942337036132812, "global_step": 639272, "epoch": 7702} {"train_loss": -27.855390548706055, "global_step": 639273, "epoch": 7702} {"train_loss": -27.97065544128418, "global_step": 639274, "epoch": 7702} {"train_loss": -28.027734756469727, "global_step": 639275, "epoch": 7702} {"train_loss": -27.862180709838867, "global_step": 639276, "epoch": 7702} {"train_loss": -28.011682510375977, "global_step": 639277, "epoch": 7702} {"train_loss": -28.11944580078125, "global_step": 639278, "epoch": 7702} {"train_loss": -28.00009536743164, "global_step": 639279, "epoch": 7702} {"train_loss": -28.42353630065918, "global_step": 639280, "epoch": 7702} {"train_loss": -27.82451820373535, "global_step": 639281, "epoch": 7702} {"train_loss": -27.690509796142578, "global_step": 639282, "epoch": 7702} {"train_loss": -28.24818229675293, "global_step": 639283, "epoch": 7702} {"train_loss": -27.86842155456543, "global_step": 639284, "epoch": 7702} {"train_loss": -27.855749130249023, "global_step": 639285, "epoch": 7702} {"train_loss": -28.241296768188477, "global_step": 639286, "epoch": 7702} {"train_loss": -28.38409996032715, "global_step": 639287, "epoch": 7702} {"train_loss": -28.19463539123535, "global_step": 639288, "epoch": 7702} {"train_loss": -28.352827072143555, "global_step": 639289, "epoch": 7702} {"train_loss": -28.198476791381836, "global_step": 639290, "epoch": 7702} {"train_loss": -28.320556640625, "global_step": 639291, "epoch": 7702} {"train_loss": -28.148099899291992, "global_step": 639292, "epoch": 7702} {"train_loss": -28.21026039123535, "global_step": 639293, "epoch": 7702} {"train_loss": -28.381567001342773, "global_step": 639294, "epoch": 7702} {"train_loss": -28.31406021118164, "global_step": 639295, "epoch": 7702} {"train_loss": -28.173734664916992, "global_step": 639296, "epoch": 7702} {"train_loss": -28.567291259765625, "global_step": 639297, "epoch": 7702} {"train_loss": -28.22092628479004, "global_step": 639298, "epoch": 7702} {"train_loss": -28.01715087890625, "global_step": 639299, "epoch": 7702} {"train_loss": -28.37713050842285, "global_step": 639300, "epoch": 7702} {"train_loss": -28.321577072143555, "global_step": 639301, "epoch": 7702} {"train_loss": -28.297733306884766, "global_step": 639302, "epoch": 7702} {"train_loss": -28.6010799407959, "global_step": 639303, "epoch": 7702} {"train_loss": -28.16633415222168, "global_step": 639304, "epoch": 7702} {"train_loss": -28.33466911315918, "global_step": 639305, "epoch": 7702} {"train_loss": -28.489511489868164, "global_step": 639306, "epoch": 7702} {"train_loss": -28.4312801361084, "global_step": 639307, "epoch": 7702} {"train_loss": -28.497772216796875, "global_step": 639308, "epoch": 7702} {"train_loss": -28.45086097717285, "global_step": 639309, "epoch": 7702} {"train_loss": -28.289941787719727, "global_step": 639310, "epoch": 7702} {"train_loss": -28.427087783813477, "global_step": 639311, "epoch": 7702} {"train_loss": -28.4173583984375, "global_step": 639312, "epoch": 7702} {"train_loss": -28.514745712280273, "global_step": 639313, "epoch": 7702} {"train_loss": -28.328765869140625, "global_step": 639314, "epoch": 7702} {"train_loss": -28.552886962890625, "global_step": 639315, "epoch": 7702} {"train_loss": -28.582883834838867, "global_step": 639316, "epoch": 7702} {"train_loss": -28.0653133392334, "global_step": 639317, "epoch": 7702} {"train_loss": -28.05573844909668, "global_step": 639318, "epoch": 7702} {"train_loss": -28.30449867248535, "global_step": 639319, "epoch": 7702} {"train_loss": -28.752267837524414, "global_step": 639320, "epoch": 7702} {"train_loss": -28.460111618041992, "global_step": 639321, "epoch": 7702} {"train_loss": -28.348682403564453, "global_step": 639322, "epoch": 7702} {"train_loss": -28.409961700439453, "global_step": 639323, "epoch": 7702} {"train_loss": -28.2889404296875, "global_step": 639324, "epoch": 7702} {"train_loss": -28.390928268432617, "global_step": 639325, "epoch": 7702} {"train_loss": -28.418304443359375, "global_step": 639326, "epoch": 7702} {"train_loss": -28.32581901550293, "global_step": 639327, "epoch": 7702} {"train_loss": -28.510053634643555, "global_step": 639328, "epoch": 7702} {"train_loss": -28.493667602539062, "global_step": 639329, "epoch": 7702} {"train_loss": -28.516925811767578, "global_step": 639330, "epoch": 7702} {"train_loss": -28.88035011291504, "global_step": 639331, "epoch": 7702} {"train_loss": -28.724079132080078, "global_step": 639332, "epoch": 7702} {"train_loss": -28.34027671813965, "global_step": 639333, "epoch": 7702} {"train_loss": -28.371265411376953, "global_step": 639334, "epoch": 7702} {"train_loss": -28.563690185546875, "global_step": 639335, "epoch": 7702} {"train_loss": -28.436975479125977, "global_step": 639336, "epoch": 7702} {"train_loss": -28.141244888305664, "global_step": 639337, "epoch": 7702} {"train_loss": -28.603504180908203, "global_step": 639338, "epoch": 7702} {"train_loss": -28.338459014892578, "global_step": 639339, "epoch": 7702} {"train_loss": -28.379545211791992, "global_step": 639340, "epoch": 7702} {"train_loss": -28.6157169342041, "global_step": 639341, "epoch": 7702} {"train_loss": -27.905466079711914, "global_step": 639342, "epoch": 7702} {"train_loss": -28.223041534423828, "global_step": 639343, "epoch": 7702} {"train_loss": -28.141210556030273, "global_step": 639344, "epoch": 7702} {"train_loss": -28.027759552001953, "global_step": 639345, "epoch": 7702} {"train_loss": -28.749475479125977, "global_step": 639346, "epoch": 7702} {"train_loss": -28.127145767211914, "global_step": 639347, "epoch": 7702} {"train_loss": -28.235689370028943, "global_step": 639348, "epoch": 7702, "val_loss": 6734253.0} {"train_loss": -25.421598434448242, "global_step": 639349, "epoch": 7703} {"train_loss": -23.33866310119629, "global_step": 639350, "epoch": 7703} {"train_loss": -26.022382736206055, "global_step": 639351, "epoch": 7703} {"train_loss": -26.169879913330078, "global_step": 639352, "epoch": 7703} {"train_loss": -26.649768829345703, "global_step": 639353, "epoch": 7703} {"train_loss": -25.767038345336914, "global_step": 639354, "epoch": 7703} {"train_loss": -26.92343521118164, "global_step": 639355, "epoch": 7703} {"train_loss": -26.70990562438965, "global_step": 639356, "epoch": 7703} {"train_loss": -27.37986183166504, "global_step": 639357, "epoch": 7703} {"train_loss": -26.620010375976562, "global_step": 639358, "epoch": 7703} {"train_loss": -27.361963272094727, "global_step": 639359, "epoch": 7703} {"train_loss": -27.370147705078125, "global_step": 639360, "epoch": 7703} {"train_loss": -26.90896987915039, "global_step": 639361, "epoch": 7703} {"train_loss": -27.338897705078125, "global_step": 639362, "epoch": 7703} {"train_loss": -27.593738555908203, "global_step": 639363, "epoch": 7703} {"train_loss": -27.588367462158203, "global_step": 639364, "epoch": 7703} {"train_loss": -27.832273483276367, "global_step": 639365, "epoch": 7703} {"train_loss": -27.537689208984375, "global_step": 639366, "epoch": 7703} {"train_loss": -28.006519317626953, "global_step": 639367, "epoch": 7703} {"train_loss": -28.000701904296875, "global_step": 639368, "epoch": 7703} {"train_loss": -27.9636287689209, "global_step": 639369, "epoch": 7703} {"train_loss": -27.47285270690918, "global_step": 639370, "epoch": 7703} {"train_loss": -27.93943214416504, "global_step": 639371, "epoch": 7703} {"train_loss": -27.981870651245117, "global_step": 639372, "epoch": 7703} {"train_loss": -27.553632736206055, "global_step": 639373, "epoch": 7703} {"train_loss": -27.500497817993164, "global_step": 639374, "epoch": 7703} {"train_loss": -27.778425216674805, "global_step": 639375, "epoch": 7703} {"train_loss": -27.980579376220703, "global_step": 639376, "epoch": 7703} {"train_loss": -28.260360717773438, "global_step": 639377, "epoch": 7703} {"train_loss": -28.044361114501953, "global_step": 639378, "epoch": 7703} {"train_loss": -28.281204223632812, "global_step": 639379, "epoch": 7703} {"train_loss": -27.61199378967285, "global_step": 639380, "epoch": 7703} {"train_loss": -28.090972900390625, "global_step": 639381, "epoch": 7703} {"train_loss": -28.26685905456543, "global_step": 639382, "epoch": 7703} {"train_loss": -28.389245986938477, "global_step": 639383, "epoch": 7703} {"train_loss": -28.461362838745117, "global_step": 639384, "epoch": 7703} {"train_loss": -28.165258407592773, "global_step": 639385, "epoch": 7703} {"train_loss": -28.49039077758789, "global_step": 639386, "epoch": 7703} {"train_loss": -27.79987907409668, "global_step": 639387, "epoch": 7703} {"train_loss": -28.13909339904785, "global_step": 639388, "epoch": 7703} {"train_loss": -28.0657958984375, "global_step": 639389, "epoch": 7703} {"train_loss": -28.552350997924805, "global_step": 639390, "epoch": 7703} {"train_loss": -28.099597930908203, "global_step": 639391, "epoch": 7703} {"train_loss": -28.41156578063965, "global_step": 639392, "epoch": 7703} {"train_loss": -28.030792236328125, "global_step": 639393, "epoch": 7703} {"train_loss": -28.16885757446289, "global_step": 639394, "epoch": 7703} {"train_loss": -28.23406410217285, "global_step": 639395, "epoch": 7703} {"train_loss": -28.15924072265625, "global_step": 639396, "epoch": 7703} {"train_loss": -28.165876388549805, "global_step": 639397, "epoch": 7703} {"train_loss": -28.417043685913086, "global_step": 639398, "epoch": 7703} {"train_loss": -28.219736099243164, "global_step": 639399, "epoch": 7703} {"train_loss": -28.05417251586914, "global_step": 639400, "epoch": 7703} {"train_loss": -27.876142501831055, "global_step": 639401, "epoch": 7703} {"train_loss": -28.235864639282227, "global_step": 639402, "epoch": 7703} {"train_loss": -28.2890567779541, "global_step": 639403, "epoch": 7703} {"train_loss": -28.461902618408203, "global_step": 639404, "epoch": 7703} {"train_loss": -28.696063995361328, "global_step": 639405, "epoch": 7703} {"train_loss": -28.313114166259766, "global_step": 639406, "epoch": 7703} {"train_loss": -27.900196075439453, "global_step": 639407, "epoch": 7703} {"train_loss": -28.372955322265625, "global_step": 639408, "epoch": 7703} {"train_loss": -28.40691566467285, "global_step": 639409, "epoch": 7703} {"train_loss": -28.468595504760742, "global_step": 639410, "epoch": 7703} {"train_loss": -28.240589141845703, "global_step": 639411, "epoch": 7703} {"train_loss": -28.04664421081543, "global_step": 639412, "epoch": 7703} {"train_loss": -28.296539306640625, "global_step": 639413, "epoch": 7703} {"train_loss": -28.215368270874023, "global_step": 639414, "epoch": 7703} {"train_loss": -28.2401065826416, "global_step": 639415, "epoch": 7703} {"train_loss": -28.366455078125, "global_step": 639416, "epoch": 7703} {"train_loss": -28.32899284362793, "global_step": 639417, "epoch": 7703} {"train_loss": -28.179061889648438, "global_step": 639418, "epoch": 7703} {"train_loss": -28.587814331054688, "global_step": 639419, "epoch": 7703} {"train_loss": -28.474552154541016, "global_step": 639420, "epoch": 7703} {"train_loss": -28.376270294189453, "global_step": 639421, "epoch": 7703} {"train_loss": -28.811965942382812, "global_step": 639422, "epoch": 7703} {"train_loss": -28.417272567749023, "global_step": 639423, "epoch": 7703} {"train_loss": -28.6784725189209, "global_step": 639424, "epoch": 7703} {"train_loss": -28.639673233032227, "global_step": 639425, "epoch": 7703} {"train_loss": -28.617395401000977, "global_step": 639426, "epoch": 7703} {"train_loss": -28.6365966796875, "global_step": 639427, "epoch": 7703} {"train_loss": -28.26204490661621, "global_step": 639428, "epoch": 7703} {"train_loss": -28.469465255737305, "global_step": 639429, "epoch": 7703} {"train_loss": -27.963672637939453, "global_step": 639430, "epoch": 7703} {"train_loss": -27.874069328767707, "global_step": 639431, "epoch": 7703, "val_loss": 6856271.0} {"train_loss": -26.30857276916504, "global_step": 639432, "epoch": 7704} {"train_loss": -24.942188262939453, "global_step": 639433, "epoch": 7704} {"train_loss": -26.44736099243164, "global_step": 639434, "epoch": 7704} {"train_loss": -27.512500762939453, "global_step": 639435, "epoch": 7704} {"train_loss": -25.886938095092773, "global_step": 639436, "epoch": 7704} {"train_loss": -27.396778106689453, "global_step": 639437, "epoch": 7704} {"train_loss": -26.273101806640625, "global_step": 639438, "epoch": 7704} {"train_loss": -27.478071212768555, "global_step": 639439, "epoch": 7704} {"train_loss": -26.65772819519043, "global_step": 639440, "epoch": 7704} {"train_loss": -27.677637100219727, "global_step": 639441, "epoch": 7704} {"train_loss": -27.07866859436035, "global_step": 639442, "epoch": 7704} {"train_loss": -27.375320434570312, "global_step": 639443, "epoch": 7704} {"train_loss": -27.791669845581055, "global_step": 639444, "epoch": 7704} {"train_loss": -27.601987838745117, "global_step": 639445, "epoch": 7704} {"train_loss": -27.918411254882812, "global_step": 639446, "epoch": 7704} {"train_loss": -27.54813003540039, "global_step": 639447, "epoch": 7704} {"train_loss": -27.06180191040039, "global_step": 639448, "epoch": 7704} {"train_loss": -27.461328506469727, "global_step": 639449, "epoch": 7704} {"train_loss": -27.714757919311523, "global_step": 639450, "epoch": 7704} {"train_loss": -28.267322540283203, "global_step": 639451, "epoch": 7704} {"train_loss": -27.934484481811523, "global_step": 639452, "epoch": 7704} {"train_loss": -28.0484561920166, "global_step": 639453, "epoch": 7704} {"train_loss": -28.04558753967285, "global_step": 639454, "epoch": 7704} {"train_loss": -27.744775772094727, "global_step": 639455, "epoch": 7704} {"train_loss": -27.752552032470703, "global_step": 639456, "epoch": 7704} {"train_loss": -27.814422607421875, "global_step": 639457, "epoch": 7704} {"train_loss": -28.025074005126953, "global_step": 639458, "epoch": 7704} {"train_loss": -28.383243560791016, "global_step": 639459, "epoch": 7704} {"train_loss": -28.009124755859375, "global_step": 639460, "epoch": 7704} {"train_loss": -27.897565841674805, "global_step": 639461, "epoch": 7704} {"train_loss": -28.1411075592041, "global_step": 639462, "epoch": 7704} {"train_loss": -27.944379806518555, "global_step": 639463, "epoch": 7704} {"train_loss": -27.937238693237305, "global_step": 639464, "epoch": 7704} {"train_loss": -28.353103637695312, "global_step": 639465, "epoch": 7704} {"train_loss": -28.107654571533203, "global_step": 639466, "epoch": 7704} {"train_loss": -28.061737060546875, "global_step": 639467, "epoch": 7704} {"train_loss": -27.99871253967285, "global_step": 639468, "epoch": 7704} {"train_loss": -28.180374145507812, "global_step": 639469, "epoch": 7704} {"train_loss": -28.07500648498535, "global_step": 639470, "epoch": 7704} {"train_loss": -27.95904541015625, "global_step": 639471, "epoch": 7704} {"train_loss": -27.93463134765625, "global_step": 639472, "epoch": 7704} {"train_loss": -27.97413444519043, "global_step": 639473, "epoch": 7704} {"train_loss": -28.28242301940918, "global_step": 639474, "epoch": 7704} {"train_loss": -28.29385757446289, "global_step": 639475, "epoch": 7704} {"train_loss": -27.98797607421875, "global_step": 639476, "epoch": 7704} {"train_loss": -28.06589126586914, "global_step": 639477, "epoch": 7704} {"train_loss": -27.769872665405273, "global_step": 639478, "epoch": 7704} {"train_loss": -28.06549072265625, "global_step": 639479, "epoch": 7704} {"train_loss": -28.408430099487305, "global_step": 639480, "epoch": 7704} {"train_loss": -27.83249282836914, "global_step": 639481, "epoch": 7704} {"train_loss": -27.72675132751465, "global_step": 639482, "epoch": 7704} {"train_loss": -27.96978759765625, "global_step": 639483, "epoch": 7704} {"train_loss": -28.27434730529785, "global_step": 639484, "epoch": 7704} {"train_loss": -28.360523223876953, "global_step": 639485, "epoch": 7704} {"train_loss": -28.3335018157959, "global_step": 639486, "epoch": 7704} {"train_loss": -27.918970108032227, "global_step": 639487, "epoch": 7704} {"train_loss": -27.971481323242188, "global_step": 639488, "epoch": 7704} {"train_loss": -28.3660945892334, "global_step": 639489, "epoch": 7704} {"train_loss": -27.91944694519043, "global_step": 639490, "epoch": 7704} {"train_loss": -27.975309371948242, "global_step": 639491, "epoch": 7704} {"train_loss": -28.470849990844727, "global_step": 639492, "epoch": 7704} {"train_loss": -27.8624267578125, "global_step": 639493, "epoch": 7704} {"train_loss": -28.204320907592773, "global_step": 639494, "epoch": 7704} {"train_loss": -27.904821395874023, "global_step": 639495, "epoch": 7704} {"train_loss": -28.408788681030273, "global_step": 639496, "epoch": 7704} {"train_loss": -28.003732681274414, "global_step": 639497, "epoch": 7704} {"train_loss": -28.21319580078125, "global_step": 639498, "epoch": 7704} {"train_loss": -28.32392692565918, "global_step": 639499, "epoch": 7704} {"train_loss": -28.27205467224121, "global_step": 639500, "epoch": 7704} {"train_loss": -28.00666618347168, "global_step": 639501, "epoch": 7704} {"train_loss": -28.075637817382812, "global_step": 639502, "epoch": 7704} {"train_loss": -28.453540802001953, "global_step": 639503, "epoch": 7704} {"train_loss": -28.256738662719727, "global_step": 639504, "epoch": 7704} {"train_loss": -27.975666046142578, "global_step": 639505, "epoch": 7704} {"train_loss": -28.688512802124023, "global_step": 639506, "epoch": 7704} {"train_loss": -28.262067794799805, "global_step": 639507, "epoch": 7704} {"train_loss": -28.521575927734375, "global_step": 639508, "epoch": 7704} {"train_loss": -28.2713565826416, "global_step": 639509, "epoch": 7704} {"train_loss": -28.23589515686035, "global_step": 639510, "epoch": 7704} {"train_loss": -28.343976974487305, "global_step": 639511, "epoch": 7704} {"train_loss": -28.402862548828125, "global_step": 639512, "epoch": 7704} {"train_loss": -28.65888786315918, "global_step": 639513, "epoch": 7704} {"train_loss": -27.891313391995716, "global_step": 639514, "epoch": 7704, "val_loss": 6732751.0} {"train_loss": -27.504379272460938, "global_step": 639515, "epoch": 7705} {"train_loss": -27.922006607055664, "global_step": 639516, "epoch": 7705} {"train_loss": -27.20318603515625, "global_step": 639517, "epoch": 7705} {"train_loss": -27.4252986907959, "global_step": 639518, "epoch": 7705} {"train_loss": -27.368000030517578, "global_step": 639519, "epoch": 7705} {"train_loss": -27.846027374267578, "global_step": 639520, "epoch": 7705} {"train_loss": -27.33696937561035, "global_step": 639521, "epoch": 7705} {"train_loss": -27.63254737854004, "global_step": 639522, "epoch": 7705} {"train_loss": -27.769088745117188, "global_step": 639523, "epoch": 7705} {"train_loss": -27.291553497314453, "global_step": 639524, "epoch": 7705} {"train_loss": -27.684310913085938, "global_step": 639525, "epoch": 7705} {"train_loss": -27.32137107849121, "global_step": 639526, "epoch": 7705} {"train_loss": -27.86586570739746, "global_step": 639527, "epoch": 7705} {"train_loss": -28.035924911499023, "global_step": 639528, "epoch": 7705} {"train_loss": -28.031980514526367, "global_step": 639529, "epoch": 7705} {"train_loss": -27.964303970336914, "global_step": 639530, "epoch": 7705} {"train_loss": -27.78156089782715, "global_step": 639531, "epoch": 7705} {"train_loss": -27.611169815063477, "global_step": 639532, "epoch": 7705} {"train_loss": -28.002700805664062, "global_step": 639533, "epoch": 7705} {"train_loss": -28.420679092407227, "global_step": 639534, "epoch": 7705} {"train_loss": -28.201797485351562, "global_step": 639535, "epoch": 7705} {"train_loss": -28.287841796875, "global_step": 639536, "epoch": 7705} {"train_loss": -28.019079208374023, "global_step": 639537, "epoch": 7705} {"train_loss": -28.29962158203125, "global_step": 639538, "epoch": 7705} {"train_loss": -28.16300392150879, "global_step": 639539, "epoch": 7705} {"train_loss": -27.852323532104492, "global_step": 639540, "epoch": 7705} {"train_loss": -27.967620849609375, "global_step": 639541, "epoch": 7705} {"train_loss": -28.030080795288086, "global_step": 639542, "epoch": 7705} {"train_loss": -28.12295913696289, "global_step": 639543, "epoch": 7705} {"train_loss": -28.15964126586914, "global_step": 639544, "epoch": 7705} {"train_loss": -28.378498077392578, "global_step": 639545, "epoch": 7705} {"train_loss": -28.652099609375, "global_step": 639546, "epoch": 7705} {"train_loss": -28.259424209594727, "global_step": 639547, "epoch": 7705} {"train_loss": -28.477264404296875, "global_step": 639548, "epoch": 7705} {"train_loss": -28.3303165435791, "global_step": 639549, "epoch": 7705} {"train_loss": -28.291950225830078, "global_step": 639550, "epoch": 7705} {"train_loss": -28.404800415039062, "global_step": 639551, "epoch": 7705} {"train_loss": -28.323896408081055, "global_step": 639552, "epoch": 7705} {"train_loss": -28.213224411010742, "global_step": 639553, "epoch": 7705} {"train_loss": -28.634244918823242, "global_step": 639554, "epoch": 7705} {"train_loss": -28.39385414123535, "global_step": 639555, "epoch": 7705} {"train_loss": -28.53358268737793, "global_step": 639556, "epoch": 7705} {"train_loss": -28.30130386352539, "global_step": 639557, "epoch": 7705} {"train_loss": -28.558637619018555, "global_step": 639558, "epoch": 7705} {"train_loss": -28.549726486206055, "global_step": 639559, "epoch": 7705} {"train_loss": -28.128448486328125, "global_step": 639560, "epoch": 7705} {"train_loss": -28.672870635986328, "global_step": 639561, "epoch": 7705} {"train_loss": -28.679183959960938, "global_step": 639562, "epoch": 7705} {"train_loss": -28.472675323486328, "global_step": 639563, "epoch": 7705} {"train_loss": -28.8330020904541, "global_step": 639564, "epoch": 7705} {"train_loss": -28.5761661529541, "global_step": 639565, "epoch": 7705} {"train_loss": -28.467960357666016, "global_step": 639566, "epoch": 7705} {"train_loss": -28.625158309936523, "global_step": 639567, "epoch": 7705} {"train_loss": -28.447595596313477, "global_step": 639568, "epoch": 7705} {"train_loss": -28.508386611938477, "global_step": 639569, "epoch": 7705} {"train_loss": -28.265796661376953, "global_step": 639570, "epoch": 7705} {"train_loss": -28.599096298217773, "global_step": 639571, "epoch": 7705} {"train_loss": -28.535419464111328, "global_step": 639572, "epoch": 7705} {"train_loss": -28.067975997924805, "global_step": 639573, "epoch": 7705} {"train_loss": -28.433950424194336, "global_step": 639574, "epoch": 7705} {"train_loss": -28.2425479888916, "global_step": 639575, "epoch": 7705} {"train_loss": -28.132810592651367, "global_step": 639576, "epoch": 7705} {"train_loss": -28.279386520385742, "global_step": 639577, "epoch": 7705} {"train_loss": -28.176416397094727, "global_step": 639578, "epoch": 7705} {"train_loss": -28.390628814697266, "global_step": 639579, "epoch": 7705} {"train_loss": -27.5236759185791, "global_step": 639580, "epoch": 7705} {"train_loss": -28.17267417907715, "global_step": 639581, "epoch": 7705} {"train_loss": -28.34003257751465, "global_step": 639582, "epoch": 7705} {"train_loss": -27.890045166015625, "global_step": 639583, "epoch": 7705} {"train_loss": -28.074865341186523, "global_step": 639584, "epoch": 7705} {"train_loss": -27.8358211517334, "global_step": 639585, "epoch": 7705} {"train_loss": -28.31879234313965, "global_step": 639586, "epoch": 7705} {"train_loss": -28.224210739135742, "global_step": 639587, "epoch": 7705} {"train_loss": -28.185028076171875, "global_step": 639588, "epoch": 7705} {"train_loss": -27.628833770751953, "global_step": 639589, "epoch": 7705} {"train_loss": -27.968311309814453, "global_step": 639590, "epoch": 7705} {"train_loss": -28.286178588867188, "global_step": 639591, "epoch": 7705} {"train_loss": -27.71195411682129, "global_step": 639592, "epoch": 7705} {"train_loss": -28.168212890625, "global_step": 639593, "epoch": 7705} {"train_loss": -28.338306427001953, "global_step": 639594, "epoch": 7705} {"train_loss": -27.858972549438477, "global_step": 639595, "epoch": 7705} {"train_loss": -27.259801864624023, "global_step": 639596, "epoch": 7705} {"train_loss": -28.11284878742264, "global_step": 639597, "epoch": 7705, "val_loss": 6636880.0} {"train_loss": -27.350866317749023, "global_step": 639598, "epoch": 7706} {"train_loss": -27.42245864868164, "global_step": 639599, "epoch": 7706} {"train_loss": -26.99347496032715, "global_step": 639600, "epoch": 7706} {"train_loss": -26.881113052368164, "global_step": 639601, "epoch": 7706} {"train_loss": -27.35725212097168, "global_step": 639602, "epoch": 7706} {"train_loss": -27.80059814453125, "global_step": 639603, "epoch": 7706} {"train_loss": -27.404743194580078, "global_step": 639604, "epoch": 7706} {"train_loss": -27.477157592773438, "global_step": 639605, "epoch": 7706} {"train_loss": -27.462818145751953, "global_step": 639606, "epoch": 7706} {"train_loss": -27.467350006103516, "global_step": 639607, "epoch": 7706} {"train_loss": -27.60255241394043, "global_step": 639608, "epoch": 7706} {"train_loss": -27.199934005737305, "global_step": 639609, "epoch": 7706} {"train_loss": -27.62213706970215, "global_step": 639610, "epoch": 7706} {"train_loss": -27.415491104125977, "global_step": 639611, "epoch": 7706} {"train_loss": -27.477222442626953, "global_step": 639612, "epoch": 7706} {"train_loss": -27.647857666015625, "global_step": 639613, "epoch": 7706} {"train_loss": -27.67254638671875, "global_step": 639614, "epoch": 7706} {"train_loss": -28.050601959228516, "global_step": 639615, "epoch": 7706} {"train_loss": -27.51255226135254, "global_step": 639616, "epoch": 7706} {"train_loss": -27.8436279296875, "global_step": 639617, "epoch": 7706} {"train_loss": -27.80557632446289, "global_step": 639618, "epoch": 7706} {"train_loss": -27.933618545532227, "global_step": 639619, "epoch": 7706} {"train_loss": -27.759998321533203, "global_step": 639620, "epoch": 7706} {"train_loss": -28.071203231811523, "global_step": 639621, "epoch": 7706} {"train_loss": -28.413755416870117, "global_step": 639622, "epoch": 7706} {"train_loss": -27.4434871673584, "global_step": 639623, "epoch": 7706} {"train_loss": -27.779754638671875, "global_step": 639624, "epoch": 7706} {"train_loss": -28.200531005859375, "global_step": 639625, "epoch": 7706} {"train_loss": -28.07132911682129, "global_step": 639626, "epoch": 7706} {"train_loss": -27.78415870666504, "global_step": 639627, "epoch": 7706} {"train_loss": -28.25507926940918, "global_step": 639628, "epoch": 7706} {"train_loss": -27.867069244384766, "global_step": 639629, "epoch": 7706} {"train_loss": -28.41546058654785, "global_step": 639630, "epoch": 7706} {"train_loss": -28.1423397064209, "global_step": 639631, "epoch": 7706} {"train_loss": -28.194000244140625, "global_step": 639632, "epoch": 7706} {"train_loss": -28.309757232666016, "global_step": 639633, "epoch": 7706} {"train_loss": -28.06134605407715, "global_step": 639634, "epoch": 7706} {"train_loss": -28.531280517578125, "global_step": 639635, "epoch": 7706} {"train_loss": -28.089391708374023, "global_step": 639636, "epoch": 7706} {"train_loss": -28.26527214050293, "global_step": 639637, "epoch": 7706} {"train_loss": -28.3714656829834, "global_step": 639638, "epoch": 7706} {"train_loss": -27.9879207611084, "global_step": 639639, "epoch": 7706} {"train_loss": -28.151098251342773, "global_step": 639640, "epoch": 7706} {"train_loss": -28.339981079101562, "global_step": 639641, "epoch": 7706} {"train_loss": -28.0054874420166, "global_step": 639642, "epoch": 7706} {"train_loss": -28.14130973815918, "global_step": 639643, "epoch": 7706} {"train_loss": -28.188077926635742, "global_step": 639644, "epoch": 7706} {"train_loss": -28.540958404541016, "global_step": 639645, "epoch": 7706} {"train_loss": -28.72321128845215, "global_step": 639646, "epoch": 7706} {"train_loss": -28.248266220092773, "global_step": 639647, "epoch": 7706} {"train_loss": -28.37537956237793, "global_step": 639648, "epoch": 7706} {"train_loss": -28.06805992126465, "global_step": 639649, "epoch": 7706} {"train_loss": -28.645456314086914, "global_step": 639650, "epoch": 7706} {"train_loss": -28.21943473815918, "global_step": 639651, "epoch": 7706} {"train_loss": -28.622228622436523, "global_step": 639652, "epoch": 7706} {"train_loss": -28.234830856323242, "global_step": 639653, "epoch": 7706} {"train_loss": -28.38437271118164, "global_step": 639654, "epoch": 7706} {"train_loss": -28.51970863342285, "global_step": 639655, "epoch": 7706} {"train_loss": -28.49859046936035, "global_step": 639656, "epoch": 7706} {"train_loss": -28.4711856842041, "global_step": 639657, "epoch": 7706} {"train_loss": -28.355178833007812, "global_step": 639658, "epoch": 7706} {"train_loss": -28.656295776367188, "global_step": 639659, "epoch": 7706} {"train_loss": -28.5407772064209, "global_step": 639660, "epoch": 7706} {"train_loss": -28.312332153320312, "global_step": 639661, "epoch": 7706} {"train_loss": -28.348630905151367, "global_step": 639662, "epoch": 7706} {"train_loss": -28.295440673828125, "global_step": 639663, "epoch": 7706} {"train_loss": -28.377470016479492, "global_step": 639664, "epoch": 7706} {"train_loss": -28.9644832611084, "global_step": 639665, "epoch": 7706} {"train_loss": -28.548023223876953, "global_step": 639666, "epoch": 7706} {"train_loss": -28.5496768951416, "global_step": 639667, "epoch": 7706} {"train_loss": -28.29851722717285, "global_step": 639668, "epoch": 7706} {"train_loss": -28.270221710205078, "global_step": 639669, "epoch": 7706} {"train_loss": -28.83992576599121, "global_step": 639670, "epoch": 7706} {"train_loss": -28.15113639831543, "global_step": 639671, "epoch": 7706} {"train_loss": -28.301837921142578, "global_step": 639672, "epoch": 7706} {"train_loss": -28.08266258239746, "global_step": 639673, "epoch": 7706} {"train_loss": -27.9771728515625, "global_step": 639674, "epoch": 7706} {"train_loss": -28.74212646484375, "global_step": 639675, "epoch": 7706} {"train_loss": -28.005834579467773, "global_step": 639676, "epoch": 7706} {"train_loss": -27.908954620361328, "global_step": 639677, "epoch": 7706} {"train_loss": -28.281742095947266, "global_step": 639678, "epoch": 7706} {"train_loss": -27.984790802001953, "global_step": 639679, "epoch": 7706} {"train_loss": -28.087916155895556, "global_step": 639680, "epoch": 7706, "val_loss": 6854556.0} {"train_loss": -25.666034698486328, "global_step": 639681, "epoch": 7707} {"train_loss": -21.51642608642578, "global_step": 639682, "epoch": 7707} {"train_loss": -17.609968185424805, "global_step": 639683, "epoch": 7707} {"train_loss": -22.900930404663086, "global_step": 639684, "epoch": 7707} {"train_loss": -26.082366943359375, "global_step": 639685, "epoch": 7707} {"train_loss": -24.597232818603516, "global_step": 639686, "epoch": 7707} {"train_loss": -25.572010040283203, "global_step": 639687, "epoch": 7707} {"train_loss": -26.48858070373535, "global_step": 639688, "epoch": 7707} {"train_loss": -25.71148681640625, "global_step": 639689, "epoch": 7707} {"train_loss": -26.213476181030273, "global_step": 639690, "epoch": 7707} {"train_loss": -27.27685546875, "global_step": 639691, "epoch": 7707} {"train_loss": -26.3685359954834, "global_step": 639692, "epoch": 7707} {"train_loss": -26.662229537963867, "global_step": 639693, "epoch": 7707} {"train_loss": -26.77825355529785, "global_step": 639694, "epoch": 7707} {"train_loss": -27.01386833190918, "global_step": 639695, "epoch": 7707} {"train_loss": -26.7012996673584, "global_step": 639696, "epoch": 7707} {"train_loss": -26.98297691345215, "global_step": 639697, "epoch": 7707} {"train_loss": -26.916919708251953, "global_step": 639698, "epoch": 7707} {"train_loss": -27.320051193237305, "global_step": 639699, "epoch": 7707} {"train_loss": -27.311599731445312, "global_step": 639700, "epoch": 7707} {"train_loss": -27.2336483001709, "global_step": 639701, "epoch": 7707} {"train_loss": -27.40535545349121, "global_step": 639702, "epoch": 7707} {"train_loss": -27.313196182250977, "global_step": 639703, "epoch": 7707} {"train_loss": -27.21311378479004, "global_step": 639704, "epoch": 7707} {"train_loss": -27.196002960205078, "global_step": 639705, "epoch": 7707} {"train_loss": -27.16116714477539, "global_step": 639706, "epoch": 7707} {"train_loss": -27.178939819335938, "global_step": 639707, "epoch": 7707} {"train_loss": -27.476987838745117, "global_step": 639708, "epoch": 7707} {"train_loss": -27.46270179748535, "global_step": 639709, "epoch": 7707} {"train_loss": -27.636438369750977, "global_step": 639710, "epoch": 7707} {"train_loss": -27.284564971923828, "global_step": 639711, "epoch": 7707} {"train_loss": -27.47576904296875, "global_step": 639712, "epoch": 7707} {"train_loss": -27.494726181030273, "global_step": 639713, "epoch": 7707} {"train_loss": -28.032461166381836, "global_step": 639714, "epoch": 7707} {"train_loss": -27.868894577026367, "global_step": 639715, "epoch": 7707} {"train_loss": -27.335981369018555, "global_step": 639716, "epoch": 7707} {"train_loss": -27.71135902404785, "global_step": 639717, "epoch": 7707} {"train_loss": -27.30910301208496, "global_step": 639718, "epoch": 7707} {"train_loss": -27.78315544128418, "global_step": 639719, "epoch": 7707} {"train_loss": -27.75347328186035, "global_step": 639720, "epoch": 7707} {"train_loss": -27.789112091064453, "global_step": 639721, "epoch": 7707} {"train_loss": -28.16242790222168, "global_step": 639722, "epoch": 7707} {"train_loss": -28.0606689453125, "global_step": 639723, "epoch": 7707} {"train_loss": -28.036115646362305, "global_step": 639724, "epoch": 7707} {"train_loss": -27.727466583251953, "global_step": 639725, "epoch": 7707} {"train_loss": -28.093793869018555, "global_step": 639726, "epoch": 7707} {"train_loss": -28.49555015563965, "global_step": 639727, "epoch": 7707} {"train_loss": -28.253345489501953, "global_step": 639728, "epoch": 7707} {"train_loss": -28.08746337890625, "global_step": 639729, "epoch": 7707} {"train_loss": -28.13877296447754, "global_step": 639730, "epoch": 7707} {"train_loss": -28.21290397644043, "global_step": 639731, "epoch": 7707} {"train_loss": -28.251535415649414, "global_step": 639732, "epoch": 7707} {"train_loss": -28.178131103515625, "global_step": 639733, "epoch": 7707} {"train_loss": -28.003759384155273, "global_step": 639734, "epoch": 7707} {"train_loss": -28.152542114257812, "global_step": 639735, "epoch": 7707} {"train_loss": -28.043216705322266, "global_step": 639736, "epoch": 7707} {"train_loss": -28.261693954467773, "global_step": 639737, "epoch": 7707} {"train_loss": -27.82905387878418, "global_step": 639738, "epoch": 7707} {"train_loss": -28.401081085205078, "global_step": 639739, "epoch": 7707} {"train_loss": -28.372446060180664, "global_step": 639740, "epoch": 7707} {"train_loss": -27.954816818237305, "global_step": 639741, "epoch": 7707} {"train_loss": -28.295059204101562, "global_step": 639742, "epoch": 7707} {"train_loss": -28.054718017578125, "global_step": 639743, "epoch": 7707} {"train_loss": -27.685129165649414, "global_step": 639744, "epoch": 7707} {"train_loss": -28.194738388061523, "global_step": 639745, "epoch": 7707} {"train_loss": -28.171497344970703, "global_step": 639746, "epoch": 7707} {"train_loss": -28.043384552001953, "global_step": 639747, "epoch": 7707} {"train_loss": -28.59988784790039, "global_step": 639748, "epoch": 7707} {"train_loss": -28.053791046142578, "global_step": 639749, "epoch": 7707} {"train_loss": -28.0460262298584, "global_step": 639750, "epoch": 7707} {"train_loss": -28.203582763671875, "global_step": 639751, "epoch": 7707} {"train_loss": -28.006488800048828, "global_step": 639752, "epoch": 7707} {"train_loss": -28.42755699157715, "global_step": 639753, "epoch": 7707} {"train_loss": -28.228979110717773, "global_step": 639754, "epoch": 7707} {"train_loss": -28.417306900024414, "global_step": 639755, "epoch": 7707} {"train_loss": -28.253992080688477, "global_step": 639756, "epoch": 7707} {"train_loss": -28.225622177124023, "global_step": 639757, "epoch": 7707} {"train_loss": -27.969831466674805, "global_step": 639758, "epoch": 7707} {"train_loss": -28.3956241607666, "global_step": 639759, "epoch": 7707} {"train_loss": -28.398290634155273, "global_step": 639760, "epoch": 7707} {"train_loss": -28.29096031188965, "global_step": 639761, "epoch": 7707} {"train_loss": -28.481861114501953, "global_step": 639762, "epoch": 7707} {"train_loss": -27.381616362606188, "global_step": 639763, "epoch": 7707, "val_loss": 6889243.0} {"train_loss": -27.464874267578125, "global_step": 639764, "epoch": 7708} {"train_loss": -26.380956649780273, "global_step": 639765, "epoch": 7708} {"train_loss": -25.696069717407227, "global_step": 639766, "epoch": 7708} {"train_loss": -27.097782135009766, "global_step": 639767, "epoch": 7708} {"train_loss": -26.96160316467285, "global_step": 639768, "epoch": 7708} {"train_loss": -26.25274658203125, "global_step": 639769, "epoch": 7708} {"train_loss": -25.97309684753418, "global_step": 639770, "epoch": 7708} {"train_loss": -26.403223037719727, "global_step": 639771, "epoch": 7708} {"train_loss": -27.465429306030273, "global_step": 639772, "epoch": 7708} {"train_loss": -26.532001495361328, "global_step": 639773, "epoch": 7708} {"train_loss": -25.175989151000977, "global_step": 639774, "epoch": 7708} {"train_loss": -27.629117965698242, "global_step": 639775, "epoch": 7708} {"train_loss": -25.760034561157227, "global_step": 639776, "epoch": 7708} {"train_loss": -27.6884708404541, "global_step": 639777, "epoch": 7708} {"train_loss": -26.585407257080078, "global_step": 639778, "epoch": 7708} {"train_loss": -27.825281143188477, "global_step": 639779, "epoch": 7708} {"train_loss": -26.917165756225586, "global_step": 639780, "epoch": 7708} {"train_loss": -27.03268814086914, "global_step": 639781, "epoch": 7708} {"train_loss": -27.375442504882812, "global_step": 639782, "epoch": 7708} {"train_loss": -27.11488914489746, "global_step": 639783, "epoch": 7708} {"train_loss": -27.479084014892578, "global_step": 639784, "epoch": 7708} {"train_loss": -27.59189796447754, "global_step": 639785, "epoch": 7708} {"train_loss": -27.438262939453125, "global_step": 639786, "epoch": 7708} {"train_loss": -27.196842193603516, "global_step": 639787, "epoch": 7708} {"train_loss": -27.772863388061523, "global_step": 639788, "epoch": 7708} {"train_loss": -27.571298599243164, "global_step": 639789, "epoch": 7708} {"train_loss": -27.791473388671875, "global_step": 639790, "epoch": 7708} {"train_loss": -27.673542022705078, "global_step": 639791, "epoch": 7708} {"train_loss": -27.814380645751953, "global_step": 639792, "epoch": 7708} {"train_loss": -27.526416778564453, "global_step": 639793, "epoch": 7708} {"train_loss": -27.622934341430664, "global_step": 639794, "epoch": 7708} {"train_loss": -27.757314682006836, "global_step": 639795, "epoch": 7708} {"train_loss": -27.901782989501953, "global_step": 639796, "epoch": 7708} {"train_loss": -27.67673110961914, "global_step": 639797, "epoch": 7708} {"train_loss": -27.90488624572754, "global_step": 639798, "epoch": 7708} {"train_loss": -28.08089256286621, "global_step": 639799, "epoch": 7708} {"train_loss": -28.021276473999023, "global_step": 639800, "epoch": 7708} {"train_loss": -28.123737335205078, "global_step": 639801, "epoch": 7708} {"train_loss": -27.6560001373291, "global_step": 639802, "epoch": 7708} {"train_loss": -27.847492218017578, "global_step": 639803, "epoch": 7708} {"train_loss": -28.195051193237305, "global_step": 639804, "epoch": 7708} {"train_loss": -27.85309410095215, "global_step": 639805, "epoch": 7708} {"train_loss": -28.038043975830078, "global_step": 639806, "epoch": 7708} {"train_loss": -28.069690704345703, "global_step": 639807, "epoch": 7708} {"train_loss": -27.84321403503418, "global_step": 639808, "epoch": 7708} {"train_loss": -28.4217529296875, "global_step": 639809, "epoch": 7708} {"train_loss": -27.98524284362793, "global_step": 639810, "epoch": 7708} {"train_loss": -27.7855167388916, "global_step": 639811, "epoch": 7708} {"train_loss": -28.039514541625977, "global_step": 639812, "epoch": 7708} {"train_loss": -28.38181495666504, "global_step": 639813, "epoch": 7708} {"train_loss": -27.796802520751953, "global_step": 639814, "epoch": 7708} {"train_loss": -28.258214950561523, "global_step": 639815, "epoch": 7708} {"train_loss": -28.04755210876465, "global_step": 639816, "epoch": 7708} {"train_loss": -28.1214599609375, "global_step": 639817, "epoch": 7708} {"train_loss": -28.246585845947266, "global_step": 639818, "epoch": 7708} {"train_loss": -28.35243034362793, "global_step": 639819, "epoch": 7708} {"train_loss": -28.4766788482666, "global_step": 639820, "epoch": 7708} {"train_loss": -28.1483097076416, "global_step": 639821, "epoch": 7708} {"train_loss": -27.81355094909668, "global_step": 639822, "epoch": 7708} {"train_loss": -28.45318031311035, "global_step": 639823, "epoch": 7708} {"train_loss": -28.358367919921875, "global_step": 639824, "epoch": 7708} {"train_loss": -28.38650894165039, "global_step": 639825, "epoch": 7708} {"train_loss": -28.30718421936035, "global_step": 639826, "epoch": 7708} {"train_loss": -28.125207901000977, "global_step": 639827, "epoch": 7708} {"train_loss": -28.470853805541992, "global_step": 639828, "epoch": 7708} {"train_loss": -28.001935958862305, "global_step": 639829, "epoch": 7708} {"train_loss": -28.479001998901367, "global_step": 639830, "epoch": 7708} {"train_loss": -28.14340591430664, "global_step": 639831, "epoch": 7708} {"train_loss": -28.241254806518555, "global_step": 639832, "epoch": 7708} {"train_loss": -28.591455459594727, "global_step": 639833, "epoch": 7708} {"train_loss": -28.189416885375977, "global_step": 639834, "epoch": 7708} {"train_loss": -27.66914176940918, "global_step": 639835, "epoch": 7708} {"train_loss": -27.47251319885254, "global_step": 639836, "epoch": 7708} {"train_loss": -26.96710205078125, "global_step": 639837, "epoch": 7708} {"train_loss": -27.189157485961914, "global_step": 639838, "epoch": 7708} {"train_loss": -28.196155548095703, "global_step": 639839, "epoch": 7708} {"train_loss": -28.2437801361084, "global_step": 639840, "epoch": 7708} {"train_loss": -27.649555206298828, "global_step": 639841, "epoch": 7708} {"train_loss": -27.71784019470215, "global_step": 639842, "epoch": 7708} {"train_loss": -28.386524200439453, "global_step": 639843, "epoch": 7708} {"train_loss": -27.552719116210938, "global_step": 639844, "epoch": 7708} {"train_loss": -28.28269386291504, "global_step": 639845, "epoch": 7708} {"train_loss": -27.67439513608634, "global_step": 639846, "epoch": 7708, "val_loss": 6928982.0} {"train_loss": -27.848834991455078, "global_step": 639847, "epoch": 7709} {"train_loss": -27.637435913085938, "global_step": 639848, "epoch": 7709} {"train_loss": -27.72553825378418, "global_step": 639849, "epoch": 7709} {"train_loss": -27.709375381469727, "global_step": 639850, "epoch": 7709} {"train_loss": -28.31849479675293, "global_step": 639851, "epoch": 7709} {"train_loss": -27.607187271118164, "global_step": 639852, "epoch": 7709} {"train_loss": -27.59677505493164, "global_step": 639853, "epoch": 7709} {"train_loss": -27.6013240814209, "global_step": 639854, "epoch": 7709} {"train_loss": -28.29224967956543, "global_step": 639855, "epoch": 7709} {"train_loss": -27.785207748413086, "global_step": 639856, "epoch": 7709} {"train_loss": -28.593008041381836, "global_step": 639857, "epoch": 7709} {"train_loss": -28.12642478942871, "global_step": 639858, "epoch": 7709} {"train_loss": -28.346363067626953, "global_step": 639859, "epoch": 7709} {"train_loss": -28.128442764282227, "global_step": 639860, "epoch": 7709} {"train_loss": -28.29216957092285, "global_step": 639861, "epoch": 7709} {"train_loss": -28.047754287719727, "global_step": 639862, "epoch": 7709} {"train_loss": -28.40044593811035, "global_step": 639863, "epoch": 7709} {"train_loss": -28.3756160736084, "global_step": 639864, "epoch": 7709} {"train_loss": -28.305450439453125, "global_step": 639865, "epoch": 7709} {"train_loss": -28.23126792907715, "global_step": 639866, "epoch": 7709} {"train_loss": -28.2906551361084, "global_step": 639867, "epoch": 7709} {"train_loss": -28.385568618774414, "global_step": 639868, "epoch": 7709} {"train_loss": -28.377838134765625, "global_step": 639869, "epoch": 7709} {"train_loss": -28.772470474243164, "global_step": 639870, "epoch": 7709} {"train_loss": -28.33902931213379, "global_step": 639871, "epoch": 7709} {"train_loss": -27.994342803955078, "global_step": 639872, "epoch": 7709} {"train_loss": -28.36249351501465, "global_step": 639873, "epoch": 7709} {"train_loss": -28.588342666625977, "global_step": 639874, "epoch": 7709} {"train_loss": -28.182754516601562, "global_step": 639875, "epoch": 7709} {"train_loss": -28.55812644958496, "global_step": 639876, "epoch": 7709} {"train_loss": -28.124425888061523, "global_step": 639877, "epoch": 7709} {"train_loss": -28.763158798217773, "global_step": 639878, "epoch": 7709} {"train_loss": -28.395788192749023, "global_step": 639879, "epoch": 7709} {"train_loss": -28.695301055908203, "global_step": 639880, "epoch": 7709} {"train_loss": -28.322980880737305, "global_step": 639881, "epoch": 7709} {"train_loss": -28.101776123046875, "global_step": 639882, "epoch": 7709} {"train_loss": -28.4992733001709, "global_step": 639883, "epoch": 7709} {"train_loss": -27.89948081970215, "global_step": 639884, "epoch": 7709} {"train_loss": -28.30145835876465, "global_step": 639885, "epoch": 7709} {"train_loss": -28.252429962158203, "global_step": 639886, "epoch": 7709} {"train_loss": -28.26324462890625, "global_step": 639887, "epoch": 7709} {"train_loss": -28.421375274658203, "global_step": 639888, "epoch": 7709} {"train_loss": -28.22614860534668, "global_step": 639889, "epoch": 7709} {"train_loss": -28.039871215820312, "global_step": 639890, "epoch": 7709} {"train_loss": -28.25086784362793, "global_step": 639891, "epoch": 7709} {"train_loss": -28.15778160095215, "global_step": 639892, "epoch": 7709} {"train_loss": -28.31647300720215, "global_step": 639893, "epoch": 7709} {"train_loss": -28.27235221862793, "global_step": 639894, "epoch": 7709} {"train_loss": -28.339094161987305, "global_step": 639895, "epoch": 7709} {"train_loss": -28.520788192749023, "global_step": 639896, "epoch": 7709} {"train_loss": -28.3327579498291, "global_step": 639897, "epoch": 7709} {"train_loss": -27.954730987548828, "global_step": 639898, "epoch": 7709} {"train_loss": -28.330646514892578, "global_step": 639899, "epoch": 7709} {"train_loss": -28.021289825439453, "global_step": 639900, "epoch": 7709} {"train_loss": -28.494611740112305, "global_step": 639901, "epoch": 7709} {"train_loss": -27.878015518188477, "global_step": 639902, "epoch": 7709} {"train_loss": -28.58637046813965, "global_step": 639903, "epoch": 7709} {"train_loss": -28.016386032104492, "global_step": 639904, "epoch": 7709} {"train_loss": -28.03289222717285, "global_step": 639905, "epoch": 7709} {"train_loss": -28.192350387573242, "global_step": 639906, "epoch": 7709} {"train_loss": -28.098194122314453, "global_step": 639907, "epoch": 7709} {"train_loss": -28.538888931274414, "global_step": 639908, "epoch": 7709} {"train_loss": -28.254724502563477, "global_step": 639909, "epoch": 7709} {"train_loss": -28.21369743347168, "global_step": 639910, "epoch": 7709} {"train_loss": -28.090436935424805, "global_step": 639911, "epoch": 7709} {"train_loss": -28.475473403930664, "global_step": 639912, "epoch": 7709} {"train_loss": -28.254369735717773, "global_step": 639913, "epoch": 7709} {"train_loss": -28.181888580322266, "global_step": 639914, "epoch": 7709} {"train_loss": -28.73288917541504, "global_step": 639915, "epoch": 7709} {"train_loss": -28.305246353149414, "global_step": 639916, "epoch": 7709} {"train_loss": -28.533605575561523, "global_step": 639917, "epoch": 7709} {"train_loss": -28.645044326782227, "global_step": 639918, "epoch": 7709} {"train_loss": -28.435632705688477, "global_step": 639919, "epoch": 7709} {"train_loss": -28.38775062561035, "global_step": 639920, "epoch": 7709} {"train_loss": -28.522897720336914, "global_step": 639921, "epoch": 7709} {"train_loss": -28.292383193969727, "global_step": 639922, "epoch": 7709} {"train_loss": -28.361608505249023, "global_step": 639923, "epoch": 7709} {"train_loss": -27.98345947265625, "global_step": 639924, "epoch": 7709} {"train_loss": -28.676366806030273, "global_step": 639925, "epoch": 7709} {"train_loss": -28.39737319946289, "global_step": 639926, "epoch": 7709} {"train_loss": -28.782913208007812, "global_step": 639927, "epoch": 7709} {"train_loss": -28.64264488220215, "global_step": 639928, "epoch": 7709} {"train_loss": -28.261700503797417, "global_step": 639929, "epoch": 7709, "val_loss": 6815260.0} {"train_loss": -27.57496452331543, "global_step": 639930, "epoch": 7710} {"train_loss": -27.962621688842773, "global_step": 639931, "epoch": 7710} {"train_loss": -28.256549835205078, "global_step": 639932, "epoch": 7710} {"train_loss": -28.091466903686523, "global_step": 639933, "epoch": 7710} {"train_loss": -27.966089248657227, "global_step": 639934, "epoch": 7710} {"train_loss": -27.979822158813477, "global_step": 639935, "epoch": 7710} {"train_loss": -27.786474227905273, "global_step": 639936, "epoch": 7710} {"train_loss": -28.14217185974121, "global_step": 639937, "epoch": 7710} {"train_loss": -28.41705894470215, "global_step": 639938, "epoch": 7710} {"train_loss": -28.071807861328125, "global_step": 639939, "epoch": 7710} {"train_loss": -27.913410186767578, "global_step": 639940, "epoch": 7710} {"train_loss": -27.85480308532715, "global_step": 639941, "epoch": 7710} {"train_loss": -27.766077041625977, "global_step": 639942, "epoch": 7710} {"train_loss": -27.879810333251953, "global_step": 639943, "epoch": 7710} {"train_loss": -27.52813720703125, "global_step": 639944, "epoch": 7710} {"train_loss": -27.734960556030273, "global_step": 639945, "epoch": 7710} {"train_loss": -27.961923599243164, "global_step": 639946, "epoch": 7710} {"train_loss": -28.13425636291504, "global_step": 639947, "epoch": 7710} {"train_loss": -28.060155868530273, "global_step": 639948, "epoch": 7710} {"train_loss": -28.30439567565918, "global_step": 639949, "epoch": 7710} {"train_loss": -28.17498779296875, "global_step": 639950, "epoch": 7710} {"train_loss": -28.31699562072754, "global_step": 639951, "epoch": 7710} {"train_loss": -28.617151260375977, "global_step": 639952, "epoch": 7710} {"train_loss": -28.166479110717773, "global_step": 639953, "epoch": 7710} {"train_loss": -27.835742950439453, "global_step": 639954, "epoch": 7710} {"train_loss": -28.1761531829834, "global_step": 639955, "epoch": 7710} {"train_loss": -28.60550880432129, "global_step": 639956, "epoch": 7710} {"train_loss": -28.135473251342773, "global_step": 639957, "epoch": 7710} {"train_loss": -28.37900161743164, "global_step": 639958, "epoch": 7710} {"train_loss": -28.14918327331543, "global_step": 639959, "epoch": 7710} {"train_loss": -28.217788696289062, "global_step": 639960, "epoch": 7710} {"train_loss": -28.226608276367188, "global_step": 639961, "epoch": 7710} {"train_loss": -28.225500106811523, "global_step": 639962, "epoch": 7710} {"train_loss": -27.96222496032715, "global_step": 639963, "epoch": 7710} {"train_loss": -28.1511173248291, "global_step": 639964, "epoch": 7710} {"train_loss": -28.329641342163086, "global_step": 639965, "epoch": 7710} {"train_loss": -28.441669464111328, "global_step": 639966, "epoch": 7710} {"train_loss": -28.611719131469727, "global_step": 639967, "epoch": 7710} {"train_loss": -27.81586265563965, "global_step": 639968, "epoch": 7710} {"train_loss": -28.49311637878418, "global_step": 639969, "epoch": 7710} {"train_loss": -28.180683135986328, "global_step": 639970, "epoch": 7710} {"train_loss": -28.49241065979004, "global_step": 639971, "epoch": 7710} {"train_loss": -28.290546417236328, "global_step": 639972, "epoch": 7710} {"train_loss": -28.25031852722168, "global_step": 639973, "epoch": 7710} {"train_loss": -28.572553634643555, "global_step": 639974, "epoch": 7710} {"train_loss": -28.50860023498535, "global_step": 639975, "epoch": 7710} {"train_loss": -28.49470329284668, "global_step": 639976, "epoch": 7710} {"train_loss": -28.45537757873535, "global_step": 639977, "epoch": 7710} {"train_loss": -28.08505630493164, "global_step": 639978, "epoch": 7710} {"train_loss": -28.57919692993164, "global_step": 639979, "epoch": 7710} {"train_loss": -28.23101806640625, "global_step": 639980, "epoch": 7710} {"train_loss": -28.50373649597168, "global_step": 639981, "epoch": 7710} {"train_loss": -28.131223678588867, "global_step": 639982, "epoch": 7710} {"train_loss": -28.280719757080078, "global_step": 639983, "epoch": 7710} {"train_loss": -28.211767196655273, "global_step": 639984, "epoch": 7710} {"train_loss": -28.370407104492188, "global_step": 639985, "epoch": 7710} {"train_loss": -28.764114379882812, "global_step": 639986, "epoch": 7710} {"train_loss": -28.014392852783203, "global_step": 639987, "epoch": 7710} {"train_loss": -28.491018295288086, "global_step": 639988, "epoch": 7710} {"train_loss": -28.6362247467041, "global_step": 639989, "epoch": 7710} {"train_loss": -28.163318634033203, "global_step": 639990, "epoch": 7710} {"train_loss": -28.312957763671875, "global_step": 639991, "epoch": 7710} {"train_loss": -28.025409698486328, "global_step": 639992, "epoch": 7710} {"train_loss": -28.205463409423828, "global_step": 639993, "epoch": 7710} {"train_loss": -28.484088897705078, "global_step": 639994, "epoch": 7710} {"train_loss": -28.609521865844727, "global_step": 639995, "epoch": 7710} {"train_loss": -28.93231773376465, "global_step": 639996, "epoch": 7710} {"train_loss": -28.379806518554688, "global_step": 639997, "epoch": 7710} {"train_loss": -28.532758712768555, "global_step": 639998, "epoch": 7710} {"train_loss": -28.4572696685791, "global_step": 639999, "epoch": 7710} {"train_loss": -28.410419464111328, "global_step": 640000, "epoch": 7710} {"train_loss": -28.31281089782715, "global_step": 640001, "epoch": 7710} {"train_loss": -28.193830490112305, "global_step": 640002, "epoch": 7710} {"train_loss": -28.382476806640625, "global_step": 640003, "epoch": 7710} {"train_loss": -28.242023468017578, "global_step": 640004, "epoch": 7710} {"train_loss": -27.92889976501465, "global_step": 640005, "epoch": 7710} {"train_loss": -28.104236602783203, "global_step": 640006, "epoch": 7710} {"train_loss": -28.448251724243164, "global_step": 640007, "epoch": 7710} {"train_loss": -28.49140739440918, "global_step": 640008, "epoch": 7710} {"train_loss": -28.646589279174805, "global_step": 640009, "epoch": 7710} {"train_loss": -28.055089950561523, "global_step": 640010, "epoch": 7710} {"train_loss": -28.538755416870117, "global_step": 640011, "epoch": 7710} {"train_loss": -28.25217118320695, "global_step": 640012, "epoch": 7710, "val_loss": 6790616.0} {"train_loss": -27.539087295532227, "global_step": 640013, "epoch": 7711} {"train_loss": -26.893518447875977, "global_step": 640014, "epoch": 7711} {"train_loss": -28.11585807800293, "global_step": 640015, "epoch": 7711} {"train_loss": -27.766895294189453, "global_step": 640016, "epoch": 7711} {"train_loss": -27.628131866455078, "global_step": 640017, "epoch": 7711} {"train_loss": -28.04169273376465, "global_step": 640018, "epoch": 7711} {"train_loss": -28.116138458251953, "global_step": 640019, "epoch": 7711} {"train_loss": -27.707508087158203, "global_step": 640020, "epoch": 7711} {"train_loss": -27.977827072143555, "global_step": 640021, "epoch": 7711} {"train_loss": -28.144515991210938, "global_step": 640022, "epoch": 7711} {"train_loss": -27.3922061920166, "global_step": 640023, "epoch": 7711} {"train_loss": -27.751867294311523, "global_step": 640024, "epoch": 7711} {"train_loss": -27.4791259765625, "global_step": 640025, "epoch": 7711} {"train_loss": -27.73553466796875, "global_step": 640026, "epoch": 7711} {"train_loss": -27.931970596313477, "global_step": 640027, "epoch": 7711} {"train_loss": -27.924518585205078, "global_step": 640028, "epoch": 7711} {"train_loss": -27.886213302612305, "global_step": 640029, "epoch": 7711} {"train_loss": -27.648046493530273, "global_step": 640030, "epoch": 7711} {"train_loss": -27.9013671875, "global_step": 640031, "epoch": 7711} {"train_loss": -27.953527450561523, "global_step": 640032, "epoch": 7711} {"train_loss": -28.02436637878418, "global_step": 640033, "epoch": 7711} {"train_loss": -27.769805908203125, "global_step": 640034, "epoch": 7711} {"train_loss": -27.87607192993164, "global_step": 640035, "epoch": 7711} {"train_loss": -28.0267391204834, "global_step": 640036, "epoch": 7711} {"train_loss": -28.166379928588867, "global_step": 640037, "epoch": 7711} {"train_loss": -27.59840965270996, "global_step": 640038, "epoch": 7711} {"train_loss": -27.98878288269043, "global_step": 640039, "epoch": 7711} {"train_loss": -27.80511474609375, "global_step": 640040, "epoch": 7711} {"train_loss": -27.916379928588867, "global_step": 640041, "epoch": 7711} {"train_loss": -28.17927360534668, "global_step": 640042, "epoch": 7711} {"train_loss": -27.90174674987793, "global_step": 640043, "epoch": 7711} {"train_loss": -27.9384822845459, "global_step": 640044, "epoch": 7711} {"train_loss": -28.346820831298828, "global_step": 640045, "epoch": 7711} {"train_loss": -28.49712562561035, "global_step": 640046, "epoch": 7711} {"train_loss": -28.298248291015625, "global_step": 640047, "epoch": 7711} {"train_loss": -28.459522247314453, "global_step": 640048, "epoch": 7711} {"train_loss": -28.211700439453125, "global_step": 640049, "epoch": 7711} {"train_loss": -28.335845947265625, "global_step": 640050, "epoch": 7711} {"train_loss": -28.433624267578125, "global_step": 640051, "epoch": 7711} {"train_loss": -28.15418815612793, "global_step": 640052, "epoch": 7711} {"train_loss": -28.269330978393555, "global_step": 640053, "epoch": 7711} {"train_loss": -28.425756454467773, "global_step": 640054, "epoch": 7711} {"train_loss": -28.190027236938477, "global_step": 640055, "epoch": 7711} {"train_loss": -28.782394409179688, "global_step": 640056, "epoch": 7711} {"train_loss": -28.344980239868164, "global_step": 640057, "epoch": 7711} {"train_loss": -28.65241050720215, "global_step": 640058, "epoch": 7711} {"train_loss": -28.4310359954834, "global_step": 640059, "epoch": 7711} {"train_loss": -28.1099910736084, "global_step": 640060, "epoch": 7711} {"train_loss": -28.29158592224121, "global_step": 640061, "epoch": 7711} {"train_loss": -28.566802978515625, "global_step": 640062, "epoch": 7711} {"train_loss": -28.303861618041992, "global_step": 640063, "epoch": 7711} {"train_loss": -27.88197898864746, "global_step": 640064, "epoch": 7711} {"train_loss": -28.355213165283203, "global_step": 640065, "epoch": 7711} {"train_loss": -28.577375411987305, "global_step": 640066, "epoch": 7711} {"train_loss": -28.520593643188477, "global_step": 640067, "epoch": 7711} {"train_loss": -28.49462890625, "global_step": 640068, "epoch": 7711} {"train_loss": -28.255691528320312, "global_step": 640069, "epoch": 7711} {"train_loss": -28.214441299438477, "global_step": 640070, "epoch": 7711} {"train_loss": -27.74325942993164, "global_step": 640071, "epoch": 7711} {"train_loss": -28.66474723815918, "global_step": 640072, "epoch": 7711} {"train_loss": -28.45587730407715, "global_step": 640073, "epoch": 7711} {"train_loss": -27.9929141998291, "global_step": 640074, "epoch": 7711} {"train_loss": -28.06721305847168, "global_step": 640075, "epoch": 7711} {"train_loss": -28.39129638671875, "global_step": 640076, "epoch": 7711} {"train_loss": -28.647537231445312, "global_step": 640077, "epoch": 7711} {"train_loss": -28.819486618041992, "global_step": 640078, "epoch": 7711} {"train_loss": -28.16552734375, "global_step": 640079, "epoch": 7711} {"train_loss": -28.055988311767578, "global_step": 640080, "epoch": 7711} {"train_loss": -28.536096572875977, "global_step": 640081, "epoch": 7711} {"train_loss": -28.284589767456055, "global_step": 640082, "epoch": 7711} {"train_loss": -28.166595458984375, "global_step": 640083, "epoch": 7711} {"train_loss": -28.252805709838867, "global_step": 640084, "epoch": 7711} {"train_loss": -28.505512237548828, "global_step": 640085, "epoch": 7711} {"train_loss": -28.239776611328125, "global_step": 640086, "epoch": 7711} {"train_loss": -28.35367774963379, "global_step": 640087, "epoch": 7711} {"train_loss": -28.569421768188477, "global_step": 640088, "epoch": 7711} {"train_loss": -28.499738693237305, "global_step": 640089, "epoch": 7711} {"train_loss": -28.233062744140625, "global_step": 640090, "epoch": 7711} {"train_loss": -28.4410400390625, "global_step": 640091, "epoch": 7711} {"train_loss": -28.192041397094727, "global_step": 640092, "epoch": 7711} {"train_loss": -28.24637222290039, "global_step": 640093, "epoch": 7711} {"train_loss": -28.50593376159668, "global_step": 640094, "epoch": 7711} {"train_loss": -28.149218662675604, "global_step": 640095, "epoch": 7711, "val_loss": 6785098.0} {"train_loss": -28.03785514831543, "global_step": 640096, "epoch": 7712} {"train_loss": -28.058942794799805, "global_step": 640097, "epoch": 7712} {"train_loss": -27.73382568359375, "global_step": 640098, "epoch": 7712} {"train_loss": -28.115087509155273, "global_step": 640099, "epoch": 7712} {"train_loss": -27.88907241821289, "global_step": 640100, "epoch": 7712} {"train_loss": -27.91776466369629, "global_step": 640101, "epoch": 7712} {"train_loss": -27.46964454650879, "global_step": 640102, "epoch": 7712} {"train_loss": -27.94638442993164, "global_step": 640103, "epoch": 7712} {"train_loss": -28.040058135986328, "global_step": 640104, "epoch": 7712} {"train_loss": -28.282272338867188, "global_step": 640105, "epoch": 7712} {"train_loss": -27.473163604736328, "global_step": 640106, "epoch": 7712} {"train_loss": -27.431180953979492, "global_step": 640107, "epoch": 7712} {"train_loss": -27.66056251525879, "global_step": 640108, "epoch": 7712} {"train_loss": -28.117786407470703, "global_step": 640109, "epoch": 7712} {"train_loss": -28.061660766601562, "global_step": 640110, "epoch": 7712} {"train_loss": -27.650653839111328, "global_step": 640111, "epoch": 7712} {"train_loss": -28.26680564880371, "global_step": 640112, "epoch": 7712} {"train_loss": -28.168014526367188, "global_step": 640113, "epoch": 7712} {"train_loss": -28.456384658813477, "global_step": 640114, "epoch": 7712} {"train_loss": -27.7999267578125, "global_step": 640115, "epoch": 7712} {"train_loss": -27.63336753845215, "global_step": 640116, "epoch": 7712} {"train_loss": -28.467193603515625, "global_step": 640117, "epoch": 7712} {"train_loss": -27.8675537109375, "global_step": 640118, "epoch": 7712} {"train_loss": -28.15264892578125, "global_step": 640119, "epoch": 7712} {"train_loss": -28.375446319580078, "global_step": 640120, "epoch": 7712} {"train_loss": -27.918811798095703, "global_step": 640121, "epoch": 7712} {"train_loss": -27.853498458862305, "global_step": 640122, "epoch": 7712} {"train_loss": -28.3056583404541, "global_step": 640123, "epoch": 7712} {"train_loss": -28.448698043823242, "global_step": 640124, "epoch": 7712} {"train_loss": -28.499425888061523, "global_step": 640125, "epoch": 7712} {"train_loss": -28.25624656677246, "global_step": 640126, "epoch": 7712} {"train_loss": -28.492238998413086, "global_step": 640127, "epoch": 7712} {"train_loss": -28.345556259155273, "global_step": 640128, "epoch": 7712} {"train_loss": -28.201200485229492, "global_step": 640129, "epoch": 7712} {"train_loss": -28.27439308166504, "global_step": 640130, "epoch": 7712} {"train_loss": -28.188720703125, "global_step": 640131, "epoch": 7712} {"train_loss": -28.339282989501953, "global_step": 640132, "epoch": 7712} {"train_loss": -28.41370964050293, "global_step": 640133, "epoch": 7712} {"train_loss": -28.66025161743164, "global_step": 640134, "epoch": 7712} {"train_loss": -28.32269859313965, "global_step": 640135, "epoch": 7712} {"train_loss": -28.449054718017578, "global_step": 640136, "epoch": 7712} {"train_loss": -28.394641876220703, "global_step": 640137, "epoch": 7712} {"train_loss": -28.160511016845703, "global_step": 640138, "epoch": 7712} {"train_loss": -28.107025146484375, "global_step": 640139, "epoch": 7712} {"train_loss": -28.447988510131836, "global_step": 640140, "epoch": 7712} {"train_loss": -28.34746742248535, "global_step": 640141, "epoch": 7712} {"train_loss": -28.342527389526367, "global_step": 640142, "epoch": 7712} {"train_loss": -27.9749698638916, "global_step": 640143, "epoch": 7712} {"train_loss": -28.43341064453125, "global_step": 640144, "epoch": 7712} {"train_loss": -28.31436538696289, "global_step": 640145, "epoch": 7712} {"train_loss": -28.420358657836914, "global_step": 640146, "epoch": 7712} {"train_loss": -28.251256942749023, "global_step": 640147, "epoch": 7712} {"train_loss": -28.133264541625977, "global_step": 640148, "epoch": 7712} {"train_loss": -28.073057174682617, "global_step": 640149, "epoch": 7712} {"train_loss": -27.94988441467285, "global_step": 640150, "epoch": 7712} {"train_loss": -28.144681930541992, "global_step": 640151, "epoch": 7712} {"train_loss": -28.188364028930664, "global_step": 640152, "epoch": 7712} {"train_loss": -28.625518798828125, "global_step": 640153, "epoch": 7712} {"train_loss": -28.518850326538086, "global_step": 640154, "epoch": 7712} {"train_loss": -28.060535430908203, "global_step": 640155, "epoch": 7712} {"train_loss": -28.179468154907227, "global_step": 640156, "epoch": 7712} {"train_loss": -28.165990829467773, "global_step": 640157, "epoch": 7712} {"train_loss": -28.063146591186523, "global_step": 640158, "epoch": 7712} {"train_loss": -27.73966407775879, "global_step": 640159, "epoch": 7712} {"train_loss": -28.311359405517578, "global_step": 640160, "epoch": 7712} {"train_loss": -28.301746368408203, "global_step": 640161, "epoch": 7712} {"train_loss": -28.2598934173584, "global_step": 640162, "epoch": 7712} {"train_loss": -28.108539581298828, "global_step": 640163, "epoch": 7712} {"train_loss": -28.445539474487305, "global_step": 640164, "epoch": 7712} {"train_loss": -28.12884521484375, "global_step": 640165, "epoch": 7712} {"train_loss": -28.045246124267578, "global_step": 640166, "epoch": 7712} {"train_loss": -27.77186393737793, "global_step": 640167, "epoch": 7712} {"train_loss": -28.3844051361084, "global_step": 640168, "epoch": 7712} {"train_loss": -28.39051628112793, "global_step": 640169, "epoch": 7712} {"train_loss": -28.29680824279785, "global_step": 640170, "epoch": 7712} {"train_loss": -28.69520378112793, "global_step": 640171, "epoch": 7712} {"train_loss": -28.6281681060791, "global_step": 640172, "epoch": 7712} {"train_loss": -28.32659339904785, "global_step": 640173, "epoch": 7712} {"train_loss": -28.770898818969727, "global_step": 640174, "epoch": 7712} {"train_loss": -28.433414459228516, "global_step": 640175, "epoch": 7712} {"train_loss": -28.736221313476562, "global_step": 640176, "epoch": 7712} {"train_loss": -28.49747085571289, "global_step": 640177, "epoch": 7712} {"train_loss": -28.187384226236, "global_step": 640178, "epoch": 7712, "val_loss": 6636593.0} {"train_loss": -28.119705200195312, "global_step": 640179, "epoch": 7713} {"train_loss": -27.360965728759766, "global_step": 640180, "epoch": 7713} {"train_loss": -27.610193252563477, "global_step": 640181, "epoch": 7713} {"train_loss": -28.073333740234375, "global_step": 640182, "epoch": 7713} {"train_loss": -27.65553855895996, "global_step": 640183, "epoch": 7713} {"train_loss": -28.01655387878418, "global_step": 640184, "epoch": 7713} {"train_loss": -27.81599235534668, "global_step": 640185, "epoch": 7713} {"train_loss": -28.25949478149414, "global_step": 640186, "epoch": 7713} {"train_loss": -28.19000244140625, "global_step": 640187, "epoch": 7713} {"train_loss": -27.855573654174805, "global_step": 640188, "epoch": 7713} {"train_loss": -27.892309188842773, "global_step": 640189, "epoch": 7713} {"train_loss": -28.040685653686523, "global_step": 640190, "epoch": 7713} {"train_loss": -27.810400009155273, "global_step": 640191, "epoch": 7713} {"train_loss": -28.28782081604004, "global_step": 640192, "epoch": 7713} {"train_loss": -28.07806968688965, "global_step": 640193, "epoch": 7713} {"train_loss": -27.983163833618164, "global_step": 640194, "epoch": 7713} {"train_loss": -28.325559616088867, "global_step": 640195, "epoch": 7713} {"train_loss": -28.455427169799805, "global_step": 640196, "epoch": 7713} {"train_loss": -28.12034034729004, "global_step": 640197, "epoch": 7713} {"train_loss": -28.20985984802246, "global_step": 640198, "epoch": 7713} {"train_loss": -28.062225341796875, "global_step": 640199, "epoch": 7713} {"train_loss": -28.036828994750977, "global_step": 640200, "epoch": 7713} {"train_loss": -28.262283325195312, "global_step": 640201, "epoch": 7713} {"train_loss": -27.975452423095703, "global_step": 640202, "epoch": 7713} {"train_loss": -28.116474151611328, "global_step": 640203, "epoch": 7713} {"train_loss": -27.91204261779785, "global_step": 640204, "epoch": 7713} {"train_loss": -28.586877822875977, "global_step": 640205, "epoch": 7713} {"train_loss": -28.218244552612305, "global_step": 640206, "epoch": 7713} {"train_loss": -28.35796546936035, "global_step": 640207, "epoch": 7713} {"train_loss": -28.413259506225586, "global_step": 640208, "epoch": 7713} {"train_loss": -28.367233276367188, "global_step": 640209, "epoch": 7713} {"train_loss": -28.374353408813477, "global_step": 640210, "epoch": 7713} {"train_loss": -28.197967529296875, "global_step": 640211, "epoch": 7713} {"train_loss": -28.53948402404785, "global_step": 640212, "epoch": 7713} {"train_loss": -28.02027702331543, "global_step": 640213, "epoch": 7713} {"train_loss": -28.595630645751953, "global_step": 640214, "epoch": 7713} {"train_loss": -28.51852798461914, "global_step": 640215, "epoch": 7713} {"train_loss": -28.76081657409668, "global_step": 640216, "epoch": 7713} {"train_loss": -28.2064266204834, "global_step": 640217, "epoch": 7713} {"train_loss": -28.16316795349121, "global_step": 640218, "epoch": 7713} {"train_loss": -28.638916015625, "global_step": 640219, "epoch": 7713} {"train_loss": -28.020803451538086, "global_step": 640220, "epoch": 7713} {"train_loss": -28.601606369018555, "global_step": 640221, "epoch": 7713} {"train_loss": -28.188800811767578, "global_step": 640222, "epoch": 7713} {"train_loss": -28.25062370300293, "global_step": 640223, "epoch": 7713} {"train_loss": -27.756834030151367, "global_step": 640224, "epoch": 7713} {"train_loss": -27.65087890625, "global_step": 640225, "epoch": 7713} {"train_loss": -27.338674545288086, "global_step": 640226, "epoch": 7713} {"train_loss": -27.995227813720703, "global_step": 640227, "epoch": 7713} {"train_loss": -28.569303512573242, "global_step": 640228, "epoch": 7713} {"train_loss": -28.089157104492188, "global_step": 640229, "epoch": 7713} {"train_loss": -28.150278091430664, "global_step": 640230, "epoch": 7713} {"train_loss": -28.123640060424805, "global_step": 640231, "epoch": 7713} {"train_loss": -27.74176597595215, "global_step": 640232, "epoch": 7713} {"train_loss": -28.011011123657227, "global_step": 640233, "epoch": 7713} {"train_loss": -27.84662437438965, "global_step": 640234, "epoch": 7713} {"train_loss": -28.070356369018555, "global_step": 640235, "epoch": 7713} {"train_loss": -27.9969425201416, "global_step": 640236, "epoch": 7713} {"train_loss": -28.047819137573242, "global_step": 640237, "epoch": 7713} {"train_loss": -28.14397621154785, "global_step": 640238, "epoch": 7713} {"train_loss": -28.26471519470215, "global_step": 640239, "epoch": 7713} {"train_loss": -28.19607925415039, "global_step": 640240, "epoch": 7713} {"train_loss": -27.99287223815918, "global_step": 640241, "epoch": 7713} {"train_loss": -28.2334041595459, "global_step": 640242, "epoch": 7713} {"train_loss": -28.130273818969727, "global_step": 640243, "epoch": 7713} {"train_loss": -28.2677059173584, "global_step": 640244, "epoch": 7713} {"train_loss": -28.365903854370117, "global_step": 640245, "epoch": 7713} {"train_loss": -28.60504722595215, "global_step": 640246, "epoch": 7713} {"train_loss": -28.096893310546875, "global_step": 640247, "epoch": 7713} {"train_loss": -28.607192993164062, "global_step": 640248, "epoch": 7713} {"train_loss": -27.77980613708496, "global_step": 640249, "epoch": 7713} {"train_loss": -27.906925201416016, "global_step": 640250, "epoch": 7713} {"train_loss": -27.77292251586914, "global_step": 640251, "epoch": 7713} {"train_loss": -28.17042350769043, "global_step": 640252, "epoch": 7713} {"train_loss": -28.74275016784668, "global_step": 640253, "epoch": 7713} {"train_loss": -28.349088668823242, "global_step": 640254, "epoch": 7713} {"train_loss": -27.9589786529541, "global_step": 640255, "epoch": 7713} {"train_loss": -27.709781646728516, "global_step": 640256, "epoch": 7713} {"train_loss": -27.33860206604004, "global_step": 640257, "epoch": 7713} {"train_loss": -27.635656356811523, "global_step": 640258, "epoch": 7713} {"train_loss": -27.820770263671875, "global_step": 640259, "epoch": 7713} {"train_loss": -27.979766845703125, "global_step": 640260, "epoch": 7713} {"train_loss": -28.12631565691477, "global_step": 640261, "epoch": 7713, "val_loss": 6784721.0} {"train_loss": -26.923843383789062, "global_step": 640262, "epoch": 7714} {"train_loss": -27.068756103515625, "global_step": 640263, "epoch": 7714} {"train_loss": -28.291889190673828, "global_step": 640264, "epoch": 7714} {"train_loss": -27.680883407592773, "global_step": 640265, "epoch": 7714} {"train_loss": -28.092679977416992, "global_step": 640266, "epoch": 7714} {"train_loss": -27.755966186523438, "global_step": 640267, "epoch": 7714} {"train_loss": -28.07063102722168, "global_step": 640268, "epoch": 7714} {"train_loss": -28.04790687561035, "global_step": 640269, "epoch": 7714} {"train_loss": -27.5306396484375, "global_step": 640270, "epoch": 7714} {"train_loss": -28.409208297729492, "global_step": 640271, "epoch": 7714} {"train_loss": -27.85101890563965, "global_step": 640272, "epoch": 7714} {"train_loss": -28.15192222595215, "global_step": 640273, "epoch": 7714} {"train_loss": -28.03285789489746, "global_step": 640274, "epoch": 7714} {"train_loss": -28.041675567626953, "global_step": 640275, "epoch": 7714} {"train_loss": -27.875598907470703, "global_step": 640276, "epoch": 7714} {"train_loss": -28.115163803100586, "global_step": 640277, "epoch": 7714} {"train_loss": -28.005146026611328, "global_step": 640278, "epoch": 7714} {"train_loss": -28.11432456970215, "global_step": 640279, "epoch": 7714} {"train_loss": -28.191699981689453, "global_step": 640280, "epoch": 7714} {"train_loss": -28.086511611938477, "global_step": 640281, "epoch": 7714} {"train_loss": -27.918569564819336, "global_step": 640282, "epoch": 7714} {"train_loss": -28.256933212280273, "global_step": 640283, "epoch": 7714} {"train_loss": -27.963781356811523, "global_step": 640284, "epoch": 7714} {"train_loss": -27.83143424987793, "global_step": 640285, "epoch": 7714} {"train_loss": -28.1458683013916, "global_step": 640286, "epoch": 7714} {"train_loss": -27.897687911987305, "global_step": 640287, "epoch": 7714} {"train_loss": -28.184829711914062, "global_step": 640288, "epoch": 7714} {"train_loss": -28.014245986938477, "global_step": 640289, "epoch": 7714} {"train_loss": -28.3247127532959, "global_step": 640290, "epoch": 7714} {"train_loss": -28.084619522094727, "global_step": 640291, "epoch": 7714} {"train_loss": -27.986597061157227, "global_step": 640292, "epoch": 7714} {"train_loss": -28.726789474487305, "global_step": 640293, "epoch": 7714} {"train_loss": -28.056278228759766, "global_step": 640294, "epoch": 7714} {"train_loss": -28.487293243408203, "global_step": 640295, "epoch": 7714} {"train_loss": -28.290958404541016, "global_step": 640296, "epoch": 7714} {"train_loss": -28.496723175048828, "global_step": 640297, "epoch": 7714} {"train_loss": -28.085264205932617, "global_step": 640298, "epoch": 7714} {"train_loss": -28.53360366821289, "global_step": 640299, "epoch": 7714} {"train_loss": -28.147262573242188, "global_step": 640300, "epoch": 7714} {"train_loss": -28.41973304748535, "global_step": 640301, "epoch": 7714} {"train_loss": -28.405120849609375, "global_step": 640302, "epoch": 7714} {"train_loss": -28.229101181030273, "global_step": 640303, "epoch": 7714} {"train_loss": -28.464147567749023, "global_step": 640304, "epoch": 7714} {"train_loss": -28.337066650390625, "global_step": 640305, "epoch": 7714} {"train_loss": -28.020238876342773, "global_step": 640306, "epoch": 7714} {"train_loss": -28.46929359436035, "global_step": 640307, "epoch": 7714} {"train_loss": -28.3309326171875, "global_step": 640308, "epoch": 7714} {"train_loss": -28.035810470581055, "global_step": 640309, "epoch": 7714} {"train_loss": -27.88492774963379, "global_step": 640310, "epoch": 7714} {"train_loss": -28.0798282623291, "global_step": 640311, "epoch": 7714} {"train_loss": -28.228824615478516, "global_step": 640312, "epoch": 7714} {"train_loss": -28.014820098876953, "global_step": 640313, "epoch": 7714} {"train_loss": -27.9654598236084, "global_step": 640314, "epoch": 7714} {"train_loss": -28.151630401611328, "global_step": 640315, "epoch": 7714} {"train_loss": -27.750873565673828, "global_step": 640316, "epoch": 7714} {"train_loss": -28.07801628112793, "global_step": 640317, "epoch": 7714} {"train_loss": -28.15107536315918, "global_step": 640318, "epoch": 7714} {"train_loss": -27.764392852783203, "global_step": 640319, "epoch": 7714} {"train_loss": -28.265241622924805, "global_step": 640320, "epoch": 7714} {"train_loss": -28.37445068359375, "global_step": 640321, "epoch": 7714} {"train_loss": -27.880090713500977, "global_step": 640322, "epoch": 7714} {"train_loss": -28.334396362304688, "global_step": 640323, "epoch": 7714} {"train_loss": -28.01825523376465, "global_step": 640324, "epoch": 7714} {"train_loss": -28.01242446899414, "global_step": 640325, "epoch": 7714} {"train_loss": -28.112903594970703, "global_step": 640326, "epoch": 7714} {"train_loss": -28.404565811157227, "global_step": 640327, "epoch": 7714} {"train_loss": -28.182321548461914, "global_step": 640328, "epoch": 7714} {"train_loss": -28.260700225830078, "global_step": 640329, "epoch": 7714} {"train_loss": -28.638952255249023, "global_step": 640330, "epoch": 7714} {"train_loss": -27.97452163696289, "global_step": 640331, "epoch": 7714} {"train_loss": -28.089279174804688, "global_step": 640332, "epoch": 7714} {"train_loss": -28.56610107421875, "global_step": 640333, "epoch": 7714} {"train_loss": -28.31317138671875, "global_step": 640334, "epoch": 7714} {"train_loss": -28.489521026611328, "global_step": 640335, "epoch": 7714} {"train_loss": -28.912494659423828, "global_step": 640336, "epoch": 7714} {"train_loss": -28.459836959838867, "global_step": 640337, "epoch": 7714} {"train_loss": -28.16961097717285, "global_step": 640338, "epoch": 7714} {"train_loss": -28.5362606048584, "global_step": 640339, "epoch": 7714} {"train_loss": -27.9267520904541, "global_step": 640340, "epoch": 7714} {"train_loss": -28.644697189331055, "global_step": 640341, "epoch": 7714} {"train_loss": -28.527151107788086, "global_step": 640342, "epoch": 7714} {"train_loss": -28.457273483276367, "global_step": 640343, "epoch": 7714} {"train_loss": -28.14426447397255, "global_step": 640344, "epoch": 7714, "val_loss": 6818202.5} {"train_loss": -27.98005485534668, "global_step": 640345, "epoch": 7715} {"train_loss": -28.120559692382812, "global_step": 640346, "epoch": 7715} {"train_loss": -28.1513614654541, "global_step": 640347, "epoch": 7715} {"train_loss": -28.23236083984375, "global_step": 640348, "epoch": 7715} {"train_loss": -28.15618324279785, "global_step": 640349, "epoch": 7715} {"train_loss": -28.255701065063477, "global_step": 640350, "epoch": 7715} {"train_loss": -28.228622436523438, "global_step": 640351, "epoch": 7715} {"train_loss": -27.957990646362305, "global_step": 640352, "epoch": 7715} {"train_loss": -28.3109188079834, "global_step": 640353, "epoch": 7715} {"train_loss": -27.946027755737305, "global_step": 640354, "epoch": 7715} {"train_loss": -28.395736694335938, "global_step": 640355, "epoch": 7715} {"train_loss": -28.5049991607666, "global_step": 640356, "epoch": 7715} {"train_loss": -28.523984909057617, "global_step": 640357, "epoch": 7715} {"train_loss": -28.177839279174805, "global_step": 640358, "epoch": 7715} {"train_loss": -28.629663467407227, "global_step": 640359, "epoch": 7715} {"train_loss": -28.24285888671875, "global_step": 640360, "epoch": 7715} {"train_loss": -28.300596237182617, "global_step": 640361, "epoch": 7715} {"train_loss": -28.206867218017578, "global_step": 640362, "epoch": 7715} {"train_loss": -28.044937133789062, "global_step": 640363, "epoch": 7715} {"train_loss": -28.08052635192871, "global_step": 640364, "epoch": 7715} {"train_loss": -28.451887130737305, "global_step": 640365, "epoch": 7715} {"train_loss": -28.41582679748535, "global_step": 640366, "epoch": 7715} {"train_loss": -27.962453842163086, "global_step": 640367, "epoch": 7715} {"train_loss": -27.574726104736328, "global_step": 640368, "epoch": 7715} {"train_loss": -28.093902587890625, "global_step": 640369, "epoch": 7715} {"train_loss": -28.517847061157227, "global_step": 640370, "epoch": 7715} {"train_loss": -27.836017608642578, "global_step": 640371, "epoch": 7715} {"train_loss": -28.041112899780273, "global_step": 640372, "epoch": 7715} {"train_loss": -28.273168563842773, "global_step": 640373, "epoch": 7715} {"train_loss": -27.983600616455078, "global_step": 640374, "epoch": 7715} {"train_loss": -28.154468536376953, "global_step": 640375, "epoch": 7715} {"train_loss": -28.499601364135742, "global_step": 640376, "epoch": 7715} {"train_loss": -28.3924560546875, "global_step": 640377, "epoch": 7715} {"train_loss": -28.257980346679688, "global_step": 640378, "epoch": 7715} {"train_loss": -28.244958877563477, "global_step": 640379, "epoch": 7715} {"train_loss": -28.13111686706543, "global_step": 640380, "epoch": 7715} {"train_loss": -27.97115135192871, "global_step": 640381, "epoch": 7715} {"train_loss": -28.203039169311523, "global_step": 640382, "epoch": 7715} {"train_loss": -28.17034339904785, "global_step": 640383, "epoch": 7715} {"train_loss": -28.598724365234375, "global_step": 640384, "epoch": 7715} {"train_loss": -28.19574546813965, "global_step": 640385, "epoch": 7715} {"train_loss": -28.139917373657227, "global_step": 640386, "epoch": 7715} {"train_loss": -28.460834503173828, "global_step": 640387, "epoch": 7715} {"train_loss": -28.3869571685791, "global_step": 640388, "epoch": 7715} {"train_loss": -28.316476821899414, "global_step": 640389, "epoch": 7715} {"train_loss": -28.15410804748535, "global_step": 640390, "epoch": 7715} {"train_loss": -28.09022331237793, "global_step": 640391, "epoch": 7715} {"train_loss": -28.101348876953125, "global_step": 640392, "epoch": 7715} {"train_loss": -28.437543869018555, "global_step": 640393, "epoch": 7715} {"train_loss": -28.34797477722168, "global_step": 640394, "epoch": 7715} {"train_loss": -28.125431060791016, "global_step": 640395, "epoch": 7715} {"train_loss": -28.503122329711914, "global_step": 640396, "epoch": 7715} {"train_loss": -28.227136611938477, "global_step": 640397, "epoch": 7715} {"train_loss": -27.961111068725586, "global_step": 640398, "epoch": 7715} {"train_loss": -28.424137115478516, "global_step": 640399, "epoch": 7715} {"train_loss": -28.03461265563965, "global_step": 640400, "epoch": 7715} {"train_loss": -28.432355880737305, "global_step": 640401, "epoch": 7715} {"train_loss": -28.351099014282227, "global_step": 640402, "epoch": 7715} {"train_loss": -28.1385555267334, "global_step": 640403, "epoch": 7715} {"train_loss": -28.381820678710938, "global_step": 640404, "epoch": 7715} {"train_loss": -27.97296142578125, "global_step": 640405, "epoch": 7715} {"train_loss": -28.07596206665039, "global_step": 640406, "epoch": 7715} {"train_loss": -28.257568359375, "global_step": 640407, "epoch": 7715} {"train_loss": -28.264801025390625, "global_step": 640408, "epoch": 7715} {"train_loss": -28.165252685546875, "global_step": 640409, "epoch": 7715} {"train_loss": -28.288909912109375, "global_step": 640410, "epoch": 7715} {"train_loss": -28.385366439819336, "global_step": 640411, "epoch": 7715} {"train_loss": -28.466840744018555, "global_step": 640412, "epoch": 7715} {"train_loss": -28.551359176635742, "global_step": 640413, "epoch": 7715} {"train_loss": -28.59910011291504, "global_step": 640414, "epoch": 7715} {"train_loss": -28.595529556274414, "global_step": 640415, "epoch": 7715} {"train_loss": -28.413135528564453, "global_step": 640416, "epoch": 7715} {"train_loss": -28.620325088500977, "global_step": 640417, "epoch": 7715} {"train_loss": -28.445560455322266, "global_step": 640418, "epoch": 7715} {"train_loss": -28.15089225769043, "global_step": 640419, "epoch": 7715} {"train_loss": -28.674238204956055, "global_step": 640420, "epoch": 7715} {"train_loss": -28.90703773498535, "global_step": 640421, "epoch": 7715} {"train_loss": -28.5250186920166, "global_step": 640422, "epoch": 7715} {"train_loss": -28.771137237548828, "global_step": 640423, "epoch": 7715} {"train_loss": -28.429662704467773, "global_step": 640424, "epoch": 7715} {"train_loss": -28.35059928894043, "global_step": 640425, "epoch": 7715} {"train_loss": -28.49433708190918, "global_step": 640426, "epoch": 7715} {"train_loss": -28.272728816572442, "global_step": 640427, "epoch": 7715, "val_loss": 6759763.5} {"train_loss": -27.923120498657227, "global_step": 640428, "epoch": 7716} {"train_loss": -27.889434814453125, "global_step": 640429, "epoch": 7716} {"train_loss": -28.226165771484375, "global_step": 640430, "epoch": 7716} {"train_loss": -27.838134765625, "global_step": 640431, "epoch": 7716} {"train_loss": -28.3542537689209, "global_step": 640432, "epoch": 7716} {"train_loss": -27.5335636138916, "global_step": 640433, "epoch": 7716} {"train_loss": -28.004684448242188, "global_step": 640434, "epoch": 7716} {"train_loss": -27.995330810546875, "global_step": 640435, "epoch": 7716} {"train_loss": -28.06232261657715, "global_step": 640436, "epoch": 7716} {"train_loss": -28.37025260925293, "global_step": 640437, "epoch": 7716} {"train_loss": -27.962757110595703, "global_step": 640438, "epoch": 7716} {"train_loss": -27.704547882080078, "global_step": 640439, "epoch": 7716} {"train_loss": -28.35150718688965, "global_step": 640440, "epoch": 7716} {"train_loss": -28.388967514038086, "global_step": 640441, "epoch": 7716} {"train_loss": -28.278234481811523, "global_step": 640442, "epoch": 7716} {"train_loss": -28.309223175048828, "global_step": 640443, "epoch": 7716} {"train_loss": -28.009916305541992, "global_step": 640444, "epoch": 7716} {"train_loss": -28.11969566345215, "global_step": 640445, "epoch": 7716} {"train_loss": -28.311126708984375, "global_step": 640446, "epoch": 7716} {"train_loss": -28.590124130249023, "global_step": 640447, "epoch": 7716} {"train_loss": -27.930866241455078, "global_step": 640448, "epoch": 7716} {"train_loss": -28.33489418029785, "global_step": 640449, "epoch": 7716} {"train_loss": -28.045246124267578, "global_step": 640450, "epoch": 7716} {"train_loss": -28.284046173095703, "global_step": 640451, "epoch": 7716} {"train_loss": -28.321908950805664, "global_step": 640452, "epoch": 7716} {"train_loss": -27.98773193359375, "global_step": 640453, "epoch": 7716} {"train_loss": -28.084680557250977, "global_step": 640454, "epoch": 7716} {"train_loss": -27.849090576171875, "global_step": 640455, "epoch": 7716} {"train_loss": -28.267423629760742, "global_step": 640456, "epoch": 7716} {"train_loss": -27.990156173706055, "global_step": 640457, "epoch": 7716} {"train_loss": -28.13966178894043, "global_step": 640458, "epoch": 7716} {"train_loss": -28.27419090270996, "global_step": 640459, "epoch": 7716} {"train_loss": -28.309118270874023, "global_step": 640460, "epoch": 7716} {"train_loss": -28.34723472595215, "global_step": 640461, "epoch": 7716} {"train_loss": -28.042743682861328, "global_step": 640462, "epoch": 7716} {"train_loss": -28.230304718017578, "global_step": 640463, "epoch": 7716} {"train_loss": -28.549535751342773, "global_step": 640464, "epoch": 7716} {"train_loss": -28.3509521484375, "global_step": 640465, "epoch": 7716} {"train_loss": -28.24921989440918, "global_step": 640466, "epoch": 7716} {"train_loss": -28.272626876831055, "global_step": 640467, "epoch": 7716} {"train_loss": -28.268848419189453, "global_step": 640468, "epoch": 7716} {"train_loss": -28.62454605102539, "global_step": 640469, "epoch": 7716} {"train_loss": -28.5434627532959, "global_step": 640470, "epoch": 7716} {"train_loss": -28.160995483398438, "global_step": 640471, "epoch": 7716} {"train_loss": -28.814666748046875, "global_step": 640472, "epoch": 7716} {"train_loss": -28.40152931213379, "global_step": 640473, "epoch": 7716} {"train_loss": -28.602964401245117, "global_step": 640474, "epoch": 7716} {"train_loss": -28.761310577392578, "global_step": 640475, "epoch": 7716} {"train_loss": -28.30440330505371, "global_step": 640476, "epoch": 7716} {"train_loss": -28.253076553344727, "global_step": 640477, "epoch": 7716} {"train_loss": -28.238147735595703, "global_step": 640478, "epoch": 7716} {"train_loss": -28.445053100585938, "global_step": 640479, "epoch": 7716} {"train_loss": -28.268972396850586, "global_step": 640480, "epoch": 7716} {"train_loss": -28.289905548095703, "global_step": 640481, "epoch": 7716} {"train_loss": -28.43519401550293, "global_step": 640482, "epoch": 7716} {"train_loss": -28.54424476623535, "global_step": 640483, "epoch": 7716} {"train_loss": -28.432226181030273, "global_step": 640484, "epoch": 7716} {"train_loss": -28.506916046142578, "global_step": 640485, "epoch": 7716} {"train_loss": -28.199813842773438, "global_step": 640486, "epoch": 7716} {"train_loss": -28.66828727722168, "global_step": 640487, "epoch": 7716} {"train_loss": -28.564666748046875, "global_step": 640488, "epoch": 7716} {"train_loss": -28.825698852539062, "global_step": 640489, "epoch": 7716} {"train_loss": -28.236291885375977, "global_step": 640490, "epoch": 7716} {"train_loss": -28.255863189697266, "global_step": 640491, "epoch": 7716} {"train_loss": -28.448867797851562, "global_step": 640492, "epoch": 7716} {"train_loss": -28.3066349029541, "global_step": 640493, "epoch": 7716} {"train_loss": -28.342283248901367, "global_step": 640494, "epoch": 7716} {"train_loss": -28.265674591064453, "global_step": 640495, "epoch": 7716} {"train_loss": -28.46685218811035, "global_step": 640496, "epoch": 7716} {"train_loss": -27.745954513549805, "global_step": 640497, "epoch": 7716} {"train_loss": -28.131216049194336, "global_step": 640498, "epoch": 7716} {"train_loss": -28.335535049438477, "global_step": 640499, "epoch": 7716} {"train_loss": -28.258853912353516, "global_step": 640500, "epoch": 7716} {"train_loss": -28.163923263549805, "global_step": 640501, "epoch": 7716} {"train_loss": -27.842370986938477, "global_step": 640502, "epoch": 7716} {"train_loss": -27.96380615234375, "global_step": 640503, "epoch": 7716} {"train_loss": -27.552587509155273, "global_step": 640504, "epoch": 7716} {"train_loss": -26.76604652404785, "global_step": 640505, "epoch": 7716} {"train_loss": -26.614654541015625, "global_step": 640506, "epoch": 7716} {"train_loss": -27.588708877563477, "global_step": 640507, "epoch": 7716} {"train_loss": -28.075483322143555, "global_step": 640508, "epoch": 7716} {"train_loss": -27.1229248046875, "global_step": 640509, "epoch": 7716} {"train_loss": -28.171374240553522, "global_step": 640510, "epoch": 7716, "val_loss": 6628498.0} {"train_loss": -19.969541549682617, "global_step": 640511, "epoch": 7717} {"train_loss": -21.655471801757812, "global_step": 640512, "epoch": 7717} {"train_loss": -21.442838668823242, "global_step": 640513, "epoch": 7717} {"train_loss": -22.892637252807617, "global_step": 640514, "epoch": 7717} {"train_loss": -23.435117721557617, "global_step": 640515, "epoch": 7717} {"train_loss": -23.098873138427734, "global_step": 640516, "epoch": 7717} {"train_loss": -23.91444969177246, "global_step": 640517, "epoch": 7717} {"train_loss": -24.555561065673828, "global_step": 640518, "epoch": 7717} {"train_loss": -24.0152587890625, "global_step": 640519, "epoch": 7717} {"train_loss": -23.70168685913086, "global_step": 640520, "epoch": 7717} {"train_loss": -23.41265869140625, "global_step": 640521, "epoch": 7717} {"train_loss": -24.722265243530273, "global_step": 640522, "epoch": 7717} {"train_loss": -24.56085777282715, "global_step": 640523, "epoch": 7717} {"train_loss": -25.273324966430664, "global_step": 640524, "epoch": 7717} {"train_loss": -24.743694305419922, "global_step": 640525, "epoch": 7717} {"train_loss": -24.972871780395508, "global_step": 640526, "epoch": 7717} {"train_loss": -24.76731300354004, "global_step": 640527, "epoch": 7717} {"train_loss": -24.681737899780273, "global_step": 640528, "epoch": 7717} {"train_loss": -25.44077491760254, "global_step": 640529, "epoch": 7717} {"train_loss": -25.52503776550293, "global_step": 640530, "epoch": 7717} {"train_loss": -25.386228561401367, "global_step": 640531, "epoch": 7717} {"train_loss": -25.02210807800293, "global_step": 640532, "epoch": 7717} {"train_loss": -25.040681838989258, "global_step": 640533, "epoch": 7717} {"train_loss": -25.729938507080078, "global_step": 640534, "epoch": 7717} {"train_loss": -25.931732177734375, "global_step": 640535, "epoch": 7717} {"train_loss": -25.678747177124023, "global_step": 640536, "epoch": 7717} {"train_loss": -25.45797348022461, "global_step": 640537, "epoch": 7717} {"train_loss": -25.844696044921875, "global_step": 640538, "epoch": 7717} {"train_loss": -25.756383895874023, "global_step": 640539, "epoch": 7717} {"train_loss": -25.7349796295166, "global_step": 640540, "epoch": 7717} {"train_loss": -25.7742977142334, "global_step": 640541, "epoch": 7717} {"train_loss": -26.0848388671875, "global_step": 640542, "epoch": 7717} {"train_loss": -25.93485450744629, "global_step": 640543, "epoch": 7717} {"train_loss": -25.80694007873535, "global_step": 640544, "epoch": 7717} {"train_loss": -26.04950523376465, "global_step": 640545, "epoch": 7717} {"train_loss": -26.2583065032959, "global_step": 640546, "epoch": 7717} {"train_loss": -26.304950714111328, "global_step": 640547, "epoch": 7717} {"train_loss": -26.6387939453125, "global_step": 640548, "epoch": 7717} {"train_loss": -26.118946075439453, "global_step": 640549, "epoch": 7717} {"train_loss": -26.091690063476562, "global_step": 640550, "epoch": 7717} {"train_loss": -26.373859405517578, "global_step": 640551, "epoch": 7717} {"train_loss": -26.693857192993164, "global_step": 640552, "epoch": 7717} {"train_loss": -26.37774658203125, "global_step": 640553, "epoch": 7717} {"train_loss": -26.215118408203125, "global_step": 640554, "epoch": 7717} {"train_loss": -26.35990333557129, "global_step": 640555, "epoch": 7717} {"train_loss": -26.473493576049805, "global_step": 640556, "epoch": 7717} {"train_loss": -26.882556915283203, "global_step": 640557, "epoch": 7717} {"train_loss": -26.512800216674805, "global_step": 640558, "epoch": 7717} {"train_loss": -26.563617706298828, "global_step": 640559, "epoch": 7717} {"train_loss": -27.05632972717285, "global_step": 640560, "epoch": 7717} {"train_loss": -26.852802276611328, "global_step": 640561, "epoch": 7717} {"train_loss": -27.055145263671875, "global_step": 640562, "epoch": 7717} {"train_loss": -26.364301681518555, "global_step": 640563, "epoch": 7717} {"train_loss": -26.27715492248535, "global_step": 640564, "epoch": 7717} {"train_loss": -27.040760040283203, "global_step": 640565, "epoch": 7717} {"train_loss": -26.86884117126465, "global_step": 640566, "epoch": 7717} {"train_loss": -26.621183395385742, "global_step": 640567, "epoch": 7717} {"train_loss": -26.437299728393555, "global_step": 640568, "epoch": 7717} {"train_loss": -26.77210807800293, "global_step": 640569, "epoch": 7717} {"train_loss": -26.526397705078125, "global_step": 640570, "epoch": 7717} {"train_loss": -27.281625747680664, "global_step": 640571, "epoch": 7717} {"train_loss": -26.98122215270996, "global_step": 640572, "epoch": 7717} {"train_loss": -26.9305419921875, "global_step": 640573, "epoch": 7717} {"train_loss": -26.93426513671875, "global_step": 640574, "epoch": 7717} {"train_loss": -26.886337280273438, "global_step": 640575, "epoch": 7717} {"train_loss": -26.570219039916992, "global_step": 640576, "epoch": 7717} {"train_loss": -27.20068359375, "global_step": 640577, "epoch": 7717} {"train_loss": -27.065765380859375, "global_step": 640578, "epoch": 7717} {"train_loss": -26.77615737915039, "global_step": 640579, "epoch": 7717} {"train_loss": -26.5908260345459, "global_step": 640580, "epoch": 7717} {"train_loss": -27.003498077392578, "global_step": 640581, "epoch": 7717} {"train_loss": -27.153884887695312, "global_step": 640582, "epoch": 7717} {"train_loss": -27.057220458984375, "global_step": 640583, "epoch": 7717} {"train_loss": -27.338104248046875, "global_step": 640584, "epoch": 7717} {"train_loss": -26.700925827026367, "global_step": 640585, "epoch": 7717} {"train_loss": -27.277414321899414, "global_step": 640586, "epoch": 7717} {"train_loss": -26.69993019104004, "global_step": 640587, "epoch": 7717} {"train_loss": -26.70511817932129, "global_step": 640588, "epoch": 7717} {"train_loss": -27.133392333984375, "global_step": 640589, "epoch": 7717} {"train_loss": -27.48261833190918, "global_step": 640590, "epoch": 7717} {"train_loss": -26.605798721313477, "global_step": 640591, "epoch": 7717} {"train_loss": -26.940465927124023, "global_step": 640592, "epoch": 7717} {"train_loss": -25.833452362612068, "global_step": 640593, "epoch": 7717, "val_loss": 6648293.0} {"train_loss": -26.831274032592773, "global_step": 640594, "epoch": 7718} {"train_loss": -26.270681381225586, "global_step": 640595, "epoch": 7718} {"train_loss": -26.055814743041992, "global_step": 640596, "epoch": 7718} {"train_loss": -26.725574493408203, "global_step": 640597, "epoch": 7718} {"train_loss": -27.498144149780273, "global_step": 640598, "epoch": 7718} {"train_loss": -26.850543975830078, "global_step": 640599, "epoch": 7718} {"train_loss": -26.506113052368164, "global_step": 640600, "epoch": 7718} {"train_loss": -27.37788200378418, "global_step": 640601, "epoch": 7718} {"train_loss": -26.81422233581543, "global_step": 640602, "epoch": 7718} {"train_loss": -25.69805908203125, "global_step": 640603, "epoch": 7718} {"train_loss": -26.0026798248291, "global_step": 640604, "epoch": 7718} {"train_loss": -26.868906021118164, "global_step": 640605, "epoch": 7718} {"train_loss": -26.78664207458496, "global_step": 640606, "epoch": 7718} {"train_loss": -26.5062198638916, "global_step": 640607, "epoch": 7718} {"train_loss": -26.817535400390625, "global_step": 640608, "epoch": 7718} {"train_loss": -26.488080978393555, "global_step": 640609, "epoch": 7718} {"train_loss": -26.823286056518555, "global_step": 640610, "epoch": 7718} {"train_loss": -26.85597801208496, "global_step": 640611, "epoch": 7718} {"train_loss": -26.535547256469727, "global_step": 640612, "epoch": 7718} {"train_loss": -27.188871383666992, "global_step": 640613, "epoch": 7718} {"train_loss": -26.805097579956055, "global_step": 640614, "epoch": 7718} {"train_loss": -26.89414405822754, "global_step": 640615, "epoch": 7718} {"train_loss": -26.886571884155273, "global_step": 640616, "epoch": 7718} {"train_loss": -26.74427604675293, "global_step": 640617, "epoch": 7718} {"train_loss": -26.98014259338379, "global_step": 640618, "epoch": 7718} {"train_loss": -27.09781837463379, "global_step": 640619, "epoch": 7718} {"train_loss": -26.407901763916016, "global_step": 640620, "epoch": 7718} {"train_loss": -27.0860595703125, "global_step": 640621, "epoch": 7718} {"train_loss": -26.699811935424805, "global_step": 640622, "epoch": 7718} {"train_loss": -27.245264053344727, "global_step": 640623, "epoch": 7718} {"train_loss": -27.800098419189453, "global_step": 640624, "epoch": 7718} {"train_loss": -26.864084243774414, "global_step": 640625, "epoch": 7718} {"train_loss": -27.561567306518555, "global_step": 640626, "epoch": 7718} {"train_loss": -27.450185775756836, "global_step": 640627, "epoch": 7718} {"train_loss": -27.19403648376465, "global_step": 640628, "epoch": 7718} {"train_loss": -27.001636505126953, "global_step": 640629, "epoch": 7718} {"train_loss": -27.145248413085938, "global_step": 640630, "epoch": 7718} {"train_loss": -27.615262985229492, "global_step": 640631, "epoch": 7718} {"train_loss": -27.198699951171875, "global_step": 640632, "epoch": 7718} {"train_loss": -26.79388427734375, "global_step": 640633, "epoch": 7718} {"train_loss": -27.322525024414062, "global_step": 640634, "epoch": 7718} {"train_loss": -27.312732696533203, "global_step": 640635, "epoch": 7718} {"train_loss": -27.023611068725586, "global_step": 640636, "epoch": 7718} {"train_loss": -27.1488094329834, "global_step": 640637, "epoch": 7718} {"train_loss": -27.075300216674805, "global_step": 640638, "epoch": 7718} {"train_loss": -27.786218643188477, "global_step": 640639, "epoch": 7718} {"train_loss": -27.761533737182617, "global_step": 640640, "epoch": 7718} {"train_loss": -27.18806266784668, "global_step": 640641, "epoch": 7718} {"train_loss": -27.000696182250977, "global_step": 640642, "epoch": 7718} {"train_loss": -27.711776733398438, "global_step": 640643, "epoch": 7718} {"train_loss": -27.16473960876465, "global_step": 640644, "epoch": 7718} {"train_loss": -27.05879783630371, "global_step": 640645, "epoch": 7718} {"train_loss": -27.222553253173828, "global_step": 640646, "epoch": 7718} {"train_loss": -27.26792335510254, "global_step": 640647, "epoch": 7718} {"train_loss": -27.260425567626953, "global_step": 640648, "epoch": 7718} {"train_loss": -26.860876083374023, "global_step": 640649, "epoch": 7718} {"train_loss": -26.512908935546875, "global_step": 640650, "epoch": 7718} {"train_loss": -27.220111846923828, "global_step": 640651, "epoch": 7718} {"train_loss": -27.440937042236328, "global_step": 640652, "epoch": 7718} {"train_loss": -27.61444091796875, "global_step": 640653, "epoch": 7718} {"train_loss": -27.413373947143555, "global_step": 640654, "epoch": 7718} {"train_loss": -27.280492782592773, "global_step": 640655, "epoch": 7718} {"train_loss": -27.43338394165039, "global_step": 640656, "epoch": 7718} {"train_loss": -27.620777130126953, "global_step": 640657, "epoch": 7718} {"train_loss": -27.010202407836914, "global_step": 640658, "epoch": 7718} {"train_loss": -26.932538986206055, "global_step": 640659, "epoch": 7718} {"train_loss": -26.592233657836914, "global_step": 640660, "epoch": 7718} {"train_loss": -26.779748916625977, "global_step": 640661, "epoch": 7718} {"train_loss": -26.299497604370117, "global_step": 640662, "epoch": 7718} {"train_loss": -26.1944580078125, "global_step": 640663, "epoch": 7718} {"train_loss": -26.67848014831543, "global_step": 640664, "epoch": 7718} {"train_loss": -26.034931182861328, "global_step": 640665, "epoch": 7718} {"train_loss": -25.57792091369629, "global_step": 640666, "epoch": 7718} {"train_loss": -26.40964126586914, "global_step": 640667, "epoch": 7718} {"train_loss": -27.158308029174805, "global_step": 640668, "epoch": 7718} {"train_loss": -26.596759796142578, "global_step": 640669, "epoch": 7718} {"train_loss": -26.48908042907715, "global_step": 640670, "epoch": 7718} {"train_loss": -26.600784301757812, "global_step": 640671, "epoch": 7718} {"train_loss": -26.94818115234375, "global_step": 640672, "epoch": 7718} {"train_loss": -26.940292358398438, "global_step": 640673, "epoch": 7718} {"train_loss": -26.529407501220703, "global_step": 640674, "epoch": 7718} {"train_loss": -27.43474769592285, "global_step": 640675, "epoch": 7718} {"train_loss": -26.910368172519178, "global_step": 640676, "epoch": 7718, "val_loss": 6643050.0} {"train_loss": -26.875839233398438, "global_step": 640677, "epoch": 7719} {"train_loss": -26.15396499633789, "global_step": 640678, "epoch": 7719} {"train_loss": -26.499658584594727, "global_step": 640679, "epoch": 7719} {"train_loss": -26.09449577331543, "global_step": 640680, "epoch": 7719} {"train_loss": -26.597326278686523, "global_step": 640681, "epoch": 7719} {"train_loss": -26.694595336914062, "global_step": 640682, "epoch": 7719} {"train_loss": -26.733768463134766, "global_step": 640683, "epoch": 7719} {"train_loss": -26.851465225219727, "global_step": 640684, "epoch": 7719} {"train_loss": -26.48316764831543, "global_step": 640685, "epoch": 7719} {"train_loss": -26.89448356628418, "global_step": 640686, "epoch": 7719} {"train_loss": -26.678503036499023, "global_step": 640687, "epoch": 7719} {"train_loss": -26.319543838500977, "global_step": 640688, "epoch": 7719} {"train_loss": -26.86250877380371, "global_step": 640689, "epoch": 7719} {"train_loss": -26.714862823486328, "global_step": 640690, "epoch": 7719} {"train_loss": -26.87615966796875, "global_step": 640691, "epoch": 7719} {"train_loss": -26.587451934814453, "global_step": 640692, "epoch": 7719} {"train_loss": -26.9988956451416, "global_step": 640693, "epoch": 7719} {"train_loss": -26.25506591796875, "global_step": 640694, "epoch": 7719} {"train_loss": -27.42030143737793, "global_step": 640695, "epoch": 7719} {"train_loss": -26.7174129486084, "global_step": 640696, "epoch": 7719} {"train_loss": -26.168842315673828, "global_step": 640697, "epoch": 7719} {"train_loss": -26.728534698486328, "global_step": 640698, "epoch": 7719} {"train_loss": -27.113178253173828, "global_step": 640699, "epoch": 7719} {"train_loss": -27.00774574279785, "global_step": 640700, "epoch": 7719} {"train_loss": -26.798181533813477, "global_step": 640701, "epoch": 7719} {"train_loss": -26.83888053894043, "global_step": 640702, "epoch": 7719} {"train_loss": -27.10597801208496, "global_step": 640703, "epoch": 7719} {"train_loss": -27.354034423828125, "global_step": 640704, "epoch": 7719} {"train_loss": -27.761322021484375, "global_step": 640705, "epoch": 7719} {"train_loss": -27.41370964050293, "global_step": 640706, "epoch": 7719} {"train_loss": -26.758930206298828, "global_step": 640707, "epoch": 7719} {"train_loss": -27.24017906188965, "global_step": 640708, "epoch": 7719} {"train_loss": -27.64362907409668, "global_step": 640709, "epoch": 7719} {"train_loss": -26.645605087280273, "global_step": 640710, "epoch": 7719} {"train_loss": -26.946441650390625, "global_step": 640711, "epoch": 7719} {"train_loss": -27.3478946685791, "global_step": 640712, "epoch": 7719} {"train_loss": -27.086023330688477, "global_step": 640713, "epoch": 7719} {"train_loss": -27.649768829345703, "global_step": 640714, "epoch": 7719} {"train_loss": -27.085163116455078, "global_step": 640715, "epoch": 7719} {"train_loss": -26.896930694580078, "global_step": 640716, "epoch": 7719} {"train_loss": -27.755374908447266, "global_step": 640717, "epoch": 7719} {"train_loss": -26.756454467773438, "global_step": 640718, "epoch": 7719} {"train_loss": -26.9516544342041, "global_step": 640719, "epoch": 7719} {"train_loss": -26.87749671936035, "global_step": 640720, "epoch": 7719} {"train_loss": -26.937902450561523, "global_step": 640721, "epoch": 7719} {"train_loss": -27.30983543395996, "global_step": 640722, "epoch": 7719} {"train_loss": -27.17719841003418, "global_step": 640723, "epoch": 7719} {"train_loss": -27.50483512878418, "global_step": 640724, "epoch": 7719} {"train_loss": -27.269384384155273, "global_step": 640725, "epoch": 7719} {"train_loss": -27.798919677734375, "global_step": 640726, "epoch": 7719} {"train_loss": -27.9930477142334, "global_step": 640727, "epoch": 7719} {"train_loss": -27.57171630859375, "global_step": 640728, "epoch": 7719} {"train_loss": -27.19126319885254, "global_step": 640729, "epoch": 7719} {"train_loss": -27.31732749938965, "global_step": 640730, "epoch": 7719} {"train_loss": -27.482141494750977, "global_step": 640731, "epoch": 7719} {"train_loss": -26.86040687561035, "global_step": 640732, "epoch": 7719} {"train_loss": -27.583295822143555, "global_step": 640733, "epoch": 7719} {"train_loss": -27.314472198486328, "global_step": 640734, "epoch": 7719} {"train_loss": -27.62302017211914, "global_step": 640735, "epoch": 7719} {"train_loss": -27.031686782836914, "global_step": 640736, "epoch": 7719} {"train_loss": -27.13846206665039, "global_step": 640737, "epoch": 7719} {"train_loss": -27.21766471862793, "global_step": 640738, "epoch": 7719} {"train_loss": -26.427453994750977, "global_step": 640739, "epoch": 7719} {"train_loss": -26.95068359375, "global_step": 640740, "epoch": 7719} {"train_loss": -26.766000747680664, "global_step": 640741, "epoch": 7719} {"train_loss": -26.72442626953125, "global_step": 640742, "epoch": 7719} {"train_loss": -26.98322105407715, "global_step": 640743, "epoch": 7719} {"train_loss": -26.8366641998291, "global_step": 640744, "epoch": 7719} {"train_loss": -26.7069091796875, "global_step": 640745, "epoch": 7719} {"train_loss": -26.831884384155273, "global_step": 640746, "epoch": 7719} {"train_loss": -26.959579467773438, "global_step": 640747, "epoch": 7719} {"train_loss": -26.305383682250977, "global_step": 640748, "epoch": 7719} {"train_loss": -27.39716911315918, "global_step": 640749, "epoch": 7719} {"train_loss": -26.837635040283203, "global_step": 640750, "epoch": 7719} {"train_loss": -27.720321655273438, "global_step": 640751, "epoch": 7719} {"train_loss": -27.373035430908203, "global_step": 640752, "epoch": 7719} {"train_loss": -27.26059341430664, "global_step": 640753, "epoch": 7719} {"train_loss": -26.7036190032959, "global_step": 640754, "epoch": 7719} {"train_loss": -27.074432373046875, "global_step": 640755, "epoch": 7719} {"train_loss": -27.624042510986328, "global_step": 640756, "epoch": 7719} {"train_loss": -27.188974380493164, "global_step": 640757, "epoch": 7719} {"train_loss": -27.09857177734375, "global_step": 640758, "epoch": 7719} {"train_loss": -27.025297233857305, "global_step": 640759, "epoch": 7719, "val_loss": 6549291.0} {"train_loss": -25.870136260986328, "global_step": 640760, "epoch": 7720} {"train_loss": -26.510374069213867, "global_step": 640761, "epoch": 7720} {"train_loss": -26.114850997924805, "global_step": 640762, "epoch": 7720} {"train_loss": -26.204635620117188, "global_step": 640763, "epoch": 7720} {"train_loss": -25.960163116455078, "global_step": 640764, "epoch": 7720} {"train_loss": -26.404401779174805, "global_step": 640765, "epoch": 7720} {"train_loss": -26.596271514892578, "global_step": 640766, "epoch": 7720} {"train_loss": -26.502737045288086, "global_step": 640767, "epoch": 7720} {"train_loss": -26.486011505126953, "global_step": 640768, "epoch": 7720} {"train_loss": -26.8460750579834, "global_step": 640769, "epoch": 7720} {"train_loss": -26.704397201538086, "global_step": 640770, "epoch": 7720} {"train_loss": -26.833112716674805, "global_step": 640771, "epoch": 7720} {"train_loss": -26.392597198486328, "global_step": 640772, "epoch": 7720} {"train_loss": -27.093524932861328, "global_step": 640773, "epoch": 7720} {"train_loss": -26.50103187561035, "global_step": 640774, "epoch": 7720} {"train_loss": -26.491796493530273, "global_step": 640775, "epoch": 7720} {"train_loss": -27.072925567626953, "global_step": 640776, "epoch": 7720} {"train_loss": -26.876123428344727, "global_step": 640777, "epoch": 7720} {"train_loss": -26.678281784057617, "global_step": 640778, "epoch": 7720} {"train_loss": -27.249786376953125, "global_step": 640779, "epoch": 7720} {"train_loss": -26.979114532470703, "global_step": 640780, "epoch": 7720} {"train_loss": -26.342838287353516, "global_step": 640781, "epoch": 7720} {"train_loss": -26.719751358032227, "global_step": 640782, "epoch": 7720} {"train_loss": -26.72210693359375, "global_step": 640783, "epoch": 7720} {"train_loss": -26.6198673248291, "global_step": 640784, "epoch": 7720} {"train_loss": -27.0610294342041, "global_step": 640785, "epoch": 7720} {"train_loss": -26.713165283203125, "global_step": 640786, "epoch": 7720} {"train_loss": -27.046722412109375, "global_step": 640787, "epoch": 7720} {"train_loss": -27.015335083007812, "global_step": 640788, "epoch": 7720} {"train_loss": -27.106061935424805, "global_step": 640789, "epoch": 7720} {"train_loss": -27.576374053955078, "global_step": 640790, "epoch": 7720} {"train_loss": -26.991281509399414, "global_step": 640791, "epoch": 7720} {"train_loss": -26.98447608947754, "global_step": 640792, "epoch": 7720} {"train_loss": -26.92657470703125, "global_step": 640793, "epoch": 7720} {"train_loss": -26.869916915893555, "global_step": 640794, "epoch": 7720} {"train_loss": -27.033864974975586, "global_step": 640795, "epoch": 7720} {"train_loss": -27.342334747314453, "global_step": 640796, "epoch": 7720} {"train_loss": -27.2154598236084, "global_step": 640797, "epoch": 7720} {"train_loss": -26.93940544128418, "global_step": 640798, "epoch": 7720} {"train_loss": -27.366220474243164, "global_step": 640799, "epoch": 7720} {"train_loss": -27.346939086914062, "global_step": 640800, "epoch": 7720} {"train_loss": -26.961774826049805, "global_step": 640801, "epoch": 7720} {"train_loss": -27.41827392578125, "global_step": 640802, "epoch": 7720} {"train_loss": -27.6236515045166, "global_step": 640803, "epoch": 7720} {"train_loss": -27.223459243774414, "global_step": 640804, "epoch": 7720} {"train_loss": -27.75160789489746, "global_step": 640805, "epoch": 7720} {"train_loss": -27.58636474609375, "global_step": 640806, "epoch": 7720} {"train_loss": -27.66745376586914, "global_step": 640807, "epoch": 7720} {"train_loss": -27.684045791625977, "global_step": 640808, "epoch": 7720} {"train_loss": -27.33546257019043, "global_step": 640809, "epoch": 7720} {"train_loss": -27.2432918548584, "global_step": 640810, "epoch": 7720} {"train_loss": -28.10230827331543, "global_step": 640811, "epoch": 7720} {"train_loss": -27.567731857299805, "global_step": 640812, "epoch": 7720} {"train_loss": -27.5013370513916, "global_step": 640813, "epoch": 7720} {"train_loss": -27.20891761779785, "global_step": 640814, "epoch": 7720} {"train_loss": -27.33942985534668, "global_step": 640815, "epoch": 7720} {"train_loss": -27.58904457092285, "global_step": 640816, "epoch": 7720} {"train_loss": -27.960676193237305, "global_step": 640817, "epoch": 7720} {"train_loss": -27.490509033203125, "global_step": 640818, "epoch": 7720} {"train_loss": -27.763341903686523, "global_step": 640819, "epoch": 7720} {"train_loss": -27.6652889251709, "global_step": 640820, "epoch": 7720} {"train_loss": -27.520191192626953, "global_step": 640821, "epoch": 7720} {"train_loss": -28.0194034576416, "global_step": 640822, "epoch": 7720} {"train_loss": -28.14217185974121, "global_step": 640823, "epoch": 7720} {"train_loss": -28.004993438720703, "global_step": 640824, "epoch": 7720} {"train_loss": -27.642759323120117, "global_step": 640825, "epoch": 7720} {"train_loss": -27.778833389282227, "global_step": 640826, "epoch": 7720} {"train_loss": -27.9045467376709, "global_step": 640827, "epoch": 7720} {"train_loss": -27.95924949645996, "global_step": 640828, "epoch": 7720} {"train_loss": -27.800495147705078, "global_step": 640829, "epoch": 7720} {"train_loss": -27.6862850189209, "global_step": 640830, "epoch": 7720} {"train_loss": -27.676471710205078, "global_step": 640831, "epoch": 7720} {"train_loss": -27.848651885986328, "global_step": 640832, "epoch": 7720} {"train_loss": -27.948698043823242, "global_step": 640833, "epoch": 7720} {"train_loss": -27.42093849182129, "global_step": 640834, "epoch": 7720} {"train_loss": -27.609760284423828, "global_step": 640835, "epoch": 7720} {"train_loss": -28.07269859313965, "global_step": 640836, "epoch": 7720} {"train_loss": -27.508136749267578, "global_step": 640837, "epoch": 7720} {"train_loss": -26.774646759033203, "global_step": 640838, "epoch": 7720} {"train_loss": -26.736907958984375, "global_step": 640839, "epoch": 7720} {"train_loss": -26.678144454956055, "global_step": 640840, "epoch": 7720} {"train_loss": -26.982666015625, "global_step": 640841, "epoch": 7720} {"train_loss": -27.20192010718656, "global_step": 640842, "epoch": 7720, "val_loss": 6577965.5} {"train_loss": -26.794275283813477, "global_step": 640843, "epoch": 7721} {"train_loss": -26.062108993530273, "global_step": 640844, "epoch": 7721} {"train_loss": -27.149927139282227, "global_step": 640845, "epoch": 7721} {"train_loss": -26.820859909057617, "global_step": 640846, "epoch": 7721} {"train_loss": -26.710107803344727, "global_step": 640847, "epoch": 7721} {"train_loss": -27.25809669494629, "global_step": 640848, "epoch": 7721} {"train_loss": -26.857126235961914, "global_step": 640849, "epoch": 7721} {"train_loss": -27.016437530517578, "global_step": 640850, "epoch": 7721} {"train_loss": -26.933469772338867, "global_step": 640851, "epoch": 7721} {"train_loss": -27.27359962463379, "global_step": 640852, "epoch": 7721} {"train_loss": -27.112646102905273, "global_step": 640853, "epoch": 7721} {"train_loss": -27.345829010009766, "global_step": 640854, "epoch": 7721} {"train_loss": -27.660053253173828, "global_step": 640855, "epoch": 7721} {"train_loss": -27.428510665893555, "global_step": 640856, "epoch": 7721} {"train_loss": -27.465131759643555, "global_step": 640857, "epoch": 7721} {"train_loss": -27.10603904724121, "global_step": 640858, "epoch": 7721} {"train_loss": -27.045551300048828, "global_step": 640859, "epoch": 7721} {"train_loss": -27.640674591064453, "global_step": 640860, "epoch": 7721} {"train_loss": -27.472997665405273, "global_step": 640861, "epoch": 7721} {"train_loss": -27.41816520690918, "global_step": 640862, "epoch": 7721} {"train_loss": -27.685449600219727, "global_step": 640863, "epoch": 7721} {"train_loss": -27.436933517456055, "global_step": 640864, "epoch": 7721} {"train_loss": -27.8631591796875, "global_step": 640865, "epoch": 7721} {"train_loss": -27.79865837097168, "global_step": 640866, "epoch": 7721} {"train_loss": -27.765533447265625, "global_step": 640867, "epoch": 7721} {"train_loss": -27.747350692749023, "global_step": 640868, "epoch": 7721} {"train_loss": -28.04572868347168, "global_step": 640869, "epoch": 7721} {"train_loss": -27.856088638305664, "global_step": 640870, "epoch": 7721} {"train_loss": -27.826526641845703, "global_step": 640871, "epoch": 7721} {"train_loss": -27.285120010375977, "global_step": 640872, "epoch": 7721} {"train_loss": -27.767730712890625, "global_step": 640873, "epoch": 7721} {"train_loss": -28.061216354370117, "global_step": 640874, "epoch": 7721} {"train_loss": -28.24139976501465, "global_step": 640875, "epoch": 7721} {"train_loss": -27.86810874938965, "global_step": 640876, "epoch": 7721} {"train_loss": -27.892658233642578, "global_step": 640877, "epoch": 7721} {"train_loss": -28.156299591064453, "global_step": 640878, "epoch": 7721} {"train_loss": -28.247394561767578, "global_step": 640879, "epoch": 7721} {"train_loss": -28.317968368530273, "global_step": 640880, "epoch": 7721} {"train_loss": -27.88228416442871, "global_step": 640881, "epoch": 7721} {"train_loss": -28.157974243164062, "global_step": 640882, "epoch": 7721} {"train_loss": -27.98095703125, "global_step": 640883, "epoch": 7721} {"train_loss": -28.242431640625, "global_step": 640884, "epoch": 7721} {"train_loss": -27.8547306060791, "global_step": 640885, "epoch": 7721} {"train_loss": -28.094396591186523, "global_step": 640886, "epoch": 7721} {"train_loss": -28.504552841186523, "global_step": 640887, "epoch": 7721} {"train_loss": -28.39710807800293, "global_step": 640888, "epoch": 7721} {"train_loss": -28.398534774780273, "global_step": 640889, "epoch": 7721} {"train_loss": -28.374420166015625, "global_step": 640890, "epoch": 7721} {"train_loss": -28.040555953979492, "global_step": 640891, "epoch": 7721} {"train_loss": -28.205652236938477, "global_step": 640892, "epoch": 7721} {"train_loss": -28.287216186523438, "global_step": 640893, "epoch": 7721} {"train_loss": -28.084157943725586, "global_step": 640894, "epoch": 7721} {"train_loss": -28.46051025390625, "global_step": 640895, "epoch": 7721} {"train_loss": -28.4809513092041, "global_step": 640896, "epoch": 7721} {"train_loss": -28.146839141845703, "global_step": 640897, "epoch": 7721} {"train_loss": -28.178110122680664, "global_step": 640898, "epoch": 7721} {"train_loss": -28.264158248901367, "global_step": 640899, "epoch": 7721} {"train_loss": -28.197751998901367, "global_step": 640900, "epoch": 7721} {"train_loss": -28.031415939331055, "global_step": 640901, "epoch": 7721} {"train_loss": -28.07745933532715, "global_step": 640902, "epoch": 7721} {"train_loss": -28.031110763549805, "global_step": 640903, "epoch": 7721} {"train_loss": -28.197742462158203, "global_step": 640904, "epoch": 7721} {"train_loss": -28.316068649291992, "global_step": 640905, "epoch": 7721} {"train_loss": -28.08497428894043, "global_step": 640906, "epoch": 7721} {"train_loss": -27.89226722717285, "global_step": 640907, "epoch": 7721} {"train_loss": -27.368696212768555, "global_step": 640908, "epoch": 7721} {"train_loss": -25.76325035095215, "global_step": 640909, "epoch": 7721} {"train_loss": -22.764957427978516, "global_step": 640910, "epoch": 7721} {"train_loss": -24.361534118652344, "global_step": 640911, "epoch": 7721} {"train_loss": -27.385202407836914, "global_step": 640912, "epoch": 7721} {"train_loss": -25.665637969970703, "global_step": 640913, "epoch": 7721} {"train_loss": -27.2932186126709, "global_step": 640914, "epoch": 7721} {"train_loss": -26.26312828063965, "global_step": 640915, "epoch": 7721} {"train_loss": -26.799509048461914, "global_step": 640916, "epoch": 7721} {"train_loss": -27.76691246032715, "global_step": 640917, "epoch": 7721} {"train_loss": -26.99619483947754, "global_step": 640918, "epoch": 7721} {"train_loss": -26.88710594177246, "global_step": 640919, "epoch": 7721} {"train_loss": -28.06842041015625, "global_step": 640920, "epoch": 7721} {"train_loss": -27.035322189331055, "global_step": 640921, "epoch": 7721} {"train_loss": -26.952239990234375, "global_step": 640922, "epoch": 7721} {"train_loss": -27.6070613861084, "global_step": 640923, "epoch": 7721} {"train_loss": -27.659748077392578, "global_step": 640924, "epoch": 7721} {"train_loss": -27.556223191410663, "global_step": 640925, "epoch": 7721, "val_loss": 6558886.0} {"train_loss": -27.36370277404785, "global_step": 640926, "epoch": 7722} {"train_loss": -27.191787719726562, "global_step": 640927, "epoch": 7722} {"train_loss": -27.201276779174805, "global_step": 640928, "epoch": 7722} {"train_loss": -27.296995162963867, "global_step": 640929, "epoch": 7722} {"train_loss": -27.368749618530273, "global_step": 640930, "epoch": 7722} {"train_loss": -27.440256118774414, "global_step": 640931, "epoch": 7722} {"train_loss": -27.2276611328125, "global_step": 640932, "epoch": 7722} {"train_loss": -27.07284927368164, "global_step": 640933, "epoch": 7722} {"train_loss": -27.627948760986328, "global_step": 640934, "epoch": 7722} {"train_loss": -27.58942985534668, "global_step": 640935, "epoch": 7722} {"train_loss": -26.966522216796875, "global_step": 640936, "epoch": 7722} {"train_loss": -27.355451583862305, "global_step": 640937, "epoch": 7722} {"train_loss": -27.627532958984375, "global_step": 640938, "epoch": 7722} {"train_loss": -27.655725479125977, "global_step": 640939, "epoch": 7722} {"train_loss": -27.52775001525879, "global_step": 640940, "epoch": 7722} {"train_loss": -27.835376739501953, "global_step": 640941, "epoch": 7722} {"train_loss": -27.4443416595459, "global_step": 640942, "epoch": 7722} {"train_loss": -27.53911781311035, "global_step": 640943, "epoch": 7722} {"train_loss": -27.766340255737305, "global_step": 640944, "epoch": 7722} {"train_loss": -27.661060333251953, "global_step": 640945, "epoch": 7722} {"train_loss": -27.530088424682617, "global_step": 640946, "epoch": 7722} {"train_loss": -27.968677520751953, "global_step": 640947, "epoch": 7722} {"train_loss": -27.65380859375, "global_step": 640948, "epoch": 7722} {"train_loss": -27.630722045898438, "global_step": 640949, "epoch": 7722} {"train_loss": -28.24445915222168, "global_step": 640950, "epoch": 7722} {"train_loss": -27.82819175720215, "global_step": 640951, "epoch": 7722} {"train_loss": -28.105947494506836, "global_step": 640952, "epoch": 7722} {"train_loss": -27.71685791015625, "global_step": 640953, "epoch": 7722} {"train_loss": -27.75239372253418, "global_step": 640954, "epoch": 7722} {"train_loss": -27.957029342651367, "global_step": 640955, "epoch": 7722} {"train_loss": -27.895307540893555, "global_step": 640956, "epoch": 7722} {"train_loss": -28.054563522338867, "global_step": 640957, "epoch": 7722} {"train_loss": -28.024524688720703, "global_step": 640958, "epoch": 7722} {"train_loss": -27.955907821655273, "global_step": 640959, "epoch": 7722} {"train_loss": -27.577234268188477, "global_step": 640960, "epoch": 7722} {"train_loss": -27.823078155517578, "global_step": 640961, "epoch": 7722} {"train_loss": -27.428449630737305, "global_step": 640962, "epoch": 7722} {"train_loss": -27.83527183532715, "global_step": 640963, "epoch": 7722} {"train_loss": -27.493885040283203, "global_step": 640964, "epoch": 7722} {"train_loss": -27.56410026550293, "global_step": 640965, "epoch": 7722} {"train_loss": -28.16200065612793, "global_step": 640966, "epoch": 7722} {"train_loss": -27.95051383972168, "global_step": 640967, "epoch": 7722} {"train_loss": -27.87293815612793, "global_step": 640968, "epoch": 7722} {"train_loss": -28.12687110900879, "global_step": 640969, "epoch": 7722} {"train_loss": -27.85886573791504, "global_step": 640970, "epoch": 7722} {"train_loss": -27.487457275390625, "global_step": 640971, "epoch": 7722} {"train_loss": -28.190290451049805, "global_step": 640972, "epoch": 7722} {"train_loss": -27.803024291992188, "global_step": 640973, "epoch": 7722} {"train_loss": -27.778400421142578, "global_step": 640974, "epoch": 7722} {"train_loss": -28.176654815673828, "global_step": 640975, "epoch": 7722} {"train_loss": -27.998722076416016, "global_step": 640976, "epoch": 7722} {"train_loss": -27.83939552307129, "global_step": 640977, "epoch": 7722} {"train_loss": -27.5757999420166, "global_step": 640978, "epoch": 7722} {"train_loss": -27.941207885742188, "global_step": 640979, "epoch": 7722} {"train_loss": -28.322650909423828, "global_step": 640980, "epoch": 7722} {"train_loss": -28.026275634765625, "global_step": 640981, "epoch": 7722} {"train_loss": -28.091474533081055, "global_step": 640982, "epoch": 7722} {"train_loss": -28.241174697875977, "global_step": 640983, "epoch": 7722} {"train_loss": -28.101667404174805, "global_step": 640984, "epoch": 7722} {"train_loss": -28.16498374938965, "global_step": 640985, "epoch": 7722} {"train_loss": -28.13844108581543, "global_step": 640986, "epoch": 7722} {"train_loss": -27.99357032775879, "global_step": 640987, "epoch": 7722} {"train_loss": -28.004779815673828, "global_step": 640988, "epoch": 7722} {"train_loss": -28.47732925415039, "global_step": 640989, "epoch": 7722} {"train_loss": -28.07368278503418, "global_step": 640990, "epoch": 7722} {"train_loss": -28.071121215820312, "global_step": 640991, "epoch": 7722} {"train_loss": -28.603763580322266, "global_step": 640992, "epoch": 7722} {"train_loss": -28.28379249572754, "global_step": 640993, "epoch": 7722} {"train_loss": -28.455175399780273, "global_step": 640994, "epoch": 7722} {"train_loss": -28.51826286315918, "global_step": 640995, "epoch": 7722} {"train_loss": -28.399396896362305, "global_step": 640996, "epoch": 7722} {"train_loss": -28.102331161499023, "global_step": 640997, "epoch": 7722} {"train_loss": -28.016916275024414, "global_step": 640998, "epoch": 7722} {"train_loss": -28.389184951782227, "global_step": 640999, "epoch": 7722} {"train_loss": -28.29353141784668, "global_step": 641000, "epoch": 7722} {"train_loss": -28.390172958374023, "global_step": 641001, "epoch": 7722} {"train_loss": -28.569019317626953, "global_step": 641002, "epoch": 7722} {"train_loss": -28.33136558532715, "global_step": 641003, "epoch": 7722} {"train_loss": -28.550573348999023, "global_step": 641004, "epoch": 7722} {"train_loss": -28.32935905456543, "global_step": 641005, "epoch": 7722} {"train_loss": -28.4937744140625, "global_step": 641006, "epoch": 7722} {"train_loss": -28.137191772460938, "global_step": 641007, "epoch": 7722} {"train_loss": -27.88307543835008, "global_step": 641008, "epoch": 7722, "val_loss": 6615960.0} {"train_loss": -26.88873863220215, "global_step": 641009, "epoch": 7723} {"train_loss": -26.666732788085938, "global_step": 641010, "epoch": 7723} {"train_loss": -26.63176918029785, "global_step": 641011, "epoch": 7723} {"train_loss": -27.245990753173828, "global_step": 641012, "epoch": 7723} {"train_loss": -27.546728134155273, "global_step": 641013, "epoch": 7723} {"train_loss": -27.145044326782227, "global_step": 641014, "epoch": 7723} {"train_loss": -27.49921226501465, "global_step": 641015, "epoch": 7723} {"train_loss": -27.555927276611328, "global_step": 641016, "epoch": 7723} {"train_loss": -27.22710609436035, "global_step": 641017, "epoch": 7723} {"train_loss": -27.748584747314453, "global_step": 641018, "epoch": 7723} {"train_loss": -27.68915367126465, "global_step": 641019, "epoch": 7723} {"train_loss": -27.595224380493164, "global_step": 641020, "epoch": 7723} {"train_loss": -27.917219161987305, "global_step": 641021, "epoch": 7723} {"train_loss": -27.83977699279785, "global_step": 641022, "epoch": 7723} {"train_loss": -27.868371963500977, "global_step": 641023, "epoch": 7723} {"train_loss": -27.921035766601562, "global_step": 641024, "epoch": 7723} {"train_loss": -27.983966827392578, "global_step": 641025, "epoch": 7723} {"train_loss": -28.050474166870117, "global_step": 641026, "epoch": 7723} {"train_loss": -27.880313873291016, "global_step": 641027, "epoch": 7723} {"train_loss": -27.678070068359375, "global_step": 641028, "epoch": 7723} {"train_loss": -27.96584129333496, "global_step": 641029, "epoch": 7723} {"train_loss": -28.007455825805664, "global_step": 641030, "epoch": 7723} {"train_loss": -28.486841201782227, "global_step": 641031, "epoch": 7723} {"train_loss": -27.811140060424805, "global_step": 641032, "epoch": 7723} {"train_loss": -27.97395133972168, "global_step": 641033, "epoch": 7723} {"train_loss": -28.18646240234375, "global_step": 641034, "epoch": 7723} {"train_loss": -28.015365600585938, "global_step": 641035, "epoch": 7723} {"train_loss": -28.16486167907715, "global_step": 641036, "epoch": 7723} {"train_loss": -28.225290298461914, "global_step": 641037, "epoch": 7723} {"train_loss": -28.139911651611328, "global_step": 641038, "epoch": 7723} {"train_loss": -28.327341079711914, "global_step": 641039, "epoch": 7723} {"train_loss": -28.199689865112305, "global_step": 641040, "epoch": 7723} {"train_loss": -28.4702091217041, "global_step": 641041, "epoch": 7723} {"train_loss": -28.50873374938965, "global_step": 641042, "epoch": 7723} {"train_loss": -28.146759033203125, "global_step": 641043, "epoch": 7723} {"train_loss": -28.295347213745117, "global_step": 641044, "epoch": 7723} {"train_loss": -28.084333419799805, "global_step": 641045, "epoch": 7723} {"train_loss": -28.221776962280273, "global_step": 641046, "epoch": 7723} {"train_loss": -28.31204605102539, "global_step": 641047, "epoch": 7723} {"train_loss": -28.040912628173828, "global_step": 641048, "epoch": 7723} {"train_loss": -28.398834228515625, "global_step": 641049, "epoch": 7723} {"train_loss": -28.285751342773438, "global_step": 641050, "epoch": 7723} {"train_loss": -28.470779418945312, "global_step": 641051, "epoch": 7723} {"train_loss": -28.158966064453125, "global_step": 641052, "epoch": 7723} {"train_loss": -28.29990577697754, "global_step": 641053, "epoch": 7723} {"train_loss": -28.198841094970703, "global_step": 641054, "epoch": 7723} {"train_loss": -28.611103057861328, "global_step": 641055, "epoch": 7723} {"train_loss": -28.327539443969727, "global_step": 641056, "epoch": 7723} {"train_loss": -28.511478424072266, "global_step": 641057, "epoch": 7723} {"train_loss": -28.81233024597168, "global_step": 641058, "epoch": 7723} {"train_loss": -28.539121627807617, "global_step": 641059, "epoch": 7723} {"train_loss": -28.03293800354004, "global_step": 641060, "epoch": 7723} {"train_loss": -28.65716552734375, "global_step": 641061, "epoch": 7723} {"train_loss": -27.87274742126465, "global_step": 641062, "epoch": 7723} {"train_loss": -28.111005783081055, "global_step": 641063, "epoch": 7723} {"train_loss": -28.177845001220703, "global_step": 641064, "epoch": 7723} {"train_loss": -28.69114112854004, "global_step": 641065, "epoch": 7723} {"train_loss": -28.439044952392578, "global_step": 641066, "epoch": 7723} {"train_loss": -27.78780174255371, "global_step": 641067, "epoch": 7723} {"train_loss": -28.741743087768555, "global_step": 641068, "epoch": 7723} {"train_loss": -28.474660873413086, "global_step": 641069, "epoch": 7723} {"train_loss": -28.4547061920166, "global_step": 641070, "epoch": 7723} {"train_loss": -28.758642196655273, "global_step": 641071, "epoch": 7723} {"train_loss": -28.5944766998291, "global_step": 641072, "epoch": 7723} {"train_loss": -28.2790584564209, "global_step": 641073, "epoch": 7723} {"train_loss": -28.755329132080078, "global_step": 641074, "epoch": 7723} {"train_loss": -28.21807861328125, "global_step": 641075, "epoch": 7723} {"train_loss": -28.471960067749023, "global_step": 641076, "epoch": 7723} {"train_loss": -28.77042007446289, "global_step": 641077, "epoch": 7723} {"train_loss": -28.545820236206055, "global_step": 641078, "epoch": 7723} {"train_loss": -28.324710845947266, "global_step": 641079, "epoch": 7723} {"train_loss": -28.237524032592773, "global_step": 641080, "epoch": 7723} {"train_loss": -28.3454532623291, "global_step": 641081, "epoch": 7723} {"train_loss": -28.530902862548828, "global_step": 641082, "epoch": 7723} {"train_loss": -28.489959716796875, "global_step": 641083, "epoch": 7723} {"train_loss": -28.706628799438477, "global_step": 641084, "epoch": 7723} {"train_loss": -28.199390411376953, "global_step": 641085, "epoch": 7723} {"train_loss": -28.498647689819336, "global_step": 641086, "epoch": 7723} {"train_loss": -28.180530548095703, "global_step": 641087, "epoch": 7723} {"train_loss": -28.42203140258789, "global_step": 641088, "epoch": 7723} {"train_loss": -28.509307861328125, "global_step": 641089, "epoch": 7723} {"train_loss": -27.942493438720703, "global_step": 641090, "epoch": 7723} {"train_loss": -28.140910780573467, "global_step": 641091, "epoch": 7723, "val_loss": 6678092.0} {"train_loss": -26.993427276611328, "global_step": 641092, "epoch": 7724} {"train_loss": -26.1319580078125, "global_step": 641093, "epoch": 7724} {"train_loss": -25.118724822998047, "global_step": 641094, "epoch": 7724} {"train_loss": -24.328975677490234, "global_step": 641095, "epoch": 7724} {"train_loss": -27.168806076049805, "global_step": 641096, "epoch": 7724} {"train_loss": -26.31589126586914, "global_step": 641097, "epoch": 7724} {"train_loss": -26.248401641845703, "global_step": 641098, "epoch": 7724} {"train_loss": -26.981918334960938, "global_step": 641099, "epoch": 7724} {"train_loss": -26.97174072265625, "global_step": 641100, "epoch": 7724} {"train_loss": -26.5647029876709, "global_step": 641101, "epoch": 7724} {"train_loss": -27.144336700439453, "global_step": 641102, "epoch": 7724} {"train_loss": -26.830244064331055, "global_step": 641103, "epoch": 7724} {"train_loss": -26.918310165405273, "global_step": 641104, "epoch": 7724} {"train_loss": -27.2218017578125, "global_step": 641105, "epoch": 7724} {"train_loss": -27.102895736694336, "global_step": 641106, "epoch": 7724} {"train_loss": -27.083053588867188, "global_step": 641107, "epoch": 7724} {"train_loss": -27.3311767578125, "global_step": 641108, "epoch": 7724} {"train_loss": -27.123632431030273, "global_step": 641109, "epoch": 7724} {"train_loss": -27.44049072265625, "global_step": 641110, "epoch": 7724} {"train_loss": -27.206296920776367, "global_step": 641111, "epoch": 7724} {"train_loss": -27.49726676940918, "global_step": 641112, "epoch": 7724} {"train_loss": -27.514297485351562, "global_step": 641113, "epoch": 7724} {"train_loss": -27.316373825073242, "global_step": 641114, "epoch": 7724} {"train_loss": -27.41172218322754, "global_step": 641115, "epoch": 7724} {"train_loss": -27.550582885742188, "global_step": 641116, "epoch": 7724} {"train_loss": -27.504261016845703, "global_step": 641117, "epoch": 7724} {"train_loss": -27.474103927612305, "global_step": 641118, "epoch": 7724} {"train_loss": -27.344404220581055, "global_step": 641119, "epoch": 7724} {"train_loss": -27.667362213134766, "global_step": 641120, "epoch": 7724} {"train_loss": -27.6694278717041, "global_step": 641121, "epoch": 7724} {"train_loss": -27.76025390625, "global_step": 641122, "epoch": 7724} {"train_loss": -27.629194259643555, "global_step": 641123, "epoch": 7724} {"train_loss": -27.64426040649414, "global_step": 641124, "epoch": 7724} {"train_loss": -28.055524826049805, "global_step": 641125, "epoch": 7724} {"train_loss": -27.807846069335938, "global_step": 641126, "epoch": 7724} {"train_loss": -28.277713775634766, "global_step": 641127, "epoch": 7724} {"train_loss": -28.043872833251953, "global_step": 641128, "epoch": 7724} {"train_loss": -28.214948654174805, "global_step": 641129, "epoch": 7724} {"train_loss": -27.930816650390625, "global_step": 641130, "epoch": 7724} {"train_loss": -28.2922306060791, "global_step": 641131, "epoch": 7724} {"train_loss": -27.800220489501953, "global_step": 641132, "epoch": 7724} {"train_loss": -28.081151962280273, "global_step": 641133, "epoch": 7724} {"train_loss": -27.6794490814209, "global_step": 641134, "epoch": 7724} {"train_loss": -28.129175186157227, "global_step": 641135, "epoch": 7724} {"train_loss": -28.058568954467773, "global_step": 641136, "epoch": 7724} {"train_loss": -28.002227783203125, "global_step": 641137, "epoch": 7724} {"train_loss": -28.272741317749023, "global_step": 641138, "epoch": 7724} {"train_loss": -27.925073623657227, "global_step": 641139, "epoch": 7724} {"train_loss": -27.92543601989746, "global_step": 641140, "epoch": 7724} {"train_loss": -27.85651206970215, "global_step": 641141, "epoch": 7724} {"train_loss": -28.3370304107666, "global_step": 641142, "epoch": 7724} {"train_loss": -28.30682945251465, "global_step": 641143, "epoch": 7724} {"train_loss": -28.613019943237305, "global_step": 641144, "epoch": 7724} {"train_loss": -28.169921875, "global_step": 641145, "epoch": 7724} {"train_loss": -28.4042911529541, "global_step": 641146, "epoch": 7724} {"train_loss": -28.39676284790039, "global_step": 641147, "epoch": 7724} {"train_loss": -28.378894805908203, "global_step": 641148, "epoch": 7724} {"train_loss": -28.605548858642578, "global_step": 641149, "epoch": 7724} {"train_loss": -28.038877487182617, "global_step": 641150, "epoch": 7724} {"train_loss": -28.31544303894043, "global_step": 641151, "epoch": 7724} {"train_loss": -28.60135269165039, "global_step": 641152, "epoch": 7724} {"train_loss": -28.19911766052246, "global_step": 641153, "epoch": 7724} {"train_loss": -28.703617095947266, "global_step": 641154, "epoch": 7724} {"train_loss": -28.718597412109375, "global_step": 641155, "epoch": 7724} {"train_loss": -28.313613891601562, "global_step": 641156, "epoch": 7724} {"train_loss": -28.307525634765625, "global_step": 641157, "epoch": 7724} {"train_loss": -28.190296173095703, "global_step": 641158, "epoch": 7724} {"train_loss": -28.315174102783203, "global_step": 641159, "epoch": 7724} {"train_loss": -28.504865646362305, "global_step": 641160, "epoch": 7724} {"train_loss": -28.25383949279785, "global_step": 641161, "epoch": 7724} {"train_loss": -28.190811157226562, "global_step": 641162, "epoch": 7724} {"train_loss": -28.415576934814453, "global_step": 641163, "epoch": 7724} {"train_loss": -28.211400985717773, "global_step": 641164, "epoch": 7724} {"train_loss": -28.443161010742188, "global_step": 641165, "epoch": 7724} {"train_loss": -28.64202880859375, "global_step": 641166, "epoch": 7724} {"train_loss": -28.504438400268555, "global_step": 641167, "epoch": 7724} {"train_loss": -28.457916259765625, "global_step": 641168, "epoch": 7724} {"train_loss": -27.96923828125, "global_step": 641169, "epoch": 7724} {"train_loss": -28.230886459350586, "global_step": 641170, "epoch": 7724} {"train_loss": -28.80301284790039, "global_step": 641171, "epoch": 7724} {"train_loss": -28.15121841430664, "global_step": 641172, "epoch": 7724} {"train_loss": -27.7777042388916, "global_step": 641173, "epoch": 7724} {"train_loss": -27.7719583166651, "global_step": 641174, "epoch": 7724, "val_loss": 6577429.0} {"train_loss": -27.948047637939453, "global_step": 641175, "epoch": 7725} {"train_loss": -27.60992431640625, "global_step": 641176, "epoch": 7725} {"train_loss": -27.361555099487305, "global_step": 641177, "epoch": 7725} {"train_loss": -27.408193588256836, "global_step": 641178, "epoch": 7725} {"train_loss": -27.377277374267578, "global_step": 641179, "epoch": 7725} {"train_loss": -27.985565185546875, "global_step": 641180, "epoch": 7725} {"train_loss": -27.54767417907715, "global_step": 641181, "epoch": 7725} {"train_loss": -27.78388786315918, "global_step": 641182, "epoch": 7725} {"train_loss": -27.930316925048828, "global_step": 641183, "epoch": 7725} {"train_loss": -28.0379638671875, "global_step": 641184, "epoch": 7725} {"train_loss": -27.542926788330078, "global_step": 641185, "epoch": 7725} {"train_loss": -27.399154663085938, "global_step": 641186, "epoch": 7725} {"train_loss": -27.446645736694336, "global_step": 641187, "epoch": 7725} {"train_loss": -27.847213745117188, "global_step": 641188, "epoch": 7725} {"train_loss": -28.3482608795166, "global_step": 641189, "epoch": 7725} {"train_loss": -28.146865844726562, "global_step": 641190, "epoch": 7725} {"train_loss": -28.011884689331055, "global_step": 641191, "epoch": 7725} {"train_loss": -27.926355361938477, "global_step": 641192, "epoch": 7725} {"train_loss": -28.188444137573242, "global_step": 641193, "epoch": 7725} {"train_loss": -28.47393798828125, "global_step": 641194, "epoch": 7725} {"train_loss": -28.36408042907715, "global_step": 641195, "epoch": 7725} {"train_loss": -28.184345245361328, "global_step": 641196, "epoch": 7725} {"train_loss": -28.0747127532959, "global_step": 641197, "epoch": 7725} {"train_loss": -28.073408126831055, "global_step": 641198, "epoch": 7725} {"train_loss": -28.076406478881836, "global_step": 641199, "epoch": 7725} {"train_loss": -28.497358322143555, "global_step": 641200, "epoch": 7725} {"train_loss": -28.224584579467773, "global_step": 641201, "epoch": 7725} {"train_loss": -28.3291072845459, "global_step": 641202, "epoch": 7725} {"train_loss": -28.64344596862793, "global_step": 641203, "epoch": 7725} {"train_loss": -27.973541259765625, "global_step": 641204, "epoch": 7725} {"train_loss": -28.083154678344727, "global_step": 641205, "epoch": 7725} {"train_loss": -28.258665084838867, "global_step": 641206, "epoch": 7725} {"train_loss": -28.3770751953125, "global_step": 641207, "epoch": 7725} {"train_loss": -28.377527236938477, "global_step": 641208, "epoch": 7725} {"train_loss": -28.45001792907715, "global_step": 641209, "epoch": 7725} {"train_loss": -28.1495361328125, "global_step": 641210, "epoch": 7725} {"train_loss": -28.533422470092773, "global_step": 641211, "epoch": 7725} {"train_loss": -28.181272506713867, "global_step": 641212, "epoch": 7725} {"train_loss": -28.188154220581055, "global_step": 641213, "epoch": 7725} {"train_loss": -28.179243087768555, "global_step": 641214, "epoch": 7725} {"train_loss": -28.443958282470703, "global_step": 641215, "epoch": 7725} {"train_loss": -28.50160026550293, "global_step": 641216, "epoch": 7725} {"train_loss": -27.89588737487793, "global_step": 641217, "epoch": 7725} {"train_loss": -28.432098388671875, "global_step": 641218, "epoch": 7725} {"train_loss": -28.339338302612305, "global_step": 641219, "epoch": 7725} {"train_loss": -28.349348068237305, "global_step": 641220, "epoch": 7725} {"train_loss": -28.23707389831543, "global_step": 641221, "epoch": 7725} {"train_loss": -28.394834518432617, "global_step": 641222, "epoch": 7725} {"train_loss": -28.413740158081055, "global_step": 641223, "epoch": 7725} {"train_loss": -28.350141525268555, "global_step": 641224, "epoch": 7725} {"train_loss": -27.885400772094727, "global_step": 641225, "epoch": 7725} {"train_loss": -28.18556785583496, "global_step": 641226, "epoch": 7725} {"train_loss": -28.2894287109375, "global_step": 641227, "epoch": 7725} {"train_loss": -28.363393783569336, "global_step": 641228, "epoch": 7725} {"train_loss": -28.224401473999023, "global_step": 641229, "epoch": 7725} {"train_loss": -28.4040470123291, "global_step": 641230, "epoch": 7725} {"train_loss": -28.1603946685791, "global_step": 641231, "epoch": 7725} {"train_loss": -28.408605575561523, "global_step": 641232, "epoch": 7725} {"train_loss": -28.049957275390625, "global_step": 641233, "epoch": 7725} {"train_loss": -28.053796768188477, "global_step": 641234, "epoch": 7725} {"train_loss": -28.211645126342773, "global_step": 641235, "epoch": 7725} {"train_loss": -28.515960693359375, "global_step": 641236, "epoch": 7725} {"train_loss": -28.37566566467285, "global_step": 641237, "epoch": 7725} {"train_loss": -28.511743545532227, "global_step": 641238, "epoch": 7725} {"train_loss": -28.385644912719727, "global_step": 641239, "epoch": 7725} {"train_loss": -28.359487533569336, "global_step": 641240, "epoch": 7725} {"train_loss": -28.43890953063965, "global_step": 641241, "epoch": 7725} {"train_loss": -28.62055015563965, "global_step": 641242, "epoch": 7725} {"train_loss": -28.17496109008789, "global_step": 641243, "epoch": 7725} {"train_loss": -28.3634033203125, "global_step": 641244, "epoch": 7725} {"train_loss": -28.409284591674805, "global_step": 641245, "epoch": 7725} {"train_loss": -28.4965877532959, "global_step": 641246, "epoch": 7725} {"train_loss": -28.054494857788086, "global_step": 641247, "epoch": 7725} {"train_loss": -28.498376846313477, "global_step": 641248, "epoch": 7725} {"train_loss": -28.25341796875, "global_step": 641249, "epoch": 7725} {"train_loss": -28.441625595092773, "global_step": 641250, "epoch": 7725} {"train_loss": -28.876495361328125, "global_step": 641251, "epoch": 7725} {"train_loss": -28.492971420288086, "global_step": 641252, "epoch": 7725} {"train_loss": -28.425687789916992, "global_step": 641253, "epoch": 7725} {"train_loss": -28.603849411010742, "global_step": 641254, "epoch": 7725} {"train_loss": -28.439395904541016, "global_step": 641255, "epoch": 7725} {"train_loss": -28.353748321533203, "global_step": 641256, "epoch": 7725} {"train_loss": -28.208888800747424, "global_step": 641257, "epoch": 7725, "val_loss": 6629408.5} {"train_loss": -28.08601188659668, "global_step": 641258, "epoch": 7726} {"train_loss": -27.400943756103516, "global_step": 641259, "epoch": 7726} {"train_loss": -27.01327896118164, "global_step": 641260, "epoch": 7726} {"train_loss": -27.22736167907715, "global_step": 641261, "epoch": 7726} {"train_loss": -28.141223907470703, "global_step": 641262, "epoch": 7726} {"train_loss": -27.227203369140625, "global_step": 641263, "epoch": 7726} {"train_loss": -27.27202796936035, "global_step": 641264, "epoch": 7726} {"train_loss": -28.132434844970703, "global_step": 641265, "epoch": 7726} {"train_loss": -27.681867599487305, "global_step": 641266, "epoch": 7726} {"train_loss": -27.890222549438477, "global_step": 641267, "epoch": 7726} {"train_loss": -27.94989013671875, "global_step": 641268, "epoch": 7726} {"train_loss": -28.149824142456055, "global_step": 641269, "epoch": 7726} {"train_loss": -28.252172470092773, "global_step": 641270, "epoch": 7726} {"train_loss": -27.902185440063477, "global_step": 641271, "epoch": 7726} {"train_loss": -28.070072174072266, "global_step": 641272, "epoch": 7726} {"train_loss": -28.3319034576416, "global_step": 641273, "epoch": 7726} {"train_loss": -27.917877197265625, "global_step": 641274, "epoch": 7726} {"train_loss": -28.453006744384766, "global_step": 641275, "epoch": 7726} {"train_loss": -27.88739585876465, "global_step": 641276, "epoch": 7726} {"train_loss": -28.16277503967285, "global_step": 641277, "epoch": 7726} {"train_loss": -28.0892333984375, "global_step": 641278, "epoch": 7726} {"train_loss": -27.94453239440918, "global_step": 641279, "epoch": 7726} {"train_loss": -27.863000869750977, "global_step": 641280, "epoch": 7726} {"train_loss": -27.634885787963867, "global_step": 641281, "epoch": 7726} {"train_loss": -28.404783248901367, "global_step": 641282, "epoch": 7726} {"train_loss": -27.894351959228516, "global_step": 641283, "epoch": 7726} {"train_loss": -28.362791061401367, "global_step": 641284, "epoch": 7726} {"train_loss": -28.361974716186523, "global_step": 641285, "epoch": 7726} {"train_loss": -28.1372127532959, "global_step": 641286, "epoch": 7726} {"train_loss": -28.3626766204834, "global_step": 641287, "epoch": 7726} {"train_loss": -28.156530380249023, "global_step": 641288, "epoch": 7726} {"train_loss": -28.2979793548584, "global_step": 641289, "epoch": 7726} {"train_loss": -28.112699508666992, "global_step": 641290, "epoch": 7726} {"train_loss": -28.20502281188965, "global_step": 641291, "epoch": 7726} {"train_loss": -28.516691207885742, "global_step": 641292, "epoch": 7726} {"train_loss": -28.097631454467773, "global_step": 641293, "epoch": 7726} {"train_loss": -28.100605010986328, "global_step": 641294, "epoch": 7726} {"train_loss": -28.268705368041992, "global_step": 641295, "epoch": 7726} {"train_loss": -28.5749568939209, "global_step": 641296, "epoch": 7726} {"train_loss": -28.195951461791992, "global_step": 641297, "epoch": 7726} {"train_loss": -28.263721466064453, "global_step": 641298, "epoch": 7726} {"train_loss": -27.79410743713379, "global_step": 641299, "epoch": 7726} {"train_loss": -28.364965438842773, "global_step": 641300, "epoch": 7726} {"train_loss": -28.1531982421875, "global_step": 641301, "epoch": 7726} {"train_loss": -28.14983558654785, "global_step": 641302, "epoch": 7726} {"train_loss": -28.10687255859375, "global_step": 641303, "epoch": 7726} {"train_loss": -28.165225982666016, "global_step": 641304, "epoch": 7726} {"train_loss": -28.254308700561523, "global_step": 641305, "epoch": 7726} {"train_loss": -28.291366577148438, "global_step": 641306, "epoch": 7726} {"train_loss": -28.1075496673584, "global_step": 641307, "epoch": 7726} {"train_loss": -28.156021118164062, "global_step": 641308, "epoch": 7726} {"train_loss": -28.702411651611328, "global_step": 641309, "epoch": 7726} {"train_loss": -28.27906608581543, "global_step": 641310, "epoch": 7726} {"train_loss": -28.173933029174805, "global_step": 641311, "epoch": 7726} {"train_loss": -28.625701904296875, "global_step": 641312, "epoch": 7726} {"train_loss": -28.299680709838867, "global_step": 641313, "epoch": 7726} {"train_loss": -28.068206787109375, "global_step": 641314, "epoch": 7726} {"train_loss": -28.575332641601562, "global_step": 641315, "epoch": 7726} {"train_loss": -28.624652862548828, "global_step": 641316, "epoch": 7726} {"train_loss": -28.146841049194336, "global_step": 641317, "epoch": 7726} {"train_loss": -28.420215606689453, "global_step": 641318, "epoch": 7726} {"train_loss": -28.180200576782227, "global_step": 641319, "epoch": 7726} {"train_loss": -28.543991088867188, "global_step": 641320, "epoch": 7726} {"train_loss": -28.414203643798828, "global_step": 641321, "epoch": 7726} {"train_loss": -28.406721115112305, "global_step": 641322, "epoch": 7726} {"train_loss": -28.308685302734375, "global_step": 641323, "epoch": 7726} {"train_loss": -28.32590675354004, "global_step": 641324, "epoch": 7726} {"train_loss": -28.07318687438965, "global_step": 641325, "epoch": 7726} {"train_loss": -28.252323150634766, "global_step": 641326, "epoch": 7726} {"train_loss": -28.256677627563477, "global_step": 641327, "epoch": 7726} {"train_loss": -28.23818016052246, "global_step": 641328, "epoch": 7726} {"train_loss": -28.608983993530273, "global_step": 641329, "epoch": 7726} {"train_loss": -28.356115341186523, "global_step": 641330, "epoch": 7726} {"train_loss": -28.336904525756836, "global_step": 641331, "epoch": 7726} {"train_loss": -28.103900909423828, "global_step": 641332, "epoch": 7726} {"train_loss": -27.74267578125, "global_step": 641333, "epoch": 7726} {"train_loss": -27.392333984375, "global_step": 641334, "epoch": 7726} {"train_loss": -27.9908504486084, "global_step": 641335, "epoch": 7726} {"train_loss": -28.2044620513916, "global_step": 641336, "epoch": 7726} {"train_loss": -28.489938735961914, "global_step": 641337, "epoch": 7726} {"train_loss": -28.368967056274414, "global_step": 641338, "epoch": 7726} {"train_loss": -28.622058868408203, "global_step": 641339, "epoch": 7726} {"train_loss": -28.157911369599493, "global_step": 641340, "epoch": 7726, "val_loss": 6687926.0} {"train_loss": -28.3287410736084, "global_step": 641341, "epoch": 7727} {"train_loss": -28.501575469970703, "global_step": 641342, "epoch": 7727} {"train_loss": -28.079381942749023, "global_step": 641343, "epoch": 7727} {"train_loss": -27.86513328552246, "global_step": 641344, "epoch": 7727} {"train_loss": -28.2247371673584, "global_step": 641345, "epoch": 7727} {"train_loss": -28.1916446685791, "global_step": 641346, "epoch": 7727} {"train_loss": -27.843122482299805, "global_step": 641347, "epoch": 7727} {"train_loss": -27.752578735351562, "global_step": 641348, "epoch": 7727} {"train_loss": -28.21651268005371, "global_step": 641349, "epoch": 7727} {"train_loss": -27.702655792236328, "global_step": 641350, "epoch": 7727} {"train_loss": -27.913726806640625, "global_step": 641351, "epoch": 7727} {"train_loss": -27.235448837280273, "global_step": 641352, "epoch": 7727} {"train_loss": -27.837387084960938, "global_step": 641353, "epoch": 7727} {"train_loss": -27.85828971862793, "global_step": 641354, "epoch": 7727} {"train_loss": -27.8856143951416, "global_step": 641355, "epoch": 7727} {"train_loss": -27.718469619750977, "global_step": 641356, "epoch": 7727} {"train_loss": -27.87591552734375, "global_step": 641357, "epoch": 7727} {"train_loss": -27.7874813079834, "global_step": 641358, "epoch": 7727} {"train_loss": -27.801599502563477, "global_step": 641359, "epoch": 7727} {"train_loss": -28.176965713500977, "global_step": 641360, "epoch": 7727} {"train_loss": -28.4212589263916, "global_step": 641361, "epoch": 7727} {"train_loss": -27.988080978393555, "global_step": 641362, "epoch": 7727} {"train_loss": -28.532270431518555, "global_step": 641363, "epoch": 7727} {"train_loss": -28.23410415649414, "global_step": 641364, "epoch": 7727} {"train_loss": -28.237838745117188, "global_step": 641365, "epoch": 7727} {"train_loss": -28.304264068603516, "global_step": 641366, "epoch": 7727} {"train_loss": -27.950626373291016, "global_step": 641367, "epoch": 7727} {"train_loss": -27.78500747680664, "global_step": 641368, "epoch": 7727} {"train_loss": -28.2331600189209, "global_step": 641369, "epoch": 7727} {"train_loss": -27.997684478759766, "global_step": 641370, "epoch": 7727} {"train_loss": -28.348867416381836, "global_step": 641371, "epoch": 7727} {"train_loss": -28.32792091369629, "global_step": 641372, "epoch": 7727} {"train_loss": -28.5435733795166, "global_step": 641373, "epoch": 7727} {"train_loss": -28.6052188873291, "global_step": 641374, "epoch": 7727} {"train_loss": -28.1470947265625, "global_step": 641375, "epoch": 7727} {"train_loss": -28.258209228515625, "global_step": 641376, "epoch": 7727} {"train_loss": -28.2410831451416, "global_step": 641377, "epoch": 7727} {"train_loss": -28.41608238220215, "global_step": 641378, "epoch": 7727} {"train_loss": -28.413686752319336, "global_step": 641379, "epoch": 7727} {"train_loss": -28.49616050720215, "global_step": 641380, "epoch": 7727} {"train_loss": -28.369831085205078, "global_step": 641381, "epoch": 7727} {"train_loss": -28.585962295532227, "global_step": 641382, "epoch": 7727} {"train_loss": -28.06630516052246, "global_step": 641383, "epoch": 7727} {"train_loss": -28.390817642211914, "global_step": 641384, "epoch": 7727} {"train_loss": -28.704660415649414, "global_step": 641385, "epoch": 7727} {"train_loss": -28.527185440063477, "global_step": 641386, "epoch": 7727} {"train_loss": -28.729339599609375, "global_step": 641387, "epoch": 7727} {"train_loss": -28.238422393798828, "global_step": 641388, "epoch": 7727} {"train_loss": -28.582056045532227, "global_step": 641389, "epoch": 7727} {"train_loss": -28.397916793823242, "global_step": 641390, "epoch": 7727} {"train_loss": -28.4162654876709, "global_step": 641391, "epoch": 7727} {"train_loss": -28.599170684814453, "global_step": 641392, "epoch": 7727} {"train_loss": -28.6848201751709, "global_step": 641393, "epoch": 7727} {"train_loss": -28.177692413330078, "global_step": 641394, "epoch": 7727} {"train_loss": -28.46088218688965, "global_step": 641395, "epoch": 7727} {"train_loss": -28.452436447143555, "global_step": 641396, "epoch": 7727} {"train_loss": -28.387359619140625, "global_step": 641397, "epoch": 7727} {"train_loss": -28.4278564453125, "global_step": 641398, "epoch": 7727} {"train_loss": -28.148136138916016, "global_step": 641399, "epoch": 7727} {"train_loss": -28.30588150024414, "global_step": 641400, "epoch": 7727} {"train_loss": -28.280858993530273, "global_step": 641401, "epoch": 7727} {"train_loss": -28.462976455688477, "global_step": 641402, "epoch": 7727} {"train_loss": -28.33660888671875, "global_step": 641403, "epoch": 7727} {"train_loss": -28.695302963256836, "global_step": 641404, "epoch": 7727} {"train_loss": -28.414031982421875, "global_step": 641405, "epoch": 7727} {"train_loss": -28.665313720703125, "global_step": 641406, "epoch": 7727} {"train_loss": -28.603803634643555, "global_step": 641407, "epoch": 7727} {"train_loss": -28.239044189453125, "global_step": 641408, "epoch": 7727} {"train_loss": -28.799474716186523, "global_step": 641409, "epoch": 7727} {"train_loss": -28.260480880737305, "global_step": 641410, "epoch": 7727} {"train_loss": -28.79292106628418, "global_step": 641411, "epoch": 7727} {"train_loss": -28.625707626342773, "global_step": 641412, "epoch": 7727} {"train_loss": -28.259246826171875, "global_step": 641413, "epoch": 7727} {"train_loss": -28.54987144470215, "global_step": 641414, "epoch": 7727} {"train_loss": -28.215322494506836, "global_step": 641415, "epoch": 7727} {"train_loss": -28.131345748901367, "global_step": 641416, "epoch": 7727} {"train_loss": -26.789270401000977, "global_step": 641417, "epoch": 7727} {"train_loss": -24.938514709472656, "global_step": 641418, "epoch": 7727} {"train_loss": -24.80501365661621, "global_step": 641419, "epoch": 7727} {"train_loss": -25.756845474243164, "global_step": 641420, "epoch": 7727} {"train_loss": -27.441181182861328, "global_step": 641421, "epoch": 7727} {"train_loss": -26.889673233032227, "global_step": 641422, "epoch": 7727} {"train_loss": -28.08756573228951, "global_step": 641423, "epoch": 7727, "val_loss": 6754394.0} {"train_loss": -27.187681198120117, "global_step": 641424, "epoch": 7728} {"train_loss": -25.985219955444336, "global_step": 641425, "epoch": 7728} {"train_loss": -27.32526206970215, "global_step": 641426, "epoch": 7728} {"train_loss": -26.52200698852539, "global_step": 641427, "epoch": 7728} {"train_loss": -27.109180450439453, "global_step": 641428, "epoch": 7728} {"train_loss": -26.752838134765625, "global_step": 641429, "epoch": 7728} {"train_loss": -26.79786491394043, "global_step": 641430, "epoch": 7728} {"train_loss": -26.77454948425293, "global_step": 641431, "epoch": 7728} {"train_loss": -26.63848876953125, "global_step": 641432, "epoch": 7728} {"train_loss": -26.8006649017334, "global_step": 641433, "epoch": 7728} {"train_loss": -26.79229164123535, "global_step": 641434, "epoch": 7728} {"train_loss": -26.782764434814453, "global_step": 641435, "epoch": 7728} {"train_loss": -27.28194236755371, "global_step": 641436, "epoch": 7728} {"train_loss": -26.96846580505371, "global_step": 641437, "epoch": 7728} {"train_loss": -27.274728775024414, "global_step": 641438, "epoch": 7728} {"train_loss": -27.269330978393555, "global_step": 641439, "epoch": 7728} {"train_loss": -27.4234676361084, "global_step": 641440, "epoch": 7728} {"train_loss": -27.522680282592773, "global_step": 641441, "epoch": 7728} {"train_loss": -27.3297119140625, "global_step": 641442, "epoch": 7728} {"train_loss": -27.593463897705078, "global_step": 641443, "epoch": 7728} {"train_loss": -27.113147735595703, "global_step": 641444, "epoch": 7728} {"train_loss": -27.594970703125, "global_step": 641445, "epoch": 7728} {"train_loss": -27.724393844604492, "global_step": 641446, "epoch": 7728} {"train_loss": -27.70667839050293, "global_step": 641447, "epoch": 7728} {"train_loss": -27.739673614501953, "global_step": 641448, "epoch": 7728} {"train_loss": -27.69944190979004, "global_step": 641449, "epoch": 7728} {"train_loss": -27.945371627807617, "global_step": 641450, "epoch": 7728} {"train_loss": -27.79570960998535, "global_step": 641451, "epoch": 7728} {"train_loss": -27.895658493041992, "global_step": 641452, "epoch": 7728} {"train_loss": -27.580358505249023, "global_step": 641453, "epoch": 7728} {"train_loss": -27.44354820251465, "global_step": 641454, "epoch": 7728} {"train_loss": -28.390552520751953, "global_step": 641455, "epoch": 7728} {"train_loss": -27.962787628173828, "global_step": 641456, "epoch": 7728} {"train_loss": -27.94040298461914, "global_step": 641457, "epoch": 7728} {"train_loss": -27.474716186523438, "global_step": 641458, "epoch": 7728} {"train_loss": -28.0164852142334, "global_step": 641459, "epoch": 7728} {"train_loss": -28.257116317749023, "global_step": 641460, "epoch": 7728} {"train_loss": -28.003448486328125, "global_step": 641461, "epoch": 7728} {"train_loss": -28.025754928588867, "global_step": 641462, "epoch": 7728} {"train_loss": -28.23601722717285, "global_step": 641463, "epoch": 7728} {"train_loss": -28.48287010192871, "global_step": 641464, "epoch": 7728} {"train_loss": -28.4060115814209, "global_step": 641465, "epoch": 7728} {"train_loss": -28.061384201049805, "global_step": 641466, "epoch": 7728} {"train_loss": -28.46294593811035, "global_step": 641467, "epoch": 7728} {"train_loss": -28.46856689453125, "global_step": 641468, "epoch": 7728} {"train_loss": -28.179248809814453, "global_step": 641469, "epoch": 7728} {"train_loss": -28.528982162475586, "global_step": 641470, "epoch": 7728} {"train_loss": -28.62031364440918, "global_step": 641471, "epoch": 7728} {"train_loss": -28.33436393737793, "global_step": 641472, "epoch": 7728} {"train_loss": -28.53193473815918, "global_step": 641473, "epoch": 7728} {"train_loss": -28.43011474609375, "global_step": 641474, "epoch": 7728} {"train_loss": -28.556161880493164, "global_step": 641475, "epoch": 7728} {"train_loss": -28.53045082092285, "global_step": 641476, "epoch": 7728} {"train_loss": -28.20712661743164, "global_step": 641477, "epoch": 7728} {"train_loss": -28.586578369140625, "global_step": 641478, "epoch": 7728} {"train_loss": -28.655561447143555, "global_step": 641479, "epoch": 7728} {"train_loss": -28.600500106811523, "global_step": 641480, "epoch": 7728} {"train_loss": -28.415128707885742, "global_step": 641481, "epoch": 7728} {"train_loss": -28.906665802001953, "global_step": 641482, "epoch": 7728} {"train_loss": -28.20619773864746, "global_step": 641483, "epoch": 7728} {"train_loss": -28.16859245300293, "global_step": 641484, "epoch": 7728} {"train_loss": -28.073537826538086, "global_step": 641485, "epoch": 7728} {"train_loss": -28.27748680114746, "global_step": 641486, "epoch": 7728} {"train_loss": -28.734201431274414, "global_step": 641487, "epoch": 7728} {"train_loss": -28.35713005065918, "global_step": 641488, "epoch": 7728} {"train_loss": -28.487863540649414, "global_step": 641489, "epoch": 7728} {"train_loss": -28.86175537109375, "global_step": 641490, "epoch": 7728} {"train_loss": -28.47002601623535, "global_step": 641491, "epoch": 7728} {"train_loss": -28.369403839111328, "global_step": 641492, "epoch": 7728} {"train_loss": -28.299158096313477, "global_step": 641493, "epoch": 7728} {"train_loss": -28.349348068237305, "global_step": 641494, "epoch": 7728} {"train_loss": -28.52446937561035, "global_step": 641495, "epoch": 7728} {"train_loss": -28.629302978515625, "global_step": 641496, "epoch": 7728} {"train_loss": -28.432544708251953, "global_step": 641497, "epoch": 7728} {"train_loss": -28.592605590820312, "global_step": 641498, "epoch": 7728} {"train_loss": -27.940404891967773, "global_step": 641499, "epoch": 7728} {"train_loss": -28.625333786010742, "global_step": 641500, "epoch": 7728} {"train_loss": -28.1000919342041, "global_step": 641501, "epoch": 7728} {"train_loss": -28.382343292236328, "global_step": 641502, "epoch": 7728} {"train_loss": -28.52581787109375, "global_step": 641503, "epoch": 7728} {"train_loss": -28.655004501342773, "global_step": 641504, "epoch": 7728} {"train_loss": -28.590368270874023, "global_step": 641505, "epoch": 7728} {"train_loss": -27.95163030509489, "global_step": 641506, "epoch": 7728, "val_loss": 6661813.0} {"train_loss": -28.170764923095703, "global_step": 641507, "epoch": 7729} {"train_loss": -27.977996826171875, "global_step": 641508, "epoch": 7729} {"train_loss": -27.949188232421875, "global_step": 641509, "epoch": 7729} {"train_loss": -27.98050308227539, "global_step": 641510, "epoch": 7729} {"train_loss": -27.906049728393555, "global_step": 641511, "epoch": 7729} {"train_loss": -27.932647705078125, "global_step": 641512, "epoch": 7729} {"train_loss": -27.551511764526367, "global_step": 641513, "epoch": 7729} {"train_loss": -27.762243270874023, "global_step": 641514, "epoch": 7729} {"train_loss": -28.3045711517334, "global_step": 641515, "epoch": 7729} {"train_loss": -28.0700740814209, "global_step": 641516, "epoch": 7729} {"train_loss": -28.299701690673828, "global_step": 641517, "epoch": 7729} {"train_loss": -28.05988121032715, "global_step": 641518, "epoch": 7729} {"train_loss": -28.327392578125, "global_step": 641519, "epoch": 7729} {"train_loss": -28.364795684814453, "global_step": 641520, "epoch": 7729} {"train_loss": -28.232776641845703, "global_step": 641521, "epoch": 7729} {"train_loss": -28.290525436401367, "global_step": 641522, "epoch": 7729} {"train_loss": -28.166980743408203, "global_step": 641523, "epoch": 7729} {"train_loss": -28.39703941345215, "global_step": 641524, "epoch": 7729} {"train_loss": -28.252405166625977, "global_step": 641525, "epoch": 7729} {"train_loss": -28.605194091796875, "global_step": 641526, "epoch": 7729} {"train_loss": -27.790739059448242, "global_step": 641527, "epoch": 7729} {"train_loss": -28.362836837768555, "global_step": 641528, "epoch": 7729} {"train_loss": -28.342514038085938, "global_step": 641529, "epoch": 7729} {"train_loss": -27.566068649291992, "global_step": 641530, "epoch": 7729} {"train_loss": -28.237060546875, "global_step": 641531, "epoch": 7729} {"train_loss": -28.7034854888916, "global_step": 641532, "epoch": 7729} {"train_loss": -28.59248161315918, "global_step": 641533, "epoch": 7729} {"train_loss": -28.232263565063477, "global_step": 641534, "epoch": 7729} {"train_loss": -28.798776626586914, "global_step": 641535, "epoch": 7729} {"train_loss": -28.754560470581055, "global_step": 641536, "epoch": 7729} {"train_loss": -28.377363204956055, "global_step": 641537, "epoch": 7729} {"train_loss": -27.955554962158203, "global_step": 641538, "epoch": 7729} {"train_loss": -28.222742080688477, "global_step": 641539, "epoch": 7729} {"train_loss": -28.441089630126953, "global_step": 641540, "epoch": 7729} {"train_loss": -28.455846786499023, "global_step": 641541, "epoch": 7729} {"train_loss": -28.111892700195312, "global_step": 641542, "epoch": 7729} {"train_loss": -28.1285343170166, "global_step": 641543, "epoch": 7729} {"train_loss": -28.068952560424805, "global_step": 641544, "epoch": 7729} {"train_loss": -28.154218673706055, "global_step": 641545, "epoch": 7729} {"train_loss": -28.396484375, "global_step": 641546, "epoch": 7729} {"train_loss": -28.16131591796875, "global_step": 641547, "epoch": 7729} {"train_loss": -28.030851364135742, "global_step": 641548, "epoch": 7729} {"train_loss": -28.481008529663086, "global_step": 641549, "epoch": 7729} {"train_loss": -28.457563400268555, "global_step": 641550, "epoch": 7729} {"train_loss": -28.60332679748535, "global_step": 641551, "epoch": 7729} {"train_loss": -28.370935440063477, "global_step": 641552, "epoch": 7729} {"train_loss": -28.273351669311523, "global_step": 641553, "epoch": 7729} {"train_loss": -28.742877960205078, "global_step": 641554, "epoch": 7729} {"train_loss": -28.67206382751465, "global_step": 641555, "epoch": 7729} {"train_loss": -28.20257568359375, "global_step": 641556, "epoch": 7729} {"train_loss": -28.133987426757812, "global_step": 641557, "epoch": 7729} {"train_loss": -28.538909912109375, "global_step": 641558, "epoch": 7729} {"train_loss": -28.70436668395996, "global_step": 641559, "epoch": 7729} {"train_loss": -28.20307731628418, "global_step": 641560, "epoch": 7729} {"train_loss": -28.448667526245117, "global_step": 641561, "epoch": 7729} {"train_loss": -28.61794090270996, "global_step": 641562, "epoch": 7729} {"train_loss": -28.665756225585938, "global_step": 641563, "epoch": 7729} {"train_loss": -28.339645385742188, "global_step": 641564, "epoch": 7729} {"train_loss": -28.192138671875, "global_step": 641565, "epoch": 7729} {"train_loss": -27.988117218017578, "global_step": 641566, "epoch": 7729} {"train_loss": -27.598556518554688, "global_step": 641567, "epoch": 7729} {"train_loss": -27.828311920166016, "global_step": 641568, "epoch": 7729} {"train_loss": -27.50440788269043, "global_step": 641569, "epoch": 7729} {"train_loss": -27.178211212158203, "global_step": 641570, "epoch": 7729} {"train_loss": -27.202978134155273, "global_step": 641571, "epoch": 7729} {"train_loss": -28.184722900390625, "global_step": 641572, "epoch": 7729} {"train_loss": -27.8317813873291, "global_step": 641573, "epoch": 7729} {"train_loss": -26.870819091796875, "global_step": 641574, "epoch": 7729} {"train_loss": -27.856679916381836, "global_step": 641575, "epoch": 7729} {"train_loss": -27.226978302001953, "global_step": 641576, "epoch": 7729} {"train_loss": -27.468399047851562, "global_step": 641577, "epoch": 7729} {"train_loss": -27.697736740112305, "global_step": 641578, "epoch": 7729} {"train_loss": -27.707721710205078, "global_step": 641579, "epoch": 7729} {"train_loss": -27.883132934570312, "global_step": 641580, "epoch": 7729} {"train_loss": -28.014333724975586, "global_step": 641581, "epoch": 7729} {"train_loss": -27.87299156188965, "global_step": 641582, "epoch": 7729} {"train_loss": -28.439697265625, "global_step": 641583, "epoch": 7729} {"train_loss": -27.787351608276367, "global_step": 641584, "epoch": 7729} {"train_loss": -27.705978393554688, "global_step": 641585, "epoch": 7729} {"train_loss": -28.045698165893555, "global_step": 641586, "epoch": 7729} {"train_loss": -28.123632431030273, "global_step": 641587, "epoch": 7729} {"train_loss": -28.131444931030273, "global_step": 641588, "epoch": 7729} {"train_loss": -28.11117475578584, "global_step": 641589, "epoch": 7729, "val_loss": 6647831.0} {"train_loss": -28.18545913696289, "global_step": 641590, "epoch": 7730} {"train_loss": -27.382339477539062, "global_step": 641591, "epoch": 7730} {"train_loss": -27.905614852905273, "global_step": 641592, "epoch": 7730} {"train_loss": -27.67250633239746, "global_step": 641593, "epoch": 7730} {"train_loss": -27.63933753967285, "global_step": 641594, "epoch": 7730} {"train_loss": -27.829425811767578, "global_step": 641595, "epoch": 7730} {"train_loss": -27.90070152282715, "global_step": 641596, "epoch": 7730} {"train_loss": -27.957624435424805, "global_step": 641597, "epoch": 7730} {"train_loss": -27.374359130859375, "global_step": 641598, "epoch": 7730} {"train_loss": -27.619077682495117, "global_step": 641599, "epoch": 7730} {"train_loss": -27.879196166992188, "global_step": 641600, "epoch": 7730} {"train_loss": -27.952112197875977, "global_step": 641601, "epoch": 7730} {"train_loss": -27.710317611694336, "global_step": 641602, "epoch": 7730} {"train_loss": -28.1585750579834, "global_step": 641603, "epoch": 7730} {"train_loss": -27.825891494750977, "global_step": 641604, "epoch": 7730} {"train_loss": -28.335102081298828, "global_step": 641605, "epoch": 7730} {"train_loss": -28.235137939453125, "global_step": 641606, "epoch": 7730} {"train_loss": -27.98500633239746, "global_step": 641607, "epoch": 7730} {"train_loss": -27.888036727905273, "global_step": 641608, "epoch": 7730} {"train_loss": -28.062902450561523, "global_step": 641609, "epoch": 7730} {"train_loss": -28.272918701171875, "global_step": 641610, "epoch": 7730} {"train_loss": -28.222333908081055, "global_step": 641611, "epoch": 7730} {"train_loss": -28.23341941833496, "global_step": 641612, "epoch": 7730} {"train_loss": -28.176300048828125, "global_step": 641613, "epoch": 7730} {"train_loss": -28.202259063720703, "global_step": 641614, "epoch": 7730} {"train_loss": -28.246213912963867, "global_step": 641615, "epoch": 7730} {"train_loss": -28.542404174804688, "global_step": 641616, "epoch": 7730} {"train_loss": -27.769397735595703, "global_step": 641617, "epoch": 7730} {"train_loss": -27.64967918395996, "global_step": 641618, "epoch": 7730} {"train_loss": -28.2684383392334, "global_step": 641619, "epoch": 7730} {"train_loss": -28.4062557220459, "global_step": 641620, "epoch": 7730} {"train_loss": -28.286457061767578, "global_step": 641621, "epoch": 7730} {"train_loss": -28.27273941040039, "global_step": 641622, "epoch": 7730} {"train_loss": -28.006528854370117, "global_step": 641623, "epoch": 7730} {"train_loss": -28.27735710144043, "global_step": 641624, "epoch": 7730} {"train_loss": -28.440404891967773, "global_step": 641625, "epoch": 7730} {"train_loss": -28.556493759155273, "global_step": 641626, "epoch": 7730} {"train_loss": -28.35701560974121, "global_step": 641627, "epoch": 7730} {"train_loss": -28.4056339263916, "global_step": 641628, "epoch": 7730} {"train_loss": -28.334741592407227, "global_step": 641629, "epoch": 7730} {"train_loss": -28.92535972595215, "global_step": 641630, "epoch": 7730} {"train_loss": -28.187143325805664, "global_step": 641631, "epoch": 7730} {"train_loss": -28.17548179626465, "global_step": 641632, "epoch": 7730} {"train_loss": -28.255664825439453, "global_step": 641633, "epoch": 7730} {"train_loss": -28.329944610595703, "global_step": 641634, "epoch": 7730} {"train_loss": -28.437824249267578, "global_step": 641635, "epoch": 7730} {"train_loss": -28.494144439697266, "global_step": 641636, "epoch": 7730} {"train_loss": -28.20664405822754, "global_step": 641637, "epoch": 7730} {"train_loss": -27.97916603088379, "global_step": 641638, "epoch": 7730} {"train_loss": -28.563867568969727, "global_step": 641639, "epoch": 7730} {"train_loss": -28.586584091186523, "global_step": 641640, "epoch": 7730} {"train_loss": -28.47089195251465, "global_step": 641641, "epoch": 7730} {"train_loss": -28.607778549194336, "global_step": 641642, "epoch": 7730} {"train_loss": -28.111310958862305, "global_step": 641643, "epoch": 7730} {"train_loss": -28.70638084411621, "global_step": 641644, "epoch": 7730} {"train_loss": -28.411279678344727, "global_step": 641645, "epoch": 7730} {"train_loss": -28.460554122924805, "global_step": 641646, "epoch": 7730} {"train_loss": -28.201770782470703, "global_step": 641647, "epoch": 7730} {"train_loss": -28.46742057800293, "global_step": 641648, "epoch": 7730} {"train_loss": -28.504316329956055, "global_step": 641649, "epoch": 7730} {"train_loss": -28.67889976501465, "global_step": 641650, "epoch": 7730} {"train_loss": -29.0054874420166, "global_step": 641651, "epoch": 7730} {"train_loss": -28.48286247253418, "global_step": 641652, "epoch": 7730} {"train_loss": -28.79994010925293, "global_step": 641653, "epoch": 7730} {"train_loss": -28.39581298828125, "global_step": 641654, "epoch": 7730} {"train_loss": -28.340625762939453, "global_step": 641655, "epoch": 7730} {"train_loss": -28.74545669555664, "global_step": 641656, "epoch": 7730} {"train_loss": -28.554061889648438, "global_step": 641657, "epoch": 7730} {"train_loss": -27.98846435546875, "global_step": 641658, "epoch": 7730} {"train_loss": -28.73579216003418, "global_step": 641659, "epoch": 7730} {"train_loss": -28.46648597717285, "global_step": 641660, "epoch": 7730} {"train_loss": -28.443044662475586, "global_step": 641661, "epoch": 7730} {"train_loss": -28.633222579956055, "global_step": 641662, "epoch": 7730} {"train_loss": -28.55572509765625, "global_step": 641663, "epoch": 7730} {"train_loss": -28.390705108642578, "global_step": 641664, "epoch": 7730} {"train_loss": -28.362146377563477, "global_step": 641665, "epoch": 7730} {"train_loss": -28.39972496032715, "global_step": 641666, "epoch": 7730} {"train_loss": -28.407455444335938, "global_step": 641667, "epoch": 7730} {"train_loss": -28.708545684814453, "global_step": 641668, "epoch": 7730} {"train_loss": -28.3260440826416, "global_step": 641669, "epoch": 7730} {"train_loss": -28.591161727905273, "global_step": 641670, "epoch": 7730} {"train_loss": -28.21418571472168, "global_step": 641671, "epoch": 7730} {"train_loss": -28.273110975702124, "global_step": 641672, "epoch": 7730, "val_loss": 6635783.5} {"train_loss": -27.100189208984375, "global_step": 641673, "epoch": 7731} {"train_loss": -24.056011199951172, "global_step": 641674, "epoch": 7731} {"train_loss": -20.240549087524414, "global_step": 641675, "epoch": 7731} {"train_loss": -18.361114501953125, "global_step": 641676, "epoch": 7731} {"train_loss": -21.837583541870117, "global_step": 641677, "epoch": 7731} {"train_loss": -22.629398345947266, "global_step": 641678, "epoch": 7731} {"train_loss": -24.13519287109375, "global_step": 641679, "epoch": 7731} {"train_loss": -24.364765167236328, "global_step": 641680, "epoch": 7731} {"train_loss": -24.93995475769043, "global_step": 641681, "epoch": 7731} {"train_loss": -24.623493194580078, "global_step": 641682, "epoch": 7731} {"train_loss": -25.623279571533203, "global_step": 641683, "epoch": 7731} {"train_loss": -25.164926528930664, "global_step": 641684, "epoch": 7731} {"train_loss": -26.12890625, "global_step": 641685, "epoch": 7731} {"train_loss": -26.48076820373535, "global_step": 641686, "epoch": 7731} {"train_loss": -25.74444580078125, "global_step": 641687, "epoch": 7731} {"train_loss": -26.334470748901367, "global_step": 641688, "epoch": 7731} {"train_loss": -26.551633834838867, "global_step": 641689, "epoch": 7731} {"train_loss": -26.249378204345703, "global_step": 641690, "epoch": 7731} {"train_loss": -26.65046501159668, "global_step": 641691, "epoch": 7731} {"train_loss": -26.496246337890625, "global_step": 641692, "epoch": 7731} {"train_loss": -26.39850425720215, "global_step": 641693, "epoch": 7731} {"train_loss": -26.259418487548828, "global_step": 641694, "epoch": 7731} {"train_loss": -26.722654342651367, "global_step": 641695, "epoch": 7731} {"train_loss": -25.600614547729492, "global_step": 641696, "epoch": 7731} {"train_loss": -27.178226470947266, "global_step": 641697, "epoch": 7731} {"train_loss": -26.3359432220459, "global_step": 641698, "epoch": 7731} {"train_loss": -26.51909828186035, "global_step": 641699, "epoch": 7731} {"train_loss": -26.580163955688477, "global_step": 641700, "epoch": 7731} {"train_loss": -26.53814697265625, "global_step": 641701, "epoch": 7731} {"train_loss": -26.73052978515625, "global_step": 641702, "epoch": 7731} {"train_loss": -27.280332565307617, "global_step": 641703, "epoch": 7731} {"train_loss": -26.960803985595703, "global_step": 641704, "epoch": 7731} {"train_loss": -26.974506378173828, "global_step": 641705, "epoch": 7731} {"train_loss": -27.177759170532227, "global_step": 641706, "epoch": 7731} {"train_loss": -27.27017593383789, "global_step": 641707, "epoch": 7731} {"train_loss": -27.06830406188965, "global_step": 641708, "epoch": 7731} {"train_loss": -27.125003814697266, "global_step": 641709, "epoch": 7731} {"train_loss": -27.246007919311523, "global_step": 641710, "epoch": 7731} {"train_loss": -27.502302169799805, "global_step": 641711, "epoch": 7731} {"train_loss": -27.296905517578125, "global_step": 641712, "epoch": 7731} {"train_loss": -27.472003936767578, "global_step": 641713, "epoch": 7731} {"train_loss": -27.564870834350586, "global_step": 641714, "epoch": 7731} {"train_loss": -27.636987686157227, "global_step": 641715, "epoch": 7731} {"train_loss": -27.9567928314209, "global_step": 641716, "epoch": 7731} {"train_loss": -27.835559844970703, "global_step": 641717, "epoch": 7731} {"train_loss": -27.64472770690918, "global_step": 641718, "epoch": 7731} {"train_loss": -27.73866081237793, "global_step": 641719, "epoch": 7731} {"train_loss": -27.513303756713867, "global_step": 641720, "epoch": 7731} {"train_loss": -27.87894058227539, "global_step": 641721, "epoch": 7731} {"train_loss": -27.726648330688477, "global_step": 641722, "epoch": 7731} {"train_loss": -27.83449363708496, "global_step": 641723, "epoch": 7731} {"train_loss": -27.801382064819336, "global_step": 641724, "epoch": 7731} {"train_loss": -27.5555419921875, "global_step": 641725, "epoch": 7731} {"train_loss": -28.102964401245117, "global_step": 641726, "epoch": 7731} {"train_loss": -28.023090362548828, "global_step": 641727, "epoch": 7731} {"train_loss": -28.221120834350586, "global_step": 641728, "epoch": 7731} {"train_loss": -27.82537269592285, "global_step": 641729, "epoch": 7731} {"train_loss": -27.850461959838867, "global_step": 641730, "epoch": 7731} {"train_loss": -27.763254165649414, "global_step": 641731, "epoch": 7731} {"train_loss": -28.357648849487305, "global_step": 641732, "epoch": 7731} {"train_loss": -27.957311630249023, "global_step": 641733, "epoch": 7731} {"train_loss": -28.128162384033203, "global_step": 641734, "epoch": 7731} {"train_loss": -28.111316680908203, "global_step": 641735, "epoch": 7731} {"train_loss": -27.693134307861328, "global_step": 641736, "epoch": 7731} {"train_loss": -28.185287475585938, "global_step": 641737, "epoch": 7731} {"train_loss": -28.16388511657715, "global_step": 641738, "epoch": 7731} {"train_loss": -28.288822174072266, "global_step": 641739, "epoch": 7731} {"train_loss": -28.13912010192871, "global_step": 641740, "epoch": 7731} {"train_loss": -28.311853408813477, "global_step": 641741, "epoch": 7731} {"train_loss": -28.4992733001709, "global_step": 641742, "epoch": 7731} {"train_loss": -28.25225830078125, "global_step": 641743, "epoch": 7731} {"train_loss": -27.984012603759766, "global_step": 641744, "epoch": 7731} {"train_loss": -28.249486923217773, "global_step": 641745, "epoch": 7731} {"train_loss": -28.03533363342285, "global_step": 641746, "epoch": 7731} {"train_loss": -27.91241455078125, "global_step": 641747, "epoch": 7731} {"train_loss": -28.059301376342773, "global_step": 641748, "epoch": 7731} {"train_loss": -28.234228134155273, "global_step": 641749, "epoch": 7731} {"train_loss": -27.97060203552246, "global_step": 641750, "epoch": 7731} {"train_loss": -28.170984268188477, "global_step": 641751, "epoch": 7731} {"train_loss": -28.24907875061035, "global_step": 641752, "epoch": 7731} {"train_loss": -28.47926139831543, "global_step": 641753, "epoch": 7731} {"train_loss": -28.0947322845459, "global_step": 641754, "epoch": 7731} {"train_loss": -26.92455951277032, "global_step": 641755, "epoch": 7731, "val_loss": 6626572.0} {"train_loss": -28.717504501342773, "global_step": 641756, "epoch": 7732} {"train_loss": -28.17947769165039, "global_step": 641757, "epoch": 7732} {"train_loss": -28.266111373901367, "global_step": 641758, "epoch": 7732} {"train_loss": -27.805530548095703, "global_step": 641759, "epoch": 7732} {"train_loss": -28.183340072631836, "global_step": 641760, "epoch": 7732} {"train_loss": -28.305063247680664, "global_step": 641761, "epoch": 7732} {"train_loss": -28.166141510009766, "global_step": 641762, "epoch": 7732} {"train_loss": -27.9279842376709, "global_step": 641763, "epoch": 7732} {"train_loss": -28.431049346923828, "global_step": 641764, "epoch": 7732} {"train_loss": -28.273773193359375, "global_step": 641765, "epoch": 7732} {"train_loss": -27.799768447875977, "global_step": 641766, "epoch": 7732} {"train_loss": -28.088693618774414, "global_step": 641767, "epoch": 7732} {"train_loss": -27.985809326171875, "global_step": 641768, "epoch": 7732} {"train_loss": -27.705673217773438, "global_step": 641769, "epoch": 7732} {"train_loss": -28.363712310791016, "global_step": 641770, "epoch": 7732} {"train_loss": -28.233844757080078, "global_step": 641771, "epoch": 7732} {"train_loss": -28.36675453186035, "global_step": 641772, "epoch": 7732} {"train_loss": -28.086795806884766, "global_step": 641773, "epoch": 7732} {"train_loss": -28.026264190673828, "global_step": 641774, "epoch": 7732} {"train_loss": -28.220264434814453, "global_step": 641775, "epoch": 7732} {"train_loss": -28.42535972595215, "global_step": 641776, "epoch": 7732} {"train_loss": -27.751728057861328, "global_step": 641777, "epoch": 7732} {"train_loss": -28.163915634155273, "global_step": 641778, "epoch": 7732} {"train_loss": -28.001367568969727, "global_step": 641779, "epoch": 7732} {"train_loss": -28.04231071472168, "global_step": 641780, "epoch": 7732} {"train_loss": -28.15302848815918, "global_step": 641781, "epoch": 7732} {"train_loss": -28.470138549804688, "global_step": 641782, "epoch": 7732} {"train_loss": -28.13458251953125, "global_step": 641783, "epoch": 7732} {"train_loss": -28.15754508972168, "global_step": 641784, "epoch": 7732} {"train_loss": -28.30719566345215, "global_step": 641785, "epoch": 7732} {"train_loss": -28.16704750061035, "global_step": 641786, "epoch": 7732} {"train_loss": -28.454862594604492, "global_step": 641787, "epoch": 7732} {"train_loss": -28.770999908447266, "global_step": 641788, "epoch": 7732} {"train_loss": -28.246810913085938, "global_step": 641789, "epoch": 7732} {"train_loss": -28.13755226135254, "global_step": 641790, "epoch": 7732} {"train_loss": -28.486835479736328, "global_step": 641791, "epoch": 7732} {"train_loss": -28.395299911499023, "global_step": 641792, "epoch": 7732} {"train_loss": -28.028120040893555, "global_step": 641793, "epoch": 7732} {"train_loss": -28.0012149810791, "global_step": 641794, "epoch": 7732} {"train_loss": -28.779266357421875, "global_step": 641795, "epoch": 7732} {"train_loss": -28.464176177978516, "global_step": 641796, "epoch": 7732} {"train_loss": -28.451995849609375, "global_step": 641797, "epoch": 7732} {"train_loss": -28.238666534423828, "global_step": 641798, "epoch": 7732} {"train_loss": -28.192550659179688, "global_step": 641799, "epoch": 7732} {"train_loss": -28.4716739654541, "global_step": 641800, "epoch": 7732} {"train_loss": -28.131155014038086, "global_step": 641801, "epoch": 7732} {"train_loss": -28.034942626953125, "global_step": 641802, "epoch": 7732} {"train_loss": -28.396955490112305, "global_step": 641803, "epoch": 7732} {"train_loss": -28.275251388549805, "global_step": 641804, "epoch": 7732} {"train_loss": -28.086627960205078, "global_step": 641805, "epoch": 7732} {"train_loss": -28.142658233642578, "global_step": 641806, "epoch": 7732} {"train_loss": -28.364667892456055, "global_step": 641807, "epoch": 7732} {"train_loss": -28.060169219970703, "global_step": 641808, "epoch": 7732} {"train_loss": -27.817113876342773, "global_step": 641809, "epoch": 7732} {"train_loss": -28.29188346862793, "global_step": 641810, "epoch": 7732} {"train_loss": -28.280731201171875, "global_step": 641811, "epoch": 7732} {"train_loss": -28.34395408630371, "global_step": 641812, "epoch": 7732} {"train_loss": -28.48666763305664, "global_step": 641813, "epoch": 7732} {"train_loss": -27.94795036315918, "global_step": 641814, "epoch": 7732} {"train_loss": -28.5550594329834, "global_step": 641815, "epoch": 7732} {"train_loss": -28.25507164001465, "global_step": 641816, "epoch": 7732} {"train_loss": -28.501745223999023, "global_step": 641817, "epoch": 7732} {"train_loss": -27.813135147094727, "global_step": 641818, "epoch": 7732} {"train_loss": -28.255773544311523, "global_step": 641819, "epoch": 7732} {"train_loss": -28.769758224487305, "global_step": 641820, "epoch": 7732} {"train_loss": -28.493162155151367, "global_step": 641821, "epoch": 7732} {"train_loss": -28.545841217041016, "global_step": 641822, "epoch": 7732} {"train_loss": -28.366138458251953, "global_step": 641823, "epoch": 7732} {"train_loss": -28.5662841796875, "global_step": 641824, "epoch": 7732} {"train_loss": -28.312524795532227, "global_step": 641825, "epoch": 7732} {"train_loss": -28.16810417175293, "global_step": 641826, "epoch": 7732} {"train_loss": -28.124256134033203, "global_step": 641827, "epoch": 7732} {"train_loss": -28.403614044189453, "global_step": 641828, "epoch": 7732} {"train_loss": -28.34931755065918, "global_step": 641829, "epoch": 7732} {"train_loss": -28.38920021057129, "global_step": 641830, "epoch": 7732} {"train_loss": -28.067060470581055, "global_step": 641831, "epoch": 7732} {"train_loss": -28.659957885742188, "global_step": 641832, "epoch": 7732} {"train_loss": -28.26509666442871, "global_step": 641833, "epoch": 7732} {"train_loss": -28.59913444519043, "global_step": 641834, "epoch": 7732} {"train_loss": -28.508792877197266, "global_step": 641835, "epoch": 7732} {"train_loss": -28.649778366088867, "global_step": 641836, "epoch": 7732} {"train_loss": -28.19573402404785, "global_step": 641837, "epoch": 7732} {"train_loss": -28.271532587258214, "global_step": 641838, "epoch": 7732, "val_loss": 6613027.0} {"train_loss": -27.63368797302246, "global_step": 641839, "epoch": 7733} {"train_loss": -26.87849235534668, "global_step": 641840, "epoch": 7733} {"train_loss": -26.612262725830078, "global_step": 641841, "epoch": 7733} {"train_loss": -27.7356014251709, "global_step": 641842, "epoch": 7733} {"train_loss": -27.624866485595703, "global_step": 641843, "epoch": 7733} {"train_loss": -27.718494415283203, "global_step": 641844, "epoch": 7733} {"train_loss": -27.747272491455078, "global_step": 641845, "epoch": 7733} {"train_loss": -27.929370880126953, "global_step": 641846, "epoch": 7733} {"train_loss": -28.086246490478516, "global_step": 641847, "epoch": 7733} {"train_loss": -28.1817684173584, "global_step": 641848, "epoch": 7733} {"train_loss": -27.4655818939209, "global_step": 641849, "epoch": 7733} {"train_loss": -28.366901397705078, "global_step": 641850, "epoch": 7733} {"train_loss": -27.972213745117188, "global_step": 641851, "epoch": 7733} {"train_loss": -27.805540084838867, "global_step": 641852, "epoch": 7733} {"train_loss": -27.930347442626953, "global_step": 641853, "epoch": 7733} {"train_loss": -27.69874382019043, "global_step": 641854, "epoch": 7733} {"train_loss": -27.822433471679688, "global_step": 641855, "epoch": 7733} {"train_loss": -28.68515968322754, "global_step": 641856, "epoch": 7733} {"train_loss": -27.847900390625, "global_step": 641857, "epoch": 7733} {"train_loss": -27.917728424072266, "global_step": 641858, "epoch": 7733} {"train_loss": -28.236169815063477, "global_step": 641859, "epoch": 7733} {"train_loss": -28.068037033081055, "global_step": 641860, "epoch": 7733} {"train_loss": -27.904260635375977, "global_step": 641861, "epoch": 7733} {"train_loss": -27.89639663696289, "global_step": 641862, "epoch": 7733} {"train_loss": -28.0849609375, "global_step": 641863, "epoch": 7733} {"train_loss": -28.332855224609375, "global_step": 641864, "epoch": 7733} {"train_loss": -28.116804122924805, "global_step": 641865, "epoch": 7733} {"train_loss": -27.96038818359375, "global_step": 641866, "epoch": 7733} {"train_loss": -28.197711944580078, "global_step": 641867, "epoch": 7733} {"train_loss": -28.11195182800293, "global_step": 641868, "epoch": 7733} {"train_loss": -28.39507484436035, "global_step": 641869, "epoch": 7733} {"train_loss": -28.2171688079834, "global_step": 641870, "epoch": 7733} {"train_loss": -28.2539119720459, "global_step": 641871, "epoch": 7733} {"train_loss": -28.25044822692871, "global_step": 641872, "epoch": 7733} {"train_loss": -28.11469078063965, "global_step": 641873, "epoch": 7733} {"train_loss": -28.501333236694336, "global_step": 641874, "epoch": 7733} {"train_loss": -28.03409767150879, "global_step": 641875, "epoch": 7733} {"train_loss": -28.010663986206055, "global_step": 641876, "epoch": 7733} {"train_loss": -28.052087783813477, "global_step": 641877, "epoch": 7733} {"train_loss": -28.3476619720459, "global_step": 641878, "epoch": 7733} {"train_loss": -28.390233993530273, "global_step": 641879, "epoch": 7733} {"train_loss": -28.45389175415039, "global_step": 641880, "epoch": 7733} {"train_loss": -28.33762550354004, "global_step": 641881, "epoch": 7733} {"train_loss": -28.399988174438477, "global_step": 641882, "epoch": 7733} {"train_loss": -28.50507164001465, "global_step": 641883, "epoch": 7733} {"train_loss": -28.688873291015625, "global_step": 641884, "epoch": 7733} {"train_loss": -28.348159790039062, "global_step": 641885, "epoch": 7733} {"train_loss": -28.625478744506836, "global_step": 641886, "epoch": 7733} {"train_loss": -28.69284439086914, "global_step": 641887, "epoch": 7733} {"train_loss": -28.472614288330078, "global_step": 641888, "epoch": 7733} {"train_loss": -28.7525634765625, "global_step": 641889, "epoch": 7733} {"train_loss": -28.86441421508789, "global_step": 641890, "epoch": 7733} {"train_loss": -28.58853530883789, "global_step": 641891, "epoch": 7733} {"train_loss": -28.261823654174805, "global_step": 641892, "epoch": 7733} {"train_loss": -28.542158126831055, "global_step": 641893, "epoch": 7733} {"train_loss": -28.379745483398438, "global_step": 641894, "epoch": 7733} {"train_loss": -27.976720809936523, "global_step": 641895, "epoch": 7733} {"train_loss": -28.1440372467041, "global_step": 641896, "epoch": 7733} {"train_loss": -28.292646408081055, "global_step": 641897, "epoch": 7733} {"train_loss": -28.18695068359375, "global_step": 641898, "epoch": 7733} {"train_loss": -27.806716918945312, "global_step": 641899, "epoch": 7733} {"train_loss": -26.882883071899414, "global_step": 641900, "epoch": 7733} {"train_loss": -25.60586929321289, "global_step": 641901, "epoch": 7733} {"train_loss": -27.499624252319336, "global_step": 641902, "epoch": 7733} {"train_loss": -27.619251251220703, "global_step": 641903, "epoch": 7733} {"train_loss": -27.393918991088867, "global_step": 641904, "epoch": 7733} {"train_loss": -27.76888084411621, "global_step": 641905, "epoch": 7733} {"train_loss": -27.6709041595459, "global_step": 641906, "epoch": 7733} {"train_loss": -27.965185165405273, "global_step": 641907, "epoch": 7733} {"train_loss": -27.319055557250977, "global_step": 641908, "epoch": 7733} {"train_loss": -28.07880973815918, "global_step": 641909, "epoch": 7733} {"train_loss": -27.713315963745117, "global_step": 641910, "epoch": 7733} {"train_loss": -28.132537841796875, "global_step": 641911, "epoch": 7733} {"train_loss": -27.6366024017334, "global_step": 641912, "epoch": 7733} {"train_loss": -27.75371742248535, "global_step": 641913, "epoch": 7733} {"train_loss": -27.7763614654541, "global_step": 641914, "epoch": 7733} {"train_loss": -28.310516357421875, "global_step": 641915, "epoch": 7733} {"train_loss": -27.75836181640625, "global_step": 641916, "epoch": 7733} {"train_loss": -28.43450927734375, "global_step": 641917, "epoch": 7733} {"train_loss": -27.94698143005371, "global_step": 641918, "epoch": 7733} {"train_loss": -28.2342529296875, "global_step": 641919, "epoch": 7733} {"train_loss": -27.891815185546875, "global_step": 641920, "epoch": 7733} {"train_loss": -28.005611994180335, "global_step": 641921, "epoch": 7733, "val_loss": 6624386.0} {"train_loss": -27.698822021484375, "global_step": 641922, "epoch": 7734} {"train_loss": -27.591217041015625, "global_step": 641923, "epoch": 7734} {"train_loss": -27.610681533813477, "global_step": 641924, "epoch": 7734} {"train_loss": -27.173837661743164, "global_step": 641925, "epoch": 7734} {"train_loss": -27.299880981445312, "global_step": 641926, "epoch": 7734} {"train_loss": -27.755603790283203, "global_step": 641927, "epoch": 7734} {"train_loss": -27.625350952148438, "global_step": 641928, "epoch": 7734} {"train_loss": -27.74249267578125, "global_step": 641929, "epoch": 7734} {"train_loss": -27.6367244720459, "global_step": 641930, "epoch": 7734} {"train_loss": -27.806076049804688, "global_step": 641931, "epoch": 7734} {"train_loss": -27.87758445739746, "global_step": 641932, "epoch": 7734} {"train_loss": -27.2813663482666, "global_step": 641933, "epoch": 7734} {"train_loss": -27.78045082092285, "global_step": 641934, "epoch": 7734} {"train_loss": -27.82236099243164, "global_step": 641935, "epoch": 7734} {"train_loss": -27.75861167907715, "global_step": 641936, "epoch": 7734} {"train_loss": -27.90223503112793, "global_step": 641937, "epoch": 7734} {"train_loss": -28.02323341369629, "global_step": 641938, "epoch": 7734} {"train_loss": -28.2755069732666, "global_step": 641939, "epoch": 7734} {"train_loss": -28.03352928161621, "global_step": 641940, "epoch": 7734} {"train_loss": -27.93317222595215, "global_step": 641941, "epoch": 7734} {"train_loss": -28.08201026916504, "global_step": 641942, "epoch": 7734} {"train_loss": -28.015836715698242, "global_step": 641943, "epoch": 7734} {"train_loss": -28.23320960998535, "global_step": 641944, "epoch": 7734} {"train_loss": -28.492431640625, "global_step": 641945, "epoch": 7734} {"train_loss": -28.3604679107666, "global_step": 641946, "epoch": 7734} {"train_loss": -28.37851905822754, "global_step": 641947, "epoch": 7734} {"train_loss": -28.286420822143555, "global_step": 641948, "epoch": 7734} {"train_loss": -28.057601928710938, "global_step": 641949, "epoch": 7734} {"train_loss": -28.20502281188965, "global_step": 641950, "epoch": 7734} {"train_loss": -28.181549072265625, "global_step": 641951, "epoch": 7734} {"train_loss": -28.412708282470703, "global_step": 641952, "epoch": 7734} {"train_loss": -28.432077407836914, "global_step": 641953, "epoch": 7734} {"train_loss": -28.23255729675293, "global_step": 641954, "epoch": 7734} {"train_loss": -28.695465087890625, "global_step": 641955, "epoch": 7734} {"train_loss": -28.565412521362305, "global_step": 641956, "epoch": 7734} {"train_loss": -28.31511878967285, "global_step": 641957, "epoch": 7734} {"train_loss": -28.403242111206055, "global_step": 641958, "epoch": 7734} {"train_loss": -28.267505645751953, "global_step": 641959, "epoch": 7734} {"train_loss": -28.546430587768555, "global_step": 641960, "epoch": 7734} {"train_loss": -28.50653648376465, "global_step": 641961, "epoch": 7734} {"train_loss": -28.40229606628418, "global_step": 641962, "epoch": 7734} {"train_loss": -28.41326904296875, "global_step": 641963, "epoch": 7734} {"train_loss": -28.369659423828125, "global_step": 641964, "epoch": 7734} {"train_loss": -28.956878662109375, "global_step": 641965, "epoch": 7734} {"train_loss": -28.511877059936523, "global_step": 641966, "epoch": 7734} {"train_loss": -28.576557159423828, "global_step": 641967, "epoch": 7734} {"train_loss": -28.48392677307129, "global_step": 641968, "epoch": 7734} {"train_loss": -28.509408950805664, "global_step": 641969, "epoch": 7734} {"train_loss": -28.794143676757812, "global_step": 641970, "epoch": 7734} {"train_loss": -28.415973663330078, "global_step": 641971, "epoch": 7734} {"train_loss": -28.549570083618164, "global_step": 641972, "epoch": 7734} {"train_loss": -28.440290451049805, "global_step": 641973, "epoch": 7734} {"train_loss": -28.895837783813477, "global_step": 641974, "epoch": 7734} {"train_loss": -28.393850326538086, "global_step": 641975, "epoch": 7734} {"train_loss": -28.18721580505371, "global_step": 641976, "epoch": 7734} {"train_loss": -28.612808227539062, "global_step": 641977, "epoch": 7734} {"train_loss": -28.475601196289062, "global_step": 641978, "epoch": 7734} {"train_loss": -28.39971923828125, "global_step": 641979, "epoch": 7734} {"train_loss": -28.79365348815918, "global_step": 641980, "epoch": 7734} {"train_loss": -28.34523582458496, "global_step": 641981, "epoch": 7734} {"train_loss": -28.409704208374023, "global_step": 641982, "epoch": 7734} {"train_loss": -28.741043090820312, "global_step": 641983, "epoch": 7734} {"train_loss": -28.12312889099121, "global_step": 641984, "epoch": 7734} {"train_loss": -28.37432289123535, "global_step": 641985, "epoch": 7734} {"train_loss": -28.65064811706543, "global_step": 641986, "epoch": 7734} {"train_loss": -28.126754760742188, "global_step": 641987, "epoch": 7734} {"train_loss": -28.678150177001953, "global_step": 641988, "epoch": 7734} {"train_loss": -28.157743453979492, "global_step": 641989, "epoch": 7734} {"train_loss": -28.227216720581055, "global_step": 641990, "epoch": 7734} {"train_loss": -28.7747745513916, "global_step": 641991, "epoch": 7734} {"train_loss": -28.24408531188965, "global_step": 641992, "epoch": 7734} {"train_loss": -28.181537628173828, "global_step": 641993, "epoch": 7734} {"train_loss": -27.620847702026367, "global_step": 641994, "epoch": 7734} {"train_loss": -27.375402450561523, "global_step": 641995, "epoch": 7734} {"train_loss": -27.759933471679688, "global_step": 641996, "epoch": 7734} {"train_loss": -28.105182647705078, "global_step": 641997, "epoch": 7734} {"train_loss": -27.869565963745117, "global_step": 641998, "epoch": 7734} {"train_loss": -26.748422622680664, "global_step": 641999, "epoch": 7734} {"train_loss": -26.6552677154541, "global_step": 642000, "epoch": 7734} {"train_loss": -28.10603141784668, "global_step": 642001, "epoch": 7734} {"train_loss": -27.21795654296875, "global_step": 642002, "epoch": 7734} {"train_loss": -26.873279571533203, "global_step": 642003, "epoch": 7734} {"train_loss": -28.127891770328382, "global_step": 642004, "epoch": 7734, "val_loss": 6602063.5} {"train_loss": -27.220245361328125, "global_step": 642005, "epoch": 7735} {"train_loss": -26.656274795532227, "global_step": 642006, "epoch": 7735} {"train_loss": -27.62445640563965, "global_step": 642007, "epoch": 7735} {"train_loss": -27.32745361328125, "global_step": 642008, "epoch": 7735} {"train_loss": -26.8022403717041, "global_step": 642009, "epoch": 7735} {"train_loss": -27.5690975189209, "global_step": 642010, "epoch": 7735} {"train_loss": -26.898298263549805, "global_step": 642011, "epoch": 7735} {"train_loss": -26.762298583984375, "global_step": 642012, "epoch": 7735} {"train_loss": -27.23239517211914, "global_step": 642013, "epoch": 7735} {"train_loss": -27.634246826171875, "global_step": 642014, "epoch": 7735} {"train_loss": -27.717885971069336, "global_step": 642015, "epoch": 7735} {"train_loss": -27.8981876373291, "global_step": 642016, "epoch": 7735} {"train_loss": -27.69437026977539, "global_step": 642017, "epoch": 7735} {"train_loss": -27.57282066345215, "global_step": 642018, "epoch": 7735} {"train_loss": -27.42786979675293, "global_step": 642019, "epoch": 7735} {"train_loss": -27.92730140686035, "global_step": 642020, "epoch": 7735} {"train_loss": -27.647979736328125, "global_step": 642021, "epoch": 7735} {"train_loss": -27.73292350769043, "global_step": 642022, "epoch": 7735} {"train_loss": -27.944128036499023, "global_step": 642023, "epoch": 7735} {"train_loss": -27.409027099609375, "global_step": 642024, "epoch": 7735} {"train_loss": -27.786304473876953, "global_step": 642025, "epoch": 7735} {"train_loss": -28.145645141601562, "global_step": 642026, "epoch": 7735} {"train_loss": -28.062108993530273, "global_step": 642027, "epoch": 7735} {"train_loss": -27.518400192260742, "global_step": 642028, "epoch": 7735} {"train_loss": -28.441238403320312, "global_step": 642029, "epoch": 7735} {"train_loss": -28.1174373626709, "global_step": 642030, "epoch": 7735} {"train_loss": -28.051513671875, "global_step": 642031, "epoch": 7735} {"train_loss": -28.543350219726562, "global_step": 642032, "epoch": 7735} {"train_loss": -27.83990478515625, "global_step": 642033, "epoch": 7735} {"train_loss": -28.367481231689453, "global_step": 642034, "epoch": 7735} {"train_loss": -28.243371963500977, "global_step": 642035, "epoch": 7735} {"train_loss": -28.165485382080078, "global_step": 642036, "epoch": 7735} {"train_loss": -28.543432235717773, "global_step": 642037, "epoch": 7735} {"train_loss": -28.179723739624023, "global_step": 642038, "epoch": 7735} {"train_loss": -28.137073516845703, "global_step": 642039, "epoch": 7735} {"train_loss": -28.1420841217041, "global_step": 642040, "epoch": 7735} {"train_loss": -28.122068405151367, "global_step": 642041, "epoch": 7735} {"train_loss": -28.313800811767578, "global_step": 642042, "epoch": 7735} {"train_loss": -28.220626831054688, "global_step": 642043, "epoch": 7735} {"train_loss": -28.35052490234375, "global_step": 642044, "epoch": 7735} {"train_loss": -28.3732967376709, "global_step": 642045, "epoch": 7735} {"train_loss": -28.462316513061523, "global_step": 642046, "epoch": 7735} {"train_loss": -28.35279655456543, "global_step": 642047, "epoch": 7735} {"train_loss": -28.416173934936523, "global_step": 642048, "epoch": 7735} {"train_loss": -28.53271484375, "global_step": 642049, "epoch": 7735} {"train_loss": -28.362228393554688, "global_step": 642050, "epoch": 7735} {"train_loss": -28.7272891998291, "global_step": 642051, "epoch": 7735} {"train_loss": -28.5638427734375, "global_step": 642052, "epoch": 7735} {"train_loss": -28.527143478393555, "global_step": 642053, "epoch": 7735} {"train_loss": -28.534021377563477, "global_step": 642054, "epoch": 7735} {"train_loss": -28.078969955444336, "global_step": 642055, "epoch": 7735} {"train_loss": -28.23334312438965, "global_step": 642056, "epoch": 7735} {"train_loss": -28.69631004333496, "global_step": 642057, "epoch": 7735} {"train_loss": -28.6876220703125, "global_step": 642058, "epoch": 7735} {"train_loss": -28.6319637298584, "global_step": 642059, "epoch": 7735} {"train_loss": -28.76690673828125, "global_step": 642060, "epoch": 7735} {"train_loss": -28.648542404174805, "global_step": 642061, "epoch": 7735} {"train_loss": -28.7778263092041, "global_step": 642062, "epoch": 7735} {"train_loss": -28.99556541442871, "global_step": 642063, "epoch": 7735} {"train_loss": -28.533771514892578, "global_step": 642064, "epoch": 7735} {"train_loss": -28.276762008666992, "global_step": 642065, "epoch": 7735} {"train_loss": -28.640466690063477, "global_step": 642066, "epoch": 7735} {"train_loss": -28.67963981628418, "global_step": 642067, "epoch": 7735} {"train_loss": -28.584497451782227, "global_step": 642068, "epoch": 7735} {"train_loss": -28.48170280456543, "global_step": 642069, "epoch": 7735} {"train_loss": -28.18035316467285, "global_step": 642070, "epoch": 7735} {"train_loss": -27.8115291595459, "global_step": 642071, "epoch": 7735} {"train_loss": -28.374540328979492, "global_step": 642072, "epoch": 7735} {"train_loss": -28.32728385925293, "global_step": 642073, "epoch": 7735} {"train_loss": -28.36445426940918, "global_step": 642074, "epoch": 7735} {"train_loss": -27.670490264892578, "global_step": 642075, "epoch": 7735} {"train_loss": -28.208175659179688, "global_step": 642076, "epoch": 7735} {"train_loss": -28.13775062561035, "global_step": 642077, "epoch": 7735} {"train_loss": -28.394987106323242, "global_step": 642078, "epoch": 7735} {"train_loss": -28.16328239440918, "global_step": 642079, "epoch": 7735} {"train_loss": -28.385272979736328, "global_step": 642080, "epoch": 7735} {"train_loss": -28.242761611938477, "global_step": 642081, "epoch": 7735} {"train_loss": -28.369943618774414, "global_step": 642082, "epoch": 7735} {"train_loss": -28.32539176940918, "global_step": 642083, "epoch": 7735} {"train_loss": -28.37857437133789, "global_step": 642084, "epoch": 7735} {"train_loss": -28.157825469970703, "global_step": 642085, "epoch": 7735} {"train_loss": -28.393278121948242, "global_step": 642086, "epoch": 7735} {"train_loss": -28.109774486128106, "global_step": 642087, "epoch": 7735, "val_loss": 6632475.0} {"train_loss": -27.953750610351562, "global_step": 642088, "epoch": 7736} {"train_loss": -28.05415916442871, "global_step": 642089, "epoch": 7736} {"train_loss": -27.757232666015625, "global_step": 642090, "epoch": 7736} {"train_loss": -27.93317985534668, "global_step": 642091, "epoch": 7736} {"train_loss": -28.030160903930664, "global_step": 642092, "epoch": 7736} {"train_loss": -27.850849151611328, "global_step": 642093, "epoch": 7736} {"train_loss": -27.992658615112305, "global_step": 642094, "epoch": 7736} {"train_loss": -27.857009887695312, "global_step": 642095, "epoch": 7736} {"train_loss": -28.175125122070312, "global_step": 642096, "epoch": 7736} {"train_loss": -28.34330177307129, "global_step": 642097, "epoch": 7736} {"train_loss": -28.201766967773438, "global_step": 642098, "epoch": 7736} {"train_loss": -27.68401527404785, "global_step": 642099, "epoch": 7736} {"train_loss": -27.841840744018555, "global_step": 642100, "epoch": 7736} {"train_loss": -28.200580596923828, "global_step": 642101, "epoch": 7736} {"train_loss": -28.139144897460938, "global_step": 642102, "epoch": 7736} {"train_loss": -28.086515426635742, "global_step": 642103, "epoch": 7736} {"train_loss": -27.648359298706055, "global_step": 642104, "epoch": 7736} {"train_loss": -27.56947135925293, "global_step": 642105, "epoch": 7736} {"train_loss": -27.762073516845703, "global_step": 642106, "epoch": 7736} {"train_loss": -28.04736328125, "global_step": 642107, "epoch": 7736} {"train_loss": -27.743566513061523, "global_step": 642108, "epoch": 7736} {"train_loss": -28.001672744750977, "global_step": 642109, "epoch": 7736} {"train_loss": -28.215234756469727, "global_step": 642110, "epoch": 7736} {"train_loss": -27.841964721679688, "global_step": 642111, "epoch": 7736} {"train_loss": -27.976057052612305, "global_step": 642112, "epoch": 7736} {"train_loss": -28.6271915435791, "global_step": 642113, "epoch": 7736} {"train_loss": -28.361591339111328, "global_step": 642114, "epoch": 7736} {"train_loss": -27.89314079284668, "global_step": 642115, "epoch": 7736} {"train_loss": -28.3698673248291, "global_step": 642116, "epoch": 7736} {"train_loss": -28.11374855041504, "global_step": 642117, "epoch": 7736} {"train_loss": -28.29158592224121, "global_step": 642118, "epoch": 7736} {"train_loss": -27.95747184753418, "global_step": 642119, "epoch": 7736} {"train_loss": -28.266361236572266, "global_step": 642120, "epoch": 7736} {"train_loss": -28.378662109375, "global_step": 642121, "epoch": 7736} {"train_loss": -28.17738151550293, "global_step": 642122, "epoch": 7736} {"train_loss": -28.2451171875, "global_step": 642123, "epoch": 7736} {"train_loss": -28.122655868530273, "global_step": 642124, "epoch": 7736} {"train_loss": -28.374631881713867, "global_step": 642125, "epoch": 7736} {"train_loss": -28.074201583862305, "global_step": 642126, "epoch": 7736} {"train_loss": -28.359235763549805, "global_step": 642127, "epoch": 7736} {"train_loss": -28.754751205444336, "global_step": 642128, "epoch": 7736} {"train_loss": -28.376434326171875, "global_step": 642129, "epoch": 7736} {"train_loss": -28.28350257873535, "global_step": 642130, "epoch": 7736} {"train_loss": -28.472166061401367, "global_step": 642131, "epoch": 7736} {"train_loss": -28.5380802154541, "global_step": 642132, "epoch": 7736} {"train_loss": -28.717823028564453, "global_step": 642133, "epoch": 7736} {"train_loss": -28.757080078125, "global_step": 642134, "epoch": 7736} {"train_loss": -28.300750732421875, "global_step": 642135, "epoch": 7736} {"train_loss": -28.598180770874023, "global_step": 642136, "epoch": 7736} {"train_loss": -28.19425392150879, "global_step": 642137, "epoch": 7736} {"train_loss": -27.964948654174805, "global_step": 642138, "epoch": 7736} {"train_loss": -28.572446823120117, "global_step": 642139, "epoch": 7736} {"train_loss": -28.40471839904785, "global_step": 642140, "epoch": 7736} {"train_loss": -28.646652221679688, "global_step": 642141, "epoch": 7736} {"train_loss": -28.398666381835938, "global_step": 642142, "epoch": 7736} {"train_loss": -28.351211547851562, "global_step": 642143, "epoch": 7736} {"train_loss": -28.59718132019043, "global_step": 642144, "epoch": 7736} {"train_loss": -28.228506088256836, "global_step": 642145, "epoch": 7736} {"train_loss": -28.307851791381836, "global_step": 642146, "epoch": 7736} {"train_loss": -28.429365158081055, "global_step": 642147, "epoch": 7736} {"train_loss": -28.236698150634766, "global_step": 642148, "epoch": 7736} {"train_loss": -28.384740829467773, "global_step": 642149, "epoch": 7736} {"train_loss": -28.60931968688965, "global_step": 642150, "epoch": 7736} {"train_loss": -28.571500778198242, "global_step": 642151, "epoch": 7736} {"train_loss": -28.207839965820312, "global_step": 642152, "epoch": 7736} {"train_loss": -28.62284278869629, "global_step": 642153, "epoch": 7736} {"train_loss": -28.29498291015625, "global_step": 642154, "epoch": 7736} {"train_loss": -28.388111114501953, "global_step": 642155, "epoch": 7736} {"train_loss": -28.49920654296875, "global_step": 642156, "epoch": 7736} {"train_loss": -28.29364013671875, "global_step": 642157, "epoch": 7736} {"train_loss": -28.4300537109375, "global_step": 642158, "epoch": 7736} {"train_loss": -28.092992782592773, "global_step": 642159, "epoch": 7736} {"train_loss": -28.222951889038086, "global_step": 642160, "epoch": 7736} {"train_loss": -27.973983764648438, "global_step": 642161, "epoch": 7736} {"train_loss": -28.15899658203125, "global_step": 642162, "epoch": 7736} {"train_loss": -28.105871200561523, "global_step": 642163, "epoch": 7736} {"train_loss": -28.01885414123535, "global_step": 642164, "epoch": 7736} {"train_loss": -27.59857177734375, "global_step": 642165, "epoch": 7736} {"train_loss": -27.862607955932617, "global_step": 642166, "epoch": 7736} {"train_loss": -27.769153594970703, "global_step": 642167, "epoch": 7736} {"train_loss": -27.878942489624023, "global_step": 642168, "epoch": 7736} {"train_loss": -27.97736167907715, "global_step": 642169, "epoch": 7736} {"train_loss": -28.203383135508343, "global_step": 642170, "epoch": 7736, "val_loss": 6603466.0} {"train_loss": -26.235647201538086, "global_step": 642171, "epoch": 7737} {"train_loss": -26.813230514526367, "global_step": 642172, "epoch": 7737} {"train_loss": -26.53737449645996, "global_step": 642173, "epoch": 7737} {"train_loss": -27.596134185791016, "global_step": 642174, "epoch": 7737} {"train_loss": -26.574460983276367, "global_step": 642175, "epoch": 7737} {"train_loss": -27.5440673828125, "global_step": 642176, "epoch": 7737} {"train_loss": -26.98587417602539, "global_step": 642177, "epoch": 7737} {"train_loss": -27.149625778198242, "global_step": 642178, "epoch": 7737} {"train_loss": -27.859140396118164, "global_step": 642179, "epoch": 7737} {"train_loss": -27.305465698242188, "global_step": 642180, "epoch": 7737} {"train_loss": -27.870756149291992, "global_step": 642181, "epoch": 7737} {"train_loss": -27.652332305908203, "global_step": 642182, "epoch": 7737} {"train_loss": -27.900928497314453, "global_step": 642183, "epoch": 7737} {"train_loss": -27.501508712768555, "global_step": 642184, "epoch": 7737} {"train_loss": -27.549856185913086, "global_step": 642185, "epoch": 7737} {"train_loss": -27.378192901611328, "global_step": 642186, "epoch": 7737} {"train_loss": -27.70863151550293, "global_step": 642187, "epoch": 7737} {"train_loss": -27.989282608032227, "global_step": 642188, "epoch": 7737} {"train_loss": -27.968280792236328, "global_step": 642189, "epoch": 7737} {"train_loss": -27.980798721313477, "global_step": 642190, "epoch": 7737} {"train_loss": -27.4981689453125, "global_step": 642191, "epoch": 7737} {"train_loss": -27.815176010131836, "global_step": 642192, "epoch": 7737} {"train_loss": -27.75918960571289, "global_step": 642193, "epoch": 7737} {"train_loss": -27.78346061706543, "global_step": 642194, "epoch": 7737} {"train_loss": -28.030691146850586, "global_step": 642195, "epoch": 7737} {"train_loss": -27.822021484375, "global_step": 642196, "epoch": 7737} {"train_loss": -27.65065574645996, "global_step": 642197, "epoch": 7737} {"train_loss": -27.93976402282715, "global_step": 642198, "epoch": 7737} {"train_loss": -28.074567794799805, "global_step": 642199, "epoch": 7737} {"train_loss": -28.214313507080078, "global_step": 642200, "epoch": 7737} {"train_loss": -27.853681564331055, "global_step": 642201, "epoch": 7737} {"train_loss": -28.18830680847168, "global_step": 642202, "epoch": 7737} {"train_loss": -27.951446533203125, "global_step": 642203, "epoch": 7737} {"train_loss": -27.8597354888916, "global_step": 642204, "epoch": 7737} {"train_loss": -28.24338150024414, "global_step": 642205, "epoch": 7737} {"train_loss": -28.287677764892578, "global_step": 642206, "epoch": 7737} {"train_loss": -28.12387466430664, "global_step": 642207, "epoch": 7737} {"train_loss": -28.2093505859375, "global_step": 642208, "epoch": 7737} {"train_loss": -28.021514892578125, "global_step": 642209, "epoch": 7737} {"train_loss": -27.94244956970215, "global_step": 642210, "epoch": 7737} {"train_loss": -28.34469985961914, "global_step": 642211, "epoch": 7737} {"train_loss": -28.40399169921875, "global_step": 642212, "epoch": 7737} {"train_loss": -27.83298110961914, "global_step": 642213, "epoch": 7737} {"train_loss": -28.433612823486328, "global_step": 642214, "epoch": 7737} {"train_loss": -28.075611114501953, "global_step": 642215, "epoch": 7737} {"train_loss": -27.382841110229492, "global_step": 642216, "epoch": 7737} {"train_loss": -28.0239315032959, "global_step": 642217, "epoch": 7737} {"train_loss": -28.22174644470215, "global_step": 642218, "epoch": 7737} {"train_loss": -27.596792221069336, "global_step": 642219, "epoch": 7737} {"train_loss": -27.412641525268555, "global_step": 642220, "epoch": 7737} {"train_loss": -28.11821937561035, "global_step": 642221, "epoch": 7737} {"train_loss": -27.530920028686523, "global_step": 642222, "epoch": 7737} {"train_loss": -28.192914962768555, "global_step": 642223, "epoch": 7737} {"train_loss": -28.081140518188477, "global_step": 642224, "epoch": 7737} {"train_loss": -27.78403091430664, "global_step": 642225, "epoch": 7737} {"train_loss": -28.27347183227539, "global_step": 642226, "epoch": 7737} {"train_loss": -28.039947509765625, "global_step": 642227, "epoch": 7737} {"train_loss": -28.34759521484375, "global_step": 642228, "epoch": 7737} {"train_loss": -28.240203857421875, "global_step": 642229, "epoch": 7737} {"train_loss": -28.08846092224121, "global_step": 642230, "epoch": 7737} {"train_loss": -28.214757919311523, "global_step": 642231, "epoch": 7737} {"train_loss": -27.893659591674805, "global_step": 642232, "epoch": 7737} {"train_loss": -28.20401954650879, "global_step": 642233, "epoch": 7737} {"train_loss": -28.222686767578125, "global_step": 642234, "epoch": 7737} {"train_loss": -28.35481071472168, "global_step": 642235, "epoch": 7737} {"train_loss": -28.367223739624023, "global_step": 642236, "epoch": 7737} {"train_loss": -28.2514705657959, "global_step": 642237, "epoch": 7737} {"train_loss": -28.041553497314453, "global_step": 642238, "epoch": 7737} {"train_loss": -28.29360008239746, "global_step": 642239, "epoch": 7737} {"train_loss": -28.12579917907715, "global_step": 642240, "epoch": 7737} {"train_loss": -28.35443115234375, "global_step": 642241, "epoch": 7737} {"train_loss": -28.528955459594727, "global_step": 642242, "epoch": 7737} {"train_loss": -28.520742416381836, "global_step": 642243, "epoch": 7737} {"train_loss": -28.094329833984375, "global_step": 642244, "epoch": 7737} {"train_loss": -28.077606201171875, "global_step": 642245, "epoch": 7737} {"train_loss": -28.117395401000977, "global_step": 642246, "epoch": 7737} {"train_loss": -28.324737548828125, "global_step": 642247, "epoch": 7737} {"train_loss": -27.850927352905273, "global_step": 642248, "epoch": 7737} {"train_loss": -28.361249923706055, "global_step": 642249, "epoch": 7737} {"train_loss": -28.113595962524414, "global_step": 642250, "epoch": 7737} {"train_loss": -28.573352813720703, "global_step": 642251, "epoch": 7737} {"train_loss": -28.090845108032227, "global_step": 642252, "epoch": 7737} {"train_loss": -27.91805625823607, "global_step": 642253, "epoch": 7737, "val_loss": 6613131.0} {"train_loss": -26.778305053710938, "global_step": 642254, "epoch": 7738} {"train_loss": -25.781055450439453, "global_step": 642255, "epoch": 7738} {"train_loss": -26.2470760345459, "global_step": 642256, "epoch": 7738} {"train_loss": -27.2950496673584, "global_step": 642257, "epoch": 7738} {"train_loss": -27.34193229675293, "global_step": 642258, "epoch": 7738} {"train_loss": -26.476953506469727, "global_step": 642259, "epoch": 7738} {"train_loss": -27.175512313842773, "global_step": 642260, "epoch": 7738} {"train_loss": -27.5928897857666, "global_step": 642261, "epoch": 7738} {"train_loss": -26.69536781311035, "global_step": 642262, "epoch": 7738} {"train_loss": -27.963598251342773, "global_step": 642263, "epoch": 7738} {"train_loss": -27.698556900024414, "global_step": 642264, "epoch": 7738} {"train_loss": -27.44671058654785, "global_step": 642265, "epoch": 7738} {"train_loss": -27.827213287353516, "global_step": 642266, "epoch": 7738} {"train_loss": -27.770124435424805, "global_step": 642267, "epoch": 7738} {"train_loss": -28.316328048706055, "global_step": 642268, "epoch": 7738} {"train_loss": -27.83514976501465, "global_step": 642269, "epoch": 7738} {"train_loss": -27.820343017578125, "global_step": 642270, "epoch": 7738} {"train_loss": -27.263671875, "global_step": 642271, "epoch": 7738} {"train_loss": -28.352354049682617, "global_step": 642272, "epoch": 7738} {"train_loss": -27.90579605102539, "global_step": 642273, "epoch": 7738} {"train_loss": -28.078760147094727, "global_step": 642274, "epoch": 7738} {"train_loss": -27.993494033813477, "global_step": 642275, "epoch": 7738} {"train_loss": -27.94028091430664, "global_step": 642276, "epoch": 7738} {"train_loss": -27.893875122070312, "global_step": 642277, "epoch": 7738} {"train_loss": -27.996612548828125, "global_step": 642278, "epoch": 7738} {"train_loss": -28.22456169128418, "global_step": 642279, "epoch": 7738} {"train_loss": -28.101795196533203, "global_step": 642280, "epoch": 7738} {"train_loss": -27.97930335998535, "global_step": 642281, "epoch": 7738} {"train_loss": -28.102170944213867, "global_step": 642282, "epoch": 7738} {"train_loss": -28.20709228515625, "global_step": 642283, "epoch": 7738} {"train_loss": -28.08355140686035, "global_step": 642284, "epoch": 7738} {"train_loss": -27.8302059173584, "global_step": 642285, "epoch": 7738} {"train_loss": -28.4099178314209, "global_step": 642286, "epoch": 7738} {"train_loss": -28.248554229736328, "global_step": 642287, "epoch": 7738} {"train_loss": -28.46784019470215, "global_step": 642288, "epoch": 7738} {"train_loss": -28.132104873657227, "global_step": 642289, "epoch": 7738} {"train_loss": -28.155405044555664, "global_step": 642290, "epoch": 7738} {"train_loss": -28.479660034179688, "global_step": 642291, "epoch": 7738} {"train_loss": -28.420547485351562, "global_step": 642292, "epoch": 7738} {"train_loss": -28.547992706298828, "global_step": 642293, "epoch": 7738} {"train_loss": -28.356460571289062, "global_step": 642294, "epoch": 7738} {"train_loss": -27.959671020507812, "global_step": 642295, "epoch": 7738} {"train_loss": -28.74237060546875, "global_step": 642296, "epoch": 7738} {"train_loss": -28.40081787109375, "global_step": 642297, "epoch": 7738} {"train_loss": -28.501514434814453, "global_step": 642298, "epoch": 7738} {"train_loss": -28.151920318603516, "global_step": 642299, "epoch": 7738} {"train_loss": -28.37167739868164, "global_step": 642300, "epoch": 7738} {"train_loss": -28.426666259765625, "global_step": 642301, "epoch": 7738} {"train_loss": -28.4188232421875, "global_step": 642302, "epoch": 7738} {"train_loss": -28.317224502563477, "global_step": 642303, "epoch": 7738} {"train_loss": -28.533971786499023, "global_step": 642304, "epoch": 7738} {"train_loss": -28.66013526916504, "global_step": 642305, "epoch": 7738} {"train_loss": -28.604782104492188, "global_step": 642306, "epoch": 7738} {"train_loss": -28.401336669921875, "global_step": 642307, "epoch": 7738} {"train_loss": -28.7863826751709, "global_step": 642308, "epoch": 7738} {"train_loss": -28.08662223815918, "global_step": 642309, "epoch": 7738} {"train_loss": -28.382856369018555, "global_step": 642310, "epoch": 7738} {"train_loss": -28.51081657409668, "global_step": 642311, "epoch": 7738} {"train_loss": -28.2161922454834, "global_step": 642312, "epoch": 7738} {"train_loss": -28.31955909729004, "global_step": 642313, "epoch": 7738} {"train_loss": -28.452672958374023, "global_step": 642314, "epoch": 7738} {"train_loss": -28.384912490844727, "global_step": 642315, "epoch": 7738} {"train_loss": -28.409317016601562, "global_step": 642316, "epoch": 7738} {"train_loss": -28.36484718322754, "global_step": 642317, "epoch": 7738} {"train_loss": -28.0778751373291, "global_step": 642318, "epoch": 7738} {"train_loss": -28.489521026611328, "global_step": 642319, "epoch": 7738} {"train_loss": -28.504928588867188, "global_step": 642320, "epoch": 7738} {"train_loss": -28.32843589782715, "global_step": 642321, "epoch": 7738} {"train_loss": -27.968896865844727, "global_step": 642322, "epoch": 7738} {"train_loss": -28.177473068237305, "global_step": 642323, "epoch": 7738} {"train_loss": -28.52955436706543, "global_step": 642324, "epoch": 7738} {"train_loss": -28.29384422302246, "global_step": 642325, "epoch": 7738} {"train_loss": -28.452606201171875, "global_step": 642326, "epoch": 7738} {"train_loss": -28.503192901611328, "global_step": 642327, "epoch": 7738} {"train_loss": -28.5950984954834, "global_step": 642328, "epoch": 7738} {"train_loss": -28.372116088867188, "global_step": 642329, "epoch": 7738} {"train_loss": -28.08623695373535, "global_step": 642330, "epoch": 7738} {"train_loss": -28.9499568939209, "global_step": 642331, "epoch": 7738} {"train_loss": -28.366565704345703, "global_step": 642332, "epoch": 7738} {"train_loss": -28.433868408203125, "global_step": 642333, "epoch": 7738} {"train_loss": -28.46713638305664, "global_step": 642334, "epoch": 7738} {"train_loss": -28.188846588134766, "global_step": 642335, "epoch": 7738} {"train_loss": -28.091978509742095, "global_step": 642336, "epoch": 7738, "val_loss": 6646668.5} {"train_loss": -27.392078399658203, "global_step": 642337, "epoch": 7739} {"train_loss": -27.180585861206055, "global_step": 642338, "epoch": 7739} {"train_loss": -27.61713981628418, "global_step": 642339, "epoch": 7739} {"train_loss": -28.001638412475586, "global_step": 642340, "epoch": 7739} {"train_loss": -27.715612411499023, "global_step": 642341, "epoch": 7739} {"train_loss": -28.35931396484375, "global_step": 642342, "epoch": 7739} {"train_loss": -27.870458602905273, "global_step": 642343, "epoch": 7739} {"train_loss": -27.78431510925293, "global_step": 642344, "epoch": 7739} {"train_loss": -28.05544090270996, "global_step": 642345, "epoch": 7739} {"train_loss": -28.321264266967773, "global_step": 642346, "epoch": 7739} {"train_loss": -28.314085006713867, "global_step": 642347, "epoch": 7739} {"train_loss": -28.04620933532715, "global_step": 642348, "epoch": 7739} {"train_loss": -27.830286026000977, "global_step": 642349, "epoch": 7739} {"train_loss": -28.0217342376709, "global_step": 642350, "epoch": 7739} {"train_loss": -28.569421768188477, "global_step": 642351, "epoch": 7739} {"train_loss": -28.246749877929688, "global_step": 642352, "epoch": 7739} {"train_loss": -28.18661880493164, "global_step": 642353, "epoch": 7739} {"train_loss": -27.93973731994629, "global_step": 642354, "epoch": 7739} {"train_loss": -28.172773361206055, "global_step": 642355, "epoch": 7739} {"train_loss": -28.293304443359375, "global_step": 642356, "epoch": 7739} {"train_loss": -28.330474853515625, "global_step": 642357, "epoch": 7739} {"train_loss": -28.400671005249023, "global_step": 642358, "epoch": 7739} {"train_loss": -28.527280807495117, "global_step": 642359, "epoch": 7739} {"train_loss": -28.434289932250977, "global_step": 642360, "epoch": 7739} {"train_loss": -28.113754272460938, "global_step": 642361, "epoch": 7739} {"train_loss": -28.220691680908203, "global_step": 642362, "epoch": 7739} {"train_loss": -28.418439865112305, "global_step": 642363, "epoch": 7739} {"train_loss": -28.461811065673828, "global_step": 642364, "epoch": 7739} {"train_loss": -28.616003036499023, "global_step": 642365, "epoch": 7739} {"train_loss": -27.830570220947266, "global_step": 642366, "epoch": 7739} {"train_loss": -28.485992431640625, "global_step": 642367, "epoch": 7739} {"train_loss": -28.219928741455078, "global_step": 642368, "epoch": 7739} {"train_loss": -28.443368911743164, "global_step": 642369, "epoch": 7739} {"train_loss": -27.96941566467285, "global_step": 642370, "epoch": 7739} {"train_loss": -28.218231201171875, "global_step": 642371, "epoch": 7739} {"train_loss": -28.319828033447266, "global_step": 642372, "epoch": 7739} {"train_loss": -27.930023193359375, "global_step": 642373, "epoch": 7739} {"train_loss": -28.250396728515625, "global_step": 642374, "epoch": 7739} {"train_loss": -28.328229904174805, "global_step": 642375, "epoch": 7739} {"train_loss": -28.173614501953125, "global_step": 642376, "epoch": 7739} {"train_loss": -28.898544311523438, "global_step": 642377, "epoch": 7739} {"train_loss": -28.233489990234375, "global_step": 642378, "epoch": 7739} {"train_loss": -28.07448387145996, "global_step": 642379, "epoch": 7739} {"train_loss": -28.156599044799805, "global_step": 642380, "epoch": 7739} {"train_loss": -28.694555282592773, "global_step": 642381, "epoch": 7739} {"train_loss": -28.570585250854492, "global_step": 642382, "epoch": 7739} {"train_loss": -28.418912887573242, "global_step": 642383, "epoch": 7739} {"train_loss": -28.380704879760742, "global_step": 642384, "epoch": 7739} {"train_loss": -28.4051456451416, "global_step": 642385, "epoch": 7739} {"train_loss": -28.24506950378418, "global_step": 642386, "epoch": 7739} {"train_loss": -28.706974029541016, "global_step": 642387, "epoch": 7739} {"train_loss": -28.529224395751953, "global_step": 642388, "epoch": 7739} {"train_loss": -28.058277130126953, "global_step": 642389, "epoch": 7739} {"train_loss": -28.48381996154785, "global_step": 642390, "epoch": 7739} {"train_loss": -28.346837997436523, "global_step": 642391, "epoch": 7739} {"train_loss": -28.423736572265625, "global_step": 642392, "epoch": 7739} {"train_loss": -28.215229034423828, "global_step": 642393, "epoch": 7739} {"train_loss": -28.304391860961914, "global_step": 642394, "epoch": 7739} {"train_loss": -28.08057975769043, "global_step": 642395, "epoch": 7739} {"train_loss": -28.729877471923828, "global_step": 642396, "epoch": 7739} {"train_loss": -28.502241134643555, "global_step": 642397, "epoch": 7739} {"train_loss": -28.079559326171875, "global_step": 642398, "epoch": 7739} {"train_loss": -28.317087173461914, "global_step": 642399, "epoch": 7739} {"train_loss": -28.74921226501465, "global_step": 642400, "epoch": 7739} {"train_loss": -28.0731201171875, "global_step": 642401, "epoch": 7739} {"train_loss": -28.39435386657715, "global_step": 642402, "epoch": 7739} {"train_loss": -28.25858497619629, "global_step": 642403, "epoch": 7739} {"train_loss": -28.41934585571289, "global_step": 642404, "epoch": 7739} {"train_loss": -28.282629013061523, "global_step": 642405, "epoch": 7739} {"train_loss": -27.956787109375, "global_step": 642406, "epoch": 7739} {"train_loss": -28.319854736328125, "global_step": 642407, "epoch": 7739} {"train_loss": -28.035043716430664, "global_step": 642408, "epoch": 7739} {"train_loss": -28.294031143188477, "global_step": 642409, "epoch": 7739} {"train_loss": -28.1451358795166, "global_step": 642410, "epoch": 7739} {"train_loss": -28.524328231811523, "global_step": 642411, "epoch": 7739} {"train_loss": -28.394733428955078, "global_step": 642412, "epoch": 7739} {"train_loss": -28.62690544128418, "global_step": 642413, "epoch": 7739} {"train_loss": -28.167926788330078, "global_step": 642414, "epoch": 7739} {"train_loss": -28.3306884765625, "global_step": 642415, "epoch": 7739} {"train_loss": -28.40803337097168, "global_step": 642416, "epoch": 7739} {"train_loss": -28.79833984375, "global_step": 642417, "epoch": 7739} {"train_loss": -28.55531120300293, "global_step": 642418, "epoch": 7739} {"train_loss": -28.263597396482904, "global_step": 642419, "epoch": 7739, "val_loss": 6614212.5} {"train_loss": -27.04128074645996, "global_step": 642420, "epoch": 7740} {"train_loss": -27.854358673095703, "global_step": 642421, "epoch": 7740} {"train_loss": -27.984296798706055, "global_step": 642422, "epoch": 7740} {"train_loss": -27.905378341674805, "global_step": 642423, "epoch": 7740} {"train_loss": -27.231842041015625, "global_step": 642424, "epoch": 7740} {"train_loss": -27.55322265625, "global_step": 642425, "epoch": 7740} {"train_loss": -27.256622314453125, "global_step": 642426, "epoch": 7740} {"train_loss": -27.3520450592041, "global_step": 642427, "epoch": 7740} {"train_loss": -27.81038475036621, "global_step": 642428, "epoch": 7740} {"train_loss": -27.455535888671875, "global_step": 642429, "epoch": 7740} {"train_loss": -27.341413497924805, "global_step": 642430, "epoch": 7740} {"train_loss": -27.96990394592285, "global_step": 642431, "epoch": 7740} {"train_loss": -27.502710342407227, "global_step": 642432, "epoch": 7740} {"train_loss": -27.52740478515625, "global_step": 642433, "epoch": 7740} {"train_loss": -27.81321144104004, "global_step": 642434, "epoch": 7740} {"train_loss": -27.86268424987793, "global_step": 642435, "epoch": 7740} {"train_loss": -27.49700927734375, "global_step": 642436, "epoch": 7740} {"train_loss": -27.619733810424805, "global_step": 642437, "epoch": 7740} {"train_loss": -27.77425193786621, "global_step": 642438, "epoch": 7740} {"train_loss": -27.8720645904541, "global_step": 642439, "epoch": 7740} {"train_loss": -27.514053344726562, "global_step": 642440, "epoch": 7740} {"train_loss": -28.14227294921875, "global_step": 642441, "epoch": 7740} {"train_loss": -27.865161895751953, "global_step": 642442, "epoch": 7740} {"train_loss": -27.996816635131836, "global_step": 642443, "epoch": 7740} {"train_loss": -28.25728416442871, "global_step": 642444, "epoch": 7740} {"train_loss": -28.135101318359375, "global_step": 642445, "epoch": 7740} {"train_loss": -28.479223251342773, "global_step": 642446, "epoch": 7740} {"train_loss": -27.792707443237305, "global_step": 642447, "epoch": 7740} {"train_loss": -28.2523250579834, "global_step": 642448, "epoch": 7740} {"train_loss": -28.459503173828125, "global_step": 642449, "epoch": 7740} {"train_loss": -28.016284942626953, "global_step": 642450, "epoch": 7740} {"train_loss": -28.082197189331055, "global_step": 642451, "epoch": 7740} {"train_loss": -28.204833984375, "global_step": 642452, "epoch": 7740} {"train_loss": -28.13722038269043, "global_step": 642453, "epoch": 7740} {"train_loss": -28.375085830688477, "global_step": 642454, "epoch": 7740} {"train_loss": -28.372236251831055, "global_step": 642455, "epoch": 7740} {"train_loss": -28.154865264892578, "global_step": 642456, "epoch": 7740} {"train_loss": -28.624189376831055, "global_step": 642457, "epoch": 7740} {"train_loss": -28.426544189453125, "global_step": 642458, "epoch": 7740} {"train_loss": -28.40675163269043, "global_step": 642459, "epoch": 7740} {"train_loss": -28.295074462890625, "global_step": 642460, "epoch": 7740} {"train_loss": -28.090742111206055, "global_step": 642461, "epoch": 7740} {"train_loss": -28.623937606811523, "global_step": 642462, "epoch": 7740} {"train_loss": -28.17425537109375, "global_step": 642463, "epoch": 7740} {"train_loss": -28.2814998626709, "global_step": 642464, "epoch": 7740} {"train_loss": -28.631139755249023, "global_step": 642465, "epoch": 7740} {"train_loss": -28.347400665283203, "global_step": 642466, "epoch": 7740} {"train_loss": -28.476642608642578, "global_step": 642467, "epoch": 7740} {"train_loss": -28.2534122467041, "global_step": 642468, "epoch": 7740} {"train_loss": -28.270048141479492, "global_step": 642469, "epoch": 7740} {"train_loss": -28.261993408203125, "global_step": 642470, "epoch": 7740} {"train_loss": -28.069379806518555, "global_step": 642471, "epoch": 7740} {"train_loss": -28.075292587280273, "global_step": 642472, "epoch": 7740} {"train_loss": -28.284515380859375, "global_step": 642473, "epoch": 7740} {"train_loss": -28.146100997924805, "global_step": 642474, "epoch": 7740} {"train_loss": -28.133569717407227, "global_step": 642475, "epoch": 7740} {"train_loss": -28.0769100189209, "global_step": 642476, "epoch": 7740} {"train_loss": -28.17555046081543, "global_step": 642477, "epoch": 7740} {"train_loss": -28.269363403320312, "global_step": 642478, "epoch": 7740} {"train_loss": -28.041494369506836, "global_step": 642479, "epoch": 7740} {"train_loss": -27.958133697509766, "global_step": 642480, "epoch": 7740} {"train_loss": -28.4357852935791, "global_step": 642481, "epoch": 7740} {"train_loss": -28.401655197143555, "global_step": 642482, "epoch": 7740} {"train_loss": -28.600238800048828, "global_step": 642483, "epoch": 7740} {"train_loss": -28.3380184173584, "global_step": 642484, "epoch": 7740} {"train_loss": -28.482040405273438, "global_step": 642485, "epoch": 7740} {"train_loss": -28.369001388549805, "global_step": 642486, "epoch": 7740} {"train_loss": -28.471912384033203, "global_step": 642487, "epoch": 7740} {"train_loss": -28.504913330078125, "global_step": 642488, "epoch": 7740} {"train_loss": -28.294946670532227, "global_step": 642489, "epoch": 7740} {"train_loss": -28.40011978149414, "global_step": 642490, "epoch": 7740} {"train_loss": -28.32614517211914, "global_step": 642491, "epoch": 7740} {"train_loss": -28.61679458618164, "global_step": 642492, "epoch": 7740} {"train_loss": -28.288854598999023, "global_step": 642493, "epoch": 7740} {"train_loss": -28.560516357421875, "global_step": 642494, "epoch": 7740} {"train_loss": -28.609210968017578, "global_step": 642495, "epoch": 7740} {"train_loss": -28.70711326599121, "global_step": 642496, "epoch": 7740} {"train_loss": -28.683996200561523, "global_step": 642497, "epoch": 7740} {"train_loss": -28.34453773498535, "global_step": 642498, "epoch": 7740} {"train_loss": -27.915424346923828, "global_step": 642499, "epoch": 7740} {"train_loss": -28.209165573120117, "global_step": 642500, "epoch": 7740} {"train_loss": -28.447772979736328, "global_step": 642501, "epoch": 7740} {"train_loss": -28.12951758970697, "global_step": 642502, "epoch": 7740, "val_loss": 6645331.0} {"train_loss": -27.63037109375, "global_step": 642503, "epoch": 7741} {"train_loss": -27.008520126342773, "global_step": 642504, "epoch": 7741} {"train_loss": -27.368223190307617, "global_step": 642505, "epoch": 7741} {"train_loss": -27.835397720336914, "global_step": 642506, "epoch": 7741} {"train_loss": -27.66410255432129, "global_step": 642507, "epoch": 7741} {"train_loss": -27.877582550048828, "global_step": 642508, "epoch": 7741} {"train_loss": -27.819189071655273, "global_step": 642509, "epoch": 7741} {"train_loss": -27.840463638305664, "global_step": 642510, "epoch": 7741} {"train_loss": -28.10443115234375, "global_step": 642511, "epoch": 7741} {"train_loss": -28.376279830932617, "global_step": 642512, "epoch": 7741} {"train_loss": -28.055566787719727, "global_step": 642513, "epoch": 7741} {"train_loss": -28.15692710876465, "global_step": 642514, "epoch": 7741} {"train_loss": -28.1151123046875, "global_step": 642515, "epoch": 7741} {"train_loss": -27.565174102783203, "global_step": 642516, "epoch": 7741} {"train_loss": -28.111328125, "global_step": 642517, "epoch": 7741} {"train_loss": -27.948535919189453, "global_step": 642518, "epoch": 7741} {"train_loss": -28.318708419799805, "global_step": 642519, "epoch": 7741} {"train_loss": -27.88022804260254, "global_step": 642520, "epoch": 7741} {"train_loss": -27.84404945373535, "global_step": 642521, "epoch": 7741} {"train_loss": -27.586502075195312, "global_step": 642522, "epoch": 7741} {"train_loss": -28.282087326049805, "global_step": 642523, "epoch": 7741} {"train_loss": -27.998884201049805, "global_step": 642524, "epoch": 7741} {"train_loss": -27.970462799072266, "global_step": 642525, "epoch": 7741} {"train_loss": -28.3326473236084, "global_step": 642526, "epoch": 7741} {"train_loss": -28.036725997924805, "global_step": 642527, "epoch": 7741} {"train_loss": -28.216388702392578, "global_step": 642528, "epoch": 7741} {"train_loss": -27.991809844970703, "global_step": 642529, "epoch": 7741} {"train_loss": -28.263782501220703, "global_step": 642530, "epoch": 7741} {"train_loss": -28.333087921142578, "global_step": 642531, "epoch": 7741} {"train_loss": -28.010358810424805, "global_step": 642532, "epoch": 7741} {"train_loss": -28.369043350219727, "global_step": 642533, "epoch": 7741} {"train_loss": -28.352127075195312, "global_step": 642534, "epoch": 7741} {"train_loss": -28.536197662353516, "global_step": 642535, "epoch": 7741} {"train_loss": -28.126569747924805, "global_step": 642536, "epoch": 7741} {"train_loss": -28.366376876831055, "global_step": 642537, "epoch": 7741} {"train_loss": -27.87579917907715, "global_step": 642538, "epoch": 7741} {"train_loss": -28.642343521118164, "global_step": 642539, "epoch": 7741} {"train_loss": -28.222726821899414, "global_step": 642540, "epoch": 7741} {"train_loss": -28.318090438842773, "global_step": 642541, "epoch": 7741} {"train_loss": -28.4283447265625, "global_step": 642542, "epoch": 7741} {"train_loss": -28.314319610595703, "global_step": 642543, "epoch": 7741} {"train_loss": -28.42020034790039, "global_step": 642544, "epoch": 7741} {"train_loss": -28.633520126342773, "global_step": 642545, "epoch": 7741} {"train_loss": -28.393796920776367, "global_step": 642546, "epoch": 7741} {"train_loss": -28.316904067993164, "global_step": 642547, "epoch": 7741} {"train_loss": -28.525531768798828, "global_step": 642548, "epoch": 7741} {"train_loss": -28.275060653686523, "global_step": 642549, "epoch": 7741} {"train_loss": -28.518085479736328, "global_step": 642550, "epoch": 7741} {"train_loss": -28.130207061767578, "global_step": 642551, "epoch": 7741} {"train_loss": -28.47907829284668, "global_step": 642552, "epoch": 7741} {"train_loss": -28.557605743408203, "global_step": 642553, "epoch": 7741} {"train_loss": -28.465656280517578, "global_step": 642554, "epoch": 7741} {"train_loss": -28.771560668945312, "global_step": 642555, "epoch": 7741} {"train_loss": -28.45524024963379, "global_step": 642556, "epoch": 7741} {"train_loss": -28.650205612182617, "global_step": 642557, "epoch": 7741} {"train_loss": -28.24476432800293, "global_step": 642558, "epoch": 7741} {"train_loss": -28.47354507446289, "global_step": 642559, "epoch": 7741} {"train_loss": -28.47718620300293, "global_step": 642560, "epoch": 7741} {"train_loss": -28.621784210205078, "global_step": 642561, "epoch": 7741} {"train_loss": -27.994775772094727, "global_step": 642562, "epoch": 7741} {"train_loss": -28.031742095947266, "global_step": 642563, "epoch": 7741} {"train_loss": -28.292638778686523, "global_step": 642564, "epoch": 7741} {"train_loss": -28.301427841186523, "global_step": 642565, "epoch": 7741} {"train_loss": -28.519067764282227, "global_step": 642566, "epoch": 7741} {"train_loss": -28.197113037109375, "global_step": 642567, "epoch": 7741} {"train_loss": -27.9937744140625, "global_step": 642568, "epoch": 7741} {"train_loss": -28.302465438842773, "global_step": 642569, "epoch": 7741} {"train_loss": -28.297321319580078, "global_step": 642570, "epoch": 7741} {"train_loss": -28.4010009765625, "global_step": 642571, "epoch": 7741} {"train_loss": -27.806249618530273, "global_step": 642572, "epoch": 7741} {"train_loss": -28.196943283081055, "global_step": 642573, "epoch": 7741} {"train_loss": -27.806562423706055, "global_step": 642574, "epoch": 7741} {"train_loss": -28.257612228393555, "global_step": 642575, "epoch": 7741} {"train_loss": -28.1124324798584, "global_step": 642576, "epoch": 7741} {"train_loss": -28.510986328125, "global_step": 642577, "epoch": 7741} {"train_loss": -28.173263549804688, "global_step": 642578, "epoch": 7741} {"train_loss": -28.332443237304688, "global_step": 642579, "epoch": 7741} {"train_loss": -28.138046264648438, "global_step": 642580, "epoch": 7741} {"train_loss": -28.007953643798828, "global_step": 642581, "epoch": 7741} {"train_loss": -28.248157501220703, "global_step": 642582, "epoch": 7741} {"train_loss": -28.19917106628418, "global_step": 642583, "epoch": 7741} {"train_loss": -28.193225860595703, "global_step": 642584, "epoch": 7741} {"train_loss": -28.194337408226655, "global_step": 642585, "epoch": 7741, "val_loss": 6683591.0} {"train_loss": -27.649499893188477, "global_step": 642586, "epoch": 7742} {"train_loss": -27.75029945373535, "global_step": 642587, "epoch": 7742} {"train_loss": -27.8407039642334, "global_step": 642588, "epoch": 7742} {"train_loss": -27.54361343383789, "global_step": 642589, "epoch": 7742} {"train_loss": -27.865100860595703, "global_step": 642590, "epoch": 7742} {"train_loss": -27.578283309936523, "global_step": 642591, "epoch": 7742} {"train_loss": -27.602502822875977, "global_step": 642592, "epoch": 7742} {"train_loss": -28.074329376220703, "global_step": 642593, "epoch": 7742} {"train_loss": -27.959070205688477, "global_step": 642594, "epoch": 7742} {"train_loss": -27.795270919799805, "global_step": 642595, "epoch": 7742} {"train_loss": -28.17262840270996, "global_step": 642596, "epoch": 7742} {"train_loss": -28.219938278198242, "global_step": 642597, "epoch": 7742} {"train_loss": -27.994123458862305, "global_step": 642598, "epoch": 7742} {"train_loss": -28.129667282104492, "global_step": 642599, "epoch": 7742} {"train_loss": -28.17551612854004, "global_step": 642600, "epoch": 7742} {"train_loss": -28.128416061401367, "global_step": 642601, "epoch": 7742} {"train_loss": -28.232404708862305, "global_step": 642602, "epoch": 7742} {"train_loss": -28.31982421875, "global_step": 642603, "epoch": 7742} {"train_loss": -27.97686767578125, "global_step": 642604, "epoch": 7742} {"train_loss": -28.47259521484375, "global_step": 642605, "epoch": 7742} {"train_loss": -28.3315372467041, "global_step": 642606, "epoch": 7742} {"train_loss": -27.8222713470459, "global_step": 642607, "epoch": 7742} {"train_loss": -28.123159408569336, "global_step": 642608, "epoch": 7742} {"train_loss": -28.034528732299805, "global_step": 642609, "epoch": 7742} {"train_loss": -27.990894317626953, "global_step": 642610, "epoch": 7742} {"train_loss": -27.980005264282227, "global_step": 642611, "epoch": 7742} {"train_loss": -28.3053035736084, "global_step": 642612, "epoch": 7742} {"train_loss": -28.088048934936523, "global_step": 642613, "epoch": 7742} {"train_loss": -28.43604850769043, "global_step": 642614, "epoch": 7742} {"train_loss": -28.21575927734375, "global_step": 642615, "epoch": 7742} {"train_loss": -28.363361358642578, "global_step": 642616, "epoch": 7742} {"train_loss": -28.5445499420166, "global_step": 642617, "epoch": 7742} {"train_loss": -28.3158016204834, "global_step": 642618, "epoch": 7742} {"train_loss": -28.309518814086914, "global_step": 642619, "epoch": 7742} {"train_loss": -28.516489028930664, "global_step": 642620, "epoch": 7742} {"train_loss": -28.234472274780273, "global_step": 642621, "epoch": 7742} {"train_loss": -28.360187530517578, "global_step": 642622, "epoch": 7742} {"train_loss": -28.7030086517334, "global_step": 642623, "epoch": 7742} {"train_loss": -28.5559024810791, "global_step": 642624, "epoch": 7742} {"train_loss": -28.254608154296875, "global_step": 642625, "epoch": 7742} {"train_loss": -28.4158878326416, "global_step": 642626, "epoch": 7742} {"train_loss": -28.265594482421875, "global_step": 642627, "epoch": 7742} {"train_loss": -28.6433162689209, "global_step": 642628, "epoch": 7742} {"train_loss": -28.247129440307617, "global_step": 642629, "epoch": 7742} {"train_loss": -28.80607032775879, "global_step": 642630, "epoch": 7742} {"train_loss": -28.725019454956055, "global_step": 642631, "epoch": 7742} {"train_loss": -28.47696304321289, "global_step": 642632, "epoch": 7742} {"train_loss": -28.254682540893555, "global_step": 642633, "epoch": 7742} {"train_loss": -28.476449966430664, "global_step": 642634, "epoch": 7742} {"train_loss": -28.540607452392578, "global_step": 642635, "epoch": 7742} {"train_loss": -28.325820922851562, "global_step": 642636, "epoch": 7742} {"train_loss": -28.16731834411621, "global_step": 642637, "epoch": 7742} {"train_loss": -28.277210235595703, "global_step": 642638, "epoch": 7742} {"train_loss": -27.983617782592773, "global_step": 642639, "epoch": 7742} {"train_loss": -28.513675689697266, "global_step": 642640, "epoch": 7742} {"train_loss": -28.312963485717773, "global_step": 642641, "epoch": 7742} {"train_loss": -27.993085861206055, "global_step": 642642, "epoch": 7742} {"train_loss": -28.370426177978516, "global_step": 642643, "epoch": 7742} {"train_loss": -28.39388084411621, "global_step": 642644, "epoch": 7742} {"train_loss": -28.1859130859375, "global_step": 642645, "epoch": 7742} {"train_loss": -27.96481704711914, "global_step": 642646, "epoch": 7742} {"train_loss": -27.943927764892578, "global_step": 642647, "epoch": 7742} {"train_loss": -28.25379753112793, "global_step": 642648, "epoch": 7742} {"train_loss": -28.343130111694336, "global_step": 642649, "epoch": 7742} {"train_loss": -28.548913955688477, "global_step": 642650, "epoch": 7742} {"train_loss": -28.55183219909668, "global_step": 642651, "epoch": 7742} {"train_loss": -27.896726608276367, "global_step": 642652, "epoch": 7742} {"train_loss": -27.834537506103516, "global_step": 642653, "epoch": 7742} {"train_loss": -27.78619384765625, "global_step": 642654, "epoch": 7742} {"train_loss": -27.957935333251953, "global_step": 642655, "epoch": 7742} {"train_loss": -28.304426193237305, "global_step": 642656, "epoch": 7742} {"train_loss": -28.565107345581055, "global_step": 642657, "epoch": 7742} {"train_loss": -28.053619384765625, "global_step": 642658, "epoch": 7742} {"train_loss": -27.881330490112305, "global_step": 642659, "epoch": 7742} {"train_loss": -27.891193389892578, "global_step": 642660, "epoch": 7742} {"train_loss": -28.687366485595703, "global_step": 642661, "epoch": 7742} {"train_loss": -28.46231460571289, "global_step": 642662, "epoch": 7742} {"train_loss": -28.0085391998291, "global_step": 642663, "epoch": 7742} {"train_loss": -27.931013107299805, "global_step": 642664, "epoch": 7742} {"train_loss": -28.01008415222168, "global_step": 642665, "epoch": 7742} {"train_loss": -28.17717933654785, "global_step": 642666, "epoch": 7742} {"train_loss": -27.937421798706055, "global_step": 642667, "epoch": 7742} {"train_loss": -28.17621463178152, "global_step": 642668, "epoch": 7742, "val_loss": 6599161.0} {"train_loss": -27.590625762939453, "global_step": 642669, "epoch": 7743} {"train_loss": -27.961206436157227, "global_step": 642670, "epoch": 7743} {"train_loss": -28.065933227539062, "global_step": 642671, "epoch": 7743} {"train_loss": -27.394201278686523, "global_step": 642672, "epoch": 7743} {"train_loss": -28.30988121032715, "global_step": 642673, "epoch": 7743} {"train_loss": -28.252735137939453, "global_step": 642674, "epoch": 7743} {"train_loss": -27.805273056030273, "global_step": 642675, "epoch": 7743} {"train_loss": -27.952533721923828, "global_step": 642676, "epoch": 7743} {"train_loss": -27.943204879760742, "global_step": 642677, "epoch": 7743} {"train_loss": -27.806432723999023, "global_step": 642678, "epoch": 7743} {"train_loss": -28.5321044921875, "global_step": 642679, "epoch": 7743} {"train_loss": -27.648014068603516, "global_step": 642680, "epoch": 7743} {"train_loss": -28.031476974487305, "global_step": 642681, "epoch": 7743} {"train_loss": -28.09848403930664, "global_step": 642682, "epoch": 7743} {"train_loss": -27.68609046936035, "global_step": 642683, "epoch": 7743} {"train_loss": -28.08893394470215, "global_step": 642684, "epoch": 7743} {"train_loss": -27.96380043029785, "global_step": 642685, "epoch": 7743} {"train_loss": -27.832351684570312, "global_step": 642686, "epoch": 7743} {"train_loss": -27.853017807006836, "global_step": 642687, "epoch": 7743} {"train_loss": -28.262481689453125, "global_step": 642688, "epoch": 7743} {"train_loss": -28.158422470092773, "global_step": 642689, "epoch": 7743} {"train_loss": -27.893014907836914, "global_step": 642690, "epoch": 7743} {"train_loss": -27.84781837463379, "global_step": 642691, "epoch": 7743} {"train_loss": -28.177820205688477, "global_step": 642692, "epoch": 7743} {"train_loss": -28.244037628173828, "global_step": 642693, "epoch": 7743} {"train_loss": -27.968900680541992, "global_step": 642694, "epoch": 7743} {"train_loss": -28.409896850585938, "global_step": 642695, "epoch": 7743} {"train_loss": -28.001672744750977, "global_step": 642696, "epoch": 7743} {"train_loss": -28.432891845703125, "global_step": 642697, "epoch": 7743} {"train_loss": -28.352447509765625, "global_step": 642698, "epoch": 7743} {"train_loss": -28.186899185180664, "global_step": 642699, "epoch": 7743} {"train_loss": -27.860275268554688, "global_step": 642700, "epoch": 7743} {"train_loss": -28.482213973999023, "global_step": 642701, "epoch": 7743} {"train_loss": -28.192174911499023, "global_step": 642702, "epoch": 7743} {"train_loss": -28.69459342956543, "global_step": 642703, "epoch": 7743} {"train_loss": -28.283411026000977, "global_step": 642704, "epoch": 7743} {"train_loss": -28.320947647094727, "global_step": 642705, "epoch": 7743} {"train_loss": -28.320240020751953, "global_step": 642706, "epoch": 7743} {"train_loss": -28.309436798095703, "global_step": 642707, "epoch": 7743} {"train_loss": -28.17999839782715, "global_step": 642708, "epoch": 7743} {"train_loss": -28.507287979125977, "global_step": 642709, "epoch": 7743} {"train_loss": -28.077024459838867, "global_step": 642710, "epoch": 7743} {"train_loss": -28.0762882232666, "global_step": 642711, "epoch": 7743} {"train_loss": -28.283832550048828, "global_step": 642712, "epoch": 7743} {"train_loss": -28.428091049194336, "global_step": 642713, "epoch": 7743} {"train_loss": -28.311880111694336, "global_step": 642714, "epoch": 7743} {"train_loss": -28.2869815826416, "global_step": 642715, "epoch": 7743} {"train_loss": -28.660242080688477, "global_step": 642716, "epoch": 7743} {"train_loss": -28.464719772338867, "global_step": 642717, "epoch": 7743} {"train_loss": -28.418725967407227, "global_step": 642718, "epoch": 7743} {"train_loss": -28.390090942382812, "global_step": 642719, "epoch": 7743} {"train_loss": -28.445453643798828, "global_step": 642720, "epoch": 7743} {"train_loss": -28.266225814819336, "global_step": 642721, "epoch": 7743} {"train_loss": -28.108007431030273, "global_step": 642722, "epoch": 7743} {"train_loss": -28.554162979125977, "global_step": 642723, "epoch": 7743} {"train_loss": -28.19832420349121, "global_step": 642724, "epoch": 7743} {"train_loss": -28.441333770751953, "global_step": 642725, "epoch": 7743} {"train_loss": -28.07391929626465, "global_step": 642726, "epoch": 7743} {"train_loss": -28.364948272705078, "global_step": 642727, "epoch": 7743} {"train_loss": -27.809711456298828, "global_step": 642728, "epoch": 7743} {"train_loss": -27.912628173828125, "global_step": 642729, "epoch": 7743} {"train_loss": -27.659284591674805, "global_step": 642730, "epoch": 7743} {"train_loss": -28.092529296875, "global_step": 642731, "epoch": 7743} {"train_loss": -28.448745727539062, "global_step": 642732, "epoch": 7743} {"train_loss": -28.230878829956055, "global_step": 642733, "epoch": 7743} {"train_loss": -28.29648208618164, "global_step": 642734, "epoch": 7743} {"train_loss": -28.09346580505371, "global_step": 642735, "epoch": 7743} {"train_loss": -28.33200454711914, "global_step": 642736, "epoch": 7743} {"train_loss": -27.859848022460938, "global_step": 642737, "epoch": 7743} {"train_loss": -27.705839157104492, "global_step": 642738, "epoch": 7743} {"train_loss": -28.047277450561523, "global_step": 642739, "epoch": 7743} {"train_loss": -28.230945587158203, "global_step": 642740, "epoch": 7743} {"train_loss": -27.922393798828125, "global_step": 642741, "epoch": 7743} {"train_loss": -28.0175724029541, "global_step": 642742, "epoch": 7743} {"train_loss": -28.219852447509766, "global_step": 642743, "epoch": 7743} {"train_loss": -28.020587921142578, "global_step": 642744, "epoch": 7743} {"train_loss": -28.26508140563965, "global_step": 642745, "epoch": 7743} {"train_loss": -27.959936141967773, "global_step": 642746, "epoch": 7743} {"train_loss": -28.376890182495117, "global_step": 642747, "epoch": 7743} {"train_loss": -28.320758819580078, "global_step": 642748, "epoch": 7743} {"train_loss": -28.345483779907227, "global_step": 642749, "epoch": 7743} {"train_loss": -28.18507194519043, "global_step": 642750, "epoch": 7743} {"train_loss": -28.158331353980376, "global_step": 642751, "epoch": 7743, "val_loss": 6700456.0} {"train_loss": -27.729755401611328, "global_step": 642752, "epoch": 7744} {"train_loss": -27.21442222595215, "global_step": 642753, "epoch": 7744} {"train_loss": -27.657629013061523, "global_step": 642754, "epoch": 7744} {"train_loss": -27.552001953125, "global_step": 642755, "epoch": 7744} {"train_loss": -27.44487953186035, "global_step": 642756, "epoch": 7744} {"train_loss": -27.734821319580078, "global_step": 642757, "epoch": 7744} {"train_loss": -27.85890007019043, "global_step": 642758, "epoch": 7744} {"train_loss": -27.588821411132812, "global_step": 642759, "epoch": 7744} {"train_loss": -27.64422035217285, "global_step": 642760, "epoch": 7744} {"train_loss": -27.968017578125, "global_step": 642761, "epoch": 7744} {"train_loss": -27.67207145690918, "global_step": 642762, "epoch": 7744} {"train_loss": -27.7251033782959, "global_step": 642763, "epoch": 7744} {"train_loss": -27.847936630249023, "global_step": 642764, "epoch": 7744} {"train_loss": -28.09341812133789, "global_step": 642765, "epoch": 7744} {"train_loss": -27.894336700439453, "global_step": 642766, "epoch": 7744} {"train_loss": -27.94965171813965, "global_step": 642767, "epoch": 7744} {"train_loss": -28.1151065826416, "global_step": 642768, "epoch": 7744} {"train_loss": -28.00965690612793, "global_step": 642769, "epoch": 7744} {"train_loss": -28.153701782226562, "global_step": 642770, "epoch": 7744} {"train_loss": -28.11171531677246, "global_step": 642771, "epoch": 7744} {"train_loss": -28.290740966796875, "global_step": 642772, "epoch": 7744} {"train_loss": -28.02594566345215, "global_step": 642773, "epoch": 7744} {"train_loss": -28.141555786132812, "global_step": 642774, "epoch": 7744} {"train_loss": -28.15095329284668, "global_step": 642775, "epoch": 7744} {"train_loss": -28.753904342651367, "global_step": 642776, "epoch": 7744} {"train_loss": -28.234708786010742, "global_step": 642777, "epoch": 7744} {"train_loss": -28.496051788330078, "global_step": 642778, "epoch": 7744} {"train_loss": -28.568811416625977, "global_step": 642779, "epoch": 7744} {"train_loss": -28.36669921875, "global_step": 642780, "epoch": 7744} {"train_loss": -28.252185821533203, "global_step": 642781, "epoch": 7744} {"train_loss": -28.24077796936035, "global_step": 642782, "epoch": 7744} {"train_loss": -28.63861656188965, "global_step": 642783, "epoch": 7744} {"train_loss": -28.61818504333496, "global_step": 642784, "epoch": 7744} {"train_loss": -28.19623374938965, "global_step": 642785, "epoch": 7744} {"train_loss": -28.264495849609375, "global_step": 642786, "epoch": 7744} {"train_loss": -28.635833740234375, "global_step": 642787, "epoch": 7744} {"train_loss": -28.49525260925293, "global_step": 642788, "epoch": 7744} {"train_loss": -28.33820915222168, "global_step": 642789, "epoch": 7744} {"train_loss": -28.38449478149414, "global_step": 642790, "epoch": 7744} {"train_loss": -28.27495765686035, "global_step": 642791, "epoch": 7744} {"train_loss": -28.123376846313477, "global_step": 642792, "epoch": 7744} {"train_loss": -28.4628963470459, "global_step": 642793, "epoch": 7744} {"train_loss": -28.48354148864746, "global_step": 642794, "epoch": 7744} {"train_loss": -28.745441436767578, "global_step": 642795, "epoch": 7744} {"train_loss": -28.427122116088867, "global_step": 642796, "epoch": 7744} {"train_loss": -28.747589111328125, "global_step": 642797, "epoch": 7744} {"train_loss": -28.40970230102539, "global_step": 642798, "epoch": 7744} {"train_loss": -28.117956161499023, "global_step": 642799, "epoch": 7744} {"train_loss": -28.928152084350586, "global_step": 642800, "epoch": 7744} {"train_loss": -28.563098907470703, "global_step": 642801, "epoch": 7744} {"train_loss": -28.11573600769043, "global_step": 642802, "epoch": 7744} {"train_loss": -28.419931411743164, "global_step": 642803, "epoch": 7744} {"train_loss": -28.00298500061035, "global_step": 642804, "epoch": 7744} {"train_loss": -28.273117065429688, "global_step": 642805, "epoch": 7744} {"train_loss": -27.965961456298828, "global_step": 642806, "epoch": 7744} {"train_loss": -28.148162841796875, "global_step": 642807, "epoch": 7744} {"train_loss": -28.331995010375977, "global_step": 642808, "epoch": 7744} {"train_loss": -27.839282989501953, "global_step": 642809, "epoch": 7744} {"train_loss": -27.643285751342773, "global_step": 642810, "epoch": 7744} {"train_loss": -26.695770263671875, "global_step": 642811, "epoch": 7744} {"train_loss": -27.067737579345703, "global_step": 642812, "epoch": 7744} {"train_loss": -27.776172637939453, "global_step": 642813, "epoch": 7744} {"train_loss": -27.6104736328125, "global_step": 642814, "epoch": 7744} {"train_loss": -27.466901779174805, "global_step": 642815, "epoch": 7744} {"train_loss": -27.833606719970703, "global_step": 642816, "epoch": 7744} {"train_loss": -28.21773338317871, "global_step": 642817, "epoch": 7744} {"train_loss": -28.195226669311523, "global_step": 642818, "epoch": 7744} {"train_loss": -27.88330078125, "global_step": 642819, "epoch": 7744} {"train_loss": -28.427417755126953, "global_step": 642820, "epoch": 7744} {"train_loss": -28.072589874267578, "global_step": 642821, "epoch": 7744} {"train_loss": -27.978010177612305, "global_step": 642822, "epoch": 7744} {"train_loss": -28.671268463134766, "global_step": 642823, "epoch": 7744} {"train_loss": -28.026952743530273, "global_step": 642824, "epoch": 7744} {"train_loss": -28.57147216796875, "global_step": 642825, "epoch": 7744} {"train_loss": -28.05328369140625, "global_step": 642826, "epoch": 7744} {"train_loss": -28.39301872253418, "global_step": 642827, "epoch": 7744} {"train_loss": -28.328577041625977, "global_step": 642828, "epoch": 7744} {"train_loss": -28.2664852142334, "global_step": 642829, "epoch": 7744} {"train_loss": -28.08967399597168, "global_step": 642830, "epoch": 7744} {"train_loss": -27.96135902404785, "global_step": 642831, "epoch": 7744} {"train_loss": -28.65296745300293, "global_step": 642832, "epoch": 7744} {"train_loss": -28.527252197265625, "global_step": 642833, "epoch": 7744} {"train_loss": -28.13257369075913, "global_step": 642834, "epoch": 7744, "val_loss": 6685747.0} {"train_loss": -28.128820419311523, "global_step": 642835, "epoch": 7745} {"train_loss": -27.622968673706055, "global_step": 642836, "epoch": 7745} {"train_loss": -27.5126895904541, "global_step": 642837, "epoch": 7745} {"train_loss": -27.284748077392578, "global_step": 642838, "epoch": 7745} {"train_loss": -28.122528076171875, "global_step": 642839, "epoch": 7745} {"train_loss": -27.249725341796875, "global_step": 642840, "epoch": 7745} {"train_loss": -27.2047119140625, "global_step": 642841, "epoch": 7745} {"train_loss": -27.28375816345215, "global_step": 642842, "epoch": 7745} {"train_loss": -27.4915828704834, "global_step": 642843, "epoch": 7745} {"train_loss": -27.000944137573242, "global_step": 642844, "epoch": 7745} {"train_loss": -27.83757972717285, "global_step": 642845, "epoch": 7745} {"train_loss": -27.7510986328125, "global_step": 642846, "epoch": 7745} {"train_loss": -27.72420310974121, "global_step": 642847, "epoch": 7745} {"train_loss": -27.377883911132812, "global_step": 642848, "epoch": 7745} {"train_loss": -27.498794555664062, "global_step": 642849, "epoch": 7745} {"train_loss": -27.97260093688965, "global_step": 642850, "epoch": 7745} {"train_loss": -27.687902450561523, "global_step": 642851, "epoch": 7745} {"train_loss": -28.03537940979004, "global_step": 642852, "epoch": 7745} {"train_loss": -27.967899322509766, "global_step": 642853, "epoch": 7745} {"train_loss": -27.587696075439453, "global_step": 642854, "epoch": 7745} {"train_loss": -27.958297729492188, "global_step": 642855, "epoch": 7745} {"train_loss": -27.66274070739746, "global_step": 642856, "epoch": 7745} {"train_loss": -27.979211807250977, "global_step": 642857, "epoch": 7745} {"train_loss": -28.392972946166992, "global_step": 642858, "epoch": 7745} {"train_loss": -28.002737045288086, "global_step": 642859, "epoch": 7745} {"train_loss": -28.25794792175293, "global_step": 642860, "epoch": 7745} {"train_loss": -28.282072067260742, "global_step": 642861, "epoch": 7745} {"train_loss": -27.843286514282227, "global_step": 642862, "epoch": 7745} {"train_loss": -28.088733673095703, "global_step": 642863, "epoch": 7745} {"train_loss": -28.186969757080078, "global_step": 642864, "epoch": 7745} {"train_loss": -28.0915584564209, "global_step": 642865, "epoch": 7745} {"train_loss": -28.349653244018555, "global_step": 642866, "epoch": 7745} {"train_loss": -28.3836669921875, "global_step": 642867, "epoch": 7745} {"train_loss": -28.266321182250977, "global_step": 642868, "epoch": 7745} {"train_loss": -28.56668472290039, "global_step": 642869, "epoch": 7745} {"train_loss": -27.871906280517578, "global_step": 642870, "epoch": 7745} {"train_loss": -28.38081932067871, "global_step": 642871, "epoch": 7745} {"train_loss": -28.375274658203125, "global_step": 642872, "epoch": 7745} {"train_loss": -28.439178466796875, "global_step": 642873, "epoch": 7745} {"train_loss": -28.186267852783203, "global_step": 642874, "epoch": 7745} {"train_loss": -28.53616714477539, "global_step": 642875, "epoch": 7745} {"train_loss": -28.30438804626465, "global_step": 642876, "epoch": 7745} {"train_loss": -28.26112937927246, "global_step": 642877, "epoch": 7745} {"train_loss": -28.123987197875977, "global_step": 642878, "epoch": 7745} {"train_loss": -28.425006866455078, "global_step": 642879, "epoch": 7745} {"train_loss": -28.624958038330078, "global_step": 642880, "epoch": 7745} {"train_loss": -28.561277389526367, "global_step": 642881, "epoch": 7745} {"train_loss": -28.359577178955078, "global_step": 642882, "epoch": 7745} {"train_loss": -28.841527938842773, "global_step": 642883, "epoch": 7745} {"train_loss": -28.324756622314453, "global_step": 642884, "epoch": 7745} {"train_loss": -28.245458602905273, "global_step": 642885, "epoch": 7745} {"train_loss": -28.42549705505371, "global_step": 642886, "epoch": 7745} {"train_loss": -28.282934188842773, "global_step": 642887, "epoch": 7745} {"train_loss": -28.218353271484375, "global_step": 642888, "epoch": 7745} {"train_loss": -28.652786254882812, "global_step": 642889, "epoch": 7745} {"train_loss": -28.11240577697754, "global_step": 642890, "epoch": 7745} {"train_loss": -28.252668380737305, "global_step": 642891, "epoch": 7745} {"train_loss": -28.291671752929688, "global_step": 642892, "epoch": 7745} {"train_loss": -27.788434982299805, "global_step": 642893, "epoch": 7745} {"train_loss": -27.9981746673584, "global_step": 642894, "epoch": 7745} {"train_loss": -27.950702667236328, "global_step": 642895, "epoch": 7745} {"train_loss": -28.093536376953125, "global_step": 642896, "epoch": 7745} {"train_loss": -27.724292755126953, "global_step": 642897, "epoch": 7745} {"train_loss": -28.3174991607666, "global_step": 642898, "epoch": 7745} {"train_loss": -28.501256942749023, "global_step": 642899, "epoch": 7745} {"train_loss": -28.333654403686523, "global_step": 642900, "epoch": 7745} {"train_loss": -28.31426429748535, "global_step": 642901, "epoch": 7745} {"train_loss": -28.238037109375, "global_step": 642902, "epoch": 7745} {"train_loss": -28.467329025268555, "global_step": 642903, "epoch": 7745} {"train_loss": -28.13654136657715, "global_step": 642904, "epoch": 7745} {"train_loss": -28.10223960876465, "global_step": 642905, "epoch": 7745} {"train_loss": -27.932104110717773, "global_step": 642906, "epoch": 7745} {"train_loss": -28.314794540405273, "global_step": 642907, "epoch": 7745} {"train_loss": -28.409399032592773, "global_step": 642908, "epoch": 7745} {"train_loss": -28.314661026000977, "global_step": 642909, "epoch": 7745} {"train_loss": -28.336206436157227, "global_step": 642910, "epoch": 7745} {"train_loss": -28.272680282592773, "global_step": 642911, "epoch": 7745} {"train_loss": -27.868337631225586, "global_step": 642912, "epoch": 7745} {"train_loss": -27.956729888916016, "global_step": 642913, "epoch": 7745} {"train_loss": -27.60711669921875, "global_step": 642914, "epoch": 7745} {"train_loss": -28.00762939453125, "global_step": 642915, "epoch": 7745} {"train_loss": -27.790197372436523, "global_step": 642916, "epoch": 7745} {"train_loss": -28.09073802074754, "global_step": 642917, "epoch": 7745, "val_loss": 6682629.0} {"train_loss": -26.46059226989746, "global_step": 642918, "epoch": 7746} {"train_loss": -25.15728187561035, "global_step": 642919, "epoch": 7746} {"train_loss": -27.572967529296875, "global_step": 642920, "epoch": 7746} {"train_loss": -26.4073429107666, "global_step": 642921, "epoch": 7746} {"train_loss": -25.9857120513916, "global_step": 642922, "epoch": 7746} {"train_loss": -27.437274932861328, "global_step": 642923, "epoch": 7746} {"train_loss": -26.5141658782959, "global_step": 642924, "epoch": 7746} {"train_loss": -27.473535537719727, "global_step": 642925, "epoch": 7746} {"train_loss": -26.80767250061035, "global_step": 642926, "epoch": 7746} {"train_loss": -27.505456924438477, "global_step": 642927, "epoch": 7746} {"train_loss": -26.97846031188965, "global_step": 642928, "epoch": 7746} {"train_loss": -27.291406631469727, "global_step": 642929, "epoch": 7746} {"train_loss": -27.42327308654785, "global_step": 642930, "epoch": 7746} {"train_loss": -27.41766357421875, "global_step": 642931, "epoch": 7746} {"train_loss": -27.2850341796875, "global_step": 642932, "epoch": 7746} {"train_loss": -27.752859115600586, "global_step": 642933, "epoch": 7746} {"train_loss": -27.432851791381836, "global_step": 642934, "epoch": 7746} {"train_loss": -27.837543487548828, "global_step": 642935, "epoch": 7746} {"train_loss": -27.417510986328125, "global_step": 642936, "epoch": 7746} {"train_loss": -27.721174240112305, "global_step": 642937, "epoch": 7746} {"train_loss": -27.510028839111328, "global_step": 642938, "epoch": 7746} {"train_loss": -27.724531173706055, "global_step": 642939, "epoch": 7746} {"train_loss": -28.0164737701416, "global_step": 642940, "epoch": 7746} {"train_loss": -27.749597549438477, "global_step": 642941, "epoch": 7746} {"train_loss": -27.780553817749023, "global_step": 642942, "epoch": 7746} {"train_loss": -27.641315460205078, "global_step": 642943, "epoch": 7746} {"train_loss": -27.82330322265625, "global_step": 642944, "epoch": 7746} {"train_loss": -28.082721710205078, "global_step": 642945, "epoch": 7746} {"train_loss": -27.94660758972168, "global_step": 642946, "epoch": 7746} {"train_loss": -27.955556869506836, "global_step": 642947, "epoch": 7746} {"train_loss": -28.033018112182617, "global_step": 642948, "epoch": 7746} {"train_loss": -27.996549606323242, "global_step": 642949, "epoch": 7746} {"train_loss": -27.99863624572754, "global_step": 642950, "epoch": 7746} {"train_loss": -28.041431427001953, "global_step": 642951, "epoch": 7746} {"train_loss": -27.831119537353516, "global_step": 642952, "epoch": 7746} {"train_loss": -28.61233901977539, "global_step": 642953, "epoch": 7746} {"train_loss": -28.381139755249023, "global_step": 642954, "epoch": 7746} {"train_loss": -27.800338745117188, "global_step": 642955, "epoch": 7746} {"train_loss": -28.474218368530273, "global_step": 642956, "epoch": 7746} {"train_loss": -28.1732234954834, "global_step": 642957, "epoch": 7746} {"train_loss": -28.143207550048828, "global_step": 642958, "epoch": 7746} {"train_loss": -28.481679916381836, "global_step": 642959, "epoch": 7746} {"train_loss": -28.253538131713867, "global_step": 642960, "epoch": 7746} {"train_loss": -28.234970092773438, "global_step": 642961, "epoch": 7746} {"train_loss": -28.455747604370117, "global_step": 642962, "epoch": 7746} {"train_loss": -28.105758666992188, "global_step": 642963, "epoch": 7746} {"train_loss": -28.485883712768555, "global_step": 642964, "epoch": 7746} {"train_loss": -28.186786651611328, "global_step": 642965, "epoch": 7746} {"train_loss": -28.22919273376465, "global_step": 642966, "epoch": 7746} {"train_loss": -28.27436637878418, "global_step": 642967, "epoch": 7746} {"train_loss": -28.313446044921875, "global_step": 642968, "epoch": 7746} {"train_loss": -28.476821899414062, "global_step": 642969, "epoch": 7746} {"train_loss": -28.32710075378418, "global_step": 642970, "epoch": 7746} {"train_loss": -28.312524795532227, "global_step": 642971, "epoch": 7746} {"train_loss": -28.379674911499023, "global_step": 642972, "epoch": 7746} {"train_loss": -28.381103515625, "global_step": 642973, "epoch": 7746} {"train_loss": -28.2503604888916, "global_step": 642974, "epoch": 7746} {"train_loss": -28.385629653930664, "global_step": 642975, "epoch": 7746} {"train_loss": -28.404752731323242, "global_step": 642976, "epoch": 7746} {"train_loss": -28.089893341064453, "global_step": 642977, "epoch": 7746} {"train_loss": -28.5302677154541, "global_step": 642978, "epoch": 7746} {"train_loss": -28.15085220336914, "global_step": 642979, "epoch": 7746} {"train_loss": -28.280059814453125, "global_step": 642980, "epoch": 7746} {"train_loss": -28.160680770874023, "global_step": 642981, "epoch": 7746} {"train_loss": -28.242231369018555, "global_step": 642982, "epoch": 7746} {"train_loss": -28.508380889892578, "global_step": 642983, "epoch": 7746} {"train_loss": -28.07671546936035, "global_step": 642984, "epoch": 7746} {"train_loss": -28.236169815063477, "global_step": 642985, "epoch": 7746} {"train_loss": -27.86223793029785, "global_step": 642986, "epoch": 7746} {"train_loss": -28.129003524780273, "global_step": 642987, "epoch": 7746} {"train_loss": -27.9000186920166, "global_step": 642988, "epoch": 7746} {"train_loss": -28.53145408630371, "global_step": 642989, "epoch": 7746} {"train_loss": -28.308130264282227, "global_step": 642990, "epoch": 7746} {"train_loss": -28.591238021850586, "global_step": 642991, "epoch": 7746} {"train_loss": -28.22157096862793, "global_step": 642992, "epoch": 7746} {"train_loss": -28.184247970581055, "global_step": 642993, "epoch": 7746} {"train_loss": -28.19622802734375, "global_step": 642994, "epoch": 7746} {"train_loss": -28.193639755249023, "global_step": 642995, "epoch": 7746} {"train_loss": -28.195098876953125, "global_step": 642996, "epoch": 7746} {"train_loss": -28.31709098815918, "global_step": 642997, "epoch": 7746} {"train_loss": -28.56971549987793, "global_step": 642998, "epoch": 7746} {"train_loss": -27.930328369140625, "global_step": 642999, "epoch": 7746} {"train_loss": -27.915104923478093, "global_step": 643000, "epoch": 7746, "val_loss": 6698087.5} {"train_loss": -27.653507232666016, "global_step": 643001, "epoch": 7747} {"train_loss": -27.339040756225586, "global_step": 643002, "epoch": 7747} {"train_loss": -27.796894073486328, "global_step": 643003, "epoch": 7747} {"train_loss": -27.50823974609375, "global_step": 643004, "epoch": 7747} {"train_loss": -27.554861068725586, "global_step": 643005, "epoch": 7747} {"train_loss": -27.73358154296875, "global_step": 643006, "epoch": 7747} {"train_loss": -27.789106369018555, "global_step": 643007, "epoch": 7747} {"train_loss": -27.99604606628418, "global_step": 643008, "epoch": 7747} {"train_loss": -28.4478759765625, "global_step": 643009, "epoch": 7747} {"train_loss": -27.50429344177246, "global_step": 643010, "epoch": 7747} {"train_loss": -28.003015518188477, "global_step": 643011, "epoch": 7747} {"train_loss": -27.16103172302246, "global_step": 643012, "epoch": 7747} {"train_loss": -28.37411880493164, "global_step": 643013, "epoch": 7747} {"train_loss": -27.780515670776367, "global_step": 643014, "epoch": 7747} {"train_loss": -27.75629234313965, "global_step": 643015, "epoch": 7747} {"train_loss": -27.808765411376953, "global_step": 643016, "epoch": 7747} {"train_loss": -27.749731063842773, "global_step": 643017, "epoch": 7747} {"train_loss": -28.242807388305664, "global_step": 643018, "epoch": 7747} {"train_loss": -27.950788497924805, "global_step": 643019, "epoch": 7747} {"train_loss": -27.896595001220703, "global_step": 643020, "epoch": 7747} {"train_loss": -27.939044952392578, "global_step": 643021, "epoch": 7747} {"train_loss": -28.083026885986328, "global_step": 643022, "epoch": 7747} {"train_loss": -27.819232940673828, "global_step": 643023, "epoch": 7747} {"train_loss": -28.08843994140625, "global_step": 643024, "epoch": 7747} {"train_loss": -27.915515899658203, "global_step": 643025, "epoch": 7747} {"train_loss": -28.04155921936035, "global_step": 643026, "epoch": 7747} {"train_loss": -28.157270431518555, "global_step": 643027, "epoch": 7747} {"train_loss": -28.260107040405273, "global_step": 643028, "epoch": 7747} {"train_loss": -28.570194244384766, "global_step": 643029, "epoch": 7747} {"train_loss": -28.11298942565918, "global_step": 643030, "epoch": 7747} {"train_loss": -28.145105361938477, "global_step": 643031, "epoch": 7747} {"train_loss": -28.0076847076416, "global_step": 643032, "epoch": 7747} {"train_loss": -28.236286163330078, "global_step": 643033, "epoch": 7747} {"train_loss": -28.139978408813477, "global_step": 643034, "epoch": 7747} {"train_loss": -28.726760864257812, "global_step": 643035, "epoch": 7747} {"train_loss": -28.240253448486328, "global_step": 643036, "epoch": 7747} {"train_loss": -28.325010299682617, "global_step": 643037, "epoch": 7747} {"train_loss": -28.49041175842285, "global_step": 643038, "epoch": 7747} {"train_loss": -28.360036849975586, "global_step": 643039, "epoch": 7747} {"train_loss": -28.264135360717773, "global_step": 643040, "epoch": 7747} {"train_loss": -28.45557975769043, "global_step": 643041, "epoch": 7747} {"train_loss": -28.27199363708496, "global_step": 643042, "epoch": 7747} {"train_loss": -28.370269775390625, "global_step": 643043, "epoch": 7747} {"train_loss": -28.344043731689453, "global_step": 643044, "epoch": 7747} {"train_loss": -28.512374877929688, "global_step": 643045, "epoch": 7747} {"train_loss": -28.13741111755371, "global_step": 643046, "epoch": 7747} {"train_loss": -28.46162986755371, "global_step": 643047, "epoch": 7747} {"train_loss": -28.286666870117188, "global_step": 643048, "epoch": 7747} {"train_loss": -28.307348251342773, "global_step": 643049, "epoch": 7747} {"train_loss": -28.271230697631836, "global_step": 643050, "epoch": 7747} {"train_loss": -28.2598819732666, "global_step": 643051, "epoch": 7747} {"train_loss": -28.224430084228516, "global_step": 643052, "epoch": 7747} {"train_loss": -28.293542861938477, "global_step": 643053, "epoch": 7747} {"train_loss": -28.524566650390625, "global_step": 643054, "epoch": 7747} {"train_loss": -28.31452751159668, "global_step": 643055, "epoch": 7747} {"train_loss": -28.32770347595215, "global_step": 643056, "epoch": 7747} {"train_loss": -28.309186935424805, "global_step": 643057, "epoch": 7747} {"train_loss": -28.451261520385742, "global_step": 643058, "epoch": 7747} {"train_loss": -28.438251495361328, "global_step": 643059, "epoch": 7747} {"train_loss": -28.108081817626953, "global_step": 643060, "epoch": 7747} {"train_loss": -27.975784301757812, "global_step": 643061, "epoch": 7747} {"train_loss": -28.187108993530273, "global_step": 643062, "epoch": 7747} {"train_loss": -28.918848037719727, "global_step": 643063, "epoch": 7747} {"train_loss": -28.545135498046875, "global_step": 643064, "epoch": 7747} {"train_loss": -28.402362823486328, "global_step": 643065, "epoch": 7747} {"train_loss": -28.644933700561523, "global_step": 643066, "epoch": 7747} {"train_loss": -28.438892364501953, "global_step": 643067, "epoch": 7747} {"train_loss": -28.550073623657227, "global_step": 643068, "epoch": 7747} {"train_loss": -28.344602584838867, "global_step": 643069, "epoch": 7747} {"train_loss": -28.0627498626709, "global_step": 643070, "epoch": 7747} {"train_loss": -28.16483497619629, "global_step": 643071, "epoch": 7747} {"train_loss": -28.624494552612305, "global_step": 643072, "epoch": 7747} {"train_loss": -27.963403701782227, "global_step": 643073, "epoch": 7747} {"train_loss": -28.31483268737793, "global_step": 643074, "epoch": 7747} {"train_loss": -28.440954208374023, "global_step": 643075, "epoch": 7747} {"train_loss": -28.129846572875977, "global_step": 643076, "epoch": 7747} {"train_loss": -27.862150192260742, "global_step": 643077, "epoch": 7747} {"train_loss": -28.318790435791016, "global_step": 643078, "epoch": 7747} {"train_loss": -28.611026763916016, "global_step": 643079, "epoch": 7747} {"train_loss": -28.594995498657227, "global_step": 643080, "epoch": 7747} {"train_loss": -28.330921173095703, "global_step": 643081, "epoch": 7747} {"train_loss": -28.243133544921875, "global_step": 643082, "epoch": 7747} {"train_loss": -28.172028920736658, "global_step": 643083, "epoch": 7747, "val_loss": 6656874.0} {"train_loss": -27.382553100585938, "global_step": 643084, "epoch": 7748} {"train_loss": -26.269262313842773, "global_step": 643085, "epoch": 7748} {"train_loss": -27.485937118530273, "global_step": 643086, "epoch": 7748} {"train_loss": -27.867633819580078, "global_step": 643087, "epoch": 7748} {"train_loss": -27.385889053344727, "global_step": 643088, "epoch": 7748} {"train_loss": -26.89407730102539, "global_step": 643089, "epoch": 7748} {"train_loss": -27.204883575439453, "global_step": 643090, "epoch": 7748} {"train_loss": -27.61614990234375, "global_step": 643091, "epoch": 7748} {"train_loss": -27.202829360961914, "global_step": 643092, "epoch": 7748} {"train_loss": -27.64191246032715, "global_step": 643093, "epoch": 7748} {"train_loss": -27.679800033569336, "global_step": 643094, "epoch": 7748} {"train_loss": -27.6937255859375, "global_step": 643095, "epoch": 7748} {"train_loss": -27.60810661315918, "global_step": 643096, "epoch": 7748} {"train_loss": -27.70987319946289, "global_step": 643097, "epoch": 7748} {"train_loss": -28.215360641479492, "global_step": 643098, "epoch": 7748} {"train_loss": -27.992938995361328, "global_step": 643099, "epoch": 7748} {"train_loss": -27.98333168029785, "global_step": 643100, "epoch": 7748} {"train_loss": -27.86182975769043, "global_step": 643101, "epoch": 7748} {"train_loss": -27.928674697875977, "global_step": 643102, "epoch": 7748} {"train_loss": -27.972070693969727, "global_step": 643103, "epoch": 7748} {"train_loss": -28.000579833984375, "global_step": 643104, "epoch": 7748} {"train_loss": -28.1495304107666, "global_step": 643105, "epoch": 7748} {"train_loss": -27.999317169189453, "global_step": 643106, "epoch": 7748} {"train_loss": -28.00037956237793, "global_step": 643107, "epoch": 7748} {"train_loss": -27.653411865234375, "global_step": 643108, "epoch": 7748} {"train_loss": -28.251142501831055, "global_step": 643109, "epoch": 7748} {"train_loss": -28.28632926940918, "global_step": 643110, "epoch": 7748} {"train_loss": -28.4069881439209, "global_step": 643111, "epoch": 7748} {"train_loss": -27.916229248046875, "global_step": 643112, "epoch": 7748} {"train_loss": -27.90406608581543, "global_step": 643113, "epoch": 7748} {"train_loss": -28.085281372070312, "global_step": 643114, "epoch": 7748} {"train_loss": -28.23617935180664, "global_step": 643115, "epoch": 7748} {"train_loss": -28.13189125061035, "global_step": 643116, "epoch": 7748} {"train_loss": -28.147130966186523, "global_step": 643117, "epoch": 7748} {"train_loss": -27.95570182800293, "global_step": 643118, "epoch": 7748} {"train_loss": -28.254302978515625, "global_step": 643119, "epoch": 7748} {"train_loss": -28.17017936706543, "global_step": 643120, "epoch": 7748} {"train_loss": -28.262836456298828, "global_step": 643121, "epoch": 7748} {"train_loss": -28.256561279296875, "global_step": 643122, "epoch": 7748} {"train_loss": -28.39474868774414, "global_step": 643123, "epoch": 7748} {"train_loss": -28.456836700439453, "global_step": 643124, "epoch": 7748} {"train_loss": -28.331745147705078, "global_step": 643125, "epoch": 7748} {"train_loss": -28.564050674438477, "global_step": 643126, "epoch": 7748} {"train_loss": -28.2197322845459, "global_step": 643127, "epoch": 7748} {"train_loss": -28.440603256225586, "global_step": 643128, "epoch": 7748} {"train_loss": -28.105932235717773, "global_step": 643129, "epoch": 7748} {"train_loss": -28.377593994140625, "global_step": 643130, "epoch": 7748} {"train_loss": -28.27906608581543, "global_step": 643131, "epoch": 7748} {"train_loss": -28.388671875, "global_step": 643132, "epoch": 7748} {"train_loss": -28.285505294799805, "global_step": 643133, "epoch": 7748} {"train_loss": -28.236373901367188, "global_step": 643134, "epoch": 7748} {"train_loss": -28.719358444213867, "global_step": 643135, "epoch": 7748} {"train_loss": -28.2951717376709, "global_step": 643136, "epoch": 7748} {"train_loss": -28.417749404907227, "global_step": 643137, "epoch": 7748} {"train_loss": -28.31744384765625, "global_step": 643138, "epoch": 7748} {"train_loss": -28.419357299804688, "global_step": 643139, "epoch": 7748} {"train_loss": -28.5087890625, "global_step": 643140, "epoch": 7748} {"train_loss": -28.579076766967773, "global_step": 643141, "epoch": 7748} {"train_loss": -28.601825714111328, "global_step": 643142, "epoch": 7748} {"train_loss": -28.354589462280273, "global_step": 643143, "epoch": 7748} {"train_loss": -28.260028839111328, "global_step": 643144, "epoch": 7748} {"train_loss": -28.247806549072266, "global_step": 643145, "epoch": 7748} {"train_loss": -28.377044677734375, "global_step": 643146, "epoch": 7748} {"train_loss": -28.322906494140625, "global_step": 643147, "epoch": 7748} {"train_loss": -28.106830596923828, "global_step": 643148, "epoch": 7748} {"train_loss": -28.2367000579834, "global_step": 643149, "epoch": 7748} {"train_loss": -28.41162109375, "global_step": 643150, "epoch": 7748} {"train_loss": -27.77374839782715, "global_step": 643151, "epoch": 7748} {"train_loss": -28.083816528320312, "global_step": 643152, "epoch": 7748} {"train_loss": -29.012907028198242, "global_step": 643153, "epoch": 7748} {"train_loss": -28.519962310791016, "global_step": 643154, "epoch": 7748} {"train_loss": -28.47968864440918, "global_step": 643155, "epoch": 7748} {"train_loss": -28.1494083404541, "global_step": 643156, "epoch": 7748} {"train_loss": -28.068872451782227, "global_step": 643157, "epoch": 7748} {"train_loss": -28.289758682250977, "global_step": 643158, "epoch": 7748} {"train_loss": -28.26802635192871, "global_step": 643159, "epoch": 7748} {"train_loss": -28.3920955657959, "global_step": 643160, "epoch": 7748} {"train_loss": -28.264570236206055, "global_step": 643161, "epoch": 7748} {"train_loss": -28.503076553344727, "global_step": 643162, "epoch": 7748} {"train_loss": -28.058691024780273, "global_step": 643163, "epoch": 7748} {"train_loss": -28.447919845581055, "global_step": 643164, "epoch": 7748} {"train_loss": -27.829833984375, "global_step": 643165, "epoch": 7748} {"train_loss": -28.09291860281703, "global_step": 643166, "epoch": 7748, "val_loss": 6735801.0} {"train_loss": -27.506261825561523, "global_step": 643167, "epoch": 7749} {"train_loss": -27.51682472229004, "global_step": 643168, "epoch": 7749} {"train_loss": -27.80855369567871, "global_step": 643169, "epoch": 7749} {"train_loss": -27.29547691345215, "global_step": 643170, "epoch": 7749} {"train_loss": -27.72318458557129, "global_step": 643171, "epoch": 7749} {"train_loss": -27.420007705688477, "global_step": 643172, "epoch": 7749} {"train_loss": -27.89790916442871, "global_step": 643173, "epoch": 7749} {"train_loss": -27.722890853881836, "global_step": 643174, "epoch": 7749} {"train_loss": -27.535058975219727, "global_step": 643175, "epoch": 7749} {"train_loss": -27.8874568939209, "global_step": 643176, "epoch": 7749} {"train_loss": -28.056299209594727, "global_step": 643177, "epoch": 7749} {"train_loss": -27.716299057006836, "global_step": 643178, "epoch": 7749} {"train_loss": -27.813146591186523, "global_step": 643179, "epoch": 7749} {"train_loss": -28.1138858795166, "global_step": 643180, "epoch": 7749} {"train_loss": -27.737136840820312, "global_step": 643181, "epoch": 7749} {"train_loss": -27.70171546936035, "global_step": 643182, "epoch": 7749} {"train_loss": -27.648813247680664, "global_step": 643183, "epoch": 7749} {"train_loss": -27.81886100769043, "global_step": 643184, "epoch": 7749} {"train_loss": -27.994897842407227, "global_step": 643185, "epoch": 7749} {"train_loss": -28.106576919555664, "global_step": 643186, "epoch": 7749} {"train_loss": -27.913000106811523, "global_step": 643187, "epoch": 7749} {"train_loss": -28.13043785095215, "global_step": 643188, "epoch": 7749} {"train_loss": -27.880125045776367, "global_step": 643189, "epoch": 7749} {"train_loss": -28.059070587158203, "global_step": 643190, "epoch": 7749} {"train_loss": -28.04306411743164, "global_step": 643191, "epoch": 7749} {"train_loss": -28.178720474243164, "global_step": 643192, "epoch": 7749} {"train_loss": -27.822248458862305, "global_step": 643193, "epoch": 7749} {"train_loss": -28.49836540222168, "global_step": 643194, "epoch": 7749} {"train_loss": -28.293058395385742, "global_step": 643195, "epoch": 7749} {"train_loss": -27.94122314453125, "global_step": 643196, "epoch": 7749} {"train_loss": -28.02484130859375, "global_step": 643197, "epoch": 7749} {"train_loss": -28.147329330444336, "global_step": 643198, "epoch": 7749} {"train_loss": -28.06385612487793, "global_step": 643199, "epoch": 7749} {"train_loss": -27.385568618774414, "global_step": 643200, "epoch": 7749} {"train_loss": -27.30804443359375, "global_step": 643201, "epoch": 7749} {"train_loss": -27.396596908569336, "global_step": 643202, "epoch": 7749} {"train_loss": -28.331253051757812, "global_step": 643203, "epoch": 7749} {"train_loss": -27.67420768737793, "global_step": 643204, "epoch": 7749} {"train_loss": -27.0797061920166, "global_step": 643205, "epoch": 7749} {"train_loss": -28.002038955688477, "global_step": 643206, "epoch": 7749} {"train_loss": -28.0533504486084, "global_step": 643207, "epoch": 7749} {"train_loss": -28.196317672729492, "global_step": 643208, "epoch": 7749} {"train_loss": -27.8472843170166, "global_step": 643209, "epoch": 7749} {"train_loss": -28.224340438842773, "global_step": 643210, "epoch": 7749} {"train_loss": -27.78814125061035, "global_step": 643211, "epoch": 7749} {"train_loss": -28.14957046508789, "global_step": 643212, "epoch": 7749} {"train_loss": -27.779605865478516, "global_step": 643213, "epoch": 7749} {"train_loss": -28.603561401367188, "global_step": 643214, "epoch": 7749} {"train_loss": -28.410385131835938, "global_step": 643215, "epoch": 7749} {"train_loss": -28.273523330688477, "global_step": 643216, "epoch": 7749} {"train_loss": -27.940540313720703, "global_step": 643217, "epoch": 7749} {"train_loss": -28.335830688476562, "global_step": 643218, "epoch": 7749} {"train_loss": -28.150836944580078, "global_step": 643219, "epoch": 7749} {"train_loss": -28.19577407836914, "global_step": 643220, "epoch": 7749} {"train_loss": -28.030746459960938, "global_step": 643221, "epoch": 7749} {"train_loss": -28.14385986328125, "global_step": 643222, "epoch": 7749} {"train_loss": -28.181371688842773, "global_step": 643223, "epoch": 7749} {"train_loss": -28.502731323242188, "global_step": 643224, "epoch": 7749} {"train_loss": -28.404483795166016, "global_step": 643225, "epoch": 7749} {"train_loss": -28.26740837097168, "global_step": 643226, "epoch": 7749} {"train_loss": -28.027265548706055, "global_step": 643227, "epoch": 7749} {"train_loss": -28.442792892456055, "global_step": 643228, "epoch": 7749} {"train_loss": -28.30305290222168, "global_step": 643229, "epoch": 7749} {"train_loss": -28.59726905822754, "global_step": 643230, "epoch": 7749} {"train_loss": -28.29328727722168, "global_step": 643231, "epoch": 7749} {"train_loss": -28.281492233276367, "global_step": 643232, "epoch": 7749} {"train_loss": -28.05756187438965, "global_step": 643233, "epoch": 7749} {"train_loss": -28.461729049682617, "global_step": 643234, "epoch": 7749} {"train_loss": -28.411535263061523, "global_step": 643235, "epoch": 7749} {"train_loss": -28.573339462280273, "global_step": 643236, "epoch": 7749} {"train_loss": -28.5042724609375, "global_step": 643237, "epoch": 7749} {"train_loss": -28.037933349609375, "global_step": 643238, "epoch": 7749} {"train_loss": -27.837574005126953, "global_step": 643239, "epoch": 7749} {"train_loss": -27.757431030273438, "global_step": 643240, "epoch": 7749} {"train_loss": -27.727060317993164, "global_step": 643241, "epoch": 7749} {"train_loss": -27.9287166595459, "global_step": 643242, "epoch": 7749} {"train_loss": -28.148578643798828, "global_step": 643243, "epoch": 7749} {"train_loss": -28.49726676940918, "global_step": 643244, "epoch": 7749} {"train_loss": -28.22894287109375, "global_step": 643245, "epoch": 7749} {"train_loss": -28.261693954467773, "global_step": 643246, "epoch": 7749} {"train_loss": -28.187519073486328, "global_step": 643247, "epoch": 7749} {"train_loss": -28.391864776611328, "global_step": 643248, "epoch": 7749} {"train_loss": -28.024014944053558, "global_step": 643249, "epoch": 7749, "val_loss": 6697189.0} {"train_loss": -27.833423614501953, "global_step": 643250, "epoch": 7750} {"train_loss": -28.133041381835938, "global_step": 643251, "epoch": 7750} {"train_loss": -27.80063247680664, "global_step": 643252, "epoch": 7750} {"train_loss": -27.98491859436035, "global_step": 643253, "epoch": 7750} {"train_loss": -28.11884880065918, "global_step": 643254, "epoch": 7750} {"train_loss": -28.407785415649414, "global_step": 643255, "epoch": 7750} {"train_loss": -27.904071807861328, "global_step": 643256, "epoch": 7750} {"train_loss": -27.752607345581055, "global_step": 643257, "epoch": 7750} {"train_loss": -28.124725341796875, "global_step": 643258, "epoch": 7750} {"train_loss": -28.126178741455078, "global_step": 643259, "epoch": 7750} {"train_loss": -28.042200088500977, "global_step": 643260, "epoch": 7750} {"train_loss": -27.864694595336914, "global_step": 643261, "epoch": 7750} {"train_loss": -28.03680419921875, "global_step": 643262, "epoch": 7750} {"train_loss": -28.066913604736328, "global_step": 643263, "epoch": 7750} {"train_loss": -27.84675407409668, "global_step": 643264, "epoch": 7750} {"train_loss": -27.793487548828125, "global_step": 643265, "epoch": 7750} {"train_loss": -27.859838485717773, "global_step": 643266, "epoch": 7750} {"train_loss": -28.047927856445312, "global_step": 643267, "epoch": 7750} {"train_loss": -28.385272979736328, "global_step": 643268, "epoch": 7750} {"train_loss": -27.968748092651367, "global_step": 643269, "epoch": 7750} {"train_loss": -28.284032821655273, "global_step": 643270, "epoch": 7750} {"train_loss": -28.36297607421875, "global_step": 643271, "epoch": 7750} {"train_loss": -28.1503849029541, "global_step": 643272, "epoch": 7750} {"train_loss": -28.137054443359375, "global_step": 643273, "epoch": 7750} {"train_loss": -28.28950309753418, "global_step": 643274, "epoch": 7750} {"train_loss": -28.01032829284668, "global_step": 643275, "epoch": 7750} {"train_loss": -28.558374404907227, "global_step": 643276, "epoch": 7750} {"train_loss": -28.16316032409668, "global_step": 643277, "epoch": 7750} {"train_loss": -28.36775016784668, "global_step": 643278, "epoch": 7750} {"train_loss": -27.9141845703125, "global_step": 643279, "epoch": 7750} {"train_loss": -27.392568588256836, "global_step": 643280, "epoch": 7750} {"train_loss": -27.308216094970703, "global_step": 643281, "epoch": 7750} {"train_loss": -28.170881271362305, "global_step": 643282, "epoch": 7750} {"train_loss": -28.434736251831055, "global_step": 643283, "epoch": 7750} {"train_loss": -28.272336959838867, "global_step": 643284, "epoch": 7750} {"train_loss": -28.05525779724121, "global_step": 643285, "epoch": 7750} {"train_loss": -28.125024795532227, "global_step": 643286, "epoch": 7750} {"train_loss": -28.40459632873535, "global_step": 643287, "epoch": 7750} {"train_loss": -29.049896240234375, "global_step": 643288, "epoch": 7750} {"train_loss": -28.27035903930664, "global_step": 643289, "epoch": 7750} {"train_loss": -28.660266876220703, "global_step": 643290, "epoch": 7750} {"train_loss": -28.297443389892578, "global_step": 643291, "epoch": 7750} {"train_loss": -28.61875343322754, "global_step": 643292, "epoch": 7750} {"train_loss": -28.400760650634766, "global_step": 643293, "epoch": 7750} {"train_loss": -28.34710693359375, "global_step": 643294, "epoch": 7750} {"train_loss": -28.6679744720459, "global_step": 643295, "epoch": 7750} {"train_loss": -28.226743698120117, "global_step": 643296, "epoch": 7750} {"train_loss": -28.711706161499023, "global_step": 643297, "epoch": 7750} {"train_loss": -28.5633487701416, "global_step": 643298, "epoch": 7750} {"train_loss": -28.433944702148438, "global_step": 643299, "epoch": 7750} {"train_loss": -28.3283634185791, "global_step": 643300, "epoch": 7750} {"train_loss": -28.1664981842041, "global_step": 643301, "epoch": 7750} {"train_loss": -28.408353805541992, "global_step": 643302, "epoch": 7750} {"train_loss": -28.361026763916016, "global_step": 643303, "epoch": 7750} {"train_loss": -28.616254806518555, "global_step": 643304, "epoch": 7750} {"train_loss": -28.290746688842773, "global_step": 643305, "epoch": 7750} {"train_loss": -28.474435806274414, "global_step": 643306, "epoch": 7750} {"train_loss": -27.9232120513916, "global_step": 643307, "epoch": 7750} {"train_loss": -28.27618408203125, "global_step": 643308, "epoch": 7750} {"train_loss": -28.122100830078125, "global_step": 643309, "epoch": 7750} {"train_loss": -28.14483070373535, "global_step": 643310, "epoch": 7750} {"train_loss": -28.23060417175293, "global_step": 643311, "epoch": 7750} {"train_loss": -28.21070671081543, "global_step": 643312, "epoch": 7750} {"train_loss": -28.2950496673584, "global_step": 643313, "epoch": 7750} {"train_loss": -28.1046142578125, "global_step": 643314, "epoch": 7750} {"train_loss": -28.370635986328125, "global_step": 643315, "epoch": 7750} {"train_loss": -28.41730308532715, "global_step": 643316, "epoch": 7750} {"train_loss": -27.978727340698242, "global_step": 643317, "epoch": 7750} {"train_loss": -27.66590690612793, "global_step": 643318, "epoch": 7750} {"train_loss": -27.177087783813477, "global_step": 643319, "epoch": 7750} {"train_loss": -26.27097511291504, "global_step": 643320, "epoch": 7750} {"train_loss": -26.407285690307617, "global_step": 643321, "epoch": 7750} {"train_loss": -28.12217140197754, "global_step": 643322, "epoch": 7750} {"train_loss": -27.7780818939209, "global_step": 643323, "epoch": 7750} {"train_loss": -27.708011627197266, "global_step": 643324, "epoch": 7750} {"train_loss": -28.208887100219727, "global_step": 643325, "epoch": 7750} {"train_loss": -27.962156295776367, "global_step": 643326, "epoch": 7750} {"train_loss": -28.1439266204834, "global_step": 643327, "epoch": 7750} {"train_loss": -27.980661392211914, "global_step": 643328, "epoch": 7750} {"train_loss": -28.280929565429688, "global_step": 643329, "epoch": 7750} {"train_loss": -27.509326934814453, "global_step": 643330, "epoch": 7750} {"train_loss": -28.31414794921875, "global_step": 643331, "epoch": 7750} {"train_loss": -28.115478262843855, "global_step": 643332, "epoch": 7750, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8181818181818182, "val_loss": 6622278.5} {"train_loss": -26.73579216003418, "global_step": 643333, "epoch": 7751} {"train_loss": -27.099029541015625, "global_step": 643334, "epoch": 7751} {"train_loss": -27.168134689331055, "global_step": 643335, "epoch": 7751} {"train_loss": -27.45403480529785, "global_step": 643336, "epoch": 7751} {"train_loss": -27.065093994140625, "global_step": 643337, "epoch": 7751} {"train_loss": -27.01703453063965, "global_step": 643338, "epoch": 7751} {"train_loss": -27.510623931884766, "global_step": 643339, "epoch": 7751} {"train_loss": -27.472244262695312, "global_step": 643340, "epoch": 7751} {"train_loss": -27.446805953979492, "global_step": 643341, "epoch": 7751} {"train_loss": -27.538227081298828, "global_step": 643342, "epoch": 7751} {"train_loss": -26.87407875061035, "global_step": 643343, "epoch": 7751} {"train_loss": -27.690488815307617, "global_step": 643344, "epoch": 7751} {"train_loss": -27.77377700805664, "global_step": 643345, "epoch": 7751} {"train_loss": -27.19879150390625, "global_step": 643346, "epoch": 7751} {"train_loss": -27.11414909362793, "global_step": 643347, "epoch": 7751} {"train_loss": -27.561208724975586, "global_step": 643348, "epoch": 7751} {"train_loss": -27.53557777404785, "global_step": 643349, "epoch": 7751} {"train_loss": -27.1560115814209, "global_step": 643350, "epoch": 7751} {"train_loss": -27.853551864624023, "global_step": 643351, "epoch": 7751} {"train_loss": -27.880762100219727, "global_step": 643352, "epoch": 7751} {"train_loss": -27.67933464050293, "global_step": 643353, "epoch": 7751} {"train_loss": -28.096418380737305, "global_step": 643354, "epoch": 7751} {"train_loss": -27.997838973999023, "global_step": 643355, "epoch": 7751} {"train_loss": -28.11211585998535, "global_step": 643356, "epoch": 7751} {"train_loss": -28.211200714111328, "global_step": 643357, "epoch": 7751} {"train_loss": -27.969406127929688, "global_step": 643358, "epoch": 7751} {"train_loss": -28.02200698852539, "global_step": 643359, "epoch": 7751} {"train_loss": -28.150787353515625, "global_step": 643360, "epoch": 7751} {"train_loss": -28.350793838500977, "global_step": 643361, "epoch": 7751} {"train_loss": -27.76340675354004, "global_step": 643362, "epoch": 7751} {"train_loss": -28.28852653503418, "global_step": 643363, "epoch": 7751} {"train_loss": -28.568151473999023, "global_step": 643364, "epoch": 7751} {"train_loss": -28.6304931640625, "global_step": 643365, "epoch": 7751} {"train_loss": -28.143476486206055, "global_step": 643366, "epoch": 7751} {"train_loss": -28.34232521057129, "global_step": 643367, "epoch": 7751} {"train_loss": -28.25442886352539, "global_step": 643368, "epoch": 7751} {"train_loss": -28.142108917236328, "global_step": 643369, "epoch": 7751} {"train_loss": -28.30388832092285, "global_step": 643370, "epoch": 7751} {"train_loss": -28.4666805267334, "global_step": 643371, "epoch": 7751} {"train_loss": -28.32721519470215, "global_step": 643372, "epoch": 7751} {"train_loss": -28.26712417602539, "global_step": 643373, "epoch": 7751} {"train_loss": -28.266996383666992, "global_step": 643374, "epoch": 7751} {"train_loss": -28.3386173248291, "global_step": 643375, "epoch": 7751} {"train_loss": -28.28017234802246, "global_step": 643376, "epoch": 7751} {"train_loss": -28.238794326782227, "global_step": 643377, "epoch": 7751} {"train_loss": -28.628515243530273, "global_step": 643378, "epoch": 7751} {"train_loss": -28.31609535217285, "global_step": 643379, "epoch": 7751} {"train_loss": -28.58614158630371, "global_step": 643380, "epoch": 7751} {"train_loss": -28.223663330078125, "global_step": 643381, "epoch": 7751} {"train_loss": -28.530059814453125, "global_step": 643382, "epoch": 7751} {"train_loss": -28.292692184448242, "global_step": 643383, "epoch": 7751} {"train_loss": -28.378620147705078, "global_step": 643384, "epoch": 7751} {"train_loss": -28.61983299255371, "global_step": 643385, "epoch": 7751} {"train_loss": -28.34327507019043, "global_step": 643386, "epoch": 7751} {"train_loss": -28.528732299804688, "global_step": 643387, "epoch": 7751} {"train_loss": -28.33814811706543, "global_step": 643388, "epoch": 7751} {"train_loss": -28.543704986572266, "global_step": 643389, "epoch": 7751} {"train_loss": -28.66375160217285, "global_step": 643390, "epoch": 7751} {"train_loss": -28.49102210998535, "global_step": 643391, "epoch": 7751} {"train_loss": -28.309844970703125, "global_step": 643392, "epoch": 7751} {"train_loss": -28.524066925048828, "global_step": 643393, "epoch": 7751} {"train_loss": -28.561908721923828, "global_step": 643394, "epoch": 7751} {"train_loss": -28.699905395507812, "global_step": 643395, "epoch": 7751} {"train_loss": -28.3000545501709, "global_step": 643396, "epoch": 7751} {"train_loss": -28.526172637939453, "global_step": 643397, "epoch": 7751} {"train_loss": -28.000202178955078, "global_step": 643398, "epoch": 7751} {"train_loss": -28.491132736206055, "global_step": 643399, "epoch": 7751} {"train_loss": -28.272705078125, "global_step": 643400, "epoch": 7751} {"train_loss": -28.193206787109375, "global_step": 643401, "epoch": 7751} {"train_loss": -28.18367576599121, "global_step": 643402, "epoch": 7751} {"train_loss": -28.328235626220703, "global_step": 643403, "epoch": 7751} {"train_loss": -28.802099227905273, "global_step": 643404, "epoch": 7751} {"train_loss": -28.4834041595459, "global_step": 643405, "epoch": 7751} {"train_loss": -28.42691993713379, "global_step": 643406, "epoch": 7751} {"train_loss": -28.226099014282227, "global_step": 643407, "epoch": 7751} {"train_loss": -28.79266357421875, "global_step": 643408, "epoch": 7751} {"train_loss": -28.222986221313477, "global_step": 643409, "epoch": 7751} {"train_loss": -28.402984619140625, "global_step": 643410, "epoch": 7751} {"train_loss": -28.07120132446289, "global_step": 643411, "epoch": 7751} {"train_loss": -28.127716064453125, "global_step": 643412, "epoch": 7751} {"train_loss": -28.401281356811523, "global_step": 643413, "epoch": 7751} {"train_loss": -28.71221351623535, "global_step": 643414, "epoch": 7751} {"train_loss": -28.09423667264272, "global_step": 643415, "epoch": 7751, "val_loss": 6657775.0} {"train_loss": -27.587604522705078, "global_step": 643416, "epoch": 7752} {"train_loss": -27.069156646728516, "global_step": 643417, "epoch": 7752} {"train_loss": -28.026824951171875, "global_step": 643418, "epoch": 7752} {"train_loss": -27.648218154907227, "global_step": 643419, "epoch": 7752} {"train_loss": -27.483495712280273, "global_step": 643420, "epoch": 7752} {"train_loss": -26.942651748657227, "global_step": 643421, "epoch": 7752} {"train_loss": -27.805389404296875, "global_step": 643422, "epoch": 7752} {"train_loss": -27.76983070373535, "global_step": 643423, "epoch": 7752} {"train_loss": -27.097742080688477, "global_step": 643424, "epoch": 7752} {"train_loss": -27.793676376342773, "global_step": 643425, "epoch": 7752} {"train_loss": -28.247419357299805, "global_step": 643426, "epoch": 7752} {"train_loss": -28.427291870117188, "global_step": 643427, "epoch": 7752} {"train_loss": -28.001388549804688, "global_step": 643428, "epoch": 7752} {"train_loss": -27.96489906311035, "global_step": 643429, "epoch": 7752} {"train_loss": -27.836688995361328, "global_step": 643430, "epoch": 7752} {"train_loss": -28.167999267578125, "global_step": 643431, "epoch": 7752} {"train_loss": -27.671497344970703, "global_step": 643432, "epoch": 7752} {"train_loss": -28.017969131469727, "global_step": 643433, "epoch": 7752} {"train_loss": -27.87580680847168, "global_step": 643434, "epoch": 7752} {"train_loss": -27.856470108032227, "global_step": 643435, "epoch": 7752} {"train_loss": -28.1289119720459, "global_step": 643436, "epoch": 7752} {"train_loss": -28.481521606445312, "global_step": 643437, "epoch": 7752} {"train_loss": -28.427082061767578, "global_step": 643438, "epoch": 7752} {"train_loss": -28.331937789916992, "global_step": 643439, "epoch": 7752} {"train_loss": -28.17262077331543, "global_step": 643440, "epoch": 7752} {"train_loss": -28.156354904174805, "global_step": 643441, "epoch": 7752} {"train_loss": -28.490676879882812, "global_step": 643442, "epoch": 7752} {"train_loss": -28.569578170776367, "global_step": 643443, "epoch": 7752} {"train_loss": -28.513294219970703, "global_step": 643444, "epoch": 7752} {"train_loss": -28.219745635986328, "global_step": 643445, "epoch": 7752} {"train_loss": -28.2537784576416, "global_step": 643446, "epoch": 7752} {"train_loss": -28.45234489440918, "global_step": 643447, "epoch": 7752} {"train_loss": -28.43690299987793, "global_step": 643448, "epoch": 7752} {"train_loss": -28.276386260986328, "global_step": 643449, "epoch": 7752} {"train_loss": -28.268369674682617, "global_step": 643450, "epoch": 7752} {"train_loss": -28.144704818725586, "global_step": 643451, "epoch": 7752} {"train_loss": -28.602436065673828, "global_step": 643452, "epoch": 7752} {"train_loss": -28.231260299682617, "global_step": 643453, "epoch": 7752} {"train_loss": -28.1702823638916, "global_step": 643454, "epoch": 7752} {"train_loss": -28.422765731811523, "global_step": 643455, "epoch": 7752} {"train_loss": -28.493627548217773, "global_step": 643456, "epoch": 7752} {"train_loss": -28.655920028686523, "global_step": 643457, "epoch": 7752} {"train_loss": -28.09437370300293, "global_step": 643458, "epoch": 7752} {"train_loss": -28.437397003173828, "global_step": 643459, "epoch": 7752} {"train_loss": -28.032453536987305, "global_step": 643460, "epoch": 7752} {"train_loss": -28.493976593017578, "global_step": 643461, "epoch": 7752} {"train_loss": -28.006855010986328, "global_step": 643462, "epoch": 7752} {"train_loss": -28.2818546295166, "global_step": 643463, "epoch": 7752} {"train_loss": -28.332849502563477, "global_step": 643464, "epoch": 7752} {"train_loss": -28.91681480407715, "global_step": 643465, "epoch": 7752} {"train_loss": -28.7736759185791, "global_step": 643466, "epoch": 7752} {"train_loss": -28.4018611907959, "global_step": 643467, "epoch": 7752} {"train_loss": -28.331104278564453, "global_step": 643468, "epoch": 7752} {"train_loss": -28.37074089050293, "global_step": 643469, "epoch": 7752} {"train_loss": -28.29517936706543, "global_step": 643470, "epoch": 7752} {"train_loss": -28.4422550201416, "global_step": 643471, "epoch": 7752} {"train_loss": -28.315866470336914, "global_step": 643472, "epoch": 7752} {"train_loss": -28.232868194580078, "global_step": 643473, "epoch": 7752} {"train_loss": -28.472631454467773, "global_step": 643474, "epoch": 7752} {"train_loss": -27.968042373657227, "global_step": 643475, "epoch": 7752} {"train_loss": -27.629199981689453, "global_step": 643476, "epoch": 7752} {"train_loss": -28.15180778503418, "global_step": 643477, "epoch": 7752} {"train_loss": -28.084814071655273, "global_step": 643478, "epoch": 7752} {"train_loss": -27.930419921875, "global_step": 643479, "epoch": 7752} {"train_loss": -28.08859634399414, "global_step": 643480, "epoch": 7752} {"train_loss": -28.02101707458496, "global_step": 643481, "epoch": 7752} {"train_loss": -27.869543075561523, "global_step": 643482, "epoch": 7752} {"train_loss": -28.320520401000977, "global_step": 643483, "epoch": 7752} {"train_loss": -28.3067626953125, "global_step": 643484, "epoch": 7752} {"train_loss": -28.279340744018555, "global_step": 643485, "epoch": 7752} {"train_loss": -28.030811309814453, "global_step": 643486, "epoch": 7752} {"train_loss": -28.084766387939453, "global_step": 643487, "epoch": 7752} {"train_loss": -28.107650756835938, "global_step": 643488, "epoch": 7752} {"train_loss": -28.435821533203125, "global_step": 643489, "epoch": 7752} {"train_loss": -28.404052734375, "global_step": 643490, "epoch": 7752} {"train_loss": -28.066574096679688, "global_step": 643491, "epoch": 7752} {"train_loss": -28.22183609008789, "global_step": 643492, "epoch": 7752} {"train_loss": -28.43226432800293, "global_step": 643493, "epoch": 7752} {"train_loss": -28.24582862854004, "global_step": 643494, "epoch": 7752} {"train_loss": -28.14946937561035, "global_step": 643495, "epoch": 7752} {"train_loss": -28.37896728515625, "global_step": 643496, "epoch": 7752} {"train_loss": -28.6717529296875, "global_step": 643497, "epoch": 7752} {"train_loss": -28.160420084574138, "global_step": 643498, "epoch": 7752, "val_loss": 6647177.5} {"train_loss": -27.7464656829834, "global_step": 643499, "epoch": 7753} {"train_loss": -28.146909713745117, "global_step": 643500, "epoch": 7753} {"train_loss": -27.1278076171875, "global_step": 643501, "epoch": 7753} {"train_loss": -27.558813095092773, "global_step": 643502, "epoch": 7753} {"train_loss": -27.055683135986328, "global_step": 643503, "epoch": 7753} {"train_loss": -28.107166290283203, "global_step": 643504, "epoch": 7753} {"train_loss": -27.361242294311523, "global_step": 643505, "epoch": 7753} {"train_loss": -27.367801666259766, "global_step": 643506, "epoch": 7753} {"train_loss": -27.25198745727539, "global_step": 643507, "epoch": 7753} {"train_loss": -27.4626522064209, "global_step": 643508, "epoch": 7753} {"train_loss": -27.495136260986328, "global_step": 643509, "epoch": 7753} {"train_loss": -27.083698272705078, "global_step": 643510, "epoch": 7753} {"train_loss": -28.035064697265625, "global_step": 643511, "epoch": 7753} {"train_loss": -27.53466796875, "global_step": 643512, "epoch": 7753} {"train_loss": -27.81207275390625, "global_step": 643513, "epoch": 7753} {"train_loss": -28.023670196533203, "global_step": 643514, "epoch": 7753} {"train_loss": -27.551944732666016, "global_step": 643515, "epoch": 7753} {"train_loss": -28.119237899780273, "global_step": 643516, "epoch": 7753} {"train_loss": -27.537799835205078, "global_step": 643517, "epoch": 7753} {"train_loss": -27.657623291015625, "global_step": 643518, "epoch": 7753} {"train_loss": -28.161518096923828, "global_step": 643519, "epoch": 7753} {"train_loss": -27.679950714111328, "global_step": 643520, "epoch": 7753} {"train_loss": -27.82421875, "global_step": 643521, "epoch": 7753} {"train_loss": -28.124526977539062, "global_step": 643522, "epoch": 7753} {"train_loss": -28.209638595581055, "global_step": 643523, "epoch": 7753} {"train_loss": -28.15387535095215, "global_step": 643524, "epoch": 7753} {"train_loss": -27.87556266784668, "global_step": 643525, "epoch": 7753} {"train_loss": -27.763986587524414, "global_step": 643526, "epoch": 7753} {"train_loss": -27.835037231445312, "global_step": 643527, "epoch": 7753} {"train_loss": -27.795028686523438, "global_step": 643528, "epoch": 7753} {"train_loss": -27.85498046875, "global_step": 643529, "epoch": 7753} {"train_loss": -28.246702194213867, "global_step": 643530, "epoch": 7753} {"train_loss": -28.047286987304688, "global_step": 643531, "epoch": 7753} {"train_loss": -28.216266632080078, "global_step": 643532, "epoch": 7753} {"train_loss": -28.23044204711914, "global_step": 643533, "epoch": 7753} {"train_loss": -28.320581436157227, "global_step": 643534, "epoch": 7753} {"train_loss": -28.333484649658203, "global_step": 643535, "epoch": 7753} {"train_loss": -28.371341705322266, "global_step": 643536, "epoch": 7753} {"train_loss": -28.38239097595215, "global_step": 643537, "epoch": 7753} {"train_loss": -28.44065284729004, "global_step": 643538, "epoch": 7753} {"train_loss": -28.318740844726562, "global_step": 643539, "epoch": 7753} {"train_loss": -28.2907772064209, "global_step": 643540, "epoch": 7753} {"train_loss": -28.53399658203125, "global_step": 643541, "epoch": 7753} {"train_loss": -28.51576042175293, "global_step": 643542, "epoch": 7753} {"train_loss": -28.519458770751953, "global_step": 643543, "epoch": 7753} {"train_loss": -28.18292236328125, "global_step": 643544, "epoch": 7753} {"train_loss": -28.240833282470703, "global_step": 643545, "epoch": 7753} {"train_loss": -28.707548141479492, "global_step": 643546, "epoch": 7753} {"train_loss": -28.668161392211914, "global_step": 643547, "epoch": 7753} {"train_loss": -28.286832809448242, "global_step": 643548, "epoch": 7753} {"train_loss": -28.68402671813965, "global_step": 643549, "epoch": 7753} {"train_loss": -28.657928466796875, "global_step": 643550, "epoch": 7753} {"train_loss": -28.433868408203125, "global_step": 643551, "epoch": 7753} {"train_loss": -28.625967025756836, "global_step": 643552, "epoch": 7753} {"train_loss": -28.390838623046875, "global_step": 643553, "epoch": 7753} {"train_loss": -28.42770767211914, "global_step": 643554, "epoch": 7753} {"train_loss": -28.332752227783203, "global_step": 643555, "epoch": 7753} {"train_loss": -28.225543975830078, "global_step": 643556, "epoch": 7753} {"train_loss": -28.01763343811035, "global_step": 643557, "epoch": 7753} {"train_loss": -27.23651695251465, "global_step": 643558, "epoch": 7753} {"train_loss": -26.198593139648438, "global_step": 643559, "epoch": 7753} {"train_loss": -26.43062400817871, "global_step": 643560, "epoch": 7753} {"train_loss": -28.297122955322266, "global_step": 643561, "epoch": 7753} {"train_loss": -27.445348739624023, "global_step": 643562, "epoch": 7753} {"train_loss": -27.580739974975586, "global_step": 643563, "epoch": 7753} {"train_loss": -27.790882110595703, "global_step": 643564, "epoch": 7753} {"train_loss": -28.2283878326416, "global_step": 643565, "epoch": 7753} {"train_loss": -28.33359146118164, "global_step": 643566, "epoch": 7753} {"train_loss": -28.046436309814453, "global_step": 643567, "epoch": 7753} {"train_loss": -27.97248649597168, "global_step": 643568, "epoch": 7753} {"train_loss": -27.974008560180664, "global_step": 643569, "epoch": 7753} {"train_loss": -28.033206939697266, "global_step": 643570, "epoch": 7753} {"train_loss": -28.078323364257812, "global_step": 643571, "epoch": 7753} {"train_loss": -27.95075035095215, "global_step": 643572, "epoch": 7753} {"train_loss": -26.775793075561523, "global_step": 643573, "epoch": 7753} {"train_loss": -26.085697174072266, "global_step": 643574, "epoch": 7753} {"train_loss": -26.625341415405273, "global_step": 643575, "epoch": 7753} {"train_loss": -27.300155639648438, "global_step": 643576, "epoch": 7753} {"train_loss": -27.53260612487793, "global_step": 643577, "epoch": 7753} {"train_loss": -27.838275909423828, "global_step": 643578, "epoch": 7753} {"train_loss": -26.834375381469727, "global_step": 643579, "epoch": 7753} {"train_loss": -27.207019805908203, "global_step": 643580, "epoch": 7753} {"train_loss": -27.870570493031696, "global_step": 643581, "epoch": 7753, "val_loss": 6684723.0} {"train_loss": -26.855329513549805, "global_step": 643582, "epoch": 7754} {"train_loss": -25.240320205688477, "global_step": 643583, "epoch": 7754} {"train_loss": -25.258268356323242, "global_step": 643584, "epoch": 7754} {"train_loss": -26.53986167907715, "global_step": 643585, "epoch": 7754} {"train_loss": -25.87164306640625, "global_step": 643586, "epoch": 7754} {"train_loss": -26.24692726135254, "global_step": 643587, "epoch": 7754} {"train_loss": -26.340103149414062, "global_step": 643588, "epoch": 7754} {"train_loss": -26.339574813842773, "global_step": 643589, "epoch": 7754} {"train_loss": -26.90643310546875, "global_step": 643590, "epoch": 7754} {"train_loss": -26.371488571166992, "global_step": 643591, "epoch": 7754} {"train_loss": -26.915937423706055, "global_step": 643592, "epoch": 7754} {"train_loss": -26.833118438720703, "global_step": 643593, "epoch": 7754} {"train_loss": -26.81955909729004, "global_step": 643594, "epoch": 7754} {"train_loss": -27.165552139282227, "global_step": 643595, "epoch": 7754} {"train_loss": -27.208539962768555, "global_step": 643596, "epoch": 7754} {"train_loss": -27.001312255859375, "global_step": 643597, "epoch": 7754} {"train_loss": -26.822080612182617, "global_step": 643598, "epoch": 7754} {"train_loss": -27.29054832458496, "global_step": 643599, "epoch": 7754} {"train_loss": -27.28089714050293, "global_step": 643600, "epoch": 7754} {"train_loss": -27.38785743713379, "global_step": 643601, "epoch": 7754} {"train_loss": -27.6536922454834, "global_step": 643602, "epoch": 7754} {"train_loss": -27.201215744018555, "global_step": 643603, "epoch": 7754} {"train_loss": -27.167821884155273, "global_step": 643604, "epoch": 7754} {"train_loss": -27.972204208374023, "global_step": 643605, "epoch": 7754} {"train_loss": -27.634077072143555, "global_step": 643606, "epoch": 7754} {"train_loss": -27.637683868408203, "global_step": 643607, "epoch": 7754} {"train_loss": -28.170785903930664, "global_step": 643608, "epoch": 7754} {"train_loss": -27.32917594909668, "global_step": 643609, "epoch": 7754} {"train_loss": -27.739551544189453, "global_step": 643610, "epoch": 7754} {"train_loss": -27.397205352783203, "global_step": 643611, "epoch": 7754} {"train_loss": -27.6591739654541, "global_step": 643612, "epoch": 7754} {"train_loss": -27.77119255065918, "global_step": 643613, "epoch": 7754} {"train_loss": -27.590116500854492, "global_step": 643614, "epoch": 7754} {"train_loss": -27.9583683013916, "global_step": 643615, "epoch": 7754} {"train_loss": -27.989145278930664, "global_step": 643616, "epoch": 7754} {"train_loss": -28.15448570251465, "global_step": 643617, "epoch": 7754} {"train_loss": -28.070127487182617, "global_step": 643618, "epoch": 7754} {"train_loss": -27.91477394104004, "global_step": 643619, "epoch": 7754} {"train_loss": -28.402734756469727, "global_step": 643620, "epoch": 7754} {"train_loss": -28.045612335205078, "global_step": 643621, "epoch": 7754} {"train_loss": -28.038192749023438, "global_step": 643622, "epoch": 7754} {"train_loss": -28.275903701782227, "global_step": 643623, "epoch": 7754} {"train_loss": -28.204938888549805, "global_step": 643624, "epoch": 7754} {"train_loss": -27.934289932250977, "global_step": 643625, "epoch": 7754} {"train_loss": -28.1066951751709, "global_step": 643626, "epoch": 7754} {"train_loss": -28.471235275268555, "global_step": 643627, "epoch": 7754} {"train_loss": -28.425634384155273, "global_step": 643628, "epoch": 7754} {"train_loss": -28.47674560546875, "global_step": 643629, "epoch": 7754} {"train_loss": -28.64335060119629, "global_step": 643630, "epoch": 7754} {"train_loss": -28.029987335205078, "global_step": 643631, "epoch": 7754} {"train_loss": -27.80525016784668, "global_step": 643632, "epoch": 7754} {"train_loss": -28.273212432861328, "global_step": 643633, "epoch": 7754} {"train_loss": -28.48206901550293, "global_step": 643634, "epoch": 7754} {"train_loss": -28.429819107055664, "global_step": 643635, "epoch": 7754} {"train_loss": -28.73388671875, "global_step": 643636, "epoch": 7754} {"train_loss": -28.66263198852539, "global_step": 643637, "epoch": 7754} {"train_loss": -28.31147575378418, "global_step": 643638, "epoch": 7754} {"train_loss": -29.056522369384766, "global_step": 643639, "epoch": 7754} {"train_loss": -28.447568893432617, "global_step": 643640, "epoch": 7754} {"train_loss": -28.486902236938477, "global_step": 643641, "epoch": 7754} {"train_loss": -28.380008697509766, "global_step": 643642, "epoch": 7754} {"train_loss": -27.97897720336914, "global_step": 643643, "epoch": 7754} {"train_loss": -28.639881134033203, "global_step": 643644, "epoch": 7754} {"train_loss": -28.391357421875, "global_step": 643645, "epoch": 7754} {"train_loss": -28.18603515625, "global_step": 643646, "epoch": 7754} {"train_loss": -28.529529571533203, "global_step": 643647, "epoch": 7754} {"train_loss": -28.43568229675293, "global_step": 643648, "epoch": 7754} {"train_loss": -28.698556900024414, "global_step": 643649, "epoch": 7754} {"train_loss": -28.27315330505371, "global_step": 643650, "epoch": 7754} {"train_loss": -27.83223533630371, "global_step": 643651, "epoch": 7754} {"train_loss": -27.602039337158203, "global_step": 643652, "epoch": 7754} {"train_loss": -27.305465698242188, "global_step": 643653, "epoch": 7754} {"train_loss": -26.866193771362305, "global_step": 643654, "epoch": 7754} {"train_loss": -27.235883712768555, "global_step": 643655, "epoch": 7754} {"train_loss": -27.388437271118164, "global_step": 643656, "epoch": 7754} {"train_loss": -27.205774307250977, "global_step": 643657, "epoch": 7754} {"train_loss": -28.243139266967773, "global_step": 643658, "epoch": 7754} {"train_loss": -27.80938720703125, "global_step": 643659, "epoch": 7754} {"train_loss": -27.960479736328125, "global_step": 643660, "epoch": 7754} {"train_loss": -27.711078643798828, "global_step": 643661, "epoch": 7754} {"train_loss": -27.8182315826416, "global_step": 643662, "epoch": 7754} {"train_loss": -27.720794677734375, "global_step": 643663, "epoch": 7754} {"train_loss": -27.667029461228704, "global_step": 643664, "epoch": 7754, "val_loss": 6686222.0} {"train_loss": -26.869382858276367, "global_step": 643665, "epoch": 7755} {"train_loss": -26.591108322143555, "global_step": 643666, "epoch": 7755} {"train_loss": -27.155893325805664, "global_step": 643667, "epoch": 7755} {"train_loss": -26.79402732849121, "global_step": 643668, "epoch": 7755} {"train_loss": -27.649158477783203, "global_step": 643669, "epoch": 7755} {"train_loss": -26.887348175048828, "global_step": 643670, "epoch": 7755} {"train_loss": -27.186960220336914, "global_step": 643671, "epoch": 7755} {"train_loss": -26.90216636657715, "global_step": 643672, "epoch": 7755} {"train_loss": -27.36564064025879, "global_step": 643673, "epoch": 7755} {"train_loss": -27.665481567382812, "global_step": 643674, "epoch": 7755} {"train_loss": -27.507169723510742, "global_step": 643675, "epoch": 7755} {"train_loss": -27.190820693969727, "global_step": 643676, "epoch": 7755} {"train_loss": -27.592884063720703, "global_step": 643677, "epoch": 7755} {"train_loss": -27.538318634033203, "global_step": 643678, "epoch": 7755} {"train_loss": -27.570159912109375, "global_step": 643679, "epoch": 7755} {"train_loss": -28.000635147094727, "global_step": 643680, "epoch": 7755} {"train_loss": -27.714313507080078, "global_step": 643681, "epoch": 7755} {"train_loss": -27.52583885192871, "global_step": 643682, "epoch": 7755} {"train_loss": -27.710739135742188, "global_step": 643683, "epoch": 7755} {"train_loss": -27.911279678344727, "global_step": 643684, "epoch": 7755} {"train_loss": -27.572568893432617, "global_step": 643685, "epoch": 7755} {"train_loss": -27.577835083007812, "global_step": 643686, "epoch": 7755} {"train_loss": -27.82480239868164, "global_step": 643687, "epoch": 7755} {"train_loss": -27.617889404296875, "global_step": 643688, "epoch": 7755} {"train_loss": -28.062040328979492, "global_step": 643689, "epoch": 7755} {"train_loss": -27.85688591003418, "global_step": 643690, "epoch": 7755} {"train_loss": -27.681501388549805, "global_step": 643691, "epoch": 7755} {"train_loss": -27.939245223999023, "global_step": 643692, "epoch": 7755} {"train_loss": -27.954730987548828, "global_step": 643693, "epoch": 7755} {"train_loss": -28.0079345703125, "global_step": 643694, "epoch": 7755} {"train_loss": -27.826574325561523, "global_step": 643695, "epoch": 7755} {"train_loss": -28.162683486938477, "global_step": 643696, "epoch": 7755} {"train_loss": -28.378467559814453, "global_step": 643697, "epoch": 7755} {"train_loss": -28.305896759033203, "global_step": 643698, "epoch": 7755} {"train_loss": -28.56538200378418, "global_step": 643699, "epoch": 7755} {"train_loss": -28.225906372070312, "global_step": 643700, "epoch": 7755} {"train_loss": -27.860193252563477, "global_step": 643701, "epoch": 7755} {"train_loss": -28.2174129486084, "global_step": 643702, "epoch": 7755} {"train_loss": -28.0001163482666, "global_step": 643703, "epoch": 7755} {"train_loss": -27.958454132080078, "global_step": 643704, "epoch": 7755} {"train_loss": -28.226667404174805, "global_step": 643705, "epoch": 7755} {"train_loss": -28.223865509033203, "global_step": 643706, "epoch": 7755} {"train_loss": -27.960416793823242, "global_step": 643707, "epoch": 7755} {"train_loss": -28.257986068725586, "global_step": 643708, "epoch": 7755} {"train_loss": -28.759140014648438, "global_step": 643709, "epoch": 7755} {"train_loss": -27.982349395751953, "global_step": 643710, "epoch": 7755} {"train_loss": -28.275299072265625, "global_step": 643711, "epoch": 7755} {"train_loss": -28.02937889099121, "global_step": 643712, "epoch": 7755} {"train_loss": -28.153589248657227, "global_step": 643713, "epoch": 7755} {"train_loss": -28.74127197265625, "global_step": 643714, "epoch": 7755} {"train_loss": -28.401166915893555, "global_step": 643715, "epoch": 7755} {"train_loss": -28.60394287109375, "global_step": 643716, "epoch": 7755} {"train_loss": -28.200414657592773, "global_step": 643717, "epoch": 7755} {"train_loss": -28.308195114135742, "global_step": 643718, "epoch": 7755} {"train_loss": -28.4591064453125, "global_step": 643719, "epoch": 7755} {"train_loss": -28.503076553344727, "global_step": 643720, "epoch": 7755} {"train_loss": -28.30560874938965, "global_step": 643721, "epoch": 7755} {"train_loss": -28.0501651763916, "global_step": 643722, "epoch": 7755} {"train_loss": -28.49310302734375, "global_step": 643723, "epoch": 7755} {"train_loss": -28.392728805541992, "global_step": 643724, "epoch": 7755} {"train_loss": -28.534412384033203, "global_step": 643725, "epoch": 7755} {"train_loss": -28.543664932250977, "global_step": 643726, "epoch": 7755} {"train_loss": -28.207178115844727, "global_step": 643727, "epoch": 7755} {"train_loss": -28.3205623626709, "global_step": 643728, "epoch": 7755} {"train_loss": -28.5311336517334, "global_step": 643729, "epoch": 7755} {"train_loss": -28.18743896484375, "global_step": 643730, "epoch": 7755} {"train_loss": -28.361677169799805, "global_step": 643731, "epoch": 7755} {"train_loss": -28.29922866821289, "global_step": 643732, "epoch": 7755} {"train_loss": -28.528615951538086, "global_step": 643733, "epoch": 7755} {"train_loss": -28.456069946289062, "global_step": 643734, "epoch": 7755} {"train_loss": -28.0613956451416, "global_step": 643735, "epoch": 7755} {"train_loss": -28.435537338256836, "global_step": 643736, "epoch": 7755} {"train_loss": -28.51252555847168, "global_step": 643737, "epoch": 7755} {"train_loss": -28.605274200439453, "global_step": 643738, "epoch": 7755} {"train_loss": -28.153417587280273, "global_step": 643739, "epoch": 7755} {"train_loss": -28.609357833862305, "global_step": 643740, "epoch": 7755} {"train_loss": -28.473785400390625, "global_step": 643741, "epoch": 7755} {"train_loss": -27.614547729492188, "global_step": 643742, "epoch": 7755} {"train_loss": -28.053741455078125, "global_step": 643743, "epoch": 7755} {"train_loss": -28.108545303344727, "global_step": 643744, "epoch": 7755} {"train_loss": -28.7719669342041, "global_step": 643745, "epoch": 7755} {"train_loss": -27.848173141479492, "global_step": 643746, "epoch": 7755} {"train_loss": -28.000617544335054, "global_step": 643747, "epoch": 7755, "val_loss": 6686592.0} {"train_loss": -27.061466217041016, "global_step": 643748, "epoch": 7756} {"train_loss": -26.92764663696289, "global_step": 643749, "epoch": 7756} {"train_loss": -27.351282119750977, "global_step": 643750, "epoch": 7756} {"train_loss": -27.086929321289062, "global_step": 643751, "epoch": 7756} {"train_loss": -27.493139266967773, "global_step": 643752, "epoch": 7756} {"train_loss": -26.233448028564453, "global_step": 643753, "epoch": 7756} {"train_loss": -27.64588737487793, "global_step": 643754, "epoch": 7756} {"train_loss": -27.39887046813965, "global_step": 643755, "epoch": 7756} {"train_loss": -27.41792106628418, "global_step": 643756, "epoch": 7756} {"train_loss": -27.357446670532227, "global_step": 643757, "epoch": 7756} {"train_loss": -27.814184188842773, "global_step": 643758, "epoch": 7756} {"train_loss": -27.329071044921875, "global_step": 643759, "epoch": 7756} {"train_loss": -27.491071701049805, "global_step": 643760, "epoch": 7756} {"train_loss": -27.763507843017578, "global_step": 643761, "epoch": 7756} {"train_loss": -27.573110580444336, "global_step": 643762, "epoch": 7756} {"train_loss": -27.896377563476562, "global_step": 643763, "epoch": 7756} {"train_loss": -27.44832420349121, "global_step": 643764, "epoch": 7756} {"train_loss": -27.938215255737305, "global_step": 643765, "epoch": 7756} {"train_loss": -27.837371826171875, "global_step": 643766, "epoch": 7756} {"train_loss": -27.837635040283203, "global_step": 643767, "epoch": 7756} {"train_loss": -28.048974990844727, "global_step": 643768, "epoch": 7756} {"train_loss": -28.008275985717773, "global_step": 643769, "epoch": 7756} {"train_loss": -27.77045249938965, "global_step": 643770, "epoch": 7756} {"train_loss": -27.919754028320312, "global_step": 643771, "epoch": 7756} {"train_loss": -28.099349975585938, "global_step": 643772, "epoch": 7756} {"train_loss": -27.79270362854004, "global_step": 643773, "epoch": 7756} {"train_loss": -28.04522705078125, "global_step": 643774, "epoch": 7756} {"train_loss": -28.104074478149414, "global_step": 643775, "epoch": 7756} {"train_loss": -27.896448135375977, "global_step": 643776, "epoch": 7756} {"train_loss": -28.193195343017578, "global_step": 643777, "epoch": 7756} {"train_loss": -28.366901397705078, "global_step": 643778, "epoch": 7756} {"train_loss": -28.168027877807617, "global_step": 643779, "epoch": 7756} {"train_loss": -28.10272216796875, "global_step": 643780, "epoch": 7756} {"train_loss": -28.369306564331055, "global_step": 643781, "epoch": 7756} {"train_loss": -28.14023208618164, "global_step": 643782, "epoch": 7756} {"train_loss": -28.293777465820312, "global_step": 643783, "epoch": 7756} {"train_loss": -28.084924697875977, "global_step": 643784, "epoch": 7756} {"train_loss": -27.78424072265625, "global_step": 643785, "epoch": 7756} {"train_loss": -28.216699600219727, "global_step": 643786, "epoch": 7756} {"train_loss": -28.189245223999023, "global_step": 643787, "epoch": 7756} {"train_loss": -27.91267204284668, "global_step": 643788, "epoch": 7756} {"train_loss": -27.898221969604492, "global_step": 643789, "epoch": 7756} {"train_loss": -28.262714385986328, "global_step": 643790, "epoch": 7756} {"train_loss": -28.09092140197754, "global_step": 643791, "epoch": 7756} {"train_loss": -28.246906280517578, "global_step": 643792, "epoch": 7756} {"train_loss": -28.191991806030273, "global_step": 643793, "epoch": 7756} {"train_loss": -28.225879669189453, "global_step": 643794, "epoch": 7756} {"train_loss": -28.12310218811035, "global_step": 643795, "epoch": 7756} {"train_loss": -28.670759201049805, "global_step": 643796, "epoch": 7756} {"train_loss": -28.440534591674805, "global_step": 643797, "epoch": 7756} {"train_loss": -27.890390396118164, "global_step": 643798, "epoch": 7756} {"train_loss": -28.82339859008789, "global_step": 643799, "epoch": 7756} {"train_loss": -28.467859268188477, "global_step": 643800, "epoch": 7756} {"train_loss": -28.143850326538086, "global_step": 643801, "epoch": 7756} {"train_loss": -28.076745986938477, "global_step": 643802, "epoch": 7756} {"train_loss": -28.122526168823242, "global_step": 643803, "epoch": 7756} {"train_loss": -28.00147819519043, "global_step": 643804, "epoch": 7756} {"train_loss": -28.60381507873535, "global_step": 643805, "epoch": 7756} {"train_loss": -28.381179809570312, "global_step": 643806, "epoch": 7756} {"train_loss": -28.57427406311035, "global_step": 643807, "epoch": 7756} {"train_loss": -27.83011245727539, "global_step": 643808, "epoch": 7756} {"train_loss": -28.166351318359375, "global_step": 643809, "epoch": 7756} {"train_loss": -28.26727867126465, "global_step": 643810, "epoch": 7756} {"train_loss": -28.2396183013916, "global_step": 643811, "epoch": 7756} {"train_loss": -28.451074600219727, "global_step": 643812, "epoch": 7756} {"train_loss": -28.63312339782715, "global_step": 643813, "epoch": 7756} {"train_loss": -28.076053619384766, "global_step": 643814, "epoch": 7756} {"train_loss": -28.494007110595703, "global_step": 643815, "epoch": 7756} {"train_loss": -28.1447811126709, "global_step": 643816, "epoch": 7756} {"train_loss": -28.449377059936523, "global_step": 643817, "epoch": 7756} {"train_loss": -28.52119255065918, "global_step": 643818, "epoch": 7756} {"train_loss": -28.2290096282959, "global_step": 643819, "epoch": 7756} {"train_loss": -28.54554557800293, "global_step": 643820, "epoch": 7756} {"train_loss": -28.55401611328125, "global_step": 643821, "epoch": 7756} {"train_loss": -28.45947265625, "global_step": 643822, "epoch": 7756} {"train_loss": -28.1411075592041, "global_step": 643823, "epoch": 7756} {"train_loss": -28.639297485351562, "global_step": 643824, "epoch": 7756} {"train_loss": -28.56184196472168, "global_step": 643825, "epoch": 7756} {"train_loss": -28.469751358032227, "global_step": 643826, "epoch": 7756} {"train_loss": -28.687885284423828, "global_step": 643827, "epoch": 7756} {"train_loss": -28.269989013671875, "global_step": 643828, "epoch": 7756} {"train_loss": -28.742170333862305, "global_step": 643829, "epoch": 7756} {"train_loss": -28.052554073103938, "global_step": 643830, "epoch": 7756, "val_loss": 6656694.0} {"train_loss": -27.747480392456055, "global_step": 643831, "epoch": 7757} {"train_loss": -26.897998809814453, "global_step": 643832, "epoch": 7757} {"train_loss": -24.845699310302734, "global_step": 643833, "epoch": 7757} {"train_loss": -23.744699478149414, "global_step": 643834, "epoch": 7757} {"train_loss": -27.110870361328125, "global_step": 643835, "epoch": 7757} {"train_loss": -26.307870864868164, "global_step": 643836, "epoch": 7757} {"train_loss": -26.32843589782715, "global_step": 643837, "epoch": 7757} {"train_loss": -26.34174919128418, "global_step": 643838, "epoch": 7757} {"train_loss": -27.14801597595215, "global_step": 643839, "epoch": 7757} {"train_loss": -25.427804946899414, "global_step": 643840, "epoch": 7757} {"train_loss": -27.494831085205078, "global_step": 643841, "epoch": 7757} {"train_loss": -27.00172996520996, "global_step": 643842, "epoch": 7757} {"train_loss": -26.9491024017334, "global_step": 643843, "epoch": 7757} {"train_loss": -27.199234008789062, "global_step": 643844, "epoch": 7757} {"train_loss": -27.415878295898438, "global_step": 643845, "epoch": 7757} {"train_loss": -27.263153076171875, "global_step": 643846, "epoch": 7757} {"train_loss": -27.120697021484375, "global_step": 643847, "epoch": 7757} {"train_loss": -27.7177734375, "global_step": 643848, "epoch": 7757} {"train_loss": -27.747968673706055, "global_step": 643849, "epoch": 7757} {"train_loss": -27.268091201782227, "global_step": 643850, "epoch": 7757} {"train_loss": -27.141239166259766, "global_step": 643851, "epoch": 7757} {"train_loss": -27.467615127563477, "global_step": 643852, "epoch": 7757} {"train_loss": -27.650558471679688, "global_step": 643853, "epoch": 7757} {"train_loss": -27.596271514892578, "global_step": 643854, "epoch": 7757} {"train_loss": -27.726526260375977, "global_step": 643855, "epoch": 7757} {"train_loss": -27.53729820251465, "global_step": 643856, "epoch": 7757} {"train_loss": -27.764341354370117, "global_step": 643857, "epoch": 7757} {"train_loss": -27.337005615234375, "global_step": 643858, "epoch": 7757} {"train_loss": -27.64142417907715, "global_step": 643859, "epoch": 7757} {"train_loss": -27.705097198486328, "global_step": 643860, "epoch": 7757} {"train_loss": -27.899967193603516, "global_step": 643861, "epoch": 7757} {"train_loss": -27.775121688842773, "global_step": 643862, "epoch": 7757} {"train_loss": -28.033979415893555, "global_step": 643863, "epoch": 7757} {"train_loss": -27.8974609375, "global_step": 643864, "epoch": 7757} {"train_loss": -27.978748321533203, "global_step": 643865, "epoch": 7757} {"train_loss": -27.748571395874023, "global_step": 643866, "epoch": 7757} {"train_loss": -27.90180015563965, "global_step": 643867, "epoch": 7757} {"train_loss": -27.557483673095703, "global_step": 643868, "epoch": 7757} {"train_loss": -27.960926055908203, "global_step": 643869, "epoch": 7757} {"train_loss": -27.92844581604004, "global_step": 643870, "epoch": 7757} {"train_loss": -28.0956974029541, "global_step": 643871, "epoch": 7757} {"train_loss": -28.25733757019043, "global_step": 643872, "epoch": 7757} {"train_loss": -28.047285079956055, "global_step": 643873, "epoch": 7757} {"train_loss": -27.91501235961914, "global_step": 643874, "epoch": 7757} {"train_loss": -27.879552841186523, "global_step": 643875, "epoch": 7757} {"train_loss": -28.06293296813965, "global_step": 643876, "epoch": 7757} {"train_loss": -28.06489372253418, "global_step": 643877, "epoch": 7757} {"train_loss": -27.659910202026367, "global_step": 643878, "epoch": 7757} {"train_loss": -28.15760612487793, "global_step": 643879, "epoch": 7757} {"train_loss": -27.843170166015625, "global_step": 643880, "epoch": 7757} {"train_loss": -28.555255889892578, "global_step": 643881, "epoch": 7757} {"train_loss": -28.062475204467773, "global_step": 643882, "epoch": 7757} {"train_loss": -27.9240779876709, "global_step": 643883, "epoch": 7757} {"train_loss": -28.274951934814453, "global_step": 643884, "epoch": 7757} {"train_loss": -27.943418502807617, "global_step": 643885, "epoch": 7757} {"train_loss": -28.22077751159668, "global_step": 643886, "epoch": 7757} {"train_loss": -28.023725509643555, "global_step": 643887, "epoch": 7757} {"train_loss": -28.2106876373291, "global_step": 643888, "epoch": 7757} {"train_loss": -27.98482322692871, "global_step": 643889, "epoch": 7757} {"train_loss": -28.24485206604004, "global_step": 643890, "epoch": 7757} {"train_loss": -28.13372230529785, "global_step": 643891, "epoch": 7757} {"train_loss": -28.684188842773438, "global_step": 643892, "epoch": 7757} {"train_loss": -28.118764877319336, "global_step": 643893, "epoch": 7757} {"train_loss": -28.381454467773438, "global_step": 643894, "epoch": 7757} {"train_loss": -28.646085739135742, "global_step": 643895, "epoch": 7757} {"train_loss": -28.1709041595459, "global_step": 643896, "epoch": 7757} {"train_loss": -28.0415096282959, "global_step": 643897, "epoch": 7757} {"train_loss": -28.1951904296875, "global_step": 643898, "epoch": 7757} {"train_loss": -28.43536949157715, "global_step": 643899, "epoch": 7757} {"train_loss": -28.52778434753418, "global_step": 643900, "epoch": 7757} {"train_loss": -28.1815185546875, "global_step": 643901, "epoch": 7757} {"train_loss": -28.445947647094727, "global_step": 643902, "epoch": 7757} {"train_loss": -27.920917510986328, "global_step": 643903, "epoch": 7757} {"train_loss": -28.0611515045166, "global_step": 643904, "epoch": 7757} {"train_loss": -28.398517608642578, "global_step": 643905, "epoch": 7757} {"train_loss": -27.888822555541992, "global_step": 643906, "epoch": 7757} {"train_loss": -28.201141357421875, "global_step": 643907, "epoch": 7757} {"train_loss": -28.154071807861328, "global_step": 643908, "epoch": 7757} {"train_loss": -27.921899795532227, "global_step": 643909, "epoch": 7757} {"train_loss": -28.305883407592773, "global_step": 643910, "epoch": 7757} {"train_loss": -28.128873825073242, "global_step": 643911, "epoch": 7757} {"train_loss": -28.3387451171875, "global_step": 643912, "epoch": 7757} {"train_loss": -27.72488486048687, "global_step": 643913, "epoch": 7757, "val_loss": 6679895.5} {"train_loss": -27.574630737304688, "global_step": 643914, "epoch": 7758} {"train_loss": -27.947965621948242, "global_step": 643915, "epoch": 7758} {"train_loss": -28.016504287719727, "global_step": 643916, "epoch": 7758} {"train_loss": -27.879735946655273, "global_step": 643917, "epoch": 7758} {"train_loss": -27.521936416625977, "global_step": 643918, "epoch": 7758} {"train_loss": -27.161182403564453, "global_step": 643919, "epoch": 7758} {"train_loss": -27.293701171875, "global_step": 643920, "epoch": 7758} {"train_loss": -27.887170791625977, "global_step": 643921, "epoch": 7758} {"train_loss": -27.38518714904785, "global_step": 643922, "epoch": 7758} {"train_loss": -27.945032119750977, "global_step": 643923, "epoch": 7758} {"train_loss": -28.11703872680664, "global_step": 643924, "epoch": 7758} {"train_loss": -27.756818771362305, "global_step": 643925, "epoch": 7758} {"train_loss": -27.918781280517578, "global_step": 643926, "epoch": 7758} {"train_loss": -28.208301544189453, "global_step": 643927, "epoch": 7758} {"train_loss": -27.83721351623535, "global_step": 643928, "epoch": 7758} {"train_loss": -27.99249267578125, "global_step": 643929, "epoch": 7758} {"train_loss": -28.185895919799805, "global_step": 643930, "epoch": 7758} {"train_loss": -28.369897842407227, "global_step": 643931, "epoch": 7758} {"train_loss": -28.134063720703125, "global_step": 643932, "epoch": 7758} {"train_loss": -28.47904396057129, "global_step": 643933, "epoch": 7758} {"train_loss": -28.19440269470215, "global_step": 643934, "epoch": 7758} {"train_loss": -28.264535903930664, "global_step": 643935, "epoch": 7758} {"train_loss": -28.30146598815918, "global_step": 643936, "epoch": 7758} {"train_loss": -28.341211318969727, "global_step": 643937, "epoch": 7758} {"train_loss": -28.416702270507812, "global_step": 643938, "epoch": 7758} {"train_loss": -28.363534927368164, "global_step": 643939, "epoch": 7758} {"train_loss": -28.275197982788086, "global_step": 643940, "epoch": 7758} {"train_loss": -28.144256591796875, "global_step": 643941, "epoch": 7758} {"train_loss": -28.3178768157959, "global_step": 643942, "epoch": 7758} {"train_loss": -28.544958114624023, "global_step": 643943, "epoch": 7758} {"train_loss": -28.537317276000977, "global_step": 643944, "epoch": 7758} {"train_loss": -28.1864070892334, "global_step": 643945, "epoch": 7758} {"train_loss": -28.476123809814453, "global_step": 643946, "epoch": 7758} {"train_loss": -28.5874080657959, "global_step": 643947, "epoch": 7758} {"train_loss": -28.650348663330078, "global_step": 643948, "epoch": 7758} {"train_loss": -28.474109649658203, "global_step": 643949, "epoch": 7758} {"train_loss": -28.899642944335938, "global_step": 643950, "epoch": 7758} {"train_loss": -28.279020309448242, "global_step": 643951, "epoch": 7758} {"train_loss": -28.3536434173584, "global_step": 643952, "epoch": 7758} {"train_loss": -28.335294723510742, "global_step": 643953, "epoch": 7758} {"train_loss": -27.993453979492188, "global_step": 643954, "epoch": 7758} {"train_loss": -28.32069969177246, "global_step": 643955, "epoch": 7758} {"train_loss": -28.355823516845703, "global_step": 643956, "epoch": 7758} {"train_loss": -28.390579223632812, "global_step": 643957, "epoch": 7758} {"train_loss": -28.055023193359375, "global_step": 643958, "epoch": 7758} {"train_loss": -28.128097534179688, "global_step": 643959, "epoch": 7758} {"train_loss": -28.777027130126953, "global_step": 643960, "epoch": 7758} {"train_loss": -28.4088077545166, "global_step": 643961, "epoch": 7758} {"train_loss": -28.502349853515625, "global_step": 643962, "epoch": 7758} {"train_loss": -28.6989803314209, "global_step": 643963, "epoch": 7758} {"train_loss": -28.565271377563477, "global_step": 643964, "epoch": 7758} {"train_loss": -28.66145133972168, "global_step": 643965, "epoch": 7758} {"train_loss": -28.25470542907715, "global_step": 643966, "epoch": 7758} {"train_loss": -28.512741088867188, "global_step": 643967, "epoch": 7758} {"train_loss": -28.27506446838379, "global_step": 643968, "epoch": 7758} {"train_loss": -28.685516357421875, "global_step": 643969, "epoch": 7758} {"train_loss": -28.207406997680664, "global_step": 643970, "epoch": 7758} {"train_loss": -28.4823055267334, "global_step": 643971, "epoch": 7758} {"train_loss": -27.90968894958496, "global_step": 643972, "epoch": 7758} {"train_loss": -28.177961349487305, "global_step": 643973, "epoch": 7758} {"train_loss": -28.25779151916504, "global_step": 643974, "epoch": 7758} {"train_loss": -28.273141860961914, "global_step": 643975, "epoch": 7758} {"train_loss": -28.124181747436523, "global_step": 643976, "epoch": 7758} {"train_loss": -28.426416397094727, "global_step": 643977, "epoch": 7758} {"train_loss": -27.989669799804688, "global_step": 643978, "epoch": 7758} {"train_loss": -28.561279296875, "global_step": 643979, "epoch": 7758} {"train_loss": -28.278486251831055, "global_step": 643980, "epoch": 7758} {"train_loss": -28.374958038330078, "global_step": 643981, "epoch": 7758} {"train_loss": -28.62409782409668, "global_step": 643982, "epoch": 7758} {"train_loss": -28.220233917236328, "global_step": 643983, "epoch": 7758} {"train_loss": -28.750295639038086, "global_step": 643984, "epoch": 7758} {"train_loss": -28.1949462890625, "global_step": 643985, "epoch": 7758} {"train_loss": -28.320905685424805, "global_step": 643986, "epoch": 7758} {"train_loss": -28.198537826538086, "global_step": 643987, "epoch": 7758} {"train_loss": -28.37529945373535, "global_step": 643988, "epoch": 7758} {"train_loss": -28.793119430541992, "global_step": 643989, "epoch": 7758} {"train_loss": -28.1464900970459, "global_step": 643990, "epoch": 7758} {"train_loss": -28.655065536499023, "global_step": 643991, "epoch": 7758} {"train_loss": -28.449689865112305, "global_step": 643992, "epoch": 7758} {"train_loss": -28.468677520751953, "global_step": 643993, "epoch": 7758} {"train_loss": -28.339374542236328, "global_step": 643994, "epoch": 7758} {"train_loss": -28.47054100036621, "global_step": 643995, "epoch": 7758} {"train_loss": -28.266279105680535, "global_step": 643996, "epoch": 7758, "val_loss": 6666578.0} {"train_loss": -28.38850212097168, "global_step": 643997, "epoch": 7759} {"train_loss": -27.922195434570312, "global_step": 643998, "epoch": 7759} {"train_loss": -28.36097526550293, "global_step": 643999, "epoch": 7759} {"train_loss": -28.002960205078125, "global_step": 644000, "epoch": 7759} {"train_loss": -28.08942985534668, "global_step": 644001, "epoch": 7759} {"train_loss": -28.0767765045166, "global_step": 644002, "epoch": 7759} {"train_loss": -27.967823028564453, "global_step": 644003, "epoch": 7759} {"train_loss": -27.91126823425293, "global_step": 644004, "epoch": 7759} {"train_loss": -28.36517333984375, "global_step": 644005, "epoch": 7759} {"train_loss": -28.165552139282227, "global_step": 644006, "epoch": 7759} {"train_loss": -27.97503662109375, "global_step": 644007, "epoch": 7759} {"train_loss": -27.36481285095215, "global_step": 644008, "epoch": 7759} {"train_loss": -28.180419921875, "global_step": 644009, "epoch": 7759} {"train_loss": -27.905527114868164, "global_step": 644010, "epoch": 7759} {"train_loss": -27.085290908813477, "global_step": 644011, "epoch": 7759} {"train_loss": -27.4488582611084, "global_step": 644012, "epoch": 7759} {"train_loss": -28.23062515258789, "global_step": 644013, "epoch": 7759} {"train_loss": -28.026813507080078, "global_step": 644014, "epoch": 7759} {"train_loss": -27.449756622314453, "global_step": 644015, "epoch": 7759} {"train_loss": -28.1510066986084, "global_step": 644016, "epoch": 7759} {"train_loss": -27.740222930908203, "global_step": 644017, "epoch": 7759} {"train_loss": -27.85698890686035, "global_step": 644018, "epoch": 7759} {"train_loss": -27.980100631713867, "global_step": 644019, "epoch": 7759} {"train_loss": -28.16229820251465, "global_step": 644020, "epoch": 7759} {"train_loss": -27.51564598083496, "global_step": 644021, "epoch": 7759} {"train_loss": -28.503599166870117, "global_step": 644022, "epoch": 7759} {"train_loss": -27.97552490234375, "global_step": 644023, "epoch": 7759} {"train_loss": -28.118139266967773, "global_step": 644024, "epoch": 7759} {"train_loss": -27.983579635620117, "global_step": 644025, "epoch": 7759} {"train_loss": -28.20672035217285, "global_step": 644026, "epoch": 7759} {"train_loss": -28.335006713867188, "global_step": 644027, "epoch": 7759} {"train_loss": -27.751317977905273, "global_step": 644028, "epoch": 7759} {"train_loss": -28.366703033447266, "global_step": 644029, "epoch": 7759} {"train_loss": -28.023061752319336, "global_step": 644030, "epoch": 7759} {"train_loss": -28.01153564453125, "global_step": 644031, "epoch": 7759} {"train_loss": -28.238245010375977, "global_step": 644032, "epoch": 7759} {"train_loss": -28.126951217651367, "global_step": 644033, "epoch": 7759} {"train_loss": -28.238393783569336, "global_step": 644034, "epoch": 7759} {"train_loss": -28.489105224609375, "global_step": 644035, "epoch": 7759} {"train_loss": -28.2806453704834, "global_step": 644036, "epoch": 7759} {"train_loss": -28.3138427734375, "global_step": 644037, "epoch": 7759} {"train_loss": -28.50105094909668, "global_step": 644038, "epoch": 7759} {"train_loss": -28.39446449279785, "global_step": 644039, "epoch": 7759} {"train_loss": -28.133237838745117, "global_step": 644040, "epoch": 7759} {"train_loss": -28.30213737487793, "global_step": 644041, "epoch": 7759} {"train_loss": -28.461164474487305, "global_step": 644042, "epoch": 7759} {"train_loss": -28.327301025390625, "global_step": 644043, "epoch": 7759} {"train_loss": -28.569257736206055, "global_step": 644044, "epoch": 7759} {"train_loss": -28.358198165893555, "global_step": 644045, "epoch": 7759} {"train_loss": -28.281274795532227, "global_step": 644046, "epoch": 7759} {"train_loss": -28.427108764648438, "global_step": 644047, "epoch": 7759} {"train_loss": -28.167219161987305, "global_step": 644048, "epoch": 7759} {"train_loss": -28.466840744018555, "global_step": 644049, "epoch": 7759} {"train_loss": -28.420324325561523, "global_step": 644050, "epoch": 7759} {"train_loss": -28.69437026977539, "global_step": 644051, "epoch": 7759} {"train_loss": -28.58477783203125, "global_step": 644052, "epoch": 7759} {"train_loss": -28.5786075592041, "global_step": 644053, "epoch": 7759} {"train_loss": -28.558349609375, "global_step": 644054, "epoch": 7759} {"train_loss": -28.43409538269043, "global_step": 644055, "epoch": 7759} {"train_loss": -28.48076820373535, "global_step": 644056, "epoch": 7759} {"train_loss": -28.527332305908203, "global_step": 644057, "epoch": 7759} {"train_loss": -28.396072387695312, "global_step": 644058, "epoch": 7759} {"train_loss": -28.23494529724121, "global_step": 644059, "epoch": 7759} {"train_loss": -28.70319175720215, "global_step": 644060, "epoch": 7759} {"train_loss": -28.103351593017578, "global_step": 644061, "epoch": 7759} {"train_loss": -28.381519317626953, "global_step": 644062, "epoch": 7759} {"train_loss": -28.537399291992188, "global_step": 644063, "epoch": 7759} {"train_loss": -28.230194091796875, "global_step": 644064, "epoch": 7759} {"train_loss": -27.963077545166016, "global_step": 644065, "epoch": 7759} {"train_loss": -28.0635986328125, "global_step": 644066, "epoch": 7759} {"train_loss": -27.957111358642578, "global_step": 644067, "epoch": 7759} {"train_loss": -28.78598403930664, "global_step": 644068, "epoch": 7759} {"train_loss": -28.619354248046875, "global_step": 644069, "epoch": 7759} {"train_loss": -28.103790283203125, "global_step": 644070, "epoch": 7759} {"train_loss": -28.1077938079834, "global_step": 644071, "epoch": 7759} {"train_loss": -27.811426162719727, "global_step": 644072, "epoch": 7759} {"train_loss": -27.798593521118164, "global_step": 644073, "epoch": 7759} {"train_loss": -28.174304962158203, "global_step": 644074, "epoch": 7759} {"train_loss": -28.29867935180664, "global_step": 644075, "epoch": 7759} {"train_loss": -28.16401481628418, "global_step": 644076, "epoch": 7759} {"train_loss": -28.23432731628418, "global_step": 644077, "epoch": 7759} {"train_loss": -28.070154190063477, "global_step": 644078, "epoch": 7759} {"train_loss": -28.193588509617083, "global_step": 644079, "epoch": 7759, "val_loss": 6644791.0} {"train_loss": -27.867528915405273, "global_step": 644080, "epoch": 7760} {"train_loss": -27.112539291381836, "global_step": 644081, "epoch": 7760} {"train_loss": -27.691274642944336, "global_step": 644082, "epoch": 7760} {"train_loss": -27.39397621154785, "global_step": 644083, "epoch": 7760} {"train_loss": -27.256820678710938, "global_step": 644084, "epoch": 7760} {"train_loss": -27.25189781188965, "global_step": 644085, "epoch": 7760} {"train_loss": -27.967742919921875, "global_step": 644086, "epoch": 7760} {"train_loss": -27.60663414001465, "global_step": 644087, "epoch": 7760} {"train_loss": -27.615222930908203, "global_step": 644088, "epoch": 7760} {"train_loss": -27.898757934570312, "global_step": 644089, "epoch": 7760} {"train_loss": -27.76445960998535, "global_step": 644090, "epoch": 7760} {"train_loss": -27.91952896118164, "global_step": 644091, "epoch": 7760} {"train_loss": -27.90835952758789, "global_step": 644092, "epoch": 7760} {"train_loss": -27.735563278198242, "global_step": 644093, "epoch": 7760} {"train_loss": -28.05475425720215, "global_step": 644094, "epoch": 7760} {"train_loss": -27.76059913635254, "global_step": 644095, "epoch": 7760} {"train_loss": -27.844690322875977, "global_step": 644096, "epoch": 7760} {"train_loss": -28.22378921508789, "global_step": 644097, "epoch": 7760} {"train_loss": -28.08131980895996, "global_step": 644098, "epoch": 7760} {"train_loss": -28.076095581054688, "global_step": 644099, "epoch": 7760} {"train_loss": -28.315750122070312, "global_step": 644100, "epoch": 7760} {"train_loss": -28.114057540893555, "global_step": 644101, "epoch": 7760} {"train_loss": -28.01106834411621, "global_step": 644102, "epoch": 7760} {"train_loss": -28.344745635986328, "global_step": 644103, "epoch": 7760} {"train_loss": -28.025379180908203, "global_step": 644104, "epoch": 7760} {"train_loss": -28.309131622314453, "global_step": 644105, "epoch": 7760} {"train_loss": -28.2459716796875, "global_step": 644106, "epoch": 7760} {"train_loss": -28.30950355529785, "global_step": 644107, "epoch": 7760} {"train_loss": -28.23737907409668, "global_step": 644108, "epoch": 7760} {"train_loss": -28.54084587097168, "global_step": 644109, "epoch": 7760} {"train_loss": -28.68195152282715, "global_step": 644110, "epoch": 7760} {"train_loss": -28.77031898498535, "global_step": 644111, "epoch": 7760} {"train_loss": -28.168277740478516, "global_step": 644112, "epoch": 7760} {"train_loss": -27.88226318359375, "global_step": 644113, "epoch": 7760} {"train_loss": -28.32965660095215, "global_step": 644114, "epoch": 7760} {"train_loss": -28.185495376586914, "global_step": 644115, "epoch": 7760} {"train_loss": -28.293928146362305, "global_step": 644116, "epoch": 7760} {"train_loss": -28.308273315429688, "global_step": 644117, "epoch": 7760} {"train_loss": -28.434301376342773, "global_step": 644118, "epoch": 7760} {"train_loss": -28.445356369018555, "global_step": 644119, "epoch": 7760} {"train_loss": -27.920507431030273, "global_step": 644120, "epoch": 7760} {"train_loss": -28.080371856689453, "global_step": 644121, "epoch": 7760} {"train_loss": -28.646753311157227, "global_step": 644122, "epoch": 7760} {"train_loss": -28.293262481689453, "global_step": 644123, "epoch": 7760} {"train_loss": -28.69718360900879, "global_step": 644124, "epoch": 7760} {"train_loss": -28.488006591796875, "global_step": 644125, "epoch": 7760} {"train_loss": -28.262304306030273, "global_step": 644126, "epoch": 7760} {"train_loss": -28.5155086517334, "global_step": 644127, "epoch": 7760} {"train_loss": -28.24269676208496, "global_step": 644128, "epoch": 7760} {"train_loss": -28.30201530456543, "global_step": 644129, "epoch": 7760} {"train_loss": -28.411823272705078, "global_step": 644130, "epoch": 7760} {"train_loss": -28.217117309570312, "global_step": 644131, "epoch": 7760} {"train_loss": -28.349430084228516, "global_step": 644132, "epoch": 7760} {"train_loss": -28.44704246520996, "global_step": 644133, "epoch": 7760} {"train_loss": -28.52263832092285, "global_step": 644134, "epoch": 7760} {"train_loss": -28.629348754882812, "global_step": 644135, "epoch": 7760} {"train_loss": -28.40106773376465, "global_step": 644136, "epoch": 7760} {"train_loss": -27.857227325439453, "global_step": 644137, "epoch": 7760} {"train_loss": -28.385868072509766, "global_step": 644138, "epoch": 7760} {"train_loss": -28.06292152404785, "global_step": 644139, "epoch": 7760} {"train_loss": -27.911767959594727, "global_step": 644140, "epoch": 7760} {"train_loss": -28.33112907409668, "global_step": 644141, "epoch": 7760} {"train_loss": -28.020313262939453, "global_step": 644142, "epoch": 7760} {"train_loss": -27.984128952026367, "global_step": 644143, "epoch": 7760} {"train_loss": -28.462682723999023, "global_step": 644144, "epoch": 7760} {"train_loss": -28.33597183227539, "global_step": 644145, "epoch": 7760} {"train_loss": -27.4877872467041, "global_step": 644146, "epoch": 7760} {"train_loss": -27.83070182800293, "global_step": 644147, "epoch": 7760} {"train_loss": -28.279016494750977, "global_step": 644148, "epoch": 7760} {"train_loss": -28.082096099853516, "global_step": 644149, "epoch": 7760} {"train_loss": -28.239471435546875, "global_step": 644150, "epoch": 7760} {"train_loss": -28.0408992767334, "global_step": 644151, "epoch": 7760} {"train_loss": -27.92498779296875, "global_step": 644152, "epoch": 7760} {"train_loss": -28.12674903869629, "global_step": 644153, "epoch": 7760} {"train_loss": -27.786649703979492, "global_step": 644154, "epoch": 7760} {"train_loss": -28.30909538269043, "global_step": 644155, "epoch": 7760} {"train_loss": -28.154468536376953, "global_step": 644156, "epoch": 7760} {"train_loss": -28.0699405670166, "global_step": 644157, "epoch": 7760} {"train_loss": -27.80487060546875, "global_step": 644158, "epoch": 7760} {"train_loss": -28.353307723999023, "global_step": 644159, "epoch": 7760} {"train_loss": -28.81687355041504, "global_step": 644160, "epoch": 7760} {"train_loss": -28.341291427612305, "global_step": 644161, "epoch": 7760} {"train_loss": -28.148305755063713, "global_step": 644162, "epoch": 7760, "val_loss": 6618488.0} {"train_loss": -25.999547958374023, "global_step": 644163, "epoch": 7761} {"train_loss": -25.001148223876953, "global_step": 644164, "epoch": 7761} {"train_loss": -25.897174835205078, "global_step": 644165, "epoch": 7761} {"train_loss": -27.014892578125, "global_step": 644166, "epoch": 7761} {"train_loss": -25.6760196685791, "global_step": 644167, "epoch": 7761} {"train_loss": -27.00641441345215, "global_step": 644168, "epoch": 7761} {"train_loss": -25.69586753845215, "global_step": 644169, "epoch": 7761} {"train_loss": -27.3402099609375, "global_step": 644170, "epoch": 7761} {"train_loss": -26.497974395751953, "global_step": 644171, "epoch": 7761} {"train_loss": -27.159957885742188, "global_step": 644172, "epoch": 7761} {"train_loss": -26.3137264251709, "global_step": 644173, "epoch": 7761} {"train_loss": -27.26169776916504, "global_step": 644174, "epoch": 7761} {"train_loss": -27.319116592407227, "global_step": 644175, "epoch": 7761} {"train_loss": -27.45694351196289, "global_step": 644176, "epoch": 7761} {"train_loss": -27.463415145874023, "global_step": 644177, "epoch": 7761} {"train_loss": -27.160669326782227, "global_step": 644178, "epoch": 7761} {"train_loss": -27.433256149291992, "global_step": 644179, "epoch": 7761} {"train_loss": -27.672012329101562, "global_step": 644180, "epoch": 7761} {"train_loss": -27.386688232421875, "global_step": 644181, "epoch": 7761} {"train_loss": -27.46002197265625, "global_step": 644182, "epoch": 7761} {"train_loss": -27.55586051940918, "global_step": 644183, "epoch": 7761} {"train_loss": -27.75629997253418, "global_step": 644184, "epoch": 7761} {"train_loss": -27.250524520874023, "global_step": 644185, "epoch": 7761} {"train_loss": -27.545373916625977, "global_step": 644186, "epoch": 7761} {"train_loss": -28.108991622924805, "global_step": 644187, "epoch": 7761} {"train_loss": -27.558347702026367, "global_step": 644188, "epoch": 7761} {"train_loss": -27.771209716796875, "global_step": 644189, "epoch": 7761} {"train_loss": -28.19471549987793, "global_step": 644190, "epoch": 7761} {"train_loss": -27.794286727905273, "global_step": 644191, "epoch": 7761} {"train_loss": -27.89664649963379, "global_step": 644192, "epoch": 7761} {"train_loss": -28.0308780670166, "global_step": 644193, "epoch": 7761} {"train_loss": -27.845563888549805, "global_step": 644194, "epoch": 7761} {"train_loss": -27.9301700592041, "global_step": 644195, "epoch": 7761} {"train_loss": -28.0335693359375, "global_step": 644196, "epoch": 7761} {"train_loss": -27.837005615234375, "global_step": 644197, "epoch": 7761} {"train_loss": -28.066940307617188, "global_step": 644198, "epoch": 7761} {"train_loss": -27.989423751831055, "global_step": 644199, "epoch": 7761} {"train_loss": -28.12228775024414, "global_step": 644200, "epoch": 7761} {"train_loss": -28.137357711791992, "global_step": 644201, "epoch": 7761} {"train_loss": -28.43356704711914, "global_step": 644202, "epoch": 7761} {"train_loss": -28.127670288085938, "global_step": 644203, "epoch": 7761} {"train_loss": -28.142990112304688, "global_step": 644204, "epoch": 7761} {"train_loss": -28.326318740844727, "global_step": 644205, "epoch": 7761} {"train_loss": -28.421350479125977, "global_step": 644206, "epoch": 7761} {"train_loss": -28.33841323852539, "global_step": 644207, "epoch": 7761} {"train_loss": -28.517562866210938, "global_step": 644208, "epoch": 7761} {"train_loss": -28.46748161315918, "global_step": 644209, "epoch": 7761} {"train_loss": -28.441558837890625, "global_step": 644210, "epoch": 7761} {"train_loss": -28.449216842651367, "global_step": 644211, "epoch": 7761} {"train_loss": -28.416223526000977, "global_step": 644212, "epoch": 7761} {"train_loss": -28.352203369140625, "global_step": 644213, "epoch": 7761} {"train_loss": -28.3824405670166, "global_step": 644214, "epoch": 7761} {"train_loss": -28.30299949645996, "global_step": 644215, "epoch": 7761} {"train_loss": -28.55828285217285, "global_step": 644216, "epoch": 7761} {"train_loss": -28.46953773498535, "global_step": 644217, "epoch": 7761} {"train_loss": -28.42340087890625, "global_step": 644218, "epoch": 7761} {"train_loss": -28.407751083374023, "global_step": 644219, "epoch": 7761} {"train_loss": -28.433094024658203, "global_step": 644220, "epoch": 7761} {"train_loss": -28.187744140625, "global_step": 644221, "epoch": 7761} {"train_loss": -27.848520278930664, "global_step": 644222, "epoch": 7761} {"train_loss": -27.498199462890625, "global_step": 644223, "epoch": 7761} {"train_loss": -27.910184860229492, "global_step": 644224, "epoch": 7761} {"train_loss": -28.6121883392334, "global_step": 644225, "epoch": 7761} {"train_loss": -28.4073543548584, "global_step": 644226, "epoch": 7761} {"train_loss": -28.196455001831055, "global_step": 644227, "epoch": 7761} {"train_loss": -28.111608505249023, "global_step": 644228, "epoch": 7761} {"train_loss": -28.482269287109375, "global_step": 644229, "epoch": 7761} {"train_loss": -28.444904327392578, "global_step": 644230, "epoch": 7761} {"train_loss": -28.752578735351562, "global_step": 644231, "epoch": 7761} {"train_loss": -28.605146408081055, "global_step": 644232, "epoch": 7761} {"train_loss": -28.5253963470459, "global_step": 644233, "epoch": 7761} {"train_loss": -28.511579513549805, "global_step": 644234, "epoch": 7761} {"train_loss": -28.73320960998535, "global_step": 644235, "epoch": 7761} {"train_loss": -28.278675079345703, "global_step": 644236, "epoch": 7761} {"train_loss": -28.35044288635254, "global_step": 644237, "epoch": 7761} {"train_loss": -28.313674926757812, "global_step": 644238, "epoch": 7761} {"train_loss": -28.325927734375, "global_step": 644239, "epoch": 7761} {"train_loss": -28.088193893432617, "global_step": 644240, "epoch": 7761} {"train_loss": -28.196420669555664, "global_step": 644241, "epoch": 7761} {"train_loss": -28.165571212768555, "global_step": 644242, "epoch": 7761} {"train_loss": -28.255300521850586, "global_step": 644243, "epoch": 7761} {"train_loss": -28.525365829467773, "global_step": 644244, "epoch": 7761} {"train_loss": -27.86567366266825, "global_step": 644245, "epoch": 7761, "val_loss": 6659733.0} {"train_loss": -27.089746475219727, "global_step": 644246, "epoch": 7762} {"train_loss": -27.602344512939453, "global_step": 644247, "epoch": 7762} {"train_loss": -27.93206214904785, "global_step": 644248, "epoch": 7762} {"train_loss": -27.276052474975586, "global_step": 644249, "epoch": 7762} {"train_loss": -27.535078048706055, "global_step": 644250, "epoch": 7762} {"train_loss": -27.945676803588867, "global_step": 644251, "epoch": 7762} {"train_loss": -27.47511100769043, "global_step": 644252, "epoch": 7762} {"train_loss": -27.98899269104004, "global_step": 644253, "epoch": 7762} {"train_loss": -27.81000328063965, "global_step": 644254, "epoch": 7762} {"train_loss": -27.909503936767578, "global_step": 644255, "epoch": 7762} {"train_loss": -27.987878799438477, "global_step": 644256, "epoch": 7762} {"train_loss": -28.023406982421875, "global_step": 644257, "epoch": 7762} {"train_loss": -28.16721534729004, "global_step": 644258, "epoch": 7762} {"train_loss": -27.67048454284668, "global_step": 644259, "epoch": 7762} {"train_loss": -28.07539939880371, "global_step": 644260, "epoch": 7762} {"train_loss": -27.723251342773438, "global_step": 644261, "epoch": 7762} {"train_loss": -28.26679801940918, "global_step": 644262, "epoch": 7762} {"train_loss": -27.764326095581055, "global_step": 644263, "epoch": 7762} {"train_loss": -27.93361473083496, "global_step": 644264, "epoch": 7762} {"train_loss": -27.863983154296875, "global_step": 644265, "epoch": 7762} {"train_loss": -27.618677139282227, "global_step": 644266, "epoch": 7762} {"train_loss": -28.07391929626465, "global_step": 644267, "epoch": 7762} {"train_loss": -27.903762817382812, "global_step": 644268, "epoch": 7762} {"train_loss": -28.053998947143555, "global_step": 644269, "epoch": 7762} {"train_loss": -28.143203735351562, "global_step": 644270, "epoch": 7762} {"train_loss": -28.4494686126709, "global_step": 644271, "epoch": 7762} {"train_loss": -27.843564987182617, "global_step": 644272, "epoch": 7762} {"train_loss": -28.127765655517578, "global_step": 644273, "epoch": 7762} {"train_loss": -28.261947631835938, "global_step": 644274, "epoch": 7762} {"train_loss": -28.345111846923828, "global_step": 644275, "epoch": 7762} {"train_loss": -28.567541122436523, "global_step": 644276, "epoch": 7762} {"train_loss": -27.995397567749023, "global_step": 644277, "epoch": 7762} {"train_loss": -28.155017852783203, "global_step": 644278, "epoch": 7762} {"train_loss": -27.971134185791016, "global_step": 644279, "epoch": 7762} {"train_loss": -28.19585609436035, "global_step": 644280, "epoch": 7762} {"train_loss": -28.526784896850586, "global_step": 644281, "epoch": 7762} {"train_loss": -28.40315055847168, "global_step": 644282, "epoch": 7762} {"train_loss": -28.293903350830078, "global_step": 644283, "epoch": 7762} {"train_loss": -28.384008407592773, "global_step": 644284, "epoch": 7762} {"train_loss": -27.97696304321289, "global_step": 644285, "epoch": 7762} {"train_loss": -28.115270614624023, "global_step": 644286, "epoch": 7762} {"train_loss": -28.272329330444336, "global_step": 644287, "epoch": 7762} {"train_loss": -27.835376739501953, "global_step": 644288, "epoch": 7762} {"train_loss": -28.38337516784668, "global_step": 644289, "epoch": 7762} {"train_loss": -28.313711166381836, "global_step": 644290, "epoch": 7762} {"train_loss": -28.130414962768555, "global_step": 644291, "epoch": 7762} {"train_loss": -28.3350830078125, "global_step": 644292, "epoch": 7762} {"train_loss": -28.352392196655273, "global_step": 644293, "epoch": 7762} {"train_loss": -28.442493438720703, "global_step": 644294, "epoch": 7762} {"train_loss": -28.605199813842773, "global_step": 644295, "epoch": 7762} {"train_loss": -28.17026138305664, "global_step": 644296, "epoch": 7762} {"train_loss": -28.19038963317871, "global_step": 644297, "epoch": 7762} {"train_loss": -28.125268936157227, "global_step": 644298, "epoch": 7762} {"train_loss": -28.69282341003418, "global_step": 644299, "epoch": 7762} {"train_loss": -28.659408569335938, "global_step": 644300, "epoch": 7762} {"train_loss": -28.26766014099121, "global_step": 644301, "epoch": 7762} {"train_loss": -28.56388282775879, "global_step": 644302, "epoch": 7762} {"train_loss": -28.710372924804688, "global_step": 644303, "epoch": 7762} {"train_loss": -28.68433952331543, "global_step": 644304, "epoch": 7762} {"train_loss": -28.633319854736328, "global_step": 644305, "epoch": 7762} {"train_loss": -28.299503326416016, "global_step": 644306, "epoch": 7762} {"train_loss": -28.598432540893555, "global_step": 644307, "epoch": 7762} {"train_loss": -28.581771850585938, "global_step": 644308, "epoch": 7762} {"train_loss": -28.58115005493164, "global_step": 644309, "epoch": 7762} {"train_loss": -28.60076904296875, "global_step": 644310, "epoch": 7762} {"train_loss": -28.56621742248535, "global_step": 644311, "epoch": 7762} {"train_loss": -28.650226593017578, "global_step": 644312, "epoch": 7762} {"train_loss": -28.604660034179688, "global_step": 644313, "epoch": 7762} {"train_loss": -28.296981811523438, "global_step": 644314, "epoch": 7762} {"train_loss": -28.2276554107666, "global_step": 644315, "epoch": 7762} {"train_loss": -27.843402862548828, "global_step": 644316, "epoch": 7762} {"train_loss": -28.300153732299805, "global_step": 644317, "epoch": 7762} {"train_loss": -27.758045196533203, "global_step": 644318, "epoch": 7762} {"train_loss": -27.81519889831543, "global_step": 644319, "epoch": 7762} {"train_loss": -28.078657150268555, "global_step": 644320, "epoch": 7762} {"train_loss": -28.09621238708496, "global_step": 644321, "epoch": 7762} {"train_loss": -28.456247329711914, "global_step": 644322, "epoch": 7762} {"train_loss": -28.55667495727539, "global_step": 644323, "epoch": 7762} {"train_loss": -27.871002197265625, "global_step": 644324, "epoch": 7762} {"train_loss": -27.946924209594727, "global_step": 644325, "epoch": 7762} {"train_loss": -28.3906192779541, "global_step": 644326, "epoch": 7762} {"train_loss": -28.257720947265625, "global_step": 644327, "epoch": 7762} {"train_loss": -28.170960989343115, "global_step": 644328, "epoch": 7762, "val_loss": 6593110.0} {"train_loss": -26.627927780151367, "global_step": 644329, "epoch": 7763} {"train_loss": -26.51474952697754, "global_step": 644330, "epoch": 7763} {"train_loss": -26.951597213745117, "global_step": 644331, "epoch": 7763} {"train_loss": -25.839059829711914, "global_step": 644332, "epoch": 7763} {"train_loss": -26.96408462524414, "global_step": 644333, "epoch": 7763} {"train_loss": -26.305938720703125, "global_step": 644334, "epoch": 7763} {"train_loss": -26.843290328979492, "global_step": 644335, "epoch": 7763} {"train_loss": -26.53340721130371, "global_step": 644336, "epoch": 7763} {"train_loss": -27.30417823791504, "global_step": 644337, "epoch": 7763} {"train_loss": -27.4716854095459, "global_step": 644338, "epoch": 7763} {"train_loss": -26.66594886779785, "global_step": 644339, "epoch": 7763} {"train_loss": -27.515380859375, "global_step": 644340, "epoch": 7763} {"train_loss": -27.459503173828125, "global_step": 644341, "epoch": 7763} {"train_loss": -27.668256759643555, "global_step": 644342, "epoch": 7763} {"train_loss": -27.72135353088379, "global_step": 644343, "epoch": 7763} {"train_loss": -27.9799861907959, "global_step": 644344, "epoch": 7763} {"train_loss": -27.584308624267578, "global_step": 644345, "epoch": 7763} {"train_loss": -27.716144561767578, "global_step": 644346, "epoch": 7763} {"train_loss": -27.785497665405273, "global_step": 644347, "epoch": 7763} {"train_loss": -27.96551513671875, "global_step": 644348, "epoch": 7763} {"train_loss": -27.731847763061523, "global_step": 644349, "epoch": 7763} {"train_loss": -27.677021026611328, "global_step": 644350, "epoch": 7763} {"train_loss": -28.1335391998291, "global_step": 644351, "epoch": 7763} {"train_loss": -28.219894409179688, "global_step": 644352, "epoch": 7763} {"train_loss": -27.908185958862305, "global_step": 644353, "epoch": 7763} {"train_loss": -28.035797119140625, "global_step": 644354, "epoch": 7763} {"train_loss": -28.154926300048828, "global_step": 644355, "epoch": 7763} {"train_loss": -27.992013931274414, "global_step": 644356, "epoch": 7763} {"train_loss": -27.991992950439453, "global_step": 644357, "epoch": 7763} {"train_loss": -28.18194580078125, "global_step": 644358, "epoch": 7763} {"train_loss": -27.75958251953125, "global_step": 644359, "epoch": 7763} {"train_loss": -28.135461807250977, "global_step": 644360, "epoch": 7763} {"train_loss": -28.51025390625, "global_step": 644361, "epoch": 7763} {"train_loss": -27.922693252563477, "global_step": 644362, "epoch": 7763} {"train_loss": -28.37158203125, "global_step": 644363, "epoch": 7763} {"train_loss": -28.24297523498535, "global_step": 644364, "epoch": 7763} {"train_loss": -28.411985397338867, "global_step": 644365, "epoch": 7763} {"train_loss": -28.439844131469727, "global_step": 644366, "epoch": 7763} {"train_loss": -28.357263565063477, "global_step": 644367, "epoch": 7763} {"train_loss": -28.021764755249023, "global_step": 644368, "epoch": 7763} {"train_loss": -27.957172393798828, "global_step": 644369, "epoch": 7763} {"train_loss": -28.15382194519043, "global_step": 644370, "epoch": 7763} {"train_loss": -28.275190353393555, "global_step": 644371, "epoch": 7763} {"train_loss": -28.421247482299805, "global_step": 644372, "epoch": 7763} {"train_loss": -28.54166030883789, "global_step": 644373, "epoch": 7763} {"train_loss": -28.3437442779541, "global_step": 644374, "epoch": 7763} {"train_loss": -28.624969482421875, "global_step": 644375, "epoch": 7763} {"train_loss": -28.17328453063965, "global_step": 644376, "epoch": 7763} {"train_loss": -28.27166748046875, "global_step": 644377, "epoch": 7763} {"train_loss": -28.23613929748535, "global_step": 644378, "epoch": 7763} {"train_loss": -28.026187896728516, "global_step": 644379, "epoch": 7763} {"train_loss": -28.01885986328125, "global_step": 644380, "epoch": 7763} {"train_loss": -28.044189453125, "global_step": 644381, "epoch": 7763} {"train_loss": -28.38427734375, "global_step": 644382, "epoch": 7763} {"train_loss": -28.439926147460938, "global_step": 644383, "epoch": 7763} {"train_loss": -28.23541259765625, "global_step": 644384, "epoch": 7763} {"train_loss": -28.293853759765625, "global_step": 644385, "epoch": 7763} {"train_loss": -28.346364974975586, "global_step": 644386, "epoch": 7763} {"train_loss": -28.64112663269043, "global_step": 644387, "epoch": 7763} {"train_loss": -28.7019100189209, "global_step": 644388, "epoch": 7763} {"train_loss": -28.669775009155273, "global_step": 644389, "epoch": 7763} {"train_loss": -28.627485275268555, "global_step": 644390, "epoch": 7763} {"train_loss": -27.958585739135742, "global_step": 644391, "epoch": 7763} {"train_loss": -28.68757438659668, "global_step": 644392, "epoch": 7763} {"train_loss": -28.420074462890625, "global_step": 644393, "epoch": 7763} {"train_loss": -28.179487228393555, "global_step": 644394, "epoch": 7763} {"train_loss": -28.32343864440918, "global_step": 644395, "epoch": 7763} {"train_loss": -28.672597885131836, "global_step": 644396, "epoch": 7763} {"train_loss": -28.099130630493164, "global_step": 644397, "epoch": 7763} {"train_loss": -28.46377944946289, "global_step": 644398, "epoch": 7763} {"train_loss": -28.348926544189453, "global_step": 644399, "epoch": 7763} {"train_loss": -28.621173858642578, "global_step": 644400, "epoch": 7763} {"train_loss": -28.21506118774414, "global_step": 644401, "epoch": 7763} {"train_loss": -28.36394691467285, "global_step": 644402, "epoch": 7763} {"train_loss": -28.494176864624023, "global_step": 644403, "epoch": 7763} {"train_loss": -28.129621505737305, "global_step": 644404, "epoch": 7763} {"train_loss": -28.731353759765625, "global_step": 644405, "epoch": 7763} {"train_loss": -28.08502769470215, "global_step": 644406, "epoch": 7763} {"train_loss": -28.17620849609375, "global_step": 644407, "epoch": 7763} {"train_loss": -28.335235595703125, "global_step": 644408, "epoch": 7763} {"train_loss": -28.299560546875, "global_step": 644409, "epoch": 7763} {"train_loss": -28.098630905151367, "global_step": 644410, "epoch": 7763} {"train_loss": -28.023129359785333, "global_step": 644411, "epoch": 7763, "val_loss": 6677926.5} {"train_loss": -28.19416618347168, "global_step": 644412, "epoch": 7764} {"train_loss": -27.3555908203125, "global_step": 644413, "epoch": 7764} {"train_loss": -27.85576820373535, "global_step": 644414, "epoch": 7764} {"train_loss": -27.475360870361328, "global_step": 644415, "epoch": 7764} {"train_loss": -27.43584632873535, "global_step": 644416, "epoch": 7764} {"train_loss": -27.425403594970703, "global_step": 644417, "epoch": 7764} {"train_loss": -27.77154541015625, "global_step": 644418, "epoch": 7764} {"train_loss": -27.803369522094727, "global_step": 644419, "epoch": 7764} {"train_loss": -28.51163101196289, "global_step": 644420, "epoch": 7764} {"train_loss": -27.745397567749023, "global_step": 644421, "epoch": 7764} {"train_loss": -27.870691299438477, "global_step": 644422, "epoch": 7764} {"train_loss": -28.225208282470703, "global_step": 644423, "epoch": 7764} {"train_loss": -27.7294921875, "global_step": 644424, "epoch": 7764} {"train_loss": -28.163516998291016, "global_step": 644425, "epoch": 7764} {"train_loss": -28.172332763671875, "global_step": 644426, "epoch": 7764} {"train_loss": -28.146839141845703, "global_step": 644427, "epoch": 7764} {"train_loss": -28.052915573120117, "global_step": 644428, "epoch": 7764} {"train_loss": -28.212757110595703, "global_step": 644429, "epoch": 7764} {"train_loss": -28.103534698486328, "global_step": 644430, "epoch": 7764} {"train_loss": -28.133743286132812, "global_step": 644431, "epoch": 7764} {"train_loss": -28.39961051940918, "global_step": 644432, "epoch": 7764} {"train_loss": -28.1956844329834, "global_step": 644433, "epoch": 7764} {"train_loss": -28.31672477722168, "global_step": 644434, "epoch": 7764} {"train_loss": -28.51861000061035, "global_step": 644435, "epoch": 7764} {"train_loss": -28.319107055664062, "global_step": 644436, "epoch": 7764} {"train_loss": -28.423208236694336, "global_step": 644437, "epoch": 7764} {"train_loss": -28.280019760131836, "global_step": 644438, "epoch": 7764} {"train_loss": -28.430418014526367, "global_step": 644439, "epoch": 7764} {"train_loss": -28.127349853515625, "global_step": 644440, "epoch": 7764} {"train_loss": -28.326858520507812, "global_step": 644441, "epoch": 7764} {"train_loss": -28.239301681518555, "global_step": 644442, "epoch": 7764} {"train_loss": -28.277313232421875, "global_step": 644443, "epoch": 7764} {"train_loss": -28.036481857299805, "global_step": 644444, "epoch": 7764} {"train_loss": -28.424604415893555, "global_step": 644445, "epoch": 7764} {"train_loss": -28.246740341186523, "global_step": 644446, "epoch": 7764} {"train_loss": -28.111478805541992, "global_step": 644447, "epoch": 7764} {"train_loss": -28.077472686767578, "global_step": 644448, "epoch": 7764} {"train_loss": -28.47327995300293, "global_step": 644449, "epoch": 7764} {"train_loss": -27.74433708190918, "global_step": 644450, "epoch": 7764} {"train_loss": -28.073205947875977, "global_step": 644451, "epoch": 7764} {"train_loss": -28.082056045532227, "global_step": 644452, "epoch": 7764} {"train_loss": -28.23671531677246, "global_step": 644453, "epoch": 7764} {"train_loss": -27.865514755249023, "global_step": 644454, "epoch": 7764} {"train_loss": -27.845983505249023, "global_step": 644455, "epoch": 7764} {"train_loss": -27.099842071533203, "global_step": 644456, "epoch": 7764} {"train_loss": -26.765241622924805, "global_step": 644457, "epoch": 7764} {"train_loss": -27.84230613708496, "global_step": 644458, "epoch": 7764} {"train_loss": -28.2274227142334, "global_step": 644459, "epoch": 7764} {"train_loss": -27.077960968017578, "global_step": 644460, "epoch": 7764} {"train_loss": -28.093896865844727, "global_step": 644461, "epoch": 7764} {"train_loss": -27.56501579284668, "global_step": 644462, "epoch": 7764} {"train_loss": -27.972736358642578, "global_step": 644463, "epoch": 7764} {"train_loss": -27.851022720336914, "global_step": 644464, "epoch": 7764} {"train_loss": -27.958362579345703, "global_step": 644465, "epoch": 7764} {"train_loss": -27.902257919311523, "global_step": 644466, "epoch": 7764} {"train_loss": -28.141422271728516, "global_step": 644467, "epoch": 7764} {"train_loss": -28.02131462097168, "global_step": 644468, "epoch": 7764} {"train_loss": -27.711639404296875, "global_step": 644469, "epoch": 7764} {"train_loss": -27.948944091796875, "global_step": 644470, "epoch": 7764} {"train_loss": -28.2578067779541, "global_step": 644471, "epoch": 7764} {"train_loss": -27.854467391967773, "global_step": 644472, "epoch": 7764} {"train_loss": -28.165868759155273, "global_step": 644473, "epoch": 7764} {"train_loss": -27.714588165283203, "global_step": 644474, "epoch": 7764} {"train_loss": -28.192296981811523, "global_step": 644475, "epoch": 7764} {"train_loss": -27.983047485351562, "global_step": 644476, "epoch": 7764} {"train_loss": -28.107177734375, "global_step": 644477, "epoch": 7764} {"train_loss": -27.898263931274414, "global_step": 644478, "epoch": 7764} {"train_loss": -28.456409454345703, "global_step": 644479, "epoch": 7764} {"train_loss": -27.986169815063477, "global_step": 644480, "epoch": 7764} {"train_loss": -27.86322021484375, "global_step": 644481, "epoch": 7764} {"train_loss": -27.891672134399414, "global_step": 644482, "epoch": 7764} {"train_loss": -28.1547794342041, "global_step": 644483, "epoch": 7764} {"train_loss": -28.618234634399414, "global_step": 644484, "epoch": 7764} {"train_loss": -28.29506492614746, "global_step": 644485, "epoch": 7764} {"train_loss": -28.214269638061523, "global_step": 644486, "epoch": 7764} {"train_loss": -28.461721420288086, "global_step": 644487, "epoch": 7764} {"train_loss": -28.340795516967773, "global_step": 644488, "epoch": 7764} {"train_loss": -28.259912490844727, "global_step": 644489, "epoch": 7764} {"train_loss": -28.33912467956543, "global_step": 644490, "epoch": 7764} {"train_loss": -28.707700729370117, "global_step": 644491, "epoch": 7764} {"train_loss": -28.30154800415039, "global_step": 644492, "epoch": 7764} {"train_loss": -28.196496963500977, "global_step": 644493, "epoch": 7764} {"train_loss": -28.03885841369629, "global_step": 644494, "epoch": 7764, "val_loss": 6622222.0} {"train_loss": -27.743009567260742, "global_step": 644495, "epoch": 7765} {"train_loss": -28.107839584350586, "global_step": 644496, "epoch": 7765} {"train_loss": -28.120275497436523, "global_step": 644497, "epoch": 7765} {"train_loss": -28.092376708984375, "global_step": 644498, "epoch": 7765} {"train_loss": -27.982595443725586, "global_step": 644499, "epoch": 7765} {"train_loss": -28.415571212768555, "global_step": 644500, "epoch": 7765} {"train_loss": -28.5476016998291, "global_step": 644501, "epoch": 7765} {"train_loss": -28.384199142456055, "global_step": 644502, "epoch": 7765} {"train_loss": -27.97210121154785, "global_step": 644503, "epoch": 7765} {"train_loss": -28.34324073791504, "global_step": 644504, "epoch": 7765} {"train_loss": -28.32038688659668, "global_step": 644505, "epoch": 7765} {"train_loss": -28.117895126342773, "global_step": 644506, "epoch": 7765} {"train_loss": -27.862634658813477, "global_step": 644507, "epoch": 7765} {"train_loss": -27.3621883392334, "global_step": 644508, "epoch": 7765} {"train_loss": -27.766447067260742, "global_step": 644509, "epoch": 7765} {"train_loss": -27.840641021728516, "global_step": 644510, "epoch": 7765} {"train_loss": -28.012495040893555, "global_step": 644511, "epoch": 7765} {"train_loss": -27.29729652404785, "global_step": 644512, "epoch": 7765} {"train_loss": -27.893314361572266, "global_step": 644513, "epoch": 7765} {"train_loss": -28.101911544799805, "global_step": 644514, "epoch": 7765} {"train_loss": -27.81263542175293, "global_step": 644515, "epoch": 7765} {"train_loss": -28.06227684020996, "global_step": 644516, "epoch": 7765} {"train_loss": -28.2761173248291, "global_step": 644517, "epoch": 7765} {"train_loss": -27.95440673828125, "global_step": 644518, "epoch": 7765} {"train_loss": -27.831613540649414, "global_step": 644519, "epoch": 7765} {"train_loss": -28.188772201538086, "global_step": 644520, "epoch": 7765} {"train_loss": -27.857196807861328, "global_step": 644521, "epoch": 7765} {"train_loss": -27.69906997680664, "global_step": 644522, "epoch": 7765} {"train_loss": -28.232574462890625, "global_step": 644523, "epoch": 7765} {"train_loss": -28.32673454284668, "global_step": 644524, "epoch": 7765} {"train_loss": -27.92511558532715, "global_step": 644525, "epoch": 7765} {"train_loss": -27.94144058227539, "global_step": 644526, "epoch": 7765} {"train_loss": -28.280853271484375, "global_step": 644527, "epoch": 7765} {"train_loss": -27.95947265625, "global_step": 644528, "epoch": 7765} {"train_loss": -28.211591720581055, "global_step": 644529, "epoch": 7765} {"train_loss": -28.509994506835938, "global_step": 644530, "epoch": 7765} {"train_loss": -27.914045333862305, "global_step": 644531, "epoch": 7765} {"train_loss": -28.150741577148438, "global_step": 644532, "epoch": 7765} {"train_loss": -28.372766494750977, "global_step": 644533, "epoch": 7765} {"train_loss": -28.03834342956543, "global_step": 644534, "epoch": 7765} {"train_loss": -28.426462173461914, "global_step": 644535, "epoch": 7765} {"train_loss": -28.159116744995117, "global_step": 644536, "epoch": 7765} {"train_loss": -28.590871810913086, "global_step": 644537, "epoch": 7765} {"train_loss": -28.325305938720703, "global_step": 644538, "epoch": 7765} {"train_loss": -28.193927764892578, "global_step": 644539, "epoch": 7765} {"train_loss": -28.385583877563477, "global_step": 644540, "epoch": 7765} {"train_loss": -28.37470817565918, "global_step": 644541, "epoch": 7765} {"train_loss": -28.518604278564453, "global_step": 644542, "epoch": 7765} {"train_loss": -28.256793975830078, "global_step": 644543, "epoch": 7765} {"train_loss": -28.1132869720459, "global_step": 644544, "epoch": 7765} {"train_loss": -28.433008193969727, "global_step": 644545, "epoch": 7765} {"train_loss": -28.378021240234375, "global_step": 644546, "epoch": 7765} {"train_loss": -28.2879638671875, "global_step": 644547, "epoch": 7765} {"train_loss": -28.529926300048828, "global_step": 644548, "epoch": 7765} {"train_loss": -28.46291160583496, "global_step": 644549, "epoch": 7765} {"train_loss": -28.431964874267578, "global_step": 644550, "epoch": 7765} {"train_loss": -28.988996505737305, "global_step": 644551, "epoch": 7765} {"train_loss": -28.90838623046875, "global_step": 644552, "epoch": 7765} {"train_loss": -28.414968490600586, "global_step": 644553, "epoch": 7765} {"train_loss": -28.49065589904785, "global_step": 644554, "epoch": 7765} {"train_loss": -28.666101455688477, "global_step": 644555, "epoch": 7765} {"train_loss": -28.320852279663086, "global_step": 644556, "epoch": 7765} {"train_loss": -28.6728572845459, "global_step": 644557, "epoch": 7765} {"train_loss": -28.389734268188477, "global_step": 644558, "epoch": 7765} {"train_loss": -28.185392379760742, "global_step": 644559, "epoch": 7765} {"train_loss": -28.001256942749023, "global_step": 644560, "epoch": 7765} {"train_loss": -28.359119415283203, "global_step": 644561, "epoch": 7765} {"train_loss": -28.2464656829834, "global_step": 644562, "epoch": 7765} {"train_loss": -28.45743751525879, "global_step": 644563, "epoch": 7765} {"train_loss": -28.558429718017578, "global_step": 644564, "epoch": 7765} {"train_loss": -28.430654525756836, "global_step": 644565, "epoch": 7765} {"train_loss": -28.282251358032227, "global_step": 644566, "epoch": 7765} {"train_loss": -28.603357315063477, "global_step": 644567, "epoch": 7765} {"train_loss": -28.547208786010742, "global_step": 644568, "epoch": 7765} {"train_loss": -28.63507080078125, "global_step": 644569, "epoch": 7765} {"train_loss": -28.208799362182617, "global_step": 644570, "epoch": 7765} {"train_loss": -28.08650016784668, "global_step": 644571, "epoch": 7765} {"train_loss": -28.461566925048828, "global_step": 644572, "epoch": 7765} {"train_loss": -27.956344604492188, "global_step": 644573, "epoch": 7765} {"train_loss": -27.79837989807129, "global_step": 644574, "epoch": 7765} {"train_loss": -28.6614933013916, "global_step": 644575, "epoch": 7765} {"train_loss": -28.351245880126953, "global_step": 644576, "epoch": 7765} {"train_loss": -28.22218423866364, "global_step": 644577, "epoch": 7765, "val_loss": 6611430.5} {"train_loss": -26.5952205657959, "global_step": 644578, "epoch": 7766} {"train_loss": -27.06231117248535, "global_step": 644579, "epoch": 7766} {"train_loss": -25.819477081298828, "global_step": 644580, "epoch": 7766} {"train_loss": -26.70798110961914, "global_step": 644581, "epoch": 7766} {"train_loss": -27.225263595581055, "global_step": 644582, "epoch": 7766} {"train_loss": -27.543292999267578, "global_step": 644583, "epoch": 7766} {"train_loss": -26.72663688659668, "global_step": 644584, "epoch": 7766} {"train_loss": -27.030914306640625, "global_step": 644585, "epoch": 7766} {"train_loss": -27.468679428100586, "global_step": 644586, "epoch": 7766} {"train_loss": -27.489362716674805, "global_step": 644587, "epoch": 7766} {"train_loss": -27.290084838867188, "global_step": 644588, "epoch": 7766} {"train_loss": -27.53755760192871, "global_step": 644589, "epoch": 7766} {"train_loss": -27.74234390258789, "global_step": 644590, "epoch": 7766} {"train_loss": -27.543466567993164, "global_step": 644591, "epoch": 7766} {"train_loss": -27.950788497924805, "global_step": 644592, "epoch": 7766} {"train_loss": -27.527729034423828, "global_step": 644593, "epoch": 7766} {"train_loss": -27.549596786499023, "global_step": 644594, "epoch": 7766} {"train_loss": -27.667112350463867, "global_step": 644595, "epoch": 7766} {"train_loss": -27.298858642578125, "global_step": 644596, "epoch": 7766} {"train_loss": -27.764984130859375, "global_step": 644597, "epoch": 7766} {"train_loss": -27.674833297729492, "global_step": 644598, "epoch": 7766} {"train_loss": -27.67085075378418, "global_step": 644599, "epoch": 7766} {"train_loss": -27.68531608581543, "global_step": 644600, "epoch": 7766} {"train_loss": -28.006322860717773, "global_step": 644601, "epoch": 7766} {"train_loss": -27.726770401000977, "global_step": 644602, "epoch": 7766} {"train_loss": -27.594263076782227, "global_step": 644603, "epoch": 7766} {"train_loss": -27.654935836791992, "global_step": 644604, "epoch": 7766} {"train_loss": -27.92706871032715, "global_step": 644605, "epoch": 7766} {"train_loss": -27.930221557617188, "global_step": 644606, "epoch": 7766} {"train_loss": -27.890478134155273, "global_step": 644607, "epoch": 7766} {"train_loss": -28.18562126159668, "global_step": 644608, "epoch": 7766} {"train_loss": -28.136524200439453, "global_step": 644609, "epoch": 7766} {"train_loss": -27.954303741455078, "global_step": 644610, "epoch": 7766} {"train_loss": -27.856740951538086, "global_step": 644611, "epoch": 7766} {"train_loss": -28.096601486206055, "global_step": 644612, "epoch": 7766} {"train_loss": -28.101675033569336, "global_step": 644613, "epoch": 7766} {"train_loss": -27.967710494995117, "global_step": 644614, "epoch": 7766} {"train_loss": -28.098297119140625, "global_step": 644615, "epoch": 7766} {"train_loss": -28.132410049438477, "global_step": 644616, "epoch": 7766} {"train_loss": -28.193439483642578, "global_step": 644617, "epoch": 7766} {"train_loss": -27.997236251831055, "global_step": 644618, "epoch": 7766} {"train_loss": -27.740863800048828, "global_step": 644619, "epoch": 7766} {"train_loss": -28.227996826171875, "global_step": 644620, "epoch": 7766} {"train_loss": -28.051074981689453, "global_step": 644621, "epoch": 7766} {"train_loss": -27.962879180908203, "global_step": 644622, "epoch": 7766} {"train_loss": -27.944812774658203, "global_step": 644623, "epoch": 7766} {"train_loss": -28.212665557861328, "global_step": 644624, "epoch": 7766} {"train_loss": -28.707305908203125, "global_step": 644625, "epoch": 7766} {"train_loss": -28.075637817382812, "global_step": 644626, "epoch": 7766} {"train_loss": -28.52797508239746, "global_step": 644627, "epoch": 7766} {"train_loss": -28.370574951171875, "global_step": 644628, "epoch": 7766} {"train_loss": -28.736127853393555, "global_step": 644629, "epoch": 7766} {"train_loss": -28.415210723876953, "global_step": 644630, "epoch": 7766} {"train_loss": -28.65626335144043, "global_step": 644631, "epoch": 7766} {"train_loss": -28.365436553955078, "global_step": 644632, "epoch": 7766} {"train_loss": -28.33335304260254, "global_step": 644633, "epoch": 7766} {"train_loss": -28.503347396850586, "global_step": 644634, "epoch": 7766} {"train_loss": -28.519758224487305, "global_step": 644635, "epoch": 7766} {"train_loss": -28.43798828125, "global_step": 644636, "epoch": 7766} {"train_loss": -28.317792892456055, "global_step": 644637, "epoch": 7766} {"train_loss": -28.522085189819336, "global_step": 644638, "epoch": 7766} {"train_loss": -28.438962936401367, "global_step": 644639, "epoch": 7766} {"train_loss": -28.53373146057129, "global_step": 644640, "epoch": 7766} {"train_loss": -28.435571670532227, "global_step": 644641, "epoch": 7766} {"train_loss": -28.50360107421875, "global_step": 644642, "epoch": 7766} {"train_loss": -28.388208389282227, "global_step": 644643, "epoch": 7766} {"train_loss": -28.4647216796875, "global_step": 644644, "epoch": 7766} {"train_loss": -28.36905860900879, "global_step": 644645, "epoch": 7766} {"train_loss": -28.677555084228516, "global_step": 644646, "epoch": 7766} {"train_loss": -28.31943702697754, "global_step": 644647, "epoch": 7766} {"train_loss": -28.690114974975586, "global_step": 644648, "epoch": 7766} {"train_loss": -28.60308837890625, "global_step": 644649, "epoch": 7766} {"train_loss": -28.420886993408203, "global_step": 644650, "epoch": 7766} {"train_loss": -28.196439743041992, "global_step": 644651, "epoch": 7766} {"train_loss": -28.4400691986084, "global_step": 644652, "epoch": 7766} {"train_loss": -28.171096801757812, "global_step": 644653, "epoch": 7766} {"train_loss": -28.547592163085938, "global_step": 644654, "epoch": 7766} {"train_loss": -28.43842124938965, "global_step": 644655, "epoch": 7766} {"train_loss": -28.20364761352539, "global_step": 644656, "epoch": 7766} {"train_loss": -28.16609001159668, "global_step": 644657, "epoch": 7766} {"train_loss": -28.14006996154785, "global_step": 644658, "epoch": 7766} {"train_loss": -28.527435302734375, "global_step": 644659, "epoch": 7766} {"train_loss": -28.005318745073065, "global_step": 644660, "epoch": 7766, "val_loss": 6642333.0} {"train_loss": -26.546894073486328, "global_step": 644661, "epoch": 7767} {"train_loss": -24.713918685913086, "global_step": 644662, "epoch": 7767} {"train_loss": -24.635969161987305, "global_step": 644663, "epoch": 7767} {"train_loss": -26.61971092224121, "global_step": 644664, "epoch": 7767} {"train_loss": -26.185937881469727, "global_step": 644665, "epoch": 7767} {"train_loss": -26.879791259765625, "global_step": 644666, "epoch": 7767} {"train_loss": -26.178741455078125, "global_step": 644667, "epoch": 7767} {"train_loss": -27.396514892578125, "global_step": 644668, "epoch": 7767} {"train_loss": -26.82862663269043, "global_step": 644669, "epoch": 7767} {"train_loss": -27.49561882019043, "global_step": 644670, "epoch": 7767} {"train_loss": -27.042163848876953, "global_step": 644671, "epoch": 7767} {"train_loss": -26.788944244384766, "global_step": 644672, "epoch": 7767} {"train_loss": -27.720190048217773, "global_step": 644673, "epoch": 7767} {"train_loss": -27.263259887695312, "global_step": 644674, "epoch": 7767} {"train_loss": -27.4478702545166, "global_step": 644675, "epoch": 7767} {"train_loss": -27.69293785095215, "global_step": 644676, "epoch": 7767} {"train_loss": -27.745336532592773, "global_step": 644677, "epoch": 7767} {"train_loss": -26.889928817749023, "global_step": 644678, "epoch": 7767} {"train_loss": -27.987903594970703, "global_step": 644679, "epoch": 7767} {"train_loss": -27.614151000976562, "global_step": 644680, "epoch": 7767} {"train_loss": -27.64656639099121, "global_step": 644681, "epoch": 7767} {"train_loss": -27.262121200561523, "global_step": 644682, "epoch": 7767} {"train_loss": -27.547245025634766, "global_step": 644683, "epoch": 7767} {"train_loss": -27.675378799438477, "global_step": 644684, "epoch": 7767} {"train_loss": -27.683820724487305, "global_step": 644685, "epoch": 7767} {"train_loss": -27.264270782470703, "global_step": 644686, "epoch": 7767} {"train_loss": -27.58732032775879, "global_step": 644687, "epoch": 7767} {"train_loss": -27.632184982299805, "global_step": 644688, "epoch": 7767} {"train_loss": -27.78684425354004, "global_step": 644689, "epoch": 7767} {"train_loss": -27.420013427734375, "global_step": 644690, "epoch": 7767} {"train_loss": -27.746814727783203, "global_step": 644691, "epoch": 7767} {"train_loss": -28.11707878112793, "global_step": 644692, "epoch": 7767} {"train_loss": -27.744001388549805, "global_step": 644693, "epoch": 7767} {"train_loss": -27.847131729125977, "global_step": 644694, "epoch": 7767} {"train_loss": -27.99139404296875, "global_step": 644695, "epoch": 7767} {"train_loss": -27.82826042175293, "global_step": 644696, "epoch": 7767} {"train_loss": -27.89531898498535, "global_step": 644697, "epoch": 7767} {"train_loss": -27.846410751342773, "global_step": 644698, "epoch": 7767} {"train_loss": -28.153711318969727, "global_step": 644699, "epoch": 7767} {"train_loss": -27.88132095336914, "global_step": 644700, "epoch": 7767} {"train_loss": -28.018091201782227, "global_step": 644701, "epoch": 7767} {"train_loss": -28.198694229125977, "global_step": 644702, "epoch": 7767} {"train_loss": -28.265552520751953, "global_step": 644703, "epoch": 7767} {"train_loss": -28.394989013671875, "global_step": 644704, "epoch": 7767} {"train_loss": -28.143173217773438, "global_step": 644705, "epoch": 7767} {"train_loss": -28.022497177124023, "global_step": 644706, "epoch": 7767} {"train_loss": -27.794275283813477, "global_step": 644707, "epoch": 7767} {"train_loss": -28.3095760345459, "global_step": 644708, "epoch": 7767} {"train_loss": -28.197254180908203, "global_step": 644709, "epoch": 7767} {"train_loss": -28.035369873046875, "global_step": 644710, "epoch": 7767} {"train_loss": -28.461572647094727, "global_step": 644711, "epoch": 7767} {"train_loss": -28.18086051940918, "global_step": 644712, "epoch": 7767} {"train_loss": -28.507171630859375, "global_step": 644713, "epoch": 7767} {"train_loss": -28.290632247924805, "global_step": 644714, "epoch": 7767} {"train_loss": -28.554519653320312, "global_step": 644715, "epoch": 7767} {"train_loss": -28.098657608032227, "global_step": 644716, "epoch": 7767} {"train_loss": -28.144392013549805, "global_step": 644717, "epoch": 7767} {"train_loss": -28.20747184753418, "global_step": 644718, "epoch": 7767} {"train_loss": -28.560810089111328, "global_step": 644719, "epoch": 7767} {"train_loss": -28.37037467956543, "global_step": 644720, "epoch": 7767} {"train_loss": -28.302703857421875, "global_step": 644721, "epoch": 7767} {"train_loss": -28.3768253326416, "global_step": 644722, "epoch": 7767} {"train_loss": -28.228158950805664, "global_step": 644723, "epoch": 7767} {"train_loss": -28.492521286010742, "global_step": 644724, "epoch": 7767} {"train_loss": -28.38751220703125, "global_step": 644725, "epoch": 7767} {"train_loss": -27.950519561767578, "global_step": 644726, "epoch": 7767} {"train_loss": -28.685327529907227, "global_step": 644727, "epoch": 7767} {"train_loss": -28.45086097717285, "global_step": 644728, "epoch": 7767} {"train_loss": -28.37070655822754, "global_step": 644729, "epoch": 7767} {"train_loss": -28.558612823486328, "global_step": 644730, "epoch": 7767} {"train_loss": -28.15093994140625, "global_step": 644731, "epoch": 7767} {"train_loss": -28.396778106689453, "global_step": 644732, "epoch": 7767} {"train_loss": -28.170255661010742, "global_step": 644733, "epoch": 7767} {"train_loss": -28.117334365844727, "global_step": 644734, "epoch": 7767} {"train_loss": -28.224262237548828, "global_step": 644735, "epoch": 7767} {"train_loss": -28.49762535095215, "global_step": 644736, "epoch": 7767} {"train_loss": -28.4482479095459, "global_step": 644737, "epoch": 7767} {"train_loss": -28.24951171875, "global_step": 644738, "epoch": 7767} {"train_loss": -28.265567779541016, "global_step": 644739, "epoch": 7767} {"train_loss": -28.39930534362793, "global_step": 644740, "epoch": 7767} {"train_loss": -27.850509643554688, "global_step": 644741, "epoch": 7767} {"train_loss": -28.061304092407227, "global_step": 644742, "epoch": 7767} {"train_loss": -27.79889791557588, "global_step": 644743, "epoch": 7767, "val_loss": 6724684.0} {"train_loss": -27.8918514251709, "global_step": 644744, "epoch": 7768} {"train_loss": -27.802343368530273, "global_step": 644745, "epoch": 7768} {"train_loss": -27.413808822631836, "global_step": 644746, "epoch": 7768} {"train_loss": -27.488088607788086, "global_step": 644747, "epoch": 7768} {"train_loss": -27.4390811920166, "global_step": 644748, "epoch": 7768} {"train_loss": -27.07850456237793, "global_step": 644749, "epoch": 7768} {"train_loss": -28.023929595947266, "global_step": 644750, "epoch": 7768} {"train_loss": -27.47894287109375, "global_step": 644751, "epoch": 7768} {"train_loss": -28.097488403320312, "global_step": 644752, "epoch": 7768} {"train_loss": -27.746625900268555, "global_step": 644753, "epoch": 7768} {"train_loss": -27.61279296875, "global_step": 644754, "epoch": 7768} {"train_loss": -27.815658569335938, "global_step": 644755, "epoch": 7768} {"train_loss": -27.87447166442871, "global_step": 644756, "epoch": 7768} {"train_loss": -28.2080020904541, "global_step": 644757, "epoch": 7768} {"train_loss": -28.00750160217285, "global_step": 644758, "epoch": 7768} {"train_loss": -28.146167755126953, "global_step": 644759, "epoch": 7768} {"train_loss": -28.228057861328125, "global_step": 644760, "epoch": 7768} {"train_loss": -28.09413719177246, "global_step": 644761, "epoch": 7768} {"train_loss": -28.099990844726562, "global_step": 644762, "epoch": 7768} {"train_loss": -28.304956436157227, "global_step": 644763, "epoch": 7768} {"train_loss": -28.515228271484375, "global_step": 644764, "epoch": 7768} {"train_loss": -28.407651901245117, "global_step": 644765, "epoch": 7768} {"train_loss": -28.125288009643555, "global_step": 644766, "epoch": 7768} {"train_loss": -28.010183334350586, "global_step": 644767, "epoch": 7768} {"train_loss": -28.36220359802246, "global_step": 644768, "epoch": 7768} {"train_loss": -27.918598175048828, "global_step": 644769, "epoch": 7768} {"train_loss": -28.387893676757812, "global_step": 644770, "epoch": 7768} {"train_loss": -28.041040420532227, "global_step": 644771, "epoch": 7768} {"train_loss": -28.5985050201416, "global_step": 644772, "epoch": 7768} {"train_loss": -28.509931564331055, "global_step": 644773, "epoch": 7768} {"train_loss": -28.58383560180664, "global_step": 644774, "epoch": 7768} {"train_loss": -28.365217208862305, "global_step": 644775, "epoch": 7768} {"train_loss": -28.364154815673828, "global_step": 644776, "epoch": 7768} {"train_loss": -28.54571533203125, "global_step": 644777, "epoch": 7768} {"train_loss": -28.29266929626465, "global_step": 644778, "epoch": 7768} {"train_loss": -28.197601318359375, "global_step": 644779, "epoch": 7768} {"train_loss": -28.389917373657227, "global_step": 644780, "epoch": 7768} {"train_loss": -28.624929428100586, "global_step": 644781, "epoch": 7768} {"train_loss": -28.562448501586914, "global_step": 644782, "epoch": 7768} {"train_loss": -28.324634552001953, "global_step": 644783, "epoch": 7768} {"train_loss": -28.4375057220459, "global_step": 644784, "epoch": 7768} {"train_loss": -28.094396591186523, "global_step": 644785, "epoch": 7768} {"train_loss": -28.12322425842285, "global_step": 644786, "epoch": 7768} {"train_loss": -28.15589714050293, "global_step": 644787, "epoch": 7768} {"train_loss": -28.513092041015625, "global_step": 644788, "epoch": 7768} {"train_loss": -28.69854164123535, "global_step": 644789, "epoch": 7768} {"train_loss": -28.459386825561523, "global_step": 644790, "epoch": 7768} {"train_loss": -28.50439453125, "global_step": 644791, "epoch": 7768} {"train_loss": -28.402191162109375, "global_step": 644792, "epoch": 7768} {"train_loss": -28.71435546875, "global_step": 644793, "epoch": 7768} {"train_loss": -28.4103946685791, "global_step": 644794, "epoch": 7768} {"train_loss": -28.55415153503418, "global_step": 644795, "epoch": 7768} {"train_loss": -28.324914932250977, "global_step": 644796, "epoch": 7768} {"train_loss": -28.418182373046875, "global_step": 644797, "epoch": 7768} {"train_loss": -28.36979103088379, "global_step": 644798, "epoch": 7768} {"train_loss": -28.477880477905273, "global_step": 644799, "epoch": 7768} {"train_loss": -28.475112915039062, "global_step": 644800, "epoch": 7768} {"train_loss": -28.604373931884766, "global_step": 644801, "epoch": 7768} {"train_loss": -28.69367790222168, "global_step": 644802, "epoch": 7768} {"train_loss": -28.4424991607666, "global_step": 644803, "epoch": 7768} {"train_loss": -28.618152618408203, "global_step": 644804, "epoch": 7768} {"train_loss": -28.569677352905273, "global_step": 644805, "epoch": 7768} {"train_loss": -28.32525062561035, "global_step": 644806, "epoch": 7768} {"train_loss": -27.923669815063477, "global_step": 644807, "epoch": 7768} {"train_loss": -27.602691650390625, "global_step": 644808, "epoch": 7768} {"train_loss": -26.512067794799805, "global_step": 644809, "epoch": 7768} {"train_loss": -27.471817016601562, "global_step": 644810, "epoch": 7768} {"train_loss": -27.809539794921875, "global_step": 644811, "epoch": 7768} {"train_loss": -26.728961944580078, "global_step": 644812, "epoch": 7768} {"train_loss": -26.80042839050293, "global_step": 644813, "epoch": 7768} {"train_loss": -27.865161895751953, "global_step": 644814, "epoch": 7768} {"train_loss": -28.15374755859375, "global_step": 644815, "epoch": 7768} {"train_loss": -27.796545028686523, "global_step": 644816, "epoch": 7768} {"train_loss": -28.16829490661621, "global_step": 644817, "epoch": 7768} {"train_loss": -27.906789779663086, "global_step": 644818, "epoch": 7768} {"train_loss": -28.469562530517578, "global_step": 644819, "epoch": 7768} {"train_loss": -27.547143936157227, "global_step": 644820, "epoch": 7768} {"train_loss": -28.05615234375, "global_step": 644821, "epoch": 7768} {"train_loss": -27.931167602539062, "global_step": 644822, "epoch": 7768} {"train_loss": -27.712446212768555, "global_step": 644823, "epoch": 7768} {"train_loss": -28.116851806640625, "global_step": 644824, "epoch": 7768} {"train_loss": -27.890125274658203, "global_step": 644825, "epoch": 7768} {"train_loss": -28.104593345917852, "global_step": 644826, "epoch": 7768, "val_loss": 6742660.5} {"train_loss": -27.85223960876465, "global_step": 644827, "epoch": 7769} {"train_loss": -27.642425537109375, "global_step": 644828, "epoch": 7769} {"train_loss": -27.597461700439453, "global_step": 644829, "epoch": 7769} {"train_loss": -27.29975700378418, "global_step": 644830, "epoch": 7769} {"train_loss": -27.408613204956055, "global_step": 644831, "epoch": 7769} {"train_loss": -27.7921199798584, "global_step": 644832, "epoch": 7769} {"train_loss": -27.8570556640625, "global_step": 644833, "epoch": 7769} {"train_loss": -27.117435455322266, "global_step": 644834, "epoch": 7769} {"train_loss": -27.971954345703125, "global_step": 644835, "epoch": 7769} {"train_loss": -27.621795654296875, "global_step": 644836, "epoch": 7769} {"train_loss": -27.610153198242188, "global_step": 644837, "epoch": 7769} {"train_loss": -27.983993530273438, "global_step": 644838, "epoch": 7769} {"train_loss": -27.790433883666992, "global_step": 644839, "epoch": 7769} {"train_loss": -28.15395164489746, "global_step": 644840, "epoch": 7769} {"train_loss": -27.755834579467773, "global_step": 644841, "epoch": 7769} {"train_loss": -27.854047775268555, "global_step": 644842, "epoch": 7769} {"train_loss": -27.6735782623291, "global_step": 644843, "epoch": 7769} {"train_loss": -28.17042350769043, "global_step": 644844, "epoch": 7769} {"train_loss": -27.976776123046875, "global_step": 644845, "epoch": 7769} {"train_loss": -27.8856143951416, "global_step": 644846, "epoch": 7769} {"train_loss": -28.075403213500977, "global_step": 644847, "epoch": 7769} {"train_loss": -28.406118392944336, "global_step": 644848, "epoch": 7769} {"train_loss": -28.272216796875, "global_step": 644849, "epoch": 7769} {"train_loss": -28.240461349487305, "global_step": 644850, "epoch": 7769} {"train_loss": -28.03560447692871, "global_step": 644851, "epoch": 7769} {"train_loss": -28.27998924255371, "global_step": 644852, "epoch": 7769} {"train_loss": -28.35308837890625, "global_step": 644853, "epoch": 7769} {"train_loss": -28.13258171081543, "global_step": 644854, "epoch": 7769} {"train_loss": -28.505218505859375, "global_step": 644855, "epoch": 7769} {"train_loss": -28.69514274597168, "global_step": 644856, "epoch": 7769} {"train_loss": -28.576101303100586, "global_step": 644857, "epoch": 7769} {"train_loss": -28.417633056640625, "global_step": 644858, "epoch": 7769} {"train_loss": -28.679718017578125, "global_step": 644859, "epoch": 7769} {"train_loss": -28.22216796875, "global_step": 644860, "epoch": 7769} {"train_loss": -28.374418258666992, "global_step": 644861, "epoch": 7769} {"train_loss": -28.370100021362305, "global_step": 644862, "epoch": 7769} {"train_loss": -28.42438316345215, "global_step": 644863, "epoch": 7769} {"train_loss": -28.630023956298828, "global_step": 644864, "epoch": 7769} {"train_loss": -28.577863693237305, "global_step": 644865, "epoch": 7769} {"train_loss": -28.159799575805664, "global_step": 644866, "epoch": 7769} {"train_loss": -28.53641700744629, "global_step": 644867, "epoch": 7769} {"train_loss": -28.260618209838867, "global_step": 644868, "epoch": 7769} {"train_loss": -28.20121192932129, "global_step": 644869, "epoch": 7769} {"train_loss": -28.327905654907227, "global_step": 644870, "epoch": 7769} {"train_loss": -28.509252548217773, "global_step": 644871, "epoch": 7769} {"train_loss": -28.30182456970215, "global_step": 644872, "epoch": 7769} {"train_loss": -28.473718643188477, "global_step": 644873, "epoch": 7769} {"train_loss": -28.82427406311035, "global_step": 644874, "epoch": 7769} {"train_loss": -28.48358726501465, "global_step": 644875, "epoch": 7769} {"train_loss": -28.50946044921875, "global_step": 644876, "epoch": 7769} {"train_loss": -28.374128341674805, "global_step": 644877, "epoch": 7769} {"train_loss": -28.373746871948242, "global_step": 644878, "epoch": 7769} {"train_loss": -28.480899810791016, "global_step": 644879, "epoch": 7769} {"train_loss": -28.132831573486328, "global_step": 644880, "epoch": 7769} {"train_loss": -27.666614532470703, "global_step": 644881, "epoch": 7769} {"train_loss": -26.720458984375, "global_step": 644882, "epoch": 7769} {"train_loss": -26.384672164916992, "global_step": 644883, "epoch": 7769} {"train_loss": -26.715469360351562, "global_step": 644884, "epoch": 7769} {"train_loss": -28.029333114624023, "global_step": 644885, "epoch": 7769} {"train_loss": -27.639646530151367, "global_step": 644886, "epoch": 7769} {"train_loss": -28.0948543548584, "global_step": 644887, "epoch": 7769} {"train_loss": -27.762466430664062, "global_step": 644888, "epoch": 7769} {"train_loss": -27.75663185119629, "global_step": 644889, "epoch": 7769} {"train_loss": -28.39528465270996, "global_step": 644890, "epoch": 7769} {"train_loss": -27.91189956665039, "global_step": 644891, "epoch": 7769} {"train_loss": -27.9956111907959, "global_step": 644892, "epoch": 7769} {"train_loss": -28.273359298706055, "global_step": 644893, "epoch": 7769} {"train_loss": -28.370975494384766, "global_step": 644894, "epoch": 7769} {"train_loss": -28.25115394592285, "global_step": 644895, "epoch": 7769} {"train_loss": -28.33866310119629, "global_step": 644896, "epoch": 7769} {"train_loss": -27.990808486938477, "global_step": 644897, "epoch": 7769} {"train_loss": -27.700977325439453, "global_step": 644898, "epoch": 7769} {"train_loss": -28.515844345092773, "global_step": 644899, "epoch": 7769} {"train_loss": -27.81556510925293, "global_step": 644900, "epoch": 7769} {"train_loss": -28.1357479095459, "global_step": 644901, "epoch": 7769} {"train_loss": -28.3625431060791, "global_step": 644902, "epoch": 7769} {"train_loss": -27.834692001342773, "global_step": 644903, "epoch": 7769} {"train_loss": -28.269617080688477, "global_step": 644904, "epoch": 7769} {"train_loss": -28.34881019592285, "global_step": 644905, "epoch": 7769} {"train_loss": -27.97604751586914, "global_step": 644906, "epoch": 7769} {"train_loss": -28.489044189453125, "global_step": 644907, "epoch": 7769} {"train_loss": -28.32417106628418, "global_step": 644908, "epoch": 7769} {"train_loss": -28.07737807767937, "global_step": 644909, "epoch": 7769, "val_loss": 6751172.0} {"train_loss": -27.97745132446289, "global_step": 644910, "epoch": 7770} {"train_loss": -27.599897384643555, "global_step": 644911, "epoch": 7770} {"train_loss": -27.723432540893555, "global_step": 644912, "epoch": 7770} {"train_loss": -27.992944717407227, "global_step": 644913, "epoch": 7770} {"train_loss": -27.701513290405273, "global_step": 644914, "epoch": 7770} {"train_loss": -27.910552978515625, "global_step": 644915, "epoch": 7770} {"train_loss": -27.65687370300293, "global_step": 644916, "epoch": 7770} {"train_loss": -27.179981231689453, "global_step": 644917, "epoch": 7770} {"train_loss": -28.081745147705078, "global_step": 644918, "epoch": 7770} {"train_loss": -27.801776885986328, "global_step": 644919, "epoch": 7770} {"train_loss": -27.676733016967773, "global_step": 644920, "epoch": 7770} {"train_loss": -28.077966690063477, "global_step": 644921, "epoch": 7770} {"train_loss": -28.066314697265625, "global_step": 644922, "epoch": 7770} {"train_loss": -27.928709030151367, "global_step": 644923, "epoch": 7770} {"train_loss": -27.760705947875977, "global_step": 644924, "epoch": 7770} {"train_loss": -28.131534576416016, "global_step": 644925, "epoch": 7770} {"train_loss": -28.099889755249023, "global_step": 644926, "epoch": 7770} {"train_loss": -28.49491310119629, "global_step": 644927, "epoch": 7770} {"train_loss": -28.172428131103516, "global_step": 644928, "epoch": 7770} {"train_loss": -27.990461349487305, "global_step": 644929, "epoch": 7770} {"train_loss": -27.70966911315918, "global_step": 644930, "epoch": 7770} {"train_loss": -28.387939453125, "global_step": 644931, "epoch": 7770} {"train_loss": -28.064380645751953, "global_step": 644932, "epoch": 7770} {"train_loss": -28.390869140625, "global_step": 644933, "epoch": 7770} {"train_loss": -28.25885009765625, "global_step": 644934, "epoch": 7770} {"train_loss": -28.12003517150879, "global_step": 644935, "epoch": 7770} {"train_loss": -28.151269912719727, "global_step": 644936, "epoch": 7770} {"train_loss": -28.270795822143555, "global_step": 644937, "epoch": 7770} {"train_loss": -28.208520889282227, "global_step": 644938, "epoch": 7770} {"train_loss": -28.3648681640625, "global_step": 644939, "epoch": 7770} {"train_loss": -28.6080322265625, "global_step": 644940, "epoch": 7770} {"train_loss": -27.656524658203125, "global_step": 644941, "epoch": 7770} {"train_loss": -28.247419357299805, "global_step": 644942, "epoch": 7770} {"train_loss": -28.171716690063477, "global_step": 644943, "epoch": 7770} {"train_loss": -28.459625244140625, "global_step": 644944, "epoch": 7770} {"train_loss": -28.198963165283203, "global_step": 644945, "epoch": 7770} {"train_loss": -28.339675903320312, "global_step": 644946, "epoch": 7770} {"train_loss": -28.5074520111084, "global_step": 644947, "epoch": 7770} {"train_loss": -28.22064208984375, "global_step": 644948, "epoch": 7770} {"train_loss": -28.2314395904541, "global_step": 644949, "epoch": 7770} {"train_loss": -28.424575805664062, "global_step": 644950, "epoch": 7770} {"train_loss": -28.330549240112305, "global_step": 644951, "epoch": 7770} {"train_loss": -28.0856990814209, "global_step": 644952, "epoch": 7770} {"train_loss": -28.242450714111328, "global_step": 644953, "epoch": 7770} {"train_loss": -28.5167293548584, "global_step": 644954, "epoch": 7770} {"train_loss": -28.050207138061523, "global_step": 644955, "epoch": 7770} {"train_loss": -27.853015899658203, "global_step": 644956, "epoch": 7770} {"train_loss": -28.29791831970215, "global_step": 644957, "epoch": 7770} {"train_loss": -28.22797203063965, "global_step": 644958, "epoch": 7770} {"train_loss": -28.126449584960938, "global_step": 644959, "epoch": 7770} {"train_loss": -27.849267959594727, "global_step": 644960, "epoch": 7770} {"train_loss": -28.0937557220459, "global_step": 644961, "epoch": 7770} {"train_loss": -28.0782470703125, "global_step": 644962, "epoch": 7770} {"train_loss": -28.20444107055664, "global_step": 644963, "epoch": 7770} {"train_loss": -28.07425308227539, "global_step": 644964, "epoch": 7770} {"train_loss": -28.27313232421875, "global_step": 644965, "epoch": 7770} {"train_loss": -28.106353759765625, "global_step": 644966, "epoch": 7770} {"train_loss": -28.334793090820312, "global_step": 644967, "epoch": 7770} {"train_loss": -28.00748634338379, "global_step": 644968, "epoch": 7770} {"train_loss": -28.666311264038086, "global_step": 644969, "epoch": 7770} {"train_loss": -28.233570098876953, "global_step": 644970, "epoch": 7770} {"train_loss": -28.395374298095703, "global_step": 644971, "epoch": 7770} {"train_loss": -27.93936538696289, "global_step": 644972, "epoch": 7770} {"train_loss": -28.46124839782715, "global_step": 644973, "epoch": 7770} {"train_loss": -28.380512237548828, "global_step": 644974, "epoch": 7770} {"train_loss": -28.104602813720703, "global_step": 644975, "epoch": 7770} {"train_loss": -28.5042667388916, "global_step": 644976, "epoch": 7770} {"train_loss": -28.704694747924805, "global_step": 644977, "epoch": 7770} {"train_loss": -28.35127067565918, "global_step": 644978, "epoch": 7770} {"train_loss": -28.455795288085938, "global_step": 644979, "epoch": 7770} {"train_loss": -28.638446807861328, "global_step": 644980, "epoch": 7770} {"train_loss": -28.473108291625977, "global_step": 644981, "epoch": 7770} {"train_loss": -28.274518966674805, "global_step": 644982, "epoch": 7770} {"train_loss": -28.64569091796875, "global_step": 644983, "epoch": 7770} {"train_loss": -28.62688636779785, "global_step": 644984, "epoch": 7770} {"train_loss": -27.894622802734375, "global_step": 644985, "epoch": 7770} {"train_loss": -28.07990837097168, "global_step": 644986, "epoch": 7770} {"train_loss": -28.550809860229492, "global_step": 644987, "epoch": 7770} {"train_loss": -28.36749839782715, "global_step": 644988, "epoch": 7770} {"train_loss": -28.39887809753418, "global_step": 644989, "epoch": 7770} {"train_loss": -28.388418197631836, "global_step": 644990, "epoch": 7770} {"train_loss": -28.568883895874023, "global_step": 644991, "epoch": 7770} {"train_loss": -28.17658502509795, "global_step": 644992, "epoch": 7770, "val_loss": 6773419.0} {"train_loss": -28.084075927734375, "global_step": 644993, "epoch": 7771} {"train_loss": -27.496368408203125, "global_step": 644994, "epoch": 7771} {"train_loss": -27.905872344970703, "global_step": 644995, "epoch": 7771} {"train_loss": -28.255786895751953, "global_step": 644996, "epoch": 7771} {"train_loss": -28.155019760131836, "global_step": 644997, "epoch": 7771} {"train_loss": -28.218017578125, "global_step": 644998, "epoch": 7771} {"train_loss": -27.757688522338867, "global_step": 644999, "epoch": 7771} {"train_loss": -28.081512451171875, "global_step": 645000, "epoch": 7771} {"train_loss": -28.07343101501465, "global_step": 645001, "epoch": 7771} {"train_loss": -27.6919002532959, "global_step": 645002, "epoch": 7771} {"train_loss": -27.963232040405273, "global_step": 645003, "epoch": 7771} {"train_loss": -28.27332878112793, "global_step": 645004, "epoch": 7771} {"train_loss": -28.05842399597168, "global_step": 645005, "epoch": 7771} {"train_loss": -27.8102970123291, "global_step": 645006, "epoch": 7771} {"train_loss": -27.8586483001709, "global_step": 645007, "epoch": 7771} {"train_loss": -27.748844146728516, "global_step": 645008, "epoch": 7771} {"train_loss": -28.15928077697754, "global_step": 645009, "epoch": 7771} {"train_loss": -28.344003677368164, "global_step": 645010, "epoch": 7771} {"train_loss": -27.8513126373291, "global_step": 645011, "epoch": 7771} {"train_loss": -27.886465072631836, "global_step": 645012, "epoch": 7771} {"train_loss": -28.306232452392578, "global_step": 645013, "epoch": 7771} {"train_loss": -28.17396354675293, "global_step": 645014, "epoch": 7771} {"train_loss": -28.29041862487793, "global_step": 645015, "epoch": 7771} {"train_loss": -28.213415145874023, "global_step": 645016, "epoch": 7771} {"train_loss": -28.143903732299805, "global_step": 645017, "epoch": 7771} {"train_loss": -27.834735870361328, "global_step": 645018, "epoch": 7771} {"train_loss": -28.09993553161621, "global_step": 645019, "epoch": 7771} {"train_loss": -28.184309005737305, "global_step": 645020, "epoch": 7771} {"train_loss": -28.343799591064453, "global_step": 645021, "epoch": 7771} {"train_loss": -28.188989639282227, "global_step": 645022, "epoch": 7771} {"train_loss": -28.318164825439453, "global_step": 645023, "epoch": 7771} {"train_loss": -27.97889518737793, "global_step": 645024, "epoch": 7771} {"train_loss": -28.159448623657227, "global_step": 645025, "epoch": 7771} {"train_loss": -28.148929595947266, "global_step": 645026, "epoch": 7771} {"train_loss": -28.130929946899414, "global_step": 645027, "epoch": 7771} {"train_loss": -28.345630645751953, "global_step": 645028, "epoch": 7771} {"train_loss": -28.160688400268555, "global_step": 645029, "epoch": 7771} {"train_loss": -28.412109375, "global_step": 645030, "epoch": 7771} {"train_loss": -28.128767013549805, "global_step": 645031, "epoch": 7771} {"train_loss": -28.1363468170166, "global_step": 645032, "epoch": 7771} {"train_loss": -28.329345703125, "global_step": 645033, "epoch": 7771} {"train_loss": -28.401996612548828, "global_step": 645034, "epoch": 7771} {"train_loss": -28.337453842163086, "global_step": 645035, "epoch": 7771} {"train_loss": -28.595630645751953, "global_step": 645036, "epoch": 7771} {"train_loss": -28.03313636779785, "global_step": 645037, "epoch": 7771} {"train_loss": -28.226842880249023, "global_step": 645038, "epoch": 7771} {"train_loss": -27.89609146118164, "global_step": 645039, "epoch": 7771} {"train_loss": -27.845325469970703, "global_step": 645040, "epoch": 7771} {"train_loss": -28.589529037475586, "global_step": 645041, "epoch": 7771} {"train_loss": -28.108808517456055, "global_step": 645042, "epoch": 7771} {"train_loss": -28.15302848815918, "global_step": 645043, "epoch": 7771} {"train_loss": -28.235776901245117, "global_step": 645044, "epoch": 7771} {"train_loss": -28.324512481689453, "global_step": 645045, "epoch": 7771} {"train_loss": -28.700658798217773, "global_step": 645046, "epoch": 7771} {"train_loss": -28.207128524780273, "global_step": 645047, "epoch": 7771} {"train_loss": -28.5554256439209, "global_step": 645048, "epoch": 7771} {"train_loss": -28.33115005493164, "global_step": 645049, "epoch": 7771} {"train_loss": -28.502307891845703, "global_step": 645050, "epoch": 7771} {"train_loss": -28.318714141845703, "global_step": 645051, "epoch": 7771} {"train_loss": -28.2194766998291, "global_step": 645052, "epoch": 7771} {"train_loss": -28.160476684570312, "global_step": 645053, "epoch": 7771} {"train_loss": -28.0834903717041, "global_step": 645054, "epoch": 7771} {"train_loss": -28.56086540222168, "global_step": 645055, "epoch": 7771} {"train_loss": -28.15239906311035, "global_step": 645056, "epoch": 7771} {"train_loss": -28.484975814819336, "global_step": 645057, "epoch": 7771} {"train_loss": -28.31719398498535, "global_step": 645058, "epoch": 7771} {"train_loss": -28.351978302001953, "global_step": 645059, "epoch": 7771} {"train_loss": -28.513229370117188, "global_step": 645060, "epoch": 7771} {"train_loss": -28.4003849029541, "global_step": 645061, "epoch": 7771} {"train_loss": -28.588300704956055, "global_step": 645062, "epoch": 7771} {"train_loss": -28.697961807250977, "global_step": 645063, "epoch": 7771} {"train_loss": -28.72723960876465, "global_step": 645064, "epoch": 7771} {"train_loss": -28.093311309814453, "global_step": 645065, "epoch": 7771} {"train_loss": -28.276647567749023, "global_step": 645066, "epoch": 7771} {"train_loss": -28.39240837097168, "global_step": 645067, "epoch": 7771} {"train_loss": -28.452795028686523, "global_step": 645068, "epoch": 7771} {"train_loss": -28.952661514282227, "global_step": 645069, "epoch": 7771} {"train_loss": -28.737634658813477, "global_step": 645070, "epoch": 7771} {"train_loss": -28.140600204467773, "global_step": 645071, "epoch": 7771} {"train_loss": -28.163742065429688, "global_step": 645072, "epoch": 7771} {"train_loss": -28.484994888305664, "global_step": 645073, "epoch": 7771} {"train_loss": -28.591760635375977, "global_step": 645074, "epoch": 7771} {"train_loss": -28.216239952179322, "global_step": 645075, "epoch": 7771, "val_loss": 6676201.0} {"train_loss": -28.154321670532227, "global_step": 645076, "epoch": 7772} {"train_loss": -27.666202545166016, "global_step": 645077, "epoch": 7772} {"train_loss": -27.328359603881836, "global_step": 645078, "epoch": 7772} {"train_loss": -27.857999801635742, "global_step": 645079, "epoch": 7772} {"train_loss": -27.356306076049805, "global_step": 645080, "epoch": 7772} {"train_loss": -27.14509391784668, "global_step": 645081, "epoch": 7772} {"train_loss": -27.411344528198242, "global_step": 645082, "epoch": 7772} {"train_loss": -27.89491081237793, "global_step": 645083, "epoch": 7772} {"train_loss": -27.5767765045166, "global_step": 645084, "epoch": 7772} {"train_loss": -27.75295066833496, "global_step": 645085, "epoch": 7772} {"train_loss": -27.738128662109375, "global_step": 645086, "epoch": 7772} {"train_loss": -28.297208786010742, "global_step": 645087, "epoch": 7772} {"train_loss": -27.996292114257812, "global_step": 645088, "epoch": 7772} {"train_loss": -28.161237716674805, "global_step": 645089, "epoch": 7772} {"train_loss": -28.28156089782715, "global_step": 645090, "epoch": 7772} {"train_loss": -28.261259078979492, "global_step": 645091, "epoch": 7772} {"train_loss": -28.09022331237793, "global_step": 645092, "epoch": 7772} {"train_loss": -28.26865577697754, "global_step": 645093, "epoch": 7772} {"train_loss": -27.906082153320312, "global_step": 645094, "epoch": 7772} {"train_loss": -28.292551040649414, "global_step": 645095, "epoch": 7772} {"train_loss": -28.1984806060791, "global_step": 645096, "epoch": 7772} {"train_loss": -28.57355308532715, "global_step": 645097, "epoch": 7772} {"train_loss": -28.227895736694336, "global_step": 645098, "epoch": 7772} {"train_loss": -28.248600006103516, "global_step": 645099, "epoch": 7772} {"train_loss": -27.994775772094727, "global_step": 645100, "epoch": 7772} {"train_loss": -28.387298583984375, "global_step": 645101, "epoch": 7772} {"train_loss": -27.984952926635742, "global_step": 645102, "epoch": 7772} {"train_loss": -28.261371612548828, "global_step": 645103, "epoch": 7772} {"train_loss": -28.205076217651367, "global_step": 645104, "epoch": 7772} {"train_loss": -28.394943237304688, "global_step": 645105, "epoch": 7772} {"train_loss": -28.439453125, "global_step": 645106, "epoch": 7772} {"train_loss": -28.1319580078125, "global_step": 645107, "epoch": 7772} {"train_loss": -28.39533805847168, "global_step": 645108, "epoch": 7772} {"train_loss": -27.981603622436523, "global_step": 645109, "epoch": 7772} {"train_loss": -28.75324058532715, "global_step": 645110, "epoch": 7772} {"train_loss": -28.0589656829834, "global_step": 645111, "epoch": 7772} {"train_loss": -28.239904403686523, "global_step": 645112, "epoch": 7772} {"train_loss": -28.61419677734375, "global_step": 645113, "epoch": 7772} {"train_loss": -28.11402702331543, "global_step": 645114, "epoch": 7772} {"train_loss": -28.290266036987305, "global_step": 645115, "epoch": 7772} {"train_loss": -28.60898780822754, "global_step": 645116, "epoch": 7772} {"train_loss": -28.361225128173828, "global_step": 645117, "epoch": 7772} {"train_loss": -28.522705078125, "global_step": 645118, "epoch": 7772} {"train_loss": -28.52005386352539, "global_step": 645119, "epoch": 7772} {"train_loss": -28.42582130432129, "global_step": 645120, "epoch": 7772} {"train_loss": -28.20061683654785, "global_step": 645121, "epoch": 7772} {"train_loss": -28.68562126159668, "global_step": 645122, "epoch": 7772} {"train_loss": -28.36199378967285, "global_step": 645123, "epoch": 7772} {"train_loss": -28.656478881835938, "global_step": 645124, "epoch": 7772} {"train_loss": -28.362140655517578, "global_step": 645125, "epoch": 7772} {"train_loss": -28.631244659423828, "global_step": 645126, "epoch": 7772} {"train_loss": -28.561386108398438, "global_step": 645127, "epoch": 7772} {"train_loss": -28.657575607299805, "global_step": 645128, "epoch": 7772} {"train_loss": -28.800474166870117, "global_step": 645129, "epoch": 7772} {"train_loss": -28.701583862304688, "global_step": 645130, "epoch": 7772} {"train_loss": -28.456928253173828, "global_step": 645131, "epoch": 7772} {"train_loss": -28.39154052734375, "global_step": 645132, "epoch": 7772} {"train_loss": -28.553144454956055, "global_step": 645133, "epoch": 7772} {"train_loss": -28.245519638061523, "global_step": 645134, "epoch": 7772} {"train_loss": -27.540746688842773, "global_step": 645135, "epoch": 7772} {"train_loss": -26.82756996154785, "global_step": 645136, "epoch": 7772} {"train_loss": -26.35393714904785, "global_step": 645137, "epoch": 7772} {"train_loss": -27.44110107421875, "global_step": 645138, "epoch": 7772} {"train_loss": -28.229568481445312, "global_step": 645139, "epoch": 7772} {"train_loss": -27.9114990234375, "global_step": 645140, "epoch": 7772} {"train_loss": -26.994543075561523, "global_step": 645141, "epoch": 7772} {"train_loss": -27.65168571472168, "global_step": 645142, "epoch": 7772} {"train_loss": -27.730512619018555, "global_step": 645143, "epoch": 7772} {"train_loss": -27.587629318237305, "global_step": 645144, "epoch": 7772} {"train_loss": -28.292898178100586, "global_step": 645145, "epoch": 7772} {"train_loss": -27.524658203125, "global_step": 645146, "epoch": 7772} {"train_loss": -28.142108917236328, "global_step": 645147, "epoch": 7772} {"train_loss": -27.98975944519043, "global_step": 645148, "epoch": 7772} {"train_loss": -28.1448917388916, "global_step": 645149, "epoch": 7772} {"train_loss": -28.166839599609375, "global_step": 645150, "epoch": 7772} {"train_loss": -27.5250301361084, "global_step": 645151, "epoch": 7772} {"train_loss": -27.93865966796875, "global_step": 645152, "epoch": 7772} {"train_loss": -28.010639190673828, "global_step": 645153, "epoch": 7772} {"train_loss": -28.11451530456543, "global_step": 645154, "epoch": 7772} {"train_loss": -27.86946678161621, "global_step": 645155, "epoch": 7772} {"train_loss": -28.22828483581543, "global_step": 645156, "epoch": 7772} {"train_loss": -27.859182357788086, "global_step": 645157, "epoch": 7772} {"train_loss": -28.078669881246174, "global_step": 645158, "epoch": 7772, "val_loss": 6710967.0} {"train_loss": -27.864948272705078, "global_step": 645159, "epoch": 7773} {"train_loss": -27.959732055664062, "global_step": 645160, "epoch": 7773} {"train_loss": -28.15972328186035, "global_step": 645161, "epoch": 7773} {"train_loss": -27.8897762298584, "global_step": 645162, "epoch": 7773} {"train_loss": -27.786407470703125, "global_step": 645163, "epoch": 7773} {"train_loss": -28.181201934814453, "global_step": 645164, "epoch": 7773} {"train_loss": -28.250995635986328, "global_step": 645165, "epoch": 7773} {"train_loss": -28.322935104370117, "global_step": 645166, "epoch": 7773} {"train_loss": -28.163599014282227, "global_step": 645167, "epoch": 7773} {"train_loss": -28.367267608642578, "global_step": 645168, "epoch": 7773} {"train_loss": -28.06328773498535, "global_step": 645169, "epoch": 7773} {"train_loss": -28.058074951171875, "global_step": 645170, "epoch": 7773} {"train_loss": -28.2557373046875, "global_step": 645171, "epoch": 7773} {"train_loss": -28.385202407836914, "global_step": 645172, "epoch": 7773} {"train_loss": -28.347137451171875, "global_step": 645173, "epoch": 7773} {"train_loss": -28.214807510375977, "global_step": 645174, "epoch": 7773} {"train_loss": -28.36280632019043, "global_step": 645175, "epoch": 7773} {"train_loss": -28.378503799438477, "global_step": 645176, "epoch": 7773} {"train_loss": -28.475011825561523, "global_step": 645177, "epoch": 7773} {"train_loss": -28.054676055908203, "global_step": 645178, "epoch": 7773} {"train_loss": -28.316303253173828, "global_step": 645179, "epoch": 7773} {"train_loss": -28.74749755859375, "global_step": 645180, "epoch": 7773} {"train_loss": -28.227813720703125, "global_step": 645181, "epoch": 7773} {"train_loss": -28.111072540283203, "global_step": 645182, "epoch": 7773} {"train_loss": -28.192066192626953, "global_step": 645183, "epoch": 7773} {"train_loss": -28.5532283782959, "global_step": 645184, "epoch": 7773} {"train_loss": -28.340208053588867, "global_step": 645185, "epoch": 7773} {"train_loss": -28.508350372314453, "global_step": 645186, "epoch": 7773} {"train_loss": -27.657928466796875, "global_step": 645187, "epoch": 7773} {"train_loss": -28.348352432250977, "global_step": 645188, "epoch": 7773} {"train_loss": -28.35831069946289, "global_step": 645189, "epoch": 7773} {"train_loss": -28.4766788482666, "global_step": 645190, "epoch": 7773} {"train_loss": -28.0132999420166, "global_step": 645191, "epoch": 7773} {"train_loss": -28.49976921081543, "global_step": 645192, "epoch": 7773} {"train_loss": -28.29498291015625, "global_step": 645193, "epoch": 7773} {"train_loss": -28.247760772705078, "global_step": 645194, "epoch": 7773} {"train_loss": -28.480810165405273, "global_step": 645195, "epoch": 7773} {"train_loss": -28.580764770507812, "global_step": 645196, "epoch": 7773} {"train_loss": -27.84822654724121, "global_step": 645197, "epoch": 7773} {"train_loss": -28.195728302001953, "global_step": 645198, "epoch": 7773} {"train_loss": -28.22002601623535, "global_step": 645199, "epoch": 7773} {"train_loss": -28.861392974853516, "global_step": 645200, "epoch": 7773} {"train_loss": -28.48603630065918, "global_step": 645201, "epoch": 7773} {"train_loss": -27.956525802612305, "global_step": 645202, "epoch": 7773} {"train_loss": -28.119840621948242, "global_step": 645203, "epoch": 7773} {"train_loss": -28.053009033203125, "global_step": 645204, "epoch": 7773} {"train_loss": -28.579456329345703, "global_step": 645205, "epoch": 7773} {"train_loss": -28.584793090820312, "global_step": 645206, "epoch": 7773} {"train_loss": -27.894025802612305, "global_step": 645207, "epoch": 7773} {"train_loss": -28.367578506469727, "global_step": 645208, "epoch": 7773} {"train_loss": -28.559818267822266, "global_step": 645209, "epoch": 7773} {"train_loss": -28.054065704345703, "global_step": 645210, "epoch": 7773} {"train_loss": -28.17191505432129, "global_step": 645211, "epoch": 7773} {"train_loss": -28.371295928955078, "global_step": 645212, "epoch": 7773} {"train_loss": -28.946638107299805, "global_step": 645213, "epoch": 7773} {"train_loss": -28.458703994750977, "global_step": 645214, "epoch": 7773} {"train_loss": -28.3778076171875, "global_step": 645215, "epoch": 7773} {"train_loss": -28.416799545288086, "global_step": 645216, "epoch": 7773} {"train_loss": -28.233251571655273, "global_step": 645217, "epoch": 7773} {"train_loss": -28.522912979125977, "global_step": 645218, "epoch": 7773} {"train_loss": -28.50514793395996, "global_step": 645219, "epoch": 7773} {"train_loss": -28.316837310791016, "global_step": 645220, "epoch": 7773} {"train_loss": -28.046905517578125, "global_step": 645221, "epoch": 7773} {"train_loss": -28.7034912109375, "global_step": 645222, "epoch": 7773} {"train_loss": -28.327198028564453, "global_step": 645223, "epoch": 7773} {"train_loss": -28.411718368530273, "global_step": 645224, "epoch": 7773} {"train_loss": -28.55122184753418, "global_step": 645225, "epoch": 7773} {"train_loss": -27.988656997680664, "global_step": 645226, "epoch": 7773} {"train_loss": -28.57343101501465, "global_step": 645227, "epoch": 7773} {"train_loss": -28.228689193725586, "global_step": 645228, "epoch": 7773} {"train_loss": -28.171466827392578, "global_step": 645229, "epoch": 7773} {"train_loss": -28.529727935791016, "global_step": 645230, "epoch": 7773} {"train_loss": -28.685653686523438, "global_step": 645231, "epoch": 7773} {"train_loss": -28.34515953063965, "global_step": 645232, "epoch": 7773} {"train_loss": -28.24126625061035, "global_step": 645233, "epoch": 7773} {"train_loss": -28.710407257080078, "global_step": 645234, "epoch": 7773} {"train_loss": -28.026397705078125, "global_step": 645235, "epoch": 7773} {"train_loss": -28.61737632751465, "global_step": 645236, "epoch": 7773} {"train_loss": -28.3127498626709, "global_step": 645237, "epoch": 7773} {"train_loss": -28.08615493774414, "global_step": 645238, "epoch": 7773} {"train_loss": -28.319137573242188, "global_step": 645239, "epoch": 7773} {"train_loss": -28.547073364257812, "global_step": 645240, "epoch": 7773} {"train_loss": -28.309669609529426, "global_step": 645241, "epoch": 7773, "val_loss": 6716420.0} {"train_loss": -27.961729049682617, "global_step": 645242, "epoch": 7774} {"train_loss": -27.9675350189209, "global_step": 645243, "epoch": 7774} {"train_loss": -27.52094841003418, "global_step": 645244, "epoch": 7774} {"train_loss": -26.927642822265625, "global_step": 645245, "epoch": 7774} {"train_loss": -27.51143455505371, "global_step": 645246, "epoch": 7774} {"train_loss": -27.686010360717773, "global_step": 645247, "epoch": 7774} {"train_loss": -27.812910079956055, "global_step": 645248, "epoch": 7774} {"train_loss": -27.887670516967773, "global_step": 645249, "epoch": 7774} {"train_loss": -27.786590576171875, "global_step": 645250, "epoch": 7774} {"train_loss": -28.305572509765625, "global_step": 645251, "epoch": 7774} {"train_loss": -28.04376792907715, "global_step": 645252, "epoch": 7774} {"train_loss": -28.058032989501953, "global_step": 645253, "epoch": 7774} {"train_loss": -28.048063278198242, "global_step": 645254, "epoch": 7774} {"train_loss": -27.84061050415039, "global_step": 645255, "epoch": 7774} {"train_loss": -27.881946563720703, "global_step": 645256, "epoch": 7774} {"train_loss": -28.265216827392578, "global_step": 645257, "epoch": 7774} {"train_loss": -27.67511558532715, "global_step": 645258, "epoch": 7774} {"train_loss": -28.34619140625, "global_step": 645259, "epoch": 7774} {"train_loss": -28.005172729492188, "global_step": 645260, "epoch": 7774} {"train_loss": -28.056928634643555, "global_step": 645261, "epoch": 7774} {"train_loss": -27.894086837768555, "global_step": 645262, "epoch": 7774} {"train_loss": -28.24161720275879, "global_step": 645263, "epoch": 7774} {"train_loss": -28.471038818359375, "global_step": 645264, "epoch": 7774} {"train_loss": -28.0058536529541, "global_step": 645265, "epoch": 7774} {"train_loss": -27.848493576049805, "global_step": 645266, "epoch": 7774} {"train_loss": -28.234100341796875, "global_step": 645267, "epoch": 7774} {"train_loss": -27.909372329711914, "global_step": 645268, "epoch": 7774} {"train_loss": -27.968036651611328, "global_step": 645269, "epoch": 7774} {"train_loss": -28.172597885131836, "global_step": 645270, "epoch": 7774} {"train_loss": -28.380929946899414, "global_step": 645271, "epoch": 7774} {"train_loss": -27.8704776763916, "global_step": 645272, "epoch": 7774} {"train_loss": -28.20179557800293, "global_step": 645273, "epoch": 7774} {"train_loss": -28.4154052734375, "global_step": 645274, "epoch": 7774} {"train_loss": -28.337554931640625, "global_step": 645275, "epoch": 7774} {"train_loss": -28.290868759155273, "global_step": 645276, "epoch": 7774} {"train_loss": -28.754596710205078, "global_step": 645277, "epoch": 7774} {"train_loss": -28.245758056640625, "global_step": 645278, "epoch": 7774} {"train_loss": -28.180932998657227, "global_step": 645279, "epoch": 7774} {"train_loss": -28.348676681518555, "global_step": 645280, "epoch": 7774} {"train_loss": -28.57938575744629, "global_step": 645281, "epoch": 7774} {"train_loss": -28.418195724487305, "global_step": 645282, "epoch": 7774} {"train_loss": -28.41937255859375, "global_step": 645283, "epoch": 7774} {"train_loss": -28.312824249267578, "global_step": 645284, "epoch": 7774} {"train_loss": -28.328943252563477, "global_step": 645285, "epoch": 7774} {"train_loss": -28.375186920166016, "global_step": 645286, "epoch": 7774} {"train_loss": -28.629758834838867, "global_step": 645287, "epoch": 7774} {"train_loss": -28.490478515625, "global_step": 645288, "epoch": 7774} {"train_loss": -28.339797973632812, "global_step": 645289, "epoch": 7774} {"train_loss": -28.05413818359375, "global_step": 645290, "epoch": 7774} {"train_loss": -28.4306640625, "global_step": 645291, "epoch": 7774} {"train_loss": -28.40423011779785, "global_step": 645292, "epoch": 7774} {"train_loss": -28.771244049072266, "global_step": 645293, "epoch": 7774} {"train_loss": -28.541650772094727, "global_step": 645294, "epoch": 7774} {"train_loss": -28.631772994995117, "global_step": 645295, "epoch": 7774} {"train_loss": -28.655750274658203, "global_step": 645296, "epoch": 7774} {"train_loss": -28.422758102416992, "global_step": 645297, "epoch": 7774} {"train_loss": -28.675003051757812, "global_step": 645298, "epoch": 7774} {"train_loss": -28.309858322143555, "global_step": 645299, "epoch": 7774} {"train_loss": -28.10001564025879, "global_step": 645300, "epoch": 7774} {"train_loss": -28.3670711517334, "global_step": 645301, "epoch": 7774} {"train_loss": -28.1844425201416, "global_step": 645302, "epoch": 7774} {"train_loss": -28.1384220123291, "global_step": 645303, "epoch": 7774} {"train_loss": -28.14430046081543, "global_step": 645304, "epoch": 7774} {"train_loss": -28.22895622253418, "global_step": 645305, "epoch": 7774} {"train_loss": -28.155078887939453, "global_step": 645306, "epoch": 7774} {"train_loss": -28.26091957092285, "global_step": 645307, "epoch": 7774} {"train_loss": -27.54060173034668, "global_step": 645308, "epoch": 7774} {"train_loss": -28.078893661499023, "global_step": 645309, "epoch": 7774} {"train_loss": -28.125732421875, "global_step": 645310, "epoch": 7774} {"train_loss": -27.948522567749023, "global_step": 645311, "epoch": 7774} {"train_loss": -27.976688385009766, "global_step": 645312, "epoch": 7774} {"train_loss": -28.36207389831543, "global_step": 645313, "epoch": 7774} {"train_loss": -28.048999786376953, "global_step": 645314, "epoch": 7774} {"train_loss": -28.399633407592773, "global_step": 645315, "epoch": 7774} {"train_loss": -28.180511474609375, "global_step": 645316, "epoch": 7774} {"train_loss": -28.077871322631836, "global_step": 645317, "epoch": 7774} {"train_loss": -28.21435546875, "global_step": 645318, "epoch": 7774} {"train_loss": -28.270910263061523, "global_step": 645319, "epoch": 7774} {"train_loss": -28.557891845703125, "global_step": 645320, "epoch": 7774} {"train_loss": -28.582746505737305, "global_step": 645321, "epoch": 7774} {"train_loss": -28.340087890625, "global_step": 645322, "epoch": 7774} {"train_loss": -28.322223663330078, "global_step": 645323, "epoch": 7774} {"train_loss": -28.16625158470797, "global_step": 645324, "epoch": 7774, "val_loss": 6686098.0} {"train_loss": -26.60029411315918, "global_step": 645325, "epoch": 7775} {"train_loss": -27.0123291015625, "global_step": 645326, "epoch": 7775} {"train_loss": -27.18226432800293, "global_step": 645327, "epoch": 7775} {"train_loss": -26.977903366088867, "global_step": 645328, "epoch": 7775} {"train_loss": -27.07440757751465, "global_step": 645329, "epoch": 7775} {"train_loss": -27.1917781829834, "global_step": 645330, "epoch": 7775} {"train_loss": -27.55756187438965, "global_step": 645331, "epoch": 7775} {"train_loss": -27.714181900024414, "global_step": 645332, "epoch": 7775} {"train_loss": -27.742450714111328, "global_step": 645333, "epoch": 7775} {"train_loss": -27.491601943969727, "global_step": 645334, "epoch": 7775} {"train_loss": -27.6751708984375, "global_step": 645335, "epoch": 7775} {"train_loss": -27.387897491455078, "global_step": 645336, "epoch": 7775} {"train_loss": -27.820209503173828, "global_step": 645337, "epoch": 7775} {"train_loss": -27.62094497680664, "global_step": 645338, "epoch": 7775} {"train_loss": -28.32381248474121, "global_step": 645339, "epoch": 7775} {"train_loss": -27.505786895751953, "global_step": 645340, "epoch": 7775} {"train_loss": -27.943857192993164, "global_step": 645341, "epoch": 7775} {"train_loss": -28.02555274963379, "global_step": 645342, "epoch": 7775} {"train_loss": -27.667926788330078, "global_step": 645343, "epoch": 7775} {"train_loss": -28.064773559570312, "global_step": 645344, "epoch": 7775} {"train_loss": -28.110092163085938, "global_step": 645345, "epoch": 7775} {"train_loss": -28.180313110351562, "global_step": 645346, "epoch": 7775} {"train_loss": -27.777185440063477, "global_step": 645347, "epoch": 7775} {"train_loss": -27.915586471557617, "global_step": 645348, "epoch": 7775} {"train_loss": -28.114105224609375, "global_step": 645349, "epoch": 7775} {"train_loss": -28.013166427612305, "global_step": 645350, "epoch": 7775} {"train_loss": -27.90058708190918, "global_step": 645351, "epoch": 7775} {"train_loss": -28.125350952148438, "global_step": 645352, "epoch": 7775} {"train_loss": -28.067962646484375, "global_step": 645353, "epoch": 7775} {"train_loss": -27.964160919189453, "global_step": 645354, "epoch": 7775} {"train_loss": -28.15374755859375, "global_step": 645355, "epoch": 7775} {"train_loss": -27.983184814453125, "global_step": 645356, "epoch": 7775} {"train_loss": -27.83152198791504, "global_step": 645357, "epoch": 7775} {"train_loss": -28.093734741210938, "global_step": 645358, "epoch": 7775} {"train_loss": -28.162656784057617, "global_step": 645359, "epoch": 7775} {"train_loss": -28.34943199157715, "global_step": 645360, "epoch": 7775} {"train_loss": -28.27215576171875, "global_step": 645361, "epoch": 7775} {"train_loss": -28.220617294311523, "global_step": 645362, "epoch": 7775} {"train_loss": -28.404998779296875, "global_step": 645363, "epoch": 7775} {"train_loss": -28.363218307495117, "global_step": 645364, "epoch": 7775} {"train_loss": -28.063739776611328, "global_step": 645365, "epoch": 7775} {"train_loss": -28.080078125, "global_step": 645366, "epoch": 7775} {"train_loss": -28.35332679748535, "global_step": 645367, "epoch": 7775} {"train_loss": -28.2769718170166, "global_step": 645368, "epoch": 7775} {"train_loss": -28.034809112548828, "global_step": 645369, "epoch": 7775} {"train_loss": -28.212366104125977, "global_step": 645370, "epoch": 7775} {"train_loss": -28.57752799987793, "global_step": 645371, "epoch": 7775} {"train_loss": -28.58942985534668, "global_step": 645372, "epoch": 7775} {"train_loss": -28.658233642578125, "global_step": 645373, "epoch": 7775} {"train_loss": -28.603208541870117, "global_step": 645374, "epoch": 7775} {"train_loss": -28.251434326171875, "global_step": 645375, "epoch": 7775} {"train_loss": -28.299402236938477, "global_step": 645376, "epoch": 7775} {"train_loss": -28.405216217041016, "global_step": 645377, "epoch": 7775} {"train_loss": -28.303075790405273, "global_step": 645378, "epoch": 7775} {"train_loss": -28.642974853515625, "global_step": 645379, "epoch": 7775} {"train_loss": -28.649988174438477, "global_step": 645380, "epoch": 7775} {"train_loss": -28.568836212158203, "global_step": 645381, "epoch": 7775} {"train_loss": -28.47446632385254, "global_step": 645382, "epoch": 7775} {"train_loss": -28.022321701049805, "global_step": 645383, "epoch": 7775} {"train_loss": -28.404260635375977, "global_step": 645384, "epoch": 7775} {"train_loss": -28.5507755279541, "global_step": 645385, "epoch": 7775} {"train_loss": -28.344532012939453, "global_step": 645386, "epoch": 7775} {"train_loss": -28.71453857421875, "global_step": 645387, "epoch": 7775} {"train_loss": -28.19305992126465, "global_step": 645388, "epoch": 7775} {"train_loss": -28.390033721923828, "global_step": 645389, "epoch": 7775} {"train_loss": -28.413293838500977, "global_step": 645390, "epoch": 7775} {"train_loss": -28.753421783447266, "global_step": 645391, "epoch": 7775} {"train_loss": -28.398487091064453, "global_step": 645392, "epoch": 7775} {"train_loss": -27.741125106811523, "global_step": 645393, "epoch": 7775} {"train_loss": -27.810226440429688, "global_step": 645394, "epoch": 7775} {"train_loss": -27.699111938476562, "global_step": 645395, "epoch": 7775} {"train_loss": -27.63176918029785, "global_step": 645396, "epoch": 7775} {"train_loss": -27.64796257019043, "global_step": 645397, "epoch": 7775} {"train_loss": -28.121047973632812, "global_step": 645398, "epoch": 7775} {"train_loss": -27.89851188659668, "global_step": 645399, "epoch": 7775} {"train_loss": -28.012954711914062, "global_step": 645400, "epoch": 7775} {"train_loss": -28.000320434570312, "global_step": 645401, "epoch": 7775} {"train_loss": -27.56565284729004, "global_step": 645402, "epoch": 7775} {"train_loss": -28.348352432250977, "global_step": 645403, "epoch": 7775} {"train_loss": -28.125696182250977, "global_step": 645404, "epoch": 7775} {"train_loss": -28.04498291015625, "global_step": 645405, "epoch": 7775} {"train_loss": -27.92083168029785, "global_step": 645406, "epoch": 7775} {"train_loss": -28.030232418014343, "global_step": 645407, "epoch": 7775, "val_loss": 6599343.0} {"train_loss": -27.95258140563965, "global_step": 645408, "epoch": 7776} {"train_loss": -27.406024932861328, "global_step": 645409, "epoch": 7776} {"train_loss": -26.57368278503418, "global_step": 645410, "epoch": 7776} {"train_loss": -27.68460464477539, "global_step": 645411, "epoch": 7776} {"train_loss": -27.094717025756836, "global_step": 645412, "epoch": 7776} {"train_loss": -27.622961044311523, "global_step": 645413, "epoch": 7776} {"train_loss": -27.910497665405273, "global_step": 645414, "epoch": 7776} {"train_loss": -27.037961959838867, "global_step": 645415, "epoch": 7776} {"train_loss": -27.477136611938477, "global_step": 645416, "epoch": 7776} {"train_loss": -27.339401245117188, "global_step": 645417, "epoch": 7776} {"train_loss": -27.5351505279541, "global_step": 645418, "epoch": 7776} {"train_loss": -27.707508087158203, "global_step": 645419, "epoch": 7776} {"train_loss": -27.7186222076416, "global_step": 645420, "epoch": 7776} {"train_loss": -27.466562271118164, "global_step": 645421, "epoch": 7776} {"train_loss": -27.7608585357666, "global_step": 645422, "epoch": 7776} {"train_loss": -27.393707275390625, "global_step": 645423, "epoch": 7776} {"train_loss": -27.45600700378418, "global_step": 645424, "epoch": 7776} {"train_loss": -28.393247604370117, "global_step": 645425, "epoch": 7776} {"train_loss": -27.776548385620117, "global_step": 645426, "epoch": 7776} {"train_loss": -27.550962448120117, "global_step": 645427, "epoch": 7776} {"train_loss": -28.044086456298828, "global_step": 645428, "epoch": 7776} {"train_loss": -28.079904556274414, "global_step": 645429, "epoch": 7776} {"train_loss": -28.08319091796875, "global_step": 645430, "epoch": 7776} {"train_loss": -27.948144912719727, "global_step": 645431, "epoch": 7776} {"train_loss": -27.947296142578125, "global_step": 645432, "epoch": 7776} {"train_loss": -27.89739990234375, "global_step": 645433, "epoch": 7776} {"train_loss": -28.11678123474121, "global_step": 645434, "epoch": 7776} {"train_loss": -28.188867568969727, "global_step": 645435, "epoch": 7776} {"train_loss": -28.082538604736328, "global_step": 645436, "epoch": 7776} {"train_loss": -28.35976219177246, "global_step": 645437, "epoch": 7776} {"train_loss": -28.417142868041992, "global_step": 645438, "epoch": 7776} {"train_loss": -28.33796501159668, "global_step": 645439, "epoch": 7776} {"train_loss": -27.957813262939453, "global_step": 645440, "epoch": 7776} {"train_loss": -28.2208309173584, "global_step": 645441, "epoch": 7776} {"train_loss": -28.024906158447266, "global_step": 645442, "epoch": 7776} {"train_loss": -27.927658081054688, "global_step": 645443, "epoch": 7776} {"train_loss": -28.137304306030273, "global_step": 645444, "epoch": 7776} {"train_loss": -28.4245548248291, "global_step": 645445, "epoch": 7776} {"train_loss": -28.19353675842285, "global_step": 645446, "epoch": 7776} {"train_loss": -28.289310455322266, "global_step": 645447, "epoch": 7776} {"train_loss": -28.404056549072266, "global_step": 645448, "epoch": 7776} {"train_loss": -28.179244995117188, "global_step": 645449, "epoch": 7776} {"train_loss": -28.37872314453125, "global_step": 645450, "epoch": 7776} {"train_loss": -28.66952896118164, "global_step": 645451, "epoch": 7776} {"train_loss": -28.42547035217285, "global_step": 645452, "epoch": 7776} {"train_loss": -28.433094024658203, "global_step": 645453, "epoch": 7776} {"train_loss": -28.453210830688477, "global_step": 645454, "epoch": 7776} {"train_loss": -28.305273056030273, "global_step": 645455, "epoch": 7776} {"train_loss": -28.233083724975586, "global_step": 645456, "epoch": 7776} {"train_loss": -28.5296630859375, "global_step": 645457, "epoch": 7776} {"train_loss": -28.469518661499023, "global_step": 645458, "epoch": 7776} {"train_loss": -28.42591667175293, "global_step": 645459, "epoch": 7776} {"train_loss": -27.97870445251465, "global_step": 645460, "epoch": 7776} {"train_loss": -28.196929931640625, "global_step": 645461, "epoch": 7776} {"train_loss": -27.996976852416992, "global_step": 645462, "epoch": 7776} {"train_loss": -27.23431968688965, "global_step": 645463, "epoch": 7776} {"train_loss": -26.858896255493164, "global_step": 645464, "epoch": 7776} {"train_loss": -26.264280319213867, "global_step": 645465, "epoch": 7776} {"train_loss": -26.757795333862305, "global_step": 645466, "epoch": 7776} {"train_loss": -28.209735870361328, "global_step": 645467, "epoch": 7776} {"train_loss": -27.459684371948242, "global_step": 645468, "epoch": 7776} {"train_loss": -27.43840980529785, "global_step": 645469, "epoch": 7776} {"train_loss": -28.056446075439453, "global_step": 645470, "epoch": 7776} {"train_loss": -27.399023056030273, "global_step": 645471, "epoch": 7776} {"train_loss": -28.184900283813477, "global_step": 645472, "epoch": 7776} {"train_loss": -28.004138946533203, "global_step": 645473, "epoch": 7776} {"train_loss": -27.832733154296875, "global_step": 645474, "epoch": 7776} {"train_loss": -28.196796417236328, "global_step": 645475, "epoch": 7776} {"train_loss": -28.480701446533203, "global_step": 645476, "epoch": 7776} {"train_loss": -27.99159812927246, "global_step": 645477, "epoch": 7776} {"train_loss": -28.35175895690918, "global_step": 645478, "epoch": 7776} {"train_loss": -27.929828643798828, "global_step": 645479, "epoch": 7776} {"train_loss": -27.741849899291992, "global_step": 645480, "epoch": 7776} {"train_loss": -28.111188888549805, "global_step": 645481, "epoch": 7776} {"train_loss": -28.01503562927246, "global_step": 645482, "epoch": 7776} {"train_loss": -28.39420509338379, "global_step": 645483, "epoch": 7776} {"train_loss": -28.198150634765625, "global_step": 645484, "epoch": 7776} {"train_loss": -28.224502563476562, "global_step": 645485, "epoch": 7776} {"train_loss": -28.54385757446289, "global_step": 645486, "epoch": 7776} {"train_loss": -28.131546020507812, "global_step": 645487, "epoch": 7776} {"train_loss": -28.086984634399414, "global_step": 645488, "epoch": 7776} {"train_loss": -27.780059814453125, "global_step": 645489, "epoch": 7776} {"train_loss": -27.94522947288421, "global_step": 645490, "epoch": 7776, "val_loss": 6620552.0} {"train_loss": -28.08367919921875, "global_step": 645491, "epoch": 7777} {"train_loss": -28.0727596282959, "global_step": 645492, "epoch": 7777} {"train_loss": -28.127405166625977, "global_step": 645493, "epoch": 7777} {"train_loss": -28.054492950439453, "global_step": 645494, "epoch": 7777} {"train_loss": -27.990753173828125, "global_step": 645495, "epoch": 7777} {"train_loss": -28.072172164916992, "global_step": 645496, "epoch": 7777} {"train_loss": -28.343713760375977, "global_step": 645497, "epoch": 7777} {"train_loss": -27.914209365844727, "global_step": 645498, "epoch": 7777} {"train_loss": -28.26252555847168, "global_step": 645499, "epoch": 7777} {"train_loss": -28.10310935974121, "global_step": 645500, "epoch": 7777} {"train_loss": -28.292394638061523, "global_step": 645501, "epoch": 7777} {"train_loss": -28.150989532470703, "global_step": 645502, "epoch": 7777} {"train_loss": -28.136402130126953, "global_step": 645503, "epoch": 7777} {"train_loss": -28.0880184173584, "global_step": 645504, "epoch": 7777} {"train_loss": -28.073810577392578, "global_step": 645505, "epoch": 7777} {"train_loss": -28.038461685180664, "global_step": 645506, "epoch": 7777} {"train_loss": -28.38970375061035, "global_step": 645507, "epoch": 7777} {"train_loss": -28.131269454956055, "global_step": 645508, "epoch": 7777} {"train_loss": -28.08744239807129, "global_step": 645509, "epoch": 7777} {"train_loss": -28.34278678894043, "global_step": 645510, "epoch": 7777} {"train_loss": -28.2518310546875, "global_step": 645511, "epoch": 7777} {"train_loss": -28.445215225219727, "global_step": 645512, "epoch": 7777} {"train_loss": -28.432886123657227, "global_step": 645513, "epoch": 7777} {"train_loss": -28.495031356811523, "global_step": 645514, "epoch": 7777} {"train_loss": -28.375028610229492, "global_step": 645515, "epoch": 7777} {"train_loss": -28.673431396484375, "global_step": 645516, "epoch": 7777} {"train_loss": -28.408740997314453, "global_step": 645517, "epoch": 7777} {"train_loss": -27.933013916015625, "global_step": 645518, "epoch": 7777} {"train_loss": -28.448444366455078, "global_step": 645519, "epoch": 7777} {"train_loss": -28.75054931640625, "global_step": 645520, "epoch": 7777} {"train_loss": -28.265066146850586, "global_step": 645521, "epoch": 7777} {"train_loss": -28.29741859436035, "global_step": 645522, "epoch": 7777} {"train_loss": -28.4100341796875, "global_step": 645523, "epoch": 7777} {"train_loss": -28.22946548461914, "global_step": 645524, "epoch": 7777} {"train_loss": -28.654865264892578, "global_step": 645525, "epoch": 7777} {"train_loss": -28.4378662109375, "global_step": 645526, "epoch": 7777} {"train_loss": -28.336008071899414, "global_step": 645527, "epoch": 7777} {"train_loss": -28.346830368041992, "global_step": 645528, "epoch": 7777} {"train_loss": -28.889318466186523, "global_step": 645529, "epoch": 7777} {"train_loss": -28.37576675415039, "global_step": 645530, "epoch": 7777} {"train_loss": -28.176435470581055, "global_step": 645531, "epoch": 7777} {"train_loss": -28.724939346313477, "global_step": 645532, "epoch": 7777} {"train_loss": -28.596424102783203, "global_step": 645533, "epoch": 7777} {"train_loss": -28.327396392822266, "global_step": 645534, "epoch": 7777} {"train_loss": -28.530248641967773, "global_step": 645535, "epoch": 7777} {"train_loss": -28.502490997314453, "global_step": 645536, "epoch": 7777} {"train_loss": -28.252466201782227, "global_step": 645537, "epoch": 7777} {"train_loss": -28.874242782592773, "global_step": 645538, "epoch": 7777} {"train_loss": -28.461750030517578, "global_step": 645539, "epoch": 7777} {"train_loss": -28.409976959228516, "global_step": 645540, "epoch": 7777} {"train_loss": -28.617162704467773, "global_step": 645541, "epoch": 7777} {"train_loss": -28.485443115234375, "global_step": 645542, "epoch": 7777} {"train_loss": -28.61236572265625, "global_step": 645543, "epoch": 7777} {"train_loss": -28.22983169555664, "global_step": 645544, "epoch": 7777} {"train_loss": -28.20973014831543, "global_step": 645545, "epoch": 7777} {"train_loss": -27.826446533203125, "global_step": 645546, "epoch": 7777} {"train_loss": -26.068220138549805, "global_step": 645547, "epoch": 7777} {"train_loss": -21.198017120361328, "global_step": 645548, "epoch": 7777} {"train_loss": -19.481138229370117, "global_step": 645549, "epoch": 7777} {"train_loss": -27.519147872924805, "global_step": 645550, "epoch": 7777} {"train_loss": -22.557703018188477, "global_step": 645551, "epoch": 7777} {"train_loss": -26.51392936706543, "global_step": 645552, "epoch": 7777} {"train_loss": -24.361618041992188, "global_step": 645553, "epoch": 7777} {"train_loss": -26.077558517456055, "global_step": 645554, "epoch": 7777} {"train_loss": -26.7630615234375, "global_step": 645555, "epoch": 7777} {"train_loss": -25.991971969604492, "global_step": 645556, "epoch": 7777} {"train_loss": -26.619705200195312, "global_step": 645557, "epoch": 7777} {"train_loss": -27.144489288330078, "global_step": 645558, "epoch": 7777} {"train_loss": -26.96285057067871, "global_step": 645559, "epoch": 7777} {"train_loss": -26.59307861328125, "global_step": 645560, "epoch": 7777} {"train_loss": -26.878747940063477, "global_step": 645561, "epoch": 7777} {"train_loss": -27.18729019165039, "global_step": 645562, "epoch": 7777} {"train_loss": -27.652135848999023, "global_step": 645563, "epoch": 7777} {"train_loss": -27.25603675842285, "global_step": 645564, "epoch": 7777} {"train_loss": -27.467517852783203, "global_step": 645565, "epoch": 7777} {"train_loss": -26.94734001159668, "global_step": 645566, "epoch": 7777} {"train_loss": -27.222925186157227, "global_step": 645567, "epoch": 7777} {"train_loss": -27.372455596923828, "global_step": 645568, "epoch": 7777} {"train_loss": -27.553985595703125, "global_step": 645569, "epoch": 7777} {"train_loss": -27.52205467224121, "global_step": 645570, "epoch": 7777} {"train_loss": -27.593036651611328, "global_step": 645571, "epoch": 7777} {"train_loss": -27.360960006713867, "global_step": 645572, "epoch": 7777} {"train_loss": -27.652299030717597, "global_step": 645573, "epoch": 7777, "val_loss": 6609057.0} {"train_loss": -27.333820343017578, "global_step": 645574, "epoch": 7778} {"train_loss": -27.308263778686523, "global_step": 645575, "epoch": 7778} {"train_loss": -27.189453125, "global_step": 645576, "epoch": 7778} {"train_loss": -27.142993927001953, "global_step": 645577, "epoch": 7778} {"train_loss": -27.380624771118164, "global_step": 645578, "epoch": 7778} {"train_loss": -27.581892013549805, "global_step": 645579, "epoch": 7778} {"train_loss": -27.14515495300293, "global_step": 645580, "epoch": 7778} {"train_loss": -27.36155128479004, "global_step": 645581, "epoch": 7778} {"train_loss": -27.444183349609375, "global_step": 645582, "epoch": 7778} {"train_loss": -27.372018814086914, "global_step": 645583, "epoch": 7778} {"train_loss": -27.020410537719727, "global_step": 645584, "epoch": 7778} {"train_loss": -27.53131103515625, "global_step": 645585, "epoch": 7778} {"train_loss": -27.793720245361328, "global_step": 645586, "epoch": 7778} {"train_loss": -27.375288009643555, "global_step": 645587, "epoch": 7778} {"train_loss": -27.429046630859375, "global_step": 645588, "epoch": 7778} {"train_loss": -27.6141414642334, "global_step": 645589, "epoch": 7778} {"train_loss": -27.424436569213867, "global_step": 645590, "epoch": 7778} {"train_loss": -27.71099853515625, "global_step": 645591, "epoch": 7778} {"train_loss": -27.78369140625, "global_step": 645592, "epoch": 7778} {"train_loss": -27.873889923095703, "global_step": 645593, "epoch": 7778} {"train_loss": -28.008075714111328, "global_step": 645594, "epoch": 7778} {"train_loss": -27.827686309814453, "global_step": 645595, "epoch": 7778} {"train_loss": -27.53907585144043, "global_step": 645596, "epoch": 7778} {"train_loss": -27.97346305847168, "global_step": 645597, "epoch": 7778} {"train_loss": -27.58404541015625, "global_step": 645598, "epoch": 7778} {"train_loss": -28.04762077331543, "global_step": 645599, "epoch": 7778} {"train_loss": -27.94434928894043, "global_step": 645600, "epoch": 7778} {"train_loss": -27.644262313842773, "global_step": 645601, "epoch": 7778} {"train_loss": -27.71895408630371, "global_step": 645602, "epoch": 7778} {"train_loss": -27.94618034362793, "global_step": 645603, "epoch": 7778} {"train_loss": -27.9307918548584, "global_step": 645604, "epoch": 7778} {"train_loss": -27.95906639099121, "global_step": 645605, "epoch": 7778} {"train_loss": -27.933897018432617, "global_step": 645606, "epoch": 7778} {"train_loss": -27.9996395111084, "global_step": 645607, "epoch": 7778} {"train_loss": -28.43521499633789, "global_step": 645608, "epoch": 7778} {"train_loss": -28.074634552001953, "global_step": 645609, "epoch": 7778} {"train_loss": -28.15663719177246, "global_step": 645610, "epoch": 7778} {"train_loss": -28.383575439453125, "global_step": 645611, "epoch": 7778} {"train_loss": -28.482892990112305, "global_step": 645612, "epoch": 7778} {"train_loss": -28.053451538085938, "global_step": 645613, "epoch": 7778} {"train_loss": -28.362457275390625, "global_step": 645614, "epoch": 7778} {"train_loss": -28.09596061706543, "global_step": 645615, "epoch": 7778} {"train_loss": -28.339588165283203, "global_step": 645616, "epoch": 7778} {"train_loss": -28.228612899780273, "global_step": 645617, "epoch": 7778} {"train_loss": -28.329858779907227, "global_step": 645618, "epoch": 7778} {"train_loss": -28.29722023010254, "global_step": 645619, "epoch": 7778} {"train_loss": -28.82600212097168, "global_step": 645620, "epoch": 7778} {"train_loss": -28.289899826049805, "global_step": 645621, "epoch": 7778} {"train_loss": -28.154144287109375, "global_step": 645622, "epoch": 7778} {"train_loss": -27.7225284576416, "global_step": 645623, "epoch": 7778} {"train_loss": -28.21048927307129, "global_step": 645624, "epoch": 7778} {"train_loss": -28.15167808532715, "global_step": 645625, "epoch": 7778} {"train_loss": -28.399484634399414, "global_step": 645626, "epoch": 7778} {"train_loss": -28.223844528198242, "global_step": 645627, "epoch": 7778} {"train_loss": -28.104360580444336, "global_step": 645628, "epoch": 7778} {"train_loss": -28.345169067382812, "global_step": 645629, "epoch": 7778} {"train_loss": -28.67234230041504, "global_step": 645630, "epoch": 7778} {"train_loss": -28.35719871520996, "global_step": 645631, "epoch": 7778} {"train_loss": -27.990476608276367, "global_step": 645632, "epoch": 7778} {"train_loss": -28.382638931274414, "global_step": 645633, "epoch": 7778} {"train_loss": -28.308496475219727, "global_step": 645634, "epoch": 7778} {"train_loss": -28.269067764282227, "global_step": 645635, "epoch": 7778} {"train_loss": -28.094114303588867, "global_step": 645636, "epoch": 7778} {"train_loss": -28.514368057250977, "global_step": 645637, "epoch": 7778} {"train_loss": -28.217329025268555, "global_step": 645638, "epoch": 7778} {"train_loss": -27.63330078125, "global_step": 645639, "epoch": 7778} {"train_loss": -28.04741859436035, "global_step": 645640, "epoch": 7778} {"train_loss": -28.38913345336914, "global_step": 645641, "epoch": 7778} {"train_loss": -28.150562286376953, "global_step": 645642, "epoch": 7778} {"train_loss": -28.254352569580078, "global_step": 645643, "epoch": 7778} {"train_loss": -27.794797897338867, "global_step": 645644, "epoch": 7778} {"train_loss": -27.90802574157715, "global_step": 645645, "epoch": 7778} {"train_loss": -27.934879302978516, "global_step": 645646, "epoch": 7778} {"train_loss": -28.44331169128418, "global_step": 645647, "epoch": 7778} {"train_loss": -27.8083438873291, "global_step": 645648, "epoch": 7778} {"train_loss": -27.569629669189453, "global_step": 645649, "epoch": 7778} {"train_loss": -28.227874755859375, "global_step": 645650, "epoch": 7778} {"train_loss": -27.858566284179688, "global_step": 645651, "epoch": 7778} {"train_loss": -28.4096736907959, "global_step": 645652, "epoch": 7778} {"train_loss": -27.882665634155273, "global_step": 645653, "epoch": 7778} {"train_loss": -28.159780502319336, "global_step": 645654, "epoch": 7778} {"train_loss": -28.432880401611328, "global_step": 645655, "epoch": 7778} {"train_loss": -27.954643226531616, "global_step": 645656, "epoch": 7778, "val_loss": 6660981.0} {"train_loss": -27.228193283081055, "global_step": 645657, "epoch": 7779} {"train_loss": -27.495319366455078, "global_step": 645658, "epoch": 7779} {"train_loss": -28.143375396728516, "global_step": 645659, "epoch": 7779} {"train_loss": -27.703968048095703, "global_step": 645660, "epoch": 7779} {"train_loss": -27.905542373657227, "global_step": 645661, "epoch": 7779} {"train_loss": -27.591506958007812, "global_step": 645662, "epoch": 7779} {"train_loss": -27.92071533203125, "global_step": 645663, "epoch": 7779} {"train_loss": -27.71929931640625, "global_step": 645664, "epoch": 7779} {"train_loss": -28.148481369018555, "global_step": 645665, "epoch": 7779} {"train_loss": -27.905439376831055, "global_step": 645666, "epoch": 7779} {"train_loss": -27.755329132080078, "global_step": 645667, "epoch": 7779} {"train_loss": -27.633380889892578, "global_step": 645668, "epoch": 7779} {"train_loss": -28.036865234375, "global_step": 645669, "epoch": 7779} {"train_loss": -27.870849609375, "global_step": 645670, "epoch": 7779} {"train_loss": -28.172819137573242, "global_step": 645671, "epoch": 7779} {"train_loss": -28.03785514831543, "global_step": 645672, "epoch": 7779} {"train_loss": -27.542266845703125, "global_step": 645673, "epoch": 7779} {"train_loss": -28.081064224243164, "global_step": 645674, "epoch": 7779} {"train_loss": -28.41251564025879, "global_step": 645675, "epoch": 7779} {"train_loss": -27.737689971923828, "global_step": 645676, "epoch": 7779} {"train_loss": -27.46685218811035, "global_step": 645677, "epoch": 7779} {"train_loss": -28.092742919921875, "global_step": 645678, "epoch": 7779} {"train_loss": -28.265409469604492, "global_step": 645679, "epoch": 7779} {"train_loss": -27.95835304260254, "global_step": 645680, "epoch": 7779} {"train_loss": -28.216726303100586, "global_step": 645681, "epoch": 7779} {"train_loss": -27.799734115600586, "global_step": 645682, "epoch": 7779} {"train_loss": -28.240610122680664, "global_step": 645683, "epoch": 7779} {"train_loss": -28.06292152404785, "global_step": 645684, "epoch": 7779} {"train_loss": -28.407123565673828, "global_step": 645685, "epoch": 7779} {"train_loss": -28.3317928314209, "global_step": 645686, "epoch": 7779} {"train_loss": -28.105756759643555, "global_step": 645687, "epoch": 7779} {"train_loss": -27.869110107421875, "global_step": 645688, "epoch": 7779} {"train_loss": -28.447437286376953, "global_step": 645689, "epoch": 7779} {"train_loss": -28.02313804626465, "global_step": 645690, "epoch": 7779} {"train_loss": -27.990650177001953, "global_step": 645691, "epoch": 7779} {"train_loss": -28.483535766601562, "global_step": 645692, "epoch": 7779} {"train_loss": -28.396223068237305, "global_step": 645693, "epoch": 7779} {"train_loss": -28.010263442993164, "global_step": 645694, "epoch": 7779} {"train_loss": -28.10418128967285, "global_step": 645695, "epoch": 7779} {"train_loss": -27.97781753540039, "global_step": 645696, "epoch": 7779} {"train_loss": -28.422882080078125, "global_step": 645697, "epoch": 7779} {"train_loss": -28.336841583251953, "global_step": 645698, "epoch": 7779} {"train_loss": -28.054929733276367, "global_step": 645699, "epoch": 7779} {"train_loss": -28.63802146911621, "global_step": 645700, "epoch": 7779} {"train_loss": -28.262731552124023, "global_step": 645701, "epoch": 7779} {"train_loss": -28.50233268737793, "global_step": 645702, "epoch": 7779} {"train_loss": -28.19236183166504, "global_step": 645703, "epoch": 7779} {"train_loss": -28.180496215820312, "global_step": 645704, "epoch": 7779} {"train_loss": -28.07960319519043, "global_step": 645705, "epoch": 7779} {"train_loss": -28.693378448486328, "global_step": 645706, "epoch": 7779} {"train_loss": -28.4166316986084, "global_step": 645707, "epoch": 7779} {"train_loss": -28.545934677124023, "global_step": 645708, "epoch": 7779} {"train_loss": -28.43671226501465, "global_step": 645709, "epoch": 7779} {"train_loss": -28.292123794555664, "global_step": 645710, "epoch": 7779} {"train_loss": -28.585721969604492, "global_step": 645711, "epoch": 7779} {"train_loss": -28.482513427734375, "global_step": 645712, "epoch": 7779} {"train_loss": -28.74055290222168, "global_step": 645713, "epoch": 7779} {"train_loss": -28.792572021484375, "global_step": 645714, "epoch": 7779} {"train_loss": -28.647932052612305, "global_step": 645715, "epoch": 7779} {"train_loss": -28.214628219604492, "global_step": 645716, "epoch": 7779} {"train_loss": -28.205148696899414, "global_step": 645717, "epoch": 7779} {"train_loss": -28.125181198120117, "global_step": 645718, "epoch": 7779} {"train_loss": -28.210376739501953, "global_step": 645719, "epoch": 7779} {"train_loss": -28.316150665283203, "global_step": 645720, "epoch": 7779} {"train_loss": -28.395313262939453, "global_step": 645721, "epoch": 7779} {"train_loss": -27.988981246948242, "global_step": 645722, "epoch": 7779} {"train_loss": -28.35393714904785, "global_step": 645723, "epoch": 7779} {"train_loss": -28.382171630859375, "global_step": 645724, "epoch": 7779} {"train_loss": -28.26416015625, "global_step": 645725, "epoch": 7779} {"train_loss": -28.4560546875, "global_step": 645726, "epoch": 7779} {"train_loss": -28.570173263549805, "global_step": 645727, "epoch": 7779} {"train_loss": -28.5001163482666, "global_step": 645728, "epoch": 7779} {"train_loss": -28.59661293029785, "global_step": 645729, "epoch": 7779} {"train_loss": -28.791568756103516, "global_step": 645730, "epoch": 7779} {"train_loss": -28.3936710357666, "global_step": 645731, "epoch": 7779} {"train_loss": -28.221067428588867, "global_step": 645732, "epoch": 7779} {"train_loss": -28.29054069519043, "global_step": 645733, "epoch": 7779} {"train_loss": -28.465375900268555, "global_step": 645734, "epoch": 7779} {"train_loss": -28.370410919189453, "global_step": 645735, "epoch": 7779} {"train_loss": -28.338647842407227, "global_step": 645736, "epoch": 7779} {"train_loss": -28.237274169921875, "global_step": 645737, "epoch": 7779} {"train_loss": -28.31023597717285, "global_step": 645738, "epoch": 7779} {"train_loss": -28.186629214918757, "global_step": 645739, "epoch": 7779, "val_loss": 6640505.0} {"train_loss": -28.379058837890625, "global_step": 645740, "epoch": 7780} {"train_loss": -27.815343856811523, "global_step": 645741, "epoch": 7780} {"train_loss": -28.010141372680664, "global_step": 645742, "epoch": 7780} {"train_loss": -27.8570556640625, "global_step": 645743, "epoch": 7780} {"train_loss": -27.659442901611328, "global_step": 645744, "epoch": 7780} {"train_loss": -27.214462280273438, "global_step": 645745, "epoch": 7780} {"train_loss": -27.5830020904541, "global_step": 645746, "epoch": 7780} {"train_loss": -27.868061065673828, "global_step": 645747, "epoch": 7780} {"train_loss": -27.876556396484375, "global_step": 645748, "epoch": 7780} {"train_loss": -27.71747398376465, "global_step": 645749, "epoch": 7780} {"train_loss": -28.1846923828125, "global_step": 645750, "epoch": 7780} {"train_loss": -27.737668991088867, "global_step": 645751, "epoch": 7780} {"train_loss": -27.899890899658203, "global_step": 645752, "epoch": 7780} {"train_loss": -28.174325942993164, "global_step": 645753, "epoch": 7780} {"train_loss": -28.252450942993164, "global_step": 645754, "epoch": 7780} {"train_loss": -28.247989654541016, "global_step": 645755, "epoch": 7780} {"train_loss": -28.036169052124023, "global_step": 645756, "epoch": 7780} {"train_loss": -28.133039474487305, "global_step": 645757, "epoch": 7780} {"train_loss": -27.992340087890625, "global_step": 645758, "epoch": 7780} {"train_loss": -27.910572052001953, "global_step": 645759, "epoch": 7780} {"train_loss": -28.35515785217285, "global_step": 645760, "epoch": 7780} {"train_loss": -28.300745010375977, "global_step": 645761, "epoch": 7780} {"train_loss": -28.1119441986084, "global_step": 645762, "epoch": 7780} {"train_loss": -28.242725372314453, "global_step": 645763, "epoch": 7780} {"train_loss": -28.118635177612305, "global_step": 645764, "epoch": 7780} {"train_loss": -28.73475456237793, "global_step": 645765, "epoch": 7780} {"train_loss": -28.279870986938477, "global_step": 645766, "epoch": 7780} {"train_loss": -28.2951717376709, "global_step": 645767, "epoch": 7780} {"train_loss": -28.56953239440918, "global_step": 645768, "epoch": 7780} {"train_loss": -28.04258155822754, "global_step": 645769, "epoch": 7780} {"train_loss": -28.541568756103516, "global_step": 645770, "epoch": 7780} {"train_loss": -28.179306030273438, "global_step": 645771, "epoch": 7780} {"train_loss": -28.350183486938477, "global_step": 645772, "epoch": 7780} {"train_loss": -28.46514320373535, "global_step": 645773, "epoch": 7780} {"train_loss": -28.3703670501709, "global_step": 645774, "epoch": 7780} {"train_loss": -28.45265769958496, "global_step": 645775, "epoch": 7780} {"train_loss": -28.08273696899414, "global_step": 645776, "epoch": 7780} {"train_loss": -27.8841495513916, "global_step": 645777, "epoch": 7780} {"train_loss": -28.210596084594727, "global_step": 645778, "epoch": 7780} {"train_loss": -28.676054000854492, "global_step": 645779, "epoch": 7780} {"train_loss": -28.189971923828125, "global_step": 645780, "epoch": 7780} {"train_loss": -28.09624671936035, "global_step": 645781, "epoch": 7780} {"train_loss": -28.579059600830078, "global_step": 645782, "epoch": 7780} {"train_loss": -28.66718101501465, "global_step": 645783, "epoch": 7780} {"train_loss": -28.54802894592285, "global_step": 645784, "epoch": 7780} {"train_loss": -28.372594833374023, "global_step": 645785, "epoch": 7780} {"train_loss": -28.327085494995117, "global_step": 645786, "epoch": 7780} {"train_loss": -28.257465362548828, "global_step": 645787, "epoch": 7780} {"train_loss": -28.7459659576416, "global_step": 645788, "epoch": 7780} {"train_loss": -28.562442779541016, "global_step": 645789, "epoch": 7780} {"train_loss": -28.208820343017578, "global_step": 645790, "epoch": 7780} {"train_loss": -28.4158935546875, "global_step": 645791, "epoch": 7780} {"train_loss": -28.652441024780273, "global_step": 645792, "epoch": 7780} {"train_loss": -28.374908447265625, "global_step": 645793, "epoch": 7780} {"train_loss": -28.53644371032715, "global_step": 645794, "epoch": 7780} {"train_loss": -28.30608558654785, "global_step": 645795, "epoch": 7780} {"train_loss": -28.213348388671875, "global_step": 645796, "epoch": 7780} {"train_loss": -28.091007232666016, "global_step": 645797, "epoch": 7780} {"train_loss": -28.441396713256836, "global_step": 645798, "epoch": 7780} {"train_loss": -27.885766983032227, "global_step": 645799, "epoch": 7780} {"train_loss": -27.7371768951416, "global_step": 645800, "epoch": 7780} {"train_loss": -27.820249557495117, "global_step": 645801, "epoch": 7780} {"train_loss": -27.86880874633789, "global_step": 645802, "epoch": 7780} {"train_loss": -28.716888427734375, "global_step": 645803, "epoch": 7780} {"train_loss": -28.123754501342773, "global_step": 645804, "epoch": 7780} {"train_loss": -28.24909782409668, "global_step": 645805, "epoch": 7780} {"train_loss": -28.407255172729492, "global_step": 645806, "epoch": 7780} {"train_loss": -28.685760498046875, "global_step": 645807, "epoch": 7780} {"train_loss": -28.3906192779541, "global_step": 645808, "epoch": 7780} {"train_loss": -27.984594345092773, "global_step": 645809, "epoch": 7780} {"train_loss": -28.151952743530273, "global_step": 645810, "epoch": 7780} {"train_loss": -28.430896759033203, "global_step": 645811, "epoch": 7780} {"train_loss": -28.45222282409668, "global_step": 645812, "epoch": 7780} {"train_loss": -28.382999420166016, "global_step": 645813, "epoch": 7780} {"train_loss": -28.2260799407959, "global_step": 645814, "epoch": 7780} {"train_loss": -28.313739776611328, "global_step": 645815, "epoch": 7780} {"train_loss": -28.60310173034668, "global_step": 645816, "epoch": 7780} {"train_loss": -28.520410537719727, "global_step": 645817, "epoch": 7780} {"train_loss": -28.353330612182617, "global_step": 645818, "epoch": 7780} {"train_loss": -28.319883346557617, "global_step": 645819, "epoch": 7780} {"train_loss": -28.073949813842773, "global_step": 645820, "epoch": 7780} {"train_loss": -28.250720977783203, "global_step": 645821, "epoch": 7780} {"train_loss": -28.20938664172069, "global_step": 645822, "epoch": 7780, "val_loss": 6597226.5} {"train_loss": -27.277175903320312, "global_step": 645823, "epoch": 7781} {"train_loss": -26.699487686157227, "global_step": 645824, "epoch": 7781} {"train_loss": -26.860193252563477, "global_step": 645825, "epoch": 7781} {"train_loss": -27.997756958007812, "global_step": 645826, "epoch": 7781} {"train_loss": -28.1630859375, "global_step": 645827, "epoch": 7781} {"train_loss": -27.976898193359375, "global_step": 645828, "epoch": 7781} {"train_loss": -27.562122344970703, "global_step": 645829, "epoch": 7781} {"train_loss": -28.062244415283203, "global_step": 645830, "epoch": 7781} {"train_loss": -28.09798240661621, "global_step": 645831, "epoch": 7781} {"train_loss": -28.024234771728516, "global_step": 645832, "epoch": 7781} {"train_loss": -27.65016746520996, "global_step": 645833, "epoch": 7781} {"train_loss": -28.01141357421875, "global_step": 645834, "epoch": 7781} {"train_loss": -27.58736228942871, "global_step": 645835, "epoch": 7781} {"train_loss": -27.890478134155273, "global_step": 645836, "epoch": 7781} {"train_loss": -27.941152572631836, "global_step": 645837, "epoch": 7781} {"train_loss": -28.1453857421875, "global_step": 645838, "epoch": 7781} {"train_loss": -28.257349014282227, "global_step": 645839, "epoch": 7781} {"train_loss": -28.373367309570312, "global_step": 645840, "epoch": 7781} {"train_loss": -28.10700035095215, "global_step": 645841, "epoch": 7781} {"train_loss": -27.992176055908203, "global_step": 645842, "epoch": 7781} {"train_loss": -27.934865951538086, "global_step": 645843, "epoch": 7781} {"train_loss": -28.48270606994629, "global_step": 645844, "epoch": 7781} {"train_loss": -28.526142120361328, "global_step": 645845, "epoch": 7781} {"train_loss": -28.312726974487305, "global_step": 645846, "epoch": 7781} {"train_loss": -28.6076717376709, "global_step": 645847, "epoch": 7781} {"train_loss": -28.448389053344727, "global_step": 645848, "epoch": 7781} {"train_loss": -28.303373336791992, "global_step": 645849, "epoch": 7781} {"train_loss": -28.549835205078125, "global_step": 645850, "epoch": 7781} {"train_loss": -28.297733306884766, "global_step": 645851, "epoch": 7781} {"train_loss": -28.188751220703125, "global_step": 645852, "epoch": 7781} {"train_loss": -28.544897079467773, "global_step": 645853, "epoch": 7781} {"train_loss": -28.2855224609375, "global_step": 645854, "epoch": 7781} {"train_loss": -28.353103637695312, "global_step": 645855, "epoch": 7781} {"train_loss": -28.308603286743164, "global_step": 645856, "epoch": 7781} {"train_loss": -28.201353073120117, "global_step": 645857, "epoch": 7781} {"train_loss": -28.45672035217285, "global_step": 645858, "epoch": 7781} {"train_loss": -28.278457641601562, "global_step": 645859, "epoch": 7781} {"train_loss": -28.405080795288086, "global_step": 645860, "epoch": 7781} {"train_loss": -28.0992374420166, "global_step": 645861, "epoch": 7781} {"train_loss": -28.328784942626953, "global_step": 645862, "epoch": 7781} {"train_loss": -28.535633087158203, "global_step": 645863, "epoch": 7781} {"train_loss": -28.620580673217773, "global_step": 645864, "epoch": 7781} {"train_loss": -28.380023956298828, "global_step": 645865, "epoch": 7781} {"train_loss": -28.241077423095703, "global_step": 645866, "epoch": 7781} {"train_loss": -28.454309463500977, "global_step": 645867, "epoch": 7781} {"train_loss": -28.509418487548828, "global_step": 645868, "epoch": 7781} {"train_loss": -28.54437255859375, "global_step": 645869, "epoch": 7781} {"train_loss": -28.460330963134766, "global_step": 645870, "epoch": 7781} {"train_loss": -28.556970596313477, "global_step": 645871, "epoch": 7781} {"train_loss": -28.2509822845459, "global_step": 645872, "epoch": 7781} {"train_loss": -28.294092178344727, "global_step": 645873, "epoch": 7781} {"train_loss": -28.570600509643555, "global_step": 645874, "epoch": 7781} {"train_loss": -28.14032554626465, "global_step": 645875, "epoch": 7781} {"train_loss": -28.635156631469727, "global_step": 645876, "epoch": 7781} {"train_loss": -28.439245223999023, "global_step": 645877, "epoch": 7781} {"train_loss": -28.141788482666016, "global_step": 645878, "epoch": 7781} {"train_loss": -28.36224365234375, "global_step": 645879, "epoch": 7781} {"train_loss": -28.435348510742188, "global_step": 645880, "epoch": 7781} {"train_loss": -28.65276527404785, "global_step": 645881, "epoch": 7781} {"train_loss": -28.1506290435791, "global_step": 645882, "epoch": 7781} {"train_loss": -28.491352081298828, "global_step": 645883, "epoch": 7781} {"train_loss": -28.433868408203125, "global_step": 645884, "epoch": 7781} {"train_loss": -28.558740615844727, "global_step": 645885, "epoch": 7781} {"train_loss": -28.337493896484375, "global_step": 645886, "epoch": 7781} {"train_loss": -28.31805419921875, "global_step": 645887, "epoch": 7781} {"train_loss": -28.655872344970703, "global_step": 645888, "epoch": 7781} {"train_loss": -28.550128936767578, "global_step": 645889, "epoch": 7781} {"train_loss": -28.547216415405273, "global_step": 645890, "epoch": 7781} {"train_loss": -28.53456687927246, "global_step": 645891, "epoch": 7781} {"train_loss": -28.40667724609375, "global_step": 645892, "epoch": 7781} {"train_loss": -28.47354507446289, "global_step": 645893, "epoch": 7781} {"train_loss": -28.364728927612305, "global_step": 645894, "epoch": 7781} {"train_loss": -28.351648330688477, "global_step": 645895, "epoch": 7781} {"train_loss": -28.174274444580078, "global_step": 645896, "epoch": 7781} {"train_loss": -28.5498046875, "global_step": 645897, "epoch": 7781} {"train_loss": -28.354511260986328, "global_step": 645898, "epoch": 7781} {"train_loss": -28.395132064819336, "global_step": 645899, "epoch": 7781} {"train_loss": -28.27263832092285, "global_step": 645900, "epoch": 7781} {"train_loss": -28.514545440673828, "global_step": 645901, "epoch": 7781} {"train_loss": -28.471328735351562, "global_step": 645902, "epoch": 7781} {"train_loss": -28.355182647705078, "global_step": 645903, "epoch": 7781} {"train_loss": -28.047637939453125, "global_step": 645904, "epoch": 7781} {"train_loss": -28.276130078786828, "global_step": 645905, "epoch": 7781, "val_loss": 6615008.0} {"train_loss": -27.546735763549805, "global_step": 645906, "epoch": 7782} {"train_loss": -27.41788673400879, "global_step": 645907, "epoch": 7782} {"train_loss": -28.04615592956543, "global_step": 645908, "epoch": 7782} {"train_loss": -27.751712799072266, "global_step": 645909, "epoch": 7782} {"train_loss": -27.59564208984375, "global_step": 645910, "epoch": 7782} {"train_loss": -27.704788208007812, "global_step": 645911, "epoch": 7782} {"train_loss": -28.03865623474121, "global_step": 645912, "epoch": 7782} {"train_loss": -28.55419921875, "global_step": 645913, "epoch": 7782} {"train_loss": -28.066247940063477, "global_step": 645914, "epoch": 7782} {"train_loss": -27.47517204284668, "global_step": 645915, "epoch": 7782} {"train_loss": -27.93161964416504, "global_step": 645916, "epoch": 7782} {"train_loss": -28.02381706237793, "global_step": 645917, "epoch": 7782} {"train_loss": -28.100812911987305, "global_step": 645918, "epoch": 7782} {"train_loss": -28.455991744995117, "global_step": 645919, "epoch": 7782} {"train_loss": -28.007349014282227, "global_step": 645920, "epoch": 7782} {"train_loss": -28.245718002319336, "global_step": 645921, "epoch": 7782} {"train_loss": -28.21932029724121, "global_step": 645922, "epoch": 7782} {"train_loss": -28.000354766845703, "global_step": 645923, "epoch": 7782} {"train_loss": -28.371389389038086, "global_step": 645924, "epoch": 7782} {"train_loss": -28.254703521728516, "global_step": 645925, "epoch": 7782} {"train_loss": -28.006946563720703, "global_step": 645926, "epoch": 7782} {"train_loss": -27.811681747436523, "global_step": 645927, "epoch": 7782} {"train_loss": -27.98981285095215, "global_step": 645928, "epoch": 7782} {"train_loss": -27.918731689453125, "global_step": 645929, "epoch": 7782} {"train_loss": -28.241018295288086, "global_step": 645930, "epoch": 7782} {"train_loss": -28.036243438720703, "global_step": 645931, "epoch": 7782} {"train_loss": -28.295841217041016, "global_step": 645932, "epoch": 7782} {"train_loss": -28.256244659423828, "global_step": 645933, "epoch": 7782} {"train_loss": -28.43183708190918, "global_step": 645934, "epoch": 7782} {"train_loss": -27.859312057495117, "global_step": 645935, "epoch": 7782} {"train_loss": -28.089752197265625, "global_step": 645936, "epoch": 7782} {"train_loss": -28.1899356842041, "global_step": 645937, "epoch": 7782} {"train_loss": -28.244043350219727, "global_step": 645938, "epoch": 7782} {"train_loss": -28.259183883666992, "global_step": 645939, "epoch": 7782} {"train_loss": -28.222644805908203, "global_step": 645940, "epoch": 7782} {"train_loss": -28.446332931518555, "global_step": 645941, "epoch": 7782} {"train_loss": -28.064722061157227, "global_step": 645942, "epoch": 7782} {"train_loss": -28.2611026763916, "global_step": 645943, "epoch": 7782} {"train_loss": -28.076812744140625, "global_step": 645944, "epoch": 7782} {"train_loss": -28.2971134185791, "global_step": 645945, "epoch": 7782} {"train_loss": -27.930908203125, "global_step": 645946, "epoch": 7782} {"train_loss": -28.097158432006836, "global_step": 645947, "epoch": 7782} {"train_loss": -28.289691925048828, "global_step": 645948, "epoch": 7782} {"train_loss": -28.15839958190918, "global_step": 645949, "epoch": 7782} {"train_loss": -28.315078735351562, "global_step": 645950, "epoch": 7782} {"train_loss": -28.16021156311035, "global_step": 645951, "epoch": 7782} {"train_loss": -28.416675567626953, "global_step": 645952, "epoch": 7782} {"train_loss": -28.201297760009766, "global_step": 645953, "epoch": 7782} {"train_loss": -27.912845611572266, "global_step": 645954, "epoch": 7782} {"train_loss": -28.275609970092773, "global_step": 645955, "epoch": 7782} {"train_loss": -27.887832641601562, "global_step": 645956, "epoch": 7782} {"train_loss": -27.70191764831543, "global_step": 645957, "epoch": 7782} {"train_loss": -27.982379913330078, "global_step": 645958, "epoch": 7782} {"train_loss": -28.47893714904785, "global_step": 645959, "epoch": 7782} {"train_loss": -28.01416015625, "global_step": 645960, "epoch": 7782} {"train_loss": -27.8050594329834, "global_step": 645961, "epoch": 7782} {"train_loss": -27.83631706237793, "global_step": 645962, "epoch": 7782} {"train_loss": -28.052637100219727, "global_step": 645963, "epoch": 7782} {"train_loss": -28.30621910095215, "global_step": 645964, "epoch": 7782} {"train_loss": -28.046844482421875, "global_step": 645965, "epoch": 7782} {"train_loss": -27.877111434936523, "global_step": 645966, "epoch": 7782} {"train_loss": -28.198444366455078, "global_step": 645967, "epoch": 7782} {"train_loss": -28.203725814819336, "global_step": 645968, "epoch": 7782} {"train_loss": -28.319721221923828, "global_step": 645969, "epoch": 7782} {"train_loss": -28.451440811157227, "global_step": 645970, "epoch": 7782} {"train_loss": -28.45099449157715, "global_step": 645971, "epoch": 7782} {"train_loss": -28.390344619750977, "global_step": 645972, "epoch": 7782} {"train_loss": -27.809040069580078, "global_step": 645973, "epoch": 7782} {"train_loss": -28.192716598510742, "global_step": 645974, "epoch": 7782} {"train_loss": -28.42328453063965, "global_step": 645975, "epoch": 7782} {"train_loss": -28.2264404296875, "global_step": 645976, "epoch": 7782} {"train_loss": -28.280841827392578, "global_step": 645977, "epoch": 7782} {"train_loss": -28.359094619750977, "global_step": 645978, "epoch": 7782} {"train_loss": -27.808996200561523, "global_step": 645979, "epoch": 7782} {"train_loss": -28.329137802124023, "global_step": 645980, "epoch": 7782} {"train_loss": -28.388568878173828, "global_step": 645981, "epoch": 7782} {"train_loss": -28.4278507232666, "global_step": 645982, "epoch": 7782} {"train_loss": -28.320602416992188, "global_step": 645983, "epoch": 7782} {"train_loss": -28.09601402282715, "global_step": 645984, "epoch": 7782} {"train_loss": -28.293109893798828, "global_step": 645985, "epoch": 7782} {"train_loss": -28.27570915222168, "global_step": 645986, "epoch": 7782} {"train_loss": -28.599475860595703, "global_step": 645987, "epoch": 7782} {"train_loss": -28.159748927656427, "global_step": 645988, "epoch": 7782, "val_loss": 6698347.0} {"train_loss": -27.192975997924805, "global_step": 645989, "epoch": 7783} {"train_loss": -27.992935180664062, "global_step": 645990, "epoch": 7783} {"train_loss": -27.653722763061523, "global_step": 645991, "epoch": 7783} {"train_loss": -27.48068618774414, "global_step": 645992, "epoch": 7783} {"train_loss": -27.738561630249023, "global_step": 645993, "epoch": 7783} {"train_loss": -27.57244300842285, "global_step": 645994, "epoch": 7783} {"train_loss": -27.879505157470703, "global_step": 645995, "epoch": 7783} {"train_loss": -27.819196701049805, "global_step": 645996, "epoch": 7783} {"train_loss": -27.5181941986084, "global_step": 645997, "epoch": 7783} {"train_loss": -27.6685848236084, "global_step": 645998, "epoch": 7783} {"train_loss": -27.683218002319336, "global_step": 645999, "epoch": 7783} {"train_loss": -27.578201293945312, "global_step": 646000, "epoch": 7783} {"train_loss": -27.899063110351562, "global_step": 646001, "epoch": 7783} {"train_loss": -27.845678329467773, "global_step": 646002, "epoch": 7783} {"train_loss": -27.903772354125977, "global_step": 646003, "epoch": 7783} {"train_loss": -27.80266761779785, "global_step": 646004, "epoch": 7783} {"train_loss": -27.75530433654785, "global_step": 646005, "epoch": 7783} {"train_loss": -28.091028213500977, "global_step": 646006, "epoch": 7783} {"train_loss": -27.889007568359375, "global_step": 646007, "epoch": 7783} {"train_loss": -28.091690063476562, "global_step": 646008, "epoch": 7783} {"train_loss": -28.26617431640625, "global_step": 646009, "epoch": 7783} {"train_loss": -27.563852310180664, "global_step": 646010, "epoch": 7783} {"train_loss": -28.337970733642578, "global_step": 646011, "epoch": 7783} {"train_loss": -27.953771591186523, "global_step": 646012, "epoch": 7783} {"train_loss": -27.905719757080078, "global_step": 646013, "epoch": 7783} {"train_loss": -28.083059310913086, "global_step": 646014, "epoch": 7783} {"train_loss": -28.025548934936523, "global_step": 646015, "epoch": 7783} {"train_loss": -27.903730392456055, "global_step": 646016, "epoch": 7783} {"train_loss": -27.926624298095703, "global_step": 646017, "epoch": 7783} {"train_loss": -28.2481746673584, "global_step": 646018, "epoch": 7783} {"train_loss": -27.849639892578125, "global_step": 646019, "epoch": 7783} {"train_loss": -27.944293975830078, "global_step": 646020, "epoch": 7783} {"train_loss": -28.336095809936523, "global_step": 646021, "epoch": 7783} {"train_loss": -27.73524284362793, "global_step": 646022, "epoch": 7783} {"train_loss": -28.03812599182129, "global_step": 646023, "epoch": 7783} {"train_loss": -28.454303741455078, "global_step": 646024, "epoch": 7783} {"train_loss": -28.150785446166992, "global_step": 646025, "epoch": 7783} {"train_loss": -28.38347816467285, "global_step": 646026, "epoch": 7783} {"train_loss": -27.80215835571289, "global_step": 646027, "epoch": 7783} {"train_loss": -28.54248046875, "global_step": 646028, "epoch": 7783} {"train_loss": -28.25763511657715, "global_step": 646029, "epoch": 7783} {"train_loss": -28.149179458618164, "global_step": 646030, "epoch": 7783} {"train_loss": -28.186553955078125, "global_step": 646031, "epoch": 7783} {"train_loss": -28.3208065032959, "global_step": 646032, "epoch": 7783} {"train_loss": -28.392349243164062, "global_step": 646033, "epoch": 7783} {"train_loss": -28.328887939453125, "global_step": 646034, "epoch": 7783} {"train_loss": -28.3535213470459, "global_step": 646035, "epoch": 7783} {"train_loss": -28.38922119140625, "global_step": 646036, "epoch": 7783} {"train_loss": -28.290380477905273, "global_step": 646037, "epoch": 7783} {"train_loss": -28.6245059967041, "global_step": 646038, "epoch": 7783} {"train_loss": -28.508148193359375, "global_step": 646039, "epoch": 7783} {"train_loss": -28.227041244506836, "global_step": 646040, "epoch": 7783} {"train_loss": -28.30517578125, "global_step": 646041, "epoch": 7783} {"train_loss": -28.786609649658203, "global_step": 646042, "epoch": 7783} {"train_loss": -28.62030029296875, "global_step": 646043, "epoch": 7783} {"train_loss": -28.616119384765625, "global_step": 646044, "epoch": 7783} {"train_loss": -28.125452041625977, "global_step": 646045, "epoch": 7783} {"train_loss": -28.430078506469727, "global_step": 646046, "epoch": 7783} {"train_loss": -28.262531280517578, "global_step": 646047, "epoch": 7783} {"train_loss": -28.382352828979492, "global_step": 646048, "epoch": 7783} {"train_loss": -28.4334716796875, "global_step": 646049, "epoch": 7783} {"train_loss": -28.3493709564209, "global_step": 646050, "epoch": 7783} {"train_loss": -28.45880126953125, "global_step": 646051, "epoch": 7783} {"train_loss": -28.390167236328125, "global_step": 646052, "epoch": 7783} {"train_loss": -28.55878257751465, "global_step": 646053, "epoch": 7783} {"train_loss": -28.815526962280273, "global_step": 646054, "epoch": 7783} {"train_loss": -28.644561767578125, "global_step": 646055, "epoch": 7783} {"train_loss": -28.321752548217773, "global_step": 646056, "epoch": 7783} {"train_loss": -28.3533935546875, "global_step": 646057, "epoch": 7783} {"train_loss": -28.724929809570312, "global_step": 646058, "epoch": 7783} {"train_loss": -28.083877563476562, "global_step": 646059, "epoch": 7783} {"train_loss": -28.088031768798828, "global_step": 646060, "epoch": 7783} {"train_loss": -28.538700103759766, "global_step": 646061, "epoch": 7783} {"train_loss": -28.23041343688965, "global_step": 646062, "epoch": 7783} {"train_loss": -28.65264320373535, "global_step": 646063, "epoch": 7783} {"train_loss": -28.551803588867188, "global_step": 646064, "epoch": 7783} {"train_loss": -28.77594566345215, "global_step": 646065, "epoch": 7783} {"train_loss": -28.499948501586914, "global_step": 646066, "epoch": 7783} {"train_loss": -28.1602840423584, "global_step": 646067, "epoch": 7783} {"train_loss": -28.567197799682617, "global_step": 646068, "epoch": 7783} {"train_loss": -28.38762855529785, "global_step": 646069, "epoch": 7783} {"train_loss": -28.576955795288086, "global_step": 646070, "epoch": 7783} {"train_loss": -28.163863400378858, "global_step": 646071, "epoch": 7783, "val_loss": 6683030.0} {"train_loss": -27.725265502929688, "global_step": 646072, "epoch": 7784} {"train_loss": -26.21771240234375, "global_step": 646073, "epoch": 7784} {"train_loss": -25.208372116088867, "global_step": 646074, "epoch": 7784} {"train_loss": -24.895742416381836, "global_step": 646075, "epoch": 7784} {"train_loss": -27.349496841430664, "global_step": 646076, "epoch": 7784} {"train_loss": -25.639942169189453, "global_step": 646077, "epoch": 7784} {"train_loss": -26.727375030517578, "global_step": 646078, "epoch": 7784} {"train_loss": -26.405622482299805, "global_step": 646079, "epoch": 7784} {"train_loss": -27.39471435546875, "global_step": 646080, "epoch": 7784} {"train_loss": -26.480207443237305, "global_step": 646081, "epoch": 7784} {"train_loss": -27.170440673828125, "global_step": 646082, "epoch": 7784} {"train_loss": -27.387699127197266, "global_step": 646083, "epoch": 7784} {"train_loss": -26.652729034423828, "global_step": 646084, "epoch": 7784} {"train_loss": -27.624563217163086, "global_step": 646085, "epoch": 7784} {"train_loss": -27.385242462158203, "global_step": 646086, "epoch": 7784} {"train_loss": -27.541046142578125, "global_step": 646087, "epoch": 7784} {"train_loss": -27.326658248901367, "global_step": 646088, "epoch": 7784} {"train_loss": -27.15241050720215, "global_step": 646089, "epoch": 7784} {"train_loss": -27.264209747314453, "global_step": 646090, "epoch": 7784} {"train_loss": -27.289321899414062, "global_step": 646091, "epoch": 7784} {"train_loss": -27.358793258666992, "global_step": 646092, "epoch": 7784} {"train_loss": -27.58131217956543, "global_step": 646093, "epoch": 7784} {"train_loss": -27.37395668029785, "global_step": 646094, "epoch": 7784} {"train_loss": -27.584157943725586, "global_step": 646095, "epoch": 7784} {"train_loss": -27.436548233032227, "global_step": 646096, "epoch": 7784} {"train_loss": -27.380300521850586, "global_step": 646097, "epoch": 7784} {"train_loss": -27.766571044921875, "global_step": 646098, "epoch": 7784} {"train_loss": -27.88288688659668, "global_step": 646099, "epoch": 7784} {"train_loss": -27.831653594970703, "global_step": 646100, "epoch": 7784} {"train_loss": -27.407148361206055, "global_step": 646101, "epoch": 7784} {"train_loss": -27.386890411376953, "global_step": 646102, "epoch": 7784} {"train_loss": -27.740375518798828, "global_step": 646103, "epoch": 7784} {"train_loss": -27.599380493164062, "global_step": 646104, "epoch": 7784} {"train_loss": -27.875024795532227, "global_step": 646105, "epoch": 7784} {"train_loss": -27.73133659362793, "global_step": 646106, "epoch": 7784} {"train_loss": -27.752988815307617, "global_step": 646107, "epoch": 7784} {"train_loss": -28.01137351989746, "global_step": 646108, "epoch": 7784} {"train_loss": -27.691373825073242, "global_step": 646109, "epoch": 7784} {"train_loss": -27.320068359375, "global_step": 646110, "epoch": 7784} {"train_loss": -27.689889907836914, "global_step": 646111, "epoch": 7784} {"train_loss": -27.896514892578125, "global_step": 646112, "epoch": 7784} {"train_loss": -28.059839248657227, "global_step": 646113, "epoch": 7784} {"train_loss": -27.840688705444336, "global_step": 646114, "epoch": 7784} {"train_loss": -27.834211349487305, "global_step": 646115, "epoch": 7784} {"train_loss": -27.8912353515625, "global_step": 646116, "epoch": 7784} {"train_loss": -27.82551383972168, "global_step": 646117, "epoch": 7784} {"train_loss": -27.896875381469727, "global_step": 646118, "epoch": 7784} {"train_loss": -27.90302848815918, "global_step": 646119, "epoch": 7784} {"train_loss": -28.297943115234375, "global_step": 646120, "epoch": 7784} {"train_loss": -28.13671875, "global_step": 646121, "epoch": 7784} {"train_loss": -28.36126136779785, "global_step": 646122, "epoch": 7784} {"train_loss": -28.213287353515625, "global_step": 646123, "epoch": 7784} {"train_loss": -27.737335205078125, "global_step": 646124, "epoch": 7784} {"train_loss": -28.355594635009766, "global_step": 646125, "epoch": 7784} {"train_loss": -28.304325103759766, "global_step": 646126, "epoch": 7784} {"train_loss": -28.453521728515625, "global_step": 646127, "epoch": 7784} {"train_loss": -28.2299747467041, "global_step": 646128, "epoch": 7784} {"train_loss": -28.590845108032227, "global_step": 646129, "epoch": 7784} {"train_loss": -28.4256591796875, "global_step": 646130, "epoch": 7784} {"train_loss": -27.977798461914062, "global_step": 646131, "epoch": 7784} {"train_loss": -28.154855728149414, "global_step": 646132, "epoch": 7784} {"train_loss": -28.128131866455078, "global_step": 646133, "epoch": 7784} {"train_loss": -28.65474510192871, "global_step": 646134, "epoch": 7784} {"train_loss": -28.316476821899414, "global_step": 646135, "epoch": 7784} {"train_loss": -28.467086791992188, "global_step": 646136, "epoch": 7784} {"train_loss": -28.158079147338867, "global_step": 646137, "epoch": 7784} {"train_loss": -28.599411010742188, "global_step": 646138, "epoch": 7784} {"train_loss": -28.04298210144043, "global_step": 646139, "epoch": 7784} {"train_loss": -28.539325714111328, "global_step": 646140, "epoch": 7784} {"train_loss": -28.47722816467285, "global_step": 646141, "epoch": 7784} {"train_loss": -28.37005043029785, "global_step": 646142, "epoch": 7784} {"train_loss": -28.29237174987793, "global_step": 646143, "epoch": 7784} {"train_loss": -28.3311824798584, "global_step": 646144, "epoch": 7784} {"train_loss": -28.586353302001953, "global_step": 646145, "epoch": 7784} {"train_loss": -28.59425163269043, "global_step": 646146, "epoch": 7784} {"train_loss": -28.452009201049805, "global_step": 646147, "epoch": 7784} {"train_loss": -28.29326820373535, "global_step": 646148, "epoch": 7784} {"train_loss": -28.24043083190918, "global_step": 646149, "epoch": 7784} {"train_loss": -28.31723976135254, "global_step": 646150, "epoch": 7784} {"train_loss": -28.29839515686035, "global_step": 646151, "epoch": 7784} {"train_loss": -28.72981834411621, "global_step": 646152, "epoch": 7784} {"train_loss": -28.323583602905273, "global_step": 646153, "epoch": 7784} {"train_loss": -27.78016729239958, "global_step": 646154, "epoch": 7784, "val_loss": 6611591.0} {"train_loss": -28.125192642211914, "global_step": 646155, "epoch": 7785} {"train_loss": -28.20779800415039, "global_step": 646156, "epoch": 7785} {"train_loss": -28.458837509155273, "global_step": 646157, "epoch": 7785} {"train_loss": -28.205326080322266, "global_step": 646158, "epoch": 7785} {"train_loss": -27.462759017944336, "global_step": 646159, "epoch": 7785} {"train_loss": -27.991689682006836, "global_step": 646160, "epoch": 7785} {"train_loss": -27.941741943359375, "global_step": 646161, "epoch": 7785} {"train_loss": -27.860498428344727, "global_step": 646162, "epoch": 7785} {"train_loss": -28.04892921447754, "global_step": 646163, "epoch": 7785} {"train_loss": -27.795713424682617, "global_step": 646164, "epoch": 7785} {"train_loss": -28.442834854125977, "global_step": 646165, "epoch": 7785} {"train_loss": -28.2801456451416, "global_step": 646166, "epoch": 7785} {"train_loss": -28.02679443359375, "global_step": 646167, "epoch": 7785} {"train_loss": -28.214014053344727, "global_step": 646168, "epoch": 7785} {"train_loss": -28.2784423828125, "global_step": 646169, "epoch": 7785} {"train_loss": -27.834518432617188, "global_step": 646170, "epoch": 7785} {"train_loss": -27.86848258972168, "global_step": 646171, "epoch": 7785} {"train_loss": -28.2653865814209, "global_step": 646172, "epoch": 7785} {"train_loss": -28.47174644470215, "global_step": 646173, "epoch": 7785} {"train_loss": -27.7166805267334, "global_step": 646174, "epoch": 7785} {"train_loss": -27.717803955078125, "global_step": 646175, "epoch": 7785} {"train_loss": -28.23357582092285, "global_step": 646176, "epoch": 7785} {"train_loss": -27.99323844909668, "global_step": 646177, "epoch": 7785} {"train_loss": -27.98298454284668, "global_step": 646178, "epoch": 7785} {"train_loss": -28.117645263671875, "global_step": 646179, "epoch": 7785} {"train_loss": -28.3569393157959, "global_step": 646180, "epoch": 7785} {"train_loss": -28.16023063659668, "global_step": 646181, "epoch": 7785} {"train_loss": -28.290485382080078, "global_step": 646182, "epoch": 7785} {"train_loss": -28.8155460357666, "global_step": 646183, "epoch": 7785} {"train_loss": -28.40044593811035, "global_step": 646184, "epoch": 7785} {"train_loss": -27.878477096557617, "global_step": 646185, "epoch": 7785} {"train_loss": -28.64644432067871, "global_step": 646186, "epoch": 7785} {"train_loss": -28.412784576416016, "global_step": 646187, "epoch": 7785} {"train_loss": -28.184814453125, "global_step": 646188, "epoch": 7785} {"train_loss": -28.460010528564453, "global_step": 646189, "epoch": 7785} {"train_loss": -28.209089279174805, "global_step": 646190, "epoch": 7785} {"train_loss": -28.432647705078125, "global_step": 646191, "epoch": 7785} {"train_loss": -28.159650802612305, "global_step": 646192, "epoch": 7785} {"train_loss": -28.18130874633789, "global_step": 646193, "epoch": 7785} {"train_loss": -28.433801651000977, "global_step": 646194, "epoch": 7785} {"train_loss": -27.966955184936523, "global_step": 646195, "epoch": 7785} {"train_loss": -28.354475021362305, "global_step": 646196, "epoch": 7785} {"train_loss": -28.36451530456543, "global_step": 646197, "epoch": 7785} {"train_loss": -28.374032974243164, "global_step": 646198, "epoch": 7785} {"train_loss": -28.401498794555664, "global_step": 646199, "epoch": 7785} {"train_loss": -27.6954402923584, "global_step": 646200, "epoch": 7785} {"train_loss": -28.417203903198242, "global_step": 646201, "epoch": 7785} {"train_loss": -28.500934600830078, "global_step": 646202, "epoch": 7785} {"train_loss": -28.238239288330078, "global_step": 646203, "epoch": 7785} {"train_loss": -28.20354652404785, "global_step": 646204, "epoch": 7785} {"train_loss": -28.150983810424805, "global_step": 646205, "epoch": 7785} {"train_loss": -28.645557403564453, "global_step": 646206, "epoch": 7785} {"train_loss": -28.706953048706055, "global_step": 646207, "epoch": 7785} {"train_loss": -28.41956901550293, "global_step": 646208, "epoch": 7785} {"train_loss": -28.716135025024414, "global_step": 646209, "epoch": 7785} {"train_loss": -28.067716598510742, "global_step": 646210, "epoch": 7785} {"train_loss": -28.38467788696289, "global_step": 646211, "epoch": 7785} {"train_loss": -28.207921981811523, "global_step": 646212, "epoch": 7785} {"train_loss": -28.50648307800293, "global_step": 646213, "epoch": 7785} {"train_loss": -28.20920753479004, "global_step": 646214, "epoch": 7785} {"train_loss": -28.223447799682617, "global_step": 646215, "epoch": 7785} {"train_loss": -28.42913246154785, "global_step": 646216, "epoch": 7785} {"train_loss": -28.515600204467773, "global_step": 646217, "epoch": 7785} {"train_loss": -28.510534286499023, "global_step": 646218, "epoch": 7785} {"train_loss": -28.41053581237793, "global_step": 646219, "epoch": 7785} {"train_loss": -28.34589958190918, "global_step": 646220, "epoch": 7785} {"train_loss": -28.2930965423584, "global_step": 646221, "epoch": 7785} {"train_loss": -28.025379180908203, "global_step": 646222, "epoch": 7785} {"train_loss": -28.291580200195312, "global_step": 646223, "epoch": 7785} {"train_loss": -28.316431045532227, "global_step": 646224, "epoch": 7785} {"train_loss": -28.25404930114746, "global_step": 646225, "epoch": 7785} {"train_loss": -28.190351486206055, "global_step": 646226, "epoch": 7785} {"train_loss": -28.016599655151367, "global_step": 646227, "epoch": 7785} {"train_loss": -28.479856491088867, "global_step": 646228, "epoch": 7785} {"train_loss": -28.9311580657959, "global_step": 646229, "epoch": 7785} {"train_loss": -28.50113868713379, "global_step": 646230, "epoch": 7785} {"train_loss": -28.254119873046875, "global_step": 646231, "epoch": 7785} {"train_loss": -28.504337310791016, "global_step": 646232, "epoch": 7785} {"train_loss": -28.450651168823242, "global_step": 646233, "epoch": 7785} {"train_loss": -27.80938720703125, "global_step": 646234, "epoch": 7785} {"train_loss": -28.397003173828125, "global_step": 646235, "epoch": 7785} {"train_loss": -28.524946212768555, "global_step": 646236, "epoch": 7785} {"train_loss": -28.24979736144284, "global_step": 646237, "epoch": 7785, "val_loss": 6651966.5} {"train_loss": -27.979434967041016, "global_step": 646238, "epoch": 7786} {"train_loss": -26.248477935791016, "global_step": 646239, "epoch": 7786} {"train_loss": -27.496932983398438, "global_step": 646240, "epoch": 7786} {"train_loss": -27.665283203125, "global_step": 646241, "epoch": 7786} {"train_loss": -26.885120391845703, "global_step": 646242, "epoch": 7786} {"train_loss": -26.52320671081543, "global_step": 646243, "epoch": 7786} {"train_loss": -26.86854362487793, "global_step": 646244, "epoch": 7786} {"train_loss": -27.668231964111328, "global_step": 646245, "epoch": 7786} {"train_loss": -27.15924072265625, "global_step": 646246, "epoch": 7786} {"train_loss": -27.35466957092285, "global_step": 646247, "epoch": 7786} {"train_loss": -26.907398223876953, "global_step": 646248, "epoch": 7786} {"train_loss": -27.737335205078125, "global_step": 646249, "epoch": 7786} {"train_loss": -27.654193878173828, "global_step": 646250, "epoch": 7786} {"train_loss": -27.69683265686035, "global_step": 646251, "epoch": 7786} {"train_loss": -28.08796501159668, "global_step": 646252, "epoch": 7786} {"train_loss": -27.460351943969727, "global_step": 646253, "epoch": 7786} {"train_loss": -27.848562240600586, "global_step": 646254, "epoch": 7786} {"train_loss": -27.30446434020996, "global_step": 646255, "epoch": 7786} {"train_loss": -28.018075942993164, "global_step": 646256, "epoch": 7786} {"train_loss": -27.678754806518555, "global_step": 646257, "epoch": 7786} {"train_loss": -28.065000534057617, "global_step": 646258, "epoch": 7786} {"train_loss": -27.787261962890625, "global_step": 646259, "epoch": 7786} {"train_loss": -27.892383575439453, "global_step": 646260, "epoch": 7786} {"train_loss": -27.960208892822266, "global_step": 646261, "epoch": 7786} {"train_loss": -27.63962745666504, "global_step": 646262, "epoch": 7786} {"train_loss": -28.160099029541016, "global_step": 646263, "epoch": 7786} {"train_loss": -28.157958984375, "global_step": 646264, "epoch": 7786} {"train_loss": -27.994115829467773, "global_step": 646265, "epoch": 7786} {"train_loss": -27.915624618530273, "global_step": 646266, "epoch": 7786} {"train_loss": -27.737470626831055, "global_step": 646267, "epoch": 7786} {"train_loss": -28.13762855529785, "global_step": 646268, "epoch": 7786} {"train_loss": -27.93729591369629, "global_step": 646269, "epoch": 7786} {"train_loss": -28.093673706054688, "global_step": 646270, "epoch": 7786} {"train_loss": -27.881040573120117, "global_step": 646271, "epoch": 7786} {"train_loss": -27.64165687561035, "global_step": 646272, "epoch": 7786} {"train_loss": -28.236536026000977, "global_step": 646273, "epoch": 7786} {"train_loss": -27.845428466796875, "global_step": 646274, "epoch": 7786} {"train_loss": -27.7600040435791, "global_step": 646275, "epoch": 7786} {"train_loss": -28.33913230895996, "global_step": 646276, "epoch": 7786} {"train_loss": -28.268415451049805, "global_step": 646277, "epoch": 7786} {"train_loss": -28.423105239868164, "global_step": 646278, "epoch": 7786} {"train_loss": -28.179351806640625, "global_step": 646279, "epoch": 7786} {"train_loss": -28.311309814453125, "global_step": 646280, "epoch": 7786} {"train_loss": -28.3896427154541, "global_step": 646281, "epoch": 7786} {"train_loss": -28.02652931213379, "global_step": 646282, "epoch": 7786} {"train_loss": -28.404626846313477, "global_step": 646283, "epoch": 7786} {"train_loss": -28.3941650390625, "global_step": 646284, "epoch": 7786} {"train_loss": -28.147626876831055, "global_step": 646285, "epoch": 7786} {"train_loss": -28.195880889892578, "global_step": 646286, "epoch": 7786} {"train_loss": -28.528427124023438, "global_step": 646287, "epoch": 7786} {"train_loss": -28.565235137939453, "global_step": 646288, "epoch": 7786} {"train_loss": -28.54664421081543, "global_step": 646289, "epoch": 7786} {"train_loss": -28.369714736938477, "global_step": 646290, "epoch": 7786} {"train_loss": -28.57697105407715, "global_step": 646291, "epoch": 7786} {"train_loss": -28.12386131286621, "global_step": 646292, "epoch": 7786} {"train_loss": -28.28571891784668, "global_step": 646293, "epoch": 7786} {"train_loss": -28.230712890625, "global_step": 646294, "epoch": 7786} {"train_loss": -28.831960678100586, "global_step": 646295, "epoch": 7786} {"train_loss": -28.52506446838379, "global_step": 646296, "epoch": 7786} {"train_loss": -28.4842586517334, "global_step": 646297, "epoch": 7786} {"train_loss": -28.567800521850586, "global_step": 646298, "epoch": 7786} {"train_loss": -28.754037857055664, "global_step": 646299, "epoch": 7786} {"train_loss": -28.362836837768555, "global_step": 646300, "epoch": 7786} {"train_loss": -28.510541915893555, "global_step": 646301, "epoch": 7786} {"train_loss": -28.527204513549805, "global_step": 646302, "epoch": 7786} {"train_loss": -28.297119140625, "global_step": 646303, "epoch": 7786} {"train_loss": -28.39080810546875, "global_step": 646304, "epoch": 7786} {"train_loss": -28.747562408447266, "global_step": 646305, "epoch": 7786} {"train_loss": -28.37894630432129, "global_step": 646306, "epoch": 7786} {"train_loss": -28.240407943725586, "global_step": 646307, "epoch": 7786} {"train_loss": -28.1922550201416, "global_step": 646308, "epoch": 7786} {"train_loss": -28.031835556030273, "global_step": 646309, "epoch": 7786} {"train_loss": -28.49934959411621, "global_step": 646310, "epoch": 7786} {"train_loss": -28.457111358642578, "global_step": 646311, "epoch": 7786} {"train_loss": -28.14861488342285, "global_step": 646312, "epoch": 7786} {"train_loss": -28.0970458984375, "global_step": 646313, "epoch": 7786} {"train_loss": -28.131301879882812, "global_step": 646314, "epoch": 7786} {"train_loss": -28.459217071533203, "global_step": 646315, "epoch": 7786} {"train_loss": -28.380661010742188, "global_step": 646316, "epoch": 7786} {"train_loss": -27.906431198120117, "global_step": 646317, "epoch": 7786} {"train_loss": -28.337818145751953, "global_step": 646318, "epoch": 7786} {"train_loss": -28.36884117126465, "global_step": 646319, "epoch": 7786} {"train_loss": -28.036065848476916, "global_step": 646320, "epoch": 7786, "val_loss": 6747946.5} {"train_loss": -27.57489585876465, "global_step": 646321, "epoch": 7787} {"train_loss": -26.19158935546875, "global_step": 646322, "epoch": 7787} {"train_loss": -24.984416961669922, "global_step": 646323, "epoch": 7787} {"train_loss": -24.32233238220215, "global_step": 646324, "epoch": 7787} {"train_loss": -27.06708335876465, "global_step": 646325, "epoch": 7787} {"train_loss": -26.07855224609375, "global_step": 646326, "epoch": 7787} {"train_loss": -25.94892692565918, "global_step": 646327, "epoch": 7787} {"train_loss": -27.411420822143555, "global_step": 646328, "epoch": 7787} {"train_loss": -26.88062858581543, "global_step": 646329, "epoch": 7787} {"train_loss": -27.4801025390625, "global_step": 646330, "epoch": 7787} {"train_loss": -27.20575523376465, "global_step": 646331, "epoch": 7787} {"train_loss": -27.501876831054688, "global_step": 646332, "epoch": 7787} {"train_loss": -27.20888328552246, "global_step": 646333, "epoch": 7787} {"train_loss": -27.325641632080078, "global_step": 646334, "epoch": 7787} {"train_loss": -27.043020248413086, "global_step": 646335, "epoch": 7787} {"train_loss": -27.34552001953125, "global_step": 646336, "epoch": 7787} {"train_loss": -27.855329513549805, "global_step": 646337, "epoch": 7787} {"train_loss": -27.63398551940918, "global_step": 646338, "epoch": 7787} {"train_loss": -27.331928253173828, "global_step": 646339, "epoch": 7787} {"train_loss": -27.986989974975586, "global_step": 646340, "epoch": 7787} {"train_loss": -27.40492820739746, "global_step": 646341, "epoch": 7787} {"train_loss": -27.898794174194336, "global_step": 646342, "epoch": 7787} {"train_loss": -28.06815528869629, "global_step": 646343, "epoch": 7787} {"train_loss": -27.832056045532227, "global_step": 646344, "epoch": 7787} {"train_loss": -27.989805221557617, "global_step": 646345, "epoch": 7787} {"train_loss": -28.104522705078125, "global_step": 646346, "epoch": 7787} {"train_loss": -27.521472930908203, "global_step": 646347, "epoch": 7787} {"train_loss": -27.977558135986328, "global_step": 646348, "epoch": 7787} {"train_loss": -27.837793350219727, "global_step": 646349, "epoch": 7787} {"train_loss": -28.0850887298584, "global_step": 646350, "epoch": 7787} {"train_loss": -27.81568717956543, "global_step": 646351, "epoch": 7787} {"train_loss": -27.90204429626465, "global_step": 646352, "epoch": 7787} {"train_loss": -27.72597312927246, "global_step": 646353, "epoch": 7787} {"train_loss": -28.59232521057129, "global_step": 646354, "epoch": 7787} {"train_loss": -28.277420043945312, "global_step": 646355, "epoch": 7787} {"train_loss": -28.166101455688477, "global_step": 646356, "epoch": 7787} {"train_loss": -28.2689266204834, "global_step": 646357, "epoch": 7787} {"train_loss": -28.13083839416504, "global_step": 646358, "epoch": 7787} {"train_loss": -28.1326904296875, "global_step": 646359, "epoch": 7787} {"train_loss": -27.699426651000977, "global_step": 646360, "epoch": 7787} {"train_loss": -28.423864364624023, "global_step": 646361, "epoch": 7787} {"train_loss": -28.026777267456055, "global_step": 646362, "epoch": 7787} {"train_loss": -28.124069213867188, "global_step": 646363, "epoch": 7787} {"train_loss": -28.298480987548828, "global_step": 646364, "epoch": 7787} {"train_loss": -28.411376953125, "global_step": 646365, "epoch": 7787} {"train_loss": -28.41143798828125, "global_step": 646366, "epoch": 7787} {"train_loss": -28.411848068237305, "global_step": 646367, "epoch": 7787} {"train_loss": -28.08235740661621, "global_step": 646368, "epoch": 7787} {"train_loss": -28.384328842163086, "global_step": 646369, "epoch": 7787} {"train_loss": -28.689620971679688, "global_step": 646370, "epoch": 7787} {"train_loss": -28.415597915649414, "global_step": 646371, "epoch": 7787} {"train_loss": -28.34967041015625, "global_step": 646372, "epoch": 7787} {"train_loss": -28.7724552154541, "global_step": 646373, "epoch": 7787} {"train_loss": -28.402875900268555, "global_step": 646374, "epoch": 7787} {"train_loss": -28.362411499023438, "global_step": 646375, "epoch": 7787} {"train_loss": -28.55580711364746, "global_step": 646376, "epoch": 7787} {"train_loss": -28.119611740112305, "global_step": 646377, "epoch": 7787} {"train_loss": -28.57864761352539, "global_step": 646378, "epoch": 7787} {"train_loss": -28.305273056030273, "global_step": 646379, "epoch": 7787} {"train_loss": -28.783910751342773, "global_step": 646380, "epoch": 7787} {"train_loss": -28.165531158447266, "global_step": 646381, "epoch": 7787} {"train_loss": -28.345121383666992, "global_step": 646382, "epoch": 7787} {"train_loss": -28.23163414001465, "global_step": 646383, "epoch": 7787} {"train_loss": -28.063215255737305, "global_step": 646384, "epoch": 7787} {"train_loss": -28.273761749267578, "global_step": 646385, "epoch": 7787} {"train_loss": -28.1924991607666, "global_step": 646386, "epoch": 7787} {"train_loss": -28.52284812927246, "global_step": 646387, "epoch": 7787} {"train_loss": -28.609272003173828, "global_step": 646388, "epoch": 7787} {"train_loss": -27.502822875976562, "global_step": 646389, "epoch": 7787} {"train_loss": -27.849842071533203, "global_step": 646390, "epoch": 7787} {"train_loss": -28.22607421875, "global_step": 646391, "epoch": 7787} {"train_loss": -28.144865036010742, "global_step": 646392, "epoch": 7787} {"train_loss": -27.62342643737793, "global_step": 646393, "epoch": 7787} {"train_loss": -28.56074333190918, "global_step": 646394, "epoch": 7787} {"train_loss": -28.4152774810791, "global_step": 646395, "epoch": 7787} {"train_loss": -28.30792236328125, "global_step": 646396, "epoch": 7787} {"train_loss": -28.283422470092773, "global_step": 646397, "epoch": 7787} {"train_loss": -28.289051055908203, "global_step": 646398, "epoch": 7787} {"train_loss": -28.569122314453125, "global_step": 646399, "epoch": 7787} {"train_loss": -27.9338436126709, "global_step": 646400, "epoch": 7787} {"train_loss": -28.223499298095703, "global_step": 646401, "epoch": 7787} {"train_loss": -28.116785049438477, "global_step": 646402, "epoch": 7787} {"train_loss": -27.896276129297462, "global_step": 646403, "epoch": 7787, "val_loss": 6699621.5} {"train_loss": -27.702051162719727, "global_step": 646404, "epoch": 7788} {"train_loss": -28.02322769165039, "global_step": 646405, "epoch": 7788} {"train_loss": -28.23359489440918, "global_step": 646406, "epoch": 7788} {"train_loss": -27.776081085205078, "global_step": 646407, "epoch": 7788} {"train_loss": -28.113855361938477, "global_step": 646408, "epoch": 7788} {"train_loss": -27.8601131439209, "global_step": 646409, "epoch": 7788} {"train_loss": -28.102384567260742, "global_step": 646410, "epoch": 7788} {"train_loss": -27.57413673400879, "global_step": 646411, "epoch": 7788} {"train_loss": -27.96636962890625, "global_step": 646412, "epoch": 7788} {"train_loss": -28.2467098236084, "global_step": 646413, "epoch": 7788} {"train_loss": -27.767765045166016, "global_step": 646414, "epoch": 7788} {"train_loss": -28.05768394470215, "global_step": 646415, "epoch": 7788} {"train_loss": -28.1756591796875, "global_step": 646416, "epoch": 7788} {"train_loss": -28.209049224853516, "global_step": 646417, "epoch": 7788} {"train_loss": -28.02850914001465, "global_step": 646418, "epoch": 7788} {"train_loss": -28.31014060974121, "global_step": 646419, "epoch": 7788} {"train_loss": -28.05975914001465, "global_step": 646420, "epoch": 7788} {"train_loss": -28.285749435424805, "global_step": 646421, "epoch": 7788} {"train_loss": -28.35196876525879, "global_step": 646422, "epoch": 7788} {"train_loss": -28.32293701171875, "global_step": 646423, "epoch": 7788} {"train_loss": -28.140655517578125, "global_step": 646424, "epoch": 7788} {"train_loss": -28.162708282470703, "global_step": 646425, "epoch": 7788} {"train_loss": -28.48457908630371, "global_step": 646426, "epoch": 7788} {"train_loss": -28.548364639282227, "global_step": 646427, "epoch": 7788} {"train_loss": -28.20376968383789, "global_step": 646428, "epoch": 7788} {"train_loss": -28.16046142578125, "global_step": 646429, "epoch": 7788} {"train_loss": -28.70090103149414, "global_step": 646430, "epoch": 7788} {"train_loss": -28.053842544555664, "global_step": 646431, "epoch": 7788} {"train_loss": -27.9283390045166, "global_step": 646432, "epoch": 7788} {"train_loss": -28.159423828125, "global_step": 646433, "epoch": 7788} {"train_loss": -27.938220977783203, "global_step": 646434, "epoch": 7788} {"train_loss": -28.420669555664062, "global_step": 646435, "epoch": 7788} {"train_loss": -28.411558151245117, "global_step": 646436, "epoch": 7788} {"train_loss": -28.238025665283203, "global_step": 646437, "epoch": 7788} {"train_loss": -28.519367218017578, "global_step": 646438, "epoch": 7788} {"train_loss": -28.0504150390625, "global_step": 646439, "epoch": 7788} {"train_loss": -28.12811851501465, "global_step": 646440, "epoch": 7788} {"train_loss": -28.127857208251953, "global_step": 646441, "epoch": 7788} {"train_loss": -28.176549911499023, "global_step": 646442, "epoch": 7788} {"train_loss": -28.310199737548828, "global_step": 646443, "epoch": 7788} {"train_loss": -28.092254638671875, "global_step": 646444, "epoch": 7788} {"train_loss": -27.886478424072266, "global_step": 646445, "epoch": 7788} {"train_loss": -28.389453887939453, "global_step": 646446, "epoch": 7788} {"train_loss": -28.538251876831055, "global_step": 646447, "epoch": 7788} {"train_loss": -28.47061538696289, "global_step": 646448, "epoch": 7788} {"train_loss": -28.20228385925293, "global_step": 646449, "epoch": 7788} {"train_loss": -28.541412353515625, "global_step": 646450, "epoch": 7788} {"train_loss": -28.071027755737305, "global_step": 646451, "epoch": 7788} {"train_loss": -28.535022735595703, "global_step": 646452, "epoch": 7788} {"train_loss": -28.04815101623535, "global_step": 646453, "epoch": 7788} {"train_loss": -28.558012008666992, "global_step": 646454, "epoch": 7788} {"train_loss": -28.25010108947754, "global_step": 646455, "epoch": 7788} {"train_loss": -28.014026641845703, "global_step": 646456, "epoch": 7788} {"train_loss": -28.377277374267578, "global_step": 646457, "epoch": 7788} {"train_loss": -28.400634765625, "global_step": 646458, "epoch": 7788} {"train_loss": -28.01679801940918, "global_step": 646459, "epoch": 7788} {"train_loss": -28.48343276977539, "global_step": 646460, "epoch": 7788} {"train_loss": -28.0426025390625, "global_step": 646461, "epoch": 7788} {"train_loss": -28.452733993530273, "global_step": 646462, "epoch": 7788} {"train_loss": -28.029272079467773, "global_step": 646463, "epoch": 7788} {"train_loss": -28.393224716186523, "global_step": 646464, "epoch": 7788} {"train_loss": -28.181964874267578, "global_step": 646465, "epoch": 7788} {"train_loss": -28.41025161743164, "global_step": 646466, "epoch": 7788} {"train_loss": -28.2136287689209, "global_step": 646467, "epoch": 7788} {"train_loss": -28.035287857055664, "global_step": 646468, "epoch": 7788} {"train_loss": -28.032184600830078, "global_step": 646469, "epoch": 7788} {"train_loss": -27.842025756835938, "global_step": 646470, "epoch": 7788} {"train_loss": -28.036245346069336, "global_step": 646471, "epoch": 7788} {"train_loss": -27.588953018188477, "global_step": 646472, "epoch": 7788} {"train_loss": -28.158735275268555, "global_step": 646473, "epoch": 7788} {"train_loss": -28.72772216796875, "global_step": 646474, "epoch": 7788} {"train_loss": -27.77618980407715, "global_step": 646475, "epoch": 7788} {"train_loss": -27.18548583984375, "global_step": 646476, "epoch": 7788} {"train_loss": -27.5552978515625, "global_step": 646477, "epoch": 7788} {"train_loss": -28.188892364501953, "global_step": 646478, "epoch": 7788} {"train_loss": -27.870990753173828, "global_step": 646479, "epoch": 7788} {"train_loss": -27.909162521362305, "global_step": 646480, "epoch": 7788} {"train_loss": -28.176715850830078, "global_step": 646481, "epoch": 7788} {"train_loss": -27.85112953186035, "global_step": 646482, "epoch": 7788} {"train_loss": -28.1812744140625, "global_step": 646483, "epoch": 7788} {"train_loss": -28.125654220581055, "global_step": 646484, "epoch": 7788} {"train_loss": -28.49823570251465, "global_step": 646485, "epoch": 7788} {"train_loss": -28.144170439386944, "global_step": 646486, "epoch": 7788, "val_loss": 6715942.5} {"train_loss": -27.56540870666504, "global_step": 646487, "epoch": 7789} {"train_loss": -26.92886734008789, "global_step": 646488, "epoch": 7789} {"train_loss": -27.2002010345459, "global_step": 646489, "epoch": 7789} {"train_loss": -26.444894790649414, "global_step": 646490, "epoch": 7789} {"train_loss": -27.33957862854004, "global_step": 646491, "epoch": 7789} {"train_loss": -27.074020385742188, "global_step": 646492, "epoch": 7789} {"train_loss": -27.281604766845703, "global_step": 646493, "epoch": 7789} {"train_loss": -27.578811645507812, "global_step": 646494, "epoch": 7789} {"train_loss": -27.350936889648438, "global_step": 646495, "epoch": 7789} {"train_loss": -27.267292022705078, "global_step": 646496, "epoch": 7789} {"train_loss": -27.31818199157715, "global_step": 646497, "epoch": 7789} {"train_loss": -27.581811904907227, "global_step": 646498, "epoch": 7789} {"train_loss": -27.298139572143555, "global_step": 646499, "epoch": 7789} {"train_loss": -27.683862686157227, "global_step": 646500, "epoch": 7789} {"train_loss": -27.999526977539062, "global_step": 646501, "epoch": 7789} {"train_loss": -27.469770431518555, "global_step": 646502, "epoch": 7789} {"train_loss": -27.630102157592773, "global_step": 646503, "epoch": 7789} {"train_loss": -27.934284210205078, "global_step": 646504, "epoch": 7789} {"train_loss": -27.86029624938965, "global_step": 646505, "epoch": 7789} {"train_loss": -27.561145782470703, "global_step": 646506, "epoch": 7789} {"train_loss": -27.7835636138916, "global_step": 646507, "epoch": 7789} {"train_loss": -28.195465087890625, "global_step": 646508, "epoch": 7789} {"train_loss": -27.72089958190918, "global_step": 646509, "epoch": 7789} {"train_loss": -27.760467529296875, "global_step": 646510, "epoch": 7789} {"train_loss": -27.6263427734375, "global_step": 646511, "epoch": 7789} {"train_loss": -27.881561279296875, "global_step": 646512, "epoch": 7789} {"train_loss": -27.91834831237793, "global_step": 646513, "epoch": 7789} {"train_loss": -28.090824127197266, "global_step": 646514, "epoch": 7789} {"train_loss": -27.84332275390625, "global_step": 646515, "epoch": 7789} {"train_loss": -27.520544052124023, "global_step": 646516, "epoch": 7789} {"train_loss": -27.9514102935791, "global_step": 646517, "epoch": 7789} {"train_loss": -28.124998092651367, "global_step": 646518, "epoch": 7789} {"train_loss": -27.732086181640625, "global_step": 646519, "epoch": 7789} {"train_loss": -28.19654655456543, "global_step": 646520, "epoch": 7789} {"train_loss": -27.90374183654785, "global_step": 646521, "epoch": 7789} {"train_loss": -28.25177574157715, "global_step": 646522, "epoch": 7789} {"train_loss": -28.25248146057129, "global_step": 646523, "epoch": 7789} {"train_loss": -28.079792022705078, "global_step": 646524, "epoch": 7789} {"train_loss": -28.389636993408203, "global_step": 646525, "epoch": 7789} {"train_loss": -28.328927993774414, "global_step": 646526, "epoch": 7789} {"train_loss": -28.015775680541992, "global_step": 646527, "epoch": 7789} {"train_loss": -27.98274040222168, "global_step": 646528, "epoch": 7789} {"train_loss": -27.753498077392578, "global_step": 646529, "epoch": 7789} {"train_loss": -28.297216415405273, "global_step": 646530, "epoch": 7789} {"train_loss": -28.64503288269043, "global_step": 646531, "epoch": 7789} {"train_loss": -28.288110733032227, "global_step": 646532, "epoch": 7789} {"train_loss": -28.216495513916016, "global_step": 646533, "epoch": 7789} {"train_loss": -28.465299606323242, "global_step": 646534, "epoch": 7789} {"train_loss": -28.153121948242188, "global_step": 646535, "epoch": 7789} {"train_loss": -28.657062530517578, "global_step": 646536, "epoch": 7789} {"train_loss": -28.541458129882812, "global_step": 646537, "epoch": 7789} {"train_loss": -28.8343505859375, "global_step": 646538, "epoch": 7789} {"train_loss": -28.56178092956543, "global_step": 646539, "epoch": 7789} {"train_loss": -28.18280601501465, "global_step": 646540, "epoch": 7789} {"train_loss": -28.46784782409668, "global_step": 646541, "epoch": 7789} {"train_loss": -27.939916610717773, "global_step": 646542, "epoch": 7789} {"train_loss": -28.193328857421875, "global_step": 646543, "epoch": 7789} {"train_loss": -28.22406005859375, "global_step": 646544, "epoch": 7789} {"train_loss": -28.282190322875977, "global_step": 646545, "epoch": 7789} {"train_loss": -28.348342895507812, "global_step": 646546, "epoch": 7789} {"train_loss": -28.157148361206055, "global_step": 646547, "epoch": 7789} {"train_loss": -28.13557243347168, "global_step": 646548, "epoch": 7789} {"train_loss": -28.213443756103516, "global_step": 646549, "epoch": 7789} {"train_loss": -28.62456703186035, "global_step": 646550, "epoch": 7789} {"train_loss": -28.45770835876465, "global_step": 646551, "epoch": 7789} {"train_loss": -28.455215454101562, "global_step": 646552, "epoch": 7789} {"train_loss": -28.73626708984375, "global_step": 646553, "epoch": 7789} {"train_loss": -28.25864028930664, "global_step": 646554, "epoch": 7789} {"train_loss": -27.995222091674805, "global_step": 646555, "epoch": 7789} {"train_loss": -28.762176513671875, "global_step": 646556, "epoch": 7789} {"train_loss": -28.176084518432617, "global_step": 646557, "epoch": 7789} {"train_loss": -28.207050323486328, "global_step": 646558, "epoch": 7789} {"train_loss": -28.15252113342285, "global_step": 646559, "epoch": 7789} {"train_loss": -28.570234298706055, "global_step": 646560, "epoch": 7789} {"train_loss": -28.19752311706543, "global_step": 646561, "epoch": 7789} {"train_loss": -28.606351852416992, "global_step": 646562, "epoch": 7789} {"train_loss": -28.517139434814453, "global_step": 646563, "epoch": 7789} {"train_loss": -28.5230655670166, "global_step": 646564, "epoch": 7789} {"train_loss": -28.361804962158203, "global_step": 646565, "epoch": 7789} {"train_loss": -28.30299186706543, "global_step": 646566, "epoch": 7789} {"train_loss": -27.564411163330078, "global_step": 646567, "epoch": 7789} {"train_loss": -27.785715103149414, "global_step": 646568, "epoch": 7789} {"train_loss": -28.023870560060065, "global_step": 646569, "epoch": 7789, "val_loss": 6719919.0} {"train_loss": -27.44327735900879, "global_step": 646570, "epoch": 7790} {"train_loss": -27.095083236694336, "global_step": 646571, "epoch": 7790} {"train_loss": -27.5918025970459, "global_step": 646572, "epoch": 7790} {"train_loss": -27.91802406311035, "global_step": 646573, "epoch": 7790} {"train_loss": -27.278839111328125, "global_step": 646574, "epoch": 7790} {"train_loss": -27.5169677734375, "global_step": 646575, "epoch": 7790} {"train_loss": -27.282855987548828, "global_step": 646576, "epoch": 7790} {"train_loss": -27.67049217224121, "global_step": 646577, "epoch": 7790} {"train_loss": -27.27180290222168, "global_step": 646578, "epoch": 7790} {"train_loss": -27.906076431274414, "global_step": 646579, "epoch": 7790} {"train_loss": -27.813079833984375, "global_step": 646580, "epoch": 7790} {"train_loss": -27.837940216064453, "global_step": 646581, "epoch": 7790} {"train_loss": -27.946088790893555, "global_step": 646582, "epoch": 7790} {"train_loss": -28.064252853393555, "global_step": 646583, "epoch": 7790} {"train_loss": -28.012699127197266, "global_step": 646584, "epoch": 7790} {"train_loss": -27.734058380126953, "global_step": 646585, "epoch": 7790} {"train_loss": -28.0727481842041, "global_step": 646586, "epoch": 7790} {"train_loss": -27.706350326538086, "global_step": 646587, "epoch": 7790} {"train_loss": -28.0618839263916, "global_step": 646588, "epoch": 7790} {"train_loss": -28.000045776367188, "global_step": 646589, "epoch": 7790} {"train_loss": -28.07516860961914, "global_step": 646590, "epoch": 7790} {"train_loss": -28.015172958374023, "global_step": 646591, "epoch": 7790} {"train_loss": -28.24886131286621, "global_step": 646592, "epoch": 7790} {"train_loss": -28.0982723236084, "global_step": 646593, "epoch": 7790} {"train_loss": -28.170907974243164, "global_step": 646594, "epoch": 7790} {"train_loss": -28.033065795898438, "global_step": 646595, "epoch": 7790} {"train_loss": -28.612340927124023, "global_step": 646596, "epoch": 7790} {"train_loss": -28.307849884033203, "global_step": 646597, "epoch": 7790} {"train_loss": -28.427005767822266, "global_step": 646598, "epoch": 7790} {"train_loss": -28.07309341430664, "global_step": 646599, "epoch": 7790} {"train_loss": -28.2044734954834, "global_step": 646600, "epoch": 7790} {"train_loss": -28.418914794921875, "global_step": 646601, "epoch": 7790} {"train_loss": -28.313282012939453, "global_step": 646602, "epoch": 7790} {"train_loss": -28.2669620513916, "global_step": 646603, "epoch": 7790} {"train_loss": -28.334674835205078, "global_step": 646604, "epoch": 7790} {"train_loss": -28.401752471923828, "global_step": 646605, "epoch": 7790} {"train_loss": -28.348012924194336, "global_step": 646606, "epoch": 7790} {"train_loss": -28.503650665283203, "global_step": 646607, "epoch": 7790} {"train_loss": -28.435949325561523, "global_step": 646608, "epoch": 7790} {"train_loss": -28.48981285095215, "global_step": 646609, "epoch": 7790} {"train_loss": -28.48164176940918, "global_step": 646610, "epoch": 7790} {"train_loss": -28.441946029663086, "global_step": 646611, "epoch": 7790} {"train_loss": -28.612659454345703, "global_step": 646612, "epoch": 7790} {"train_loss": -28.663742065429688, "global_step": 646613, "epoch": 7790} {"train_loss": -28.23146629333496, "global_step": 646614, "epoch": 7790} {"train_loss": -28.578174591064453, "global_step": 646615, "epoch": 7790} {"train_loss": -28.642364501953125, "global_step": 646616, "epoch": 7790} {"train_loss": -28.209623336791992, "global_step": 646617, "epoch": 7790} {"train_loss": -28.47983741760254, "global_step": 646618, "epoch": 7790} {"train_loss": -28.5948543548584, "global_step": 646619, "epoch": 7790} {"train_loss": -28.360584259033203, "global_step": 646620, "epoch": 7790} {"train_loss": -28.4293212890625, "global_step": 646621, "epoch": 7790} {"train_loss": -28.505212783813477, "global_step": 646622, "epoch": 7790} {"train_loss": -28.156293869018555, "global_step": 646623, "epoch": 7790} {"train_loss": -28.26409912109375, "global_step": 646624, "epoch": 7790} {"train_loss": -28.347814559936523, "global_step": 646625, "epoch": 7790} {"train_loss": -28.390939712524414, "global_step": 646626, "epoch": 7790} {"train_loss": -28.404333114624023, "global_step": 646627, "epoch": 7790} {"train_loss": -28.57282829284668, "global_step": 646628, "epoch": 7790} {"train_loss": -28.334125518798828, "global_step": 646629, "epoch": 7790} {"train_loss": -28.464176177978516, "global_step": 646630, "epoch": 7790} {"train_loss": -28.150251388549805, "global_step": 646631, "epoch": 7790} {"train_loss": -28.61213493347168, "global_step": 646632, "epoch": 7790} {"train_loss": -27.941669464111328, "global_step": 646633, "epoch": 7790} {"train_loss": -28.002790451049805, "global_step": 646634, "epoch": 7790} {"train_loss": -28.412328720092773, "global_step": 646635, "epoch": 7790} {"train_loss": -27.836612701416016, "global_step": 646636, "epoch": 7790} {"train_loss": -28.248199462890625, "global_step": 646637, "epoch": 7790} {"train_loss": -28.493383407592773, "global_step": 646638, "epoch": 7790} {"train_loss": -28.16847038269043, "global_step": 646639, "epoch": 7790} {"train_loss": -28.291275024414062, "global_step": 646640, "epoch": 7790} {"train_loss": -28.309925079345703, "global_step": 646641, "epoch": 7790} {"train_loss": -27.919702529907227, "global_step": 646642, "epoch": 7790} {"train_loss": -28.173917770385742, "global_step": 646643, "epoch": 7790} {"train_loss": -28.4647159576416, "global_step": 646644, "epoch": 7790} {"train_loss": -28.408920288085938, "global_step": 646645, "epoch": 7790} {"train_loss": -28.044164657592773, "global_step": 646646, "epoch": 7790} {"train_loss": -28.189294815063477, "global_step": 646647, "epoch": 7790} {"train_loss": -28.4609317779541, "global_step": 646648, "epoch": 7790} {"train_loss": -28.057693481445312, "global_step": 646649, "epoch": 7790} {"train_loss": -28.523700714111328, "global_step": 646650, "epoch": 7790} {"train_loss": -27.821247100830078, "global_step": 646651, "epoch": 7790} {"train_loss": -28.147792885102422, "global_step": 646652, "epoch": 7790, "val_loss": 6721742.0} {"train_loss": -27.671308517456055, "global_step": 646653, "epoch": 7791} {"train_loss": -27.204553604125977, "global_step": 646654, "epoch": 7791} {"train_loss": -26.890127182006836, "global_step": 646655, "epoch": 7791} {"train_loss": -25.757192611694336, "global_step": 646656, "epoch": 7791} {"train_loss": -25.891620635986328, "global_step": 646657, "epoch": 7791} {"train_loss": -27.346847534179688, "global_step": 646658, "epoch": 7791} {"train_loss": -27.0445613861084, "global_step": 646659, "epoch": 7791} {"train_loss": -26.842199325561523, "global_step": 646660, "epoch": 7791} {"train_loss": -27.757360458374023, "global_step": 646661, "epoch": 7791} {"train_loss": -26.758655548095703, "global_step": 646662, "epoch": 7791} {"train_loss": -27.516742706298828, "global_step": 646663, "epoch": 7791} {"train_loss": -27.457782745361328, "global_step": 646664, "epoch": 7791} {"train_loss": -27.789945602416992, "global_step": 646665, "epoch": 7791} {"train_loss": -27.481185913085938, "global_step": 646666, "epoch": 7791} {"train_loss": -27.456409454345703, "global_step": 646667, "epoch": 7791} {"train_loss": -26.532373428344727, "global_step": 646668, "epoch": 7791} {"train_loss": -27.46619987487793, "global_step": 646669, "epoch": 7791} {"train_loss": -27.38860511779785, "global_step": 646670, "epoch": 7791} {"train_loss": -27.59809684753418, "global_step": 646671, "epoch": 7791} {"train_loss": -27.833799362182617, "global_step": 646672, "epoch": 7791} {"train_loss": -28.107746124267578, "global_step": 646673, "epoch": 7791} {"train_loss": -27.2342472076416, "global_step": 646674, "epoch": 7791} {"train_loss": -27.827680587768555, "global_step": 646675, "epoch": 7791} {"train_loss": -28.16400718688965, "global_step": 646676, "epoch": 7791} {"train_loss": -27.79142189025879, "global_step": 646677, "epoch": 7791} {"train_loss": -27.750507354736328, "global_step": 646678, "epoch": 7791} {"train_loss": -28.056049346923828, "global_step": 646679, "epoch": 7791} {"train_loss": -27.866613388061523, "global_step": 646680, "epoch": 7791} {"train_loss": -28.349090576171875, "global_step": 646681, "epoch": 7791} {"train_loss": -27.914682388305664, "global_step": 646682, "epoch": 7791} {"train_loss": -28.013137817382812, "global_step": 646683, "epoch": 7791} {"train_loss": -27.889877319335938, "global_step": 646684, "epoch": 7791} {"train_loss": -28.18963050842285, "global_step": 646685, "epoch": 7791} {"train_loss": -27.864084243774414, "global_step": 646686, "epoch": 7791} {"train_loss": -28.24713706970215, "global_step": 646687, "epoch": 7791} {"train_loss": -27.981809616088867, "global_step": 646688, "epoch": 7791} {"train_loss": -28.616376876831055, "global_step": 646689, "epoch": 7791} {"train_loss": -28.06781578063965, "global_step": 646690, "epoch": 7791} {"train_loss": -27.866308212280273, "global_step": 646691, "epoch": 7791} {"train_loss": -28.248920440673828, "global_step": 646692, "epoch": 7791} {"train_loss": -28.285024642944336, "global_step": 646693, "epoch": 7791} {"train_loss": -28.196521759033203, "global_step": 646694, "epoch": 7791} {"train_loss": -28.5272159576416, "global_step": 646695, "epoch": 7791} {"train_loss": -28.3363037109375, "global_step": 646696, "epoch": 7791} {"train_loss": -27.9931697845459, "global_step": 646697, "epoch": 7791} {"train_loss": -28.430845260620117, "global_step": 646698, "epoch": 7791} {"train_loss": -28.349470138549805, "global_step": 646699, "epoch": 7791} {"train_loss": -28.215993881225586, "global_step": 646700, "epoch": 7791} {"train_loss": -28.208038330078125, "global_step": 646701, "epoch": 7791} {"train_loss": -28.250263214111328, "global_step": 646702, "epoch": 7791} {"train_loss": -28.248458862304688, "global_step": 646703, "epoch": 7791} {"train_loss": -28.501495361328125, "global_step": 646704, "epoch": 7791} {"train_loss": -28.741912841796875, "global_step": 646705, "epoch": 7791} {"train_loss": -28.09255027770996, "global_step": 646706, "epoch": 7791} {"train_loss": -28.3696231842041, "global_step": 646707, "epoch": 7791} {"train_loss": -28.318784713745117, "global_step": 646708, "epoch": 7791} {"train_loss": -28.13276481628418, "global_step": 646709, "epoch": 7791} {"train_loss": -28.094308853149414, "global_step": 646710, "epoch": 7791} {"train_loss": -28.3975830078125, "global_step": 646711, "epoch": 7791} {"train_loss": -28.778106689453125, "global_step": 646712, "epoch": 7791} {"train_loss": -28.50323486328125, "global_step": 646713, "epoch": 7791} {"train_loss": -28.72088623046875, "global_step": 646714, "epoch": 7791} {"train_loss": -28.395862579345703, "global_step": 646715, "epoch": 7791} {"train_loss": -28.412145614624023, "global_step": 646716, "epoch": 7791} {"train_loss": -28.43479347229004, "global_step": 646717, "epoch": 7791} {"train_loss": -28.2747745513916, "global_step": 646718, "epoch": 7791} {"train_loss": -28.412281036376953, "global_step": 646719, "epoch": 7791} {"train_loss": -28.243932723999023, "global_step": 646720, "epoch": 7791} {"train_loss": -28.170568466186523, "global_step": 646721, "epoch": 7791} {"train_loss": -28.27985954284668, "global_step": 646722, "epoch": 7791} {"train_loss": -27.972043991088867, "global_step": 646723, "epoch": 7791} {"train_loss": -28.290836334228516, "global_step": 646724, "epoch": 7791} {"train_loss": -28.39472770690918, "global_step": 646725, "epoch": 7791} {"train_loss": -28.262914657592773, "global_step": 646726, "epoch": 7791} {"train_loss": -28.55670738220215, "global_step": 646727, "epoch": 7791} {"train_loss": -28.517047882080078, "global_step": 646728, "epoch": 7791} {"train_loss": -28.44708251953125, "global_step": 646729, "epoch": 7791} {"train_loss": -28.227392196655273, "global_step": 646730, "epoch": 7791} {"train_loss": -27.95941162109375, "global_step": 646731, "epoch": 7791} {"train_loss": -28.01825523376465, "global_step": 646732, "epoch": 7791} {"train_loss": -28.396305084228516, "global_step": 646733, "epoch": 7791} {"train_loss": -28.377309799194336, "global_step": 646734, "epoch": 7791} {"train_loss": -27.96115893628224, "global_step": 646735, "epoch": 7791, "val_loss": 6681659.5} {"train_loss": -28.149341583251953, "global_step": 646736, "epoch": 7792} {"train_loss": -28.12558364868164, "global_step": 646737, "epoch": 7792} {"train_loss": -28.17571449279785, "global_step": 646738, "epoch": 7792} {"train_loss": -27.750547409057617, "global_step": 646739, "epoch": 7792} {"train_loss": -27.956806182861328, "global_step": 646740, "epoch": 7792} {"train_loss": -28.255741119384766, "global_step": 646741, "epoch": 7792} {"train_loss": -28.140024185180664, "global_step": 646742, "epoch": 7792} {"train_loss": -27.90862464904785, "global_step": 646743, "epoch": 7792} {"train_loss": -28.612592697143555, "global_step": 646744, "epoch": 7792} {"train_loss": -28.501026153564453, "global_step": 646745, "epoch": 7792} {"train_loss": -28.240554809570312, "global_step": 646746, "epoch": 7792} {"train_loss": -28.26150894165039, "global_step": 646747, "epoch": 7792} {"train_loss": -28.507349014282227, "global_step": 646748, "epoch": 7792} {"train_loss": -28.117725372314453, "global_step": 646749, "epoch": 7792} {"train_loss": -27.801794052124023, "global_step": 646750, "epoch": 7792} {"train_loss": -28.1678409576416, "global_step": 646751, "epoch": 7792} {"train_loss": -28.445571899414062, "global_step": 646752, "epoch": 7792} {"train_loss": -28.217700958251953, "global_step": 646753, "epoch": 7792} {"train_loss": -28.0968017578125, "global_step": 646754, "epoch": 7792} {"train_loss": -28.42275047302246, "global_step": 646755, "epoch": 7792} {"train_loss": -27.95477294921875, "global_step": 646756, "epoch": 7792} {"train_loss": -28.078693389892578, "global_step": 646757, "epoch": 7792} {"train_loss": -28.46466636657715, "global_step": 646758, "epoch": 7792} {"train_loss": -28.31705665588379, "global_step": 646759, "epoch": 7792} {"train_loss": -28.34406089782715, "global_step": 646760, "epoch": 7792} {"train_loss": -28.134496688842773, "global_step": 646761, "epoch": 7792} {"train_loss": -28.105276107788086, "global_step": 646762, "epoch": 7792} {"train_loss": -28.622156143188477, "global_step": 646763, "epoch": 7792} {"train_loss": -28.227262496948242, "global_step": 646764, "epoch": 7792} {"train_loss": -28.311399459838867, "global_step": 646765, "epoch": 7792} {"train_loss": -28.431415557861328, "global_step": 646766, "epoch": 7792} {"train_loss": -28.179706573486328, "global_step": 646767, "epoch": 7792} {"train_loss": -28.442005157470703, "global_step": 646768, "epoch": 7792} {"train_loss": -28.395185470581055, "global_step": 646769, "epoch": 7792} {"train_loss": -28.329023361206055, "global_step": 646770, "epoch": 7792} {"train_loss": -28.108295440673828, "global_step": 646771, "epoch": 7792} {"train_loss": -28.23388671875, "global_step": 646772, "epoch": 7792} {"train_loss": -28.18230628967285, "global_step": 646773, "epoch": 7792} {"train_loss": -27.780004501342773, "global_step": 646774, "epoch": 7792} {"train_loss": -28.330961227416992, "global_step": 646775, "epoch": 7792} {"train_loss": -28.235401153564453, "global_step": 646776, "epoch": 7792} {"train_loss": -28.0941104888916, "global_step": 646777, "epoch": 7792} {"train_loss": -28.835607528686523, "global_step": 646778, "epoch": 7792} {"train_loss": -28.735944747924805, "global_step": 646779, "epoch": 7792} {"train_loss": -28.394927978515625, "global_step": 646780, "epoch": 7792} {"train_loss": -28.246490478515625, "global_step": 646781, "epoch": 7792} {"train_loss": -28.1495304107666, "global_step": 646782, "epoch": 7792} {"train_loss": -28.22382164001465, "global_step": 646783, "epoch": 7792} {"train_loss": -28.38575553894043, "global_step": 646784, "epoch": 7792} {"train_loss": -28.538745880126953, "global_step": 646785, "epoch": 7792} {"train_loss": -28.283788681030273, "global_step": 646786, "epoch": 7792} {"train_loss": -28.00074577331543, "global_step": 646787, "epoch": 7792} {"train_loss": -27.195398330688477, "global_step": 646788, "epoch": 7792} {"train_loss": -25.99822425842285, "global_step": 646789, "epoch": 7792} {"train_loss": -27.296247482299805, "global_step": 646790, "epoch": 7792} {"train_loss": -28.007307052612305, "global_step": 646791, "epoch": 7792} {"train_loss": -27.83475685119629, "global_step": 646792, "epoch": 7792} {"train_loss": -28.243284225463867, "global_step": 646793, "epoch": 7792} {"train_loss": -28.03386878967285, "global_step": 646794, "epoch": 7792} {"train_loss": -27.61370277404785, "global_step": 646795, "epoch": 7792} {"train_loss": -27.966053009033203, "global_step": 646796, "epoch": 7792} {"train_loss": -28.146371841430664, "global_step": 646797, "epoch": 7792} {"train_loss": -28.080060958862305, "global_step": 646798, "epoch": 7792} {"train_loss": -28.313562393188477, "global_step": 646799, "epoch": 7792} {"train_loss": -28.036535263061523, "global_step": 646800, "epoch": 7792} {"train_loss": -27.935443878173828, "global_step": 646801, "epoch": 7792} {"train_loss": -28.2037353515625, "global_step": 646802, "epoch": 7792} {"train_loss": -27.999601364135742, "global_step": 646803, "epoch": 7792} {"train_loss": -28.121936798095703, "global_step": 646804, "epoch": 7792} {"train_loss": -28.156232833862305, "global_step": 646805, "epoch": 7792} {"train_loss": -27.834095001220703, "global_step": 646806, "epoch": 7792} {"train_loss": -28.12116813659668, "global_step": 646807, "epoch": 7792} {"train_loss": -28.053319931030273, "global_step": 646808, "epoch": 7792} {"train_loss": -28.246490478515625, "global_step": 646809, "epoch": 7792} {"train_loss": -27.866117477416992, "global_step": 646810, "epoch": 7792} {"train_loss": -28.440826416015625, "global_step": 646811, "epoch": 7792} {"train_loss": -28.03742790222168, "global_step": 646812, "epoch": 7792} {"train_loss": -28.025339126586914, "global_step": 646813, "epoch": 7792} {"train_loss": -28.28131675720215, "global_step": 646814, "epoch": 7792} {"train_loss": -28.789386749267578, "global_step": 646815, "epoch": 7792} {"train_loss": -28.930118560791016, "global_step": 646816, "epoch": 7792} {"train_loss": -27.863483428955078, "global_step": 646817, "epoch": 7792} {"train_loss": -28.15293323562806, "global_step": 646818, "epoch": 7792, "val_loss": 6722584.0} {"train_loss": -27.36444664001465, "global_step": 646819, "epoch": 7793} {"train_loss": -26.833276748657227, "global_step": 646820, "epoch": 7793} {"train_loss": -27.015161514282227, "global_step": 646821, "epoch": 7793} {"train_loss": -27.432958602905273, "global_step": 646822, "epoch": 7793} {"train_loss": -27.4572696685791, "global_step": 646823, "epoch": 7793} {"train_loss": -27.775846481323242, "global_step": 646824, "epoch": 7793} {"train_loss": -27.449186325073242, "global_step": 646825, "epoch": 7793} {"train_loss": -27.43251609802246, "global_step": 646826, "epoch": 7793} {"train_loss": -28.21394157409668, "global_step": 646827, "epoch": 7793} {"train_loss": -27.339889526367188, "global_step": 646828, "epoch": 7793} {"train_loss": -27.68092918395996, "global_step": 646829, "epoch": 7793} {"train_loss": -28.51393699645996, "global_step": 646830, "epoch": 7793} {"train_loss": -27.9293155670166, "global_step": 646831, "epoch": 7793} {"train_loss": -27.458234786987305, "global_step": 646832, "epoch": 7793} {"train_loss": -27.570209503173828, "global_step": 646833, "epoch": 7793} {"train_loss": -28.16933250427246, "global_step": 646834, "epoch": 7793} {"train_loss": -28.18668556213379, "global_step": 646835, "epoch": 7793} {"train_loss": -26.944416046142578, "global_step": 646836, "epoch": 7793} {"train_loss": -27.710651397705078, "global_step": 646837, "epoch": 7793} {"train_loss": -27.919891357421875, "global_step": 646838, "epoch": 7793} {"train_loss": -27.82777976989746, "global_step": 646839, "epoch": 7793} {"train_loss": -28.17805290222168, "global_step": 646840, "epoch": 7793} {"train_loss": -28.205137252807617, "global_step": 646841, "epoch": 7793} {"train_loss": -28.040771484375, "global_step": 646842, "epoch": 7793} {"train_loss": -28.108566284179688, "global_step": 646843, "epoch": 7793} {"train_loss": -28.0502986907959, "global_step": 646844, "epoch": 7793} {"train_loss": -27.787799835205078, "global_step": 646845, "epoch": 7793} {"train_loss": -27.882001876831055, "global_step": 646846, "epoch": 7793} {"train_loss": -28.06062126159668, "global_step": 646847, "epoch": 7793} {"train_loss": -28.5278377532959, "global_step": 646848, "epoch": 7793} {"train_loss": -27.849164962768555, "global_step": 646849, "epoch": 7793} {"train_loss": -28.448755264282227, "global_step": 646850, "epoch": 7793} {"train_loss": -28.332563400268555, "global_step": 646851, "epoch": 7793} {"train_loss": -27.946786880493164, "global_step": 646852, "epoch": 7793} {"train_loss": -28.26258659362793, "global_step": 646853, "epoch": 7793} {"train_loss": -28.339996337890625, "global_step": 646854, "epoch": 7793} {"train_loss": -28.084943771362305, "global_step": 646855, "epoch": 7793} {"train_loss": -28.49287986755371, "global_step": 646856, "epoch": 7793} {"train_loss": -28.374439239501953, "global_step": 646857, "epoch": 7793} {"train_loss": -28.18585205078125, "global_step": 646858, "epoch": 7793} {"train_loss": -28.175878524780273, "global_step": 646859, "epoch": 7793} {"train_loss": -28.72580337524414, "global_step": 646860, "epoch": 7793} {"train_loss": -28.255258560180664, "global_step": 646861, "epoch": 7793} {"train_loss": -28.34413719177246, "global_step": 646862, "epoch": 7793} {"train_loss": -28.390689849853516, "global_step": 646863, "epoch": 7793} {"train_loss": -28.489282608032227, "global_step": 646864, "epoch": 7793} {"train_loss": -27.964139938354492, "global_step": 646865, "epoch": 7793} {"train_loss": -28.618732452392578, "global_step": 646866, "epoch": 7793} {"train_loss": -28.167633056640625, "global_step": 646867, "epoch": 7793} {"train_loss": -28.581836700439453, "global_step": 646868, "epoch": 7793} {"train_loss": -28.4461612701416, "global_step": 646869, "epoch": 7793} {"train_loss": -28.94280433654785, "global_step": 646870, "epoch": 7793} {"train_loss": -28.637731552124023, "global_step": 646871, "epoch": 7793} {"train_loss": -28.222620010375977, "global_step": 646872, "epoch": 7793} {"train_loss": -28.109045028686523, "global_step": 646873, "epoch": 7793} {"train_loss": -27.9299373626709, "global_step": 646874, "epoch": 7793} {"train_loss": -27.55680274963379, "global_step": 646875, "epoch": 7793} {"train_loss": -28.524051666259766, "global_step": 646876, "epoch": 7793} {"train_loss": -28.844013214111328, "global_step": 646877, "epoch": 7793} {"train_loss": -27.788938522338867, "global_step": 646878, "epoch": 7793} {"train_loss": -27.69608497619629, "global_step": 646879, "epoch": 7793} {"train_loss": -28.160032272338867, "global_step": 646880, "epoch": 7793} {"train_loss": -28.35382080078125, "global_step": 646881, "epoch": 7793} {"train_loss": -28.101348876953125, "global_step": 646882, "epoch": 7793} {"train_loss": -28.41792869567871, "global_step": 646883, "epoch": 7793} {"train_loss": -28.1223201751709, "global_step": 646884, "epoch": 7793} {"train_loss": -28.179203033447266, "global_step": 646885, "epoch": 7793} {"train_loss": -28.30612564086914, "global_step": 646886, "epoch": 7793} {"train_loss": -28.28101921081543, "global_step": 646887, "epoch": 7793} {"train_loss": -28.601926803588867, "global_step": 646888, "epoch": 7793} {"train_loss": -28.5665225982666, "global_step": 646889, "epoch": 7793} {"train_loss": -28.307788848876953, "global_step": 646890, "epoch": 7793} {"train_loss": -28.458581924438477, "global_step": 646891, "epoch": 7793} {"train_loss": -27.93999671936035, "global_step": 646892, "epoch": 7793} {"train_loss": -28.149890899658203, "global_step": 646893, "epoch": 7793} {"train_loss": -28.643051147460938, "global_step": 646894, "epoch": 7793} {"train_loss": -28.194034576416016, "global_step": 646895, "epoch": 7793} {"train_loss": -28.115558624267578, "global_step": 646896, "epoch": 7793} {"train_loss": -28.331323623657227, "global_step": 646897, "epoch": 7793} {"train_loss": -28.09150505065918, "global_step": 646898, "epoch": 7793} {"train_loss": -28.28095817565918, "global_step": 646899, "epoch": 7793} {"train_loss": -28.195514678955078, "global_step": 646900, "epoch": 7793} {"train_loss": -28.090082375400037, "global_step": 646901, "epoch": 7793, "val_loss": 6711870.5} {"train_loss": -25.806543350219727, "global_step": 646902, "epoch": 7794} {"train_loss": -23.482770919799805, "global_step": 646903, "epoch": 7794} {"train_loss": -28.00836753845215, "global_step": 646904, "epoch": 7794} {"train_loss": -25.956647872924805, "global_step": 646905, "epoch": 7794} {"train_loss": -26.679182052612305, "global_step": 646906, "epoch": 7794} {"train_loss": -26.697912216186523, "global_step": 646907, "epoch": 7794} {"train_loss": -26.805402755737305, "global_step": 646908, "epoch": 7794} {"train_loss": -26.462507247924805, "global_step": 646909, "epoch": 7794} {"train_loss": -27.366622924804688, "global_step": 646910, "epoch": 7794} {"train_loss": -26.409154891967773, "global_step": 646911, "epoch": 7794} {"train_loss": -27.751453399658203, "global_step": 646912, "epoch": 7794} {"train_loss": -27.219593048095703, "global_step": 646913, "epoch": 7794} {"train_loss": -27.039413452148438, "global_step": 646914, "epoch": 7794} {"train_loss": -27.309146881103516, "global_step": 646915, "epoch": 7794} {"train_loss": -28.066558837890625, "global_step": 646916, "epoch": 7794} {"train_loss": -27.4995059967041, "global_step": 646917, "epoch": 7794} {"train_loss": -27.269460678100586, "global_step": 646918, "epoch": 7794} {"train_loss": -27.675825119018555, "global_step": 646919, "epoch": 7794} {"train_loss": -27.849689483642578, "global_step": 646920, "epoch": 7794} {"train_loss": -27.431543350219727, "global_step": 646921, "epoch": 7794} {"train_loss": -27.57442283630371, "global_step": 646922, "epoch": 7794} {"train_loss": -27.44803810119629, "global_step": 646923, "epoch": 7794} {"train_loss": -27.685171127319336, "global_step": 646924, "epoch": 7794} {"train_loss": -27.470794677734375, "global_step": 646925, "epoch": 7794} {"train_loss": -27.902997970581055, "global_step": 646926, "epoch": 7794} {"train_loss": -27.605941772460938, "global_step": 646927, "epoch": 7794} {"train_loss": -27.627716064453125, "global_step": 646928, "epoch": 7794} {"train_loss": -27.984546661376953, "global_step": 646929, "epoch": 7794} {"train_loss": -27.810949325561523, "global_step": 646930, "epoch": 7794} {"train_loss": -27.668655395507812, "global_step": 646931, "epoch": 7794} {"train_loss": -27.6268367767334, "global_step": 646932, "epoch": 7794} {"train_loss": -28.083271026611328, "global_step": 646933, "epoch": 7794} {"train_loss": -28.003271102905273, "global_step": 646934, "epoch": 7794} {"train_loss": -28.01502799987793, "global_step": 646935, "epoch": 7794} {"train_loss": -28.089126586914062, "global_step": 646936, "epoch": 7794} {"train_loss": -28.490049362182617, "global_step": 646937, "epoch": 7794} {"train_loss": -27.731321334838867, "global_step": 646938, "epoch": 7794} {"train_loss": -28.5234317779541, "global_step": 646939, "epoch": 7794} {"train_loss": -28.149404525756836, "global_step": 646940, "epoch": 7794} {"train_loss": -28.18926429748535, "global_step": 646941, "epoch": 7794} {"train_loss": -27.766462326049805, "global_step": 646942, "epoch": 7794} {"train_loss": -28.571887969970703, "global_step": 646943, "epoch": 7794} {"train_loss": -28.413105010986328, "global_step": 646944, "epoch": 7794} {"train_loss": -28.1479549407959, "global_step": 646945, "epoch": 7794} {"train_loss": -28.422870635986328, "global_step": 646946, "epoch": 7794} {"train_loss": -28.08538818359375, "global_step": 646947, "epoch": 7794} {"train_loss": -28.314239501953125, "global_step": 646948, "epoch": 7794} {"train_loss": -28.29578971862793, "global_step": 646949, "epoch": 7794} {"train_loss": -28.046253204345703, "global_step": 646950, "epoch": 7794} {"train_loss": -28.399808883666992, "global_step": 646951, "epoch": 7794} {"train_loss": -27.80973243713379, "global_step": 646952, "epoch": 7794} {"train_loss": -28.597131729125977, "global_step": 646953, "epoch": 7794} {"train_loss": -28.413318634033203, "global_step": 646954, "epoch": 7794} {"train_loss": -28.257497787475586, "global_step": 646955, "epoch": 7794} {"train_loss": -28.574207305908203, "global_step": 646956, "epoch": 7794} {"train_loss": -28.129541397094727, "global_step": 646957, "epoch": 7794} {"train_loss": -28.345111846923828, "global_step": 646958, "epoch": 7794} {"train_loss": -28.36322593688965, "global_step": 646959, "epoch": 7794} {"train_loss": -28.237329483032227, "global_step": 646960, "epoch": 7794} {"train_loss": -28.2984619140625, "global_step": 646961, "epoch": 7794} {"train_loss": -27.912952423095703, "global_step": 646962, "epoch": 7794} {"train_loss": -28.201690673828125, "global_step": 646963, "epoch": 7794} {"train_loss": -27.974227905273438, "global_step": 646964, "epoch": 7794} {"train_loss": -28.028717041015625, "global_step": 646965, "epoch": 7794} {"train_loss": -28.0338134765625, "global_step": 646966, "epoch": 7794} {"train_loss": -28.111352920532227, "global_step": 646967, "epoch": 7794} {"train_loss": -28.1055965423584, "global_step": 646968, "epoch": 7794} {"train_loss": -28.04546546936035, "global_step": 646969, "epoch": 7794} {"train_loss": -27.32428550720215, "global_step": 646970, "epoch": 7794} {"train_loss": -27.967626571655273, "global_step": 646971, "epoch": 7794} {"train_loss": -27.797122955322266, "global_step": 646972, "epoch": 7794} {"train_loss": -27.593338012695312, "global_step": 646973, "epoch": 7794} {"train_loss": -27.492603302001953, "global_step": 646974, "epoch": 7794} {"train_loss": -27.13751792907715, "global_step": 646975, "epoch": 7794} {"train_loss": -27.524616241455078, "global_step": 646976, "epoch": 7794} {"train_loss": -27.733701705932617, "global_step": 646977, "epoch": 7794} {"train_loss": -28.07856559753418, "global_step": 646978, "epoch": 7794} {"train_loss": -27.877655029296875, "global_step": 646979, "epoch": 7794} {"train_loss": -28.0805606842041, "global_step": 646980, "epoch": 7794} {"train_loss": -28.000980377197266, "global_step": 646981, "epoch": 7794} {"train_loss": -28.2441349029541, "global_step": 646982, "epoch": 7794} {"train_loss": -28.267959594726562, "global_step": 646983, "epoch": 7794} {"train_loss": -27.752556168889424, "global_step": 646984, "epoch": 7794, "val_loss": 6620936.0} {"train_loss": -27.22468376159668, "global_step": 646985, "epoch": 7795} {"train_loss": -27.528547286987305, "global_step": 646986, "epoch": 7795} {"train_loss": -27.395465850830078, "global_step": 646987, "epoch": 7795} {"train_loss": -27.3984317779541, "global_step": 646988, "epoch": 7795} {"train_loss": -27.165918350219727, "global_step": 646989, "epoch": 7795} {"train_loss": -27.377546310424805, "global_step": 646990, "epoch": 7795} {"train_loss": -26.8247013092041, "global_step": 646991, "epoch": 7795} {"train_loss": -27.713932037353516, "global_step": 646992, "epoch": 7795} {"train_loss": -27.461109161376953, "global_step": 646993, "epoch": 7795} {"train_loss": -27.144311904907227, "global_step": 646994, "epoch": 7795} {"train_loss": -27.940977096557617, "global_step": 646995, "epoch": 7795} {"train_loss": -27.656641006469727, "global_step": 646996, "epoch": 7795} {"train_loss": -27.392423629760742, "global_step": 646997, "epoch": 7795} {"train_loss": -27.828001022338867, "global_step": 646998, "epoch": 7795} {"train_loss": -27.282602310180664, "global_step": 646999, "epoch": 7795} {"train_loss": -27.541156768798828, "global_step": 647000, "epoch": 7795} {"train_loss": -27.680517196655273, "global_step": 647001, "epoch": 7795} {"train_loss": -27.751083374023438, "global_step": 647002, "epoch": 7795} {"train_loss": -27.941328048706055, "global_step": 647003, "epoch": 7795} {"train_loss": -28.023193359375, "global_step": 647004, "epoch": 7795} {"train_loss": -27.949298858642578, "global_step": 647005, "epoch": 7795} {"train_loss": -28.2517147064209, "global_step": 647006, "epoch": 7795} {"train_loss": -28.299352645874023, "global_step": 647007, "epoch": 7795} {"train_loss": -27.8328857421875, "global_step": 647008, "epoch": 7795} {"train_loss": -27.835041046142578, "global_step": 647009, "epoch": 7795} {"train_loss": -27.83440589904785, "global_step": 647010, "epoch": 7795} {"train_loss": -27.924707412719727, "global_step": 647011, "epoch": 7795} {"train_loss": -27.664661407470703, "global_step": 647012, "epoch": 7795} {"train_loss": -28.00788688659668, "global_step": 647013, "epoch": 7795} {"train_loss": -28.114194869995117, "global_step": 647014, "epoch": 7795} {"train_loss": -27.79840660095215, "global_step": 647015, "epoch": 7795} {"train_loss": -27.82588005065918, "global_step": 647016, "epoch": 7795} {"train_loss": -28.1650447845459, "global_step": 647017, "epoch": 7795} {"train_loss": -28.4854793548584, "global_step": 647018, "epoch": 7795} {"train_loss": -28.578153610229492, "global_step": 647019, "epoch": 7795} {"train_loss": -28.434539794921875, "global_step": 647020, "epoch": 7795} {"train_loss": -28.152997970581055, "global_step": 647021, "epoch": 7795} {"train_loss": -28.4195613861084, "global_step": 647022, "epoch": 7795} {"train_loss": -28.257308959960938, "global_step": 647023, "epoch": 7795} {"train_loss": -28.44318199157715, "global_step": 647024, "epoch": 7795} {"train_loss": -28.4503173828125, "global_step": 647025, "epoch": 7795} {"train_loss": -28.570331573486328, "global_step": 647026, "epoch": 7795} {"train_loss": -28.07693862915039, "global_step": 647027, "epoch": 7795} {"train_loss": -28.07069206237793, "global_step": 647028, "epoch": 7795} {"train_loss": -28.538654327392578, "global_step": 647029, "epoch": 7795} {"train_loss": -28.65860366821289, "global_step": 647030, "epoch": 7795} {"train_loss": -28.513036727905273, "global_step": 647031, "epoch": 7795} {"train_loss": -28.5711612701416, "global_step": 647032, "epoch": 7795} {"train_loss": -28.385242462158203, "global_step": 647033, "epoch": 7795} {"train_loss": -28.297672271728516, "global_step": 647034, "epoch": 7795} {"train_loss": -28.503225326538086, "global_step": 647035, "epoch": 7795} {"train_loss": -28.292749404907227, "global_step": 647036, "epoch": 7795} {"train_loss": -28.604528427124023, "global_step": 647037, "epoch": 7795} {"train_loss": -28.537160873413086, "global_step": 647038, "epoch": 7795} {"train_loss": -28.367597579956055, "global_step": 647039, "epoch": 7795} {"train_loss": -28.36720085144043, "global_step": 647040, "epoch": 7795} {"train_loss": -28.4183349609375, "global_step": 647041, "epoch": 7795} {"train_loss": -28.561384201049805, "global_step": 647042, "epoch": 7795} {"train_loss": -28.321216583251953, "global_step": 647043, "epoch": 7795} {"train_loss": -28.77186393737793, "global_step": 647044, "epoch": 7795} {"train_loss": -28.66493797302246, "global_step": 647045, "epoch": 7795} {"train_loss": -28.346906661987305, "global_step": 647046, "epoch": 7795} {"train_loss": -28.890195846557617, "global_step": 647047, "epoch": 7795} {"train_loss": -28.51137351989746, "global_step": 647048, "epoch": 7795} {"train_loss": -28.679676055908203, "global_step": 647049, "epoch": 7795} {"train_loss": -28.55559730529785, "global_step": 647050, "epoch": 7795} {"train_loss": -28.64092445373535, "global_step": 647051, "epoch": 7795} {"train_loss": -28.614307403564453, "global_step": 647052, "epoch": 7795} {"train_loss": -28.09682273864746, "global_step": 647053, "epoch": 7795} {"train_loss": -28.516977310180664, "global_step": 647054, "epoch": 7795} {"train_loss": -28.682941436767578, "global_step": 647055, "epoch": 7795} {"train_loss": -28.676584243774414, "global_step": 647056, "epoch": 7795} {"train_loss": -28.42702293395996, "global_step": 647057, "epoch": 7795} {"train_loss": -28.343687057495117, "global_step": 647058, "epoch": 7795} {"train_loss": -28.36669921875, "global_step": 647059, "epoch": 7795} {"train_loss": -28.453821182250977, "global_step": 647060, "epoch": 7795} {"train_loss": -27.799732208251953, "global_step": 647061, "epoch": 7795} {"train_loss": -27.656293869018555, "global_step": 647062, "epoch": 7795} {"train_loss": -26.62135887145996, "global_step": 647063, "epoch": 7795} {"train_loss": -26.04364013671875, "global_step": 647064, "epoch": 7795} {"train_loss": -27.0277156829834, "global_step": 647065, "epoch": 7795} {"train_loss": -27.15108299255371, "global_step": 647066, "epoch": 7795} {"train_loss": -28.060726050870965, "global_step": 647067, "epoch": 7795, "val_loss": 6773553.5} {"train_loss": -27.164443969726562, "global_step": 647068, "epoch": 7796} {"train_loss": -26.866992950439453, "global_step": 647069, "epoch": 7796} {"train_loss": -26.648401260375977, "global_step": 647070, "epoch": 7796} {"train_loss": -26.9953556060791, "global_step": 647071, "epoch": 7796} {"train_loss": -26.856983184814453, "global_step": 647072, "epoch": 7796} {"train_loss": -26.6955509185791, "global_step": 647073, "epoch": 7796} {"train_loss": -27.21368408203125, "global_step": 647074, "epoch": 7796} {"train_loss": -27.537229537963867, "global_step": 647075, "epoch": 7796} {"train_loss": -27.42937660217285, "global_step": 647076, "epoch": 7796} {"train_loss": -27.268186569213867, "global_step": 647077, "epoch": 7796} {"train_loss": -27.228408813476562, "global_step": 647078, "epoch": 7796} {"train_loss": -27.58204460144043, "global_step": 647079, "epoch": 7796} {"train_loss": -27.418798446655273, "global_step": 647080, "epoch": 7796} {"train_loss": -27.552350997924805, "global_step": 647081, "epoch": 7796} {"train_loss": -27.74872398376465, "global_step": 647082, "epoch": 7796} {"train_loss": -27.237518310546875, "global_step": 647083, "epoch": 7796} {"train_loss": -27.918258666992188, "global_step": 647084, "epoch": 7796} {"train_loss": -27.6267147064209, "global_step": 647085, "epoch": 7796} {"train_loss": -27.947265625, "global_step": 647086, "epoch": 7796} {"train_loss": -27.126169204711914, "global_step": 647087, "epoch": 7796} {"train_loss": -27.939294815063477, "global_step": 647088, "epoch": 7796} {"train_loss": -27.526586532592773, "global_step": 647089, "epoch": 7796} {"train_loss": -27.89887809753418, "global_step": 647090, "epoch": 7796} {"train_loss": -27.911298751831055, "global_step": 647091, "epoch": 7796} {"train_loss": -28.004810333251953, "global_step": 647092, "epoch": 7796} {"train_loss": -27.89149284362793, "global_step": 647093, "epoch": 7796} {"train_loss": -27.959766387939453, "global_step": 647094, "epoch": 7796} {"train_loss": -28.04505729675293, "global_step": 647095, "epoch": 7796} {"train_loss": -28.215961456298828, "global_step": 647096, "epoch": 7796} {"train_loss": -28.2398681640625, "global_step": 647097, "epoch": 7796} {"train_loss": -28.271621704101562, "global_step": 647098, "epoch": 7796} {"train_loss": -28.13286781311035, "global_step": 647099, "epoch": 7796} {"train_loss": -28.318952560424805, "global_step": 647100, "epoch": 7796} {"train_loss": -28.24786376953125, "global_step": 647101, "epoch": 7796} {"train_loss": -27.91096305847168, "global_step": 647102, "epoch": 7796} {"train_loss": -28.455541610717773, "global_step": 647103, "epoch": 7796} {"train_loss": -28.146276473999023, "global_step": 647104, "epoch": 7796} {"train_loss": -28.527536392211914, "global_step": 647105, "epoch": 7796} {"train_loss": -28.3642635345459, "global_step": 647106, "epoch": 7796} {"train_loss": -28.36328125, "global_step": 647107, "epoch": 7796} {"train_loss": -28.712125778198242, "global_step": 647108, "epoch": 7796} {"train_loss": -28.37415885925293, "global_step": 647109, "epoch": 7796} {"train_loss": -28.4173641204834, "global_step": 647110, "epoch": 7796} {"train_loss": -28.436038970947266, "global_step": 647111, "epoch": 7796} {"train_loss": -28.19178581237793, "global_step": 647112, "epoch": 7796} {"train_loss": -28.68279457092285, "global_step": 647113, "epoch": 7796} {"train_loss": -28.525577545166016, "global_step": 647114, "epoch": 7796} {"train_loss": -28.578968048095703, "global_step": 647115, "epoch": 7796} {"train_loss": -28.482114791870117, "global_step": 647116, "epoch": 7796} {"train_loss": -28.588947296142578, "global_step": 647117, "epoch": 7796} {"train_loss": -28.411584854125977, "global_step": 647118, "epoch": 7796} {"train_loss": -28.465085983276367, "global_step": 647119, "epoch": 7796} {"train_loss": -28.552154541015625, "global_step": 647120, "epoch": 7796} {"train_loss": -28.541717529296875, "global_step": 647121, "epoch": 7796} {"train_loss": -28.35575294494629, "global_step": 647122, "epoch": 7796} {"train_loss": -28.083234786987305, "global_step": 647123, "epoch": 7796} {"train_loss": -27.91226577758789, "global_step": 647124, "epoch": 7796} {"train_loss": -27.912214279174805, "global_step": 647125, "epoch": 7796} {"train_loss": -28.133899688720703, "global_step": 647126, "epoch": 7796} {"train_loss": -28.47162437438965, "global_step": 647127, "epoch": 7796} {"train_loss": -28.04290771484375, "global_step": 647128, "epoch": 7796} {"train_loss": -27.899906158447266, "global_step": 647129, "epoch": 7796} {"train_loss": -28.297367095947266, "global_step": 647130, "epoch": 7796} {"train_loss": -28.573047637939453, "global_step": 647131, "epoch": 7796} {"train_loss": -28.416385650634766, "global_step": 647132, "epoch": 7796} {"train_loss": -28.23687171936035, "global_step": 647133, "epoch": 7796} {"train_loss": -28.18147850036621, "global_step": 647134, "epoch": 7796} {"train_loss": -28.161884307861328, "global_step": 647135, "epoch": 7796} {"train_loss": -28.579517364501953, "global_step": 647136, "epoch": 7796} {"train_loss": -27.880483627319336, "global_step": 647137, "epoch": 7796} {"train_loss": -28.550867080688477, "global_step": 647138, "epoch": 7796} {"train_loss": -27.90909767150879, "global_step": 647139, "epoch": 7796} {"train_loss": -28.32893943786621, "global_step": 647140, "epoch": 7796} {"train_loss": -28.26051902770996, "global_step": 647141, "epoch": 7796} {"train_loss": -28.672103881835938, "global_step": 647142, "epoch": 7796} {"train_loss": -28.125375747680664, "global_step": 647143, "epoch": 7796} {"train_loss": -28.550573348999023, "global_step": 647144, "epoch": 7796} {"train_loss": -28.229990005493164, "global_step": 647145, "epoch": 7796} {"train_loss": -28.474435806274414, "global_step": 647146, "epoch": 7796} {"train_loss": -27.835926055908203, "global_step": 647147, "epoch": 7796} {"train_loss": -28.54066276550293, "global_step": 647148, "epoch": 7796} {"train_loss": -28.622053146362305, "global_step": 647149, "epoch": 7796} {"train_loss": -28.050401825502693, "global_step": 647150, "epoch": 7796, "val_loss": 6672797.0} {"train_loss": -26.505945205688477, "global_step": 647151, "epoch": 7797} {"train_loss": -27.217941284179688, "global_step": 647152, "epoch": 7797} {"train_loss": -26.867151260375977, "global_step": 647153, "epoch": 7797} {"train_loss": -27.30257225036621, "global_step": 647154, "epoch": 7797} {"train_loss": -26.943098068237305, "global_step": 647155, "epoch": 7797} {"train_loss": -26.661334991455078, "global_step": 647156, "epoch": 7797} {"train_loss": -27.50531005859375, "global_step": 647157, "epoch": 7797} {"train_loss": -27.292821884155273, "global_step": 647158, "epoch": 7797} {"train_loss": -27.389450073242188, "global_step": 647159, "epoch": 7797} {"train_loss": -27.780542373657227, "global_step": 647160, "epoch": 7797} {"train_loss": -27.497663497924805, "global_step": 647161, "epoch": 7797} {"train_loss": -27.777875900268555, "global_step": 647162, "epoch": 7797} {"train_loss": -27.323551177978516, "global_step": 647163, "epoch": 7797} {"train_loss": -27.824888229370117, "global_step": 647164, "epoch": 7797} {"train_loss": -27.7191162109375, "global_step": 647165, "epoch": 7797} {"train_loss": -27.812183380126953, "global_step": 647166, "epoch": 7797} {"train_loss": -28.066701889038086, "global_step": 647167, "epoch": 7797} {"train_loss": -27.940576553344727, "global_step": 647168, "epoch": 7797} {"train_loss": -27.835391998291016, "global_step": 647169, "epoch": 7797} {"train_loss": -27.955434799194336, "global_step": 647170, "epoch": 7797} {"train_loss": -28.073734283447266, "global_step": 647171, "epoch": 7797} {"train_loss": -27.79176139831543, "global_step": 647172, "epoch": 7797} {"train_loss": -28.0598087310791, "global_step": 647173, "epoch": 7797} {"train_loss": -28.329496383666992, "global_step": 647174, "epoch": 7797} {"train_loss": -28.122446060180664, "global_step": 647175, "epoch": 7797} {"train_loss": -27.844884872436523, "global_step": 647176, "epoch": 7797} {"train_loss": -28.19520378112793, "global_step": 647177, "epoch": 7797} {"train_loss": -27.910669326782227, "global_step": 647178, "epoch": 7797} {"train_loss": -27.872364044189453, "global_step": 647179, "epoch": 7797} {"train_loss": -28.258453369140625, "global_step": 647180, "epoch": 7797} {"train_loss": -28.279218673706055, "global_step": 647181, "epoch": 7797} {"train_loss": -28.629627227783203, "global_step": 647182, "epoch": 7797} {"train_loss": -28.375402450561523, "global_step": 647183, "epoch": 7797} {"train_loss": -28.466156005859375, "global_step": 647184, "epoch": 7797} {"train_loss": -27.87220573425293, "global_step": 647185, "epoch": 7797} {"train_loss": -28.42597007751465, "global_step": 647186, "epoch": 7797} {"train_loss": -28.345483779907227, "global_step": 647187, "epoch": 7797} {"train_loss": -28.16681480407715, "global_step": 647188, "epoch": 7797} {"train_loss": -28.2215576171875, "global_step": 647189, "epoch": 7797} {"train_loss": -28.250125885009766, "global_step": 647190, "epoch": 7797} {"train_loss": -28.236499786376953, "global_step": 647191, "epoch": 7797} {"train_loss": -28.246326446533203, "global_step": 647192, "epoch": 7797} {"train_loss": -28.135589599609375, "global_step": 647193, "epoch": 7797} {"train_loss": -27.983539581298828, "global_step": 647194, "epoch": 7797} {"train_loss": -28.35944938659668, "global_step": 647195, "epoch": 7797} {"train_loss": -28.2810115814209, "global_step": 647196, "epoch": 7797} {"train_loss": -28.34632682800293, "global_step": 647197, "epoch": 7797} {"train_loss": -28.35745620727539, "global_step": 647198, "epoch": 7797} {"train_loss": -28.68964958190918, "global_step": 647199, "epoch": 7797} {"train_loss": -28.500036239624023, "global_step": 647200, "epoch": 7797} {"train_loss": -28.351348876953125, "global_step": 647201, "epoch": 7797} {"train_loss": -28.2370548248291, "global_step": 647202, "epoch": 7797} {"train_loss": -28.393598556518555, "global_step": 647203, "epoch": 7797} {"train_loss": -28.36557960510254, "global_step": 647204, "epoch": 7797} {"train_loss": -28.008691787719727, "global_step": 647205, "epoch": 7797} {"train_loss": -27.98685646057129, "global_step": 647206, "epoch": 7797} {"train_loss": -28.299665451049805, "global_step": 647207, "epoch": 7797} {"train_loss": -28.327672958374023, "global_step": 647208, "epoch": 7797} {"train_loss": -28.26063346862793, "global_step": 647209, "epoch": 7797} {"train_loss": -28.226598739624023, "global_step": 647210, "epoch": 7797} {"train_loss": -28.558319091796875, "global_step": 647211, "epoch": 7797} {"train_loss": -28.236835479736328, "global_step": 647212, "epoch": 7797} {"train_loss": -28.534894943237305, "global_step": 647213, "epoch": 7797} {"train_loss": -27.90561866760254, "global_step": 647214, "epoch": 7797} {"train_loss": -28.154998779296875, "global_step": 647215, "epoch": 7797} {"train_loss": -28.1091365814209, "global_step": 647216, "epoch": 7797} {"train_loss": -28.376758575439453, "global_step": 647217, "epoch": 7797} {"train_loss": -28.2691650390625, "global_step": 647218, "epoch": 7797} {"train_loss": -28.40191650390625, "global_step": 647219, "epoch": 7797} {"train_loss": -28.229644775390625, "global_step": 647220, "epoch": 7797} {"train_loss": -28.400537490844727, "global_step": 647221, "epoch": 7797} {"train_loss": -28.45277214050293, "global_step": 647222, "epoch": 7797} {"train_loss": -28.335657119750977, "global_step": 647223, "epoch": 7797} {"train_loss": -28.557722091674805, "global_step": 647224, "epoch": 7797} {"train_loss": -28.42047691345215, "global_step": 647225, "epoch": 7797} {"train_loss": -28.489410400390625, "global_step": 647226, "epoch": 7797} {"train_loss": -28.51211929321289, "global_step": 647227, "epoch": 7797} {"train_loss": -29.014577865600586, "global_step": 647228, "epoch": 7797} {"train_loss": -28.321252822875977, "global_step": 647229, "epoch": 7797} {"train_loss": -28.530675888061523, "global_step": 647230, "epoch": 7797} {"train_loss": -28.363622665405273, "global_step": 647231, "epoch": 7797} {"train_loss": -28.011444091796875, "global_step": 647232, "epoch": 7797} {"train_loss": -28.080277592302807, "global_step": 647233, "epoch": 7797, "val_loss": 6743091.0} {"train_loss": -28.27846336364746, "global_step": 647234, "epoch": 7798} {"train_loss": -27.87506675720215, "global_step": 647235, "epoch": 7798} {"train_loss": -28.18052101135254, "global_step": 647236, "epoch": 7798} {"train_loss": -27.9300594329834, "global_step": 647237, "epoch": 7798} {"train_loss": -28.02377700805664, "global_step": 647238, "epoch": 7798} {"train_loss": -27.870529174804688, "global_step": 647239, "epoch": 7798} {"train_loss": -27.862552642822266, "global_step": 647240, "epoch": 7798} {"train_loss": -27.704715728759766, "global_step": 647241, "epoch": 7798} {"train_loss": -27.596759796142578, "global_step": 647242, "epoch": 7798} {"train_loss": -27.99213218688965, "global_step": 647243, "epoch": 7798} {"train_loss": -28.04408073425293, "global_step": 647244, "epoch": 7798} {"train_loss": -27.756505966186523, "global_step": 647245, "epoch": 7798} {"train_loss": -27.982969284057617, "global_step": 647246, "epoch": 7798} {"train_loss": -27.991168975830078, "global_step": 647247, "epoch": 7798} {"train_loss": -28.038583755493164, "global_step": 647248, "epoch": 7798} {"train_loss": -27.713775634765625, "global_step": 647249, "epoch": 7798} {"train_loss": -28.077259063720703, "global_step": 647250, "epoch": 7798} {"train_loss": -28.234289169311523, "global_step": 647251, "epoch": 7798} {"train_loss": -28.062381744384766, "global_step": 647252, "epoch": 7798} {"train_loss": -28.622299194335938, "global_step": 647253, "epoch": 7798} {"train_loss": -28.352582931518555, "global_step": 647254, "epoch": 7798} {"train_loss": -27.960224151611328, "global_step": 647255, "epoch": 7798} {"train_loss": -28.400060653686523, "global_step": 647256, "epoch": 7798} {"train_loss": -27.97503089904785, "global_step": 647257, "epoch": 7798} {"train_loss": -28.12082862854004, "global_step": 647258, "epoch": 7798} {"train_loss": -28.36191177368164, "global_step": 647259, "epoch": 7798} {"train_loss": -28.54499626159668, "global_step": 647260, "epoch": 7798} {"train_loss": -28.18354606628418, "global_step": 647261, "epoch": 7798} {"train_loss": -28.104278564453125, "global_step": 647262, "epoch": 7798} {"train_loss": -28.1453800201416, "global_step": 647263, "epoch": 7798} {"train_loss": -28.326446533203125, "global_step": 647264, "epoch": 7798} {"train_loss": -28.2961483001709, "global_step": 647265, "epoch": 7798} {"train_loss": -28.483945846557617, "global_step": 647266, "epoch": 7798} {"train_loss": -28.273008346557617, "global_step": 647267, "epoch": 7798} {"train_loss": -28.513233184814453, "global_step": 647268, "epoch": 7798} {"train_loss": -28.68928337097168, "global_step": 647269, "epoch": 7798} {"train_loss": -28.330488204956055, "global_step": 647270, "epoch": 7798} {"train_loss": -28.743459701538086, "global_step": 647271, "epoch": 7798} {"train_loss": -28.557188034057617, "global_step": 647272, "epoch": 7798} {"train_loss": -28.487157821655273, "global_step": 647273, "epoch": 7798} {"train_loss": -28.279193878173828, "global_step": 647274, "epoch": 7798} {"train_loss": -28.050281524658203, "global_step": 647275, "epoch": 7798} {"train_loss": -28.619033813476562, "global_step": 647276, "epoch": 7798} {"train_loss": -28.385282516479492, "global_step": 647277, "epoch": 7798} {"train_loss": -28.290451049804688, "global_step": 647278, "epoch": 7798} {"train_loss": -28.194814682006836, "global_step": 647279, "epoch": 7798} {"train_loss": -28.314725875854492, "global_step": 647280, "epoch": 7798} {"train_loss": -28.022796630859375, "global_step": 647281, "epoch": 7798} {"train_loss": -28.44524574279785, "global_step": 647282, "epoch": 7798} {"train_loss": -28.466989517211914, "global_step": 647283, "epoch": 7798} {"train_loss": -28.239362716674805, "global_step": 647284, "epoch": 7798} {"train_loss": -28.50983238220215, "global_step": 647285, "epoch": 7798} {"train_loss": -28.246845245361328, "global_step": 647286, "epoch": 7798} {"train_loss": -28.621023178100586, "global_step": 647287, "epoch": 7798} {"train_loss": -28.418439865112305, "global_step": 647288, "epoch": 7798} {"train_loss": -28.674833297729492, "global_step": 647289, "epoch": 7798} {"train_loss": -28.430072784423828, "global_step": 647290, "epoch": 7798} {"train_loss": -28.19951820373535, "global_step": 647291, "epoch": 7798} {"train_loss": -28.848546981811523, "global_step": 647292, "epoch": 7798} {"train_loss": -28.224334716796875, "global_step": 647293, "epoch": 7798} {"train_loss": -28.074533462524414, "global_step": 647294, "epoch": 7798} {"train_loss": -28.000158309936523, "global_step": 647295, "epoch": 7798} {"train_loss": -28.25254249572754, "global_step": 647296, "epoch": 7798} {"train_loss": -27.91522789001465, "global_step": 647297, "epoch": 7798} {"train_loss": -28.683385848999023, "global_step": 647298, "epoch": 7798} {"train_loss": -28.575653076171875, "global_step": 647299, "epoch": 7798} {"train_loss": -28.5233211517334, "global_step": 647300, "epoch": 7798} {"train_loss": -28.09051513671875, "global_step": 647301, "epoch": 7798} {"train_loss": -28.652729034423828, "global_step": 647302, "epoch": 7798} {"train_loss": -28.72627067565918, "global_step": 647303, "epoch": 7798} {"train_loss": -28.684167861938477, "global_step": 647304, "epoch": 7798} {"train_loss": -28.277484893798828, "global_step": 647305, "epoch": 7798} {"train_loss": -28.306243896484375, "global_step": 647306, "epoch": 7798} {"train_loss": -28.364843368530273, "global_step": 647307, "epoch": 7798} {"train_loss": -28.50628089904785, "global_step": 647308, "epoch": 7798} {"train_loss": -28.363698959350586, "global_step": 647309, "epoch": 7798} {"train_loss": -28.354541778564453, "global_step": 647310, "epoch": 7798} {"train_loss": -28.464879989624023, "global_step": 647311, "epoch": 7798} {"train_loss": -28.27225112915039, "global_step": 647312, "epoch": 7798} {"train_loss": -28.300739288330078, "global_step": 647313, "epoch": 7798} {"train_loss": -28.465957641601562, "global_step": 647314, "epoch": 7798} {"train_loss": -28.641407012939453, "global_step": 647315, "epoch": 7798} {"train_loss": -28.294397469026496, "global_step": 647316, "epoch": 7798, "val_loss": 6729516.0} {"train_loss": -27.895170211791992, "global_step": 647317, "epoch": 7799} {"train_loss": -27.608402252197266, "global_step": 647318, "epoch": 7799} {"train_loss": -28.11321449279785, "global_step": 647319, "epoch": 7799} {"train_loss": -28.183195114135742, "global_step": 647320, "epoch": 7799} {"train_loss": -27.93584632873535, "global_step": 647321, "epoch": 7799} {"train_loss": -27.88850212097168, "global_step": 647322, "epoch": 7799} {"train_loss": -28.079593658447266, "global_step": 647323, "epoch": 7799} {"train_loss": -28.59759521484375, "global_step": 647324, "epoch": 7799} {"train_loss": -27.778278350830078, "global_step": 647325, "epoch": 7799} {"train_loss": -27.36134147644043, "global_step": 647326, "epoch": 7799} {"train_loss": -28.071094512939453, "global_step": 647327, "epoch": 7799} {"train_loss": -27.93390464782715, "global_step": 647328, "epoch": 7799} {"train_loss": -28.022546768188477, "global_step": 647329, "epoch": 7799} {"train_loss": -28.407611846923828, "global_step": 647330, "epoch": 7799} {"train_loss": -27.770959854125977, "global_step": 647331, "epoch": 7799} {"train_loss": -27.9910945892334, "global_step": 647332, "epoch": 7799} {"train_loss": -28.048383712768555, "global_step": 647333, "epoch": 7799} {"train_loss": -27.791736602783203, "global_step": 647334, "epoch": 7799} {"train_loss": -27.942829132080078, "global_step": 647335, "epoch": 7799} {"train_loss": -28.13258171081543, "global_step": 647336, "epoch": 7799} {"train_loss": -28.116857528686523, "global_step": 647337, "epoch": 7799} {"train_loss": -28.19233512878418, "global_step": 647338, "epoch": 7799} {"train_loss": -27.991378784179688, "global_step": 647339, "epoch": 7799} {"train_loss": -28.41069984436035, "global_step": 647340, "epoch": 7799} {"train_loss": -27.858367919921875, "global_step": 647341, "epoch": 7799} {"train_loss": -28.446619033813477, "global_step": 647342, "epoch": 7799} {"train_loss": -27.90199851989746, "global_step": 647343, "epoch": 7799} {"train_loss": -28.4077091217041, "global_step": 647344, "epoch": 7799} {"train_loss": -28.138446807861328, "global_step": 647345, "epoch": 7799} {"train_loss": -28.236114501953125, "global_step": 647346, "epoch": 7799} {"train_loss": -28.06633949279785, "global_step": 647347, "epoch": 7799} {"train_loss": -28.1798152923584, "global_step": 647348, "epoch": 7799} {"train_loss": -28.04665184020996, "global_step": 647349, "epoch": 7799} {"train_loss": -28.334259033203125, "global_step": 647350, "epoch": 7799} {"train_loss": -28.513883590698242, "global_step": 647351, "epoch": 7799} {"train_loss": -28.6140079498291, "global_step": 647352, "epoch": 7799} {"train_loss": -28.22283363342285, "global_step": 647353, "epoch": 7799} {"train_loss": -28.2727108001709, "global_step": 647354, "epoch": 7799} {"train_loss": -28.370466232299805, "global_step": 647355, "epoch": 7799} {"train_loss": -28.466175079345703, "global_step": 647356, "epoch": 7799} {"train_loss": -28.554304122924805, "global_step": 647357, "epoch": 7799} {"train_loss": -28.13570213317871, "global_step": 647358, "epoch": 7799} {"train_loss": -28.77430534362793, "global_step": 647359, "epoch": 7799} {"train_loss": -28.663238525390625, "global_step": 647360, "epoch": 7799} {"train_loss": -28.446752548217773, "global_step": 647361, "epoch": 7799} {"train_loss": -28.47071647644043, "global_step": 647362, "epoch": 7799} {"train_loss": -28.546438217163086, "global_step": 647363, "epoch": 7799} {"train_loss": -28.886444091796875, "global_step": 647364, "epoch": 7799} {"train_loss": -28.43536949157715, "global_step": 647365, "epoch": 7799} {"train_loss": -28.4708309173584, "global_step": 647366, "epoch": 7799} {"train_loss": -28.34963035583496, "global_step": 647367, "epoch": 7799} {"train_loss": -28.67496109008789, "global_step": 647368, "epoch": 7799} {"train_loss": -28.26312255859375, "global_step": 647369, "epoch": 7799} {"train_loss": -28.1357479095459, "global_step": 647370, "epoch": 7799} {"train_loss": -28.597631454467773, "global_step": 647371, "epoch": 7799} {"train_loss": -28.128747940063477, "global_step": 647372, "epoch": 7799} {"train_loss": -28.56630516052246, "global_step": 647373, "epoch": 7799} {"train_loss": -28.135969161987305, "global_step": 647374, "epoch": 7799} {"train_loss": -26.89013671875, "global_step": 647375, "epoch": 7799} {"train_loss": -26.695159912109375, "global_step": 647376, "epoch": 7799} {"train_loss": -26.9698429107666, "global_step": 647377, "epoch": 7799} {"train_loss": -28.129255294799805, "global_step": 647378, "epoch": 7799} {"train_loss": -28.358144760131836, "global_step": 647379, "epoch": 7799} {"train_loss": -27.142059326171875, "global_step": 647380, "epoch": 7799} {"train_loss": -27.79720115661621, "global_step": 647381, "epoch": 7799} {"train_loss": -27.901899337768555, "global_step": 647382, "epoch": 7799} {"train_loss": -27.849462509155273, "global_step": 647383, "epoch": 7799} {"train_loss": -28.05445671081543, "global_step": 647384, "epoch": 7799} {"train_loss": -28.009902954101562, "global_step": 647385, "epoch": 7799} {"train_loss": -28.08321189880371, "global_step": 647386, "epoch": 7799} {"train_loss": -28.273773193359375, "global_step": 647387, "epoch": 7799} {"train_loss": -28.181411743164062, "global_step": 647388, "epoch": 7799} {"train_loss": -28.217016220092773, "global_step": 647389, "epoch": 7799} {"train_loss": -27.93816566467285, "global_step": 647390, "epoch": 7799} {"train_loss": -28.462080001831055, "global_step": 647391, "epoch": 7799} {"train_loss": -28.108556747436523, "global_step": 647392, "epoch": 7799} {"train_loss": -28.22194480895996, "global_step": 647393, "epoch": 7799} {"train_loss": -28.301366806030273, "global_step": 647394, "epoch": 7799} {"train_loss": -28.41425895690918, "global_step": 647395, "epoch": 7799} {"train_loss": -28.245264053344727, "global_step": 647396, "epoch": 7799} {"train_loss": -28.259235382080078, "global_step": 647397, "epoch": 7799} {"train_loss": -28.364606857299805, "global_step": 647398, "epoch": 7799} {"train_loss": -28.12721783281809, "global_step": 647399, "epoch": 7799, "val_loss": 6657178.0} {"train_loss": -27.22492790222168, "global_step": 647400, "epoch": 7800} {"train_loss": -27.675277709960938, "global_step": 647401, "epoch": 7800} {"train_loss": -27.402999877929688, "global_step": 647402, "epoch": 7800} {"train_loss": -27.943872451782227, "global_step": 647403, "epoch": 7800} {"train_loss": -27.7283878326416, "global_step": 647404, "epoch": 7800} {"train_loss": -27.807281494140625, "global_step": 647405, "epoch": 7800} {"train_loss": -27.59551429748535, "global_step": 647406, "epoch": 7800} {"train_loss": -27.6710262298584, "global_step": 647407, "epoch": 7800} {"train_loss": -27.37762451171875, "global_step": 647408, "epoch": 7800} {"train_loss": -28.188039779663086, "global_step": 647409, "epoch": 7800} {"train_loss": -27.506977081298828, "global_step": 647410, "epoch": 7800} {"train_loss": -27.584890365600586, "global_step": 647411, "epoch": 7800} {"train_loss": -27.813779830932617, "global_step": 647412, "epoch": 7800} {"train_loss": -28.04998207092285, "global_step": 647413, "epoch": 7800} {"train_loss": -28.07700538635254, "global_step": 647414, "epoch": 7800} {"train_loss": -28.013525009155273, "global_step": 647415, "epoch": 7800} {"train_loss": -27.76356315612793, "global_step": 647416, "epoch": 7800} {"train_loss": -28.18146324157715, "global_step": 647417, "epoch": 7800} {"train_loss": -27.7882137298584, "global_step": 647418, "epoch": 7800} {"train_loss": -28.341272354125977, "global_step": 647419, "epoch": 7800} {"train_loss": -28.190744400024414, "global_step": 647420, "epoch": 7800} {"train_loss": -27.75604820251465, "global_step": 647421, "epoch": 7800} {"train_loss": -28.30352783203125, "global_step": 647422, "epoch": 7800} {"train_loss": -28.37468910217285, "global_step": 647423, "epoch": 7800} {"train_loss": -28.0704345703125, "global_step": 647424, "epoch": 7800} {"train_loss": -28.402021408081055, "global_step": 647425, "epoch": 7800} {"train_loss": -27.930130004882812, "global_step": 647426, "epoch": 7800} {"train_loss": -28.023725509643555, "global_step": 647427, "epoch": 7800} {"train_loss": -28.137914657592773, "global_step": 647428, "epoch": 7800} {"train_loss": -28.30625343322754, "global_step": 647429, "epoch": 7800} {"train_loss": -28.0819091796875, "global_step": 647430, "epoch": 7800} {"train_loss": -27.678083419799805, "global_step": 647431, "epoch": 7800} {"train_loss": -28.330856323242188, "global_step": 647432, "epoch": 7800} {"train_loss": -28.49256706237793, "global_step": 647433, "epoch": 7800} {"train_loss": -28.266571044921875, "global_step": 647434, "epoch": 7800} {"train_loss": -28.28480339050293, "global_step": 647435, "epoch": 7800} {"train_loss": -28.599767684936523, "global_step": 647436, "epoch": 7800} {"train_loss": -28.3392391204834, "global_step": 647437, "epoch": 7800} {"train_loss": -28.713857650756836, "global_step": 647438, "epoch": 7800} {"train_loss": -28.464590072631836, "global_step": 647439, "epoch": 7800} {"train_loss": -28.637836456298828, "global_step": 647440, "epoch": 7800} {"train_loss": -28.610387802124023, "global_step": 647441, "epoch": 7800} {"train_loss": -28.394641876220703, "global_step": 647442, "epoch": 7800} {"train_loss": -28.298080444335938, "global_step": 647443, "epoch": 7800} {"train_loss": -28.851200103759766, "global_step": 647444, "epoch": 7800} {"train_loss": -28.513946533203125, "global_step": 647445, "epoch": 7800} {"train_loss": -28.729520797729492, "global_step": 647446, "epoch": 7800} {"train_loss": -28.632169723510742, "global_step": 647447, "epoch": 7800} {"train_loss": -28.47151756286621, "global_step": 647448, "epoch": 7800} {"train_loss": -27.95942497253418, "global_step": 647449, "epoch": 7800} {"train_loss": -28.518604278564453, "global_step": 647450, "epoch": 7800} {"train_loss": -29.037099838256836, "global_step": 647451, "epoch": 7800} {"train_loss": -28.4080810546875, "global_step": 647452, "epoch": 7800} {"train_loss": -28.218902587890625, "global_step": 647453, "epoch": 7800} {"train_loss": -28.213361740112305, "global_step": 647454, "epoch": 7800} {"train_loss": -28.203229904174805, "global_step": 647455, "epoch": 7800} {"train_loss": -28.263874053955078, "global_step": 647456, "epoch": 7800} {"train_loss": -28.412841796875, "global_step": 647457, "epoch": 7800} {"train_loss": -28.388599395751953, "global_step": 647458, "epoch": 7800} {"train_loss": -28.441186904907227, "global_step": 647459, "epoch": 7800} {"train_loss": -28.824792861938477, "global_step": 647460, "epoch": 7800} {"train_loss": -28.24921989440918, "global_step": 647461, "epoch": 7800} {"train_loss": -28.364179611206055, "global_step": 647462, "epoch": 7800} {"train_loss": -28.22687339782715, "global_step": 647463, "epoch": 7800} {"train_loss": -28.300933837890625, "global_step": 647464, "epoch": 7800} {"train_loss": -28.384906768798828, "global_step": 647465, "epoch": 7800} {"train_loss": -28.304428100585938, "global_step": 647466, "epoch": 7800} {"train_loss": -28.063077926635742, "global_step": 647467, "epoch": 7800} {"train_loss": -28.25017738342285, "global_step": 647468, "epoch": 7800} {"train_loss": -28.369434356689453, "global_step": 647469, "epoch": 7800} {"train_loss": -28.600727081298828, "global_step": 647470, "epoch": 7800} {"train_loss": -28.23541831970215, "global_step": 647471, "epoch": 7800} {"train_loss": -28.416345596313477, "global_step": 647472, "epoch": 7800} {"train_loss": -28.525400161743164, "global_step": 647473, "epoch": 7800} {"train_loss": -28.04498291015625, "global_step": 647474, "epoch": 7800} {"train_loss": -28.2479190826416, "global_step": 647475, "epoch": 7800} {"train_loss": -28.162342071533203, "global_step": 647476, "epoch": 7800} {"train_loss": -27.942584991455078, "global_step": 647477, "epoch": 7800} {"train_loss": -27.834522247314453, "global_step": 647478, "epoch": 7800} {"train_loss": -27.78840446472168, "global_step": 647479, "epoch": 7800} {"train_loss": -28.114233016967773, "global_step": 647480, "epoch": 7800} {"train_loss": -28.148412704467773, "global_step": 647481, "epoch": 7800} {"train_loss": -28.191142599266694, "global_step": 647482, "epoch": 7800, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8181818181818182, "val_loss": 6652010.0} {"train_loss": -27.663227081298828, "global_step": 647483, "epoch": 7801} {"train_loss": -27.853229522705078, "global_step": 647484, "epoch": 7801} {"train_loss": -27.76154899597168, "global_step": 647485, "epoch": 7801} {"train_loss": -27.74894142150879, "global_step": 647486, "epoch": 7801} {"train_loss": -27.991779327392578, "global_step": 647487, "epoch": 7801} {"train_loss": -28.042463302612305, "global_step": 647488, "epoch": 7801} {"train_loss": -27.38164710998535, "global_step": 647489, "epoch": 7801} {"train_loss": -28.002323150634766, "global_step": 647490, "epoch": 7801} {"train_loss": -27.904630661010742, "global_step": 647491, "epoch": 7801} {"train_loss": -27.876733779907227, "global_step": 647492, "epoch": 7801} {"train_loss": -27.977310180664062, "global_step": 647493, "epoch": 7801} {"train_loss": -28.161264419555664, "global_step": 647494, "epoch": 7801} {"train_loss": -27.929182052612305, "global_step": 647495, "epoch": 7801} {"train_loss": -27.91753578186035, "global_step": 647496, "epoch": 7801} {"train_loss": -28.068347930908203, "global_step": 647497, "epoch": 7801} {"train_loss": -27.919214248657227, "global_step": 647498, "epoch": 7801} {"train_loss": -27.717971801757812, "global_step": 647499, "epoch": 7801} {"train_loss": -27.905487060546875, "global_step": 647500, "epoch": 7801} {"train_loss": -27.4808349609375, "global_step": 647501, "epoch": 7801} {"train_loss": -28.114206314086914, "global_step": 647502, "epoch": 7801} {"train_loss": -27.972394943237305, "global_step": 647503, "epoch": 7801} {"train_loss": -28.057050704956055, "global_step": 647504, "epoch": 7801} {"train_loss": -28.2419490814209, "global_step": 647505, "epoch": 7801} {"train_loss": -27.99216079711914, "global_step": 647506, "epoch": 7801} {"train_loss": -28.3680477142334, "global_step": 647507, "epoch": 7801} {"train_loss": -27.97353172302246, "global_step": 647508, "epoch": 7801} {"train_loss": -28.423797607421875, "global_step": 647509, "epoch": 7801} {"train_loss": -28.223657608032227, "global_step": 647510, "epoch": 7801} {"train_loss": -28.258621215820312, "global_step": 647511, "epoch": 7801} {"train_loss": -27.994953155517578, "global_step": 647512, "epoch": 7801} {"train_loss": -28.33234977722168, "global_step": 647513, "epoch": 7801} {"train_loss": -28.042516708374023, "global_step": 647514, "epoch": 7801} {"train_loss": -28.294950485229492, "global_step": 647515, "epoch": 7801} {"train_loss": -28.25264549255371, "global_step": 647516, "epoch": 7801} {"train_loss": -28.492389678955078, "global_step": 647517, "epoch": 7801} {"train_loss": -28.569379806518555, "global_step": 647518, "epoch": 7801} {"train_loss": -28.327817916870117, "global_step": 647519, "epoch": 7801} {"train_loss": -28.53900146484375, "global_step": 647520, "epoch": 7801} {"train_loss": -28.729822158813477, "global_step": 647521, "epoch": 7801} {"train_loss": -28.79046630859375, "global_step": 647522, "epoch": 7801} {"train_loss": -28.169530868530273, "global_step": 647523, "epoch": 7801} {"train_loss": -28.438644409179688, "global_step": 647524, "epoch": 7801} {"train_loss": -28.408239364624023, "global_step": 647525, "epoch": 7801} {"train_loss": -28.21095848083496, "global_step": 647526, "epoch": 7801} {"train_loss": -27.847858428955078, "global_step": 647527, "epoch": 7801} {"train_loss": -28.830352783203125, "global_step": 647528, "epoch": 7801} {"train_loss": -28.4875545501709, "global_step": 647529, "epoch": 7801} {"train_loss": -28.478946685791016, "global_step": 647530, "epoch": 7801} {"train_loss": -28.530719757080078, "global_step": 647531, "epoch": 7801} {"train_loss": -28.7202205657959, "global_step": 647532, "epoch": 7801} {"train_loss": -28.007104873657227, "global_step": 647533, "epoch": 7801} {"train_loss": -28.50319480895996, "global_step": 647534, "epoch": 7801} {"train_loss": -28.28516960144043, "global_step": 647535, "epoch": 7801} {"train_loss": -28.500457763671875, "global_step": 647536, "epoch": 7801} {"train_loss": -28.538665771484375, "global_step": 647537, "epoch": 7801} {"train_loss": -28.36086082458496, "global_step": 647538, "epoch": 7801} {"train_loss": -28.521289825439453, "global_step": 647539, "epoch": 7801} {"train_loss": -28.503189086914062, "global_step": 647540, "epoch": 7801} {"train_loss": -28.580427169799805, "global_step": 647541, "epoch": 7801} {"train_loss": -28.242639541625977, "global_step": 647542, "epoch": 7801} {"train_loss": -28.19209098815918, "global_step": 647543, "epoch": 7801} {"train_loss": -28.744281768798828, "global_step": 647544, "epoch": 7801} {"train_loss": -28.913808822631836, "global_step": 647545, "epoch": 7801} {"train_loss": -27.870197296142578, "global_step": 647546, "epoch": 7801} {"train_loss": -28.035755157470703, "global_step": 647547, "epoch": 7801} {"train_loss": -27.9725341796875, "global_step": 647548, "epoch": 7801} {"train_loss": -28.61342430114746, "global_step": 647549, "epoch": 7801} {"train_loss": -28.405258178710938, "global_step": 647550, "epoch": 7801} {"train_loss": -28.407453536987305, "global_step": 647551, "epoch": 7801} {"train_loss": -28.253454208374023, "global_step": 647552, "epoch": 7801} {"train_loss": -28.580978393554688, "global_step": 647553, "epoch": 7801} {"train_loss": -28.107725143432617, "global_step": 647554, "epoch": 7801} {"train_loss": -27.892383575439453, "global_step": 647555, "epoch": 7801} {"train_loss": -27.949682235717773, "global_step": 647556, "epoch": 7801} {"train_loss": -28.57724380493164, "global_step": 647557, "epoch": 7801} {"train_loss": -27.91560935974121, "global_step": 647558, "epoch": 7801} {"train_loss": -27.883499145507812, "global_step": 647559, "epoch": 7801} {"train_loss": -28.117658615112305, "global_step": 647560, "epoch": 7801} {"train_loss": -28.245405197143555, "global_step": 647561, "epoch": 7801} {"train_loss": -28.094602584838867, "global_step": 647562, "epoch": 7801} {"train_loss": -27.726327896118164, "global_step": 647563, "epoch": 7801} {"train_loss": -28.182580947875977, "global_step": 647564, "epoch": 7801} {"train_loss": -28.184703298361903, "global_step": 647565, "epoch": 7801, "val_loss": 6620204.0} {"train_loss": -26.882892608642578, "global_step": 647566, "epoch": 7802} {"train_loss": -27.016284942626953, "global_step": 647567, "epoch": 7802} {"train_loss": -27.450971603393555, "global_step": 647568, "epoch": 7802} {"train_loss": -27.922346115112305, "global_step": 647569, "epoch": 7802} {"train_loss": -27.26847267150879, "global_step": 647570, "epoch": 7802} {"train_loss": -27.2188777923584, "global_step": 647571, "epoch": 7802} {"train_loss": -27.837818145751953, "global_step": 647572, "epoch": 7802} {"train_loss": -27.119943618774414, "global_step": 647573, "epoch": 7802} {"train_loss": -27.53809928894043, "global_step": 647574, "epoch": 7802} {"train_loss": -27.645017623901367, "global_step": 647575, "epoch": 7802} {"train_loss": -27.344648361206055, "global_step": 647576, "epoch": 7802} {"train_loss": -27.83341407775879, "global_step": 647577, "epoch": 7802} {"train_loss": -27.552881240844727, "global_step": 647578, "epoch": 7802} {"train_loss": -28.08357048034668, "global_step": 647579, "epoch": 7802} {"train_loss": -27.859302520751953, "global_step": 647580, "epoch": 7802} {"train_loss": -27.961811065673828, "global_step": 647581, "epoch": 7802} {"train_loss": -28.030872344970703, "global_step": 647582, "epoch": 7802} {"train_loss": -27.6667423248291, "global_step": 647583, "epoch": 7802} {"train_loss": -28.193450927734375, "global_step": 647584, "epoch": 7802} {"train_loss": -27.980091094970703, "global_step": 647585, "epoch": 7802} {"train_loss": -28.19645118713379, "global_step": 647586, "epoch": 7802} {"train_loss": -28.166732788085938, "global_step": 647587, "epoch": 7802} {"train_loss": -28.202136993408203, "global_step": 647588, "epoch": 7802} {"train_loss": -28.155370712280273, "global_step": 647589, "epoch": 7802} {"train_loss": -28.208545684814453, "global_step": 647590, "epoch": 7802} {"train_loss": -28.110883712768555, "global_step": 647591, "epoch": 7802} {"train_loss": -28.646886825561523, "global_step": 647592, "epoch": 7802} {"train_loss": -27.94243812561035, "global_step": 647593, "epoch": 7802} {"train_loss": -28.26899528503418, "global_step": 647594, "epoch": 7802} {"train_loss": -28.08989906311035, "global_step": 647595, "epoch": 7802} {"train_loss": -28.344568252563477, "global_step": 647596, "epoch": 7802} {"train_loss": -28.59992027282715, "global_step": 647597, "epoch": 7802} {"train_loss": -28.507131576538086, "global_step": 647598, "epoch": 7802} {"train_loss": -28.154632568359375, "global_step": 647599, "epoch": 7802} {"train_loss": -28.550119400024414, "global_step": 647600, "epoch": 7802} {"train_loss": -28.83772087097168, "global_step": 647601, "epoch": 7802} {"train_loss": -28.174047470092773, "global_step": 647602, "epoch": 7802} {"train_loss": -28.198984146118164, "global_step": 647603, "epoch": 7802} {"train_loss": -28.374160766601562, "global_step": 647604, "epoch": 7802} {"train_loss": -28.593952178955078, "global_step": 647605, "epoch": 7802} {"train_loss": -28.750452041625977, "global_step": 647606, "epoch": 7802} {"train_loss": -28.68585777282715, "global_step": 647607, "epoch": 7802} {"train_loss": -28.691333770751953, "global_step": 647608, "epoch": 7802} {"train_loss": -28.69197654724121, "global_step": 647609, "epoch": 7802} {"train_loss": -28.9226131439209, "global_step": 647610, "epoch": 7802} {"train_loss": -27.96063804626465, "global_step": 647611, "epoch": 7802} {"train_loss": -27.747949600219727, "global_step": 647612, "epoch": 7802} {"train_loss": -27.724079132080078, "global_step": 647613, "epoch": 7802} {"train_loss": -27.571741104125977, "global_step": 647614, "epoch": 7802} {"train_loss": -28.13720703125, "global_step": 647615, "epoch": 7802} {"train_loss": -28.542633056640625, "global_step": 647616, "epoch": 7802} {"train_loss": -27.763961791992188, "global_step": 647617, "epoch": 7802} {"train_loss": -28.255170822143555, "global_step": 647618, "epoch": 7802} {"train_loss": -28.109460830688477, "global_step": 647619, "epoch": 7802} {"train_loss": -27.974292755126953, "global_step": 647620, "epoch": 7802} {"train_loss": -28.61942481994629, "global_step": 647621, "epoch": 7802} {"train_loss": -27.8505859375, "global_step": 647622, "epoch": 7802} {"train_loss": -28.117755889892578, "global_step": 647623, "epoch": 7802} {"train_loss": -28.37746238708496, "global_step": 647624, "epoch": 7802} {"train_loss": -28.19076919555664, "global_step": 647625, "epoch": 7802} {"train_loss": -28.617523193359375, "global_step": 647626, "epoch": 7802} {"train_loss": -28.673587799072266, "global_step": 647627, "epoch": 7802} {"train_loss": -28.31263542175293, "global_step": 647628, "epoch": 7802} {"train_loss": -28.2813720703125, "global_step": 647629, "epoch": 7802} {"train_loss": -28.345556259155273, "global_step": 647630, "epoch": 7802} {"train_loss": -28.650089263916016, "global_step": 647631, "epoch": 7802} {"train_loss": -28.7020263671875, "global_step": 647632, "epoch": 7802} {"train_loss": -28.198837280273438, "global_step": 647633, "epoch": 7802} {"train_loss": -28.36273765563965, "global_step": 647634, "epoch": 7802} {"train_loss": -28.514188766479492, "global_step": 647635, "epoch": 7802} {"train_loss": -28.53889274597168, "global_step": 647636, "epoch": 7802} {"train_loss": -28.333250045776367, "global_step": 647637, "epoch": 7802} {"train_loss": -28.335432052612305, "global_step": 647638, "epoch": 7802} {"train_loss": -28.32916831970215, "global_step": 647639, "epoch": 7802} {"train_loss": -27.322141647338867, "global_step": 647640, "epoch": 7802} {"train_loss": -25.682157516479492, "global_step": 647641, "epoch": 7802} {"train_loss": -21.164295196533203, "global_step": 647642, "epoch": 7802} {"train_loss": -19.312463760375977, "global_step": 647643, "epoch": 7802} {"train_loss": -25.396451950073242, "global_step": 647644, "epoch": 7802} {"train_loss": -25.20451545715332, "global_step": 647645, "epoch": 7802} {"train_loss": -24.679046630859375, "global_step": 647646, "epoch": 7802} {"train_loss": -25.359333038330078, "global_step": 647647, "epoch": 7802} {"train_loss": -27.74696290349386, "global_step": 647648, "epoch": 7802, "val_loss": 6592236.0} {"train_loss": -25.8874454498291, "global_step": 647649, "epoch": 7803} {"train_loss": -24.07187843322754, "global_step": 647650, "epoch": 7803} {"train_loss": -26.46897315979004, "global_step": 647651, "epoch": 7803} {"train_loss": -26.023786544799805, "global_step": 647652, "epoch": 7803} {"train_loss": -25.448713302612305, "global_step": 647653, "epoch": 7803} {"train_loss": -26.352827072143555, "global_step": 647654, "epoch": 7803} {"train_loss": -26.70554542541504, "global_step": 647655, "epoch": 7803} {"train_loss": -26.108154296875, "global_step": 647656, "epoch": 7803} {"train_loss": -26.420612335205078, "global_step": 647657, "epoch": 7803} {"train_loss": -26.710529327392578, "global_step": 647658, "epoch": 7803} {"train_loss": -26.6187686920166, "global_step": 647659, "epoch": 7803} {"train_loss": -27.0345458984375, "global_step": 647660, "epoch": 7803} {"train_loss": -26.615081787109375, "global_step": 647661, "epoch": 7803} {"train_loss": -26.89491081237793, "global_step": 647662, "epoch": 7803} {"train_loss": -26.845129013061523, "global_step": 647663, "epoch": 7803} {"train_loss": -26.8132381439209, "global_step": 647664, "epoch": 7803} {"train_loss": -27.106124877929688, "global_step": 647665, "epoch": 7803} {"train_loss": -26.73177146911621, "global_step": 647666, "epoch": 7803} {"train_loss": -27.005630493164062, "global_step": 647667, "epoch": 7803} {"train_loss": -27.016876220703125, "global_step": 647668, "epoch": 7803} {"train_loss": -26.853845596313477, "global_step": 647669, "epoch": 7803} {"train_loss": -27.3056640625, "global_step": 647670, "epoch": 7803} {"train_loss": -26.986074447631836, "global_step": 647671, "epoch": 7803} {"train_loss": -26.986846923828125, "global_step": 647672, "epoch": 7803} {"train_loss": -27.12491226196289, "global_step": 647673, "epoch": 7803} {"train_loss": -26.86492347717285, "global_step": 647674, "epoch": 7803} {"train_loss": -27.47994041442871, "global_step": 647675, "epoch": 7803} {"train_loss": -26.946226119995117, "global_step": 647676, "epoch": 7803} {"train_loss": -27.88385581970215, "global_step": 647677, "epoch": 7803} {"train_loss": -27.385623931884766, "global_step": 647678, "epoch": 7803} {"train_loss": -27.068069458007812, "global_step": 647679, "epoch": 7803} {"train_loss": -27.350482940673828, "global_step": 647680, "epoch": 7803} {"train_loss": -27.26778221130371, "global_step": 647681, "epoch": 7803} {"train_loss": -27.64788246154785, "global_step": 647682, "epoch": 7803} {"train_loss": -27.4614200592041, "global_step": 647683, "epoch": 7803} {"train_loss": -27.960973739624023, "global_step": 647684, "epoch": 7803} {"train_loss": -27.705570220947266, "global_step": 647685, "epoch": 7803} {"train_loss": -27.48978042602539, "global_step": 647686, "epoch": 7803} {"train_loss": -28.08984375, "global_step": 647687, "epoch": 7803} {"train_loss": -27.53700065612793, "global_step": 647688, "epoch": 7803} {"train_loss": -27.612918853759766, "global_step": 647689, "epoch": 7803} {"train_loss": -28.21906089782715, "global_step": 647690, "epoch": 7803} {"train_loss": -27.894805908203125, "global_step": 647691, "epoch": 7803} {"train_loss": -27.379133224487305, "global_step": 647692, "epoch": 7803} {"train_loss": -27.8935604095459, "global_step": 647693, "epoch": 7803} {"train_loss": -27.962430953979492, "global_step": 647694, "epoch": 7803} {"train_loss": -27.6302433013916, "global_step": 647695, "epoch": 7803} {"train_loss": -28.150354385375977, "global_step": 647696, "epoch": 7803} {"train_loss": -27.787689208984375, "global_step": 647697, "epoch": 7803} {"train_loss": -27.72199821472168, "global_step": 647698, "epoch": 7803} {"train_loss": -27.908039093017578, "global_step": 647699, "epoch": 7803} {"train_loss": -27.982324600219727, "global_step": 647700, "epoch": 7803} {"train_loss": -27.477392196655273, "global_step": 647701, "epoch": 7803} {"train_loss": -28.305028915405273, "global_step": 647702, "epoch": 7803} {"train_loss": -27.924280166625977, "global_step": 647703, "epoch": 7803} {"train_loss": -27.44257164001465, "global_step": 647704, "epoch": 7803} {"train_loss": -27.8438720703125, "global_step": 647705, "epoch": 7803} {"train_loss": -27.814054489135742, "global_step": 647706, "epoch": 7803} {"train_loss": -27.901203155517578, "global_step": 647707, "epoch": 7803} {"train_loss": -27.841123580932617, "global_step": 647708, "epoch": 7803} {"train_loss": -27.942060470581055, "global_step": 647709, "epoch": 7803} {"train_loss": -27.681257247924805, "global_step": 647710, "epoch": 7803} {"train_loss": -28.265928268432617, "global_step": 647711, "epoch": 7803} {"train_loss": -27.911334991455078, "global_step": 647712, "epoch": 7803} {"train_loss": -28.21160888671875, "global_step": 647713, "epoch": 7803} {"train_loss": -28.435745239257812, "global_step": 647714, "epoch": 7803} {"train_loss": -28.1484317779541, "global_step": 647715, "epoch": 7803} {"train_loss": -28.5341796875, "global_step": 647716, "epoch": 7803} {"train_loss": -27.994169235229492, "global_step": 647717, "epoch": 7803} {"train_loss": -28.43631362915039, "global_step": 647718, "epoch": 7803} {"train_loss": -28.57023048400879, "global_step": 647719, "epoch": 7803} {"train_loss": -28.411115646362305, "global_step": 647720, "epoch": 7803} {"train_loss": -28.11228370666504, "global_step": 647721, "epoch": 7803} {"train_loss": -28.173871994018555, "global_step": 647722, "epoch": 7803} {"train_loss": -28.5693302154541, "global_step": 647723, "epoch": 7803} {"train_loss": -28.391767501831055, "global_step": 647724, "epoch": 7803} {"train_loss": -28.306119918823242, "global_step": 647725, "epoch": 7803} {"train_loss": -28.213550567626953, "global_step": 647726, "epoch": 7803} {"train_loss": -28.364151000976562, "global_step": 647727, "epoch": 7803} {"train_loss": -28.48834800720215, "global_step": 647728, "epoch": 7803} {"train_loss": -28.380529403686523, "global_step": 647729, "epoch": 7803} {"train_loss": -28.54842185974121, "global_step": 647730, "epoch": 7803} {"train_loss": -27.50692896096103, "global_step": 647731, "epoch": 7803, "val_loss": 6682120.0} {"train_loss": -28.051233291625977, "global_step": 647732, "epoch": 7804} {"train_loss": -28.28851318359375, "global_step": 647733, "epoch": 7804} {"train_loss": -28.2105712890625, "global_step": 647734, "epoch": 7804} {"train_loss": -28.021148681640625, "global_step": 647735, "epoch": 7804} {"train_loss": -27.799896240234375, "global_step": 647736, "epoch": 7804} {"train_loss": -27.929569244384766, "global_step": 647737, "epoch": 7804} {"train_loss": -27.81244468688965, "global_step": 647738, "epoch": 7804} {"train_loss": -28.638797760009766, "global_step": 647739, "epoch": 7804} {"train_loss": -27.73182487487793, "global_step": 647740, "epoch": 7804} {"train_loss": -28.271692276000977, "global_step": 647741, "epoch": 7804} {"train_loss": -28.087909698486328, "global_step": 647742, "epoch": 7804} {"train_loss": -28.20539665222168, "global_step": 647743, "epoch": 7804} {"train_loss": -28.3145694732666, "global_step": 647744, "epoch": 7804} {"train_loss": -28.037973403930664, "global_step": 647745, "epoch": 7804} {"train_loss": -28.359378814697266, "global_step": 647746, "epoch": 7804} {"train_loss": -27.90940284729004, "global_step": 647747, "epoch": 7804} {"train_loss": -28.290836334228516, "global_step": 647748, "epoch": 7804} {"train_loss": -27.758453369140625, "global_step": 647749, "epoch": 7804} {"train_loss": -28.30433464050293, "global_step": 647750, "epoch": 7804} {"train_loss": -28.091535568237305, "global_step": 647751, "epoch": 7804} {"train_loss": -28.209869384765625, "global_step": 647752, "epoch": 7804} {"train_loss": -28.33991050720215, "global_step": 647753, "epoch": 7804} {"train_loss": -28.520437240600586, "global_step": 647754, "epoch": 7804} {"train_loss": -28.327070236206055, "global_step": 647755, "epoch": 7804} {"train_loss": -28.1243839263916, "global_step": 647756, "epoch": 7804} {"train_loss": -28.451202392578125, "global_step": 647757, "epoch": 7804} {"train_loss": -28.598896026611328, "global_step": 647758, "epoch": 7804} {"train_loss": -28.46051025390625, "global_step": 647759, "epoch": 7804} {"train_loss": -28.472503662109375, "global_step": 647760, "epoch": 7804} {"train_loss": -28.001983642578125, "global_step": 647761, "epoch": 7804} {"train_loss": -28.892847061157227, "global_step": 647762, "epoch": 7804} {"train_loss": -28.214948654174805, "global_step": 647763, "epoch": 7804} {"train_loss": -28.243133544921875, "global_step": 647764, "epoch": 7804} {"train_loss": -27.84600830078125, "global_step": 647765, "epoch": 7804} {"train_loss": -27.691299438476562, "global_step": 647766, "epoch": 7804} {"train_loss": -27.660348892211914, "global_step": 647767, "epoch": 7804} {"train_loss": -27.602792739868164, "global_step": 647768, "epoch": 7804} {"train_loss": -28.61797523498535, "global_step": 647769, "epoch": 7804} {"train_loss": -28.477521896362305, "global_step": 647770, "epoch": 7804} {"train_loss": -28.3787899017334, "global_step": 647771, "epoch": 7804} {"train_loss": -28.339426040649414, "global_step": 647772, "epoch": 7804} {"train_loss": -28.399505615234375, "global_step": 647773, "epoch": 7804} {"train_loss": -28.281259536743164, "global_step": 647774, "epoch": 7804} {"train_loss": -28.000579833984375, "global_step": 647775, "epoch": 7804} {"train_loss": -28.39306640625, "global_step": 647776, "epoch": 7804} {"train_loss": -28.301721572875977, "global_step": 647777, "epoch": 7804} {"train_loss": -28.183887481689453, "global_step": 647778, "epoch": 7804} {"train_loss": -28.370468139648438, "global_step": 647779, "epoch": 7804} {"train_loss": -28.37997817993164, "global_step": 647780, "epoch": 7804} {"train_loss": -28.325178146362305, "global_step": 647781, "epoch": 7804} {"train_loss": -28.17829704284668, "global_step": 647782, "epoch": 7804} {"train_loss": -28.42055320739746, "global_step": 647783, "epoch": 7804} {"train_loss": -28.338062286376953, "global_step": 647784, "epoch": 7804} {"train_loss": -28.566648483276367, "global_step": 647785, "epoch": 7804} {"train_loss": -28.3409481048584, "global_step": 647786, "epoch": 7804} {"train_loss": -28.686309814453125, "global_step": 647787, "epoch": 7804} {"train_loss": -28.333288192749023, "global_step": 647788, "epoch": 7804} {"train_loss": -28.412946701049805, "global_step": 647789, "epoch": 7804} {"train_loss": -28.720977783203125, "global_step": 647790, "epoch": 7804} {"train_loss": -28.83905029296875, "global_step": 647791, "epoch": 7804} {"train_loss": -28.5074405670166, "global_step": 647792, "epoch": 7804} {"train_loss": -28.485595703125, "global_step": 647793, "epoch": 7804} {"train_loss": -28.5963191986084, "global_step": 647794, "epoch": 7804} {"train_loss": -28.608753204345703, "global_step": 647795, "epoch": 7804} {"train_loss": -28.378625869750977, "global_step": 647796, "epoch": 7804} {"train_loss": -27.951833724975586, "global_step": 647797, "epoch": 7804} {"train_loss": -28.513147354125977, "global_step": 647798, "epoch": 7804} {"train_loss": -28.408004760742188, "global_step": 647799, "epoch": 7804} {"train_loss": -28.9201717376709, "global_step": 647800, "epoch": 7804} {"train_loss": -28.485992431640625, "global_step": 647801, "epoch": 7804} {"train_loss": -28.23270606994629, "global_step": 647802, "epoch": 7804} {"train_loss": -28.392114639282227, "global_step": 647803, "epoch": 7804} {"train_loss": -28.832782745361328, "global_step": 647804, "epoch": 7804} {"train_loss": -28.047407150268555, "global_step": 647805, "epoch": 7804} {"train_loss": -28.190277099609375, "global_step": 647806, "epoch": 7804} {"train_loss": -28.445892333984375, "global_step": 647807, "epoch": 7804} {"train_loss": -28.490530014038086, "global_step": 647808, "epoch": 7804} {"train_loss": -28.2493953704834, "global_step": 647809, "epoch": 7804} {"train_loss": -28.25745964050293, "global_step": 647810, "epoch": 7804} {"train_loss": -28.420873641967773, "global_step": 647811, "epoch": 7804} {"train_loss": -28.35590171813965, "global_step": 647812, "epoch": 7804} {"train_loss": -28.47100257873535, "global_step": 647813, "epoch": 7804} {"train_loss": -28.3068778945739, "global_step": 647814, "epoch": 7804, "val_loss": 6654775.5} {"train_loss": -27.457782745361328, "global_step": 647815, "epoch": 7805} {"train_loss": -27.31536293029785, "global_step": 647816, "epoch": 7805} {"train_loss": -27.269153594970703, "global_step": 647817, "epoch": 7805} {"train_loss": -28.01075553894043, "global_step": 647818, "epoch": 7805} {"train_loss": -27.257266998291016, "global_step": 647819, "epoch": 7805} {"train_loss": -27.807355880737305, "global_step": 647820, "epoch": 7805} {"train_loss": -27.56207275390625, "global_step": 647821, "epoch": 7805} {"train_loss": -27.906604766845703, "global_step": 647822, "epoch": 7805} {"train_loss": -27.84014892578125, "global_step": 647823, "epoch": 7805} {"train_loss": -27.9941463470459, "global_step": 647824, "epoch": 7805} {"train_loss": -27.93598747253418, "global_step": 647825, "epoch": 7805} {"train_loss": -27.38507080078125, "global_step": 647826, "epoch": 7805} {"train_loss": -28.00921058654785, "global_step": 647827, "epoch": 7805} {"train_loss": -27.71071434020996, "global_step": 647828, "epoch": 7805} {"train_loss": -27.876981735229492, "global_step": 647829, "epoch": 7805} {"train_loss": -27.804107666015625, "global_step": 647830, "epoch": 7805} {"train_loss": -27.931522369384766, "global_step": 647831, "epoch": 7805} {"train_loss": -27.918415069580078, "global_step": 647832, "epoch": 7805} {"train_loss": -28.024810791015625, "global_step": 647833, "epoch": 7805} {"train_loss": -27.966171264648438, "global_step": 647834, "epoch": 7805} {"train_loss": -27.83319091796875, "global_step": 647835, "epoch": 7805} {"train_loss": -28.079710006713867, "global_step": 647836, "epoch": 7805} {"train_loss": -28.09735679626465, "global_step": 647837, "epoch": 7805} {"train_loss": -28.45472526550293, "global_step": 647838, "epoch": 7805} {"train_loss": -28.05243492126465, "global_step": 647839, "epoch": 7805} {"train_loss": -28.27701187133789, "global_step": 647840, "epoch": 7805} {"train_loss": -28.0625, "global_step": 647841, "epoch": 7805} {"train_loss": -28.33051109313965, "global_step": 647842, "epoch": 7805} {"train_loss": -28.591129302978516, "global_step": 647843, "epoch": 7805} {"train_loss": -27.913389205932617, "global_step": 647844, "epoch": 7805} {"train_loss": -28.332258224487305, "global_step": 647845, "epoch": 7805} {"train_loss": -28.571008682250977, "global_step": 647846, "epoch": 7805} {"train_loss": -28.37982749938965, "global_step": 647847, "epoch": 7805} {"train_loss": -27.989145278930664, "global_step": 647848, "epoch": 7805} {"train_loss": -28.186771392822266, "global_step": 647849, "epoch": 7805} {"train_loss": -28.27789306640625, "global_step": 647850, "epoch": 7805} {"train_loss": -28.293027877807617, "global_step": 647851, "epoch": 7805} {"train_loss": -28.21232032775879, "global_step": 647852, "epoch": 7805} {"train_loss": -28.199792861938477, "global_step": 647853, "epoch": 7805} {"train_loss": -28.25392723083496, "global_step": 647854, "epoch": 7805} {"train_loss": -28.192611694335938, "global_step": 647855, "epoch": 7805} {"train_loss": -27.98186683654785, "global_step": 647856, "epoch": 7805} {"train_loss": -28.722570419311523, "global_step": 647857, "epoch": 7805} {"train_loss": -28.451343536376953, "global_step": 647858, "epoch": 7805} {"train_loss": -28.373706817626953, "global_step": 647859, "epoch": 7805} {"train_loss": -28.414844512939453, "global_step": 647860, "epoch": 7805} {"train_loss": -28.3700008392334, "global_step": 647861, "epoch": 7805} {"train_loss": -28.41033363342285, "global_step": 647862, "epoch": 7805} {"train_loss": -28.542688369750977, "global_step": 647863, "epoch": 7805} {"train_loss": -28.199926376342773, "global_step": 647864, "epoch": 7805} {"train_loss": -28.441030502319336, "global_step": 647865, "epoch": 7805} {"train_loss": -28.717121124267578, "global_step": 647866, "epoch": 7805} {"train_loss": -28.240808486938477, "global_step": 647867, "epoch": 7805} {"train_loss": -28.279468536376953, "global_step": 647868, "epoch": 7805} {"train_loss": -28.62204933166504, "global_step": 647869, "epoch": 7805} {"train_loss": -28.463979721069336, "global_step": 647870, "epoch": 7805} {"train_loss": -28.716283798217773, "global_step": 647871, "epoch": 7805} {"train_loss": -28.12836265563965, "global_step": 647872, "epoch": 7805} {"train_loss": -28.227371215820312, "global_step": 647873, "epoch": 7805} {"train_loss": -28.409271240234375, "global_step": 647874, "epoch": 7805} {"train_loss": -28.541900634765625, "global_step": 647875, "epoch": 7805} {"train_loss": -28.211889266967773, "global_step": 647876, "epoch": 7805} {"train_loss": -28.365259170532227, "global_step": 647877, "epoch": 7805} {"train_loss": -28.365863800048828, "global_step": 647878, "epoch": 7805} {"train_loss": -28.747236251831055, "global_step": 647879, "epoch": 7805} {"train_loss": -28.357166290283203, "global_step": 647880, "epoch": 7805} {"train_loss": -28.59551429748535, "global_step": 647881, "epoch": 7805} {"train_loss": -28.02564811706543, "global_step": 647882, "epoch": 7805} {"train_loss": -28.398862838745117, "global_step": 647883, "epoch": 7805} {"train_loss": -28.52736473083496, "global_step": 647884, "epoch": 7805} {"train_loss": -28.32059097290039, "global_step": 647885, "epoch": 7805} {"train_loss": -28.3220157623291, "global_step": 647886, "epoch": 7805} {"train_loss": -28.327621459960938, "global_step": 647887, "epoch": 7805} {"train_loss": -28.230152130126953, "global_step": 647888, "epoch": 7805} {"train_loss": -28.3765926361084, "global_step": 647889, "epoch": 7805} {"train_loss": -28.405805587768555, "global_step": 647890, "epoch": 7805} {"train_loss": -28.215503692626953, "global_step": 647891, "epoch": 7805} {"train_loss": -28.089391708374023, "global_step": 647892, "epoch": 7805} {"train_loss": -28.65656089782715, "global_step": 647893, "epoch": 7805} {"train_loss": -28.52373695373535, "global_step": 647894, "epoch": 7805} {"train_loss": -28.391376495361328, "global_step": 647895, "epoch": 7805} {"train_loss": -28.40570068359375, "global_step": 647896, "epoch": 7805} {"train_loss": -28.206108483923487, "global_step": 647897, "epoch": 7805, "val_loss": 6672397.0} {"train_loss": -27.802734375, "global_step": 647898, "epoch": 7806} {"train_loss": -27.19171142578125, "global_step": 647899, "epoch": 7806} {"train_loss": -26.7242488861084, "global_step": 647900, "epoch": 7806} {"train_loss": -28.08404541015625, "global_step": 647901, "epoch": 7806} {"train_loss": -28.066553115844727, "global_step": 647902, "epoch": 7806} {"train_loss": -27.241209030151367, "global_step": 647903, "epoch": 7806} {"train_loss": -27.997756958007812, "global_step": 647904, "epoch": 7806} {"train_loss": -27.89044761657715, "global_step": 647905, "epoch": 7806} {"train_loss": -27.88126564025879, "global_step": 647906, "epoch": 7806} {"train_loss": -28.328632354736328, "global_step": 647907, "epoch": 7806} {"train_loss": -27.56342887878418, "global_step": 647908, "epoch": 7806} {"train_loss": -28.06892204284668, "global_step": 647909, "epoch": 7806} {"train_loss": -27.995080947875977, "global_step": 647910, "epoch": 7806} {"train_loss": -28.109373092651367, "global_step": 647911, "epoch": 7806} {"train_loss": -28.352880477905273, "global_step": 647912, "epoch": 7806} {"train_loss": -28.149808883666992, "global_step": 647913, "epoch": 7806} {"train_loss": -28.213537216186523, "global_step": 647914, "epoch": 7806} {"train_loss": -28.358976364135742, "global_step": 647915, "epoch": 7806} {"train_loss": -27.9045352935791, "global_step": 647916, "epoch": 7806} {"train_loss": -28.324811935424805, "global_step": 647917, "epoch": 7806} {"train_loss": -28.276721954345703, "global_step": 647918, "epoch": 7806} {"train_loss": -28.690454483032227, "global_step": 647919, "epoch": 7806} {"train_loss": -28.340787887573242, "global_step": 647920, "epoch": 7806} {"train_loss": -28.439838409423828, "global_step": 647921, "epoch": 7806} {"train_loss": -27.9724063873291, "global_step": 647922, "epoch": 7806} {"train_loss": -27.819812774658203, "global_step": 647923, "epoch": 7806} {"train_loss": -28.41383171081543, "global_step": 647924, "epoch": 7806} {"train_loss": -28.125268936157227, "global_step": 647925, "epoch": 7806} {"train_loss": -28.313037872314453, "global_step": 647926, "epoch": 7806} {"train_loss": -28.627771377563477, "global_step": 647927, "epoch": 7806} {"train_loss": -28.232446670532227, "global_step": 647928, "epoch": 7806} {"train_loss": -28.261322021484375, "global_step": 647929, "epoch": 7806} {"train_loss": -28.156784057617188, "global_step": 647930, "epoch": 7806} {"train_loss": -28.23304557800293, "global_step": 647931, "epoch": 7806} {"train_loss": -28.605993270874023, "global_step": 647932, "epoch": 7806} {"train_loss": -28.22011375427246, "global_step": 647933, "epoch": 7806} {"train_loss": -28.073781967163086, "global_step": 647934, "epoch": 7806} {"train_loss": -28.0125732421875, "global_step": 647935, "epoch": 7806} {"train_loss": -28.092126846313477, "global_step": 647936, "epoch": 7806} {"train_loss": -28.141199111938477, "global_step": 647937, "epoch": 7806} {"train_loss": -28.192548751831055, "global_step": 647938, "epoch": 7806} {"train_loss": -28.401090621948242, "global_step": 647939, "epoch": 7806} {"train_loss": -28.496265411376953, "global_step": 647940, "epoch": 7806} {"train_loss": -28.269384384155273, "global_step": 647941, "epoch": 7806} {"train_loss": -28.198429107666016, "global_step": 647942, "epoch": 7806} {"train_loss": -27.80898094177246, "global_step": 647943, "epoch": 7806} {"train_loss": -28.541845321655273, "global_step": 647944, "epoch": 7806} {"train_loss": -28.238296508789062, "global_step": 647945, "epoch": 7806} {"train_loss": -28.131357192993164, "global_step": 647946, "epoch": 7806} {"train_loss": -28.481943130493164, "global_step": 647947, "epoch": 7806} {"train_loss": -28.686065673828125, "global_step": 647948, "epoch": 7806} {"train_loss": -28.0296573638916, "global_step": 647949, "epoch": 7806} {"train_loss": -28.357473373413086, "global_step": 647950, "epoch": 7806} {"train_loss": -28.6530704498291, "global_step": 647951, "epoch": 7806} {"train_loss": -28.480838775634766, "global_step": 647952, "epoch": 7806} {"train_loss": -28.05328369140625, "global_step": 647953, "epoch": 7806} {"train_loss": -28.088232040405273, "global_step": 647954, "epoch": 7806} {"train_loss": -28.1463565826416, "global_step": 647955, "epoch": 7806} {"train_loss": -27.846479415893555, "global_step": 647956, "epoch": 7806} {"train_loss": -28.240087509155273, "global_step": 647957, "epoch": 7806} {"train_loss": -28.453161239624023, "global_step": 647958, "epoch": 7806} {"train_loss": -28.160001754760742, "global_step": 647959, "epoch": 7806} {"train_loss": -28.19108009338379, "global_step": 647960, "epoch": 7806} {"train_loss": -28.456806182861328, "global_step": 647961, "epoch": 7806} {"train_loss": -28.220746994018555, "global_step": 647962, "epoch": 7806} {"train_loss": -28.105993270874023, "global_step": 647963, "epoch": 7806} {"train_loss": -28.10804557800293, "global_step": 647964, "epoch": 7806} {"train_loss": -28.573644638061523, "global_step": 647965, "epoch": 7806} {"train_loss": -28.293975830078125, "global_step": 647966, "epoch": 7806} {"train_loss": -28.367563247680664, "global_step": 647967, "epoch": 7806} {"train_loss": -28.476613998413086, "global_step": 647968, "epoch": 7806} {"train_loss": -28.586950302124023, "global_step": 647969, "epoch": 7806} {"train_loss": -28.41059684753418, "global_step": 647970, "epoch": 7806} {"train_loss": -28.615137100219727, "global_step": 647971, "epoch": 7806} {"train_loss": -28.398883819580078, "global_step": 647972, "epoch": 7806} {"train_loss": -28.359296798706055, "global_step": 647973, "epoch": 7806} {"train_loss": -28.446767807006836, "global_step": 647974, "epoch": 7806} {"train_loss": -28.79385757446289, "global_step": 647975, "epoch": 7806} {"train_loss": -28.28312110900879, "global_step": 647976, "epoch": 7806} {"train_loss": -28.175601959228516, "global_step": 647977, "epoch": 7806} {"train_loss": -28.557754516601562, "global_step": 647978, "epoch": 7806} {"train_loss": -28.362966537475586, "global_step": 647979, "epoch": 7806} {"train_loss": -28.2310750800443, "global_step": 647980, "epoch": 7806, "val_loss": 6679916.0} {"train_loss": -27.9737606048584, "global_step": 647981, "epoch": 7807} {"train_loss": -28.152128219604492, "global_step": 647982, "epoch": 7807} {"train_loss": -27.277328491210938, "global_step": 647983, "epoch": 7807} {"train_loss": -27.832345962524414, "global_step": 647984, "epoch": 7807} {"train_loss": -27.910947799682617, "global_step": 647985, "epoch": 7807} {"train_loss": -28.140228271484375, "global_step": 647986, "epoch": 7807} {"train_loss": -27.627613067626953, "global_step": 647987, "epoch": 7807} {"train_loss": -27.940937042236328, "global_step": 647988, "epoch": 7807} {"train_loss": -28.03584098815918, "global_step": 647989, "epoch": 7807} {"train_loss": -28.0026798248291, "global_step": 647990, "epoch": 7807} {"train_loss": -27.990102767944336, "global_step": 647991, "epoch": 7807} {"train_loss": -28.264936447143555, "global_step": 647992, "epoch": 7807} {"train_loss": -28.356672286987305, "global_step": 647993, "epoch": 7807} {"train_loss": -27.93975257873535, "global_step": 647994, "epoch": 7807} {"train_loss": -28.2692813873291, "global_step": 647995, "epoch": 7807} {"train_loss": -28.53474235534668, "global_step": 647996, "epoch": 7807} {"train_loss": -28.417219161987305, "global_step": 647997, "epoch": 7807} {"train_loss": -28.479522705078125, "global_step": 647998, "epoch": 7807} {"train_loss": -28.0542049407959, "global_step": 647999, "epoch": 7807} {"train_loss": -28.36079216003418, "global_step": 648000, "epoch": 7807} {"train_loss": -27.957075119018555, "global_step": 648001, "epoch": 7807} {"train_loss": -28.33304214477539, "global_step": 648002, "epoch": 7807} {"train_loss": -28.594135284423828, "global_step": 648003, "epoch": 7807} {"train_loss": -28.143674850463867, "global_step": 648004, "epoch": 7807} {"train_loss": -28.203022003173828, "global_step": 648005, "epoch": 7807} {"train_loss": -27.998138427734375, "global_step": 648006, "epoch": 7807} {"train_loss": -28.7993106842041, "global_step": 648007, "epoch": 7807} {"train_loss": -28.267322540283203, "global_step": 648008, "epoch": 7807} {"train_loss": -27.913726806640625, "global_step": 648009, "epoch": 7807} {"train_loss": -28.223377227783203, "global_step": 648010, "epoch": 7807} {"train_loss": -28.549299240112305, "global_step": 648011, "epoch": 7807} {"train_loss": -28.516088485717773, "global_step": 648012, "epoch": 7807} {"train_loss": -28.571975708007812, "global_step": 648013, "epoch": 7807} {"train_loss": -28.235509872436523, "global_step": 648014, "epoch": 7807} {"train_loss": -28.840356826782227, "global_step": 648015, "epoch": 7807} {"train_loss": -28.454755783081055, "global_step": 648016, "epoch": 7807} {"train_loss": -28.077573776245117, "global_step": 648017, "epoch": 7807} {"train_loss": -28.06085205078125, "global_step": 648018, "epoch": 7807} {"train_loss": -28.662870407104492, "global_step": 648019, "epoch": 7807} {"train_loss": -28.006620407104492, "global_step": 648020, "epoch": 7807} {"train_loss": -27.268707275390625, "global_step": 648021, "epoch": 7807} {"train_loss": -27.4836483001709, "global_step": 648022, "epoch": 7807} {"train_loss": -27.917219161987305, "global_step": 648023, "epoch": 7807} {"train_loss": -28.302295684814453, "global_step": 648024, "epoch": 7807} {"train_loss": -28.337371826171875, "global_step": 648025, "epoch": 7807} {"train_loss": -27.536386489868164, "global_step": 648026, "epoch": 7807} {"train_loss": -28.18549156188965, "global_step": 648027, "epoch": 7807} {"train_loss": -28.263315200805664, "global_step": 648028, "epoch": 7807} {"train_loss": -28.097631454467773, "global_step": 648029, "epoch": 7807} {"train_loss": -28.48388671875, "global_step": 648030, "epoch": 7807} {"train_loss": -28.088489532470703, "global_step": 648031, "epoch": 7807} {"train_loss": -28.058521270751953, "global_step": 648032, "epoch": 7807} {"train_loss": -27.963001251220703, "global_step": 648033, "epoch": 7807} {"train_loss": -28.428028106689453, "global_step": 648034, "epoch": 7807} {"train_loss": -28.195785522460938, "global_step": 648035, "epoch": 7807} {"train_loss": -28.370752334594727, "global_step": 648036, "epoch": 7807} {"train_loss": -28.216821670532227, "global_step": 648037, "epoch": 7807} {"train_loss": -28.224018096923828, "global_step": 648038, "epoch": 7807} {"train_loss": -28.453176498413086, "global_step": 648039, "epoch": 7807} {"train_loss": -28.139318466186523, "global_step": 648040, "epoch": 7807} {"train_loss": -28.122533798217773, "global_step": 648041, "epoch": 7807} {"train_loss": -28.543277740478516, "global_step": 648042, "epoch": 7807} {"train_loss": -28.080097198486328, "global_step": 648043, "epoch": 7807} {"train_loss": -28.338666915893555, "global_step": 648044, "epoch": 7807} {"train_loss": -28.993026733398438, "global_step": 648045, "epoch": 7807} {"train_loss": -28.3018741607666, "global_step": 648046, "epoch": 7807} {"train_loss": -28.229476928710938, "global_step": 648047, "epoch": 7807} {"train_loss": -28.236398696899414, "global_step": 648048, "epoch": 7807} {"train_loss": -28.49213218688965, "global_step": 648049, "epoch": 7807} {"train_loss": -28.495899200439453, "global_step": 648050, "epoch": 7807} {"train_loss": -28.04396629333496, "global_step": 648051, "epoch": 7807} {"train_loss": -28.11005210876465, "global_step": 648052, "epoch": 7807} {"train_loss": -28.4022274017334, "global_step": 648053, "epoch": 7807} {"train_loss": -28.244070053100586, "global_step": 648054, "epoch": 7807} {"train_loss": -28.35467529296875, "global_step": 648055, "epoch": 7807} {"train_loss": -28.13043212890625, "global_step": 648056, "epoch": 7807} {"train_loss": -28.06369972229004, "global_step": 648057, "epoch": 7807} {"train_loss": -28.5259952545166, "global_step": 648058, "epoch": 7807} {"train_loss": -28.2896728515625, "global_step": 648059, "epoch": 7807} {"train_loss": -28.235260009765625, "global_step": 648060, "epoch": 7807} {"train_loss": -28.413665771484375, "global_step": 648061, "epoch": 7807} {"train_loss": -28.17681312561035, "global_step": 648062, "epoch": 7807} {"train_loss": -28.1939542379724, "global_step": 648063, "epoch": 7807, "val_loss": 6710496.5} {"train_loss": -27.801532745361328, "global_step": 648064, "epoch": 7808} {"train_loss": -27.47011375427246, "global_step": 648065, "epoch": 7808} {"train_loss": -27.839542388916016, "global_step": 648066, "epoch": 7808} {"train_loss": -28.126911163330078, "global_step": 648067, "epoch": 7808} {"train_loss": -28.13746452331543, "global_step": 648068, "epoch": 7808} {"train_loss": -27.841033935546875, "global_step": 648069, "epoch": 7808} {"train_loss": -27.771265029907227, "global_step": 648070, "epoch": 7808} {"train_loss": -27.775991439819336, "global_step": 648071, "epoch": 7808} {"train_loss": -28.203001022338867, "global_step": 648072, "epoch": 7808} {"train_loss": -27.83646011352539, "global_step": 648073, "epoch": 7808} {"train_loss": -28.344614028930664, "global_step": 648074, "epoch": 7808} {"train_loss": -28.368228912353516, "global_step": 648075, "epoch": 7808} {"train_loss": -27.852720260620117, "global_step": 648076, "epoch": 7808} {"train_loss": -28.301733016967773, "global_step": 648077, "epoch": 7808} {"train_loss": -28.284814834594727, "global_step": 648078, "epoch": 7808} {"train_loss": -28.2200927734375, "global_step": 648079, "epoch": 7808} {"train_loss": -28.500503540039062, "global_step": 648080, "epoch": 7808} {"train_loss": -27.9362850189209, "global_step": 648081, "epoch": 7808} {"train_loss": -28.096906661987305, "global_step": 648082, "epoch": 7808} {"train_loss": -28.577451705932617, "global_step": 648083, "epoch": 7808} {"train_loss": -28.134729385375977, "global_step": 648084, "epoch": 7808} {"train_loss": -27.807037353515625, "global_step": 648085, "epoch": 7808} {"train_loss": -27.870481491088867, "global_step": 648086, "epoch": 7808} {"train_loss": -26.667139053344727, "global_step": 648087, "epoch": 7808} {"train_loss": -26.854480743408203, "global_step": 648088, "epoch": 7808} {"train_loss": -28.501768112182617, "global_step": 648089, "epoch": 7808} {"train_loss": -27.349029541015625, "global_step": 648090, "epoch": 7808} {"train_loss": -26.949268341064453, "global_step": 648091, "epoch": 7808} {"train_loss": -28.30401039123535, "global_step": 648092, "epoch": 7808} {"train_loss": -27.469757080078125, "global_step": 648093, "epoch": 7808} {"train_loss": -28.042760848999023, "global_step": 648094, "epoch": 7808} {"train_loss": -27.7440185546875, "global_step": 648095, "epoch": 7808} {"train_loss": -28.419891357421875, "global_step": 648096, "epoch": 7808} {"train_loss": -27.942136764526367, "global_step": 648097, "epoch": 7808} {"train_loss": -28.08806800842285, "global_step": 648098, "epoch": 7808} {"train_loss": -27.731149673461914, "global_step": 648099, "epoch": 7808} {"train_loss": -28.03046226501465, "global_step": 648100, "epoch": 7808} {"train_loss": -27.94379997253418, "global_step": 648101, "epoch": 7808} {"train_loss": -27.83561134338379, "global_step": 648102, "epoch": 7808} {"train_loss": -28.011825561523438, "global_step": 648103, "epoch": 7808} {"train_loss": -28.130685806274414, "global_step": 648104, "epoch": 7808} {"train_loss": -27.961633682250977, "global_step": 648105, "epoch": 7808} {"train_loss": -28.217117309570312, "global_step": 648106, "epoch": 7808} {"train_loss": -27.695859909057617, "global_step": 648107, "epoch": 7808} {"train_loss": -28.229694366455078, "global_step": 648108, "epoch": 7808} {"train_loss": -27.849136352539062, "global_step": 648109, "epoch": 7808} {"train_loss": -28.5234375, "global_step": 648110, "epoch": 7808} {"train_loss": -28.1610050201416, "global_step": 648111, "epoch": 7808} {"train_loss": -28.335968017578125, "global_step": 648112, "epoch": 7808} {"train_loss": -27.980005264282227, "global_step": 648113, "epoch": 7808} {"train_loss": -28.271154403686523, "global_step": 648114, "epoch": 7808} {"train_loss": -27.954381942749023, "global_step": 648115, "epoch": 7808} {"train_loss": -28.505020141601562, "global_step": 648116, "epoch": 7808} {"train_loss": -28.477014541625977, "global_step": 648117, "epoch": 7808} {"train_loss": -28.037832260131836, "global_step": 648118, "epoch": 7808} {"train_loss": -28.466022491455078, "global_step": 648119, "epoch": 7808} {"train_loss": -28.1103458404541, "global_step": 648120, "epoch": 7808} {"train_loss": -28.30025291442871, "global_step": 648121, "epoch": 7808} {"train_loss": -28.62203025817871, "global_step": 648122, "epoch": 7808} {"train_loss": -28.395172119140625, "global_step": 648123, "epoch": 7808} {"train_loss": -28.724233627319336, "global_step": 648124, "epoch": 7808} {"train_loss": -28.292261123657227, "global_step": 648125, "epoch": 7808} {"train_loss": -28.17317008972168, "global_step": 648126, "epoch": 7808} {"train_loss": -28.28240966796875, "global_step": 648127, "epoch": 7808} {"train_loss": -28.501386642456055, "global_step": 648128, "epoch": 7808} {"train_loss": -28.51947021484375, "global_step": 648129, "epoch": 7808} {"train_loss": -28.209781646728516, "global_step": 648130, "epoch": 7808} {"train_loss": -27.89832878112793, "global_step": 648131, "epoch": 7808} {"train_loss": -28.335844039916992, "global_step": 648132, "epoch": 7808} {"train_loss": -28.27398109436035, "global_step": 648133, "epoch": 7808} {"train_loss": -28.235803604125977, "global_step": 648134, "epoch": 7808} {"train_loss": -28.09832191467285, "global_step": 648135, "epoch": 7808} {"train_loss": -28.5876522064209, "global_step": 648136, "epoch": 7808} {"train_loss": -28.398014068603516, "global_step": 648137, "epoch": 7808} {"train_loss": -28.44001579284668, "global_step": 648138, "epoch": 7808} {"train_loss": -28.4415283203125, "global_step": 648139, "epoch": 7808} {"train_loss": -28.17181396484375, "global_step": 648140, "epoch": 7808} {"train_loss": -28.383329391479492, "global_step": 648141, "epoch": 7808} {"train_loss": -28.213214874267578, "global_step": 648142, "epoch": 7808} {"train_loss": -28.45658302307129, "global_step": 648143, "epoch": 7808} {"train_loss": -28.563199996948242, "global_step": 648144, "epoch": 7808} {"train_loss": -28.62445068359375, "global_step": 648145, "epoch": 7808} {"train_loss": -28.117043001105987, "global_step": 648146, "epoch": 7808, "val_loss": 6681179.0} {"train_loss": -26.90411376953125, "global_step": 648147, "epoch": 7809} {"train_loss": -27.13523292541504, "global_step": 648148, "epoch": 7809} {"train_loss": -28.251657485961914, "global_step": 648149, "epoch": 7809} {"train_loss": -26.89593505859375, "global_step": 648150, "epoch": 7809} {"train_loss": -27.416614532470703, "global_step": 648151, "epoch": 7809} {"train_loss": -26.63140869140625, "global_step": 648152, "epoch": 7809} {"train_loss": -27.556615829467773, "global_step": 648153, "epoch": 7809} {"train_loss": -27.1234188079834, "global_step": 648154, "epoch": 7809} {"train_loss": -27.461292266845703, "global_step": 648155, "epoch": 7809} {"train_loss": -27.490697860717773, "global_step": 648156, "epoch": 7809} {"train_loss": -27.6197452545166, "global_step": 648157, "epoch": 7809} {"train_loss": -27.737695693969727, "global_step": 648158, "epoch": 7809} {"train_loss": -27.866657257080078, "global_step": 648159, "epoch": 7809} {"train_loss": -27.47821044921875, "global_step": 648160, "epoch": 7809} {"train_loss": -27.892446517944336, "global_step": 648161, "epoch": 7809} {"train_loss": -27.9202823638916, "global_step": 648162, "epoch": 7809} {"train_loss": -27.79398536682129, "global_step": 648163, "epoch": 7809} {"train_loss": -28.060962677001953, "global_step": 648164, "epoch": 7809} {"train_loss": -27.822345733642578, "global_step": 648165, "epoch": 7809} {"train_loss": -27.711517333984375, "global_step": 648166, "epoch": 7809} {"train_loss": -27.748645782470703, "global_step": 648167, "epoch": 7809} {"train_loss": -28.188451766967773, "global_step": 648168, "epoch": 7809} {"train_loss": -28.183324813842773, "global_step": 648169, "epoch": 7809} {"train_loss": -28.22568702697754, "global_step": 648170, "epoch": 7809} {"train_loss": -27.70314598083496, "global_step": 648171, "epoch": 7809} {"train_loss": -27.993000030517578, "global_step": 648172, "epoch": 7809} {"train_loss": -27.9149227142334, "global_step": 648173, "epoch": 7809} {"train_loss": -27.94087028503418, "global_step": 648174, "epoch": 7809} {"train_loss": -28.35089111328125, "global_step": 648175, "epoch": 7809} {"train_loss": -28.1364803314209, "global_step": 648176, "epoch": 7809} {"train_loss": -27.83473014831543, "global_step": 648177, "epoch": 7809} {"train_loss": -28.314611434936523, "global_step": 648178, "epoch": 7809} {"train_loss": -27.817407608032227, "global_step": 648179, "epoch": 7809} {"train_loss": -28.23598289489746, "global_step": 648180, "epoch": 7809} {"train_loss": -28.194782257080078, "global_step": 648181, "epoch": 7809} {"train_loss": -28.626951217651367, "global_step": 648182, "epoch": 7809} {"train_loss": -28.213031768798828, "global_step": 648183, "epoch": 7809} {"train_loss": -28.5501651763916, "global_step": 648184, "epoch": 7809} {"train_loss": -27.75411033630371, "global_step": 648185, "epoch": 7809} {"train_loss": -27.970539093017578, "global_step": 648186, "epoch": 7809} {"train_loss": -28.324560165405273, "global_step": 648187, "epoch": 7809} {"train_loss": -28.5216007232666, "global_step": 648188, "epoch": 7809} {"train_loss": -28.344680786132812, "global_step": 648189, "epoch": 7809} {"train_loss": -28.28740882873535, "global_step": 648190, "epoch": 7809} {"train_loss": -28.44170570373535, "global_step": 648191, "epoch": 7809} {"train_loss": -28.306610107421875, "global_step": 648192, "epoch": 7809} {"train_loss": -28.53031349182129, "global_step": 648193, "epoch": 7809} {"train_loss": -28.254154205322266, "global_step": 648194, "epoch": 7809} {"train_loss": -28.11258888244629, "global_step": 648195, "epoch": 7809} {"train_loss": -27.99515151977539, "global_step": 648196, "epoch": 7809} {"train_loss": -28.072980880737305, "global_step": 648197, "epoch": 7809} {"train_loss": -28.46441650390625, "global_step": 648198, "epoch": 7809} {"train_loss": -28.49492835998535, "global_step": 648199, "epoch": 7809} {"train_loss": -28.631967544555664, "global_step": 648200, "epoch": 7809} {"train_loss": -28.53240394592285, "global_step": 648201, "epoch": 7809} {"train_loss": -28.080846786499023, "global_step": 648202, "epoch": 7809} {"train_loss": -28.55615234375, "global_step": 648203, "epoch": 7809} {"train_loss": -28.342426300048828, "global_step": 648204, "epoch": 7809} {"train_loss": -28.375974655151367, "global_step": 648205, "epoch": 7809} {"train_loss": -28.39914894104004, "global_step": 648206, "epoch": 7809} {"train_loss": -28.36785888671875, "global_step": 648207, "epoch": 7809} {"train_loss": -28.607772827148438, "global_step": 648208, "epoch": 7809} {"train_loss": -28.58220863342285, "global_step": 648209, "epoch": 7809} {"train_loss": -28.51849937438965, "global_step": 648210, "epoch": 7809} {"train_loss": -28.3046817779541, "global_step": 648211, "epoch": 7809} {"train_loss": -28.27032470703125, "global_step": 648212, "epoch": 7809} {"train_loss": -28.433691024780273, "global_step": 648213, "epoch": 7809} {"train_loss": -27.71736717224121, "global_step": 648214, "epoch": 7809} {"train_loss": -28.521142959594727, "global_step": 648215, "epoch": 7809} {"train_loss": -28.63680076599121, "global_step": 648216, "epoch": 7809} {"train_loss": -28.41108512878418, "global_step": 648217, "epoch": 7809} {"train_loss": -28.086408615112305, "global_step": 648218, "epoch": 7809} {"train_loss": -28.16193199157715, "global_step": 648219, "epoch": 7809} {"train_loss": -27.970239639282227, "global_step": 648220, "epoch": 7809} {"train_loss": -28.183820724487305, "global_step": 648221, "epoch": 7809} {"train_loss": -28.327564239501953, "global_step": 648222, "epoch": 7809} {"train_loss": -28.33035659790039, "global_step": 648223, "epoch": 7809} {"train_loss": -28.396198272705078, "global_step": 648224, "epoch": 7809} {"train_loss": -28.034454345703125, "global_step": 648225, "epoch": 7809} {"train_loss": -28.691577911376953, "global_step": 648226, "epoch": 7809} {"train_loss": -28.362817764282227, "global_step": 648227, "epoch": 7809} {"train_loss": -28.839941024780273, "global_step": 648228, "epoch": 7809} {"train_loss": -28.093103110072125, "global_step": 648229, "epoch": 7809, "val_loss": 6647888.5} {"train_loss": -28.4450626373291, "global_step": 648230, "epoch": 7810} {"train_loss": -28.402673721313477, "global_step": 648231, "epoch": 7810} {"train_loss": -27.852880477905273, "global_step": 648232, "epoch": 7810} {"train_loss": -27.344186782836914, "global_step": 648233, "epoch": 7810} {"train_loss": -28.332950592041016, "global_step": 648234, "epoch": 7810} {"train_loss": -28.194400787353516, "global_step": 648235, "epoch": 7810} {"train_loss": -27.571823120117188, "global_step": 648236, "epoch": 7810} {"train_loss": -27.574554443359375, "global_step": 648237, "epoch": 7810} {"train_loss": -27.48483657836914, "global_step": 648238, "epoch": 7810} {"train_loss": -28.257007598876953, "global_step": 648239, "epoch": 7810} {"train_loss": -27.615278244018555, "global_step": 648240, "epoch": 7810} {"train_loss": -28.041034698486328, "global_step": 648241, "epoch": 7810} {"train_loss": -28.085296630859375, "global_step": 648242, "epoch": 7810} {"train_loss": -28.28981590270996, "global_step": 648243, "epoch": 7810} {"train_loss": -28.010812759399414, "global_step": 648244, "epoch": 7810} {"train_loss": -28.143878936767578, "global_step": 648245, "epoch": 7810} {"train_loss": -28.099720001220703, "global_step": 648246, "epoch": 7810} {"train_loss": -28.228805541992188, "global_step": 648247, "epoch": 7810} {"train_loss": -28.029150009155273, "global_step": 648248, "epoch": 7810} {"train_loss": -28.10564613342285, "global_step": 648249, "epoch": 7810} {"train_loss": -28.63689613342285, "global_step": 648250, "epoch": 7810} {"train_loss": -28.123151779174805, "global_step": 648251, "epoch": 7810} {"train_loss": -27.993757247924805, "global_step": 648252, "epoch": 7810} {"train_loss": -28.825031280517578, "global_step": 648253, "epoch": 7810} {"train_loss": -28.289274215698242, "global_step": 648254, "epoch": 7810} {"train_loss": -28.442941665649414, "global_step": 648255, "epoch": 7810} {"train_loss": -28.491674423217773, "global_step": 648256, "epoch": 7810} {"train_loss": -28.08888053894043, "global_step": 648257, "epoch": 7810} {"train_loss": -28.172821044921875, "global_step": 648258, "epoch": 7810} {"train_loss": -28.30517578125, "global_step": 648259, "epoch": 7810} {"train_loss": -28.306432723999023, "global_step": 648260, "epoch": 7810} {"train_loss": -28.540979385375977, "global_step": 648261, "epoch": 7810} {"train_loss": -28.162973403930664, "global_step": 648262, "epoch": 7810} {"train_loss": -27.99614906311035, "global_step": 648263, "epoch": 7810} {"train_loss": -28.405187606811523, "global_step": 648264, "epoch": 7810} {"train_loss": -28.093809127807617, "global_step": 648265, "epoch": 7810} {"train_loss": -28.165023803710938, "global_step": 648266, "epoch": 7810} {"train_loss": -28.27326774597168, "global_step": 648267, "epoch": 7810} {"train_loss": -28.210941314697266, "global_step": 648268, "epoch": 7810} {"train_loss": -28.577680587768555, "global_step": 648269, "epoch": 7810} {"train_loss": -28.280847549438477, "global_step": 648270, "epoch": 7810} {"train_loss": -28.096281051635742, "global_step": 648271, "epoch": 7810} {"train_loss": -28.683435440063477, "global_step": 648272, "epoch": 7810} {"train_loss": -28.607318878173828, "global_step": 648273, "epoch": 7810} {"train_loss": -28.009931564331055, "global_step": 648274, "epoch": 7810} {"train_loss": -28.35628318786621, "global_step": 648275, "epoch": 7810} {"train_loss": -28.25870704650879, "global_step": 648276, "epoch": 7810} {"train_loss": -28.263036727905273, "global_step": 648277, "epoch": 7810} {"train_loss": -28.52651023864746, "global_step": 648278, "epoch": 7810} {"train_loss": -28.203094482421875, "global_step": 648279, "epoch": 7810} {"train_loss": -28.34036636352539, "global_step": 648280, "epoch": 7810} {"train_loss": -28.430017471313477, "global_step": 648281, "epoch": 7810} {"train_loss": -28.37078285217285, "global_step": 648282, "epoch": 7810} {"train_loss": -28.353551864624023, "global_step": 648283, "epoch": 7810} {"train_loss": -28.259174346923828, "global_step": 648284, "epoch": 7810} {"train_loss": -28.394567489624023, "global_step": 648285, "epoch": 7810} {"train_loss": -28.709516525268555, "global_step": 648286, "epoch": 7810} {"train_loss": -28.4942626953125, "global_step": 648287, "epoch": 7810} {"train_loss": -28.56074333190918, "global_step": 648288, "epoch": 7810} {"train_loss": -28.416034698486328, "global_step": 648289, "epoch": 7810} {"train_loss": -28.743972778320312, "global_step": 648290, "epoch": 7810} {"train_loss": -28.6163387298584, "global_step": 648291, "epoch": 7810} {"train_loss": -28.734939575195312, "global_step": 648292, "epoch": 7810} {"train_loss": -28.872785568237305, "global_step": 648293, "epoch": 7810} {"train_loss": -28.200284957885742, "global_step": 648294, "epoch": 7810} {"train_loss": -29.105871200561523, "global_step": 648295, "epoch": 7810} {"train_loss": -28.70123291015625, "global_step": 648296, "epoch": 7810} {"train_loss": -28.317785263061523, "global_step": 648297, "epoch": 7810} {"train_loss": -27.933462142944336, "global_step": 648298, "epoch": 7810} {"train_loss": -26.72491455078125, "global_step": 648299, "epoch": 7810} {"train_loss": -22.950305938720703, "global_step": 648300, "epoch": 7810} {"train_loss": -20.57949447631836, "global_step": 648301, "epoch": 7810} {"train_loss": -25.884607315063477, "global_step": 648302, "epoch": 7810} {"train_loss": -26.504535675048828, "global_step": 648303, "epoch": 7810} {"train_loss": -26.792724609375, "global_step": 648304, "epoch": 7810} {"train_loss": -26.53754997253418, "global_step": 648305, "epoch": 7810} {"train_loss": -26.890050888061523, "global_step": 648306, "epoch": 7810} {"train_loss": -26.6893253326416, "global_step": 648307, "epoch": 7810} {"train_loss": -26.212812423706055, "global_step": 648308, "epoch": 7810} {"train_loss": -27.77666664123535, "global_step": 648309, "epoch": 7810} {"train_loss": -26.859399795532227, "global_step": 648310, "epoch": 7810} {"train_loss": -27.115631103515625, "global_step": 648311, "epoch": 7810} {"train_loss": -27.90373880317412, "global_step": 648312, "epoch": 7810, "val_loss": 6724932.0} {"train_loss": -27.387439727783203, "global_step": 648313, "epoch": 7811} {"train_loss": -26.658899307250977, "global_step": 648314, "epoch": 7811} {"train_loss": -26.8028564453125, "global_step": 648315, "epoch": 7811} {"train_loss": -27.121734619140625, "global_step": 648316, "epoch": 7811} {"train_loss": -27.02874755859375, "global_step": 648317, "epoch": 7811} {"train_loss": -26.661725997924805, "global_step": 648318, "epoch": 7811} {"train_loss": -27.182083129882812, "global_step": 648319, "epoch": 7811} {"train_loss": -26.951990127563477, "global_step": 648320, "epoch": 7811} {"train_loss": -27.395090103149414, "global_step": 648321, "epoch": 7811} {"train_loss": -27.072437286376953, "global_step": 648322, "epoch": 7811} {"train_loss": -27.262903213500977, "global_step": 648323, "epoch": 7811} {"train_loss": -27.085729598999023, "global_step": 648324, "epoch": 7811} {"train_loss": -26.847625732421875, "global_step": 648325, "epoch": 7811} {"train_loss": -27.31251335144043, "global_step": 648326, "epoch": 7811} {"train_loss": -27.795637130737305, "global_step": 648327, "epoch": 7811} {"train_loss": -26.905292510986328, "global_step": 648328, "epoch": 7811} {"train_loss": -27.186735153198242, "global_step": 648329, "epoch": 7811} {"train_loss": -27.30615234375, "global_step": 648330, "epoch": 7811} {"train_loss": -27.84942626953125, "global_step": 648331, "epoch": 7811} {"train_loss": -27.538131713867188, "global_step": 648332, "epoch": 7811} {"train_loss": -27.653039932250977, "global_step": 648333, "epoch": 7811} {"train_loss": -27.724761962890625, "global_step": 648334, "epoch": 7811} {"train_loss": -27.232330322265625, "global_step": 648335, "epoch": 7811} {"train_loss": -27.724990844726562, "global_step": 648336, "epoch": 7811} {"train_loss": -27.961103439331055, "global_step": 648337, "epoch": 7811} {"train_loss": -27.873065948486328, "global_step": 648338, "epoch": 7811} {"train_loss": -28.071958541870117, "global_step": 648339, "epoch": 7811} {"train_loss": -27.716266632080078, "global_step": 648340, "epoch": 7811} {"train_loss": -27.91008949279785, "global_step": 648341, "epoch": 7811} {"train_loss": -27.9033260345459, "global_step": 648342, "epoch": 7811} {"train_loss": -27.95832633972168, "global_step": 648343, "epoch": 7811} {"train_loss": -27.949731826782227, "global_step": 648344, "epoch": 7811} {"train_loss": -27.960752487182617, "global_step": 648345, "epoch": 7811} {"train_loss": -27.973913192749023, "global_step": 648346, "epoch": 7811} {"train_loss": -27.8082218170166, "global_step": 648347, "epoch": 7811} {"train_loss": -28.083398818969727, "global_step": 648348, "epoch": 7811} {"train_loss": -28.255884170532227, "global_step": 648349, "epoch": 7811} {"train_loss": -28.414575576782227, "global_step": 648350, "epoch": 7811} {"train_loss": -27.76774024963379, "global_step": 648351, "epoch": 7811} {"train_loss": -28.197874069213867, "global_step": 648352, "epoch": 7811} {"train_loss": -27.8686580657959, "global_step": 648353, "epoch": 7811} {"train_loss": -28.447296142578125, "global_step": 648354, "epoch": 7811} {"train_loss": -28.212268829345703, "global_step": 648355, "epoch": 7811} {"train_loss": -28.29339599609375, "global_step": 648356, "epoch": 7811} {"train_loss": -27.947717666625977, "global_step": 648357, "epoch": 7811} {"train_loss": -28.241125106811523, "global_step": 648358, "epoch": 7811} {"train_loss": -27.9295597076416, "global_step": 648359, "epoch": 7811} {"train_loss": -28.707813262939453, "global_step": 648360, "epoch": 7811} {"train_loss": -28.397741317749023, "global_step": 648361, "epoch": 7811} {"train_loss": -28.561086654663086, "global_step": 648362, "epoch": 7811} {"train_loss": -28.135726928710938, "global_step": 648363, "epoch": 7811} {"train_loss": -28.13945960998535, "global_step": 648364, "epoch": 7811} {"train_loss": -28.1265869140625, "global_step": 648365, "epoch": 7811} {"train_loss": -28.167882919311523, "global_step": 648366, "epoch": 7811} {"train_loss": -28.104877471923828, "global_step": 648367, "epoch": 7811} {"train_loss": -28.262922286987305, "global_step": 648368, "epoch": 7811} {"train_loss": -28.098913192749023, "global_step": 648369, "epoch": 7811} {"train_loss": -28.232147216796875, "global_step": 648370, "epoch": 7811} {"train_loss": -28.1513729095459, "global_step": 648371, "epoch": 7811} {"train_loss": -28.741455078125, "global_step": 648372, "epoch": 7811} {"train_loss": -28.095748901367188, "global_step": 648373, "epoch": 7811} {"train_loss": -27.892227172851562, "global_step": 648374, "epoch": 7811} {"train_loss": -27.600046157836914, "global_step": 648375, "epoch": 7811} {"train_loss": -27.207494735717773, "global_step": 648376, "epoch": 7811} {"train_loss": -27.58404541015625, "global_step": 648377, "epoch": 7811} {"train_loss": -27.68924903869629, "global_step": 648378, "epoch": 7811} {"train_loss": -28.16069984436035, "global_step": 648379, "epoch": 7811} {"train_loss": -28.1735782623291, "global_step": 648380, "epoch": 7811} {"train_loss": -28.148035049438477, "global_step": 648381, "epoch": 7811} {"train_loss": -28.134185791015625, "global_step": 648382, "epoch": 7811} {"train_loss": -28.190078735351562, "global_step": 648383, "epoch": 7811} {"train_loss": -27.906036376953125, "global_step": 648384, "epoch": 7811} {"train_loss": -27.899816513061523, "global_step": 648385, "epoch": 7811} {"train_loss": -27.80240249633789, "global_step": 648386, "epoch": 7811} {"train_loss": -28.4715633392334, "global_step": 648387, "epoch": 7811} {"train_loss": -28.29608726501465, "global_step": 648388, "epoch": 7811} {"train_loss": -28.146987915039062, "global_step": 648389, "epoch": 7811} {"train_loss": -28.16432762145996, "global_step": 648390, "epoch": 7811} {"train_loss": -27.987323760986328, "global_step": 648391, "epoch": 7811} {"train_loss": -28.24981689453125, "global_step": 648392, "epoch": 7811} {"train_loss": -28.40435791015625, "global_step": 648393, "epoch": 7811} {"train_loss": -28.035531997680664, "global_step": 648394, "epoch": 7811} {"train_loss": -27.843102351728692, "global_step": 648395, "epoch": 7811, "val_loss": 6652284.0} {"train_loss": -27.561147689819336, "global_step": 648396, "epoch": 7812} {"train_loss": -27.789709091186523, "global_step": 648397, "epoch": 7812} {"train_loss": -27.807737350463867, "global_step": 648398, "epoch": 7812} {"train_loss": -28.057119369506836, "global_step": 648399, "epoch": 7812} {"train_loss": -27.79339027404785, "global_step": 648400, "epoch": 7812} {"train_loss": -27.78902244567871, "global_step": 648401, "epoch": 7812} {"train_loss": -27.96416664123535, "global_step": 648402, "epoch": 7812} {"train_loss": -28.336034774780273, "global_step": 648403, "epoch": 7812} {"train_loss": -28.405303955078125, "global_step": 648404, "epoch": 7812} {"train_loss": -28.05592155456543, "global_step": 648405, "epoch": 7812} {"train_loss": -27.909595489501953, "global_step": 648406, "epoch": 7812} {"train_loss": -28.322559356689453, "global_step": 648407, "epoch": 7812} {"train_loss": -28.224018096923828, "global_step": 648408, "epoch": 7812} {"train_loss": -28.460981369018555, "global_step": 648409, "epoch": 7812} {"train_loss": -28.20229148864746, "global_step": 648410, "epoch": 7812} {"train_loss": -28.11406898498535, "global_step": 648411, "epoch": 7812} {"train_loss": -27.957738876342773, "global_step": 648412, "epoch": 7812} {"train_loss": -27.996999740600586, "global_step": 648413, "epoch": 7812} {"train_loss": -28.338964462280273, "global_step": 648414, "epoch": 7812} {"train_loss": -28.4865665435791, "global_step": 648415, "epoch": 7812} {"train_loss": -28.21807861328125, "global_step": 648416, "epoch": 7812} {"train_loss": -28.141096115112305, "global_step": 648417, "epoch": 7812} {"train_loss": -28.22959327697754, "global_step": 648418, "epoch": 7812} {"train_loss": -28.260711669921875, "global_step": 648419, "epoch": 7812} {"train_loss": -28.193078994750977, "global_step": 648420, "epoch": 7812} {"train_loss": -28.393692016601562, "global_step": 648421, "epoch": 7812} {"train_loss": -28.4210147857666, "global_step": 648422, "epoch": 7812} {"train_loss": -28.245786666870117, "global_step": 648423, "epoch": 7812} {"train_loss": -28.408267974853516, "global_step": 648424, "epoch": 7812} {"train_loss": -28.612253189086914, "global_step": 648425, "epoch": 7812} {"train_loss": -28.67441177368164, "global_step": 648426, "epoch": 7812} {"train_loss": -28.370849609375, "global_step": 648427, "epoch": 7812} {"train_loss": -28.473560333251953, "global_step": 648428, "epoch": 7812} {"train_loss": -28.512449264526367, "global_step": 648429, "epoch": 7812} {"train_loss": -28.245283126831055, "global_step": 648430, "epoch": 7812} {"train_loss": -28.229276657104492, "global_step": 648431, "epoch": 7812} {"train_loss": -28.834125518798828, "global_step": 648432, "epoch": 7812} {"train_loss": -28.698566436767578, "global_step": 648433, "epoch": 7812} {"train_loss": -28.490270614624023, "global_step": 648434, "epoch": 7812} {"train_loss": -28.38641929626465, "global_step": 648435, "epoch": 7812} {"train_loss": -28.5091609954834, "global_step": 648436, "epoch": 7812} {"train_loss": -28.744306564331055, "global_step": 648437, "epoch": 7812} {"train_loss": -28.520343780517578, "global_step": 648438, "epoch": 7812} {"train_loss": -28.74370765686035, "global_step": 648439, "epoch": 7812} {"train_loss": -28.68462562561035, "global_step": 648440, "epoch": 7812} {"train_loss": -28.39057731628418, "global_step": 648441, "epoch": 7812} {"train_loss": -28.520893096923828, "global_step": 648442, "epoch": 7812} {"train_loss": -28.70383644104004, "global_step": 648443, "epoch": 7812} {"train_loss": -28.484909057617188, "global_step": 648444, "epoch": 7812} {"train_loss": -28.59238052368164, "global_step": 648445, "epoch": 7812} {"train_loss": -28.658178329467773, "global_step": 648446, "epoch": 7812} {"train_loss": -28.374103546142578, "global_step": 648447, "epoch": 7812} {"train_loss": -28.381574630737305, "global_step": 648448, "epoch": 7812} {"train_loss": -28.354068756103516, "global_step": 648449, "epoch": 7812} {"train_loss": -28.275222778320312, "global_step": 648450, "epoch": 7812} {"train_loss": -27.932571411132812, "global_step": 648451, "epoch": 7812} {"train_loss": -27.26393699645996, "global_step": 648452, "epoch": 7812} {"train_loss": -27.733076095581055, "global_step": 648453, "epoch": 7812} {"train_loss": -28.185134887695312, "global_step": 648454, "epoch": 7812} {"train_loss": -28.1251163482666, "global_step": 648455, "epoch": 7812} {"train_loss": -27.992206573486328, "global_step": 648456, "epoch": 7812} {"train_loss": -28.407062530517578, "global_step": 648457, "epoch": 7812} {"train_loss": -27.82533073425293, "global_step": 648458, "epoch": 7812} {"train_loss": -28.275653839111328, "global_step": 648459, "epoch": 7812} {"train_loss": -28.324323654174805, "global_step": 648460, "epoch": 7812} {"train_loss": -28.57349967956543, "global_step": 648461, "epoch": 7812} {"train_loss": -28.321775436401367, "global_step": 648462, "epoch": 7812} {"train_loss": -27.79324722290039, "global_step": 648463, "epoch": 7812} {"train_loss": -28.42262077331543, "global_step": 648464, "epoch": 7812} {"train_loss": -28.37476921081543, "global_step": 648465, "epoch": 7812} {"train_loss": -28.0036563873291, "global_step": 648466, "epoch": 7812} {"train_loss": -28.22456932067871, "global_step": 648467, "epoch": 7812} {"train_loss": -27.9428653717041, "global_step": 648468, "epoch": 7812} {"train_loss": -28.172189712524414, "global_step": 648469, "epoch": 7812} {"train_loss": -28.6009521484375, "global_step": 648470, "epoch": 7812} {"train_loss": -28.68507194519043, "global_step": 648471, "epoch": 7812} {"train_loss": -28.45233154296875, "global_step": 648472, "epoch": 7812} {"train_loss": -28.452619552612305, "global_step": 648473, "epoch": 7812} {"train_loss": -28.109155654907227, "global_step": 648474, "epoch": 7812} {"train_loss": -28.238636016845703, "global_step": 648475, "epoch": 7812} {"train_loss": -28.05337905883789, "global_step": 648476, "epoch": 7812} {"train_loss": -28.2528018951416, "global_step": 648477, "epoch": 7812} {"train_loss": -28.26693160275379, "global_step": 648478, "epoch": 7812, "val_loss": 6656673.0} {"train_loss": -28.255712509155273, "global_step": 648479, "epoch": 7813} {"train_loss": -27.96766471862793, "global_step": 648480, "epoch": 7813} {"train_loss": -27.856231689453125, "global_step": 648481, "epoch": 7813} {"train_loss": -28.085657119750977, "global_step": 648482, "epoch": 7813} {"train_loss": -28.223066329956055, "global_step": 648483, "epoch": 7813} {"train_loss": -27.821685791015625, "global_step": 648484, "epoch": 7813} {"train_loss": -27.461380004882812, "global_step": 648485, "epoch": 7813} {"train_loss": -28.341718673706055, "global_step": 648486, "epoch": 7813} {"train_loss": -27.76498794555664, "global_step": 648487, "epoch": 7813} {"train_loss": -28.218896865844727, "global_step": 648488, "epoch": 7813} {"train_loss": -28.21479606628418, "global_step": 648489, "epoch": 7813} {"train_loss": -28.491596221923828, "global_step": 648490, "epoch": 7813} {"train_loss": -28.201141357421875, "global_step": 648491, "epoch": 7813} {"train_loss": -28.020029067993164, "global_step": 648492, "epoch": 7813} {"train_loss": -27.833770751953125, "global_step": 648493, "epoch": 7813} {"train_loss": -28.17169761657715, "global_step": 648494, "epoch": 7813} {"train_loss": -28.186620712280273, "global_step": 648495, "epoch": 7813} {"train_loss": -28.547327041625977, "global_step": 648496, "epoch": 7813} {"train_loss": -28.1632137298584, "global_step": 648497, "epoch": 7813} {"train_loss": -28.388830184936523, "global_step": 648498, "epoch": 7813} {"train_loss": -28.435575485229492, "global_step": 648499, "epoch": 7813} {"train_loss": -28.274763107299805, "global_step": 648500, "epoch": 7813} {"train_loss": -28.430387496948242, "global_step": 648501, "epoch": 7813} {"train_loss": -28.759031295776367, "global_step": 648502, "epoch": 7813} {"train_loss": -28.375852584838867, "global_step": 648503, "epoch": 7813} {"train_loss": -28.21282958984375, "global_step": 648504, "epoch": 7813} {"train_loss": -28.354907989501953, "global_step": 648505, "epoch": 7813} {"train_loss": -28.61773681640625, "global_step": 648506, "epoch": 7813} {"train_loss": -29.01470375061035, "global_step": 648507, "epoch": 7813} {"train_loss": -28.473602294921875, "global_step": 648508, "epoch": 7813} {"train_loss": -28.70074462890625, "global_step": 648509, "epoch": 7813} {"train_loss": -28.858722686767578, "global_step": 648510, "epoch": 7813} {"train_loss": -28.35064125061035, "global_step": 648511, "epoch": 7813} {"train_loss": -28.520553588867188, "global_step": 648512, "epoch": 7813} {"train_loss": -28.47444725036621, "global_step": 648513, "epoch": 7813} {"train_loss": -28.77402687072754, "global_step": 648514, "epoch": 7813} {"train_loss": -28.212936401367188, "global_step": 648515, "epoch": 7813} {"train_loss": -28.365259170532227, "global_step": 648516, "epoch": 7813} {"train_loss": -28.89145278930664, "global_step": 648517, "epoch": 7813} {"train_loss": -28.635700225830078, "global_step": 648518, "epoch": 7813} {"train_loss": -28.267744064331055, "global_step": 648519, "epoch": 7813} {"train_loss": -28.359601974487305, "global_step": 648520, "epoch": 7813} {"train_loss": -28.884906768798828, "global_step": 648521, "epoch": 7813} {"train_loss": -28.3327579498291, "global_step": 648522, "epoch": 7813} {"train_loss": -28.691675186157227, "global_step": 648523, "epoch": 7813} {"train_loss": -28.29374122619629, "global_step": 648524, "epoch": 7813} {"train_loss": -28.05068016052246, "global_step": 648525, "epoch": 7813} {"train_loss": -28.487043380737305, "global_step": 648526, "epoch": 7813} {"train_loss": -28.339797973632812, "global_step": 648527, "epoch": 7813} {"train_loss": -28.050128936767578, "global_step": 648528, "epoch": 7813} {"train_loss": -28.137937545776367, "global_step": 648529, "epoch": 7813} {"train_loss": -28.856714248657227, "global_step": 648530, "epoch": 7813} {"train_loss": -27.8414306640625, "global_step": 648531, "epoch": 7813} {"train_loss": -28.52303123474121, "global_step": 648532, "epoch": 7813} {"train_loss": -27.918115615844727, "global_step": 648533, "epoch": 7813} {"train_loss": -28.2025146484375, "global_step": 648534, "epoch": 7813} {"train_loss": -28.140308380126953, "global_step": 648535, "epoch": 7813} {"train_loss": -28.269947052001953, "global_step": 648536, "epoch": 7813} {"train_loss": -28.469030380249023, "global_step": 648537, "epoch": 7813} {"train_loss": -28.162006378173828, "global_step": 648538, "epoch": 7813} {"train_loss": -28.77195167541504, "global_step": 648539, "epoch": 7813} {"train_loss": -28.62506103515625, "global_step": 648540, "epoch": 7813} {"train_loss": -28.097787857055664, "global_step": 648541, "epoch": 7813} {"train_loss": -28.433130264282227, "global_step": 648542, "epoch": 7813} {"train_loss": -28.2391300201416, "global_step": 648543, "epoch": 7813} {"train_loss": -27.918012619018555, "global_step": 648544, "epoch": 7813} {"train_loss": -28.30784034729004, "global_step": 648545, "epoch": 7813} {"train_loss": -28.121244430541992, "global_step": 648546, "epoch": 7813} {"train_loss": -28.0635986328125, "global_step": 648547, "epoch": 7813} {"train_loss": -28.2369441986084, "global_step": 648548, "epoch": 7813} {"train_loss": -28.209701538085938, "global_step": 648549, "epoch": 7813} {"train_loss": -28.6143741607666, "global_step": 648550, "epoch": 7813} {"train_loss": -28.25714683532715, "global_step": 648551, "epoch": 7813} {"train_loss": -28.315881729125977, "global_step": 648552, "epoch": 7813} {"train_loss": -28.524621963500977, "global_step": 648553, "epoch": 7813} {"train_loss": -28.6999454498291, "global_step": 648554, "epoch": 7813} {"train_loss": -28.405424118041992, "global_step": 648555, "epoch": 7813} {"train_loss": -28.060697555541992, "global_step": 648556, "epoch": 7813} {"train_loss": -28.396326065063477, "global_step": 648557, "epoch": 7813} {"train_loss": -28.604124069213867, "global_step": 648558, "epoch": 7813} {"train_loss": -28.228134155273438, "global_step": 648559, "epoch": 7813} {"train_loss": -28.43538475036621, "global_step": 648560, "epoch": 7813} {"train_loss": -28.345622970397216, "global_step": 648561, "epoch": 7813, "val_loss": 6647855.0} {"train_loss": -27.54740333557129, "global_step": 648562, "epoch": 7814} {"train_loss": -26.58894157409668, "global_step": 648563, "epoch": 7814} {"train_loss": -27.07716178894043, "global_step": 648564, "epoch": 7814} {"train_loss": -27.254199981689453, "global_step": 648565, "epoch": 7814} {"train_loss": -27.503498077392578, "global_step": 648566, "epoch": 7814} {"train_loss": -26.0516357421875, "global_step": 648567, "epoch": 7814} {"train_loss": -28.38510513305664, "global_step": 648568, "epoch": 7814} {"train_loss": -27.467823028564453, "global_step": 648569, "epoch": 7814} {"train_loss": -27.49757194519043, "global_step": 648570, "epoch": 7814} {"train_loss": -27.6314697265625, "global_step": 648571, "epoch": 7814} {"train_loss": -27.114044189453125, "global_step": 648572, "epoch": 7814} {"train_loss": -28.13067626953125, "global_step": 648573, "epoch": 7814} {"train_loss": -27.485645294189453, "global_step": 648574, "epoch": 7814} {"train_loss": -28.08685302734375, "global_step": 648575, "epoch": 7814} {"train_loss": -27.579919815063477, "global_step": 648576, "epoch": 7814} {"train_loss": -27.91407585144043, "global_step": 648577, "epoch": 7814} {"train_loss": -27.720504760742188, "global_step": 648578, "epoch": 7814} {"train_loss": -27.662261962890625, "global_step": 648579, "epoch": 7814} {"train_loss": -27.909744262695312, "global_step": 648580, "epoch": 7814} {"train_loss": -27.56487464904785, "global_step": 648581, "epoch": 7814} {"train_loss": -27.906763076782227, "global_step": 648582, "epoch": 7814} {"train_loss": -27.450342178344727, "global_step": 648583, "epoch": 7814} {"train_loss": -28.048053741455078, "global_step": 648584, "epoch": 7814} {"train_loss": -28.035608291625977, "global_step": 648585, "epoch": 7814} {"train_loss": -27.721271514892578, "global_step": 648586, "epoch": 7814} {"train_loss": -28.097675323486328, "global_step": 648587, "epoch": 7814} {"train_loss": -28.17133140563965, "global_step": 648588, "epoch": 7814} {"train_loss": -27.682153701782227, "global_step": 648589, "epoch": 7814} {"train_loss": -28.163711547851562, "global_step": 648590, "epoch": 7814} {"train_loss": -28.143903732299805, "global_step": 648591, "epoch": 7814} {"train_loss": -27.8408260345459, "global_step": 648592, "epoch": 7814} {"train_loss": -28.60565185546875, "global_step": 648593, "epoch": 7814} {"train_loss": -27.68063735961914, "global_step": 648594, "epoch": 7814} {"train_loss": -28.205368041992188, "global_step": 648595, "epoch": 7814} {"train_loss": -27.84783935546875, "global_step": 648596, "epoch": 7814} {"train_loss": -28.27020835876465, "global_step": 648597, "epoch": 7814} {"train_loss": -28.273550033569336, "global_step": 648598, "epoch": 7814} {"train_loss": -28.437484741210938, "global_step": 648599, "epoch": 7814} {"train_loss": -28.48040199279785, "global_step": 648600, "epoch": 7814} {"train_loss": -27.74183464050293, "global_step": 648601, "epoch": 7814} {"train_loss": -28.1586971282959, "global_step": 648602, "epoch": 7814} {"train_loss": -28.319665908813477, "global_step": 648603, "epoch": 7814} {"train_loss": -28.25274658203125, "global_step": 648604, "epoch": 7814} {"train_loss": -28.664533615112305, "global_step": 648605, "epoch": 7814} {"train_loss": -28.15620231628418, "global_step": 648606, "epoch": 7814} {"train_loss": -28.265548706054688, "global_step": 648607, "epoch": 7814} {"train_loss": -28.269287109375, "global_step": 648608, "epoch": 7814} {"train_loss": -28.152135848999023, "global_step": 648609, "epoch": 7814} {"train_loss": -28.188940048217773, "global_step": 648610, "epoch": 7814} {"train_loss": -28.4537410736084, "global_step": 648611, "epoch": 7814} {"train_loss": -28.323118209838867, "global_step": 648612, "epoch": 7814} {"train_loss": -28.219701766967773, "global_step": 648613, "epoch": 7814} {"train_loss": -28.5765323638916, "global_step": 648614, "epoch": 7814} {"train_loss": -28.2598934173584, "global_step": 648615, "epoch": 7814} {"train_loss": -27.783960342407227, "global_step": 648616, "epoch": 7814} {"train_loss": -27.983264923095703, "global_step": 648617, "epoch": 7814} {"train_loss": -27.956174850463867, "global_step": 648618, "epoch": 7814} {"train_loss": -27.925012588500977, "global_step": 648619, "epoch": 7814} {"train_loss": -27.907470703125, "global_step": 648620, "epoch": 7814} {"train_loss": -27.83698844909668, "global_step": 648621, "epoch": 7814} {"train_loss": -28.185806274414062, "global_step": 648622, "epoch": 7814} {"train_loss": -28.8056640625, "global_step": 648623, "epoch": 7814} {"train_loss": -28.20037269592285, "global_step": 648624, "epoch": 7814} {"train_loss": -28.189767837524414, "global_step": 648625, "epoch": 7814} {"train_loss": -28.346729278564453, "global_step": 648626, "epoch": 7814} {"train_loss": -28.164037704467773, "global_step": 648627, "epoch": 7814} {"train_loss": -28.804162979125977, "global_step": 648628, "epoch": 7814} {"train_loss": -28.33064842224121, "global_step": 648629, "epoch": 7814} {"train_loss": -28.593799591064453, "global_step": 648630, "epoch": 7814} {"train_loss": -28.686437606811523, "global_step": 648631, "epoch": 7814} {"train_loss": -28.592670440673828, "global_step": 648632, "epoch": 7814} {"train_loss": -28.095523834228516, "global_step": 648633, "epoch": 7814} {"train_loss": -28.553375244140625, "global_step": 648634, "epoch": 7814} {"train_loss": -28.509164810180664, "global_step": 648635, "epoch": 7814} {"train_loss": -28.539600372314453, "global_step": 648636, "epoch": 7814} {"train_loss": -28.7725887298584, "global_step": 648637, "epoch": 7814} {"train_loss": -28.700719833374023, "global_step": 648638, "epoch": 7814} {"train_loss": -28.433332443237305, "global_step": 648639, "epoch": 7814} {"train_loss": -28.57020378112793, "global_step": 648640, "epoch": 7814} {"train_loss": -28.702075958251953, "global_step": 648641, "epoch": 7814} {"train_loss": -28.166126251220703, "global_step": 648642, "epoch": 7814} {"train_loss": -28.600610733032227, "global_step": 648643, "epoch": 7814} {"train_loss": -28.055668727461114, "global_step": 648644, "epoch": 7814, "val_loss": 6714620.0} {"train_loss": -27.211084365844727, "global_step": 648645, "epoch": 7815} {"train_loss": -25.747900009155273, "global_step": 648646, "epoch": 7815} {"train_loss": -26.437768936157227, "global_step": 648647, "epoch": 7815} {"train_loss": -27.3791446685791, "global_step": 648648, "epoch": 7815} {"train_loss": -27.781919479370117, "global_step": 648649, "epoch": 7815} {"train_loss": -26.913740158081055, "global_step": 648650, "epoch": 7815} {"train_loss": -27.603473663330078, "global_step": 648651, "epoch": 7815} {"train_loss": -27.8045654296875, "global_step": 648652, "epoch": 7815} {"train_loss": -28.253280639648438, "global_step": 648653, "epoch": 7815} {"train_loss": -27.928770065307617, "global_step": 648654, "epoch": 7815} {"train_loss": -27.989124298095703, "global_step": 648655, "epoch": 7815} {"train_loss": -27.8536376953125, "global_step": 648656, "epoch": 7815} {"train_loss": -28.0783634185791, "global_step": 648657, "epoch": 7815} {"train_loss": -27.795429229736328, "global_step": 648658, "epoch": 7815} {"train_loss": -28.001062393188477, "global_step": 648659, "epoch": 7815} {"train_loss": -27.760589599609375, "global_step": 648660, "epoch": 7815} {"train_loss": -28.048675537109375, "global_step": 648661, "epoch": 7815} {"train_loss": -28.695606231689453, "global_step": 648662, "epoch": 7815} {"train_loss": -28.324462890625, "global_step": 648663, "epoch": 7815} {"train_loss": -27.964391708374023, "global_step": 648664, "epoch": 7815} {"train_loss": -28.256072998046875, "global_step": 648665, "epoch": 7815} {"train_loss": -28.614957809448242, "global_step": 648666, "epoch": 7815} {"train_loss": -28.204944610595703, "global_step": 648667, "epoch": 7815} {"train_loss": -28.629322052001953, "global_step": 648668, "epoch": 7815} {"train_loss": -28.62611198425293, "global_step": 648669, "epoch": 7815} {"train_loss": -28.364110946655273, "global_step": 648670, "epoch": 7815} {"train_loss": -28.41763687133789, "global_step": 648671, "epoch": 7815} {"train_loss": -28.2843017578125, "global_step": 648672, "epoch": 7815} {"train_loss": -28.295377731323242, "global_step": 648673, "epoch": 7815} {"train_loss": -28.713825225830078, "global_step": 648674, "epoch": 7815} {"train_loss": -28.224567413330078, "global_step": 648675, "epoch": 7815} {"train_loss": -28.199731826782227, "global_step": 648676, "epoch": 7815} {"train_loss": -28.368122100830078, "global_step": 648677, "epoch": 7815} {"train_loss": -28.286657333374023, "global_step": 648678, "epoch": 7815} {"train_loss": -28.75056266784668, "global_step": 648679, "epoch": 7815} {"train_loss": -28.162643432617188, "global_step": 648680, "epoch": 7815} {"train_loss": -28.40874671936035, "global_step": 648681, "epoch": 7815} {"train_loss": -28.674182891845703, "global_step": 648682, "epoch": 7815} {"train_loss": -28.355533599853516, "global_step": 648683, "epoch": 7815} {"train_loss": -28.46763038635254, "global_step": 648684, "epoch": 7815} {"train_loss": -28.856237411499023, "global_step": 648685, "epoch": 7815} {"train_loss": -28.56239128112793, "global_step": 648686, "epoch": 7815} {"train_loss": -28.265588760375977, "global_step": 648687, "epoch": 7815} {"train_loss": -28.42473793029785, "global_step": 648688, "epoch": 7815} {"train_loss": -28.376296997070312, "global_step": 648689, "epoch": 7815} {"train_loss": -28.296030044555664, "global_step": 648690, "epoch": 7815} {"train_loss": -28.1451358795166, "global_step": 648691, "epoch": 7815} {"train_loss": -28.714797973632812, "global_step": 648692, "epoch": 7815} {"train_loss": -28.60121726989746, "global_step": 648693, "epoch": 7815} {"train_loss": -28.657291412353516, "global_step": 648694, "epoch": 7815} {"train_loss": -28.592636108398438, "global_step": 648695, "epoch": 7815} {"train_loss": -28.52777671813965, "global_step": 648696, "epoch": 7815} {"train_loss": -28.195404052734375, "global_step": 648697, "epoch": 7815} {"train_loss": -28.1240234375, "global_step": 648698, "epoch": 7815} {"train_loss": -28.07929039001465, "global_step": 648699, "epoch": 7815} {"train_loss": -28.602338790893555, "global_step": 648700, "epoch": 7815} {"train_loss": -27.861913681030273, "global_step": 648701, "epoch": 7815} {"train_loss": -28.343366622924805, "global_step": 648702, "epoch": 7815} {"train_loss": -28.452320098876953, "global_step": 648703, "epoch": 7815} {"train_loss": -28.31161880493164, "global_step": 648704, "epoch": 7815} {"train_loss": -28.269468307495117, "global_step": 648705, "epoch": 7815} {"train_loss": -28.26180076599121, "global_step": 648706, "epoch": 7815} {"train_loss": -28.391096115112305, "global_step": 648707, "epoch": 7815} {"train_loss": -27.943227767944336, "global_step": 648708, "epoch": 7815} {"train_loss": -28.205862045288086, "global_step": 648709, "epoch": 7815} {"train_loss": -28.0986385345459, "global_step": 648710, "epoch": 7815} {"train_loss": -28.251117706298828, "global_step": 648711, "epoch": 7815} {"train_loss": -28.538095474243164, "global_step": 648712, "epoch": 7815} {"train_loss": -27.720178604125977, "global_step": 648713, "epoch": 7815} {"train_loss": -27.93946647644043, "global_step": 648714, "epoch": 7815} {"train_loss": -28.225473403930664, "global_step": 648715, "epoch": 7815} {"train_loss": -28.306631088256836, "global_step": 648716, "epoch": 7815} {"train_loss": -27.723920822143555, "global_step": 648717, "epoch": 7815} {"train_loss": -28.0919189453125, "global_step": 648718, "epoch": 7815} {"train_loss": -28.28521728515625, "global_step": 648719, "epoch": 7815} {"train_loss": -28.237180709838867, "global_step": 648720, "epoch": 7815} {"train_loss": -28.526418685913086, "global_step": 648721, "epoch": 7815} {"train_loss": -28.39215087890625, "global_step": 648722, "epoch": 7815} {"train_loss": -28.680194854736328, "global_step": 648723, "epoch": 7815} {"train_loss": -28.24530029296875, "global_step": 648724, "epoch": 7815} {"train_loss": -28.37323570251465, "global_step": 648725, "epoch": 7815} {"train_loss": -28.488880157470703, "global_step": 648726, "epoch": 7815} {"train_loss": -28.199070850050592, "global_step": 648727, "epoch": 7815, "val_loss": 6694408.0} {"train_loss": -27.697463989257812, "global_step": 648728, "epoch": 7816} {"train_loss": -27.34039306640625, "global_step": 648729, "epoch": 7816} {"train_loss": -28.4698429107666, "global_step": 648730, "epoch": 7816} {"train_loss": -27.708118438720703, "global_step": 648731, "epoch": 7816} {"train_loss": -28.210798263549805, "global_step": 648732, "epoch": 7816} {"train_loss": -28.263519287109375, "global_step": 648733, "epoch": 7816} {"train_loss": -27.67470359802246, "global_step": 648734, "epoch": 7816} {"train_loss": -28.166275024414062, "global_step": 648735, "epoch": 7816} {"train_loss": -28.08795166015625, "global_step": 648736, "epoch": 7816} {"train_loss": -28.663375854492188, "global_step": 648737, "epoch": 7816} {"train_loss": -27.916213989257812, "global_step": 648738, "epoch": 7816} {"train_loss": -28.099470138549805, "global_step": 648739, "epoch": 7816} {"train_loss": -28.416107177734375, "global_step": 648740, "epoch": 7816} {"train_loss": -28.23691177368164, "global_step": 648741, "epoch": 7816} {"train_loss": -28.419340133666992, "global_step": 648742, "epoch": 7816} {"train_loss": -28.03596305847168, "global_step": 648743, "epoch": 7816} {"train_loss": -28.42179298400879, "global_step": 648744, "epoch": 7816} {"train_loss": -28.311094284057617, "global_step": 648745, "epoch": 7816} {"train_loss": -28.389612197875977, "global_step": 648746, "epoch": 7816} {"train_loss": -28.357589721679688, "global_step": 648747, "epoch": 7816} {"train_loss": -28.4150333404541, "global_step": 648748, "epoch": 7816} {"train_loss": -28.0642032623291, "global_step": 648749, "epoch": 7816} {"train_loss": -28.453449249267578, "global_step": 648750, "epoch": 7816} {"train_loss": -27.872007369995117, "global_step": 648751, "epoch": 7816} {"train_loss": -28.06440544128418, "global_step": 648752, "epoch": 7816} {"train_loss": -28.26601219177246, "global_step": 648753, "epoch": 7816} {"train_loss": -28.502552032470703, "global_step": 648754, "epoch": 7816} {"train_loss": -27.996540069580078, "global_step": 648755, "epoch": 7816} {"train_loss": -28.446334838867188, "global_step": 648756, "epoch": 7816} {"train_loss": -28.440149307250977, "global_step": 648757, "epoch": 7816} {"train_loss": -28.102157592773438, "global_step": 648758, "epoch": 7816} {"train_loss": -28.295230865478516, "global_step": 648759, "epoch": 7816} {"train_loss": -28.37006950378418, "global_step": 648760, "epoch": 7816} {"train_loss": -28.35463523864746, "global_step": 648761, "epoch": 7816} {"train_loss": -28.22334098815918, "global_step": 648762, "epoch": 7816} {"train_loss": -28.411893844604492, "global_step": 648763, "epoch": 7816} {"train_loss": -28.828704833984375, "global_step": 648764, "epoch": 7816} {"train_loss": -28.226919174194336, "global_step": 648765, "epoch": 7816} {"train_loss": -28.243993759155273, "global_step": 648766, "epoch": 7816} {"train_loss": -28.47821617126465, "global_step": 648767, "epoch": 7816} {"train_loss": -28.115650177001953, "global_step": 648768, "epoch": 7816} {"train_loss": -28.3563175201416, "global_step": 648769, "epoch": 7816} {"train_loss": -28.15205192565918, "global_step": 648770, "epoch": 7816} {"train_loss": -28.316320419311523, "global_step": 648771, "epoch": 7816} {"train_loss": -28.577733993530273, "global_step": 648772, "epoch": 7816} {"train_loss": -28.653249740600586, "global_step": 648773, "epoch": 7816} {"train_loss": -28.722509384155273, "global_step": 648774, "epoch": 7816} {"train_loss": -27.952316284179688, "global_step": 648775, "epoch": 7816} {"train_loss": -28.482351303100586, "global_step": 648776, "epoch": 7816} {"train_loss": -28.352771759033203, "global_step": 648777, "epoch": 7816} {"train_loss": -28.303491592407227, "global_step": 648778, "epoch": 7816} {"train_loss": -28.508411407470703, "global_step": 648779, "epoch": 7816} {"train_loss": -28.6894474029541, "global_step": 648780, "epoch": 7816} {"train_loss": -28.445037841796875, "global_step": 648781, "epoch": 7816} {"train_loss": -28.20975685119629, "global_step": 648782, "epoch": 7816} {"train_loss": -28.20863151550293, "global_step": 648783, "epoch": 7816} {"train_loss": -28.405750274658203, "global_step": 648784, "epoch": 7816} {"train_loss": -28.621301651000977, "global_step": 648785, "epoch": 7816} {"train_loss": -27.815412521362305, "global_step": 648786, "epoch": 7816} {"train_loss": -28.211973190307617, "global_step": 648787, "epoch": 7816} {"train_loss": -27.943832397460938, "global_step": 648788, "epoch": 7816} {"train_loss": -28.851652145385742, "global_step": 648789, "epoch": 7816} {"train_loss": -28.37006950378418, "global_step": 648790, "epoch": 7816} {"train_loss": -28.330860137939453, "global_step": 648791, "epoch": 7816} {"train_loss": -28.399810791015625, "global_step": 648792, "epoch": 7816} {"train_loss": -28.243000030517578, "global_step": 648793, "epoch": 7816} {"train_loss": -28.326038360595703, "global_step": 648794, "epoch": 7816} {"train_loss": -28.394201278686523, "global_step": 648795, "epoch": 7816} {"train_loss": -28.346776962280273, "global_step": 648796, "epoch": 7816} {"train_loss": -28.4222412109375, "global_step": 648797, "epoch": 7816} {"train_loss": -28.396347045898438, "global_step": 648798, "epoch": 7816} {"train_loss": -28.677261352539062, "global_step": 648799, "epoch": 7816} {"train_loss": -28.507837295532227, "global_step": 648800, "epoch": 7816} {"train_loss": -28.389698028564453, "global_step": 648801, "epoch": 7816} {"train_loss": -28.546293258666992, "global_step": 648802, "epoch": 7816} {"train_loss": -28.051000595092773, "global_step": 648803, "epoch": 7816} {"train_loss": -28.077390670776367, "global_step": 648804, "epoch": 7816} {"train_loss": -28.47919273376465, "global_step": 648805, "epoch": 7816} {"train_loss": -28.5771541595459, "global_step": 648806, "epoch": 7816} {"train_loss": -28.710906982421875, "global_step": 648807, "epoch": 7816} {"train_loss": -28.346725463867188, "global_step": 648808, "epoch": 7816} {"train_loss": -28.45966911315918, "global_step": 648809, "epoch": 7816} {"train_loss": -28.320284510233318, "global_step": 648810, "epoch": 7816, "val_loss": 6707151.0} {"train_loss": -28.336017608642578, "global_step": 648811, "epoch": 7817} {"train_loss": -28.097766876220703, "global_step": 648812, "epoch": 7817} {"train_loss": -27.839405059814453, "global_step": 648813, "epoch": 7817} {"train_loss": -28.200714111328125, "global_step": 648814, "epoch": 7817} {"train_loss": -27.93157386779785, "global_step": 648815, "epoch": 7817} {"train_loss": -27.789548873901367, "global_step": 648816, "epoch": 7817} {"train_loss": -27.978601455688477, "global_step": 648817, "epoch": 7817} {"train_loss": -28.021631240844727, "global_step": 648818, "epoch": 7817} {"train_loss": -27.951892852783203, "global_step": 648819, "epoch": 7817} {"train_loss": -28.053714752197266, "global_step": 648820, "epoch": 7817} {"train_loss": -27.591968536376953, "global_step": 648821, "epoch": 7817} {"train_loss": -28.092504501342773, "global_step": 648822, "epoch": 7817} {"train_loss": -28.201709747314453, "global_step": 648823, "epoch": 7817} {"train_loss": -28.318506240844727, "global_step": 648824, "epoch": 7817} {"train_loss": -28.1554012298584, "global_step": 648825, "epoch": 7817} {"train_loss": -28.159076690673828, "global_step": 648826, "epoch": 7817} {"train_loss": -28.21064567565918, "global_step": 648827, "epoch": 7817} {"train_loss": -28.04500389099121, "global_step": 648828, "epoch": 7817} {"train_loss": -28.292570114135742, "global_step": 648829, "epoch": 7817} {"train_loss": -28.3411865234375, "global_step": 648830, "epoch": 7817} {"train_loss": -28.044248580932617, "global_step": 648831, "epoch": 7817} {"train_loss": -28.36842155456543, "global_step": 648832, "epoch": 7817} {"train_loss": -28.112287521362305, "global_step": 648833, "epoch": 7817} {"train_loss": -28.079675674438477, "global_step": 648834, "epoch": 7817} {"train_loss": -28.355804443359375, "global_step": 648835, "epoch": 7817} {"train_loss": -28.158246994018555, "global_step": 648836, "epoch": 7817} {"train_loss": -28.338489532470703, "global_step": 648837, "epoch": 7817} {"train_loss": -28.342618942260742, "global_step": 648838, "epoch": 7817} {"train_loss": -28.64594841003418, "global_step": 648839, "epoch": 7817} {"train_loss": -28.60389518737793, "global_step": 648840, "epoch": 7817} {"train_loss": -28.58978271484375, "global_step": 648841, "epoch": 7817} {"train_loss": -28.466053009033203, "global_step": 648842, "epoch": 7817} {"train_loss": -28.50139808654785, "global_step": 648843, "epoch": 7817} {"train_loss": -28.608829498291016, "global_step": 648844, "epoch": 7817} {"train_loss": -28.71807861328125, "global_step": 648845, "epoch": 7817} {"train_loss": -28.013757705688477, "global_step": 648846, "epoch": 7817} {"train_loss": -28.3565616607666, "global_step": 648847, "epoch": 7817} {"train_loss": -28.59083366394043, "global_step": 648848, "epoch": 7817} {"train_loss": -28.549253463745117, "global_step": 648849, "epoch": 7817} {"train_loss": -27.843841552734375, "global_step": 648850, "epoch": 7817} {"train_loss": -28.4810733795166, "global_step": 648851, "epoch": 7817} {"train_loss": -28.370223999023438, "global_step": 648852, "epoch": 7817} {"train_loss": -28.029132843017578, "global_step": 648853, "epoch": 7817} {"train_loss": -28.319997787475586, "global_step": 648854, "epoch": 7817} {"train_loss": -28.315937042236328, "global_step": 648855, "epoch": 7817} {"train_loss": -28.476776123046875, "global_step": 648856, "epoch": 7817} {"train_loss": -28.609683990478516, "global_step": 648857, "epoch": 7817} {"train_loss": -27.992511749267578, "global_step": 648858, "epoch": 7817} {"train_loss": -28.496829986572266, "global_step": 648859, "epoch": 7817} {"train_loss": -28.387054443359375, "global_step": 648860, "epoch": 7817} {"train_loss": -28.243976593017578, "global_step": 648861, "epoch": 7817} {"train_loss": -28.11958122253418, "global_step": 648862, "epoch": 7817} {"train_loss": -28.489669799804688, "global_step": 648863, "epoch": 7817} {"train_loss": -28.6157283782959, "global_step": 648864, "epoch": 7817} {"train_loss": -28.362226486206055, "global_step": 648865, "epoch": 7817} {"train_loss": -28.510217666625977, "global_step": 648866, "epoch": 7817} {"train_loss": -28.3486328125, "global_step": 648867, "epoch": 7817} {"train_loss": -28.144378662109375, "global_step": 648868, "epoch": 7817} {"train_loss": -28.267297744750977, "global_step": 648869, "epoch": 7817} {"train_loss": -28.261199951171875, "global_step": 648870, "epoch": 7817} {"train_loss": -28.177845001220703, "global_step": 648871, "epoch": 7817} {"train_loss": -28.151947021484375, "global_step": 648872, "epoch": 7817} {"train_loss": -28.388471603393555, "global_step": 648873, "epoch": 7817} {"train_loss": -28.509672164916992, "global_step": 648874, "epoch": 7817} {"train_loss": -28.425878524780273, "global_step": 648875, "epoch": 7817} {"train_loss": -28.53480339050293, "global_step": 648876, "epoch": 7817} {"train_loss": -28.188161849975586, "global_step": 648877, "epoch": 7817} {"train_loss": -28.21803092956543, "global_step": 648878, "epoch": 7817} {"train_loss": -28.380361557006836, "global_step": 648879, "epoch": 7817} {"train_loss": -27.996198654174805, "global_step": 648880, "epoch": 7817} {"train_loss": -27.847797393798828, "global_step": 648881, "epoch": 7817} {"train_loss": -28.264286041259766, "global_step": 648882, "epoch": 7817} {"train_loss": -28.001245498657227, "global_step": 648883, "epoch": 7817} {"train_loss": -28.400196075439453, "global_step": 648884, "epoch": 7817} {"train_loss": -28.41745376586914, "global_step": 648885, "epoch": 7817} {"train_loss": -28.327367782592773, "global_step": 648886, "epoch": 7817} {"train_loss": -28.396764755249023, "global_step": 648887, "epoch": 7817} {"train_loss": -28.398731231689453, "global_step": 648888, "epoch": 7817} {"train_loss": -28.402362823486328, "global_step": 648889, "epoch": 7817} {"train_loss": -28.34600830078125, "global_step": 648890, "epoch": 7817} {"train_loss": -28.359281539916992, "global_step": 648891, "epoch": 7817} {"train_loss": -28.032958984375, "global_step": 648892, "epoch": 7817} {"train_loss": -28.264773472245917, "global_step": 648893, "epoch": 7817, "val_loss": 6736988.0} {"train_loss": -27.881072998046875, "global_step": 648894, "epoch": 7818} {"train_loss": -27.2043399810791, "global_step": 648895, "epoch": 7818} {"train_loss": -27.8389949798584, "global_step": 648896, "epoch": 7818} {"train_loss": -27.57598304748535, "global_step": 648897, "epoch": 7818} {"train_loss": -27.634485244750977, "global_step": 648898, "epoch": 7818} {"train_loss": -27.83330726623535, "global_step": 648899, "epoch": 7818} {"train_loss": -27.70918083190918, "global_step": 648900, "epoch": 7818} {"train_loss": -27.756610870361328, "global_step": 648901, "epoch": 7818} {"train_loss": -27.738510131835938, "global_step": 648902, "epoch": 7818} {"train_loss": -27.620563507080078, "global_step": 648903, "epoch": 7818} {"train_loss": -28.23700523376465, "global_step": 648904, "epoch": 7818} {"train_loss": -28.07208824157715, "global_step": 648905, "epoch": 7818} {"train_loss": -27.915363311767578, "global_step": 648906, "epoch": 7818} {"train_loss": -28.139135360717773, "global_step": 648907, "epoch": 7818} {"train_loss": -28.21626091003418, "global_step": 648908, "epoch": 7818} {"train_loss": -28.114145278930664, "global_step": 648909, "epoch": 7818} {"train_loss": -27.89092445373535, "global_step": 648910, "epoch": 7818} {"train_loss": -27.997745513916016, "global_step": 648911, "epoch": 7818} {"train_loss": -28.108346939086914, "global_step": 648912, "epoch": 7818} {"train_loss": -28.182315826416016, "global_step": 648913, "epoch": 7818} {"train_loss": -28.109106063842773, "global_step": 648914, "epoch": 7818} {"train_loss": -27.8150577545166, "global_step": 648915, "epoch": 7818} {"train_loss": -28.19415283203125, "global_step": 648916, "epoch": 7818} {"train_loss": -27.959192276000977, "global_step": 648917, "epoch": 7818} {"train_loss": -28.322589874267578, "global_step": 648918, "epoch": 7818} {"train_loss": -27.993854522705078, "global_step": 648919, "epoch": 7818} {"train_loss": -28.1951847076416, "global_step": 648920, "epoch": 7818} {"train_loss": -28.24845314025879, "global_step": 648921, "epoch": 7818} {"train_loss": -27.77259635925293, "global_step": 648922, "epoch": 7818} {"train_loss": -27.88026237487793, "global_step": 648923, "epoch": 7818} {"train_loss": -28.50371742248535, "global_step": 648924, "epoch": 7818} {"train_loss": -28.445545196533203, "global_step": 648925, "epoch": 7818} {"train_loss": -28.076141357421875, "global_step": 648926, "epoch": 7818} {"train_loss": -28.30109977722168, "global_step": 648927, "epoch": 7818} {"train_loss": -28.476789474487305, "global_step": 648928, "epoch": 7818} {"train_loss": -28.281763076782227, "global_step": 648929, "epoch": 7818} {"train_loss": -28.48666763305664, "global_step": 648930, "epoch": 7818} {"train_loss": -28.413192749023438, "global_step": 648931, "epoch": 7818} {"train_loss": -28.677968978881836, "global_step": 648932, "epoch": 7818} {"train_loss": -28.498510360717773, "global_step": 648933, "epoch": 7818} {"train_loss": -28.495147705078125, "global_step": 648934, "epoch": 7818} {"train_loss": -28.566162109375, "global_step": 648935, "epoch": 7818} {"train_loss": -28.423551559448242, "global_step": 648936, "epoch": 7818} {"train_loss": -28.468393325805664, "global_step": 648937, "epoch": 7818} {"train_loss": -28.561559677124023, "global_step": 648938, "epoch": 7818} {"train_loss": -28.186059951782227, "global_step": 648939, "epoch": 7818} {"train_loss": -28.532316207885742, "global_step": 648940, "epoch": 7818} {"train_loss": -28.497968673706055, "global_step": 648941, "epoch": 7818} {"train_loss": -28.41070556640625, "global_step": 648942, "epoch": 7818} {"train_loss": -28.774707794189453, "global_step": 648943, "epoch": 7818} {"train_loss": -28.112958908081055, "global_step": 648944, "epoch": 7818} {"train_loss": -28.530393600463867, "global_step": 648945, "epoch": 7818} {"train_loss": -28.43674087524414, "global_step": 648946, "epoch": 7818} {"train_loss": -28.540990829467773, "global_step": 648947, "epoch": 7818} {"train_loss": -28.67054557800293, "global_step": 648948, "epoch": 7818} {"train_loss": -28.5533390045166, "global_step": 648949, "epoch": 7818} {"train_loss": -28.443750381469727, "global_step": 648950, "epoch": 7818} {"train_loss": -28.43171501159668, "global_step": 648951, "epoch": 7818} {"train_loss": -28.73883056640625, "global_step": 648952, "epoch": 7818} {"train_loss": -28.5498046875, "global_step": 648953, "epoch": 7818} {"train_loss": -28.691314697265625, "global_step": 648954, "epoch": 7818} {"train_loss": -28.481494903564453, "global_step": 648955, "epoch": 7818} {"train_loss": -28.265289306640625, "global_step": 648956, "epoch": 7818} {"train_loss": -28.61225700378418, "global_step": 648957, "epoch": 7818} {"train_loss": -28.374357223510742, "global_step": 648958, "epoch": 7818} {"train_loss": -28.45308494567871, "global_step": 648959, "epoch": 7818} {"train_loss": -27.49578857421875, "global_step": 648960, "epoch": 7818} {"train_loss": -27.593473434448242, "global_step": 648961, "epoch": 7818} {"train_loss": -27.37030601501465, "global_step": 648962, "epoch": 7818} {"train_loss": -27.828832626342773, "global_step": 648963, "epoch": 7818} {"train_loss": -28.34882164001465, "global_step": 648964, "epoch": 7818} {"train_loss": -27.911712646484375, "global_step": 648965, "epoch": 7818} {"train_loss": -28.36344337463379, "global_step": 648966, "epoch": 7818} {"train_loss": -28.203815460205078, "global_step": 648967, "epoch": 7818} {"train_loss": -27.961774826049805, "global_step": 648968, "epoch": 7818} {"train_loss": -27.65939712524414, "global_step": 648969, "epoch": 7818} {"train_loss": -27.968170166015625, "global_step": 648970, "epoch": 7818} {"train_loss": -28.47638511657715, "global_step": 648971, "epoch": 7818} {"train_loss": -28.472524642944336, "global_step": 648972, "epoch": 7818} {"train_loss": -28.053211212158203, "global_step": 648973, "epoch": 7818} {"train_loss": -28.387842178344727, "global_step": 648974, "epoch": 7818} {"train_loss": -28.330236434936523, "global_step": 648975, "epoch": 7818} {"train_loss": -28.198613706841527, "global_step": 648976, "epoch": 7818, "val_loss": 6749211.0} {"train_loss": -27.625747680664062, "global_step": 648977, "epoch": 7819} {"train_loss": -27.446691513061523, "global_step": 648978, "epoch": 7819} {"train_loss": -27.152387619018555, "global_step": 648979, "epoch": 7819} {"train_loss": -28.06939697265625, "global_step": 648980, "epoch": 7819} {"train_loss": -27.704971313476562, "global_step": 648981, "epoch": 7819} {"train_loss": -28.140851974487305, "global_step": 648982, "epoch": 7819} {"train_loss": -27.588613510131836, "global_step": 648983, "epoch": 7819} {"train_loss": -28.221378326416016, "global_step": 648984, "epoch": 7819} {"train_loss": -28.101423263549805, "global_step": 648985, "epoch": 7819} {"train_loss": -27.926462173461914, "global_step": 648986, "epoch": 7819} {"train_loss": -27.91717529296875, "global_step": 648987, "epoch": 7819} {"train_loss": -28.10297203063965, "global_step": 648988, "epoch": 7819} {"train_loss": -27.901660919189453, "global_step": 648989, "epoch": 7819} {"train_loss": -28.15778160095215, "global_step": 648990, "epoch": 7819} {"train_loss": -27.930755615234375, "global_step": 648991, "epoch": 7819} {"train_loss": -28.134130477905273, "global_step": 648992, "epoch": 7819} {"train_loss": -28.52764320373535, "global_step": 648993, "epoch": 7819} {"train_loss": -28.18292236328125, "global_step": 648994, "epoch": 7819} {"train_loss": -27.9638614654541, "global_step": 648995, "epoch": 7819} {"train_loss": -28.120437622070312, "global_step": 648996, "epoch": 7819} {"train_loss": -27.931100845336914, "global_step": 648997, "epoch": 7819} {"train_loss": -28.426488876342773, "global_step": 648998, "epoch": 7819} {"train_loss": -27.84894371032715, "global_step": 648999, "epoch": 7819} {"train_loss": -28.2845516204834, "global_step": 649000, "epoch": 7819} {"train_loss": -28.23333168029785, "global_step": 649001, "epoch": 7819} {"train_loss": -28.478443145751953, "global_step": 649002, "epoch": 7819} {"train_loss": -28.310840606689453, "global_step": 649003, "epoch": 7819} {"train_loss": -28.115198135375977, "global_step": 649004, "epoch": 7819} {"train_loss": -28.020111083984375, "global_step": 649005, "epoch": 7819} {"train_loss": -28.3048038482666, "global_step": 649006, "epoch": 7819} {"train_loss": -28.859220504760742, "global_step": 649007, "epoch": 7819} {"train_loss": -28.230371475219727, "global_step": 649008, "epoch": 7819} {"train_loss": -28.160497665405273, "global_step": 649009, "epoch": 7819} {"train_loss": -28.189746856689453, "global_step": 649010, "epoch": 7819} {"train_loss": -28.72818946838379, "global_step": 649011, "epoch": 7819} {"train_loss": -28.03363609313965, "global_step": 649012, "epoch": 7819} {"train_loss": -28.36810874938965, "global_step": 649013, "epoch": 7819} {"train_loss": -28.25238037109375, "global_step": 649014, "epoch": 7819} {"train_loss": -28.56329917907715, "global_step": 649015, "epoch": 7819} {"train_loss": -27.789350509643555, "global_step": 649016, "epoch": 7819} {"train_loss": -27.942121505737305, "global_step": 649017, "epoch": 7819} {"train_loss": -28.291227340698242, "global_step": 649018, "epoch": 7819} {"train_loss": -28.42206382751465, "global_step": 649019, "epoch": 7819} {"train_loss": -28.36916160583496, "global_step": 649020, "epoch": 7819} {"train_loss": -28.018850326538086, "global_step": 649021, "epoch": 7819} {"train_loss": -28.497928619384766, "global_step": 649022, "epoch": 7819} {"train_loss": -28.261388778686523, "global_step": 649023, "epoch": 7819} {"train_loss": -27.976892471313477, "global_step": 649024, "epoch": 7819} {"train_loss": -27.965734481811523, "global_step": 649025, "epoch": 7819} {"train_loss": -27.920623779296875, "global_step": 649026, "epoch": 7819} {"train_loss": -28.02837562561035, "global_step": 649027, "epoch": 7819} {"train_loss": -27.873340606689453, "global_step": 649028, "epoch": 7819} {"train_loss": -27.6342830657959, "global_step": 649029, "epoch": 7819} {"train_loss": -27.80988121032715, "global_step": 649030, "epoch": 7819} {"train_loss": -27.79646110534668, "global_step": 649031, "epoch": 7819} {"train_loss": -27.757110595703125, "global_step": 649032, "epoch": 7819} {"train_loss": -28.1243953704834, "global_step": 649033, "epoch": 7819} {"train_loss": -27.71376609802246, "global_step": 649034, "epoch": 7819} {"train_loss": -28.3272762298584, "global_step": 649035, "epoch": 7819} {"train_loss": -27.74395179748535, "global_step": 649036, "epoch": 7819} {"train_loss": -28.581836700439453, "global_step": 649037, "epoch": 7819} {"train_loss": -28.148229598999023, "global_step": 649038, "epoch": 7819} {"train_loss": -28.4621524810791, "global_step": 649039, "epoch": 7819} {"train_loss": -28.24847984313965, "global_step": 649040, "epoch": 7819} {"train_loss": -27.664962768554688, "global_step": 649041, "epoch": 7819} {"train_loss": -28.449604034423828, "global_step": 649042, "epoch": 7819} {"train_loss": -28.06412124633789, "global_step": 649043, "epoch": 7819} {"train_loss": -28.409595489501953, "global_step": 649044, "epoch": 7819} {"train_loss": -28.223127365112305, "global_step": 649045, "epoch": 7819} {"train_loss": -28.38994789123535, "global_step": 649046, "epoch": 7819} {"train_loss": -28.371442794799805, "global_step": 649047, "epoch": 7819} {"train_loss": -28.2082462310791, "global_step": 649048, "epoch": 7819} {"train_loss": -28.321744918823242, "global_step": 649049, "epoch": 7819} {"train_loss": -28.45065689086914, "global_step": 649050, "epoch": 7819} {"train_loss": -28.213104248046875, "global_step": 649051, "epoch": 7819} {"train_loss": -28.5260009765625, "global_step": 649052, "epoch": 7819} {"train_loss": -28.19752311706543, "global_step": 649053, "epoch": 7819} {"train_loss": -28.30609130859375, "global_step": 649054, "epoch": 7819} {"train_loss": -27.961393356323242, "global_step": 649055, "epoch": 7819} {"train_loss": -28.04145622253418, "global_step": 649056, "epoch": 7819} {"train_loss": -28.499347686767578, "global_step": 649057, "epoch": 7819} {"train_loss": -28.17120933532715, "global_step": 649058, "epoch": 7819} {"train_loss": -28.112729336841998, "global_step": 649059, "epoch": 7819, "val_loss": 6561838.0} {"train_loss": -25.152029037475586, "global_step": 649060, "epoch": 7820} {"train_loss": -23.777219772338867, "global_step": 649061, "epoch": 7820} {"train_loss": -26.42239761352539, "global_step": 649062, "epoch": 7820} {"train_loss": -25.966114044189453, "global_step": 649063, "epoch": 7820} {"train_loss": -26.69585609436035, "global_step": 649064, "epoch": 7820} {"train_loss": -26.821516036987305, "global_step": 649065, "epoch": 7820} {"train_loss": -27.01226234436035, "global_step": 649066, "epoch": 7820} {"train_loss": -26.991819381713867, "global_step": 649067, "epoch": 7820} {"train_loss": -26.77569580078125, "global_step": 649068, "epoch": 7820} {"train_loss": -27.029027938842773, "global_step": 649069, "epoch": 7820} {"train_loss": -27.2913818359375, "global_step": 649070, "epoch": 7820} {"train_loss": -27.08698844909668, "global_step": 649071, "epoch": 7820} {"train_loss": -27.794071197509766, "global_step": 649072, "epoch": 7820} {"train_loss": -27.463943481445312, "global_step": 649073, "epoch": 7820} {"train_loss": -27.380512237548828, "global_step": 649074, "epoch": 7820} {"train_loss": -27.312475204467773, "global_step": 649075, "epoch": 7820} {"train_loss": -27.181476593017578, "global_step": 649076, "epoch": 7820} {"train_loss": -27.6549072265625, "global_step": 649077, "epoch": 7820} {"train_loss": -27.33893394470215, "global_step": 649078, "epoch": 7820} {"train_loss": -27.391263961791992, "global_step": 649079, "epoch": 7820} {"train_loss": -28.010395050048828, "global_step": 649080, "epoch": 7820} {"train_loss": -27.67058753967285, "global_step": 649081, "epoch": 7820} {"train_loss": -27.286163330078125, "global_step": 649082, "epoch": 7820} {"train_loss": -27.662643432617188, "global_step": 649083, "epoch": 7820} {"train_loss": -27.589399337768555, "global_step": 649084, "epoch": 7820} {"train_loss": -27.479902267456055, "global_step": 649085, "epoch": 7820} {"train_loss": -27.738494873046875, "global_step": 649086, "epoch": 7820} {"train_loss": -27.926929473876953, "global_step": 649087, "epoch": 7820} {"train_loss": -27.9100341796875, "global_step": 649088, "epoch": 7820} {"train_loss": -27.912023544311523, "global_step": 649089, "epoch": 7820} {"train_loss": -28.004880905151367, "global_step": 649090, "epoch": 7820} {"train_loss": -28.135242462158203, "global_step": 649091, "epoch": 7820} {"train_loss": -28.074560165405273, "global_step": 649092, "epoch": 7820} {"train_loss": -27.814416885375977, "global_step": 649093, "epoch": 7820} {"train_loss": -28.026559829711914, "global_step": 649094, "epoch": 7820} {"train_loss": -28.172718048095703, "global_step": 649095, "epoch": 7820} {"train_loss": -27.962453842163086, "global_step": 649096, "epoch": 7820} {"train_loss": -27.936864852905273, "global_step": 649097, "epoch": 7820} {"train_loss": -28.450286865234375, "global_step": 649098, "epoch": 7820} {"train_loss": -28.25239372253418, "global_step": 649099, "epoch": 7820} {"train_loss": -27.80148696899414, "global_step": 649100, "epoch": 7820} {"train_loss": -27.6810359954834, "global_step": 649101, "epoch": 7820} {"train_loss": -27.8853759765625, "global_step": 649102, "epoch": 7820} {"train_loss": -28.216144561767578, "global_step": 649103, "epoch": 7820} {"train_loss": -28.034393310546875, "global_step": 649104, "epoch": 7820} {"train_loss": -27.669635772705078, "global_step": 649105, "epoch": 7820} {"train_loss": -28.141122817993164, "global_step": 649106, "epoch": 7820} {"train_loss": -28.274124145507812, "global_step": 649107, "epoch": 7820} {"train_loss": -28.01309585571289, "global_step": 649108, "epoch": 7820} {"train_loss": -28.64019775390625, "global_step": 649109, "epoch": 7820} {"train_loss": -28.25237464904785, "global_step": 649110, "epoch": 7820} {"train_loss": -28.471771240234375, "global_step": 649111, "epoch": 7820} {"train_loss": -28.587255477905273, "global_step": 649112, "epoch": 7820} {"train_loss": -28.247190475463867, "global_step": 649113, "epoch": 7820} {"train_loss": -28.31226921081543, "global_step": 649114, "epoch": 7820} {"train_loss": -28.429494857788086, "global_step": 649115, "epoch": 7820} {"train_loss": -27.995267868041992, "global_step": 649116, "epoch": 7820} {"train_loss": -28.58816909790039, "global_step": 649117, "epoch": 7820} {"train_loss": -28.509496688842773, "global_step": 649118, "epoch": 7820} {"train_loss": -28.4113712310791, "global_step": 649119, "epoch": 7820} {"train_loss": -28.458988189697266, "global_step": 649120, "epoch": 7820} {"train_loss": -28.305593490600586, "global_step": 649121, "epoch": 7820} {"train_loss": -28.737579345703125, "global_step": 649122, "epoch": 7820} {"train_loss": -28.01702880859375, "global_step": 649123, "epoch": 7820} {"train_loss": -28.58405113220215, "global_step": 649124, "epoch": 7820} {"train_loss": -28.37689208984375, "global_step": 649125, "epoch": 7820} {"train_loss": -28.306257247924805, "global_step": 649126, "epoch": 7820} {"train_loss": -28.29176902770996, "global_step": 649127, "epoch": 7820} {"train_loss": -28.405517578125, "global_step": 649128, "epoch": 7820} {"train_loss": -28.498334884643555, "global_step": 649129, "epoch": 7820} {"train_loss": -28.38863182067871, "global_step": 649130, "epoch": 7820} {"train_loss": -28.673444747924805, "global_step": 649131, "epoch": 7820} {"train_loss": -28.60601234436035, "global_step": 649132, "epoch": 7820} {"train_loss": -28.589059829711914, "global_step": 649133, "epoch": 7820} {"train_loss": -28.415746688842773, "global_step": 649134, "epoch": 7820} {"train_loss": -28.602888107299805, "global_step": 649135, "epoch": 7820} {"train_loss": -28.6026554107666, "global_step": 649136, "epoch": 7820} {"train_loss": -28.712926864624023, "global_step": 649137, "epoch": 7820} {"train_loss": -28.601428985595703, "global_step": 649138, "epoch": 7820} {"train_loss": -28.576955795288086, "global_step": 649139, "epoch": 7820} {"train_loss": -28.36004638671875, "global_step": 649140, "epoch": 7820} {"train_loss": -28.576648712158203, "global_step": 649141, "epoch": 7820} {"train_loss": -27.859650117805206, "global_step": 649142, "epoch": 7820, "val_loss": 6848628.0} {"train_loss": -26.054676055908203, "global_step": 649143, "epoch": 7821} {"train_loss": -24.26682472229004, "global_step": 649144, "epoch": 7821} {"train_loss": -25.740467071533203, "global_step": 649145, "epoch": 7821} {"train_loss": -27.891305923461914, "global_step": 649146, "epoch": 7821} {"train_loss": -26.761310577392578, "global_step": 649147, "epoch": 7821} {"train_loss": -26.716205596923828, "global_step": 649148, "epoch": 7821} {"train_loss": -28.011768341064453, "global_step": 649149, "epoch": 7821} {"train_loss": -26.88970375061035, "global_step": 649150, "epoch": 7821} {"train_loss": -26.974470138549805, "global_step": 649151, "epoch": 7821} {"train_loss": -26.990392684936523, "global_step": 649152, "epoch": 7821} {"train_loss": -27.960468292236328, "global_step": 649153, "epoch": 7821} {"train_loss": -27.684823989868164, "global_step": 649154, "epoch": 7821} {"train_loss": -27.314701080322266, "global_step": 649155, "epoch": 7821} {"train_loss": -27.932937622070312, "global_step": 649156, "epoch": 7821} {"train_loss": -27.762622833251953, "global_step": 649157, "epoch": 7821} {"train_loss": -27.191492080688477, "global_step": 649158, "epoch": 7821} {"train_loss": -28.21051597595215, "global_step": 649159, "epoch": 7821} {"train_loss": -27.714954376220703, "global_step": 649160, "epoch": 7821} {"train_loss": -27.69329833984375, "global_step": 649161, "epoch": 7821} {"train_loss": -27.697418212890625, "global_step": 649162, "epoch": 7821} {"train_loss": -27.6044864654541, "global_step": 649163, "epoch": 7821} {"train_loss": -27.736621856689453, "global_step": 649164, "epoch": 7821} {"train_loss": -28.034168243408203, "global_step": 649165, "epoch": 7821} {"train_loss": -28.16898536682129, "global_step": 649166, "epoch": 7821} {"train_loss": -28.46905517578125, "global_step": 649167, "epoch": 7821} {"train_loss": -27.7938232421875, "global_step": 649168, "epoch": 7821} {"train_loss": -28.022180557250977, "global_step": 649169, "epoch": 7821} {"train_loss": -27.92487144470215, "global_step": 649170, "epoch": 7821} {"train_loss": -28.203277587890625, "global_step": 649171, "epoch": 7821} {"train_loss": -28.075672149658203, "global_step": 649172, "epoch": 7821} {"train_loss": -28.037275314331055, "global_step": 649173, "epoch": 7821} {"train_loss": -28.08351707458496, "global_step": 649174, "epoch": 7821} {"train_loss": -28.32904052734375, "global_step": 649175, "epoch": 7821} {"train_loss": -27.95408058166504, "global_step": 649176, "epoch": 7821} {"train_loss": -28.089344024658203, "global_step": 649177, "epoch": 7821} {"train_loss": -28.11836051940918, "global_step": 649178, "epoch": 7821} {"train_loss": -28.448225021362305, "global_step": 649179, "epoch": 7821} {"train_loss": -27.874958038330078, "global_step": 649180, "epoch": 7821} {"train_loss": -28.277149200439453, "global_step": 649181, "epoch": 7821} {"train_loss": -28.24954605102539, "global_step": 649182, "epoch": 7821} {"train_loss": -28.5674991607666, "global_step": 649183, "epoch": 7821} {"train_loss": -28.099756240844727, "global_step": 649184, "epoch": 7821} {"train_loss": -28.283071517944336, "global_step": 649185, "epoch": 7821} {"train_loss": -28.231897354125977, "global_step": 649186, "epoch": 7821} {"train_loss": -28.66046714782715, "global_step": 649187, "epoch": 7821} {"train_loss": -28.543787002563477, "global_step": 649188, "epoch": 7821} {"train_loss": -28.281402587890625, "global_step": 649189, "epoch": 7821} {"train_loss": -28.307708740234375, "global_step": 649190, "epoch": 7821} {"train_loss": -28.457059860229492, "global_step": 649191, "epoch": 7821} {"train_loss": -28.461965560913086, "global_step": 649192, "epoch": 7821} {"train_loss": -28.672321319580078, "global_step": 649193, "epoch": 7821} {"train_loss": -28.340158462524414, "global_step": 649194, "epoch": 7821} {"train_loss": -28.273788452148438, "global_step": 649195, "epoch": 7821} {"train_loss": -28.329315185546875, "global_step": 649196, "epoch": 7821} {"train_loss": -28.47727394104004, "global_step": 649197, "epoch": 7821} {"train_loss": -28.691633224487305, "global_step": 649198, "epoch": 7821} {"train_loss": -28.63494873046875, "global_step": 649199, "epoch": 7821} {"train_loss": -28.89651870727539, "global_step": 649200, "epoch": 7821} {"train_loss": -28.48797035217285, "global_step": 649201, "epoch": 7821} {"train_loss": -28.6257381439209, "global_step": 649202, "epoch": 7821} {"train_loss": -28.191186904907227, "global_step": 649203, "epoch": 7821} {"train_loss": -28.907825469970703, "global_step": 649204, "epoch": 7821} {"train_loss": -28.529829025268555, "global_step": 649205, "epoch": 7821} {"train_loss": -28.51471519470215, "global_step": 649206, "epoch": 7821} {"train_loss": -28.57550621032715, "global_step": 649207, "epoch": 7821} {"train_loss": -28.450834274291992, "global_step": 649208, "epoch": 7821} {"train_loss": -28.378437042236328, "global_step": 649209, "epoch": 7821} {"train_loss": -28.907800674438477, "global_step": 649210, "epoch": 7821} {"train_loss": -28.475341796875, "global_step": 649211, "epoch": 7821} {"train_loss": -28.54961585998535, "global_step": 649212, "epoch": 7821} {"train_loss": -28.5862979888916, "global_step": 649213, "epoch": 7821} {"train_loss": -28.217050552368164, "global_step": 649214, "epoch": 7821} {"train_loss": -28.23956298828125, "global_step": 649215, "epoch": 7821} {"train_loss": -28.413009643554688, "global_step": 649216, "epoch": 7821} {"train_loss": -28.457962036132812, "global_step": 649217, "epoch": 7821} {"train_loss": -28.251422882080078, "global_step": 649218, "epoch": 7821} {"train_loss": -28.2136287689209, "global_step": 649219, "epoch": 7821} {"train_loss": -27.287240982055664, "global_step": 649220, "epoch": 7821} {"train_loss": -26.6658878326416, "global_step": 649221, "epoch": 7821} {"train_loss": -25.412322998046875, "global_step": 649222, "epoch": 7821} {"train_loss": -25.885229110717773, "global_step": 649223, "epoch": 7821} {"train_loss": -28.145334243774414, "global_step": 649224, "epoch": 7821} {"train_loss": -27.924122729933405, "global_step": 649225, "epoch": 7821, "val_loss": 6912578.0} {"train_loss": -26.2099609375, "global_step": 649226, "epoch": 7822} {"train_loss": -25.459619522094727, "global_step": 649227, "epoch": 7822} {"train_loss": -27.326231002807617, "global_step": 649228, "epoch": 7822} {"train_loss": -25.370874404907227, "global_step": 649229, "epoch": 7822} {"train_loss": -26.512571334838867, "global_step": 649230, "epoch": 7822} {"train_loss": -26.696435928344727, "global_step": 649231, "epoch": 7822} {"train_loss": -26.20450782775879, "global_step": 649232, "epoch": 7822} {"train_loss": -26.95265007019043, "global_step": 649233, "epoch": 7822} {"train_loss": -27.374521255493164, "global_step": 649234, "epoch": 7822} {"train_loss": -26.933679580688477, "global_step": 649235, "epoch": 7822} {"train_loss": -26.41802978515625, "global_step": 649236, "epoch": 7822} {"train_loss": -27.147846221923828, "global_step": 649237, "epoch": 7822} {"train_loss": -27.42823600769043, "global_step": 649238, "epoch": 7822} {"train_loss": -27.171436309814453, "global_step": 649239, "epoch": 7822} {"train_loss": -27.251148223876953, "global_step": 649240, "epoch": 7822} {"train_loss": -27.7268009185791, "global_step": 649241, "epoch": 7822} {"train_loss": -27.128076553344727, "global_step": 649242, "epoch": 7822} {"train_loss": -27.475576400756836, "global_step": 649243, "epoch": 7822} {"train_loss": -27.407819747924805, "global_step": 649244, "epoch": 7822} {"train_loss": -27.614721298217773, "global_step": 649245, "epoch": 7822} {"train_loss": -27.522287368774414, "global_step": 649246, "epoch": 7822} {"train_loss": -27.608688354492188, "global_step": 649247, "epoch": 7822} {"train_loss": -27.49112319946289, "global_step": 649248, "epoch": 7822} {"train_loss": -27.540552139282227, "global_step": 649249, "epoch": 7822} {"train_loss": -27.509429931640625, "global_step": 649250, "epoch": 7822} {"train_loss": -27.9617919921875, "global_step": 649251, "epoch": 7822} {"train_loss": -27.526187896728516, "global_step": 649252, "epoch": 7822} {"train_loss": -28.083032608032227, "global_step": 649253, "epoch": 7822} {"train_loss": -27.836118698120117, "global_step": 649254, "epoch": 7822} {"train_loss": -27.4956111907959, "global_step": 649255, "epoch": 7822} {"train_loss": -27.57956314086914, "global_step": 649256, "epoch": 7822} {"train_loss": -27.876012802124023, "global_step": 649257, "epoch": 7822} {"train_loss": -27.782363891601562, "global_step": 649258, "epoch": 7822} {"train_loss": -27.69675636291504, "global_step": 649259, "epoch": 7822} {"train_loss": -27.715017318725586, "global_step": 649260, "epoch": 7822} {"train_loss": -28.36264419555664, "global_step": 649261, "epoch": 7822} {"train_loss": -28.31492042541504, "global_step": 649262, "epoch": 7822} {"train_loss": -27.5340633392334, "global_step": 649263, "epoch": 7822} {"train_loss": -27.905603408813477, "global_step": 649264, "epoch": 7822} {"train_loss": -27.953601837158203, "global_step": 649265, "epoch": 7822} {"train_loss": -27.99953269958496, "global_step": 649266, "epoch": 7822} {"train_loss": -27.884550094604492, "global_step": 649267, "epoch": 7822} {"train_loss": -28.18317222595215, "global_step": 649268, "epoch": 7822} {"train_loss": -27.865304946899414, "global_step": 649269, "epoch": 7822} {"train_loss": -27.959646224975586, "global_step": 649270, "epoch": 7822} {"train_loss": -27.99346923828125, "global_step": 649271, "epoch": 7822} {"train_loss": -27.90760612487793, "global_step": 649272, "epoch": 7822} {"train_loss": -28.391775131225586, "global_step": 649273, "epoch": 7822} {"train_loss": -28.001300811767578, "global_step": 649274, "epoch": 7822} {"train_loss": -28.267133712768555, "global_step": 649275, "epoch": 7822} {"train_loss": -28.31601333618164, "global_step": 649276, "epoch": 7822} {"train_loss": -28.2091007232666, "global_step": 649277, "epoch": 7822} {"train_loss": -27.97254753112793, "global_step": 649278, "epoch": 7822} {"train_loss": -28.478757858276367, "global_step": 649279, "epoch": 7822} {"train_loss": -28.41118812561035, "global_step": 649280, "epoch": 7822} {"train_loss": -28.128040313720703, "global_step": 649281, "epoch": 7822} {"train_loss": -28.31666374206543, "global_step": 649282, "epoch": 7822} {"train_loss": -28.457731246948242, "global_step": 649283, "epoch": 7822} {"train_loss": -28.301071166992188, "global_step": 649284, "epoch": 7822} {"train_loss": -28.546411514282227, "global_step": 649285, "epoch": 7822} {"train_loss": -28.47760009765625, "global_step": 649286, "epoch": 7822} {"train_loss": -28.32826805114746, "global_step": 649287, "epoch": 7822} {"train_loss": -28.1887264251709, "global_step": 649288, "epoch": 7822} {"train_loss": -28.303241729736328, "global_step": 649289, "epoch": 7822} {"train_loss": -28.30414390563965, "global_step": 649290, "epoch": 7822} {"train_loss": -28.837858200073242, "global_step": 649291, "epoch": 7822} {"train_loss": -28.0787353515625, "global_step": 649292, "epoch": 7822} {"train_loss": -28.175500869750977, "global_step": 649293, "epoch": 7822} {"train_loss": -28.1651554107666, "global_step": 649294, "epoch": 7822} {"train_loss": -28.145923614501953, "global_step": 649295, "epoch": 7822} {"train_loss": -28.344472885131836, "global_step": 649296, "epoch": 7822} {"train_loss": -27.88081169128418, "global_step": 649297, "epoch": 7822} {"train_loss": -27.98818016052246, "global_step": 649298, "epoch": 7822} {"train_loss": -28.3160343170166, "global_step": 649299, "epoch": 7822} {"train_loss": -28.357257843017578, "global_step": 649300, "epoch": 7822} {"train_loss": -28.27671241760254, "global_step": 649301, "epoch": 7822} {"train_loss": -28.093358993530273, "global_step": 649302, "epoch": 7822} {"train_loss": -27.780029296875, "global_step": 649303, "epoch": 7822} {"train_loss": -27.814167022705078, "global_step": 649304, "epoch": 7822} {"train_loss": -27.745330810546875, "global_step": 649305, "epoch": 7822} {"train_loss": -27.823959350585938, "global_step": 649306, "epoch": 7822} {"train_loss": -28.14023780822754, "global_step": 649307, "epoch": 7822} {"train_loss": -27.74589740799134, "global_step": 649308, "epoch": 7822, "val_loss": 6903783.0} {"train_loss": -27.28789710998535, "global_step": 649309, "epoch": 7823} {"train_loss": -26.3121395111084, "global_step": 649310, "epoch": 7823} {"train_loss": -27.985803604125977, "global_step": 649311, "epoch": 7823} {"train_loss": -26.650854110717773, "global_step": 649312, "epoch": 7823} {"train_loss": -26.266422271728516, "global_step": 649313, "epoch": 7823} {"train_loss": -27.59881019592285, "global_step": 649314, "epoch": 7823} {"train_loss": -27.64397621154785, "global_step": 649315, "epoch": 7823} {"train_loss": -27.485538482666016, "global_step": 649316, "epoch": 7823} {"train_loss": -27.815399169921875, "global_step": 649317, "epoch": 7823} {"train_loss": -27.178333282470703, "global_step": 649318, "epoch": 7823} {"train_loss": -27.121652603149414, "global_step": 649319, "epoch": 7823} {"train_loss": -27.785802841186523, "global_step": 649320, "epoch": 7823} {"train_loss": -27.813064575195312, "global_step": 649321, "epoch": 7823} {"train_loss": -27.36033058166504, "global_step": 649322, "epoch": 7823} {"train_loss": -27.123611450195312, "global_step": 649323, "epoch": 7823} {"train_loss": -27.876907348632812, "global_step": 649324, "epoch": 7823} {"train_loss": -27.629087448120117, "global_step": 649325, "epoch": 7823} {"train_loss": -27.63679313659668, "global_step": 649326, "epoch": 7823} {"train_loss": -27.96844482421875, "global_step": 649327, "epoch": 7823} {"train_loss": -28.268346786499023, "global_step": 649328, "epoch": 7823} {"train_loss": -27.839954376220703, "global_step": 649329, "epoch": 7823} {"train_loss": -28.126691818237305, "global_step": 649330, "epoch": 7823} {"train_loss": -27.796894073486328, "global_step": 649331, "epoch": 7823} {"train_loss": -27.840240478515625, "global_step": 649332, "epoch": 7823} {"train_loss": -28.214340209960938, "global_step": 649333, "epoch": 7823} {"train_loss": -28.59848976135254, "global_step": 649334, "epoch": 7823} {"train_loss": -27.734601974487305, "global_step": 649335, "epoch": 7823} {"train_loss": -28.299222946166992, "global_step": 649336, "epoch": 7823} {"train_loss": -27.868024826049805, "global_step": 649337, "epoch": 7823} {"train_loss": -28.046247482299805, "global_step": 649338, "epoch": 7823} {"train_loss": -28.253080368041992, "global_step": 649339, "epoch": 7823} {"train_loss": -28.106042861938477, "global_step": 649340, "epoch": 7823} {"train_loss": -28.121158599853516, "global_step": 649341, "epoch": 7823} {"train_loss": -28.256240844726562, "global_step": 649342, "epoch": 7823} {"train_loss": -28.411182403564453, "global_step": 649343, "epoch": 7823} {"train_loss": -28.306732177734375, "global_step": 649344, "epoch": 7823} {"train_loss": -28.264022827148438, "global_step": 649345, "epoch": 7823} {"train_loss": -28.198822021484375, "global_step": 649346, "epoch": 7823} {"train_loss": -28.337507247924805, "global_step": 649347, "epoch": 7823} {"train_loss": -28.413455963134766, "global_step": 649348, "epoch": 7823} {"train_loss": -28.577545166015625, "global_step": 649349, "epoch": 7823} {"train_loss": -28.35590934753418, "global_step": 649350, "epoch": 7823} {"train_loss": -28.4642391204834, "global_step": 649351, "epoch": 7823} {"train_loss": -28.5957088470459, "global_step": 649352, "epoch": 7823} {"train_loss": -28.091999053955078, "global_step": 649353, "epoch": 7823} {"train_loss": -28.629932403564453, "global_step": 649354, "epoch": 7823} {"train_loss": -28.680429458618164, "global_step": 649355, "epoch": 7823} {"train_loss": -28.12579345703125, "global_step": 649356, "epoch": 7823} {"train_loss": -28.4383602142334, "global_step": 649357, "epoch": 7823} {"train_loss": -28.115793228149414, "global_step": 649358, "epoch": 7823} {"train_loss": -28.17254638671875, "global_step": 649359, "epoch": 7823} {"train_loss": -28.45315933227539, "global_step": 649360, "epoch": 7823} {"train_loss": -28.267419815063477, "global_step": 649361, "epoch": 7823} {"train_loss": -28.568586349487305, "global_step": 649362, "epoch": 7823} {"train_loss": -28.765913009643555, "global_step": 649363, "epoch": 7823} {"train_loss": -28.07443618774414, "global_step": 649364, "epoch": 7823} {"train_loss": -28.52765464782715, "global_step": 649365, "epoch": 7823} {"train_loss": -28.641820907592773, "global_step": 649366, "epoch": 7823} {"train_loss": -28.217239379882812, "global_step": 649367, "epoch": 7823} {"train_loss": -28.470355987548828, "global_step": 649368, "epoch": 7823} {"train_loss": -28.486083984375, "global_step": 649369, "epoch": 7823} {"train_loss": -28.288373947143555, "global_step": 649370, "epoch": 7823} {"train_loss": -28.23186683654785, "global_step": 649371, "epoch": 7823} {"train_loss": -27.9502010345459, "global_step": 649372, "epoch": 7823} {"train_loss": -28.47771644592285, "global_step": 649373, "epoch": 7823} {"train_loss": -28.02134132385254, "global_step": 649374, "epoch": 7823} {"train_loss": -28.192626953125, "global_step": 649375, "epoch": 7823} {"train_loss": -28.051544189453125, "global_step": 649376, "epoch": 7823} {"train_loss": -27.988473892211914, "global_step": 649377, "epoch": 7823} {"train_loss": -28.290973663330078, "global_step": 649378, "epoch": 7823} {"train_loss": -28.404373168945312, "global_step": 649379, "epoch": 7823} {"train_loss": -27.860509872436523, "global_step": 649380, "epoch": 7823} {"train_loss": -27.58905601501465, "global_step": 649381, "epoch": 7823} {"train_loss": -28.236988067626953, "global_step": 649382, "epoch": 7823} {"train_loss": -28.00864601135254, "global_step": 649383, "epoch": 7823} {"train_loss": -28.443634033203125, "global_step": 649384, "epoch": 7823} {"train_loss": -27.7392635345459, "global_step": 649385, "epoch": 7823} {"train_loss": -27.86750602722168, "global_step": 649386, "epoch": 7823} {"train_loss": -28.0927677154541, "global_step": 649387, "epoch": 7823} {"train_loss": -27.990158081054688, "global_step": 649388, "epoch": 7823} {"train_loss": -27.7945499420166, "global_step": 649389, "epoch": 7823} {"train_loss": -28.428241729736328, "global_step": 649390, "epoch": 7823} {"train_loss": -28.01948397992605, "global_step": 649391, "epoch": 7823, "val_loss": 6861304.5} {"train_loss": -25.83961296081543, "global_step": 649392, "epoch": 7824} {"train_loss": -27.39763832092285, "global_step": 649393, "epoch": 7824} {"train_loss": -27.069141387939453, "global_step": 649394, "epoch": 7824} {"train_loss": -27.402563095092773, "global_step": 649395, "epoch": 7824} {"train_loss": -27.999296188354492, "global_step": 649396, "epoch": 7824} {"train_loss": -27.63054847717285, "global_step": 649397, "epoch": 7824} {"train_loss": -27.143957138061523, "global_step": 649398, "epoch": 7824} {"train_loss": -27.723779678344727, "global_step": 649399, "epoch": 7824} {"train_loss": -27.701629638671875, "global_step": 649400, "epoch": 7824} {"train_loss": -27.87554359436035, "global_step": 649401, "epoch": 7824} {"train_loss": -27.57266616821289, "global_step": 649402, "epoch": 7824} {"train_loss": -27.711271286010742, "global_step": 649403, "epoch": 7824} {"train_loss": -27.967248916625977, "global_step": 649404, "epoch": 7824} {"train_loss": -27.918798446655273, "global_step": 649405, "epoch": 7824} {"train_loss": -27.948657989501953, "global_step": 649406, "epoch": 7824} {"train_loss": -27.981496810913086, "global_step": 649407, "epoch": 7824} {"train_loss": -27.858169555664062, "global_step": 649408, "epoch": 7824} {"train_loss": -27.9567813873291, "global_step": 649409, "epoch": 7824} {"train_loss": -27.997095108032227, "global_step": 649410, "epoch": 7824} {"train_loss": -28.18013572692871, "global_step": 649411, "epoch": 7824} {"train_loss": -28.033374786376953, "global_step": 649412, "epoch": 7824} {"train_loss": -28.200239181518555, "global_step": 649413, "epoch": 7824} {"train_loss": -27.930017471313477, "global_step": 649414, "epoch": 7824} {"train_loss": -28.203641891479492, "global_step": 649415, "epoch": 7824} {"train_loss": -28.11452293395996, "global_step": 649416, "epoch": 7824} {"train_loss": -28.182891845703125, "global_step": 649417, "epoch": 7824} {"train_loss": -27.86530113220215, "global_step": 649418, "epoch": 7824} {"train_loss": -28.15082359313965, "global_step": 649419, "epoch": 7824} {"train_loss": -28.580286026000977, "global_step": 649420, "epoch": 7824} {"train_loss": -28.3465518951416, "global_step": 649421, "epoch": 7824} {"train_loss": -28.14874839782715, "global_step": 649422, "epoch": 7824} {"train_loss": -28.0720272064209, "global_step": 649423, "epoch": 7824} {"train_loss": -28.250579833984375, "global_step": 649424, "epoch": 7824} {"train_loss": -28.671667098999023, "global_step": 649425, "epoch": 7824} {"train_loss": -28.38545036315918, "global_step": 649426, "epoch": 7824} {"train_loss": -28.454742431640625, "global_step": 649427, "epoch": 7824} {"train_loss": -28.238372802734375, "global_step": 649428, "epoch": 7824} {"train_loss": -28.503040313720703, "global_step": 649429, "epoch": 7824} {"train_loss": -28.301441192626953, "global_step": 649430, "epoch": 7824} {"train_loss": -28.004322052001953, "global_step": 649431, "epoch": 7824} {"train_loss": -28.323455810546875, "global_step": 649432, "epoch": 7824} {"train_loss": -28.451765060424805, "global_step": 649433, "epoch": 7824} {"train_loss": -28.314420700073242, "global_step": 649434, "epoch": 7824} {"train_loss": -28.442533493041992, "global_step": 649435, "epoch": 7824} {"train_loss": -28.30072593688965, "global_step": 649436, "epoch": 7824} {"train_loss": -28.010162353515625, "global_step": 649437, "epoch": 7824} {"train_loss": -28.268396377563477, "global_step": 649438, "epoch": 7824} {"train_loss": -28.321561813354492, "global_step": 649439, "epoch": 7824} {"train_loss": -28.11176872253418, "global_step": 649440, "epoch": 7824} {"train_loss": -28.1897029876709, "global_step": 649441, "epoch": 7824} {"train_loss": -28.558673858642578, "global_step": 649442, "epoch": 7824} {"train_loss": -28.211505889892578, "global_step": 649443, "epoch": 7824} {"train_loss": -28.4534912109375, "global_step": 649444, "epoch": 7824} {"train_loss": -28.57581901550293, "global_step": 649445, "epoch": 7824} {"train_loss": -28.60906982421875, "global_step": 649446, "epoch": 7824} {"train_loss": -28.5260009765625, "global_step": 649447, "epoch": 7824} {"train_loss": -28.30793571472168, "global_step": 649448, "epoch": 7824} {"train_loss": -28.58881950378418, "global_step": 649449, "epoch": 7824} {"train_loss": -28.59244155883789, "global_step": 649450, "epoch": 7824} {"train_loss": -28.611780166625977, "global_step": 649451, "epoch": 7824} {"train_loss": -28.5222110748291, "global_step": 649452, "epoch": 7824} {"train_loss": -28.665283203125, "global_step": 649453, "epoch": 7824} {"train_loss": -28.824115753173828, "global_step": 649454, "epoch": 7824} {"train_loss": -28.56516456604004, "global_step": 649455, "epoch": 7824} {"train_loss": -28.684335708618164, "global_step": 649456, "epoch": 7824} {"train_loss": -28.683618545532227, "global_step": 649457, "epoch": 7824} {"train_loss": -28.579208374023438, "global_step": 649458, "epoch": 7824} {"train_loss": -28.617889404296875, "global_step": 649459, "epoch": 7824} {"train_loss": -29.04471778869629, "global_step": 649460, "epoch": 7824} {"train_loss": -28.473249435424805, "global_step": 649461, "epoch": 7824} {"train_loss": -28.549497604370117, "global_step": 649462, "epoch": 7824} {"train_loss": -28.550907135009766, "global_step": 649463, "epoch": 7824} {"train_loss": -28.75257682800293, "global_step": 649464, "epoch": 7824} {"train_loss": -28.3250789642334, "global_step": 649465, "epoch": 7824} {"train_loss": -28.4930419921875, "global_step": 649466, "epoch": 7824} {"train_loss": -28.048297882080078, "global_step": 649467, "epoch": 7824} {"train_loss": -28.423627853393555, "global_step": 649468, "epoch": 7824} {"train_loss": -28.67486000061035, "global_step": 649469, "epoch": 7824} {"train_loss": -28.690967559814453, "global_step": 649470, "epoch": 7824} {"train_loss": -28.465600967407227, "global_step": 649471, "epoch": 7824} {"train_loss": -28.12714195251465, "global_step": 649472, "epoch": 7824} {"train_loss": -27.804840087890625, "global_step": 649473, "epoch": 7824} {"train_loss": -28.202450648847833, "global_step": 649474, "epoch": 7824, "val_loss": 6789781.0} {"train_loss": -27.69660758972168, "global_step": 649475, "epoch": 7825} {"train_loss": -26.898359298706055, "global_step": 649476, "epoch": 7825} {"train_loss": -27.561935424804688, "global_step": 649477, "epoch": 7825} {"train_loss": -27.021581649780273, "global_step": 649478, "epoch": 7825} {"train_loss": -27.23065185546875, "global_step": 649479, "epoch": 7825} {"train_loss": -27.87249183654785, "global_step": 649480, "epoch": 7825} {"train_loss": -27.123977661132812, "global_step": 649481, "epoch": 7825} {"train_loss": -27.649503707885742, "global_step": 649482, "epoch": 7825} {"train_loss": -27.422012329101562, "global_step": 649483, "epoch": 7825} {"train_loss": -27.937042236328125, "global_step": 649484, "epoch": 7825} {"train_loss": -27.431598663330078, "global_step": 649485, "epoch": 7825} {"train_loss": -27.727325439453125, "global_step": 649486, "epoch": 7825} {"train_loss": -27.66983413696289, "global_step": 649487, "epoch": 7825} {"train_loss": -27.662015914916992, "global_step": 649488, "epoch": 7825} {"train_loss": -28.17671775817871, "global_step": 649489, "epoch": 7825} {"train_loss": -27.811681747436523, "global_step": 649490, "epoch": 7825} {"train_loss": -27.821447372436523, "global_step": 649491, "epoch": 7825} {"train_loss": -27.763975143432617, "global_step": 649492, "epoch": 7825} {"train_loss": -27.4984188079834, "global_step": 649493, "epoch": 7825} {"train_loss": -27.98585319519043, "global_step": 649494, "epoch": 7825} {"train_loss": -27.85466957092285, "global_step": 649495, "epoch": 7825} {"train_loss": -27.922821044921875, "global_step": 649496, "epoch": 7825} {"train_loss": -27.924945831298828, "global_step": 649497, "epoch": 7825} {"train_loss": -27.942657470703125, "global_step": 649498, "epoch": 7825} {"train_loss": -27.870389938354492, "global_step": 649499, "epoch": 7825} {"train_loss": -27.958362579345703, "global_step": 649500, "epoch": 7825} {"train_loss": -27.854873657226562, "global_step": 649501, "epoch": 7825} {"train_loss": -28.104990005493164, "global_step": 649502, "epoch": 7825} {"train_loss": -27.946516036987305, "global_step": 649503, "epoch": 7825} {"train_loss": -28.08197021484375, "global_step": 649504, "epoch": 7825} {"train_loss": -28.27804946899414, "global_step": 649505, "epoch": 7825} {"train_loss": -27.822702407836914, "global_step": 649506, "epoch": 7825} {"train_loss": -28.622297286987305, "global_step": 649507, "epoch": 7825} {"train_loss": -28.411701202392578, "global_step": 649508, "epoch": 7825} {"train_loss": -28.122968673706055, "global_step": 649509, "epoch": 7825} {"train_loss": -28.160749435424805, "global_step": 649510, "epoch": 7825} {"train_loss": -28.53118896484375, "global_step": 649511, "epoch": 7825} {"train_loss": -28.568958282470703, "global_step": 649512, "epoch": 7825} {"train_loss": -28.006433486938477, "global_step": 649513, "epoch": 7825} {"train_loss": -28.20688819885254, "global_step": 649514, "epoch": 7825} {"train_loss": -28.290973663330078, "global_step": 649515, "epoch": 7825} {"train_loss": -28.38770866394043, "global_step": 649516, "epoch": 7825} {"train_loss": -28.70112419128418, "global_step": 649517, "epoch": 7825} {"train_loss": -28.77271842956543, "global_step": 649518, "epoch": 7825} {"train_loss": -28.590179443359375, "global_step": 649519, "epoch": 7825} {"train_loss": -28.344587326049805, "global_step": 649520, "epoch": 7825} {"train_loss": -28.4631290435791, "global_step": 649521, "epoch": 7825} {"train_loss": -28.720022201538086, "global_step": 649522, "epoch": 7825} {"train_loss": -28.775653839111328, "global_step": 649523, "epoch": 7825} {"train_loss": -28.555877685546875, "global_step": 649524, "epoch": 7825} {"train_loss": -28.238183975219727, "global_step": 649525, "epoch": 7825} {"train_loss": -28.661848068237305, "global_step": 649526, "epoch": 7825} {"train_loss": -28.24688148498535, "global_step": 649527, "epoch": 7825} {"train_loss": -28.344650268554688, "global_step": 649528, "epoch": 7825} {"train_loss": -28.338605880737305, "global_step": 649529, "epoch": 7825} {"train_loss": -28.60977554321289, "global_step": 649530, "epoch": 7825} {"train_loss": -28.09369468688965, "global_step": 649531, "epoch": 7825} {"train_loss": -28.60405921936035, "global_step": 649532, "epoch": 7825} {"train_loss": -28.51966667175293, "global_step": 649533, "epoch": 7825} {"train_loss": -28.141128540039062, "global_step": 649534, "epoch": 7825} {"train_loss": -28.47150993347168, "global_step": 649535, "epoch": 7825} {"train_loss": -28.289295196533203, "global_step": 649536, "epoch": 7825} {"train_loss": -27.966278076171875, "global_step": 649537, "epoch": 7825} {"train_loss": -28.637075424194336, "global_step": 649538, "epoch": 7825} {"train_loss": -28.575590133666992, "global_step": 649539, "epoch": 7825} {"train_loss": -28.353662490844727, "global_step": 649540, "epoch": 7825} {"train_loss": -28.426794052124023, "global_step": 649541, "epoch": 7825} {"train_loss": -28.59908103942871, "global_step": 649542, "epoch": 7825} {"train_loss": -28.07672691345215, "global_step": 649543, "epoch": 7825} {"train_loss": -28.21746253967285, "global_step": 649544, "epoch": 7825} {"train_loss": -28.011173248291016, "global_step": 649545, "epoch": 7825} {"train_loss": -28.503171920776367, "global_step": 649546, "epoch": 7825} {"train_loss": -28.40087890625, "global_step": 649547, "epoch": 7825} {"train_loss": -28.19892692565918, "global_step": 649548, "epoch": 7825} {"train_loss": -27.79974937438965, "global_step": 649549, "epoch": 7825} {"train_loss": -28.17536735534668, "global_step": 649550, "epoch": 7825} {"train_loss": -28.248510360717773, "global_step": 649551, "epoch": 7825} {"train_loss": -28.557397842407227, "global_step": 649552, "epoch": 7825} {"train_loss": -27.932388305664062, "global_step": 649553, "epoch": 7825} {"train_loss": -27.795175552368164, "global_step": 649554, "epoch": 7825} {"train_loss": -28.184127807617188, "global_step": 649555, "epoch": 7825} {"train_loss": -27.983631134033203, "global_step": 649556, "epoch": 7825} {"train_loss": -28.11275507455849, "global_step": 649557, "epoch": 7825, "val_loss": 6874177.0} {"train_loss": -28.076507568359375, "global_step": 649558, "epoch": 7826} {"train_loss": -27.38416862487793, "global_step": 649559, "epoch": 7826} {"train_loss": -27.668787002563477, "global_step": 649560, "epoch": 7826} {"train_loss": -27.62900733947754, "global_step": 649561, "epoch": 7826} {"train_loss": -27.219451904296875, "global_step": 649562, "epoch": 7826} {"train_loss": -27.40394401550293, "global_step": 649563, "epoch": 7826} {"train_loss": -27.324926376342773, "global_step": 649564, "epoch": 7826} {"train_loss": -27.752668380737305, "global_step": 649565, "epoch": 7826} {"train_loss": -27.132287979125977, "global_step": 649566, "epoch": 7826} {"train_loss": -27.59592628479004, "global_step": 649567, "epoch": 7826} {"train_loss": -27.378477096557617, "global_step": 649568, "epoch": 7826} {"train_loss": -27.81056785583496, "global_step": 649569, "epoch": 7826} {"train_loss": -27.65260124206543, "global_step": 649570, "epoch": 7826} {"train_loss": -27.288928985595703, "global_step": 649571, "epoch": 7826} {"train_loss": -27.587533950805664, "global_step": 649572, "epoch": 7826} {"train_loss": -27.847517013549805, "global_step": 649573, "epoch": 7826} {"train_loss": -28.38053321838379, "global_step": 649574, "epoch": 7826} {"train_loss": -28.04355239868164, "global_step": 649575, "epoch": 7826} {"train_loss": -27.6348819732666, "global_step": 649576, "epoch": 7826} {"train_loss": -27.948211669921875, "global_step": 649577, "epoch": 7826} {"train_loss": -27.94119644165039, "global_step": 649578, "epoch": 7826} {"train_loss": -28.4284725189209, "global_step": 649579, "epoch": 7826} {"train_loss": -28.27862548828125, "global_step": 649580, "epoch": 7826} {"train_loss": -28.568769454956055, "global_step": 649581, "epoch": 7826} {"train_loss": -27.89573097229004, "global_step": 649582, "epoch": 7826} {"train_loss": -28.189916610717773, "global_step": 649583, "epoch": 7826} {"train_loss": -28.220966339111328, "global_step": 649584, "epoch": 7826} {"train_loss": -28.129047393798828, "global_step": 649585, "epoch": 7826} {"train_loss": -28.082096099853516, "global_step": 649586, "epoch": 7826} {"train_loss": -28.191303253173828, "global_step": 649587, "epoch": 7826} {"train_loss": -28.185400009155273, "global_step": 649588, "epoch": 7826} {"train_loss": -28.562057495117188, "global_step": 649589, "epoch": 7826} {"train_loss": -28.4721622467041, "global_step": 649590, "epoch": 7826} {"train_loss": -27.99470329284668, "global_step": 649591, "epoch": 7826} {"train_loss": -28.19813346862793, "global_step": 649592, "epoch": 7826} {"train_loss": -28.61529541015625, "global_step": 649593, "epoch": 7826} {"train_loss": -28.09028434753418, "global_step": 649594, "epoch": 7826} {"train_loss": -28.75418472290039, "global_step": 649595, "epoch": 7826} {"train_loss": -28.415319442749023, "global_step": 649596, "epoch": 7826} {"train_loss": -28.368982315063477, "global_step": 649597, "epoch": 7826} {"train_loss": -28.21832847595215, "global_step": 649598, "epoch": 7826} {"train_loss": -28.45574378967285, "global_step": 649599, "epoch": 7826} {"train_loss": -28.618356704711914, "global_step": 649600, "epoch": 7826} {"train_loss": -28.4959716796875, "global_step": 649601, "epoch": 7826} {"train_loss": -28.579715728759766, "global_step": 649602, "epoch": 7826} {"train_loss": -28.517120361328125, "global_step": 649603, "epoch": 7826} {"train_loss": -28.568220138549805, "global_step": 649604, "epoch": 7826} {"train_loss": -28.566064834594727, "global_step": 649605, "epoch": 7826} {"train_loss": -28.853437423706055, "global_step": 649606, "epoch": 7826} {"train_loss": -28.375762939453125, "global_step": 649607, "epoch": 7826} {"train_loss": -28.61039161682129, "global_step": 649608, "epoch": 7826} {"train_loss": -28.221216201782227, "global_step": 649609, "epoch": 7826} {"train_loss": -28.199766159057617, "global_step": 649610, "epoch": 7826} {"train_loss": -28.572147369384766, "global_step": 649611, "epoch": 7826} {"train_loss": -28.14124870300293, "global_step": 649612, "epoch": 7826} {"train_loss": -28.40537452697754, "global_step": 649613, "epoch": 7826} {"train_loss": -28.288312911987305, "global_step": 649614, "epoch": 7826} {"train_loss": -28.140478134155273, "global_step": 649615, "epoch": 7826} {"train_loss": -28.325063705444336, "global_step": 649616, "epoch": 7826} {"train_loss": -28.298749923706055, "global_step": 649617, "epoch": 7826} {"train_loss": -27.746850967407227, "global_step": 649618, "epoch": 7826} {"train_loss": -27.9669246673584, "global_step": 649619, "epoch": 7826} {"train_loss": -28.608747482299805, "global_step": 649620, "epoch": 7826} {"train_loss": -28.370269775390625, "global_step": 649621, "epoch": 7826} {"train_loss": -28.040979385375977, "global_step": 649622, "epoch": 7826} {"train_loss": -28.33162498474121, "global_step": 649623, "epoch": 7826} {"train_loss": -28.151966094970703, "global_step": 649624, "epoch": 7826} {"train_loss": -28.47292137145996, "global_step": 649625, "epoch": 7826} {"train_loss": -27.959339141845703, "global_step": 649626, "epoch": 7826} {"train_loss": -28.0870418548584, "global_step": 649627, "epoch": 7826} {"train_loss": -27.811767578125, "global_step": 649628, "epoch": 7826} {"train_loss": -28.243030548095703, "global_step": 649629, "epoch": 7826} {"train_loss": -28.54670524597168, "global_step": 649630, "epoch": 7826} {"train_loss": -28.046545028686523, "global_step": 649631, "epoch": 7826} {"train_loss": -27.739530563354492, "global_step": 649632, "epoch": 7826} {"train_loss": -28.423059463500977, "global_step": 649633, "epoch": 7826} {"train_loss": -28.300867080688477, "global_step": 649634, "epoch": 7826} {"train_loss": -27.723546981811523, "global_step": 649635, "epoch": 7826} {"train_loss": -28.11494255065918, "global_step": 649636, "epoch": 7826} {"train_loss": -28.538084030151367, "global_step": 649637, "epoch": 7826} {"train_loss": -28.35963249206543, "global_step": 649638, "epoch": 7826} {"train_loss": -28.0537166595459, "global_step": 649639, "epoch": 7826} {"train_loss": -28.137027349816748, "global_step": 649640, "epoch": 7826, "val_loss": 6778841.5} {"train_loss": -27.435888290405273, "global_step": 649641, "epoch": 7827} {"train_loss": -27.558347702026367, "global_step": 649642, "epoch": 7827} {"train_loss": -28.025068283081055, "global_step": 649643, "epoch": 7827} {"train_loss": -27.847869873046875, "global_step": 649644, "epoch": 7827} {"train_loss": -27.79426383972168, "global_step": 649645, "epoch": 7827} {"train_loss": -27.724191665649414, "global_step": 649646, "epoch": 7827} {"train_loss": -27.40665054321289, "global_step": 649647, "epoch": 7827} {"train_loss": -28.01529884338379, "global_step": 649648, "epoch": 7827} {"train_loss": -27.30739402770996, "global_step": 649649, "epoch": 7827} {"train_loss": -27.235925674438477, "global_step": 649650, "epoch": 7827} {"train_loss": -27.783432006835938, "global_step": 649651, "epoch": 7827} {"train_loss": -27.684650421142578, "global_step": 649652, "epoch": 7827} {"train_loss": -27.908605575561523, "global_step": 649653, "epoch": 7827} {"train_loss": -28.32484245300293, "global_step": 649654, "epoch": 7827} {"train_loss": -28.0389347076416, "global_step": 649655, "epoch": 7827} {"train_loss": -28.38810157775879, "global_step": 649656, "epoch": 7827} {"train_loss": -28.186233520507812, "global_step": 649657, "epoch": 7827} {"train_loss": -28.239337921142578, "global_step": 649658, "epoch": 7827} {"train_loss": -28.459821701049805, "global_step": 649659, "epoch": 7827} {"train_loss": -28.311532974243164, "global_step": 649660, "epoch": 7827} {"train_loss": -28.324365615844727, "global_step": 649661, "epoch": 7827} {"train_loss": -28.135507583618164, "global_step": 649662, "epoch": 7827} {"train_loss": -28.277118682861328, "global_step": 649663, "epoch": 7827} {"train_loss": -28.0545654296875, "global_step": 649664, "epoch": 7827} {"train_loss": -28.181732177734375, "global_step": 649665, "epoch": 7827} {"train_loss": -28.17963981628418, "global_step": 649666, "epoch": 7827} {"train_loss": -28.077960968017578, "global_step": 649667, "epoch": 7827} {"train_loss": -28.283843994140625, "global_step": 649668, "epoch": 7827} {"train_loss": -28.537717819213867, "global_step": 649669, "epoch": 7827} {"train_loss": -28.290136337280273, "global_step": 649670, "epoch": 7827} {"train_loss": -28.407459259033203, "global_step": 649671, "epoch": 7827} {"train_loss": -28.24322509765625, "global_step": 649672, "epoch": 7827} {"train_loss": -28.585803985595703, "global_step": 649673, "epoch": 7827} {"train_loss": -28.249258041381836, "global_step": 649674, "epoch": 7827} {"train_loss": -28.719589233398438, "global_step": 649675, "epoch": 7827} {"train_loss": -28.2149715423584, "global_step": 649676, "epoch": 7827} {"train_loss": -28.183578491210938, "global_step": 649677, "epoch": 7827} {"train_loss": -28.63783836364746, "global_step": 649678, "epoch": 7827} {"train_loss": -28.33962059020996, "global_step": 649679, "epoch": 7827} {"train_loss": -28.256195068359375, "global_step": 649680, "epoch": 7827} {"train_loss": -28.080774307250977, "global_step": 649681, "epoch": 7827} {"train_loss": -28.67386817932129, "global_step": 649682, "epoch": 7827} {"train_loss": -28.137842178344727, "global_step": 649683, "epoch": 7827} {"train_loss": -28.572223663330078, "global_step": 649684, "epoch": 7827} {"train_loss": -28.512454986572266, "global_step": 649685, "epoch": 7827} {"train_loss": -28.59846305847168, "global_step": 649686, "epoch": 7827} {"train_loss": -28.280776977539062, "global_step": 649687, "epoch": 7827} {"train_loss": -28.355905532836914, "global_step": 649688, "epoch": 7827} {"train_loss": -28.42146110534668, "global_step": 649689, "epoch": 7827} {"train_loss": -28.6214599609375, "global_step": 649690, "epoch": 7827} {"train_loss": -28.90833854675293, "global_step": 649691, "epoch": 7827} {"train_loss": -28.485620498657227, "global_step": 649692, "epoch": 7827} {"train_loss": -28.881139755249023, "global_step": 649693, "epoch": 7827} {"train_loss": -28.35382652282715, "global_step": 649694, "epoch": 7827} {"train_loss": -28.28438377380371, "global_step": 649695, "epoch": 7827} {"train_loss": -28.32301139831543, "global_step": 649696, "epoch": 7827} {"train_loss": -28.290851593017578, "global_step": 649697, "epoch": 7827} {"train_loss": -28.105548858642578, "global_step": 649698, "epoch": 7827} {"train_loss": -28.325225830078125, "global_step": 649699, "epoch": 7827} {"train_loss": -28.16861343383789, "global_step": 649700, "epoch": 7827} {"train_loss": -27.850706100463867, "global_step": 649701, "epoch": 7827} {"train_loss": -28.150421142578125, "global_step": 649702, "epoch": 7827} {"train_loss": -28.10955238342285, "global_step": 649703, "epoch": 7827} {"train_loss": -28.290552139282227, "global_step": 649704, "epoch": 7827} {"train_loss": -28.193525314331055, "global_step": 649705, "epoch": 7827} {"train_loss": -28.5484561920166, "global_step": 649706, "epoch": 7827} {"train_loss": -27.79229736328125, "global_step": 649707, "epoch": 7827} {"train_loss": -28.14307975769043, "global_step": 649708, "epoch": 7827} {"train_loss": -28.387792587280273, "global_step": 649709, "epoch": 7827} {"train_loss": -28.379362106323242, "global_step": 649710, "epoch": 7827} {"train_loss": -28.29388427734375, "global_step": 649711, "epoch": 7827} {"train_loss": -28.23890495300293, "global_step": 649712, "epoch": 7827} {"train_loss": -27.970609664916992, "global_step": 649713, "epoch": 7827} {"train_loss": -28.663257598876953, "global_step": 649714, "epoch": 7827} {"train_loss": -28.139062881469727, "global_step": 649715, "epoch": 7827} {"train_loss": -28.624780654907227, "global_step": 649716, "epoch": 7827} {"train_loss": -28.38776969909668, "global_step": 649717, "epoch": 7827} {"train_loss": -28.419660568237305, "global_step": 649718, "epoch": 7827} {"train_loss": -28.518590927124023, "global_step": 649719, "epoch": 7827} {"train_loss": -28.06854820251465, "global_step": 649720, "epoch": 7827} {"train_loss": -28.344709396362305, "global_step": 649721, "epoch": 7827} {"train_loss": -28.4744873046875, "global_step": 649722, "epoch": 7827} {"train_loss": -28.2373665729201, "global_step": 649723, "epoch": 7827, "val_loss": 6807492.5} {"train_loss": -27.7481746673584, "global_step": 649724, "epoch": 7828} {"train_loss": -27.859893798828125, "global_step": 649725, "epoch": 7828} {"train_loss": -28.18915367126465, "global_step": 649726, "epoch": 7828} {"train_loss": -27.753894805908203, "global_step": 649727, "epoch": 7828} {"train_loss": -27.929059982299805, "global_step": 649728, "epoch": 7828} {"train_loss": -27.549047470092773, "global_step": 649729, "epoch": 7828} {"train_loss": -27.774063110351562, "global_step": 649730, "epoch": 7828} {"train_loss": -27.780963897705078, "global_step": 649731, "epoch": 7828} {"train_loss": -27.729711532592773, "global_step": 649732, "epoch": 7828} {"train_loss": -28.14747428894043, "global_step": 649733, "epoch": 7828} {"train_loss": -27.9241886138916, "global_step": 649734, "epoch": 7828} {"train_loss": -28.140857696533203, "global_step": 649735, "epoch": 7828} {"train_loss": -28.111051559448242, "global_step": 649736, "epoch": 7828} {"train_loss": -28.097686767578125, "global_step": 649737, "epoch": 7828} {"train_loss": -28.160175323486328, "global_step": 649738, "epoch": 7828} {"train_loss": -28.045629501342773, "global_step": 649739, "epoch": 7828} {"train_loss": -27.787317276000977, "global_step": 649740, "epoch": 7828} {"train_loss": -27.8487548828125, "global_step": 649741, "epoch": 7828} {"train_loss": -27.662967681884766, "global_step": 649742, "epoch": 7828} {"train_loss": -27.958642959594727, "global_step": 649743, "epoch": 7828} {"train_loss": -28.01783561706543, "global_step": 649744, "epoch": 7828} {"train_loss": -28.044422149658203, "global_step": 649745, "epoch": 7828} {"train_loss": -27.996320724487305, "global_step": 649746, "epoch": 7828} {"train_loss": -27.865625381469727, "global_step": 649747, "epoch": 7828} {"train_loss": -28.488264083862305, "global_step": 649748, "epoch": 7828} {"train_loss": -28.473737716674805, "global_step": 649749, "epoch": 7828} {"train_loss": -28.669301986694336, "global_step": 649750, "epoch": 7828} {"train_loss": -28.462604522705078, "global_step": 649751, "epoch": 7828} {"train_loss": -27.943769454956055, "global_step": 649752, "epoch": 7828} {"train_loss": -28.238147735595703, "global_step": 649753, "epoch": 7828} {"train_loss": -28.200071334838867, "global_step": 649754, "epoch": 7828} {"train_loss": -28.397016525268555, "global_step": 649755, "epoch": 7828} {"train_loss": -28.31048011779785, "global_step": 649756, "epoch": 7828} {"train_loss": -28.42190933227539, "global_step": 649757, "epoch": 7828} {"train_loss": -28.409351348876953, "global_step": 649758, "epoch": 7828} {"train_loss": -28.67047691345215, "global_step": 649759, "epoch": 7828} {"train_loss": -28.313440322875977, "global_step": 649760, "epoch": 7828} {"train_loss": -28.386632919311523, "global_step": 649761, "epoch": 7828} {"train_loss": -28.32221794128418, "global_step": 649762, "epoch": 7828} {"train_loss": -28.097814559936523, "global_step": 649763, "epoch": 7828} {"train_loss": -28.192306518554688, "global_step": 649764, "epoch": 7828} {"train_loss": -28.3457088470459, "global_step": 649765, "epoch": 7828} {"train_loss": -28.42848014831543, "global_step": 649766, "epoch": 7828} {"train_loss": -28.58436393737793, "global_step": 649767, "epoch": 7828} {"train_loss": -28.158599853515625, "global_step": 649768, "epoch": 7828} {"train_loss": -28.50299072265625, "global_step": 649769, "epoch": 7828} {"train_loss": -28.47627067565918, "global_step": 649770, "epoch": 7828} {"train_loss": -27.999298095703125, "global_step": 649771, "epoch": 7828} {"train_loss": -28.266340255737305, "global_step": 649772, "epoch": 7828} {"train_loss": -28.50721549987793, "global_step": 649773, "epoch": 7828} {"train_loss": -28.64688491821289, "global_step": 649774, "epoch": 7828} {"train_loss": -28.5041446685791, "global_step": 649775, "epoch": 7828} {"train_loss": -28.4888858795166, "global_step": 649776, "epoch": 7828} {"train_loss": -28.22004508972168, "global_step": 649777, "epoch": 7828} {"train_loss": -28.416711807250977, "global_step": 649778, "epoch": 7828} {"train_loss": -28.6478328704834, "global_step": 649779, "epoch": 7828} {"train_loss": -28.989648818969727, "global_step": 649780, "epoch": 7828} {"train_loss": -28.5747013092041, "global_step": 649781, "epoch": 7828} {"train_loss": -28.652393341064453, "global_step": 649782, "epoch": 7828} {"train_loss": -28.69502067565918, "global_step": 649783, "epoch": 7828} {"train_loss": -28.33955192565918, "global_step": 649784, "epoch": 7828} {"train_loss": -28.3868350982666, "global_step": 649785, "epoch": 7828} {"train_loss": -28.545917510986328, "global_step": 649786, "epoch": 7828} {"train_loss": -28.672027587890625, "global_step": 649787, "epoch": 7828} {"train_loss": -28.65481948852539, "global_step": 649788, "epoch": 7828} {"train_loss": -28.238239288330078, "global_step": 649789, "epoch": 7828} {"train_loss": -28.66592788696289, "global_step": 649790, "epoch": 7828} {"train_loss": -28.53692054748535, "global_step": 649791, "epoch": 7828} {"train_loss": -28.31402015686035, "global_step": 649792, "epoch": 7828} {"train_loss": -28.283918380737305, "global_step": 649793, "epoch": 7828} {"train_loss": -28.11911392211914, "global_step": 649794, "epoch": 7828} {"train_loss": -28.05291175842285, "global_step": 649795, "epoch": 7828} {"train_loss": -28.48296546936035, "global_step": 649796, "epoch": 7828} {"train_loss": -28.419525146484375, "global_step": 649797, "epoch": 7828} {"train_loss": -28.513959884643555, "global_step": 649798, "epoch": 7828} {"train_loss": -28.709735870361328, "global_step": 649799, "epoch": 7828} {"train_loss": -28.47663688659668, "global_step": 649800, "epoch": 7828} {"train_loss": -27.71099281311035, "global_step": 649801, "epoch": 7828} {"train_loss": -27.602752685546875, "global_step": 649802, "epoch": 7828} {"train_loss": -26.962310791015625, "global_step": 649803, "epoch": 7828} {"train_loss": -26.818572998046875, "global_step": 649804, "epoch": 7828} {"train_loss": -27.090173721313477, "global_step": 649805, "epoch": 7828} {"train_loss": -28.20353344836867, "global_step": 649806, "epoch": 7828, "val_loss": 6850007.5} {"train_loss": -27.865192413330078, "global_step": 649807, "epoch": 7829} {"train_loss": -27.606977462768555, "global_step": 649808, "epoch": 7829} {"train_loss": -27.578235626220703, "global_step": 649809, "epoch": 7829} {"train_loss": -27.6790771484375, "global_step": 649810, "epoch": 7829} {"train_loss": -27.581933975219727, "global_step": 649811, "epoch": 7829} {"train_loss": -27.870222091674805, "global_step": 649812, "epoch": 7829} {"train_loss": -27.38799476623535, "global_step": 649813, "epoch": 7829} {"train_loss": -27.840524673461914, "global_step": 649814, "epoch": 7829} {"train_loss": -27.56512451171875, "global_step": 649815, "epoch": 7829} {"train_loss": -27.62018394470215, "global_step": 649816, "epoch": 7829} {"train_loss": -27.62619972229004, "global_step": 649817, "epoch": 7829} {"train_loss": -28.18646240234375, "global_step": 649818, "epoch": 7829} {"train_loss": -27.73884391784668, "global_step": 649819, "epoch": 7829} {"train_loss": -28.06037712097168, "global_step": 649820, "epoch": 7829} {"train_loss": -27.74098014831543, "global_step": 649821, "epoch": 7829} {"train_loss": -28.142200469970703, "global_step": 649822, "epoch": 7829} {"train_loss": -27.854022979736328, "global_step": 649823, "epoch": 7829} {"train_loss": -28.02899742126465, "global_step": 649824, "epoch": 7829} {"train_loss": -27.917551040649414, "global_step": 649825, "epoch": 7829} {"train_loss": -27.883514404296875, "global_step": 649826, "epoch": 7829} {"train_loss": -27.87114906311035, "global_step": 649827, "epoch": 7829} {"train_loss": -28.002222061157227, "global_step": 649828, "epoch": 7829} {"train_loss": -28.169158935546875, "global_step": 649829, "epoch": 7829} {"train_loss": -28.484785079956055, "global_step": 649830, "epoch": 7829} {"train_loss": -28.17302894592285, "global_step": 649831, "epoch": 7829} {"train_loss": -27.78143882751465, "global_step": 649832, "epoch": 7829} {"train_loss": -28.38698387145996, "global_step": 649833, "epoch": 7829} {"train_loss": -27.915510177612305, "global_step": 649834, "epoch": 7829} {"train_loss": -28.405487060546875, "global_step": 649835, "epoch": 7829} {"train_loss": -28.291868209838867, "global_step": 649836, "epoch": 7829} {"train_loss": -28.323209762573242, "global_step": 649837, "epoch": 7829} {"train_loss": -28.262739181518555, "global_step": 649838, "epoch": 7829} {"train_loss": -28.058027267456055, "global_step": 649839, "epoch": 7829} {"train_loss": -28.415246963500977, "global_step": 649840, "epoch": 7829} {"train_loss": -28.311033248901367, "global_step": 649841, "epoch": 7829} {"train_loss": -28.32647132873535, "global_step": 649842, "epoch": 7829} {"train_loss": -27.896780014038086, "global_step": 649843, "epoch": 7829} {"train_loss": -28.093847274780273, "global_step": 649844, "epoch": 7829} {"train_loss": -28.36676025390625, "global_step": 649845, "epoch": 7829} {"train_loss": -28.364973068237305, "global_step": 649846, "epoch": 7829} {"train_loss": -28.538806915283203, "global_step": 649847, "epoch": 7829} {"train_loss": -28.51911735534668, "global_step": 649848, "epoch": 7829} {"train_loss": -28.38556480407715, "global_step": 649849, "epoch": 7829} {"train_loss": -28.432584762573242, "global_step": 649850, "epoch": 7829} {"train_loss": -28.28545570373535, "global_step": 649851, "epoch": 7829} {"train_loss": -28.303979873657227, "global_step": 649852, "epoch": 7829} {"train_loss": -28.242460250854492, "global_step": 649853, "epoch": 7829} {"train_loss": -28.48237419128418, "global_step": 649854, "epoch": 7829} {"train_loss": -28.631811141967773, "global_step": 649855, "epoch": 7829} {"train_loss": -28.35292625427246, "global_step": 649856, "epoch": 7829} {"train_loss": -27.846044540405273, "global_step": 649857, "epoch": 7829} {"train_loss": -28.255542755126953, "global_step": 649858, "epoch": 7829} {"train_loss": -28.08867835998535, "global_step": 649859, "epoch": 7829} {"train_loss": -28.592641830444336, "global_step": 649860, "epoch": 7829} {"train_loss": -28.465534210205078, "global_step": 649861, "epoch": 7829} {"train_loss": -28.195484161376953, "global_step": 649862, "epoch": 7829} {"train_loss": -28.1279239654541, "global_step": 649863, "epoch": 7829} {"train_loss": -28.035531997680664, "global_step": 649864, "epoch": 7829} {"train_loss": -28.360797882080078, "global_step": 649865, "epoch": 7829} {"train_loss": -27.787109375, "global_step": 649866, "epoch": 7829} {"train_loss": -28.174158096313477, "global_step": 649867, "epoch": 7829} {"train_loss": -28.35749626159668, "global_step": 649868, "epoch": 7829} {"train_loss": -28.36439323425293, "global_step": 649869, "epoch": 7829} {"train_loss": -27.8636474609375, "global_step": 649870, "epoch": 7829} {"train_loss": -28.06292152404785, "global_step": 649871, "epoch": 7829} {"train_loss": -28.183759689331055, "global_step": 649872, "epoch": 7829} {"train_loss": -28.010610580444336, "global_step": 649873, "epoch": 7829} {"train_loss": -28.035343170166016, "global_step": 649874, "epoch": 7829} {"train_loss": -28.16839599609375, "global_step": 649875, "epoch": 7829} {"train_loss": -28.076099395751953, "global_step": 649876, "epoch": 7829} {"train_loss": -27.86395263671875, "global_step": 649877, "epoch": 7829} {"train_loss": -27.15168571472168, "global_step": 649878, "epoch": 7829} {"train_loss": -27.507373809814453, "global_step": 649879, "epoch": 7829} {"train_loss": -27.877334594726562, "global_step": 649880, "epoch": 7829} {"train_loss": -28.352354049682617, "global_step": 649881, "epoch": 7829} {"train_loss": -27.232086181640625, "global_step": 649882, "epoch": 7829} {"train_loss": -27.90485191345215, "global_step": 649883, "epoch": 7829} {"train_loss": -28.10418701171875, "global_step": 649884, "epoch": 7829} {"train_loss": -27.838464736938477, "global_step": 649885, "epoch": 7829} {"train_loss": -28.33527946472168, "global_step": 649886, "epoch": 7829} {"train_loss": -28.154682159423828, "global_step": 649887, "epoch": 7829} {"train_loss": -28.0511417388916, "global_step": 649888, "epoch": 7829} {"train_loss": -28.070379624883813, "global_step": 649889, "epoch": 7829, "val_loss": 6841553.5} {"train_loss": -27.892868041992188, "global_step": 649890, "epoch": 7830} {"train_loss": -26.825910568237305, "global_step": 649891, "epoch": 7830} {"train_loss": -28.0212345123291, "global_step": 649892, "epoch": 7830} {"train_loss": -27.64881706237793, "global_step": 649893, "epoch": 7830} {"train_loss": -27.692031860351562, "global_step": 649894, "epoch": 7830} {"train_loss": -27.798694610595703, "global_step": 649895, "epoch": 7830} {"train_loss": -27.45050048828125, "global_step": 649896, "epoch": 7830} {"train_loss": -28.291715621948242, "global_step": 649897, "epoch": 7830} {"train_loss": -27.37017250061035, "global_step": 649898, "epoch": 7830} {"train_loss": -27.984365463256836, "global_step": 649899, "epoch": 7830} {"train_loss": -27.63665199279785, "global_step": 649900, "epoch": 7830} {"train_loss": -27.990753173828125, "global_step": 649901, "epoch": 7830} {"train_loss": -27.8697509765625, "global_step": 649902, "epoch": 7830} {"train_loss": -28.179616928100586, "global_step": 649903, "epoch": 7830} {"train_loss": -28.2650203704834, "global_step": 649904, "epoch": 7830} {"train_loss": -27.936920166015625, "global_step": 649905, "epoch": 7830} {"train_loss": -28.235761642456055, "global_step": 649906, "epoch": 7830} {"train_loss": -28.165674209594727, "global_step": 649907, "epoch": 7830} {"train_loss": -28.007770538330078, "global_step": 649908, "epoch": 7830} {"train_loss": -28.25006675720215, "global_step": 649909, "epoch": 7830} {"train_loss": -28.039722442626953, "global_step": 649910, "epoch": 7830} {"train_loss": -28.141223907470703, "global_step": 649911, "epoch": 7830} {"train_loss": -28.31494140625, "global_step": 649912, "epoch": 7830} {"train_loss": -28.467966079711914, "global_step": 649913, "epoch": 7830} {"train_loss": -28.448333740234375, "global_step": 649914, "epoch": 7830} {"train_loss": -28.370222091674805, "global_step": 649915, "epoch": 7830} {"train_loss": -28.022558212280273, "global_step": 649916, "epoch": 7830} {"train_loss": -28.6594181060791, "global_step": 649917, "epoch": 7830} {"train_loss": -27.922672271728516, "global_step": 649918, "epoch": 7830} {"train_loss": -28.238046646118164, "global_step": 649919, "epoch": 7830} {"train_loss": -28.57553482055664, "global_step": 649920, "epoch": 7830} {"train_loss": -28.215946197509766, "global_step": 649921, "epoch": 7830} {"train_loss": -28.446813583374023, "global_step": 649922, "epoch": 7830} {"train_loss": -28.331085205078125, "global_step": 649923, "epoch": 7830} {"train_loss": -27.946826934814453, "global_step": 649924, "epoch": 7830} {"train_loss": -28.4296875, "global_step": 649925, "epoch": 7830} {"train_loss": -28.686920166015625, "global_step": 649926, "epoch": 7830} {"train_loss": -28.515613555908203, "global_step": 649927, "epoch": 7830} {"train_loss": -28.795612335205078, "global_step": 649928, "epoch": 7830} {"train_loss": -28.483856201171875, "global_step": 649929, "epoch": 7830} {"train_loss": -27.992223739624023, "global_step": 649930, "epoch": 7830} {"train_loss": -28.231739044189453, "global_step": 649931, "epoch": 7830} {"train_loss": -28.47462272644043, "global_step": 649932, "epoch": 7830} {"train_loss": -28.256961822509766, "global_step": 649933, "epoch": 7830} {"train_loss": -28.47254753112793, "global_step": 649934, "epoch": 7830} {"train_loss": -27.966928482055664, "global_step": 649935, "epoch": 7830} {"train_loss": -28.33204460144043, "global_step": 649936, "epoch": 7830} {"train_loss": -28.643136978149414, "global_step": 649937, "epoch": 7830} {"train_loss": -28.251989364624023, "global_step": 649938, "epoch": 7830} {"train_loss": -28.287628173828125, "global_step": 649939, "epoch": 7830} {"train_loss": -28.246381759643555, "global_step": 649940, "epoch": 7830} {"train_loss": -28.12946891784668, "global_step": 649941, "epoch": 7830} {"train_loss": -28.11395263671875, "global_step": 649942, "epoch": 7830} {"train_loss": -28.28449058532715, "global_step": 649943, "epoch": 7830} {"train_loss": -28.31330680847168, "global_step": 649944, "epoch": 7830} {"train_loss": -28.502948760986328, "global_step": 649945, "epoch": 7830} {"train_loss": -28.43044090270996, "global_step": 649946, "epoch": 7830} {"train_loss": -28.089380264282227, "global_step": 649947, "epoch": 7830} {"train_loss": -28.113494873046875, "global_step": 649948, "epoch": 7830} {"train_loss": -28.207548141479492, "global_step": 649949, "epoch": 7830} {"train_loss": -28.4714298248291, "global_step": 649950, "epoch": 7830} {"train_loss": -28.554025650024414, "global_step": 649951, "epoch": 7830} {"train_loss": -28.456640243530273, "global_step": 649952, "epoch": 7830} {"train_loss": -28.51810646057129, "global_step": 649953, "epoch": 7830} {"train_loss": -28.657922744750977, "global_step": 649954, "epoch": 7830} {"train_loss": -28.5572566986084, "global_step": 649955, "epoch": 7830} {"train_loss": -28.698013305664062, "global_step": 649956, "epoch": 7830} {"train_loss": -28.236032485961914, "global_step": 649957, "epoch": 7830} {"train_loss": -28.511625289916992, "global_step": 649958, "epoch": 7830} {"train_loss": -28.707202911376953, "global_step": 649959, "epoch": 7830} {"train_loss": -28.3908634185791, "global_step": 649960, "epoch": 7830} {"train_loss": -28.59647560119629, "global_step": 649961, "epoch": 7830} {"train_loss": -29.070098876953125, "global_step": 649962, "epoch": 7830} {"train_loss": -28.447296142578125, "global_step": 649963, "epoch": 7830} {"train_loss": -28.216028213500977, "global_step": 649964, "epoch": 7830} {"train_loss": -28.27655029296875, "global_step": 649965, "epoch": 7830} {"train_loss": -28.239683151245117, "global_step": 649966, "epoch": 7830} {"train_loss": -28.39238929748535, "global_step": 649967, "epoch": 7830} {"train_loss": -28.617115020751953, "global_step": 649968, "epoch": 7830} {"train_loss": -27.906885147094727, "global_step": 649969, "epoch": 7830} {"train_loss": -27.5460205078125, "global_step": 649970, "epoch": 7830} {"train_loss": -28.3988094329834, "global_step": 649971, "epoch": 7830} {"train_loss": -28.238931701843995, "global_step": 649972, "epoch": 7830, "val_loss": 6861698.0} {"train_loss": -27.838239669799805, "global_step": 649973, "epoch": 7831} {"train_loss": -27.284515380859375, "global_step": 649974, "epoch": 7831} {"train_loss": -26.791278839111328, "global_step": 649975, "epoch": 7831} {"train_loss": -25.758197784423828, "global_step": 649976, "epoch": 7831} {"train_loss": -24.02399253845215, "global_step": 649977, "epoch": 7831} {"train_loss": -24.856225967407227, "global_step": 649978, "epoch": 7831} {"train_loss": -27.9036865234375, "global_step": 649979, "epoch": 7831} {"train_loss": -26.447647094726562, "global_step": 649980, "epoch": 7831} {"train_loss": -27.961933135986328, "global_step": 649981, "epoch": 7831} {"train_loss": -27.093835830688477, "global_step": 649982, "epoch": 7831} {"train_loss": -27.32073402404785, "global_step": 649983, "epoch": 7831} {"train_loss": -27.09187889099121, "global_step": 649984, "epoch": 7831} {"train_loss": -27.4687442779541, "global_step": 649985, "epoch": 7831} {"train_loss": -27.57301139831543, "global_step": 649986, "epoch": 7831} {"train_loss": -27.361181259155273, "global_step": 649987, "epoch": 7831} {"train_loss": -27.85599136352539, "global_step": 649988, "epoch": 7831} {"train_loss": -27.477506637573242, "global_step": 649989, "epoch": 7831} {"train_loss": -27.699176788330078, "global_step": 649990, "epoch": 7831} {"train_loss": -27.82988929748535, "global_step": 649991, "epoch": 7831} {"train_loss": -27.792724609375, "global_step": 649992, "epoch": 7831} {"train_loss": -28.099227905273438, "global_step": 649993, "epoch": 7831} {"train_loss": -28.201583862304688, "global_step": 649994, "epoch": 7831} {"train_loss": -27.92746353149414, "global_step": 649995, "epoch": 7831} {"train_loss": -27.9517765045166, "global_step": 649996, "epoch": 7831} {"train_loss": -28.1157283782959, "global_step": 649997, "epoch": 7831} {"train_loss": -27.978031158447266, "global_step": 649998, "epoch": 7831} {"train_loss": -28.052091598510742, "global_step": 649999, "epoch": 7831} {"train_loss": -28.042285919189453, "global_step": 650000, "epoch": 7831} {"train_loss": -28.237411499023438, "global_step": 650001, "epoch": 7831} {"train_loss": -28.487451553344727, "global_step": 650002, "epoch": 7831} {"train_loss": -28.4053897857666, "global_step": 650003, "epoch": 7831} {"train_loss": -28.536359786987305, "global_step": 650004, "epoch": 7831} {"train_loss": -28.0997257232666, "global_step": 650005, "epoch": 7831} {"train_loss": -28.35805320739746, "global_step": 650006, "epoch": 7831} {"train_loss": -27.80085563659668, "global_step": 650007, "epoch": 7831} {"train_loss": -28.196149826049805, "global_step": 650008, "epoch": 7831} {"train_loss": -27.875280380249023, "global_step": 650009, "epoch": 7831} {"train_loss": -28.642688751220703, "global_step": 650010, "epoch": 7831} {"train_loss": -27.88338279724121, "global_step": 650011, "epoch": 7831} {"train_loss": -28.517303466796875, "global_step": 650012, "epoch": 7831} {"train_loss": -28.707950592041016, "global_step": 650013, "epoch": 7831} {"train_loss": -28.0115909576416, "global_step": 650014, "epoch": 7831} {"train_loss": -27.78964614868164, "global_step": 650015, "epoch": 7831} {"train_loss": -28.69061851501465, "global_step": 650016, "epoch": 7831} {"train_loss": -28.274824142456055, "global_step": 650017, "epoch": 7831} {"train_loss": -28.314208984375, "global_step": 650018, "epoch": 7831} {"train_loss": -28.120044708251953, "global_step": 650019, "epoch": 7831} {"train_loss": -28.42542839050293, "global_step": 650020, "epoch": 7831} {"train_loss": -28.40242576599121, "global_step": 650021, "epoch": 7831} {"train_loss": -27.926441192626953, "global_step": 650022, "epoch": 7831} {"train_loss": -27.993497848510742, "global_step": 650023, "epoch": 7831} {"train_loss": -27.984582901000977, "global_step": 650024, "epoch": 7831} {"train_loss": -28.116621017456055, "global_step": 650025, "epoch": 7831} {"train_loss": -28.4335880279541, "global_step": 650026, "epoch": 7831} {"train_loss": -28.210052490234375, "global_step": 650027, "epoch": 7831} {"train_loss": -28.25079917907715, "global_step": 650028, "epoch": 7831} {"train_loss": -28.323423385620117, "global_step": 650029, "epoch": 7831} {"train_loss": -28.58762550354004, "global_step": 650030, "epoch": 7831} {"train_loss": -28.365345001220703, "global_step": 650031, "epoch": 7831} {"train_loss": -28.080453872680664, "global_step": 650032, "epoch": 7831} {"train_loss": -28.374929428100586, "global_step": 650033, "epoch": 7831} {"train_loss": -28.210901260375977, "global_step": 650034, "epoch": 7831} {"train_loss": -28.18731117248535, "global_step": 650035, "epoch": 7831} {"train_loss": -27.957067489624023, "global_step": 650036, "epoch": 7831} {"train_loss": -27.87801170349121, "global_step": 650037, "epoch": 7831} {"train_loss": -27.514646530151367, "global_step": 650038, "epoch": 7831} {"train_loss": -27.910375595092773, "global_step": 650039, "epoch": 7831} {"train_loss": -28.39423179626465, "global_step": 650040, "epoch": 7831} {"train_loss": -28.60928726196289, "global_step": 650041, "epoch": 7831} {"train_loss": -28.551244735717773, "global_step": 650042, "epoch": 7831} {"train_loss": -28.09137535095215, "global_step": 650043, "epoch": 7831} {"train_loss": -28.379749298095703, "global_step": 650044, "epoch": 7831} {"train_loss": -28.593835830688477, "global_step": 650045, "epoch": 7831} {"train_loss": -28.497482299804688, "global_step": 650046, "epoch": 7831} {"train_loss": -28.34071159362793, "global_step": 650047, "epoch": 7831} {"train_loss": -28.51792335510254, "global_step": 650048, "epoch": 7831} {"train_loss": -28.6218318939209, "global_step": 650049, "epoch": 7831} {"train_loss": -28.46697425842285, "global_step": 650050, "epoch": 7831} {"train_loss": -28.518171310424805, "global_step": 650051, "epoch": 7831} {"train_loss": -28.481494903564453, "global_step": 650052, "epoch": 7831} {"train_loss": -28.2717342376709, "global_step": 650053, "epoch": 7831} {"train_loss": -28.64117431640625, "global_step": 650054, "epoch": 7831} {"train_loss": -27.98797634998, "global_step": 650055, "epoch": 7831, "val_loss": 6865006.0} {"train_loss": -27.52796745300293, "global_step": 650056, "epoch": 7832} {"train_loss": -27.885282516479492, "global_step": 650057, "epoch": 7832} {"train_loss": -27.97258949279785, "global_step": 650058, "epoch": 7832} {"train_loss": -27.72507095336914, "global_step": 650059, "epoch": 7832} {"train_loss": -28.111642837524414, "global_step": 650060, "epoch": 7832} {"train_loss": -27.976720809936523, "global_step": 650061, "epoch": 7832} {"train_loss": -27.950754165649414, "global_step": 650062, "epoch": 7832} {"train_loss": -28.312437057495117, "global_step": 650063, "epoch": 7832} {"train_loss": -28.04750633239746, "global_step": 650064, "epoch": 7832} {"train_loss": -28.034276962280273, "global_step": 650065, "epoch": 7832} {"train_loss": -27.94182777404785, "global_step": 650066, "epoch": 7832} {"train_loss": -27.724140167236328, "global_step": 650067, "epoch": 7832} {"train_loss": -28.419387817382812, "global_step": 650068, "epoch": 7832} {"train_loss": -28.37898063659668, "global_step": 650069, "epoch": 7832} {"train_loss": -28.218402862548828, "global_step": 650070, "epoch": 7832} {"train_loss": -27.672698974609375, "global_step": 650071, "epoch": 7832} {"train_loss": -28.379186630249023, "global_step": 650072, "epoch": 7832} {"train_loss": -28.374862670898438, "global_step": 650073, "epoch": 7832} {"train_loss": -27.995197296142578, "global_step": 650074, "epoch": 7832} {"train_loss": -28.37517738342285, "global_step": 650075, "epoch": 7832} {"train_loss": -28.22566795349121, "global_step": 650076, "epoch": 7832} {"train_loss": -27.869314193725586, "global_step": 650077, "epoch": 7832} {"train_loss": -28.15821647644043, "global_step": 650078, "epoch": 7832} {"train_loss": -28.221927642822266, "global_step": 650079, "epoch": 7832} {"train_loss": -28.302093505859375, "global_step": 650080, "epoch": 7832} {"train_loss": -28.27382469177246, "global_step": 650081, "epoch": 7832} {"train_loss": -27.910215377807617, "global_step": 650082, "epoch": 7832} {"train_loss": -28.44754981994629, "global_step": 650083, "epoch": 7832} {"train_loss": -28.182241439819336, "global_step": 650084, "epoch": 7832} {"train_loss": -27.57282066345215, "global_step": 650085, "epoch": 7832} {"train_loss": -28.232450485229492, "global_step": 650086, "epoch": 7832} {"train_loss": -28.505151748657227, "global_step": 650087, "epoch": 7832} {"train_loss": -28.194442749023438, "global_step": 650088, "epoch": 7832} {"train_loss": -28.247787475585938, "global_step": 650089, "epoch": 7832} {"train_loss": -28.257343292236328, "global_step": 650090, "epoch": 7832} {"train_loss": -28.4636287689209, "global_step": 650091, "epoch": 7832} {"train_loss": -28.301733016967773, "global_step": 650092, "epoch": 7832} {"train_loss": -28.268667221069336, "global_step": 650093, "epoch": 7832} {"train_loss": -28.702056884765625, "global_step": 650094, "epoch": 7832} {"train_loss": -28.64162254333496, "global_step": 650095, "epoch": 7832} {"train_loss": -28.488447189331055, "global_step": 650096, "epoch": 7832} {"train_loss": -28.286752700805664, "global_step": 650097, "epoch": 7832} {"train_loss": -28.08734703063965, "global_step": 650098, "epoch": 7832} {"train_loss": -28.678892135620117, "global_step": 650099, "epoch": 7832} {"train_loss": -28.521780014038086, "global_step": 650100, "epoch": 7832} {"train_loss": -28.505956649780273, "global_step": 650101, "epoch": 7832} {"train_loss": -28.559457778930664, "global_step": 650102, "epoch": 7832} {"train_loss": -28.275075912475586, "global_step": 650103, "epoch": 7832} {"train_loss": -28.470701217651367, "global_step": 650104, "epoch": 7832} {"train_loss": -28.65561866760254, "global_step": 650105, "epoch": 7832} {"train_loss": -28.21064567565918, "global_step": 650106, "epoch": 7832} {"train_loss": -28.447744369506836, "global_step": 650107, "epoch": 7832} {"train_loss": -28.662748336791992, "global_step": 650108, "epoch": 7832} {"train_loss": -28.49470329284668, "global_step": 650109, "epoch": 7832} {"train_loss": -28.440393447875977, "global_step": 650110, "epoch": 7832} {"train_loss": -28.52178382873535, "global_step": 650111, "epoch": 7832} {"train_loss": -28.87775230407715, "global_step": 650112, "epoch": 7832} {"train_loss": -28.608051300048828, "global_step": 650113, "epoch": 7832} {"train_loss": -28.30954933166504, "global_step": 650114, "epoch": 7832} {"train_loss": -28.1276798248291, "global_step": 650115, "epoch": 7832} {"train_loss": -28.105981826782227, "global_step": 650116, "epoch": 7832} {"train_loss": -28.430952072143555, "global_step": 650117, "epoch": 7832} {"train_loss": -28.395517349243164, "global_step": 650118, "epoch": 7832} {"train_loss": -28.599348068237305, "global_step": 650119, "epoch": 7832} {"train_loss": -28.451013565063477, "global_step": 650120, "epoch": 7832} {"train_loss": -28.40576171875, "global_step": 650121, "epoch": 7832} {"train_loss": -28.0887508392334, "global_step": 650122, "epoch": 7832} {"train_loss": -27.87058448791504, "global_step": 650123, "epoch": 7832} {"train_loss": -28.45163917541504, "global_step": 650124, "epoch": 7832} {"train_loss": -28.359638214111328, "global_step": 650125, "epoch": 7832} {"train_loss": -28.0904541015625, "global_step": 650126, "epoch": 7832} {"train_loss": -28.17352294921875, "global_step": 650127, "epoch": 7832} {"train_loss": -28.13394546508789, "global_step": 650128, "epoch": 7832} {"train_loss": -28.52410316467285, "global_step": 650129, "epoch": 7832} {"train_loss": -27.75113296508789, "global_step": 650130, "epoch": 7832} {"train_loss": -27.712865829467773, "global_step": 650131, "epoch": 7832} {"train_loss": -27.931848526000977, "global_step": 650132, "epoch": 7832} {"train_loss": -28.257246017456055, "global_step": 650133, "epoch": 7832} {"train_loss": -28.494653701782227, "global_step": 650134, "epoch": 7832} {"train_loss": -28.38701820373535, "global_step": 650135, "epoch": 7832} {"train_loss": -28.319656372070312, "global_step": 650136, "epoch": 7832} {"train_loss": -28.543121337890625, "global_step": 650137, "epoch": 7832} {"train_loss": -28.265940195106598, "global_step": 650138, "epoch": 7832, "val_loss": 6753242.0} {"train_loss": -25.43055534362793, "global_step": 650139, "epoch": 7833} {"train_loss": -27.11627769470215, "global_step": 650140, "epoch": 7833} {"train_loss": -26.7147216796875, "global_step": 650141, "epoch": 7833} {"train_loss": -26.50594139099121, "global_step": 650142, "epoch": 7833} {"train_loss": -27.097412109375, "global_step": 650143, "epoch": 7833} {"train_loss": -26.75528907775879, "global_step": 650144, "epoch": 7833} {"train_loss": -26.611114501953125, "global_step": 650145, "epoch": 7833} {"train_loss": -27.269861221313477, "global_step": 650146, "epoch": 7833} {"train_loss": -27.095230102539062, "global_step": 650147, "epoch": 7833} {"train_loss": -26.771717071533203, "global_step": 650148, "epoch": 7833} {"train_loss": -27.217803955078125, "global_step": 650149, "epoch": 7833} {"train_loss": -27.62152671813965, "global_step": 650150, "epoch": 7833} {"train_loss": -27.29658317565918, "global_step": 650151, "epoch": 7833} {"train_loss": -27.351001739501953, "global_step": 650152, "epoch": 7833} {"train_loss": -27.611120223999023, "global_step": 650153, "epoch": 7833} {"train_loss": -27.7490291595459, "global_step": 650154, "epoch": 7833} {"train_loss": -27.58660888671875, "global_step": 650155, "epoch": 7833} {"train_loss": -27.7186222076416, "global_step": 650156, "epoch": 7833} {"train_loss": -27.8254337310791, "global_step": 650157, "epoch": 7833} {"train_loss": -27.454208374023438, "global_step": 650158, "epoch": 7833} {"train_loss": -27.390213012695312, "global_step": 650159, "epoch": 7833} {"train_loss": -27.593799591064453, "global_step": 650160, "epoch": 7833} {"train_loss": -27.7626953125, "global_step": 650161, "epoch": 7833} {"train_loss": -27.654394149780273, "global_step": 650162, "epoch": 7833} {"train_loss": -27.940021514892578, "global_step": 650163, "epoch": 7833} {"train_loss": -27.70760154724121, "global_step": 650164, "epoch": 7833} {"train_loss": -27.987890243530273, "global_step": 650165, "epoch": 7833} {"train_loss": -27.9954776763916, "global_step": 650166, "epoch": 7833} {"train_loss": -27.7679443359375, "global_step": 650167, "epoch": 7833} {"train_loss": -27.82269287109375, "global_step": 650168, "epoch": 7833} {"train_loss": -27.913557052612305, "global_step": 650169, "epoch": 7833} {"train_loss": -27.88221549987793, "global_step": 650170, "epoch": 7833} {"train_loss": -28.113391876220703, "global_step": 650171, "epoch": 7833} {"train_loss": -28.120574951171875, "global_step": 650172, "epoch": 7833} {"train_loss": -27.990949630737305, "global_step": 650173, "epoch": 7833} {"train_loss": -28.130056381225586, "global_step": 650174, "epoch": 7833} {"train_loss": -28.2004451751709, "global_step": 650175, "epoch": 7833} {"train_loss": -28.31598472595215, "global_step": 650176, "epoch": 7833} {"train_loss": -28.28325843811035, "global_step": 650177, "epoch": 7833} {"train_loss": -28.03156089782715, "global_step": 650178, "epoch": 7833} {"train_loss": -28.289880752563477, "global_step": 650179, "epoch": 7833} {"train_loss": -28.3980655670166, "global_step": 650180, "epoch": 7833} {"train_loss": -28.404376983642578, "global_step": 650181, "epoch": 7833} {"train_loss": -28.562910079956055, "global_step": 650182, "epoch": 7833} {"train_loss": -28.40167236328125, "global_step": 650183, "epoch": 7833} {"train_loss": -28.331348419189453, "global_step": 650184, "epoch": 7833} {"train_loss": -28.32671546936035, "global_step": 650185, "epoch": 7833} {"train_loss": -28.490392684936523, "global_step": 650186, "epoch": 7833} {"train_loss": -28.185754776000977, "global_step": 650187, "epoch": 7833} {"train_loss": -28.23773765563965, "global_step": 650188, "epoch": 7833} {"train_loss": -28.126708984375, "global_step": 650189, "epoch": 7833} {"train_loss": -28.05384635925293, "global_step": 650190, "epoch": 7833} {"train_loss": -28.248456954956055, "global_step": 650191, "epoch": 7833} {"train_loss": -28.493335723876953, "global_step": 650192, "epoch": 7833} {"train_loss": -28.130889892578125, "global_step": 650193, "epoch": 7833} {"train_loss": -28.310041427612305, "global_step": 650194, "epoch": 7833} {"train_loss": -28.370508193969727, "global_step": 650195, "epoch": 7833} {"train_loss": -28.20954704284668, "global_step": 650196, "epoch": 7833} {"train_loss": -28.472675323486328, "global_step": 650197, "epoch": 7833} {"train_loss": -28.329923629760742, "global_step": 650198, "epoch": 7833} {"train_loss": -28.194812774658203, "global_step": 650199, "epoch": 7833} {"train_loss": -28.670215606689453, "global_step": 650200, "epoch": 7833} {"train_loss": -28.54645347595215, "global_step": 650201, "epoch": 7833} {"train_loss": -28.069412231445312, "global_step": 650202, "epoch": 7833} {"train_loss": -28.144269943237305, "global_step": 650203, "epoch": 7833} {"train_loss": -27.675527572631836, "global_step": 650204, "epoch": 7833} {"train_loss": -28.271207809448242, "global_step": 650205, "epoch": 7833} {"train_loss": -28.773603439331055, "global_step": 650206, "epoch": 7833} {"train_loss": -28.159826278686523, "global_step": 650207, "epoch": 7833} {"train_loss": -27.79912757873535, "global_step": 650208, "epoch": 7833} {"train_loss": -27.634586334228516, "global_step": 650209, "epoch": 7833} {"train_loss": -27.539270401000977, "global_step": 650210, "epoch": 7833} {"train_loss": -28.277118682861328, "global_step": 650211, "epoch": 7833} {"train_loss": -28.123743057250977, "global_step": 650212, "epoch": 7833} {"train_loss": -27.718900680541992, "global_step": 650213, "epoch": 7833} {"train_loss": -28.053253173828125, "global_step": 650214, "epoch": 7833} {"train_loss": -28.11341667175293, "global_step": 650215, "epoch": 7833} {"train_loss": -28.508878707885742, "global_step": 650216, "epoch": 7833} {"train_loss": -28.0826416015625, "global_step": 650217, "epoch": 7833} {"train_loss": -28.214902877807617, "global_step": 650218, "epoch": 7833} {"train_loss": -28.36356544494629, "global_step": 650219, "epoch": 7833} {"train_loss": -28.13336753845215, "global_step": 650220, "epoch": 7833} {"train_loss": -27.89343921247735, "global_step": 650221, "epoch": 7833, "val_loss": 6783808.0} {"train_loss": -28.151906967163086, "global_step": 650222, "epoch": 7834} {"train_loss": -28.188827514648438, "global_step": 650223, "epoch": 7834} {"train_loss": -28.027463912963867, "global_step": 650224, "epoch": 7834} {"train_loss": -28.265851974487305, "global_step": 650225, "epoch": 7834} {"train_loss": -28.292951583862305, "global_step": 650226, "epoch": 7834} {"train_loss": -28.0388126373291, "global_step": 650227, "epoch": 7834} {"train_loss": -27.620107650756836, "global_step": 650228, "epoch": 7834} {"train_loss": -27.905221939086914, "global_step": 650229, "epoch": 7834} {"train_loss": -28.367483139038086, "global_step": 650230, "epoch": 7834} {"train_loss": -28.2707462310791, "global_step": 650231, "epoch": 7834} {"train_loss": -27.696081161499023, "global_step": 650232, "epoch": 7834} {"train_loss": -28.05952262878418, "global_step": 650233, "epoch": 7834} {"train_loss": -28.100696563720703, "global_step": 650234, "epoch": 7834} {"train_loss": -27.966550827026367, "global_step": 650235, "epoch": 7834} {"train_loss": -27.96284294128418, "global_step": 650236, "epoch": 7834} {"train_loss": -28.194955825805664, "global_step": 650237, "epoch": 7834} {"train_loss": -27.972503662109375, "global_step": 650238, "epoch": 7834} {"train_loss": -28.18902015686035, "global_step": 650239, "epoch": 7834} {"train_loss": -28.054492950439453, "global_step": 650240, "epoch": 7834} {"train_loss": -27.8555850982666, "global_step": 650241, "epoch": 7834} {"train_loss": -27.91103172302246, "global_step": 650242, "epoch": 7834} {"train_loss": -27.99220848083496, "global_step": 650243, "epoch": 7834} {"train_loss": -28.156723022460938, "global_step": 650244, "epoch": 7834} {"train_loss": -27.955951690673828, "global_step": 650245, "epoch": 7834} {"train_loss": -28.440427780151367, "global_step": 650246, "epoch": 7834} {"train_loss": -28.282453536987305, "global_step": 650247, "epoch": 7834} {"train_loss": -28.648157119750977, "global_step": 650248, "epoch": 7834} {"train_loss": -28.232452392578125, "global_step": 650249, "epoch": 7834} {"train_loss": -28.033248901367188, "global_step": 650250, "epoch": 7834} {"train_loss": -28.393665313720703, "global_step": 650251, "epoch": 7834} {"train_loss": -28.123205184936523, "global_step": 650252, "epoch": 7834} {"train_loss": -28.65863037109375, "global_step": 650253, "epoch": 7834} {"train_loss": -28.364362716674805, "global_step": 650254, "epoch": 7834} {"train_loss": -28.501401901245117, "global_step": 650255, "epoch": 7834} {"train_loss": -28.47607421875, "global_step": 650256, "epoch": 7834} {"train_loss": -28.18653678894043, "global_step": 650257, "epoch": 7834} {"train_loss": -28.468463897705078, "global_step": 650258, "epoch": 7834} {"train_loss": -28.283506393432617, "global_step": 650259, "epoch": 7834} {"train_loss": -28.498844146728516, "global_step": 650260, "epoch": 7834} {"train_loss": -28.280973434448242, "global_step": 650261, "epoch": 7834} {"train_loss": -28.348363876342773, "global_step": 650262, "epoch": 7834} {"train_loss": -28.335317611694336, "global_step": 650263, "epoch": 7834} {"train_loss": -28.499189376831055, "global_step": 650264, "epoch": 7834} {"train_loss": -28.534753799438477, "global_step": 650265, "epoch": 7834} {"train_loss": -28.4564151763916, "global_step": 650266, "epoch": 7834} {"train_loss": -28.109601974487305, "global_step": 650267, "epoch": 7834} {"train_loss": -27.793231964111328, "global_step": 650268, "epoch": 7834} {"train_loss": -27.915372848510742, "global_step": 650269, "epoch": 7834} {"train_loss": -28.2379150390625, "global_step": 650270, "epoch": 7834} {"train_loss": -28.315982818603516, "global_step": 650271, "epoch": 7834} {"train_loss": -28.760557174682617, "global_step": 650272, "epoch": 7834} {"train_loss": -28.152511596679688, "global_step": 650273, "epoch": 7834} {"train_loss": -28.36103630065918, "global_step": 650274, "epoch": 7834} {"train_loss": -28.556949615478516, "global_step": 650275, "epoch": 7834} {"train_loss": -28.579437255859375, "global_step": 650276, "epoch": 7834} {"train_loss": -28.528772354125977, "global_step": 650277, "epoch": 7834} {"train_loss": -28.1085205078125, "global_step": 650278, "epoch": 7834} {"train_loss": -28.1043758392334, "global_step": 650279, "epoch": 7834} {"train_loss": -28.159414291381836, "global_step": 650280, "epoch": 7834} {"train_loss": -28.467008590698242, "global_step": 650281, "epoch": 7834} {"train_loss": -27.94390296936035, "global_step": 650282, "epoch": 7834} {"train_loss": -28.303546905517578, "global_step": 650283, "epoch": 7834} {"train_loss": -28.1815128326416, "global_step": 650284, "epoch": 7834} {"train_loss": -27.964635848999023, "global_step": 650285, "epoch": 7834} {"train_loss": -28.50491714477539, "global_step": 650286, "epoch": 7834} {"train_loss": -28.266881942749023, "global_step": 650287, "epoch": 7834} {"train_loss": -28.461400985717773, "global_step": 650288, "epoch": 7834} {"train_loss": -28.392187118530273, "global_step": 650289, "epoch": 7834} {"train_loss": -28.371417999267578, "global_step": 650290, "epoch": 7834} {"train_loss": -28.521778106689453, "global_step": 650291, "epoch": 7834} {"train_loss": -28.56694984436035, "global_step": 650292, "epoch": 7834} {"train_loss": -28.281286239624023, "global_step": 650293, "epoch": 7834} {"train_loss": -28.533544540405273, "global_step": 650294, "epoch": 7834} {"train_loss": -28.02975845336914, "global_step": 650295, "epoch": 7834} {"train_loss": -28.228240966796875, "global_step": 650296, "epoch": 7834} {"train_loss": -28.161787033081055, "global_step": 650297, "epoch": 7834} {"train_loss": -28.449481964111328, "global_step": 650298, "epoch": 7834} {"train_loss": -28.162017822265625, "global_step": 650299, "epoch": 7834} {"train_loss": -28.054595947265625, "global_step": 650300, "epoch": 7834} {"train_loss": -27.99159049987793, "global_step": 650301, "epoch": 7834} {"train_loss": -27.714685440063477, "global_step": 650302, "epoch": 7834} {"train_loss": -28.03632164001465, "global_step": 650303, "epoch": 7834} {"train_loss": -28.226718948548097, "global_step": 650304, "epoch": 7834, "val_loss": 6848175.0} {"train_loss": -27.933746337890625, "global_step": 650305, "epoch": 7835} {"train_loss": -27.201074600219727, "global_step": 650306, "epoch": 7835} {"train_loss": -28.199615478515625, "global_step": 650307, "epoch": 7835} {"train_loss": -27.3077392578125, "global_step": 650308, "epoch": 7835} {"train_loss": -27.800521850585938, "global_step": 650309, "epoch": 7835} {"train_loss": -28.076629638671875, "global_step": 650310, "epoch": 7835} {"train_loss": -27.564960479736328, "global_step": 650311, "epoch": 7835} {"train_loss": -28.106048583984375, "global_step": 650312, "epoch": 7835} {"train_loss": -27.850177764892578, "global_step": 650313, "epoch": 7835} {"train_loss": -28.238300323486328, "global_step": 650314, "epoch": 7835} {"train_loss": -27.543048858642578, "global_step": 650315, "epoch": 7835} {"train_loss": -27.78607177734375, "global_step": 650316, "epoch": 7835} {"train_loss": -27.64947509765625, "global_step": 650317, "epoch": 7835} {"train_loss": -27.642780303955078, "global_step": 650318, "epoch": 7835} {"train_loss": -27.530914306640625, "global_step": 650319, "epoch": 7835} {"train_loss": -28.155017852783203, "global_step": 650320, "epoch": 7835} {"train_loss": -28.13398551940918, "global_step": 650321, "epoch": 7835} {"train_loss": -28.142200469970703, "global_step": 650322, "epoch": 7835} {"train_loss": -28.207138061523438, "global_step": 650323, "epoch": 7835} {"train_loss": -27.922382354736328, "global_step": 650324, "epoch": 7835} {"train_loss": -28.12222671508789, "global_step": 650325, "epoch": 7835} {"train_loss": -27.729419708251953, "global_step": 650326, "epoch": 7835} {"train_loss": -27.942550659179688, "global_step": 650327, "epoch": 7835} {"train_loss": -27.813465118408203, "global_step": 650328, "epoch": 7835} {"train_loss": -28.196044921875, "global_step": 650329, "epoch": 7835} {"train_loss": -28.149633407592773, "global_step": 650330, "epoch": 7835} {"train_loss": -28.093168258666992, "global_step": 650331, "epoch": 7835} {"train_loss": -27.86334228515625, "global_step": 650332, "epoch": 7835} {"train_loss": -28.08331871032715, "global_step": 650333, "epoch": 7835} {"train_loss": -28.5704345703125, "global_step": 650334, "epoch": 7835} {"train_loss": -28.2313175201416, "global_step": 650335, "epoch": 7835} {"train_loss": -28.136255264282227, "global_step": 650336, "epoch": 7835} {"train_loss": -28.114084243774414, "global_step": 650337, "epoch": 7835} {"train_loss": -28.33123207092285, "global_step": 650338, "epoch": 7835} {"train_loss": -28.60740089416504, "global_step": 650339, "epoch": 7835} {"train_loss": -28.421173095703125, "global_step": 650340, "epoch": 7835} {"train_loss": -28.5467529296875, "global_step": 650341, "epoch": 7835} {"train_loss": -28.450834274291992, "global_step": 650342, "epoch": 7835} {"train_loss": -28.29181480407715, "global_step": 650343, "epoch": 7835} {"train_loss": -28.580392837524414, "global_step": 650344, "epoch": 7835} {"train_loss": -28.45405387878418, "global_step": 650345, "epoch": 7835} {"train_loss": -28.331586837768555, "global_step": 650346, "epoch": 7835} {"train_loss": -28.291275024414062, "global_step": 650347, "epoch": 7835} {"train_loss": -28.290319442749023, "global_step": 650348, "epoch": 7835} {"train_loss": -28.24515724182129, "global_step": 650349, "epoch": 7835} {"train_loss": -28.6014461517334, "global_step": 650350, "epoch": 7835} {"train_loss": -28.63102149963379, "global_step": 650351, "epoch": 7835} {"train_loss": -28.839136123657227, "global_step": 650352, "epoch": 7835} {"train_loss": -28.271560668945312, "global_step": 650353, "epoch": 7835} {"train_loss": -28.698293685913086, "global_step": 650354, "epoch": 7835} {"train_loss": -27.882898330688477, "global_step": 650355, "epoch": 7835} {"train_loss": -27.779361724853516, "global_step": 650356, "epoch": 7835} {"train_loss": -28.209379196166992, "global_step": 650357, "epoch": 7835} {"train_loss": -28.421613693237305, "global_step": 650358, "epoch": 7835} {"train_loss": -27.735858917236328, "global_step": 650359, "epoch": 7835} {"train_loss": -27.958703994750977, "global_step": 650360, "epoch": 7835} {"train_loss": -27.647815704345703, "global_step": 650361, "epoch": 7835} {"train_loss": -27.718231201171875, "global_step": 650362, "epoch": 7835} {"train_loss": -28.07261085510254, "global_step": 650363, "epoch": 7835} {"train_loss": -28.0718936920166, "global_step": 650364, "epoch": 7835} {"train_loss": -28.128576278686523, "global_step": 650365, "epoch": 7835} {"train_loss": -28.453031539916992, "global_step": 650366, "epoch": 7835} {"train_loss": -28.10161781311035, "global_step": 650367, "epoch": 7835} {"train_loss": -28.238550186157227, "global_step": 650368, "epoch": 7835} {"train_loss": -27.982624053955078, "global_step": 650369, "epoch": 7835} {"train_loss": -28.038366317749023, "global_step": 650370, "epoch": 7835} {"train_loss": -28.1628360748291, "global_step": 650371, "epoch": 7835} {"train_loss": -28.155466079711914, "global_step": 650372, "epoch": 7835} {"train_loss": -28.522064208984375, "global_step": 650373, "epoch": 7835} {"train_loss": -28.360681533813477, "global_step": 650374, "epoch": 7835} {"train_loss": -28.358240127563477, "global_step": 650375, "epoch": 7835} {"train_loss": -28.534788131713867, "global_step": 650376, "epoch": 7835} {"train_loss": -28.28484535217285, "global_step": 650377, "epoch": 7835} {"train_loss": -28.398603439331055, "global_step": 650378, "epoch": 7835} {"train_loss": -28.51190757751465, "global_step": 650379, "epoch": 7835} {"train_loss": -28.40431022644043, "global_step": 650380, "epoch": 7835} {"train_loss": -28.274938583374023, "global_step": 650381, "epoch": 7835} {"train_loss": -28.20845603942871, "global_step": 650382, "epoch": 7835} {"train_loss": -28.39179039001465, "global_step": 650383, "epoch": 7835} {"train_loss": -28.482837677001953, "global_step": 650384, "epoch": 7835} {"train_loss": -28.510345458984375, "global_step": 650385, "epoch": 7835} {"train_loss": -28.17486000061035, "global_step": 650386, "epoch": 7835} {"train_loss": -28.17198817701225, "global_step": 650387, "epoch": 7835, "val_loss": 6798000.0} {"train_loss": -27.884618759155273, "global_step": 650388, "epoch": 7836} {"train_loss": -27.418622970581055, "global_step": 650389, "epoch": 7836} {"train_loss": -26.5352783203125, "global_step": 650390, "epoch": 7836} {"train_loss": -27.660633087158203, "global_step": 650391, "epoch": 7836} {"train_loss": -27.059314727783203, "global_step": 650392, "epoch": 7836} {"train_loss": -27.395618438720703, "global_step": 650393, "epoch": 7836} {"train_loss": -27.48813247680664, "global_step": 650394, "epoch": 7836} {"train_loss": -27.782596588134766, "global_step": 650395, "epoch": 7836} {"train_loss": -27.587085723876953, "global_step": 650396, "epoch": 7836} {"train_loss": -27.375381469726562, "global_step": 650397, "epoch": 7836} {"train_loss": -27.9786434173584, "global_step": 650398, "epoch": 7836} {"train_loss": -27.510583877563477, "global_step": 650399, "epoch": 7836} {"train_loss": -27.45023536682129, "global_step": 650400, "epoch": 7836} {"train_loss": -27.747364044189453, "global_step": 650401, "epoch": 7836} {"train_loss": -28.002094268798828, "global_step": 650402, "epoch": 7836} {"train_loss": -27.969167709350586, "global_step": 650403, "epoch": 7836} {"train_loss": -27.871580123901367, "global_step": 650404, "epoch": 7836} {"train_loss": -27.987035751342773, "global_step": 650405, "epoch": 7836} {"train_loss": -27.738861083984375, "global_step": 650406, "epoch": 7836} {"train_loss": -27.759384155273438, "global_step": 650407, "epoch": 7836} {"train_loss": -27.785419464111328, "global_step": 650408, "epoch": 7836} {"train_loss": -28.232410430908203, "global_step": 650409, "epoch": 7836} {"train_loss": -27.6260929107666, "global_step": 650410, "epoch": 7836} {"train_loss": -28.1657657623291, "global_step": 650411, "epoch": 7836} {"train_loss": -28.058645248413086, "global_step": 650412, "epoch": 7836} {"train_loss": -28.058652877807617, "global_step": 650413, "epoch": 7836} {"train_loss": -28.097150802612305, "global_step": 650414, "epoch": 7836} {"train_loss": -27.86786460876465, "global_step": 650415, "epoch": 7836} {"train_loss": -27.806177139282227, "global_step": 650416, "epoch": 7836} {"train_loss": -28.07452964782715, "global_step": 650417, "epoch": 7836} {"train_loss": -28.39051628112793, "global_step": 650418, "epoch": 7836} {"train_loss": -28.128387451171875, "global_step": 650419, "epoch": 7836} {"train_loss": -28.32136344909668, "global_step": 650420, "epoch": 7836} {"train_loss": -28.231998443603516, "global_step": 650421, "epoch": 7836} {"train_loss": -27.64373207092285, "global_step": 650422, "epoch": 7836} {"train_loss": -28.227930068969727, "global_step": 650423, "epoch": 7836} {"train_loss": -28.346899032592773, "global_step": 650424, "epoch": 7836} {"train_loss": -28.638776779174805, "global_step": 650425, "epoch": 7836} {"train_loss": -28.28846549987793, "global_step": 650426, "epoch": 7836} {"train_loss": -28.69160270690918, "global_step": 650427, "epoch": 7836} {"train_loss": -28.160125732421875, "global_step": 650428, "epoch": 7836} {"train_loss": -28.384521484375, "global_step": 650429, "epoch": 7836} {"train_loss": -28.425405502319336, "global_step": 650430, "epoch": 7836} {"train_loss": -28.530445098876953, "global_step": 650431, "epoch": 7836} {"train_loss": -28.420263290405273, "global_step": 650432, "epoch": 7836} {"train_loss": -28.45808982849121, "global_step": 650433, "epoch": 7836} {"train_loss": -28.4539794921875, "global_step": 650434, "epoch": 7836} {"train_loss": -28.236560821533203, "global_step": 650435, "epoch": 7836} {"train_loss": -28.225820541381836, "global_step": 650436, "epoch": 7836} {"train_loss": -28.332935333251953, "global_step": 650437, "epoch": 7836} {"train_loss": -28.4044189453125, "global_step": 650438, "epoch": 7836} {"train_loss": -28.15241050720215, "global_step": 650439, "epoch": 7836} {"train_loss": -28.419713973999023, "global_step": 650440, "epoch": 7836} {"train_loss": -28.285856246948242, "global_step": 650441, "epoch": 7836} {"train_loss": -28.349979400634766, "global_step": 650442, "epoch": 7836} {"train_loss": -28.42213249206543, "global_step": 650443, "epoch": 7836} {"train_loss": -28.35576820373535, "global_step": 650444, "epoch": 7836} {"train_loss": -28.492816925048828, "global_step": 650445, "epoch": 7836} {"train_loss": -28.593053817749023, "global_step": 650446, "epoch": 7836} {"train_loss": -28.8819637298584, "global_step": 650447, "epoch": 7836} {"train_loss": -27.93609619140625, "global_step": 650448, "epoch": 7836} {"train_loss": -28.3343563079834, "global_step": 650449, "epoch": 7836} {"train_loss": -28.26114273071289, "global_step": 650450, "epoch": 7836} {"train_loss": -28.37482261657715, "global_step": 650451, "epoch": 7836} {"train_loss": -28.396808624267578, "global_step": 650452, "epoch": 7836} {"train_loss": -28.156829833984375, "global_step": 650453, "epoch": 7836} {"train_loss": -28.352277755737305, "global_step": 650454, "epoch": 7836} {"train_loss": -28.00288963317871, "global_step": 650455, "epoch": 7836} {"train_loss": -27.930469512939453, "global_step": 650456, "epoch": 7836} {"train_loss": -28.012592315673828, "global_step": 650457, "epoch": 7836} {"train_loss": -28.0789737701416, "global_step": 650458, "epoch": 7836} {"train_loss": -28.856796264648438, "global_step": 650459, "epoch": 7836} {"train_loss": -28.66347312927246, "global_step": 650460, "epoch": 7836} {"train_loss": -28.58003044128418, "global_step": 650461, "epoch": 7836} {"train_loss": -27.944995880126953, "global_step": 650462, "epoch": 7836} {"train_loss": -28.160934448242188, "global_step": 650463, "epoch": 7836} {"train_loss": -28.370141983032227, "global_step": 650464, "epoch": 7836} {"train_loss": -28.8946590423584, "global_step": 650465, "epoch": 7836} {"train_loss": -27.926939010620117, "global_step": 650466, "epoch": 7836} {"train_loss": -28.592100143432617, "global_step": 650467, "epoch": 7836} {"train_loss": -28.24615478515625, "global_step": 650468, "epoch": 7836} {"train_loss": -28.160568237304688, "global_step": 650469, "epoch": 7836} {"train_loss": -28.105472840458514, "global_step": 650470, "epoch": 7836, "val_loss": 6756159.0} {"train_loss": -27.481470108032227, "global_step": 650471, "epoch": 7837} {"train_loss": -27.950641632080078, "global_step": 650472, "epoch": 7837} {"train_loss": -27.952695846557617, "global_step": 650473, "epoch": 7837} {"train_loss": -27.59025001525879, "global_step": 650474, "epoch": 7837} {"train_loss": -27.77433204650879, "global_step": 650475, "epoch": 7837} {"train_loss": -27.7808780670166, "global_step": 650476, "epoch": 7837} {"train_loss": -27.66350746154785, "global_step": 650477, "epoch": 7837} {"train_loss": -27.854251861572266, "global_step": 650478, "epoch": 7837} {"train_loss": -27.484262466430664, "global_step": 650479, "epoch": 7837} {"train_loss": -27.701995849609375, "global_step": 650480, "epoch": 7837} {"train_loss": -28.0994930267334, "global_step": 650481, "epoch": 7837} {"train_loss": -27.828718185424805, "global_step": 650482, "epoch": 7837} {"train_loss": -27.860443115234375, "global_step": 650483, "epoch": 7837} {"train_loss": -27.83917236328125, "global_step": 650484, "epoch": 7837} {"train_loss": -28.1488037109375, "global_step": 650485, "epoch": 7837} {"train_loss": -27.941638946533203, "global_step": 650486, "epoch": 7837} {"train_loss": -27.937719345092773, "global_step": 650487, "epoch": 7837} {"train_loss": -27.73187255859375, "global_step": 650488, "epoch": 7837} {"train_loss": -27.795766830444336, "global_step": 650489, "epoch": 7837} {"train_loss": -27.912134170532227, "global_step": 650490, "epoch": 7837} {"train_loss": -28.27654457092285, "global_step": 650491, "epoch": 7837} {"train_loss": -27.95391273498535, "global_step": 650492, "epoch": 7837} {"train_loss": -27.94888687133789, "global_step": 650493, "epoch": 7837} {"train_loss": -28.1238956451416, "global_step": 650494, "epoch": 7837} {"train_loss": -28.333703994750977, "global_step": 650495, "epoch": 7837} {"train_loss": -28.405141830444336, "global_step": 650496, "epoch": 7837} {"train_loss": -28.293750762939453, "global_step": 650497, "epoch": 7837} {"train_loss": -28.496601104736328, "global_step": 650498, "epoch": 7837} {"train_loss": -28.383544921875, "global_step": 650499, "epoch": 7837} {"train_loss": -28.49365234375, "global_step": 650500, "epoch": 7837} {"train_loss": -28.197980880737305, "global_step": 650501, "epoch": 7837} {"train_loss": -28.293262481689453, "global_step": 650502, "epoch": 7837} {"train_loss": -28.417133331298828, "global_step": 650503, "epoch": 7837} {"train_loss": -28.07036781311035, "global_step": 650504, "epoch": 7837} {"train_loss": -28.214719772338867, "global_step": 650505, "epoch": 7837} {"train_loss": -28.453638076782227, "global_step": 650506, "epoch": 7837} {"train_loss": -28.38214683532715, "global_step": 650507, "epoch": 7837} {"train_loss": -28.3538761138916, "global_step": 650508, "epoch": 7837} {"train_loss": -28.170520782470703, "global_step": 650509, "epoch": 7837} {"train_loss": -27.98845863342285, "global_step": 650510, "epoch": 7837} {"train_loss": -27.63528823852539, "global_step": 650511, "epoch": 7837} {"train_loss": -27.867603302001953, "global_step": 650512, "epoch": 7837} {"train_loss": -28.514692306518555, "global_step": 650513, "epoch": 7837} {"train_loss": -28.16554832458496, "global_step": 650514, "epoch": 7837} {"train_loss": -28.400390625, "global_step": 650515, "epoch": 7837} {"train_loss": -28.564855575561523, "global_step": 650516, "epoch": 7837} {"train_loss": -28.507299423217773, "global_step": 650517, "epoch": 7837} {"train_loss": -28.339414596557617, "global_step": 650518, "epoch": 7837} {"train_loss": -28.528614044189453, "global_step": 650519, "epoch": 7837} {"train_loss": -28.29642105102539, "global_step": 650520, "epoch": 7837} {"train_loss": -28.192163467407227, "global_step": 650521, "epoch": 7837} {"train_loss": -28.221784591674805, "global_step": 650522, "epoch": 7837} {"train_loss": -28.324417114257812, "global_step": 650523, "epoch": 7837} {"train_loss": -28.08201026916504, "global_step": 650524, "epoch": 7837} {"train_loss": -28.366418838500977, "global_step": 650525, "epoch": 7837} {"train_loss": -28.51605796813965, "global_step": 650526, "epoch": 7837} {"train_loss": -28.188892364501953, "global_step": 650527, "epoch": 7837} {"train_loss": -28.2702579498291, "global_step": 650528, "epoch": 7837} {"train_loss": -28.592710494995117, "global_step": 650529, "epoch": 7837} {"train_loss": -28.18580436706543, "global_step": 650530, "epoch": 7837} {"train_loss": -28.176794052124023, "global_step": 650531, "epoch": 7837} {"train_loss": -28.442968368530273, "global_step": 650532, "epoch": 7837} {"train_loss": -28.375701904296875, "global_step": 650533, "epoch": 7837} {"train_loss": -27.938119888305664, "global_step": 650534, "epoch": 7837} {"train_loss": -28.291461944580078, "global_step": 650535, "epoch": 7837} {"train_loss": -28.368188858032227, "global_step": 650536, "epoch": 7837} {"train_loss": -28.047962188720703, "global_step": 650537, "epoch": 7837} {"train_loss": -28.679346084594727, "global_step": 650538, "epoch": 7837} {"train_loss": -27.998432159423828, "global_step": 650539, "epoch": 7837} {"train_loss": -28.3055362701416, "global_step": 650540, "epoch": 7837} {"train_loss": -28.513586044311523, "global_step": 650541, "epoch": 7837} {"train_loss": -28.271697998046875, "global_step": 650542, "epoch": 7837} {"train_loss": -28.44696044921875, "global_step": 650543, "epoch": 7837} {"train_loss": -28.602033615112305, "global_step": 650544, "epoch": 7837} {"train_loss": -28.486785888671875, "global_step": 650545, "epoch": 7837} {"train_loss": -28.719226837158203, "global_step": 650546, "epoch": 7837} {"train_loss": -28.223352432250977, "global_step": 650547, "epoch": 7837} {"train_loss": -28.408390045166016, "global_step": 650548, "epoch": 7837} {"train_loss": -28.248319625854492, "global_step": 650549, "epoch": 7837} {"train_loss": -27.705524444580078, "global_step": 650550, "epoch": 7837} {"train_loss": -27.082372665405273, "global_step": 650551, "epoch": 7837} {"train_loss": -25.512563705444336, "global_step": 650552, "epoch": 7837} {"train_loss": -28.03671457681311, "global_step": 650553, "epoch": 7837, "val_loss": 6717144.5} {"train_loss": -9.596967697143555, "global_step": 650554, "epoch": 7838} {"train_loss": -21.921127319335938, "global_step": 650555, "epoch": 7838} {"train_loss": -14.766222953796387, "global_step": 650556, "epoch": 7838} {"train_loss": -19.392759323120117, "global_step": 650557, "epoch": 7838} {"train_loss": -22.7864990234375, "global_step": 650558, "epoch": 7838} {"train_loss": -22.0416259765625, "global_step": 650559, "epoch": 7838} {"train_loss": -21.202333450317383, "global_step": 650560, "epoch": 7838} {"train_loss": -22.966371536254883, "global_step": 650561, "epoch": 7838} {"train_loss": -24.525493621826172, "global_step": 650562, "epoch": 7838} {"train_loss": -24.254383087158203, "global_step": 650563, "epoch": 7838} {"train_loss": -23.838403701782227, "global_step": 650564, "epoch": 7838} {"train_loss": -23.8670711517334, "global_step": 650565, "epoch": 7838} {"train_loss": -24.047292709350586, "global_step": 650566, "epoch": 7838} {"train_loss": -24.367462158203125, "global_step": 650567, "epoch": 7838} {"train_loss": -24.261734008789062, "global_step": 650568, "epoch": 7838} {"train_loss": -24.73126792907715, "global_step": 650569, "epoch": 7838} {"train_loss": -25.21785545349121, "global_step": 650570, "epoch": 7838} {"train_loss": -25.074281692504883, "global_step": 650571, "epoch": 7838} {"train_loss": -25.178770065307617, "global_step": 650572, "epoch": 7838} {"train_loss": -25.09601402282715, "global_step": 650573, "epoch": 7838} {"train_loss": -25.557159423828125, "global_step": 650574, "epoch": 7838} {"train_loss": -25.38357162475586, "global_step": 650575, "epoch": 7838} {"train_loss": -25.307186126708984, "global_step": 650576, "epoch": 7838} {"train_loss": -25.350311279296875, "global_step": 650577, "epoch": 7838} {"train_loss": -25.285058975219727, "global_step": 650578, "epoch": 7838} {"train_loss": -25.407684326171875, "global_step": 650579, "epoch": 7838} {"train_loss": -25.836210250854492, "global_step": 650580, "epoch": 7838} {"train_loss": -25.611074447631836, "global_step": 650581, "epoch": 7838} {"train_loss": -26.1284122467041, "global_step": 650582, "epoch": 7838} {"train_loss": -26.1035099029541, "global_step": 650583, "epoch": 7838} {"train_loss": -26.30914306640625, "global_step": 650584, "epoch": 7838} {"train_loss": -26.097604751586914, "global_step": 650585, "epoch": 7838} {"train_loss": -26.335779190063477, "global_step": 650586, "epoch": 7838} {"train_loss": -26.444660186767578, "global_step": 650587, "epoch": 7838} {"train_loss": -26.59418296813965, "global_step": 650588, "epoch": 7838} {"train_loss": -26.880929946899414, "global_step": 650589, "epoch": 7838} {"train_loss": -27.001977920532227, "global_step": 650590, "epoch": 7838} {"train_loss": -26.361270904541016, "global_step": 650591, "epoch": 7838} {"train_loss": -26.548269271850586, "global_step": 650592, "epoch": 7838} {"train_loss": -26.7993221282959, "global_step": 650593, "epoch": 7838} {"train_loss": -26.561071395874023, "global_step": 650594, "epoch": 7838} {"train_loss": -27.135961532592773, "global_step": 650595, "epoch": 7838} {"train_loss": -27.158475875854492, "global_step": 650596, "epoch": 7838} {"train_loss": -26.756864547729492, "global_step": 650597, "epoch": 7838} {"train_loss": -26.930036544799805, "global_step": 650598, "epoch": 7838} {"train_loss": -26.609516143798828, "global_step": 650599, "epoch": 7838} {"train_loss": -27.0233097076416, "global_step": 650600, "epoch": 7838} {"train_loss": -27.388471603393555, "global_step": 650601, "epoch": 7838} {"train_loss": -26.988300323486328, "global_step": 650602, "epoch": 7838} {"train_loss": -27.1053466796875, "global_step": 650603, "epoch": 7838} {"train_loss": -27.5914249420166, "global_step": 650604, "epoch": 7838} {"train_loss": -27.1896915435791, "global_step": 650605, "epoch": 7838} {"train_loss": -27.557058334350586, "global_step": 650606, "epoch": 7838} {"train_loss": -27.396137237548828, "global_step": 650607, "epoch": 7838} {"train_loss": -27.27997398376465, "global_step": 650608, "epoch": 7838} {"train_loss": -27.677261352539062, "global_step": 650609, "epoch": 7838} {"train_loss": -27.3575439453125, "global_step": 650610, "epoch": 7838} {"train_loss": -27.246191024780273, "global_step": 650611, "epoch": 7838} {"train_loss": -27.94476318359375, "global_step": 650612, "epoch": 7838} {"train_loss": -27.642013549804688, "global_step": 650613, "epoch": 7838} {"train_loss": -26.898950576782227, "global_step": 650614, "epoch": 7838} {"train_loss": -27.513717651367188, "global_step": 650615, "epoch": 7838} {"train_loss": -27.415311813354492, "global_step": 650616, "epoch": 7838} {"train_loss": -27.243680953979492, "global_step": 650617, "epoch": 7838} {"train_loss": -27.657983779907227, "global_step": 650618, "epoch": 7838} {"train_loss": -27.65840721130371, "global_step": 650619, "epoch": 7838} {"train_loss": -27.800540924072266, "global_step": 650620, "epoch": 7838} {"train_loss": -28.313138961791992, "global_step": 650621, "epoch": 7838} {"train_loss": -27.7215576171875, "global_step": 650622, "epoch": 7838} {"train_loss": -27.61809730529785, "global_step": 650623, "epoch": 7838} {"train_loss": -27.49867057800293, "global_step": 650624, "epoch": 7838} {"train_loss": -27.7123966217041, "global_step": 650625, "epoch": 7838} {"train_loss": -27.92323112487793, "global_step": 650626, "epoch": 7838} {"train_loss": -27.781696319580078, "global_step": 650627, "epoch": 7838} {"train_loss": -27.552188873291016, "global_step": 650628, "epoch": 7838} {"train_loss": -27.844959259033203, "global_step": 650629, "epoch": 7838} {"train_loss": -27.52800941467285, "global_step": 650630, "epoch": 7838} {"train_loss": -27.561635971069336, "global_step": 650631, "epoch": 7838} {"train_loss": -27.837329864501953, "global_step": 650632, "epoch": 7838} {"train_loss": -27.40167236328125, "global_step": 650633, "epoch": 7838} {"train_loss": -27.54583168029785, "global_step": 650634, "epoch": 7838} {"train_loss": -27.845279693603516, "global_step": 650635, "epoch": 7838} {"train_loss": -25.915342089641523, "global_step": 650636, "epoch": 7838, "val_loss": 6699251.5} {"train_loss": -26.666807174682617, "global_step": 650637, "epoch": 7839} {"train_loss": -26.868494033813477, "global_step": 650638, "epoch": 7839} {"train_loss": -27.606657028198242, "global_step": 650639, "epoch": 7839} {"train_loss": -26.490493774414062, "global_step": 650640, "epoch": 7839} {"train_loss": -26.731430053710938, "global_step": 650641, "epoch": 7839} {"train_loss": -26.4300594329834, "global_step": 650642, "epoch": 7839} {"train_loss": -27.482147216796875, "global_step": 650643, "epoch": 7839} {"train_loss": -27.223377227783203, "global_step": 650644, "epoch": 7839} {"train_loss": -27.226932525634766, "global_step": 650645, "epoch": 7839} {"train_loss": -27.572952270507812, "global_step": 650646, "epoch": 7839} {"train_loss": -27.12188720703125, "global_step": 650647, "epoch": 7839} {"train_loss": -27.146610260009766, "global_step": 650648, "epoch": 7839} {"train_loss": -27.11684226989746, "global_step": 650649, "epoch": 7839} {"train_loss": -27.24696159362793, "global_step": 650650, "epoch": 7839} {"train_loss": -27.274219512939453, "global_step": 650651, "epoch": 7839} {"train_loss": -27.294315338134766, "global_step": 650652, "epoch": 7839} {"train_loss": -27.04721450805664, "global_step": 650653, "epoch": 7839} {"train_loss": -27.645416259765625, "global_step": 650654, "epoch": 7839} {"train_loss": -27.208820343017578, "global_step": 650655, "epoch": 7839} {"train_loss": -27.37113380432129, "global_step": 650656, "epoch": 7839} {"train_loss": -27.409320831298828, "global_step": 650657, "epoch": 7839} {"train_loss": -27.26199722290039, "global_step": 650658, "epoch": 7839} {"train_loss": -27.481714248657227, "global_step": 650659, "epoch": 7839} {"train_loss": -27.52960205078125, "global_step": 650660, "epoch": 7839} {"train_loss": -27.62800407409668, "global_step": 650661, "epoch": 7839} {"train_loss": -27.62579917907715, "global_step": 650662, "epoch": 7839} {"train_loss": -27.1832332611084, "global_step": 650663, "epoch": 7839} {"train_loss": -27.95563316345215, "global_step": 650664, "epoch": 7839} {"train_loss": -27.51319694519043, "global_step": 650665, "epoch": 7839} {"train_loss": -27.521692276000977, "global_step": 650666, "epoch": 7839} {"train_loss": -27.76704216003418, "global_step": 650667, "epoch": 7839} {"train_loss": -27.73215675354004, "global_step": 650668, "epoch": 7839} {"train_loss": -27.8989315032959, "global_step": 650669, "epoch": 7839} {"train_loss": -27.493398666381836, "global_step": 650670, "epoch": 7839} {"train_loss": -27.43379020690918, "global_step": 650671, "epoch": 7839} {"train_loss": -28.047393798828125, "global_step": 650672, "epoch": 7839} {"train_loss": -28.064289093017578, "global_step": 650673, "epoch": 7839} {"train_loss": -28.029157638549805, "global_step": 650674, "epoch": 7839} {"train_loss": -27.451074600219727, "global_step": 650675, "epoch": 7839} {"train_loss": -27.714691162109375, "global_step": 650676, "epoch": 7839} {"train_loss": -27.638919830322266, "global_step": 650677, "epoch": 7839} {"train_loss": -28.248464584350586, "global_step": 650678, "epoch": 7839} {"train_loss": -28.097702026367188, "global_step": 650679, "epoch": 7839} {"train_loss": -27.66280174255371, "global_step": 650680, "epoch": 7839} {"train_loss": -28.055524826049805, "global_step": 650681, "epoch": 7839} {"train_loss": -28.04029655456543, "global_step": 650682, "epoch": 7839} {"train_loss": -27.656713485717773, "global_step": 650683, "epoch": 7839} {"train_loss": -28.13675880432129, "global_step": 650684, "epoch": 7839} {"train_loss": -27.553543090820312, "global_step": 650685, "epoch": 7839} {"train_loss": -28.027448654174805, "global_step": 650686, "epoch": 7839} {"train_loss": -27.79751968383789, "global_step": 650687, "epoch": 7839} {"train_loss": -27.481689453125, "global_step": 650688, "epoch": 7839} {"train_loss": -27.846113204956055, "global_step": 650689, "epoch": 7839} {"train_loss": -28.33881950378418, "global_step": 650690, "epoch": 7839} {"train_loss": -27.69270133972168, "global_step": 650691, "epoch": 7839} {"train_loss": -27.47916030883789, "global_step": 650692, "epoch": 7839} {"train_loss": -28.279264450073242, "global_step": 650693, "epoch": 7839} {"train_loss": -27.987396240234375, "global_step": 650694, "epoch": 7839} {"train_loss": -28.0568904876709, "global_step": 650695, "epoch": 7839} {"train_loss": -28.09303092956543, "global_step": 650696, "epoch": 7839} {"train_loss": -28.09319496154785, "global_step": 650697, "epoch": 7839} {"train_loss": -27.848852157592773, "global_step": 650698, "epoch": 7839} {"train_loss": -28.170917510986328, "global_step": 650699, "epoch": 7839} {"train_loss": -27.925439834594727, "global_step": 650700, "epoch": 7839} {"train_loss": -27.847888946533203, "global_step": 650701, "epoch": 7839} {"train_loss": -27.62677001953125, "global_step": 650702, "epoch": 7839} {"train_loss": -28.51295280456543, "global_step": 650703, "epoch": 7839} {"train_loss": -27.9852294921875, "global_step": 650704, "epoch": 7839} {"train_loss": -28.546924591064453, "global_step": 650705, "epoch": 7839} {"train_loss": -27.974756240844727, "global_step": 650706, "epoch": 7839} {"train_loss": -27.978759765625, "global_step": 650707, "epoch": 7839} {"train_loss": -27.961318969726562, "global_step": 650708, "epoch": 7839} {"train_loss": -28.122602462768555, "global_step": 650709, "epoch": 7839} {"train_loss": -28.390628814697266, "global_step": 650710, "epoch": 7839} {"train_loss": -28.103778839111328, "global_step": 650711, "epoch": 7839} {"train_loss": -27.968103408813477, "global_step": 650712, "epoch": 7839} {"train_loss": -28.18104362487793, "global_step": 650713, "epoch": 7839} {"train_loss": -28.33209800720215, "global_step": 650714, "epoch": 7839} {"train_loss": -28.24823570251465, "global_step": 650715, "epoch": 7839} {"train_loss": -28.135974884033203, "global_step": 650716, "epoch": 7839} {"train_loss": -27.81171989440918, "global_step": 650717, "epoch": 7839} {"train_loss": -28.384119033813477, "global_step": 650718, "epoch": 7839} {"train_loss": -27.696905664650792, "global_step": 650719, "epoch": 7839, "val_loss": 6835155.0} {"train_loss": -27.080183029174805, "global_step": 650720, "epoch": 7840} {"train_loss": -26.96638298034668, "global_step": 650721, "epoch": 7840} {"train_loss": -26.677026748657227, "global_step": 650722, "epoch": 7840} {"train_loss": -27.395925521850586, "global_step": 650723, "epoch": 7840} {"train_loss": -27.399423599243164, "global_step": 650724, "epoch": 7840} {"train_loss": -27.758581161499023, "global_step": 650725, "epoch": 7840} {"train_loss": -27.265735626220703, "global_step": 650726, "epoch": 7840} {"train_loss": -26.955032348632812, "global_step": 650727, "epoch": 7840} {"train_loss": -27.50982093811035, "global_step": 650728, "epoch": 7840} {"train_loss": -27.661428451538086, "global_step": 650729, "epoch": 7840} {"train_loss": -27.50770378112793, "global_step": 650730, "epoch": 7840} {"train_loss": -27.669153213500977, "global_step": 650731, "epoch": 7840} {"train_loss": -27.44889259338379, "global_step": 650732, "epoch": 7840} {"train_loss": -27.99824333190918, "global_step": 650733, "epoch": 7840} {"train_loss": -27.47332763671875, "global_step": 650734, "epoch": 7840} {"train_loss": -28.046981811523438, "global_step": 650735, "epoch": 7840} {"train_loss": -27.76886558532715, "global_step": 650736, "epoch": 7840} {"train_loss": -27.728063583374023, "global_step": 650737, "epoch": 7840} {"train_loss": -27.708555221557617, "global_step": 650738, "epoch": 7840} {"train_loss": -27.65522575378418, "global_step": 650739, "epoch": 7840} {"train_loss": -27.79534339904785, "global_step": 650740, "epoch": 7840} {"train_loss": -27.823572158813477, "global_step": 650741, "epoch": 7840} {"train_loss": -28.064794540405273, "global_step": 650742, "epoch": 7840} {"train_loss": -27.78545570373535, "global_step": 650743, "epoch": 7840} {"train_loss": -28.107397079467773, "global_step": 650744, "epoch": 7840} {"train_loss": -28.219024658203125, "global_step": 650745, "epoch": 7840} {"train_loss": -28.173559188842773, "global_step": 650746, "epoch": 7840} {"train_loss": -28.0068359375, "global_step": 650747, "epoch": 7840} {"train_loss": -28.420307159423828, "global_step": 650748, "epoch": 7840} {"train_loss": -28.077468872070312, "global_step": 650749, "epoch": 7840} {"train_loss": -28.195852279663086, "global_step": 650750, "epoch": 7840} {"train_loss": -28.019683837890625, "global_step": 650751, "epoch": 7840} {"train_loss": -27.82485008239746, "global_step": 650752, "epoch": 7840} {"train_loss": -27.774372100830078, "global_step": 650753, "epoch": 7840} {"train_loss": -27.991107940673828, "global_step": 650754, "epoch": 7840} {"train_loss": -28.26313591003418, "global_step": 650755, "epoch": 7840} {"train_loss": -28.31068229675293, "global_step": 650756, "epoch": 7840} {"train_loss": -28.007699966430664, "global_step": 650757, "epoch": 7840} {"train_loss": -27.911832809448242, "global_step": 650758, "epoch": 7840} {"train_loss": -28.1103515625, "global_step": 650759, "epoch": 7840} {"train_loss": -28.06044578552246, "global_step": 650760, "epoch": 7840} {"train_loss": -28.194883346557617, "global_step": 650761, "epoch": 7840} {"train_loss": -28.367755889892578, "global_step": 650762, "epoch": 7840} {"train_loss": -28.323392868041992, "global_step": 650763, "epoch": 7840} {"train_loss": -28.264612197875977, "global_step": 650764, "epoch": 7840} {"train_loss": -27.945240020751953, "global_step": 650765, "epoch": 7840} {"train_loss": -28.08753776550293, "global_step": 650766, "epoch": 7840} {"train_loss": -28.060285568237305, "global_step": 650767, "epoch": 7840} {"train_loss": -28.213775634765625, "global_step": 650768, "epoch": 7840} {"train_loss": -28.506885528564453, "global_step": 650769, "epoch": 7840} {"train_loss": -28.513031005859375, "global_step": 650770, "epoch": 7840} {"train_loss": -28.331634521484375, "global_step": 650771, "epoch": 7840} {"train_loss": -28.403039932250977, "global_step": 650772, "epoch": 7840} {"train_loss": -27.913415908813477, "global_step": 650773, "epoch": 7840} {"train_loss": -28.32834243774414, "global_step": 650774, "epoch": 7840} {"train_loss": -28.316492080688477, "global_step": 650775, "epoch": 7840} {"train_loss": -28.36956787109375, "global_step": 650776, "epoch": 7840} {"train_loss": -27.742023468017578, "global_step": 650777, "epoch": 7840} {"train_loss": -28.23012351989746, "global_step": 650778, "epoch": 7840} {"train_loss": -28.118640899658203, "global_step": 650779, "epoch": 7840} {"train_loss": -28.41465187072754, "global_step": 650780, "epoch": 7840} {"train_loss": -28.135435104370117, "global_step": 650781, "epoch": 7840} {"train_loss": -27.8691463470459, "global_step": 650782, "epoch": 7840} {"train_loss": -28.197980880737305, "global_step": 650783, "epoch": 7840} {"train_loss": -28.191564559936523, "global_step": 650784, "epoch": 7840} {"train_loss": -28.1175537109375, "global_step": 650785, "epoch": 7840} {"train_loss": -28.03558921813965, "global_step": 650786, "epoch": 7840} {"train_loss": -28.427108764648438, "global_step": 650787, "epoch": 7840} {"train_loss": -27.564651489257812, "global_step": 650788, "epoch": 7840} {"train_loss": -28.4044132232666, "global_step": 650789, "epoch": 7840} {"train_loss": -28.693161010742188, "global_step": 650790, "epoch": 7840} {"train_loss": -27.504987716674805, "global_step": 650791, "epoch": 7840} {"train_loss": -27.9150390625, "global_step": 650792, "epoch": 7840} {"train_loss": -27.76483154296875, "global_step": 650793, "epoch": 7840} {"train_loss": -28.0036678314209, "global_step": 650794, "epoch": 7840} {"train_loss": -28.496871948242188, "global_step": 650795, "epoch": 7840} {"train_loss": -27.675968170166016, "global_step": 650796, "epoch": 7840} {"train_loss": -28.47613525390625, "global_step": 650797, "epoch": 7840} {"train_loss": -28.320356369018555, "global_step": 650798, "epoch": 7840} {"train_loss": -28.072980880737305, "global_step": 650799, "epoch": 7840} {"train_loss": -28.34433937072754, "global_step": 650800, "epoch": 7840} {"train_loss": -28.155256271362305, "global_step": 650801, "epoch": 7840} {"train_loss": -27.992893586675805, "global_step": 650802, "epoch": 7840, "val_loss": 6770765.0} {"train_loss": -26.801910400390625, "global_step": 650803, "epoch": 7841} {"train_loss": -26.524402618408203, "global_step": 650804, "epoch": 7841} {"train_loss": -26.916059494018555, "global_step": 650805, "epoch": 7841} {"train_loss": -27.42522621154785, "global_step": 650806, "epoch": 7841} {"train_loss": -26.73531150817871, "global_step": 650807, "epoch": 7841} {"train_loss": -27.28190040588379, "global_step": 650808, "epoch": 7841} {"train_loss": -27.460290908813477, "global_step": 650809, "epoch": 7841} {"train_loss": -27.441755294799805, "global_step": 650810, "epoch": 7841} {"train_loss": -27.857519149780273, "global_step": 650811, "epoch": 7841} {"train_loss": -27.469348907470703, "global_step": 650812, "epoch": 7841} {"train_loss": -27.83272361755371, "global_step": 650813, "epoch": 7841} {"train_loss": -27.99994468688965, "global_step": 650814, "epoch": 7841} {"train_loss": -28.03285026550293, "global_step": 650815, "epoch": 7841} {"train_loss": -27.703500747680664, "global_step": 650816, "epoch": 7841} {"train_loss": -27.869949340820312, "global_step": 650817, "epoch": 7841} {"train_loss": -28.035383224487305, "global_step": 650818, "epoch": 7841} {"train_loss": -27.41803550720215, "global_step": 650819, "epoch": 7841} {"train_loss": -27.6019287109375, "global_step": 650820, "epoch": 7841} {"train_loss": -28.16071891784668, "global_step": 650821, "epoch": 7841} {"train_loss": -27.920011520385742, "global_step": 650822, "epoch": 7841} {"train_loss": -27.9114990234375, "global_step": 650823, "epoch": 7841} {"train_loss": -27.729766845703125, "global_step": 650824, "epoch": 7841} {"train_loss": -28.1997127532959, "global_step": 650825, "epoch": 7841} {"train_loss": -28.310382843017578, "global_step": 650826, "epoch": 7841} {"train_loss": -27.891210556030273, "global_step": 650827, "epoch": 7841} {"train_loss": -28.13862419128418, "global_step": 650828, "epoch": 7841} {"train_loss": -28.053747177124023, "global_step": 650829, "epoch": 7841} {"train_loss": -27.627796173095703, "global_step": 650830, "epoch": 7841} {"train_loss": -28.149906158447266, "global_step": 650831, "epoch": 7841} {"train_loss": -28.315149307250977, "global_step": 650832, "epoch": 7841} {"train_loss": -27.9890193939209, "global_step": 650833, "epoch": 7841} {"train_loss": -27.677814483642578, "global_step": 650834, "epoch": 7841} {"train_loss": -27.67970085144043, "global_step": 650835, "epoch": 7841} {"train_loss": -28.11883544921875, "global_step": 650836, "epoch": 7841} {"train_loss": -28.198148727416992, "global_step": 650837, "epoch": 7841} {"train_loss": -28.187591552734375, "global_step": 650838, "epoch": 7841} {"train_loss": -28.009489059448242, "global_step": 650839, "epoch": 7841} {"train_loss": -28.061670303344727, "global_step": 650840, "epoch": 7841} {"train_loss": -28.559412002563477, "global_step": 650841, "epoch": 7841} {"train_loss": -28.28466796875, "global_step": 650842, "epoch": 7841} {"train_loss": -28.451496124267578, "global_step": 650843, "epoch": 7841} {"train_loss": -27.9580078125, "global_step": 650844, "epoch": 7841} {"train_loss": -28.430561065673828, "global_step": 650845, "epoch": 7841} {"train_loss": -28.703866958618164, "global_step": 650846, "epoch": 7841} {"train_loss": -28.85112953186035, "global_step": 650847, "epoch": 7841} {"train_loss": -28.10682487487793, "global_step": 650848, "epoch": 7841} {"train_loss": -28.542556762695312, "global_step": 650849, "epoch": 7841} {"train_loss": -28.420297622680664, "global_step": 650850, "epoch": 7841} {"train_loss": -28.74151039123535, "global_step": 650851, "epoch": 7841} {"train_loss": -28.714384078979492, "global_step": 650852, "epoch": 7841} {"train_loss": -28.77251625061035, "global_step": 650853, "epoch": 7841} {"train_loss": -28.19405174255371, "global_step": 650854, "epoch": 7841} {"train_loss": -28.60931968688965, "global_step": 650855, "epoch": 7841} {"train_loss": -28.494003295898438, "global_step": 650856, "epoch": 7841} {"train_loss": -28.63960838317871, "global_step": 650857, "epoch": 7841} {"train_loss": -28.477127075195312, "global_step": 650858, "epoch": 7841} {"train_loss": -28.721967697143555, "global_step": 650859, "epoch": 7841} {"train_loss": -28.55289077758789, "global_step": 650860, "epoch": 7841} {"train_loss": -28.549768447875977, "global_step": 650861, "epoch": 7841} {"train_loss": -28.594186782836914, "global_step": 650862, "epoch": 7841} {"train_loss": -28.521453857421875, "global_step": 650863, "epoch": 7841} {"train_loss": -29.008466720581055, "global_step": 650864, "epoch": 7841} {"train_loss": -28.450490951538086, "global_step": 650865, "epoch": 7841} {"train_loss": -28.393463134765625, "global_step": 650866, "epoch": 7841} {"train_loss": -28.356042861938477, "global_step": 650867, "epoch": 7841} {"train_loss": -28.748517990112305, "global_step": 650868, "epoch": 7841} {"train_loss": -28.702117919921875, "global_step": 650869, "epoch": 7841} {"train_loss": -27.763181686401367, "global_step": 650870, "epoch": 7841} {"train_loss": -27.80967140197754, "global_step": 650871, "epoch": 7841} {"train_loss": -27.838714599609375, "global_step": 650872, "epoch": 7841} {"train_loss": -27.3070125579834, "global_step": 650873, "epoch": 7841} {"train_loss": -27.810718536376953, "global_step": 650874, "epoch": 7841} {"train_loss": -28.235736846923828, "global_step": 650875, "epoch": 7841} {"train_loss": -28.27020263671875, "global_step": 650876, "epoch": 7841} {"train_loss": -28.058862686157227, "global_step": 650877, "epoch": 7841} {"train_loss": -28.42193031311035, "global_step": 650878, "epoch": 7841} {"train_loss": -28.33738136291504, "global_step": 650879, "epoch": 7841} {"train_loss": -27.93316650390625, "global_step": 650880, "epoch": 7841} {"train_loss": -28.292097091674805, "global_step": 650881, "epoch": 7841} {"train_loss": -28.34111976623535, "global_step": 650882, "epoch": 7841} {"train_loss": -27.882038116455078, "global_step": 650883, "epoch": 7841} {"train_loss": -28.04376792907715, "global_step": 650884, "epoch": 7841} {"train_loss": -28.096593351249236, "global_step": 650885, "epoch": 7841, "val_loss": 6730249.0} {"train_loss": -28.118488311767578, "global_step": 650886, "epoch": 7842} {"train_loss": -27.62714195251465, "global_step": 650887, "epoch": 7842} {"train_loss": -28.04388427734375, "global_step": 650888, "epoch": 7842} {"train_loss": -27.771142959594727, "global_step": 650889, "epoch": 7842} {"train_loss": -27.3441219329834, "global_step": 650890, "epoch": 7842} {"train_loss": -27.789304733276367, "global_step": 650891, "epoch": 7842} {"train_loss": -27.890827178955078, "global_step": 650892, "epoch": 7842} {"train_loss": -27.618804931640625, "global_step": 650893, "epoch": 7842} {"train_loss": -27.416446685791016, "global_step": 650894, "epoch": 7842} {"train_loss": -27.763105392456055, "global_step": 650895, "epoch": 7842} {"train_loss": -27.555028915405273, "global_step": 650896, "epoch": 7842} {"train_loss": -27.734771728515625, "global_step": 650897, "epoch": 7842} {"train_loss": -27.97145652770996, "global_step": 650898, "epoch": 7842} {"train_loss": -27.55497169494629, "global_step": 650899, "epoch": 7842} {"train_loss": -27.877368927001953, "global_step": 650900, "epoch": 7842} {"train_loss": -27.590497970581055, "global_step": 650901, "epoch": 7842} {"train_loss": -28.10513687133789, "global_step": 650902, "epoch": 7842} {"train_loss": -27.995269775390625, "global_step": 650903, "epoch": 7842} {"train_loss": -28.568359375, "global_step": 650904, "epoch": 7842} {"train_loss": -28.060871124267578, "global_step": 650905, "epoch": 7842} {"train_loss": -28.046533584594727, "global_step": 650906, "epoch": 7842} {"train_loss": -28.0965633392334, "global_step": 650907, "epoch": 7842} {"train_loss": -28.145477294921875, "global_step": 650908, "epoch": 7842} {"train_loss": -27.905349731445312, "global_step": 650909, "epoch": 7842} {"train_loss": -28.310026168823242, "global_step": 650910, "epoch": 7842} {"train_loss": -28.29303550720215, "global_step": 650911, "epoch": 7842} {"train_loss": -27.93733787536621, "global_step": 650912, "epoch": 7842} {"train_loss": -28.129133224487305, "global_step": 650913, "epoch": 7842} {"train_loss": -28.120508193969727, "global_step": 650914, "epoch": 7842} {"train_loss": -28.147565841674805, "global_step": 650915, "epoch": 7842} {"train_loss": -28.463911056518555, "global_step": 650916, "epoch": 7842} {"train_loss": -28.19736671447754, "global_step": 650917, "epoch": 7842} {"train_loss": -28.413440704345703, "global_step": 650918, "epoch": 7842} {"train_loss": -28.516361236572266, "global_step": 650919, "epoch": 7842} {"train_loss": -27.91162109375, "global_step": 650920, "epoch": 7842} {"train_loss": -28.46675682067871, "global_step": 650921, "epoch": 7842} {"train_loss": -28.48866081237793, "global_step": 650922, "epoch": 7842} {"train_loss": -28.516149520874023, "global_step": 650923, "epoch": 7842} {"train_loss": -28.299884796142578, "global_step": 650924, "epoch": 7842} {"train_loss": -28.588565826416016, "global_step": 650925, "epoch": 7842} {"train_loss": -28.368915557861328, "global_step": 650926, "epoch": 7842} {"train_loss": -28.682966232299805, "global_step": 650927, "epoch": 7842} {"train_loss": -28.18001365661621, "global_step": 650928, "epoch": 7842} {"train_loss": -28.86298179626465, "global_step": 650929, "epoch": 7842} {"train_loss": -28.12165641784668, "global_step": 650930, "epoch": 7842} {"train_loss": -28.290796279907227, "global_step": 650931, "epoch": 7842} {"train_loss": -28.464344024658203, "global_step": 650932, "epoch": 7842} {"train_loss": -28.52303123474121, "global_step": 650933, "epoch": 7842} {"train_loss": -28.38193702697754, "global_step": 650934, "epoch": 7842} {"train_loss": -27.87867546081543, "global_step": 650935, "epoch": 7842} {"train_loss": -28.17510986328125, "global_step": 650936, "epoch": 7842} {"train_loss": -28.305328369140625, "global_step": 650937, "epoch": 7842} {"train_loss": -28.681554794311523, "global_step": 650938, "epoch": 7842} {"train_loss": -27.923349380493164, "global_step": 650939, "epoch": 7842} {"train_loss": -28.51436424255371, "global_step": 650940, "epoch": 7842} {"train_loss": -28.73828125, "global_step": 650941, "epoch": 7842} {"train_loss": -28.606977462768555, "global_step": 650942, "epoch": 7842} {"train_loss": -28.48883628845215, "global_step": 650943, "epoch": 7842} {"train_loss": -28.469751358032227, "global_step": 650944, "epoch": 7842} {"train_loss": -28.5701961517334, "global_step": 650945, "epoch": 7842} {"train_loss": -28.389755249023438, "global_step": 650946, "epoch": 7842} {"train_loss": -28.050214767456055, "global_step": 650947, "epoch": 7842} {"train_loss": -28.317920684814453, "global_step": 650948, "epoch": 7842} {"train_loss": -28.32065200805664, "global_step": 650949, "epoch": 7842} {"train_loss": -28.227949142456055, "global_step": 650950, "epoch": 7842} {"train_loss": -28.180130004882812, "global_step": 650951, "epoch": 7842} {"train_loss": -28.359365463256836, "global_step": 650952, "epoch": 7842} {"train_loss": -28.413557052612305, "global_step": 650953, "epoch": 7842} {"train_loss": -28.513212203979492, "global_step": 650954, "epoch": 7842} {"train_loss": -28.51825523376465, "global_step": 650955, "epoch": 7842} {"train_loss": -28.09413719177246, "global_step": 650956, "epoch": 7842} {"train_loss": -28.774255752563477, "global_step": 650957, "epoch": 7842} {"train_loss": -28.143192291259766, "global_step": 650958, "epoch": 7842} {"train_loss": -28.256885528564453, "global_step": 650959, "epoch": 7842} {"train_loss": -28.211673736572266, "global_step": 650960, "epoch": 7842} {"train_loss": -28.271228790283203, "global_step": 650961, "epoch": 7842} {"train_loss": -28.155929565429688, "global_step": 650962, "epoch": 7842} {"train_loss": -28.311689376831055, "global_step": 650963, "epoch": 7842} {"train_loss": -28.268774032592773, "global_step": 650964, "epoch": 7842} {"train_loss": -27.853906631469727, "global_step": 650965, "epoch": 7842} {"train_loss": -28.089262008666992, "global_step": 650966, "epoch": 7842} {"train_loss": -28.1315975189209, "global_step": 650967, "epoch": 7842} {"train_loss": -28.195748892175146, "global_step": 650968, "epoch": 7842, "val_loss": 6704269.5} {"train_loss": -27.873777389526367, "global_step": 650969, "epoch": 7843} {"train_loss": -27.968902587890625, "global_step": 650970, "epoch": 7843} {"train_loss": -27.80817222595215, "global_step": 650971, "epoch": 7843} {"train_loss": -27.808507919311523, "global_step": 650972, "epoch": 7843} {"train_loss": -28.144433975219727, "global_step": 650973, "epoch": 7843} {"train_loss": -28.17376708984375, "global_step": 650974, "epoch": 7843} {"train_loss": -28.00431251525879, "global_step": 650975, "epoch": 7843} {"train_loss": -28.131750106811523, "global_step": 650976, "epoch": 7843} {"train_loss": -28.409366607666016, "global_step": 650977, "epoch": 7843} {"train_loss": -28.221179962158203, "global_step": 650978, "epoch": 7843} {"train_loss": -28.285383224487305, "global_step": 650979, "epoch": 7843} {"train_loss": -28.043628692626953, "global_step": 650980, "epoch": 7843} {"train_loss": -28.380090713500977, "global_step": 650981, "epoch": 7843} {"train_loss": -28.187744140625, "global_step": 650982, "epoch": 7843} {"train_loss": -28.044031143188477, "global_step": 650983, "epoch": 7843} {"train_loss": -28.055713653564453, "global_step": 650984, "epoch": 7843} {"train_loss": -28.118860244750977, "global_step": 650985, "epoch": 7843} {"train_loss": -28.132471084594727, "global_step": 650986, "epoch": 7843} {"train_loss": -28.213403701782227, "global_step": 650987, "epoch": 7843} {"train_loss": -28.33847999572754, "global_step": 650988, "epoch": 7843} {"train_loss": -28.27117347717285, "global_step": 650989, "epoch": 7843} {"train_loss": -28.514013290405273, "global_step": 650990, "epoch": 7843} {"train_loss": -27.960622787475586, "global_step": 650991, "epoch": 7843} {"train_loss": -27.842763900756836, "global_step": 650992, "epoch": 7843} {"train_loss": -27.97113609313965, "global_step": 650993, "epoch": 7843} {"train_loss": -28.1333065032959, "global_step": 650994, "epoch": 7843} {"train_loss": -28.4344482421875, "global_step": 650995, "epoch": 7843} {"train_loss": -28.6817626953125, "global_step": 650996, "epoch": 7843} {"train_loss": -27.79363441467285, "global_step": 650997, "epoch": 7843} {"train_loss": -28.243871688842773, "global_step": 650998, "epoch": 7843} {"train_loss": -28.621267318725586, "global_step": 650999, "epoch": 7843} {"train_loss": -28.318195343017578, "global_step": 651000, "epoch": 7843} {"train_loss": -27.9625244140625, "global_step": 651001, "epoch": 7843} {"train_loss": -28.213586807250977, "global_step": 651002, "epoch": 7843} {"train_loss": -28.31732177734375, "global_step": 651003, "epoch": 7843} {"train_loss": -28.435632705688477, "global_step": 651004, "epoch": 7843} {"train_loss": -28.025314331054688, "global_step": 651005, "epoch": 7843} {"train_loss": -28.40215492248535, "global_step": 651006, "epoch": 7843} {"train_loss": -28.25848388671875, "global_step": 651007, "epoch": 7843} {"train_loss": -28.758642196655273, "global_step": 651008, "epoch": 7843} {"train_loss": -28.70026969909668, "global_step": 651009, "epoch": 7843} {"train_loss": -28.454511642456055, "global_step": 651010, "epoch": 7843} {"train_loss": -28.474689483642578, "global_step": 651011, "epoch": 7843} {"train_loss": -28.5555477142334, "global_step": 651012, "epoch": 7843} {"train_loss": -28.851093292236328, "global_step": 651013, "epoch": 7843} {"train_loss": -28.51399803161621, "global_step": 651014, "epoch": 7843} {"train_loss": -28.229984283447266, "global_step": 651015, "epoch": 7843} {"train_loss": -27.958770751953125, "global_step": 651016, "epoch": 7843} {"train_loss": -27.990924835205078, "global_step": 651017, "epoch": 7843} {"train_loss": -28.31855583190918, "global_step": 651018, "epoch": 7843} {"train_loss": -28.58909034729004, "global_step": 651019, "epoch": 7843} {"train_loss": -28.072174072265625, "global_step": 651020, "epoch": 7843} {"train_loss": -28.08917808532715, "global_step": 651021, "epoch": 7843} {"train_loss": -27.76612663269043, "global_step": 651022, "epoch": 7843} {"train_loss": -27.79952049255371, "global_step": 651023, "epoch": 7843} {"train_loss": -27.766836166381836, "global_step": 651024, "epoch": 7843} {"train_loss": -27.512731552124023, "global_step": 651025, "epoch": 7843} {"train_loss": -28.221403121948242, "global_step": 651026, "epoch": 7843} {"train_loss": -27.88654136657715, "global_step": 651027, "epoch": 7843} {"train_loss": -28.089008331298828, "global_step": 651028, "epoch": 7843} {"train_loss": -28.340381622314453, "global_step": 651029, "epoch": 7843} {"train_loss": -28.01836585998535, "global_step": 651030, "epoch": 7843} {"train_loss": -27.732751846313477, "global_step": 651031, "epoch": 7843} {"train_loss": -27.702289581298828, "global_step": 651032, "epoch": 7843} {"train_loss": -27.97877311706543, "global_step": 651033, "epoch": 7843} {"train_loss": -28.452926635742188, "global_step": 651034, "epoch": 7843} {"train_loss": -28.249114990234375, "global_step": 651035, "epoch": 7843} {"train_loss": -28.088220596313477, "global_step": 651036, "epoch": 7843} {"train_loss": -27.980783462524414, "global_step": 651037, "epoch": 7843} {"train_loss": -28.005264282226562, "global_step": 651038, "epoch": 7843} {"train_loss": -28.070783615112305, "global_step": 651039, "epoch": 7843} {"train_loss": -27.83521842956543, "global_step": 651040, "epoch": 7843} {"train_loss": -27.917388916015625, "global_step": 651041, "epoch": 7843} {"train_loss": -28.300939559936523, "global_step": 651042, "epoch": 7843} {"train_loss": -28.215930938720703, "global_step": 651043, "epoch": 7843} {"train_loss": -28.53215980529785, "global_step": 651044, "epoch": 7843} {"train_loss": -28.22893714904785, "global_step": 651045, "epoch": 7843} {"train_loss": -28.498987197875977, "global_step": 651046, "epoch": 7843} {"train_loss": -28.298688888549805, "global_step": 651047, "epoch": 7843} {"train_loss": -28.079404830932617, "global_step": 651048, "epoch": 7843} {"train_loss": -28.488279342651367, "global_step": 651049, "epoch": 7843} {"train_loss": -28.35337257385254, "global_step": 651050, "epoch": 7843} {"train_loss": -28.180358404136566, "global_step": 651051, "epoch": 7843, "val_loss": 6757753.0} {"train_loss": -28.07052993774414, "global_step": 651052, "epoch": 7844} {"train_loss": -27.55803871154785, "global_step": 651053, "epoch": 7844} {"train_loss": -27.6041316986084, "global_step": 651054, "epoch": 7844} {"train_loss": -28.11774253845215, "global_step": 651055, "epoch": 7844} {"train_loss": -28.14361000061035, "global_step": 651056, "epoch": 7844} {"train_loss": -28.121423721313477, "global_step": 651057, "epoch": 7844} {"train_loss": -28.31475830078125, "global_step": 651058, "epoch": 7844} {"train_loss": -28.360748291015625, "global_step": 651059, "epoch": 7844} {"train_loss": -27.79840087890625, "global_step": 651060, "epoch": 7844} {"train_loss": -27.583911895751953, "global_step": 651061, "epoch": 7844} {"train_loss": -28.480152130126953, "global_step": 651062, "epoch": 7844} {"train_loss": -28.16724967956543, "global_step": 651063, "epoch": 7844} {"train_loss": -28.3361759185791, "global_step": 651064, "epoch": 7844} {"train_loss": -28.478851318359375, "global_step": 651065, "epoch": 7844} {"train_loss": -28.181869506835938, "global_step": 651066, "epoch": 7844} {"train_loss": -28.191343307495117, "global_step": 651067, "epoch": 7844} {"train_loss": -28.481922149658203, "global_step": 651068, "epoch": 7844} {"train_loss": -28.51373863220215, "global_step": 651069, "epoch": 7844} {"train_loss": -28.182758331298828, "global_step": 651070, "epoch": 7844} {"train_loss": -28.302478790283203, "global_step": 651071, "epoch": 7844} {"train_loss": -27.937543869018555, "global_step": 651072, "epoch": 7844} {"train_loss": -28.639135360717773, "global_step": 651073, "epoch": 7844} {"train_loss": -28.170392990112305, "global_step": 651074, "epoch": 7844} {"train_loss": -28.736865997314453, "global_step": 651075, "epoch": 7844} {"train_loss": -28.6387882232666, "global_step": 651076, "epoch": 7844} {"train_loss": -28.005558013916016, "global_step": 651077, "epoch": 7844} {"train_loss": -28.425857543945312, "global_step": 651078, "epoch": 7844} {"train_loss": -28.31165885925293, "global_step": 651079, "epoch": 7844} {"train_loss": -28.473255157470703, "global_step": 651080, "epoch": 7844} {"train_loss": -28.27601432800293, "global_step": 651081, "epoch": 7844} {"train_loss": -27.66575050354004, "global_step": 651082, "epoch": 7844} {"train_loss": -28.043813705444336, "global_step": 651083, "epoch": 7844} {"train_loss": -28.38508415222168, "global_step": 651084, "epoch": 7844} {"train_loss": -27.89888572692871, "global_step": 651085, "epoch": 7844} {"train_loss": -27.736129760742188, "global_step": 651086, "epoch": 7844} {"train_loss": -28.09161949157715, "global_step": 651087, "epoch": 7844} {"train_loss": -28.3104305267334, "global_step": 651088, "epoch": 7844} {"train_loss": -28.102445602416992, "global_step": 651089, "epoch": 7844} {"train_loss": -28.38521385192871, "global_step": 651090, "epoch": 7844} {"train_loss": -28.195287704467773, "global_step": 651091, "epoch": 7844} {"train_loss": -27.956064224243164, "global_step": 651092, "epoch": 7844} {"train_loss": -28.198150634765625, "global_step": 651093, "epoch": 7844} {"train_loss": -28.239267349243164, "global_step": 651094, "epoch": 7844} {"train_loss": -28.314355850219727, "global_step": 651095, "epoch": 7844} {"train_loss": -27.942291259765625, "global_step": 651096, "epoch": 7844} {"train_loss": -28.5062255859375, "global_step": 651097, "epoch": 7844} {"train_loss": -28.29249382019043, "global_step": 651098, "epoch": 7844} {"train_loss": -28.634077072143555, "global_step": 651099, "epoch": 7844} {"train_loss": -28.560659408569336, "global_step": 651100, "epoch": 7844} {"train_loss": -28.30291748046875, "global_step": 651101, "epoch": 7844} {"train_loss": -28.322790145874023, "global_step": 651102, "epoch": 7844} {"train_loss": -28.149688720703125, "global_step": 651103, "epoch": 7844} {"train_loss": -28.402978897094727, "global_step": 651104, "epoch": 7844} {"train_loss": -28.325475692749023, "global_step": 651105, "epoch": 7844} {"train_loss": -28.6865291595459, "global_step": 651106, "epoch": 7844} {"train_loss": -28.33697509765625, "global_step": 651107, "epoch": 7844} {"train_loss": -28.405847549438477, "global_step": 651108, "epoch": 7844} {"train_loss": -28.39192771911621, "global_step": 651109, "epoch": 7844} {"train_loss": -28.281208038330078, "global_step": 651110, "epoch": 7844} {"train_loss": -28.429197311401367, "global_step": 651111, "epoch": 7844} {"train_loss": -28.28814697265625, "global_step": 651112, "epoch": 7844} {"train_loss": -28.165760040283203, "global_step": 651113, "epoch": 7844} {"train_loss": -28.5301570892334, "global_step": 651114, "epoch": 7844} {"train_loss": -28.430906295776367, "global_step": 651115, "epoch": 7844} {"train_loss": -28.425561904907227, "global_step": 651116, "epoch": 7844} {"train_loss": -28.3748779296875, "global_step": 651117, "epoch": 7844} {"train_loss": -28.27332878112793, "global_step": 651118, "epoch": 7844} {"train_loss": -28.389509201049805, "global_step": 651119, "epoch": 7844} {"train_loss": -28.342166900634766, "global_step": 651120, "epoch": 7844} {"train_loss": -28.39566993713379, "global_step": 651121, "epoch": 7844} {"train_loss": -28.149738311767578, "global_step": 651122, "epoch": 7844} {"train_loss": -28.48113441467285, "global_step": 651123, "epoch": 7844} {"train_loss": -28.342493057250977, "global_step": 651124, "epoch": 7844} {"train_loss": -28.487268447875977, "global_step": 651125, "epoch": 7844} {"train_loss": -28.561370849609375, "global_step": 651126, "epoch": 7844} {"train_loss": -28.42942237854004, "global_step": 651127, "epoch": 7844} {"train_loss": -28.586551666259766, "global_step": 651128, "epoch": 7844} {"train_loss": -28.6191463470459, "global_step": 651129, "epoch": 7844} {"train_loss": -28.355670928955078, "global_step": 651130, "epoch": 7844} {"train_loss": -28.53519058227539, "global_step": 651131, "epoch": 7844} {"train_loss": -28.6024227142334, "global_step": 651132, "epoch": 7844} {"train_loss": -28.394567489624023, "global_step": 651133, "epoch": 7844} {"train_loss": -28.290336815707654, "global_step": 651134, "epoch": 7844, "val_loss": 6690641.0} {"train_loss": -27.570478439331055, "global_step": 651135, "epoch": 7845} {"train_loss": -27.9401912689209, "global_step": 651136, "epoch": 7845} {"train_loss": -28.133405685424805, "global_step": 651137, "epoch": 7845} {"train_loss": -27.778003692626953, "global_step": 651138, "epoch": 7845} {"train_loss": -27.791406631469727, "global_step": 651139, "epoch": 7845} {"train_loss": -27.847909927368164, "global_step": 651140, "epoch": 7845} {"train_loss": -27.665185928344727, "global_step": 651141, "epoch": 7845} {"train_loss": -27.456253051757812, "global_step": 651142, "epoch": 7845} {"train_loss": -28.104055404663086, "global_step": 651143, "epoch": 7845} {"train_loss": -27.619953155517578, "global_step": 651144, "epoch": 7845} {"train_loss": -28.066274642944336, "global_step": 651145, "epoch": 7845} {"train_loss": -28.248281478881836, "global_step": 651146, "epoch": 7845} {"train_loss": -28.118865966796875, "global_step": 651147, "epoch": 7845} {"train_loss": -28.28498649597168, "global_step": 651148, "epoch": 7845} {"train_loss": -27.9603271484375, "global_step": 651149, "epoch": 7845} {"train_loss": -28.1563720703125, "global_step": 651150, "epoch": 7845} {"train_loss": -27.9750919342041, "global_step": 651151, "epoch": 7845} {"train_loss": -28.222936630249023, "global_step": 651152, "epoch": 7845} {"train_loss": -28.06083106994629, "global_step": 651153, "epoch": 7845} {"train_loss": -27.87564468383789, "global_step": 651154, "epoch": 7845} {"train_loss": -27.964828491210938, "global_step": 651155, "epoch": 7845} {"train_loss": -28.46808433532715, "global_step": 651156, "epoch": 7845} {"train_loss": -28.38435935974121, "global_step": 651157, "epoch": 7845} {"train_loss": -28.101736068725586, "global_step": 651158, "epoch": 7845} {"train_loss": -27.892730712890625, "global_step": 651159, "epoch": 7845} {"train_loss": -27.923429489135742, "global_step": 651160, "epoch": 7845} {"train_loss": -27.526702880859375, "global_step": 651161, "epoch": 7845} {"train_loss": -27.565582275390625, "global_step": 651162, "epoch": 7845} {"train_loss": -27.721555709838867, "global_step": 651163, "epoch": 7845} {"train_loss": -28.090377807617188, "global_step": 651164, "epoch": 7845} {"train_loss": -27.901731491088867, "global_step": 651165, "epoch": 7845} {"train_loss": -27.98427391052246, "global_step": 651166, "epoch": 7845} {"train_loss": -28.26527976989746, "global_step": 651167, "epoch": 7845} {"train_loss": -27.929792404174805, "global_step": 651168, "epoch": 7845} {"train_loss": -28.308338165283203, "global_step": 651169, "epoch": 7845} {"train_loss": -28.265241622924805, "global_step": 651170, "epoch": 7845} {"train_loss": -28.275548934936523, "global_step": 651171, "epoch": 7845} {"train_loss": -28.096405029296875, "global_step": 651172, "epoch": 7845} {"train_loss": -28.184507369995117, "global_step": 651173, "epoch": 7845} {"train_loss": -28.383514404296875, "global_step": 651174, "epoch": 7845} {"train_loss": -28.069778442382812, "global_step": 651175, "epoch": 7845} {"train_loss": -28.202178955078125, "global_step": 651176, "epoch": 7845} {"train_loss": -27.827743530273438, "global_step": 651177, "epoch": 7845} {"train_loss": -28.297428131103516, "global_step": 651178, "epoch": 7845} {"train_loss": -28.2580509185791, "global_step": 651179, "epoch": 7845} {"train_loss": -28.176589965820312, "global_step": 651180, "epoch": 7845} {"train_loss": -28.351842880249023, "global_step": 651181, "epoch": 7845} {"train_loss": -28.261505126953125, "global_step": 651182, "epoch": 7845} {"train_loss": -28.350650787353516, "global_step": 651183, "epoch": 7845} {"train_loss": -28.37518310546875, "global_step": 651184, "epoch": 7845} {"train_loss": -28.085494995117188, "global_step": 651185, "epoch": 7845} {"train_loss": -28.19565773010254, "global_step": 651186, "epoch": 7845} {"train_loss": -28.593067169189453, "global_step": 651187, "epoch": 7845} {"train_loss": -28.14499855041504, "global_step": 651188, "epoch": 7845} {"train_loss": -28.196996688842773, "global_step": 651189, "epoch": 7845} {"train_loss": -28.256397247314453, "global_step": 651190, "epoch": 7845} {"train_loss": -28.001815795898438, "global_step": 651191, "epoch": 7845} {"train_loss": -28.49534034729004, "global_step": 651192, "epoch": 7845} {"train_loss": -27.846120834350586, "global_step": 651193, "epoch": 7845} {"train_loss": -28.60910415649414, "global_step": 651194, "epoch": 7845} {"train_loss": -28.054540634155273, "global_step": 651195, "epoch": 7845} {"train_loss": -28.279218673706055, "global_step": 651196, "epoch": 7845} {"train_loss": -28.533857345581055, "global_step": 651197, "epoch": 7845} {"train_loss": -28.366230010986328, "global_step": 651198, "epoch": 7845} {"train_loss": -28.102264404296875, "global_step": 651199, "epoch": 7845} {"train_loss": -28.245874404907227, "global_step": 651200, "epoch": 7845} {"train_loss": -28.048328399658203, "global_step": 651201, "epoch": 7845} {"train_loss": -28.292072296142578, "global_step": 651202, "epoch": 7845} {"train_loss": -28.383779525756836, "global_step": 651203, "epoch": 7845} {"train_loss": -28.392780303955078, "global_step": 651204, "epoch": 7845} {"train_loss": -28.485824584960938, "global_step": 651205, "epoch": 7845} {"train_loss": -28.506595611572266, "global_step": 651206, "epoch": 7845} {"train_loss": -28.147756576538086, "global_step": 651207, "epoch": 7845} {"train_loss": -28.312570571899414, "global_step": 651208, "epoch": 7845} {"train_loss": -28.593585968017578, "global_step": 651209, "epoch": 7845} {"train_loss": -28.48355484008789, "global_step": 651210, "epoch": 7845} {"train_loss": -28.058597564697266, "global_step": 651211, "epoch": 7845} {"train_loss": -28.556842803955078, "global_step": 651212, "epoch": 7845} {"train_loss": -28.162567138671875, "global_step": 651213, "epoch": 7845} {"train_loss": -28.608503341674805, "global_step": 651214, "epoch": 7845} {"train_loss": -28.697912216186523, "global_step": 651215, "epoch": 7845} {"train_loss": -28.824384689331055, "global_step": 651216, "epoch": 7845} {"train_loss": -28.167027186198407, "global_step": 651217, "epoch": 7845, "val_loss": 6664428.5} {"train_loss": -27.034378051757812, "global_step": 651218, "epoch": 7846} {"train_loss": -27.51820945739746, "global_step": 651219, "epoch": 7846} {"train_loss": -26.54573631286621, "global_step": 651220, "epoch": 7846} {"train_loss": -25.332799911499023, "global_step": 651221, "epoch": 7846} {"train_loss": -25.441207885742188, "global_step": 651222, "epoch": 7846} {"train_loss": -26.623014450073242, "global_step": 651223, "epoch": 7846} {"train_loss": -26.99955177307129, "global_step": 651224, "epoch": 7846} {"train_loss": -27.361129760742188, "global_step": 651225, "epoch": 7846} {"train_loss": -26.691116333007812, "global_step": 651226, "epoch": 7846} {"train_loss": -26.828638076782227, "global_step": 651227, "epoch": 7846} {"train_loss": -27.540700912475586, "global_step": 651228, "epoch": 7846} {"train_loss": -27.633853912353516, "global_step": 651229, "epoch": 7846} {"train_loss": -27.490888595581055, "global_step": 651230, "epoch": 7846} {"train_loss": -27.36113929748535, "global_step": 651231, "epoch": 7846} {"train_loss": -27.25006103515625, "global_step": 651232, "epoch": 7846} {"train_loss": -27.328887939453125, "global_step": 651233, "epoch": 7846} {"train_loss": -27.607030868530273, "global_step": 651234, "epoch": 7846} {"train_loss": -27.610309600830078, "global_step": 651235, "epoch": 7846} {"train_loss": -27.585742950439453, "global_step": 651236, "epoch": 7846} {"train_loss": -27.66547966003418, "global_step": 651237, "epoch": 7846} {"train_loss": -27.21331787109375, "global_step": 651238, "epoch": 7846} {"train_loss": -27.699636459350586, "global_step": 651239, "epoch": 7846} {"train_loss": -27.769012451171875, "global_step": 651240, "epoch": 7846} {"train_loss": -27.677457809448242, "global_step": 651241, "epoch": 7846} {"train_loss": -27.77685546875, "global_step": 651242, "epoch": 7846} {"train_loss": -27.622106552124023, "global_step": 651243, "epoch": 7846} {"train_loss": -28.077503204345703, "global_step": 651244, "epoch": 7846} {"train_loss": -27.652212142944336, "global_step": 651245, "epoch": 7846} {"train_loss": -27.207279205322266, "global_step": 651246, "epoch": 7846} {"train_loss": -27.63553237915039, "global_step": 651247, "epoch": 7846} {"train_loss": -28.170873641967773, "global_step": 651248, "epoch": 7846} {"train_loss": -27.66888999938965, "global_step": 651249, "epoch": 7846} {"train_loss": -28.00638198852539, "global_step": 651250, "epoch": 7846} {"train_loss": -27.767215728759766, "global_step": 651251, "epoch": 7846} {"train_loss": -27.57399559020996, "global_step": 651252, "epoch": 7846} {"train_loss": -27.835712432861328, "global_step": 651253, "epoch": 7846} {"train_loss": -28.126575469970703, "global_step": 651254, "epoch": 7846} {"train_loss": -28.18759536743164, "global_step": 651255, "epoch": 7846} {"train_loss": -27.962385177612305, "global_step": 651256, "epoch": 7846} {"train_loss": -27.898008346557617, "global_step": 651257, "epoch": 7846} {"train_loss": -28.38825798034668, "global_step": 651258, "epoch": 7846} {"train_loss": -28.29231071472168, "global_step": 651259, "epoch": 7846} {"train_loss": -28.190601348876953, "global_step": 651260, "epoch": 7846} {"train_loss": -28.41632080078125, "global_step": 651261, "epoch": 7846} {"train_loss": -27.87847328186035, "global_step": 651262, "epoch": 7846} {"train_loss": -28.15638542175293, "global_step": 651263, "epoch": 7846} {"train_loss": -28.24065589904785, "global_step": 651264, "epoch": 7846} {"train_loss": -28.25787353515625, "global_step": 651265, "epoch": 7846} {"train_loss": -28.132177352905273, "global_step": 651266, "epoch": 7846} {"train_loss": -28.24579429626465, "global_step": 651267, "epoch": 7846} {"train_loss": -28.26520347595215, "global_step": 651268, "epoch": 7846} {"train_loss": -28.05128288269043, "global_step": 651269, "epoch": 7846} {"train_loss": -28.338687896728516, "global_step": 651270, "epoch": 7846} {"train_loss": -28.132837295532227, "global_step": 651271, "epoch": 7846} {"train_loss": -28.3912296295166, "global_step": 651272, "epoch": 7846} {"train_loss": -28.558828353881836, "global_step": 651273, "epoch": 7846} {"train_loss": -27.692840576171875, "global_step": 651274, "epoch": 7846} {"train_loss": -27.590234756469727, "global_step": 651275, "epoch": 7846} {"train_loss": -27.704504013061523, "global_step": 651276, "epoch": 7846} {"train_loss": -28.205947875976562, "global_step": 651277, "epoch": 7846} {"train_loss": -27.95076560974121, "global_step": 651278, "epoch": 7846} {"train_loss": -27.943082809448242, "global_step": 651279, "epoch": 7846} {"train_loss": -28.129074096679688, "global_step": 651280, "epoch": 7846} {"train_loss": -28.1035099029541, "global_step": 651281, "epoch": 7846} {"train_loss": -28.266071319580078, "global_step": 651282, "epoch": 7846} {"train_loss": -27.855566024780273, "global_step": 651283, "epoch": 7846} {"train_loss": -28.0308895111084, "global_step": 651284, "epoch": 7846} {"train_loss": -28.32842445373535, "global_step": 651285, "epoch": 7846} {"train_loss": -28.484256744384766, "global_step": 651286, "epoch": 7846} {"train_loss": -28.326385498046875, "global_step": 651287, "epoch": 7846} {"train_loss": -28.49139976501465, "global_step": 651288, "epoch": 7846} {"train_loss": -28.841907501220703, "global_step": 651289, "epoch": 7846} {"train_loss": -28.6016902923584, "global_step": 651290, "epoch": 7846} {"train_loss": -28.205732345581055, "global_step": 651291, "epoch": 7846} {"train_loss": -28.3242244720459, "global_step": 651292, "epoch": 7846} {"train_loss": -28.224058151245117, "global_step": 651293, "epoch": 7846} {"train_loss": -28.46796989440918, "global_step": 651294, "epoch": 7846} {"train_loss": -28.500335693359375, "global_step": 651295, "epoch": 7846} {"train_loss": -28.24934196472168, "global_step": 651296, "epoch": 7846} {"train_loss": -28.43218994140625, "global_step": 651297, "epoch": 7846} {"train_loss": -28.026931762695312, "global_step": 651298, "epoch": 7846} {"train_loss": -28.1761531829834, "global_step": 651299, "epoch": 7846} {"train_loss": -27.841445348348962, "global_step": 651300, "epoch": 7846, "val_loss": 6592882.0} {"train_loss": -27.623249053955078, "global_step": 651301, "epoch": 7847} {"train_loss": -28.26759147644043, "global_step": 651302, "epoch": 7847} {"train_loss": -27.96784019470215, "global_step": 651303, "epoch": 7847} {"train_loss": -27.698286056518555, "global_step": 651304, "epoch": 7847} {"train_loss": -27.968732833862305, "global_step": 651305, "epoch": 7847} {"train_loss": -28.121076583862305, "global_step": 651306, "epoch": 7847} {"train_loss": -28.169336318969727, "global_step": 651307, "epoch": 7847} {"train_loss": -28.506616592407227, "global_step": 651308, "epoch": 7847} {"train_loss": -28.40460205078125, "global_step": 651309, "epoch": 7847} {"train_loss": -27.92377281188965, "global_step": 651310, "epoch": 7847} {"train_loss": -28.33564567565918, "global_step": 651311, "epoch": 7847} {"train_loss": -28.531585693359375, "global_step": 651312, "epoch": 7847} {"train_loss": -28.289823532104492, "global_step": 651313, "epoch": 7847} {"train_loss": -28.21070671081543, "global_step": 651314, "epoch": 7847} {"train_loss": -27.571685791015625, "global_step": 651315, "epoch": 7847} {"train_loss": -27.07623863220215, "global_step": 651316, "epoch": 7847} {"train_loss": -27.273283004760742, "global_step": 651317, "epoch": 7847} {"train_loss": -27.905607223510742, "global_step": 651318, "epoch": 7847} {"train_loss": -28.154996871948242, "global_step": 651319, "epoch": 7847} {"train_loss": -28.295196533203125, "global_step": 651320, "epoch": 7847} {"train_loss": -28.197467803955078, "global_step": 651321, "epoch": 7847} {"train_loss": -28.328229904174805, "global_step": 651322, "epoch": 7847} {"train_loss": -28.63411521911621, "global_step": 651323, "epoch": 7847} {"train_loss": -27.87335205078125, "global_step": 651324, "epoch": 7847} {"train_loss": -28.603195190429688, "global_step": 651325, "epoch": 7847} {"train_loss": -28.432722091674805, "global_step": 651326, "epoch": 7847} {"train_loss": -28.119348526000977, "global_step": 651327, "epoch": 7847} {"train_loss": -28.494068145751953, "global_step": 651328, "epoch": 7847} {"train_loss": -28.153247833251953, "global_step": 651329, "epoch": 7847} {"train_loss": -28.6123046875, "global_step": 651330, "epoch": 7847} {"train_loss": -28.22590446472168, "global_step": 651331, "epoch": 7847} {"train_loss": -28.502643585205078, "global_step": 651332, "epoch": 7847} {"train_loss": -28.335432052612305, "global_step": 651333, "epoch": 7847} {"train_loss": -28.343399047851562, "global_step": 651334, "epoch": 7847} {"train_loss": -28.24173355102539, "global_step": 651335, "epoch": 7847} {"train_loss": -28.331628799438477, "global_step": 651336, "epoch": 7847} {"train_loss": -28.381717681884766, "global_step": 651337, "epoch": 7847} {"train_loss": -28.228336334228516, "global_step": 651338, "epoch": 7847} {"train_loss": -28.278589248657227, "global_step": 651339, "epoch": 7847} {"train_loss": -28.369190216064453, "global_step": 651340, "epoch": 7847} {"train_loss": -28.614276885986328, "global_step": 651341, "epoch": 7847} {"train_loss": -28.573888778686523, "global_step": 651342, "epoch": 7847} {"train_loss": -28.39580726623535, "global_step": 651343, "epoch": 7847} {"train_loss": -28.351715087890625, "global_step": 651344, "epoch": 7847} {"train_loss": -28.293792724609375, "global_step": 651345, "epoch": 7847} {"train_loss": -28.49933433532715, "global_step": 651346, "epoch": 7847} {"train_loss": -28.165225982666016, "global_step": 651347, "epoch": 7847} {"train_loss": -28.5426025390625, "global_step": 651348, "epoch": 7847} {"train_loss": -28.453067779541016, "global_step": 651349, "epoch": 7847} {"train_loss": -27.803335189819336, "global_step": 651350, "epoch": 7847} {"train_loss": -28.7379150390625, "global_step": 651351, "epoch": 7847} {"train_loss": -28.3983211517334, "global_step": 651352, "epoch": 7847} {"train_loss": -28.428380966186523, "global_step": 651353, "epoch": 7847} {"train_loss": -28.242446899414062, "global_step": 651354, "epoch": 7847} {"train_loss": -28.268152236938477, "global_step": 651355, "epoch": 7847} {"train_loss": -28.365447998046875, "global_step": 651356, "epoch": 7847} {"train_loss": -28.509824752807617, "global_step": 651357, "epoch": 7847} {"train_loss": -28.544788360595703, "global_step": 651358, "epoch": 7847} {"train_loss": -28.638479232788086, "global_step": 651359, "epoch": 7847} {"train_loss": -28.641050338745117, "global_step": 651360, "epoch": 7847} {"train_loss": -28.259180068969727, "global_step": 651361, "epoch": 7847} {"train_loss": -28.646682739257812, "global_step": 651362, "epoch": 7847} {"train_loss": -28.604028701782227, "global_step": 651363, "epoch": 7847} {"train_loss": -28.823627471923828, "global_step": 651364, "epoch": 7847} {"train_loss": -28.751773834228516, "global_step": 651365, "epoch": 7847} {"train_loss": -28.504053115844727, "global_step": 651366, "epoch": 7847} {"train_loss": -28.713775634765625, "global_step": 651367, "epoch": 7847} {"train_loss": -28.565128326416016, "global_step": 651368, "epoch": 7847} {"train_loss": -28.344812393188477, "global_step": 651369, "epoch": 7847} {"train_loss": -28.710433959960938, "global_step": 651370, "epoch": 7847} {"train_loss": -28.442289352416992, "global_step": 651371, "epoch": 7847} {"train_loss": -28.5479793548584, "global_step": 651372, "epoch": 7847} {"train_loss": -28.430561065673828, "global_step": 651373, "epoch": 7847} {"train_loss": -28.419132232666016, "global_step": 651374, "epoch": 7847} {"train_loss": -28.14814567565918, "global_step": 651375, "epoch": 7847} {"train_loss": -28.41302490234375, "global_step": 651376, "epoch": 7847} {"train_loss": -28.081562042236328, "global_step": 651377, "epoch": 7847} {"train_loss": -28.337228775024414, "global_step": 651378, "epoch": 7847} {"train_loss": -28.11500358581543, "global_step": 651379, "epoch": 7847} {"train_loss": -28.28900146484375, "global_step": 651380, "epoch": 7847} {"train_loss": -28.2833251953125, "global_step": 651381, "epoch": 7847} {"train_loss": -28.406269073486328, "global_step": 651382, "epoch": 7847} {"train_loss": -28.29652432361281, "global_step": 651383, "epoch": 7847, "val_loss": 6689373.0} {"train_loss": -28.188215255737305, "global_step": 651384, "epoch": 7848} {"train_loss": -27.365100860595703, "global_step": 651385, "epoch": 7848} {"train_loss": -27.38888931274414, "global_step": 651386, "epoch": 7848} {"train_loss": -27.37504005432129, "global_step": 651387, "epoch": 7848} {"train_loss": -27.94761085510254, "global_step": 651388, "epoch": 7848} {"train_loss": -27.812047958374023, "global_step": 651389, "epoch": 7848} {"train_loss": -28.223302841186523, "global_step": 651390, "epoch": 7848} {"train_loss": -27.709768295288086, "global_step": 651391, "epoch": 7848} {"train_loss": -27.798725128173828, "global_step": 651392, "epoch": 7848} {"train_loss": -27.969085693359375, "global_step": 651393, "epoch": 7848} {"train_loss": -27.971792221069336, "global_step": 651394, "epoch": 7848} {"train_loss": -27.97515296936035, "global_step": 651395, "epoch": 7848} {"train_loss": -28.13178825378418, "global_step": 651396, "epoch": 7848} {"train_loss": -28.171695709228516, "global_step": 651397, "epoch": 7848} {"train_loss": -28.18230628967285, "global_step": 651398, "epoch": 7848} {"train_loss": -28.2650203704834, "global_step": 651399, "epoch": 7848} {"train_loss": -28.322843551635742, "global_step": 651400, "epoch": 7848} {"train_loss": -28.577810287475586, "global_step": 651401, "epoch": 7848} {"train_loss": -28.100849151611328, "global_step": 651402, "epoch": 7848} {"train_loss": -28.063535690307617, "global_step": 651403, "epoch": 7848} {"train_loss": -28.251855850219727, "global_step": 651404, "epoch": 7848} {"train_loss": -28.448715209960938, "global_step": 651405, "epoch": 7848} {"train_loss": -28.326385498046875, "global_step": 651406, "epoch": 7848} {"train_loss": -28.811603546142578, "global_step": 651407, "epoch": 7848} {"train_loss": -28.09247398376465, "global_step": 651408, "epoch": 7848} {"train_loss": -28.169355392456055, "global_step": 651409, "epoch": 7848} {"train_loss": -28.87965202331543, "global_step": 651410, "epoch": 7848} {"train_loss": -28.02105140686035, "global_step": 651411, "epoch": 7848} {"train_loss": -28.443073272705078, "global_step": 651412, "epoch": 7848} {"train_loss": -28.322729110717773, "global_step": 651413, "epoch": 7848} {"train_loss": -28.188262939453125, "global_step": 651414, "epoch": 7848} {"train_loss": -28.24773597717285, "global_step": 651415, "epoch": 7848} {"train_loss": -28.305805206298828, "global_step": 651416, "epoch": 7848} {"train_loss": -28.336383819580078, "global_step": 651417, "epoch": 7848} {"train_loss": -28.20088005065918, "global_step": 651418, "epoch": 7848} {"train_loss": -28.4493408203125, "global_step": 651419, "epoch": 7848} {"train_loss": -28.285755157470703, "global_step": 651420, "epoch": 7848} {"train_loss": -28.013641357421875, "global_step": 651421, "epoch": 7848} {"train_loss": -28.210407257080078, "global_step": 651422, "epoch": 7848} {"train_loss": -28.78399658203125, "global_step": 651423, "epoch": 7848} {"train_loss": -28.556095123291016, "global_step": 651424, "epoch": 7848} {"train_loss": -28.49085807800293, "global_step": 651425, "epoch": 7848} {"train_loss": -28.39496421813965, "global_step": 651426, "epoch": 7848} {"train_loss": -28.238977432250977, "global_step": 651427, "epoch": 7848} {"train_loss": -27.992456436157227, "global_step": 651428, "epoch": 7848} {"train_loss": -28.55606460571289, "global_step": 651429, "epoch": 7848} {"train_loss": -28.54654884338379, "global_step": 651430, "epoch": 7848} {"train_loss": -28.497282028198242, "global_step": 651431, "epoch": 7848} {"train_loss": -28.358373641967773, "global_step": 651432, "epoch": 7848} {"train_loss": -28.306848526000977, "global_step": 651433, "epoch": 7848} {"train_loss": -28.407108306884766, "global_step": 651434, "epoch": 7848} {"train_loss": -28.614744186401367, "global_step": 651435, "epoch": 7848} {"train_loss": -28.34266471862793, "global_step": 651436, "epoch": 7848} {"train_loss": -28.123748779296875, "global_step": 651437, "epoch": 7848} {"train_loss": -28.67987632751465, "global_step": 651438, "epoch": 7848} {"train_loss": -28.36309242248535, "global_step": 651439, "epoch": 7848} {"train_loss": -27.948896408081055, "global_step": 651440, "epoch": 7848} {"train_loss": -28.467792510986328, "global_step": 651441, "epoch": 7848} {"train_loss": -28.634429931640625, "global_step": 651442, "epoch": 7848} {"train_loss": -28.461151123046875, "global_step": 651443, "epoch": 7848} {"train_loss": -28.043121337890625, "global_step": 651444, "epoch": 7848} {"train_loss": -28.033605575561523, "global_step": 651445, "epoch": 7848} {"train_loss": -27.29571533203125, "global_step": 651446, "epoch": 7848} {"train_loss": -26.8328914642334, "global_step": 651447, "epoch": 7848} {"train_loss": -27.752796173095703, "global_step": 651448, "epoch": 7848} {"train_loss": -28.095199584960938, "global_step": 651449, "epoch": 7848} {"train_loss": -27.44586753845215, "global_step": 651450, "epoch": 7848} {"train_loss": -27.618942260742188, "global_step": 651451, "epoch": 7848} {"train_loss": -27.782989501953125, "global_step": 651452, "epoch": 7848} {"train_loss": -27.232501983642578, "global_step": 651453, "epoch": 7848} {"train_loss": -28.051116943359375, "global_step": 651454, "epoch": 7848} {"train_loss": -27.5793514251709, "global_step": 651455, "epoch": 7848} {"train_loss": -28.20047950744629, "global_step": 651456, "epoch": 7848} {"train_loss": -27.79862403869629, "global_step": 651457, "epoch": 7848} {"train_loss": -28.153135299682617, "global_step": 651458, "epoch": 7848} {"train_loss": -27.7380428314209, "global_step": 651459, "epoch": 7848} {"train_loss": -28.27509117126465, "global_step": 651460, "epoch": 7848} {"train_loss": -27.96346092224121, "global_step": 651461, "epoch": 7848} {"train_loss": -27.957616806030273, "global_step": 651462, "epoch": 7848} {"train_loss": -28.411523818969727, "global_step": 651463, "epoch": 7848} {"train_loss": -27.871397018432617, "global_step": 651464, "epoch": 7848} {"train_loss": -28.193998336791992, "global_step": 651465, "epoch": 7848} {"train_loss": -28.14594365315265, "global_step": 651466, "epoch": 7848, "val_loss": 6525822.0} {"train_loss": -27.73824119567871, "global_step": 651467, "epoch": 7849} {"train_loss": -27.81731605529785, "global_step": 651468, "epoch": 7849} {"train_loss": -27.577362060546875, "global_step": 651469, "epoch": 7849} {"train_loss": -27.80205726623535, "global_step": 651470, "epoch": 7849} {"train_loss": -27.87916374206543, "global_step": 651471, "epoch": 7849} {"train_loss": -28.106779098510742, "global_step": 651472, "epoch": 7849} {"train_loss": -27.875919342041016, "global_step": 651473, "epoch": 7849} {"train_loss": -27.77875328063965, "global_step": 651474, "epoch": 7849} {"train_loss": -27.978687286376953, "global_step": 651475, "epoch": 7849} {"train_loss": -27.849048614501953, "global_step": 651476, "epoch": 7849} {"train_loss": -27.8861026763916, "global_step": 651477, "epoch": 7849} {"train_loss": -27.847965240478516, "global_step": 651478, "epoch": 7849} {"train_loss": -28.0187931060791, "global_step": 651479, "epoch": 7849} {"train_loss": -28.152862548828125, "global_step": 651480, "epoch": 7849} {"train_loss": -28.326135635375977, "global_step": 651481, "epoch": 7849} {"train_loss": -28.049081802368164, "global_step": 651482, "epoch": 7849} {"train_loss": -28.138202667236328, "global_step": 651483, "epoch": 7849} {"train_loss": -28.279565811157227, "global_step": 651484, "epoch": 7849} {"train_loss": -28.25701904296875, "global_step": 651485, "epoch": 7849} {"train_loss": -27.946455001831055, "global_step": 651486, "epoch": 7849} {"train_loss": -28.38169288635254, "global_step": 651487, "epoch": 7849} {"train_loss": -28.39065933227539, "global_step": 651488, "epoch": 7849} {"train_loss": -28.036334991455078, "global_step": 651489, "epoch": 7849} {"train_loss": -28.29463005065918, "global_step": 651490, "epoch": 7849} {"train_loss": -28.422443389892578, "global_step": 651491, "epoch": 7849} {"train_loss": -28.285505294799805, "global_step": 651492, "epoch": 7849} {"train_loss": -28.20796775817871, "global_step": 651493, "epoch": 7849} {"train_loss": -28.40401268005371, "global_step": 651494, "epoch": 7849} {"train_loss": -28.337305068969727, "global_step": 651495, "epoch": 7849} {"train_loss": -28.30803871154785, "global_step": 651496, "epoch": 7849} {"train_loss": -28.418304443359375, "global_step": 651497, "epoch": 7849} {"train_loss": -28.39414405822754, "global_step": 651498, "epoch": 7849} {"train_loss": -28.482507705688477, "global_step": 651499, "epoch": 7849} {"train_loss": -28.402969360351562, "global_step": 651500, "epoch": 7849} {"train_loss": -28.098424911499023, "global_step": 651501, "epoch": 7849} {"train_loss": -28.18879508972168, "global_step": 651502, "epoch": 7849} {"train_loss": -28.525531768798828, "global_step": 651503, "epoch": 7849} {"train_loss": -28.295583724975586, "global_step": 651504, "epoch": 7849} {"train_loss": -28.285634994506836, "global_step": 651505, "epoch": 7849} {"train_loss": -28.496259689331055, "global_step": 651506, "epoch": 7849} {"train_loss": -28.70636558532715, "global_step": 651507, "epoch": 7849} {"train_loss": -28.51651954650879, "global_step": 651508, "epoch": 7849} {"train_loss": -28.503650665283203, "global_step": 651509, "epoch": 7849} {"train_loss": -27.97959327697754, "global_step": 651510, "epoch": 7849} {"train_loss": -28.221872329711914, "global_step": 651511, "epoch": 7849} {"train_loss": -28.453800201416016, "global_step": 651512, "epoch": 7849} {"train_loss": -28.178457260131836, "global_step": 651513, "epoch": 7849} {"train_loss": -28.224451065063477, "global_step": 651514, "epoch": 7849} {"train_loss": -28.023283004760742, "global_step": 651515, "epoch": 7849} {"train_loss": -28.133344650268555, "global_step": 651516, "epoch": 7849} {"train_loss": -28.184741973876953, "global_step": 651517, "epoch": 7849} {"train_loss": -28.79604148864746, "global_step": 651518, "epoch": 7849} {"train_loss": -28.494962692260742, "global_step": 651519, "epoch": 7849} {"train_loss": -28.23517417907715, "global_step": 651520, "epoch": 7849} {"train_loss": -27.983137130737305, "global_step": 651521, "epoch": 7849} {"train_loss": -28.316003799438477, "global_step": 651522, "epoch": 7849} {"train_loss": -28.2699031829834, "global_step": 651523, "epoch": 7849} {"train_loss": -28.501667022705078, "global_step": 651524, "epoch": 7849} {"train_loss": -28.43023681640625, "global_step": 651525, "epoch": 7849} {"train_loss": -28.33481788635254, "global_step": 651526, "epoch": 7849} {"train_loss": -27.817914962768555, "global_step": 651527, "epoch": 7849} {"train_loss": -27.612653732299805, "global_step": 651528, "epoch": 7849} {"train_loss": -28.160476684570312, "global_step": 651529, "epoch": 7849} {"train_loss": -27.94980239868164, "global_step": 651530, "epoch": 7849} {"train_loss": -28.517108917236328, "global_step": 651531, "epoch": 7849} {"train_loss": -28.06488037109375, "global_step": 651532, "epoch": 7849} {"train_loss": -28.07329750061035, "global_step": 651533, "epoch": 7849} {"train_loss": -27.499555587768555, "global_step": 651534, "epoch": 7849} {"train_loss": -27.816503524780273, "global_step": 651535, "epoch": 7849} {"train_loss": -27.458057403564453, "global_step": 651536, "epoch": 7849} {"train_loss": -28.396041870117188, "global_step": 651537, "epoch": 7849} {"train_loss": -28.239486694335938, "global_step": 651538, "epoch": 7849} {"train_loss": -27.9073486328125, "global_step": 651539, "epoch": 7849} {"train_loss": -28.561264038085938, "global_step": 651540, "epoch": 7849} {"train_loss": -28.402114868164062, "global_step": 651541, "epoch": 7849} {"train_loss": -28.1115779876709, "global_step": 651542, "epoch": 7849} {"train_loss": -28.116596221923828, "global_step": 651543, "epoch": 7849} {"train_loss": -28.357580184936523, "global_step": 651544, "epoch": 7849} {"train_loss": -28.402069091796875, "global_step": 651545, "epoch": 7849} {"train_loss": -28.008642196655273, "global_step": 651546, "epoch": 7849} {"train_loss": -28.319400787353516, "global_step": 651547, "epoch": 7849} {"train_loss": -28.636621475219727, "global_step": 651548, "epoch": 7849} {"train_loss": -28.174764702119024, "global_step": 651549, "epoch": 7849, "val_loss": 6628696.5} {"train_loss": -28.259723663330078, "global_step": 651550, "epoch": 7850} {"train_loss": -27.719135284423828, "global_step": 651551, "epoch": 7850} {"train_loss": -28.14386558532715, "global_step": 651552, "epoch": 7850} {"train_loss": -27.763891220092773, "global_step": 651553, "epoch": 7850} {"train_loss": -27.814960479736328, "global_step": 651554, "epoch": 7850} {"train_loss": -28.149755477905273, "global_step": 651555, "epoch": 7850} {"train_loss": -27.829687118530273, "global_step": 651556, "epoch": 7850} {"train_loss": -27.593496322631836, "global_step": 651557, "epoch": 7850} {"train_loss": -27.27606201171875, "global_step": 651558, "epoch": 7850} {"train_loss": -27.815771102905273, "global_step": 651559, "epoch": 7850} {"train_loss": -28.031280517578125, "global_step": 651560, "epoch": 7850} {"train_loss": -28.36323356628418, "global_step": 651561, "epoch": 7850} {"train_loss": -27.86701011657715, "global_step": 651562, "epoch": 7850} {"train_loss": -27.8173828125, "global_step": 651563, "epoch": 7850} {"train_loss": -27.94548988342285, "global_step": 651564, "epoch": 7850} {"train_loss": -27.534687042236328, "global_step": 651565, "epoch": 7850} {"train_loss": -27.5727481842041, "global_step": 651566, "epoch": 7850} {"train_loss": -28.207508087158203, "global_step": 651567, "epoch": 7850} {"train_loss": -27.929773330688477, "global_step": 651568, "epoch": 7850} {"train_loss": -27.619558334350586, "global_step": 651569, "epoch": 7850} {"train_loss": -28.07753562927246, "global_step": 651570, "epoch": 7850} {"train_loss": -28.043859481811523, "global_step": 651571, "epoch": 7850} {"train_loss": -27.984994888305664, "global_step": 651572, "epoch": 7850} {"train_loss": -28.10102653503418, "global_step": 651573, "epoch": 7850} {"train_loss": -28.115570068359375, "global_step": 651574, "epoch": 7850} {"train_loss": -28.303247451782227, "global_step": 651575, "epoch": 7850} {"train_loss": -28.559417724609375, "global_step": 651576, "epoch": 7850} {"train_loss": -28.305593490600586, "global_step": 651577, "epoch": 7850} {"train_loss": -28.2916316986084, "global_step": 651578, "epoch": 7850} {"train_loss": -28.033405303955078, "global_step": 651579, "epoch": 7850} {"train_loss": -28.33681297302246, "global_step": 651580, "epoch": 7850} {"train_loss": -28.53339195251465, "global_step": 651581, "epoch": 7850} {"train_loss": -27.9248104095459, "global_step": 651582, "epoch": 7850} {"train_loss": -28.55301284790039, "global_step": 651583, "epoch": 7850} {"train_loss": -28.127607345581055, "global_step": 651584, "epoch": 7850} {"train_loss": -28.5555419921875, "global_step": 651585, "epoch": 7850} {"train_loss": -28.3290958404541, "global_step": 651586, "epoch": 7850} {"train_loss": -28.137659072875977, "global_step": 651587, "epoch": 7850} {"train_loss": -28.39424705505371, "global_step": 651588, "epoch": 7850} {"train_loss": -28.025243759155273, "global_step": 651589, "epoch": 7850} {"train_loss": -28.24590492248535, "global_step": 651590, "epoch": 7850} {"train_loss": -28.247034072875977, "global_step": 651591, "epoch": 7850} {"train_loss": -28.351545333862305, "global_step": 651592, "epoch": 7850} {"train_loss": -28.51944351196289, "global_step": 651593, "epoch": 7850} {"train_loss": -28.453113555908203, "global_step": 651594, "epoch": 7850} {"train_loss": -28.237104415893555, "global_step": 651595, "epoch": 7850} {"train_loss": -28.30743980407715, "global_step": 651596, "epoch": 7850} {"train_loss": -28.318113327026367, "global_step": 651597, "epoch": 7850} {"train_loss": -28.17315673828125, "global_step": 651598, "epoch": 7850} {"train_loss": -28.245267868041992, "global_step": 651599, "epoch": 7850} {"train_loss": -28.186147689819336, "global_step": 651600, "epoch": 7850} {"train_loss": -28.25773048400879, "global_step": 651601, "epoch": 7850} {"train_loss": -28.419403076171875, "global_step": 651602, "epoch": 7850} {"train_loss": -28.37102699279785, "global_step": 651603, "epoch": 7850} {"train_loss": -28.27400016784668, "global_step": 651604, "epoch": 7850} {"train_loss": -28.038360595703125, "global_step": 651605, "epoch": 7850} {"train_loss": -28.340429306030273, "global_step": 651606, "epoch": 7850} {"train_loss": -28.247690200805664, "global_step": 651607, "epoch": 7850} {"train_loss": -28.21388053894043, "global_step": 651608, "epoch": 7850} {"train_loss": -28.094099044799805, "global_step": 651609, "epoch": 7850} {"train_loss": -28.34950065612793, "global_step": 651610, "epoch": 7850} {"train_loss": -28.483505249023438, "global_step": 651611, "epoch": 7850} {"train_loss": -28.315277099609375, "global_step": 651612, "epoch": 7850} {"train_loss": -27.85243797302246, "global_step": 651613, "epoch": 7850} {"train_loss": -28.240985870361328, "global_step": 651614, "epoch": 7850} {"train_loss": -28.561079025268555, "global_step": 651615, "epoch": 7850} {"train_loss": -28.037353515625, "global_step": 651616, "epoch": 7850} {"train_loss": -28.5201473236084, "global_step": 651617, "epoch": 7850} {"train_loss": -28.637975692749023, "global_step": 651618, "epoch": 7850} {"train_loss": -28.453222274780273, "global_step": 651619, "epoch": 7850} {"train_loss": -27.955413818359375, "global_step": 651620, "epoch": 7850} {"train_loss": -28.17474365234375, "global_step": 651621, "epoch": 7850} {"train_loss": -28.330615997314453, "global_step": 651622, "epoch": 7850} {"train_loss": -28.6765193939209, "global_step": 651623, "epoch": 7850} {"train_loss": -28.430103302001953, "global_step": 651624, "epoch": 7850} {"train_loss": -28.7655029296875, "global_step": 651625, "epoch": 7850} {"train_loss": -28.962539672851562, "global_step": 651626, "epoch": 7850} {"train_loss": -28.36431884765625, "global_step": 651627, "epoch": 7850} {"train_loss": -28.262243270874023, "global_step": 651628, "epoch": 7850} {"train_loss": -28.648603439331055, "global_step": 651629, "epoch": 7850} {"train_loss": -28.513391494750977, "global_step": 651630, "epoch": 7850} {"train_loss": -28.3383731842041, "global_step": 651631, "epoch": 7850} {"train_loss": -28.200175457690136, "global_step": 651632, "epoch": 7850, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.8636363636363636, "val_loss": 6635018.5} {"train_loss": -27.997278213500977, "global_step": 651633, "epoch": 7851} {"train_loss": -27.78586196899414, "global_step": 651634, "epoch": 7851} {"train_loss": -27.919803619384766, "global_step": 651635, "epoch": 7851} {"train_loss": -27.421384811401367, "global_step": 651636, "epoch": 7851} {"train_loss": -27.5723876953125, "global_step": 651637, "epoch": 7851} {"train_loss": -27.91355323791504, "global_step": 651638, "epoch": 7851} {"train_loss": -28.0358829498291, "global_step": 651639, "epoch": 7851} {"train_loss": -28.176549911499023, "global_step": 651640, "epoch": 7851} {"train_loss": -28.21491813659668, "global_step": 651641, "epoch": 7851} {"train_loss": -27.75435447692871, "global_step": 651642, "epoch": 7851} {"train_loss": -27.803197860717773, "global_step": 651643, "epoch": 7851} {"train_loss": -28.188329696655273, "global_step": 651644, "epoch": 7851} {"train_loss": -27.991119384765625, "global_step": 651645, "epoch": 7851} {"train_loss": -27.886899948120117, "global_step": 651646, "epoch": 7851} {"train_loss": -28.189077377319336, "global_step": 651647, "epoch": 7851} {"train_loss": -27.873584747314453, "global_step": 651648, "epoch": 7851} {"train_loss": -27.997364044189453, "global_step": 651649, "epoch": 7851} {"train_loss": -27.910680770874023, "global_step": 651650, "epoch": 7851} {"train_loss": -28.2110652923584, "global_step": 651651, "epoch": 7851} {"train_loss": -28.0770320892334, "global_step": 651652, "epoch": 7851} {"train_loss": -28.351444244384766, "global_step": 651653, "epoch": 7851} {"train_loss": -28.235559463500977, "global_step": 651654, "epoch": 7851} {"train_loss": -28.503034591674805, "global_step": 651655, "epoch": 7851} {"train_loss": -28.077436447143555, "global_step": 651656, "epoch": 7851} {"train_loss": -28.06024169921875, "global_step": 651657, "epoch": 7851} {"train_loss": -28.400114059448242, "global_step": 651658, "epoch": 7851} {"train_loss": -28.226764678955078, "global_step": 651659, "epoch": 7851} {"train_loss": -28.281408309936523, "global_step": 651660, "epoch": 7851} {"train_loss": -28.14253044128418, "global_step": 651661, "epoch": 7851} {"train_loss": -28.572904586791992, "global_step": 651662, "epoch": 7851} {"train_loss": -28.202564239501953, "global_step": 651663, "epoch": 7851} {"train_loss": -28.136972427368164, "global_step": 651664, "epoch": 7851} {"train_loss": -28.666797637939453, "global_step": 651665, "epoch": 7851} {"train_loss": -28.162643432617188, "global_step": 651666, "epoch": 7851} {"train_loss": -28.043537139892578, "global_step": 651667, "epoch": 7851} {"train_loss": -28.205753326416016, "global_step": 651668, "epoch": 7851} {"train_loss": -28.312429428100586, "global_step": 651669, "epoch": 7851} {"train_loss": -27.569665908813477, "global_step": 651670, "epoch": 7851} {"train_loss": -28.1790714263916, "global_step": 651671, "epoch": 7851} {"train_loss": -27.746183395385742, "global_step": 651672, "epoch": 7851} {"train_loss": -27.706811904907227, "global_step": 651673, "epoch": 7851} {"train_loss": -26.9660701751709, "global_step": 651674, "epoch": 7851} {"train_loss": -26.71148109436035, "global_step": 651675, "epoch": 7851} {"train_loss": -27.914173126220703, "global_step": 651676, "epoch": 7851} {"train_loss": -27.452680587768555, "global_step": 651677, "epoch": 7851} {"train_loss": -28.00446891784668, "global_step": 651678, "epoch": 7851} {"train_loss": -28.205718994140625, "global_step": 651679, "epoch": 7851} {"train_loss": -28.22544288635254, "global_step": 651680, "epoch": 7851} {"train_loss": -28.231796264648438, "global_step": 651681, "epoch": 7851} {"train_loss": -27.95094871520996, "global_step": 651682, "epoch": 7851} {"train_loss": -28.325605392456055, "global_step": 651683, "epoch": 7851} {"train_loss": -28.17805290222168, "global_step": 651684, "epoch": 7851} {"train_loss": -28.163654327392578, "global_step": 651685, "epoch": 7851} {"train_loss": -28.107437133789062, "global_step": 651686, "epoch": 7851} {"train_loss": -28.074262619018555, "global_step": 651687, "epoch": 7851} {"train_loss": -28.079309463500977, "global_step": 651688, "epoch": 7851} {"train_loss": -28.48170280456543, "global_step": 651689, "epoch": 7851} {"train_loss": -28.479028701782227, "global_step": 651690, "epoch": 7851} {"train_loss": -28.405393600463867, "global_step": 651691, "epoch": 7851} {"train_loss": -28.289112091064453, "global_step": 651692, "epoch": 7851} {"train_loss": -28.005664825439453, "global_step": 651693, "epoch": 7851} {"train_loss": -28.217395782470703, "global_step": 651694, "epoch": 7851} {"train_loss": -28.63933753967285, "global_step": 651695, "epoch": 7851} {"train_loss": -28.511533737182617, "global_step": 651696, "epoch": 7851} {"train_loss": -28.200422286987305, "global_step": 651697, "epoch": 7851} {"train_loss": -28.10622215270996, "global_step": 651698, "epoch": 7851} {"train_loss": -28.287500381469727, "global_step": 651699, "epoch": 7851} {"train_loss": -28.35041618347168, "global_step": 651700, "epoch": 7851} {"train_loss": -28.428171157836914, "global_step": 651701, "epoch": 7851} {"train_loss": -28.453296661376953, "global_step": 651702, "epoch": 7851} {"train_loss": -28.30426597595215, "global_step": 651703, "epoch": 7851} {"train_loss": -28.426725387573242, "global_step": 651704, "epoch": 7851} {"train_loss": -28.555166244506836, "global_step": 651705, "epoch": 7851} {"train_loss": -28.318078994750977, "global_step": 651706, "epoch": 7851} {"train_loss": -27.78101921081543, "global_step": 651707, "epoch": 7851} {"train_loss": -28.110248565673828, "global_step": 651708, "epoch": 7851} {"train_loss": -27.772724151611328, "global_step": 651709, "epoch": 7851} {"train_loss": -27.982196807861328, "global_step": 651710, "epoch": 7851} {"train_loss": -28.442983627319336, "global_step": 651711, "epoch": 7851} {"train_loss": -28.019628524780273, "global_step": 651712, "epoch": 7851} {"train_loss": -28.50778579711914, "global_step": 651713, "epoch": 7851} {"train_loss": -28.00778579711914, "global_step": 651714, "epoch": 7851} {"train_loss": -28.09821489632848, "global_step": 651715, "epoch": 7851, "val_loss": 6550942.5} {"train_loss": -27.21619987487793, "global_step": 651716, "epoch": 7852} {"train_loss": -27.651947021484375, "global_step": 651717, "epoch": 7852} {"train_loss": -27.474838256835938, "global_step": 651718, "epoch": 7852} {"train_loss": -27.73099708557129, "global_step": 651719, "epoch": 7852} {"train_loss": -27.753347396850586, "global_step": 651720, "epoch": 7852} {"train_loss": -27.840087890625, "global_step": 651721, "epoch": 7852} {"train_loss": -28.40542984008789, "global_step": 651722, "epoch": 7852} {"train_loss": -27.98126792907715, "global_step": 651723, "epoch": 7852} {"train_loss": -27.212366104125977, "global_step": 651724, "epoch": 7852} {"train_loss": -28.163007736206055, "global_step": 651725, "epoch": 7852} {"train_loss": -28.166051864624023, "global_step": 651726, "epoch": 7852} {"train_loss": -27.87568473815918, "global_step": 651727, "epoch": 7852} {"train_loss": -27.83294105529785, "global_step": 651728, "epoch": 7852} {"train_loss": -28.0300235748291, "global_step": 651729, "epoch": 7852} {"train_loss": -28.3940372467041, "global_step": 651730, "epoch": 7852} {"train_loss": -28.4984188079834, "global_step": 651731, "epoch": 7852} {"train_loss": -27.8822078704834, "global_step": 651732, "epoch": 7852} {"train_loss": -27.79633903503418, "global_step": 651733, "epoch": 7852} {"train_loss": -28.001081466674805, "global_step": 651734, "epoch": 7852} {"train_loss": -28.10304832458496, "global_step": 651735, "epoch": 7852} {"train_loss": -28.0313777923584, "global_step": 651736, "epoch": 7852} {"train_loss": -28.5006046295166, "global_step": 651737, "epoch": 7852} {"train_loss": -28.279382705688477, "global_step": 651738, "epoch": 7852} {"train_loss": -28.37335205078125, "global_step": 651739, "epoch": 7852} {"train_loss": -28.099777221679688, "global_step": 651740, "epoch": 7852} {"train_loss": -28.473602294921875, "global_step": 651741, "epoch": 7852} {"train_loss": -28.4792423248291, "global_step": 651742, "epoch": 7852} {"train_loss": -28.360519409179688, "global_step": 651743, "epoch": 7852} {"train_loss": -28.346479415893555, "global_step": 651744, "epoch": 7852} {"train_loss": -28.5628719329834, "global_step": 651745, "epoch": 7852} {"train_loss": -28.917287826538086, "global_step": 651746, "epoch": 7852} {"train_loss": -28.302099227905273, "global_step": 651747, "epoch": 7852} {"train_loss": -28.595996856689453, "global_step": 651748, "epoch": 7852} {"train_loss": -28.4357967376709, "global_step": 651749, "epoch": 7852} {"train_loss": -28.334552764892578, "global_step": 651750, "epoch": 7852} {"train_loss": -28.500192642211914, "global_step": 651751, "epoch": 7852} {"train_loss": -28.842273712158203, "global_step": 651752, "epoch": 7852} {"train_loss": -28.680932998657227, "global_step": 651753, "epoch": 7852} {"train_loss": -28.207441329956055, "global_step": 651754, "epoch": 7852} {"train_loss": -28.310718536376953, "global_step": 651755, "epoch": 7852} {"train_loss": -28.45929527282715, "global_step": 651756, "epoch": 7852} {"train_loss": -28.019775390625, "global_step": 651757, "epoch": 7852} {"train_loss": -28.417036056518555, "global_step": 651758, "epoch": 7852} {"train_loss": -28.164270401000977, "global_step": 651759, "epoch": 7852} {"train_loss": -28.3823299407959, "global_step": 651760, "epoch": 7852} {"train_loss": -28.4189453125, "global_step": 651761, "epoch": 7852} {"train_loss": -28.36903190612793, "global_step": 651762, "epoch": 7852} {"train_loss": -28.285755157470703, "global_step": 651763, "epoch": 7852} {"train_loss": -28.498443603515625, "global_step": 651764, "epoch": 7852} {"train_loss": -28.17901039123535, "global_step": 651765, "epoch": 7852} {"train_loss": -28.441511154174805, "global_step": 651766, "epoch": 7852} {"train_loss": -28.046619415283203, "global_step": 651767, "epoch": 7852} {"train_loss": -28.469593048095703, "global_step": 651768, "epoch": 7852} {"train_loss": -28.409793853759766, "global_step": 651769, "epoch": 7852} {"train_loss": -28.421676635742188, "global_step": 651770, "epoch": 7852} {"train_loss": -28.209043502807617, "global_step": 651771, "epoch": 7852} {"train_loss": -28.09493064880371, "global_step": 651772, "epoch": 7852} {"train_loss": -28.668197631835938, "global_step": 651773, "epoch": 7852} {"train_loss": -28.568939208984375, "global_step": 651774, "epoch": 7852} {"train_loss": -27.979307174682617, "global_step": 651775, "epoch": 7852} {"train_loss": -28.681711196899414, "global_step": 651776, "epoch": 7852} {"train_loss": -28.095670700073242, "global_step": 651777, "epoch": 7852} {"train_loss": -28.214574813842773, "global_step": 651778, "epoch": 7852} {"train_loss": -28.333703994750977, "global_step": 651779, "epoch": 7852} {"train_loss": -28.36952781677246, "global_step": 651780, "epoch": 7852} {"train_loss": -28.03714942932129, "global_step": 651781, "epoch": 7852} {"train_loss": -28.22096061706543, "global_step": 651782, "epoch": 7852} {"train_loss": -28.1419734954834, "global_step": 651783, "epoch": 7852} {"train_loss": -28.137662887573242, "global_step": 651784, "epoch": 7852} {"train_loss": -28.2896671295166, "global_step": 651785, "epoch": 7852} {"train_loss": -28.14971351623535, "global_step": 651786, "epoch": 7852} {"train_loss": -28.054182052612305, "global_step": 651787, "epoch": 7852} {"train_loss": -28.171926498413086, "global_step": 651788, "epoch": 7852} {"train_loss": -28.236852645874023, "global_step": 651789, "epoch": 7852} {"train_loss": -28.549413681030273, "global_step": 651790, "epoch": 7852} {"train_loss": -28.17288589477539, "global_step": 651791, "epoch": 7852} {"train_loss": -27.83441162109375, "global_step": 651792, "epoch": 7852} {"train_loss": -27.369281768798828, "global_step": 651793, "epoch": 7852} {"train_loss": -27.434873580932617, "global_step": 651794, "epoch": 7852} {"train_loss": -28.110660552978516, "global_step": 651795, "epoch": 7852} {"train_loss": -27.963275909423828, "global_step": 651796, "epoch": 7852} {"train_loss": -28.291461944580078, "global_step": 651797, "epoch": 7852} {"train_loss": -28.186849548156005, "global_step": 651798, "epoch": 7852, "val_loss": 6612352.5} {"train_loss": -27.78864097595215, "global_step": 651799, "epoch": 7853} {"train_loss": -27.643476486206055, "global_step": 651800, "epoch": 7853} {"train_loss": -27.176847457885742, "global_step": 651801, "epoch": 7853} {"train_loss": -27.571393966674805, "global_step": 651802, "epoch": 7853} {"train_loss": -27.818359375, "global_step": 651803, "epoch": 7853} {"train_loss": -27.188745498657227, "global_step": 651804, "epoch": 7853} {"train_loss": -27.043493270874023, "global_step": 651805, "epoch": 7853} {"train_loss": -27.610685348510742, "global_step": 651806, "epoch": 7853} {"train_loss": -27.560596466064453, "global_step": 651807, "epoch": 7853} {"train_loss": -27.431903839111328, "global_step": 651808, "epoch": 7853} {"train_loss": -27.53158950805664, "global_step": 651809, "epoch": 7853} {"train_loss": -27.641714096069336, "global_step": 651810, "epoch": 7853} {"train_loss": -27.838144302368164, "global_step": 651811, "epoch": 7853} {"train_loss": -27.1282901763916, "global_step": 651812, "epoch": 7853} {"train_loss": -27.709369659423828, "global_step": 651813, "epoch": 7853} {"train_loss": -27.614776611328125, "global_step": 651814, "epoch": 7853} {"train_loss": -27.64369773864746, "global_step": 651815, "epoch": 7853} {"train_loss": -27.9862117767334, "global_step": 651816, "epoch": 7853} {"train_loss": -27.698591232299805, "global_step": 651817, "epoch": 7853} {"train_loss": -27.7911434173584, "global_step": 651818, "epoch": 7853} {"train_loss": -27.59499168395996, "global_step": 651819, "epoch": 7853} {"train_loss": -28.02863121032715, "global_step": 651820, "epoch": 7853} {"train_loss": -27.971099853515625, "global_step": 651821, "epoch": 7853} {"train_loss": -27.786508560180664, "global_step": 651822, "epoch": 7853} {"train_loss": -28.162214279174805, "global_step": 651823, "epoch": 7853} {"train_loss": -27.98650550842285, "global_step": 651824, "epoch": 7853} {"train_loss": -27.44459342956543, "global_step": 651825, "epoch": 7853} {"train_loss": -27.979089736938477, "global_step": 651826, "epoch": 7853} {"train_loss": -28.12891960144043, "global_step": 651827, "epoch": 7853} {"train_loss": -28.338165283203125, "global_step": 651828, "epoch": 7853} {"train_loss": -28.04722023010254, "global_step": 651829, "epoch": 7853} {"train_loss": -28.259185791015625, "global_step": 651830, "epoch": 7853} {"train_loss": -27.8842830657959, "global_step": 651831, "epoch": 7853} {"train_loss": -28.448801040649414, "global_step": 651832, "epoch": 7853} {"train_loss": -28.1019287109375, "global_step": 651833, "epoch": 7853} {"train_loss": -28.174610137939453, "global_step": 651834, "epoch": 7853} {"train_loss": -28.088850021362305, "global_step": 651835, "epoch": 7853} {"train_loss": -28.455982208251953, "global_step": 651836, "epoch": 7853} {"train_loss": -28.30251121520996, "global_step": 651837, "epoch": 7853} {"train_loss": -28.446741104125977, "global_step": 651838, "epoch": 7853} {"train_loss": -28.23780632019043, "global_step": 651839, "epoch": 7853} {"train_loss": -28.3917179107666, "global_step": 651840, "epoch": 7853} {"train_loss": -28.168508529663086, "global_step": 651841, "epoch": 7853} {"train_loss": -28.339502334594727, "global_step": 651842, "epoch": 7853} {"train_loss": -28.308767318725586, "global_step": 651843, "epoch": 7853} {"train_loss": -28.3275203704834, "global_step": 651844, "epoch": 7853} {"train_loss": -27.8663272857666, "global_step": 651845, "epoch": 7853} {"train_loss": -28.5238094329834, "global_step": 651846, "epoch": 7853} {"train_loss": -28.386655807495117, "global_step": 651847, "epoch": 7853} {"train_loss": -28.7332706451416, "global_step": 651848, "epoch": 7853} {"train_loss": -28.65667724609375, "global_step": 651849, "epoch": 7853} {"train_loss": -28.95538330078125, "global_step": 651850, "epoch": 7853} {"train_loss": -28.66855812072754, "global_step": 651851, "epoch": 7853} {"train_loss": -28.400487899780273, "global_step": 651852, "epoch": 7853} {"train_loss": -28.575109481811523, "global_step": 651853, "epoch": 7853} {"train_loss": -28.433393478393555, "global_step": 651854, "epoch": 7853} {"train_loss": -28.57538414001465, "global_step": 651855, "epoch": 7853} {"train_loss": -28.601490020751953, "global_step": 651856, "epoch": 7853} {"train_loss": -28.677490234375, "global_step": 651857, "epoch": 7853} {"train_loss": -28.615966796875, "global_step": 651858, "epoch": 7853} {"train_loss": -28.802515029907227, "global_step": 651859, "epoch": 7853} {"train_loss": -28.25880241394043, "global_step": 651860, "epoch": 7853} {"train_loss": -28.246366500854492, "global_step": 651861, "epoch": 7853} {"train_loss": -28.938190460205078, "global_step": 651862, "epoch": 7853} {"train_loss": -28.557254791259766, "global_step": 651863, "epoch": 7853} {"train_loss": -28.663776397705078, "global_step": 651864, "epoch": 7853} {"train_loss": -28.33150291442871, "global_step": 651865, "epoch": 7853} {"train_loss": -28.24309730529785, "global_step": 651866, "epoch": 7853} {"train_loss": -28.74226188659668, "global_step": 651867, "epoch": 7853} {"train_loss": -28.124608993530273, "global_step": 651868, "epoch": 7853} {"train_loss": -28.06304359436035, "global_step": 651869, "epoch": 7853} {"train_loss": -28.096744537353516, "global_step": 651870, "epoch": 7853} {"train_loss": -28.3217830657959, "global_step": 651871, "epoch": 7853} {"train_loss": -27.939441680908203, "global_step": 651872, "epoch": 7853} {"train_loss": -28.20819664001465, "global_step": 651873, "epoch": 7853} {"train_loss": -28.55377769470215, "global_step": 651874, "epoch": 7853} {"train_loss": -28.5133113861084, "global_step": 651875, "epoch": 7853} {"train_loss": -28.22085952758789, "global_step": 651876, "epoch": 7853} {"train_loss": -28.550745010375977, "global_step": 651877, "epoch": 7853} {"train_loss": -28.460412979125977, "global_step": 651878, "epoch": 7853} {"train_loss": -28.33045768737793, "global_step": 651879, "epoch": 7853} {"train_loss": -28.377771377563477, "global_step": 651880, "epoch": 7853} {"train_loss": -28.13610168824713, "global_step": 651881, "epoch": 7853, "val_loss": 6616047.0} {"train_loss": -27.959308624267578, "global_step": 651882, "epoch": 7854} {"train_loss": -27.301233291625977, "global_step": 651883, "epoch": 7854} {"train_loss": -27.3016414642334, "global_step": 651884, "epoch": 7854} {"train_loss": -27.291715621948242, "global_step": 651885, "epoch": 7854} {"train_loss": -27.9659366607666, "global_step": 651886, "epoch": 7854} {"train_loss": -27.63983154296875, "global_step": 651887, "epoch": 7854} {"train_loss": -27.11370849609375, "global_step": 651888, "epoch": 7854} {"train_loss": -26.794574737548828, "global_step": 651889, "epoch": 7854} {"train_loss": -27.8076171875, "global_step": 651890, "epoch": 7854} {"train_loss": -27.256006240844727, "global_step": 651891, "epoch": 7854} {"train_loss": -27.522130966186523, "global_step": 651892, "epoch": 7854} {"train_loss": -27.960830688476562, "global_step": 651893, "epoch": 7854} {"train_loss": -27.690027236938477, "global_step": 651894, "epoch": 7854} {"train_loss": -27.466230392456055, "global_step": 651895, "epoch": 7854} {"train_loss": -27.640975952148438, "global_step": 651896, "epoch": 7854} {"train_loss": -27.7537899017334, "global_step": 651897, "epoch": 7854} {"train_loss": -27.816038131713867, "global_step": 651898, "epoch": 7854} {"train_loss": -27.79900550842285, "global_step": 651899, "epoch": 7854} {"train_loss": -28.2436466217041, "global_step": 651900, "epoch": 7854} {"train_loss": -28.069562911987305, "global_step": 651901, "epoch": 7854} {"train_loss": -27.878931045532227, "global_step": 651902, "epoch": 7854} {"train_loss": -28.04241943359375, "global_step": 651903, "epoch": 7854} {"train_loss": -28.262378692626953, "global_step": 651904, "epoch": 7854} {"train_loss": -28.034326553344727, "global_step": 651905, "epoch": 7854} {"train_loss": -27.82305908203125, "global_step": 651906, "epoch": 7854} {"train_loss": -28.097822189331055, "global_step": 651907, "epoch": 7854} {"train_loss": -28.0950870513916, "global_step": 651908, "epoch": 7854} {"train_loss": -27.889636993408203, "global_step": 651909, "epoch": 7854} {"train_loss": -27.76576042175293, "global_step": 651910, "epoch": 7854} {"train_loss": -27.956079483032227, "global_step": 651911, "epoch": 7854} {"train_loss": -28.414514541625977, "global_step": 651912, "epoch": 7854} {"train_loss": -28.02717399597168, "global_step": 651913, "epoch": 7854} {"train_loss": -28.149179458618164, "global_step": 651914, "epoch": 7854} {"train_loss": -28.40500831604004, "global_step": 651915, "epoch": 7854} {"train_loss": -28.296293258666992, "global_step": 651916, "epoch": 7854} {"train_loss": -27.765430450439453, "global_step": 651917, "epoch": 7854} {"train_loss": -28.211761474609375, "global_step": 651918, "epoch": 7854} {"train_loss": -28.089223861694336, "global_step": 651919, "epoch": 7854} {"train_loss": -28.150365829467773, "global_step": 651920, "epoch": 7854} {"train_loss": -28.175512313842773, "global_step": 651921, "epoch": 7854} {"train_loss": -28.677209854125977, "global_step": 651922, "epoch": 7854} {"train_loss": -28.069059371948242, "global_step": 651923, "epoch": 7854} {"train_loss": -28.377737045288086, "global_step": 651924, "epoch": 7854} {"train_loss": -28.718032836914062, "global_step": 651925, "epoch": 7854} {"train_loss": -28.399341583251953, "global_step": 651926, "epoch": 7854} {"train_loss": -28.344898223876953, "global_step": 651927, "epoch": 7854} {"train_loss": -28.369359970092773, "global_step": 651928, "epoch": 7854} {"train_loss": -28.297147750854492, "global_step": 651929, "epoch": 7854} {"train_loss": -28.46907615661621, "global_step": 651930, "epoch": 7854} {"train_loss": -28.526126861572266, "global_step": 651931, "epoch": 7854} {"train_loss": -28.841876983642578, "global_step": 651932, "epoch": 7854} {"train_loss": -28.419355392456055, "global_step": 651933, "epoch": 7854} {"train_loss": -28.469873428344727, "global_step": 651934, "epoch": 7854} {"train_loss": -28.319345474243164, "global_step": 651935, "epoch": 7854} {"train_loss": -28.255950927734375, "global_step": 651936, "epoch": 7854} {"train_loss": -28.142919540405273, "global_step": 651937, "epoch": 7854} {"train_loss": -28.567895889282227, "global_step": 651938, "epoch": 7854} {"train_loss": -28.48245620727539, "global_step": 651939, "epoch": 7854} {"train_loss": -28.319427490234375, "global_step": 651940, "epoch": 7854} {"train_loss": -28.58212661743164, "global_step": 651941, "epoch": 7854} {"train_loss": -28.395191192626953, "global_step": 651942, "epoch": 7854} {"train_loss": -28.12306022644043, "global_step": 651943, "epoch": 7854} {"train_loss": -28.15900230407715, "global_step": 651944, "epoch": 7854} {"train_loss": -28.196882247924805, "global_step": 651945, "epoch": 7854} {"train_loss": -28.017240524291992, "global_step": 651946, "epoch": 7854} {"train_loss": -28.39872169494629, "global_step": 651947, "epoch": 7854} {"train_loss": -28.632129669189453, "global_step": 651948, "epoch": 7854} {"train_loss": -28.464553833007812, "global_step": 651949, "epoch": 7854} {"train_loss": -28.207120895385742, "global_step": 651950, "epoch": 7854} {"train_loss": -28.05864906311035, "global_step": 651951, "epoch": 7854} {"train_loss": -28.03436851501465, "global_step": 651952, "epoch": 7854} {"train_loss": -27.93389892578125, "global_step": 651953, "epoch": 7854} {"train_loss": -28.687728881835938, "global_step": 651954, "epoch": 7854} {"train_loss": -28.1145076751709, "global_step": 651955, "epoch": 7854} {"train_loss": -28.71475601196289, "global_step": 651956, "epoch": 7854} {"train_loss": -28.51776123046875, "global_step": 651957, "epoch": 7854} {"train_loss": -28.409687042236328, "global_step": 651958, "epoch": 7854} {"train_loss": -28.3238525390625, "global_step": 651959, "epoch": 7854} {"train_loss": -28.293415069580078, "global_step": 651960, "epoch": 7854} {"train_loss": -28.604721069335938, "global_step": 651961, "epoch": 7854} {"train_loss": -28.54768180847168, "global_step": 651962, "epoch": 7854} {"train_loss": -27.968992233276367, "global_step": 651963, "epoch": 7854} {"train_loss": -28.140971471028156, "global_step": 651964, "epoch": 7854, "val_loss": 6598353.0} {"train_loss": -27.732038497924805, "global_step": 651965, "epoch": 7855} {"train_loss": -27.0918025970459, "global_step": 651966, "epoch": 7855} {"train_loss": -27.35894775390625, "global_step": 651967, "epoch": 7855} {"train_loss": -27.363861083984375, "global_step": 651968, "epoch": 7855} {"train_loss": -26.75593376159668, "global_step": 651969, "epoch": 7855} {"train_loss": -27.23726463317871, "global_step": 651970, "epoch": 7855} {"train_loss": -27.333105087280273, "global_step": 651971, "epoch": 7855} {"train_loss": -27.2961368560791, "global_step": 651972, "epoch": 7855} {"train_loss": -27.50226402282715, "global_step": 651973, "epoch": 7855} {"train_loss": -27.75178337097168, "global_step": 651974, "epoch": 7855} {"train_loss": -27.55533790588379, "global_step": 651975, "epoch": 7855} {"train_loss": -27.472259521484375, "global_step": 651976, "epoch": 7855} {"train_loss": -27.853790283203125, "global_step": 651977, "epoch": 7855} {"train_loss": -27.513336181640625, "global_step": 651978, "epoch": 7855} {"train_loss": -27.803791046142578, "global_step": 651979, "epoch": 7855} {"train_loss": -27.865564346313477, "global_step": 651980, "epoch": 7855} {"train_loss": -28.003559112548828, "global_step": 651981, "epoch": 7855} {"train_loss": -27.76186180114746, "global_step": 651982, "epoch": 7855} {"train_loss": -28.054601669311523, "global_step": 651983, "epoch": 7855} {"train_loss": -27.96538734436035, "global_step": 651984, "epoch": 7855} {"train_loss": -28.155292510986328, "global_step": 651985, "epoch": 7855} {"train_loss": -27.945653915405273, "global_step": 651986, "epoch": 7855} {"train_loss": -27.65651512145996, "global_step": 651987, "epoch": 7855} {"train_loss": -28.049625396728516, "global_step": 651988, "epoch": 7855} {"train_loss": -28.456817626953125, "global_step": 651989, "epoch": 7855} {"train_loss": -28.24094581604004, "global_step": 651990, "epoch": 7855} {"train_loss": -28.427021026611328, "global_step": 651991, "epoch": 7855} {"train_loss": -28.127721786499023, "global_step": 651992, "epoch": 7855} {"train_loss": -28.516254425048828, "global_step": 651993, "epoch": 7855} {"train_loss": -28.39459800720215, "global_step": 651994, "epoch": 7855} {"train_loss": -28.606464385986328, "global_step": 651995, "epoch": 7855} {"train_loss": -28.344785690307617, "global_step": 651996, "epoch": 7855} {"train_loss": -28.211084365844727, "global_step": 651997, "epoch": 7855} {"train_loss": -28.196426391601562, "global_step": 651998, "epoch": 7855} {"train_loss": -27.94293785095215, "global_step": 651999, "epoch": 7855} {"train_loss": -28.674468994140625, "global_step": 652000, "epoch": 7855} {"train_loss": -28.31406593322754, "global_step": 652001, "epoch": 7855} {"train_loss": -28.516576766967773, "global_step": 652002, "epoch": 7855} {"train_loss": -28.53902244567871, "global_step": 652003, "epoch": 7855} {"train_loss": -28.608732223510742, "global_step": 652004, "epoch": 7855} {"train_loss": -28.499006271362305, "global_step": 652005, "epoch": 7855} {"train_loss": -28.52656364440918, "global_step": 652006, "epoch": 7855} {"train_loss": -28.743000030517578, "global_step": 652007, "epoch": 7855} {"train_loss": -28.66804313659668, "global_step": 652008, "epoch": 7855} {"train_loss": -28.3969669342041, "global_step": 652009, "epoch": 7855} {"train_loss": -28.755884170532227, "global_step": 652010, "epoch": 7855} {"train_loss": -28.25146484375, "global_step": 652011, "epoch": 7855} {"train_loss": -28.60688591003418, "global_step": 652012, "epoch": 7855} {"train_loss": -28.423566818237305, "global_step": 652013, "epoch": 7855} {"train_loss": -28.530303955078125, "global_step": 652014, "epoch": 7855} {"train_loss": -28.58587074279785, "global_step": 652015, "epoch": 7855} {"train_loss": -28.9063663482666, "global_step": 652016, "epoch": 7855} {"train_loss": -28.257251739501953, "global_step": 652017, "epoch": 7855} {"train_loss": -28.42408561706543, "global_step": 652018, "epoch": 7855} {"train_loss": -28.571462631225586, "global_step": 652019, "epoch": 7855} {"train_loss": -28.385236740112305, "global_step": 652020, "epoch": 7855} {"train_loss": -28.60288429260254, "global_step": 652021, "epoch": 7855} {"train_loss": -28.51905632019043, "global_step": 652022, "epoch": 7855} {"train_loss": -28.59438133239746, "global_step": 652023, "epoch": 7855} {"train_loss": -27.83929443359375, "global_step": 652024, "epoch": 7855} {"train_loss": -28.081390380859375, "global_step": 652025, "epoch": 7855} {"train_loss": -27.970081329345703, "global_step": 652026, "epoch": 7855} {"train_loss": -27.77235221862793, "global_step": 652027, "epoch": 7855} {"train_loss": -28.418537139892578, "global_step": 652028, "epoch": 7855} {"train_loss": -27.662214279174805, "global_step": 652029, "epoch": 7855} {"train_loss": -28.054428100585938, "global_step": 652030, "epoch": 7855} {"train_loss": -27.61077880859375, "global_step": 652031, "epoch": 7855} {"train_loss": -28.16461181640625, "global_step": 652032, "epoch": 7855} {"train_loss": -28.322275161743164, "global_step": 652033, "epoch": 7855} {"train_loss": -27.90911293029785, "global_step": 652034, "epoch": 7855} {"train_loss": -27.844602584838867, "global_step": 652035, "epoch": 7855} {"train_loss": -27.24256706237793, "global_step": 652036, "epoch": 7855} {"train_loss": -27.5871639251709, "global_step": 652037, "epoch": 7855} {"train_loss": -27.240686416625977, "global_step": 652038, "epoch": 7855} {"train_loss": -27.34745216369629, "global_step": 652039, "epoch": 7855} {"train_loss": -27.77882194519043, "global_step": 652040, "epoch": 7855} {"train_loss": -27.728515625, "global_step": 652041, "epoch": 7855} {"train_loss": -27.83270263671875, "global_step": 652042, "epoch": 7855} {"train_loss": -28.259754180908203, "global_step": 652043, "epoch": 7855} {"train_loss": -27.857147216796875, "global_step": 652044, "epoch": 7855} {"train_loss": -27.48093605041504, "global_step": 652045, "epoch": 7855} {"train_loss": -27.948225021362305, "global_step": 652046, "epoch": 7855} {"train_loss": -28.04574589556958, "global_step": 652047, "epoch": 7855, "val_loss": 6567882.0} {"train_loss": -27.5768985748291, "global_step": 652048, "epoch": 7856} {"train_loss": -27.15728759765625, "global_step": 652049, "epoch": 7856} {"train_loss": -27.197580337524414, "global_step": 652050, "epoch": 7856} {"train_loss": -27.000812530517578, "global_step": 652051, "epoch": 7856} {"train_loss": -27.332006454467773, "global_step": 652052, "epoch": 7856} {"train_loss": -27.5491886138916, "global_step": 652053, "epoch": 7856} {"train_loss": -27.476016998291016, "global_step": 652054, "epoch": 7856} {"train_loss": -27.34282875061035, "global_step": 652055, "epoch": 7856} {"train_loss": -27.262454986572266, "global_step": 652056, "epoch": 7856} {"train_loss": -27.960681915283203, "global_step": 652057, "epoch": 7856} {"train_loss": -27.3587703704834, "global_step": 652058, "epoch": 7856} {"train_loss": -27.806562423706055, "global_step": 652059, "epoch": 7856} {"train_loss": -27.6372013092041, "global_step": 652060, "epoch": 7856} {"train_loss": -27.991851806640625, "global_step": 652061, "epoch": 7856} {"train_loss": -27.920141220092773, "global_step": 652062, "epoch": 7856} {"train_loss": -27.59357261657715, "global_step": 652063, "epoch": 7856} {"train_loss": -28.16336441040039, "global_step": 652064, "epoch": 7856} {"train_loss": -27.817413330078125, "global_step": 652065, "epoch": 7856} {"train_loss": -28.31418800354004, "global_step": 652066, "epoch": 7856} {"train_loss": -28.027856826782227, "global_step": 652067, "epoch": 7856} {"train_loss": -28.169498443603516, "global_step": 652068, "epoch": 7856} {"train_loss": -28.1239070892334, "global_step": 652069, "epoch": 7856} {"train_loss": -28.365222930908203, "global_step": 652070, "epoch": 7856} {"train_loss": -27.789648056030273, "global_step": 652071, "epoch": 7856} {"train_loss": -27.86513328552246, "global_step": 652072, "epoch": 7856} {"train_loss": -27.816131591796875, "global_step": 652073, "epoch": 7856} {"train_loss": -28.10848045349121, "global_step": 652074, "epoch": 7856} {"train_loss": -28.151813507080078, "global_step": 652075, "epoch": 7856} {"train_loss": -28.300100326538086, "global_step": 652076, "epoch": 7856} {"train_loss": -28.171857833862305, "global_step": 652077, "epoch": 7856} {"train_loss": -28.171030044555664, "global_step": 652078, "epoch": 7856} {"train_loss": -28.251813888549805, "global_step": 652079, "epoch": 7856} {"train_loss": -28.357160568237305, "global_step": 652080, "epoch": 7856} {"train_loss": -28.21095085144043, "global_step": 652081, "epoch": 7856} {"train_loss": -28.234756469726562, "global_step": 652082, "epoch": 7856} {"train_loss": -28.417926788330078, "global_step": 652083, "epoch": 7856} {"train_loss": -28.19943618774414, "global_step": 652084, "epoch": 7856} {"train_loss": -28.137405395507812, "global_step": 652085, "epoch": 7856} {"train_loss": -28.597763061523438, "global_step": 652086, "epoch": 7856} {"train_loss": -28.104528427124023, "global_step": 652087, "epoch": 7856} {"train_loss": -28.686681747436523, "global_step": 652088, "epoch": 7856} {"train_loss": -28.333200454711914, "global_step": 652089, "epoch": 7856} {"train_loss": -28.33600425720215, "global_step": 652090, "epoch": 7856} {"train_loss": -28.3818416595459, "global_step": 652091, "epoch": 7856} {"train_loss": -28.492685317993164, "global_step": 652092, "epoch": 7856} {"train_loss": -28.66815185546875, "global_step": 652093, "epoch": 7856} {"train_loss": -28.7602481842041, "global_step": 652094, "epoch": 7856} {"train_loss": -28.491140365600586, "global_step": 652095, "epoch": 7856} {"train_loss": -28.85007095336914, "global_step": 652096, "epoch": 7856} {"train_loss": -28.583831787109375, "global_step": 652097, "epoch": 7856} {"train_loss": -28.463214874267578, "global_step": 652098, "epoch": 7856} {"train_loss": -28.307580947875977, "global_step": 652099, "epoch": 7856} {"train_loss": -28.532129287719727, "global_step": 652100, "epoch": 7856} {"train_loss": -28.346784591674805, "global_step": 652101, "epoch": 7856} {"train_loss": -28.900821685791016, "global_step": 652102, "epoch": 7856} {"train_loss": -28.532861709594727, "global_step": 652103, "epoch": 7856} {"train_loss": -28.168323516845703, "global_step": 652104, "epoch": 7856} {"train_loss": -28.66644859313965, "global_step": 652105, "epoch": 7856} {"train_loss": -28.48023796081543, "global_step": 652106, "epoch": 7856} {"train_loss": -28.54654312133789, "global_step": 652107, "epoch": 7856} {"train_loss": -28.425012588500977, "global_step": 652108, "epoch": 7856} {"train_loss": -28.420093536376953, "global_step": 652109, "epoch": 7856} {"train_loss": -28.50347900390625, "global_step": 652110, "epoch": 7856} {"train_loss": -27.94651222229004, "global_step": 652111, "epoch": 7856} {"train_loss": -28.04524040222168, "global_step": 652112, "epoch": 7856} {"train_loss": -28.132160186767578, "global_step": 652113, "epoch": 7856} {"train_loss": -28.380231857299805, "global_step": 652114, "epoch": 7856} {"train_loss": -28.568159103393555, "global_step": 652115, "epoch": 7856} {"train_loss": -28.429651260375977, "global_step": 652116, "epoch": 7856} {"train_loss": -28.547571182250977, "global_step": 652117, "epoch": 7856} {"train_loss": -28.331090927124023, "global_step": 652118, "epoch": 7856} {"train_loss": -28.443281173706055, "global_step": 652119, "epoch": 7856} {"train_loss": -28.25592041015625, "global_step": 652120, "epoch": 7856} {"train_loss": -28.455793380737305, "global_step": 652121, "epoch": 7856} {"train_loss": -28.194610595703125, "global_step": 652122, "epoch": 7856} {"train_loss": -28.400495529174805, "global_step": 652123, "epoch": 7856} {"train_loss": -28.416534423828125, "global_step": 652124, "epoch": 7856} {"train_loss": -28.548608779907227, "global_step": 652125, "epoch": 7856} {"train_loss": -28.225812911987305, "global_step": 652126, "epoch": 7856} {"train_loss": -28.30667495727539, "global_step": 652127, "epoch": 7856} {"train_loss": -27.97279930114746, "global_step": 652128, "epoch": 7856} {"train_loss": -28.328567504882812, "global_step": 652129, "epoch": 7856} {"train_loss": -28.168560349797627, "global_step": 652130, "epoch": 7856, "val_loss": 6575231.0} {"train_loss": -27.256528854370117, "global_step": 652131, "epoch": 7857} {"train_loss": -27.4969539642334, "global_step": 652132, "epoch": 7857} {"train_loss": -27.7818546295166, "global_step": 652133, "epoch": 7857} {"train_loss": -27.050323486328125, "global_step": 652134, "epoch": 7857} {"train_loss": -28.073423385620117, "global_step": 652135, "epoch": 7857} {"train_loss": -26.98822593688965, "global_step": 652136, "epoch": 7857} {"train_loss": -27.664731979370117, "global_step": 652137, "epoch": 7857} {"train_loss": -28.1127872467041, "global_step": 652138, "epoch": 7857} {"train_loss": -27.743011474609375, "global_step": 652139, "epoch": 7857} {"train_loss": -27.485212326049805, "global_step": 652140, "epoch": 7857} {"train_loss": -28.109241485595703, "global_step": 652141, "epoch": 7857} {"train_loss": -27.32755470275879, "global_step": 652142, "epoch": 7857} {"train_loss": -27.997039794921875, "global_step": 652143, "epoch": 7857} {"train_loss": -27.711673736572266, "global_step": 652144, "epoch": 7857} {"train_loss": -27.92046546936035, "global_step": 652145, "epoch": 7857} {"train_loss": -27.77280616760254, "global_step": 652146, "epoch": 7857} {"train_loss": -28.038644790649414, "global_step": 652147, "epoch": 7857} {"train_loss": -28.091291427612305, "global_step": 652148, "epoch": 7857} {"train_loss": -27.711273193359375, "global_step": 652149, "epoch": 7857} {"train_loss": -28.436410903930664, "global_step": 652150, "epoch": 7857} {"train_loss": -27.754621505737305, "global_step": 652151, "epoch": 7857} {"train_loss": -27.993005752563477, "global_step": 652152, "epoch": 7857} {"train_loss": -27.72395133972168, "global_step": 652153, "epoch": 7857} {"train_loss": -27.920019149780273, "global_step": 652154, "epoch": 7857} {"train_loss": -28.39154052734375, "global_step": 652155, "epoch": 7857} {"train_loss": -27.8107852935791, "global_step": 652156, "epoch": 7857} {"train_loss": -28.304534912109375, "global_step": 652157, "epoch": 7857} {"train_loss": -28.15317153930664, "global_step": 652158, "epoch": 7857} {"train_loss": -28.18647575378418, "global_step": 652159, "epoch": 7857} {"train_loss": -28.294763565063477, "global_step": 652160, "epoch": 7857} {"train_loss": -28.18307876586914, "global_step": 652161, "epoch": 7857} {"train_loss": -28.208087921142578, "global_step": 652162, "epoch": 7857} {"train_loss": -28.244314193725586, "global_step": 652163, "epoch": 7857} {"train_loss": -28.12409782409668, "global_step": 652164, "epoch": 7857} {"train_loss": -28.419116973876953, "global_step": 652165, "epoch": 7857} {"train_loss": -28.2075252532959, "global_step": 652166, "epoch": 7857} {"train_loss": -28.24727439880371, "global_step": 652167, "epoch": 7857} {"train_loss": -28.135608673095703, "global_step": 652168, "epoch": 7857} {"train_loss": -27.892797470092773, "global_step": 652169, "epoch": 7857} {"train_loss": -28.009296417236328, "global_step": 652170, "epoch": 7857} {"train_loss": -28.54774284362793, "global_step": 652171, "epoch": 7857} {"train_loss": -28.148252487182617, "global_step": 652172, "epoch": 7857} {"train_loss": -28.0972900390625, "global_step": 652173, "epoch": 7857} {"train_loss": -28.05042839050293, "global_step": 652174, "epoch": 7857} {"train_loss": -28.094675064086914, "global_step": 652175, "epoch": 7857} {"train_loss": -28.012277603149414, "global_step": 652176, "epoch": 7857} {"train_loss": -28.25541114807129, "global_step": 652177, "epoch": 7857} {"train_loss": -28.015790939331055, "global_step": 652178, "epoch": 7857} {"train_loss": -28.572025299072266, "global_step": 652179, "epoch": 7857} {"train_loss": -28.6838436126709, "global_step": 652180, "epoch": 7857} {"train_loss": -28.72944450378418, "global_step": 652181, "epoch": 7857} {"train_loss": -28.698022842407227, "global_step": 652182, "epoch": 7857} {"train_loss": -28.26344108581543, "global_step": 652183, "epoch": 7857} {"train_loss": -28.38799476623535, "global_step": 652184, "epoch": 7857} {"train_loss": -28.703968048095703, "global_step": 652185, "epoch": 7857} {"train_loss": -28.58713722229004, "global_step": 652186, "epoch": 7857} {"train_loss": -28.80124282836914, "global_step": 652187, "epoch": 7857} {"train_loss": -28.04713249206543, "global_step": 652188, "epoch": 7857} {"train_loss": -28.328876495361328, "global_step": 652189, "epoch": 7857} {"train_loss": -28.286787033081055, "global_step": 652190, "epoch": 7857} {"train_loss": -28.43012809753418, "global_step": 652191, "epoch": 7857} {"train_loss": -28.197011947631836, "global_step": 652192, "epoch": 7857} {"train_loss": -28.35353660583496, "global_step": 652193, "epoch": 7857} {"train_loss": -28.664575576782227, "global_step": 652194, "epoch": 7857} {"train_loss": -28.87930679321289, "global_step": 652195, "epoch": 7857} {"train_loss": -28.646442413330078, "global_step": 652196, "epoch": 7857} {"train_loss": -28.46571159362793, "global_step": 652197, "epoch": 7857} {"train_loss": -28.452341079711914, "global_step": 652198, "epoch": 7857} {"train_loss": -28.446044921875, "global_step": 652199, "epoch": 7857} {"train_loss": -28.422666549682617, "global_step": 652200, "epoch": 7857} {"train_loss": -29.166763305664062, "global_step": 652201, "epoch": 7857} {"train_loss": -28.611713409423828, "global_step": 652202, "epoch": 7857} {"train_loss": -28.44061279296875, "global_step": 652203, "epoch": 7857} {"train_loss": -28.34626579284668, "global_step": 652204, "epoch": 7857} {"train_loss": -28.45989990234375, "global_step": 652205, "epoch": 7857} {"train_loss": -28.16253662109375, "global_step": 652206, "epoch": 7857} {"train_loss": -27.66792869567871, "global_step": 652207, "epoch": 7857} {"train_loss": -28.1590576171875, "global_step": 652208, "epoch": 7857} {"train_loss": -28.28415298461914, "global_step": 652209, "epoch": 7857} {"train_loss": -28.43617820739746, "global_step": 652210, "epoch": 7857} {"train_loss": -28.442407608032227, "global_step": 652211, "epoch": 7857} {"train_loss": -28.22381019592285, "global_step": 652212, "epoch": 7857} {"train_loss": -28.149999687470586, "global_step": 652213, "epoch": 7857, "val_loss": 6658727.0} {"train_loss": -27.485193252563477, "global_step": 652214, "epoch": 7858} {"train_loss": -26.443410873413086, "global_step": 652215, "epoch": 7858} {"train_loss": -26.154586791992188, "global_step": 652216, "epoch": 7858} {"train_loss": -26.79277992248535, "global_step": 652217, "epoch": 7858} {"train_loss": -27.573184967041016, "global_step": 652218, "epoch": 7858} {"train_loss": -27.15824317932129, "global_step": 652219, "epoch": 7858} {"train_loss": -26.632200241088867, "global_step": 652220, "epoch": 7858} {"train_loss": -27.85736083984375, "global_step": 652221, "epoch": 7858} {"train_loss": -27.502674102783203, "global_step": 652222, "epoch": 7858} {"train_loss": -27.066923141479492, "global_step": 652223, "epoch": 7858} {"train_loss": -28.03901481628418, "global_step": 652224, "epoch": 7858} {"train_loss": -26.866235733032227, "global_step": 652225, "epoch": 7858} {"train_loss": -27.47979164123535, "global_step": 652226, "epoch": 7858} {"train_loss": -27.88960075378418, "global_step": 652227, "epoch": 7858} {"train_loss": -27.767236709594727, "global_step": 652228, "epoch": 7858} {"train_loss": -27.841339111328125, "global_step": 652229, "epoch": 7858} {"train_loss": -28.008609771728516, "global_step": 652230, "epoch": 7858} {"train_loss": -27.786970138549805, "global_step": 652231, "epoch": 7858} {"train_loss": -27.901525497436523, "global_step": 652232, "epoch": 7858} {"train_loss": -27.887989044189453, "global_step": 652233, "epoch": 7858} {"train_loss": -27.46953773498535, "global_step": 652234, "epoch": 7858} {"train_loss": -27.903106689453125, "global_step": 652235, "epoch": 7858} {"train_loss": -28.0221004486084, "global_step": 652236, "epoch": 7858} {"train_loss": -27.683551788330078, "global_step": 652237, "epoch": 7858} {"train_loss": -28.016157150268555, "global_step": 652238, "epoch": 7858} {"train_loss": -28.0019474029541, "global_step": 652239, "epoch": 7858} {"train_loss": -28.084924697875977, "global_step": 652240, "epoch": 7858} {"train_loss": -28.097808837890625, "global_step": 652241, "epoch": 7858} {"train_loss": -28.314208984375, "global_step": 652242, "epoch": 7858} {"train_loss": -28.1851749420166, "global_step": 652243, "epoch": 7858} {"train_loss": -28.082571029663086, "global_step": 652244, "epoch": 7858} {"train_loss": -28.642688751220703, "global_step": 652245, "epoch": 7858} {"train_loss": -28.27850914001465, "global_step": 652246, "epoch": 7858} {"train_loss": -28.304880142211914, "global_step": 652247, "epoch": 7858} {"train_loss": -28.510208129882812, "global_step": 652248, "epoch": 7858} {"train_loss": -28.341583251953125, "global_step": 652249, "epoch": 7858} {"train_loss": -28.376174926757812, "global_step": 652250, "epoch": 7858} {"train_loss": -28.469751358032227, "global_step": 652251, "epoch": 7858} {"train_loss": -28.449934005737305, "global_step": 652252, "epoch": 7858} {"train_loss": -28.39698600769043, "global_step": 652253, "epoch": 7858} {"train_loss": -28.571969985961914, "global_step": 652254, "epoch": 7858} {"train_loss": -28.358905792236328, "global_step": 652255, "epoch": 7858} {"train_loss": -28.529010772705078, "global_step": 652256, "epoch": 7858} {"train_loss": -28.397327423095703, "global_step": 652257, "epoch": 7858} {"train_loss": -28.537525177001953, "global_step": 652258, "epoch": 7858} {"train_loss": -28.59345054626465, "global_step": 652259, "epoch": 7858} {"train_loss": -28.755542755126953, "global_step": 652260, "epoch": 7858} {"train_loss": -28.495946884155273, "global_step": 652261, "epoch": 7858} {"train_loss": -28.682025909423828, "global_step": 652262, "epoch": 7858} {"train_loss": -28.525537490844727, "global_step": 652263, "epoch": 7858} {"train_loss": -28.3358211517334, "global_step": 652264, "epoch": 7858} {"train_loss": -28.28513526916504, "global_step": 652265, "epoch": 7858} {"train_loss": -28.51827049255371, "global_step": 652266, "epoch": 7858} {"train_loss": -28.105390548706055, "global_step": 652267, "epoch": 7858} {"train_loss": -28.503625869750977, "global_step": 652268, "epoch": 7858} {"train_loss": -28.27400779724121, "global_step": 652269, "epoch": 7858} {"train_loss": -28.386188507080078, "global_step": 652270, "epoch": 7858} {"train_loss": -28.38970947265625, "global_step": 652271, "epoch": 7858} {"train_loss": -28.489831924438477, "global_step": 652272, "epoch": 7858} {"train_loss": -28.325098037719727, "global_step": 652273, "epoch": 7858} {"train_loss": -28.641620635986328, "global_step": 652274, "epoch": 7858} {"train_loss": -28.578073501586914, "global_step": 652275, "epoch": 7858} {"train_loss": -28.65704345703125, "global_step": 652276, "epoch": 7858} {"train_loss": -28.472990036010742, "global_step": 652277, "epoch": 7858} {"train_loss": -28.073270797729492, "global_step": 652278, "epoch": 7858} {"train_loss": -27.995763778686523, "global_step": 652279, "epoch": 7858} {"train_loss": -27.69677734375, "global_step": 652280, "epoch": 7858} {"train_loss": -27.336017608642578, "global_step": 652281, "epoch": 7858} {"train_loss": -27.83108901977539, "global_step": 652282, "epoch": 7858} {"train_loss": -28.61134147644043, "global_step": 652283, "epoch": 7858} {"train_loss": -28.005340576171875, "global_step": 652284, "epoch": 7858} {"train_loss": -28.00565528869629, "global_step": 652285, "epoch": 7858} {"train_loss": -28.388385772705078, "global_step": 652286, "epoch": 7858} {"train_loss": -28.160985946655273, "global_step": 652287, "epoch": 7858} {"train_loss": -28.429773330688477, "global_step": 652288, "epoch": 7858} {"train_loss": -28.272207260131836, "global_step": 652289, "epoch": 7858} {"train_loss": -28.24439811706543, "global_step": 652290, "epoch": 7858} {"train_loss": -27.930404663085938, "global_step": 652291, "epoch": 7858} {"train_loss": -27.950170516967773, "global_step": 652292, "epoch": 7858} {"train_loss": -28.31239128112793, "global_step": 652293, "epoch": 7858} {"train_loss": -27.839506149291992, "global_step": 652294, "epoch": 7858} {"train_loss": -27.856611251831055, "global_step": 652295, "epoch": 7858} {"train_loss": -28.043385126504553, "global_step": 652296, "epoch": 7858, "val_loss": 6635200.0} {"train_loss": -24.570709228515625, "global_step": 652297, "epoch": 7859} {"train_loss": -23.987218856811523, "global_step": 652298, "epoch": 7859} {"train_loss": -23.410659790039062, "global_step": 652299, "epoch": 7859} {"train_loss": -25.637479782104492, "global_step": 652300, "epoch": 7859} {"train_loss": -24.10251235961914, "global_step": 652301, "epoch": 7859} {"train_loss": -25.6413516998291, "global_step": 652302, "epoch": 7859} {"train_loss": -25.712512969970703, "global_step": 652303, "epoch": 7859} {"train_loss": -25.608190536499023, "global_step": 652304, "epoch": 7859} {"train_loss": -25.599233627319336, "global_step": 652305, "epoch": 7859} {"train_loss": -25.84352684020996, "global_step": 652306, "epoch": 7859} {"train_loss": -25.334491729736328, "global_step": 652307, "epoch": 7859} {"train_loss": -25.5624942779541, "global_step": 652308, "epoch": 7859} {"train_loss": -26.14151382446289, "global_step": 652309, "epoch": 7859} {"train_loss": -25.216459274291992, "global_step": 652310, "epoch": 7859} {"train_loss": -25.635984420776367, "global_step": 652311, "epoch": 7859} {"train_loss": -26.147790908813477, "global_step": 652312, "epoch": 7859} {"train_loss": -25.810760498046875, "global_step": 652313, "epoch": 7859} {"train_loss": -25.484914779663086, "global_step": 652314, "epoch": 7859} {"train_loss": -26.410139083862305, "global_step": 652315, "epoch": 7859} {"train_loss": -26.565168380737305, "global_step": 652316, "epoch": 7859} {"train_loss": -26.322782516479492, "global_step": 652317, "epoch": 7859} {"train_loss": -26.455493927001953, "global_step": 652318, "epoch": 7859} {"train_loss": -26.17060661315918, "global_step": 652319, "epoch": 7859} {"train_loss": -25.976673126220703, "global_step": 652320, "epoch": 7859} {"train_loss": -26.49063491821289, "global_step": 652321, "epoch": 7859} {"train_loss": -26.55507469177246, "global_step": 652322, "epoch": 7859} {"train_loss": -27.044713973999023, "global_step": 652323, "epoch": 7859} {"train_loss": -26.7583065032959, "global_step": 652324, "epoch": 7859} {"train_loss": -26.130695343017578, "global_step": 652325, "epoch": 7859} {"train_loss": -26.175067901611328, "global_step": 652326, "epoch": 7859} {"train_loss": -27.139089584350586, "global_step": 652327, "epoch": 7859} {"train_loss": -27.30917739868164, "global_step": 652328, "epoch": 7859} {"train_loss": -26.388397216796875, "global_step": 652329, "epoch": 7859} {"train_loss": -26.72942543029785, "global_step": 652330, "epoch": 7859} {"train_loss": -27.049869537353516, "global_step": 652331, "epoch": 7859} {"train_loss": -26.95330810546875, "global_step": 652332, "epoch": 7859} {"train_loss": -27.133930206298828, "global_step": 652333, "epoch": 7859} {"train_loss": -27.042211532592773, "global_step": 652334, "epoch": 7859} {"train_loss": -26.717487335205078, "global_step": 652335, "epoch": 7859} {"train_loss": -27.13119888305664, "global_step": 652336, "epoch": 7859} {"train_loss": -27.170995712280273, "global_step": 652337, "epoch": 7859} {"train_loss": -27.023107528686523, "global_step": 652338, "epoch": 7859} {"train_loss": -27.33294677734375, "global_step": 652339, "epoch": 7859} {"train_loss": -27.087726593017578, "global_step": 652340, "epoch": 7859} {"train_loss": -27.060211181640625, "global_step": 652341, "epoch": 7859} {"train_loss": -26.998275756835938, "global_step": 652342, "epoch": 7859} {"train_loss": -27.50983238220215, "global_step": 652343, "epoch": 7859} {"train_loss": -27.12051773071289, "global_step": 652344, "epoch": 7859} {"train_loss": -27.539113998413086, "global_step": 652345, "epoch": 7859} {"train_loss": -27.32891273498535, "global_step": 652346, "epoch": 7859} {"train_loss": -27.123029708862305, "global_step": 652347, "epoch": 7859} {"train_loss": -27.53641700744629, "global_step": 652348, "epoch": 7859} {"train_loss": -27.68043327331543, "global_step": 652349, "epoch": 7859} {"train_loss": -27.647037506103516, "global_step": 652350, "epoch": 7859} {"train_loss": -27.96016502380371, "global_step": 652351, "epoch": 7859} {"train_loss": -27.422332763671875, "global_step": 652352, "epoch": 7859} {"train_loss": -27.1247501373291, "global_step": 652353, "epoch": 7859} {"train_loss": -27.560876846313477, "global_step": 652354, "epoch": 7859} {"train_loss": -27.347309112548828, "global_step": 652355, "epoch": 7859} {"train_loss": -27.316190719604492, "global_step": 652356, "epoch": 7859} {"train_loss": -27.44476318359375, "global_step": 652357, "epoch": 7859} {"train_loss": -26.851627349853516, "global_step": 652358, "epoch": 7859} {"train_loss": -27.09165382385254, "global_step": 652359, "epoch": 7859} {"train_loss": -27.551233291625977, "global_step": 652360, "epoch": 7859} {"train_loss": -27.133743286132812, "global_step": 652361, "epoch": 7859} {"train_loss": -27.462635040283203, "global_step": 652362, "epoch": 7859} {"train_loss": -27.627286911010742, "global_step": 652363, "epoch": 7859} {"train_loss": -26.76564598083496, "global_step": 652364, "epoch": 7859} {"train_loss": -27.204477310180664, "global_step": 652365, "epoch": 7859} {"train_loss": -27.879505157470703, "global_step": 652366, "epoch": 7859} {"train_loss": -27.090261459350586, "global_step": 652367, "epoch": 7859} {"train_loss": -27.121051788330078, "global_step": 652368, "epoch": 7859} {"train_loss": -27.877948760986328, "global_step": 652369, "epoch": 7859} {"train_loss": -27.38545036315918, "global_step": 652370, "epoch": 7859} {"train_loss": -27.366455078125, "global_step": 652371, "epoch": 7859} {"train_loss": -27.191436767578125, "global_step": 652372, "epoch": 7859} {"train_loss": -27.12025260925293, "global_step": 652373, "epoch": 7859} {"train_loss": -27.361867904663086, "global_step": 652374, "epoch": 7859} {"train_loss": -27.201196670532227, "global_step": 652375, "epoch": 7859} {"train_loss": -27.1527156829834, "global_step": 652376, "epoch": 7859} {"train_loss": -27.33465576171875, "global_step": 652377, "epoch": 7859} {"train_loss": -27.059518814086914, "global_step": 652378, "epoch": 7859} {"train_loss": -26.710672309599726, "global_step": 652379, "epoch": 7859, "val_loss": 6604004.0} {"train_loss": -26.861469268798828, "global_step": 652380, "epoch": 7860} {"train_loss": -26.804691314697266, "global_step": 652381, "epoch": 7860} {"train_loss": -26.495935440063477, "global_step": 652382, "epoch": 7860} {"train_loss": -26.94610023498535, "global_step": 652383, "epoch": 7860} {"train_loss": -26.480121612548828, "global_step": 652384, "epoch": 7860} {"train_loss": -27.082172393798828, "global_step": 652385, "epoch": 7860} {"train_loss": -26.52237319946289, "global_step": 652386, "epoch": 7860} {"train_loss": -26.504053115844727, "global_step": 652387, "epoch": 7860} {"train_loss": -26.022235870361328, "global_step": 652388, "epoch": 7860} {"train_loss": -26.468942642211914, "global_step": 652389, "epoch": 7860} {"train_loss": -26.658374786376953, "global_step": 652390, "epoch": 7860} {"train_loss": -27.08235740661621, "global_step": 652391, "epoch": 7860} {"train_loss": -26.73221778869629, "global_step": 652392, "epoch": 7860} {"train_loss": -26.95121192932129, "global_step": 652393, "epoch": 7860} {"train_loss": -26.71162223815918, "global_step": 652394, "epoch": 7860} {"train_loss": -27.031951904296875, "global_step": 652395, "epoch": 7860} {"train_loss": -27.041303634643555, "global_step": 652396, "epoch": 7860} {"train_loss": -27.263193130493164, "global_step": 652397, "epoch": 7860} {"train_loss": -27.220111846923828, "global_step": 652398, "epoch": 7860} {"train_loss": -27.3966007232666, "global_step": 652399, "epoch": 7860} {"train_loss": -26.963581085205078, "global_step": 652400, "epoch": 7860} {"train_loss": -26.617841720581055, "global_step": 652401, "epoch": 7860} {"train_loss": -27.17329216003418, "global_step": 652402, "epoch": 7860} {"train_loss": -26.8658390045166, "global_step": 652403, "epoch": 7860} {"train_loss": -26.949644088745117, "global_step": 652404, "epoch": 7860} {"train_loss": -27.078205108642578, "global_step": 652405, "epoch": 7860} {"train_loss": -27.4649715423584, "global_step": 652406, "epoch": 7860} {"train_loss": -27.160736083984375, "global_step": 652407, "epoch": 7860} {"train_loss": -27.460203170776367, "global_step": 652408, "epoch": 7860} {"train_loss": -26.920978546142578, "global_step": 652409, "epoch": 7860} {"train_loss": -26.681644439697266, "global_step": 652410, "epoch": 7860} {"train_loss": -27.061792373657227, "global_step": 652411, "epoch": 7860} {"train_loss": -27.72538185119629, "global_step": 652412, "epoch": 7860} {"train_loss": -27.362592697143555, "global_step": 652413, "epoch": 7860} {"train_loss": -27.50178337097168, "global_step": 652414, "epoch": 7860} {"train_loss": -27.527441024780273, "global_step": 652415, "epoch": 7860} {"train_loss": -27.658527374267578, "global_step": 652416, "epoch": 7860} {"train_loss": -26.972625732421875, "global_step": 652417, "epoch": 7860} {"train_loss": -27.5863037109375, "global_step": 652418, "epoch": 7860} {"train_loss": -26.872732162475586, "global_step": 652419, "epoch": 7860} {"train_loss": -27.777002334594727, "global_step": 652420, "epoch": 7860} {"train_loss": -27.370092391967773, "global_step": 652421, "epoch": 7860} {"train_loss": -27.666034698486328, "global_step": 652422, "epoch": 7860} {"train_loss": -27.32015037536621, "global_step": 652423, "epoch": 7860} {"train_loss": -27.417377471923828, "global_step": 652424, "epoch": 7860} {"train_loss": -26.95013999938965, "global_step": 652425, "epoch": 7860} {"train_loss": -27.37700843811035, "global_step": 652426, "epoch": 7860} {"train_loss": -27.6025390625, "global_step": 652427, "epoch": 7860} {"train_loss": -27.5289249420166, "global_step": 652428, "epoch": 7860} {"train_loss": -27.38331413269043, "global_step": 652429, "epoch": 7860} {"train_loss": -27.69343376159668, "global_step": 652430, "epoch": 7860} {"train_loss": -27.87601089477539, "global_step": 652431, "epoch": 7860} {"train_loss": -27.651960372924805, "global_step": 652432, "epoch": 7860} {"train_loss": -27.700393676757812, "global_step": 652433, "epoch": 7860} {"train_loss": -27.888778686523438, "global_step": 652434, "epoch": 7860} {"train_loss": -28.125391006469727, "global_step": 652435, "epoch": 7860} {"train_loss": -28.125629425048828, "global_step": 652436, "epoch": 7860} {"train_loss": -28.096338272094727, "global_step": 652437, "epoch": 7860} {"train_loss": -28.252639770507812, "global_step": 652438, "epoch": 7860} {"train_loss": -27.904438018798828, "global_step": 652439, "epoch": 7860} {"train_loss": -27.928359985351562, "global_step": 652440, "epoch": 7860} {"train_loss": -27.597797393798828, "global_step": 652441, "epoch": 7860} {"train_loss": -27.459936141967773, "global_step": 652442, "epoch": 7860} {"train_loss": -27.29300308227539, "global_step": 652443, "epoch": 7860} {"train_loss": -28.26192283630371, "global_step": 652444, "epoch": 7860} {"train_loss": -27.9426212310791, "global_step": 652445, "epoch": 7860} {"train_loss": -27.654647827148438, "global_step": 652446, "epoch": 7860} {"train_loss": -28.017047882080078, "global_step": 652447, "epoch": 7860} {"train_loss": -28.28487205505371, "global_step": 652448, "epoch": 7860} {"train_loss": -27.879261016845703, "global_step": 652449, "epoch": 7860} {"train_loss": -27.884016036987305, "global_step": 652450, "epoch": 7860} {"train_loss": -27.82781982421875, "global_step": 652451, "epoch": 7860} {"train_loss": -28.128936767578125, "global_step": 652452, "epoch": 7860} {"train_loss": -27.856250762939453, "global_step": 652453, "epoch": 7860} {"train_loss": -27.310712814331055, "global_step": 652454, "epoch": 7860} {"train_loss": -27.51789665222168, "global_step": 652455, "epoch": 7860} {"train_loss": -27.415143966674805, "global_step": 652456, "epoch": 7860} {"train_loss": -28.472949981689453, "global_step": 652457, "epoch": 7860} {"train_loss": -27.8642635345459, "global_step": 652458, "epoch": 7860} {"train_loss": -27.05146598815918, "global_step": 652459, "epoch": 7860} {"train_loss": -28.43212890625, "global_step": 652460, "epoch": 7860} {"train_loss": -27.507184982299805, "global_step": 652461, "epoch": 7860} {"train_loss": -27.38916461439018, "global_step": 652462, "epoch": 7860, "val_loss": 6610599.0} {"train_loss": -26.67560386657715, "global_step": 652463, "epoch": 7861} {"train_loss": -27.1466007232666, "global_step": 652464, "epoch": 7861} {"train_loss": -26.89752197265625, "global_step": 652465, "epoch": 7861} {"train_loss": -25.939361572265625, "global_step": 652466, "epoch": 7861} {"train_loss": -26.882431030273438, "global_step": 652467, "epoch": 7861} {"train_loss": -26.307382583618164, "global_step": 652468, "epoch": 7861} {"train_loss": -27.1916561126709, "global_step": 652469, "epoch": 7861} {"train_loss": -27.07547378540039, "global_step": 652470, "epoch": 7861} {"train_loss": -27.169721603393555, "global_step": 652471, "epoch": 7861} {"train_loss": -27.0362548828125, "global_step": 652472, "epoch": 7861} {"train_loss": -27.22242546081543, "global_step": 652473, "epoch": 7861} {"train_loss": -26.455129623413086, "global_step": 652474, "epoch": 7861} {"train_loss": -27.1358585357666, "global_step": 652475, "epoch": 7861} {"train_loss": -27.419097900390625, "global_step": 652476, "epoch": 7861} {"train_loss": -27.5438232421875, "global_step": 652477, "epoch": 7861} {"train_loss": -27.9383602142334, "global_step": 652478, "epoch": 7861} {"train_loss": -27.325897216796875, "global_step": 652479, "epoch": 7861} {"train_loss": -27.884069442749023, "global_step": 652480, "epoch": 7861} {"train_loss": -27.76973533630371, "global_step": 652481, "epoch": 7861} {"train_loss": -28.02911376953125, "global_step": 652482, "epoch": 7861} {"train_loss": -27.708581924438477, "global_step": 652483, "epoch": 7861} {"train_loss": -27.327072143554688, "global_step": 652484, "epoch": 7861} {"train_loss": -27.605737686157227, "global_step": 652485, "epoch": 7861} {"train_loss": -27.680774688720703, "global_step": 652486, "epoch": 7861} {"train_loss": -27.89906883239746, "global_step": 652487, "epoch": 7861} {"train_loss": -27.9212703704834, "global_step": 652488, "epoch": 7861} {"train_loss": -27.605390548706055, "global_step": 652489, "epoch": 7861} {"train_loss": -27.661529541015625, "global_step": 652490, "epoch": 7861} {"train_loss": -27.944793701171875, "global_step": 652491, "epoch": 7861} {"train_loss": -27.869531631469727, "global_step": 652492, "epoch": 7861} {"train_loss": -27.81608009338379, "global_step": 652493, "epoch": 7861} {"train_loss": -28.109521865844727, "global_step": 652494, "epoch": 7861} {"train_loss": -27.9805850982666, "global_step": 652495, "epoch": 7861} {"train_loss": -27.81931495666504, "global_step": 652496, "epoch": 7861} {"train_loss": -27.966053009033203, "global_step": 652497, "epoch": 7861} {"train_loss": -28.235483169555664, "global_step": 652498, "epoch": 7861} {"train_loss": -28.304636001586914, "global_step": 652499, "epoch": 7861} {"train_loss": -27.6589298248291, "global_step": 652500, "epoch": 7861} {"train_loss": -28.360595703125, "global_step": 652501, "epoch": 7861} {"train_loss": -28.153467178344727, "global_step": 652502, "epoch": 7861} {"train_loss": -28.10798454284668, "global_step": 652503, "epoch": 7861} {"train_loss": -27.916858673095703, "global_step": 652504, "epoch": 7861} {"train_loss": -28.2990779876709, "global_step": 652505, "epoch": 7861} {"train_loss": -28.61884880065918, "global_step": 652506, "epoch": 7861} {"train_loss": -28.102523803710938, "global_step": 652507, "epoch": 7861} {"train_loss": -28.396154403686523, "global_step": 652508, "epoch": 7861} {"train_loss": -28.121417999267578, "global_step": 652509, "epoch": 7861} {"train_loss": -28.223291397094727, "global_step": 652510, "epoch": 7861} {"train_loss": -27.950239181518555, "global_step": 652511, "epoch": 7861} {"train_loss": -28.042346954345703, "global_step": 652512, "epoch": 7861} {"train_loss": -28.200437545776367, "global_step": 652513, "epoch": 7861} {"train_loss": -28.244077682495117, "global_step": 652514, "epoch": 7861} {"train_loss": -28.18609046936035, "global_step": 652515, "epoch": 7861} {"train_loss": -28.240407943725586, "global_step": 652516, "epoch": 7861} {"train_loss": -28.295785903930664, "global_step": 652517, "epoch": 7861} {"train_loss": -28.35210609436035, "global_step": 652518, "epoch": 7861} {"train_loss": -28.14990234375, "global_step": 652519, "epoch": 7861} {"train_loss": -28.3851375579834, "global_step": 652520, "epoch": 7861} {"train_loss": -28.290735244750977, "global_step": 652521, "epoch": 7861} {"train_loss": -27.889020919799805, "global_step": 652522, "epoch": 7861} {"train_loss": -28.28842544555664, "global_step": 652523, "epoch": 7861} {"train_loss": -27.927518844604492, "global_step": 652524, "epoch": 7861} {"train_loss": -28.117237091064453, "global_step": 652525, "epoch": 7861} {"train_loss": -27.95405387878418, "global_step": 652526, "epoch": 7861} {"train_loss": -28.849777221679688, "global_step": 652527, "epoch": 7861} {"train_loss": -28.295812606811523, "global_step": 652528, "epoch": 7861} {"train_loss": -28.04364013671875, "global_step": 652529, "epoch": 7861} {"train_loss": -28.235095977783203, "global_step": 652530, "epoch": 7861} {"train_loss": -28.262876510620117, "global_step": 652531, "epoch": 7861} {"train_loss": -28.310440063476562, "global_step": 652532, "epoch": 7861} {"train_loss": -28.18701171875, "global_step": 652533, "epoch": 7861} {"train_loss": -28.109960556030273, "global_step": 652534, "epoch": 7861} {"train_loss": -28.074249267578125, "global_step": 652535, "epoch": 7861} {"train_loss": -27.407495498657227, "global_step": 652536, "epoch": 7861} {"train_loss": -28.426456451416016, "global_step": 652537, "epoch": 7861} {"train_loss": -28.0375919342041, "global_step": 652538, "epoch": 7861} {"train_loss": -28.095373153686523, "global_step": 652539, "epoch": 7861} {"train_loss": -28.0950870513916, "global_step": 652540, "epoch": 7861} {"train_loss": -27.86147117614746, "global_step": 652541, "epoch": 7861} {"train_loss": -27.732471466064453, "global_step": 652542, "epoch": 7861} {"train_loss": -27.293781280517578, "global_step": 652543, "epoch": 7861} {"train_loss": -27.953601837158203, "global_step": 652544, "epoch": 7861} {"train_loss": -27.83238399459655, "global_step": 652545, "epoch": 7861, "val_loss": 6640819.5} {"train_loss": -26.98876953125, "global_step": 652546, "epoch": 7862} {"train_loss": -26.17571449279785, "global_step": 652547, "epoch": 7862} {"train_loss": -26.847204208374023, "global_step": 652548, "epoch": 7862} {"train_loss": -27.334028244018555, "global_step": 652549, "epoch": 7862} {"train_loss": -27.091482162475586, "global_step": 652550, "epoch": 7862} {"train_loss": -26.462194442749023, "global_step": 652551, "epoch": 7862} {"train_loss": -27.71192741394043, "global_step": 652552, "epoch": 7862} {"train_loss": -27.182373046875, "global_step": 652553, "epoch": 7862} {"train_loss": -27.446502685546875, "global_step": 652554, "epoch": 7862} {"train_loss": -27.4669132232666, "global_step": 652555, "epoch": 7862} {"train_loss": -26.94805908203125, "global_step": 652556, "epoch": 7862} {"train_loss": -27.45212745666504, "global_step": 652557, "epoch": 7862} {"train_loss": -27.355289459228516, "global_step": 652558, "epoch": 7862} {"train_loss": -27.250579833984375, "global_step": 652559, "epoch": 7862} {"train_loss": -27.354238510131836, "global_step": 652560, "epoch": 7862} {"train_loss": -27.1866512298584, "global_step": 652561, "epoch": 7862} {"train_loss": -27.873092651367188, "global_step": 652562, "epoch": 7862} {"train_loss": -27.6680850982666, "global_step": 652563, "epoch": 7862} {"train_loss": -27.313932418823242, "global_step": 652564, "epoch": 7862} {"train_loss": -27.725421905517578, "global_step": 652565, "epoch": 7862} {"train_loss": -27.36768913269043, "global_step": 652566, "epoch": 7862} {"train_loss": -27.675580978393555, "global_step": 652567, "epoch": 7862} {"train_loss": -27.539403915405273, "global_step": 652568, "epoch": 7862} {"train_loss": -27.764902114868164, "global_step": 652569, "epoch": 7862} {"train_loss": -27.297147750854492, "global_step": 652570, "epoch": 7862} {"train_loss": -27.874189376831055, "global_step": 652571, "epoch": 7862} {"train_loss": -27.819385528564453, "global_step": 652572, "epoch": 7862} {"train_loss": -27.990039825439453, "global_step": 652573, "epoch": 7862} {"train_loss": -27.865705490112305, "global_step": 652574, "epoch": 7862} {"train_loss": -28.081756591796875, "global_step": 652575, "epoch": 7862} {"train_loss": -27.848041534423828, "global_step": 652576, "epoch": 7862} {"train_loss": -27.984647750854492, "global_step": 652577, "epoch": 7862} {"train_loss": -27.82977867126465, "global_step": 652578, "epoch": 7862} {"train_loss": -28.048480987548828, "global_step": 652579, "epoch": 7862} {"train_loss": -28.002277374267578, "global_step": 652580, "epoch": 7862} {"train_loss": -27.823272705078125, "global_step": 652581, "epoch": 7862} {"train_loss": -27.869369506835938, "global_step": 652582, "epoch": 7862} {"train_loss": -27.79437255859375, "global_step": 652583, "epoch": 7862} {"train_loss": -28.16594886779785, "global_step": 652584, "epoch": 7862} {"train_loss": -28.03140640258789, "global_step": 652585, "epoch": 7862} {"train_loss": -28.033538818359375, "global_step": 652586, "epoch": 7862} {"train_loss": -28.073211669921875, "global_step": 652587, "epoch": 7862} {"train_loss": -28.020841598510742, "global_step": 652588, "epoch": 7862} {"train_loss": -28.115802764892578, "global_step": 652589, "epoch": 7862} {"train_loss": -28.507904052734375, "global_step": 652590, "epoch": 7862} {"train_loss": -28.35883140563965, "global_step": 652591, "epoch": 7862} {"train_loss": -28.45222282409668, "global_step": 652592, "epoch": 7862} {"train_loss": -28.360504150390625, "global_step": 652593, "epoch": 7862} {"train_loss": -28.202173233032227, "global_step": 652594, "epoch": 7862} {"train_loss": -28.32275390625, "global_step": 652595, "epoch": 7862} {"train_loss": -28.290006637573242, "global_step": 652596, "epoch": 7862} {"train_loss": -28.247394561767578, "global_step": 652597, "epoch": 7862} {"train_loss": -28.453161239624023, "global_step": 652598, "epoch": 7862} {"train_loss": -28.53799819946289, "global_step": 652599, "epoch": 7862} {"train_loss": -28.400800704956055, "global_step": 652600, "epoch": 7862} {"train_loss": -28.467166900634766, "global_step": 652601, "epoch": 7862} {"train_loss": -28.296865463256836, "global_step": 652602, "epoch": 7862} {"train_loss": -29.044363021850586, "global_step": 652603, "epoch": 7862} {"train_loss": -28.478214263916016, "global_step": 652604, "epoch": 7862} {"train_loss": -28.675159454345703, "global_step": 652605, "epoch": 7862} {"train_loss": -28.311315536499023, "global_step": 652606, "epoch": 7862} {"train_loss": -28.329858779907227, "global_step": 652607, "epoch": 7862} {"train_loss": -28.865249633789062, "global_step": 652608, "epoch": 7862} {"train_loss": -28.40175437927246, "global_step": 652609, "epoch": 7862} {"train_loss": -28.906904220581055, "global_step": 652610, "epoch": 7862} {"train_loss": -28.3702335357666, "global_step": 652611, "epoch": 7862} {"train_loss": -28.385107040405273, "global_step": 652612, "epoch": 7862} {"train_loss": -28.531484603881836, "global_step": 652613, "epoch": 7862} {"train_loss": -28.582462310791016, "global_step": 652614, "epoch": 7862} {"train_loss": -27.948474884033203, "global_step": 652615, "epoch": 7862} {"train_loss": -28.390119552612305, "global_step": 652616, "epoch": 7862} {"train_loss": -28.76044273376465, "global_step": 652617, "epoch": 7862} {"train_loss": -28.188886642456055, "global_step": 652618, "epoch": 7862} {"train_loss": -28.44477653503418, "global_step": 652619, "epoch": 7862} {"train_loss": -28.406208038330078, "global_step": 652620, "epoch": 7862} {"train_loss": -28.46282958984375, "global_step": 652621, "epoch": 7862} {"train_loss": -27.763742446899414, "global_step": 652622, "epoch": 7862} {"train_loss": -27.820119857788086, "global_step": 652623, "epoch": 7862} {"train_loss": -28.02646827697754, "global_step": 652624, "epoch": 7862} {"train_loss": -28.02373695373535, "global_step": 652625, "epoch": 7862} {"train_loss": -27.53297233581543, "global_step": 652626, "epoch": 7862} {"train_loss": -27.695730209350586, "global_step": 652627, "epoch": 7862} {"train_loss": -27.934150534940052, "global_step": 652628, "epoch": 7862, "val_loss": 6626132.0} {"train_loss": -26.221220016479492, "global_step": 652629, "epoch": 7863} {"train_loss": -26.094257354736328, "global_step": 652630, "epoch": 7863} {"train_loss": -26.51910400390625, "global_step": 652631, "epoch": 7863} {"train_loss": -26.50465965270996, "global_step": 652632, "epoch": 7863} {"train_loss": -27.073434829711914, "global_step": 652633, "epoch": 7863} {"train_loss": -26.16851806640625, "global_step": 652634, "epoch": 7863} {"train_loss": -26.875085830688477, "global_step": 652635, "epoch": 7863} {"train_loss": -26.904584884643555, "global_step": 652636, "epoch": 7863} {"train_loss": -27.505390167236328, "global_step": 652637, "epoch": 7863} {"train_loss": -27.1057186126709, "global_step": 652638, "epoch": 7863} {"train_loss": -27.436248779296875, "global_step": 652639, "epoch": 7863} {"train_loss": -26.691747665405273, "global_step": 652640, "epoch": 7863} {"train_loss": -26.862279891967773, "global_step": 652641, "epoch": 7863} {"train_loss": -27.572021484375, "global_step": 652642, "epoch": 7863} {"train_loss": -27.18922996520996, "global_step": 652643, "epoch": 7863} {"train_loss": -27.693506240844727, "global_step": 652644, "epoch": 7863} {"train_loss": -28.192758560180664, "global_step": 652645, "epoch": 7863} {"train_loss": -27.849332809448242, "global_step": 652646, "epoch": 7863} {"train_loss": -27.67156982421875, "global_step": 652647, "epoch": 7863} {"train_loss": -27.698606491088867, "global_step": 652648, "epoch": 7863} {"train_loss": -27.420059204101562, "global_step": 652649, "epoch": 7863} {"train_loss": -27.92331886291504, "global_step": 652650, "epoch": 7863} {"train_loss": -27.65167808532715, "global_step": 652651, "epoch": 7863} {"train_loss": -27.738571166992188, "global_step": 652652, "epoch": 7863} {"train_loss": -27.585601806640625, "global_step": 652653, "epoch": 7863} {"train_loss": -28.028913497924805, "global_step": 652654, "epoch": 7863} {"train_loss": -27.822921752929688, "global_step": 652655, "epoch": 7863} {"train_loss": -27.965356826782227, "global_step": 652656, "epoch": 7863} {"train_loss": -27.843839645385742, "global_step": 652657, "epoch": 7863} {"train_loss": -27.861661911010742, "global_step": 652658, "epoch": 7863} {"train_loss": -27.914098739624023, "global_step": 652659, "epoch": 7863} {"train_loss": -27.928991317749023, "global_step": 652660, "epoch": 7863} {"train_loss": -28.3091983795166, "global_step": 652661, "epoch": 7863} {"train_loss": -28.25459861755371, "global_step": 652662, "epoch": 7863} {"train_loss": -28.2525577545166, "global_step": 652663, "epoch": 7863} {"train_loss": -28.217315673828125, "global_step": 652664, "epoch": 7863} {"train_loss": -28.063047409057617, "global_step": 652665, "epoch": 7863} {"train_loss": -28.044042587280273, "global_step": 652666, "epoch": 7863} {"train_loss": -28.112613677978516, "global_step": 652667, "epoch": 7863} {"train_loss": -28.272693634033203, "global_step": 652668, "epoch": 7863} {"train_loss": -28.520004272460938, "global_step": 652669, "epoch": 7863} {"train_loss": -28.375158309936523, "global_step": 652670, "epoch": 7863} {"train_loss": -28.324254989624023, "global_step": 652671, "epoch": 7863} {"train_loss": -28.339019775390625, "global_step": 652672, "epoch": 7863} {"train_loss": -28.155981063842773, "global_step": 652673, "epoch": 7863} {"train_loss": -28.673721313476562, "global_step": 652674, "epoch": 7863} {"train_loss": -28.566686630249023, "global_step": 652675, "epoch": 7863} {"train_loss": -28.426105499267578, "global_step": 652676, "epoch": 7863} {"train_loss": -28.218921661376953, "global_step": 652677, "epoch": 7863} {"train_loss": -28.439538955688477, "global_step": 652678, "epoch": 7863} {"train_loss": -28.07887077331543, "global_step": 652679, "epoch": 7863} {"train_loss": -28.310941696166992, "global_step": 652680, "epoch": 7863} {"train_loss": -28.601709365844727, "global_step": 652681, "epoch": 7863} {"train_loss": -28.12383460998535, "global_step": 652682, "epoch": 7863} {"train_loss": -28.560285568237305, "global_step": 652683, "epoch": 7863} {"train_loss": -28.4216365814209, "global_step": 652684, "epoch": 7863} {"train_loss": -28.589923858642578, "global_step": 652685, "epoch": 7863} {"train_loss": -28.927326202392578, "global_step": 652686, "epoch": 7863} {"train_loss": -28.47085952758789, "global_step": 652687, "epoch": 7863} {"train_loss": -28.447132110595703, "global_step": 652688, "epoch": 7863} {"train_loss": -28.426122665405273, "global_step": 652689, "epoch": 7863} {"train_loss": -28.605939865112305, "global_step": 652690, "epoch": 7863} {"train_loss": -28.4578857421875, "global_step": 652691, "epoch": 7863} {"train_loss": -27.91122817993164, "global_step": 652692, "epoch": 7863} {"train_loss": -28.398237228393555, "global_step": 652693, "epoch": 7863} {"train_loss": -28.558975219726562, "global_step": 652694, "epoch": 7863} {"train_loss": -28.769113540649414, "global_step": 652695, "epoch": 7863} {"train_loss": -28.279285430908203, "global_step": 652696, "epoch": 7863} {"train_loss": -28.63205337524414, "global_step": 652697, "epoch": 7863} {"train_loss": -28.367090225219727, "global_step": 652698, "epoch": 7863} {"train_loss": -28.362668991088867, "global_step": 652699, "epoch": 7863} {"train_loss": -28.34464454650879, "global_step": 652700, "epoch": 7863} {"train_loss": -28.509496688842773, "global_step": 652701, "epoch": 7863} {"train_loss": -28.560705184936523, "global_step": 652702, "epoch": 7863} {"train_loss": -28.549972534179688, "global_step": 652703, "epoch": 7863} {"train_loss": -28.499418258666992, "global_step": 652704, "epoch": 7863} {"train_loss": -28.5546875, "global_step": 652705, "epoch": 7863} {"train_loss": -28.633310317993164, "global_step": 652706, "epoch": 7863} {"train_loss": -28.830068588256836, "global_step": 652707, "epoch": 7863} {"train_loss": -28.802515029907227, "global_step": 652708, "epoch": 7863} {"train_loss": -28.520483016967773, "global_step": 652709, "epoch": 7863} {"train_loss": -28.3900089263916, "global_step": 652710, "epoch": 7863} {"train_loss": -28.012987527502588, "global_step": 652711, "epoch": 7863, "val_loss": 6584566.5} {"train_loss": -27.60664176940918, "global_step": 652712, "epoch": 7864} {"train_loss": -27.539005279541016, "global_step": 652713, "epoch": 7864} {"train_loss": -27.463369369506836, "global_step": 652714, "epoch": 7864} {"train_loss": -27.578022003173828, "global_step": 652715, "epoch": 7864} {"train_loss": -27.475873947143555, "global_step": 652716, "epoch": 7864} {"train_loss": -27.409027099609375, "global_step": 652717, "epoch": 7864} {"train_loss": -27.054462432861328, "global_step": 652718, "epoch": 7864} {"train_loss": -27.70953369140625, "global_step": 652719, "epoch": 7864} {"train_loss": -27.65024757385254, "global_step": 652720, "epoch": 7864} {"train_loss": -27.96087646484375, "global_step": 652721, "epoch": 7864} {"train_loss": -28.175567626953125, "global_step": 652722, "epoch": 7864} {"train_loss": -28.215131759643555, "global_step": 652723, "epoch": 7864} {"train_loss": -27.85599708557129, "global_step": 652724, "epoch": 7864} {"train_loss": -28.29758644104004, "global_step": 652725, "epoch": 7864} {"train_loss": -27.89112663269043, "global_step": 652726, "epoch": 7864} {"train_loss": -27.960622787475586, "global_step": 652727, "epoch": 7864} {"train_loss": -28.00444984436035, "global_step": 652728, "epoch": 7864} {"train_loss": -28.239789962768555, "global_step": 652729, "epoch": 7864} {"train_loss": -27.92363929748535, "global_step": 652730, "epoch": 7864} {"train_loss": -27.97745704650879, "global_step": 652731, "epoch": 7864} {"train_loss": -28.0163631439209, "global_step": 652732, "epoch": 7864} {"train_loss": -28.3406982421875, "global_step": 652733, "epoch": 7864} {"train_loss": -28.22568130493164, "global_step": 652734, "epoch": 7864} {"train_loss": -28.448389053344727, "global_step": 652735, "epoch": 7864} {"train_loss": -28.354822158813477, "global_step": 652736, "epoch": 7864} {"train_loss": -27.901350021362305, "global_step": 652737, "epoch": 7864} {"train_loss": -27.83890724182129, "global_step": 652738, "epoch": 7864} {"train_loss": -28.2658748626709, "global_step": 652739, "epoch": 7864} {"train_loss": -28.107954025268555, "global_step": 652740, "epoch": 7864} {"train_loss": -28.348331451416016, "global_step": 652741, "epoch": 7864} {"train_loss": -28.593433380126953, "global_step": 652742, "epoch": 7864} {"train_loss": -28.0384464263916, "global_step": 652743, "epoch": 7864} {"train_loss": -28.982864379882812, "global_step": 652744, "epoch": 7864} {"train_loss": -28.573627471923828, "global_step": 652745, "epoch": 7864} {"train_loss": -28.400821685791016, "global_step": 652746, "epoch": 7864} {"train_loss": -28.222604751586914, "global_step": 652747, "epoch": 7864} {"train_loss": -28.437549591064453, "global_step": 652748, "epoch": 7864} {"train_loss": -28.63296890258789, "global_step": 652749, "epoch": 7864} {"train_loss": -28.35698890686035, "global_step": 652750, "epoch": 7864} {"train_loss": -28.36073112487793, "global_step": 652751, "epoch": 7864} {"train_loss": -28.034687042236328, "global_step": 652752, "epoch": 7864} {"train_loss": -28.1503963470459, "global_step": 652753, "epoch": 7864} {"train_loss": -28.489429473876953, "global_step": 652754, "epoch": 7864} {"train_loss": -28.622013092041016, "global_step": 652755, "epoch": 7864} {"train_loss": -28.4187068939209, "global_step": 652756, "epoch": 7864} {"train_loss": -28.599172592163086, "global_step": 652757, "epoch": 7864} {"train_loss": -28.5340633392334, "global_step": 652758, "epoch": 7864} {"train_loss": -28.30488395690918, "global_step": 652759, "epoch": 7864} {"train_loss": -28.595163345336914, "global_step": 652760, "epoch": 7864} {"train_loss": -28.133075714111328, "global_step": 652761, "epoch": 7864} {"train_loss": -28.504613876342773, "global_step": 652762, "epoch": 7864} {"train_loss": -28.218687057495117, "global_step": 652763, "epoch": 7864} {"train_loss": -28.490680694580078, "global_step": 652764, "epoch": 7864} {"train_loss": -27.9145450592041, "global_step": 652765, "epoch": 7864} {"train_loss": -28.22439956665039, "global_step": 652766, "epoch": 7864} {"train_loss": -28.1307430267334, "global_step": 652767, "epoch": 7864} {"train_loss": -28.792036056518555, "global_step": 652768, "epoch": 7864} {"train_loss": -28.313232421875, "global_step": 652769, "epoch": 7864} {"train_loss": -28.30311393737793, "global_step": 652770, "epoch": 7864} {"train_loss": -28.308629989624023, "global_step": 652771, "epoch": 7864} {"train_loss": -28.577625274658203, "global_step": 652772, "epoch": 7864} {"train_loss": -28.466827392578125, "global_step": 652773, "epoch": 7864} {"train_loss": -28.009672164916992, "global_step": 652774, "epoch": 7864} {"train_loss": -28.58277702331543, "global_step": 652775, "epoch": 7864} {"train_loss": -28.642667770385742, "global_step": 652776, "epoch": 7864} {"train_loss": -28.220544815063477, "global_step": 652777, "epoch": 7864} {"train_loss": -28.18938636779785, "global_step": 652778, "epoch": 7864} {"train_loss": -28.169015884399414, "global_step": 652779, "epoch": 7864} {"train_loss": -28.13179588317871, "global_step": 652780, "epoch": 7864} {"train_loss": -28.011646270751953, "global_step": 652781, "epoch": 7864} {"train_loss": -28.319334030151367, "global_step": 652782, "epoch": 7864} {"train_loss": -28.326730728149414, "global_step": 652783, "epoch": 7864} {"train_loss": -28.084009170532227, "global_step": 652784, "epoch": 7864} {"train_loss": -28.3248348236084, "global_step": 652785, "epoch": 7864} {"train_loss": -28.349119186401367, "global_step": 652786, "epoch": 7864} {"train_loss": -28.416601181030273, "global_step": 652787, "epoch": 7864} {"train_loss": -28.448328018188477, "global_step": 652788, "epoch": 7864} {"train_loss": -28.2784423828125, "global_step": 652789, "epoch": 7864} {"train_loss": -28.332006454467773, "global_step": 652790, "epoch": 7864} {"train_loss": -28.23792839050293, "global_step": 652791, "epoch": 7864} {"train_loss": -28.131927490234375, "global_step": 652792, "epoch": 7864} {"train_loss": -28.310461044311523, "global_step": 652793, "epoch": 7864} {"train_loss": -28.203395705625237, "global_step": 652794, "epoch": 7864, "val_loss": 6611756.0} {"train_loss": -27.041004180908203, "global_step": 652795, "epoch": 7865} {"train_loss": -27.1522216796875, "global_step": 652796, "epoch": 7865} {"train_loss": -27.494598388671875, "global_step": 652797, "epoch": 7865} {"train_loss": -28.07990837097168, "global_step": 652798, "epoch": 7865} {"train_loss": -27.907550811767578, "global_step": 652799, "epoch": 7865} {"train_loss": -28.003576278686523, "global_step": 652800, "epoch": 7865} {"train_loss": -27.781164169311523, "global_step": 652801, "epoch": 7865} {"train_loss": -28.49506187438965, "global_step": 652802, "epoch": 7865} {"train_loss": -27.871173858642578, "global_step": 652803, "epoch": 7865} {"train_loss": -28.21004295349121, "global_step": 652804, "epoch": 7865} {"train_loss": -27.842147827148438, "global_step": 652805, "epoch": 7865} {"train_loss": -27.705331802368164, "global_step": 652806, "epoch": 7865} {"train_loss": -27.791046142578125, "global_step": 652807, "epoch": 7865} {"train_loss": -28.262548446655273, "global_step": 652808, "epoch": 7865} {"train_loss": -28.29341697692871, "global_step": 652809, "epoch": 7865} {"train_loss": -27.74420166015625, "global_step": 652810, "epoch": 7865} {"train_loss": -28.246429443359375, "global_step": 652811, "epoch": 7865} {"train_loss": -28.04595375061035, "global_step": 652812, "epoch": 7865} {"train_loss": -27.99761390686035, "global_step": 652813, "epoch": 7865} {"train_loss": -27.931121826171875, "global_step": 652814, "epoch": 7865} {"train_loss": -28.0529727935791, "global_step": 652815, "epoch": 7865} {"train_loss": -28.206756591796875, "global_step": 652816, "epoch": 7865} {"train_loss": -28.090383529663086, "global_step": 652817, "epoch": 7865} {"train_loss": -27.897565841674805, "global_step": 652818, "epoch": 7865} {"train_loss": -28.235279083251953, "global_step": 652819, "epoch": 7865} {"train_loss": -27.90785026550293, "global_step": 652820, "epoch": 7865} {"train_loss": -28.27088737487793, "global_step": 652821, "epoch": 7865} {"train_loss": -28.515827178955078, "global_step": 652822, "epoch": 7865} {"train_loss": -28.100955963134766, "global_step": 652823, "epoch": 7865} {"train_loss": -28.239171981811523, "global_step": 652824, "epoch": 7865} {"train_loss": -28.190000534057617, "global_step": 652825, "epoch": 7865} {"train_loss": -28.15791130065918, "global_step": 652826, "epoch": 7865} {"train_loss": -28.53837013244629, "global_step": 652827, "epoch": 7865} {"train_loss": -28.443647384643555, "global_step": 652828, "epoch": 7865} {"train_loss": -28.2819766998291, "global_step": 652829, "epoch": 7865} {"train_loss": -28.58349609375, "global_step": 652830, "epoch": 7865} {"train_loss": -28.212940216064453, "global_step": 652831, "epoch": 7865} {"train_loss": -28.696008682250977, "global_step": 652832, "epoch": 7865} {"train_loss": -28.49853515625, "global_step": 652833, "epoch": 7865} {"train_loss": -28.731189727783203, "global_step": 652834, "epoch": 7865} {"train_loss": -28.1781063079834, "global_step": 652835, "epoch": 7865} {"train_loss": -28.523046493530273, "global_step": 652836, "epoch": 7865} {"train_loss": -28.43035888671875, "global_step": 652837, "epoch": 7865} {"train_loss": -28.05499839782715, "global_step": 652838, "epoch": 7865} {"train_loss": -28.325037002563477, "global_step": 652839, "epoch": 7865} {"train_loss": -28.346715927124023, "global_step": 652840, "epoch": 7865} {"train_loss": -28.363706588745117, "global_step": 652841, "epoch": 7865} {"train_loss": -28.002389907836914, "global_step": 652842, "epoch": 7865} {"train_loss": -27.62595558166504, "global_step": 652843, "epoch": 7865} {"train_loss": -27.402267456054688, "global_step": 652844, "epoch": 7865} {"train_loss": -27.624082565307617, "global_step": 652845, "epoch": 7865} {"train_loss": -27.673460006713867, "global_step": 652846, "epoch": 7865} {"train_loss": -28.509435653686523, "global_step": 652847, "epoch": 7865} {"train_loss": -27.96078872680664, "global_step": 652848, "epoch": 7865} {"train_loss": -27.357934951782227, "global_step": 652849, "epoch": 7865} {"train_loss": -27.46661376953125, "global_step": 652850, "epoch": 7865} {"train_loss": -28.241952896118164, "global_step": 652851, "epoch": 7865} {"train_loss": -28.15825843811035, "global_step": 652852, "epoch": 7865} {"train_loss": -28.218448638916016, "global_step": 652853, "epoch": 7865} {"train_loss": -28.08552360534668, "global_step": 652854, "epoch": 7865} {"train_loss": -28.428171157836914, "global_step": 652855, "epoch": 7865} {"train_loss": -28.094457626342773, "global_step": 652856, "epoch": 7865} {"train_loss": -28.048736572265625, "global_step": 652857, "epoch": 7865} {"train_loss": -28.444538116455078, "global_step": 652858, "epoch": 7865} {"train_loss": -28.399890899658203, "global_step": 652859, "epoch": 7865} {"train_loss": -28.38958740234375, "global_step": 652860, "epoch": 7865} {"train_loss": -28.255102157592773, "global_step": 652861, "epoch": 7865} {"train_loss": -28.397842407226562, "global_step": 652862, "epoch": 7865} {"train_loss": -28.240758895874023, "global_step": 652863, "epoch": 7865} {"train_loss": -28.169309616088867, "global_step": 652864, "epoch": 7865} {"train_loss": -28.430280685424805, "global_step": 652865, "epoch": 7865} {"train_loss": -28.2513370513916, "global_step": 652866, "epoch": 7865} {"train_loss": -28.361637115478516, "global_step": 652867, "epoch": 7865} {"train_loss": -28.287927627563477, "global_step": 652868, "epoch": 7865} {"train_loss": -28.606674194335938, "global_step": 652869, "epoch": 7865} {"train_loss": -27.901355743408203, "global_step": 652870, "epoch": 7865} {"train_loss": -28.189374923706055, "global_step": 652871, "epoch": 7865} {"train_loss": -28.14173698425293, "global_step": 652872, "epoch": 7865} {"train_loss": -28.450836181640625, "global_step": 652873, "epoch": 7865} {"train_loss": -28.402210235595703, "global_step": 652874, "epoch": 7865} {"train_loss": -28.29436683654785, "global_step": 652875, "epoch": 7865} {"train_loss": -28.415119171142578, "global_step": 652876, "epoch": 7865} {"train_loss": -28.131308199411414, "global_step": 652877, "epoch": 7865, "val_loss": 6612132.0} {"train_loss": -28.506711959838867, "global_step": 652878, "epoch": 7866} {"train_loss": -28.453113555908203, "global_step": 652879, "epoch": 7866} {"train_loss": -28.370569229125977, "global_step": 652880, "epoch": 7866} {"train_loss": -28.06001091003418, "global_step": 652881, "epoch": 7866} {"train_loss": -27.605234146118164, "global_step": 652882, "epoch": 7866} {"train_loss": -27.04151725769043, "global_step": 652883, "epoch": 7866} {"train_loss": -26.819860458374023, "global_step": 652884, "epoch": 7866} {"train_loss": -27.21115493774414, "global_step": 652885, "epoch": 7866} {"train_loss": -28.06167984008789, "global_step": 652886, "epoch": 7866} {"train_loss": -27.612567901611328, "global_step": 652887, "epoch": 7866} {"train_loss": -27.961078643798828, "global_step": 652888, "epoch": 7866} {"train_loss": -27.679595947265625, "global_step": 652889, "epoch": 7866} {"train_loss": -27.69970703125, "global_step": 652890, "epoch": 7866} {"train_loss": -27.479455947875977, "global_step": 652891, "epoch": 7866} {"train_loss": -28.32083511352539, "global_step": 652892, "epoch": 7866} {"train_loss": -27.982431411743164, "global_step": 652893, "epoch": 7866} {"train_loss": -27.83564567565918, "global_step": 652894, "epoch": 7866} {"train_loss": -28.073749542236328, "global_step": 652895, "epoch": 7866} {"train_loss": -28.05462646484375, "global_step": 652896, "epoch": 7866} {"train_loss": -27.983722686767578, "global_step": 652897, "epoch": 7866} {"train_loss": -27.843408584594727, "global_step": 652898, "epoch": 7866} {"train_loss": -28.023595809936523, "global_step": 652899, "epoch": 7866} {"train_loss": -28.123428344726562, "global_step": 652900, "epoch": 7866} {"train_loss": -28.0568790435791, "global_step": 652901, "epoch": 7866} {"train_loss": -28.2158145904541, "global_step": 652902, "epoch": 7866} {"train_loss": -28.170333862304688, "global_step": 652903, "epoch": 7866} {"train_loss": -28.327741622924805, "global_step": 652904, "epoch": 7866} {"train_loss": -28.08302116394043, "global_step": 652905, "epoch": 7866} {"train_loss": -28.17376136779785, "global_step": 652906, "epoch": 7866} {"train_loss": -27.9094181060791, "global_step": 652907, "epoch": 7866} {"train_loss": -28.323652267456055, "global_step": 652908, "epoch": 7866} {"train_loss": -28.71512222290039, "global_step": 652909, "epoch": 7866} {"train_loss": -28.27264976501465, "global_step": 652910, "epoch": 7866} {"train_loss": -28.407806396484375, "global_step": 652911, "epoch": 7866} {"train_loss": -28.49542236328125, "global_step": 652912, "epoch": 7866} {"train_loss": -28.1492862701416, "global_step": 652913, "epoch": 7866} {"train_loss": -28.3035831451416, "global_step": 652914, "epoch": 7866} {"train_loss": -28.58157730102539, "global_step": 652915, "epoch": 7866} {"train_loss": -28.857572555541992, "global_step": 652916, "epoch": 7866} {"train_loss": -28.29654312133789, "global_step": 652917, "epoch": 7866} {"train_loss": -28.01649284362793, "global_step": 652918, "epoch": 7866} {"train_loss": -28.444223403930664, "global_step": 652919, "epoch": 7866} {"train_loss": -28.484817504882812, "global_step": 652920, "epoch": 7866} {"train_loss": -28.304431915283203, "global_step": 652921, "epoch": 7866} {"train_loss": -28.568403244018555, "global_step": 652922, "epoch": 7866} {"train_loss": -28.533666610717773, "global_step": 652923, "epoch": 7866} {"train_loss": -28.330610275268555, "global_step": 652924, "epoch": 7866} {"train_loss": -28.2457332611084, "global_step": 652925, "epoch": 7866} {"train_loss": -28.112442016601562, "global_step": 652926, "epoch": 7866} {"train_loss": -27.359851837158203, "global_step": 652927, "epoch": 7866} {"train_loss": -27.135238647460938, "global_step": 652928, "epoch": 7866} {"train_loss": -26.6458797454834, "global_step": 652929, "epoch": 7866} {"train_loss": -27.019922256469727, "global_step": 652930, "epoch": 7866} {"train_loss": -28.2036075592041, "global_step": 652931, "epoch": 7866} {"train_loss": -27.65838623046875, "global_step": 652932, "epoch": 7866} {"train_loss": -28.1430721282959, "global_step": 652933, "epoch": 7866} {"train_loss": -28.08283042907715, "global_step": 652934, "epoch": 7866} {"train_loss": -27.2777042388916, "global_step": 652935, "epoch": 7866} {"train_loss": -27.039112091064453, "global_step": 652936, "epoch": 7866} {"train_loss": -28.41437339782715, "global_step": 652937, "epoch": 7866} {"train_loss": -27.615644454956055, "global_step": 652938, "epoch": 7866} {"train_loss": -27.651865005493164, "global_step": 652939, "epoch": 7866} {"train_loss": -28.104711532592773, "global_step": 652940, "epoch": 7866} {"train_loss": -28.1531982421875, "global_step": 652941, "epoch": 7866} {"train_loss": -28.492572784423828, "global_step": 652942, "epoch": 7866} {"train_loss": -28.15389060974121, "global_step": 652943, "epoch": 7866} {"train_loss": -28.0440616607666, "global_step": 652944, "epoch": 7866} {"train_loss": -28.337329864501953, "global_step": 652945, "epoch": 7866} {"train_loss": -28.208240509033203, "global_step": 652946, "epoch": 7866} {"train_loss": -28.116788864135742, "global_step": 652947, "epoch": 7866} {"train_loss": -28.0855770111084, "global_step": 652948, "epoch": 7866} {"train_loss": -28.2818660736084, "global_step": 652949, "epoch": 7866} {"train_loss": -27.90851402282715, "global_step": 652950, "epoch": 7866} {"train_loss": -28.22273063659668, "global_step": 652951, "epoch": 7866} {"train_loss": -28.267377853393555, "global_step": 652952, "epoch": 7866} {"train_loss": -28.090497970581055, "global_step": 652953, "epoch": 7866} {"train_loss": -28.27426528930664, "global_step": 652954, "epoch": 7866} {"train_loss": -27.9934024810791, "global_step": 652955, "epoch": 7866} {"train_loss": -28.3865966796875, "global_step": 652956, "epoch": 7866} {"train_loss": -28.42136001586914, "global_step": 652957, "epoch": 7866} {"train_loss": -28.569534301757812, "global_step": 652958, "epoch": 7866} {"train_loss": -28.18343162536621, "global_step": 652959, "epoch": 7866} {"train_loss": -28.054460249751447, "global_step": 652960, "epoch": 7866, "val_loss": 6598698.0} {"train_loss": -28.318988800048828, "global_step": 652961, "epoch": 7867} {"train_loss": -27.583480834960938, "global_step": 652962, "epoch": 7867} {"train_loss": -27.87421226501465, "global_step": 652963, "epoch": 7867} {"train_loss": -28.01639175415039, "global_step": 652964, "epoch": 7867} {"train_loss": -27.84124183654785, "global_step": 652965, "epoch": 7867} {"train_loss": -27.446569442749023, "global_step": 652966, "epoch": 7867} {"train_loss": -27.8637638092041, "global_step": 652967, "epoch": 7867} {"train_loss": -28.1352481842041, "global_step": 652968, "epoch": 7867} {"train_loss": -27.91153335571289, "global_step": 652969, "epoch": 7867} {"train_loss": -27.7669677734375, "global_step": 652970, "epoch": 7867} {"train_loss": -27.848281860351562, "global_step": 652971, "epoch": 7867} {"train_loss": -27.910125732421875, "global_step": 652972, "epoch": 7867} {"train_loss": -27.818145751953125, "global_step": 652973, "epoch": 7867} {"train_loss": -28.43951416015625, "global_step": 652974, "epoch": 7867} {"train_loss": -27.923023223876953, "global_step": 652975, "epoch": 7867} {"train_loss": -28.16126823425293, "global_step": 652976, "epoch": 7867} {"train_loss": -28.052534103393555, "global_step": 652977, "epoch": 7867} {"train_loss": -28.13180923461914, "global_step": 652978, "epoch": 7867} {"train_loss": -28.412628173828125, "global_step": 652979, "epoch": 7867} {"train_loss": -28.374069213867188, "global_step": 652980, "epoch": 7867} {"train_loss": -28.022565841674805, "global_step": 652981, "epoch": 7867} {"train_loss": -28.398534774780273, "global_step": 652982, "epoch": 7867} {"train_loss": -28.262908935546875, "global_step": 652983, "epoch": 7867} {"train_loss": -28.0660343170166, "global_step": 652984, "epoch": 7867} {"train_loss": -28.228246688842773, "global_step": 652985, "epoch": 7867} {"train_loss": -28.1204776763916, "global_step": 652986, "epoch": 7867} {"train_loss": -28.254602432250977, "global_step": 652987, "epoch": 7867} {"train_loss": -28.320764541625977, "global_step": 652988, "epoch": 7867} {"train_loss": -28.245885848999023, "global_step": 652989, "epoch": 7867} {"train_loss": -28.813337326049805, "global_step": 652990, "epoch": 7867} {"train_loss": -28.11045265197754, "global_step": 652991, "epoch": 7867} {"train_loss": -28.337890625, "global_step": 652992, "epoch": 7867} {"train_loss": -28.12978172302246, "global_step": 652993, "epoch": 7867} {"train_loss": -28.32501220703125, "global_step": 652994, "epoch": 7867} {"train_loss": -28.4403076171875, "global_step": 652995, "epoch": 7867} {"train_loss": -28.581195831298828, "global_step": 652996, "epoch": 7867} {"train_loss": -28.40778923034668, "global_step": 652997, "epoch": 7867} {"train_loss": -28.2924861907959, "global_step": 652998, "epoch": 7867} {"train_loss": -28.1190128326416, "global_step": 652999, "epoch": 7867} {"train_loss": -28.05524253845215, "global_step": 653000, "epoch": 7867} {"train_loss": -28.26731300354004, "global_step": 653001, "epoch": 7867} {"train_loss": -28.04953384399414, "global_step": 653002, "epoch": 7867} {"train_loss": -27.846704483032227, "global_step": 653003, "epoch": 7867} {"train_loss": -28.642541885375977, "global_step": 653004, "epoch": 7867} {"train_loss": -28.652236938476562, "global_step": 653005, "epoch": 7867} {"train_loss": -28.157154083251953, "global_step": 653006, "epoch": 7867} {"train_loss": -28.017261505126953, "global_step": 653007, "epoch": 7867} {"train_loss": -28.311132431030273, "global_step": 653008, "epoch": 7867} {"train_loss": -28.38787841796875, "global_step": 653009, "epoch": 7867} {"train_loss": -28.256534576416016, "global_step": 653010, "epoch": 7867} {"train_loss": -28.629474639892578, "global_step": 653011, "epoch": 7867} {"train_loss": -28.291961669921875, "global_step": 653012, "epoch": 7867} {"train_loss": -28.4017333984375, "global_step": 653013, "epoch": 7867} {"train_loss": -28.05756187438965, "global_step": 653014, "epoch": 7867} {"train_loss": -28.303457260131836, "global_step": 653015, "epoch": 7867} {"train_loss": -28.432470321655273, "global_step": 653016, "epoch": 7867} {"train_loss": -28.484643936157227, "global_step": 653017, "epoch": 7867} {"train_loss": -28.394994735717773, "global_step": 653018, "epoch": 7867} {"train_loss": -28.099384307861328, "global_step": 653019, "epoch": 7867} {"train_loss": -28.566797256469727, "global_step": 653020, "epoch": 7867} {"train_loss": -28.335111618041992, "global_step": 653021, "epoch": 7867} {"train_loss": -28.139877319335938, "global_step": 653022, "epoch": 7867} {"train_loss": -28.397863388061523, "global_step": 653023, "epoch": 7867} {"train_loss": -28.088642120361328, "global_step": 653024, "epoch": 7867} {"train_loss": -28.305952072143555, "global_step": 653025, "epoch": 7867} {"train_loss": -28.296606063842773, "global_step": 653026, "epoch": 7867} {"train_loss": -28.361974716186523, "global_step": 653027, "epoch": 7867} {"train_loss": -28.765233993530273, "global_step": 653028, "epoch": 7867} {"train_loss": -28.089557647705078, "global_step": 653029, "epoch": 7867} {"train_loss": -28.767126083374023, "global_step": 653030, "epoch": 7867} {"train_loss": -28.841100692749023, "global_step": 653031, "epoch": 7867} {"train_loss": -27.997365951538086, "global_step": 653032, "epoch": 7867} {"train_loss": -28.3557071685791, "global_step": 653033, "epoch": 7867} {"train_loss": -28.295135498046875, "global_step": 653034, "epoch": 7867} {"train_loss": -28.67133140563965, "global_step": 653035, "epoch": 7867} {"train_loss": -28.521753311157227, "global_step": 653036, "epoch": 7867} {"train_loss": -28.515399932861328, "global_step": 653037, "epoch": 7867} {"train_loss": -28.4427490234375, "global_step": 653038, "epoch": 7867} {"train_loss": -28.300424575805664, "global_step": 653039, "epoch": 7867} {"train_loss": -28.876386642456055, "global_step": 653040, "epoch": 7867} {"train_loss": -28.39761734008789, "global_step": 653041, "epoch": 7867} {"train_loss": -28.476404190063477, "global_step": 653042, "epoch": 7867} {"train_loss": -28.257233424359057, "global_step": 653043, "epoch": 7867, "val_loss": 6732458.5} {"train_loss": -27.431371688842773, "global_step": 653044, "epoch": 7868} {"train_loss": -27.117578506469727, "global_step": 653045, "epoch": 7868} {"train_loss": -26.73248863220215, "global_step": 653046, "epoch": 7868} {"train_loss": -25.82720947265625, "global_step": 653047, "epoch": 7868} {"train_loss": -25.66449546813965, "global_step": 653048, "epoch": 7868} {"train_loss": -26.660053253173828, "global_step": 653049, "epoch": 7868} {"train_loss": -27.753360748291016, "global_step": 653050, "epoch": 7868} {"train_loss": -26.842004776000977, "global_step": 653051, "epoch": 7868} {"train_loss": -27.059833526611328, "global_step": 653052, "epoch": 7868} {"train_loss": -27.503828048706055, "global_step": 653053, "epoch": 7868} {"train_loss": -27.449201583862305, "global_step": 653054, "epoch": 7868} {"train_loss": -27.87638282775879, "global_step": 653055, "epoch": 7868} {"train_loss": -27.50457763671875, "global_step": 653056, "epoch": 7868} {"train_loss": -27.88177490234375, "global_step": 653057, "epoch": 7868} {"train_loss": -27.55767250061035, "global_step": 653058, "epoch": 7868} {"train_loss": -27.807376861572266, "global_step": 653059, "epoch": 7868} {"train_loss": -27.80780601501465, "global_step": 653060, "epoch": 7868} {"train_loss": -27.870258331298828, "global_step": 653061, "epoch": 7868} {"train_loss": -27.85835838317871, "global_step": 653062, "epoch": 7868} {"train_loss": -27.976764678955078, "global_step": 653063, "epoch": 7868} {"train_loss": -28.12080192565918, "global_step": 653064, "epoch": 7868} {"train_loss": -28.059406280517578, "global_step": 653065, "epoch": 7868} {"train_loss": -28.24619483947754, "global_step": 653066, "epoch": 7868} {"train_loss": -28.010656356811523, "global_step": 653067, "epoch": 7868} {"train_loss": -28.012943267822266, "global_step": 653068, "epoch": 7868} {"train_loss": -28.20450782775879, "global_step": 653069, "epoch": 7868} {"train_loss": -28.249130249023438, "global_step": 653070, "epoch": 7868} {"train_loss": -28.369626998901367, "global_step": 653071, "epoch": 7868} {"train_loss": -28.1059627532959, "global_step": 653072, "epoch": 7868} {"train_loss": -27.863828659057617, "global_step": 653073, "epoch": 7868} {"train_loss": -28.185089111328125, "global_step": 653074, "epoch": 7868} {"train_loss": -28.307220458984375, "global_step": 653075, "epoch": 7868} {"train_loss": -27.850296020507812, "global_step": 653076, "epoch": 7868} {"train_loss": -28.118200302124023, "global_step": 653077, "epoch": 7868} {"train_loss": -28.274709701538086, "global_step": 653078, "epoch": 7868} {"train_loss": -28.271772384643555, "global_step": 653079, "epoch": 7868} {"train_loss": -28.3185977935791, "global_step": 653080, "epoch": 7868} {"train_loss": -28.193063735961914, "global_step": 653081, "epoch": 7868} {"train_loss": -28.207183837890625, "global_step": 653082, "epoch": 7868} {"train_loss": -27.88959312438965, "global_step": 653083, "epoch": 7868} {"train_loss": -28.60129165649414, "global_step": 653084, "epoch": 7868} {"train_loss": -28.350767135620117, "global_step": 653085, "epoch": 7868} {"train_loss": -28.31171989440918, "global_step": 653086, "epoch": 7868} {"train_loss": -28.338104248046875, "global_step": 653087, "epoch": 7868} {"train_loss": -28.502262115478516, "global_step": 653088, "epoch": 7868} {"train_loss": -28.211145401000977, "global_step": 653089, "epoch": 7868} {"train_loss": -28.24847412109375, "global_step": 653090, "epoch": 7868} {"train_loss": -28.546741485595703, "global_step": 653091, "epoch": 7868} {"train_loss": -28.518396377563477, "global_step": 653092, "epoch": 7868} {"train_loss": -28.500568389892578, "global_step": 653093, "epoch": 7868} {"train_loss": -28.6197452545166, "global_step": 653094, "epoch": 7868} {"train_loss": -28.4893856048584, "global_step": 653095, "epoch": 7868} {"train_loss": -28.2259578704834, "global_step": 653096, "epoch": 7868} {"train_loss": -28.62672233581543, "global_step": 653097, "epoch": 7868} {"train_loss": -28.567218780517578, "global_step": 653098, "epoch": 7868} {"train_loss": -28.465774536132812, "global_step": 653099, "epoch": 7868} {"train_loss": -28.455459594726562, "global_step": 653100, "epoch": 7868} {"train_loss": -28.340290069580078, "global_step": 653101, "epoch": 7868} {"train_loss": -28.258380889892578, "global_step": 653102, "epoch": 7868} {"train_loss": -28.33827018737793, "global_step": 653103, "epoch": 7868} {"train_loss": -28.323511123657227, "global_step": 653104, "epoch": 7868} {"train_loss": -28.140058517456055, "global_step": 653105, "epoch": 7868} {"train_loss": -28.376394271850586, "global_step": 653106, "epoch": 7868} {"train_loss": -28.2978572845459, "global_step": 653107, "epoch": 7868} {"train_loss": -28.47248649597168, "global_step": 653108, "epoch": 7868} {"train_loss": -28.433324813842773, "global_step": 653109, "epoch": 7868} {"train_loss": -28.52144432067871, "global_step": 653110, "epoch": 7868} {"train_loss": -28.28132438659668, "global_step": 653111, "epoch": 7868} {"train_loss": -28.269149780273438, "global_step": 653112, "epoch": 7868} {"train_loss": -28.207666397094727, "global_step": 653113, "epoch": 7868} {"train_loss": -28.298343658447266, "global_step": 653114, "epoch": 7868} {"train_loss": -28.429834365844727, "global_step": 653115, "epoch": 7868} {"train_loss": -28.473926544189453, "global_step": 653116, "epoch": 7868} {"train_loss": -28.374719619750977, "global_step": 653117, "epoch": 7868} {"train_loss": -28.221654891967773, "global_step": 653118, "epoch": 7868} {"train_loss": -28.04937744140625, "global_step": 653119, "epoch": 7868} {"train_loss": -27.969684600830078, "global_step": 653120, "epoch": 7868} {"train_loss": -27.800039291381836, "global_step": 653121, "epoch": 7868} {"train_loss": -27.71842384338379, "global_step": 653122, "epoch": 7868} {"train_loss": -27.564987182617188, "global_step": 653123, "epoch": 7868} {"train_loss": -28.154376983642578, "global_step": 653124, "epoch": 7868} {"train_loss": -27.73195457458496, "global_step": 653125, "epoch": 7868} {"train_loss": -28.011980815106128, "global_step": 653126, "epoch": 7868, "val_loss": 6720820.0} {"train_loss": -27.236785888671875, "global_step": 653127, "epoch": 7869} {"train_loss": -26.56882667541504, "global_step": 653128, "epoch": 7869} {"train_loss": -27.881711959838867, "global_step": 653129, "epoch": 7869} {"train_loss": -26.81625747680664, "global_step": 653130, "epoch": 7869} {"train_loss": -27.420591354370117, "global_step": 653131, "epoch": 7869} {"train_loss": -26.88840103149414, "global_step": 653132, "epoch": 7869} {"train_loss": -27.385156631469727, "global_step": 653133, "epoch": 7869} {"train_loss": -26.890949249267578, "global_step": 653134, "epoch": 7869} {"train_loss": -27.410058975219727, "global_step": 653135, "epoch": 7869} {"train_loss": -27.053863525390625, "global_step": 653136, "epoch": 7869} {"train_loss": -27.813934326171875, "global_step": 653137, "epoch": 7869} {"train_loss": -27.416540145874023, "global_step": 653138, "epoch": 7869} {"train_loss": -27.776336669921875, "global_step": 653139, "epoch": 7869} {"train_loss": -27.49899673461914, "global_step": 653140, "epoch": 7869} {"train_loss": -27.613142013549805, "global_step": 653141, "epoch": 7869} {"train_loss": -28.018035888671875, "global_step": 653142, "epoch": 7869} {"train_loss": -27.35043716430664, "global_step": 653143, "epoch": 7869} {"train_loss": -27.9692440032959, "global_step": 653144, "epoch": 7869} {"train_loss": -27.728729248046875, "global_step": 653145, "epoch": 7869} {"train_loss": -27.722028732299805, "global_step": 653146, "epoch": 7869} {"train_loss": -27.822040557861328, "global_step": 653147, "epoch": 7869} {"train_loss": -28.119306564331055, "global_step": 653148, "epoch": 7869} {"train_loss": -27.807605743408203, "global_step": 653149, "epoch": 7869} {"train_loss": -27.87967300415039, "global_step": 653150, "epoch": 7869} {"train_loss": -27.930206298828125, "global_step": 653151, "epoch": 7869} {"train_loss": -27.750934600830078, "global_step": 653152, "epoch": 7869} {"train_loss": -28.026874542236328, "global_step": 653153, "epoch": 7869} {"train_loss": -28.600988388061523, "global_step": 653154, "epoch": 7869} {"train_loss": -27.864599227905273, "global_step": 653155, "epoch": 7869} {"train_loss": -28.36091423034668, "global_step": 653156, "epoch": 7869} {"train_loss": -28.14485740661621, "global_step": 653157, "epoch": 7869} {"train_loss": -28.623090744018555, "global_step": 653158, "epoch": 7869} {"train_loss": -28.39240837097168, "global_step": 653159, "epoch": 7869} {"train_loss": -28.088361740112305, "global_step": 653160, "epoch": 7869} {"train_loss": -28.636444091796875, "global_step": 653161, "epoch": 7869} {"train_loss": -28.172285079956055, "global_step": 653162, "epoch": 7869} {"train_loss": -28.418354034423828, "global_step": 653163, "epoch": 7869} {"train_loss": -28.1644229888916, "global_step": 653164, "epoch": 7869} {"train_loss": -28.18219566345215, "global_step": 653165, "epoch": 7869} {"train_loss": -28.428211212158203, "global_step": 653166, "epoch": 7869} {"train_loss": -28.581018447875977, "global_step": 653167, "epoch": 7869} {"train_loss": -28.300268173217773, "global_step": 653168, "epoch": 7869} {"train_loss": -28.390186309814453, "global_step": 653169, "epoch": 7869} {"train_loss": -28.462942123413086, "global_step": 653170, "epoch": 7869} {"train_loss": -28.487659454345703, "global_step": 653171, "epoch": 7869} {"train_loss": -28.648778915405273, "global_step": 653172, "epoch": 7869} {"train_loss": -28.366357803344727, "global_step": 653173, "epoch": 7869} {"train_loss": -28.291784286499023, "global_step": 653174, "epoch": 7869} {"train_loss": -28.547016143798828, "global_step": 653175, "epoch": 7869} {"train_loss": -28.571699142456055, "global_step": 653176, "epoch": 7869} {"train_loss": -28.87972068786621, "global_step": 653177, "epoch": 7869} {"train_loss": -28.679044723510742, "global_step": 653178, "epoch": 7869} {"train_loss": -28.43560218811035, "global_step": 653179, "epoch": 7869} {"train_loss": -28.565603256225586, "global_step": 653180, "epoch": 7869} {"train_loss": -28.535144805908203, "global_step": 653181, "epoch": 7869} {"train_loss": -28.45636558532715, "global_step": 653182, "epoch": 7869} {"train_loss": -28.768951416015625, "global_step": 653183, "epoch": 7869} {"train_loss": -28.545324325561523, "global_step": 653184, "epoch": 7869} {"train_loss": -28.510385513305664, "global_step": 653185, "epoch": 7869} {"train_loss": -28.738691329956055, "global_step": 653186, "epoch": 7869} {"train_loss": -28.13691520690918, "global_step": 653187, "epoch": 7869} {"train_loss": -28.193811416625977, "global_step": 653188, "epoch": 7869} {"train_loss": -28.35957145690918, "global_step": 653189, "epoch": 7869} {"train_loss": -28.387298583984375, "global_step": 653190, "epoch": 7869} {"train_loss": -28.433874130249023, "global_step": 653191, "epoch": 7869} {"train_loss": -28.424728393554688, "global_step": 653192, "epoch": 7869} {"train_loss": -28.233884811401367, "global_step": 653193, "epoch": 7869} {"train_loss": -28.270877838134766, "global_step": 653194, "epoch": 7869} {"train_loss": -28.204025268554688, "global_step": 653195, "epoch": 7869} {"train_loss": -28.431278228759766, "global_step": 653196, "epoch": 7869} {"train_loss": -28.2585506439209, "global_step": 653197, "epoch": 7869} {"train_loss": -28.184003829956055, "global_step": 653198, "epoch": 7869} {"train_loss": -28.125213623046875, "global_step": 653199, "epoch": 7869} {"train_loss": -28.007740020751953, "global_step": 653200, "epoch": 7869} {"train_loss": -28.406599044799805, "global_step": 653201, "epoch": 7869} {"train_loss": -28.409698486328125, "global_step": 653202, "epoch": 7869} {"train_loss": -28.11931800842285, "global_step": 653203, "epoch": 7869} {"train_loss": -28.151098251342773, "global_step": 653204, "epoch": 7869} {"train_loss": -28.491470336914062, "global_step": 653205, "epoch": 7869} {"train_loss": -28.5783748626709, "global_step": 653206, "epoch": 7869} {"train_loss": -28.421674728393555, "global_step": 653207, "epoch": 7869} {"train_loss": -28.545475006103516, "global_step": 653208, "epoch": 7869} {"train_loss": -28.123550139277814, "global_step": 653209, "epoch": 7869, "val_loss": 6702419.5} {"train_loss": -27.089365005493164, "global_step": 653210, "epoch": 7870} {"train_loss": -26.90225601196289, "global_step": 653211, "epoch": 7870} {"train_loss": -28.12887954711914, "global_step": 653212, "epoch": 7870} {"train_loss": -27.48504638671875, "global_step": 653213, "epoch": 7870} {"train_loss": -27.345930099487305, "global_step": 653214, "epoch": 7870} {"train_loss": -27.995025634765625, "global_step": 653215, "epoch": 7870} {"train_loss": -27.792821884155273, "global_step": 653216, "epoch": 7870} {"train_loss": -27.405485153198242, "global_step": 653217, "epoch": 7870} {"train_loss": -27.458393096923828, "global_step": 653218, "epoch": 7870} {"train_loss": -27.826171875, "global_step": 653219, "epoch": 7870} {"train_loss": -27.40433120727539, "global_step": 653220, "epoch": 7870} {"train_loss": -27.5405216217041, "global_step": 653221, "epoch": 7870} {"train_loss": -27.60345458984375, "global_step": 653222, "epoch": 7870} {"train_loss": -27.81513786315918, "global_step": 653223, "epoch": 7870} {"train_loss": -27.99592399597168, "global_step": 653224, "epoch": 7870} {"train_loss": -27.79176139831543, "global_step": 653225, "epoch": 7870} {"train_loss": -27.92474937438965, "global_step": 653226, "epoch": 7870} {"train_loss": -27.679309844970703, "global_step": 653227, "epoch": 7870} {"train_loss": -27.819385528564453, "global_step": 653228, "epoch": 7870} {"train_loss": -27.81817626953125, "global_step": 653229, "epoch": 7870} {"train_loss": -28.032989501953125, "global_step": 653230, "epoch": 7870} {"train_loss": -28.183629989624023, "global_step": 653231, "epoch": 7870} {"train_loss": -28.2408390045166, "global_step": 653232, "epoch": 7870} {"train_loss": -27.823272705078125, "global_step": 653233, "epoch": 7870} {"train_loss": -28.15152931213379, "global_step": 653234, "epoch": 7870} {"train_loss": -28.368444442749023, "global_step": 653235, "epoch": 7870} {"train_loss": -28.01789665222168, "global_step": 653236, "epoch": 7870} {"train_loss": -27.882190704345703, "global_step": 653237, "epoch": 7870} {"train_loss": -27.951757431030273, "global_step": 653238, "epoch": 7870} {"train_loss": -28.115461349487305, "global_step": 653239, "epoch": 7870} {"train_loss": -28.322509765625, "global_step": 653240, "epoch": 7870} {"train_loss": -28.484418869018555, "global_step": 653241, "epoch": 7870} {"train_loss": -27.932331085205078, "global_step": 653242, "epoch": 7870} {"train_loss": -28.302265167236328, "global_step": 653243, "epoch": 7870} {"train_loss": -28.373727798461914, "global_step": 653244, "epoch": 7870} {"train_loss": -28.61733055114746, "global_step": 653245, "epoch": 7870} {"train_loss": -28.10080909729004, "global_step": 653246, "epoch": 7870} {"train_loss": -28.014209747314453, "global_step": 653247, "epoch": 7870} {"train_loss": -28.395477294921875, "global_step": 653248, "epoch": 7870} {"train_loss": -28.391225814819336, "global_step": 653249, "epoch": 7870} {"train_loss": -28.05213737487793, "global_step": 653250, "epoch": 7870} {"train_loss": -28.19122886657715, "global_step": 653251, "epoch": 7870} {"train_loss": -28.15626335144043, "global_step": 653252, "epoch": 7870} {"train_loss": -28.364383697509766, "global_step": 653253, "epoch": 7870} {"train_loss": -28.370412826538086, "global_step": 653254, "epoch": 7870} {"train_loss": -28.068115234375, "global_step": 653255, "epoch": 7870} {"train_loss": -28.318653106689453, "global_step": 653256, "epoch": 7870} {"train_loss": -28.607126235961914, "global_step": 653257, "epoch": 7870} {"train_loss": -27.977161407470703, "global_step": 653258, "epoch": 7870} {"train_loss": -28.288793563842773, "global_step": 653259, "epoch": 7870} {"train_loss": -28.571813583374023, "global_step": 653260, "epoch": 7870} {"train_loss": -28.379491806030273, "global_step": 653261, "epoch": 7870} {"train_loss": -28.2713680267334, "global_step": 653262, "epoch": 7870} {"train_loss": -28.736835479736328, "global_step": 653263, "epoch": 7870} {"train_loss": -28.116012573242188, "global_step": 653264, "epoch": 7870} {"train_loss": -28.414270401000977, "global_step": 653265, "epoch": 7870} {"train_loss": -28.577600479125977, "global_step": 653266, "epoch": 7870} {"train_loss": -28.335514068603516, "global_step": 653267, "epoch": 7870} {"train_loss": -28.266315460205078, "global_step": 653268, "epoch": 7870} {"train_loss": -28.4660701751709, "global_step": 653269, "epoch": 7870} {"train_loss": -28.372695922851562, "global_step": 653270, "epoch": 7870} {"train_loss": -28.631275177001953, "global_step": 653271, "epoch": 7870} {"train_loss": -28.44185447692871, "global_step": 653272, "epoch": 7870} {"train_loss": -28.32940101623535, "global_step": 653273, "epoch": 7870} {"train_loss": -28.108264923095703, "global_step": 653274, "epoch": 7870} {"train_loss": -28.239179611206055, "global_step": 653275, "epoch": 7870} {"train_loss": -28.486591339111328, "global_step": 653276, "epoch": 7870} {"train_loss": -28.269987106323242, "global_step": 653277, "epoch": 7870} {"train_loss": -28.43482780456543, "global_step": 653278, "epoch": 7870} {"train_loss": -27.872888565063477, "global_step": 653279, "epoch": 7870} {"train_loss": -28.867938995361328, "global_step": 653280, "epoch": 7870} {"train_loss": -28.36322593688965, "global_step": 653281, "epoch": 7870} {"train_loss": -28.21253776550293, "global_step": 653282, "epoch": 7870} {"train_loss": -28.643115997314453, "global_step": 653283, "epoch": 7870} {"train_loss": -28.056543350219727, "global_step": 653284, "epoch": 7870} {"train_loss": -27.9443302154541, "global_step": 653285, "epoch": 7870} {"train_loss": -28.49057388305664, "global_step": 653286, "epoch": 7870} {"train_loss": -28.048858642578125, "global_step": 653287, "epoch": 7870} {"train_loss": -28.341699600219727, "global_step": 653288, "epoch": 7870} {"train_loss": -28.391584396362305, "global_step": 653289, "epoch": 7870} {"train_loss": -28.437265396118164, "global_step": 653290, "epoch": 7870} {"train_loss": -28.11545181274414, "global_step": 653291, "epoch": 7870} {"train_loss": -28.137775421142578, "global_step": 653292, "epoch": 7870, "val_loss": 6683033.5} {"train_loss": -23.75330352783203, "global_step": 653293, "epoch": 7871} {"train_loss": -21.842361450195312, "global_step": 653294, "epoch": 7871} {"train_loss": -24.411649703979492, "global_step": 653295, "epoch": 7871} {"train_loss": -23.3796443939209, "global_step": 653296, "epoch": 7871} {"train_loss": -25.93985366821289, "global_step": 653297, "epoch": 7871} {"train_loss": -25.247045516967773, "global_step": 653298, "epoch": 7871} {"train_loss": -25.752721786499023, "global_step": 653299, "epoch": 7871} {"train_loss": -26.246002197265625, "global_step": 653300, "epoch": 7871} {"train_loss": -26.291173934936523, "global_step": 653301, "epoch": 7871} {"train_loss": -26.215116500854492, "global_step": 653302, "epoch": 7871} {"train_loss": -26.539020538330078, "global_step": 653303, "epoch": 7871} {"train_loss": -27.010465621948242, "global_step": 653304, "epoch": 7871} {"train_loss": -26.71832847595215, "global_step": 653305, "epoch": 7871} {"train_loss": -26.96051025390625, "global_step": 653306, "epoch": 7871} {"train_loss": -26.912933349609375, "global_step": 653307, "epoch": 7871} {"train_loss": -26.75032615661621, "global_step": 653308, "epoch": 7871} {"train_loss": -26.908777236938477, "global_step": 653309, "epoch": 7871} {"train_loss": -27.119394302368164, "global_step": 653310, "epoch": 7871} {"train_loss": -26.952402114868164, "global_step": 653311, "epoch": 7871} {"train_loss": -27.01099967956543, "global_step": 653312, "epoch": 7871} {"train_loss": -26.526281356811523, "global_step": 653313, "epoch": 7871} {"train_loss": -27.164264678955078, "global_step": 653314, "epoch": 7871} {"train_loss": -27.157306671142578, "global_step": 653315, "epoch": 7871} {"train_loss": -27.166202545166016, "global_step": 653316, "epoch": 7871} {"train_loss": -27.509679794311523, "global_step": 653317, "epoch": 7871} {"train_loss": -27.3785343170166, "global_step": 653318, "epoch": 7871} {"train_loss": -27.303913116455078, "global_step": 653319, "epoch": 7871} {"train_loss": -27.25605583190918, "global_step": 653320, "epoch": 7871} {"train_loss": -27.345361709594727, "global_step": 653321, "epoch": 7871} {"train_loss": -27.367603302001953, "global_step": 653322, "epoch": 7871} {"train_loss": -27.256805419921875, "global_step": 653323, "epoch": 7871} {"train_loss": -27.612201690673828, "global_step": 653324, "epoch": 7871} {"train_loss": -27.468463897705078, "global_step": 653325, "epoch": 7871} {"train_loss": -27.3082332611084, "global_step": 653326, "epoch": 7871} {"train_loss": -27.433380126953125, "global_step": 653327, "epoch": 7871} {"train_loss": -27.243515014648438, "global_step": 653328, "epoch": 7871} {"train_loss": -27.458099365234375, "global_step": 653329, "epoch": 7871} {"train_loss": -27.65424156188965, "global_step": 653330, "epoch": 7871} {"train_loss": -27.715469360351562, "global_step": 653331, "epoch": 7871} {"train_loss": -27.46933937072754, "global_step": 653332, "epoch": 7871} {"train_loss": -28.053653717041016, "global_step": 653333, "epoch": 7871} {"train_loss": -27.858539581298828, "global_step": 653334, "epoch": 7871} {"train_loss": -27.955530166625977, "global_step": 653335, "epoch": 7871} {"train_loss": -27.71746826171875, "global_step": 653336, "epoch": 7871} {"train_loss": -27.81037712097168, "global_step": 653337, "epoch": 7871} {"train_loss": -27.969573974609375, "global_step": 653338, "epoch": 7871} {"train_loss": -27.8525390625, "global_step": 653339, "epoch": 7871} {"train_loss": -27.766950607299805, "global_step": 653340, "epoch": 7871} {"train_loss": -27.766462326049805, "global_step": 653341, "epoch": 7871} {"train_loss": -27.95428466796875, "global_step": 653342, "epoch": 7871} {"train_loss": -28.03449058532715, "global_step": 653343, "epoch": 7871} {"train_loss": -28.637540817260742, "global_step": 653344, "epoch": 7871} {"train_loss": -27.734893798828125, "global_step": 653345, "epoch": 7871} {"train_loss": -28.198184967041016, "global_step": 653346, "epoch": 7871} {"train_loss": -28.0791015625, "global_step": 653347, "epoch": 7871} {"train_loss": -28.00286293029785, "global_step": 653348, "epoch": 7871} {"train_loss": -28.41973304748535, "global_step": 653349, "epoch": 7871} {"train_loss": -28.493356704711914, "global_step": 653350, "epoch": 7871} {"train_loss": -28.222152709960938, "global_step": 653351, "epoch": 7871} {"train_loss": -28.431432723999023, "global_step": 653352, "epoch": 7871} {"train_loss": -28.49382972717285, "global_step": 653353, "epoch": 7871} {"train_loss": -28.584325790405273, "global_step": 653354, "epoch": 7871} {"train_loss": -28.71783447265625, "global_step": 653355, "epoch": 7871} {"train_loss": -28.361677169799805, "global_step": 653356, "epoch": 7871} {"train_loss": -28.86590576171875, "global_step": 653357, "epoch": 7871} {"train_loss": -28.65234375, "global_step": 653358, "epoch": 7871} {"train_loss": -28.277265548706055, "global_step": 653359, "epoch": 7871} {"train_loss": -28.6524715423584, "global_step": 653360, "epoch": 7871} {"train_loss": -28.340280532836914, "global_step": 653361, "epoch": 7871} {"train_loss": -27.961746215820312, "global_step": 653362, "epoch": 7871} {"train_loss": -28.105939865112305, "global_step": 653363, "epoch": 7871} {"train_loss": -27.985273361206055, "global_step": 653364, "epoch": 7871} {"train_loss": -28.24440574645996, "global_step": 653365, "epoch": 7871} {"train_loss": -27.858428955078125, "global_step": 653366, "epoch": 7871} {"train_loss": -28.509063720703125, "global_step": 653367, "epoch": 7871} {"train_loss": -28.42740249633789, "global_step": 653368, "epoch": 7871} {"train_loss": -28.20688819885254, "global_step": 653369, "epoch": 7871} {"train_loss": -28.127166748046875, "global_step": 653370, "epoch": 7871} {"train_loss": -27.976490020751953, "global_step": 653371, "epoch": 7871} {"train_loss": -27.806396484375, "global_step": 653372, "epoch": 7871} {"train_loss": -28.00726890563965, "global_step": 653373, "epoch": 7871} {"train_loss": -28.107757568359375, "global_step": 653374, "epoch": 7871} {"train_loss": -27.431498378156178, "global_step": 653375, "epoch": 7871, "val_loss": 6710135.0} {"train_loss": -27.961288452148438, "global_step": 653376, "epoch": 7872} {"train_loss": -27.5450496673584, "global_step": 653377, "epoch": 7872} {"train_loss": -27.65931510925293, "global_step": 653378, "epoch": 7872} {"train_loss": -27.5965576171875, "global_step": 653379, "epoch": 7872} {"train_loss": -28.343488693237305, "global_step": 653380, "epoch": 7872} {"train_loss": -27.560514450073242, "global_step": 653381, "epoch": 7872} {"train_loss": -27.727949142456055, "global_step": 653382, "epoch": 7872} {"train_loss": -28.03435707092285, "global_step": 653383, "epoch": 7872} {"train_loss": -27.709491729736328, "global_step": 653384, "epoch": 7872} {"train_loss": -28.25198745727539, "global_step": 653385, "epoch": 7872} {"train_loss": -27.87738609313965, "global_step": 653386, "epoch": 7872} {"train_loss": -28.047021865844727, "global_step": 653387, "epoch": 7872} {"train_loss": -28.015522003173828, "global_step": 653388, "epoch": 7872} {"train_loss": -28.150705337524414, "global_step": 653389, "epoch": 7872} {"train_loss": -28.13555335998535, "global_step": 653390, "epoch": 7872} {"train_loss": -28.050521850585938, "global_step": 653391, "epoch": 7872} {"train_loss": -28.08563804626465, "global_step": 653392, "epoch": 7872} {"train_loss": -28.38245964050293, "global_step": 653393, "epoch": 7872} {"train_loss": -27.962051391601562, "global_step": 653394, "epoch": 7872} {"train_loss": -28.427825927734375, "global_step": 653395, "epoch": 7872} {"train_loss": -28.4154109954834, "global_step": 653396, "epoch": 7872} {"train_loss": -28.505645751953125, "global_step": 653397, "epoch": 7872} {"train_loss": -28.353321075439453, "global_step": 653398, "epoch": 7872} {"train_loss": -28.336206436157227, "global_step": 653399, "epoch": 7872} {"train_loss": -28.16367530822754, "global_step": 653400, "epoch": 7872} {"train_loss": -28.072202682495117, "global_step": 653401, "epoch": 7872} {"train_loss": -28.030200958251953, "global_step": 653402, "epoch": 7872} {"train_loss": -28.5859317779541, "global_step": 653403, "epoch": 7872} {"train_loss": -28.486572265625, "global_step": 653404, "epoch": 7872} {"train_loss": -28.45892333984375, "global_step": 653405, "epoch": 7872} {"train_loss": -28.044879913330078, "global_step": 653406, "epoch": 7872} {"train_loss": -28.62184715270996, "global_step": 653407, "epoch": 7872} {"train_loss": -28.065000534057617, "global_step": 653408, "epoch": 7872} {"train_loss": -28.377973556518555, "global_step": 653409, "epoch": 7872} {"train_loss": -28.72478675842285, "global_step": 653410, "epoch": 7872} {"train_loss": -28.8688907623291, "global_step": 653411, "epoch": 7872} {"train_loss": -28.398290634155273, "global_step": 653412, "epoch": 7872} {"train_loss": -28.56654167175293, "global_step": 653413, "epoch": 7872} {"train_loss": -28.15229606628418, "global_step": 653414, "epoch": 7872} {"train_loss": -28.3897705078125, "global_step": 653415, "epoch": 7872} {"train_loss": -28.287763595581055, "global_step": 653416, "epoch": 7872} {"train_loss": -28.344091415405273, "global_step": 653417, "epoch": 7872} {"train_loss": -28.587432861328125, "global_step": 653418, "epoch": 7872} {"train_loss": -28.730194091796875, "global_step": 653419, "epoch": 7872} {"train_loss": -28.372089385986328, "global_step": 653420, "epoch": 7872} {"train_loss": -28.570648193359375, "global_step": 653421, "epoch": 7872} {"train_loss": -28.443368911743164, "global_step": 653422, "epoch": 7872} {"train_loss": -28.379016876220703, "global_step": 653423, "epoch": 7872} {"train_loss": -28.455976486206055, "global_step": 653424, "epoch": 7872} {"train_loss": -28.524229049682617, "global_step": 653425, "epoch": 7872} {"train_loss": -28.8419189453125, "global_step": 653426, "epoch": 7872} {"train_loss": -28.537109375, "global_step": 653427, "epoch": 7872} {"train_loss": -28.254362106323242, "global_step": 653428, "epoch": 7872} {"train_loss": -28.638635635375977, "global_step": 653429, "epoch": 7872} {"train_loss": -28.58103370666504, "global_step": 653430, "epoch": 7872} {"train_loss": -28.761083602905273, "global_step": 653431, "epoch": 7872} {"train_loss": -28.0428466796875, "global_step": 653432, "epoch": 7872} {"train_loss": -28.501983642578125, "global_step": 653433, "epoch": 7872} {"train_loss": -28.66758155822754, "global_step": 653434, "epoch": 7872} {"train_loss": -28.89869499206543, "global_step": 653435, "epoch": 7872} {"train_loss": -28.497793197631836, "global_step": 653436, "epoch": 7872} {"train_loss": -28.48921012878418, "global_step": 653437, "epoch": 7872} {"train_loss": -28.16750144958496, "global_step": 653438, "epoch": 7872} {"train_loss": -28.425739288330078, "global_step": 653439, "epoch": 7872} {"train_loss": -28.6234130859375, "global_step": 653440, "epoch": 7872} {"train_loss": -28.28908348083496, "global_step": 653441, "epoch": 7872} {"train_loss": -28.329822540283203, "global_step": 653442, "epoch": 7872} {"train_loss": -27.816205978393555, "global_step": 653443, "epoch": 7872} {"train_loss": -28.092443466186523, "global_step": 653444, "epoch": 7872} {"train_loss": -28.194177627563477, "global_step": 653445, "epoch": 7872} {"train_loss": -28.812255859375, "global_step": 653446, "epoch": 7872} {"train_loss": -28.32908058166504, "global_step": 653447, "epoch": 7872} {"train_loss": -27.841394424438477, "global_step": 653448, "epoch": 7872} {"train_loss": -28.152509689331055, "global_step": 653449, "epoch": 7872} {"train_loss": -27.851720809936523, "global_step": 653450, "epoch": 7872} {"train_loss": -27.782346725463867, "global_step": 653451, "epoch": 7872} {"train_loss": -27.44596290588379, "global_step": 653452, "epoch": 7872} {"train_loss": -28.23028564453125, "global_step": 653453, "epoch": 7872} {"train_loss": -28.23224449157715, "global_step": 653454, "epoch": 7872} {"train_loss": -28.1927433013916, "global_step": 653455, "epoch": 7872} {"train_loss": -28.00636863708496, "global_step": 653456, "epoch": 7872} {"train_loss": -28.210912704467773, "global_step": 653457, "epoch": 7872} {"train_loss": -28.25501044399767, "global_step": 653458, "epoch": 7872, "val_loss": 6706512.5} {"train_loss": -26.33957290649414, "global_step": 653459, "epoch": 7873} {"train_loss": -26.88421630859375, "global_step": 653460, "epoch": 7873} {"train_loss": -27.34954833984375, "global_step": 653461, "epoch": 7873} {"train_loss": -27.82020378112793, "global_step": 653462, "epoch": 7873} {"train_loss": -27.264179229736328, "global_step": 653463, "epoch": 7873} {"train_loss": -27.897428512573242, "global_step": 653464, "epoch": 7873} {"train_loss": -27.237958908081055, "global_step": 653465, "epoch": 7873} {"train_loss": -27.153289794921875, "global_step": 653466, "epoch": 7873} {"train_loss": -27.46845054626465, "global_step": 653467, "epoch": 7873} {"train_loss": -26.997827529907227, "global_step": 653468, "epoch": 7873} {"train_loss": -27.565420150756836, "global_step": 653469, "epoch": 7873} {"train_loss": -27.86976432800293, "global_step": 653470, "epoch": 7873} {"train_loss": -27.38543701171875, "global_step": 653471, "epoch": 7873} {"train_loss": -27.837942123413086, "global_step": 653472, "epoch": 7873} {"train_loss": -27.78995132446289, "global_step": 653473, "epoch": 7873} {"train_loss": -27.72307777404785, "global_step": 653474, "epoch": 7873} {"train_loss": -27.81439781188965, "global_step": 653475, "epoch": 7873} {"train_loss": -27.913990020751953, "global_step": 653476, "epoch": 7873} {"train_loss": -28.05763053894043, "global_step": 653477, "epoch": 7873} {"train_loss": -27.745574951171875, "global_step": 653478, "epoch": 7873} {"train_loss": -28.063528060913086, "global_step": 653479, "epoch": 7873} {"train_loss": -27.821744918823242, "global_step": 653480, "epoch": 7873} {"train_loss": -28.31928825378418, "global_step": 653481, "epoch": 7873} {"train_loss": -28.08734130859375, "global_step": 653482, "epoch": 7873} {"train_loss": -27.95539665222168, "global_step": 653483, "epoch": 7873} {"train_loss": -28.234994888305664, "global_step": 653484, "epoch": 7873} {"train_loss": -28.437122344970703, "global_step": 653485, "epoch": 7873} {"train_loss": -28.278766632080078, "global_step": 653486, "epoch": 7873} {"train_loss": -28.39824867248535, "global_step": 653487, "epoch": 7873} {"train_loss": -27.965469360351562, "global_step": 653488, "epoch": 7873} {"train_loss": -27.918188095092773, "global_step": 653489, "epoch": 7873} {"train_loss": -28.50510025024414, "global_step": 653490, "epoch": 7873} {"train_loss": -28.393463134765625, "global_step": 653491, "epoch": 7873} {"train_loss": -28.55714225769043, "global_step": 653492, "epoch": 7873} {"train_loss": -28.291662216186523, "global_step": 653493, "epoch": 7873} {"train_loss": -28.439590454101562, "global_step": 653494, "epoch": 7873} {"train_loss": -28.507307052612305, "global_step": 653495, "epoch": 7873} {"train_loss": -27.985803604125977, "global_step": 653496, "epoch": 7873} {"train_loss": -28.01862907409668, "global_step": 653497, "epoch": 7873} {"train_loss": -28.13958168029785, "global_step": 653498, "epoch": 7873} {"train_loss": -28.51492691040039, "global_step": 653499, "epoch": 7873} {"train_loss": -28.084308624267578, "global_step": 653500, "epoch": 7873} {"train_loss": -28.222013473510742, "global_step": 653501, "epoch": 7873} {"train_loss": -28.746774673461914, "global_step": 653502, "epoch": 7873} {"train_loss": -28.30640983581543, "global_step": 653503, "epoch": 7873} {"train_loss": -28.38923454284668, "global_step": 653504, "epoch": 7873} {"train_loss": -28.578710556030273, "global_step": 653505, "epoch": 7873} {"train_loss": -28.647184371948242, "global_step": 653506, "epoch": 7873} {"train_loss": -27.81308364868164, "global_step": 653507, "epoch": 7873} {"train_loss": -28.0892391204834, "global_step": 653508, "epoch": 7873} {"train_loss": -28.679157257080078, "global_step": 653509, "epoch": 7873} {"train_loss": -28.06438636779785, "global_step": 653510, "epoch": 7873} {"train_loss": -28.0085391998291, "global_step": 653511, "epoch": 7873} {"train_loss": -28.14106559753418, "global_step": 653512, "epoch": 7873} {"train_loss": -28.720609664916992, "global_step": 653513, "epoch": 7873} {"train_loss": -28.650970458984375, "global_step": 653514, "epoch": 7873} {"train_loss": -28.287494659423828, "global_step": 653515, "epoch": 7873} {"train_loss": -28.4383487701416, "global_step": 653516, "epoch": 7873} {"train_loss": -28.295944213867188, "global_step": 653517, "epoch": 7873} {"train_loss": -28.45387077331543, "global_step": 653518, "epoch": 7873} {"train_loss": -28.156660079956055, "global_step": 653519, "epoch": 7873} {"train_loss": -28.35578727722168, "global_step": 653520, "epoch": 7873} {"train_loss": -28.4007511138916, "global_step": 653521, "epoch": 7873} {"train_loss": -28.254316329956055, "global_step": 653522, "epoch": 7873} {"train_loss": -28.073266983032227, "global_step": 653523, "epoch": 7873} {"train_loss": -27.871076583862305, "global_step": 653524, "epoch": 7873} {"train_loss": -28.4416446685791, "global_step": 653525, "epoch": 7873} {"train_loss": -28.3043212890625, "global_step": 653526, "epoch": 7873} {"train_loss": -28.427213668823242, "global_step": 653527, "epoch": 7873} {"train_loss": -28.660797119140625, "global_step": 653528, "epoch": 7873} {"train_loss": -28.19089698791504, "global_step": 653529, "epoch": 7873} {"train_loss": -28.084745407104492, "global_step": 653530, "epoch": 7873} {"train_loss": -28.522525787353516, "global_step": 653531, "epoch": 7873} {"train_loss": -28.32696533203125, "global_step": 653532, "epoch": 7873} {"train_loss": -28.656171798706055, "global_step": 653533, "epoch": 7873} {"train_loss": -28.499267578125, "global_step": 653534, "epoch": 7873} {"train_loss": -28.50691032409668, "global_step": 653535, "epoch": 7873} {"train_loss": -28.43798828125, "global_step": 653536, "epoch": 7873} {"train_loss": -28.4893741607666, "global_step": 653537, "epoch": 7873} {"train_loss": -28.443140029907227, "global_step": 653538, "epoch": 7873} {"train_loss": -28.409870147705078, "global_step": 653539, "epoch": 7873} {"train_loss": -28.219518661499023, "global_step": 653540, "epoch": 7873} {"train_loss": -28.102493010371564, "global_step": 653541, "epoch": 7873, "val_loss": 6709411.0} {"train_loss": -27.61376953125, "global_step": 653542, "epoch": 7874} {"train_loss": -26.70562171936035, "global_step": 653543, "epoch": 7874} {"train_loss": -25.774158477783203, "global_step": 653544, "epoch": 7874} {"train_loss": -26.348865509033203, "global_step": 653545, "epoch": 7874} {"train_loss": -27.33204460144043, "global_step": 653546, "epoch": 7874} {"train_loss": -26.48495864868164, "global_step": 653547, "epoch": 7874} {"train_loss": -26.958206176757812, "global_step": 653548, "epoch": 7874} {"train_loss": -27.089801788330078, "global_step": 653549, "epoch": 7874} {"train_loss": -27.56436538696289, "global_step": 653550, "epoch": 7874} {"train_loss": -27.869247436523438, "global_step": 653551, "epoch": 7874} {"train_loss": -27.660358428955078, "global_step": 653552, "epoch": 7874} {"train_loss": -27.472003936767578, "global_step": 653553, "epoch": 7874} {"train_loss": -27.802839279174805, "global_step": 653554, "epoch": 7874} {"train_loss": -27.7415828704834, "global_step": 653555, "epoch": 7874} {"train_loss": -27.818078994750977, "global_step": 653556, "epoch": 7874} {"train_loss": -27.590478897094727, "global_step": 653557, "epoch": 7874} {"train_loss": -27.649145126342773, "global_step": 653558, "epoch": 7874} {"train_loss": -27.868505477905273, "global_step": 653559, "epoch": 7874} {"train_loss": -27.740509033203125, "global_step": 653560, "epoch": 7874} {"train_loss": -27.957244873046875, "global_step": 653561, "epoch": 7874} {"train_loss": -27.762929916381836, "global_step": 653562, "epoch": 7874} {"train_loss": -27.669172286987305, "global_step": 653563, "epoch": 7874} {"train_loss": -27.86813735961914, "global_step": 653564, "epoch": 7874} {"train_loss": -28.062744140625, "global_step": 653565, "epoch": 7874} {"train_loss": -28.23798179626465, "global_step": 653566, "epoch": 7874} {"train_loss": -28.070972442626953, "global_step": 653567, "epoch": 7874} {"train_loss": -28.131635665893555, "global_step": 653568, "epoch": 7874} {"train_loss": -28.2552433013916, "global_step": 653569, "epoch": 7874} {"train_loss": -28.02069091796875, "global_step": 653570, "epoch": 7874} {"train_loss": -28.11555290222168, "global_step": 653571, "epoch": 7874} {"train_loss": -28.32197380065918, "global_step": 653572, "epoch": 7874} {"train_loss": -28.099029541015625, "global_step": 653573, "epoch": 7874} {"train_loss": -28.041837692260742, "global_step": 653574, "epoch": 7874} {"train_loss": -28.275861740112305, "global_step": 653575, "epoch": 7874} {"train_loss": -28.631885528564453, "global_step": 653576, "epoch": 7874} {"train_loss": -28.069427490234375, "global_step": 653577, "epoch": 7874} {"train_loss": -28.238815307617188, "global_step": 653578, "epoch": 7874} {"train_loss": -28.309894561767578, "global_step": 653579, "epoch": 7874} {"train_loss": -28.285873413085938, "global_step": 653580, "epoch": 7874} {"train_loss": -28.31021499633789, "global_step": 653581, "epoch": 7874} {"train_loss": -28.376102447509766, "global_step": 653582, "epoch": 7874} {"train_loss": -28.21478843688965, "global_step": 653583, "epoch": 7874} {"train_loss": -28.102542877197266, "global_step": 653584, "epoch": 7874} {"train_loss": -28.63214683532715, "global_step": 653585, "epoch": 7874} {"train_loss": -28.59943962097168, "global_step": 653586, "epoch": 7874} {"train_loss": -28.453784942626953, "global_step": 653587, "epoch": 7874} {"train_loss": -28.296844482421875, "global_step": 653588, "epoch": 7874} {"train_loss": -28.78999900817871, "global_step": 653589, "epoch": 7874} {"train_loss": -28.36964225769043, "global_step": 653590, "epoch": 7874} {"train_loss": -28.413503646850586, "global_step": 653591, "epoch": 7874} {"train_loss": -28.39284324645996, "global_step": 653592, "epoch": 7874} {"train_loss": -28.672407150268555, "global_step": 653593, "epoch": 7874} {"train_loss": -28.627506256103516, "global_step": 653594, "epoch": 7874} {"train_loss": -28.174224853515625, "global_step": 653595, "epoch": 7874} {"train_loss": -28.17022132873535, "global_step": 653596, "epoch": 7874} {"train_loss": -28.53937339782715, "global_step": 653597, "epoch": 7874} {"train_loss": -28.272327423095703, "global_step": 653598, "epoch": 7874} {"train_loss": -28.30124282836914, "global_step": 653599, "epoch": 7874} {"train_loss": -28.071990966796875, "global_step": 653600, "epoch": 7874} {"train_loss": -27.920080184936523, "global_step": 653601, "epoch": 7874} {"train_loss": -28.50640869140625, "global_step": 653602, "epoch": 7874} {"train_loss": -27.766016006469727, "global_step": 653603, "epoch": 7874} {"train_loss": -28.293628692626953, "global_step": 653604, "epoch": 7874} {"train_loss": -28.626190185546875, "global_step": 653605, "epoch": 7874} {"train_loss": -28.233667373657227, "global_step": 653606, "epoch": 7874} {"train_loss": -28.171710968017578, "global_step": 653607, "epoch": 7874} {"train_loss": -28.178028106689453, "global_step": 653608, "epoch": 7874} {"train_loss": -27.889652252197266, "global_step": 653609, "epoch": 7874} {"train_loss": -28.413976669311523, "global_step": 653610, "epoch": 7874} {"train_loss": -28.213727951049805, "global_step": 653611, "epoch": 7874} {"train_loss": -28.40211296081543, "global_step": 653612, "epoch": 7874} {"train_loss": -28.218210220336914, "global_step": 653613, "epoch": 7874} {"train_loss": -28.452747344970703, "global_step": 653614, "epoch": 7874} {"train_loss": -28.23062515258789, "global_step": 653615, "epoch": 7874} {"train_loss": -28.12165641784668, "global_step": 653616, "epoch": 7874} {"train_loss": -28.51612663269043, "global_step": 653617, "epoch": 7874} {"train_loss": -28.457077026367188, "global_step": 653618, "epoch": 7874} {"train_loss": -28.80939292907715, "global_step": 653619, "epoch": 7874} {"train_loss": -28.1748104095459, "global_step": 653620, "epoch": 7874} {"train_loss": -28.234052658081055, "global_step": 653621, "epoch": 7874} {"train_loss": -28.63666343688965, "global_step": 653622, "epoch": 7874} {"train_loss": -28.308324813842773, "global_step": 653623, "epoch": 7874} {"train_loss": -28.048123945672828, "global_step": 653624, "epoch": 7874, "val_loss": 6711428.5} {"train_loss": -27.33564567565918, "global_step": 653625, "epoch": 7875} {"train_loss": -27.455093383789062, "global_step": 653626, "epoch": 7875} {"train_loss": -27.690210342407227, "global_step": 653627, "epoch": 7875} {"train_loss": -27.039976119995117, "global_step": 653628, "epoch": 7875} {"train_loss": -28.034128189086914, "global_step": 653629, "epoch": 7875} {"train_loss": -27.720611572265625, "global_step": 653630, "epoch": 7875} {"train_loss": -27.708209991455078, "global_step": 653631, "epoch": 7875} {"train_loss": -27.668304443359375, "global_step": 653632, "epoch": 7875} {"train_loss": -28.027729034423828, "global_step": 653633, "epoch": 7875} {"train_loss": -28.085418701171875, "global_step": 653634, "epoch": 7875} {"train_loss": -28.239118576049805, "global_step": 653635, "epoch": 7875} {"train_loss": -28.176773071289062, "global_step": 653636, "epoch": 7875} {"train_loss": -27.8087215423584, "global_step": 653637, "epoch": 7875} {"train_loss": -27.664276123046875, "global_step": 653638, "epoch": 7875} {"train_loss": -27.942609786987305, "global_step": 653639, "epoch": 7875} {"train_loss": -27.775495529174805, "global_step": 653640, "epoch": 7875} {"train_loss": -27.80084228515625, "global_step": 653641, "epoch": 7875} {"train_loss": -28.081409454345703, "global_step": 653642, "epoch": 7875} {"train_loss": -28.46747398376465, "global_step": 653643, "epoch": 7875} {"train_loss": -28.157194137573242, "global_step": 653644, "epoch": 7875} {"train_loss": -28.43088722229004, "global_step": 653645, "epoch": 7875} {"train_loss": -28.24098014831543, "global_step": 653646, "epoch": 7875} {"train_loss": -28.068262100219727, "global_step": 653647, "epoch": 7875} {"train_loss": -27.98048973083496, "global_step": 653648, "epoch": 7875} {"train_loss": -28.118375778198242, "global_step": 653649, "epoch": 7875} {"train_loss": -28.1179256439209, "global_step": 653650, "epoch": 7875} {"train_loss": -27.889270782470703, "global_step": 653651, "epoch": 7875} {"train_loss": -28.032703399658203, "global_step": 653652, "epoch": 7875} {"train_loss": -28.008377075195312, "global_step": 653653, "epoch": 7875} {"train_loss": -28.251041412353516, "global_step": 653654, "epoch": 7875} {"train_loss": -28.5482177734375, "global_step": 653655, "epoch": 7875} {"train_loss": -28.08613395690918, "global_step": 653656, "epoch": 7875} {"train_loss": -28.171600341796875, "global_step": 653657, "epoch": 7875} {"train_loss": -27.947118759155273, "global_step": 653658, "epoch": 7875} {"train_loss": -28.151639938354492, "global_step": 653659, "epoch": 7875} {"train_loss": -28.287078857421875, "global_step": 653660, "epoch": 7875} {"train_loss": -28.233600616455078, "global_step": 653661, "epoch": 7875} {"train_loss": -28.218027114868164, "global_step": 653662, "epoch": 7875} {"train_loss": -28.087848663330078, "global_step": 653663, "epoch": 7875} {"train_loss": -28.12774658203125, "global_step": 653664, "epoch": 7875} {"train_loss": -28.343969345092773, "global_step": 653665, "epoch": 7875} {"train_loss": -28.3704891204834, "global_step": 653666, "epoch": 7875} {"train_loss": -28.446752548217773, "global_step": 653667, "epoch": 7875} {"train_loss": -28.384252548217773, "global_step": 653668, "epoch": 7875} {"train_loss": -28.524768829345703, "global_step": 653669, "epoch": 7875} {"train_loss": -28.507766723632812, "global_step": 653670, "epoch": 7875} {"train_loss": -28.4831485748291, "global_step": 653671, "epoch": 7875} {"train_loss": -28.438220977783203, "global_step": 653672, "epoch": 7875} {"train_loss": -28.30055809020996, "global_step": 653673, "epoch": 7875} {"train_loss": -28.446277618408203, "global_step": 653674, "epoch": 7875} {"train_loss": -28.276342391967773, "global_step": 653675, "epoch": 7875} {"train_loss": -28.684890747070312, "global_step": 653676, "epoch": 7875} {"train_loss": -28.71906089782715, "global_step": 653677, "epoch": 7875} {"train_loss": -28.10870361328125, "global_step": 653678, "epoch": 7875} {"train_loss": -28.045347213745117, "global_step": 653679, "epoch": 7875} {"train_loss": -28.551908493041992, "global_step": 653680, "epoch": 7875} {"train_loss": -28.477752685546875, "global_step": 653681, "epoch": 7875} {"train_loss": -28.265594482421875, "global_step": 653682, "epoch": 7875} {"train_loss": -28.24848747253418, "global_step": 653683, "epoch": 7875} {"train_loss": -28.583215713500977, "global_step": 653684, "epoch": 7875} {"train_loss": -28.351804733276367, "global_step": 653685, "epoch": 7875} {"train_loss": -28.52764320373535, "global_step": 653686, "epoch": 7875} {"train_loss": -28.21760368347168, "global_step": 653687, "epoch": 7875} {"train_loss": -28.061664581298828, "global_step": 653688, "epoch": 7875} {"train_loss": -28.470365524291992, "global_step": 653689, "epoch": 7875} {"train_loss": -28.218137741088867, "global_step": 653690, "epoch": 7875} {"train_loss": -28.1160888671875, "global_step": 653691, "epoch": 7875} {"train_loss": -28.056232452392578, "global_step": 653692, "epoch": 7875} {"train_loss": -28.499670028686523, "global_step": 653693, "epoch": 7875} {"train_loss": -28.30071449279785, "global_step": 653694, "epoch": 7875} {"train_loss": -28.491369247436523, "global_step": 653695, "epoch": 7875} {"train_loss": -28.458398818969727, "global_step": 653696, "epoch": 7875} {"train_loss": -28.224390029907227, "global_step": 653697, "epoch": 7875} {"train_loss": -28.297149658203125, "global_step": 653698, "epoch": 7875} {"train_loss": -28.7242431640625, "global_step": 653699, "epoch": 7875} {"train_loss": -28.768192291259766, "global_step": 653700, "epoch": 7875} {"train_loss": -28.133283615112305, "global_step": 653701, "epoch": 7875} {"train_loss": -28.31743812561035, "global_step": 653702, "epoch": 7875} {"train_loss": -28.63300895690918, "global_step": 653703, "epoch": 7875} {"train_loss": -28.531492233276367, "global_step": 653704, "epoch": 7875} {"train_loss": -28.217010498046875, "global_step": 653705, "epoch": 7875} {"train_loss": -28.344465255737305, "global_step": 653706, "epoch": 7875} {"train_loss": -28.176638545760188, "global_step": 653707, "epoch": 7875, "val_loss": 6689723.5} {"train_loss": -25.80120277404785, "global_step": 653708, "epoch": 7876} {"train_loss": -24.995777130126953, "global_step": 653709, "epoch": 7876} {"train_loss": -27.170927047729492, "global_step": 653710, "epoch": 7876} {"train_loss": -27.063535690307617, "global_step": 653711, "epoch": 7876} {"train_loss": -27.759580612182617, "global_step": 653712, "epoch": 7876} {"train_loss": -26.77790641784668, "global_step": 653713, "epoch": 7876} {"train_loss": -27.5438289642334, "global_step": 653714, "epoch": 7876} {"train_loss": -26.823408126831055, "global_step": 653715, "epoch": 7876} {"train_loss": -27.755481719970703, "global_step": 653716, "epoch": 7876} {"train_loss": -27.09095573425293, "global_step": 653717, "epoch": 7876} {"train_loss": -27.634063720703125, "global_step": 653718, "epoch": 7876} {"train_loss": -27.755239486694336, "global_step": 653719, "epoch": 7876} {"train_loss": -27.076541900634766, "global_step": 653720, "epoch": 7876} {"train_loss": -27.570999145507812, "global_step": 653721, "epoch": 7876} {"train_loss": -27.7807559967041, "global_step": 653722, "epoch": 7876} {"train_loss": -27.204376220703125, "global_step": 653723, "epoch": 7876} {"train_loss": -27.47232437133789, "global_step": 653724, "epoch": 7876} {"train_loss": -27.69281005859375, "global_step": 653725, "epoch": 7876} {"train_loss": -27.34585952758789, "global_step": 653726, "epoch": 7876} {"train_loss": -27.785953521728516, "global_step": 653727, "epoch": 7876} {"train_loss": -27.746143341064453, "global_step": 653728, "epoch": 7876} {"train_loss": -27.57905387878418, "global_step": 653729, "epoch": 7876} {"train_loss": -27.926599502563477, "global_step": 653730, "epoch": 7876} {"train_loss": -28.176816940307617, "global_step": 653731, "epoch": 7876} {"train_loss": -28.083898544311523, "global_step": 653732, "epoch": 7876} {"train_loss": -27.84675407409668, "global_step": 653733, "epoch": 7876} {"train_loss": -27.75321388244629, "global_step": 653734, "epoch": 7876} {"train_loss": -27.992040634155273, "global_step": 653735, "epoch": 7876} {"train_loss": -28.073944091796875, "global_step": 653736, "epoch": 7876} {"train_loss": -28.02657127380371, "global_step": 653737, "epoch": 7876} {"train_loss": -27.817895889282227, "global_step": 653738, "epoch": 7876} {"train_loss": -28.001943588256836, "global_step": 653739, "epoch": 7876} {"train_loss": -28.037748336791992, "global_step": 653740, "epoch": 7876} {"train_loss": -28.269641876220703, "global_step": 653741, "epoch": 7876} {"train_loss": -28.095932006835938, "global_step": 653742, "epoch": 7876} {"train_loss": -28.412128448486328, "global_step": 653743, "epoch": 7876} {"train_loss": -28.083837509155273, "global_step": 653744, "epoch": 7876} {"train_loss": -28.350452423095703, "global_step": 653745, "epoch": 7876} {"train_loss": -28.467382431030273, "global_step": 653746, "epoch": 7876} {"train_loss": -28.31062126159668, "global_step": 653747, "epoch": 7876} {"train_loss": -28.1690616607666, "global_step": 653748, "epoch": 7876} {"train_loss": -28.380481719970703, "global_step": 653749, "epoch": 7876} {"train_loss": -28.25687599182129, "global_step": 653750, "epoch": 7876} {"train_loss": -28.149656295776367, "global_step": 653751, "epoch": 7876} {"train_loss": -28.4222354888916, "global_step": 653752, "epoch": 7876} {"train_loss": -28.231054306030273, "global_step": 653753, "epoch": 7876} {"train_loss": -28.01850700378418, "global_step": 653754, "epoch": 7876} {"train_loss": -28.169225692749023, "global_step": 653755, "epoch": 7876} {"train_loss": -28.159345626831055, "global_step": 653756, "epoch": 7876} {"train_loss": -28.88800048828125, "global_step": 653757, "epoch": 7876} {"train_loss": -28.240787506103516, "global_step": 653758, "epoch": 7876} {"train_loss": -28.621906280517578, "global_step": 653759, "epoch": 7876} {"train_loss": -28.035207748413086, "global_step": 653760, "epoch": 7876} {"train_loss": -27.763336181640625, "global_step": 653761, "epoch": 7876} {"train_loss": -27.96991539001465, "global_step": 653762, "epoch": 7876} {"train_loss": -27.942901611328125, "global_step": 653763, "epoch": 7876} {"train_loss": -28.344472885131836, "global_step": 653764, "epoch": 7876} {"train_loss": -28.099365234375, "global_step": 653765, "epoch": 7876} {"train_loss": -28.022357940673828, "global_step": 653766, "epoch": 7876} {"train_loss": -28.107526779174805, "global_step": 653767, "epoch": 7876} {"train_loss": -28.564990997314453, "global_step": 653768, "epoch": 7876} {"train_loss": -28.108341217041016, "global_step": 653769, "epoch": 7876} {"train_loss": -28.24287223815918, "global_step": 653770, "epoch": 7876} {"train_loss": -28.332874298095703, "global_step": 653771, "epoch": 7876} {"train_loss": -28.288549423217773, "global_step": 653772, "epoch": 7876} {"train_loss": -28.340368270874023, "global_step": 653773, "epoch": 7876} {"train_loss": -28.59926414489746, "global_step": 653774, "epoch": 7876} {"train_loss": -28.111953735351562, "global_step": 653775, "epoch": 7876} {"train_loss": -28.47389030456543, "global_step": 653776, "epoch": 7876} {"train_loss": -28.356863021850586, "global_step": 653777, "epoch": 7876} {"train_loss": -28.695425033569336, "global_step": 653778, "epoch": 7876} {"train_loss": -28.625680923461914, "global_step": 653779, "epoch": 7876} {"train_loss": -28.50690269470215, "global_step": 653780, "epoch": 7876} {"train_loss": -28.803003311157227, "global_step": 653781, "epoch": 7876} {"train_loss": -28.591115951538086, "global_step": 653782, "epoch": 7876} {"train_loss": -28.5966739654541, "global_step": 653783, "epoch": 7876} {"train_loss": -28.473133087158203, "global_step": 653784, "epoch": 7876} {"train_loss": -27.8242244720459, "global_step": 653785, "epoch": 7876} {"train_loss": -28.28973388671875, "global_step": 653786, "epoch": 7876} {"train_loss": -27.816913604736328, "global_step": 653787, "epoch": 7876} {"train_loss": -27.84100341796875, "global_step": 653788, "epoch": 7876} {"train_loss": -27.89344596862793, "global_step": 653789, "epoch": 7876} {"train_loss": -27.96230566645243, "global_step": 653790, "epoch": 7876, "val_loss": 6673488.5} {"train_loss": -26.86325454711914, "global_step": 653791, "epoch": 7877} {"train_loss": -26.837722778320312, "global_step": 653792, "epoch": 7877} {"train_loss": -26.899581909179688, "global_step": 653793, "epoch": 7877} {"train_loss": -27.80624771118164, "global_step": 653794, "epoch": 7877} {"train_loss": -27.181396484375, "global_step": 653795, "epoch": 7877} {"train_loss": -27.7838134765625, "global_step": 653796, "epoch": 7877} {"train_loss": -27.9786376953125, "global_step": 653797, "epoch": 7877} {"train_loss": -27.37262535095215, "global_step": 653798, "epoch": 7877} {"train_loss": -28.136554718017578, "global_step": 653799, "epoch": 7877} {"train_loss": -27.438825607299805, "global_step": 653800, "epoch": 7877} {"train_loss": -28.329999923706055, "global_step": 653801, "epoch": 7877} {"train_loss": -27.852005004882812, "global_step": 653802, "epoch": 7877} {"train_loss": -28.056127548217773, "global_step": 653803, "epoch": 7877} {"train_loss": -27.88458251953125, "global_step": 653804, "epoch": 7877} {"train_loss": -28.31001091003418, "global_step": 653805, "epoch": 7877} {"train_loss": -27.955081939697266, "global_step": 653806, "epoch": 7877} {"train_loss": -27.632129669189453, "global_step": 653807, "epoch": 7877} {"train_loss": -28.45245933532715, "global_step": 653808, "epoch": 7877} {"train_loss": -27.881067276000977, "global_step": 653809, "epoch": 7877} {"train_loss": -28.048303604125977, "global_step": 653810, "epoch": 7877} {"train_loss": -28.2630558013916, "global_step": 653811, "epoch": 7877} {"train_loss": -27.791187286376953, "global_step": 653812, "epoch": 7877} {"train_loss": -28.163793563842773, "global_step": 653813, "epoch": 7877} {"train_loss": -28.155426025390625, "global_step": 653814, "epoch": 7877} {"train_loss": -28.07196044921875, "global_step": 653815, "epoch": 7877} {"train_loss": -28.083478927612305, "global_step": 653816, "epoch": 7877} {"train_loss": -28.6574649810791, "global_step": 653817, "epoch": 7877} {"train_loss": -28.16109275817871, "global_step": 653818, "epoch": 7877} {"train_loss": -28.08262062072754, "global_step": 653819, "epoch": 7877} {"train_loss": -28.39788818359375, "global_step": 653820, "epoch": 7877} {"train_loss": -28.07590675354004, "global_step": 653821, "epoch": 7877} {"train_loss": -28.32529067993164, "global_step": 653822, "epoch": 7877} {"train_loss": -28.137527465820312, "global_step": 653823, "epoch": 7877} {"train_loss": -28.052289962768555, "global_step": 653824, "epoch": 7877} {"train_loss": -28.270965576171875, "global_step": 653825, "epoch": 7877} {"train_loss": -28.079437255859375, "global_step": 653826, "epoch": 7877} {"train_loss": -28.234302520751953, "global_step": 653827, "epoch": 7877} {"train_loss": -28.37696647644043, "global_step": 653828, "epoch": 7877} {"train_loss": -28.171232223510742, "global_step": 653829, "epoch": 7877} {"train_loss": -28.021947860717773, "global_step": 653830, "epoch": 7877} {"train_loss": -28.571990966796875, "global_step": 653831, "epoch": 7877} {"train_loss": -28.479236602783203, "global_step": 653832, "epoch": 7877} {"train_loss": -28.412128448486328, "global_step": 653833, "epoch": 7877} {"train_loss": -28.35527992248535, "global_step": 653834, "epoch": 7877} {"train_loss": -28.622451782226562, "global_step": 653835, "epoch": 7877} {"train_loss": -28.597248077392578, "global_step": 653836, "epoch": 7877} {"train_loss": -27.93310546875, "global_step": 653837, "epoch": 7877} {"train_loss": -28.388227462768555, "global_step": 653838, "epoch": 7877} {"train_loss": -28.1956729888916, "global_step": 653839, "epoch": 7877} {"train_loss": -28.5327091217041, "global_step": 653840, "epoch": 7877} {"train_loss": -28.633142471313477, "global_step": 653841, "epoch": 7877} {"train_loss": -27.883573532104492, "global_step": 653842, "epoch": 7877} {"train_loss": -28.410144805908203, "global_step": 653843, "epoch": 7877} {"train_loss": -28.270139694213867, "global_step": 653844, "epoch": 7877} {"train_loss": -28.405105590820312, "global_step": 653845, "epoch": 7877} {"train_loss": -28.265966415405273, "global_step": 653846, "epoch": 7877} {"train_loss": -28.258758544921875, "global_step": 653847, "epoch": 7877} {"train_loss": -28.25127601623535, "global_step": 653848, "epoch": 7877} {"train_loss": -28.25760841369629, "global_step": 653849, "epoch": 7877} {"train_loss": -28.46414566040039, "global_step": 653850, "epoch": 7877} {"train_loss": -28.375852584838867, "global_step": 653851, "epoch": 7877} {"train_loss": -28.41069984436035, "global_step": 653852, "epoch": 7877} {"train_loss": -28.589035034179688, "global_step": 653853, "epoch": 7877} {"train_loss": -28.2108211517334, "global_step": 653854, "epoch": 7877} {"train_loss": -28.435958862304688, "global_step": 653855, "epoch": 7877} {"train_loss": -28.369693756103516, "global_step": 653856, "epoch": 7877} {"train_loss": -28.033954620361328, "global_step": 653857, "epoch": 7877} {"train_loss": -28.400012969970703, "global_step": 653858, "epoch": 7877} {"train_loss": -28.352354049682617, "global_step": 653859, "epoch": 7877} {"train_loss": -28.24946403503418, "global_step": 653860, "epoch": 7877} {"train_loss": -28.891401290893555, "global_step": 653861, "epoch": 7877} {"train_loss": -28.291181564331055, "global_step": 653862, "epoch": 7877} {"train_loss": -28.160144805908203, "global_step": 653863, "epoch": 7877} {"train_loss": -28.559864044189453, "global_step": 653864, "epoch": 7877} {"train_loss": -28.417587280273438, "global_step": 653865, "epoch": 7877} {"train_loss": -28.46693992614746, "global_step": 653866, "epoch": 7877} {"train_loss": -27.87583351135254, "global_step": 653867, "epoch": 7877} {"train_loss": -28.427778244018555, "global_step": 653868, "epoch": 7877} {"train_loss": -28.467763900756836, "global_step": 653869, "epoch": 7877} {"train_loss": -28.5402889251709, "global_step": 653870, "epoch": 7877} {"train_loss": -28.539093017578125, "global_step": 653871, "epoch": 7877} {"train_loss": -28.292144775390625, "global_step": 653872, "epoch": 7877} {"train_loss": -28.16343741819083, "global_step": 653873, "epoch": 7877, "val_loss": 6694540.0} {"train_loss": -27.428924560546875, "global_step": 653874, "epoch": 7878} {"train_loss": -26.64655113220215, "global_step": 653875, "epoch": 7878} {"train_loss": -27.707965850830078, "global_step": 653876, "epoch": 7878} {"train_loss": -26.25136375427246, "global_step": 653877, "epoch": 7878} {"train_loss": -26.8836669921875, "global_step": 653878, "epoch": 7878} {"train_loss": -27.217370986938477, "global_step": 653879, "epoch": 7878} {"train_loss": -27.1944637298584, "global_step": 653880, "epoch": 7878} {"train_loss": -27.72419548034668, "global_step": 653881, "epoch": 7878} {"train_loss": -27.1019287109375, "global_step": 653882, "epoch": 7878} {"train_loss": -27.718164443969727, "global_step": 653883, "epoch": 7878} {"train_loss": -27.619586944580078, "global_step": 653884, "epoch": 7878} {"train_loss": -27.652822494506836, "global_step": 653885, "epoch": 7878} {"train_loss": -27.913904190063477, "global_step": 653886, "epoch": 7878} {"train_loss": -27.677051544189453, "global_step": 653887, "epoch": 7878} {"train_loss": -27.755664825439453, "global_step": 653888, "epoch": 7878} {"train_loss": -27.540786743164062, "global_step": 653889, "epoch": 7878} {"train_loss": -27.94980239868164, "global_step": 653890, "epoch": 7878} {"train_loss": -27.576108932495117, "global_step": 653891, "epoch": 7878} {"train_loss": -27.800642013549805, "global_step": 653892, "epoch": 7878} {"train_loss": -27.815717697143555, "global_step": 653893, "epoch": 7878} {"train_loss": -27.594043731689453, "global_step": 653894, "epoch": 7878} {"train_loss": -28.045202255249023, "global_step": 653895, "epoch": 7878} {"train_loss": -27.856597900390625, "global_step": 653896, "epoch": 7878} {"train_loss": -27.889556884765625, "global_step": 653897, "epoch": 7878} {"train_loss": -27.936452865600586, "global_step": 653898, "epoch": 7878} {"train_loss": -27.571557998657227, "global_step": 653899, "epoch": 7878} {"train_loss": -27.760059356689453, "global_step": 653900, "epoch": 7878} {"train_loss": -28.175678253173828, "global_step": 653901, "epoch": 7878} {"train_loss": -28.06101417541504, "global_step": 653902, "epoch": 7878} {"train_loss": -28.132482528686523, "global_step": 653903, "epoch": 7878} {"train_loss": -27.619709014892578, "global_step": 653904, "epoch": 7878} {"train_loss": -28.02797508239746, "global_step": 653905, "epoch": 7878} {"train_loss": -28.26533317565918, "global_step": 653906, "epoch": 7878} {"train_loss": -28.008930206298828, "global_step": 653907, "epoch": 7878} {"train_loss": -28.238391876220703, "global_step": 653908, "epoch": 7878} {"train_loss": -27.851806640625, "global_step": 653909, "epoch": 7878} {"train_loss": -28.46246910095215, "global_step": 653910, "epoch": 7878} {"train_loss": -28.054550170898438, "global_step": 653911, "epoch": 7878} {"train_loss": -27.946002960205078, "global_step": 653912, "epoch": 7878} {"train_loss": -28.240177154541016, "global_step": 653913, "epoch": 7878} {"train_loss": -28.182876586914062, "global_step": 653914, "epoch": 7878} {"train_loss": -28.5595760345459, "global_step": 653915, "epoch": 7878} {"train_loss": -28.209264755249023, "global_step": 653916, "epoch": 7878} {"train_loss": -28.415491104125977, "global_step": 653917, "epoch": 7878} {"train_loss": -28.37959098815918, "global_step": 653918, "epoch": 7878} {"train_loss": -28.60401725769043, "global_step": 653919, "epoch": 7878} {"train_loss": -28.3156795501709, "global_step": 653920, "epoch": 7878} {"train_loss": -28.31138038635254, "global_step": 653921, "epoch": 7878} {"train_loss": -28.478235244750977, "global_step": 653922, "epoch": 7878} {"train_loss": -28.698389053344727, "global_step": 653923, "epoch": 7878} {"train_loss": -28.3493709564209, "global_step": 653924, "epoch": 7878} {"train_loss": -28.417646408081055, "global_step": 653925, "epoch": 7878} {"train_loss": -28.383573532104492, "global_step": 653926, "epoch": 7878} {"train_loss": -28.5146541595459, "global_step": 653927, "epoch": 7878} {"train_loss": -28.228290557861328, "global_step": 653928, "epoch": 7878} {"train_loss": -28.393600463867188, "global_step": 653929, "epoch": 7878} {"train_loss": -28.718610763549805, "global_step": 653930, "epoch": 7878} {"train_loss": -28.027896881103516, "global_step": 653931, "epoch": 7878} {"train_loss": -28.596561431884766, "global_step": 653932, "epoch": 7878} {"train_loss": -28.334436416625977, "global_step": 653933, "epoch": 7878} {"train_loss": -28.4129581451416, "global_step": 653934, "epoch": 7878} {"train_loss": -28.445653915405273, "global_step": 653935, "epoch": 7878} {"train_loss": -28.24420166015625, "global_step": 653936, "epoch": 7878} {"train_loss": -28.724218368530273, "global_step": 653937, "epoch": 7878} {"train_loss": -28.52861976623535, "global_step": 653938, "epoch": 7878} {"train_loss": -28.564563751220703, "global_step": 653939, "epoch": 7878} {"train_loss": -28.730762481689453, "global_step": 653940, "epoch": 7878} {"train_loss": -28.38007164001465, "global_step": 653941, "epoch": 7878} {"train_loss": -28.710485458374023, "global_step": 653942, "epoch": 7878} {"train_loss": -28.41768455505371, "global_step": 653943, "epoch": 7878} {"train_loss": -28.645605087280273, "global_step": 653944, "epoch": 7878} {"train_loss": -28.467634201049805, "global_step": 653945, "epoch": 7878} {"train_loss": -28.161972045898438, "global_step": 653946, "epoch": 7878} {"train_loss": -28.6784610748291, "global_step": 653947, "epoch": 7878} {"train_loss": -28.666162490844727, "global_step": 653948, "epoch": 7878} {"train_loss": -28.69684410095215, "global_step": 653949, "epoch": 7878} {"train_loss": -28.55706787109375, "global_step": 653950, "epoch": 7878} {"train_loss": -28.351093292236328, "global_step": 653951, "epoch": 7878} {"train_loss": -28.592859268188477, "global_step": 653952, "epoch": 7878} {"train_loss": -28.59281349182129, "global_step": 653953, "epoch": 7878} {"train_loss": -28.135330200195312, "global_step": 653954, "epoch": 7878} {"train_loss": -28.25916862487793, "global_step": 653955, "epoch": 7878} {"train_loss": -28.11545925829784, "global_step": 653956, "epoch": 7878, "val_loss": 6673216.0} {"train_loss": -27.629114151000977, "global_step": 653957, "epoch": 7879} {"train_loss": -27.1019229888916, "global_step": 653958, "epoch": 7879} {"train_loss": -27.53981590270996, "global_step": 653959, "epoch": 7879} {"train_loss": -27.071155548095703, "global_step": 653960, "epoch": 7879} {"train_loss": -27.33365249633789, "global_step": 653961, "epoch": 7879} {"train_loss": -27.538721084594727, "global_step": 653962, "epoch": 7879} {"train_loss": -27.053485870361328, "global_step": 653963, "epoch": 7879} {"train_loss": -26.7918758392334, "global_step": 653964, "epoch": 7879} {"train_loss": -27.37765884399414, "global_step": 653965, "epoch": 7879} {"train_loss": -27.32756996154785, "global_step": 653966, "epoch": 7879} {"train_loss": -27.255783081054688, "global_step": 653967, "epoch": 7879} {"train_loss": -27.666669845581055, "global_step": 653968, "epoch": 7879} {"train_loss": -27.58900260925293, "global_step": 653969, "epoch": 7879} {"train_loss": -26.73476219177246, "global_step": 653970, "epoch": 7879} {"train_loss": -28.131589889526367, "global_step": 653971, "epoch": 7879} {"train_loss": -27.537769317626953, "global_step": 653972, "epoch": 7879} {"train_loss": -27.6223201751709, "global_step": 653973, "epoch": 7879} {"train_loss": -28.039758682250977, "global_step": 653974, "epoch": 7879} {"train_loss": -27.808780670166016, "global_step": 653975, "epoch": 7879} {"train_loss": -27.758459091186523, "global_step": 653976, "epoch": 7879} {"train_loss": -27.334110260009766, "global_step": 653977, "epoch": 7879} {"train_loss": -27.786346435546875, "global_step": 653978, "epoch": 7879} {"train_loss": -28.00519371032715, "global_step": 653979, "epoch": 7879} {"train_loss": -28.031835556030273, "global_step": 653980, "epoch": 7879} {"train_loss": -28.229034423828125, "global_step": 653981, "epoch": 7879} {"train_loss": -27.930862426757812, "global_step": 653982, "epoch": 7879} {"train_loss": -27.88266372680664, "global_step": 653983, "epoch": 7879} {"train_loss": -28.085987091064453, "global_step": 653984, "epoch": 7879} {"train_loss": -28.34473991394043, "global_step": 653985, "epoch": 7879} {"train_loss": -27.85198974609375, "global_step": 653986, "epoch": 7879} {"train_loss": -27.845138549804688, "global_step": 653987, "epoch": 7879} {"train_loss": -27.814966201782227, "global_step": 653988, "epoch": 7879} {"train_loss": -27.976408004760742, "global_step": 653989, "epoch": 7879} {"train_loss": -28.585433959960938, "global_step": 653990, "epoch": 7879} {"train_loss": -27.9885311126709, "global_step": 653991, "epoch": 7879} {"train_loss": -28.278583526611328, "global_step": 653992, "epoch": 7879} {"train_loss": -28.53622817993164, "global_step": 653993, "epoch": 7879} {"train_loss": -28.558324813842773, "global_step": 653994, "epoch": 7879} {"train_loss": -28.50014305114746, "global_step": 653995, "epoch": 7879} {"train_loss": -28.336917877197266, "global_step": 653996, "epoch": 7879} {"train_loss": -28.3088436126709, "global_step": 653997, "epoch": 7879} {"train_loss": -27.890378952026367, "global_step": 653998, "epoch": 7879} {"train_loss": -28.055994033813477, "global_step": 653999, "epoch": 7879} {"train_loss": -28.286029815673828, "global_step": 654000, "epoch": 7879} {"train_loss": -28.4061336517334, "global_step": 654001, "epoch": 7879} {"train_loss": -28.6545352935791, "global_step": 654002, "epoch": 7879} {"train_loss": -28.85188102722168, "global_step": 654003, "epoch": 7879} {"train_loss": -28.40995216369629, "global_step": 654004, "epoch": 7879} {"train_loss": -28.51222038269043, "global_step": 654005, "epoch": 7879} {"train_loss": -28.63884925842285, "global_step": 654006, "epoch": 7879} {"train_loss": -28.683425903320312, "global_step": 654007, "epoch": 7879} {"train_loss": -28.25115966796875, "global_step": 654008, "epoch": 7879} {"train_loss": -28.49493408203125, "global_step": 654009, "epoch": 7879} {"train_loss": -28.54083251953125, "global_step": 654010, "epoch": 7879} {"train_loss": -28.520523071289062, "global_step": 654011, "epoch": 7879} {"train_loss": -28.221288681030273, "global_step": 654012, "epoch": 7879} {"train_loss": -28.66636085510254, "global_step": 654013, "epoch": 7879} {"train_loss": -28.2194766998291, "global_step": 654014, "epoch": 7879} {"train_loss": -28.350177764892578, "global_step": 654015, "epoch": 7879} {"train_loss": -28.835376739501953, "global_step": 654016, "epoch": 7879} {"train_loss": -28.410846710205078, "global_step": 654017, "epoch": 7879} {"train_loss": -28.4876766204834, "global_step": 654018, "epoch": 7879} {"train_loss": -28.425537109375, "global_step": 654019, "epoch": 7879} {"train_loss": -28.51910400390625, "global_step": 654020, "epoch": 7879} {"train_loss": -27.817861557006836, "global_step": 654021, "epoch": 7879} {"train_loss": -27.5451717376709, "global_step": 654022, "epoch": 7879} {"train_loss": -27.4840145111084, "global_step": 654023, "epoch": 7879} {"train_loss": -28.005929946899414, "global_step": 654024, "epoch": 7879} {"train_loss": -28.313852310180664, "global_step": 654025, "epoch": 7879} {"train_loss": -28.3266544342041, "global_step": 654026, "epoch": 7879} {"train_loss": -28.75550651550293, "global_step": 654027, "epoch": 7879} {"train_loss": -28.157001495361328, "global_step": 654028, "epoch": 7879} {"train_loss": -28.068212509155273, "global_step": 654029, "epoch": 7879} {"train_loss": -28.34913444519043, "global_step": 654030, "epoch": 7879} {"train_loss": -28.31412124633789, "global_step": 654031, "epoch": 7879} {"train_loss": -28.455780029296875, "global_step": 654032, "epoch": 7879} {"train_loss": -28.656463623046875, "global_step": 654033, "epoch": 7879} {"train_loss": -28.437580108642578, "global_step": 654034, "epoch": 7879} {"train_loss": -28.7611141204834, "global_step": 654035, "epoch": 7879} {"train_loss": -28.589258193969727, "global_step": 654036, "epoch": 7879} {"train_loss": -28.522232055664062, "global_step": 654037, "epoch": 7879} {"train_loss": -28.467493057250977, "global_step": 654038, "epoch": 7879} {"train_loss": -28.083668651351008, "global_step": 654039, "epoch": 7879, "val_loss": 6659507.5} {"train_loss": -27.95122718811035, "global_step": 654040, "epoch": 7880} {"train_loss": -27.860807418823242, "global_step": 654041, "epoch": 7880} {"train_loss": -27.864002227783203, "global_step": 654042, "epoch": 7880} {"train_loss": -28.1390438079834, "global_step": 654043, "epoch": 7880} {"train_loss": -27.6485652923584, "global_step": 654044, "epoch": 7880} {"train_loss": -28.26708984375, "global_step": 654045, "epoch": 7880} {"train_loss": -27.7944278717041, "global_step": 654046, "epoch": 7880} {"train_loss": -28.325653076171875, "global_step": 654047, "epoch": 7880} {"train_loss": -27.941242218017578, "global_step": 654048, "epoch": 7880} {"train_loss": -28.31685447692871, "global_step": 654049, "epoch": 7880} {"train_loss": -28.38532829284668, "global_step": 654050, "epoch": 7880} {"train_loss": -28.19431495666504, "global_step": 654051, "epoch": 7880} {"train_loss": -28.011688232421875, "global_step": 654052, "epoch": 7880} {"train_loss": -27.613544464111328, "global_step": 654053, "epoch": 7880} {"train_loss": -27.7055606842041, "global_step": 654054, "epoch": 7880} {"train_loss": -28.22588539123535, "global_step": 654055, "epoch": 7880} {"train_loss": -28.118606567382812, "global_step": 654056, "epoch": 7880} {"train_loss": -27.44830894470215, "global_step": 654057, "epoch": 7880} {"train_loss": -27.674917221069336, "global_step": 654058, "epoch": 7880} {"train_loss": -27.8624324798584, "global_step": 654059, "epoch": 7880} {"train_loss": -28.215957641601562, "global_step": 654060, "epoch": 7880} {"train_loss": -28.0146427154541, "global_step": 654061, "epoch": 7880} {"train_loss": -27.822961807250977, "global_step": 654062, "epoch": 7880} {"train_loss": -28.478652954101562, "global_step": 654063, "epoch": 7880} {"train_loss": -27.949935913085938, "global_step": 654064, "epoch": 7880} {"train_loss": -28.247461318969727, "global_step": 654065, "epoch": 7880} {"train_loss": -27.987228393554688, "global_step": 654066, "epoch": 7880} {"train_loss": -28.33075523376465, "global_step": 654067, "epoch": 7880} {"train_loss": -28.525970458984375, "global_step": 654068, "epoch": 7880} {"train_loss": -28.123554229736328, "global_step": 654069, "epoch": 7880} {"train_loss": -28.406835556030273, "global_step": 654070, "epoch": 7880} {"train_loss": -28.47418212890625, "global_step": 654071, "epoch": 7880} {"train_loss": -28.376371383666992, "global_step": 654072, "epoch": 7880} {"train_loss": -28.328413009643555, "global_step": 654073, "epoch": 7880} {"train_loss": -28.441343307495117, "global_step": 654074, "epoch": 7880} {"train_loss": -28.67683219909668, "global_step": 654075, "epoch": 7880} {"train_loss": -28.532785415649414, "global_step": 654076, "epoch": 7880} {"train_loss": -28.53497314453125, "global_step": 654077, "epoch": 7880} {"train_loss": -28.804828643798828, "global_step": 654078, "epoch": 7880} {"train_loss": -28.599624633789062, "global_step": 654079, "epoch": 7880} {"train_loss": -28.784936904907227, "global_step": 654080, "epoch": 7880} {"train_loss": -28.432937622070312, "global_step": 654081, "epoch": 7880} {"train_loss": -28.464136123657227, "global_step": 654082, "epoch": 7880} {"train_loss": -28.453231811523438, "global_step": 654083, "epoch": 7880} {"train_loss": -28.671142578125, "global_step": 654084, "epoch": 7880} {"train_loss": -28.69706153869629, "global_step": 654085, "epoch": 7880} {"train_loss": -28.331867218017578, "global_step": 654086, "epoch": 7880} {"train_loss": -28.34423828125, "global_step": 654087, "epoch": 7880} {"train_loss": -28.232526779174805, "global_step": 654088, "epoch": 7880} {"train_loss": -28.28938102722168, "global_step": 654089, "epoch": 7880} {"train_loss": -28.382184982299805, "global_step": 654090, "epoch": 7880} {"train_loss": -28.566104888916016, "global_step": 654091, "epoch": 7880} {"train_loss": -28.593189239501953, "global_step": 654092, "epoch": 7880} {"train_loss": -28.80011558532715, "global_step": 654093, "epoch": 7880} {"train_loss": -28.68758201599121, "global_step": 654094, "epoch": 7880} {"train_loss": -27.926427841186523, "global_step": 654095, "epoch": 7880} {"train_loss": -28.42476463317871, "global_step": 654096, "epoch": 7880} {"train_loss": -28.445587158203125, "global_step": 654097, "epoch": 7880} {"train_loss": -28.132055282592773, "global_step": 654098, "epoch": 7880} {"train_loss": -28.353256225585938, "global_step": 654099, "epoch": 7880} {"train_loss": -28.639881134033203, "global_step": 654100, "epoch": 7880} {"train_loss": -27.911849975585938, "global_step": 654101, "epoch": 7880} {"train_loss": -28.39664649963379, "global_step": 654102, "epoch": 7880} {"train_loss": -27.888641357421875, "global_step": 654103, "epoch": 7880} {"train_loss": -28.14961814880371, "global_step": 654104, "epoch": 7880} {"train_loss": -28.203710556030273, "global_step": 654105, "epoch": 7880} {"train_loss": -28.24811363220215, "global_step": 654106, "epoch": 7880} {"train_loss": -28.77065086364746, "global_step": 654107, "epoch": 7880} {"train_loss": -28.71553611755371, "global_step": 654108, "epoch": 7880} {"train_loss": -28.207921981811523, "global_step": 654109, "epoch": 7880} {"train_loss": -28.180952072143555, "global_step": 654110, "epoch": 7880} {"train_loss": -28.256942749023438, "global_step": 654111, "epoch": 7880} {"train_loss": -28.741308212280273, "global_step": 654112, "epoch": 7880} {"train_loss": -28.599172592163086, "global_step": 654113, "epoch": 7880} {"train_loss": -28.332624435424805, "global_step": 654114, "epoch": 7880} {"train_loss": -28.605436325073242, "global_step": 654115, "epoch": 7880} {"train_loss": -28.845396041870117, "global_step": 654116, "epoch": 7880} {"train_loss": -28.506397247314453, "global_step": 654117, "epoch": 7880} {"train_loss": -28.845672607421875, "global_step": 654118, "epoch": 7880} {"train_loss": -28.295307159423828, "global_step": 654119, "epoch": 7880} {"train_loss": -28.262975692749023, "global_step": 654120, "epoch": 7880} {"train_loss": -28.749963760375977, "global_step": 654121, "epoch": 7880} {"train_loss": -28.28599762054811, "global_step": 654122, "epoch": 7880, "val_loss": 6680496.0} {"train_loss": -27.4652156829834, "global_step": 654123, "epoch": 7881} {"train_loss": -26.771240234375, "global_step": 654124, "epoch": 7881} {"train_loss": -26.9013614654541, "global_step": 654125, "epoch": 7881} {"train_loss": -28.014163970947266, "global_step": 654126, "epoch": 7881} {"train_loss": -28.129438400268555, "global_step": 654127, "epoch": 7881} {"train_loss": -27.900592803955078, "global_step": 654128, "epoch": 7881} {"train_loss": -28.05128288269043, "global_step": 654129, "epoch": 7881} {"train_loss": -27.8043270111084, "global_step": 654130, "epoch": 7881} {"train_loss": -28.05625343322754, "global_step": 654131, "epoch": 7881} {"train_loss": -28.064802169799805, "global_step": 654132, "epoch": 7881} {"train_loss": -28.371448516845703, "global_step": 654133, "epoch": 7881} {"train_loss": -28.312597274780273, "global_step": 654134, "epoch": 7881} {"train_loss": -28.192825317382812, "global_step": 654135, "epoch": 7881} {"train_loss": -27.75385093688965, "global_step": 654136, "epoch": 7881} {"train_loss": -27.620136260986328, "global_step": 654137, "epoch": 7881} {"train_loss": -28.21561050415039, "global_step": 654138, "epoch": 7881} {"train_loss": -28.20081901550293, "global_step": 654139, "epoch": 7881} {"train_loss": -28.224584579467773, "global_step": 654140, "epoch": 7881} {"train_loss": -28.042346954345703, "global_step": 654141, "epoch": 7881} {"train_loss": -28.204809188842773, "global_step": 654142, "epoch": 7881} {"train_loss": -27.92945671081543, "global_step": 654143, "epoch": 7881} {"train_loss": -28.38486671447754, "global_step": 654144, "epoch": 7881} {"train_loss": -28.4227352142334, "global_step": 654145, "epoch": 7881} {"train_loss": -28.0811767578125, "global_step": 654146, "epoch": 7881} {"train_loss": -28.390729904174805, "global_step": 654147, "epoch": 7881} {"train_loss": -28.282257080078125, "global_step": 654148, "epoch": 7881} {"train_loss": -28.243627548217773, "global_step": 654149, "epoch": 7881} {"train_loss": -28.128498077392578, "global_step": 654150, "epoch": 7881} {"train_loss": -28.302154541015625, "global_step": 654151, "epoch": 7881} {"train_loss": -28.3234920501709, "global_step": 654152, "epoch": 7881} {"train_loss": -28.5223388671875, "global_step": 654153, "epoch": 7881} {"train_loss": -28.24952507019043, "global_step": 654154, "epoch": 7881} {"train_loss": -28.651355743408203, "global_step": 654155, "epoch": 7881} {"train_loss": -28.25066566467285, "global_step": 654156, "epoch": 7881} {"train_loss": -28.29888343811035, "global_step": 654157, "epoch": 7881} {"train_loss": -28.580432891845703, "global_step": 654158, "epoch": 7881} {"train_loss": -28.716053009033203, "global_step": 654159, "epoch": 7881} {"train_loss": -28.762548446655273, "global_step": 654160, "epoch": 7881} {"train_loss": -28.508930206298828, "global_step": 654161, "epoch": 7881} {"train_loss": -28.364965438842773, "global_step": 654162, "epoch": 7881} {"train_loss": -28.6038818359375, "global_step": 654163, "epoch": 7881} {"train_loss": -28.596759796142578, "global_step": 654164, "epoch": 7881} {"train_loss": -28.29071617126465, "global_step": 654165, "epoch": 7881} {"train_loss": -27.27091407775879, "global_step": 654166, "epoch": 7881} {"train_loss": -27.869232177734375, "global_step": 654167, "epoch": 7881} {"train_loss": -27.87733268737793, "global_step": 654168, "epoch": 7881} {"train_loss": -27.713953018188477, "global_step": 654169, "epoch": 7881} {"train_loss": -28.046110153198242, "global_step": 654170, "epoch": 7881} {"train_loss": -28.069177627563477, "global_step": 654171, "epoch": 7881} {"train_loss": -27.474674224853516, "global_step": 654172, "epoch": 7881} {"train_loss": -27.894412994384766, "global_step": 654173, "epoch": 7881} {"train_loss": -28.022567749023438, "global_step": 654174, "epoch": 7881} {"train_loss": -27.372638702392578, "global_step": 654175, "epoch": 7881} {"train_loss": -28.31524085998535, "global_step": 654176, "epoch": 7881} {"train_loss": -28.08892250061035, "global_step": 654177, "epoch": 7881} {"train_loss": -27.722553253173828, "global_step": 654178, "epoch": 7881} {"train_loss": -28.372909545898438, "global_step": 654179, "epoch": 7881} {"train_loss": -27.813547134399414, "global_step": 654180, "epoch": 7881} {"train_loss": -28.326385498046875, "global_step": 654181, "epoch": 7881} {"train_loss": -28.129281997680664, "global_step": 654182, "epoch": 7881} {"train_loss": -27.812021255493164, "global_step": 654183, "epoch": 7881} {"train_loss": -28.32490348815918, "global_step": 654184, "epoch": 7881} {"train_loss": -28.2871150970459, "global_step": 654185, "epoch": 7881} {"train_loss": -27.931594848632812, "global_step": 654186, "epoch": 7881} {"train_loss": -28.50359535217285, "global_step": 654187, "epoch": 7881} {"train_loss": -28.2431697845459, "global_step": 654188, "epoch": 7881} {"train_loss": -28.787817001342773, "global_step": 654189, "epoch": 7881} {"train_loss": -28.42656898498535, "global_step": 654190, "epoch": 7881} {"train_loss": -28.0715389251709, "global_step": 654191, "epoch": 7881} {"train_loss": -28.326583862304688, "global_step": 654192, "epoch": 7881} {"train_loss": -28.4502010345459, "global_step": 654193, "epoch": 7881} {"train_loss": -28.241987228393555, "global_step": 654194, "epoch": 7881} {"train_loss": -28.265127182006836, "global_step": 654195, "epoch": 7881} {"train_loss": -28.602746963500977, "global_step": 654196, "epoch": 7881} {"train_loss": -28.12052345275879, "global_step": 654197, "epoch": 7881} {"train_loss": -28.4991512298584, "global_step": 654198, "epoch": 7881} {"train_loss": -28.370115280151367, "global_step": 654199, "epoch": 7881} {"train_loss": -27.993711471557617, "global_step": 654200, "epoch": 7881} {"train_loss": -28.538211822509766, "global_step": 654201, "epoch": 7881} {"train_loss": -28.699827194213867, "global_step": 654202, "epoch": 7881} {"train_loss": -28.479520797729492, "global_step": 654203, "epoch": 7881} {"train_loss": -28.151758193969727, "global_step": 654204, "epoch": 7881} {"train_loss": -28.184389482061547, "global_step": 654205, "epoch": 7881, "val_loss": 6738759.0} {"train_loss": -27.615680694580078, "global_step": 654206, "epoch": 7882} {"train_loss": -27.554662704467773, "global_step": 654207, "epoch": 7882} {"train_loss": -27.925933837890625, "global_step": 654208, "epoch": 7882} {"train_loss": -27.320058822631836, "global_step": 654209, "epoch": 7882} {"train_loss": -27.583444595336914, "global_step": 654210, "epoch": 7882} {"train_loss": -27.53317642211914, "global_step": 654211, "epoch": 7882} {"train_loss": -27.517301559448242, "global_step": 654212, "epoch": 7882} {"train_loss": -27.926544189453125, "global_step": 654213, "epoch": 7882} {"train_loss": -28.014083862304688, "global_step": 654214, "epoch": 7882} {"train_loss": -27.689741134643555, "global_step": 654215, "epoch": 7882} {"train_loss": -28.08148193359375, "global_step": 654216, "epoch": 7882} {"train_loss": -28.376657485961914, "global_step": 654217, "epoch": 7882} {"train_loss": -27.880645751953125, "global_step": 654218, "epoch": 7882} {"train_loss": -27.83965492248535, "global_step": 654219, "epoch": 7882} {"train_loss": -27.838287353515625, "global_step": 654220, "epoch": 7882} {"train_loss": -28.154027938842773, "global_step": 654221, "epoch": 7882} {"train_loss": -28.11044692993164, "global_step": 654222, "epoch": 7882} {"train_loss": -28.21632194519043, "global_step": 654223, "epoch": 7882} {"train_loss": -28.080408096313477, "global_step": 654224, "epoch": 7882} {"train_loss": -28.214086532592773, "global_step": 654225, "epoch": 7882} {"train_loss": -27.993366241455078, "global_step": 654226, "epoch": 7882} {"train_loss": -28.386884689331055, "global_step": 654227, "epoch": 7882} {"train_loss": -28.047698974609375, "global_step": 654228, "epoch": 7882} {"train_loss": -28.56764793395996, "global_step": 654229, "epoch": 7882} {"train_loss": -28.25472068786621, "global_step": 654230, "epoch": 7882} {"train_loss": -28.177270889282227, "global_step": 654231, "epoch": 7882} {"train_loss": -28.108373641967773, "global_step": 654232, "epoch": 7882} {"train_loss": -28.625024795532227, "global_step": 654233, "epoch": 7882} {"train_loss": -28.424962997436523, "global_step": 654234, "epoch": 7882} {"train_loss": -28.2015323638916, "global_step": 654235, "epoch": 7882} {"train_loss": -28.46368408203125, "global_step": 654236, "epoch": 7882} {"train_loss": -28.234609603881836, "global_step": 654237, "epoch": 7882} {"train_loss": -28.10724449157715, "global_step": 654238, "epoch": 7882} {"train_loss": -28.510669708251953, "global_step": 654239, "epoch": 7882} {"train_loss": -28.098682403564453, "global_step": 654240, "epoch": 7882} {"train_loss": -28.614887237548828, "global_step": 654241, "epoch": 7882} {"train_loss": -28.098546981811523, "global_step": 654242, "epoch": 7882} {"train_loss": -28.122838973999023, "global_step": 654243, "epoch": 7882} {"train_loss": -28.761198043823242, "global_step": 654244, "epoch": 7882} {"train_loss": -28.346710205078125, "global_step": 654245, "epoch": 7882} {"train_loss": -28.52316665649414, "global_step": 654246, "epoch": 7882} {"train_loss": -28.19260597229004, "global_step": 654247, "epoch": 7882} {"train_loss": -28.357135772705078, "global_step": 654248, "epoch": 7882} {"train_loss": -28.292966842651367, "global_step": 654249, "epoch": 7882} {"train_loss": -28.232807159423828, "global_step": 654250, "epoch": 7882} {"train_loss": -28.345029830932617, "global_step": 654251, "epoch": 7882} {"train_loss": -28.606952667236328, "global_step": 654252, "epoch": 7882} {"train_loss": -28.408782958984375, "global_step": 654253, "epoch": 7882} {"train_loss": -28.375293731689453, "global_step": 654254, "epoch": 7882} {"train_loss": -28.299606323242188, "global_step": 654255, "epoch": 7882} {"train_loss": -28.355976104736328, "global_step": 654256, "epoch": 7882} {"train_loss": -28.43983268737793, "global_step": 654257, "epoch": 7882} {"train_loss": -28.34199333190918, "global_step": 654258, "epoch": 7882} {"train_loss": -28.628942489624023, "global_step": 654259, "epoch": 7882} {"train_loss": -28.4739990234375, "global_step": 654260, "epoch": 7882} {"train_loss": -28.42376136779785, "global_step": 654261, "epoch": 7882} {"train_loss": -28.467365264892578, "global_step": 654262, "epoch": 7882} {"train_loss": -28.703454971313477, "global_step": 654263, "epoch": 7882} {"train_loss": -28.6419734954834, "global_step": 654264, "epoch": 7882} {"train_loss": -28.157779693603516, "global_step": 654265, "epoch": 7882} {"train_loss": -28.210538864135742, "global_step": 654266, "epoch": 7882} {"train_loss": -28.066822052001953, "global_step": 654267, "epoch": 7882} {"train_loss": -28.20601463317871, "global_step": 654268, "epoch": 7882} {"train_loss": -27.978708267211914, "global_step": 654269, "epoch": 7882} {"train_loss": -28.287250518798828, "global_step": 654270, "epoch": 7882} {"train_loss": -28.334604263305664, "global_step": 654271, "epoch": 7882} {"train_loss": -28.283674240112305, "global_step": 654272, "epoch": 7882} {"train_loss": -28.365015029907227, "global_step": 654273, "epoch": 7882} {"train_loss": -28.637775421142578, "global_step": 654274, "epoch": 7882} {"train_loss": -28.495853424072266, "global_step": 654275, "epoch": 7882} {"train_loss": -27.726842880249023, "global_step": 654276, "epoch": 7882} {"train_loss": -28.72723960876465, "global_step": 654277, "epoch": 7882} {"train_loss": -28.006811141967773, "global_step": 654278, "epoch": 7882} {"train_loss": -28.37784194946289, "global_step": 654279, "epoch": 7882} {"train_loss": -28.213163375854492, "global_step": 654280, "epoch": 7882} {"train_loss": -28.527664184570312, "global_step": 654281, "epoch": 7882} {"train_loss": -28.166181564331055, "global_step": 654282, "epoch": 7882} {"train_loss": -28.2044620513916, "global_step": 654283, "epoch": 7882} {"train_loss": -28.579574584960938, "global_step": 654284, "epoch": 7882} {"train_loss": -28.217172622680664, "global_step": 654285, "epoch": 7882} {"train_loss": -28.34588050842285, "global_step": 654286, "epoch": 7882} {"train_loss": -28.074487686157227, "global_step": 654287, "epoch": 7882} {"train_loss": -28.21585250762572, "global_step": 654288, "epoch": 7882, "val_loss": 6654076.0} {"train_loss": -27.887800216674805, "global_step": 654289, "epoch": 7883} {"train_loss": -28.157550811767578, "global_step": 654290, "epoch": 7883} {"train_loss": -27.78080177307129, "global_step": 654291, "epoch": 7883} {"train_loss": -27.303207397460938, "global_step": 654292, "epoch": 7883} {"train_loss": -27.46186637878418, "global_step": 654293, "epoch": 7883} {"train_loss": -27.75262451171875, "global_step": 654294, "epoch": 7883} {"train_loss": -27.82590675354004, "global_step": 654295, "epoch": 7883} {"train_loss": -27.98270034790039, "global_step": 654296, "epoch": 7883} {"train_loss": -28.008716583251953, "global_step": 654297, "epoch": 7883} {"train_loss": -27.825841903686523, "global_step": 654298, "epoch": 7883} {"train_loss": -27.719146728515625, "global_step": 654299, "epoch": 7883} {"train_loss": -28.153791427612305, "global_step": 654300, "epoch": 7883} {"train_loss": -28.071317672729492, "global_step": 654301, "epoch": 7883} {"train_loss": -28.204511642456055, "global_step": 654302, "epoch": 7883} {"train_loss": -28.15057945251465, "global_step": 654303, "epoch": 7883} {"train_loss": -28.15799331665039, "global_step": 654304, "epoch": 7883} {"train_loss": -28.06544303894043, "global_step": 654305, "epoch": 7883} {"train_loss": -27.949125289916992, "global_step": 654306, "epoch": 7883} {"train_loss": -28.00446891784668, "global_step": 654307, "epoch": 7883} {"train_loss": -28.23480224609375, "global_step": 654308, "epoch": 7883} {"train_loss": -28.020246505737305, "global_step": 654309, "epoch": 7883} {"train_loss": -28.165307998657227, "global_step": 654310, "epoch": 7883} {"train_loss": -28.229223251342773, "global_step": 654311, "epoch": 7883} {"train_loss": -28.40863037109375, "global_step": 654312, "epoch": 7883} {"train_loss": -28.247400283813477, "global_step": 654313, "epoch": 7883} {"train_loss": -28.24859619140625, "global_step": 654314, "epoch": 7883} {"train_loss": -27.83098793029785, "global_step": 654315, "epoch": 7883} {"train_loss": -28.622364044189453, "global_step": 654316, "epoch": 7883} {"train_loss": -28.01861572265625, "global_step": 654317, "epoch": 7883} {"train_loss": -28.37664794921875, "global_step": 654318, "epoch": 7883} {"train_loss": -28.404699325561523, "global_step": 654319, "epoch": 7883} {"train_loss": -28.489627838134766, "global_step": 654320, "epoch": 7883} {"train_loss": -28.277307510375977, "global_step": 654321, "epoch": 7883} {"train_loss": -28.697248458862305, "global_step": 654322, "epoch": 7883} {"train_loss": -28.507129669189453, "global_step": 654323, "epoch": 7883} {"train_loss": -28.560596466064453, "global_step": 654324, "epoch": 7883} {"train_loss": -28.259931564331055, "global_step": 654325, "epoch": 7883} {"train_loss": -28.44807243347168, "global_step": 654326, "epoch": 7883} {"train_loss": -28.12521743774414, "global_step": 654327, "epoch": 7883} {"train_loss": -28.6180419921875, "global_step": 654328, "epoch": 7883} {"train_loss": -28.177331924438477, "global_step": 654329, "epoch": 7883} {"train_loss": -28.146808624267578, "global_step": 654330, "epoch": 7883} {"train_loss": -28.13138771057129, "global_step": 654331, "epoch": 7883} {"train_loss": -28.21466064453125, "global_step": 654332, "epoch": 7883} {"train_loss": -28.153799057006836, "global_step": 654333, "epoch": 7883} {"train_loss": -28.41718101501465, "global_step": 654334, "epoch": 7883} {"train_loss": -28.193552017211914, "global_step": 654335, "epoch": 7883} {"train_loss": -28.330854415893555, "global_step": 654336, "epoch": 7883} {"train_loss": -28.611637115478516, "global_step": 654337, "epoch": 7883} {"train_loss": -28.726110458374023, "global_step": 654338, "epoch": 7883} {"train_loss": -28.189701080322266, "global_step": 654339, "epoch": 7883} {"train_loss": -28.15201187133789, "global_step": 654340, "epoch": 7883} {"train_loss": -28.465322494506836, "global_step": 654341, "epoch": 7883} {"train_loss": -28.28290367126465, "global_step": 654342, "epoch": 7883} {"train_loss": -28.502965927124023, "global_step": 654343, "epoch": 7883} {"train_loss": -28.00091552734375, "global_step": 654344, "epoch": 7883} {"train_loss": -28.197433471679688, "global_step": 654345, "epoch": 7883} {"train_loss": -28.317462921142578, "global_step": 654346, "epoch": 7883} {"train_loss": -28.289960861206055, "global_step": 654347, "epoch": 7883} {"train_loss": -28.43062400817871, "global_step": 654348, "epoch": 7883} {"train_loss": -27.80475425720215, "global_step": 654349, "epoch": 7883} {"train_loss": -28.15506362915039, "global_step": 654350, "epoch": 7883} {"train_loss": -28.766284942626953, "global_step": 654351, "epoch": 7883} {"train_loss": -28.65192985534668, "global_step": 654352, "epoch": 7883} {"train_loss": -28.022268295288086, "global_step": 654353, "epoch": 7883} {"train_loss": -28.260175704956055, "global_step": 654354, "epoch": 7883} {"train_loss": -28.2860164642334, "global_step": 654355, "epoch": 7883} {"train_loss": -28.303796768188477, "global_step": 654356, "epoch": 7883} {"train_loss": -28.784210205078125, "global_step": 654357, "epoch": 7883} {"train_loss": -28.5082950592041, "global_step": 654358, "epoch": 7883} {"train_loss": -28.139633178710938, "global_step": 654359, "epoch": 7883} {"train_loss": -28.449682235717773, "global_step": 654360, "epoch": 7883} {"train_loss": -28.185779571533203, "global_step": 654361, "epoch": 7883} {"train_loss": -28.169828414916992, "global_step": 654362, "epoch": 7883} {"train_loss": -28.395978927612305, "global_step": 654363, "epoch": 7883} {"train_loss": -28.15118408203125, "global_step": 654364, "epoch": 7883} {"train_loss": -28.474279403686523, "global_step": 654365, "epoch": 7883} {"train_loss": -28.991928100585938, "global_step": 654366, "epoch": 7883} {"train_loss": -28.51421546936035, "global_step": 654367, "epoch": 7883} {"train_loss": -28.864912033081055, "global_step": 654368, "epoch": 7883} {"train_loss": -28.73651695251465, "global_step": 654369, "epoch": 7883} {"train_loss": -28.613004684448242, "global_step": 654370, "epoch": 7883} {"train_loss": -28.25361228850951, "global_step": 654371, "epoch": 7883, "val_loss": 6718525.0} {"train_loss": -27.984243392944336, "global_step": 654372, "epoch": 7884} {"train_loss": -27.899580001831055, "global_step": 654373, "epoch": 7884} {"train_loss": -28.374942779541016, "global_step": 654374, "epoch": 7884} {"train_loss": -27.862415313720703, "global_step": 654375, "epoch": 7884} {"train_loss": -28.0872802734375, "global_step": 654376, "epoch": 7884} {"train_loss": -28.22486686706543, "global_step": 654377, "epoch": 7884} {"train_loss": -28.04135513305664, "global_step": 654378, "epoch": 7884} {"train_loss": -27.828088760375977, "global_step": 654379, "epoch": 7884} {"train_loss": -28.30268669128418, "global_step": 654380, "epoch": 7884} {"train_loss": -27.677091598510742, "global_step": 654381, "epoch": 7884} {"train_loss": -27.624109268188477, "global_step": 654382, "epoch": 7884} {"train_loss": -27.757150650024414, "global_step": 654383, "epoch": 7884} {"train_loss": -28.01556968688965, "global_step": 654384, "epoch": 7884} {"train_loss": -27.761526107788086, "global_step": 654385, "epoch": 7884} {"train_loss": -28.49216079711914, "global_step": 654386, "epoch": 7884} {"train_loss": -28.0173397064209, "global_step": 654387, "epoch": 7884} {"train_loss": -27.975299835205078, "global_step": 654388, "epoch": 7884} {"train_loss": -28.35579490661621, "global_step": 654389, "epoch": 7884} {"train_loss": -27.851806640625, "global_step": 654390, "epoch": 7884} {"train_loss": -28.269184112548828, "global_step": 654391, "epoch": 7884} {"train_loss": -28.203405380249023, "global_step": 654392, "epoch": 7884} {"train_loss": -28.395151138305664, "global_step": 654393, "epoch": 7884} {"train_loss": -28.145959854125977, "global_step": 654394, "epoch": 7884} {"train_loss": -27.991918563842773, "global_step": 654395, "epoch": 7884} {"train_loss": -28.176000595092773, "global_step": 654396, "epoch": 7884} {"train_loss": -28.298486709594727, "global_step": 654397, "epoch": 7884} {"train_loss": -28.304412841796875, "global_step": 654398, "epoch": 7884} {"train_loss": -28.296228408813477, "global_step": 654399, "epoch": 7884} {"train_loss": -28.065378189086914, "global_step": 654400, "epoch": 7884} {"train_loss": -27.99713706970215, "global_step": 654401, "epoch": 7884} {"train_loss": -28.00908851623535, "global_step": 654402, "epoch": 7884} {"train_loss": -28.3382511138916, "global_step": 654403, "epoch": 7884} {"train_loss": -28.2169189453125, "global_step": 654404, "epoch": 7884} {"train_loss": -28.419363021850586, "global_step": 654405, "epoch": 7884} {"train_loss": -28.350936889648438, "global_step": 654406, "epoch": 7884} {"train_loss": -28.19537353515625, "global_step": 654407, "epoch": 7884} {"train_loss": -28.379566192626953, "global_step": 654408, "epoch": 7884} {"train_loss": -28.240680694580078, "global_step": 654409, "epoch": 7884} {"train_loss": -28.680103302001953, "global_step": 654410, "epoch": 7884} {"train_loss": -27.857839584350586, "global_step": 654411, "epoch": 7884} {"train_loss": -28.692026138305664, "global_step": 654412, "epoch": 7884} {"train_loss": -28.257802963256836, "global_step": 654413, "epoch": 7884} {"train_loss": -28.33585548400879, "global_step": 654414, "epoch": 7884} {"train_loss": -28.192020416259766, "global_step": 654415, "epoch": 7884} {"train_loss": -28.61250114440918, "global_step": 654416, "epoch": 7884} {"train_loss": -28.49964714050293, "global_step": 654417, "epoch": 7884} {"train_loss": -28.64320945739746, "global_step": 654418, "epoch": 7884} {"train_loss": -28.128238677978516, "global_step": 654419, "epoch": 7884} {"train_loss": -28.2352294921875, "global_step": 654420, "epoch": 7884} {"train_loss": -28.19317054748535, "global_step": 654421, "epoch": 7884} {"train_loss": -28.38179588317871, "global_step": 654422, "epoch": 7884} {"train_loss": -28.480609893798828, "global_step": 654423, "epoch": 7884} {"train_loss": -28.615386962890625, "global_step": 654424, "epoch": 7884} {"train_loss": -28.211257934570312, "global_step": 654425, "epoch": 7884} {"train_loss": -28.390838623046875, "global_step": 654426, "epoch": 7884} {"train_loss": -28.486997604370117, "global_step": 654427, "epoch": 7884} {"train_loss": -28.319843292236328, "global_step": 654428, "epoch": 7884} {"train_loss": -28.491666793823242, "global_step": 654429, "epoch": 7884} {"train_loss": -28.527637481689453, "global_step": 654430, "epoch": 7884} {"train_loss": -28.30867576599121, "global_step": 654431, "epoch": 7884} {"train_loss": -28.3135986328125, "global_step": 654432, "epoch": 7884} {"train_loss": -28.66865348815918, "global_step": 654433, "epoch": 7884} {"train_loss": -28.801374435424805, "global_step": 654434, "epoch": 7884} {"train_loss": -28.12323570251465, "global_step": 654435, "epoch": 7884} {"train_loss": -28.428003311157227, "global_step": 654436, "epoch": 7884} {"train_loss": -28.302709579467773, "global_step": 654437, "epoch": 7884} {"train_loss": -28.10428237915039, "global_step": 654438, "epoch": 7884} {"train_loss": -28.660444259643555, "global_step": 654439, "epoch": 7884} {"train_loss": -28.47405433654785, "global_step": 654440, "epoch": 7884} {"train_loss": -28.123462677001953, "global_step": 654441, "epoch": 7884} {"train_loss": -28.661218643188477, "global_step": 654442, "epoch": 7884} {"train_loss": -28.568212509155273, "global_step": 654443, "epoch": 7884} {"train_loss": -28.273334503173828, "global_step": 654444, "epoch": 7884} {"train_loss": -27.772687911987305, "global_step": 654445, "epoch": 7884} {"train_loss": -27.856149673461914, "global_step": 654446, "epoch": 7884} {"train_loss": -28.275054931640625, "global_step": 654447, "epoch": 7884} {"train_loss": -28.007099151611328, "global_step": 654448, "epoch": 7884} {"train_loss": -27.358108520507812, "global_step": 654449, "epoch": 7884} {"train_loss": -27.931665420532227, "global_step": 654450, "epoch": 7884} {"train_loss": -28.237634658813477, "global_step": 654451, "epoch": 7884} {"train_loss": -27.693695068359375, "global_step": 654452, "epoch": 7884} {"train_loss": -28.2847843170166, "global_step": 654453, "epoch": 7884} {"train_loss": -28.214754334415296, "global_step": 654454, "epoch": 7884, "val_loss": 6667446.5} {"train_loss": -27.78421974182129, "global_step": 654455, "epoch": 7885} {"train_loss": -27.538904190063477, "global_step": 654456, "epoch": 7885} {"train_loss": -27.531476974487305, "global_step": 654457, "epoch": 7885} {"train_loss": -27.119598388671875, "global_step": 654458, "epoch": 7885} {"train_loss": -27.330463409423828, "global_step": 654459, "epoch": 7885} {"train_loss": -27.700708389282227, "global_step": 654460, "epoch": 7885} {"train_loss": -27.616308212280273, "global_step": 654461, "epoch": 7885} {"train_loss": -27.364709854125977, "global_step": 654462, "epoch": 7885} {"train_loss": -28.17610740661621, "global_step": 654463, "epoch": 7885} {"train_loss": -27.388723373413086, "global_step": 654464, "epoch": 7885} {"train_loss": -27.23294448852539, "global_step": 654465, "epoch": 7885} {"train_loss": -27.666961669921875, "global_step": 654466, "epoch": 7885} {"train_loss": -28.3421630859375, "global_step": 654467, "epoch": 7885} {"train_loss": -27.83662223815918, "global_step": 654468, "epoch": 7885} {"train_loss": -27.81654167175293, "global_step": 654469, "epoch": 7885} {"train_loss": -28.094480514526367, "global_step": 654470, "epoch": 7885} {"train_loss": -27.75191307067871, "global_step": 654471, "epoch": 7885} {"train_loss": -27.64979362487793, "global_step": 654472, "epoch": 7885} {"train_loss": -27.9421329498291, "global_step": 654473, "epoch": 7885} {"train_loss": -27.857074737548828, "global_step": 654474, "epoch": 7885} {"train_loss": -27.814300537109375, "global_step": 654475, "epoch": 7885} {"train_loss": -28.03351402282715, "global_step": 654476, "epoch": 7885} {"train_loss": -27.770694732666016, "global_step": 654477, "epoch": 7885} {"train_loss": -28.033491134643555, "global_step": 654478, "epoch": 7885} {"train_loss": -28.10914421081543, "global_step": 654479, "epoch": 7885} {"train_loss": -27.483631134033203, "global_step": 654480, "epoch": 7885} {"train_loss": -28.053897857666016, "global_step": 654481, "epoch": 7885} {"train_loss": -28.17518424987793, "global_step": 654482, "epoch": 7885} {"train_loss": -28.198612213134766, "global_step": 654483, "epoch": 7885} {"train_loss": -27.861785888671875, "global_step": 654484, "epoch": 7885} {"train_loss": -28.2009334564209, "global_step": 654485, "epoch": 7885} {"train_loss": -28.077924728393555, "global_step": 654486, "epoch": 7885} {"train_loss": -28.097381591796875, "global_step": 654487, "epoch": 7885} {"train_loss": -28.162946701049805, "global_step": 654488, "epoch": 7885} {"train_loss": -28.473730087280273, "global_step": 654489, "epoch": 7885} {"train_loss": -27.92449951171875, "global_step": 654490, "epoch": 7885} {"train_loss": -27.99555015563965, "global_step": 654491, "epoch": 7885} {"train_loss": -28.32334327697754, "global_step": 654492, "epoch": 7885} {"train_loss": -28.16034507751465, "global_step": 654493, "epoch": 7885} {"train_loss": -28.338123321533203, "global_step": 654494, "epoch": 7885} {"train_loss": -27.925262451171875, "global_step": 654495, "epoch": 7885} {"train_loss": -28.3348445892334, "global_step": 654496, "epoch": 7885} {"train_loss": -28.38551139831543, "global_step": 654497, "epoch": 7885} {"train_loss": -28.19120216369629, "global_step": 654498, "epoch": 7885} {"train_loss": -28.335718154907227, "global_step": 654499, "epoch": 7885} {"train_loss": -28.54218864440918, "global_step": 654500, "epoch": 7885} {"train_loss": -28.46438980102539, "global_step": 654501, "epoch": 7885} {"train_loss": -28.644804000854492, "global_step": 654502, "epoch": 7885} {"train_loss": -28.691492080688477, "global_step": 654503, "epoch": 7885} {"train_loss": -28.66729164123535, "global_step": 654504, "epoch": 7885} {"train_loss": -28.256763458251953, "global_step": 654505, "epoch": 7885} {"train_loss": -28.39211082458496, "global_step": 654506, "epoch": 7885} {"train_loss": -28.254159927368164, "global_step": 654507, "epoch": 7885} {"train_loss": -28.564346313476562, "global_step": 654508, "epoch": 7885} {"train_loss": -28.44074058532715, "global_step": 654509, "epoch": 7885} {"train_loss": -28.669296264648438, "global_step": 654510, "epoch": 7885} {"train_loss": -28.28753662109375, "global_step": 654511, "epoch": 7885} {"train_loss": -28.33534049987793, "global_step": 654512, "epoch": 7885} {"train_loss": -28.25092887878418, "global_step": 654513, "epoch": 7885} {"train_loss": -28.5744571685791, "global_step": 654514, "epoch": 7885} {"train_loss": -28.231069564819336, "global_step": 654515, "epoch": 7885} {"train_loss": -28.384754180908203, "global_step": 654516, "epoch": 7885} {"train_loss": -28.365921020507812, "global_step": 654517, "epoch": 7885} {"train_loss": -28.282413482666016, "global_step": 654518, "epoch": 7885} {"train_loss": -28.245121002197266, "global_step": 654519, "epoch": 7885} {"train_loss": -28.005664825439453, "global_step": 654520, "epoch": 7885} {"train_loss": -28.49298095703125, "global_step": 654521, "epoch": 7885} {"train_loss": -28.321563720703125, "global_step": 654522, "epoch": 7885} {"train_loss": -28.28669548034668, "global_step": 654523, "epoch": 7885} {"train_loss": -28.094512939453125, "global_step": 654524, "epoch": 7885} {"train_loss": -28.412424087524414, "global_step": 654525, "epoch": 7885} {"train_loss": -28.497522354125977, "global_step": 654526, "epoch": 7885} {"train_loss": -27.958698272705078, "global_step": 654527, "epoch": 7885} {"train_loss": -28.736234664916992, "global_step": 654528, "epoch": 7885} {"train_loss": -28.159536361694336, "global_step": 654529, "epoch": 7885} {"train_loss": -28.38974952697754, "global_step": 654530, "epoch": 7885} {"train_loss": -28.568113327026367, "global_step": 654531, "epoch": 7885} {"train_loss": -28.35418701171875, "global_step": 654532, "epoch": 7885} {"train_loss": -28.3674259185791, "global_step": 654533, "epoch": 7885} {"train_loss": -28.115711212158203, "global_step": 654534, "epoch": 7885} {"train_loss": -28.361135482788086, "global_step": 654535, "epoch": 7885} {"train_loss": -28.5097713470459, "global_step": 654536, "epoch": 7885} {"train_loss": -28.124913365007885, "global_step": 654537, "epoch": 7885, "val_loss": 6719092.0} {"train_loss": -27.97867774963379, "global_step": 654538, "epoch": 7886} {"train_loss": -28.035480499267578, "global_step": 654539, "epoch": 7886} {"train_loss": -28.181455612182617, "global_step": 654540, "epoch": 7886} {"train_loss": -28.143217086791992, "global_step": 654541, "epoch": 7886} {"train_loss": -28.082529067993164, "global_step": 654542, "epoch": 7886} {"train_loss": -27.754545211791992, "global_step": 654543, "epoch": 7886} {"train_loss": -28.027456283569336, "global_step": 654544, "epoch": 7886} {"train_loss": -28.01083755493164, "global_step": 654545, "epoch": 7886} {"train_loss": -28.12129783630371, "global_step": 654546, "epoch": 7886} {"train_loss": -27.992919921875, "global_step": 654547, "epoch": 7886} {"train_loss": -28.221765518188477, "global_step": 654548, "epoch": 7886} {"train_loss": -28.332239151000977, "global_step": 654549, "epoch": 7886} {"train_loss": -28.331220626831055, "global_step": 654550, "epoch": 7886} {"train_loss": -28.074649810791016, "global_step": 654551, "epoch": 7886} {"train_loss": -28.245868682861328, "global_step": 654552, "epoch": 7886} {"train_loss": -28.350910186767578, "global_step": 654553, "epoch": 7886} {"train_loss": -28.184707641601562, "global_step": 654554, "epoch": 7886} {"train_loss": -28.20289421081543, "global_step": 654555, "epoch": 7886} {"train_loss": -28.149866104125977, "global_step": 654556, "epoch": 7886} {"train_loss": -28.55222511291504, "global_step": 654557, "epoch": 7886} {"train_loss": -28.559783935546875, "global_step": 654558, "epoch": 7886} {"train_loss": -28.41669273376465, "global_step": 654559, "epoch": 7886} {"train_loss": -28.49591064453125, "global_step": 654560, "epoch": 7886} {"train_loss": -28.283292770385742, "global_step": 654561, "epoch": 7886} {"train_loss": -28.226898193359375, "global_step": 654562, "epoch": 7886} {"train_loss": -28.767257690429688, "global_step": 654563, "epoch": 7886} {"train_loss": -28.36798667907715, "global_step": 654564, "epoch": 7886} {"train_loss": -28.44644546508789, "global_step": 654565, "epoch": 7886} {"train_loss": -28.62969398498535, "global_step": 654566, "epoch": 7886} {"train_loss": -28.914886474609375, "global_step": 654567, "epoch": 7886} {"train_loss": -28.15459632873535, "global_step": 654568, "epoch": 7886} {"train_loss": -28.43977165222168, "global_step": 654569, "epoch": 7886} {"train_loss": -28.0465030670166, "global_step": 654570, "epoch": 7886} {"train_loss": -28.37407875061035, "global_step": 654571, "epoch": 7886} {"train_loss": -28.482275009155273, "global_step": 654572, "epoch": 7886} {"train_loss": -28.3046932220459, "global_step": 654573, "epoch": 7886} {"train_loss": -28.371002197265625, "global_step": 654574, "epoch": 7886} {"train_loss": -28.133459091186523, "global_step": 654575, "epoch": 7886} {"train_loss": -28.98382568359375, "global_step": 654576, "epoch": 7886} {"train_loss": -28.748218536376953, "global_step": 654577, "epoch": 7886} {"train_loss": -28.51910400390625, "global_step": 654578, "epoch": 7886} {"train_loss": -28.437658309936523, "global_step": 654579, "epoch": 7886} {"train_loss": -28.222631454467773, "global_step": 654580, "epoch": 7886} {"train_loss": -28.905439376831055, "global_step": 654581, "epoch": 7886} {"train_loss": -28.701786041259766, "global_step": 654582, "epoch": 7886} {"train_loss": -28.732263565063477, "global_step": 654583, "epoch": 7886} {"train_loss": -28.56418228149414, "global_step": 654584, "epoch": 7886} {"train_loss": -28.645034790039062, "global_step": 654585, "epoch": 7886} {"train_loss": -28.492338180541992, "global_step": 654586, "epoch": 7886} {"train_loss": -27.9998779296875, "global_step": 654587, "epoch": 7886} {"train_loss": -27.6015567779541, "global_step": 654588, "epoch": 7886} {"train_loss": -26.92974853515625, "global_step": 654589, "epoch": 7886} {"train_loss": -27.634429931640625, "global_step": 654590, "epoch": 7886} {"train_loss": -27.84833335876465, "global_step": 654591, "epoch": 7886} {"train_loss": -27.60147476196289, "global_step": 654592, "epoch": 7886} {"train_loss": -28.302764892578125, "global_step": 654593, "epoch": 7886} {"train_loss": -28.284448623657227, "global_step": 654594, "epoch": 7886} {"train_loss": -27.810888290405273, "global_step": 654595, "epoch": 7886} {"train_loss": -28.369760513305664, "global_step": 654596, "epoch": 7886} {"train_loss": -28.150049209594727, "global_step": 654597, "epoch": 7886} {"train_loss": -28.437591552734375, "global_step": 654598, "epoch": 7886} {"train_loss": -28.005706787109375, "global_step": 654599, "epoch": 7886} {"train_loss": -28.69002342224121, "global_step": 654600, "epoch": 7886} {"train_loss": -28.37933349609375, "global_step": 654601, "epoch": 7886} {"train_loss": -28.19784927368164, "global_step": 654602, "epoch": 7886} {"train_loss": -28.236791610717773, "global_step": 654603, "epoch": 7886} {"train_loss": -28.244577407836914, "global_step": 654604, "epoch": 7886} {"train_loss": -28.456274032592773, "global_step": 654605, "epoch": 7886} {"train_loss": -28.23233413696289, "global_step": 654606, "epoch": 7886} {"train_loss": -28.334644317626953, "global_step": 654607, "epoch": 7886} {"train_loss": -28.126317977905273, "global_step": 654608, "epoch": 7886} {"train_loss": -28.1739501953125, "global_step": 654609, "epoch": 7886} {"train_loss": -28.586233139038086, "global_step": 654610, "epoch": 7886} {"train_loss": -28.194067001342773, "global_step": 654611, "epoch": 7886} {"train_loss": -28.2873477935791, "global_step": 654612, "epoch": 7886} {"train_loss": -28.19586753845215, "global_step": 654613, "epoch": 7886} {"train_loss": -28.3104190826416, "global_step": 654614, "epoch": 7886} {"train_loss": -28.503311157226562, "global_step": 654615, "epoch": 7886} {"train_loss": -28.123291015625, "global_step": 654616, "epoch": 7886} {"train_loss": -28.33820152282715, "global_step": 654617, "epoch": 7886} {"train_loss": -28.610265731811523, "global_step": 654618, "epoch": 7886} {"train_loss": -28.457807540893555, "global_step": 654619, "epoch": 7886} {"train_loss": -28.26799300779779, "global_step": 654620, "epoch": 7886, "val_loss": 6731129.0} {"train_loss": -27.56475830078125, "global_step": 654621, "epoch": 7887} {"train_loss": -27.442615509033203, "global_step": 654622, "epoch": 7887} {"train_loss": -27.850479125976562, "global_step": 654623, "epoch": 7887} {"train_loss": -27.23463249206543, "global_step": 654624, "epoch": 7887} {"train_loss": -28.119293212890625, "global_step": 654625, "epoch": 7887} {"train_loss": -27.945775985717773, "global_step": 654626, "epoch": 7887} {"train_loss": -27.89801025390625, "global_step": 654627, "epoch": 7887} {"train_loss": -27.485034942626953, "global_step": 654628, "epoch": 7887} {"train_loss": -28.05243492126465, "global_step": 654629, "epoch": 7887} {"train_loss": -27.44073486328125, "global_step": 654630, "epoch": 7887} {"train_loss": -27.654043197631836, "global_step": 654631, "epoch": 7887} {"train_loss": -27.9764461517334, "global_step": 654632, "epoch": 7887} {"train_loss": -27.29966163635254, "global_step": 654633, "epoch": 7887} {"train_loss": -28.198410034179688, "global_step": 654634, "epoch": 7887} {"train_loss": -28.213186264038086, "global_step": 654635, "epoch": 7887} {"train_loss": -27.88237953186035, "global_step": 654636, "epoch": 7887} {"train_loss": -28.173620223999023, "global_step": 654637, "epoch": 7887} {"train_loss": -27.39337158203125, "global_step": 654638, "epoch": 7887} {"train_loss": -28.20187759399414, "global_step": 654639, "epoch": 7887} {"train_loss": -27.878143310546875, "global_step": 654640, "epoch": 7887} {"train_loss": -27.811853408813477, "global_step": 654641, "epoch": 7887} {"train_loss": -27.633275985717773, "global_step": 654642, "epoch": 7887} {"train_loss": -27.89444923400879, "global_step": 654643, "epoch": 7887} {"train_loss": -28.198902130126953, "global_step": 654644, "epoch": 7887} {"train_loss": -28.322118759155273, "global_step": 654645, "epoch": 7887} {"train_loss": -28.18073844909668, "global_step": 654646, "epoch": 7887} {"train_loss": -28.480817794799805, "global_step": 654647, "epoch": 7887} {"train_loss": -28.336063385009766, "global_step": 654648, "epoch": 7887} {"train_loss": -28.2774600982666, "global_step": 654649, "epoch": 7887} {"train_loss": -28.2125244140625, "global_step": 654650, "epoch": 7887} {"train_loss": -28.378698348999023, "global_step": 654651, "epoch": 7887} {"train_loss": -28.414737701416016, "global_step": 654652, "epoch": 7887} {"train_loss": -28.470569610595703, "global_step": 654653, "epoch": 7887} {"train_loss": -28.21343994140625, "global_step": 654654, "epoch": 7887} {"train_loss": -28.07318115234375, "global_step": 654655, "epoch": 7887} {"train_loss": -28.449142456054688, "global_step": 654656, "epoch": 7887} {"train_loss": -28.30986976623535, "global_step": 654657, "epoch": 7887} {"train_loss": -28.28525733947754, "global_step": 654658, "epoch": 7887} {"train_loss": -28.513874053955078, "global_step": 654659, "epoch": 7887} {"train_loss": -28.2545108795166, "global_step": 654660, "epoch": 7887} {"train_loss": -28.189966201782227, "global_step": 654661, "epoch": 7887} {"train_loss": -28.64435386657715, "global_step": 654662, "epoch": 7887} {"train_loss": -28.408666610717773, "global_step": 654663, "epoch": 7887} {"train_loss": -28.362287521362305, "global_step": 654664, "epoch": 7887} {"train_loss": -28.248565673828125, "global_step": 654665, "epoch": 7887} {"train_loss": -28.538455963134766, "global_step": 654666, "epoch": 7887} {"train_loss": -28.376317977905273, "global_step": 654667, "epoch": 7887} {"train_loss": -28.00469398498535, "global_step": 654668, "epoch": 7887} {"train_loss": -28.594945907592773, "global_step": 654669, "epoch": 7887} {"train_loss": -28.7701473236084, "global_step": 654670, "epoch": 7887} {"train_loss": -28.12965202331543, "global_step": 654671, "epoch": 7887} {"train_loss": -28.4027099609375, "global_step": 654672, "epoch": 7887} {"train_loss": -28.076745986938477, "global_step": 654673, "epoch": 7887} {"train_loss": -28.2961368560791, "global_step": 654674, "epoch": 7887} {"train_loss": -28.18695640563965, "global_step": 654675, "epoch": 7887} {"train_loss": -28.605976104736328, "global_step": 654676, "epoch": 7887} {"train_loss": -28.51557731628418, "global_step": 654677, "epoch": 7887} {"train_loss": -27.8945369720459, "global_step": 654678, "epoch": 7887} {"train_loss": -26.83485221862793, "global_step": 654679, "epoch": 7887} {"train_loss": -26.675220489501953, "global_step": 654680, "epoch": 7887} {"train_loss": -26.62567710876465, "global_step": 654681, "epoch": 7887} {"train_loss": -27.371606826782227, "global_step": 654682, "epoch": 7887} {"train_loss": -28.25558853149414, "global_step": 654683, "epoch": 7887} {"train_loss": -26.31257438659668, "global_step": 654684, "epoch": 7887} {"train_loss": -27.182357788085938, "global_step": 654685, "epoch": 7887} {"train_loss": -28.01190185546875, "global_step": 654686, "epoch": 7887} {"train_loss": -27.256275177001953, "global_step": 654687, "epoch": 7887} {"train_loss": -27.45789909362793, "global_step": 654688, "epoch": 7887} {"train_loss": -27.996084213256836, "global_step": 654689, "epoch": 7887} {"train_loss": -28.021841049194336, "global_step": 654690, "epoch": 7887} {"train_loss": -27.979089736938477, "global_step": 654691, "epoch": 7887} {"train_loss": -27.68379783630371, "global_step": 654692, "epoch": 7887} {"train_loss": -27.99785804748535, "global_step": 654693, "epoch": 7887} {"train_loss": -27.744871139526367, "global_step": 654694, "epoch": 7887} {"train_loss": -27.538244247436523, "global_step": 654695, "epoch": 7887} {"train_loss": -27.661340713500977, "global_step": 654696, "epoch": 7887} {"train_loss": -28.111469268798828, "global_step": 654697, "epoch": 7887} {"train_loss": -27.843191146850586, "global_step": 654698, "epoch": 7887} {"train_loss": -27.367328643798828, "global_step": 654699, "epoch": 7887} {"train_loss": -28.19483757019043, "global_step": 654700, "epoch": 7887} {"train_loss": -27.88520622253418, "global_step": 654701, "epoch": 7887} {"train_loss": -27.517927169799805, "global_step": 654702, "epoch": 7887} {"train_loss": -27.957641555602294, "global_step": 654703, "epoch": 7887, "val_loss": 6551149.0} {"train_loss": -27.65045738220215, "global_step": 654704, "epoch": 7888} {"train_loss": -27.7810115814209, "global_step": 654705, "epoch": 7888} {"train_loss": -27.67725944519043, "global_step": 654706, "epoch": 7888} {"train_loss": -28.06300163269043, "global_step": 654707, "epoch": 7888} {"train_loss": -27.3411865234375, "global_step": 654708, "epoch": 7888} {"train_loss": -27.517059326171875, "global_step": 654709, "epoch": 7888} {"train_loss": -27.83350944519043, "global_step": 654710, "epoch": 7888} {"train_loss": -27.85389518737793, "global_step": 654711, "epoch": 7888} {"train_loss": -27.963165283203125, "global_step": 654712, "epoch": 7888} {"train_loss": -28.16668701171875, "global_step": 654713, "epoch": 7888} {"train_loss": -27.872159957885742, "global_step": 654714, "epoch": 7888} {"train_loss": -27.8075008392334, "global_step": 654715, "epoch": 7888} {"train_loss": -28.1370792388916, "global_step": 654716, "epoch": 7888} {"train_loss": -28.135374069213867, "global_step": 654717, "epoch": 7888} {"train_loss": -28.245344161987305, "global_step": 654718, "epoch": 7888} {"train_loss": -28.310714721679688, "global_step": 654719, "epoch": 7888} {"train_loss": -27.596073150634766, "global_step": 654720, "epoch": 7888} {"train_loss": -28.226526260375977, "global_step": 654721, "epoch": 7888} {"train_loss": -27.820098876953125, "global_step": 654722, "epoch": 7888} {"train_loss": -27.846586227416992, "global_step": 654723, "epoch": 7888} {"train_loss": -28.188282012939453, "global_step": 654724, "epoch": 7888} {"train_loss": -28.543079376220703, "global_step": 654725, "epoch": 7888} {"train_loss": -28.2131404876709, "global_step": 654726, "epoch": 7888} {"train_loss": -28.377790451049805, "global_step": 654727, "epoch": 7888} {"train_loss": -28.301122665405273, "global_step": 654728, "epoch": 7888} {"train_loss": -28.218198776245117, "global_step": 654729, "epoch": 7888} {"train_loss": -28.262775421142578, "global_step": 654730, "epoch": 7888} {"train_loss": -28.1939754486084, "global_step": 654731, "epoch": 7888} {"train_loss": -28.32883644104004, "global_step": 654732, "epoch": 7888} {"train_loss": -28.332727432250977, "global_step": 654733, "epoch": 7888} {"train_loss": -28.33698844909668, "global_step": 654734, "epoch": 7888} {"train_loss": -28.365270614624023, "global_step": 654735, "epoch": 7888} {"train_loss": -28.438556671142578, "global_step": 654736, "epoch": 7888} {"train_loss": -28.286962509155273, "global_step": 654737, "epoch": 7888} {"train_loss": -28.388446807861328, "global_step": 654738, "epoch": 7888} {"train_loss": -28.4823055267334, "global_step": 654739, "epoch": 7888} {"train_loss": -28.753864288330078, "global_step": 654740, "epoch": 7888} {"train_loss": -28.65816307067871, "global_step": 654741, "epoch": 7888} {"train_loss": -28.405933380126953, "global_step": 654742, "epoch": 7888} {"train_loss": -28.954193115234375, "global_step": 654743, "epoch": 7888} {"train_loss": -28.831836700439453, "global_step": 654744, "epoch": 7888} {"train_loss": -28.21529197692871, "global_step": 654745, "epoch": 7888} {"train_loss": -28.346288681030273, "global_step": 654746, "epoch": 7888} {"train_loss": -28.57965087890625, "global_step": 654747, "epoch": 7888} {"train_loss": -28.742034912109375, "global_step": 654748, "epoch": 7888} {"train_loss": -28.7192440032959, "global_step": 654749, "epoch": 7888} {"train_loss": -28.790390014648438, "global_step": 654750, "epoch": 7888} {"train_loss": -28.081369400024414, "global_step": 654751, "epoch": 7888} {"train_loss": -28.4766845703125, "global_step": 654752, "epoch": 7888} {"train_loss": -28.64261245727539, "global_step": 654753, "epoch": 7888} {"train_loss": -28.613248825073242, "global_step": 654754, "epoch": 7888} {"train_loss": -28.528553009033203, "global_step": 654755, "epoch": 7888} {"train_loss": -28.0497989654541, "global_step": 654756, "epoch": 7888} {"train_loss": -28.182327270507812, "global_step": 654757, "epoch": 7888} {"train_loss": -28.483341217041016, "global_step": 654758, "epoch": 7888} {"train_loss": -28.265371322631836, "global_step": 654759, "epoch": 7888} {"train_loss": -28.092966079711914, "global_step": 654760, "epoch": 7888} {"train_loss": -28.31917381286621, "global_step": 654761, "epoch": 7888} {"train_loss": -28.36200523376465, "global_step": 654762, "epoch": 7888} {"train_loss": -28.203540802001953, "global_step": 654763, "epoch": 7888} {"train_loss": -28.59380531311035, "global_step": 654764, "epoch": 7888} {"train_loss": -28.4207706451416, "global_step": 654765, "epoch": 7888} {"train_loss": -28.418054580688477, "global_step": 654766, "epoch": 7888} {"train_loss": -28.461889266967773, "global_step": 654767, "epoch": 7888} {"train_loss": -28.553497314453125, "global_step": 654768, "epoch": 7888} {"train_loss": -28.43044090270996, "global_step": 654769, "epoch": 7888} {"train_loss": -28.59967613220215, "global_step": 654770, "epoch": 7888} {"train_loss": -28.754064559936523, "global_step": 654771, "epoch": 7888} {"train_loss": -28.303369522094727, "global_step": 654772, "epoch": 7888} {"train_loss": -28.461042404174805, "global_step": 654773, "epoch": 7888} {"train_loss": -28.474828720092773, "global_step": 654774, "epoch": 7888} {"train_loss": -28.4515323638916, "global_step": 654775, "epoch": 7888} {"train_loss": -28.323169708251953, "global_step": 654776, "epoch": 7888} {"train_loss": -28.513824462890625, "global_step": 654777, "epoch": 7888} {"train_loss": -28.452865600585938, "global_step": 654778, "epoch": 7888} {"train_loss": -28.392969131469727, "global_step": 654779, "epoch": 7888} {"train_loss": -28.30954360961914, "global_step": 654780, "epoch": 7888} {"train_loss": -28.394617080688477, "global_step": 654781, "epoch": 7888} {"train_loss": -28.33627700805664, "global_step": 654782, "epoch": 7888} {"train_loss": -28.30328369140625, "global_step": 654783, "epoch": 7888} {"train_loss": -29.098840713500977, "global_step": 654784, "epoch": 7888} {"train_loss": -28.583282470703125, "global_step": 654785, "epoch": 7888} {"train_loss": -28.329079524580255, "global_step": 654786, "epoch": 7888, "val_loss": 6626170.0} {"train_loss": -23.35634422302246, "global_step": 654787, "epoch": 7889} {"train_loss": -26.952295303344727, "global_step": 654788, "epoch": 7889} {"train_loss": -22.98750877380371, "global_step": 654789, "epoch": 7889} {"train_loss": -27.4448184967041, "global_step": 654790, "epoch": 7889} {"train_loss": -25.18617820739746, "global_step": 654791, "epoch": 7889} {"train_loss": -26.914426803588867, "global_step": 654792, "epoch": 7889} {"train_loss": -26.101110458374023, "global_step": 654793, "epoch": 7889} {"train_loss": -26.175745010375977, "global_step": 654794, "epoch": 7889} {"train_loss": -27.070837020874023, "global_step": 654795, "epoch": 7889} {"train_loss": -26.71211051940918, "global_step": 654796, "epoch": 7889} {"train_loss": -26.69341468811035, "global_step": 654797, "epoch": 7889} {"train_loss": -26.747100830078125, "global_step": 654798, "epoch": 7889} {"train_loss": -27.297998428344727, "global_step": 654799, "epoch": 7889} {"train_loss": -27.3113956451416, "global_step": 654800, "epoch": 7889} {"train_loss": -27.19171714782715, "global_step": 654801, "epoch": 7889} {"train_loss": -27.091333389282227, "global_step": 654802, "epoch": 7889} {"train_loss": -27.41205406188965, "global_step": 654803, "epoch": 7889} {"train_loss": -27.349966049194336, "global_step": 654804, "epoch": 7889} {"train_loss": -27.4932804107666, "global_step": 654805, "epoch": 7889} {"train_loss": -27.15628433227539, "global_step": 654806, "epoch": 7889} {"train_loss": -27.201948165893555, "global_step": 654807, "epoch": 7889} {"train_loss": -27.43833351135254, "global_step": 654808, "epoch": 7889} {"train_loss": -27.58021354675293, "global_step": 654809, "epoch": 7889} {"train_loss": -27.658315658569336, "global_step": 654810, "epoch": 7889} {"train_loss": -27.628015518188477, "global_step": 654811, "epoch": 7889} {"train_loss": -27.181598663330078, "global_step": 654812, "epoch": 7889} {"train_loss": -27.34917640686035, "global_step": 654813, "epoch": 7889} {"train_loss": -27.683866500854492, "global_step": 654814, "epoch": 7889} {"train_loss": -27.802978515625, "global_step": 654815, "epoch": 7889} {"train_loss": -27.610443115234375, "global_step": 654816, "epoch": 7889} {"train_loss": -27.982824325561523, "global_step": 654817, "epoch": 7889} {"train_loss": -27.858129501342773, "global_step": 654818, "epoch": 7889} {"train_loss": -27.602331161499023, "global_step": 654819, "epoch": 7889} {"train_loss": -28.25259780883789, "global_step": 654820, "epoch": 7889} {"train_loss": -27.714033126831055, "global_step": 654821, "epoch": 7889} {"train_loss": -27.65839958190918, "global_step": 654822, "epoch": 7889} {"train_loss": -28.212360382080078, "global_step": 654823, "epoch": 7889} {"train_loss": -27.815189361572266, "global_step": 654824, "epoch": 7889} {"train_loss": -27.850326538085938, "global_step": 654825, "epoch": 7889} {"train_loss": -28.114301681518555, "global_step": 654826, "epoch": 7889} {"train_loss": -28.061538696289062, "global_step": 654827, "epoch": 7889} {"train_loss": -28.186521530151367, "global_step": 654828, "epoch": 7889} {"train_loss": -28.153547286987305, "global_step": 654829, "epoch": 7889} {"train_loss": -28.196380615234375, "global_step": 654830, "epoch": 7889} {"train_loss": -28.113550186157227, "global_step": 654831, "epoch": 7889} {"train_loss": -28.294998168945312, "global_step": 654832, "epoch": 7889} {"train_loss": -28.131128311157227, "global_step": 654833, "epoch": 7889} {"train_loss": -28.253324508666992, "global_step": 654834, "epoch": 7889} {"train_loss": -27.9278564453125, "global_step": 654835, "epoch": 7889} {"train_loss": -28.045434951782227, "global_step": 654836, "epoch": 7889} {"train_loss": -28.09521484375, "global_step": 654837, "epoch": 7889} {"train_loss": -28.44734001159668, "global_step": 654838, "epoch": 7889} {"train_loss": -28.40073585510254, "global_step": 654839, "epoch": 7889} {"train_loss": -28.003128051757812, "global_step": 654840, "epoch": 7889} {"train_loss": -28.37481689453125, "global_step": 654841, "epoch": 7889} {"train_loss": -28.49904441833496, "global_step": 654842, "epoch": 7889} {"train_loss": -28.302831649780273, "global_step": 654843, "epoch": 7889} {"train_loss": -28.408411026000977, "global_step": 654844, "epoch": 7889} {"train_loss": -28.251935958862305, "global_step": 654845, "epoch": 7889} {"train_loss": -28.196887969970703, "global_step": 654846, "epoch": 7889} {"train_loss": -28.126440048217773, "global_step": 654847, "epoch": 7889} {"train_loss": -27.89580726623535, "global_step": 654848, "epoch": 7889} {"train_loss": -28.036121368408203, "global_step": 654849, "epoch": 7889} {"train_loss": -28.206073760986328, "global_step": 654850, "epoch": 7889} {"train_loss": -28.304611206054688, "global_step": 654851, "epoch": 7889} {"train_loss": -28.29274559020996, "global_step": 654852, "epoch": 7889} {"train_loss": -28.487812042236328, "global_step": 654853, "epoch": 7889} {"train_loss": -28.27326774597168, "global_step": 654854, "epoch": 7889} {"train_loss": -28.382110595703125, "global_step": 654855, "epoch": 7889} {"train_loss": -27.939804077148438, "global_step": 654856, "epoch": 7889} {"train_loss": -28.286823272705078, "global_step": 654857, "epoch": 7889} {"train_loss": -28.191450119018555, "global_step": 654858, "epoch": 7889} {"train_loss": -28.451940536499023, "global_step": 654859, "epoch": 7889} {"train_loss": -27.83133888244629, "global_step": 654860, "epoch": 7889} {"train_loss": -28.433584213256836, "global_step": 654861, "epoch": 7889} {"train_loss": -28.344482421875, "global_step": 654862, "epoch": 7889} {"train_loss": -28.311126708984375, "global_step": 654863, "epoch": 7889} {"train_loss": -28.303014755249023, "global_step": 654864, "epoch": 7889} {"train_loss": -28.55364990234375, "global_step": 654865, "epoch": 7889} {"train_loss": -28.051416397094727, "global_step": 654866, "epoch": 7889} {"train_loss": -28.390653610229492, "global_step": 654867, "epoch": 7889} {"train_loss": -28.294782638549805, "global_step": 654868, "epoch": 7889} {"train_loss": -27.68281736718603, "global_step": 654869, "epoch": 7889, "val_loss": 6628331.0} {"train_loss": -27.550617218017578, "global_step": 654870, "epoch": 7890} {"train_loss": -27.648468017578125, "global_step": 654871, "epoch": 7890} {"train_loss": -28.02520179748535, "global_step": 654872, "epoch": 7890} {"train_loss": -27.5325870513916, "global_step": 654873, "epoch": 7890} {"train_loss": -27.771276473999023, "global_step": 654874, "epoch": 7890} {"train_loss": -27.333032608032227, "global_step": 654875, "epoch": 7890} {"train_loss": -27.1779842376709, "global_step": 654876, "epoch": 7890} {"train_loss": -27.836334228515625, "global_step": 654877, "epoch": 7890} {"train_loss": -27.875274658203125, "global_step": 654878, "epoch": 7890} {"train_loss": -27.0877685546875, "global_step": 654879, "epoch": 7890} {"train_loss": -27.371633529663086, "global_step": 654880, "epoch": 7890} {"train_loss": -28.448816299438477, "global_step": 654881, "epoch": 7890} {"train_loss": -27.385717391967773, "global_step": 654882, "epoch": 7890} {"train_loss": -27.85028076171875, "global_step": 654883, "epoch": 7890} {"train_loss": -27.78147315979004, "global_step": 654884, "epoch": 7890} {"train_loss": -28.383352279663086, "global_step": 654885, "epoch": 7890} {"train_loss": -27.28232192993164, "global_step": 654886, "epoch": 7890} {"train_loss": -28.134796142578125, "global_step": 654887, "epoch": 7890} {"train_loss": -28.04237174987793, "global_step": 654888, "epoch": 7890} {"train_loss": -27.98377799987793, "global_step": 654889, "epoch": 7890} {"train_loss": -27.654788970947266, "global_step": 654890, "epoch": 7890} {"train_loss": -27.99891471862793, "global_step": 654891, "epoch": 7890} {"train_loss": -28.28535270690918, "global_step": 654892, "epoch": 7890} {"train_loss": -27.718244552612305, "global_step": 654893, "epoch": 7890} {"train_loss": -28.053146362304688, "global_step": 654894, "epoch": 7890} {"train_loss": -28.2578125, "global_step": 654895, "epoch": 7890} {"train_loss": -28.37590980529785, "global_step": 654896, "epoch": 7890} {"train_loss": -28.033536911010742, "global_step": 654897, "epoch": 7890} {"train_loss": -28.048709869384766, "global_step": 654898, "epoch": 7890} {"train_loss": -28.292966842651367, "global_step": 654899, "epoch": 7890} {"train_loss": -28.22786521911621, "global_step": 654900, "epoch": 7890} {"train_loss": -28.480375289916992, "global_step": 654901, "epoch": 7890} {"train_loss": -28.033071517944336, "global_step": 654902, "epoch": 7890} {"train_loss": -28.44716453552246, "global_step": 654903, "epoch": 7890} {"train_loss": -28.60243034362793, "global_step": 654904, "epoch": 7890} {"train_loss": -27.87578773498535, "global_step": 654905, "epoch": 7890} {"train_loss": -28.33976173400879, "global_step": 654906, "epoch": 7890} {"train_loss": -28.128890991210938, "global_step": 654907, "epoch": 7890} {"train_loss": -28.466604232788086, "global_step": 654908, "epoch": 7890} {"train_loss": -28.538959503173828, "global_step": 654909, "epoch": 7890} {"train_loss": -28.365095138549805, "global_step": 654910, "epoch": 7890} {"train_loss": -27.879236221313477, "global_step": 654911, "epoch": 7890} {"train_loss": -28.299230575561523, "global_step": 654912, "epoch": 7890} {"train_loss": -28.3983097076416, "global_step": 654913, "epoch": 7890} {"train_loss": -28.254566192626953, "global_step": 654914, "epoch": 7890} {"train_loss": -28.67875099182129, "global_step": 654915, "epoch": 7890} {"train_loss": -28.24015235900879, "global_step": 654916, "epoch": 7890} {"train_loss": -28.490467071533203, "global_step": 654917, "epoch": 7890} {"train_loss": -28.499265670776367, "global_step": 654918, "epoch": 7890} {"train_loss": -28.345905303955078, "global_step": 654919, "epoch": 7890} {"train_loss": -28.490930557250977, "global_step": 654920, "epoch": 7890} {"train_loss": -28.342639923095703, "global_step": 654921, "epoch": 7890} {"train_loss": -28.58038902282715, "global_step": 654922, "epoch": 7890} {"train_loss": -28.240097045898438, "global_step": 654923, "epoch": 7890} {"train_loss": -28.32132911682129, "global_step": 654924, "epoch": 7890} {"train_loss": -28.680139541625977, "global_step": 654925, "epoch": 7890} {"train_loss": -28.500354766845703, "global_step": 654926, "epoch": 7890} {"train_loss": -28.6939754486084, "global_step": 654927, "epoch": 7890} {"train_loss": -28.416433334350586, "global_step": 654928, "epoch": 7890} {"train_loss": -28.38520622253418, "global_step": 654929, "epoch": 7890} {"train_loss": -28.445178985595703, "global_step": 654930, "epoch": 7890} {"train_loss": -28.505420684814453, "global_step": 654931, "epoch": 7890} {"train_loss": -28.609771728515625, "global_step": 654932, "epoch": 7890} {"train_loss": -28.563196182250977, "global_step": 654933, "epoch": 7890} {"train_loss": -28.5589599609375, "global_step": 654934, "epoch": 7890} {"train_loss": -28.79958152770996, "global_step": 654935, "epoch": 7890} {"train_loss": -28.447113037109375, "global_step": 654936, "epoch": 7890} {"train_loss": -28.493783950805664, "global_step": 654937, "epoch": 7890} {"train_loss": -28.486371994018555, "global_step": 654938, "epoch": 7890} {"train_loss": -28.778547286987305, "global_step": 654939, "epoch": 7890} {"train_loss": -28.532989501953125, "global_step": 654940, "epoch": 7890} {"train_loss": -28.754926681518555, "global_step": 654941, "epoch": 7890} {"train_loss": -28.901159286499023, "global_step": 654942, "epoch": 7890} {"train_loss": -28.4215030670166, "global_step": 654943, "epoch": 7890} {"train_loss": -28.68894386291504, "global_step": 654944, "epoch": 7890} {"train_loss": -28.68271827697754, "global_step": 654945, "epoch": 7890} {"train_loss": -28.38361930847168, "global_step": 654946, "epoch": 7890} {"train_loss": -28.318693161010742, "global_step": 654947, "epoch": 7890} {"train_loss": -28.69598960876465, "global_step": 654948, "epoch": 7890} {"train_loss": -28.73890495300293, "global_step": 654949, "epoch": 7890} {"train_loss": -28.473987579345703, "global_step": 654950, "epoch": 7890} {"train_loss": -28.492456436157227, "global_step": 654951, "epoch": 7890} {"train_loss": -28.25199352402285, "global_step": 654952, "epoch": 7890, "val_loss": 6682157.0} {"train_loss": -27.881988525390625, "global_step": 654953, "epoch": 7891} {"train_loss": -26.43467140197754, "global_step": 654954, "epoch": 7891} {"train_loss": -26.77117347717285, "global_step": 654955, "epoch": 7891} {"train_loss": -27.202573776245117, "global_step": 654956, "epoch": 7891} {"train_loss": -27.410755157470703, "global_step": 654957, "epoch": 7891} {"train_loss": -27.497568130493164, "global_step": 654958, "epoch": 7891} {"train_loss": -27.57111930847168, "global_step": 654959, "epoch": 7891} {"train_loss": -27.67008399963379, "global_step": 654960, "epoch": 7891} {"train_loss": -26.919233322143555, "global_step": 654961, "epoch": 7891} {"train_loss": -27.85413932800293, "global_step": 654962, "epoch": 7891} {"train_loss": -27.909082412719727, "global_step": 654963, "epoch": 7891} {"train_loss": -27.355560302734375, "global_step": 654964, "epoch": 7891} {"train_loss": -27.482736587524414, "global_step": 654965, "epoch": 7891} {"train_loss": -27.713607788085938, "global_step": 654966, "epoch": 7891} {"train_loss": -27.491308212280273, "global_step": 654967, "epoch": 7891} {"train_loss": -27.636083602905273, "global_step": 654968, "epoch": 7891} {"train_loss": -27.873218536376953, "global_step": 654969, "epoch": 7891} {"train_loss": -28.204065322875977, "global_step": 654970, "epoch": 7891} {"train_loss": -27.92782974243164, "global_step": 654971, "epoch": 7891} {"train_loss": -27.69846534729004, "global_step": 654972, "epoch": 7891} {"train_loss": -27.917593002319336, "global_step": 654973, "epoch": 7891} {"train_loss": -27.933399200439453, "global_step": 654974, "epoch": 7891} {"train_loss": -28.0980281829834, "global_step": 654975, "epoch": 7891} {"train_loss": -28.15174674987793, "global_step": 654976, "epoch": 7891} {"train_loss": -27.819807052612305, "global_step": 654977, "epoch": 7891} {"train_loss": -27.907424926757812, "global_step": 654978, "epoch": 7891} {"train_loss": -28.351287841796875, "global_step": 654979, "epoch": 7891} {"train_loss": -28.252593994140625, "global_step": 654980, "epoch": 7891} {"train_loss": -28.31561851501465, "global_step": 654981, "epoch": 7891} {"train_loss": -28.02644157409668, "global_step": 654982, "epoch": 7891} {"train_loss": -28.422901153564453, "global_step": 654983, "epoch": 7891} {"train_loss": -27.988651275634766, "global_step": 654984, "epoch": 7891} {"train_loss": -28.087249755859375, "global_step": 654985, "epoch": 7891} {"train_loss": -28.242177963256836, "global_step": 654986, "epoch": 7891} {"train_loss": -28.309925079345703, "global_step": 654987, "epoch": 7891} {"train_loss": -28.566680908203125, "global_step": 654988, "epoch": 7891} {"train_loss": -28.304141998291016, "global_step": 654989, "epoch": 7891} {"train_loss": -28.616491317749023, "global_step": 654990, "epoch": 7891} {"train_loss": -28.133655548095703, "global_step": 654991, "epoch": 7891} {"train_loss": -28.22934913635254, "global_step": 654992, "epoch": 7891} {"train_loss": -28.219263076782227, "global_step": 654993, "epoch": 7891} {"train_loss": -28.323535919189453, "global_step": 654994, "epoch": 7891} {"train_loss": -28.429452896118164, "global_step": 654995, "epoch": 7891} {"train_loss": -28.589492797851562, "global_step": 654996, "epoch": 7891} {"train_loss": -28.461393356323242, "global_step": 654997, "epoch": 7891} {"train_loss": -28.543140411376953, "global_step": 654998, "epoch": 7891} {"train_loss": -28.343149185180664, "global_step": 654999, "epoch": 7891} {"train_loss": -28.078100204467773, "global_step": 655000, "epoch": 7891} {"train_loss": -27.9901180267334, "global_step": 655001, "epoch": 7891} {"train_loss": -28.836774826049805, "global_step": 655002, "epoch": 7891} {"train_loss": -28.771976470947266, "global_step": 655003, "epoch": 7891} {"train_loss": -28.7282657623291, "global_step": 655004, "epoch": 7891} {"train_loss": -28.642526626586914, "global_step": 655005, "epoch": 7891} {"train_loss": -28.5292911529541, "global_step": 655006, "epoch": 7891} {"train_loss": -28.532392501831055, "global_step": 655007, "epoch": 7891} {"train_loss": -28.644147872924805, "global_step": 655008, "epoch": 7891} {"train_loss": -28.525394439697266, "global_step": 655009, "epoch": 7891} {"train_loss": -28.282617568969727, "global_step": 655010, "epoch": 7891} {"train_loss": -28.56952476501465, "global_step": 655011, "epoch": 7891} {"train_loss": -28.50361442565918, "global_step": 655012, "epoch": 7891} {"train_loss": -28.4984188079834, "global_step": 655013, "epoch": 7891} {"train_loss": -28.81429100036621, "global_step": 655014, "epoch": 7891} {"train_loss": -28.626577377319336, "global_step": 655015, "epoch": 7891} {"train_loss": -28.332361221313477, "global_step": 655016, "epoch": 7891} {"train_loss": -28.42000389099121, "global_step": 655017, "epoch": 7891} {"train_loss": -28.5517635345459, "global_step": 655018, "epoch": 7891} {"train_loss": -28.25611686706543, "global_step": 655019, "epoch": 7891} {"train_loss": -28.236927032470703, "global_step": 655020, "epoch": 7891} {"train_loss": -28.505659103393555, "global_step": 655021, "epoch": 7891} {"train_loss": -28.778228759765625, "global_step": 655022, "epoch": 7891} {"train_loss": -27.940656661987305, "global_step": 655023, "epoch": 7891} {"train_loss": -28.61859130859375, "global_step": 655024, "epoch": 7891} {"train_loss": -28.38356590270996, "global_step": 655025, "epoch": 7891} {"train_loss": -28.430286407470703, "global_step": 655026, "epoch": 7891} {"train_loss": -28.31890869140625, "global_step": 655027, "epoch": 7891} {"train_loss": -28.610645294189453, "global_step": 655028, "epoch": 7891} {"train_loss": -28.276275634765625, "global_step": 655029, "epoch": 7891} {"train_loss": -28.5132999420166, "global_step": 655030, "epoch": 7891} {"train_loss": -27.984817504882812, "global_step": 655031, "epoch": 7891} {"train_loss": -27.75018310546875, "global_step": 655032, "epoch": 7891} {"train_loss": -28.07905387878418, "global_step": 655033, "epoch": 7891} {"train_loss": -27.207813262939453, "global_step": 655034, "epoch": 7891} {"train_loss": -28.09835852197854, "global_step": 655035, "epoch": 7891, "val_loss": 6671046.0} {"train_loss": -18.700284957885742, "global_step": 655036, "epoch": 7892} {"train_loss": -22.794864654541016, "global_step": 655037, "epoch": 7892} {"train_loss": -25.320737838745117, "global_step": 655038, "epoch": 7892} {"train_loss": -22.842721939086914, "global_step": 655039, "epoch": 7892} {"train_loss": -25.102218627929688, "global_step": 655040, "epoch": 7892} {"train_loss": -24.048093795776367, "global_step": 655041, "epoch": 7892} {"train_loss": -25.588125228881836, "global_step": 655042, "epoch": 7892} {"train_loss": -24.999013900756836, "global_step": 655043, "epoch": 7892} {"train_loss": -24.82167625427246, "global_step": 655044, "epoch": 7892} {"train_loss": -25.224451065063477, "global_step": 655045, "epoch": 7892} {"train_loss": -25.083425521850586, "global_step": 655046, "epoch": 7892} {"train_loss": -26.1252498626709, "global_step": 655047, "epoch": 7892} {"train_loss": -25.81622314453125, "global_step": 655048, "epoch": 7892} {"train_loss": -25.902271270751953, "global_step": 655049, "epoch": 7892} {"train_loss": -26.484521865844727, "global_step": 655050, "epoch": 7892} {"train_loss": -26.068159103393555, "global_step": 655051, "epoch": 7892} {"train_loss": -26.214574813842773, "global_step": 655052, "epoch": 7892} {"train_loss": -26.62643814086914, "global_step": 655053, "epoch": 7892} {"train_loss": -26.433719635009766, "global_step": 655054, "epoch": 7892} {"train_loss": -26.3006649017334, "global_step": 655055, "epoch": 7892} {"train_loss": -26.64599609375, "global_step": 655056, "epoch": 7892} {"train_loss": -26.743408203125, "global_step": 655057, "epoch": 7892} {"train_loss": -26.64520263671875, "global_step": 655058, "epoch": 7892} {"train_loss": -26.87444496154785, "global_step": 655059, "epoch": 7892} {"train_loss": -26.8143253326416, "global_step": 655060, "epoch": 7892} {"train_loss": -26.73904800415039, "global_step": 655061, "epoch": 7892} {"train_loss": -27.154733657836914, "global_step": 655062, "epoch": 7892} {"train_loss": -27.10340690612793, "global_step": 655063, "epoch": 7892} {"train_loss": -26.790735244750977, "global_step": 655064, "epoch": 7892} {"train_loss": -27.14400291442871, "global_step": 655065, "epoch": 7892} {"train_loss": -26.768115997314453, "global_step": 655066, "epoch": 7892} {"train_loss": -27.22694969177246, "global_step": 655067, "epoch": 7892} {"train_loss": -27.000280380249023, "global_step": 655068, "epoch": 7892} {"train_loss": -26.634389877319336, "global_step": 655069, "epoch": 7892} {"train_loss": -27.020872116088867, "global_step": 655070, "epoch": 7892} {"train_loss": -27.219022750854492, "global_step": 655071, "epoch": 7892} {"train_loss": -27.245508193969727, "global_step": 655072, "epoch": 7892} {"train_loss": -27.7745361328125, "global_step": 655073, "epoch": 7892} {"train_loss": -26.93012809753418, "global_step": 655074, "epoch": 7892} {"train_loss": -27.425683975219727, "global_step": 655075, "epoch": 7892} {"train_loss": -27.770002365112305, "global_step": 655076, "epoch": 7892} {"train_loss": -27.478748321533203, "global_step": 655077, "epoch": 7892} {"train_loss": -27.92193031311035, "global_step": 655078, "epoch": 7892} {"train_loss": -27.615711212158203, "global_step": 655079, "epoch": 7892} {"train_loss": -27.393817901611328, "global_step": 655080, "epoch": 7892} {"train_loss": -27.542280197143555, "global_step": 655081, "epoch": 7892} {"train_loss": -27.793594360351562, "global_step": 655082, "epoch": 7892} {"train_loss": -27.9008731842041, "global_step": 655083, "epoch": 7892} {"train_loss": -27.751142501831055, "global_step": 655084, "epoch": 7892} {"train_loss": -27.995847702026367, "global_step": 655085, "epoch": 7892} {"train_loss": -27.76002311706543, "global_step": 655086, "epoch": 7892} {"train_loss": -28.03316307067871, "global_step": 655087, "epoch": 7892} {"train_loss": -27.60706901550293, "global_step": 655088, "epoch": 7892} {"train_loss": -28.3270320892334, "global_step": 655089, "epoch": 7892} {"train_loss": -27.967060089111328, "global_step": 655090, "epoch": 7892} {"train_loss": -28.62354850769043, "global_step": 655091, "epoch": 7892} {"train_loss": -28.22711181640625, "global_step": 655092, "epoch": 7892} {"train_loss": -28.404645919799805, "global_step": 655093, "epoch": 7892} {"train_loss": -28.112110137939453, "global_step": 655094, "epoch": 7892} {"train_loss": -28.25642204284668, "global_step": 655095, "epoch": 7892} {"train_loss": -28.01795768737793, "global_step": 655096, "epoch": 7892} {"train_loss": -28.06561279296875, "global_step": 655097, "epoch": 7892} {"train_loss": -28.769567489624023, "global_step": 655098, "epoch": 7892} {"train_loss": -28.14719009399414, "global_step": 655099, "epoch": 7892} {"train_loss": -28.050628662109375, "global_step": 655100, "epoch": 7892} {"train_loss": -28.415821075439453, "global_step": 655101, "epoch": 7892} {"train_loss": -27.762861251831055, "global_step": 655102, "epoch": 7892} {"train_loss": -28.50070571899414, "global_step": 655103, "epoch": 7892} {"train_loss": -28.36187744140625, "global_step": 655104, "epoch": 7892} {"train_loss": -28.390201568603516, "global_step": 655105, "epoch": 7892} {"train_loss": -28.329858779907227, "global_step": 655106, "epoch": 7892} {"train_loss": -28.577056884765625, "global_step": 655107, "epoch": 7892} {"train_loss": -28.545822143554688, "global_step": 655108, "epoch": 7892} {"train_loss": -28.49725341796875, "global_step": 655109, "epoch": 7892} {"train_loss": -28.152387619018555, "global_step": 655110, "epoch": 7892} {"train_loss": -28.24798583984375, "global_step": 655111, "epoch": 7892} {"train_loss": -28.5958251953125, "global_step": 655112, "epoch": 7892} {"train_loss": -28.383752822875977, "global_step": 655113, "epoch": 7892} {"train_loss": -28.07795524597168, "global_step": 655114, "epoch": 7892} {"train_loss": -27.993488311767578, "global_step": 655115, "epoch": 7892} {"train_loss": -28.255859375, "global_step": 655116, "epoch": 7892} {"train_loss": -28.523120880126953, "global_step": 655117, "epoch": 7892} {"train_loss": -27.11649044450507, "global_step": 655118, "epoch": 7892, "val_loss": 6531960.0} {"train_loss": -28.119556427001953, "global_step": 655119, "epoch": 7893} {"train_loss": -28.149084091186523, "global_step": 655120, "epoch": 7893} {"train_loss": -28.251712799072266, "global_step": 655121, "epoch": 7893} {"train_loss": -28.412235260009766, "global_step": 655122, "epoch": 7893} {"train_loss": -28.271604537963867, "global_step": 655123, "epoch": 7893} {"train_loss": -28.414356231689453, "global_step": 655124, "epoch": 7893} {"train_loss": -28.31278419494629, "global_step": 655125, "epoch": 7893} {"train_loss": -28.07478141784668, "global_step": 655126, "epoch": 7893} {"train_loss": -28.37644386291504, "global_step": 655127, "epoch": 7893} {"train_loss": -28.404077529907227, "global_step": 655128, "epoch": 7893} {"train_loss": -28.23261833190918, "global_step": 655129, "epoch": 7893} {"train_loss": -28.222639083862305, "global_step": 655130, "epoch": 7893} {"train_loss": -28.281692504882812, "global_step": 655131, "epoch": 7893} {"train_loss": -28.41645622253418, "global_step": 655132, "epoch": 7893} {"train_loss": -28.454639434814453, "global_step": 655133, "epoch": 7893} {"train_loss": -28.038488388061523, "global_step": 655134, "epoch": 7893} {"train_loss": -28.38001823425293, "global_step": 655135, "epoch": 7893} {"train_loss": -28.0932559967041, "global_step": 655136, "epoch": 7893} {"train_loss": -28.339370727539062, "global_step": 655137, "epoch": 7893} {"train_loss": -28.534427642822266, "global_step": 655138, "epoch": 7893} {"train_loss": -28.41543960571289, "global_step": 655139, "epoch": 7893} {"train_loss": -28.349836349487305, "global_step": 655140, "epoch": 7893} {"train_loss": -28.464765548706055, "global_step": 655141, "epoch": 7893} {"train_loss": -28.281278610229492, "global_step": 655142, "epoch": 7893} {"train_loss": -28.689252853393555, "global_step": 655143, "epoch": 7893} {"train_loss": -28.573225021362305, "global_step": 655144, "epoch": 7893} {"train_loss": -28.714691162109375, "global_step": 655145, "epoch": 7893} {"train_loss": -28.42645263671875, "global_step": 655146, "epoch": 7893} {"train_loss": -28.474746704101562, "global_step": 655147, "epoch": 7893} {"train_loss": -28.349411010742188, "global_step": 655148, "epoch": 7893} {"train_loss": -28.7083740234375, "global_step": 655149, "epoch": 7893} {"train_loss": -28.581836700439453, "global_step": 655150, "epoch": 7893} {"train_loss": -28.220813751220703, "global_step": 655151, "epoch": 7893} {"train_loss": -28.201526641845703, "global_step": 655152, "epoch": 7893} {"train_loss": -28.29319190979004, "global_step": 655153, "epoch": 7893} {"train_loss": -28.299274444580078, "global_step": 655154, "epoch": 7893} {"train_loss": -28.301767349243164, "global_step": 655155, "epoch": 7893} {"train_loss": -28.403188705444336, "global_step": 655156, "epoch": 7893} {"train_loss": -28.44154167175293, "global_step": 655157, "epoch": 7893} {"train_loss": -28.485153198242188, "global_step": 655158, "epoch": 7893} {"train_loss": -27.597299575805664, "global_step": 655159, "epoch": 7893} {"train_loss": -27.8526554107666, "global_step": 655160, "epoch": 7893} {"train_loss": -27.33955192565918, "global_step": 655161, "epoch": 7893} {"train_loss": -27.886945724487305, "global_step": 655162, "epoch": 7893} {"train_loss": -28.271814346313477, "global_step": 655163, "epoch": 7893} {"train_loss": -27.8560733795166, "global_step": 655164, "epoch": 7893} {"train_loss": -27.934534072875977, "global_step": 655165, "epoch": 7893} {"train_loss": -28.31801414489746, "global_step": 655166, "epoch": 7893} {"train_loss": -27.929136276245117, "global_step": 655167, "epoch": 7893} {"train_loss": -28.08124351501465, "global_step": 655168, "epoch": 7893} {"train_loss": -28.095884323120117, "global_step": 655169, "epoch": 7893} {"train_loss": -28.255823135375977, "global_step": 655170, "epoch": 7893} {"train_loss": -27.86203956604004, "global_step": 655171, "epoch": 7893} {"train_loss": -28.426660537719727, "global_step": 655172, "epoch": 7893} {"train_loss": -28.348310470581055, "global_step": 655173, "epoch": 7893} {"train_loss": -28.51144790649414, "global_step": 655174, "epoch": 7893} {"train_loss": -28.672760009765625, "global_step": 655175, "epoch": 7893} {"train_loss": -28.217670440673828, "global_step": 655176, "epoch": 7893} {"train_loss": -28.300092697143555, "global_step": 655177, "epoch": 7893} {"train_loss": -27.98343849182129, "global_step": 655178, "epoch": 7893} {"train_loss": -28.312631607055664, "global_step": 655179, "epoch": 7893} {"train_loss": -28.397235870361328, "global_step": 655180, "epoch": 7893} {"train_loss": -28.236896514892578, "global_step": 655181, "epoch": 7893} {"train_loss": -28.451135635375977, "global_step": 655182, "epoch": 7893} {"train_loss": -28.416824340820312, "global_step": 655183, "epoch": 7893} {"train_loss": -28.69814109802246, "global_step": 655184, "epoch": 7893} {"train_loss": -28.371509552001953, "global_step": 655185, "epoch": 7893} {"train_loss": -28.56463623046875, "global_step": 655186, "epoch": 7893} {"train_loss": -28.255542755126953, "global_step": 655187, "epoch": 7893} {"train_loss": -28.190515518188477, "global_step": 655188, "epoch": 7893} {"train_loss": -28.233312606811523, "global_step": 655189, "epoch": 7893} {"train_loss": -28.415761947631836, "global_step": 655190, "epoch": 7893} {"train_loss": -28.33330726623535, "global_step": 655191, "epoch": 7893} {"train_loss": -28.332855224609375, "global_step": 655192, "epoch": 7893} {"train_loss": -28.462127685546875, "global_step": 655193, "epoch": 7893} {"train_loss": -28.254175186157227, "global_step": 655194, "epoch": 7893} {"train_loss": -28.410205841064453, "global_step": 655195, "epoch": 7893} {"train_loss": -27.92975425720215, "global_step": 655196, "epoch": 7893} {"train_loss": -28.003278732299805, "global_step": 655197, "epoch": 7893} {"train_loss": -28.426380157470703, "global_step": 655198, "epoch": 7893} {"train_loss": -28.41522789001465, "global_step": 655199, "epoch": 7893} {"train_loss": -28.622007369995117, "global_step": 655200, "epoch": 7893} {"train_loss": -28.312091298850184, "global_step": 655201, "epoch": 7893, "val_loss": 6624106.0} {"train_loss": -25.584367752075195, "global_step": 655202, "epoch": 7894} {"train_loss": -26.734359741210938, "global_step": 655203, "epoch": 7894} {"train_loss": -26.732669830322266, "global_step": 655204, "epoch": 7894} {"train_loss": -26.515430450439453, "global_step": 655205, "epoch": 7894} {"train_loss": -27.3792724609375, "global_step": 655206, "epoch": 7894} {"train_loss": -27.05225944519043, "global_step": 655207, "epoch": 7894} {"train_loss": -27.2631893157959, "global_step": 655208, "epoch": 7894} {"train_loss": -27.927160263061523, "global_step": 655209, "epoch": 7894} {"train_loss": -27.32330894470215, "global_step": 655210, "epoch": 7894} {"train_loss": -27.657880783081055, "global_step": 655211, "epoch": 7894} {"train_loss": -27.719940185546875, "global_step": 655212, "epoch": 7894} {"train_loss": -27.323719024658203, "global_step": 655213, "epoch": 7894} {"train_loss": -28.18573570251465, "global_step": 655214, "epoch": 7894} {"train_loss": -27.867767333984375, "global_step": 655215, "epoch": 7894} {"train_loss": -27.36728858947754, "global_step": 655216, "epoch": 7894} {"train_loss": -27.77906608581543, "global_step": 655217, "epoch": 7894} {"train_loss": -27.8801326751709, "global_step": 655218, "epoch": 7894} {"train_loss": -27.84907341003418, "global_step": 655219, "epoch": 7894} {"train_loss": -27.412647247314453, "global_step": 655220, "epoch": 7894} {"train_loss": -27.942108154296875, "global_step": 655221, "epoch": 7894} {"train_loss": -27.806913375854492, "global_step": 655222, "epoch": 7894} {"train_loss": -27.6514892578125, "global_step": 655223, "epoch": 7894} {"train_loss": -27.962549209594727, "global_step": 655224, "epoch": 7894} {"train_loss": -28.0450439453125, "global_step": 655225, "epoch": 7894} {"train_loss": -27.883502960205078, "global_step": 655226, "epoch": 7894} {"train_loss": -27.808013916015625, "global_step": 655227, "epoch": 7894} {"train_loss": -28.083526611328125, "global_step": 655228, "epoch": 7894} {"train_loss": -28.134862899780273, "global_step": 655229, "epoch": 7894} {"train_loss": -27.97516441345215, "global_step": 655230, "epoch": 7894} {"train_loss": -28.32275390625, "global_step": 655231, "epoch": 7894} {"train_loss": -28.09061622619629, "global_step": 655232, "epoch": 7894} {"train_loss": -28.118854522705078, "global_step": 655233, "epoch": 7894} {"train_loss": -28.025320053100586, "global_step": 655234, "epoch": 7894} {"train_loss": -28.02266502380371, "global_step": 655235, "epoch": 7894} {"train_loss": -28.5671443939209, "global_step": 655236, "epoch": 7894} {"train_loss": -27.94428062438965, "global_step": 655237, "epoch": 7894} {"train_loss": -28.115835189819336, "global_step": 655238, "epoch": 7894} {"train_loss": -28.5878849029541, "global_step": 655239, "epoch": 7894} {"train_loss": -28.20195960998535, "global_step": 655240, "epoch": 7894} {"train_loss": -28.401199340820312, "global_step": 655241, "epoch": 7894} {"train_loss": -27.91936683654785, "global_step": 655242, "epoch": 7894} {"train_loss": -28.193273544311523, "global_step": 655243, "epoch": 7894} {"train_loss": -28.472997665405273, "global_step": 655244, "epoch": 7894} {"train_loss": -28.51228141784668, "global_step": 655245, "epoch": 7894} {"train_loss": -28.085968017578125, "global_step": 655246, "epoch": 7894} {"train_loss": -28.13431739807129, "global_step": 655247, "epoch": 7894} {"train_loss": -28.262418746948242, "global_step": 655248, "epoch": 7894} {"train_loss": -28.093399047851562, "global_step": 655249, "epoch": 7894} {"train_loss": -28.073022842407227, "global_step": 655250, "epoch": 7894} {"train_loss": -28.606536865234375, "global_step": 655251, "epoch": 7894} {"train_loss": -27.9300594329834, "global_step": 655252, "epoch": 7894} {"train_loss": -28.09488296508789, "global_step": 655253, "epoch": 7894} {"train_loss": -28.071155548095703, "global_step": 655254, "epoch": 7894} {"train_loss": -28.112873077392578, "global_step": 655255, "epoch": 7894} {"train_loss": -28.461591720581055, "global_step": 655256, "epoch": 7894} {"train_loss": -28.26337242126465, "global_step": 655257, "epoch": 7894} {"train_loss": -28.079130172729492, "global_step": 655258, "epoch": 7894} {"train_loss": -28.415618896484375, "global_step": 655259, "epoch": 7894} {"train_loss": -28.07612419128418, "global_step": 655260, "epoch": 7894} {"train_loss": -27.92606544494629, "global_step": 655261, "epoch": 7894} {"train_loss": -28.121240615844727, "global_step": 655262, "epoch": 7894} {"train_loss": -28.33966636657715, "global_step": 655263, "epoch": 7894} {"train_loss": -28.233121871948242, "global_step": 655264, "epoch": 7894} {"train_loss": -28.5051326751709, "global_step": 655265, "epoch": 7894} {"train_loss": -28.304899215698242, "global_step": 655266, "epoch": 7894} {"train_loss": -28.559579849243164, "global_step": 655267, "epoch": 7894} {"train_loss": -28.333566665649414, "global_step": 655268, "epoch": 7894} {"train_loss": -28.736026763916016, "global_step": 655269, "epoch": 7894} {"train_loss": -28.107791900634766, "global_step": 655270, "epoch": 7894} {"train_loss": -28.550561904907227, "global_step": 655271, "epoch": 7894} {"train_loss": -28.541854858398438, "global_step": 655272, "epoch": 7894} {"train_loss": -28.417083740234375, "global_step": 655273, "epoch": 7894} {"train_loss": -28.299535751342773, "global_step": 655274, "epoch": 7894} {"train_loss": -28.73786735534668, "global_step": 655275, "epoch": 7894} {"train_loss": -28.555896759033203, "global_step": 655276, "epoch": 7894} {"train_loss": -28.252704620361328, "global_step": 655277, "epoch": 7894} {"train_loss": -28.52923011779785, "global_step": 655278, "epoch": 7894} {"train_loss": -28.22151756286621, "global_step": 655279, "epoch": 7894} {"train_loss": -28.551700592041016, "global_step": 655280, "epoch": 7894} {"train_loss": -28.503942489624023, "global_step": 655281, "epoch": 7894} {"train_loss": -28.463911056518555, "global_step": 655282, "epoch": 7894} {"train_loss": -28.39289665222168, "global_step": 655283, "epoch": 7894} {"train_loss": -28.04664090168045, "global_step": 655284, "epoch": 7894, "val_loss": 6630153.5} {"train_loss": -27.206756591796875, "global_step": 655285, "epoch": 7895} {"train_loss": -28.09146499633789, "global_step": 655286, "epoch": 7895} {"train_loss": -27.327695846557617, "global_step": 655287, "epoch": 7895} {"train_loss": -26.007863998413086, "global_step": 655288, "epoch": 7895} {"train_loss": -27.23542594909668, "global_step": 655289, "epoch": 7895} {"train_loss": -27.660425186157227, "global_step": 655290, "epoch": 7895} {"train_loss": -27.41013526916504, "global_step": 655291, "epoch": 7895} {"train_loss": -27.215198516845703, "global_step": 655292, "epoch": 7895} {"train_loss": -27.84478187561035, "global_step": 655293, "epoch": 7895} {"train_loss": -27.74275016784668, "global_step": 655294, "epoch": 7895} {"train_loss": -27.90436363220215, "global_step": 655295, "epoch": 7895} {"train_loss": -27.892581939697266, "global_step": 655296, "epoch": 7895} {"train_loss": -28.01997184753418, "global_step": 655297, "epoch": 7895} {"train_loss": -27.79277992248535, "global_step": 655298, "epoch": 7895} {"train_loss": -27.940053939819336, "global_step": 655299, "epoch": 7895} {"train_loss": -28.35823631286621, "global_step": 655300, "epoch": 7895} {"train_loss": -28.210214614868164, "global_step": 655301, "epoch": 7895} {"train_loss": -27.98882484436035, "global_step": 655302, "epoch": 7895} {"train_loss": -27.693374633789062, "global_step": 655303, "epoch": 7895} {"train_loss": -28.110143661499023, "global_step": 655304, "epoch": 7895} {"train_loss": -28.25250244140625, "global_step": 655305, "epoch": 7895} {"train_loss": -27.923553466796875, "global_step": 655306, "epoch": 7895} {"train_loss": -28.0389461517334, "global_step": 655307, "epoch": 7895} {"train_loss": -27.949691772460938, "global_step": 655308, "epoch": 7895} {"train_loss": -28.3169002532959, "global_step": 655309, "epoch": 7895} {"train_loss": -28.15939712524414, "global_step": 655310, "epoch": 7895} {"train_loss": -28.372425079345703, "global_step": 655311, "epoch": 7895} {"train_loss": -28.267974853515625, "global_step": 655312, "epoch": 7895} {"train_loss": -28.31622314453125, "global_step": 655313, "epoch": 7895} {"train_loss": -28.44191551208496, "global_step": 655314, "epoch": 7895} {"train_loss": -28.11435317993164, "global_step": 655315, "epoch": 7895} {"train_loss": -28.278573989868164, "global_step": 655316, "epoch": 7895} {"train_loss": -28.2735538482666, "global_step": 655317, "epoch": 7895} {"train_loss": -28.463455200195312, "global_step": 655318, "epoch": 7895} {"train_loss": -27.985082626342773, "global_step": 655319, "epoch": 7895} {"train_loss": -28.0244140625, "global_step": 655320, "epoch": 7895} {"train_loss": -28.17182731628418, "global_step": 655321, "epoch": 7895} {"train_loss": -28.664106369018555, "global_step": 655322, "epoch": 7895} {"train_loss": -28.240400314331055, "global_step": 655323, "epoch": 7895} {"train_loss": -28.317951202392578, "global_step": 655324, "epoch": 7895} {"train_loss": -28.249378204345703, "global_step": 655325, "epoch": 7895} {"train_loss": -28.47791862487793, "global_step": 655326, "epoch": 7895} {"train_loss": -28.224096298217773, "global_step": 655327, "epoch": 7895} {"train_loss": -27.988876342773438, "global_step": 655328, "epoch": 7895} {"train_loss": -28.077545166015625, "global_step": 655329, "epoch": 7895} {"train_loss": -28.889867782592773, "global_step": 655330, "epoch": 7895} {"train_loss": -28.228469848632812, "global_step": 655331, "epoch": 7895} {"train_loss": -28.35920524597168, "global_step": 655332, "epoch": 7895} {"train_loss": -28.610448837280273, "global_step": 655333, "epoch": 7895} {"train_loss": -28.337539672851562, "global_step": 655334, "epoch": 7895} {"train_loss": -28.76883888244629, "global_step": 655335, "epoch": 7895} {"train_loss": -28.615478515625, "global_step": 655336, "epoch": 7895} {"train_loss": -28.65386962890625, "global_step": 655337, "epoch": 7895} {"train_loss": -28.79105567932129, "global_step": 655338, "epoch": 7895} {"train_loss": -28.48968505859375, "global_step": 655339, "epoch": 7895} {"train_loss": -28.21125602722168, "global_step": 655340, "epoch": 7895} {"train_loss": -28.46047019958496, "global_step": 655341, "epoch": 7895} {"train_loss": -28.423080444335938, "global_step": 655342, "epoch": 7895} {"train_loss": -28.789203643798828, "global_step": 655343, "epoch": 7895} {"train_loss": -28.3238468170166, "global_step": 655344, "epoch": 7895} {"train_loss": -28.429330825805664, "global_step": 655345, "epoch": 7895} {"train_loss": -27.597766876220703, "global_step": 655346, "epoch": 7895} {"train_loss": -27.415246963500977, "global_step": 655347, "epoch": 7895} {"train_loss": -27.936429977416992, "global_step": 655348, "epoch": 7895} {"train_loss": -28.5933895111084, "global_step": 655349, "epoch": 7895} {"train_loss": -28.174360275268555, "global_step": 655350, "epoch": 7895} {"train_loss": -28.232166290283203, "global_step": 655351, "epoch": 7895} {"train_loss": -27.918750762939453, "global_step": 655352, "epoch": 7895} {"train_loss": -27.855859756469727, "global_step": 655353, "epoch": 7895} {"train_loss": -28.295944213867188, "global_step": 655354, "epoch": 7895} {"train_loss": -28.195581436157227, "global_step": 655355, "epoch": 7895} {"train_loss": -28.16621208190918, "global_step": 655356, "epoch": 7895} {"train_loss": -28.808212280273438, "global_step": 655357, "epoch": 7895} {"train_loss": -28.452001571655273, "global_step": 655358, "epoch": 7895} {"train_loss": -28.2533016204834, "global_step": 655359, "epoch": 7895} {"train_loss": -28.574237823486328, "global_step": 655360, "epoch": 7895} {"train_loss": -28.364501953125, "global_step": 655361, "epoch": 7895} {"train_loss": -28.657155990600586, "global_step": 655362, "epoch": 7895} {"train_loss": -28.241199493408203, "global_step": 655363, "epoch": 7895} {"train_loss": -28.30755043029785, "global_step": 655364, "epoch": 7895} {"train_loss": -28.5992488861084, "global_step": 655365, "epoch": 7895} {"train_loss": -28.50296974182129, "global_step": 655366, "epoch": 7895} {"train_loss": -28.16591366227851, "global_step": 655367, "epoch": 7895, "val_loss": 6679579.0} {"train_loss": -27.467695236206055, "global_step": 655368, "epoch": 7896} {"train_loss": -28.173948287963867, "global_step": 655369, "epoch": 7896} {"train_loss": -27.765079498291016, "global_step": 655370, "epoch": 7896} {"train_loss": -27.417150497436523, "global_step": 655371, "epoch": 7896} {"train_loss": -27.941083908081055, "global_step": 655372, "epoch": 7896} {"train_loss": -27.990264892578125, "global_step": 655373, "epoch": 7896} {"train_loss": -27.78803062438965, "global_step": 655374, "epoch": 7896} {"train_loss": -28.269582748413086, "global_step": 655375, "epoch": 7896} {"train_loss": -27.94839859008789, "global_step": 655376, "epoch": 7896} {"train_loss": -27.928617477416992, "global_step": 655377, "epoch": 7896} {"train_loss": -28.052875518798828, "global_step": 655378, "epoch": 7896} {"train_loss": -27.89849281311035, "global_step": 655379, "epoch": 7896} {"train_loss": -28.307294845581055, "global_step": 655380, "epoch": 7896} {"train_loss": -27.91974449157715, "global_step": 655381, "epoch": 7896} {"train_loss": -28.239261627197266, "global_step": 655382, "epoch": 7896} {"train_loss": -28.077911376953125, "global_step": 655383, "epoch": 7896} {"train_loss": -28.08298683166504, "global_step": 655384, "epoch": 7896} {"train_loss": -27.843652725219727, "global_step": 655385, "epoch": 7896} {"train_loss": -28.062780380249023, "global_step": 655386, "epoch": 7896} {"train_loss": -28.039905548095703, "global_step": 655387, "epoch": 7896} {"train_loss": -28.3772029876709, "global_step": 655388, "epoch": 7896} {"train_loss": -28.00575065612793, "global_step": 655389, "epoch": 7896} {"train_loss": -28.164350509643555, "global_step": 655390, "epoch": 7896} {"train_loss": -28.10934829711914, "global_step": 655391, "epoch": 7896} {"train_loss": -28.10772705078125, "global_step": 655392, "epoch": 7896} {"train_loss": -28.210412979125977, "global_step": 655393, "epoch": 7896} {"train_loss": -28.496234893798828, "global_step": 655394, "epoch": 7896} {"train_loss": -28.11370277404785, "global_step": 655395, "epoch": 7896} {"train_loss": -28.28078269958496, "global_step": 655396, "epoch": 7896} {"train_loss": -28.662988662719727, "global_step": 655397, "epoch": 7896} {"train_loss": -28.27880859375, "global_step": 655398, "epoch": 7896} {"train_loss": -27.901037216186523, "global_step": 655399, "epoch": 7896} {"train_loss": -28.097442626953125, "global_step": 655400, "epoch": 7896} {"train_loss": -28.499303817749023, "global_step": 655401, "epoch": 7896} {"train_loss": -28.551136016845703, "global_step": 655402, "epoch": 7896} {"train_loss": -28.4532413482666, "global_step": 655403, "epoch": 7896} {"train_loss": -28.152456283569336, "global_step": 655404, "epoch": 7896} {"train_loss": -28.330732345581055, "global_step": 655405, "epoch": 7896} {"train_loss": -28.587482452392578, "global_step": 655406, "epoch": 7896} {"train_loss": -28.43316650390625, "global_step": 655407, "epoch": 7896} {"train_loss": -28.547744750976562, "global_step": 655408, "epoch": 7896} {"train_loss": -28.645954132080078, "global_step": 655409, "epoch": 7896} {"train_loss": -28.455814361572266, "global_step": 655410, "epoch": 7896} {"train_loss": -28.185272216796875, "global_step": 655411, "epoch": 7896} {"train_loss": -28.779010772705078, "global_step": 655412, "epoch": 7896} {"train_loss": -28.5902099609375, "global_step": 655413, "epoch": 7896} {"train_loss": -28.00275230407715, "global_step": 655414, "epoch": 7896} {"train_loss": -28.014883041381836, "global_step": 655415, "epoch": 7896} {"train_loss": -28.815235137939453, "global_step": 655416, "epoch": 7896} {"train_loss": -28.530811309814453, "global_step": 655417, "epoch": 7896} {"train_loss": -28.20928955078125, "global_step": 655418, "epoch": 7896} {"train_loss": -28.63425064086914, "global_step": 655419, "epoch": 7896} {"train_loss": -28.267446517944336, "global_step": 655420, "epoch": 7896} {"train_loss": -28.297956466674805, "global_step": 655421, "epoch": 7896} {"train_loss": -28.214191436767578, "global_step": 655422, "epoch": 7896} {"train_loss": -27.91786003112793, "global_step": 655423, "epoch": 7896} {"train_loss": -28.958038330078125, "global_step": 655424, "epoch": 7896} {"train_loss": -28.310754776000977, "global_step": 655425, "epoch": 7896} {"train_loss": -27.866498947143555, "global_step": 655426, "epoch": 7896} {"train_loss": -28.4765567779541, "global_step": 655427, "epoch": 7896} {"train_loss": -28.19644546508789, "global_step": 655428, "epoch": 7896} {"train_loss": -28.338703155517578, "global_step": 655429, "epoch": 7896} {"train_loss": -28.22132682800293, "global_step": 655430, "epoch": 7896} {"train_loss": -28.138431549072266, "global_step": 655431, "epoch": 7896} {"train_loss": -28.69974136352539, "global_step": 655432, "epoch": 7896} {"train_loss": -28.050046920776367, "global_step": 655433, "epoch": 7896} {"train_loss": -28.5782527923584, "global_step": 655434, "epoch": 7896} {"train_loss": -28.769994735717773, "global_step": 655435, "epoch": 7896} {"train_loss": -28.1048583984375, "global_step": 655436, "epoch": 7896} {"train_loss": -28.422683715820312, "global_step": 655437, "epoch": 7896} {"train_loss": -27.993000030517578, "global_step": 655438, "epoch": 7896} {"train_loss": -28.582019805908203, "global_step": 655439, "epoch": 7896} {"train_loss": -28.439268112182617, "global_step": 655440, "epoch": 7896} {"train_loss": -28.089513778686523, "global_step": 655441, "epoch": 7896} {"train_loss": -28.34613609313965, "global_step": 655442, "epoch": 7896} {"train_loss": -28.512039184570312, "global_step": 655443, "epoch": 7896} {"train_loss": -28.08344078063965, "global_step": 655444, "epoch": 7896} {"train_loss": -28.50335121154785, "global_step": 655445, "epoch": 7896} {"train_loss": -28.44693946838379, "global_step": 655446, "epoch": 7896} {"train_loss": -28.311201095581055, "global_step": 655447, "epoch": 7896} {"train_loss": -28.761198043823242, "global_step": 655448, "epoch": 7896} {"train_loss": -28.758100509643555, "global_step": 655449, "epoch": 7896} {"train_loss": -28.263312052531415, "global_step": 655450, "epoch": 7896, "val_loss": 6711651.0} {"train_loss": -27.3115177154541, "global_step": 655451, "epoch": 7897} {"train_loss": -27.097150802612305, "global_step": 655452, "epoch": 7897} {"train_loss": -26.916839599609375, "global_step": 655453, "epoch": 7897} {"train_loss": -27.454259872436523, "global_step": 655454, "epoch": 7897} {"train_loss": -27.695486068725586, "global_step": 655455, "epoch": 7897} {"train_loss": -27.80329704284668, "global_step": 655456, "epoch": 7897} {"train_loss": -26.595447540283203, "global_step": 655457, "epoch": 7897} {"train_loss": -27.2509708404541, "global_step": 655458, "epoch": 7897} {"train_loss": -27.470630645751953, "global_step": 655459, "epoch": 7897} {"train_loss": -27.4700984954834, "global_step": 655460, "epoch": 7897} {"train_loss": -27.05368423461914, "global_step": 655461, "epoch": 7897} {"train_loss": -27.55265235900879, "global_step": 655462, "epoch": 7897} {"train_loss": -27.25882911682129, "global_step": 655463, "epoch": 7897} {"train_loss": -27.797754287719727, "global_step": 655464, "epoch": 7897} {"train_loss": -27.21087074279785, "global_step": 655465, "epoch": 7897} {"train_loss": -27.56821632385254, "global_step": 655466, "epoch": 7897} {"train_loss": -27.570178985595703, "global_step": 655467, "epoch": 7897} {"train_loss": -28.106109619140625, "global_step": 655468, "epoch": 7897} {"train_loss": -27.717321395874023, "global_step": 655469, "epoch": 7897} {"train_loss": -27.842391967773438, "global_step": 655470, "epoch": 7897} {"train_loss": -27.70350456237793, "global_step": 655471, "epoch": 7897} {"train_loss": -26.330785751342773, "global_step": 655472, "epoch": 7897} {"train_loss": -27.991413116455078, "global_step": 655473, "epoch": 7897} {"train_loss": -27.946603775024414, "global_step": 655474, "epoch": 7897} {"train_loss": -28.0031681060791, "global_step": 655475, "epoch": 7897} {"train_loss": -28.037450790405273, "global_step": 655476, "epoch": 7897} {"train_loss": -27.77650260925293, "global_step": 655477, "epoch": 7897} {"train_loss": -27.487829208374023, "global_step": 655478, "epoch": 7897} {"train_loss": -27.39454460144043, "global_step": 655479, "epoch": 7897} {"train_loss": -27.93729019165039, "global_step": 655480, "epoch": 7897} {"train_loss": -27.96723747253418, "global_step": 655481, "epoch": 7897} {"train_loss": -28.03321647644043, "global_step": 655482, "epoch": 7897} {"train_loss": -27.73337745666504, "global_step": 655483, "epoch": 7897} {"train_loss": -27.923925399780273, "global_step": 655484, "epoch": 7897} {"train_loss": -28.14930534362793, "global_step": 655485, "epoch": 7897} {"train_loss": -27.7523193359375, "global_step": 655486, "epoch": 7897} {"train_loss": -28.436697006225586, "global_step": 655487, "epoch": 7897} {"train_loss": -28.045801162719727, "global_step": 655488, "epoch": 7897} {"train_loss": -28.16041374206543, "global_step": 655489, "epoch": 7897} {"train_loss": -27.8884334564209, "global_step": 655490, "epoch": 7897} {"train_loss": -28.325946807861328, "global_step": 655491, "epoch": 7897} {"train_loss": -28.05228614807129, "global_step": 655492, "epoch": 7897} {"train_loss": -28.26116943359375, "global_step": 655493, "epoch": 7897} {"train_loss": -27.717376708984375, "global_step": 655494, "epoch": 7897} {"train_loss": -28.3752384185791, "global_step": 655495, "epoch": 7897} {"train_loss": -27.958051681518555, "global_step": 655496, "epoch": 7897} {"train_loss": -28.318592071533203, "global_step": 655497, "epoch": 7897} {"train_loss": -28.026737213134766, "global_step": 655498, "epoch": 7897} {"train_loss": -28.272016525268555, "global_step": 655499, "epoch": 7897} {"train_loss": -27.95654296875, "global_step": 655500, "epoch": 7897} {"train_loss": -28.331037521362305, "global_step": 655501, "epoch": 7897} {"train_loss": -28.29511070251465, "global_step": 655502, "epoch": 7897} {"train_loss": -28.473066329956055, "global_step": 655503, "epoch": 7897} {"train_loss": -28.116376876831055, "global_step": 655504, "epoch": 7897} {"train_loss": -28.4182186126709, "global_step": 655505, "epoch": 7897} {"train_loss": -28.300195693969727, "global_step": 655506, "epoch": 7897} {"train_loss": -28.33074378967285, "global_step": 655507, "epoch": 7897} {"train_loss": -28.47991943359375, "global_step": 655508, "epoch": 7897} {"train_loss": -28.715219497680664, "global_step": 655509, "epoch": 7897} {"train_loss": -28.432586669921875, "global_step": 655510, "epoch": 7897} {"train_loss": -28.476886749267578, "global_step": 655511, "epoch": 7897} {"train_loss": -28.410741806030273, "global_step": 655512, "epoch": 7897} {"train_loss": -28.350210189819336, "global_step": 655513, "epoch": 7897} {"train_loss": -28.7495174407959, "global_step": 655514, "epoch": 7897} {"train_loss": -28.5458927154541, "global_step": 655515, "epoch": 7897} {"train_loss": -28.044279098510742, "global_step": 655516, "epoch": 7897} {"train_loss": -28.728363037109375, "global_step": 655517, "epoch": 7897} {"train_loss": -28.354703903198242, "global_step": 655518, "epoch": 7897} {"train_loss": -28.41187858581543, "global_step": 655519, "epoch": 7897} {"train_loss": -28.2825984954834, "global_step": 655520, "epoch": 7897} {"train_loss": -28.385574340820312, "global_step": 655521, "epoch": 7897} {"train_loss": -28.465925216674805, "global_step": 655522, "epoch": 7897} {"train_loss": -28.215185165405273, "global_step": 655523, "epoch": 7897} {"train_loss": -28.062387466430664, "global_step": 655524, "epoch": 7897} {"train_loss": -27.32148551940918, "global_step": 655525, "epoch": 7897} {"train_loss": -26.502477645874023, "global_step": 655526, "epoch": 7897} {"train_loss": -27.98674964904785, "global_step": 655527, "epoch": 7897} {"train_loss": -28.470417022705078, "global_step": 655528, "epoch": 7897} {"train_loss": -27.756628036499023, "global_step": 655529, "epoch": 7897} {"train_loss": -28.60127067565918, "global_step": 655530, "epoch": 7897} {"train_loss": -28.215307235717773, "global_step": 655531, "epoch": 7897} {"train_loss": -28.135345458984375, "global_step": 655532, "epoch": 7897} {"train_loss": -27.95059006472668, "global_step": 655533, "epoch": 7897, "val_loss": 6697486.0} {"train_loss": -26.923959732055664, "global_step": 655534, "epoch": 7898} {"train_loss": -24.42717933654785, "global_step": 655535, "epoch": 7898} {"train_loss": -26.01800537109375, "global_step": 655536, "epoch": 7898} {"train_loss": -26.8300724029541, "global_step": 655537, "epoch": 7898} {"train_loss": -27.15571403503418, "global_step": 655538, "epoch": 7898} {"train_loss": -27.551488876342773, "global_step": 655539, "epoch": 7898} {"train_loss": -26.992206573486328, "global_step": 655540, "epoch": 7898} {"train_loss": -27.26936912536621, "global_step": 655541, "epoch": 7898} {"train_loss": -27.37052345275879, "global_step": 655542, "epoch": 7898} {"train_loss": -27.419843673706055, "global_step": 655543, "epoch": 7898} {"train_loss": -27.65899085998535, "global_step": 655544, "epoch": 7898} {"train_loss": -27.6581974029541, "global_step": 655545, "epoch": 7898} {"train_loss": -27.68311882019043, "global_step": 655546, "epoch": 7898} {"train_loss": -27.9242000579834, "global_step": 655547, "epoch": 7898} {"train_loss": -28.037378311157227, "global_step": 655548, "epoch": 7898} {"train_loss": -27.84393882751465, "global_step": 655549, "epoch": 7898} {"train_loss": -27.842899322509766, "global_step": 655550, "epoch": 7898} {"train_loss": -27.90144157409668, "global_step": 655551, "epoch": 7898} {"train_loss": -27.789899826049805, "global_step": 655552, "epoch": 7898} {"train_loss": -27.922361373901367, "global_step": 655553, "epoch": 7898} {"train_loss": -28.164600372314453, "global_step": 655554, "epoch": 7898} {"train_loss": -27.9738712310791, "global_step": 655555, "epoch": 7898} {"train_loss": -27.780029296875, "global_step": 655556, "epoch": 7898} {"train_loss": -28.210840225219727, "global_step": 655557, "epoch": 7898} {"train_loss": -28.44728660583496, "global_step": 655558, "epoch": 7898} {"train_loss": -27.812164306640625, "global_step": 655559, "epoch": 7898} {"train_loss": -28.2929630279541, "global_step": 655560, "epoch": 7898} {"train_loss": -28.235036849975586, "global_step": 655561, "epoch": 7898} {"train_loss": -28.159564971923828, "global_step": 655562, "epoch": 7898} {"train_loss": -27.98487663269043, "global_step": 655563, "epoch": 7898} {"train_loss": -28.163305282592773, "global_step": 655564, "epoch": 7898} {"train_loss": -28.066883087158203, "global_step": 655565, "epoch": 7898} {"train_loss": -28.486408233642578, "global_step": 655566, "epoch": 7898} {"train_loss": -28.077167510986328, "global_step": 655567, "epoch": 7898} {"train_loss": -28.31873893737793, "global_step": 655568, "epoch": 7898} {"train_loss": -28.3753604888916, "global_step": 655569, "epoch": 7898} {"train_loss": -28.14573097229004, "global_step": 655570, "epoch": 7898} {"train_loss": -28.435108184814453, "global_step": 655571, "epoch": 7898} {"train_loss": -28.39069175720215, "global_step": 655572, "epoch": 7898} {"train_loss": -28.618345260620117, "global_step": 655573, "epoch": 7898} {"train_loss": -28.250568389892578, "global_step": 655574, "epoch": 7898} {"train_loss": -28.398391723632812, "global_step": 655575, "epoch": 7898} {"train_loss": -28.454120635986328, "global_step": 655576, "epoch": 7898} {"train_loss": -28.679031372070312, "global_step": 655577, "epoch": 7898} {"train_loss": -28.306610107421875, "global_step": 655578, "epoch": 7898} {"train_loss": -28.442520141601562, "global_step": 655579, "epoch": 7898} {"train_loss": -28.346410751342773, "global_step": 655580, "epoch": 7898} {"train_loss": -28.392688751220703, "global_step": 655581, "epoch": 7898} {"train_loss": -28.3074951171875, "global_step": 655582, "epoch": 7898} {"train_loss": -28.487878799438477, "global_step": 655583, "epoch": 7898} {"train_loss": -28.8292293548584, "global_step": 655584, "epoch": 7898} {"train_loss": -28.002918243408203, "global_step": 655585, "epoch": 7898} {"train_loss": -28.222543716430664, "global_step": 655586, "epoch": 7898} {"train_loss": -28.597137451171875, "global_step": 655587, "epoch": 7898} {"train_loss": -28.12775993347168, "global_step": 655588, "epoch": 7898} {"train_loss": -28.454893112182617, "global_step": 655589, "epoch": 7898} {"train_loss": -28.503082275390625, "global_step": 655590, "epoch": 7898} {"train_loss": -28.383237838745117, "global_step": 655591, "epoch": 7898} {"train_loss": -28.53541374206543, "global_step": 655592, "epoch": 7898} {"train_loss": -28.821884155273438, "global_step": 655593, "epoch": 7898} {"train_loss": -28.375654220581055, "global_step": 655594, "epoch": 7898} {"train_loss": -28.348697662353516, "global_step": 655595, "epoch": 7898} {"train_loss": -28.18146324157715, "global_step": 655596, "epoch": 7898} {"train_loss": -28.184677124023438, "global_step": 655597, "epoch": 7898} {"train_loss": -28.56672477722168, "global_step": 655598, "epoch": 7898} {"train_loss": -28.471405029296875, "global_step": 655599, "epoch": 7898} {"train_loss": -28.4137020111084, "global_step": 655600, "epoch": 7898} {"train_loss": -28.57291030883789, "global_step": 655601, "epoch": 7898} {"train_loss": -28.173303604125977, "global_step": 655602, "epoch": 7898} {"train_loss": -27.952375411987305, "global_step": 655603, "epoch": 7898} {"train_loss": -28.25592613220215, "global_step": 655604, "epoch": 7898} {"train_loss": -28.483322143554688, "global_step": 655605, "epoch": 7898} {"train_loss": -28.564697265625, "global_step": 655606, "epoch": 7898} {"train_loss": -28.2265625, "global_step": 655607, "epoch": 7898} {"train_loss": -27.887435913085938, "global_step": 655608, "epoch": 7898} {"train_loss": -28.114704132080078, "global_step": 655609, "epoch": 7898} {"train_loss": -28.257675170898438, "global_step": 655610, "epoch": 7898} {"train_loss": -28.37379264831543, "global_step": 655611, "epoch": 7898} {"train_loss": -28.352094650268555, "global_step": 655612, "epoch": 7898} {"train_loss": -27.92899513244629, "global_step": 655613, "epoch": 7898} {"train_loss": -28.51300048828125, "global_step": 655614, "epoch": 7898} {"train_loss": -28.39826774597168, "global_step": 655615, "epoch": 7898} {"train_loss": -28.06013716272561, "global_step": 655616, "epoch": 7898, "val_loss": 6732882.0} {"train_loss": -26.028783798217773, "global_step": 655617, "epoch": 7899} {"train_loss": -26.94917106628418, "global_step": 655618, "epoch": 7899} {"train_loss": -27.134550094604492, "global_step": 655619, "epoch": 7899} {"train_loss": -27.528417587280273, "global_step": 655620, "epoch": 7899} {"train_loss": -27.91082763671875, "global_step": 655621, "epoch": 7899} {"train_loss": -27.532184600830078, "global_step": 655622, "epoch": 7899} {"train_loss": -27.6341609954834, "global_step": 655623, "epoch": 7899} {"train_loss": -27.871734619140625, "global_step": 655624, "epoch": 7899} {"train_loss": -27.526599884033203, "global_step": 655625, "epoch": 7899} {"train_loss": -27.516529083251953, "global_step": 655626, "epoch": 7899} {"train_loss": -27.385730743408203, "global_step": 655627, "epoch": 7899} {"train_loss": -27.788379669189453, "global_step": 655628, "epoch": 7899} {"train_loss": -27.54279136657715, "global_step": 655629, "epoch": 7899} {"train_loss": -27.8465518951416, "global_step": 655630, "epoch": 7899} {"train_loss": -28.010334014892578, "global_step": 655631, "epoch": 7899} {"train_loss": -28.17791748046875, "global_step": 655632, "epoch": 7899} {"train_loss": -27.59625816345215, "global_step": 655633, "epoch": 7899} {"train_loss": -27.644590377807617, "global_step": 655634, "epoch": 7899} {"train_loss": -28.05255699157715, "global_step": 655635, "epoch": 7899} {"train_loss": -27.826465606689453, "global_step": 655636, "epoch": 7899} {"train_loss": -28.137176513671875, "global_step": 655637, "epoch": 7899} {"train_loss": -27.948440551757812, "global_step": 655638, "epoch": 7899} {"train_loss": -28.166654586791992, "global_step": 655639, "epoch": 7899} {"train_loss": -28.04306983947754, "global_step": 655640, "epoch": 7899} {"train_loss": -28.254751205444336, "global_step": 655641, "epoch": 7899} {"train_loss": -28.39654541015625, "global_step": 655642, "epoch": 7899} {"train_loss": -28.219717025756836, "global_step": 655643, "epoch": 7899} {"train_loss": -28.1687068939209, "global_step": 655644, "epoch": 7899} {"train_loss": -28.2269344329834, "global_step": 655645, "epoch": 7899} {"train_loss": -28.249658584594727, "global_step": 655646, "epoch": 7899} {"train_loss": -28.400419235229492, "global_step": 655647, "epoch": 7899} {"train_loss": -28.403440475463867, "global_step": 655648, "epoch": 7899} {"train_loss": -28.35184669494629, "global_step": 655649, "epoch": 7899} {"train_loss": -28.167932510375977, "global_step": 655650, "epoch": 7899} {"train_loss": -28.347803115844727, "global_step": 655651, "epoch": 7899} {"train_loss": -28.321908950805664, "global_step": 655652, "epoch": 7899} {"train_loss": -28.167028427124023, "global_step": 655653, "epoch": 7899} {"train_loss": -28.410053253173828, "global_step": 655654, "epoch": 7899} {"train_loss": -28.286413192749023, "global_step": 655655, "epoch": 7899} {"train_loss": -28.23648452758789, "global_step": 655656, "epoch": 7899} {"train_loss": -28.112524032592773, "global_step": 655657, "epoch": 7899} {"train_loss": -28.81049919128418, "global_step": 655658, "epoch": 7899} {"train_loss": -28.437896728515625, "global_step": 655659, "epoch": 7899} {"train_loss": -28.683395385742188, "global_step": 655660, "epoch": 7899} {"train_loss": -28.34742546081543, "global_step": 655661, "epoch": 7899} {"train_loss": -28.648618698120117, "global_step": 655662, "epoch": 7899} {"train_loss": -28.36635398864746, "global_step": 655663, "epoch": 7899} {"train_loss": -28.27271842956543, "global_step": 655664, "epoch": 7899} {"train_loss": -28.735639572143555, "global_step": 655665, "epoch": 7899} {"train_loss": -28.56830406188965, "global_step": 655666, "epoch": 7899} {"train_loss": -28.500394821166992, "global_step": 655667, "epoch": 7899} {"train_loss": -28.605382919311523, "global_step": 655668, "epoch": 7899} {"train_loss": -28.8818416595459, "global_step": 655669, "epoch": 7899} {"train_loss": -28.559284210205078, "global_step": 655670, "epoch": 7899} {"train_loss": -28.5908260345459, "global_step": 655671, "epoch": 7899} {"train_loss": -28.873565673828125, "global_step": 655672, "epoch": 7899} {"train_loss": -28.769367218017578, "global_step": 655673, "epoch": 7899} {"train_loss": -28.380970001220703, "global_step": 655674, "epoch": 7899} {"train_loss": -28.09079933166504, "global_step": 655675, "epoch": 7899} {"train_loss": -28.181787490844727, "global_step": 655676, "epoch": 7899} {"train_loss": -28.4517765045166, "global_step": 655677, "epoch": 7899} {"train_loss": -28.453277587890625, "global_step": 655678, "epoch": 7899} {"train_loss": -28.266698837280273, "global_step": 655679, "epoch": 7899} {"train_loss": -28.460142135620117, "global_step": 655680, "epoch": 7899} {"train_loss": -28.529712677001953, "global_step": 655681, "epoch": 7899} {"train_loss": -28.392248153686523, "global_step": 655682, "epoch": 7899} {"train_loss": -28.583703994750977, "global_step": 655683, "epoch": 7899} {"train_loss": -28.4739933013916, "global_step": 655684, "epoch": 7899} {"train_loss": -28.092187881469727, "global_step": 655685, "epoch": 7899} {"train_loss": -28.40130615234375, "global_step": 655686, "epoch": 7899} {"train_loss": -28.463010787963867, "global_step": 655687, "epoch": 7899} {"train_loss": -27.937971115112305, "global_step": 655688, "epoch": 7899} {"train_loss": -28.52980613708496, "global_step": 655689, "epoch": 7899} {"train_loss": -28.082632064819336, "global_step": 655690, "epoch": 7899} {"train_loss": -28.239288330078125, "global_step": 655691, "epoch": 7899} {"train_loss": -28.46933937072754, "global_step": 655692, "epoch": 7899} {"train_loss": -28.53934097290039, "global_step": 655693, "epoch": 7899} {"train_loss": -28.48134422302246, "global_step": 655694, "epoch": 7899} {"train_loss": -28.397815704345703, "global_step": 655695, "epoch": 7899} {"train_loss": -28.555639266967773, "global_step": 655696, "epoch": 7899} {"train_loss": -28.0147647857666, "global_step": 655697, "epoch": 7899} {"train_loss": -27.85308837890625, "global_step": 655698, "epoch": 7899} {"train_loss": -28.160235347518, "global_step": 655699, "epoch": 7899, "val_loss": 6845456.5} {"train_loss": -26.789087295532227, "global_step": 655700, "epoch": 7900} {"train_loss": -25.966903686523438, "global_step": 655701, "epoch": 7900} {"train_loss": -25.644861221313477, "global_step": 655702, "epoch": 7900} {"train_loss": -27.217609405517578, "global_step": 655703, "epoch": 7900} {"train_loss": -27.32280921936035, "global_step": 655704, "epoch": 7900} {"train_loss": -27.615888595581055, "global_step": 655705, "epoch": 7900} {"train_loss": -27.15118980407715, "global_step": 655706, "epoch": 7900} {"train_loss": -27.43706703186035, "global_step": 655707, "epoch": 7900} {"train_loss": -27.975238800048828, "global_step": 655708, "epoch": 7900} {"train_loss": -27.312673568725586, "global_step": 655709, "epoch": 7900} {"train_loss": -27.629093170166016, "global_step": 655710, "epoch": 7900} {"train_loss": -27.25506019592285, "global_step": 655711, "epoch": 7900} {"train_loss": -27.3563232421875, "global_step": 655712, "epoch": 7900} {"train_loss": -27.838376998901367, "global_step": 655713, "epoch": 7900} {"train_loss": -27.81874656677246, "global_step": 655714, "epoch": 7900} {"train_loss": -27.63327407836914, "global_step": 655715, "epoch": 7900} {"train_loss": -27.87537956237793, "global_step": 655716, "epoch": 7900} {"train_loss": -27.735828399658203, "global_step": 655717, "epoch": 7900} {"train_loss": -27.51889991760254, "global_step": 655718, "epoch": 7900} {"train_loss": -27.877161026000977, "global_step": 655719, "epoch": 7900} {"train_loss": -28.136327743530273, "global_step": 655720, "epoch": 7900} {"train_loss": -28.12282371520996, "global_step": 655721, "epoch": 7900} {"train_loss": -27.969465255737305, "global_step": 655722, "epoch": 7900} {"train_loss": -28.1766357421875, "global_step": 655723, "epoch": 7900} {"train_loss": -27.871423721313477, "global_step": 655724, "epoch": 7900} {"train_loss": -28.27821159362793, "global_step": 655725, "epoch": 7900} {"train_loss": -27.88728141784668, "global_step": 655726, "epoch": 7900} {"train_loss": -28.320606231689453, "global_step": 655727, "epoch": 7900} {"train_loss": -28.51639175415039, "global_step": 655728, "epoch": 7900} {"train_loss": -28.330814361572266, "global_step": 655729, "epoch": 7900} {"train_loss": -28.349573135375977, "global_step": 655730, "epoch": 7900} {"train_loss": -28.071613311767578, "global_step": 655731, "epoch": 7900} {"train_loss": -28.308435440063477, "global_step": 655732, "epoch": 7900} {"train_loss": -28.0288143157959, "global_step": 655733, "epoch": 7900} {"train_loss": -28.349363327026367, "global_step": 655734, "epoch": 7900} {"train_loss": -28.321985244750977, "global_step": 655735, "epoch": 7900} {"train_loss": -28.41373634338379, "global_step": 655736, "epoch": 7900} {"train_loss": -28.375995635986328, "global_step": 655737, "epoch": 7900} {"train_loss": -28.40022850036621, "global_step": 655738, "epoch": 7900} {"train_loss": -28.421085357666016, "global_step": 655739, "epoch": 7900} {"train_loss": -28.3831729888916, "global_step": 655740, "epoch": 7900} {"train_loss": -28.54545021057129, "global_step": 655741, "epoch": 7900} {"train_loss": -28.597936630249023, "global_step": 655742, "epoch": 7900} {"train_loss": -28.343122482299805, "global_step": 655743, "epoch": 7900} {"train_loss": -28.289215087890625, "global_step": 655744, "epoch": 7900} {"train_loss": -28.218616485595703, "global_step": 655745, "epoch": 7900} {"train_loss": -28.769941329956055, "global_step": 655746, "epoch": 7900} {"train_loss": -28.945575714111328, "global_step": 655747, "epoch": 7900} {"train_loss": -28.218826293945312, "global_step": 655748, "epoch": 7900} {"train_loss": -28.6882266998291, "global_step": 655749, "epoch": 7900} {"train_loss": -28.568756103515625, "global_step": 655750, "epoch": 7900} {"train_loss": -28.446014404296875, "global_step": 655751, "epoch": 7900} {"train_loss": -28.34940528869629, "global_step": 655752, "epoch": 7900} {"train_loss": -28.473651885986328, "global_step": 655753, "epoch": 7900} {"train_loss": -28.89002799987793, "global_step": 655754, "epoch": 7900} {"train_loss": -28.660205841064453, "global_step": 655755, "epoch": 7900} {"train_loss": -28.62566566467285, "global_step": 655756, "epoch": 7900} {"train_loss": -28.25587272644043, "global_step": 655757, "epoch": 7900} {"train_loss": -28.443716049194336, "global_step": 655758, "epoch": 7900} {"train_loss": -28.581253051757812, "global_step": 655759, "epoch": 7900} {"train_loss": -28.245712280273438, "global_step": 655760, "epoch": 7900} {"train_loss": -28.206762313842773, "global_step": 655761, "epoch": 7900} {"train_loss": -28.593515396118164, "global_step": 655762, "epoch": 7900} {"train_loss": -28.577051162719727, "global_step": 655763, "epoch": 7900} {"train_loss": -28.383106231689453, "global_step": 655764, "epoch": 7900} {"train_loss": -28.14051628112793, "global_step": 655765, "epoch": 7900} {"train_loss": -28.4200382232666, "global_step": 655766, "epoch": 7900} {"train_loss": -28.4471492767334, "global_step": 655767, "epoch": 7900} {"train_loss": -28.462936401367188, "global_step": 655768, "epoch": 7900} {"train_loss": -28.608030319213867, "global_step": 655769, "epoch": 7900} {"train_loss": -28.378034591674805, "global_step": 655770, "epoch": 7900} {"train_loss": -28.556507110595703, "global_step": 655771, "epoch": 7900} {"train_loss": -28.33473777770996, "global_step": 655772, "epoch": 7900} {"train_loss": -28.686588287353516, "global_step": 655773, "epoch": 7900} {"train_loss": -28.61941909790039, "global_step": 655774, "epoch": 7900} {"train_loss": -28.655792236328125, "global_step": 655775, "epoch": 7900} {"train_loss": -28.468734741210938, "global_step": 655776, "epoch": 7900} {"train_loss": -28.34583854675293, "global_step": 655777, "epoch": 7900} {"train_loss": -28.493627548217773, "global_step": 655778, "epoch": 7900} {"train_loss": -28.473957061767578, "global_step": 655779, "epoch": 7900} {"train_loss": -28.33867835998535, "global_step": 655780, "epoch": 7900} {"train_loss": -28.584827423095703, "global_step": 655781, "epoch": 7900} {"train_loss": -28.16233168452619, "global_step": 655782, "epoch": 7900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 0.0, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.8636363636363636, "val_loss": 6751003.5} {"train_loss": -28.247161865234375, "global_step": 655783, "epoch": 7901} {"train_loss": -28.23236656188965, "global_step": 655784, "epoch": 7901} {"train_loss": -28.057147979736328, "global_step": 655785, "epoch": 7901} {"train_loss": -27.956151962280273, "global_step": 655786, "epoch": 7901} {"train_loss": -27.47271156311035, "global_step": 655787, "epoch": 7901} {"train_loss": -28.046499252319336, "global_step": 655788, "epoch": 7901} {"train_loss": -27.80421257019043, "global_step": 655789, "epoch": 7901} {"train_loss": -27.7918758392334, "global_step": 655790, "epoch": 7901} {"train_loss": -28.381433486938477, "global_step": 655791, "epoch": 7901} {"train_loss": -27.684179306030273, "global_step": 655792, "epoch": 7901} {"train_loss": -28.1220703125, "global_step": 655793, "epoch": 7901} {"train_loss": -28.12030601501465, "global_step": 655794, "epoch": 7901} {"train_loss": -28.092283248901367, "global_step": 655795, "epoch": 7901} {"train_loss": -28.281768798828125, "global_step": 655796, "epoch": 7901} {"train_loss": -28.28080177307129, "global_step": 655797, "epoch": 7901} {"train_loss": -28.171777725219727, "global_step": 655798, "epoch": 7901} {"train_loss": -28.192249298095703, "global_step": 655799, "epoch": 7901} {"train_loss": -28.27899742126465, "global_step": 655800, "epoch": 7901} {"train_loss": -28.3333797454834, "global_step": 655801, "epoch": 7901} {"train_loss": -27.9027042388916, "global_step": 655802, "epoch": 7901} {"train_loss": -28.33335304260254, "global_step": 655803, "epoch": 7901} {"train_loss": -28.254261016845703, "global_step": 655804, "epoch": 7901} {"train_loss": -28.4379825592041, "global_step": 655805, "epoch": 7901} {"train_loss": -28.41437339782715, "global_step": 655806, "epoch": 7901} {"train_loss": -28.360532760620117, "global_step": 655807, "epoch": 7901} {"train_loss": -28.215314865112305, "global_step": 655808, "epoch": 7901} {"train_loss": -28.419599533081055, "global_step": 655809, "epoch": 7901} {"train_loss": -28.213672637939453, "global_step": 655810, "epoch": 7901} {"train_loss": -27.876815795898438, "global_step": 655811, "epoch": 7901} {"train_loss": -28.417455673217773, "global_step": 655812, "epoch": 7901} {"train_loss": -27.90336036682129, "global_step": 655813, "epoch": 7901} {"train_loss": -28.812091827392578, "global_step": 655814, "epoch": 7901} {"train_loss": -28.59773063659668, "global_step": 655815, "epoch": 7901} {"train_loss": -27.97828483581543, "global_step": 655816, "epoch": 7901} {"train_loss": -27.87752342224121, "global_step": 655817, "epoch": 7901} {"train_loss": -28.245162963867188, "global_step": 655818, "epoch": 7901} {"train_loss": -28.20635986328125, "global_step": 655819, "epoch": 7901} {"train_loss": -27.836271286010742, "global_step": 655820, "epoch": 7901} {"train_loss": -28.257898330688477, "global_step": 655821, "epoch": 7901} {"train_loss": -27.547061920166016, "global_step": 655822, "epoch": 7901} {"train_loss": -28.01092529296875, "global_step": 655823, "epoch": 7901} {"train_loss": -28.4934024810791, "global_step": 655824, "epoch": 7901} {"train_loss": -28.085132598876953, "global_step": 655825, "epoch": 7901} {"train_loss": -27.7264461517334, "global_step": 655826, "epoch": 7901} {"train_loss": -27.871143341064453, "global_step": 655827, "epoch": 7901} {"train_loss": -28.063901901245117, "global_step": 655828, "epoch": 7901} {"train_loss": -27.85796546936035, "global_step": 655829, "epoch": 7901} {"train_loss": -27.987030029296875, "global_step": 655830, "epoch": 7901} {"train_loss": -27.585254669189453, "global_step": 655831, "epoch": 7901} {"train_loss": -28.102689743041992, "global_step": 655832, "epoch": 7901} {"train_loss": -28.02931022644043, "global_step": 655833, "epoch": 7901} {"train_loss": -28.011564254760742, "global_step": 655834, "epoch": 7901} {"train_loss": -28.2850399017334, "global_step": 655835, "epoch": 7901} {"train_loss": -27.8501033782959, "global_step": 655836, "epoch": 7901} {"train_loss": -28.188190460205078, "global_step": 655837, "epoch": 7901} {"train_loss": -28.046558380126953, "global_step": 655838, "epoch": 7901} {"train_loss": -28.29670524597168, "global_step": 655839, "epoch": 7901} {"train_loss": -28.112646102905273, "global_step": 655840, "epoch": 7901} {"train_loss": -28.59389305114746, "global_step": 655841, "epoch": 7901} {"train_loss": -28.25847816467285, "global_step": 655842, "epoch": 7901} {"train_loss": -28.241287231445312, "global_step": 655843, "epoch": 7901} {"train_loss": -28.340604782104492, "global_step": 655844, "epoch": 7901} {"train_loss": -28.015888214111328, "global_step": 655845, "epoch": 7901} {"train_loss": -28.37568473815918, "global_step": 655846, "epoch": 7901} {"train_loss": -28.225027084350586, "global_step": 655847, "epoch": 7901} {"train_loss": -28.541799545288086, "global_step": 655848, "epoch": 7901} {"train_loss": -28.840139389038086, "global_step": 655849, "epoch": 7901} {"train_loss": -28.189050674438477, "global_step": 655850, "epoch": 7901} {"train_loss": -28.558734893798828, "global_step": 655851, "epoch": 7901} {"train_loss": -28.717004776000977, "global_step": 655852, "epoch": 7901} {"train_loss": -28.282312393188477, "global_step": 655853, "epoch": 7901} {"train_loss": -28.249860763549805, "global_step": 655854, "epoch": 7901} {"train_loss": -28.4847354888916, "global_step": 655855, "epoch": 7901} {"train_loss": -28.36646842956543, "global_step": 655856, "epoch": 7901} {"train_loss": -28.713590621948242, "global_step": 655857, "epoch": 7901} {"train_loss": -28.433032989501953, "global_step": 655858, "epoch": 7901} {"train_loss": -28.563465118408203, "global_step": 655859, "epoch": 7901} {"train_loss": -28.509174346923828, "global_step": 655860, "epoch": 7901} {"train_loss": -28.55122184753418, "global_step": 655861, "epoch": 7901} {"train_loss": -28.48282241821289, "global_step": 655862, "epoch": 7901} {"train_loss": -28.527069091796875, "global_step": 655863, "epoch": 7901} {"train_loss": -28.574756622314453, "global_step": 655864, "epoch": 7901} {"train_loss": -28.2048970188003, "global_step": 655865, "epoch": 7901, "val_loss": 6619696.0} {"train_loss": -27.9541015625, "global_step": 655866, "epoch": 7902} {"train_loss": -28.0316104888916, "global_step": 655867, "epoch": 7902} {"train_loss": -27.719873428344727, "global_step": 655868, "epoch": 7902} {"train_loss": -27.88640785217285, "global_step": 655869, "epoch": 7902} {"train_loss": -27.560224533081055, "global_step": 655870, "epoch": 7902} {"train_loss": -27.813522338867188, "global_step": 655871, "epoch": 7902} {"train_loss": -27.59541130065918, "global_step": 655872, "epoch": 7902} {"train_loss": -28.158634185791016, "global_step": 655873, "epoch": 7902} {"train_loss": -27.700225830078125, "global_step": 655874, "epoch": 7902} {"train_loss": -28.18592643737793, "global_step": 655875, "epoch": 7902} {"train_loss": -28.35797691345215, "global_step": 655876, "epoch": 7902} {"train_loss": -27.83159828186035, "global_step": 655877, "epoch": 7902} {"train_loss": -28.57926368713379, "global_step": 655878, "epoch": 7902} {"train_loss": -28.078369140625, "global_step": 655879, "epoch": 7902} {"train_loss": -27.986953735351562, "global_step": 655880, "epoch": 7902} {"train_loss": -27.83516502380371, "global_step": 655881, "epoch": 7902} {"train_loss": -28.065628051757812, "global_step": 655882, "epoch": 7902} {"train_loss": -28.364734649658203, "global_step": 655883, "epoch": 7902} {"train_loss": -28.292835235595703, "global_step": 655884, "epoch": 7902} {"train_loss": -27.809946060180664, "global_step": 655885, "epoch": 7902} {"train_loss": -28.15729331970215, "global_step": 655886, "epoch": 7902} {"train_loss": -28.56556510925293, "global_step": 655887, "epoch": 7902} {"train_loss": -28.09417724609375, "global_step": 655888, "epoch": 7902} {"train_loss": -28.309986114501953, "global_step": 655889, "epoch": 7902} {"train_loss": -28.3670597076416, "global_step": 655890, "epoch": 7902} {"train_loss": -28.23129653930664, "global_step": 655891, "epoch": 7902} {"train_loss": -28.5738468170166, "global_step": 655892, "epoch": 7902} {"train_loss": -28.2406005859375, "global_step": 655893, "epoch": 7902} {"train_loss": -28.441390991210938, "global_step": 655894, "epoch": 7902} {"train_loss": -28.40217399597168, "global_step": 655895, "epoch": 7902} {"train_loss": -28.453622817993164, "global_step": 655896, "epoch": 7902} {"train_loss": -28.14634132385254, "global_step": 655897, "epoch": 7902} {"train_loss": -28.972471237182617, "global_step": 655898, "epoch": 7902} {"train_loss": -28.541061401367188, "global_step": 655899, "epoch": 7902} {"train_loss": -28.36347007751465, "global_step": 655900, "epoch": 7902} {"train_loss": -28.162038803100586, "global_step": 655901, "epoch": 7902} {"train_loss": -27.791976928710938, "global_step": 655902, "epoch": 7902} {"train_loss": -28.159320831298828, "global_step": 655903, "epoch": 7902} {"train_loss": -27.936399459838867, "global_step": 655904, "epoch": 7902} {"train_loss": -28.403736114501953, "global_step": 655905, "epoch": 7902} {"train_loss": -28.789770126342773, "global_step": 655906, "epoch": 7902} {"train_loss": -28.357711791992188, "global_step": 655907, "epoch": 7902} {"train_loss": -28.26959228515625, "global_step": 655908, "epoch": 7902} {"train_loss": -28.320499420166016, "global_step": 655909, "epoch": 7902} {"train_loss": -28.326635360717773, "global_step": 655910, "epoch": 7902} {"train_loss": -28.29133415222168, "global_step": 655911, "epoch": 7902} {"train_loss": -28.19705581665039, "global_step": 655912, "epoch": 7902} {"train_loss": -28.53724479675293, "global_step": 655913, "epoch": 7902} {"train_loss": -28.430057525634766, "global_step": 655914, "epoch": 7902} {"train_loss": -28.0147647857666, "global_step": 655915, "epoch": 7902} {"train_loss": -28.603382110595703, "global_step": 655916, "epoch": 7902} {"train_loss": -28.55963134765625, "global_step": 655917, "epoch": 7902} {"train_loss": -28.466108322143555, "global_step": 655918, "epoch": 7902} {"train_loss": -28.417566299438477, "global_step": 655919, "epoch": 7902} {"train_loss": -28.204809188842773, "global_step": 655920, "epoch": 7902} {"train_loss": -28.37775230407715, "global_step": 655921, "epoch": 7902} {"train_loss": -28.362096786499023, "global_step": 655922, "epoch": 7902} {"train_loss": -28.464834213256836, "global_step": 655923, "epoch": 7902} {"train_loss": -28.553348541259766, "global_step": 655924, "epoch": 7902} {"train_loss": -28.1404972076416, "global_step": 655925, "epoch": 7902} {"train_loss": -28.641096115112305, "global_step": 655926, "epoch": 7902} {"train_loss": -28.36997413635254, "global_step": 655927, "epoch": 7902} {"train_loss": -28.393136978149414, "global_step": 655928, "epoch": 7902} {"train_loss": -28.359888076782227, "global_step": 655929, "epoch": 7902} {"train_loss": -28.45452880859375, "global_step": 655930, "epoch": 7902} {"train_loss": -28.2584285736084, "global_step": 655931, "epoch": 7902} {"train_loss": -28.842615127563477, "global_step": 655932, "epoch": 7902} {"train_loss": -28.737852096557617, "global_step": 655933, "epoch": 7902} {"train_loss": -28.61793327331543, "global_step": 655934, "epoch": 7902} {"train_loss": -28.323413848876953, "global_step": 655935, "epoch": 7902} {"train_loss": -28.726293563842773, "global_step": 655936, "epoch": 7902} {"train_loss": -28.658472061157227, "global_step": 655937, "epoch": 7902} {"train_loss": -28.531713485717773, "global_step": 655938, "epoch": 7902} {"train_loss": -28.334674835205078, "global_step": 655939, "epoch": 7902} {"train_loss": -28.38358497619629, "global_step": 655940, "epoch": 7902} {"train_loss": -28.23333740234375, "global_step": 655941, "epoch": 7902} {"train_loss": -28.532575607299805, "global_step": 655942, "epoch": 7902} {"train_loss": -28.670812606811523, "global_step": 655943, "epoch": 7902} {"train_loss": -28.137231826782227, "global_step": 655944, "epoch": 7902} {"train_loss": -28.514318466186523, "global_step": 655945, "epoch": 7902} {"train_loss": -28.708728790283203, "global_step": 655946, "epoch": 7902} {"train_loss": -28.8021183013916, "global_step": 655947, "epoch": 7902} {"train_loss": -28.29516985330237, "global_step": 655948, "epoch": 7902, "val_loss": 6677947.0} {"train_loss": -27.95033073425293, "global_step": 655949, "epoch": 7903} {"train_loss": -27.792936325073242, "global_step": 655950, "epoch": 7903} {"train_loss": -27.301319122314453, "global_step": 655951, "epoch": 7903} {"train_loss": -26.53521156311035, "global_step": 655952, "epoch": 7903} {"train_loss": -25.35268211364746, "global_step": 655953, "epoch": 7903} {"train_loss": -26.204715728759766, "global_step": 655954, "epoch": 7903} {"train_loss": -27.9787654876709, "global_step": 655955, "epoch": 7903} {"train_loss": -26.57000160217285, "global_step": 655956, "epoch": 7903} {"train_loss": -27.4470272064209, "global_step": 655957, "epoch": 7903} {"train_loss": -27.19677734375, "global_step": 655958, "epoch": 7903} {"train_loss": -27.468915939331055, "global_step": 655959, "epoch": 7903} {"train_loss": -27.372915267944336, "global_step": 655960, "epoch": 7903} {"train_loss": -27.2632999420166, "global_step": 655961, "epoch": 7903} {"train_loss": -27.896677017211914, "global_step": 655962, "epoch": 7903} {"train_loss": -27.275495529174805, "global_step": 655963, "epoch": 7903} {"train_loss": -27.604938507080078, "global_step": 655964, "epoch": 7903} {"train_loss": -27.92951011657715, "global_step": 655965, "epoch": 7903} {"train_loss": -27.47796630859375, "global_step": 655966, "epoch": 7903} {"train_loss": -27.871564865112305, "global_step": 655967, "epoch": 7903} {"train_loss": -27.942224502563477, "global_step": 655968, "epoch": 7903} {"train_loss": -27.70380210876465, "global_step": 655969, "epoch": 7903} {"train_loss": -27.881717681884766, "global_step": 655970, "epoch": 7903} {"train_loss": -27.708173751831055, "global_step": 655971, "epoch": 7903} {"train_loss": -28.249195098876953, "global_step": 655972, "epoch": 7903} {"train_loss": -27.844152450561523, "global_step": 655973, "epoch": 7903} {"train_loss": -28.167356491088867, "global_step": 655974, "epoch": 7903} {"train_loss": -27.550113677978516, "global_step": 655975, "epoch": 7903} {"train_loss": -27.87824821472168, "global_step": 655976, "epoch": 7903} {"train_loss": -27.898557662963867, "global_step": 655977, "epoch": 7903} {"train_loss": -27.7471923828125, "global_step": 655978, "epoch": 7903} {"train_loss": -27.633270263671875, "global_step": 655979, "epoch": 7903} {"train_loss": -27.781583786010742, "global_step": 655980, "epoch": 7903} {"train_loss": -27.83837890625, "global_step": 655981, "epoch": 7903} {"train_loss": -27.710752487182617, "global_step": 655982, "epoch": 7903} {"train_loss": -27.927560806274414, "global_step": 655983, "epoch": 7903} {"train_loss": -28.100162506103516, "global_step": 655984, "epoch": 7903} {"train_loss": -27.894556045532227, "global_step": 655985, "epoch": 7903} {"train_loss": -27.889562606811523, "global_step": 655986, "epoch": 7903} {"train_loss": -28.190067291259766, "global_step": 655987, "epoch": 7903} {"train_loss": -28.210214614868164, "global_step": 655988, "epoch": 7903} {"train_loss": -28.21823501586914, "global_step": 655989, "epoch": 7903} {"train_loss": -28.18958854675293, "global_step": 655990, "epoch": 7903} {"train_loss": -28.626361846923828, "global_step": 655991, "epoch": 7903} {"train_loss": -28.29486656188965, "global_step": 655992, "epoch": 7903} {"train_loss": -28.5093936920166, "global_step": 655993, "epoch": 7903} {"train_loss": -28.479694366455078, "global_step": 655994, "epoch": 7903} {"train_loss": -28.3096981048584, "global_step": 655995, "epoch": 7903} {"train_loss": -28.29007339477539, "global_step": 655996, "epoch": 7903} {"train_loss": -28.135440826416016, "global_step": 655997, "epoch": 7903} {"train_loss": -28.393268585205078, "global_step": 655998, "epoch": 7903} {"train_loss": -28.504322052001953, "global_step": 655999, "epoch": 7903} {"train_loss": -28.531652450561523, "global_step": 656000, "epoch": 7903} {"train_loss": -28.394704818725586, "global_step": 656001, "epoch": 7903} {"train_loss": -28.081884384155273, "global_step": 656002, "epoch": 7903} {"train_loss": -27.570032119750977, "global_step": 656003, "epoch": 7903} {"train_loss": -26.786087036132812, "global_step": 656004, "epoch": 7903} {"train_loss": -27.716724395751953, "global_step": 656005, "epoch": 7903} {"train_loss": -28.670385360717773, "global_step": 656006, "epoch": 7903} {"train_loss": -27.918745040893555, "global_step": 656007, "epoch": 7903} {"train_loss": -28.026412963867188, "global_step": 656008, "epoch": 7903} {"train_loss": -28.21467399597168, "global_step": 656009, "epoch": 7903} {"train_loss": -28.3897705078125, "global_step": 656010, "epoch": 7903} {"train_loss": -28.135196685791016, "global_step": 656011, "epoch": 7903} {"train_loss": -28.25331687927246, "global_step": 656012, "epoch": 7903} {"train_loss": -28.104108810424805, "global_step": 656013, "epoch": 7903} {"train_loss": -28.016860961914062, "global_step": 656014, "epoch": 7903} {"train_loss": -28.323022842407227, "global_step": 656015, "epoch": 7903} {"train_loss": -28.195178985595703, "global_step": 656016, "epoch": 7903} {"train_loss": -28.446439743041992, "global_step": 656017, "epoch": 7903} {"train_loss": -28.171100616455078, "global_step": 656018, "epoch": 7903} {"train_loss": -28.393695831298828, "global_step": 656019, "epoch": 7903} {"train_loss": -28.28278160095215, "global_step": 656020, "epoch": 7903} {"train_loss": -28.585224151611328, "global_step": 656021, "epoch": 7903} {"train_loss": -28.66950035095215, "global_step": 656022, "epoch": 7903} {"train_loss": -28.55109977722168, "global_step": 656023, "epoch": 7903} {"train_loss": -28.621442794799805, "global_step": 656024, "epoch": 7903} {"train_loss": -28.48793601989746, "global_step": 656025, "epoch": 7903} {"train_loss": -28.87122917175293, "global_step": 656026, "epoch": 7903} {"train_loss": -28.638031005859375, "global_step": 656027, "epoch": 7903} {"train_loss": -28.085981369018555, "global_step": 656028, "epoch": 7903} {"train_loss": -28.15350914001465, "global_step": 656029, "epoch": 7903} {"train_loss": -27.810022354125977, "global_step": 656030, "epoch": 7903} {"train_loss": -27.935531478330315, "global_step": 656031, "epoch": 7903, "val_loss": 6689983.5} {"train_loss": -27.481149673461914, "global_step": 656032, "epoch": 7904} {"train_loss": -27.636905670166016, "global_step": 656033, "epoch": 7904} {"train_loss": -25.523958206176758, "global_step": 656034, "epoch": 7904} {"train_loss": -27.074848175048828, "global_step": 656035, "epoch": 7904} {"train_loss": -26.88189697265625, "global_step": 656036, "epoch": 7904} {"train_loss": -26.306493759155273, "global_step": 656037, "epoch": 7904} {"train_loss": -27.686368942260742, "global_step": 656038, "epoch": 7904} {"train_loss": -26.39556312561035, "global_step": 656039, "epoch": 7904} {"train_loss": -27.18902587890625, "global_step": 656040, "epoch": 7904} {"train_loss": -27.797443389892578, "global_step": 656041, "epoch": 7904} {"train_loss": -27.145612716674805, "global_step": 656042, "epoch": 7904} {"train_loss": -27.378631591796875, "global_step": 656043, "epoch": 7904} {"train_loss": -27.504806518554688, "global_step": 656044, "epoch": 7904} {"train_loss": -28.039173126220703, "global_step": 656045, "epoch": 7904} {"train_loss": -27.50892448425293, "global_step": 656046, "epoch": 7904} {"train_loss": -27.929712295532227, "global_step": 656047, "epoch": 7904} {"train_loss": -27.41620445251465, "global_step": 656048, "epoch": 7904} {"train_loss": -27.85843849182129, "global_step": 656049, "epoch": 7904} {"train_loss": -27.907947540283203, "global_step": 656050, "epoch": 7904} {"train_loss": -27.760074615478516, "global_step": 656051, "epoch": 7904} {"train_loss": -27.841949462890625, "global_step": 656052, "epoch": 7904} {"train_loss": -27.569055557250977, "global_step": 656053, "epoch": 7904} {"train_loss": -28.202123641967773, "global_step": 656054, "epoch": 7904} {"train_loss": -28.17413902282715, "global_step": 656055, "epoch": 7904} {"train_loss": -27.88872718811035, "global_step": 656056, "epoch": 7904} {"train_loss": -28.015893936157227, "global_step": 656057, "epoch": 7904} {"train_loss": -28.13726234436035, "global_step": 656058, "epoch": 7904} {"train_loss": -27.75831413269043, "global_step": 656059, "epoch": 7904} {"train_loss": -28.069915771484375, "global_step": 656060, "epoch": 7904} {"train_loss": -27.97767448425293, "global_step": 656061, "epoch": 7904} {"train_loss": -28.264942169189453, "global_step": 656062, "epoch": 7904} {"train_loss": -28.01189613342285, "global_step": 656063, "epoch": 7904} {"train_loss": -28.024429321289062, "global_step": 656064, "epoch": 7904} {"train_loss": -28.239843368530273, "global_step": 656065, "epoch": 7904} {"train_loss": -28.410476684570312, "global_step": 656066, "epoch": 7904} {"train_loss": -28.125402450561523, "global_step": 656067, "epoch": 7904} {"train_loss": -28.255346298217773, "global_step": 656068, "epoch": 7904} {"train_loss": -28.190114974975586, "global_step": 656069, "epoch": 7904} {"train_loss": -28.09270668029785, "global_step": 656070, "epoch": 7904} {"train_loss": -28.176050186157227, "global_step": 656071, "epoch": 7904} {"train_loss": -28.332462310791016, "global_step": 656072, "epoch": 7904} {"train_loss": -28.69287109375, "global_step": 656073, "epoch": 7904} {"train_loss": -28.46735954284668, "global_step": 656074, "epoch": 7904} {"train_loss": -28.699981689453125, "global_step": 656075, "epoch": 7904} {"train_loss": -28.151464462280273, "global_step": 656076, "epoch": 7904} {"train_loss": -28.19545555114746, "global_step": 656077, "epoch": 7904} {"train_loss": -28.542768478393555, "global_step": 656078, "epoch": 7904} {"train_loss": -28.647174835205078, "global_step": 656079, "epoch": 7904} {"train_loss": -28.454669952392578, "global_step": 656080, "epoch": 7904} {"train_loss": -28.15056800842285, "global_step": 656081, "epoch": 7904} {"train_loss": -28.210901260375977, "global_step": 656082, "epoch": 7904} {"train_loss": -28.69489097595215, "global_step": 656083, "epoch": 7904} {"train_loss": -28.386890411376953, "global_step": 656084, "epoch": 7904} {"train_loss": -28.549917221069336, "global_step": 656085, "epoch": 7904} {"train_loss": -28.8836612701416, "global_step": 656086, "epoch": 7904} {"train_loss": -28.07504653930664, "global_step": 656087, "epoch": 7904} {"train_loss": -28.243783950805664, "global_step": 656088, "epoch": 7904} {"train_loss": -28.312915802001953, "global_step": 656089, "epoch": 7904} {"train_loss": -28.693954467773438, "global_step": 656090, "epoch": 7904} {"train_loss": -28.801034927368164, "global_step": 656091, "epoch": 7904} {"train_loss": -28.687665939331055, "global_step": 656092, "epoch": 7904} {"train_loss": -28.88028335571289, "global_step": 656093, "epoch": 7904} {"train_loss": -28.53692054748535, "global_step": 656094, "epoch": 7904} {"train_loss": -28.66152000427246, "global_step": 656095, "epoch": 7904} {"train_loss": -28.302139282226562, "global_step": 656096, "epoch": 7904} {"train_loss": -28.630462646484375, "global_step": 656097, "epoch": 7904} {"train_loss": -28.35812759399414, "global_step": 656098, "epoch": 7904} {"train_loss": -28.615997314453125, "global_step": 656099, "epoch": 7904} {"train_loss": -28.729297637939453, "global_step": 656100, "epoch": 7904} {"train_loss": -28.14377212524414, "global_step": 656101, "epoch": 7904} {"train_loss": -28.87769889831543, "global_step": 656102, "epoch": 7904} {"train_loss": -28.33245849609375, "global_step": 656103, "epoch": 7904} {"train_loss": -28.155715942382812, "global_step": 656104, "epoch": 7904} {"train_loss": -28.501861572265625, "global_step": 656105, "epoch": 7904} {"train_loss": -28.154809951782227, "global_step": 656106, "epoch": 7904} {"train_loss": -27.20612144470215, "global_step": 656107, "epoch": 7904} {"train_loss": -27.941059112548828, "global_step": 656108, "epoch": 7904} {"train_loss": -28.108922958374023, "global_step": 656109, "epoch": 7904} {"train_loss": -27.728195190429688, "global_step": 656110, "epoch": 7904} {"train_loss": -27.616947174072266, "global_step": 656111, "epoch": 7904} {"train_loss": -28.63166618347168, "global_step": 656112, "epoch": 7904} {"train_loss": -28.046741485595703, "global_step": 656113, "epoch": 7904} {"train_loss": -28.044565108885248, "global_step": 656114, "epoch": 7904, "val_loss": 6647298.0} {"train_loss": -26.544836044311523, "global_step": 656115, "epoch": 7905} {"train_loss": -25.463523864746094, "global_step": 656116, "epoch": 7905} {"train_loss": -27.507970809936523, "global_step": 656117, "epoch": 7905} {"train_loss": -26.33222770690918, "global_step": 656118, "epoch": 7905} {"train_loss": -25.94236183166504, "global_step": 656119, "epoch": 7905} {"train_loss": -26.860431671142578, "global_step": 656120, "epoch": 7905} {"train_loss": -26.305953979492188, "global_step": 656121, "epoch": 7905} {"train_loss": -27.123016357421875, "global_step": 656122, "epoch": 7905} {"train_loss": -26.740310668945312, "global_step": 656123, "epoch": 7905} {"train_loss": -26.002033233642578, "global_step": 656124, "epoch": 7905} {"train_loss": -26.89655876159668, "global_step": 656125, "epoch": 7905} {"train_loss": -27.087121963500977, "global_step": 656126, "epoch": 7905} {"train_loss": -26.655685424804688, "global_step": 656127, "epoch": 7905} {"train_loss": -27.39208984375, "global_step": 656128, "epoch": 7905} {"train_loss": -27.156835556030273, "global_step": 656129, "epoch": 7905} {"train_loss": -27.495166778564453, "global_step": 656130, "epoch": 7905} {"train_loss": -27.4190673828125, "global_step": 656131, "epoch": 7905} {"train_loss": -27.59942626953125, "global_step": 656132, "epoch": 7905} {"train_loss": -27.508838653564453, "global_step": 656133, "epoch": 7905} {"train_loss": -27.64650535583496, "global_step": 656134, "epoch": 7905} {"train_loss": -27.662168502807617, "global_step": 656135, "epoch": 7905} {"train_loss": -27.68538475036621, "global_step": 656136, "epoch": 7905} {"train_loss": -27.834369659423828, "global_step": 656137, "epoch": 7905} {"train_loss": -27.761281967163086, "global_step": 656138, "epoch": 7905} {"train_loss": -27.75921058654785, "global_step": 656139, "epoch": 7905} {"train_loss": -27.8765869140625, "global_step": 656140, "epoch": 7905} {"train_loss": -28.141637802124023, "global_step": 656141, "epoch": 7905} {"train_loss": -28.136615753173828, "global_step": 656142, "epoch": 7905} {"train_loss": -28.1037540435791, "global_step": 656143, "epoch": 7905} {"train_loss": -28.15804100036621, "global_step": 656144, "epoch": 7905} {"train_loss": -28.18206787109375, "global_step": 656145, "epoch": 7905} {"train_loss": -27.979846954345703, "global_step": 656146, "epoch": 7905} {"train_loss": -28.129638671875, "global_step": 656147, "epoch": 7905} {"train_loss": -28.166711807250977, "global_step": 656148, "epoch": 7905} {"train_loss": -28.172971725463867, "global_step": 656149, "epoch": 7905} {"train_loss": -28.281335830688477, "global_step": 656150, "epoch": 7905} {"train_loss": -28.195709228515625, "global_step": 656151, "epoch": 7905} {"train_loss": -28.410537719726562, "global_step": 656152, "epoch": 7905} {"train_loss": -28.319904327392578, "global_step": 656153, "epoch": 7905} {"train_loss": -28.15509033203125, "global_step": 656154, "epoch": 7905} {"train_loss": -28.013944625854492, "global_step": 656155, "epoch": 7905} {"train_loss": -28.511991500854492, "global_step": 656156, "epoch": 7905} {"train_loss": -28.178693771362305, "global_step": 656157, "epoch": 7905} {"train_loss": -28.326948165893555, "global_step": 656158, "epoch": 7905} {"train_loss": -28.265661239624023, "global_step": 656159, "epoch": 7905} {"train_loss": -27.96967124938965, "global_step": 656160, "epoch": 7905} {"train_loss": -28.369993209838867, "global_step": 656161, "epoch": 7905} {"train_loss": -28.318866729736328, "global_step": 656162, "epoch": 7905} {"train_loss": -28.26498794555664, "global_step": 656163, "epoch": 7905} {"train_loss": -28.645771026611328, "global_step": 656164, "epoch": 7905} {"train_loss": -28.467782974243164, "global_step": 656165, "epoch": 7905} {"train_loss": -27.99708366394043, "global_step": 656166, "epoch": 7905} {"train_loss": -28.564502716064453, "global_step": 656167, "epoch": 7905} {"train_loss": -28.19215202331543, "global_step": 656168, "epoch": 7905} {"train_loss": -28.53021812438965, "global_step": 656169, "epoch": 7905} {"train_loss": -28.7504940032959, "global_step": 656170, "epoch": 7905} {"train_loss": -28.17754554748535, "global_step": 656171, "epoch": 7905} {"train_loss": -28.618085861206055, "global_step": 656172, "epoch": 7905} {"train_loss": -28.393814086914062, "global_step": 656173, "epoch": 7905} {"train_loss": -28.708877563476562, "global_step": 656174, "epoch": 7905} {"train_loss": -28.837121963500977, "global_step": 656175, "epoch": 7905} {"train_loss": -28.5952091217041, "global_step": 656176, "epoch": 7905} {"train_loss": -28.60761070251465, "global_step": 656177, "epoch": 7905} {"train_loss": -28.41241455078125, "global_step": 656178, "epoch": 7905} {"train_loss": -28.108612060546875, "global_step": 656179, "epoch": 7905} {"train_loss": -28.901016235351562, "global_step": 656180, "epoch": 7905} {"train_loss": -28.578662872314453, "global_step": 656181, "epoch": 7905} {"train_loss": -28.350433349609375, "global_step": 656182, "epoch": 7905} {"train_loss": -28.704511642456055, "global_step": 656183, "epoch": 7905} {"train_loss": -28.617843627929688, "global_step": 656184, "epoch": 7905} {"train_loss": -28.6218204498291, "global_step": 656185, "epoch": 7905} {"train_loss": -28.412988662719727, "global_step": 656186, "epoch": 7905} {"train_loss": -28.374067306518555, "global_step": 656187, "epoch": 7905} {"train_loss": -28.364416122436523, "global_step": 656188, "epoch": 7905} {"train_loss": -28.1025390625, "global_step": 656189, "epoch": 7905} {"train_loss": -28.011276245117188, "global_step": 656190, "epoch": 7905} {"train_loss": -27.52020835876465, "global_step": 656191, "epoch": 7905} {"train_loss": -26.663705825805664, "global_step": 656192, "epoch": 7905} {"train_loss": -25.33139419555664, "global_step": 656193, "epoch": 7905} {"train_loss": -26.2218074798584, "global_step": 656194, "epoch": 7905} {"train_loss": -27.909793853759766, "global_step": 656195, "epoch": 7905} {"train_loss": -27.534963607788086, "global_step": 656196, "epoch": 7905} {"train_loss": -27.82997112963573, "global_step": 656197, "epoch": 7905, "val_loss": 6550036.5} {"train_loss": -26.868484497070312, "global_step": 656198, "epoch": 7906} {"train_loss": -25.484630584716797, "global_step": 656199, "epoch": 7906} {"train_loss": -26.285968780517578, "global_step": 656200, "epoch": 7906} {"train_loss": -26.809280395507812, "global_step": 656201, "epoch": 7906} {"train_loss": -26.21805191040039, "global_step": 656202, "epoch": 7906} {"train_loss": -26.396833419799805, "global_step": 656203, "epoch": 7906} {"train_loss": -26.363265991210938, "global_step": 656204, "epoch": 7906} {"train_loss": -26.360279083251953, "global_step": 656205, "epoch": 7906} {"train_loss": -26.694766998291016, "global_step": 656206, "epoch": 7906} {"train_loss": -26.75282096862793, "global_step": 656207, "epoch": 7906} {"train_loss": -26.964984893798828, "global_step": 656208, "epoch": 7906} {"train_loss": -27.282560348510742, "global_step": 656209, "epoch": 7906} {"train_loss": -27.325687408447266, "global_step": 656210, "epoch": 7906} {"train_loss": -27.283660888671875, "global_step": 656211, "epoch": 7906} {"train_loss": -27.139280319213867, "global_step": 656212, "epoch": 7906} {"train_loss": -27.325408935546875, "global_step": 656213, "epoch": 7906} {"train_loss": -27.48788833618164, "global_step": 656214, "epoch": 7906} {"train_loss": -27.603652954101562, "global_step": 656215, "epoch": 7906} {"train_loss": -27.183271408081055, "global_step": 656216, "epoch": 7906} {"train_loss": -27.292043685913086, "global_step": 656217, "epoch": 7906} {"train_loss": -27.425186157226562, "global_step": 656218, "epoch": 7906} {"train_loss": -27.645374298095703, "global_step": 656219, "epoch": 7906} {"train_loss": -27.04530143737793, "global_step": 656220, "epoch": 7906} {"train_loss": -27.759159088134766, "global_step": 656221, "epoch": 7906} {"train_loss": -27.762088775634766, "global_step": 656222, "epoch": 7906} {"train_loss": -27.67030906677246, "global_step": 656223, "epoch": 7906} {"train_loss": -28.024816513061523, "global_step": 656224, "epoch": 7906} {"train_loss": -27.8812198638916, "global_step": 656225, "epoch": 7906} {"train_loss": -27.526248931884766, "global_step": 656226, "epoch": 7906} {"train_loss": -27.446115493774414, "global_step": 656227, "epoch": 7906} {"train_loss": -28.146482467651367, "global_step": 656228, "epoch": 7906} {"train_loss": -28.000659942626953, "global_step": 656229, "epoch": 7906} {"train_loss": -28.33765983581543, "global_step": 656230, "epoch": 7906} {"train_loss": -27.773733139038086, "global_step": 656231, "epoch": 7906} {"train_loss": -28.024139404296875, "global_step": 656232, "epoch": 7906} {"train_loss": -28.038976669311523, "global_step": 656233, "epoch": 7906} {"train_loss": -28.033447265625, "global_step": 656234, "epoch": 7906} {"train_loss": -27.692197799682617, "global_step": 656235, "epoch": 7906} {"train_loss": -27.85745620727539, "global_step": 656236, "epoch": 7906} {"train_loss": -28.281457901000977, "global_step": 656237, "epoch": 7906} {"train_loss": -27.960859298706055, "global_step": 656238, "epoch": 7906} {"train_loss": -27.877197265625, "global_step": 656239, "epoch": 7906} {"train_loss": -27.99321937561035, "global_step": 656240, "epoch": 7906} {"train_loss": -28.595739364624023, "global_step": 656241, "epoch": 7906} {"train_loss": -28.21944236755371, "global_step": 656242, "epoch": 7906} {"train_loss": -28.20570182800293, "global_step": 656243, "epoch": 7906} {"train_loss": -28.431196212768555, "global_step": 656244, "epoch": 7906} {"train_loss": -28.50383949279785, "global_step": 656245, "epoch": 7906} {"train_loss": -28.622669219970703, "global_step": 656246, "epoch": 7906} {"train_loss": -28.299924850463867, "global_step": 656247, "epoch": 7906} {"train_loss": -28.49818992614746, "global_step": 656248, "epoch": 7906} {"train_loss": -28.208032608032227, "global_step": 656249, "epoch": 7906} {"train_loss": -28.376501083374023, "global_step": 656250, "epoch": 7906} {"train_loss": -28.202884674072266, "global_step": 656251, "epoch": 7906} {"train_loss": -28.804895401000977, "global_step": 656252, "epoch": 7906} {"train_loss": -28.266387939453125, "global_step": 656253, "epoch": 7906} {"train_loss": -28.168066024780273, "global_step": 656254, "epoch": 7906} {"train_loss": -28.486555099487305, "global_step": 656255, "epoch": 7906} {"train_loss": -28.611087799072266, "global_step": 656256, "epoch": 7906} {"train_loss": -28.509862899780273, "global_step": 656257, "epoch": 7906} {"train_loss": -27.863561630249023, "global_step": 656258, "epoch": 7906} {"train_loss": -28.64959716796875, "global_step": 656259, "epoch": 7906} {"train_loss": -28.371063232421875, "global_step": 656260, "epoch": 7906} {"train_loss": -28.671716690063477, "global_step": 656261, "epoch": 7906} {"train_loss": -28.674291610717773, "global_step": 656262, "epoch": 7906} {"train_loss": -28.316162109375, "global_step": 656263, "epoch": 7906} {"train_loss": -28.348230361938477, "global_step": 656264, "epoch": 7906} {"train_loss": -27.92671775817871, "global_step": 656265, "epoch": 7906} {"train_loss": -28.20987892150879, "global_step": 656266, "epoch": 7906} {"train_loss": -28.369897842407227, "global_step": 656267, "epoch": 7906} {"train_loss": -28.287353515625, "global_step": 656268, "epoch": 7906} {"train_loss": -28.266569137573242, "global_step": 656269, "epoch": 7906} {"train_loss": -28.858530044555664, "global_step": 656270, "epoch": 7906} {"train_loss": -28.6412410736084, "global_step": 656271, "epoch": 7906} {"train_loss": -28.639074325561523, "global_step": 656272, "epoch": 7906} {"train_loss": -28.395782470703125, "global_step": 656273, "epoch": 7906} {"train_loss": -28.5164794921875, "global_step": 656274, "epoch": 7906} {"train_loss": -28.7386531829834, "global_step": 656275, "epoch": 7906} {"train_loss": -28.640893936157227, "global_step": 656276, "epoch": 7906} {"train_loss": -28.13252830505371, "global_step": 656277, "epoch": 7906} {"train_loss": -28.26555824279785, "global_step": 656278, "epoch": 7906} {"train_loss": -28.60943603515625, "global_step": 656279, "epoch": 7906} {"train_loss": -27.87185533362699, "global_step": 656280, "epoch": 7906, "val_loss": 6625688.5} {"train_loss": -27.506927490234375, "global_step": 656281, "epoch": 7907} {"train_loss": -27.460474014282227, "global_step": 656282, "epoch": 7907} {"train_loss": -27.3563289642334, "global_step": 656283, "epoch": 7907} {"train_loss": -27.681293487548828, "global_step": 656284, "epoch": 7907} {"train_loss": -27.839197158813477, "global_step": 656285, "epoch": 7907} {"train_loss": -27.626440048217773, "global_step": 656286, "epoch": 7907} {"train_loss": -27.519689559936523, "global_step": 656287, "epoch": 7907} {"train_loss": -27.959735870361328, "global_step": 656288, "epoch": 7907} {"train_loss": -27.746042251586914, "global_step": 656289, "epoch": 7907} {"train_loss": -27.669879913330078, "global_step": 656290, "epoch": 7907} {"train_loss": -28.0505428314209, "global_step": 656291, "epoch": 7907} {"train_loss": -27.93951988220215, "global_step": 656292, "epoch": 7907} {"train_loss": -27.889318466186523, "global_step": 656293, "epoch": 7907} {"train_loss": -28.0052433013916, "global_step": 656294, "epoch": 7907} {"train_loss": -27.995391845703125, "global_step": 656295, "epoch": 7907} {"train_loss": -27.761783599853516, "global_step": 656296, "epoch": 7907} {"train_loss": -28.16230583190918, "global_step": 656297, "epoch": 7907} {"train_loss": -27.995929718017578, "global_step": 656298, "epoch": 7907} {"train_loss": -27.76702308654785, "global_step": 656299, "epoch": 7907} {"train_loss": -27.868148803710938, "global_step": 656300, "epoch": 7907} {"train_loss": -27.911603927612305, "global_step": 656301, "epoch": 7907} {"train_loss": -28.497516632080078, "global_step": 656302, "epoch": 7907} {"train_loss": -28.26300048828125, "global_step": 656303, "epoch": 7907} {"train_loss": -27.94065284729004, "global_step": 656304, "epoch": 7907} {"train_loss": -28.080724716186523, "global_step": 656305, "epoch": 7907} {"train_loss": -28.281415939331055, "global_step": 656306, "epoch": 7907} {"train_loss": -28.040821075439453, "global_step": 656307, "epoch": 7907} {"train_loss": -27.757375717163086, "global_step": 656308, "epoch": 7907} {"train_loss": -28.093585968017578, "global_step": 656309, "epoch": 7907} {"train_loss": -28.69691276550293, "global_step": 656310, "epoch": 7907} {"train_loss": -28.027698516845703, "global_step": 656311, "epoch": 7907} {"train_loss": -28.223203659057617, "global_step": 656312, "epoch": 7907} {"train_loss": -28.2551212310791, "global_step": 656313, "epoch": 7907} {"train_loss": -28.029565811157227, "global_step": 656314, "epoch": 7907} {"train_loss": -28.29212760925293, "global_step": 656315, "epoch": 7907} {"train_loss": -28.05655288696289, "global_step": 656316, "epoch": 7907} {"train_loss": -28.386137008666992, "global_step": 656317, "epoch": 7907} {"train_loss": -28.312042236328125, "global_step": 656318, "epoch": 7907} {"train_loss": -28.315052032470703, "global_step": 656319, "epoch": 7907} {"train_loss": -28.236963272094727, "global_step": 656320, "epoch": 7907} {"train_loss": -28.140050888061523, "global_step": 656321, "epoch": 7907} {"train_loss": -28.162784576416016, "global_step": 656322, "epoch": 7907} {"train_loss": -28.326337814331055, "global_step": 656323, "epoch": 7907} {"train_loss": -28.167631149291992, "global_step": 656324, "epoch": 7907} {"train_loss": -28.41935157775879, "global_step": 656325, "epoch": 7907} {"train_loss": -28.484418869018555, "global_step": 656326, "epoch": 7907} {"train_loss": -28.512176513671875, "global_step": 656327, "epoch": 7907} {"train_loss": -28.517709732055664, "global_step": 656328, "epoch": 7907} {"train_loss": -28.680089950561523, "global_step": 656329, "epoch": 7907} {"train_loss": -28.187490463256836, "global_step": 656330, "epoch": 7907} {"train_loss": -28.38164710998535, "global_step": 656331, "epoch": 7907} {"train_loss": -28.510080337524414, "global_step": 656332, "epoch": 7907} {"train_loss": -28.271198272705078, "global_step": 656333, "epoch": 7907} {"train_loss": -28.483667373657227, "global_step": 656334, "epoch": 7907} {"train_loss": -28.022836685180664, "global_step": 656335, "epoch": 7907} {"train_loss": -28.49612808227539, "global_step": 656336, "epoch": 7907} {"train_loss": -28.719343185424805, "global_step": 656337, "epoch": 7907} {"train_loss": -28.807525634765625, "global_step": 656338, "epoch": 7907} {"train_loss": -28.453739166259766, "global_step": 656339, "epoch": 7907} {"train_loss": -28.42427635192871, "global_step": 656340, "epoch": 7907} {"train_loss": -28.29707908630371, "global_step": 656341, "epoch": 7907} {"train_loss": -28.646276473999023, "global_step": 656342, "epoch": 7907} {"train_loss": -28.51505470275879, "global_step": 656343, "epoch": 7907} {"train_loss": -28.434268951416016, "global_step": 656344, "epoch": 7907} {"train_loss": -28.662397384643555, "global_step": 656345, "epoch": 7907} {"train_loss": -28.44354820251465, "global_step": 656346, "epoch": 7907} {"train_loss": -29.00823402404785, "global_step": 656347, "epoch": 7907} {"train_loss": -28.567174911499023, "global_step": 656348, "epoch": 7907} {"train_loss": -28.811176300048828, "global_step": 656349, "epoch": 7907} {"train_loss": -28.188129425048828, "global_step": 656350, "epoch": 7907} {"train_loss": -28.772693634033203, "global_step": 656351, "epoch": 7907} {"train_loss": -28.41037368774414, "global_step": 656352, "epoch": 7907} {"train_loss": -28.69588279724121, "global_step": 656353, "epoch": 7907} {"train_loss": -28.645795822143555, "global_step": 656354, "epoch": 7907} {"train_loss": -28.079504013061523, "global_step": 656355, "epoch": 7907} {"train_loss": -27.85406494140625, "global_step": 656356, "epoch": 7907} {"train_loss": -27.291921615600586, "global_step": 656357, "epoch": 7907} {"train_loss": -25.896869659423828, "global_step": 656358, "epoch": 7907} {"train_loss": -22.707433700561523, "global_step": 656359, "epoch": 7907} {"train_loss": -25.409433364868164, "global_step": 656360, "epoch": 7907} {"train_loss": -27.737577438354492, "global_step": 656361, "epoch": 7907} {"train_loss": -26.723295211791992, "global_step": 656362, "epoch": 7907} {"train_loss": -28.014772139399884, "global_step": 656363, "epoch": 7907, "val_loss": 6605966.0} {"train_loss": -25.621198654174805, "global_step": 656364, "epoch": 7908} {"train_loss": -25.721435546875, "global_step": 656365, "epoch": 7908} {"train_loss": -26.196582794189453, "global_step": 656366, "epoch": 7908} {"train_loss": -25.12070083618164, "global_step": 656367, "epoch": 7908} {"train_loss": -26.790481567382812, "global_step": 656368, "epoch": 7908} {"train_loss": -26.473867416381836, "global_step": 656369, "epoch": 7908} {"train_loss": -26.62566566467285, "global_step": 656370, "epoch": 7908} {"train_loss": -26.116607666015625, "global_step": 656371, "epoch": 7908} {"train_loss": -26.519763946533203, "global_step": 656372, "epoch": 7908} {"train_loss": -27.167617797851562, "global_step": 656373, "epoch": 7908} {"train_loss": -27.347070693969727, "global_step": 656374, "epoch": 7908} {"train_loss": -26.956012725830078, "global_step": 656375, "epoch": 7908} {"train_loss": -27.321136474609375, "global_step": 656376, "epoch": 7908} {"train_loss": -27.390588760375977, "global_step": 656377, "epoch": 7908} {"train_loss": -27.096933364868164, "global_step": 656378, "epoch": 7908} {"train_loss": -27.12625503540039, "global_step": 656379, "epoch": 7908} {"train_loss": -27.376874923706055, "global_step": 656380, "epoch": 7908} {"train_loss": -27.480066299438477, "global_step": 656381, "epoch": 7908} {"train_loss": -27.45660972595215, "global_step": 656382, "epoch": 7908} {"train_loss": -27.558874130249023, "global_step": 656383, "epoch": 7908} {"train_loss": -27.820636749267578, "global_step": 656384, "epoch": 7908} {"train_loss": -27.36724281311035, "global_step": 656385, "epoch": 7908} {"train_loss": -27.45159339904785, "global_step": 656386, "epoch": 7908} {"train_loss": -27.652374267578125, "global_step": 656387, "epoch": 7908} {"train_loss": -27.74686622619629, "global_step": 656388, "epoch": 7908} {"train_loss": -27.8072566986084, "global_step": 656389, "epoch": 7908} {"train_loss": -27.7962703704834, "global_step": 656390, "epoch": 7908} {"train_loss": -27.775989532470703, "global_step": 656391, "epoch": 7908} {"train_loss": -27.76279067993164, "global_step": 656392, "epoch": 7908} {"train_loss": -27.694807052612305, "global_step": 656393, "epoch": 7908} {"train_loss": -27.963333129882812, "global_step": 656394, "epoch": 7908} {"train_loss": -27.93141746520996, "global_step": 656395, "epoch": 7908} {"train_loss": -28.171844482421875, "global_step": 656396, "epoch": 7908} {"train_loss": -27.83075523376465, "global_step": 656397, "epoch": 7908} {"train_loss": -27.603717803955078, "global_step": 656398, "epoch": 7908} {"train_loss": -28.488306045532227, "global_step": 656399, "epoch": 7908} {"train_loss": -28.320886611938477, "global_step": 656400, "epoch": 7908} {"train_loss": -28.387500762939453, "global_step": 656401, "epoch": 7908} {"train_loss": -28.152074813842773, "global_step": 656402, "epoch": 7908} {"train_loss": -28.125219345092773, "global_step": 656403, "epoch": 7908} {"train_loss": -28.05628776550293, "global_step": 656404, "epoch": 7908} {"train_loss": -28.1768856048584, "global_step": 656405, "epoch": 7908} {"train_loss": -27.929197311401367, "global_step": 656406, "epoch": 7908} {"train_loss": -27.9887752532959, "global_step": 656407, "epoch": 7908} {"train_loss": -28.384750366210938, "global_step": 656408, "epoch": 7908} {"train_loss": -28.419281005859375, "global_step": 656409, "epoch": 7908} {"train_loss": -28.301252365112305, "global_step": 656410, "epoch": 7908} {"train_loss": -28.59226417541504, "global_step": 656411, "epoch": 7908} {"train_loss": -28.428739547729492, "global_step": 656412, "epoch": 7908} {"train_loss": -28.64504051208496, "global_step": 656413, "epoch": 7908} {"train_loss": -28.57450294494629, "global_step": 656414, "epoch": 7908} {"train_loss": -28.381210327148438, "global_step": 656415, "epoch": 7908} {"train_loss": -28.4265079498291, "global_step": 656416, "epoch": 7908} {"train_loss": -28.55853843688965, "global_step": 656417, "epoch": 7908} {"train_loss": -28.55771827697754, "global_step": 656418, "epoch": 7908} {"train_loss": -28.533309936523438, "global_step": 656419, "epoch": 7908} {"train_loss": -28.45420265197754, "global_step": 656420, "epoch": 7908} {"train_loss": -28.232563018798828, "global_step": 656421, "epoch": 7908} {"train_loss": -28.397851943969727, "global_step": 656422, "epoch": 7908} {"train_loss": -28.47021484375, "global_step": 656423, "epoch": 7908} {"train_loss": -28.54450035095215, "global_step": 656424, "epoch": 7908} {"train_loss": -28.410093307495117, "global_step": 656425, "epoch": 7908} {"train_loss": -28.549768447875977, "global_step": 656426, "epoch": 7908} {"train_loss": -28.353071212768555, "global_step": 656427, "epoch": 7908} {"train_loss": -28.46491050720215, "global_step": 656428, "epoch": 7908} {"train_loss": -28.877607345581055, "global_step": 656429, "epoch": 7908} {"train_loss": -28.0459041595459, "global_step": 656430, "epoch": 7908} {"train_loss": -28.236509323120117, "global_step": 656431, "epoch": 7908} {"train_loss": -28.450092315673828, "global_step": 656432, "epoch": 7908} {"train_loss": -28.05076026916504, "global_step": 656433, "epoch": 7908} {"train_loss": -28.27884292602539, "global_step": 656434, "epoch": 7908} {"train_loss": -28.454065322875977, "global_step": 656435, "epoch": 7908} {"train_loss": -27.752573013305664, "global_step": 656436, "epoch": 7908} {"train_loss": -28.348546981811523, "global_step": 656437, "epoch": 7908} {"train_loss": -28.16413688659668, "global_step": 656438, "epoch": 7908} {"train_loss": -28.443429946899414, "global_step": 656439, "epoch": 7908} {"train_loss": -28.225677490234375, "global_step": 656440, "epoch": 7908} {"train_loss": -28.4515323638916, "global_step": 656441, "epoch": 7908} {"train_loss": -27.967090606689453, "global_step": 656442, "epoch": 7908} {"train_loss": -28.346759796142578, "global_step": 656443, "epoch": 7908} {"train_loss": -28.40982437133789, "global_step": 656444, "epoch": 7908} {"train_loss": -28.36651611328125, "global_step": 656445, "epoch": 7908} {"train_loss": -27.860734479973114, "global_step": 656446, "epoch": 7908, "val_loss": 6613322.0} {"train_loss": -28.12904167175293, "global_step": 656447, "epoch": 7909} {"train_loss": -27.897689819335938, "global_step": 656448, "epoch": 7909} {"train_loss": -27.902990341186523, "global_step": 656449, "epoch": 7909} {"train_loss": -28.297927856445312, "global_step": 656450, "epoch": 7909} {"train_loss": -28.210920333862305, "global_step": 656451, "epoch": 7909} {"train_loss": -28.147932052612305, "global_step": 656452, "epoch": 7909} {"train_loss": -28.37255859375, "global_step": 656453, "epoch": 7909} {"train_loss": -28.474905014038086, "global_step": 656454, "epoch": 7909} {"train_loss": -28.220510482788086, "global_step": 656455, "epoch": 7909} {"train_loss": -27.973249435424805, "global_step": 656456, "epoch": 7909} {"train_loss": -28.348617553710938, "global_step": 656457, "epoch": 7909} {"train_loss": -28.33369255065918, "global_step": 656458, "epoch": 7909} {"train_loss": -28.01846694946289, "global_step": 656459, "epoch": 7909} {"train_loss": -28.078784942626953, "global_step": 656460, "epoch": 7909} {"train_loss": -28.200010299682617, "global_step": 656461, "epoch": 7909} {"train_loss": -28.16279411315918, "global_step": 656462, "epoch": 7909} {"train_loss": -28.322662353515625, "global_step": 656463, "epoch": 7909} {"train_loss": -27.878427505493164, "global_step": 656464, "epoch": 7909} {"train_loss": -28.050525665283203, "global_step": 656465, "epoch": 7909} {"train_loss": -27.9808292388916, "global_step": 656466, "epoch": 7909} {"train_loss": -27.781238555908203, "global_step": 656467, "epoch": 7909} {"train_loss": -28.006366729736328, "global_step": 656468, "epoch": 7909} {"train_loss": -28.292388916015625, "global_step": 656469, "epoch": 7909} {"train_loss": -27.913318634033203, "global_step": 656470, "epoch": 7909} {"train_loss": -28.348743438720703, "global_step": 656471, "epoch": 7909} {"train_loss": -28.48563575744629, "global_step": 656472, "epoch": 7909} {"train_loss": -28.078893661499023, "global_step": 656473, "epoch": 7909} {"train_loss": -28.06536293029785, "global_step": 656474, "epoch": 7909} {"train_loss": -28.180042266845703, "global_step": 656475, "epoch": 7909} {"train_loss": -28.417646408081055, "global_step": 656476, "epoch": 7909} {"train_loss": -28.544870376586914, "global_step": 656477, "epoch": 7909} {"train_loss": -28.398000717163086, "global_step": 656478, "epoch": 7909} {"train_loss": -28.0968074798584, "global_step": 656479, "epoch": 7909} {"train_loss": -28.330713272094727, "global_step": 656480, "epoch": 7909} {"train_loss": -28.24601173400879, "global_step": 656481, "epoch": 7909} {"train_loss": -28.692121505737305, "global_step": 656482, "epoch": 7909} {"train_loss": -28.848669052124023, "global_step": 656483, "epoch": 7909} {"train_loss": -27.904630661010742, "global_step": 656484, "epoch": 7909} {"train_loss": -28.108234405517578, "global_step": 656485, "epoch": 7909} {"train_loss": -28.310321807861328, "global_step": 656486, "epoch": 7909} {"train_loss": -28.37714958190918, "global_step": 656487, "epoch": 7909} {"train_loss": -28.44110107421875, "global_step": 656488, "epoch": 7909} {"train_loss": -28.269689559936523, "global_step": 656489, "epoch": 7909} {"train_loss": -28.390233993530273, "global_step": 656490, "epoch": 7909} {"train_loss": -28.518115997314453, "global_step": 656491, "epoch": 7909} {"train_loss": -28.302228927612305, "global_step": 656492, "epoch": 7909} {"train_loss": -27.906049728393555, "global_step": 656493, "epoch": 7909} {"train_loss": -28.506174087524414, "global_step": 656494, "epoch": 7909} {"train_loss": -27.76177978515625, "global_step": 656495, "epoch": 7909} {"train_loss": -27.87152671813965, "global_step": 656496, "epoch": 7909} {"train_loss": -28.493860244750977, "global_step": 656497, "epoch": 7909} {"train_loss": -27.80531883239746, "global_step": 656498, "epoch": 7909} {"train_loss": -28.131433486938477, "global_step": 656499, "epoch": 7909} {"train_loss": -28.198469161987305, "global_step": 656500, "epoch": 7909} {"train_loss": -27.534229278564453, "global_step": 656501, "epoch": 7909} {"train_loss": -28.36048698425293, "global_step": 656502, "epoch": 7909} {"train_loss": -28.79681396484375, "global_step": 656503, "epoch": 7909} {"train_loss": -28.174224853515625, "global_step": 656504, "epoch": 7909} {"train_loss": -28.43610191345215, "global_step": 656505, "epoch": 7909} {"train_loss": -28.283594131469727, "global_step": 656506, "epoch": 7909} {"train_loss": -28.31545066833496, "global_step": 656507, "epoch": 7909} {"train_loss": -28.45612907409668, "global_step": 656508, "epoch": 7909} {"train_loss": -28.513940811157227, "global_step": 656509, "epoch": 7909} {"train_loss": -28.318708419799805, "global_step": 656510, "epoch": 7909} {"train_loss": -28.38288688659668, "global_step": 656511, "epoch": 7909} {"train_loss": -28.541748046875, "global_step": 656512, "epoch": 7909} {"train_loss": -28.353973388671875, "global_step": 656513, "epoch": 7909} {"train_loss": -28.41608238220215, "global_step": 656514, "epoch": 7909} {"train_loss": -28.005924224853516, "global_step": 656515, "epoch": 7909} {"train_loss": -28.46649742126465, "global_step": 656516, "epoch": 7909} {"train_loss": -28.37139320373535, "global_step": 656517, "epoch": 7909} {"train_loss": -28.4124698638916, "global_step": 656518, "epoch": 7909} {"train_loss": -28.731491088867188, "global_step": 656519, "epoch": 7909} {"train_loss": -28.6103572845459, "global_step": 656520, "epoch": 7909} {"train_loss": -28.45206642150879, "global_step": 656521, "epoch": 7909} {"train_loss": -28.8118953704834, "global_step": 656522, "epoch": 7909} {"train_loss": -28.646398544311523, "global_step": 656523, "epoch": 7909} {"train_loss": -28.897205352783203, "global_step": 656524, "epoch": 7909} {"train_loss": -28.214130401611328, "global_step": 656525, "epoch": 7909} {"train_loss": -28.30660057067871, "global_step": 656526, "epoch": 7909} {"train_loss": -28.41684341430664, "global_step": 656527, "epoch": 7909} {"train_loss": -28.46921730041504, "global_step": 656528, "epoch": 7909} {"train_loss": -28.2664611540645, "global_step": 656529, "epoch": 7909, "val_loss": 6593136.5} {"train_loss": -26.815149307250977, "global_step": 656530, "epoch": 7910} {"train_loss": -26.495426177978516, "global_step": 656531, "epoch": 7910} {"train_loss": -27.8088321685791, "global_step": 656532, "epoch": 7910} {"train_loss": -27.1241455078125, "global_step": 656533, "epoch": 7910} {"train_loss": -27.038867950439453, "global_step": 656534, "epoch": 7910} {"train_loss": -27.34429931640625, "global_step": 656535, "epoch": 7910} {"train_loss": -28.161237716674805, "global_step": 656536, "epoch": 7910} {"train_loss": -27.51611328125, "global_step": 656537, "epoch": 7910} {"train_loss": -28.082304000854492, "global_step": 656538, "epoch": 7910} {"train_loss": -27.8455810546875, "global_step": 656539, "epoch": 7910} {"train_loss": -27.92976188659668, "global_step": 656540, "epoch": 7910} {"train_loss": -27.471633911132812, "global_step": 656541, "epoch": 7910} {"train_loss": -28.210031509399414, "global_step": 656542, "epoch": 7910} {"train_loss": -27.857954025268555, "global_step": 656543, "epoch": 7910} {"train_loss": -28.083942413330078, "global_step": 656544, "epoch": 7910} {"train_loss": -28.394819259643555, "global_step": 656545, "epoch": 7910} {"train_loss": -28.06068229675293, "global_step": 656546, "epoch": 7910} {"train_loss": -28.12708854675293, "global_step": 656547, "epoch": 7910} {"train_loss": -28.106229782104492, "global_step": 656548, "epoch": 7910} {"train_loss": -27.874740600585938, "global_step": 656549, "epoch": 7910} {"train_loss": -28.6050968170166, "global_step": 656550, "epoch": 7910} {"train_loss": -28.200321197509766, "global_step": 656551, "epoch": 7910} {"train_loss": -28.09156608581543, "global_step": 656552, "epoch": 7910} {"train_loss": -28.361072540283203, "global_step": 656553, "epoch": 7910} {"train_loss": -27.985595703125, "global_step": 656554, "epoch": 7910} {"train_loss": -28.025775909423828, "global_step": 656555, "epoch": 7910} {"train_loss": -28.169355392456055, "global_step": 656556, "epoch": 7910} {"train_loss": -28.2384090423584, "global_step": 656557, "epoch": 7910} {"train_loss": -28.138586044311523, "global_step": 656558, "epoch": 7910} {"train_loss": -28.766088485717773, "global_step": 656559, "epoch": 7910} {"train_loss": -28.249658584594727, "global_step": 656560, "epoch": 7910} {"train_loss": -28.084253311157227, "global_step": 656561, "epoch": 7910} {"train_loss": -28.477005004882812, "global_step": 656562, "epoch": 7910} {"train_loss": -28.323583602905273, "global_step": 656563, "epoch": 7910} {"train_loss": -28.633682250976562, "global_step": 656564, "epoch": 7910} {"train_loss": -28.528873443603516, "global_step": 656565, "epoch": 7910} {"train_loss": -28.33685874938965, "global_step": 656566, "epoch": 7910} {"train_loss": -28.759328842163086, "global_step": 656567, "epoch": 7910} {"train_loss": -28.19205093383789, "global_step": 656568, "epoch": 7910} {"train_loss": -28.646947860717773, "global_step": 656569, "epoch": 7910} {"train_loss": -28.338891983032227, "global_step": 656570, "epoch": 7910} {"train_loss": -28.770172119140625, "global_step": 656571, "epoch": 7910} {"train_loss": -28.494842529296875, "global_step": 656572, "epoch": 7910} {"train_loss": -28.600122451782227, "global_step": 656573, "epoch": 7910} {"train_loss": -28.368864059448242, "global_step": 656574, "epoch": 7910} {"train_loss": -27.838947296142578, "global_step": 656575, "epoch": 7910} {"train_loss": -28.536304473876953, "global_step": 656576, "epoch": 7910} {"train_loss": -28.211074829101562, "global_step": 656577, "epoch": 7910} {"train_loss": -28.004056930541992, "global_step": 656578, "epoch": 7910} {"train_loss": -28.319860458374023, "global_step": 656579, "epoch": 7910} {"train_loss": -28.451019287109375, "global_step": 656580, "epoch": 7910} {"train_loss": -28.756834030151367, "global_step": 656581, "epoch": 7910} {"train_loss": -28.27212905883789, "global_step": 656582, "epoch": 7910} {"train_loss": -28.264211654663086, "global_step": 656583, "epoch": 7910} {"train_loss": -28.34893226623535, "global_step": 656584, "epoch": 7910} {"train_loss": -28.301776885986328, "global_step": 656585, "epoch": 7910} {"train_loss": -28.219797134399414, "global_step": 656586, "epoch": 7910} {"train_loss": -28.58810806274414, "global_step": 656587, "epoch": 7910} {"train_loss": -28.655256271362305, "global_step": 656588, "epoch": 7910} {"train_loss": -28.46028709411621, "global_step": 656589, "epoch": 7910} {"train_loss": -28.564258575439453, "global_step": 656590, "epoch": 7910} {"train_loss": -28.655170440673828, "global_step": 656591, "epoch": 7910} {"train_loss": -28.568334579467773, "global_step": 656592, "epoch": 7910} {"train_loss": -28.864978790283203, "global_step": 656593, "epoch": 7910} {"train_loss": -28.115331649780273, "global_step": 656594, "epoch": 7910} {"train_loss": -27.993549346923828, "global_step": 656595, "epoch": 7910} {"train_loss": -27.77362632751465, "global_step": 656596, "epoch": 7910} {"train_loss": -27.870010375976562, "global_step": 656597, "epoch": 7910} {"train_loss": -27.955280303955078, "global_step": 656598, "epoch": 7910} {"train_loss": -28.4100284576416, "global_step": 656599, "epoch": 7910} {"train_loss": -28.29242515563965, "global_step": 656600, "epoch": 7910} {"train_loss": -28.445493698120117, "global_step": 656601, "epoch": 7910} {"train_loss": -28.530689239501953, "global_step": 656602, "epoch": 7910} {"train_loss": -28.24552345275879, "global_step": 656603, "epoch": 7910} {"train_loss": -28.491851806640625, "global_step": 656604, "epoch": 7910} {"train_loss": -28.15903663635254, "global_step": 656605, "epoch": 7910} {"train_loss": -28.442197799682617, "global_step": 656606, "epoch": 7910} {"train_loss": -28.436859130859375, "global_step": 656607, "epoch": 7910} {"train_loss": -28.399066925048828, "global_step": 656608, "epoch": 7910} {"train_loss": -28.143110275268555, "global_step": 656609, "epoch": 7910} {"train_loss": -28.51075553894043, "global_step": 656610, "epoch": 7910} {"train_loss": -27.814868927001953, "global_step": 656611, "epoch": 7910} {"train_loss": -28.18611167999635, "global_step": 656612, "epoch": 7910, "val_loss": 6639085.5} {"train_loss": -26.77309226989746, "global_step": 656613, "epoch": 7911} {"train_loss": -25.597553253173828, "global_step": 656614, "epoch": 7911} {"train_loss": -26.748632431030273, "global_step": 656615, "epoch": 7911} {"train_loss": -26.472665786743164, "global_step": 656616, "epoch": 7911} {"train_loss": -26.240522384643555, "global_step": 656617, "epoch": 7911} {"train_loss": -27.498666763305664, "global_step": 656618, "epoch": 7911} {"train_loss": -27.006031036376953, "global_step": 656619, "epoch": 7911} {"train_loss": -27.11907958984375, "global_step": 656620, "epoch": 7911} {"train_loss": -27.41104507446289, "global_step": 656621, "epoch": 7911} {"train_loss": -27.344390869140625, "global_step": 656622, "epoch": 7911} {"train_loss": -26.96929359436035, "global_step": 656623, "epoch": 7911} {"train_loss": -27.67854118347168, "global_step": 656624, "epoch": 7911} {"train_loss": -27.93488121032715, "global_step": 656625, "epoch": 7911} {"train_loss": -27.607946395874023, "global_step": 656626, "epoch": 7911} {"train_loss": -27.574426651000977, "global_step": 656627, "epoch": 7911} {"train_loss": -27.597187042236328, "global_step": 656628, "epoch": 7911} {"train_loss": -27.76099967956543, "global_step": 656629, "epoch": 7911} {"train_loss": -27.91468620300293, "global_step": 656630, "epoch": 7911} {"train_loss": -27.744312286376953, "global_step": 656631, "epoch": 7911} {"train_loss": -27.372272491455078, "global_step": 656632, "epoch": 7911} {"train_loss": -27.787023544311523, "global_step": 656633, "epoch": 7911} {"train_loss": -27.678455352783203, "global_step": 656634, "epoch": 7911} {"train_loss": -28.05341148376465, "global_step": 656635, "epoch": 7911} {"train_loss": -27.901962280273438, "global_step": 656636, "epoch": 7911} {"train_loss": -27.70611572265625, "global_step": 656637, "epoch": 7911} {"train_loss": -27.946048736572266, "global_step": 656638, "epoch": 7911} {"train_loss": -27.906723022460938, "global_step": 656639, "epoch": 7911} {"train_loss": -27.67890739440918, "global_step": 656640, "epoch": 7911} {"train_loss": -28.31141471862793, "global_step": 656641, "epoch": 7911} {"train_loss": -28.11768913269043, "global_step": 656642, "epoch": 7911} {"train_loss": -28.20484733581543, "global_step": 656643, "epoch": 7911} {"train_loss": -28.032743453979492, "global_step": 656644, "epoch": 7911} {"train_loss": -28.22493553161621, "global_step": 656645, "epoch": 7911} {"train_loss": -28.3244686126709, "global_step": 656646, "epoch": 7911} {"train_loss": -28.35823631286621, "global_step": 656647, "epoch": 7911} {"train_loss": -28.025562286376953, "global_step": 656648, "epoch": 7911} {"train_loss": -28.029388427734375, "global_step": 656649, "epoch": 7911} {"train_loss": -27.886810302734375, "global_step": 656650, "epoch": 7911} {"train_loss": -28.234655380249023, "global_step": 656651, "epoch": 7911} {"train_loss": -28.245298385620117, "global_step": 656652, "epoch": 7911} {"train_loss": -28.17548179626465, "global_step": 656653, "epoch": 7911} {"train_loss": -28.292638778686523, "global_step": 656654, "epoch": 7911} {"train_loss": -28.3026123046875, "global_step": 656655, "epoch": 7911} {"train_loss": -28.406274795532227, "global_step": 656656, "epoch": 7911} {"train_loss": -28.526203155517578, "global_step": 656657, "epoch": 7911} {"train_loss": -28.798925399780273, "global_step": 656658, "epoch": 7911} {"train_loss": -28.506444931030273, "global_step": 656659, "epoch": 7911} {"train_loss": -28.691024780273438, "global_step": 656660, "epoch": 7911} {"train_loss": -28.29668617248535, "global_step": 656661, "epoch": 7911} {"train_loss": -28.37530517578125, "global_step": 656662, "epoch": 7911} {"train_loss": -28.424585342407227, "global_step": 656663, "epoch": 7911} {"train_loss": -28.73467445373535, "global_step": 656664, "epoch": 7911} {"train_loss": -28.447219848632812, "global_step": 656665, "epoch": 7911} {"train_loss": -28.709747314453125, "global_step": 656666, "epoch": 7911} {"train_loss": -28.471662521362305, "global_step": 656667, "epoch": 7911} {"train_loss": -28.452600479125977, "global_step": 656668, "epoch": 7911} {"train_loss": -28.732898712158203, "global_step": 656669, "epoch": 7911} {"train_loss": -28.788171768188477, "global_step": 656670, "epoch": 7911} {"train_loss": -28.520599365234375, "global_step": 656671, "epoch": 7911} {"train_loss": -28.51881980895996, "global_step": 656672, "epoch": 7911} {"train_loss": -28.724912643432617, "global_step": 656673, "epoch": 7911} {"train_loss": -28.8608455657959, "global_step": 656674, "epoch": 7911} {"train_loss": -28.7327823638916, "global_step": 656675, "epoch": 7911} {"train_loss": -28.6934757232666, "global_step": 656676, "epoch": 7911} {"train_loss": -28.763751983642578, "global_step": 656677, "epoch": 7911} {"train_loss": -28.3563232421875, "global_step": 656678, "epoch": 7911} {"train_loss": -28.5682430267334, "global_step": 656679, "epoch": 7911} {"train_loss": -28.687238693237305, "global_step": 656680, "epoch": 7911} {"train_loss": -28.430908203125, "global_step": 656681, "epoch": 7911} {"train_loss": -28.891386032104492, "global_step": 656682, "epoch": 7911} {"train_loss": -28.586679458618164, "global_step": 656683, "epoch": 7911} {"train_loss": -28.734704971313477, "global_step": 656684, "epoch": 7911} {"train_loss": -28.252714157104492, "global_step": 656685, "epoch": 7911} {"train_loss": -28.1527042388916, "global_step": 656686, "epoch": 7911} {"train_loss": -28.534488677978516, "global_step": 656687, "epoch": 7911} {"train_loss": -28.7174129486084, "global_step": 656688, "epoch": 7911} {"train_loss": -28.3625431060791, "global_step": 656689, "epoch": 7911} {"train_loss": -28.61166763305664, "global_step": 656690, "epoch": 7911} {"train_loss": -28.278284072875977, "global_step": 656691, "epoch": 7911} {"train_loss": -28.787607192993164, "global_step": 656692, "epoch": 7911} {"train_loss": -28.26993179321289, "global_step": 656693, "epoch": 7911} {"train_loss": -28.1699161529541, "global_step": 656694, "epoch": 7911} {"train_loss": -28.064986010631884, "global_step": 656695, "epoch": 7911, "val_loss": 6604509.0} {"train_loss": -25.752660751342773, "global_step": 656696, "epoch": 7912} {"train_loss": -25.3325252532959, "global_step": 656697, "epoch": 7912} {"train_loss": -24.944971084594727, "global_step": 656698, "epoch": 7912} {"train_loss": -25.88494300842285, "global_step": 656699, "epoch": 7912} {"train_loss": -25.759063720703125, "global_step": 656700, "epoch": 7912} {"train_loss": -26.721826553344727, "global_step": 656701, "epoch": 7912} {"train_loss": -26.728879928588867, "global_step": 656702, "epoch": 7912} {"train_loss": -27.1651668548584, "global_step": 656703, "epoch": 7912} {"train_loss": -26.48921012878418, "global_step": 656704, "epoch": 7912} {"train_loss": -27.510587692260742, "global_step": 656705, "epoch": 7912} {"train_loss": -27.2377986907959, "global_step": 656706, "epoch": 7912} {"train_loss": -26.761632919311523, "global_step": 656707, "epoch": 7912} {"train_loss": -26.694318771362305, "global_step": 656708, "epoch": 7912} {"train_loss": -27.15113639831543, "global_step": 656709, "epoch": 7912} {"train_loss": -26.92734146118164, "global_step": 656710, "epoch": 7912} {"train_loss": -27.44647216796875, "global_step": 656711, "epoch": 7912} {"train_loss": -27.119125366210938, "global_step": 656712, "epoch": 7912} {"train_loss": -27.59651756286621, "global_step": 656713, "epoch": 7912} {"train_loss": -27.685382843017578, "global_step": 656714, "epoch": 7912} {"train_loss": -27.770166397094727, "global_step": 656715, "epoch": 7912} {"train_loss": -27.74506950378418, "global_step": 656716, "epoch": 7912} {"train_loss": -27.07224464416504, "global_step": 656717, "epoch": 7912} {"train_loss": -27.413043975830078, "global_step": 656718, "epoch": 7912} {"train_loss": -27.579675674438477, "global_step": 656719, "epoch": 7912} {"train_loss": -27.719221115112305, "global_step": 656720, "epoch": 7912} {"train_loss": -27.438373565673828, "global_step": 656721, "epoch": 7912} {"train_loss": -27.563247680664062, "global_step": 656722, "epoch": 7912} {"train_loss": -27.750904083251953, "global_step": 656723, "epoch": 7912} {"train_loss": -27.875152587890625, "global_step": 656724, "epoch": 7912} {"train_loss": -27.846546173095703, "global_step": 656725, "epoch": 7912} {"train_loss": -27.585697174072266, "global_step": 656726, "epoch": 7912} {"train_loss": -27.764556884765625, "global_step": 656727, "epoch": 7912} {"train_loss": -27.52715492248535, "global_step": 656728, "epoch": 7912} {"train_loss": -27.823392868041992, "global_step": 656729, "epoch": 7912} {"train_loss": -27.824695587158203, "global_step": 656730, "epoch": 7912} {"train_loss": -27.721454620361328, "global_step": 656731, "epoch": 7912} {"train_loss": -27.754425048828125, "global_step": 656732, "epoch": 7912} {"train_loss": -28.011930465698242, "global_step": 656733, "epoch": 7912} {"train_loss": -28.23301124572754, "global_step": 656734, "epoch": 7912} {"train_loss": -28.250791549682617, "global_step": 656735, "epoch": 7912} {"train_loss": -27.718469619750977, "global_step": 656736, "epoch": 7912} {"train_loss": -28.18588638305664, "global_step": 656737, "epoch": 7912} {"train_loss": -28.20381736755371, "global_step": 656738, "epoch": 7912} {"train_loss": -28.375539779663086, "global_step": 656739, "epoch": 7912} {"train_loss": -28.28460121154785, "global_step": 656740, "epoch": 7912} {"train_loss": -28.337488174438477, "global_step": 656741, "epoch": 7912} {"train_loss": -28.11136245727539, "global_step": 656742, "epoch": 7912} {"train_loss": -28.215356826782227, "global_step": 656743, "epoch": 7912} {"train_loss": -28.35120964050293, "global_step": 656744, "epoch": 7912} {"train_loss": -28.06080436706543, "global_step": 656745, "epoch": 7912} {"train_loss": -28.07953453063965, "global_step": 656746, "epoch": 7912} {"train_loss": -28.146093368530273, "global_step": 656747, "epoch": 7912} {"train_loss": -28.24726676940918, "global_step": 656748, "epoch": 7912} {"train_loss": -28.481002807617188, "global_step": 656749, "epoch": 7912} {"train_loss": -28.416702270507812, "global_step": 656750, "epoch": 7912} {"train_loss": -28.552703857421875, "global_step": 656751, "epoch": 7912} {"train_loss": -28.61028480529785, "global_step": 656752, "epoch": 7912} {"train_loss": -28.395658493041992, "global_step": 656753, "epoch": 7912} {"train_loss": -28.06281852722168, "global_step": 656754, "epoch": 7912} {"train_loss": -28.35400390625, "global_step": 656755, "epoch": 7912} {"train_loss": -28.44626235961914, "global_step": 656756, "epoch": 7912} {"train_loss": -28.17399024963379, "global_step": 656757, "epoch": 7912} {"train_loss": -28.75587272644043, "global_step": 656758, "epoch": 7912} {"train_loss": -28.478662490844727, "global_step": 656759, "epoch": 7912} {"train_loss": -28.34516716003418, "global_step": 656760, "epoch": 7912} {"train_loss": -28.45879554748535, "global_step": 656761, "epoch": 7912} {"train_loss": -28.357208251953125, "global_step": 656762, "epoch": 7912} {"train_loss": -28.35662841796875, "global_step": 656763, "epoch": 7912} {"train_loss": -28.979345321655273, "global_step": 656764, "epoch": 7912} {"train_loss": -28.268512725830078, "global_step": 656765, "epoch": 7912} {"train_loss": -28.73151969909668, "global_step": 656766, "epoch": 7912} {"train_loss": -28.5245304107666, "global_step": 656767, "epoch": 7912} {"train_loss": -28.569013595581055, "global_step": 656768, "epoch": 7912} {"train_loss": -28.66240882873535, "global_step": 656769, "epoch": 7912} {"train_loss": -28.329437255859375, "global_step": 656770, "epoch": 7912} {"train_loss": -28.602705001831055, "global_step": 656771, "epoch": 7912} {"train_loss": -28.619403839111328, "global_step": 656772, "epoch": 7912} {"train_loss": -28.804059982299805, "global_step": 656773, "epoch": 7912} {"train_loss": -28.828857421875, "global_step": 656774, "epoch": 7912} {"train_loss": -28.38421630859375, "global_step": 656775, "epoch": 7912} {"train_loss": -28.537250518798828, "global_step": 656776, "epoch": 7912} {"train_loss": -28.252277374267578, "global_step": 656777, "epoch": 7912} {"train_loss": -27.83918056717838, "global_step": 656778, "epoch": 7912, "val_loss": 6646348.0} {"train_loss": -27.353986740112305, "global_step": 656779, "epoch": 7913} {"train_loss": -28.044147491455078, "global_step": 656780, "epoch": 7913} {"train_loss": -27.589080810546875, "global_step": 656781, "epoch": 7913} {"train_loss": -27.625141143798828, "global_step": 656782, "epoch": 7913} {"train_loss": -28.219724655151367, "global_step": 656783, "epoch": 7913} {"train_loss": -28.19369888305664, "global_step": 656784, "epoch": 7913} {"train_loss": -28.027074813842773, "global_step": 656785, "epoch": 7913} {"train_loss": -27.828643798828125, "global_step": 656786, "epoch": 7913} {"train_loss": -28.15276527404785, "global_step": 656787, "epoch": 7913} {"train_loss": -28.217626571655273, "global_step": 656788, "epoch": 7913} {"train_loss": -28.346982955932617, "global_step": 656789, "epoch": 7913} {"train_loss": -28.177331924438477, "global_step": 656790, "epoch": 7913} {"train_loss": -27.859210968017578, "global_step": 656791, "epoch": 7913} {"train_loss": -28.041614532470703, "global_step": 656792, "epoch": 7913} {"train_loss": -28.37860107421875, "global_step": 656793, "epoch": 7913} {"train_loss": -27.671340942382812, "global_step": 656794, "epoch": 7913} {"train_loss": -28.043182373046875, "global_step": 656795, "epoch": 7913} {"train_loss": -28.56781578063965, "global_step": 656796, "epoch": 7913} {"train_loss": -27.831836700439453, "global_step": 656797, "epoch": 7913} {"train_loss": -28.31087303161621, "global_step": 656798, "epoch": 7913} {"train_loss": -28.337085723876953, "global_step": 656799, "epoch": 7913} {"train_loss": -28.318044662475586, "global_step": 656800, "epoch": 7913} {"train_loss": -27.891687393188477, "global_step": 656801, "epoch": 7913} {"train_loss": -28.056272506713867, "global_step": 656802, "epoch": 7913} {"train_loss": -28.60062599182129, "global_step": 656803, "epoch": 7913} {"train_loss": -27.956619262695312, "global_step": 656804, "epoch": 7913} {"train_loss": -28.176361083984375, "global_step": 656805, "epoch": 7913} {"train_loss": -28.157556533813477, "global_step": 656806, "epoch": 7913} {"train_loss": -27.813465118408203, "global_step": 656807, "epoch": 7913} {"train_loss": -28.086225509643555, "global_step": 656808, "epoch": 7913} {"train_loss": -28.296979904174805, "global_step": 656809, "epoch": 7913} {"train_loss": -28.24560546875, "global_step": 656810, "epoch": 7913} {"train_loss": -27.901504516601562, "global_step": 656811, "epoch": 7913} {"train_loss": -28.075790405273438, "global_step": 656812, "epoch": 7913} {"train_loss": -28.47637367248535, "global_step": 656813, "epoch": 7913} {"train_loss": -28.27814292907715, "global_step": 656814, "epoch": 7913} {"train_loss": -28.708139419555664, "global_step": 656815, "epoch": 7913} {"train_loss": -27.984272003173828, "global_step": 656816, "epoch": 7913} {"train_loss": -28.477325439453125, "global_step": 656817, "epoch": 7913} {"train_loss": -28.073139190673828, "global_step": 656818, "epoch": 7913} {"train_loss": -28.671422958374023, "global_step": 656819, "epoch": 7913} {"train_loss": -28.507984161376953, "global_step": 656820, "epoch": 7913} {"train_loss": -28.04987907409668, "global_step": 656821, "epoch": 7913} {"train_loss": -28.39264488220215, "global_step": 656822, "epoch": 7913} {"train_loss": -28.52162742614746, "global_step": 656823, "epoch": 7913} {"train_loss": -28.22052574157715, "global_step": 656824, "epoch": 7913} {"train_loss": -28.6195125579834, "global_step": 656825, "epoch": 7913} {"train_loss": -28.679931640625, "global_step": 656826, "epoch": 7913} {"train_loss": -28.811853408813477, "global_step": 656827, "epoch": 7913} {"train_loss": -28.431625366210938, "global_step": 656828, "epoch": 7913} {"train_loss": -28.716257095336914, "global_step": 656829, "epoch": 7913} {"train_loss": -28.30958366394043, "global_step": 656830, "epoch": 7913} {"train_loss": -28.744220733642578, "global_step": 656831, "epoch": 7913} {"train_loss": -28.33258628845215, "global_step": 656832, "epoch": 7913} {"train_loss": -28.965255737304688, "global_step": 656833, "epoch": 7913} {"train_loss": -28.381948471069336, "global_step": 656834, "epoch": 7913} {"train_loss": -28.31327247619629, "global_step": 656835, "epoch": 7913} {"train_loss": -28.033645629882812, "global_step": 656836, "epoch": 7913} {"train_loss": -28.394794464111328, "global_step": 656837, "epoch": 7913} {"train_loss": -28.814756393432617, "global_step": 656838, "epoch": 7913} {"train_loss": -28.590560913085938, "global_step": 656839, "epoch": 7913} {"train_loss": -28.69256591796875, "global_step": 656840, "epoch": 7913} {"train_loss": -28.356616973876953, "global_step": 656841, "epoch": 7913} {"train_loss": -28.691064834594727, "global_step": 656842, "epoch": 7913} {"train_loss": -28.417724609375, "global_step": 656843, "epoch": 7913} {"train_loss": -28.338048934936523, "global_step": 656844, "epoch": 7913} {"train_loss": -28.51188087463379, "global_step": 656845, "epoch": 7913} {"train_loss": -28.50054359436035, "global_step": 656846, "epoch": 7913} {"train_loss": -28.652475357055664, "global_step": 656847, "epoch": 7913} {"train_loss": -28.765583038330078, "global_step": 656848, "epoch": 7913} {"train_loss": -28.773685455322266, "global_step": 656849, "epoch": 7913} {"train_loss": -28.8309326171875, "global_step": 656850, "epoch": 7913} {"train_loss": -28.564666748046875, "global_step": 656851, "epoch": 7913} {"train_loss": -28.52869987487793, "global_step": 656852, "epoch": 7913} {"train_loss": -28.55681800842285, "global_step": 656853, "epoch": 7913} {"train_loss": -28.230066299438477, "global_step": 656854, "epoch": 7913} {"train_loss": -27.788724899291992, "global_step": 656855, "epoch": 7913} {"train_loss": -27.319610595703125, "global_step": 656856, "epoch": 7913} {"train_loss": -27.611347198486328, "global_step": 656857, "epoch": 7913} {"train_loss": -28.204669952392578, "global_step": 656858, "epoch": 7913} {"train_loss": -28.7481689453125, "global_step": 656859, "epoch": 7913} {"train_loss": -28.1538143157959, "global_step": 656860, "epoch": 7913} {"train_loss": -28.28359994543604, "global_step": 656861, "epoch": 7913, "val_loss": 6650797.0} {"train_loss": -27.22979164123535, "global_step": 656862, "epoch": 7914} {"train_loss": -26.60989761352539, "global_step": 656863, "epoch": 7914} {"train_loss": -26.914087295532227, "global_step": 656864, "epoch": 7914} {"train_loss": -28.075475692749023, "global_step": 656865, "epoch": 7914} {"train_loss": -27.357763290405273, "global_step": 656866, "epoch": 7914} {"train_loss": -27.047292709350586, "global_step": 656867, "epoch": 7914} {"train_loss": -27.321218490600586, "global_step": 656868, "epoch": 7914} {"train_loss": -27.810468673706055, "global_step": 656869, "epoch": 7914} {"train_loss": -27.590662002563477, "global_step": 656870, "epoch": 7914} {"train_loss": -27.960020065307617, "global_step": 656871, "epoch": 7914} {"train_loss": -28.044286727905273, "global_step": 656872, "epoch": 7914} {"train_loss": -27.849348068237305, "global_step": 656873, "epoch": 7914} {"train_loss": -27.876956939697266, "global_step": 656874, "epoch": 7914} {"train_loss": -28.101633071899414, "global_step": 656875, "epoch": 7914} {"train_loss": -27.839385986328125, "global_step": 656876, "epoch": 7914} {"train_loss": -28.040307998657227, "global_step": 656877, "epoch": 7914} {"train_loss": -28.335357666015625, "global_step": 656878, "epoch": 7914} {"train_loss": -28.223844528198242, "global_step": 656879, "epoch": 7914} {"train_loss": -28.1702938079834, "global_step": 656880, "epoch": 7914} {"train_loss": -28.129169464111328, "global_step": 656881, "epoch": 7914} {"train_loss": -28.57966423034668, "global_step": 656882, "epoch": 7914} {"train_loss": -27.713964462280273, "global_step": 656883, "epoch": 7914} {"train_loss": -28.01143455505371, "global_step": 656884, "epoch": 7914} {"train_loss": -27.925283432006836, "global_step": 656885, "epoch": 7914} {"train_loss": -27.742294311523438, "global_step": 656886, "epoch": 7914} {"train_loss": -28.10810661315918, "global_step": 656887, "epoch": 7914} {"train_loss": -28.22675895690918, "global_step": 656888, "epoch": 7914} {"train_loss": -28.021194458007812, "global_step": 656889, "epoch": 7914} {"train_loss": -28.479490280151367, "global_step": 656890, "epoch": 7914} {"train_loss": -28.179386138916016, "global_step": 656891, "epoch": 7914} {"train_loss": -28.537185668945312, "global_step": 656892, "epoch": 7914} {"train_loss": -28.291717529296875, "global_step": 656893, "epoch": 7914} {"train_loss": -28.338315963745117, "global_step": 656894, "epoch": 7914} {"train_loss": -28.471210479736328, "global_step": 656895, "epoch": 7914} {"train_loss": -28.438318252563477, "global_step": 656896, "epoch": 7914} {"train_loss": -28.360509872436523, "global_step": 656897, "epoch": 7914} {"train_loss": -28.262439727783203, "global_step": 656898, "epoch": 7914} {"train_loss": -28.252227783203125, "global_step": 656899, "epoch": 7914} {"train_loss": -28.63397216796875, "global_step": 656900, "epoch": 7914} {"train_loss": -28.48651123046875, "global_step": 656901, "epoch": 7914} {"train_loss": -28.38960075378418, "global_step": 656902, "epoch": 7914} {"train_loss": -28.537464141845703, "global_step": 656903, "epoch": 7914} {"train_loss": -28.26865577697754, "global_step": 656904, "epoch": 7914} {"train_loss": -28.462270736694336, "global_step": 656905, "epoch": 7914} {"train_loss": -28.252166748046875, "global_step": 656906, "epoch": 7914} {"train_loss": -28.381134033203125, "global_step": 656907, "epoch": 7914} {"train_loss": -28.735870361328125, "global_step": 656908, "epoch": 7914} {"train_loss": -28.54953956604004, "global_step": 656909, "epoch": 7914} {"train_loss": -28.243261337280273, "global_step": 656910, "epoch": 7914} {"train_loss": -28.48622703552246, "global_step": 656911, "epoch": 7914} {"train_loss": -28.32672691345215, "global_step": 656912, "epoch": 7914} {"train_loss": -28.375690460205078, "global_step": 656913, "epoch": 7914} {"train_loss": -28.528501510620117, "global_step": 656914, "epoch": 7914} {"train_loss": -28.456836700439453, "global_step": 656915, "epoch": 7914} {"train_loss": -28.32063102722168, "global_step": 656916, "epoch": 7914} {"train_loss": -28.415943145751953, "global_step": 656917, "epoch": 7914} {"train_loss": -28.104522705078125, "global_step": 656918, "epoch": 7914} {"train_loss": -28.431039810180664, "global_step": 656919, "epoch": 7914} {"train_loss": -28.378782272338867, "global_step": 656920, "epoch": 7914} {"train_loss": -28.27723503112793, "global_step": 656921, "epoch": 7914} {"train_loss": -28.601119995117188, "global_step": 656922, "epoch": 7914} {"train_loss": -28.64081382751465, "global_step": 656923, "epoch": 7914} {"train_loss": -28.14898681640625, "global_step": 656924, "epoch": 7914} {"train_loss": -28.340559005737305, "global_step": 656925, "epoch": 7914} {"train_loss": -28.427536010742188, "global_step": 656926, "epoch": 7914} {"train_loss": -27.873554229736328, "global_step": 656927, "epoch": 7914} {"train_loss": -27.463916778564453, "global_step": 656928, "epoch": 7914} {"train_loss": -27.81460952758789, "global_step": 656929, "epoch": 7914} {"train_loss": -28.10532569885254, "global_step": 656930, "epoch": 7914} {"train_loss": -28.22553825378418, "global_step": 656931, "epoch": 7914} {"train_loss": -28.423782348632812, "global_step": 656932, "epoch": 7914} {"train_loss": -27.992176055908203, "global_step": 656933, "epoch": 7914} {"train_loss": -27.9964542388916, "global_step": 656934, "epoch": 7914} {"train_loss": -28.41480827331543, "global_step": 656935, "epoch": 7914} {"train_loss": -28.530170440673828, "global_step": 656936, "epoch": 7914} {"train_loss": -28.301483154296875, "global_step": 656937, "epoch": 7914} {"train_loss": -28.106704711914062, "global_step": 656938, "epoch": 7914} {"train_loss": -28.359373092651367, "global_step": 656939, "epoch": 7914} {"train_loss": -28.20782470703125, "global_step": 656940, "epoch": 7914} {"train_loss": -28.411712646484375, "global_step": 656941, "epoch": 7914} {"train_loss": -28.518024444580078, "global_step": 656942, "epoch": 7914} {"train_loss": -28.12723731994629, "global_step": 656943, "epoch": 7914} {"train_loss": -28.153130358960254, "global_step": 656944, "epoch": 7914, "val_loss": 6679398.0} {"train_loss": -28.045459747314453, "global_step": 656945, "epoch": 7915} {"train_loss": -28.060028076171875, "global_step": 656946, "epoch": 7915} {"train_loss": -28.073957443237305, "global_step": 656947, "epoch": 7915} {"train_loss": -27.732030868530273, "global_step": 656948, "epoch": 7915} {"train_loss": -27.944656372070312, "global_step": 656949, "epoch": 7915} {"train_loss": -28.235925674438477, "global_step": 656950, "epoch": 7915} {"train_loss": -28.116809844970703, "global_step": 656951, "epoch": 7915} {"train_loss": -28.263219833374023, "global_step": 656952, "epoch": 7915} {"train_loss": -28.154687881469727, "global_step": 656953, "epoch": 7915} {"train_loss": -27.886316299438477, "global_step": 656954, "epoch": 7915} {"train_loss": -28.546483993530273, "global_step": 656955, "epoch": 7915} {"train_loss": -28.231298446655273, "global_step": 656956, "epoch": 7915} {"train_loss": -28.159423828125, "global_step": 656957, "epoch": 7915} {"train_loss": -28.304656982421875, "global_step": 656958, "epoch": 7915} {"train_loss": -28.52215003967285, "global_step": 656959, "epoch": 7915} {"train_loss": -28.580902099609375, "global_step": 656960, "epoch": 7915} {"train_loss": -28.113088607788086, "global_step": 656961, "epoch": 7915} {"train_loss": -28.33669090270996, "global_step": 656962, "epoch": 7915} {"train_loss": -28.6439266204834, "global_step": 656963, "epoch": 7915} {"train_loss": -28.50860595703125, "global_step": 656964, "epoch": 7915} {"train_loss": -28.261449813842773, "global_step": 656965, "epoch": 7915} {"train_loss": -28.439777374267578, "global_step": 656966, "epoch": 7915} {"train_loss": -28.526721954345703, "global_step": 656967, "epoch": 7915} {"train_loss": -28.47593116760254, "global_step": 656968, "epoch": 7915} {"train_loss": -28.0396728515625, "global_step": 656969, "epoch": 7915} {"train_loss": -28.514209747314453, "global_step": 656970, "epoch": 7915} {"train_loss": -28.26093864440918, "global_step": 656971, "epoch": 7915} {"train_loss": -28.69683837890625, "global_step": 656972, "epoch": 7915} {"train_loss": -28.80232048034668, "global_step": 656973, "epoch": 7915} {"train_loss": -28.333301544189453, "global_step": 656974, "epoch": 7915} {"train_loss": -28.461145401000977, "global_step": 656975, "epoch": 7915} {"train_loss": -28.565021514892578, "global_step": 656976, "epoch": 7915} {"train_loss": -28.611572265625, "global_step": 656977, "epoch": 7915} {"train_loss": -28.3673095703125, "global_step": 656978, "epoch": 7915} {"train_loss": -28.100004196166992, "global_step": 656979, "epoch": 7915} {"train_loss": -28.74285888671875, "global_step": 656980, "epoch": 7915} {"train_loss": -28.46933937072754, "global_step": 656981, "epoch": 7915} {"train_loss": -28.7813720703125, "global_step": 656982, "epoch": 7915} {"train_loss": -28.4729061126709, "global_step": 656983, "epoch": 7915} {"train_loss": -28.317930221557617, "global_step": 656984, "epoch": 7915} {"train_loss": -28.343149185180664, "global_step": 656985, "epoch": 7915} {"train_loss": -28.06300163269043, "global_step": 656986, "epoch": 7915} {"train_loss": -28.687345504760742, "global_step": 656987, "epoch": 7915} {"train_loss": -28.389875411987305, "global_step": 656988, "epoch": 7915} {"train_loss": -28.926671981811523, "global_step": 656989, "epoch": 7915} {"train_loss": -27.9616756439209, "global_step": 656990, "epoch": 7915} {"train_loss": -28.243268966674805, "global_step": 656991, "epoch": 7915} {"train_loss": -28.328466415405273, "global_step": 656992, "epoch": 7915} {"train_loss": -28.607166290283203, "global_step": 656993, "epoch": 7915} {"train_loss": -28.497236251831055, "global_step": 656994, "epoch": 7915} {"train_loss": -28.450681686401367, "global_step": 656995, "epoch": 7915} {"train_loss": -28.465280532836914, "global_step": 656996, "epoch": 7915} {"train_loss": -28.584287643432617, "global_step": 656997, "epoch": 7915} {"train_loss": -28.28125, "global_step": 656998, "epoch": 7915} {"train_loss": -28.19293785095215, "global_step": 656999, "epoch": 7915} {"train_loss": -28.149246215820312, "global_step": 657000, "epoch": 7915} {"train_loss": -28.324689865112305, "global_step": 657001, "epoch": 7915} {"train_loss": -28.179880142211914, "global_step": 657002, "epoch": 7915} {"train_loss": -28.628705978393555, "global_step": 657003, "epoch": 7915} {"train_loss": -27.865631103515625, "global_step": 657004, "epoch": 7915} {"train_loss": -28.306751251220703, "global_step": 657005, "epoch": 7915} {"train_loss": -28.321313858032227, "global_step": 657006, "epoch": 7915} {"train_loss": -28.199920654296875, "global_step": 657007, "epoch": 7915} {"train_loss": -28.19074058532715, "global_step": 657008, "epoch": 7915} {"train_loss": -28.642236709594727, "global_step": 657009, "epoch": 7915} {"train_loss": -28.395416259765625, "global_step": 657010, "epoch": 7915} {"train_loss": -28.596435546875, "global_step": 657011, "epoch": 7915} {"train_loss": -28.80836296081543, "global_step": 657012, "epoch": 7915} {"train_loss": -28.66571044921875, "global_step": 657013, "epoch": 7915} {"train_loss": -28.825536727905273, "global_step": 657014, "epoch": 7915} {"train_loss": -28.302448272705078, "global_step": 657015, "epoch": 7915} {"train_loss": -28.316198348999023, "global_step": 657016, "epoch": 7915} {"train_loss": -28.681537628173828, "global_step": 657017, "epoch": 7915} {"train_loss": -28.329425811767578, "global_step": 657018, "epoch": 7915} {"train_loss": -28.709278106689453, "global_step": 657019, "epoch": 7915} {"train_loss": -28.6214656829834, "global_step": 657020, "epoch": 7915} {"train_loss": -28.81072998046875, "global_step": 657021, "epoch": 7915} {"train_loss": -28.499425888061523, "global_step": 657022, "epoch": 7915} {"train_loss": -28.55350685119629, "global_step": 657023, "epoch": 7915} {"train_loss": -28.458209991455078, "global_step": 657024, "epoch": 7915} {"train_loss": -28.369882583618164, "global_step": 657025, "epoch": 7915} {"train_loss": -28.768783569335938, "global_step": 657026, "epoch": 7915} {"train_loss": -28.39382684087179, "global_step": 657027, "epoch": 7915, "val_loss": 6703032.0} {"train_loss": -25.805219650268555, "global_step": 657028, "epoch": 7916} {"train_loss": -26.804548263549805, "global_step": 657029, "epoch": 7916} {"train_loss": -27.61542320251465, "global_step": 657030, "epoch": 7916} {"train_loss": -26.74969482421875, "global_step": 657031, "epoch": 7916} {"train_loss": -27.240081787109375, "global_step": 657032, "epoch": 7916} {"train_loss": -26.293725967407227, "global_step": 657033, "epoch": 7916} {"train_loss": -26.67214012145996, "global_step": 657034, "epoch": 7916} {"train_loss": -26.71148681640625, "global_step": 657035, "epoch": 7916} {"train_loss": -27.540149688720703, "global_step": 657036, "epoch": 7916} {"train_loss": -27.451379776000977, "global_step": 657037, "epoch": 7916} {"train_loss": -27.621686935424805, "global_step": 657038, "epoch": 7916} {"train_loss": -27.301538467407227, "global_step": 657039, "epoch": 7916} {"train_loss": -26.834808349609375, "global_step": 657040, "epoch": 7916} {"train_loss": -27.714893341064453, "global_step": 657041, "epoch": 7916} {"train_loss": -27.551618576049805, "global_step": 657042, "epoch": 7916} {"train_loss": -27.396869659423828, "global_step": 657043, "epoch": 7916} {"train_loss": -27.870349884033203, "global_step": 657044, "epoch": 7916} {"train_loss": -27.36305046081543, "global_step": 657045, "epoch": 7916} {"train_loss": -27.909759521484375, "global_step": 657046, "epoch": 7916} {"train_loss": -27.56650733947754, "global_step": 657047, "epoch": 7916} {"train_loss": -27.707563400268555, "global_step": 657048, "epoch": 7916} {"train_loss": -27.75896644592285, "global_step": 657049, "epoch": 7916} {"train_loss": -28.024213790893555, "global_step": 657050, "epoch": 7916} {"train_loss": -27.949798583984375, "global_step": 657051, "epoch": 7916} {"train_loss": -27.75642204284668, "global_step": 657052, "epoch": 7916} {"train_loss": -27.944217681884766, "global_step": 657053, "epoch": 7916} {"train_loss": -28.168603897094727, "global_step": 657054, "epoch": 7916} {"train_loss": -28.030725479125977, "global_step": 657055, "epoch": 7916} {"train_loss": -27.921340942382812, "global_step": 657056, "epoch": 7916} {"train_loss": -28.01677894592285, "global_step": 657057, "epoch": 7916} {"train_loss": -28.11767578125, "global_step": 657058, "epoch": 7916} {"train_loss": -27.75143814086914, "global_step": 657059, "epoch": 7916} {"train_loss": -28.161304473876953, "global_step": 657060, "epoch": 7916} {"train_loss": -28.230478286743164, "global_step": 657061, "epoch": 7916} {"train_loss": -28.4017276763916, "global_step": 657062, "epoch": 7916} {"train_loss": -27.85146141052246, "global_step": 657063, "epoch": 7916} {"train_loss": -28.20774269104004, "global_step": 657064, "epoch": 7916} {"train_loss": -28.363927841186523, "global_step": 657065, "epoch": 7916} {"train_loss": -28.517810821533203, "global_step": 657066, "epoch": 7916} {"train_loss": -28.06564712524414, "global_step": 657067, "epoch": 7916} {"train_loss": -27.97565269470215, "global_step": 657068, "epoch": 7916} {"train_loss": -28.208953857421875, "global_step": 657069, "epoch": 7916} {"train_loss": -28.269628524780273, "global_step": 657070, "epoch": 7916} {"train_loss": -28.228046417236328, "global_step": 657071, "epoch": 7916} {"train_loss": -28.26738929748535, "global_step": 657072, "epoch": 7916} {"train_loss": -28.577497482299805, "global_step": 657073, "epoch": 7916} {"train_loss": -28.01399803161621, "global_step": 657074, "epoch": 7916} {"train_loss": -28.52207374572754, "global_step": 657075, "epoch": 7916} {"train_loss": -28.35797119140625, "global_step": 657076, "epoch": 7916} {"train_loss": -28.467004776000977, "global_step": 657077, "epoch": 7916} {"train_loss": -28.58376121520996, "global_step": 657078, "epoch": 7916} {"train_loss": -28.094221115112305, "global_step": 657079, "epoch": 7916} {"train_loss": -28.31220054626465, "global_step": 657080, "epoch": 7916} {"train_loss": -28.361328125, "global_step": 657081, "epoch": 7916} {"train_loss": -28.36114501953125, "global_step": 657082, "epoch": 7916} {"train_loss": -28.39910888671875, "global_step": 657083, "epoch": 7916} {"train_loss": -28.42274284362793, "global_step": 657084, "epoch": 7916} {"train_loss": -28.576587677001953, "global_step": 657085, "epoch": 7916} {"train_loss": -29.041101455688477, "global_step": 657086, "epoch": 7916} {"train_loss": -27.991788864135742, "global_step": 657087, "epoch": 7916} {"train_loss": -28.540578842163086, "global_step": 657088, "epoch": 7916} {"train_loss": -28.99456214904785, "global_step": 657089, "epoch": 7916} {"train_loss": -28.24159049987793, "global_step": 657090, "epoch": 7916} {"train_loss": -28.259296417236328, "global_step": 657091, "epoch": 7916} {"train_loss": -28.723352432250977, "global_step": 657092, "epoch": 7916} {"train_loss": -28.318754196166992, "global_step": 657093, "epoch": 7916} {"train_loss": -28.711496353149414, "global_step": 657094, "epoch": 7916} {"train_loss": -28.72881507873535, "global_step": 657095, "epoch": 7916} {"train_loss": -28.291101455688477, "global_step": 657096, "epoch": 7916} {"train_loss": -28.685028076171875, "global_step": 657097, "epoch": 7916} {"train_loss": -28.452255249023438, "global_step": 657098, "epoch": 7916} {"train_loss": -28.4713077545166, "global_step": 657099, "epoch": 7916} {"train_loss": -28.433263778686523, "global_step": 657100, "epoch": 7916} {"train_loss": -28.550397872924805, "global_step": 657101, "epoch": 7916} {"train_loss": -28.589319229125977, "global_step": 657102, "epoch": 7916} {"train_loss": -28.70928955078125, "global_step": 657103, "epoch": 7916} {"train_loss": -28.283111572265625, "global_step": 657104, "epoch": 7916} {"train_loss": -28.428876876831055, "global_step": 657105, "epoch": 7916} {"train_loss": -28.4941349029541, "global_step": 657106, "epoch": 7916} {"train_loss": -28.364118576049805, "global_step": 657107, "epoch": 7916} {"train_loss": -28.73579216003418, "global_step": 657108, "epoch": 7916} {"train_loss": -28.545331954956055, "global_step": 657109, "epoch": 7916} {"train_loss": -28.05476223129824, "global_step": 657110, "epoch": 7916, "val_loss": 6725415.5} {"train_loss": -27.935571670532227, "global_step": 657111, "epoch": 7917} {"train_loss": -27.6417293548584, "global_step": 657112, "epoch": 7917} {"train_loss": -28.189279556274414, "global_step": 657113, "epoch": 7917} {"train_loss": -27.84271240234375, "global_step": 657114, "epoch": 7917} {"train_loss": -27.270462036132812, "global_step": 657115, "epoch": 7917} {"train_loss": -27.54742431640625, "global_step": 657116, "epoch": 7917} {"train_loss": -28.12616539001465, "global_step": 657117, "epoch": 7917} {"train_loss": -27.829137802124023, "global_step": 657118, "epoch": 7917} {"train_loss": -27.76529312133789, "global_step": 657119, "epoch": 7917} {"train_loss": -27.771514892578125, "global_step": 657120, "epoch": 7917} {"train_loss": -28.086151123046875, "global_step": 657121, "epoch": 7917} {"train_loss": -27.653711318969727, "global_step": 657122, "epoch": 7917} {"train_loss": -27.885385513305664, "global_step": 657123, "epoch": 7917} {"train_loss": -28.440887451171875, "global_step": 657124, "epoch": 7917} {"train_loss": -27.475067138671875, "global_step": 657125, "epoch": 7917} {"train_loss": -27.670236587524414, "global_step": 657126, "epoch": 7917} {"train_loss": -27.897109985351562, "global_step": 657127, "epoch": 7917} {"train_loss": -28.25713539123535, "global_step": 657128, "epoch": 7917} {"train_loss": -27.84992027282715, "global_step": 657129, "epoch": 7917} {"train_loss": -28.042673110961914, "global_step": 657130, "epoch": 7917} {"train_loss": -28.32472038269043, "global_step": 657131, "epoch": 7917} {"train_loss": -28.304960250854492, "global_step": 657132, "epoch": 7917} {"train_loss": -28.070226669311523, "global_step": 657133, "epoch": 7917} {"train_loss": -28.1594295501709, "global_step": 657134, "epoch": 7917} {"train_loss": -28.1038761138916, "global_step": 657135, "epoch": 7917} {"train_loss": -27.78020668029785, "global_step": 657136, "epoch": 7917} {"train_loss": -28.18250846862793, "global_step": 657137, "epoch": 7917} {"train_loss": -27.9307918548584, "global_step": 657138, "epoch": 7917} {"train_loss": -28.42425537109375, "global_step": 657139, "epoch": 7917} {"train_loss": -28.583831787109375, "global_step": 657140, "epoch": 7917} {"train_loss": -28.27546501159668, "global_step": 657141, "epoch": 7917} {"train_loss": -28.259368896484375, "global_step": 657142, "epoch": 7917} {"train_loss": -28.210540771484375, "global_step": 657143, "epoch": 7917} {"train_loss": -27.885000228881836, "global_step": 657144, "epoch": 7917} {"train_loss": -28.573928833007812, "global_step": 657145, "epoch": 7917} {"train_loss": -28.23195457458496, "global_step": 657146, "epoch": 7917} {"train_loss": -27.9728946685791, "global_step": 657147, "epoch": 7917} {"train_loss": -27.877277374267578, "global_step": 657148, "epoch": 7917} {"train_loss": -28.006189346313477, "global_step": 657149, "epoch": 7917} {"train_loss": -28.127227783203125, "global_step": 657150, "epoch": 7917} {"train_loss": -28.16621208190918, "global_step": 657151, "epoch": 7917} {"train_loss": -28.21834373474121, "global_step": 657152, "epoch": 7917} {"train_loss": -28.275470733642578, "global_step": 657153, "epoch": 7917} {"train_loss": -28.53053092956543, "global_step": 657154, "epoch": 7917} {"train_loss": -28.487476348876953, "global_step": 657155, "epoch": 7917} {"train_loss": -28.447052001953125, "global_step": 657156, "epoch": 7917} {"train_loss": -28.234622955322266, "global_step": 657157, "epoch": 7917} {"train_loss": -28.62568473815918, "global_step": 657158, "epoch": 7917} {"train_loss": -28.469879150390625, "global_step": 657159, "epoch": 7917} {"train_loss": -28.111677169799805, "global_step": 657160, "epoch": 7917} {"train_loss": -28.522886276245117, "global_step": 657161, "epoch": 7917} {"train_loss": -28.464643478393555, "global_step": 657162, "epoch": 7917} {"train_loss": -28.374847412109375, "global_step": 657163, "epoch": 7917} {"train_loss": -28.309858322143555, "global_step": 657164, "epoch": 7917} {"train_loss": -28.767072677612305, "global_step": 657165, "epoch": 7917} {"train_loss": -28.331151962280273, "global_step": 657166, "epoch": 7917} {"train_loss": -28.482563018798828, "global_step": 657167, "epoch": 7917} {"train_loss": -28.584522247314453, "global_step": 657168, "epoch": 7917} {"train_loss": -28.645105361938477, "global_step": 657169, "epoch": 7917} {"train_loss": -28.44098472595215, "global_step": 657170, "epoch": 7917} {"train_loss": -28.46445083618164, "global_step": 657171, "epoch": 7917} {"train_loss": -28.869598388671875, "global_step": 657172, "epoch": 7917} {"train_loss": -28.226856231689453, "global_step": 657173, "epoch": 7917} {"train_loss": -28.499359130859375, "global_step": 657174, "epoch": 7917} {"train_loss": -28.6890869140625, "global_step": 657175, "epoch": 7917} {"train_loss": -28.580432891845703, "global_step": 657176, "epoch": 7917} {"train_loss": -28.678668975830078, "global_step": 657177, "epoch": 7917} {"train_loss": -28.42667579650879, "global_step": 657178, "epoch": 7917} {"train_loss": -28.428211212158203, "global_step": 657179, "epoch": 7917} {"train_loss": -28.220266342163086, "global_step": 657180, "epoch": 7917} {"train_loss": -28.275863647460938, "global_step": 657181, "epoch": 7917} {"train_loss": -28.493711471557617, "global_step": 657182, "epoch": 7917} {"train_loss": -28.36627769470215, "global_step": 657183, "epoch": 7917} {"train_loss": -28.61882972717285, "global_step": 657184, "epoch": 7917} {"train_loss": -28.725833892822266, "global_step": 657185, "epoch": 7917} {"train_loss": -28.180450439453125, "global_step": 657186, "epoch": 7917} {"train_loss": -28.395002365112305, "global_step": 657187, "epoch": 7917} {"train_loss": -28.639484405517578, "global_step": 657188, "epoch": 7917} {"train_loss": -28.474014282226562, "global_step": 657189, "epoch": 7917} {"train_loss": -28.550506591796875, "global_step": 657190, "epoch": 7917} {"train_loss": -28.378498077392578, "global_step": 657191, "epoch": 7917} {"train_loss": -28.449132919311523, "global_step": 657192, "epoch": 7917} {"train_loss": -28.245961844202984, "global_step": 657193, "epoch": 7917, "val_loss": 6694170.5} {"train_loss": -27.353458404541016, "global_step": 657194, "epoch": 7918} {"train_loss": -27.610639572143555, "global_step": 657195, "epoch": 7918} {"train_loss": -27.962940216064453, "global_step": 657196, "epoch": 7918} {"train_loss": -28.017202377319336, "global_step": 657197, "epoch": 7918} {"train_loss": -27.6343994140625, "global_step": 657198, "epoch": 7918} {"train_loss": -27.443464279174805, "global_step": 657199, "epoch": 7918} {"train_loss": -27.678144454956055, "global_step": 657200, "epoch": 7918} {"train_loss": -27.742034912109375, "global_step": 657201, "epoch": 7918} {"train_loss": -27.459381103515625, "global_step": 657202, "epoch": 7918} {"train_loss": -28.0919246673584, "global_step": 657203, "epoch": 7918} {"train_loss": -27.309534072875977, "global_step": 657204, "epoch": 7918} {"train_loss": -27.77863121032715, "global_step": 657205, "epoch": 7918} {"train_loss": -27.759763717651367, "global_step": 657206, "epoch": 7918} {"train_loss": -27.952274322509766, "global_step": 657207, "epoch": 7918} {"train_loss": -28.102529525756836, "global_step": 657208, "epoch": 7918} {"train_loss": -28.457651138305664, "global_step": 657209, "epoch": 7918} {"train_loss": -27.6715030670166, "global_step": 657210, "epoch": 7918} {"train_loss": -27.945392608642578, "global_step": 657211, "epoch": 7918} {"train_loss": -27.986907958984375, "global_step": 657212, "epoch": 7918} {"train_loss": -27.9069766998291, "global_step": 657213, "epoch": 7918} {"train_loss": -27.852039337158203, "global_step": 657214, "epoch": 7918} {"train_loss": -27.705738067626953, "global_step": 657215, "epoch": 7918} {"train_loss": -28.44797134399414, "global_step": 657216, "epoch": 7918} {"train_loss": -28.042810440063477, "global_step": 657217, "epoch": 7918} {"train_loss": -28.419614791870117, "global_step": 657218, "epoch": 7918} {"train_loss": -28.048725128173828, "global_step": 657219, "epoch": 7918} {"train_loss": -28.170236587524414, "global_step": 657220, "epoch": 7918} {"train_loss": -28.15949821472168, "global_step": 657221, "epoch": 7918} {"train_loss": -28.349557876586914, "global_step": 657222, "epoch": 7918} {"train_loss": -28.34785270690918, "global_step": 657223, "epoch": 7918} {"train_loss": -28.06781005859375, "global_step": 657224, "epoch": 7918} {"train_loss": -28.15543556213379, "global_step": 657225, "epoch": 7918} {"train_loss": -27.969406127929688, "global_step": 657226, "epoch": 7918} {"train_loss": -28.271087646484375, "global_step": 657227, "epoch": 7918} {"train_loss": -28.312519073486328, "global_step": 657228, "epoch": 7918} {"train_loss": -28.254886627197266, "global_step": 657229, "epoch": 7918} {"train_loss": -28.48076820373535, "global_step": 657230, "epoch": 7918} {"train_loss": -28.10822105407715, "global_step": 657231, "epoch": 7918} {"train_loss": -27.905630111694336, "global_step": 657232, "epoch": 7918} {"train_loss": -28.832046508789062, "global_step": 657233, "epoch": 7918} {"train_loss": -28.5970516204834, "global_step": 657234, "epoch": 7918} {"train_loss": -27.95932388305664, "global_step": 657235, "epoch": 7918} {"train_loss": -28.08403968811035, "global_step": 657236, "epoch": 7918} {"train_loss": -28.65131187438965, "global_step": 657237, "epoch": 7918} {"train_loss": -28.239837646484375, "global_step": 657238, "epoch": 7918} {"train_loss": -28.349462509155273, "global_step": 657239, "epoch": 7918} {"train_loss": -28.164600372314453, "global_step": 657240, "epoch": 7918} {"train_loss": -28.470733642578125, "global_step": 657241, "epoch": 7918} {"train_loss": -28.46980094909668, "global_step": 657242, "epoch": 7918} {"train_loss": -28.34281349182129, "global_step": 657243, "epoch": 7918} {"train_loss": -28.29071617126465, "global_step": 657244, "epoch": 7918} {"train_loss": -28.576416015625, "global_step": 657245, "epoch": 7918} {"train_loss": -28.23261833190918, "global_step": 657246, "epoch": 7918} {"train_loss": -28.53472900390625, "global_step": 657247, "epoch": 7918} {"train_loss": -28.554996490478516, "global_step": 657248, "epoch": 7918} {"train_loss": -28.50107765197754, "global_step": 657249, "epoch": 7918} {"train_loss": -28.90351676940918, "global_step": 657250, "epoch": 7918} {"train_loss": -28.84174156188965, "global_step": 657251, "epoch": 7918} {"train_loss": -28.502721786499023, "global_step": 657252, "epoch": 7918} {"train_loss": -28.576196670532227, "global_step": 657253, "epoch": 7918} {"train_loss": -28.618865966796875, "global_step": 657254, "epoch": 7918} {"train_loss": -28.915918350219727, "global_step": 657255, "epoch": 7918} {"train_loss": -28.615447998046875, "global_step": 657256, "epoch": 7918} {"train_loss": -28.18698501586914, "global_step": 657257, "epoch": 7918} {"train_loss": -28.597299575805664, "global_step": 657258, "epoch": 7918} {"train_loss": -28.660863876342773, "global_step": 657259, "epoch": 7918} {"train_loss": -28.847944259643555, "global_step": 657260, "epoch": 7918} {"train_loss": -28.0946102142334, "global_step": 657261, "epoch": 7918} {"train_loss": -28.818078994750977, "global_step": 657262, "epoch": 7918} {"train_loss": -28.785400390625, "global_step": 657263, "epoch": 7918} {"train_loss": -28.214630126953125, "global_step": 657264, "epoch": 7918} {"train_loss": -28.59588050842285, "global_step": 657265, "epoch": 7918} {"train_loss": -28.758136749267578, "global_step": 657266, "epoch": 7918} {"train_loss": -28.40022087097168, "global_step": 657267, "epoch": 7918} {"train_loss": -28.64404296875, "global_step": 657268, "epoch": 7918} {"train_loss": -28.214893341064453, "global_step": 657269, "epoch": 7918} {"train_loss": -28.567596435546875, "global_step": 657270, "epoch": 7918} {"train_loss": -28.254270553588867, "global_step": 657271, "epoch": 7918} {"train_loss": -28.50714111328125, "global_step": 657272, "epoch": 7918} {"train_loss": -28.33747673034668, "global_step": 657273, "epoch": 7918} {"train_loss": -28.4831600189209, "global_step": 657274, "epoch": 7918} {"train_loss": -28.30915641784668, "global_step": 657275, "epoch": 7918} {"train_loss": -28.24557217057929, "global_step": 657276, "epoch": 7918, "val_loss": 6701086.0} {"train_loss": -27.797687530517578, "global_step": 657277, "epoch": 7919} {"train_loss": -27.364410400390625, "global_step": 657278, "epoch": 7919} {"train_loss": -27.45261573791504, "global_step": 657279, "epoch": 7919} {"train_loss": -27.585168838500977, "global_step": 657280, "epoch": 7919} {"train_loss": -27.43581199645996, "global_step": 657281, "epoch": 7919} {"train_loss": -27.330341339111328, "global_step": 657282, "epoch": 7919} {"train_loss": -27.623462677001953, "global_step": 657283, "epoch": 7919} {"train_loss": -27.643590927124023, "global_step": 657284, "epoch": 7919} {"train_loss": -27.33771324157715, "global_step": 657285, "epoch": 7919} {"train_loss": -27.208480834960938, "global_step": 657286, "epoch": 7919} {"train_loss": -28.137800216674805, "global_step": 657287, "epoch": 7919} {"train_loss": -27.263830184936523, "global_step": 657288, "epoch": 7919} {"train_loss": -27.417699813842773, "global_step": 657289, "epoch": 7919} {"train_loss": -27.749670028686523, "global_step": 657290, "epoch": 7919} {"train_loss": -27.66397476196289, "global_step": 657291, "epoch": 7919} {"train_loss": -27.94476318359375, "global_step": 657292, "epoch": 7919} {"train_loss": -28.16839027404785, "global_step": 657293, "epoch": 7919} {"train_loss": -27.856292724609375, "global_step": 657294, "epoch": 7919} {"train_loss": -28.258544921875, "global_step": 657295, "epoch": 7919} {"train_loss": -27.712448120117188, "global_step": 657296, "epoch": 7919} {"train_loss": -27.919843673706055, "global_step": 657297, "epoch": 7919} {"train_loss": -27.9742374420166, "global_step": 657298, "epoch": 7919} {"train_loss": -28.234281539916992, "global_step": 657299, "epoch": 7919} {"train_loss": -28.04204750061035, "global_step": 657300, "epoch": 7919} {"train_loss": -28.249271392822266, "global_step": 657301, "epoch": 7919} {"train_loss": -28.12896728515625, "global_step": 657302, "epoch": 7919} {"train_loss": -28.504810333251953, "global_step": 657303, "epoch": 7919} {"train_loss": -28.43812370300293, "global_step": 657304, "epoch": 7919} {"train_loss": -28.188373565673828, "global_step": 657305, "epoch": 7919} {"train_loss": -28.027524948120117, "global_step": 657306, "epoch": 7919} {"train_loss": -28.47608757019043, "global_step": 657307, "epoch": 7919} {"train_loss": -28.37904167175293, "global_step": 657308, "epoch": 7919} {"train_loss": -28.119596481323242, "global_step": 657309, "epoch": 7919} {"train_loss": -28.44460105895996, "global_step": 657310, "epoch": 7919} {"train_loss": -28.36685562133789, "global_step": 657311, "epoch": 7919} {"train_loss": -28.386266708374023, "global_step": 657312, "epoch": 7919} {"train_loss": -28.23923683166504, "global_step": 657313, "epoch": 7919} {"train_loss": -28.77841567993164, "global_step": 657314, "epoch": 7919} {"train_loss": -28.50642967224121, "global_step": 657315, "epoch": 7919} {"train_loss": -28.607330322265625, "global_step": 657316, "epoch": 7919} {"train_loss": -28.524389266967773, "global_step": 657317, "epoch": 7919} {"train_loss": -28.564130783081055, "global_step": 657318, "epoch": 7919} {"train_loss": -28.64068603515625, "global_step": 657319, "epoch": 7919} {"train_loss": -28.400379180908203, "global_step": 657320, "epoch": 7919} {"train_loss": -28.607440948486328, "global_step": 657321, "epoch": 7919} {"train_loss": -28.532108306884766, "global_step": 657322, "epoch": 7919} {"train_loss": -28.62812614440918, "global_step": 657323, "epoch": 7919} {"train_loss": -28.6336669921875, "global_step": 657324, "epoch": 7919} {"train_loss": -28.539661407470703, "global_step": 657325, "epoch": 7919} {"train_loss": -28.53401756286621, "global_step": 657326, "epoch": 7919} {"train_loss": -28.660236358642578, "global_step": 657327, "epoch": 7919} {"train_loss": -28.930835723876953, "global_step": 657328, "epoch": 7919} {"train_loss": -29.01350975036621, "global_step": 657329, "epoch": 7919} {"train_loss": -28.527053833007812, "global_step": 657330, "epoch": 7919} {"train_loss": -28.672943115234375, "global_step": 657331, "epoch": 7919} {"train_loss": -28.338415145874023, "global_step": 657332, "epoch": 7919} {"train_loss": -28.368696212768555, "global_step": 657333, "epoch": 7919} {"train_loss": -28.237104415893555, "global_step": 657334, "epoch": 7919} {"train_loss": -28.809167861938477, "global_step": 657335, "epoch": 7919} {"train_loss": -28.74152946472168, "global_step": 657336, "epoch": 7919} {"train_loss": -28.70149803161621, "global_step": 657337, "epoch": 7919} {"train_loss": -28.468612670898438, "global_step": 657338, "epoch": 7919} {"train_loss": -28.682758331298828, "global_step": 657339, "epoch": 7919} {"train_loss": -28.756168365478516, "global_step": 657340, "epoch": 7919} {"train_loss": -28.8204345703125, "global_step": 657341, "epoch": 7919} {"train_loss": -28.523588180541992, "global_step": 657342, "epoch": 7919} {"train_loss": -28.450916290283203, "global_step": 657343, "epoch": 7919} {"train_loss": -28.52972412109375, "global_step": 657344, "epoch": 7919} {"train_loss": -27.373855590820312, "global_step": 657345, "epoch": 7919} {"train_loss": -26.91486930847168, "global_step": 657346, "epoch": 7919} {"train_loss": -27.084970474243164, "global_step": 657347, "epoch": 7919} {"train_loss": -27.9276180267334, "global_step": 657348, "epoch": 7919} {"train_loss": -27.52713966369629, "global_step": 657349, "epoch": 7919} {"train_loss": -27.86529541015625, "global_step": 657350, "epoch": 7919} {"train_loss": -28.09493064880371, "global_step": 657351, "epoch": 7919} {"train_loss": -27.9824161529541, "global_step": 657352, "epoch": 7919} {"train_loss": -28.081756591796875, "global_step": 657353, "epoch": 7919} {"train_loss": -27.789514541625977, "global_step": 657354, "epoch": 7919} {"train_loss": -27.5701961517334, "global_step": 657355, "epoch": 7919} {"train_loss": -28.31731605529785, "global_step": 657356, "epoch": 7919} {"train_loss": -27.906696319580078, "global_step": 657357, "epoch": 7919} {"train_loss": -27.672916412353516, "global_step": 657358, "epoch": 7919} {"train_loss": -28.1489206337067, "global_step": 657359, "epoch": 7919, "val_loss": 6829437.5} {"train_loss": -25.729238510131836, "global_step": 657360, "epoch": 7920} {"train_loss": -24.428266525268555, "global_step": 657361, "epoch": 7920} {"train_loss": -26.923818588256836, "global_step": 657362, "epoch": 7920} {"train_loss": -25.664594650268555, "global_step": 657363, "epoch": 7920} {"train_loss": -26.6726016998291, "global_step": 657364, "epoch": 7920} {"train_loss": -25.59865951538086, "global_step": 657365, "epoch": 7920} {"train_loss": -26.362390518188477, "global_step": 657366, "epoch": 7920} {"train_loss": -26.467334747314453, "global_step": 657367, "epoch": 7920} {"train_loss": -26.364185333251953, "global_step": 657368, "epoch": 7920} {"train_loss": -26.3876895904541, "global_step": 657369, "epoch": 7920} {"train_loss": -26.32382583618164, "global_step": 657370, "epoch": 7920} {"train_loss": -27.234729766845703, "global_step": 657371, "epoch": 7920} {"train_loss": -26.58710289001465, "global_step": 657372, "epoch": 7920} {"train_loss": -27.282995223999023, "global_step": 657373, "epoch": 7920} {"train_loss": -27.196252822875977, "global_step": 657374, "epoch": 7920} {"train_loss": -27.18375015258789, "global_step": 657375, "epoch": 7920} {"train_loss": -27.781177520751953, "global_step": 657376, "epoch": 7920} {"train_loss": -27.361425399780273, "global_step": 657377, "epoch": 7920} {"train_loss": -27.191953659057617, "global_step": 657378, "epoch": 7920} {"train_loss": -27.257421493530273, "global_step": 657379, "epoch": 7920} {"train_loss": -27.5059814453125, "global_step": 657380, "epoch": 7920} {"train_loss": -27.745019912719727, "global_step": 657381, "epoch": 7920} {"train_loss": -27.453760147094727, "global_step": 657382, "epoch": 7920} {"train_loss": -27.62898063659668, "global_step": 657383, "epoch": 7920} {"train_loss": -27.6867618560791, "global_step": 657384, "epoch": 7920} {"train_loss": -27.749731063842773, "global_step": 657385, "epoch": 7920} {"train_loss": -27.774763107299805, "global_step": 657386, "epoch": 7920} {"train_loss": -28.092609405517578, "global_step": 657387, "epoch": 7920} {"train_loss": -28.10586929321289, "global_step": 657388, "epoch": 7920} {"train_loss": -28.08768653869629, "global_step": 657389, "epoch": 7920} {"train_loss": -27.896087646484375, "global_step": 657390, "epoch": 7920} {"train_loss": -27.946252822875977, "global_step": 657391, "epoch": 7920} {"train_loss": -28.032995223999023, "global_step": 657392, "epoch": 7920} {"train_loss": -28.0743350982666, "global_step": 657393, "epoch": 7920} {"train_loss": -28.159631729125977, "global_step": 657394, "epoch": 7920} {"train_loss": -28.041913986206055, "global_step": 657395, "epoch": 7920} {"train_loss": -27.989593505859375, "global_step": 657396, "epoch": 7920} {"train_loss": -28.32990837097168, "global_step": 657397, "epoch": 7920} {"train_loss": -28.025358200073242, "global_step": 657398, "epoch": 7920} {"train_loss": -28.42417335510254, "global_step": 657399, "epoch": 7920} {"train_loss": -27.997610092163086, "global_step": 657400, "epoch": 7920} {"train_loss": -28.421478271484375, "global_step": 657401, "epoch": 7920} {"train_loss": -28.27496337890625, "global_step": 657402, "epoch": 7920} {"train_loss": -27.94815444946289, "global_step": 657403, "epoch": 7920} {"train_loss": -28.546680450439453, "global_step": 657404, "epoch": 7920} {"train_loss": -28.368803024291992, "global_step": 657405, "epoch": 7920} {"train_loss": -28.149688720703125, "global_step": 657406, "epoch": 7920} {"train_loss": -28.50087547302246, "global_step": 657407, "epoch": 7920} {"train_loss": -28.56097984313965, "global_step": 657408, "epoch": 7920} {"train_loss": -28.559295654296875, "global_step": 657409, "epoch": 7920} {"train_loss": -27.84993553161621, "global_step": 657410, "epoch": 7920} {"train_loss": -28.500532150268555, "global_step": 657411, "epoch": 7920} {"train_loss": -28.351476669311523, "global_step": 657412, "epoch": 7920} {"train_loss": -28.837162017822266, "global_step": 657413, "epoch": 7920} {"train_loss": -28.59716796875, "global_step": 657414, "epoch": 7920} {"train_loss": -28.135879516601562, "global_step": 657415, "epoch": 7920} {"train_loss": -28.498188018798828, "global_step": 657416, "epoch": 7920} {"train_loss": -28.67363929748535, "global_step": 657417, "epoch": 7920} {"train_loss": -28.262868881225586, "global_step": 657418, "epoch": 7920} {"train_loss": -28.443973541259766, "global_step": 657419, "epoch": 7920} {"train_loss": -28.29421043395996, "global_step": 657420, "epoch": 7920} {"train_loss": -28.910242080688477, "global_step": 657421, "epoch": 7920} {"train_loss": -28.813507080078125, "global_step": 657422, "epoch": 7920} {"train_loss": -28.263641357421875, "global_step": 657423, "epoch": 7920} {"train_loss": -28.412809371948242, "global_step": 657424, "epoch": 7920} {"train_loss": -28.399450302124023, "global_step": 657425, "epoch": 7920} {"train_loss": -28.28608512878418, "global_step": 657426, "epoch": 7920} {"train_loss": -28.033218383789062, "global_step": 657427, "epoch": 7920} {"train_loss": -28.10409927368164, "global_step": 657428, "epoch": 7920} {"train_loss": -27.824811935424805, "global_step": 657429, "epoch": 7920} {"train_loss": -28.315271377563477, "global_step": 657430, "epoch": 7920} {"train_loss": -28.191808700561523, "global_step": 657431, "epoch": 7920} {"train_loss": -28.24041748046875, "global_step": 657432, "epoch": 7920} {"train_loss": -28.565521240234375, "global_step": 657433, "epoch": 7920} {"train_loss": -28.388324737548828, "global_step": 657434, "epoch": 7920} {"train_loss": -28.127843856811523, "global_step": 657435, "epoch": 7920} {"train_loss": -28.234729766845703, "global_step": 657436, "epoch": 7920} {"train_loss": -28.223630905151367, "global_step": 657437, "epoch": 7920} {"train_loss": -28.190265655517578, "global_step": 657438, "epoch": 7920} {"train_loss": -28.941043853759766, "global_step": 657439, "epoch": 7920} {"train_loss": -28.034835815429688, "global_step": 657440, "epoch": 7920} {"train_loss": -28.479719161987305, "global_step": 657441, "epoch": 7920} {"train_loss": -27.826389864266638, "global_step": 657442, "epoch": 7920, "val_loss": 6867681.0} {"train_loss": -27.89725685119629, "global_step": 657443, "epoch": 7921} {"train_loss": -27.6110897064209, "global_step": 657444, "epoch": 7921} {"train_loss": -27.99708366394043, "global_step": 657445, "epoch": 7921} {"train_loss": -27.732812881469727, "global_step": 657446, "epoch": 7921} {"train_loss": -27.718616485595703, "global_step": 657447, "epoch": 7921} {"train_loss": -27.870874404907227, "global_step": 657448, "epoch": 7921} {"train_loss": -28.096744537353516, "global_step": 657449, "epoch": 7921} {"train_loss": -27.526376724243164, "global_step": 657450, "epoch": 7921} {"train_loss": -27.909509658813477, "global_step": 657451, "epoch": 7921} {"train_loss": -27.61821937561035, "global_step": 657452, "epoch": 7921} {"train_loss": -28.132349014282227, "global_step": 657453, "epoch": 7921} {"train_loss": -28.296247482299805, "global_step": 657454, "epoch": 7921} {"train_loss": -27.943140029907227, "global_step": 657455, "epoch": 7921} {"train_loss": -28.245405197143555, "global_step": 657456, "epoch": 7921} {"train_loss": -28.29276466369629, "global_step": 657457, "epoch": 7921} {"train_loss": -28.25739097595215, "global_step": 657458, "epoch": 7921} {"train_loss": -28.440458297729492, "global_step": 657459, "epoch": 7921} {"train_loss": -27.93170738220215, "global_step": 657460, "epoch": 7921} {"train_loss": -28.22405433654785, "global_step": 657461, "epoch": 7921} {"train_loss": -28.375625610351562, "global_step": 657462, "epoch": 7921} {"train_loss": -28.7028751373291, "global_step": 657463, "epoch": 7921} {"train_loss": -28.070907592773438, "global_step": 657464, "epoch": 7921} {"train_loss": -28.53632926940918, "global_step": 657465, "epoch": 7921} {"train_loss": -28.840728759765625, "global_step": 657466, "epoch": 7921} {"train_loss": -28.665266036987305, "global_step": 657467, "epoch": 7921} {"train_loss": -28.377811431884766, "global_step": 657468, "epoch": 7921} {"train_loss": -28.41351890563965, "global_step": 657469, "epoch": 7921} {"train_loss": -28.240482330322266, "global_step": 657470, "epoch": 7921} {"train_loss": -28.101125717163086, "global_step": 657471, "epoch": 7921} {"train_loss": -28.119586944580078, "global_step": 657472, "epoch": 7921} {"train_loss": -28.133380889892578, "global_step": 657473, "epoch": 7921} {"train_loss": -28.193571090698242, "global_step": 657474, "epoch": 7921} {"train_loss": -28.369415283203125, "global_step": 657475, "epoch": 7921} {"train_loss": -28.5784912109375, "global_step": 657476, "epoch": 7921} {"train_loss": -28.737659454345703, "global_step": 657477, "epoch": 7921} {"train_loss": -28.484638214111328, "global_step": 657478, "epoch": 7921} {"train_loss": -28.238325119018555, "global_step": 657479, "epoch": 7921} {"train_loss": -28.848468780517578, "global_step": 657480, "epoch": 7921} {"train_loss": -28.35304069519043, "global_step": 657481, "epoch": 7921} {"train_loss": -28.566085815429688, "global_step": 657482, "epoch": 7921} {"train_loss": -28.312402725219727, "global_step": 657483, "epoch": 7921} {"train_loss": -28.2796630859375, "global_step": 657484, "epoch": 7921} {"train_loss": -28.344818115234375, "global_step": 657485, "epoch": 7921} {"train_loss": -27.954681396484375, "global_step": 657486, "epoch": 7921} {"train_loss": -28.142684936523438, "global_step": 657487, "epoch": 7921} {"train_loss": -28.271347045898438, "global_step": 657488, "epoch": 7921} {"train_loss": -28.263700485229492, "global_step": 657489, "epoch": 7921} {"train_loss": -28.124664306640625, "global_step": 657490, "epoch": 7921} {"train_loss": -28.62485122680664, "global_step": 657491, "epoch": 7921} {"train_loss": -28.39955711364746, "global_step": 657492, "epoch": 7921} {"train_loss": -28.17030906677246, "global_step": 657493, "epoch": 7921} {"train_loss": -28.590002059936523, "global_step": 657494, "epoch": 7921} {"train_loss": -28.339807510375977, "global_step": 657495, "epoch": 7921} {"train_loss": -28.520811080932617, "global_step": 657496, "epoch": 7921} {"train_loss": -28.202749252319336, "global_step": 657497, "epoch": 7921} {"train_loss": -28.230915069580078, "global_step": 657498, "epoch": 7921} {"train_loss": -28.575586318969727, "global_step": 657499, "epoch": 7921} {"train_loss": -28.617816925048828, "global_step": 657500, "epoch": 7921} {"train_loss": -28.38429069519043, "global_step": 657501, "epoch": 7921} {"train_loss": -28.4835262298584, "global_step": 657502, "epoch": 7921} {"train_loss": -28.357574462890625, "global_step": 657503, "epoch": 7921} {"train_loss": -28.119993209838867, "global_step": 657504, "epoch": 7921} {"train_loss": -28.357547760009766, "global_step": 657505, "epoch": 7921} {"train_loss": -28.664609909057617, "global_step": 657506, "epoch": 7921} {"train_loss": -28.620014190673828, "global_step": 657507, "epoch": 7921} {"train_loss": -28.751623153686523, "global_step": 657508, "epoch": 7921} {"train_loss": -28.295215606689453, "global_step": 657509, "epoch": 7921} {"train_loss": -28.56679344177246, "global_step": 657510, "epoch": 7921} {"train_loss": -28.583740234375, "global_step": 657511, "epoch": 7921} {"train_loss": -28.460834503173828, "global_step": 657512, "epoch": 7921} {"train_loss": -28.13490104675293, "global_step": 657513, "epoch": 7921} {"train_loss": -28.40704345703125, "global_step": 657514, "epoch": 7921} {"train_loss": -28.49822998046875, "global_step": 657515, "epoch": 7921} {"train_loss": -28.331464767456055, "global_step": 657516, "epoch": 7921} {"train_loss": -28.62271499633789, "global_step": 657517, "epoch": 7921} {"train_loss": -28.4215145111084, "global_step": 657518, "epoch": 7921} {"train_loss": -28.5155086517334, "global_step": 657519, "epoch": 7921} {"train_loss": -28.21463966369629, "global_step": 657520, "epoch": 7921} {"train_loss": -28.493127822875977, "global_step": 657521, "epoch": 7921} {"train_loss": -27.761438369750977, "global_step": 657522, "epoch": 7921} {"train_loss": -28.022008895874023, "global_step": 657523, "epoch": 7921} {"train_loss": -28.673095703125, "global_step": 657524, "epoch": 7921} {"train_loss": -28.304962801646038, "global_step": 657525, "epoch": 7921, "val_loss": 6801554.0} {"train_loss": -27.237089157104492, "global_step": 657526, "epoch": 7922} {"train_loss": -27.444747924804688, "global_step": 657527, "epoch": 7922} {"train_loss": -27.679487228393555, "global_step": 657528, "epoch": 7922} {"train_loss": -27.791162490844727, "global_step": 657529, "epoch": 7922} {"train_loss": -28.21478271484375, "global_step": 657530, "epoch": 7922} {"train_loss": -27.386816024780273, "global_step": 657531, "epoch": 7922} {"train_loss": -27.93461036682129, "global_step": 657532, "epoch": 7922} {"train_loss": -27.563695907592773, "global_step": 657533, "epoch": 7922} {"train_loss": -28.154266357421875, "global_step": 657534, "epoch": 7922} {"train_loss": -27.746612548828125, "global_step": 657535, "epoch": 7922} {"train_loss": -27.895536422729492, "global_step": 657536, "epoch": 7922} {"train_loss": -28.36371421813965, "global_step": 657537, "epoch": 7922} {"train_loss": -27.878326416015625, "global_step": 657538, "epoch": 7922} {"train_loss": -28.04804039001465, "global_step": 657539, "epoch": 7922} {"train_loss": -27.694049835205078, "global_step": 657540, "epoch": 7922} {"train_loss": -27.596933364868164, "global_step": 657541, "epoch": 7922} {"train_loss": -27.972991943359375, "global_step": 657542, "epoch": 7922} {"train_loss": -28.294021606445312, "global_step": 657543, "epoch": 7922} {"train_loss": -27.924823760986328, "global_step": 657544, "epoch": 7922} {"train_loss": -27.752729415893555, "global_step": 657545, "epoch": 7922} {"train_loss": -27.569416046142578, "global_step": 657546, "epoch": 7922} {"train_loss": -28.239965438842773, "global_step": 657547, "epoch": 7922} {"train_loss": -27.950302124023438, "global_step": 657548, "epoch": 7922} {"train_loss": -28.263151168823242, "global_step": 657549, "epoch": 7922} {"train_loss": -28.20063591003418, "global_step": 657550, "epoch": 7922} {"train_loss": -28.32339859008789, "global_step": 657551, "epoch": 7922} {"train_loss": -28.0290584564209, "global_step": 657552, "epoch": 7922} {"train_loss": -28.719877243041992, "global_step": 657553, "epoch": 7922} {"train_loss": -28.55571937561035, "global_step": 657554, "epoch": 7922} {"train_loss": -28.203378677368164, "global_step": 657555, "epoch": 7922} {"train_loss": -28.38599967956543, "global_step": 657556, "epoch": 7922} {"train_loss": -28.260583877563477, "global_step": 657557, "epoch": 7922} {"train_loss": -28.17404556274414, "global_step": 657558, "epoch": 7922} {"train_loss": -28.00752067565918, "global_step": 657559, "epoch": 7922} {"train_loss": -28.443618774414062, "global_step": 657560, "epoch": 7922} {"train_loss": -28.53278923034668, "global_step": 657561, "epoch": 7922} {"train_loss": -28.15846061706543, "global_step": 657562, "epoch": 7922} {"train_loss": -28.379520416259766, "global_step": 657563, "epoch": 7922} {"train_loss": -28.52546501159668, "global_step": 657564, "epoch": 7922} {"train_loss": -28.525114059448242, "global_step": 657565, "epoch": 7922} {"train_loss": -28.44561195373535, "global_step": 657566, "epoch": 7922} {"train_loss": -28.414148330688477, "global_step": 657567, "epoch": 7922} {"train_loss": -28.436960220336914, "global_step": 657568, "epoch": 7922} {"train_loss": -28.471769332885742, "global_step": 657569, "epoch": 7922} {"train_loss": -28.36573600769043, "global_step": 657570, "epoch": 7922} {"train_loss": -28.197952270507812, "global_step": 657571, "epoch": 7922} {"train_loss": -28.519773483276367, "global_step": 657572, "epoch": 7922} {"train_loss": -28.612218856811523, "global_step": 657573, "epoch": 7922} {"train_loss": -28.78800392150879, "global_step": 657574, "epoch": 7922} {"train_loss": -28.288427352905273, "global_step": 657575, "epoch": 7922} {"train_loss": -28.312570571899414, "global_step": 657576, "epoch": 7922} {"train_loss": -28.756607055664062, "global_step": 657577, "epoch": 7922} {"train_loss": -28.50390625, "global_step": 657578, "epoch": 7922} {"train_loss": -27.811725616455078, "global_step": 657579, "epoch": 7922} {"train_loss": -28.3974666595459, "global_step": 657580, "epoch": 7922} {"train_loss": -28.420576095581055, "global_step": 657581, "epoch": 7922} {"train_loss": -28.60310173034668, "global_step": 657582, "epoch": 7922} {"train_loss": -28.15155601501465, "global_step": 657583, "epoch": 7922} {"train_loss": -28.56640625, "global_step": 657584, "epoch": 7922} {"train_loss": -28.192554473876953, "global_step": 657585, "epoch": 7922} {"train_loss": -28.211444854736328, "global_step": 657586, "epoch": 7922} {"train_loss": -28.22358512878418, "global_step": 657587, "epoch": 7922} {"train_loss": -28.0828857421875, "global_step": 657588, "epoch": 7922} {"train_loss": -28.137739181518555, "global_step": 657589, "epoch": 7922} {"train_loss": -27.951013565063477, "global_step": 657590, "epoch": 7922} {"train_loss": -28.0106258392334, "global_step": 657591, "epoch": 7922} {"train_loss": -28.310888290405273, "global_step": 657592, "epoch": 7922} {"train_loss": -28.25921630859375, "global_step": 657593, "epoch": 7922} {"train_loss": -28.129959106445312, "global_step": 657594, "epoch": 7922} {"train_loss": -28.29453468322754, "global_step": 657595, "epoch": 7922} {"train_loss": -28.118921279907227, "global_step": 657596, "epoch": 7922} {"train_loss": -28.014453887939453, "global_step": 657597, "epoch": 7922} {"train_loss": -28.223194122314453, "global_step": 657598, "epoch": 7922} {"train_loss": -28.340551376342773, "global_step": 657599, "epoch": 7922} {"train_loss": -28.113006591796875, "global_step": 657600, "epoch": 7922} {"train_loss": -28.02496337890625, "global_step": 657601, "epoch": 7922} {"train_loss": -27.76559829711914, "global_step": 657602, "epoch": 7922} {"train_loss": -28.207727432250977, "global_step": 657603, "epoch": 7922} {"train_loss": -28.323572158813477, "global_step": 657604, "epoch": 7922} {"train_loss": -28.510488510131836, "global_step": 657605, "epoch": 7922} {"train_loss": -28.482324600219727, "global_step": 657606, "epoch": 7922} {"train_loss": -28.37615966796875, "global_step": 657607, "epoch": 7922} {"train_loss": -28.193145889833747, "global_step": 657608, "epoch": 7922, "val_loss": 6795660.0} {"train_loss": -28.073089599609375, "global_step": 657609, "epoch": 7923} {"train_loss": -28.432600021362305, "global_step": 657610, "epoch": 7923} {"train_loss": -27.89536476135254, "global_step": 657611, "epoch": 7923} {"train_loss": -27.946035385131836, "global_step": 657612, "epoch": 7923} {"train_loss": -28.364233016967773, "global_step": 657613, "epoch": 7923} {"train_loss": -28.495929718017578, "global_step": 657614, "epoch": 7923} {"train_loss": -28.239242553710938, "global_step": 657615, "epoch": 7923} {"train_loss": -28.420690536499023, "global_step": 657616, "epoch": 7923} {"train_loss": -28.509246826171875, "global_step": 657617, "epoch": 7923} {"train_loss": -28.252695083618164, "global_step": 657618, "epoch": 7923} {"train_loss": -28.3016357421875, "global_step": 657619, "epoch": 7923} {"train_loss": -28.068164825439453, "global_step": 657620, "epoch": 7923} {"train_loss": -28.07525634765625, "global_step": 657621, "epoch": 7923} {"train_loss": -28.410099029541016, "global_step": 657622, "epoch": 7923} {"train_loss": -28.11895179748535, "global_step": 657623, "epoch": 7923} {"train_loss": -28.599414825439453, "global_step": 657624, "epoch": 7923} {"train_loss": -28.16059684753418, "global_step": 657625, "epoch": 7923} {"train_loss": -28.409332275390625, "global_step": 657626, "epoch": 7923} {"train_loss": -28.53656578063965, "global_step": 657627, "epoch": 7923} {"train_loss": -28.3048038482666, "global_step": 657628, "epoch": 7923} {"train_loss": -28.51771354675293, "global_step": 657629, "epoch": 7923} {"train_loss": -28.382761001586914, "global_step": 657630, "epoch": 7923} {"train_loss": -28.2016658782959, "global_step": 657631, "epoch": 7923} {"train_loss": -28.44902992248535, "global_step": 657632, "epoch": 7923} {"train_loss": -28.208301544189453, "global_step": 657633, "epoch": 7923} {"train_loss": -28.143091201782227, "global_step": 657634, "epoch": 7923} {"train_loss": -28.553937911987305, "global_step": 657635, "epoch": 7923} {"train_loss": -28.61630630493164, "global_step": 657636, "epoch": 7923} {"train_loss": -28.490070343017578, "global_step": 657637, "epoch": 7923} {"train_loss": -28.5402889251709, "global_step": 657638, "epoch": 7923} {"train_loss": -28.330839157104492, "global_step": 657639, "epoch": 7923} {"train_loss": -28.543283462524414, "global_step": 657640, "epoch": 7923} {"train_loss": -28.483402252197266, "global_step": 657641, "epoch": 7923} {"train_loss": -28.14883804321289, "global_step": 657642, "epoch": 7923} {"train_loss": -28.516510009765625, "global_step": 657643, "epoch": 7923} {"train_loss": -28.0367431640625, "global_step": 657644, "epoch": 7923} {"train_loss": -28.69247817993164, "global_step": 657645, "epoch": 7923} {"train_loss": -28.311359405517578, "global_step": 657646, "epoch": 7923} {"train_loss": -28.554174423217773, "global_step": 657647, "epoch": 7923} {"train_loss": -28.675251007080078, "global_step": 657648, "epoch": 7923} {"train_loss": -28.5858211517334, "global_step": 657649, "epoch": 7923} {"train_loss": -28.34174919128418, "global_step": 657650, "epoch": 7923} {"train_loss": -28.48171043395996, "global_step": 657651, "epoch": 7923} {"train_loss": -28.764129638671875, "global_step": 657652, "epoch": 7923} {"train_loss": -28.370283126831055, "global_step": 657653, "epoch": 7923} {"train_loss": -28.720861434936523, "global_step": 657654, "epoch": 7923} {"train_loss": -28.661447525024414, "global_step": 657655, "epoch": 7923} {"train_loss": -28.433332443237305, "global_step": 657656, "epoch": 7923} {"train_loss": -28.402225494384766, "global_step": 657657, "epoch": 7923} {"train_loss": -28.460153579711914, "global_step": 657658, "epoch": 7923} {"train_loss": -28.1795597076416, "global_step": 657659, "epoch": 7923} {"train_loss": -28.263891220092773, "global_step": 657660, "epoch": 7923} {"train_loss": -28.216638565063477, "global_step": 657661, "epoch": 7923} {"train_loss": -28.253915786743164, "global_step": 657662, "epoch": 7923} {"train_loss": -28.45643424987793, "global_step": 657663, "epoch": 7923} {"train_loss": -28.146167755126953, "global_step": 657664, "epoch": 7923} {"train_loss": -28.349517822265625, "global_step": 657665, "epoch": 7923} {"train_loss": -28.293811798095703, "global_step": 657666, "epoch": 7923} {"train_loss": -28.45989990234375, "global_step": 657667, "epoch": 7923} {"train_loss": -27.86713981628418, "global_step": 657668, "epoch": 7923} {"train_loss": -27.833026885986328, "global_step": 657669, "epoch": 7923} {"train_loss": -28.278085708618164, "global_step": 657670, "epoch": 7923} {"train_loss": -28.343769073486328, "global_step": 657671, "epoch": 7923} {"train_loss": -28.320226669311523, "global_step": 657672, "epoch": 7923} {"train_loss": -28.331403732299805, "global_step": 657673, "epoch": 7923} {"train_loss": -27.952362060546875, "global_step": 657674, "epoch": 7923} {"train_loss": -28.4094181060791, "global_step": 657675, "epoch": 7923} {"train_loss": -28.574365615844727, "global_step": 657676, "epoch": 7923} {"train_loss": -28.266504287719727, "global_step": 657677, "epoch": 7923} {"train_loss": -28.203414916992188, "global_step": 657678, "epoch": 7923} {"train_loss": -28.419992446899414, "global_step": 657679, "epoch": 7923} {"train_loss": -28.542804718017578, "global_step": 657680, "epoch": 7923} {"train_loss": -28.5245418548584, "global_step": 657681, "epoch": 7923} {"train_loss": -28.115528106689453, "global_step": 657682, "epoch": 7923} {"train_loss": -28.07645606994629, "global_step": 657683, "epoch": 7923} {"train_loss": -27.934789657592773, "global_step": 657684, "epoch": 7923} {"train_loss": -28.006088256835938, "global_step": 657685, "epoch": 7923} {"train_loss": -28.028898239135742, "global_step": 657686, "epoch": 7923} {"train_loss": -27.788043975830078, "global_step": 657687, "epoch": 7923} {"train_loss": -28.062536239624023, "global_step": 657688, "epoch": 7923} {"train_loss": -27.607309341430664, "global_step": 657689, "epoch": 7923} {"train_loss": -28.273590087890625, "global_step": 657690, "epoch": 7923} {"train_loss": -28.31080528626959, "global_step": 657691, "epoch": 7923, "val_loss": 6802125.0} {"train_loss": -27.6927433013916, "global_step": 657692, "epoch": 7924} {"train_loss": -27.585119247436523, "global_step": 657693, "epoch": 7924} {"train_loss": -27.718032836914062, "global_step": 657694, "epoch": 7924} {"train_loss": -27.569583892822266, "global_step": 657695, "epoch": 7924} {"train_loss": -27.270246505737305, "global_step": 657696, "epoch": 7924} {"train_loss": -27.089893341064453, "global_step": 657697, "epoch": 7924} {"train_loss": -27.142547607421875, "global_step": 657698, "epoch": 7924} {"train_loss": -27.442352294921875, "global_step": 657699, "epoch": 7924} {"train_loss": -27.6193790435791, "global_step": 657700, "epoch": 7924} {"train_loss": -27.946338653564453, "global_step": 657701, "epoch": 7924} {"train_loss": -27.950010299682617, "global_step": 657702, "epoch": 7924} {"train_loss": -28.287220001220703, "global_step": 657703, "epoch": 7924} {"train_loss": -27.323740005493164, "global_step": 657704, "epoch": 7924} {"train_loss": -27.809045791625977, "global_step": 657705, "epoch": 7924} {"train_loss": -27.312091827392578, "global_step": 657706, "epoch": 7924} {"train_loss": -27.8637638092041, "global_step": 657707, "epoch": 7924} {"train_loss": -27.515100479125977, "global_step": 657708, "epoch": 7924} {"train_loss": -28.025299072265625, "global_step": 657709, "epoch": 7924} {"train_loss": -27.881784439086914, "global_step": 657710, "epoch": 7924} {"train_loss": -27.5704402923584, "global_step": 657711, "epoch": 7924} {"train_loss": -27.8675537109375, "global_step": 657712, "epoch": 7924} {"train_loss": -28.036792755126953, "global_step": 657713, "epoch": 7924} {"train_loss": -28.197357177734375, "global_step": 657714, "epoch": 7924} {"train_loss": -28.09795570373535, "global_step": 657715, "epoch": 7924} {"train_loss": -27.981647491455078, "global_step": 657716, "epoch": 7924} {"train_loss": -28.148168563842773, "global_step": 657717, "epoch": 7924} {"train_loss": -27.76398277282715, "global_step": 657718, "epoch": 7924} {"train_loss": -28.288074493408203, "global_step": 657719, "epoch": 7924} {"train_loss": -28.224777221679688, "global_step": 657720, "epoch": 7924} {"train_loss": -28.217182159423828, "global_step": 657721, "epoch": 7924} {"train_loss": -28.460346221923828, "global_step": 657722, "epoch": 7924} {"train_loss": -28.142383575439453, "global_step": 657723, "epoch": 7924} {"train_loss": -28.202856063842773, "global_step": 657724, "epoch": 7924} {"train_loss": -28.264638900756836, "global_step": 657725, "epoch": 7924} {"train_loss": -28.778705596923828, "global_step": 657726, "epoch": 7924} {"train_loss": -28.231176376342773, "global_step": 657727, "epoch": 7924} {"train_loss": -28.35565185546875, "global_step": 657728, "epoch": 7924} {"train_loss": -28.7937068939209, "global_step": 657729, "epoch": 7924} {"train_loss": -28.258575439453125, "global_step": 657730, "epoch": 7924} {"train_loss": -28.279226303100586, "global_step": 657731, "epoch": 7924} {"train_loss": -28.535486221313477, "global_step": 657732, "epoch": 7924} {"train_loss": -28.096149444580078, "global_step": 657733, "epoch": 7924} {"train_loss": -28.54400634765625, "global_step": 657734, "epoch": 7924} {"train_loss": -28.454822540283203, "global_step": 657735, "epoch": 7924} {"train_loss": -28.206161499023438, "global_step": 657736, "epoch": 7924} {"train_loss": -28.408435821533203, "global_step": 657737, "epoch": 7924} {"train_loss": -28.55963706970215, "global_step": 657738, "epoch": 7924} {"train_loss": -28.532489776611328, "global_step": 657739, "epoch": 7924} {"train_loss": -28.804914474487305, "global_step": 657740, "epoch": 7924} {"train_loss": -28.47968101501465, "global_step": 657741, "epoch": 7924} {"train_loss": -28.6352596282959, "global_step": 657742, "epoch": 7924} {"train_loss": -28.543420791625977, "global_step": 657743, "epoch": 7924} {"train_loss": -28.3187255859375, "global_step": 657744, "epoch": 7924} {"train_loss": -28.39552116394043, "global_step": 657745, "epoch": 7924} {"train_loss": -28.507150650024414, "global_step": 657746, "epoch": 7924} {"train_loss": -28.54664421081543, "global_step": 657747, "epoch": 7924} {"train_loss": -28.382116317749023, "global_step": 657748, "epoch": 7924} {"train_loss": -28.72589111328125, "global_step": 657749, "epoch": 7924} {"train_loss": -28.69793701171875, "global_step": 657750, "epoch": 7924} {"train_loss": -28.465087890625, "global_step": 657751, "epoch": 7924} {"train_loss": -28.220977783203125, "global_step": 657752, "epoch": 7924} {"train_loss": -28.349079132080078, "global_step": 657753, "epoch": 7924} {"train_loss": -27.92047119140625, "global_step": 657754, "epoch": 7924} {"train_loss": -28.47797966003418, "global_step": 657755, "epoch": 7924} {"train_loss": -27.89462661743164, "global_step": 657756, "epoch": 7924} {"train_loss": -27.415624618530273, "global_step": 657757, "epoch": 7924} {"train_loss": -27.516626358032227, "global_step": 657758, "epoch": 7924} {"train_loss": -27.77838706970215, "global_step": 657759, "epoch": 7924} {"train_loss": -28.502721786499023, "global_step": 657760, "epoch": 7924} {"train_loss": -28.128192901611328, "global_step": 657761, "epoch": 7924} {"train_loss": -28.24652099609375, "global_step": 657762, "epoch": 7924} {"train_loss": -27.96486473083496, "global_step": 657763, "epoch": 7924} {"train_loss": -28.276580810546875, "global_step": 657764, "epoch": 7924} {"train_loss": -28.419010162353516, "global_step": 657765, "epoch": 7924} {"train_loss": -28.200265884399414, "global_step": 657766, "epoch": 7924} {"train_loss": -28.3725643157959, "global_step": 657767, "epoch": 7924} {"train_loss": -28.317319869995117, "global_step": 657768, "epoch": 7924} {"train_loss": -28.164045333862305, "global_step": 657769, "epoch": 7924} {"train_loss": -28.156904220581055, "global_step": 657770, "epoch": 7924} {"train_loss": -27.920743942260742, "global_step": 657771, "epoch": 7924} {"train_loss": -28.149988174438477, "global_step": 657772, "epoch": 7924} {"train_loss": -28.37735366821289, "global_step": 657773, "epoch": 7924} {"train_loss": -28.116762322115612, "global_step": 657774, "epoch": 7924, "val_loss": 6713373.0} {"train_loss": -28.481332778930664, "global_step": 657775, "epoch": 7925} {"train_loss": -27.870908737182617, "global_step": 657776, "epoch": 7925} {"train_loss": -27.86171531677246, "global_step": 657777, "epoch": 7925} {"train_loss": -27.790740966796875, "global_step": 657778, "epoch": 7925} {"train_loss": -27.635995864868164, "global_step": 657779, "epoch": 7925} {"train_loss": -28.019744873046875, "global_step": 657780, "epoch": 7925} {"train_loss": -27.98799705505371, "global_step": 657781, "epoch": 7925} {"train_loss": -27.48453712463379, "global_step": 657782, "epoch": 7925} {"train_loss": -27.53508949279785, "global_step": 657783, "epoch": 7925} {"train_loss": -27.71518898010254, "global_step": 657784, "epoch": 7925} {"train_loss": -27.914691925048828, "global_step": 657785, "epoch": 7925} {"train_loss": -28.47173500061035, "global_step": 657786, "epoch": 7925} {"train_loss": -28.361963272094727, "global_step": 657787, "epoch": 7925} {"train_loss": -28.428760528564453, "global_step": 657788, "epoch": 7925} {"train_loss": -28.208362579345703, "global_step": 657789, "epoch": 7925} {"train_loss": -27.793920516967773, "global_step": 657790, "epoch": 7925} {"train_loss": -28.297119140625, "global_step": 657791, "epoch": 7925} {"train_loss": -28.121688842773438, "global_step": 657792, "epoch": 7925} {"train_loss": -28.23740005493164, "global_step": 657793, "epoch": 7925} {"train_loss": -28.2282657623291, "global_step": 657794, "epoch": 7925} {"train_loss": -28.36476707458496, "global_step": 657795, "epoch": 7925} {"train_loss": -28.02092933654785, "global_step": 657796, "epoch": 7925} {"train_loss": -28.276540756225586, "global_step": 657797, "epoch": 7925} {"train_loss": -28.44500732421875, "global_step": 657798, "epoch": 7925} {"train_loss": -28.46530532836914, "global_step": 657799, "epoch": 7925} {"train_loss": -28.56072998046875, "global_step": 657800, "epoch": 7925} {"train_loss": -28.381610870361328, "global_step": 657801, "epoch": 7925} {"train_loss": -28.558263778686523, "global_step": 657802, "epoch": 7925} {"train_loss": -28.1781005859375, "global_step": 657803, "epoch": 7925} {"train_loss": -28.403268814086914, "global_step": 657804, "epoch": 7925} {"train_loss": -28.4895076751709, "global_step": 657805, "epoch": 7925} {"train_loss": -28.736087799072266, "global_step": 657806, "epoch": 7925} {"train_loss": -28.346250534057617, "global_step": 657807, "epoch": 7925} {"train_loss": -28.31093406677246, "global_step": 657808, "epoch": 7925} {"train_loss": -28.239551544189453, "global_step": 657809, "epoch": 7925} {"train_loss": -28.627960205078125, "global_step": 657810, "epoch": 7925} {"train_loss": -28.352140426635742, "global_step": 657811, "epoch": 7925} {"train_loss": -28.37567138671875, "global_step": 657812, "epoch": 7925} {"train_loss": -28.60292625427246, "global_step": 657813, "epoch": 7925} {"train_loss": -28.394140243530273, "global_step": 657814, "epoch": 7925} {"train_loss": -28.943567276000977, "global_step": 657815, "epoch": 7925} {"train_loss": -28.6881046295166, "global_step": 657816, "epoch": 7925} {"train_loss": -28.921375274658203, "global_step": 657817, "epoch": 7925} {"train_loss": -28.437759399414062, "global_step": 657818, "epoch": 7925} {"train_loss": -28.598529815673828, "global_step": 657819, "epoch": 7925} {"train_loss": -28.655057907104492, "global_step": 657820, "epoch": 7925} {"train_loss": -28.58734703063965, "global_step": 657821, "epoch": 7925} {"train_loss": -28.852283477783203, "global_step": 657822, "epoch": 7925} {"train_loss": -28.31296157836914, "global_step": 657823, "epoch": 7925} {"train_loss": -28.516752243041992, "global_step": 657824, "epoch": 7925} {"train_loss": -28.725683212280273, "global_step": 657825, "epoch": 7925} {"train_loss": -28.103933334350586, "global_step": 657826, "epoch": 7925} {"train_loss": -28.601667404174805, "global_step": 657827, "epoch": 7925} {"train_loss": -28.332067489624023, "global_step": 657828, "epoch": 7925} {"train_loss": -28.74342155456543, "global_step": 657829, "epoch": 7925} {"train_loss": -28.269678115844727, "global_step": 657830, "epoch": 7925} {"train_loss": -27.961231231689453, "global_step": 657831, "epoch": 7925} {"train_loss": -27.652143478393555, "global_step": 657832, "epoch": 7925} {"train_loss": -27.518329620361328, "global_step": 657833, "epoch": 7925} {"train_loss": -27.37690544128418, "global_step": 657834, "epoch": 7925} {"train_loss": -27.36566734313965, "global_step": 657835, "epoch": 7925} {"train_loss": -27.621246337890625, "global_step": 657836, "epoch": 7925} {"train_loss": -28.182727813720703, "global_step": 657837, "epoch": 7925} {"train_loss": -27.826725006103516, "global_step": 657838, "epoch": 7925} {"train_loss": -27.737878799438477, "global_step": 657839, "epoch": 7925} {"train_loss": -28.063995361328125, "global_step": 657840, "epoch": 7925} {"train_loss": -28.0791015625, "global_step": 657841, "epoch": 7925} {"train_loss": -27.893529891967773, "global_step": 657842, "epoch": 7925} {"train_loss": -28.118906021118164, "global_step": 657843, "epoch": 7925} {"train_loss": -27.951343536376953, "global_step": 657844, "epoch": 7925} {"train_loss": -27.94906997680664, "global_step": 657845, "epoch": 7925} {"train_loss": -28.4085750579834, "global_step": 657846, "epoch": 7925} {"train_loss": -28.120786666870117, "global_step": 657847, "epoch": 7925} {"train_loss": -28.062408447265625, "global_step": 657848, "epoch": 7925} {"train_loss": -28.14838218688965, "global_step": 657849, "epoch": 7925} {"train_loss": -28.277557373046875, "global_step": 657850, "epoch": 7925} {"train_loss": -28.52650260925293, "global_step": 657851, "epoch": 7925} {"train_loss": -28.307239532470703, "global_step": 657852, "epoch": 7925} {"train_loss": -28.242340087890625, "global_step": 657853, "epoch": 7925} {"train_loss": -28.186918258666992, "global_step": 657854, "epoch": 7925} {"train_loss": -28.58570671081543, "global_step": 657855, "epoch": 7925} {"train_loss": -28.345373153686523, "global_step": 657856, "epoch": 7925} {"train_loss": -28.226379900093537, "global_step": 657857, "epoch": 7925, "val_loss": 6699157.0} {"train_loss": -28.268712997436523, "global_step": 657858, "epoch": 7926} {"train_loss": -27.83173942565918, "global_step": 657859, "epoch": 7926} {"train_loss": -28.190099716186523, "global_step": 657860, "epoch": 7926} {"train_loss": -28.156503677368164, "global_step": 657861, "epoch": 7926} {"train_loss": -28.227527618408203, "global_step": 657862, "epoch": 7926} {"train_loss": -27.820844650268555, "global_step": 657863, "epoch": 7926} {"train_loss": -28.252243041992188, "global_step": 657864, "epoch": 7926} {"train_loss": -27.815704345703125, "global_step": 657865, "epoch": 7926} {"train_loss": -28.359601974487305, "global_step": 657866, "epoch": 7926} {"train_loss": -28.2656192779541, "global_step": 657867, "epoch": 7926} {"train_loss": -28.283588409423828, "global_step": 657868, "epoch": 7926} {"train_loss": -28.310449600219727, "global_step": 657869, "epoch": 7926} {"train_loss": -28.172626495361328, "global_step": 657870, "epoch": 7926} {"train_loss": -28.746259689331055, "global_step": 657871, "epoch": 7926} {"train_loss": -28.376623153686523, "global_step": 657872, "epoch": 7926} {"train_loss": -28.327543258666992, "global_step": 657873, "epoch": 7926} {"train_loss": -28.74492835998535, "global_step": 657874, "epoch": 7926} {"train_loss": -28.543256759643555, "global_step": 657875, "epoch": 7926} {"train_loss": -28.690412521362305, "global_step": 657876, "epoch": 7926} {"train_loss": -28.45989990234375, "global_step": 657877, "epoch": 7926} {"train_loss": -28.44441795349121, "global_step": 657878, "epoch": 7926} {"train_loss": -28.61588478088379, "global_step": 657879, "epoch": 7926} {"train_loss": -28.392333984375, "global_step": 657880, "epoch": 7926} {"train_loss": -28.548974990844727, "global_step": 657881, "epoch": 7926} {"train_loss": -28.438644409179688, "global_step": 657882, "epoch": 7926} {"train_loss": -28.453266143798828, "global_step": 657883, "epoch": 7926} {"train_loss": -28.30881118774414, "global_step": 657884, "epoch": 7926} {"train_loss": -28.510955810546875, "global_step": 657885, "epoch": 7926} {"train_loss": -28.747446060180664, "global_step": 657886, "epoch": 7926} {"train_loss": -28.277555465698242, "global_step": 657887, "epoch": 7926} {"train_loss": -28.41633415222168, "global_step": 657888, "epoch": 7926} {"train_loss": -28.354736328125, "global_step": 657889, "epoch": 7926} {"train_loss": -28.436813354492188, "global_step": 657890, "epoch": 7926} {"train_loss": -28.329633712768555, "global_step": 657891, "epoch": 7926} {"train_loss": -28.4807186126709, "global_step": 657892, "epoch": 7926} {"train_loss": -28.073766708374023, "global_step": 657893, "epoch": 7926} {"train_loss": -27.972089767456055, "global_step": 657894, "epoch": 7926} {"train_loss": -27.78317642211914, "global_step": 657895, "epoch": 7926} {"train_loss": -27.935806274414062, "global_step": 657896, "epoch": 7926} {"train_loss": -28.315841674804688, "global_step": 657897, "epoch": 7926} {"train_loss": -28.435190200805664, "global_step": 657898, "epoch": 7926} {"train_loss": -28.111927032470703, "global_step": 657899, "epoch": 7926} {"train_loss": -28.292373657226562, "global_step": 657900, "epoch": 7926} {"train_loss": -28.106470108032227, "global_step": 657901, "epoch": 7926} {"train_loss": -28.56398582458496, "global_step": 657902, "epoch": 7926} {"train_loss": -27.947052001953125, "global_step": 657903, "epoch": 7926} {"train_loss": -28.323461532592773, "global_step": 657904, "epoch": 7926} {"train_loss": -28.15376091003418, "global_step": 657905, "epoch": 7926} {"train_loss": -28.288663864135742, "global_step": 657906, "epoch": 7926} {"train_loss": -28.50446891784668, "global_step": 657907, "epoch": 7926} {"train_loss": -28.259775161743164, "global_step": 657908, "epoch": 7926} {"train_loss": -28.076282501220703, "global_step": 657909, "epoch": 7926} {"train_loss": -28.1004695892334, "global_step": 657910, "epoch": 7926} {"train_loss": -28.105640411376953, "global_step": 657911, "epoch": 7926} {"train_loss": -27.4980525970459, "global_step": 657912, "epoch": 7926} {"train_loss": -28.291519165039062, "global_step": 657913, "epoch": 7926} {"train_loss": -28.125768661499023, "global_step": 657914, "epoch": 7926} {"train_loss": -27.654346466064453, "global_step": 657915, "epoch": 7926} {"train_loss": -27.796361923217773, "global_step": 657916, "epoch": 7926} {"train_loss": -28.259321212768555, "global_step": 657917, "epoch": 7926} {"train_loss": -28.285959243774414, "global_step": 657918, "epoch": 7926} {"train_loss": -28.20362663269043, "global_step": 657919, "epoch": 7926} {"train_loss": -28.483123779296875, "global_step": 657920, "epoch": 7926} {"train_loss": -28.238874435424805, "global_step": 657921, "epoch": 7926} {"train_loss": -28.7174015045166, "global_step": 657922, "epoch": 7926} {"train_loss": -28.032758712768555, "global_step": 657923, "epoch": 7926} {"train_loss": -28.42513084411621, "global_step": 657924, "epoch": 7926} {"train_loss": -28.602453231811523, "global_step": 657925, "epoch": 7926} {"train_loss": -27.989404678344727, "global_step": 657926, "epoch": 7926} {"train_loss": -28.113834381103516, "global_step": 657927, "epoch": 7926} {"train_loss": -28.051916122436523, "global_step": 657928, "epoch": 7926} {"train_loss": -28.383581161499023, "global_step": 657929, "epoch": 7926} {"train_loss": -28.29009437561035, "global_step": 657930, "epoch": 7926} {"train_loss": -28.136194229125977, "global_step": 657931, "epoch": 7926} {"train_loss": -28.4659423828125, "global_step": 657932, "epoch": 7926} {"train_loss": -28.383136749267578, "global_step": 657933, "epoch": 7926} {"train_loss": -28.63047218322754, "global_step": 657934, "epoch": 7926} {"train_loss": -28.510969161987305, "global_step": 657935, "epoch": 7926} {"train_loss": -28.617019653320312, "global_step": 657936, "epoch": 7926} {"train_loss": -28.634092330932617, "global_step": 657937, "epoch": 7926} {"train_loss": -28.2932071685791, "global_step": 657938, "epoch": 7926} {"train_loss": -28.8312931060791, "global_step": 657939, "epoch": 7926} {"train_loss": -28.30222180378006, "global_step": 657940, "epoch": 7926, "val_loss": 6755194.0} {"train_loss": -27.765522003173828, "global_step": 657941, "epoch": 7927} {"train_loss": -27.57259178161621, "global_step": 657942, "epoch": 7927} {"train_loss": -27.387990951538086, "global_step": 657943, "epoch": 7927} {"train_loss": -27.742013931274414, "global_step": 657944, "epoch": 7927} {"train_loss": -27.4133358001709, "global_step": 657945, "epoch": 7927} {"train_loss": -27.527204513549805, "global_step": 657946, "epoch": 7927} {"train_loss": -27.695531845092773, "global_step": 657947, "epoch": 7927} {"train_loss": -27.75935173034668, "global_step": 657948, "epoch": 7927} {"train_loss": -27.497913360595703, "global_step": 657949, "epoch": 7927} {"train_loss": -27.65951919555664, "global_step": 657950, "epoch": 7927} {"train_loss": -27.675622940063477, "global_step": 657951, "epoch": 7927} {"train_loss": -27.83524513244629, "global_step": 657952, "epoch": 7927} {"train_loss": -27.90980339050293, "global_step": 657953, "epoch": 7927} {"train_loss": -28.179296493530273, "global_step": 657954, "epoch": 7927} {"train_loss": -27.9560489654541, "global_step": 657955, "epoch": 7927} {"train_loss": -28.060779571533203, "global_step": 657956, "epoch": 7927} {"train_loss": -28.03309440612793, "global_step": 657957, "epoch": 7927} {"train_loss": -28.028579711914062, "global_step": 657958, "epoch": 7927} {"train_loss": -28.322065353393555, "global_step": 657959, "epoch": 7927} {"train_loss": -28.265960693359375, "global_step": 657960, "epoch": 7927} {"train_loss": -28.6761531829834, "global_step": 657961, "epoch": 7927} {"train_loss": -28.54694938659668, "global_step": 657962, "epoch": 7927} {"train_loss": -28.2305908203125, "global_step": 657963, "epoch": 7927} {"train_loss": -28.1663818359375, "global_step": 657964, "epoch": 7927} {"train_loss": -28.450946807861328, "global_step": 657965, "epoch": 7927} {"train_loss": -28.65315055847168, "global_step": 657966, "epoch": 7927} {"train_loss": -28.319427490234375, "global_step": 657967, "epoch": 7927} {"train_loss": -28.32697105407715, "global_step": 657968, "epoch": 7927} {"train_loss": -28.49744987487793, "global_step": 657969, "epoch": 7927} {"train_loss": -28.647062301635742, "global_step": 657970, "epoch": 7927} {"train_loss": -28.315444946289062, "global_step": 657971, "epoch": 7927} {"train_loss": -28.46245765686035, "global_step": 657972, "epoch": 7927} {"train_loss": -28.2767391204834, "global_step": 657973, "epoch": 7927} {"train_loss": -28.22953224182129, "global_step": 657974, "epoch": 7927} {"train_loss": -28.087656021118164, "global_step": 657975, "epoch": 7927} {"train_loss": -28.323022842407227, "global_step": 657976, "epoch": 7927} {"train_loss": -28.5322265625, "global_step": 657977, "epoch": 7927} {"train_loss": -28.4171199798584, "global_step": 657978, "epoch": 7927} {"train_loss": -28.500268936157227, "global_step": 657979, "epoch": 7927} {"train_loss": -28.23337745666504, "global_step": 657980, "epoch": 7927} {"train_loss": -28.290380477905273, "global_step": 657981, "epoch": 7927} {"train_loss": -28.35468864440918, "global_step": 657982, "epoch": 7927} {"train_loss": -28.447784423828125, "global_step": 657983, "epoch": 7927} {"train_loss": -28.41004753112793, "global_step": 657984, "epoch": 7927} {"train_loss": -28.388639450073242, "global_step": 657985, "epoch": 7927} {"train_loss": -27.896942138671875, "global_step": 657986, "epoch": 7927} {"train_loss": -28.6947021484375, "global_step": 657987, "epoch": 7927} {"train_loss": -28.500930786132812, "global_step": 657988, "epoch": 7927} {"train_loss": -28.437625885009766, "global_step": 657989, "epoch": 7927} {"train_loss": -28.421295166015625, "global_step": 657990, "epoch": 7927} {"train_loss": -28.251440048217773, "global_step": 657991, "epoch": 7927} {"train_loss": -28.592212677001953, "global_step": 657992, "epoch": 7927} {"train_loss": -28.167829513549805, "global_step": 657993, "epoch": 7927} {"train_loss": -28.555578231811523, "global_step": 657994, "epoch": 7927} {"train_loss": -28.451719284057617, "global_step": 657995, "epoch": 7927} {"train_loss": -28.4643611907959, "global_step": 657996, "epoch": 7927} {"train_loss": -28.5591983795166, "global_step": 657997, "epoch": 7927} {"train_loss": -27.94915771484375, "global_step": 657998, "epoch": 7927} {"train_loss": -28.463958740234375, "global_step": 657999, "epoch": 7927} {"train_loss": -28.4005069732666, "global_step": 658000, "epoch": 7927} {"train_loss": -28.558429718017578, "global_step": 658001, "epoch": 7927} {"train_loss": -28.469640731811523, "global_step": 658002, "epoch": 7927} {"train_loss": -28.117328643798828, "global_step": 658003, "epoch": 7927} {"train_loss": -28.137968063354492, "global_step": 658004, "epoch": 7927} {"train_loss": -28.645172119140625, "global_step": 658005, "epoch": 7927} {"train_loss": -28.290639877319336, "global_step": 658006, "epoch": 7927} {"train_loss": -28.128904342651367, "global_step": 658007, "epoch": 7927} {"train_loss": -28.315814971923828, "global_step": 658008, "epoch": 7927} {"train_loss": -28.200408935546875, "global_step": 658009, "epoch": 7927} {"train_loss": -28.382177352905273, "global_step": 658010, "epoch": 7927} {"train_loss": -27.539793014526367, "global_step": 658011, "epoch": 7927} {"train_loss": -27.63075828552246, "global_step": 658012, "epoch": 7927} {"train_loss": -28.30977439880371, "global_step": 658013, "epoch": 7927} {"train_loss": -28.405197143554688, "global_step": 658014, "epoch": 7927} {"train_loss": -27.898834228515625, "global_step": 658015, "epoch": 7927} {"train_loss": -27.749191284179688, "global_step": 658016, "epoch": 7927} {"train_loss": -28.111013412475586, "global_step": 658017, "epoch": 7927} {"train_loss": -28.442758560180664, "global_step": 658018, "epoch": 7927} {"train_loss": -28.48345375061035, "global_step": 658019, "epoch": 7927} {"train_loss": -28.48508644104004, "global_step": 658020, "epoch": 7927} {"train_loss": -28.30035400390625, "global_step": 658021, "epoch": 7927} {"train_loss": -28.035612106323242, "global_step": 658022, "epoch": 7927} {"train_loss": -28.196961161601973, "global_step": 658023, "epoch": 7927, "val_loss": 6687247.0} {"train_loss": -26.885046005249023, "global_step": 658024, "epoch": 7928} {"train_loss": -27.388263702392578, "global_step": 658025, "epoch": 7928} {"train_loss": -27.86781883239746, "global_step": 658026, "epoch": 7928} {"train_loss": -27.414749145507812, "global_step": 658027, "epoch": 7928} {"train_loss": -27.823888778686523, "global_step": 658028, "epoch": 7928} {"train_loss": -27.849538803100586, "global_step": 658029, "epoch": 7928} {"train_loss": -27.161436080932617, "global_step": 658030, "epoch": 7928} {"train_loss": -28.251758575439453, "global_step": 658031, "epoch": 7928} {"train_loss": -27.444814682006836, "global_step": 658032, "epoch": 7928} {"train_loss": -28.13720703125, "global_step": 658033, "epoch": 7928} {"train_loss": -27.78005027770996, "global_step": 658034, "epoch": 7928} {"train_loss": -28.13555335998535, "global_step": 658035, "epoch": 7928} {"train_loss": -27.797687530517578, "global_step": 658036, "epoch": 7928} {"train_loss": -27.9464111328125, "global_step": 658037, "epoch": 7928} {"train_loss": -27.93964958190918, "global_step": 658038, "epoch": 7928} {"train_loss": -27.91354751586914, "global_step": 658039, "epoch": 7928} {"train_loss": -28.039770126342773, "global_step": 658040, "epoch": 7928} {"train_loss": -27.949377059936523, "global_step": 658041, "epoch": 7928} {"train_loss": -27.97254753112793, "global_step": 658042, "epoch": 7928} {"train_loss": -28.20819664001465, "global_step": 658043, "epoch": 7928} {"train_loss": -27.910491943359375, "global_step": 658044, "epoch": 7928} {"train_loss": -28.113412857055664, "global_step": 658045, "epoch": 7928} {"train_loss": -28.12529945373535, "global_step": 658046, "epoch": 7928} {"train_loss": -28.63591957092285, "global_step": 658047, "epoch": 7928} {"train_loss": -27.97566795349121, "global_step": 658048, "epoch": 7928} {"train_loss": -28.297143936157227, "global_step": 658049, "epoch": 7928} {"train_loss": -28.252546310424805, "global_step": 658050, "epoch": 7928} {"train_loss": -28.31793212890625, "global_step": 658051, "epoch": 7928} {"train_loss": -28.08222770690918, "global_step": 658052, "epoch": 7928} {"train_loss": -27.93292808532715, "global_step": 658053, "epoch": 7928} {"train_loss": -28.320592880249023, "global_step": 658054, "epoch": 7928} {"train_loss": -28.25801658630371, "global_step": 658055, "epoch": 7928} {"train_loss": -28.056013107299805, "global_step": 658056, "epoch": 7928} {"train_loss": -27.705657958984375, "global_step": 658057, "epoch": 7928} {"train_loss": -28.40620994567871, "global_step": 658058, "epoch": 7928} {"train_loss": -28.29401969909668, "global_step": 658059, "epoch": 7928} {"train_loss": -28.30023193359375, "global_step": 658060, "epoch": 7928} {"train_loss": -28.238758087158203, "global_step": 658061, "epoch": 7928} {"train_loss": -28.3829345703125, "global_step": 658062, "epoch": 7928} {"train_loss": -28.1979923248291, "global_step": 658063, "epoch": 7928} {"train_loss": -28.341968536376953, "global_step": 658064, "epoch": 7928} {"train_loss": -28.4070987701416, "global_step": 658065, "epoch": 7928} {"train_loss": -28.054401397705078, "global_step": 658066, "epoch": 7928} {"train_loss": -28.54558753967285, "global_step": 658067, "epoch": 7928} {"train_loss": -28.632190704345703, "global_step": 658068, "epoch": 7928} {"train_loss": -28.43825340270996, "global_step": 658069, "epoch": 7928} {"train_loss": -28.506946563720703, "global_step": 658070, "epoch": 7928} {"train_loss": -28.512205123901367, "global_step": 658071, "epoch": 7928} {"train_loss": -29.105382919311523, "global_step": 658072, "epoch": 7928} {"train_loss": -28.509916305541992, "global_step": 658073, "epoch": 7928} {"train_loss": -28.43438720703125, "global_step": 658074, "epoch": 7928} {"train_loss": -28.63632583618164, "global_step": 658075, "epoch": 7928} {"train_loss": -28.604572296142578, "global_step": 658076, "epoch": 7928} {"train_loss": -28.378528594970703, "global_step": 658077, "epoch": 7928} {"train_loss": -28.49587059020996, "global_step": 658078, "epoch": 7928} {"train_loss": -28.649290084838867, "global_step": 658079, "epoch": 7928} {"train_loss": -28.576004028320312, "global_step": 658080, "epoch": 7928} {"train_loss": -28.684711456298828, "global_step": 658081, "epoch": 7928} {"train_loss": -28.53455924987793, "global_step": 658082, "epoch": 7928} {"train_loss": -28.9543399810791, "global_step": 658083, "epoch": 7928} {"train_loss": -28.7737979888916, "global_step": 658084, "epoch": 7928} {"train_loss": -28.525175094604492, "global_step": 658085, "epoch": 7928} {"train_loss": -28.682117462158203, "global_step": 658086, "epoch": 7928} {"train_loss": -29.004430770874023, "global_step": 658087, "epoch": 7928} {"train_loss": -28.6983642578125, "global_step": 658088, "epoch": 7928} {"train_loss": -28.512470245361328, "global_step": 658089, "epoch": 7928} {"train_loss": -28.23419761657715, "global_step": 658090, "epoch": 7928} {"train_loss": -29.064321517944336, "global_step": 658091, "epoch": 7928} {"train_loss": -28.839696884155273, "global_step": 658092, "epoch": 7928} {"train_loss": -28.35890007019043, "global_step": 658093, "epoch": 7928} {"train_loss": -28.429758071899414, "global_step": 658094, "epoch": 7928} {"train_loss": -27.927343368530273, "global_step": 658095, "epoch": 7928} {"train_loss": -27.736291885375977, "global_step": 658096, "epoch": 7928} {"train_loss": -27.337936401367188, "global_step": 658097, "epoch": 7928} {"train_loss": -27.02105712890625, "global_step": 658098, "epoch": 7928} {"train_loss": -26.735509872436523, "global_step": 658099, "epoch": 7928} {"train_loss": -26.964405059814453, "global_step": 658100, "epoch": 7928} {"train_loss": -27.977087020874023, "global_step": 658101, "epoch": 7928} {"train_loss": -28.01580238342285, "global_step": 658102, "epoch": 7928} {"train_loss": -27.56314468383789, "global_step": 658103, "epoch": 7928} {"train_loss": -28.167882919311523, "global_step": 658104, "epoch": 7928} {"train_loss": -28.321516036987305, "global_step": 658105, "epoch": 7928} {"train_loss": -28.168765401265706, "global_step": 658106, "epoch": 7928, "val_loss": 6738791.0} {"train_loss": -27.442712783813477, "global_step": 658107, "epoch": 7929} {"train_loss": -27.86676025390625, "global_step": 658108, "epoch": 7929} {"train_loss": -27.41607666015625, "global_step": 658109, "epoch": 7929} {"train_loss": -28.055479049682617, "global_step": 658110, "epoch": 7929} {"train_loss": -27.581501007080078, "global_step": 658111, "epoch": 7929} {"train_loss": -27.9084415435791, "global_step": 658112, "epoch": 7929} {"train_loss": -27.854022979736328, "global_step": 658113, "epoch": 7929} {"train_loss": -27.860828399658203, "global_step": 658114, "epoch": 7929} {"train_loss": -27.924097061157227, "global_step": 658115, "epoch": 7929} {"train_loss": -27.519535064697266, "global_step": 658116, "epoch": 7929} {"train_loss": -27.492368698120117, "global_step": 658117, "epoch": 7929} {"train_loss": -27.24810218811035, "global_step": 658118, "epoch": 7929} {"train_loss": -27.727619171142578, "global_step": 658119, "epoch": 7929} {"train_loss": -27.792211532592773, "global_step": 658120, "epoch": 7929} {"train_loss": -27.859302520751953, "global_step": 658121, "epoch": 7929} {"train_loss": -28.25685691833496, "global_step": 658122, "epoch": 7929} {"train_loss": -28.103702545166016, "global_step": 658123, "epoch": 7929} {"train_loss": -27.96259880065918, "global_step": 658124, "epoch": 7929} {"train_loss": -28.032825469970703, "global_step": 658125, "epoch": 7929} {"train_loss": -28.232831954956055, "global_step": 658126, "epoch": 7929} {"train_loss": -27.933984756469727, "global_step": 658127, "epoch": 7929} {"train_loss": -28.06475257873535, "global_step": 658128, "epoch": 7929} {"train_loss": -28.123022079467773, "global_step": 658129, "epoch": 7929} {"train_loss": -28.514860153198242, "global_step": 658130, "epoch": 7929} {"train_loss": -27.956708908081055, "global_step": 658131, "epoch": 7929} {"train_loss": -27.8742618560791, "global_step": 658132, "epoch": 7929} {"train_loss": -28.609418869018555, "global_step": 658133, "epoch": 7929} {"train_loss": -28.15888786315918, "global_step": 658134, "epoch": 7929} {"train_loss": -28.13242530822754, "global_step": 658135, "epoch": 7929} {"train_loss": -28.338916778564453, "global_step": 658136, "epoch": 7929} {"train_loss": -28.125049591064453, "global_step": 658137, "epoch": 7929} {"train_loss": -27.923627853393555, "global_step": 658138, "epoch": 7929} {"train_loss": -28.105911254882812, "global_step": 658139, "epoch": 7929} {"train_loss": -28.58041763305664, "global_step": 658140, "epoch": 7929} {"train_loss": -28.31838035583496, "global_step": 658141, "epoch": 7929} {"train_loss": -28.31190299987793, "global_step": 658142, "epoch": 7929} {"train_loss": -28.62939453125, "global_step": 658143, "epoch": 7929} {"train_loss": -28.15095329284668, "global_step": 658144, "epoch": 7929} {"train_loss": -28.502593994140625, "global_step": 658145, "epoch": 7929} {"train_loss": -28.1201171875, "global_step": 658146, "epoch": 7929} {"train_loss": -28.352252960205078, "global_step": 658147, "epoch": 7929} {"train_loss": -27.844934463500977, "global_step": 658148, "epoch": 7929} {"train_loss": -28.445409774780273, "global_step": 658149, "epoch": 7929} {"train_loss": -27.932825088500977, "global_step": 658150, "epoch": 7929} {"train_loss": -28.21394157409668, "global_step": 658151, "epoch": 7929} {"train_loss": -27.94219398498535, "global_step": 658152, "epoch": 7929} {"train_loss": -28.894153594970703, "global_step": 658153, "epoch": 7929} {"train_loss": -28.55997657775879, "global_step": 658154, "epoch": 7929} {"train_loss": -28.44405174255371, "global_step": 658155, "epoch": 7929} {"train_loss": -28.674711227416992, "global_step": 658156, "epoch": 7929} {"train_loss": -28.5451602935791, "global_step": 658157, "epoch": 7929} {"train_loss": -28.339344024658203, "global_step": 658158, "epoch": 7929} {"train_loss": -28.522674560546875, "global_step": 658159, "epoch": 7929} {"train_loss": -28.419382095336914, "global_step": 658160, "epoch": 7929} {"train_loss": -28.47108268737793, "global_step": 658161, "epoch": 7929} {"train_loss": -28.406055450439453, "global_step": 658162, "epoch": 7929} {"train_loss": -28.89740562438965, "global_step": 658163, "epoch": 7929} {"train_loss": -28.1838436126709, "global_step": 658164, "epoch": 7929} {"train_loss": -28.61371421813965, "global_step": 658165, "epoch": 7929} {"train_loss": -28.39887809753418, "global_step": 658166, "epoch": 7929} {"train_loss": -28.229040145874023, "global_step": 658167, "epoch": 7929} {"train_loss": -28.561864852905273, "global_step": 658168, "epoch": 7929} {"train_loss": -28.472375869750977, "global_step": 658169, "epoch": 7929} {"train_loss": -28.270343780517578, "global_step": 658170, "epoch": 7929} {"train_loss": -28.52349853515625, "global_step": 658171, "epoch": 7929} {"train_loss": -28.494964599609375, "global_step": 658172, "epoch": 7929} {"train_loss": -28.656509399414062, "global_step": 658173, "epoch": 7929} {"train_loss": -28.561063766479492, "global_step": 658174, "epoch": 7929} {"train_loss": -28.44832420349121, "global_step": 658175, "epoch": 7929} {"train_loss": -28.452054977416992, "global_step": 658176, "epoch": 7929} {"train_loss": -28.288848876953125, "global_step": 658177, "epoch": 7929} {"train_loss": -28.13530921936035, "global_step": 658178, "epoch": 7929} {"train_loss": -28.36016845703125, "global_step": 658179, "epoch": 7929} {"train_loss": -28.04327392578125, "global_step": 658180, "epoch": 7929} {"train_loss": -28.035654067993164, "global_step": 658181, "epoch": 7929} {"train_loss": -28.30903434753418, "global_step": 658182, "epoch": 7929} {"train_loss": -28.74724769592285, "global_step": 658183, "epoch": 7929} {"train_loss": -28.297292709350586, "global_step": 658184, "epoch": 7929} {"train_loss": -28.494611740112305, "global_step": 658185, "epoch": 7929} {"train_loss": -28.52729606628418, "global_step": 658186, "epoch": 7929} {"train_loss": -28.393829345703125, "global_step": 658187, "epoch": 7929} {"train_loss": -28.087926864624023, "global_step": 658188, "epoch": 7929} {"train_loss": -28.195863861635505, "global_step": 658189, "epoch": 7929, "val_loss": 6811073.0} {"train_loss": -26.620361328125, "global_step": 658190, "epoch": 7930} {"train_loss": -26.85748291015625, "global_step": 658191, "epoch": 7930} {"train_loss": -26.241071701049805, "global_step": 658192, "epoch": 7930} {"train_loss": -27.253448486328125, "global_step": 658193, "epoch": 7930} {"train_loss": -27.070669174194336, "global_step": 658194, "epoch": 7930} {"train_loss": -26.863971710205078, "global_step": 658195, "epoch": 7930} {"train_loss": -27.555143356323242, "global_step": 658196, "epoch": 7930} {"train_loss": -27.757064819335938, "global_step": 658197, "epoch": 7930} {"train_loss": -27.0299015045166, "global_step": 658198, "epoch": 7930} {"train_loss": -27.1809139251709, "global_step": 658199, "epoch": 7930} {"train_loss": -27.714130401611328, "global_step": 658200, "epoch": 7930} {"train_loss": -27.34568214416504, "global_step": 658201, "epoch": 7930} {"train_loss": -27.855304718017578, "global_step": 658202, "epoch": 7930} {"train_loss": -27.9122371673584, "global_step": 658203, "epoch": 7930} {"train_loss": -27.8102970123291, "global_step": 658204, "epoch": 7930} {"train_loss": -27.911405563354492, "global_step": 658205, "epoch": 7930} {"train_loss": -27.081912994384766, "global_step": 658206, "epoch": 7930} {"train_loss": -27.820478439331055, "global_step": 658207, "epoch": 7930} {"train_loss": -27.325092315673828, "global_step": 658208, "epoch": 7930} {"train_loss": -27.803272247314453, "global_step": 658209, "epoch": 7930} {"train_loss": -27.9446964263916, "global_step": 658210, "epoch": 7930} {"train_loss": -27.938474655151367, "global_step": 658211, "epoch": 7930} {"train_loss": -27.723432540893555, "global_step": 658212, "epoch": 7930} {"train_loss": -27.78248405456543, "global_step": 658213, "epoch": 7930} {"train_loss": -28.146652221679688, "global_step": 658214, "epoch": 7930} {"train_loss": -27.89531898498535, "global_step": 658215, "epoch": 7930} {"train_loss": -28.01654052734375, "global_step": 658216, "epoch": 7930} {"train_loss": -27.774572372436523, "global_step": 658217, "epoch": 7930} {"train_loss": -28.53912925720215, "global_step": 658218, "epoch": 7930} {"train_loss": -28.187610626220703, "global_step": 658219, "epoch": 7930} {"train_loss": -28.231231689453125, "global_step": 658220, "epoch": 7930} {"train_loss": -28.30743408203125, "global_step": 658221, "epoch": 7930} {"train_loss": -28.353498458862305, "global_step": 658222, "epoch": 7930} {"train_loss": -28.03843116760254, "global_step": 658223, "epoch": 7930} {"train_loss": -28.104806900024414, "global_step": 658224, "epoch": 7930} {"train_loss": -28.274927139282227, "global_step": 658225, "epoch": 7930} {"train_loss": -28.12565040588379, "global_step": 658226, "epoch": 7930} {"train_loss": -28.21442222595215, "global_step": 658227, "epoch": 7930} {"train_loss": -28.423425674438477, "global_step": 658228, "epoch": 7930} {"train_loss": -28.18768310546875, "global_step": 658229, "epoch": 7930} {"train_loss": -28.39811134338379, "global_step": 658230, "epoch": 7930} {"train_loss": -28.30293083190918, "global_step": 658231, "epoch": 7930} {"train_loss": -28.18098258972168, "global_step": 658232, "epoch": 7930} {"train_loss": -28.564069747924805, "global_step": 658233, "epoch": 7930} {"train_loss": -28.278472900390625, "global_step": 658234, "epoch": 7930} {"train_loss": -28.467498779296875, "global_step": 658235, "epoch": 7930} {"train_loss": -28.30344009399414, "global_step": 658236, "epoch": 7930} {"train_loss": -28.6966552734375, "global_step": 658237, "epoch": 7930} {"train_loss": -27.89728355407715, "global_step": 658238, "epoch": 7930} {"train_loss": -28.294097900390625, "global_step": 658239, "epoch": 7930} {"train_loss": -28.517404556274414, "global_step": 658240, "epoch": 7930} {"train_loss": -28.530460357666016, "global_step": 658241, "epoch": 7930} {"train_loss": -28.552438735961914, "global_step": 658242, "epoch": 7930} {"train_loss": -28.457489013671875, "global_step": 658243, "epoch": 7930} {"train_loss": -28.638914108276367, "global_step": 658244, "epoch": 7930} {"train_loss": -28.461828231811523, "global_step": 658245, "epoch": 7930} {"train_loss": -28.353900909423828, "global_step": 658246, "epoch": 7930} {"train_loss": -28.3824462890625, "global_step": 658247, "epoch": 7930} {"train_loss": -28.643375396728516, "global_step": 658248, "epoch": 7930} {"train_loss": -28.6203670501709, "global_step": 658249, "epoch": 7930} {"train_loss": -28.658538818359375, "global_step": 658250, "epoch": 7930} {"train_loss": -28.641077041625977, "global_step": 658251, "epoch": 7930} {"train_loss": -28.427478790283203, "global_step": 658252, "epoch": 7930} {"train_loss": -28.338171005249023, "global_step": 658253, "epoch": 7930} {"train_loss": -28.382551193237305, "global_step": 658254, "epoch": 7930} {"train_loss": -28.626523971557617, "global_step": 658255, "epoch": 7930} {"train_loss": -28.33652114868164, "global_step": 658256, "epoch": 7930} {"train_loss": -28.022287368774414, "global_step": 658257, "epoch": 7930} {"train_loss": -28.69110679626465, "global_step": 658258, "epoch": 7930} {"train_loss": -28.284311294555664, "global_step": 658259, "epoch": 7930} {"train_loss": -28.4449462890625, "global_step": 658260, "epoch": 7930} {"train_loss": -27.791730880737305, "global_step": 658261, "epoch": 7930} {"train_loss": -28.193634033203125, "global_step": 658262, "epoch": 7930} {"train_loss": -28.121185302734375, "global_step": 658263, "epoch": 7930} {"train_loss": -28.50056266784668, "global_step": 658264, "epoch": 7930} {"train_loss": -28.31597328186035, "global_step": 658265, "epoch": 7930} {"train_loss": -28.523534774780273, "global_step": 658266, "epoch": 7930} {"train_loss": -28.657079696655273, "global_step": 658267, "epoch": 7930} {"train_loss": -28.0264892578125, "global_step": 658268, "epoch": 7930} {"train_loss": -28.435087203979492, "global_step": 658269, "epoch": 7930} {"train_loss": -28.3630313873291, "global_step": 658270, "epoch": 7930} {"train_loss": -28.06308937072754, "global_step": 658271, "epoch": 7930} {"train_loss": -28.061511832547474, "global_step": 658272, "epoch": 7930, "val_loss": 6612877.0} {"train_loss": -27.646392822265625, "global_step": 658273, "epoch": 7931} {"train_loss": -27.888355255126953, "global_step": 658274, "epoch": 7931} {"train_loss": -27.320037841796875, "global_step": 658275, "epoch": 7931} {"train_loss": -27.5440731048584, "global_step": 658276, "epoch": 7931} {"train_loss": -27.001941680908203, "global_step": 658277, "epoch": 7931} {"train_loss": -26.748376846313477, "global_step": 658278, "epoch": 7931} {"train_loss": -25.266687393188477, "global_step": 658279, "epoch": 7931} {"train_loss": -26.174640655517578, "global_step": 658280, "epoch": 7931} {"train_loss": -27.436298370361328, "global_step": 658281, "epoch": 7931} {"train_loss": -26.49251365661621, "global_step": 658282, "epoch": 7931} {"train_loss": -27.435504913330078, "global_step": 658283, "epoch": 7931} {"train_loss": -27.19174575805664, "global_step": 658284, "epoch": 7931} {"train_loss": -27.49188804626465, "global_step": 658285, "epoch": 7931} {"train_loss": -27.243488311767578, "global_step": 658286, "epoch": 7931} {"train_loss": -27.411121368408203, "global_step": 658287, "epoch": 7931} {"train_loss": -27.153440475463867, "global_step": 658288, "epoch": 7931} {"train_loss": -27.636077880859375, "global_step": 658289, "epoch": 7931} {"train_loss": -27.3668270111084, "global_step": 658290, "epoch": 7931} {"train_loss": -27.703542709350586, "global_step": 658291, "epoch": 7931} {"train_loss": -27.272275924682617, "global_step": 658292, "epoch": 7931} {"train_loss": -27.5742130279541, "global_step": 658293, "epoch": 7931} {"train_loss": -27.903295516967773, "global_step": 658294, "epoch": 7931} {"train_loss": -27.61663246154785, "global_step": 658295, "epoch": 7931} {"train_loss": -27.739551544189453, "global_step": 658296, "epoch": 7931} {"train_loss": -27.91825294494629, "global_step": 658297, "epoch": 7931} {"train_loss": -27.8244686126709, "global_step": 658298, "epoch": 7931} {"train_loss": -27.934879302978516, "global_step": 658299, "epoch": 7931} {"train_loss": -27.82752799987793, "global_step": 658300, "epoch": 7931} {"train_loss": -28.104772567749023, "global_step": 658301, "epoch": 7931} {"train_loss": -28.1829776763916, "global_step": 658302, "epoch": 7931} {"train_loss": -27.995819091796875, "global_step": 658303, "epoch": 7931} {"train_loss": -28.126239776611328, "global_step": 658304, "epoch": 7931} {"train_loss": -28.393842697143555, "global_step": 658305, "epoch": 7931} {"train_loss": -28.106969833374023, "global_step": 658306, "epoch": 7931} {"train_loss": -28.087543487548828, "global_step": 658307, "epoch": 7931} {"train_loss": -28.249591827392578, "global_step": 658308, "epoch": 7931} {"train_loss": -28.308338165283203, "global_step": 658309, "epoch": 7931} {"train_loss": -28.263254165649414, "global_step": 658310, "epoch": 7931} {"train_loss": -28.164011001586914, "global_step": 658311, "epoch": 7931} {"train_loss": -28.256711959838867, "global_step": 658312, "epoch": 7931} {"train_loss": -28.376007080078125, "global_step": 658313, "epoch": 7931} {"train_loss": -28.2561092376709, "global_step": 658314, "epoch": 7931} {"train_loss": -28.196435928344727, "global_step": 658315, "epoch": 7931} {"train_loss": -28.196813583374023, "global_step": 658316, "epoch": 7931} {"train_loss": -27.920486450195312, "global_step": 658317, "epoch": 7931} {"train_loss": -28.02484703063965, "global_step": 658318, "epoch": 7931} {"train_loss": -28.076868057250977, "global_step": 658319, "epoch": 7931} {"train_loss": -28.2879638671875, "global_step": 658320, "epoch": 7931} {"train_loss": -28.06952476501465, "global_step": 658321, "epoch": 7931} {"train_loss": -28.235654830932617, "global_step": 658322, "epoch": 7931} {"train_loss": -28.142200469970703, "global_step": 658323, "epoch": 7931} {"train_loss": -28.644651412963867, "global_step": 658324, "epoch": 7931} {"train_loss": -28.53287696838379, "global_step": 658325, "epoch": 7931} {"train_loss": -28.2332763671875, "global_step": 658326, "epoch": 7931} {"train_loss": -28.49665641784668, "global_step": 658327, "epoch": 7931} {"train_loss": -28.367294311523438, "global_step": 658328, "epoch": 7931} {"train_loss": -28.557987213134766, "global_step": 658329, "epoch": 7931} {"train_loss": -28.34732437133789, "global_step": 658330, "epoch": 7931} {"train_loss": -28.404682159423828, "global_step": 658331, "epoch": 7931} {"train_loss": -28.540555953979492, "global_step": 658332, "epoch": 7931} {"train_loss": -28.373737335205078, "global_step": 658333, "epoch": 7931} {"train_loss": -28.287338256835938, "global_step": 658334, "epoch": 7931} {"train_loss": -28.412006378173828, "global_step": 658335, "epoch": 7931} {"train_loss": -28.61514663696289, "global_step": 658336, "epoch": 7931} {"train_loss": -28.35492515563965, "global_step": 658337, "epoch": 7931} {"train_loss": -28.10809326171875, "global_step": 658338, "epoch": 7931} {"train_loss": -28.57401466369629, "global_step": 658339, "epoch": 7931} {"train_loss": -28.636676788330078, "global_step": 658340, "epoch": 7931} {"train_loss": -28.837507247924805, "global_step": 658341, "epoch": 7931} {"train_loss": -28.128055572509766, "global_step": 658342, "epoch": 7931} {"train_loss": -28.83892822265625, "global_step": 658343, "epoch": 7931} {"train_loss": -28.471227645874023, "global_step": 658344, "epoch": 7931} {"train_loss": -28.409101486206055, "global_step": 658345, "epoch": 7931} {"train_loss": -28.188129425048828, "global_step": 658346, "epoch": 7931} {"train_loss": -28.601465225219727, "global_step": 658347, "epoch": 7931} {"train_loss": -28.6976261138916, "global_step": 658348, "epoch": 7931} {"train_loss": -27.9051513671875, "global_step": 658349, "epoch": 7931} {"train_loss": -28.097064971923828, "global_step": 658350, "epoch": 7931} {"train_loss": -28.49200439453125, "global_step": 658351, "epoch": 7931} {"train_loss": -28.589780807495117, "global_step": 658352, "epoch": 7931} {"train_loss": -28.74582862854004, "global_step": 658353, "epoch": 7931} {"train_loss": -28.596155166625977, "global_step": 658354, "epoch": 7931} {"train_loss": -27.996415471456135, "global_step": 658355, "epoch": 7931, "val_loss": 6636376.0} {"train_loss": -27.840595245361328, "global_step": 658356, "epoch": 7932} {"train_loss": -27.836027145385742, "global_step": 658357, "epoch": 7932} {"train_loss": -27.853530883789062, "global_step": 658358, "epoch": 7932} {"train_loss": -27.82710075378418, "global_step": 658359, "epoch": 7932} {"train_loss": -27.7320499420166, "global_step": 658360, "epoch": 7932} {"train_loss": -28.060461044311523, "global_step": 658361, "epoch": 7932} {"train_loss": -27.431293487548828, "global_step": 658362, "epoch": 7932} {"train_loss": -27.08587646484375, "global_step": 658363, "epoch": 7932} {"train_loss": -27.5700626373291, "global_step": 658364, "epoch": 7932} {"train_loss": -27.978559494018555, "global_step": 658365, "epoch": 7932} {"train_loss": -27.48563003540039, "global_step": 658366, "epoch": 7932} {"train_loss": -27.77985191345215, "global_step": 658367, "epoch": 7932} {"train_loss": -28.024667739868164, "global_step": 658368, "epoch": 7932} {"train_loss": -27.803205490112305, "global_step": 658369, "epoch": 7932} {"train_loss": -27.839075088500977, "global_step": 658370, "epoch": 7932} {"train_loss": -27.988250732421875, "global_step": 658371, "epoch": 7932} {"train_loss": -27.902786254882812, "global_step": 658372, "epoch": 7932} {"train_loss": -27.975988388061523, "global_step": 658373, "epoch": 7932} {"train_loss": -28.113996505737305, "global_step": 658374, "epoch": 7932} {"train_loss": -28.028278350830078, "global_step": 658375, "epoch": 7932} {"train_loss": -28.49627685546875, "global_step": 658376, "epoch": 7932} {"train_loss": -28.055912017822266, "global_step": 658377, "epoch": 7932} {"train_loss": -28.134801864624023, "global_step": 658378, "epoch": 7932} {"train_loss": -28.05286979675293, "global_step": 658379, "epoch": 7932} {"train_loss": -28.286758422851562, "global_step": 658380, "epoch": 7932} {"train_loss": -28.246713638305664, "global_step": 658381, "epoch": 7932} {"train_loss": -27.86336326599121, "global_step": 658382, "epoch": 7932} {"train_loss": -28.20529556274414, "global_step": 658383, "epoch": 7932} {"train_loss": -27.87091064453125, "global_step": 658384, "epoch": 7932} {"train_loss": -28.17217445373535, "global_step": 658385, "epoch": 7932} {"train_loss": -28.180341720581055, "global_step": 658386, "epoch": 7932} {"train_loss": -27.93408203125, "global_step": 658387, "epoch": 7932} {"train_loss": -28.418867111206055, "global_step": 658388, "epoch": 7932} {"train_loss": -28.404287338256836, "global_step": 658389, "epoch": 7932} {"train_loss": -28.542951583862305, "global_step": 658390, "epoch": 7932} {"train_loss": -28.063013076782227, "global_step": 658391, "epoch": 7932} {"train_loss": -28.31854248046875, "global_step": 658392, "epoch": 7932} {"train_loss": -28.46585464477539, "global_step": 658393, "epoch": 7932} {"train_loss": -28.124027252197266, "global_step": 658394, "epoch": 7932} {"train_loss": -28.236642837524414, "global_step": 658395, "epoch": 7932} {"train_loss": -28.399662017822266, "global_step": 658396, "epoch": 7932} {"train_loss": -28.284025192260742, "global_step": 658397, "epoch": 7932} {"train_loss": -28.396039962768555, "global_step": 658398, "epoch": 7932} {"train_loss": -28.200973510742188, "global_step": 658399, "epoch": 7932} {"train_loss": -27.655609130859375, "global_step": 658400, "epoch": 7932} {"train_loss": -28.472064971923828, "global_step": 658401, "epoch": 7932} {"train_loss": -28.231969833374023, "global_step": 658402, "epoch": 7932} {"train_loss": -28.440032958984375, "global_step": 658403, "epoch": 7932} {"train_loss": -28.634069442749023, "global_step": 658404, "epoch": 7932} {"train_loss": -28.238855361938477, "global_step": 658405, "epoch": 7932} {"train_loss": -28.317474365234375, "global_step": 658406, "epoch": 7932} {"train_loss": -28.36781120300293, "global_step": 658407, "epoch": 7932} {"train_loss": -28.035404205322266, "global_step": 658408, "epoch": 7932} {"train_loss": -27.919843673706055, "global_step": 658409, "epoch": 7932} {"train_loss": -28.618072509765625, "global_step": 658410, "epoch": 7932} {"train_loss": -28.005090713500977, "global_step": 658411, "epoch": 7932} {"train_loss": -27.818517684936523, "global_step": 658412, "epoch": 7932} {"train_loss": -28.096643447875977, "global_step": 658413, "epoch": 7932} {"train_loss": -28.33375358581543, "global_step": 658414, "epoch": 7932} {"train_loss": -28.29432487487793, "global_step": 658415, "epoch": 7932} {"train_loss": -28.464563369750977, "global_step": 658416, "epoch": 7932} {"train_loss": -28.367109298706055, "global_step": 658417, "epoch": 7932} {"train_loss": -28.435302734375, "global_step": 658418, "epoch": 7932} {"train_loss": -28.33892250061035, "global_step": 658419, "epoch": 7932} {"train_loss": -28.678686141967773, "global_step": 658420, "epoch": 7932} {"train_loss": -28.019184112548828, "global_step": 658421, "epoch": 7932} {"train_loss": -28.115711212158203, "global_step": 658422, "epoch": 7932} {"train_loss": -28.444793701171875, "global_step": 658423, "epoch": 7932} {"train_loss": -28.45269203186035, "global_step": 658424, "epoch": 7932} {"train_loss": -28.518945693969727, "global_step": 658425, "epoch": 7932} {"train_loss": -28.60207176208496, "global_step": 658426, "epoch": 7932} {"train_loss": -28.63064956665039, "global_step": 658427, "epoch": 7932} {"train_loss": -28.299551010131836, "global_step": 658428, "epoch": 7932} {"train_loss": -28.011798858642578, "global_step": 658429, "epoch": 7932} {"train_loss": -28.583616256713867, "global_step": 658430, "epoch": 7932} {"train_loss": -28.048627853393555, "global_step": 658431, "epoch": 7932} {"train_loss": -28.237747192382812, "global_step": 658432, "epoch": 7932} {"train_loss": -28.671171188354492, "global_step": 658433, "epoch": 7932} {"train_loss": -28.220239639282227, "global_step": 658434, "epoch": 7932} {"train_loss": -28.530710220336914, "global_step": 658435, "epoch": 7932} {"train_loss": -28.222471237182617, "global_step": 658436, "epoch": 7932} {"train_loss": -28.670276641845703, "global_step": 658437, "epoch": 7932} {"train_loss": -28.14834344243429, "global_step": 658438, "epoch": 7932, "val_loss": 6602100.0} {"train_loss": -28.130050659179688, "global_step": 658439, "epoch": 7933} {"train_loss": -27.59351921081543, "global_step": 658440, "epoch": 7933} {"train_loss": -27.82618522644043, "global_step": 658441, "epoch": 7933} {"train_loss": -28.387664794921875, "global_step": 658442, "epoch": 7933} {"train_loss": -28.171064376831055, "global_step": 658443, "epoch": 7933} {"train_loss": -27.909894943237305, "global_step": 658444, "epoch": 7933} {"train_loss": -28.124591827392578, "global_step": 658445, "epoch": 7933} {"train_loss": -27.755353927612305, "global_step": 658446, "epoch": 7933} {"train_loss": -27.783771514892578, "global_step": 658447, "epoch": 7933} {"train_loss": -27.937414169311523, "global_step": 658448, "epoch": 7933} {"train_loss": -28.15594482421875, "global_step": 658449, "epoch": 7933} {"train_loss": -28.058252334594727, "global_step": 658450, "epoch": 7933} {"train_loss": -28.38081169128418, "global_step": 658451, "epoch": 7933} {"train_loss": -28.36448097229004, "global_step": 658452, "epoch": 7933} {"train_loss": -28.16948890686035, "global_step": 658453, "epoch": 7933} {"train_loss": -27.6303653717041, "global_step": 658454, "epoch": 7933} {"train_loss": -28.157733917236328, "global_step": 658455, "epoch": 7933} {"train_loss": -27.844465255737305, "global_step": 658456, "epoch": 7933} {"train_loss": -28.041488647460938, "global_step": 658457, "epoch": 7933} {"train_loss": -27.919260025024414, "global_step": 658458, "epoch": 7933} {"train_loss": -27.9096622467041, "global_step": 658459, "epoch": 7933} {"train_loss": -28.172794342041016, "global_step": 658460, "epoch": 7933} {"train_loss": -27.792133331298828, "global_step": 658461, "epoch": 7933} {"train_loss": -28.1707763671875, "global_step": 658462, "epoch": 7933} {"train_loss": -27.963163375854492, "global_step": 658463, "epoch": 7933} {"train_loss": -28.245641708374023, "global_step": 658464, "epoch": 7933} {"train_loss": -28.18145179748535, "global_step": 658465, "epoch": 7933} {"train_loss": -28.024993896484375, "global_step": 658466, "epoch": 7933} {"train_loss": -28.241323471069336, "global_step": 658467, "epoch": 7933} {"train_loss": -28.203964233398438, "global_step": 658468, "epoch": 7933} {"train_loss": -27.88380241394043, "global_step": 658469, "epoch": 7933} {"train_loss": -28.3819637298584, "global_step": 658470, "epoch": 7933} {"train_loss": -28.25176429748535, "global_step": 658471, "epoch": 7933} {"train_loss": -28.175817489624023, "global_step": 658472, "epoch": 7933} {"train_loss": -28.297988891601562, "global_step": 658473, "epoch": 7933} {"train_loss": -28.054229736328125, "global_step": 658474, "epoch": 7933} {"train_loss": -27.94093894958496, "global_step": 658475, "epoch": 7933} {"train_loss": -27.993757247924805, "global_step": 658476, "epoch": 7933} {"train_loss": -27.902048110961914, "global_step": 658477, "epoch": 7933} {"train_loss": -28.279077529907227, "global_step": 658478, "epoch": 7933} {"train_loss": -28.41278076171875, "global_step": 658479, "epoch": 7933} {"train_loss": -28.158903121948242, "global_step": 658480, "epoch": 7933} {"train_loss": -28.32744789123535, "global_step": 658481, "epoch": 7933} {"train_loss": -28.060758590698242, "global_step": 658482, "epoch": 7933} {"train_loss": -28.803449630737305, "global_step": 658483, "epoch": 7933} {"train_loss": -28.47067642211914, "global_step": 658484, "epoch": 7933} {"train_loss": -28.23366355895996, "global_step": 658485, "epoch": 7933} {"train_loss": -28.22157859802246, "global_step": 658486, "epoch": 7933} {"train_loss": -28.49286460876465, "global_step": 658487, "epoch": 7933} {"train_loss": -28.51483726501465, "global_step": 658488, "epoch": 7933} {"train_loss": -28.337570190429688, "global_step": 658489, "epoch": 7933} {"train_loss": -28.490234375, "global_step": 658490, "epoch": 7933} {"train_loss": -28.514190673828125, "global_step": 658491, "epoch": 7933} {"train_loss": -28.781335830688477, "global_step": 658492, "epoch": 7933} {"train_loss": -28.75812339782715, "global_step": 658493, "epoch": 7933} {"train_loss": -28.314462661743164, "global_step": 658494, "epoch": 7933} {"train_loss": -28.34111976623535, "global_step": 658495, "epoch": 7933} {"train_loss": -28.65467643737793, "global_step": 658496, "epoch": 7933} {"train_loss": -28.262598037719727, "global_step": 658497, "epoch": 7933} {"train_loss": -28.292104721069336, "global_step": 658498, "epoch": 7933} {"train_loss": -28.262548446655273, "global_step": 658499, "epoch": 7933} {"train_loss": -27.9886417388916, "global_step": 658500, "epoch": 7933} {"train_loss": -28.90435791015625, "global_step": 658501, "epoch": 7933} {"train_loss": -28.294462203979492, "global_step": 658502, "epoch": 7933} {"train_loss": -28.628101348876953, "global_step": 658503, "epoch": 7933} {"train_loss": -28.39460563659668, "global_step": 658504, "epoch": 7933} {"train_loss": -28.501571655273438, "global_step": 658505, "epoch": 7933} {"train_loss": -28.271713256835938, "global_step": 658506, "epoch": 7933} {"train_loss": -28.322790145874023, "global_step": 658507, "epoch": 7933} {"train_loss": -28.21343421936035, "global_step": 658508, "epoch": 7933} {"train_loss": -28.662389755249023, "global_step": 658509, "epoch": 7933} {"train_loss": -28.244953155517578, "global_step": 658510, "epoch": 7933} {"train_loss": -28.78265953063965, "global_step": 658511, "epoch": 7933} {"train_loss": -28.1090145111084, "global_step": 658512, "epoch": 7933} {"train_loss": -28.118865966796875, "global_step": 658513, "epoch": 7933} {"train_loss": -28.21728515625, "global_step": 658514, "epoch": 7933} {"train_loss": -28.505651473999023, "global_step": 658515, "epoch": 7933} {"train_loss": -28.474348068237305, "global_step": 658516, "epoch": 7933} {"train_loss": -28.490446090698242, "global_step": 658517, "epoch": 7933} {"train_loss": -28.986865997314453, "global_step": 658518, "epoch": 7933} {"train_loss": -28.025480270385742, "global_step": 658519, "epoch": 7933} {"train_loss": -27.915002822875977, "global_step": 658520, "epoch": 7933} {"train_loss": -28.227114252297277, "global_step": 658521, "epoch": 7933, "val_loss": 6563359.0} {"train_loss": -26.5745792388916, "global_step": 658522, "epoch": 7934} {"train_loss": -26.88201904296875, "global_step": 658523, "epoch": 7934} {"train_loss": -26.83619499206543, "global_step": 658524, "epoch": 7934} {"train_loss": -26.915616989135742, "global_step": 658525, "epoch": 7934} {"train_loss": -27.26806640625, "global_step": 658526, "epoch": 7934} {"train_loss": -27.086383819580078, "global_step": 658527, "epoch": 7934} {"train_loss": -27.447656631469727, "global_step": 658528, "epoch": 7934} {"train_loss": -27.362394332885742, "global_step": 658529, "epoch": 7934} {"train_loss": -27.1173038482666, "global_step": 658530, "epoch": 7934} {"train_loss": -27.04839515686035, "global_step": 658531, "epoch": 7934} {"train_loss": -27.1192626953125, "global_step": 658532, "epoch": 7934} {"train_loss": -27.528076171875, "global_step": 658533, "epoch": 7934} {"train_loss": -27.36134147644043, "global_step": 658534, "epoch": 7934} {"train_loss": -27.0040283203125, "global_step": 658535, "epoch": 7934} {"train_loss": -27.32586097717285, "global_step": 658536, "epoch": 7934} {"train_loss": -27.49566078186035, "global_step": 658537, "epoch": 7934} {"train_loss": -27.549718856811523, "global_step": 658538, "epoch": 7934} {"train_loss": -27.605615615844727, "global_step": 658539, "epoch": 7934} {"train_loss": -27.851139068603516, "global_step": 658540, "epoch": 7934} {"train_loss": -27.930328369140625, "global_step": 658541, "epoch": 7934} {"train_loss": -27.907438278198242, "global_step": 658542, "epoch": 7934} {"train_loss": -27.442432403564453, "global_step": 658543, "epoch": 7934} {"train_loss": -27.757312774658203, "global_step": 658544, "epoch": 7934} {"train_loss": -27.854360580444336, "global_step": 658545, "epoch": 7934} {"train_loss": -27.66656494140625, "global_step": 658546, "epoch": 7934} {"train_loss": -27.59035301208496, "global_step": 658547, "epoch": 7934} {"train_loss": -27.618459701538086, "global_step": 658548, "epoch": 7934} {"train_loss": -27.59134292602539, "global_step": 658549, "epoch": 7934} {"train_loss": -27.9493408203125, "global_step": 658550, "epoch": 7934} {"train_loss": -27.810916900634766, "global_step": 658551, "epoch": 7934} {"train_loss": -28.10163688659668, "global_step": 658552, "epoch": 7934} {"train_loss": -28.121973037719727, "global_step": 658553, "epoch": 7934} {"train_loss": -27.958057403564453, "global_step": 658554, "epoch": 7934} {"train_loss": -28.157867431640625, "global_step": 658555, "epoch": 7934} {"train_loss": -28.263492584228516, "global_step": 658556, "epoch": 7934} {"train_loss": -28.02521324157715, "global_step": 658557, "epoch": 7934} {"train_loss": -27.634185791015625, "global_step": 658558, "epoch": 7934} {"train_loss": -27.884984970092773, "global_step": 658559, "epoch": 7934} {"train_loss": -27.992544174194336, "global_step": 658560, "epoch": 7934} {"train_loss": -28.342466354370117, "global_step": 658561, "epoch": 7934} {"train_loss": -28.52213478088379, "global_step": 658562, "epoch": 7934} {"train_loss": -28.07435417175293, "global_step": 658563, "epoch": 7934} {"train_loss": -28.37348747253418, "global_step": 658564, "epoch": 7934} {"train_loss": -28.204349517822266, "global_step": 658565, "epoch": 7934} {"train_loss": -28.47146987915039, "global_step": 658566, "epoch": 7934} {"train_loss": -27.884702682495117, "global_step": 658567, "epoch": 7934} {"train_loss": -28.01816177368164, "global_step": 658568, "epoch": 7934} {"train_loss": -28.374799728393555, "global_step": 658569, "epoch": 7934} {"train_loss": -28.521411895751953, "global_step": 658570, "epoch": 7934} {"train_loss": -28.147993087768555, "global_step": 658571, "epoch": 7934} {"train_loss": -28.230688095092773, "global_step": 658572, "epoch": 7934} {"train_loss": -28.214365005493164, "global_step": 658573, "epoch": 7934} {"train_loss": -28.404102325439453, "global_step": 658574, "epoch": 7934} {"train_loss": -28.377777099609375, "global_step": 658575, "epoch": 7934} {"train_loss": -27.98209571838379, "global_step": 658576, "epoch": 7934} {"train_loss": -28.2976131439209, "global_step": 658577, "epoch": 7934} {"train_loss": -28.24213981628418, "global_step": 658578, "epoch": 7934} {"train_loss": -28.53179931640625, "global_step": 658579, "epoch": 7934} {"train_loss": -28.49009132385254, "global_step": 658580, "epoch": 7934} {"train_loss": -28.199392318725586, "global_step": 658581, "epoch": 7934} {"train_loss": -28.330188751220703, "global_step": 658582, "epoch": 7934} {"train_loss": -28.898481369018555, "global_step": 658583, "epoch": 7934} {"train_loss": -28.47673988342285, "global_step": 658584, "epoch": 7934} {"train_loss": -28.77617835998535, "global_step": 658585, "epoch": 7934} {"train_loss": -28.59872817993164, "global_step": 658586, "epoch": 7934} {"train_loss": -28.78232192993164, "global_step": 658587, "epoch": 7934} {"train_loss": -28.476062774658203, "global_step": 658588, "epoch": 7934} {"train_loss": -28.381759643554688, "global_step": 658589, "epoch": 7934} {"train_loss": -28.217853546142578, "global_step": 658590, "epoch": 7934} {"train_loss": -28.061920166015625, "global_step": 658591, "epoch": 7934} {"train_loss": -27.18906021118164, "global_step": 658592, "epoch": 7934} {"train_loss": -26.819250106811523, "global_step": 658593, "epoch": 7934} {"train_loss": -27.516895294189453, "global_step": 658594, "epoch": 7934} {"train_loss": -28.35090446472168, "global_step": 658595, "epoch": 7934} {"train_loss": -27.71150779724121, "global_step": 658596, "epoch": 7934} {"train_loss": -27.634057998657227, "global_step": 658597, "epoch": 7934} {"train_loss": -28.124942779541016, "global_step": 658598, "epoch": 7934} {"train_loss": -28.03070640563965, "global_step": 658599, "epoch": 7934} {"train_loss": -28.317432403564453, "global_step": 658600, "epoch": 7934} {"train_loss": -28.141345977783203, "global_step": 658601, "epoch": 7934} {"train_loss": -28.330921173095703, "global_step": 658602, "epoch": 7934} {"train_loss": -27.96384048461914, "global_step": 658603, "epoch": 7934} {"train_loss": -27.908831378063525, "global_step": 658604, "epoch": 7934, "val_loss": 6587980.5} {"train_loss": -27.372507095336914, "global_step": 658605, "epoch": 7935} {"train_loss": -27.617172241210938, "global_step": 658606, "epoch": 7935} {"train_loss": -27.51053810119629, "global_step": 658607, "epoch": 7935} {"train_loss": -27.69561767578125, "global_step": 658608, "epoch": 7935} {"train_loss": -27.334823608398438, "global_step": 658609, "epoch": 7935} {"train_loss": -27.374174118041992, "global_step": 658610, "epoch": 7935} {"train_loss": -27.749786376953125, "global_step": 658611, "epoch": 7935} {"train_loss": -28.143131256103516, "global_step": 658612, "epoch": 7935} {"train_loss": -27.646957397460938, "global_step": 658613, "epoch": 7935} {"train_loss": -27.94906997680664, "global_step": 658614, "epoch": 7935} {"train_loss": -28.120458602905273, "global_step": 658615, "epoch": 7935} {"train_loss": -27.70195960998535, "global_step": 658616, "epoch": 7935} {"train_loss": -27.39149284362793, "global_step": 658617, "epoch": 7935} {"train_loss": -28.059492111206055, "global_step": 658618, "epoch": 7935} {"train_loss": -27.99542236328125, "global_step": 658619, "epoch": 7935} {"train_loss": -28.469715118408203, "global_step": 658620, "epoch": 7935} {"train_loss": -28.146331787109375, "global_step": 658621, "epoch": 7935} {"train_loss": -28.069168090820312, "global_step": 658622, "epoch": 7935} {"train_loss": -27.976221084594727, "global_step": 658623, "epoch": 7935} {"train_loss": -28.291629791259766, "global_step": 658624, "epoch": 7935} {"train_loss": -28.35577392578125, "global_step": 658625, "epoch": 7935} {"train_loss": -28.371524810791016, "global_step": 658626, "epoch": 7935} {"train_loss": -27.955459594726562, "global_step": 658627, "epoch": 7935} {"train_loss": -28.30498695373535, "global_step": 658628, "epoch": 7935} {"train_loss": -28.57158851623535, "global_step": 658629, "epoch": 7935} {"train_loss": -28.149036407470703, "global_step": 658630, "epoch": 7935} {"train_loss": -28.541000366210938, "global_step": 658631, "epoch": 7935} {"train_loss": -28.236480712890625, "global_step": 658632, "epoch": 7935} {"train_loss": -28.3090877532959, "global_step": 658633, "epoch": 7935} {"train_loss": -28.048227310180664, "global_step": 658634, "epoch": 7935} {"train_loss": -28.683645248413086, "global_step": 658635, "epoch": 7935} {"train_loss": -28.69025230407715, "global_step": 658636, "epoch": 7935} {"train_loss": -28.544225692749023, "global_step": 658637, "epoch": 7935} {"train_loss": -28.547277450561523, "global_step": 658638, "epoch": 7935} {"train_loss": -28.2340145111084, "global_step": 658639, "epoch": 7935} {"train_loss": -28.537805557250977, "global_step": 658640, "epoch": 7935} {"train_loss": -28.485544204711914, "global_step": 658641, "epoch": 7935} {"train_loss": -28.081018447875977, "global_step": 658642, "epoch": 7935} {"train_loss": -27.910675048828125, "global_step": 658643, "epoch": 7935} {"train_loss": -27.85552406311035, "global_step": 658644, "epoch": 7935} {"train_loss": -27.384801864624023, "global_step": 658645, "epoch": 7935} {"train_loss": -28.218896865844727, "global_step": 658646, "epoch": 7935} {"train_loss": -28.513809204101562, "global_step": 658647, "epoch": 7935} {"train_loss": -27.975400924682617, "global_step": 658648, "epoch": 7935} {"train_loss": -27.89678955078125, "global_step": 658649, "epoch": 7935} {"train_loss": -28.5799560546875, "global_step": 658650, "epoch": 7935} {"train_loss": -27.96278190612793, "global_step": 658651, "epoch": 7935} {"train_loss": -28.570173263549805, "global_step": 658652, "epoch": 7935} {"train_loss": -27.935773849487305, "global_step": 658653, "epoch": 7935} {"train_loss": -28.298419952392578, "global_step": 658654, "epoch": 7935} {"train_loss": -28.134885787963867, "global_step": 658655, "epoch": 7935} {"train_loss": -28.52329444885254, "global_step": 658656, "epoch": 7935} {"train_loss": -29.00349235534668, "global_step": 658657, "epoch": 7935} {"train_loss": -28.272268295288086, "global_step": 658658, "epoch": 7935} {"train_loss": -28.01739501953125, "global_step": 658659, "epoch": 7935} {"train_loss": -28.502126693725586, "global_step": 658660, "epoch": 7935} {"train_loss": -28.3564453125, "global_step": 658661, "epoch": 7935} {"train_loss": -28.630945205688477, "global_step": 658662, "epoch": 7935} {"train_loss": -28.68405532836914, "global_step": 658663, "epoch": 7935} {"train_loss": -28.361845016479492, "global_step": 658664, "epoch": 7935} {"train_loss": -28.266809463500977, "global_step": 658665, "epoch": 7935} {"train_loss": -28.0831356048584, "global_step": 658666, "epoch": 7935} {"train_loss": -28.248498916625977, "global_step": 658667, "epoch": 7935} {"train_loss": -28.581134796142578, "global_step": 658668, "epoch": 7935} {"train_loss": -28.194005966186523, "global_step": 658669, "epoch": 7935} {"train_loss": -28.320465087890625, "global_step": 658670, "epoch": 7935} {"train_loss": -28.528772354125977, "global_step": 658671, "epoch": 7935} {"train_loss": -28.033273696899414, "global_step": 658672, "epoch": 7935} {"train_loss": -28.6915340423584, "global_step": 658673, "epoch": 7935} {"train_loss": -28.3660945892334, "global_step": 658674, "epoch": 7935} {"train_loss": -28.251373291015625, "global_step": 658675, "epoch": 7935} {"train_loss": -28.531436920166016, "global_step": 658676, "epoch": 7935} {"train_loss": -28.3320369720459, "global_step": 658677, "epoch": 7935} {"train_loss": -28.480390548706055, "global_step": 658678, "epoch": 7935} {"train_loss": -28.328855514526367, "global_step": 658679, "epoch": 7935} {"train_loss": -28.202392578125, "global_step": 658680, "epoch": 7935} {"train_loss": -28.25416374206543, "global_step": 658681, "epoch": 7935} {"train_loss": -28.4407958984375, "global_step": 658682, "epoch": 7935} {"train_loss": -28.380151748657227, "global_step": 658683, "epoch": 7935} {"train_loss": -28.322845458984375, "global_step": 658684, "epoch": 7935} {"train_loss": -28.49420738220215, "global_step": 658685, "epoch": 7935} {"train_loss": -28.274188995361328, "global_step": 658686, "epoch": 7935} {"train_loss": -28.188271350171192, "global_step": 658687, "epoch": 7935, "val_loss": 6592065.0} {"train_loss": -27.9989070892334, "global_step": 658688, "epoch": 7936} {"train_loss": -28.052093505859375, "global_step": 658689, "epoch": 7936} {"train_loss": -28.431055068969727, "global_step": 658690, "epoch": 7936} {"train_loss": -28.27573013305664, "global_step": 658691, "epoch": 7936} {"train_loss": -28.088193893432617, "global_step": 658692, "epoch": 7936} {"train_loss": -27.724735260009766, "global_step": 658693, "epoch": 7936} {"train_loss": -27.9486083984375, "global_step": 658694, "epoch": 7936} {"train_loss": -28.215295791625977, "global_step": 658695, "epoch": 7936} {"train_loss": -28.361682891845703, "global_step": 658696, "epoch": 7936} {"train_loss": -28.181262969970703, "global_step": 658697, "epoch": 7936} {"train_loss": -28.229658126831055, "global_step": 658698, "epoch": 7936} {"train_loss": -28.031362533569336, "global_step": 658699, "epoch": 7936} {"train_loss": -28.020401000976562, "global_step": 658700, "epoch": 7936} {"train_loss": -28.125280380249023, "global_step": 658701, "epoch": 7936} {"train_loss": -28.5385799407959, "global_step": 658702, "epoch": 7936} {"train_loss": -28.296472549438477, "global_step": 658703, "epoch": 7936} {"train_loss": -28.319238662719727, "global_step": 658704, "epoch": 7936} {"train_loss": -28.327550888061523, "global_step": 658705, "epoch": 7936} {"train_loss": -28.498083114624023, "global_step": 658706, "epoch": 7936} {"train_loss": -28.137298583984375, "global_step": 658707, "epoch": 7936} {"train_loss": -28.35664176940918, "global_step": 658708, "epoch": 7936} {"train_loss": -28.2889347076416, "global_step": 658709, "epoch": 7936} {"train_loss": -28.409067153930664, "global_step": 658710, "epoch": 7936} {"train_loss": -28.077817916870117, "global_step": 658711, "epoch": 7936} {"train_loss": -28.82390785217285, "global_step": 658712, "epoch": 7936} {"train_loss": -28.123029708862305, "global_step": 658713, "epoch": 7936} {"train_loss": -28.372573852539062, "global_step": 658714, "epoch": 7936} {"train_loss": -28.374298095703125, "global_step": 658715, "epoch": 7936} {"train_loss": -28.371978759765625, "global_step": 658716, "epoch": 7936} {"train_loss": -28.530675888061523, "global_step": 658717, "epoch": 7936} {"train_loss": -28.309350967407227, "global_step": 658718, "epoch": 7936} {"train_loss": -28.39666175842285, "global_step": 658719, "epoch": 7936} {"train_loss": -28.791034698486328, "global_step": 658720, "epoch": 7936} {"train_loss": -27.991138458251953, "global_step": 658721, "epoch": 7936} {"train_loss": -28.54037857055664, "global_step": 658722, "epoch": 7936} {"train_loss": -28.13886070251465, "global_step": 658723, "epoch": 7936} {"train_loss": -28.456327438354492, "global_step": 658724, "epoch": 7936} {"train_loss": -28.237314224243164, "global_step": 658725, "epoch": 7936} {"train_loss": -28.669843673706055, "global_step": 658726, "epoch": 7936} {"train_loss": -28.560501098632812, "global_step": 658727, "epoch": 7936} {"train_loss": -28.19342613220215, "global_step": 658728, "epoch": 7936} {"train_loss": -28.644941329956055, "global_step": 658729, "epoch": 7936} {"train_loss": -28.1516056060791, "global_step": 658730, "epoch": 7936} {"train_loss": -28.128812789916992, "global_step": 658731, "epoch": 7936} {"train_loss": -28.229291915893555, "global_step": 658732, "epoch": 7936} {"train_loss": -28.030887603759766, "global_step": 658733, "epoch": 7936} {"train_loss": -27.67449378967285, "global_step": 658734, "epoch": 7936} {"train_loss": -27.946765899658203, "global_step": 658735, "epoch": 7936} {"train_loss": -28.593679428100586, "global_step": 658736, "epoch": 7936} {"train_loss": -28.286169052124023, "global_step": 658737, "epoch": 7936} {"train_loss": -28.43946647644043, "global_step": 658738, "epoch": 7936} {"train_loss": -28.53675651550293, "global_step": 658739, "epoch": 7936} {"train_loss": -28.123376846313477, "global_step": 658740, "epoch": 7936} {"train_loss": -28.143476486206055, "global_step": 658741, "epoch": 7936} {"train_loss": -27.813018798828125, "global_step": 658742, "epoch": 7936} {"train_loss": -28.035083770751953, "global_step": 658743, "epoch": 7936} {"train_loss": -27.877765655517578, "global_step": 658744, "epoch": 7936} {"train_loss": -28.24652671813965, "global_step": 658745, "epoch": 7936} {"train_loss": -27.797834396362305, "global_step": 658746, "epoch": 7936} {"train_loss": -28.11270523071289, "global_step": 658747, "epoch": 7936} {"train_loss": -28.420217514038086, "global_step": 658748, "epoch": 7936} {"train_loss": -28.358774185180664, "global_step": 658749, "epoch": 7936} {"train_loss": -27.644880294799805, "global_step": 658750, "epoch": 7936} {"train_loss": -28.129169464111328, "global_step": 658751, "epoch": 7936} {"train_loss": -27.864587783813477, "global_step": 658752, "epoch": 7936} {"train_loss": -28.042123794555664, "global_step": 658753, "epoch": 7936} {"train_loss": -28.126663208007812, "global_step": 658754, "epoch": 7936} {"train_loss": -27.948871612548828, "global_step": 658755, "epoch": 7936} {"train_loss": -28.43055534362793, "global_step": 658756, "epoch": 7936} {"train_loss": -27.806640625, "global_step": 658757, "epoch": 7936} {"train_loss": -28.174184799194336, "global_step": 658758, "epoch": 7936} {"train_loss": -27.921451568603516, "global_step": 658759, "epoch": 7936} {"train_loss": -28.410049438476562, "global_step": 658760, "epoch": 7936} {"train_loss": -27.9697322845459, "global_step": 658761, "epoch": 7936} {"train_loss": -27.92531394958496, "global_step": 658762, "epoch": 7936} {"train_loss": -28.149494171142578, "global_step": 658763, "epoch": 7936} {"train_loss": -28.106597900390625, "global_step": 658764, "epoch": 7936} {"train_loss": -28.222549438476562, "global_step": 658765, "epoch": 7936} {"train_loss": -27.984512329101562, "global_step": 658766, "epoch": 7936} {"train_loss": -27.962854385375977, "global_step": 658767, "epoch": 7936} {"train_loss": -28.580249786376953, "global_step": 658768, "epoch": 7936} {"train_loss": -28.391510009765625, "global_step": 658769, "epoch": 7936} {"train_loss": -28.212510580039886, "global_step": 658770, "epoch": 7936, "val_loss": 6573404.0} {"train_loss": -27.862157821655273, "global_step": 658771, "epoch": 7937} {"train_loss": -28.100549697875977, "global_step": 658772, "epoch": 7937} {"train_loss": -28.07354164123535, "global_step": 658773, "epoch": 7937} {"train_loss": -28.33339500427246, "global_step": 658774, "epoch": 7937} {"train_loss": -28.205846786499023, "global_step": 658775, "epoch": 7937} {"train_loss": -27.870752334594727, "global_step": 658776, "epoch": 7937} {"train_loss": -28.095630645751953, "global_step": 658777, "epoch": 7937} {"train_loss": -27.939184188842773, "global_step": 658778, "epoch": 7937} {"train_loss": -27.958724975585938, "global_step": 658779, "epoch": 7937} {"train_loss": -27.931655883789062, "global_step": 658780, "epoch": 7937} {"train_loss": -28.183984756469727, "global_step": 658781, "epoch": 7937} {"train_loss": -28.162931442260742, "global_step": 658782, "epoch": 7937} {"train_loss": -28.11505699157715, "global_step": 658783, "epoch": 7937} {"train_loss": -28.39737319946289, "global_step": 658784, "epoch": 7937} {"train_loss": -28.31829833984375, "global_step": 658785, "epoch": 7937} {"train_loss": -28.2164306640625, "global_step": 658786, "epoch": 7937} {"train_loss": -28.237585067749023, "global_step": 658787, "epoch": 7937} {"train_loss": -28.63442039489746, "global_step": 658788, "epoch": 7937} {"train_loss": -28.0920467376709, "global_step": 658789, "epoch": 7937} {"train_loss": -28.30889892578125, "global_step": 658790, "epoch": 7937} {"train_loss": -28.38471794128418, "global_step": 658791, "epoch": 7937} {"train_loss": -28.292123794555664, "global_step": 658792, "epoch": 7937} {"train_loss": -28.450611114501953, "global_step": 658793, "epoch": 7937} {"train_loss": -28.017475128173828, "global_step": 658794, "epoch": 7937} {"train_loss": -28.47025489807129, "global_step": 658795, "epoch": 7937} {"train_loss": -28.446027755737305, "global_step": 658796, "epoch": 7937} {"train_loss": -28.48091697692871, "global_step": 658797, "epoch": 7937} {"train_loss": -28.38712501525879, "global_step": 658798, "epoch": 7937} {"train_loss": -28.724584579467773, "global_step": 658799, "epoch": 7937} {"train_loss": -28.5835018157959, "global_step": 658800, "epoch": 7937} {"train_loss": -28.476587295532227, "global_step": 658801, "epoch": 7937} {"train_loss": -28.349645614624023, "global_step": 658802, "epoch": 7937} {"train_loss": -27.73381996154785, "global_step": 658803, "epoch": 7937} {"train_loss": -27.163864135742188, "global_step": 658804, "epoch": 7937} {"train_loss": -27.537994384765625, "global_step": 658805, "epoch": 7937} {"train_loss": -28.267810821533203, "global_step": 658806, "epoch": 7937} {"train_loss": -27.8689022064209, "global_step": 658807, "epoch": 7937} {"train_loss": -27.280914306640625, "global_step": 658808, "epoch": 7937} {"train_loss": -27.966785430908203, "global_step": 658809, "epoch": 7937} {"train_loss": -27.71112632751465, "global_step": 658810, "epoch": 7937} {"train_loss": -28.1700382232666, "global_step": 658811, "epoch": 7937} {"train_loss": -27.643102645874023, "global_step": 658812, "epoch": 7937} {"train_loss": -27.697172164916992, "global_step": 658813, "epoch": 7937} {"train_loss": -28.42335319519043, "global_step": 658814, "epoch": 7937} {"train_loss": -27.77753257751465, "global_step": 658815, "epoch": 7937} {"train_loss": -28.340574264526367, "global_step": 658816, "epoch": 7937} {"train_loss": -28.329456329345703, "global_step": 658817, "epoch": 7937} {"train_loss": -27.762542724609375, "global_step": 658818, "epoch": 7937} {"train_loss": -27.980304718017578, "global_step": 658819, "epoch": 7937} {"train_loss": -27.69106101989746, "global_step": 658820, "epoch": 7937} {"train_loss": -28.182592391967773, "global_step": 658821, "epoch": 7937} {"train_loss": -27.99871253967285, "global_step": 658822, "epoch": 7937} {"train_loss": -27.9676570892334, "global_step": 658823, "epoch": 7937} {"train_loss": -28.535322189331055, "global_step": 658824, "epoch": 7937} {"train_loss": -28.07391357421875, "global_step": 658825, "epoch": 7937} {"train_loss": -27.973127365112305, "global_step": 658826, "epoch": 7937} {"train_loss": -28.1831111907959, "global_step": 658827, "epoch": 7937} {"train_loss": -27.90581703186035, "global_step": 658828, "epoch": 7937} {"train_loss": -28.256561279296875, "global_step": 658829, "epoch": 7937} {"train_loss": -28.15077018737793, "global_step": 658830, "epoch": 7937} {"train_loss": -28.61957359313965, "global_step": 658831, "epoch": 7937} {"train_loss": -28.009891510009766, "global_step": 658832, "epoch": 7937} {"train_loss": -27.966733932495117, "global_step": 658833, "epoch": 7937} {"train_loss": -28.636144638061523, "global_step": 658834, "epoch": 7937} {"train_loss": -28.33234977722168, "global_step": 658835, "epoch": 7937} {"train_loss": -28.441843032836914, "global_step": 658836, "epoch": 7937} {"train_loss": -28.5496883392334, "global_step": 658837, "epoch": 7937} {"train_loss": -28.653945922851562, "global_step": 658838, "epoch": 7937} {"train_loss": -28.578222274780273, "global_step": 658839, "epoch": 7937} {"train_loss": -28.1910457611084, "global_step": 658840, "epoch": 7937} {"train_loss": -28.501953125, "global_step": 658841, "epoch": 7937} {"train_loss": -28.44495964050293, "global_step": 658842, "epoch": 7937} {"train_loss": -28.461881637573242, "global_step": 658843, "epoch": 7937} {"train_loss": -28.646100997924805, "global_step": 658844, "epoch": 7937} {"train_loss": -28.521198272705078, "global_step": 658845, "epoch": 7937} {"train_loss": -28.182947158813477, "global_step": 658846, "epoch": 7937} {"train_loss": -28.699628829956055, "global_step": 658847, "epoch": 7937} {"train_loss": -28.73545265197754, "global_step": 658848, "epoch": 7937} {"train_loss": -28.614887237548828, "global_step": 658849, "epoch": 7937} {"train_loss": -28.57280921936035, "global_step": 658850, "epoch": 7937} {"train_loss": -28.189788818359375, "global_step": 658851, "epoch": 7937} {"train_loss": -28.113178253173828, "global_step": 658852, "epoch": 7937} {"train_loss": -28.205044459147626, "global_step": 658853, "epoch": 7937, "val_loss": 6683924.0} {"train_loss": -27.734617233276367, "global_step": 658854, "epoch": 7938} {"train_loss": -27.288482666015625, "global_step": 658855, "epoch": 7938} {"train_loss": -26.35304832458496, "global_step": 658856, "epoch": 7938} {"train_loss": -25.608856201171875, "global_step": 658857, "epoch": 7938} {"train_loss": -26.90389060974121, "global_step": 658858, "epoch": 7938} {"train_loss": -27.977996826171875, "global_step": 658859, "epoch": 7938} {"train_loss": -26.473270416259766, "global_step": 658860, "epoch": 7938} {"train_loss": -27.642683029174805, "global_step": 658861, "epoch": 7938} {"train_loss": -26.91242790222168, "global_step": 658862, "epoch": 7938} {"train_loss": -27.735471725463867, "global_step": 658863, "epoch": 7938} {"train_loss": -27.74964714050293, "global_step": 658864, "epoch": 7938} {"train_loss": -27.63169288635254, "global_step": 658865, "epoch": 7938} {"train_loss": -27.992206573486328, "global_step": 658866, "epoch": 7938} {"train_loss": -28.173236846923828, "global_step": 658867, "epoch": 7938} {"train_loss": -27.696704864501953, "global_step": 658868, "epoch": 7938} {"train_loss": -28.060882568359375, "global_step": 658869, "epoch": 7938} {"train_loss": -27.580108642578125, "global_step": 658870, "epoch": 7938} {"train_loss": -27.889005661010742, "global_step": 658871, "epoch": 7938} {"train_loss": -28.09326171875, "global_step": 658872, "epoch": 7938} {"train_loss": -27.872577667236328, "global_step": 658873, "epoch": 7938} {"train_loss": -27.652219772338867, "global_step": 658874, "epoch": 7938} {"train_loss": -27.66115379333496, "global_step": 658875, "epoch": 7938} {"train_loss": -28.077728271484375, "global_step": 658876, "epoch": 7938} {"train_loss": -27.76380729675293, "global_step": 658877, "epoch": 7938} {"train_loss": -28.07826042175293, "global_step": 658878, "epoch": 7938} {"train_loss": -27.77120018005371, "global_step": 658879, "epoch": 7938} {"train_loss": -28.252954483032227, "global_step": 658880, "epoch": 7938} {"train_loss": -28.120197296142578, "global_step": 658881, "epoch": 7938} {"train_loss": -27.82173728942871, "global_step": 658882, "epoch": 7938} {"train_loss": -28.104690551757812, "global_step": 658883, "epoch": 7938} {"train_loss": -28.289417266845703, "global_step": 658884, "epoch": 7938} {"train_loss": -28.43633460998535, "global_step": 658885, "epoch": 7938} {"train_loss": -27.84307289123535, "global_step": 658886, "epoch": 7938} {"train_loss": -28.330286026000977, "global_step": 658887, "epoch": 7938} {"train_loss": -28.331756591796875, "global_step": 658888, "epoch": 7938} {"train_loss": -27.956388473510742, "global_step": 658889, "epoch": 7938} {"train_loss": -28.080358505249023, "global_step": 658890, "epoch": 7938} {"train_loss": -28.28485107421875, "global_step": 658891, "epoch": 7938} {"train_loss": -28.408105850219727, "global_step": 658892, "epoch": 7938} {"train_loss": -28.474685668945312, "global_step": 658893, "epoch": 7938} {"train_loss": -28.411487579345703, "global_step": 658894, "epoch": 7938} {"train_loss": -28.66650390625, "global_step": 658895, "epoch": 7938} {"train_loss": -28.357275009155273, "global_step": 658896, "epoch": 7938} {"train_loss": -28.448230743408203, "global_step": 658897, "epoch": 7938} {"train_loss": -28.57004165649414, "global_step": 658898, "epoch": 7938} {"train_loss": -28.337247848510742, "global_step": 658899, "epoch": 7938} {"train_loss": -27.840320587158203, "global_step": 658900, "epoch": 7938} {"train_loss": -27.746923446655273, "global_step": 658901, "epoch": 7938} {"train_loss": -28.486347198486328, "global_step": 658902, "epoch": 7938} {"train_loss": -28.149017333984375, "global_step": 658903, "epoch": 7938} {"train_loss": -28.094207763671875, "global_step": 658904, "epoch": 7938} {"train_loss": -28.0694637298584, "global_step": 658905, "epoch": 7938} {"train_loss": -28.26422119140625, "global_step": 658906, "epoch": 7938} {"train_loss": -28.2105712890625, "global_step": 658907, "epoch": 7938} {"train_loss": -28.34519386291504, "global_step": 658908, "epoch": 7938} {"train_loss": -28.448352813720703, "global_step": 658909, "epoch": 7938} {"train_loss": -28.302335739135742, "global_step": 658910, "epoch": 7938} {"train_loss": -28.255695343017578, "global_step": 658911, "epoch": 7938} {"train_loss": -28.446857452392578, "global_step": 658912, "epoch": 7938} {"train_loss": -28.481311798095703, "global_step": 658913, "epoch": 7938} {"train_loss": -28.17317008972168, "global_step": 658914, "epoch": 7938} {"train_loss": -28.48105239868164, "global_step": 658915, "epoch": 7938} {"train_loss": -28.403522491455078, "global_step": 658916, "epoch": 7938} {"train_loss": -28.38051414489746, "global_step": 658917, "epoch": 7938} {"train_loss": -28.448383331298828, "global_step": 658918, "epoch": 7938} {"train_loss": -28.254098892211914, "global_step": 658919, "epoch": 7938} {"train_loss": -28.362058639526367, "global_step": 658920, "epoch": 7938} {"train_loss": -28.40155029296875, "global_step": 658921, "epoch": 7938} {"train_loss": -28.359283447265625, "global_step": 658922, "epoch": 7938} {"train_loss": -28.545551300048828, "global_step": 658923, "epoch": 7938} {"train_loss": -28.5384578704834, "global_step": 658924, "epoch": 7938} {"train_loss": -28.398351669311523, "global_step": 658925, "epoch": 7938} {"train_loss": -28.468063354492188, "global_step": 658926, "epoch": 7938} {"train_loss": -28.33111000061035, "global_step": 658927, "epoch": 7938} {"train_loss": -28.41318130493164, "global_step": 658928, "epoch": 7938} {"train_loss": -27.946060180664062, "global_step": 658929, "epoch": 7938} {"train_loss": -27.910696029663086, "global_step": 658930, "epoch": 7938} {"train_loss": -28.091588973999023, "global_step": 658931, "epoch": 7938} {"train_loss": -28.266000747680664, "global_step": 658932, "epoch": 7938} {"train_loss": -27.892175674438477, "global_step": 658933, "epoch": 7938} {"train_loss": -28.39410972595215, "global_step": 658934, "epoch": 7938} {"train_loss": -28.09819984436035, "global_step": 658935, "epoch": 7938} {"train_loss": -28.0238077324557, "global_step": 658936, "epoch": 7938, "val_loss": 6673672.0} {"train_loss": -26.29886817932129, "global_step": 658937, "epoch": 7939} {"train_loss": -26.29511833190918, "global_step": 658938, "epoch": 7939} {"train_loss": -26.665863037109375, "global_step": 658939, "epoch": 7939} {"train_loss": -27.598669052124023, "global_step": 658940, "epoch": 7939} {"train_loss": -26.730178833007812, "global_step": 658941, "epoch": 7939} {"train_loss": -27.04231071472168, "global_step": 658942, "epoch": 7939} {"train_loss": -27.90329360961914, "global_step": 658943, "epoch": 7939} {"train_loss": -27.472248077392578, "global_step": 658944, "epoch": 7939} {"train_loss": -27.364227294921875, "global_step": 658945, "epoch": 7939} {"train_loss": -27.698461532592773, "global_step": 658946, "epoch": 7939} {"train_loss": -27.747974395751953, "global_step": 658947, "epoch": 7939} {"train_loss": -27.778533935546875, "global_step": 658948, "epoch": 7939} {"train_loss": -28.15948486328125, "global_step": 658949, "epoch": 7939} {"train_loss": -27.855239868164062, "global_step": 658950, "epoch": 7939} {"train_loss": -28.1335391998291, "global_step": 658951, "epoch": 7939} {"train_loss": -27.842432022094727, "global_step": 658952, "epoch": 7939} {"train_loss": -28.106103897094727, "global_step": 658953, "epoch": 7939} {"train_loss": -27.954809188842773, "global_step": 658954, "epoch": 7939} {"train_loss": -27.698293685913086, "global_step": 658955, "epoch": 7939} {"train_loss": -27.98822021484375, "global_step": 658956, "epoch": 7939} {"train_loss": -27.82291030883789, "global_step": 658957, "epoch": 7939} {"train_loss": -28.209997177124023, "global_step": 658958, "epoch": 7939} {"train_loss": -28.065860748291016, "global_step": 658959, "epoch": 7939} {"train_loss": -27.480817794799805, "global_step": 658960, "epoch": 7939} {"train_loss": -27.750165939331055, "global_step": 658961, "epoch": 7939} {"train_loss": -28.528121948242188, "global_step": 658962, "epoch": 7939} {"train_loss": -28.093414306640625, "global_step": 658963, "epoch": 7939} {"train_loss": -28.1326847076416, "global_step": 658964, "epoch": 7939} {"train_loss": -28.45784568786621, "global_step": 658965, "epoch": 7939} {"train_loss": -28.1461238861084, "global_step": 658966, "epoch": 7939} {"train_loss": -28.211151123046875, "global_step": 658967, "epoch": 7939} {"train_loss": -28.18682861328125, "global_step": 658968, "epoch": 7939} {"train_loss": -28.387292861938477, "global_step": 658969, "epoch": 7939} {"train_loss": -28.42752456665039, "global_step": 658970, "epoch": 7939} {"train_loss": -28.564062118530273, "global_step": 658971, "epoch": 7939} {"train_loss": -28.324432373046875, "global_step": 658972, "epoch": 7939} {"train_loss": -28.20270347595215, "global_step": 658973, "epoch": 7939} {"train_loss": -28.35869789123535, "global_step": 658974, "epoch": 7939} {"train_loss": -28.611469268798828, "global_step": 658975, "epoch": 7939} {"train_loss": -28.31650733947754, "global_step": 658976, "epoch": 7939} {"train_loss": -28.05621910095215, "global_step": 658977, "epoch": 7939} {"train_loss": -28.403745651245117, "global_step": 658978, "epoch": 7939} {"train_loss": -28.0833683013916, "global_step": 658979, "epoch": 7939} {"train_loss": -28.487960815429688, "global_step": 658980, "epoch": 7939} {"train_loss": -28.571523666381836, "global_step": 658981, "epoch": 7939} {"train_loss": -28.46625328063965, "global_step": 658982, "epoch": 7939} {"train_loss": -27.945627212524414, "global_step": 658983, "epoch": 7939} {"train_loss": -28.06183433532715, "global_step": 658984, "epoch": 7939} {"train_loss": -28.185094833374023, "global_step": 658985, "epoch": 7939} {"train_loss": -28.16756248474121, "global_step": 658986, "epoch": 7939} {"train_loss": -28.056427001953125, "global_step": 658987, "epoch": 7939} {"train_loss": -28.689041137695312, "global_step": 658988, "epoch": 7939} {"train_loss": -28.330432891845703, "global_step": 658989, "epoch": 7939} {"train_loss": -28.30548667907715, "global_step": 658990, "epoch": 7939} {"train_loss": -28.244497299194336, "global_step": 658991, "epoch": 7939} {"train_loss": -28.444692611694336, "global_step": 658992, "epoch": 7939} {"train_loss": -28.392297744750977, "global_step": 658993, "epoch": 7939} {"train_loss": -28.283588409423828, "global_step": 658994, "epoch": 7939} {"train_loss": -28.764490127563477, "global_step": 658995, "epoch": 7939} {"train_loss": -28.405210494995117, "global_step": 658996, "epoch": 7939} {"train_loss": -28.49030876159668, "global_step": 658997, "epoch": 7939} {"train_loss": -28.491979598999023, "global_step": 658998, "epoch": 7939} {"train_loss": -28.619226455688477, "global_step": 658999, "epoch": 7939} {"train_loss": -28.5258731842041, "global_step": 659000, "epoch": 7939} {"train_loss": -28.70975112915039, "global_step": 659001, "epoch": 7939} {"train_loss": -28.580097198486328, "global_step": 659002, "epoch": 7939} {"train_loss": -28.3351993560791, "global_step": 659003, "epoch": 7939} {"train_loss": -28.74128532409668, "global_step": 659004, "epoch": 7939} {"train_loss": -28.507394790649414, "global_step": 659005, "epoch": 7939} {"train_loss": -28.384063720703125, "global_step": 659006, "epoch": 7939} {"train_loss": -28.370990753173828, "global_step": 659007, "epoch": 7939} {"train_loss": -28.223936080932617, "global_step": 659008, "epoch": 7939} {"train_loss": -27.791095733642578, "global_step": 659009, "epoch": 7939} {"train_loss": -27.37708854675293, "global_step": 659010, "epoch": 7939} {"train_loss": -27.6424503326416, "global_step": 659011, "epoch": 7939} {"train_loss": -27.454198837280273, "global_step": 659012, "epoch": 7939} {"train_loss": -28.31072998046875, "global_step": 659013, "epoch": 7939} {"train_loss": -28.315073013305664, "global_step": 659014, "epoch": 7939} {"train_loss": -27.776037216186523, "global_step": 659015, "epoch": 7939} {"train_loss": -28.213712692260742, "global_step": 659016, "epoch": 7939} {"train_loss": -27.98870849609375, "global_step": 659017, "epoch": 7939} {"train_loss": -28.138898849487305, "global_step": 659018, "epoch": 7939} {"train_loss": -28.060169403811535, "global_step": 659019, "epoch": 7939, "val_loss": 7018105.5} {"train_loss": -28.21158218383789, "global_step": 659020, "epoch": 7940} {"train_loss": -28.055952072143555, "global_step": 659021, "epoch": 7940} {"train_loss": -28.11044692993164, "global_step": 659022, "epoch": 7940} {"train_loss": -28.154815673828125, "global_step": 659023, "epoch": 7940} {"train_loss": -28.157562255859375, "global_step": 659024, "epoch": 7940} {"train_loss": -27.906036376953125, "global_step": 659025, "epoch": 7940} {"train_loss": -27.88507080078125, "global_step": 659026, "epoch": 7940} {"train_loss": -28.1634578704834, "global_step": 659027, "epoch": 7940} {"train_loss": -28.003332138061523, "global_step": 659028, "epoch": 7940} {"train_loss": -28.24921989440918, "global_step": 659029, "epoch": 7940} {"train_loss": -28.07965660095215, "global_step": 659030, "epoch": 7940} {"train_loss": -28.52724266052246, "global_step": 659031, "epoch": 7940} {"train_loss": -27.865955352783203, "global_step": 659032, "epoch": 7940} {"train_loss": -28.334518432617188, "global_step": 659033, "epoch": 7940} {"train_loss": -28.607730865478516, "global_step": 659034, "epoch": 7940} {"train_loss": -28.474292755126953, "global_step": 659035, "epoch": 7940} {"train_loss": -28.682952880859375, "global_step": 659036, "epoch": 7940} {"train_loss": -28.180280685424805, "global_step": 659037, "epoch": 7940} {"train_loss": -27.902236938476562, "global_step": 659038, "epoch": 7940} {"train_loss": -28.13162612915039, "global_step": 659039, "epoch": 7940} {"train_loss": -28.218219757080078, "global_step": 659040, "epoch": 7940} {"train_loss": -28.24976921081543, "global_step": 659041, "epoch": 7940} {"train_loss": -28.247650146484375, "global_step": 659042, "epoch": 7940} {"train_loss": -28.392562866210938, "global_step": 659043, "epoch": 7940} {"train_loss": -28.653242111206055, "global_step": 659044, "epoch": 7940} {"train_loss": -28.06475830078125, "global_step": 659045, "epoch": 7940} {"train_loss": -28.19733238220215, "global_step": 659046, "epoch": 7940} {"train_loss": -28.09119987487793, "global_step": 659047, "epoch": 7940} {"train_loss": -27.758228302001953, "global_step": 659048, "epoch": 7940} {"train_loss": -28.23287010192871, "global_step": 659049, "epoch": 7940} {"train_loss": -28.360227584838867, "global_step": 659050, "epoch": 7940} {"train_loss": -28.0447940826416, "global_step": 659051, "epoch": 7940} {"train_loss": -28.28215980529785, "global_step": 659052, "epoch": 7940} {"train_loss": -28.115802764892578, "global_step": 659053, "epoch": 7940} {"train_loss": -28.447717666625977, "global_step": 659054, "epoch": 7940} {"train_loss": -28.498044967651367, "global_step": 659055, "epoch": 7940} {"train_loss": -27.956396102905273, "global_step": 659056, "epoch": 7940} {"train_loss": -28.51123046875, "global_step": 659057, "epoch": 7940} {"train_loss": -28.276294708251953, "global_step": 659058, "epoch": 7940} {"train_loss": -28.30859375, "global_step": 659059, "epoch": 7940} {"train_loss": -27.9798526763916, "global_step": 659060, "epoch": 7940} {"train_loss": -28.309585571289062, "global_step": 659061, "epoch": 7940} {"train_loss": -28.608301162719727, "global_step": 659062, "epoch": 7940} {"train_loss": -28.44440269470215, "global_step": 659063, "epoch": 7940} {"train_loss": -28.143823623657227, "global_step": 659064, "epoch": 7940} {"train_loss": -28.21247673034668, "global_step": 659065, "epoch": 7940} {"train_loss": -28.003713607788086, "global_step": 659066, "epoch": 7940} {"train_loss": -28.716821670532227, "global_step": 659067, "epoch": 7940} {"train_loss": -28.6409912109375, "global_step": 659068, "epoch": 7940} {"train_loss": -28.83563804626465, "global_step": 659069, "epoch": 7940} {"train_loss": -28.110950469970703, "global_step": 659070, "epoch": 7940} {"train_loss": -28.69976234436035, "global_step": 659071, "epoch": 7940} {"train_loss": -28.4041690826416, "global_step": 659072, "epoch": 7940} {"train_loss": -28.33233642578125, "global_step": 659073, "epoch": 7940} {"train_loss": -28.36859703063965, "global_step": 659074, "epoch": 7940} {"train_loss": -28.10920524597168, "global_step": 659075, "epoch": 7940} {"train_loss": -27.404096603393555, "global_step": 659076, "epoch": 7940} {"train_loss": -26.931472778320312, "global_step": 659077, "epoch": 7940} {"train_loss": -27.538442611694336, "global_step": 659078, "epoch": 7940} {"train_loss": -27.680044174194336, "global_step": 659079, "epoch": 7940} {"train_loss": -28.462751388549805, "global_step": 659080, "epoch": 7940} {"train_loss": -27.466650009155273, "global_step": 659081, "epoch": 7940} {"train_loss": -28.103784561157227, "global_step": 659082, "epoch": 7940} {"train_loss": -28.043975830078125, "global_step": 659083, "epoch": 7940} {"train_loss": -28.1381778717041, "global_step": 659084, "epoch": 7940} {"train_loss": -28.37869644165039, "global_step": 659085, "epoch": 7940} {"train_loss": -28.013471603393555, "global_step": 659086, "epoch": 7940} {"train_loss": -28.620222091674805, "global_step": 659087, "epoch": 7940} {"train_loss": -27.98505210876465, "global_step": 659088, "epoch": 7940} {"train_loss": -28.263355255126953, "global_step": 659089, "epoch": 7940} {"train_loss": -28.126346588134766, "global_step": 659090, "epoch": 7940} {"train_loss": -28.0526065826416, "global_step": 659091, "epoch": 7940} {"train_loss": -28.241352081298828, "global_step": 659092, "epoch": 7940} {"train_loss": -27.8103084564209, "global_step": 659093, "epoch": 7940} {"train_loss": -28.10530662536621, "global_step": 659094, "epoch": 7940} {"train_loss": -28.459701538085938, "global_step": 659095, "epoch": 7940} {"train_loss": -28.331684112548828, "global_step": 659096, "epoch": 7940} {"train_loss": -28.018280029296875, "global_step": 659097, "epoch": 7940} {"train_loss": -28.69337272644043, "global_step": 659098, "epoch": 7940} {"train_loss": -28.24788475036621, "global_step": 659099, "epoch": 7940} {"train_loss": -28.35089683532715, "global_step": 659100, "epoch": 7940} {"train_loss": -28.594091415405273, "global_step": 659101, "epoch": 7940} {"train_loss": -28.206583298832538, "global_step": 659102, "epoch": 7940, "val_loss": 6943998.5} {"train_loss": -27.977731704711914, "global_step": 659103, "epoch": 7941} {"train_loss": -27.635366439819336, "global_step": 659104, "epoch": 7941} {"train_loss": -28.030841827392578, "global_step": 659105, "epoch": 7941} {"train_loss": -27.85334587097168, "global_step": 659106, "epoch": 7941} {"train_loss": -28.01581382751465, "global_step": 659107, "epoch": 7941} {"train_loss": -28.121662139892578, "global_step": 659108, "epoch": 7941} {"train_loss": -28.1879940032959, "global_step": 659109, "epoch": 7941} {"train_loss": -27.909656524658203, "global_step": 659110, "epoch": 7941} {"train_loss": -27.962106704711914, "global_step": 659111, "epoch": 7941} {"train_loss": -28.026569366455078, "global_step": 659112, "epoch": 7941} {"train_loss": -27.87007713317871, "global_step": 659113, "epoch": 7941} {"train_loss": -28.30740737915039, "global_step": 659114, "epoch": 7941} {"train_loss": -28.0152645111084, "global_step": 659115, "epoch": 7941} {"train_loss": -28.203826904296875, "global_step": 659116, "epoch": 7941} {"train_loss": -28.320987701416016, "global_step": 659117, "epoch": 7941} {"train_loss": -28.23636245727539, "global_step": 659118, "epoch": 7941} {"train_loss": -28.264175415039062, "global_step": 659119, "epoch": 7941} {"train_loss": -28.217376708984375, "global_step": 659120, "epoch": 7941} {"train_loss": -28.24945640563965, "global_step": 659121, "epoch": 7941} {"train_loss": -27.912885665893555, "global_step": 659122, "epoch": 7941} {"train_loss": -28.59588623046875, "global_step": 659123, "epoch": 7941} {"train_loss": -28.00537109375, "global_step": 659124, "epoch": 7941} {"train_loss": -28.32012367248535, "global_step": 659125, "epoch": 7941} {"train_loss": -28.050268173217773, "global_step": 659126, "epoch": 7941} {"train_loss": -28.306354522705078, "global_step": 659127, "epoch": 7941} {"train_loss": -27.984130859375, "global_step": 659128, "epoch": 7941} {"train_loss": -28.671247482299805, "global_step": 659129, "epoch": 7941} {"train_loss": -28.4609432220459, "global_step": 659130, "epoch": 7941} {"train_loss": -28.36846923828125, "global_step": 659131, "epoch": 7941} {"train_loss": -28.518177032470703, "global_step": 659132, "epoch": 7941} {"train_loss": -28.534042358398438, "global_step": 659133, "epoch": 7941} {"train_loss": -28.272165298461914, "global_step": 659134, "epoch": 7941} {"train_loss": -28.17949867248535, "global_step": 659135, "epoch": 7941} {"train_loss": -28.47369956970215, "global_step": 659136, "epoch": 7941} {"train_loss": -28.602476119995117, "global_step": 659137, "epoch": 7941} {"train_loss": -28.360645294189453, "global_step": 659138, "epoch": 7941} {"train_loss": -28.45818519592285, "global_step": 659139, "epoch": 7941} {"train_loss": -28.330427169799805, "global_step": 659140, "epoch": 7941} {"train_loss": -28.516881942749023, "global_step": 659141, "epoch": 7941} {"train_loss": -28.604084014892578, "global_step": 659142, "epoch": 7941} {"train_loss": -28.648120880126953, "global_step": 659143, "epoch": 7941} {"train_loss": -28.153934478759766, "global_step": 659144, "epoch": 7941} {"train_loss": -28.553186416625977, "global_step": 659145, "epoch": 7941} {"train_loss": -28.208642959594727, "global_step": 659146, "epoch": 7941} {"train_loss": -28.455896377563477, "global_step": 659147, "epoch": 7941} {"train_loss": -28.45584487915039, "global_step": 659148, "epoch": 7941} {"train_loss": -28.478681564331055, "global_step": 659149, "epoch": 7941} {"train_loss": -28.485631942749023, "global_step": 659150, "epoch": 7941} {"train_loss": -28.55544090270996, "global_step": 659151, "epoch": 7941} {"train_loss": -28.770832061767578, "global_step": 659152, "epoch": 7941} {"train_loss": -28.52667808532715, "global_step": 659153, "epoch": 7941} {"train_loss": -28.206079483032227, "global_step": 659154, "epoch": 7941} {"train_loss": -28.360137939453125, "global_step": 659155, "epoch": 7941} {"train_loss": -28.295856475830078, "global_step": 659156, "epoch": 7941} {"train_loss": -28.082990646362305, "global_step": 659157, "epoch": 7941} {"train_loss": -27.776554107666016, "global_step": 659158, "epoch": 7941} {"train_loss": -27.933698654174805, "global_step": 659159, "epoch": 7941} {"train_loss": -28.04532814025879, "global_step": 659160, "epoch": 7941} {"train_loss": -27.890954971313477, "global_step": 659161, "epoch": 7941} {"train_loss": -28.597822189331055, "global_step": 659162, "epoch": 7941} {"train_loss": -28.379627227783203, "global_step": 659163, "epoch": 7941} {"train_loss": -28.210172653198242, "global_step": 659164, "epoch": 7941} {"train_loss": -28.080793380737305, "global_step": 659165, "epoch": 7941} {"train_loss": -27.61408805847168, "global_step": 659166, "epoch": 7941} {"train_loss": -28.39410400390625, "global_step": 659167, "epoch": 7941} {"train_loss": -28.5107479095459, "global_step": 659168, "epoch": 7941} {"train_loss": -28.2543888092041, "global_step": 659169, "epoch": 7941} {"train_loss": -28.672561645507812, "global_step": 659170, "epoch": 7941} {"train_loss": -28.55177116394043, "global_step": 659171, "epoch": 7941} {"train_loss": -28.352338790893555, "global_step": 659172, "epoch": 7941} {"train_loss": -28.039411544799805, "global_step": 659173, "epoch": 7941} {"train_loss": -27.933242797851562, "global_step": 659174, "epoch": 7941} {"train_loss": -28.53143882751465, "global_step": 659175, "epoch": 7941} {"train_loss": -28.60257339477539, "global_step": 659176, "epoch": 7941} {"train_loss": -28.128875732421875, "global_step": 659177, "epoch": 7941} {"train_loss": -28.266101837158203, "global_step": 659178, "epoch": 7941} {"train_loss": -28.30586051940918, "global_step": 659179, "epoch": 7941} {"train_loss": -28.2540225982666, "global_step": 659180, "epoch": 7941} {"train_loss": -28.388580322265625, "global_step": 659181, "epoch": 7941} {"train_loss": -28.393171310424805, "global_step": 659182, "epoch": 7941} {"train_loss": -28.098316192626953, "global_step": 659183, "epoch": 7941} {"train_loss": -28.080219268798828, "global_step": 659184, "epoch": 7941} {"train_loss": -28.237366779741034, "global_step": 659185, "epoch": 7941, "val_loss": 6941539.0} {"train_loss": -27.061248779296875, "global_step": 659186, "epoch": 7942} {"train_loss": -27.098220825195312, "global_step": 659187, "epoch": 7942} {"train_loss": -27.902372360229492, "global_step": 659188, "epoch": 7942} {"train_loss": -27.963672637939453, "global_step": 659189, "epoch": 7942} {"train_loss": -26.817136764526367, "global_step": 659190, "epoch": 7942} {"train_loss": -28.48880386352539, "global_step": 659191, "epoch": 7942} {"train_loss": -27.659286499023438, "global_step": 659192, "epoch": 7942} {"train_loss": -27.864927291870117, "global_step": 659193, "epoch": 7942} {"train_loss": -28.463150024414062, "global_step": 659194, "epoch": 7942} {"train_loss": -27.999011993408203, "global_step": 659195, "epoch": 7942} {"train_loss": -28.00495719909668, "global_step": 659196, "epoch": 7942} {"train_loss": -27.546594619750977, "global_step": 659197, "epoch": 7942} {"train_loss": -27.704389572143555, "global_step": 659198, "epoch": 7942} {"train_loss": -27.700164794921875, "global_step": 659199, "epoch": 7942} {"train_loss": -28.209980010986328, "global_step": 659200, "epoch": 7942} {"train_loss": -28.218231201171875, "global_step": 659201, "epoch": 7942} {"train_loss": -28.1453857421875, "global_step": 659202, "epoch": 7942} {"train_loss": -27.692874908447266, "global_step": 659203, "epoch": 7942} {"train_loss": -27.907272338867188, "global_step": 659204, "epoch": 7942} {"train_loss": -28.206037521362305, "global_step": 659205, "epoch": 7942} {"train_loss": -28.041040420532227, "global_step": 659206, "epoch": 7942} {"train_loss": -28.31084632873535, "global_step": 659207, "epoch": 7942} {"train_loss": -28.247434616088867, "global_step": 659208, "epoch": 7942} {"train_loss": -28.084508895874023, "global_step": 659209, "epoch": 7942} {"train_loss": -28.561914443969727, "global_step": 659210, "epoch": 7942} {"train_loss": -28.4432373046875, "global_step": 659211, "epoch": 7942} {"train_loss": -28.339380264282227, "global_step": 659212, "epoch": 7942} {"train_loss": -28.209054946899414, "global_step": 659213, "epoch": 7942} {"train_loss": -28.366931915283203, "global_step": 659214, "epoch": 7942} {"train_loss": -27.799062728881836, "global_step": 659215, "epoch": 7942} {"train_loss": -28.25577163696289, "global_step": 659216, "epoch": 7942} {"train_loss": -28.22806167602539, "global_step": 659217, "epoch": 7942} {"train_loss": -28.707611083984375, "global_step": 659218, "epoch": 7942} {"train_loss": -28.557104110717773, "global_step": 659219, "epoch": 7942} {"train_loss": -27.999256134033203, "global_step": 659220, "epoch": 7942} {"train_loss": -28.504932403564453, "global_step": 659221, "epoch": 7942} {"train_loss": -28.158466339111328, "global_step": 659222, "epoch": 7942} {"train_loss": -28.281524658203125, "global_step": 659223, "epoch": 7942} {"train_loss": -28.187047958374023, "global_step": 659224, "epoch": 7942} {"train_loss": -28.234134674072266, "global_step": 659225, "epoch": 7942} {"train_loss": -28.583831787109375, "global_step": 659226, "epoch": 7942} {"train_loss": -28.434598922729492, "global_step": 659227, "epoch": 7942} {"train_loss": -28.702716827392578, "global_step": 659228, "epoch": 7942} {"train_loss": -28.455078125, "global_step": 659229, "epoch": 7942} {"train_loss": -28.53653335571289, "global_step": 659230, "epoch": 7942} {"train_loss": -27.955982208251953, "global_step": 659231, "epoch": 7942} {"train_loss": -28.369369506835938, "global_step": 659232, "epoch": 7942} {"train_loss": -28.46558952331543, "global_step": 659233, "epoch": 7942} {"train_loss": -28.40167808532715, "global_step": 659234, "epoch": 7942} {"train_loss": -28.703235626220703, "global_step": 659235, "epoch": 7942} {"train_loss": -28.17316246032715, "global_step": 659236, "epoch": 7942} {"train_loss": -28.824066162109375, "global_step": 659237, "epoch": 7942} {"train_loss": -28.404972076416016, "global_step": 659238, "epoch": 7942} {"train_loss": -28.800649642944336, "global_step": 659239, "epoch": 7942} {"train_loss": -28.407638549804688, "global_step": 659240, "epoch": 7942} {"train_loss": -28.535919189453125, "global_step": 659241, "epoch": 7942} {"train_loss": -28.65840721130371, "global_step": 659242, "epoch": 7942} {"train_loss": -28.315282821655273, "global_step": 659243, "epoch": 7942} {"train_loss": -28.665857315063477, "global_step": 659244, "epoch": 7942} {"train_loss": -28.839221954345703, "global_step": 659245, "epoch": 7942} {"train_loss": -28.3621768951416, "global_step": 659246, "epoch": 7942} {"train_loss": -27.941049575805664, "global_step": 659247, "epoch": 7942} {"train_loss": -28.326557159423828, "global_step": 659248, "epoch": 7942} {"train_loss": -28.5811824798584, "global_step": 659249, "epoch": 7942} {"train_loss": -28.641525268554688, "global_step": 659250, "epoch": 7942} {"train_loss": -28.185876846313477, "global_step": 659251, "epoch": 7942} {"train_loss": -28.311771392822266, "global_step": 659252, "epoch": 7942} {"train_loss": -28.20942497253418, "global_step": 659253, "epoch": 7942} {"train_loss": -28.06294059753418, "global_step": 659254, "epoch": 7942} {"train_loss": -27.92429542541504, "global_step": 659255, "epoch": 7942} {"train_loss": -27.181732177734375, "global_step": 659256, "epoch": 7942} {"train_loss": -26.836755752563477, "global_step": 659257, "epoch": 7942} {"train_loss": -27.910043716430664, "global_step": 659258, "epoch": 7942} {"train_loss": -28.47284507751465, "global_step": 659259, "epoch": 7942} {"train_loss": -27.885358810424805, "global_step": 659260, "epoch": 7942} {"train_loss": -27.952844619750977, "global_step": 659261, "epoch": 7942} {"train_loss": -28.10738182067871, "global_step": 659262, "epoch": 7942} {"train_loss": -28.28156852722168, "global_step": 659263, "epoch": 7942} {"train_loss": -27.90815544128418, "global_step": 659264, "epoch": 7942} {"train_loss": -28.00135612487793, "global_step": 659265, "epoch": 7942} {"train_loss": -27.623416900634766, "global_step": 659266, "epoch": 7942} {"train_loss": -28.538557052612305, "global_step": 659267, "epoch": 7942} {"train_loss": -28.152461546013154, "global_step": 659268, "epoch": 7942, "val_loss": 7000325.0} {"train_loss": -27.411901473999023, "global_step": 659269, "epoch": 7943} {"train_loss": -26.853113174438477, "global_step": 659270, "epoch": 7943} {"train_loss": -27.741193771362305, "global_step": 659271, "epoch": 7943} {"train_loss": -27.099756240844727, "global_step": 659272, "epoch": 7943} {"train_loss": -27.988941192626953, "global_step": 659273, "epoch": 7943} {"train_loss": -27.5909481048584, "global_step": 659274, "epoch": 7943} {"train_loss": -27.72163200378418, "global_step": 659275, "epoch": 7943} {"train_loss": -27.6051082611084, "global_step": 659276, "epoch": 7943} {"train_loss": -27.613666534423828, "global_step": 659277, "epoch": 7943} {"train_loss": -27.849781036376953, "global_step": 659278, "epoch": 7943} {"train_loss": -27.09503746032715, "global_step": 659279, "epoch": 7943} {"train_loss": -26.694326400756836, "global_step": 659280, "epoch": 7943} {"train_loss": -27.578937530517578, "global_step": 659281, "epoch": 7943} {"train_loss": -27.859256744384766, "global_step": 659282, "epoch": 7943} {"train_loss": -27.98175621032715, "global_step": 659283, "epoch": 7943} {"train_loss": -27.451690673828125, "global_step": 659284, "epoch": 7943} {"train_loss": -27.95717430114746, "global_step": 659285, "epoch": 7943} {"train_loss": -27.656835556030273, "global_step": 659286, "epoch": 7943} {"train_loss": -27.465856552124023, "global_step": 659287, "epoch": 7943} {"train_loss": -28.009557723999023, "global_step": 659288, "epoch": 7943} {"train_loss": -27.854032516479492, "global_step": 659289, "epoch": 7943} {"train_loss": -27.914464950561523, "global_step": 659290, "epoch": 7943} {"train_loss": -28.066137313842773, "global_step": 659291, "epoch": 7943} {"train_loss": -27.68181800842285, "global_step": 659292, "epoch": 7943} {"train_loss": -27.892990112304688, "global_step": 659293, "epoch": 7943} {"train_loss": -27.861127853393555, "global_step": 659294, "epoch": 7943} {"train_loss": -28.208593368530273, "global_step": 659295, "epoch": 7943} {"train_loss": -27.816120147705078, "global_step": 659296, "epoch": 7943} {"train_loss": -28.16278648376465, "global_step": 659297, "epoch": 7943} {"train_loss": -28.05596351623535, "global_step": 659298, "epoch": 7943} {"train_loss": -28.01568603515625, "global_step": 659299, "epoch": 7943} {"train_loss": -28.160064697265625, "global_step": 659300, "epoch": 7943} {"train_loss": -28.156320571899414, "global_step": 659301, "epoch": 7943} {"train_loss": -28.174758911132812, "global_step": 659302, "epoch": 7943} {"train_loss": -27.7904052734375, "global_step": 659303, "epoch": 7943} {"train_loss": -28.07276725769043, "global_step": 659304, "epoch": 7943} {"train_loss": -28.405780792236328, "global_step": 659305, "epoch": 7943} {"train_loss": -28.352888107299805, "global_step": 659306, "epoch": 7943} {"train_loss": -28.003986358642578, "global_step": 659307, "epoch": 7943} {"train_loss": -28.137887954711914, "global_step": 659308, "epoch": 7943} {"train_loss": -28.365650177001953, "global_step": 659309, "epoch": 7943} {"train_loss": -28.281452178955078, "global_step": 659310, "epoch": 7943} {"train_loss": -28.52858543395996, "global_step": 659311, "epoch": 7943} {"train_loss": -28.396636962890625, "global_step": 659312, "epoch": 7943} {"train_loss": -28.3601016998291, "global_step": 659313, "epoch": 7943} {"train_loss": -28.403961181640625, "global_step": 659314, "epoch": 7943} {"train_loss": -28.206668853759766, "global_step": 659315, "epoch": 7943} {"train_loss": -28.162946701049805, "global_step": 659316, "epoch": 7943} {"train_loss": -28.661035537719727, "global_step": 659317, "epoch": 7943} {"train_loss": -28.36669921875, "global_step": 659318, "epoch": 7943} {"train_loss": -28.56268882751465, "global_step": 659319, "epoch": 7943} {"train_loss": -28.497201919555664, "global_step": 659320, "epoch": 7943} {"train_loss": -28.24798583984375, "global_step": 659321, "epoch": 7943} {"train_loss": -28.20672035217285, "global_step": 659322, "epoch": 7943} {"train_loss": -28.259103775024414, "global_step": 659323, "epoch": 7943} {"train_loss": -28.524396896362305, "global_step": 659324, "epoch": 7943} {"train_loss": -28.875003814697266, "global_step": 659325, "epoch": 7943} {"train_loss": -28.28476333618164, "global_step": 659326, "epoch": 7943} {"train_loss": -28.53497886657715, "global_step": 659327, "epoch": 7943} {"train_loss": -28.62003517150879, "global_step": 659328, "epoch": 7943} {"train_loss": -28.723791122436523, "global_step": 659329, "epoch": 7943} {"train_loss": -28.429492950439453, "global_step": 659330, "epoch": 7943} {"train_loss": -28.419218063354492, "global_step": 659331, "epoch": 7943} {"train_loss": -28.44187355041504, "global_step": 659332, "epoch": 7943} {"train_loss": -28.437488555908203, "global_step": 659333, "epoch": 7943} {"train_loss": -28.4272403717041, "global_step": 659334, "epoch": 7943} {"train_loss": -28.139501571655273, "global_step": 659335, "epoch": 7943} {"train_loss": -27.982330322265625, "global_step": 659336, "epoch": 7943} {"train_loss": -27.708393096923828, "global_step": 659337, "epoch": 7943} {"train_loss": -28.229955673217773, "global_step": 659338, "epoch": 7943} {"train_loss": -28.027328491210938, "global_step": 659339, "epoch": 7943} {"train_loss": -28.1096248626709, "global_step": 659340, "epoch": 7943} {"train_loss": -28.525110244750977, "global_step": 659341, "epoch": 7943} {"train_loss": -28.142419815063477, "global_step": 659342, "epoch": 7943} {"train_loss": -28.01837730407715, "global_step": 659343, "epoch": 7943} {"train_loss": -27.695859909057617, "global_step": 659344, "epoch": 7943} {"train_loss": -28.267663955688477, "global_step": 659345, "epoch": 7943} {"train_loss": -28.288074493408203, "global_step": 659346, "epoch": 7943} {"train_loss": -27.881723403930664, "global_step": 659347, "epoch": 7943} {"train_loss": -28.800973892211914, "global_step": 659348, "epoch": 7943} {"train_loss": -28.19074821472168, "global_step": 659349, "epoch": 7943} {"train_loss": -28.776966094970703, "global_step": 659350, "epoch": 7943} {"train_loss": -28.085360676409252, "global_step": 659351, "epoch": 7943, "val_loss": 6839096.0} {"train_loss": -28.03521728515625, "global_step": 659352, "epoch": 7944} {"train_loss": -28.252050399780273, "global_step": 659353, "epoch": 7944} {"train_loss": -28.498132705688477, "global_step": 659354, "epoch": 7944} {"train_loss": -27.9267635345459, "global_step": 659355, "epoch": 7944} {"train_loss": -28.006000518798828, "global_step": 659356, "epoch": 7944} {"train_loss": -28.088693618774414, "global_step": 659357, "epoch": 7944} {"train_loss": -27.941293716430664, "global_step": 659358, "epoch": 7944} {"train_loss": -27.7376766204834, "global_step": 659359, "epoch": 7944} {"train_loss": -27.722431182861328, "global_step": 659360, "epoch": 7944} {"train_loss": -27.916418075561523, "global_step": 659361, "epoch": 7944} {"train_loss": -27.624988555908203, "global_step": 659362, "epoch": 7944} {"train_loss": -28.088659286499023, "global_step": 659363, "epoch": 7944} {"train_loss": -28.330148696899414, "global_step": 659364, "epoch": 7944} {"train_loss": -27.355789184570312, "global_step": 659365, "epoch": 7944} {"train_loss": -27.045700073242188, "global_step": 659366, "epoch": 7944} {"train_loss": -28.076868057250977, "global_step": 659367, "epoch": 7944} {"train_loss": -28.333662033081055, "global_step": 659368, "epoch": 7944} {"train_loss": -27.750207901000977, "global_step": 659369, "epoch": 7944} {"train_loss": -27.94512939453125, "global_step": 659370, "epoch": 7944} {"train_loss": -28.140527725219727, "global_step": 659371, "epoch": 7944} {"train_loss": -28.209623336791992, "global_step": 659372, "epoch": 7944} {"train_loss": -28.365957260131836, "global_step": 659373, "epoch": 7944} {"train_loss": -28.237869262695312, "global_step": 659374, "epoch": 7944} {"train_loss": -27.883153915405273, "global_step": 659375, "epoch": 7944} {"train_loss": -28.29290199279785, "global_step": 659376, "epoch": 7944} {"train_loss": -28.135679244995117, "global_step": 659377, "epoch": 7944} {"train_loss": -28.21213722229004, "global_step": 659378, "epoch": 7944} {"train_loss": -28.191328048706055, "global_step": 659379, "epoch": 7944} {"train_loss": -28.406879425048828, "global_step": 659380, "epoch": 7944} {"train_loss": -28.208261489868164, "global_step": 659381, "epoch": 7944} {"train_loss": -28.632526397705078, "global_step": 659382, "epoch": 7944} {"train_loss": -28.130529403686523, "global_step": 659383, "epoch": 7944} {"train_loss": -28.584625244140625, "global_step": 659384, "epoch": 7944} {"train_loss": -28.067218780517578, "global_step": 659385, "epoch": 7944} {"train_loss": -28.6051025390625, "global_step": 659386, "epoch": 7944} {"train_loss": -28.1491756439209, "global_step": 659387, "epoch": 7944} {"train_loss": -28.159460067749023, "global_step": 659388, "epoch": 7944} {"train_loss": -28.396310806274414, "global_step": 659389, "epoch": 7944} {"train_loss": -28.5216064453125, "global_step": 659390, "epoch": 7944} {"train_loss": -27.981658935546875, "global_step": 659391, "epoch": 7944} {"train_loss": -28.239953994750977, "global_step": 659392, "epoch": 7944} {"train_loss": -28.348485946655273, "global_step": 659393, "epoch": 7944} {"train_loss": -28.632131576538086, "global_step": 659394, "epoch": 7944} {"train_loss": -28.106359481811523, "global_step": 659395, "epoch": 7944} {"train_loss": -28.32649040222168, "global_step": 659396, "epoch": 7944} {"train_loss": -28.21197509765625, "global_step": 659397, "epoch": 7944} {"train_loss": -27.976919174194336, "global_step": 659398, "epoch": 7944} {"train_loss": -28.309293746948242, "global_step": 659399, "epoch": 7944} {"train_loss": -28.652841567993164, "global_step": 659400, "epoch": 7944} {"train_loss": -28.660425186157227, "global_step": 659401, "epoch": 7944} {"train_loss": -28.3510684967041, "global_step": 659402, "epoch": 7944} {"train_loss": -28.314163208007812, "global_step": 659403, "epoch": 7944} {"train_loss": -28.582563400268555, "global_step": 659404, "epoch": 7944} {"train_loss": -28.52018165588379, "global_step": 659405, "epoch": 7944} {"train_loss": -28.49028968811035, "global_step": 659406, "epoch": 7944} {"train_loss": -28.395587921142578, "global_step": 659407, "epoch": 7944} {"train_loss": -28.397785186767578, "global_step": 659408, "epoch": 7944} {"train_loss": -28.20582389831543, "global_step": 659409, "epoch": 7944} {"train_loss": -28.295928955078125, "global_step": 659410, "epoch": 7944} {"train_loss": -28.163314819335938, "global_step": 659411, "epoch": 7944} {"train_loss": -28.554990768432617, "global_step": 659412, "epoch": 7944} {"train_loss": -28.321395874023438, "global_step": 659413, "epoch": 7944} {"train_loss": -28.3154239654541, "global_step": 659414, "epoch": 7944} {"train_loss": -28.15313720703125, "global_step": 659415, "epoch": 7944} {"train_loss": -28.2536563873291, "global_step": 659416, "epoch": 7944} {"train_loss": -28.13661766052246, "global_step": 659417, "epoch": 7944} {"train_loss": -28.416885375976562, "global_step": 659418, "epoch": 7944} {"train_loss": -28.22832679748535, "global_step": 659419, "epoch": 7944} {"train_loss": -28.358078002929688, "global_step": 659420, "epoch": 7944} {"train_loss": -28.71112060546875, "global_step": 659421, "epoch": 7944} {"train_loss": -28.16541862487793, "global_step": 659422, "epoch": 7944} {"train_loss": -28.14789390563965, "global_step": 659423, "epoch": 7944} {"train_loss": -28.2694149017334, "global_step": 659424, "epoch": 7944} {"train_loss": -28.324081420898438, "global_step": 659425, "epoch": 7944} {"train_loss": -28.440784454345703, "global_step": 659426, "epoch": 7944} {"train_loss": -28.557270050048828, "global_step": 659427, "epoch": 7944} {"train_loss": -28.115863800048828, "global_step": 659428, "epoch": 7944} {"train_loss": -28.63457679748535, "global_step": 659429, "epoch": 7944} {"train_loss": -28.2879695892334, "global_step": 659430, "epoch": 7944} {"train_loss": -28.48328971862793, "global_step": 659431, "epoch": 7944} {"train_loss": -28.654651641845703, "global_step": 659432, "epoch": 7944} {"train_loss": -28.59052848815918, "global_step": 659433, "epoch": 7944} {"train_loss": -28.240349895982856, "global_step": 659434, "epoch": 7944, "val_loss": 6894173.5} {"train_loss": -27.311227798461914, "global_step": 659435, "epoch": 7945} {"train_loss": -26.503070831298828, "global_step": 659436, "epoch": 7945} {"train_loss": -27.53626823425293, "global_step": 659437, "epoch": 7945} {"train_loss": -27.6090030670166, "global_step": 659438, "epoch": 7945} {"train_loss": -27.674245834350586, "global_step": 659439, "epoch": 7945} {"train_loss": -27.831159591674805, "global_step": 659440, "epoch": 7945} {"train_loss": -27.95599365234375, "global_step": 659441, "epoch": 7945} {"train_loss": -27.78265380859375, "global_step": 659442, "epoch": 7945} {"train_loss": -28.430612564086914, "global_step": 659443, "epoch": 7945} {"train_loss": -28.08627700805664, "global_step": 659444, "epoch": 7945} {"train_loss": -27.87270164489746, "global_step": 659445, "epoch": 7945} {"train_loss": -27.85406494140625, "global_step": 659446, "epoch": 7945} {"train_loss": -27.8880672454834, "global_step": 659447, "epoch": 7945} {"train_loss": -27.942365646362305, "global_step": 659448, "epoch": 7945} {"train_loss": -28.2818660736084, "global_step": 659449, "epoch": 7945} {"train_loss": -27.807214736938477, "global_step": 659450, "epoch": 7945} {"train_loss": -28.193769454956055, "global_step": 659451, "epoch": 7945} {"train_loss": -27.62701988220215, "global_step": 659452, "epoch": 7945} {"train_loss": -28.056196212768555, "global_step": 659453, "epoch": 7945} {"train_loss": -28.169519424438477, "global_step": 659454, "epoch": 7945} {"train_loss": -28.44002342224121, "global_step": 659455, "epoch": 7945} {"train_loss": -28.25074577331543, "global_step": 659456, "epoch": 7945} {"train_loss": -28.415555953979492, "global_step": 659457, "epoch": 7945} {"train_loss": -28.062292098999023, "global_step": 659458, "epoch": 7945} {"train_loss": -28.289525985717773, "global_step": 659459, "epoch": 7945} {"train_loss": -28.62677001953125, "global_step": 659460, "epoch": 7945} {"train_loss": -28.211807250976562, "global_step": 659461, "epoch": 7945} {"train_loss": -28.70221519470215, "global_step": 659462, "epoch": 7945} {"train_loss": -27.7174015045166, "global_step": 659463, "epoch": 7945} {"train_loss": -28.490020751953125, "global_step": 659464, "epoch": 7945} {"train_loss": -27.448644638061523, "global_step": 659465, "epoch": 7945} {"train_loss": -28.390493392944336, "global_step": 659466, "epoch": 7945} {"train_loss": -28.42926025390625, "global_step": 659467, "epoch": 7945} {"train_loss": -28.341815948486328, "global_step": 659468, "epoch": 7945} {"train_loss": -28.36054039001465, "global_step": 659469, "epoch": 7945} {"train_loss": -28.40394401550293, "global_step": 659470, "epoch": 7945} {"train_loss": -28.260730743408203, "global_step": 659471, "epoch": 7945} {"train_loss": -28.520803451538086, "global_step": 659472, "epoch": 7945} {"train_loss": -28.506103515625, "global_step": 659473, "epoch": 7945} {"train_loss": -28.2132625579834, "global_step": 659474, "epoch": 7945} {"train_loss": -28.34183692932129, "global_step": 659475, "epoch": 7945} {"train_loss": -28.22391128540039, "global_step": 659476, "epoch": 7945} {"train_loss": -28.823537826538086, "global_step": 659477, "epoch": 7945} {"train_loss": -28.430862426757812, "global_step": 659478, "epoch": 7945} {"train_loss": -28.56219482421875, "global_step": 659479, "epoch": 7945} {"train_loss": -28.312219619750977, "global_step": 659480, "epoch": 7945} {"train_loss": -28.114002227783203, "global_step": 659481, "epoch": 7945} {"train_loss": -28.462549209594727, "global_step": 659482, "epoch": 7945} {"train_loss": -28.544952392578125, "global_step": 659483, "epoch": 7945} {"train_loss": -28.5753173828125, "global_step": 659484, "epoch": 7945} {"train_loss": -28.452367782592773, "global_step": 659485, "epoch": 7945} {"train_loss": -28.551483154296875, "global_step": 659486, "epoch": 7945} {"train_loss": -28.455368041992188, "global_step": 659487, "epoch": 7945} {"train_loss": -28.0544490814209, "global_step": 659488, "epoch": 7945} {"train_loss": -28.6546630859375, "global_step": 659489, "epoch": 7945} {"train_loss": -28.251636505126953, "global_step": 659490, "epoch": 7945} {"train_loss": -28.54383659362793, "global_step": 659491, "epoch": 7945} {"train_loss": -28.706119537353516, "global_step": 659492, "epoch": 7945} {"train_loss": -28.375879287719727, "global_step": 659493, "epoch": 7945} {"train_loss": -28.2225341796875, "global_step": 659494, "epoch": 7945} {"train_loss": -28.7697811126709, "global_step": 659495, "epoch": 7945} {"train_loss": -28.60625648498535, "global_step": 659496, "epoch": 7945} {"train_loss": -28.393421173095703, "global_step": 659497, "epoch": 7945} {"train_loss": -28.47088623046875, "global_step": 659498, "epoch": 7945} {"train_loss": -28.45887565612793, "global_step": 659499, "epoch": 7945} {"train_loss": -28.754932403564453, "global_step": 659500, "epoch": 7945} {"train_loss": -28.501840591430664, "global_step": 659501, "epoch": 7945} {"train_loss": -28.413705825805664, "global_step": 659502, "epoch": 7945} {"train_loss": -28.44219970703125, "global_step": 659503, "epoch": 7945} {"train_loss": -27.587848663330078, "global_step": 659504, "epoch": 7945} {"train_loss": -27.996387481689453, "global_step": 659505, "epoch": 7945} {"train_loss": -27.870166778564453, "global_step": 659506, "epoch": 7945} {"train_loss": -28.535608291625977, "global_step": 659507, "epoch": 7945} {"train_loss": -28.3911075592041, "global_step": 659508, "epoch": 7945} {"train_loss": -28.270002365112305, "global_step": 659509, "epoch": 7945} {"train_loss": -28.239227294921875, "global_step": 659510, "epoch": 7945} {"train_loss": -28.408050537109375, "global_step": 659511, "epoch": 7945} {"train_loss": -28.442630767822266, "global_step": 659512, "epoch": 7945} {"train_loss": -27.986495971679688, "global_step": 659513, "epoch": 7945} {"train_loss": -27.638044357299805, "global_step": 659514, "epoch": 7945} {"train_loss": -27.39565086364746, "global_step": 659515, "epoch": 7945} {"train_loss": -28.177160263061523, "global_step": 659516, "epoch": 7945} {"train_loss": -28.221673528832124, "global_step": 659517, "epoch": 7945, "val_loss": 6847390.0} {"train_loss": -27.905689239501953, "global_step": 659518, "epoch": 7946} {"train_loss": -27.516393661499023, "global_step": 659519, "epoch": 7946} {"train_loss": -28.063974380493164, "global_step": 659520, "epoch": 7946} {"train_loss": -27.18352699279785, "global_step": 659521, "epoch": 7946} {"train_loss": -27.774402618408203, "global_step": 659522, "epoch": 7946} {"train_loss": -27.983734130859375, "global_step": 659523, "epoch": 7946} {"train_loss": -27.603193283081055, "global_step": 659524, "epoch": 7946} {"train_loss": -27.887033462524414, "global_step": 659525, "epoch": 7946} {"train_loss": -27.69281578063965, "global_step": 659526, "epoch": 7946} {"train_loss": -27.540876388549805, "global_step": 659527, "epoch": 7946} {"train_loss": -28.148029327392578, "global_step": 659528, "epoch": 7946} {"train_loss": -27.787494659423828, "global_step": 659529, "epoch": 7946} {"train_loss": -28.403919219970703, "global_step": 659530, "epoch": 7946} {"train_loss": -28.037445068359375, "global_step": 659531, "epoch": 7946} {"train_loss": -27.927188873291016, "global_step": 659532, "epoch": 7946} {"train_loss": -27.7445011138916, "global_step": 659533, "epoch": 7946} {"train_loss": -28.3518123626709, "global_step": 659534, "epoch": 7946} {"train_loss": -27.888519287109375, "global_step": 659535, "epoch": 7946} {"train_loss": -28.278818130493164, "global_step": 659536, "epoch": 7946} {"train_loss": -28.1765193939209, "global_step": 659537, "epoch": 7946} {"train_loss": -28.349079132080078, "global_step": 659538, "epoch": 7946} {"train_loss": -27.877288818359375, "global_step": 659539, "epoch": 7946} {"train_loss": -28.27595329284668, "global_step": 659540, "epoch": 7946} {"train_loss": -28.326614379882812, "global_step": 659541, "epoch": 7946} {"train_loss": -28.153104782104492, "global_step": 659542, "epoch": 7946} {"train_loss": -28.572925567626953, "global_step": 659543, "epoch": 7946} {"train_loss": -28.313251495361328, "global_step": 659544, "epoch": 7946} {"train_loss": -28.200336456298828, "global_step": 659545, "epoch": 7946} {"train_loss": -28.137866973876953, "global_step": 659546, "epoch": 7946} {"train_loss": -28.277942657470703, "global_step": 659547, "epoch": 7946} {"train_loss": -28.308080673217773, "global_step": 659548, "epoch": 7946} {"train_loss": -28.647842407226562, "global_step": 659549, "epoch": 7946} {"train_loss": -28.183399200439453, "global_step": 659550, "epoch": 7946} {"train_loss": -28.610010147094727, "global_step": 659551, "epoch": 7946} {"train_loss": -28.031646728515625, "global_step": 659552, "epoch": 7946} {"train_loss": -28.552204132080078, "global_step": 659553, "epoch": 7946} {"train_loss": -28.536062240600586, "global_step": 659554, "epoch": 7946} {"train_loss": -28.4584903717041, "global_step": 659555, "epoch": 7946} {"train_loss": -28.288543701171875, "global_step": 659556, "epoch": 7946} {"train_loss": -28.445831298828125, "global_step": 659557, "epoch": 7946} {"train_loss": -28.715085983276367, "global_step": 659558, "epoch": 7946} {"train_loss": -28.523345947265625, "global_step": 659559, "epoch": 7946} {"train_loss": -28.30596923828125, "global_step": 659560, "epoch": 7946} {"train_loss": -28.778202056884766, "global_step": 659561, "epoch": 7946} {"train_loss": -28.469024658203125, "global_step": 659562, "epoch": 7946} {"train_loss": -28.368061065673828, "global_step": 659563, "epoch": 7946} {"train_loss": -28.908788681030273, "global_step": 659564, "epoch": 7946} {"train_loss": -28.04742431640625, "global_step": 659565, "epoch": 7946} {"train_loss": -28.300186157226562, "global_step": 659566, "epoch": 7946} {"train_loss": -28.176416397094727, "global_step": 659567, "epoch": 7946} {"train_loss": -28.5821590423584, "global_step": 659568, "epoch": 7946} {"train_loss": -28.65897560119629, "global_step": 659569, "epoch": 7946} {"train_loss": -28.532052993774414, "global_step": 659570, "epoch": 7946} {"train_loss": -28.4349422454834, "global_step": 659571, "epoch": 7946} {"train_loss": -28.36714744567871, "global_step": 659572, "epoch": 7946} {"train_loss": -28.252233505249023, "global_step": 659573, "epoch": 7946} {"train_loss": -28.553985595703125, "global_step": 659574, "epoch": 7946} {"train_loss": -28.52120018005371, "global_step": 659575, "epoch": 7946} {"train_loss": -28.809850692749023, "global_step": 659576, "epoch": 7946} {"train_loss": -28.585546493530273, "global_step": 659577, "epoch": 7946} {"train_loss": -28.337539672851562, "global_step": 659578, "epoch": 7946} {"train_loss": -28.572473526000977, "global_step": 659579, "epoch": 7946} {"train_loss": -28.545623779296875, "global_step": 659580, "epoch": 7946} {"train_loss": -28.538389205932617, "global_step": 659581, "epoch": 7946} {"train_loss": -28.337875366210938, "global_step": 659582, "epoch": 7946} {"train_loss": -28.34226417541504, "global_step": 659583, "epoch": 7946} {"train_loss": -28.7379093170166, "global_step": 659584, "epoch": 7946} {"train_loss": -28.068695068359375, "global_step": 659585, "epoch": 7946} {"train_loss": -28.771894454956055, "global_step": 659586, "epoch": 7946} {"train_loss": -28.014822006225586, "global_step": 659587, "epoch": 7946} {"train_loss": -28.134016036987305, "global_step": 659588, "epoch": 7946} {"train_loss": -28.36286735534668, "global_step": 659589, "epoch": 7946} {"train_loss": -28.143701553344727, "global_step": 659590, "epoch": 7946} {"train_loss": -28.778228759765625, "global_step": 659591, "epoch": 7946} {"train_loss": -28.384443283081055, "global_step": 659592, "epoch": 7946} {"train_loss": -28.954267501831055, "global_step": 659593, "epoch": 7946} {"train_loss": -28.200122833251953, "global_step": 659594, "epoch": 7946} {"train_loss": -28.169696807861328, "global_step": 659595, "epoch": 7946} {"train_loss": -27.6685791015625, "global_step": 659596, "epoch": 7946} {"train_loss": -26.9239501953125, "global_step": 659597, "epoch": 7946} {"train_loss": -27.630239486694336, "global_step": 659598, "epoch": 7946} {"train_loss": -28.48491859436035, "global_step": 659599, "epoch": 7946} {"train_loss": -28.238408582756318, "global_step": 659600, "epoch": 7946, "val_loss": 6815305.0} {"train_loss": -26.955190658569336, "global_step": 659601, "epoch": 7947} {"train_loss": -27.878156661987305, "global_step": 659602, "epoch": 7947} {"train_loss": -27.48333168029785, "global_step": 659603, "epoch": 7947} {"train_loss": -27.42254066467285, "global_step": 659604, "epoch": 7947} {"train_loss": -27.231830596923828, "global_step": 659605, "epoch": 7947} {"train_loss": -27.11907958984375, "global_step": 659606, "epoch": 7947} {"train_loss": -27.15378189086914, "global_step": 659607, "epoch": 7947} {"train_loss": -27.61686134338379, "global_step": 659608, "epoch": 7947} {"train_loss": -27.7407169342041, "global_step": 659609, "epoch": 7947} {"train_loss": -27.722375869750977, "global_step": 659610, "epoch": 7947} {"train_loss": -27.47669792175293, "global_step": 659611, "epoch": 7947} {"train_loss": -27.558429718017578, "global_step": 659612, "epoch": 7947} {"train_loss": -27.63007164001465, "global_step": 659613, "epoch": 7947} {"train_loss": -27.48419189453125, "global_step": 659614, "epoch": 7947} {"train_loss": -27.844324111938477, "global_step": 659615, "epoch": 7947} {"train_loss": -28.29302978515625, "global_step": 659616, "epoch": 7947} {"train_loss": -27.591073989868164, "global_step": 659617, "epoch": 7947} {"train_loss": -28.222219467163086, "global_step": 659618, "epoch": 7947} {"train_loss": -27.83135986328125, "global_step": 659619, "epoch": 7947} {"train_loss": -28.033676147460938, "global_step": 659620, "epoch": 7947} {"train_loss": -27.925214767456055, "global_step": 659621, "epoch": 7947} {"train_loss": -28.008737564086914, "global_step": 659622, "epoch": 7947} {"train_loss": -27.743305206298828, "global_step": 659623, "epoch": 7947} {"train_loss": -28.14093589782715, "global_step": 659624, "epoch": 7947} {"train_loss": -27.935354232788086, "global_step": 659625, "epoch": 7947} {"train_loss": -28.303863525390625, "global_step": 659626, "epoch": 7947} {"train_loss": -28.011260986328125, "global_step": 659627, "epoch": 7947} {"train_loss": -28.3411922454834, "global_step": 659628, "epoch": 7947} {"train_loss": -28.285425186157227, "global_step": 659629, "epoch": 7947} {"train_loss": -28.524152755737305, "global_step": 659630, "epoch": 7947} {"train_loss": -28.331445693969727, "global_step": 659631, "epoch": 7947} {"train_loss": -27.925525665283203, "global_step": 659632, "epoch": 7947} {"train_loss": -28.10323143005371, "global_step": 659633, "epoch": 7947} {"train_loss": -28.507089614868164, "global_step": 659634, "epoch": 7947} {"train_loss": -27.77009391784668, "global_step": 659635, "epoch": 7947} {"train_loss": -28.037769317626953, "global_step": 659636, "epoch": 7947} {"train_loss": -28.117782592773438, "global_step": 659637, "epoch": 7947} {"train_loss": -28.157978057861328, "global_step": 659638, "epoch": 7947} {"train_loss": -28.252714157104492, "global_step": 659639, "epoch": 7947} {"train_loss": -28.215097427368164, "global_step": 659640, "epoch": 7947} {"train_loss": -28.3973445892334, "global_step": 659641, "epoch": 7947} {"train_loss": -28.20697021484375, "global_step": 659642, "epoch": 7947} {"train_loss": -28.403573989868164, "global_step": 659643, "epoch": 7947} {"train_loss": -28.456029891967773, "global_step": 659644, "epoch": 7947} {"train_loss": -28.2508487701416, "global_step": 659645, "epoch": 7947} {"train_loss": -28.62527847290039, "global_step": 659646, "epoch": 7947} {"train_loss": -28.34657096862793, "global_step": 659647, "epoch": 7947} {"train_loss": -28.42237663269043, "global_step": 659648, "epoch": 7947} {"train_loss": -28.65712547302246, "global_step": 659649, "epoch": 7947} {"train_loss": -28.435169219970703, "global_step": 659650, "epoch": 7947} {"train_loss": -28.408924102783203, "global_step": 659651, "epoch": 7947} {"train_loss": -28.05006980895996, "global_step": 659652, "epoch": 7947} {"train_loss": -28.458234786987305, "global_step": 659653, "epoch": 7947} {"train_loss": -28.459186553955078, "global_step": 659654, "epoch": 7947} {"train_loss": -27.97601890563965, "global_step": 659655, "epoch": 7947} {"train_loss": -27.864917755126953, "global_step": 659656, "epoch": 7947} {"train_loss": -28.41851806640625, "global_step": 659657, "epoch": 7947} {"train_loss": -28.391773223876953, "global_step": 659658, "epoch": 7947} {"train_loss": -27.9222354888916, "global_step": 659659, "epoch": 7947} {"train_loss": -28.1762638092041, "global_step": 659660, "epoch": 7947} {"train_loss": -27.9155330657959, "global_step": 659661, "epoch": 7947} {"train_loss": -28.34504508972168, "global_step": 659662, "epoch": 7947} {"train_loss": -27.16806411743164, "global_step": 659663, "epoch": 7947} {"train_loss": -27.380512237548828, "global_step": 659664, "epoch": 7947} {"train_loss": -27.9521541595459, "global_step": 659665, "epoch": 7947} {"train_loss": -28.22479820251465, "global_step": 659666, "epoch": 7947} {"train_loss": -28.144071578979492, "global_step": 659667, "epoch": 7947} {"train_loss": -28.15828514099121, "global_step": 659668, "epoch": 7947} {"train_loss": -27.77947425842285, "global_step": 659669, "epoch": 7947} {"train_loss": -28.278223037719727, "global_step": 659670, "epoch": 7947} {"train_loss": -28.229724884033203, "global_step": 659671, "epoch": 7947} {"train_loss": -28.413471221923828, "global_step": 659672, "epoch": 7947} {"train_loss": -28.3994197845459, "global_step": 659673, "epoch": 7947} {"train_loss": -28.0626163482666, "global_step": 659674, "epoch": 7947} {"train_loss": -27.79825782775879, "global_step": 659675, "epoch": 7947} {"train_loss": -28.36346435546875, "global_step": 659676, "epoch": 7947} {"train_loss": -28.29255485534668, "global_step": 659677, "epoch": 7947} {"train_loss": -28.739294052124023, "global_step": 659678, "epoch": 7947} {"train_loss": -28.13348960876465, "global_step": 659679, "epoch": 7947} {"train_loss": -28.08039665222168, "global_step": 659680, "epoch": 7947} {"train_loss": -28.6793270111084, "global_step": 659681, "epoch": 7947} {"train_loss": -28.60992431640625, "global_step": 659682, "epoch": 7947} {"train_loss": -28.065832023161004, "global_step": 659683, "epoch": 7947, "val_loss": 6942054.0} {"train_loss": -28.122955322265625, "global_step": 659684, "epoch": 7948} {"train_loss": -28.010705947875977, "global_step": 659685, "epoch": 7948} {"train_loss": -27.936193466186523, "global_step": 659686, "epoch": 7948} {"train_loss": -28.15974235534668, "global_step": 659687, "epoch": 7948} {"train_loss": -28.13340187072754, "global_step": 659688, "epoch": 7948} {"train_loss": -28.134601593017578, "global_step": 659689, "epoch": 7948} {"train_loss": -28.362808227539062, "global_step": 659690, "epoch": 7948} {"train_loss": -28.304662704467773, "global_step": 659691, "epoch": 7948} {"train_loss": -28.335947036743164, "global_step": 659692, "epoch": 7948} {"train_loss": -28.320648193359375, "global_step": 659693, "epoch": 7948} {"train_loss": -28.68140983581543, "global_step": 659694, "epoch": 7948} {"train_loss": -28.141584396362305, "global_step": 659695, "epoch": 7948} {"train_loss": -28.355016708374023, "global_step": 659696, "epoch": 7948} {"train_loss": -28.441675186157227, "global_step": 659697, "epoch": 7948} {"train_loss": -28.242963790893555, "global_step": 659698, "epoch": 7948} {"train_loss": -28.602874755859375, "global_step": 659699, "epoch": 7948} {"train_loss": -28.33185386657715, "global_step": 659700, "epoch": 7948} {"train_loss": -28.49610710144043, "global_step": 659701, "epoch": 7948} {"train_loss": -27.897403717041016, "global_step": 659702, "epoch": 7948} {"train_loss": -28.215864181518555, "global_step": 659703, "epoch": 7948} {"train_loss": -28.8388614654541, "global_step": 659704, "epoch": 7948} {"train_loss": -28.41303062438965, "global_step": 659705, "epoch": 7948} {"train_loss": -28.37746238708496, "global_step": 659706, "epoch": 7948} {"train_loss": -28.075580596923828, "global_step": 659707, "epoch": 7948} {"train_loss": -28.2982177734375, "global_step": 659708, "epoch": 7948} {"train_loss": -28.341733932495117, "global_step": 659709, "epoch": 7948} {"train_loss": -28.426477432250977, "global_step": 659710, "epoch": 7948} {"train_loss": -28.026702880859375, "global_step": 659711, "epoch": 7948} {"train_loss": -28.22464370727539, "global_step": 659712, "epoch": 7948} {"train_loss": -28.725788116455078, "global_step": 659713, "epoch": 7948} {"train_loss": -28.20954704284668, "global_step": 659714, "epoch": 7948} {"train_loss": -28.37236976623535, "global_step": 659715, "epoch": 7948} {"train_loss": -28.235624313354492, "global_step": 659716, "epoch": 7948} {"train_loss": -28.461135864257812, "global_step": 659717, "epoch": 7948} {"train_loss": -28.151203155517578, "global_step": 659718, "epoch": 7948} {"train_loss": -28.3693904876709, "global_step": 659719, "epoch": 7948} {"train_loss": -28.41879653930664, "global_step": 659720, "epoch": 7948} {"train_loss": -28.398365020751953, "global_step": 659721, "epoch": 7948} {"train_loss": -28.59785270690918, "global_step": 659722, "epoch": 7948} {"train_loss": -28.516223907470703, "global_step": 659723, "epoch": 7948} {"train_loss": -28.471384048461914, "global_step": 659724, "epoch": 7948} {"train_loss": -28.247522354125977, "global_step": 659725, "epoch": 7948} {"train_loss": -28.510839462280273, "global_step": 659726, "epoch": 7948} {"train_loss": -28.508075714111328, "global_step": 659727, "epoch": 7948} {"train_loss": -28.739587783813477, "global_step": 659728, "epoch": 7948} {"train_loss": -28.52396583557129, "global_step": 659729, "epoch": 7948} {"train_loss": -28.215551376342773, "global_step": 659730, "epoch": 7948} {"train_loss": -28.38779640197754, "global_step": 659731, "epoch": 7948} {"train_loss": -28.674161911010742, "global_step": 659732, "epoch": 7948} {"train_loss": -28.359174728393555, "global_step": 659733, "epoch": 7948} {"train_loss": -28.3524112701416, "global_step": 659734, "epoch": 7948} {"train_loss": -28.222753524780273, "global_step": 659735, "epoch": 7948} {"train_loss": -28.536970138549805, "global_step": 659736, "epoch": 7948} {"train_loss": -28.643482208251953, "global_step": 659737, "epoch": 7948} {"train_loss": -28.307052612304688, "global_step": 659738, "epoch": 7948} {"train_loss": -28.37849235534668, "global_step": 659739, "epoch": 7948} {"train_loss": -28.25802993774414, "global_step": 659740, "epoch": 7948} {"train_loss": -28.212604522705078, "global_step": 659741, "epoch": 7948} {"train_loss": -28.131513595581055, "global_step": 659742, "epoch": 7948} {"train_loss": -28.415252685546875, "global_step": 659743, "epoch": 7948} {"train_loss": -28.38880729675293, "global_step": 659744, "epoch": 7948} {"train_loss": -28.418607711791992, "global_step": 659745, "epoch": 7948} {"train_loss": -28.3409366607666, "global_step": 659746, "epoch": 7948} {"train_loss": -28.457294464111328, "global_step": 659747, "epoch": 7948} {"train_loss": -28.58440589904785, "global_step": 659748, "epoch": 7948} {"train_loss": -28.2845458984375, "global_step": 659749, "epoch": 7948} {"train_loss": -28.539148330688477, "global_step": 659750, "epoch": 7948} {"train_loss": -28.464679718017578, "global_step": 659751, "epoch": 7948} {"train_loss": -28.489004135131836, "global_step": 659752, "epoch": 7948} {"train_loss": -28.71917152404785, "global_step": 659753, "epoch": 7948} {"train_loss": -28.279211044311523, "global_step": 659754, "epoch": 7948} {"train_loss": -28.382953643798828, "global_step": 659755, "epoch": 7948} {"train_loss": -28.660192489624023, "global_step": 659756, "epoch": 7948} {"train_loss": -28.459003448486328, "global_step": 659757, "epoch": 7948} {"train_loss": -28.564783096313477, "global_step": 659758, "epoch": 7948} {"train_loss": -28.525556564331055, "global_step": 659759, "epoch": 7948} {"train_loss": -28.6558780670166, "global_step": 659760, "epoch": 7948} {"train_loss": -28.396060943603516, "global_step": 659761, "epoch": 7948} {"train_loss": -28.506956100463867, "global_step": 659762, "epoch": 7948} {"train_loss": -28.5146427154541, "global_step": 659763, "epoch": 7948} {"train_loss": -28.431745529174805, "global_step": 659764, "epoch": 7948} {"train_loss": -28.393436431884766, "global_step": 659765, "epoch": 7948} {"train_loss": -28.357081011117224, "global_step": 659766, "epoch": 7948, "val_loss": 6927850.0} {"train_loss": -28.097476959228516, "global_step": 659767, "epoch": 7949} {"train_loss": -27.87579345703125, "global_step": 659768, "epoch": 7949} {"train_loss": -26.850143432617188, "global_step": 659769, "epoch": 7949} {"train_loss": -27.29804801940918, "global_step": 659770, "epoch": 7949} {"train_loss": -27.803930282592773, "global_step": 659771, "epoch": 7949} {"train_loss": -27.45233726501465, "global_step": 659772, "epoch": 7949} {"train_loss": -27.198522567749023, "global_step": 659773, "epoch": 7949} {"train_loss": -27.367528915405273, "global_step": 659774, "epoch": 7949} {"train_loss": -27.40936279296875, "global_step": 659775, "epoch": 7949} {"train_loss": -27.094196319580078, "global_step": 659776, "epoch": 7949} {"train_loss": -28.027191162109375, "global_step": 659777, "epoch": 7949} {"train_loss": -27.610361099243164, "global_step": 659778, "epoch": 7949} {"train_loss": -27.539508819580078, "global_step": 659779, "epoch": 7949} {"train_loss": -27.996007919311523, "global_step": 659780, "epoch": 7949} {"train_loss": -27.52760124206543, "global_step": 659781, "epoch": 7949} {"train_loss": -28.04241371154785, "global_step": 659782, "epoch": 7949} {"train_loss": -27.379125595092773, "global_step": 659783, "epoch": 7949} {"train_loss": -28.042190551757812, "global_step": 659784, "epoch": 7949} {"train_loss": -28.04041862487793, "global_step": 659785, "epoch": 7949} {"train_loss": -27.94780921936035, "global_step": 659786, "epoch": 7949} {"train_loss": -27.419300079345703, "global_step": 659787, "epoch": 7949} {"train_loss": -28.114843368530273, "global_step": 659788, "epoch": 7949} {"train_loss": -27.924072265625, "global_step": 659789, "epoch": 7949} {"train_loss": -28.18450927734375, "global_step": 659790, "epoch": 7949} {"train_loss": -28.1823673248291, "global_step": 659791, "epoch": 7949} {"train_loss": -28.029682159423828, "global_step": 659792, "epoch": 7949} {"train_loss": -27.997455596923828, "global_step": 659793, "epoch": 7949} {"train_loss": -28.081729888916016, "global_step": 659794, "epoch": 7949} {"train_loss": -27.86459732055664, "global_step": 659795, "epoch": 7949} {"train_loss": -28.40761375427246, "global_step": 659796, "epoch": 7949} {"train_loss": -28.282835006713867, "global_step": 659797, "epoch": 7949} {"train_loss": -28.177438735961914, "global_step": 659798, "epoch": 7949} {"train_loss": -28.246692657470703, "global_step": 659799, "epoch": 7949} {"train_loss": -28.142309188842773, "global_step": 659800, "epoch": 7949} {"train_loss": -27.965972900390625, "global_step": 659801, "epoch": 7949} {"train_loss": -28.053543090820312, "global_step": 659802, "epoch": 7949} {"train_loss": -28.1801700592041, "global_step": 659803, "epoch": 7949} {"train_loss": -28.2769832611084, "global_step": 659804, "epoch": 7949} {"train_loss": -27.89995765686035, "global_step": 659805, "epoch": 7949} {"train_loss": -28.591999053955078, "global_step": 659806, "epoch": 7949} {"train_loss": -28.38275718688965, "global_step": 659807, "epoch": 7949} {"train_loss": -28.043493270874023, "global_step": 659808, "epoch": 7949} {"train_loss": -28.458770751953125, "global_step": 659809, "epoch": 7949} {"train_loss": -28.369916915893555, "global_step": 659810, "epoch": 7949} {"train_loss": -28.344152450561523, "global_step": 659811, "epoch": 7949} {"train_loss": -28.2074031829834, "global_step": 659812, "epoch": 7949} {"train_loss": -28.53468132019043, "global_step": 659813, "epoch": 7949} {"train_loss": -28.474889755249023, "global_step": 659814, "epoch": 7949} {"train_loss": -28.39185905456543, "global_step": 659815, "epoch": 7949} {"train_loss": -28.773040771484375, "global_step": 659816, "epoch": 7949} {"train_loss": -28.0804386138916, "global_step": 659817, "epoch": 7949} {"train_loss": -28.458219528198242, "global_step": 659818, "epoch": 7949} {"train_loss": -28.207794189453125, "global_step": 659819, "epoch": 7949} {"train_loss": -28.669219970703125, "global_step": 659820, "epoch": 7949} {"train_loss": -28.1790828704834, "global_step": 659821, "epoch": 7949} {"train_loss": -28.18484878540039, "global_step": 659822, "epoch": 7949} {"train_loss": -28.38167381286621, "global_step": 659823, "epoch": 7949} {"train_loss": -28.278268814086914, "global_step": 659824, "epoch": 7949} {"train_loss": -28.331714630126953, "global_step": 659825, "epoch": 7949} {"train_loss": -28.32110023498535, "global_step": 659826, "epoch": 7949} {"train_loss": -28.745386123657227, "global_step": 659827, "epoch": 7949} {"train_loss": -28.243261337280273, "global_step": 659828, "epoch": 7949} {"train_loss": -28.521764755249023, "global_step": 659829, "epoch": 7949} {"train_loss": -28.527881622314453, "global_step": 659830, "epoch": 7949} {"train_loss": -27.901355743408203, "global_step": 659831, "epoch": 7949} {"train_loss": -27.906787872314453, "global_step": 659832, "epoch": 7949} {"train_loss": -28.547651290893555, "global_step": 659833, "epoch": 7949} {"train_loss": -28.48103141784668, "global_step": 659834, "epoch": 7949} {"train_loss": -28.193723678588867, "global_step": 659835, "epoch": 7949} {"train_loss": -27.468189239501953, "global_step": 659836, "epoch": 7949} {"train_loss": -26.863269805908203, "global_step": 659837, "epoch": 7949} {"train_loss": -26.051685333251953, "global_step": 659838, "epoch": 7949} {"train_loss": -26.047595977783203, "global_step": 659839, "epoch": 7949} {"train_loss": -27.660785675048828, "global_step": 659840, "epoch": 7949} {"train_loss": -27.478300094604492, "global_step": 659841, "epoch": 7949} {"train_loss": -27.554609298706055, "global_step": 659842, "epoch": 7949} {"train_loss": -27.1993465423584, "global_step": 659843, "epoch": 7949} {"train_loss": -27.604633331298828, "global_step": 659844, "epoch": 7949} {"train_loss": -27.179590225219727, "global_step": 659845, "epoch": 7949} {"train_loss": -27.48390007019043, "global_step": 659846, "epoch": 7949} {"train_loss": -27.296239852905273, "global_step": 659847, "epoch": 7949} {"train_loss": -28.10199546813965, "global_step": 659848, "epoch": 7949} {"train_loss": -27.94941440260554, "global_step": 659849, "epoch": 7949, "val_loss": 6918192.0} {"train_loss": -26.37174415588379, "global_step": 659850, "epoch": 7950} {"train_loss": -26.7896785736084, "global_step": 659851, "epoch": 7950} {"train_loss": -26.913862228393555, "global_step": 659852, "epoch": 7950} {"train_loss": -26.657470703125, "global_step": 659853, "epoch": 7950} {"train_loss": -27.418027877807617, "global_step": 659854, "epoch": 7950} {"train_loss": -26.920120239257812, "global_step": 659855, "epoch": 7950} {"train_loss": -27.41704750061035, "global_step": 659856, "epoch": 7950} {"train_loss": -27.196699142456055, "global_step": 659857, "epoch": 7950} {"train_loss": -27.010807037353516, "global_step": 659858, "epoch": 7950} {"train_loss": -27.595203399658203, "global_step": 659859, "epoch": 7950} {"train_loss": -27.513858795166016, "global_step": 659860, "epoch": 7950} {"train_loss": -27.437957763671875, "global_step": 659861, "epoch": 7950} {"train_loss": -27.65102195739746, "global_step": 659862, "epoch": 7950} {"train_loss": -27.577863693237305, "global_step": 659863, "epoch": 7950} {"train_loss": -27.783376693725586, "global_step": 659864, "epoch": 7950} {"train_loss": -28.052595138549805, "global_step": 659865, "epoch": 7950} {"train_loss": -27.58281898498535, "global_step": 659866, "epoch": 7950} {"train_loss": -27.743579864501953, "global_step": 659867, "epoch": 7950} {"train_loss": -27.907033920288086, "global_step": 659868, "epoch": 7950} {"train_loss": -27.622028350830078, "global_step": 659869, "epoch": 7950} {"train_loss": -27.332197189331055, "global_step": 659870, "epoch": 7950} {"train_loss": -27.73067283630371, "global_step": 659871, "epoch": 7950} {"train_loss": -27.524749755859375, "global_step": 659872, "epoch": 7950} {"train_loss": -28.241931915283203, "global_step": 659873, "epoch": 7950} {"train_loss": -27.98089027404785, "global_step": 659874, "epoch": 7950} {"train_loss": -28.374942779541016, "global_step": 659875, "epoch": 7950} {"train_loss": -28.146108627319336, "global_step": 659876, "epoch": 7950} {"train_loss": -27.71467399597168, "global_step": 659877, "epoch": 7950} {"train_loss": -27.97877311706543, "global_step": 659878, "epoch": 7950} {"train_loss": -28.186044692993164, "global_step": 659879, "epoch": 7950} {"train_loss": -28.297622680664062, "global_step": 659880, "epoch": 7950} {"train_loss": -28.1185359954834, "global_step": 659881, "epoch": 7950} {"train_loss": -28.36846923828125, "global_step": 659882, "epoch": 7950} {"train_loss": -28.199533462524414, "global_step": 659883, "epoch": 7950} {"train_loss": -28.54547119140625, "global_step": 659884, "epoch": 7950} {"train_loss": -28.2995662689209, "global_step": 659885, "epoch": 7950} {"train_loss": -28.254425048828125, "global_step": 659886, "epoch": 7950} {"train_loss": -28.138891220092773, "global_step": 659887, "epoch": 7950} {"train_loss": -28.359756469726562, "global_step": 659888, "epoch": 7950} {"train_loss": -28.150129318237305, "global_step": 659889, "epoch": 7950} {"train_loss": -28.41962242126465, "global_step": 659890, "epoch": 7950} {"train_loss": -28.110910415649414, "global_step": 659891, "epoch": 7950} {"train_loss": -28.574567794799805, "global_step": 659892, "epoch": 7950} {"train_loss": -28.23182487487793, "global_step": 659893, "epoch": 7950} {"train_loss": -28.40570640563965, "global_step": 659894, "epoch": 7950} {"train_loss": -28.609363555908203, "global_step": 659895, "epoch": 7950} {"train_loss": -28.35474967956543, "global_step": 659896, "epoch": 7950} {"train_loss": -28.58736228942871, "global_step": 659897, "epoch": 7950} {"train_loss": -28.248966217041016, "global_step": 659898, "epoch": 7950} {"train_loss": -28.53264808654785, "global_step": 659899, "epoch": 7950} {"train_loss": -28.236865997314453, "global_step": 659900, "epoch": 7950} {"train_loss": -28.7607479095459, "global_step": 659901, "epoch": 7950} {"train_loss": -28.388620376586914, "global_step": 659902, "epoch": 7950} {"train_loss": -28.59836196899414, "global_step": 659903, "epoch": 7950} {"train_loss": -28.46162223815918, "global_step": 659904, "epoch": 7950} {"train_loss": -28.397876739501953, "global_step": 659905, "epoch": 7950} {"train_loss": -28.296735763549805, "global_step": 659906, "epoch": 7950} {"train_loss": -28.401355743408203, "global_step": 659907, "epoch": 7950} {"train_loss": -28.32285499572754, "global_step": 659908, "epoch": 7950} {"train_loss": -28.56941032409668, "global_step": 659909, "epoch": 7950} {"train_loss": -28.60821533203125, "global_step": 659910, "epoch": 7950} {"train_loss": -28.478652954101562, "global_step": 659911, "epoch": 7950} {"train_loss": -28.579023361206055, "global_step": 659912, "epoch": 7950} {"train_loss": -28.543643951416016, "global_step": 659913, "epoch": 7950} {"train_loss": -28.82594108581543, "global_step": 659914, "epoch": 7950} {"train_loss": -28.49519157409668, "global_step": 659915, "epoch": 7950} {"train_loss": -27.875635147094727, "global_step": 659916, "epoch": 7950} {"train_loss": -28.26377296447754, "global_step": 659917, "epoch": 7950} {"train_loss": -28.011981964111328, "global_step": 659918, "epoch": 7950} {"train_loss": -28.06232261657715, "global_step": 659919, "epoch": 7950} {"train_loss": -27.905439376831055, "global_step": 659920, "epoch": 7950} {"train_loss": -28.073049545288086, "global_step": 659921, "epoch": 7950} {"train_loss": -28.620107650756836, "global_step": 659922, "epoch": 7950} {"train_loss": -28.313323974609375, "global_step": 659923, "epoch": 7950} {"train_loss": -28.08320426940918, "global_step": 659924, "epoch": 7950} {"train_loss": -28.135251998901367, "global_step": 659925, "epoch": 7950} {"train_loss": -28.437170028686523, "global_step": 659926, "epoch": 7950} {"train_loss": -28.55543327331543, "global_step": 659927, "epoch": 7950} {"train_loss": -28.294443130493164, "global_step": 659928, "epoch": 7950} {"train_loss": -28.70947265625, "global_step": 659929, "epoch": 7950} {"train_loss": -28.5405216217041, "global_step": 659930, "epoch": 7950} {"train_loss": -28.207616806030273, "global_step": 659931, "epoch": 7950} {"train_loss": -28.06834188714085, "global_step": 659932, "epoch": 7950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 1.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 1.0, "test/sim_max_reward_4500017": 1.0, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.0, "test/sim_max_reward_4500020": 1.0, "test/sim_max_reward_4500021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 6912414.0} {"train_loss": -26.467458724975586, "global_step": 659933, "epoch": 7951} {"train_loss": -24.290756225585938, "global_step": 659934, "epoch": 7951} {"train_loss": -26.011322021484375, "global_step": 659935, "epoch": 7951} {"train_loss": -27.119586944580078, "global_step": 659936, "epoch": 7951} {"train_loss": -26.591278076171875, "global_step": 659937, "epoch": 7951} {"train_loss": -27.53240394592285, "global_step": 659938, "epoch": 7951} {"train_loss": -27.06257438659668, "global_step": 659939, "epoch": 7951} {"train_loss": -27.4437313079834, "global_step": 659940, "epoch": 7951} {"train_loss": -27.278400421142578, "global_step": 659941, "epoch": 7951} {"train_loss": -27.976327896118164, "global_step": 659942, "epoch": 7951} {"train_loss": -27.494159698486328, "global_step": 659943, "epoch": 7951} {"train_loss": -27.716632843017578, "global_step": 659944, "epoch": 7951} {"train_loss": -27.275068283081055, "global_step": 659945, "epoch": 7951} {"train_loss": -27.36359977722168, "global_step": 659946, "epoch": 7951} {"train_loss": -27.993637084960938, "global_step": 659947, "epoch": 7951} {"train_loss": -27.745752334594727, "global_step": 659948, "epoch": 7951} {"train_loss": -27.763731002807617, "global_step": 659949, "epoch": 7951} {"train_loss": -27.6527042388916, "global_step": 659950, "epoch": 7951} {"train_loss": -27.579259872436523, "global_step": 659951, "epoch": 7951} {"train_loss": -27.932477951049805, "global_step": 659952, "epoch": 7951} {"train_loss": -27.58180046081543, "global_step": 659953, "epoch": 7951} {"train_loss": -28.1285343170166, "global_step": 659954, "epoch": 7951} {"train_loss": -27.826358795166016, "global_step": 659955, "epoch": 7951} {"train_loss": -27.821264266967773, "global_step": 659956, "epoch": 7951} {"train_loss": -27.87653923034668, "global_step": 659957, "epoch": 7951} {"train_loss": -28.08282470703125, "global_step": 659958, "epoch": 7951} {"train_loss": -28.14341163635254, "global_step": 659959, "epoch": 7951} {"train_loss": -28.267377853393555, "global_step": 659960, "epoch": 7951} {"train_loss": -28.192487716674805, "global_step": 659961, "epoch": 7951} {"train_loss": -28.0253849029541, "global_step": 659962, "epoch": 7951} {"train_loss": -27.982004165649414, "global_step": 659963, "epoch": 7951} {"train_loss": -28.01108741760254, "global_step": 659964, "epoch": 7951} {"train_loss": -27.967254638671875, "global_step": 659965, "epoch": 7951} {"train_loss": -28.23736572265625, "global_step": 659966, "epoch": 7951} {"train_loss": -28.36083984375, "global_step": 659967, "epoch": 7951} {"train_loss": -28.135101318359375, "global_step": 659968, "epoch": 7951} {"train_loss": -28.4512939453125, "global_step": 659969, "epoch": 7951} {"train_loss": -28.211645126342773, "global_step": 659970, "epoch": 7951} {"train_loss": -28.184797286987305, "global_step": 659971, "epoch": 7951} {"train_loss": -28.2665958404541, "global_step": 659972, "epoch": 7951} {"train_loss": -28.05893325805664, "global_step": 659973, "epoch": 7951} {"train_loss": -28.25204849243164, "global_step": 659974, "epoch": 7951} {"train_loss": -28.55501365661621, "global_step": 659975, "epoch": 7951} {"train_loss": -28.498823165893555, "global_step": 659976, "epoch": 7951} {"train_loss": -28.535730361938477, "global_step": 659977, "epoch": 7951} {"train_loss": -28.385272979736328, "global_step": 659978, "epoch": 7951} {"train_loss": -28.57486343383789, "global_step": 659979, "epoch": 7951} {"train_loss": -28.34906005859375, "global_step": 659980, "epoch": 7951} {"train_loss": -28.84510612487793, "global_step": 659981, "epoch": 7951} {"train_loss": -28.395511627197266, "global_step": 659982, "epoch": 7951} {"train_loss": -28.228286743164062, "global_step": 659983, "epoch": 7951} {"train_loss": -27.25918960571289, "global_step": 659984, "epoch": 7951} {"train_loss": -25.814208984375, "global_step": 659985, "epoch": 7951} {"train_loss": -24.966323852539062, "global_step": 659986, "epoch": 7951} {"train_loss": -28.2992000579834, "global_step": 659987, "epoch": 7951} {"train_loss": -23.367340087890625, "global_step": 659988, "epoch": 7951} {"train_loss": -26.572927474975586, "global_step": 659989, "epoch": 7951} {"train_loss": -25.22597312927246, "global_step": 659990, "epoch": 7951} {"train_loss": -27.011579513549805, "global_step": 659991, "epoch": 7951} {"train_loss": -26.35308265686035, "global_step": 659992, "epoch": 7951} {"train_loss": -27.352624893188477, "global_step": 659993, "epoch": 7951} {"train_loss": -27.42917251586914, "global_step": 659994, "epoch": 7951} {"train_loss": -26.850372314453125, "global_step": 659995, "epoch": 7951} {"train_loss": -27.42388916015625, "global_step": 659996, "epoch": 7951} {"train_loss": -28.06241798400879, "global_step": 659997, "epoch": 7951} {"train_loss": -27.61933708190918, "global_step": 659998, "epoch": 7951} {"train_loss": -26.814420700073242, "global_step": 659999, "epoch": 7951} {"train_loss": -27.595539093017578, "global_step": 660000, "epoch": 7951} {"train_loss": -27.732542037963867, "global_step": 660001, "epoch": 7951} {"train_loss": -27.742156982421875, "global_step": 660002, "epoch": 7951} {"train_loss": -27.65743064880371, "global_step": 660003, "epoch": 7951} {"train_loss": -27.401046752929688, "global_step": 660004, "epoch": 7951} {"train_loss": -27.622404098510742, "global_step": 660005, "epoch": 7951} {"train_loss": -27.818679809570312, "global_step": 660006, "epoch": 7951} {"train_loss": -28.126829147338867, "global_step": 660007, "epoch": 7951} {"train_loss": -27.672409057617188, "global_step": 660008, "epoch": 7951} {"train_loss": -27.83271598815918, "global_step": 660009, "epoch": 7951} {"train_loss": -27.98650550842285, "global_step": 660010, "epoch": 7951} {"train_loss": -27.57248306274414, "global_step": 660011, "epoch": 7951} {"train_loss": -28.111425399780273, "global_step": 660012, "epoch": 7951} {"train_loss": -28.24945068359375, "global_step": 660013, "epoch": 7951} {"train_loss": -28.262826919555664, "global_step": 660014, "epoch": 7951} {"train_loss": -27.57176691078278, "global_step": 660015, "epoch": 7951, "val_loss": 6908511.0} {"train_loss": -27.55854606628418, "global_step": 660016, "epoch": 7952} {"train_loss": -27.31110191345215, "global_step": 660017, "epoch": 7952} {"train_loss": -27.911718368530273, "global_step": 660018, "epoch": 7952} {"train_loss": -27.37904167175293, "global_step": 660019, "epoch": 7952} {"train_loss": -27.672000885009766, "global_step": 660020, "epoch": 7952} {"train_loss": -27.54865837097168, "global_step": 660021, "epoch": 7952} {"train_loss": -27.49004554748535, "global_step": 660022, "epoch": 7952} {"train_loss": -27.985595703125, "global_step": 660023, "epoch": 7952} {"train_loss": -27.625234603881836, "global_step": 660024, "epoch": 7952} {"train_loss": -27.3200740814209, "global_step": 660025, "epoch": 7952} {"train_loss": -27.647802352905273, "global_step": 660026, "epoch": 7952} {"train_loss": -27.770605087280273, "global_step": 660027, "epoch": 7952} {"train_loss": -28.268661499023438, "global_step": 660028, "epoch": 7952} {"train_loss": -27.86958885192871, "global_step": 660029, "epoch": 7952} {"train_loss": -27.891971588134766, "global_step": 660030, "epoch": 7952} {"train_loss": -28.348539352416992, "global_step": 660031, "epoch": 7952} {"train_loss": -27.633991241455078, "global_step": 660032, "epoch": 7952} {"train_loss": -27.6070499420166, "global_step": 660033, "epoch": 7952} {"train_loss": -27.88393211364746, "global_step": 660034, "epoch": 7952} {"train_loss": -28.201040267944336, "global_step": 660035, "epoch": 7952} {"train_loss": -28.30475425720215, "global_step": 660036, "epoch": 7952} {"train_loss": -28.056379318237305, "global_step": 660037, "epoch": 7952} {"train_loss": -28.25148582458496, "global_step": 660038, "epoch": 7952} {"train_loss": -28.064273834228516, "global_step": 660039, "epoch": 7952} {"train_loss": -28.087909698486328, "global_step": 660040, "epoch": 7952} {"train_loss": -28.389448165893555, "global_step": 660041, "epoch": 7952} {"train_loss": -28.053571701049805, "global_step": 660042, "epoch": 7952} {"train_loss": -27.977407455444336, "global_step": 660043, "epoch": 7952} {"train_loss": -28.269256591796875, "global_step": 660044, "epoch": 7952} {"train_loss": -28.050018310546875, "global_step": 660045, "epoch": 7952} {"train_loss": -28.261213302612305, "global_step": 660046, "epoch": 7952} {"train_loss": -28.1546688079834, "global_step": 660047, "epoch": 7952} {"train_loss": -28.552692413330078, "global_step": 660048, "epoch": 7952} {"train_loss": -28.418750762939453, "global_step": 660049, "epoch": 7952} {"train_loss": -28.63834571838379, "global_step": 660050, "epoch": 7952} {"train_loss": -28.4606990814209, "global_step": 660051, "epoch": 7952} {"train_loss": -28.09296989440918, "global_step": 660052, "epoch": 7952} {"train_loss": -28.197202682495117, "global_step": 660053, "epoch": 7952} {"train_loss": -28.34006690979004, "global_step": 660054, "epoch": 7952} {"train_loss": -28.2382755279541, "global_step": 660055, "epoch": 7952} {"train_loss": -28.044921875, "global_step": 660056, "epoch": 7952} {"train_loss": -28.264387130737305, "global_step": 660057, "epoch": 7952} {"train_loss": -28.2791748046875, "global_step": 660058, "epoch": 7952} {"train_loss": -28.0159854888916, "global_step": 660059, "epoch": 7952} {"train_loss": -27.653934478759766, "global_step": 660060, "epoch": 7952} {"train_loss": -28.222009658813477, "global_step": 660061, "epoch": 7952} {"train_loss": -27.986408233642578, "global_step": 660062, "epoch": 7952} {"train_loss": -27.750965118408203, "global_step": 660063, "epoch": 7952} {"train_loss": -28.286069869995117, "global_step": 660064, "epoch": 7952} {"train_loss": -27.97031593322754, "global_step": 660065, "epoch": 7952} {"train_loss": -27.749832153320312, "global_step": 660066, "epoch": 7952} {"train_loss": -27.83717155456543, "global_step": 660067, "epoch": 7952} {"train_loss": -27.85686683654785, "global_step": 660068, "epoch": 7952} {"train_loss": -28.207263946533203, "global_step": 660069, "epoch": 7952} {"train_loss": -28.433490753173828, "global_step": 660070, "epoch": 7952} {"train_loss": -28.06837272644043, "global_step": 660071, "epoch": 7952} {"train_loss": -27.9401798248291, "global_step": 660072, "epoch": 7952} {"train_loss": -28.17510414123535, "global_step": 660073, "epoch": 7952} {"train_loss": -28.272016525268555, "global_step": 660074, "epoch": 7952} {"train_loss": -28.398609161376953, "global_step": 660075, "epoch": 7952} {"train_loss": -28.42677116394043, "global_step": 660076, "epoch": 7952} {"train_loss": -28.15699577331543, "global_step": 660077, "epoch": 7952} {"train_loss": -28.423542022705078, "global_step": 660078, "epoch": 7952} {"train_loss": -28.627531051635742, "global_step": 660079, "epoch": 7952} {"train_loss": -28.734155654907227, "global_step": 660080, "epoch": 7952} {"train_loss": -28.405195236206055, "global_step": 660081, "epoch": 7952} {"train_loss": -27.734420776367188, "global_step": 660082, "epoch": 7952} {"train_loss": -27.8380126953125, "global_step": 660083, "epoch": 7952} {"train_loss": -27.989673614501953, "global_step": 660084, "epoch": 7952} {"train_loss": -28.358463287353516, "global_step": 660085, "epoch": 7952} {"train_loss": -28.412878036499023, "global_step": 660086, "epoch": 7952} {"train_loss": -28.756559371948242, "global_step": 660087, "epoch": 7952} {"train_loss": -28.15650749206543, "global_step": 660088, "epoch": 7952} {"train_loss": -28.23029899597168, "global_step": 660089, "epoch": 7952} {"train_loss": -28.3738956451416, "global_step": 660090, "epoch": 7952} {"train_loss": -28.609594345092773, "global_step": 660091, "epoch": 7952} {"train_loss": -28.178098678588867, "global_step": 660092, "epoch": 7952} {"train_loss": -28.22003173828125, "global_step": 660093, "epoch": 7952} {"train_loss": -27.84063720703125, "global_step": 660094, "epoch": 7952} {"train_loss": -28.135480880737305, "global_step": 660095, "epoch": 7952} {"train_loss": -28.555133819580078, "global_step": 660096, "epoch": 7952} {"train_loss": -28.6207275390625, "global_step": 660097, "epoch": 7952} {"train_loss": -28.097413350300616, "global_step": 660098, "epoch": 7952, "val_loss": 6832506.5} {"train_loss": -28.109588623046875, "global_step": 660099, "epoch": 7953} {"train_loss": -27.903060913085938, "global_step": 660100, "epoch": 7953} {"train_loss": -27.811477661132812, "global_step": 660101, "epoch": 7953} {"train_loss": -27.501440048217773, "global_step": 660102, "epoch": 7953} {"train_loss": -27.15936851501465, "global_step": 660103, "epoch": 7953} {"train_loss": -27.776479721069336, "global_step": 660104, "epoch": 7953} {"train_loss": -27.693252563476562, "global_step": 660105, "epoch": 7953} {"train_loss": -28.143285751342773, "global_step": 660106, "epoch": 7953} {"train_loss": -28.200830459594727, "global_step": 660107, "epoch": 7953} {"train_loss": -28.177595138549805, "global_step": 660108, "epoch": 7953} {"train_loss": -27.881011962890625, "global_step": 660109, "epoch": 7953} {"train_loss": -28.07840919494629, "global_step": 660110, "epoch": 7953} {"train_loss": -28.013534545898438, "global_step": 660111, "epoch": 7953} {"train_loss": -28.375659942626953, "global_step": 660112, "epoch": 7953} {"train_loss": -28.48113441467285, "global_step": 660113, "epoch": 7953} {"train_loss": -28.276945114135742, "global_step": 660114, "epoch": 7953} {"train_loss": -28.564960479736328, "global_step": 660115, "epoch": 7953} {"train_loss": -28.74995231628418, "global_step": 660116, "epoch": 7953} {"train_loss": -28.382261276245117, "global_step": 660117, "epoch": 7953} {"train_loss": -28.523792266845703, "global_step": 660118, "epoch": 7953} {"train_loss": -28.378644943237305, "global_step": 660119, "epoch": 7953} {"train_loss": -28.414154052734375, "global_step": 660120, "epoch": 7953} {"train_loss": -28.2009220123291, "global_step": 660121, "epoch": 7953} {"train_loss": -28.504079818725586, "global_step": 660122, "epoch": 7953} {"train_loss": -28.32093620300293, "global_step": 660123, "epoch": 7953} {"train_loss": -28.599950790405273, "global_step": 660124, "epoch": 7953} {"train_loss": -28.386938095092773, "global_step": 660125, "epoch": 7953} {"train_loss": -28.50632095336914, "global_step": 660126, "epoch": 7953} {"train_loss": -28.526636123657227, "global_step": 660127, "epoch": 7953} {"train_loss": -28.794309616088867, "global_step": 660128, "epoch": 7953} {"train_loss": -28.470346450805664, "global_step": 660129, "epoch": 7953} {"train_loss": -28.591094970703125, "global_step": 660130, "epoch": 7953} {"train_loss": -28.62790870666504, "global_step": 660131, "epoch": 7953} {"train_loss": -28.664306640625, "global_step": 660132, "epoch": 7953} {"train_loss": -28.32508659362793, "global_step": 660133, "epoch": 7953} {"train_loss": -28.244403839111328, "global_step": 660134, "epoch": 7953} {"train_loss": -28.504911422729492, "global_step": 660135, "epoch": 7953} {"train_loss": -28.54443359375, "global_step": 660136, "epoch": 7953} {"train_loss": -28.508893966674805, "global_step": 660137, "epoch": 7953} {"train_loss": -28.25721549987793, "global_step": 660138, "epoch": 7953} {"train_loss": -28.548553466796875, "global_step": 660139, "epoch": 7953} {"train_loss": -28.81171989440918, "global_step": 660140, "epoch": 7953} {"train_loss": -28.766956329345703, "global_step": 660141, "epoch": 7953} {"train_loss": -28.372486114501953, "global_step": 660142, "epoch": 7953} {"train_loss": -28.66534423828125, "global_step": 660143, "epoch": 7953} {"train_loss": -28.495670318603516, "global_step": 660144, "epoch": 7953} {"train_loss": -28.34115982055664, "global_step": 660145, "epoch": 7953} {"train_loss": -28.363977432250977, "global_step": 660146, "epoch": 7953} {"train_loss": -28.674535751342773, "global_step": 660147, "epoch": 7953} {"train_loss": -28.69876480102539, "global_step": 660148, "epoch": 7953} {"train_loss": -28.4394588470459, "global_step": 660149, "epoch": 7953} {"train_loss": -28.746984481811523, "global_step": 660150, "epoch": 7953} {"train_loss": -28.624149322509766, "global_step": 660151, "epoch": 7953} {"train_loss": -28.678253173828125, "global_step": 660152, "epoch": 7953} {"train_loss": -28.47281265258789, "global_step": 660153, "epoch": 7953} {"train_loss": -28.405664443969727, "global_step": 660154, "epoch": 7953} {"train_loss": -28.5093936920166, "global_step": 660155, "epoch": 7953} {"train_loss": -28.604501724243164, "global_step": 660156, "epoch": 7953} {"train_loss": -28.448999404907227, "global_step": 660157, "epoch": 7953} {"train_loss": -28.51527214050293, "global_step": 660158, "epoch": 7953} {"train_loss": -27.786176681518555, "global_step": 660159, "epoch": 7953} {"train_loss": -27.67523765563965, "global_step": 660160, "epoch": 7953} {"train_loss": -27.380420684814453, "global_step": 660161, "epoch": 7953} {"train_loss": -27.831872940063477, "global_step": 660162, "epoch": 7953} {"train_loss": -27.83839225769043, "global_step": 660163, "epoch": 7953} {"train_loss": -28.236083984375, "global_step": 660164, "epoch": 7953} {"train_loss": -28.412002563476562, "global_step": 660165, "epoch": 7953} {"train_loss": -28.62910270690918, "global_step": 660166, "epoch": 7953} {"train_loss": -28.663381576538086, "global_step": 660167, "epoch": 7953} {"train_loss": -27.89410400390625, "global_step": 660168, "epoch": 7953} {"train_loss": -28.5228271484375, "global_step": 660169, "epoch": 7953} {"train_loss": -27.787704467773438, "global_step": 660170, "epoch": 7953} {"train_loss": -28.341760635375977, "global_step": 660171, "epoch": 7953} {"train_loss": -28.492231369018555, "global_step": 660172, "epoch": 7953} {"train_loss": -28.28449821472168, "global_step": 660173, "epoch": 7953} {"train_loss": -28.7797908782959, "global_step": 660174, "epoch": 7953} {"train_loss": -28.645429611206055, "global_step": 660175, "epoch": 7953} {"train_loss": -28.4130859375, "global_step": 660176, "epoch": 7953} {"train_loss": -28.295469284057617, "global_step": 660177, "epoch": 7953} {"train_loss": -28.553146362304688, "global_step": 660178, "epoch": 7953} {"train_loss": -28.291702270507812, "global_step": 660179, "epoch": 7953} {"train_loss": -27.988250732421875, "global_step": 660180, "epoch": 7953} {"train_loss": -28.327164983174885, "global_step": 660181, "epoch": 7953, "val_loss": 6707293.5} {"train_loss": -27.8428897857666, "global_step": 660182, "epoch": 7954} {"train_loss": -27.50391960144043, "global_step": 660183, "epoch": 7954} {"train_loss": -28.114660263061523, "global_step": 660184, "epoch": 7954} {"train_loss": -27.251195907592773, "global_step": 660185, "epoch": 7954} {"train_loss": -28.067480087280273, "global_step": 660186, "epoch": 7954} {"train_loss": -27.718215942382812, "global_step": 660187, "epoch": 7954} {"train_loss": -27.421823501586914, "global_step": 660188, "epoch": 7954} {"train_loss": -27.818090438842773, "global_step": 660189, "epoch": 7954} {"train_loss": -27.93848991394043, "global_step": 660190, "epoch": 7954} {"train_loss": -27.642425537109375, "global_step": 660191, "epoch": 7954} {"train_loss": -28.184350967407227, "global_step": 660192, "epoch": 7954} {"train_loss": -27.697378158569336, "global_step": 660193, "epoch": 7954} {"train_loss": -28.378894805908203, "global_step": 660194, "epoch": 7954} {"train_loss": -28.172134399414062, "global_step": 660195, "epoch": 7954} {"train_loss": -27.984878540039062, "global_step": 660196, "epoch": 7954} {"train_loss": -28.113718032836914, "global_step": 660197, "epoch": 7954} {"train_loss": -28.187284469604492, "global_step": 660198, "epoch": 7954} {"train_loss": -28.28623390197754, "global_step": 660199, "epoch": 7954} {"train_loss": -28.121204376220703, "global_step": 660200, "epoch": 7954} {"train_loss": -28.467945098876953, "global_step": 660201, "epoch": 7954} {"train_loss": -28.34635353088379, "global_step": 660202, "epoch": 7954} {"train_loss": -28.684940338134766, "global_step": 660203, "epoch": 7954} {"train_loss": -28.446149826049805, "global_step": 660204, "epoch": 7954} {"train_loss": -28.281179428100586, "global_step": 660205, "epoch": 7954} {"train_loss": -28.268798828125, "global_step": 660206, "epoch": 7954} {"train_loss": -28.304718017578125, "global_step": 660207, "epoch": 7954} {"train_loss": -28.621198654174805, "global_step": 660208, "epoch": 7954} {"train_loss": -28.266284942626953, "global_step": 660209, "epoch": 7954} {"train_loss": -28.15966796875, "global_step": 660210, "epoch": 7954} {"train_loss": -28.290740966796875, "global_step": 660211, "epoch": 7954} {"train_loss": -28.508804321289062, "global_step": 660212, "epoch": 7954} {"train_loss": -28.501188278198242, "global_step": 660213, "epoch": 7954} {"train_loss": -28.83155632019043, "global_step": 660214, "epoch": 7954} {"train_loss": -28.31512451171875, "global_step": 660215, "epoch": 7954} {"train_loss": -28.353168487548828, "global_step": 660216, "epoch": 7954} {"train_loss": -28.082983016967773, "global_step": 660217, "epoch": 7954} {"train_loss": -28.564184188842773, "global_step": 660218, "epoch": 7954} {"train_loss": -28.47580909729004, "global_step": 660219, "epoch": 7954} {"train_loss": -28.195234298706055, "global_step": 660220, "epoch": 7954} {"train_loss": -28.002243041992188, "global_step": 660221, "epoch": 7954} {"train_loss": -28.43731689453125, "global_step": 660222, "epoch": 7954} {"train_loss": -28.33731460571289, "global_step": 660223, "epoch": 7954} {"train_loss": -28.493818283081055, "global_step": 660224, "epoch": 7954} {"train_loss": -28.393163681030273, "global_step": 660225, "epoch": 7954} {"train_loss": -28.140466690063477, "global_step": 660226, "epoch": 7954} {"train_loss": -28.03569984436035, "global_step": 660227, "epoch": 7954} {"train_loss": -28.107980728149414, "global_step": 660228, "epoch": 7954} {"train_loss": -28.501373291015625, "global_step": 660229, "epoch": 7954} {"train_loss": -28.362104415893555, "global_step": 660230, "epoch": 7954} {"train_loss": -28.562286376953125, "global_step": 660231, "epoch": 7954} {"train_loss": -28.46088981628418, "global_step": 660232, "epoch": 7954} {"train_loss": -28.42085838317871, "global_step": 660233, "epoch": 7954} {"train_loss": -28.51605224609375, "global_step": 660234, "epoch": 7954} {"train_loss": -28.213977813720703, "global_step": 660235, "epoch": 7954} {"train_loss": -28.647024154663086, "global_step": 660236, "epoch": 7954} {"train_loss": -28.133237838745117, "global_step": 660237, "epoch": 7954} {"train_loss": -28.205549240112305, "global_step": 660238, "epoch": 7954} {"train_loss": -28.39667320251465, "global_step": 660239, "epoch": 7954} {"train_loss": -28.4999942779541, "global_step": 660240, "epoch": 7954} {"train_loss": -28.423303604125977, "global_step": 660241, "epoch": 7954} {"train_loss": -28.487512588500977, "global_step": 660242, "epoch": 7954} {"train_loss": -28.784326553344727, "global_step": 660243, "epoch": 7954} {"train_loss": -28.42145347595215, "global_step": 660244, "epoch": 7954} {"train_loss": -28.265396118164062, "global_step": 660245, "epoch": 7954} {"train_loss": -28.69378662109375, "global_step": 660246, "epoch": 7954} {"train_loss": -28.823720932006836, "global_step": 660247, "epoch": 7954} {"train_loss": -28.405364990234375, "global_step": 660248, "epoch": 7954} {"train_loss": -28.126113891601562, "global_step": 660249, "epoch": 7954} {"train_loss": -27.97420310974121, "global_step": 660250, "epoch": 7954} {"train_loss": -28.09112548828125, "global_step": 660251, "epoch": 7954} {"train_loss": -28.497425079345703, "global_step": 660252, "epoch": 7954} {"train_loss": -28.390104293823242, "global_step": 660253, "epoch": 7954} {"train_loss": -28.463964462280273, "global_step": 660254, "epoch": 7954} {"train_loss": -28.59382438659668, "global_step": 660255, "epoch": 7954} {"train_loss": -28.466760635375977, "global_step": 660256, "epoch": 7954} {"train_loss": -28.8371524810791, "global_step": 660257, "epoch": 7954} {"train_loss": -28.520132064819336, "global_step": 660258, "epoch": 7954} {"train_loss": -28.35793113708496, "global_step": 660259, "epoch": 7954} {"train_loss": -28.563079833984375, "global_step": 660260, "epoch": 7954} {"train_loss": -28.626861572265625, "global_step": 660261, "epoch": 7954} {"train_loss": -28.446744918823242, "global_step": 660262, "epoch": 7954} {"train_loss": -28.6230411529541, "global_step": 660263, "epoch": 7954} {"train_loss": -28.311126640044062, "global_step": 660264, "epoch": 7954, "val_loss": 6828651.0} {"train_loss": -27.76171875, "global_step": 660265, "epoch": 7955} {"train_loss": -27.371417999267578, "global_step": 660266, "epoch": 7955} {"train_loss": -27.580495834350586, "global_step": 660267, "epoch": 7955} {"train_loss": -27.068151473999023, "global_step": 660268, "epoch": 7955} {"train_loss": -27.12139892578125, "global_step": 660269, "epoch": 7955} {"train_loss": -27.22467613220215, "global_step": 660270, "epoch": 7955} {"train_loss": -27.652021408081055, "global_step": 660271, "epoch": 7955} {"train_loss": -25.326040267944336, "global_step": 660272, "epoch": 7955} {"train_loss": -27.14359474182129, "global_step": 660273, "epoch": 7955} {"train_loss": -27.817657470703125, "global_step": 660274, "epoch": 7955} {"train_loss": -27.024213790893555, "global_step": 660275, "epoch": 7955} {"train_loss": -27.944915771484375, "global_step": 660276, "epoch": 7955} {"train_loss": -27.85089683532715, "global_step": 660277, "epoch": 7955} {"train_loss": -27.3305721282959, "global_step": 660278, "epoch": 7955} {"train_loss": -28.08014488220215, "global_step": 660279, "epoch": 7955} {"train_loss": -27.80213737487793, "global_step": 660280, "epoch": 7955} {"train_loss": -28.289472579956055, "global_step": 660281, "epoch": 7955} {"train_loss": -28.02740478515625, "global_step": 660282, "epoch": 7955} {"train_loss": -28.345413208007812, "global_step": 660283, "epoch": 7955} {"train_loss": -27.602399826049805, "global_step": 660284, "epoch": 7955} {"train_loss": -28.073373794555664, "global_step": 660285, "epoch": 7955} {"train_loss": -28.018905639648438, "global_step": 660286, "epoch": 7955} {"train_loss": -28.112518310546875, "global_step": 660287, "epoch": 7955} {"train_loss": -27.87053871154785, "global_step": 660288, "epoch": 7955} {"train_loss": -27.8651123046875, "global_step": 660289, "epoch": 7955} {"train_loss": -27.99979591369629, "global_step": 660290, "epoch": 7955} {"train_loss": -27.861862182617188, "global_step": 660291, "epoch": 7955} {"train_loss": -27.959020614624023, "global_step": 660292, "epoch": 7955} {"train_loss": -27.874555587768555, "global_step": 660293, "epoch": 7955} {"train_loss": -28.11297607421875, "global_step": 660294, "epoch": 7955} {"train_loss": -28.39777183532715, "global_step": 660295, "epoch": 7955} {"train_loss": -28.357175827026367, "global_step": 660296, "epoch": 7955} {"train_loss": -27.932912826538086, "global_step": 660297, "epoch": 7955} {"train_loss": -28.368885040283203, "global_step": 660298, "epoch": 7955} {"train_loss": -28.180219650268555, "global_step": 660299, "epoch": 7955} {"train_loss": -28.28635597229004, "global_step": 660300, "epoch": 7955} {"train_loss": -28.2567195892334, "global_step": 660301, "epoch": 7955} {"train_loss": -28.347265243530273, "global_step": 660302, "epoch": 7955} {"train_loss": -28.36895179748535, "global_step": 660303, "epoch": 7955} {"train_loss": -28.6766300201416, "global_step": 660304, "epoch": 7955} {"train_loss": -28.353742599487305, "global_step": 660305, "epoch": 7955} {"train_loss": -28.442480087280273, "global_step": 660306, "epoch": 7955} {"train_loss": -28.646347045898438, "global_step": 660307, "epoch": 7955} {"train_loss": -28.2655029296875, "global_step": 660308, "epoch": 7955} {"train_loss": -28.43995475769043, "global_step": 660309, "epoch": 7955} {"train_loss": -28.434192657470703, "global_step": 660310, "epoch": 7955} {"train_loss": -28.334768295288086, "global_step": 660311, "epoch": 7955} {"train_loss": -28.90228271484375, "global_step": 660312, "epoch": 7955} {"train_loss": -28.388341903686523, "global_step": 660313, "epoch": 7955} {"train_loss": -28.805265426635742, "global_step": 660314, "epoch": 7955} {"train_loss": -28.645477294921875, "global_step": 660315, "epoch": 7955} {"train_loss": -28.800113677978516, "global_step": 660316, "epoch": 7955} {"train_loss": -28.702009201049805, "global_step": 660317, "epoch": 7955} {"train_loss": -28.37040138244629, "global_step": 660318, "epoch": 7955} {"train_loss": -29.11146354675293, "global_step": 660319, "epoch": 7955} {"train_loss": -28.394987106323242, "global_step": 660320, "epoch": 7955} {"train_loss": -28.32509422302246, "global_step": 660321, "epoch": 7955} {"train_loss": -28.533308029174805, "global_step": 660322, "epoch": 7955} {"train_loss": -28.6200008392334, "global_step": 660323, "epoch": 7955} {"train_loss": -28.816574096679688, "global_step": 660324, "epoch": 7955} {"train_loss": -28.91914176940918, "global_step": 660325, "epoch": 7955} {"train_loss": -28.616363525390625, "global_step": 660326, "epoch": 7955} {"train_loss": -28.587055206298828, "global_step": 660327, "epoch": 7955} {"train_loss": -28.186145782470703, "global_step": 660328, "epoch": 7955} {"train_loss": -28.4545955657959, "global_step": 660329, "epoch": 7955} {"train_loss": -28.721649169921875, "global_step": 660330, "epoch": 7955} {"train_loss": -28.255416870117188, "global_step": 660331, "epoch": 7955} {"train_loss": -28.153095245361328, "global_step": 660332, "epoch": 7955} {"train_loss": -28.491479873657227, "global_step": 660333, "epoch": 7955} {"train_loss": -28.12262535095215, "global_step": 660334, "epoch": 7955} {"train_loss": -28.392969131469727, "global_step": 660335, "epoch": 7955} {"train_loss": -28.283954620361328, "global_step": 660336, "epoch": 7955} {"train_loss": -27.919897079467773, "global_step": 660337, "epoch": 7955} {"train_loss": -27.85285758972168, "global_step": 660338, "epoch": 7955} {"train_loss": -26.926984786987305, "global_step": 660339, "epoch": 7955} {"train_loss": -25.605640411376953, "global_step": 660340, "epoch": 7955} {"train_loss": -27.629749298095703, "global_step": 660341, "epoch": 7955} {"train_loss": -27.7299861907959, "global_step": 660342, "epoch": 7955} {"train_loss": -26.93854331970215, "global_step": 660343, "epoch": 7955} {"train_loss": -27.751489639282227, "global_step": 660344, "epoch": 7955} {"train_loss": -27.48095703125, "global_step": 660345, "epoch": 7955} {"train_loss": -28.275226593017578, "global_step": 660346, "epoch": 7955} {"train_loss": -28.04834230262113, "global_step": 660347, "epoch": 7955, "val_loss": 6880780.0} {"train_loss": -25.82485008239746, "global_step": 660348, "epoch": 7956} {"train_loss": -26.884796142578125, "global_step": 660349, "epoch": 7956} {"train_loss": -26.776386260986328, "global_step": 660350, "epoch": 7956} {"train_loss": -26.551111221313477, "global_step": 660351, "epoch": 7956} {"train_loss": -26.59737205505371, "global_step": 660352, "epoch": 7956} {"train_loss": -27.01637077331543, "global_step": 660353, "epoch": 7956} {"train_loss": -27.292264938354492, "global_step": 660354, "epoch": 7956} {"train_loss": -27.084707260131836, "global_step": 660355, "epoch": 7956} {"train_loss": -26.77889060974121, "global_step": 660356, "epoch": 7956} {"train_loss": -27.30970573425293, "global_step": 660357, "epoch": 7956} {"train_loss": -26.979482650756836, "global_step": 660358, "epoch": 7956} {"train_loss": -27.27507972717285, "global_step": 660359, "epoch": 7956} {"train_loss": -27.491321563720703, "global_step": 660360, "epoch": 7956} {"train_loss": -27.10162925720215, "global_step": 660361, "epoch": 7956} {"train_loss": -27.442914962768555, "global_step": 660362, "epoch": 7956} {"train_loss": -27.412616729736328, "global_step": 660363, "epoch": 7956} {"train_loss": -27.45627784729004, "global_step": 660364, "epoch": 7956} {"train_loss": -27.903791427612305, "global_step": 660365, "epoch": 7956} {"train_loss": -27.617414474487305, "global_step": 660366, "epoch": 7956} {"train_loss": -27.653379440307617, "global_step": 660367, "epoch": 7956} {"train_loss": -27.728057861328125, "global_step": 660368, "epoch": 7956} {"train_loss": -27.69843864440918, "global_step": 660369, "epoch": 7956} {"train_loss": -28.201995849609375, "global_step": 660370, "epoch": 7956} {"train_loss": -27.560958862304688, "global_step": 660371, "epoch": 7956} {"train_loss": -27.67768669128418, "global_step": 660372, "epoch": 7956} {"train_loss": -27.80865478515625, "global_step": 660373, "epoch": 7956} {"train_loss": -27.87160301208496, "global_step": 660374, "epoch": 7956} {"train_loss": -28.042383193969727, "global_step": 660375, "epoch": 7956} {"train_loss": -27.873950958251953, "global_step": 660376, "epoch": 7956} {"train_loss": -27.851415634155273, "global_step": 660377, "epoch": 7956} {"train_loss": -27.94906997680664, "global_step": 660378, "epoch": 7956} {"train_loss": -28.003686904907227, "global_step": 660379, "epoch": 7956} {"train_loss": -27.80582046508789, "global_step": 660380, "epoch": 7956} {"train_loss": -27.996747970581055, "global_step": 660381, "epoch": 7956} {"train_loss": -27.864065170288086, "global_step": 660382, "epoch": 7956} {"train_loss": -28.17533302307129, "global_step": 660383, "epoch": 7956} {"train_loss": -27.66547203063965, "global_step": 660384, "epoch": 7956} {"train_loss": -28.51017189025879, "global_step": 660385, "epoch": 7956} {"train_loss": -28.322708129882812, "global_step": 660386, "epoch": 7956} {"train_loss": -28.339685440063477, "global_step": 660387, "epoch": 7956} {"train_loss": -28.03069496154785, "global_step": 660388, "epoch": 7956} {"train_loss": -27.99212646484375, "global_step": 660389, "epoch": 7956} {"train_loss": -28.524734497070312, "global_step": 660390, "epoch": 7956} {"train_loss": -28.195432662963867, "global_step": 660391, "epoch": 7956} {"train_loss": -28.01800537109375, "global_step": 660392, "epoch": 7956} {"train_loss": -28.611921310424805, "global_step": 660393, "epoch": 7956} {"train_loss": -28.22406005859375, "global_step": 660394, "epoch": 7956} {"train_loss": -28.30712890625, "global_step": 660395, "epoch": 7956} {"train_loss": -28.255163192749023, "global_step": 660396, "epoch": 7956} {"train_loss": -28.2722110748291, "global_step": 660397, "epoch": 7956} {"train_loss": -28.31915855407715, "global_step": 660398, "epoch": 7956} {"train_loss": -28.27862548828125, "global_step": 660399, "epoch": 7956} {"train_loss": -28.650293350219727, "global_step": 660400, "epoch": 7956} {"train_loss": -28.603696823120117, "global_step": 660401, "epoch": 7956} {"train_loss": -28.51344108581543, "global_step": 660402, "epoch": 7956} {"train_loss": -28.671903610229492, "global_step": 660403, "epoch": 7956} {"train_loss": -28.407445907592773, "global_step": 660404, "epoch": 7956} {"train_loss": -28.644113540649414, "global_step": 660405, "epoch": 7956} {"train_loss": -28.64822769165039, "global_step": 660406, "epoch": 7956} {"train_loss": -28.300107955932617, "global_step": 660407, "epoch": 7956} {"train_loss": -28.442203521728516, "global_step": 660408, "epoch": 7956} {"train_loss": -28.798242568969727, "global_step": 660409, "epoch": 7956} {"train_loss": -28.6281681060791, "global_step": 660410, "epoch": 7956} {"train_loss": -28.73552894592285, "global_step": 660411, "epoch": 7956} {"train_loss": -28.456348419189453, "global_step": 660412, "epoch": 7956} {"train_loss": -28.532217025756836, "global_step": 660413, "epoch": 7956} {"train_loss": -28.912439346313477, "global_step": 660414, "epoch": 7956} {"train_loss": -28.301313400268555, "global_step": 660415, "epoch": 7956} {"train_loss": -28.368305206298828, "global_step": 660416, "epoch": 7956} {"train_loss": -28.406558990478516, "global_step": 660417, "epoch": 7956} {"train_loss": -28.883136749267578, "global_step": 660418, "epoch": 7956} {"train_loss": -28.511138916015625, "global_step": 660419, "epoch": 7956} {"train_loss": -28.49445915222168, "global_step": 660420, "epoch": 7956} {"train_loss": -28.321210861206055, "global_step": 660421, "epoch": 7956} {"train_loss": -28.75201416015625, "global_step": 660422, "epoch": 7956} {"train_loss": -28.629730224609375, "global_step": 660423, "epoch": 7956} {"train_loss": -28.485254287719727, "global_step": 660424, "epoch": 7956} {"train_loss": -28.654565811157227, "global_step": 660425, "epoch": 7956} {"train_loss": -28.552658081054688, "global_step": 660426, "epoch": 7956} {"train_loss": -28.831268310546875, "global_step": 660427, "epoch": 7956} {"train_loss": -28.547056198120117, "global_step": 660428, "epoch": 7956} {"train_loss": -28.7845458984375, "global_step": 660429, "epoch": 7956} {"train_loss": -28.022677708821124, "global_step": 660430, "epoch": 7956, "val_loss": 6862862.0} {"train_loss": -27.971948623657227, "global_step": 660431, "epoch": 7957} {"train_loss": -27.476577758789062, "global_step": 660432, "epoch": 7957} {"train_loss": -26.988080978393555, "global_step": 660433, "epoch": 7957} {"train_loss": -27.044626235961914, "global_step": 660434, "epoch": 7957} {"train_loss": -27.619007110595703, "global_step": 660435, "epoch": 7957} {"train_loss": -27.651554107666016, "global_step": 660436, "epoch": 7957} {"train_loss": -27.616575241088867, "global_step": 660437, "epoch": 7957} {"train_loss": -27.11506462097168, "global_step": 660438, "epoch": 7957} {"train_loss": -28.050296783447266, "global_step": 660439, "epoch": 7957} {"train_loss": -27.3435115814209, "global_step": 660440, "epoch": 7957} {"train_loss": -27.181079864501953, "global_step": 660441, "epoch": 7957} {"train_loss": -27.917194366455078, "global_step": 660442, "epoch": 7957} {"train_loss": -28.22635269165039, "global_step": 660443, "epoch": 7957} {"train_loss": -27.30904197692871, "global_step": 660444, "epoch": 7957} {"train_loss": -27.755878448486328, "global_step": 660445, "epoch": 7957} {"train_loss": -27.52985191345215, "global_step": 660446, "epoch": 7957} {"train_loss": -27.855865478515625, "global_step": 660447, "epoch": 7957} {"train_loss": -27.9024715423584, "global_step": 660448, "epoch": 7957} {"train_loss": -28.055688858032227, "global_step": 660449, "epoch": 7957} {"train_loss": -28.356689453125, "global_step": 660450, "epoch": 7957} {"train_loss": -28.28516960144043, "global_step": 660451, "epoch": 7957} {"train_loss": -28.028888702392578, "global_step": 660452, "epoch": 7957} {"train_loss": -28.410131454467773, "global_step": 660453, "epoch": 7957} {"train_loss": -28.731836318969727, "global_step": 660454, "epoch": 7957} {"train_loss": -27.888992309570312, "global_step": 660455, "epoch": 7957} {"train_loss": -28.79262351989746, "global_step": 660456, "epoch": 7957} {"train_loss": -27.885473251342773, "global_step": 660457, "epoch": 7957} {"train_loss": -28.3865966796875, "global_step": 660458, "epoch": 7957} {"train_loss": -28.196935653686523, "global_step": 660459, "epoch": 7957} {"train_loss": -28.10090446472168, "global_step": 660460, "epoch": 7957} {"train_loss": -28.08624267578125, "global_step": 660461, "epoch": 7957} {"train_loss": -28.23569107055664, "global_step": 660462, "epoch": 7957} {"train_loss": -28.50752067565918, "global_step": 660463, "epoch": 7957} {"train_loss": -28.29230308532715, "global_step": 660464, "epoch": 7957} {"train_loss": -28.08540153503418, "global_step": 660465, "epoch": 7957} {"train_loss": -28.328271865844727, "global_step": 660466, "epoch": 7957} {"train_loss": -28.392873764038086, "global_step": 660467, "epoch": 7957} {"train_loss": -28.02566909790039, "global_step": 660468, "epoch": 7957} {"train_loss": -28.38690757751465, "global_step": 660469, "epoch": 7957} {"train_loss": -28.432342529296875, "global_step": 660470, "epoch": 7957} {"train_loss": -28.079029083251953, "global_step": 660471, "epoch": 7957} {"train_loss": -28.493392944335938, "global_step": 660472, "epoch": 7957} {"train_loss": -28.0396728515625, "global_step": 660473, "epoch": 7957} {"train_loss": -27.968952178955078, "global_step": 660474, "epoch": 7957} {"train_loss": -28.37236976623535, "global_step": 660475, "epoch": 7957} {"train_loss": -28.38202476501465, "global_step": 660476, "epoch": 7957} {"train_loss": -28.5476016998291, "global_step": 660477, "epoch": 7957} {"train_loss": -28.275440216064453, "global_step": 660478, "epoch": 7957} {"train_loss": -28.300214767456055, "global_step": 660479, "epoch": 7957} {"train_loss": -28.318912506103516, "global_step": 660480, "epoch": 7957} {"train_loss": -27.912763595581055, "global_step": 660481, "epoch": 7957} {"train_loss": -28.13088035583496, "global_step": 660482, "epoch": 7957} {"train_loss": -28.002588272094727, "global_step": 660483, "epoch": 7957} {"train_loss": -27.621570587158203, "global_step": 660484, "epoch": 7957} {"train_loss": -28.4219970703125, "global_step": 660485, "epoch": 7957} {"train_loss": -28.638330459594727, "global_step": 660486, "epoch": 7957} {"train_loss": -27.489835739135742, "global_step": 660487, "epoch": 7957} {"train_loss": -27.71827507019043, "global_step": 660488, "epoch": 7957} {"train_loss": -28.398168563842773, "global_step": 660489, "epoch": 7957} {"train_loss": -28.169843673706055, "global_step": 660490, "epoch": 7957} {"train_loss": -28.357196807861328, "global_step": 660491, "epoch": 7957} {"train_loss": -28.368789672851562, "global_step": 660492, "epoch": 7957} {"train_loss": -28.207599639892578, "global_step": 660493, "epoch": 7957} {"train_loss": -28.165714263916016, "global_step": 660494, "epoch": 7957} {"train_loss": -28.391727447509766, "global_step": 660495, "epoch": 7957} {"train_loss": -28.019384384155273, "global_step": 660496, "epoch": 7957} {"train_loss": -28.145404815673828, "global_step": 660497, "epoch": 7957} {"train_loss": -28.41132926940918, "global_step": 660498, "epoch": 7957} {"train_loss": -28.290319442749023, "global_step": 660499, "epoch": 7957} {"train_loss": -28.51380729675293, "global_step": 660500, "epoch": 7957} {"train_loss": -28.431589126586914, "global_step": 660501, "epoch": 7957} {"train_loss": -28.672760009765625, "global_step": 660502, "epoch": 7957} {"train_loss": -28.6975040435791, "global_step": 660503, "epoch": 7957} {"train_loss": -28.612537384033203, "global_step": 660504, "epoch": 7957} {"train_loss": -28.288257598876953, "global_step": 660505, "epoch": 7957} {"train_loss": -28.391138076782227, "global_step": 660506, "epoch": 7957} {"train_loss": -28.36260986328125, "global_step": 660507, "epoch": 7957} {"train_loss": -28.518939971923828, "global_step": 660508, "epoch": 7957} {"train_loss": -28.444738388061523, "global_step": 660509, "epoch": 7957} {"train_loss": -28.3033390045166, "global_step": 660510, "epoch": 7957} {"train_loss": -28.304676055908203, "global_step": 660511, "epoch": 7957} {"train_loss": -28.617145538330078, "global_step": 660512, "epoch": 7957} {"train_loss": -28.140700351761048, "global_step": 660513, "epoch": 7957, "val_loss": 6781756.0} {"train_loss": -27.8933048248291, "global_step": 660514, "epoch": 7958} {"train_loss": -28.13556480407715, "global_step": 660515, "epoch": 7958} {"train_loss": -28.23284912109375, "global_step": 660516, "epoch": 7958} {"train_loss": -27.71689224243164, "global_step": 660517, "epoch": 7958} {"train_loss": -28.000925064086914, "global_step": 660518, "epoch": 7958} {"train_loss": -27.604276657104492, "global_step": 660519, "epoch": 7958} {"train_loss": -27.641992568969727, "global_step": 660520, "epoch": 7958} {"train_loss": -27.731115341186523, "global_step": 660521, "epoch": 7958} {"train_loss": -28.05322265625, "global_step": 660522, "epoch": 7958} {"train_loss": -27.80585289001465, "global_step": 660523, "epoch": 7958} {"train_loss": -27.816104888916016, "global_step": 660524, "epoch": 7958} {"train_loss": -28.072036743164062, "global_step": 660525, "epoch": 7958} {"train_loss": -27.521759033203125, "global_step": 660526, "epoch": 7958} {"train_loss": -27.7508544921875, "global_step": 660527, "epoch": 7958} {"train_loss": -28.06292724609375, "global_step": 660528, "epoch": 7958} {"train_loss": -27.8571720123291, "global_step": 660529, "epoch": 7958} {"train_loss": -27.376550674438477, "global_step": 660530, "epoch": 7958} {"train_loss": -28.281198501586914, "global_step": 660531, "epoch": 7958} {"train_loss": -27.587278366088867, "global_step": 660532, "epoch": 7958} {"train_loss": -28.17728042602539, "global_step": 660533, "epoch": 7958} {"train_loss": -27.893985748291016, "global_step": 660534, "epoch": 7958} {"train_loss": -27.646772384643555, "global_step": 660535, "epoch": 7958} {"train_loss": -28.1555233001709, "global_step": 660536, "epoch": 7958} {"train_loss": -28.290307998657227, "global_step": 660537, "epoch": 7958} {"train_loss": -27.848621368408203, "global_step": 660538, "epoch": 7958} {"train_loss": -27.921354293823242, "global_step": 660539, "epoch": 7958} {"train_loss": -28.282377243041992, "global_step": 660540, "epoch": 7958} {"train_loss": -28.052778244018555, "global_step": 660541, "epoch": 7958} {"train_loss": -28.069183349609375, "global_step": 660542, "epoch": 7958} {"train_loss": -27.9774227142334, "global_step": 660543, "epoch": 7958} {"train_loss": -28.090164184570312, "global_step": 660544, "epoch": 7958} {"train_loss": -28.20050621032715, "global_step": 660545, "epoch": 7958} {"train_loss": -28.08057975769043, "global_step": 660546, "epoch": 7958} {"train_loss": -28.427627563476562, "global_step": 660547, "epoch": 7958} {"train_loss": -28.348066329956055, "global_step": 660548, "epoch": 7958} {"train_loss": -28.16546058654785, "global_step": 660549, "epoch": 7958} {"train_loss": -28.15423583984375, "global_step": 660550, "epoch": 7958} {"train_loss": -28.409631729125977, "global_step": 660551, "epoch": 7958} {"train_loss": -28.357786178588867, "global_step": 660552, "epoch": 7958} {"train_loss": -28.2200984954834, "global_step": 660553, "epoch": 7958} {"train_loss": -28.28534507751465, "global_step": 660554, "epoch": 7958} {"train_loss": -28.153478622436523, "global_step": 660555, "epoch": 7958} {"train_loss": -28.251779556274414, "global_step": 660556, "epoch": 7958} {"train_loss": -28.272375106811523, "global_step": 660557, "epoch": 7958} {"train_loss": -28.413434982299805, "global_step": 660558, "epoch": 7958} {"train_loss": -28.21234130859375, "global_step": 660559, "epoch": 7958} {"train_loss": -28.804763793945312, "global_step": 660560, "epoch": 7958} {"train_loss": -29.12761878967285, "global_step": 660561, "epoch": 7958} {"train_loss": -28.53261375427246, "global_step": 660562, "epoch": 7958} {"train_loss": -28.889127731323242, "global_step": 660563, "epoch": 7958} {"train_loss": -28.5811824798584, "global_step": 660564, "epoch": 7958} {"train_loss": -28.357894897460938, "global_step": 660565, "epoch": 7958} {"train_loss": -28.1529541015625, "global_step": 660566, "epoch": 7958} {"train_loss": -28.491018295288086, "global_step": 660567, "epoch": 7958} {"train_loss": -28.58095359802246, "global_step": 660568, "epoch": 7958} {"train_loss": -28.810773849487305, "global_step": 660569, "epoch": 7958} {"train_loss": -28.708799362182617, "global_step": 660570, "epoch": 7958} {"train_loss": -28.916168212890625, "global_step": 660571, "epoch": 7958} {"train_loss": -28.268720626831055, "global_step": 660572, "epoch": 7958} {"train_loss": -28.185169219970703, "global_step": 660573, "epoch": 7958} {"train_loss": -28.18075942993164, "global_step": 660574, "epoch": 7958} {"train_loss": -27.700714111328125, "global_step": 660575, "epoch": 7958} {"train_loss": -27.063135147094727, "global_step": 660576, "epoch": 7958} {"train_loss": -25.804914474487305, "global_step": 660577, "epoch": 7958} {"train_loss": -25.104995727539062, "global_step": 660578, "epoch": 7958} {"train_loss": -27.6123046875, "global_step": 660579, "epoch": 7958} {"train_loss": -26.77005958557129, "global_step": 660580, "epoch": 7958} {"train_loss": -26.701257705688477, "global_step": 660581, "epoch": 7958} {"train_loss": -27.612659454345703, "global_step": 660582, "epoch": 7958} {"train_loss": -27.485532760620117, "global_step": 660583, "epoch": 7958} {"train_loss": -27.73331642150879, "global_step": 660584, "epoch": 7958} {"train_loss": -27.98257827758789, "global_step": 660585, "epoch": 7958} {"train_loss": -26.984909057617188, "global_step": 660586, "epoch": 7958} {"train_loss": -27.539392471313477, "global_step": 660587, "epoch": 7958} {"train_loss": -28.09803581237793, "global_step": 660588, "epoch": 7958} {"train_loss": -27.06487464904785, "global_step": 660589, "epoch": 7958} {"train_loss": -28.0858211517334, "global_step": 660590, "epoch": 7958} {"train_loss": -27.81708335876465, "global_step": 660591, "epoch": 7958} {"train_loss": -28.088153839111328, "global_step": 660592, "epoch": 7958} {"train_loss": -27.966552734375, "global_step": 660593, "epoch": 7958} {"train_loss": -27.919477462768555, "global_step": 660594, "epoch": 7958} {"train_loss": -28.135562896728516, "global_step": 660595, "epoch": 7958} {"train_loss": -27.957878963056817, "global_step": 660596, "epoch": 7958, "val_loss": 6831875.5} {"train_loss": -27.1639461517334, "global_step": 660597, "epoch": 7959} {"train_loss": -26.23073387145996, "global_step": 660598, "epoch": 7959} {"train_loss": -26.604969024658203, "global_step": 660599, "epoch": 7959} {"train_loss": -27.550745010375977, "global_step": 660600, "epoch": 7959} {"train_loss": -26.725317001342773, "global_step": 660601, "epoch": 7959} {"train_loss": -27.655517578125, "global_step": 660602, "epoch": 7959} {"train_loss": -26.75946617126465, "global_step": 660603, "epoch": 7959} {"train_loss": -27.57039451599121, "global_step": 660604, "epoch": 7959} {"train_loss": -26.796064376831055, "global_step": 660605, "epoch": 7959} {"train_loss": -27.653295516967773, "global_step": 660606, "epoch": 7959} {"train_loss": -27.0339412689209, "global_step": 660607, "epoch": 7959} {"train_loss": -27.371366500854492, "global_step": 660608, "epoch": 7959} {"train_loss": -27.612354278564453, "global_step": 660609, "epoch": 7959} {"train_loss": -27.3570499420166, "global_step": 660610, "epoch": 7959} {"train_loss": -27.39176368713379, "global_step": 660611, "epoch": 7959} {"train_loss": -27.68381118774414, "global_step": 660612, "epoch": 7959} {"train_loss": -27.892675399780273, "global_step": 660613, "epoch": 7959} {"train_loss": -27.60947608947754, "global_step": 660614, "epoch": 7959} {"train_loss": -27.992786407470703, "global_step": 660615, "epoch": 7959} {"train_loss": -27.969650268554688, "global_step": 660616, "epoch": 7959} {"train_loss": -27.404647827148438, "global_step": 660617, "epoch": 7959} {"train_loss": -27.818653106689453, "global_step": 660618, "epoch": 7959} {"train_loss": -27.871152877807617, "global_step": 660619, "epoch": 7959} {"train_loss": -27.909765243530273, "global_step": 660620, "epoch": 7959} {"train_loss": -28.045886993408203, "global_step": 660621, "epoch": 7959} {"train_loss": -28.36512565612793, "global_step": 660622, "epoch": 7959} {"train_loss": -28.259586334228516, "global_step": 660623, "epoch": 7959} {"train_loss": -28.204980850219727, "global_step": 660624, "epoch": 7959} {"train_loss": -28.20599937438965, "global_step": 660625, "epoch": 7959} {"train_loss": -28.275373458862305, "global_step": 660626, "epoch": 7959} {"train_loss": -28.31585121154785, "global_step": 660627, "epoch": 7959} {"train_loss": -28.01327896118164, "global_step": 660628, "epoch": 7959} {"train_loss": -28.17466163635254, "global_step": 660629, "epoch": 7959} {"train_loss": -28.0008487701416, "global_step": 660630, "epoch": 7959} {"train_loss": -28.281539916992188, "global_step": 660631, "epoch": 7959} {"train_loss": -28.44220542907715, "global_step": 660632, "epoch": 7959} {"train_loss": -28.343704223632812, "global_step": 660633, "epoch": 7959} {"train_loss": -28.124509811401367, "global_step": 660634, "epoch": 7959} {"train_loss": -27.9355411529541, "global_step": 660635, "epoch": 7959} {"train_loss": -28.1097469329834, "global_step": 660636, "epoch": 7959} {"train_loss": -28.294418334960938, "global_step": 660637, "epoch": 7959} {"train_loss": -28.285409927368164, "global_step": 660638, "epoch": 7959} {"train_loss": -28.11466407775879, "global_step": 660639, "epoch": 7959} {"train_loss": -28.365528106689453, "global_step": 660640, "epoch": 7959} {"train_loss": -28.698383331298828, "global_step": 660641, "epoch": 7959} {"train_loss": -28.555234909057617, "global_step": 660642, "epoch": 7959} {"train_loss": -28.671112060546875, "global_step": 660643, "epoch": 7959} {"train_loss": -28.583227157592773, "global_step": 660644, "epoch": 7959} {"train_loss": -28.352893829345703, "global_step": 660645, "epoch": 7959} {"train_loss": -28.14164161682129, "global_step": 660646, "epoch": 7959} {"train_loss": -28.38058853149414, "global_step": 660647, "epoch": 7959} {"train_loss": -28.581775665283203, "global_step": 660648, "epoch": 7959} {"train_loss": -28.296316146850586, "global_step": 660649, "epoch": 7959} {"train_loss": -28.536865234375, "global_step": 660650, "epoch": 7959} {"train_loss": -28.64484977722168, "global_step": 660651, "epoch": 7959} {"train_loss": -28.441150665283203, "global_step": 660652, "epoch": 7959} {"train_loss": -28.735509872436523, "global_step": 660653, "epoch": 7959} {"train_loss": -28.578393936157227, "global_step": 660654, "epoch": 7959} {"train_loss": -28.81777000427246, "global_step": 660655, "epoch": 7959} {"train_loss": -28.928485870361328, "global_step": 660656, "epoch": 7959} {"train_loss": -28.295806884765625, "global_step": 660657, "epoch": 7959} {"train_loss": -28.421438217163086, "global_step": 660658, "epoch": 7959} {"train_loss": -28.42915153503418, "global_step": 660659, "epoch": 7959} {"train_loss": -28.786890029907227, "global_step": 660660, "epoch": 7959} {"train_loss": -28.5545654296875, "global_step": 660661, "epoch": 7959} {"train_loss": -28.452899932861328, "global_step": 660662, "epoch": 7959} {"train_loss": -28.355268478393555, "global_step": 660663, "epoch": 7959} {"train_loss": -28.545637130737305, "global_step": 660664, "epoch": 7959} {"train_loss": -28.424758911132812, "global_step": 660665, "epoch": 7959} {"train_loss": -28.69136619567871, "global_step": 660666, "epoch": 7959} {"train_loss": -28.42637062072754, "global_step": 660667, "epoch": 7959} {"train_loss": -28.45025062561035, "global_step": 660668, "epoch": 7959} {"train_loss": -28.418607711791992, "global_step": 660669, "epoch": 7959} {"train_loss": -28.24800682067871, "global_step": 660670, "epoch": 7959} {"train_loss": -28.674320220947266, "global_step": 660671, "epoch": 7959} {"train_loss": -28.678518295288086, "global_step": 660672, "epoch": 7959} {"train_loss": -27.964231491088867, "global_step": 660673, "epoch": 7959} {"train_loss": -28.18375587463379, "global_step": 660674, "epoch": 7959} {"train_loss": -28.50806999206543, "global_step": 660675, "epoch": 7959} {"train_loss": -28.353759765625, "global_step": 660676, "epoch": 7959} {"train_loss": -28.110177993774414, "global_step": 660677, "epoch": 7959} {"train_loss": -28.266645431518555, "global_step": 660678, "epoch": 7959} {"train_loss": -28.093386316873943, "global_step": 660679, "epoch": 7959, "val_loss": 6798930.0} {"train_loss": -28.209211349487305, "global_step": 660680, "epoch": 7960} {"train_loss": -27.921192169189453, "global_step": 660681, "epoch": 7960} {"train_loss": -28.03143310546875, "global_step": 660682, "epoch": 7960} {"train_loss": -28.466611862182617, "global_step": 660683, "epoch": 7960} {"train_loss": -27.846866607666016, "global_step": 660684, "epoch": 7960} {"train_loss": -28.2702693939209, "global_step": 660685, "epoch": 7960} {"train_loss": -28.5491886138916, "global_step": 660686, "epoch": 7960} {"train_loss": -27.973331451416016, "global_step": 660687, "epoch": 7960} {"train_loss": -27.746185302734375, "global_step": 660688, "epoch": 7960} {"train_loss": -28.45147705078125, "global_step": 660689, "epoch": 7960} {"train_loss": -28.007495880126953, "global_step": 660690, "epoch": 7960} {"train_loss": -28.295175552368164, "global_step": 660691, "epoch": 7960} {"train_loss": -28.505985260009766, "global_step": 660692, "epoch": 7960} {"train_loss": -28.03114128112793, "global_step": 660693, "epoch": 7960} {"train_loss": -28.26654624938965, "global_step": 660694, "epoch": 7960} {"train_loss": -28.608983993530273, "global_step": 660695, "epoch": 7960} {"train_loss": -28.380523681640625, "global_step": 660696, "epoch": 7960} {"train_loss": -28.5657958984375, "global_step": 660697, "epoch": 7960} {"train_loss": -28.42681312561035, "global_step": 660698, "epoch": 7960} {"train_loss": -28.487537384033203, "global_step": 660699, "epoch": 7960} {"train_loss": -28.16620445251465, "global_step": 660700, "epoch": 7960} {"train_loss": -28.490880966186523, "global_step": 660701, "epoch": 7960} {"train_loss": -28.735502243041992, "global_step": 660702, "epoch": 7960} {"train_loss": -28.428476333618164, "global_step": 660703, "epoch": 7960} {"train_loss": -28.44202995300293, "global_step": 660704, "epoch": 7960} {"train_loss": -28.63569450378418, "global_step": 660705, "epoch": 7960} {"train_loss": -28.442724227905273, "global_step": 660706, "epoch": 7960} {"train_loss": -28.739276885986328, "global_step": 660707, "epoch": 7960} {"train_loss": -28.555612564086914, "global_step": 660708, "epoch": 7960} {"train_loss": -28.713092803955078, "global_step": 660709, "epoch": 7960} {"train_loss": -28.458776473999023, "global_step": 660710, "epoch": 7960} {"train_loss": -28.641611099243164, "global_step": 660711, "epoch": 7960} {"train_loss": -28.8168888092041, "global_step": 660712, "epoch": 7960} {"train_loss": -28.60651206970215, "global_step": 660713, "epoch": 7960} {"train_loss": -28.38177490234375, "global_step": 660714, "epoch": 7960} {"train_loss": -28.314950942993164, "global_step": 660715, "epoch": 7960} {"train_loss": -28.5207576751709, "global_step": 660716, "epoch": 7960} {"train_loss": -28.764429092407227, "global_step": 660717, "epoch": 7960} {"train_loss": -28.349578857421875, "global_step": 660718, "epoch": 7960} {"train_loss": -28.187286376953125, "global_step": 660719, "epoch": 7960} {"train_loss": -28.32806396484375, "global_step": 660720, "epoch": 7960} {"train_loss": -28.587827682495117, "global_step": 660721, "epoch": 7960} {"train_loss": -28.578886032104492, "global_step": 660722, "epoch": 7960} {"train_loss": -28.465253829956055, "global_step": 660723, "epoch": 7960} {"train_loss": -28.39710807800293, "global_step": 660724, "epoch": 7960} {"train_loss": -28.16007423400879, "global_step": 660725, "epoch": 7960} {"train_loss": -28.794540405273438, "global_step": 660726, "epoch": 7960} {"train_loss": -28.845966339111328, "global_step": 660727, "epoch": 7960} {"train_loss": -28.291662216186523, "global_step": 660728, "epoch": 7960} {"train_loss": -28.573740005493164, "global_step": 660729, "epoch": 7960} {"train_loss": -28.563512802124023, "global_step": 660730, "epoch": 7960} {"train_loss": -28.3583927154541, "global_step": 660731, "epoch": 7960} {"train_loss": -28.631195068359375, "global_step": 660732, "epoch": 7960} {"train_loss": -28.824811935424805, "global_step": 660733, "epoch": 7960} {"train_loss": -28.167089462280273, "global_step": 660734, "epoch": 7960} {"train_loss": -28.899616241455078, "global_step": 660735, "epoch": 7960} {"train_loss": -28.28472328186035, "global_step": 660736, "epoch": 7960} {"train_loss": -27.896087646484375, "global_step": 660737, "epoch": 7960} {"train_loss": -28.406156539916992, "global_step": 660738, "epoch": 7960} {"train_loss": -28.1026611328125, "global_step": 660739, "epoch": 7960} {"train_loss": -28.238950729370117, "global_step": 660740, "epoch": 7960} {"train_loss": -28.234365463256836, "global_step": 660741, "epoch": 7960} {"train_loss": -28.082223892211914, "global_step": 660742, "epoch": 7960} {"train_loss": -28.45464515686035, "global_step": 660743, "epoch": 7960} {"train_loss": -28.5645751953125, "global_step": 660744, "epoch": 7960} {"train_loss": -28.671903610229492, "global_step": 660745, "epoch": 7960} {"train_loss": -28.487173080444336, "global_step": 660746, "epoch": 7960} {"train_loss": -28.187559127807617, "global_step": 660747, "epoch": 7960} {"train_loss": -28.023488998413086, "global_step": 660748, "epoch": 7960} {"train_loss": -28.539316177368164, "global_step": 660749, "epoch": 7960} {"train_loss": -28.412511825561523, "global_step": 660750, "epoch": 7960} {"train_loss": -28.929975509643555, "global_step": 660751, "epoch": 7960} {"train_loss": -28.260852813720703, "global_step": 660752, "epoch": 7960} {"train_loss": -28.716806411743164, "global_step": 660753, "epoch": 7960} {"train_loss": -28.55670738220215, "global_step": 660754, "epoch": 7960} {"train_loss": -28.300016403198242, "global_step": 660755, "epoch": 7960} {"train_loss": -28.3168888092041, "global_step": 660756, "epoch": 7960} {"train_loss": -28.598020553588867, "global_step": 660757, "epoch": 7960} {"train_loss": -28.344968795776367, "global_step": 660758, "epoch": 7960} {"train_loss": -28.34226417541504, "global_step": 660759, "epoch": 7960} {"train_loss": -28.625213623046875, "global_step": 660760, "epoch": 7960} {"train_loss": -28.63779640197754, "global_step": 660761, "epoch": 7960} {"train_loss": -28.42288325206343, "global_step": 660762, "epoch": 7960, "val_loss": 6815083.0} {"train_loss": -27.893075942993164, "global_step": 660763, "epoch": 7961} {"train_loss": -27.344974517822266, "global_step": 660764, "epoch": 7961} {"train_loss": -28.02682876586914, "global_step": 660765, "epoch": 7961} {"train_loss": -28.155460357666016, "global_step": 660766, "epoch": 7961} {"train_loss": -27.881256103515625, "global_step": 660767, "epoch": 7961} {"train_loss": -27.505508422851562, "global_step": 660768, "epoch": 7961} {"train_loss": -27.93610954284668, "global_step": 660769, "epoch": 7961} {"train_loss": -28.297021865844727, "global_step": 660770, "epoch": 7961} {"train_loss": -27.750757217407227, "global_step": 660771, "epoch": 7961} {"train_loss": -28.17140007019043, "global_step": 660772, "epoch": 7961} {"train_loss": -28.160831451416016, "global_step": 660773, "epoch": 7961} {"train_loss": -28.60028076171875, "global_step": 660774, "epoch": 7961} {"train_loss": -28.15192985534668, "global_step": 660775, "epoch": 7961} {"train_loss": -28.36432456970215, "global_step": 660776, "epoch": 7961} {"train_loss": -28.37872314453125, "global_step": 660777, "epoch": 7961} {"train_loss": -27.648618698120117, "global_step": 660778, "epoch": 7961} {"train_loss": -27.801374435424805, "global_step": 660779, "epoch": 7961} {"train_loss": -28.004114151000977, "global_step": 660780, "epoch": 7961} {"train_loss": -28.200910568237305, "global_step": 660781, "epoch": 7961} {"train_loss": -27.98211669921875, "global_step": 660782, "epoch": 7961} {"train_loss": -28.00229835510254, "global_step": 660783, "epoch": 7961} {"train_loss": -28.36354637145996, "global_step": 660784, "epoch": 7961} {"train_loss": -28.279775619506836, "global_step": 660785, "epoch": 7961} {"train_loss": -28.4793758392334, "global_step": 660786, "epoch": 7961} {"train_loss": -28.122602462768555, "global_step": 660787, "epoch": 7961} {"train_loss": -28.279993057250977, "global_step": 660788, "epoch": 7961} {"train_loss": -28.028427124023438, "global_step": 660789, "epoch": 7961} {"train_loss": -27.85169792175293, "global_step": 660790, "epoch": 7961} {"train_loss": -28.59098243713379, "global_step": 660791, "epoch": 7961} {"train_loss": -28.01198387145996, "global_step": 660792, "epoch": 7961} {"train_loss": -27.96539878845215, "global_step": 660793, "epoch": 7961} {"train_loss": -28.542821884155273, "global_step": 660794, "epoch": 7961} {"train_loss": -28.011188507080078, "global_step": 660795, "epoch": 7961} {"train_loss": -28.159223556518555, "global_step": 660796, "epoch": 7961} {"train_loss": -28.184192657470703, "global_step": 660797, "epoch": 7961} {"train_loss": -28.581653594970703, "global_step": 660798, "epoch": 7961} {"train_loss": -28.411832809448242, "global_step": 660799, "epoch": 7961} {"train_loss": -28.448511123657227, "global_step": 660800, "epoch": 7961} {"train_loss": -28.75165367126465, "global_step": 660801, "epoch": 7961} {"train_loss": -28.32002067565918, "global_step": 660802, "epoch": 7961} {"train_loss": -28.819854736328125, "global_step": 660803, "epoch": 7961} {"train_loss": -28.524887084960938, "global_step": 660804, "epoch": 7961} {"train_loss": -28.518583297729492, "global_step": 660805, "epoch": 7961} {"train_loss": -28.436132431030273, "global_step": 660806, "epoch": 7961} {"train_loss": -28.404815673828125, "global_step": 660807, "epoch": 7961} {"train_loss": -28.50758171081543, "global_step": 660808, "epoch": 7961} {"train_loss": -28.710615158081055, "global_step": 660809, "epoch": 7961} {"train_loss": -28.48859214782715, "global_step": 660810, "epoch": 7961} {"train_loss": -28.567930221557617, "global_step": 660811, "epoch": 7961} {"train_loss": -28.48959732055664, "global_step": 660812, "epoch": 7961} {"train_loss": -28.57061767578125, "global_step": 660813, "epoch": 7961} {"train_loss": -28.55982780456543, "global_step": 660814, "epoch": 7961} {"train_loss": -28.796289443969727, "global_step": 660815, "epoch": 7961} {"train_loss": -28.26907730102539, "global_step": 660816, "epoch": 7961} {"train_loss": -29.03951072692871, "global_step": 660817, "epoch": 7961} {"train_loss": -28.578765869140625, "global_step": 660818, "epoch": 7961} {"train_loss": -28.624486923217773, "global_step": 660819, "epoch": 7961} {"train_loss": -28.931751251220703, "global_step": 660820, "epoch": 7961} {"train_loss": -28.568723678588867, "global_step": 660821, "epoch": 7961} {"train_loss": -28.49127769470215, "global_step": 660822, "epoch": 7961} {"train_loss": -28.564411163330078, "global_step": 660823, "epoch": 7961} {"train_loss": -29.129180908203125, "global_step": 660824, "epoch": 7961} {"train_loss": -28.78008460998535, "global_step": 660825, "epoch": 7961} {"train_loss": -28.564117431640625, "global_step": 660826, "epoch": 7961} {"train_loss": -27.971948623657227, "global_step": 660827, "epoch": 7961} {"train_loss": -27.807382583618164, "global_step": 660828, "epoch": 7961} {"train_loss": -27.192996978759766, "global_step": 660829, "epoch": 7961} {"train_loss": -26.538843154907227, "global_step": 660830, "epoch": 7961} {"train_loss": -26.82754898071289, "global_step": 660831, "epoch": 7961} {"train_loss": -28.152990341186523, "global_step": 660832, "epoch": 7961} {"train_loss": -26.979419708251953, "global_step": 660833, "epoch": 7961} {"train_loss": -27.220483779907227, "global_step": 660834, "epoch": 7961} {"train_loss": -27.55732536315918, "global_step": 660835, "epoch": 7961} {"train_loss": -27.9648494720459, "global_step": 660836, "epoch": 7961} {"train_loss": -27.751434326171875, "global_step": 660837, "epoch": 7961} {"train_loss": -28.1080322265625, "global_step": 660838, "epoch": 7961} {"train_loss": -27.711591720581055, "global_step": 660839, "epoch": 7961} {"train_loss": -28.38787269592285, "global_step": 660840, "epoch": 7961} {"train_loss": -28.22627830505371, "global_step": 660841, "epoch": 7961} {"train_loss": -28.0533447265625, "global_step": 660842, "epoch": 7961} {"train_loss": -28.32464027404785, "global_step": 660843, "epoch": 7961} {"train_loss": -27.830535888671875, "global_step": 660844, "epoch": 7961} {"train_loss": -28.174464536000446, "global_step": 660845, "epoch": 7961, "val_loss": 6741494.0} {"train_loss": -27.670963287353516, "global_step": 660846, "epoch": 7962} {"train_loss": -27.60419273376465, "global_step": 660847, "epoch": 7962} {"train_loss": -27.647985458374023, "global_step": 660848, "epoch": 7962} {"train_loss": -26.956571578979492, "global_step": 660849, "epoch": 7962} {"train_loss": -27.6920108795166, "global_step": 660850, "epoch": 7962} {"train_loss": -27.556949615478516, "global_step": 660851, "epoch": 7962} {"train_loss": -27.82229995727539, "global_step": 660852, "epoch": 7962} {"train_loss": -27.0873966217041, "global_step": 660853, "epoch": 7962} {"train_loss": -27.8823184967041, "global_step": 660854, "epoch": 7962} {"train_loss": -27.749149322509766, "global_step": 660855, "epoch": 7962} {"train_loss": -27.715167999267578, "global_step": 660856, "epoch": 7962} {"train_loss": -27.877965927124023, "global_step": 660857, "epoch": 7962} {"train_loss": -27.756696701049805, "global_step": 660858, "epoch": 7962} {"train_loss": -27.75564956665039, "global_step": 660859, "epoch": 7962} {"train_loss": -27.760116577148438, "global_step": 660860, "epoch": 7962} {"train_loss": -27.759204864501953, "global_step": 660861, "epoch": 7962} {"train_loss": -27.86256980895996, "global_step": 660862, "epoch": 7962} {"train_loss": -28.114124298095703, "global_step": 660863, "epoch": 7962} {"train_loss": -27.763086318969727, "global_step": 660864, "epoch": 7962} {"train_loss": -27.826955795288086, "global_step": 660865, "epoch": 7962} {"train_loss": -27.825897216796875, "global_step": 660866, "epoch": 7962} {"train_loss": -28.303319931030273, "global_step": 660867, "epoch": 7962} {"train_loss": -27.7303409576416, "global_step": 660868, "epoch": 7962} {"train_loss": -28.179304122924805, "global_step": 660869, "epoch": 7962} {"train_loss": -28.231054306030273, "global_step": 660870, "epoch": 7962} {"train_loss": -28.20135498046875, "global_step": 660871, "epoch": 7962} {"train_loss": -28.4334716796875, "global_step": 660872, "epoch": 7962} {"train_loss": -28.20008659362793, "global_step": 660873, "epoch": 7962} {"train_loss": -27.940576553344727, "global_step": 660874, "epoch": 7962} {"train_loss": -28.073760986328125, "global_step": 660875, "epoch": 7962} {"train_loss": -28.377120971679688, "global_step": 660876, "epoch": 7962} {"train_loss": -27.98065757751465, "global_step": 660877, "epoch": 7962} {"train_loss": -28.017309188842773, "global_step": 660878, "epoch": 7962} {"train_loss": -28.368595123291016, "global_step": 660879, "epoch": 7962} {"train_loss": -28.2910099029541, "global_step": 660880, "epoch": 7962} {"train_loss": -28.337629318237305, "global_step": 660881, "epoch": 7962} {"train_loss": -28.075672149658203, "global_step": 660882, "epoch": 7962} {"train_loss": -28.218719482421875, "global_step": 660883, "epoch": 7962} {"train_loss": -28.421064376831055, "global_step": 660884, "epoch": 7962} {"train_loss": -28.3562068939209, "global_step": 660885, "epoch": 7962} {"train_loss": -28.11842155456543, "global_step": 660886, "epoch": 7962} {"train_loss": -28.446685791015625, "global_step": 660887, "epoch": 7962} {"train_loss": -28.445783615112305, "global_step": 660888, "epoch": 7962} {"train_loss": -28.494953155517578, "global_step": 660889, "epoch": 7962} {"train_loss": -28.479894638061523, "global_step": 660890, "epoch": 7962} {"train_loss": -28.440515518188477, "global_step": 660891, "epoch": 7962} {"train_loss": -28.89691162109375, "global_step": 660892, "epoch": 7962} {"train_loss": -28.38483238220215, "global_step": 660893, "epoch": 7962} {"train_loss": -28.69825553894043, "global_step": 660894, "epoch": 7962} {"train_loss": -28.73880386352539, "global_step": 660895, "epoch": 7962} {"train_loss": -28.610034942626953, "global_step": 660896, "epoch": 7962} {"train_loss": -28.320911407470703, "global_step": 660897, "epoch": 7962} {"train_loss": -28.6551570892334, "global_step": 660898, "epoch": 7962} {"train_loss": -28.31367301940918, "global_step": 660899, "epoch": 7962} {"train_loss": -28.82874870300293, "global_step": 660900, "epoch": 7962} {"train_loss": -28.46040916442871, "global_step": 660901, "epoch": 7962} {"train_loss": -28.58970069885254, "global_step": 660902, "epoch": 7962} {"train_loss": -28.560546875, "global_step": 660903, "epoch": 7962} {"train_loss": -28.361591339111328, "global_step": 660904, "epoch": 7962} {"train_loss": -28.695261001586914, "global_step": 660905, "epoch": 7962} {"train_loss": -28.3904972076416, "global_step": 660906, "epoch": 7962} {"train_loss": -28.5030574798584, "global_step": 660907, "epoch": 7962} {"train_loss": -28.947132110595703, "global_step": 660908, "epoch": 7962} {"train_loss": -28.323501586914062, "global_step": 660909, "epoch": 7962} {"train_loss": -28.8759765625, "global_step": 660910, "epoch": 7962} {"train_loss": -28.666479110717773, "global_step": 660911, "epoch": 7962} {"train_loss": -28.599836349487305, "global_step": 660912, "epoch": 7962} {"train_loss": -28.505414962768555, "global_step": 660913, "epoch": 7962} {"train_loss": -28.41861343383789, "global_step": 660914, "epoch": 7962} {"train_loss": -28.16230583190918, "global_step": 660915, "epoch": 7962} {"train_loss": -28.444700241088867, "global_step": 660916, "epoch": 7962} {"train_loss": -28.429941177368164, "global_step": 660917, "epoch": 7962} {"train_loss": -28.17999267578125, "global_step": 660918, "epoch": 7962} {"train_loss": -28.3026123046875, "global_step": 660919, "epoch": 7962} {"train_loss": -27.498260498046875, "global_step": 660920, "epoch": 7962} {"train_loss": -28.264968872070312, "global_step": 660921, "epoch": 7962} {"train_loss": -27.86384391784668, "global_step": 660922, "epoch": 7962} {"train_loss": -28.730884552001953, "global_step": 660923, "epoch": 7962} {"train_loss": -27.606611251831055, "global_step": 660924, "epoch": 7962} {"train_loss": -28.256139755249023, "global_step": 660925, "epoch": 7962} {"train_loss": -28.232070922851562, "global_step": 660926, "epoch": 7962} {"train_loss": -28.419315338134766, "global_step": 660927, "epoch": 7962} {"train_loss": -28.215857839009846, "global_step": 660928, "epoch": 7962, "val_loss": 6687180.0} {"train_loss": -26.798559188842773, "global_step": 660929, "epoch": 7963} {"train_loss": -27.046594619750977, "global_step": 660930, "epoch": 7963} {"train_loss": -26.855060577392578, "global_step": 660931, "epoch": 7963} {"train_loss": -28.171812057495117, "global_step": 660932, "epoch": 7963} {"train_loss": -27.22428321838379, "global_step": 660933, "epoch": 7963} {"train_loss": -27.56926918029785, "global_step": 660934, "epoch": 7963} {"train_loss": -27.145374298095703, "global_step": 660935, "epoch": 7963} {"train_loss": -28.097370147705078, "global_step": 660936, "epoch": 7963} {"train_loss": -27.88492774963379, "global_step": 660937, "epoch": 7963} {"train_loss": -27.685712814331055, "global_step": 660938, "epoch": 7963} {"train_loss": -27.917861938476562, "global_step": 660939, "epoch": 7963} {"train_loss": -27.696332931518555, "global_step": 660940, "epoch": 7963} {"train_loss": -27.639509201049805, "global_step": 660941, "epoch": 7963} {"train_loss": -28.0467529296875, "global_step": 660942, "epoch": 7963} {"train_loss": -27.75935173034668, "global_step": 660943, "epoch": 7963} {"train_loss": -27.93195915222168, "global_step": 660944, "epoch": 7963} {"train_loss": -28.23699378967285, "global_step": 660945, "epoch": 7963} {"train_loss": -28.30120849609375, "global_step": 660946, "epoch": 7963} {"train_loss": -27.751585006713867, "global_step": 660947, "epoch": 7963} {"train_loss": -27.6697940826416, "global_step": 660948, "epoch": 7963} {"train_loss": -28.02178955078125, "global_step": 660949, "epoch": 7963} {"train_loss": -28.129636764526367, "global_step": 660950, "epoch": 7963} {"train_loss": -27.97517967224121, "global_step": 660951, "epoch": 7963} {"train_loss": -27.67270851135254, "global_step": 660952, "epoch": 7963} {"train_loss": -28.355566024780273, "global_step": 660953, "epoch": 7963} {"train_loss": -28.13291358947754, "global_step": 660954, "epoch": 7963} {"train_loss": -28.3137264251709, "global_step": 660955, "epoch": 7963} {"train_loss": -28.36543083190918, "global_step": 660956, "epoch": 7963} {"train_loss": -28.408491134643555, "global_step": 660957, "epoch": 7963} {"train_loss": -28.386987686157227, "global_step": 660958, "epoch": 7963} {"train_loss": -28.959436416625977, "global_step": 660959, "epoch": 7963} {"train_loss": -28.802160263061523, "global_step": 660960, "epoch": 7963} {"train_loss": -28.663726806640625, "global_step": 660961, "epoch": 7963} {"train_loss": -28.08270263671875, "global_step": 660962, "epoch": 7963} {"train_loss": -28.582727432250977, "global_step": 660963, "epoch": 7963} {"train_loss": -28.47504234313965, "global_step": 660964, "epoch": 7963} {"train_loss": -28.441160202026367, "global_step": 660965, "epoch": 7963} {"train_loss": -28.6920166015625, "global_step": 660966, "epoch": 7963} {"train_loss": -28.559865951538086, "global_step": 660967, "epoch": 7963} {"train_loss": -28.340993881225586, "global_step": 660968, "epoch": 7963} {"train_loss": -28.349573135375977, "global_step": 660969, "epoch": 7963} {"train_loss": -28.6728515625, "global_step": 660970, "epoch": 7963} {"train_loss": -28.561010360717773, "global_step": 660971, "epoch": 7963} {"train_loss": -28.350311279296875, "global_step": 660972, "epoch": 7963} {"train_loss": -28.29766845703125, "global_step": 660973, "epoch": 7963} {"train_loss": -28.38114356994629, "global_step": 660974, "epoch": 7963} {"train_loss": -28.481592178344727, "global_step": 660975, "epoch": 7963} {"train_loss": -28.684741973876953, "global_step": 660976, "epoch": 7963} {"train_loss": -28.555097579956055, "global_step": 660977, "epoch": 7963} {"train_loss": -28.749759674072266, "global_step": 660978, "epoch": 7963} {"train_loss": -28.35603141784668, "global_step": 660979, "epoch": 7963} {"train_loss": -28.60919189453125, "global_step": 660980, "epoch": 7963} {"train_loss": -28.682031631469727, "global_step": 660981, "epoch": 7963} {"train_loss": -28.682458877563477, "global_step": 660982, "epoch": 7963} {"train_loss": -28.89503288269043, "global_step": 660983, "epoch": 7963} {"train_loss": -28.51837730407715, "global_step": 660984, "epoch": 7963} {"train_loss": -28.937108993530273, "global_step": 660985, "epoch": 7963} {"train_loss": -28.779682159423828, "global_step": 660986, "epoch": 7963} {"train_loss": -28.34662437438965, "global_step": 660987, "epoch": 7963} {"train_loss": -28.43916893005371, "global_step": 660988, "epoch": 7963} {"train_loss": -28.799854278564453, "global_step": 660989, "epoch": 7963} {"train_loss": -28.426361083984375, "global_step": 660990, "epoch": 7963} {"train_loss": -28.616727828979492, "global_step": 660991, "epoch": 7963} {"train_loss": -28.499074935913086, "global_step": 660992, "epoch": 7963} {"train_loss": -28.788217544555664, "global_step": 660993, "epoch": 7963} {"train_loss": -28.75436782836914, "global_step": 660994, "epoch": 7963} {"train_loss": -28.70181655883789, "global_step": 660995, "epoch": 7963} {"train_loss": -28.492765426635742, "global_step": 660996, "epoch": 7963} {"train_loss": -28.66514015197754, "global_step": 660997, "epoch": 7963} {"train_loss": -28.46222496032715, "global_step": 660998, "epoch": 7963} {"train_loss": -28.59822654724121, "global_step": 660999, "epoch": 7963} {"train_loss": -28.811960220336914, "global_step": 661000, "epoch": 7963} {"train_loss": -28.521991729736328, "global_step": 661001, "epoch": 7963} {"train_loss": -28.483417510986328, "global_step": 661002, "epoch": 7963} {"train_loss": -28.83926773071289, "global_step": 661003, "epoch": 7963} {"train_loss": -27.997406005859375, "global_step": 661004, "epoch": 7963} {"train_loss": -28.439258575439453, "global_step": 661005, "epoch": 7963} {"train_loss": -27.86524772644043, "global_step": 661006, "epoch": 7963} {"train_loss": -27.170087814331055, "global_step": 661007, "epoch": 7963} {"train_loss": -23.87233543395996, "global_step": 661008, "epoch": 7963} {"train_loss": -22.206722259521484, "global_step": 661009, "epoch": 7963} {"train_loss": -26.6971435546875, "global_step": 661010, "epoch": 7963} {"train_loss": -28.09680731899767, "global_step": 661011, "epoch": 7963, "val_loss": 6596395.0} {"train_loss": -20.065488815307617, "global_step": 661012, "epoch": 7964} {"train_loss": -23.496543884277344, "global_step": 661013, "epoch": 7964} {"train_loss": -24.027151107788086, "global_step": 661014, "epoch": 7964} {"train_loss": -22.781734466552734, "global_step": 661015, "epoch": 7964} {"train_loss": -25.04041862487793, "global_step": 661016, "epoch": 7964} {"train_loss": -24.57754898071289, "global_step": 661017, "epoch": 7964} {"train_loss": -24.494237899780273, "global_step": 661018, "epoch": 7964} {"train_loss": -25.0294132232666, "global_step": 661019, "epoch": 7964} {"train_loss": -25.772695541381836, "global_step": 661020, "epoch": 7964} {"train_loss": -25.844892501831055, "global_step": 661021, "epoch": 7964} {"train_loss": -25.43621253967285, "global_step": 661022, "epoch": 7964} {"train_loss": -25.642484664916992, "global_step": 661023, "epoch": 7964} {"train_loss": -26.093067169189453, "global_step": 661024, "epoch": 7964} {"train_loss": -25.893630981445312, "global_step": 661025, "epoch": 7964} {"train_loss": -26.021270751953125, "global_step": 661026, "epoch": 7964} {"train_loss": -26.006811141967773, "global_step": 661027, "epoch": 7964} {"train_loss": -26.47825050354004, "global_step": 661028, "epoch": 7964} {"train_loss": -26.047500610351562, "global_step": 661029, "epoch": 7964} {"train_loss": -26.559106826782227, "global_step": 661030, "epoch": 7964} {"train_loss": -26.6843204498291, "global_step": 661031, "epoch": 7964} {"train_loss": -26.528186798095703, "global_step": 661032, "epoch": 7964} {"train_loss": -26.6463623046875, "global_step": 661033, "epoch": 7964} {"train_loss": -26.54329490661621, "global_step": 661034, "epoch": 7964} {"train_loss": -26.383792877197266, "global_step": 661035, "epoch": 7964} {"train_loss": -26.805561065673828, "global_step": 661036, "epoch": 7964} {"train_loss": -27.01787757873535, "global_step": 661037, "epoch": 7964} {"train_loss": -26.540607452392578, "global_step": 661038, "epoch": 7964} {"train_loss": -26.648420333862305, "global_step": 661039, "epoch": 7964} {"train_loss": -27.09650993347168, "global_step": 661040, "epoch": 7964} {"train_loss": -27.10987663269043, "global_step": 661041, "epoch": 7964} {"train_loss": -27.066211700439453, "global_step": 661042, "epoch": 7964} {"train_loss": -27.246545791625977, "global_step": 661043, "epoch": 7964} {"train_loss": -27.1442813873291, "global_step": 661044, "epoch": 7964} {"train_loss": -26.908170700073242, "global_step": 661045, "epoch": 7964} {"train_loss": -27.197040557861328, "global_step": 661046, "epoch": 7964} {"train_loss": -27.278329849243164, "global_step": 661047, "epoch": 7964} {"train_loss": -27.392114639282227, "global_step": 661048, "epoch": 7964} {"train_loss": -27.319854736328125, "global_step": 661049, "epoch": 7964} {"train_loss": -27.268545150756836, "global_step": 661050, "epoch": 7964} {"train_loss": -27.01167106628418, "global_step": 661051, "epoch": 7964} {"train_loss": -27.45839500427246, "global_step": 661052, "epoch": 7964} {"train_loss": -27.642078399658203, "global_step": 661053, "epoch": 7964} {"train_loss": -27.819910049438477, "global_step": 661054, "epoch": 7964} {"train_loss": -27.533750534057617, "global_step": 661055, "epoch": 7964} {"train_loss": -27.749591827392578, "global_step": 661056, "epoch": 7964} {"train_loss": -27.313129425048828, "global_step": 661057, "epoch": 7964} {"train_loss": -27.7255916595459, "global_step": 661058, "epoch": 7964} {"train_loss": -27.38203239440918, "global_step": 661059, "epoch": 7964} {"train_loss": -27.870824813842773, "global_step": 661060, "epoch": 7964} {"train_loss": -28.08588218688965, "global_step": 661061, "epoch": 7964} {"train_loss": -27.95343017578125, "global_step": 661062, "epoch": 7964} {"train_loss": -27.87981605529785, "global_step": 661063, "epoch": 7964} {"train_loss": -27.635543823242188, "global_step": 661064, "epoch": 7964} {"train_loss": -27.74664878845215, "global_step": 661065, "epoch": 7964} {"train_loss": -27.906558990478516, "global_step": 661066, "epoch": 7964} {"train_loss": -27.786457061767578, "global_step": 661067, "epoch": 7964} {"train_loss": -27.943761825561523, "global_step": 661068, "epoch": 7964} {"train_loss": -27.7945499420166, "global_step": 661069, "epoch": 7964} {"train_loss": -28.219099044799805, "global_step": 661070, "epoch": 7964} {"train_loss": -28.078107833862305, "global_step": 661071, "epoch": 7964} {"train_loss": -28.14996337890625, "global_step": 661072, "epoch": 7964} {"train_loss": -28.3522891998291, "global_step": 661073, "epoch": 7964} {"train_loss": -28.321496963500977, "global_step": 661074, "epoch": 7964} {"train_loss": -28.132604598999023, "global_step": 661075, "epoch": 7964} {"train_loss": -28.22772789001465, "global_step": 661076, "epoch": 7964} {"train_loss": -28.287139892578125, "global_step": 661077, "epoch": 7964} {"train_loss": -27.68403434753418, "global_step": 661078, "epoch": 7964} {"train_loss": -28.305622100830078, "global_step": 661079, "epoch": 7964} {"train_loss": -28.332849502563477, "global_step": 661080, "epoch": 7964} {"train_loss": -28.3717041015625, "global_step": 661081, "epoch": 7964} {"train_loss": -28.484724044799805, "global_step": 661082, "epoch": 7964} {"train_loss": -28.06170082092285, "global_step": 661083, "epoch": 7964} {"train_loss": -28.442182540893555, "global_step": 661084, "epoch": 7964} {"train_loss": -28.548093795776367, "global_step": 661085, "epoch": 7964} {"train_loss": -28.436071395874023, "global_step": 661086, "epoch": 7964} {"train_loss": -28.60883140563965, "global_step": 661087, "epoch": 7964} {"train_loss": -28.190170288085938, "global_step": 661088, "epoch": 7964} {"train_loss": -27.981842041015625, "global_step": 661089, "epoch": 7964} {"train_loss": -28.06473159790039, "global_step": 661090, "epoch": 7964} {"train_loss": -28.373340606689453, "global_step": 661091, "epoch": 7964} {"train_loss": -28.085851669311523, "global_step": 661092, "epoch": 7964} {"train_loss": -28.171262741088867, "global_step": 661093, "epoch": 7964} {"train_loss": -27.05816524000053, "global_step": 661094, "epoch": 7964, "val_loss": 6700367.0} {"train_loss": -27.677396774291992, "global_step": 661095, "epoch": 7965} {"train_loss": -28.012908935546875, "global_step": 661096, "epoch": 7965} {"train_loss": -27.94000816345215, "global_step": 661097, "epoch": 7965} {"train_loss": -28.459918975830078, "global_step": 661098, "epoch": 7965} {"train_loss": -27.00616455078125, "global_step": 661099, "epoch": 7965} {"train_loss": -28.050512313842773, "global_step": 661100, "epoch": 7965} {"train_loss": -27.578317642211914, "global_step": 661101, "epoch": 7965} {"train_loss": -27.922534942626953, "global_step": 661102, "epoch": 7965} {"train_loss": -27.744176864624023, "global_step": 661103, "epoch": 7965} {"train_loss": -27.69034767150879, "global_step": 661104, "epoch": 7965} {"train_loss": -28.14165687561035, "global_step": 661105, "epoch": 7965} {"train_loss": -27.58970069885254, "global_step": 661106, "epoch": 7965} {"train_loss": -28.013158798217773, "global_step": 661107, "epoch": 7965} {"train_loss": -27.69781494140625, "global_step": 661108, "epoch": 7965} {"train_loss": -28.132343292236328, "global_step": 661109, "epoch": 7965} {"train_loss": -27.524587631225586, "global_step": 661110, "epoch": 7965} {"train_loss": -28.12446403503418, "global_step": 661111, "epoch": 7965} {"train_loss": -28.179336547851562, "global_step": 661112, "epoch": 7965} {"train_loss": -28.047876358032227, "global_step": 661113, "epoch": 7965} {"train_loss": -28.119165420532227, "global_step": 661114, "epoch": 7965} {"train_loss": -28.091211318969727, "global_step": 661115, "epoch": 7965} {"train_loss": -28.1843318939209, "global_step": 661116, "epoch": 7965} {"train_loss": -28.453046798706055, "global_step": 661117, "epoch": 7965} {"train_loss": -28.059467315673828, "global_step": 661118, "epoch": 7965} {"train_loss": -27.86353874206543, "global_step": 661119, "epoch": 7965} {"train_loss": -28.104711532592773, "global_step": 661120, "epoch": 7965} {"train_loss": -28.098661422729492, "global_step": 661121, "epoch": 7965} {"train_loss": -27.973011016845703, "global_step": 661122, "epoch": 7965} {"train_loss": -28.37544059753418, "global_step": 661123, "epoch": 7965} {"train_loss": -28.300357818603516, "global_step": 661124, "epoch": 7965} {"train_loss": -28.015716552734375, "global_step": 661125, "epoch": 7965} {"train_loss": -28.049274444580078, "global_step": 661126, "epoch": 7965} {"train_loss": -28.0134220123291, "global_step": 661127, "epoch": 7965} {"train_loss": -28.066913604736328, "global_step": 661128, "epoch": 7965} {"train_loss": -27.799823760986328, "global_step": 661129, "epoch": 7965} {"train_loss": -28.212011337280273, "global_step": 661130, "epoch": 7965} {"train_loss": -28.189435958862305, "global_step": 661131, "epoch": 7965} {"train_loss": -28.18790054321289, "global_step": 661132, "epoch": 7965} {"train_loss": -28.09348487854004, "global_step": 661133, "epoch": 7965} {"train_loss": -28.188690185546875, "global_step": 661134, "epoch": 7965} {"train_loss": -28.324934005737305, "global_step": 661135, "epoch": 7965} {"train_loss": -27.83038330078125, "global_step": 661136, "epoch": 7965} {"train_loss": -28.3513240814209, "global_step": 661137, "epoch": 7965} {"train_loss": -28.438922882080078, "global_step": 661138, "epoch": 7965} {"train_loss": -28.00227165222168, "global_step": 661139, "epoch": 7965} {"train_loss": -28.442007064819336, "global_step": 661140, "epoch": 7965} {"train_loss": -28.42377281188965, "global_step": 661141, "epoch": 7965} {"train_loss": -27.947797775268555, "global_step": 661142, "epoch": 7965} {"train_loss": -28.183195114135742, "global_step": 661143, "epoch": 7965} {"train_loss": -28.271656036376953, "global_step": 661144, "epoch": 7965} {"train_loss": -28.037525177001953, "global_step": 661145, "epoch": 7965} {"train_loss": -28.17828369140625, "global_step": 661146, "epoch": 7965} {"train_loss": -28.38698387145996, "global_step": 661147, "epoch": 7965} {"train_loss": -28.360769271850586, "global_step": 661148, "epoch": 7965} {"train_loss": -28.424413681030273, "global_step": 661149, "epoch": 7965} {"train_loss": -28.309833526611328, "global_step": 661150, "epoch": 7965} {"train_loss": -28.378339767456055, "global_step": 661151, "epoch": 7965} {"train_loss": -28.500314712524414, "global_step": 661152, "epoch": 7965} {"train_loss": -28.547109603881836, "global_step": 661153, "epoch": 7965} {"train_loss": -28.6664981842041, "global_step": 661154, "epoch": 7965} {"train_loss": -28.428308486938477, "global_step": 661155, "epoch": 7965} {"train_loss": -28.748310089111328, "global_step": 661156, "epoch": 7965} {"train_loss": -28.405242919921875, "global_step": 661157, "epoch": 7965} {"train_loss": -28.504043579101562, "global_step": 661158, "epoch": 7965} {"train_loss": -28.0762939453125, "global_step": 661159, "epoch": 7965} {"train_loss": -28.636917114257812, "global_step": 661160, "epoch": 7965} {"train_loss": -28.4964656829834, "global_step": 661161, "epoch": 7965} {"train_loss": -28.4906005859375, "global_step": 661162, "epoch": 7965} {"train_loss": -28.68863296508789, "global_step": 661163, "epoch": 7965} {"train_loss": -28.32233238220215, "global_step": 661164, "epoch": 7965} {"train_loss": -28.510120391845703, "global_step": 661165, "epoch": 7965} {"train_loss": -28.793161392211914, "global_step": 661166, "epoch": 7965} {"train_loss": -28.30022621154785, "global_step": 661167, "epoch": 7965} {"train_loss": -28.896759033203125, "global_step": 661168, "epoch": 7965} {"train_loss": -28.796655654907227, "global_step": 661169, "epoch": 7965} {"train_loss": -28.788375854492188, "global_step": 661170, "epoch": 7965} {"train_loss": -28.69258689880371, "global_step": 661171, "epoch": 7965} {"train_loss": -28.8093204498291, "global_step": 661172, "epoch": 7965} {"train_loss": -28.663782119750977, "global_step": 661173, "epoch": 7965} {"train_loss": -28.600311279296875, "global_step": 661174, "epoch": 7965} {"train_loss": -28.671310424804688, "global_step": 661175, "epoch": 7965} {"train_loss": -28.583282470703125, "global_step": 661176, "epoch": 7965} {"train_loss": -28.248681217791088, "global_step": 661177, "epoch": 7965, "val_loss": 6636437.0} {"train_loss": -28.15828514099121, "global_step": 661178, "epoch": 7966} {"train_loss": -27.759857177734375, "global_step": 661179, "epoch": 7966} {"train_loss": -26.642786026000977, "global_step": 661180, "epoch": 7966} {"train_loss": -26.231689453125, "global_step": 661181, "epoch": 7966} {"train_loss": -27.378021240234375, "global_step": 661182, "epoch": 7966} {"train_loss": -27.709333419799805, "global_step": 661183, "epoch": 7966} {"train_loss": -27.17835807800293, "global_step": 661184, "epoch": 7966} {"train_loss": -27.268390655517578, "global_step": 661185, "epoch": 7966} {"train_loss": -27.764617919921875, "global_step": 661186, "epoch": 7966} {"train_loss": -27.42974281311035, "global_step": 661187, "epoch": 7966} {"train_loss": -27.70098876953125, "global_step": 661188, "epoch": 7966} {"train_loss": -28.132688522338867, "global_step": 661189, "epoch": 7966} {"train_loss": -27.8670597076416, "global_step": 661190, "epoch": 7966} {"train_loss": -28.0971736907959, "global_step": 661191, "epoch": 7966} {"train_loss": -28.10637855529785, "global_step": 661192, "epoch": 7966} {"train_loss": -28.051294326782227, "global_step": 661193, "epoch": 7966} {"train_loss": -28.172016143798828, "global_step": 661194, "epoch": 7966} {"train_loss": -27.821857452392578, "global_step": 661195, "epoch": 7966} {"train_loss": -28.262231826782227, "global_step": 661196, "epoch": 7966} {"train_loss": -28.017969131469727, "global_step": 661197, "epoch": 7966} {"train_loss": -28.5308895111084, "global_step": 661198, "epoch": 7966} {"train_loss": -28.44257926940918, "global_step": 661199, "epoch": 7966} {"train_loss": -28.49825096130371, "global_step": 661200, "epoch": 7966} {"train_loss": -28.24274253845215, "global_step": 661201, "epoch": 7966} {"train_loss": -28.210590362548828, "global_step": 661202, "epoch": 7966} {"train_loss": -28.350141525268555, "global_step": 661203, "epoch": 7966} {"train_loss": -28.389745712280273, "global_step": 661204, "epoch": 7966} {"train_loss": -28.495899200439453, "global_step": 661205, "epoch": 7966} {"train_loss": -28.239730834960938, "global_step": 661206, "epoch": 7966} {"train_loss": -28.257888793945312, "global_step": 661207, "epoch": 7966} {"train_loss": -28.541534423828125, "global_step": 661208, "epoch": 7966} {"train_loss": -28.32606315612793, "global_step": 661209, "epoch": 7966} {"train_loss": -28.483057022094727, "global_step": 661210, "epoch": 7966} {"train_loss": -28.332189559936523, "global_step": 661211, "epoch": 7966} {"train_loss": -28.42011833190918, "global_step": 661212, "epoch": 7966} {"train_loss": -28.673770904541016, "global_step": 661213, "epoch": 7966} {"train_loss": -28.62603759765625, "global_step": 661214, "epoch": 7966} {"train_loss": -28.45612907409668, "global_step": 661215, "epoch": 7966} {"train_loss": -28.530658721923828, "global_step": 661216, "epoch": 7966} {"train_loss": -28.45331382751465, "global_step": 661217, "epoch": 7966} {"train_loss": -28.355854034423828, "global_step": 661218, "epoch": 7966} {"train_loss": -28.178497314453125, "global_step": 661219, "epoch": 7966} {"train_loss": -28.482879638671875, "global_step": 661220, "epoch": 7966} {"train_loss": -28.5438232421875, "global_step": 661221, "epoch": 7966} {"train_loss": -28.61310386657715, "global_step": 661222, "epoch": 7966} {"train_loss": -28.601041793823242, "global_step": 661223, "epoch": 7966} {"train_loss": -28.79444694519043, "global_step": 661224, "epoch": 7966} {"train_loss": -28.11136817932129, "global_step": 661225, "epoch": 7966} {"train_loss": -28.508609771728516, "global_step": 661226, "epoch": 7966} {"train_loss": -28.116708755493164, "global_step": 661227, "epoch": 7966} {"train_loss": -28.60271644592285, "global_step": 661228, "epoch": 7966} {"train_loss": -28.725860595703125, "global_step": 661229, "epoch": 7966} {"train_loss": -28.4531192779541, "global_step": 661230, "epoch": 7966} {"train_loss": -28.465173721313477, "global_step": 661231, "epoch": 7966} {"train_loss": -28.530176162719727, "global_step": 661232, "epoch": 7966} {"train_loss": -28.222946166992188, "global_step": 661233, "epoch": 7966} {"train_loss": -28.702640533447266, "global_step": 661234, "epoch": 7966} {"train_loss": -28.694257736206055, "global_step": 661235, "epoch": 7966} {"train_loss": -28.325376510620117, "global_step": 661236, "epoch": 7966} {"train_loss": -28.59051513671875, "global_step": 661237, "epoch": 7966} {"train_loss": -28.39655113220215, "global_step": 661238, "epoch": 7966} {"train_loss": -28.29645347595215, "global_step": 661239, "epoch": 7966} {"train_loss": -28.310449600219727, "global_step": 661240, "epoch": 7966} {"train_loss": -28.608118057250977, "global_step": 661241, "epoch": 7966} {"train_loss": -28.48846435546875, "global_step": 661242, "epoch": 7966} {"train_loss": -28.350683212280273, "global_step": 661243, "epoch": 7966} {"train_loss": -28.269819259643555, "global_step": 661244, "epoch": 7966} {"train_loss": -28.328125, "global_step": 661245, "epoch": 7966} {"train_loss": -28.267047882080078, "global_step": 661246, "epoch": 7966} {"train_loss": -28.346765518188477, "global_step": 661247, "epoch": 7966} {"train_loss": -27.868616104125977, "global_step": 661248, "epoch": 7966} {"train_loss": -27.870420455932617, "global_step": 661249, "epoch": 7966} {"train_loss": -28.24614906311035, "global_step": 661250, "epoch": 7966} {"train_loss": -28.207029342651367, "global_step": 661251, "epoch": 7966} {"train_loss": -28.108633041381836, "global_step": 661252, "epoch": 7966} {"train_loss": -28.070226669311523, "global_step": 661253, "epoch": 7966} {"train_loss": -27.86941909790039, "global_step": 661254, "epoch": 7966} {"train_loss": -28.343692779541016, "global_step": 661255, "epoch": 7966} {"train_loss": -27.8626651763916, "global_step": 661256, "epoch": 7966} {"train_loss": -28.112653732299805, "global_step": 661257, "epoch": 7966} {"train_loss": -28.37957191467285, "global_step": 661258, "epoch": 7966} {"train_loss": -29.00129508972168, "global_step": 661259, "epoch": 7966} {"train_loss": -28.196504845676653, "global_step": 661260, "epoch": 7966, "val_loss": 6683420.5} {"train_loss": -27.56673240661621, "global_step": 661261, "epoch": 7967} {"train_loss": -26.96381187438965, "global_step": 661262, "epoch": 7967} {"train_loss": -27.465662002563477, "global_step": 661263, "epoch": 7967} {"train_loss": -27.927839279174805, "global_step": 661264, "epoch": 7967} {"train_loss": -27.909442901611328, "global_step": 661265, "epoch": 7967} {"train_loss": -27.844812393188477, "global_step": 661266, "epoch": 7967} {"train_loss": -27.68158531188965, "global_step": 661267, "epoch": 7967} {"train_loss": -27.913175582885742, "global_step": 661268, "epoch": 7967} {"train_loss": -27.958606719970703, "global_step": 661269, "epoch": 7967} {"train_loss": -28.008874893188477, "global_step": 661270, "epoch": 7967} {"train_loss": -27.241846084594727, "global_step": 661271, "epoch": 7967} {"train_loss": -27.673187255859375, "global_step": 661272, "epoch": 7967} {"train_loss": -27.585737228393555, "global_step": 661273, "epoch": 7967} {"train_loss": -28.085412979125977, "global_step": 661274, "epoch": 7967} {"train_loss": -27.979673385620117, "global_step": 661275, "epoch": 7967} {"train_loss": -28.106021881103516, "global_step": 661276, "epoch": 7967} {"train_loss": -27.918567657470703, "global_step": 661277, "epoch": 7967} {"train_loss": -27.99734878540039, "global_step": 661278, "epoch": 7967} {"train_loss": -27.906604766845703, "global_step": 661279, "epoch": 7967} {"train_loss": -27.660236358642578, "global_step": 661280, "epoch": 7967} {"train_loss": -28.204004287719727, "global_step": 661281, "epoch": 7967} {"train_loss": -28.459863662719727, "global_step": 661282, "epoch": 7967} {"train_loss": -28.082508087158203, "global_step": 661283, "epoch": 7967} {"train_loss": -28.160552978515625, "global_step": 661284, "epoch": 7967} {"train_loss": -27.712387084960938, "global_step": 661285, "epoch": 7967} {"train_loss": -28.247913360595703, "global_step": 661286, "epoch": 7967} {"train_loss": -28.228179931640625, "global_step": 661287, "epoch": 7967} {"train_loss": -27.888702392578125, "global_step": 661288, "epoch": 7967} {"train_loss": -27.99258804321289, "global_step": 661289, "epoch": 7967} {"train_loss": -28.26079750061035, "global_step": 661290, "epoch": 7967} {"train_loss": -28.54446792602539, "global_step": 661291, "epoch": 7967} {"train_loss": -28.064743041992188, "global_step": 661292, "epoch": 7967} {"train_loss": -28.000919342041016, "global_step": 661293, "epoch": 7967} {"train_loss": -28.102375030517578, "global_step": 661294, "epoch": 7967} {"train_loss": -28.50807762145996, "global_step": 661295, "epoch": 7967} {"train_loss": -27.8494873046875, "global_step": 661296, "epoch": 7967} {"train_loss": -28.143768310546875, "global_step": 661297, "epoch": 7967} {"train_loss": -28.25819969177246, "global_step": 661298, "epoch": 7967} {"train_loss": -28.025806427001953, "global_step": 661299, "epoch": 7967} {"train_loss": -28.391498565673828, "global_step": 661300, "epoch": 7967} {"train_loss": -28.35383415222168, "global_step": 661301, "epoch": 7967} {"train_loss": -28.677804946899414, "global_step": 661302, "epoch": 7967} {"train_loss": -28.270666122436523, "global_step": 661303, "epoch": 7967} {"train_loss": -28.535062789916992, "global_step": 661304, "epoch": 7967} {"train_loss": -28.687170028686523, "global_step": 661305, "epoch": 7967} {"train_loss": -28.07831382751465, "global_step": 661306, "epoch": 7967} {"train_loss": -28.591663360595703, "global_step": 661307, "epoch": 7967} {"train_loss": -28.549413681030273, "global_step": 661308, "epoch": 7967} {"train_loss": -28.666656494140625, "global_step": 661309, "epoch": 7967} {"train_loss": -28.40273094177246, "global_step": 661310, "epoch": 7967} {"train_loss": -28.634784698486328, "global_step": 661311, "epoch": 7967} {"train_loss": -28.18840980529785, "global_step": 661312, "epoch": 7967} {"train_loss": -28.66657066345215, "global_step": 661313, "epoch": 7967} {"train_loss": -28.515594482421875, "global_step": 661314, "epoch": 7967} {"train_loss": -28.695398330688477, "global_step": 661315, "epoch": 7967} {"train_loss": -28.758655548095703, "global_step": 661316, "epoch": 7967} {"train_loss": -28.724044799804688, "global_step": 661317, "epoch": 7967} {"train_loss": -28.398080825805664, "global_step": 661318, "epoch": 7967} {"train_loss": -28.746566772460938, "global_step": 661319, "epoch": 7967} {"train_loss": -28.712671279907227, "global_step": 661320, "epoch": 7967} {"train_loss": -28.8696346282959, "global_step": 661321, "epoch": 7967} {"train_loss": -28.909509658813477, "global_step": 661322, "epoch": 7967} {"train_loss": -28.799224853515625, "global_step": 661323, "epoch": 7967} {"train_loss": -28.82607078552246, "global_step": 661324, "epoch": 7967} {"train_loss": -28.707782745361328, "global_step": 661325, "epoch": 7967} {"train_loss": -28.6494197845459, "global_step": 661326, "epoch": 7967} {"train_loss": -28.3305721282959, "global_step": 661327, "epoch": 7967} {"train_loss": -28.73011589050293, "global_step": 661328, "epoch": 7967} {"train_loss": -28.902881622314453, "global_step": 661329, "epoch": 7967} {"train_loss": -28.392242431640625, "global_step": 661330, "epoch": 7967} {"train_loss": -28.48565673828125, "global_step": 661331, "epoch": 7967} {"train_loss": -28.57916831970215, "global_step": 661332, "epoch": 7967} {"train_loss": -28.64275550842285, "global_step": 661333, "epoch": 7967} {"train_loss": -28.6341552734375, "global_step": 661334, "epoch": 7967} {"train_loss": -28.191091537475586, "global_step": 661335, "epoch": 7967} {"train_loss": -27.210737228393555, "global_step": 661336, "epoch": 7967} {"train_loss": -27.609039306640625, "global_step": 661337, "epoch": 7967} {"train_loss": -26.57574462890625, "global_step": 661338, "epoch": 7967} {"train_loss": -25.913318634033203, "global_step": 661339, "epoch": 7967} {"train_loss": -27.01850700378418, "global_step": 661340, "epoch": 7967} {"train_loss": -27.741193771362305, "global_step": 661341, "epoch": 7967} {"train_loss": -27.960102081298828, "global_step": 661342, "epoch": 7967} {"train_loss": -28.1514961288636, "global_step": 661343, "epoch": 7967, "val_loss": 6738877.0} {"train_loss": -26.502094268798828, "global_step": 661344, "epoch": 7968} {"train_loss": -26.18928337097168, "global_step": 661345, "epoch": 7968} {"train_loss": -27.006628036499023, "global_step": 661346, "epoch": 7968} {"train_loss": -25.650598526000977, "global_step": 661347, "epoch": 7968} {"train_loss": -27.249221801757812, "global_step": 661348, "epoch": 7968} {"train_loss": -26.44435691833496, "global_step": 661349, "epoch": 7968} {"train_loss": -26.8521785736084, "global_step": 661350, "epoch": 7968} {"train_loss": -26.734333038330078, "global_step": 661351, "epoch": 7968} {"train_loss": -26.757160186767578, "global_step": 661352, "epoch": 7968} {"train_loss": -27.008289337158203, "global_step": 661353, "epoch": 7968} {"train_loss": -26.869094848632812, "global_step": 661354, "epoch": 7968} {"train_loss": -27.611234664916992, "global_step": 661355, "epoch": 7968} {"train_loss": -27.157079696655273, "global_step": 661356, "epoch": 7968} {"train_loss": -27.247161865234375, "global_step": 661357, "epoch": 7968} {"train_loss": -27.420507431030273, "global_step": 661358, "epoch": 7968} {"train_loss": -27.344762802124023, "global_step": 661359, "epoch": 7968} {"train_loss": -27.4174747467041, "global_step": 661360, "epoch": 7968} {"train_loss": -27.0714111328125, "global_step": 661361, "epoch": 7968} {"train_loss": -27.75421714782715, "global_step": 661362, "epoch": 7968} {"train_loss": -27.298206329345703, "global_step": 661363, "epoch": 7968} {"train_loss": -27.617156982421875, "global_step": 661364, "epoch": 7968} {"train_loss": -27.48919677734375, "global_step": 661365, "epoch": 7968} {"train_loss": -28.112329483032227, "global_step": 661366, "epoch": 7968} {"train_loss": -27.96612548828125, "global_step": 661367, "epoch": 7968} {"train_loss": -27.9577693939209, "global_step": 661368, "epoch": 7968} {"train_loss": -27.49167823791504, "global_step": 661369, "epoch": 7968} {"train_loss": -28.21217155456543, "global_step": 661370, "epoch": 7968} {"train_loss": -28.156116485595703, "global_step": 661371, "epoch": 7968} {"train_loss": -28.026498794555664, "global_step": 661372, "epoch": 7968} {"train_loss": -27.522871017456055, "global_step": 661373, "epoch": 7968} {"train_loss": -28.019184112548828, "global_step": 661374, "epoch": 7968} {"train_loss": -28.419509887695312, "global_step": 661375, "epoch": 7968} {"train_loss": -28.42133903503418, "global_step": 661376, "epoch": 7968} {"train_loss": -28.059213638305664, "global_step": 661377, "epoch": 7968} {"train_loss": -28.209020614624023, "global_step": 661378, "epoch": 7968} {"train_loss": -28.192901611328125, "global_step": 661379, "epoch": 7968} {"train_loss": -28.18146324157715, "global_step": 661380, "epoch": 7968} {"train_loss": -28.12506103515625, "global_step": 661381, "epoch": 7968} {"train_loss": -28.539899826049805, "global_step": 661382, "epoch": 7968} {"train_loss": -28.507226943969727, "global_step": 661383, "epoch": 7968} {"train_loss": -28.437931060791016, "global_step": 661384, "epoch": 7968} {"train_loss": -28.44904899597168, "global_step": 661385, "epoch": 7968} {"train_loss": -28.282194137573242, "global_step": 661386, "epoch": 7968} {"train_loss": -28.51993179321289, "global_step": 661387, "epoch": 7968} {"train_loss": -28.313032150268555, "global_step": 661388, "epoch": 7968} {"train_loss": -28.689741134643555, "global_step": 661389, "epoch": 7968} {"train_loss": -28.380598068237305, "global_step": 661390, "epoch": 7968} {"train_loss": -28.38636589050293, "global_step": 661391, "epoch": 7968} {"train_loss": -28.383962631225586, "global_step": 661392, "epoch": 7968} {"train_loss": -28.567291259765625, "global_step": 661393, "epoch": 7968} {"train_loss": -28.464757919311523, "global_step": 661394, "epoch": 7968} {"train_loss": -28.497589111328125, "global_step": 661395, "epoch": 7968} {"train_loss": -28.291976928710938, "global_step": 661396, "epoch": 7968} {"train_loss": -28.530975341796875, "global_step": 661397, "epoch": 7968} {"train_loss": -28.37270164489746, "global_step": 661398, "epoch": 7968} {"train_loss": -28.5809383392334, "global_step": 661399, "epoch": 7968} {"train_loss": -28.511367797851562, "global_step": 661400, "epoch": 7968} {"train_loss": -28.10556411743164, "global_step": 661401, "epoch": 7968} {"train_loss": -28.538684844970703, "global_step": 661402, "epoch": 7968} {"train_loss": -28.816089630126953, "global_step": 661403, "epoch": 7968} {"train_loss": -28.201324462890625, "global_step": 661404, "epoch": 7968} {"train_loss": -28.4081974029541, "global_step": 661405, "epoch": 7968} {"train_loss": -28.368000030517578, "global_step": 661406, "epoch": 7968} {"train_loss": -28.53987693786621, "global_step": 661407, "epoch": 7968} {"train_loss": -28.322202682495117, "global_step": 661408, "epoch": 7968} {"train_loss": -28.385162353515625, "global_step": 661409, "epoch": 7968} {"train_loss": -28.241851806640625, "global_step": 661410, "epoch": 7968} {"train_loss": -28.592187881469727, "global_step": 661411, "epoch": 7968} {"train_loss": -28.56243324279785, "global_step": 661412, "epoch": 7968} {"train_loss": -28.528467178344727, "global_step": 661413, "epoch": 7968} {"train_loss": -28.64569091796875, "global_step": 661414, "epoch": 7968} {"train_loss": -28.356321334838867, "global_step": 661415, "epoch": 7968} {"train_loss": -28.383588790893555, "global_step": 661416, "epoch": 7968} {"train_loss": -28.04451560974121, "global_step": 661417, "epoch": 7968} {"train_loss": -28.37074089050293, "global_step": 661418, "epoch": 7968} {"train_loss": -28.11724281311035, "global_step": 661419, "epoch": 7968} {"train_loss": -28.571430206298828, "global_step": 661420, "epoch": 7968} {"train_loss": -28.55860710144043, "global_step": 661421, "epoch": 7968} {"train_loss": -28.28558349609375, "global_step": 661422, "epoch": 7968} {"train_loss": -28.41342544555664, "global_step": 661423, "epoch": 7968} {"train_loss": -28.268701553344727, "global_step": 661424, "epoch": 7968} {"train_loss": -28.822805404663086, "global_step": 661425, "epoch": 7968} {"train_loss": -27.994127917002483, "global_step": 661426, "epoch": 7968, "val_loss": 6716823.0} {"train_loss": -28.52775001525879, "global_step": 661427, "epoch": 7969} {"train_loss": -28.118579864501953, "global_step": 661428, "epoch": 7969} {"train_loss": -28.28067970275879, "global_step": 661429, "epoch": 7969} {"train_loss": -28.343488693237305, "global_step": 661430, "epoch": 7969} {"train_loss": -28.749235153198242, "global_step": 661431, "epoch": 7969} {"train_loss": -28.2862491607666, "global_step": 661432, "epoch": 7969} {"train_loss": -28.3789119720459, "global_step": 661433, "epoch": 7969} {"train_loss": -28.502553939819336, "global_step": 661434, "epoch": 7969} {"train_loss": -28.239866256713867, "global_step": 661435, "epoch": 7969} {"train_loss": -28.445215225219727, "global_step": 661436, "epoch": 7969} {"train_loss": -28.147695541381836, "global_step": 661437, "epoch": 7969} {"train_loss": -28.551294326782227, "global_step": 661438, "epoch": 7969} {"train_loss": -28.70045280456543, "global_step": 661439, "epoch": 7969} {"train_loss": -28.572885513305664, "global_step": 661440, "epoch": 7969} {"train_loss": -28.54640007019043, "global_step": 661441, "epoch": 7969} {"train_loss": -28.0447940826416, "global_step": 661442, "epoch": 7969} {"train_loss": -28.385587692260742, "global_step": 661443, "epoch": 7969} {"train_loss": -28.409570693969727, "global_step": 661444, "epoch": 7969} {"train_loss": -28.628564834594727, "global_step": 661445, "epoch": 7969} {"train_loss": -28.802221298217773, "global_step": 661446, "epoch": 7969} {"train_loss": -28.467132568359375, "global_step": 661447, "epoch": 7969} {"train_loss": -28.54522705078125, "global_step": 661448, "epoch": 7969} {"train_loss": -28.338367462158203, "global_step": 661449, "epoch": 7969} {"train_loss": -28.239410400390625, "global_step": 661450, "epoch": 7969} {"train_loss": -28.907577514648438, "global_step": 661451, "epoch": 7969} {"train_loss": -28.141202926635742, "global_step": 661452, "epoch": 7969} {"train_loss": -28.60194969177246, "global_step": 661453, "epoch": 7969} {"train_loss": -28.437475204467773, "global_step": 661454, "epoch": 7969} {"train_loss": -28.501195907592773, "global_step": 661455, "epoch": 7969} {"train_loss": -28.06797218322754, "global_step": 661456, "epoch": 7969} {"train_loss": -28.439428329467773, "global_step": 661457, "epoch": 7969} {"train_loss": -28.463972091674805, "global_step": 661458, "epoch": 7969} {"train_loss": -28.71923828125, "global_step": 661459, "epoch": 7969} {"train_loss": -28.460285186767578, "global_step": 661460, "epoch": 7969} {"train_loss": -28.490467071533203, "global_step": 661461, "epoch": 7969} {"train_loss": -28.392942428588867, "global_step": 661462, "epoch": 7969} {"train_loss": -28.534564971923828, "global_step": 661463, "epoch": 7969} {"train_loss": -28.402929306030273, "global_step": 661464, "epoch": 7969} {"train_loss": -28.560251235961914, "global_step": 661465, "epoch": 7969} {"train_loss": -28.51922607421875, "global_step": 661466, "epoch": 7969} {"train_loss": -28.643381118774414, "global_step": 661467, "epoch": 7969} {"train_loss": -28.41656494140625, "global_step": 661468, "epoch": 7969} {"train_loss": -28.569904327392578, "global_step": 661469, "epoch": 7969} {"train_loss": -28.347248077392578, "global_step": 661470, "epoch": 7969} {"train_loss": -28.469837188720703, "global_step": 661471, "epoch": 7969} {"train_loss": -28.378782272338867, "global_step": 661472, "epoch": 7969} {"train_loss": -28.4837646484375, "global_step": 661473, "epoch": 7969} {"train_loss": -28.44612693786621, "global_step": 661474, "epoch": 7969} {"train_loss": -28.63325309753418, "global_step": 661475, "epoch": 7969} {"train_loss": -28.49212646484375, "global_step": 661476, "epoch": 7969} {"train_loss": -28.118698120117188, "global_step": 661477, "epoch": 7969} {"train_loss": -28.047780990600586, "global_step": 661478, "epoch": 7969} {"train_loss": -28.248319625854492, "global_step": 661479, "epoch": 7969} {"train_loss": -28.411365509033203, "global_step": 661480, "epoch": 7969} {"train_loss": -28.21185302734375, "global_step": 661481, "epoch": 7969} {"train_loss": -28.455875396728516, "global_step": 661482, "epoch": 7969} {"train_loss": -27.94280433654785, "global_step": 661483, "epoch": 7969} {"train_loss": -28.44428062438965, "global_step": 661484, "epoch": 7969} {"train_loss": -28.19489097595215, "global_step": 661485, "epoch": 7969} {"train_loss": -28.35223388671875, "global_step": 661486, "epoch": 7969} {"train_loss": -28.606809616088867, "global_step": 661487, "epoch": 7969} {"train_loss": -28.083526611328125, "global_step": 661488, "epoch": 7969} {"train_loss": -28.12995719909668, "global_step": 661489, "epoch": 7969} {"train_loss": -28.62771987915039, "global_step": 661490, "epoch": 7969} {"train_loss": -28.339269638061523, "global_step": 661491, "epoch": 7969} {"train_loss": -28.288904190063477, "global_step": 661492, "epoch": 7969} {"train_loss": -28.30963134765625, "global_step": 661493, "epoch": 7969} {"train_loss": -28.553150177001953, "global_step": 661494, "epoch": 7969} {"train_loss": -28.5223445892334, "global_step": 661495, "epoch": 7969} {"train_loss": -28.484806060791016, "global_step": 661496, "epoch": 7969} {"train_loss": -28.41330337524414, "global_step": 661497, "epoch": 7969} {"train_loss": -28.2371768951416, "global_step": 661498, "epoch": 7969} {"train_loss": -28.58279800415039, "global_step": 661499, "epoch": 7969} {"train_loss": -28.29258155822754, "global_step": 661500, "epoch": 7969} {"train_loss": -28.305463790893555, "global_step": 661501, "epoch": 7969} {"train_loss": -28.50846290588379, "global_step": 661502, "epoch": 7969} {"train_loss": -28.613697052001953, "global_step": 661503, "epoch": 7969} {"train_loss": -28.26096534729004, "global_step": 661504, "epoch": 7969} {"train_loss": -28.2192440032959, "global_step": 661505, "epoch": 7969} {"train_loss": -28.263818740844727, "global_step": 661506, "epoch": 7969} {"train_loss": -28.525094985961914, "global_step": 661507, "epoch": 7969} {"train_loss": -28.592031478881836, "global_step": 661508, "epoch": 7969} {"train_loss": -28.408169114446064, "global_step": 661509, "epoch": 7969, "val_loss": 6693606.5} {"train_loss": -27.77168083190918, "global_step": 661510, "epoch": 7970} {"train_loss": -27.915302276611328, "global_step": 661511, "epoch": 7970} {"train_loss": -27.988248825073242, "global_step": 661512, "epoch": 7970} {"train_loss": -28.123762130737305, "global_step": 661513, "epoch": 7970} {"train_loss": -28.020614624023438, "global_step": 661514, "epoch": 7970} {"train_loss": -28.201990127563477, "global_step": 661515, "epoch": 7970} {"train_loss": -28.103918075561523, "global_step": 661516, "epoch": 7970} {"train_loss": -28.27947425842285, "global_step": 661517, "epoch": 7970} {"train_loss": -28.231369018554688, "global_step": 661518, "epoch": 7970} {"train_loss": -27.986825942993164, "global_step": 661519, "epoch": 7970} {"train_loss": -28.09661293029785, "global_step": 661520, "epoch": 7970} {"train_loss": -28.44862174987793, "global_step": 661521, "epoch": 7970} {"train_loss": -28.375930786132812, "global_step": 661522, "epoch": 7970} {"train_loss": -28.246789932250977, "global_step": 661523, "epoch": 7970} {"train_loss": -28.030750274658203, "global_step": 661524, "epoch": 7970} {"train_loss": -28.335193634033203, "global_step": 661525, "epoch": 7970} {"train_loss": -28.043920516967773, "global_step": 661526, "epoch": 7970} {"train_loss": -28.467864990234375, "global_step": 661527, "epoch": 7970} {"train_loss": -28.2459774017334, "global_step": 661528, "epoch": 7970} {"train_loss": -28.55097770690918, "global_step": 661529, "epoch": 7970} {"train_loss": -28.363651275634766, "global_step": 661530, "epoch": 7970} {"train_loss": -28.2587833404541, "global_step": 661531, "epoch": 7970} {"train_loss": -28.357772827148438, "global_step": 661532, "epoch": 7970} {"train_loss": -28.172163009643555, "global_step": 661533, "epoch": 7970} {"train_loss": -28.486112594604492, "global_step": 661534, "epoch": 7970} {"train_loss": -28.620925903320312, "global_step": 661535, "epoch": 7970} {"train_loss": -28.363935470581055, "global_step": 661536, "epoch": 7970} {"train_loss": -28.31623649597168, "global_step": 661537, "epoch": 7970} {"train_loss": -28.4895076751709, "global_step": 661538, "epoch": 7970} {"train_loss": -28.8571720123291, "global_step": 661539, "epoch": 7970} {"train_loss": -28.59539794921875, "global_step": 661540, "epoch": 7970} {"train_loss": -28.800119400024414, "global_step": 661541, "epoch": 7970} {"train_loss": -28.52316665649414, "global_step": 661542, "epoch": 7970} {"train_loss": -28.72319984436035, "global_step": 661543, "epoch": 7970} {"train_loss": -28.69643211364746, "global_step": 661544, "epoch": 7970} {"train_loss": -28.654666900634766, "global_step": 661545, "epoch": 7970} {"train_loss": -28.591711044311523, "global_step": 661546, "epoch": 7970} {"train_loss": -28.55710220336914, "global_step": 661547, "epoch": 7970} {"train_loss": -28.54823112487793, "global_step": 661548, "epoch": 7970} {"train_loss": -28.783740997314453, "global_step": 661549, "epoch": 7970} {"train_loss": -28.65216636657715, "global_step": 661550, "epoch": 7970} {"train_loss": -28.951828002929688, "global_step": 661551, "epoch": 7970} {"train_loss": -28.983564376831055, "global_step": 661552, "epoch": 7970} {"train_loss": -28.656972885131836, "global_step": 661553, "epoch": 7970} {"train_loss": -28.316516876220703, "global_step": 661554, "epoch": 7970} {"train_loss": -28.5902156829834, "global_step": 661555, "epoch": 7970} {"train_loss": -28.562955856323242, "global_step": 661556, "epoch": 7970} {"train_loss": -28.367919921875, "global_step": 661557, "epoch": 7970} {"train_loss": -28.78236198425293, "global_step": 661558, "epoch": 7970} {"train_loss": -28.543806076049805, "global_step": 661559, "epoch": 7970} {"train_loss": -28.286376953125, "global_step": 661560, "epoch": 7970} {"train_loss": -28.549362182617188, "global_step": 661561, "epoch": 7970} {"train_loss": -28.666051864624023, "global_step": 661562, "epoch": 7970} {"train_loss": -28.179712295532227, "global_step": 661563, "epoch": 7970} {"train_loss": -28.330570220947266, "global_step": 661564, "epoch": 7970} {"train_loss": -28.28046989440918, "global_step": 661565, "epoch": 7970} {"train_loss": -28.496875762939453, "global_step": 661566, "epoch": 7970} {"train_loss": -28.522571563720703, "global_step": 661567, "epoch": 7970} {"train_loss": -28.528717041015625, "global_step": 661568, "epoch": 7970} {"train_loss": -28.36842918395996, "global_step": 661569, "epoch": 7970} {"train_loss": -28.55609130859375, "global_step": 661570, "epoch": 7970} {"train_loss": -28.2601375579834, "global_step": 661571, "epoch": 7970} {"train_loss": -28.223291397094727, "global_step": 661572, "epoch": 7970} {"train_loss": -28.01947593688965, "global_step": 661573, "epoch": 7970} {"train_loss": -28.208776473999023, "global_step": 661574, "epoch": 7970} {"train_loss": -28.386280059814453, "global_step": 661575, "epoch": 7970} {"train_loss": -28.385412216186523, "global_step": 661576, "epoch": 7970} {"train_loss": -28.142505645751953, "global_step": 661577, "epoch": 7970} {"train_loss": -27.562162399291992, "global_step": 661578, "epoch": 7970} {"train_loss": -27.48541831970215, "global_step": 661579, "epoch": 7970} {"train_loss": -27.932403564453125, "global_step": 661580, "epoch": 7970} {"train_loss": -28.21622085571289, "global_step": 661581, "epoch": 7970} {"train_loss": -28.196619033813477, "global_step": 661582, "epoch": 7970} {"train_loss": -28.22653579711914, "global_step": 661583, "epoch": 7970} {"train_loss": -28.631567001342773, "global_step": 661584, "epoch": 7970} {"train_loss": -27.94486427307129, "global_step": 661585, "epoch": 7970} {"train_loss": -28.187368392944336, "global_step": 661586, "epoch": 7970} {"train_loss": -28.49016761779785, "global_step": 661587, "epoch": 7970} {"train_loss": -28.685373306274414, "global_step": 661588, "epoch": 7970} {"train_loss": -28.577457427978516, "global_step": 661589, "epoch": 7970} {"train_loss": -28.09644889831543, "global_step": 661590, "epoch": 7970} {"train_loss": -28.47913932800293, "global_step": 661591, "epoch": 7970} {"train_loss": -28.367389058492268, "global_step": 661592, "epoch": 7970, "val_loss": 6700905.0} {"train_loss": -27.999042510986328, "global_step": 661593, "epoch": 7971} {"train_loss": -28.035171508789062, "global_step": 661594, "epoch": 7971} {"train_loss": -28.00603675842285, "global_step": 661595, "epoch": 7971} {"train_loss": -28.062702178955078, "global_step": 661596, "epoch": 7971} {"train_loss": -27.735584259033203, "global_step": 661597, "epoch": 7971} {"train_loss": -27.956945419311523, "global_step": 661598, "epoch": 7971} {"train_loss": -27.902408599853516, "global_step": 661599, "epoch": 7971} {"train_loss": -28.076568603515625, "global_step": 661600, "epoch": 7971} {"train_loss": -27.87421989440918, "global_step": 661601, "epoch": 7971} {"train_loss": -27.968658447265625, "global_step": 661602, "epoch": 7971} {"train_loss": -27.874120712280273, "global_step": 661603, "epoch": 7971} {"train_loss": -28.437524795532227, "global_step": 661604, "epoch": 7971} {"train_loss": -28.34614372253418, "global_step": 661605, "epoch": 7971} {"train_loss": -27.885608673095703, "global_step": 661606, "epoch": 7971} {"train_loss": -28.257715225219727, "global_step": 661607, "epoch": 7971} {"train_loss": -28.15386962890625, "global_step": 661608, "epoch": 7971} {"train_loss": -27.683563232421875, "global_step": 661609, "epoch": 7971} {"train_loss": -27.854795455932617, "global_step": 661610, "epoch": 7971} {"train_loss": -28.21107292175293, "global_step": 661611, "epoch": 7971} {"train_loss": -28.290613174438477, "global_step": 661612, "epoch": 7971} {"train_loss": -28.394763946533203, "global_step": 661613, "epoch": 7971} {"train_loss": -28.239850997924805, "global_step": 661614, "epoch": 7971} {"train_loss": -28.55502700805664, "global_step": 661615, "epoch": 7971} {"train_loss": -28.47161865234375, "global_step": 661616, "epoch": 7971} {"train_loss": -28.285337448120117, "global_step": 661617, "epoch": 7971} {"train_loss": -28.41082191467285, "global_step": 661618, "epoch": 7971} {"train_loss": -28.41305923461914, "global_step": 661619, "epoch": 7971} {"train_loss": -28.47242546081543, "global_step": 661620, "epoch": 7971} {"train_loss": -28.444623947143555, "global_step": 661621, "epoch": 7971} {"train_loss": -28.16497802734375, "global_step": 661622, "epoch": 7971} {"train_loss": -28.1591796875, "global_step": 661623, "epoch": 7971} {"train_loss": -28.376134872436523, "global_step": 661624, "epoch": 7971} {"train_loss": -28.544574737548828, "global_step": 661625, "epoch": 7971} {"train_loss": -28.709409713745117, "global_step": 661626, "epoch": 7971} {"train_loss": -28.551233291625977, "global_step": 661627, "epoch": 7971} {"train_loss": -28.573413848876953, "global_step": 661628, "epoch": 7971} {"train_loss": -28.168781280517578, "global_step": 661629, "epoch": 7971} {"train_loss": -28.732559204101562, "global_step": 661630, "epoch": 7971} {"train_loss": -28.484403610229492, "global_step": 661631, "epoch": 7971} {"train_loss": -28.528278350830078, "global_step": 661632, "epoch": 7971} {"train_loss": -28.6961669921875, "global_step": 661633, "epoch": 7971} {"train_loss": -28.723819732666016, "global_step": 661634, "epoch": 7971} {"train_loss": -28.51923179626465, "global_step": 661635, "epoch": 7971} {"train_loss": -28.607303619384766, "global_step": 661636, "epoch": 7971} {"train_loss": -28.331562042236328, "global_step": 661637, "epoch": 7971} {"train_loss": -28.423810958862305, "global_step": 661638, "epoch": 7971} {"train_loss": -28.78922462463379, "global_step": 661639, "epoch": 7971} {"train_loss": -28.537824630737305, "global_step": 661640, "epoch": 7971} {"train_loss": -28.78523063659668, "global_step": 661641, "epoch": 7971} {"train_loss": -28.83359718322754, "global_step": 661642, "epoch": 7971} {"train_loss": -28.961994171142578, "global_step": 661643, "epoch": 7971} {"train_loss": -28.611204147338867, "global_step": 661644, "epoch": 7971} {"train_loss": -28.31878089904785, "global_step": 661645, "epoch": 7971} {"train_loss": -28.5350399017334, "global_step": 661646, "epoch": 7971} {"train_loss": -28.60597038269043, "global_step": 661647, "epoch": 7971} {"train_loss": -28.707014083862305, "global_step": 661648, "epoch": 7971} {"train_loss": -28.666812896728516, "global_step": 661649, "epoch": 7971} {"train_loss": -28.747739791870117, "global_step": 661650, "epoch": 7971} {"train_loss": -28.3875732421875, "global_step": 661651, "epoch": 7971} {"train_loss": -28.634668350219727, "global_step": 661652, "epoch": 7971} {"train_loss": -28.474409103393555, "global_step": 661653, "epoch": 7971} {"train_loss": -28.283557891845703, "global_step": 661654, "epoch": 7971} {"train_loss": -28.583337783813477, "global_step": 661655, "epoch": 7971} {"train_loss": -28.212427139282227, "global_step": 661656, "epoch": 7971} {"train_loss": -28.383777618408203, "global_step": 661657, "epoch": 7971} {"train_loss": -28.643747329711914, "global_step": 661658, "epoch": 7971} {"train_loss": -28.219594955444336, "global_step": 661659, "epoch": 7971} {"train_loss": -28.231800079345703, "global_step": 661660, "epoch": 7971} {"train_loss": -27.601755142211914, "global_step": 661661, "epoch": 7971} {"train_loss": -27.69248390197754, "global_step": 661662, "epoch": 7971} {"train_loss": -27.119110107421875, "global_step": 661663, "epoch": 7971} {"train_loss": -26.85589027404785, "global_step": 661664, "epoch": 7971} {"train_loss": -28.029041290283203, "global_step": 661665, "epoch": 7971} {"train_loss": -28.000629425048828, "global_step": 661666, "epoch": 7971} {"train_loss": -27.308700561523438, "global_step": 661667, "epoch": 7971} {"train_loss": -27.522602081298828, "global_step": 661668, "epoch": 7971} {"train_loss": -27.17511558532715, "global_step": 661669, "epoch": 7971} {"train_loss": -27.14179039001465, "global_step": 661670, "epoch": 7971} {"train_loss": -27.428802490234375, "global_step": 661671, "epoch": 7971} {"train_loss": -27.186643600463867, "global_step": 661672, "epoch": 7971} {"train_loss": -27.838632583618164, "global_step": 661673, "epoch": 7971} {"train_loss": -27.478742599487305, "global_step": 661674, "epoch": 7971} {"train_loss": -28.213575799781157, "global_step": 661675, "epoch": 7971, "val_loss": 6622738.0} {"train_loss": -27.020429611206055, "global_step": 661676, "epoch": 7972} {"train_loss": -27.857452392578125, "global_step": 661677, "epoch": 7972} {"train_loss": -27.645660400390625, "global_step": 661678, "epoch": 7972} {"train_loss": -27.662891387939453, "global_step": 661679, "epoch": 7972} {"train_loss": -27.493453979492188, "global_step": 661680, "epoch": 7972} {"train_loss": -27.355554580688477, "global_step": 661681, "epoch": 7972} {"train_loss": -27.95562744140625, "global_step": 661682, "epoch": 7972} {"train_loss": -28.08111572265625, "global_step": 661683, "epoch": 7972} {"train_loss": -27.962574005126953, "global_step": 661684, "epoch": 7972} {"train_loss": -28.149871826171875, "global_step": 661685, "epoch": 7972} {"train_loss": -27.937183380126953, "global_step": 661686, "epoch": 7972} {"train_loss": -28.17997169494629, "global_step": 661687, "epoch": 7972} {"train_loss": -27.66518211364746, "global_step": 661688, "epoch": 7972} {"train_loss": -27.828779220581055, "global_step": 661689, "epoch": 7972} {"train_loss": -27.898590087890625, "global_step": 661690, "epoch": 7972} {"train_loss": -27.89759635925293, "global_step": 661691, "epoch": 7972} {"train_loss": -27.924646377563477, "global_step": 661692, "epoch": 7972} {"train_loss": -27.817941665649414, "global_step": 661693, "epoch": 7972} {"train_loss": -27.72370719909668, "global_step": 661694, "epoch": 7972} {"train_loss": -27.867895126342773, "global_step": 661695, "epoch": 7972} {"train_loss": -28.494617462158203, "global_step": 661696, "epoch": 7972} {"train_loss": -28.0579833984375, "global_step": 661697, "epoch": 7972} {"train_loss": -28.376062393188477, "global_step": 661698, "epoch": 7972} {"train_loss": -28.66546058654785, "global_step": 661699, "epoch": 7972} {"train_loss": -28.08333396911621, "global_step": 661700, "epoch": 7972} {"train_loss": -28.19941520690918, "global_step": 661701, "epoch": 7972} {"train_loss": -28.321033477783203, "global_step": 661702, "epoch": 7972} {"train_loss": -28.71270751953125, "global_step": 661703, "epoch": 7972} {"train_loss": -28.25969886779785, "global_step": 661704, "epoch": 7972} {"train_loss": -28.46003532409668, "global_step": 661705, "epoch": 7972} {"train_loss": -28.447851181030273, "global_step": 661706, "epoch": 7972} {"train_loss": -28.028228759765625, "global_step": 661707, "epoch": 7972} {"train_loss": -28.359283447265625, "global_step": 661708, "epoch": 7972} {"train_loss": -28.296131134033203, "global_step": 661709, "epoch": 7972} {"train_loss": -28.381942749023438, "global_step": 661710, "epoch": 7972} {"train_loss": -28.613285064697266, "global_step": 661711, "epoch": 7972} {"train_loss": -28.552337646484375, "global_step": 661712, "epoch": 7972} {"train_loss": -28.422754287719727, "global_step": 661713, "epoch": 7972} {"train_loss": -28.61274528503418, "global_step": 661714, "epoch": 7972} {"train_loss": -28.5261287689209, "global_step": 661715, "epoch": 7972} {"train_loss": -28.443378448486328, "global_step": 661716, "epoch": 7972} {"train_loss": -28.620336532592773, "global_step": 661717, "epoch": 7972} {"train_loss": -28.290502548217773, "global_step": 661718, "epoch": 7972} {"train_loss": -28.549726486206055, "global_step": 661719, "epoch": 7972} {"train_loss": -28.677602767944336, "global_step": 661720, "epoch": 7972} {"train_loss": -28.433551788330078, "global_step": 661721, "epoch": 7972} {"train_loss": -28.59185791015625, "global_step": 661722, "epoch": 7972} {"train_loss": -28.245519638061523, "global_step": 661723, "epoch": 7972} {"train_loss": -28.2922420501709, "global_step": 661724, "epoch": 7972} {"train_loss": -28.892847061157227, "global_step": 661725, "epoch": 7972} {"train_loss": -28.788442611694336, "global_step": 661726, "epoch": 7972} {"train_loss": -28.355335235595703, "global_step": 661727, "epoch": 7972} {"train_loss": -28.588363647460938, "global_step": 661728, "epoch": 7972} {"train_loss": -28.494001388549805, "global_step": 661729, "epoch": 7972} {"train_loss": -28.431875228881836, "global_step": 661730, "epoch": 7972} {"train_loss": -28.612268447875977, "global_step": 661731, "epoch": 7972} {"train_loss": -28.601917266845703, "global_step": 661732, "epoch": 7972} {"train_loss": -28.636030197143555, "global_step": 661733, "epoch": 7972} {"train_loss": -28.58307456970215, "global_step": 661734, "epoch": 7972} {"train_loss": -28.81259536743164, "global_step": 661735, "epoch": 7972} {"train_loss": -28.511112213134766, "global_step": 661736, "epoch": 7972} {"train_loss": -28.369709014892578, "global_step": 661737, "epoch": 7972} {"train_loss": -28.61610221862793, "global_step": 661738, "epoch": 7972} {"train_loss": -28.598255157470703, "global_step": 661739, "epoch": 7972} {"train_loss": -28.47528076171875, "global_step": 661740, "epoch": 7972} {"train_loss": -28.5166015625, "global_step": 661741, "epoch": 7972} {"train_loss": -28.4821834564209, "global_step": 661742, "epoch": 7972} {"train_loss": -28.338037490844727, "global_step": 661743, "epoch": 7972} {"train_loss": -28.00923728942871, "global_step": 661744, "epoch": 7972} {"train_loss": -27.876300811767578, "global_step": 661745, "epoch": 7972} {"train_loss": -28.046890258789062, "global_step": 661746, "epoch": 7972} {"train_loss": -27.640213012695312, "global_step": 661747, "epoch": 7972} {"train_loss": -27.725168228149414, "global_step": 661748, "epoch": 7972} {"train_loss": -27.421279907226562, "global_step": 661749, "epoch": 7972} {"train_loss": -28.176029205322266, "global_step": 661750, "epoch": 7972} {"train_loss": -28.19413185119629, "global_step": 661751, "epoch": 7972} {"train_loss": -28.0556697845459, "global_step": 661752, "epoch": 7972} {"train_loss": -28.078779220581055, "global_step": 661753, "epoch": 7972} {"train_loss": -28.0782527923584, "global_step": 661754, "epoch": 7972} {"train_loss": -28.219430923461914, "global_step": 661755, "epoch": 7972} {"train_loss": -28.53793716430664, "global_step": 661756, "epoch": 7972} {"train_loss": -28.19382667541504, "global_step": 661757, "epoch": 7972} {"train_loss": -28.24209831421634, "global_step": 661758, "epoch": 7972, "val_loss": 6714908.0} {"train_loss": -27.773778915405273, "global_step": 661759, "epoch": 7973} {"train_loss": -27.618640899658203, "global_step": 661760, "epoch": 7973} {"train_loss": -27.976911544799805, "global_step": 661761, "epoch": 7973} {"train_loss": -28.123464584350586, "global_step": 661762, "epoch": 7973} {"train_loss": -27.832738876342773, "global_step": 661763, "epoch": 7973} {"train_loss": -27.765710830688477, "global_step": 661764, "epoch": 7973} {"train_loss": -27.723529815673828, "global_step": 661765, "epoch": 7973} {"train_loss": -27.8876953125, "global_step": 661766, "epoch": 7973} {"train_loss": -27.562576293945312, "global_step": 661767, "epoch": 7973} {"train_loss": -27.75250816345215, "global_step": 661768, "epoch": 7973} {"train_loss": -27.444787979125977, "global_step": 661769, "epoch": 7973} {"train_loss": -27.71402359008789, "global_step": 661770, "epoch": 7973} {"train_loss": -27.4423885345459, "global_step": 661771, "epoch": 7973} {"train_loss": -27.71650505065918, "global_step": 661772, "epoch": 7973} {"train_loss": -27.928308486938477, "global_step": 661773, "epoch": 7973} {"train_loss": -27.545164108276367, "global_step": 661774, "epoch": 7973} {"train_loss": -27.954919815063477, "global_step": 661775, "epoch": 7973} {"train_loss": -28.226831436157227, "global_step": 661776, "epoch": 7973} {"train_loss": -28.021162033081055, "global_step": 661777, "epoch": 7973} {"train_loss": -27.934650421142578, "global_step": 661778, "epoch": 7973} {"train_loss": -27.699010848999023, "global_step": 661779, "epoch": 7973} {"train_loss": -27.629337310791016, "global_step": 661780, "epoch": 7973} {"train_loss": -27.842260360717773, "global_step": 661781, "epoch": 7973} {"train_loss": -28.08839225769043, "global_step": 661782, "epoch": 7973} {"train_loss": -28.45267105102539, "global_step": 661783, "epoch": 7973} {"train_loss": -27.77736473083496, "global_step": 661784, "epoch": 7973} {"train_loss": -28.060932159423828, "global_step": 661785, "epoch": 7973} {"train_loss": -27.80512046813965, "global_step": 661786, "epoch": 7973} {"train_loss": -28.0939998626709, "global_step": 661787, "epoch": 7973} {"train_loss": -28.65878677368164, "global_step": 661788, "epoch": 7973} {"train_loss": -28.098285675048828, "global_step": 661789, "epoch": 7973} {"train_loss": -28.240095138549805, "global_step": 661790, "epoch": 7973} {"train_loss": -28.267658233642578, "global_step": 661791, "epoch": 7973} {"train_loss": -28.52911376953125, "global_step": 661792, "epoch": 7973} {"train_loss": -28.53887939453125, "global_step": 661793, "epoch": 7973} {"train_loss": -28.65998649597168, "global_step": 661794, "epoch": 7973} {"train_loss": -28.552297592163086, "global_step": 661795, "epoch": 7973} {"train_loss": -28.094165802001953, "global_step": 661796, "epoch": 7973} {"train_loss": -28.633472442626953, "global_step": 661797, "epoch": 7973} {"train_loss": -28.4792423248291, "global_step": 661798, "epoch": 7973} {"train_loss": -28.178171157836914, "global_step": 661799, "epoch": 7973} {"train_loss": -28.1939640045166, "global_step": 661800, "epoch": 7973} {"train_loss": -28.345722198486328, "global_step": 661801, "epoch": 7973} {"train_loss": -28.486053466796875, "global_step": 661802, "epoch": 7973} {"train_loss": -28.70713233947754, "global_step": 661803, "epoch": 7973} {"train_loss": -28.57826805114746, "global_step": 661804, "epoch": 7973} {"train_loss": -28.44745445251465, "global_step": 661805, "epoch": 7973} {"train_loss": -28.341766357421875, "global_step": 661806, "epoch": 7973} {"train_loss": -28.963407516479492, "global_step": 661807, "epoch": 7973} {"train_loss": -28.351606369018555, "global_step": 661808, "epoch": 7973} {"train_loss": -28.733396530151367, "global_step": 661809, "epoch": 7973} {"train_loss": -28.300525665283203, "global_step": 661810, "epoch": 7973} {"train_loss": -28.225996017456055, "global_step": 661811, "epoch": 7973} {"train_loss": -28.138813018798828, "global_step": 661812, "epoch": 7973} {"train_loss": -28.25556755065918, "global_step": 661813, "epoch": 7973} {"train_loss": -28.581134796142578, "global_step": 661814, "epoch": 7973} {"train_loss": -28.392663955688477, "global_step": 661815, "epoch": 7973} {"train_loss": -28.01984214782715, "global_step": 661816, "epoch": 7973} {"train_loss": -27.978872299194336, "global_step": 661817, "epoch": 7973} {"train_loss": -28.333288192749023, "global_step": 661818, "epoch": 7973} {"train_loss": -28.32465934753418, "global_step": 661819, "epoch": 7973} {"train_loss": -28.255834579467773, "global_step": 661820, "epoch": 7973} {"train_loss": -28.773656845092773, "global_step": 661821, "epoch": 7973} {"train_loss": -28.623916625976562, "global_step": 661822, "epoch": 7973} {"train_loss": -28.34766960144043, "global_step": 661823, "epoch": 7973} {"train_loss": -28.506635665893555, "global_step": 661824, "epoch": 7973} {"train_loss": -28.46335792541504, "global_step": 661825, "epoch": 7973} {"train_loss": -28.620038986206055, "global_step": 661826, "epoch": 7973} {"train_loss": -28.419645309448242, "global_step": 661827, "epoch": 7973} {"train_loss": -28.400869369506836, "global_step": 661828, "epoch": 7973} {"train_loss": -28.290191650390625, "global_step": 661829, "epoch": 7973} {"train_loss": -28.181766510009766, "global_step": 661830, "epoch": 7973} {"train_loss": -28.41102409362793, "global_step": 661831, "epoch": 7973} {"train_loss": -28.765417098999023, "global_step": 661832, "epoch": 7973} {"train_loss": -28.170801162719727, "global_step": 661833, "epoch": 7973} {"train_loss": -28.044666290283203, "global_step": 661834, "epoch": 7973} {"train_loss": -28.61488151550293, "global_step": 661835, "epoch": 7973} {"train_loss": -28.256677627563477, "global_step": 661836, "epoch": 7973} {"train_loss": -28.618432998657227, "global_step": 661837, "epoch": 7973} {"train_loss": -28.21685218811035, "global_step": 661838, "epoch": 7973} {"train_loss": -28.390127182006836, "global_step": 661839, "epoch": 7973} {"train_loss": -28.156768798828125, "global_step": 661840, "epoch": 7973} {"train_loss": -28.22099180106657, "global_step": 661841, "epoch": 7973, "val_loss": 6571903.0} {"train_loss": -28.134078979492188, "global_step": 661842, "epoch": 7974} {"train_loss": -27.131011962890625, "global_step": 661843, "epoch": 7974} {"train_loss": -27.570789337158203, "global_step": 661844, "epoch": 7974} {"train_loss": -27.540414810180664, "global_step": 661845, "epoch": 7974} {"train_loss": -28.198545455932617, "global_step": 661846, "epoch": 7974} {"train_loss": -27.834882736206055, "global_step": 661847, "epoch": 7974} {"train_loss": -27.76954460144043, "global_step": 661848, "epoch": 7974} {"train_loss": -28.02911376953125, "global_step": 661849, "epoch": 7974} {"train_loss": -27.89088249206543, "global_step": 661850, "epoch": 7974} {"train_loss": -27.52153968811035, "global_step": 661851, "epoch": 7974} {"train_loss": -27.9345760345459, "global_step": 661852, "epoch": 7974} {"train_loss": -27.969131469726562, "global_step": 661853, "epoch": 7974} {"train_loss": -27.901996612548828, "global_step": 661854, "epoch": 7974} {"train_loss": -27.792280197143555, "global_step": 661855, "epoch": 7974} {"train_loss": -27.990625381469727, "global_step": 661856, "epoch": 7974} {"train_loss": -27.940160751342773, "global_step": 661857, "epoch": 7974} {"train_loss": -27.866735458374023, "global_step": 661858, "epoch": 7974} {"train_loss": -28.105823516845703, "global_step": 661859, "epoch": 7974} {"train_loss": -27.924097061157227, "global_step": 661860, "epoch": 7974} {"train_loss": -27.980743408203125, "global_step": 661861, "epoch": 7974} {"train_loss": -27.972578048706055, "global_step": 661862, "epoch": 7974} {"train_loss": -27.811450958251953, "global_step": 661863, "epoch": 7974} {"train_loss": -27.98862075805664, "global_step": 661864, "epoch": 7974} {"train_loss": -27.8631591796875, "global_step": 661865, "epoch": 7974} {"train_loss": -28.067947387695312, "global_step": 661866, "epoch": 7974} {"train_loss": -28.434497833251953, "global_step": 661867, "epoch": 7974} {"train_loss": -28.358966827392578, "global_step": 661868, "epoch": 7974} {"train_loss": -28.671438217163086, "global_step": 661869, "epoch": 7974} {"train_loss": -28.0062198638916, "global_step": 661870, "epoch": 7974} {"train_loss": -28.061864852905273, "global_step": 661871, "epoch": 7974} {"train_loss": -28.2049560546875, "global_step": 661872, "epoch": 7974} {"train_loss": -28.415510177612305, "global_step": 661873, "epoch": 7974} {"train_loss": -28.491077423095703, "global_step": 661874, "epoch": 7974} {"train_loss": -27.68084716796875, "global_step": 661875, "epoch": 7974} {"train_loss": -28.3035831451416, "global_step": 661876, "epoch": 7974} {"train_loss": -27.88727378845215, "global_step": 661877, "epoch": 7974} {"train_loss": -28.02106285095215, "global_step": 661878, "epoch": 7974} {"train_loss": -28.7130184173584, "global_step": 661879, "epoch": 7974} {"train_loss": -28.09698486328125, "global_step": 661880, "epoch": 7974} {"train_loss": -28.449726104736328, "global_step": 661881, "epoch": 7974} {"train_loss": -28.450788497924805, "global_step": 661882, "epoch": 7974} {"train_loss": -27.94415855407715, "global_step": 661883, "epoch": 7974} {"train_loss": -28.133319854736328, "global_step": 661884, "epoch": 7974} {"train_loss": -28.3671817779541, "global_step": 661885, "epoch": 7974} {"train_loss": -28.152185440063477, "global_step": 661886, "epoch": 7974} {"train_loss": -28.004230499267578, "global_step": 661887, "epoch": 7974} {"train_loss": -28.1528377532959, "global_step": 661888, "epoch": 7974} {"train_loss": -28.443042755126953, "global_step": 661889, "epoch": 7974} {"train_loss": -28.33692741394043, "global_step": 661890, "epoch": 7974} {"train_loss": -28.491376876831055, "global_step": 661891, "epoch": 7974} {"train_loss": -28.433095932006836, "global_step": 661892, "epoch": 7974} {"train_loss": -28.177322387695312, "global_step": 661893, "epoch": 7974} {"train_loss": -28.314294815063477, "global_step": 661894, "epoch": 7974} {"train_loss": -28.6483097076416, "global_step": 661895, "epoch": 7974} {"train_loss": -28.782968521118164, "global_step": 661896, "epoch": 7974} {"train_loss": -28.8172607421875, "global_step": 661897, "epoch": 7974} {"train_loss": -28.16302490234375, "global_step": 661898, "epoch": 7974} {"train_loss": -28.528181076049805, "global_step": 661899, "epoch": 7974} {"train_loss": -28.556507110595703, "global_step": 661900, "epoch": 7974} {"train_loss": -28.322128295898438, "global_step": 661901, "epoch": 7974} {"train_loss": -28.6571044921875, "global_step": 661902, "epoch": 7974} {"train_loss": -28.677701950073242, "global_step": 661903, "epoch": 7974} {"train_loss": -28.36952781677246, "global_step": 661904, "epoch": 7974} {"train_loss": -28.43842124938965, "global_step": 661905, "epoch": 7974} {"train_loss": -28.361066818237305, "global_step": 661906, "epoch": 7974} {"train_loss": -28.301010131835938, "global_step": 661907, "epoch": 7974} {"train_loss": -28.496383666992188, "global_step": 661908, "epoch": 7974} {"train_loss": -28.654260635375977, "global_step": 661909, "epoch": 7974} {"train_loss": -28.287872314453125, "global_step": 661910, "epoch": 7974} {"train_loss": -28.673725128173828, "global_step": 661911, "epoch": 7974} {"train_loss": -28.37708854675293, "global_step": 661912, "epoch": 7974} {"train_loss": -28.793426513671875, "global_step": 661913, "epoch": 7974} {"train_loss": -28.304569244384766, "global_step": 661914, "epoch": 7974} {"train_loss": -28.85993003845215, "global_step": 661915, "epoch": 7974} {"train_loss": -28.7937068939209, "global_step": 661916, "epoch": 7974} {"train_loss": -28.30034828186035, "global_step": 661917, "epoch": 7974} {"train_loss": -28.4299373626709, "global_step": 661918, "epoch": 7974} {"train_loss": -28.498931884765625, "global_step": 661919, "epoch": 7974} {"train_loss": -28.496912002563477, "global_step": 661920, "epoch": 7974} {"train_loss": -28.671894073486328, "global_step": 661921, "epoch": 7974} {"train_loss": -28.461624145507812, "global_step": 661922, "epoch": 7974} {"train_loss": -28.534393310546875, "global_step": 661923, "epoch": 7974} {"train_loss": -28.24623753651079, "global_step": 661924, "epoch": 7974, "val_loss": 6667483.0} {"train_loss": -27.00242042541504, "global_step": 661925, "epoch": 7975} {"train_loss": -26.51076316833496, "global_step": 661926, "epoch": 7975} {"train_loss": -25.5657901763916, "global_step": 661927, "epoch": 7975} {"train_loss": -26.55500602722168, "global_step": 661928, "epoch": 7975} {"train_loss": -27.58978271484375, "global_step": 661929, "epoch": 7975} {"train_loss": -26.302091598510742, "global_step": 661930, "epoch": 7975} {"train_loss": -26.954797744750977, "global_step": 661931, "epoch": 7975} {"train_loss": -27.065343856811523, "global_step": 661932, "epoch": 7975} {"train_loss": -27.338180541992188, "global_step": 661933, "epoch": 7975} {"train_loss": -27.075769424438477, "global_step": 661934, "epoch": 7975} {"train_loss": -27.4345760345459, "global_step": 661935, "epoch": 7975} {"train_loss": -27.723037719726562, "global_step": 661936, "epoch": 7975} {"train_loss": -27.419513702392578, "global_step": 661937, "epoch": 7975} {"train_loss": -27.52924919128418, "global_step": 661938, "epoch": 7975} {"train_loss": -27.435400009155273, "global_step": 661939, "epoch": 7975} {"train_loss": -27.50868034362793, "global_step": 661940, "epoch": 7975} {"train_loss": -27.384489059448242, "global_step": 661941, "epoch": 7975} {"train_loss": -27.842634201049805, "global_step": 661942, "epoch": 7975} {"train_loss": -27.493045806884766, "global_step": 661943, "epoch": 7975} {"train_loss": -27.51974868774414, "global_step": 661944, "epoch": 7975} {"train_loss": -27.255172729492188, "global_step": 661945, "epoch": 7975} {"train_loss": -27.331003189086914, "global_step": 661946, "epoch": 7975} {"train_loss": -27.947492599487305, "global_step": 661947, "epoch": 7975} {"train_loss": -27.896869659423828, "global_step": 661948, "epoch": 7975} {"train_loss": -27.8349609375, "global_step": 661949, "epoch": 7975} {"train_loss": -28.338220596313477, "global_step": 661950, "epoch": 7975} {"train_loss": -28.14288902282715, "global_step": 661951, "epoch": 7975} {"train_loss": -27.777334213256836, "global_step": 661952, "epoch": 7975} {"train_loss": -28.056325912475586, "global_step": 661953, "epoch": 7975} {"train_loss": -27.973459243774414, "global_step": 661954, "epoch": 7975} {"train_loss": -28.0747013092041, "global_step": 661955, "epoch": 7975} {"train_loss": -27.945119857788086, "global_step": 661956, "epoch": 7975} {"train_loss": -27.812875747680664, "global_step": 661957, "epoch": 7975} {"train_loss": -28.01991081237793, "global_step": 661958, "epoch": 7975} {"train_loss": -27.890888214111328, "global_step": 661959, "epoch": 7975} {"train_loss": -28.27961540222168, "global_step": 661960, "epoch": 7975} {"train_loss": -28.146133422851562, "global_step": 661961, "epoch": 7975} {"train_loss": -27.895360946655273, "global_step": 661962, "epoch": 7975} {"train_loss": -28.305404663085938, "global_step": 661963, "epoch": 7975} {"train_loss": -28.379032135009766, "global_step": 661964, "epoch": 7975} {"train_loss": -28.34696388244629, "global_step": 661965, "epoch": 7975} {"train_loss": -28.212926864624023, "global_step": 661966, "epoch": 7975} {"train_loss": -28.166635513305664, "global_step": 661967, "epoch": 7975} {"train_loss": -28.541976928710938, "global_step": 661968, "epoch": 7975} {"train_loss": -28.427412033081055, "global_step": 661969, "epoch": 7975} {"train_loss": -28.630956649780273, "global_step": 661970, "epoch": 7975} {"train_loss": -28.464155197143555, "global_step": 661971, "epoch": 7975} {"train_loss": -28.691076278686523, "global_step": 661972, "epoch": 7975} {"train_loss": -28.610488891601562, "global_step": 661973, "epoch": 7975} {"train_loss": -28.095800399780273, "global_step": 661974, "epoch": 7975} {"train_loss": -28.6120548248291, "global_step": 661975, "epoch": 7975} {"train_loss": -28.54850196838379, "global_step": 661976, "epoch": 7975} {"train_loss": -28.418354034423828, "global_step": 661977, "epoch": 7975} {"train_loss": -28.3258113861084, "global_step": 661978, "epoch": 7975} {"train_loss": -28.600622177124023, "global_step": 661979, "epoch": 7975} {"train_loss": -28.366003036499023, "global_step": 661980, "epoch": 7975} {"train_loss": -28.60171890258789, "global_step": 661981, "epoch": 7975} {"train_loss": -28.56549072265625, "global_step": 661982, "epoch": 7975} {"train_loss": -28.266788482666016, "global_step": 661983, "epoch": 7975} {"train_loss": -28.75836753845215, "global_step": 661984, "epoch": 7975} {"train_loss": -28.779356002807617, "global_step": 661985, "epoch": 7975} {"train_loss": -28.682159423828125, "global_step": 661986, "epoch": 7975} {"train_loss": -28.554187774658203, "global_step": 661987, "epoch": 7975} {"train_loss": -28.27701759338379, "global_step": 661988, "epoch": 7975} {"train_loss": -29.01338005065918, "global_step": 661989, "epoch": 7975} {"train_loss": -28.401220321655273, "global_step": 661990, "epoch": 7975} {"train_loss": -28.71095848083496, "global_step": 661991, "epoch": 7975} {"train_loss": -28.637052536010742, "global_step": 661992, "epoch": 7975} {"train_loss": -28.709753036499023, "global_step": 661993, "epoch": 7975} {"train_loss": -28.873544692993164, "global_step": 661994, "epoch": 7975} {"train_loss": -28.289112091064453, "global_step": 661995, "epoch": 7975} {"train_loss": -28.477828979492188, "global_step": 661996, "epoch": 7975} {"train_loss": -28.44964599609375, "global_step": 661997, "epoch": 7975} {"train_loss": -28.07240867614746, "global_step": 661998, "epoch": 7975} {"train_loss": -28.376123428344727, "global_step": 661999, "epoch": 7975} {"train_loss": -28.859699249267578, "global_step": 662000, "epoch": 7975} {"train_loss": -28.287494659423828, "global_step": 662001, "epoch": 7975} {"train_loss": -28.4444522857666, "global_step": 662002, "epoch": 7975} {"train_loss": -28.414587020874023, "global_step": 662003, "epoch": 7975} {"train_loss": -28.136188507080078, "global_step": 662004, "epoch": 7975} {"train_loss": -27.64405632019043, "global_step": 662005, "epoch": 7975} {"train_loss": -27.470678329467773, "global_step": 662006, "epoch": 7975} {"train_loss": -28.018346005175488, "global_step": 662007, "epoch": 7975, "val_loss": 6656008.0} {"train_loss": -26.75178337097168, "global_step": 662008, "epoch": 7976} {"train_loss": -27.1556453704834, "global_step": 662009, "epoch": 7976} {"train_loss": -27.560277938842773, "global_step": 662010, "epoch": 7976} {"train_loss": -27.351306915283203, "global_step": 662011, "epoch": 7976} {"train_loss": -27.521146774291992, "global_step": 662012, "epoch": 7976} {"train_loss": -27.22041893005371, "global_step": 662013, "epoch": 7976} {"train_loss": -27.998456954956055, "global_step": 662014, "epoch": 7976} {"train_loss": -27.63160514831543, "global_step": 662015, "epoch": 7976} {"train_loss": -27.459552764892578, "global_step": 662016, "epoch": 7976} {"train_loss": -27.812238693237305, "global_step": 662017, "epoch": 7976} {"train_loss": -27.649662017822266, "global_step": 662018, "epoch": 7976} {"train_loss": -27.650415420532227, "global_step": 662019, "epoch": 7976} {"train_loss": -27.68096351623535, "global_step": 662020, "epoch": 7976} {"train_loss": -28.375202178955078, "global_step": 662021, "epoch": 7976} {"train_loss": -27.559141159057617, "global_step": 662022, "epoch": 7976} {"train_loss": -28.194456100463867, "global_step": 662023, "epoch": 7976} {"train_loss": -27.60527992248535, "global_step": 662024, "epoch": 7976} {"train_loss": -27.80256462097168, "global_step": 662025, "epoch": 7976} {"train_loss": -28.033771514892578, "global_step": 662026, "epoch": 7976} {"train_loss": -27.911407470703125, "global_step": 662027, "epoch": 7976} {"train_loss": -28.30512809753418, "global_step": 662028, "epoch": 7976} {"train_loss": -28.080915451049805, "global_step": 662029, "epoch": 7976} {"train_loss": -27.81611442565918, "global_step": 662030, "epoch": 7976} {"train_loss": -27.927743911743164, "global_step": 662031, "epoch": 7976} {"train_loss": -28.218372344970703, "global_step": 662032, "epoch": 7976} {"train_loss": -28.043487548828125, "global_step": 662033, "epoch": 7976} {"train_loss": -28.234516143798828, "global_step": 662034, "epoch": 7976} {"train_loss": -28.13140869140625, "global_step": 662035, "epoch": 7976} {"train_loss": -28.32330322265625, "global_step": 662036, "epoch": 7976} {"train_loss": -28.301313400268555, "global_step": 662037, "epoch": 7976} {"train_loss": -28.248950958251953, "global_step": 662038, "epoch": 7976} {"train_loss": -28.496204376220703, "global_step": 662039, "epoch": 7976} {"train_loss": -28.478992462158203, "global_step": 662040, "epoch": 7976} {"train_loss": -28.51869010925293, "global_step": 662041, "epoch": 7976} {"train_loss": -28.44733238220215, "global_step": 662042, "epoch": 7976} {"train_loss": -28.404306411743164, "global_step": 662043, "epoch": 7976} {"train_loss": -28.778888702392578, "global_step": 662044, "epoch": 7976} {"train_loss": -28.261178970336914, "global_step": 662045, "epoch": 7976} {"train_loss": -28.60377311706543, "global_step": 662046, "epoch": 7976} {"train_loss": -28.568994522094727, "global_step": 662047, "epoch": 7976} {"train_loss": -28.629779815673828, "global_step": 662048, "epoch": 7976} {"train_loss": -28.35945701599121, "global_step": 662049, "epoch": 7976} {"train_loss": -28.155126571655273, "global_step": 662050, "epoch": 7976} {"train_loss": -28.82575035095215, "global_step": 662051, "epoch": 7976} {"train_loss": -28.7857608795166, "global_step": 662052, "epoch": 7976} {"train_loss": -28.18984031677246, "global_step": 662053, "epoch": 7976} {"train_loss": -28.73540687561035, "global_step": 662054, "epoch": 7976} {"train_loss": -28.1295223236084, "global_step": 662055, "epoch": 7976} {"train_loss": -28.47003746032715, "global_step": 662056, "epoch": 7976} {"train_loss": -28.519922256469727, "global_step": 662057, "epoch": 7976} {"train_loss": -28.804977416992188, "global_step": 662058, "epoch": 7976} {"train_loss": -28.596906661987305, "global_step": 662059, "epoch": 7976} {"train_loss": -28.477554321289062, "global_step": 662060, "epoch": 7976} {"train_loss": -28.9781551361084, "global_step": 662061, "epoch": 7976} {"train_loss": -28.17982292175293, "global_step": 662062, "epoch": 7976} {"train_loss": -28.414081573486328, "global_step": 662063, "epoch": 7976} {"train_loss": -28.017629623413086, "global_step": 662064, "epoch": 7976} {"train_loss": -28.196380615234375, "global_step": 662065, "epoch": 7976} {"train_loss": -28.387174606323242, "global_step": 662066, "epoch": 7976} {"train_loss": -28.604745864868164, "global_step": 662067, "epoch": 7976} {"train_loss": -28.781082153320312, "global_step": 662068, "epoch": 7976} {"train_loss": -28.417463302612305, "global_step": 662069, "epoch": 7976} {"train_loss": -28.4127254486084, "global_step": 662070, "epoch": 7976} {"train_loss": -28.270719528198242, "global_step": 662071, "epoch": 7976} {"train_loss": -28.100223541259766, "global_step": 662072, "epoch": 7976} {"train_loss": -28.569660186767578, "global_step": 662073, "epoch": 7976} {"train_loss": -28.531005859375, "global_step": 662074, "epoch": 7976} {"train_loss": -28.27845573425293, "global_step": 662075, "epoch": 7976} {"train_loss": -27.936071395874023, "global_step": 662076, "epoch": 7976} {"train_loss": -28.22653579711914, "global_step": 662077, "epoch": 7976} {"train_loss": -28.74570655822754, "global_step": 662078, "epoch": 7976} {"train_loss": -28.441389083862305, "global_step": 662079, "epoch": 7976} {"train_loss": -28.195667266845703, "global_step": 662080, "epoch": 7976} {"train_loss": -28.213132858276367, "global_step": 662081, "epoch": 7976} {"train_loss": -28.035486221313477, "global_step": 662082, "epoch": 7976} {"train_loss": -28.385913848876953, "global_step": 662083, "epoch": 7976} {"train_loss": -28.517932891845703, "global_step": 662084, "epoch": 7976} {"train_loss": -27.75794792175293, "global_step": 662085, "epoch": 7976} {"train_loss": -27.57940101623535, "global_step": 662086, "epoch": 7976} {"train_loss": -27.960575103759766, "global_step": 662087, "epoch": 7976} {"train_loss": -28.476449966430664, "global_step": 662088, "epoch": 7976} {"train_loss": -28.21755027770996, "global_step": 662089, "epoch": 7976} {"train_loss": -28.18342243332461, "global_step": 662090, "epoch": 7976, "val_loss": 6661775.5} {"train_loss": -27.489709854125977, "global_step": 662091, "epoch": 7977} {"train_loss": -27.304487228393555, "global_step": 662092, "epoch": 7977} {"train_loss": -27.242292404174805, "global_step": 662093, "epoch": 7977} {"train_loss": -27.730865478515625, "global_step": 662094, "epoch": 7977} {"train_loss": -27.587610244750977, "global_step": 662095, "epoch": 7977} {"train_loss": -27.886648178100586, "global_step": 662096, "epoch": 7977} {"train_loss": -27.593524932861328, "global_step": 662097, "epoch": 7977} {"train_loss": -28.13970375061035, "global_step": 662098, "epoch": 7977} {"train_loss": -27.887191772460938, "global_step": 662099, "epoch": 7977} {"train_loss": -28.520177841186523, "global_step": 662100, "epoch": 7977} {"train_loss": -27.94819450378418, "global_step": 662101, "epoch": 7977} {"train_loss": -28.25589942932129, "global_step": 662102, "epoch": 7977} {"train_loss": -27.930267333984375, "global_step": 662103, "epoch": 7977} {"train_loss": -28.181716918945312, "global_step": 662104, "epoch": 7977} {"train_loss": -28.12984275817871, "global_step": 662105, "epoch": 7977} {"train_loss": -27.72181510925293, "global_step": 662106, "epoch": 7977} {"train_loss": -28.0909481048584, "global_step": 662107, "epoch": 7977} {"train_loss": -28.246891021728516, "global_step": 662108, "epoch": 7977} {"train_loss": -28.10340690612793, "global_step": 662109, "epoch": 7977} {"train_loss": -28.20440101623535, "global_step": 662110, "epoch": 7977} {"train_loss": -28.41379737854004, "global_step": 662111, "epoch": 7977} {"train_loss": -28.181324005126953, "global_step": 662112, "epoch": 7977} {"train_loss": -28.106542587280273, "global_step": 662113, "epoch": 7977} {"train_loss": -28.417438507080078, "global_step": 662114, "epoch": 7977} {"train_loss": -27.9881649017334, "global_step": 662115, "epoch": 7977} {"train_loss": -28.123184204101562, "global_step": 662116, "epoch": 7977} {"train_loss": -28.497623443603516, "global_step": 662117, "epoch": 7977} {"train_loss": -28.47224235534668, "global_step": 662118, "epoch": 7977} {"train_loss": -28.5230712890625, "global_step": 662119, "epoch": 7977} {"train_loss": -28.241941452026367, "global_step": 662120, "epoch": 7977} {"train_loss": -28.164520263671875, "global_step": 662121, "epoch": 7977} {"train_loss": -28.443317413330078, "global_step": 662122, "epoch": 7977} {"train_loss": -28.536340713500977, "global_step": 662123, "epoch": 7977} {"train_loss": -28.601154327392578, "global_step": 662124, "epoch": 7977} {"train_loss": -28.54133415222168, "global_step": 662125, "epoch": 7977} {"train_loss": -28.569589614868164, "global_step": 662126, "epoch": 7977} {"train_loss": -28.104888916015625, "global_step": 662127, "epoch": 7977} {"train_loss": -28.32356071472168, "global_step": 662128, "epoch": 7977} {"train_loss": -28.3216552734375, "global_step": 662129, "epoch": 7977} {"train_loss": -28.851245880126953, "global_step": 662130, "epoch": 7977} {"train_loss": -28.442768096923828, "global_step": 662131, "epoch": 7977} {"train_loss": -28.309701919555664, "global_step": 662132, "epoch": 7977} {"train_loss": -28.660531997680664, "global_step": 662133, "epoch": 7977} {"train_loss": -28.513660430908203, "global_step": 662134, "epoch": 7977} {"train_loss": -28.394697189331055, "global_step": 662135, "epoch": 7977} {"train_loss": -28.53496742248535, "global_step": 662136, "epoch": 7977} {"train_loss": -28.760839462280273, "global_step": 662137, "epoch": 7977} {"train_loss": -28.38840675354004, "global_step": 662138, "epoch": 7977} {"train_loss": -28.504125595092773, "global_step": 662139, "epoch": 7977} {"train_loss": -28.839941024780273, "global_step": 662140, "epoch": 7977} {"train_loss": -28.637725830078125, "global_step": 662141, "epoch": 7977} {"train_loss": -28.40851402282715, "global_step": 662142, "epoch": 7977} {"train_loss": -28.49195671081543, "global_step": 662143, "epoch": 7977} {"train_loss": -28.417097091674805, "global_step": 662144, "epoch": 7977} {"train_loss": -28.41853904724121, "global_step": 662145, "epoch": 7977} {"train_loss": -28.238866806030273, "global_step": 662146, "epoch": 7977} {"train_loss": -28.117694854736328, "global_step": 662147, "epoch": 7977} {"train_loss": -28.19993019104004, "global_step": 662148, "epoch": 7977} {"train_loss": -28.34698486328125, "global_step": 662149, "epoch": 7977} {"train_loss": -28.5360107421875, "global_step": 662150, "epoch": 7977} {"train_loss": -28.13954734802246, "global_step": 662151, "epoch": 7977} {"train_loss": -27.585052490234375, "global_step": 662152, "epoch": 7977} {"train_loss": -27.925336837768555, "global_step": 662153, "epoch": 7977} {"train_loss": -28.238882064819336, "global_step": 662154, "epoch": 7977} {"train_loss": -26.9112606048584, "global_step": 662155, "epoch": 7977} {"train_loss": -26.0721435546875, "global_step": 662156, "epoch": 7977} {"train_loss": -27.634748458862305, "global_step": 662157, "epoch": 7977} {"train_loss": -27.388395309448242, "global_step": 662158, "epoch": 7977} {"train_loss": -27.4429988861084, "global_step": 662159, "epoch": 7977} {"train_loss": -27.615930557250977, "global_step": 662160, "epoch": 7977} {"train_loss": -28.069171905517578, "global_step": 662161, "epoch": 7977} {"train_loss": -27.66570472717285, "global_step": 662162, "epoch": 7977} {"train_loss": -28.017980575561523, "global_step": 662163, "epoch": 7977} {"train_loss": -27.865203857421875, "global_step": 662164, "epoch": 7977} {"train_loss": -28.099103927612305, "global_step": 662165, "epoch": 7977} {"train_loss": -27.779678344726562, "global_step": 662166, "epoch": 7977} {"train_loss": -28.047332763671875, "global_step": 662167, "epoch": 7977} {"train_loss": -28.028783798217773, "global_step": 662168, "epoch": 7977} {"train_loss": -27.92119789123535, "global_step": 662169, "epoch": 7977} {"train_loss": -28.439544677734375, "global_step": 662170, "epoch": 7977} {"train_loss": -28.037023544311523, "global_step": 662171, "epoch": 7977} {"train_loss": -28.32080078125, "global_step": 662172, "epoch": 7977} {"train_loss": -28.12639574257724, "global_step": 662173, "epoch": 7977, "val_loss": 6712206.0} {"train_loss": -27.72641372680664, "global_step": 662174, "epoch": 7978} {"train_loss": -27.910324096679688, "global_step": 662175, "epoch": 7978} {"train_loss": -27.61561393737793, "global_step": 662176, "epoch": 7978} {"train_loss": -27.817453384399414, "global_step": 662177, "epoch": 7978} {"train_loss": -27.93951416015625, "global_step": 662178, "epoch": 7978} {"train_loss": -27.964597702026367, "global_step": 662179, "epoch": 7978} {"train_loss": -28.02100944519043, "global_step": 662180, "epoch": 7978} {"train_loss": -28.09891128540039, "global_step": 662181, "epoch": 7978} {"train_loss": -27.851125717163086, "global_step": 662182, "epoch": 7978} {"train_loss": -28.21523094177246, "global_step": 662183, "epoch": 7978} {"train_loss": -27.933507919311523, "global_step": 662184, "epoch": 7978} {"train_loss": -28.140533447265625, "global_step": 662185, "epoch": 7978} {"train_loss": -27.8784236907959, "global_step": 662186, "epoch": 7978} {"train_loss": -27.956329345703125, "global_step": 662187, "epoch": 7978} {"train_loss": -28.334457397460938, "global_step": 662188, "epoch": 7978} {"train_loss": -28.15009880065918, "global_step": 662189, "epoch": 7978} {"train_loss": -28.463891983032227, "global_step": 662190, "epoch": 7978} {"train_loss": -28.1029052734375, "global_step": 662191, "epoch": 7978} {"train_loss": -28.699705123901367, "global_step": 662192, "epoch": 7978} {"train_loss": -28.2768497467041, "global_step": 662193, "epoch": 7978} {"train_loss": -27.943164825439453, "global_step": 662194, "epoch": 7978} {"train_loss": -28.292078018188477, "global_step": 662195, "epoch": 7978} {"train_loss": -28.584381103515625, "global_step": 662196, "epoch": 7978} {"train_loss": -28.383346557617188, "global_step": 662197, "epoch": 7978} {"train_loss": -28.326175689697266, "global_step": 662198, "epoch": 7978} {"train_loss": -28.489511489868164, "global_step": 662199, "epoch": 7978} {"train_loss": -28.338886260986328, "global_step": 662200, "epoch": 7978} {"train_loss": -28.801441192626953, "global_step": 662201, "epoch": 7978} {"train_loss": -28.34231948852539, "global_step": 662202, "epoch": 7978} {"train_loss": -28.517078399658203, "global_step": 662203, "epoch": 7978} {"train_loss": -28.14150047302246, "global_step": 662204, "epoch": 7978} {"train_loss": -28.2413330078125, "global_step": 662205, "epoch": 7978} {"train_loss": -28.204526901245117, "global_step": 662206, "epoch": 7978} {"train_loss": -28.057653427124023, "global_step": 662207, "epoch": 7978} {"train_loss": -28.18819236755371, "global_step": 662208, "epoch": 7978} {"train_loss": -28.398481369018555, "global_step": 662209, "epoch": 7978} {"train_loss": -27.843297958374023, "global_step": 662210, "epoch": 7978} {"train_loss": -28.076904296875, "global_step": 662211, "epoch": 7978} {"train_loss": -28.068613052368164, "global_step": 662212, "epoch": 7978} {"train_loss": -28.227231979370117, "global_step": 662213, "epoch": 7978} {"train_loss": -28.917402267456055, "global_step": 662214, "epoch": 7978} {"train_loss": -28.09818458557129, "global_step": 662215, "epoch": 7978} {"train_loss": -28.224756240844727, "global_step": 662216, "epoch": 7978} {"train_loss": -28.745508193969727, "global_step": 662217, "epoch": 7978} {"train_loss": -28.289987564086914, "global_step": 662218, "epoch": 7978} {"train_loss": -28.61348533630371, "global_step": 662219, "epoch": 7978} {"train_loss": -28.513341903686523, "global_step": 662220, "epoch": 7978} {"train_loss": -28.448434829711914, "global_step": 662221, "epoch": 7978} {"train_loss": -28.429723739624023, "global_step": 662222, "epoch": 7978} {"train_loss": -28.230274200439453, "global_step": 662223, "epoch": 7978} {"train_loss": -28.5933837890625, "global_step": 662224, "epoch": 7978} {"train_loss": -28.52197265625, "global_step": 662225, "epoch": 7978} {"train_loss": -28.3736572265625, "global_step": 662226, "epoch": 7978} {"train_loss": -28.540271759033203, "global_step": 662227, "epoch": 7978} {"train_loss": -28.320261001586914, "global_step": 662228, "epoch": 7978} {"train_loss": -28.561126708984375, "global_step": 662229, "epoch": 7978} {"train_loss": -28.610105514526367, "global_step": 662230, "epoch": 7978} {"train_loss": -28.568592071533203, "global_step": 662231, "epoch": 7978} {"train_loss": -28.64373779296875, "global_step": 662232, "epoch": 7978} {"train_loss": -28.645050048828125, "global_step": 662233, "epoch": 7978} {"train_loss": -28.660425186157227, "global_step": 662234, "epoch": 7978} {"train_loss": -28.50714683532715, "global_step": 662235, "epoch": 7978} {"train_loss": -28.749359130859375, "global_step": 662236, "epoch": 7978} {"train_loss": -28.498737335205078, "global_step": 662237, "epoch": 7978} {"train_loss": -28.696945190429688, "global_step": 662238, "epoch": 7978} {"train_loss": -28.424047470092773, "global_step": 662239, "epoch": 7978} {"train_loss": -28.59352684020996, "global_step": 662240, "epoch": 7978} {"train_loss": -27.975255966186523, "global_step": 662241, "epoch": 7978} {"train_loss": -28.196887969970703, "global_step": 662242, "epoch": 7978} {"train_loss": -28.239652633666992, "global_step": 662243, "epoch": 7978} {"train_loss": -28.258819580078125, "global_step": 662244, "epoch": 7978} {"train_loss": -28.479827880859375, "global_step": 662245, "epoch": 7978} {"train_loss": -28.256383895874023, "global_step": 662246, "epoch": 7978} {"train_loss": -28.260440826416016, "global_step": 662247, "epoch": 7978} {"train_loss": -27.966217041015625, "global_step": 662248, "epoch": 7978} {"train_loss": -28.39794921875, "global_step": 662249, "epoch": 7978} {"train_loss": -28.665470123291016, "global_step": 662250, "epoch": 7978} {"train_loss": -27.72846794128418, "global_step": 662251, "epoch": 7978} {"train_loss": -27.567174911499023, "global_step": 662252, "epoch": 7978} {"train_loss": -28.27630615234375, "global_step": 662253, "epoch": 7978} {"train_loss": -28.344879150390625, "global_step": 662254, "epoch": 7978} {"train_loss": -28.422510147094727, "global_step": 662255, "epoch": 7978} {"train_loss": -28.290707254984294, "global_step": 662256, "epoch": 7978, "val_loss": 6658533.5} {"train_loss": -27.71015739440918, "global_step": 662257, "epoch": 7979} {"train_loss": -27.711271286010742, "global_step": 662258, "epoch": 7979} {"train_loss": -27.95440673828125, "global_step": 662259, "epoch": 7979} {"train_loss": -28.069746017456055, "global_step": 662260, "epoch": 7979} {"train_loss": -27.69947624206543, "global_step": 662261, "epoch": 7979} {"train_loss": -28.131256103515625, "global_step": 662262, "epoch": 7979} {"train_loss": -28.05084800720215, "global_step": 662263, "epoch": 7979} {"train_loss": -28.302722930908203, "global_step": 662264, "epoch": 7979} {"train_loss": -28.08936882019043, "global_step": 662265, "epoch": 7979} {"train_loss": -28.36749267578125, "global_step": 662266, "epoch": 7979} {"train_loss": -28.368762969970703, "global_step": 662267, "epoch": 7979} {"train_loss": -28.341888427734375, "global_step": 662268, "epoch": 7979} {"train_loss": -28.227447509765625, "global_step": 662269, "epoch": 7979} {"train_loss": -28.673965454101562, "global_step": 662270, "epoch": 7979} {"train_loss": -28.119421005249023, "global_step": 662271, "epoch": 7979} {"train_loss": -28.550567626953125, "global_step": 662272, "epoch": 7979} {"train_loss": -28.47553825378418, "global_step": 662273, "epoch": 7979} {"train_loss": -28.24531364440918, "global_step": 662274, "epoch": 7979} {"train_loss": -28.42646598815918, "global_step": 662275, "epoch": 7979} {"train_loss": -28.525609970092773, "global_step": 662276, "epoch": 7979} {"train_loss": -28.344430923461914, "global_step": 662277, "epoch": 7979} {"train_loss": -28.470956802368164, "global_step": 662278, "epoch": 7979} {"train_loss": -28.539936065673828, "global_step": 662279, "epoch": 7979} {"train_loss": -28.09977149963379, "global_step": 662280, "epoch": 7979} {"train_loss": -28.211454391479492, "global_step": 662281, "epoch": 7979} {"train_loss": -27.778400421142578, "global_step": 662282, "epoch": 7979} {"train_loss": -27.565170288085938, "global_step": 662283, "epoch": 7979} {"train_loss": -28.28913688659668, "global_step": 662284, "epoch": 7979} {"train_loss": -28.33477783203125, "global_step": 662285, "epoch": 7979} {"train_loss": -28.073352813720703, "global_step": 662286, "epoch": 7979} {"train_loss": -28.255035400390625, "global_step": 662287, "epoch": 7979} {"train_loss": -28.4068660736084, "global_step": 662288, "epoch": 7979} {"train_loss": -28.30476188659668, "global_step": 662289, "epoch": 7979} {"train_loss": -28.290414810180664, "global_step": 662290, "epoch": 7979} {"train_loss": -28.48779296875, "global_step": 662291, "epoch": 7979} {"train_loss": -28.242124557495117, "global_step": 662292, "epoch": 7979} {"train_loss": -28.45562171936035, "global_step": 662293, "epoch": 7979} {"train_loss": -28.328699111938477, "global_step": 662294, "epoch": 7979} {"train_loss": -28.592748641967773, "global_step": 662295, "epoch": 7979} {"train_loss": -28.797718048095703, "global_step": 662296, "epoch": 7979} {"train_loss": -28.336950302124023, "global_step": 662297, "epoch": 7979} {"train_loss": -28.46766471862793, "global_step": 662298, "epoch": 7979} {"train_loss": -28.59644889831543, "global_step": 662299, "epoch": 7979} {"train_loss": -28.16189956665039, "global_step": 662300, "epoch": 7979} {"train_loss": -28.581274032592773, "global_step": 662301, "epoch": 7979} {"train_loss": -28.791370391845703, "global_step": 662302, "epoch": 7979} {"train_loss": -28.499258041381836, "global_step": 662303, "epoch": 7979} {"train_loss": -28.628549575805664, "global_step": 662304, "epoch": 7979} {"train_loss": -28.578893661499023, "global_step": 662305, "epoch": 7979} {"train_loss": -28.3314151763916, "global_step": 662306, "epoch": 7979} {"train_loss": -28.501449584960938, "global_step": 662307, "epoch": 7979} {"train_loss": -28.3189640045166, "global_step": 662308, "epoch": 7979} {"train_loss": -28.463581085205078, "global_step": 662309, "epoch": 7979} {"train_loss": -28.46001625061035, "global_step": 662310, "epoch": 7979} {"train_loss": -28.02168083190918, "global_step": 662311, "epoch": 7979} {"train_loss": -27.6236629486084, "global_step": 662312, "epoch": 7979} {"train_loss": -27.278045654296875, "global_step": 662313, "epoch": 7979} {"train_loss": -27.880313873291016, "global_step": 662314, "epoch": 7979} {"train_loss": -28.3449764251709, "global_step": 662315, "epoch": 7979} {"train_loss": -28.411664962768555, "global_step": 662316, "epoch": 7979} {"train_loss": -28.039926528930664, "global_step": 662317, "epoch": 7979} {"train_loss": -27.975683212280273, "global_step": 662318, "epoch": 7979} {"train_loss": -28.21990394592285, "global_step": 662319, "epoch": 7979} {"train_loss": -28.32379150390625, "global_step": 662320, "epoch": 7979} {"train_loss": -28.02439308166504, "global_step": 662321, "epoch": 7979} {"train_loss": -28.1522216796875, "global_step": 662322, "epoch": 7979} {"train_loss": -28.114273071289062, "global_step": 662323, "epoch": 7979} {"train_loss": -27.761510848999023, "global_step": 662324, "epoch": 7979} {"train_loss": -28.513187408447266, "global_step": 662325, "epoch": 7979} {"train_loss": -28.102588653564453, "global_step": 662326, "epoch": 7979} {"train_loss": -28.446252822875977, "global_step": 662327, "epoch": 7979} {"train_loss": -27.875167846679688, "global_step": 662328, "epoch": 7979} {"train_loss": -28.43928337097168, "global_step": 662329, "epoch": 7979} {"train_loss": -28.17457389831543, "global_step": 662330, "epoch": 7979} {"train_loss": -28.32284927368164, "global_step": 662331, "epoch": 7979} {"train_loss": -28.330535888671875, "global_step": 662332, "epoch": 7979} {"train_loss": -28.495344161987305, "global_step": 662333, "epoch": 7979} {"train_loss": -28.6683406829834, "global_step": 662334, "epoch": 7979} {"train_loss": -28.154027938842773, "global_step": 662335, "epoch": 7979} {"train_loss": -28.4744873046875, "global_step": 662336, "epoch": 7979} {"train_loss": -28.347379684448242, "global_step": 662337, "epoch": 7979} {"train_loss": -28.599262237548828, "global_step": 662338, "epoch": 7979} {"train_loss": -28.265500401876057, "global_step": 662339, "epoch": 7979, "val_loss": 6627094.5} {"train_loss": -27.599424362182617, "global_step": 662340, "epoch": 7980} {"train_loss": -26.551122665405273, "global_step": 662341, "epoch": 7980} {"train_loss": -25.686025619506836, "global_step": 662342, "epoch": 7980} {"train_loss": -26.876020431518555, "global_step": 662343, "epoch": 7980} {"train_loss": -25.58827781677246, "global_step": 662344, "epoch": 7980} {"train_loss": -25.764795303344727, "global_step": 662345, "epoch": 7980} {"train_loss": -26.276996612548828, "global_step": 662346, "epoch": 7980} {"train_loss": -26.85365104675293, "global_step": 662347, "epoch": 7980} {"train_loss": -27.331457138061523, "global_step": 662348, "epoch": 7980} {"train_loss": -26.46111488342285, "global_step": 662349, "epoch": 7980} {"train_loss": -27.047653198242188, "global_step": 662350, "epoch": 7980} {"train_loss": -27.570514678955078, "global_step": 662351, "epoch": 7980} {"train_loss": -27.029386520385742, "global_step": 662352, "epoch": 7980} {"train_loss": -26.984960556030273, "global_step": 662353, "epoch": 7980} {"train_loss": -27.575393676757812, "global_step": 662354, "epoch": 7980} {"train_loss": -27.67416763305664, "global_step": 662355, "epoch": 7980} {"train_loss": -27.751779556274414, "global_step": 662356, "epoch": 7980} {"train_loss": -27.459115982055664, "global_step": 662357, "epoch": 7980} {"train_loss": -27.897809982299805, "global_step": 662358, "epoch": 7980} {"train_loss": -27.584278106689453, "global_step": 662359, "epoch": 7980} {"train_loss": -28.166244506835938, "global_step": 662360, "epoch": 7980} {"train_loss": -28.164447784423828, "global_step": 662361, "epoch": 7980} {"train_loss": -27.92313003540039, "global_step": 662362, "epoch": 7980} {"train_loss": -28.10468864440918, "global_step": 662363, "epoch": 7980} {"train_loss": -27.979705810546875, "global_step": 662364, "epoch": 7980} {"train_loss": -27.819807052612305, "global_step": 662365, "epoch": 7980} {"train_loss": -28.281949996948242, "global_step": 662366, "epoch": 7980} {"train_loss": -28.350854873657227, "global_step": 662367, "epoch": 7980} {"train_loss": -28.4960994720459, "global_step": 662368, "epoch": 7980} {"train_loss": -28.31989097595215, "global_step": 662369, "epoch": 7980} {"train_loss": -28.30293083190918, "global_step": 662370, "epoch": 7980} {"train_loss": -28.5399112701416, "global_step": 662371, "epoch": 7980} {"train_loss": -28.394147872924805, "global_step": 662372, "epoch": 7980} {"train_loss": -28.296117782592773, "global_step": 662373, "epoch": 7980} {"train_loss": -28.548328399658203, "global_step": 662374, "epoch": 7980} {"train_loss": -28.07674217224121, "global_step": 662375, "epoch": 7980} {"train_loss": -28.092609405517578, "global_step": 662376, "epoch": 7980} {"train_loss": -28.155099868774414, "global_step": 662377, "epoch": 7980} {"train_loss": -28.631427764892578, "global_step": 662378, "epoch": 7980} {"train_loss": -28.38392448425293, "global_step": 662379, "epoch": 7980} {"train_loss": -28.00075340270996, "global_step": 662380, "epoch": 7980} {"train_loss": -28.32317543029785, "global_step": 662381, "epoch": 7980} {"train_loss": -28.402862548828125, "global_step": 662382, "epoch": 7980} {"train_loss": -28.363143920898438, "global_step": 662383, "epoch": 7980} {"train_loss": -28.402545928955078, "global_step": 662384, "epoch": 7980} {"train_loss": -28.196252822875977, "global_step": 662385, "epoch": 7980} {"train_loss": -28.285343170166016, "global_step": 662386, "epoch": 7980} {"train_loss": -28.603025436401367, "global_step": 662387, "epoch": 7980} {"train_loss": -28.304168701171875, "global_step": 662388, "epoch": 7980} {"train_loss": -28.619937896728516, "global_step": 662389, "epoch": 7980} {"train_loss": -28.278440475463867, "global_step": 662390, "epoch": 7980} {"train_loss": -28.35540199279785, "global_step": 662391, "epoch": 7980} {"train_loss": -28.526498794555664, "global_step": 662392, "epoch": 7980} {"train_loss": -28.241979598999023, "global_step": 662393, "epoch": 7980} {"train_loss": -28.419225692749023, "global_step": 662394, "epoch": 7980} {"train_loss": -28.13898277282715, "global_step": 662395, "epoch": 7980} {"train_loss": -27.886320114135742, "global_step": 662396, "epoch": 7980} {"train_loss": -27.72629165649414, "global_step": 662397, "epoch": 7980} {"train_loss": -27.900598526000977, "global_step": 662398, "epoch": 7980} {"train_loss": -28.466861724853516, "global_step": 662399, "epoch": 7980} {"train_loss": -28.136077880859375, "global_step": 662400, "epoch": 7980} {"train_loss": -27.5439510345459, "global_step": 662401, "epoch": 7980} {"train_loss": -27.457660675048828, "global_step": 662402, "epoch": 7980} {"train_loss": -28.411306381225586, "global_step": 662403, "epoch": 7980} {"train_loss": -28.0965576171875, "global_step": 662404, "epoch": 7980} {"train_loss": -28.41796875, "global_step": 662405, "epoch": 7980} {"train_loss": -28.042936325073242, "global_step": 662406, "epoch": 7980} {"train_loss": -28.042423248291016, "global_step": 662407, "epoch": 7980} {"train_loss": -27.750823974609375, "global_step": 662408, "epoch": 7980} {"train_loss": -27.57948112487793, "global_step": 662409, "epoch": 7980} {"train_loss": -27.89179801940918, "global_step": 662410, "epoch": 7980} {"train_loss": -28.2814884185791, "global_step": 662411, "epoch": 7980} {"train_loss": -28.31537437438965, "global_step": 662412, "epoch": 7980} {"train_loss": -27.986984252929688, "global_step": 662413, "epoch": 7980} {"train_loss": -28.266021728515625, "global_step": 662414, "epoch": 7980} {"train_loss": -28.11848258972168, "global_step": 662415, "epoch": 7980} {"train_loss": -27.97993278503418, "global_step": 662416, "epoch": 7980} {"train_loss": -27.81910514831543, "global_step": 662417, "epoch": 7980} {"train_loss": -28.462194442749023, "global_step": 662418, "epoch": 7980} {"train_loss": -28.416467666625977, "global_step": 662419, "epoch": 7980} {"train_loss": -27.95660972595215, "global_step": 662420, "epoch": 7980} {"train_loss": -28.268207550048828, "global_step": 662421, "epoch": 7980} {"train_loss": -27.90948759791363, "global_step": 662422, "epoch": 7980, "val_loss": 6727275.0} {"train_loss": -27.878332138061523, "global_step": 662423, "epoch": 7981} {"train_loss": -27.64118766784668, "global_step": 662424, "epoch": 7981} {"train_loss": -27.89251136779785, "global_step": 662425, "epoch": 7981} {"train_loss": -27.869043350219727, "global_step": 662426, "epoch": 7981} {"train_loss": -27.758264541625977, "global_step": 662427, "epoch": 7981} {"train_loss": -28.041269302368164, "global_step": 662428, "epoch": 7981} {"train_loss": -27.840856552124023, "global_step": 662429, "epoch": 7981} {"train_loss": -28.299732208251953, "global_step": 662430, "epoch": 7981} {"train_loss": -27.856184005737305, "global_step": 662431, "epoch": 7981} {"train_loss": -28.14812660217285, "global_step": 662432, "epoch": 7981} {"train_loss": -28.063629150390625, "global_step": 662433, "epoch": 7981} {"train_loss": -28.42962074279785, "global_step": 662434, "epoch": 7981} {"train_loss": -27.876224517822266, "global_step": 662435, "epoch": 7981} {"train_loss": -28.079986572265625, "global_step": 662436, "epoch": 7981} {"train_loss": -27.7734375, "global_step": 662437, "epoch": 7981} {"train_loss": -27.96441650390625, "global_step": 662438, "epoch": 7981} {"train_loss": -28.1640625, "global_step": 662439, "epoch": 7981} {"train_loss": -27.569717407226562, "global_step": 662440, "epoch": 7981} {"train_loss": -28.308984756469727, "global_step": 662441, "epoch": 7981} {"train_loss": -27.974414825439453, "global_step": 662442, "epoch": 7981} {"train_loss": -27.849170684814453, "global_step": 662443, "epoch": 7981} {"train_loss": -28.0412654876709, "global_step": 662444, "epoch": 7981} {"train_loss": -28.377527236938477, "global_step": 662445, "epoch": 7981} {"train_loss": -28.302648544311523, "global_step": 662446, "epoch": 7981} {"train_loss": -28.152576446533203, "global_step": 662447, "epoch": 7981} {"train_loss": -27.978540420532227, "global_step": 662448, "epoch": 7981} {"train_loss": -28.527830123901367, "global_step": 662449, "epoch": 7981} {"train_loss": -28.226282119750977, "global_step": 662450, "epoch": 7981} {"train_loss": -28.277402877807617, "global_step": 662451, "epoch": 7981} {"train_loss": -28.332279205322266, "global_step": 662452, "epoch": 7981} {"train_loss": -28.277917861938477, "global_step": 662453, "epoch": 7981} {"train_loss": -28.62330436706543, "global_step": 662454, "epoch": 7981} {"train_loss": -28.60589027404785, "global_step": 662455, "epoch": 7981} {"train_loss": -28.4352970123291, "global_step": 662456, "epoch": 7981} {"train_loss": -28.279159545898438, "global_step": 662457, "epoch": 7981} {"train_loss": -28.427875518798828, "global_step": 662458, "epoch": 7981} {"train_loss": -28.393579483032227, "global_step": 662459, "epoch": 7981} {"train_loss": -28.425580978393555, "global_step": 662460, "epoch": 7981} {"train_loss": -27.99264907836914, "global_step": 662461, "epoch": 7981} {"train_loss": -28.610422134399414, "global_step": 662462, "epoch": 7981} {"train_loss": -28.51637840270996, "global_step": 662463, "epoch": 7981} {"train_loss": -28.761920928955078, "global_step": 662464, "epoch": 7981} {"train_loss": -28.44514274597168, "global_step": 662465, "epoch": 7981} {"train_loss": -28.578027725219727, "global_step": 662466, "epoch": 7981} {"train_loss": -28.238906860351562, "global_step": 662467, "epoch": 7981} {"train_loss": -28.31818962097168, "global_step": 662468, "epoch": 7981} {"train_loss": -28.186376571655273, "global_step": 662469, "epoch": 7981} {"train_loss": -27.72291374206543, "global_step": 662470, "epoch": 7981} {"train_loss": -27.6378173828125, "global_step": 662471, "epoch": 7981} {"train_loss": -26.6117000579834, "global_step": 662472, "epoch": 7981} {"train_loss": -26.482440948486328, "global_step": 662473, "epoch": 7981} {"train_loss": -27.845746994018555, "global_step": 662474, "epoch": 7981} {"train_loss": -28.323278427124023, "global_step": 662475, "epoch": 7981} {"train_loss": -27.88128089904785, "global_step": 662476, "epoch": 7981} {"train_loss": -28.1566219329834, "global_step": 662477, "epoch": 7981} {"train_loss": -27.684879302978516, "global_step": 662478, "epoch": 7981} {"train_loss": -28.517187118530273, "global_step": 662479, "epoch": 7981} {"train_loss": -28.2386531829834, "global_step": 662480, "epoch": 7981} {"train_loss": -28.15985679626465, "global_step": 662481, "epoch": 7981} {"train_loss": -28.22782325744629, "global_step": 662482, "epoch": 7981} {"train_loss": -28.165790557861328, "global_step": 662483, "epoch": 7981} {"train_loss": -27.784757614135742, "global_step": 662484, "epoch": 7981} {"train_loss": -28.572553634643555, "global_step": 662485, "epoch": 7981} {"train_loss": -28.357187271118164, "global_step": 662486, "epoch": 7981} {"train_loss": -27.986297607421875, "global_step": 662487, "epoch": 7981} {"train_loss": -28.061492919921875, "global_step": 662488, "epoch": 7981} {"train_loss": -28.252851486206055, "global_step": 662489, "epoch": 7981} {"train_loss": -28.30368423461914, "global_step": 662490, "epoch": 7981} {"train_loss": -28.15826988220215, "global_step": 662491, "epoch": 7981} {"train_loss": -27.85907554626465, "global_step": 662492, "epoch": 7981} {"train_loss": -28.44160270690918, "global_step": 662493, "epoch": 7981} {"train_loss": -28.213336944580078, "global_step": 662494, "epoch": 7981} {"train_loss": -28.239667892456055, "global_step": 662495, "epoch": 7981} {"train_loss": -28.22743034362793, "global_step": 662496, "epoch": 7981} {"train_loss": -28.2650203704834, "global_step": 662497, "epoch": 7981} {"train_loss": -28.728708267211914, "global_step": 662498, "epoch": 7981} {"train_loss": -28.23065757751465, "global_step": 662499, "epoch": 7981} {"train_loss": -28.294361114501953, "global_step": 662500, "epoch": 7981} {"train_loss": -28.29010581970215, "global_step": 662501, "epoch": 7981} {"train_loss": -28.25300407409668, "global_step": 662502, "epoch": 7981} {"train_loss": -28.463369369506836, "global_step": 662503, "epoch": 7981} {"train_loss": -28.494993209838867, "global_step": 662504, "epoch": 7981} {"train_loss": -28.129374676440136, "global_step": 662505, "epoch": 7981, "val_loss": 6678115.0} {"train_loss": -26.225820541381836, "global_step": 662506, "epoch": 7982} {"train_loss": -25.563817977905273, "global_step": 662507, "epoch": 7982} {"train_loss": -27.430578231811523, "global_step": 662508, "epoch": 7982} {"train_loss": -26.97254753112793, "global_step": 662509, "epoch": 7982} {"train_loss": -26.8935489654541, "global_step": 662510, "epoch": 7982} {"train_loss": -27.528278350830078, "global_step": 662511, "epoch": 7982} {"train_loss": -27.00946617126465, "global_step": 662512, "epoch": 7982} {"train_loss": -27.570850372314453, "global_step": 662513, "epoch": 7982} {"train_loss": -26.800302505493164, "global_step": 662514, "epoch": 7982} {"train_loss": -27.535858154296875, "global_step": 662515, "epoch": 7982} {"train_loss": -27.415632247924805, "global_step": 662516, "epoch": 7982} {"train_loss": -27.61031150817871, "global_step": 662517, "epoch": 7982} {"train_loss": -27.21527671813965, "global_step": 662518, "epoch": 7982} {"train_loss": -27.444326400756836, "global_step": 662519, "epoch": 7982} {"train_loss": -27.642444610595703, "global_step": 662520, "epoch": 7982} {"train_loss": -27.695322036743164, "global_step": 662521, "epoch": 7982} {"train_loss": -27.64984703063965, "global_step": 662522, "epoch": 7982} {"train_loss": -27.759260177612305, "global_step": 662523, "epoch": 7982} {"train_loss": -27.961740493774414, "global_step": 662524, "epoch": 7982} {"train_loss": -28.0247745513916, "global_step": 662525, "epoch": 7982} {"train_loss": -28.185749053955078, "global_step": 662526, "epoch": 7982} {"train_loss": -28.460351943969727, "global_step": 662527, "epoch": 7982} {"train_loss": -28.1748104095459, "global_step": 662528, "epoch": 7982} {"train_loss": -28.37176513671875, "global_step": 662529, "epoch": 7982} {"train_loss": -28.089691162109375, "global_step": 662530, "epoch": 7982} {"train_loss": -28.3421688079834, "global_step": 662531, "epoch": 7982} {"train_loss": -28.184722900390625, "global_step": 662532, "epoch": 7982} {"train_loss": -28.043121337890625, "global_step": 662533, "epoch": 7982} {"train_loss": -28.081268310546875, "global_step": 662534, "epoch": 7982} {"train_loss": -28.029245376586914, "global_step": 662535, "epoch": 7982} {"train_loss": -28.486377716064453, "global_step": 662536, "epoch": 7982} {"train_loss": -28.0931396484375, "global_step": 662537, "epoch": 7982} {"train_loss": -27.8337459564209, "global_step": 662538, "epoch": 7982} {"train_loss": -28.59174156188965, "global_step": 662539, "epoch": 7982} {"train_loss": -28.39396095275879, "global_step": 662540, "epoch": 7982} {"train_loss": -28.290021896362305, "global_step": 662541, "epoch": 7982} {"train_loss": -28.409774780273438, "global_step": 662542, "epoch": 7982} {"train_loss": -28.344635009765625, "global_step": 662543, "epoch": 7982} {"train_loss": -28.49772071838379, "global_step": 662544, "epoch": 7982} {"train_loss": -28.550683975219727, "global_step": 662545, "epoch": 7982} {"train_loss": -28.337600708007812, "global_step": 662546, "epoch": 7982} {"train_loss": -28.424365997314453, "global_step": 662547, "epoch": 7982} {"train_loss": -28.216556549072266, "global_step": 662548, "epoch": 7982} {"train_loss": -28.460113525390625, "global_step": 662549, "epoch": 7982} {"train_loss": -28.363006591796875, "global_step": 662550, "epoch": 7982} {"train_loss": -28.234846115112305, "global_step": 662551, "epoch": 7982} {"train_loss": -28.62989616394043, "global_step": 662552, "epoch": 7982} {"train_loss": -28.53961753845215, "global_step": 662553, "epoch": 7982} {"train_loss": -29.137714385986328, "global_step": 662554, "epoch": 7982} {"train_loss": -28.496957778930664, "global_step": 662555, "epoch": 7982} {"train_loss": -28.730939865112305, "global_step": 662556, "epoch": 7982} {"train_loss": -28.492002487182617, "global_step": 662557, "epoch": 7982} {"train_loss": -28.735443115234375, "global_step": 662558, "epoch": 7982} {"train_loss": -28.82659912109375, "global_step": 662559, "epoch": 7982} {"train_loss": -29.023513793945312, "global_step": 662560, "epoch": 7982} {"train_loss": -28.671131134033203, "global_step": 662561, "epoch": 7982} {"train_loss": -28.592315673828125, "global_step": 662562, "epoch": 7982} {"train_loss": -28.66141700744629, "global_step": 662563, "epoch": 7982} {"train_loss": -28.523319244384766, "global_step": 662564, "epoch": 7982} {"train_loss": -28.480844497680664, "global_step": 662565, "epoch": 7982} {"train_loss": -28.453678131103516, "global_step": 662566, "epoch": 7982} {"train_loss": -28.5235595703125, "global_step": 662567, "epoch": 7982} {"train_loss": -28.58294677734375, "global_step": 662568, "epoch": 7982} {"train_loss": -28.70295524597168, "global_step": 662569, "epoch": 7982} {"train_loss": -28.529142379760742, "global_step": 662570, "epoch": 7982} {"train_loss": -28.189950942993164, "global_step": 662571, "epoch": 7982} {"train_loss": -28.368778228759766, "global_step": 662572, "epoch": 7982} {"train_loss": -28.549467086791992, "global_step": 662573, "epoch": 7982} {"train_loss": -28.22406578063965, "global_step": 662574, "epoch": 7982} {"train_loss": -27.85455894470215, "global_step": 662575, "epoch": 7982} {"train_loss": -28.52205467224121, "global_step": 662576, "epoch": 7982} {"train_loss": -28.5478572845459, "global_step": 662577, "epoch": 7982} {"train_loss": -28.47908592224121, "global_step": 662578, "epoch": 7982} {"train_loss": -28.279203414916992, "global_step": 662579, "epoch": 7982} {"train_loss": -28.132740020751953, "global_step": 662580, "epoch": 7982} {"train_loss": -28.641132354736328, "global_step": 662581, "epoch": 7982} {"train_loss": -28.423254013061523, "global_step": 662582, "epoch": 7982} {"train_loss": -28.3801326751709, "global_step": 662583, "epoch": 7982} {"train_loss": -28.47568702697754, "global_step": 662584, "epoch": 7982} {"train_loss": -27.6949462890625, "global_step": 662585, "epoch": 7982} {"train_loss": -28.442596435546875, "global_step": 662586, "epoch": 7982} {"train_loss": -27.527801513671875, "global_step": 662587, "epoch": 7982} {"train_loss": -28.127145606351185, "global_step": 662588, "epoch": 7982, "val_loss": 6681980.0} {"train_loss": -26.37554359436035, "global_step": 662589, "epoch": 7983} {"train_loss": -27.532743453979492, "global_step": 662590, "epoch": 7983} {"train_loss": -26.20989990234375, "global_step": 662591, "epoch": 7983} {"train_loss": -26.453933715820312, "global_step": 662592, "epoch": 7983} {"train_loss": -26.21587562561035, "global_step": 662593, "epoch": 7983} {"train_loss": -27.17145347595215, "global_step": 662594, "epoch": 7983} {"train_loss": -27.39358901977539, "global_step": 662595, "epoch": 7983} {"train_loss": -27.042505264282227, "global_step": 662596, "epoch": 7983} {"train_loss": -27.80524253845215, "global_step": 662597, "epoch": 7983} {"train_loss": -27.14081382751465, "global_step": 662598, "epoch": 7983} {"train_loss": -27.386655807495117, "global_step": 662599, "epoch": 7983} {"train_loss": -27.819284439086914, "global_step": 662600, "epoch": 7983} {"train_loss": -27.84515953063965, "global_step": 662601, "epoch": 7983} {"train_loss": -27.681127548217773, "global_step": 662602, "epoch": 7983} {"train_loss": -28.0022029876709, "global_step": 662603, "epoch": 7983} {"train_loss": -27.691816329956055, "global_step": 662604, "epoch": 7983} {"train_loss": -27.96609878540039, "global_step": 662605, "epoch": 7983} {"train_loss": -27.830652236938477, "global_step": 662606, "epoch": 7983} {"train_loss": -27.87164306640625, "global_step": 662607, "epoch": 7983} {"train_loss": -27.604597091674805, "global_step": 662608, "epoch": 7983} {"train_loss": -28.066089630126953, "global_step": 662609, "epoch": 7983} {"train_loss": -28.00368309020996, "global_step": 662610, "epoch": 7983} {"train_loss": -28.385671615600586, "global_step": 662611, "epoch": 7983} {"train_loss": -28.142011642456055, "global_step": 662612, "epoch": 7983} {"train_loss": -27.991933822631836, "global_step": 662613, "epoch": 7983} {"train_loss": -28.074609756469727, "global_step": 662614, "epoch": 7983} {"train_loss": -27.9620361328125, "global_step": 662615, "epoch": 7983} {"train_loss": -28.21124839782715, "global_step": 662616, "epoch": 7983} {"train_loss": -28.198205947875977, "global_step": 662617, "epoch": 7983} {"train_loss": -27.93634033203125, "global_step": 662618, "epoch": 7983} {"train_loss": -28.31317710876465, "global_step": 662619, "epoch": 7983} {"train_loss": -27.984439849853516, "global_step": 662620, "epoch": 7983} {"train_loss": -28.346435546875, "global_step": 662621, "epoch": 7983} {"train_loss": -28.018070220947266, "global_step": 662622, "epoch": 7983} {"train_loss": -28.4453067779541, "global_step": 662623, "epoch": 7983} {"train_loss": -28.264135360717773, "global_step": 662624, "epoch": 7983} {"train_loss": -28.61368751525879, "global_step": 662625, "epoch": 7983} {"train_loss": -28.228076934814453, "global_step": 662626, "epoch": 7983} {"train_loss": -28.569807052612305, "global_step": 662627, "epoch": 7983} {"train_loss": -28.374326705932617, "global_step": 662628, "epoch": 7983} {"train_loss": -28.44772720336914, "global_step": 662629, "epoch": 7983} {"train_loss": -28.617202758789062, "global_step": 662630, "epoch": 7983} {"train_loss": -28.429718017578125, "global_step": 662631, "epoch": 7983} {"train_loss": -28.256305694580078, "global_step": 662632, "epoch": 7983} {"train_loss": -28.37432861328125, "global_step": 662633, "epoch": 7983} {"train_loss": -28.3356990814209, "global_step": 662634, "epoch": 7983} {"train_loss": -28.79425048828125, "global_step": 662635, "epoch": 7983} {"train_loss": -28.17786979675293, "global_step": 662636, "epoch": 7983} {"train_loss": -28.48824119567871, "global_step": 662637, "epoch": 7983} {"train_loss": -28.636859893798828, "global_step": 662638, "epoch": 7983} {"train_loss": -28.4489688873291, "global_step": 662639, "epoch": 7983} {"train_loss": -28.58628273010254, "global_step": 662640, "epoch": 7983} {"train_loss": -29.020660400390625, "global_step": 662641, "epoch": 7983} {"train_loss": -28.789905548095703, "global_step": 662642, "epoch": 7983} {"train_loss": -28.61318016052246, "global_step": 662643, "epoch": 7983} {"train_loss": -28.938337326049805, "global_step": 662644, "epoch": 7983} {"train_loss": -28.367292404174805, "global_step": 662645, "epoch": 7983} {"train_loss": -28.7578067779541, "global_step": 662646, "epoch": 7983} {"train_loss": -28.366077423095703, "global_step": 662647, "epoch": 7983} {"train_loss": -28.665241241455078, "global_step": 662648, "epoch": 7983} {"train_loss": -28.419958114624023, "global_step": 662649, "epoch": 7983} {"train_loss": -28.702768325805664, "global_step": 662650, "epoch": 7983} {"train_loss": -28.587858200073242, "global_step": 662651, "epoch": 7983} {"train_loss": -28.761016845703125, "global_step": 662652, "epoch": 7983} {"train_loss": -28.663898468017578, "global_step": 662653, "epoch": 7983} {"train_loss": -28.608997344970703, "global_step": 662654, "epoch": 7983} {"train_loss": -28.14265251159668, "global_step": 662655, "epoch": 7983} {"train_loss": -28.15004539489746, "global_step": 662656, "epoch": 7983} {"train_loss": -28.61309814453125, "global_step": 662657, "epoch": 7983} {"train_loss": -28.286808013916016, "global_step": 662658, "epoch": 7983} {"train_loss": -28.848987579345703, "global_step": 662659, "epoch": 7983} {"train_loss": -28.4714298248291, "global_step": 662660, "epoch": 7983} {"train_loss": -28.45086669921875, "global_step": 662661, "epoch": 7983} {"train_loss": -28.568347930908203, "global_step": 662662, "epoch": 7983} {"train_loss": -28.743833541870117, "global_step": 662663, "epoch": 7983} {"train_loss": -28.798254013061523, "global_step": 662664, "epoch": 7983} {"train_loss": -28.698965072631836, "global_step": 662665, "epoch": 7983} {"train_loss": -28.26155662536621, "global_step": 662666, "epoch": 7983} {"train_loss": -28.699661254882812, "global_step": 662667, "epoch": 7983} {"train_loss": -28.1837100982666, "global_step": 662668, "epoch": 7983} {"train_loss": -28.635446548461914, "global_step": 662669, "epoch": 7983} {"train_loss": -28.217884063720703, "global_step": 662670, "epoch": 7983} {"train_loss": -28.166304025305323, "global_step": 662671, "epoch": 7983, "val_loss": 6598278.0} {"train_loss": -27.76397132873535, "global_step": 662672, "epoch": 7984} {"train_loss": -26.441923141479492, "global_step": 662673, "epoch": 7984} {"train_loss": -25.682697296142578, "global_step": 662674, "epoch": 7984} {"train_loss": -25.19269371032715, "global_step": 662675, "epoch": 7984} {"train_loss": -25.336740493774414, "global_step": 662676, "epoch": 7984} {"train_loss": -26.853504180908203, "global_step": 662677, "epoch": 7984} {"train_loss": -26.152542114257812, "global_step": 662678, "epoch": 7984} {"train_loss": -27.00762367248535, "global_step": 662679, "epoch": 7984} {"train_loss": -26.312612533569336, "global_step": 662680, "epoch": 7984} {"train_loss": -26.45399284362793, "global_step": 662681, "epoch": 7984} {"train_loss": -27.343830108642578, "global_step": 662682, "epoch": 7984} {"train_loss": -27.210968017578125, "global_step": 662683, "epoch": 7984} {"train_loss": -27.290205001831055, "global_step": 662684, "epoch": 7984} {"train_loss": -27.458288192749023, "global_step": 662685, "epoch": 7984} {"train_loss": -27.730030059814453, "global_step": 662686, "epoch": 7984} {"train_loss": -27.558053970336914, "global_step": 662687, "epoch": 7984} {"train_loss": -27.816686630249023, "global_step": 662688, "epoch": 7984} {"train_loss": -27.3740177154541, "global_step": 662689, "epoch": 7984} {"train_loss": -27.332157135009766, "global_step": 662690, "epoch": 7984} {"train_loss": -27.895246505737305, "global_step": 662691, "epoch": 7984} {"train_loss": -27.524932861328125, "global_step": 662692, "epoch": 7984} {"train_loss": -28.0600643157959, "global_step": 662693, "epoch": 7984} {"train_loss": -27.904661178588867, "global_step": 662694, "epoch": 7984} {"train_loss": -27.986047744750977, "global_step": 662695, "epoch": 7984} {"train_loss": -27.874347686767578, "global_step": 662696, "epoch": 7984} {"train_loss": -27.771743774414062, "global_step": 662697, "epoch": 7984} {"train_loss": -27.914331436157227, "global_step": 662698, "epoch": 7984} {"train_loss": -27.9950008392334, "global_step": 662699, "epoch": 7984} {"train_loss": -28.179059982299805, "global_step": 662700, "epoch": 7984} {"train_loss": -27.989139556884766, "global_step": 662701, "epoch": 7984} {"train_loss": -27.853803634643555, "global_step": 662702, "epoch": 7984} {"train_loss": -27.90596580505371, "global_step": 662703, "epoch": 7984} {"train_loss": -27.750516891479492, "global_step": 662704, "epoch": 7984} {"train_loss": -28.014745712280273, "global_step": 662705, "epoch": 7984} {"train_loss": -27.944196701049805, "global_step": 662706, "epoch": 7984} {"train_loss": -28.487424850463867, "global_step": 662707, "epoch": 7984} {"train_loss": -28.303943634033203, "global_step": 662708, "epoch": 7984} {"train_loss": -28.280750274658203, "global_step": 662709, "epoch": 7984} {"train_loss": -28.263015747070312, "global_step": 662710, "epoch": 7984} {"train_loss": -28.500930786132812, "global_step": 662711, "epoch": 7984} {"train_loss": -28.2746524810791, "global_step": 662712, "epoch": 7984} {"train_loss": -28.100446701049805, "global_step": 662713, "epoch": 7984} {"train_loss": -28.274198532104492, "global_step": 662714, "epoch": 7984} {"train_loss": -28.521284103393555, "global_step": 662715, "epoch": 7984} {"train_loss": -28.331018447875977, "global_step": 662716, "epoch": 7984} {"train_loss": -28.69611167907715, "global_step": 662717, "epoch": 7984} {"train_loss": -28.262434005737305, "global_step": 662718, "epoch": 7984} {"train_loss": -28.820295333862305, "global_step": 662719, "epoch": 7984} {"train_loss": -28.1278076171875, "global_step": 662720, "epoch": 7984} {"train_loss": -28.602624893188477, "global_step": 662721, "epoch": 7984} {"train_loss": -28.441083908081055, "global_step": 662722, "epoch": 7984} {"train_loss": -28.645132064819336, "global_step": 662723, "epoch": 7984} {"train_loss": -28.657041549682617, "global_step": 662724, "epoch": 7984} {"train_loss": -28.81496238708496, "global_step": 662725, "epoch": 7984} {"train_loss": -28.635574340820312, "global_step": 662726, "epoch": 7984} {"train_loss": -28.758773803710938, "global_step": 662727, "epoch": 7984} {"train_loss": -28.839252471923828, "global_step": 662728, "epoch": 7984} {"train_loss": -28.388446807861328, "global_step": 662729, "epoch": 7984} {"train_loss": -28.316328048706055, "global_step": 662730, "epoch": 7984} {"train_loss": -28.59700584411621, "global_step": 662731, "epoch": 7984} {"train_loss": -28.582212448120117, "global_step": 662732, "epoch": 7984} {"train_loss": -28.37432289123535, "global_step": 662733, "epoch": 7984} {"train_loss": -28.43838882446289, "global_step": 662734, "epoch": 7984} {"train_loss": -28.258081436157227, "global_step": 662735, "epoch": 7984} {"train_loss": -28.708389282226562, "global_step": 662736, "epoch": 7984} {"train_loss": -28.66278648376465, "global_step": 662737, "epoch": 7984} {"train_loss": -28.502227783203125, "global_step": 662738, "epoch": 7984} {"train_loss": -28.574207305908203, "global_step": 662739, "epoch": 7984} {"train_loss": -28.07476234436035, "global_step": 662740, "epoch": 7984} {"train_loss": -28.589862823486328, "global_step": 662741, "epoch": 7984} {"train_loss": -28.346952438354492, "global_step": 662742, "epoch": 7984} {"train_loss": -28.214557647705078, "global_step": 662743, "epoch": 7984} {"train_loss": -28.429401397705078, "global_step": 662744, "epoch": 7984} {"train_loss": -28.281110763549805, "global_step": 662745, "epoch": 7984} {"train_loss": -28.46771240234375, "global_step": 662746, "epoch": 7984} {"train_loss": -28.230764389038086, "global_step": 662747, "epoch": 7984} {"train_loss": -28.536890029907227, "global_step": 662748, "epoch": 7984} {"train_loss": -28.21500015258789, "global_step": 662749, "epoch": 7984} {"train_loss": -28.167341232299805, "global_step": 662750, "epoch": 7984} {"train_loss": -28.1262149810791, "global_step": 662751, "epoch": 7984} {"train_loss": -28.064411163330078, "global_step": 662752, "epoch": 7984} {"train_loss": -28.510894775390625, "global_step": 662753, "epoch": 7984} {"train_loss": -27.964859261570208, "global_step": 662754, "epoch": 7984, "val_loss": 6745118.0} {"train_loss": -27.66214370727539, "global_step": 662755, "epoch": 7985} {"train_loss": -26.92753028869629, "global_step": 662756, "epoch": 7985} {"train_loss": -26.881912231445312, "global_step": 662757, "epoch": 7985} {"train_loss": -27.143579483032227, "global_step": 662758, "epoch": 7985} {"train_loss": -27.057220458984375, "global_step": 662759, "epoch": 7985} {"train_loss": -27.757434844970703, "global_step": 662760, "epoch": 7985} {"train_loss": -28.207101821899414, "global_step": 662761, "epoch": 7985} {"train_loss": -27.59211540222168, "global_step": 662762, "epoch": 7985} {"train_loss": -28.02765464782715, "global_step": 662763, "epoch": 7985} {"train_loss": -28.149152755737305, "global_step": 662764, "epoch": 7985} {"train_loss": -28.021162033081055, "global_step": 662765, "epoch": 7985} {"train_loss": -27.910825729370117, "global_step": 662766, "epoch": 7985} {"train_loss": -28.16552734375, "global_step": 662767, "epoch": 7985} {"train_loss": -27.981189727783203, "global_step": 662768, "epoch": 7985} {"train_loss": -28.063928604125977, "global_step": 662769, "epoch": 7985} {"train_loss": -28.554996490478516, "global_step": 662770, "epoch": 7985} {"train_loss": -28.193979263305664, "global_step": 662771, "epoch": 7985} {"train_loss": -28.714202880859375, "global_step": 662772, "epoch": 7985} {"train_loss": -28.178653717041016, "global_step": 662773, "epoch": 7985} {"train_loss": -28.3133487701416, "global_step": 662774, "epoch": 7985} {"train_loss": -28.387741088867188, "global_step": 662775, "epoch": 7985} {"train_loss": -28.211002349853516, "global_step": 662776, "epoch": 7985} {"train_loss": -28.49749755859375, "global_step": 662777, "epoch": 7985} {"train_loss": -28.24200439453125, "global_step": 662778, "epoch": 7985} {"train_loss": -28.213842391967773, "global_step": 662779, "epoch": 7985} {"train_loss": -28.432092666625977, "global_step": 662780, "epoch": 7985} {"train_loss": -28.21067237854004, "global_step": 662781, "epoch": 7985} {"train_loss": -28.499704360961914, "global_step": 662782, "epoch": 7985} {"train_loss": -28.51218605041504, "global_step": 662783, "epoch": 7985} {"train_loss": -28.50394630432129, "global_step": 662784, "epoch": 7985} {"train_loss": -28.585500717163086, "global_step": 662785, "epoch": 7985} {"train_loss": -28.43421745300293, "global_step": 662786, "epoch": 7985} {"train_loss": -28.198163986206055, "global_step": 662787, "epoch": 7985} {"train_loss": -28.280807495117188, "global_step": 662788, "epoch": 7985} {"train_loss": -28.654699325561523, "global_step": 662789, "epoch": 7985} {"train_loss": -28.27292823791504, "global_step": 662790, "epoch": 7985} {"train_loss": -28.529428482055664, "global_step": 662791, "epoch": 7985} {"train_loss": -28.578689575195312, "global_step": 662792, "epoch": 7985} {"train_loss": -28.576873779296875, "global_step": 662793, "epoch": 7985} {"train_loss": -28.78569984436035, "global_step": 662794, "epoch": 7985} {"train_loss": -28.471250534057617, "global_step": 662795, "epoch": 7985} {"train_loss": -28.563739776611328, "global_step": 662796, "epoch": 7985} {"train_loss": -28.336414337158203, "global_step": 662797, "epoch": 7985} {"train_loss": -28.840234756469727, "global_step": 662798, "epoch": 7985} {"train_loss": -28.693252563476562, "global_step": 662799, "epoch": 7985} {"train_loss": -28.669416427612305, "global_step": 662800, "epoch": 7985} {"train_loss": -28.52155113220215, "global_step": 662801, "epoch": 7985} {"train_loss": -28.59339714050293, "global_step": 662802, "epoch": 7985} {"train_loss": -28.531408309936523, "global_step": 662803, "epoch": 7985} {"train_loss": -28.827594757080078, "global_step": 662804, "epoch": 7985} {"train_loss": -28.32489013671875, "global_step": 662805, "epoch": 7985} {"train_loss": -28.844085693359375, "global_step": 662806, "epoch": 7985} {"train_loss": -28.5699405670166, "global_step": 662807, "epoch": 7985} {"train_loss": -28.499353408813477, "global_step": 662808, "epoch": 7985} {"train_loss": -28.61395263671875, "global_step": 662809, "epoch": 7985} {"train_loss": -28.522567749023438, "global_step": 662810, "epoch": 7985} {"train_loss": -28.920257568359375, "global_step": 662811, "epoch": 7985} {"train_loss": -28.637067794799805, "global_step": 662812, "epoch": 7985} {"train_loss": -28.500568389892578, "global_step": 662813, "epoch": 7985} {"train_loss": -28.6881046295166, "global_step": 662814, "epoch": 7985} {"train_loss": -28.7158203125, "global_step": 662815, "epoch": 7985} {"train_loss": -28.419921875, "global_step": 662816, "epoch": 7985} {"train_loss": -28.796234130859375, "global_step": 662817, "epoch": 7985} {"train_loss": -28.52797508239746, "global_step": 662818, "epoch": 7985} {"train_loss": -28.467670440673828, "global_step": 662819, "epoch": 7985} {"train_loss": -28.467853546142578, "global_step": 662820, "epoch": 7985} {"train_loss": -28.49458885192871, "global_step": 662821, "epoch": 7985} {"train_loss": -28.911630630493164, "global_step": 662822, "epoch": 7985} {"train_loss": -28.436628341674805, "global_step": 662823, "epoch": 7985} {"train_loss": -28.579736709594727, "global_step": 662824, "epoch": 7985} {"train_loss": -28.71843910217285, "global_step": 662825, "epoch": 7985} {"train_loss": -28.23737907409668, "global_step": 662826, "epoch": 7985} {"train_loss": -28.264820098876953, "global_step": 662827, "epoch": 7985} {"train_loss": -28.31619644165039, "global_step": 662828, "epoch": 7985} {"train_loss": -28.112781524658203, "global_step": 662829, "epoch": 7985} {"train_loss": -28.027454376220703, "global_step": 662830, "epoch": 7985} {"train_loss": -27.41205406188965, "global_step": 662831, "epoch": 7985} {"train_loss": -27.26276206970215, "global_step": 662832, "epoch": 7985} {"train_loss": -27.79495620727539, "global_step": 662833, "epoch": 7985} {"train_loss": -28.385950088500977, "global_step": 662834, "epoch": 7985} {"train_loss": -28.042646408081055, "global_step": 662835, "epoch": 7985} {"train_loss": -28.121484756469727, "global_step": 662836, "epoch": 7985} {"train_loss": -28.304077470158955, "global_step": 662837, "epoch": 7985, "val_loss": 6667876.5} {"train_loss": -27.148950576782227, "global_step": 662838, "epoch": 7986} {"train_loss": -27.711715698242188, "global_step": 662839, "epoch": 7986} {"train_loss": -26.532339096069336, "global_step": 662840, "epoch": 7986} {"train_loss": -26.703039169311523, "global_step": 662841, "epoch": 7986} {"train_loss": -27.200788497924805, "global_step": 662842, "epoch": 7986} {"train_loss": -27.67608642578125, "global_step": 662843, "epoch": 7986} {"train_loss": -27.254138946533203, "global_step": 662844, "epoch": 7986} {"train_loss": -27.6283016204834, "global_step": 662845, "epoch": 7986} {"train_loss": -27.39493179321289, "global_step": 662846, "epoch": 7986} {"train_loss": -27.356266021728516, "global_step": 662847, "epoch": 7986} {"train_loss": -27.65296745300293, "global_step": 662848, "epoch": 7986} {"train_loss": -27.28047752380371, "global_step": 662849, "epoch": 7986} {"train_loss": -27.831710815429688, "global_step": 662850, "epoch": 7986} {"train_loss": -27.527318954467773, "global_step": 662851, "epoch": 7986} {"train_loss": -28.166601181030273, "global_step": 662852, "epoch": 7986} {"train_loss": -27.53924560546875, "global_step": 662853, "epoch": 7986} {"train_loss": -27.9969482421875, "global_step": 662854, "epoch": 7986} {"train_loss": -27.860553741455078, "global_step": 662855, "epoch": 7986} {"train_loss": -27.943805694580078, "global_step": 662856, "epoch": 7986} {"train_loss": -27.834497451782227, "global_step": 662857, "epoch": 7986} {"train_loss": -27.817197799682617, "global_step": 662858, "epoch": 7986} {"train_loss": -27.676288604736328, "global_step": 662859, "epoch": 7986} {"train_loss": -28.066389083862305, "global_step": 662860, "epoch": 7986} {"train_loss": -28.139013290405273, "global_step": 662861, "epoch": 7986} {"train_loss": -28.22242546081543, "global_step": 662862, "epoch": 7986} {"train_loss": -28.193801879882812, "global_step": 662863, "epoch": 7986} {"train_loss": -28.25, "global_step": 662864, "epoch": 7986} {"train_loss": -28.21182632446289, "global_step": 662865, "epoch": 7986} {"train_loss": -28.181522369384766, "global_step": 662866, "epoch": 7986} {"train_loss": -28.47452735900879, "global_step": 662867, "epoch": 7986} {"train_loss": -28.04542350769043, "global_step": 662868, "epoch": 7986} {"train_loss": -27.996877670288086, "global_step": 662869, "epoch": 7986} {"train_loss": -28.31987953186035, "global_step": 662870, "epoch": 7986} {"train_loss": -28.229766845703125, "global_step": 662871, "epoch": 7986} {"train_loss": -28.56683921813965, "global_step": 662872, "epoch": 7986} {"train_loss": -28.479721069335938, "global_step": 662873, "epoch": 7986} {"train_loss": -28.19868278503418, "global_step": 662874, "epoch": 7986} {"train_loss": -28.380451202392578, "global_step": 662875, "epoch": 7986} {"train_loss": -28.192935943603516, "global_step": 662876, "epoch": 7986} {"train_loss": -28.567981719970703, "global_step": 662877, "epoch": 7986} {"train_loss": -28.424772262573242, "global_step": 662878, "epoch": 7986} {"train_loss": -28.67156410217285, "global_step": 662879, "epoch": 7986} {"train_loss": -28.5861759185791, "global_step": 662880, "epoch": 7986} {"train_loss": -28.797046661376953, "global_step": 662881, "epoch": 7986} {"train_loss": -28.706384658813477, "global_step": 662882, "epoch": 7986} {"train_loss": -28.539358139038086, "global_step": 662883, "epoch": 7986} {"train_loss": -28.450397491455078, "global_step": 662884, "epoch": 7986} {"train_loss": -28.463104248046875, "global_step": 662885, "epoch": 7986} {"train_loss": -28.597314834594727, "global_step": 662886, "epoch": 7986} {"train_loss": -28.683074951171875, "global_step": 662887, "epoch": 7986} {"train_loss": -28.817853927612305, "global_step": 662888, "epoch": 7986} {"train_loss": -28.74664878845215, "global_step": 662889, "epoch": 7986} {"train_loss": -28.557510375976562, "global_step": 662890, "epoch": 7986} {"train_loss": -28.7753849029541, "global_step": 662891, "epoch": 7986} {"train_loss": -28.55890464782715, "global_step": 662892, "epoch": 7986} {"train_loss": -28.431867599487305, "global_step": 662893, "epoch": 7986} {"train_loss": -28.425750732421875, "global_step": 662894, "epoch": 7986} {"train_loss": -28.656513214111328, "global_step": 662895, "epoch": 7986} {"train_loss": -28.44581413269043, "global_step": 662896, "epoch": 7986} {"train_loss": -28.87696647644043, "global_step": 662897, "epoch": 7986} {"train_loss": -28.73724937438965, "global_step": 662898, "epoch": 7986} {"train_loss": -28.196069717407227, "global_step": 662899, "epoch": 7986} {"train_loss": -28.321491241455078, "global_step": 662900, "epoch": 7986} {"train_loss": -27.413471221923828, "global_step": 662901, "epoch": 7986} {"train_loss": -25.643661499023438, "global_step": 662902, "epoch": 7986} {"train_loss": -23.327489852905273, "global_step": 662903, "epoch": 7986} {"train_loss": -22.946640014648438, "global_step": 662904, "epoch": 7986} {"train_loss": -27.54230308532715, "global_step": 662905, "epoch": 7986} {"train_loss": -25.312658309936523, "global_step": 662906, "epoch": 7986} {"train_loss": -27.791051864624023, "global_step": 662907, "epoch": 7986} {"train_loss": -26.740238189697266, "global_step": 662908, "epoch": 7986} {"train_loss": -26.8055477142334, "global_step": 662909, "epoch": 7986} {"train_loss": -27.80067253112793, "global_step": 662910, "epoch": 7986} {"train_loss": -26.732898712158203, "global_step": 662911, "epoch": 7986} {"train_loss": -26.91559410095215, "global_step": 662912, "epoch": 7986} {"train_loss": -27.726276397705078, "global_step": 662913, "epoch": 7986} {"train_loss": -27.248493194580078, "global_step": 662914, "epoch": 7986} {"train_loss": -27.577390670776367, "global_step": 662915, "epoch": 7986} {"train_loss": -28.019927978515625, "global_step": 662916, "epoch": 7986} {"train_loss": -27.981220245361328, "global_step": 662917, "epoch": 7986} {"train_loss": -27.666244506835938, "global_step": 662918, "epoch": 7986} {"train_loss": -27.709259033203125, "global_step": 662919, "epoch": 7986} {"train_loss": -27.835957630571112, "global_step": 662920, "epoch": 7986, "val_loss": 6738110.5} {"train_loss": -27.4738712310791, "global_step": 662921, "epoch": 7987} {"train_loss": -27.694900512695312, "global_step": 662922, "epoch": 7987} {"train_loss": -27.400815963745117, "global_step": 662923, "epoch": 7987} {"train_loss": -27.612577438354492, "global_step": 662924, "epoch": 7987} {"train_loss": -27.190290451049805, "global_step": 662925, "epoch": 7987} {"train_loss": -27.72956657409668, "global_step": 662926, "epoch": 7987} {"train_loss": -27.4088134765625, "global_step": 662927, "epoch": 7987} {"train_loss": -28.155792236328125, "global_step": 662928, "epoch": 7987} {"train_loss": -27.81431007385254, "global_step": 662929, "epoch": 7987} {"train_loss": -27.525745391845703, "global_step": 662930, "epoch": 7987} {"train_loss": -27.69559669494629, "global_step": 662931, "epoch": 7987} {"train_loss": -27.324020385742188, "global_step": 662932, "epoch": 7987} {"train_loss": -27.8880672454834, "global_step": 662933, "epoch": 7987} {"train_loss": -27.89320182800293, "global_step": 662934, "epoch": 7987} {"train_loss": -28.043399810791016, "global_step": 662935, "epoch": 7987} {"train_loss": -28.04841423034668, "global_step": 662936, "epoch": 7987} {"train_loss": -28.172687530517578, "global_step": 662937, "epoch": 7987} {"train_loss": -27.87531852722168, "global_step": 662938, "epoch": 7987} {"train_loss": -27.676227569580078, "global_step": 662939, "epoch": 7987} {"train_loss": -27.811161041259766, "global_step": 662940, "epoch": 7987} {"train_loss": -28.295141220092773, "global_step": 662941, "epoch": 7987} {"train_loss": -28.295413970947266, "global_step": 662942, "epoch": 7987} {"train_loss": -27.619001388549805, "global_step": 662943, "epoch": 7987} {"train_loss": -27.998096466064453, "global_step": 662944, "epoch": 7987} {"train_loss": -27.9534969329834, "global_step": 662945, "epoch": 7987} {"train_loss": -27.702672958374023, "global_step": 662946, "epoch": 7987} {"train_loss": -28.434097290039062, "global_step": 662947, "epoch": 7987} {"train_loss": -28.190876007080078, "global_step": 662948, "epoch": 7987} {"train_loss": -28.1697940826416, "global_step": 662949, "epoch": 7987} {"train_loss": -27.8577880859375, "global_step": 662950, "epoch": 7987} {"train_loss": -28.030431747436523, "global_step": 662951, "epoch": 7987} {"train_loss": -28.143890380859375, "global_step": 662952, "epoch": 7987} {"train_loss": -28.553421020507812, "global_step": 662953, "epoch": 7987} {"train_loss": -28.328948974609375, "global_step": 662954, "epoch": 7987} {"train_loss": -28.155248641967773, "global_step": 662955, "epoch": 7987} {"train_loss": -28.448017120361328, "global_step": 662956, "epoch": 7987} {"train_loss": -27.8116455078125, "global_step": 662957, "epoch": 7987} {"train_loss": -28.3354549407959, "global_step": 662958, "epoch": 7987} {"train_loss": -28.29461097717285, "global_step": 662959, "epoch": 7987} {"train_loss": -27.956928253173828, "global_step": 662960, "epoch": 7987} {"train_loss": -27.7474365234375, "global_step": 662961, "epoch": 7987} {"train_loss": -28.045307159423828, "global_step": 662962, "epoch": 7987} {"train_loss": -28.44677734375, "global_step": 662963, "epoch": 7987} {"train_loss": -27.70171546936035, "global_step": 662964, "epoch": 7987} {"train_loss": -28.453821182250977, "global_step": 662965, "epoch": 7987} {"train_loss": -28.171972274780273, "global_step": 662966, "epoch": 7987} {"train_loss": -28.013843536376953, "global_step": 662967, "epoch": 7987} {"train_loss": -27.981891632080078, "global_step": 662968, "epoch": 7987} {"train_loss": -28.595264434814453, "global_step": 662969, "epoch": 7987} {"train_loss": -28.412992477416992, "global_step": 662970, "epoch": 7987} {"train_loss": -28.163259506225586, "global_step": 662971, "epoch": 7987} {"train_loss": -28.385848999023438, "global_step": 662972, "epoch": 7987} {"train_loss": -28.467370986938477, "global_step": 662973, "epoch": 7987} {"train_loss": -28.492313385009766, "global_step": 662974, "epoch": 7987} {"train_loss": -28.69087028503418, "global_step": 662975, "epoch": 7987} {"train_loss": -28.3140811920166, "global_step": 662976, "epoch": 7987} {"train_loss": -28.401105880737305, "global_step": 662977, "epoch": 7987} {"train_loss": -28.48744010925293, "global_step": 662978, "epoch": 7987} {"train_loss": -28.242115020751953, "global_step": 662979, "epoch": 7987} {"train_loss": -28.457014083862305, "global_step": 662980, "epoch": 7987} {"train_loss": -28.404489517211914, "global_step": 662981, "epoch": 7987} {"train_loss": -28.509241104125977, "global_step": 662982, "epoch": 7987} {"train_loss": -28.483169555664062, "global_step": 662983, "epoch": 7987} {"train_loss": -28.496267318725586, "global_step": 662984, "epoch": 7987} {"train_loss": -28.265893936157227, "global_step": 662985, "epoch": 7987} {"train_loss": -27.89682960510254, "global_step": 662986, "epoch": 7987} {"train_loss": -27.70282554626465, "global_step": 662987, "epoch": 7987} {"train_loss": -27.89015769958496, "global_step": 662988, "epoch": 7987} {"train_loss": -28.443517684936523, "global_step": 662989, "epoch": 7987} {"train_loss": -28.255786895751953, "global_step": 662990, "epoch": 7987} {"train_loss": -28.60056495666504, "global_step": 662991, "epoch": 7987} {"train_loss": -28.235944747924805, "global_step": 662992, "epoch": 7987} {"train_loss": -28.491830825805664, "global_step": 662993, "epoch": 7987} {"train_loss": -28.388280868530273, "global_step": 662994, "epoch": 7987} {"train_loss": -28.263761520385742, "global_step": 662995, "epoch": 7987} {"train_loss": -28.260602951049805, "global_step": 662996, "epoch": 7987} {"train_loss": -28.349567413330078, "global_step": 662997, "epoch": 7987} {"train_loss": -28.103254318237305, "global_step": 662998, "epoch": 7987} {"train_loss": -28.29591941833496, "global_step": 662999, "epoch": 7987} {"train_loss": -28.646930694580078, "global_step": 663000, "epoch": 7987} {"train_loss": -28.715967178344727, "global_step": 663001, "epoch": 7987} {"train_loss": -28.175134658813477, "global_step": 663002, "epoch": 7987} {"train_loss": -28.118995183921722, "global_step": 663003, "epoch": 7987, "val_loss": 6608110.0} {"train_loss": -27.977924346923828, "global_step": 663004, "epoch": 7988} {"train_loss": -27.64516258239746, "global_step": 663005, "epoch": 7988} {"train_loss": -27.845300674438477, "global_step": 663006, "epoch": 7988} {"train_loss": -27.805408477783203, "global_step": 663007, "epoch": 7988} {"train_loss": -27.804645538330078, "global_step": 663008, "epoch": 7988} {"train_loss": -27.898962020874023, "global_step": 663009, "epoch": 7988} {"train_loss": -28.1002197265625, "global_step": 663010, "epoch": 7988} {"train_loss": -27.8819637298584, "global_step": 663011, "epoch": 7988} {"train_loss": -28.456867218017578, "global_step": 663012, "epoch": 7988} {"train_loss": -27.585224151611328, "global_step": 663013, "epoch": 7988} {"train_loss": -28.297433853149414, "global_step": 663014, "epoch": 7988} {"train_loss": -28.415613174438477, "global_step": 663015, "epoch": 7988} {"train_loss": -27.649188995361328, "global_step": 663016, "epoch": 7988} {"train_loss": -28.42938804626465, "global_step": 663017, "epoch": 7988} {"train_loss": -27.94719886779785, "global_step": 663018, "epoch": 7988} {"train_loss": -28.012357711791992, "global_step": 663019, "epoch": 7988} {"train_loss": -28.064258575439453, "global_step": 663020, "epoch": 7988} {"train_loss": -28.27630615234375, "global_step": 663021, "epoch": 7988} {"train_loss": -28.363056182861328, "global_step": 663022, "epoch": 7988} {"train_loss": -28.175861358642578, "global_step": 663023, "epoch": 7988} {"train_loss": -28.26618766784668, "global_step": 663024, "epoch": 7988} {"train_loss": -28.327219009399414, "global_step": 663025, "epoch": 7988} {"train_loss": -28.275720596313477, "global_step": 663026, "epoch": 7988} {"train_loss": -28.313343048095703, "global_step": 663027, "epoch": 7988} {"train_loss": -28.291955947875977, "global_step": 663028, "epoch": 7988} {"train_loss": -28.205297470092773, "global_step": 663029, "epoch": 7988} {"train_loss": -28.30315589904785, "global_step": 663030, "epoch": 7988} {"train_loss": -28.156766891479492, "global_step": 663031, "epoch": 7988} {"train_loss": -28.256332397460938, "global_step": 663032, "epoch": 7988} {"train_loss": -28.281641006469727, "global_step": 663033, "epoch": 7988} {"train_loss": -28.328323364257812, "global_step": 663034, "epoch": 7988} {"train_loss": -28.108728408813477, "global_step": 663035, "epoch": 7988} {"train_loss": -28.62747573852539, "global_step": 663036, "epoch": 7988} {"train_loss": -28.58685874938965, "global_step": 663037, "epoch": 7988} {"train_loss": -28.30498695373535, "global_step": 663038, "epoch": 7988} {"train_loss": -28.44136619567871, "global_step": 663039, "epoch": 7988} {"train_loss": -28.4036865234375, "global_step": 663040, "epoch": 7988} {"train_loss": -28.693099975585938, "global_step": 663041, "epoch": 7988} {"train_loss": -28.338211059570312, "global_step": 663042, "epoch": 7988} {"train_loss": -28.562774658203125, "global_step": 663043, "epoch": 7988} {"train_loss": -28.785749435424805, "global_step": 663044, "epoch": 7988} {"train_loss": -28.678531646728516, "global_step": 663045, "epoch": 7988} {"train_loss": -28.661619186401367, "global_step": 663046, "epoch": 7988} {"train_loss": -28.678424835205078, "global_step": 663047, "epoch": 7988} {"train_loss": -28.547870635986328, "global_step": 663048, "epoch": 7988} {"train_loss": -28.661487579345703, "global_step": 663049, "epoch": 7988} {"train_loss": -28.580915451049805, "global_step": 663050, "epoch": 7988} {"train_loss": -28.354862213134766, "global_step": 663051, "epoch": 7988} {"train_loss": -28.778852462768555, "global_step": 663052, "epoch": 7988} {"train_loss": -28.78687858581543, "global_step": 663053, "epoch": 7988} {"train_loss": -28.5183048248291, "global_step": 663054, "epoch": 7988} {"train_loss": -28.738752365112305, "global_step": 663055, "epoch": 7988} {"train_loss": -28.5870304107666, "global_step": 663056, "epoch": 7988} {"train_loss": -28.4475154876709, "global_step": 663057, "epoch": 7988} {"train_loss": -28.788497924804688, "global_step": 663058, "epoch": 7988} {"train_loss": -28.574848175048828, "global_step": 663059, "epoch": 7988} {"train_loss": -28.644113540649414, "global_step": 663060, "epoch": 7988} {"train_loss": -28.140893936157227, "global_step": 663061, "epoch": 7988} {"train_loss": -28.976734161376953, "global_step": 663062, "epoch": 7988} {"train_loss": -28.2839412689209, "global_step": 663063, "epoch": 7988} {"train_loss": -28.678791046142578, "global_step": 663064, "epoch": 7988} {"train_loss": -28.569366455078125, "global_step": 663065, "epoch": 7988} {"train_loss": -28.791593551635742, "global_step": 663066, "epoch": 7988} {"train_loss": -28.305908203125, "global_step": 663067, "epoch": 7988} {"train_loss": -28.503671646118164, "global_step": 663068, "epoch": 7988} {"train_loss": -28.370019912719727, "global_step": 663069, "epoch": 7988} {"train_loss": -28.223011016845703, "global_step": 663070, "epoch": 7988} {"train_loss": -28.958221435546875, "global_step": 663071, "epoch": 7988} {"train_loss": -27.952611923217773, "global_step": 663072, "epoch": 7988} {"train_loss": -28.74729347229004, "global_step": 663073, "epoch": 7988} {"train_loss": -28.081125259399414, "global_step": 663074, "epoch": 7988} {"train_loss": -28.838476181030273, "global_step": 663075, "epoch": 7988} {"train_loss": -27.96902847290039, "global_step": 663076, "epoch": 7988} {"train_loss": -28.30767250061035, "global_step": 663077, "epoch": 7988} {"train_loss": -28.272781372070312, "global_step": 663078, "epoch": 7988} {"train_loss": -28.524017333984375, "global_step": 663079, "epoch": 7988} {"train_loss": -28.25601577758789, "global_step": 663080, "epoch": 7988} {"train_loss": -28.556365966796875, "global_step": 663081, "epoch": 7988} {"train_loss": -28.367002487182617, "global_step": 663082, "epoch": 7988} {"train_loss": -28.389272689819336, "global_step": 663083, "epoch": 7988} {"train_loss": -28.708539962768555, "global_step": 663084, "epoch": 7988} {"train_loss": -28.5654239654541, "global_step": 663085, "epoch": 7988} {"train_loss": -28.367518735219196, "global_step": 663086, "epoch": 7988, "val_loss": 6672026.0} {"train_loss": -28.188186645507812, "global_step": 663087, "epoch": 7989} {"train_loss": -28.092267990112305, "global_step": 663088, "epoch": 7989} {"train_loss": -27.68110466003418, "global_step": 663089, "epoch": 7989} {"train_loss": -27.75421714782715, "global_step": 663090, "epoch": 7989} {"train_loss": -27.512670516967773, "global_step": 663091, "epoch": 7989} {"train_loss": -26.970373153686523, "global_step": 663092, "epoch": 7989} {"train_loss": -27.314069747924805, "global_step": 663093, "epoch": 7989} {"train_loss": -27.712141036987305, "global_step": 663094, "epoch": 7989} {"train_loss": -28.272003173828125, "global_step": 663095, "epoch": 7989} {"train_loss": -28.154376983642578, "global_step": 663096, "epoch": 7989} {"train_loss": -27.83588981628418, "global_step": 663097, "epoch": 7989} {"train_loss": -28.022186279296875, "global_step": 663098, "epoch": 7989} {"train_loss": -28.22566032409668, "global_step": 663099, "epoch": 7989} {"train_loss": -28.215051651000977, "global_step": 663100, "epoch": 7989} {"train_loss": -28.414392471313477, "global_step": 663101, "epoch": 7989} {"train_loss": -28.421844482421875, "global_step": 663102, "epoch": 7989} {"train_loss": -28.604156494140625, "global_step": 663103, "epoch": 7989} {"train_loss": -28.24439811706543, "global_step": 663104, "epoch": 7989} {"train_loss": -28.50217056274414, "global_step": 663105, "epoch": 7989} {"train_loss": -28.19427490234375, "global_step": 663106, "epoch": 7989} {"train_loss": -28.628162384033203, "global_step": 663107, "epoch": 7989} {"train_loss": -28.217395782470703, "global_step": 663108, "epoch": 7989} {"train_loss": -28.362640380859375, "global_step": 663109, "epoch": 7989} {"train_loss": -28.28266716003418, "global_step": 663110, "epoch": 7989} {"train_loss": -28.157703399658203, "global_step": 663111, "epoch": 7989} {"train_loss": -28.366851806640625, "global_step": 663112, "epoch": 7989} {"train_loss": -28.229511260986328, "global_step": 663113, "epoch": 7989} {"train_loss": -28.207305908203125, "global_step": 663114, "epoch": 7989} {"train_loss": -28.001310348510742, "global_step": 663115, "epoch": 7989} {"train_loss": -28.21668815612793, "global_step": 663116, "epoch": 7989} {"train_loss": -28.752145767211914, "global_step": 663117, "epoch": 7989} {"train_loss": -28.36785316467285, "global_step": 663118, "epoch": 7989} {"train_loss": -28.440526962280273, "global_step": 663119, "epoch": 7989} {"train_loss": -28.56570816040039, "global_step": 663120, "epoch": 7989} {"train_loss": -28.636337280273438, "global_step": 663121, "epoch": 7989} {"train_loss": -28.376941680908203, "global_step": 663122, "epoch": 7989} {"train_loss": -28.395788192749023, "global_step": 663123, "epoch": 7989} {"train_loss": -28.506010055541992, "global_step": 663124, "epoch": 7989} {"train_loss": -28.126245498657227, "global_step": 663125, "epoch": 7989} {"train_loss": -28.52162742614746, "global_step": 663126, "epoch": 7989} {"train_loss": -28.36602783203125, "global_step": 663127, "epoch": 7989} {"train_loss": -28.570575714111328, "global_step": 663128, "epoch": 7989} {"train_loss": -28.5405330657959, "global_step": 663129, "epoch": 7989} {"train_loss": -28.486127853393555, "global_step": 663130, "epoch": 7989} {"train_loss": -28.609472274780273, "global_step": 663131, "epoch": 7989} {"train_loss": -28.666860580444336, "global_step": 663132, "epoch": 7989} {"train_loss": -28.48236656188965, "global_step": 663133, "epoch": 7989} {"train_loss": -28.298749923706055, "global_step": 663134, "epoch": 7989} {"train_loss": -28.622888565063477, "global_step": 663135, "epoch": 7989} {"train_loss": -28.374608993530273, "global_step": 663136, "epoch": 7989} {"train_loss": -28.314489364624023, "global_step": 663137, "epoch": 7989} {"train_loss": -28.337482452392578, "global_step": 663138, "epoch": 7989} {"train_loss": -28.298166275024414, "global_step": 663139, "epoch": 7989} {"train_loss": -29.02772331237793, "global_step": 663140, "epoch": 7989} {"train_loss": -28.54352378845215, "global_step": 663141, "epoch": 7989} {"train_loss": -28.450214385986328, "global_step": 663142, "epoch": 7989} {"train_loss": -28.434247970581055, "global_step": 663143, "epoch": 7989} {"train_loss": -28.6822566986084, "global_step": 663144, "epoch": 7989} {"train_loss": -28.494104385375977, "global_step": 663145, "epoch": 7989} {"train_loss": -28.47391700744629, "global_step": 663146, "epoch": 7989} {"train_loss": -28.69221305847168, "global_step": 663147, "epoch": 7989} {"train_loss": -28.766218185424805, "global_step": 663148, "epoch": 7989} {"train_loss": -28.274587631225586, "global_step": 663149, "epoch": 7989} {"train_loss": -27.758594512939453, "global_step": 663150, "epoch": 7989} {"train_loss": -28.067678451538086, "global_step": 663151, "epoch": 7989} {"train_loss": -28.88006591796875, "global_step": 663152, "epoch": 7989} {"train_loss": -28.55963706970215, "global_step": 663153, "epoch": 7989} {"train_loss": -28.47607421875, "global_step": 663154, "epoch": 7989} {"train_loss": -28.673139572143555, "global_step": 663155, "epoch": 7989} {"train_loss": -27.706161499023438, "global_step": 663156, "epoch": 7989} {"train_loss": -27.976104736328125, "global_step": 663157, "epoch": 7989} {"train_loss": -28.536218643188477, "global_step": 663158, "epoch": 7989} {"train_loss": -28.34185791015625, "global_step": 663159, "epoch": 7989} {"train_loss": -28.296003341674805, "global_step": 663160, "epoch": 7989} {"train_loss": -28.11248779296875, "global_step": 663161, "epoch": 7989} {"train_loss": -27.930728912353516, "global_step": 663162, "epoch": 7989} {"train_loss": -27.616769790649414, "global_step": 663163, "epoch": 7989} {"train_loss": -27.873767852783203, "global_step": 663164, "epoch": 7989} {"train_loss": -28.601642608642578, "global_step": 663165, "epoch": 7989} {"train_loss": -28.26871109008789, "global_step": 663166, "epoch": 7989} {"train_loss": -28.319360733032227, "global_step": 663167, "epoch": 7989} {"train_loss": -28.474323272705078, "global_step": 663168, "epoch": 7989} {"train_loss": -28.296375642339868, "global_step": 663169, "epoch": 7989, "val_loss": 6687486.0} {"train_loss": -25.983728408813477, "global_step": 663170, "epoch": 7990} {"train_loss": -27.286483764648438, "global_step": 663171, "epoch": 7990} {"train_loss": -27.55865478515625, "global_step": 663172, "epoch": 7990} {"train_loss": -27.116113662719727, "global_step": 663173, "epoch": 7990} {"train_loss": -27.500364303588867, "global_step": 663174, "epoch": 7990} {"train_loss": -27.362329483032227, "global_step": 663175, "epoch": 7990} {"train_loss": -27.50882911682129, "global_step": 663176, "epoch": 7990} {"train_loss": -27.529062271118164, "global_step": 663177, "epoch": 7990} {"train_loss": -27.82874870300293, "global_step": 663178, "epoch": 7990} {"train_loss": -27.4672794342041, "global_step": 663179, "epoch": 7990} {"train_loss": -27.8148136138916, "global_step": 663180, "epoch": 7990} {"train_loss": -27.57293701171875, "global_step": 663181, "epoch": 7990} {"train_loss": -28.010839462280273, "global_step": 663182, "epoch": 7990} {"train_loss": -27.436023712158203, "global_step": 663183, "epoch": 7990} {"train_loss": -28.0289306640625, "global_step": 663184, "epoch": 7990} {"train_loss": -27.504047393798828, "global_step": 663185, "epoch": 7990} {"train_loss": -27.871002197265625, "global_step": 663186, "epoch": 7990} {"train_loss": -27.807300567626953, "global_step": 663187, "epoch": 7990} {"train_loss": -28.017898559570312, "global_step": 663188, "epoch": 7990} {"train_loss": -28.17502784729004, "global_step": 663189, "epoch": 7990} {"train_loss": -28.205097198486328, "global_step": 663190, "epoch": 7990} {"train_loss": -28.4633731842041, "global_step": 663191, "epoch": 7990} {"train_loss": -27.69959831237793, "global_step": 663192, "epoch": 7990} {"train_loss": -28.527090072631836, "global_step": 663193, "epoch": 7990} {"train_loss": -28.07839012145996, "global_step": 663194, "epoch": 7990} {"train_loss": -28.477441787719727, "global_step": 663195, "epoch": 7990} {"train_loss": -28.39155387878418, "global_step": 663196, "epoch": 7990} {"train_loss": -28.462493896484375, "global_step": 663197, "epoch": 7990} {"train_loss": -28.38653564453125, "global_step": 663198, "epoch": 7990} {"train_loss": -28.274198532104492, "global_step": 663199, "epoch": 7990} {"train_loss": -28.140247344970703, "global_step": 663200, "epoch": 7990} {"train_loss": -28.261322021484375, "global_step": 663201, "epoch": 7990} {"train_loss": -28.646215438842773, "global_step": 663202, "epoch": 7990} {"train_loss": -28.23394203186035, "global_step": 663203, "epoch": 7990} {"train_loss": -28.23194694519043, "global_step": 663204, "epoch": 7990} {"train_loss": -28.508285522460938, "global_step": 663205, "epoch": 7990} {"train_loss": -28.76375389099121, "global_step": 663206, "epoch": 7990} {"train_loss": -28.468021392822266, "global_step": 663207, "epoch": 7990} {"train_loss": -28.375732421875, "global_step": 663208, "epoch": 7990} {"train_loss": -28.50660514831543, "global_step": 663209, "epoch": 7990} {"train_loss": -28.52127456665039, "global_step": 663210, "epoch": 7990} {"train_loss": -28.374866485595703, "global_step": 663211, "epoch": 7990} {"train_loss": -28.5936336517334, "global_step": 663212, "epoch": 7990} {"train_loss": -28.677021026611328, "global_step": 663213, "epoch": 7990} {"train_loss": -28.578107833862305, "global_step": 663214, "epoch": 7990} {"train_loss": -28.45026969909668, "global_step": 663215, "epoch": 7990} {"train_loss": -28.573150634765625, "global_step": 663216, "epoch": 7990} {"train_loss": -28.999622344970703, "global_step": 663217, "epoch": 7990} {"train_loss": -28.788156509399414, "global_step": 663218, "epoch": 7990} {"train_loss": -28.653827667236328, "global_step": 663219, "epoch": 7990} {"train_loss": -28.68165397644043, "global_step": 663220, "epoch": 7990} {"train_loss": -28.564783096313477, "global_step": 663221, "epoch": 7990} {"train_loss": -28.756885528564453, "global_step": 663222, "epoch": 7990} {"train_loss": -28.337329864501953, "global_step": 663223, "epoch": 7990} {"train_loss": -28.767065048217773, "global_step": 663224, "epoch": 7990} {"train_loss": -28.539472579956055, "global_step": 663225, "epoch": 7990} {"train_loss": -28.71674156188965, "global_step": 663226, "epoch": 7990} {"train_loss": -28.733686447143555, "global_step": 663227, "epoch": 7990} {"train_loss": -28.484338760375977, "global_step": 663228, "epoch": 7990} {"train_loss": -28.716205596923828, "global_step": 663229, "epoch": 7990} {"train_loss": -28.536108016967773, "global_step": 663230, "epoch": 7990} {"train_loss": -28.545618057250977, "global_step": 663231, "epoch": 7990} {"train_loss": -29.008527755737305, "global_step": 663232, "epoch": 7990} {"train_loss": -28.16425895690918, "global_step": 663233, "epoch": 7990} {"train_loss": -28.80512809753418, "global_step": 663234, "epoch": 7990} {"train_loss": -28.3855037689209, "global_step": 663235, "epoch": 7990} {"train_loss": -28.149658203125, "global_step": 663236, "epoch": 7990} {"train_loss": -28.473230361938477, "global_step": 663237, "epoch": 7990} {"train_loss": -28.27936363220215, "global_step": 663238, "epoch": 7990} {"train_loss": -28.446258544921875, "global_step": 663239, "epoch": 7990} {"train_loss": -28.315887451171875, "global_step": 663240, "epoch": 7990} {"train_loss": -28.298315048217773, "global_step": 663241, "epoch": 7990} {"train_loss": -27.944793701171875, "global_step": 663242, "epoch": 7990} {"train_loss": -28.367456436157227, "global_step": 663243, "epoch": 7990} {"train_loss": -28.049802780151367, "global_step": 663244, "epoch": 7990} {"train_loss": -27.97979736328125, "global_step": 663245, "epoch": 7990} {"train_loss": -27.9561824798584, "global_step": 663246, "epoch": 7990} {"train_loss": -27.79042625427246, "global_step": 663247, "epoch": 7990} {"train_loss": -28.569013595581055, "global_step": 663248, "epoch": 7990} {"train_loss": -28.325231552124023, "global_step": 663249, "epoch": 7990} {"train_loss": -28.26494789123535, "global_step": 663250, "epoch": 7990} {"train_loss": -28.233062744140625, "global_step": 663251, "epoch": 7990} {"train_loss": -28.218186504869575, "global_step": 663252, "epoch": 7990, "val_loss": 6653848.0} {"train_loss": -24.8649959564209, "global_step": 663253, "epoch": 7991} {"train_loss": -25.771215438842773, "global_step": 663254, "epoch": 7991} {"train_loss": -27.23488426208496, "global_step": 663255, "epoch": 7991} {"train_loss": -24.321317672729492, "global_step": 663256, "epoch": 7991} {"train_loss": -25.504423141479492, "global_step": 663257, "epoch": 7991} {"train_loss": -26.70516014099121, "global_step": 663258, "epoch": 7991} {"train_loss": -25.08271598815918, "global_step": 663259, "epoch": 7991} {"train_loss": -27.206485748291016, "global_step": 663260, "epoch": 7991} {"train_loss": -25.956878662109375, "global_step": 663261, "epoch": 7991} {"train_loss": -26.93110466003418, "global_step": 663262, "epoch": 7991} {"train_loss": -26.903778076171875, "global_step": 663263, "epoch": 7991} {"train_loss": -27.068744659423828, "global_step": 663264, "epoch": 7991} {"train_loss": -27.1737117767334, "global_step": 663265, "epoch": 7991} {"train_loss": -27.25886344909668, "global_step": 663266, "epoch": 7991} {"train_loss": -27.31565284729004, "global_step": 663267, "epoch": 7991} {"train_loss": -26.3817195892334, "global_step": 663268, "epoch": 7991} {"train_loss": -27.287710189819336, "global_step": 663269, "epoch": 7991} {"train_loss": -27.163105010986328, "global_step": 663270, "epoch": 7991} {"train_loss": -27.37384033203125, "global_step": 663271, "epoch": 7991} {"train_loss": -27.520776748657227, "global_step": 663272, "epoch": 7991} {"train_loss": -27.684621810913086, "global_step": 663273, "epoch": 7991} {"train_loss": -27.26706314086914, "global_step": 663274, "epoch": 7991} {"train_loss": -27.806354522705078, "global_step": 663275, "epoch": 7991} {"train_loss": -27.242883682250977, "global_step": 663276, "epoch": 7991} {"train_loss": -27.677692413330078, "global_step": 663277, "epoch": 7991} {"train_loss": -27.767292022705078, "global_step": 663278, "epoch": 7991} {"train_loss": -27.79414176940918, "global_step": 663279, "epoch": 7991} {"train_loss": -27.617151260375977, "global_step": 663280, "epoch": 7991} {"train_loss": -27.841999053955078, "global_step": 663281, "epoch": 7991} {"train_loss": -27.90285301208496, "global_step": 663282, "epoch": 7991} {"train_loss": -27.741424560546875, "global_step": 663283, "epoch": 7991} {"train_loss": -27.9737491607666, "global_step": 663284, "epoch": 7991} {"train_loss": -27.862014770507812, "global_step": 663285, "epoch": 7991} {"train_loss": -28.128320693969727, "global_step": 663286, "epoch": 7991} {"train_loss": -28.228734970092773, "global_step": 663287, "epoch": 7991} {"train_loss": -27.951444625854492, "global_step": 663288, "epoch": 7991} {"train_loss": -27.96695899963379, "global_step": 663289, "epoch": 7991} {"train_loss": -27.98321533203125, "global_step": 663290, "epoch": 7991} {"train_loss": -27.801061630249023, "global_step": 663291, "epoch": 7991} {"train_loss": -28.37005043029785, "global_step": 663292, "epoch": 7991} {"train_loss": -27.9824275970459, "global_step": 663293, "epoch": 7991} {"train_loss": -28.546955108642578, "global_step": 663294, "epoch": 7991} {"train_loss": -28.342132568359375, "global_step": 663295, "epoch": 7991} {"train_loss": -28.26812744140625, "global_step": 663296, "epoch": 7991} {"train_loss": -28.384246826171875, "global_step": 663297, "epoch": 7991} {"train_loss": -27.97347068786621, "global_step": 663298, "epoch": 7991} {"train_loss": -28.297632217407227, "global_step": 663299, "epoch": 7991} {"train_loss": -28.23014259338379, "global_step": 663300, "epoch": 7991} {"train_loss": -28.242706298828125, "global_step": 663301, "epoch": 7991} {"train_loss": -28.384275436401367, "global_step": 663302, "epoch": 7991} {"train_loss": -28.339941024780273, "global_step": 663303, "epoch": 7991} {"train_loss": -28.206029891967773, "global_step": 663304, "epoch": 7991} {"train_loss": -28.53474998474121, "global_step": 663305, "epoch": 7991} {"train_loss": -28.241235733032227, "global_step": 663306, "epoch": 7991} {"train_loss": -28.44610595703125, "global_step": 663307, "epoch": 7991} {"train_loss": -28.75540542602539, "global_step": 663308, "epoch": 7991} {"train_loss": -28.22584342956543, "global_step": 663309, "epoch": 7991} {"train_loss": -28.22857093811035, "global_step": 663310, "epoch": 7991} {"train_loss": -28.3311767578125, "global_step": 663311, "epoch": 7991} {"train_loss": -28.495086669921875, "global_step": 663312, "epoch": 7991} {"train_loss": -28.004358291625977, "global_step": 663313, "epoch": 7991} {"train_loss": -28.376676559448242, "global_step": 663314, "epoch": 7991} {"train_loss": -28.491744995117188, "global_step": 663315, "epoch": 7991} {"train_loss": -28.618427276611328, "global_step": 663316, "epoch": 7991} {"train_loss": -28.266555786132812, "global_step": 663317, "epoch": 7991} {"train_loss": -28.20722007751465, "global_step": 663318, "epoch": 7991} {"train_loss": -28.306798934936523, "global_step": 663319, "epoch": 7991} {"train_loss": -29.149381637573242, "global_step": 663320, "epoch": 7991} {"train_loss": -28.701059341430664, "global_step": 663321, "epoch": 7991} {"train_loss": -28.61774253845215, "global_step": 663322, "epoch": 7991} {"train_loss": -28.46197509765625, "global_step": 663323, "epoch": 7991} {"train_loss": -28.532352447509766, "global_step": 663324, "epoch": 7991} {"train_loss": -28.192306518554688, "global_step": 663325, "epoch": 7991} {"train_loss": -28.673404693603516, "global_step": 663326, "epoch": 7991} {"train_loss": -28.57865333557129, "global_step": 663327, "epoch": 7991} {"train_loss": -28.249719619750977, "global_step": 663328, "epoch": 7991} {"train_loss": -28.62269401550293, "global_step": 663329, "epoch": 7991} {"train_loss": -28.413297653198242, "global_step": 663330, "epoch": 7991} {"train_loss": -28.648178100585938, "global_step": 663331, "epoch": 7991} {"train_loss": -28.42340660095215, "global_step": 663332, "epoch": 7991} {"train_loss": -28.364938735961914, "global_step": 663333, "epoch": 7991} {"train_loss": -28.693572998046875, "global_step": 663334, "epoch": 7991} {"train_loss": -27.83216747605657, "global_step": 663335, "epoch": 7991, "val_loss": 6701667.0} {"train_loss": -27.44415855407715, "global_step": 663336, "epoch": 7992} {"train_loss": -27.225324630737305, "global_step": 663337, "epoch": 7992} {"train_loss": -26.995817184448242, "global_step": 663338, "epoch": 7992} {"train_loss": -28.022069931030273, "global_step": 663339, "epoch": 7992} {"train_loss": -27.5960750579834, "global_step": 663340, "epoch": 7992} {"train_loss": -27.7810115814209, "global_step": 663341, "epoch": 7992} {"train_loss": -27.762592315673828, "global_step": 663342, "epoch": 7992} {"train_loss": -27.573312759399414, "global_step": 663343, "epoch": 7992} {"train_loss": -27.615976333618164, "global_step": 663344, "epoch": 7992} {"train_loss": -27.551700592041016, "global_step": 663345, "epoch": 7992} {"train_loss": -27.767120361328125, "global_step": 663346, "epoch": 7992} {"train_loss": -28.0003604888916, "global_step": 663347, "epoch": 7992} {"train_loss": -28.031997680664062, "global_step": 663348, "epoch": 7992} {"train_loss": -27.85354995727539, "global_step": 663349, "epoch": 7992} {"train_loss": -27.970321655273438, "global_step": 663350, "epoch": 7992} {"train_loss": -27.919208526611328, "global_step": 663351, "epoch": 7992} {"train_loss": -28.34364128112793, "global_step": 663352, "epoch": 7992} {"train_loss": -27.968236923217773, "global_step": 663353, "epoch": 7992} {"train_loss": -27.778656005859375, "global_step": 663354, "epoch": 7992} {"train_loss": -27.903858184814453, "global_step": 663355, "epoch": 7992} {"train_loss": -27.996475219726562, "global_step": 663356, "epoch": 7992} {"train_loss": -28.097448348999023, "global_step": 663357, "epoch": 7992} {"train_loss": -28.3809814453125, "global_step": 663358, "epoch": 7992} {"train_loss": -28.079803466796875, "global_step": 663359, "epoch": 7992} {"train_loss": -28.47389030456543, "global_step": 663360, "epoch": 7992} {"train_loss": -28.237226486206055, "global_step": 663361, "epoch": 7992} {"train_loss": -28.223493576049805, "global_step": 663362, "epoch": 7992} {"train_loss": -28.514911651611328, "global_step": 663363, "epoch": 7992} {"train_loss": -28.548095703125, "global_step": 663364, "epoch": 7992} {"train_loss": -28.302820205688477, "global_step": 663365, "epoch": 7992} {"train_loss": -28.436603546142578, "global_step": 663366, "epoch": 7992} {"train_loss": -28.19769859313965, "global_step": 663367, "epoch": 7992} {"train_loss": -28.417829513549805, "global_step": 663368, "epoch": 7992} {"train_loss": -28.453027725219727, "global_step": 663369, "epoch": 7992} {"train_loss": -28.567651748657227, "global_step": 663370, "epoch": 7992} {"train_loss": -28.428815841674805, "global_step": 663371, "epoch": 7992} {"train_loss": -28.524139404296875, "global_step": 663372, "epoch": 7992} {"train_loss": -28.207000732421875, "global_step": 663373, "epoch": 7992} {"train_loss": -28.616363525390625, "global_step": 663374, "epoch": 7992} {"train_loss": -28.489423751831055, "global_step": 663375, "epoch": 7992} {"train_loss": -28.723403930664062, "global_step": 663376, "epoch": 7992} {"train_loss": -28.70050621032715, "global_step": 663377, "epoch": 7992} {"train_loss": -28.842416763305664, "global_step": 663378, "epoch": 7992} {"train_loss": -28.504430770874023, "global_step": 663379, "epoch": 7992} {"train_loss": -28.30280113220215, "global_step": 663380, "epoch": 7992} {"train_loss": -28.648883819580078, "global_step": 663381, "epoch": 7992} {"train_loss": -28.474462509155273, "global_step": 663382, "epoch": 7992} {"train_loss": -28.52264404296875, "global_step": 663383, "epoch": 7992} {"train_loss": -28.300989151000977, "global_step": 663384, "epoch": 7992} {"train_loss": -28.611120223999023, "global_step": 663385, "epoch": 7992} {"train_loss": -28.728750228881836, "global_step": 663386, "epoch": 7992} {"train_loss": -28.07559585571289, "global_step": 663387, "epoch": 7992} {"train_loss": -28.215042114257812, "global_step": 663388, "epoch": 7992} {"train_loss": -27.877750396728516, "global_step": 663389, "epoch": 7992} {"train_loss": -28.343481063842773, "global_step": 663390, "epoch": 7992} {"train_loss": -28.213048934936523, "global_step": 663391, "epoch": 7992} {"train_loss": -28.51114845275879, "global_step": 663392, "epoch": 7992} {"train_loss": -28.521453857421875, "global_step": 663393, "epoch": 7992} {"train_loss": -28.286035537719727, "global_step": 663394, "epoch": 7992} {"train_loss": -28.099517822265625, "global_step": 663395, "epoch": 7992} {"train_loss": -28.4669246673584, "global_step": 663396, "epoch": 7992} {"train_loss": -28.710458755493164, "global_step": 663397, "epoch": 7992} {"train_loss": -28.097448348999023, "global_step": 663398, "epoch": 7992} {"train_loss": -27.973499298095703, "global_step": 663399, "epoch": 7992} {"train_loss": -28.44211769104004, "global_step": 663400, "epoch": 7992} {"train_loss": -28.313812255859375, "global_step": 663401, "epoch": 7992} {"train_loss": -28.475040435791016, "global_step": 663402, "epoch": 7992} {"train_loss": -28.307397842407227, "global_step": 663403, "epoch": 7992} {"train_loss": -27.907556533813477, "global_step": 663404, "epoch": 7992} {"train_loss": -28.38288688659668, "global_step": 663405, "epoch": 7992} {"train_loss": -28.365299224853516, "global_step": 663406, "epoch": 7992} {"train_loss": -27.810850143432617, "global_step": 663407, "epoch": 7992} {"train_loss": -27.334074020385742, "global_step": 663408, "epoch": 7992} {"train_loss": -28.00795555114746, "global_step": 663409, "epoch": 7992} {"train_loss": -27.911548614501953, "global_step": 663410, "epoch": 7992} {"train_loss": -27.639013290405273, "global_step": 663411, "epoch": 7992} {"train_loss": -28.633655548095703, "global_step": 663412, "epoch": 7992} {"train_loss": -27.989282608032227, "global_step": 663413, "epoch": 7992} {"train_loss": -27.967382431030273, "global_step": 663414, "epoch": 7992} {"train_loss": -28.08002281188965, "global_step": 663415, "epoch": 7992} {"train_loss": -28.490070343017578, "global_step": 663416, "epoch": 7992} {"train_loss": -28.03621482849121, "global_step": 663417, "epoch": 7992} {"train_loss": -28.180360380425512, "global_step": 663418, "epoch": 7992, "val_loss": 6690697.0} {"train_loss": -27.5714168548584, "global_step": 663419, "epoch": 7993} {"train_loss": -27.8299560546875, "global_step": 663420, "epoch": 7993} {"train_loss": -27.48495864868164, "global_step": 663421, "epoch": 7993} {"train_loss": -28.118839263916016, "global_step": 663422, "epoch": 7993} {"train_loss": -28.01397705078125, "global_step": 663423, "epoch": 7993} {"train_loss": -27.969411849975586, "global_step": 663424, "epoch": 7993} {"train_loss": -28.213733673095703, "global_step": 663425, "epoch": 7993} {"train_loss": -28.019073486328125, "global_step": 663426, "epoch": 7993} {"train_loss": -27.90410804748535, "global_step": 663427, "epoch": 7993} {"train_loss": -28.038633346557617, "global_step": 663428, "epoch": 7993} {"train_loss": -27.91761589050293, "global_step": 663429, "epoch": 7993} {"train_loss": -27.94013023376465, "global_step": 663430, "epoch": 7993} {"train_loss": -28.031904220581055, "global_step": 663431, "epoch": 7993} {"train_loss": -28.16341209411621, "global_step": 663432, "epoch": 7993} {"train_loss": -28.258825302124023, "global_step": 663433, "epoch": 7993} {"train_loss": -28.243844985961914, "global_step": 663434, "epoch": 7993} {"train_loss": -28.08852195739746, "global_step": 663435, "epoch": 7993} {"train_loss": -28.144805908203125, "global_step": 663436, "epoch": 7993} {"train_loss": -28.210050582885742, "global_step": 663437, "epoch": 7993} {"train_loss": -27.932327270507812, "global_step": 663438, "epoch": 7993} {"train_loss": -28.15569496154785, "global_step": 663439, "epoch": 7993} {"train_loss": -28.425634384155273, "global_step": 663440, "epoch": 7993} {"train_loss": -28.5308837890625, "global_step": 663441, "epoch": 7993} {"train_loss": -28.20758056640625, "global_step": 663442, "epoch": 7993} {"train_loss": -28.150665283203125, "global_step": 663443, "epoch": 7993} {"train_loss": -27.90093421936035, "global_step": 663444, "epoch": 7993} {"train_loss": -28.628131866455078, "global_step": 663445, "epoch": 7993} {"train_loss": -28.165180206298828, "global_step": 663446, "epoch": 7993} {"train_loss": -27.781299591064453, "global_step": 663447, "epoch": 7993} {"train_loss": -27.913589477539062, "global_step": 663448, "epoch": 7993} {"train_loss": -27.8773250579834, "global_step": 663449, "epoch": 7993} {"train_loss": -28.404529571533203, "global_step": 663450, "epoch": 7993} {"train_loss": -28.53162956237793, "global_step": 663451, "epoch": 7993} {"train_loss": -28.020353317260742, "global_step": 663452, "epoch": 7993} {"train_loss": -28.314062118530273, "global_step": 663453, "epoch": 7993} {"train_loss": -28.301843643188477, "global_step": 663454, "epoch": 7993} {"train_loss": -27.711685180664062, "global_step": 663455, "epoch": 7993} {"train_loss": -27.80316162109375, "global_step": 663456, "epoch": 7993} {"train_loss": -28.55820655822754, "global_step": 663457, "epoch": 7993} {"train_loss": -28.0106143951416, "global_step": 663458, "epoch": 7993} {"train_loss": -27.815235137939453, "global_step": 663459, "epoch": 7993} {"train_loss": -28.449193954467773, "global_step": 663460, "epoch": 7993} {"train_loss": -27.931676864624023, "global_step": 663461, "epoch": 7993} {"train_loss": -28.52992820739746, "global_step": 663462, "epoch": 7993} {"train_loss": -28.193933486938477, "global_step": 663463, "epoch": 7993} {"train_loss": -28.373798370361328, "global_step": 663464, "epoch": 7993} {"train_loss": -28.00369644165039, "global_step": 663465, "epoch": 7993} {"train_loss": -28.62186050415039, "global_step": 663466, "epoch": 7993} {"train_loss": -27.719715118408203, "global_step": 663467, "epoch": 7993} {"train_loss": -28.17990493774414, "global_step": 663468, "epoch": 7993} {"train_loss": -28.617834091186523, "global_step": 663469, "epoch": 7993} {"train_loss": -28.547988891601562, "global_step": 663470, "epoch": 7993} {"train_loss": -28.279394149780273, "global_step": 663471, "epoch": 7993} {"train_loss": -28.388681411743164, "global_step": 663472, "epoch": 7993} {"train_loss": -28.836353302001953, "global_step": 663473, "epoch": 7993} {"train_loss": -28.408727645874023, "global_step": 663474, "epoch": 7993} {"train_loss": -28.1812686920166, "global_step": 663475, "epoch": 7993} {"train_loss": -28.54170036315918, "global_step": 663476, "epoch": 7993} {"train_loss": -28.394758224487305, "global_step": 663477, "epoch": 7993} {"train_loss": -28.645404815673828, "global_step": 663478, "epoch": 7993} {"train_loss": -28.64027214050293, "global_step": 663479, "epoch": 7993} {"train_loss": -28.53567886352539, "global_step": 663480, "epoch": 7993} {"train_loss": -28.34308433532715, "global_step": 663481, "epoch": 7993} {"train_loss": -28.804187774658203, "global_step": 663482, "epoch": 7993} {"train_loss": -28.33172035217285, "global_step": 663483, "epoch": 7993} {"train_loss": -28.68646812438965, "global_step": 663484, "epoch": 7993} {"train_loss": -28.494611740112305, "global_step": 663485, "epoch": 7993} {"train_loss": -28.518869400024414, "global_step": 663486, "epoch": 7993} {"train_loss": -28.755475997924805, "global_step": 663487, "epoch": 7993} {"train_loss": -28.39349365234375, "global_step": 663488, "epoch": 7993} {"train_loss": -28.112329483032227, "global_step": 663489, "epoch": 7993} {"train_loss": -28.658573150634766, "global_step": 663490, "epoch": 7993} {"train_loss": -28.479536056518555, "global_step": 663491, "epoch": 7993} {"train_loss": -28.246356964111328, "global_step": 663492, "epoch": 7993} {"train_loss": -27.7935733795166, "global_step": 663493, "epoch": 7993} {"train_loss": -28.470661163330078, "global_step": 663494, "epoch": 7993} {"train_loss": -28.9600772857666, "global_step": 663495, "epoch": 7993} {"train_loss": -27.59175682067871, "global_step": 663496, "epoch": 7993} {"train_loss": -28.665624618530273, "global_step": 663497, "epoch": 7993} {"train_loss": -27.99403190612793, "global_step": 663498, "epoch": 7993} {"train_loss": -28.209152221679688, "global_step": 663499, "epoch": 7993} {"train_loss": -27.800275802612305, "global_step": 663500, "epoch": 7993} {"train_loss": -28.21969395373241, "global_step": 663501, "epoch": 7993, "val_loss": 6737458.0} {"train_loss": -28.0423583984375, "global_step": 663502, "epoch": 7994} {"train_loss": -27.5106258392334, "global_step": 663503, "epoch": 7994} {"train_loss": -27.641937255859375, "global_step": 663504, "epoch": 7994} {"train_loss": -28.326818466186523, "global_step": 663505, "epoch": 7994} {"train_loss": -27.560346603393555, "global_step": 663506, "epoch": 7994} {"train_loss": -27.862533569335938, "global_step": 663507, "epoch": 7994} {"train_loss": -28.160024642944336, "global_step": 663508, "epoch": 7994} {"train_loss": -27.014211654663086, "global_step": 663509, "epoch": 7994} {"train_loss": -28.003454208374023, "global_step": 663510, "epoch": 7994} {"train_loss": -27.918771743774414, "global_step": 663511, "epoch": 7994} {"train_loss": -27.7025203704834, "global_step": 663512, "epoch": 7994} {"train_loss": -28.070083618164062, "global_step": 663513, "epoch": 7994} {"train_loss": -27.88953971862793, "global_step": 663514, "epoch": 7994} {"train_loss": -28.160919189453125, "global_step": 663515, "epoch": 7994} {"train_loss": -28.10855484008789, "global_step": 663516, "epoch": 7994} {"train_loss": -28.645477294921875, "global_step": 663517, "epoch": 7994} {"train_loss": -28.2137451171875, "global_step": 663518, "epoch": 7994} {"train_loss": -27.921146392822266, "global_step": 663519, "epoch": 7994} {"train_loss": -28.129247665405273, "global_step": 663520, "epoch": 7994} {"train_loss": -28.44024658203125, "global_step": 663521, "epoch": 7994} {"train_loss": -28.325571060180664, "global_step": 663522, "epoch": 7994} {"train_loss": -28.66114616394043, "global_step": 663523, "epoch": 7994} {"train_loss": -28.41786003112793, "global_step": 663524, "epoch": 7994} {"train_loss": -28.043685913085938, "global_step": 663525, "epoch": 7994} {"train_loss": -28.232221603393555, "global_step": 663526, "epoch": 7994} {"train_loss": -28.20682716369629, "global_step": 663527, "epoch": 7994} {"train_loss": -28.37784194946289, "global_step": 663528, "epoch": 7994} {"train_loss": -28.130563735961914, "global_step": 663529, "epoch": 7994} {"train_loss": -28.420276641845703, "global_step": 663530, "epoch": 7994} {"train_loss": -28.557641983032227, "global_step": 663531, "epoch": 7994} {"train_loss": -28.637128829956055, "global_step": 663532, "epoch": 7994} {"train_loss": -28.540563583374023, "global_step": 663533, "epoch": 7994} {"train_loss": -28.675939559936523, "global_step": 663534, "epoch": 7994} {"train_loss": -28.6308536529541, "global_step": 663535, "epoch": 7994} {"train_loss": -28.563276290893555, "global_step": 663536, "epoch": 7994} {"train_loss": -28.30816078186035, "global_step": 663537, "epoch": 7994} {"train_loss": -28.432086944580078, "global_step": 663538, "epoch": 7994} {"train_loss": -28.301267623901367, "global_step": 663539, "epoch": 7994} {"train_loss": -28.54965591430664, "global_step": 663540, "epoch": 7994} {"train_loss": -28.395727157592773, "global_step": 663541, "epoch": 7994} {"train_loss": -28.523666381835938, "global_step": 663542, "epoch": 7994} {"train_loss": -28.808202743530273, "global_step": 663543, "epoch": 7994} {"train_loss": -28.436893463134766, "global_step": 663544, "epoch": 7994} {"train_loss": -28.25033950805664, "global_step": 663545, "epoch": 7994} {"train_loss": -28.475915908813477, "global_step": 663546, "epoch": 7994} {"train_loss": -28.698333740234375, "global_step": 663547, "epoch": 7994} {"train_loss": -28.62738037109375, "global_step": 663548, "epoch": 7994} {"train_loss": -28.011249542236328, "global_step": 663549, "epoch": 7994} {"train_loss": -28.368078231811523, "global_step": 663550, "epoch": 7994} {"train_loss": -28.174833297729492, "global_step": 663551, "epoch": 7994} {"train_loss": -27.96149253845215, "global_step": 663552, "epoch": 7994} {"train_loss": -28.798444747924805, "global_step": 663553, "epoch": 7994} {"train_loss": -28.028980255126953, "global_step": 663554, "epoch": 7994} {"train_loss": -28.196104049682617, "global_step": 663555, "epoch": 7994} {"train_loss": -28.2303524017334, "global_step": 663556, "epoch": 7994} {"train_loss": -28.20233154296875, "global_step": 663557, "epoch": 7994} {"train_loss": -28.310108184814453, "global_step": 663558, "epoch": 7994} {"train_loss": -28.342432022094727, "global_step": 663559, "epoch": 7994} {"train_loss": -28.315073013305664, "global_step": 663560, "epoch": 7994} {"train_loss": -28.52735710144043, "global_step": 663561, "epoch": 7994} {"train_loss": -28.322118759155273, "global_step": 663562, "epoch": 7994} {"train_loss": -28.1387939453125, "global_step": 663563, "epoch": 7994} {"train_loss": -28.286514282226562, "global_step": 663564, "epoch": 7994} {"train_loss": -28.228321075439453, "global_step": 663565, "epoch": 7994} {"train_loss": -28.091693878173828, "global_step": 663566, "epoch": 7994} {"train_loss": -28.05116081237793, "global_step": 663567, "epoch": 7994} {"train_loss": -28.471633911132812, "global_step": 663568, "epoch": 7994} {"train_loss": -28.521142959594727, "global_step": 663569, "epoch": 7994} {"train_loss": -28.104711532592773, "global_step": 663570, "epoch": 7994} {"train_loss": -28.172407150268555, "global_step": 663571, "epoch": 7994} {"train_loss": -28.154714584350586, "global_step": 663572, "epoch": 7994} {"train_loss": -28.592376708984375, "global_step": 663573, "epoch": 7994} {"train_loss": -27.996204376220703, "global_step": 663574, "epoch": 7994} {"train_loss": -27.949798583984375, "global_step": 663575, "epoch": 7994} {"train_loss": -28.292470932006836, "global_step": 663576, "epoch": 7994} {"train_loss": -28.616525650024414, "global_step": 663577, "epoch": 7994} {"train_loss": -27.89619255065918, "global_step": 663578, "epoch": 7994} {"train_loss": -28.105634689331055, "global_step": 663579, "epoch": 7994} {"train_loss": -28.136402130126953, "global_step": 663580, "epoch": 7994} {"train_loss": -28.354690551757812, "global_step": 663581, "epoch": 7994} {"train_loss": -28.117441177368164, "global_step": 663582, "epoch": 7994} {"train_loss": -28.54558753967285, "global_step": 663583, "epoch": 7994} {"train_loss": -28.232035487531178, "global_step": 663584, "epoch": 7994, "val_loss": 6684991.0} {"train_loss": -27.63753318786621, "global_step": 663585, "epoch": 7995} {"train_loss": -27.131290435791016, "global_step": 663586, "epoch": 7995} {"train_loss": -27.908432006835938, "global_step": 663587, "epoch": 7995} {"train_loss": -27.28687858581543, "global_step": 663588, "epoch": 7995} {"train_loss": -27.521875381469727, "global_step": 663589, "epoch": 7995} {"train_loss": -27.076059341430664, "global_step": 663590, "epoch": 7995} {"train_loss": -27.62409019470215, "global_step": 663591, "epoch": 7995} {"train_loss": -27.188201904296875, "global_step": 663592, "epoch": 7995} {"train_loss": -27.92242431640625, "global_step": 663593, "epoch": 7995} {"train_loss": -27.372541427612305, "global_step": 663594, "epoch": 7995} {"train_loss": -27.744054794311523, "global_step": 663595, "epoch": 7995} {"train_loss": -28.117496490478516, "global_step": 663596, "epoch": 7995} {"train_loss": -27.971332550048828, "global_step": 663597, "epoch": 7995} {"train_loss": -27.566293716430664, "global_step": 663598, "epoch": 7995} {"train_loss": -27.5295352935791, "global_step": 663599, "epoch": 7995} {"train_loss": -28.256799697875977, "global_step": 663600, "epoch": 7995} {"train_loss": -28.10040283203125, "global_step": 663601, "epoch": 7995} {"train_loss": -27.839136123657227, "global_step": 663602, "epoch": 7995} {"train_loss": -28.079050064086914, "global_step": 663603, "epoch": 7995} {"train_loss": -28.164417266845703, "global_step": 663604, "epoch": 7995} {"train_loss": -27.607324600219727, "global_step": 663605, "epoch": 7995} {"train_loss": -28.20703125, "global_step": 663606, "epoch": 7995} {"train_loss": -27.830753326416016, "global_step": 663607, "epoch": 7995} {"train_loss": -28.0833740234375, "global_step": 663608, "epoch": 7995} {"train_loss": -27.757343292236328, "global_step": 663609, "epoch": 7995} {"train_loss": -28.599807739257812, "global_step": 663610, "epoch": 7995} {"train_loss": -28.053485870361328, "global_step": 663611, "epoch": 7995} {"train_loss": -28.186920166015625, "global_step": 663612, "epoch": 7995} {"train_loss": -28.42902946472168, "global_step": 663613, "epoch": 7995} {"train_loss": -28.115692138671875, "global_step": 663614, "epoch": 7995} {"train_loss": -28.36749267578125, "global_step": 663615, "epoch": 7995} {"train_loss": -28.27120018005371, "global_step": 663616, "epoch": 7995} {"train_loss": -28.62928581237793, "global_step": 663617, "epoch": 7995} {"train_loss": -28.357465744018555, "global_step": 663618, "epoch": 7995} {"train_loss": -28.37041664123535, "global_step": 663619, "epoch": 7995} {"train_loss": -28.704599380493164, "global_step": 663620, "epoch": 7995} {"train_loss": -28.3151912689209, "global_step": 663621, "epoch": 7995} {"train_loss": -28.582080841064453, "global_step": 663622, "epoch": 7995} {"train_loss": -28.888269424438477, "global_step": 663623, "epoch": 7995} {"train_loss": -28.31380271911621, "global_step": 663624, "epoch": 7995} {"train_loss": -28.191083908081055, "global_step": 663625, "epoch": 7995} {"train_loss": -28.68414306640625, "global_step": 663626, "epoch": 7995} {"train_loss": -28.671106338500977, "global_step": 663627, "epoch": 7995} {"train_loss": -28.684736251831055, "global_step": 663628, "epoch": 7995} {"train_loss": -28.200408935546875, "global_step": 663629, "epoch": 7995} {"train_loss": -28.46864128112793, "global_step": 663630, "epoch": 7995} {"train_loss": -28.13284683227539, "global_step": 663631, "epoch": 7995} {"train_loss": -28.64900779724121, "global_step": 663632, "epoch": 7995} {"train_loss": -28.596837997436523, "global_step": 663633, "epoch": 7995} {"train_loss": -28.45061683654785, "global_step": 663634, "epoch": 7995} {"train_loss": -28.609012603759766, "global_step": 663635, "epoch": 7995} {"train_loss": -28.7706298828125, "global_step": 663636, "epoch": 7995} {"train_loss": -28.34852409362793, "global_step": 663637, "epoch": 7995} {"train_loss": -28.559370040893555, "global_step": 663638, "epoch": 7995} {"train_loss": -28.5880126953125, "global_step": 663639, "epoch": 7995} {"train_loss": -28.76841163635254, "global_step": 663640, "epoch": 7995} {"train_loss": -28.360319137573242, "global_step": 663641, "epoch": 7995} {"train_loss": -28.471099853515625, "global_step": 663642, "epoch": 7995} {"train_loss": -28.184839248657227, "global_step": 663643, "epoch": 7995} {"train_loss": -28.460830688476562, "global_step": 663644, "epoch": 7995} {"train_loss": -28.617727279663086, "global_step": 663645, "epoch": 7995} {"train_loss": -29.076313018798828, "global_step": 663646, "epoch": 7995} {"train_loss": -28.307422637939453, "global_step": 663647, "epoch": 7995} {"train_loss": -28.36231803894043, "global_step": 663648, "epoch": 7995} {"train_loss": -28.467437744140625, "global_step": 663649, "epoch": 7995} {"train_loss": -28.41438865661621, "global_step": 663650, "epoch": 7995} {"train_loss": -28.444028854370117, "global_step": 663651, "epoch": 7995} {"train_loss": -28.621679306030273, "global_step": 663652, "epoch": 7995} {"train_loss": -28.681812286376953, "global_step": 663653, "epoch": 7995} {"train_loss": -28.53888511657715, "global_step": 663654, "epoch": 7995} {"train_loss": -28.63553810119629, "global_step": 663655, "epoch": 7995} {"train_loss": -28.614118576049805, "global_step": 663656, "epoch": 7995} {"train_loss": -28.310754776000977, "global_step": 663657, "epoch": 7995} {"train_loss": -28.43464469909668, "global_step": 663658, "epoch": 7995} {"train_loss": -28.306110382080078, "global_step": 663659, "epoch": 7995} {"train_loss": -28.18647575378418, "global_step": 663660, "epoch": 7995} {"train_loss": -27.745798110961914, "global_step": 663661, "epoch": 7995} {"train_loss": -27.082489013671875, "global_step": 663662, "epoch": 7995} {"train_loss": -26.632516860961914, "global_step": 663663, "epoch": 7995} {"train_loss": -27.539358139038086, "global_step": 663664, "epoch": 7995} {"train_loss": -28.275470733642578, "global_step": 663665, "epoch": 7995} {"train_loss": -27.91864013671875, "global_step": 663666, "epoch": 7995} {"train_loss": -28.17790332472468, "global_step": 663667, "epoch": 7995, "val_loss": 6705445.5} {"train_loss": -27.41518211364746, "global_step": 663668, "epoch": 7996} {"train_loss": -26.909032821655273, "global_step": 663669, "epoch": 7996} {"train_loss": -27.450626373291016, "global_step": 663670, "epoch": 7996} {"train_loss": -27.710926055908203, "global_step": 663671, "epoch": 7996} {"train_loss": -27.165449142456055, "global_step": 663672, "epoch": 7996} {"train_loss": -27.736860275268555, "global_step": 663673, "epoch": 7996} {"train_loss": -28.210905075073242, "global_step": 663674, "epoch": 7996} {"train_loss": -27.90327262878418, "global_step": 663675, "epoch": 7996} {"train_loss": -27.957462310791016, "global_step": 663676, "epoch": 7996} {"train_loss": -27.447559356689453, "global_step": 663677, "epoch": 7996} {"train_loss": -27.7409610748291, "global_step": 663678, "epoch": 7996} {"train_loss": -27.793167114257812, "global_step": 663679, "epoch": 7996} {"train_loss": -28.035572052001953, "global_step": 663680, "epoch": 7996} {"train_loss": -28.325592041015625, "global_step": 663681, "epoch": 7996} {"train_loss": -28.071807861328125, "global_step": 663682, "epoch": 7996} {"train_loss": -27.66205406188965, "global_step": 663683, "epoch": 7996} {"train_loss": -27.889379501342773, "global_step": 663684, "epoch": 7996} {"train_loss": -28.03153419494629, "global_step": 663685, "epoch": 7996} {"train_loss": -27.85725212097168, "global_step": 663686, "epoch": 7996} {"train_loss": -27.77581787109375, "global_step": 663687, "epoch": 7996} {"train_loss": -27.86671257019043, "global_step": 663688, "epoch": 7996} {"train_loss": -28.048093795776367, "global_step": 663689, "epoch": 7996} {"train_loss": -28.434499740600586, "global_step": 663690, "epoch": 7996} {"train_loss": -28.038599014282227, "global_step": 663691, "epoch": 7996} {"train_loss": -28.49302101135254, "global_step": 663692, "epoch": 7996} {"train_loss": -28.246023178100586, "global_step": 663693, "epoch": 7996} {"train_loss": -28.031421661376953, "global_step": 663694, "epoch": 7996} {"train_loss": -28.251630783081055, "global_step": 663695, "epoch": 7996} {"train_loss": -28.033979415893555, "global_step": 663696, "epoch": 7996} {"train_loss": -28.1915225982666, "global_step": 663697, "epoch": 7996} {"train_loss": -28.7749080657959, "global_step": 663698, "epoch": 7996} {"train_loss": -28.042221069335938, "global_step": 663699, "epoch": 7996} {"train_loss": -28.348913192749023, "global_step": 663700, "epoch": 7996} {"train_loss": -28.23286247253418, "global_step": 663701, "epoch": 7996} {"train_loss": -28.447250366210938, "global_step": 663702, "epoch": 7996} {"train_loss": -28.369338989257812, "global_step": 663703, "epoch": 7996} {"train_loss": -28.617406845092773, "global_step": 663704, "epoch": 7996} {"train_loss": -28.279922485351562, "global_step": 663705, "epoch": 7996} {"train_loss": -28.745508193969727, "global_step": 663706, "epoch": 7996} {"train_loss": -28.50139808654785, "global_step": 663707, "epoch": 7996} {"train_loss": -28.2601375579834, "global_step": 663708, "epoch": 7996} {"train_loss": -28.523019790649414, "global_step": 663709, "epoch": 7996} {"train_loss": -28.650348663330078, "global_step": 663710, "epoch": 7996} {"train_loss": -28.926420211791992, "global_step": 663711, "epoch": 7996} {"train_loss": -28.290252685546875, "global_step": 663712, "epoch": 7996} {"train_loss": -28.8216495513916, "global_step": 663713, "epoch": 7996} {"train_loss": -28.396392822265625, "global_step": 663714, "epoch": 7996} {"train_loss": -28.689777374267578, "global_step": 663715, "epoch": 7996} {"train_loss": -28.573896408081055, "global_step": 663716, "epoch": 7996} {"train_loss": -28.84063148498535, "global_step": 663717, "epoch": 7996} {"train_loss": -28.561559677124023, "global_step": 663718, "epoch": 7996} {"train_loss": -28.8886775970459, "global_step": 663719, "epoch": 7996} {"train_loss": -28.850351333618164, "global_step": 663720, "epoch": 7996} {"train_loss": -28.6422176361084, "global_step": 663721, "epoch": 7996} {"train_loss": -28.50031852722168, "global_step": 663722, "epoch": 7996} {"train_loss": -28.630451202392578, "global_step": 663723, "epoch": 7996} {"train_loss": -28.4300594329834, "global_step": 663724, "epoch": 7996} {"train_loss": -28.46893882751465, "global_step": 663725, "epoch": 7996} {"train_loss": -28.341373443603516, "global_step": 663726, "epoch": 7996} {"train_loss": -28.4541015625, "global_step": 663727, "epoch": 7996} {"train_loss": -28.28035545349121, "global_step": 663728, "epoch": 7996} {"train_loss": -28.27949333190918, "global_step": 663729, "epoch": 7996} {"train_loss": -28.43695068359375, "global_step": 663730, "epoch": 7996} {"train_loss": -28.522552490234375, "global_step": 663731, "epoch": 7996} {"train_loss": -28.726526260375977, "global_step": 663732, "epoch": 7996} {"train_loss": -28.349084854125977, "global_step": 663733, "epoch": 7996} {"train_loss": -28.6050968170166, "global_step": 663734, "epoch": 7996} {"train_loss": -28.217016220092773, "global_step": 663735, "epoch": 7996} {"train_loss": -28.44245719909668, "global_step": 663736, "epoch": 7996} {"train_loss": -28.386920928955078, "global_step": 663737, "epoch": 7996} {"train_loss": -28.401844024658203, "global_step": 663738, "epoch": 7996} {"train_loss": -28.119504928588867, "global_step": 663739, "epoch": 7996} {"train_loss": -28.50160026550293, "global_step": 663740, "epoch": 7996} {"train_loss": -28.569791793823242, "global_step": 663741, "epoch": 7996} {"train_loss": -28.449499130249023, "global_step": 663742, "epoch": 7996} {"train_loss": -28.2052059173584, "global_step": 663743, "epoch": 7996} {"train_loss": -28.34480094909668, "global_step": 663744, "epoch": 7996} {"train_loss": -28.450483322143555, "global_step": 663745, "epoch": 7996} {"train_loss": -28.60072135925293, "global_step": 663746, "epoch": 7996} {"train_loss": -28.54371452331543, "global_step": 663747, "epoch": 7996} {"train_loss": -28.759185791015625, "global_step": 663748, "epoch": 7996} {"train_loss": -28.30476188659668, "global_step": 663749, "epoch": 7996} {"train_loss": -28.260672029242457, "global_step": 663750, "epoch": 7996, "val_loss": 6576546.0} {"train_loss": -27.065204620361328, "global_step": 663751, "epoch": 7997} {"train_loss": -27.149463653564453, "global_step": 663752, "epoch": 7997} {"train_loss": -27.315841674804688, "global_step": 663753, "epoch": 7997} {"train_loss": -27.8701171875, "global_step": 663754, "epoch": 7997} {"train_loss": -27.963306427001953, "global_step": 663755, "epoch": 7997} {"train_loss": -28.142791748046875, "global_step": 663756, "epoch": 7997} {"train_loss": -27.95680046081543, "global_step": 663757, "epoch": 7997} {"train_loss": -28.22321891784668, "global_step": 663758, "epoch": 7997} {"train_loss": -27.5183162689209, "global_step": 663759, "epoch": 7997} {"train_loss": -28.090051651000977, "global_step": 663760, "epoch": 7997} {"train_loss": -28.115076065063477, "global_step": 663761, "epoch": 7997} {"train_loss": -27.726598739624023, "global_step": 663762, "epoch": 7997} {"train_loss": -28.105039596557617, "global_step": 663763, "epoch": 7997} {"train_loss": -28.197057723999023, "global_step": 663764, "epoch": 7997} {"train_loss": -28.274433135986328, "global_step": 663765, "epoch": 7997} {"train_loss": -28.568227767944336, "global_step": 663766, "epoch": 7997} {"train_loss": -28.149892807006836, "global_step": 663767, "epoch": 7997} {"train_loss": -28.3111572265625, "global_step": 663768, "epoch": 7997} {"train_loss": -28.177865982055664, "global_step": 663769, "epoch": 7997} {"train_loss": -28.312299728393555, "global_step": 663770, "epoch": 7997} {"train_loss": -28.072235107421875, "global_step": 663771, "epoch": 7997} {"train_loss": -27.950489044189453, "global_step": 663772, "epoch": 7997} {"train_loss": -27.896076202392578, "global_step": 663773, "epoch": 7997} {"train_loss": -28.354053497314453, "global_step": 663774, "epoch": 7997} {"train_loss": -28.568206787109375, "global_step": 663775, "epoch": 7997} {"train_loss": -28.381444931030273, "global_step": 663776, "epoch": 7997} {"train_loss": -28.315786361694336, "global_step": 663777, "epoch": 7997} {"train_loss": -28.394901275634766, "global_step": 663778, "epoch": 7997} {"train_loss": -28.61699867248535, "global_step": 663779, "epoch": 7997} {"train_loss": -28.4663028717041, "global_step": 663780, "epoch": 7997} {"train_loss": -28.609851837158203, "global_step": 663781, "epoch": 7997} {"train_loss": -28.276248931884766, "global_step": 663782, "epoch": 7997} {"train_loss": -28.265119552612305, "global_step": 663783, "epoch": 7997} {"train_loss": -28.16229820251465, "global_step": 663784, "epoch": 7997} {"train_loss": -28.22994041442871, "global_step": 663785, "epoch": 7997} {"train_loss": -28.357837677001953, "global_step": 663786, "epoch": 7997} {"train_loss": -28.442991256713867, "global_step": 663787, "epoch": 7997} {"train_loss": -28.459033966064453, "global_step": 663788, "epoch": 7997} {"train_loss": -28.344837188720703, "global_step": 663789, "epoch": 7997} {"train_loss": -28.601917266845703, "global_step": 663790, "epoch": 7997} {"train_loss": -28.330371856689453, "global_step": 663791, "epoch": 7997} {"train_loss": -28.393545150756836, "global_step": 663792, "epoch": 7997} {"train_loss": -28.163619995117188, "global_step": 663793, "epoch": 7997} {"train_loss": -28.480182647705078, "global_step": 663794, "epoch": 7997} {"train_loss": -28.585193634033203, "global_step": 663795, "epoch": 7997} {"train_loss": -28.561975479125977, "global_step": 663796, "epoch": 7997} {"train_loss": -28.413599014282227, "global_step": 663797, "epoch": 7997} {"train_loss": -28.12557029724121, "global_step": 663798, "epoch": 7997} {"train_loss": -28.4189453125, "global_step": 663799, "epoch": 7997} {"train_loss": -28.746978759765625, "global_step": 663800, "epoch": 7997} {"train_loss": -28.785083770751953, "global_step": 663801, "epoch": 7997} {"train_loss": -28.785924911499023, "global_step": 663802, "epoch": 7997} {"train_loss": -28.915164947509766, "global_step": 663803, "epoch": 7997} {"train_loss": -28.702238082885742, "global_step": 663804, "epoch": 7997} {"train_loss": -28.363910675048828, "global_step": 663805, "epoch": 7997} {"train_loss": -28.45722770690918, "global_step": 663806, "epoch": 7997} {"train_loss": -28.29802894592285, "global_step": 663807, "epoch": 7997} {"train_loss": -28.56821060180664, "global_step": 663808, "epoch": 7997} {"train_loss": -28.577131271362305, "global_step": 663809, "epoch": 7997} {"train_loss": -28.760900497436523, "global_step": 663810, "epoch": 7997} {"train_loss": -28.21917152404785, "global_step": 663811, "epoch": 7997} {"train_loss": -28.596891403198242, "global_step": 663812, "epoch": 7997} {"train_loss": -28.50103759765625, "global_step": 663813, "epoch": 7997} {"train_loss": -28.647418975830078, "global_step": 663814, "epoch": 7997} {"train_loss": -28.3015079498291, "global_step": 663815, "epoch": 7997} {"train_loss": -28.1666316986084, "global_step": 663816, "epoch": 7997} {"train_loss": -28.275548934936523, "global_step": 663817, "epoch": 7997} {"train_loss": -28.15226173400879, "global_step": 663818, "epoch": 7997} {"train_loss": -28.30027198791504, "global_step": 663819, "epoch": 7997} {"train_loss": -28.56916618347168, "global_step": 663820, "epoch": 7997} {"train_loss": -27.870527267456055, "global_step": 663821, "epoch": 7997} {"train_loss": -27.826425552368164, "global_step": 663822, "epoch": 7997} {"train_loss": -27.927703857421875, "global_step": 663823, "epoch": 7997} {"train_loss": -28.46588706970215, "global_step": 663824, "epoch": 7997} {"train_loss": -28.158933639526367, "global_step": 663825, "epoch": 7997} {"train_loss": -28.085712432861328, "global_step": 663826, "epoch": 7997} {"train_loss": -28.712072372436523, "global_step": 663827, "epoch": 7997} {"train_loss": -28.0964298248291, "global_step": 663828, "epoch": 7997} {"train_loss": -28.389127731323242, "global_step": 663829, "epoch": 7997} {"train_loss": -28.376874923706055, "global_step": 663830, "epoch": 7997} {"train_loss": -28.45627212524414, "global_step": 663831, "epoch": 7997} {"train_loss": -28.577850341796875, "global_step": 663832, "epoch": 7997} {"train_loss": -28.276897108698467, "global_step": 663833, "epoch": 7997, "val_loss": 6577543.0} {"train_loss": -27.865568161010742, "global_step": 663834, "epoch": 7998} {"train_loss": -26.7747802734375, "global_step": 663835, "epoch": 7998} {"train_loss": -27.29412841796875, "global_step": 663836, "epoch": 7998} {"train_loss": -27.936603546142578, "global_step": 663837, "epoch": 7998} {"train_loss": -27.709613800048828, "global_step": 663838, "epoch": 7998} {"train_loss": -26.93465232849121, "global_step": 663839, "epoch": 7998} {"train_loss": -27.53217124938965, "global_step": 663840, "epoch": 7998} {"train_loss": -27.7744197845459, "global_step": 663841, "epoch": 7998} {"train_loss": -27.305740356445312, "global_step": 663842, "epoch": 7998} {"train_loss": -27.687711715698242, "global_step": 663843, "epoch": 7998} {"train_loss": -26.848737716674805, "global_step": 663844, "epoch": 7998} {"train_loss": -27.370121002197266, "global_step": 663845, "epoch": 7998} {"train_loss": -27.778644561767578, "global_step": 663846, "epoch": 7998} {"train_loss": -27.866962432861328, "global_step": 663847, "epoch": 7998} {"train_loss": -28.108686447143555, "global_step": 663848, "epoch": 7998} {"train_loss": -27.87518310546875, "global_step": 663849, "epoch": 7998} {"train_loss": -27.806964874267578, "global_step": 663850, "epoch": 7998} {"train_loss": -27.963977813720703, "global_step": 663851, "epoch": 7998} {"train_loss": -27.696582794189453, "global_step": 663852, "epoch": 7998} {"train_loss": -28.096220016479492, "global_step": 663853, "epoch": 7998} {"train_loss": -27.9079532623291, "global_step": 663854, "epoch": 7998} {"train_loss": -28.138559341430664, "global_step": 663855, "epoch": 7998} {"train_loss": -27.728368759155273, "global_step": 663856, "epoch": 7998} {"train_loss": -28.234983444213867, "global_step": 663857, "epoch": 7998} {"train_loss": -28.23575782775879, "global_step": 663858, "epoch": 7998} {"train_loss": -28.194183349609375, "global_step": 663859, "epoch": 7998} {"train_loss": -27.935245513916016, "global_step": 663860, "epoch": 7998} {"train_loss": -28.36371421813965, "global_step": 663861, "epoch": 7998} {"train_loss": -28.219512939453125, "global_step": 663862, "epoch": 7998} {"train_loss": -28.39127540588379, "global_step": 663863, "epoch": 7998} {"train_loss": -27.887699127197266, "global_step": 663864, "epoch": 7998} {"train_loss": -28.1409969329834, "global_step": 663865, "epoch": 7998} {"train_loss": -28.69646644592285, "global_step": 663866, "epoch": 7998} {"train_loss": -28.25042152404785, "global_step": 663867, "epoch": 7998} {"train_loss": -28.200336456298828, "global_step": 663868, "epoch": 7998} {"train_loss": -28.1737060546875, "global_step": 663869, "epoch": 7998} {"train_loss": -28.450727462768555, "global_step": 663870, "epoch": 7998} {"train_loss": -28.68707275390625, "global_step": 663871, "epoch": 7998} {"train_loss": -28.447797775268555, "global_step": 663872, "epoch": 7998} {"train_loss": -28.699033737182617, "global_step": 663873, "epoch": 7998} {"train_loss": -28.681055068969727, "global_step": 663874, "epoch": 7998} {"train_loss": -28.599985122680664, "global_step": 663875, "epoch": 7998} {"train_loss": -28.436084747314453, "global_step": 663876, "epoch": 7998} {"train_loss": -28.2419376373291, "global_step": 663877, "epoch": 7998} {"train_loss": -28.749103546142578, "global_step": 663878, "epoch": 7998} {"train_loss": -28.85066032409668, "global_step": 663879, "epoch": 7998} {"train_loss": -28.358213424682617, "global_step": 663880, "epoch": 7998} {"train_loss": -28.622785568237305, "global_step": 663881, "epoch": 7998} {"train_loss": -28.756866455078125, "global_step": 663882, "epoch": 7998} {"train_loss": -28.87114906311035, "global_step": 663883, "epoch": 7998} {"train_loss": -28.464313507080078, "global_step": 663884, "epoch": 7998} {"train_loss": -28.49273109436035, "global_step": 663885, "epoch": 7998} {"train_loss": -28.7297306060791, "global_step": 663886, "epoch": 7998} {"train_loss": -28.680471420288086, "global_step": 663887, "epoch": 7998} {"train_loss": -28.522260665893555, "global_step": 663888, "epoch": 7998} {"train_loss": -28.7061710357666, "global_step": 663889, "epoch": 7998} {"train_loss": -28.61049461364746, "global_step": 663890, "epoch": 7998} {"train_loss": -28.534765243530273, "global_step": 663891, "epoch": 7998} {"train_loss": -28.357406616210938, "global_step": 663892, "epoch": 7998} {"train_loss": -28.557077407836914, "global_step": 663893, "epoch": 7998} {"train_loss": -28.46392250061035, "global_step": 663894, "epoch": 7998} {"train_loss": -28.671100616455078, "global_step": 663895, "epoch": 7998} {"train_loss": -28.227914810180664, "global_step": 663896, "epoch": 7998} {"train_loss": -28.378747940063477, "global_step": 663897, "epoch": 7998} {"train_loss": -28.50752830505371, "global_step": 663898, "epoch": 7998} {"train_loss": -28.4658145904541, "global_step": 663899, "epoch": 7998} {"train_loss": -28.639432907104492, "global_step": 663900, "epoch": 7998} {"train_loss": -28.434967041015625, "global_step": 663901, "epoch": 7998} {"train_loss": -28.287372589111328, "global_step": 663902, "epoch": 7998} {"train_loss": -28.352375030517578, "global_step": 663903, "epoch": 7998} {"train_loss": -28.49713134765625, "global_step": 663904, "epoch": 7998} {"train_loss": -28.641504287719727, "global_step": 663905, "epoch": 7998} {"train_loss": -28.6739501953125, "global_step": 663906, "epoch": 7998} {"train_loss": -28.60419273376465, "global_step": 663907, "epoch": 7998} {"train_loss": -28.950347900390625, "global_step": 663908, "epoch": 7998} {"train_loss": -28.487592697143555, "global_step": 663909, "epoch": 7998} {"train_loss": -28.325702667236328, "global_step": 663910, "epoch": 7998} {"train_loss": -28.574951171875, "global_step": 663911, "epoch": 7998} {"train_loss": -28.416589736938477, "global_step": 663912, "epoch": 7998} {"train_loss": -28.292020797729492, "global_step": 663913, "epoch": 7998} {"train_loss": -28.62772560119629, "global_step": 663914, "epoch": 7998} {"train_loss": -28.46002197265625, "global_step": 663915, "epoch": 7998} {"train_loss": -28.25942354317171, "global_step": 663916, "epoch": 7998, "val_loss": 6696301.0} {"train_loss": -27.610864639282227, "global_step": 663917, "epoch": 7999} {"train_loss": -27.9056396484375, "global_step": 663918, "epoch": 7999} {"train_loss": -27.632375717163086, "global_step": 663919, "epoch": 7999} {"train_loss": -28.180648803710938, "global_step": 663920, "epoch": 7999} {"train_loss": -27.418060302734375, "global_step": 663921, "epoch": 7999} {"train_loss": -27.320581436157227, "global_step": 663922, "epoch": 7999} {"train_loss": -27.183273315429688, "global_step": 663923, "epoch": 7999} {"train_loss": -27.354267120361328, "global_step": 663924, "epoch": 7999} {"train_loss": -27.05599021911621, "global_step": 663925, "epoch": 7999} {"train_loss": -27.554931640625, "global_step": 663926, "epoch": 7999} {"train_loss": -27.68338966369629, "global_step": 663927, "epoch": 7999} {"train_loss": -27.466886520385742, "global_step": 663928, "epoch": 7999} {"train_loss": -27.450265884399414, "global_step": 663929, "epoch": 7999} {"train_loss": -27.497955322265625, "global_step": 663930, "epoch": 7999} {"train_loss": -27.491682052612305, "global_step": 663931, "epoch": 7999} {"train_loss": -28.163557052612305, "global_step": 663932, "epoch": 7999} {"train_loss": -27.492528915405273, "global_step": 663933, "epoch": 7999} {"train_loss": -27.364273071289062, "global_step": 663934, "epoch": 7999} {"train_loss": -28.171955108642578, "global_step": 663935, "epoch": 7999} {"train_loss": -27.576162338256836, "global_step": 663936, "epoch": 7999} {"train_loss": -28.24151039123535, "global_step": 663937, "epoch": 7999} {"train_loss": -27.93841552734375, "global_step": 663938, "epoch": 7999} {"train_loss": -27.9229736328125, "global_step": 663939, "epoch": 7999} {"train_loss": -27.89177894592285, "global_step": 663940, "epoch": 7999} {"train_loss": -28.163440704345703, "global_step": 663941, "epoch": 7999} {"train_loss": -27.97308921813965, "global_step": 663942, "epoch": 7999} {"train_loss": -28.395893096923828, "global_step": 663943, "epoch": 7999} {"train_loss": -27.63178825378418, "global_step": 663944, "epoch": 7999} {"train_loss": -28.035581588745117, "global_step": 663945, "epoch": 7999} {"train_loss": -27.778867721557617, "global_step": 663946, "epoch": 7999} {"train_loss": -28.275278091430664, "global_step": 663947, "epoch": 7999} {"train_loss": -28.2508602142334, "global_step": 663948, "epoch": 7999} {"train_loss": -28.38214683532715, "global_step": 663949, "epoch": 7999} {"train_loss": -28.331146240234375, "global_step": 663950, "epoch": 7999} {"train_loss": -28.425033569335938, "global_step": 663951, "epoch": 7999} {"train_loss": -28.734638214111328, "global_step": 663952, "epoch": 7999} {"train_loss": -28.235410690307617, "global_step": 663953, "epoch": 7999} {"train_loss": -28.196012496948242, "global_step": 663954, "epoch": 7999} {"train_loss": -28.369709014892578, "global_step": 663955, "epoch": 7999} {"train_loss": -28.000070571899414, "global_step": 663956, "epoch": 7999} {"train_loss": -28.5830078125, "global_step": 663957, "epoch": 7999} {"train_loss": -28.532215118408203, "global_step": 663958, "epoch": 7999} {"train_loss": -28.272815704345703, "global_step": 663959, "epoch": 7999} {"train_loss": -28.307580947875977, "global_step": 663960, "epoch": 7999} {"train_loss": -28.502607345581055, "global_step": 663961, "epoch": 7999} {"train_loss": -28.079381942749023, "global_step": 663962, "epoch": 7999} {"train_loss": -28.347944259643555, "global_step": 663963, "epoch": 7999} {"train_loss": -28.697317123413086, "global_step": 663964, "epoch": 7999} {"train_loss": -28.66058349609375, "global_step": 663965, "epoch": 7999} {"train_loss": -28.486743927001953, "global_step": 663966, "epoch": 7999} {"train_loss": -28.45023536682129, "global_step": 663967, "epoch": 7999} {"train_loss": -28.678531646728516, "global_step": 663968, "epoch": 7999} {"train_loss": -28.70232582092285, "global_step": 663969, "epoch": 7999} {"train_loss": -28.5825252532959, "global_step": 663970, "epoch": 7999} {"train_loss": -29.05048942565918, "global_step": 663971, "epoch": 7999} {"train_loss": -28.76502799987793, "global_step": 663972, "epoch": 7999} {"train_loss": -28.046899795532227, "global_step": 663973, "epoch": 7999} {"train_loss": -28.666616439819336, "global_step": 663974, "epoch": 7999} {"train_loss": -28.856664657592773, "global_step": 663975, "epoch": 7999} {"train_loss": -28.644086837768555, "global_step": 663976, "epoch": 7999} {"train_loss": -28.810041427612305, "global_step": 663977, "epoch": 7999} {"train_loss": -28.426294326782227, "global_step": 663978, "epoch": 7999} {"train_loss": -28.454633712768555, "global_step": 663979, "epoch": 7999} {"train_loss": -28.721582412719727, "global_step": 663980, "epoch": 7999} {"train_loss": -28.270893096923828, "global_step": 663981, "epoch": 7999} {"train_loss": -28.66314125061035, "global_step": 663982, "epoch": 7999} {"train_loss": -28.3290958404541, "global_step": 663983, "epoch": 7999} {"train_loss": -28.2944393157959, "global_step": 663984, "epoch": 7999} {"train_loss": -28.754892349243164, "global_step": 663985, "epoch": 7999} {"train_loss": -28.6146297454834, "global_step": 663986, "epoch": 7999} {"train_loss": -28.098159790039062, "global_step": 663987, "epoch": 7999} {"train_loss": -28.722442626953125, "global_step": 663988, "epoch": 7999} {"train_loss": -28.4312686920166, "global_step": 663989, "epoch": 7999} {"train_loss": -28.804609298706055, "global_step": 663990, "epoch": 7999} {"train_loss": -28.69718360900879, "global_step": 663991, "epoch": 7999} {"train_loss": -28.57594871520996, "global_step": 663992, "epoch": 7999} {"train_loss": -28.32448387145996, "global_step": 663993, "epoch": 7999} {"train_loss": -28.422657012939453, "global_step": 663994, "epoch": 7999} {"train_loss": -28.474929809570312, "global_step": 663995, "epoch": 7999} {"train_loss": -28.42122459411621, "global_step": 663996, "epoch": 7999} {"train_loss": -28.11767578125, "global_step": 663997, "epoch": 7999} {"train_loss": -28.136655807495117, "global_step": 663998, "epoch": 7999} {"train_loss": -28.200897055936146, "global_step": 663999, "epoch": 7999, "val_loss": 6734366.5}